{"train_loss": 1.5087718963623047, "global_step": 0, "epoch": 0} {"train_loss": 1.4584381580352783, "global_step": 1, "epoch": 0} {"train_loss": 1.4783220291137695, "global_step": 2, "epoch": 0} {"train_loss": 1.4505091905593872, "global_step": 3, "epoch": 0} {"train_loss": 1.3869550228118896, "global_step": 4, "epoch": 0} {"train_loss": 1.406092882156372, "global_step": 5, "epoch": 0} {"train_loss": 1.4631831645965576, "global_step": 6, "epoch": 0} {"train_loss": 1.413604736328125, "global_step": 7, "epoch": 0} {"train_loss": 1.3581793308258057, "global_step": 8, "epoch": 0} {"train_loss": 1.4041811227798462, "global_step": 9, "epoch": 0} {"train_loss": 1.288745403289795, "global_step": 10, "epoch": 0} {"train_loss": 1.3315072059631348, "global_step": 11, "epoch": 0} {"train_loss": 1.2144817113876343, "global_step": 12, "epoch": 0} {"train_loss": 1.1534671783447266, "global_step": 13, "epoch": 0} {"train_loss": 1.0852725505828857, "global_step": 14, "epoch": 0} {"train_loss": 1.1183756589889526, "global_step": 15, "epoch": 0} {"train_loss": 1.0588183403015137, "global_step": 16, "epoch": 0} {"train_loss": 1.019811987876892, "global_step": 17, "epoch": 0} {"train_loss": 0.9561283588409424, "global_step": 18, "epoch": 0} {"train_loss": 0.8956657648086548, "global_step": 19, "epoch": 0} {"train_loss": 0.8760327100753784, "global_step": 20, "epoch": 0} {"train_loss": 0.9600043892860413, "global_step": 21, "epoch": 0} {"train_loss": 0.7029733657836914, "global_step": 22, "epoch": 0} {"train_loss": 0.9969518184661865, "global_step": 23, "epoch": 0} {"train_loss": 0.7588522434234619, "global_step": 24, "epoch": 0} {"train_loss": 0.817291259765625, "global_step": 25, "epoch": 0} {"train_loss": 0.6722921133041382, "global_step": 26, "epoch": 0} {"train_loss": 0.6817041635513306, "global_step": 27, "epoch": 0} {"train_loss": 0.6301188468933105, "global_step": 28, "epoch": 0} {"train_loss": 0.5396246314048767, "global_step": 29, "epoch": 0} {"train_loss": 0.6999680995941162, "global_step": 30, "epoch": 0} {"train_loss": 0.6341136693954468, "global_step": 31, "epoch": 0} {"train_loss": 0.5358619689941406, "global_step": 32, "epoch": 0} {"train_loss": 0.387822687625885, "global_step": 33, "epoch": 0} {"train_loss": 0.4448048174381256, "global_step": 34, "epoch": 0} {"train_loss": 0.39631956815719604, "global_step": 35, "epoch": 0} {"train_loss": 0.26184067130088806, "global_step": 36, "epoch": 0} {"train_loss": 0.31087827682495117, "global_step": 37, "epoch": 0} {"train_loss": 0.41964221000671387, "global_step": 38, "epoch": 0} {"train_loss": 0.32992303371429443, "global_step": 39, "epoch": 0} {"train_loss": 0.2072918862104416, "global_step": 40, "epoch": 0} {"train_loss": 0.3637232184410095, "global_step": 41, "epoch": 0} {"train_loss": 0.1354846954345703, "global_step": 42, "epoch": 0} {"train_loss": 0.047817062586545944, "global_step": 43, "epoch": 0} {"train_loss": 0.12100528180599213, "global_step": 44, "epoch": 0} {"train_loss": -0.006403852254152298, "global_step": 45, "epoch": 0} {"train_loss": 0.1032082736492157, "global_step": 46, "epoch": 0} {"train_loss": 0.23585966229438782, "global_step": 47, "epoch": 0} {"train_loss": 0.20327983796596527, "global_step": 48, "epoch": 0} {"train_loss": 0.08528599143028259, "global_step": 49, "epoch": 0} {"train_loss": 0.2018631547689438, "global_step": 50, "epoch": 0} {"train_loss": -0.06802370399236679, "global_step": 51, "epoch": 0} {"train_loss": 0.04879593104124069, "global_step": 52, "epoch": 0} {"train_loss": -0.11218555271625519, "global_step": 53, "epoch": 0} {"train_loss": -0.07999765872955322, "global_step": 54, "epoch": 0} {"train_loss": -0.1807730495929718, "global_step": 55, "epoch": 0} {"train_loss": -0.14366403222084045, "global_step": 56, "epoch": 0} {"train_loss": -0.09867854416370392, "global_step": 57, "epoch": 0} {"train_loss": 0.07588060945272446, "global_step": 58, "epoch": 0} {"train_loss": -0.17300957441329956, "global_step": 59, "epoch": 0} {"train_loss": 0.01140158623456955, "global_step": 60, "epoch": 0} {"train_loss": -0.17359279096126556, "global_step": 61, "epoch": 0} {"train_loss": -0.004780083894729614, "global_step": 62, "epoch": 0} {"train_loss": -0.28423428535461426, "global_step": 63, "epoch": 0} {"train_loss": -0.20598968863487244, "global_step": 64, "epoch": 0} {"train_loss": -0.06629925221204758, "global_step": 65, "epoch": 0} {"train_loss": -0.18043455481529236, "global_step": 66, "epoch": 0} {"train_loss": -0.30981719493865967, "global_step": 67, "epoch": 0} {"train_loss": -0.3481934070587158, "global_step": 68, "epoch": 0} {"train_loss": -0.31916704773902893, "global_step": 69, "epoch": 0} {"train_loss": -0.2521877586841583, "global_step": 70, "epoch": 0} {"train_loss": -0.33896055817604065, "global_step": 71, "epoch": 0} {"train_loss": -0.5653420686721802, "global_step": 72, "epoch": 0} {"train_loss": -0.4393523931503296, "global_step": 73, "epoch": 0} {"train_loss": -0.3115609884262085, "global_step": 74, "epoch": 0} {"train_loss": -0.35493898391723633, "global_step": 75, "epoch": 0} {"train_loss": -0.4762752652168274, "global_step": 76, "epoch": 0} {"train_loss": -0.48015356063842773, "global_step": 77, "epoch": 0} {"train_loss": -0.39580410718917847, "global_step": 78, "epoch": 0} {"train_loss": -0.4199918508529663, "global_step": 79, "epoch": 0} {"train_loss": -0.5526270866394043, "global_step": 80, "epoch": 0} {"train_loss": -0.591464638710022, "global_step": 81, "epoch": 0} {"train_loss": -0.51606285572052, "global_step": 82, "epoch": 0} {"train_loss": -0.36256158351898193, "global_step": 83, "epoch": 0} {"train_loss": -0.39092594385147095, "global_step": 84, "epoch": 0} {"train_loss": -0.6266883611679077, "global_step": 85, "epoch": 0} {"train_loss": -0.48104554414749146, "global_step": 86, "epoch": 0} {"train_loss": -0.5656797885894775, "global_step": 87, "epoch": 0} {"train_loss": -0.6143358945846558, "global_step": 88, "epoch": 0} {"train_loss": -0.5248814821243286, "global_step": 89, "epoch": 0} {"train_loss": -0.6010569334030151, "global_step": 90, "epoch": 0} {"train_loss": -0.6949605941772461, "global_step": 91, "epoch": 0} {"train_loss": -0.4470926523208618, "global_step": 92, "epoch": 0} {"train_loss": -0.6324076056480408, "global_step": 93, "epoch": 0} {"train_loss": -0.7955647706985474, "global_step": 94, "epoch": 0} {"train_loss": -0.6675386428833008, "global_step": 95, "epoch": 0} {"train_loss": -0.5612695217132568, "global_step": 96, "epoch": 0} {"train_loss": -0.6988252401351929, "global_step": 97, "epoch": 0} {"train_loss": -0.5883594751358032, "global_step": 98, "epoch": 0} {"train_loss": -0.5599271059036255, "global_step": 99, "epoch": 0} {"train_loss": -0.8687881231307983, "global_step": 100, "epoch": 0} {"train_loss": -0.8209240436553955, "global_step": 101, "epoch": 0} {"train_loss": -0.7897267937660217, "global_step": 102, "epoch": 0} {"train_loss": -0.726331353187561, "global_step": 103, "epoch": 0} {"train_loss": -0.6948161125183105, "global_step": 104, "epoch": 0} {"train_loss": -0.7220853567123413, "global_step": 105, "epoch": 0} {"train_loss": -0.7996761798858643, "global_step": 106, "epoch": 0} {"train_loss": -0.5834689140319824, "global_step": 107, "epoch": 0} {"train_loss": -0.751915693283081, "global_step": 108, "epoch": 0} {"train_loss": -0.7228044271469116, "global_step": 109, "epoch": 0} {"train_loss": -0.833527147769928, "global_step": 110, "epoch": 0} {"train_loss": -0.7962908744812012, "global_step": 111, "epoch": 0} {"train_loss": -0.8994631767272949, "global_step": 112, "epoch": 0} {"train_loss": -0.8258957862854004, "global_step": 113, "epoch": 0} {"train_loss": -0.8768336772918701, "global_step": 114, "epoch": 0} {"train_loss": -0.8860517740249634, "global_step": 115, "epoch": 0} {"train_loss": -0.7363309860229492, "global_step": 116, "epoch": 0} {"train_loss": -0.8442221283912659, "global_step": 117, "epoch": 0} {"train_loss": -1.0594865083694458, "global_step": 118, "epoch": 0} {"train_loss": -0.8243080377578735, "global_step": 119, "epoch": 0} {"train_loss": -0.9572869539260864, "global_step": 120, "epoch": 0} {"train_loss": -0.9892432689666748, "global_step": 121, "epoch": 0} {"train_loss": -1.050072193145752, "global_step": 122, "epoch": 0} {"train_loss": -0.9509185552597046, "global_step": 123, "epoch": 0} {"train_loss": -0.9121131300926208, "global_step": 124, "epoch": 0} {"train_loss": -1.226387619972229, "global_step": 125, "epoch": 0} {"train_loss": -1.00144362449646, "global_step": 126, "epoch": 0} {"train_loss": -1.2508180141448975, "global_step": 127, "epoch": 0} {"train_loss": -1.1033155918121338, "global_step": 128, "epoch": 0} {"train_loss": -1.3794710636138916, "global_step": 129, "epoch": 0} {"train_loss": -1.2452914714813232, "global_step": 130, "epoch": 0} {"train_loss": -1.0750125646591187, "global_step": 131, "epoch": 0} {"train_loss": -1.1262290477752686, "global_step": 132, "epoch": 0} {"train_loss": -1.2072091102600098, "global_step": 133, "epoch": 0} {"train_loss": -1.128203272819519, "global_step": 134, "epoch": 0} {"train_loss": -1.1805670261383057, "global_step": 135, "epoch": 0} {"train_loss": -1.1813242435455322, "global_step": 136, "epoch": 0} {"train_loss": -0.8670884370803833, "global_step": 137, "epoch": 0} {"train_loss": -1.1490604877471924, "global_step": 138, "epoch": 0} {"train_loss": -1.2029123306274414, "global_step": 139, "epoch": 0} {"train_loss": -1.324493646621704, "global_step": 140, "epoch": 0} {"train_loss": -1.256986379623413, "global_step": 141, "epoch": 0} {"train_loss": -1.256711483001709, "global_step": 142, "epoch": 0} {"train_loss": -1.3856455087661743, "global_step": 143, "epoch": 0} {"train_loss": -1.0993661880493164, "global_step": 144, "epoch": 0} {"train_loss": -1.4225125312805176, "global_step": 145, "epoch": 0} {"train_loss": -1.069793939590454, "global_step": 146, "epoch": 0} {"train_loss": -1.3527542352676392, "global_step": 147, "epoch": 0} {"train_loss": -1.4029438495635986, "global_step": 148, "epoch": 0} {"train_loss": -1.331639051437378, "global_step": 149, "epoch": 0} {"train_loss": -1.4642915725708008, "global_step": 150, "epoch": 0} {"train_loss": -1.2504582405090332, "global_step": 151, "epoch": 0} {"train_loss": -1.1785904169082642, "global_step": 152, "epoch": 0} {"train_loss": -1.2735402584075928, "global_step": 153, "epoch": 0} {"train_loss": -1.0775964260101318, "global_step": 154, "epoch": 0} {"train_loss": -1.2439266443252563, "global_step": 155, "epoch": 0} {"train_loss": -1.48312509059906, "global_step": 156, "epoch": 0} {"train_loss": -1.4836031198501587, "global_step": 157, "epoch": 0} {"train_loss": -1.2549155950546265, "global_step": 158, "epoch": 0} {"train_loss": -1.1323167085647583, "global_step": 159, "epoch": 0} {"train_loss": -1.4264878034591675, "global_step": 160, "epoch": 0} {"train_loss": -1.1216394901275635, "global_step": 161, "epoch": 0} {"train_loss": -1.322833776473999, "global_step": 162, "epoch": 0} {"train_loss": -1.4028620719909668, "global_step": 163, "epoch": 0} {"train_loss": -1.2620995044708252, "global_step": 164, "epoch": 0} {"train_loss": -1.3881202936172485, "global_step": 165, "epoch": 0} {"train_loss": -1.5292819738388062, "global_step": 166, "epoch": 0} {"train_loss": -0.3198353834450245, "global_step": 167, "epoch": 0, "train/sim_max_reward_0": 0.2779087111461216, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.07618318709334786, "train/sim_max_reward_3": 0.44378783972848646, "train/sim_max_reward_4": 0.009503307570729362, "train/sim_max_reward_5": 0.51998533625086, "test/sim_max_reward_4400000": 0.08842786286054531, "test/sim_max_reward_4400001": 0.02549233263417755, "test/sim_max_reward_4400002": 0.04562221830354945, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.4808675168593215, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.30074379696400344, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.6071408112689617, "test/sim_max_reward_4400009": 0.031802151166831855, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.09297838756913566, "test/sim_max_reward_4400012": 0.14110722128947978, "test/sim_max_reward_4400013": 0.05569209882391426, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.8660475341365231, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.0005738315151986002, "test/sim_max_reward_4400024": 0.09996677568478458, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.48420145433045814, "test/sim_max_reward_4400028": 0.23280134335762884, "test/sim_max_reward_4400029": 0.02304704985098891, "test/sim_max_reward_4400030": 0.12382565423950331, "test/sim_max_reward_4400031": 0.00014962808613646573, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.11402047723020733, "test/sim_max_reward_4400034": 0.1454819325219592, "test/sim_max_reward_4400035": 0.33186262730927857, "test/sim_max_reward_4400036": 0.7688023719075899, "test/sim_max_reward_4400037": 0.0, "test/sim_max_reward_4400038": 0.0, "test/sim_max_reward_4400039": 0.5122579448356623, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.020099807521350335, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.0, "test/sim_max_reward_4400044": 0.013163128360347526, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 0.06556291296305793, "test/sim_max_reward_4400047": 0.1677796773541897, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.2213406438352241, "test/mean_score": 0.12850751419076384, "val_loss": 1833446.375, "train_action_mse_error": 1485.6846923828125} {"train_loss": -1.3598692417144775, "global_step": 168, "epoch": 1} {"train_loss": -1.4496160745620728, "global_step": 169, "epoch": 1} {"train_loss": -1.3597972393035889, "global_step": 170, "epoch": 1} {"train_loss": -1.6327488422393799, "global_step": 171, "epoch": 1} {"train_loss": -1.7488259077072144, "global_step": 172, "epoch": 1} {"train_loss": -1.4609339237213135, "global_step": 173, "epoch": 1} {"train_loss": -1.4462120532989502, "global_step": 174, "epoch": 1} {"train_loss": -1.3871572017669678, "global_step": 175, "epoch": 1} {"train_loss": -1.4353067874908447, "global_step": 176, "epoch": 1} {"train_loss": -1.5144940614700317, "global_step": 177, "epoch": 1} {"train_loss": -1.608506679534912, "global_step": 178, "epoch": 1} {"train_loss": -1.6530671119689941, "global_step": 179, "epoch": 1} {"train_loss": -1.4405710697174072, "global_step": 180, "epoch": 1} {"train_loss": -1.6300896406173706, "global_step": 181, "epoch": 1} {"train_loss": -1.7026863098144531, "global_step": 182, "epoch": 1} {"train_loss": -1.6308269500732422, "global_step": 183, "epoch": 1} {"train_loss": -1.429593801498413, "global_step": 184, "epoch": 1} {"train_loss": -1.6034858226776123, "global_step": 185, "epoch": 1} {"train_loss": -1.4558175802230835, "global_step": 186, "epoch": 1} {"train_loss": -1.6746017932891846, "global_step": 187, "epoch": 1} {"train_loss": -1.8102772235870361, "global_step": 188, "epoch": 1} {"train_loss": -1.6927173137664795, "global_step": 189, "epoch": 1} {"train_loss": -1.8286772966384888, "global_step": 190, "epoch": 1} {"train_loss": -1.748167872428894, "global_step": 191, "epoch": 1} {"train_loss": -1.5609480142593384, "global_step": 192, "epoch": 1} {"train_loss": -1.5072981119155884, "global_step": 193, "epoch": 1} {"train_loss": -1.589348554611206, "global_step": 194, "epoch": 1} {"train_loss": -1.4498474597930908, "global_step": 195, "epoch": 1} {"train_loss": -1.5574045181274414, "global_step": 196, "epoch": 1} {"train_loss": -1.4188933372497559, "global_step": 197, "epoch": 1} {"train_loss": -1.7106208801269531, "global_step": 198, "epoch": 1} {"train_loss": -1.6535495519638062, "global_step": 199, "epoch": 1} {"train_loss": -1.5345757007598877, "global_step": 200, "epoch": 1} {"train_loss": -1.4043222665786743, "global_step": 201, "epoch": 1} {"train_loss": -1.4552586078643799, "global_step": 202, "epoch": 1} {"train_loss": -1.8873157501220703, "global_step": 203, "epoch": 1} {"train_loss": -1.7487945556640625, "global_step": 204, "epoch": 1} {"train_loss": -2.013289213180542, "global_step": 205, "epoch": 1} {"train_loss": -1.619728684425354, "global_step": 206, "epoch": 1} {"train_loss": -1.6848623752593994, "global_step": 207, "epoch": 1} {"train_loss": -1.5255602598190308, "global_step": 208, "epoch": 1} {"train_loss": -1.7421411275863647, "global_step": 209, "epoch": 1} {"train_loss": -1.7284663915634155, "global_step": 210, "epoch": 1} {"train_loss": -1.505733847618103, "global_step": 211, "epoch": 1} {"train_loss": -1.8556926250457764, "global_step": 212, "epoch": 1} {"train_loss": -1.8713186979293823, "global_step": 213, "epoch": 1} {"train_loss": -1.747480034828186, "global_step": 214, "epoch": 1} {"train_loss": -1.930232048034668, "global_step": 215, "epoch": 1} {"train_loss": -1.7645152807235718, "global_step": 216, "epoch": 1} {"train_loss": -1.9419960975646973, "global_step": 217, "epoch": 1} {"train_loss": -1.7982711791992188, "global_step": 218, "epoch": 1} {"train_loss": -1.9899412393569946, "global_step": 219, "epoch": 1} {"train_loss": -1.943830132484436, "global_step": 220, "epoch": 1} {"train_loss": -1.4508169889450073, "global_step": 221, "epoch": 1} {"train_loss": -1.774566411972046, "global_step": 222, "epoch": 1} {"train_loss": -1.6008213758468628, "global_step": 223, "epoch": 1} {"train_loss": -2.0493383407592773, "global_step": 224, "epoch": 1} {"train_loss": -1.831601619720459, "global_step": 225, "epoch": 1} {"train_loss": -1.8670445680618286, "global_step": 226, "epoch": 1} {"train_loss": -1.824142336845398, "global_step": 227, "epoch": 1} {"train_loss": -1.9116251468658447, "global_step": 228, "epoch": 1} {"train_loss": -1.6276719570159912, "global_step": 229, "epoch": 1} {"train_loss": -1.8946930170059204, "global_step": 230, "epoch": 1} {"train_loss": -1.7703466415405273, "global_step": 231, "epoch": 1} {"train_loss": -2.0053887367248535, "global_step": 232, "epoch": 1} {"train_loss": -1.724611520767212, "global_step": 233, "epoch": 1} {"train_loss": -1.5977721214294434, "global_step": 234, "epoch": 1} {"train_loss": -2.0065600872039795, "global_step": 235, "epoch": 1} {"train_loss": -1.7455713748931885, "global_step": 236, "epoch": 1} {"train_loss": -2.0899596214294434, "global_step": 237, "epoch": 1} {"train_loss": -2.043205738067627, "global_step": 238, "epoch": 1} {"train_loss": -1.9572803974151611, "global_step": 239, "epoch": 1} {"train_loss": -1.9207603931427002, "global_step": 240, "epoch": 1} {"train_loss": -2.078627586364746, "global_step": 241, "epoch": 1} {"train_loss": -2.026599645614624, "global_step": 242, "epoch": 1} {"train_loss": -2.1832337379455566, "global_step": 243, "epoch": 1} {"train_loss": -2.005675792694092, "global_step": 244, "epoch": 1} {"train_loss": -1.7490994930267334, "global_step": 245, "epoch": 1} {"train_loss": -1.811765432357788, "global_step": 246, "epoch": 1} {"train_loss": -1.994755744934082, "global_step": 247, "epoch": 1} {"train_loss": -2.056732177734375, "global_step": 248, "epoch": 1} {"train_loss": -2.0269923210144043, "global_step": 249, "epoch": 1} {"train_loss": -2.0325818061828613, "global_step": 250, "epoch": 1} {"train_loss": -2.172569751739502, "global_step": 251, "epoch": 1} {"train_loss": -1.6312507390975952, "global_step": 252, "epoch": 1} {"train_loss": -1.9306902885437012, "global_step": 253, "epoch": 1} {"train_loss": -2.018646717071533, "global_step": 254, "epoch": 1} {"train_loss": -1.8511478900909424, "global_step": 255, "epoch": 1} {"train_loss": -1.8746905326843262, "global_step": 256, "epoch": 1} {"train_loss": -2.0706119537353516, "global_step": 257, "epoch": 1} {"train_loss": -1.9489622116088867, "global_step": 258, "epoch": 1} {"train_loss": -2.1029131412506104, "global_step": 259, "epoch": 1} {"train_loss": -2.2886743545532227, "global_step": 260, "epoch": 1} {"train_loss": -2.1630191802978516, "global_step": 261, "epoch": 1} {"train_loss": -1.9424974918365479, "global_step": 262, "epoch": 1} {"train_loss": -1.808718204498291, "global_step": 263, "epoch": 1} {"train_loss": -2.1535441875457764, "global_step": 264, "epoch": 1} {"train_loss": -2.0700626373291016, "global_step": 265, "epoch": 1} {"train_loss": -1.9404470920562744, "global_step": 266, "epoch": 1} {"train_loss": -1.9082322120666504, "global_step": 267, "epoch": 1} {"train_loss": -1.9312211275100708, "global_step": 268, "epoch": 1} {"train_loss": -1.976647138595581, "global_step": 269, "epoch": 1} {"train_loss": -2.1786656379699707, "global_step": 270, "epoch": 1} {"train_loss": -2.0452823638916016, "global_step": 271, "epoch": 1} {"train_loss": -1.8709261417388916, "global_step": 272, "epoch": 1} {"train_loss": -2.001445770263672, "global_step": 273, "epoch": 1} {"train_loss": -1.8939439058303833, "global_step": 274, "epoch": 1} {"train_loss": -1.9498987197875977, "global_step": 275, "epoch": 1} {"train_loss": -2.172739028930664, "global_step": 276, "epoch": 1} {"train_loss": -2.087322235107422, "global_step": 277, "epoch": 1} {"train_loss": -2.075577974319458, "global_step": 278, "epoch": 1} {"train_loss": -2.0568315982818604, "global_step": 279, "epoch": 1} {"train_loss": -2.2769453525543213, "global_step": 280, "epoch": 1} {"train_loss": -1.8469315767288208, "global_step": 281, "epoch": 1} {"train_loss": -2.2025890350341797, "global_step": 282, "epoch": 1} {"train_loss": -2.396730422973633, "global_step": 283, "epoch": 1} {"train_loss": -2.291419267654419, "global_step": 284, "epoch": 1} {"train_loss": -2.4622669219970703, "global_step": 285, "epoch": 1} {"train_loss": -2.414064884185791, "global_step": 286, "epoch": 1} {"train_loss": -2.334080934524536, "global_step": 287, "epoch": 1} {"train_loss": -2.2530598640441895, "global_step": 288, "epoch": 1} {"train_loss": -2.1377599239349365, "global_step": 289, "epoch": 1} {"train_loss": -2.056934118270874, "global_step": 290, "epoch": 1} {"train_loss": -2.137889862060547, "global_step": 291, "epoch": 1} {"train_loss": -2.196019411087036, "global_step": 292, "epoch": 1} {"train_loss": -2.1262145042419434, "global_step": 293, "epoch": 1} {"train_loss": -2.1860275268554688, "global_step": 294, "epoch": 1} {"train_loss": -2.3955442905426025, "global_step": 295, "epoch": 1} {"train_loss": -2.307629108428955, "global_step": 296, "epoch": 1} {"train_loss": -2.314507007598877, "global_step": 297, "epoch": 1} {"train_loss": -2.2638840675354004, "global_step": 298, "epoch": 1} {"train_loss": -2.350703716278076, "global_step": 299, "epoch": 1} {"train_loss": -2.238921642303467, "global_step": 300, "epoch": 1} {"train_loss": -2.451801300048828, "global_step": 301, "epoch": 1} {"train_loss": -2.4046263694763184, "global_step": 302, "epoch": 1} {"train_loss": -2.5348494052886963, "global_step": 303, "epoch": 1} {"train_loss": -2.2022461891174316, "global_step": 304, "epoch": 1} {"train_loss": -1.927852749824524, "global_step": 305, "epoch": 1} {"train_loss": -2.1137681007385254, "global_step": 306, "epoch": 1} {"train_loss": -1.98025643825531, "global_step": 307, "epoch": 1} {"train_loss": -2.3765392303466797, "global_step": 308, "epoch": 1} {"train_loss": -2.306666851043701, "global_step": 309, "epoch": 1} {"train_loss": -2.3313357830047607, "global_step": 310, "epoch": 1} {"train_loss": -2.340686321258545, "global_step": 311, "epoch": 1} {"train_loss": -2.0926530361175537, "global_step": 312, "epoch": 1} {"train_loss": -2.488772392272949, "global_step": 313, "epoch": 1} {"train_loss": -2.189993381500244, "global_step": 314, "epoch": 1} {"train_loss": -2.264644145965576, "global_step": 315, "epoch": 1} {"train_loss": -2.3200302124023438, "global_step": 316, "epoch": 1} {"train_loss": -2.4379706382751465, "global_step": 317, "epoch": 1} {"train_loss": -1.8839027881622314, "global_step": 318, "epoch": 1} {"train_loss": -2.1577095985412598, "global_step": 319, "epoch": 1} {"train_loss": -2.21346378326416, "global_step": 320, "epoch": 1} {"train_loss": -2.449146032333374, "global_step": 321, "epoch": 1} {"train_loss": -2.4452388286590576, "global_step": 322, "epoch": 1} {"train_loss": -2.3796863555908203, "global_step": 323, "epoch": 1} {"train_loss": -2.553769588470459, "global_step": 324, "epoch": 1} {"train_loss": -2.392214775085449, "global_step": 325, "epoch": 1} {"train_loss": -2.3936493396759033, "global_step": 326, "epoch": 1} {"train_loss": -2.447667121887207, "global_step": 327, "epoch": 1} {"train_loss": -2.3123581409454346, "global_step": 328, "epoch": 1} {"train_loss": -2.4045159816741943, "global_step": 329, "epoch": 1} {"train_loss": -2.248748540878296, "global_step": 330, "epoch": 1} {"train_loss": -2.5025525093078613, "global_step": 331, "epoch": 1} {"train_loss": -2.25740909576416, "global_step": 332, "epoch": 1} {"train_loss": -2.462477684020996, "global_step": 333, "epoch": 1} {"train_loss": -2.2617347240448, "global_step": 334, "epoch": 1} {"train_loss": -1.9632131542478288, "global_step": 335, "epoch": 1, "val_loss": 720643.3125} {"train_loss": -2.5167880058288574, "global_step": 336, "epoch": 2} {"train_loss": -2.3803770542144775, "global_step": 337, "epoch": 2} {"train_loss": -2.552548408508301, "global_step": 338, "epoch": 2} {"train_loss": -2.1836328506469727, "global_step": 339, "epoch": 2} {"train_loss": -2.365513324737549, "global_step": 340, "epoch": 2} {"train_loss": -2.2233352661132812, "global_step": 341, "epoch": 2} {"train_loss": -1.802168846130371, "global_step": 342, "epoch": 2} {"train_loss": -2.2751636505126953, "global_step": 343, "epoch": 2} {"train_loss": -1.8257806301116943, "global_step": 344, "epoch": 2} {"train_loss": -2.15763521194458, "global_step": 345, "epoch": 2} {"train_loss": -2.3028674125671387, "global_step": 346, "epoch": 2} {"train_loss": -2.050912857055664, "global_step": 347, "epoch": 2} {"train_loss": -2.2652199268341064, "global_step": 348, "epoch": 2} {"train_loss": -2.4407870769500732, "global_step": 349, "epoch": 2} {"train_loss": -2.244523048400879, "global_step": 350, "epoch": 2} {"train_loss": -2.4323136806488037, "global_step": 351, "epoch": 2} {"train_loss": -2.3012194633483887, "global_step": 352, "epoch": 2} {"train_loss": -2.3684310913085938, "global_step": 353, "epoch": 2} {"train_loss": -2.324594497680664, "global_step": 354, "epoch": 2} {"train_loss": -2.482394218444824, "global_step": 355, "epoch": 2} {"train_loss": -2.21529483795166, "global_step": 356, "epoch": 2} {"train_loss": -2.340485095977783, "global_step": 357, "epoch": 2} {"train_loss": -2.0137887001037598, "global_step": 358, "epoch": 2} {"train_loss": -2.452545166015625, "global_step": 359, "epoch": 2} {"train_loss": -2.4052035808563232, "global_step": 360, "epoch": 2} {"train_loss": -2.4431474208831787, "global_step": 361, "epoch": 2} {"train_loss": -2.3780996799468994, "global_step": 362, "epoch": 2} {"train_loss": -2.298833131790161, "global_step": 363, "epoch": 2} {"train_loss": -2.1426689624786377, "global_step": 364, "epoch": 2} {"train_loss": -2.434645414352417, "global_step": 365, "epoch": 2} {"train_loss": -2.4183173179626465, "global_step": 366, "epoch": 2} {"train_loss": -2.6186490058898926, "global_step": 367, "epoch": 2} {"train_loss": -2.6786556243896484, "global_step": 368, "epoch": 2} {"train_loss": -2.659684419631958, "global_step": 369, "epoch": 2} {"train_loss": -2.523932933807373, "global_step": 370, "epoch": 2} {"train_loss": -2.962800979614258, "global_step": 371, "epoch": 2} {"train_loss": -2.285421371459961, "global_step": 372, "epoch": 2} {"train_loss": -2.485328435897827, "global_step": 373, "epoch": 2} {"train_loss": -1.8237860202789307, "global_step": 374, "epoch": 2} {"train_loss": -2.6503331661224365, "global_step": 375, "epoch": 2} {"train_loss": -2.172529458999634, "global_step": 376, "epoch": 2} {"train_loss": -2.116623640060425, "global_step": 377, "epoch": 2} {"train_loss": -2.3652210235595703, "global_step": 378, "epoch": 2} {"train_loss": -2.307748556137085, "global_step": 379, "epoch": 2} {"train_loss": -2.4942080974578857, "global_step": 380, "epoch": 2} {"train_loss": -2.2161002159118652, "global_step": 381, "epoch": 2} {"train_loss": -2.543195962905884, "global_step": 382, "epoch": 2} {"train_loss": -2.369582176208496, "global_step": 383, "epoch": 2} {"train_loss": -2.3772006034851074, "global_step": 384, "epoch": 2} {"train_loss": -2.411166191101074, "global_step": 385, "epoch": 2} {"train_loss": -2.463895320892334, "global_step": 386, "epoch": 2} {"train_loss": -2.456434726715088, "global_step": 387, "epoch": 2} {"train_loss": -2.4493610858917236, "global_step": 388, "epoch": 2} {"train_loss": -2.3457460403442383, "global_step": 389, "epoch": 2} {"train_loss": -2.5282251834869385, "global_step": 390, "epoch": 2} {"train_loss": -2.6334338188171387, "global_step": 391, "epoch": 2} {"train_loss": -2.656390905380249, "global_step": 392, "epoch": 2} {"train_loss": -2.515263557434082, "global_step": 393, "epoch": 2} {"train_loss": -2.422088861465454, "global_step": 394, "epoch": 2} {"train_loss": -2.541868209838867, "global_step": 395, "epoch": 2} {"train_loss": -2.6236331462860107, "global_step": 396, "epoch": 2} {"train_loss": -2.708270311355591, "global_step": 397, "epoch": 2} {"train_loss": -2.398536205291748, "global_step": 398, "epoch": 2} {"train_loss": -2.5796778202056885, "global_step": 399, "epoch": 2} {"train_loss": -2.2566733360290527, "global_step": 400, "epoch": 2} {"train_loss": -2.6794633865356445, "global_step": 401, "epoch": 2} {"train_loss": -2.274237632751465, "global_step": 402, "epoch": 2} {"train_loss": -2.5546112060546875, "global_step": 403, "epoch": 2} {"train_loss": -2.640723705291748, "global_step": 404, "epoch": 2} {"train_loss": -2.307218551635742, "global_step": 405, "epoch": 2} {"train_loss": -2.5707788467407227, "global_step": 406, "epoch": 2} {"train_loss": -2.534672260284424, "global_step": 407, "epoch": 2} {"train_loss": -2.699474334716797, "global_step": 408, "epoch": 2} {"train_loss": -2.5502920150756836, "global_step": 409, "epoch": 2} {"train_loss": -2.38810396194458, "global_step": 410, "epoch": 2} {"train_loss": -2.910095691680908, "global_step": 411, "epoch": 2} {"train_loss": -2.4610745906829834, "global_step": 412, "epoch": 2} {"train_loss": -2.5833778381347656, "global_step": 413, "epoch": 2} {"train_loss": -2.6041293144226074, "global_step": 414, "epoch": 2} {"train_loss": -2.601724863052368, "global_step": 415, "epoch": 2} {"train_loss": -2.331054449081421, "global_step": 416, "epoch": 2} {"train_loss": -2.9082865715026855, "global_step": 417, "epoch": 2} {"train_loss": -2.8828506469726562, "global_step": 418, "epoch": 2} {"train_loss": -2.7328262329101562, "global_step": 419, "epoch": 2} {"train_loss": -2.646165609359741, "global_step": 420, "epoch": 2} {"train_loss": -2.7264111042022705, "global_step": 421, "epoch": 2} {"train_loss": -2.4122371673583984, "global_step": 422, "epoch": 2} {"train_loss": -2.6840333938598633, "global_step": 423, "epoch": 2} {"train_loss": -2.369309902191162, "global_step": 424, "epoch": 2} {"train_loss": -2.785775661468506, "global_step": 425, "epoch": 2} {"train_loss": -2.9253010749816895, "global_step": 426, "epoch": 2} {"train_loss": -2.5050771236419678, "global_step": 427, "epoch": 2} {"train_loss": -2.485377311706543, "global_step": 428, "epoch": 2} {"train_loss": -2.4268686771392822, "global_step": 429, "epoch": 2} {"train_loss": -2.6916093826293945, "global_step": 430, "epoch": 2} {"train_loss": -2.1947388648986816, "global_step": 431, "epoch": 2} {"train_loss": -2.6189658641815186, "global_step": 432, "epoch": 2} {"train_loss": -2.1835036277770996, "global_step": 433, "epoch": 2} {"train_loss": -2.3655495643615723, "global_step": 434, "epoch": 2} {"train_loss": -2.611783742904663, "global_step": 435, "epoch": 2} {"train_loss": -2.49006986618042, "global_step": 436, "epoch": 2} {"train_loss": -2.6729111671447754, "global_step": 437, "epoch": 2} {"train_loss": -2.5609307289123535, "global_step": 438, "epoch": 2} {"train_loss": -2.6792263984680176, "global_step": 439, "epoch": 2} {"train_loss": -2.8776493072509766, "global_step": 440, "epoch": 2} {"train_loss": -2.6182701587677, "global_step": 441, "epoch": 2} {"train_loss": -2.9018120765686035, "global_step": 442, "epoch": 2} {"train_loss": -2.75728178024292, "global_step": 443, "epoch": 2} {"train_loss": -2.5735771656036377, "global_step": 444, "epoch": 2} {"train_loss": -2.720214366912842, "global_step": 445, "epoch": 2} {"train_loss": -2.811032772064209, "global_step": 446, "epoch": 2} {"train_loss": -2.864525556564331, "global_step": 447, "epoch": 2} {"train_loss": -2.8317224979400635, "global_step": 448, "epoch": 2} {"train_loss": -2.642911195755005, "global_step": 449, "epoch": 2} {"train_loss": -2.6829559803009033, "global_step": 450, "epoch": 2} {"train_loss": -2.7831802368164062, "global_step": 451, "epoch": 2} {"train_loss": -2.6250200271606445, "global_step": 452, "epoch": 2} {"train_loss": -2.701200008392334, "global_step": 453, "epoch": 2} {"train_loss": -2.8117918968200684, "global_step": 454, "epoch": 2} {"train_loss": -2.8525447845458984, "global_step": 455, "epoch": 2} {"train_loss": -3.0156261920928955, "global_step": 456, "epoch": 2} {"train_loss": -2.739560842514038, "global_step": 457, "epoch": 2} {"train_loss": -2.8226475715637207, "global_step": 458, "epoch": 2} {"train_loss": -2.8866629600524902, "global_step": 459, "epoch": 2} {"train_loss": -2.71044921875, "global_step": 460, "epoch": 2} {"train_loss": -2.949429988861084, "global_step": 461, "epoch": 2} {"train_loss": -2.848684310913086, "global_step": 462, "epoch": 2} {"train_loss": -2.8074004650115967, "global_step": 463, "epoch": 2} {"train_loss": -2.6196346282958984, "global_step": 464, "epoch": 2} {"train_loss": -2.881899356842041, "global_step": 465, "epoch": 2} {"train_loss": -2.953059673309326, "global_step": 466, "epoch": 2} {"train_loss": -2.917884349822998, "global_step": 467, "epoch": 2} {"train_loss": -2.863802433013916, "global_step": 468, "epoch": 2} {"train_loss": -2.8440299034118652, "global_step": 469, "epoch": 2} {"train_loss": -3.088217258453369, "global_step": 470, "epoch": 2} {"train_loss": -2.88631010055542, "global_step": 471, "epoch": 2} {"train_loss": -2.8346385955810547, "global_step": 472, "epoch": 2} {"train_loss": -3.1702418327331543, "global_step": 473, "epoch": 2} {"train_loss": -2.9571125507354736, "global_step": 474, "epoch": 2} {"train_loss": -2.986994504928589, "global_step": 475, "epoch": 2} {"train_loss": -2.916395425796509, "global_step": 476, "epoch": 2} {"train_loss": -2.891444683074951, "global_step": 477, "epoch": 2} {"train_loss": -2.664125919342041, "global_step": 478, "epoch": 2} {"train_loss": -2.081348419189453, "global_step": 479, "epoch": 2} {"train_loss": -2.2278499603271484, "global_step": 480, "epoch": 2} {"train_loss": -2.6185030937194824, "global_step": 481, "epoch": 2} {"train_loss": -2.613722324371338, "global_step": 482, "epoch": 2} {"train_loss": -2.7751903533935547, "global_step": 483, "epoch": 2} {"train_loss": -2.7640552520751953, "global_step": 484, "epoch": 2} {"train_loss": -2.8730080127716064, "global_step": 485, "epoch": 2} {"train_loss": -2.7282938957214355, "global_step": 486, "epoch": 2} {"train_loss": -2.805649757385254, "global_step": 487, "epoch": 2} {"train_loss": -2.546442985534668, "global_step": 488, "epoch": 2} {"train_loss": -2.8854103088378906, "global_step": 489, "epoch": 2} {"train_loss": -2.7650794982910156, "global_step": 490, "epoch": 2} {"train_loss": -2.8514513969421387, "global_step": 491, "epoch": 2} {"train_loss": -2.8441455364227295, "global_step": 492, "epoch": 2} {"train_loss": -2.967785358428955, "global_step": 493, "epoch": 2} {"train_loss": -2.918189525604248, "global_step": 494, "epoch": 2} {"train_loss": -2.738302707672119, "global_step": 495, "epoch": 2} {"train_loss": -3.1660354137420654, "global_step": 496, "epoch": 2} {"train_loss": -2.879246234893799, "global_step": 497, "epoch": 2} {"train_loss": -2.7829554080963135, "global_step": 498, "epoch": 2} {"train_loss": -2.9617626667022705, "global_step": 499, "epoch": 2} {"train_loss": -2.787513494491577, "global_step": 500, "epoch": 2} {"train_loss": -2.7785778045654297, "global_step": 501, "epoch": 2} {"train_loss": -2.828463315963745, "global_step": 502, "epoch": 2} {"train_loss": -2.5854526460170746, "global_step": 503, "epoch": 2, "val_loss": 420009.3125} {"train_loss": -2.8168060779571533, "global_step": 504, "epoch": 3} {"train_loss": -3.017777919769287, "global_step": 505, "epoch": 3} {"train_loss": -2.6285486221313477, "global_step": 506, "epoch": 3} {"train_loss": -3.159069061279297, "global_step": 507, "epoch": 3} {"train_loss": -3.10164213180542, "global_step": 508, "epoch": 3} {"train_loss": -2.830021858215332, "global_step": 509, "epoch": 3} {"train_loss": -2.988292694091797, "global_step": 510, "epoch": 3} {"train_loss": -2.8770532608032227, "global_step": 511, "epoch": 3} {"train_loss": -2.92657470703125, "global_step": 512, "epoch": 3} {"train_loss": -2.9141788482666016, "global_step": 513, "epoch": 3} {"train_loss": -3.1768617630004883, "global_step": 514, "epoch": 3} {"train_loss": -2.7336511611938477, "global_step": 515, "epoch": 3} {"train_loss": -3.041780948638916, "global_step": 516, "epoch": 3} {"train_loss": -2.5423178672790527, "global_step": 517, "epoch": 3} {"train_loss": -2.8881635665893555, "global_step": 518, "epoch": 3} {"train_loss": -3.1332130432128906, "global_step": 519, "epoch": 3} {"train_loss": -2.5530004501342773, "global_step": 520, "epoch": 3} {"train_loss": -3.0719895362854004, "global_step": 521, "epoch": 3} {"train_loss": -3.1323704719543457, "global_step": 522, "epoch": 3} {"train_loss": -3.2461295127868652, "global_step": 523, "epoch": 3} {"train_loss": -2.7555274963378906, "global_step": 524, "epoch": 3} {"train_loss": -2.8489203453063965, "global_step": 525, "epoch": 3} {"train_loss": -2.959353446960449, "global_step": 526, "epoch": 3} {"train_loss": -3.064724922180176, "global_step": 527, "epoch": 3} {"train_loss": -2.8779428005218506, "global_step": 528, "epoch": 3} {"train_loss": -2.9306185245513916, "global_step": 529, "epoch": 3} {"train_loss": -3.0218682289123535, "global_step": 530, "epoch": 3} {"train_loss": -3.0421953201293945, "global_step": 531, "epoch": 3} {"train_loss": -3.0403366088867188, "global_step": 532, "epoch": 3} {"train_loss": -2.951324939727783, "global_step": 533, "epoch": 3} {"train_loss": -2.9679465293884277, "global_step": 534, "epoch": 3} {"train_loss": -3.0592217445373535, "global_step": 535, "epoch": 3} {"train_loss": -3.0929722785949707, "global_step": 536, "epoch": 3} {"train_loss": -3.0335030555725098, "global_step": 537, "epoch": 3} {"train_loss": -3.044309139251709, "global_step": 538, "epoch": 3} {"train_loss": -3.1304383277893066, "global_step": 539, "epoch": 3} {"train_loss": -2.980663299560547, "global_step": 540, "epoch": 3} {"train_loss": -2.884859561920166, "global_step": 541, "epoch": 3} {"train_loss": -2.816767692565918, "global_step": 542, "epoch": 3} {"train_loss": -2.812729835510254, "global_step": 543, "epoch": 3} {"train_loss": -3.0171079635620117, "global_step": 544, "epoch": 3} {"train_loss": -2.8743958473205566, "global_step": 545, "epoch": 3} {"train_loss": -3.217015504837036, "global_step": 546, "epoch": 3} {"train_loss": -3.1228132247924805, "global_step": 547, "epoch": 3} {"train_loss": -2.811440944671631, "global_step": 548, "epoch": 3} {"train_loss": -2.984931468963623, "global_step": 549, "epoch": 3} {"train_loss": -3.06852388381958, "global_step": 550, "epoch": 3} {"train_loss": -2.7922492027282715, "global_step": 551, "epoch": 3} {"train_loss": -2.82167911529541, "global_step": 552, "epoch": 3} {"train_loss": -2.7020740509033203, "global_step": 553, "epoch": 3} {"train_loss": -2.7068443298339844, "global_step": 554, "epoch": 3} {"train_loss": -2.9575610160827637, "global_step": 555, "epoch": 3} {"train_loss": -2.793935775756836, "global_step": 556, "epoch": 3} {"train_loss": -2.926511287689209, "global_step": 557, "epoch": 3} {"train_loss": -2.8686180114746094, "global_step": 558, "epoch": 3} {"train_loss": -2.811612844467163, "global_step": 559, "epoch": 3} {"train_loss": -2.974187135696411, "global_step": 560, "epoch": 3} {"train_loss": -3.1092638969421387, "global_step": 561, "epoch": 3} {"train_loss": -2.9847588539123535, "global_step": 562, "epoch": 3} {"train_loss": -3.0772905349731445, "global_step": 563, "epoch": 3} {"train_loss": -3.050135612487793, "global_step": 564, "epoch": 3} {"train_loss": -2.9397597312927246, "global_step": 565, "epoch": 3} {"train_loss": -2.994197368621826, "global_step": 566, "epoch": 3} {"train_loss": -2.754859447479248, "global_step": 567, "epoch": 3} {"train_loss": -2.9251997470855713, "global_step": 568, "epoch": 3} {"train_loss": -2.791853904724121, "global_step": 569, "epoch": 3} {"train_loss": -3.1545891761779785, "global_step": 570, "epoch": 3} {"train_loss": -2.594761848449707, "global_step": 571, "epoch": 3} {"train_loss": -2.7426090240478516, "global_step": 572, "epoch": 3} {"train_loss": -2.7591545581817627, "global_step": 573, "epoch": 3} {"train_loss": -2.825033664703369, "global_step": 574, "epoch": 3} {"train_loss": -2.904027223587036, "global_step": 575, "epoch": 3} {"train_loss": -3.1614580154418945, "global_step": 576, "epoch": 3} {"train_loss": -2.858485698699951, "global_step": 577, "epoch": 3} {"train_loss": -2.9419546127319336, "global_step": 578, "epoch": 3} {"train_loss": -3.094590902328491, "global_step": 579, "epoch": 3} {"train_loss": -3.141177177429199, "global_step": 580, "epoch": 3} {"train_loss": -2.9159607887268066, "global_step": 581, "epoch": 3} {"train_loss": -2.9885828495025635, "global_step": 582, "epoch": 3} {"train_loss": -2.9516594409942627, "global_step": 583, "epoch": 3} {"train_loss": -3.144420623779297, "global_step": 584, "epoch": 3} {"train_loss": -3.089160919189453, "global_step": 585, "epoch": 3} {"train_loss": -3.0759243965148926, "global_step": 586, "epoch": 3} {"train_loss": -3.118767023086548, "global_step": 587, "epoch": 3} {"train_loss": -2.8556571006774902, "global_step": 588, "epoch": 3} {"train_loss": -3.1054205894470215, "global_step": 589, "epoch": 3} {"train_loss": -2.9769952297210693, "global_step": 590, "epoch": 3} {"train_loss": -2.8608336448669434, "global_step": 591, "epoch": 3} {"train_loss": -3.238659143447876, "global_step": 592, "epoch": 3} {"train_loss": -3.1077685356140137, "global_step": 593, "epoch": 3} {"train_loss": -3.2485663890838623, "global_step": 594, "epoch": 3} {"train_loss": -3.0973246097564697, "global_step": 595, "epoch": 3} {"train_loss": -3.0771408081054688, "global_step": 596, "epoch": 3} {"train_loss": -3.001382350921631, "global_step": 597, "epoch": 3} {"train_loss": -3.1184983253479004, "global_step": 598, "epoch": 3} {"train_loss": -3.210174322128296, "global_step": 599, "epoch": 3} {"train_loss": -3.252264976501465, "global_step": 600, "epoch": 3} {"train_loss": -2.94983172416687, "global_step": 601, "epoch": 3} {"train_loss": -3.134800910949707, "global_step": 602, "epoch": 3} {"train_loss": -3.108320713043213, "global_step": 603, "epoch": 3} {"train_loss": -3.017399549484253, "global_step": 604, "epoch": 3} {"train_loss": -3.065524101257324, "global_step": 605, "epoch": 3} {"train_loss": -3.2234697341918945, "global_step": 606, "epoch": 3} {"train_loss": -3.3878865242004395, "global_step": 607, "epoch": 3} {"train_loss": -2.5657901763916016, "global_step": 608, "epoch": 3} {"train_loss": -3.0589680671691895, "global_step": 609, "epoch": 3} {"train_loss": -3.251521110534668, "global_step": 610, "epoch": 3} {"train_loss": -2.933281898498535, "global_step": 611, "epoch": 3} {"train_loss": -3.31480073928833, "global_step": 612, "epoch": 3} {"train_loss": -2.871419906616211, "global_step": 613, "epoch": 3} {"train_loss": -3.004304885864258, "global_step": 614, "epoch": 3} {"train_loss": -3.084134340286255, "global_step": 615, "epoch": 3} {"train_loss": -3.046917676925659, "global_step": 616, "epoch": 3} {"train_loss": -3.012498378753662, "global_step": 617, "epoch": 3} {"train_loss": -2.6267762184143066, "global_step": 618, "epoch": 3} {"train_loss": -2.8123412132263184, "global_step": 619, "epoch": 3} {"train_loss": -3.0097105503082275, "global_step": 620, "epoch": 3} {"train_loss": -2.170727014541626, "global_step": 621, "epoch": 3} {"train_loss": -2.620262622833252, "global_step": 622, "epoch": 3} {"train_loss": -2.616929054260254, "global_step": 623, "epoch": 3} {"train_loss": -2.724966049194336, "global_step": 624, "epoch": 3} {"train_loss": -2.7783095836639404, "global_step": 625, "epoch": 3} {"train_loss": -2.7933616638183594, "global_step": 626, "epoch": 3} {"train_loss": -2.8168020248413086, "global_step": 627, "epoch": 3} {"train_loss": -2.9375436305999756, "global_step": 628, "epoch": 3} {"train_loss": -3.0509190559387207, "global_step": 629, "epoch": 3} {"train_loss": -2.9171371459960938, "global_step": 630, "epoch": 3} {"train_loss": -2.9921908378601074, "global_step": 631, "epoch": 3} {"train_loss": -2.9737071990966797, "global_step": 632, "epoch": 3} {"train_loss": -3.0021214485168457, "global_step": 633, "epoch": 3} {"train_loss": -2.871922492980957, "global_step": 634, "epoch": 3} {"train_loss": -2.821986198425293, "global_step": 635, "epoch": 3} {"train_loss": -2.94807505607605, "global_step": 636, "epoch": 3} {"train_loss": -2.998145580291748, "global_step": 637, "epoch": 3} {"train_loss": -2.9977431297302246, "global_step": 638, "epoch": 3} {"train_loss": -3.1033716201782227, "global_step": 639, "epoch": 3} {"train_loss": -3.083367347717285, "global_step": 640, "epoch": 3} {"train_loss": -3.1294169425964355, "global_step": 641, "epoch": 3} {"train_loss": -3.111475944519043, "global_step": 642, "epoch": 3} {"train_loss": -3.3685145378112793, "global_step": 643, "epoch": 3} {"train_loss": -3.1679422855377197, "global_step": 644, "epoch": 3} {"train_loss": -2.7082695960998535, "global_step": 645, "epoch": 3} {"train_loss": -3.185468912124634, "global_step": 646, "epoch": 3} {"train_loss": -2.9254977703094482, "global_step": 647, "epoch": 3} {"train_loss": -3.1218957901000977, "global_step": 648, "epoch": 3} {"train_loss": -3.242767810821533, "global_step": 649, "epoch": 3} {"train_loss": -3.027362108230591, "global_step": 650, "epoch": 3} {"train_loss": -2.7770280838012695, "global_step": 651, "epoch": 3} {"train_loss": -3.0901215076446533, "global_step": 652, "epoch": 3} {"train_loss": -2.8110756874084473, "global_step": 653, "epoch": 3} {"train_loss": -3.015901565551758, "global_step": 654, "epoch": 3} {"train_loss": -3.073847532272339, "global_step": 655, "epoch": 3} {"train_loss": -3.0047638416290283, "global_step": 656, "epoch": 3} {"train_loss": -2.916728973388672, "global_step": 657, "epoch": 3} {"train_loss": -2.9150185585021973, "global_step": 658, "epoch": 3} {"train_loss": -3.073759078979492, "global_step": 659, "epoch": 3} {"train_loss": -3.1827330589294434, "global_step": 660, "epoch": 3} {"train_loss": -3.358936309814453, "global_step": 661, "epoch": 3} {"train_loss": -3.374086618423462, "global_step": 662, "epoch": 3} {"train_loss": -3.1207621097564697, "global_step": 663, "epoch": 3} {"train_loss": -3.2672510147094727, "global_step": 664, "epoch": 3} {"train_loss": -3.1890618801116943, "global_step": 665, "epoch": 3} {"train_loss": -3.424450159072876, "global_step": 666, "epoch": 3} {"train_loss": -3.3445234298706055, "global_step": 667, "epoch": 3} {"train_loss": -3.1695313453674316, "global_step": 668, "epoch": 3} {"train_loss": -3.39066743850708, "global_step": 669, "epoch": 3} {"train_loss": -3.112700939178467, "global_step": 670, "epoch": 3} {"train_loss": -2.99201243690082, "global_step": 671, "epoch": 3, "val_loss": 363205.0} {"train_loss": -3.458651065826416, "global_step": 672, "epoch": 4} {"train_loss": -3.4564268589019775, "global_step": 673, "epoch": 4} {"train_loss": -3.359344482421875, "global_step": 674, "epoch": 4} {"train_loss": -2.949306011199951, "global_step": 675, "epoch": 4} {"train_loss": -3.1382687091827393, "global_step": 676, "epoch": 4} {"train_loss": -3.136481285095215, "global_step": 677, "epoch": 4} {"train_loss": -3.4459714889526367, "global_step": 678, "epoch": 4} {"train_loss": -3.408620834350586, "global_step": 679, "epoch": 4} {"train_loss": -3.124716281890869, "global_step": 680, "epoch": 4} {"train_loss": -3.1121268272399902, "global_step": 681, "epoch": 4} {"train_loss": -3.3470401763916016, "global_step": 682, "epoch": 4} {"train_loss": -3.3820462226867676, "global_step": 683, "epoch": 4} {"train_loss": -3.346364974975586, "global_step": 684, "epoch": 4} {"train_loss": -3.442190647125244, "global_step": 685, "epoch": 4} {"train_loss": -3.168097972869873, "global_step": 686, "epoch": 4} {"train_loss": -3.2644004821777344, "global_step": 687, "epoch": 4} {"train_loss": -2.9846811294555664, "global_step": 688, "epoch": 4} {"train_loss": -3.318624496459961, "global_step": 689, "epoch": 4} {"train_loss": -3.2489547729492188, "global_step": 690, "epoch": 4} {"train_loss": -3.294574499130249, "global_step": 691, "epoch": 4} {"train_loss": -3.173605442047119, "global_step": 692, "epoch": 4} {"train_loss": -3.1800315380096436, "global_step": 693, "epoch": 4} {"train_loss": -3.310641288757324, "global_step": 694, "epoch": 4} {"train_loss": -3.471156597137451, "global_step": 695, "epoch": 4} {"train_loss": -3.1578874588012695, "global_step": 696, "epoch": 4} {"train_loss": -3.246284008026123, "global_step": 697, "epoch": 4} {"train_loss": -3.563793897628784, "global_step": 698, "epoch": 4} {"train_loss": -3.259692907333374, "global_step": 699, "epoch": 4} {"train_loss": -3.0522029399871826, "global_step": 700, "epoch": 4} {"train_loss": -3.4683761596679688, "global_step": 701, "epoch": 4} {"train_loss": -3.044184923171997, "global_step": 702, "epoch": 4} {"train_loss": -3.229641914367676, "global_step": 703, "epoch": 4} {"train_loss": -3.129584789276123, "global_step": 704, "epoch": 4} {"train_loss": -3.068164825439453, "global_step": 705, "epoch": 4} {"train_loss": -3.262073040008545, "global_step": 706, "epoch": 4} {"train_loss": -3.294099807739258, "global_step": 707, "epoch": 4} {"train_loss": -3.2769389152526855, "global_step": 708, "epoch": 4} {"train_loss": -3.1537697315216064, "global_step": 709, "epoch": 4} {"train_loss": -3.229970932006836, "global_step": 710, "epoch": 4} {"train_loss": -2.9778857231140137, "global_step": 711, "epoch": 4} {"train_loss": -3.0502891540527344, "global_step": 712, "epoch": 4} {"train_loss": -2.913447380065918, "global_step": 713, "epoch": 4} {"train_loss": -2.8303027153015137, "global_step": 714, "epoch": 4} {"train_loss": -2.946258306503296, "global_step": 715, "epoch": 4} {"train_loss": -2.9060420989990234, "global_step": 716, "epoch": 4} {"train_loss": -3.1305551528930664, "global_step": 717, "epoch": 4} {"train_loss": -3.2946364879608154, "global_step": 718, "epoch": 4} {"train_loss": -3.0126454830169678, "global_step": 719, "epoch": 4} {"train_loss": -3.0865025520324707, "global_step": 720, "epoch": 4} {"train_loss": -3.219719171524048, "global_step": 721, "epoch": 4} {"train_loss": -3.082909107208252, "global_step": 722, "epoch": 4} {"train_loss": -2.990963935852051, "global_step": 723, "epoch": 4} {"train_loss": -3.090343713760376, "global_step": 724, "epoch": 4} {"train_loss": -3.0235352516174316, "global_step": 725, "epoch": 4} {"train_loss": -3.4291720390319824, "global_step": 726, "epoch": 4} {"train_loss": -2.9583678245544434, "global_step": 727, "epoch": 4} {"train_loss": -3.285034656524658, "global_step": 728, "epoch": 4} {"train_loss": -3.3032257556915283, "global_step": 729, "epoch": 4} {"train_loss": -3.003347873687744, "global_step": 730, "epoch": 4} {"train_loss": -3.3237831592559814, "global_step": 731, "epoch": 4} {"train_loss": -3.0316967964172363, "global_step": 732, "epoch": 4} {"train_loss": -3.0291595458984375, "global_step": 733, "epoch": 4} {"train_loss": -3.1034092903137207, "global_step": 734, "epoch": 4} {"train_loss": -3.142991065979004, "global_step": 735, "epoch": 4} {"train_loss": -3.307422161102295, "global_step": 736, "epoch": 4} {"train_loss": -3.4071199893951416, "global_step": 737, "epoch": 4} {"train_loss": -3.267335891723633, "global_step": 738, "epoch": 4} {"train_loss": -3.3194448947906494, "global_step": 739, "epoch": 4} {"train_loss": -3.09234619140625, "global_step": 740, "epoch": 4} {"train_loss": -3.235868215560913, "global_step": 741, "epoch": 4} {"train_loss": -3.385225296020508, "global_step": 742, "epoch": 4} {"train_loss": -3.256387233734131, "global_step": 743, "epoch": 4} {"train_loss": -3.369180917739868, "global_step": 744, "epoch": 4} {"train_loss": -3.340965747833252, "global_step": 745, "epoch": 4} {"train_loss": -3.347053050994873, "global_step": 746, "epoch": 4} {"train_loss": -3.404939651489258, "global_step": 747, "epoch": 4} {"train_loss": -3.419700860977173, "global_step": 748, "epoch": 4} {"train_loss": -3.5747036933898926, "global_step": 749, "epoch": 4} {"train_loss": -3.1358041763305664, "global_step": 750, "epoch": 4} {"train_loss": -3.398660182952881, "global_step": 751, "epoch": 4} {"train_loss": -3.189970016479492, "global_step": 752, "epoch": 4} {"train_loss": -2.9240660667419434, "global_step": 753, "epoch": 4} {"train_loss": -3.3742198944091797, "global_step": 754, "epoch": 4} {"train_loss": -3.339613914489746, "global_step": 755, "epoch": 4} {"train_loss": -3.177694797515869, "global_step": 756, "epoch": 4} {"train_loss": -3.279928684234619, "global_step": 757, "epoch": 4} {"train_loss": -3.356996536254883, "global_step": 758, "epoch": 4} {"train_loss": -3.532989025115967, "global_step": 759, "epoch": 4} {"train_loss": -3.2597718238830566, "global_step": 760, "epoch": 4} {"train_loss": -3.2956337928771973, "global_step": 761, "epoch": 4} {"train_loss": -2.8071341514587402, "global_step": 762, "epoch": 4} {"train_loss": -3.3384270668029785, "global_step": 763, "epoch": 4} {"train_loss": -3.322359800338745, "global_step": 764, "epoch": 4} {"train_loss": -3.090104579925537, "global_step": 765, "epoch": 4} {"train_loss": -3.2338318824768066, "global_step": 766, "epoch": 4} {"train_loss": -2.7931017875671387, "global_step": 767, "epoch": 4} {"train_loss": -3.1808104515075684, "global_step": 768, "epoch": 4} {"train_loss": -3.3825206756591797, "global_step": 769, "epoch": 4} {"train_loss": -3.466175079345703, "global_step": 770, "epoch": 4} {"train_loss": -3.5189738273620605, "global_step": 771, "epoch": 4} {"train_loss": -3.484158515930176, "global_step": 772, "epoch": 4} {"train_loss": -3.390928268432617, "global_step": 773, "epoch": 4} {"train_loss": -3.348257541656494, "global_step": 774, "epoch": 4} {"train_loss": -3.4677886962890625, "global_step": 775, "epoch": 4} {"train_loss": -3.4021925926208496, "global_step": 776, "epoch": 4} {"train_loss": -3.683522939682007, "global_step": 777, "epoch": 4} {"train_loss": -3.47031569480896, "global_step": 778, "epoch": 4} {"train_loss": -3.1085753440856934, "global_step": 779, "epoch": 4} {"train_loss": -3.30673885345459, "global_step": 780, "epoch": 4} {"train_loss": -3.2550466060638428, "global_step": 781, "epoch": 4} {"train_loss": -3.334798574447632, "global_step": 782, "epoch": 4} {"train_loss": -3.332432270050049, "global_step": 783, "epoch": 4} {"train_loss": -3.4177732467651367, "global_step": 784, "epoch": 4} {"train_loss": -3.221968650817871, "global_step": 785, "epoch": 4} {"train_loss": -3.3917970657348633, "global_step": 786, "epoch": 4} {"train_loss": -3.399200439453125, "global_step": 787, "epoch": 4} {"train_loss": -3.2361888885498047, "global_step": 788, "epoch": 4} {"train_loss": -3.3983445167541504, "global_step": 789, "epoch": 4} {"train_loss": -3.2721099853515625, "global_step": 790, "epoch": 4} {"train_loss": -3.4612340927124023, "global_step": 791, "epoch": 4} {"train_loss": -3.6207046508789062, "global_step": 792, "epoch": 4} {"train_loss": -3.181915521621704, "global_step": 793, "epoch": 4} {"train_loss": -3.3567399978637695, "global_step": 794, "epoch": 4} {"train_loss": -3.1864676475524902, "global_step": 795, "epoch": 4} {"train_loss": -3.2197530269622803, "global_step": 796, "epoch": 4} {"train_loss": -3.149223804473877, "global_step": 797, "epoch": 4} {"train_loss": -3.512144088745117, "global_step": 798, "epoch": 4} {"train_loss": -2.858201026916504, "global_step": 799, "epoch": 4} {"train_loss": -3.3035407066345215, "global_step": 800, "epoch": 4} {"train_loss": -3.2929165363311768, "global_step": 801, "epoch": 4} {"train_loss": -3.3673391342163086, "global_step": 802, "epoch": 4} {"train_loss": -3.564443349838257, "global_step": 803, "epoch": 4} {"train_loss": -3.516176700592041, "global_step": 804, "epoch": 4} {"train_loss": -3.2905454635620117, "global_step": 805, "epoch": 4} {"train_loss": -3.4895401000976562, "global_step": 806, "epoch": 4} {"train_loss": -3.178318500518799, "global_step": 807, "epoch": 4} {"train_loss": -3.4332151412963867, "global_step": 808, "epoch": 4} {"train_loss": -3.4575557708740234, "global_step": 809, "epoch": 4} {"train_loss": -3.168116331100464, "global_step": 810, "epoch": 4} {"train_loss": -3.3451318740844727, "global_step": 811, "epoch": 4} {"train_loss": -3.398591995239258, "global_step": 812, "epoch": 4} {"train_loss": -3.2508926391601562, "global_step": 813, "epoch": 4} {"train_loss": -3.6315560340881348, "global_step": 814, "epoch": 4} {"train_loss": -3.3888397216796875, "global_step": 815, "epoch": 4} {"train_loss": -3.303126335144043, "global_step": 816, "epoch": 4} {"train_loss": -3.361158847808838, "global_step": 817, "epoch": 4} {"train_loss": -3.109164237976074, "global_step": 818, "epoch": 4} {"train_loss": -3.486121654510498, "global_step": 819, "epoch": 4} {"train_loss": -3.4820022583007812, "global_step": 820, "epoch": 4} {"train_loss": -3.2649149894714355, "global_step": 821, "epoch": 4} {"train_loss": -3.2976274490356445, "global_step": 822, "epoch": 4} {"train_loss": -3.066558361053467, "global_step": 823, "epoch": 4} {"train_loss": -3.449214220046997, "global_step": 824, "epoch": 4} {"train_loss": -3.1519789695739746, "global_step": 825, "epoch": 4} {"train_loss": -3.511620283126831, "global_step": 826, "epoch": 4} {"train_loss": -3.4748120307922363, "global_step": 827, "epoch": 4} {"train_loss": -3.444343090057373, "global_step": 828, "epoch": 4} {"train_loss": -3.3881711959838867, "global_step": 829, "epoch": 4} {"train_loss": -3.1701793670654297, "global_step": 830, "epoch": 4} {"train_loss": -3.3513450622558594, "global_step": 831, "epoch": 4} {"train_loss": -3.226832866668701, "global_step": 832, "epoch": 4} {"train_loss": -3.5203537940979004, "global_step": 833, "epoch": 4} {"train_loss": -3.47857666015625, "global_step": 834, "epoch": 4} {"train_loss": -3.6700005531311035, "global_step": 835, "epoch": 4} {"train_loss": -3.64900803565979, "global_step": 836, "epoch": 4} {"train_loss": -3.1971943378448486, "global_step": 837, "epoch": 4} {"train_loss": -3.1898398399353027, "global_step": 838, "epoch": 4} {"train_loss": -3.275569893064953, "global_step": 839, "epoch": 4, "val_loss": 345144.1875} {"train_loss": -3.4618887901306152, "global_step": 840, "epoch": 5} {"train_loss": -3.4628639221191406, "global_step": 841, "epoch": 5} {"train_loss": -3.289128065109253, "global_step": 842, "epoch": 5} {"train_loss": -3.6900250911712646, "global_step": 843, "epoch": 5} {"train_loss": -3.4327588081359863, "global_step": 844, "epoch": 5} {"train_loss": -3.697441339492798, "global_step": 845, "epoch": 5} {"train_loss": -3.2849841117858887, "global_step": 846, "epoch": 5} {"train_loss": -3.711174488067627, "global_step": 847, "epoch": 5} {"train_loss": -3.4416773319244385, "global_step": 848, "epoch": 5} {"train_loss": -3.424652576446533, "global_step": 849, "epoch": 5} {"train_loss": -3.285458564758301, "global_step": 850, "epoch": 5} {"train_loss": -3.6612095832824707, "global_step": 851, "epoch": 5} {"train_loss": -3.623495578765869, "global_step": 852, "epoch": 5} {"train_loss": -3.2233877182006836, "global_step": 853, "epoch": 5} {"train_loss": -3.4090523719787598, "global_step": 854, "epoch": 5} {"train_loss": -3.3326315879821777, "global_step": 855, "epoch": 5} {"train_loss": -3.387454032897949, "global_step": 856, "epoch": 5} {"train_loss": -3.2856335639953613, "global_step": 857, "epoch": 5} {"train_loss": -3.3974826335906982, "global_step": 858, "epoch": 5} {"train_loss": -3.4751088619232178, "global_step": 859, "epoch": 5} {"train_loss": -3.5665745735168457, "global_step": 860, "epoch": 5} {"train_loss": -3.240781784057617, "global_step": 861, "epoch": 5} {"train_loss": -3.6468687057495117, "global_step": 862, "epoch": 5} {"train_loss": -2.915447950363159, "global_step": 863, "epoch": 5} {"train_loss": -3.524660110473633, "global_step": 864, "epoch": 5} {"train_loss": -3.028524398803711, "global_step": 865, "epoch": 5} {"train_loss": -3.2076573371887207, "global_step": 866, "epoch": 5} {"train_loss": -3.0901761054992676, "global_step": 867, "epoch": 5} {"train_loss": -3.2156286239624023, "global_step": 868, "epoch": 5} {"train_loss": -3.1438469886779785, "global_step": 869, "epoch": 5} {"train_loss": -3.115199327468872, "global_step": 870, "epoch": 5} {"train_loss": -2.8333168029785156, "global_step": 871, "epoch": 5} {"train_loss": -3.295804023742676, "global_step": 872, "epoch": 5} {"train_loss": -2.9221174716949463, "global_step": 873, "epoch": 5} {"train_loss": -3.259108066558838, "global_step": 874, "epoch": 5} {"train_loss": -2.9393787384033203, "global_step": 875, "epoch": 5} {"train_loss": -3.089219570159912, "global_step": 876, "epoch": 5} {"train_loss": -3.3077054023742676, "global_step": 877, "epoch": 5} {"train_loss": -3.3964552879333496, "global_step": 878, "epoch": 5} {"train_loss": -3.1701979637145996, "global_step": 879, "epoch": 5} {"train_loss": -3.2137067317962646, "global_step": 880, "epoch": 5} {"train_loss": -3.506352186203003, "global_step": 881, "epoch": 5} {"train_loss": -3.4923014640808105, "global_step": 882, "epoch": 5} {"train_loss": -3.2224855422973633, "global_step": 883, "epoch": 5} {"train_loss": -3.544672966003418, "global_step": 884, "epoch": 5} {"train_loss": -3.4084348678588867, "global_step": 885, "epoch": 5} {"train_loss": -3.6898670196533203, "global_step": 886, "epoch": 5} {"train_loss": -3.4787449836730957, "global_step": 887, "epoch": 5} {"train_loss": -3.4337775707244873, "global_step": 888, "epoch": 5} {"train_loss": -3.348020076751709, "global_step": 889, "epoch": 5} {"train_loss": -3.4108338356018066, "global_step": 890, "epoch": 5} {"train_loss": -3.580752372741699, "global_step": 891, "epoch": 5} {"train_loss": -3.5671255588531494, "global_step": 892, "epoch": 5} {"train_loss": -3.531163215637207, "global_step": 893, "epoch": 5} {"train_loss": -3.422699451446533, "global_step": 894, "epoch": 5} {"train_loss": -3.715951919555664, "global_step": 895, "epoch": 5} {"train_loss": -3.3170604705810547, "global_step": 896, "epoch": 5} {"train_loss": -3.694161891937256, "global_step": 897, "epoch": 5} {"train_loss": -3.2936978340148926, "global_step": 898, "epoch": 5} {"train_loss": -3.4295406341552734, "global_step": 899, "epoch": 5} {"train_loss": -3.5077414512634277, "global_step": 900, "epoch": 5} {"train_loss": -3.229052782058716, "global_step": 901, "epoch": 5} {"train_loss": -3.5520057678222656, "global_step": 902, "epoch": 5} {"train_loss": -3.3349108695983887, "global_step": 903, "epoch": 5} {"train_loss": -3.7656280994415283, "global_step": 904, "epoch": 5} {"train_loss": -3.6905081272125244, "global_step": 905, "epoch": 5} {"train_loss": -3.5387682914733887, "global_step": 906, "epoch": 5} {"train_loss": -3.229393482208252, "global_step": 907, "epoch": 5} {"train_loss": -3.374276638031006, "global_step": 908, "epoch": 5} {"train_loss": -3.527052879333496, "global_step": 909, "epoch": 5} {"train_loss": -3.4816713333129883, "global_step": 910, "epoch": 5} {"train_loss": -3.5845394134521484, "global_step": 911, "epoch": 5} {"train_loss": -3.5551862716674805, "global_step": 912, "epoch": 5} {"train_loss": -3.5425500869750977, "global_step": 913, "epoch": 5} {"train_loss": -3.5382168292999268, "global_step": 914, "epoch": 5} {"train_loss": -3.401312828063965, "global_step": 915, "epoch": 5} {"train_loss": -3.5186522006988525, "global_step": 916, "epoch": 5} {"train_loss": -3.3651137351989746, "global_step": 917, "epoch": 5} {"train_loss": -3.492600917816162, "global_step": 918, "epoch": 5} {"train_loss": -3.4779930114746094, "global_step": 919, "epoch": 5} {"train_loss": -3.6190690994262695, "global_step": 920, "epoch": 5} {"train_loss": -3.2825257778167725, "global_step": 921, "epoch": 5} {"train_loss": -3.248736619949341, "global_step": 922, "epoch": 5} {"train_loss": -3.3697118759155273, "global_step": 923, "epoch": 5} {"train_loss": -3.477470874786377, "global_step": 924, "epoch": 5} {"train_loss": -3.554053783416748, "global_step": 925, "epoch": 5} {"train_loss": -3.322577476501465, "global_step": 926, "epoch": 5} {"train_loss": -3.469841241836548, "global_step": 927, "epoch": 5} {"train_loss": -3.612312078475952, "global_step": 928, "epoch": 5} {"train_loss": -3.732146739959717, "global_step": 929, "epoch": 5} {"train_loss": -3.5232319831848145, "global_step": 930, "epoch": 5} {"train_loss": -3.2854456901550293, "global_step": 931, "epoch": 5} {"train_loss": -3.281980514526367, "global_step": 932, "epoch": 5} {"train_loss": -3.548795223236084, "global_step": 933, "epoch": 5} {"train_loss": -3.300961494445801, "global_step": 934, "epoch": 5} {"train_loss": -3.2734906673431396, "global_step": 935, "epoch": 5} {"train_loss": -3.4942264556884766, "global_step": 936, "epoch": 5} {"train_loss": -3.599307060241699, "global_step": 937, "epoch": 5} {"train_loss": -3.363931655883789, "global_step": 938, "epoch": 5} {"train_loss": -3.508450746536255, "global_step": 939, "epoch": 5} {"train_loss": -3.4990878105163574, "global_step": 940, "epoch": 5} {"train_loss": -3.406561851501465, "global_step": 941, "epoch": 5} {"train_loss": -3.5631871223449707, "global_step": 942, "epoch": 5} {"train_loss": -3.6627700328826904, "global_step": 943, "epoch": 5} {"train_loss": -3.426637649536133, "global_step": 944, "epoch": 5} {"train_loss": -3.82585072517395, "global_step": 945, "epoch": 5} {"train_loss": -3.383993625640869, "global_step": 946, "epoch": 5} {"train_loss": -3.7643277645111084, "global_step": 947, "epoch": 5} {"train_loss": -3.363917350769043, "global_step": 948, "epoch": 5} {"train_loss": -3.2883150577545166, "global_step": 949, "epoch": 5} {"train_loss": -3.3980154991149902, "global_step": 950, "epoch": 5} {"train_loss": -3.6603198051452637, "global_step": 951, "epoch": 5} {"train_loss": -3.412848472595215, "global_step": 952, "epoch": 5} {"train_loss": -3.622995615005493, "global_step": 953, "epoch": 5} {"train_loss": -3.6570658683776855, "global_step": 954, "epoch": 5} {"train_loss": -3.6474733352661133, "global_step": 955, "epoch": 5} {"train_loss": -3.684171199798584, "global_step": 956, "epoch": 5} {"train_loss": -3.4036619663238525, "global_step": 957, "epoch": 5} {"train_loss": -3.6085548400878906, "global_step": 958, "epoch": 5} {"train_loss": -3.4982099533081055, "global_step": 959, "epoch": 5} {"train_loss": -3.6738975048065186, "global_step": 960, "epoch": 5} {"train_loss": -3.252333164215088, "global_step": 961, "epoch": 5} {"train_loss": -3.644542932510376, "global_step": 962, "epoch": 5} {"train_loss": -3.774264335632324, "global_step": 963, "epoch": 5} {"train_loss": -3.2613704204559326, "global_step": 964, "epoch": 5} {"train_loss": -3.4633398056030273, "global_step": 965, "epoch": 5} {"train_loss": -3.649202346801758, "global_step": 966, "epoch": 5} {"train_loss": -3.800063133239746, "global_step": 967, "epoch": 5} {"train_loss": -3.240485668182373, "global_step": 968, "epoch": 5} {"train_loss": -3.3648247718811035, "global_step": 969, "epoch": 5} {"train_loss": -3.677638530731201, "global_step": 970, "epoch": 5} {"train_loss": -3.2811272144317627, "global_step": 971, "epoch": 5} {"train_loss": -3.6203088760375977, "global_step": 972, "epoch": 5} {"train_loss": -3.318455934524536, "global_step": 973, "epoch": 5} {"train_loss": -3.6518795490264893, "global_step": 974, "epoch": 5} {"train_loss": -3.730142593383789, "global_step": 975, "epoch": 5} {"train_loss": -3.6354596614837646, "global_step": 976, "epoch": 5} {"train_loss": -3.4358158111572266, "global_step": 977, "epoch": 5} {"train_loss": -3.164081573486328, "global_step": 978, "epoch": 5} {"train_loss": -3.585944175720215, "global_step": 979, "epoch": 5} {"train_loss": -3.598423957824707, "global_step": 980, "epoch": 5} {"train_loss": -3.2905995845794678, "global_step": 981, "epoch": 5} {"train_loss": -3.253932476043701, "global_step": 982, "epoch": 5} {"train_loss": -3.5109925270080566, "global_step": 983, "epoch": 5} {"train_loss": -3.4244778156280518, "global_step": 984, "epoch": 5} {"train_loss": -3.1643853187561035, "global_step": 985, "epoch": 5} {"train_loss": -3.5866641998291016, "global_step": 986, "epoch": 5} {"train_loss": -3.3211536407470703, "global_step": 987, "epoch": 5} {"train_loss": -3.419933319091797, "global_step": 988, "epoch": 5} {"train_loss": -3.529900550842285, "global_step": 989, "epoch": 5} {"train_loss": -3.151251792907715, "global_step": 990, "epoch": 5} {"train_loss": -3.353148937225342, "global_step": 991, "epoch": 5} {"train_loss": -3.0321133136749268, "global_step": 992, "epoch": 5} {"train_loss": -3.2896201610565186, "global_step": 993, "epoch": 5} {"train_loss": -3.3612794876098633, "global_step": 994, "epoch": 5} {"train_loss": -3.350975751876831, "global_step": 995, "epoch": 5} {"train_loss": -3.3045661449432373, "global_step": 996, "epoch": 5} {"train_loss": -3.353095531463623, "global_step": 997, "epoch": 5} {"train_loss": -3.5227136611938477, "global_step": 998, "epoch": 5} {"train_loss": -3.2422375679016113, "global_step": 999, "epoch": 5} {"train_loss": -3.556522846221924, "global_step": 1000, "epoch": 5} {"train_loss": -3.5079097747802734, "global_step": 1001, "epoch": 5} {"train_loss": -3.4548778533935547, "global_step": 1002, "epoch": 5} {"train_loss": -3.713099956512451, "global_step": 1003, "epoch": 5} {"train_loss": -3.5781638622283936, "global_step": 1004, "epoch": 5} {"train_loss": -3.600226879119873, "global_step": 1005, "epoch": 5} {"train_loss": -3.3627383708953857, "global_step": 1006, "epoch": 5} {"train_loss": -3.4353959418478466, "global_step": 1007, "epoch": 5, "val_loss": 322691.21875, "train_action_mse_error": 189.7544403076172} {"train_loss": -3.4286351203918457, "global_step": 1008, "epoch": 6} {"train_loss": -3.6688175201416016, "global_step": 1009, "epoch": 6} {"train_loss": -3.4362926483154297, "global_step": 1010, "epoch": 6} {"train_loss": -3.6843183040618896, "global_step": 1011, "epoch": 6} {"train_loss": -3.3274760246276855, "global_step": 1012, "epoch": 6} {"train_loss": -3.6135072708129883, "global_step": 1013, "epoch": 6} {"train_loss": -3.6922574043273926, "global_step": 1014, "epoch": 6} {"train_loss": -3.1272850036621094, "global_step": 1015, "epoch": 6} {"train_loss": -3.716749668121338, "global_step": 1016, "epoch": 6} {"train_loss": -3.5061147212982178, "global_step": 1017, "epoch": 6} {"train_loss": -3.6463241577148438, "global_step": 1018, "epoch": 6} {"train_loss": -3.6940879821777344, "global_step": 1019, "epoch": 6} {"train_loss": -3.6419363021850586, "global_step": 1020, "epoch": 6} {"train_loss": -3.811919689178467, "global_step": 1021, "epoch": 6} {"train_loss": -3.537548065185547, "global_step": 1022, "epoch": 6} {"train_loss": -3.613229513168335, "global_step": 1023, "epoch": 6} {"train_loss": -3.584923267364502, "global_step": 1024, "epoch": 6} {"train_loss": -3.582237482070923, "global_step": 1025, "epoch": 6} {"train_loss": -3.5371253490448, "global_step": 1026, "epoch": 6} {"train_loss": -3.4563543796539307, "global_step": 1027, "epoch": 6} {"train_loss": -3.283498525619507, "global_step": 1028, "epoch": 6} {"train_loss": -3.0416507720947266, "global_step": 1029, "epoch": 6} {"train_loss": -3.599522590637207, "global_step": 1030, "epoch": 6} {"train_loss": -3.4339871406555176, "global_step": 1031, "epoch": 6} {"train_loss": -3.3972504138946533, "global_step": 1032, "epoch": 6} {"train_loss": -3.6292591094970703, "global_step": 1033, "epoch": 6} {"train_loss": -3.6404054164886475, "global_step": 1034, "epoch": 6} {"train_loss": -3.334893226623535, "global_step": 1035, "epoch": 6} {"train_loss": -3.584784507751465, "global_step": 1036, "epoch": 6} {"train_loss": -3.448042392730713, "global_step": 1037, "epoch": 6} {"train_loss": -3.310652494430542, "global_step": 1038, "epoch": 6} {"train_loss": -3.4715776443481445, "global_step": 1039, "epoch": 6} {"train_loss": -3.540572166442871, "global_step": 1040, "epoch": 6} {"train_loss": -3.8011083602905273, "global_step": 1041, "epoch": 6} {"train_loss": -3.5199220180511475, "global_step": 1042, "epoch": 6} {"train_loss": -3.301123857498169, "global_step": 1043, "epoch": 6} {"train_loss": -3.5898773670196533, "global_step": 1044, "epoch": 6} {"train_loss": -3.451005458831787, "global_step": 1045, "epoch": 6} {"train_loss": -3.4826855659484863, "global_step": 1046, "epoch": 6} {"train_loss": -3.441148281097412, "global_step": 1047, "epoch": 6} {"train_loss": -3.2623021602630615, "global_step": 1048, "epoch": 6} {"train_loss": -3.426100730895996, "global_step": 1049, "epoch": 6} {"train_loss": -3.363354206085205, "global_step": 1050, "epoch": 6} {"train_loss": -3.5528929233551025, "global_step": 1051, "epoch": 6} {"train_loss": -3.4375967979431152, "global_step": 1052, "epoch": 6} {"train_loss": -3.324659585952759, "global_step": 1053, "epoch": 6} {"train_loss": -3.5824384689331055, "global_step": 1054, "epoch": 6} {"train_loss": -3.154557704925537, "global_step": 1055, "epoch": 6} {"train_loss": -3.8953495025634766, "global_step": 1056, "epoch": 6} {"train_loss": -3.576291799545288, "global_step": 1057, "epoch": 6} {"train_loss": -3.6653342247009277, "global_step": 1058, "epoch": 6} {"train_loss": -3.4761974811553955, "global_step": 1059, "epoch": 6} {"train_loss": -3.6412289142608643, "global_step": 1060, "epoch": 6} {"train_loss": -3.553898334503174, "global_step": 1061, "epoch": 6} {"train_loss": -3.6659698486328125, "global_step": 1062, "epoch": 6} {"train_loss": -3.445608615875244, "global_step": 1063, "epoch": 6} {"train_loss": -3.611262559890747, "global_step": 1064, "epoch": 6} {"train_loss": -3.571025848388672, "global_step": 1065, "epoch": 6} {"train_loss": -3.502103805541992, "global_step": 1066, "epoch": 6} {"train_loss": -3.4945201873779297, "global_step": 1067, "epoch": 6} {"train_loss": -3.798933506011963, "global_step": 1068, "epoch": 6} {"train_loss": -3.503631114959717, "global_step": 1069, "epoch": 6} {"train_loss": -3.6170504093170166, "global_step": 1070, "epoch": 6} {"train_loss": -3.7100377082824707, "global_step": 1071, "epoch": 6} {"train_loss": -3.63089919090271, "global_step": 1072, "epoch": 6} {"train_loss": -3.6829614639282227, "global_step": 1073, "epoch": 6} {"train_loss": -3.7640719413757324, "global_step": 1074, "epoch": 6} {"train_loss": -3.8270466327667236, "global_step": 1075, "epoch": 6} {"train_loss": -3.891697883605957, "global_step": 1076, "epoch": 6} {"train_loss": -3.7476272583007812, "global_step": 1077, "epoch": 6} {"train_loss": -3.602867603302002, "global_step": 1078, "epoch": 6} {"train_loss": -3.624541759490967, "global_step": 1079, "epoch": 6} {"train_loss": -3.615795612335205, "global_step": 1080, "epoch": 6} {"train_loss": -3.773183584213257, "global_step": 1081, "epoch": 6} {"train_loss": -3.574157476425171, "global_step": 1082, "epoch": 6} {"train_loss": -3.6103415489196777, "global_step": 1083, "epoch": 6} {"train_loss": -3.4077420234680176, "global_step": 1084, "epoch": 6} {"train_loss": -3.5247135162353516, "global_step": 1085, "epoch": 6} {"train_loss": -3.3597192764282227, "global_step": 1086, "epoch": 6} {"train_loss": -3.876758098602295, "global_step": 1087, "epoch": 6} {"train_loss": -3.782081127166748, "global_step": 1088, "epoch": 6} {"train_loss": -3.6998796463012695, "global_step": 1089, "epoch": 6} {"train_loss": -3.5812225341796875, "global_step": 1090, "epoch": 6} {"train_loss": -3.6544718742370605, "global_step": 1091, "epoch": 6} {"train_loss": -3.79058837890625, "global_step": 1092, "epoch": 6} {"train_loss": -3.8040060997009277, "global_step": 1093, "epoch": 6} {"train_loss": -3.682091236114502, "global_step": 1094, "epoch": 6} {"train_loss": -3.6030116081237793, "global_step": 1095, "epoch": 6} {"train_loss": -3.6611037254333496, "global_step": 1096, "epoch": 6} {"train_loss": -3.3858509063720703, "global_step": 1097, "epoch": 6} {"train_loss": -3.7914466857910156, "global_step": 1098, "epoch": 6} {"train_loss": -3.624101161956787, "global_step": 1099, "epoch": 6} {"train_loss": -3.8159000873565674, "global_step": 1100, "epoch": 6} {"train_loss": -3.4905431270599365, "global_step": 1101, "epoch": 6} {"train_loss": -3.941070556640625, "global_step": 1102, "epoch": 6} {"train_loss": -3.6377604007720947, "global_step": 1103, "epoch": 6} {"train_loss": -3.6722636222839355, "global_step": 1104, "epoch": 6} {"train_loss": -3.664900779724121, "global_step": 1105, "epoch": 6} {"train_loss": -3.400826930999756, "global_step": 1106, "epoch": 6} {"train_loss": -3.6268815994262695, "global_step": 1107, "epoch": 6} {"train_loss": -3.7698469161987305, "global_step": 1108, "epoch": 6} {"train_loss": -3.5586845874786377, "global_step": 1109, "epoch": 6} {"train_loss": -3.7091455459594727, "global_step": 1110, "epoch": 6} {"train_loss": -3.6909751892089844, "global_step": 1111, "epoch": 6} {"train_loss": -3.5449891090393066, "global_step": 1112, "epoch": 6} {"train_loss": -3.6264898777008057, "global_step": 1113, "epoch": 6} {"train_loss": -3.630486011505127, "global_step": 1114, "epoch": 6} {"train_loss": -3.7151198387145996, "global_step": 1115, "epoch": 6} {"train_loss": -3.4564123153686523, "global_step": 1116, "epoch": 6} {"train_loss": -3.5166521072387695, "global_step": 1117, "epoch": 6} {"train_loss": -3.792387008666992, "global_step": 1118, "epoch": 6} {"train_loss": -3.8348426818847656, "global_step": 1119, "epoch": 6} {"train_loss": -3.573838472366333, "global_step": 1120, "epoch": 6} {"train_loss": -3.783752918243408, "global_step": 1121, "epoch": 6} {"train_loss": -3.5464837551116943, "global_step": 1122, "epoch": 6} {"train_loss": -3.636794090270996, "global_step": 1123, "epoch": 6} {"train_loss": -3.4741108417510986, "global_step": 1124, "epoch": 6} {"train_loss": -3.592984676361084, "global_step": 1125, "epoch": 6} {"train_loss": -3.714315176010132, "global_step": 1126, "epoch": 6} {"train_loss": -3.807023048400879, "global_step": 1127, "epoch": 6} {"train_loss": -3.419003486633301, "global_step": 1128, "epoch": 6} {"train_loss": -3.860517978668213, "global_step": 1129, "epoch": 6} {"train_loss": -3.5050172805786133, "global_step": 1130, "epoch": 6} {"train_loss": -3.89915132522583, "global_step": 1131, "epoch": 6} {"train_loss": -3.4214673042297363, "global_step": 1132, "epoch": 6} {"train_loss": -3.6628968715667725, "global_step": 1133, "epoch": 6} {"train_loss": -3.6244242191314697, "global_step": 1134, "epoch": 6} {"train_loss": -3.8591437339782715, "global_step": 1135, "epoch": 6} {"train_loss": -3.5599489212036133, "global_step": 1136, "epoch": 6} {"train_loss": -3.725950241088867, "global_step": 1137, "epoch": 6} {"train_loss": -3.871220111846924, "global_step": 1138, "epoch": 6} {"train_loss": -3.789764881134033, "global_step": 1139, "epoch": 6} {"train_loss": -3.6471455097198486, "global_step": 1140, "epoch": 6} {"train_loss": -3.775696277618408, "global_step": 1141, "epoch": 6} {"train_loss": -3.6260738372802734, "global_step": 1142, "epoch": 6} {"train_loss": -3.558171272277832, "global_step": 1143, "epoch": 6} {"train_loss": -3.8639984130859375, "global_step": 1144, "epoch": 6} {"train_loss": -3.7154719829559326, "global_step": 1145, "epoch": 6} {"train_loss": -3.6456074714660645, "global_step": 1146, "epoch": 6} {"train_loss": -3.6973371505737305, "global_step": 1147, "epoch": 6} {"train_loss": -3.437265396118164, "global_step": 1148, "epoch": 6} {"train_loss": -3.898414373397827, "global_step": 1149, "epoch": 6} {"train_loss": -3.8453598022460938, "global_step": 1150, "epoch": 6} {"train_loss": -3.7955613136291504, "global_step": 1151, "epoch": 6} {"train_loss": -3.6498494148254395, "global_step": 1152, "epoch": 6} {"train_loss": -3.765993118286133, "global_step": 1153, "epoch": 6} {"train_loss": -3.648491621017456, "global_step": 1154, "epoch": 6} {"train_loss": -3.9961533546447754, "global_step": 1155, "epoch": 6} {"train_loss": -3.607900619506836, "global_step": 1156, "epoch": 6} {"train_loss": -3.8107218742370605, "global_step": 1157, "epoch": 6} {"train_loss": -3.663027763366699, "global_step": 1158, "epoch": 6} {"train_loss": -3.919450521469116, "global_step": 1159, "epoch": 6} {"train_loss": -3.7518341541290283, "global_step": 1160, "epoch": 6} {"train_loss": -3.669522285461426, "global_step": 1161, "epoch": 6} {"train_loss": -3.6299774646759033, "global_step": 1162, "epoch": 6} {"train_loss": -3.8817384243011475, "global_step": 1163, "epoch": 6} {"train_loss": -3.6965432167053223, "global_step": 1164, "epoch": 6} {"train_loss": -3.9755001068115234, "global_step": 1165, "epoch": 6} {"train_loss": -3.7863268852233887, "global_step": 1166, "epoch": 6} {"train_loss": -3.6840531826019287, "global_step": 1167, "epoch": 6} {"train_loss": -3.8497350215911865, "global_step": 1168, "epoch": 6} {"train_loss": -3.7974352836608887, "global_step": 1169, "epoch": 6} {"train_loss": -3.7786307334899902, "global_step": 1170, "epoch": 6} {"train_loss": -3.5561492443084717, "global_step": 1171, "epoch": 6} {"train_loss": -3.7806766033172607, "global_step": 1172, "epoch": 6} {"train_loss": -3.677406072616577, "global_step": 1173, "epoch": 6} {"train_loss": -3.623777151107788, "global_step": 1174, "epoch": 6} {"train_loss": -3.6250287223429907, "global_step": 1175, "epoch": 6, "val_loss": 261951.171875} {"train_loss": -3.8526992797851562, "global_step": 1176, "epoch": 7} {"train_loss": -3.836611270904541, "global_step": 1177, "epoch": 7} {"train_loss": -3.552149772644043, "global_step": 1178, "epoch": 7} {"train_loss": -3.3520185947418213, "global_step": 1179, "epoch": 7} {"train_loss": -4.04616641998291, "global_step": 1180, "epoch": 7} {"train_loss": -3.3672423362731934, "global_step": 1181, "epoch": 7} {"train_loss": -3.8873822689056396, "global_step": 1182, "epoch": 7} {"train_loss": -3.6523923873901367, "global_step": 1183, "epoch": 7} {"train_loss": -3.7983779907226562, "global_step": 1184, "epoch": 7} {"train_loss": -3.8421554565429688, "global_step": 1185, "epoch": 7} {"train_loss": -3.836026906967163, "global_step": 1186, "epoch": 7} {"train_loss": -4.084791660308838, "global_step": 1187, "epoch": 7} {"train_loss": -3.871978759765625, "global_step": 1188, "epoch": 7} {"train_loss": -3.7356815338134766, "global_step": 1189, "epoch": 7} {"train_loss": -3.7380592823028564, "global_step": 1190, "epoch": 7} {"train_loss": -3.792670726776123, "global_step": 1191, "epoch": 7} {"train_loss": -3.893324851989746, "global_step": 1192, "epoch": 7} {"train_loss": -3.775115489959717, "global_step": 1193, "epoch": 7} {"train_loss": -3.732595205307007, "global_step": 1194, "epoch": 7} {"train_loss": -3.611067295074463, "global_step": 1195, "epoch": 7} {"train_loss": -3.712099075317383, "global_step": 1196, "epoch": 7} {"train_loss": -3.610776901245117, "global_step": 1197, "epoch": 7} {"train_loss": -3.8575429916381836, "global_step": 1198, "epoch": 7} {"train_loss": -3.700035572052002, "global_step": 1199, "epoch": 7} {"train_loss": -3.542994976043701, "global_step": 1200, "epoch": 7} {"train_loss": -3.8574302196502686, "global_step": 1201, "epoch": 7} {"train_loss": -3.510225772857666, "global_step": 1202, "epoch": 7} {"train_loss": -3.614818572998047, "global_step": 1203, "epoch": 7} {"train_loss": -3.3641538619995117, "global_step": 1204, "epoch": 7} {"train_loss": -3.645874500274658, "global_step": 1205, "epoch": 7} {"train_loss": -3.7916665077209473, "global_step": 1206, "epoch": 7} {"train_loss": -3.4052484035491943, "global_step": 1207, "epoch": 7} {"train_loss": -3.7115225791931152, "global_step": 1208, "epoch": 7} {"train_loss": -3.878941059112549, "global_step": 1209, "epoch": 7} {"train_loss": -3.7337303161621094, "global_step": 1210, "epoch": 7} {"train_loss": -3.6014509201049805, "global_step": 1211, "epoch": 7} {"train_loss": -3.9543802738189697, "global_step": 1212, "epoch": 7} {"train_loss": -3.6790781021118164, "global_step": 1213, "epoch": 7} {"train_loss": -3.7364096641540527, "global_step": 1214, "epoch": 7} {"train_loss": -3.8403122425079346, "global_step": 1215, "epoch": 7} {"train_loss": -3.726029396057129, "global_step": 1216, "epoch": 7} {"train_loss": -3.604503631591797, "global_step": 1217, "epoch": 7} {"train_loss": -3.726381540298462, "global_step": 1218, "epoch": 7} {"train_loss": -3.5937929153442383, "global_step": 1219, "epoch": 7} {"train_loss": -3.4363183975219727, "global_step": 1220, "epoch": 7} {"train_loss": -3.5782928466796875, "global_step": 1221, "epoch": 7} {"train_loss": -3.620821475982666, "global_step": 1222, "epoch": 7} {"train_loss": -3.8069591522216797, "global_step": 1223, "epoch": 7} {"train_loss": -3.813720226287842, "global_step": 1224, "epoch": 7} {"train_loss": -3.7402524948120117, "global_step": 1225, "epoch": 7} {"train_loss": -3.839620351791382, "global_step": 1226, "epoch": 7} {"train_loss": -3.867403030395508, "global_step": 1227, "epoch": 7} {"train_loss": -3.9901676177978516, "global_step": 1228, "epoch": 7} {"train_loss": -3.6673216819763184, "global_step": 1229, "epoch": 7} {"train_loss": -3.981898784637451, "global_step": 1230, "epoch": 7} {"train_loss": -3.4958486557006836, "global_step": 1231, "epoch": 7} {"train_loss": -3.7480387687683105, "global_step": 1232, "epoch": 7} {"train_loss": -3.329942464828491, "global_step": 1233, "epoch": 7} {"train_loss": -3.492234468460083, "global_step": 1234, "epoch": 7} {"train_loss": -3.3963091373443604, "global_step": 1235, "epoch": 7} {"train_loss": -3.6944422721862793, "global_step": 1236, "epoch": 7} {"train_loss": -3.776132583618164, "global_step": 1237, "epoch": 7} {"train_loss": -3.69907283782959, "global_step": 1238, "epoch": 7} {"train_loss": -3.707648754119873, "global_step": 1239, "epoch": 7} {"train_loss": -3.6710212230682373, "global_step": 1240, "epoch": 7} {"train_loss": -3.7523441314697266, "global_step": 1241, "epoch": 7} {"train_loss": -3.5483932495117188, "global_step": 1242, "epoch": 7} {"train_loss": -3.632460832595825, "global_step": 1243, "epoch": 7} {"train_loss": -3.4840145111083984, "global_step": 1244, "epoch": 7} {"train_loss": -3.5053768157958984, "global_step": 1245, "epoch": 7} {"train_loss": -3.7401323318481445, "global_step": 1246, "epoch": 7} {"train_loss": -3.857846975326538, "global_step": 1247, "epoch": 7} {"train_loss": -3.6740822792053223, "global_step": 1248, "epoch": 7} {"train_loss": -3.8170275688171387, "global_step": 1249, "epoch": 7} {"train_loss": -3.3991293907165527, "global_step": 1250, "epoch": 7} {"train_loss": -3.5493454933166504, "global_step": 1251, "epoch": 7} {"train_loss": -3.714719295501709, "global_step": 1252, "epoch": 7} {"train_loss": -3.6918933391571045, "global_step": 1253, "epoch": 7} {"train_loss": -3.5882766246795654, "global_step": 1254, "epoch": 7} {"train_loss": -3.4780476093292236, "global_step": 1255, "epoch": 7} {"train_loss": -3.7084689140319824, "global_step": 1256, "epoch": 7} {"train_loss": -3.519794464111328, "global_step": 1257, "epoch": 7} {"train_loss": -3.7634165287017822, "global_step": 1258, "epoch": 7} {"train_loss": -3.8678340911865234, "global_step": 1259, "epoch": 7} {"train_loss": -3.5307064056396484, "global_step": 1260, "epoch": 7} {"train_loss": -3.696894645690918, "global_step": 1261, "epoch": 7} {"train_loss": -3.466566562652588, "global_step": 1262, "epoch": 7} {"train_loss": -3.803553581237793, "global_step": 1263, "epoch": 7} {"train_loss": -3.5155818462371826, "global_step": 1264, "epoch": 7} {"train_loss": -3.705251932144165, "global_step": 1265, "epoch": 7} {"train_loss": -3.625272750854492, "global_step": 1266, "epoch": 7} {"train_loss": -3.6437957286834717, "global_step": 1267, "epoch": 7} {"train_loss": -3.651780605316162, "global_step": 1268, "epoch": 7} {"train_loss": -3.66050386428833, "global_step": 1269, "epoch": 7} {"train_loss": -3.4613733291625977, "global_step": 1270, "epoch": 7} {"train_loss": -3.793311834335327, "global_step": 1271, "epoch": 7} {"train_loss": -3.5819692611694336, "global_step": 1272, "epoch": 7} {"train_loss": -3.6510682106018066, "global_step": 1273, "epoch": 7} {"train_loss": -3.8154845237731934, "global_step": 1274, "epoch": 7} {"train_loss": -3.6619086265563965, "global_step": 1275, "epoch": 7} {"train_loss": -3.934701919555664, "global_step": 1276, "epoch": 7} {"train_loss": -3.5555965900421143, "global_step": 1277, "epoch": 7} {"train_loss": -3.8974099159240723, "global_step": 1278, "epoch": 7} {"train_loss": -3.780008316040039, "global_step": 1279, "epoch": 7} {"train_loss": -3.7376441955566406, "global_step": 1280, "epoch": 7} {"train_loss": -3.5126829147338867, "global_step": 1281, "epoch": 7} {"train_loss": -3.9282479286193848, "global_step": 1282, "epoch": 7} {"train_loss": -3.575819253921509, "global_step": 1283, "epoch": 7} {"train_loss": -3.8139970302581787, "global_step": 1284, "epoch": 7} {"train_loss": -3.621124744415283, "global_step": 1285, "epoch": 7} {"train_loss": -3.8444814682006836, "global_step": 1286, "epoch": 7} {"train_loss": -4.124446868896484, "global_step": 1287, "epoch": 7} {"train_loss": -3.9921798706054688, "global_step": 1288, "epoch": 7} {"train_loss": -3.971116304397583, "global_step": 1289, "epoch": 7} {"train_loss": -3.584188938140869, "global_step": 1290, "epoch": 7} {"train_loss": -3.718498706817627, "global_step": 1291, "epoch": 7} {"train_loss": -4.047595024108887, "global_step": 1292, "epoch": 7} {"train_loss": -3.8975117206573486, "global_step": 1293, "epoch": 7} {"train_loss": -3.6985225677490234, "global_step": 1294, "epoch": 7} {"train_loss": -3.959589958190918, "global_step": 1295, "epoch": 7} {"train_loss": -3.455986261367798, "global_step": 1296, "epoch": 7} {"train_loss": -3.689983367919922, "global_step": 1297, "epoch": 7} {"train_loss": -3.780996322631836, "global_step": 1298, "epoch": 7} {"train_loss": -3.7568721771240234, "global_step": 1299, "epoch": 7} {"train_loss": -3.8511080741882324, "global_step": 1300, "epoch": 7} {"train_loss": -3.799503803253174, "global_step": 1301, "epoch": 7} {"train_loss": -3.92626953125, "global_step": 1302, "epoch": 7} {"train_loss": -3.659349203109741, "global_step": 1303, "epoch": 7} {"train_loss": -3.5984694957733154, "global_step": 1304, "epoch": 7} {"train_loss": -3.4762511253356934, "global_step": 1305, "epoch": 7} {"train_loss": -3.4851083755493164, "global_step": 1306, "epoch": 7} {"train_loss": -3.6416573524475098, "global_step": 1307, "epoch": 7} {"train_loss": -3.239450693130493, "global_step": 1308, "epoch": 7} {"train_loss": -3.503520965576172, "global_step": 1309, "epoch": 7} {"train_loss": -3.5857512950897217, "global_step": 1310, "epoch": 7} {"train_loss": -3.247995615005493, "global_step": 1311, "epoch": 7} {"train_loss": -3.511106014251709, "global_step": 1312, "epoch": 7} {"train_loss": -3.8097918033599854, "global_step": 1313, "epoch": 7} {"train_loss": -3.183166980743408, "global_step": 1314, "epoch": 7} {"train_loss": -3.74888277053833, "global_step": 1315, "epoch": 7} {"train_loss": -3.7500979900360107, "global_step": 1316, "epoch": 7} {"train_loss": -3.4014244079589844, "global_step": 1317, "epoch": 7} {"train_loss": -3.6227567195892334, "global_step": 1318, "epoch": 7} {"train_loss": -3.613352060317993, "global_step": 1319, "epoch": 7} {"train_loss": -3.724632740020752, "global_step": 1320, "epoch": 7} {"train_loss": -3.9654762744903564, "global_step": 1321, "epoch": 7} {"train_loss": -3.6873581409454346, "global_step": 1322, "epoch": 7} {"train_loss": -3.841271162033081, "global_step": 1323, "epoch": 7} {"train_loss": -3.7656030654907227, "global_step": 1324, "epoch": 7} {"train_loss": -3.794109344482422, "global_step": 1325, "epoch": 7} {"train_loss": -3.690657138824463, "global_step": 1326, "epoch": 7} {"train_loss": -3.5761969089508057, "global_step": 1327, "epoch": 7} {"train_loss": -3.5566020011901855, "global_step": 1328, "epoch": 7} {"train_loss": -3.9462785720825195, "global_step": 1329, "epoch": 7} {"train_loss": -3.738412618637085, "global_step": 1330, "epoch": 7} {"train_loss": -3.55306339263916, "global_step": 1331, "epoch": 7} {"train_loss": -3.8735251426696777, "global_step": 1332, "epoch": 7} {"train_loss": -3.5932610034942627, "global_step": 1333, "epoch": 7} {"train_loss": -3.8217391967773438, "global_step": 1334, "epoch": 7} {"train_loss": -3.589107036590576, "global_step": 1335, "epoch": 7} {"train_loss": -3.727811574935913, "global_step": 1336, "epoch": 7} {"train_loss": -3.811157703399658, "global_step": 1337, "epoch": 7} {"train_loss": -3.783405065536499, "global_step": 1338, "epoch": 7} {"train_loss": -3.994737148284912, "global_step": 1339, "epoch": 7} {"train_loss": -3.849921226501465, "global_step": 1340, "epoch": 7} {"train_loss": -3.7154622077941895, "global_step": 1341, "epoch": 7} {"train_loss": -3.7681925296783447, "global_step": 1342, "epoch": 7} {"train_loss": -3.7000716825326285, "global_step": 1343, "epoch": 7, "val_loss": 266691.59375} {"train_loss": -3.4598312377929688, "global_step": 1344, "epoch": 8} {"train_loss": -3.7926318645477295, "global_step": 1345, "epoch": 8} {"train_loss": -3.536482572555542, "global_step": 1346, "epoch": 8} {"train_loss": -3.9386980533599854, "global_step": 1347, "epoch": 8} {"train_loss": -3.743163585662842, "global_step": 1348, "epoch": 8} {"train_loss": -3.5474486351013184, "global_step": 1349, "epoch": 8} {"train_loss": -3.494474172592163, "global_step": 1350, "epoch": 8} {"train_loss": -3.673863410949707, "global_step": 1351, "epoch": 8} {"train_loss": -3.7116289138793945, "global_step": 1352, "epoch": 8} {"train_loss": -3.60806941986084, "global_step": 1353, "epoch": 8} {"train_loss": -3.6036806106567383, "global_step": 1354, "epoch": 8} {"train_loss": -3.6344900131225586, "global_step": 1355, "epoch": 8} {"train_loss": -3.5720911026000977, "global_step": 1356, "epoch": 8} {"train_loss": -3.5289573669433594, "global_step": 1357, "epoch": 8} {"train_loss": -3.737776279449463, "global_step": 1358, "epoch": 8} {"train_loss": -3.7179737091064453, "global_step": 1359, "epoch": 8} {"train_loss": -3.780569553375244, "global_step": 1360, "epoch": 8} {"train_loss": -3.749490737915039, "global_step": 1361, "epoch": 8} {"train_loss": -3.599125385284424, "global_step": 1362, "epoch": 8} {"train_loss": -3.7075700759887695, "global_step": 1363, "epoch": 8} {"train_loss": -3.774381399154663, "global_step": 1364, "epoch": 8} {"train_loss": -3.7393758296966553, "global_step": 1365, "epoch": 8} {"train_loss": -3.952239990234375, "global_step": 1366, "epoch": 8} {"train_loss": -3.766573905944824, "global_step": 1367, "epoch": 8} {"train_loss": -3.6657848358154297, "global_step": 1368, "epoch": 8} {"train_loss": -3.9350290298461914, "global_step": 1369, "epoch": 8} {"train_loss": -3.824763774871826, "global_step": 1370, "epoch": 8} {"train_loss": -3.960176706314087, "global_step": 1371, "epoch": 8} {"train_loss": -4.003488540649414, "global_step": 1372, "epoch": 8} {"train_loss": -3.785144329071045, "global_step": 1373, "epoch": 8} {"train_loss": -3.883237838745117, "global_step": 1374, "epoch": 8} {"train_loss": -3.763505697250366, "global_step": 1375, "epoch": 8} {"train_loss": -3.8480520248413086, "global_step": 1376, "epoch": 8} {"train_loss": -3.8200201988220215, "global_step": 1377, "epoch": 8} {"train_loss": -3.980416774749756, "global_step": 1378, "epoch": 8} {"train_loss": -3.5094940662384033, "global_step": 1379, "epoch": 8} {"train_loss": -3.865281105041504, "global_step": 1380, "epoch": 8} {"train_loss": -3.928800582885742, "global_step": 1381, "epoch": 8} {"train_loss": -3.7052369117736816, "global_step": 1382, "epoch": 8} {"train_loss": -3.6978399753570557, "global_step": 1383, "epoch": 8} {"train_loss": -3.959782838821411, "global_step": 1384, "epoch": 8} {"train_loss": -3.5692543983459473, "global_step": 1385, "epoch": 8} {"train_loss": -4.088478088378906, "global_step": 1386, "epoch": 8} {"train_loss": -3.775698661804199, "global_step": 1387, "epoch": 8} {"train_loss": -3.9287667274475098, "global_step": 1388, "epoch": 8} {"train_loss": -3.8075449466705322, "global_step": 1389, "epoch": 8} {"train_loss": -3.8137123584747314, "global_step": 1390, "epoch": 8} {"train_loss": -3.548311710357666, "global_step": 1391, "epoch": 8} {"train_loss": -3.9065465927124023, "global_step": 1392, "epoch": 8} {"train_loss": -3.804901361465454, "global_step": 1393, "epoch": 8} {"train_loss": -3.9824109077453613, "global_step": 1394, "epoch": 8} {"train_loss": -3.9343926906585693, "global_step": 1395, "epoch": 8} {"train_loss": -3.8002796173095703, "global_step": 1396, "epoch": 8} {"train_loss": -3.782560348510742, "global_step": 1397, "epoch": 8} {"train_loss": -3.973153591156006, "global_step": 1398, "epoch": 8} {"train_loss": -3.762495517730713, "global_step": 1399, "epoch": 8} {"train_loss": -3.9734342098236084, "global_step": 1400, "epoch": 8} {"train_loss": -3.702740430831909, "global_step": 1401, "epoch": 8} {"train_loss": -3.7500813007354736, "global_step": 1402, "epoch": 8} {"train_loss": -3.9852452278137207, "global_step": 1403, "epoch": 8} {"train_loss": -3.5215649604797363, "global_step": 1404, "epoch": 8} {"train_loss": -3.853229522705078, "global_step": 1405, "epoch": 8} {"train_loss": -3.7373337745666504, "global_step": 1406, "epoch": 8} {"train_loss": -3.8290414810180664, "global_step": 1407, "epoch": 8} {"train_loss": -3.7378740310668945, "global_step": 1408, "epoch": 8} {"train_loss": -3.6983280181884766, "global_step": 1409, "epoch": 8} {"train_loss": -3.726069450378418, "global_step": 1410, "epoch": 8} {"train_loss": -3.5162296295166016, "global_step": 1411, "epoch": 8} {"train_loss": -4.066926002502441, "global_step": 1412, "epoch": 8} {"train_loss": -3.6360645294189453, "global_step": 1413, "epoch": 8} {"train_loss": -3.792571544647217, "global_step": 1414, "epoch": 8} {"train_loss": -3.407501459121704, "global_step": 1415, "epoch": 8} {"train_loss": -3.6700639724731445, "global_step": 1416, "epoch": 8} {"train_loss": -3.875185489654541, "global_step": 1417, "epoch": 8} {"train_loss": -3.6607325077056885, "global_step": 1418, "epoch": 8} {"train_loss": -3.7531020641326904, "global_step": 1419, "epoch": 8} {"train_loss": -3.569570779800415, "global_step": 1420, "epoch": 8} {"train_loss": -3.697735548019409, "global_step": 1421, "epoch": 8} {"train_loss": -3.869692325592041, "global_step": 1422, "epoch": 8} {"train_loss": -3.549619197845459, "global_step": 1423, "epoch": 8} {"train_loss": -3.9206929206848145, "global_step": 1424, "epoch": 8} {"train_loss": -3.484440326690674, "global_step": 1425, "epoch": 8} {"train_loss": -3.5616891384124756, "global_step": 1426, "epoch": 8} {"train_loss": -3.5339460372924805, "global_step": 1427, "epoch": 8} {"train_loss": -3.3604519367218018, "global_step": 1428, "epoch": 8} {"train_loss": -3.6423349380493164, "global_step": 1429, "epoch": 8} {"train_loss": -3.5928468704223633, "global_step": 1430, "epoch": 8} {"train_loss": -3.6086199283599854, "global_step": 1431, "epoch": 8} {"train_loss": -3.807389736175537, "global_step": 1432, "epoch": 8} {"train_loss": -3.73350191116333, "global_step": 1433, "epoch": 8} {"train_loss": -3.771289825439453, "global_step": 1434, "epoch": 8} {"train_loss": -3.9689180850982666, "global_step": 1435, "epoch": 8} {"train_loss": -3.6954708099365234, "global_step": 1436, "epoch": 8} {"train_loss": -3.793022632598877, "global_step": 1437, "epoch": 8} {"train_loss": -3.9961538314819336, "global_step": 1438, "epoch": 8} {"train_loss": -3.703707695007324, "global_step": 1439, "epoch": 8} {"train_loss": -3.7667722702026367, "global_step": 1440, "epoch": 8} {"train_loss": -3.795215129852295, "global_step": 1441, "epoch": 8} {"train_loss": -3.589853286743164, "global_step": 1442, "epoch": 8} {"train_loss": -3.8053088188171387, "global_step": 1443, "epoch": 8} {"train_loss": -3.8004963397979736, "global_step": 1444, "epoch": 8} {"train_loss": -3.7170658111572266, "global_step": 1445, "epoch": 8} {"train_loss": -3.9218056201934814, "global_step": 1446, "epoch": 8} {"train_loss": -3.9684574604034424, "global_step": 1447, "epoch": 8} {"train_loss": -4.173877716064453, "global_step": 1448, "epoch": 8} {"train_loss": -3.7421741485595703, "global_step": 1449, "epoch": 8} {"train_loss": -3.8609628677368164, "global_step": 1450, "epoch": 8} {"train_loss": -4.072291374206543, "global_step": 1451, "epoch": 8} {"train_loss": -3.913527727127075, "global_step": 1452, "epoch": 8} {"train_loss": -4.033753395080566, "global_step": 1453, "epoch": 8} {"train_loss": -3.961669445037842, "global_step": 1454, "epoch": 8} {"train_loss": -4.033736228942871, "global_step": 1455, "epoch": 8} {"train_loss": -3.749525547027588, "global_step": 1456, "epoch": 8} {"train_loss": -3.9080276489257812, "global_step": 1457, "epoch": 8} {"train_loss": -3.988734006881714, "global_step": 1458, "epoch": 8} {"train_loss": -3.9553120136260986, "global_step": 1459, "epoch": 8} {"train_loss": -3.9683890342712402, "global_step": 1460, "epoch": 8} {"train_loss": -4.0547871589660645, "global_step": 1461, "epoch": 8} {"train_loss": -3.7499871253967285, "global_step": 1462, "epoch": 8} {"train_loss": -3.890869379043579, "global_step": 1463, "epoch": 8} {"train_loss": -3.837286949157715, "global_step": 1464, "epoch": 8} {"train_loss": -3.9054625034332275, "global_step": 1465, "epoch": 8} {"train_loss": -3.983182430267334, "global_step": 1466, "epoch": 8} {"train_loss": -3.8860111236572266, "global_step": 1467, "epoch": 8} {"train_loss": -4.006711959838867, "global_step": 1468, "epoch": 8} {"train_loss": -3.9635703563690186, "global_step": 1469, "epoch": 8} {"train_loss": -3.773707389831543, "global_step": 1470, "epoch": 8} {"train_loss": -4.21852970123291, "global_step": 1471, "epoch": 8} {"train_loss": -3.7722604274749756, "global_step": 1472, "epoch": 8} {"train_loss": -4.201207160949707, "global_step": 1473, "epoch": 8} {"train_loss": -3.9556732177734375, "global_step": 1474, "epoch": 8} {"train_loss": -3.8016538619995117, "global_step": 1475, "epoch": 8} {"train_loss": -4.005791187286377, "global_step": 1476, "epoch": 8} {"train_loss": -4.103182792663574, "global_step": 1477, "epoch": 8} {"train_loss": -3.9107139110565186, "global_step": 1478, "epoch": 8} {"train_loss": -3.6771931648254395, "global_step": 1479, "epoch": 8} {"train_loss": -3.4278430938720703, "global_step": 1480, "epoch": 8} {"train_loss": -3.8758392333984375, "global_step": 1481, "epoch": 8} {"train_loss": -3.6065783500671387, "global_step": 1482, "epoch": 8} {"train_loss": -3.824594497680664, "global_step": 1483, "epoch": 8} {"train_loss": -3.7987260818481445, "global_step": 1484, "epoch": 8} {"train_loss": -3.5695226192474365, "global_step": 1485, "epoch": 8} {"train_loss": -3.9286909103393555, "global_step": 1486, "epoch": 8} {"train_loss": -3.877272844314575, "global_step": 1487, "epoch": 8} {"train_loss": -3.7899906635284424, "global_step": 1488, "epoch": 8} {"train_loss": -3.8563952445983887, "global_step": 1489, "epoch": 8} {"train_loss": -3.631890296936035, "global_step": 1490, "epoch": 8} {"train_loss": -3.890346050262451, "global_step": 1491, "epoch": 8} {"train_loss": -3.786726474761963, "global_step": 1492, "epoch": 8} {"train_loss": -3.9660375118255615, "global_step": 1493, "epoch": 8} {"train_loss": -4.071378231048584, "global_step": 1494, "epoch": 8} {"train_loss": -3.88893461227417, "global_step": 1495, "epoch": 8} {"train_loss": -4.057715892791748, "global_step": 1496, "epoch": 8} {"train_loss": -4.017439842224121, "global_step": 1497, "epoch": 8} {"train_loss": -4.0149760246276855, "global_step": 1498, "epoch": 8} {"train_loss": -4.059401512145996, "global_step": 1499, "epoch": 8} {"train_loss": -4.01694393157959, "global_step": 1500, "epoch": 8} {"train_loss": -4.085827350616455, "global_step": 1501, "epoch": 8} {"train_loss": -3.9653637409210205, "global_step": 1502, "epoch": 8} {"train_loss": -4.047327041625977, "global_step": 1503, "epoch": 8} {"train_loss": -3.9098317623138428, "global_step": 1504, "epoch": 8} {"train_loss": -3.8257265090942383, "global_step": 1505, "epoch": 8} {"train_loss": -3.661372661590576, "global_step": 1506, "epoch": 8} {"train_loss": -3.9543473720550537, "global_step": 1507, "epoch": 8} {"train_loss": -3.6167545318603516, "global_step": 1508, "epoch": 8} {"train_loss": -3.99479603767395, "global_step": 1509, "epoch": 8} {"train_loss": -3.8381175994873047, "global_step": 1510, "epoch": 8} {"train_loss": -3.8094485018934523, "global_step": 1511, "epoch": 8, "val_loss": 269568.71875} {"train_loss": -3.807527542114258, "global_step": 1512, "epoch": 9} {"train_loss": -4.096004486083984, "global_step": 1513, "epoch": 9} {"train_loss": -4.056596279144287, "global_step": 1514, "epoch": 9} {"train_loss": -3.6579151153564453, "global_step": 1515, "epoch": 9} {"train_loss": -3.801020860671997, "global_step": 1516, "epoch": 9} {"train_loss": -4.0325517654418945, "global_step": 1517, "epoch": 9} {"train_loss": -3.9114303588867188, "global_step": 1518, "epoch": 9} {"train_loss": -3.642819404602051, "global_step": 1519, "epoch": 9} {"train_loss": -3.6314964294433594, "global_step": 1520, "epoch": 9} {"train_loss": -3.816072463989258, "global_step": 1521, "epoch": 9} {"train_loss": -3.8955373764038086, "global_step": 1522, "epoch": 9} {"train_loss": -3.9352316856384277, "global_step": 1523, "epoch": 9} {"train_loss": -3.876573324203491, "global_step": 1524, "epoch": 9} {"train_loss": -3.8488264083862305, "global_step": 1525, "epoch": 9} {"train_loss": -3.8694517612457275, "global_step": 1526, "epoch": 9} {"train_loss": -3.7841529846191406, "global_step": 1527, "epoch": 9} {"train_loss": -3.9593191146850586, "global_step": 1528, "epoch": 9} {"train_loss": -3.8730382919311523, "global_step": 1529, "epoch": 9} {"train_loss": -3.8910887241363525, "global_step": 1530, "epoch": 9} {"train_loss": -3.7067222595214844, "global_step": 1531, "epoch": 9} {"train_loss": -4.098026275634766, "global_step": 1532, "epoch": 9} {"train_loss": -4.009756565093994, "global_step": 1533, "epoch": 9} {"train_loss": -3.821566581726074, "global_step": 1534, "epoch": 9} {"train_loss": -3.7983808517456055, "global_step": 1535, "epoch": 9} {"train_loss": -3.876537799835205, "global_step": 1536, "epoch": 9} {"train_loss": -4.0250444412231445, "global_step": 1537, "epoch": 9} {"train_loss": -3.8329949378967285, "global_step": 1538, "epoch": 9} {"train_loss": -4.3778533935546875, "global_step": 1539, "epoch": 9} {"train_loss": -3.590026617050171, "global_step": 1540, "epoch": 9} {"train_loss": -3.8084940910339355, "global_step": 1541, "epoch": 9} {"train_loss": -3.723048210144043, "global_step": 1542, "epoch": 9} {"train_loss": -3.920102596282959, "global_step": 1543, "epoch": 9} {"train_loss": -3.9430079460144043, "global_step": 1544, "epoch": 9} {"train_loss": -3.8162689208984375, "global_step": 1545, "epoch": 9} {"train_loss": -3.9545271396636963, "global_step": 1546, "epoch": 9} {"train_loss": -3.6286613941192627, "global_step": 1547, "epoch": 9} {"train_loss": -4.0335893630981445, "global_step": 1548, "epoch": 9} {"train_loss": -3.9298744201660156, "global_step": 1549, "epoch": 9} {"train_loss": -3.839737892150879, "global_step": 1550, "epoch": 9} {"train_loss": -4.182364463806152, "global_step": 1551, "epoch": 9} {"train_loss": -4.0864152908325195, "global_step": 1552, "epoch": 9} {"train_loss": -3.9261813163757324, "global_step": 1553, "epoch": 9} {"train_loss": -4.138123512268066, "global_step": 1554, "epoch": 9} {"train_loss": -3.999986171722412, "global_step": 1555, "epoch": 9} {"train_loss": -4.093181610107422, "global_step": 1556, "epoch": 9} {"train_loss": -3.827096939086914, "global_step": 1557, "epoch": 9} {"train_loss": -4.169790267944336, "global_step": 1558, "epoch": 9} {"train_loss": -3.831965446472168, "global_step": 1559, "epoch": 9} {"train_loss": -4.2776899337768555, "global_step": 1560, "epoch": 9} {"train_loss": -4.23174524307251, "global_step": 1561, "epoch": 9} {"train_loss": -4.141733169555664, "global_step": 1562, "epoch": 9} {"train_loss": -3.995224952697754, "global_step": 1563, "epoch": 9} {"train_loss": -3.677985429763794, "global_step": 1564, "epoch": 9} {"train_loss": -3.9707436561584473, "global_step": 1565, "epoch": 9} {"train_loss": -4.007447242736816, "global_step": 1566, "epoch": 9} {"train_loss": -3.961336851119995, "global_step": 1567, "epoch": 9} {"train_loss": -4.034258842468262, "global_step": 1568, "epoch": 9} {"train_loss": -4.187648773193359, "global_step": 1569, "epoch": 9} {"train_loss": -3.704869270324707, "global_step": 1570, "epoch": 9} {"train_loss": -3.935048818588257, "global_step": 1571, "epoch": 9} {"train_loss": -3.571442127227783, "global_step": 1572, "epoch": 9} {"train_loss": -4.09410285949707, "global_step": 1573, "epoch": 9} {"train_loss": -3.9010753631591797, "global_step": 1574, "epoch": 9} {"train_loss": -3.5036609172821045, "global_step": 1575, "epoch": 9} {"train_loss": -3.7633793354034424, "global_step": 1576, "epoch": 9} {"train_loss": -3.890568256378174, "global_step": 1577, "epoch": 9} {"train_loss": -3.9664387702941895, "global_step": 1578, "epoch": 9} {"train_loss": -4.182929039001465, "global_step": 1579, "epoch": 9} {"train_loss": -3.9549777507781982, "global_step": 1580, "epoch": 9} {"train_loss": -3.788336992263794, "global_step": 1581, "epoch": 9} {"train_loss": -3.8075356483459473, "global_step": 1582, "epoch": 9} {"train_loss": -4.230879306793213, "global_step": 1583, "epoch": 9} {"train_loss": -4.1385016441345215, "global_step": 1584, "epoch": 9} {"train_loss": -3.9878880977630615, "global_step": 1585, "epoch": 9} {"train_loss": -3.9517688751220703, "global_step": 1586, "epoch": 9} {"train_loss": -3.747892379760742, "global_step": 1587, "epoch": 9} {"train_loss": -4.222344875335693, "global_step": 1588, "epoch": 9} {"train_loss": -3.929220199584961, "global_step": 1589, "epoch": 9} {"train_loss": -4.062360763549805, "global_step": 1590, "epoch": 9} {"train_loss": -4.208169937133789, "global_step": 1591, "epoch": 9} {"train_loss": -3.820160150527954, "global_step": 1592, "epoch": 9} {"train_loss": -3.8568477630615234, "global_step": 1593, "epoch": 9} {"train_loss": -4.027219772338867, "global_step": 1594, "epoch": 9} {"train_loss": -3.5209903717041016, "global_step": 1595, "epoch": 9} {"train_loss": -4.134140491485596, "global_step": 1596, "epoch": 9} {"train_loss": -4.014251708984375, "global_step": 1597, "epoch": 9} {"train_loss": -3.886580228805542, "global_step": 1598, "epoch": 9} {"train_loss": -3.85983943939209, "global_step": 1599, "epoch": 9} {"train_loss": -3.9216575622558594, "global_step": 1600, "epoch": 9} {"train_loss": -3.925083637237549, "global_step": 1601, "epoch": 9} {"train_loss": -3.5199368000030518, "global_step": 1602, "epoch": 9} {"train_loss": -4.060105323791504, "global_step": 1603, "epoch": 9} {"train_loss": -3.679149627685547, "global_step": 1604, "epoch": 9} {"train_loss": -3.7892045974731445, "global_step": 1605, "epoch": 9} {"train_loss": -3.444084644317627, "global_step": 1606, "epoch": 9} {"train_loss": -3.7681851387023926, "global_step": 1607, "epoch": 9} {"train_loss": -3.675936222076416, "global_step": 1608, "epoch": 9} {"train_loss": -3.9237277507781982, "global_step": 1609, "epoch": 9} {"train_loss": -3.5893993377685547, "global_step": 1610, "epoch": 9} {"train_loss": -3.909475326538086, "global_step": 1611, "epoch": 9} {"train_loss": -3.7112321853637695, "global_step": 1612, "epoch": 9} {"train_loss": -3.723310947418213, "global_step": 1613, "epoch": 9} {"train_loss": -3.9820284843444824, "global_step": 1614, "epoch": 9} {"train_loss": -3.6973891258239746, "global_step": 1615, "epoch": 9} {"train_loss": -3.9006505012512207, "global_step": 1616, "epoch": 9} {"train_loss": -3.858591079711914, "global_step": 1617, "epoch": 9} {"train_loss": -3.7675085067749023, "global_step": 1618, "epoch": 9} {"train_loss": -4.0270843505859375, "global_step": 1619, "epoch": 9} {"train_loss": -3.916835308074951, "global_step": 1620, "epoch": 9} {"train_loss": -4.077744007110596, "global_step": 1621, "epoch": 9} {"train_loss": -4.154749870300293, "global_step": 1622, "epoch": 9} {"train_loss": -4.1311845779418945, "global_step": 1623, "epoch": 9} {"train_loss": -3.875027894973755, "global_step": 1624, "epoch": 9} {"train_loss": -3.792703628540039, "global_step": 1625, "epoch": 9} {"train_loss": -3.915111780166626, "global_step": 1626, "epoch": 9} {"train_loss": -3.8052706718444824, "global_step": 1627, "epoch": 9} {"train_loss": -4.070924282073975, "global_step": 1628, "epoch": 9} {"train_loss": -3.755260944366455, "global_step": 1629, "epoch": 9} {"train_loss": -3.8463759422302246, "global_step": 1630, "epoch": 9} {"train_loss": -3.650529384613037, "global_step": 1631, "epoch": 9} {"train_loss": -3.971583843231201, "global_step": 1632, "epoch": 9} {"train_loss": -3.7763915061950684, "global_step": 1633, "epoch": 9} {"train_loss": -4.036785125732422, "global_step": 1634, "epoch": 9} {"train_loss": -4.0071330070495605, "global_step": 1635, "epoch": 9} {"train_loss": -4.109978675842285, "global_step": 1636, "epoch": 9} {"train_loss": -4.088686943054199, "global_step": 1637, "epoch": 9} {"train_loss": -3.7816145420074463, "global_step": 1638, "epoch": 9} {"train_loss": -3.714731454849243, "global_step": 1639, "epoch": 9} {"train_loss": -3.707638740539551, "global_step": 1640, "epoch": 9} {"train_loss": -4.233180046081543, "global_step": 1641, "epoch": 9} {"train_loss": -3.663165807723999, "global_step": 1642, "epoch": 9} {"train_loss": -4.110103130340576, "global_step": 1643, "epoch": 9} {"train_loss": -3.72592830657959, "global_step": 1644, "epoch": 9} {"train_loss": -3.844789505004883, "global_step": 1645, "epoch": 9} {"train_loss": -4.018572807312012, "global_step": 1646, "epoch": 9} {"train_loss": -3.9736557006835938, "global_step": 1647, "epoch": 9} {"train_loss": -3.789792060852051, "global_step": 1648, "epoch": 9} {"train_loss": -3.916806936264038, "global_step": 1649, "epoch": 9} {"train_loss": -4.074453353881836, "global_step": 1650, "epoch": 9} {"train_loss": -3.839158058166504, "global_step": 1651, "epoch": 9} {"train_loss": -3.9452500343322754, "global_step": 1652, "epoch": 9} {"train_loss": -3.791886806488037, "global_step": 1653, "epoch": 9} {"train_loss": -3.826702356338501, "global_step": 1654, "epoch": 9} {"train_loss": -4.003726005554199, "global_step": 1655, "epoch": 9} {"train_loss": -4.021979331970215, "global_step": 1656, "epoch": 9} {"train_loss": -3.7974610328674316, "global_step": 1657, "epoch": 9} {"train_loss": -3.8787407875061035, "global_step": 1658, "epoch": 9} {"train_loss": -4.014848709106445, "global_step": 1659, "epoch": 9} {"train_loss": -3.8518359661102295, "global_step": 1660, "epoch": 9} {"train_loss": -3.8708443641662598, "global_step": 1661, "epoch": 9} {"train_loss": -4.045660018920898, "global_step": 1662, "epoch": 9} {"train_loss": -4.268479347229004, "global_step": 1663, "epoch": 9} {"train_loss": -4.187398433685303, "global_step": 1664, "epoch": 9} {"train_loss": -3.960254192352295, "global_step": 1665, "epoch": 9} {"train_loss": -3.949321746826172, "global_step": 1666, "epoch": 9} {"train_loss": -4.019431114196777, "global_step": 1667, "epoch": 9} {"train_loss": -3.9118809700012207, "global_step": 1668, "epoch": 9} {"train_loss": -3.794241189956665, "global_step": 1669, "epoch": 9} {"train_loss": -3.861736297607422, "global_step": 1670, "epoch": 9} {"train_loss": -4.006294250488281, "global_step": 1671, "epoch": 9} {"train_loss": -3.9714090824127197, "global_step": 1672, "epoch": 9} {"train_loss": -3.950183391571045, "global_step": 1673, "epoch": 9} {"train_loss": -4.033970832824707, "global_step": 1674, "epoch": 9} {"train_loss": -3.8258326053619385, "global_step": 1675, "epoch": 9} {"train_loss": -3.7646143436431885, "global_step": 1676, "epoch": 9} {"train_loss": -3.7169108390808105, "global_step": 1677, "epoch": 9} {"train_loss": -3.91646671295166, "global_step": 1678, "epoch": 9} {"train_loss": -3.907073382820402, "global_step": 1679, "epoch": 9, "val_loss": 256764.890625} {"train_loss": -3.9151620864868164, "global_step": 1680, "epoch": 10} {"train_loss": -3.8542985916137695, "global_step": 1681, "epoch": 10} {"train_loss": -3.7502901554107666, "global_step": 1682, "epoch": 10} {"train_loss": -3.7889180183410645, "global_step": 1683, "epoch": 10} {"train_loss": -3.9129467010498047, "global_step": 1684, "epoch": 10} {"train_loss": -4.018871307373047, "global_step": 1685, "epoch": 10} {"train_loss": -4.230281829833984, "global_step": 1686, "epoch": 10} {"train_loss": -4.064146518707275, "global_step": 1687, "epoch": 10} {"train_loss": -3.9259567260742188, "global_step": 1688, "epoch": 10} {"train_loss": -3.914614677429199, "global_step": 1689, "epoch": 10} {"train_loss": -3.7178289890289307, "global_step": 1690, "epoch": 10} {"train_loss": -4.055736541748047, "global_step": 1691, "epoch": 10} {"train_loss": -4.011395454406738, "global_step": 1692, "epoch": 10} {"train_loss": -4.07987642288208, "global_step": 1693, "epoch": 10} {"train_loss": -4.19687557220459, "global_step": 1694, "epoch": 10} {"train_loss": -4.182513236999512, "global_step": 1695, "epoch": 10} {"train_loss": -4.146365165710449, "global_step": 1696, "epoch": 10} {"train_loss": -4.137470245361328, "global_step": 1697, "epoch": 10} {"train_loss": -4.164743423461914, "global_step": 1698, "epoch": 10} {"train_loss": -3.7966837882995605, "global_step": 1699, "epoch": 10} {"train_loss": -4.111848831176758, "global_step": 1700, "epoch": 10} {"train_loss": -4.019828796386719, "global_step": 1701, "epoch": 10} {"train_loss": -3.948306083679199, "global_step": 1702, "epoch": 10} {"train_loss": -3.962568759918213, "global_step": 1703, "epoch": 10} {"train_loss": -3.892972946166992, "global_step": 1704, "epoch": 10} {"train_loss": -4.00141716003418, "global_step": 1705, "epoch": 10} {"train_loss": -3.8501224517822266, "global_step": 1706, "epoch": 10} {"train_loss": -3.636951446533203, "global_step": 1707, "epoch": 10} {"train_loss": -3.877427101135254, "global_step": 1708, "epoch": 10} {"train_loss": -3.51259446144104, "global_step": 1709, "epoch": 10} {"train_loss": -3.7651102542877197, "global_step": 1710, "epoch": 10} {"train_loss": -3.9147164821624756, "global_step": 1711, "epoch": 10} {"train_loss": -3.905991315841675, "global_step": 1712, "epoch": 10} {"train_loss": -4.029265403747559, "global_step": 1713, "epoch": 10} {"train_loss": -4.10060977935791, "global_step": 1714, "epoch": 10} {"train_loss": -3.6961803436279297, "global_step": 1715, "epoch": 10} {"train_loss": -3.8558459281921387, "global_step": 1716, "epoch": 10} {"train_loss": -3.5296802520751953, "global_step": 1717, "epoch": 10} {"train_loss": -3.607666015625, "global_step": 1718, "epoch": 10} {"train_loss": -3.9264333248138428, "global_step": 1719, "epoch": 10} {"train_loss": -3.689415216445923, "global_step": 1720, "epoch": 10} {"train_loss": -3.7220523357391357, "global_step": 1721, "epoch": 10} {"train_loss": -3.9088664054870605, "global_step": 1722, "epoch": 10} {"train_loss": -3.904670476913452, "global_step": 1723, "epoch": 10} {"train_loss": -3.867905378341675, "global_step": 1724, "epoch": 10} {"train_loss": -3.8320634365081787, "global_step": 1725, "epoch": 10} {"train_loss": -4.089685916900635, "global_step": 1726, "epoch": 10} {"train_loss": -4.124944686889648, "global_step": 1727, "epoch": 10} {"train_loss": -3.788526773452759, "global_step": 1728, "epoch": 10} {"train_loss": -4.061182975769043, "global_step": 1729, "epoch": 10} {"train_loss": -3.9718990325927734, "global_step": 1730, "epoch": 10} {"train_loss": -3.705212116241455, "global_step": 1731, "epoch": 10} {"train_loss": -3.9361748695373535, "global_step": 1732, "epoch": 10} {"train_loss": -4.21625280380249, "global_step": 1733, "epoch": 10} {"train_loss": -4.036036491394043, "global_step": 1734, "epoch": 10} {"train_loss": -3.9389524459838867, "global_step": 1735, "epoch": 10} {"train_loss": -4.083911418914795, "global_step": 1736, "epoch": 10} {"train_loss": -4.299724578857422, "global_step": 1737, "epoch": 10} {"train_loss": -3.876465320587158, "global_step": 1738, "epoch": 10} {"train_loss": -3.622293472290039, "global_step": 1739, "epoch": 10} {"train_loss": -3.9917523860931396, "global_step": 1740, "epoch": 10} {"train_loss": -4.179668426513672, "global_step": 1741, "epoch": 10} {"train_loss": -4.168524742126465, "global_step": 1742, "epoch": 10} {"train_loss": -3.97471022605896, "global_step": 1743, "epoch": 10} {"train_loss": -3.6325175762176514, "global_step": 1744, "epoch": 10} {"train_loss": -3.8575217723846436, "global_step": 1745, "epoch": 10} {"train_loss": -3.7431235313415527, "global_step": 1746, "epoch": 10} {"train_loss": -3.7601280212402344, "global_step": 1747, "epoch": 10} {"train_loss": -3.545102119445801, "global_step": 1748, "epoch": 10} {"train_loss": -4.07609748840332, "global_step": 1749, "epoch": 10} {"train_loss": -3.6011505126953125, "global_step": 1750, "epoch": 10} {"train_loss": -3.861936092376709, "global_step": 1751, "epoch": 10} {"train_loss": -4.0781145095825195, "global_step": 1752, "epoch": 10} {"train_loss": -3.769473075866699, "global_step": 1753, "epoch": 10} {"train_loss": -3.6864113807678223, "global_step": 1754, "epoch": 10} {"train_loss": -4.027631759643555, "global_step": 1755, "epoch": 10} {"train_loss": -3.8582870960235596, "global_step": 1756, "epoch": 10} {"train_loss": -4.009984970092773, "global_step": 1757, "epoch": 10} {"train_loss": -4.038364410400391, "global_step": 1758, "epoch": 10} {"train_loss": -4.026357173919678, "global_step": 1759, "epoch": 10} {"train_loss": -3.776017427444458, "global_step": 1760, "epoch": 10} {"train_loss": -3.9669950008392334, "global_step": 1761, "epoch": 10} {"train_loss": -3.9169507026672363, "global_step": 1762, "epoch": 10} {"train_loss": -3.858438491821289, "global_step": 1763, "epoch": 10} {"train_loss": -4.0215277671813965, "global_step": 1764, "epoch": 10} {"train_loss": -4.0826263427734375, "global_step": 1765, "epoch": 10} {"train_loss": -4.075349807739258, "global_step": 1766, "epoch": 10} {"train_loss": -3.9706175327301025, "global_step": 1767, "epoch": 10} {"train_loss": -4.079729080200195, "global_step": 1768, "epoch": 10} {"train_loss": -4.07767915725708, "global_step": 1769, "epoch": 10} {"train_loss": -4.116049766540527, "global_step": 1770, "epoch": 10} {"train_loss": -4.044559478759766, "global_step": 1771, "epoch": 10} {"train_loss": -3.9489965438842773, "global_step": 1772, "epoch": 10} {"train_loss": -4.169892311096191, "global_step": 1773, "epoch": 10} {"train_loss": -3.886160135269165, "global_step": 1774, "epoch": 10} {"train_loss": -3.9946506023406982, "global_step": 1775, "epoch": 10} {"train_loss": -3.9145002365112305, "global_step": 1776, "epoch": 10} {"train_loss": -4.016796588897705, "global_step": 1777, "epoch": 10} {"train_loss": -3.8569438457489014, "global_step": 1778, "epoch": 10} {"train_loss": -4.069551467895508, "global_step": 1779, "epoch": 10} {"train_loss": -3.9111971855163574, "global_step": 1780, "epoch": 10} {"train_loss": -3.9277429580688477, "global_step": 1781, "epoch": 10} {"train_loss": -3.9360203742980957, "global_step": 1782, "epoch": 10} {"train_loss": -3.9820151329040527, "global_step": 1783, "epoch": 10} {"train_loss": -4.242025375366211, "global_step": 1784, "epoch": 10} {"train_loss": -3.997725009918213, "global_step": 1785, "epoch": 10} {"train_loss": -4.06558084487915, "global_step": 1786, "epoch": 10} {"train_loss": -4.182796001434326, "global_step": 1787, "epoch": 10} {"train_loss": -3.9736764430999756, "global_step": 1788, "epoch": 10} {"train_loss": -4.124909400939941, "global_step": 1789, "epoch": 10} {"train_loss": -3.9275054931640625, "global_step": 1790, "epoch": 10} {"train_loss": -4.002439498901367, "global_step": 1791, "epoch": 10} {"train_loss": -3.970211982727051, "global_step": 1792, "epoch": 10} {"train_loss": -4.093544006347656, "global_step": 1793, "epoch": 10} {"train_loss": -4.057793617248535, "global_step": 1794, "epoch": 10} {"train_loss": -3.9633536338806152, "global_step": 1795, "epoch": 10} {"train_loss": -4.124416351318359, "global_step": 1796, "epoch": 10} {"train_loss": -3.8622336387634277, "global_step": 1797, "epoch": 10} {"train_loss": -4.06983757019043, "global_step": 1798, "epoch": 10} {"train_loss": -3.710217237472534, "global_step": 1799, "epoch": 10} {"train_loss": -3.8812365531921387, "global_step": 1800, "epoch": 10} {"train_loss": -4.210254192352295, "global_step": 1801, "epoch": 10} {"train_loss": -4.231142997741699, "global_step": 1802, "epoch": 10} {"train_loss": -4.044520854949951, "global_step": 1803, "epoch": 10} {"train_loss": -3.972179412841797, "global_step": 1804, "epoch": 10} {"train_loss": -4.308139801025391, "global_step": 1805, "epoch": 10} {"train_loss": -4.238401412963867, "global_step": 1806, "epoch": 10} {"train_loss": -4.057077407836914, "global_step": 1807, "epoch": 10} {"train_loss": -4.006360054016113, "global_step": 1808, "epoch": 10} {"train_loss": -4.177865028381348, "global_step": 1809, "epoch": 10} {"train_loss": -4.159666061401367, "global_step": 1810, "epoch": 10} {"train_loss": -4.271895408630371, "global_step": 1811, "epoch": 10} {"train_loss": -4.052321434020996, "global_step": 1812, "epoch": 10} {"train_loss": -3.862929582595825, "global_step": 1813, "epoch": 10} {"train_loss": -4.297949314117432, "global_step": 1814, "epoch": 10} {"train_loss": -4.108016014099121, "global_step": 1815, "epoch": 10} {"train_loss": -4.176101207733154, "global_step": 1816, "epoch": 10} {"train_loss": -3.931051731109619, "global_step": 1817, "epoch": 10} {"train_loss": -3.806217670440674, "global_step": 1818, "epoch": 10} {"train_loss": -4.110786437988281, "global_step": 1819, "epoch": 10} {"train_loss": -3.972749710083008, "global_step": 1820, "epoch": 10} {"train_loss": -3.5594232082366943, "global_step": 1821, "epoch": 10} {"train_loss": -4.067147254943848, "global_step": 1822, "epoch": 10} {"train_loss": -3.7037978172302246, "global_step": 1823, "epoch": 10} {"train_loss": -3.920179843902588, "global_step": 1824, "epoch": 10} {"train_loss": -4.104921817779541, "global_step": 1825, "epoch": 10} {"train_loss": -3.9471728801727295, "global_step": 1826, "epoch": 10} {"train_loss": -3.899897336959839, "global_step": 1827, "epoch": 10} {"train_loss": -4.137454032897949, "global_step": 1828, "epoch": 10} {"train_loss": -3.9586682319641113, "global_step": 1829, "epoch": 10} {"train_loss": -4.240126609802246, "global_step": 1830, "epoch": 10} {"train_loss": -3.9513888359069824, "global_step": 1831, "epoch": 10} {"train_loss": -3.9553983211517334, "global_step": 1832, "epoch": 10} {"train_loss": -4.096225738525391, "global_step": 1833, "epoch": 10} {"train_loss": -3.588160514831543, "global_step": 1834, "epoch": 10} {"train_loss": -4.060840606689453, "global_step": 1835, "epoch": 10} {"train_loss": -3.5236587524414062, "global_step": 1836, "epoch": 10} {"train_loss": -3.643141746520996, "global_step": 1837, "epoch": 10} {"train_loss": -3.864447832107544, "global_step": 1838, "epoch": 10} {"train_loss": -3.6989846229553223, "global_step": 1839, "epoch": 10} {"train_loss": -3.6470603942871094, "global_step": 1840, "epoch": 10} {"train_loss": -3.7467944622039795, "global_step": 1841, "epoch": 10} {"train_loss": -3.911520004272461, "global_step": 1842, "epoch": 10} {"train_loss": -3.7037715911865234, "global_step": 1843, "epoch": 10} {"train_loss": -3.863504648208618, "global_step": 1844, "epoch": 10} {"train_loss": -3.989621639251709, "global_step": 1845, "epoch": 10} {"train_loss": -3.631396532058716, "global_step": 1846, "epoch": 10} {"train_loss": -3.9495155853884563, "global_step": 1847, "epoch": 10, "val_loss": 240042.9375, "train_action_mse_error": 204.16885375976562} {"train_loss": -3.6784141063690186, "global_step": 1848, "epoch": 11} {"train_loss": -3.851330518722534, "global_step": 1849, "epoch": 11} {"train_loss": -3.6987407207489014, "global_step": 1850, "epoch": 11} {"train_loss": -3.882537841796875, "global_step": 1851, "epoch": 11} {"train_loss": -3.979674816131592, "global_step": 1852, "epoch": 11} {"train_loss": -3.5631418228149414, "global_step": 1853, "epoch": 11} {"train_loss": -3.9519731998443604, "global_step": 1854, "epoch": 11} {"train_loss": -3.715200662612915, "global_step": 1855, "epoch": 11} {"train_loss": -3.864250659942627, "global_step": 1856, "epoch": 11} {"train_loss": -3.9936251640319824, "global_step": 1857, "epoch": 11} {"train_loss": -3.9890060424804688, "global_step": 1858, "epoch": 11} {"train_loss": -3.9876582622528076, "global_step": 1859, "epoch": 11} {"train_loss": -3.9482903480529785, "global_step": 1860, "epoch": 11} {"train_loss": -4.122727870941162, "global_step": 1861, "epoch": 11} {"train_loss": -4.178981781005859, "global_step": 1862, "epoch": 11} {"train_loss": -4.089273929595947, "global_step": 1863, "epoch": 11} {"train_loss": -4.2340803146362305, "global_step": 1864, "epoch": 11} {"train_loss": -3.9290788173675537, "global_step": 1865, "epoch": 11} {"train_loss": -3.7046844959259033, "global_step": 1866, "epoch": 11} {"train_loss": -3.819957733154297, "global_step": 1867, "epoch": 11} {"train_loss": -3.979976177215576, "global_step": 1868, "epoch": 11} {"train_loss": -4.180030822753906, "global_step": 1869, "epoch": 11} {"train_loss": -4.050643444061279, "global_step": 1870, "epoch": 11} {"train_loss": -4.190480709075928, "global_step": 1871, "epoch": 11} {"train_loss": -3.957505464553833, "global_step": 1872, "epoch": 11} {"train_loss": -4.3056793212890625, "global_step": 1873, "epoch": 11} {"train_loss": -4.0987043380737305, "global_step": 1874, "epoch": 11} {"train_loss": -3.914177656173706, "global_step": 1875, "epoch": 11} {"train_loss": -4.024566650390625, "global_step": 1876, "epoch": 11} {"train_loss": -3.8863701820373535, "global_step": 1877, "epoch": 11} {"train_loss": -4.142489433288574, "global_step": 1878, "epoch": 11} {"train_loss": -4.12974739074707, "global_step": 1879, "epoch": 11} {"train_loss": -4.201225757598877, "global_step": 1880, "epoch": 11} {"train_loss": -3.9421370029449463, "global_step": 1881, "epoch": 11} {"train_loss": -3.866208076477051, "global_step": 1882, "epoch": 11} {"train_loss": -4.055883884429932, "global_step": 1883, "epoch": 11} {"train_loss": -4.221070289611816, "global_step": 1884, "epoch": 11} {"train_loss": -4.051872253417969, "global_step": 1885, "epoch": 11} {"train_loss": -3.908571720123291, "global_step": 1886, "epoch": 11} {"train_loss": -3.8631844520568848, "global_step": 1887, "epoch": 11} {"train_loss": -3.9830098152160645, "global_step": 1888, "epoch": 11} {"train_loss": -3.727494955062866, "global_step": 1889, "epoch": 11} {"train_loss": -3.834583282470703, "global_step": 1890, "epoch": 11} {"train_loss": -3.9247350692749023, "global_step": 1891, "epoch": 11} {"train_loss": -3.852297306060791, "global_step": 1892, "epoch": 11} {"train_loss": -3.940912961959839, "global_step": 1893, "epoch": 11} {"train_loss": -3.974658966064453, "global_step": 1894, "epoch": 11} {"train_loss": -3.9129180908203125, "global_step": 1895, "epoch": 11} {"train_loss": -3.9249958992004395, "global_step": 1896, "epoch": 11} {"train_loss": -3.988461971282959, "global_step": 1897, "epoch": 11} {"train_loss": -4.169633865356445, "global_step": 1898, "epoch": 11} {"train_loss": -4.05960750579834, "global_step": 1899, "epoch": 11} {"train_loss": -3.6386287212371826, "global_step": 1900, "epoch": 11} {"train_loss": -3.9824938774108887, "global_step": 1901, "epoch": 11} {"train_loss": -3.773970127105713, "global_step": 1902, "epoch": 11} {"train_loss": -4.197198867797852, "global_step": 1903, "epoch": 11} {"train_loss": -3.934561252593994, "global_step": 1904, "epoch": 11} {"train_loss": -4.13150691986084, "global_step": 1905, "epoch": 11} {"train_loss": -4.14096736907959, "global_step": 1906, "epoch": 11} {"train_loss": -3.9489328861236572, "global_step": 1907, "epoch": 11} {"train_loss": -4.1944708824157715, "global_step": 1908, "epoch": 11} {"train_loss": -4.118913650512695, "global_step": 1909, "epoch": 11} {"train_loss": -4.050952911376953, "global_step": 1910, "epoch": 11} {"train_loss": -4.050030708312988, "global_step": 1911, "epoch": 11} {"train_loss": -4.288429260253906, "global_step": 1912, "epoch": 11} {"train_loss": -3.969146728515625, "global_step": 1913, "epoch": 11} {"train_loss": -4.318562030792236, "global_step": 1914, "epoch": 11} {"train_loss": -3.9228663444519043, "global_step": 1915, "epoch": 11} {"train_loss": -4.316908359527588, "global_step": 1916, "epoch": 11} {"train_loss": -3.896218776702881, "global_step": 1917, "epoch": 11} {"train_loss": -4.171399116516113, "global_step": 1918, "epoch": 11} {"train_loss": -3.8473904132843018, "global_step": 1919, "epoch": 11} {"train_loss": -4.247305870056152, "global_step": 1920, "epoch": 11} {"train_loss": -3.8050594329833984, "global_step": 1921, "epoch": 11} {"train_loss": -4.065265655517578, "global_step": 1922, "epoch": 11} {"train_loss": -4.013968467712402, "global_step": 1923, "epoch": 11} {"train_loss": -4.208213806152344, "global_step": 1924, "epoch": 11} {"train_loss": -3.7800822257995605, "global_step": 1925, "epoch": 11} {"train_loss": -4.008677959442139, "global_step": 1926, "epoch": 11} {"train_loss": -3.9948360919952393, "global_step": 1927, "epoch": 11} {"train_loss": -3.746915102005005, "global_step": 1928, "epoch": 11} {"train_loss": -4.02169942855835, "global_step": 1929, "epoch": 11} {"train_loss": -3.883392810821533, "global_step": 1930, "epoch": 11} {"train_loss": -3.938488006591797, "global_step": 1931, "epoch": 11} {"train_loss": -3.831015110015869, "global_step": 1932, "epoch": 11} {"train_loss": -3.840620517730713, "global_step": 1933, "epoch": 11} {"train_loss": -4.06225061416626, "global_step": 1934, "epoch": 11} {"train_loss": -4.10540771484375, "global_step": 1935, "epoch": 11} {"train_loss": -3.844514846801758, "global_step": 1936, "epoch": 11} {"train_loss": -3.778797149658203, "global_step": 1937, "epoch": 11} {"train_loss": -3.941030979156494, "global_step": 1938, "epoch": 11} {"train_loss": -4.024868011474609, "global_step": 1939, "epoch": 11} {"train_loss": -3.9192445278167725, "global_step": 1940, "epoch": 11} {"train_loss": -3.577052593231201, "global_step": 1941, "epoch": 11} {"train_loss": -4.008569717407227, "global_step": 1942, "epoch": 11} {"train_loss": -4.2316484451293945, "global_step": 1943, "epoch": 11} {"train_loss": -3.7955055236816406, "global_step": 1944, "epoch": 11} {"train_loss": -3.916112184524536, "global_step": 1945, "epoch": 11} {"train_loss": -3.7711310386657715, "global_step": 1946, "epoch": 11} {"train_loss": -3.8654584884643555, "global_step": 1947, "epoch": 11} {"train_loss": -4.233640670776367, "global_step": 1948, "epoch": 11} {"train_loss": -4.044142246246338, "global_step": 1949, "epoch": 11} {"train_loss": -4.055729866027832, "global_step": 1950, "epoch": 11} {"train_loss": -3.95770263671875, "global_step": 1951, "epoch": 11} {"train_loss": -4.068935871124268, "global_step": 1952, "epoch": 11} {"train_loss": -4.156808376312256, "global_step": 1953, "epoch": 11} {"train_loss": -3.975752353668213, "global_step": 1954, "epoch": 11} {"train_loss": -4.269307613372803, "global_step": 1955, "epoch": 11} {"train_loss": -4.1099138259887695, "global_step": 1956, "epoch": 11} {"train_loss": -3.9084696769714355, "global_step": 1957, "epoch": 11} {"train_loss": -4.023860454559326, "global_step": 1958, "epoch": 11} {"train_loss": -4.326362133026123, "global_step": 1959, "epoch": 11} {"train_loss": -4.002389907836914, "global_step": 1960, "epoch": 11} {"train_loss": -4.070073127746582, "global_step": 1961, "epoch": 11} {"train_loss": -3.992978096008301, "global_step": 1962, "epoch": 11} {"train_loss": -4.247861862182617, "global_step": 1963, "epoch": 11} {"train_loss": -4.0033063888549805, "global_step": 1964, "epoch": 11} {"train_loss": -4.31088924407959, "global_step": 1965, "epoch": 11} {"train_loss": -4.17197322845459, "global_step": 1966, "epoch": 11} {"train_loss": -4.302000045776367, "global_step": 1967, "epoch": 11} {"train_loss": -4.26485538482666, "global_step": 1968, "epoch": 11} {"train_loss": -4.20892333984375, "global_step": 1969, "epoch": 11} {"train_loss": -4.143745422363281, "global_step": 1970, "epoch": 11} {"train_loss": -3.9713351726531982, "global_step": 1971, "epoch": 11} {"train_loss": -4.019346714019775, "global_step": 1972, "epoch": 11} {"train_loss": -4.0835981369018555, "global_step": 1973, "epoch": 11} {"train_loss": -4.168508529663086, "global_step": 1974, "epoch": 11} {"train_loss": -4.106638431549072, "global_step": 1975, "epoch": 11} {"train_loss": -4.04111385345459, "global_step": 1976, "epoch": 11} {"train_loss": -3.9427223205566406, "global_step": 1977, "epoch": 11} {"train_loss": -4.4232587814331055, "global_step": 1978, "epoch": 11} {"train_loss": -4.057940483093262, "global_step": 1979, "epoch": 11} {"train_loss": -4.1809797286987305, "global_step": 1980, "epoch": 11} {"train_loss": -4.333186149597168, "global_step": 1981, "epoch": 11} {"train_loss": -4.1893510818481445, "global_step": 1982, "epoch": 11} {"train_loss": -3.922928810119629, "global_step": 1983, "epoch": 11} {"train_loss": -4.388012409210205, "global_step": 1984, "epoch": 11} {"train_loss": -4.116209983825684, "global_step": 1985, "epoch": 11} {"train_loss": -4.041595458984375, "global_step": 1986, "epoch": 11} {"train_loss": -4.29317569732666, "global_step": 1987, "epoch": 11} {"train_loss": -4.204603672027588, "global_step": 1988, "epoch": 11} {"train_loss": -4.204763412475586, "global_step": 1989, "epoch": 11} {"train_loss": -4.219451904296875, "global_step": 1990, "epoch": 11} {"train_loss": -4.076969623565674, "global_step": 1991, "epoch": 11} {"train_loss": -4.166176795959473, "global_step": 1992, "epoch": 11} {"train_loss": -4.091434955596924, "global_step": 1993, "epoch": 11} {"train_loss": -4.25706672668457, "global_step": 1994, "epoch": 11} {"train_loss": -4.249812602996826, "global_step": 1995, "epoch": 11} {"train_loss": -4.3400139808654785, "global_step": 1996, "epoch": 11} {"train_loss": -4.1196489334106445, "global_step": 1997, "epoch": 11} {"train_loss": -3.836981773376465, "global_step": 1998, "epoch": 11} {"train_loss": -3.839478015899658, "global_step": 1999, "epoch": 11} {"train_loss": -4.3192267417907715, "global_step": 2000, "epoch": 11} {"train_loss": -4.09878396987915, "global_step": 2001, "epoch": 11} {"train_loss": -3.928468704223633, "global_step": 2002, "epoch": 11} {"train_loss": -4.126962184906006, "global_step": 2003, "epoch": 11} {"train_loss": -3.7949070930480957, "global_step": 2004, "epoch": 11} {"train_loss": -4.189478874206543, "global_step": 2005, "epoch": 11} {"train_loss": -3.9067394733428955, "global_step": 2006, "epoch": 11} {"train_loss": -3.907860279083252, "global_step": 2007, "epoch": 11} {"train_loss": -3.8609228134155273, "global_step": 2008, "epoch": 11} {"train_loss": -3.527848243713379, "global_step": 2009, "epoch": 11} {"train_loss": -4.075297832489014, "global_step": 2010, "epoch": 11} {"train_loss": -3.9538087844848633, "global_step": 2011, "epoch": 11} {"train_loss": -3.8734638690948486, "global_step": 2012, "epoch": 11} {"train_loss": -3.8864197731018066, "global_step": 2013, "epoch": 11} {"train_loss": -3.863802433013916, "global_step": 2014, "epoch": 11} {"train_loss": -4.020293289706821, "global_step": 2015, "epoch": 11, "val_loss": 242984.109375} {"train_loss": -3.9672188758850098, "global_step": 2016, "epoch": 12} {"train_loss": -3.7545199394226074, "global_step": 2017, "epoch": 12} {"train_loss": -4.113480567932129, "global_step": 2018, "epoch": 12} {"train_loss": -4.030725955963135, "global_step": 2019, "epoch": 12} {"train_loss": -4.280576705932617, "global_step": 2020, "epoch": 12} {"train_loss": -4.23341178894043, "global_step": 2021, "epoch": 12} {"train_loss": -4.090368270874023, "global_step": 2022, "epoch": 12} {"train_loss": -3.7506518363952637, "global_step": 2023, "epoch": 12} {"train_loss": -4.306477069854736, "global_step": 2024, "epoch": 12} {"train_loss": -4.219043731689453, "global_step": 2025, "epoch": 12} {"train_loss": -4.3023681640625, "global_step": 2026, "epoch": 12} {"train_loss": -4.214219570159912, "global_step": 2027, "epoch": 12} {"train_loss": -4.29085636138916, "global_step": 2028, "epoch": 12} {"train_loss": -4.08585262298584, "global_step": 2029, "epoch": 12} {"train_loss": -4.045051097869873, "global_step": 2030, "epoch": 12} {"train_loss": -4.283222675323486, "global_step": 2031, "epoch": 12} {"train_loss": -4.102826118469238, "global_step": 2032, "epoch": 12} {"train_loss": -4.43364953994751, "global_step": 2033, "epoch": 12} {"train_loss": -3.8808836936950684, "global_step": 2034, "epoch": 12} {"train_loss": -4.513711929321289, "global_step": 2035, "epoch": 12} {"train_loss": -3.943453550338745, "global_step": 2036, "epoch": 12} {"train_loss": -4.1833295822143555, "global_step": 2037, "epoch": 12} {"train_loss": -4.179259300231934, "global_step": 2038, "epoch": 12} {"train_loss": -3.9766721725463867, "global_step": 2039, "epoch": 12} {"train_loss": -4.02512264251709, "global_step": 2040, "epoch": 12} {"train_loss": -3.9603192806243896, "global_step": 2041, "epoch": 12} {"train_loss": -4.388543128967285, "global_step": 2042, "epoch": 12} {"train_loss": -4.0173444747924805, "global_step": 2043, "epoch": 12} {"train_loss": -4.1486053466796875, "global_step": 2044, "epoch": 12} {"train_loss": -4.161818027496338, "global_step": 2045, "epoch": 12} {"train_loss": -4.15406608581543, "global_step": 2046, "epoch": 12} {"train_loss": -4.293270111083984, "global_step": 2047, "epoch": 12} {"train_loss": -4.113039970397949, "global_step": 2048, "epoch": 12} {"train_loss": -4.273224830627441, "global_step": 2049, "epoch": 12} {"train_loss": -4.249919414520264, "global_step": 2050, "epoch": 12} {"train_loss": -4.289178371429443, "global_step": 2051, "epoch": 12} {"train_loss": -4.336313724517822, "global_step": 2052, "epoch": 12} {"train_loss": -4.20076322555542, "global_step": 2053, "epoch": 12} {"train_loss": -4.415890693664551, "global_step": 2054, "epoch": 12} {"train_loss": -4.110076427459717, "global_step": 2055, "epoch": 12} {"train_loss": -4.547492027282715, "global_step": 2056, "epoch": 12} {"train_loss": -4.0606689453125, "global_step": 2057, "epoch": 12} {"train_loss": -4.214404582977295, "global_step": 2058, "epoch": 12} {"train_loss": -4.302628517150879, "global_step": 2059, "epoch": 12} {"train_loss": -4.158623218536377, "global_step": 2060, "epoch": 12} {"train_loss": -4.1682209968566895, "global_step": 2061, "epoch": 12} {"train_loss": -4.106508255004883, "global_step": 2062, "epoch": 12} {"train_loss": -4.239060401916504, "global_step": 2063, "epoch": 12} {"train_loss": -4.0931901931762695, "global_step": 2064, "epoch": 12} {"train_loss": -4.472626686096191, "global_step": 2065, "epoch": 12} {"train_loss": -4.258447647094727, "global_step": 2066, "epoch": 12} {"train_loss": -4.07304573059082, "global_step": 2067, "epoch": 12} {"train_loss": -3.9198482036590576, "global_step": 2068, "epoch": 12} {"train_loss": -4.21691370010376, "global_step": 2069, "epoch": 12} {"train_loss": -4.16196346282959, "global_step": 2070, "epoch": 12} {"train_loss": -4.270960807800293, "global_step": 2071, "epoch": 12} {"train_loss": -4.304688453674316, "global_step": 2072, "epoch": 12} {"train_loss": -4.341949462890625, "global_step": 2073, "epoch": 12} {"train_loss": -4.070101261138916, "global_step": 2074, "epoch": 12} {"train_loss": -4.25368595123291, "global_step": 2075, "epoch": 12} {"train_loss": -3.7434628009796143, "global_step": 2076, "epoch": 12} {"train_loss": -4.012060642242432, "global_step": 2077, "epoch": 12} {"train_loss": -3.9192914962768555, "global_step": 2078, "epoch": 12} {"train_loss": -4.1746015548706055, "global_step": 2079, "epoch": 12} {"train_loss": -3.7557668685913086, "global_step": 2080, "epoch": 12} {"train_loss": -3.9492385387420654, "global_step": 2081, "epoch": 12} {"train_loss": -3.7796058654785156, "global_step": 2082, "epoch": 12} {"train_loss": -4.052651405334473, "global_step": 2083, "epoch": 12} {"train_loss": -3.97129487991333, "global_step": 2084, "epoch": 12} {"train_loss": -3.9606194496154785, "global_step": 2085, "epoch": 12} {"train_loss": -4.0726213455200195, "global_step": 2086, "epoch": 12} {"train_loss": -4.1417388916015625, "global_step": 2087, "epoch": 12} {"train_loss": -3.9234113693237305, "global_step": 2088, "epoch": 12} {"train_loss": -4.194607734680176, "global_step": 2089, "epoch": 12} {"train_loss": -4.153473377227783, "global_step": 2090, "epoch": 12} {"train_loss": -3.8585801124572754, "global_step": 2091, "epoch": 12} {"train_loss": -3.953261613845825, "global_step": 2092, "epoch": 12} {"train_loss": -4.297515869140625, "global_step": 2093, "epoch": 12} {"train_loss": -4.294795989990234, "global_step": 2094, "epoch": 12} {"train_loss": -3.9577889442443848, "global_step": 2095, "epoch": 12} {"train_loss": -4.220590114593506, "global_step": 2096, "epoch": 12} {"train_loss": -4.267843246459961, "global_step": 2097, "epoch": 12} {"train_loss": -4.2332305908203125, "global_step": 2098, "epoch": 12} {"train_loss": -4.154448509216309, "global_step": 2099, "epoch": 12} {"train_loss": -4.283533573150635, "global_step": 2100, "epoch": 12} {"train_loss": -4.097330093383789, "global_step": 2101, "epoch": 12} {"train_loss": -4.355410099029541, "global_step": 2102, "epoch": 12} {"train_loss": -4.155041694641113, "global_step": 2103, "epoch": 12} {"train_loss": -4.423403263092041, "global_step": 2104, "epoch": 12} {"train_loss": -4.469622611999512, "global_step": 2105, "epoch": 12} {"train_loss": -4.203176498413086, "global_step": 2106, "epoch": 12} {"train_loss": -4.216029167175293, "global_step": 2107, "epoch": 12} {"train_loss": -4.290245056152344, "global_step": 2108, "epoch": 12} {"train_loss": -4.359107494354248, "global_step": 2109, "epoch": 12} {"train_loss": -4.190375328063965, "global_step": 2110, "epoch": 12} {"train_loss": -4.209286689758301, "global_step": 2111, "epoch": 12} {"train_loss": -4.032456398010254, "global_step": 2112, "epoch": 12} {"train_loss": -3.8473830223083496, "global_step": 2113, "epoch": 12} {"train_loss": -3.73185396194458, "global_step": 2114, "epoch": 12} {"train_loss": -4.157297134399414, "global_step": 2115, "epoch": 12} {"train_loss": -3.797414541244507, "global_step": 2116, "epoch": 12} {"train_loss": -4.397407531738281, "global_step": 2117, "epoch": 12} {"train_loss": -3.965028762817383, "global_step": 2118, "epoch": 12} {"train_loss": -3.9796195030212402, "global_step": 2119, "epoch": 12} {"train_loss": -4.238654613494873, "global_step": 2120, "epoch": 12} {"train_loss": -4.005229949951172, "global_step": 2121, "epoch": 12} {"train_loss": -4.1402482986450195, "global_step": 2122, "epoch": 12} {"train_loss": -4.120862007141113, "global_step": 2123, "epoch": 12} {"train_loss": -4.359551429748535, "global_step": 2124, "epoch": 12} {"train_loss": -4.442020416259766, "global_step": 2125, "epoch": 12} {"train_loss": -4.129939556121826, "global_step": 2126, "epoch": 12} {"train_loss": -4.246204853057861, "global_step": 2127, "epoch": 12} {"train_loss": -4.167975902557373, "global_step": 2128, "epoch": 12} {"train_loss": -4.399100303649902, "global_step": 2129, "epoch": 12} {"train_loss": -4.101304054260254, "global_step": 2130, "epoch": 12} {"train_loss": -4.355162620544434, "global_step": 2131, "epoch": 12} {"train_loss": -4.384517669677734, "global_step": 2132, "epoch": 12} {"train_loss": -4.2345356941223145, "global_step": 2133, "epoch": 12} {"train_loss": -4.124388694763184, "global_step": 2134, "epoch": 12} {"train_loss": -4.3085126876831055, "global_step": 2135, "epoch": 12} {"train_loss": -4.315561294555664, "global_step": 2136, "epoch": 12} {"train_loss": -4.259171009063721, "global_step": 2137, "epoch": 12} {"train_loss": -4.090472221374512, "global_step": 2138, "epoch": 12} {"train_loss": -4.4951276779174805, "global_step": 2139, "epoch": 12} {"train_loss": -4.427267551422119, "global_step": 2140, "epoch": 12} {"train_loss": -4.082444190979004, "global_step": 2141, "epoch": 12} {"train_loss": -4.221183776855469, "global_step": 2142, "epoch": 12} {"train_loss": -4.256678104400635, "global_step": 2143, "epoch": 12} {"train_loss": -4.213658332824707, "global_step": 2144, "epoch": 12} {"train_loss": -4.165343761444092, "global_step": 2145, "epoch": 12} {"train_loss": -4.113686561584473, "global_step": 2146, "epoch": 12} {"train_loss": -4.1889824867248535, "global_step": 2147, "epoch": 12} {"train_loss": -3.890578031539917, "global_step": 2148, "epoch": 12} {"train_loss": -4.308931350708008, "global_step": 2149, "epoch": 12} {"train_loss": -4.297706604003906, "global_step": 2150, "epoch": 12} {"train_loss": -4.098581314086914, "global_step": 2151, "epoch": 12} {"train_loss": -3.8454370498657227, "global_step": 2152, "epoch": 12} {"train_loss": -4.389897346496582, "global_step": 2153, "epoch": 12} {"train_loss": -4.306450843811035, "global_step": 2154, "epoch": 12} {"train_loss": -4.235595703125, "global_step": 2155, "epoch": 12} {"train_loss": -4.147835731506348, "global_step": 2156, "epoch": 12} {"train_loss": -4.184789657592773, "global_step": 2157, "epoch": 12} {"train_loss": -4.236210346221924, "global_step": 2158, "epoch": 12} {"train_loss": -4.098960876464844, "global_step": 2159, "epoch": 12} {"train_loss": -3.991358518600464, "global_step": 2160, "epoch": 12} {"train_loss": -4.158067226409912, "global_step": 2161, "epoch": 12} {"train_loss": -4.086742877960205, "global_step": 2162, "epoch": 12} {"train_loss": -4.237870216369629, "global_step": 2163, "epoch": 12} {"train_loss": -4.146341323852539, "global_step": 2164, "epoch": 12} {"train_loss": -4.436349868774414, "global_step": 2165, "epoch": 12} {"train_loss": -3.8005852699279785, "global_step": 2166, "epoch": 12} {"train_loss": -4.246521472930908, "global_step": 2167, "epoch": 12} {"train_loss": -4.036998748779297, "global_step": 2168, "epoch": 12} {"train_loss": -4.038470268249512, "global_step": 2169, "epoch": 12} {"train_loss": -4.42106294631958, "global_step": 2170, "epoch": 12} {"train_loss": -4.081550121307373, "global_step": 2171, "epoch": 12} {"train_loss": -4.192106246948242, "global_step": 2172, "epoch": 12} {"train_loss": -4.312106132507324, "global_step": 2173, "epoch": 12} {"train_loss": -4.013272762298584, "global_step": 2174, "epoch": 12} {"train_loss": -4.090073585510254, "global_step": 2175, "epoch": 12} {"train_loss": -4.236394882202148, "global_step": 2176, "epoch": 12} {"train_loss": -4.06154727935791, "global_step": 2177, "epoch": 12} {"train_loss": -4.187680244445801, "global_step": 2178, "epoch": 12} {"train_loss": -4.075437068939209, "global_step": 2179, "epoch": 12} {"train_loss": -4.381705284118652, "global_step": 2180, "epoch": 12} {"train_loss": -3.982600688934326, "global_step": 2181, "epoch": 12} {"train_loss": -3.8374440670013428, "global_step": 2182, "epoch": 12} {"train_loss": -4.1587631815955755, "global_step": 2183, "epoch": 12, "val_loss": 281588.59375} {"train_loss": -3.6801650524139404, "global_step": 2184, "epoch": 13} {"train_loss": -4.085201740264893, "global_step": 2185, "epoch": 13} {"train_loss": -3.9907827377319336, "global_step": 2186, "epoch": 13} {"train_loss": -4.1228861808776855, "global_step": 2187, "epoch": 13} {"train_loss": -4.096381664276123, "global_step": 2188, "epoch": 13} {"train_loss": -4.1154937744140625, "global_step": 2189, "epoch": 13} {"train_loss": -4.1882219314575195, "global_step": 2190, "epoch": 13} {"train_loss": -4.054685592651367, "global_step": 2191, "epoch": 13} {"train_loss": -4.166950225830078, "global_step": 2192, "epoch": 13} {"train_loss": -4.2111711502075195, "global_step": 2193, "epoch": 13} {"train_loss": -4.295660018920898, "global_step": 2194, "epoch": 13} {"train_loss": -4.0556840896606445, "global_step": 2195, "epoch": 13} {"train_loss": -4.236411094665527, "global_step": 2196, "epoch": 13} {"train_loss": -4.0659098625183105, "global_step": 2197, "epoch": 13} {"train_loss": -4.278862476348877, "global_step": 2198, "epoch": 13} {"train_loss": -4.123384952545166, "global_step": 2199, "epoch": 13} {"train_loss": -4.241946220397949, "global_step": 2200, "epoch": 13} {"train_loss": -4.184368133544922, "global_step": 2201, "epoch": 13} {"train_loss": -4.345683574676514, "global_step": 2202, "epoch": 13} {"train_loss": -4.221924781799316, "global_step": 2203, "epoch": 13} {"train_loss": -4.273950099945068, "global_step": 2204, "epoch": 13} {"train_loss": -4.375328063964844, "global_step": 2205, "epoch": 13} {"train_loss": -4.2159318923950195, "global_step": 2206, "epoch": 13} {"train_loss": -4.253580570220947, "global_step": 2207, "epoch": 13} {"train_loss": -4.30864143371582, "global_step": 2208, "epoch": 13} {"train_loss": -4.429868698120117, "global_step": 2209, "epoch": 13} {"train_loss": -4.197391510009766, "global_step": 2210, "epoch": 13} {"train_loss": -4.301506519317627, "global_step": 2211, "epoch": 13} {"train_loss": -4.248420715332031, "global_step": 2212, "epoch": 13} {"train_loss": -4.489989280700684, "global_step": 2213, "epoch": 13} {"train_loss": -4.088741302490234, "global_step": 2214, "epoch": 13} {"train_loss": -4.446834564208984, "global_step": 2215, "epoch": 13} {"train_loss": -4.097196578979492, "global_step": 2216, "epoch": 13} {"train_loss": -4.484055042266846, "global_step": 2217, "epoch": 13} {"train_loss": -4.2206268310546875, "global_step": 2218, "epoch": 13} {"train_loss": -4.252985000610352, "global_step": 2219, "epoch": 13} {"train_loss": -4.220568656921387, "global_step": 2220, "epoch": 13} {"train_loss": -4.214578151702881, "global_step": 2221, "epoch": 13} {"train_loss": -4.078028202056885, "global_step": 2222, "epoch": 13} {"train_loss": -4.205099582672119, "global_step": 2223, "epoch": 13} {"train_loss": -4.328524589538574, "global_step": 2224, "epoch": 13} {"train_loss": -4.312253952026367, "global_step": 2225, "epoch": 13} {"train_loss": -4.215144157409668, "global_step": 2226, "epoch": 13} {"train_loss": -4.574798107147217, "global_step": 2227, "epoch": 13} {"train_loss": -4.324629306793213, "global_step": 2228, "epoch": 13} {"train_loss": -4.480095863342285, "global_step": 2229, "epoch": 13} {"train_loss": -4.416068077087402, "global_step": 2230, "epoch": 13} {"train_loss": -4.287285804748535, "global_step": 2231, "epoch": 13} {"train_loss": -4.390876293182373, "global_step": 2232, "epoch": 13} {"train_loss": -4.5362725257873535, "global_step": 2233, "epoch": 13} {"train_loss": -4.3777570724487305, "global_step": 2234, "epoch": 13} {"train_loss": -4.016481399536133, "global_step": 2235, "epoch": 13} {"train_loss": -3.8539316654205322, "global_step": 2236, "epoch": 13} {"train_loss": -4.219684600830078, "global_step": 2237, "epoch": 13} {"train_loss": -4.250374794006348, "global_step": 2238, "epoch": 13} {"train_loss": -4.004883289337158, "global_step": 2239, "epoch": 13} {"train_loss": -4.000018119812012, "global_step": 2240, "epoch": 13} {"train_loss": -4.237355709075928, "global_step": 2241, "epoch": 13} {"train_loss": -4.223999500274658, "global_step": 2242, "epoch": 13} {"train_loss": -4.205466270446777, "global_step": 2243, "epoch": 13} {"train_loss": -4.3896484375, "global_step": 2244, "epoch": 13} {"train_loss": -4.024394989013672, "global_step": 2245, "epoch": 13} {"train_loss": -4.274271488189697, "global_step": 2246, "epoch": 13} {"train_loss": -4.269527435302734, "global_step": 2247, "epoch": 13} {"train_loss": -4.188678741455078, "global_step": 2248, "epoch": 13} {"train_loss": -3.936906337738037, "global_step": 2249, "epoch": 13} {"train_loss": -4.062251091003418, "global_step": 2250, "epoch": 13} {"train_loss": -4.205228328704834, "global_step": 2251, "epoch": 13} {"train_loss": -4.082958221435547, "global_step": 2252, "epoch": 13} {"train_loss": -4.25492000579834, "global_step": 2253, "epoch": 13} {"train_loss": -4.215513229370117, "global_step": 2254, "epoch": 13} {"train_loss": -4.147270679473877, "global_step": 2255, "epoch": 13} {"train_loss": -4.043430328369141, "global_step": 2256, "epoch": 13} {"train_loss": -4.308258056640625, "global_step": 2257, "epoch": 13} {"train_loss": -4.140743255615234, "global_step": 2258, "epoch": 13} {"train_loss": -4.1403608322143555, "global_step": 2259, "epoch": 13} {"train_loss": -4.424781322479248, "global_step": 2260, "epoch": 13} {"train_loss": -3.951854705810547, "global_step": 2261, "epoch": 13} {"train_loss": -4.416572093963623, "global_step": 2262, "epoch": 13} {"train_loss": -4.0667033195495605, "global_step": 2263, "epoch": 13} {"train_loss": -3.5854740142822266, "global_step": 2264, "epoch": 13} {"train_loss": -4.3747358322143555, "global_step": 2265, "epoch": 13} {"train_loss": -3.992715835571289, "global_step": 2266, "epoch": 13} {"train_loss": -4.265383720397949, "global_step": 2267, "epoch": 13} {"train_loss": -4.213216781616211, "global_step": 2268, "epoch": 13} {"train_loss": -4.286670684814453, "global_step": 2269, "epoch": 13} {"train_loss": -4.0464768409729, "global_step": 2270, "epoch": 13} {"train_loss": -4.17647123336792, "global_step": 2271, "epoch": 13} {"train_loss": -4.20594596862793, "global_step": 2272, "epoch": 13} {"train_loss": -4.168946266174316, "global_step": 2273, "epoch": 13} {"train_loss": -4.118181228637695, "global_step": 2274, "epoch": 13} {"train_loss": -4.335036277770996, "global_step": 2275, "epoch": 13} {"train_loss": -4.171270370483398, "global_step": 2276, "epoch": 13} {"train_loss": -4.3130998611450195, "global_step": 2277, "epoch": 13} {"train_loss": -3.89499568939209, "global_step": 2278, "epoch": 13} {"train_loss": -4.218542098999023, "global_step": 2279, "epoch": 13} {"train_loss": -4.019917011260986, "global_step": 2280, "epoch": 13} {"train_loss": -3.8912253379821777, "global_step": 2281, "epoch": 13} {"train_loss": -4.360649585723877, "global_step": 2282, "epoch": 13} {"train_loss": -3.9072632789611816, "global_step": 2283, "epoch": 13} {"train_loss": -4.4257402420043945, "global_step": 2284, "epoch": 13} {"train_loss": -4.262772560119629, "global_step": 2285, "epoch": 13} {"train_loss": -4.400082588195801, "global_step": 2286, "epoch": 13} {"train_loss": -4.1880950927734375, "global_step": 2287, "epoch": 13} {"train_loss": -4.345487594604492, "global_step": 2288, "epoch": 13} {"train_loss": -4.260023593902588, "global_step": 2289, "epoch": 13} {"train_loss": -4.258003234863281, "global_step": 2290, "epoch": 13} {"train_loss": -4.137403964996338, "global_step": 2291, "epoch": 13} {"train_loss": -4.220395088195801, "global_step": 2292, "epoch": 13} {"train_loss": -4.000157833099365, "global_step": 2293, "epoch": 13} {"train_loss": -4.379569053649902, "global_step": 2294, "epoch": 13} {"train_loss": -4.197965145111084, "global_step": 2295, "epoch": 13} {"train_loss": -3.9577338695526123, "global_step": 2296, "epoch": 13} {"train_loss": -4.124942779541016, "global_step": 2297, "epoch": 13} {"train_loss": -3.9552338123321533, "global_step": 2298, "epoch": 13} {"train_loss": -4.214651584625244, "global_step": 2299, "epoch": 13} {"train_loss": -4.042663097381592, "global_step": 2300, "epoch": 13} {"train_loss": -4.093070983886719, "global_step": 2301, "epoch": 13} {"train_loss": -4.320582389831543, "global_step": 2302, "epoch": 13} {"train_loss": -4.170968055725098, "global_step": 2303, "epoch": 13} {"train_loss": -4.323509693145752, "global_step": 2304, "epoch": 13} {"train_loss": -4.279961585998535, "global_step": 2305, "epoch": 13} {"train_loss": -4.127507209777832, "global_step": 2306, "epoch": 13} {"train_loss": -4.187895774841309, "global_step": 2307, "epoch": 13} {"train_loss": -4.2739410400390625, "global_step": 2308, "epoch": 13} {"train_loss": -4.300433158874512, "global_step": 2309, "epoch": 13} {"train_loss": -4.430790424346924, "global_step": 2310, "epoch": 13} {"train_loss": -4.357020854949951, "global_step": 2311, "epoch": 13} {"train_loss": -4.538177490234375, "global_step": 2312, "epoch": 13} {"train_loss": -4.4246015548706055, "global_step": 2313, "epoch": 13} {"train_loss": -4.412723064422607, "global_step": 2314, "epoch": 13} {"train_loss": -4.1217851638793945, "global_step": 2315, "epoch": 13} {"train_loss": -4.314530849456787, "global_step": 2316, "epoch": 13} {"train_loss": -4.435611724853516, "global_step": 2317, "epoch": 13} {"train_loss": -4.263217926025391, "global_step": 2318, "epoch": 13} {"train_loss": -4.31867790222168, "global_step": 2319, "epoch": 13} {"train_loss": -4.040849208831787, "global_step": 2320, "epoch": 13} {"train_loss": -4.196497917175293, "global_step": 2321, "epoch": 13} {"train_loss": -4.231064796447754, "global_step": 2322, "epoch": 13} {"train_loss": -3.915182113647461, "global_step": 2323, "epoch": 13} {"train_loss": -4.102101802825928, "global_step": 2324, "epoch": 13} {"train_loss": -4.435585975646973, "global_step": 2325, "epoch": 13} {"train_loss": -4.114475250244141, "global_step": 2326, "epoch": 13} {"train_loss": -3.683656692504883, "global_step": 2327, "epoch": 13} {"train_loss": -3.956387519836426, "global_step": 2328, "epoch": 13} {"train_loss": -3.9775447845458984, "global_step": 2329, "epoch": 13} {"train_loss": -4.003708839416504, "global_step": 2330, "epoch": 13} {"train_loss": -4.037900447845459, "global_step": 2331, "epoch": 13} {"train_loss": -4.173826694488525, "global_step": 2332, "epoch": 13} {"train_loss": -3.9679763317108154, "global_step": 2333, "epoch": 13} {"train_loss": -4.055586814880371, "global_step": 2334, "epoch": 13} {"train_loss": -3.70377254486084, "global_step": 2335, "epoch": 13} {"train_loss": -4.218770980834961, "global_step": 2336, "epoch": 13} {"train_loss": -3.9712069034576416, "global_step": 2337, "epoch": 13} {"train_loss": -3.9974546432495117, "global_step": 2338, "epoch": 13} {"train_loss": -4.079637050628662, "global_step": 2339, "epoch": 13} {"train_loss": -4.223532199859619, "global_step": 2340, "epoch": 13} {"train_loss": -4.1253581047058105, "global_step": 2341, "epoch": 13} {"train_loss": -4.004488945007324, "global_step": 2342, "epoch": 13} {"train_loss": -4.220503807067871, "global_step": 2343, "epoch": 13} {"train_loss": -4.103686332702637, "global_step": 2344, "epoch": 13} {"train_loss": -4.225944995880127, "global_step": 2345, "epoch": 13} {"train_loss": -3.9303789138793945, "global_step": 2346, "epoch": 13} {"train_loss": -4.338254928588867, "global_step": 2347, "epoch": 13} {"train_loss": -4.052005767822266, "global_step": 2348, "epoch": 13} {"train_loss": -4.399724006652832, "global_step": 2349, "epoch": 13} {"train_loss": -4.150445461273193, "global_step": 2350, "epoch": 13} {"train_loss": -4.1855959097544355, "global_step": 2351, "epoch": 13, "val_loss": 257897.328125} {"train_loss": -3.9783284664154053, "global_step": 2352, "epoch": 14} {"train_loss": -4.032235145568848, "global_step": 2353, "epoch": 14} {"train_loss": -4.151888370513916, "global_step": 2354, "epoch": 14} {"train_loss": -4.083957672119141, "global_step": 2355, "epoch": 14} {"train_loss": -4.235431671142578, "global_step": 2356, "epoch": 14} {"train_loss": -4.496025562286377, "global_step": 2357, "epoch": 14} {"train_loss": -4.218838691711426, "global_step": 2358, "epoch": 14} {"train_loss": -4.414633750915527, "global_step": 2359, "epoch": 14} {"train_loss": -4.262049674987793, "global_step": 2360, "epoch": 14} {"train_loss": -4.333505153656006, "global_step": 2361, "epoch": 14} {"train_loss": -4.306186676025391, "global_step": 2362, "epoch": 14} {"train_loss": -4.281063079833984, "global_step": 2363, "epoch": 14} {"train_loss": -4.331300735473633, "global_step": 2364, "epoch": 14} {"train_loss": -4.397115230560303, "global_step": 2365, "epoch": 14} {"train_loss": -4.38680362701416, "global_step": 2366, "epoch": 14} {"train_loss": -4.016755104064941, "global_step": 2367, "epoch": 14} {"train_loss": -4.5906219482421875, "global_step": 2368, "epoch": 14} {"train_loss": -4.184639930725098, "global_step": 2369, "epoch": 14} {"train_loss": -4.270667552947998, "global_step": 2370, "epoch": 14} {"train_loss": -4.335441589355469, "global_step": 2371, "epoch": 14} {"train_loss": -4.383812427520752, "global_step": 2372, "epoch": 14} {"train_loss": -4.1859025955200195, "global_step": 2373, "epoch": 14} {"train_loss": -4.027657508850098, "global_step": 2374, "epoch": 14} {"train_loss": -4.112617015838623, "global_step": 2375, "epoch": 14} {"train_loss": -4.399836540222168, "global_step": 2376, "epoch": 14} {"train_loss": -4.041875839233398, "global_step": 2377, "epoch": 14} {"train_loss": -3.7666525840759277, "global_step": 2378, "epoch": 14} {"train_loss": -4.268486499786377, "global_step": 2379, "epoch": 14} {"train_loss": -4.147111892700195, "global_step": 2380, "epoch": 14} {"train_loss": -3.5675904750823975, "global_step": 2381, "epoch": 14} {"train_loss": -4.16514778137207, "global_step": 2382, "epoch": 14} {"train_loss": -4.112743377685547, "global_step": 2383, "epoch": 14} {"train_loss": -4.264642715454102, "global_step": 2384, "epoch": 14} {"train_loss": -4.216953754425049, "global_step": 2385, "epoch": 14} {"train_loss": -4.007375717163086, "global_step": 2386, "epoch": 14} {"train_loss": -4.242607116699219, "global_step": 2387, "epoch": 14} {"train_loss": -4.072366714477539, "global_step": 2388, "epoch": 14} {"train_loss": -4.311248779296875, "global_step": 2389, "epoch": 14} {"train_loss": -4.269723892211914, "global_step": 2390, "epoch": 14} {"train_loss": -4.142852783203125, "global_step": 2391, "epoch": 14} {"train_loss": -4.445510387420654, "global_step": 2392, "epoch": 14} {"train_loss": -4.275078773498535, "global_step": 2393, "epoch": 14} {"train_loss": -4.3611955642700195, "global_step": 2394, "epoch": 14} {"train_loss": -4.367170333862305, "global_step": 2395, "epoch": 14} {"train_loss": -4.675009250640869, "global_step": 2396, "epoch": 14} {"train_loss": -4.093142509460449, "global_step": 2397, "epoch": 14} {"train_loss": -4.557460784912109, "global_step": 2398, "epoch": 14} {"train_loss": -4.151003837585449, "global_step": 2399, "epoch": 14} {"train_loss": -4.063860893249512, "global_step": 2400, "epoch": 14} {"train_loss": -4.18752384185791, "global_step": 2401, "epoch": 14} {"train_loss": -4.285465240478516, "global_step": 2402, "epoch": 14} {"train_loss": -4.513172149658203, "global_step": 2403, "epoch": 14} {"train_loss": -4.355216026306152, "global_step": 2404, "epoch": 14} {"train_loss": -4.476490020751953, "global_step": 2405, "epoch": 14} {"train_loss": -4.271157264709473, "global_step": 2406, "epoch": 14} {"train_loss": -4.003872871398926, "global_step": 2407, "epoch": 14} {"train_loss": -4.327754974365234, "global_step": 2408, "epoch": 14} {"train_loss": -4.483221054077148, "global_step": 2409, "epoch": 14} {"train_loss": -4.154201507568359, "global_step": 2410, "epoch": 14} {"train_loss": -4.154709815979004, "global_step": 2411, "epoch": 14} {"train_loss": -4.163719177246094, "global_step": 2412, "epoch": 14} {"train_loss": -4.326526641845703, "global_step": 2413, "epoch": 14} {"train_loss": -4.187936782836914, "global_step": 2414, "epoch": 14} {"train_loss": -4.199429512023926, "global_step": 2415, "epoch": 14} {"train_loss": -4.242245197296143, "global_step": 2416, "epoch": 14} {"train_loss": -4.071681976318359, "global_step": 2417, "epoch": 14} {"train_loss": -4.444255828857422, "global_step": 2418, "epoch": 14} {"train_loss": -4.307924747467041, "global_step": 2419, "epoch": 14} {"train_loss": -4.200172424316406, "global_step": 2420, "epoch": 14} {"train_loss": -4.21899938583374, "global_step": 2421, "epoch": 14} {"train_loss": -4.142996311187744, "global_step": 2422, "epoch": 14} {"train_loss": -4.419268608093262, "global_step": 2423, "epoch": 14} {"train_loss": -3.9412198066711426, "global_step": 2424, "epoch": 14} {"train_loss": -4.4571099281311035, "global_step": 2425, "epoch": 14} {"train_loss": -4.146084308624268, "global_step": 2426, "epoch": 14} {"train_loss": -4.074594497680664, "global_step": 2427, "epoch": 14} {"train_loss": -4.623453617095947, "global_step": 2428, "epoch": 14} {"train_loss": -4.266070365905762, "global_step": 2429, "epoch": 14} {"train_loss": -4.256824493408203, "global_step": 2430, "epoch": 14} {"train_loss": -4.118668556213379, "global_step": 2431, "epoch": 14} {"train_loss": -4.276072025299072, "global_step": 2432, "epoch": 14} {"train_loss": -4.221896648406982, "global_step": 2433, "epoch": 14} {"train_loss": -4.380025863647461, "global_step": 2434, "epoch": 14} {"train_loss": -4.505256652832031, "global_step": 2435, "epoch": 14} {"train_loss": -4.254858016967773, "global_step": 2436, "epoch": 14} {"train_loss": -4.309200286865234, "global_step": 2437, "epoch": 14} {"train_loss": -4.481884956359863, "global_step": 2438, "epoch": 14} {"train_loss": -4.056947708129883, "global_step": 2439, "epoch": 14} {"train_loss": -4.18317985534668, "global_step": 2440, "epoch": 14} {"train_loss": -4.185523986816406, "global_step": 2441, "epoch": 14} {"train_loss": -4.224082946777344, "global_step": 2442, "epoch": 14} {"train_loss": -4.498254299163818, "global_step": 2443, "epoch": 14} {"train_loss": -4.126918792724609, "global_step": 2444, "epoch": 14} {"train_loss": -4.586977481842041, "global_step": 2445, "epoch": 14} {"train_loss": -4.049422264099121, "global_step": 2446, "epoch": 14} {"train_loss": -4.065027236938477, "global_step": 2447, "epoch": 14} {"train_loss": -4.005024433135986, "global_step": 2448, "epoch": 14} {"train_loss": -4.247261047363281, "global_step": 2449, "epoch": 14} {"train_loss": -4.521691799163818, "global_step": 2450, "epoch": 14} {"train_loss": -3.9910459518432617, "global_step": 2451, "epoch": 14} {"train_loss": -4.396353244781494, "global_step": 2452, "epoch": 14} {"train_loss": -4.22711706161499, "global_step": 2453, "epoch": 14} {"train_loss": -4.201055526733398, "global_step": 2454, "epoch": 14} {"train_loss": -4.345840930938721, "global_step": 2455, "epoch": 14} {"train_loss": -4.2553205490112305, "global_step": 2456, "epoch": 14} {"train_loss": -4.4201884269714355, "global_step": 2457, "epoch": 14} {"train_loss": -4.386892318725586, "global_step": 2458, "epoch": 14} {"train_loss": -4.452005386352539, "global_step": 2459, "epoch": 14} {"train_loss": -4.380827903747559, "global_step": 2460, "epoch": 14} {"train_loss": -4.617512226104736, "global_step": 2461, "epoch": 14} {"train_loss": -4.230280876159668, "global_step": 2462, "epoch": 14} {"train_loss": -4.408239841461182, "global_step": 2463, "epoch": 14} {"train_loss": -4.437955379486084, "global_step": 2464, "epoch": 14} {"train_loss": -4.240748405456543, "global_step": 2465, "epoch": 14} {"train_loss": -4.48630428314209, "global_step": 2466, "epoch": 14} {"train_loss": -4.323582649230957, "global_step": 2467, "epoch": 14} {"train_loss": -4.125330924987793, "global_step": 2468, "epoch": 14} {"train_loss": -4.128464698791504, "global_step": 2469, "epoch": 14} {"train_loss": -4.442557334899902, "global_step": 2470, "epoch": 14} {"train_loss": -4.405771255493164, "global_step": 2471, "epoch": 14} {"train_loss": -4.2978596687316895, "global_step": 2472, "epoch": 14} {"train_loss": -4.583899021148682, "global_step": 2473, "epoch": 14} {"train_loss": -4.521421432495117, "global_step": 2474, "epoch": 14} {"train_loss": -4.236032009124756, "global_step": 2475, "epoch": 14} {"train_loss": -4.395251274108887, "global_step": 2476, "epoch": 14} {"train_loss": -4.301912307739258, "global_step": 2477, "epoch": 14} {"train_loss": -4.567963123321533, "global_step": 2478, "epoch": 14} {"train_loss": -4.421619892120361, "global_step": 2479, "epoch": 14} {"train_loss": -4.550609111785889, "global_step": 2480, "epoch": 14} {"train_loss": -4.545297622680664, "global_step": 2481, "epoch": 14} {"train_loss": -4.128163814544678, "global_step": 2482, "epoch": 14} {"train_loss": -4.195185661315918, "global_step": 2483, "epoch": 14} {"train_loss": -4.163146018981934, "global_step": 2484, "epoch": 14} {"train_loss": -4.173621654510498, "global_step": 2485, "epoch": 14} {"train_loss": -4.417514801025391, "global_step": 2486, "epoch": 14} {"train_loss": -4.352999687194824, "global_step": 2487, "epoch": 14} {"train_loss": -4.376091957092285, "global_step": 2488, "epoch": 14} {"train_loss": -4.021399974822998, "global_step": 2489, "epoch": 14} {"train_loss": -4.287129878997803, "global_step": 2490, "epoch": 14} {"train_loss": -4.266476154327393, "global_step": 2491, "epoch": 14} {"train_loss": -4.181878566741943, "global_step": 2492, "epoch": 14} {"train_loss": -4.325202465057373, "global_step": 2493, "epoch": 14} {"train_loss": -4.322131633758545, "global_step": 2494, "epoch": 14} {"train_loss": -4.258980751037598, "global_step": 2495, "epoch": 14} {"train_loss": -4.300610542297363, "global_step": 2496, "epoch": 14} {"train_loss": -4.275957107543945, "global_step": 2497, "epoch": 14} {"train_loss": -4.384763717651367, "global_step": 2498, "epoch": 14} {"train_loss": -4.497061729431152, "global_step": 2499, "epoch": 14} {"train_loss": -4.173750877380371, "global_step": 2500, "epoch": 14} {"train_loss": -4.253355979919434, "global_step": 2501, "epoch": 14} {"train_loss": -4.117956638336182, "global_step": 2502, "epoch": 14} {"train_loss": -4.630826950073242, "global_step": 2503, "epoch": 14} {"train_loss": -4.324596881866455, "global_step": 2504, "epoch": 14} {"train_loss": -4.293790817260742, "global_step": 2505, "epoch": 14} {"train_loss": -4.481855392456055, "global_step": 2506, "epoch": 14} {"train_loss": -4.54798698425293, "global_step": 2507, "epoch": 14} {"train_loss": -4.437901496887207, "global_step": 2508, "epoch": 14} {"train_loss": -4.427317142486572, "global_step": 2509, "epoch": 14} {"train_loss": -4.241605281829834, "global_step": 2510, "epoch": 14} {"train_loss": -4.364554405212402, "global_step": 2511, "epoch": 14} {"train_loss": -4.284031867980957, "global_step": 2512, "epoch": 14} {"train_loss": -4.370955944061279, "global_step": 2513, "epoch": 14} {"train_loss": -4.194436550140381, "global_step": 2514, "epoch": 14} {"train_loss": -4.408631324768066, "global_step": 2515, "epoch": 14} {"train_loss": -4.3791279792785645, "global_step": 2516, "epoch": 14} {"train_loss": -4.268064498901367, "global_step": 2517, "epoch": 14} {"train_loss": -4.425804615020752, "global_step": 2518, "epoch": 14} {"train_loss": -4.281475660346803, "global_step": 2519, "epoch": 14, "val_loss": 243176.90625} {"train_loss": -4.51182746887207, "global_step": 2520, "epoch": 15} {"train_loss": -4.211832046508789, "global_step": 2521, "epoch": 15} {"train_loss": -4.556320667266846, "global_step": 2522, "epoch": 15} {"train_loss": -4.50227165222168, "global_step": 2523, "epoch": 15} {"train_loss": -4.3485188484191895, "global_step": 2524, "epoch": 15} {"train_loss": -3.9297642707824707, "global_step": 2525, "epoch": 15} {"train_loss": -4.4027299880981445, "global_step": 2526, "epoch": 15} {"train_loss": -3.995135545730591, "global_step": 2527, "epoch": 15} {"train_loss": -4.061588287353516, "global_step": 2528, "epoch": 15} {"train_loss": -4.162204742431641, "global_step": 2529, "epoch": 15} {"train_loss": -4.3397722244262695, "global_step": 2530, "epoch": 15} {"train_loss": -4.38984489440918, "global_step": 2531, "epoch": 15} {"train_loss": -4.19028377532959, "global_step": 2532, "epoch": 15} {"train_loss": -4.3393707275390625, "global_step": 2533, "epoch": 15} {"train_loss": -3.8914787769317627, "global_step": 2534, "epoch": 15} {"train_loss": -4.0168657302856445, "global_step": 2535, "epoch": 15} {"train_loss": -4.025854110717773, "global_step": 2536, "epoch": 15} {"train_loss": -4.341557025909424, "global_step": 2537, "epoch": 15} {"train_loss": -4.196345329284668, "global_step": 2538, "epoch": 15} {"train_loss": -4.11004638671875, "global_step": 2539, "epoch": 15} {"train_loss": -3.80670166015625, "global_step": 2540, "epoch": 15} {"train_loss": -4.188011169433594, "global_step": 2541, "epoch": 15} {"train_loss": -4.287618637084961, "global_step": 2542, "epoch": 15} {"train_loss": -3.8549375534057617, "global_step": 2543, "epoch": 15} {"train_loss": -4.226889610290527, "global_step": 2544, "epoch": 15} {"train_loss": -4.1750640869140625, "global_step": 2545, "epoch": 15} {"train_loss": -4.099573135375977, "global_step": 2546, "epoch": 15} {"train_loss": -4.171835899353027, "global_step": 2547, "epoch": 15} {"train_loss": -4.0963592529296875, "global_step": 2548, "epoch": 15} {"train_loss": -3.7296619415283203, "global_step": 2549, "epoch": 15} {"train_loss": -4.206275463104248, "global_step": 2550, "epoch": 15} {"train_loss": -4.227357864379883, "global_step": 2551, "epoch": 15} {"train_loss": -4.203746318817139, "global_step": 2552, "epoch": 15} {"train_loss": -4.476858139038086, "global_step": 2553, "epoch": 15} {"train_loss": -4.239057540893555, "global_step": 2554, "epoch": 15} {"train_loss": -4.270323753356934, "global_step": 2555, "epoch": 15} {"train_loss": -4.387277603149414, "global_step": 2556, "epoch": 15} {"train_loss": -4.211944580078125, "global_step": 2557, "epoch": 15} {"train_loss": -4.300753593444824, "global_step": 2558, "epoch": 15} {"train_loss": -3.9762015342712402, "global_step": 2559, "epoch": 15} {"train_loss": -4.156436920166016, "global_step": 2560, "epoch": 15} {"train_loss": -4.258993148803711, "global_step": 2561, "epoch": 15} {"train_loss": -4.174302101135254, "global_step": 2562, "epoch": 15} {"train_loss": -4.213677883148193, "global_step": 2563, "epoch": 15} {"train_loss": -4.287492752075195, "global_step": 2564, "epoch": 15} {"train_loss": -4.231505393981934, "global_step": 2565, "epoch": 15} {"train_loss": -4.622641563415527, "global_step": 2566, "epoch": 15} {"train_loss": -4.407180309295654, "global_step": 2567, "epoch": 15} {"train_loss": -4.156238079071045, "global_step": 2568, "epoch": 15} {"train_loss": -4.432767868041992, "global_step": 2569, "epoch": 15} {"train_loss": -4.564348220825195, "global_step": 2570, "epoch": 15} {"train_loss": -4.51901388168335, "global_step": 2571, "epoch": 15} {"train_loss": -4.810464859008789, "global_step": 2572, "epoch": 15} {"train_loss": -4.12246561050415, "global_step": 2573, "epoch": 15} {"train_loss": -4.367925643920898, "global_step": 2574, "epoch": 15} {"train_loss": -4.087240219116211, "global_step": 2575, "epoch": 15} {"train_loss": -4.074409484863281, "global_step": 2576, "epoch": 15} {"train_loss": -4.166851043701172, "global_step": 2577, "epoch": 15} {"train_loss": -4.316273212432861, "global_step": 2578, "epoch": 15} {"train_loss": -4.446036338806152, "global_step": 2579, "epoch": 15} {"train_loss": -4.678617477416992, "global_step": 2580, "epoch": 15} {"train_loss": -4.246767997741699, "global_step": 2581, "epoch": 15} {"train_loss": -4.331655502319336, "global_step": 2582, "epoch": 15} {"train_loss": -4.543656349182129, "global_step": 2583, "epoch": 15} {"train_loss": -4.303814888000488, "global_step": 2584, "epoch": 15} {"train_loss": -4.094839096069336, "global_step": 2585, "epoch": 15} {"train_loss": -4.243383407592773, "global_step": 2586, "epoch": 15} {"train_loss": -4.199782371520996, "global_step": 2587, "epoch": 15} {"train_loss": -4.004629135131836, "global_step": 2588, "epoch": 15} {"train_loss": -3.9765779972076416, "global_step": 2589, "epoch": 15} {"train_loss": -4.0679168701171875, "global_step": 2590, "epoch": 15} {"train_loss": -4.3300886154174805, "global_step": 2591, "epoch": 15} {"train_loss": -4.391230583190918, "global_step": 2592, "epoch": 15} {"train_loss": -3.9995779991149902, "global_step": 2593, "epoch": 15} {"train_loss": -4.457583427429199, "global_step": 2594, "epoch": 15} {"train_loss": -4.214679718017578, "global_step": 2595, "epoch": 15} {"train_loss": -4.6537885665893555, "global_step": 2596, "epoch": 15} {"train_loss": -4.3185133934021, "global_step": 2597, "epoch": 15} {"train_loss": -4.505788803100586, "global_step": 2598, "epoch": 15} {"train_loss": -4.3525285720825195, "global_step": 2599, "epoch": 15} {"train_loss": -4.419958591461182, "global_step": 2600, "epoch": 15} {"train_loss": -4.268359661102295, "global_step": 2601, "epoch": 15} {"train_loss": -4.421361923217773, "global_step": 2602, "epoch": 15} {"train_loss": -4.231666564941406, "global_step": 2603, "epoch": 15} {"train_loss": -4.555174827575684, "global_step": 2604, "epoch": 15} {"train_loss": -4.538518905639648, "global_step": 2605, "epoch": 15} {"train_loss": -4.38877010345459, "global_step": 2606, "epoch": 15} {"train_loss": -4.213556289672852, "global_step": 2607, "epoch": 15} {"train_loss": -4.5947771072387695, "global_step": 2608, "epoch": 15} {"train_loss": -4.311751365661621, "global_step": 2609, "epoch": 15} {"train_loss": -4.325037956237793, "global_step": 2610, "epoch": 15} {"train_loss": -4.270750045776367, "global_step": 2611, "epoch": 15} {"train_loss": -4.318119049072266, "global_step": 2612, "epoch": 15} {"train_loss": -4.276427268981934, "global_step": 2613, "epoch": 15} {"train_loss": -4.250707626342773, "global_step": 2614, "epoch": 15} {"train_loss": -4.3493499755859375, "global_step": 2615, "epoch": 15} {"train_loss": -4.381612777709961, "global_step": 2616, "epoch": 15} {"train_loss": -4.245160102844238, "global_step": 2617, "epoch": 15} {"train_loss": -4.55335807800293, "global_step": 2618, "epoch": 15} {"train_loss": -3.9098949432373047, "global_step": 2619, "epoch": 15} {"train_loss": -4.437851905822754, "global_step": 2620, "epoch": 15} {"train_loss": -4.043299674987793, "global_step": 2621, "epoch": 15} {"train_loss": -4.424596786499023, "global_step": 2622, "epoch": 15} {"train_loss": -4.264798164367676, "global_step": 2623, "epoch": 15} {"train_loss": -4.426961421966553, "global_step": 2624, "epoch": 15} {"train_loss": -4.437068939208984, "global_step": 2625, "epoch": 15} {"train_loss": -4.233716011047363, "global_step": 2626, "epoch": 15} {"train_loss": -4.33290958404541, "global_step": 2627, "epoch": 15} {"train_loss": -4.446774482727051, "global_step": 2628, "epoch": 15} {"train_loss": -4.326654434204102, "global_step": 2629, "epoch": 15} {"train_loss": -4.557759761810303, "global_step": 2630, "epoch": 15} {"train_loss": -3.888967514038086, "global_step": 2631, "epoch": 15} {"train_loss": -4.125022888183594, "global_step": 2632, "epoch": 15} {"train_loss": -4.265249252319336, "global_step": 2633, "epoch": 15} {"train_loss": -4.551505088806152, "global_step": 2634, "epoch": 15} {"train_loss": -4.254302501678467, "global_step": 2635, "epoch": 15} {"train_loss": -4.236949920654297, "global_step": 2636, "epoch": 15} {"train_loss": -4.437352180480957, "global_step": 2637, "epoch": 15} {"train_loss": -4.300815105438232, "global_step": 2638, "epoch": 15} {"train_loss": -4.253286838531494, "global_step": 2639, "epoch": 15} {"train_loss": -4.140926837921143, "global_step": 2640, "epoch": 15} {"train_loss": -4.539838790893555, "global_step": 2641, "epoch": 15} {"train_loss": -4.168107032775879, "global_step": 2642, "epoch": 15} {"train_loss": -4.141722679138184, "global_step": 2643, "epoch": 15} {"train_loss": -4.4302167892456055, "global_step": 2644, "epoch": 15} {"train_loss": -4.473542213439941, "global_step": 2645, "epoch": 15} {"train_loss": -4.404294490814209, "global_step": 2646, "epoch": 15} {"train_loss": -4.2271199226379395, "global_step": 2647, "epoch": 15} {"train_loss": -4.406664848327637, "global_step": 2648, "epoch": 15} {"train_loss": -4.203728675842285, "global_step": 2649, "epoch": 15} {"train_loss": -4.319178104400635, "global_step": 2650, "epoch": 15} {"train_loss": -4.318349361419678, "global_step": 2651, "epoch": 15} {"train_loss": -4.561799049377441, "global_step": 2652, "epoch": 15} {"train_loss": -4.3426408767700195, "global_step": 2653, "epoch": 15} {"train_loss": -4.371198654174805, "global_step": 2654, "epoch": 15} {"train_loss": -4.4719953536987305, "global_step": 2655, "epoch": 15} {"train_loss": -4.303765296936035, "global_step": 2656, "epoch": 15} {"train_loss": -4.416398048400879, "global_step": 2657, "epoch": 15} {"train_loss": -4.135256767272949, "global_step": 2658, "epoch": 15} {"train_loss": -4.322097301483154, "global_step": 2659, "epoch": 15} {"train_loss": -4.29862117767334, "global_step": 2660, "epoch": 15} {"train_loss": -4.220178604125977, "global_step": 2661, "epoch": 15} {"train_loss": -4.356773376464844, "global_step": 2662, "epoch": 15} {"train_loss": -4.212976932525635, "global_step": 2663, "epoch": 15} {"train_loss": -3.94167423248291, "global_step": 2664, "epoch": 15} {"train_loss": -4.429498195648193, "global_step": 2665, "epoch": 15} {"train_loss": -4.348912715911865, "global_step": 2666, "epoch": 15} {"train_loss": -4.2454376220703125, "global_step": 2667, "epoch": 15} {"train_loss": -4.455744743347168, "global_step": 2668, "epoch": 15} {"train_loss": -4.390341758728027, "global_step": 2669, "epoch": 15} {"train_loss": -4.508594512939453, "global_step": 2670, "epoch": 15} {"train_loss": -4.452933311462402, "global_step": 2671, "epoch": 15} {"train_loss": -4.462437152862549, "global_step": 2672, "epoch": 15} {"train_loss": -4.492478847503662, "global_step": 2673, "epoch": 15} {"train_loss": -4.514036178588867, "global_step": 2674, "epoch": 15} {"train_loss": -4.2812700271606445, "global_step": 2675, "epoch": 15} {"train_loss": -4.416997909545898, "global_step": 2676, "epoch": 15} {"train_loss": -4.386036396026611, "global_step": 2677, "epoch": 15} {"train_loss": -4.449960708618164, "global_step": 2678, "epoch": 15} {"train_loss": -4.382081985473633, "global_step": 2679, "epoch": 15} {"train_loss": -4.258291721343994, "global_step": 2680, "epoch": 15} {"train_loss": -4.535799980163574, "global_step": 2681, "epoch": 15} {"train_loss": -4.533661842346191, "global_step": 2682, "epoch": 15} {"train_loss": -4.521286487579346, "global_step": 2683, "epoch": 15} {"train_loss": -4.257668495178223, "global_step": 2684, "epoch": 15} {"train_loss": -4.440241813659668, "global_step": 2685, "epoch": 15} {"train_loss": -4.287567138671875, "global_step": 2686, "epoch": 15} {"train_loss": -4.300731521277201, "global_step": 2687, "epoch": 15, "val_loss": 261337.96875, "train_action_mse_error": 103.1139907836914} {"train_loss": -4.3781962394714355, "global_step": 2688, "epoch": 16} {"train_loss": -4.126269340515137, "global_step": 2689, "epoch": 16} {"train_loss": -4.543447017669678, "global_step": 2690, "epoch": 16} {"train_loss": -4.345807075500488, "global_step": 2691, "epoch": 16} {"train_loss": -4.2995405197143555, "global_step": 2692, "epoch": 16} {"train_loss": -4.188053131103516, "global_step": 2693, "epoch": 16} {"train_loss": -4.445950508117676, "global_step": 2694, "epoch": 16} {"train_loss": -3.8501806259155273, "global_step": 2695, "epoch": 16} {"train_loss": -4.19228458404541, "global_step": 2696, "epoch": 16} {"train_loss": -4.3641862869262695, "global_step": 2697, "epoch": 16} {"train_loss": -4.161861419677734, "global_step": 2698, "epoch": 16} {"train_loss": -4.151289939880371, "global_step": 2699, "epoch": 16} {"train_loss": -4.4393839836120605, "global_step": 2700, "epoch": 16} {"train_loss": -4.676335334777832, "global_step": 2701, "epoch": 16} {"train_loss": -4.225545883178711, "global_step": 2702, "epoch": 16} {"train_loss": -4.544458389282227, "global_step": 2703, "epoch": 16} {"train_loss": -4.30071496963501, "global_step": 2704, "epoch": 16} {"train_loss": -4.424912452697754, "global_step": 2705, "epoch": 16} {"train_loss": -4.28077507019043, "global_step": 2706, "epoch": 16} {"train_loss": -4.381644248962402, "global_step": 2707, "epoch": 16} {"train_loss": -4.089731216430664, "global_step": 2708, "epoch": 16} {"train_loss": -4.341691970825195, "global_step": 2709, "epoch": 16} {"train_loss": -4.389915466308594, "global_step": 2710, "epoch": 16} {"train_loss": -4.245638847351074, "global_step": 2711, "epoch": 16} {"train_loss": -4.590841293334961, "global_step": 2712, "epoch": 16} {"train_loss": -4.38746976852417, "global_step": 2713, "epoch": 16} {"train_loss": -4.3772735595703125, "global_step": 2714, "epoch": 16} {"train_loss": -4.040035247802734, "global_step": 2715, "epoch": 16} {"train_loss": -4.180809020996094, "global_step": 2716, "epoch": 16} {"train_loss": -4.426772594451904, "global_step": 2717, "epoch": 16} {"train_loss": -4.259079456329346, "global_step": 2718, "epoch": 16} {"train_loss": -4.33509635925293, "global_step": 2719, "epoch": 16} {"train_loss": -4.531803131103516, "global_step": 2720, "epoch": 16} {"train_loss": -4.334742546081543, "global_step": 2721, "epoch": 16} {"train_loss": -4.446144104003906, "global_step": 2722, "epoch": 16} {"train_loss": -4.166618347167969, "global_step": 2723, "epoch": 16} {"train_loss": -4.190356254577637, "global_step": 2724, "epoch": 16} {"train_loss": -3.9420347213745117, "global_step": 2725, "epoch": 16} {"train_loss": -4.282961845397949, "global_step": 2726, "epoch": 16} {"train_loss": -3.9579660892486572, "global_step": 2727, "epoch": 16} {"train_loss": -3.8943910598754883, "global_step": 2728, "epoch": 16} {"train_loss": -4.125818252563477, "global_step": 2729, "epoch": 16} {"train_loss": -3.901517391204834, "global_step": 2730, "epoch": 16} {"train_loss": -4.225506782531738, "global_step": 2731, "epoch": 16} {"train_loss": -4.298519134521484, "global_step": 2732, "epoch": 16} {"train_loss": -4.361745357513428, "global_step": 2733, "epoch": 16} {"train_loss": -4.422496795654297, "global_step": 2734, "epoch": 16} {"train_loss": -4.04226016998291, "global_step": 2735, "epoch": 16} {"train_loss": -4.287498950958252, "global_step": 2736, "epoch": 16} {"train_loss": -4.473060607910156, "global_step": 2737, "epoch": 16} {"train_loss": -4.421303749084473, "global_step": 2738, "epoch": 16} {"train_loss": -4.432700157165527, "global_step": 2739, "epoch": 16} {"train_loss": -4.179027557373047, "global_step": 2740, "epoch": 16} {"train_loss": -4.569012641906738, "global_step": 2741, "epoch": 16} {"train_loss": -4.197548866271973, "global_step": 2742, "epoch": 16} {"train_loss": -4.287783145904541, "global_step": 2743, "epoch": 16} {"train_loss": -4.338849067687988, "global_step": 2744, "epoch": 16} {"train_loss": -4.496732234954834, "global_step": 2745, "epoch": 16} {"train_loss": -4.512823104858398, "global_step": 2746, "epoch": 16} {"train_loss": -4.379756927490234, "global_step": 2747, "epoch": 16} {"train_loss": -4.18368673324585, "global_step": 2748, "epoch": 16} {"train_loss": -4.251718521118164, "global_step": 2749, "epoch": 16} {"train_loss": -4.46066427230835, "global_step": 2750, "epoch": 16} {"train_loss": -4.722142219543457, "global_step": 2751, "epoch": 16} {"train_loss": -4.2617387771606445, "global_step": 2752, "epoch": 16} {"train_loss": -4.348967552185059, "global_step": 2753, "epoch": 16} {"train_loss": -4.319533348083496, "global_step": 2754, "epoch": 16} {"train_loss": -4.45816707611084, "global_step": 2755, "epoch": 16} {"train_loss": -4.520163536071777, "global_step": 2756, "epoch": 16} {"train_loss": -4.347297668457031, "global_step": 2757, "epoch": 16} {"train_loss": -4.571111679077148, "global_step": 2758, "epoch": 16} {"train_loss": -3.9530558586120605, "global_step": 2759, "epoch": 16} {"train_loss": -4.459108352661133, "global_step": 2760, "epoch": 16} {"train_loss": -4.102524757385254, "global_step": 2761, "epoch": 16} {"train_loss": -4.45530891418457, "global_step": 2762, "epoch": 16} {"train_loss": -4.442663192749023, "global_step": 2763, "epoch": 16} {"train_loss": -4.4085588455200195, "global_step": 2764, "epoch": 16} {"train_loss": -4.312373638153076, "global_step": 2765, "epoch": 16} {"train_loss": -4.443033695220947, "global_step": 2766, "epoch": 16} {"train_loss": -4.196584701538086, "global_step": 2767, "epoch": 16} {"train_loss": -4.18087100982666, "global_step": 2768, "epoch": 16} {"train_loss": -4.580526828765869, "global_step": 2769, "epoch": 16} {"train_loss": -4.361833095550537, "global_step": 2770, "epoch": 16} {"train_loss": -4.3053083419799805, "global_step": 2771, "epoch": 16} {"train_loss": -4.528133392333984, "global_step": 2772, "epoch": 16} {"train_loss": -4.171025276184082, "global_step": 2773, "epoch": 16} {"train_loss": -4.472560405731201, "global_step": 2774, "epoch": 16} {"train_loss": -4.319821834564209, "global_step": 2775, "epoch": 16} {"train_loss": -4.554821014404297, "global_step": 2776, "epoch": 16} {"train_loss": -4.180863857269287, "global_step": 2777, "epoch": 16} {"train_loss": -4.296726226806641, "global_step": 2778, "epoch": 16} {"train_loss": -4.492376327514648, "global_step": 2779, "epoch": 16} {"train_loss": -4.506109237670898, "global_step": 2780, "epoch": 16} {"train_loss": -4.345669746398926, "global_step": 2781, "epoch": 16} {"train_loss": -4.37738037109375, "global_step": 2782, "epoch": 16} {"train_loss": -4.256106376647949, "global_step": 2783, "epoch": 16} {"train_loss": -4.242866516113281, "global_step": 2784, "epoch": 16} {"train_loss": -4.291624069213867, "global_step": 2785, "epoch": 16} {"train_loss": -4.21781587600708, "global_step": 2786, "epoch": 16} {"train_loss": -4.021886825561523, "global_step": 2787, "epoch": 16} {"train_loss": -4.6676859855651855, "global_step": 2788, "epoch": 16} {"train_loss": -4.263871192932129, "global_step": 2789, "epoch": 16} {"train_loss": -4.452005863189697, "global_step": 2790, "epoch": 16} {"train_loss": -4.308338642120361, "global_step": 2791, "epoch": 16} {"train_loss": -4.568123817443848, "global_step": 2792, "epoch": 16} {"train_loss": -4.679256439208984, "global_step": 2793, "epoch": 16} {"train_loss": -4.367191791534424, "global_step": 2794, "epoch": 16} {"train_loss": -4.653304576873779, "global_step": 2795, "epoch": 16} {"train_loss": -4.506375312805176, "global_step": 2796, "epoch": 16} {"train_loss": -4.4279584884643555, "global_step": 2797, "epoch": 16} {"train_loss": -4.486900329589844, "global_step": 2798, "epoch": 16} {"train_loss": -4.498804092407227, "global_step": 2799, "epoch": 16} {"train_loss": -4.11099910736084, "global_step": 2800, "epoch": 16} {"train_loss": -4.521004676818848, "global_step": 2801, "epoch": 16} {"train_loss": -4.257718086242676, "global_step": 2802, "epoch": 16} {"train_loss": -4.39957332611084, "global_step": 2803, "epoch": 16} {"train_loss": -4.2260050773620605, "global_step": 2804, "epoch": 16} {"train_loss": -4.491839408874512, "global_step": 2805, "epoch": 16} {"train_loss": -4.32071590423584, "global_step": 2806, "epoch": 16} {"train_loss": -4.463201522827148, "global_step": 2807, "epoch": 16} {"train_loss": -4.262413501739502, "global_step": 2808, "epoch": 16} {"train_loss": -4.260611534118652, "global_step": 2809, "epoch": 16} {"train_loss": -4.278558731079102, "global_step": 2810, "epoch": 16} {"train_loss": -4.331340789794922, "global_step": 2811, "epoch": 16} {"train_loss": -4.411015033721924, "global_step": 2812, "epoch": 16} {"train_loss": -4.45628547668457, "global_step": 2813, "epoch": 16} {"train_loss": -4.300318717956543, "global_step": 2814, "epoch": 16} {"train_loss": -4.288482666015625, "global_step": 2815, "epoch": 16} {"train_loss": -4.315153121948242, "global_step": 2816, "epoch": 16} {"train_loss": -4.196569442749023, "global_step": 2817, "epoch": 16} {"train_loss": -4.219353675842285, "global_step": 2818, "epoch": 16} {"train_loss": -4.126965522766113, "global_step": 2819, "epoch": 16} {"train_loss": -4.492002487182617, "global_step": 2820, "epoch": 16} {"train_loss": -4.371631622314453, "global_step": 2821, "epoch": 16} {"train_loss": -4.360811233520508, "global_step": 2822, "epoch": 16} {"train_loss": -4.159110069274902, "global_step": 2823, "epoch": 16} {"train_loss": -4.498358726501465, "global_step": 2824, "epoch": 16} {"train_loss": -4.535816192626953, "global_step": 2825, "epoch": 16} {"train_loss": -4.663616180419922, "global_step": 2826, "epoch": 16} {"train_loss": -4.514723300933838, "global_step": 2827, "epoch": 16} {"train_loss": -4.456447601318359, "global_step": 2828, "epoch": 16} {"train_loss": -4.253052711486816, "global_step": 2829, "epoch": 16} {"train_loss": -4.390946388244629, "global_step": 2830, "epoch": 16} {"train_loss": -4.213584899902344, "global_step": 2831, "epoch": 16} {"train_loss": -4.526874542236328, "global_step": 2832, "epoch": 16} {"train_loss": -4.119675159454346, "global_step": 2833, "epoch": 16} {"train_loss": -4.637502193450928, "global_step": 2834, "epoch": 16} {"train_loss": -4.850825309753418, "global_step": 2835, "epoch": 16} {"train_loss": -4.394315719604492, "global_step": 2836, "epoch": 16} {"train_loss": -4.474007606506348, "global_step": 2837, "epoch": 16} {"train_loss": -4.19728946685791, "global_step": 2838, "epoch": 16} {"train_loss": -4.084226608276367, "global_step": 2839, "epoch": 16} {"train_loss": -4.312616348266602, "global_step": 2840, "epoch": 16} {"train_loss": -4.4445481300354, "global_step": 2841, "epoch": 16} {"train_loss": -4.4392266273498535, "global_step": 2842, "epoch": 16} {"train_loss": -4.4367265701293945, "global_step": 2843, "epoch": 16} {"train_loss": -4.318647384643555, "global_step": 2844, "epoch": 16} {"train_loss": -4.403160095214844, "global_step": 2845, "epoch": 16} {"train_loss": -4.708935737609863, "global_step": 2846, "epoch": 16} {"train_loss": -4.504556179046631, "global_step": 2847, "epoch": 16} {"train_loss": -4.451664924621582, "global_step": 2848, "epoch": 16} {"train_loss": -4.178701400756836, "global_step": 2849, "epoch": 16} {"train_loss": -4.531245231628418, "global_step": 2850, "epoch": 16} {"train_loss": -4.618279933929443, "global_step": 2851, "epoch": 16} {"train_loss": -4.399815082550049, "global_step": 2852, "epoch": 16} {"train_loss": -4.552494525909424, "global_step": 2853, "epoch": 16} {"train_loss": -4.468571662902832, "global_step": 2854, "epoch": 16} {"train_loss": -4.353159485828309, "global_step": 2855, "epoch": 16, "val_loss": 266526.9375} {"train_loss": -4.545527458190918, "global_step": 2856, "epoch": 17} {"train_loss": -4.517428398132324, "global_step": 2857, "epoch": 17} {"train_loss": -4.572417259216309, "global_step": 2858, "epoch": 17} {"train_loss": -4.546172142028809, "global_step": 2859, "epoch": 17} {"train_loss": -4.173004150390625, "global_step": 2860, "epoch": 17} {"train_loss": -4.60839319229126, "global_step": 2861, "epoch": 17} {"train_loss": -4.04304838180542, "global_step": 2862, "epoch": 17} {"train_loss": -4.083540916442871, "global_step": 2863, "epoch": 17} {"train_loss": -4.250823497772217, "global_step": 2864, "epoch": 17} {"train_loss": -4.313362121582031, "global_step": 2865, "epoch": 17} {"train_loss": -4.401893615722656, "global_step": 2866, "epoch": 17} {"train_loss": -4.216095924377441, "global_step": 2867, "epoch": 17} {"train_loss": -4.51544189453125, "global_step": 2868, "epoch": 17} {"train_loss": -4.418912410736084, "global_step": 2869, "epoch": 17} {"train_loss": -4.419548034667969, "global_step": 2870, "epoch": 17} {"train_loss": -4.567753791809082, "global_step": 2871, "epoch": 17} {"train_loss": -4.205449104309082, "global_step": 2872, "epoch": 17} {"train_loss": -4.419569969177246, "global_step": 2873, "epoch": 17} {"train_loss": -4.558494567871094, "global_step": 2874, "epoch": 17} {"train_loss": -4.412432670593262, "global_step": 2875, "epoch": 17} {"train_loss": -4.626011371612549, "global_step": 2876, "epoch": 17} {"train_loss": -4.527860641479492, "global_step": 2877, "epoch": 17} {"train_loss": -4.6504807472229, "global_step": 2878, "epoch": 17} {"train_loss": -4.591847896575928, "global_step": 2879, "epoch": 17} {"train_loss": -4.535830020904541, "global_step": 2880, "epoch": 17} {"train_loss": -4.574624538421631, "global_step": 2881, "epoch": 17} {"train_loss": -4.415908336639404, "global_step": 2882, "epoch": 17} {"train_loss": -4.339799880981445, "global_step": 2883, "epoch": 17} {"train_loss": -4.141720771789551, "global_step": 2884, "epoch": 17} {"train_loss": -4.568660736083984, "global_step": 2885, "epoch": 17} {"train_loss": -4.572390556335449, "global_step": 2886, "epoch": 17} {"train_loss": -4.621987819671631, "global_step": 2887, "epoch": 17} {"train_loss": -4.41813325881958, "global_step": 2888, "epoch": 17} {"train_loss": -4.80274772644043, "global_step": 2889, "epoch": 17} {"train_loss": -4.65402889251709, "global_step": 2890, "epoch": 17} {"train_loss": -4.459401607513428, "global_step": 2891, "epoch": 17} {"train_loss": -4.772276878356934, "global_step": 2892, "epoch": 17} {"train_loss": -4.677279949188232, "global_step": 2893, "epoch": 17} {"train_loss": -4.517395973205566, "global_step": 2894, "epoch": 17} {"train_loss": -4.446927070617676, "global_step": 2895, "epoch": 17} {"train_loss": -4.618546485900879, "global_step": 2896, "epoch": 17} {"train_loss": -4.218924522399902, "global_step": 2897, "epoch": 17} {"train_loss": -4.218460559844971, "global_step": 2898, "epoch": 17} {"train_loss": -4.074477672576904, "global_step": 2899, "epoch": 17} {"train_loss": -4.447820663452148, "global_step": 2900, "epoch": 17} {"train_loss": -4.353677272796631, "global_step": 2901, "epoch": 17} {"train_loss": -4.337838649749756, "global_step": 2902, "epoch": 17} {"train_loss": -4.2961859703063965, "global_step": 2903, "epoch": 17} {"train_loss": -4.264342784881592, "global_step": 2904, "epoch": 17} {"train_loss": -4.138715744018555, "global_step": 2905, "epoch": 17} {"train_loss": -4.464059829711914, "global_step": 2906, "epoch": 17} {"train_loss": -4.285893440246582, "global_step": 2907, "epoch": 17} {"train_loss": -4.471705913543701, "global_step": 2908, "epoch": 17} {"train_loss": -4.397340774536133, "global_step": 2909, "epoch": 17} {"train_loss": -4.578341960906982, "global_step": 2910, "epoch": 17} {"train_loss": -4.234307765960693, "global_step": 2911, "epoch": 17} {"train_loss": -4.290109157562256, "global_step": 2912, "epoch": 17} {"train_loss": -4.846437454223633, "global_step": 2913, "epoch": 17} {"train_loss": -4.421923637390137, "global_step": 2914, "epoch": 17} {"train_loss": -4.367499351501465, "global_step": 2915, "epoch": 17} {"train_loss": -4.600631237030029, "global_step": 2916, "epoch": 17} {"train_loss": -4.50673770904541, "global_step": 2917, "epoch": 17} {"train_loss": -4.21580696105957, "global_step": 2918, "epoch": 17} {"train_loss": -4.285155296325684, "global_step": 2919, "epoch": 17} {"train_loss": -4.502310276031494, "global_step": 2920, "epoch": 17} {"train_loss": -4.141268730163574, "global_step": 2921, "epoch": 17} {"train_loss": -4.521625518798828, "global_step": 2922, "epoch": 17} {"train_loss": -4.4488606452941895, "global_step": 2923, "epoch": 17} {"train_loss": -4.620239734649658, "global_step": 2924, "epoch": 17} {"train_loss": -4.581893444061279, "global_step": 2925, "epoch": 17} {"train_loss": -4.632937431335449, "global_step": 2926, "epoch": 17} {"train_loss": -4.42369270324707, "global_step": 2927, "epoch": 17} {"train_loss": -4.2600507736206055, "global_step": 2928, "epoch": 17} {"train_loss": -4.496260643005371, "global_step": 2929, "epoch": 17} {"train_loss": -4.269516468048096, "global_step": 2930, "epoch": 17} {"train_loss": -4.2206501960754395, "global_step": 2931, "epoch": 17} {"train_loss": -4.231114864349365, "global_step": 2932, "epoch": 17} {"train_loss": -4.5587358474731445, "global_step": 2933, "epoch": 17} {"train_loss": -4.300530910491943, "global_step": 2934, "epoch": 17} {"train_loss": -4.364182472229004, "global_step": 2935, "epoch": 17} {"train_loss": -4.315080165863037, "global_step": 2936, "epoch": 17} {"train_loss": -4.5100579261779785, "global_step": 2937, "epoch": 17} {"train_loss": -4.484894752502441, "global_step": 2938, "epoch": 17} {"train_loss": -4.611392974853516, "global_step": 2939, "epoch": 17} {"train_loss": -4.483885765075684, "global_step": 2940, "epoch": 17} {"train_loss": -4.524953842163086, "global_step": 2941, "epoch": 17} {"train_loss": -4.508607387542725, "global_step": 2942, "epoch": 17} {"train_loss": -4.461594581604004, "global_step": 2943, "epoch": 17} {"train_loss": -4.4893293380737305, "global_step": 2944, "epoch": 17} {"train_loss": -4.396878719329834, "global_step": 2945, "epoch": 17} {"train_loss": -4.258386611938477, "global_step": 2946, "epoch": 17} {"train_loss": -4.255507469177246, "global_step": 2947, "epoch": 17} {"train_loss": -4.034782409667969, "global_step": 2948, "epoch": 17} {"train_loss": -4.36341667175293, "global_step": 2949, "epoch": 17} {"train_loss": -4.390236854553223, "global_step": 2950, "epoch": 17} {"train_loss": -4.409989833831787, "global_step": 2951, "epoch": 17} {"train_loss": -4.595029830932617, "global_step": 2952, "epoch": 17} {"train_loss": -4.131198406219482, "global_step": 2953, "epoch": 17} {"train_loss": -4.0912675857543945, "global_step": 2954, "epoch": 17} {"train_loss": -4.390348434448242, "global_step": 2955, "epoch": 17} {"train_loss": -4.5048747062683105, "global_step": 2956, "epoch": 17} {"train_loss": -4.293440818786621, "global_step": 2957, "epoch": 17} {"train_loss": -4.19682502746582, "global_step": 2958, "epoch": 17} {"train_loss": -4.301656723022461, "global_step": 2959, "epoch": 17} {"train_loss": -4.3321123123168945, "global_step": 2960, "epoch": 17} {"train_loss": -4.338716506958008, "global_step": 2961, "epoch": 17} {"train_loss": -4.446475982666016, "global_step": 2962, "epoch": 17} {"train_loss": -4.249556064605713, "global_step": 2963, "epoch": 17} {"train_loss": -4.091768264770508, "global_step": 2964, "epoch": 17} {"train_loss": -4.270608901977539, "global_step": 2965, "epoch": 17} {"train_loss": -4.282868385314941, "global_step": 2966, "epoch": 17} {"train_loss": -4.093473434448242, "global_step": 2967, "epoch": 17} {"train_loss": -4.513250350952148, "global_step": 2968, "epoch": 17} {"train_loss": -4.086208343505859, "global_step": 2969, "epoch": 17} {"train_loss": -4.154731750488281, "global_step": 2970, "epoch": 17} {"train_loss": -4.303162574768066, "global_step": 2971, "epoch": 17} {"train_loss": -4.466401100158691, "global_step": 2972, "epoch": 17} {"train_loss": -4.360945224761963, "global_step": 2973, "epoch": 17} {"train_loss": -4.439548492431641, "global_step": 2974, "epoch": 17} {"train_loss": -4.484742164611816, "global_step": 2975, "epoch": 17} {"train_loss": -4.345582008361816, "global_step": 2976, "epoch": 17} {"train_loss": -4.302800178527832, "global_step": 2977, "epoch": 17} {"train_loss": -4.328986644744873, "global_step": 2978, "epoch": 17} {"train_loss": -4.665846347808838, "global_step": 2979, "epoch": 17} {"train_loss": -4.545246124267578, "global_step": 2980, "epoch": 17} {"train_loss": -4.4194016456604, "global_step": 2981, "epoch": 17} {"train_loss": -4.741343021392822, "global_step": 2982, "epoch": 17} {"train_loss": -4.180992126464844, "global_step": 2983, "epoch": 17} {"train_loss": -4.530433654785156, "global_step": 2984, "epoch": 17} {"train_loss": -4.499547004699707, "global_step": 2985, "epoch": 17} {"train_loss": -4.655378818511963, "global_step": 2986, "epoch": 17} {"train_loss": -4.662213325500488, "global_step": 2987, "epoch": 17} {"train_loss": -4.836451530456543, "global_step": 2988, "epoch": 17} {"train_loss": -4.472438812255859, "global_step": 2989, "epoch": 17} {"train_loss": -4.579705238342285, "global_step": 2990, "epoch": 17} {"train_loss": -4.654156684875488, "global_step": 2991, "epoch": 17} {"train_loss": -4.462121963500977, "global_step": 2992, "epoch": 17} {"train_loss": -4.797425270080566, "global_step": 2993, "epoch": 17} {"train_loss": -4.552535057067871, "global_step": 2994, "epoch": 17} {"train_loss": -4.574976444244385, "global_step": 2995, "epoch": 17} {"train_loss": -4.3060994148254395, "global_step": 2996, "epoch": 17} {"train_loss": -4.546175003051758, "global_step": 2997, "epoch": 17} {"train_loss": -4.566267013549805, "global_step": 2998, "epoch": 17} {"train_loss": -4.416411399841309, "global_step": 2999, "epoch": 17} {"train_loss": -4.740046977996826, "global_step": 3000, "epoch": 17} {"train_loss": -4.32454776763916, "global_step": 3001, "epoch": 17} {"train_loss": -4.164832592010498, "global_step": 3002, "epoch": 17} {"train_loss": -4.5400285720825195, "global_step": 3003, "epoch": 17} {"train_loss": -4.699962139129639, "global_step": 3004, "epoch": 17} {"train_loss": -4.555318355560303, "global_step": 3005, "epoch": 17} {"train_loss": -4.694222450256348, "global_step": 3006, "epoch": 17} {"train_loss": -4.723377227783203, "global_step": 3007, "epoch": 17} {"train_loss": -4.579379558563232, "global_step": 3008, "epoch": 17} {"train_loss": -4.877693176269531, "global_step": 3009, "epoch": 17} {"train_loss": -4.735759735107422, "global_step": 3010, "epoch": 17} {"train_loss": -4.2679595947265625, "global_step": 3011, "epoch": 17} {"train_loss": -4.472346305847168, "global_step": 3012, "epoch": 17} {"train_loss": -4.638062000274658, "global_step": 3013, "epoch": 17} {"train_loss": -4.291459083557129, "global_step": 3014, "epoch": 17} {"train_loss": -4.663556098937988, "global_step": 3015, "epoch": 17} {"train_loss": -4.378535270690918, "global_step": 3016, "epoch": 17} {"train_loss": -4.507621765136719, "global_step": 3017, "epoch": 17} {"train_loss": -4.570120811462402, "global_step": 3018, "epoch": 17} {"train_loss": -4.553164958953857, "global_step": 3019, "epoch": 17} {"train_loss": -4.4524149894714355, "global_step": 3020, "epoch": 17} {"train_loss": -4.390902519226074, "global_step": 3021, "epoch": 17} {"train_loss": -4.624547004699707, "global_step": 3022, "epoch": 17} {"train_loss": -4.43737044220879, "global_step": 3023, "epoch": 17, "val_loss": 264324.59375} {"train_loss": -4.6832275390625, "global_step": 3024, "epoch": 18} {"train_loss": -4.627919673919678, "global_step": 3025, "epoch": 18} {"train_loss": -4.642772197723389, "global_step": 3026, "epoch": 18} {"train_loss": -4.651820182800293, "global_step": 3027, "epoch": 18} {"train_loss": -4.535577774047852, "global_step": 3028, "epoch": 18} {"train_loss": -4.3572235107421875, "global_step": 3029, "epoch": 18} {"train_loss": -4.407338619232178, "global_step": 3030, "epoch": 18} {"train_loss": -4.238393306732178, "global_step": 3031, "epoch": 18} {"train_loss": -4.197447299957275, "global_step": 3032, "epoch": 18} {"train_loss": -4.358547210693359, "global_step": 3033, "epoch": 18} {"train_loss": -4.100028991699219, "global_step": 3034, "epoch": 18} {"train_loss": -4.505308628082275, "global_step": 3035, "epoch": 18} {"train_loss": -4.6370134353637695, "global_step": 3036, "epoch": 18} {"train_loss": -4.053577423095703, "global_step": 3037, "epoch": 18} {"train_loss": -4.571906089782715, "global_step": 3038, "epoch": 18} {"train_loss": -4.4283447265625, "global_step": 3039, "epoch": 18} {"train_loss": -4.3186235427856445, "global_step": 3040, "epoch": 18} {"train_loss": -4.57705020904541, "global_step": 3041, "epoch": 18} {"train_loss": -4.620999336242676, "global_step": 3042, "epoch": 18} {"train_loss": -4.14710807800293, "global_step": 3043, "epoch": 18} {"train_loss": -4.211379051208496, "global_step": 3044, "epoch": 18} {"train_loss": -4.648502826690674, "global_step": 3045, "epoch": 18} {"train_loss": -4.371737480163574, "global_step": 3046, "epoch": 18} {"train_loss": -4.4610443115234375, "global_step": 3047, "epoch": 18} {"train_loss": -4.358283996582031, "global_step": 3048, "epoch": 18} {"train_loss": -4.430519104003906, "global_step": 3049, "epoch": 18} {"train_loss": -4.287797451019287, "global_step": 3050, "epoch": 18} {"train_loss": -4.605594635009766, "global_step": 3051, "epoch": 18} {"train_loss": -4.523922920227051, "global_step": 3052, "epoch": 18} {"train_loss": -4.519546031951904, "global_step": 3053, "epoch": 18} {"train_loss": -4.754708290100098, "global_step": 3054, "epoch": 18} {"train_loss": -4.789636135101318, "global_step": 3055, "epoch": 18} {"train_loss": -4.6072211265563965, "global_step": 3056, "epoch": 18} {"train_loss": -4.215978622436523, "global_step": 3057, "epoch": 18} {"train_loss": -4.604975700378418, "global_step": 3058, "epoch": 18} {"train_loss": -4.685473442077637, "global_step": 3059, "epoch": 18} {"train_loss": -4.426519870758057, "global_step": 3060, "epoch": 18} {"train_loss": -4.321844577789307, "global_step": 3061, "epoch": 18} {"train_loss": -4.453767776489258, "global_step": 3062, "epoch": 18} {"train_loss": -4.519558429718018, "global_step": 3063, "epoch": 18} {"train_loss": -4.43715763092041, "global_step": 3064, "epoch": 18} {"train_loss": -4.522523403167725, "global_step": 3065, "epoch": 18} {"train_loss": -4.680014610290527, "global_step": 3066, "epoch": 18} {"train_loss": -4.6002888679504395, "global_step": 3067, "epoch": 18} {"train_loss": -4.596578598022461, "global_step": 3068, "epoch": 18} {"train_loss": -4.606959342956543, "global_step": 3069, "epoch": 18} {"train_loss": -4.3130035400390625, "global_step": 3070, "epoch": 18} {"train_loss": -4.706048011779785, "global_step": 3071, "epoch": 18} {"train_loss": -4.63533353805542, "global_step": 3072, "epoch": 18} {"train_loss": -4.783652305603027, "global_step": 3073, "epoch": 18} {"train_loss": -4.283965587615967, "global_step": 3074, "epoch": 18} {"train_loss": -4.709173202514648, "global_step": 3075, "epoch": 18} {"train_loss": -4.711368560791016, "global_step": 3076, "epoch": 18} {"train_loss": -4.596439361572266, "global_step": 3077, "epoch": 18} {"train_loss": -4.358799934387207, "global_step": 3078, "epoch": 18} {"train_loss": -4.490138530731201, "global_step": 3079, "epoch": 18} {"train_loss": -4.663286209106445, "global_step": 3080, "epoch": 18} {"train_loss": -4.6154303550720215, "global_step": 3081, "epoch": 18} {"train_loss": -4.291715145111084, "global_step": 3082, "epoch": 18} {"train_loss": -4.50330924987793, "global_step": 3083, "epoch": 18} {"train_loss": -4.5261359214782715, "global_step": 3084, "epoch": 18} {"train_loss": -4.767978191375732, "global_step": 3085, "epoch": 18} {"train_loss": -4.228771209716797, "global_step": 3086, "epoch": 18} {"train_loss": -4.723304748535156, "global_step": 3087, "epoch": 18} {"train_loss": -4.594332695007324, "global_step": 3088, "epoch": 18} {"train_loss": -4.613178253173828, "global_step": 3089, "epoch": 18} {"train_loss": -4.357234954833984, "global_step": 3090, "epoch": 18} {"train_loss": -4.5308637619018555, "global_step": 3091, "epoch": 18} {"train_loss": -4.663293361663818, "global_step": 3092, "epoch": 18} {"train_loss": -4.29325532913208, "global_step": 3093, "epoch": 18} {"train_loss": -4.305485725402832, "global_step": 3094, "epoch": 18} {"train_loss": -4.40112829208374, "global_step": 3095, "epoch": 18} {"train_loss": -4.692449569702148, "global_step": 3096, "epoch": 18} {"train_loss": -4.279809951782227, "global_step": 3097, "epoch": 18} {"train_loss": -4.692468166351318, "global_step": 3098, "epoch": 18} {"train_loss": -4.468644142150879, "global_step": 3099, "epoch": 18} {"train_loss": -4.466860771179199, "global_step": 3100, "epoch": 18} {"train_loss": -4.5825347900390625, "global_step": 3101, "epoch": 18} {"train_loss": -4.203375339508057, "global_step": 3102, "epoch": 18} {"train_loss": -4.916305065155029, "global_step": 3103, "epoch": 18} {"train_loss": -4.197792053222656, "global_step": 3104, "epoch": 18} {"train_loss": -4.670719146728516, "global_step": 3105, "epoch": 18} {"train_loss": -4.537515640258789, "global_step": 3106, "epoch": 18} {"train_loss": -4.262206077575684, "global_step": 3107, "epoch": 18} {"train_loss": -4.687288761138916, "global_step": 3108, "epoch": 18} {"train_loss": -4.234392166137695, "global_step": 3109, "epoch": 18} {"train_loss": -4.583493232727051, "global_step": 3110, "epoch": 18} {"train_loss": -4.238888740539551, "global_step": 3111, "epoch": 18} {"train_loss": -4.214635848999023, "global_step": 3112, "epoch": 18} {"train_loss": -4.4130425453186035, "global_step": 3113, "epoch": 18} {"train_loss": -4.512052059173584, "global_step": 3114, "epoch": 18} {"train_loss": -4.461651802062988, "global_step": 3115, "epoch": 18} {"train_loss": -4.482805252075195, "global_step": 3116, "epoch": 18} {"train_loss": -4.436904430389404, "global_step": 3117, "epoch": 18} {"train_loss": -4.404378890991211, "global_step": 3118, "epoch": 18} {"train_loss": -4.528691291809082, "global_step": 3119, "epoch": 18} {"train_loss": -4.5626325607299805, "global_step": 3120, "epoch": 18} {"train_loss": -4.445300102233887, "global_step": 3121, "epoch": 18} {"train_loss": -4.569719314575195, "global_step": 3122, "epoch": 18} {"train_loss": -4.54059362411499, "global_step": 3123, "epoch": 18} {"train_loss": -4.937798976898193, "global_step": 3124, "epoch": 18} {"train_loss": -4.717759609222412, "global_step": 3125, "epoch": 18} {"train_loss": -4.722929000854492, "global_step": 3126, "epoch": 18} {"train_loss": -4.8216094970703125, "global_step": 3127, "epoch": 18} {"train_loss": -4.621495246887207, "global_step": 3128, "epoch": 18} {"train_loss": -4.599818229675293, "global_step": 3129, "epoch": 18} {"train_loss": -4.512245178222656, "global_step": 3130, "epoch": 18} {"train_loss": -4.304197788238525, "global_step": 3131, "epoch": 18} {"train_loss": -4.700199127197266, "global_step": 3132, "epoch": 18} {"train_loss": -4.656930446624756, "global_step": 3133, "epoch": 18} {"train_loss": -4.678840160369873, "global_step": 3134, "epoch": 18} {"train_loss": -4.692035675048828, "global_step": 3135, "epoch": 18} {"train_loss": -4.3518266677856445, "global_step": 3136, "epoch": 18} {"train_loss": -4.508050918579102, "global_step": 3137, "epoch": 18} {"train_loss": -4.692333698272705, "global_step": 3138, "epoch": 18} {"train_loss": -4.635774612426758, "global_step": 3139, "epoch": 18} {"train_loss": -4.395282745361328, "global_step": 3140, "epoch": 18} {"train_loss": -4.6959943771362305, "global_step": 3141, "epoch": 18} {"train_loss": -4.359143257141113, "global_step": 3142, "epoch": 18} {"train_loss": -4.422950744628906, "global_step": 3143, "epoch": 18} {"train_loss": -4.211786270141602, "global_step": 3144, "epoch": 18} {"train_loss": -4.612481117248535, "global_step": 3145, "epoch": 18} {"train_loss": -4.318617820739746, "global_step": 3146, "epoch": 18} {"train_loss": -4.49405574798584, "global_step": 3147, "epoch": 18} {"train_loss": -4.582769393920898, "global_step": 3148, "epoch": 18} {"train_loss": -4.29495906829834, "global_step": 3149, "epoch": 18} {"train_loss": -4.326458930969238, "global_step": 3150, "epoch": 18} {"train_loss": -4.189729690551758, "global_step": 3151, "epoch": 18} {"train_loss": -4.47585391998291, "global_step": 3152, "epoch": 18} {"train_loss": -4.370959281921387, "global_step": 3153, "epoch": 18} {"train_loss": -4.313806056976318, "global_step": 3154, "epoch": 18} {"train_loss": -4.450943946838379, "global_step": 3155, "epoch": 18} {"train_loss": -4.421932220458984, "global_step": 3156, "epoch": 18} {"train_loss": -4.389779090881348, "global_step": 3157, "epoch": 18} {"train_loss": -4.47271728515625, "global_step": 3158, "epoch": 18} {"train_loss": -4.681590557098389, "global_step": 3159, "epoch": 18} {"train_loss": -4.555878639221191, "global_step": 3160, "epoch": 18} {"train_loss": -4.520315170288086, "global_step": 3161, "epoch": 18} {"train_loss": -4.671640396118164, "global_step": 3162, "epoch": 18} {"train_loss": -4.324613094329834, "global_step": 3163, "epoch": 18} {"train_loss": -4.6120524406433105, "global_step": 3164, "epoch": 18} {"train_loss": -4.496455192565918, "global_step": 3165, "epoch": 18} {"train_loss": -4.871349334716797, "global_step": 3166, "epoch": 18} {"train_loss": -4.731433868408203, "global_step": 3167, "epoch": 18} {"train_loss": -4.611191749572754, "global_step": 3168, "epoch": 18} {"train_loss": -4.220386028289795, "global_step": 3169, "epoch": 18} {"train_loss": -4.522069931030273, "global_step": 3170, "epoch": 18} {"train_loss": -4.818418025970459, "global_step": 3171, "epoch": 18} {"train_loss": -4.367130279541016, "global_step": 3172, "epoch": 18} {"train_loss": -4.590701580047607, "global_step": 3173, "epoch": 18} {"train_loss": -3.982182741165161, "global_step": 3174, "epoch": 18} {"train_loss": -4.596564292907715, "global_step": 3175, "epoch": 18} {"train_loss": -4.183716297149658, "global_step": 3176, "epoch": 18} {"train_loss": -4.306402206420898, "global_step": 3177, "epoch": 18} {"train_loss": -4.186690807342529, "global_step": 3178, "epoch": 18} {"train_loss": -4.511940002441406, "global_step": 3179, "epoch": 18} {"train_loss": -4.466148853302002, "global_step": 3180, "epoch": 18} {"train_loss": -4.367961406707764, "global_step": 3181, "epoch": 18} {"train_loss": -4.477757930755615, "global_step": 3182, "epoch": 18} {"train_loss": -4.574346542358398, "global_step": 3183, "epoch": 18} {"train_loss": -4.518824577331543, "global_step": 3184, "epoch": 18} {"train_loss": -4.410256385803223, "global_step": 3185, "epoch": 18} {"train_loss": -4.1696085929870605, "global_step": 3186, "epoch": 18} {"train_loss": -4.634420394897461, "global_step": 3187, "epoch": 18} {"train_loss": -4.413187026977539, "global_step": 3188, "epoch": 18} {"train_loss": -4.493928909301758, "global_step": 3189, "epoch": 18} {"train_loss": -4.3563127517700195, "global_step": 3190, "epoch": 18} {"train_loss": -4.4896051699206945, "global_step": 3191, "epoch": 18, "val_loss": 239033.359375} {"train_loss": -4.520230770111084, "global_step": 3192, "epoch": 19} {"train_loss": -4.392278671264648, "global_step": 3193, "epoch": 19} {"train_loss": -4.50886344909668, "global_step": 3194, "epoch": 19} {"train_loss": -4.564248085021973, "global_step": 3195, "epoch": 19} {"train_loss": -4.621893882751465, "global_step": 3196, "epoch": 19} {"train_loss": -4.680704116821289, "global_step": 3197, "epoch": 19} {"train_loss": -4.36281156539917, "global_step": 3198, "epoch": 19} {"train_loss": -4.472512245178223, "global_step": 3199, "epoch": 19} {"train_loss": -4.703393936157227, "global_step": 3200, "epoch": 19} {"train_loss": -4.511554718017578, "global_step": 3201, "epoch": 19} {"train_loss": -4.827201843261719, "global_step": 3202, "epoch": 19} {"train_loss": -4.286548614501953, "global_step": 3203, "epoch": 19} {"train_loss": -4.454434394836426, "global_step": 3204, "epoch": 19} {"train_loss": -4.426393508911133, "global_step": 3205, "epoch": 19} {"train_loss": -4.124286651611328, "global_step": 3206, "epoch": 19} {"train_loss": -4.419924736022949, "global_step": 3207, "epoch": 19} {"train_loss": -4.197272300720215, "global_step": 3208, "epoch": 19} {"train_loss": -4.562426567077637, "global_step": 3209, "epoch": 19} {"train_loss": -4.292896747589111, "global_step": 3210, "epoch": 19} {"train_loss": -4.4687042236328125, "global_step": 3211, "epoch": 19} {"train_loss": -4.374839782714844, "global_step": 3212, "epoch": 19} {"train_loss": -4.339010238647461, "global_step": 3213, "epoch": 19} {"train_loss": -4.546396732330322, "global_step": 3214, "epoch": 19} {"train_loss": -4.545617580413818, "global_step": 3215, "epoch": 19} {"train_loss": -4.518205642700195, "global_step": 3216, "epoch": 19} {"train_loss": -4.8475494384765625, "global_step": 3217, "epoch": 19} {"train_loss": -4.707683086395264, "global_step": 3218, "epoch": 19} {"train_loss": -4.485117435455322, "global_step": 3219, "epoch": 19} {"train_loss": -4.596517562866211, "global_step": 3220, "epoch": 19} {"train_loss": -4.337292671203613, "global_step": 3221, "epoch": 19} {"train_loss": -4.865056991577148, "global_step": 3222, "epoch": 19} {"train_loss": -4.318934440612793, "global_step": 3223, "epoch": 19} {"train_loss": -4.2833662033081055, "global_step": 3224, "epoch": 19} {"train_loss": -4.4403462409973145, "global_step": 3225, "epoch": 19} {"train_loss": -4.483495712280273, "global_step": 3226, "epoch": 19} {"train_loss": -4.705973148345947, "global_step": 3227, "epoch": 19} {"train_loss": -4.447395324707031, "global_step": 3228, "epoch": 19} {"train_loss": -4.540619850158691, "global_step": 3229, "epoch": 19} {"train_loss": -4.556075572967529, "global_step": 3230, "epoch": 19} {"train_loss": -4.356000900268555, "global_step": 3231, "epoch": 19} {"train_loss": -4.501983642578125, "global_step": 3232, "epoch": 19} {"train_loss": -4.327237129211426, "global_step": 3233, "epoch": 19} {"train_loss": -4.402406215667725, "global_step": 3234, "epoch": 19} {"train_loss": -4.398248672485352, "global_step": 3235, "epoch": 19} {"train_loss": -3.964630126953125, "global_step": 3236, "epoch": 19} {"train_loss": -4.282843589782715, "global_step": 3237, "epoch": 19} {"train_loss": -4.459090232849121, "global_step": 3238, "epoch": 19} {"train_loss": -4.312415599822998, "global_step": 3239, "epoch": 19} {"train_loss": -4.344150543212891, "global_step": 3240, "epoch": 19} {"train_loss": -4.409256935119629, "global_step": 3241, "epoch": 19} {"train_loss": -4.369417190551758, "global_step": 3242, "epoch": 19} {"train_loss": -4.436436653137207, "global_step": 3243, "epoch": 19} {"train_loss": -4.391909599304199, "global_step": 3244, "epoch": 19} {"train_loss": -4.482373237609863, "global_step": 3245, "epoch": 19} {"train_loss": -4.755329608917236, "global_step": 3246, "epoch": 19} {"train_loss": -4.615440368652344, "global_step": 3247, "epoch": 19} {"train_loss": -4.331899642944336, "global_step": 3248, "epoch": 19} {"train_loss": -4.275188446044922, "global_step": 3249, "epoch": 19} {"train_loss": -4.414009094238281, "global_step": 3250, "epoch": 19} {"train_loss": -4.529911994934082, "global_step": 3251, "epoch": 19} {"train_loss": -4.650515556335449, "global_step": 3252, "epoch": 19} {"train_loss": -4.6658148765563965, "global_step": 3253, "epoch": 19} {"train_loss": -4.6742658615112305, "global_step": 3254, "epoch": 19} {"train_loss": -4.202639102935791, "global_step": 3255, "epoch": 19} {"train_loss": -4.327755928039551, "global_step": 3256, "epoch": 19} {"train_loss": -4.34193229675293, "global_step": 3257, "epoch": 19} {"train_loss": -4.3626604080200195, "global_step": 3258, "epoch": 19} {"train_loss": -4.353984832763672, "global_step": 3259, "epoch": 19} {"train_loss": -4.536026954650879, "global_step": 3260, "epoch": 19} {"train_loss": -4.476104736328125, "global_step": 3261, "epoch": 19} {"train_loss": -4.413163661956787, "global_step": 3262, "epoch": 19} {"train_loss": -4.529400825500488, "global_step": 3263, "epoch": 19} {"train_loss": -4.5212931632995605, "global_step": 3264, "epoch": 19} {"train_loss": -4.450902938842773, "global_step": 3265, "epoch": 19} {"train_loss": -4.428922653198242, "global_step": 3266, "epoch": 19} {"train_loss": -4.312277793884277, "global_step": 3267, "epoch": 19} {"train_loss": -4.428431987762451, "global_step": 3268, "epoch": 19} {"train_loss": -4.042369365692139, "global_step": 3269, "epoch": 19} {"train_loss": -4.426130294799805, "global_step": 3270, "epoch": 19} {"train_loss": -4.473666191101074, "global_step": 3271, "epoch": 19} {"train_loss": -4.517519950866699, "global_step": 3272, "epoch": 19} {"train_loss": -4.6123857498168945, "global_step": 3273, "epoch": 19} {"train_loss": -4.370692729949951, "global_step": 3274, "epoch": 19} {"train_loss": -4.5044097900390625, "global_step": 3275, "epoch": 19} {"train_loss": -4.714856147766113, "global_step": 3276, "epoch": 19} {"train_loss": -4.647291660308838, "global_step": 3277, "epoch": 19} {"train_loss": -4.662405967712402, "global_step": 3278, "epoch": 19} {"train_loss": -4.325844764709473, "global_step": 3279, "epoch": 19} {"train_loss": -4.5953288078308105, "global_step": 3280, "epoch": 19} {"train_loss": -4.3372416496276855, "global_step": 3281, "epoch": 19} {"train_loss": -4.65007209777832, "global_step": 3282, "epoch": 19} {"train_loss": -4.535198211669922, "global_step": 3283, "epoch": 19} {"train_loss": -4.545273780822754, "global_step": 3284, "epoch": 19} {"train_loss": -4.579990386962891, "global_step": 3285, "epoch": 19} {"train_loss": -4.683789253234863, "global_step": 3286, "epoch": 19} {"train_loss": -4.531389236450195, "global_step": 3287, "epoch": 19} {"train_loss": -4.474214553833008, "global_step": 3288, "epoch": 19} {"train_loss": -4.430601119995117, "global_step": 3289, "epoch": 19} {"train_loss": -4.751394271850586, "global_step": 3290, "epoch": 19} {"train_loss": -4.5320868492126465, "global_step": 3291, "epoch": 19} {"train_loss": -4.56691837310791, "global_step": 3292, "epoch": 19} {"train_loss": -4.620738983154297, "global_step": 3293, "epoch": 19} {"train_loss": -4.667197227478027, "global_step": 3294, "epoch": 19} {"train_loss": -4.674549102783203, "global_step": 3295, "epoch": 19} {"train_loss": -4.67085075378418, "global_step": 3296, "epoch": 19} {"train_loss": -4.800633430480957, "global_step": 3297, "epoch": 19} {"train_loss": -4.596609592437744, "global_step": 3298, "epoch": 19} {"train_loss": -4.497563362121582, "global_step": 3299, "epoch": 19} {"train_loss": -4.525230407714844, "global_step": 3300, "epoch": 19} {"train_loss": -4.900222301483154, "global_step": 3301, "epoch": 19} {"train_loss": -4.5363054275512695, "global_step": 3302, "epoch": 19} {"train_loss": -4.48323917388916, "global_step": 3303, "epoch": 19} {"train_loss": -4.594040393829346, "global_step": 3304, "epoch": 19} {"train_loss": -4.591004371643066, "global_step": 3305, "epoch": 19} {"train_loss": -4.448369026184082, "global_step": 3306, "epoch": 19} {"train_loss": -4.4493088722229, "global_step": 3307, "epoch": 19} {"train_loss": -4.202142238616943, "global_step": 3308, "epoch": 19} {"train_loss": -4.78428840637207, "global_step": 3309, "epoch": 19} {"train_loss": -4.622970104217529, "global_step": 3310, "epoch": 19} {"train_loss": -4.723484516143799, "global_step": 3311, "epoch": 19} {"train_loss": -4.48574161529541, "global_step": 3312, "epoch": 19} {"train_loss": -4.396905899047852, "global_step": 3313, "epoch": 19} {"train_loss": -4.673812389373779, "global_step": 3314, "epoch": 19} {"train_loss": -4.325325012207031, "global_step": 3315, "epoch": 19} {"train_loss": -4.593557357788086, "global_step": 3316, "epoch": 19} {"train_loss": -4.70916223526001, "global_step": 3317, "epoch": 19} {"train_loss": -4.614931583404541, "global_step": 3318, "epoch": 19} {"train_loss": -4.482151031494141, "global_step": 3319, "epoch": 19} {"train_loss": -4.616731643676758, "global_step": 3320, "epoch": 19} {"train_loss": -4.7705302238464355, "global_step": 3321, "epoch": 19} {"train_loss": -4.510977745056152, "global_step": 3322, "epoch": 19} {"train_loss": -4.632963180541992, "global_step": 3323, "epoch": 19} {"train_loss": -4.450891971588135, "global_step": 3324, "epoch": 19} {"train_loss": -4.505947113037109, "global_step": 3325, "epoch": 19} {"train_loss": -4.555541515350342, "global_step": 3326, "epoch": 19} {"train_loss": -4.44858980178833, "global_step": 3327, "epoch": 19} {"train_loss": -4.468984603881836, "global_step": 3328, "epoch": 19} {"train_loss": -4.2098164558410645, "global_step": 3329, "epoch": 19} {"train_loss": -4.561949729919434, "global_step": 3330, "epoch": 19} {"train_loss": -4.430222988128662, "global_step": 3331, "epoch": 19} {"train_loss": -4.496228218078613, "global_step": 3332, "epoch": 19} {"train_loss": -4.366549491882324, "global_step": 3333, "epoch": 19} {"train_loss": -4.240154266357422, "global_step": 3334, "epoch": 19} {"train_loss": -4.772743225097656, "global_step": 3335, "epoch": 19} {"train_loss": -4.389549732208252, "global_step": 3336, "epoch": 19} {"train_loss": -4.553849220275879, "global_step": 3337, "epoch": 19} {"train_loss": -4.378789901733398, "global_step": 3338, "epoch": 19} {"train_loss": -4.61196231842041, "global_step": 3339, "epoch": 19} {"train_loss": -4.372166156768799, "global_step": 3340, "epoch": 19} {"train_loss": -4.618751525878906, "global_step": 3341, "epoch": 19} {"train_loss": -4.25908088684082, "global_step": 3342, "epoch": 19} {"train_loss": -4.826392650604248, "global_step": 3343, "epoch": 19} {"train_loss": -4.234706878662109, "global_step": 3344, "epoch": 19} {"train_loss": -4.604941368103027, "global_step": 3345, "epoch": 19} {"train_loss": -4.517002105712891, "global_step": 3346, "epoch": 19} {"train_loss": -4.618278980255127, "global_step": 3347, "epoch": 19} {"train_loss": -4.616261005401611, "global_step": 3348, "epoch": 19} {"train_loss": -4.457547664642334, "global_step": 3349, "epoch": 19} {"train_loss": -4.6422576904296875, "global_step": 3350, "epoch": 19} {"train_loss": -4.4157562255859375, "global_step": 3351, "epoch": 19} {"train_loss": -4.665463447570801, "global_step": 3352, "epoch": 19} {"train_loss": -4.502011299133301, "global_step": 3353, "epoch": 19} {"train_loss": -4.401389122009277, "global_step": 3354, "epoch": 19} {"train_loss": -4.604036331176758, "global_step": 3355, "epoch": 19} {"train_loss": -4.642146110534668, "global_step": 3356, "epoch": 19} {"train_loss": -4.765416622161865, "global_step": 3357, "epoch": 19} {"train_loss": -4.348974227905273, "global_step": 3358, "epoch": 19} {"train_loss": -4.4981154544012885, "global_step": 3359, "epoch": 19, "val_loss": 260738.734375} {"train_loss": -4.585947036743164, "global_step": 3360, "epoch": 20} {"train_loss": -4.615784168243408, "global_step": 3361, "epoch": 20} {"train_loss": -4.555540561676025, "global_step": 3362, "epoch": 20} {"train_loss": -4.734158992767334, "global_step": 3363, "epoch": 20} {"train_loss": -4.621584892272949, "global_step": 3364, "epoch": 20} {"train_loss": -4.73893404006958, "global_step": 3365, "epoch": 20} {"train_loss": -4.597097873687744, "global_step": 3366, "epoch": 20} {"train_loss": -4.6530961990356445, "global_step": 3367, "epoch": 20} {"train_loss": -4.4147467613220215, "global_step": 3368, "epoch": 20} {"train_loss": -4.4157562255859375, "global_step": 3369, "epoch": 20} {"train_loss": -4.520659446716309, "global_step": 3370, "epoch": 20} {"train_loss": -4.601641654968262, "global_step": 3371, "epoch": 20} {"train_loss": -4.456158638000488, "global_step": 3372, "epoch": 20} {"train_loss": -4.581774711608887, "global_step": 3373, "epoch": 20} {"train_loss": -4.779560089111328, "global_step": 3374, "epoch": 20} {"train_loss": -4.080920219421387, "global_step": 3375, "epoch": 20} {"train_loss": -4.430063247680664, "global_step": 3376, "epoch": 20} {"train_loss": -4.01777458190918, "global_step": 3377, "epoch": 20} {"train_loss": -3.9101076126098633, "global_step": 3378, "epoch": 20} {"train_loss": -4.3388237953186035, "global_step": 3379, "epoch": 20} {"train_loss": -4.205570220947266, "global_step": 3380, "epoch": 20} {"train_loss": -4.36554479598999, "global_step": 3381, "epoch": 20} {"train_loss": -4.041129112243652, "global_step": 3382, "epoch": 20} {"train_loss": -4.203215599060059, "global_step": 3383, "epoch": 20} {"train_loss": -4.357588768005371, "global_step": 3384, "epoch": 20} {"train_loss": -4.58986234664917, "global_step": 3385, "epoch": 20} {"train_loss": -4.415388107299805, "global_step": 3386, "epoch": 20} {"train_loss": -4.3876471519470215, "global_step": 3387, "epoch": 20} {"train_loss": -4.319431304931641, "global_step": 3388, "epoch": 20} {"train_loss": -4.586976051330566, "global_step": 3389, "epoch": 20} {"train_loss": -4.539963722229004, "global_step": 3390, "epoch": 20} {"train_loss": -4.470470428466797, "global_step": 3391, "epoch": 20} {"train_loss": -4.215684413909912, "global_step": 3392, "epoch": 20} {"train_loss": -4.478973388671875, "global_step": 3393, "epoch": 20} {"train_loss": -4.775116920471191, "global_step": 3394, "epoch": 20} {"train_loss": -4.786870956420898, "global_step": 3395, "epoch": 20} {"train_loss": -4.436488151550293, "global_step": 3396, "epoch": 20} {"train_loss": -4.674592018127441, "global_step": 3397, "epoch": 20} {"train_loss": -4.626533508300781, "global_step": 3398, "epoch": 20} {"train_loss": -4.712333679199219, "global_step": 3399, "epoch": 20} {"train_loss": -4.621485710144043, "global_step": 3400, "epoch": 20} {"train_loss": -4.608517646789551, "global_step": 3401, "epoch": 20} {"train_loss": -4.396331787109375, "global_step": 3402, "epoch": 20} {"train_loss": -4.342065811157227, "global_step": 3403, "epoch": 20} {"train_loss": -4.555868625640869, "global_step": 3404, "epoch": 20} {"train_loss": -4.497790336608887, "global_step": 3405, "epoch": 20} {"train_loss": -4.802524566650391, "global_step": 3406, "epoch": 20} {"train_loss": -4.812508583068848, "global_step": 3407, "epoch": 20} {"train_loss": -4.469874382019043, "global_step": 3408, "epoch": 20} {"train_loss": -4.801908016204834, "global_step": 3409, "epoch": 20} {"train_loss": -4.4263224601745605, "global_step": 3410, "epoch": 20} {"train_loss": -4.747647285461426, "global_step": 3411, "epoch": 20} {"train_loss": -4.477078437805176, "global_step": 3412, "epoch": 20} {"train_loss": -4.474077224731445, "global_step": 3413, "epoch": 20} {"train_loss": -4.573100566864014, "global_step": 3414, "epoch": 20} {"train_loss": -4.363482475280762, "global_step": 3415, "epoch": 20} {"train_loss": -4.869351863861084, "global_step": 3416, "epoch": 20} {"train_loss": -4.535055160522461, "global_step": 3417, "epoch": 20} {"train_loss": -4.614285469055176, "global_step": 3418, "epoch": 20} {"train_loss": -4.45247745513916, "global_step": 3419, "epoch": 20} {"train_loss": -4.205848217010498, "global_step": 3420, "epoch": 20} {"train_loss": -4.4762959480285645, "global_step": 3421, "epoch": 20} {"train_loss": -4.265357971191406, "global_step": 3422, "epoch": 20} {"train_loss": -4.231678009033203, "global_step": 3423, "epoch": 20} {"train_loss": -4.467517375946045, "global_step": 3424, "epoch": 20} {"train_loss": -4.448966026306152, "global_step": 3425, "epoch": 20} {"train_loss": -4.593050003051758, "global_step": 3426, "epoch": 20} {"train_loss": -4.599309921264648, "global_step": 3427, "epoch": 20} {"train_loss": -4.574390411376953, "global_step": 3428, "epoch": 20} {"train_loss": -4.499700546264648, "global_step": 3429, "epoch": 20} {"train_loss": -4.770042419433594, "global_step": 3430, "epoch": 20} {"train_loss": -4.583417892456055, "global_step": 3431, "epoch": 20} {"train_loss": -4.715160369873047, "global_step": 3432, "epoch": 20} {"train_loss": -4.697551727294922, "global_step": 3433, "epoch": 20} {"train_loss": -4.415927410125732, "global_step": 3434, "epoch": 20} {"train_loss": -4.583751678466797, "global_step": 3435, "epoch": 20} {"train_loss": -4.61178731918335, "global_step": 3436, "epoch": 20} {"train_loss": -4.183540344238281, "global_step": 3437, "epoch": 20} {"train_loss": -4.750244617462158, "global_step": 3438, "epoch": 20} {"train_loss": -4.569954872131348, "global_step": 3439, "epoch": 20} {"train_loss": -4.4992475509643555, "global_step": 3440, "epoch": 20} {"train_loss": -4.7157816886901855, "global_step": 3441, "epoch": 20} {"train_loss": -4.814581394195557, "global_step": 3442, "epoch": 20} {"train_loss": -4.620786666870117, "global_step": 3443, "epoch": 20} {"train_loss": -4.307897567749023, "global_step": 3444, "epoch": 20} {"train_loss": -4.631130218505859, "global_step": 3445, "epoch": 20} {"train_loss": -4.640800476074219, "global_step": 3446, "epoch": 20} {"train_loss": -4.5307183265686035, "global_step": 3447, "epoch": 20} {"train_loss": -4.581765651702881, "global_step": 3448, "epoch": 20} {"train_loss": -4.83922004699707, "global_step": 3449, "epoch": 20} {"train_loss": -4.933189392089844, "global_step": 3450, "epoch": 20} {"train_loss": -4.717870235443115, "global_step": 3451, "epoch": 20} {"train_loss": -4.847019195556641, "global_step": 3452, "epoch": 20} {"train_loss": -4.749058723449707, "global_step": 3453, "epoch": 20} {"train_loss": -4.477348327636719, "global_step": 3454, "epoch": 20} {"train_loss": -4.715326309204102, "global_step": 3455, "epoch": 20} {"train_loss": -4.682187080383301, "global_step": 3456, "epoch": 20} {"train_loss": -4.535911560058594, "global_step": 3457, "epoch": 20} {"train_loss": -4.519396781921387, "global_step": 3458, "epoch": 20} {"train_loss": -4.63163948059082, "global_step": 3459, "epoch": 20} {"train_loss": -4.640979766845703, "global_step": 3460, "epoch": 20} {"train_loss": -4.760454177856445, "global_step": 3461, "epoch": 20} {"train_loss": -4.636855602264404, "global_step": 3462, "epoch": 20} {"train_loss": -4.571613311767578, "global_step": 3463, "epoch": 20} {"train_loss": -4.8354668617248535, "global_step": 3464, "epoch": 20} {"train_loss": -4.491217613220215, "global_step": 3465, "epoch": 20} {"train_loss": -4.7663726806640625, "global_step": 3466, "epoch": 20} {"train_loss": -4.903898239135742, "global_step": 3467, "epoch": 20} {"train_loss": -4.464550971984863, "global_step": 3468, "epoch": 20} {"train_loss": -4.698225021362305, "global_step": 3469, "epoch": 20} {"train_loss": -4.280215740203857, "global_step": 3470, "epoch": 20} {"train_loss": -4.556605815887451, "global_step": 3471, "epoch": 20} {"train_loss": -4.670124053955078, "global_step": 3472, "epoch": 20} {"train_loss": -4.473649978637695, "global_step": 3473, "epoch": 20} {"train_loss": -4.5668182373046875, "global_step": 3474, "epoch": 20} {"train_loss": -4.8375396728515625, "global_step": 3475, "epoch": 20} {"train_loss": -4.592831134796143, "global_step": 3476, "epoch": 20} {"train_loss": -4.493380546569824, "global_step": 3477, "epoch": 20} {"train_loss": -4.414902687072754, "global_step": 3478, "epoch": 20} {"train_loss": -4.868045806884766, "global_step": 3479, "epoch": 20} {"train_loss": -4.4573540687561035, "global_step": 3480, "epoch": 20} {"train_loss": -4.713850498199463, "global_step": 3481, "epoch": 20} {"train_loss": -4.638609886169434, "global_step": 3482, "epoch": 20} {"train_loss": -4.411498069763184, "global_step": 3483, "epoch": 20} {"train_loss": -4.7657270431518555, "global_step": 3484, "epoch": 20} {"train_loss": -4.487302303314209, "global_step": 3485, "epoch": 20} {"train_loss": -4.898043155670166, "global_step": 3486, "epoch": 20} {"train_loss": -4.372603416442871, "global_step": 3487, "epoch": 20} {"train_loss": -4.7544145584106445, "global_step": 3488, "epoch": 20} {"train_loss": -4.809786319732666, "global_step": 3489, "epoch": 20} {"train_loss": -4.769227504730225, "global_step": 3490, "epoch": 20} {"train_loss": -4.586174011230469, "global_step": 3491, "epoch": 20} {"train_loss": -4.558609485626221, "global_step": 3492, "epoch": 20} {"train_loss": -4.769699573516846, "global_step": 3493, "epoch": 20} {"train_loss": -4.707614898681641, "global_step": 3494, "epoch": 20} {"train_loss": -5.006514549255371, "global_step": 3495, "epoch": 20} {"train_loss": -4.553550720214844, "global_step": 3496, "epoch": 20} {"train_loss": -4.722318649291992, "global_step": 3497, "epoch": 20} {"train_loss": -4.7114577293396, "global_step": 3498, "epoch": 20} {"train_loss": -4.490957736968994, "global_step": 3499, "epoch": 20} {"train_loss": -4.646703243255615, "global_step": 3500, "epoch": 20} {"train_loss": -4.668625831604004, "global_step": 3501, "epoch": 20} {"train_loss": -4.685145378112793, "global_step": 3502, "epoch": 20} {"train_loss": -4.739426612854004, "global_step": 3503, "epoch": 20} {"train_loss": -4.578330993652344, "global_step": 3504, "epoch": 20} {"train_loss": -4.716628074645996, "global_step": 3505, "epoch": 20} {"train_loss": -4.2017107009887695, "global_step": 3506, "epoch": 20} {"train_loss": -4.647604465484619, "global_step": 3507, "epoch": 20} {"train_loss": -4.734402179718018, "global_step": 3508, "epoch": 20} {"train_loss": -4.489593029022217, "global_step": 3509, "epoch": 20} {"train_loss": -4.556037902832031, "global_step": 3510, "epoch": 20} {"train_loss": -4.757213592529297, "global_step": 3511, "epoch": 20} {"train_loss": -4.686581611633301, "global_step": 3512, "epoch": 20} {"train_loss": -4.638956546783447, "global_step": 3513, "epoch": 20} {"train_loss": -4.675224304199219, "global_step": 3514, "epoch": 20} {"train_loss": -4.466745376586914, "global_step": 3515, "epoch": 20} {"train_loss": -4.583242416381836, "global_step": 3516, "epoch": 20} {"train_loss": -4.481471061706543, "global_step": 3517, "epoch": 20} {"train_loss": -4.920201301574707, "global_step": 3518, "epoch": 20} {"train_loss": -4.640600204467773, "global_step": 3519, "epoch": 20} {"train_loss": -4.8615570068359375, "global_step": 3520, "epoch": 20} {"train_loss": -4.598283290863037, "global_step": 3521, "epoch": 20} {"train_loss": -4.790544509887695, "global_step": 3522, "epoch": 20} {"train_loss": -4.544975280761719, "global_step": 3523, "epoch": 20} {"train_loss": -4.562159538269043, "global_step": 3524, "epoch": 20} {"train_loss": -4.414036750793457, "global_step": 3525, "epoch": 20} {"train_loss": -4.226842880249023, "global_step": 3526, "epoch": 20} {"train_loss": -4.571243297486078, "global_step": 3527, "epoch": 20, "val_loss": 254215.75, "train_action_mse_error": 88.78646850585938} {"train_loss": -4.508073806762695, "global_step": 3528, "epoch": 21} {"train_loss": -4.787806034088135, "global_step": 3529, "epoch": 21} {"train_loss": -4.299701690673828, "global_step": 3530, "epoch": 21} {"train_loss": -4.618988037109375, "global_step": 3531, "epoch": 21} {"train_loss": -4.797750473022461, "global_step": 3532, "epoch": 21} {"train_loss": -4.497709274291992, "global_step": 3533, "epoch": 21} {"train_loss": -4.525489807128906, "global_step": 3534, "epoch": 21} {"train_loss": -4.842680931091309, "global_step": 3535, "epoch": 21} {"train_loss": -4.481459617614746, "global_step": 3536, "epoch": 21} {"train_loss": -4.4093146324157715, "global_step": 3537, "epoch": 21} {"train_loss": -4.846853256225586, "global_step": 3538, "epoch": 21} {"train_loss": -4.4616498947143555, "global_step": 3539, "epoch": 21} {"train_loss": -4.469491004943848, "global_step": 3540, "epoch": 21} {"train_loss": -4.38599967956543, "global_step": 3541, "epoch": 21} {"train_loss": -4.626826286315918, "global_step": 3542, "epoch": 21} {"train_loss": -4.677602767944336, "global_step": 3543, "epoch": 21} {"train_loss": -4.564384460449219, "global_step": 3544, "epoch": 21} {"train_loss": -4.379533767700195, "global_step": 3545, "epoch": 21} {"train_loss": -4.547176837921143, "global_step": 3546, "epoch": 21} {"train_loss": -4.778575897216797, "global_step": 3547, "epoch": 21} {"train_loss": -4.564421653747559, "global_step": 3548, "epoch": 21} {"train_loss": -4.335693359375, "global_step": 3549, "epoch": 21} {"train_loss": -4.699044227600098, "global_step": 3550, "epoch": 21} {"train_loss": -4.742284297943115, "global_step": 3551, "epoch": 21} {"train_loss": -4.64472770690918, "global_step": 3552, "epoch": 21} {"train_loss": -4.75178337097168, "global_step": 3553, "epoch": 21} {"train_loss": -4.462671279907227, "global_step": 3554, "epoch": 21} {"train_loss": -4.500514030456543, "global_step": 3555, "epoch": 21} {"train_loss": -4.729666233062744, "global_step": 3556, "epoch": 21} {"train_loss": -4.806492328643799, "global_step": 3557, "epoch": 21} {"train_loss": -4.76479434967041, "global_step": 3558, "epoch": 21} {"train_loss": -4.606484413146973, "global_step": 3559, "epoch": 21} {"train_loss": -4.548795700073242, "global_step": 3560, "epoch": 21} {"train_loss": -4.624420166015625, "global_step": 3561, "epoch": 21} {"train_loss": -4.730337142944336, "global_step": 3562, "epoch": 21} {"train_loss": -4.604283809661865, "global_step": 3563, "epoch": 21} {"train_loss": -4.769330978393555, "global_step": 3564, "epoch": 21} {"train_loss": -4.641789436340332, "global_step": 3565, "epoch": 21} {"train_loss": -4.797451972961426, "global_step": 3566, "epoch": 21} {"train_loss": -4.560898303985596, "global_step": 3567, "epoch": 21} {"train_loss": -4.68572998046875, "global_step": 3568, "epoch": 21} {"train_loss": -4.4979658126831055, "global_step": 3569, "epoch": 21} {"train_loss": -4.842403888702393, "global_step": 3570, "epoch": 21} {"train_loss": -4.507120132446289, "global_step": 3571, "epoch": 21} {"train_loss": -4.611448287963867, "global_step": 3572, "epoch": 21} {"train_loss": -4.465888977050781, "global_step": 3573, "epoch": 21} {"train_loss": -4.630227088928223, "global_step": 3574, "epoch": 21} {"train_loss": -4.599409580230713, "global_step": 3575, "epoch": 21} {"train_loss": -4.723219871520996, "global_step": 3576, "epoch": 21} {"train_loss": -4.435143947601318, "global_step": 3577, "epoch": 21} {"train_loss": -4.645563125610352, "global_step": 3578, "epoch": 21} {"train_loss": -4.650564193725586, "global_step": 3579, "epoch": 21} {"train_loss": -4.381707668304443, "global_step": 3580, "epoch": 21} {"train_loss": -4.832451343536377, "global_step": 3581, "epoch": 21} {"train_loss": -4.5069732666015625, "global_step": 3582, "epoch": 21} {"train_loss": -4.885404109954834, "global_step": 3583, "epoch": 21} {"train_loss": -4.666545867919922, "global_step": 3584, "epoch": 21} {"train_loss": -4.6737165451049805, "global_step": 3585, "epoch": 21} {"train_loss": -4.663029670715332, "global_step": 3586, "epoch": 21} {"train_loss": -4.545474052429199, "global_step": 3587, "epoch": 21} {"train_loss": -4.895216941833496, "global_step": 3588, "epoch": 21} {"train_loss": -4.821102142333984, "global_step": 3589, "epoch": 21} {"train_loss": -4.8040266036987305, "global_step": 3590, "epoch": 21} {"train_loss": -4.895659446716309, "global_step": 3591, "epoch": 21} {"train_loss": -4.747565269470215, "global_step": 3592, "epoch": 21} {"train_loss": -5.018268585205078, "global_step": 3593, "epoch": 21} {"train_loss": -4.753754138946533, "global_step": 3594, "epoch": 21} {"train_loss": -5.056317329406738, "global_step": 3595, "epoch": 21} {"train_loss": -4.877111434936523, "global_step": 3596, "epoch": 21} {"train_loss": -4.426572322845459, "global_step": 3597, "epoch": 21} {"train_loss": -4.667567729949951, "global_step": 3598, "epoch": 21} {"train_loss": -4.486340522766113, "global_step": 3599, "epoch": 21} {"train_loss": -4.474438190460205, "global_step": 3600, "epoch": 21} {"train_loss": -4.523970603942871, "global_step": 3601, "epoch": 21} {"train_loss": -4.2781982421875, "global_step": 3602, "epoch": 21} {"train_loss": -4.355015277862549, "global_step": 3603, "epoch": 21} {"train_loss": -4.3997392654418945, "global_step": 3604, "epoch": 21} {"train_loss": -4.539578437805176, "global_step": 3605, "epoch": 21} {"train_loss": -4.503384590148926, "global_step": 3606, "epoch": 21} {"train_loss": -4.551501274108887, "global_step": 3607, "epoch": 21} {"train_loss": -4.590109825134277, "global_step": 3608, "epoch": 21} {"train_loss": -4.786858558654785, "global_step": 3609, "epoch": 21} {"train_loss": -4.348033905029297, "global_step": 3610, "epoch": 21} {"train_loss": -4.83345890045166, "global_step": 3611, "epoch": 21} {"train_loss": -4.443291664123535, "global_step": 3612, "epoch": 21} {"train_loss": -4.595086097717285, "global_step": 3613, "epoch": 21} {"train_loss": -4.5660810470581055, "global_step": 3614, "epoch": 21} {"train_loss": -4.426025390625, "global_step": 3615, "epoch": 21} {"train_loss": -4.430429458618164, "global_step": 3616, "epoch": 21} {"train_loss": -4.446110725402832, "global_step": 3617, "epoch": 21} {"train_loss": -4.553924560546875, "global_step": 3618, "epoch": 21} {"train_loss": -4.839251518249512, "global_step": 3619, "epoch": 21} {"train_loss": -4.561135292053223, "global_step": 3620, "epoch": 21} {"train_loss": -4.397356033325195, "global_step": 3621, "epoch": 21} {"train_loss": -4.548620223999023, "global_step": 3622, "epoch": 21} {"train_loss": -4.775172233581543, "global_step": 3623, "epoch": 21} {"train_loss": -4.899138450622559, "global_step": 3624, "epoch": 21} {"train_loss": -4.518035411834717, "global_step": 3625, "epoch": 21} {"train_loss": -4.530856132507324, "global_step": 3626, "epoch": 21} {"train_loss": -4.502650737762451, "global_step": 3627, "epoch": 21} {"train_loss": -4.873712062835693, "global_step": 3628, "epoch": 21} {"train_loss": -4.617203235626221, "global_step": 3629, "epoch": 21} {"train_loss": -4.584314823150635, "global_step": 3630, "epoch": 21} {"train_loss": -4.748291492462158, "global_step": 3631, "epoch": 21} {"train_loss": -4.676022052764893, "global_step": 3632, "epoch": 21} {"train_loss": -4.735421657562256, "global_step": 3633, "epoch": 21} {"train_loss": -4.741571426391602, "global_step": 3634, "epoch": 21} {"train_loss": -4.807995796203613, "global_step": 3635, "epoch": 21} {"train_loss": -4.558635711669922, "global_step": 3636, "epoch": 21} {"train_loss": -4.805346488952637, "global_step": 3637, "epoch": 21} {"train_loss": -4.553379535675049, "global_step": 3638, "epoch": 21} {"train_loss": -4.456969738006592, "global_step": 3639, "epoch": 21} {"train_loss": -4.8528008460998535, "global_step": 3640, "epoch": 21} {"train_loss": -4.50296688079834, "global_step": 3641, "epoch": 21} {"train_loss": -4.94843864440918, "global_step": 3642, "epoch": 21} {"train_loss": -4.801111221313477, "global_step": 3643, "epoch": 21} {"train_loss": -4.600366592407227, "global_step": 3644, "epoch": 21} {"train_loss": -4.642120838165283, "global_step": 3645, "epoch": 21} {"train_loss": -4.412282466888428, "global_step": 3646, "epoch": 21} {"train_loss": -4.461536884307861, "global_step": 3647, "epoch": 21} {"train_loss": -4.791667938232422, "global_step": 3648, "epoch": 21} {"train_loss": -4.554502487182617, "global_step": 3649, "epoch": 21} {"train_loss": -4.608844757080078, "global_step": 3650, "epoch": 21} {"train_loss": -4.516818046569824, "global_step": 3651, "epoch": 21} {"train_loss": -4.874542236328125, "global_step": 3652, "epoch": 21} {"train_loss": -4.453759670257568, "global_step": 3653, "epoch": 21} {"train_loss": -4.723043441772461, "global_step": 3654, "epoch": 21} {"train_loss": -4.919970512390137, "global_step": 3655, "epoch": 21} {"train_loss": -4.627049922943115, "global_step": 3656, "epoch": 21} {"train_loss": -4.545945167541504, "global_step": 3657, "epoch": 21} {"train_loss": -4.740396022796631, "global_step": 3658, "epoch": 21} {"train_loss": -4.632810592651367, "global_step": 3659, "epoch": 21} {"train_loss": -4.327698707580566, "global_step": 3660, "epoch": 21} {"train_loss": -4.725827217102051, "global_step": 3661, "epoch": 21} {"train_loss": -4.940839767456055, "global_step": 3662, "epoch": 21} {"train_loss": -4.770134925842285, "global_step": 3663, "epoch": 21} {"train_loss": -4.53474235534668, "global_step": 3664, "epoch": 21} {"train_loss": -4.747453689575195, "global_step": 3665, "epoch": 21} {"train_loss": -4.797785758972168, "global_step": 3666, "epoch": 21} {"train_loss": -4.911040306091309, "global_step": 3667, "epoch": 21} {"train_loss": -4.780002593994141, "global_step": 3668, "epoch": 21} {"train_loss": -4.762311935424805, "global_step": 3669, "epoch": 21} {"train_loss": -4.7420244216918945, "global_step": 3670, "epoch": 21} {"train_loss": -4.975291728973389, "global_step": 3671, "epoch": 21} {"train_loss": -4.686551094055176, "global_step": 3672, "epoch": 21} {"train_loss": -4.70673942565918, "global_step": 3673, "epoch": 21} {"train_loss": -4.735119819641113, "global_step": 3674, "epoch": 21} {"train_loss": -4.813089370727539, "global_step": 3675, "epoch": 21} {"train_loss": -4.677299499511719, "global_step": 3676, "epoch": 21} {"train_loss": -4.563215255737305, "global_step": 3677, "epoch": 21} {"train_loss": -4.447426795959473, "global_step": 3678, "epoch": 21} {"train_loss": -4.633397102355957, "global_step": 3679, "epoch": 21} {"train_loss": -4.503441333770752, "global_step": 3680, "epoch": 21} {"train_loss": -4.547593116760254, "global_step": 3681, "epoch": 21} {"train_loss": -4.554416656494141, "global_step": 3682, "epoch": 21} {"train_loss": -4.75763463973999, "global_step": 3683, "epoch": 21} {"train_loss": -4.560685157775879, "global_step": 3684, "epoch": 21} {"train_loss": -4.619035720825195, "global_step": 3685, "epoch": 21} {"train_loss": -4.507590293884277, "global_step": 3686, "epoch": 21} {"train_loss": -4.453274726867676, "global_step": 3687, "epoch": 21} {"train_loss": -4.319451332092285, "global_step": 3688, "epoch": 21} {"train_loss": -4.727473258972168, "global_step": 3689, "epoch": 21} {"train_loss": -4.295429706573486, "global_step": 3690, "epoch": 21} {"train_loss": -4.581607341766357, "global_step": 3691, "epoch": 21} {"train_loss": -4.096545219421387, "global_step": 3692, "epoch": 21} {"train_loss": -4.481484413146973, "global_step": 3693, "epoch": 21} {"train_loss": -4.524413585662842, "global_step": 3694, "epoch": 21} {"train_loss": -4.62552767708188, "global_step": 3695, "epoch": 21, "val_loss": 234204.984375} {"train_loss": -4.420502185821533, "global_step": 3696, "epoch": 22} {"train_loss": -4.4826459884643555, "global_step": 3697, "epoch": 22} {"train_loss": -4.664449691772461, "global_step": 3698, "epoch": 22} {"train_loss": -4.501029014587402, "global_step": 3699, "epoch": 22} {"train_loss": -4.624072551727295, "global_step": 3700, "epoch": 22} {"train_loss": -4.544350624084473, "global_step": 3701, "epoch": 22} {"train_loss": -4.568005561828613, "global_step": 3702, "epoch": 22} {"train_loss": -4.685369491577148, "global_step": 3703, "epoch": 22} {"train_loss": -4.669130325317383, "global_step": 3704, "epoch": 22} {"train_loss": -4.599031448364258, "global_step": 3705, "epoch": 22} {"train_loss": -4.64259147644043, "global_step": 3706, "epoch": 22} {"train_loss": -4.583054542541504, "global_step": 3707, "epoch": 22} {"train_loss": -4.716319561004639, "global_step": 3708, "epoch": 22} {"train_loss": -4.577906608581543, "global_step": 3709, "epoch": 22} {"train_loss": -4.794185638427734, "global_step": 3710, "epoch": 22} {"train_loss": -4.72021484375, "global_step": 3711, "epoch": 22} {"train_loss": -4.607235908508301, "global_step": 3712, "epoch": 22} {"train_loss": -4.649820327758789, "global_step": 3713, "epoch": 22} {"train_loss": -4.509599208831787, "global_step": 3714, "epoch": 22} {"train_loss": -4.494485378265381, "global_step": 3715, "epoch": 22} {"train_loss": -4.537681579589844, "global_step": 3716, "epoch": 22} {"train_loss": -4.481473445892334, "global_step": 3717, "epoch": 22} {"train_loss": -4.515651702880859, "global_step": 3718, "epoch": 22} {"train_loss": -4.1491804122924805, "global_step": 3719, "epoch": 22} {"train_loss": -4.4544878005981445, "global_step": 3720, "epoch": 22} {"train_loss": -4.564313888549805, "global_step": 3721, "epoch": 22} {"train_loss": -4.261988162994385, "global_step": 3722, "epoch": 22} {"train_loss": -4.456695556640625, "global_step": 3723, "epoch": 22} {"train_loss": -4.623387336730957, "global_step": 3724, "epoch": 22} {"train_loss": -4.698765754699707, "global_step": 3725, "epoch": 22} {"train_loss": -4.444356918334961, "global_step": 3726, "epoch": 22} {"train_loss": -4.602670669555664, "global_step": 3727, "epoch": 22} {"train_loss": -4.631732940673828, "global_step": 3728, "epoch": 22} {"train_loss": -4.732417106628418, "global_step": 3729, "epoch": 22} {"train_loss": -4.910409450531006, "global_step": 3730, "epoch": 22} {"train_loss": -4.599102020263672, "global_step": 3731, "epoch": 22} {"train_loss": -4.706018924713135, "global_step": 3732, "epoch": 22} {"train_loss": -4.514527320861816, "global_step": 3733, "epoch": 22} {"train_loss": -4.6706976890563965, "global_step": 3734, "epoch": 22} {"train_loss": -4.827245235443115, "global_step": 3735, "epoch": 22} {"train_loss": -4.617587566375732, "global_step": 3736, "epoch": 22} {"train_loss": -4.573351860046387, "global_step": 3737, "epoch": 22} {"train_loss": -4.773726940155029, "global_step": 3738, "epoch": 22} {"train_loss": -4.891419410705566, "global_step": 3739, "epoch": 22} {"train_loss": -4.7113494873046875, "global_step": 3740, "epoch": 22} {"train_loss": -4.846540451049805, "global_step": 3741, "epoch": 22} {"train_loss": -4.814154148101807, "global_step": 3742, "epoch": 22} {"train_loss": -4.452154159545898, "global_step": 3743, "epoch": 22} {"train_loss": -4.521486759185791, "global_step": 3744, "epoch": 22} {"train_loss": -4.7641448974609375, "global_step": 3745, "epoch": 22} {"train_loss": -4.6625165939331055, "global_step": 3746, "epoch": 22} {"train_loss": -4.700237274169922, "global_step": 3747, "epoch": 22} {"train_loss": -4.549553394317627, "global_step": 3748, "epoch": 22} {"train_loss": -4.635263442993164, "global_step": 3749, "epoch": 22} {"train_loss": -4.870484352111816, "global_step": 3750, "epoch": 22} {"train_loss": -4.831915855407715, "global_step": 3751, "epoch": 22} {"train_loss": -4.796051025390625, "global_step": 3752, "epoch": 22} {"train_loss": -4.720480442047119, "global_step": 3753, "epoch": 22} {"train_loss": -4.56941032409668, "global_step": 3754, "epoch": 22} {"train_loss": -4.757791519165039, "global_step": 3755, "epoch": 22} {"train_loss": -4.788124084472656, "global_step": 3756, "epoch": 22} {"train_loss": -4.661851406097412, "global_step": 3757, "epoch": 22} {"train_loss": -4.671795845031738, "global_step": 3758, "epoch": 22} {"train_loss": -4.933075904846191, "global_step": 3759, "epoch": 22} {"train_loss": -4.687494277954102, "global_step": 3760, "epoch": 22} {"train_loss": -4.722322940826416, "global_step": 3761, "epoch": 22} {"train_loss": -4.592875003814697, "global_step": 3762, "epoch": 22} {"train_loss": -4.482322692871094, "global_step": 3763, "epoch": 22} {"train_loss": -4.721083641052246, "global_step": 3764, "epoch": 22} {"train_loss": -4.814327239990234, "global_step": 3765, "epoch": 22} {"train_loss": -4.606346607208252, "global_step": 3766, "epoch": 22} {"train_loss": -4.698288917541504, "global_step": 3767, "epoch": 22} {"train_loss": -4.621715068817139, "global_step": 3768, "epoch": 22} {"train_loss": -4.76460075378418, "global_step": 3769, "epoch": 22} {"train_loss": -4.913066864013672, "global_step": 3770, "epoch": 22} {"train_loss": -4.672696590423584, "global_step": 3771, "epoch": 22} {"train_loss": -4.6426496505737305, "global_step": 3772, "epoch": 22} {"train_loss": -4.674249649047852, "global_step": 3773, "epoch": 22} {"train_loss": -4.622709274291992, "global_step": 3774, "epoch": 22} {"train_loss": -4.452927589416504, "global_step": 3775, "epoch": 22} {"train_loss": -4.413628578186035, "global_step": 3776, "epoch": 22} {"train_loss": -4.639691352844238, "global_step": 3777, "epoch": 22} {"train_loss": -4.490238189697266, "global_step": 3778, "epoch": 22} {"train_loss": -4.868499755859375, "global_step": 3779, "epoch": 22} {"train_loss": -4.530849456787109, "global_step": 3780, "epoch": 22} {"train_loss": -4.429128170013428, "global_step": 3781, "epoch": 22} {"train_loss": -4.814584255218506, "global_step": 3782, "epoch": 22} {"train_loss": -4.640707969665527, "global_step": 3783, "epoch": 22} {"train_loss": -4.4563164710998535, "global_step": 3784, "epoch": 22} {"train_loss": -4.45182466506958, "global_step": 3785, "epoch": 22} {"train_loss": -4.5643510818481445, "global_step": 3786, "epoch": 22} {"train_loss": -4.957301139831543, "global_step": 3787, "epoch": 22} {"train_loss": -4.47556209564209, "global_step": 3788, "epoch": 22} {"train_loss": -4.6689372062683105, "global_step": 3789, "epoch": 22} {"train_loss": -4.532905578613281, "global_step": 3790, "epoch": 22} {"train_loss": -4.696979999542236, "global_step": 3791, "epoch": 22} {"train_loss": -4.541815280914307, "global_step": 3792, "epoch": 22} {"train_loss": -4.38576078414917, "global_step": 3793, "epoch": 22} {"train_loss": -4.638903617858887, "global_step": 3794, "epoch": 22} {"train_loss": -4.876395225524902, "global_step": 3795, "epoch": 22} {"train_loss": -4.667771339416504, "global_step": 3796, "epoch": 22} {"train_loss": -4.849283218383789, "global_step": 3797, "epoch": 22} {"train_loss": -5.014860153198242, "global_step": 3798, "epoch": 22} {"train_loss": -4.535897254943848, "global_step": 3799, "epoch": 22} {"train_loss": -4.467679023742676, "global_step": 3800, "epoch": 22} {"train_loss": -4.583191394805908, "global_step": 3801, "epoch": 22} {"train_loss": -4.589499473571777, "global_step": 3802, "epoch": 22} {"train_loss": -4.89044189453125, "global_step": 3803, "epoch": 22} {"train_loss": -4.870748519897461, "global_step": 3804, "epoch": 22} {"train_loss": -4.6359357833862305, "global_step": 3805, "epoch": 22} {"train_loss": -4.674920082092285, "global_step": 3806, "epoch": 22} {"train_loss": -4.738212585449219, "global_step": 3807, "epoch": 22} {"train_loss": -4.688000679016113, "global_step": 3808, "epoch": 22} {"train_loss": -4.490300178527832, "global_step": 3809, "epoch": 22} {"train_loss": -4.553711891174316, "global_step": 3810, "epoch": 22} {"train_loss": -4.7954182624816895, "global_step": 3811, "epoch": 22} {"train_loss": -4.80918025970459, "global_step": 3812, "epoch": 22} {"train_loss": -4.910186767578125, "global_step": 3813, "epoch": 22} {"train_loss": -4.628601551055908, "global_step": 3814, "epoch": 22} {"train_loss": -4.5956950187683105, "global_step": 3815, "epoch": 22} {"train_loss": -5.013458251953125, "global_step": 3816, "epoch": 22} {"train_loss": -4.837721824645996, "global_step": 3817, "epoch": 22} {"train_loss": -4.941559791564941, "global_step": 3818, "epoch": 22} {"train_loss": -4.920679092407227, "global_step": 3819, "epoch": 22} {"train_loss": -4.372596740722656, "global_step": 3820, "epoch": 22} {"train_loss": -4.913771629333496, "global_step": 3821, "epoch": 22} {"train_loss": -4.646909713745117, "global_step": 3822, "epoch": 22} {"train_loss": -4.663674354553223, "global_step": 3823, "epoch": 22} {"train_loss": -4.698648452758789, "global_step": 3824, "epoch": 22} {"train_loss": -4.605159759521484, "global_step": 3825, "epoch": 22} {"train_loss": -4.714917182922363, "global_step": 3826, "epoch": 22} {"train_loss": -4.862551689147949, "global_step": 3827, "epoch": 22} {"train_loss": -4.632979869842529, "global_step": 3828, "epoch": 22} {"train_loss": -4.600736141204834, "global_step": 3829, "epoch": 22} {"train_loss": -4.697882175445557, "global_step": 3830, "epoch": 22} {"train_loss": -4.636794090270996, "global_step": 3831, "epoch": 22} {"train_loss": -4.530817985534668, "global_step": 3832, "epoch": 22} {"train_loss": -4.665256500244141, "global_step": 3833, "epoch": 22} {"train_loss": -4.4801740646362305, "global_step": 3834, "epoch": 22} {"train_loss": -4.414571762084961, "global_step": 3835, "epoch": 22} {"train_loss": -3.994089126586914, "global_step": 3836, "epoch": 22} {"train_loss": -4.478185653686523, "global_step": 3837, "epoch": 22} {"train_loss": -4.599767684936523, "global_step": 3838, "epoch": 22} {"train_loss": -4.517793655395508, "global_step": 3839, "epoch": 22} {"train_loss": -4.373197078704834, "global_step": 3840, "epoch": 22} {"train_loss": -4.534919261932373, "global_step": 3841, "epoch": 22} {"train_loss": -4.248764991760254, "global_step": 3842, "epoch": 22} {"train_loss": -4.456544399261475, "global_step": 3843, "epoch": 22} {"train_loss": -4.637406826019287, "global_step": 3844, "epoch": 22} {"train_loss": -4.5730509757995605, "global_step": 3845, "epoch": 22} {"train_loss": -4.354266166687012, "global_step": 3846, "epoch": 22} {"train_loss": -4.781620502471924, "global_step": 3847, "epoch": 22} {"train_loss": -4.684154987335205, "global_step": 3848, "epoch": 22} {"train_loss": -4.599112510681152, "global_step": 3849, "epoch": 22} {"train_loss": -4.690127372741699, "global_step": 3850, "epoch": 22} {"train_loss": -4.803339958190918, "global_step": 3851, "epoch": 22} {"train_loss": -4.778426170349121, "global_step": 3852, "epoch": 22} {"train_loss": -4.803927421569824, "global_step": 3853, "epoch": 22} {"train_loss": -4.668467998504639, "global_step": 3854, "epoch": 22} {"train_loss": -4.824470520019531, "global_step": 3855, "epoch": 22} {"train_loss": -4.67721700668335, "global_step": 3856, "epoch": 22} {"train_loss": -4.765744209289551, "global_step": 3857, "epoch": 22} {"train_loss": -4.622133255004883, "global_step": 3858, "epoch": 22} {"train_loss": -4.793427467346191, "global_step": 3859, "epoch": 22} {"train_loss": -4.450893402099609, "global_step": 3860, "epoch": 22} {"train_loss": -4.549293041229248, "global_step": 3861, "epoch": 22} {"train_loss": -4.673469543457031, "global_step": 3862, "epoch": 22} {"train_loss": -4.639565885066986, "global_step": 3863, "epoch": 22, "val_loss": 252966.296875} {"train_loss": -4.714336395263672, "global_step": 3864, "epoch": 23} {"train_loss": -4.59266471862793, "global_step": 3865, "epoch": 23} {"train_loss": -4.759437561035156, "global_step": 3866, "epoch": 23} {"train_loss": -4.752251625061035, "global_step": 3867, "epoch": 23} {"train_loss": -4.465363025665283, "global_step": 3868, "epoch": 23} {"train_loss": -4.75638484954834, "global_step": 3869, "epoch": 23} {"train_loss": -4.421265602111816, "global_step": 3870, "epoch": 23} {"train_loss": -4.353655815124512, "global_step": 3871, "epoch": 23} {"train_loss": -4.908334732055664, "global_step": 3872, "epoch": 23} {"train_loss": -4.540380477905273, "global_step": 3873, "epoch": 23} {"train_loss": -4.574797630310059, "global_step": 3874, "epoch": 23} {"train_loss": -4.620124816894531, "global_step": 3875, "epoch": 23} {"train_loss": -4.596124172210693, "global_step": 3876, "epoch": 23} {"train_loss": -4.736130714416504, "global_step": 3877, "epoch": 23} {"train_loss": -4.62336540222168, "global_step": 3878, "epoch": 23} {"train_loss": -4.461919784545898, "global_step": 3879, "epoch": 23} {"train_loss": -4.508886814117432, "global_step": 3880, "epoch": 23} {"train_loss": -4.747322082519531, "global_step": 3881, "epoch": 23} {"train_loss": -4.946751594543457, "global_step": 3882, "epoch": 23} {"train_loss": -4.748969078063965, "global_step": 3883, "epoch": 23} {"train_loss": -4.754240989685059, "global_step": 3884, "epoch": 23} {"train_loss": -4.668696403503418, "global_step": 3885, "epoch": 23} {"train_loss": -4.560712814331055, "global_step": 3886, "epoch": 23} {"train_loss": -4.744974136352539, "global_step": 3887, "epoch": 23} {"train_loss": -4.877851486206055, "global_step": 3888, "epoch": 23} {"train_loss": -4.628925323486328, "global_step": 3889, "epoch": 23} {"train_loss": -5.008167266845703, "global_step": 3890, "epoch": 23} {"train_loss": -4.649552345275879, "global_step": 3891, "epoch": 23} {"train_loss": -4.834137916564941, "global_step": 3892, "epoch": 23} {"train_loss": -4.507631301879883, "global_step": 3893, "epoch": 23} {"train_loss": -4.807791709899902, "global_step": 3894, "epoch": 23} {"train_loss": -4.638891220092773, "global_step": 3895, "epoch": 23} {"train_loss": -4.681671142578125, "global_step": 3896, "epoch": 23} {"train_loss": -4.63902473449707, "global_step": 3897, "epoch": 23} {"train_loss": -4.590794563293457, "global_step": 3898, "epoch": 23} {"train_loss": -4.643989562988281, "global_step": 3899, "epoch": 23} {"train_loss": -4.492277145385742, "global_step": 3900, "epoch": 23} {"train_loss": -4.941625595092773, "global_step": 3901, "epoch": 23} {"train_loss": -4.837655544281006, "global_step": 3902, "epoch": 23} {"train_loss": -4.693707466125488, "global_step": 3903, "epoch": 23} {"train_loss": -4.819967746734619, "global_step": 3904, "epoch": 23} {"train_loss": -4.959033012390137, "global_step": 3905, "epoch": 23} {"train_loss": -4.8019585609436035, "global_step": 3906, "epoch": 23} {"train_loss": -4.3116607666015625, "global_step": 3907, "epoch": 23} {"train_loss": -4.696203231811523, "global_step": 3908, "epoch": 23} {"train_loss": -4.357326030731201, "global_step": 3909, "epoch": 23} {"train_loss": -4.646396636962891, "global_step": 3910, "epoch": 23} {"train_loss": -4.357165813446045, "global_step": 3911, "epoch": 23} {"train_loss": -4.249135494232178, "global_step": 3912, "epoch": 23} {"train_loss": -4.493805885314941, "global_step": 3913, "epoch": 23} {"train_loss": -4.775204658508301, "global_step": 3914, "epoch": 23} {"train_loss": -4.522790431976318, "global_step": 3915, "epoch": 23} {"train_loss": -4.790457725524902, "global_step": 3916, "epoch": 23} {"train_loss": -4.790160179138184, "global_step": 3917, "epoch": 23} {"train_loss": -4.7029876708984375, "global_step": 3918, "epoch": 23} {"train_loss": -4.533006191253662, "global_step": 3919, "epoch": 23} {"train_loss": -4.758582592010498, "global_step": 3920, "epoch": 23} {"train_loss": -4.5768961906433105, "global_step": 3921, "epoch": 23} {"train_loss": -4.6272711753845215, "global_step": 3922, "epoch": 23} {"train_loss": -4.465738296508789, "global_step": 3923, "epoch": 23} {"train_loss": -4.523942947387695, "global_step": 3924, "epoch": 23} {"train_loss": -4.86640739440918, "global_step": 3925, "epoch": 23} {"train_loss": -4.88559627532959, "global_step": 3926, "epoch": 23} {"train_loss": -4.61082649230957, "global_step": 3927, "epoch": 23} {"train_loss": -4.80223274230957, "global_step": 3928, "epoch": 23} {"train_loss": -4.818611145019531, "global_step": 3929, "epoch": 23} {"train_loss": -4.81561279296875, "global_step": 3930, "epoch": 23} {"train_loss": -4.718568325042725, "global_step": 3931, "epoch": 23} {"train_loss": -4.777864456176758, "global_step": 3932, "epoch": 23} {"train_loss": -4.833755016326904, "global_step": 3933, "epoch": 23} {"train_loss": -4.785317897796631, "global_step": 3934, "epoch": 23} {"train_loss": -4.59359073638916, "global_step": 3935, "epoch": 23} {"train_loss": -4.6611104011535645, "global_step": 3936, "epoch": 23} {"train_loss": -4.7653021812438965, "global_step": 3937, "epoch": 23} {"train_loss": -4.750589370727539, "global_step": 3938, "epoch": 23} {"train_loss": -4.637564659118652, "global_step": 3939, "epoch": 23} {"train_loss": -4.743231773376465, "global_step": 3940, "epoch": 23} {"train_loss": -4.8144659996032715, "global_step": 3941, "epoch": 23} {"train_loss": -4.98494815826416, "global_step": 3942, "epoch": 23} {"train_loss": -4.945901870727539, "global_step": 3943, "epoch": 23} {"train_loss": -4.823514461517334, "global_step": 3944, "epoch": 23} {"train_loss": -4.7192254066467285, "global_step": 3945, "epoch": 23} {"train_loss": -4.880684852600098, "global_step": 3946, "epoch": 23} {"train_loss": -4.992088794708252, "global_step": 3947, "epoch": 23} {"train_loss": -4.99467658996582, "global_step": 3948, "epoch": 23} {"train_loss": -4.644931793212891, "global_step": 3949, "epoch": 23} {"train_loss": -4.819990158081055, "global_step": 3950, "epoch": 23} {"train_loss": -4.903128623962402, "global_step": 3951, "epoch": 23} {"train_loss": -4.886053562164307, "global_step": 3952, "epoch": 23} {"train_loss": -4.57327938079834, "global_step": 3953, "epoch": 23} {"train_loss": -5.044654846191406, "global_step": 3954, "epoch": 23} {"train_loss": -4.854414939880371, "global_step": 3955, "epoch": 23} {"train_loss": -4.748442649841309, "global_step": 3956, "epoch": 23} {"train_loss": -4.886510848999023, "global_step": 3957, "epoch": 23} {"train_loss": -4.836514472961426, "global_step": 3958, "epoch": 23} {"train_loss": -4.743654251098633, "global_step": 3959, "epoch": 23} {"train_loss": -4.678902626037598, "global_step": 3960, "epoch": 23} {"train_loss": -5.030837059020996, "global_step": 3961, "epoch": 23} {"train_loss": -4.703843593597412, "global_step": 3962, "epoch": 23} {"train_loss": -4.768636703491211, "global_step": 3963, "epoch": 23} {"train_loss": -4.92746639251709, "global_step": 3964, "epoch": 23} {"train_loss": -4.872644424438477, "global_step": 3965, "epoch": 23} {"train_loss": -4.766354560852051, "global_step": 3966, "epoch": 23} {"train_loss": -4.573368072509766, "global_step": 3967, "epoch": 23} {"train_loss": -4.938467502593994, "global_step": 3968, "epoch": 23} {"train_loss": -4.7926506996154785, "global_step": 3969, "epoch": 23} {"train_loss": -4.575352668762207, "global_step": 3970, "epoch": 23} {"train_loss": -4.92002010345459, "global_step": 3971, "epoch": 23} {"train_loss": -4.663995742797852, "global_step": 3972, "epoch": 23} {"train_loss": -4.617547512054443, "global_step": 3973, "epoch": 23} {"train_loss": -4.7433180809021, "global_step": 3974, "epoch": 23} {"train_loss": -4.980523109436035, "global_step": 3975, "epoch": 23} {"train_loss": -4.443158149719238, "global_step": 3976, "epoch": 23} {"train_loss": -4.814264297485352, "global_step": 3977, "epoch": 23} {"train_loss": -4.582000732421875, "global_step": 3978, "epoch": 23} {"train_loss": -4.659921646118164, "global_step": 3979, "epoch": 23} {"train_loss": -4.912292957305908, "global_step": 3980, "epoch": 23} {"train_loss": -4.493094444274902, "global_step": 3981, "epoch": 23} {"train_loss": -4.714155197143555, "global_step": 3982, "epoch": 23} {"train_loss": -4.789871692657471, "global_step": 3983, "epoch": 23} {"train_loss": -4.727847099304199, "global_step": 3984, "epoch": 23} {"train_loss": -4.5592546463012695, "global_step": 3985, "epoch": 23} {"train_loss": -4.640676498413086, "global_step": 3986, "epoch": 23} {"train_loss": -4.661361217498779, "global_step": 3987, "epoch": 23} {"train_loss": -4.923595428466797, "global_step": 3988, "epoch": 23} {"train_loss": -4.535396575927734, "global_step": 3989, "epoch": 23} {"train_loss": -4.862729072570801, "global_step": 3990, "epoch": 23} {"train_loss": -4.683479309082031, "global_step": 3991, "epoch": 23} {"train_loss": -4.786649227142334, "global_step": 3992, "epoch": 23} {"train_loss": -4.578676223754883, "global_step": 3993, "epoch": 23} {"train_loss": -4.351768493652344, "global_step": 3994, "epoch": 23} {"train_loss": -4.924761772155762, "global_step": 3995, "epoch": 23} {"train_loss": -4.621190547943115, "global_step": 3996, "epoch": 23} {"train_loss": -4.753025054931641, "global_step": 3997, "epoch": 23} {"train_loss": -4.772890090942383, "global_step": 3998, "epoch": 23} {"train_loss": -4.971697807312012, "global_step": 3999, "epoch": 23} {"train_loss": -4.921050071716309, "global_step": 4000, "epoch": 23} {"train_loss": -4.758460998535156, "global_step": 4001, "epoch": 23} {"train_loss": -4.817498207092285, "global_step": 4002, "epoch": 23} {"train_loss": -4.806148529052734, "global_step": 4003, "epoch": 23} {"train_loss": -4.716155052185059, "global_step": 4004, "epoch": 23} {"train_loss": -4.81711483001709, "global_step": 4005, "epoch": 23} {"train_loss": -4.8400139808654785, "global_step": 4006, "epoch": 23} {"train_loss": -4.485135078430176, "global_step": 4007, "epoch": 23} {"train_loss": -4.925463676452637, "global_step": 4008, "epoch": 23} {"train_loss": -4.569452285766602, "global_step": 4009, "epoch": 23} {"train_loss": -4.936802864074707, "global_step": 4010, "epoch": 23} {"train_loss": -4.63722038269043, "global_step": 4011, "epoch": 23} {"train_loss": -4.814265727996826, "global_step": 4012, "epoch": 23} {"train_loss": -4.586891174316406, "global_step": 4013, "epoch": 23} {"train_loss": -4.312190532684326, "global_step": 4014, "epoch": 23} {"train_loss": -4.965139389038086, "global_step": 4015, "epoch": 23} {"train_loss": -4.75698184967041, "global_step": 4016, "epoch": 23} {"train_loss": -4.5164875984191895, "global_step": 4017, "epoch": 23} {"train_loss": -4.851728439331055, "global_step": 4018, "epoch": 23} {"train_loss": -4.546668529510498, "global_step": 4019, "epoch": 23} {"train_loss": -4.845782279968262, "global_step": 4020, "epoch": 23} {"train_loss": -4.467713356018066, "global_step": 4021, "epoch": 23} {"train_loss": -4.770361423492432, "global_step": 4022, "epoch": 23} {"train_loss": -4.339639663696289, "global_step": 4023, "epoch": 23} {"train_loss": -4.522995948791504, "global_step": 4024, "epoch": 23} {"train_loss": -4.683725833892822, "global_step": 4025, "epoch": 23} {"train_loss": -4.591978549957275, "global_step": 4026, "epoch": 23} {"train_loss": -4.844927787780762, "global_step": 4027, "epoch": 23} {"train_loss": -4.7729291915893555, "global_step": 4028, "epoch": 23} {"train_loss": -4.454242706298828, "global_step": 4029, "epoch": 23} {"train_loss": -4.560608386993408, "global_step": 4030, "epoch": 23} {"train_loss": -4.710051701182411, "global_step": 4031, "epoch": 23, "val_loss": 261890.84375} {"train_loss": -4.573364734649658, "global_step": 4032, "epoch": 24} {"train_loss": -4.500032424926758, "global_step": 4033, "epoch": 24} {"train_loss": -4.751049995422363, "global_step": 4034, "epoch": 24} {"train_loss": -4.705296993255615, "global_step": 4035, "epoch": 24} {"train_loss": -4.786771297454834, "global_step": 4036, "epoch": 24} {"train_loss": -4.681614875793457, "global_step": 4037, "epoch": 24} {"train_loss": -4.848701477050781, "global_step": 4038, "epoch": 24} {"train_loss": -4.580751419067383, "global_step": 4039, "epoch": 24} {"train_loss": -4.840174674987793, "global_step": 4040, "epoch": 24} {"train_loss": -4.611476898193359, "global_step": 4041, "epoch": 24} {"train_loss": -4.847302436828613, "global_step": 4042, "epoch": 24} {"train_loss": -5.087834358215332, "global_step": 4043, "epoch": 24} {"train_loss": -4.592446327209473, "global_step": 4044, "epoch": 24} {"train_loss": -4.808716297149658, "global_step": 4045, "epoch": 24} {"train_loss": -4.771482467651367, "global_step": 4046, "epoch": 24} {"train_loss": -4.777955532073975, "global_step": 4047, "epoch": 24} {"train_loss": -4.785849571228027, "global_step": 4048, "epoch": 24} {"train_loss": -4.826819896697998, "global_step": 4049, "epoch": 24} {"train_loss": -4.832082271575928, "global_step": 4050, "epoch": 24} {"train_loss": -4.794234275817871, "global_step": 4051, "epoch": 24} {"train_loss": -4.867228031158447, "global_step": 4052, "epoch": 24} {"train_loss": -4.658010959625244, "global_step": 4053, "epoch": 24} {"train_loss": -4.913474082946777, "global_step": 4054, "epoch": 24} {"train_loss": -4.81510591506958, "global_step": 4055, "epoch": 24} {"train_loss": -4.747312545776367, "global_step": 4056, "epoch": 24} {"train_loss": -4.827896595001221, "global_step": 4057, "epoch": 24} {"train_loss": -4.51446533203125, "global_step": 4058, "epoch": 24} {"train_loss": -4.824485778808594, "global_step": 4059, "epoch": 24} {"train_loss": -4.399690628051758, "global_step": 4060, "epoch": 24} {"train_loss": -4.957269668579102, "global_step": 4061, "epoch": 24} {"train_loss": -4.387126445770264, "global_step": 4062, "epoch": 24} {"train_loss": -4.729370594024658, "global_step": 4063, "epoch": 24} {"train_loss": -4.825955390930176, "global_step": 4064, "epoch": 24} {"train_loss": -4.717182159423828, "global_step": 4065, "epoch": 24} {"train_loss": -4.908198833465576, "global_step": 4066, "epoch": 24} {"train_loss": -4.434401512145996, "global_step": 4067, "epoch": 24} {"train_loss": -4.677968978881836, "global_step": 4068, "epoch": 24} {"train_loss": -4.688259124755859, "global_step": 4069, "epoch": 24} {"train_loss": -4.449853897094727, "global_step": 4070, "epoch": 24} {"train_loss": -4.698735237121582, "global_step": 4071, "epoch": 24} {"train_loss": -4.8998260498046875, "global_step": 4072, "epoch": 24} {"train_loss": -4.874112129211426, "global_step": 4073, "epoch": 24} {"train_loss": -5.064230918884277, "global_step": 4074, "epoch": 24} {"train_loss": -4.870690822601318, "global_step": 4075, "epoch": 24} {"train_loss": -4.850611209869385, "global_step": 4076, "epoch": 24} {"train_loss": -4.747165679931641, "global_step": 4077, "epoch": 24} {"train_loss": -5.0433502197265625, "global_step": 4078, "epoch": 24} {"train_loss": -4.875207901000977, "global_step": 4079, "epoch": 24} {"train_loss": -4.659971714019775, "global_step": 4080, "epoch": 24} {"train_loss": -5.035418510437012, "global_step": 4081, "epoch": 24} {"train_loss": -4.600556373596191, "global_step": 4082, "epoch": 24} {"train_loss": -4.918515205383301, "global_step": 4083, "epoch": 24} {"train_loss": -4.733001708984375, "global_step": 4084, "epoch": 24} {"train_loss": -4.976907253265381, "global_step": 4085, "epoch": 24} {"train_loss": -4.9704389572143555, "global_step": 4086, "epoch": 24} {"train_loss": -4.660925388336182, "global_step": 4087, "epoch": 24} {"train_loss": -4.690007209777832, "global_step": 4088, "epoch": 24} {"train_loss": -4.7942585945129395, "global_step": 4089, "epoch": 24} {"train_loss": -4.62138032913208, "global_step": 4090, "epoch": 24} {"train_loss": -4.643038749694824, "global_step": 4091, "epoch": 24} {"train_loss": -4.588614463806152, "global_step": 4092, "epoch": 24} {"train_loss": -4.712305068969727, "global_step": 4093, "epoch": 24} {"train_loss": -4.823068141937256, "global_step": 4094, "epoch": 24} {"train_loss": -4.632597923278809, "global_step": 4095, "epoch": 24} {"train_loss": -4.929129600524902, "global_step": 4096, "epoch": 24} {"train_loss": -4.726443290710449, "global_step": 4097, "epoch": 24} {"train_loss": -4.936434745788574, "global_step": 4098, "epoch": 24} {"train_loss": -4.786451816558838, "global_step": 4099, "epoch": 24} {"train_loss": -4.40082311630249, "global_step": 4100, "epoch": 24} {"train_loss": -4.880873680114746, "global_step": 4101, "epoch": 24} {"train_loss": -4.574850559234619, "global_step": 4102, "epoch": 24} {"train_loss": -4.685924530029297, "global_step": 4103, "epoch": 24} {"train_loss": -4.71350622177124, "global_step": 4104, "epoch": 24} {"train_loss": -4.687417507171631, "global_step": 4105, "epoch": 24} {"train_loss": -4.987308025360107, "global_step": 4106, "epoch": 24} {"train_loss": -4.72998571395874, "global_step": 4107, "epoch": 24} {"train_loss": -4.999342918395996, "global_step": 4108, "epoch": 24} {"train_loss": -4.6889801025390625, "global_step": 4109, "epoch": 24} {"train_loss": -4.8755059242248535, "global_step": 4110, "epoch": 24} {"train_loss": -4.780474662780762, "global_step": 4111, "epoch": 24} {"train_loss": -4.817792892456055, "global_step": 4112, "epoch": 24} {"train_loss": -5.039706230163574, "global_step": 4113, "epoch": 24} {"train_loss": -4.893991470336914, "global_step": 4114, "epoch": 24} {"train_loss": -5.020554542541504, "global_step": 4115, "epoch": 24} {"train_loss": -4.527804851531982, "global_step": 4116, "epoch": 24} {"train_loss": -4.842242240905762, "global_step": 4117, "epoch": 24} {"train_loss": -4.629537105560303, "global_step": 4118, "epoch": 24} {"train_loss": -4.926776885986328, "global_step": 4119, "epoch": 24} {"train_loss": -4.727436065673828, "global_step": 4120, "epoch": 24} {"train_loss": -4.7075934410095215, "global_step": 4121, "epoch": 24} {"train_loss": -4.817762851715088, "global_step": 4122, "epoch": 24} {"train_loss": -4.294447898864746, "global_step": 4123, "epoch": 24} {"train_loss": -4.7883830070495605, "global_step": 4124, "epoch": 24} {"train_loss": -4.402541160583496, "global_step": 4125, "epoch": 24} {"train_loss": -4.346685409545898, "global_step": 4126, "epoch": 24} {"train_loss": -4.443319320678711, "global_step": 4127, "epoch": 24} {"train_loss": -4.642157077789307, "global_step": 4128, "epoch": 24} {"train_loss": -4.4612650871276855, "global_step": 4129, "epoch": 24} {"train_loss": -4.1454057693481445, "global_step": 4130, "epoch": 24} {"train_loss": -4.400472164154053, "global_step": 4131, "epoch": 24} {"train_loss": -4.492271423339844, "global_step": 4132, "epoch": 24} {"train_loss": -4.281617164611816, "global_step": 4133, "epoch": 24} {"train_loss": -4.330087184906006, "global_step": 4134, "epoch": 24} {"train_loss": -4.542065620422363, "global_step": 4135, "epoch": 24} {"train_loss": -4.569908142089844, "global_step": 4136, "epoch": 24} {"train_loss": -4.541250705718994, "global_step": 4137, "epoch": 24} {"train_loss": -4.3802971839904785, "global_step": 4138, "epoch": 24} {"train_loss": -4.51629638671875, "global_step": 4139, "epoch": 24} {"train_loss": -4.663906097412109, "global_step": 4140, "epoch": 24} {"train_loss": -4.7373456954956055, "global_step": 4141, "epoch": 24} {"train_loss": -4.884232521057129, "global_step": 4142, "epoch": 24} {"train_loss": -4.647111892700195, "global_step": 4143, "epoch": 24} {"train_loss": -4.671363830566406, "global_step": 4144, "epoch": 24} {"train_loss": -4.772821426391602, "global_step": 4145, "epoch": 24} {"train_loss": -4.904225826263428, "global_step": 4146, "epoch": 24} {"train_loss": -4.579505920410156, "global_step": 4147, "epoch": 24} {"train_loss": -4.9877166748046875, "global_step": 4148, "epoch": 24} {"train_loss": -4.85926628112793, "global_step": 4149, "epoch": 24} {"train_loss": -4.842668056488037, "global_step": 4150, "epoch": 24} {"train_loss": -4.843923568725586, "global_step": 4151, "epoch": 24} {"train_loss": -4.741402626037598, "global_step": 4152, "epoch": 24} {"train_loss": -5.015852928161621, "global_step": 4153, "epoch": 24} {"train_loss": -4.87957239151001, "global_step": 4154, "epoch": 24} {"train_loss": -5.065509796142578, "global_step": 4155, "epoch": 24} {"train_loss": -4.937350273132324, "global_step": 4156, "epoch": 24} {"train_loss": -4.467698097229004, "global_step": 4157, "epoch": 24} {"train_loss": -4.60535192489624, "global_step": 4158, "epoch": 24} {"train_loss": -4.616554260253906, "global_step": 4159, "epoch": 24} {"train_loss": -4.561603546142578, "global_step": 4160, "epoch": 24} {"train_loss": -4.846675872802734, "global_step": 4161, "epoch": 24} {"train_loss": -4.583142280578613, "global_step": 4162, "epoch": 24} {"train_loss": -4.2993693351745605, "global_step": 4163, "epoch": 24} {"train_loss": -4.77352237701416, "global_step": 4164, "epoch": 24} {"train_loss": -4.42758846282959, "global_step": 4165, "epoch": 24} {"train_loss": -4.461758613586426, "global_step": 4166, "epoch": 24} {"train_loss": -4.589260578155518, "global_step": 4167, "epoch": 24} {"train_loss": -4.287502288818359, "global_step": 4168, "epoch": 24} {"train_loss": -4.537735939025879, "global_step": 4169, "epoch": 24} {"train_loss": -4.59079647064209, "global_step": 4170, "epoch": 24} {"train_loss": -4.381504535675049, "global_step": 4171, "epoch": 24} {"train_loss": -4.529599666595459, "global_step": 4172, "epoch": 24} {"train_loss": -4.830924987792969, "global_step": 4173, "epoch": 24} {"train_loss": -4.556537628173828, "global_step": 4174, "epoch": 24} {"train_loss": -4.8333539962768555, "global_step": 4175, "epoch": 24} {"train_loss": -4.811386585235596, "global_step": 4176, "epoch": 24} {"train_loss": -4.629620552062988, "global_step": 4177, "epoch": 24} {"train_loss": -4.772822380065918, "global_step": 4178, "epoch": 24} {"train_loss": -4.96254825592041, "global_step": 4179, "epoch": 24} {"train_loss": -4.614141464233398, "global_step": 4180, "epoch": 24} {"train_loss": -4.884528636932373, "global_step": 4181, "epoch": 24} {"train_loss": -4.723569869995117, "global_step": 4182, "epoch": 24} {"train_loss": -5.0208659172058105, "global_step": 4183, "epoch": 24} {"train_loss": -4.743943691253662, "global_step": 4184, "epoch": 24} {"train_loss": -5.0169901847839355, "global_step": 4185, "epoch": 24} {"train_loss": -4.57627010345459, "global_step": 4186, "epoch": 24} {"train_loss": -4.764069557189941, "global_step": 4187, "epoch": 24} {"train_loss": -4.798561096191406, "global_step": 4188, "epoch": 24} {"train_loss": -4.814778804779053, "global_step": 4189, "epoch": 24} {"train_loss": -4.834500312805176, "global_step": 4190, "epoch": 24} {"train_loss": -5.010311126708984, "global_step": 4191, "epoch": 24} {"train_loss": -4.861546516418457, "global_step": 4192, "epoch": 24} {"train_loss": -4.913674354553223, "global_step": 4193, "epoch": 24} {"train_loss": -4.808320999145508, "global_step": 4194, "epoch": 24} {"train_loss": -4.838753700256348, "global_step": 4195, "epoch": 24} {"train_loss": -4.740417003631592, "global_step": 4196, "epoch": 24} {"train_loss": -4.998342990875244, "global_step": 4197, "epoch": 24} {"train_loss": -5.031744480133057, "global_step": 4198, "epoch": 24} {"train_loss": -4.727166822978428, "global_step": 4199, "epoch": 24, "val_loss": 276749.3125} {"train_loss": -4.536803722381592, "global_step": 4200, "epoch": 25} {"train_loss": -4.720818996429443, "global_step": 4201, "epoch": 25} {"train_loss": -4.748974323272705, "global_step": 4202, "epoch": 25} {"train_loss": -4.886219024658203, "global_step": 4203, "epoch": 25} {"train_loss": -4.690265655517578, "global_step": 4204, "epoch": 25} {"train_loss": -4.741269111633301, "global_step": 4205, "epoch": 25} {"train_loss": -4.7486677169799805, "global_step": 4206, "epoch": 25} {"train_loss": -4.4932780265808105, "global_step": 4207, "epoch": 25} {"train_loss": -4.571468353271484, "global_step": 4208, "epoch": 25} {"train_loss": -4.647595405578613, "global_step": 4209, "epoch": 25} {"train_loss": -4.680882453918457, "global_step": 4210, "epoch": 25} {"train_loss": -4.735918998718262, "global_step": 4211, "epoch": 25} {"train_loss": -4.726201057434082, "global_step": 4212, "epoch": 25} {"train_loss": -4.730663299560547, "global_step": 4213, "epoch": 25} {"train_loss": -4.766277313232422, "global_step": 4214, "epoch": 25} {"train_loss": -4.899891376495361, "global_step": 4215, "epoch": 25} {"train_loss": -4.800438404083252, "global_step": 4216, "epoch": 25} {"train_loss": -4.79670524597168, "global_step": 4217, "epoch": 25} {"train_loss": -4.768960952758789, "global_step": 4218, "epoch": 25} {"train_loss": -4.711528778076172, "global_step": 4219, "epoch": 25} {"train_loss": -4.700188636779785, "global_step": 4220, "epoch": 25} {"train_loss": -4.834735870361328, "global_step": 4221, "epoch": 25} {"train_loss": -4.861758232116699, "global_step": 4222, "epoch": 25} {"train_loss": -4.946568012237549, "global_step": 4223, "epoch": 25} {"train_loss": -4.926592826843262, "global_step": 4224, "epoch": 25} {"train_loss": -4.821907997131348, "global_step": 4225, "epoch": 25} {"train_loss": -4.777024745941162, "global_step": 4226, "epoch": 25} {"train_loss": -4.705661296844482, "global_step": 4227, "epoch": 25} {"train_loss": -4.419008731842041, "global_step": 4228, "epoch": 25} {"train_loss": -4.86761999130249, "global_step": 4229, "epoch": 25} {"train_loss": -4.6964521408081055, "global_step": 4230, "epoch": 25} {"train_loss": -4.879518508911133, "global_step": 4231, "epoch": 25} {"train_loss": -4.689650058746338, "global_step": 4232, "epoch": 25} {"train_loss": -4.773965358734131, "global_step": 4233, "epoch": 25} {"train_loss": -4.451543807983398, "global_step": 4234, "epoch": 25} {"train_loss": -4.6126251220703125, "global_step": 4235, "epoch": 25} {"train_loss": -4.927722930908203, "global_step": 4236, "epoch": 25} {"train_loss": -4.738330364227295, "global_step": 4237, "epoch": 25} {"train_loss": -4.539960861206055, "global_step": 4238, "epoch": 25} {"train_loss": -4.89399528503418, "global_step": 4239, "epoch": 25} {"train_loss": -4.709688186645508, "global_step": 4240, "epoch": 25} {"train_loss": -4.898719310760498, "global_step": 4241, "epoch": 25} {"train_loss": -4.822351455688477, "global_step": 4242, "epoch": 25} {"train_loss": -4.519706726074219, "global_step": 4243, "epoch": 25} {"train_loss": -4.953738212585449, "global_step": 4244, "epoch": 25} {"train_loss": -4.626125335693359, "global_step": 4245, "epoch": 25} {"train_loss": -4.991138458251953, "global_step": 4246, "epoch": 25} {"train_loss": -4.548370361328125, "global_step": 4247, "epoch": 25} {"train_loss": -4.9540534019470215, "global_step": 4248, "epoch": 25} {"train_loss": -4.886125564575195, "global_step": 4249, "epoch": 25} {"train_loss": -4.708639144897461, "global_step": 4250, "epoch": 25} {"train_loss": -4.943375587463379, "global_step": 4251, "epoch": 25} {"train_loss": -5.054365158081055, "global_step": 4252, "epoch": 25} {"train_loss": -4.983116626739502, "global_step": 4253, "epoch": 25} {"train_loss": -4.869879722595215, "global_step": 4254, "epoch": 25} {"train_loss": -5.049424648284912, "global_step": 4255, "epoch": 25} {"train_loss": -4.784822463989258, "global_step": 4256, "epoch": 25} {"train_loss": -4.803977966308594, "global_step": 4257, "epoch": 25} {"train_loss": -4.841239929199219, "global_step": 4258, "epoch": 25} {"train_loss": -4.855659008026123, "global_step": 4259, "epoch": 25} {"train_loss": -4.709577560424805, "global_step": 4260, "epoch": 25} {"train_loss": -4.821234703063965, "global_step": 4261, "epoch": 25} {"train_loss": -4.81959867477417, "global_step": 4262, "epoch": 25} {"train_loss": -4.949367046356201, "global_step": 4263, "epoch": 25} {"train_loss": -4.9254255294799805, "global_step": 4264, "epoch": 25} {"train_loss": -4.700044631958008, "global_step": 4265, "epoch": 25} {"train_loss": -4.694297790527344, "global_step": 4266, "epoch": 25} {"train_loss": -4.4154205322265625, "global_step": 4267, "epoch": 25} {"train_loss": -4.5667724609375, "global_step": 4268, "epoch": 25} {"train_loss": -4.382611274719238, "global_step": 4269, "epoch": 25} {"train_loss": -4.246845722198486, "global_step": 4270, "epoch": 25} {"train_loss": -4.5166850090026855, "global_step": 4271, "epoch": 25} {"train_loss": -4.586635589599609, "global_step": 4272, "epoch": 25} {"train_loss": -4.548443794250488, "global_step": 4273, "epoch": 25} {"train_loss": -5.035470962524414, "global_step": 4274, "epoch": 25} {"train_loss": -4.665953636169434, "global_step": 4275, "epoch": 25} {"train_loss": -4.637772560119629, "global_step": 4276, "epoch": 25} {"train_loss": -4.631381034851074, "global_step": 4277, "epoch": 25} {"train_loss": -4.359192848205566, "global_step": 4278, "epoch": 25} {"train_loss": -4.621890068054199, "global_step": 4279, "epoch": 25} {"train_loss": -4.8044939041137695, "global_step": 4280, "epoch": 25} {"train_loss": -4.554491996765137, "global_step": 4281, "epoch": 25} {"train_loss": -4.962077617645264, "global_step": 4282, "epoch": 25} {"train_loss": -4.828392028808594, "global_step": 4283, "epoch": 25} {"train_loss": -4.732670783996582, "global_step": 4284, "epoch": 25} {"train_loss": -5.089245796203613, "global_step": 4285, "epoch": 25} {"train_loss": -4.635422706604004, "global_step": 4286, "epoch": 25} {"train_loss": -4.591219902038574, "global_step": 4287, "epoch": 25} {"train_loss": -4.737203598022461, "global_step": 4288, "epoch": 25} {"train_loss": -4.599169731140137, "global_step": 4289, "epoch": 25} {"train_loss": -4.844027519226074, "global_step": 4290, "epoch": 25} {"train_loss": -4.60579776763916, "global_step": 4291, "epoch": 25} {"train_loss": -4.852656364440918, "global_step": 4292, "epoch": 25} {"train_loss": -5.033621788024902, "global_step": 4293, "epoch": 25} {"train_loss": -4.671750068664551, "global_step": 4294, "epoch": 25} {"train_loss": -4.65186882019043, "global_step": 4295, "epoch": 25} {"train_loss": -4.813647270202637, "global_step": 4296, "epoch": 25} {"train_loss": -4.83585262298584, "global_step": 4297, "epoch": 25} {"train_loss": -4.699593544006348, "global_step": 4298, "epoch": 25} {"train_loss": -4.993386268615723, "global_step": 4299, "epoch": 25} {"train_loss": -5.056015968322754, "global_step": 4300, "epoch": 25} {"train_loss": -4.769739151000977, "global_step": 4301, "epoch": 25} {"train_loss": -4.7905426025390625, "global_step": 4302, "epoch": 25} {"train_loss": -4.766830921173096, "global_step": 4303, "epoch": 25} {"train_loss": -4.959776878356934, "global_step": 4304, "epoch": 25} {"train_loss": -4.672986030578613, "global_step": 4305, "epoch": 25} {"train_loss": -4.798398494720459, "global_step": 4306, "epoch": 25} {"train_loss": -4.971560001373291, "global_step": 4307, "epoch": 25} {"train_loss": -4.970551490783691, "global_step": 4308, "epoch": 25} {"train_loss": -4.965212821960449, "global_step": 4309, "epoch": 25} {"train_loss": -4.82042121887207, "global_step": 4310, "epoch": 25} {"train_loss": -4.729243278503418, "global_step": 4311, "epoch": 25} {"train_loss": -4.817835807800293, "global_step": 4312, "epoch": 25} {"train_loss": -4.8608174324035645, "global_step": 4313, "epoch": 25} {"train_loss": -4.728995323181152, "global_step": 4314, "epoch": 25} {"train_loss": -4.889370441436768, "global_step": 4315, "epoch": 25} {"train_loss": -4.849643707275391, "global_step": 4316, "epoch": 25} {"train_loss": -4.7024736404418945, "global_step": 4317, "epoch": 25} {"train_loss": -4.497803688049316, "global_step": 4318, "epoch": 25} {"train_loss": -4.730324745178223, "global_step": 4319, "epoch": 25} {"train_loss": -4.795734405517578, "global_step": 4320, "epoch": 25} {"train_loss": -4.649873733520508, "global_step": 4321, "epoch": 25} {"train_loss": -4.673412322998047, "global_step": 4322, "epoch": 25} {"train_loss": -4.709802627563477, "global_step": 4323, "epoch": 25} {"train_loss": -4.912860870361328, "global_step": 4324, "epoch": 25} {"train_loss": -4.70530891418457, "global_step": 4325, "epoch": 25} {"train_loss": -4.899608612060547, "global_step": 4326, "epoch": 25} {"train_loss": -4.748307228088379, "global_step": 4327, "epoch": 25} {"train_loss": -4.468775749206543, "global_step": 4328, "epoch": 25} {"train_loss": -4.950483322143555, "global_step": 4329, "epoch": 25} {"train_loss": -4.803835868835449, "global_step": 4330, "epoch": 25} {"train_loss": -4.817598819732666, "global_step": 4331, "epoch": 25} {"train_loss": -4.929722785949707, "global_step": 4332, "epoch": 25} {"train_loss": -4.88799524307251, "global_step": 4333, "epoch": 25} {"train_loss": -4.687568664550781, "global_step": 4334, "epoch": 25} {"train_loss": -4.525033473968506, "global_step": 4335, "epoch": 25} {"train_loss": -4.721606731414795, "global_step": 4336, "epoch": 25} {"train_loss": -4.5911054611206055, "global_step": 4337, "epoch": 25} {"train_loss": -4.736800193786621, "global_step": 4338, "epoch": 25} {"train_loss": -4.803226470947266, "global_step": 4339, "epoch": 25} {"train_loss": -4.413235664367676, "global_step": 4340, "epoch": 25} {"train_loss": -4.714171409606934, "global_step": 4341, "epoch": 25} {"train_loss": -4.720253944396973, "global_step": 4342, "epoch": 25} {"train_loss": -4.760730743408203, "global_step": 4343, "epoch": 25} {"train_loss": -4.657210350036621, "global_step": 4344, "epoch": 25} {"train_loss": -4.597780227661133, "global_step": 4345, "epoch": 25} {"train_loss": -4.4327898025512695, "global_step": 4346, "epoch": 25} {"train_loss": -4.667346954345703, "global_step": 4347, "epoch": 25} {"train_loss": -4.8125128746032715, "global_step": 4348, "epoch": 25} {"train_loss": -4.347527027130127, "global_step": 4349, "epoch": 25} {"train_loss": -4.802062034606934, "global_step": 4350, "epoch": 25} {"train_loss": -4.642561912536621, "global_step": 4351, "epoch": 25} {"train_loss": -4.563050270080566, "global_step": 4352, "epoch": 25} {"train_loss": -4.920844554901123, "global_step": 4353, "epoch": 25} {"train_loss": -4.628207206726074, "global_step": 4354, "epoch": 25} {"train_loss": -4.473127365112305, "global_step": 4355, "epoch": 25} {"train_loss": -4.963411808013916, "global_step": 4356, "epoch": 25} {"train_loss": -4.278829574584961, "global_step": 4357, "epoch": 25} {"train_loss": -4.546299934387207, "global_step": 4358, "epoch": 25} {"train_loss": -4.712680339813232, "global_step": 4359, "epoch": 25} {"train_loss": -4.786443710327148, "global_step": 4360, "epoch": 25} {"train_loss": -4.273459434509277, "global_step": 4361, "epoch": 25} {"train_loss": -4.878017425537109, "global_step": 4362, "epoch": 25} {"train_loss": -4.613664150238037, "global_step": 4363, "epoch": 25} {"train_loss": -4.762298583984375, "global_step": 4364, "epoch": 25} {"train_loss": -4.614377021789551, "global_step": 4365, "epoch": 25} {"train_loss": -4.885007858276367, "global_step": 4366, "epoch": 25} {"train_loss": -4.738674410751888, "global_step": 4367, "epoch": 25, "val_loss": 261438.90625, "train_action_mse_error": 75.20230102539062} {"train_loss": -4.763487815856934, "global_step": 4368, "epoch": 26} {"train_loss": -5.085918426513672, "global_step": 4369, "epoch": 26} {"train_loss": -4.8607635498046875, "global_step": 4370, "epoch": 26} {"train_loss": -4.992392539978027, "global_step": 4371, "epoch": 26} {"train_loss": -4.806526184082031, "global_step": 4372, "epoch": 26} {"train_loss": -5.090452194213867, "global_step": 4373, "epoch": 26} {"train_loss": -4.792447566986084, "global_step": 4374, "epoch": 26} {"train_loss": -4.886140823364258, "global_step": 4375, "epoch": 26} {"train_loss": -4.804925918579102, "global_step": 4376, "epoch": 26} {"train_loss": -4.71502685546875, "global_step": 4377, "epoch": 26} {"train_loss": -4.880121231079102, "global_step": 4378, "epoch": 26} {"train_loss": -4.956836700439453, "global_step": 4379, "epoch": 26} {"train_loss": -4.880998611450195, "global_step": 4380, "epoch": 26} {"train_loss": -5.071423053741455, "global_step": 4381, "epoch": 26} {"train_loss": -4.89803409576416, "global_step": 4382, "epoch": 26} {"train_loss": -4.763432502746582, "global_step": 4383, "epoch": 26} {"train_loss": -5.0287041664123535, "global_step": 4384, "epoch": 26} {"train_loss": -4.743626594543457, "global_step": 4385, "epoch": 26} {"train_loss": -4.924064636230469, "global_step": 4386, "epoch": 26} {"train_loss": -4.787020683288574, "global_step": 4387, "epoch": 26} {"train_loss": -4.598844051361084, "global_step": 4388, "epoch": 26} {"train_loss": -4.8253326416015625, "global_step": 4389, "epoch": 26} {"train_loss": -4.895111083984375, "global_step": 4390, "epoch": 26} {"train_loss": -4.947663307189941, "global_step": 4391, "epoch": 26} {"train_loss": -5.001694679260254, "global_step": 4392, "epoch": 26} {"train_loss": -4.994241714477539, "global_step": 4393, "epoch": 26} {"train_loss": -4.503421783447266, "global_step": 4394, "epoch": 26} {"train_loss": -4.988934516906738, "global_step": 4395, "epoch": 26} {"train_loss": -5.1794939041137695, "global_step": 4396, "epoch": 26} {"train_loss": -4.820407390594482, "global_step": 4397, "epoch": 26} {"train_loss": -4.8502607345581055, "global_step": 4398, "epoch": 26} {"train_loss": -4.894932270050049, "global_step": 4399, "epoch": 26} {"train_loss": -5.10687255859375, "global_step": 4400, "epoch": 26} {"train_loss": -4.988034725189209, "global_step": 4401, "epoch": 26} {"train_loss": -4.990567207336426, "global_step": 4402, "epoch": 26} {"train_loss": -4.618796348571777, "global_step": 4403, "epoch": 26} {"train_loss": -5.030198097229004, "global_step": 4404, "epoch": 26} {"train_loss": -4.603043556213379, "global_step": 4405, "epoch": 26} {"train_loss": -4.888276100158691, "global_step": 4406, "epoch": 26} {"train_loss": -4.899329662322998, "global_step": 4407, "epoch": 26} {"train_loss": -4.750820159912109, "global_step": 4408, "epoch": 26} {"train_loss": -4.973895072937012, "global_step": 4409, "epoch": 26} {"train_loss": -4.803217887878418, "global_step": 4410, "epoch": 26} {"train_loss": -4.519667625427246, "global_step": 4411, "epoch": 26} {"train_loss": -5.199787616729736, "global_step": 4412, "epoch": 26} {"train_loss": -4.726799964904785, "global_step": 4413, "epoch": 26} {"train_loss": -4.877869606018066, "global_step": 4414, "epoch": 26} {"train_loss": -4.841535568237305, "global_step": 4415, "epoch": 26} {"train_loss": -4.788156509399414, "global_step": 4416, "epoch": 26} {"train_loss": -4.72872257232666, "global_step": 4417, "epoch": 26} {"train_loss": -4.9621052742004395, "global_step": 4418, "epoch": 26} {"train_loss": -5.005956649780273, "global_step": 4419, "epoch": 26} {"train_loss": -4.905389785766602, "global_step": 4420, "epoch": 26} {"train_loss": -4.716622352600098, "global_step": 4421, "epoch": 26} {"train_loss": -4.745453834533691, "global_step": 4422, "epoch": 26} {"train_loss": -4.766942977905273, "global_step": 4423, "epoch": 26} {"train_loss": -5.017143726348877, "global_step": 4424, "epoch": 26} {"train_loss": -4.89495849609375, "global_step": 4425, "epoch": 26} {"train_loss": -4.673520088195801, "global_step": 4426, "epoch": 26} {"train_loss": -4.898056983947754, "global_step": 4427, "epoch": 26} {"train_loss": -4.826685905456543, "global_step": 4428, "epoch": 26} {"train_loss": -4.826194763183594, "global_step": 4429, "epoch": 26} {"train_loss": -4.84200382232666, "global_step": 4430, "epoch": 26} {"train_loss": -4.960387229919434, "global_step": 4431, "epoch": 26} {"train_loss": -4.815214157104492, "global_step": 4432, "epoch": 26} {"train_loss": -4.771030426025391, "global_step": 4433, "epoch": 26} {"train_loss": -5.025163650512695, "global_step": 4434, "epoch": 26} {"train_loss": -4.6001129150390625, "global_step": 4435, "epoch": 26} {"train_loss": -4.766629695892334, "global_step": 4436, "epoch": 26} {"train_loss": -4.042108535766602, "global_step": 4437, "epoch": 26} {"train_loss": -5.041872024536133, "global_step": 4438, "epoch": 26} {"train_loss": -4.711791038513184, "global_step": 4439, "epoch": 26} {"train_loss": -4.695082664489746, "global_step": 4440, "epoch": 26} {"train_loss": -4.714313507080078, "global_step": 4441, "epoch": 26} {"train_loss": -4.5420308113098145, "global_step": 4442, "epoch": 26} {"train_loss": -4.767837047576904, "global_step": 4443, "epoch": 26} {"train_loss": -4.7961835861206055, "global_step": 4444, "epoch": 26} {"train_loss": -4.653660774230957, "global_step": 4445, "epoch": 26} {"train_loss": -4.823557376861572, "global_step": 4446, "epoch": 26} {"train_loss": -5.0033159255981445, "global_step": 4447, "epoch": 26} {"train_loss": -4.558306694030762, "global_step": 4448, "epoch": 26} {"train_loss": -4.818060874938965, "global_step": 4449, "epoch": 26} {"train_loss": -4.868475437164307, "global_step": 4450, "epoch": 26} {"train_loss": -4.7708048820495605, "global_step": 4451, "epoch": 26} {"train_loss": -4.879202365875244, "global_step": 4452, "epoch": 26} {"train_loss": -4.711451530456543, "global_step": 4453, "epoch": 26} {"train_loss": -4.740570068359375, "global_step": 4454, "epoch": 26} {"train_loss": -4.944765567779541, "global_step": 4455, "epoch": 26} {"train_loss": -4.632137298583984, "global_step": 4456, "epoch": 26} {"train_loss": -4.763956546783447, "global_step": 4457, "epoch": 26} {"train_loss": -4.782966613769531, "global_step": 4458, "epoch": 26} {"train_loss": -4.724410057067871, "global_step": 4459, "epoch": 26} {"train_loss": -4.854937553405762, "global_step": 4460, "epoch": 26} {"train_loss": -4.3327507972717285, "global_step": 4461, "epoch": 26} {"train_loss": -4.794000625610352, "global_step": 4462, "epoch": 26} {"train_loss": -4.596137046813965, "global_step": 4463, "epoch": 26} {"train_loss": -4.430544376373291, "global_step": 4464, "epoch": 26} {"train_loss": -4.8379058837890625, "global_step": 4465, "epoch": 26} {"train_loss": -4.643690586090088, "global_step": 4466, "epoch": 26} {"train_loss": -4.567929744720459, "global_step": 4467, "epoch": 26} {"train_loss": -4.961861610412598, "global_step": 4468, "epoch": 26} {"train_loss": -4.348385810852051, "global_step": 4469, "epoch": 26} {"train_loss": -4.70233154296875, "global_step": 4470, "epoch": 26} {"train_loss": -4.909924507141113, "global_step": 4471, "epoch": 26} {"train_loss": -4.723360061645508, "global_step": 4472, "epoch": 26} {"train_loss": -4.5985517501831055, "global_step": 4473, "epoch": 26} {"train_loss": -4.875866889953613, "global_step": 4474, "epoch": 26} {"train_loss": -4.737995147705078, "global_step": 4475, "epoch": 26} {"train_loss": -4.751922607421875, "global_step": 4476, "epoch": 26} {"train_loss": -4.86048698425293, "global_step": 4477, "epoch": 26} {"train_loss": -4.813880443572998, "global_step": 4478, "epoch": 26} {"train_loss": -4.818144798278809, "global_step": 4479, "epoch": 26} {"train_loss": -4.912790298461914, "global_step": 4480, "epoch": 26} {"train_loss": -4.80391788482666, "global_step": 4481, "epoch": 26} {"train_loss": -4.937198162078857, "global_step": 4482, "epoch": 26} {"train_loss": -4.866282939910889, "global_step": 4483, "epoch": 26} {"train_loss": -4.796841144561768, "global_step": 4484, "epoch": 26} {"train_loss": -4.657608985900879, "global_step": 4485, "epoch": 26} {"train_loss": -4.877817630767822, "global_step": 4486, "epoch": 26} {"train_loss": -4.828807353973389, "global_step": 4487, "epoch": 26} {"train_loss": -4.947270393371582, "global_step": 4488, "epoch": 26} {"train_loss": -4.903943061828613, "global_step": 4489, "epoch": 26} {"train_loss": -4.783926010131836, "global_step": 4490, "epoch": 26} {"train_loss": -4.757863998413086, "global_step": 4491, "epoch": 26} {"train_loss": -4.7828850746154785, "global_step": 4492, "epoch": 26} {"train_loss": -4.983924388885498, "global_step": 4493, "epoch": 26} {"train_loss": -4.9250335693359375, "global_step": 4494, "epoch": 26} {"train_loss": -4.803068161010742, "global_step": 4495, "epoch": 26} {"train_loss": -4.964363098144531, "global_step": 4496, "epoch": 26} {"train_loss": -4.528487682342529, "global_step": 4497, "epoch": 26} {"train_loss": -4.935493469238281, "global_step": 4498, "epoch": 26} {"train_loss": -4.898048400878906, "global_step": 4499, "epoch": 26} {"train_loss": -5.030844688415527, "global_step": 4500, "epoch": 26} {"train_loss": -4.779058456420898, "global_step": 4501, "epoch": 26} {"train_loss": -4.749115943908691, "global_step": 4502, "epoch": 26} {"train_loss": -4.839738368988037, "global_step": 4503, "epoch": 26} {"train_loss": -4.732734680175781, "global_step": 4504, "epoch": 26} {"train_loss": -4.759578704833984, "global_step": 4505, "epoch": 26} {"train_loss": -4.887122631072998, "global_step": 4506, "epoch": 26} {"train_loss": -4.702853679656982, "global_step": 4507, "epoch": 26} {"train_loss": -4.831871509552002, "global_step": 4508, "epoch": 26} {"train_loss": -4.425924301147461, "global_step": 4509, "epoch": 26} {"train_loss": -4.8938140869140625, "global_step": 4510, "epoch": 26} {"train_loss": -4.895773410797119, "global_step": 4511, "epoch": 26} {"train_loss": -4.998521327972412, "global_step": 4512, "epoch": 26} {"train_loss": -4.771024227142334, "global_step": 4513, "epoch": 26} {"train_loss": -4.981313705444336, "global_step": 4514, "epoch": 26} {"train_loss": -5.026270866394043, "global_step": 4515, "epoch": 26} {"train_loss": -4.869126319885254, "global_step": 4516, "epoch": 26} {"train_loss": -4.872697830200195, "global_step": 4517, "epoch": 26} {"train_loss": -4.433795928955078, "global_step": 4518, "epoch": 26} {"train_loss": -4.979092597961426, "global_step": 4519, "epoch": 26} {"train_loss": -4.802116870880127, "global_step": 4520, "epoch": 26} {"train_loss": -4.776934623718262, "global_step": 4521, "epoch": 26} {"train_loss": -4.846639156341553, "global_step": 4522, "epoch": 26} {"train_loss": -4.824799537658691, "global_step": 4523, "epoch": 26} {"train_loss": -4.963222026824951, "global_step": 4524, "epoch": 26} {"train_loss": -5.031580448150635, "global_step": 4525, "epoch": 26} {"train_loss": -4.835690498352051, "global_step": 4526, "epoch": 26} {"train_loss": -5.284759521484375, "global_step": 4527, "epoch": 26} {"train_loss": -4.796914100646973, "global_step": 4528, "epoch": 26} {"train_loss": -4.964235305786133, "global_step": 4529, "epoch": 26} {"train_loss": -4.788719177246094, "global_step": 4530, "epoch": 26} {"train_loss": -4.786280632019043, "global_step": 4531, "epoch": 26} {"train_loss": -4.53068733215332, "global_step": 4532, "epoch": 26} {"train_loss": -4.86472225189209, "global_step": 4533, "epoch": 26} {"train_loss": -4.602060317993164, "global_step": 4534, "epoch": 26} {"train_loss": -4.820926981312888, "global_step": 4535, "epoch": 26, "val_loss": 262942.53125} {"train_loss": -4.680269241333008, "global_step": 4536, "epoch": 27} {"train_loss": -4.785664081573486, "global_step": 4537, "epoch": 27} {"train_loss": -4.627650260925293, "global_step": 4538, "epoch": 27} {"train_loss": -5.021421432495117, "global_step": 4539, "epoch": 27} {"train_loss": -4.724440574645996, "global_step": 4540, "epoch": 27} {"train_loss": -4.761712074279785, "global_step": 4541, "epoch": 27} {"train_loss": -4.799373626708984, "global_step": 4542, "epoch": 27} {"train_loss": -4.8769330978393555, "global_step": 4543, "epoch": 27} {"train_loss": -4.663955211639404, "global_step": 4544, "epoch": 27} {"train_loss": -4.336411476135254, "global_step": 4545, "epoch": 27} {"train_loss": -4.734679698944092, "global_step": 4546, "epoch": 27} {"train_loss": -4.630373001098633, "global_step": 4547, "epoch": 27} {"train_loss": -4.442449569702148, "global_step": 4548, "epoch": 27} {"train_loss": -4.889020919799805, "global_step": 4549, "epoch": 27} {"train_loss": -4.878377914428711, "global_step": 4550, "epoch": 27} {"train_loss": -4.462942123413086, "global_step": 4551, "epoch": 27} {"train_loss": -4.732874870300293, "global_step": 4552, "epoch": 27} {"train_loss": -4.893038749694824, "global_step": 4553, "epoch": 27} {"train_loss": -4.973889350891113, "global_step": 4554, "epoch": 27} {"train_loss": -5.062013626098633, "global_step": 4555, "epoch": 27} {"train_loss": -4.700547218322754, "global_step": 4556, "epoch": 27} {"train_loss": -5.127933502197266, "global_step": 4557, "epoch": 27} {"train_loss": -5.306368827819824, "global_step": 4558, "epoch": 27} {"train_loss": -5.0549163818359375, "global_step": 4559, "epoch": 27} {"train_loss": -4.824522495269775, "global_step": 4560, "epoch": 27} {"train_loss": -5.09520959854126, "global_step": 4561, "epoch": 27} {"train_loss": -5.068580627441406, "global_step": 4562, "epoch": 27} {"train_loss": -5.023533344268799, "global_step": 4563, "epoch": 27} {"train_loss": -5.1476969718933105, "global_step": 4564, "epoch": 27} {"train_loss": -4.677863597869873, "global_step": 4565, "epoch": 27} {"train_loss": -4.961858749389648, "global_step": 4566, "epoch": 27} {"train_loss": -4.797976493835449, "global_step": 4567, "epoch": 27} {"train_loss": -5.127359390258789, "global_step": 4568, "epoch": 27} {"train_loss": -4.928301811218262, "global_step": 4569, "epoch": 27} {"train_loss": -4.989291667938232, "global_step": 4570, "epoch": 27} {"train_loss": -4.939326286315918, "global_step": 4571, "epoch": 27} {"train_loss": -4.964669227600098, "global_step": 4572, "epoch": 27} {"train_loss": -4.762575149536133, "global_step": 4573, "epoch": 27} {"train_loss": -4.599008560180664, "global_step": 4574, "epoch": 27} {"train_loss": -4.874924659729004, "global_step": 4575, "epoch": 27} {"train_loss": -4.668778896331787, "global_step": 4576, "epoch": 27} {"train_loss": -4.791184425354004, "global_step": 4577, "epoch": 27} {"train_loss": -5.1641130447387695, "global_step": 4578, "epoch": 27} {"train_loss": -4.836663246154785, "global_step": 4579, "epoch": 27} {"train_loss": -4.839914798736572, "global_step": 4580, "epoch": 27} {"train_loss": -4.9712324142456055, "global_step": 4581, "epoch": 27} {"train_loss": -5.0280280113220215, "global_step": 4582, "epoch": 27} {"train_loss": -5.1328253746032715, "global_step": 4583, "epoch": 27} {"train_loss": -4.987843036651611, "global_step": 4584, "epoch": 27} {"train_loss": -4.927354335784912, "global_step": 4585, "epoch": 27} {"train_loss": -5.006834983825684, "global_step": 4586, "epoch": 27} {"train_loss": -5.175652980804443, "global_step": 4587, "epoch": 27} {"train_loss": -4.92699670791626, "global_step": 4588, "epoch": 27} {"train_loss": -4.996682643890381, "global_step": 4589, "epoch": 27} {"train_loss": -4.663677215576172, "global_step": 4590, "epoch": 27} {"train_loss": -5.016942977905273, "global_step": 4591, "epoch": 27} {"train_loss": -4.551694393157959, "global_step": 4592, "epoch": 27} {"train_loss": -4.91159725189209, "global_step": 4593, "epoch": 27} {"train_loss": -4.52077579498291, "global_step": 4594, "epoch": 27} {"train_loss": -4.635473251342773, "global_step": 4595, "epoch": 27} {"train_loss": -4.897525310516357, "global_step": 4596, "epoch": 27} {"train_loss": -4.820568561553955, "global_step": 4597, "epoch": 27} {"train_loss": -4.978374481201172, "global_step": 4598, "epoch": 27} {"train_loss": -4.918411731719971, "global_step": 4599, "epoch": 27} {"train_loss": -4.918787479400635, "global_step": 4600, "epoch": 27} {"train_loss": -4.827008247375488, "global_step": 4601, "epoch": 27} {"train_loss": -4.893909454345703, "global_step": 4602, "epoch": 27} {"train_loss": -4.832942962646484, "global_step": 4603, "epoch": 27} {"train_loss": -4.752614974975586, "global_step": 4604, "epoch": 27} {"train_loss": -4.951757907867432, "global_step": 4605, "epoch": 27} {"train_loss": -4.88918399810791, "global_step": 4606, "epoch": 27} {"train_loss": -4.806853294372559, "global_step": 4607, "epoch": 27} {"train_loss": -4.673775672912598, "global_step": 4608, "epoch": 27} {"train_loss": -4.869228363037109, "global_step": 4609, "epoch": 27} {"train_loss": -4.714193344116211, "global_step": 4610, "epoch": 27} {"train_loss": -5.122165679931641, "global_step": 4611, "epoch": 27} {"train_loss": -4.711313247680664, "global_step": 4612, "epoch": 27} {"train_loss": -4.796985626220703, "global_step": 4613, "epoch": 27} {"train_loss": -4.8916015625, "global_step": 4614, "epoch": 27} {"train_loss": -4.875493049621582, "global_step": 4615, "epoch": 27} {"train_loss": -4.803134441375732, "global_step": 4616, "epoch": 27} {"train_loss": -5.181960105895996, "global_step": 4617, "epoch": 27} {"train_loss": -4.723911762237549, "global_step": 4618, "epoch": 27} {"train_loss": -4.755863666534424, "global_step": 4619, "epoch": 27} {"train_loss": -4.891598224639893, "global_step": 4620, "epoch": 27} {"train_loss": -5.123331069946289, "global_step": 4621, "epoch": 27} {"train_loss": -5.215142250061035, "global_step": 4622, "epoch": 27} {"train_loss": -4.961599349975586, "global_step": 4623, "epoch": 27} {"train_loss": -4.735125541687012, "global_step": 4624, "epoch": 27} {"train_loss": -4.883563041687012, "global_step": 4625, "epoch": 27} {"train_loss": -4.782564640045166, "global_step": 4626, "epoch": 27} {"train_loss": -5.045729637145996, "global_step": 4627, "epoch": 27} {"train_loss": -5.010486602783203, "global_step": 4628, "epoch": 27} {"train_loss": -5.034384727478027, "global_step": 4629, "epoch": 27} {"train_loss": -4.945491790771484, "global_step": 4630, "epoch": 27} {"train_loss": -4.303584098815918, "global_step": 4631, "epoch": 27} {"train_loss": -5.087096691131592, "global_step": 4632, "epoch": 27} {"train_loss": -5.001432418823242, "global_step": 4633, "epoch": 27} {"train_loss": -5.030667304992676, "global_step": 4634, "epoch": 27} {"train_loss": -4.949972152709961, "global_step": 4635, "epoch": 27} {"train_loss": -5.144892692565918, "global_step": 4636, "epoch": 27} {"train_loss": -4.776729106903076, "global_step": 4637, "epoch": 27} {"train_loss": -5.123537540435791, "global_step": 4638, "epoch": 27} {"train_loss": -5.279599189758301, "global_step": 4639, "epoch": 27} {"train_loss": -4.871621131896973, "global_step": 4640, "epoch": 27} {"train_loss": -5.002695083618164, "global_step": 4641, "epoch": 27} {"train_loss": -5.057474613189697, "global_step": 4642, "epoch": 27} {"train_loss": -5.0800886154174805, "global_step": 4643, "epoch": 27} {"train_loss": -5.042550563812256, "global_step": 4644, "epoch": 27} {"train_loss": -4.787600517272949, "global_step": 4645, "epoch": 27} {"train_loss": -4.709420204162598, "global_step": 4646, "epoch": 27} {"train_loss": -4.392939567565918, "global_step": 4647, "epoch": 27} {"train_loss": -4.990264892578125, "global_step": 4648, "epoch": 27} {"train_loss": -4.59912109375, "global_step": 4649, "epoch": 27} {"train_loss": -4.933524131774902, "global_step": 4650, "epoch": 27} {"train_loss": -4.930123329162598, "global_step": 4651, "epoch": 27} {"train_loss": -4.587563514709473, "global_step": 4652, "epoch": 27} {"train_loss": -4.941402435302734, "global_step": 4653, "epoch": 27} {"train_loss": -4.87706184387207, "global_step": 4654, "epoch": 27} {"train_loss": -4.849562168121338, "global_step": 4655, "epoch": 27} {"train_loss": -4.878668308258057, "global_step": 4656, "epoch": 27} {"train_loss": -4.738984107971191, "global_step": 4657, "epoch": 27} {"train_loss": -4.584643363952637, "global_step": 4658, "epoch": 27} {"train_loss": -4.666079521179199, "global_step": 4659, "epoch": 27} {"train_loss": -4.775693893432617, "global_step": 4660, "epoch": 27} {"train_loss": -4.710524559020996, "global_step": 4661, "epoch": 27} {"train_loss": -4.449174880981445, "global_step": 4662, "epoch": 27} {"train_loss": -5.034278869628906, "global_step": 4663, "epoch": 27} {"train_loss": -4.549311637878418, "global_step": 4664, "epoch": 27} {"train_loss": -4.6941022872924805, "global_step": 4665, "epoch": 27} {"train_loss": -4.961481094360352, "global_step": 4666, "epoch": 27} {"train_loss": -4.795692443847656, "global_step": 4667, "epoch": 27} {"train_loss": -4.973358154296875, "global_step": 4668, "epoch": 27} {"train_loss": -4.997991561889648, "global_step": 4669, "epoch": 27} {"train_loss": -4.654412269592285, "global_step": 4670, "epoch": 27} {"train_loss": -4.848540306091309, "global_step": 4671, "epoch": 27} {"train_loss": -5.063447952270508, "global_step": 4672, "epoch": 27} {"train_loss": -4.964146614074707, "global_step": 4673, "epoch": 27} {"train_loss": -4.97916316986084, "global_step": 4674, "epoch": 27} {"train_loss": -5.038918495178223, "global_step": 4675, "epoch": 27} {"train_loss": -4.692119598388672, "global_step": 4676, "epoch": 27} {"train_loss": -4.685212135314941, "global_step": 4677, "epoch": 27} {"train_loss": -4.733665943145752, "global_step": 4678, "epoch": 27} {"train_loss": -4.831438064575195, "global_step": 4679, "epoch": 27} {"train_loss": -4.811703681945801, "global_step": 4680, "epoch": 27} {"train_loss": -5.035552501678467, "global_step": 4681, "epoch": 27} {"train_loss": -4.86391019821167, "global_step": 4682, "epoch": 27} {"train_loss": -4.800755500793457, "global_step": 4683, "epoch": 27} {"train_loss": -4.7716522216796875, "global_step": 4684, "epoch": 27} {"train_loss": -5.034391403198242, "global_step": 4685, "epoch": 27} {"train_loss": -5.053445339202881, "global_step": 4686, "epoch": 27} {"train_loss": -4.798961639404297, "global_step": 4687, "epoch": 27} {"train_loss": -5.141299247741699, "global_step": 4688, "epoch": 27} {"train_loss": -5.0038676261901855, "global_step": 4689, "epoch": 27} {"train_loss": -4.895277976989746, "global_step": 4690, "epoch": 27} {"train_loss": -4.864463806152344, "global_step": 4691, "epoch": 27} {"train_loss": -4.944802284240723, "global_step": 4692, "epoch": 27} {"train_loss": -5.22605037689209, "global_step": 4693, "epoch": 27} {"train_loss": -4.884641647338867, "global_step": 4694, "epoch": 27} {"train_loss": -4.954805850982666, "global_step": 4695, "epoch": 27} {"train_loss": -5.058660984039307, "global_step": 4696, "epoch": 27} {"train_loss": -4.769827842712402, "global_step": 4697, "epoch": 27} {"train_loss": -5.082602500915527, "global_step": 4698, "epoch": 27} {"train_loss": -5.096148490905762, "global_step": 4699, "epoch": 27} {"train_loss": -5.1262125968933105, "global_step": 4700, "epoch": 27} {"train_loss": -4.708130836486816, "global_step": 4701, "epoch": 27} {"train_loss": -4.9632415771484375, "global_step": 4702, "epoch": 27} {"train_loss": -4.877645092351096, "global_step": 4703, "epoch": 27, "val_loss": 269322.53125} {"train_loss": -4.889632225036621, "global_step": 4704, "epoch": 28} {"train_loss": -4.750035762786865, "global_step": 4705, "epoch": 28} {"train_loss": -4.944921493530273, "global_step": 4706, "epoch": 28} {"train_loss": -4.935234546661377, "global_step": 4707, "epoch": 28} {"train_loss": -4.970885276794434, "global_step": 4708, "epoch": 28} {"train_loss": -5.062196731567383, "global_step": 4709, "epoch": 28} {"train_loss": -4.79996395111084, "global_step": 4710, "epoch": 28} {"train_loss": -5.042224407196045, "global_step": 4711, "epoch": 28} {"train_loss": -5.051802158355713, "global_step": 4712, "epoch": 28} {"train_loss": -4.855856418609619, "global_step": 4713, "epoch": 28} {"train_loss": -5.145308971405029, "global_step": 4714, "epoch": 28} {"train_loss": -5.024750709533691, "global_step": 4715, "epoch": 28} {"train_loss": -4.759243011474609, "global_step": 4716, "epoch": 28} {"train_loss": -4.9305243492126465, "global_step": 4717, "epoch": 28} {"train_loss": -5.196297645568848, "global_step": 4718, "epoch": 28} {"train_loss": -4.704307556152344, "global_step": 4719, "epoch": 28} {"train_loss": -4.867403507232666, "global_step": 4720, "epoch": 28} {"train_loss": -5.126975059509277, "global_step": 4721, "epoch": 28} {"train_loss": -4.814509391784668, "global_step": 4722, "epoch": 28} {"train_loss": -4.664772033691406, "global_step": 4723, "epoch": 28} {"train_loss": -4.899058818817139, "global_step": 4724, "epoch": 28} {"train_loss": -4.991665363311768, "global_step": 4725, "epoch": 28} {"train_loss": -4.827510833740234, "global_step": 4726, "epoch": 28} {"train_loss": -5.0030670166015625, "global_step": 4727, "epoch": 28} {"train_loss": -4.767159461975098, "global_step": 4728, "epoch": 28} {"train_loss": -4.853113174438477, "global_step": 4729, "epoch": 28} {"train_loss": -4.682858467102051, "global_step": 4730, "epoch": 28} {"train_loss": -4.960474491119385, "global_step": 4731, "epoch": 28} {"train_loss": -5.072576522827148, "global_step": 4732, "epoch": 28} {"train_loss": -4.871004104614258, "global_step": 4733, "epoch": 28} {"train_loss": -4.884137153625488, "global_step": 4734, "epoch": 28} {"train_loss": -4.90782356262207, "global_step": 4735, "epoch": 28} {"train_loss": -4.984475135803223, "global_step": 4736, "epoch": 28} {"train_loss": -4.92854118347168, "global_step": 4737, "epoch": 28} {"train_loss": -4.938352584838867, "global_step": 4738, "epoch": 28} {"train_loss": -4.9251484870910645, "global_step": 4739, "epoch": 28} {"train_loss": -4.990902900695801, "global_step": 4740, "epoch": 28} {"train_loss": -5.170367240905762, "global_step": 4741, "epoch": 28} {"train_loss": -5.248723983764648, "global_step": 4742, "epoch": 28} {"train_loss": -4.9062910079956055, "global_step": 4743, "epoch": 28} {"train_loss": -4.940803527832031, "global_step": 4744, "epoch": 28} {"train_loss": -4.996401786804199, "global_step": 4745, "epoch": 28} {"train_loss": -4.793446063995361, "global_step": 4746, "epoch": 28} {"train_loss": -5.003314018249512, "global_step": 4747, "epoch": 28} {"train_loss": -5.088271141052246, "global_step": 4748, "epoch": 28} {"train_loss": -4.986623287200928, "global_step": 4749, "epoch": 28} {"train_loss": -4.726609230041504, "global_step": 4750, "epoch": 28} {"train_loss": -4.918273448944092, "global_step": 4751, "epoch": 28} {"train_loss": -4.629768371582031, "global_step": 4752, "epoch": 28} {"train_loss": -4.9138288497924805, "global_step": 4753, "epoch": 28} {"train_loss": -4.926138877868652, "global_step": 4754, "epoch": 28} {"train_loss": -4.580894470214844, "global_step": 4755, "epoch": 28} {"train_loss": -4.983972072601318, "global_step": 4756, "epoch": 28} {"train_loss": -4.955321311950684, "global_step": 4757, "epoch": 28} {"train_loss": -4.957988262176514, "global_step": 4758, "epoch": 28} {"train_loss": -4.919342994689941, "global_step": 4759, "epoch": 28} {"train_loss": -4.863864898681641, "global_step": 4760, "epoch": 28} {"train_loss": -4.927041053771973, "global_step": 4761, "epoch": 28} {"train_loss": -5.1402740478515625, "global_step": 4762, "epoch": 28} {"train_loss": -4.723928928375244, "global_step": 4763, "epoch": 28} {"train_loss": -5.049063682556152, "global_step": 4764, "epoch": 28} {"train_loss": -5.079590320587158, "global_step": 4765, "epoch": 28} {"train_loss": -5.007245063781738, "global_step": 4766, "epoch": 28} {"train_loss": -5.213451862335205, "global_step": 4767, "epoch": 28} {"train_loss": -4.918759346008301, "global_step": 4768, "epoch": 28} {"train_loss": -5.344183444976807, "global_step": 4769, "epoch": 28} {"train_loss": -5.267058372497559, "global_step": 4770, "epoch": 28} {"train_loss": -4.943063735961914, "global_step": 4771, "epoch": 28} {"train_loss": -4.797849178314209, "global_step": 4772, "epoch": 28} {"train_loss": -4.361135482788086, "global_step": 4773, "epoch": 28} {"train_loss": -5.0339508056640625, "global_step": 4774, "epoch": 28} {"train_loss": -4.974697113037109, "global_step": 4775, "epoch": 28} {"train_loss": -5.020052909851074, "global_step": 4776, "epoch": 28} {"train_loss": -4.451803684234619, "global_step": 4777, "epoch": 28} {"train_loss": -4.890013217926025, "global_step": 4778, "epoch": 28} {"train_loss": -4.865610122680664, "global_step": 4779, "epoch": 28} {"train_loss": -4.9337310791015625, "global_step": 4780, "epoch": 28} {"train_loss": -4.928771018981934, "global_step": 4781, "epoch": 28} {"train_loss": -4.952078819274902, "global_step": 4782, "epoch": 28} {"train_loss": -5.028697967529297, "global_step": 4783, "epoch": 28} {"train_loss": -4.92310905456543, "global_step": 4784, "epoch": 28} {"train_loss": -5.047621726989746, "global_step": 4785, "epoch": 28} {"train_loss": -4.962282180786133, "global_step": 4786, "epoch": 28} {"train_loss": -4.823535919189453, "global_step": 4787, "epoch": 28} {"train_loss": -4.579988479614258, "global_step": 4788, "epoch": 28} {"train_loss": -4.9442362785339355, "global_step": 4789, "epoch": 28} {"train_loss": -5.044593334197998, "global_step": 4790, "epoch": 28} {"train_loss": -4.947745323181152, "global_step": 4791, "epoch": 28} {"train_loss": -4.953629970550537, "global_step": 4792, "epoch": 28} {"train_loss": -4.843889236450195, "global_step": 4793, "epoch": 28} {"train_loss": -4.961136817932129, "global_step": 4794, "epoch": 28} {"train_loss": -4.926379680633545, "global_step": 4795, "epoch": 28} {"train_loss": -4.820847511291504, "global_step": 4796, "epoch": 28} {"train_loss": -4.9506940841674805, "global_step": 4797, "epoch": 28} {"train_loss": -4.999245643615723, "global_step": 4798, "epoch": 28} {"train_loss": -5.083844184875488, "global_step": 4799, "epoch": 28} {"train_loss": -4.881192207336426, "global_step": 4800, "epoch": 28} {"train_loss": -5.033608436584473, "global_step": 4801, "epoch": 28} {"train_loss": -5.254372596740723, "global_step": 4802, "epoch": 28} {"train_loss": -5.04440975189209, "global_step": 4803, "epoch": 28} {"train_loss": -4.839481830596924, "global_step": 4804, "epoch": 28} {"train_loss": -4.800440788269043, "global_step": 4805, "epoch": 28} {"train_loss": -5.070369243621826, "global_step": 4806, "epoch": 28} {"train_loss": -4.886147499084473, "global_step": 4807, "epoch": 28} {"train_loss": -5.000162124633789, "global_step": 4808, "epoch": 28} {"train_loss": -5.176653861999512, "global_step": 4809, "epoch": 28} {"train_loss": -5.1241607666015625, "global_step": 4810, "epoch": 28} {"train_loss": -4.953749656677246, "global_step": 4811, "epoch": 28} {"train_loss": -4.834883213043213, "global_step": 4812, "epoch": 28} {"train_loss": -4.839996814727783, "global_step": 4813, "epoch": 28} {"train_loss": -5.234189987182617, "global_step": 4814, "epoch": 28} {"train_loss": -5.100761890411377, "global_step": 4815, "epoch": 28} {"train_loss": -4.9894256591796875, "global_step": 4816, "epoch": 28} {"train_loss": -4.893843650817871, "global_step": 4817, "epoch": 28} {"train_loss": -5.229974746704102, "global_step": 4818, "epoch": 28} {"train_loss": -4.875495910644531, "global_step": 4819, "epoch": 28} {"train_loss": -5.203113079071045, "global_step": 4820, "epoch": 28} {"train_loss": -4.641223907470703, "global_step": 4821, "epoch": 28} {"train_loss": -4.956300735473633, "global_step": 4822, "epoch": 28} {"train_loss": -5.062601089477539, "global_step": 4823, "epoch": 28} {"train_loss": -4.980656623840332, "global_step": 4824, "epoch": 28} {"train_loss": -5.072876930236816, "global_step": 4825, "epoch": 28} {"train_loss": -4.745702266693115, "global_step": 4826, "epoch": 28} {"train_loss": -5.016669273376465, "global_step": 4827, "epoch": 28} {"train_loss": -5.165496826171875, "global_step": 4828, "epoch": 28} {"train_loss": -5.105763912200928, "global_step": 4829, "epoch": 28} {"train_loss": -4.962418079376221, "global_step": 4830, "epoch": 28} {"train_loss": -5.039688587188721, "global_step": 4831, "epoch": 28} {"train_loss": -4.9545745849609375, "global_step": 4832, "epoch": 28} {"train_loss": -4.762595176696777, "global_step": 4833, "epoch": 28} {"train_loss": -4.636445045471191, "global_step": 4834, "epoch": 28} {"train_loss": -4.800801753997803, "global_step": 4835, "epoch": 28} {"train_loss": -4.880494117736816, "global_step": 4836, "epoch": 28} {"train_loss": -4.881902694702148, "global_step": 4837, "epoch": 28} {"train_loss": -4.767077445983887, "global_step": 4838, "epoch": 28} {"train_loss": -4.661882400512695, "global_step": 4839, "epoch": 28} {"train_loss": -4.79123067855835, "global_step": 4840, "epoch": 28} {"train_loss": -4.970274448394775, "global_step": 4841, "epoch": 28} {"train_loss": -4.883903503417969, "global_step": 4842, "epoch": 28} {"train_loss": -4.665403366088867, "global_step": 4843, "epoch": 28} {"train_loss": -4.965630531311035, "global_step": 4844, "epoch": 28} {"train_loss": -4.904300689697266, "global_step": 4845, "epoch": 28} {"train_loss": -4.579058647155762, "global_step": 4846, "epoch": 28} {"train_loss": -4.875529766082764, "global_step": 4847, "epoch": 28} {"train_loss": -4.863271236419678, "global_step": 4848, "epoch": 28} {"train_loss": -4.86659049987793, "global_step": 4849, "epoch": 28} {"train_loss": -5.177923202514648, "global_step": 4850, "epoch": 28} {"train_loss": -5.057162761688232, "global_step": 4851, "epoch": 28} {"train_loss": -4.819534778594971, "global_step": 4852, "epoch": 28} {"train_loss": -5.224184036254883, "global_step": 4853, "epoch": 28} {"train_loss": -4.976836204528809, "global_step": 4854, "epoch": 28} {"train_loss": -4.759868144989014, "global_step": 4855, "epoch": 28} {"train_loss": -4.961799621582031, "global_step": 4856, "epoch": 28} {"train_loss": -5.015233993530273, "global_step": 4857, "epoch": 28} {"train_loss": -5.231534004211426, "global_step": 4858, "epoch": 28} {"train_loss": -4.920851707458496, "global_step": 4859, "epoch": 28} {"train_loss": -4.932389259338379, "global_step": 4860, "epoch": 28} {"train_loss": -4.858407974243164, "global_step": 4861, "epoch": 28} {"train_loss": -4.631293296813965, "global_step": 4862, "epoch": 28} {"train_loss": -4.942560195922852, "global_step": 4863, "epoch": 28} {"train_loss": -4.740987300872803, "global_step": 4864, "epoch": 28} {"train_loss": -5.2612104415893555, "global_step": 4865, "epoch": 28} {"train_loss": -5.139766693115234, "global_step": 4866, "epoch": 28} {"train_loss": -4.978781223297119, "global_step": 4867, "epoch": 28} {"train_loss": -5.045781135559082, "global_step": 4868, "epoch": 28} {"train_loss": -5.052372932434082, "global_step": 4869, "epoch": 28} {"train_loss": -5.202115058898926, "global_step": 4870, "epoch": 28} {"train_loss": -4.941855609416962, "global_step": 4871, "epoch": 28, "val_loss": 283859.0} {"train_loss": -4.690382957458496, "global_step": 4872, "epoch": 29} {"train_loss": -5.080153465270996, "global_step": 4873, "epoch": 29} {"train_loss": -5.097672462463379, "global_step": 4874, "epoch": 29} {"train_loss": -5.0121588706970215, "global_step": 4875, "epoch": 29} {"train_loss": -4.9964470863342285, "global_step": 4876, "epoch": 29} {"train_loss": -4.895195007324219, "global_step": 4877, "epoch": 29} {"train_loss": -4.802158832550049, "global_step": 4878, "epoch": 29} {"train_loss": -5.099356651306152, "global_step": 4879, "epoch": 29} {"train_loss": -4.90875244140625, "global_step": 4880, "epoch": 29} {"train_loss": -4.881017684936523, "global_step": 4881, "epoch": 29} {"train_loss": -4.888154983520508, "global_step": 4882, "epoch": 29} {"train_loss": -4.905381679534912, "global_step": 4883, "epoch": 29} {"train_loss": -4.934223175048828, "global_step": 4884, "epoch": 29} {"train_loss": -5.128260135650635, "global_step": 4885, "epoch": 29} {"train_loss": -4.876441955566406, "global_step": 4886, "epoch": 29} {"train_loss": -4.948146343231201, "global_step": 4887, "epoch": 29} {"train_loss": -5.107519149780273, "global_step": 4888, "epoch": 29} {"train_loss": -4.8387651443481445, "global_step": 4889, "epoch": 29} {"train_loss": -5.016238689422607, "global_step": 4890, "epoch": 29} {"train_loss": -4.823882579803467, "global_step": 4891, "epoch": 29} {"train_loss": -5.159519672393799, "global_step": 4892, "epoch": 29} {"train_loss": -4.651960372924805, "global_step": 4893, "epoch": 29} {"train_loss": -4.881162643432617, "global_step": 4894, "epoch": 29} {"train_loss": -4.70064640045166, "global_step": 4895, "epoch": 29} {"train_loss": -4.749574661254883, "global_step": 4896, "epoch": 29} {"train_loss": -4.854924201965332, "global_step": 4897, "epoch": 29} {"train_loss": -4.996801376342773, "global_step": 4898, "epoch": 29} {"train_loss": -4.853930950164795, "global_step": 4899, "epoch": 29} {"train_loss": -4.7624921798706055, "global_step": 4900, "epoch": 29} {"train_loss": -4.8627824783325195, "global_step": 4901, "epoch": 29} {"train_loss": -4.99962043762207, "global_step": 4902, "epoch": 29} {"train_loss": -4.788318634033203, "global_step": 4903, "epoch": 29} {"train_loss": -4.740091323852539, "global_step": 4904, "epoch": 29} {"train_loss": -4.626914978027344, "global_step": 4905, "epoch": 29} {"train_loss": -5.079822063446045, "global_step": 4906, "epoch": 29} {"train_loss": -4.697055816650391, "global_step": 4907, "epoch": 29} {"train_loss": -4.952998161315918, "global_step": 4908, "epoch": 29} {"train_loss": -5.024123191833496, "global_step": 4909, "epoch": 29} {"train_loss": -5.175745964050293, "global_step": 4910, "epoch": 29} {"train_loss": -5.040935039520264, "global_step": 4911, "epoch": 29} {"train_loss": -5.095755577087402, "global_step": 4912, "epoch": 29} {"train_loss": -4.675479412078857, "global_step": 4913, "epoch": 29} {"train_loss": -4.936044692993164, "global_step": 4914, "epoch": 29} {"train_loss": -4.909732818603516, "global_step": 4915, "epoch": 29} {"train_loss": -4.881946086883545, "global_step": 4916, "epoch": 29} {"train_loss": -4.6758856773376465, "global_step": 4917, "epoch": 29} {"train_loss": -4.850415229797363, "global_step": 4918, "epoch": 29} {"train_loss": -4.905162334442139, "global_step": 4919, "epoch": 29} {"train_loss": -5.085230827331543, "global_step": 4920, "epoch": 29} {"train_loss": -4.943526744842529, "global_step": 4921, "epoch": 29} {"train_loss": -5.015583038330078, "global_step": 4922, "epoch": 29} {"train_loss": -5.124965190887451, "global_step": 4923, "epoch": 29} {"train_loss": -5.063161373138428, "global_step": 4924, "epoch": 29} {"train_loss": -4.872211933135986, "global_step": 4925, "epoch": 29} {"train_loss": -4.879585266113281, "global_step": 4926, "epoch": 29} {"train_loss": -4.986729145050049, "global_step": 4927, "epoch": 29} {"train_loss": -4.852643966674805, "global_step": 4928, "epoch": 29} {"train_loss": -4.979269027709961, "global_step": 4929, "epoch": 29} {"train_loss": -4.8607587814331055, "global_step": 4930, "epoch": 29} {"train_loss": -5.170605659484863, "global_step": 4931, "epoch": 29} {"train_loss": -5.130982398986816, "global_step": 4932, "epoch": 29} {"train_loss": -5.082104682922363, "global_step": 4933, "epoch": 29} {"train_loss": -4.864373683929443, "global_step": 4934, "epoch": 29} {"train_loss": -5.080671310424805, "global_step": 4935, "epoch": 29} {"train_loss": -4.604260444641113, "global_step": 4936, "epoch": 29} {"train_loss": -5.227786064147949, "global_step": 4937, "epoch": 29} {"train_loss": -4.637895107269287, "global_step": 4938, "epoch": 29} {"train_loss": -4.76075553894043, "global_step": 4939, "epoch": 29} {"train_loss": -4.719386100769043, "global_step": 4940, "epoch": 29} {"train_loss": -4.999658584594727, "global_step": 4941, "epoch": 29} {"train_loss": -4.658629417419434, "global_step": 4942, "epoch": 29} {"train_loss": -4.987616539001465, "global_step": 4943, "epoch": 29} {"train_loss": -4.698418617248535, "global_step": 4944, "epoch": 29} {"train_loss": -4.966640949249268, "global_step": 4945, "epoch": 29} {"train_loss": -4.788285255432129, "global_step": 4946, "epoch": 29} {"train_loss": -4.68367338180542, "global_step": 4947, "epoch": 29} {"train_loss": -4.727390289306641, "global_step": 4948, "epoch": 29} {"train_loss": -4.9210100173950195, "global_step": 4949, "epoch": 29} {"train_loss": -4.7463908195495605, "global_step": 4950, "epoch": 29} {"train_loss": -4.7824320793151855, "global_step": 4951, "epoch": 29} {"train_loss": -4.827327251434326, "global_step": 4952, "epoch": 29} {"train_loss": -5.0041608810424805, "global_step": 4953, "epoch": 29} {"train_loss": -4.5251970291137695, "global_step": 4954, "epoch": 29} {"train_loss": -4.844387054443359, "global_step": 4955, "epoch": 29} {"train_loss": -4.760998725891113, "global_step": 4956, "epoch": 29} {"train_loss": -4.849902153015137, "global_step": 4957, "epoch": 29} {"train_loss": -4.66408634185791, "global_step": 4958, "epoch": 29} {"train_loss": -4.708205699920654, "global_step": 4959, "epoch": 29} {"train_loss": -4.951267242431641, "global_step": 4960, "epoch": 29} {"train_loss": -4.967759132385254, "global_step": 4961, "epoch": 29} {"train_loss": -4.908481597900391, "global_step": 4962, "epoch": 29} {"train_loss": -5.100759983062744, "global_step": 4963, "epoch": 29} {"train_loss": -4.8271989822387695, "global_step": 4964, "epoch": 29} {"train_loss": -4.8646240234375, "global_step": 4965, "epoch": 29} {"train_loss": -4.760393142700195, "global_step": 4966, "epoch": 29} {"train_loss": -4.958041191101074, "global_step": 4967, "epoch": 29} {"train_loss": -5.034902095794678, "global_step": 4968, "epoch": 29} {"train_loss": -5.152629375457764, "global_step": 4969, "epoch": 29} {"train_loss": -5.215619087219238, "global_step": 4970, "epoch": 29} {"train_loss": -4.899890422821045, "global_step": 4971, "epoch": 29} {"train_loss": -4.704805374145508, "global_step": 4972, "epoch": 29} {"train_loss": -4.997776508331299, "global_step": 4973, "epoch": 29} {"train_loss": -4.99403715133667, "global_step": 4974, "epoch": 29} {"train_loss": -4.819167137145996, "global_step": 4975, "epoch": 29} {"train_loss": -5.082302093505859, "global_step": 4976, "epoch": 29} {"train_loss": -4.882360935211182, "global_step": 4977, "epoch": 29} {"train_loss": -4.968391418457031, "global_step": 4978, "epoch": 29} {"train_loss": -5.286916255950928, "global_step": 4979, "epoch": 29} {"train_loss": -4.882140159606934, "global_step": 4980, "epoch": 29} {"train_loss": -4.807613372802734, "global_step": 4981, "epoch": 29} {"train_loss": -5.066262245178223, "global_step": 4982, "epoch": 29} {"train_loss": -4.909793853759766, "global_step": 4983, "epoch": 29} {"train_loss": -5.1440749168396, "global_step": 4984, "epoch": 29} {"train_loss": -4.864844799041748, "global_step": 4985, "epoch": 29} {"train_loss": -5.338983535766602, "global_step": 4986, "epoch": 29} {"train_loss": -4.9358439445495605, "global_step": 4987, "epoch": 29} {"train_loss": -5.163861274719238, "global_step": 4988, "epoch": 29} {"train_loss": -4.678548812866211, "global_step": 4989, "epoch": 29} {"train_loss": -5.208438396453857, "global_step": 4990, "epoch": 29} {"train_loss": -4.891573905944824, "global_step": 4991, "epoch": 29} {"train_loss": -4.994077682495117, "global_step": 4992, "epoch": 29} {"train_loss": -4.96051025390625, "global_step": 4993, "epoch": 29} {"train_loss": -4.843464374542236, "global_step": 4994, "epoch": 29} {"train_loss": -5.108996391296387, "global_step": 4995, "epoch": 29} {"train_loss": -4.789752960205078, "global_step": 4996, "epoch": 29} {"train_loss": -4.93026876449585, "global_step": 4997, "epoch": 29} {"train_loss": -5.0788445472717285, "global_step": 4998, "epoch": 29} {"train_loss": -4.943232536315918, "global_step": 4999, "epoch": 29} {"train_loss": -4.8785223960876465, "global_step": 5000, "epoch": 29} {"train_loss": -5.087566375732422, "global_step": 5001, "epoch": 29} {"train_loss": -5.1667399406433105, "global_step": 5002, "epoch": 29} {"train_loss": -5.078979015350342, "global_step": 5003, "epoch": 29} {"train_loss": -4.895138740539551, "global_step": 5004, "epoch": 29} {"train_loss": -5.027645111083984, "global_step": 5005, "epoch": 29} {"train_loss": -5.0061445236206055, "global_step": 5006, "epoch": 29} {"train_loss": -5.01053524017334, "global_step": 5007, "epoch": 29} {"train_loss": -5.103074073791504, "global_step": 5008, "epoch": 29} {"train_loss": -5.052574157714844, "global_step": 5009, "epoch": 29} {"train_loss": -4.769584655761719, "global_step": 5010, "epoch": 29} {"train_loss": -5.02396297454834, "global_step": 5011, "epoch": 29} {"train_loss": -5.212606430053711, "global_step": 5012, "epoch": 29} {"train_loss": -5.035580635070801, "global_step": 5013, "epoch": 29} {"train_loss": -5.187526226043701, "global_step": 5014, "epoch": 29} {"train_loss": -5.129452705383301, "global_step": 5015, "epoch": 29} {"train_loss": -5.136476039886475, "global_step": 5016, "epoch": 29} {"train_loss": -5.106734752655029, "global_step": 5017, "epoch": 29} {"train_loss": -5.305422306060791, "global_step": 5018, "epoch": 29} {"train_loss": -5.009105205535889, "global_step": 5019, "epoch": 29} {"train_loss": -5.009189605712891, "global_step": 5020, "epoch": 29} {"train_loss": -5.167667388916016, "global_step": 5021, "epoch": 29} {"train_loss": -5.015472412109375, "global_step": 5022, "epoch": 29} {"train_loss": -5.033837795257568, "global_step": 5023, "epoch": 29} {"train_loss": -4.9703874588012695, "global_step": 5024, "epoch": 29} {"train_loss": -4.974837303161621, "global_step": 5025, "epoch": 29} {"train_loss": -5.059080123901367, "global_step": 5026, "epoch": 29} {"train_loss": -5.04160737991333, "global_step": 5027, "epoch": 29} {"train_loss": -5.104848861694336, "global_step": 5028, "epoch": 29} {"train_loss": -5.245894908905029, "global_step": 5029, "epoch": 29} {"train_loss": -5.246233940124512, "global_step": 5030, "epoch": 29} {"train_loss": -4.936042785644531, "global_step": 5031, "epoch": 29} {"train_loss": -4.7898359298706055, "global_step": 5032, "epoch": 29} {"train_loss": -4.847049713134766, "global_step": 5033, "epoch": 29} {"train_loss": -4.762349605560303, "global_step": 5034, "epoch": 29} {"train_loss": -4.579279899597168, "global_step": 5035, "epoch": 29} {"train_loss": -4.960186004638672, "global_step": 5036, "epoch": 29} {"train_loss": -4.688745498657227, "global_step": 5037, "epoch": 29} {"train_loss": -4.706982135772705, "global_step": 5038, "epoch": 29} {"train_loss": -4.939312968935285, "global_step": 5039, "epoch": 29, "val_loss": 271866.625} {"train_loss": -4.864267826080322, "global_step": 5040, "epoch": 30} {"train_loss": -4.596112251281738, "global_step": 5041, "epoch": 30} {"train_loss": -4.795721054077148, "global_step": 5042, "epoch": 30} {"train_loss": -4.7687883377075195, "global_step": 5043, "epoch": 30} {"train_loss": -4.836214542388916, "global_step": 5044, "epoch": 30} {"train_loss": -4.7756147384643555, "global_step": 5045, "epoch": 30} {"train_loss": -4.805769920349121, "global_step": 5046, "epoch": 30} {"train_loss": -5.200794219970703, "global_step": 5047, "epoch": 30} {"train_loss": -4.89000129699707, "global_step": 5048, "epoch": 30} {"train_loss": -5.159873962402344, "global_step": 5049, "epoch": 30} {"train_loss": -5.039872169494629, "global_step": 5050, "epoch": 30} {"train_loss": -4.8738813400268555, "global_step": 5051, "epoch": 30} {"train_loss": -4.977439880371094, "global_step": 5052, "epoch": 30} {"train_loss": -4.942877769470215, "global_step": 5053, "epoch": 30} {"train_loss": -4.968184471130371, "global_step": 5054, "epoch": 30} {"train_loss": -4.929721832275391, "global_step": 5055, "epoch": 30} {"train_loss": -5.212833404541016, "global_step": 5056, "epoch": 30} {"train_loss": -5.180217266082764, "global_step": 5057, "epoch": 30} {"train_loss": -4.653219223022461, "global_step": 5058, "epoch": 30} {"train_loss": -5.053459167480469, "global_step": 5059, "epoch": 30} {"train_loss": -5.100607872009277, "global_step": 5060, "epoch": 30} {"train_loss": -4.979177474975586, "global_step": 5061, "epoch": 30} {"train_loss": -4.959261894226074, "global_step": 5062, "epoch": 30} {"train_loss": -5.051051139831543, "global_step": 5063, "epoch": 30} {"train_loss": -5.248476028442383, "global_step": 5064, "epoch": 30} {"train_loss": -4.863306045532227, "global_step": 5065, "epoch": 30} {"train_loss": -4.985134124755859, "global_step": 5066, "epoch": 30} {"train_loss": -5.10805082321167, "global_step": 5067, "epoch": 30} {"train_loss": -5.108570098876953, "global_step": 5068, "epoch": 30} {"train_loss": -5.141674518585205, "global_step": 5069, "epoch": 30} {"train_loss": -4.871520042419434, "global_step": 5070, "epoch": 30} {"train_loss": -5.341644287109375, "global_step": 5071, "epoch": 30} {"train_loss": -5.155158042907715, "global_step": 5072, "epoch": 30} {"train_loss": -5.009818077087402, "global_step": 5073, "epoch": 30} {"train_loss": -4.977155685424805, "global_step": 5074, "epoch": 30} {"train_loss": -4.973568916320801, "global_step": 5075, "epoch": 30} {"train_loss": -5.241877555847168, "global_step": 5076, "epoch": 30} {"train_loss": -5.008533000946045, "global_step": 5077, "epoch": 30} {"train_loss": -5.1382246017456055, "global_step": 5078, "epoch": 30} {"train_loss": -5.059754848480225, "global_step": 5079, "epoch": 30} {"train_loss": -5.040574550628662, "global_step": 5080, "epoch": 30} {"train_loss": -4.760494232177734, "global_step": 5081, "epoch": 30} {"train_loss": -5.211070537567139, "global_step": 5082, "epoch": 30} {"train_loss": -5.298705101013184, "global_step": 5083, "epoch": 30} {"train_loss": -5.103693008422852, "global_step": 5084, "epoch": 30} {"train_loss": -4.997786521911621, "global_step": 5085, "epoch": 30} {"train_loss": -5.129354476928711, "global_step": 5086, "epoch": 30} {"train_loss": -5.372576713562012, "global_step": 5087, "epoch": 30} {"train_loss": -4.992589950561523, "global_step": 5088, "epoch": 30} {"train_loss": -4.869548797607422, "global_step": 5089, "epoch": 30} {"train_loss": -5.155875205993652, "global_step": 5090, "epoch": 30} {"train_loss": -4.641229152679443, "global_step": 5091, "epoch": 30} {"train_loss": -5.081752777099609, "global_step": 5092, "epoch": 30} {"train_loss": -4.932137489318848, "global_step": 5093, "epoch": 30} {"train_loss": -5.099590301513672, "global_step": 5094, "epoch": 30} {"train_loss": -4.700188159942627, "global_step": 5095, "epoch": 30} {"train_loss": -5.1040778160095215, "global_step": 5096, "epoch": 30} {"train_loss": -5.125211238861084, "global_step": 5097, "epoch": 30} {"train_loss": -5.264074325561523, "global_step": 5098, "epoch": 30} {"train_loss": -4.883857727050781, "global_step": 5099, "epoch": 30} {"train_loss": -4.864969730377197, "global_step": 5100, "epoch": 30} {"train_loss": -4.803558826446533, "global_step": 5101, "epoch": 30} {"train_loss": -4.918207168579102, "global_step": 5102, "epoch": 30} {"train_loss": -4.937737941741943, "global_step": 5103, "epoch": 30} {"train_loss": -4.777602195739746, "global_step": 5104, "epoch": 30} {"train_loss": -5.030680179595947, "global_step": 5105, "epoch": 30} {"train_loss": -5.253025054931641, "global_step": 5106, "epoch": 30} {"train_loss": -5.114420413970947, "global_step": 5107, "epoch": 30} {"train_loss": -5.2227678298950195, "global_step": 5108, "epoch": 30} {"train_loss": -4.851459503173828, "global_step": 5109, "epoch": 30} {"train_loss": -4.889603614807129, "global_step": 5110, "epoch": 30} {"train_loss": -4.907355308532715, "global_step": 5111, "epoch": 30} {"train_loss": -5.1198954582214355, "global_step": 5112, "epoch": 30} {"train_loss": -4.960104942321777, "global_step": 5113, "epoch": 30} {"train_loss": -5.260350227355957, "global_step": 5114, "epoch": 30} {"train_loss": -4.98549222946167, "global_step": 5115, "epoch": 30} {"train_loss": -4.852349281311035, "global_step": 5116, "epoch": 30} {"train_loss": -4.918955326080322, "global_step": 5117, "epoch": 30} {"train_loss": -4.869993209838867, "global_step": 5118, "epoch": 30} {"train_loss": -5.173917770385742, "global_step": 5119, "epoch": 30} {"train_loss": -4.726900100708008, "global_step": 5120, "epoch": 30} {"train_loss": -5.1165313720703125, "global_step": 5121, "epoch": 30} {"train_loss": -4.713376045227051, "global_step": 5122, "epoch": 30} {"train_loss": -5.007015228271484, "global_step": 5123, "epoch": 30} {"train_loss": -4.975678443908691, "global_step": 5124, "epoch": 30} {"train_loss": -4.869815826416016, "global_step": 5125, "epoch": 30} {"train_loss": -5.0514678955078125, "global_step": 5126, "epoch": 30} {"train_loss": -4.906278610229492, "global_step": 5127, "epoch": 30} {"train_loss": -5.0103888511657715, "global_step": 5128, "epoch": 30} {"train_loss": -4.759365081787109, "global_step": 5129, "epoch": 30} {"train_loss": -4.688311576843262, "global_step": 5130, "epoch": 30} {"train_loss": -5.241125106811523, "global_step": 5131, "epoch": 30} {"train_loss": -4.731509208679199, "global_step": 5132, "epoch": 30} {"train_loss": -5.015073299407959, "global_step": 5133, "epoch": 30} {"train_loss": -4.898755073547363, "global_step": 5134, "epoch": 30} {"train_loss": -4.520557403564453, "global_step": 5135, "epoch": 30} {"train_loss": -5.007539749145508, "global_step": 5136, "epoch": 30} {"train_loss": -4.248512268066406, "global_step": 5137, "epoch": 30} {"train_loss": -4.763436317443848, "global_step": 5138, "epoch": 30} {"train_loss": -5.014674186706543, "global_step": 5139, "epoch": 30} {"train_loss": -4.531902313232422, "global_step": 5140, "epoch": 30} {"train_loss": -4.527693748474121, "global_step": 5141, "epoch": 30} {"train_loss": -4.84096622467041, "global_step": 5142, "epoch": 30} {"train_loss": -4.783759117126465, "global_step": 5143, "epoch": 30} {"train_loss": -4.870612144470215, "global_step": 5144, "epoch": 30} {"train_loss": -4.770522117614746, "global_step": 5145, "epoch": 30} {"train_loss": -4.831541061401367, "global_step": 5146, "epoch": 30} {"train_loss": -5.015480995178223, "global_step": 5147, "epoch": 30} {"train_loss": -5.170334815979004, "global_step": 5148, "epoch": 30} {"train_loss": -4.823675155639648, "global_step": 5149, "epoch": 30} {"train_loss": -4.772136688232422, "global_step": 5150, "epoch": 30} {"train_loss": -5.07893705368042, "global_step": 5151, "epoch": 30} {"train_loss": -4.736547470092773, "global_step": 5152, "epoch": 30} {"train_loss": -5.105239391326904, "global_step": 5153, "epoch": 30} {"train_loss": -5.104807376861572, "global_step": 5154, "epoch": 30} {"train_loss": -4.746378421783447, "global_step": 5155, "epoch": 30} {"train_loss": -4.823612213134766, "global_step": 5156, "epoch": 30} {"train_loss": -5.219225883483887, "global_step": 5157, "epoch": 30} {"train_loss": -4.818070888519287, "global_step": 5158, "epoch": 30} {"train_loss": -5.186526298522949, "global_step": 5159, "epoch": 30} {"train_loss": -4.6254754066467285, "global_step": 5160, "epoch": 30} {"train_loss": -5.159811019897461, "global_step": 5161, "epoch": 30} {"train_loss": -4.898781776428223, "global_step": 5162, "epoch": 30} {"train_loss": -5.085474014282227, "global_step": 5163, "epoch": 30} {"train_loss": -4.6986083984375, "global_step": 5164, "epoch": 30} {"train_loss": -5.050371170043945, "global_step": 5165, "epoch": 30} {"train_loss": -5.040197372436523, "global_step": 5166, "epoch": 30} {"train_loss": -5.005162239074707, "global_step": 5167, "epoch": 30} {"train_loss": -5.073071479797363, "global_step": 5168, "epoch": 30} {"train_loss": -4.879411697387695, "global_step": 5169, "epoch": 30} {"train_loss": -5.025641441345215, "global_step": 5170, "epoch": 30} {"train_loss": -4.853549957275391, "global_step": 5171, "epoch": 30} {"train_loss": -5.030609607696533, "global_step": 5172, "epoch": 30} {"train_loss": -5.087399959564209, "global_step": 5173, "epoch": 30} {"train_loss": -4.888638496398926, "global_step": 5174, "epoch": 30} {"train_loss": -5.286717414855957, "global_step": 5175, "epoch": 30} {"train_loss": -4.982827186584473, "global_step": 5176, "epoch": 30} {"train_loss": -4.9228410720825195, "global_step": 5177, "epoch": 30} {"train_loss": -5.10862922668457, "global_step": 5178, "epoch": 30} {"train_loss": -5.1815619468688965, "global_step": 5179, "epoch": 30} {"train_loss": -5.260623455047607, "global_step": 5180, "epoch": 30} {"train_loss": -4.9153571128845215, "global_step": 5181, "epoch": 30} {"train_loss": -4.925603866577148, "global_step": 5182, "epoch": 30} {"train_loss": -5.069977760314941, "global_step": 5183, "epoch": 30} {"train_loss": -5.072081565856934, "global_step": 5184, "epoch": 30} {"train_loss": -4.817975997924805, "global_step": 5185, "epoch": 30} {"train_loss": -5.104248046875, "global_step": 5186, "epoch": 30} {"train_loss": -4.714404106140137, "global_step": 5187, "epoch": 30} {"train_loss": -4.920395851135254, "global_step": 5188, "epoch": 30} {"train_loss": -5.1119818687438965, "global_step": 5189, "epoch": 30} {"train_loss": -5.067631721496582, "global_step": 5190, "epoch": 30} {"train_loss": -5.089388370513916, "global_step": 5191, "epoch": 30} {"train_loss": -4.896735191345215, "global_step": 5192, "epoch": 30} {"train_loss": -4.855367183685303, "global_step": 5193, "epoch": 30} {"train_loss": -5.022417068481445, "global_step": 5194, "epoch": 30} {"train_loss": -4.969197750091553, "global_step": 5195, "epoch": 30} {"train_loss": -4.898346424102783, "global_step": 5196, "epoch": 30} {"train_loss": -4.714618682861328, "global_step": 5197, "epoch": 30} {"train_loss": -5.087874889373779, "global_step": 5198, "epoch": 30} {"train_loss": -5.190882682800293, "global_step": 5199, "epoch": 30} {"train_loss": -5.023647308349609, "global_step": 5200, "epoch": 30} {"train_loss": -4.939861297607422, "global_step": 5201, "epoch": 30} {"train_loss": -5.2576985359191895, "global_step": 5202, "epoch": 30} {"train_loss": -4.948512554168701, "global_step": 5203, "epoch": 30} {"train_loss": -5.095331192016602, "global_step": 5204, "epoch": 30} {"train_loss": -5.039825439453125, "global_step": 5205, "epoch": 30} {"train_loss": -5.157337188720703, "global_step": 5206, "epoch": 30} {"train_loss": -4.972941285087948, "global_step": 5207, "epoch": 30, "val_loss": 269777.71875, "train_action_mse_error": 68.4444580078125} {"train_loss": -5.082491874694824, "global_step": 5208, "epoch": 31} {"train_loss": -4.782100677490234, "global_step": 5209, "epoch": 31} {"train_loss": -5.11360502243042, "global_step": 5210, "epoch": 31} {"train_loss": -5.078716278076172, "global_step": 5211, "epoch": 31} {"train_loss": -4.949859619140625, "global_step": 5212, "epoch": 31} {"train_loss": -4.90177059173584, "global_step": 5213, "epoch": 31} {"train_loss": -4.9772233963012695, "global_step": 5214, "epoch": 31} {"train_loss": -5.212111473083496, "global_step": 5215, "epoch": 31} {"train_loss": -4.7178955078125, "global_step": 5216, "epoch": 31} {"train_loss": -4.986946105957031, "global_step": 5217, "epoch": 31} {"train_loss": -4.592686653137207, "global_step": 5218, "epoch": 31} {"train_loss": -4.9122490882873535, "global_step": 5219, "epoch": 31} {"train_loss": -5.012041091918945, "global_step": 5220, "epoch": 31} {"train_loss": -4.862932205200195, "global_step": 5221, "epoch": 31} {"train_loss": -4.931614398956299, "global_step": 5222, "epoch": 31} {"train_loss": -5.006543159484863, "global_step": 5223, "epoch": 31} {"train_loss": -5.299302577972412, "global_step": 5224, "epoch": 31} {"train_loss": -4.861678123474121, "global_step": 5225, "epoch": 31} {"train_loss": -5.1080827713012695, "global_step": 5226, "epoch": 31} {"train_loss": -4.71100378036499, "global_step": 5227, "epoch": 31} {"train_loss": -5.081751823425293, "global_step": 5228, "epoch": 31} {"train_loss": -5.188469886779785, "global_step": 5229, "epoch": 31} {"train_loss": -4.955568313598633, "global_step": 5230, "epoch": 31} {"train_loss": -5.150848388671875, "global_step": 5231, "epoch": 31} {"train_loss": -5.104214668273926, "global_step": 5232, "epoch": 31} {"train_loss": -5.063941478729248, "global_step": 5233, "epoch": 31} {"train_loss": -5.0261664390563965, "global_step": 5234, "epoch": 31} {"train_loss": -5.227019309997559, "global_step": 5235, "epoch": 31} {"train_loss": -5.1931376457214355, "global_step": 5236, "epoch": 31} {"train_loss": -5.058195114135742, "global_step": 5237, "epoch": 31} {"train_loss": -5.08967924118042, "global_step": 5238, "epoch": 31} {"train_loss": -5.072850227355957, "global_step": 5239, "epoch": 31} {"train_loss": -4.914767265319824, "global_step": 5240, "epoch": 31} {"train_loss": -4.909794807434082, "global_step": 5241, "epoch": 31} {"train_loss": -5.062046051025391, "global_step": 5242, "epoch": 31} {"train_loss": -4.919597625732422, "global_step": 5243, "epoch": 31} {"train_loss": -4.879339694976807, "global_step": 5244, "epoch": 31} {"train_loss": -5.008459091186523, "global_step": 5245, "epoch": 31} {"train_loss": -5.029694557189941, "global_step": 5246, "epoch": 31} {"train_loss": -5.1066741943359375, "global_step": 5247, "epoch": 31} {"train_loss": -4.867114067077637, "global_step": 5248, "epoch": 31} {"train_loss": -4.915920734405518, "global_step": 5249, "epoch": 31} {"train_loss": -5.203486442565918, "global_step": 5250, "epoch": 31} {"train_loss": -4.882155895233154, "global_step": 5251, "epoch": 31} {"train_loss": -4.9347639083862305, "global_step": 5252, "epoch": 31} {"train_loss": -5.016302108764648, "global_step": 5253, "epoch": 31} {"train_loss": -5.252605438232422, "global_step": 5254, "epoch": 31} {"train_loss": -5.117849349975586, "global_step": 5255, "epoch": 31} {"train_loss": -4.992153644561768, "global_step": 5256, "epoch": 31} {"train_loss": -4.978305816650391, "global_step": 5257, "epoch": 31} {"train_loss": -5.141348838806152, "global_step": 5258, "epoch": 31} {"train_loss": -5.203758239746094, "global_step": 5259, "epoch": 31} {"train_loss": -5.026001453399658, "global_step": 5260, "epoch": 31} {"train_loss": -5.139019966125488, "global_step": 5261, "epoch": 31} {"train_loss": -5.05626106262207, "global_step": 5262, "epoch": 31} {"train_loss": -5.110100746154785, "global_step": 5263, "epoch": 31} {"train_loss": -5.15233039855957, "global_step": 5264, "epoch": 31} {"train_loss": -4.996799468994141, "global_step": 5265, "epoch": 31} {"train_loss": -5.002427577972412, "global_step": 5266, "epoch": 31} {"train_loss": -5.146742820739746, "global_step": 5267, "epoch": 31} {"train_loss": -5.146932125091553, "global_step": 5268, "epoch": 31} {"train_loss": -4.812854290008545, "global_step": 5269, "epoch": 31} {"train_loss": -4.987685680389404, "global_step": 5270, "epoch": 31} {"train_loss": -4.958114147186279, "global_step": 5271, "epoch": 31} {"train_loss": -5.2369585037231445, "global_step": 5272, "epoch": 31} {"train_loss": -5.147848129272461, "global_step": 5273, "epoch": 31} {"train_loss": -5.202145099639893, "global_step": 5274, "epoch": 31} {"train_loss": -4.916445732116699, "global_step": 5275, "epoch": 31} {"train_loss": -5.043323516845703, "global_step": 5276, "epoch": 31} {"train_loss": -5.045877456665039, "global_step": 5277, "epoch": 31} {"train_loss": -4.8321051597595215, "global_step": 5278, "epoch": 31} {"train_loss": -4.934619426727295, "global_step": 5279, "epoch": 31} {"train_loss": -4.820522308349609, "global_step": 5280, "epoch": 31} {"train_loss": -5.041724681854248, "global_step": 5281, "epoch": 31} {"train_loss": -5.205894470214844, "global_step": 5282, "epoch": 31} {"train_loss": -5.081267356872559, "global_step": 5283, "epoch": 31} {"train_loss": -5.025288105010986, "global_step": 5284, "epoch": 31} {"train_loss": -5.225498199462891, "global_step": 5285, "epoch": 31} {"train_loss": -4.981842994689941, "global_step": 5286, "epoch": 31} {"train_loss": -5.356939792633057, "global_step": 5287, "epoch": 31} {"train_loss": -4.87358283996582, "global_step": 5288, "epoch": 31} {"train_loss": -5.108294486999512, "global_step": 5289, "epoch": 31} {"train_loss": -4.82832145690918, "global_step": 5290, "epoch": 31} {"train_loss": -4.797307968139648, "global_step": 5291, "epoch": 31} {"train_loss": -5.226426124572754, "global_step": 5292, "epoch": 31} {"train_loss": -4.687985420227051, "global_step": 5293, "epoch": 31} {"train_loss": -5.2721028327941895, "global_step": 5294, "epoch": 31} {"train_loss": -4.857713222503662, "global_step": 5295, "epoch": 31} {"train_loss": -5.091416358947754, "global_step": 5296, "epoch": 31} {"train_loss": -4.878437042236328, "global_step": 5297, "epoch": 31} {"train_loss": -4.612022399902344, "global_step": 5298, "epoch": 31} {"train_loss": -5.029605865478516, "global_step": 5299, "epoch": 31} {"train_loss": -4.920798301696777, "global_step": 5300, "epoch": 31} {"train_loss": -4.928431510925293, "global_step": 5301, "epoch": 31} {"train_loss": -5.0173492431640625, "global_step": 5302, "epoch": 31} {"train_loss": -4.802718162536621, "global_step": 5303, "epoch": 31} {"train_loss": -4.734116554260254, "global_step": 5304, "epoch": 31} {"train_loss": -4.987163543701172, "global_step": 5305, "epoch": 31} {"train_loss": -5.008628845214844, "global_step": 5306, "epoch": 31} {"train_loss": -4.763948917388916, "global_step": 5307, "epoch": 31} {"train_loss": -5.1069536209106445, "global_step": 5308, "epoch": 31} {"train_loss": -5.031950950622559, "global_step": 5309, "epoch": 31} {"train_loss": -4.7942118644714355, "global_step": 5310, "epoch": 31} {"train_loss": -5.002431869506836, "global_step": 5311, "epoch": 31} {"train_loss": -4.8821940422058105, "global_step": 5312, "epoch": 31} {"train_loss": -4.899546146392822, "global_step": 5313, "epoch": 31} {"train_loss": -4.924999237060547, "global_step": 5314, "epoch": 31} {"train_loss": -5.003689289093018, "global_step": 5315, "epoch": 31} {"train_loss": -5.0702643394470215, "global_step": 5316, "epoch": 31} {"train_loss": -4.801153182983398, "global_step": 5317, "epoch": 31} {"train_loss": -4.9558916091918945, "global_step": 5318, "epoch": 31} {"train_loss": -5.159203052520752, "global_step": 5319, "epoch": 31} {"train_loss": -5.078218460083008, "global_step": 5320, "epoch": 31} {"train_loss": -4.999526023864746, "global_step": 5321, "epoch": 31} {"train_loss": -5.097856044769287, "global_step": 5322, "epoch": 31} {"train_loss": -5.029550552368164, "global_step": 5323, "epoch": 31} {"train_loss": -5.015057563781738, "global_step": 5324, "epoch": 31} {"train_loss": -4.864468574523926, "global_step": 5325, "epoch": 31} {"train_loss": -4.971808910369873, "global_step": 5326, "epoch": 31} {"train_loss": -4.994060516357422, "global_step": 5327, "epoch": 31} {"train_loss": -4.851231575012207, "global_step": 5328, "epoch": 31} {"train_loss": -5.07518196105957, "global_step": 5329, "epoch": 31} {"train_loss": -4.863849639892578, "global_step": 5330, "epoch": 31} {"train_loss": -4.794310569763184, "global_step": 5331, "epoch": 31} {"train_loss": -5.132959365844727, "global_step": 5332, "epoch": 31} {"train_loss": -4.987653732299805, "global_step": 5333, "epoch": 31} {"train_loss": -5.20948600769043, "global_step": 5334, "epoch": 31} {"train_loss": -4.858414649963379, "global_step": 5335, "epoch": 31} {"train_loss": -4.8023271560668945, "global_step": 5336, "epoch": 31} {"train_loss": -5.198355674743652, "global_step": 5337, "epoch": 31} {"train_loss": -5.018660068511963, "global_step": 5338, "epoch": 31} {"train_loss": -5.192481994628906, "global_step": 5339, "epoch": 31} {"train_loss": -4.982885360717773, "global_step": 5340, "epoch": 31} {"train_loss": -5.144204139709473, "global_step": 5341, "epoch": 31} {"train_loss": -5.044308662414551, "global_step": 5342, "epoch": 31} {"train_loss": -5.070266246795654, "global_step": 5343, "epoch": 31} {"train_loss": -5.055767059326172, "global_step": 5344, "epoch": 31} {"train_loss": -5.0537567138671875, "global_step": 5345, "epoch": 31} {"train_loss": -5.128273010253906, "global_step": 5346, "epoch": 31} {"train_loss": -4.771824836730957, "global_step": 5347, "epoch": 31} {"train_loss": -5.08210563659668, "global_step": 5348, "epoch": 31} {"train_loss": -4.931999206542969, "global_step": 5349, "epoch": 31} {"train_loss": -5.037710189819336, "global_step": 5350, "epoch": 31} {"train_loss": -4.856868743896484, "global_step": 5351, "epoch": 31} {"train_loss": -4.951670169830322, "global_step": 5352, "epoch": 31} {"train_loss": -5.114630699157715, "global_step": 5353, "epoch": 31} {"train_loss": -5.015766620635986, "global_step": 5354, "epoch": 31} {"train_loss": -4.962891578674316, "global_step": 5355, "epoch": 31} {"train_loss": -5.0848846435546875, "global_step": 5356, "epoch": 31} {"train_loss": -4.815512657165527, "global_step": 5357, "epoch": 31} {"train_loss": -4.747371673583984, "global_step": 5358, "epoch": 31} {"train_loss": -4.898863792419434, "global_step": 5359, "epoch": 31} {"train_loss": -4.841188430786133, "global_step": 5360, "epoch": 31} {"train_loss": -5.035343170166016, "global_step": 5361, "epoch": 31} {"train_loss": -4.963996410369873, "global_step": 5362, "epoch": 31} {"train_loss": -4.950891494750977, "global_step": 5363, "epoch": 31} {"train_loss": -4.84495735168457, "global_step": 5364, "epoch": 31} {"train_loss": -4.996561527252197, "global_step": 5365, "epoch": 31} {"train_loss": -5.089151382446289, "global_step": 5366, "epoch": 31} {"train_loss": -5.106488227844238, "global_step": 5367, "epoch": 31} {"train_loss": -4.974207878112793, "global_step": 5368, "epoch": 31} {"train_loss": -5.0036492347717285, "global_step": 5369, "epoch": 31} {"train_loss": -4.998839855194092, "global_step": 5370, "epoch": 31} {"train_loss": -5.170904636383057, "global_step": 5371, "epoch": 31} {"train_loss": -5.036809921264648, "global_step": 5372, "epoch": 31} {"train_loss": -5.236715316772461, "global_step": 5373, "epoch": 31} {"train_loss": -4.9976701736450195, "global_step": 5374, "epoch": 31} {"train_loss": -5.003153236139388, "global_step": 5375, "epoch": 31, "val_loss": 254539.28125} {"train_loss": -4.719834327697754, "global_step": 5376, "epoch": 32} {"train_loss": -4.907806873321533, "global_step": 5377, "epoch": 32} {"train_loss": -5.167453765869141, "global_step": 5378, "epoch": 32} {"train_loss": -4.9032135009765625, "global_step": 5379, "epoch": 32} {"train_loss": -5.296268939971924, "global_step": 5380, "epoch": 32} {"train_loss": -5.014422416687012, "global_step": 5381, "epoch": 32} {"train_loss": -5.0916852951049805, "global_step": 5382, "epoch": 32} {"train_loss": -5.29245662689209, "global_step": 5383, "epoch": 32} {"train_loss": -4.885097503662109, "global_step": 5384, "epoch": 32} {"train_loss": -5.186535835266113, "global_step": 5385, "epoch": 32} {"train_loss": -5.147202491760254, "global_step": 5386, "epoch": 32} {"train_loss": -4.9706573486328125, "global_step": 5387, "epoch": 32} {"train_loss": -5.254281520843506, "global_step": 5388, "epoch": 32} {"train_loss": -4.808807849884033, "global_step": 5389, "epoch": 32} {"train_loss": -5.124387741088867, "global_step": 5390, "epoch": 32} {"train_loss": -4.692594528198242, "global_step": 5391, "epoch": 32} {"train_loss": -4.969635963439941, "global_step": 5392, "epoch": 32} {"train_loss": -4.980621814727783, "global_step": 5393, "epoch": 32} {"train_loss": -4.753104209899902, "global_step": 5394, "epoch": 32} {"train_loss": -5.073224067687988, "global_step": 5395, "epoch": 32} {"train_loss": -5.046634674072266, "global_step": 5396, "epoch": 32} {"train_loss": -4.996201515197754, "global_step": 5397, "epoch": 32} {"train_loss": -5.10988187789917, "global_step": 5398, "epoch": 32} {"train_loss": -5.070036888122559, "global_step": 5399, "epoch": 32} {"train_loss": -4.9008989334106445, "global_step": 5400, "epoch": 32} {"train_loss": -4.930689811706543, "global_step": 5401, "epoch": 32} {"train_loss": -5.1161909103393555, "global_step": 5402, "epoch": 32} {"train_loss": -5.122112274169922, "global_step": 5403, "epoch": 32} {"train_loss": -4.730266571044922, "global_step": 5404, "epoch": 32} {"train_loss": -4.890768527984619, "global_step": 5405, "epoch": 32} {"train_loss": -4.972169876098633, "global_step": 5406, "epoch": 32} {"train_loss": -4.8927178382873535, "global_step": 5407, "epoch": 32} {"train_loss": -5.09392786026001, "global_step": 5408, "epoch": 32} {"train_loss": -4.958159446716309, "global_step": 5409, "epoch": 32} {"train_loss": -4.7888360023498535, "global_step": 5410, "epoch": 32} {"train_loss": -5.138649940490723, "global_step": 5411, "epoch": 32} {"train_loss": -5.091484546661377, "global_step": 5412, "epoch": 32} {"train_loss": -5.096005916595459, "global_step": 5413, "epoch": 32} {"train_loss": -5.098606586456299, "global_step": 5414, "epoch": 32} {"train_loss": -5.285440444946289, "global_step": 5415, "epoch": 32} {"train_loss": -5.2375640869140625, "global_step": 5416, "epoch": 32} {"train_loss": -5.175357818603516, "global_step": 5417, "epoch": 32} {"train_loss": -5.143654823303223, "global_step": 5418, "epoch": 32} {"train_loss": -4.9532575607299805, "global_step": 5419, "epoch": 32} {"train_loss": -5.121870517730713, "global_step": 5420, "epoch": 32} {"train_loss": -5.0543317794799805, "global_step": 5421, "epoch": 32} {"train_loss": -4.963397979736328, "global_step": 5422, "epoch": 32} {"train_loss": -5.029843807220459, "global_step": 5423, "epoch": 32} {"train_loss": -5.188305854797363, "global_step": 5424, "epoch": 32} {"train_loss": -4.943833827972412, "global_step": 5425, "epoch": 32} {"train_loss": -4.7583208084106445, "global_step": 5426, "epoch": 32} {"train_loss": -5.16795539855957, "global_step": 5427, "epoch": 32} {"train_loss": -4.882874011993408, "global_step": 5428, "epoch": 32} {"train_loss": -5.248386383056641, "global_step": 5429, "epoch": 32} {"train_loss": -4.9728922843933105, "global_step": 5430, "epoch": 32} {"train_loss": -5.2707037925720215, "global_step": 5431, "epoch": 32} {"train_loss": -4.952876091003418, "global_step": 5432, "epoch": 32} {"train_loss": -5.229660987854004, "global_step": 5433, "epoch": 32} {"train_loss": -4.990634918212891, "global_step": 5434, "epoch": 32} {"train_loss": -5.182779312133789, "global_step": 5435, "epoch": 32} {"train_loss": -4.979914665222168, "global_step": 5436, "epoch": 32} {"train_loss": -5.09121561050415, "global_step": 5437, "epoch": 32} {"train_loss": -4.91648006439209, "global_step": 5438, "epoch": 32} {"train_loss": -5.07056188583374, "global_step": 5439, "epoch": 32} {"train_loss": -4.971773147583008, "global_step": 5440, "epoch": 32} {"train_loss": -4.976718902587891, "global_step": 5441, "epoch": 32} {"train_loss": -5.132651329040527, "global_step": 5442, "epoch": 32} {"train_loss": -5.066643714904785, "global_step": 5443, "epoch": 32} {"train_loss": -5.069818496704102, "global_step": 5444, "epoch": 32} {"train_loss": -4.932556629180908, "global_step": 5445, "epoch": 32} {"train_loss": -5.137943267822266, "global_step": 5446, "epoch": 32} {"train_loss": -4.9940080642700195, "global_step": 5447, "epoch": 32} {"train_loss": -4.918496608734131, "global_step": 5448, "epoch": 32} {"train_loss": -5.191813945770264, "global_step": 5449, "epoch": 32} {"train_loss": -5.057729721069336, "global_step": 5450, "epoch": 32} {"train_loss": -4.983550071716309, "global_step": 5451, "epoch": 32} {"train_loss": -4.872610092163086, "global_step": 5452, "epoch": 32} {"train_loss": -5.3474955558776855, "global_step": 5453, "epoch": 32} {"train_loss": -5.273702144622803, "global_step": 5454, "epoch": 32} {"train_loss": -5.214377403259277, "global_step": 5455, "epoch": 32} {"train_loss": -5.221768856048584, "global_step": 5456, "epoch": 32} {"train_loss": -5.350053310394287, "global_step": 5457, "epoch": 32} {"train_loss": -5.203248500823975, "global_step": 5458, "epoch": 32} {"train_loss": -5.299839019775391, "global_step": 5459, "epoch": 32} {"train_loss": -4.906739234924316, "global_step": 5460, "epoch": 32} {"train_loss": -5.048117637634277, "global_step": 5461, "epoch": 32} {"train_loss": -5.243422031402588, "global_step": 5462, "epoch": 32} {"train_loss": -5.547795295715332, "global_step": 5463, "epoch": 32} {"train_loss": -5.247034549713135, "global_step": 5464, "epoch": 32} {"train_loss": -5.147010326385498, "global_step": 5465, "epoch": 32} {"train_loss": -5.478689193725586, "global_step": 5466, "epoch": 32} {"train_loss": -5.063458442687988, "global_step": 5467, "epoch": 32} {"train_loss": -5.241667747497559, "global_step": 5468, "epoch": 32} {"train_loss": -5.190832614898682, "global_step": 5469, "epoch": 32} {"train_loss": -5.255083084106445, "global_step": 5470, "epoch": 32} {"train_loss": -4.966504096984863, "global_step": 5471, "epoch": 32} {"train_loss": -5.254024982452393, "global_step": 5472, "epoch": 32} {"train_loss": -5.303567886352539, "global_step": 5473, "epoch": 32} {"train_loss": -4.8715105056762695, "global_step": 5474, "epoch": 32} {"train_loss": -4.854564666748047, "global_step": 5475, "epoch": 32} {"train_loss": -4.99830436706543, "global_step": 5476, "epoch": 32} {"train_loss": -5.103517532348633, "global_step": 5477, "epoch": 32} {"train_loss": -4.750662326812744, "global_step": 5478, "epoch": 32} {"train_loss": -4.923234462738037, "global_step": 5479, "epoch": 32} {"train_loss": -4.9785661697387695, "global_step": 5480, "epoch": 32} {"train_loss": -4.810636043548584, "global_step": 5481, "epoch": 32} {"train_loss": -4.994142532348633, "global_step": 5482, "epoch": 32} {"train_loss": -4.4860429763793945, "global_step": 5483, "epoch": 32} {"train_loss": -5.056824684143066, "global_step": 5484, "epoch": 32} {"train_loss": -5.049263000488281, "global_step": 5485, "epoch": 32} {"train_loss": -4.980898857116699, "global_step": 5486, "epoch": 32} {"train_loss": -4.999547958374023, "global_step": 5487, "epoch": 32} {"train_loss": -4.9401984214782715, "global_step": 5488, "epoch": 32} {"train_loss": -4.856385707855225, "global_step": 5489, "epoch": 32} {"train_loss": -5.000308036804199, "global_step": 5490, "epoch": 32} {"train_loss": -4.884990692138672, "global_step": 5491, "epoch": 32} {"train_loss": -5.1602678298950195, "global_step": 5492, "epoch": 32} {"train_loss": -4.9971394538879395, "global_step": 5493, "epoch": 32} {"train_loss": -4.974908351898193, "global_step": 5494, "epoch": 32} {"train_loss": -5.296599388122559, "global_step": 5495, "epoch": 32} {"train_loss": -5.060517311096191, "global_step": 5496, "epoch": 32} {"train_loss": -5.174429893493652, "global_step": 5497, "epoch": 32} {"train_loss": -5.069210529327393, "global_step": 5498, "epoch": 32} {"train_loss": -5.050902366638184, "global_step": 5499, "epoch": 32} {"train_loss": -5.236037731170654, "global_step": 5500, "epoch": 32} {"train_loss": -4.98960542678833, "global_step": 5501, "epoch": 32} {"train_loss": -5.012418746948242, "global_step": 5502, "epoch": 32} {"train_loss": -5.247426986694336, "global_step": 5503, "epoch": 32} {"train_loss": -4.869270324707031, "global_step": 5504, "epoch": 32} {"train_loss": -4.757116317749023, "global_step": 5505, "epoch": 32} {"train_loss": -5.118201732635498, "global_step": 5506, "epoch": 32} {"train_loss": -4.874107837677002, "global_step": 5507, "epoch": 32} {"train_loss": -4.961543083190918, "global_step": 5508, "epoch": 32} {"train_loss": -5.416107177734375, "global_step": 5509, "epoch": 32} {"train_loss": -5.194609642028809, "global_step": 5510, "epoch": 32} {"train_loss": -5.061293601989746, "global_step": 5511, "epoch": 32} {"train_loss": -5.366617202758789, "global_step": 5512, "epoch": 32} {"train_loss": -4.958730220794678, "global_step": 5513, "epoch": 32} {"train_loss": -5.152899742126465, "global_step": 5514, "epoch": 32} {"train_loss": -5.134757041931152, "global_step": 5515, "epoch": 32} {"train_loss": -5.296623706817627, "global_step": 5516, "epoch": 32} {"train_loss": -4.951597213745117, "global_step": 5517, "epoch": 32} {"train_loss": -5.116749286651611, "global_step": 5518, "epoch": 32} {"train_loss": -5.320857048034668, "global_step": 5519, "epoch": 32} {"train_loss": -5.17716121673584, "global_step": 5520, "epoch": 32} {"train_loss": -4.946596145629883, "global_step": 5521, "epoch": 32} {"train_loss": -5.097963333129883, "global_step": 5522, "epoch": 32} {"train_loss": -4.993420600891113, "global_step": 5523, "epoch": 32} {"train_loss": -5.137269973754883, "global_step": 5524, "epoch": 32} {"train_loss": -5.116637229919434, "global_step": 5525, "epoch": 32} {"train_loss": -5.112930774688721, "global_step": 5526, "epoch": 32} {"train_loss": -4.95927619934082, "global_step": 5527, "epoch": 32} {"train_loss": -4.8152337074279785, "global_step": 5528, "epoch": 32} {"train_loss": -4.991257667541504, "global_step": 5529, "epoch": 32} {"train_loss": -4.958441734313965, "global_step": 5530, "epoch": 32} {"train_loss": -4.859044075012207, "global_step": 5531, "epoch": 32} {"train_loss": -5.128215789794922, "global_step": 5532, "epoch": 32} {"train_loss": -5.192586898803711, "global_step": 5533, "epoch": 32} {"train_loss": -5.209959983825684, "global_step": 5534, "epoch": 32} {"train_loss": -5.129736423492432, "global_step": 5535, "epoch": 32} {"train_loss": -5.168494701385498, "global_step": 5536, "epoch": 32} {"train_loss": -4.907310962677002, "global_step": 5537, "epoch": 32} {"train_loss": -4.993556976318359, "global_step": 5538, "epoch": 32} {"train_loss": -5.243089199066162, "global_step": 5539, "epoch": 32} {"train_loss": -5.284658432006836, "global_step": 5540, "epoch": 32} {"train_loss": -5.404839038848877, "global_step": 5541, "epoch": 32} {"train_loss": -5.1539812088012695, "global_step": 5542, "epoch": 32} {"train_loss": -5.061745388167245, "global_step": 5543, "epoch": 32, "val_loss": 262073.765625} {"train_loss": -5.017172813415527, "global_step": 5544, "epoch": 33} {"train_loss": -5.1891984939575195, "global_step": 5545, "epoch": 33} {"train_loss": -5.25258731842041, "global_step": 5546, "epoch": 33} {"train_loss": -5.192317008972168, "global_step": 5547, "epoch": 33} {"train_loss": -5.066683769226074, "global_step": 5548, "epoch": 33} {"train_loss": -5.0430073738098145, "global_step": 5549, "epoch": 33} {"train_loss": -4.975214958190918, "global_step": 5550, "epoch": 33} {"train_loss": -5.017394542694092, "global_step": 5551, "epoch": 33} {"train_loss": -5.172663688659668, "global_step": 5552, "epoch": 33} {"train_loss": -4.927982330322266, "global_step": 5553, "epoch": 33} {"train_loss": -5.066656112670898, "global_step": 5554, "epoch": 33} {"train_loss": -5.0998945236206055, "global_step": 5555, "epoch": 33} {"train_loss": -5.1287312507629395, "global_step": 5556, "epoch": 33} {"train_loss": -4.959162712097168, "global_step": 5557, "epoch": 33} {"train_loss": -5.219294548034668, "global_step": 5558, "epoch": 33} {"train_loss": -5.324949264526367, "global_step": 5559, "epoch": 33} {"train_loss": -5.243838787078857, "global_step": 5560, "epoch": 33} {"train_loss": -5.268064498901367, "global_step": 5561, "epoch": 33} {"train_loss": -5.444364070892334, "global_step": 5562, "epoch": 33} {"train_loss": -5.164116859436035, "global_step": 5563, "epoch": 33} {"train_loss": -5.295012474060059, "global_step": 5564, "epoch": 33} {"train_loss": -5.235538482666016, "global_step": 5565, "epoch": 33} {"train_loss": -5.004823684692383, "global_step": 5566, "epoch": 33} {"train_loss": -5.291670799255371, "global_step": 5567, "epoch": 33} {"train_loss": -5.169040679931641, "global_step": 5568, "epoch": 33} {"train_loss": -5.327840328216553, "global_step": 5569, "epoch": 33} {"train_loss": -5.034572601318359, "global_step": 5570, "epoch": 33} {"train_loss": -5.137485504150391, "global_step": 5571, "epoch": 33} {"train_loss": -4.919075012207031, "global_step": 5572, "epoch": 33} {"train_loss": -5.272286891937256, "global_step": 5573, "epoch": 33} {"train_loss": -5.083893775939941, "global_step": 5574, "epoch": 33} {"train_loss": -4.925553321838379, "global_step": 5575, "epoch": 33} {"train_loss": -5.058498382568359, "global_step": 5576, "epoch": 33} {"train_loss": -4.904735088348389, "global_step": 5577, "epoch": 33} {"train_loss": -5.197349548339844, "global_step": 5578, "epoch": 33} {"train_loss": -5.211235046386719, "global_step": 5579, "epoch": 33} {"train_loss": -5.061620712280273, "global_step": 5580, "epoch": 33} {"train_loss": -4.968273162841797, "global_step": 5581, "epoch": 33} {"train_loss": -5.21002197265625, "global_step": 5582, "epoch": 33} {"train_loss": -5.027558326721191, "global_step": 5583, "epoch": 33} {"train_loss": -5.030892372131348, "global_step": 5584, "epoch": 33} {"train_loss": -5.0787553787231445, "global_step": 5585, "epoch": 33} {"train_loss": -5.245691299438477, "global_step": 5586, "epoch": 33} {"train_loss": -4.9534101486206055, "global_step": 5587, "epoch": 33} {"train_loss": -5.131411552429199, "global_step": 5588, "epoch": 33} {"train_loss": -5.174202919006348, "global_step": 5589, "epoch": 33} {"train_loss": -5.090498447418213, "global_step": 5590, "epoch": 33} {"train_loss": -5.307162284851074, "global_step": 5591, "epoch": 33} {"train_loss": -5.1260199546813965, "global_step": 5592, "epoch": 33} {"train_loss": -5.2323808670043945, "global_step": 5593, "epoch": 33} {"train_loss": -5.177755355834961, "global_step": 5594, "epoch": 33} {"train_loss": -4.993870735168457, "global_step": 5595, "epoch": 33} {"train_loss": -4.973301887512207, "global_step": 5596, "epoch": 33} {"train_loss": -5.110668659210205, "global_step": 5597, "epoch": 33} {"train_loss": -4.9520769119262695, "global_step": 5598, "epoch": 33} {"train_loss": -5.1326398849487305, "global_step": 5599, "epoch": 33} {"train_loss": -5.028926849365234, "global_step": 5600, "epoch": 33} {"train_loss": -5.275558948516846, "global_step": 5601, "epoch": 33} {"train_loss": -4.916074275970459, "global_step": 5602, "epoch": 33} {"train_loss": -5.195470333099365, "global_step": 5603, "epoch": 33} {"train_loss": -5.2675018310546875, "global_step": 5604, "epoch": 33} {"train_loss": -4.902798652648926, "global_step": 5605, "epoch": 33} {"train_loss": -4.887328624725342, "global_step": 5606, "epoch": 33} {"train_loss": -5.417766571044922, "global_step": 5607, "epoch": 33} {"train_loss": -5.075777053833008, "global_step": 5608, "epoch": 33} {"train_loss": -5.1135101318359375, "global_step": 5609, "epoch": 33} {"train_loss": -5.1802520751953125, "global_step": 5610, "epoch": 33} {"train_loss": -4.950814247131348, "global_step": 5611, "epoch": 33} {"train_loss": -5.18613862991333, "global_step": 5612, "epoch": 33} {"train_loss": -4.9060211181640625, "global_step": 5613, "epoch": 33} {"train_loss": -5.03804874420166, "global_step": 5614, "epoch": 33} {"train_loss": -5.074059009552002, "global_step": 5615, "epoch": 33} {"train_loss": -4.801412105560303, "global_step": 5616, "epoch": 33} {"train_loss": -4.977965354919434, "global_step": 5617, "epoch": 33} {"train_loss": -5.156158447265625, "global_step": 5618, "epoch": 33} {"train_loss": -5.172967433929443, "global_step": 5619, "epoch": 33} {"train_loss": -4.887286186218262, "global_step": 5620, "epoch": 33} {"train_loss": -5.014761924743652, "global_step": 5621, "epoch": 33} {"train_loss": -5.163175582885742, "global_step": 5622, "epoch": 33} {"train_loss": -5.258474826812744, "global_step": 5623, "epoch": 33} {"train_loss": -5.103410243988037, "global_step": 5624, "epoch": 33} {"train_loss": -5.386270999908447, "global_step": 5625, "epoch": 33} {"train_loss": -5.039094924926758, "global_step": 5626, "epoch": 33} {"train_loss": -5.185310363769531, "global_step": 5627, "epoch": 33} {"train_loss": -4.864072322845459, "global_step": 5628, "epoch": 33} {"train_loss": -4.970183372497559, "global_step": 5629, "epoch": 33} {"train_loss": -4.833036422729492, "global_step": 5630, "epoch": 33} {"train_loss": -5.142758369445801, "global_step": 5631, "epoch": 33} {"train_loss": -5.1313300132751465, "global_step": 5632, "epoch": 33} {"train_loss": -4.987030029296875, "global_step": 5633, "epoch": 33} {"train_loss": -5.020545959472656, "global_step": 5634, "epoch": 33} {"train_loss": -4.996469497680664, "global_step": 5635, "epoch": 33} {"train_loss": -4.999958038330078, "global_step": 5636, "epoch": 33} {"train_loss": -4.981789588928223, "global_step": 5637, "epoch": 33} {"train_loss": -4.732903480529785, "global_step": 5638, "epoch": 33} {"train_loss": -5.062515735626221, "global_step": 5639, "epoch": 33} {"train_loss": -4.701709747314453, "global_step": 5640, "epoch": 33} {"train_loss": -4.943356990814209, "global_step": 5641, "epoch": 33} {"train_loss": -5.108994007110596, "global_step": 5642, "epoch": 33} {"train_loss": -4.995594024658203, "global_step": 5643, "epoch": 33} {"train_loss": -5.127671241760254, "global_step": 5644, "epoch": 33} {"train_loss": -4.780647277832031, "global_step": 5645, "epoch": 33} {"train_loss": -4.9680070877075195, "global_step": 5646, "epoch": 33} {"train_loss": -4.972297668457031, "global_step": 5647, "epoch": 33} {"train_loss": -5.034645080566406, "global_step": 5648, "epoch": 33} {"train_loss": -4.983659744262695, "global_step": 5649, "epoch": 33} {"train_loss": -5.179207801818848, "global_step": 5650, "epoch": 33} {"train_loss": -4.67452335357666, "global_step": 5651, "epoch": 33} {"train_loss": -4.9457902908325195, "global_step": 5652, "epoch": 33} {"train_loss": -5.237077236175537, "global_step": 5653, "epoch": 33} {"train_loss": -4.828624248504639, "global_step": 5654, "epoch": 33} {"train_loss": -5.029447555541992, "global_step": 5655, "epoch": 33} {"train_loss": -4.6265435218811035, "global_step": 5656, "epoch": 33} {"train_loss": -4.964789867401123, "global_step": 5657, "epoch": 33} {"train_loss": -5.258453369140625, "global_step": 5658, "epoch": 33} {"train_loss": -4.773911952972412, "global_step": 5659, "epoch": 33} {"train_loss": -5.180389881134033, "global_step": 5660, "epoch": 33} {"train_loss": -5.260626792907715, "global_step": 5661, "epoch": 33} {"train_loss": -5.22403621673584, "global_step": 5662, "epoch": 33} {"train_loss": -5.280796051025391, "global_step": 5663, "epoch": 33} {"train_loss": -5.294086933135986, "global_step": 5664, "epoch": 33} {"train_loss": -5.351391792297363, "global_step": 5665, "epoch": 33} {"train_loss": -5.202693462371826, "global_step": 5666, "epoch": 33} {"train_loss": -5.14210319519043, "global_step": 5667, "epoch": 33} {"train_loss": -4.904059886932373, "global_step": 5668, "epoch": 33} {"train_loss": -4.9112868309021, "global_step": 5669, "epoch": 33} {"train_loss": -5.093389511108398, "global_step": 5670, "epoch": 33} {"train_loss": -5.291069030761719, "global_step": 5671, "epoch": 33} {"train_loss": -5.343830108642578, "global_step": 5672, "epoch": 33} {"train_loss": -5.2227702140808105, "global_step": 5673, "epoch": 33} {"train_loss": -5.169377326965332, "global_step": 5674, "epoch": 33} {"train_loss": -4.926890850067139, "global_step": 5675, "epoch": 33} {"train_loss": -5.002199172973633, "global_step": 5676, "epoch": 33} {"train_loss": -5.118064880371094, "global_step": 5677, "epoch": 33} {"train_loss": -4.827672004699707, "global_step": 5678, "epoch": 33} {"train_loss": -5.385688304901123, "global_step": 5679, "epoch": 33} {"train_loss": -5.199836730957031, "global_step": 5680, "epoch": 33} {"train_loss": -4.9224677085876465, "global_step": 5681, "epoch": 33} {"train_loss": -4.999133110046387, "global_step": 5682, "epoch": 33} {"train_loss": -5.156495094299316, "global_step": 5683, "epoch": 33} {"train_loss": -4.964933395385742, "global_step": 5684, "epoch": 33} {"train_loss": -5.058815002441406, "global_step": 5685, "epoch": 33} {"train_loss": -4.71484375, "global_step": 5686, "epoch": 33} {"train_loss": -5.039892196655273, "global_step": 5687, "epoch": 33} {"train_loss": -5.130523681640625, "global_step": 5688, "epoch": 33} {"train_loss": -5.0711774826049805, "global_step": 5689, "epoch": 33} {"train_loss": -5.086820602416992, "global_step": 5690, "epoch": 33} {"train_loss": -4.89874267578125, "global_step": 5691, "epoch": 33} {"train_loss": -4.6909685134887695, "global_step": 5692, "epoch": 33} {"train_loss": -4.717010498046875, "global_step": 5693, "epoch": 33} {"train_loss": -4.7329277992248535, "global_step": 5694, "epoch": 33} {"train_loss": -5.140478134155273, "global_step": 5695, "epoch": 33} {"train_loss": -5.099202632904053, "global_step": 5696, "epoch": 33} {"train_loss": -4.890968322753906, "global_step": 5697, "epoch": 33} {"train_loss": -4.893265247344971, "global_step": 5698, "epoch": 33} {"train_loss": -4.792666435241699, "global_step": 5699, "epoch": 33} {"train_loss": -5.263812065124512, "global_step": 5700, "epoch": 33} {"train_loss": -4.81094217300415, "global_step": 5701, "epoch": 33} {"train_loss": -4.818411827087402, "global_step": 5702, "epoch": 33} {"train_loss": -5.165402412414551, "global_step": 5703, "epoch": 33} {"train_loss": -4.715251922607422, "global_step": 5704, "epoch": 33} {"train_loss": -5.14617919921875, "global_step": 5705, "epoch": 33} {"train_loss": -5.27906608581543, "global_step": 5706, "epoch": 33} {"train_loss": -5.011898994445801, "global_step": 5707, "epoch": 33} {"train_loss": -4.892136096954346, "global_step": 5708, "epoch": 33} {"train_loss": -5.181911468505859, "global_step": 5709, "epoch": 33} {"train_loss": -5.099238395690918, "global_step": 5710, "epoch": 33} {"train_loss": -5.065493282817659, "global_step": 5711, "epoch": 33, "val_loss": 276568.78125} {"train_loss": -5.193086624145508, "global_step": 5712, "epoch": 34} {"train_loss": -5.4051079750061035, "global_step": 5713, "epoch": 34} {"train_loss": -5.384856700897217, "global_step": 5714, "epoch": 34} {"train_loss": -5.060245990753174, "global_step": 5715, "epoch": 34} {"train_loss": -5.273406028747559, "global_step": 5716, "epoch": 34} {"train_loss": -5.237360954284668, "global_step": 5717, "epoch": 34} {"train_loss": -5.150501251220703, "global_step": 5718, "epoch": 34} {"train_loss": -4.836650848388672, "global_step": 5719, "epoch": 34} {"train_loss": -5.279453754425049, "global_step": 5720, "epoch": 34} {"train_loss": -5.23193883895874, "global_step": 5721, "epoch": 34} {"train_loss": -4.995155334472656, "global_step": 5722, "epoch": 34} {"train_loss": -4.892949104309082, "global_step": 5723, "epoch": 34} {"train_loss": -5.068431377410889, "global_step": 5724, "epoch": 34} {"train_loss": -5.244795322418213, "global_step": 5725, "epoch": 34} {"train_loss": -5.262942790985107, "global_step": 5726, "epoch": 34} {"train_loss": -5.047734260559082, "global_step": 5727, "epoch": 34} {"train_loss": -5.130031108856201, "global_step": 5728, "epoch": 34} {"train_loss": -5.061262607574463, "global_step": 5729, "epoch": 34} {"train_loss": -4.94191837310791, "global_step": 5730, "epoch": 34} {"train_loss": -5.17239236831665, "global_step": 5731, "epoch": 34} {"train_loss": -5.14943790435791, "global_step": 5732, "epoch": 34} {"train_loss": -4.943150043487549, "global_step": 5733, "epoch": 34} {"train_loss": -4.983808517456055, "global_step": 5734, "epoch": 34} {"train_loss": -5.203635215759277, "global_step": 5735, "epoch": 34} {"train_loss": -4.99002742767334, "global_step": 5736, "epoch": 34} {"train_loss": -5.189684867858887, "global_step": 5737, "epoch": 34} {"train_loss": -5.157425880432129, "global_step": 5738, "epoch": 34} {"train_loss": -5.167992115020752, "global_step": 5739, "epoch": 34} {"train_loss": -5.144749641418457, "global_step": 5740, "epoch": 34} {"train_loss": -5.1634721755981445, "global_step": 5741, "epoch": 34} {"train_loss": -5.173969745635986, "global_step": 5742, "epoch": 34} {"train_loss": -5.312592506408691, "global_step": 5743, "epoch": 34} {"train_loss": -5.103839874267578, "global_step": 5744, "epoch": 34} {"train_loss": -5.212149620056152, "global_step": 5745, "epoch": 34} {"train_loss": -5.3013153076171875, "global_step": 5746, "epoch": 34} {"train_loss": -5.001120090484619, "global_step": 5747, "epoch": 34} {"train_loss": -4.713506698608398, "global_step": 5748, "epoch": 34} {"train_loss": -5.09066104888916, "global_step": 5749, "epoch": 34} {"train_loss": -5.113545894622803, "global_step": 5750, "epoch": 34} {"train_loss": -5.0646772384643555, "global_step": 5751, "epoch": 34} {"train_loss": -5.113530158996582, "global_step": 5752, "epoch": 34} {"train_loss": -4.817166328430176, "global_step": 5753, "epoch": 34} {"train_loss": -5.15252685546875, "global_step": 5754, "epoch": 34} {"train_loss": -5.2016119956970215, "global_step": 5755, "epoch": 34} {"train_loss": -5.131324768066406, "global_step": 5756, "epoch": 34} {"train_loss": -5.032107353210449, "global_step": 5757, "epoch": 34} {"train_loss": -5.327895164489746, "global_step": 5758, "epoch": 34} {"train_loss": -5.047837257385254, "global_step": 5759, "epoch": 34} {"train_loss": -4.968924045562744, "global_step": 5760, "epoch": 34} {"train_loss": -5.218477249145508, "global_step": 5761, "epoch": 34} {"train_loss": -5.059849262237549, "global_step": 5762, "epoch": 34} {"train_loss": -5.365566253662109, "global_step": 5763, "epoch": 34} {"train_loss": -5.197609901428223, "global_step": 5764, "epoch": 34} {"train_loss": -5.3235297203063965, "global_step": 5765, "epoch": 34} {"train_loss": -5.002655982971191, "global_step": 5766, "epoch": 34} {"train_loss": -5.1184492111206055, "global_step": 5767, "epoch": 34} {"train_loss": -5.093752861022949, "global_step": 5768, "epoch": 34} {"train_loss": -5.148758888244629, "global_step": 5769, "epoch": 34} {"train_loss": -5.320634365081787, "global_step": 5770, "epoch": 34} {"train_loss": -5.013710021972656, "global_step": 5771, "epoch": 34} {"train_loss": -4.749759674072266, "global_step": 5772, "epoch": 34} {"train_loss": -5.004538536071777, "global_step": 5773, "epoch": 34} {"train_loss": -5.318509578704834, "global_step": 5774, "epoch": 34} {"train_loss": -5.140692710876465, "global_step": 5775, "epoch": 34} {"train_loss": -5.328212261199951, "global_step": 5776, "epoch": 34} {"train_loss": -5.220577239990234, "global_step": 5777, "epoch": 34} {"train_loss": -5.375413417816162, "global_step": 5778, "epoch": 34} {"train_loss": -5.097659111022949, "global_step": 5779, "epoch": 34} {"train_loss": -5.147696495056152, "global_step": 5780, "epoch": 34} {"train_loss": -5.326759338378906, "global_step": 5781, "epoch": 34} {"train_loss": -5.047025680541992, "global_step": 5782, "epoch": 34} {"train_loss": -5.273780345916748, "global_step": 5783, "epoch": 34} {"train_loss": -5.099701404571533, "global_step": 5784, "epoch": 34} {"train_loss": -5.1673431396484375, "global_step": 5785, "epoch": 34} {"train_loss": -5.138669967651367, "global_step": 5786, "epoch": 34} {"train_loss": -5.320274353027344, "global_step": 5787, "epoch": 34} {"train_loss": -5.193780422210693, "global_step": 5788, "epoch": 34} {"train_loss": -4.943542957305908, "global_step": 5789, "epoch": 34} {"train_loss": -5.175474166870117, "global_step": 5790, "epoch": 34} {"train_loss": -5.155794620513916, "global_step": 5791, "epoch": 34} {"train_loss": -5.154399871826172, "global_step": 5792, "epoch": 34} {"train_loss": -5.337924957275391, "global_step": 5793, "epoch": 34} {"train_loss": -5.2648420333862305, "global_step": 5794, "epoch": 34} {"train_loss": -5.312784671783447, "global_step": 5795, "epoch": 34} {"train_loss": -5.348798751831055, "global_step": 5796, "epoch": 34} {"train_loss": -5.417795658111572, "global_step": 5797, "epoch": 34} {"train_loss": -5.270528793334961, "global_step": 5798, "epoch": 34} {"train_loss": -5.423733711242676, "global_step": 5799, "epoch": 34} {"train_loss": -5.321352481842041, "global_step": 5800, "epoch": 34} {"train_loss": -5.356708526611328, "global_step": 5801, "epoch": 34} {"train_loss": -5.04986572265625, "global_step": 5802, "epoch": 34} {"train_loss": -5.164799690246582, "global_step": 5803, "epoch": 34} {"train_loss": -5.604802131652832, "global_step": 5804, "epoch": 34} {"train_loss": -5.1809892654418945, "global_step": 5805, "epoch": 34} {"train_loss": -5.108973979949951, "global_step": 5806, "epoch": 34} {"train_loss": -5.327781677246094, "global_step": 5807, "epoch": 34} {"train_loss": -5.451742172241211, "global_step": 5808, "epoch": 34} {"train_loss": -5.300075531005859, "global_step": 5809, "epoch": 34} {"train_loss": -5.283339977264404, "global_step": 5810, "epoch": 34} {"train_loss": -5.192103385925293, "global_step": 5811, "epoch": 34} {"train_loss": -5.328350067138672, "global_step": 5812, "epoch": 34} {"train_loss": -5.037337303161621, "global_step": 5813, "epoch": 34} {"train_loss": -5.232259750366211, "global_step": 5814, "epoch": 34} {"train_loss": -5.331722736358643, "global_step": 5815, "epoch": 34} {"train_loss": -4.793413162231445, "global_step": 5816, "epoch": 34} {"train_loss": -5.310163497924805, "global_step": 5817, "epoch": 34} {"train_loss": -5.216751575469971, "global_step": 5818, "epoch": 34} {"train_loss": -5.000223159790039, "global_step": 5819, "epoch": 34} {"train_loss": -4.906376838684082, "global_step": 5820, "epoch": 34} {"train_loss": -5.1892852783203125, "global_step": 5821, "epoch": 34} {"train_loss": -5.442619800567627, "global_step": 5822, "epoch": 34} {"train_loss": -5.080212593078613, "global_step": 5823, "epoch": 34} {"train_loss": -5.307647228240967, "global_step": 5824, "epoch": 34} {"train_loss": -5.05507755279541, "global_step": 5825, "epoch": 34} {"train_loss": -5.261012554168701, "global_step": 5826, "epoch": 34} {"train_loss": -5.013716220855713, "global_step": 5827, "epoch": 34} {"train_loss": -4.989200592041016, "global_step": 5828, "epoch": 34} {"train_loss": -5.285485744476318, "global_step": 5829, "epoch": 34} {"train_loss": -5.3003129959106445, "global_step": 5830, "epoch": 34} {"train_loss": -5.136669158935547, "global_step": 5831, "epoch": 34} {"train_loss": -4.962949275970459, "global_step": 5832, "epoch": 34} {"train_loss": -5.118609428405762, "global_step": 5833, "epoch": 34} {"train_loss": -5.1863555908203125, "global_step": 5834, "epoch": 34} {"train_loss": -5.0720601081848145, "global_step": 5835, "epoch": 34} {"train_loss": -4.9403839111328125, "global_step": 5836, "epoch": 34} {"train_loss": -5.244718551635742, "global_step": 5837, "epoch": 34} {"train_loss": -5.000221252441406, "global_step": 5838, "epoch": 34} {"train_loss": -5.25516939163208, "global_step": 5839, "epoch": 34} {"train_loss": -5.317248344421387, "global_step": 5840, "epoch": 34} {"train_loss": -4.846927642822266, "global_step": 5841, "epoch": 34} {"train_loss": -5.18018913269043, "global_step": 5842, "epoch": 34} {"train_loss": -4.997467994689941, "global_step": 5843, "epoch": 34} {"train_loss": -5.229645729064941, "global_step": 5844, "epoch": 34} {"train_loss": -5.193241596221924, "global_step": 5845, "epoch": 34} {"train_loss": -4.984652996063232, "global_step": 5846, "epoch": 34} {"train_loss": -5.383515357971191, "global_step": 5847, "epoch": 34} {"train_loss": -5.11928653717041, "global_step": 5848, "epoch": 34} {"train_loss": -5.268012523651123, "global_step": 5849, "epoch": 34} {"train_loss": -5.013218879699707, "global_step": 5850, "epoch": 34} {"train_loss": -4.773318767547607, "global_step": 5851, "epoch": 34} {"train_loss": -5.237437725067139, "global_step": 5852, "epoch": 34} {"train_loss": -4.999378204345703, "global_step": 5853, "epoch": 34} {"train_loss": -5.004230499267578, "global_step": 5854, "epoch": 34} {"train_loss": -4.914938449859619, "global_step": 5855, "epoch": 34} {"train_loss": -5.342188835144043, "global_step": 5856, "epoch": 34} {"train_loss": -5.284499645233154, "global_step": 5857, "epoch": 34} {"train_loss": -5.067790985107422, "global_step": 5858, "epoch": 34} {"train_loss": -5.192720890045166, "global_step": 5859, "epoch": 34} {"train_loss": -5.300827503204346, "global_step": 5860, "epoch": 34} {"train_loss": -5.256132125854492, "global_step": 5861, "epoch": 34} {"train_loss": -5.226244926452637, "global_step": 5862, "epoch": 34} {"train_loss": -5.220226287841797, "global_step": 5863, "epoch": 34} {"train_loss": -5.291894912719727, "global_step": 5864, "epoch": 34} {"train_loss": -4.815513610839844, "global_step": 5865, "epoch": 34} {"train_loss": -4.915497303009033, "global_step": 5866, "epoch": 34} {"train_loss": -4.80043888092041, "global_step": 5867, "epoch": 34} {"train_loss": -5.3408660888671875, "global_step": 5868, "epoch": 34} {"train_loss": -5.040805816650391, "global_step": 5869, "epoch": 34} {"train_loss": -5.201200008392334, "global_step": 5870, "epoch": 34} {"train_loss": -4.984402179718018, "global_step": 5871, "epoch": 34} {"train_loss": -5.0801005363464355, "global_step": 5872, "epoch": 34} {"train_loss": -5.050858497619629, "global_step": 5873, "epoch": 34} {"train_loss": -4.99607515335083, "global_step": 5874, "epoch": 34} {"train_loss": -5.184848785400391, "global_step": 5875, "epoch": 34} {"train_loss": -4.95123291015625, "global_step": 5876, "epoch": 34} {"train_loss": -4.92117166519165, "global_step": 5877, "epoch": 34} {"train_loss": -5.2595672607421875, "global_step": 5878, "epoch": 34} {"train_loss": -5.150412210396358, "global_step": 5879, "epoch": 34, "val_loss": 267149.03125} {"train_loss": -5.3466668128967285, "global_step": 5880, "epoch": 35} {"train_loss": -5.280484199523926, "global_step": 5881, "epoch": 35} {"train_loss": -4.9989471435546875, "global_step": 5882, "epoch": 35} {"train_loss": -5.101413249969482, "global_step": 5883, "epoch": 35} {"train_loss": -5.1981201171875, "global_step": 5884, "epoch": 35} {"train_loss": -5.069206237792969, "global_step": 5885, "epoch": 35} {"train_loss": -5.451202392578125, "global_step": 5886, "epoch": 35} {"train_loss": -5.23049783706665, "global_step": 5887, "epoch": 35} {"train_loss": -5.150769233703613, "global_step": 5888, "epoch": 35} {"train_loss": -5.166023254394531, "global_step": 5889, "epoch": 35} {"train_loss": -4.695725440979004, "global_step": 5890, "epoch": 35} {"train_loss": -5.1383514404296875, "global_step": 5891, "epoch": 35} {"train_loss": -4.896430015563965, "global_step": 5892, "epoch": 35} {"train_loss": -5.056017875671387, "global_step": 5893, "epoch": 35} {"train_loss": -5.186100482940674, "global_step": 5894, "epoch": 35} {"train_loss": -4.879549503326416, "global_step": 5895, "epoch": 35} {"train_loss": -5.235902786254883, "global_step": 5896, "epoch": 35} {"train_loss": -5.205913543701172, "global_step": 5897, "epoch": 35} {"train_loss": -5.199250221252441, "global_step": 5898, "epoch": 35} {"train_loss": -5.065523147583008, "global_step": 5899, "epoch": 35} {"train_loss": -5.102341651916504, "global_step": 5900, "epoch": 35} {"train_loss": -5.216930389404297, "global_step": 5901, "epoch": 35} {"train_loss": -5.047652244567871, "global_step": 5902, "epoch": 35} {"train_loss": -5.03565788269043, "global_step": 5903, "epoch": 35} {"train_loss": -5.001228332519531, "global_step": 5904, "epoch": 35} {"train_loss": -5.306272506713867, "global_step": 5905, "epoch": 35} {"train_loss": -5.277546405792236, "global_step": 5906, "epoch": 35} {"train_loss": -5.119626998901367, "global_step": 5907, "epoch": 35} {"train_loss": -5.156276702880859, "global_step": 5908, "epoch": 35} {"train_loss": -5.292466163635254, "global_step": 5909, "epoch": 35} {"train_loss": -5.319672107696533, "global_step": 5910, "epoch": 35} {"train_loss": -5.489141941070557, "global_step": 5911, "epoch": 35} {"train_loss": -5.222489356994629, "global_step": 5912, "epoch": 35} {"train_loss": -5.451568603515625, "global_step": 5913, "epoch": 35} {"train_loss": -5.296922206878662, "global_step": 5914, "epoch": 35} {"train_loss": -5.323373794555664, "global_step": 5915, "epoch": 35} {"train_loss": -5.378304958343506, "global_step": 5916, "epoch": 35} {"train_loss": -5.320493698120117, "global_step": 5917, "epoch": 35} {"train_loss": -5.259848594665527, "global_step": 5918, "epoch": 35} {"train_loss": -4.931781768798828, "global_step": 5919, "epoch": 35} {"train_loss": -5.148487567901611, "global_step": 5920, "epoch": 35} {"train_loss": -5.1330084800720215, "global_step": 5921, "epoch": 35} {"train_loss": -5.104032516479492, "global_step": 5922, "epoch": 35} {"train_loss": -5.236456394195557, "global_step": 5923, "epoch": 35} {"train_loss": -4.928680419921875, "global_step": 5924, "epoch": 35} {"train_loss": -5.385298728942871, "global_step": 5925, "epoch": 35} {"train_loss": -5.0078229904174805, "global_step": 5926, "epoch": 35} {"train_loss": -5.146857261657715, "global_step": 5927, "epoch": 35} {"train_loss": -4.931661605834961, "global_step": 5928, "epoch": 35} {"train_loss": -5.207578659057617, "global_step": 5929, "epoch": 35} {"train_loss": -5.0943779945373535, "global_step": 5930, "epoch": 35} {"train_loss": -5.131365776062012, "global_step": 5931, "epoch": 35} {"train_loss": -5.194396018981934, "global_step": 5932, "epoch": 35} {"train_loss": -4.9824700355529785, "global_step": 5933, "epoch": 35} {"train_loss": -5.0832133293151855, "global_step": 5934, "epoch": 35} {"train_loss": -5.192474365234375, "global_step": 5935, "epoch": 35} {"train_loss": -4.93536901473999, "global_step": 5936, "epoch": 35} {"train_loss": -5.417973518371582, "global_step": 5937, "epoch": 35} {"train_loss": -5.236184120178223, "global_step": 5938, "epoch": 35} {"train_loss": -5.064028263092041, "global_step": 5939, "epoch": 35} {"train_loss": -5.098106384277344, "global_step": 5940, "epoch": 35} {"train_loss": -5.002971649169922, "global_step": 5941, "epoch": 35} {"train_loss": -5.190151214599609, "global_step": 5942, "epoch": 35} {"train_loss": -4.8647894859313965, "global_step": 5943, "epoch": 35} {"train_loss": -5.05526065826416, "global_step": 5944, "epoch": 35} {"train_loss": -5.168094635009766, "global_step": 5945, "epoch": 35} {"train_loss": -5.262165069580078, "global_step": 5946, "epoch": 35} {"train_loss": -5.329066276550293, "global_step": 5947, "epoch": 35} {"train_loss": -5.073044776916504, "global_step": 5948, "epoch": 35} {"train_loss": -4.977150917053223, "global_step": 5949, "epoch": 35} {"train_loss": -5.301485538482666, "global_step": 5950, "epoch": 35} {"train_loss": -5.186285972595215, "global_step": 5951, "epoch": 35} {"train_loss": -5.057103157043457, "global_step": 5952, "epoch": 35} {"train_loss": -5.268030166625977, "global_step": 5953, "epoch": 35} {"train_loss": -5.223152160644531, "global_step": 5954, "epoch": 35} {"train_loss": -4.872691631317139, "global_step": 5955, "epoch": 35} {"train_loss": -4.952427864074707, "global_step": 5956, "epoch": 35} {"train_loss": -5.183013916015625, "global_step": 5957, "epoch": 35} {"train_loss": -5.306281566619873, "global_step": 5958, "epoch": 35} {"train_loss": -5.016103744506836, "global_step": 5959, "epoch": 35} {"train_loss": -5.131262302398682, "global_step": 5960, "epoch": 35} {"train_loss": -5.24822998046875, "global_step": 5961, "epoch": 35} {"train_loss": -5.149918556213379, "global_step": 5962, "epoch": 35} {"train_loss": -4.924254894256592, "global_step": 5963, "epoch": 35} {"train_loss": -5.112969398498535, "global_step": 5964, "epoch": 35} {"train_loss": -4.951661586761475, "global_step": 5965, "epoch": 35} {"train_loss": -5.122337341308594, "global_step": 5966, "epoch": 35} {"train_loss": -4.970455169677734, "global_step": 5967, "epoch": 35} {"train_loss": -5.190059185028076, "global_step": 5968, "epoch": 35} {"train_loss": -5.030202865600586, "global_step": 5969, "epoch": 35} {"train_loss": -4.807272434234619, "global_step": 5970, "epoch": 35} {"train_loss": -5.208224296569824, "global_step": 5971, "epoch": 35} {"train_loss": -4.94120454788208, "global_step": 5972, "epoch": 35} {"train_loss": -5.205760955810547, "global_step": 5973, "epoch": 35} {"train_loss": -5.153813362121582, "global_step": 5974, "epoch": 35} {"train_loss": -5.17018461227417, "global_step": 5975, "epoch": 35} {"train_loss": -5.222984790802002, "global_step": 5976, "epoch": 35} {"train_loss": -5.091696262359619, "global_step": 5977, "epoch": 35} {"train_loss": -5.3070831298828125, "global_step": 5978, "epoch": 35} {"train_loss": -5.386234283447266, "global_step": 5979, "epoch": 35} {"train_loss": -5.204343795776367, "global_step": 5980, "epoch": 35} {"train_loss": -5.245906829833984, "global_step": 5981, "epoch": 35} {"train_loss": -5.314462661743164, "global_step": 5982, "epoch": 35} {"train_loss": -5.266013145446777, "global_step": 5983, "epoch": 35} {"train_loss": -5.197518348693848, "global_step": 5984, "epoch": 35} {"train_loss": -5.406930923461914, "global_step": 5985, "epoch": 35} {"train_loss": -5.322140693664551, "global_step": 5986, "epoch": 35} {"train_loss": -5.342288494110107, "global_step": 5987, "epoch": 35} {"train_loss": -4.858404159545898, "global_step": 5988, "epoch": 35} {"train_loss": -4.984166145324707, "global_step": 5989, "epoch": 35} {"train_loss": -5.049859046936035, "global_step": 5990, "epoch": 35} {"train_loss": -4.851202011108398, "global_step": 5991, "epoch": 35} {"train_loss": -5.264887809753418, "global_step": 5992, "epoch": 35} {"train_loss": -4.956830024719238, "global_step": 5993, "epoch": 35} {"train_loss": -5.096682548522949, "global_step": 5994, "epoch": 35} {"train_loss": -5.065327167510986, "global_step": 5995, "epoch": 35} {"train_loss": -4.985211372375488, "global_step": 5996, "epoch": 35} {"train_loss": -4.950218200683594, "global_step": 5997, "epoch": 35} {"train_loss": -5.04167366027832, "global_step": 5998, "epoch": 35} {"train_loss": -4.864154815673828, "global_step": 5999, "epoch": 35} {"train_loss": -5.134236812591553, "global_step": 6000, "epoch": 35} {"train_loss": -5.072626113891602, "global_step": 6001, "epoch": 35} {"train_loss": -4.873191833496094, "global_step": 6002, "epoch": 35} {"train_loss": -4.864939212799072, "global_step": 6003, "epoch": 35} {"train_loss": -5.269178867340088, "global_step": 6004, "epoch": 35} {"train_loss": -4.708349704742432, "global_step": 6005, "epoch": 35} {"train_loss": -4.95181131362915, "global_step": 6006, "epoch": 35} {"train_loss": -5.351693153381348, "global_step": 6007, "epoch": 35} {"train_loss": -5.155023574829102, "global_step": 6008, "epoch": 35} {"train_loss": -5.040190696716309, "global_step": 6009, "epoch": 35} {"train_loss": -5.310498237609863, "global_step": 6010, "epoch": 35} {"train_loss": -5.111141204833984, "global_step": 6011, "epoch": 35} {"train_loss": -4.926945209503174, "global_step": 6012, "epoch": 35} {"train_loss": -5.038103103637695, "global_step": 6013, "epoch": 35} {"train_loss": -4.962952136993408, "global_step": 6014, "epoch": 35} {"train_loss": -5.393784523010254, "global_step": 6015, "epoch": 35} {"train_loss": -4.858220100402832, "global_step": 6016, "epoch": 35} {"train_loss": -5.231861114501953, "global_step": 6017, "epoch": 35} {"train_loss": -4.976138114929199, "global_step": 6018, "epoch": 35} {"train_loss": -5.027658462524414, "global_step": 6019, "epoch": 35} {"train_loss": -5.100830078125, "global_step": 6020, "epoch": 35} {"train_loss": -5.168149471282959, "global_step": 6021, "epoch": 35} {"train_loss": -4.873277187347412, "global_step": 6022, "epoch": 35} {"train_loss": -5.101535797119141, "global_step": 6023, "epoch": 35} {"train_loss": -5.219850540161133, "global_step": 6024, "epoch": 35} {"train_loss": -4.746078968048096, "global_step": 6025, "epoch": 35} {"train_loss": -5.18574333190918, "global_step": 6026, "epoch": 35} {"train_loss": -5.224004745483398, "global_step": 6027, "epoch": 35} {"train_loss": -4.870522499084473, "global_step": 6028, "epoch": 35} {"train_loss": -5.0122294425964355, "global_step": 6029, "epoch": 35} {"train_loss": -5.166481018066406, "global_step": 6030, "epoch": 35} {"train_loss": -5.306882858276367, "global_step": 6031, "epoch": 35} {"train_loss": -5.399350166320801, "global_step": 6032, "epoch": 35} {"train_loss": -5.252532958984375, "global_step": 6033, "epoch": 35} {"train_loss": -4.9236249923706055, "global_step": 6034, "epoch": 35} {"train_loss": -5.003643989562988, "global_step": 6035, "epoch": 35} {"train_loss": -5.137237548828125, "global_step": 6036, "epoch": 35} {"train_loss": -5.141190528869629, "global_step": 6037, "epoch": 35} {"train_loss": -4.974651336669922, "global_step": 6038, "epoch": 35} {"train_loss": -4.904336929321289, "global_step": 6039, "epoch": 35} {"train_loss": -5.29827356338501, "global_step": 6040, "epoch": 35} {"train_loss": -5.066493034362793, "global_step": 6041, "epoch": 35} {"train_loss": -5.183444023132324, "global_step": 6042, "epoch": 35} {"train_loss": -5.195589542388916, "global_step": 6043, "epoch": 35} {"train_loss": -5.138821125030518, "global_step": 6044, "epoch": 35} {"train_loss": -5.200571060180664, "global_step": 6045, "epoch": 35} {"train_loss": -4.9428300857543945, "global_step": 6046, "epoch": 35} {"train_loss": -5.1246278541428705, "global_step": 6047, "epoch": 35, "val_loss": 269721.25, "train_action_mse_error": 52.52206802368164} {"train_loss": -5.258600234985352, "global_step": 6048, "epoch": 36} {"train_loss": -5.268713474273682, "global_step": 6049, "epoch": 36} {"train_loss": -5.29526948928833, "global_step": 6050, "epoch": 36} {"train_loss": -5.146202087402344, "global_step": 6051, "epoch": 36} {"train_loss": -5.09835147857666, "global_step": 6052, "epoch": 36} {"train_loss": -5.187573432922363, "global_step": 6053, "epoch": 36} {"train_loss": -5.143767356872559, "global_step": 6054, "epoch": 36} {"train_loss": -4.971512317657471, "global_step": 6055, "epoch": 36} {"train_loss": -4.991097450256348, "global_step": 6056, "epoch": 36} {"train_loss": -5.178077697753906, "global_step": 6057, "epoch": 36} {"train_loss": -5.156411647796631, "global_step": 6058, "epoch": 36} {"train_loss": -4.991382598876953, "global_step": 6059, "epoch": 36} {"train_loss": -4.970505714416504, "global_step": 6060, "epoch": 36} {"train_loss": -4.964190483093262, "global_step": 6061, "epoch": 36} {"train_loss": -5.354100227355957, "global_step": 6062, "epoch": 36} {"train_loss": -5.174383163452148, "global_step": 6063, "epoch": 36} {"train_loss": -5.055150985717773, "global_step": 6064, "epoch": 36} {"train_loss": -5.10088586807251, "global_step": 6065, "epoch": 36} {"train_loss": -5.094759464263916, "global_step": 6066, "epoch": 36} {"train_loss": -5.118551254272461, "global_step": 6067, "epoch": 36} {"train_loss": -5.354602813720703, "global_step": 6068, "epoch": 36} {"train_loss": -5.302165508270264, "global_step": 6069, "epoch": 36} {"train_loss": -4.991677284240723, "global_step": 6070, "epoch": 36} {"train_loss": -5.181145191192627, "global_step": 6071, "epoch": 36} {"train_loss": -5.233087539672852, "global_step": 6072, "epoch": 36} {"train_loss": -5.211624622344971, "global_step": 6073, "epoch": 36} {"train_loss": -5.084216117858887, "global_step": 6074, "epoch": 36} {"train_loss": -5.306836128234863, "global_step": 6075, "epoch": 36} {"train_loss": -5.144730567932129, "global_step": 6076, "epoch": 36} {"train_loss": -5.391521453857422, "global_step": 6077, "epoch": 36} {"train_loss": -4.8956756591796875, "global_step": 6078, "epoch": 36} {"train_loss": -5.1811065673828125, "global_step": 6079, "epoch": 36} {"train_loss": -5.058603286743164, "global_step": 6080, "epoch": 36} {"train_loss": -5.2942399978637695, "global_step": 6081, "epoch": 36} {"train_loss": -5.058122634887695, "global_step": 6082, "epoch": 36} {"train_loss": -4.8518548011779785, "global_step": 6083, "epoch": 36} {"train_loss": -5.0032877922058105, "global_step": 6084, "epoch": 36} {"train_loss": -5.178943634033203, "global_step": 6085, "epoch": 36} {"train_loss": -4.7431817054748535, "global_step": 6086, "epoch": 36} {"train_loss": -4.997897148132324, "global_step": 6087, "epoch": 36} {"train_loss": -5.116348743438721, "global_step": 6088, "epoch": 36} {"train_loss": -4.83711051940918, "global_step": 6089, "epoch": 36} {"train_loss": -5.089178085327148, "global_step": 6090, "epoch": 36} {"train_loss": -5.294188499450684, "global_step": 6091, "epoch": 36} {"train_loss": -5.227988243103027, "global_step": 6092, "epoch": 36} {"train_loss": -5.079931259155273, "global_step": 6093, "epoch": 36} {"train_loss": -4.993044853210449, "global_step": 6094, "epoch": 36} {"train_loss": -5.2439727783203125, "global_step": 6095, "epoch": 36} {"train_loss": -5.356832504272461, "global_step": 6096, "epoch": 36} {"train_loss": -5.291584014892578, "global_step": 6097, "epoch": 36} {"train_loss": -5.225685119628906, "global_step": 6098, "epoch": 36} {"train_loss": -5.334262847900391, "global_step": 6099, "epoch": 36} {"train_loss": -5.175145626068115, "global_step": 6100, "epoch": 36} {"train_loss": -5.377399444580078, "global_step": 6101, "epoch": 36} {"train_loss": -5.178299427032471, "global_step": 6102, "epoch": 36} {"train_loss": -5.093672275543213, "global_step": 6103, "epoch": 36} {"train_loss": -5.05925989151001, "global_step": 6104, "epoch": 36} {"train_loss": -5.264011383056641, "global_step": 6105, "epoch": 36} {"train_loss": -4.882648468017578, "global_step": 6106, "epoch": 36} {"train_loss": -5.387751579284668, "global_step": 6107, "epoch": 36} {"train_loss": -4.890405654907227, "global_step": 6108, "epoch": 36} {"train_loss": -5.005104064941406, "global_step": 6109, "epoch": 36} {"train_loss": -5.237819671630859, "global_step": 6110, "epoch": 36} {"train_loss": -5.317984580993652, "global_step": 6111, "epoch": 36} {"train_loss": -4.856649398803711, "global_step": 6112, "epoch": 36} {"train_loss": -5.026456832885742, "global_step": 6113, "epoch": 36} {"train_loss": -5.106113433837891, "global_step": 6114, "epoch": 36} {"train_loss": -5.342114448547363, "global_step": 6115, "epoch": 36} {"train_loss": -5.257654190063477, "global_step": 6116, "epoch": 36} {"train_loss": -5.182847023010254, "global_step": 6117, "epoch": 36} {"train_loss": -4.982013702392578, "global_step": 6118, "epoch": 36} {"train_loss": -5.0844316482543945, "global_step": 6119, "epoch": 36} {"train_loss": -5.005138397216797, "global_step": 6120, "epoch": 36} {"train_loss": -5.186657905578613, "global_step": 6121, "epoch": 36} {"train_loss": -5.3220953941345215, "global_step": 6122, "epoch": 36} {"train_loss": -5.435232162475586, "global_step": 6123, "epoch": 36} {"train_loss": -5.270089626312256, "global_step": 6124, "epoch": 36} {"train_loss": -5.2872314453125, "global_step": 6125, "epoch": 36} {"train_loss": -5.2625274658203125, "global_step": 6126, "epoch": 36} {"train_loss": -5.47796630859375, "global_step": 6127, "epoch": 36} {"train_loss": -5.3057861328125, "global_step": 6128, "epoch": 36} {"train_loss": -4.854781627655029, "global_step": 6129, "epoch": 36} {"train_loss": -5.35921573638916, "global_step": 6130, "epoch": 36} {"train_loss": -5.386753559112549, "global_step": 6131, "epoch": 36} {"train_loss": -5.354435920715332, "global_step": 6132, "epoch": 36} {"train_loss": -5.346467018127441, "global_step": 6133, "epoch": 36} {"train_loss": -5.252547740936279, "global_step": 6134, "epoch": 36} {"train_loss": -5.323263645172119, "global_step": 6135, "epoch": 36} {"train_loss": -5.094285488128662, "global_step": 6136, "epoch": 36} {"train_loss": -5.137996673583984, "global_step": 6137, "epoch": 36} {"train_loss": -5.332060813903809, "global_step": 6138, "epoch": 36} {"train_loss": -5.3426384925842285, "global_step": 6139, "epoch": 36} {"train_loss": -5.281935691833496, "global_step": 6140, "epoch": 36} {"train_loss": -5.08823299407959, "global_step": 6141, "epoch": 36} {"train_loss": -5.005597114562988, "global_step": 6142, "epoch": 36} {"train_loss": -5.197854995727539, "global_step": 6143, "epoch": 36} {"train_loss": -5.233475685119629, "global_step": 6144, "epoch": 36} {"train_loss": -5.263366222381592, "global_step": 6145, "epoch": 36} {"train_loss": -5.10178279876709, "global_step": 6146, "epoch": 36} {"train_loss": -5.487605094909668, "global_step": 6147, "epoch": 36} {"train_loss": -5.13566780090332, "global_step": 6148, "epoch": 36} {"train_loss": -5.243117332458496, "global_step": 6149, "epoch": 36} {"train_loss": -5.414663314819336, "global_step": 6150, "epoch": 36} {"train_loss": -5.296118259429932, "global_step": 6151, "epoch": 36} {"train_loss": -5.268033504486084, "global_step": 6152, "epoch": 36} {"train_loss": -5.213481903076172, "global_step": 6153, "epoch": 36} {"train_loss": -5.312862873077393, "global_step": 6154, "epoch": 36} {"train_loss": -5.3074951171875, "global_step": 6155, "epoch": 36} {"train_loss": -5.185661315917969, "global_step": 6156, "epoch": 36} {"train_loss": -5.310572624206543, "global_step": 6157, "epoch": 36} {"train_loss": -5.353200912475586, "global_step": 6158, "epoch": 36} {"train_loss": -5.381775856018066, "global_step": 6159, "epoch": 36} {"train_loss": -5.139568328857422, "global_step": 6160, "epoch": 36} {"train_loss": -5.404387474060059, "global_step": 6161, "epoch": 36} {"train_loss": -4.874722480773926, "global_step": 6162, "epoch": 36} {"train_loss": -4.8067121505737305, "global_step": 6163, "epoch": 36} {"train_loss": -5.278820991516113, "global_step": 6164, "epoch": 36} {"train_loss": -4.97537899017334, "global_step": 6165, "epoch": 36} {"train_loss": -5.282865524291992, "global_step": 6166, "epoch": 36} {"train_loss": -4.9006147384643555, "global_step": 6167, "epoch": 36} {"train_loss": -5.292661190032959, "global_step": 6168, "epoch": 36} {"train_loss": -5.242730140686035, "global_step": 6169, "epoch": 36} {"train_loss": -5.131307125091553, "global_step": 6170, "epoch": 36} {"train_loss": -4.853708267211914, "global_step": 6171, "epoch": 36} {"train_loss": -4.752476692199707, "global_step": 6172, "epoch": 36} {"train_loss": -5.010030746459961, "global_step": 6173, "epoch": 36} {"train_loss": -5.3380818367004395, "global_step": 6174, "epoch": 36} {"train_loss": -5.159477233886719, "global_step": 6175, "epoch": 36} {"train_loss": -5.075203895568848, "global_step": 6176, "epoch": 36} {"train_loss": -5.24365234375, "global_step": 6177, "epoch": 36} {"train_loss": -4.97456169128418, "global_step": 6178, "epoch": 36} {"train_loss": -4.9376115798950195, "global_step": 6179, "epoch": 36} {"train_loss": -4.8519439697265625, "global_step": 6180, "epoch": 36} {"train_loss": -4.9858808517456055, "global_step": 6181, "epoch": 36} {"train_loss": -5.216946601867676, "global_step": 6182, "epoch": 36} {"train_loss": -5.034322738647461, "global_step": 6183, "epoch": 36} {"train_loss": -5.243884563446045, "global_step": 6184, "epoch": 36} {"train_loss": -5.08187198638916, "global_step": 6185, "epoch": 36} {"train_loss": -5.0063018798828125, "global_step": 6186, "epoch": 36} {"train_loss": -5.297379970550537, "global_step": 6187, "epoch": 36} {"train_loss": -5.2611188888549805, "global_step": 6188, "epoch": 36} {"train_loss": -4.989437103271484, "global_step": 6189, "epoch": 36} {"train_loss": -5.257069110870361, "global_step": 6190, "epoch": 36} {"train_loss": -5.0321526527404785, "global_step": 6191, "epoch": 36} {"train_loss": -5.233358860015869, "global_step": 6192, "epoch": 36} {"train_loss": -5.02398681640625, "global_step": 6193, "epoch": 36} {"train_loss": -4.994394302368164, "global_step": 6194, "epoch": 36} {"train_loss": -5.26423978805542, "global_step": 6195, "epoch": 36} {"train_loss": -4.960513114929199, "global_step": 6196, "epoch": 36} {"train_loss": -5.063571453094482, "global_step": 6197, "epoch": 36} {"train_loss": -5.1045684814453125, "global_step": 6198, "epoch": 36} {"train_loss": -5.160414695739746, "global_step": 6199, "epoch": 36} {"train_loss": -5.284392833709717, "global_step": 6200, "epoch": 36} {"train_loss": -4.890674591064453, "global_step": 6201, "epoch": 36} {"train_loss": -5.062639236450195, "global_step": 6202, "epoch": 36} {"train_loss": -4.840536117553711, "global_step": 6203, "epoch": 36} {"train_loss": -4.90311336517334, "global_step": 6204, "epoch": 36} {"train_loss": -5.334417343139648, "global_step": 6205, "epoch": 36} {"train_loss": -5.186184406280518, "global_step": 6206, "epoch": 36} {"train_loss": -5.052362442016602, "global_step": 6207, "epoch": 36} {"train_loss": -5.0860395431518555, "global_step": 6208, "epoch": 36} {"train_loss": -5.41635799407959, "global_step": 6209, "epoch": 36} {"train_loss": -5.0275349617004395, "global_step": 6210, "epoch": 36} {"train_loss": -5.00393533706665, "global_step": 6211, "epoch": 36} {"train_loss": -5.13167667388916, "global_step": 6212, "epoch": 36} {"train_loss": -5.072196960449219, "global_step": 6213, "epoch": 36} {"train_loss": -5.094772815704346, "global_step": 6214, "epoch": 36} {"train_loss": -5.150561752773466, "global_step": 6215, "epoch": 36, "val_loss": 251843.359375} {"train_loss": -5.118055820465088, "global_step": 6216, "epoch": 37} {"train_loss": -5.146484375, "global_step": 6217, "epoch": 37} {"train_loss": -5.224068641662598, "global_step": 6218, "epoch": 37} {"train_loss": -5.017351150512695, "global_step": 6219, "epoch": 37} {"train_loss": -5.492793083190918, "global_step": 6220, "epoch": 37} {"train_loss": -5.10018253326416, "global_step": 6221, "epoch": 37} {"train_loss": -5.051886558532715, "global_step": 6222, "epoch": 37} {"train_loss": -5.3667216300964355, "global_step": 6223, "epoch": 37} {"train_loss": -5.117491245269775, "global_step": 6224, "epoch": 37} {"train_loss": -5.152919769287109, "global_step": 6225, "epoch": 37} {"train_loss": -5.090393543243408, "global_step": 6226, "epoch": 37} {"train_loss": -5.179256439208984, "global_step": 6227, "epoch": 37} {"train_loss": -5.327812671661377, "global_step": 6228, "epoch": 37} {"train_loss": -5.341644763946533, "global_step": 6229, "epoch": 37} {"train_loss": -5.212437629699707, "global_step": 6230, "epoch": 37} {"train_loss": -4.9937639236450195, "global_step": 6231, "epoch": 37} {"train_loss": -5.418164253234863, "global_step": 6232, "epoch": 37} {"train_loss": -4.727017879486084, "global_step": 6233, "epoch": 37} {"train_loss": -5.139216899871826, "global_step": 6234, "epoch": 37} {"train_loss": -5.198141098022461, "global_step": 6235, "epoch": 37} {"train_loss": -5.24077033996582, "global_step": 6236, "epoch": 37} {"train_loss": -5.1042399406433105, "global_step": 6237, "epoch": 37} {"train_loss": -5.048502445220947, "global_step": 6238, "epoch": 37} {"train_loss": -5.404296875, "global_step": 6239, "epoch": 37} {"train_loss": -5.333355903625488, "global_step": 6240, "epoch": 37} {"train_loss": -5.328604698181152, "global_step": 6241, "epoch": 37} {"train_loss": -4.642022609710693, "global_step": 6242, "epoch": 37} {"train_loss": -4.990479469299316, "global_step": 6243, "epoch": 37} {"train_loss": -4.820501327514648, "global_step": 6244, "epoch": 37} {"train_loss": -5.204477310180664, "global_step": 6245, "epoch": 37} {"train_loss": -5.053876876831055, "global_step": 6246, "epoch": 37} {"train_loss": -5.292254447937012, "global_step": 6247, "epoch": 37} {"train_loss": -4.847962379455566, "global_step": 6248, "epoch": 37} {"train_loss": -5.361527442932129, "global_step": 6249, "epoch": 37} {"train_loss": -5.25147819519043, "global_step": 6250, "epoch": 37} {"train_loss": -5.067716121673584, "global_step": 6251, "epoch": 37} {"train_loss": -5.369669437408447, "global_step": 6252, "epoch": 37} {"train_loss": -5.022564888000488, "global_step": 6253, "epoch": 37} {"train_loss": -5.15616512298584, "global_step": 6254, "epoch": 37} {"train_loss": -5.1947784423828125, "global_step": 6255, "epoch": 37} {"train_loss": -5.000670433044434, "global_step": 6256, "epoch": 37} {"train_loss": -5.1643781661987305, "global_step": 6257, "epoch": 37} {"train_loss": -5.288395404815674, "global_step": 6258, "epoch": 37} {"train_loss": -5.0320563316345215, "global_step": 6259, "epoch": 37} {"train_loss": -5.281779766082764, "global_step": 6260, "epoch": 37} {"train_loss": -5.1020426750183105, "global_step": 6261, "epoch": 37} {"train_loss": -5.465464115142822, "global_step": 6262, "epoch": 37} {"train_loss": -5.046740531921387, "global_step": 6263, "epoch": 37} {"train_loss": -5.155268669128418, "global_step": 6264, "epoch": 37} {"train_loss": -5.087034225463867, "global_step": 6265, "epoch": 37} {"train_loss": -5.389081954956055, "global_step": 6266, "epoch": 37} {"train_loss": -5.133750915527344, "global_step": 6267, "epoch": 37} {"train_loss": -5.348213195800781, "global_step": 6268, "epoch": 37} {"train_loss": -5.239871025085449, "global_step": 6269, "epoch": 37} {"train_loss": -5.506691932678223, "global_step": 6270, "epoch": 37} {"train_loss": -5.428631782531738, "global_step": 6271, "epoch": 37} {"train_loss": -5.478425979614258, "global_step": 6272, "epoch": 37} {"train_loss": -5.684623718261719, "global_step": 6273, "epoch": 37} {"train_loss": -5.119444370269775, "global_step": 6274, "epoch": 37} {"train_loss": -5.211241722106934, "global_step": 6275, "epoch": 37} {"train_loss": -5.3196868896484375, "global_step": 6276, "epoch": 37} {"train_loss": -5.187976837158203, "global_step": 6277, "epoch": 37} {"train_loss": -5.184507369995117, "global_step": 6278, "epoch": 37} {"train_loss": -5.421499729156494, "global_step": 6279, "epoch": 37} {"train_loss": -5.156338691711426, "global_step": 6280, "epoch": 37} {"train_loss": -5.346015453338623, "global_step": 6281, "epoch": 37} {"train_loss": -5.293752193450928, "global_step": 6282, "epoch": 37} {"train_loss": -5.388114929199219, "global_step": 6283, "epoch": 37} {"train_loss": -5.136204719543457, "global_step": 6284, "epoch": 37} {"train_loss": -5.269134521484375, "global_step": 6285, "epoch": 37} {"train_loss": -5.358479022979736, "global_step": 6286, "epoch": 37} {"train_loss": -5.0693817138671875, "global_step": 6287, "epoch": 37} {"train_loss": -5.185790061950684, "global_step": 6288, "epoch": 37} {"train_loss": -5.020164966583252, "global_step": 6289, "epoch": 37} {"train_loss": -5.153934478759766, "global_step": 6290, "epoch": 37} {"train_loss": -5.253619194030762, "global_step": 6291, "epoch": 37} {"train_loss": -5.182323455810547, "global_step": 6292, "epoch": 37} {"train_loss": -5.406188011169434, "global_step": 6293, "epoch": 37} {"train_loss": -4.763738632202148, "global_step": 6294, "epoch": 37} {"train_loss": -4.993378639221191, "global_step": 6295, "epoch": 37} {"train_loss": -5.162058353424072, "global_step": 6296, "epoch": 37} {"train_loss": -5.302268028259277, "global_step": 6297, "epoch": 37} {"train_loss": -5.200915336608887, "global_step": 6298, "epoch": 37} {"train_loss": -5.2078537940979, "global_step": 6299, "epoch": 37} {"train_loss": -4.8661208152771, "global_step": 6300, "epoch": 37} {"train_loss": -5.043302536010742, "global_step": 6301, "epoch": 37} {"train_loss": -5.313345432281494, "global_step": 6302, "epoch": 37} {"train_loss": -5.3470306396484375, "global_step": 6303, "epoch": 37} {"train_loss": -5.514828681945801, "global_step": 6304, "epoch": 37} {"train_loss": -5.204174995422363, "global_step": 6305, "epoch": 37} {"train_loss": -5.102677822113037, "global_step": 6306, "epoch": 37} {"train_loss": -4.896124839782715, "global_step": 6307, "epoch": 37} {"train_loss": -5.099081516265869, "global_step": 6308, "epoch": 37} {"train_loss": -5.341968536376953, "global_step": 6309, "epoch": 37} {"train_loss": -5.345259666442871, "global_step": 6310, "epoch": 37} {"train_loss": -5.129974365234375, "global_step": 6311, "epoch": 37} {"train_loss": -5.41487979888916, "global_step": 6312, "epoch": 37} {"train_loss": -5.341538429260254, "global_step": 6313, "epoch": 37} {"train_loss": -5.277613162994385, "global_step": 6314, "epoch": 37} {"train_loss": -5.256069183349609, "global_step": 6315, "epoch": 37} {"train_loss": -4.981873035430908, "global_step": 6316, "epoch": 37} {"train_loss": -5.199216842651367, "global_step": 6317, "epoch": 37} {"train_loss": -5.002565383911133, "global_step": 6318, "epoch": 37} {"train_loss": -5.13006591796875, "global_step": 6319, "epoch": 37} {"train_loss": -5.08516788482666, "global_step": 6320, "epoch": 37} {"train_loss": -5.300235748291016, "global_step": 6321, "epoch": 37} {"train_loss": -5.045188903808594, "global_step": 6322, "epoch": 37} {"train_loss": -5.136914253234863, "global_step": 6323, "epoch": 37} {"train_loss": -5.0299530029296875, "global_step": 6324, "epoch": 37} {"train_loss": -5.25546932220459, "global_step": 6325, "epoch": 37} {"train_loss": -4.858230113983154, "global_step": 6326, "epoch": 37} {"train_loss": -5.361403465270996, "global_step": 6327, "epoch": 37} {"train_loss": -5.130384922027588, "global_step": 6328, "epoch": 37} {"train_loss": -5.265284538269043, "global_step": 6329, "epoch": 37} {"train_loss": -5.316754341125488, "global_step": 6330, "epoch": 37} {"train_loss": -5.254885196685791, "global_step": 6331, "epoch": 37} {"train_loss": -5.203345775604248, "global_step": 6332, "epoch": 37} {"train_loss": -5.438929557800293, "global_step": 6333, "epoch": 37} {"train_loss": -5.301698684692383, "global_step": 6334, "epoch": 37} {"train_loss": -5.24278450012207, "global_step": 6335, "epoch": 37} {"train_loss": -5.44321346282959, "global_step": 6336, "epoch": 37} {"train_loss": -5.391942977905273, "global_step": 6337, "epoch": 37} {"train_loss": -5.296110153198242, "global_step": 6338, "epoch": 37} {"train_loss": -5.239087104797363, "global_step": 6339, "epoch": 37} {"train_loss": -5.2221527099609375, "global_step": 6340, "epoch": 37} {"train_loss": -5.378524303436279, "global_step": 6341, "epoch": 37} {"train_loss": -5.200689315795898, "global_step": 6342, "epoch": 37} {"train_loss": -5.173861503601074, "global_step": 6343, "epoch": 37} {"train_loss": -5.2911882400512695, "global_step": 6344, "epoch": 37} {"train_loss": -5.137990951538086, "global_step": 6345, "epoch": 37} {"train_loss": -5.279487609863281, "global_step": 6346, "epoch": 37} {"train_loss": -5.183870792388916, "global_step": 6347, "epoch": 37} {"train_loss": -5.329903602600098, "global_step": 6348, "epoch": 37} {"train_loss": -5.1330976486206055, "global_step": 6349, "epoch": 37} {"train_loss": -5.4360809326171875, "global_step": 6350, "epoch": 37} {"train_loss": -5.325763702392578, "global_step": 6351, "epoch": 37} {"train_loss": -5.122171401977539, "global_step": 6352, "epoch": 37} {"train_loss": -5.4786529541015625, "global_step": 6353, "epoch": 37} {"train_loss": -5.682994365692139, "global_step": 6354, "epoch": 37} {"train_loss": -5.202461242675781, "global_step": 6355, "epoch": 37} {"train_loss": -5.15561580657959, "global_step": 6356, "epoch": 37} {"train_loss": -5.29512882232666, "global_step": 6357, "epoch": 37} {"train_loss": -5.093478202819824, "global_step": 6358, "epoch": 37} {"train_loss": -5.0269975662231445, "global_step": 6359, "epoch": 37} {"train_loss": -5.075078010559082, "global_step": 6360, "epoch": 37} {"train_loss": -5.309116840362549, "global_step": 6361, "epoch": 37} {"train_loss": -5.1370391845703125, "global_step": 6362, "epoch": 37} {"train_loss": -5.2283124923706055, "global_step": 6363, "epoch": 37} {"train_loss": -5.360723495483398, "global_step": 6364, "epoch": 37} {"train_loss": -5.4455437660217285, "global_step": 6365, "epoch": 37} {"train_loss": -5.179237365722656, "global_step": 6366, "epoch": 37} {"train_loss": -5.34029483795166, "global_step": 6367, "epoch": 37} {"train_loss": -5.326665878295898, "global_step": 6368, "epoch": 37} {"train_loss": -5.351949691772461, "global_step": 6369, "epoch": 37} {"train_loss": -5.133604049682617, "global_step": 6370, "epoch": 37} {"train_loss": -5.134490966796875, "global_step": 6371, "epoch": 37} {"train_loss": -5.259827613830566, "global_step": 6372, "epoch": 37} {"train_loss": -5.063804626464844, "global_step": 6373, "epoch": 37} {"train_loss": -4.637467384338379, "global_step": 6374, "epoch": 37} {"train_loss": -5.166268348693848, "global_step": 6375, "epoch": 37} {"train_loss": -5.161118984222412, "global_step": 6376, "epoch": 37} {"train_loss": -5.432452201843262, "global_step": 6377, "epoch": 37} {"train_loss": -5.138004302978516, "global_step": 6378, "epoch": 37} {"train_loss": -5.1402716636657715, "global_step": 6379, "epoch": 37} {"train_loss": -5.105747699737549, "global_step": 6380, "epoch": 37} {"train_loss": -5.16136360168457, "global_step": 6381, "epoch": 37} {"train_loss": -5.180708885192871, "global_step": 6382, "epoch": 37} {"train_loss": -5.205077747503917, "global_step": 6383, "epoch": 37, "val_loss": 260402.859375} {"train_loss": -5.476102828979492, "global_step": 6384, "epoch": 38} {"train_loss": -5.040920257568359, "global_step": 6385, "epoch": 38} {"train_loss": -4.953802108764648, "global_step": 6386, "epoch": 38} {"train_loss": -5.324945449829102, "global_step": 6387, "epoch": 38} {"train_loss": -5.209653854370117, "global_step": 6388, "epoch": 38} {"train_loss": -5.450244426727295, "global_step": 6389, "epoch": 38} {"train_loss": -5.316229820251465, "global_step": 6390, "epoch": 38} {"train_loss": -5.431424617767334, "global_step": 6391, "epoch": 38} {"train_loss": -5.116520404815674, "global_step": 6392, "epoch": 38} {"train_loss": -5.3063201904296875, "global_step": 6393, "epoch": 38} {"train_loss": -5.296878814697266, "global_step": 6394, "epoch": 38} {"train_loss": -5.088451862335205, "global_step": 6395, "epoch": 38} {"train_loss": -5.361711025238037, "global_step": 6396, "epoch": 38} {"train_loss": -5.137893199920654, "global_step": 6397, "epoch": 38} {"train_loss": -5.174289703369141, "global_step": 6398, "epoch": 38} {"train_loss": -4.908990859985352, "global_step": 6399, "epoch": 38} {"train_loss": -5.512895584106445, "global_step": 6400, "epoch": 38} {"train_loss": -4.848773956298828, "global_step": 6401, "epoch": 38} {"train_loss": -5.317944526672363, "global_step": 6402, "epoch": 38} {"train_loss": -5.327913284301758, "global_step": 6403, "epoch": 38} {"train_loss": -4.962368965148926, "global_step": 6404, "epoch": 38} {"train_loss": -5.197720050811768, "global_step": 6405, "epoch": 38} {"train_loss": -4.9912495613098145, "global_step": 6406, "epoch": 38} {"train_loss": -4.995361328125, "global_step": 6407, "epoch": 38} {"train_loss": -4.837203502655029, "global_step": 6408, "epoch": 38} {"train_loss": -4.8706769943237305, "global_step": 6409, "epoch": 38} {"train_loss": -5.058846473693848, "global_step": 6410, "epoch": 38} {"train_loss": -5.055782318115234, "global_step": 6411, "epoch": 38} {"train_loss": -4.99733829498291, "global_step": 6412, "epoch": 38} {"train_loss": -5.082695960998535, "global_step": 6413, "epoch": 38} {"train_loss": -5.204970359802246, "global_step": 6414, "epoch": 38} {"train_loss": -5.075350761413574, "global_step": 6415, "epoch": 38} {"train_loss": -5.039274215698242, "global_step": 6416, "epoch": 38} {"train_loss": -5.245628356933594, "global_step": 6417, "epoch": 38} {"train_loss": -4.956191062927246, "global_step": 6418, "epoch": 38} {"train_loss": -5.064528465270996, "global_step": 6419, "epoch": 38} {"train_loss": -5.215078353881836, "global_step": 6420, "epoch": 38} {"train_loss": -5.155368804931641, "global_step": 6421, "epoch": 38} {"train_loss": -5.006520748138428, "global_step": 6422, "epoch": 38} {"train_loss": -5.01969051361084, "global_step": 6423, "epoch": 38} {"train_loss": -5.274803638458252, "global_step": 6424, "epoch": 38} {"train_loss": -5.442264556884766, "global_step": 6425, "epoch": 38} {"train_loss": -5.390933513641357, "global_step": 6426, "epoch": 38} {"train_loss": -5.430539608001709, "global_step": 6427, "epoch": 38} {"train_loss": -5.281559467315674, "global_step": 6428, "epoch": 38} {"train_loss": -5.314472675323486, "global_step": 6429, "epoch": 38} {"train_loss": -5.624300956726074, "global_step": 6430, "epoch": 38} {"train_loss": -5.113883018493652, "global_step": 6431, "epoch": 38} {"train_loss": -5.571166038513184, "global_step": 6432, "epoch": 38} {"train_loss": -5.187414169311523, "global_step": 6433, "epoch": 38} {"train_loss": -5.326772689819336, "global_step": 6434, "epoch": 38} {"train_loss": -5.33687162399292, "global_step": 6435, "epoch": 38} {"train_loss": -5.501266956329346, "global_step": 6436, "epoch": 38} {"train_loss": -5.597805976867676, "global_step": 6437, "epoch": 38} {"train_loss": -5.369675636291504, "global_step": 6438, "epoch": 38} {"train_loss": -5.449077606201172, "global_step": 6439, "epoch": 38} {"train_loss": -5.273024559020996, "global_step": 6440, "epoch": 38} {"train_loss": -5.237259864807129, "global_step": 6441, "epoch": 38} {"train_loss": -5.562032699584961, "global_step": 6442, "epoch": 38} {"train_loss": -4.912145614624023, "global_step": 6443, "epoch": 38} {"train_loss": -5.572857856750488, "global_step": 6444, "epoch": 38} {"train_loss": -4.872035980224609, "global_step": 6445, "epoch": 38} {"train_loss": -5.242510795593262, "global_step": 6446, "epoch": 38} {"train_loss": -5.165005683898926, "global_step": 6447, "epoch": 38} {"train_loss": -5.163525581359863, "global_step": 6448, "epoch": 38} {"train_loss": -5.395627975463867, "global_step": 6449, "epoch": 38} {"train_loss": -5.046695709228516, "global_step": 6450, "epoch": 38} {"train_loss": -5.205808639526367, "global_step": 6451, "epoch": 38} {"train_loss": -5.341397285461426, "global_step": 6452, "epoch": 38} {"train_loss": -4.958146572113037, "global_step": 6453, "epoch": 38} {"train_loss": -5.447504997253418, "global_step": 6454, "epoch": 38} {"train_loss": -5.207676887512207, "global_step": 6455, "epoch": 38} {"train_loss": -5.361534118652344, "global_step": 6456, "epoch": 38} {"train_loss": -5.512446403503418, "global_step": 6457, "epoch": 38} {"train_loss": -5.211543083190918, "global_step": 6458, "epoch": 38} {"train_loss": -5.26821231842041, "global_step": 6459, "epoch": 38} {"train_loss": -5.174734592437744, "global_step": 6460, "epoch": 38} {"train_loss": -5.158759593963623, "global_step": 6461, "epoch": 38} {"train_loss": -5.495100975036621, "global_step": 6462, "epoch": 38} {"train_loss": -5.330228805541992, "global_step": 6463, "epoch": 38} {"train_loss": -5.474294662475586, "global_step": 6464, "epoch": 38} {"train_loss": -5.31978178024292, "global_step": 6465, "epoch": 38} {"train_loss": -5.541387557983398, "global_step": 6466, "epoch": 38} {"train_loss": -5.430927753448486, "global_step": 6467, "epoch": 38} {"train_loss": -5.2428998947143555, "global_step": 6468, "epoch": 38} {"train_loss": -5.289514541625977, "global_step": 6469, "epoch": 38} {"train_loss": -5.202931880950928, "global_step": 6470, "epoch": 38} {"train_loss": -5.315616130828857, "global_step": 6471, "epoch": 38} {"train_loss": -4.891660213470459, "global_step": 6472, "epoch": 38} {"train_loss": -5.629230499267578, "global_step": 6473, "epoch": 38} {"train_loss": -5.485020637512207, "global_step": 6474, "epoch": 38} {"train_loss": -5.423444747924805, "global_step": 6475, "epoch": 38} {"train_loss": -5.2393341064453125, "global_step": 6476, "epoch": 38} {"train_loss": -5.242116451263428, "global_step": 6477, "epoch": 38} {"train_loss": -5.64515495300293, "global_step": 6478, "epoch": 38} {"train_loss": -5.25303316116333, "global_step": 6479, "epoch": 38} {"train_loss": -5.337378025054932, "global_step": 6480, "epoch": 38} {"train_loss": -5.319275856018066, "global_step": 6481, "epoch": 38} {"train_loss": -5.203803062438965, "global_step": 6482, "epoch": 38} {"train_loss": -5.413362979888916, "global_step": 6483, "epoch": 38} {"train_loss": -5.345786094665527, "global_step": 6484, "epoch": 38} {"train_loss": -5.456790924072266, "global_step": 6485, "epoch": 38} {"train_loss": -5.4629435539245605, "global_step": 6486, "epoch": 38} {"train_loss": -4.930108070373535, "global_step": 6487, "epoch": 38} {"train_loss": -5.154727935791016, "global_step": 6488, "epoch": 38} {"train_loss": -4.958656311035156, "global_step": 6489, "epoch": 38} {"train_loss": -5.008747577667236, "global_step": 6490, "epoch": 38} {"train_loss": -5.143908977508545, "global_step": 6491, "epoch": 38} {"train_loss": -4.873498439788818, "global_step": 6492, "epoch": 38} {"train_loss": -5.325497627258301, "global_step": 6493, "epoch": 38} {"train_loss": -4.977500915527344, "global_step": 6494, "epoch": 38} {"train_loss": -5.3724045753479, "global_step": 6495, "epoch": 38} {"train_loss": -5.073787212371826, "global_step": 6496, "epoch": 38} {"train_loss": -5.137345314025879, "global_step": 6497, "epoch": 38} {"train_loss": -5.306896209716797, "global_step": 6498, "epoch": 38} {"train_loss": -4.988449573516846, "global_step": 6499, "epoch": 38} {"train_loss": -5.299178600311279, "global_step": 6500, "epoch": 38} {"train_loss": -5.288573265075684, "global_step": 6501, "epoch": 38} {"train_loss": -4.970508098602295, "global_step": 6502, "epoch": 38} {"train_loss": -5.311636924743652, "global_step": 6503, "epoch": 38} {"train_loss": -5.417585372924805, "global_step": 6504, "epoch": 38} {"train_loss": -5.1655778884887695, "global_step": 6505, "epoch": 38} {"train_loss": -5.414112091064453, "global_step": 6506, "epoch": 38} {"train_loss": -5.419101715087891, "global_step": 6507, "epoch": 38} {"train_loss": -5.428816795349121, "global_step": 6508, "epoch": 38} {"train_loss": -5.4215922355651855, "global_step": 6509, "epoch": 38} {"train_loss": -5.424307823181152, "global_step": 6510, "epoch": 38} {"train_loss": -5.419672966003418, "global_step": 6511, "epoch": 38} {"train_loss": -5.16729736328125, "global_step": 6512, "epoch": 38} {"train_loss": -5.387507438659668, "global_step": 6513, "epoch": 38} {"train_loss": -5.388183116912842, "global_step": 6514, "epoch": 38} {"train_loss": -5.109156131744385, "global_step": 6515, "epoch": 38} {"train_loss": -5.312356472015381, "global_step": 6516, "epoch": 38} {"train_loss": -5.6036248207092285, "global_step": 6517, "epoch": 38} {"train_loss": -5.604801654815674, "global_step": 6518, "epoch": 38} {"train_loss": -5.3798418045043945, "global_step": 6519, "epoch": 38} {"train_loss": -5.102360725402832, "global_step": 6520, "epoch": 38} {"train_loss": -5.282466888427734, "global_step": 6521, "epoch": 38} {"train_loss": -5.027008056640625, "global_step": 6522, "epoch": 38} {"train_loss": -5.02762508392334, "global_step": 6523, "epoch": 38} {"train_loss": -4.914726257324219, "global_step": 6524, "epoch": 38} {"train_loss": -5.3202362060546875, "global_step": 6525, "epoch": 38} {"train_loss": -5.242191791534424, "global_step": 6526, "epoch": 38} {"train_loss": -5.3139777183532715, "global_step": 6527, "epoch": 38} {"train_loss": -5.2701029777526855, "global_step": 6528, "epoch": 38} {"train_loss": -5.3848981857299805, "global_step": 6529, "epoch": 38} {"train_loss": -5.059209823608398, "global_step": 6530, "epoch": 38} {"train_loss": -5.380561828613281, "global_step": 6531, "epoch": 38} {"train_loss": -5.0938591957092285, "global_step": 6532, "epoch": 38} {"train_loss": -5.121819496154785, "global_step": 6533, "epoch": 38} {"train_loss": -5.227853298187256, "global_step": 6534, "epoch": 38} {"train_loss": -5.365190029144287, "global_step": 6535, "epoch": 38} {"train_loss": -5.043328285217285, "global_step": 6536, "epoch": 38} {"train_loss": -5.553762435913086, "global_step": 6537, "epoch": 38} {"train_loss": -5.208513259887695, "global_step": 6538, "epoch": 38} {"train_loss": -5.513839244842529, "global_step": 6539, "epoch": 38} {"train_loss": -5.351625919342041, "global_step": 6540, "epoch": 38} {"train_loss": -5.589050769805908, "global_step": 6541, "epoch": 38} {"train_loss": -5.265584945678711, "global_step": 6542, "epoch": 38} {"train_loss": -5.125160217285156, "global_step": 6543, "epoch": 38} {"train_loss": -4.95954704284668, "global_step": 6544, "epoch": 38} {"train_loss": -4.99489688873291, "global_step": 6545, "epoch": 38} {"train_loss": -5.074589252471924, "global_step": 6546, "epoch": 38} {"train_loss": -5.222070693969727, "global_step": 6547, "epoch": 38} {"train_loss": -5.360517501831055, "global_step": 6548, "epoch": 38} {"train_loss": -5.274219036102295, "global_step": 6549, "epoch": 38} {"train_loss": -5.2275238037109375, "global_step": 6550, "epoch": 38} {"train_loss": -5.2451994475864225, "global_step": 6551, "epoch": 38, "val_loss": 269778.1875} {"train_loss": -5.09818172454834, "global_step": 6552, "epoch": 39} {"train_loss": -5.2825469970703125, "global_step": 6553, "epoch": 39} {"train_loss": -5.277675628662109, "global_step": 6554, "epoch": 39} {"train_loss": -5.13397216796875, "global_step": 6555, "epoch": 39} {"train_loss": -5.040740966796875, "global_step": 6556, "epoch": 39} {"train_loss": -5.080170631408691, "global_step": 6557, "epoch": 39} {"train_loss": -5.3180341720581055, "global_step": 6558, "epoch": 39} {"train_loss": -5.064479351043701, "global_step": 6559, "epoch": 39} {"train_loss": -5.28122615814209, "global_step": 6560, "epoch": 39} {"train_loss": -5.001348495483398, "global_step": 6561, "epoch": 39} {"train_loss": -5.185521125793457, "global_step": 6562, "epoch": 39} {"train_loss": -5.283055305480957, "global_step": 6563, "epoch": 39} {"train_loss": -5.075987815856934, "global_step": 6564, "epoch": 39} {"train_loss": -5.227248191833496, "global_step": 6565, "epoch": 39} {"train_loss": -5.058113098144531, "global_step": 6566, "epoch": 39} {"train_loss": -5.0659003257751465, "global_step": 6567, "epoch": 39} {"train_loss": -5.251420974731445, "global_step": 6568, "epoch": 39} {"train_loss": -5.1649017333984375, "global_step": 6569, "epoch": 39} {"train_loss": -5.3035478591918945, "global_step": 6570, "epoch": 39} {"train_loss": -5.071577072143555, "global_step": 6571, "epoch": 39} {"train_loss": -5.345300674438477, "global_step": 6572, "epoch": 39} {"train_loss": -5.246397972106934, "global_step": 6573, "epoch": 39} {"train_loss": -5.411890029907227, "global_step": 6574, "epoch": 39} {"train_loss": -5.009214401245117, "global_step": 6575, "epoch": 39} {"train_loss": -5.375476837158203, "global_step": 6576, "epoch": 39} {"train_loss": -5.141894340515137, "global_step": 6577, "epoch": 39} {"train_loss": -5.057154655456543, "global_step": 6578, "epoch": 39} {"train_loss": -4.988883018493652, "global_step": 6579, "epoch": 39} {"train_loss": -5.413540840148926, "global_step": 6580, "epoch": 39} {"train_loss": -5.179384708404541, "global_step": 6581, "epoch": 39} {"train_loss": -5.416515827178955, "global_step": 6582, "epoch": 39} {"train_loss": -5.348505020141602, "global_step": 6583, "epoch": 39} {"train_loss": -5.443885803222656, "global_step": 6584, "epoch": 39} {"train_loss": -5.167030334472656, "global_step": 6585, "epoch": 39} {"train_loss": -5.3123955726623535, "global_step": 6586, "epoch": 39} {"train_loss": -5.3998613357543945, "global_step": 6587, "epoch": 39} {"train_loss": -5.284462928771973, "global_step": 6588, "epoch": 39} {"train_loss": -5.5046162605285645, "global_step": 6589, "epoch": 39} {"train_loss": -5.3470354080200195, "global_step": 6590, "epoch": 39} {"train_loss": -5.647482872009277, "global_step": 6591, "epoch": 39} {"train_loss": -5.1771063804626465, "global_step": 6592, "epoch": 39} {"train_loss": -5.508859634399414, "global_step": 6593, "epoch": 39} {"train_loss": -5.298055648803711, "global_step": 6594, "epoch": 39} {"train_loss": -5.507851600646973, "global_step": 6595, "epoch": 39} {"train_loss": -5.492583274841309, "global_step": 6596, "epoch": 39} {"train_loss": -5.390023231506348, "global_step": 6597, "epoch": 39} {"train_loss": -5.32398796081543, "global_step": 6598, "epoch": 39} {"train_loss": -5.497547626495361, "global_step": 6599, "epoch": 39} {"train_loss": -5.424990653991699, "global_step": 6600, "epoch": 39} {"train_loss": -5.149360656738281, "global_step": 6601, "epoch": 39} {"train_loss": -5.33782434463501, "global_step": 6602, "epoch": 39} {"train_loss": -5.546761989593506, "global_step": 6603, "epoch": 39} {"train_loss": -5.297207832336426, "global_step": 6604, "epoch": 39} {"train_loss": -5.076489448547363, "global_step": 6605, "epoch": 39} {"train_loss": -5.536170959472656, "global_step": 6606, "epoch": 39} {"train_loss": -5.412972450256348, "global_step": 6607, "epoch": 39} {"train_loss": -5.080228805541992, "global_step": 6608, "epoch": 39} {"train_loss": -5.155697345733643, "global_step": 6609, "epoch": 39} {"train_loss": -5.249387264251709, "global_step": 6610, "epoch": 39} {"train_loss": -5.134151458740234, "global_step": 6611, "epoch": 39} {"train_loss": -5.18808650970459, "global_step": 6612, "epoch": 39} {"train_loss": -5.128287315368652, "global_step": 6613, "epoch": 39} {"train_loss": -5.32562255859375, "global_step": 6614, "epoch": 39} {"train_loss": -5.1920294761657715, "global_step": 6615, "epoch": 39} {"train_loss": -5.468316078186035, "global_step": 6616, "epoch": 39} {"train_loss": -5.039838790893555, "global_step": 6617, "epoch": 39} {"train_loss": -5.31846809387207, "global_step": 6618, "epoch": 39} {"train_loss": -5.395294189453125, "global_step": 6619, "epoch": 39} {"train_loss": -5.35948371887207, "global_step": 6620, "epoch": 39} {"train_loss": -5.314696788787842, "global_step": 6621, "epoch": 39} {"train_loss": -5.338043689727783, "global_step": 6622, "epoch": 39} {"train_loss": -5.378963470458984, "global_step": 6623, "epoch": 39} {"train_loss": -5.464605331420898, "global_step": 6624, "epoch": 39} {"train_loss": -5.316706657409668, "global_step": 6625, "epoch": 39} {"train_loss": -5.399169921875, "global_step": 6626, "epoch": 39} {"train_loss": -5.499060153961182, "global_step": 6627, "epoch": 39} {"train_loss": -5.452339172363281, "global_step": 6628, "epoch": 39} {"train_loss": -5.477302074432373, "global_step": 6629, "epoch": 39} {"train_loss": -5.504580497741699, "global_step": 6630, "epoch": 39} {"train_loss": -5.598794937133789, "global_step": 6631, "epoch": 39} {"train_loss": -5.295914173126221, "global_step": 6632, "epoch": 39} {"train_loss": -5.346133708953857, "global_step": 6633, "epoch": 39} {"train_loss": -5.525206565856934, "global_step": 6634, "epoch": 39} {"train_loss": -5.211142539978027, "global_step": 6635, "epoch": 39} {"train_loss": -5.125085830688477, "global_step": 6636, "epoch": 39} {"train_loss": -5.075780868530273, "global_step": 6637, "epoch": 39} {"train_loss": -4.982000350952148, "global_step": 6638, "epoch": 39} {"train_loss": -4.909928321838379, "global_step": 6639, "epoch": 39} {"train_loss": -5.278986930847168, "global_step": 6640, "epoch": 39} {"train_loss": -5.207100868225098, "global_step": 6641, "epoch": 39} {"train_loss": -5.258432388305664, "global_step": 6642, "epoch": 39} {"train_loss": -4.984108924865723, "global_step": 6643, "epoch": 39} {"train_loss": -5.358477592468262, "global_step": 6644, "epoch": 39} {"train_loss": -5.2718095779418945, "global_step": 6645, "epoch": 39} {"train_loss": -5.352801322937012, "global_step": 6646, "epoch": 39} {"train_loss": -5.250206470489502, "global_step": 6647, "epoch": 39} {"train_loss": -5.3170881271362305, "global_step": 6648, "epoch": 39} {"train_loss": -5.466638088226318, "global_step": 6649, "epoch": 39} {"train_loss": -5.234143257141113, "global_step": 6650, "epoch": 39} {"train_loss": -5.124354362487793, "global_step": 6651, "epoch": 39} {"train_loss": -5.11253547668457, "global_step": 6652, "epoch": 39} {"train_loss": -5.488270282745361, "global_step": 6653, "epoch": 39} {"train_loss": -5.248840808868408, "global_step": 6654, "epoch": 39} {"train_loss": -5.352959156036377, "global_step": 6655, "epoch": 39} {"train_loss": -5.465449810028076, "global_step": 6656, "epoch": 39} {"train_loss": -5.232365131378174, "global_step": 6657, "epoch": 39} {"train_loss": -5.356005668640137, "global_step": 6658, "epoch": 39} {"train_loss": -5.290304183959961, "global_step": 6659, "epoch": 39} {"train_loss": -5.136328220367432, "global_step": 6660, "epoch": 39} {"train_loss": -5.31321907043457, "global_step": 6661, "epoch": 39} {"train_loss": -5.308950901031494, "global_step": 6662, "epoch": 39} {"train_loss": -5.252945899963379, "global_step": 6663, "epoch": 39} {"train_loss": -5.32849645614624, "global_step": 6664, "epoch": 39} {"train_loss": -5.480297088623047, "global_step": 6665, "epoch": 39} {"train_loss": -5.15231990814209, "global_step": 6666, "epoch": 39} {"train_loss": -5.119063854217529, "global_step": 6667, "epoch": 39} {"train_loss": -5.273210048675537, "global_step": 6668, "epoch": 39} {"train_loss": -5.362119674682617, "global_step": 6669, "epoch": 39} {"train_loss": -5.385063648223877, "global_step": 6670, "epoch": 39} {"train_loss": -5.40186071395874, "global_step": 6671, "epoch": 39} {"train_loss": -5.520514488220215, "global_step": 6672, "epoch": 39} {"train_loss": -5.163039684295654, "global_step": 6673, "epoch": 39} {"train_loss": -5.324439525604248, "global_step": 6674, "epoch": 39} {"train_loss": -5.234389305114746, "global_step": 6675, "epoch": 39} {"train_loss": -5.293964385986328, "global_step": 6676, "epoch": 39} {"train_loss": -5.463588714599609, "global_step": 6677, "epoch": 39} {"train_loss": -4.916217803955078, "global_step": 6678, "epoch": 39} {"train_loss": -5.3654913902282715, "global_step": 6679, "epoch": 39} {"train_loss": -5.305158615112305, "global_step": 6680, "epoch": 39} {"train_loss": -5.370838165283203, "global_step": 6681, "epoch": 39} {"train_loss": -5.286020278930664, "global_step": 6682, "epoch": 39} {"train_loss": -5.451898097991943, "global_step": 6683, "epoch": 39} {"train_loss": -5.239320755004883, "global_step": 6684, "epoch": 39} {"train_loss": -5.39188814163208, "global_step": 6685, "epoch": 39} {"train_loss": -5.446440696716309, "global_step": 6686, "epoch": 39} {"train_loss": -5.250415802001953, "global_step": 6687, "epoch": 39} {"train_loss": -5.104053020477295, "global_step": 6688, "epoch": 39} {"train_loss": -5.145871162414551, "global_step": 6689, "epoch": 39} {"train_loss": -5.134049892425537, "global_step": 6690, "epoch": 39} {"train_loss": -5.3470258712768555, "global_step": 6691, "epoch": 39} {"train_loss": -5.038924217224121, "global_step": 6692, "epoch": 39} {"train_loss": -5.147298336029053, "global_step": 6693, "epoch": 39} {"train_loss": -5.3136138916015625, "global_step": 6694, "epoch": 39} {"train_loss": -5.341195106506348, "global_step": 6695, "epoch": 39} {"train_loss": -5.383228778839111, "global_step": 6696, "epoch": 39} {"train_loss": -5.2905168533325195, "global_step": 6697, "epoch": 39} {"train_loss": -5.489272117614746, "global_step": 6698, "epoch": 39} {"train_loss": -4.994863033294678, "global_step": 6699, "epoch": 39} {"train_loss": -5.365705490112305, "global_step": 6700, "epoch": 39} {"train_loss": -5.4202141761779785, "global_step": 6701, "epoch": 39} {"train_loss": -5.3950066566467285, "global_step": 6702, "epoch": 39} {"train_loss": -5.386210918426514, "global_step": 6703, "epoch": 39} {"train_loss": -5.284669399261475, "global_step": 6704, "epoch": 39} {"train_loss": -5.304351806640625, "global_step": 6705, "epoch": 39} {"train_loss": -5.31099796295166, "global_step": 6706, "epoch": 39} {"train_loss": -5.2022294998168945, "global_step": 6707, "epoch": 39} {"train_loss": -5.05948543548584, "global_step": 6708, "epoch": 39} {"train_loss": -5.3783793449401855, "global_step": 6709, "epoch": 39} {"train_loss": -5.1591081619262695, "global_step": 6710, "epoch": 39} {"train_loss": -5.309737205505371, "global_step": 6711, "epoch": 39} {"train_loss": -5.303576469421387, "global_step": 6712, "epoch": 39} {"train_loss": -5.136466979980469, "global_step": 6713, "epoch": 39} {"train_loss": -5.083992004394531, "global_step": 6714, "epoch": 39} {"train_loss": -5.271770477294922, "global_step": 6715, "epoch": 39} {"train_loss": -5.439817428588867, "global_step": 6716, "epoch": 39} {"train_loss": -5.08249044418335, "global_step": 6717, "epoch": 39} {"train_loss": -5.348728179931641, "global_step": 6718, "epoch": 39} {"train_loss": -5.280803260349092, "global_step": 6719, "epoch": 39, "val_loss": 261251.265625} {"train_loss": -5.152502059936523, "global_step": 6720, "epoch": 40} {"train_loss": -5.332607746124268, "global_step": 6721, "epoch": 40} {"train_loss": -5.290782451629639, "global_step": 6722, "epoch": 40} {"train_loss": -5.354625225067139, "global_step": 6723, "epoch": 40} {"train_loss": -5.425295829772949, "global_step": 6724, "epoch": 40} {"train_loss": -5.32387113571167, "global_step": 6725, "epoch": 40} {"train_loss": -5.39154052734375, "global_step": 6726, "epoch": 40} {"train_loss": -5.346632957458496, "global_step": 6727, "epoch": 40} {"train_loss": -5.39103889465332, "global_step": 6728, "epoch": 40} {"train_loss": -5.136399269104004, "global_step": 6729, "epoch": 40} {"train_loss": -5.021479606628418, "global_step": 6730, "epoch": 40} {"train_loss": -5.289885520935059, "global_step": 6731, "epoch": 40} {"train_loss": -5.288820266723633, "global_step": 6732, "epoch": 40} {"train_loss": -5.449599266052246, "global_step": 6733, "epoch": 40} {"train_loss": -5.546179294586182, "global_step": 6734, "epoch": 40} {"train_loss": -5.316583633422852, "global_step": 6735, "epoch": 40} {"train_loss": -5.036409378051758, "global_step": 6736, "epoch": 40} {"train_loss": -5.279571533203125, "global_step": 6737, "epoch": 40} {"train_loss": -4.933052062988281, "global_step": 6738, "epoch": 40} {"train_loss": -4.962155342102051, "global_step": 6739, "epoch": 40} {"train_loss": -4.836598873138428, "global_step": 6740, "epoch": 40} {"train_loss": -5.078246116638184, "global_step": 6741, "epoch": 40} {"train_loss": -5.17119836807251, "global_step": 6742, "epoch": 40} {"train_loss": -5.203736305236816, "global_step": 6743, "epoch": 40} {"train_loss": -5.012874126434326, "global_step": 6744, "epoch": 40} {"train_loss": -5.269402503967285, "global_step": 6745, "epoch": 40} {"train_loss": -5.114672660827637, "global_step": 6746, "epoch": 40} {"train_loss": -5.127861022949219, "global_step": 6747, "epoch": 40} {"train_loss": -5.336543083190918, "global_step": 6748, "epoch": 40} {"train_loss": -5.15748929977417, "global_step": 6749, "epoch": 40} {"train_loss": -5.049771308898926, "global_step": 6750, "epoch": 40} {"train_loss": -5.320535659790039, "global_step": 6751, "epoch": 40} {"train_loss": -5.091754913330078, "global_step": 6752, "epoch": 40} {"train_loss": -5.392801761627197, "global_step": 6753, "epoch": 40} {"train_loss": -4.985618591308594, "global_step": 6754, "epoch": 40} {"train_loss": -5.166568756103516, "global_step": 6755, "epoch": 40} {"train_loss": -5.516603469848633, "global_step": 6756, "epoch": 40} {"train_loss": -5.331957817077637, "global_step": 6757, "epoch": 40} {"train_loss": -5.3815388679504395, "global_step": 6758, "epoch": 40} {"train_loss": -5.488017559051514, "global_step": 6759, "epoch": 40} {"train_loss": -5.43976354598999, "global_step": 6760, "epoch": 40} {"train_loss": -5.452359676361084, "global_step": 6761, "epoch": 40} {"train_loss": -5.436063289642334, "global_step": 6762, "epoch": 40} {"train_loss": -5.457029342651367, "global_step": 6763, "epoch": 40} {"train_loss": -5.486851215362549, "global_step": 6764, "epoch": 40} {"train_loss": -5.502599716186523, "global_step": 6765, "epoch": 40} {"train_loss": -5.305551528930664, "global_step": 6766, "epoch": 40} {"train_loss": -5.477867126464844, "global_step": 6767, "epoch": 40} {"train_loss": -5.349405288696289, "global_step": 6768, "epoch": 40} {"train_loss": -5.199871063232422, "global_step": 6769, "epoch": 40} {"train_loss": -5.388584136962891, "global_step": 6770, "epoch": 40} {"train_loss": -5.379354476928711, "global_step": 6771, "epoch": 40} {"train_loss": -5.303007125854492, "global_step": 6772, "epoch": 40} {"train_loss": -5.258731842041016, "global_step": 6773, "epoch": 40} {"train_loss": -5.142917156219482, "global_step": 6774, "epoch": 40} {"train_loss": -5.269595623016357, "global_step": 6775, "epoch": 40} {"train_loss": -5.3677659034729, "global_step": 6776, "epoch": 40} {"train_loss": -5.3091349601745605, "global_step": 6777, "epoch": 40} {"train_loss": -5.2243194580078125, "global_step": 6778, "epoch": 40} {"train_loss": -5.151312828063965, "global_step": 6779, "epoch": 40} {"train_loss": -5.413328647613525, "global_step": 6780, "epoch": 40} {"train_loss": -5.289498329162598, "global_step": 6781, "epoch": 40} {"train_loss": -5.317109107971191, "global_step": 6782, "epoch": 40} {"train_loss": -5.396556854248047, "global_step": 6783, "epoch": 40} {"train_loss": -5.193765640258789, "global_step": 6784, "epoch": 40} {"train_loss": -5.323615074157715, "global_step": 6785, "epoch": 40} {"train_loss": -5.262416362762451, "global_step": 6786, "epoch": 40} {"train_loss": -5.37382698059082, "global_step": 6787, "epoch": 40} {"train_loss": -5.235197067260742, "global_step": 6788, "epoch": 40} {"train_loss": -5.335953235626221, "global_step": 6789, "epoch": 40} {"train_loss": -5.210122585296631, "global_step": 6790, "epoch": 40} {"train_loss": -5.210260391235352, "global_step": 6791, "epoch": 40} {"train_loss": -5.124024868011475, "global_step": 6792, "epoch": 40} {"train_loss": -5.209368705749512, "global_step": 6793, "epoch": 40} {"train_loss": -5.23393440246582, "global_step": 6794, "epoch": 40} {"train_loss": -5.364961624145508, "global_step": 6795, "epoch": 40} {"train_loss": -5.092007637023926, "global_step": 6796, "epoch": 40} {"train_loss": -5.342016696929932, "global_step": 6797, "epoch": 40} {"train_loss": -5.466653823852539, "global_step": 6798, "epoch": 40} {"train_loss": -5.303332328796387, "global_step": 6799, "epoch": 40} {"train_loss": -5.373941898345947, "global_step": 6800, "epoch": 40} {"train_loss": -5.304747581481934, "global_step": 6801, "epoch": 40} {"train_loss": -5.5634379386901855, "global_step": 6802, "epoch": 40} {"train_loss": -5.000385284423828, "global_step": 6803, "epoch": 40} {"train_loss": -5.318361759185791, "global_step": 6804, "epoch": 40} {"train_loss": -5.233328819274902, "global_step": 6805, "epoch": 40} {"train_loss": -4.977121353149414, "global_step": 6806, "epoch": 40} {"train_loss": -5.637320518493652, "global_step": 6807, "epoch": 40} {"train_loss": -4.989741325378418, "global_step": 6808, "epoch": 40} {"train_loss": -5.291788578033447, "global_step": 6809, "epoch": 40} {"train_loss": -5.305271148681641, "global_step": 6810, "epoch": 40} {"train_loss": -5.022699356079102, "global_step": 6811, "epoch": 40} {"train_loss": -5.12906551361084, "global_step": 6812, "epoch": 40} {"train_loss": -5.338955879211426, "global_step": 6813, "epoch": 40} {"train_loss": -5.0782470703125, "global_step": 6814, "epoch": 40} {"train_loss": -5.160879611968994, "global_step": 6815, "epoch": 40} {"train_loss": -4.732333660125732, "global_step": 6816, "epoch": 40} {"train_loss": -4.797208786010742, "global_step": 6817, "epoch": 40} {"train_loss": -5.058734893798828, "global_step": 6818, "epoch": 40} {"train_loss": -4.8607940673828125, "global_step": 6819, "epoch": 40} {"train_loss": -4.783631324768066, "global_step": 6820, "epoch": 40} {"train_loss": -5.213482856750488, "global_step": 6821, "epoch": 40} {"train_loss": -5.032459259033203, "global_step": 6822, "epoch": 40} {"train_loss": -5.0790114402771, "global_step": 6823, "epoch": 40} {"train_loss": -5.166599273681641, "global_step": 6824, "epoch": 40} {"train_loss": -5.108905792236328, "global_step": 6825, "epoch": 40} {"train_loss": -4.942840576171875, "global_step": 6826, "epoch": 40} {"train_loss": -5.169682502746582, "global_step": 6827, "epoch": 40} {"train_loss": -5.163638114929199, "global_step": 6828, "epoch": 40} {"train_loss": -4.942913055419922, "global_step": 6829, "epoch": 40} {"train_loss": -5.127239227294922, "global_step": 6830, "epoch": 40} {"train_loss": -5.198648929595947, "global_step": 6831, "epoch": 40} {"train_loss": -5.155655860900879, "global_step": 6832, "epoch": 40} {"train_loss": -5.104630947113037, "global_step": 6833, "epoch": 40} {"train_loss": -5.157411575317383, "global_step": 6834, "epoch": 40} {"train_loss": -4.696770668029785, "global_step": 6835, "epoch": 40} {"train_loss": -5.206040382385254, "global_step": 6836, "epoch": 40} {"train_loss": -5.296832084655762, "global_step": 6837, "epoch": 40} {"train_loss": -5.199286460876465, "global_step": 6838, "epoch": 40} {"train_loss": -5.336781024932861, "global_step": 6839, "epoch": 40} {"train_loss": -5.252118110656738, "global_step": 6840, "epoch": 40} {"train_loss": -5.005612373352051, "global_step": 6841, "epoch": 40} {"train_loss": -5.159340858459473, "global_step": 6842, "epoch": 40} {"train_loss": -5.051478385925293, "global_step": 6843, "epoch": 40} {"train_loss": -5.084025859832764, "global_step": 6844, "epoch": 40} {"train_loss": -5.228320121765137, "global_step": 6845, "epoch": 40} {"train_loss": -5.238102912902832, "global_step": 6846, "epoch": 40} {"train_loss": -5.136351585388184, "global_step": 6847, "epoch": 40} {"train_loss": -5.2108845710754395, "global_step": 6848, "epoch": 40} {"train_loss": -5.02511739730835, "global_step": 6849, "epoch": 40} {"train_loss": -5.350748538970947, "global_step": 6850, "epoch": 40} {"train_loss": -5.362401962280273, "global_step": 6851, "epoch": 40} {"train_loss": -5.3467607498168945, "global_step": 6852, "epoch": 40} {"train_loss": -5.376861572265625, "global_step": 6853, "epoch": 40} {"train_loss": -5.191283226013184, "global_step": 6854, "epoch": 40} {"train_loss": -5.594095230102539, "global_step": 6855, "epoch": 40} {"train_loss": -5.5407609939575195, "global_step": 6856, "epoch": 40} {"train_loss": -5.39449405670166, "global_step": 6857, "epoch": 40} {"train_loss": -5.667495250701904, "global_step": 6858, "epoch": 40} {"train_loss": -5.2601752281188965, "global_step": 6859, "epoch": 40} {"train_loss": -5.549975872039795, "global_step": 6860, "epoch": 40} {"train_loss": -5.237985610961914, "global_step": 6861, "epoch": 40} {"train_loss": -5.289668083190918, "global_step": 6862, "epoch": 40} {"train_loss": -5.509433746337891, "global_step": 6863, "epoch": 40} {"train_loss": -5.456757068634033, "global_step": 6864, "epoch": 40} {"train_loss": -5.239723205566406, "global_step": 6865, "epoch": 40} {"train_loss": -5.372437953948975, "global_step": 6866, "epoch": 40} {"train_loss": -5.165495872497559, "global_step": 6867, "epoch": 40} {"train_loss": -5.473590850830078, "global_step": 6868, "epoch": 40} {"train_loss": -5.402045249938965, "global_step": 6869, "epoch": 40} {"train_loss": -5.38304328918457, "global_step": 6870, "epoch": 40} {"train_loss": -5.481544494628906, "global_step": 6871, "epoch": 40} {"train_loss": -5.0977067947387695, "global_step": 6872, "epoch": 40} {"train_loss": -5.304154872894287, "global_step": 6873, "epoch": 40} {"train_loss": -5.397464752197266, "global_step": 6874, "epoch": 40} {"train_loss": -5.335755348205566, "global_step": 6875, "epoch": 40} {"train_loss": -5.406715393066406, "global_step": 6876, "epoch": 40} {"train_loss": -5.486902236938477, "global_step": 6877, "epoch": 40} {"train_loss": -5.374457359313965, "global_step": 6878, "epoch": 40} {"train_loss": -5.509546279907227, "global_step": 6879, "epoch": 40} {"train_loss": -5.489069938659668, "global_step": 6880, "epoch": 40} {"train_loss": -5.598840713500977, "global_step": 6881, "epoch": 40} {"train_loss": -5.524032115936279, "global_step": 6882, "epoch": 40} {"train_loss": -5.384270668029785, "global_step": 6883, "epoch": 40} {"train_loss": -5.47227668762207, "global_step": 6884, "epoch": 40} {"train_loss": -5.44921875, "global_step": 6885, "epoch": 40} {"train_loss": -5.4613423347473145, "global_step": 6886, "epoch": 40} {"train_loss": -5.26125697294871, "global_step": 6887, "epoch": 40, "val_loss": 266169.28125, "train_action_mse_error": 61.21148681640625} {"train_loss": -5.466500282287598, "global_step": 6888, "epoch": 41} {"train_loss": -5.288735866546631, "global_step": 6889, "epoch": 41} {"train_loss": -5.1682209968566895, "global_step": 6890, "epoch": 41} {"train_loss": -5.409578323364258, "global_step": 6891, "epoch": 41} {"train_loss": -5.369016647338867, "global_step": 6892, "epoch": 41} {"train_loss": -5.101673603057861, "global_step": 6893, "epoch": 41} {"train_loss": -5.367875099182129, "global_step": 6894, "epoch": 41} {"train_loss": -5.418509483337402, "global_step": 6895, "epoch": 41} {"train_loss": -5.241875648498535, "global_step": 6896, "epoch": 41} {"train_loss": -5.473871231079102, "global_step": 6897, "epoch": 41} {"train_loss": -5.268659591674805, "global_step": 6898, "epoch": 41} {"train_loss": -5.47689151763916, "global_step": 6899, "epoch": 41} {"train_loss": -5.402041435241699, "global_step": 6900, "epoch": 41} {"train_loss": -5.255942344665527, "global_step": 6901, "epoch": 41} {"train_loss": -5.017274856567383, "global_step": 6902, "epoch": 41} {"train_loss": -5.377816200256348, "global_step": 6903, "epoch": 41} {"train_loss": -5.618483543395996, "global_step": 6904, "epoch": 41} {"train_loss": -5.288237571716309, "global_step": 6905, "epoch": 41} {"train_loss": -5.549397945404053, "global_step": 6906, "epoch": 41} {"train_loss": -5.4317216873168945, "global_step": 6907, "epoch": 41} {"train_loss": -5.4098920822143555, "global_step": 6908, "epoch": 41} {"train_loss": -5.170044422149658, "global_step": 6909, "epoch": 41} {"train_loss": -5.409189224243164, "global_step": 6910, "epoch": 41} {"train_loss": -5.3015007972717285, "global_step": 6911, "epoch": 41} {"train_loss": -5.2430644035339355, "global_step": 6912, "epoch": 41} {"train_loss": -5.3807220458984375, "global_step": 6913, "epoch": 41} {"train_loss": -5.400819778442383, "global_step": 6914, "epoch": 41} {"train_loss": -4.967304706573486, "global_step": 6915, "epoch": 41} {"train_loss": -4.8825531005859375, "global_step": 6916, "epoch": 41} {"train_loss": -5.215744972229004, "global_step": 6917, "epoch": 41} {"train_loss": -5.251562118530273, "global_step": 6918, "epoch": 41} {"train_loss": -5.44197940826416, "global_step": 6919, "epoch": 41} {"train_loss": -5.250056266784668, "global_step": 6920, "epoch": 41} {"train_loss": -5.418898582458496, "global_step": 6921, "epoch": 41} {"train_loss": -5.208944797515869, "global_step": 6922, "epoch": 41} {"train_loss": -5.37546443939209, "global_step": 6923, "epoch": 41} {"train_loss": -5.281167030334473, "global_step": 6924, "epoch": 41} {"train_loss": -5.113541603088379, "global_step": 6925, "epoch": 41} {"train_loss": -5.279830455780029, "global_step": 6926, "epoch": 41} {"train_loss": -5.216657638549805, "global_step": 6927, "epoch": 41} {"train_loss": -5.315167427062988, "global_step": 6928, "epoch": 41} {"train_loss": -5.046479225158691, "global_step": 6929, "epoch": 41} {"train_loss": -5.119542121887207, "global_step": 6930, "epoch": 41} {"train_loss": -5.317863464355469, "global_step": 6931, "epoch": 41} {"train_loss": -5.283041954040527, "global_step": 6932, "epoch": 41} {"train_loss": -5.08557653427124, "global_step": 6933, "epoch": 41} {"train_loss": -5.336222171783447, "global_step": 6934, "epoch": 41} {"train_loss": -5.202264785766602, "global_step": 6935, "epoch": 41} {"train_loss": -5.357540130615234, "global_step": 6936, "epoch": 41} {"train_loss": -5.204951763153076, "global_step": 6937, "epoch": 41} {"train_loss": -5.083989143371582, "global_step": 6938, "epoch": 41} {"train_loss": -5.439711570739746, "global_step": 6939, "epoch": 41} {"train_loss": -5.336167335510254, "global_step": 6940, "epoch": 41} {"train_loss": -5.330650806427002, "global_step": 6941, "epoch": 41} {"train_loss": -5.11395263671875, "global_step": 6942, "epoch": 41} {"train_loss": -5.375402927398682, "global_step": 6943, "epoch": 41} {"train_loss": -5.528725624084473, "global_step": 6944, "epoch": 41} {"train_loss": -5.44348669052124, "global_step": 6945, "epoch": 41} {"train_loss": -5.150188446044922, "global_step": 6946, "epoch": 41} {"train_loss": -5.380352973937988, "global_step": 6947, "epoch": 41} {"train_loss": -5.508937835693359, "global_step": 6948, "epoch": 41} {"train_loss": -5.428007125854492, "global_step": 6949, "epoch": 41} {"train_loss": -5.60957670211792, "global_step": 6950, "epoch": 41} {"train_loss": -5.403773307800293, "global_step": 6951, "epoch": 41} {"train_loss": -5.174369812011719, "global_step": 6952, "epoch": 41} {"train_loss": -5.370634078979492, "global_step": 6953, "epoch": 41} {"train_loss": -5.448315143585205, "global_step": 6954, "epoch": 41} {"train_loss": -5.070354461669922, "global_step": 6955, "epoch": 41} {"train_loss": -5.499821662902832, "global_step": 6956, "epoch": 41} {"train_loss": -5.353289604187012, "global_step": 6957, "epoch": 41} {"train_loss": -5.193154811859131, "global_step": 6958, "epoch": 41} {"train_loss": -5.219629287719727, "global_step": 6959, "epoch": 41} {"train_loss": -5.057472229003906, "global_step": 6960, "epoch": 41} {"train_loss": -5.399285316467285, "global_step": 6961, "epoch": 41} {"train_loss": -5.218475341796875, "global_step": 6962, "epoch": 41} {"train_loss": -5.436269760131836, "global_step": 6963, "epoch": 41} {"train_loss": -5.1772308349609375, "global_step": 6964, "epoch": 41} {"train_loss": -5.560479640960693, "global_step": 6965, "epoch": 41} {"train_loss": -5.271696090698242, "global_step": 6966, "epoch": 41} {"train_loss": -5.516772270202637, "global_step": 6967, "epoch": 41} {"train_loss": -5.330442428588867, "global_step": 6968, "epoch": 41} {"train_loss": -5.517577171325684, "global_step": 6969, "epoch": 41} {"train_loss": -5.441983222961426, "global_step": 6970, "epoch": 41} {"train_loss": -5.206927299499512, "global_step": 6971, "epoch": 41} {"train_loss": -5.610543727874756, "global_step": 6972, "epoch": 41} {"train_loss": -5.364028453826904, "global_step": 6973, "epoch": 41} {"train_loss": -5.2724199295043945, "global_step": 6974, "epoch": 41} {"train_loss": -5.407942295074463, "global_step": 6975, "epoch": 41} {"train_loss": -5.39301872253418, "global_step": 6976, "epoch": 41} {"train_loss": -5.5543975830078125, "global_step": 6977, "epoch": 41} {"train_loss": -5.126488208770752, "global_step": 6978, "epoch": 41} {"train_loss": -5.363651275634766, "global_step": 6979, "epoch": 41} {"train_loss": -5.267953872680664, "global_step": 6980, "epoch": 41} {"train_loss": -5.480441570281982, "global_step": 6981, "epoch": 41} {"train_loss": -5.272920608520508, "global_step": 6982, "epoch": 41} {"train_loss": -5.0697784423828125, "global_step": 6983, "epoch": 41} {"train_loss": -5.076486587524414, "global_step": 6984, "epoch": 41} {"train_loss": -5.135136127471924, "global_step": 6985, "epoch": 41} {"train_loss": -5.345224380493164, "global_step": 6986, "epoch": 41} {"train_loss": -5.425461292266846, "global_step": 6987, "epoch": 41} {"train_loss": -5.270743370056152, "global_step": 6988, "epoch": 41} {"train_loss": -5.436456680297852, "global_step": 6989, "epoch": 41} {"train_loss": -5.457244873046875, "global_step": 6990, "epoch": 41} {"train_loss": -5.0582733154296875, "global_step": 6991, "epoch": 41} {"train_loss": -5.302810192108154, "global_step": 6992, "epoch": 41} {"train_loss": -5.044194221496582, "global_step": 6993, "epoch": 41} {"train_loss": -5.458128929138184, "global_step": 6994, "epoch": 41} {"train_loss": -5.326977729797363, "global_step": 6995, "epoch": 41} {"train_loss": -5.491426467895508, "global_step": 6996, "epoch": 41} {"train_loss": -5.379826068878174, "global_step": 6997, "epoch": 41} {"train_loss": -5.391304969787598, "global_step": 6998, "epoch": 41} {"train_loss": -5.482090950012207, "global_step": 6999, "epoch": 41} {"train_loss": -5.514957904815674, "global_step": 7000, "epoch": 41} {"train_loss": -5.342599868774414, "global_step": 7001, "epoch": 41} {"train_loss": -5.437480449676514, "global_step": 7002, "epoch": 41} {"train_loss": -5.036985397338867, "global_step": 7003, "epoch": 41} {"train_loss": -5.328335762023926, "global_step": 7004, "epoch": 41} {"train_loss": -5.130026340484619, "global_step": 7005, "epoch": 41} {"train_loss": -5.474172115325928, "global_step": 7006, "epoch": 41} {"train_loss": -5.193331718444824, "global_step": 7007, "epoch": 41} {"train_loss": -5.437136650085449, "global_step": 7008, "epoch": 41} {"train_loss": -5.224822044372559, "global_step": 7009, "epoch": 41} {"train_loss": -5.321844100952148, "global_step": 7010, "epoch": 41} {"train_loss": -5.217486381530762, "global_step": 7011, "epoch": 41} {"train_loss": -5.203543663024902, "global_step": 7012, "epoch": 41} {"train_loss": -5.11016845703125, "global_step": 7013, "epoch": 41} {"train_loss": -5.142716407775879, "global_step": 7014, "epoch": 41} {"train_loss": -5.195063591003418, "global_step": 7015, "epoch": 41} {"train_loss": -5.100649833679199, "global_step": 7016, "epoch": 41} {"train_loss": -4.931378364562988, "global_step": 7017, "epoch": 41} {"train_loss": -5.105336666107178, "global_step": 7018, "epoch": 41} {"train_loss": -5.376140594482422, "global_step": 7019, "epoch": 41} {"train_loss": -5.3839569091796875, "global_step": 7020, "epoch": 41} {"train_loss": -5.222151756286621, "global_step": 7021, "epoch": 41} {"train_loss": -5.534109592437744, "global_step": 7022, "epoch": 41} {"train_loss": -5.325493335723877, "global_step": 7023, "epoch": 41} {"train_loss": -5.197725772857666, "global_step": 7024, "epoch": 41} {"train_loss": -5.07888650894165, "global_step": 7025, "epoch": 41} {"train_loss": -5.206047058105469, "global_step": 7026, "epoch": 41} {"train_loss": -5.198626518249512, "global_step": 7027, "epoch": 41} {"train_loss": -5.248296737670898, "global_step": 7028, "epoch": 41} {"train_loss": -5.121158599853516, "global_step": 7029, "epoch": 41} {"train_loss": -5.090259075164795, "global_step": 7030, "epoch": 41} {"train_loss": -5.373025894165039, "global_step": 7031, "epoch": 41} {"train_loss": -5.17974328994751, "global_step": 7032, "epoch": 41} {"train_loss": -5.319340229034424, "global_step": 7033, "epoch": 41} {"train_loss": -5.284788608551025, "global_step": 7034, "epoch": 41} {"train_loss": -5.450038909912109, "global_step": 7035, "epoch": 41} {"train_loss": -5.331211566925049, "global_step": 7036, "epoch": 41} {"train_loss": -5.212385654449463, "global_step": 7037, "epoch": 41} {"train_loss": -5.2751336097717285, "global_step": 7038, "epoch": 41} {"train_loss": -5.487321853637695, "global_step": 7039, "epoch": 41} {"train_loss": -5.328814506530762, "global_step": 7040, "epoch": 41} {"train_loss": -5.189897537231445, "global_step": 7041, "epoch": 41} {"train_loss": -5.491181373596191, "global_step": 7042, "epoch": 41} {"train_loss": -5.141525745391846, "global_step": 7043, "epoch": 41} {"train_loss": -5.713622093200684, "global_step": 7044, "epoch": 41} {"train_loss": -5.474040508270264, "global_step": 7045, "epoch": 41} {"train_loss": -5.141204833984375, "global_step": 7046, "epoch": 41} {"train_loss": -5.5037431716918945, "global_step": 7047, "epoch": 41} {"train_loss": -5.5162034034729, "global_step": 7048, "epoch": 41} {"train_loss": -5.430576801300049, "global_step": 7049, "epoch": 41} {"train_loss": -5.4370927810668945, "global_step": 7050, "epoch": 41} {"train_loss": -5.268795013427734, "global_step": 7051, "epoch": 41} {"train_loss": -5.256824970245361, "global_step": 7052, "epoch": 41} {"train_loss": -5.32174015045166, "global_step": 7053, "epoch": 41} {"train_loss": -5.217632293701172, "global_step": 7054, "epoch": 41} {"train_loss": -5.307593882083893, "global_step": 7055, "epoch": 41, "val_loss": 269461.0625} {"train_loss": -5.359731197357178, "global_step": 7056, "epoch": 42} {"train_loss": -5.379617214202881, "global_step": 7057, "epoch": 42} {"train_loss": -5.136905670166016, "global_step": 7058, "epoch": 42} {"train_loss": -5.303902626037598, "global_step": 7059, "epoch": 42} {"train_loss": -5.2818756103515625, "global_step": 7060, "epoch": 42} {"train_loss": -5.21434211730957, "global_step": 7061, "epoch": 42} {"train_loss": -5.3413848876953125, "global_step": 7062, "epoch": 42} {"train_loss": -5.347731590270996, "global_step": 7063, "epoch": 42} {"train_loss": -5.197388648986816, "global_step": 7064, "epoch": 42} {"train_loss": -5.403459548950195, "global_step": 7065, "epoch": 42} {"train_loss": -5.224324703216553, "global_step": 7066, "epoch": 42} {"train_loss": -5.370528221130371, "global_step": 7067, "epoch": 42} {"train_loss": -5.14633846282959, "global_step": 7068, "epoch": 42} {"train_loss": -5.140382766723633, "global_step": 7069, "epoch": 42} {"train_loss": -5.3929948806762695, "global_step": 7070, "epoch": 42} {"train_loss": -5.321198463439941, "global_step": 7071, "epoch": 42} {"train_loss": -5.133127689361572, "global_step": 7072, "epoch": 42} {"train_loss": -5.370278358459473, "global_step": 7073, "epoch": 42} {"train_loss": -5.507061004638672, "global_step": 7074, "epoch": 42} {"train_loss": -5.36119270324707, "global_step": 7075, "epoch": 42} {"train_loss": -5.401330471038818, "global_step": 7076, "epoch": 42} {"train_loss": -5.185821533203125, "global_step": 7077, "epoch": 42} {"train_loss": -5.178357124328613, "global_step": 7078, "epoch": 42} {"train_loss": -5.302361011505127, "global_step": 7079, "epoch": 42} {"train_loss": -5.3090715408325195, "global_step": 7080, "epoch": 42} {"train_loss": -5.445380687713623, "global_step": 7081, "epoch": 42} {"train_loss": -5.295349597930908, "global_step": 7082, "epoch": 42} {"train_loss": -5.333083629608154, "global_step": 7083, "epoch": 42} {"train_loss": -5.401278495788574, "global_step": 7084, "epoch": 42} {"train_loss": -5.49373197555542, "global_step": 7085, "epoch": 42} {"train_loss": -5.194398880004883, "global_step": 7086, "epoch": 42} {"train_loss": -5.181344509124756, "global_step": 7087, "epoch": 42} {"train_loss": -5.6358642578125, "global_step": 7088, "epoch": 42} {"train_loss": -5.148897647857666, "global_step": 7089, "epoch": 42} {"train_loss": -5.308613300323486, "global_step": 7090, "epoch": 42} {"train_loss": -5.172119140625, "global_step": 7091, "epoch": 42} {"train_loss": -5.2582879066467285, "global_step": 7092, "epoch": 42} {"train_loss": -5.469079494476318, "global_step": 7093, "epoch": 42} {"train_loss": -5.026915073394775, "global_step": 7094, "epoch": 42} {"train_loss": -5.617215633392334, "global_step": 7095, "epoch": 42} {"train_loss": -5.228457450866699, "global_step": 7096, "epoch": 42} {"train_loss": -5.288341045379639, "global_step": 7097, "epoch": 42} {"train_loss": -5.080778121948242, "global_step": 7098, "epoch": 42} {"train_loss": -5.335919380187988, "global_step": 7099, "epoch": 42} {"train_loss": -5.420716285705566, "global_step": 7100, "epoch": 42} {"train_loss": -5.457633972167969, "global_step": 7101, "epoch": 42} {"train_loss": -5.370959281921387, "global_step": 7102, "epoch": 42} {"train_loss": -5.473298072814941, "global_step": 7103, "epoch": 42} {"train_loss": -5.491808891296387, "global_step": 7104, "epoch": 42} {"train_loss": -5.313016891479492, "global_step": 7105, "epoch": 42} {"train_loss": -5.50499153137207, "global_step": 7106, "epoch": 42} {"train_loss": -5.482447624206543, "global_step": 7107, "epoch": 42} {"train_loss": -5.641277313232422, "global_step": 7108, "epoch": 42} {"train_loss": -5.217410087585449, "global_step": 7109, "epoch": 42} {"train_loss": -5.063019752502441, "global_step": 7110, "epoch": 42} {"train_loss": -5.335068225860596, "global_step": 7111, "epoch": 42} {"train_loss": -5.199000835418701, "global_step": 7112, "epoch": 42} {"train_loss": -5.407196044921875, "global_step": 7113, "epoch": 42} {"train_loss": -5.534609317779541, "global_step": 7114, "epoch": 42} {"train_loss": -5.482190132141113, "global_step": 7115, "epoch": 42} {"train_loss": -5.507896423339844, "global_step": 7116, "epoch": 42} {"train_loss": -5.613914489746094, "global_step": 7117, "epoch": 42} {"train_loss": -5.544034957885742, "global_step": 7118, "epoch": 42} {"train_loss": -5.41933536529541, "global_step": 7119, "epoch": 42} {"train_loss": -5.170625686645508, "global_step": 7120, "epoch": 42} {"train_loss": -5.287464141845703, "global_step": 7121, "epoch": 42} {"train_loss": -5.168939590454102, "global_step": 7122, "epoch": 42} {"train_loss": -5.236293315887451, "global_step": 7123, "epoch": 42} {"train_loss": -4.907721996307373, "global_step": 7124, "epoch": 42} {"train_loss": -5.168072700500488, "global_step": 7125, "epoch": 42} {"train_loss": -5.508660316467285, "global_step": 7126, "epoch": 42} {"train_loss": -5.259845733642578, "global_step": 7127, "epoch": 42} {"train_loss": -5.46187162399292, "global_step": 7128, "epoch": 42} {"train_loss": -5.523183822631836, "global_step": 7129, "epoch": 42} {"train_loss": -5.475952625274658, "global_step": 7130, "epoch": 42} {"train_loss": -5.426307678222656, "global_step": 7131, "epoch": 42} {"train_loss": -5.243306636810303, "global_step": 7132, "epoch": 42} {"train_loss": -5.4818267822265625, "global_step": 7133, "epoch": 42} {"train_loss": -5.161258220672607, "global_step": 7134, "epoch": 42} {"train_loss": -5.357161998748779, "global_step": 7135, "epoch": 42} {"train_loss": -5.372494697570801, "global_step": 7136, "epoch": 42} {"train_loss": -5.324493408203125, "global_step": 7137, "epoch": 42} {"train_loss": -5.3053812980651855, "global_step": 7138, "epoch": 42} {"train_loss": -5.251857757568359, "global_step": 7139, "epoch": 42} {"train_loss": -5.423172950744629, "global_step": 7140, "epoch": 42} {"train_loss": -5.431582927703857, "global_step": 7141, "epoch": 42} {"train_loss": -5.56096076965332, "global_step": 7142, "epoch": 42} {"train_loss": -5.673405647277832, "global_step": 7143, "epoch": 42} {"train_loss": -5.434447765350342, "global_step": 7144, "epoch": 42} {"train_loss": -5.325117111206055, "global_step": 7145, "epoch": 42} {"train_loss": -5.442591667175293, "global_step": 7146, "epoch": 42} {"train_loss": -5.636475086212158, "global_step": 7147, "epoch": 42} {"train_loss": -5.691230773925781, "global_step": 7148, "epoch": 42} {"train_loss": -5.473111152648926, "global_step": 7149, "epoch": 42} {"train_loss": -5.574819087982178, "global_step": 7150, "epoch": 42} {"train_loss": -5.440179824829102, "global_step": 7151, "epoch": 42} {"train_loss": -5.50408935546875, "global_step": 7152, "epoch": 42} {"train_loss": -5.7852020263671875, "global_step": 7153, "epoch": 42} {"train_loss": -5.336306571960449, "global_step": 7154, "epoch": 42} {"train_loss": -5.227578163146973, "global_step": 7155, "epoch": 42} {"train_loss": -5.254880905151367, "global_step": 7156, "epoch": 42} {"train_loss": -5.31411075592041, "global_step": 7157, "epoch": 42} {"train_loss": -5.1127166748046875, "global_step": 7158, "epoch": 42} {"train_loss": -5.447295188903809, "global_step": 7159, "epoch": 42} {"train_loss": -5.032337188720703, "global_step": 7160, "epoch": 42} {"train_loss": -5.23006534576416, "global_step": 7161, "epoch": 42} {"train_loss": -5.227535247802734, "global_step": 7162, "epoch": 42} {"train_loss": -5.119623184204102, "global_step": 7163, "epoch": 42} {"train_loss": -5.403851509094238, "global_step": 7164, "epoch": 42} {"train_loss": -5.119965076446533, "global_step": 7165, "epoch": 42} {"train_loss": -4.995002746582031, "global_step": 7166, "epoch": 42} {"train_loss": -5.167369365692139, "global_step": 7167, "epoch": 42} {"train_loss": -5.183952331542969, "global_step": 7168, "epoch": 42} {"train_loss": -5.143247604370117, "global_step": 7169, "epoch": 42} {"train_loss": -5.227994918823242, "global_step": 7170, "epoch": 42} {"train_loss": -5.2455525398254395, "global_step": 7171, "epoch": 42} {"train_loss": -5.324536323547363, "global_step": 7172, "epoch": 42} {"train_loss": -5.3868913650512695, "global_step": 7173, "epoch": 42} {"train_loss": -5.508331298828125, "global_step": 7174, "epoch": 42} {"train_loss": -4.97395133972168, "global_step": 7175, "epoch": 42} {"train_loss": -5.4395833015441895, "global_step": 7176, "epoch": 42} {"train_loss": -5.51658296585083, "global_step": 7177, "epoch": 42} {"train_loss": -5.399994850158691, "global_step": 7178, "epoch": 42} {"train_loss": -5.510617733001709, "global_step": 7179, "epoch": 42} {"train_loss": -5.487836837768555, "global_step": 7180, "epoch": 42} {"train_loss": -5.415851593017578, "global_step": 7181, "epoch": 42} {"train_loss": -5.08829402923584, "global_step": 7182, "epoch": 42} {"train_loss": -5.111826419830322, "global_step": 7183, "epoch": 42} {"train_loss": -5.255245208740234, "global_step": 7184, "epoch": 42} {"train_loss": -5.425777435302734, "global_step": 7185, "epoch": 42} {"train_loss": -5.5440754890441895, "global_step": 7186, "epoch": 42} {"train_loss": -5.141463279724121, "global_step": 7187, "epoch": 42} {"train_loss": -5.613399505615234, "global_step": 7188, "epoch": 42} {"train_loss": -5.307639122009277, "global_step": 7189, "epoch": 42} {"train_loss": -5.57905387878418, "global_step": 7190, "epoch": 42} {"train_loss": -5.333889007568359, "global_step": 7191, "epoch": 42} {"train_loss": -5.4746503829956055, "global_step": 7192, "epoch": 42} {"train_loss": -5.446733474731445, "global_step": 7193, "epoch": 42} {"train_loss": -5.446844100952148, "global_step": 7194, "epoch": 42} {"train_loss": -5.460178375244141, "global_step": 7195, "epoch": 42} {"train_loss": -5.549524307250977, "global_step": 7196, "epoch": 42} {"train_loss": -5.153187274932861, "global_step": 7197, "epoch": 42} {"train_loss": -5.481426239013672, "global_step": 7198, "epoch": 42} {"train_loss": -5.21376895904541, "global_step": 7199, "epoch": 42} {"train_loss": -5.475380897521973, "global_step": 7200, "epoch": 42} {"train_loss": -5.315983772277832, "global_step": 7201, "epoch": 42} {"train_loss": -5.200834274291992, "global_step": 7202, "epoch": 42} {"train_loss": -5.199125289916992, "global_step": 7203, "epoch": 42} {"train_loss": -5.013764381408691, "global_step": 7204, "epoch": 42} {"train_loss": -5.448328971862793, "global_step": 7205, "epoch": 42} {"train_loss": -5.5532684326171875, "global_step": 7206, "epoch": 42} {"train_loss": -5.21832799911499, "global_step": 7207, "epoch": 42} {"train_loss": -5.582385063171387, "global_step": 7208, "epoch": 42} {"train_loss": -5.260383605957031, "global_step": 7209, "epoch": 42} {"train_loss": -5.380997657775879, "global_step": 7210, "epoch": 42} {"train_loss": -5.186621189117432, "global_step": 7211, "epoch": 42} {"train_loss": -5.409521102905273, "global_step": 7212, "epoch": 42} {"train_loss": -5.229763984680176, "global_step": 7213, "epoch": 42} {"train_loss": -5.4447760581970215, "global_step": 7214, "epoch": 42} {"train_loss": -5.3448944091796875, "global_step": 7215, "epoch": 42} {"train_loss": -5.589223384857178, "global_step": 7216, "epoch": 42} {"train_loss": -5.296666622161865, "global_step": 7217, "epoch": 42} {"train_loss": -5.496304512023926, "global_step": 7218, "epoch": 42} {"train_loss": -5.553775310516357, "global_step": 7219, "epoch": 42} {"train_loss": -5.516671180725098, "global_step": 7220, "epoch": 42} {"train_loss": -5.546854019165039, "global_step": 7221, "epoch": 42} {"train_loss": -5.483160018920898, "global_step": 7222, "epoch": 42} {"train_loss": -5.350687827382769, "global_step": 7223, "epoch": 42, "val_loss": 268831.78125} {"train_loss": -5.312726974487305, "global_step": 7224, "epoch": 43} {"train_loss": -5.3879313468933105, "global_step": 7225, "epoch": 43} {"train_loss": -5.392333030700684, "global_step": 7226, "epoch": 43} {"train_loss": -5.462398529052734, "global_step": 7227, "epoch": 43} {"train_loss": -5.377891540527344, "global_step": 7228, "epoch": 43} {"train_loss": -5.211720943450928, "global_step": 7229, "epoch": 43} {"train_loss": -5.442410469055176, "global_step": 7230, "epoch": 43} {"train_loss": -5.232613563537598, "global_step": 7231, "epoch": 43} {"train_loss": -5.026291847229004, "global_step": 7232, "epoch": 43} {"train_loss": -5.3732008934021, "global_step": 7233, "epoch": 43} {"train_loss": -5.101515293121338, "global_step": 7234, "epoch": 43} {"train_loss": -5.252727508544922, "global_step": 7235, "epoch": 43} {"train_loss": -5.195121765136719, "global_step": 7236, "epoch": 43} {"train_loss": -5.386850357055664, "global_step": 7237, "epoch": 43} {"train_loss": -5.22611141204834, "global_step": 7238, "epoch": 43} {"train_loss": -5.154014587402344, "global_step": 7239, "epoch": 43} {"train_loss": -5.219888210296631, "global_step": 7240, "epoch": 43} {"train_loss": -5.4019622802734375, "global_step": 7241, "epoch": 43} {"train_loss": -5.375028133392334, "global_step": 7242, "epoch": 43} {"train_loss": -5.271028518676758, "global_step": 7243, "epoch": 43} {"train_loss": -5.477959632873535, "global_step": 7244, "epoch": 43} {"train_loss": -5.3329644203186035, "global_step": 7245, "epoch": 43} {"train_loss": -5.483855247497559, "global_step": 7246, "epoch": 43} {"train_loss": -5.551208019256592, "global_step": 7247, "epoch": 43} {"train_loss": -5.36799955368042, "global_step": 7248, "epoch": 43} {"train_loss": -5.375348091125488, "global_step": 7249, "epoch": 43} {"train_loss": -5.253715515136719, "global_step": 7250, "epoch": 43} {"train_loss": -5.143133163452148, "global_step": 7251, "epoch": 43} {"train_loss": -5.327028274536133, "global_step": 7252, "epoch": 43} {"train_loss": -5.1001057624816895, "global_step": 7253, "epoch": 43} {"train_loss": -5.376615047454834, "global_step": 7254, "epoch": 43} {"train_loss": -5.51732063293457, "global_step": 7255, "epoch": 43} {"train_loss": -5.394050598144531, "global_step": 7256, "epoch": 43} {"train_loss": -5.449891090393066, "global_step": 7257, "epoch": 43} {"train_loss": -5.354240894317627, "global_step": 7258, "epoch": 43} {"train_loss": -5.220625877380371, "global_step": 7259, "epoch": 43} {"train_loss": -5.234292030334473, "global_step": 7260, "epoch": 43} {"train_loss": -5.273486614227295, "global_step": 7261, "epoch": 43} {"train_loss": -5.352723598480225, "global_step": 7262, "epoch": 43} {"train_loss": -5.167448043823242, "global_step": 7263, "epoch": 43} {"train_loss": -5.537395477294922, "global_step": 7264, "epoch": 43} {"train_loss": -5.20280647277832, "global_step": 7265, "epoch": 43} {"train_loss": -5.1322922706604, "global_step": 7266, "epoch": 43} {"train_loss": -5.471449851989746, "global_step": 7267, "epoch": 43} {"train_loss": -5.461597442626953, "global_step": 7268, "epoch": 43} {"train_loss": -5.197287559509277, "global_step": 7269, "epoch": 43} {"train_loss": -5.114654064178467, "global_step": 7270, "epoch": 43} {"train_loss": -5.1080732345581055, "global_step": 7271, "epoch": 43} {"train_loss": -5.1808905601501465, "global_step": 7272, "epoch": 43} {"train_loss": -5.282027244567871, "global_step": 7273, "epoch": 43} {"train_loss": -5.248719215393066, "global_step": 7274, "epoch": 43} {"train_loss": -5.314533710479736, "global_step": 7275, "epoch": 43} {"train_loss": -5.142756462097168, "global_step": 7276, "epoch": 43} {"train_loss": -5.302178382873535, "global_step": 7277, "epoch": 43} {"train_loss": -5.185088157653809, "global_step": 7278, "epoch": 43} {"train_loss": -5.104987621307373, "global_step": 7279, "epoch": 43} {"train_loss": -5.098936080932617, "global_step": 7280, "epoch": 43} {"train_loss": -5.358842849731445, "global_step": 7281, "epoch": 43} {"train_loss": -5.335206031799316, "global_step": 7282, "epoch": 43} {"train_loss": -5.2615227699279785, "global_step": 7283, "epoch": 43} {"train_loss": -5.03758430480957, "global_step": 7284, "epoch": 43} {"train_loss": -5.035722255706787, "global_step": 7285, "epoch": 43} {"train_loss": -5.273155212402344, "global_step": 7286, "epoch": 43} {"train_loss": -5.374423027038574, "global_step": 7287, "epoch": 43} {"train_loss": -5.218656539916992, "global_step": 7288, "epoch": 43} {"train_loss": -5.402172565460205, "global_step": 7289, "epoch": 43} {"train_loss": -5.363880157470703, "global_step": 7290, "epoch": 43} {"train_loss": -5.50237512588501, "global_step": 7291, "epoch": 43} {"train_loss": -5.418335914611816, "global_step": 7292, "epoch": 43} {"train_loss": -5.365464687347412, "global_step": 7293, "epoch": 43} {"train_loss": -5.305377960205078, "global_step": 7294, "epoch": 43} {"train_loss": -5.422514915466309, "global_step": 7295, "epoch": 43} {"train_loss": -5.392608165740967, "global_step": 7296, "epoch": 43} {"train_loss": -5.3800272941589355, "global_step": 7297, "epoch": 43} {"train_loss": -5.505600452423096, "global_step": 7298, "epoch": 43} {"train_loss": -5.601041793823242, "global_step": 7299, "epoch": 43} {"train_loss": -5.615390777587891, "global_step": 7300, "epoch": 43} {"train_loss": -5.424171447753906, "global_step": 7301, "epoch": 43} {"train_loss": -5.2819504737854, "global_step": 7302, "epoch": 43} {"train_loss": -5.36380672454834, "global_step": 7303, "epoch": 43} {"train_loss": -5.7241621017456055, "global_step": 7304, "epoch": 43} {"train_loss": -5.5639448165893555, "global_step": 7305, "epoch": 43} {"train_loss": -5.544259548187256, "global_step": 7306, "epoch": 43} {"train_loss": -5.346352577209473, "global_step": 7307, "epoch": 43} {"train_loss": -5.606319427490234, "global_step": 7308, "epoch": 43} {"train_loss": -5.485235214233398, "global_step": 7309, "epoch": 43} {"train_loss": -5.388012886047363, "global_step": 7310, "epoch": 43} {"train_loss": -5.401636123657227, "global_step": 7311, "epoch": 43} {"train_loss": -5.254364490509033, "global_step": 7312, "epoch": 43} {"train_loss": -5.199290752410889, "global_step": 7313, "epoch": 43} {"train_loss": -5.292257308959961, "global_step": 7314, "epoch": 43} {"train_loss": -5.441441059112549, "global_step": 7315, "epoch": 43} {"train_loss": -5.221535682678223, "global_step": 7316, "epoch": 43} {"train_loss": -5.163697242736816, "global_step": 7317, "epoch": 43} {"train_loss": -5.309479236602783, "global_step": 7318, "epoch": 43} {"train_loss": -5.202264308929443, "global_step": 7319, "epoch": 43} {"train_loss": -5.490939140319824, "global_step": 7320, "epoch": 43} {"train_loss": -5.333675384521484, "global_step": 7321, "epoch": 43} {"train_loss": -5.210455894470215, "global_step": 7322, "epoch": 43} {"train_loss": -5.344034194946289, "global_step": 7323, "epoch": 43} {"train_loss": -5.511768341064453, "global_step": 7324, "epoch": 43} {"train_loss": -5.591945648193359, "global_step": 7325, "epoch": 43} {"train_loss": -5.384791374206543, "global_step": 7326, "epoch": 43} {"train_loss": -5.399408340454102, "global_step": 7327, "epoch": 43} {"train_loss": -5.531488418579102, "global_step": 7328, "epoch": 43} {"train_loss": -5.486067771911621, "global_step": 7329, "epoch": 43} {"train_loss": -5.294423580169678, "global_step": 7330, "epoch": 43} {"train_loss": -5.42165994644165, "global_step": 7331, "epoch": 43} {"train_loss": -5.224454879760742, "global_step": 7332, "epoch": 43} {"train_loss": -5.413887023925781, "global_step": 7333, "epoch": 43} {"train_loss": -5.287623405456543, "global_step": 7334, "epoch": 43} {"train_loss": -5.228025436401367, "global_step": 7335, "epoch": 43} {"train_loss": -5.488969802856445, "global_step": 7336, "epoch": 43} {"train_loss": -5.355292320251465, "global_step": 7337, "epoch": 43} {"train_loss": -5.284684658050537, "global_step": 7338, "epoch": 43} {"train_loss": -5.459221839904785, "global_step": 7339, "epoch": 43} {"train_loss": -5.088411331176758, "global_step": 7340, "epoch": 43} {"train_loss": -5.5339813232421875, "global_step": 7341, "epoch": 43} {"train_loss": -5.281435012817383, "global_step": 7342, "epoch": 43} {"train_loss": -5.398534774780273, "global_step": 7343, "epoch": 43} {"train_loss": -5.705848693847656, "global_step": 7344, "epoch": 43} {"train_loss": -5.395495414733887, "global_step": 7345, "epoch": 43} {"train_loss": -5.611120223999023, "global_step": 7346, "epoch": 43} {"train_loss": -5.42509126663208, "global_step": 7347, "epoch": 43} {"train_loss": -5.4872822761535645, "global_step": 7348, "epoch": 43} {"train_loss": -5.335980415344238, "global_step": 7349, "epoch": 43} {"train_loss": -5.2396745681762695, "global_step": 7350, "epoch": 43} {"train_loss": -5.366299629211426, "global_step": 7351, "epoch": 43} {"train_loss": -5.278392791748047, "global_step": 7352, "epoch": 43} {"train_loss": -5.44825553894043, "global_step": 7353, "epoch": 43} {"train_loss": -5.197516918182373, "global_step": 7354, "epoch": 43} {"train_loss": -5.251979351043701, "global_step": 7355, "epoch": 43} {"train_loss": -5.2644853591918945, "global_step": 7356, "epoch": 43} {"train_loss": -5.508062362670898, "global_step": 7357, "epoch": 43} {"train_loss": -5.510214805603027, "global_step": 7358, "epoch": 43} {"train_loss": -5.448213577270508, "global_step": 7359, "epoch": 43} {"train_loss": -5.224756240844727, "global_step": 7360, "epoch": 43} {"train_loss": -5.359006881713867, "global_step": 7361, "epoch": 43} {"train_loss": -5.558558464050293, "global_step": 7362, "epoch": 43} {"train_loss": -5.304117202758789, "global_step": 7363, "epoch": 43} {"train_loss": -5.491096496582031, "global_step": 7364, "epoch": 43} {"train_loss": -5.593508243560791, "global_step": 7365, "epoch": 43} {"train_loss": -5.506811141967773, "global_step": 7366, "epoch": 43} {"train_loss": -5.416429042816162, "global_step": 7367, "epoch": 43} {"train_loss": -5.4224042892456055, "global_step": 7368, "epoch": 43} {"train_loss": -5.362421035766602, "global_step": 7369, "epoch": 43} {"train_loss": -5.317810535430908, "global_step": 7370, "epoch": 43} {"train_loss": -5.638742446899414, "global_step": 7371, "epoch": 43} {"train_loss": -5.572368621826172, "global_step": 7372, "epoch": 43} {"train_loss": -5.7110137939453125, "global_step": 7373, "epoch": 43} {"train_loss": -5.161795616149902, "global_step": 7374, "epoch": 43} {"train_loss": -5.619739532470703, "global_step": 7375, "epoch": 43} {"train_loss": -5.394253253936768, "global_step": 7376, "epoch": 43} {"train_loss": -5.469598770141602, "global_step": 7377, "epoch": 43} {"train_loss": -5.451109886169434, "global_step": 7378, "epoch": 43} {"train_loss": -5.701850891113281, "global_step": 7379, "epoch": 43} {"train_loss": -5.402563095092773, "global_step": 7380, "epoch": 43} {"train_loss": -5.480604648590088, "global_step": 7381, "epoch": 43} {"train_loss": -5.39736270904541, "global_step": 7382, "epoch": 43} {"train_loss": -5.258585453033447, "global_step": 7383, "epoch": 43} {"train_loss": -5.503900051116943, "global_step": 7384, "epoch": 43} {"train_loss": -5.541164398193359, "global_step": 7385, "epoch": 43} {"train_loss": -5.2229461669921875, "global_step": 7386, "epoch": 43} {"train_loss": -5.229732513427734, "global_step": 7387, "epoch": 43} {"train_loss": -5.502664566040039, "global_step": 7388, "epoch": 43} {"train_loss": -5.327019691467285, "global_step": 7389, "epoch": 43} {"train_loss": -5.369728088378906, "global_step": 7390, "epoch": 43} {"train_loss": -5.357284069061279, "global_step": 7391, "epoch": 43, "val_loss": 285376.5625} {"train_loss": -5.0070295333862305, "global_step": 7392, "epoch": 44} {"train_loss": -5.1935906410217285, "global_step": 7393, "epoch": 44} {"train_loss": -5.472251892089844, "global_step": 7394, "epoch": 44} {"train_loss": -5.320627212524414, "global_step": 7395, "epoch": 44} {"train_loss": -5.490442276000977, "global_step": 7396, "epoch": 44} {"train_loss": -5.209288597106934, "global_step": 7397, "epoch": 44} {"train_loss": -5.369503974914551, "global_step": 7398, "epoch": 44} {"train_loss": -5.360966205596924, "global_step": 7399, "epoch": 44} {"train_loss": -5.116457939147949, "global_step": 7400, "epoch": 44} {"train_loss": -5.425629615783691, "global_step": 7401, "epoch": 44} {"train_loss": -5.350030899047852, "global_step": 7402, "epoch": 44} {"train_loss": -5.463270664215088, "global_step": 7403, "epoch": 44} {"train_loss": -5.447011947631836, "global_step": 7404, "epoch": 44} {"train_loss": -5.610966205596924, "global_step": 7405, "epoch": 44} {"train_loss": -5.568000316619873, "global_step": 7406, "epoch": 44} {"train_loss": -5.496084690093994, "global_step": 7407, "epoch": 44} {"train_loss": -5.3851094245910645, "global_step": 7408, "epoch": 44} {"train_loss": -5.159815788269043, "global_step": 7409, "epoch": 44} {"train_loss": -5.44459342956543, "global_step": 7410, "epoch": 44} {"train_loss": -5.4658427238464355, "global_step": 7411, "epoch": 44} {"train_loss": -5.444141864776611, "global_step": 7412, "epoch": 44} {"train_loss": -5.58438777923584, "global_step": 7413, "epoch": 44} {"train_loss": -5.274181365966797, "global_step": 7414, "epoch": 44} {"train_loss": -5.076476097106934, "global_step": 7415, "epoch": 44} {"train_loss": -5.465179443359375, "global_step": 7416, "epoch": 44} {"train_loss": -5.181907653808594, "global_step": 7417, "epoch": 44} {"train_loss": -5.445210933685303, "global_step": 7418, "epoch": 44} {"train_loss": -5.057693958282471, "global_step": 7419, "epoch": 44} {"train_loss": -5.345851421356201, "global_step": 7420, "epoch": 44} {"train_loss": -5.181629180908203, "global_step": 7421, "epoch": 44} {"train_loss": -5.064145088195801, "global_step": 7422, "epoch": 44} {"train_loss": -5.381314277648926, "global_step": 7423, "epoch": 44} {"train_loss": -5.116121292114258, "global_step": 7424, "epoch": 44} {"train_loss": -5.142759323120117, "global_step": 7425, "epoch": 44} {"train_loss": -5.480143070220947, "global_step": 7426, "epoch": 44} {"train_loss": -5.180029392242432, "global_step": 7427, "epoch": 44} {"train_loss": -5.359257221221924, "global_step": 7428, "epoch": 44} {"train_loss": -5.270316123962402, "global_step": 7429, "epoch": 44} {"train_loss": -5.229914665222168, "global_step": 7430, "epoch": 44} {"train_loss": -5.389644622802734, "global_step": 7431, "epoch": 44} {"train_loss": -5.224012851715088, "global_step": 7432, "epoch": 44} {"train_loss": -5.100090980529785, "global_step": 7433, "epoch": 44} {"train_loss": -5.103072643280029, "global_step": 7434, "epoch": 44} {"train_loss": -5.41801118850708, "global_step": 7435, "epoch": 44} {"train_loss": -5.719829559326172, "global_step": 7436, "epoch": 44} {"train_loss": -5.568483829498291, "global_step": 7437, "epoch": 44} {"train_loss": -5.499634742736816, "global_step": 7438, "epoch": 44} {"train_loss": -5.434913158416748, "global_step": 7439, "epoch": 44} {"train_loss": -5.5429229736328125, "global_step": 7440, "epoch": 44} {"train_loss": -5.6730570793151855, "global_step": 7441, "epoch": 44} {"train_loss": -5.584262371063232, "global_step": 7442, "epoch": 44} {"train_loss": -5.29240083694458, "global_step": 7443, "epoch": 44} {"train_loss": -5.317464828491211, "global_step": 7444, "epoch": 44} {"train_loss": -5.431891441345215, "global_step": 7445, "epoch": 44} {"train_loss": -5.229092597961426, "global_step": 7446, "epoch": 44} {"train_loss": -5.143683433532715, "global_step": 7447, "epoch": 44} {"train_loss": -5.555200099945068, "global_step": 7448, "epoch": 44} {"train_loss": -5.287563323974609, "global_step": 7449, "epoch": 44} {"train_loss": -5.392736911773682, "global_step": 7450, "epoch": 44} {"train_loss": -5.443538665771484, "global_step": 7451, "epoch": 44} {"train_loss": -5.29892635345459, "global_step": 7452, "epoch": 44} {"train_loss": -5.504504680633545, "global_step": 7453, "epoch": 44} {"train_loss": -5.2621002197265625, "global_step": 7454, "epoch": 44} {"train_loss": -5.291269302368164, "global_step": 7455, "epoch": 44} {"train_loss": -5.450397968292236, "global_step": 7456, "epoch": 44} {"train_loss": -5.367358207702637, "global_step": 7457, "epoch": 44} {"train_loss": -5.508780002593994, "global_step": 7458, "epoch": 44} {"train_loss": -5.413978576660156, "global_step": 7459, "epoch": 44} {"train_loss": -5.504494667053223, "global_step": 7460, "epoch": 44} {"train_loss": -5.427608013153076, "global_step": 7461, "epoch": 44} {"train_loss": -5.369651794433594, "global_step": 7462, "epoch": 44} {"train_loss": -5.464975833892822, "global_step": 7463, "epoch": 44} {"train_loss": -5.414898872375488, "global_step": 7464, "epoch": 44} {"train_loss": -5.566268444061279, "global_step": 7465, "epoch": 44} {"train_loss": -5.228135585784912, "global_step": 7466, "epoch": 44} {"train_loss": -5.6300482749938965, "global_step": 7467, "epoch": 44} {"train_loss": -5.759435176849365, "global_step": 7468, "epoch": 44} {"train_loss": -5.566076755523682, "global_step": 7469, "epoch": 44} {"train_loss": -5.305800914764404, "global_step": 7470, "epoch": 44} {"train_loss": -5.409740447998047, "global_step": 7471, "epoch": 44} {"train_loss": -5.282365798950195, "global_step": 7472, "epoch": 44} {"train_loss": -5.340660095214844, "global_step": 7473, "epoch": 44} {"train_loss": -5.343442916870117, "global_step": 7474, "epoch": 44} {"train_loss": -5.376072883605957, "global_step": 7475, "epoch": 44} {"train_loss": -5.332244873046875, "global_step": 7476, "epoch": 44} {"train_loss": -5.575436592102051, "global_step": 7477, "epoch": 44} {"train_loss": -5.628929138183594, "global_step": 7478, "epoch": 44} {"train_loss": -5.3095526695251465, "global_step": 7479, "epoch": 44} {"train_loss": -5.437079429626465, "global_step": 7480, "epoch": 44} {"train_loss": -5.668412685394287, "global_step": 7481, "epoch": 44} {"train_loss": -5.170083999633789, "global_step": 7482, "epoch": 44} {"train_loss": -5.337957382202148, "global_step": 7483, "epoch": 44} {"train_loss": -5.327996730804443, "global_step": 7484, "epoch": 44} {"train_loss": -5.2908220291137695, "global_step": 7485, "epoch": 44} {"train_loss": -5.196636199951172, "global_step": 7486, "epoch": 44} {"train_loss": -5.416955947875977, "global_step": 7487, "epoch": 44} {"train_loss": -5.384252548217773, "global_step": 7488, "epoch": 44} {"train_loss": -5.113615036010742, "global_step": 7489, "epoch": 44} {"train_loss": -5.582244873046875, "global_step": 7490, "epoch": 44} {"train_loss": -5.461592674255371, "global_step": 7491, "epoch": 44} {"train_loss": -5.60873556137085, "global_step": 7492, "epoch": 44} {"train_loss": -5.636899471282959, "global_step": 7493, "epoch": 44} {"train_loss": -5.451539039611816, "global_step": 7494, "epoch": 44} {"train_loss": -5.293464660644531, "global_step": 7495, "epoch": 44} {"train_loss": -5.373936653137207, "global_step": 7496, "epoch": 44} {"train_loss": -5.471733093261719, "global_step": 7497, "epoch": 44} {"train_loss": -5.468243598937988, "global_step": 7498, "epoch": 44} {"train_loss": -5.421365261077881, "global_step": 7499, "epoch": 44} {"train_loss": -5.291038513183594, "global_step": 7500, "epoch": 44} {"train_loss": -5.52598762512207, "global_step": 7501, "epoch": 44} {"train_loss": -5.35790491104126, "global_step": 7502, "epoch": 44} {"train_loss": -5.400722503662109, "global_step": 7503, "epoch": 44} {"train_loss": -5.567050933837891, "global_step": 7504, "epoch": 44} {"train_loss": -5.621166229248047, "global_step": 7505, "epoch": 44} {"train_loss": -5.741140365600586, "global_step": 7506, "epoch": 44} {"train_loss": -5.5120391845703125, "global_step": 7507, "epoch": 44} {"train_loss": -5.671368598937988, "global_step": 7508, "epoch": 44} {"train_loss": -5.420997142791748, "global_step": 7509, "epoch": 44} {"train_loss": -5.433826923370361, "global_step": 7510, "epoch": 44} {"train_loss": -5.435357093811035, "global_step": 7511, "epoch": 44} {"train_loss": -5.451683521270752, "global_step": 7512, "epoch": 44} {"train_loss": -5.268164157867432, "global_step": 7513, "epoch": 44} {"train_loss": -5.611313819885254, "global_step": 7514, "epoch": 44} {"train_loss": -5.231941223144531, "global_step": 7515, "epoch": 44} {"train_loss": -5.403817653656006, "global_step": 7516, "epoch": 44} {"train_loss": -5.471855163574219, "global_step": 7517, "epoch": 44} {"train_loss": -5.245638847351074, "global_step": 7518, "epoch": 44} {"train_loss": -5.492788791656494, "global_step": 7519, "epoch": 44} {"train_loss": -5.148711681365967, "global_step": 7520, "epoch": 44} {"train_loss": -5.381370544433594, "global_step": 7521, "epoch": 44} {"train_loss": -5.157046318054199, "global_step": 7522, "epoch": 44} {"train_loss": -5.191184997558594, "global_step": 7523, "epoch": 44} {"train_loss": -5.268514156341553, "global_step": 7524, "epoch": 44} {"train_loss": -5.198522567749023, "global_step": 7525, "epoch": 44} {"train_loss": -5.561131954193115, "global_step": 7526, "epoch": 44} {"train_loss": -5.309718132019043, "global_step": 7527, "epoch": 44} {"train_loss": -5.321621894836426, "global_step": 7528, "epoch": 44} {"train_loss": -5.453031063079834, "global_step": 7529, "epoch": 44} {"train_loss": -5.218795299530029, "global_step": 7530, "epoch": 44} {"train_loss": -5.269227504730225, "global_step": 7531, "epoch": 44} {"train_loss": -5.192470550537109, "global_step": 7532, "epoch": 44} {"train_loss": -5.446874141693115, "global_step": 7533, "epoch": 44} {"train_loss": -5.582215785980225, "global_step": 7534, "epoch": 44} {"train_loss": -5.078486442565918, "global_step": 7535, "epoch": 44} {"train_loss": -5.135114669799805, "global_step": 7536, "epoch": 44} {"train_loss": -5.176346302032471, "global_step": 7537, "epoch": 44} {"train_loss": -5.361114978790283, "global_step": 7538, "epoch": 44} {"train_loss": -5.146559715270996, "global_step": 7539, "epoch": 44} {"train_loss": -5.54950475692749, "global_step": 7540, "epoch": 44} {"train_loss": -5.38128662109375, "global_step": 7541, "epoch": 44} {"train_loss": -5.075037002563477, "global_step": 7542, "epoch": 44} {"train_loss": -5.553023338317871, "global_step": 7543, "epoch": 44} {"train_loss": -5.202845573425293, "global_step": 7544, "epoch": 44} {"train_loss": -5.403524398803711, "global_step": 7545, "epoch": 44} {"train_loss": -5.183824062347412, "global_step": 7546, "epoch": 44} {"train_loss": -5.1069440841674805, "global_step": 7547, "epoch": 44} {"train_loss": -5.612365245819092, "global_step": 7548, "epoch": 44} {"train_loss": -5.250786781311035, "global_step": 7549, "epoch": 44} {"train_loss": -5.375299453735352, "global_step": 7550, "epoch": 44} {"train_loss": -5.392195701599121, "global_step": 7551, "epoch": 44} {"train_loss": -5.082204341888428, "global_step": 7552, "epoch": 44} {"train_loss": -5.523547172546387, "global_step": 7553, "epoch": 44} {"train_loss": -5.306545257568359, "global_step": 7554, "epoch": 44} {"train_loss": -5.2720842361450195, "global_step": 7555, "epoch": 44} {"train_loss": -5.535708904266357, "global_step": 7556, "epoch": 44} {"train_loss": -5.372163772583008, "global_step": 7557, "epoch": 44} {"train_loss": -5.528221130371094, "global_step": 7558, "epoch": 44} {"train_loss": -5.374603223232996, "global_step": 7559, "epoch": 44, "val_loss": 279643.15625} {"train_loss": -5.423073768615723, "global_step": 7560, "epoch": 45} {"train_loss": -5.639662742614746, "global_step": 7561, "epoch": 45} {"train_loss": -5.2447381019592285, "global_step": 7562, "epoch": 45} {"train_loss": -5.458107948303223, "global_step": 7563, "epoch": 45} {"train_loss": -5.516107559204102, "global_step": 7564, "epoch": 45} {"train_loss": -5.193386077880859, "global_step": 7565, "epoch": 45} {"train_loss": -5.256125450134277, "global_step": 7566, "epoch": 45} {"train_loss": -5.335974216461182, "global_step": 7567, "epoch": 45} {"train_loss": -5.301870346069336, "global_step": 7568, "epoch": 45} {"train_loss": -5.8182525634765625, "global_step": 7569, "epoch": 45} {"train_loss": -5.432681083679199, "global_step": 7570, "epoch": 45} {"train_loss": -5.527902603149414, "global_step": 7571, "epoch": 45} {"train_loss": -5.62055778503418, "global_step": 7572, "epoch": 45} {"train_loss": -5.5857062339782715, "global_step": 7573, "epoch": 45} {"train_loss": -5.823480606079102, "global_step": 7574, "epoch": 45} {"train_loss": -5.506895065307617, "global_step": 7575, "epoch": 45} {"train_loss": -5.3765997886657715, "global_step": 7576, "epoch": 45} {"train_loss": -5.557900428771973, "global_step": 7577, "epoch": 45} {"train_loss": -5.297821998596191, "global_step": 7578, "epoch": 45} {"train_loss": -5.539761066436768, "global_step": 7579, "epoch": 45} {"train_loss": -5.409508228302002, "global_step": 7580, "epoch": 45} {"train_loss": -5.813387870788574, "global_step": 7581, "epoch": 45} {"train_loss": -5.600725173950195, "global_step": 7582, "epoch": 45} {"train_loss": -5.490776538848877, "global_step": 7583, "epoch": 45} {"train_loss": -5.6869354248046875, "global_step": 7584, "epoch": 45} {"train_loss": -5.679744720458984, "global_step": 7585, "epoch": 45} {"train_loss": -5.734429836273193, "global_step": 7586, "epoch": 45} {"train_loss": -5.43817663192749, "global_step": 7587, "epoch": 45} {"train_loss": -5.630763053894043, "global_step": 7588, "epoch": 45} {"train_loss": -5.458339214324951, "global_step": 7589, "epoch": 45} {"train_loss": -5.383845329284668, "global_step": 7590, "epoch": 45} {"train_loss": -5.4548540115356445, "global_step": 7591, "epoch": 45} {"train_loss": -5.510510444641113, "global_step": 7592, "epoch": 45} {"train_loss": -5.624044418334961, "global_step": 7593, "epoch": 45} {"train_loss": -5.672621250152588, "global_step": 7594, "epoch": 45} {"train_loss": -5.515478134155273, "global_step": 7595, "epoch": 45} {"train_loss": -5.455625534057617, "global_step": 7596, "epoch": 45} {"train_loss": -5.462646484375, "global_step": 7597, "epoch": 45} {"train_loss": -5.456268310546875, "global_step": 7598, "epoch": 45} {"train_loss": -5.3748273849487305, "global_step": 7599, "epoch": 45} {"train_loss": -5.613135814666748, "global_step": 7600, "epoch": 45} {"train_loss": -5.436232566833496, "global_step": 7601, "epoch": 45} {"train_loss": -5.654021739959717, "global_step": 7602, "epoch": 45} {"train_loss": -5.52555513381958, "global_step": 7603, "epoch": 45} {"train_loss": -5.673098564147949, "global_step": 7604, "epoch": 45} {"train_loss": -5.451999664306641, "global_step": 7605, "epoch": 45} {"train_loss": -5.423069000244141, "global_step": 7606, "epoch": 45} {"train_loss": -5.51327657699585, "global_step": 7607, "epoch": 45} {"train_loss": -5.267742156982422, "global_step": 7608, "epoch": 45} {"train_loss": -5.587306022644043, "global_step": 7609, "epoch": 45} {"train_loss": -5.71388053894043, "global_step": 7610, "epoch": 45} {"train_loss": -5.673750877380371, "global_step": 7611, "epoch": 45} {"train_loss": -5.457573890686035, "global_step": 7612, "epoch": 45} {"train_loss": -5.558322429656982, "global_step": 7613, "epoch": 45} {"train_loss": -5.732807159423828, "global_step": 7614, "epoch": 45} {"train_loss": -5.332569599151611, "global_step": 7615, "epoch": 45} {"train_loss": -5.629386901855469, "global_step": 7616, "epoch": 45} {"train_loss": -5.390527248382568, "global_step": 7617, "epoch": 45} {"train_loss": -5.795680999755859, "global_step": 7618, "epoch": 45} {"train_loss": -5.326549053192139, "global_step": 7619, "epoch": 45} {"train_loss": -5.581489562988281, "global_step": 7620, "epoch": 45} {"train_loss": -5.338046073913574, "global_step": 7621, "epoch": 45} {"train_loss": -5.289597511291504, "global_step": 7622, "epoch": 45} {"train_loss": -5.173214912414551, "global_step": 7623, "epoch": 45} {"train_loss": -5.373456954956055, "global_step": 7624, "epoch": 45} {"train_loss": -5.598964691162109, "global_step": 7625, "epoch": 45} {"train_loss": -5.124073505401611, "global_step": 7626, "epoch": 45} {"train_loss": -5.293176174163818, "global_step": 7627, "epoch": 45} {"train_loss": -5.0936479568481445, "global_step": 7628, "epoch": 45} {"train_loss": -5.401080131530762, "global_step": 7629, "epoch": 45} {"train_loss": -5.305022239685059, "global_step": 7630, "epoch": 45} {"train_loss": -5.157533645629883, "global_step": 7631, "epoch": 45} {"train_loss": -5.128495693206787, "global_step": 7632, "epoch": 45} {"train_loss": -5.227083206176758, "global_step": 7633, "epoch": 45} {"train_loss": -5.378450393676758, "global_step": 7634, "epoch": 45} {"train_loss": -5.034485816955566, "global_step": 7635, "epoch": 45} {"train_loss": -5.5343017578125, "global_step": 7636, "epoch": 45} {"train_loss": -5.308159828186035, "global_step": 7637, "epoch": 45} {"train_loss": -5.467192649841309, "global_step": 7638, "epoch": 45} {"train_loss": -5.699112892150879, "global_step": 7639, "epoch": 45} {"train_loss": -5.443355560302734, "global_step": 7640, "epoch": 45} {"train_loss": -5.381062030792236, "global_step": 7641, "epoch": 45} {"train_loss": -5.595271587371826, "global_step": 7642, "epoch": 45} {"train_loss": -5.798340797424316, "global_step": 7643, "epoch": 45} {"train_loss": -5.509171485900879, "global_step": 7644, "epoch": 45} {"train_loss": -5.5894999504089355, "global_step": 7645, "epoch": 45} {"train_loss": -5.338814735412598, "global_step": 7646, "epoch": 45} {"train_loss": -5.261900424957275, "global_step": 7647, "epoch": 45} {"train_loss": -5.562502861022949, "global_step": 7648, "epoch": 45} {"train_loss": -5.336794853210449, "global_step": 7649, "epoch": 45} {"train_loss": -5.751969814300537, "global_step": 7650, "epoch": 45} {"train_loss": -5.073791980743408, "global_step": 7651, "epoch": 45} {"train_loss": -5.435928821563721, "global_step": 7652, "epoch": 45} {"train_loss": -5.021542549133301, "global_step": 7653, "epoch": 45} {"train_loss": -5.309444427490234, "global_step": 7654, "epoch": 45} {"train_loss": -5.594149589538574, "global_step": 7655, "epoch": 45} {"train_loss": -5.277847766876221, "global_step": 7656, "epoch": 45} {"train_loss": -5.570367813110352, "global_step": 7657, "epoch": 45} {"train_loss": -5.2690110206604, "global_step": 7658, "epoch": 45} {"train_loss": -5.4023566246032715, "global_step": 7659, "epoch": 45} {"train_loss": -5.37373685836792, "global_step": 7660, "epoch": 45} {"train_loss": -5.384596824645996, "global_step": 7661, "epoch": 45} {"train_loss": -5.384480953216553, "global_step": 7662, "epoch": 45} {"train_loss": -5.655547618865967, "global_step": 7663, "epoch": 45} {"train_loss": -5.542701721191406, "global_step": 7664, "epoch": 45} {"train_loss": -5.453914642333984, "global_step": 7665, "epoch": 45} {"train_loss": -5.227574825286865, "global_step": 7666, "epoch": 45} {"train_loss": -5.678419589996338, "global_step": 7667, "epoch": 45} {"train_loss": -5.367453575134277, "global_step": 7668, "epoch": 45} {"train_loss": -5.2331037521362305, "global_step": 7669, "epoch": 45} {"train_loss": -5.524547576904297, "global_step": 7670, "epoch": 45} {"train_loss": -5.484607696533203, "global_step": 7671, "epoch": 45} {"train_loss": -5.455660343170166, "global_step": 7672, "epoch": 45} {"train_loss": -5.564245700836182, "global_step": 7673, "epoch": 45} {"train_loss": -5.545090675354004, "global_step": 7674, "epoch": 45} {"train_loss": -5.506757736206055, "global_step": 7675, "epoch": 45} {"train_loss": -5.45412015914917, "global_step": 7676, "epoch": 45} {"train_loss": -5.682347774505615, "global_step": 7677, "epoch": 45} {"train_loss": -5.465279579162598, "global_step": 7678, "epoch": 45} {"train_loss": -5.385133266448975, "global_step": 7679, "epoch": 45} {"train_loss": -5.252636909484863, "global_step": 7680, "epoch": 45} {"train_loss": -5.588361740112305, "global_step": 7681, "epoch": 45} {"train_loss": -5.373201370239258, "global_step": 7682, "epoch": 45} {"train_loss": -5.4090800285339355, "global_step": 7683, "epoch": 45} {"train_loss": -5.353545188903809, "global_step": 7684, "epoch": 45} {"train_loss": -5.55252742767334, "global_step": 7685, "epoch": 45} {"train_loss": -5.545940399169922, "global_step": 7686, "epoch": 45} {"train_loss": -5.313612937927246, "global_step": 7687, "epoch": 45} {"train_loss": -5.595478534698486, "global_step": 7688, "epoch": 45} {"train_loss": -5.537275791168213, "global_step": 7689, "epoch": 45} {"train_loss": -5.515726566314697, "global_step": 7690, "epoch": 45} {"train_loss": -5.348362922668457, "global_step": 7691, "epoch": 45} {"train_loss": -5.4225921630859375, "global_step": 7692, "epoch": 45} {"train_loss": -5.500033855438232, "global_step": 7693, "epoch": 45} {"train_loss": -5.298912525177002, "global_step": 7694, "epoch": 45} {"train_loss": -5.851110935211182, "global_step": 7695, "epoch": 45} {"train_loss": -5.357071399688721, "global_step": 7696, "epoch": 45} {"train_loss": -5.317582130432129, "global_step": 7697, "epoch": 45} {"train_loss": -5.661868095397949, "global_step": 7698, "epoch": 45} {"train_loss": -5.48140811920166, "global_step": 7699, "epoch": 45} {"train_loss": -5.5321760177612305, "global_step": 7700, "epoch": 45} {"train_loss": -5.430170059204102, "global_step": 7701, "epoch": 45} {"train_loss": -5.472938537597656, "global_step": 7702, "epoch": 45} {"train_loss": -5.391280174255371, "global_step": 7703, "epoch": 45} {"train_loss": -5.4811530113220215, "global_step": 7704, "epoch": 45} {"train_loss": -5.482567310333252, "global_step": 7705, "epoch": 45} {"train_loss": -5.392368316650391, "global_step": 7706, "epoch": 45} {"train_loss": -5.4252166748046875, "global_step": 7707, "epoch": 45} {"train_loss": -5.799716949462891, "global_step": 7708, "epoch": 45} {"train_loss": -5.475689888000488, "global_step": 7709, "epoch": 45} {"train_loss": -5.579672813415527, "global_step": 7710, "epoch": 45} {"train_loss": -5.568453788757324, "global_step": 7711, "epoch": 45} {"train_loss": -5.47477912902832, "global_step": 7712, "epoch": 45} {"train_loss": -5.4657392501831055, "global_step": 7713, "epoch": 45} {"train_loss": -5.307126998901367, "global_step": 7714, "epoch": 45} {"train_loss": -5.7036824226379395, "global_step": 7715, "epoch": 45} {"train_loss": -5.482250690460205, "global_step": 7716, "epoch": 45} {"train_loss": -5.264482498168945, "global_step": 7717, "epoch": 45} {"train_loss": -5.541767120361328, "global_step": 7718, "epoch": 45} {"train_loss": -5.38266658782959, "global_step": 7719, "epoch": 45} {"train_loss": -5.649374961853027, "global_step": 7720, "epoch": 45} {"train_loss": -5.048758506774902, "global_step": 7721, "epoch": 45} {"train_loss": -5.350157737731934, "global_step": 7722, "epoch": 45} {"train_loss": -5.461475372314453, "global_step": 7723, "epoch": 45} {"train_loss": -5.529488563537598, "global_step": 7724, "epoch": 45} {"train_loss": -5.703680038452148, "global_step": 7725, "epoch": 45} {"train_loss": -5.565491676330566, "global_step": 7726, "epoch": 45} {"train_loss": -5.466593004408336, "global_step": 7727, "epoch": 45, "val_loss": 273395.375, "train_action_mse_error": 48.408294677734375} {"train_loss": -5.63746452331543, "global_step": 7728, "epoch": 46} {"train_loss": -5.534084320068359, "global_step": 7729, "epoch": 46} {"train_loss": -5.235832214355469, "global_step": 7730, "epoch": 46} {"train_loss": -5.58070182800293, "global_step": 7731, "epoch": 46} {"train_loss": -5.526744842529297, "global_step": 7732, "epoch": 46} {"train_loss": -5.409370422363281, "global_step": 7733, "epoch": 46} {"train_loss": -5.314157009124756, "global_step": 7734, "epoch": 46} {"train_loss": -5.561323642730713, "global_step": 7735, "epoch": 46} {"train_loss": -5.502558708190918, "global_step": 7736, "epoch": 46} {"train_loss": -5.34408712387085, "global_step": 7737, "epoch": 46} {"train_loss": -5.244985103607178, "global_step": 7738, "epoch": 46} {"train_loss": -5.271932125091553, "global_step": 7739, "epoch": 46} {"train_loss": -5.576750755310059, "global_step": 7740, "epoch": 46} {"train_loss": -5.4057464599609375, "global_step": 7741, "epoch": 46} {"train_loss": -5.510907173156738, "global_step": 7742, "epoch": 46} {"train_loss": -5.225583553314209, "global_step": 7743, "epoch": 46} {"train_loss": -5.458578109741211, "global_step": 7744, "epoch": 46} {"train_loss": -5.52329683303833, "global_step": 7745, "epoch": 46} {"train_loss": -5.380288124084473, "global_step": 7746, "epoch": 46} {"train_loss": -5.203968524932861, "global_step": 7747, "epoch": 46} {"train_loss": -5.328301906585693, "global_step": 7748, "epoch": 46} {"train_loss": -5.506953239440918, "global_step": 7749, "epoch": 46} {"train_loss": -5.434423446655273, "global_step": 7750, "epoch": 46} {"train_loss": -5.451365947723389, "global_step": 7751, "epoch": 46} {"train_loss": -5.534558296203613, "global_step": 7752, "epoch": 46} {"train_loss": -5.433226585388184, "global_step": 7753, "epoch": 46} {"train_loss": -5.406648635864258, "global_step": 7754, "epoch": 46} {"train_loss": -5.306235313415527, "global_step": 7755, "epoch": 46} {"train_loss": -5.624412536621094, "global_step": 7756, "epoch": 46} {"train_loss": -5.357542514801025, "global_step": 7757, "epoch": 46} {"train_loss": -5.118706226348877, "global_step": 7758, "epoch": 46} {"train_loss": -5.397158622741699, "global_step": 7759, "epoch": 46} {"train_loss": -5.611601829528809, "global_step": 7760, "epoch": 46} {"train_loss": -5.281137466430664, "global_step": 7761, "epoch": 46} {"train_loss": -5.406681060791016, "global_step": 7762, "epoch": 46} {"train_loss": -5.319780349731445, "global_step": 7763, "epoch": 46} {"train_loss": -5.311830520629883, "global_step": 7764, "epoch": 46} {"train_loss": -5.253479957580566, "global_step": 7765, "epoch": 46} {"train_loss": -5.465429306030273, "global_step": 7766, "epoch": 46} {"train_loss": -5.263847827911377, "global_step": 7767, "epoch": 46} {"train_loss": -5.239595413208008, "global_step": 7768, "epoch": 46} {"train_loss": -5.3211846351623535, "global_step": 7769, "epoch": 46} {"train_loss": -5.3954315185546875, "global_step": 7770, "epoch": 46} {"train_loss": -5.405482769012451, "global_step": 7771, "epoch": 46} {"train_loss": -5.265567302703857, "global_step": 7772, "epoch": 46} {"train_loss": -5.261891841888428, "global_step": 7773, "epoch": 46} {"train_loss": -5.528987884521484, "global_step": 7774, "epoch": 46} {"train_loss": -5.623183250427246, "global_step": 7775, "epoch": 46} {"train_loss": -5.253043174743652, "global_step": 7776, "epoch": 46} {"train_loss": -5.294092655181885, "global_step": 7777, "epoch": 46} {"train_loss": -5.230103969573975, "global_step": 7778, "epoch": 46} {"train_loss": -5.552061557769775, "global_step": 7779, "epoch": 46} {"train_loss": -5.484806537628174, "global_step": 7780, "epoch": 46} {"train_loss": -5.475884437561035, "global_step": 7781, "epoch": 46} {"train_loss": -5.367464065551758, "global_step": 7782, "epoch": 46} {"train_loss": -5.586279392242432, "global_step": 7783, "epoch": 46} {"train_loss": -5.6542277336120605, "global_step": 7784, "epoch": 46} {"train_loss": -5.557904243469238, "global_step": 7785, "epoch": 46} {"train_loss": -5.408476829528809, "global_step": 7786, "epoch": 46} {"train_loss": -5.5305705070495605, "global_step": 7787, "epoch": 46} {"train_loss": -5.368282794952393, "global_step": 7788, "epoch": 46} {"train_loss": -5.614987850189209, "global_step": 7789, "epoch": 46} {"train_loss": -5.421781539916992, "global_step": 7790, "epoch": 46} {"train_loss": -5.456896781921387, "global_step": 7791, "epoch": 46} {"train_loss": -5.255213737487793, "global_step": 7792, "epoch": 46} {"train_loss": -5.433899879455566, "global_step": 7793, "epoch": 46} {"train_loss": -5.440889358520508, "global_step": 7794, "epoch": 46} {"train_loss": -5.217810153961182, "global_step": 7795, "epoch": 46} {"train_loss": -5.509726524353027, "global_step": 7796, "epoch": 46} {"train_loss": -5.286077976226807, "global_step": 7797, "epoch": 46} {"train_loss": -5.549567699432373, "global_step": 7798, "epoch": 46} {"train_loss": -5.53508186340332, "global_step": 7799, "epoch": 46} {"train_loss": -5.319186210632324, "global_step": 7800, "epoch": 46} {"train_loss": -5.622460842132568, "global_step": 7801, "epoch": 46} {"train_loss": -5.565452575683594, "global_step": 7802, "epoch": 46} {"train_loss": -5.229070663452148, "global_step": 7803, "epoch": 46} {"train_loss": -5.431573390960693, "global_step": 7804, "epoch": 46} {"train_loss": -5.396993637084961, "global_step": 7805, "epoch": 46} {"train_loss": -5.580732345581055, "global_step": 7806, "epoch": 46} {"train_loss": -5.519223213195801, "global_step": 7807, "epoch": 46} {"train_loss": -5.392322063446045, "global_step": 7808, "epoch": 46} {"train_loss": -5.592066764831543, "global_step": 7809, "epoch": 46} {"train_loss": -5.487998962402344, "global_step": 7810, "epoch": 46} {"train_loss": -5.194786071777344, "global_step": 7811, "epoch": 46} {"train_loss": -5.761566638946533, "global_step": 7812, "epoch": 46} {"train_loss": -5.559663772583008, "global_step": 7813, "epoch": 46} {"train_loss": -5.232173442840576, "global_step": 7814, "epoch": 46} {"train_loss": -5.393827438354492, "global_step": 7815, "epoch": 46} {"train_loss": -5.600126266479492, "global_step": 7816, "epoch": 46} {"train_loss": -5.459954261779785, "global_step": 7817, "epoch": 46} {"train_loss": -5.546106338500977, "global_step": 7818, "epoch": 46} {"train_loss": -5.475025653839111, "global_step": 7819, "epoch": 46} {"train_loss": -5.506705284118652, "global_step": 7820, "epoch": 46} {"train_loss": -5.514713764190674, "global_step": 7821, "epoch": 46} {"train_loss": -5.702329635620117, "global_step": 7822, "epoch": 46} {"train_loss": -5.701541900634766, "global_step": 7823, "epoch": 46} {"train_loss": -5.49803352355957, "global_step": 7824, "epoch": 46} {"train_loss": -5.435497283935547, "global_step": 7825, "epoch": 46} {"train_loss": -5.546867847442627, "global_step": 7826, "epoch": 46} {"train_loss": -5.3429436683654785, "global_step": 7827, "epoch": 46} {"train_loss": -5.52370548248291, "global_step": 7828, "epoch": 46} {"train_loss": -5.673436164855957, "global_step": 7829, "epoch": 46} {"train_loss": -5.239480972290039, "global_step": 7830, "epoch": 46} {"train_loss": -5.510985374450684, "global_step": 7831, "epoch": 46} {"train_loss": -5.754199028015137, "global_step": 7832, "epoch": 46} {"train_loss": -5.568693161010742, "global_step": 7833, "epoch": 46} {"train_loss": -5.713875770568848, "global_step": 7834, "epoch": 46} {"train_loss": -5.448718070983887, "global_step": 7835, "epoch": 46} {"train_loss": -5.4123430252075195, "global_step": 7836, "epoch": 46} {"train_loss": -5.271538257598877, "global_step": 7837, "epoch": 46} {"train_loss": -5.485190391540527, "global_step": 7838, "epoch": 46} {"train_loss": -5.025481224060059, "global_step": 7839, "epoch": 46} {"train_loss": -5.69647216796875, "global_step": 7840, "epoch": 46} {"train_loss": -5.459683418273926, "global_step": 7841, "epoch": 46} {"train_loss": -5.695932388305664, "global_step": 7842, "epoch": 46} {"train_loss": -5.524837970733643, "global_step": 7843, "epoch": 46} {"train_loss": -5.527864456176758, "global_step": 7844, "epoch": 46} {"train_loss": -5.529045581817627, "global_step": 7845, "epoch": 46} {"train_loss": -5.294103622436523, "global_step": 7846, "epoch": 46} {"train_loss": -5.437416076660156, "global_step": 7847, "epoch": 46} {"train_loss": -5.399198532104492, "global_step": 7848, "epoch": 46} {"train_loss": -5.479033946990967, "global_step": 7849, "epoch": 46} {"train_loss": -5.412457466125488, "global_step": 7850, "epoch": 46} {"train_loss": -5.470214366912842, "global_step": 7851, "epoch": 46} {"train_loss": -5.293740272521973, "global_step": 7852, "epoch": 46} {"train_loss": -5.660399436950684, "global_step": 7853, "epoch": 46} {"train_loss": -5.649609088897705, "global_step": 7854, "epoch": 46} {"train_loss": -5.431105613708496, "global_step": 7855, "epoch": 46} {"train_loss": -5.333892822265625, "global_step": 7856, "epoch": 46} {"train_loss": -5.492316246032715, "global_step": 7857, "epoch": 46} {"train_loss": -5.617922782897949, "global_step": 7858, "epoch": 46} {"train_loss": -5.247058868408203, "global_step": 7859, "epoch": 46} {"train_loss": -5.695568084716797, "global_step": 7860, "epoch": 46} {"train_loss": -5.468062400817871, "global_step": 7861, "epoch": 46} {"train_loss": -5.2856221199035645, "global_step": 7862, "epoch": 46} {"train_loss": -5.623593330383301, "global_step": 7863, "epoch": 46} {"train_loss": -5.221611976623535, "global_step": 7864, "epoch": 46} {"train_loss": -5.4828596115112305, "global_step": 7865, "epoch": 46} {"train_loss": -5.506950378417969, "global_step": 7866, "epoch": 46} {"train_loss": -5.351238250732422, "global_step": 7867, "epoch": 46} {"train_loss": -5.123105049133301, "global_step": 7868, "epoch": 46} {"train_loss": -5.160504341125488, "global_step": 7869, "epoch": 46} {"train_loss": -5.302838325500488, "global_step": 7870, "epoch": 46} {"train_loss": -5.463382720947266, "global_step": 7871, "epoch": 46} {"train_loss": -5.427071571350098, "global_step": 7872, "epoch": 46} {"train_loss": -5.245279312133789, "global_step": 7873, "epoch": 46} {"train_loss": -5.384668350219727, "global_step": 7874, "epoch": 46} {"train_loss": -5.043831825256348, "global_step": 7875, "epoch": 46} {"train_loss": -5.407067775726318, "global_step": 7876, "epoch": 46} {"train_loss": -5.1844377517700195, "global_step": 7877, "epoch": 46} {"train_loss": -5.39029598236084, "global_step": 7878, "epoch": 46} {"train_loss": -5.441959857940674, "global_step": 7879, "epoch": 46} {"train_loss": -5.367542266845703, "global_step": 7880, "epoch": 46} {"train_loss": -5.114296913146973, "global_step": 7881, "epoch": 46} {"train_loss": -5.417915344238281, "global_step": 7882, "epoch": 46} {"train_loss": -5.289336204528809, "global_step": 7883, "epoch": 46} {"train_loss": -5.303638458251953, "global_step": 7884, "epoch": 46} {"train_loss": -5.427406311035156, "global_step": 7885, "epoch": 46} {"train_loss": -5.509984970092773, "global_step": 7886, "epoch": 46} {"train_loss": -5.285648822784424, "global_step": 7887, "epoch": 46} {"train_loss": -5.2106828689575195, "global_step": 7888, "epoch": 46} {"train_loss": -5.145901679992676, "global_step": 7889, "epoch": 46} {"train_loss": -5.4786057472229, "global_step": 7890, "epoch": 46} {"train_loss": -5.253476142883301, "global_step": 7891, "epoch": 46} {"train_loss": -5.471745491027832, "global_step": 7892, "epoch": 46} {"train_loss": -5.581812858581543, "global_step": 7893, "epoch": 46} {"train_loss": -5.512253284454346, "global_step": 7894, "epoch": 46} {"train_loss": -5.426764153298878, "global_step": 7895, "epoch": 46, "val_loss": 261461.453125} {"train_loss": -5.531070232391357, "global_step": 7896, "epoch": 47} {"train_loss": -5.321584701538086, "global_step": 7897, "epoch": 47} {"train_loss": -5.449178695678711, "global_step": 7898, "epoch": 47} {"train_loss": -5.431807518005371, "global_step": 7899, "epoch": 47} {"train_loss": -5.376619815826416, "global_step": 7900, "epoch": 47} {"train_loss": -5.4696149826049805, "global_step": 7901, "epoch": 47} {"train_loss": -5.551994323730469, "global_step": 7902, "epoch": 47} {"train_loss": -5.75928258895874, "global_step": 7903, "epoch": 47} {"train_loss": -5.502392292022705, "global_step": 7904, "epoch": 47} {"train_loss": -5.406003952026367, "global_step": 7905, "epoch": 47} {"train_loss": -5.674882888793945, "global_step": 7906, "epoch": 47} {"train_loss": -5.385224342346191, "global_step": 7907, "epoch": 47} {"train_loss": -5.684333801269531, "global_step": 7908, "epoch": 47} {"train_loss": -5.344778537750244, "global_step": 7909, "epoch": 47} {"train_loss": -5.562122821807861, "global_step": 7910, "epoch": 47} {"train_loss": -5.306066513061523, "global_step": 7911, "epoch": 47} {"train_loss": -4.9926252365112305, "global_step": 7912, "epoch": 47} {"train_loss": -5.307440757751465, "global_step": 7913, "epoch": 47} {"train_loss": -5.264026165008545, "global_step": 7914, "epoch": 47} {"train_loss": -5.270534038543701, "global_step": 7915, "epoch": 47} {"train_loss": -5.709578514099121, "global_step": 7916, "epoch": 47} {"train_loss": -5.372714996337891, "global_step": 7917, "epoch": 47} {"train_loss": -5.459512710571289, "global_step": 7918, "epoch": 47} {"train_loss": -5.433588981628418, "global_step": 7919, "epoch": 47} {"train_loss": -5.660037517547607, "global_step": 7920, "epoch": 47} {"train_loss": -5.533393383026123, "global_step": 7921, "epoch": 47} {"train_loss": -5.530693531036377, "global_step": 7922, "epoch": 47} {"train_loss": -5.445263862609863, "global_step": 7923, "epoch": 47} {"train_loss": -5.660828590393066, "global_step": 7924, "epoch": 47} {"train_loss": -5.458309173583984, "global_step": 7925, "epoch": 47} {"train_loss": -5.644266605377197, "global_step": 7926, "epoch": 47} {"train_loss": -5.480519771575928, "global_step": 7927, "epoch": 47} {"train_loss": -5.483508110046387, "global_step": 7928, "epoch": 47} {"train_loss": -5.325641632080078, "global_step": 7929, "epoch": 47} {"train_loss": -5.37796688079834, "global_step": 7930, "epoch": 47} {"train_loss": -5.24592924118042, "global_step": 7931, "epoch": 47} {"train_loss": -5.551237106323242, "global_step": 7932, "epoch": 47} {"train_loss": -5.709183692932129, "global_step": 7933, "epoch": 47} {"train_loss": -5.468629360198975, "global_step": 7934, "epoch": 47} {"train_loss": -5.383702754974365, "global_step": 7935, "epoch": 47} {"train_loss": -5.591724395751953, "global_step": 7936, "epoch": 47} {"train_loss": -5.4794135093688965, "global_step": 7937, "epoch": 47} {"train_loss": -5.634954452514648, "global_step": 7938, "epoch": 47} {"train_loss": -5.254190921783447, "global_step": 7939, "epoch": 47} {"train_loss": -5.39161491394043, "global_step": 7940, "epoch": 47} {"train_loss": -5.6244378089904785, "global_step": 7941, "epoch": 47} {"train_loss": -5.524589538574219, "global_step": 7942, "epoch": 47} {"train_loss": -5.531371593475342, "global_step": 7943, "epoch": 47} {"train_loss": -5.4271650314331055, "global_step": 7944, "epoch": 47} {"train_loss": -5.338499069213867, "global_step": 7945, "epoch": 47} {"train_loss": -5.674469947814941, "global_step": 7946, "epoch": 47} {"train_loss": -5.40587043762207, "global_step": 7947, "epoch": 47} {"train_loss": -5.3532609939575195, "global_step": 7948, "epoch": 47} {"train_loss": -5.6574530601501465, "global_step": 7949, "epoch": 47} {"train_loss": -5.548079490661621, "global_step": 7950, "epoch": 47} {"train_loss": -5.380913734436035, "global_step": 7951, "epoch": 47} {"train_loss": -5.5497260093688965, "global_step": 7952, "epoch": 47} {"train_loss": -5.600642204284668, "global_step": 7953, "epoch": 47} {"train_loss": -5.7369184494018555, "global_step": 7954, "epoch": 47} {"train_loss": -5.375473976135254, "global_step": 7955, "epoch": 47} {"train_loss": -5.783997058868408, "global_step": 7956, "epoch": 47} {"train_loss": -5.392091274261475, "global_step": 7957, "epoch": 47} {"train_loss": -5.346840858459473, "global_step": 7958, "epoch": 47} {"train_loss": -5.563957691192627, "global_step": 7959, "epoch": 47} {"train_loss": -5.28420352935791, "global_step": 7960, "epoch": 47} {"train_loss": -5.53009033203125, "global_step": 7961, "epoch": 47} {"train_loss": -5.543659210205078, "global_step": 7962, "epoch": 47} {"train_loss": -5.374521255493164, "global_step": 7963, "epoch": 47} {"train_loss": -5.593438148498535, "global_step": 7964, "epoch": 47} {"train_loss": -5.677432537078857, "global_step": 7965, "epoch": 47} {"train_loss": -5.639130592346191, "global_step": 7966, "epoch": 47} {"train_loss": -5.7107014656066895, "global_step": 7967, "epoch": 47} {"train_loss": -5.462643623352051, "global_step": 7968, "epoch": 47} {"train_loss": -5.455126762390137, "global_step": 7969, "epoch": 47} {"train_loss": -5.330575942993164, "global_step": 7970, "epoch": 47} {"train_loss": -5.263408660888672, "global_step": 7971, "epoch": 47} {"train_loss": -5.622550964355469, "global_step": 7972, "epoch": 47} {"train_loss": -5.760074138641357, "global_step": 7973, "epoch": 47} {"train_loss": -5.687553882598877, "global_step": 7974, "epoch": 47} {"train_loss": -5.757798194885254, "global_step": 7975, "epoch": 47} {"train_loss": -5.412327766418457, "global_step": 7976, "epoch": 47} {"train_loss": -5.613363742828369, "global_step": 7977, "epoch": 47} {"train_loss": -5.523495674133301, "global_step": 7978, "epoch": 47} {"train_loss": -5.4204864501953125, "global_step": 7979, "epoch": 47} {"train_loss": -5.733607769012451, "global_step": 7980, "epoch": 47} {"train_loss": -5.380735397338867, "global_step": 7981, "epoch": 47} {"train_loss": -5.567623138427734, "global_step": 7982, "epoch": 47} {"train_loss": -4.977592945098877, "global_step": 7983, "epoch": 47} {"train_loss": -5.524234771728516, "global_step": 7984, "epoch": 47} {"train_loss": -5.577645301818848, "global_step": 7985, "epoch": 47} {"train_loss": -5.597288608551025, "global_step": 7986, "epoch": 47} {"train_loss": -5.482197284698486, "global_step": 7987, "epoch": 47} {"train_loss": -5.643275260925293, "global_step": 7988, "epoch": 47} {"train_loss": -5.101816654205322, "global_step": 7989, "epoch": 47} {"train_loss": -5.4285173416137695, "global_step": 7990, "epoch": 47} {"train_loss": -5.494572639465332, "global_step": 7991, "epoch": 47} {"train_loss": -5.471535682678223, "global_step": 7992, "epoch": 47} {"train_loss": -5.357127666473389, "global_step": 7993, "epoch": 47} {"train_loss": -5.6346845626831055, "global_step": 7994, "epoch": 47} {"train_loss": -5.376877784729004, "global_step": 7995, "epoch": 47} {"train_loss": -5.6215314865112305, "global_step": 7996, "epoch": 47} {"train_loss": -5.498420715332031, "global_step": 7997, "epoch": 47} {"train_loss": -5.539161205291748, "global_step": 7998, "epoch": 47} {"train_loss": -5.4625468254089355, "global_step": 7999, "epoch": 47} {"train_loss": -5.359805583953857, "global_step": 8000, "epoch": 47} {"train_loss": -5.582925319671631, "global_step": 8001, "epoch": 47} {"train_loss": -5.638611316680908, "global_step": 8002, "epoch": 47} {"train_loss": -5.404427528381348, "global_step": 8003, "epoch": 47} {"train_loss": -5.591274261474609, "global_step": 8004, "epoch": 47} {"train_loss": -5.468141555786133, "global_step": 8005, "epoch": 47} {"train_loss": -5.426981449127197, "global_step": 8006, "epoch": 47} {"train_loss": -5.722288131713867, "global_step": 8007, "epoch": 47} {"train_loss": -5.155257701873779, "global_step": 8008, "epoch": 47} {"train_loss": -5.522707939147949, "global_step": 8009, "epoch": 47} {"train_loss": -5.366054534912109, "global_step": 8010, "epoch": 47} {"train_loss": -5.2676496505737305, "global_step": 8011, "epoch": 47} {"train_loss": -5.443305015563965, "global_step": 8012, "epoch": 47} {"train_loss": -5.525331020355225, "global_step": 8013, "epoch": 47} {"train_loss": -5.613245010375977, "global_step": 8014, "epoch": 47} {"train_loss": -5.185565948486328, "global_step": 8015, "epoch": 47} {"train_loss": -5.551971912384033, "global_step": 8016, "epoch": 47} {"train_loss": -5.511871337890625, "global_step": 8017, "epoch": 47} {"train_loss": -5.5517578125, "global_step": 8018, "epoch": 47} {"train_loss": -5.863555908203125, "global_step": 8019, "epoch": 47} {"train_loss": -5.285778045654297, "global_step": 8020, "epoch": 47} {"train_loss": -5.389982223510742, "global_step": 8021, "epoch": 47} {"train_loss": -5.690155029296875, "global_step": 8022, "epoch": 47} {"train_loss": -5.338683128356934, "global_step": 8023, "epoch": 47} {"train_loss": -5.738712310791016, "global_step": 8024, "epoch": 47} {"train_loss": -5.467407703399658, "global_step": 8025, "epoch": 47} {"train_loss": -5.367294788360596, "global_step": 8026, "epoch": 47} {"train_loss": -5.480510234832764, "global_step": 8027, "epoch": 47} {"train_loss": -5.196165084838867, "global_step": 8028, "epoch": 47} {"train_loss": -5.620648384094238, "global_step": 8029, "epoch": 47} {"train_loss": -5.359243869781494, "global_step": 8030, "epoch": 47} {"train_loss": -5.557785511016846, "global_step": 8031, "epoch": 47} {"train_loss": -5.683923721313477, "global_step": 8032, "epoch": 47} {"train_loss": -5.688422203063965, "global_step": 8033, "epoch": 47} {"train_loss": -5.653933048248291, "global_step": 8034, "epoch": 47} {"train_loss": -5.7498273849487305, "global_step": 8035, "epoch": 47} {"train_loss": -5.435168266296387, "global_step": 8036, "epoch": 47} {"train_loss": -5.418923377990723, "global_step": 8037, "epoch": 47} {"train_loss": -5.649778842926025, "global_step": 8038, "epoch": 47} {"train_loss": -5.55668830871582, "global_step": 8039, "epoch": 47} {"train_loss": -5.163677215576172, "global_step": 8040, "epoch": 47} {"train_loss": -5.208207130432129, "global_step": 8041, "epoch": 47} {"train_loss": -5.373138427734375, "global_step": 8042, "epoch": 47} {"train_loss": -5.412479877471924, "global_step": 8043, "epoch": 47} {"train_loss": -5.307328224182129, "global_step": 8044, "epoch": 47} {"train_loss": -5.448265552520752, "global_step": 8045, "epoch": 47} {"train_loss": -5.495044708251953, "global_step": 8046, "epoch": 47} {"train_loss": -5.314202785491943, "global_step": 8047, "epoch": 47} {"train_loss": -5.528141021728516, "global_step": 8048, "epoch": 47} {"train_loss": -5.416557788848877, "global_step": 8049, "epoch": 47} {"train_loss": -5.4879655838012695, "global_step": 8050, "epoch": 47} {"train_loss": -5.4009599685668945, "global_step": 8051, "epoch": 47} {"train_loss": -5.462357044219971, "global_step": 8052, "epoch": 47} {"train_loss": -5.484752655029297, "global_step": 8053, "epoch": 47} {"train_loss": -5.46738862991333, "global_step": 8054, "epoch": 47} {"train_loss": -5.455173492431641, "global_step": 8055, "epoch": 47} {"train_loss": -5.516595363616943, "global_step": 8056, "epoch": 47} {"train_loss": -5.326449394226074, "global_step": 8057, "epoch": 47} {"train_loss": -5.5682220458984375, "global_step": 8058, "epoch": 47} {"train_loss": -5.583878993988037, "global_step": 8059, "epoch": 47} {"train_loss": -5.402092933654785, "global_step": 8060, "epoch": 47} {"train_loss": -5.385650634765625, "global_step": 8061, "epoch": 47} {"train_loss": -5.761987209320068, "global_step": 8062, "epoch": 47} {"train_loss": -5.484269241491954, "global_step": 8063, "epoch": 47, "val_loss": 265505.3125} {"train_loss": -5.417762279510498, "global_step": 8064, "epoch": 48} {"train_loss": -5.59993839263916, "global_step": 8065, "epoch": 48} {"train_loss": -5.543377876281738, "global_step": 8066, "epoch": 48} {"train_loss": -5.343014717102051, "global_step": 8067, "epoch": 48} {"train_loss": -5.769751071929932, "global_step": 8068, "epoch": 48} {"train_loss": -5.32958984375, "global_step": 8069, "epoch": 48} {"train_loss": -5.748790740966797, "global_step": 8070, "epoch": 48} {"train_loss": -5.314611911773682, "global_step": 8071, "epoch": 48} {"train_loss": -5.634625434875488, "global_step": 8072, "epoch": 48} {"train_loss": -5.3297882080078125, "global_step": 8073, "epoch": 48} {"train_loss": -5.766283988952637, "global_step": 8074, "epoch": 48} {"train_loss": -5.42978048324585, "global_step": 8075, "epoch": 48} {"train_loss": -5.446572780609131, "global_step": 8076, "epoch": 48} {"train_loss": -5.358644962310791, "global_step": 8077, "epoch": 48} {"train_loss": -5.792096138000488, "global_step": 8078, "epoch": 48} {"train_loss": -5.522330284118652, "global_step": 8079, "epoch": 48} {"train_loss": -5.230348587036133, "global_step": 8080, "epoch": 48} {"train_loss": -5.499716281890869, "global_step": 8081, "epoch": 48} {"train_loss": -5.581132888793945, "global_step": 8082, "epoch": 48} {"train_loss": -5.715620994567871, "global_step": 8083, "epoch": 48} {"train_loss": -5.712768077850342, "global_step": 8084, "epoch": 48} {"train_loss": -5.000309944152832, "global_step": 8085, "epoch": 48} {"train_loss": -5.478138446807861, "global_step": 8086, "epoch": 48} {"train_loss": -5.054967880249023, "global_step": 8087, "epoch": 48} {"train_loss": -5.286866664886475, "global_step": 8088, "epoch": 48} {"train_loss": -5.4083404541015625, "global_step": 8089, "epoch": 48} {"train_loss": -5.231036186218262, "global_step": 8090, "epoch": 48} {"train_loss": -5.189676284790039, "global_step": 8091, "epoch": 48} {"train_loss": -5.098456382751465, "global_step": 8092, "epoch": 48} {"train_loss": -5.311429500579834, "global_step": 8093, "epoch": 48} {"train_loss": -5.423768043518066, "global_step": 8094, "epoch": 48} {"train_loss": -5.271841049194336, "global_step": 8095, "epoch": 48} {"train_loss": -5.491868019104004, "global_step": 8096, "epoch": 48} {"train_loss": -5.138388633728027, "global_step": 8097, "epoch": 48} {"train_loss": -5.632787704467773, "global_step": 8098, "epoch": 48} {"train_loss": -5.44389533996582, "global_step": 8099, "epoch": 48} {"train_loss": -5.545703411102295, "global_step": 8100, "epoch": 48} {"train_loss": -5.510807991027832, "global_step": 8101, "epoch": 48} {"train_loss": -5.59116268157959, "global_step": 8102, "epoch": 48} {"train_loss": -5.584891319274902, "global_step": 8103, "epoch": 48} {"train_loss": -5.6228227615356445, "global_step": 8104, "epoch": 48} {"train_loss": -5.767529010772705, "global_step": 8105, "epoch": 48} {"train_loss": -5.490113258361816, "global_step": 8106, "epoch": 48} {"train_loss": -5.546823501586914, "global_step": 8107, "epoch": 48} {"train_loss": -5.265564918518066, "global_step": 8108, "epoch": 48} {"train_loss": -5.736391067504883, "global_step": 8109, "epoch": 48} {"train_loss": -5.541486740112305, "global_step": 8110, "epoch": 48} {"train_loss": -5.462976455688477, "global_step": 8111, "epoch": 48} {"train_loss": -5.500454902648926, "global_step": 8112, "epoch": 48} {"train_loss": -5.7683610916137695, "global_step": 8113, "epoch": 48} {"train_loss": -5.523597717285156, "global_step": 8114, "epoch": 48} {"train_loss": -5.558964252471924, "global_step": 8115, "epoch": 48} {"train_loss": -5.440791130065918, "global_step": 8116, "epoch": 48} {"train_loss": -5.739992141723633, "global_step": 8117, "epoch": 48} {"train_loss": -5.410677909851074, "global_step": 8118, "epoch": 48} {"train_loss": -5.504288673400879, "global_step": 8119, "epoch": 48} {"train_loss": -5.734929084777832, "global_step": 8120, "epoch": 48} {"train_loss": -5.530942916870117, "global_step": 8121, "epoch": 48} {"train_loss": -5.637354373931885, "global_step": 8122, "epoch": 48} {"train_loss": -5.446840286254883, "global_step": 8123, "epoch": 48} {"train_loss": -5.685818195343018, "global_step": 8124, "epoch": 48} {"train_loss": -5.402458190917969, "global_step": 8125, "epoch": 48} {"train_loss": -5.698052883148193, "global_step": 8126, "epoch": 48} {"train_loss": -5.568632125854492, "global_step": 8127, "epoch": 48} {"train_loss": -5.2867326736450195, "global_step": 8128, "epoch": 48} {"train_loss": -5.4559454917907715, "global_step": 8129, "epoch": 48} {"train_loss": -5.448805809020996, "global_step": 8130, "epoch": 48} {"train_loss": -5.524338722229004, "global_step": 8131, "epoch": 48} {"train_loss": -5.397651672363281, "global_step": 8132, "epoch": 48} {"train_loss": -5.568052768707275, "global_step": 8133, "epoch": 48} {"train_loss": -5.516602516174316, "global_step": 8134, "epoch": 48} {"train_loss": -5.33724308013916, "global_step": 8135, "epoch": 48} {"train_loss": -5.355607032775879, "global_step": 8136, "epoch": 48} {"train_loss": -5.336099624633789, "global_step": 8137, "epoch": 48} {"train_loss": -5.694108009338379, "global_step": 8138, "epoch": 48} {"train_loss": -5.454670429229736, "global_step": 8139, "epoch": 48} {"train_loss": -5.513205528259277, "global_step": 8140, "epoch": 48} {"train_loss": -5.206416130065918, "global_step": 8141, "epoch": 48} {"train_loss": -5.567475318908691, "global_step": 8142, "epoch": 48} {"train_loss": -5.5600905418396, "global_step": 8143, "epoch": 48} {"train_loss": -5.465789318084717, "global_step": 8144, "epoch": 48} {"train_loss": -5.541960716247559, "global_step": 8145, "epoch": 48} {"train_loss": -5.5809125900268555, "global_step": 8146, "epoch": 48} {"train_loss": -5.200682163238525, "global_step": 8147, "epoch": 48} {"train_loss": -5.613495826721191, "global_step": 8148, "epoch": 48} {"train_loss": -5.460691452026367, "global_step": 8149, "epoch": 48} {"train_loss": -5.543989658355713, "global_step": 8150, "epoch": 48} {"train_loss": -5.379883766174316, "global_step": 8151, "epoch": 48} {"train_loss": -5.38350248336792, "global_step": 8152, "epoch": 48} {"train_loss": -5.590266227722168, "global_step": 8153, "epoch": 48} {"train_loss": -5.595108509063721, "global_step": 8154, "epoch": 48} {"train_loss": -5.488116264343262, "global_step": 8155, "epoch": 48} {"train_loss": -5.574699878692627, "global_step": 8156, "epoch": 48} {"train_loss": -5.382406711578369, "global_step": 8157, "epoch": 48} {"train_loss": -5.5081892013549805, "global_step": 8158, "epoch": 48} {"train_loss": -5.713234901428223, "global_step": 8159, "epoch": 48} {"train_loss": -5.742090702056885, "global_step": 8160, "epoch": 48} {"train_loss": -5.6255035400390625, "global_step": 8161, "epoch": 48} {"train_loss": -5.38027286529541, "global_step": 8162, "epoch": 48} {"train_loss": -5.566673755645752, "global_step": 8163, "epoch": 48} {"train_loss": -5.546695709228516, "global_step": 8164, "epoch": 48} {"train_loss": -5.475754261016846, "global_step": 8165, "epoch": 48} {"train_loss": -5.733188629150391, "global_step": 8166, "epoch": 48} {"train_loss": -5.248887062072754, "global_step": 8167, "epoch": 48} {"train_loss": -5.357392311096191, "global_step": 8168, "epoch": 48} {"train_loss": -5.302288055419922, "global_step": 8169, "epoch": 48} {"train_loss": -5.628724575042725, "global_step": 8170, "epoch": 48} {"train_loss": -5.272913932800293, "global_step": 8171, "epoch": 48} {"train_loss": -5.483842849731445, "global_step": 8172, "epoch": 48} {"train_loss": -5.405691146850586, "global_step": 8173, "epoch": 48} {"train_loss": -5.365518569946289, "global_step": 8174, "epoch": 48} {"train_loss": -5.353039264678955, "global_step": 8175, "epoch": 48} {"train_loss": -5.2140045166015625, "global_step": 8176, "epoch": 48} {"train_loss": -5.561692237854004, "global_step": 8177, "epoch": 48} {"train_loss": -5.54688024520874, "global_step": 8178, "epoch": 48} {"train_loss": -5.513784408569336, "global_step": 8179, "epoch": 48} {"train_loss": -5.473752975463867, "global_step": 8180, "epoch": 48} {"train_loss": -5.430829048156738, "global_step": 8181, "epoch": 48} {"train_loss": -5.556886672973633, "global_step": 8182, "epoch": 48} {"train_loss": -5.266457557678223, "global_step": 8183, "epoch": 48} {"train_loss": -5.619414806365967, "global_step": 8184, "epoch": 48} {"train_loss": -5.059865474700928, "global_step": 8185, "epoch": 48} {"train_loss": -5.510992527008057, "global_step": 8186, "epoch": 48} {"train_loss": -5.049997329711914, "global_step": 8187, "epoch": 48} {"train_loss": -5.594034194946289, "global_step": 8188, "epoch": 48} {"train_loss": -5.290136337280273, "global_step": 8189, "epoch": 48} {"train_loss": -5.20939826965332, "global_step": 8190, "epoch": 48} {"train_loss": -5.114424705505371, "global_step": 8191, "epoch": 48} {"train_loss": -5.2688117027282715, "global_step": 8192, "epoch": 48} {"train_loss": -5.552265167236328, "global_step": 8193, "epoch": 48} {"train_loss": -5.5023322105407715, "global_step": 8194, "epoch": 48} {"train_loss": -5.1722307205200195, "global_step": 8195, "epoch": 48} {"train_loss": -5.486881256103516, "global_step": 8196, "epoch": 48} {"train_loss": -5.276876449584961, "global_step": 8197, "epoch": 48} {"train_loss": -5.338879585266113, "global_step": 8198, "epoch": 48} {"train_loss": -5.2843523025512695, "global_step": 8199, "epoch": 48} {"train_loss": -5.329787254333496, "global_step": 8200, "epoch": 48} {"train_loss": -5.163846015930176, "global_step": 8201, "epoch": 48} {"train_loss": -5.125040054321289, "global_step": 8202, "epoch": 48} {"train_loss": -5.518548011779785, "global_step": 8203, "epoch": 48} {"train_loss": -5.484833240509033, "global_step": 8204, "epoch": 48} {"train_loss": -5.656918525695801, "global_step": 8205, "epoch": 48} {"train_loss": -5.602119445800781, "global_step": 8206, "epoch": 48} {"train_loss": -5.479151248931885, "global_step": 8207, "epoch": 48} {"train_loss": -5.664176940917969, "global_step": 8208, "epoch": 48} {"train_loss": -5.619782447814941, "global_step": 8209, "epoch": 48} {"train_loss": -5.3751654624938965, "global_step": 8210, "epoch": 48} {"train_loss": -5.719267845153809, "global_step": 8211, "epoch": 48} {"train_loss": -5.63900089263916, "global_step": 8212, "epoch": 48} {"train_loss": -5.527095794677734, "global_step": 8213, "epoch": 48} {"train_loss": -5.849062919616699, "global_step": 8214, "epoch": 48} {"train_loss": -5.646494388580322, "global_step": 8215, "epoch": 48} {"train_loss": -5.389822483062744, "global_step": 8216, "epoch": 48} {"train_loss": -5.414960861206055, "global_step": 8217, "epoch": 48} {"train_loss": -5.74743127822876, "global_step": 8218, "epoch": 48} {"train_loss": -5.590904712677002, "global_step": 8219, "epoch": 48} {"train_loss": -5.664356708526611, "global_step": 8220, "epoch": 48} {"train_loss": -5.533358573913574, "global_step": 8221, "epoch": 48} {"train_loss": -5.72759485244751, "global_step": 8222, "epoch": 48} {"train_loss": -5.611004829406738, "global_step": 8223, "epoch": 48} {"train_loss": -5.553840637207031, "global_step": 8224, "epoch": 48} {"train_loss": -5.640892028808594, "global_step": 8225, "epoch": 48} {"train_loss": -5.4093732833862305, "global_step": 8226, "epoch": 48} {"train_loss": -5.098889350891113, "global_step": 8227, "epoch": 48} {"train_loss": -5.4626994132995605, "global_step": 8228, "epoch": 48} {"train_loss": -5.670205116271973, "global_step": 8229, "epoch": 48} {"train_loss": -5.460592269897461, "global_step": 8230, "epoch": 48} {"train_loss": -5.476570325238364, "global_step": 8231, "epoch": 48, "val_loss": 253914.375} {"train_loss": -5.283659934997559, "global_step": 8232, "epoch": 49} {"train_loss": -5.478267192840576, "global_step": 8233, "epoch": 49} {"train_loss": -5.352268218994141, "global_step": 8234, "epoch": 49} {"train_loss": -5.485081672668457, "global_step": 8235, "epoch": 49} {"train_loss": -5.466582298278809, "global_step": 8236, "epoch": 49} {"train_loss": -5.3057966232299805, "global_step": 8237, "epoch": 49} {"train_loss": -5.706915855407715, "global_step": 8238, "epoch": 49} {"train_loss": -5.245595932006836, "global_step": 8239, "epoch": 49} {"train_loss": -5.73616361618042, "global_step": 8240, "epoch": 49} {"train_loss": -5.562910079956055, "global_step": 8241, "epoch": 49} {"train_loss": -4.867076873779297, "global_step": 8242, "epoch": 49} {"train_loss": -5.54326057434082, "global_step": 8243, "epoch": 49} {"train_loss": -5.401444911956787, "global_step": 8244, "epoch": 49} {"train_loss": -5.237131118774414, "global_step": 8245, "epoch": 49} {"train_loss": -5.425017833709717, "global_step": 8246, "epoch": 49} {"train_loss": -5.470418930053711, "global_step": 8247, "epoch": 49} {"train_loss": -5.376341819763184, "global_step": 8248, "epoch": 49} {"train_loss": -5.168992042541504, "global_step": 8249, "epoch": 49} {"train_loss": -5.546922206878662, "global_step": 8250, "epoch": 49} {"train_loss": -5.240084648132324, "global_step": 8251, "epoch": 49} {"train_loss": -5.167604923248291, "global_step": 8252, "epoch": 49} {"train_loss": -5.373529434204102, "global_step": 8253, "epoch": 49} {"train_loss": -5.508623123168945, "global_step": 8254, "epoch": 49} {"train_loss": -5.182058334350586, "global_step": 8255, "epoch": 49} {"train_loss": -5.516378879547119, "global_step": 8256, "epoch": 49} {"train_loss": -5.278940200805664, "global_step": 8257, "epoch": 49} {"train_loss": -5.411279678344727, "global_step": 8258, "epoch": 49} {"train_loss": -5.5572075843811035, "global_step": 8259, "epoch": 49} {"train_loss": -5.437262535095215, "global_step": 8260, "epoch": 49} {"train_loss": -5.496257781982422, "global_step": 8261, "epoch": 49} {"train_loss": -5.374987602233887, "global_step": 8262, "epoch": 49} {"train_loss": -5.539441108703613, "global_step": 8263, "epoch": 49} {"train_loss": -5.454275131225586, "global_step": 8264, "epoch": 49} {"train_loss": -5.474031448364258, "global_step": 8265, "epoch": 49} {"train_loss": -5.739098072052002, "global_step": 8266, "epoch": 49} {"train_loss": -5.5227437019348145, "global_step": 8267, "epoch": 49} {"train_loss": -5.598254203796387, "global_step": 8268, "epoch": 49} {"train_loss": -5.775049209594727, "global_step": 8269, "epoch": 49} {"train_loss": -5.5329484939575195, "global_step": 8270, "epoch": 49} {"train_loss": -5.415339469909668, "global_step": 8271, "epoch": 49} {"train_loss": -5.4079132080078125, "global_step": 8272, "epoch": 49} {"train_loss": -5.599419593811035, "global_step": 8273, "epoch": 49} {"train_loss": -5.620238780975342, "global_step": 8274, "epoch": 49} {"train_loss": -5.533600330352783, "global_step": 8275, "epoch": 49} {"train_loss": -5.5812578201293945, "global_step": 8276, "epoch": 49} {"train_loss": -5.396611213684082, "global_step": 8277, "epoch": 49} {"train_loss": -5.636610984802246, "global_step": 8278, "epoch": 49} {"train_loss": -5.498633861541748, "global_step": 8279, "epoch": 49} {"train_loss": -5.523158550262451, "global_step": 8280, "epoch": 49} {"train_loss": -5.223153591156006, "global_step": 8281, "epoch": 49} {"train_loss": -5.241793632507324, "global_step": 8282, "epoch": 49} {"train_loss": -5.593730926513672, "global_step": 8283, "epoch": 49} {"train_loss": -5.367292404174805, "global_step": 8284, "epoch": 49} {"train_loss": -5.692483901977539, "global_step": 8285, "epoch": 49} {"train_loss": -5.301887035369873, "global_step": 8286, "epoch": 49} {"train_loss": -5.403025150299072, "global_step": 8287, "epoch": 49} {"train_loss": -5.768468379974365, "global_step": 8288, "epoch": 49} {"train_loss": -5.516538143157959, "global_step": 8289, "epoch": 49} {"train_loss": -5.71646785736084, "global_step": 8290, "epoch": 49} {"train_loss": -5.623090744018555, "global_step": 8291, "epoch": 49} {"train_loss": -5.597476482391357, "global_step": 8292, "epoch": 49} {"train_loss": -5.69444465637207, "global_step": 8293, "epoch": 49} {"train_loss": -5.765535354614258, "global_step": 8294, "epoch": 49} {"train_loss": -5.633077144622803, "global_step": 8295, "epoch": 49} {"train_loss": -5.886453151702881, "global_step": 8296, "epoch": 49} {"train_loss": -5.383737564086914, "global_step": 8297, "epoch": 49} {"train_loss": -5.780858039855957, "global_step": 8298, "epoch": 49} {"train_loss": -5.690839767456055, "global_step": 8299, "epoch": 49} {"train_loss": -5.683406829833984, "global_step": 8300, "epoch": 49} {"train_loss": -5.698892116546631, "global_step": 8301, "epoch": 49} {"train_loss": -5.7638726234436035, "global_step": 8302, "epoch": 49} {"train_loss": -5.809207916259766, "global_step": 8303, "epoch": 49} {"train_loss": -5.888455867767334, "global_step": 8304, "epoch": 49} {"train_loss": -5.536455154418945, "global_step": 8305, "epoch": 49} {"train_loss": -5.608989715576172, "global_step": 8306, "epoch": 49} {"train_loss": -5.63519287109375, "global_step": 8307, "epoch": 49} {"train_loss": -5.577851295471191, "global_step": 8308, "epoch": 49} {"train_loss": -5.67207670211792, "global_step": 8309, "epoch": 49} {"train_loss": -5.480976581573486, "global_step": 8310, "epoch": 49} {"train_loss": -5.346518039703369, "global_step": 8311, "epoch": 49} {"train_loss": -5.473251819610596, "global_step": 8312, "epoch": 49} {"train_loss": -5.37119197845459, "global_step": 8313, "epoch": 49} {"train_loss": -5.131925582885742, "global_step": 8314, "epoch": 49} {"train_loss": -5.624217510223389, "global_step": 8315, "epoch": 49} {"train_loss": -5.54081916809082, "global_step": 8316, "epoch": 49} {"train_loss": -5.335040092468262, "global_step": 8317, "epoch": 49} {"train_loss": -5.371274948120117, "global_step": 8318, "epoch": 49} {"train_loss": -5.557942867279053, "global_step": 8319, "epoch": 49} {"train_loss": -5.4187846183776855, "global_step": 8320, "epoch": 49} {"train_loss": -5.549315452575684, "global_step": 8321, "epoch": 49} {"train_loss": -5.387598991394043, "global_step": 8322, "epoch": 49} {"train_loss": -5.2248854637146, "global_step": 8323, "epoch": 49} {"train_loss": -5.295591354370117, "global_step": 8324, "epoch": 49} {"train_loss": -5.3083906173706055, "global_step": 8325, "epoch": 49} {"train_loss": -5.302272796630859, "global_step": 8326, "epoch": 49} {"train_loss": -5.505581855773926, "global_step": 8327, "epoch": 49} {"train_loss": -5.365701198577881, "global_step": 8328, "epoch": 49} {"train_loss": -5.352408409118652, "global_step": 8329, "epoch": 49} {"train_loss": -5.223929405212402, "global_step": 8330, "epoch": 49} {"train_loss": -5.776878356933594, "global_step": 8331, "epoch": 49} {"train_loss": -5.198671817779541, "global_step": 8332, "epoch": 49} {"train_loss": -5.419567584991455, "global_step": 8333, "epoch": 49} {"train_loss": -5.316624641418457, "global_step": 8334, "epoch": 49} {"train_loss": -5.427813529968262, "global_step": 8335, "epoch": 49} {"train_loss": -5.743096351623535, "global_step": 8336, "epoch": 49} {"train_loss": -5.3165764808654785, "global_step": 8337, "epoch": 49} {"train_loss": -5.480257034301758, "global_step": 8338, "epoch": 49} {"train_loss": -5.465073108673096, "global_step": 8339, "epoch": 49} {"train_loss": -5.565309524536133, "global_step": 8340, "epoch": 49} {"train_loss": -5.570495128631592, "global_step": 8341, "epoch": 49} {"train_loss": -5.453984260559082, "global_step": 8342, "epoch": 49} {"train_loss": -5.502723217010498, "global_step": 8343, "epoch": 49} {"train_loss": -5.493680953979492, "global_step": 8344, "epoch": 49} {"train_loss": -5.495736122131348, "global_step": 8345, "epoch": 49} {"train_loss": -5.641648292541504, "global_step": 8346, "epoch": 49} {"train_loss": -5.422421932220459, "global_step": 8347, "epoch": 49} {"train_loss": -5.443428039550781, "global_step": 8348, "epoch": 49} {"train_loss": -5.5975565910339355, "global_step": 8349, "epoch": 49} {"train_loss": -5.54262113571167, "global_step": 8350, "epoch": 49} {"train_loss": -5.434450149536133, "global_step": 8351, "epoch": 49} {"train_loss": -5.748470306396484, "global_step": 8352, "epoch": 49} {"train_loss": -5.563503265380859, "global_step": 8353, "epoch": 49} {"train_loss": -5.415164947509766, "global_step": 8354, "epoch": 49} {"train_loss": -5.590300559997559, "global_step": 8355, "epoch": 49} {"train_loss": -5.4001312255859375, "global_step": 8356, "epoch": 49} {"train_loss": -5.451466083526611, "global_step": 8357, "epoch": 49} {"train_loss": -5.460312366485596, "global_step": 8358, "epoch": 49} {"train_loss": -5.763734340667725, "global_step": 8359, "epoch": 49} {"train_loss": -5.482865333557129, "global_step": 8360, "epoch": 49} {"train_loss": -5.680583953857422, "global_step": 8361, "epoch": 49} {"train_loss": -5.692038059234619, "global_step": 8362, "epoch": 49} {"train_loss": -5.663424491882324, "global_step": 8363, "epoch": 49} {"train_loss": -5.72664737701416, "global_step": 8364, "epoch": 49} {"train_loss": -5.4522480964660645, "global_step": 8365, "epoch": 49} {"train_loss": -5.896565914154053, "global_step": 8366, "epoch": 49} {"train_loss": -5.68612003326416, "global_step": 8367, "epoch": 49} {"train_loss": -5.571462631225586, "global_step": 8368, "epoch": 49} {"train_loss": -5.397180557250977, "global_step": 8369, "epoch": 49} {"train_loss": -5.504807472229004, "global_step": 8370, "epoch": 49} {"train_loss": -5.572208404541016, "global_step": 8371, "epoch": 49} {"train_loss": -5.595368385314941, "global_step": 8372, "epoch": 49} {"train_loss": -5.739618301391602, "global_step": 8373, "epoch": 49} {"train_loss": -5.526688575744629, "global_step": 8374, "epoch": 49} {"train_loss": -5.64486026763916, "global_step": 8375, "epoch": 49} {"train_loss": -5.6060099601745605, "global_step": 8376, "epoch": 49} {"train_loss": -5.54779052734375, "global_step": 8377, "epoch": 49} {"train_loss": -5.690238952636719, "global_step": 8378, "epoch": 49} {"train_loss": -5.508998870849609, "global_step": 8379, "epoch": 49} {"train_loss": -5.594309329986572, "global_step": 8380, "epoch": 49} {"train_loss": -5.665196418762207, "global_step": 8381, "epoch": 49} {"train_loss": -5.462601661682129, "global_step": 8382, "epoch": 49} {"train_loss": -5.708076477050781, "global_step": 8383, "epoch": 49} {"train_loss": -5.515109062194824, "global_step": 8384, "epoch": 49} {"train_loss": -5.650715351104736, "global_step": 8385, "epoch": 49} {"train_loss": -5.654191970825195, "global_step": 8386, "epoch": 49} {"train_loss": -5.941359996795654, "global_step": 8387, "epoch": 49} {"train_loss": -5.522533416748047, "global_step": 8388, "epoch": 49} {"train_loss": -5.66831111907959, "global_step": 8389, "epoch": 49} {"train_loss": -5.696656703948975, "global_step": 8390, "epoch": 49} {"train_loss": -5.775014400482178, "global_step": 8391, "epoch": 49} {"train_loss": -5.5564751625061035, "global_step": 8392, "epoch": 49} {"train_loss": -5.748189926147461, "global_step": 8393, "epoch": 49} {"train_loss": -5.527322769165039, "global_step": 8394, "epoch": 49} {"train_loss": -5.597580909729004, "global_step": 8395, "epoch": 49} {"train_loss": -5.427407264709473, "global_step": 8396, "epoch": 49} {"train_loss": -5.612015247344971, "global_step": 8397, "epoch": 49} {"train_loss": -5.353360176086426, "global_step": 8398, "epoch": 49} {"train_loss": -5.518070638179779, "global_step": 8399, "epoch": 49, "val_loss": 262470.4375} {"train_loss": -5.690618991851807, "global_step": 8400, "epoch": 50} {"train_loss": -5.447423934936523, "global_step": 8401, "epoch": 50} {"train_loss": -5.529750823974609, "global_step": 8402, "epoch": 50} {"train_loss": -5.574784278869629, "global_step": 8403, "epoch": 50} {"train_loss": -5.396758079528809, "global_step": 8404, "epoch": 50} {"train_loss": -5.519435882568359, "global_step": 8405, "epoch": 50} {"train_loss": -5.691514015197754, "global_step": 8406, "epoch": 50} {"train_loss": -5.522989273071289, "global_step": 8407, "epoch": 50} {"train_loss": -5.69569206237793, "global_step": 8408, "epoch": 50} {"train_loss": -5.521004676818848, "global_step": 8409, "epoch": 50} {"train_loss": -5.590691089630127, "global_step": 8410, "epoch": 50} {"train_loss": -5.492221832275391, "global_step": 8411, "epoch": 50} {"train_loss": -5.152509689331055, "global_step": 8412, "epoch": 50} {"train_loss": -5.38392972946167, "global_step": 8413, "epoch": 50} {"train_loss": -5.397692680358887, "global_step": 8414, "epoch": 50} {"train_loss": -5.472830772399902, "global_step": 8415, "epoch": 50} {"train_loss": -5.295459747314453, "global_step": 8416, "epoch": 50} {"train_loss": -5.569109916687012, "global_step": 8417, "epoch": 50} {"train_loss": -5.671875953674316, "global_step": 8418, "epoch": 50} {"train_loss": -5.419573783874512, "global_step": 8419, "epoch": 50} {"train_loss": -5.6711835861206055, "global_step": 8420, "epoch": 50} {"train_loss": -5.5704216957092285, "global_step": 8421, "epoch": 50} {"train_loss": -5.439197540283203, "global_step": 8422, "epoch": 50} {"train_loss": -5.445977210998535, "global_step": 8423, "epoch": 50} {"train_loss": -5.710513114929199, "global_step": 8424, "epoch": 50} {"train_loss": -5.520302772521973, "global_step": 8425, "epoch": 50} {"train_loss": -5.471499443054199, "global_step": 8426, "epoch": 50} {"train_loss": -5.342874526977539, "global_step": 8427, "epoch": 50} {"train_loss": -5.391186714172363, "global_step": 8428, "epoch": 50} {"train_loss": -5.390345573425293, "global_step": 8429, "epoch": 50} {"train_loss": -5.231108665466309, "global_step": 8430, "epoch": 50} {"train_loss": -5.515698432922363, "global_step": 8431, "epoch": 50} {"train_loss": -5.690009117126465, "global_step": 8432, "epoch": 50} {"train_loss": -5.706203937530518, "global_step": 8433, "epoch": 50} {"train_loss": -5.3535475730896, "global_step": 8434, "epoch": 50} {"train_loss": -5.449808120727539, "global_step": 8435, "epoch": 50} {"train_loss": -5.510019302368164, "global_step": 8436, "epoch": 50} {"train_loss": -5.3546552658081055, "global_step": 8437, "epoch": 50} {"train_loss": -5.601433753967285, "global_step": 8438, "epoch": 50} {"train_loss": -5.301839351654053, "global_step": 8439, "epoch": 50} {"train_loss": -5.392570972442627, "global_step": 8440, "epoch": 50} {"train_loss": -5.814411163330078, "global_step": 8441, "epoch": 50} {"train_loss": -5.516025066375732, "global_step": 8442, "epoch": 50} {"train_loss": -5.501901149749756, "global_step": 8443, "epoch": 50} {"train_loss": -5.367306232452393, "global_step": 8444, "epoch": 50} {"train_loss": -5.502973556518555, "global_step": 8445, "epoch": 50} {"train_loss": -5.551386833190918, "global_step": 8446, "epoch": 50} {"train_loss": -5.448196887969971, "global_step": 8447, "epoch": 50} {"train_loss": -5.697061538696289, "global_step": 8448, "epoch": 50} {"train_loss": -5.444298267364502, "global_step": 8449, "epoch": 50} {"train_loss": -5.610033988952637, "global_step": 8450, "epoch": 50} {"train_loss": -5.606525421142578, "global_step": 8451, "epoch": 50} {"train_loss": -5.073641300201416, "global_step": 8452, "epoch": 50} {"train_loss": -5.32930850982666, "global_step": 8453, "epoch": 50} {"train_loss": -5.4112958908081055, "global_step": 8454, "epoch": 50} {"train_loss": -5.589005947113037, "global_step": 8455, "epoch": 50} {"train_loss": -5.4355573654174805, "global_step": 8456, "epoch": 50} {"train_loss": -5.536627769470215, "global_step": 8457, "epoch": 50} {"train_loss": -5.345157623291016, "global_step": 8458, "epoch": 50} {"train_loss": -5.461794853210449, "global_step": 8459, "epoch": 50} {"train_loss": -5.686007499694824, "global_step": 8460, "epoch": 50} {"train_loss": -5.349007606506348, "global_step": 8461, "epoch": 50} {"train_loss": -5.285482883453369, "global_step": 8462, "epoch": 50} {"train_loss": -5.4929704666137695, "global_step": 8463, "epoch": 50} {"train_loss": -5.218700408935547, "global_step": 8464, "epoch": 50} {"train_loss": -5.104689598083496, "global_step": 8465, "epoch": 50} {"train_loss": -5.352862358093262, "global_step": 8466, "epoch": 50} {"train_loss": -5.334418773651123, "global_step": 8467, "epoch": 50} {"train_loss": -5.391789436340332, "global_step": 8468, "epoch": 50} {"train_loss": -5.42303466796875, "global_step": 8469, "epoch": 50} {"train_loss": -5.370056629180908, "global_step": 8470, "epoch": 50} {"train_loss": -5.073302745819092, "global_step": 8471, "epoch": 50} {"train_loss": -5.4324212074279785, "global_step": 8472, "epoch": 50} {"train_loss": -5.344851493835449, "global_step": 8473, "epoch": 50} {"train_loss": -5.231266021728516, "global_step": 8474, "epoch": 50} {"train_loss": -5.163202285766602, "global_step": 8475, "epoch": 50} {"train_loss": -5.183571815490723, "global_step": 8476, "epoch": 50} {"train_loss": -5.296934127807617, "global_step": 8477, "epoch": 50} {"train_loss": -5.542395114898682, "global_step": 8478, "epoch": 50} {"train_loss": -5.435535430908203, "global_step": 8479, "epoch": 50} {"train_loss": -5.235443115234375, "global_step": 8480, "epoch": 50} {"train_loss": -5.617269515991211, "global_step": 8481, "epoch": 50} {"train_loss": -5.619932174682617, "global_step": 8482, "epoch": 50} {"train_loss": -5.33950138092041, "global_step": 8483, "epoch": 50} {"train_loss": -5.463755130767822, "global_step": 8484, "epoch": 50} {"train_loss": -5.549600124359131, "global_step": 8485, "epoch": 50} {"train_loss": -5.219696998596191, "global_step": 8486, "epoch": 50} {"train_loss": -5.419923782348633, "global_step": 8487, "epoch": 50} {"train_loss": -5.564794540405273, "global_step": 8488, "epoch": 50} {"train_loss": -5.635601043701172, "global_step": 8489, "epoch": 50} {"train_loss": -5.738163948059082, "global_step": 8490, "epoch": 50} {"train_loss": -5.4109954833984375, "global_step": 8491, "epoch": 50} {"train_loss": -5.664156913757324, "global_step": 8492, "epoch": 50} {"train_loss": -5.579310417175293, "global_step": 8493, "epoch": 50} {"train_loss": -5.565712928771973, "global_step": 8494, "epoch": 50} {"train_loss": -5.582866668701172, "global_step": 8495, "epoch": 50} {"train_loss": -5.525656700134277, "global_step": 8496, "epoch": 50} {"train_loss": -5.561398983001709, "global_step": 8497, "epoch": 50} {"train_loss": -5.589659690856934, "global_step": 8498, "epoch": 50} {"train_loss": -5.656212329864502, "global_step": 8499, "epoch": 50} {"train_loss": -5.635136127471924, "global_step": 8500, "epoch": 50} {"train_loss": -5.735342025756836, "global_step": 8501, "epoch": 50} {"train_loss": -5.504593849182129, "global_step": 8502, "epoch": 50} {"train_loss": -5.410068511962891, "global_step": 8503, "epoch": 50} {"train_loss": -5.500450611114502, "global_step": 8504, "epoch": 50} {"train_loss": -5.445666790008545, "global_step": 8505, "epoch": 50} {"train_loss": -5.66013240814209, "global_step": 8506, "epoch": 50} {"train_loss": -5.410453796386719, "global_step": 8507, "epoch": 50} {"train_loss": -5.2588958740234375, "global_step": 8508, "epoch": 50} {"train_loss": -5.726857662200928, "global_step": 8509, "epoch": 50} {"train_loss": -5.655882835388184, "global_step": 8510, "epoch": 50} {"train_loss": -5.298924446105957, "global_step": 8511, "epoch": 50} {"train_loss": -5.495485305786133, "global_step": 8512, "epoch": 50} {"train_loss": -5.463528156280518, "global_step": 8513, "epoch": 50} {"train_loss": -5.611722946166992, "global_step": 8514, "epoch": 50} {"train_loss": -5.532323837280273, "global_step": 8515, "epoch": 50} {"train_loss": -5.627327919006348, "global_step": 8516, "epoch": 50} {"train_loss": -5.54941463470459, "global_step": 8517, "epoch": 50} {"train_loss": -5.574240684509277, "global_step": 8518, "epoch": 50} {"train_loss": -5.539368152618408, "global_step": 8519, "epoch": 50} {"train_loss": -5.607471942901611, "global_step": 8520, "epoch": 50} {"train_loss": -5.650613784790039, "global_step": 8521, "epoch": 50} {"train_loss": -5.605206489562988, "global_step": 8522, "epoch": 50} {"train_loss": -5.577083587646484, "global_step": 8523, "epoch": 50} {"train_loss": -5.603346824645996, "global_step": 8524, "epoch": 50} {"train_loss": -5.881749153137207, "global_step": 8525, "epoch": 50} {"train_loss": -5.659665107727051, "global_step": 8526, "epoch": 50} {"train_loss": -5.94467830657959, "global_step": 8527, "epoch": 50} {"train_loss": -5.686431407928467, "global_step": 8528, "epoch": 50} {"train_loss": -5.607727527618408, "global_step": 8529, "epoch": 50} {"train_loss": -5.597396373748779, "global_step": 8530, "epoch": 50} {"train_loss": -5.686859607696533, "global_step": 8531, "epoch": 50} {"train_loss": -5.698744773864746, "global_step": 8532, "epoch": 50} {"train_loss": -5.73501443862915, "global_step": 8533, "epoch": 50} {"train_loss": -5.7516913414001465, "global_step": 8534, "epoch": 50} {"train_loss": -5.7846503257751465, "global_step": 8535, "epoch": 50} {"train_loss": -5.427371978759766, "global_step": 8536, "epoch": 50} {"train_loss": -5.505331993103027, "global_step": 8537, "epoch": 50} {"train_loss": -5.764021873474121, "global_step": 8538, "epoch": 50} {"train_loss": -5.587923049926758, "global_step": 8539, "epoch": 50} {"train_loss": -5.634366512298584, "global_step": 8540, "epoch": 50} {"train_loss": -5.508909225463867, "global_step": 8541, "epoch": 50} {"train_loss": -5.652875900268555, "global_step": 8542, "epoch": 50} {"train_loss": -5.472282409667969, "global_step": 8543, "epoch": 50} {"train_loss": -5.552691459655762, "global_step": 8544, "epoch": 50} {"train_loss": -5.846292972564697, "global_step": 8545, "epoch": 50} {"train_loss": -5.3701324462890625, "global_step": 8546, "epoch": 50} {"train_loss": -5.685722351074219, "global_step": 8547, "epoch": 50} {"train_loss": -5.655535697937012, "global_step": 8548, "epoch": 50} {"train_loss": -5.778811454772949, "global_step": 8549, "epoch": 50} {"train_loss": -5.451139450073242, "global_step": 8550, "epoch": 50} {"train_loss": -5.599173545837402, "global_step": 8551, "epoch": 50} {"train_loss": -5.412631511688232, "global_step": 8552, "epoch": 50} {"train_loss": -5.641348838806152, "global_step": 8553, "epoch": 50} {"train_loss": -5.498805999755859, "global_step": 8554, "epoch": 50} {"train_loss": -5.606035232543945, "global_step": 8555, "epoch": 50} {"train_loss": -5.460505962371826, "global_step": 8556, "epoch": 50} {"train_loss": -5.537533760070801, "global_step": 8557, "epoch": 50} {"train_loss": -5.481595993041992, "global_step": 8558, "epoch": 50} {"train_loss": -5.606528282165527, "global_step": 8559, "epoch": 50} {"train_loss": -5.4524030685424805, "global_step": 8560, "epoch": 50} {"train_loss": -5.62694787979126, "global_step": 8561, "epoch": 50} {"train_loss": -5.509327411651611, "global_step": 8562, "epoch": 50} {"train_loss": -5.575604438781738, "global_step": 8563, "epoch": 50} {"train_loss": -5.510466575622559, "global_step": 8564, "epoch": 50} {"train_loss": -5.367685317993164, "global_step": 8565, "epoch": 50} {"train_loss": -5.366747856140137, "global_step": 8566, "epoch": 50} {"train_loss": -5.511322064059121, "global_step": 8567, "epoch": 50, "train/sim_max_reward_0": 0.624770652924541, "train/sim_max_reward_1": 0.9981215349053315, "train/sim_max_reward_2": 0.9372548081009564, "train/sim_max_reward_3": 0.5941596640447865, "train/sim_max_reward_4": 0.9623019784358214, "train/sim_max_reward_5": 0.5128355340896555, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 0.055100884220027686, "test/sim_max_reward_4400003": 0.2971245594656171, "test/sim_max_reward_4400004": 0.41834023847246204, "test/sim_max_reward_4400005": 0.039270662726964056, "test/sim_max_reward_4400006": 0.3002847658079877, "test/sim_max_reward_4400007": 0.984033631220112, "test/sim_max_reward_4400008": 0.693097266014542, "test/sim_max_reward_4400009": 0.5736675187029104, "test/sim_max_reward_4400010": 0.2304435708565551, "test/sim_max_reward_4400011": 0.9570123097213447, "test/sim_max_reward_4400012": 0.9155544995828895, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.9119940036496265, "test/sim_max_reward_4400015": 0.37167361651717573, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.6268404355255899, "test/sim_max_reward_4400019": 0.2870744777019958, "test/sim_max_reward_4400020": 0.002078462520255241, "test/sim_max_reward_4400021": 0.4450270959651152, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.18832729275223006, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.47370603097036923, "test/sim_max_reward_4400026": 0.9149661720104412, "test/sim_max_reward_4400027": 0.4575363230952497, "test/sim_max_reward_4400028": 0.7134878474148431, "test/sim_max_reward_4400029": 0.5566660653322101, "test/sim_max_reward_4400030": 0.7843751977764557, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.21489478361302913, "test/sim_max_reward_4400033": 0.16480668567912088, "test/sim_max_reward_4400034": 0.671068260089701, "test/sim_max_reward_4400035": 0.4507784725734187, "test/sim_max_reward_4400036": 0.37661087702674506, "test/sim_max_reward_4400037": 0.9016189190552051, "test/sim_max_reward_4400038": 0.0, "test/sim_max_reward_4400039": 0.473807912129498, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.17634858758543262, "test/sim_max_reward_4400042": 0.9462714453107344, "test/sim_max_reward_4400043": 0.6137374666955189, "test/sim_max_reward_4400044": 0.27901634524800495, "test/sim_max_reward_4400045": 0.4768007923007933, "test/sim_max_reward_4400046": 0.470042104449788, "test/sim_max_reward_4400047": 0.61683034372063, "test/sim_max_reward_4400048": 0.544559370900444, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.771574028750182, "test/mean_score": 0.4734636388244535, "val_loss": 265274.9375, "train_action_mse_error": 53.05918884277344} {"train_loss": -5.594315528869629, "global_step": 8568, "epoch": 51} {"train_loss": -5.600322723388672, "global_step": 8569, "epoch": 51} {"train_loss": -5.417410850524902, "global_step": 8570, "epoch": 51} {"train_loss": -5.7215070724487305, "global_step": 8571, "epoch": 51} {"train_loss": -5.383009433746338, "global_step": 8572, "epoch": 51} {"train_loss": -5.604464054107666, "global_step": 8573, "epoch": 51} {"train_loss": -5.510404586791992, "global_step": 8574, "epoch": 51} {"train_loss": -5.629202842712402, "global_step": 8575, "epoch": 51} {"train_loss": -5.608698844909668, "global_step": 8576, "epoch": 51} {"train_loss": -5.4356303215026855, "global_step": 8577, "epoch": 51} {"train_loss": -5.478890419006348, "global_step": 8578, "epoch": 51} {"train_loss": -5.649942874908447, "global_step": 8579, "epoch": 51} {"train_loss": -5.704768180847168, "global_step": 8580, "epoch": 51} {"train_loss": -5.488443851470947, "global_step": 8581, "epoch": 51} {"train_loss": -5.834344387054443, "global_step": 8582, "epoch": 51} {"train_loss": -5.425482749938965, "global_step": 8583, "epoch": 51} {"train_loss": -5.5798444747924805, "global_step": 8584, "epoch": 51} {"train_loss": -5.254454612731934, "global_step": 8585, "epoch": 51} {"train_loss": -5.740865707397461, "global_step": 8586, "epoch": 51} {"train_loss": -5.486732482910156, "global_step": 8587, "epoch": 51} {"train_loss": -5.64364767074585, "global_step": 8588, "epoch": 51} {"train_loss": -5.647858619689941, "global_step": 8589, "epoch": 51} {"train_loss": -5.701751708984375, "global_step": 8590, "epoch": 51} {"train_loss": -5.673975467681885, "global_step": 8591, "epoch": 51} {"train_loss": -5.816610813140869, "global_step": 8592, "epoch": 51} {"train_loss": -5.443871021270752, "global_step": 8593, "epoch": 51} {"train_loss": -5.76627254486084, "global_step": 8594, "epoch": 51} {"train_loss": -5.614163398742676, "global_step": 8595, "epoch": 51} {"train_loss": -5.457676887512207, "global_step": 8596, "epoch": 51} {"train_loss": -5.566462993621826, "global_step": 8597, "epoch": 51} {"train_loss": -5.720439910888672, "global_step": 8598, "epoch": 51} {"train_loss": -5.5698676109313965, "global_step": 8599, "epoch": 51} {"train_loss": -5.57243013381958, "global_step": 8600, "epoch": 51} {"train_loss": -5.390631675720215, "global_step": 8601, "epoch": 51} {"train_loss": -5.925628185272217, "global_step": 8602, "epoch": 51} {"train_loss": -5.627311706542969, "global_step": 8603, "epoch": 51} {"train_loss": -5.521650314331055, "global_step": 8604, "epoch": 51} {"train_loss": -5.473268508911133, "global_step": 8605, "epoch": 51} {"train_loss": -5.442227363586426, "global_step": 8606, "epoch": 51} {"train_loss": -5.682468891143799, "global_step": 8607, "epoch": 51} {"train_loss": -5.636290073394775, "global_step": 8608, "epoch": 51} {"train_loss": -5.615865707397461, "global_step": 8609, "epoch": 51} {"train_loss": -5.748525142669678, "global_step": 8610, "epoch": 51} {"train_loss": -5.76668643951416, "global_step": 8611, "epoch": 51} {"train_loss": -5.530072212219238, "global_step": 8612, "epoch": 51} {"train_loss": -5.651156902313232, "global_step": 8613, "epoch": 51} {"train_loss": -5.688647270202637, "global_step": 8614, "epoch": 51} {"train_loss": -5.603420257568359, "global_step": 8615, "epoch": 51} {"train_loss": -5.570461273193359, "global_step": 8616, "epoch": 51} {"train_loss": -5.754090785980225, "global_step": 8617, "epoch": 51} {"train_loss": -5.931437015533447, "global_step": 8618, "epoch": 51} {"train_loss": -5.397922515869141, "global_step": 8619, "epoch": 51} {"train_loss": -5.5239667892456055, "global_step": 8620, "epoch": 51} {"train_loss": -5.666112899780273, "global_step": 8621, "epoch": 51} {"train_loss": -5.818300247192383, "global_step": 8622, "epoch": 51} {"train_loss": -5.67990255355835, "global_step": 8623, "epoch": 51} {"train_loss": -5.791272163391113, "global_step": 8624, "epoch": 51} {"train_loss": -5.6588335037231445, "global_step": 8625, "epoch": 51} {"train_loss": -5.683869361877441, "global_step": 8626, "epoch": 51} {"train_loss": -5.438239097595215, "global_step": 8627, "epoch": 51} {"train_loss": -5.476642608642578, "global_step": 8628, "epoch": 51} {"train_loss": -5.476921081542969, "global_step": 8629, "epoch": 51} {"train_loss": -5.630032539367676, "global_step": 8630, "epoch": 51} {"train_loss": -5.740166664123535, "global_step": 8631, "epoch": 51} {"train_loss": -5.6164374351501465, "global_step": 8632, "epoch": 51} {"train_loss": -5.4577555656433105, "global_step": 8633, "epoch": 51} {"train_loss": -5.538858413696289, "global_step": 8634, "epoch": 51} {"train_loss": -5.349781036376953, "global_step": 8635, "epoch": 51} {"train_loss": -5.7478766441345215, "global_step": 8636, "epoch": 51} {"train_loss": -5.743899345397949, "global_step": 8637, "epoch": 51} {"train_loss": -5.552254676818848, "global_step": 8638, "epoch": 51} {"train_loss": -5.436323642730713, "global_step": 8639, "epoch": 51} {"train_loss": -5.576972961425781, "global_step": 8640, "epoch": 51} {"train_loss": -5.515556335449219, "global_step": 8641, "epoch": 51} {"train_loss": -5.475229263305664, "global_step": 8642, "epoch": 51} {"train_loss": -5.718578815460205, "global_step": 8643, "epoch": 51} {"train_loss": -5.4495015144348145, "global_step": 8644, "epoch": 51} {"train_loss": -5.618574142456055, "global_step": 8645, "epoch": 51} {"train_loss": -5.5718994140625, "global_step": 8646, "epoch": 51} {"train_loss": -5.639104843139648, "global_step": 8647, "epoch": 51} {"train_loss": -5.580191135406494, "global_step": 8648, "epoch": 51} {"train_loss": -5.543042182922363, "global_step": 8649, "epoch": 51} {"train_loss": -5.637609958648682, "global_step": 8650, "epoch": 51} {"train_loss": -5.7499237060546875, "global_step": 8651, "epoch": 51} {"train_loss": -5.168545722961426, "global_step": 8652, "epoch": 51} {"train_loss": -5.413239479064941, "global_step": 8653, "epoch": 51} {"train_loss": -5.688002109527588, "global_step": 8654, "epoch": 51} {"train_loss": -5.533266544342041, "global_step": 8655, "epoch": 51} {"train_loss": -5.418437480926514, "global_step": 8656, "epoch": 51} {"train_loss": -5.469778060913086, "global_step": 8657, "epoch": 51} {"train_loss": -5.674156188964844, "global_step": 8658, "epoch": 51} {"train_loss": -5.514743804931641, "global_step": 8659, "epoch": 51} {"train_loss": -5.8877387046813965, "global_step": 8660, "epoch": 51} {"train_loss": -5.423218727111816, "global_step": 8661, "epoch": 51} {"train_loss": -5.34666633605957, "global_step": 8662, "epoch": 51} {"train_loss": -5.590173721313477, "global_step": 8663, "epoch": 51} {"train_loss": -5.6155619621276855, "global_step": 8664, "epoch": 51} {"train_loss": -5.74171257019043, "global_step": 8665, "epoch": 51} {"train_loss": -5.576509475708008, "global_step": 8666, "epoch": 51} {"train_loss": -5.447029113769531, "global_step": 8667, "epoch": 51} {"train_loss": -5.984707832336426, "global_step": 8668, "epoch": 51} {"train_loss": -5.637763977050781, "global_step": 8669, "epoch": 51} {"train_loss": -5.7281293869018555, "global_step": 8670, "epoch": 51} {"train_loss": -5.32047700881958, "global_step": 8671, "epoch": 51} {"train_loss": -5.3198161125183105, "global_step": 8672, "epoch": 51} {"train_loss": -5.5700483322143555, "global_step": 8673, "epoch": 51} {"train_loss": -5.269766330718994, "global_step": 8674, "epoch": 51} {"train_loss": -5.754550457000732, "global_step": 8675, "epoch": 51} {"train_loss": -5.59420108795166, "global_step": 8676, "epoch": 51} {"train_loss": -5.567496299743652, "global_step": 8677, "epoch": 51} {"train_loss": -5.718259334564209, "global_step": 8678, "epoch": 51} {"train_loss": -5.233624458312988, "global_step": 8679, "epoch": 51} {"train_loss": -5.702618598937988, "global_step": 8680, "epoch": 51} {"train_loss": -5.401955604553223, "global_step": 8681, "epoch": 51} {"train_loss": -5.4931182861328125, "global_step": 8682, "epoch": 51} {"train_loss": -5.492918014526367, "global_step": 8683, "epoch": 51} {"train_loss": -5.206212997436523, "global_step": 8684, "epoch": 51} {"train_loss": -5.777007102966309, "global_step": 8685, "epoch": 51} {"train_loss": -5.457242965698242, "global_step": 8686, "epoch": 51} {"train_loss": -5.31697940826416, "global_step": 8687, "epoch": 51} {"train_loss": -5.393433570861816, "global_step": 8688, "epoch": 51} {"train_loss": -5.514981746673584, "global_step": 8689, "epoch": 51} {"train_loss": -5.4219231605529785, "global_step": 8690, "epoch": 51} {"train_loss": -5.59160041809082, "global_step": 8691, "epoch": 51} {"train_loss": -5.37942361831665, "global_step": 8692, "epoch": 51} {"train_loss": -5.518712520599365, "global_step": 8693, "epoch": 51} {"train_loss": -5.680152893066406, "global_step": 8694, "epoch": 51} {"train_loss": -5.440215587615967, "global_step": 8695, "epoch": 51} {"train_loss": -5.571638584136963, "global_step": 8696, "epoch": 51} {"train_loss": -5.578586578369141, "global_step": 8697, "epoch": 51} {"train_loss": -5.700037002563477, "global_step": 8698, "epoch": 51} {"train_loss": -5.743776798248291, "global_step": 8699, "epoch": 51} {"train_loss": -5.6201171875, "global_step": 8700, "epoch": 51} {"train_loss": -5.446657657623291, "global_step": 8701, "epoch": 51} {"train_loss": -5.351888656616211, "global_step": 8702, "epoch": 51} {"train_loss": -5.445259094238281, "global_step": 8703, "epoch": 51} {"train_loss": -5.666038990020752, "global_step": 8704, "epoch": 51} {"train_loss": -5.579242706298828, "global_step": 8705, "epoch": 51} {"train_loss": -5.5824971199035645, "global_step": 8706, "epoch": 51} {"train_loss": -5.600442886352539, "global_step": 8707, "epoch": 51} {"train_loss": -5.544048309326172, "global_step": 8708, "epoch": 51} {"train_loss": -5.489194393157959, "global_step": 8709, "epoch": 51} {"train_loss": -5.552914142608643, "global_step": 8710, "epoch": 51} {"train_loss": -5.670033931732178, "global_step": 8711, "epoch": 51} {"train_loss": -5.830723762512207, "global_step": 8712, "epoch": 51} {"train_loss": -5.520730972290039, "global_step": 8713, "epoch": 51} {"train_loss": -5.707648277282715, "global_step": 8714, "epoch": 51} {"train_loss": -5.24827766418457, "global_step": 8715, "epoch": 51} {"train_loss": -5.867859840393066, "global_step": 8716, "epoch": 51} {"train_loss": -5.681873321533203, "global_step": 8717, "epoch": 51} {"train_loss": -5.6384053230285645, "global_step": 8718, "epoch": 51} {"train_loss": -5.556231498718262, "global_step": 8719, "epoch": 51} {"train_loss": -5.904041290283203, "global_step": 8720, "epoch": 51} {"train_loss": -5.717471122741699, "global_step": 8721, "epoch": 51} {"train_loss": -5.588205814361572, "global_step": 8722, "epoch": 51} {"train_loss": -5.449864387512207, "global_step": 8723, "epoch": 51} {"train_loss": -5.325414180755615, "global_step": 8724, "epoch": 51} {"train_loss": -5.653485298156738, "global_step": 8725, "epoch": 51} {"train_loss": -5.605907440185547, "global_step": 8726, "epoch": 51} {"train_loss": -5.466488361358643, "global_step": 8727, "epoch": 51} {"train_loss": -5.669062614440918, "global_step": 8728, "epoch": 51} {"train_loss": -5.759725570678711, "global_step": 8729, "epoch": 51} {"train_loss": -5.408928394317627, "global_step": 8730, "epoch": 51} {"train_loss": -5.502410888671875, "global_step": 8731, "epoch": 51} {"train_loss": -5.762282371520996, "global_step": 8732, "epoch": 51} {"train_loss": -5.405479431152344, "global_step": 8733, "epoch": 51} {"train_loss": -5.755695343017578, "global_step": 8734, "epoch": 51} {"train_loss": -5.577987202576229, "global_step": 8735, "epoch": 51, "val_loss": 281177.5625} {"train_loss": -5.8602213859558105, "global_step": 8736, "epoch": 52} {"train_loss": -5.602602958679199, "global_step": 8737, "epoch": 52} {"train_loss": -5.5015106201171875, "global_step": 8738, "epoch": 52} {"train_loss": -5.862978458404541, "global_step": 8739, "epoch": 52} {"train_loss": -5.422797203063965, "global_step": 8740, "epoch": 52} {"train_loss": -5.735293865203857, "global_step": 8741, "epoch": 52} {"train_loss": -5.671445846557617, "global_step": 8742, "epoch": 52} {"train_loss": -5.933493614196777, "global_step": 8743, "epoch": 52} {"train_loss": -5.545251369476318, "global_step": 8744, "epoch": 52} {"train_loss": -5.5296759605407715, "global_step": 8745, "epoch": 52} {"train_loss": -5.310594081878662, "global_step": 8746, "epoch": 52} {"train_loss": -5.439801216125488, "global_step": 8747, "epoch": 52} {"train_loss": -5.736800193786621, "global_step": 8748, "epoch": 52} {"train_loss": -5.788507461547852, "global_step": 8749, "epoch": 52} {"train_loss": -5.885636806488037, "global_step": 8750, "epoch": 52} {"train_loss": -5.815313339233398, "global_step": 8751, "epoch": 52} {"train_loss": -5.987051010131836, "global_step": 8752, "epoch": 52} {"train_loss": -5.681621551513672, "global_step": 8753, "epoch": 52} {"train_loss": -5.6895222663879395, "global_step": 8754, "epoch": 52} {"train_loss": -5.365674018859863, "global_step": 8755, "epoch": 52} {"train_loss": -5.619828701019287, "global_step": 8756, "epoch": 52} {"train_loss": -5.519366264343262, "global_step": 8757, "epoch": 52} {"train_loss": -5.790130138397217, "global_step": 8758, "epoch": 52} {"train_loss": -5.6689453125, "global_step": 8759, "epoch": 52} {"train_loss": -5.710640907287598, "global_step": 8760, "epoch": 52} {"train_loss": -5.55190896987915, "global_step": 8761, "epoch": 52} {"train_loss": -5.59257173538208, "global_step": 8762, "epoch": 52} {"train_loss": -5.664974689483643, "global_step": 8763, "epoch": 52} {"train_loss": -5.629372596740723, "global_step": 8764, "epoch": 52} {"train_loss": -5.771410942077637, "global_step": 8765, "epoch": 52} {"train_loss": -5.762246131896973, "global_step": 8766, "epoch": 52} {"train_loss": -5.374333381652832, "global_step": 8767, "epoch": 52} {"train_loss": -5.871685028076172, "global_step": 8768, "epoch": 52} {"train_loss": -5.586365699768066, "global_step": 8769, "epoch": 52} {"train_loss": -5.767596244812012, "global_step": 8770, "epoch": 52} {"train_loss": -5.764937877655029, "global_step": 8771, "epoch": 52} {"train_loss": -5.84405517578125, "global_step": 8772, "epoch": 52} {"train_loss": -5.487431526184082, "global_step": 8773, "epoch": 52} {"train_loss": -5.552543640136719, "global_step": 8774, "epoch": 52} {"train_loss": -5.828461647033691, "global_step": 8775, "epoch": 52} {"train_loss": -5.820866584777832, "global_step": 8776, "epoch": 52} {"train_loss": -5.473438739776611, "global_step": 8777, "epoch": 52} {"train_loss": -5.395525932312012, "global_step": 8778, "epoch": 52} {"train_loss": -5.505583763122559, "global_step": 8779, "epoch": 52} {"train_loss": -5.762752056121826, "global_step": 8780, "epoch": 52} {"train_loss": -5.359915733337402, "global_step": 8781, "epoch": 52} {"train_loss": -5.555028915405273, "global_step": 8782, "epoch": 52} {"train_loss": -5.525630950927734, "global_step": 8783, "epoch": 52} {"train_loss": -5.689243793487549, "global_step": 8784, "epoch": 52} {"train_loss": -5.712770938873291, "global_step": 8785, "epoch": 52} {"train_loss": -5.901319980621338, "global_step": 8786, "epoch": 52} {"train_loss": -5.747939586639404, "global_step": 8787, "epoch": 52} {"train_loss": -5.714578628540039, "global_step": 8788, "epoch": 52} {"train_loss": -5.651005268096924, "global_step": 8789, "epoch": 52} {"train_loss": -5.596505165100098, "global_step": 8790, "epoch": 52} {"train_loss": -5.727858543395996, "global_step": 8791, "epoch": 52} {"train_loss": -5.445464611053467, "global_step": 8792, "epoch": 52} {"train_loss": -5.773758411407471, "global_step": 8793, "epoch": 52} {"train_loss": -5.412081718444824, "global_step": 8794, "epoch": 52} {"train_loss": -5.7397379875183105, "global_step": 8795, "epoch": 52} {"train_loss": -5.6806230545043945, "global_step": 8796, "epoch": 52} {"train_loss": -5.680954933166504, "global_step": 8797, "epoch": 52} {"train_loss": -5.667975902557373, "global_step": 8798, "epoch": 52} {"train_loss": -5.582213401794434, "global_step": 8799, "epoch": 52} {"train_loss": -5.720217227935791, "global_step": 8800, "epoch": 52} {"train_loss": -5.6522111892700195, "global_step": 8801, "epoch": 52} {"train_loss": -5.750387191772461, "global_step": 8802, "epoch": 52} {"train_loss": -5.604904651641846, "global_step": 8803, "epoch": 52} {"train_loss": -5.837515830993652, "global_step": 8804, "epoch": 52} {"train_loss": -5.307085990905762, "global_step": 8805, "epoch": 52} {"train_loss": -5.524750709533691, "global_step": 8806, "epoch": 52} {"train_loss": -5.639148712158203, "global_step": 8807, "epoch": 52} {"train_loss": -5.67559814453125, "global_step": 8808, "epoch": 52} {"train_loss": -5.635516166687012, "global_step": 8809, "epoch": 52} {"train_loss": -5.681136131286621, "global_step": 8810, "epoch": 52} {"train_loss": -5.54929256439209, "global_step": 8811, "epoch": 52} {"train_loss": -5.720664978027344, "global_step": 8812, "epoch": 52} {"train_loss": -5.597819805145264, "global_step": 8813, "epoch": 52} {"train_loss": -5.438492774963379, "global_step": 8814, "epoch": 52} {"train_loss": -5.623673915863037, "global_step": 8815, "epoch": 52} {"train_loss": -5.548800945281982, "global_step": 8816, "epoch": 52} {"train_loss": -5.7078680992126465, "global_step": 8817, "epoch": 52} {"train_loss": -5.611241340637207, "global_step": 8818, "epoch": 52} {"train_loss": -5.460556983947754, "global_step": 8819, "epoch": 52} {"train_loss": -5.7322821617126465, "global_step": 8820, "epoch": 52} {"train_loss": -5.819409370422363, "global_step": 8821, "epoch": 52} {"train_loss": -5.376038551330566, "global_step": 8822, "epoch": 52} {"train_loss": -5.516224384307861, "global_step": 8823, "epoch": 52} {"train_loss": -5.573464870452881, "global_step": 8824, "epoch": 52} {"train_loss": -5.382590293884277, "global_step": 8825, "epoch": 52} {"train_loss": -5.80567741394043, "global_step": 8826, "epoch": 52} {"train_loss": -5.565777778625488, "global_step": 8827, "epoch": 52} {"train_loss": -5.49167537689209, "global_step": 8828, "epoch": 52} {"train_loss": -5.3507399559021, "global_step": 8829, "epoch": 52} {"train_loss": -5.437849998474121, "global_step": 8830, "epoch": 52} {"train_loss": -5.606369972229004, "global_step": 8831, "epoch": 52} {"train_loss": -5.557833671569824, "global_step": 8832, "epoch": 52} {"train_loss": -5.507722854614258, "global_step": 8833, "epoch": 52} {"train_loss": -5.513899803161621, "global_step": 8834, "epoch": 52} {"train_loss": -5.649293899536133, "global_step": 8835, "epoch": 52} {"train_loss": -5.515905857086182, "global_step": 8836, "epoch": 52} {"train_loss": -5.689993858337402, "global_step": 8837, "epoch": 52} {"train_loss": -5.492047309875488, "global_step": 8838, "epoch": 52} {"train_loss": -5.824146747589111, "global_step": 8839, "epoch": 52} {"train_loss": -5.4344940185546875, "global_step": 8840, "epoch": 52} {"train_loss": -5.4252166748046875, "global_step": 8841, "epoch": 52} {"train_loss": -5.649456024169922, "global_step": 8842, "epoch": 52} {"train_loss": -5.667595386505127, "global_step": 8843, "epoch": 52} {"train_loss": -5.459410190582275, "global_step": 8844, "epoch": 52} {"train_loss": -5.434963226318359, "global_step": 8845, "epoch": 52} {"train_loss": -5.511833667755127, "global_step": 8846, "epoch": 52} {"train_loss": -5.552124500274658, "global_step": 8847, "epoch": 52} {"train_loss": -5.6616363525390625, "global_step": 8848, "epoch": 52} {"train_loss": -5.514995574951172, "global_step": 8849, "epoch": 52} {"train_loss": -5.899747848510742, "global_step": 8850, "epoch": 52} {"train_loss": -5.517399311065674, "global_step": 8851, "epoch": 52} {"train_loss": -5.451866626739502, "global_step": 8852, "epoch": 52} {"train_loss": -5.538640975952148, "global_step": 8853, "epoch": 52} {"train_loss": -5.4266228675842285, "global_step": 8854, "epoch": 52} {"train_loss": -5.504085063934326, "global_step": 8855, "epoch": 52} {"train_loss": -5.290379524230957, "global_step": 8856, "epoch": 52} {"train_loss": -5.521679401397705, "global_step": 8857, "epoch": 52} {"train_loss": -5.671557426452637, "global_step": 8858, "epoch": 52} {"train_loss": -5.541622161865234, "global_step": 8859, "epoch": 52} {"train_loss": -5.6934685707092285, "global_step": 8860, "epoch": 52} {"train_loss": -5.501755714416504, "global_step": 8861, "epoch": 52} {"train_loss": -5.420223712921143, "global_step": 8862, "epoch": 52} {"train_loss": -5.891636848449707, "global_step": 8863, "epoch": 52} {"train_loss": -5.577262878417969, "global_step": 8864, "epoch": 52} {"train_loss": -5.554666042327881, "global_step": 8865, "epoch": 52} {"train_loss": -5.538959980010986, "global_step": 8866, "epoch": 52} {"train_loss": -5.797564506530762, "global_step": 8867, "epoch": 52} {"train_loss": -5.498488426208496, "global_step": 8868, "epoch": 52} {"train_loss": -5.559109687805176, "global_step": 8869, "epoch": 52} {"train_loss": -5.683861255645752, "global_step": 8870, "epoch": 52} {"train_loss": -5.618768692016602, "global_step": 8871, "epoch": 52} {"train_loss": -5.498252868652344, "global_step": 8872, "epoch": 52} {"train_loss": -5.73105525970459, "global_step": 8873, "epoch": 52} {"train_loss": -6.060283184051514, "global_step": 8874, "epoch": 52} {"train_loss": -5.671195030212402, "global_step": 8875, "epoch": 52} {"train_loss": -5.910592555999756, "global_step": 8876, "epoch": 52} {"train_loss": -5.346184730529785, "global_step": 8877, "epoch": 52} {"train_loss": -5.661558628082275, "global_step": 8878, "epoch": 52} {"train_loss": -5.6699538230896, "global_step": 8879, "epoch": 52} {"train_loss": -5.653231620788574, "global_step": 8880, "epoch": 52} {"train_loss": -5.827707290649414, "global_step": 8881, "epoch": 52} {"train_loss": -5.796261310577393, "global_step": 8882, "epoch": 52} {"train_loss": -5.767216682434082, "global_step": 8883, "epoch": 52} {"train_loss": -5.649641513824463, "global_step": 8884, "epoch": 52} {"train_loss": -5.939888954162598, "global_step": 8885, "epoch": 52} {"train_loss": -5.742763519287109, "global_step": 8886, "epoch": 52} {"train_loss": -5.543356895446777, "global_step": 8887, "epoch": 52} {"train_loss": -5.597466945648193, "global_step": 8888, "epoch": 52} {"train_loss": -5.724382400512695, "global_step": 8889, "epoch": 52} {"train_loss": -5.792877197265625, "global_step": 8890, "epoch": 52} {"train_loss": -5.747818470001221, "global_step": 8891, "epoch": 52} {"train_loss": -5.881383895874023, "global_step": 8892, "epoch": 52} {"train_loss": -5.502964973449707, "global_step": 8893, "epoch": 52} {"train_loss": -5.971935272216797, "global_step": 8894, "epoch": 52} {"train_loss": -5.521299839019775, "global_step": 8895, "epoch": 52} {"train_loss": -5.594521522521973, "global_step": 8896, "epoch": 52} {"train_loss": -5.6334075927734375, "global_step": 8897, "epoch": 52} {"train_loss": -5.535562515258789, "global_step": 8898, "epoch": 52} {"train_loss": -5.337864398956299, "global_step": 8899, "epoch": 52} {"train_loss": -5.800390243530273, "global_step": 8900, "epoch": 52} {"train_loss": -5.478996753692627, "global_step": 8901, "epoch": 52} {"train_loss": -5.6622633934021, "global_step": 8902, "epoch": 52} {"train_loss": -5.626816882973626, "global_step": 8903, "epoch": 52, "val_loss": 276374.25} {"train_loss": -5.646327495574951, "global_step": 8904, "epoch": 53} {"train_loss": -5.705408573150635, "global_step": 8905, "epoch": 53} {"train_loss": -5.679474830627441, "global_step": 8906, "epoch": 53} {"train_loss": -5.371132850646973, "global_step": 8907, "epoch": 53} {"train_loss": -5.61238956451416, "global_step": 8908, "epoch": 53} {"train_loss": -5.43914794921875, "global_step": 8909, "epoch": 53} {"train_loss": -5.747735023498535, "global_step": 8910, "epoch": 53} {"train_loss": -5.492892265319824, "global_step": 8911, "epoch": 53} {"train_loss": -5.4857659339904785, "global_step": 8912, "epoch": 53} {"train_loss": -5.650007724761963, "global_step": 8913, "epoch": 53} {"train_loss": -5.810755729675293, "global_step": 8914, "epoch": 53} {"train_loss": -5.67196798324585, "global_step": 8915, "epoch": 53} {"train_loss": -5.7178192138671875, "global_step": 8916, "epoch": 53} {"train_loss": -5.580317974090576, "global_step": 8917, "epoch": 53} {"train_loss": -5.641995429992676, "global_step": 8918, "epoch": 53} {"train_loss": -5.705728530883789, "global_step": 8919, "epoch": 53} {"train_loss": -5.881796836853027, "global_step": 8920, "epoch": 53} {"train_loss": -5.445342540740967, "global_step": 8921, "epoch": 53} {"train_loss": -5.572891712188721, "global_step": 8922, "epoch": 53} {"train_loss": -5.619174003601074, "global_step": 8923, "epoch": 53} {"train_loss": -5.683537483215332, "global_step": 8924, "epoch": 53} {"train_loss": -5.53125, "global_step": 8925, "epoch": 53} {"train_loss": -5.627962589263916, "global_step": 8926, "epoch": 53} {"train_loss": -5.657593250274658, "global_step": 8927, "epoch": 53} {"train_loss": -5.395938873291016, "global_step": 8928, "epoch": 53} {"train_loss": -5.710997581481934, "global_step": 8929, "epoch": 53} {"train_loss": -5.239723205566406, "global_step": 8930, "epoch": 53} {"train_loss": -5.72174072265625, "global_step": 8931, "epoch": 53} {"train_loss": -5.563161849975586, "global_step": 8932, "epoch": 53} {"train_loss": -5.493993282318115, "global_step": 8933, "epoch": 53} {"train_loss": -5.570453643798828, "global_step": 8934, "epoch": 53} {"train_loss": -5.443489074707031, "global_step": 8935, "epoch": 53} {"train_loss": -5.788050651550293, "global_step": 8936, "epoch": 53} {"train_loss": -5.708229064941406, "global_step": 8937, "epoch": 53} {"train_loss": -5.612756729125977, "global_step": 8938, "epoch": 53} {"train_loss": -5.754627227783203, "global_step": 8939, "epoch": 53} {"train_loss": -5.514671325683594, "global_step": 8940, "epoch": 53} {"train_loss": -5.708468437194824, "global_step": 8941, "epoch": 53} {"train_loss": -5.884435653686523, "global_step": 8942, "epoch": 53} {"train_loss": -5.709598064422607, "global_step": 8943, "epoch": 53} {"train_loss": -5.838565826416016, "global_step": 8944, "epoch": 53} {"train_loss": -5.605717182159424, "global_step": 8945, "epoch": 53} {"train_loss": -5.691054344177246, "global_step": 8946, "epoch": 53} {"train_loss": -5.579522132873535, "global_step": 8947, "epoch": 53} {"train_loss": -5.667989253997803, "global_step": 8948, "epoch": 53} {"train_loss": -5.757189750671387, "global_step": 8949, "epoch": 53} {"train_loss": -5.517574310302734, "global_step": 8950, "epoch": 53} {"train_loss": -5.652793884277344, "global_step": 8951, "epoch": 53} {"train_loss": -5.578941345214844, "global_step": 8952, "epoch": 53} {"train_loss": -5.735330104827881, "global_step": 8953, "epoch": 53} {"train_loss": -5.353326797485352, "global_step": 8954, "epoch": 53} {"train_loss": -5.63179874420166, "global_step": 8955, "epoch": 53} {"train_loss": -5.792717456817627, "global_step": 8956, "epoch": 53} {"train_loss": -5.4135637283325195, "global_step": 8957, "epoch": 53} {"train_loss": -5.556355953216553, "global_step": 8958, "epoch": 53} {"train_loss": -5.7423624992370605, "global_step": 8959, "epoch": 53} {"train_loss": -5.561661720275879, "global_step": 8960, "epoch": 53} {"train_loss": -5.598106384277344, "global_step": 8961, "epoch": 53} {"train_loss": -5.735340595245361, "global_step": 8962, "epoch": 53} {"train_loss": -5.448421478271484, "global_step": 8963, "epoch": 53} {"train_loss": -5.628574371337891, "global_step": 8964, "epoch": 53} {"train_loss": -5.395680904388428, "global_step": 8965, "epoch": 53} {"train_loss": -5.550463676452637, "global_step": 8966, "epoch": 53} {"train_loss": -5.523797035217285, "global_step": 8967, "epoch": 53} {"train_loss": -5.449235916137695, "global_step": 8968, "epoch": 53} {"train_loss": -5.599084854125977, "global_step": 8969, "epoch": 53} {"train_loss": -5.604142189025879, "global_step": 8970, "epoch": 53} {"train_loss": -5.608263969421387, "global_step": 8971, "epoch": 53} {"train_loss": -5.381656646728516, "global_step": 8972, "epoch": 53} {"train_loss": -5.727758407592773, "global_step": 8973, "epoch": 53} {"train_loss": -5.738043785095215, "global_step": 8974, "epoch": 53} {"train_loss": -5.576857566833496, "global_step": 8975, "epoch": 53} {"train_loss": -5.637486457824707, "global_step": 8976, "epoch": 53} {"train_loss": -5.616559028625488, "global_step": 8977, "epoch": 53} {"train_loss": -5.498701095581055, "global_step": 8978, "epoch": 53} {"train_loss": -5.800703525543213, "global_step": 8979, "epoch": 53} {"train_loss": -5.784552574157715, "global_step": 8980, "epoch": 53} {"train_loss": -5.821048736572266, "global_step": 8981, "epoch": 53} {"train_loss": -5.778476238250732, "global_step": 8982, "epoch": 53} {"train_loss": -5.683774948120117, "global_step": 8983, "epoch": 53} {"train_loss": -5.811676979064941, "global_step": 8984, "epoch": 53} {"train_loss": -5.467654228210449, "global_step": 8985, "epoch": 53} {"train_loss": -5.710262298583984, "global_step": 8986, "epoch": 53} {"train_loss": -5.493345260620117, "global_step": 8987, "epoch": 53} {"train_loss": -5.720181465148926, "global_step": 8988, "epoch": 53} {"train_loss": -5.793739318847656, "global_step": 8989, "epoch": 53} {"train_loss": -5.881622314453125, "global_step": 8990, "epoch": 53} {"train_loss": -5.431735992431641, "global_step": 8991, "epoch": 53} {"train_loss": -5.845794200897217, "global_step": 8992, "epoch": 53} {"train_loss": -5.6001105308532715, "global_step": 8993, "epoch": 53} {"train_loss": -5.668603897094727, "global_step": 8994, "epoch": 53} {"train_loss": -5.58558988571167, "global_step": 8995, "epoch": 53} {"train_loss": -5.7033162117004395, "global_step": 8996, "epoch": 53} {"train_loss": -5.393256664276123, "global_step": 8997, "epoch": 53} {"train_loss": -5.62967586517334, "global_step": 8998, "epoch": 53} {"train_loss": -5.698422431945801, "global_step": 8999, "epoch": 53} {"train_loss": -5.409150123596191, "global_step": 9000, "epoch": 53} {"train_loss": -5.653426170349121, "global_step": 9001, "epoch": 53} {"train_loss": -5.457143783569336, "global_step": 9002, "epoch": 53} {"train_loss": -5.448317527770996, "global_step": 9003, "epoch": 53} {"train_loss": -5.821502685546875, "global_step": 9004, "epoch": 53} {"train_loss": -5.187759876251221, "global_step": 9005, "epoch": 53} {"train_loss": -5.547625541687012, "global_step": 9006, "epoch": 53} {"train_loss": -5.614394187927246, "global_step": 9007, "epoch": 53} {"train_loss": -5.592748641967773, "global_step": 9008, "epoch": 53} {"train_loss": -5.817312717437744, "global_step": 9009, "epoch": 53} {"train_loss": -5.417015075683594, "global_step": 9010, "epoch": 53} {"train_loss": -5.626457214355469, "global_step": 9011, "epoch": 53} {"train_loss": -5.823428630828857, "global_step": 9012, "epoch": 53} {"train_loss": -5.681486129760742, "global_step": 9013, "epoch": 53} {"train_loss": -5.736876010894775, "global_step": 9014, "epoch": 53} {"train_loss": -5.760078430175781, "global_step": 9015, "epoch": 53} {"train_loss": -5.751889228820801, "global_step": 9016, "epoch": 53} {"train_loss": -5.812002658843994, "global_step": 9017, "epoch": 53} {"train_loss": -5.422154903411865, "global_step": 9018, "epoch": 53} {"train_loss": -5.793170928955078, "global_step": 9019, "epoch": 53} {"train_loss": -5.747283935546875, "global_step": 9020, "epoch": 53} {"train_loss": -5.715109825134277, "global_step": 9021, "epoch": 53} {"train_loss": -5.766925811767578, "global_step": 9022, "epoch": 53} {"train_loss": -5.769580841064453, "global_step": 9023, "epoch": 53} {"train_loss": -5.716606616973877, "global_step": 9024, "epoch": 53} {"train_loss": -5.66239070892334, "global_step": 9025, "epoch": 53} {"train_loss": -5.278143882751465, "global_step": 9026, "epoch": 53} {"train_loss": -5.471109390258789, "global_step": 9027, "epoch": 53} {"train_loss": -5.319122314453125, "global_step": 9028, "epoch": 53} {"train_loss": -5.583218574523926, "global_step": 9029, "epoch": 53} {"train_loss": -5.383275985717773, "global_step": 9030, "epoch": 53} {"train_loss": -5.502643585205078, "global_step": 9031, "epoch": 53} {"train_loss": -5.761301040649414, "global_step": 9032, "epoch": 53} {"train_loss": -5.477304935455322, "global_step": 9033, "epoch": 53} {"train_loss": -5.441772937774658, "global_step": 9034, "epoch": 53} {"train_loss": -5.652911186218262, "global_step": 9035, "epoch": 53} {"train_loss": -5.498356819152832, "global_step": 9036, "epoch": 53} {"train_loss": -5.735866069793701, "global_step": 9037, "epoch": 53} {"train_loss": -5.8628458976745605, "global_step": 9038, "epoch": 53} {"train_loss": -5.600114822387695, "global_step": 9039, "epoch": 53} {"train_loss": -5.611796855926514, "global_step": 9040, "epoch": 53} {"train_loss": -5.700013160705566, "global_step": 9041, "epoch": 53} {"train_loss": -5.543272018432617, "global_step": 9042, "epoch": 53} {"train_loss": -5.825778007507324, "global_step": 9043, "epoch": 53} {"train_loss": -5.646568298339844, "global_step": 9044, "epoch": 53} {"train_loss": -5.557361125946045, "global_step": 9045, "epoch": 53} {"train_loss": -5.899845600128174, "global_step": 9046, "epoch": 53} {"train_loss": -5.938229560852051, "global_step": 9047, "epoch": 53} {"train_loss": -5.704060077667236, "global_step": 9048, "epoch": 53} {"train_loss": -5.553791522979736, "global_step": 9049, "epoch": 53} {"train_loss": -5.769672393798828, "global_step": 9050, "epoch": 53} {"train_loss": -5.803159713745117, "global_step": 9051, "epoch": 53} {"train_loss": -5.815921306610107, "global_step": 9052, "epoch": 53} {"train_loss": -5.6282196044921875, "global_step": 9053, "epoch": 53} {"train_loss": -5.815472602844238, "global_step": 9054, "epoch": 53} {"train_loss": -5.405394554138184, "global_step": 9055, "epoch": 53} {"train_loss": -5.819399833679199, "global_step": 9056, "epoch": 53} {"train_loss": -5.6305365562438965, "global_step": 9057, "epoch": 53} {"train_loss": -5.628195762634277, "global_step": 9058, "epoch": 53} {"train_loss": -5.186951160430908, "global_step": 9059, "epoch": 53} {"train_loss": -5.514096260070801, "global_step": 9060, "epoch": 53} {"train_loss": -5.549736976623535, "global_step": 9061, "epoch": 53} {"train_loss": -5.806650638580322, "global_step": 9062, "epoch": 53} {"train_loss": -5.595550537109375, "global_step": 9063, "epoch": 53} {"train_loss": -5.538856029510498, "global_step": 9064, "epoch": 53} {"train_loss": -5.491670608520508, "global_step": 9065, "epoch": 53} {"train_loss": -5.441817283630371, "global_step": 9066, "epoch": 53} {"train_loss": -5.658289909362793, "global_step": 9067, "epoch": 53} {"train_loss": -5.228209972381592, "global_step": 9068, "epoch": 53} {"train_loss": -5.741409778594971, "global_step": 9069, "epoch": 53} {"train_loss": -5.613234519958496, "global_step": 9070, "epoch": 53} {"train_loss": -5.6215346938087825, "global_step": 9071, "epoch": 53, "val_loss": 269551.96875} {"train_loss": -5.497856140136719, "global_step": 9072, "epoch": 54} {"train_loss": -5.443115234375, "global_step": 9073, "epoch": 54} {"train_loss": -5.687409400939941, "global_step": 9074, "epoch": 54} {"train_loss": -5.721076011657715, "global_step": 9075, "epoch": 54} {"train_loss": -5.558442115783691, "global_step": 9076, "epoch": 54} {"train_loss": -5.680251598358154, "global_step": 9077, "epoch": 54} {"train_loss": -5.621943473815918, "global_step": 9078, "epoch": 54} {"train_loss": -5.427847862243652, "global_step": 9079, "epoch": 54} {"train_loss": -5.713078498840332, "global_step": 9080, "epoch": 54} {"train_loss": -5.620881080627441, "global_step": 9081, "epoch": 54} {"train_loss": -5.2216997146606445, "global_step": 9082, "epoch": 54} {"train_loss": -5.580056667327881, "global_step": 9083, "epoch": 54} {"train_loss": -5.354311943054199, "global_step": 9084, "epoch": 54} {"train_loss": -5.5290913581848145, "global_step": 9085, "epoch": 54} {"train_loss": -5.8220930099487305, "global_step": 9086, "epoch": 54} {"train_loss": -5.193785190582275, "global_step": 9087, "epoch": 54} {"train_loss": -5.517989158630371, "global_step": 9088, "epoch": 54} {"train_loss": -5.50577449798584, "global_step": 9089, "epoch": 54} {"train_loss": -5.3615946769714355, "global_step": 9090, "epoch": 54} {"train_loss": -5.613677978515625, "global_step": 9091, "epoch": 54} {"train_loss": -5.399197578430176, "global_step": 9092, "epoch": 54} {"train_loss": -5.186230659484863, "global_step": 9093, "epoch": 54} {"train_loss": -5.769198417663574, "global_step": 9094, "epoch": 54} {"train_loss": -5.469244003295898, "global_step": 9095, "epoch": 54} {"train_loss": -5.256743431091309, "global_step": 9096, "epoch": 54} {"train_loss": -5.496665000915527, "global_step": 9097, "epoch": 54} {"train_loss": -5.491544723510742, "global_step": 9098, "epoch": 54} {"train_loss": -5.741028308868408, "global_step": 9099, "epoch": 54} {"train_loss": -5.582210063934326, "global_step": 9100, "epoch": 54} {"train_loss": -5.786721229553223, "global_step": 9101, "epoch": 54} {"train_loss": -5.642228603363037, "global_step": 9102, "epoch": 54} {"train_loss": -5.634766578674316, "global_step": 9103, "epoch": 54} {"train_loss": -5.676969528198242, "global_step": 9104, "epoch": 54} {"train_loss": -5.910067558288574, "global_step": 9105, "epoch": 54} {"train_loss": -5.898734092712402, "global_step": 9106, "epoch": 54} {"train_loss": -5.53421688079834, "global_step": 9107, "epoch": 54} {"train_loss": -5.819607734680176, "global_step": 9108, "epoch": 54} {"train_loss": -5.826412200927734, "global_step": 9109, "epoch": 54} {"train_loss": -5.947664260864258, "global_step": 9110, "epoch": 54} {"train_loss": -5.738325119018555, "global_step": 9111, "epoch": 54} {"train_loss": -5.704902172088623, "global_step": 9112, "epoch": 54} {"train_loss": -5.676633834838867, "global_step": 9113, "epoch": 54} {"train_loss": -5.684612274169922, "global_step": 9114, "epoch": 54} {"train_loss": -5.79319953918457, "global_step": 9115, "epoch": 54} {"train_loss": -5.9467034339904785, "global_step": 9116, "epoch": 54} {"train_loss": -5.71185827255249, "global_step": 9117, "epoch": 54} {"train_loss": -5.572126388549805, "global_step": 9118, "epoch": 54} {"train_loss": -5.840996742248535, "global_step": 9119, "epoch": 54} {"train_loss": -5.447148323059082, "global_step": 9120, "epoch": 54} {"train_loss": -5.5946807861328125, "global_step": 9121, "epoch": 54} {"train_loss": -5.852076530456543, "global_step": 9122, "epoch": 54} {"train_loss": -5.500516891479492, "global_step": 9123, "epoch": 54} {"train_loss": -5.757659912109375, "global_step": 9124, "epoch": 54} {"train_loss": -5.5411529541015625, "global_step": 9125, "epoch": 54} {"train_loss": -5.98976993560791, "global_step": 9126, "epoch": 54} {"train_loss": -5.676849365234375, "global_step": 9127, "epoch": 54} {"train_loss": -5.744525909423828, "global_step": 9128, "epoch": 54} {"train_loss": -5.604940414428711, "global_step": 9129, "epoch": 54} {"train_loss": -5.141447067260742, "global_step": 9130, "epoch": 54} {"train_loss": -5.326125144958496, "global_step": 9131, "epoch": 54} {"train_loss": -5.685955047607422, "global_step": 9132, "epoch": 54} {"train_loss": -5.680870056152344, "global_step": 9133, "epoch": 54} {"train_loss": -5.721990585327148, "global_step": 9134, "epoch": 54} {"train_loss": -5.655069351196289, "global_step": 9135, "epoch": 54} {"train_loss": -5.506068229675293, "global_step": 9136, "epoch": 54} {"train_loss": -5.654735565185547, "global_step": 9137, "epoch": 54} {"train_loss": -5.668511390686035, "global_step": 9138, "epoch": 54} {"train_loss": -5.640810966491699, "global_step": 9139, "epoch": 54} {"train_loss": -5.986913681030273, "global_step": 9140, "epoch": 54} {"train_loss": -5.846774101257324, "global_step": 9141, "epoch": 54} {"train_loss": -5.750116348266602, "global_step": 9142, "epoch": 54} {"train_loss": -5.963274955749512, "global_step": 9143, "epoch": 54} {"train_loss": -5.541322231292725, "global_step": 9144, "epoch": 54} {"train_loss": -5.742453098297119, "global_step": 9145, "epoch": 54} {"train_loss": -5.683537483215332, "global_step": 9146, "epoch": 54} {"train_loss": -5.527726173400879, "global_step": 9147, "epoch": 54} {"train_loss": -5.602622032165527, "global_step": 9148, "epoch": 54} {"train_loss": -5.541637420654297, "global_step": 9149, "epoch": 54} {"train_loss": -5.8303751945495605, "global_step": 9150, "epoch": 54} {"train_loss": -5.464450359344482, "global_step": 9151, "epoch": 54} {"train_loss": -5.754619598388672, "global_step": 9152, "epoch": 54} {"train_loss": -5.665887832641602, "global_step": 9153, "epoch": 54} {"train_loss": -5.415717124938965, "global_step": 9154, "epoch": 54} {"train_loss": -5.539374351501465, "global_step": 9155, "epoch": 54} {"train_loss": -5.755372047424316, "global_step": 9156, "epoch": 54} {"train_loss": -5.6700897216796875, "global_step": 9157, "epoch": 54} {"train_loss": -5.581483840942383, "global_step": 9158, "epoch": 54} {"train_loss": -5.8745269775390625, "global_step": 9159, "epoch": 54} {"train_loss": -5.492646217346191, "global_step": 9160, "epoch": 54} {"train_loss": -5.622845649719238, "global_step": 9161, "epoch": 54} {"train_loss": -5.843055248260498, "global_step": 9162, "epoch": 54} {"train_loss": -5.646986961364746, "global_step": 9163, "epoch": 54} {"train_loss": -5.9132914543151855, "global_step": 9164, "epoch": 54} {"train_loss": -5.904745101928711, "global_step": 9165, "epoch": 54} {"train_loss": -5.6640944480896, "global_step": 9166, "epoch": 54} {"train_loss": -5.784372329711914, "global_step": 9167, "epoch": 54} {"train_loss": -5.578036308288574, "global_step": 9168, "epoch": 54} {"train_loss": -5.516429901123047, "global_step": 9169, "epoch": 54} {"train_loss": -5.85274076461792, "global_step": 9170, "epoch": 54} {"train_loss": -5.817342758178711, "global_step": 9171, "epoch": 54} {"train_loss": -5.92167854309082, "global_step": 9172, "epoch": 54} {"train_loss": -5.96083402633667, "global_step": 9173, "epoch": 54} {"train_loss": -5.877066612243652, "global_step": 9174, "epoch": 54} {"train_loss": -5.604497909545898, "global_step": 9175, "epoch": 54} {"train_loss": -5.3763885498046875, "global_step": 9176, "epoch": 54} {"train_loss": -5.72768497467041, "global_step": 9177, "epoch": 54} {"train_loss": -5.321608543395996, "global_step": 9178, "epoch": 54} {"train_loss": -5.515546798706055, "global_step": 9179, "epoch": 54} {"train_loss": -5.6423845291137695, "global_step": 9180, "epoch": 54} {"train_loss": -5.377647399902344, "global_step": 9181, "epoch": 54} {"train_loss": -5.63375186920166, "global_step": 9182, "epoch": 54} {"train_loss": -5.429293632507324, "global_step": 9183, "epoch": 54} {"train_loss": -5.54337215423584, "global_step": 9184, "epoch": 54} {"train_loss": -5.369828224182129, "global_step": 9185, "epoch": 54} {"train_loss": -5.562519550323486, "global_step": 9186, "epoch": 54} {"train_loss": -5.613396167755127, "global_step": 9187, "epoch": 54} {"train_loss": -5.653121471405029, "global_step": 9188, "epoch": 54} {"train_loss": -5.601583957672119, "global_step": 9189, "epoch": 54} {"train_loss": -5.771167755126953, "global_step": 9190, "epoch": 54} {"train_loss": -5.706298828125, "global_step": 9191, "epoch": 54} {"train_loss": -5.704825401306152, "global_step": 9192, "epoch": 54} {"train_loss": -5.810694694519043, "global_step": 9193, "epoch": 54} {"train_loss": -5.547009468078613, "global_step": 9194, "epoch": 54} {"train_loss": -5.706032752990723, "global_step": 9195, "epoch": 54} {"train_loss": -5.57261848449707, "global_step": 9196, "epoch": 54} {"train_loss": -5.398187637329102, "global_step": 9197, "epoch": 54} {"train_loss": -5.552592754364014, "global_step": 9198, "epoch": 54} {"train_loss": -5.407707691192627, "global_step": 9199, "epoch": 54} {"train_loss": -5.7282609939575195, "global_step": 9200, "epoch": 54} {"train_loss": -5.869348526000977, "global_step": 9201, "epoch": 54} {"train_loss": -5.646490097045898, "global_step": 9202, "epoch": 54} {"train_loss": -5.665502548217773, "global_step": 9203, "epoch": 54} {"train_loss": -5.6319122314453125, "global_step": 9204, "epoch": 54} {"train_loss": -5.806377410888672, "global_step": 9205, "epoch": 54} {"train_loss": -5.817695617675781, "global_step": 9206, "epoch": 54} {"train_loss": -5.420284271240234, "global_step": 9207, "epoch": 54} {"train_loss": -5.59013032913208, "global_step": 9208, "epoch": 54} {"train_loss": -5.7627716064453125, "global_step": 9209, "epoch": 54} {"train_loss": -5.497615814208984, "global_step": 9210, "epoch": 54} {"train_loss": -5.866584300994873, "global_step": 9211, "epoch": 54} {"train_loss": -5.777679920196533, "global_step": 9212, "epoch": 54} {"train_loss": -5.812066078186035, "global_step": 9213, "epoch": 54} {"train_loss": -5.47160530090332, "global_step": 9214, "epoch": 54} {"train_loss": -5.844466686248779, "global_step": 9215, "epoch": 54} {"train_loss": -5.84012508392334, "global_step": 9216, "epoch": 54} {"train_loss": -5.601731777191162, "global_step": 9217, "epoch": 54} {"train_loss": -5.68412971496582, "global_step": 9218, "epoch": 54} {"train_loss": -5.77738094329834, "global_step": 9219, "epoch": 54} {"train_loss": -5.559010028839111, "global_step": 9220, "epoch": 54} {"train_loss": -5.6853108406066895, "global_step": 9221, "epoch": 54} {"train_loss": -5.471789360046387, "global_step": 9222, "epoch": 54} {"train_loss": -5.372039794921875, "global_step": 9223, "epoch": 54} {"train_loss": -5.45421838760376, "global_step": 9224, "epoch": 54} {"train_loss": -5.621870040893555, "global_step": 9225, "epoch": 54} {"train_loss": -5.724331855773926, "global_step": 9226, "epoch": 54} {"train_loss": -5.592853546142578, "global_step": 9227, "epoch": 54} {"train_loss": -5.669485092163086, "global_step": 9228, "epoch": 54} {"train_loss": -5.497793197631836, "global_step": 9229, "epoch": 54} {"train_loss": -5.851950645446777, "global_step": 9230, "epoch": 54} {"train_loss": -5.6404924392700195, "global_step": 9231, "epoch": 54} {"train_loss": -5.653412818908691, "global_step": 9232, "epoch": 54} {"train_loss": -5.602919578552246, "global_step": 9233, "epoch": 54} {"train_loss": -5.509947776794434, "global_step": 9234, "epoch": 54} {"train_loss": -5.4476118087768555, "global_step": 9235, "epoch": 54} {"train_loss": -5.4503092765808105, "global_step": 9236, "epoch": 54} {"train_loss": -5.476472854614258, "global_step": 9237, "epoch": 54} {"train_loss": -6.033397197723389, "global_step": 9238, "epoch": 54} {"train_loss": -5.6382312547592885, "global_step": 9239, "epoch": 54, "val_loss": 260300.0} {"train_loss": -5.606760501861572, "global_step": 9240, "epoch": 55} {"train_loss": -5.222831726074219, "global_step": 9241, "epoch": 55} {"train_loss": -5.481358528137207, "global_step": 9242, "epoch": 55} {"train_loss": -5.612982749938965, "global_step": 9243, "epoch": 55} {"train_loss": -5.336911678314209, "global_step": 9244, "epoch": 55} {"train_loss": -5.466843605041504, "global_step": 9245, "epoch": 55} {"train_loss": -5.775064468383789, "global_step": 9246, "epoch": 55} {"train_loss": -5.4503278732299805, "global_step": 9247, "epoch": 55} {"train_loss": -5.618877410888672, "global_step": 9248, "epoch": 55} {"train_loss": -5.469076633453369, "global_step": 9249, "epoch": 55} {"train_loss": -5.683281898498535, "global_step": 9250, "epoch": 55} {"train_loss": -5.788554668426514, "global_step": 9251, "epoch": 55} {"train_loss": -5.698431968688965, "global_step": 9252, "epoch": 55} {"train_loss": -5.648834228515625, "global_step": 9253, "epoch": 55} {"train_loss": -5.612898826599121, "global_step": 9254, "epoch": 55} {"train_loss": -5.6704325675964355, "global_step": 9255, "epoch": 55} {"train_loss": -5.584794998168945, "global_step": 9256, "epoch": 55} {"train_loss": -5.62469482421875, "global_step": 9257, "epoch": 55} {"train_loss": -5.590609550476074, "global_step": 9258, "epoch": 55} {"train_loss": -5.824134826660156, "global_step": 9259, "epoch": 55} {"train_loss": -5.7624640464782715, "global_step": 9260, "epoch": 55} {"train_loss": -5.687892913818359, "global_step": 9261, "epoch": 55} {"train_loss": -5.479766368865967, "global_step": 9262, "epoch": 55} {"train_loss": -5.668201446533203, "global_step": 9263, "epoch": 55} {"train_loss": -5.615532875061035, "global_step": 9264, "epoch": 55} {"train_loss": -5.7295684814453125, "global_step": 9265, "epoch": 55} {"train_loss": -5.800503730773926, "global_step": 9266, "epoch": 55} {"train_loss": -5.577526569366455, "global_step": 9267, "epoch": 55} {"train_loss": -5.4347991943359375, "global_step": 9268, "epoch": 55} {"train_loss": -5.786349296569824, "global_step": 9269, "epoch": 55} {"train_loss": -5.6762919425964355, "global_step": 9270, "epoch": 55} {"train_loss": -5.618852138519287, "global_step": 9271, "epoch": 55} {"train_loss": -5.480360507965088, "global_step": 9272, "epoch": 55} {"train_loss": -5.52388334274292, "global_step": 9273, "epoch": 55} {"train_loss": -5.82563591003418, "global_step": 9274, "epoch": 55} {"train_loss": -5.64280366897583, "global_step": 9275, "epoch": 55} {"train_loss": -5.411828517913818, "global_step": 9276, "epoch": 55} {"train_loss": -5.455087661743164, "global_step": 9277, "epoch": 55} {"train_loss": -5.676102638244629, "global_step": 9278, "epoch": 55} {"train_loss": -5.641977310180664, "global_step": 9279, "epoch": 55} {"train_loss": -5.824771881103516, "global_step": 9280, "epoch": 55} {"train_loss": -5.704007148742676, "global_step": 9281, "epoch": 55} {"train_loss": -5.6823015213012695, "global_step": 9282, "epoch": 55} {"train_loss": -5.643237113952637, "global_step": 9283, "epoch": 55} {"train_loss": -5.66383171081543, "global_step": 9284, "epoch": 55} {"train_loss": -5.600627899169922, "global_step": 9285, "epoch": 55} {"train_loss": -5.478908538818359, "global_step": 9286, "epoch": 55} {"train_loss": -5.550540924072266, "global_step": 9287, "epoch": 55} {"train_loss": -5.744158744812012, "global_step": 9288, "epoch": 55} {"train_loss": -5.5857343673706055, "global_step": 9289, "epoch": 55} {"train_loss": -5.470184326171875, "global_step": 9290, "epoch": 55} {"train_loss": -5.872948169708252, "global_step": 9291, "epoch": 55} {"train_loss": -5.541072368621826, "global_step": 9292, "epoch": 55} {"train_loss": -5.842677116394043, "global_step": 9293, "epoch": 55} {"train_loss": -5.602657794952393, "global_step": 9294, "epoch": 55} {"train_loss": -5.762475490570068, "global_step": 9295, "epoch": 55} {"train_loss": -5.537777900695801, "global_step": 9296, "epoch": 55} {"train_loss": -5.615355014801025, "global_step": 9297, "epoch": 55} {"train_loss": -5.660967826843262, "global_step": 9298, "epoch": 55} {"train_loss": -5.824550628662109, "global_step": 9299, "epoch": 55} {"train_loss": -5.497411727905273, "global_step": 9300, "epoch": 55} {"train_loss": -5.720247745513916, "global_step": 9301, "epoch": 55} {"train_loss": -5.866870880126953, "global_step": 9302, "epoch": 55} {"train_loss": -5.940890312194824, "global_step": 9303, "epoch": 55} {"train_loss": -5.688116073608398, "global_step": 9304, "epoch": 55} {"train_loss": -5.72217321395874, "global_step": 9305, "epoch": 55} {"train_loss": -5.858456611633301, "global_step": 9306, "epoch": 55} {"train_loss": -5.629385948181152, "global_step": 9307, "epoch": 55} {"train_loss": -5.597975254058838, "global_step": 9308, "epoch": 55} {"train_loss": -5.897588729858398, "global_step": 9309, "epoch": 55} {"train_loss": -5.7260541915893555, "global_step": 9310, "epoch": 55} {"train_loss": -5.594526767730713, "global_step": 9311, "epoch": 55} {"train_loss": -5.514646053314209, "global_step": 9312, "epoch": 55} {"train_loss": -5.962909698486328, "global_step": 9313, "epoch": 55} {"train_loss": -5.661701202392578, "global_step": 9314, "epoch": 55} {"train_loss": -5.8111796379089355, "global_step": 9315, "epoch": 55} {"train_loss": -5.829464912414551, "global_step": 9316, "epoch": 55} {"train_loss": -5.5502777099609375, "global_step": 9317, "epoch": 55} {"train_loss": -5.590722560882568, "global_step": 9318, "epoch": 55} {"train_loss": -5.612123012542725, "global_step": 9319, "epoch": 55} {"train_loss": -5.632673740386963, "global_step": 9320, "epoch": 55} {"train_loss": -5.318145275115967, "global_step": 9321, "epoch": 55} {"train_loss": -5.392303466796875, "global_step": 9322, "epoch": 55} {"train_loss": -5.311217784881592, "global_step": 9323, "epoch": 55} {"train_loss": -5.84444522857666, "global_step": 9324, "epoch": 55} {"train_loss": -5.908257961273193, "global_step": 9325, "epoch": 55} {"train_loss": -5.617691993713379, "global_step": 9326, "epoch": 55} {"train_loss": -5.76151180267334, "global_step": 9327, "epoch": 55} {"train_loss": -5.823016166687012, "global_step": 9328, "epoch": 55} {"train_loss": -5.6782732009887695, "global_step": 9329, "epoch": 55} {"train_loss": -5.38361930847168, "global_step": 9330, "epoch": 55} {"train_loss": -5.790009498596191, "global_step": 9331, "epoch": 55} {"train_loss": -5.651304244995117, "global_step": 9332, "epoch": 55} {"train_loss": -5.715033531188965, "global_step": 9333, "epoch": 55} {"train_loss": -5.524618148803711, "global_step": 9334, "epoch": 55} {"train_loss": -5.685441017150879, "global_step": 9335, "epoch": 55} {"train_loss": -5.825658798217773, "global_step": 9336, "epoch": 55} {"train_loss": -5.164732933044434, "global_step": 9337, "epoch": 55} {"train_loss": -5.81442928314209, "global_step": 9338, "epoch": 55} {"train_loss": -5.424710273742676, "global_step": 9339, "epoch": 55} {"train_loss": -5.640602111816406, "global_step": 9340, "epoch": 55} {"train_loss": -5.8511810302734375, "global_step": 9341, "epoch": 55} {"train_loss": -5.714777946472168, "global_step": 9342, "epoch": 55} {"train_loss": -5.753643989562988, "global_step": 9343, "epoch": 55} {"train_loss": -5.819015979766846, "global_step": 9344, "epoch": 55} {"train_loss": -5.767291069030762, "global_step": 9345, "epoch": 55} {"train_loss": -5.680503845214844, "global_step": 9346, "epoch": 55} {"train_loss": -5.886768341064453, "global_step": 9347, "epoch": 55} {"train_loss": -5.767383575439453, "global_step": 9348, "epoch": 55} {"train_loss": -5.975880146026611, "global_step": 9349, "epoch": 55} {"train_loss": -5.502635955810547, "global_step": 9350, "epoch": 55} {"train_loss": -5.818851470947266, "global_step": 9351, "epoch": 55} {"train_loss": -5.612392425537109, "global_step": 9352, "epoch": 55} {"train_loss": -5.731343746185303, "global_step": 9353, "epoch": 55} {"train_loss": -5.8257975578308105, "global_step": 9354, "epoch": 55} {"train_loss": -5.781634330749512, "global_step": 9355, "epoch": 55} {"train_loss": -5.467441558837891, "global_step": 9356, "epoch": 55} {"train_loss": -5.881236553192139, "global_step": 9357, "epoch": 55} {"train_loss": -5.539566993713379, "global_step": 9358, "epoch": 55} {"train_loss": -5.952945709228516, "global_step": 9359, "epoch": 55} {"train_loss": -5.981096267700195, "global_step": 9360, "epoch": 55} {"train_loss": -5.747870445251465, "global_step": 9361, "epoch": 55} {"train_loss": -5.784778594970703, "global_step": 9362, "epoch": 55} {"train_loss": -5.849099636077881, "global_step": 9363, "epoch": 55} {"train_loss": -5.721408367156982, "global_step": 9364, "epoch": 55} {"train_loss": -5.666474342346191, "global_step": 9365, "epoch": 55} {"train_loss": -5.706674098968506, "global_step": 9366, "epoch": 55} {"train_loss": -5.586348533630371, "global_step": 9367, "epoch": 55} {"train_loss": -5.1739888191223145, "global_step": 9368, "epoch": 55} {"train_loss": -5.7014360427856445, "global_step": 9369, "epoch": 55} {"train_loss": -5.818451404571533, "global_step": 9370, "epoch": 55} {"train_loss": -5.694208145141602, "global_step": 9371, "epoch": 55} {"train_loss": -5.721541881561279, "global_step": 9372, "epoch": 55} {"train_loss": -5.5130767822265625, "global_step": 9373, "epoch": 55} {"train_loss": -5.964306831359863, "global_step": 9374, "epoch": 55} {"train_loss": -5.85399055480957, "global_step": 9375, "epoch": 55} {"train_loss": -5.7542524337768555, "global_step": 9376, "epoch": 55} {"train_loss": -5.616865634918213, "global_step": 9377, "epoch": 55} {"train_loss": -5.759018421173096, "global_step": 9378, "epoch": 55} {"train_loss": -5.702630043029785, "global_step": 9379, "epoch": 55} {"train_loss": -5.762266635894775, "global_step": 9380, "epoch": 55} {"train_loss": -5.669010162353516, "global_step": 9381, "epoch": 55} {"train_loss": -5.62979793548584, "global_step": 9382, "epoch": 55} {"train_loss": -5.578884124755859, "global_step": 9383, "epoch": 55} {"train_loss": -5.402149200439453, "global_step": 9384, "epoch": 55} {"train_loss": -5.7889404296875, "global_step": 9385, "epoch": 55} {"train_loss": -5.715756893157959, "global_step": 9386, "epoch": 55} {"train_loss": -5.549044132232666, "global_step": 9387, "epoch": 55} {"train_loss": -5.784046173095703, "global_step": 9388, "epoch": 55} {"train_loss": -5.523348331451416, "global_step": 9389, "epoch": 55} {"train_loss": -5.470700263977051, "global_step": 9390, "epoch": 55} {"train_loss": -5.738046646118164, "global_step": 9391, "epoch": 55} {"train_loss": -5.750437259674072, "global_step": 9392, "epoch": 55} {"train_loss": -5.812597751617432, "global_step": 9393, "epoch": 55} {"train_loss": -5.8534016609191895, "global_step": 9394, "epoch": 55} {"train_loss": -5.607665061950684, "global_step": 9395, "epoch": 55} {"train_loss": -6.008077621459961, "global_step": 9396, "epoch": 55} {"train_loss": -5.807241439819336, "global_step": 9397, "epoch": 55} {"train_loss": -5.693835258483887, "global_step": 9398, "epoch": 55} {"train_loss": -5.820567607879639, "global_step": 9399, "epoch": 55} {"train_loss": -5.696693420410156, "global_step": 9400, "epoch": 55} {"train_loss": -5.77748966217041, "global_step": 9401, "epoch": 55} {"train_loss": -5.605534553527832, "global_step": 9402, "epoch": 55} {"train_loss": -5.772297382354736, "global_step": 9403, "epoch": 55} {"train_loss": -5.676145076751709, "global_step": 9404, "epoch": 55} {"train_loss": -5.802403450012207, "global_step": 9405, "epoch": 55} {"train_loss": -5.7934489250183105, "global_step": 9406, "epoch": 55} {"train_loss": -5.671695922102247, "global_step": 9407, "epoch": 55, "val_loss": 260895.5, "train_action_mse_error": 42.88861846923828} {"train_loss": -5.9993743896484375, "global_step": 9408, "epoch": 56} {"train_loss": -5.793648719787598, "global_step": 9409, "epoch": 56} {"train_loss": -5.884222507476807, "global_step": 9410, "epoch": 56} {"train_loss": -5.543020248413086, "global_step": 9411, "epoch": 56} {"train_loss": -5.747038841247559, "global_step": 9412, "epoch": 56} {"train_loss": -5.813650131225586, "global_step": 9413, "epoch": 56} {"train_loss": -5.781656265258789, "global_step": 9414, "epoch": 56} {"train_loss": -5.689477443695068, "global_step": 9415, "epoch": 56} {"train_loss": -5.641840934753418, "global_step": 9416, "epoch": 56} {"train_loss": -5.597228050231934, "global_step": 9417, "epoch": 56} {"train_loss": -5.913642406463623, "global_step": 9418, "epoch": 56} {"train_loss": -5.416548252105713, "global_step": 9419, "epoch": 56} {"train_loss": -5.758816719055176, "global_step": 9420, "epoch": 56} {"train_loss": -5.555112838745117, "global_step": 9421, "epoch": 56} {"train_loss": -5.67676305770874, "global_step": 9422, "epoch": 56} {"train_loss": -5.405543327331543, "global_step": 9423, "epoch": 56} {"train_loss": -5.614257335662842, "global_step": 9424, "epoch": 56} {"train_loss": -5.3707661628723145, "global_step": 9425, "epoch": 56} {"train_loss": -5.697092056274414, "global_step": 9426, "epoch": 56} {"train_loss": -5.594239711761475, "global_step": 9427, "epoch": 56} {"train_loss": -5.744072437286377, "global_step": 9428, "epoch": 56} {"train_loss": -5.590255260467529, "global_step": 9429, "epoch": 56} {"train_loss": -5.392098426818848, "global_step": 9430, "epoch": 56} {"train_loss": -5.634559154510498, "global_step": 9431, "epoch": 56} {"train_loss": -5.716931343078613, "global_step": 9432, "epoch": 56} {"train_loss": -5.6355743408203125, "global_step": 9433, "epoch": 56} {"train_loss": -5.741567611694336, "global_step": 9434, "epoch": 56} {"train_loss": -5.357354164123535, "global_step": 9435, "epoch": 56} {"train_loss": -5.7413129806518555, "global_step": 9436, "epoch": 56} {"train_loss": -5.3913187980651855, "global_step": 9437, "epoch": 56} {"train_loss": -5.441701889038086, "global_step": 9438, "epoch": 56} {"train_loss": -5.6843719482421875, "global_step": 9439, "epoch": 56} {"train_loss": -5.4842963218688965, "global_step": 9440, "epoch": 56} {"train_loss": -5.699916839599609, "global_step": 9441, "epoch": 56} {"train_loss": -5.454863548278809, "global_step": 9442, "epoch": 56} {"train_loss": -5.798662185668945, "global_step": 9443, "epoch": 56} {"train_loss": -5.588901519775391, "global_step": 9444, "epoch": 56} {"train_loss": -5.519008636474609, "global_step": 9445, "epoch": 56} {"train_loss": -5.524377822875977, "global_step": 9446, "epoch": 56} {"train_loss": -5.633207321166992, "global_step": 9447, "epoch": 56} {"train_loss": -5.525300979614258, "global_step": 9448, "epoch": 56} {"train_loss": -5.614925861358643, "global_step": 9449, "epoch": 56} {"train_loss": -5.528354644775391, "global_step": 9450, "epoch": 56} {"train_loss": -5.668971538543701, "global_step": 9451, "epoch": 56} {"train_loss": -5.578851699829102, "global_step": 9452, "epoch": 56} {"train_loss": -5.687642574310303, "global_step": 9453, "epoch": 56} {"train_loss": -5.787930488586426, "global_step": 9454, "epoch": 56} {"train_loss": -6.017657279968262, "global_step": 9455, "epoch": 56} {"train_loss": -5.79966926574707, "global_step": 9456, "epoch": 56} {"train_loss": -5.687954425811768, "global_step": 9457, "epoch": 56} {"train_loss": -5.786056041717529, "global_step": 9458, "epoch": 56} {"train_loss": -5.522231578826904, "global_step": 9459, "epoch": 56} {"train_loss": -5.6858930587768555, "global_step": 9460, "epoch": 56} {"train_loss": -5.771276473999023, "global_step": 9461, "epoch": 56} {"train_loss": -5.916513442993164, "global_step": 9462, "epoch": 56} {"train_loss": -5.577090263366699, "global_step": 9463, "epoch": 56} {"train_loss": -5.534454822540283, "global_step": 9464, "epoch": 56} {"train_loss": -5.767721652984619, "global_step": 9465, "epoch": 56} {"train_loss": -5.682120323181152, "global_step": 9466, "epoch": 56} {"train_loss": -5.590814590454102, "global_step": 9467, "epoch": 56} {"train_loss": -5.6737871170043945, "global_step": 9468, "epoch": 56} {"train_loss": -5.363608360290527, "global_step": 9469, "epoch": 56} {"train_loss": -5.771695137023926, "global_step": 9470, "epoch": 56} {"train_loss": -5.386946201324463, "global_step": 9471, "epoch": 56} {"train_loss": -5.644412040710449, "global_step": 9472, "epoch": 56} {"train_loss": -5.663972854614258, "global_step": 9473, "epoch": 56} {"train_loss": -5.443284034729004, "global_step": 9474, "epoch": 56} {"train_loss": -5.7788543701171875, "global_step": 9475, "epoch": 56} {"train_loss": -5.74582576751709, "global_step": 9476, "epoch": 56} {"train_loss": -5.758349418640137, "global_step": 9477, "epoch": 56} {"train_loss": -5.538936614990234, "global_step": 9478, "epoch": 56} {"train_loss": -5.872707366943359, "global_step": 9479, "epoch": 56} {"train_loss": -5.831143379211426, "global_step": 9480, "epoch": 56} {"train_loss": -5.527253150939941, "global_step": 9481, "epoch": 56} {"train_loss": -5.900815963745117, "global_step": 9482, "epoch": 56} {"train_loss": -6.0376877784729, "global_step": 9483, "epoch": 56} {"train_loss": -5.796037197113037, "global_step": 9484, "epoch": 56} {"train_loss": -5.885232925415039, "global_step": 9485, "epoch": 56} {"train_loss": -5.951117992401123, "global_step": 9486, "epoch": 56} {"train_loss": -6.105037689208984, "global_step": 9487, "epoch": 56} {"train_loss": -5.7918596267700195, "global_step": 9488, "epoch": 56} {"train_loss": -5.643258094787598, "global_step": 9489, "epoch": 56} {"train_loss": -5.8420562744140625, "global_step": 9490, "epoch": 56} {"train_loss": -5.6140289306640625, "global_step": 9491, "epoch": 56} {"train_loss": -5.804198265075684, "global_step": 9492, "epoch": 56} {"train_loss": -5.641502380371094, "global_step": 9493, "epoch": 56} {"train_loss": -5.871297836303711, "global_step": 9494, "epoch": 56} {"train_loss": -5.378664016723633, "global_step": 9495, "epoch": 56} {"train_loss": -5.762211322784424, "global_step": 9496, "epoch": 56} {"train_loss": -5.5282487869262695, "global_step": 9497, "epoch": 56} {"train_loss": -5.519420623779297, "global_step": 9498, "epoch": 56} {"train_loss": -5.568666458129883, "global_step": 9499, "epoch": 56} {"train_loss": -5.296087741851807, "global_step": 9500, "epoch": 56} {"train_loss": -5.661658763885498, "global_step": 9501, "epoch": 56} {"train_loss": -5.478721618652344, "global_step": 9502, "epoch": 56} {"train_loss": -5.620314598083496, "global_step": 9503, "epoch": 56} {"train_loss": -5.66279935836792, "global_step": 9504, "epoch": 56} {"train_loss": -5.550248146057129, "global_step": 9505, "epoch": 56} {"train_loss": -5.810129165649414, "global_step": 9506, "epoch": 56} {"train_loss": -5.385830879211426, "global_step": 9507, "epoch": 56} {"train_loss": -5.675212860107422, "global_step": 9508, "epoch": 56} {"train_loss": -5.6235551834106445, "global_step": 9509, "epoch": 56} {"train_loss": -5.587151527404785, "global_step": 9510, "epoch": 56} {"train_loss": -5.773871421813965, "global_step": 9511, "epoch": 56} {"train_loss": -5.915701866149902, "global_step": 9512, "epoch": 56} {"train_loss": -5.575741767883301, "global_step": 9513, "epoch": 56} {"train_loss": -5.609373092651367, "global_step": 9514, "epoch": 56} {"train_loss": -5.605826377868652, "global_step": 9515, "epoch": 56} {"train_loss": -5.523550987243652, "global_step": 9516, "epoch": 56} {"train_loss": -5.633274078369141, "global_step": 9517, "epoch": 56} {"train_loss": -5.449570655822754, "global_step": 9518, "epoch": 56} {"train_loss": -5.572935104370117, "global_step": 9519, "epoch": 56} {"train_loss": -5.714758396148682, "global_step": 9520, "epoch": 56} {"train_loss": -5.826571464538574, "global_step": 9521, "epoch": 56} {"train_loss": -5.724695205688477, "global_step": 9522, "epoch": 56} {"train_loss": -5.636606216430664, "global_step": 9523, "epoch": 56} {"train_loss": -5.263500213623047, "global_step": 9524, "epoch": 56} {"train_loss": -5.559869289398193, "global_step": 9525, "epoch": 56} {"train_loss": -5.769341468811035, "global_step": 9526, "epoch": 56} {"train_loss": -5.6917877197265625, "global_step": 9527, "epoch": 56} {"train_loss": -5.8864593505859375, "global_step": 9528, "epoch": 56} {"train_loss": -5.506608009338379, "global_step": 9529, "epoch": 56} {"train_loss": -5.628573417663574, "global_step": 9530, "epoch": 56} {"train_loss": -5.479944229125977, "global_step": 9531, "epoch": 56} {"train_loss": -5.543402194976807, "global_step": 9532, "epoch": 56} {"train_loss": -5.544057846069336, "global_step": 9533, "epoch": 56} {"train_loss": -5.89955997467041, "global_step": 9534, "epoch": 56} {"train_loss": -5.421382427215576, "global_step": 9535, "epoch": 56} {"train_loss": -5.62247371673584, "global_step": 9536, "epoch": 56} {"train_loss": -5.693154335021973, "global_step": 9537, "epoch": 56} {"train_loss": -5.32125186920166, "global_step": 9538, "epoch": 56} {"train_loss": -5.8123602867126465, "global_step": 9539, "epoch": 56} {"train_loss": -5.547384262084961, "global_step": 9540, "epoch": 56} {"train_loss": -5.500349044799805, "global_step": 9541, "epoch": 56} {"train_loss": -5.505814552307129, "global_step": 9542, "epoch": 56} {"train_loss": -5.78486442565918, "global_step": 9543, "epoch": 56} {"train_loss": -5.729290962219238, "global_step": 9544, "epoch": 56} {"train_loss": -5.837420463562012, "global_step": 9545, "epoch": 56} {"train_loss": -5.76965856552124, "global_step": 9546, "epoch": 56} {"train_loss": -5.874220848083496, "global_step": 9547, "epoch": 56} {"train_loss": -5.775411605834961, "global_step": 9548, "epoch": 56} {"train_loss": -6.020412921905518, "global_step": 9549, "epoch": 56} {"train_loss": -5.705101013183594, "global_step": 9550, "epoch": 56} {"train_loss": -5.722348690032959, "global_step": 9551, "epoch": 56} {"train_loss": -5.900616645812988, "global_step": 9552, "epoch": 56} {"train_loss": -5.6447954177856445, "global_step": 9553, "epoch": 56} {"train_loss": -6.0225043296813965, "global_step": 9554, "epoch": 56} {"train_loss": -5.692561626434326, "global_step": 9555, "epoch": 56} {"train_loss": -5.720047950744629, "global_step": 9556, "epoch": 56} {"train_loss": -5.530975341796875, "global_step": 9557, "epoch": 56} {"train_loss": -5.546901702880859, "global_step": 9558, "epoch": 56} {"train_loss": -5.377544403076172, "global_step": 9559, "epoch": 56} {"train_loss": -5.512770652770996, "global_step": 9560, "epoch": 56} {"train_loss": -5.658967971801758, "global_step": 9561, "epoch": 56} {"train_loss": -5.825187683105469, "global_step": 9562, "epoch": 56} {"train_loss": -5.623802185058594, "global_step": 9563, "epoch": 56} {"train_loss": -5.553809642791748, "global_step": 9564, "epoch": 56} {"train_loss": -5.269801616668701, "global_step": 9565, "epoch": 56} {"train_loss": -5.514179706573486, "global_step": 9566, "epoch": 56} {"train_loss": -5.7542619705200195, "global_step": 9567, "epoch": 56} {"train_loss": -5.67323637008667, "global_step": 9568, "epoch": 56} {"train_loss": -5.8008713722229, "global_step": 9569, "epoch": 56} {"train_loss": -5.420441150665283, "global_step": 9570, "epoch": 56} {"train_loss": -5.208878517150879, "global_step": 9571, "epoch": 56} {"train_loss": -5.609165191650391, "global_step": 9572, "epoch": 56} {"train_loss": -5.865918159484863, "global_step": 9573, "epoch": 56} {"train_loss": -5.716756820678711, "global_step": 9574, "epoch": 56} {"train_loss": -5.655112774599166, "global_step": 9575, "epoch": 56, "val_loss": 261055.65625} {"train_loss": -5.6813225746154785, "global_step": 9576, "epoch": 57} {"train_loss": -5.917044639587402, "global_step": 9577, "epoch": 57} {"train_loss": -5.890315055847168, "global_step": 9578, "epoch": 57} {"train_loss": -6.010332107543945, "global_step": 9579, "epoch": 57} {"train_loss": -5.805233955383301, "global_step": 9580, "epoch": 57} {"train_loss": -5.498126983642578, "global_step": 9581, "epoch": 57} {"train_loss": -5.772157192230225, "global_step": 9582, "epoch": 57} {"train_loss": -5.750908374786377, "global_step": 9583, "epoch": 57} {"train_loss": -5.7841386795043945, "global_step": 9584, "epoch": 57} {"train_loss": -5.834173202514648, "global_step": 9585, "epoch": 57} {"train_loss": -5.960807800292969, "global_step": 9586, "epoch": 57} {"train_loss": -5.544251918792725, "global_step": 9587, "epoch": 57} {"train_loss": -5.766278266906738, "global_step": 9588, "epoch": 57} {"train_loss": -5.661574840545654, "global_step": 9589, "epoch": 57} {"train_loss": -5.929470539093018, "global_step": 9590, "epoch": 57} {"train_loss": -5.805377960205078, "global_step": 9591, "epoch": 57} {"train_loss": -5.599749565124512, "global_step": 9592, "epoch": 57} {"train_loss": -5.644160747528076, "global_step": 9593, "epoch": 57} {"train_loss": -5.729123115539551, "global_step": 9594, "epoch": 57} {"train_loss": -5.838192939758301, "global_step": 9595, "epoch": 57} {"train_loss": -5.714248180389404, "global_step": 9596, "epoch": 57} {"train_loss": -5.935779571533203, "global_step": 9597, "epoch": 57} {"train_loss": -5.708905220031738, "global_step": 9598, "epoch": 57} {"train_loss": -5.949088096618652, "global_step": 9599, "epoch": 57} {"train_loss": -5.844949245452881, "global_step": 9600, "epoch": 57} {"train_loss": -5.494697570800781, "global_step": 9601, "epoch": 57} {"train_loss": -5.783653736114502, "global_step": 9602, "epoch": 57} {"train_loss": -5.954375267028809, "global_step": 9603, "epoch": 57} {"train_loss": -5.798215866088867, "global_step": 9604, "epoch": 57} {"train_loss": -5.84231424331665, "global_step": 9605, "epoch": 57} {"train_loss": -5.662538051605225, "global_step": 9606, "epoch": 57} {"train_loss": -6.0154008865356445, "global_step": 9607, "epoch": 57} {"train_loss": -5.744053840637207, "global_step": 9608, "epoch": 57} {"train_loss": -5.90408992767334, "global_step": 9609, "epoch": 57} {"train_loss": -5.733348846435547, "global_step": 9610, "epoch": 57} {"train_loss": -5.670655727386475, "global_step": 9611, "epoch": 57} {"train_loss": -6.0908098220825195, "global_step": 9612, "epoch": 57} {"train_loss": -5.7488627433776855, "global_step": 9613, "epoch": 57} {"train_loss": -5.684154510498047, "global_step": 9614, "epoch": 57} {"train_loss": -5.793341636657715, "global_step": 9615, "epoch": 57} {"train_loss": -5.708743572235107, "global_step": 9616, "epoch": 57} {"train_loss": -5.619871616363525, "global_step": 9617, "epoch": 57} {"train_loss": -5.459074974060059, "global_step": 9618, "epoch": 57} {"train_loss": -5.948019504547119, "global_step": 9619, "epoch": 57} {"train_loss": -5.81082820892334, "global_step": 9620, "epoch": 57} {"train_loss": -5.852458953857422, "global_step": 9621, "epoch": 57} {"train_loss": -5.844740390777588, "global_step": 9622, "epoch": 57} {"train_loss": -5.775066375732422, "global_step": 9623, "epoch": 57} {"train_loss": -5.889338970184326, "global_step": 9624, "epoch": 57} {"train_loss": -5.646021842956543, "global_step": 9625, "epoch": 57} {"train_loss": -5.834084510803223, "global_step": 9626, "epoch": 57} {"train_loss": -5.771790504455566, "global_step": 9627, "epoch": 57} {"train_loss": -5.830665588378906, "global_step": 9628, "epoch": 57} {"train_loss": -5.7601094245910645, "global_step": 9629, "epoch": 57} {"train_loss": -5.527587890625, "global_step": 9630, "epoch": 57} {"train_loss": -5.761560440063477, "global_step": 9631, "epoch": 57} {"train_loss": -5.719235420227051, "global_step": 9632, "epoch": 57} {"train_loss": -5.658824920654297, "global_step": 9633, "epoch": 57} {"train_loss": -5.648096084594727, "global_step": 9634, "epoch": 57} {"train_loss": -5.692106246948242, "global_step": 9635, "epoch": 57} {"train_loss": -5.653639316558838, "global_step": 9636, "epoch": 57} {"train_loss": -5.630738258361816, "global_step": 9637, "epoch": 57} {"train_loss": -5.474837779998779, "global_step": 9638, "epoch": 57} {"train_loss": -5.3947577476501465, "global_step": 9639, "epoch": 57} {"train_loss": -5.834249496459961, "global_step": 9640, "epoch": 57} {"train_loss": -5.533507823944092, "global_step": 9641, "epoch": 57} {"train_loss": -5.733105659484863, "global_step": 9642, "epoch": 57} {"train_loss": -5.672035217285156, "global_step": 9643, "epoch": 57} {"train_loss": -5.70458984375, "global_step": 9644, "epoch": 57} {"train_loss": -5.694597244262695, "global_step": 9645, "epoch": 57} {"train_loss": -5.708778381347656, "global_step": 9646, "epoch": 57} {"train_loss": -5.527196884155273, "global_step": 9647, "epoch": 57} {"train_loss": -5.629133224487305, "global_step": 9648, "epoch": 57} {"train_loss": -5.5081400871276855, "global_step": 9649, "epoch": 57} {"train_loss": -5.649991989135742, "global_step": 9650, "epoch": 57} {"train_loss": -5.6515703201293945, "global_step": 9651, "epoch": 57} {"train_loss": -5.901504039764404, "global_step": 9652, "epoch": 57} {"train_loss": -5.653989791870117, "global_step": 9653, "epoch": 57} {"train_loss": -5.793329238891602, "global_step": 9654, "epoch": 57} {"train_loss": -5.55982780456543, "global_step": 9655, "epoch": 57} {"train_loss": -5.951816558837891, "global_step": 9656, "epoch": 57} {"train_loss": -5.5345330238342285, "global_step": 9657, "epoch": 57} {"train_loss": -5.540637016296387, "global_step": 9658, "epoch": 57} {"train_loss": -5.484722137451172, "global_step": 9659, "epoch": 57} {"train_loss": -5.5831298828125, "global_step": 9660, "epoch": 57} {"train_loss": -5.711665630340576, "global_step": 9661, "epoch": 57} {"train_loss": -5.517822742462158, "global_step": 9662, "epoch": 57} {"train_loss": -5.495752334594727, "global_step": 9663, "epoch": 57} {"train_loss": -5.510491371154785, "global_step": 9664, "epoch": 57} {"train_loss": -5.441084384918213, "global_step": 9665, "epoch": 57} {"train_loss": -5.5704345703125, "global_step": 9666, "epoch": 57} {"train_loss": -5.524506568908691, "global_step": 9667, "epoch": 57} {"train_loss": -5.711675643920898, "global_step": 9668, "epoch": 57} {"train_loss": -5.417425155639648, "global_step": 9669, "epoch": 57} {"train_loss": -5.8570098876953125, "global_step": 9670, "epoch": 57} {"train_loss": -5.639346122741699, "global_step": 9671, "epoch": 57} {"train_loss": -5.363908767700195, "global_step": 9672, "epoch": 57} {"train_loss": -5.531960487365723, "global_step": 9673, "epoch": 57} {"train_loss": -5.516053199768066, "global_step": 9674, "epoch": 57} {"train_loss": -5.5604777336120605, "global_step": 9675, "epoch": 57} {"train_loss": -5.512361526489258, "global_step": 9676, "epoch": 57} {"train_loss": -5.804721832275391, "global_step": 9677, "epoch": 57} {"train_loss": -5.684642791748047, "global_step": 9678, "epoch": 57} {"train_loss": -5.505194664001465, "global_step": 9679, "epoch": 57} {"train_loss": -5.569273471832275, "global_step": 9680, "epoch": 57} {"train_loss": -5.686495780944824, "global_step": 9681, "epoch": 57} {"train_loss": -5.6311235427856445, "global_step": 9682, "epoch": 57} {"train_loss": -5.716194152832031, "global_step": 9683, "epoch": 57} {"train_loss": -5.99520206451416, "global_step": 9684, "epoch": 57} {"train_loss": -5.842175483703613, "global_step": 9685, "epoch": 57} {"train_loss": -5.900765419006348, "global_step": 9686, "epoch": 57} {"train_loss": -5.788543224334717, "global_step": 9687, "epoch": 57} {"train_loss": -5.6880388259887695, "global_step": 9688, "epoch": 57} {"train_loss": -5.678638458251953, "global_step": 9689, "epoch": 57} {"train_loss": -5.651881694793701, "global_step": 9690, "epoch": 57} {"train_loss": -5.719593048095703, "global_step": 9691, "epoch": 57} {"train_loss": -5.559704780578613, "global_step": 9692, "epoch": 57} {"train_loss": -5.72274112701416, "global_step": 9693, "epoch": 57} {"train_loss": -5.400221824645996, "global_step": 9694, "epoch": 57} {"train_loss": -5.974975109100342, "global_step": 9695, "epoch": 57} {"train_loss": -5.731230735778809, "global_step": 9696, "epoch": 57} {"train_loss": -5.897808074951172, "global_step": 9697, "epoch": 57} {"train_loss": -5.661963939666748, "global_step": 9698, "epoch": 57} {"train_loss": -5.681569576263428, "global_step": 9699, "epoch": 57} {"train_loss": -5.865297317504883, "global_step": 9700, "epoch": 57} {"train_loss": -5.561936855316162, "global_step": 9701, "epoch": 57} {"train_loss": -5.754018783569336, "global_step": 9702, "epoch": 57} {"train_loss": -5.567656517028809, "global_step": 9703, "epoch": 57} {"train_loss": -5.372691631317139, "global_step": 9704, "epoch": 57} {"train_loss": -5.555388927459717, "global_step": 9705, "epoch": 57} {"train_loss": -5.522314071655273, "global_step": 9706, "epoch": 57} {"train_loss": -5.717431545257568, "global_step": 9707, "epoch": 57} {"train_loss": -5.7975263595581055, "global_step": 9708, "epoch": 57} {"train_loss": -5.827371597290039, "global_step": 9709, "epoch": 57} {"train_loss": -5.708359718322754, "global_step": 9710, "epoch": 57} {"train_loss": -5.7190961837768555, "global_step": 9711, "epoch": 57} {"train_loss": -5.797204971313477, "global_step": 9712, "epoch": 57} {"train_loss": -5.803834915161133, "global_step": 9713, "epoch": 57} {"train_loss": -6.024428367614746, "global_step": 9714, "epoch": 57} {"train_loss": -5.714249610900879, "global_step": 9715, "epoch": 57} {"train_loss": -5.631025314331055, "global_step": 9716, "epoch": 57} {"train_loss": -5.56755256652832, "global_step": 9717, "epoch": 57} {"train_loss": -5.386026382446289, "global_step": 9718, "epoch": 57} {"train_loss": -5.851434707641602, "global_step": 9719, "epoch": 57} {"train_loss": -5.579409599304199, "global_step": 9720, "epoch": 57} {"train_loss": -5.533509254455566, "global_step": 9721, "epoch": 57} {"train_loss": -5.683393955230713, "global_step": 9722, "epoch": 57} {"train_loss": -5.743105411529541, "global_step": 9723, "epoch": 57} {"train_loss": -5.594292163848877, "global_step": 9724, "epoch": 57} {"train_loss": -5.672643661499023, "global_step": 9725, "epoch": 57} {"train_loss": -5.549094200134277, "global_step": 9726, "epoch": 57} {"train_loss": -5.59484338760376, "global_step": 9727, "epoch": 57} {"train_loss": -5.927578449249268, "global_step": 9728, "epoch": 57} {"train_loss": -5.542365074157715, "global_step": 9729, "epoch": 57} {"train_loss": -5.582305908203125, "global_step": 9730, "epoch": 57} {"train_loss": -5.451533317565918, "global_step": 9731, "epoch": 57} {"train_loss": -5.607509613037109, "global_step": 9732, "epoch": 57} {"train_loss": -5.689630508422852, "global_step": 9733, "epoch": 57} {"train_loss": -5.851734161376953, "global_step": 9734, "epoch": 57} {"train_loss": -5.3967437744140625, "global_step": 9735, "epoch": 57} {"train_loss": -5.814216613769531, "global_step": 9736, "epoch": 57} {"train_loss": -5.653741836547852, "global_step": 9737, "epoch": 57} {"train_loss": -5.7520904541015625, "global_step": 9738, "epoch": 57} {"train_loss": -5.575468063354492, "global_step": 9739, "epoch": 57} {"train_loss": -5.579917907714844, "global_step": 9740, "epoch": 57} {"train_loss": -5.640431880950928, "global_step": 9741, "epoch": 57} {"train_loss": -5.815849304199219, "global_step": 9742, "epoch": 57} {"train_loss": -5.695456115972428, "global_step": 9743, "epoch": 57, "val_loss": 271878.53125} {"train_loss": -5.727410316467285, "global_step": 9744, "epoch": 58} {"train_loss": -5.764270305633545, "global_step": 9745, "epoch": 58} {"train_loss": -5.89943790435791, "global_step": 9746, "epoch": 58} {"train_loss": -5.910161972045898, "global_step": 9747, "epoch": 58} {"train_loss": -5.92117977142334, "global_step": 9748, "epoch": 58} {"train_loss": -5.514467239379883, "global_step": 9749, "epoch": 58} {"train_loss": -5.597364902496338, "global_step": 9750, "epoch": 58} {"train_loss": -5.8660736083984375, "global_step": 9751, "epoch": 58} {"train_loss": -6.037740707397461, "global_step": 9752, "epoch": 58} {"train_loss": -5.885165214538574, "global_step": 9753, "epoch": 58} {"train_loss": -5.984645366668701, "global_step": 9754, "epoch": 58} {"train_loss": -5.450547218322754, "global_step": 9755, "epoch": 58} {"train_loss": -5.805474281311035, "global_step": 9756, "epoch": 58} {"train_loss": -5.707452774047852, "global_step": 9757, "epoch": 58} {"train_loss": -5.795046806335449, "global_step": 9758, "epoch": 58} {"train_loss": -5.727178573608398, "global_step": 9759, "epoch": 58} {"train_loss": -5.937505722045898, "global_step": 9760, "epoch": 58} {"train_loss": -5.581451416015625, "global_step": 9761, "epoch": 58} {"train_loss": -5.44237756729126, "global_step": 9762, "epoch": 58} {"train_loss": -5.684985160827637, "global_step": 9763, "epoch": 58} {"train_loss": -5.868020534515381, "global_step": 9764, "epoch": 58} {"train_loss": -5.658736228942871, "global_step": 9765, "epoch": 58} {"train_loss": -5.611973762512207, "global_step": 9766, "epoch": 58} {"train_loss": -5.85122013092041, "global_step": 9767, "epoch": 58} {"train_loss": -5.632052421569824, "global_step": 9768, "epoch": 58} {"train_loss": -5.61556339263916, "global_step": 9769, "epoch": 58} {"train_loss": -5.627773761749268, "global_step": 9770, "epoch": 58} {"train_loss": -5.621262073516846, "global_step": 9771, "epoch": 58} {"train_loss": -5.7897257804870605, "global_step": 9772, "epoch": 58} {"train_loss": -5.906350135803223, "global_step": 9773, "epoch": 58} {"train_loss": -5.767212867736816, "global_step": 9774, "epoch": 58} {"train_loss": -5.551676273345947, "global_step": 9775, "epoch": 58} {"train_loss": -5.809167861938477, "global_step": 9776, "epoch": 58} {"train_loss": -5.447979927062988, "global_step": 9777, "epoch": 58} {"train_loss": -5.860080718994141, "global_step": 9778, "epoch": 58} {"train_loss": -5.629266738891602, "global_step": 9779, "epoch": 58} {"train_loss": -5.6561102867126465, "global_step": 9780, "epoch": 58} {"train_loss": -5.630893707275391, "global_step": 9781, "epoch": 58} {"train_loss": -5.4038987159729, "global_step": 9782, "epoch": 58} {"train_loss": -5.801263809204102, "global_step": 9783, "epoch": 58} {"train_loss": -5.367237567901611, "global_step": 9784, "epoch": 58} {"train_loss": -5.439314842224121, "global_step": 9785, "epoch": 58} {"train_loss": -5.562478065490723, "global_step": 9786, "epoch": 58} {"train_loss": -5.616642475128174, "global_step": 9787, "epoch": 58} {"train_loss": -5.508144378662109, "global_step": 9788, "epoch": 58} {"train_loss": -5.637709617614746, "global_step": 9789, "epoch": 58} {"train_loss": -5.601007461547852, "global_step": 9790, "epoch": 58} {"train_loss": -5.3993377685546875, "global_step": 9791, "epoch": 58} {"train_loss": -5.640727519989014, "global_step": 9792, "epoch": 58} {"train_loss": -5.487664699554443, "global_step": 9793, "epoch": 58} {"train_loss": -5.62462043762207, "global_step": 9794, "epoch": 58} {"train_loss": -5.693450927734375, "global_step": 9795, "epoch": 58} {"train_loss": -5.687938213348389, "global_step": 9796, "epoch": 58} {"train_loss": -5.566796779632568, "global_step": 9797, "epoch": 58} {"train_loss": -5.506008625030518, "global_step": 9798, "epoch": 58} {"train_loss": -5.588947296142578, "global_step": 9799, "epoch": 58} {"train_loss": -5.801392078399658, "global_step": 9800, "epoch": 58} {"train_loss": -5.800278663635254, "global_step": 9801, "epoch": 58} {"train_loss": -5.679537773132324, "global_step": 9802, "epoch": 58} {"train_loss": -5.631826400756836, "global_step": 9803, "epoch": 58} {"train_loss": -5.843991279602051, "global_step": 9804, "epoch": 58} {"train_loss": -5.901932716369629, "global_step": 9805, "epoch": 58} {"train_loss": -5.780097484588623, "global_step": 9806, "epoch": 58} {"train_loss": -5.902237892150879, "global_step": 9807, "epoch": 58} {"train_loss": -5.710087776184082, "global_step": 9808, "epoch": 58} {"train_loss": -5.8307204246521, "global_step": 9809, "epoch": 58} {"train_loss": -5.834088325500488, "global_step": 9810, "epoch": 58} {"train_loss": -5.578612804412842, "global_step": 9811, "epoch": 58} {"train_loss": -5.833156585693359, "global_step": 9812, "epoch": 58} {"train_loss": -6.078813552856445, "global_step": 9813, "epoch": 58} {"train_loss": -5.495356559753418, "global_step": 9814, "epoch": 58} {"train_loss": -5.825490951538086, "global_step": 9815, "epoch": 58} {"train_loss": -5.592889785766602, "global_step": 9816, "epoch": 58} {"train_loss": -5.677243709564209, "global_step": 9817, "epoch": 58} {"train_loss": -5.711939811706543, "global_step": 9818, "epoch": 58} {"train_loss": -5.684691905975342, "global_step": 9819, "epoch": 58} {"train_loss": -5.646134376525879, "global_step": 9820, "epoch": 58} {"train_loss": -5.428325653076172, "global_step": 9821, "epoch": 58} {"train_loss": -5.707248687744141, "global_step": 9822, "epoch": 58} {"train_loss": -5.747676372528076, "global_step": 9823, "epoch": 58} {"train_loss": -5.702814102172852, "global_step": 9824, "epoch": 58} {"train_loss": -5.759050369262695, "global_step": 9825, "epoch": 58} {"train_loss": -5.632585525512695, "global_step": 9826, "epoch": 58} {"train_loss": -5.8278584480285645, "global_step": 9827, "epoch": 58} {"train_loss": -5.8668060302734375, "global_step": 9828, "epoch": 58} {"train_loss": -5.569955825805664, "global_step": 9829, "epoch": 58} {"train_loss": -5.688742160797119, "global_step": 9830, "epoch": 58} {"train_loss": -5.7952117919921875, "global_step": 9831, "epoch": 58} {"train_loss": -5.845478057861328, "global_step": 9832, "epoch": 58} {"train_loss": -5.749887466430664, "global_step": 9833, "epoch": 58} {"train_loss": -5.490843296051025, "global_step": 9834, "epoch": 58} {"train_loss": -5.809858798980713, "global_step": 9835, "epoch": 58} {"train_loss": -5.770214080810547, "global_step": 9836, "epoch": 58} {"train_loss": -5.787106513977051, "global_step": 9837, "epoch": 58} {"train_loss": -5.761460304260254, "global_step": 9838, "epoch": 58} {"train_loss": -5.952582359313965, "global_step": 9839, "epoch": 58} {"train_loss": -6.025726318359375, "global_step": 9840, "epoch": 58} {"train_loss": -5.930184364318848, "global_step": 9841, "epoch": 58} {"train_loss": -6.020115852355957, "global_step": 9842, "epoch": 58} {"train_loss": -5.689665794372559, "global_step": 9843, "epoch": 58} {"train_loss": -5.973822116851807, "global_step": 9844, "epoch": 58} {"train_loss": -5.822258949279785, "global_step": 9845, "epoch": 58} {"train_loss": -5.811435699462891, "global_step": 9846, "epoch": 58} {"train_loss": -5.6275105476379395, "global_step": 9847, "epoch": 58} {"train_loss": -6.040153980255127, "global_step": 9848, "epoch": 58} {"train_loss": -5.79695463180542, "global_step": 9849, "epoch": 58} {"train_loss": -6.047818183898926, "global_step": 9850, "epoch": 58} {"train_loss": -5.32764196395874, "global_step": 9851, "epoch": 58} {"train_loss": -5.859601974487305, "global_step": 9852, "epoch": 58} {"train_loss": -5.618520736694336, "global_step": 9853, "epoch": 58} {"train_loss": -5.733915328979492, "global_step": 9854, "epoch": 58} {"train_loss": -5.372381687164307, "global_step": 9855, "epoch": 58} {"train_loss": -5.695403099060059, "global_step": 9856, "epoch": 58} {"train_loss": -5.939964294433594, "global_step": 9857, "epoch": 58} {"train_loss": -5.7053351402282715, "global_step": 9858, "epoch": 58} {"train_loss": -5.825829982757568, "global_step": 9859, "epoch": 58} {"train_loss": -5.6804022789001465, "global_step": 9860, "epoch": 58} {"train_loss": -6.003383636474609, "global_step": 9861, "epoch": 58} {"train_loss": -5.866311073303223, "global_step": 9862, "epoch": 58} {"train_loss": -5.671323299407959, "global_step": 9863, "epoch": 58} {"train_loss": -5.773414611816406, "global_step": 9864, "epoch": 58} {"train_loss": -5.612362861633301, "global_step": 9865, "epoch": 58} {"train_loss": -5.787999153137207, "global_step": 9866, "epoch": 58} {"train_loss": -5.79512882232666, "global_step": 9867, "epoch": 58} {"train_loss": -5.608089923858643, "global_step": 9868, "epoch": 58} {"train_loss": -5.823372840881348, "global_step": 9869, "epoch": 58} {"train_loss": -5.779946327209473, "global_step": 9870, "epoch": 58} {"train_loss": -5.810502052307129, "global_step": 9871, "epoch": 58} {"train_loss": -6.110916614532471, "global_step": 9872, "epoch": 58} {"train_loss": -5.910374164581299, "global_step": 9873, "epoch": 58} {"train_loss": -5.7809038162231445, "global_step": 9874, "epoch": 58} {"train_loss": -5.766491413116455, "global_step": 9875, "epoch": 58} {"train_loss": -5.783095836639404, "global_step": 9876, "epoch": 58} {"train_loss": -6.062054634094238, "global_step": 9877, "epoch": 58} {"train_loss": -5.963478088378906, "global_step": 9878, "epoch": 58} {"train_loss": -6.055368423461914, "global_step": 9879, "epoch": 58} {"train_loss": -5.905898571014404, "global_step": 9880, "epoch": 58} {"train_loss": -6.029679298400879, "global_step": 9881, "epoch": 58} {"train_loss": -5.75726842880249, "global_step": 9882, "epoch": 58} {"train_loss": -5.898460388183594, "global_step": 9883, "epoch": 58} {"train_loss": -5.818663597106934, "global_step": 9884, "epoch": 58} {"train_loss": -5.796289443969727, "global_step": 9885, "epoch": 58} {"train_loss": -5.688513278961182, "global_step": 9886, "epoch": 58} {"train_loss": -5.699106216430664, "global_step": 9887, "epoch": 58} {"train_loss": -5.781898021697998, "global_step": 9888, "epoch": 58} {"train_loss": -5.767974853515625, "global_step": 9889, "epoch": 58} {"train_loss": -5.860667705535889, "global_step": 9890, "epoch": 58} {"train_loss": -5.6465630531311035, "global_step": 9891, "epoch": 58} {"train_loss": -5.7962141036987305, "global_step": 9892, "epoch": 58} {"train_loss": -5.791802406311035, "global_step": 9893, "epoch": 58} {"train_loss": -5.921267509460449, "global_step": 9894, "epoch": 58} {"train_loss": -5.905146598815918, "global_step": 9895, "epoch": 58} {"train_loss": -5.772073268890381, "global_step": 9896, "epoch": 58} {"train_loss": -5.969745635986328, "global_step": 9897, "epoch": 58} {"train_loss": -5.85847282409668, "global_step": 9898, "epoch": 58} {"train_loss": -5.680481910705566, "global_step": 9899, "epoch": 58} {"train_loss": -5.688785552978516, "global_step": 9900, "epoch": 58} {"train_loss": -5.73481559753418, "global_step": 9901, "epoch": 58} {"train_loss": -5.675671577453613, "global_step": 9902, "epoch": 58} {"train_loss": -5.6503448486328125, "global_step": 9903, "epoch": 58} {"train_loss": -5.646155834197998, "global_step": 9904, "epoch": 58} {"train_loss": -6.009217262268066, "global_step": 9905, "epoch": 58} {"train_loss": -5.954869747161865, "global_step": 9906, "epoch": 58} {"train_loss": -5.93978214263916, "global_step": 9907, "epoch": 58} {"train_loss": -5.8093180656433105, "global_step": 9908, "epoch": 58} {"train_loss": -5.86883020401001, "global_step": 9909, "epoch": 58} {"train_loss": -5.893263816833496, "global_step": 9910, "epoch": 58} {"train_loss": -5.750503017788842, "global_step": 9911, "epoch": 58, "val_loss": 262937.03125} {"train_loss": -5.841152191162109, "global_step": 9912, "epoch": 59} {"train_loss": -5.789299964904785, "global_step": 9913, "epoch": 59} {"train_loss": -5.69381046295166, "global_step": 9914, "epoch": 59} {"train_loss": -5.68416690826416, "global_step": 9915, "epoch": 59} {"train_loss": -5.775511741638184, "global_step": 9916, "epoch": 59} {"train_loss": -5.78253173828125, "global_step": 9917, "epoch": 59} {"train_loss": -5.840879917144775, "global_step": 9918, "epoch": 59} {"train_loss": -5.583479404449463, "global_step": 9919, "epoch": 59} {"train_loss": -5.341930389404297, "global_step": 9920, "epoch": 59} {"train_loss": -5.975815773010254, "global_step": 9921, "epoch": 59} {"train_loss": -5.689170837402344, "global_step": 9922, "epoch": 59} {"train_loss": -5.710583686828613, "global_step": 9923, "epoch": 59} {"train_loss": -5.405384063720703, "global_step": 9924, "epoch": 59} {"train_loss": -5.7336225509643555, "global_step": 9925, "epoch": 59} {"train_loss": -5.391282081604004, "global_step": 9926, "epoch": 59} {"train_loss": -5.565506935119629, "global_step": 9927, "epoch": 59} {"train_loss": -5.476927757263184, "global_step": 9928, "epoch": 59} {"train_loss": -5.722261905670166, "global_step": 9929, "epoch": 59} {"train_loss": -5.780231475830078, "global_step": 9930, "epoch": 59} {"train_loss": -5.488575458526611, "global_step": 9931, "epoch": 59} {"train_loss": -5.789029121398926, "global_step": 9932, "epoch": 59} {"train_loss": -5.672708511352539, "global_step": 9933, "epoch": 59} {"train_loss": -5.85526180267334, "global_step": 9934, "epoch": 59} {"train_loss": -5.801003932952881, "global_step": 9935, "epoch": 59} {"train_loss": -5.660460472106934, "global_step": 9936, "epoch": 59} {"train_loss": -5.703508377075195, "global_step": 9937, "epoch": 59} {"train_loss": -5.369207382202148, "global_step": 9938, "epoch": 59} {"train_loss": -5.535417556762695, "global_step": 9939, "epoch": 59} {"train_loss": -5.672944068908691, "global_step": 9940, "epoch": 59} {"train_loss": -5.884037017822266, "global_step": 9941, "epoch": 59} {"train_loss": -5.648669719696045, "global_step": 9942, "epoch": 59} {"train_loss": -5.783805847167969, "global_step": 9943, "epoch": 59} {"train_loss": -5.766872882843018, "global_step": 9944, "epoch": 59} {"train_loss": -5.720604419708252, "global_step": 9945, "epoch": 59} {"train_loss": -5.686180114746094, "global_step": 9946, "epoch": 59} {"train_loss": -5.3738789558410645, "global_step": 9947, "epoch": 59} {"train_loss": -5.679263591766357, "global_step": 9948, "epoch": 59} {"train_loss": -5.810153007507324, "global_step": 9949, "epoch": 59} {"train_loss": -5.837489128112793, "global_step": 9950, "epoch": 59} {"train_loss": -5.6044135093688965, "global_step": 9951, "epoch": 59} {"train_loss": -5.796806812286377, "global_step": 9952, "epoch": 59} {"train_loss": -5.822794437408447, "global_step": 9953, "epoch": 59} {"train_loss": -5.550233840942383, "global_step": 9954, "epoch": 59} {"train_loss": -5.831080436706543, "global_step": 9955, "epoch": 59} {"train_loss": -5.629502773284912, "global_step": 9956, "epoch": 59} {"train_loss": -5.609311103820801, "global_step": 9957, "epoch": 59} {"train_loss": -5.990440368652344, "global_step": 9958, "epoch": 59} {"train_loss": -5.708627700805664, "global_step": 9959, "epoch": 59} {"train_loss": -5.74469518661499, "global_step": 9960, "epoch": 59} {"train_loss": -5.910408973693848, "global_step": 9961, "epoch": 59} {"train_loss": -5.715229034423828, "global_step": 9962, "epoch": 59} {"train_loss": -5.573677062988281, "global_step": 9963, "epoch": 59} {"train_loss": -5.7111663818359375, "global_step": 9964, "epoch": 59} {"train_loss": -5.929409027099609, "global_step": 9965, "epoch": 59} {"train_loss": -5.772668838500977, "global_step": 9966, "epoch": 59} {"train_loss": -5.734999656677246, "global_step": 9967, "epoch": 59} {"train_loss": -5.807823181152344, "global_step": 9968, "epoch": 59} {"train_loss": -5.766784191131592, "global_step": 9969, "epoch": 59} {"train_loss": -5.383445739746094, "global_step": 9970, "epoch": 59} {"train_loss": -5.974025726318359, "global_step": 9971, "epoch": 59} {"train_loss": -5.965989112854004, "global_step": 9972, "epoch": 59} {"train_loss": -5.661481857299805, "global_step": 9973, "epoch": 59} {"train_loss": -5.69903564453125, "global_step": 9974, "epoch": 59} {"train_loss": -5.6692328453063965, "global_step": 9975, "epoch": 59} {"train_loss": -5.853635787963867, "global_step": 9976, "epoch": 59} {"train_loss": -5.560469627380371, "global_step": 9977, "epoch": 59} {"train_loss": -5.721897602081299, "global_step": 9978, "epoch": 59} {"train_loss": -5.803742408752441, "global_step": 9979, "epoch": 59} {"train_loss": -5.786734580993652, "global_step": 9980, "epoch": 59} {"train_loss": -5.889291286468506, "global_step": 9981, "epoch": 59} {"train_loss": -5.92294454574585, "global_step": 9982, "epoch": 59} {"train_loss": -5.9734649658203125, "global_step": 9983, "epoch": 59} {"train_loss": -6.037219524383545, "global_step": 9984, "epoch": 59} {"train_loss": -6.0702409744262695, "global_step": 9985, "epoch": 59} {"train_loss": -5.95318078994751, "global_step": 9986, "epoch": 59} {"train_loss": -5.874700546264648, "global_step": 9987, "epoch": 59} {"train_loss": -5.827954292297363, "global_step": 9988, "epoch": 59} {"train_loss": -5.80377197265625, "global_step": 9989, "epoch": 59} {"train_loss": -5.814268112182617, "global_step": 9990, "epoch": 59} {"train_loss": -5.893679618835449, "global_step": 9991, "epoch": 59} {"train_loss": -6.0711259841918945, "global_step": 9992, "epoch": 59} {"train_loss": -5.892683029174805, "global_step": 9993, "epoch": 59} {"train_loss": -5.588687419891357, "global_step": 9994, "epoch": 59} {"train_loss": -5.8107590675354, "global_step": 9995, "epoch": 59} {"train_loss": -5.985003471374512, "global_step": 9996, "epoch": 59} {"train_loss": -5.822789192199707, "global_step": 9997, "epoch": 59} {"train_loss": -5.963252544403076, "global_step": 9998, "epoch": 59} {"train_loss": -5.993009567260742, "global_step": 9999, "epoch": 59} {"train_loss": -6.032876014709473, "global_step": 10000, "epoch": 59} {"train_loss": -5.5614776611328125, "global_step": 10001, "epoch": 59} {"train_loss": -5.800226211547852, "global_step": 10002, "epoch": 59} {"train_loss": -5.691801071166992, "global_step": 10003, "epoch": 59} {"train_loss": -5.8468546867370605, "global_step": 10004, "epoch": 59} {"train_loss": -5.644745826721191, "global_step": 10005, "epoch": 59} {"train_loss": -5.925596237182617, "global_step": 10006, "epoch": 59} {"train_loss": -5.856822967529297, "global_step": 10007, "epoch": 59} {"train_loss": -5.957627296447754, "global_step": 10008, "epoch": 59} {"train_loss": -5.765355110168457, "global_step": 10009, "epoch": 59} {"train_loss": -5.71964168548584, "global_step": 10010, "epoch": 59} {"train_loss": -5.709306716918945, "global_step": 10011, "epoch": 59} {"train_loss": -5.699036598205566, "global_step": 10012, "epoch": 59} {"train_loss": -5.886087417602539, "global_step": 10013, "epoch": 59} {"train_loss": -5.646434783935547, "global_step": 10014, "epoch": 59} {"train_loss": -5.534100532531738, "global_step": 10015, "epoch": 59} {"train_loss": -5.740023612976074, "global_step": 10016, "epoch": 59} {"train_loss": -5.615146636962891, "global_step": 10017, "epoch": 59} {"train_loss": -5.423727512359619, "global_step": 10018, "epoch": 59} {"train_loss": -5.583573341369629, "global_step": 10019, "epoch": 59} {"train_loss": -5.436445236206055, "global_step": 10020, "epoch": 59} {"train_loss": -5.667494773864746, "global_step": 10021, "epoch": 59} {"train_loss": -5.870336532592773, "global_step": 10022, "epoch": 59} {"train_loss": -5.699563980102539, "global_step": 10023, "epoch": 59} {"train_loss": -5.5275750160217285, "global_step": 10024, "epoch": 59} {"train_loss": -5.682567596435547, "global_step": 10025, "epoch": 59} {"train_loss": -5.5732221603393555, "global_step": 10026, "epoch": 59} {"train_loss": -5.7857208251953125, "global_step": 10027, "epoch": 59} {"train_loss": -5.520108222961426, "global_step": 10028, "epoch": 59} {"train_loss": -5.366656303405762, "global_step": 10029, "epoch": 59} {"train_loss": -5.459246635437012, "global_step": 10030, "epoch": 59} {"train_loss": -5.866194725036621, "global_step": 10031, "epoch": 59} {"train_loss": -5.552616119384766, "global_step": 10032, "epoch": 59} {"train_loss": -5.756217956542969, "global_step": 10033, "epoch": 59} {"train_loss": -5.521664619445801, "global_step": 10034, "epoch": 59} {"train_loss": -5.6575212478637695, "global_step": 10035, "epoch": 59} {"train_loss": -5.8643035888671875, "global_step": 10036, "epoch": 59} {"train_loss": -5.762277126312256, "global_step": 10037, "epoch": 59} {"train_loss": -5.526415824890137, "global_step": 10038, "epoch": 59} {"train_loss": -5.683065891265869, "global_step": 10039, "epoch": 59} {"train_loss": -5.926217079162598, "global_step": 10040, "epoch": 59} {"train_loss": -5.7397003173828125, "global_step": 10041, "epoch": 59} {"train_loss": -5.815303325653076, "global_step": 10042, "epoch": 59} {"train_loss": -5.698726654052734, "global_step": 10043, "epoch": 59} {"train_loss": -5.846276760101318, "global_step": 10044, "epoch": 59} {"train_loss": -5.884439945220947, "global_step": 10045, "epoch": 59} {"train_loss": -6.119748115539551, "global_step": 10046, "epoch": 59} {"train_loss": -6.067543029785156, "global_step": 10047, "epoch": 59} {"train_loss": -6.055804252624512, "global_step": 10048, "epoch": 59} {"train_loss": -5.976498126983643, "global_step": 10049, "epoch": 59} {"train_loss": -5.765188217163086, "global_step": 10050, "epoch": 59} {"train_loss": -6.035534858703613, "global_step": 10051, "epoch": 59} {"train_loss": -5.914677619934082, "global_step": 10052, "epoch": 59} {"train_loss": -5.604638576507568, "global_step": 10053, "epoch": 59} {"train_loss": -5.813103675842285, "global_step": 10054, "epoch": 59} {"train_loss": -5.932793617248535, "global_step": 10055, "epoch": 59} {"train_loss": -6.023423671722412, "global_step": 10056, "epoch": 59} {"train_loss": -5.921045303344727, "global_step": 10057, "epoch": 59} {"train_loss": -5.765838623046875, "global_step": 10058, "epoch": 59} {"train_loss": -5.699979305267334, "global_step": 10059, "epoch": 59} {"train_loss": -5.857084274291992, "global_step": 10060, "epoch": 59} {"train_loss": -5.78391695022583, "global_step": 10061, "epoch": 59} {"train_loss": -5.815733432769775, "global_step": 10062, "epoch": 59} {"train_loss": -5.9028778076171875, "global_step": 10063, "epoch": 59} {"train_loss": -5.576396942138672, "global_step": 10064, "epoch": 59} {"train_loss": -5.688843250274658, "global_step": 10065, "epoch": 59} {"train_loss": -5.844363689422607, "global_step": 10066, "epoch": 59} {"train_loss": -5.884469032287598, "global_step": 10067, "epoch": 59} {"train_loss": -6.031211853027344, "global_step": 10068, "epoch": 59} {"train_loss": -5.947212219238281, "global_step": 10069, "epoch": 59} {"train_loss": -5.862001419067383, "global_step": 10070, "epoch": 59} {"train_loss": -5.9854655265808105, "global_step": 10071, "epoch": 59} {"train_loss": -6.097268581390381, "global_step": 10072, "epoch": 59} {"train_loss": -5.7037153244018555, "global_step": 10073, "epoch": 59} {"train_loss": -5.716038703918457, "global_step": 10074, "epoch": 59} {"train_loss": -5.7475128173828125, "global_step": 10075, "epoch": 59} {"train_loss": -6.082298278808594, "global_step": 10076, "epoch": 59} {"train_loss": -5.739767551422119, "global_step": 10077, "epoch": 59} {"train_loss": -5.699376583099365, "global_step": 10078, "epoch": 59} {"train_loss": -5.758212237131028, "global_step": 10079, "epoch": 59, "val_loss": 261717.1875} {"train_loss": -5.857763290405273, "global_step": 10080, "epoch": 60} {"train_loss": -5.806525707244873, "global_step": 10081, "epoch": 60} {"train_loss": -5.847487449645996, "global_step": 10082, "epoch": 60} {"train_loss": -5.801547050476074, "global_step": 10083, "epoch": 60} {"train_loss": -5.5941925048828125, "global_step": 10084, "epoch": 60} {"train_loss": -5.762600421905518, "global_step": 10085, "epoch": 60} {"train_loss": -5.976383209228516, "global_step": 10086, "epoch": 60} {"train_loss": -5.393832206726074, "global_step": 10087, "epoch": 60} {"train_loss": -5.268308639526367, "global_step": 10088, "epoch": 60} {"train_loss": -5.9156813621521, "global_step": 10089, "epoch": 60} {"train_loss": -5.752910614013672, "global_step": 10090, "epoch": 60} {"train_loss": -5.59502649307251, "global_step": 10091, "epoch": 60} {"train_loss": -5.563920021057129, "global_step": 10092, "epoch": 60} {"train_loss": -5.829962730407715, "global_step": 10093, "epoch": 60} {"train_loss": -5.633849143981934, "global_step": 10094, "epoch": 60} {"train_loss": -5.756829261779785, "global_step": 10095, "epoch": 60} {"train_loss": -5.688597679138184, "global_step": 10096, "epoch": 60} {"train_loss": -5.45650053024292, "global_step": 10097, "epoch": 60} {"train_loss": -5.851865291595459, "global_step": 10098, "epoch": 60} {"train_loss": -5.628782272338867, "global_step": 10099, "epoch": 60} {"train_loss": -5.57796049118042, "global_step": 10100, "epoch": 60} {"train_loss": -5.306123733520508, "global_step": 10101, "epoch": 60} {"train_loss": -5.545953750610352, "global_step": 10102, "epoch": 60} {"train_loss": -5.6987833976745605, "global_step": 10103, "epoch": 60} {"train_loss": -5.927862167358398, "global_step": 10104, "epoch": 60} {"train_loss": -5.584442615509033, "global_step": 10105, "epoch": 60} {"train_loss": -5.796513080596924, "global_step": 10106, "epoch": 60} {"train_loss": -5.760585784912109, "global_step": 10107, "epoch": 60} {"train_loss": -5.884847640991211, "global_step": 10108, "epoch": 60} {"train_loss": -5.9541449546813965, "global_step": 10109, "epoch": 60} {"train_loss": -5.938774108886719, "global_step": 10110, "epoch": 60} {"train_loss": -5.629075050354004, "global_step": 10111, "epoch": 60} {"train_loss": -5.970349311828613, "global_step": 10112, "epoch": 60} {"train_loss": -5.908453941345215, "global_step": 10113, "epoch": 60} {"train_loss": -5.862244606018066, "global_step": 10114, "epoch": 60} {"train_loss": -5.781198501586914, "global_step": 10115, "epoch": 60} {"train_loss": -5.814178466796875, "global_step": 10116, "epoch": 60} {"train_loss": -5.496829509735107, "global_step": 10117, "epoch": 60} {"train_loss": -5.611549377441406, "global_step": 10118, "epoch": 60} {"train_loss": -5.832955360412598, "global_step": 10119, "epoch": 60} {"train_loss": -5.694352149963379, "global_step": 10120, "epoch": 60} {"train_loss": -5.704936981201172, "global_step": 10121, "epoch": 60} {"train_loss": -5.565806865692139, "global_step": 10122, "epoch": 60} {"train_loss": -5.800134658813477, "global_step": 10123, "epoch": 60} {"train_loss": -5.705822944641113, "global_step": 10124, "epoch": 60} {"train_loss": -5.728762626647949, "global_step": 10125, "epoch": 60} {"train_loss": -5.727615833282471, "global_step": 10126, "epoch": 60} {"train_loss": -6.018703460693359, "global_step": 10127, "epoch": 60} {"train_loss": -5.582616806030273, "global_step": 10128, "epoch": 60} {"train_loss": -5.699145793914795, "global_step": 10129, "epoch": 60} {"train_loss": -5.4777984619140625, "global_step": 10130, "epoch": 60} {"train_loss": -5.663189888000488, "global_step": 10131, "epoch": 60} {"train_loss": -5.929922103881836, "global_step": 10132, "epoch": 60} {"train_loss": -5.930405616760254, "global_step": 10133, "epoch": 60} {"train_loss": -5.987613201141357, "global_step": 10134, "epoch": 60} {"train_loss": -5.708793640136719, "global_step": 10135, "epoch": 60} {"train_loss": -5.9293622970581055, "global_step": 10136, "epoch": 60} {"train_loss": -5.914513111114502, "global_step": 10137, "epoch": 60} {"train_loss": -5.9787821769714355, "global_step": 10138, "epoch": 60} {"train_loss": -5.7588701248168945, "global_step": 10139, "epoch": 60} {"train_loss": -5.501869201660156, "global_step": 10140, "epoch": 60} {"train_loss": -5.550848960876465, "global_step": 10141, "epoch": 60} {"train_loss": -5.859968662261963, "global_step": 10142, "epoch": 60} {"train_loss": -5.935257434844971, "global_step": 10143, "epoch": 60} {"train_loss": -5.826612949371338, "global_step": 10144, "epoch": 60} {"train_loss": -5.770542621612549, "global_step": 10145, "epoch": 60} {"train_loss": -5.872603416442871, "global_step": 10146, "epoch": 60} {"train_loss": -5.806824684143066, "global_step": 10147, "epoch": 60} {"train_loss": -5.703612327575684, "global_step": 10148, "epoch": 60} {"train_loss": -5.899585247039795, "global_step": 10149, "epoch": 60} {"train_loss": -5.831067085266113, "global_step": 10150, "epoch": 60} {"train_loss": -5.812329292297363, "global_step": 10151, "epoch": 60} {"train_loss": -5.866074562072754, "global_step": 10152, "epoch": 60} {"train_loss": -5.844954013824463, "global_step": 10153, "epoch": 60} {"train_loss": -5.807252883911133, "global_step": 10154, "epoch": 60} {"train_loss": -6.002062797546387, "global_step": 10155, "epoch": 60} {"train_loss": -5.898497104644775, "global_step": 10156, "epoch": 60} {"train_loss": -5.836498737335205, "global_step": 10157, "epoch": 60} {"train_loss": -5.764651298522949, "global_step": 10158, "epoch": 60} {"train_loss": -5.688404083251953, "global_step": 10159, "epoch": 60} {"train_loss": -5.849237442016602, "global_step": 10160, "epoch": 60} {"train_loss": -5.780827522277832, "global_step": 10161, "epoch": 60} {"train_loss": -5.952871322631836, "global_step": 10162, "epoch": 60} {"train_loss": -5.615715026855469, "global_step": 10163, "epoch": 60} {"train_loss": -5.916504383087158, "global_step": 10164, "epoch": 60} {"train_loss": -5.831090927124023, "global_step": 10165, "epoch": 60} {"train_loss": -5.8918232917785645, "global_step": 10166, "epoch": 60} {"train_loss": -5.933438777923584, "global_step": 10167, "epoch": 60} {"train_loss": -5.722899913787842, "global_step": 10168, "epoch": 60} {"train_loss": -5.867123126983643, "global_step": 10169, "epoch": 60} {"train_loss": -5.803431987762451, "global_step": 10170, "epoch": 60} {"train_loss": -5.959259033203125, "global_step": 10171, "epoch": 60} {"train_loss": -6.075215816497803, "global_step": 10172, "epoch": 60} {"train_loss": -6.122647285461426, "global_step": 10173, "epoch": 60} {"train_loss": -5.962528228759766, "global_step": 10174, "epoch": 60} {"train_loss": -5.813995361328125, "global_step": 10175, "epoch": 60} {"train_loss": -5.798675060272217, "global_step": 10176, "epoch": 60} {"train_loss": -5.9324493408203125, "global_step": 10177, "epoch": 60} {"train_loss": -5.892064571380615, "global_step": 10178, "epoch": 60} {"train_loss": -5.881343841552734, "global_step": 10179, "epoch": 60} {"train_loss": -5.821420192718506, "global_step": 10180, "epoch": 60} {"train_loss": -5.847897529602051, "global_step": 10181, "epoch": 60} {"train_loss": -5.918858528137207, "global_step": 10182, "epoch": 60} {"train_loss": -5.820992469787598, "global_step": 10183, "epoch": 60} {"train_loss": -5.926568031311035, "global_step": 10184, "epoch": 60} {"train_loss": -5.641833305358887, "global_step": 10185, "epoch": 60} {"train_loss": -5.955508232116699, "global_step": 10186, "epoch": 60} {"train_loss": -6.0795111656188965, "global_step": 10187, "epoch": 60} {"train_loss": -5.895656585693359, "global_step": 10188, "epoch": 60} {"train_loss": -5.945525646209717, "global_step": 10189, "epoch": 60} {"train_loss": -5.994894504547119, "global_step": 10190, "epoch": 60} {"train_loss": -5.726497650146484, "global_step": 10191, "epoch": 60} {"train_loss": -6.113114356994629, "global_step": 10192, "epoch": 60} {"train_loss": -5.622568130493164, "global_step": 10193, "epoch": 60} {"train_loss": -5.976548671722412, "global_step": 10194, "epoch": 60} {"train_loss": -5.850757598876953, "global_step": 10195, "epoch": 60} {"train_loss": -5.958922863006592, "global_step": 10196, "epoch": 60} {"train_loss": -5.491302490234375, "global_step": 10197, "epoch": 60} {"train_loss": -5.718628406524658, "global_step": 10198, "epoch": 60} {"train_loss": -5.931689739227295, "global_step": 10199, "epoch": 60} {"train_loss": -5.8515729904174805, "global_step": 10200, "epoch": 60} {"train_loss": -5.961421012878418, "global_step": 10201, "epoch": 60} {"train_loss": -5.857491970062256, "global_step": 10202, "epoch": 60} {"train_loss": -5.664313316345215, "global_step": 10203, "epoch": 60} {"train_loss": -5.809816360473633, "global_step": 10204, "epoch": 60} {"train_loss": -5.597285270690918, "global_step": 10205, "epoch": 60} {"train_loss": -5.889951229095459, "global_step": 10206, "epoch": 60} {"train_loss": -5.718533515930176, "global_step": 10207, "epoch": 60} {"train_loss": -6.043408393859863, "global_step": 10208, "epoch": 60} {"train_loss": -5.701836109161377, "global_step": 10209, "epoch": 60} {"train_loss": -5.830564498901367, "global_step": 10210, "epoch": 60} {"train_loss": -5.954327583312988, "global_step": 10211, "epoch": 60} {"train_loss": -5.682065963745117, "global_step": 10212, "epoch": 60} {"train_loss": -6.110207557678223, "global_step": 10213, "epoch": 60} {"train_loss": -6.017746925354004, "global_step": 10214, "epoch": 60} {"train_loss": -5.790256023406982, "global_step": 10215, "epoch": 60} {"train_loss": -6.037336349487305, "global_step": 10216, "epoch": 60} {"train_loss": -5.840555667877197, "global_step": 10217, "epoch": 60} {"train_loss": -5.5739054679870605, "global_step": 10218, "epoch": 60} {"train_loss": -5.882656097412109, "global_step": 10219, "epoch": 60} {"train_loss": -5.836517810821533, "global_step": 10220, "epoch": 60} {"train_loss": -6.092348575592041, "global_step": 10221, "epoch": 60} {"train_loss": -5.8134050369262695, "global_step": 10222, "epoch": 60} {"train_loss": -5.933097839355469, "global_step": 10223, "epoch": 60} {"train_loss": -5.730585098266602, "global_step": 10224, "epoch": 60} {"train_loss": -5.690245628356934, "global_step": 10225, "epoch": 60} {"train_loss": -5.693548679351807, "global_step": 10226, "epoch": 60} {"train_loss": -5.732858657836914, "global_step": 10227, "epoch": 60} {"train_loss": -5.817782878875732, "global_step": 10228, "epoch": 60} {"train_loss": -5.851379871368408, "global_step": 10229, "epoch": 60} {"train_loss": -5.946742534637451, "global_step": 10230, "epoch": 60} {"train_loss": -5.684089183807373, "global_step": 10231, "epoch": 60} {"train_loss": -5.70499324798584, "global_step": 10232, "epoch": 60} {"train_loss": -5.8405609130859375, "global_step": 10233, "epoch": 60} {"train_loss": -5.730849266052246, "global_step": 10234, "epoch": 60} {"train_loss": -5.6742143630981445, "global_step": 10235, "epoch": 60} {"train_loss": -5.772464752197266, "global_step": 10236, "epoch": 60} {"train_loss": -5.735696792602539, "global_step": 10237, "epoch": 60} {"train_loss": -5.479922294616699, "global_step": 10238, "epoch": 60} {"train_loss": -5.771045207977295, "global_step": 10239, "epoch": 60} {"train_loss": -5.429324150085449, "global_step": 10240, "epoch": 60} {"train_loss": -5.736642837524414, "global_step": 10241, "epoch": 60} {"train_loss": -5.762734413146973, "global_step": 10242, "epoch": 60} {"train_loss": -5.669270038604736, "global_step": 10243, "epoch": 60} {"train_loss": -5.694599151611328, "global_step": 10244, "epoch": 60} {"train_loss": -5.803184509277344, "global_step": 10245, "epoch": 60} {"train_loss": -5.609004974365234, "global_step": 10246, "epoch": 60} {"train_loss": -5.793854855355763, "global_step": 10247, "epoch": 60, "val_loss": 262815.96875, "train_action_mse_error": 48.91304016113281} {"train_loss": -5.693825721740723, "global_step": 10248, "epoch": 61} {"train_loss": -5.87398099899292, "global_step": 10249, "epoch": 61} {"train_loss": -5.782767295837402, "global_step": 10250, "epoch": 61} {"train_loss": -5.636962413787842, "global_step": 10251, "epoch": 61} {"train_loss": -5.8980817794799805, "global_step": 10252, "epoch": 61} {"train_loss": -5.661549091339111, "global_step": 10253, "epoch": 61} {"train_loss": -5.324800491333008, "global_step": 10254, "epoch": 61} {"train_loss": -6.154723167419434, "global_step": 10255, "epoch": 61} {"train_loss": -5.842577934265137, "global_step": 10256, "epoch": 61} {"train_loss": -5.509406089782715, "global_step": 10257, "epoch": 61} {"train_loss": -5.7959885597229, "global_step": 10258, "epoch": 61} {"train_loss": -5.601945400238037, "global_step": 10259, "epoch": 61} {"train_loss": -6.039134979248047, "global_step": 10260, "epoch": 61} {"train_loss": -5.586938381195068, "global_step": 10261, "epoch": 61} {"train_loss": -5.720010280609131, "global_step": 10262, "epoch": 61} {"train_loss": -5.733416557312012, "global_step": 10263, "epoch": 61} {"train_loss": -5.836494445800781, "global_step": 10264, "epoch": 61} {"train_loss": -5.797583103179932, "global_step": 10265, "epoch": 61} {"train_loss": -5.56809139251709, "global_step": 10266, "epoch": 61} {"train_loss": -5.797153472900391, "global_step": 10267, "epoch": 61} {"train_loss": -5.882179260253906, "global_step": 10268, "epoch": 61} {"train_loss": -5.9091925621032715, "global_step": 10269, "epoch": 61} {"train_loss": -6.005802631378174, "global_step": 10270, "epoch": 61} {"train_loss": -5.763772964477539, "global_step": 10271, "epoch": 61} {"train_loss": -6.098794937133789, "global_step": 10272, "epoch": 61} {"train_loss": -5.882536888122559, "global_step": 10273, "epoch": 61} {"train_loss": -5.590132713317871, "global_step": 10274, "epoch": 61} {"train_loss": -5.971802711486816, "global_step": 10275, "epoch": 61} {"train_loss": -6.126705169677734, "global_step": 10276, "epoch": 61} {"train_loss": -6.009552955627441, "global_step": 10277, "epoch": 61} {"train_loss": -5.872754096984863, "global_step": 10278, "epoch": 61} {"train_loss": -6.044471740722656, "global_step": 10279, "epoch": 61} {"train_loss": -5.91269063949585, "global_step": 10280, "epoch": 61} {"train_loss": -5.8743977546691895, "global_step": 10281, "epoch": 61} {"train_loss": -5.6429548263549805, "global_step": 10282, "epoch": 61} {"train_loss": -5.976922988891602, "global_step": 10283, "epoch": 61} {"train_loss": -5.490874767303467, "global_step": 10284, "epoch": 61} {"train_loss": -5.588813304901123, "global_step": 10285, "epoch": 61} {"train_loss": -5.797340393066406, "global_step": 10286, "epoch": 61} {"train_loss": -5.586170196533203, "global_step": 10287, "epoch": 61} {"train_loss": -5.765312194824219, "global_step": 10288, "epoch": 61} {"train_loss": -5.732581615447998, "global_step": 10289, "epoch": 61} {"train_loss": -5.464568614959717, "global_step": 10290, "epoch": 61} {"train_loss": -5.923469543457031, "global_step": 10291, "epoch": 61} {"train_loss": -5.795819282531738, "global_step": 10292, "epoch": 61} {"train_loss": -5.7602362632751465, "global_step": 10293, "epoch": 61} {"train_loss": -5.624277591705322, "global_step": 10294, "epoch": 61} {"train_loss": -5.650493621826172, "global_step": 10295, "epoch": 61} {"train_loss": -5.622314929962158, "global_step": 10296, "epoch": 61} {"train_loss": -5.772111415863037, "global_step": 10297, "epoch": 61} {"train_loss": -5.565673351287842, "global_step": 10298, "epoch": 61} {"train_loss": -5.6598076820373535, "global_step": 10299, "epoch": 61} {"train_loss": -5.768158912658691, "global_step": 10300, "epoch": 61} {"train_loss": -5.352451801300049, "global_step": 10301, "epoch": 61} {"train_loss": -5.558834552764893, "global_step": 10302, "epoch": 61} {"train_loss": -5.461032867431641, "global_step": 10303, "epoch": 61} {"train_loss": -5.504602432250977, "global_step": 10304, "epoch": 61} {"train_loss": -5.674840450286865, "global_step": 10305, "epoch": 61} {"train_loss": -5.853034973144531, "global_step": 10306, "epoch": 61} {"train_loss": -5.7302141189575195, "global_step": 10307, "epoch": 61} {"train_loss": -5.836539268493652, "global_step": 10308, "epoch": 61} {"train_loss": -5.703248500823975, "global_step": 10309, "epoch": 61} {"train_loss": -5.884430885314941, "global_step": 10310, "epoch": 61} {"train_loss": -5.989081382751465, "global_step": 10311, "epoch": 61} {"train_loss": -5.5340423583984375, "global_step": 10312, "epoch": 61} {"train_loss": -5.783535003662109, "global_step": 10313, "epoch": 61} {"train_loss": -5.7138352394104, "global_step": 10314, "epoch": 61} {"train_loss": -5.720749855041504, "global_step": 10315, "epoch": 61} {"train_loss": -5.770666122436523, "global_step": 10316, "epoch": 61} {"train_loss": -5.76171875, "global_step": 10317, "epoch": 61} {"train_loss": -5.462263107299805, "global_step": 10318, "epoch": 61} {"train_loss": -6.100406646728516, "global_step": 10319, "epoch": 61} {"train_loss": -5.967241287231445, "global_step": 10320, "epoch": 61} {"train_loss": -5.729589939117432, "global_step": 10321, "epoch": 61} {"train_loss": -5.824723243713379, "global_step": 10322, "epoch": 61} {"train_loss": -5.735723495483398, "global_step": 10323, "epoch": 61} {"train_loss": -5.860762596130371, "global_step": 10324, "epoch": 61} {"train_loss": -5.833565711975098, "global_step": 10325, "epoch": 61} {"train_loss": -5.915548324584961, "global_step": 10326, "epoch": 61} {"train_loss": -5.786048889160156, "global_step": 10327, "epoch": 61} {"train_loss": -5.805090427398682, "global_step": 10328, "epoch": 61} {"train_loss": -5.953334331512451, "global_step": 10329, "epoch": 61} {"train_loss": -5.895187854766846, "global_step": 10330, "epoch": 61} {"train_loss": -5.974641799926758, "global_step": 10331, "epoch": 61} {"train_loss": -5.8719282150268555, "global_step": 10332, "epoch": 61} {"train_loss": -5.971548557281494, "global_step": 10333, "epoch": 61} {"train_loss": -6.13662052154541, "global_step": 10334, "epoch": 61} {"train_loss": -6.004110813140869, "global_step": 10335, "epoch": 61} {"train_loss": -6.030058860778809, "global_step": 10336, "epoch": 61} {"train_loss": -6.055792331695557, "global_step": 10337, "epoch": 61} {"train_loss": -6.171669960021973, "global_step": 10338, "epoch": 61} {"train_loss": -5.912946701049805, "global_step": 10339, "epoch": 61} {"train_loss": -6.22078275680542, "global_step": 10340, "epoch": 61} {"train_loss": -5.889822483062744, "global_step": 10341, "epoch": 61} {"train_loss": -5.711269378662109, "global_step": 10342, "epoch": 61} {"train_loss": -5.814766883850098, "global_step": 10343, "epoch": 61} {"train_loss": -5.876743316650391, "global_step": 10344, "epoch": 61} {"train_loss": -5.942440032958984, "global_step": 10345, "epoch": 61} {"train_loss": -5.617588996887207, "global_step": 10346, "epoch": 61} {"train_loss": -5.96632719039917, "global_step": 10347, "epoch": 61} {"train_loss": -5.633237838745117, "global_step": 10348, "epoch": 61} {"train_loss": -5.892629623413086, "global_step": 10349, "epoch": 61} {"train_loss": -5.495428085327148, "global_step": 10350, "epoch": 61} {"train_loss": -5.707201957702637, "global_step": 10351, "epoch": 61} {"train_loss": -5.687811851501465, "global_step": 10352, "epoch": 61} {"train_loss": -5.745811462402344, "global_step": 10353, "epoch": 61} {"train_loss": -5.811697483062744, "global_step": 10354, "epoch": 61} {"train_loss": -5.94047212600708, "global_step": 10355, "epoch": 61} {"train_loss": -5.56472110748291, "global_step": 10356, "epoch": 61} {"train_loss": -5.734840393066406, "global_step": 10357, "epoch": 61} {"train_loss": -5.892319679260254, "global_step": 10358, "epoch": 61} {"train_loss": -5.863514423370361, "global_step": 10359, "epoch": 61} {"train_loss": -5.834702491760254, "global_step": 10360, "epoch": 61} {"train_loss": -5.756685256958008, "global_step": 10361, "epoch": 61} {"train_loss": -5.683629989624023, "global_step": 10362, "epoch": 61} {"train_loss": -5.7049407958984375, "global_step": 10363, "epoch": 61} {"train_loss": -5.699613094329834, "global_step": 10364, "epoch": 61} {"train_loss": -5.81134033203125, "global_step": 10365, "epoch": 61} {"train_loss": -5.807216644287109, "global_step": 10366, "epoch": 61} {"train_loss": -5.601068019866943, "global_step": 10367, "epoch": 61} {"train_loss": -5.951885223388672, "global_step": 10368, "epoch": 61} {"train_loss": -5.7768096923828125, "global_step": 10369, "epoch": 61} {"train_loss": -6.074296951293945, "global_step": 10370, "epoch": 61} {"train_loss": -5.729104995727539, "global_step": 10371, "epoch": 61} {"train_loss": -5.919056415557861, "global_step": 10372, "epoch": 61} {"train_loss": -5.674427032470703, "global_step": 10373, "epoch": 61} {"train_loss": -5.5818772315979, "global_step": 10374, "epoch": 61} {"train_loss": -5.629594802856445, "global_step": 10375, "epoch": 61} {"train_loss": -5.763258934020996, "global_step": 10376, "epoch": 61} {"train_loss": -5.777043342590332, "global_step": 10377, "epoch": 61} {"train_loss": -5.5576958656311035, "global_step": 10378, "epoch": 61} {"train_loss": -5.719729423522949, "global_step": 10379, "epoch": 61} {"train_loss": -5.785163402557373, "global_step": 10380, "epoch": 61} {"train_loss": -5.612816333770752, "global_step": 10381, "epoch": 61} {"train_loss": -5.664524078369141, "global_step": 10382, "epoch": 61} {"train_loss": -5.604073524475098, "global_step": 10383, "epoch": 61} {"train_loss": -5.733432292938232, "global_step": 10384, "epoch": 61} {"train_loss": -5.85054874420166, "global_step": 10385, "epoch": 61} {"train_loss": -5.707838535308838, "global_step": 10386, "epoch": 61} {"train_loss": -5.7858734130859375, "global_step": 10387, "epoch": 61} {"train_loss": -5.526918411254883, "global_step": 10388, "epoch": 61} {"train_loss": -5.794768333435059, "global_step": 10389, "epoch": 61} {"train_loss": -5.886422157287598, "global_step": 10390, "epoch": 61} {"train_loss": -5.462520122528076, "global_step": 10391, "epoch": 61} {"train_loss": -6.073714256286621, "global_step": 10392, "epoch": 61} {"train_loss": -5.587108612060547, "global_step": 10393, "epoch": 61} {"train_loss": -5.742959976196289, "global_step": 10394, "epoch": 61} {"train_loss": -5.755485534667969, "global_step": 10395, "epoch": 61} {"train_loss": -5.646824836730957, "global_step": 10396, "epoch": 61} {"train_loss": -5.819383144378662, "global_step": 10397, "epoch": 61} {"train_loss": -5.704748153686523, "global_step": 10398, "epoch": 61} {"train_loss": -5.588944911956787, "global_step": 10399, "epoch": 61} {"train_loss": -5.851018905639648, "global_step": 10400, "epoch": 61} {"train_loss": -5.68338680267334, "global_step": 10401, "epoch": 61} {"train_loss": -5.584504127502441, "global_step": 10402, "epoch": 61} {"train_loss": -5.705104827880859, "global_step": 10403, "epoch": 61} {"train_loss": -6.030682563781738, "global_step": 10404, "epoch": 61} {"train_loss": -5.774106025695801, "global_step": 10405, "epoch": 61} {"train_loss": -6.116744041442871, "global_step": 10406, "epoch": 61} {"train_loss": -5.888765335083008, "global_step": 10407, "epoch": 61} {"train_loss": -5.832232475280762, "global_step": 10408, "epoch": 61} {"train_loss": -5.629261016845703, "global_step": 10409, "epoch": 61} {"train_loss": -5.83918571472168, "global_step": 10410, "epoch": 61} {"train_loss": -5.983759880065918, "global_step": 10411, "epoch": 61} {"train_loss": -5.791662693023682, "global_step": 10412, "epoch": 61} {"train_loss": -5.979543685913086, "global_step": 10413, "epoch": 61} {"train_loss": -5.794551372528076, "global_step": 10414, "epoch": 61} {"train_loss": -5.783122894309816, "global_step": 10415, "epoch": 61, "val_loss": 256043.921875} {"train_loss": -5.592499732971191, "global_step": 10416, "epoch": 62} {"train_loss": -5.860194206237793, "global_step": 10417, "epoch": 62} {"train_loss": -5.8845062255859375, "global_step": 10418, "epoch": 62} {"train_loss": -5.873106479644775, "global_step": 10419, "epoch": 62} {"train_loss": -5.841204643249512, "global_step": 10420, "epoch": 62} {"train_loss": -5.816366195678711, "global_step": 10421, "epoch": 62} {"train_loss": -5.690841197967529, "global_step": 10422, "epoch": 62} {"train_loss": -5.9397125244140625, "global_step": 10423, "epoch": 62} {"train_loss": -5.88074254989624, "global_step": 10424, "epoch": 62} {"train_loss": -5.866171836853027, "global_step": 10425, "epoch": 62} {"train_loss": -5.643153190612793, "global_step": 10426, "epoch": 62} {"train_loss": -5.763497829437256, "global_step": 10427, "epoch": 62} {"train_loss": -5.576492786407471, "global_step": 10428, "epoch": 62} {"train_loss": -5.658529281616211, "global_step": 10429, "epoch": 62} {"train_loss": -5.594038009643555, "global_step": 10430, "epoch": 62} {"train_loss": -5.916836738586426, "global_step": 10431, "epoch": 62} {"train_loss": -6.025718688964844, "global_step": 10432, "epoch": 62} {"train_loss": -5.533318042755127, "global_step": 10433, "epoch": 62} {"train_loss": -5.807531356811523, "global_step": 10434, "epoch": 62} {"train_loss": -5.888583183288574, "global_step": 10435, "epoch": 62} {"train_loss": -5.731523513793945, "global_step": 10436, "epoch": 62} {"train_loss": -5.658141613006592, "global_step": 10437, "epoch": 62} {"train_loss": -5.712386608123779, "global_step": 10438, "epoch": 62} {"train_loss": -5.9564714431762695, "global_step": 10439, "epoch": 62} {"train_loss": -5.571169853210449, "global_step": 10440, "epoch": 62} {"train_loss": -5.59804630279541, "global_step": 10441, "epoch": 62} {"train_loss": -5.6691412925720215, "global_step": 10442, "epoch": 62} {"train_loss": -5.750896453857422, "global_step": 10443, "epoch": 62} {"train_loss": -5.793845176696777, "global_step": 10444, "epoch": 62} {"train_loss": -5.770488739013672, "global_step": 10445, "epoch": 62} {"train_loss": -5.907290458679199, "global_step": 10446, "epoch": 62} {"train_loss": -5.875522136688232, "global_step": 10447, "epoch": 62} {"train_loss": -5.384816646575928, "global_step": 10448, "epoch": 62} {"train_loss": -5.7865214347839355, "global_step": 10449, "epoch": 62} {"train_loss": -5.650239944458008, "global_step": 10450, "epoch": 62} {"train_loss": -5.753106117248535, "global_step": 10451, "epoch": 62} {"train_loss": -5.921346664428711, "global_step": 10452, "epoch": 62} {"train_loss": -5.765652656555176, "global_step": 10453, "epoch": 62} {"train_loss": -5.777655124664307, "global_step": 10454, "epoch": 62} {"train_loss": -5.745172500610352, "global_step": 10455, "epoch": 62} {"train_loss": -5.894145965576172, "global_step": 10456, "epoch": 62} {"train_loss": -5.9720025062561035, "global_step": 10457, "epoch": 62} {"train_loss": -5.672694206237793, "global_step": 10458, "epoch": 62} {"train_loss": -5.572849273681641, "global_step": 10459, "epoch": 62} {"train_loss": -5.8961100578308105, "global_step": 10460, "epoch": 62} {"train_loss": -5.704429626464844, "global_step": 10461, "epoch": 62} {"train_loss": -6.0151214599609375, "global_step": 10462, "epoch": 62} {"train_loss": -5.776049613952637, "global_step": 10463, "epoch": 62} {"train_loss": -5.883479118347168, "global_step": 10464, "epoch": 62} {"train_loss": -5.850571155548096, "global_step": 10465, "epoch": 62} {"train_loss": -5.907379150390625, "global_step": 10466, "epoch": 62} {"train_loss": -5.7678422927856445, "global_step": 10467, "epoch": 62} {"train_loss": -5.5923357009887695, "global_step": 10468, "epoch": 62} {"train_loss": -5.793636322021484, "global_step": 10469, "epoch": 62} {"train_loss": -5.87868070602417, "global_step": 10470, "epoch": 62} {"train_loss": -5.813051700592041, "global_step": 10471, "epoch": 62} {"train_loss": -6.033205032348633, "global_step": 10472, "epoch": 62} {"train_loss": -5.66278076171875, "global_step": 10473, "epoch": 62} {"train_loss": -5.677358150482178, "global_step": 10474, "epoch": 62} {"train_loss": -6.029026031494141, "global_step": 10475, "epoch": 62} {"train_loss": -6.005558967590332, "global_step": 10476, "epoch": 62} {"train_loss": -5.991551399230957, "global_step": 10477, "epoch": 62} {"train_loss": -6.062263488769531, "global_step": 10478, "epoch": 62} {"train_loss": -5.958649635314941, "global_step": 10479, "epoch": 62} {"train_loss": -5.436473846435547, "global_step": 10480, "epoch": 62} {"train_loss": -5.8222198486328125, "global_step": 10481, "epoch": 62} {"train_loss": -5.804721832275391, "global_step": 10482, "epoch": 62} {"train_loss": -5.769701957702637, "global_step": 10483, "epoch": 62} {"train_loss": -6.022759914398193, "global_step": 10484, "epoch": 62} {"train_loss": -5.917539596557617, "global_step": 10485, "epoch": 62} {"train_loss": -5.530580520629883, "global_step": 10486, "epoch": 62} {"train_loss": -5.702829837799072, "global_step": 10487, "epoch": 62} {"train_loss": -6.011240482330322, "global_step": 10488, "epoch": 62} {"train_loss": -5.779092311859131, "global_step": 10489, "epoch": 62} {"train_loss": -5.888592720031738, "global_step": 10490, "epoch": 62} {"train_loss": -6.016005516052246, "global_step": 10491, "epoch": 62} {"train_loss": -5.644733428955078, "global_step": 10492, "epoch": 62} {"train_loss": -5.760727882385254, "global_step": 10493, "epoch": 62} {"train_loss": -5.80264949798584, "global_step": 10494, "epoch": 62} {"train_loss": -5.817411422729492, "global_step": 10495, "epoch": 62} {"train_loss": -5.748676300048828, "global_step": 10496, "epoch": 62} {"train_loss": -6.027256488800049, "global_step": 10497, "epoch": 62} {"train_loss": -5.836991786956787, "global_step": 10498, "epoch": 62} {"train_loss": -5.856295108795166, "global_step": 10499, "epoch": 62} {"train_loss": -5.837265968322754, "global_step": 10500, "epoch": 62} {"train_loss": -5.7575602531433105, "global_step": 10501, "epoch": 62} {"train_loss": -6.0335001945495605, "global_step": 10502, "epoch": 62} {"train_loss": -5.412096977233887, "global_step": 10503, "epoch": 62} {"train_loss": -5.857283592224121, "global_step": 10504, "epoch": 62} {"train_loss": -5.669909954071045, "global_step": 10505, "epoch": 62} {"train_loss": -5.752758026123047, "global_step": 10506, "epoch": 62} {"train_loss": -5.741433143615723, "global_step": 10507, "epoch": 62} {"train_loss": -5.569764137268066, "global_step": 10508, "epoch": 62} {"train_loss": -5.750031471252441, "global_step": 10509, "epoch": 62} {"train_loss": -5.840887546539307, "global_step": 10510, "epoch": 62} {"train_loss": -5.524999141693115, "global_step": 10511, "epoch": 62} {"train_loss": -5.642918586730957, "global_step": 10512, "epoch": 62} {"train_loss": -5.800329685211182, "global_step": 10513, "epoch": 62} {"train_loss": -5.856604099273682, "global_step": 10514, "epoch": 62} {"train_loss": -5.7356672286987305, "global_step": 10515, "epoch": 62} {"train_loss": -5.688967704772949, "global_step": 10516, "epoch": 62} {"train_loss": -5.705916404724121, "global_step": 10517, "epoch": 62} {"train_loss": -5.792898654937744, "global_step": 10518, "epoch": 62} {"train_loss": -5.7532196044921875, "global_step": 10519, "epoch": 62} {"train_loss": -5.53839111328125, "global_step": 10520, "epoch": 62} {"train_loss": -5.738042831420898, "global_step": 10521, "epoch": 62} {"train_loss": -6.003700256347656, "global_step": 10522, "epoch": 62} {"train_loss": -5.806205749511719, "global_step": 10523, "epoch": 62} {"train_loss": -6.001399040222168, "global_step": 10524, "epoch": 62} {"train_loss": -5.989621639251709, "global_step": 10525, "epoch": 62} {"train_loss": -5.7389750480651855, "global_step": 10526, "epoch": 62} {"train_loss": -6.004094123840332, "global_step": 10527, "epoch": 62} {"train_loss": -5.6263580322265625, "global_step": 10528, "epoch": 62} {"train_loss": -5.600424766540527, "global_step": 10529, "epoch": 62} {"train_loss": -5.776663780212402, "global_step": 10530, "epoch": 62} {"train_loss": -5.5410566329956055, "global_step": 10531, "epoch": 62} {"train_loss": -5.822706699371338, "global_step": 10532, "epoch": 62} {"train_loss": -5.6410369873046875, "global_step": 10533, "epoch": 62} {"train_loss": -6.008373737335205, "global_step": 10534, "epoch": 62} {"train_loss": -5.924205780029297, "global_step": 10535, "epoch": 62} {"train_loss": -5.624400615692139, "global_step": 10536, "epoch": 62} {"train_loss": -5.864524841308594, "global_step": 10537, "epoch": 62} {"train_loss": -5.940872669219971, "global_step": 10538, "epoch": 62} {"train_loss": -5.612839221954346, "global_step": 10539, "epoch": 62} {"train_loss": -5.6323089599609375, "global_step": 10540, "epoch": 62} {"train_loss": -5.658673286437988, "global_step": 10541, "epoch": 62} {"train_loss": -5.700290203094482, "global_step": 10542, "epoch": 62} {"train_loss": -5.888566970825195, "global_step": 10543, "epoch": 62} {"train_loss": -6.058755874633789, "global_step": 10544, "epoch": 62} {"train_loss": -5.641874313354492, "global_step": 10545, "epoch": 62} {"train_loss": -5.683150291442871, "global_step": 10546, "epoch": 62} {"train_loss": -5.650341510772705, "global_step": 10547, "epoch": 62} {"train_loss": -5.764404296875, "global_step": 10548, "epoch": 62} {"train_loss": -5.817371368408203, "global_step": 10549, "epoch": 62} {"train_loss": -5.714808464050293, "global_step": 10550, "epoch": 62} {"train_loss": -5.9815568923950195, "global_step": 10551, "epoch": 62} {"train_loss": -5.827714920043945, "global_step": 10552, "epoch": 62} {"train_loss": -5.77190637588501, "global_step": 10553, "epoch": 62} {"train_loss": -5.883740425109863, "global_step": 10554, "epoch": 62} {"train_loss": -5.860480308532715, "global_step": 10555, "epoch": 62} {"train_loss": -5.873621463775635, "global_step": 10556, "epoch": 62} {"train_loss": -5.922635078430176, "global_step": 10557, "epoch": 62} {"train_loss": -5.8480987548828125, "global_step": 10558, "epoch": 62} {"train_loss": -5.785140037536621, "global_step": 10559, "epoch": 62} {"train_loss": -5.498593330383301, "global_step": 10560, "epoch": 62} {"train_loss": -5.911052703857422, "global_step": 10561, "epoch": 62} {"train_loss": -5.9122114181518555, "global_step": 10562, "epoch": 62} {"train_loss": -6.083105087280273, "global_step": 10563, "epoch": 62} {"train_loss": -5.465986251831055, "global_step": 10564, "epoch": 62} {"train_loss": -5.9048051834106445, "global_step": 10565, "epoch": 62} {"train_loss": -5.733050346374512, "global_step": 10566, "epoch": 62} {"train_loss": -5.912814617156982, "global_step": 10567, "epoch": 62} {"train_loss": -5.779767036437988, "global_step": 10568, "epoch": 62} {"train_loss": -5.8280487060546875, "global_step": 10569, "epoch": 62} {"train_loss": -5.863138675689697, "global_step": 10570, "epoch": 62} {"train_loss": -5.9455461502075195, "global_step": 10571, "epoch": 62} {"train_loss": -5.951772689819336, "global_step": 10572, "epoch": 62} {"train_loss": -5.8712639808654785, "global_step": 10573, "epoch": 62} {"train_loss": -5.5696563720703125, "global_step": 10574, "epoch": 62} {"train_loss": -5.769181251525879, "global_step": 10575, "epoch": 62} {"train_loss": -5.558752059936523, "global_step": 10576, "epoch": 62} {"train_loss": -5.8741302490234375, "global_step": 10577, "epoch": 62} {"train_loss": -5.488920211791992, "global_step": 10578, "epoch": 62} {"train_loss": -5.725915908813477, "global_step": 10579, "epoch": 62} {"train_loss": -5.735991477966309, "global_step": 10580, "epoch": 62} {"train_loss": -5.829103469848633, "global_step": 10581, "epoch": 62} {"train_loss": -5.658588886260986, "global_step": 10582, "epoch": 62} {"train_loss": -5.787782109919048, "global_step": 10583, "epoch": 62, "val_loss": 262155.1875} {"train_loss": -5.887172222137451, "global_step": 10584, "epoch": 63} {"train_loss": -5.729313373565674, "global_step": 10585, "epoch": 63} {"train_loss": -5.927188396453857, "global_step": 10586, "epoch": 63} {"train_loss": -5.7382097244262695, "global_step": 10587, "epoch": 63} {"train_loss": -5.993569850921631, "global_step": 10588, "epoch": 63} {"train_loss": -5.833948612213135, "global_step": 10589, "epoch": 63} {"train_loss": -5.841623306274414, "global_step": 10590, "epoch": 63} {"train_loss": -5.79766845703125, "global_step": 10591, "epoch": 63} {"train_loss": -5.942587852478027, "global_step": 10592, "epoch": 63} {"train_loss": -5.636680603027344, "global_step": 10593, "epoch": 63} {"train_loss": -5.514194488525391, "global_step": 10594, "epoch": 63} {"train_loss": -5.682032585144043, "global_step": 10595, "epoch": 63} {"train_loss": -5.749530792236328, "global_step": 10596, "epoch": 63} {"train_loss": -5.978882789611816, "global_step": 10597, "epoch": 63} {"train_loss": -5.481223106384277, "global_step": 10598, "epoch": 63} {"train_loss": -5.588903903961182, "global_step": 10599, "epoch": 63} {"train_loss": -5.7823567390441895, "global_step": 10600, "epoch": 63} {"train_loss": -5.775307655334473, "global_step": 10601, "epoch": 63} {"train_loss": -5.880050182342529, "global_step": 10602, "epoch": 63} {"train_loss": -5.986058235168457, "global_step": 10603, "epoch": 63} {"train_loss": -6.190557479858398, "global_step": 10604, "epoch": 63} {"train_loss": -5.806709289550781, "global_step": 10605, "epoch": 63} {"train_loss": -5.833833694458008, "global_step": 10606, "epoch": 63} {"train_loss": -5.909231185913086, "global_step": 10607, "epoch": 63} {"train_loss": -5.897400856018066, "global_step": 10608, "epoch": 63} {"train_loss": -5.967206954956055, "global_step": 10609, "epoch": 63} {"train_loss": -6.08300256729126, "global_step": 10610, "epoch": 63} {"train_loss": -5.9288153648376465, "global_step": 10611, "epoch": 63} {"train_loss": -5.982247352600098, "global_step": 10612, "epoch": 63} {"train_loss": -5.875918865203857, "global_step": 10613, "epoch": 63} {"train_loss": -5.737811088562012, "global_step": 10614, "epoch": 63} {"train_loss": -5.75654411315918, "global_step": 10615, "epoch": 63} {"train_loss": -5.919363498687744, "global_step": 10616, "epoch": 63} {"train_loss": -5.619876861572266, "global_step": 10617, "epoch": 63} {"train_loss": -5.905961990356445, "global_step": 10618, "epoch": 63} {"train_loss": -5.980895519256592, "global_step": 10619, "epoch": 63} {"train_loss": -5.836968421936035, "global_step": 10620, "epoch": 63} {"train_loss": -6.264237880706787, "global_step": 10621, "epoch": 63} {"train_loss": -5.678501129150391, "global_step": 10622, "epoch": 63} {"train_loss": -5.946937561035156, "global_step": 10623, "epoch": 63} {"train_loss": -5.85054874420166, "global_step": 10624, "epoch": 63} {"train_loss": -5.859663009643555, "global_step": 10625, "epoch": 63} {"train_loss": -5.666496276855469, "global_step": 10626, "epoch": 63} {"train_loss": -5.708845138549805, "global_step": 10627, "epoch": 63} {"train_loss": -5.740266799926758, "global_step": 10628, "epoch": 63} {"train_loss": -5.7314252853393555, "global_step": 10629, "epoch": 63} {"train_loss": -5.571824073791504, "global_step": 10630, "epoch": 63} {"train_loss": -5.525491714477539, "global_step": 10631, "epoch": 63} {"train_loss": -5.831118106842041, "global_step": 10632, "epoch": 63} {"train_loss": -5.766829967498779, "global_step": 10633, "epoch": 63} {"train_loss": -5.805004596710205, "global_step": 10634, "epoch": 63} {"train_loss": -5.65915584564209, "global_step": 10635, "epoch": 63} {"train_loss": -5.650046348571777, "global_step": 10636, "epoch": 63} {"train_loss": -5.776989936828613, "global_step": 10637, "epoch": 63} {"train_loss": -5.8827924728393555, "global_step": 10638, "epoch": 63} {"train_loss": -5.80349063873291, "global_step": 10639, "epoch": 63} {"train_loss": -5.748076438903809, "global_step": 10640, "epoch": 63} {"train_loss": -6.0662946701049805, "global_step": 10641, "epoch": 63} {"train_loss": -5.914690971374512, "global_step": 10642, "epoch": 63} {"train_loss": -5.732155799865723, "global_step": 10643, "epoch": 63} {"train_loss": -6.0081682205200195, "global_step": 10644, "epoch": 63} {"train_loss": -5.898481369018555, "global_step": 10645, "epoch": 63} {"train_loss": -5.831259727478027, "global_step": 10646, "epoch": 63} {"train_loss": -5.801238536834717, "global_step": 10647, "epoch": 63} {"train_loss": -5.686309337615967, "global_step": 10648, "epoch": 63} {"train_loss": -5.845688819885254, "global_step": 10649, "epoch": 63} {"train_loss": -5.733124732971191, "global_step": 10650, "epoch": 63} {"train_loss": -6.047746181488037, "global_step": 10651, "epoch": 63} {"train_loss": -5.840730667114258, "global_step": 10652, "epoch": 63} {"train_loss": -5.89698600769043, "global_step": 10653, "epoch": 63} {"train_loss": -5.703179359436035, "global_step": 10654, "epoch": 63} {"train_loss": -6.041492462158203, "global_step": 10655, "epoch": 63} {"train_loss": -5.782502174377441, "global_step": 10656, "epoch": 63} {"train_loss": -5.994038105010986, "global_step": 10657, "epoch": 63} {"train_loss": -5.715982437133789, "global_step": 10658, "epoch": 63} {"train_loss": -5.764196395874023, "global_step": 10659, "epoch": 63} {"train_loss": -5.823786735534668, "global_step": 10660, "epoch": 63} {"train_loss": -5.910344123840332, "global_step": 10661, "epoch": 63} {"train_loss": -5.857200622558594, "global_step": 10662, "epoch": 63} {"train_loss": -5.843420028686523, "global_step": 10663, "epoch": 63} {"train_loss": -5.8675618171691895, "global_step": 10664, "epoch": 63} {"train_loss": -5.920231819152832, "global_step": 10665, "epoch": 63} {"train_loss": -6.06146240234375, "global_step": 10666, "epoch": 63} {"train_loss": -6.033466339111328, "global_step": 10667, "epoch": 63} {"train_loss": -5.9662184715271, "global_step": 10668, "epoch": 63} {"train_loss": -5.865328788757324, "global_step": 10669, "epoch": 63} {"train_loss": -6.043624401092529, "global_step": 10670, "epoch": 63} {"train_loss": -5.860808372497559, "global_step": 10671, "epoch": 63} {"train_loss": -5.749377250671387, "global_step": 10672, "epoch": 63} {"train_loss": -5.95735502243042, "global_step": 10673, "epoch": 63} {"train_loss": -5.906010627746582, "global_step": 10674, "epoch": 63} {"train_loss": -6.10370397567749, "global_step": 10675, "epoch": 63} {"train_loss": -5.966604232788086, "global_step": 10676, "epoch": 63} {"train_loss": -5.813803672790527, "global_step": 10677, "epoch": 63} {"train_loss": -5.893311023712158, "global_step": 10678, "epoch": 63} {"train_loss": -5.686427593231201, "global_step": 10679, "epoch": 63} {"train_loss": -5.497861862182617, "global_step": 10680, "epoch": 63} {"train_loss": -5.819533824920654, "global_step": 10681, "epoch": 63} {"train_loss": -5.885914325714111, "global_step": 10682, "epoch": 63} {"train_loss": -5.940737247467041, "global_step": 10683, "epoch": 63} {"train_loss": -5.74171257019043, "global_step": 10684, "epoch": 63} {"train_loss": -6.0602312088012695, "global_step": 10685, "epoch": 63} {"train_loss": -5.636064529418945, "global_step": 10686, "epoch": 63} {"train_loss": -5.8895745277404785, "global_step": 10687, "epoch": 63} {"train_loss": -5.7253851890563965, "global_step": 10688, "epoch": 63} {"train_loss": -5.91480016708374, "global_step": 10689, "epoch": 63} {"train_loss": -5.76798152923584, "global_step": 10690, "epoch": 63} {"train_loss": -6.034298896789551, "global_step": 10691, "epoch": 63} {"train_loss": -5.685370922088623, "global_step": 10692, "epoch": 63} {"train_loss": -5.773128509521484, "global_step": 10693, "epoch": 63} {"train_loss": -5.633152008056641, "global_step": 10694, "epoch": 63} {"train_loss": -5.874581336975098, "global_step": 10695, "epoch": 63} {"train_loss": -5.846517086029053, "global_step": 10696, "epoch": 63} {"train_loss": -5.678022384643555, "global_step": 10697, "epoch": 63} {"train_loss": -5.8434319496154785, "global_step": 10698, "epoch": 63} {"train_loss": -5.88192081451416, "global_step": 10699, "epoch": 63} {"train_loss": -5.824382781982422, "global_step": 10700, "epoch": 63} {"train_loss": -5.872048377990723, "global_step": 10701, "epoch": 63} {"train_loss": -5.980847358703613, "global_step": 10702, "epoch": 63} {"train_loss": -6.043662071228027, "global_step": 10703, "epoch": 63} {"train_loss": -5.860162258148193, "global_step": 10704, "epoch": 63} {"train_loss": -5.775728225708008, "global_step": 10705, "epoch": 63} {"train_loss": -5.696228504180908, "global_step": 10706, "epoch": 63} {"train_loss": -5.8649187088012695, "global_step": 10707, "epoch": 63} {"train_loss": -5.530398845672607, "global_step": 10708, "epoch": 63} {"train_loss": -6.0490007400512695, "global_step": 10709, "epoch": 63} {"train_loss": -5.814879417419434, "global_step": 10710, "epoch": 63} {"train_loss": -6.013533592224121, "global_step": 10711, "epoch": 63} {"train_loss": -5.942140102386475, "global_step": 10712, "epoch": 63} {"train_loss": -6.077047348022461, "global_step": 10713, "epoch": 63} {"train_loss": -5.962560176849365, "global_step": 10714, "epoch": 63} {"train_loss": -6.001742839813232, "global_step": 10715, "epoch": 63} {"train_loss": -5.962070465087891, "global_step": 10716, "epoch": 63} {"train_loss": -5.656975746154785, "global_step": 10717, "epoch": 63} {"train_loss": -5.881051063537598, "global_step": 10718, "epoch": 63} {"train_loss": -5.841820240020752, "global_step": 10719, "epoch": 63} {"train_loss": -6.0013041496276855, "global_step": 10720, "epoch": 63} {"train_loss": -5.567966461181641, "global_step": 10721, "epoch": 63} {"train_loss": -5.698328971862793, "global_step": 10722, "epoch": 63} {"train_loss": -6.005247592926025, "global_step": 10723, "epoch": 63} {"train_loss": -5.504795074462891, "global_step": 10724, "epoch": 63} {"train_loss": -5.791518211364746, "global_step": 10725, "epoch": 63} {"train_loss": -5.905844211578369, "global_step": 10726, "epoch": 63} {"train_loss": -5.7461981773376465, "global_step": 10727, "epoch": 63} {"train_loss": -5.962833404541016, "global_step": 10728, "epoch": 63} {"train_loss": -5.570971488952637, "global_step": 10729, "epoch": 63} {"train_loss": -6.081535816192627, "global_step": 10730, "epoch": 63} {"train_loss": -5.668062686920166, "global_step": 10731, "epoch": 63} {"train_loss": -6.116080284118652, "global_step": 10732, "epoch": 63} {"train_loss": -5.95406436920166, "global_step": 10733, "epoch": 63} {"train_loss": -5.781060218811035, "global_step": 10734, "epoch": 63} {"train_loss": -5.746843338012695, "global_step": 10735, "epoch": 63} {"train_loss": -5.7300591468811035, "global_step": 10736, "epoch": 63} {"train_loss": -6.017388343811035, "global_step": 10737, "epoch": 63} {"train_loss": -5.899877548217773, "global_step": 10738, "epoch": 63} {"train_loss": -6.014573097229004, "global_step": 10739, "epoch": 63} {"train_loss": -6.026602745056152, "global_step": 10740, "epoch": 63} {"train_loss": -5.719869613647461, "global_step": 10741, "epoch": 63} {"train_loss": -5.893893241882324, "global_step": 10742, "epoch": 63} {"train_loss": -6.0562543869018555, "global_step": 10743, "epoch": 63} {"train_loss": -6.228533744812012, "global_step": 10744, "epoch": 63} {"train_loss": -6.066917419433594, "global_step": 10745, "epoch": 63} {"train_loss": -5.916969299316406, "global_step": 10746, "epoch": 63} {"train_loss": -5.859922409057617, "global_step": 10747, "epoch": 63} {"train_loss": -5.6978960037231445, "global_step": 10748, "epoch": 63} {"train_loss": -5.9379963874816895, "global_step": 10749, "epoch": 63} {"train_loss": -5.971101760864258, "global_step": 10750, "epoch": 63} {"train_loss": -5.848140512193952, "global_step": 10751, "epoch": 63, "val_loss": 263846.8125} {"train_loss": -5.929694652557373, "global_step": 10752, "epoch": 64} {"train_loss": -5.879149436950684, "global_step": 10753, "epoch": 64} {"train_loss": -5.662842750549316, "global_step": 10754, "epoch": 64} {"train_loss": -5.66394567489624, "global_step": 10755, "epoch": 64} {"train_loss": -5.764831066131592, "global_step": 10756, "epoch": 64} {"train_loss": -5.785656929016113, "global_step": 10757, "epoch": 64} {"train_loss": -5.823925018310547, "global_step": 10758, "epoch": 64} {"train_loss": -5.806057929992676, "global_step": 10759, "epoch": 64} {"train_loss": -5.943471908569336, "global_step": 10760, "epoch": 64} {"train_loss": -5.708983421325684, "global_step": 10761, "epoch": 64} {"train_loss": -5.891186714172363, "global_step": 10762, "epoch": 64} {"train_loss": -5.616034030914307, "global_step": 10763, "epoch": 64} {"train_loss": -5.657281875610352, "global_step": 10764, "epoch": 64} {"train_loss": -5.569211006164551, "global_step": 10765, "epoch": 64} {"train_loss": -6.0160627365112305, "global_step": 10766, "epoch": 64} {"train_loss": -5.872190952301025, "global_step": 10767, "epoch": 64} {"train_loss": -5.8838043212890625, "global_step": 10768, "epoch": 64} {"train_loss": -5.483305931091309, "global_step": 10769, "epoch": 64} {"train_loss": -5.929658889770508, "global_step": 10770, "epoch": 64} {"train_loss": -5.776700973510742, "global_step": 10771, "epoch": 64} {"train_loss": -5.744354248046875, "global_step": 10772, "epoch": 64} {"train_loss": -5.75882625579834, "global_step": 10773, "epoch": 64} {"train_loss": -5.614154815673828, "global_step": 10774, "epoch": 64} {"train_loss": -5.76065731048584, "global_step": 10775, "epoch": 64} {"train_loss": -5.743656158447266, "global_step": 10776, "epoch": 64} {"train_loss": -5.815210342407227, "global_step": 10777, "epoch": 64} {"train_loss": -5.557292938232422, "global_step": 10778, "epoch": 64} {"train_loss": -5.7084150314331055, "global_step": 10779, "epoch": 64} {"train_loss": -5.877117156982422, "global_step": 10780, "epoch": 64} {"train_loss": -5.700738906860352, "global_step": 10781, "epoch": 64} {"train_loss": -5.790463447570801, "global_step": 10782, "epoch": 64} {"train_loss": -5.884768486022949, "global_step": 10783, "epoch": 64} {"train_loss": -5.918103218078613, "global_step": 10784, "epoch": 64} {"train_loss": -5.529224395751953, "global_step": 10785, "epoch": 64} {"train_loss": -5.626075744628906, "global_step": 10786, "epoch": 64} {"train_loss": -6.055768013000488, "global_step": 10787, "epoch": 64} {"train_loss": -5.8082475662231445, "global_step": 10788, "epoch": 64} {"train_loss": -5.713059902191162, "global_step": 10789, "epoch": 64} {"train_loss": -6.03539514541626, "global_step": 10790, "epoch": 64} {"train_loss": -5.866153240203857, "global_step": 10791, "epoch": 64} {"train_loss": -5.758936882019043, "global_step": 10792, "epoch": 64} {"train_loss": -5.793989181518555, "global_step": 10793, "epoch": 64} {"train_loss": -5.902681827545166, "global_step": 10794, "epoch": 64} {"train_loss": -5.870641708374023, "global_step": 10795, "epoch": 64} {"train_loss": -6.033281326293945, "global_step": 10796, "epoch": 64} {"train_loss": -5.672237396240234, "global_step": 10797, "epoch": 64} {"train_loss": -5.946411609649658, "global_step": 10798, "epoch": 64} {"train_loss": -5.9168925285339355, "global_step": 10799, "epoch": 64} {"train_loss": -6.013418197631836, "global_step": 10800, "epoch": 64} {"train_loss": -6.071557998657227, "global_step": 10801, "epoch": 64} {"train_loss": -6.1093573570251465, "global_step": 10802, "epoch": 64} {"train_loss": -5.690982818603516, "global_step": 10803, "epoch": 64} {"train_loss": -6.0487565994262695, "global_step": 10804, "epoch": 64} {"train_loss": -6.066300868988037, "global_step": 10805, "epoch": 64} {"train_loss": -5.957954406738281, "global_step": 10806, "epoch": 64} {"train_loss": -6.0278849601745605, "global_step": 10807, "epoch": 64} {"train_loss": -5.753805160522461, "global_step": 10808, "epoch": 64} {"train_loss": -5.896323204040527, "global_step": 10809, "epoch": 64} {"train_loss": -5.901947498321533, "global_step": 10810, "epoch": 64} {"train_loss": -6.141815662384033, "global_step": 10811, "epoch": 64} {"train_loss": -5.527961254119873, "global_step": 10812, "epoch": 64} {"train_loss": -5.660988807678223, "global_step": 10813, "epoch": 64} {"train_loss": -5.798428535461426, "global_step": 10814, "epoch": 64} {"train_loss": -5.582965850830078, "global_step": 10815, "epoch": 64} {"train_loss": -5.872382164001465, "global_step": 10816, "epoch": 64} {"train_loss": -5.836808681488037, "global_step": 10817, "epoch": 64} {"train_loss": -5.586294174194336, "global_step": 10818, "epoch": 64} {"train_loss": -5.646485328674316, "global_step": 10819, "epoch": 64} {"train_loss": -5.864260673522949, "global_step": 10820, "epoch": 64} {"train_loss": -6.074500560760498, "global_step": 10821, "epoch": 64} {"train_loss": -5.733068943023682, "global_step": 10822, "epoch": 64} {"train_loss": -5.780445575714111, "global_step": 10823, "epoch": 64} {"train_loss": -5.923523902893066, "global_step": 10824, "epoch": 64} {"train_loss": -5.940101623535156, "global_step": 10825, "epoch": 64} {"train_loss": -6.031771659851074, "global_step": 10826, "epoch": 64} {"train_loss": -5.817461967468262, "global_step": 10827, "epoch": 64} {"train_loss": -5.896312236785889, "global_step": 10828, "epoch": 64} {"train_loss": -5.805502891540527, "global_step": 10829, "epoch": 64} {"train_loss": -6.143979072570801, "global_step": 10830, "epoch": 64} {"train_loss": -5.687901020050049, "global_step": 10831, "epoch": 64} {"train_loss": -6.1269378662109375, "global_step": 10832, "epoch": 64} {"train_loss": -6.143413543701172, "global_step": 10833, "epoch": 64} {"train_loss": -5.658329963684082, "global_step": 10834, "epoch": 64} {"train_loss": -5.858656883239746, "global_step": 10835, "epoch": 64} {"train_loss": -5.814493179321289, "global_step": 10836, "epoch": 64} {"train_loss": -5.778069496154785, "global_step": 10837, "epoch": 64} {"train_loss": -5.985565185546875, "global_step": 10838, "epoch": 64} {"train_loss": -5.943826198577881, "global_step": 10839, "epoch": 64} {"train_loss": -5.9772138595581055, "global_step": 10840, "epoch": 64} {"train_loss": -5.923746585845947, "global_step": 10841, "epoch": 64} {"train_loss": -5.8267822265625, "global_step": 10842, "epoch": 64} {"train_loss": -5.936563014984131, "global_step": 10843, "epoch": 64} {"train_loss": -5.6293535232543945, "global_step": 10844, "epoch": 64} {"train_loss": -6.06414794921875, "global_step": 10845, "epoch": 64} {"train_loss": -5.817326068878174, "global_step": 10846, "epoch": 64} {"train_loss": -5.860991954803467, "global_step": 10847, "epoch": 64} {"train_loss": -5.912252426147461, "global_step": 10848, "epoch": 64} {"train_loss": -5.741445541381836, "global_step": 10849, "epoch": 64} {"train_loss": -5.848272323608398, "global_step": 10850, "epoch": 64} {"train_loss": -6.053793430328369, "global_step": 10851, "epoch": 64} {"train_loss": -5.829743385314941, "global_step": 10852, "epoch": 64} {"train_loss": -5.883550643920898, "global_step": 10853, "epoch": 64} {"train_loss": -6.016941070556641, "global_step": 10854, "epoch": 64} {"train_loss": -5.760558605194092, "global_step": 10855, "epoch": 64} {"train_loss": -6.045118808746338, "global_step": 10856, "epoch": 64} {"train_loss": -5.977078914642334, "global_step": 10857, "epoch": 64} {"train_loss": -5.963314056396484, "global_step": 10858, "epoch": 64} {"train_loss": -6.031179428100586, "global_step": 10859, "epoch": 64} {"train_loss": -6.101100444793701, "global_step": 10860, "epoch": 64} {"train_loss": -5.836584091186523, "global_step": 10861, "epoch": 64} {"train_loss": -5.884682655334473, "global_step": 10862, "epoch": 64} {"train_loss": -5.678644180297852, "global_step": 10863, "epoch": 64} {"train_loss": -5.881628513336182, "global_step": 10864, "epoch": 64} {"train_loss": -5.7783002853393555, "global_step": 10865, "epoch": 64} {"train_loss": -5.648804664611816, "global_step": 10866, "epoch": 64} {"train_loss": -5.893919944763184, "global_step": 10867, "epoch": 64} {"train_loss": -5.768961429595947, "global_step": 10868, "epoch": 64} {"train_loss": -5.618366241455078, "global_step": 10869, "epoch": 64} {"train_loss": -5.840255260467529, "global_step": 10870, "epoch": 64} {"train_loss": -5.72141170501709, "global_step": 10871, "epoch": 64} {"train_loss": -5.93589973449707, "global_step": 10872, "epoch": 64} {"train_loss": -5.897494316101074, "global_step": 10873, "epoch": 64} {"train_loss": -5.935158729553223, "global_step": 10874, "epoch": 64} {"train_loss": -5.989067554473877, "global_step": 10875, "epoch": 64} {"train_loss": -6.047374725341797, "global_step": 10876, "epoch": 64} {"train_loss": -5.908809661865234, "global_step": 10877, "epoch": 64} {"train_loss": -5.947150707244873, "global_step": 10878, "epoch": 64} {"train_loss": -5.812373161315918, "global_step": 10879, "epoch": 64} {"train_loss": -5.638327598571777, "global_step": 10880, "epoch": 64} {"train_loss": -6.104229927062988, "global_step": 10881, "epoch": 64} {"train_loss": -5.934928894042969, "global_step": 10882, "epoch": 64} {"train_loss": -5.72152042388916, "global_step": 10883, "epoch": 64} {"train_loss": -5.758991241455078, "global_step": 10884, "epoch": 64} {"train_loss": -6.076674938201904, "global_step": 10885, "epoch": 64} {"train_loss": -6.19572639465332, "global_step": 10886, "epoch": 64} {"train_loss": -5.580284595489502, "global_step": 10887, "epoch": 64} {"train_loss": -5.889896869659424, "global_step": 10888, "epoch": 64} {"train_loss": -5.9292168617248535, "global_step": 10889, "epoch": 64} {"train_loss": -5.978691101074219, "global_step": 10890, "epoch": 64} {"train_loss": -5.943004131317139, "global_step": 10891, "epoch": 64} {"train_loss": -5.9371771812438965, "global_step": 10892, "epoch": 64} {"train_loss": -5.893616676330566, "global_step": 10893, "epoch": 64} {"train_loss": -5.925493240356445, "global_step": 10894, "epoch": 64} {"train_loss": -5.909666061401367, "global_step": 10895, "epoch": 64} {"train_loss": -6.019536018371582, "global_step": 10896, "epoch": 64} {"train_loss": -5.919035911560059, "global_step": 10897, "epoch": 64} {"train_loss": -6.23239278793335, "global_step": 10898, "epoch": 64} {"train_loss": -5.8061652183532715, "global_step": 10899, "epoch": 64} {"train_loss": -6.052240371704102, "global_step": 10900, "epoch": 64} {"train_loss": -6.173545837402344, "global_step": 10901, "epoch": 64} {"train_loss": -5.720405101776123, "global_step": 10902, "epoch": 64} {"train_loss": -6.115226745605469, "global_step": 10903, "epoch": 64} {"train_loss": -5.864955902099609, "global_step": 10904, "epoch": 64} {"train_loss": -6.198495864868164, "global_step": 10905, "epoch": 64} {"train_loss": -5.789039134979248, "global_step": 10906, "epoch": 64} {"train_loss": -5.867273330688477, "global_step": 10907, "epoch": 64} {"train_loss": -5.862289905548096, "global_step": 10908, "epoch": 64} {"train_loss": -5.878349781036377, "global_step": 10909, "epoch": 64} {"train_loss": -5.203502178192139, "global_step": 10910, "epoch": 64} {"train_loss": -6.114133834838867, "global_step": 10911, "epoch": 64} {"train_loss": -5.756350517272949, "global_step": 10912, "epoch": 64} {"train_loss": -6.015650749206543, "global_step": 10913, "epoch": 64} {"train_loss": -5.812666893005371, "global_step": 10914, "epoch": 64} {"train_loss": -5.767233848571777, "global_step": 10915, "epoch": 64} {"train_loss": -6.004380702972412, "global_step": 10916, "epoch": 64} {"train_loss": -5.834641456604004, "global_step": 10917, "epoch": 64} {"train_loss": -5.977174758911133, "global_step": 10918, "epoch": 64} {"train_loss": -5.861934043112255, "global_step": 10919, "epoch": 64, "val_loss": 263390.71875} {"train_loss": -5.897512435913086, "global_step": 10920, "epoch": 65} {"train_loss": -5.89179801940918, "global_step": 10921, "epoch": 65} {"train_loss": -5.954297065734863, "global_step": 10922, "epoch": 65} {"train_loss": -5.680130958557129, "global_step": 10923, "epoch": 65} {"train_loss": -5.638066291809082, "global_step": 10924, "epoch": 65} {"train_loss": -5.892721176147461, "global_step": 10925, "epoch": 65} {"train_loss": -5.802364349365234, "global_step": 10926, "epoch": 65} {"train_loss": -5.766587257385254, "global_step": 10927, "epoch": 65} {"train_loss": -5.343987464904785, "global_step": 10928, "epoch": 65} {"train_loss": -5.7327399253845215, "global_step": 10929, "epoch": 65} {"train_loss": -5.760913848876953, "global_step": 10930, "epoch": 65} {"train_loss": -5.838439464569092, "global_step": 10931, "epoch": 65} {"train_loss": -5.912056922912598, "global_step": 10932, "epoch": 65} {"train_loss": -5.779217720031738, "global_step": 10933, "epoch": 65} {"train_loss": -5.787227153778076, "global_step": 10934, "epoch": 65} {"train_loss": -6.141323089599609, "global_step": 10935, "epoch": 65} {"train_loss": -5.755517482757568, "global_step": 10936, "epoch": 65} {"train_loss": -5.945770263671875, "global_step": 10937, "epoch": 65} {"train_loss": -5.994248867034912, "global_step": 10938, "epoch": 65} {"train_loss": -5.736008644104004, "global_step": 10939, "epoch": 65} {"train_loss": -6.075115203857422, "global_step": 10940, "epoch": 65} {"train_loss": -5.990233898162842, "global_step": 10941, "epoch": 65} {"train_loss": -5.603315353393555, "global_step": 10942, "epoch": 65} {"train_loss": -5.880806922912598, "global_step": 10943, "epoch": 65} {"train_loss": -5.587553977966309, "global_step": 10944, "epoch": 65} {"train_loss": -6.00125789642334, "global_step": 10945, "epoch": 65} {"train_loss": -5.885929107666016, "global_step": 10946, "epoch": 65} {"train_loss": -5.863677024841309, "global_step": 10947, "epoch": 65} {"train_loss": -6.017043113708496, "global_step": 10948, "epoch": 65} {"train_loss": -5.904342174530029, "global_step": 10949, "epoch": 65} {"train_loss": -5.752693176269531, "global_step": 10950, "epoch": 65} {"train_loss": -5.803253650665283, "global_step": 10951, "epoch": 65} {"train_loss": -5.8137102127075195, "global_step": 10952, "epoch": 65} {"train_loss": -5.68271541595459, "global_step": 10953, "epoch": 65} {"train_loss": -6.108933448791504, "global_step": 10954, "epoch": 65} {"train_loss": -5.737611770629883, "global_step": 10955, "epoch": 65} {"train_loss": -6.004858016967773, "global_step": 10956, "epoch": 65} {"train_loss": -5.838603496551514, "global_step": 10957, "epoch": 65} {"train_loss": -5.755623817443848, "global_step": 10958, "epoch": 65} {"train_loss": -5.7590532302856445, "global_step": 10959, "epoch": 65} {"train_loss": -5.8253936767578125, "global_step": 10960, "epoch": 65} {"train_loss": -5.850045204162598, "global_step": 10961, "epoch": 65} {"train_loss": -5.844067573547363, "global_step": 10962, "epoch": 65} {"train_loss": -5.891732215881348, "global_step": 10963, "epoch": 65} {"train_loss": -5.746107578277588, "global_step": 10964, "epoch": 65} {"train_loss": -5.563776969909668, "global_step": 10965, "epoch": 65} {"train_loss": -5.848450660705566, "global_step": 10966, "epoch": 65} {"train_loss": -5.973230361938477, "global_step": 10967, "epoch": 65} {"train_loss": -6.088611602783203, "global_step": 10968, "epoch": 65} {"train_loss": -5.989246845245361, "global_step": 10969, "epoch": 65} {"train_loss": -6.0419840812683105, "global_step": 10970, "epoch": 65} {"train_loss": -6.133082389831543, "global_step": 10971, "epoch": 65} {"train_loss": -5.691584587097168, "global_step": 10972, "epoch": 65} {"train_loss": -5.912519454956055, "global_step": 10973, "epoch": 65} {"train_loss": -5.803653717041016, "global_step": 10974, "epoch": 65} {"train_loss": -5.996458053588867, "global_step": 10975, "epoch": 65} {"train_loss": -6.147572040557861, "global_step": 10976, "epoch": 65} {"train_loss": -6.078536033630371, "global_step": 10977, "epoch": 65} {"train_loss": -5.817344665527344, "global_step": 10978, "epoch": 65} {"train_loss": -5.861583709716797, "global_step": 10979, "epoch": 65} {"train_loss": -5.9782633781433105, "global_step": 10980, "epoch": 65} {"train_loss": -5.887145042419434, "global_step": 10981, "epoch": 65} {"train_loss": -6.076066017150879, "global_step": 10982, "epoch": 65} {"train_loss": -5.997735977172852, "global_step": 10983, "epoch": 65} {"train_loss": -6.041616439819336, "global_step": 10984, "epoch": 65} {"train_loss": -5.882002353668213, "global_step": 10985, "epoch": 65} {"train_loss": -6.058351516723633, "global_step": 10986, "epoch": 65} {"train_loss": -6.096504211425781, "global_step": 10987, "epoch": 65} {"train_loss": -6.1605987548828125, "global_step": 10988, "epoch": 65} {"train_loss": -6.183290004730225, "global_step": 10989, "epoch": 65} {"train_loss": -5.854557991027832, "global_step": 10990, "epoch": 65} {"train_loss": -6.122880458831787, "global_step": 10991, "epoch": 65} {"train_loss": -5.853824615478516, "global_step": 10992, "epoch": 65} {"train_loss": -6.102433204650879, "global_step": 10993, "epoch": 65} {"train_loss": -5.893898010253906, "global_step": 10994, "epoch": 65} {"train_loss": -5.905734539031982, "global_step": 10995, "epoch": 65} {"train_loss": -6.159054756164551, "global_step": 10996, "epoch": 65} {"train_loss": -5.866482734680176, "global_step": 10997, "epoch": 65} {"train_loss": -5.809033393859863, "global_step": 10998, "epoch": 65} {"train_loss": -6.052569389343262, "global_step": 10999, "epoch": 65} {"train_loss": -5.734468460083008, "global_step": 11000, "epoch": 65} {"train_loss": -5.817500114440918, "global_step": 11001, "epoch": 65} {"train_loss": -5.897594451904297, "global_step": 11002, "epoch": 65} {"train_loss": -6.010027885437012, "global_step": 11003, "epoch": 65} {"train_loss": -6.034709930419922, "global_step": 11004, "epoch": 65} {"train_loss": -6.047431945800781, "global_step": 11005, "epoch": 65} {"train_loss": -5.865090370178223, "global_step": 11006, "epoch": 65} {"train_loss": -6.270288467407227, "global_step": 11007, "epoch": 65} {"train_loss": -5.802347183227539, "global_step": 11008, "epoch": 65} {"train_loss": -5.912890911102295, "global_step": 11009, "epoch": 65} {"train_loss": -5.9546661376953125, "global_step": 11010, "epoch": 65} {"train_loss": -5.729880332946777, "global_step": 11011, "epoch": 65} {"train_loss": -6.030841827392578, "global_step": 11012, "epoch": 65} {"train_loss": -5.696469306945801, "global_step": 11013, "epoch": 65} {"train_loss": -5.924785614013672, "global_step": 11014, "epoch": 65} {"train_loss": -5.655757904052734, "global_step": 11015, "epoch": 65} {"train_loss": -5.993897914886475, "global_step": 11016, "epoch": 65} {"train_loss": -5.9889655113220215, "global_step": 11017, "epoch": 65} {"train_loss": -5.8468828201293945, "global_step": 11018, "epoch": 65} {"train_loss": -5.777955055236816, "global_step": 11019, "epoch": 65} {"train_loss": -5.743460655212402, "global_step": 11020, "epoch": 65} {"train_loss": -5.674360275268555, "global_step": 11021, "epoch": 65} {"train_loss": -5.893507957458496, "global_step": 11022, "epoch": 65} {"train_loss": -5.861639976501465, "global_step": 11023, "epoch": 65} {"train_loss": -6.05452299118042, "global_step": 11024, "epoch": 65} {"train_loss": -6.150474548339844, "global_step": 11025, "epoch": 65} {"train_loss": -6.113648414611816, "global_step": 11026, "epoch": 65} {"train_loss": -5.620378017425537, "global_step": 11027, "epoch": 65} {"train_loss": -5.874024391174316, "global_step": 11028, "epoch": 65} {"train_loss": -5.856276512145996, "global_step": 11029, "epoch": 65} {"train_loss": -6.069153785705566, "global_step": 11030, "epoch": 65} {"train_loss": -6.0559186935424805, "global_step": 11031, "epoch": 65} {"train_loss": -5.742782115936279, "global_step": 11032, "epoch": 65} {"train_loss": -5.571746349334717, "global_step": 11033, "epoch": 65} {"train_loss": -5.847869873046875, "global_step": 11034, "epoch": 65} {"train_loss": -5.974884510040283, "global_step": 11035, "epoch": 65} {"train_loss": -6.124520301818848, "global_step": 11036, "epoch": 65} {"train_loss": -5.766148090362549, "global_step": 11037, "epoch": 65} {"train_loss": -5.559632778167725, "global_step": 11038, "epoch": 65} {"train_loss": -5.880549430847168, "global_step": 11039, "epoch": 65} {"train_loss": -5.878420829772949, "global_step": 11040, "epoch": 65} {"train_loss": -5.934759140014648, "global_step": 11041, "epoch": 65} {"train_loss": -5.652642250061035, "global_step": 11042, "epoch": 65} {"train_loss": -5.825288772583008, "global_step": 11043, "epoch": 65} {"train_loss": -5.557371616363525, "global_step": 11044, "epoch": 65} {"train_loss": -5.789323329925537, "global_step": 11045, "epoch": 65} {"train_loss": -6.111673355102539, "global_step": 11046, "epoch": 65} {"train_loss": -5.711706638336182, "global_step": 11047, "epoch": 65} {"train_loss": -5.6428117752075195, "global_step": 11048, "epoch": 65} {"train_loss": -5.735930442810059, "global_step": 11049, "epoch": 65} {"train_loss": -5.88394832611084, "global_step": 11050, "epoch": 65} {"train_loss": -5.955935955047607, "global_step": 11051, "epoch": 65} {"train_loss": -5.735837936401367, "global_step": 11052, "epoch": 65} {"train_loss": -5.841916084289551, "global_step": 11053, "epoch": 65} {"train_loss": -5.8313751220703125, "global_step": 11054, "epoch": 65} {"train_loss": -5.413664817810059, "global_step": 11055, "epoch": 65} {"train_loss": -5.734725475311279, "global_step": 11056, "epoch": 65} {"train_loss": -5.475543975830078, "global_step": 11057, "epoch": 65} {"train_loss": -5.716805458068848, "global_step": 11058, "epoch": 65} {"train_loss": -5.730679512023926, "global_step": 11059, "epoch": 65} {"train_loss": -5.412953853607178, "global_step": 11060, "epoch": 65} {"train_loss": -5.885991096496582, "global_step": 11061, "epoch": 65} {"train_loss": -5.565727233886719, "global_step": 11062, "epoch": 65} {"train_loss": -5.533152103424072, "global_step": 11063, "epoch": 65} {"train_loss": -5.831723213195801, "global_step": 11064, "epoch": 65} {"train_loss": -5.800739288330078, "global_step": 11065, "epoch": 65} {"train_loss": -5.752504825592041, "global_step": 11066, "epoch": 65} {"train_loss": -5.836687088012695, "global_step": 11067, "epoch": 65} {"train_loss": -5.761527061462402, "global_step": 11068, "epoch": 65} {"train_loss": -6.010093688964844, "global_step": 11069, "epoch": 65} {"train_loss": -5.866364002227783, "global_step": 11070, "epoch": 65} {"train_loss": -5.746124267578125, "global_step": 11071, "epoch": 65} {"train_loss": -5.737998008728027, "global_step": 11072, "epoch": 65} {"train_loss": -5.966300964355469, "global_step": 11073, "epoch": 65} {"train_loss": -5.858984470367432, "global_step": 11074, "epoch": 65} {"train_loss": -6.105340957641602, "global_step": 11075, "epoch": 65} {"train_loss": -5.836694240570068, "global_step": 11076, "epoch": 65} {"train_loss": -5.955145835876465, "global_step": 11077, "epoch": 65} {"train_loss": -5.945509910583496, "global_step": 11078, "epoch": 65} {"train_loss": -5.905808925628662, "global_step": 11079, "epoch": 65} {"train_loss": -5.725866317749023, "global_step": 11080, "epoch": 65} {"train_loss": -5.736708641052246, "global_step": 11081, "epoch": 65} {"train_loss": -5.737739562988281, "global_step": 11082, "epoch": 65} {"train_loss": -5.598775863647461, "global_step": 11083, "epoch": 65} {"train_loss": -5.714860439300537, "global_step": 11084, "epoch": 65} {"train_loss": -5.742146968841553, "global_step": 11085, "epoch": 65} {"train_loss": -5.731764793395996, "global_step": 11086, "epoch": 65} {"train_loss": -5.85665932723454, "global_step": 11087, "epoch": 65, "val_loss": 260852.4375, "train_action_mse_error": 46.51290512084961} {"train_loss": -5.693563938140869, "global_step": 11088, "epoch": 66} {"train_loss": -5.727133750915527, "global_step": 11089, "epoch": 66} {"train_loss": -6.031244277954102, "global_step": 11090, "epoch": 66} {"train_loss": -5.90863037109375, "global_step": 11091, "epoch": 66} {"train_loss": -5.6860198974609375, "global_step": 11092, "epoch": 66} {"train_loss": -5.55454683303833, "global_step": 11093, "epoch": 66} {"train_loss": -5.542829513549805, "global_step": 11094, "epoch": 66} {"train_loss": -5.902375221252441, "global_step": 11095, "epoch": 66} {"train_loss": -5.925004005432129, "global_step": 11096, "epoch": 66} {"train_loss": -5.868185043334961, "global_step": 11097, "epoch": 66} {"train_loss": -5.872066497802734, "global_step": 11098, "epoch": 66} {"train_loss": -5.811336517333984, "global_step": 11099, "epoch": 66} {"train_loss": -6.098044395446777, "global_step": 11100, "epoch": 66} {"train_loss": -6.150651931762695, "global_step": 11101, "epoch": 66} {"train_loss": -5.912766456604004, "global_step": 11102, "epoch": 66} {"train_loss": -5.90140438079834, "global_step": 11103, "epoch": 66} {"train_loss": -6.088335037231445, "global_step": 11104, "epoch": 66} {"train_loss": -5.679929256439209, "global_step": 11105, "epoch": 66} {"train_loss": -5.912864685058594, "global_step": 11106, "epoch": 66} {"train_loss": -5.813142776489258, "global_step": 11107, "epoch": 66} {"train_loss": -5.7603759765625, "global_step": 11108, "epoch": 66} {"train_loss": -5.968606948852539, "global_step": 11109, "epoch": 66} {"train_loss": -5.545925140380859, "global_step": 11110, "epoch": 66} {"train_loss": -6.23484992980957, "global_step": 11111, "epoch": 66} {"train_loss": -6.004567623138428, "global_step": 11112, "epoch": 66} {"train_loss": -5.959362983703613, "global_step": 11113, "epoch": 66} {"train_loss": -5.831228256225586, "global_step": 11114, "epoch": 66} {"train_loss": -6.035083770751953, "global_step": 11115, "epoch": 66} {"train_loss": -5.982115745544434, "global_step": 11116, "epoch": 66} {"train_loss": -6.071702003479004, "global_step": 11117, "epoch": 66} {"train_loss": -6.031304359436035, "global_step": 11118, "epoch": 66} {"train_loss": -6.133096218109131, "global_step": 11119, "epoch": 66} {"train_loss": -6.0503034591674805, "global_step": 11120, "epoch": 66} {"train_loss": -5.892582893371582, "global_step": 11121, "epoch": 66} {"train_loss": -5.597135543823242, "global_step": 11122, "epoch": 66} {"train_loss": -5.973227500915527, "global_step": 11123, "epoch": 66} {"train_loss": -5.73262882232666, "global_step": 11124, "epoch": 66} {"train_loss": -6.029748916625977, "global_step": 11125, "epoch": 66} {"train_loss": -6.009374618530273, "global_step": 11126, "epoch": 66} {"train_loss": -6.0522541999816895, "global_step": 11127, "epoch": 66} {"train_loss": -5.785815238952637, "global_step": 11128, "epoch": 66} {"train_loss": -6.0721940994262695, "global_step": 11129, "epoch": 66} {"train_loss": -5.956180572509766, "global_step": 11130, "epoch": 66} {"train_loss": -6.032074928283691, "global_step": 11131, "epoch": 66} {"train_loss": -5.860874652862549, "global_step": 11132, "epoch": 66} {"train_loss": -5.993464946746826, "global_step": 11133, "epoch": 66} {"train_loss": -6.072609901428223, "global_step": 11134, "epoch": 66} {"train_loss": -6.196566104888916, "global_step": 11135, "epoch": 66} {"train_loss": -5.784573078155518, "global_step": 11136, "epoch": 66} {"train_loss": -5.956298828125, "global_step": 11137, "epoch": 66} {"train_loss": -6.011639595031738, "global_step": 11138, "epoch": 66} {"train_loss": -6.140702247619629, "global_step": 11139, "epoch": 66} {"train_loss": -6.096126556396484, "global_step": 11140, "epoch": 66} {"train_loss": -5.751637935638428, "global_step": 11141, "epoch": 66} {"train_loss": -5.9811787605285645, "global_step": 11142, "epoch": 66} {"train_loss": -6.104987144470215, "global_step": 11143, "epoch": 66} {"train_loss": -6.174093723297119, "global_step": 11144, "epoch": 66} {"train_loss": -6.168417930603027, "global_step": 11145, "epoch": 66} {"train_loss": -6.0685648918151855, "global_step": 11146, "epoch": 66} {"train_loss": -6.023153305053711, "global_step": 11147, "epoch": 66} {"train_loss": -5.7958831787109375, "global_step": 11148, "epoch": 66} {"train_loss": -5.9683732986450195, "global_step": 11149, "epoch": 66} {"train_loss": -6.018576622009277, "global_step": 11150, "epoch": 66} {"train_loss": -5.88218355178833, "global_step": 11151, "epoch": 66} {"train_loss": -5.949751853942871, "global_step": 11152, "epoch": 66} {"train_loss": -6.062624931335449, "global_step": 11153, "epoch": 66} {"train_loss": -5.888905048370361, "global_step": 11154, "epoch": 66} {"train_loss": -5.808499336242676, "global_step": 11155, "epoch": 66} {"train_loss": -5.431809902191162, "global_step": 11156, "epoch": 66} {"train_loss": -5.8707356452941895, "global_step": 11157, "epoch": 66} {"train_loss": -5.739218711853027, "global_step": 11158, "epoch": 66} {"train_loss": -5.664247989654541, "global_step": 11159, "epoch": 66} {"train_loss": -5.90727424621582, "global_step": 11160, "epoch": 66} {"train_loss": -5.846818923950195, "global_step": 11161, "epoch": 66} {"train_loss": -5.7899298667907715, "global_step": 11162, "epoch": 66} {"train_loss": -5.398804664611816, "global_step": 11163, "epoch": 66} {"train_loss": -5.827644348144531, "global_step": 11164, "epoch": 66} {"train_loss": -5.9412736892700195, "global_step": 11165, "epoch": 66} {"train_loss": -5.890789985656738, "global_step": 11166, "epoch": 66} {"train_loss": -5.913433074951172, "global_step": 11167, "epoch": 66} {"train_loss": -5.994895935058594, "global_step": 11168, "epoch": 66} {"train_loss": -5.739062309265137, "global_step": 11169, "epoch": 66} {"train_loss": -5.8440656661987305, "global_step": 11170, "epoch": 66} {"train_loss": -5.912139892578125, "global_step": 11171, "epoch": 66} {"train_loss": -6.064102649688721, "global_step": 11172, "epoch": 66} {"train_loss": -6.014311790466309, "global_step": 11173, "epoch": 66} {"train_loss": -5.864985466003418, "global_step": 11174, "epoch": 66} {"train_loss": -6.183842658996582, "global_step": 11175, "epoch": 66} {"train_loss": -6.0494232177734375, "global_step": 11176, "epoch": 66} {"train_loss": -5.9227776527404785, "global_step": 11177, "epoch": 66} {"train_loss": -5.989229202270508, "global_step": 11178, "epoch": 66} {"train_loss": -5.828921318054199, "global_step": 11179, "epoch": 66} {"train_loss": -5.880403995513916, "global_step": 11180, "epoch": 66} {"train_loss": -6.032203674316406, "global_step": 11181, "epoch": 66} {"train_loss": -5.787296295166016, "global_step": 11182, "epoch": 66} {"train_loss": -5.536938190460205, "global_step": 11183, "epoch": 66} {"train_loss": -5.635168075561523, "global_step": 11184, "epoch": 66} {"train_loss": -5.573488712310791, "global_step": 11185, "epoch": 66} {"train_loss": -5.717327117919922, "global_step": 11186, "epoch": 66} {"train_loss": -5.881049633026123, "global_step": 11187, "epoch": 66} {"train_loss": -6.0212602615356445, "global_step": 11188, "epoch": 66} {"train_loss": -5.94986629486084, "global_step": 11189, "epoch": 66} {"train_loss": -5.918461799621582, "global_step": 11190, "epoch": 66} {"train_loss": -5.783666610717773, "global_step": 11191, "epoch": 66} {"train_loss": -5.7583794593811035, "global_step": 11192, "epoch": 66} {"train_loss": -5.8680548667907715, "global_step": 11193, "epoch": 66} {"train_loss": -5.954098701477051, "global_step": 11194, "epoch": 66} {"train_loss": -5.774173736572266, "global_step": 11195, "epoch": 66} {"train_loss": -5.920377731323242, "global_step": 11196, "epoch": 66} {"train_loss": -5.757046222686768, "global_step": 11197, "epoch": 66} {"train_loss": -5.567336559295654, "global_step": 11198, "epoch": 66} {"train_loss": -5.984835624694824, "global_step": 11199, "epoch": 66} {"train_loss": -5.98816442489624, "global_step": 11200, "epoch": 66} {"train_loss": -5.966373443603516, "global_step": 11201, "epoch": 66} {"train_loss": -6.015155792236328, "global_step": 11202, "epoch": 66} {"train_loss": -5.982684135437012, "global_step": 11203, "epoch": 66} {"train_loss": -5.994440078735352, "global_step": 11204, "epoch": 66} {"train_loss": -6.029821395874023, "global_step": 11205, "epoch": 66} {"train_loss": -6.241551876068115, "global_step": 11206, "epoch": 66} {"train_loss": -6.021083831787109, "global_step": 11207, "epoch": 66} {"train_loss": -6.047843933105469, "global_step": 11208, "epoch": 66} {"train_loss": -6.166443824768066, "global_step": 11209, "epoch": 66} {"train_loss": -5.668931007385254, "global_step": 11210, "epoch": 66} {"train_loss": -5.685197353363037, "global_step": 11211, "epoch": 66} {"train_loss": -5.677868843078613, "global_step": 11212, "epoch": 66} {"train_loss": -5.977914810180664, "global_step": 11213, "epoch": 66} {"train_loss": -5.8220534324646, "global_step": 11214, "epoch": 66} {"train_loss": -5.8377909660339355, "global_step": 11215, "epoch": 66} {"train_loss": -6.156848430633545, "global_step": 11216, "epoch": 66} {"train_loss": -5.992897033691406, "global_step": 11217, "epoch": 66} {"train_loss": -5.814067840576172, "global_step": 11218, "epoch": 66} {"train_loss": -6.239838600158691, "global_step": 11219, "epoch": 66} {"train_loss": -6.022336959838867, "global_step": 11220, "epoch": 66} {"train_loss": -6.191486358642578, "global_step": 11221, "epoch": 66} {"train_loss": -6.123585224151611, "global_step": 11222, "epoch": 66} {"train_loss": -6.099801540374756, "global_step": 11223, "epoch": 66} {"train_loss": -6.157827377319336, "global_step": 11224, "epoch": 66} {"train_loss": -5.989615440368652, "global_step": 11225, "epoch": 66} {"train_loss": -5.755560874938965, "global_step": 11226, "epoch": 66} {"train_loss": -6.18137788772583, "global_step": 11227, "epoch": 66} {"train_loss": -6.1257429122924805, "global_step": 11228, "epoch": 66} {"train_loss": -5.896843910217285, "global_step": 11229, "epoch": 66} {"train_loss": -5.852560043334961, "global_step": 11230, "epoch": 66} {"train_loss": -6.112614154815674, "global_step": 11231, "epoch": 66} {"train_loss": -6.052459239959717, "global_step": 11232, "epoch": 66} {"train_loss": -5.822992324829102, "global_step": 11233, "epoch": 66} {"train_loss": -5.875604629516602, "global_step": 11234, "epoch": 66} {"train_loss": -5.871033668518066, "global_step": 11235, "epoch": 66} {"train_loss": -5.853057384490967, "global_step": 11236, "epoch": 66} {"train_loss": -5.7485246658325195, "global_step": 11237, "epoch": 66} {"train_loss": -5.8983354568481445, "global_step": 11238, "epoch": 66} {"train_loss": -5.8873138427734375, "global_step": 11239, "epoch": 66} {"train_loss": -5.86845588684082, "global_step": 11240, "epoch": 66} {"train_loss": -5.543439865112305, "global_step": 11241, "epoch": 66} {"train_loss": -5.798890113830566, "global_step": 11242, "epoch": 66} {"train_loss": -5.851917743682861, "global_step": 11243, "epoch": 66} {"train_loss": -5.812191963195801, "global_step": 11244, "epoch": 66} {"train_loss": -5.949758052825928, "global_step": 11245, "epoch": 66} {"train_loss": -5.664433002471924, "global_step": 11246, "epoch": 66} {"train_loss": -6.064157009124756, "global_step": 11247, "epoch": 66} {"train_loss": -5.805977821350098, "global_step": 11248, "epoch": 66} {"train_loss": -5.888965606689453, "global_step": 11249, "epoch": 66} {"train_loss": -5.897822380065918, "global_step": 11250, "epoch": 66} {"train_loss": -5.731629848480225, "global_step": 11251, "epoch": 66} {"train_loss": -5.8661041259765625, "global_step": 11252, "epoch": 66} {"train_loss": -5.750338554382324, "global_step": 11253, "epoch": 66} {"train_loss": -6.0015339851379395, "global_step": 11254, "epoch": 66} {"train_loss": -5.910130988983881, "global_step": 11255, "epoch": 66, "val_loss": 259514.46875} {"train_loss": -5.682828903198242, "global_step": 11256, "epoch": 67} {"train_loss": -6.072146415710449, "global_step": 11257, "epoch": 67} {"train_loss": -6.007027626037598, "global_step": 11258, "epoch": 67} {"train_loss": -5.831625938415527, "global_step": 11259, "epoch": 67} {"train_loss": -6.1053972244262695, "global_step": 11260, "epoch": 67} {"train_loss": -6.202887535095215, "global_step": 11261, "epoch": 67} {"train_loss": -6.1439948081970215, "global_step": 11262, "epoch": 67} {"train_loss": -6.1429057121276855, "global_step": 11263, "epoch": 67} {"train_loss": -6.11265754699707, "global_step": 11264, "epoch": 67} {"train_loss": -5.864918231964111, "global_step": 11265, "epoch": 67} {"train_loss": -5.943544864654541, "global_step": 11266, "epoch": 67} {"train_loss": -5.37755012512207, "global_step": 11267, "epoch": 67} {"train_loss": -6.008275032043457, "global_step": 11268, "epoch": 67} {"train_loss": -5.430707931518555, "global_step": 11269, "epoch": 67} {"train_loss": -5.89851188659668, "global_step": 11270, "epoch": 67} {"train_loss": -5.93766975402832, "global_step": 11271, "epoch": 67} {"train_loss": -5.354564189910889, "global_step": 11272, "epoch": 67} {"train_loss": -5.762857913970947, "global_step": 11273, "epoch": 67} {"train_loss": -5.569533348083496, "global_step": 11274, "epoch": 67} {"train_loss": -5.434917449951172, "global_step": 11275, "epoch": 67} {"train_loss": -5.703221321105957, "global_step": 11276, "epoch": 67} {"train_loss": -5.8559346199035645, "global_step": 11277, "epoch": 67} {"train_loss": -5.700125694274902, "global_step": 11278, "epoch": 67} {"train_loss": -6.03419303894043, "global_step": 11279, "epoch": 67} {"train_loss": -5.788150787353516, "global_step": 11280, "epoch": 67} {"train_loss": -6.03237247467041, "global_step": 11281, "epoch": 67} {"train_loss": -5.776497840881348, "global_step": 11282, "epoch": 67} {"train_loss": -5.7512359619140625, "global_step": 11283, "epoch": 67} {"train_loss": -5.745640754699707, "global_step": 11284, "epoch": 67} {"train_loss": -6.0626115798950195, "global_step": 11285, "epoch": 67} {"train_loss": -5.895918369293213, "global_step": 11286, "epoch": 67} {"train_loss": -5.89621639251709, "global_step": 11287, "epoch": 67} {"train_loss": -6.002261638641357, "global_step": 11288, "epoch": 67} {"train_loss": -6.026946067810059, "global_step": 11289, "epoch": 67} {"train_loss": -5.869375228881836, "global_step": 11290, "epoch": 67} {"train_loss": -5.976574897766113, "global_step": 11291, "epoch": 67} {"train_loss": -6.028651237487793, "global_step": 11292, "epoch": 67} {"train_loss": -5.956653594970703, "global_step": 11293, "epoch": 67} {"train_loss": -5.76811408996582, "global_step": 11294, "epoch": 67} {"train_loss": -5.939715385437012, "global_step": 11295, "epoch": 67} {"train_loss": -6.067054748535156, "global_step": 11296, "epoch": 67} {"train_loss": -6.04137659072876, "global_step": 11297, "epoch": 67} {"train_loss": -6.023686408996582, "global_step": 11298, "epoch": 67} {"train_loss": -6.064359664916992, "global_step": 11299, "epoch": 67} {"train_loss": -5.91536808013916, "global_step": 11300, "epoch": 67} {"train_loss": -5.87009859085083, "global_step": 11301, "epoch": 67} {"train_loss": -6.206057548522949, "global_step": 11302, "epoch": 67} {"train_loss": -5.963271617889404, "global_step": 11303, "epoch": 67} {"train_loss": -6.0822906494140625, "global_step": 11304, "epoch": 67} {"train_loss": -5.695905685424805, "global_step": 11305, "epoch": 67} {"train_loss": -5.733752727508545, "global_step": 11306, "epoch": 67} {"train_loss": -5.955203056335449, "global_step": 11307, "epoch": 67} {"train_loss": -5.704624176025391, "global_step": 11308, "epoch": 67} {"train_loss": -5.665323257446289, "global_step": 11309, "epoch": 67} {"train_loss": -6.000258922576904, "global_step": 11310, "epoch": 67} {"train_loss": -5.938660621643066, "global_step": 11311, "epoch": 67} {"train_loss": -5.615387916564941, "global_step": 11312, "epoch": 67} {"train_loss": -5.880794048309326, "global_step": 11313, "epoch": 67} {"train_loss": -6.064326286315918, "global_step": 11314, "epoch": 67} {"train_loss": -6.040412902832031, "global_step": 11315, "epoch": 67} {"train_loss": -5.8180389404296875, "global_step": 11316, "epoch": 67} {"train_loss": -5.822605609893799, "global_step": 11317, "epoch": 67} {"train_loss": -5.718268394470215, "global_step": 11318, "epoch": 67} {"train_loss": -6.014521598815918, "global_step": 11319, "epoch": 67} {"train_loss": -6.0506696701049805, "global_step": 11320, "epoch": 67} {"train_loss": -5.840324401855469, "global_step": 11321, "epoch": 67} {"train_loss": -5.887187480926514, "global_step": 11322, "epoch": 67} {"train_loss": -5.865649700164795, "global_step": 11323, "epoch": 67} {"train_loss": -6.012801170349121, "global_step": 11324, "epoch": 67} {"train_loss": -5.692200183868408, "global_step": 11325, "epoch": 67} {"train_loss": -5.808342933654785, "global_step": 11326, "epoch": 67} {"train_loss": -5.732846260070801, "global_step": 11327, "epoch": 67} {"train_loss": -5.610973834991455, "global_step": 11328, "epoch": 67} {"train_loss": -5.77626895904541, "global_step": 11329, "epoch": 67} {"train_loss": -5.537931442260742, "global_step": 11330, "epoch": 67} {"train_loss": -5.8629536628723145, "global_step": 11331, "epoch": 67} {"train_loss": -5.792978763580322, "global_step": 11332, "epoch": 67} {"train_loss": -5.605996131896973, "global_step": 11333, "epoch": 67} {"train_loss": -5.88055944442749, "global_step": 11334, "epoch": 67} {"train_loss": -5.697035789489746, "global_step": 11335, "epoch": 67} {"train_loss": -5.741231441497803, "global_step": 11336, "epoch": 67} {"train_loss": -5.865591049194336, "global_step": 11337, "epoch": 67} {"train_loss": -5.799025058746338, "global_step": 11338, "epoch": 67} {"train_loss": -5.818540096282959, "global_step": 11339, "epoch": 67} {"train_loss": -6.150886058807373, "global_step": 11340, "epoch": 67} {"train_loss": -5.776228904724121, "global_step": 11341, "epoch": 67} {"train_loss": -6.045029640197754, "global_step": 11342, "epoch": 67} {"train_loss": -5.787893295288086, "global_step": 11343, "epoch": 67} {"train_loss": -5.947587490081787, "global_step": 11344, "epoch": 67} {"train_loss": -5.610321998596191, "global_step": 11345, "epoch": 67} {"train_loss": -6.072883129119873, "global_step": 11346, "epoch": 67} {"train_loss": -6.035251617431641, "global_step": 11347, "epoch": 67} {"train_loss": -5.990880489349365, "global_step": 11348, "epoch": 67} {"train_loss": -5.6543402671813965, "global_step": 11349, "epoch": 67} {"train_loss": -6.115209579467773, "global_step": 11350, "epoch": 67} {"train_loss": -5.9109296798706055, "global_step": 11351, "epoch": 67} {"train_loss": -6.090503215789795, "global_step": 11352, "epoch": 67} {"train_loss": -6.0550432205200195, "global_step": 11353, "epoch": 67} {"train_loss": -5.965356349945068, "global_step": 11354, "epoch": 67} {"train_loss": -5.931893348693848, "global_step": 11355, "epoch": 67} {"train_loss": -5.886727809906006, "global_step": 11356, "epoch": 67} {"train_loss": -6.134073257446289, "global_step": 11357, "epoch": 67} {"train_loss": -5.823972702026367, "global_step": 11358, "epoch": 67} {"train_loss": -5.910597324371338, "global_step": 11359, "epoch": 67} {"train_loss": -6.119684219360352, "global_step": 11360, "epoch": 67} {"train_loss": -6.15190315246582, "global_step": 11361, "epoch": 67} {"train_loss": -6.10114860534668, "global_step": 11362, "epoch": 67} {"train_loss": -6.128902912139893, "global_step": 11363, "epoch": 67} {"train_loss": -6.152792930603027, "global_step": 11364, "epoch": 67} {"train_loss": -6.034945487976074, "global_step": 11365, "epoch": 67} {"train_loss": -6.1347455978393555, "global_step": 11366, "epoch": 67} {"train_loss": -5.987140655517578, "global_step": 11367, "epoch": 67} {"train_loss": -6.006718158721924, "global_step": 11368, "epoch": 67} {"train_loss": -5.896685600280762, "global_step": 11369, "epoch": 67} {"train_loss": -5.87322473526001, "global_step": 11370, "epoch": 67} {"train_loss": -5.9698381423950195, "global_step": 11371, "epoch": 67} {"train_loss": -5.936156272888184, "global_step": 11372, "epoch": 67} {"train_loss": -5.974889755249023, "global_step": 11373, "epoch": 67} {"train_loss": -6.02606201171875, "global_step": 11374, "epoch": 67} {"train_loss": -5.937058925628662, "global_step": 11375, "epoch": 67} {"train_loss": -6.051505088806152, "global_step": 11376, "epoch": 67} {"train_loss": -5.758317947387695, "global_step": 11377, "epoch": 67} {"train_loss": -6.116069316864014, "global_step": 11378, "epoch": 67} {"train_loss": -5.828597068786621, "global_step": 11379, "epoch": 67} {"train_loss": -5.774470329284668, "global_step": 11380, "epoch": 67} {"train_loss": -6.008334159851074, "global_step": 11381, "epoch": 67} {"train_loss": -5.979096412658691, "global_step": 11382, "epoch": 67} {"train_loss": -5.7429680824279785, "global_step": 11383, "epoch": 67} {"train_loss": -5.921704292297363, "global_step": 11384, "epoch": 67} {"train_loss": -5.977245807647705, "global_step": 11385, "epoch": 67} {"train_loss": -5.968192100524902, "global_step": 11386, "epoch": 67} {"train_loss": -6.04232120513916, "global_step": 11387, "epoch": 67} {"train_loss": -5.989308834075928, "global_step": 11388, "epoch": 67} {"train_loss": -6.177811622619629, "global_step": 11389, "epoch": 67} {"train_loss": -6.225008964538574, "global_step": 11390, "epoch": 67} {"train_loss": -5.850161552429199, "global_step": 11391, "epoch": 67} {"train_loss": -5.911104202270508, "global_step": 11392, "epoch": 67} {"train_loss": -6.35427713394165, "global_step": 11393, "epoch": 67} {"train_loss": -5.830658912658691, "global_step": 11394, "epoch": 67} {"train_loss": -6.042757987976074, "global_step": 11395, "epoch": 67} {"train_loss": -5.986274242401123, "global_step": 11396, "epoch": 67} {"train_loss": -5.886065483093262, "global_step": 11397, "epoch": 67} {"train_loss": -6.071205139160156, "global_step": 11398, "epoch": 67} {"train_loss": -5.82729434967041, "global_step": 11399, "epoch": 67} {"train_loss": -6.100399494171143, "global_step": 11400, "epoch": 67} {"train_loss": -5.784771919250488, "global_step": 11401, "epoch": 67} {"train_loss": -5.7777910232543945, "global_step": 11402, "epoch": 67} {"train_loss": -5.932210922241211, "global_step": 11403, "epoch": 67} {"train_loss": -5.772650241851807, "global_step": 11404, "epoch": 67} {"train_loss": -5.8122406005859375, "global_step": 11405, "epoch": 67} {"train_loss": -5.621102333068848, "global_step": 11406, "epoch": 67} {"train_loss": -6.078886985778809, "global_step": 11407, "epoch": 67} {"train_loss": -5.62660551071167, "global_step": 11408, "epoch": 67} {"train_loss": -5.666815757751465, "global_step": 11409, "epoch": 67} {"train_loss": -5.941699981689453, "global_step": 11410, "epoch": 67} {"train_loss": -5.9660162925720215, "global_step": 11411, "epoch": 67} {"train_loss": -6.060285568237305, "global_step": 11412, "epoch": 67} {"train_loss": -5.697210311889648, "global_step": 11413, "epoch": 67} {"train_loss": -5.441170692443848, "global_step": 11414, "epoch": 67} {"train_loss": -5.467372894287109, "global_step": 11415, "epoch": 67} {"train_loss": -6.042843341827393, "global_step": 11416, "epoch": 67} {"train_loss": -5.8713579177856445, "global_step": 11417, "epoch": 67} {"train_loss": -5.619647026062012, "global_step": 11418, "epoch": 67} {"train_loss": -5.713465690612793, "global_step": 11419, "epoch": 67} {"train_loss": -5.851652145385742, "global_step": 11420, "epoch": 67} {"train_loss": -5.991729259490967, "global_step": 11421, "epoch": 67} {"train_loss": -5.943465709686279, "global_step": 11422, "epoch": 67} {"train_loss": -5.8966067887487865, "global_step": 11423, "epoch": 67, "val_loss": 258097.546875} {"train_loss": -5.7318806648254395, "global_step": 11424, "epoch": 68} {"train_loss": -5.921660423278809, "global_step": 11425, "epoch": 68} {"train_loss": -5.975055694580078, "global_step": 11426, "epoch": 68} {"train_loss": -6.204282283782959, "global_step": 11427, "epoch": 68} {"train_loss": -5.771763324737549, "global_step": 11428, "epoch": 68} {"train_loss": -6.086944103240967, "global_step": 11429, "epoch": 68} {"train_loss": -5.853729248046875, "global_step": 11430, "epoch": 68} {"train_loss": -5.9717116355896, "global_step": 11431, "epoch": 68} {"train_loss": -6.182074546813965, "global_step": 11432, "epoch": 68} {"train_loss": -5.861867904663086, "global_step": 11433, "epoch": 68} {"train_loss": -5.714076519012451, "global_step": 11434, "epoch": 68} {"train_loss": -5.920779228210449, "global_step": 11435, "epoch": 68} {"train_loss": -6.070296287536621, "global_step": 11436, "epoch": 68} {"train_loss": -6.0945916175842285, "global_step": 11437, "epoch": 68} {"train_loss": -6.171164512634277, "global_step": 11438, "epoch": 68} {"train_loss": -5.976409912109375, "global_step": 11439, "epoch": 68} {"train_loss": -5.857018947601318, "global_step": 11440, "epoch": 68} {"train_loss": -5.664951324462891, "global_step": 11441, "epoch": 68} {"train_loss": -5.830496788024902, "global_step": 11442, "epoch": 68} {"train_loss": -5.922466278076172, "global_step": 11443, "epoch": 68} {"train_loss": -5.9108076095581055, "global_step": 11444, "epoch": 68} {"train_loss": -6.092072010040283, "global_step": 11445, "epoch": 68} {"train_loss": -5.988232612609863, "global_step": 11446, "epoch": 68} {"train_loss": -5.994174480438232, "global_step": 11447, "epoch": 68} {"train_loss": -5.9014105796813965, "global_step": 11448, "epoch": 68} {"train_loss": -6.011219024658203, "global_step": 11449, "epoch": 68} {"train_loss": -5.911993026733398, "global_step": 11450, "epoch": 68} {"train_loss": -6.063878059387207, "global_step": 11451, "epoch": 68} {"train_loss": -5.952398300170898, "global_step": 11452, "epoch": 68} {"train_loss": -5.968807220458984, "global_step": 11453, "epoch": 68} {"train_loss": -6.151577949523926, "global_step": 11454, "epoch": 68} {"train_loss": -5.987001419067383, "global_step": 11455, "epoch": 68} {"train_loss": -6.0725626945495605, "global_step": 11456, "epoch": 68} {"train_loss": -5.9876203536987305, "global_step": 11457, "epoch": 68} {"train_loss": -5.802762031555176, "global_step": 11458, "epoch": 68} {"train_loss": -5.825287342071533, "global_step": 11459, "epoch": 68} {"train_loss": -5.803112030029297, "global_step": 11460, "epoch": 68} {"train_loss": -5.884670734405518, "global_step": 11461, "epoch": 68} {"train_loss": -6.035661697387695, "global_step": 11462, "epoch": 68} {"train_loss": -5.92060661315918, "global_step": 11463, "epoch": 68} {"train_loss": -5.776662349700928, "global_step": 11464, "epoch": 68} {"train_loss": -6.010707378387451, "global_step": 11465, "epoch": 68} {"train_loss": -6.149669647216797, "global_step": 11466, "epoch": 68} {"train_loss": -5.9482831954956055, "global_step": 11467, "epoch": 68} {"train_loss": -5.844038963317871, "global_step": 11468, "epoch": 68} {"train_loss": -5.928464412689209, "global_step": 11469, "epoch": 68} {"train_loss": -6.000998020172119, "global_step": 11470, "epoch": 68} {"train_loss": -6.037271499633789, "global_step": 11471, "epoch": 68} {"train_loss": -6.023080825805664, "global_step": 11472, "epoch": 68} {"train_loss": -6.233105659484863, "global_step": 11473, "epoch": 68} {"train_loss": -6.157967567443848, "global_step": 11474, "epoch": 68} {"train_loss": -5.956648826599121, "global_step": 11475, "epoch": 68} {"train_loss": -5.907961368560791, "global_step": 11476, "epoch": 68} {"train_loss": -5.69812536239624, "global_step": 11477, "epoch": 68} {"train_loss": -5.69683837890625, "global_step": 11478, "epoch": 68} {"train_loss": -6.005819320678711, "global_step": 11479, "epoch": 68} {"train_loss": -6.1691694259643555, "global_step": 11480, "epoch": 68} {"train_loss": -5.700078010559082, "global_step": 11481, "epoch": 68} {"train_loss": -6.131956100463867, "global_step": 11482, "epoch": 68} {"train_loss": -5.986448287963867, "global_step": 11483, "epoch": 68} {"train_loss": -5.904027938842773, "global_step": 11484, "epoch": 68} {"train_loss": -5.978411674499512, "global_step": 11485, "epoch": 68} {"train_loss": -6.152994155883789, "global_step": 11486, "epoch": 68} {"train_loss": -6.1053385734558105, "global_step": 11487, "epoch": 68} {"train_loss": -6.058976173400879, "global_step": 11488, "epoch": 68} {"train_loss": -6.0161285400390625, "global_step": 11489, "epoch": 68} {"train_loss": -5.947221755981445, "global_step": 11490, "epoch": 68} {"train_loss": -6.055194854736328, "global_step": 11491, "epoch": 68} {"train_loss": -5.944094181060791, "global_step": 11492, "epoch": 68} {"train_loss": -6.087985992431641, "global_step": 11493, "epoch": 68} {"train_loss": -6.093740463256836, "global_step": 11494, "epoch": 68} {"train_loss": -5.811199188232422, "global_step": 11495, "epoch": 68} {"train_loss": -5.771051406860352, "global_step": 11496, "epoch": 68} {"train_loss": -5.9759416580200195, "global_step": 11497, "epoch": 68} {"train_loss": -6.097269058227539, "global_step": 11498, "epoch": 68} {"train_loss": -5.882715225219727, "global_step": 11499, "epoch": 68} {"train_loss": -5.981448173522949, "global_step": 11500, "epoch": 68} {"train_loss": -5.838403701782227, "global_step": 11501, "epoch": 68} {"train_loss": -5.939033508300781, "global_step": 11502, "epoch": 68} {"train_loss": -5.832216262817383, "global_step": 11503, "epoch": 68} {"train_loss": -5.928039073944092, "global_step": 11504, "epoch": 68} {"train_loss": -5.992446422576904, "global_step": 11505, "epoch": 68} {"train_loss": -5.8959856033325195, "global_step": 11506, "epoch": 68} {"train_loss": -5.964805603027344, "global_step": 11507, "epoch": 68} {"train_loss": -5.969213485717773, "global_step": 11508, "epoch": 68} {"train_loss": -6.077353477478027, "global_step": 11509, "epoch": 68} {"train_loss": -5.963104248046875, "global_step": 11510, "epoch": 68} {"train_loss": -5.6910247802734375, "global_step": 11511, "epoch": 68} {"train_loss": -6.110700607299805, "global_step": 11512, "epoch": 68} {"train_loss": -6.100700855255127, "global_step": 11513, "epoch": 68} {"train_loss": -5.778655529022217, "global_step": 11514, "epoch": 68} {"train_loss": -5.843646049499512, "global_step": 11515, "epoch": 68} {"train_loss": -5.883084297180176, "global_step": 11516, "epoch": 68} {"train_loss": -6.106340408325195, "global_step": 11517, "epoch": 68} {"train_loss": -5.928908824920654, "global_step": 11518, "epoch": 68} {"train_loss": -6.1542463302612305, "global_step": 11519, "epoch": 68} {"train_loss": -6.056130409240723, "global_step": 11520, "epoch": 68} {"train_loss": -5.87093448638916, "global_step": 11521, "epoch": 68} {"train_loss": -6.051141738891602, "global_step": 11522, "epoch": 68} {"train_loss": -5.622496604919434, "global_step": 11523, "epoch": 68} {"train_loss": -5.909931182861328, "global_step": 11524, "epoch": 68} {"train_loss": -5.529777526855469, "global_step": 11525, "epoch": 68} {"train_loss": -6.175225257873535, "global_step": 11526, "epoch": 68} {"train_loss": -5.66881799697876, "global_step": 11527, "epoch": 68} {"train_loss": -5.794550895690918, "global_step": 11528, "epoch": 68} {"train_loss": -5.790785789489746, "global_step": 11529, "epoch": 68} {"train_loss": -5.684838771820068, "global_step": 11530, "epoch": 68} {"train_loss": -5.899588584899902, "global_step": 11531, "epoch": 68} {"train_loss": -5.969944000244141, "global_step": 11532, "epoch": 68} {"train_loss": -5.9028425216674805, "global_step": 11533, "epoch": 68} {"train_loss": -6.061925411224365, "global_step": 11534, "epoch": 68} {"train_loss": -5.9705915451049805, "global_step": 11535, "epoch": 68} {"train_loss": -6.197635650634766, "global_step": 11536, "epoch": 68} {"train_loss": -5.94465446472168, "global_step": 11537, "epoch": 68} {"train_loss": -5.879364967346191, "global_step": 11538, "epoch": 68} {"train_loss": -6.289822578430176, "global_step": 11539, "epoch": 68} {"train_loss": -5.5949296951293945, "global_step": 11540, "epoch": 68} {"train_loss": -6.005729675292969, "global_step": 11541, "epoch": 68} {"train_loss": -6.021370887756348, "global_step": 11542, "epoch": 68} {"train_loss": -5.987993240356445, "global_step": 11543, "epoch": 68} {"train_loss": -5.920701026916504, "global_step": 11544, "epoch": 68} {"train_loss": -5.67558479309082, "global_step": 11545, "epoch": 68} {"train_loss": -5.905422210693359, "global_step": 11546, "epoch": 68} {"train_loss": -5.837943077087402, "global_step": 11547, "epoch": 68} {"train_loss": -5.880352973937988, "global_step": 11548, "epoch": 68} {"train_loss": -5.610189437866211, "global_step": 11549, "epoch": 68} {"train_loss": -5.983822345733643, "global_step": 11550, "epoch": 68} {"train_loss": -5.8769073486328125, "global_step": 11551, "epoch": 68} {"train_loss": -5.775208473205566, "global_step": 11552, "epoch": 68} {"train_loss": -6.014899253845215, "global_step": 11553, "epoch": 68} {"train_loss": -6.06632137298584, "global_step": 11554, "epoch": 68} {"train_loss": -5.768474578857422, "global_step": 11555, "epoch": 68} {"train_loss": -5.986509799957275, "global_step": 11556, "epoch": 68} {"train_loss": -6.113812446594238, "global_step": 11557, "epoch": 68} {"train_loss": -6.165348052978516, "global_step": 11558, "epoch": 68} {"train_loss": -6.087383270263672, "global_step": 11559, "epoch": 68} {"train_loss": -5.74702787399292, "global_step": 11560, "epoch": 68} {"train_loss": -5.810061454772949, "global_step": 11561, "epoch": 68} {"train_loss": -5.765819549560547, "global_step": 11562, "epoch": 68} {"train_loss": -5.78262996673584, "global_step": 11563, "epoch": 68} {"train_loss": -5.889294624328613, "global_step": 11564, "epoch": 68} {"train_loss": -5.783496856689453, "global_step": 11565, "epoch": 68} {"train_loss": -5.605650901794434, "global_step": 11566, "epoch": 68} {"train_loss": -5.788211822509766, "global_step": 11567, "epoch": 68} {"train_loss": -5.562444686889648, "global_step": 11568, "epoch": 68} {"train_loss": -6.124795913696289, "global_step": 11569, "epoch": 68} {"train_loss": -5.464118003845215, "global_step": 11570, "epoch": 68} {"train_loss": -5.635793209075928, "global_step": 11571, "epoch": 68} {"train_loss": -5.963241100311279, "global_step": 11572, "epoch": 68} {"train_loss": -5.75344181060791, "global_step": 11573, "epoch": 68} {"train_loss": -5.71920919418335, "global_step": 11574, "epoch": 68} {"train_loss": -5.724475860595703, "global_step": 11575, "epoch": 68} {"train_loss": -5.786240577697754, "global_step": 11576, "epoch": 68} {"train_loss": -5.649332046508789, "global_step": 11577, "epoch": 68} {"train_loss": -5.904750347137451, "global_step": 11578, "epoch": 68} {"train_loss": -5.809842109680176, "global_step": 11579, "epoch": 68} {"train_loss": -5.885603904724121, "global_step": 11580, "epoch": 68} {"train_loss": -5.793776035308838, "global_step": 11581, "epoch": 68} {"train_loss": -5.772089958190918, "global_step": 11582, "epoch": 68} {"train_loss": -5.917398929595947, "global_step": 11583, "epoch": 68} {"train_loss": -5.93962287902832, "global_step": 11584, "epoch": 68} {"train_loss": -5.9344682693481445, "global_step": 11585, "epoch": 68} {"train_loss": -5.727331161499023, "global_step": 11586, "epoch": 68} {"train_loss": -5.745972156524658, "global_step": 11587, "epoch": 68} {"train_loss": -5.640578269958496, "global_step": 11588, "epoch": 68} {"train_loss": -5.884208679199219, "global_step": 11589, "epoch": 68} {"train_loss": -5.584638595581055, "global_step": 11590, "epoch": 68} {"train_loss": -5.9136102965899875, "global_step": 11591, "epoch": 68, "val_loss": 254975.8125} {"train_loss": -5.933602333068848, "global_step": 11592, "epoch": 69} {"train_loss": -5.817930221557617, "global_step": 11593, "epoch": 69} {"train_loss": -6.030360698699951, "global_step": 11594, "epoch": 69} {"train_loss": -5.972033977508545, "global_step": 11595, "epoch": 69} {"train_loss": -6.093320846557617, "global_step": 11596, "epoch": 69} {"train_loss": -6.049018859863281, "global_step": 11597, "epoch": 69} {"train_loss": -5.911736488342285, "global_step": 11598, "epoch": 69} {"train_loss": -5.966673851013184, "global_step": 11599, "epoch": 69} {"train_loss": -6.047689437866211, "global_step": 11600, "epoch": 69} {"train_loss": -5.685336589813232, "global_step": 11601, "epoch": 69} {"train_loss": -6.077564239501953, "global_step": 11602, "epoch": 69} {"train_loss": -5.8278727531433105, "global_step": 11603, "epoch": 69} {"train_loss": -6.164814472198486, "global_step": 11604, "epoch": 69} {"train_loss": -5.953248500823975, "global_step": 11605, "epoch": 69} {"train_loss": -5.828381538391113, "global_step": 11606, "epoch": 69} {"train_loss": -6.095213413238525, "global_step": 11607, "epoch": 69} {"train_loss": -6.285215377807617, "global_step": 11608, "epoch": 69} {"train_loss": -5.963959693908691, "global_step": 11609, "epoch": 69} {"train_loss": -6.111032485961914, "global_step": 11610, "epoch": 69} {"train_loss": -6.065911293029785, "global_step": 11611, "epoch": 69} {"train_loss": -5.972342491149902, "global_step": 11612, "epoch": 69} {"train_loss": -6.176248550415039, "global_step": 11613, "epoch": 69} {"train_loss": -6.0715742111206055, "global_step": 11614, "epoch": 69} {"train_loss": -5.931028366088867, "global_step": 11615, "epoch": 69} {"train_loss": -5.8643693923950195, "global_step": 11616, "epoch": 69} {"train_loss": -5.966794013977051, "global_step": 11617, "epoch": 69} {"train_loss": -6.04617166519165, "global_step": 11618, "epoch": 69} {"train_loss": -6.016119003295898, "global_step": 11619, "epoch": 69} {"train_loss": -5.906720161437988, "global_step": 11620, "epoch": 69} {"train_loss": -6.159401893615723, "global_step": 11621, "epoch": 69} {"train_loss": -5.93469762802124, "global_step": 11622, "epoch": 69} {"train_loss": -5.998648166656494, "global_step": 11623, "epoch": 69} {"train_loss": -5.77842903137207, "global_step": 11624, "epoch": 69} {"train_loss": -6.048500061035156, "global_step": 11625, "epoch": 69} {"train_loss": -5.841034889221191, "global_step": 11626, "epoch": 69} {"train_loss": -6.056729316711426, "global_step": 11627, "epoch": 69} {"train_loss": -6.002437114715576, "global_step": 11628, "epoch": 69} {"train_loss": -6.1611528396606445, "global_step": 11629, "epoch": 69} {"train_loss": -5.998175144195557, "global_step": 11630, "epoch": 69} {"train_loss": -6.260584831237793, "global_step": 11631, "epoch": 69} {"train_loss": -5.774919509887695, "global_step": 11632, "epoch": 69} {"train_loss": -5.7288126945495605, "global_step": 11633, "epoch": 69} {"train_loss": -6.139944076538086, "global_step": 11634, "epoch": 69} {"train_loss": -5.756732940673828, "global_step": 11635, "epoch": 69} {"train_loss": -6.112177848815918, "global_step": 11636, "epoch": 69} {"train_loss": -5.640295028686523, "global_step": 11637, "epoch": 69} {"train_loss": -5.924188137054443, "global_step": 11638, "epoch": 69} {"train_loss": -5.863073348999023, "global_step": 11639, "epoch": 69} {"train_loss": -5.759481430053711, "global_step": 11640, "epoch": 69} {"train_loss": -6.120785713195801, "global_step": 11641, "epoch": 69} {"train_loss": -6.142284393310547, "global_step": 11642, "epoch": 69} {"train_loss": -5.9301629066467285, "global_step": 11643, "epoch": 69} {"train_loss": -5.7464447021484375, "global_step": 11644, "epoch": 69} {"train_loss": -5.897548198699951, "global_step": 11645, "epoch": 69} {"train_loss": -6.178606033325195, "global_step": 11646, "epoch": 69} {"train_loss": -6.119243144989014, "global_step": 11647, "epoch": 69} {"train_loss": -5.957925796508789, "global_step": 11648, "epoch": 69} {"train_loss": -5.974917411804199, "global_step": 11649, "epoch": 69} {"train_loss": -5.977581977844238, "global_step": 11650, "epoch": 69} {"train_loss": -6.079154014587402, "global_step": 11651, "epoch": 69} {"train_loss": -5.8829731941223145, "global_step": 11652, "epoch": 69} {"train_loss": -6.140761852264404, "global_step": 11653, "epoch": 69} {"train_loss": -6.074604034423828, "global_step": 11654, "epoch": 69} {"train_loss": -5.868658542633057, "global_step": 11655, "epoch": 69} {"train_loss": -6.253176689147949, "global_step": 11656, "epoch": 69} {"train_loss": -6.024746894836426, "global_step": 11657, "epoch": 69} {"train_loss": -6.0331196784973145, "global_step": 11658, "epoch": 69} {"train_loss": -6.08575963973999, "global_step": 11659, "epoch": 69} {"train_loss": -5.904840469360352, "global_step": 11660, "epoch": 69} {"train_loss": -6.229626178741455, "global_step": 11661, "epoch": 69} {"train_loss": -6.073271751403809, "global_step": 11662, "epoch": 69} {"train_loss": -6.2876410484313965, "global_step": 11663, "epoch": 69} {"train_loss": -6.054285049438477, "global_step": 11664, "epoch": 69} {"train_loss": -6.106724739074707, "global_step": 11665, "epoch": 69} {"train_loss": -6.038355827331543, "global_step": 11666, "epoch": 69} {"train_loss": -6.381324768066406, "global_step": 11667, "epoch": 69} {"train_loss": -5.7469706535339355, "global_step": 11668, "epoch": 69} {"train_loss": -6.080163478851318, "global_step": 11669, "epoch": 69} {"train_loss": -5.9884772300720215, "global_step": 11670, "epoch": 69} {"train_loss": -5.862874984741211, "global_step": 11671, "epoch": 69} {"train_loss": -5.969346523284912, "global_step": 11672, "epoch": 69} {"train_loss": -5.8884782791137695, "global_step": 11673, "epoch": 69} {"train_loss": -5.582907199859619, "global_step": 11674, "epoch": 69} {"train_loss": -6.180690288543701, "global_step": 11675, "epoch": 69} {"train_loss": -5.898715972900391, "global_step": 11676, "epoch": 69} {"train_loss": -5.712307453155518, "global_step": 11677, "epoch": 69} {"train_loss": -5.910151958465576, "global_step": 11678, "epoch": 69} {"train_loss": -5.885786056518555, "global_step": 11679, "epoch": 69} {"train_loss": -5.984949111938477, "global_step": 11680, "epoch": 69} {"train_loss": -5.6916890144348145, "global_step": 11681, "epoch": 69} {"train_loss": -5.679432392120361, "global_step": 11682, "epoch": 69} {"train_loss": -5.9755330085754395, "global_step": 11683, "epoch": 69} {"train_loss": -5.834995746612549, "global_step": 11684, "epoch": 69} {"train_loss": -5.972054481506348, "global_step": 11685, "epoch": 69} {"train_loss": -5.91750955581665, "global_step": 11686, "epoch": 69} {"train_loss": -5.949370384216309, "global_step": 11687, "epoch": 69} {"train_loss": -5.8447370529174805, "global_step": 11688, "epoch": 69} {"train_loss": -6.268521308898926, "global_step": 11689, "epoch": 69} {"train_loss": -6.000929832458496, "global_step": 11690, "epoch": 69} {"train_loss": -6.1574883460998535, "global_step": 11691, "epoch": 69} {"train_loss": -5.98721981048584, "global_step": 11692, "epoch": 69} {"train_loss": -6.096634387969971, "global_step": 11693, "epoch": 69} {"train_loss": -5.853541374206543, "global_step": 11694, "epoch": 69} {"train_loss": -6.1255693435668945, "global_step": 11695, "epoch": 69} {"train_loss": -6.161181926727295, "global_step": 11696, "epoch": 69} {"train_loss": -5.798961639404297, "global_step": 11697, "epoch": 69} {"train_loss": -6.049156665802002, "global_step": 11698, "epoch": 69} {"train_loss": -5.883736610412598, "global_step": 11699, "epoch": 69} {"train_loss": -5.936716079711914, "global_step": 11700, "epoch": 69} {"train_loss": -6.021544456481934, "global_step": 11701, "epoch": 69} {"train_loss": -5.714623928070068, "global_step": 11702, "epoch": 69} {"train_loss": -6.2919087409973145, "global_step": 11703, "epoch": 69} {"train_loss": -5.94584846496582, "global_step": 11704, "epoch": 69} {"train_loss": -5.927966594696045, "global_step": 11705, "epoch": 69} {"train_loss": -5.837891101837158, "global_step": 11706, "epoch": 69} {"train_loss": -5.72592830657959, "global_step": 11707, "epoch": 69} {"train_loss": -5.916542053222656, "global_step": 11708, "epoch": 69} {"train_loss": -5.672260284423828, "global_step": 11709, "epoch": 69} {"train_loss": -5.855572700500488, "global_step": 11710, "epoch": 69} {"train_loss": -6.156920433044434, "global_step": 11711, "epoch": 69} {"train_loss": -5.812884330749512, "global_step": 11712, "epoch": 69} {"train_loss": -5.830870628356934, "global_step": 11713, "epoch": 69} {"train_loss": -5.871300220489502, "global_step": 11714, "epoch": 69} {"train_loss": -5.6722798347473145, "global_step": 11715, "epoch": 69} {"train_loss": -5.634294509887695, "global_step": 11716, "epoch": 69} {"train_loss": -6.084482192993164, "global_step": 11717, "epoch": 69} {"train_loss": -5.807666778564453, "global_step": 11718, "epoch": 69} {"train_loss": -6.0468668937683105, "global_step": 11719, "epoch": 69} {"train_loss": -5.601051330566406, "global_step": 11720, "epoch": 69} {"train_loss": -6.1564788818359375, "global_step": 11721, "epoch": 69} {"train_loss": -6.005177974700928, "global_step": 11722, "epoch": 69} {"train_loss": -6.026918888092041, "global_step": 11723, "epoch": 69} {"train_loss": -5.970428943634033, "global_step": 11724, "epoch": 69} {"train_loss": -6.129691123962402, "global_step": 11725, "epoch": 69} {"train_loss": -6.191985130310059, "global_step": 11726, "epoch": 69} {"train_loss": -5.687827110290527, "global_step": 11727, "epoch": 69} {"train_loss": -5.831854820251465, "global_step": 11728, "epoch": 69} {"train_loss": -5.806497097015381, "global_step": 11729, "epoch": 69} {"train_loss": -5.871555328369141, "global_step": 11730, "epoch": 69} {"train_loss": -5.710910797119141, "global_step": 11731, "epoch": 69} {"train_loss": -5.979808807373047, "global_step": 11732, "epoch": 69} {"train_loss": -6.016061305999756, "global_step": 11733, "epoch": 69} {"train_loss": -5.970395565032959, "global_step": 11734, "epoch": 69} {"train_loss": -6.011610984802246, "global_step": 11735, "epoch": 69} {"train_loss": -6.172239303588867, "global_step": 11736, "epoch": 69} {"train_loss": -5.843903541564941, "global_step": 11737, "epoch": 69} {"train_loss": -5.871504783630371, "global_step": 11738, "epoch": 69} {"train_loss": -6.273769378662109, "global_step": 11739, "epoch": 69} {"train_loss": -6.136133193969727, "global_step": 11740, "epoch": 69} {"train_loss": -6.150976181030273, "global_step": 11741, "epoch": 69} {"train_loss": -6.023272514343262, "global_step": 11742, "epoch": 69} {"train_loss": -6.164827346801758, "global_step": 11743, "epoch": 69} {"train_loss": -6.296396255493164, "global_step": 11744, "epoch": 69} {"train_loss": -5.876984596252441, "global_step": 11745, "epoch": 69} {"train_loss": -5.926933288574219, "global_step": 11746, "epoch": 69} {"train_loss": -6.017303466796875, "global_step": 11747, "epoch": 69} {"train_loss": -6.27589225769043, "global_step": 11748, "epoch": 69} {"train_loss": -6.298943996429443, "global_step": 11749, "epoch": 69} {"train_loss": -6.028148651123047, "global_step": 11750, "epoch": 69} {"train_loss": -6.042537689208984, "global_step": 11751, "epoch": 69} {"train_loss": -6.214502334594727, "global_step": 11752, "epoch": 69} {"train_loss": -6.280364036560059, "global_step": 11753, "epoch": 69} {"train_loss": -6.214921951293945, "global_step": 11754, "epoch": 69} {"train_loss": -6.0551605224609375, "global_step": 11755, "epoch": 69} {"train_loss": -6.4573822021484375, "global_step": 11756, "epoch": 69} {"train_loss": -6.551053524017334, "global_step": 11757, "epoch": 69} {"train_loss": -6.246879577636719, "global_step": 11758, "epoch": 69} {"train_loss": -5.992006843998318, "global_step": 11759, "epoch": 69, "val_loss": 258463.71875} {"train_loss": -6.4761505126953125, "global_step": 11760, "epoch": 70} {"train_loss": -6.086493492126465, "global_step": 11761, "epoch": 70} {"train_loss": -5.883162498474121, "global_step": 11762, "epoch": 70} {"train_loss": -6.063590049743652, "global_step": 11763, "epoch": 70} {"train_loss": -6.053191184997559, "global_step": 11764, "epoch": 70} {"train_loss": -6.053991317749023, "global_step": 11765, "epoch": 70} {"train_loss": -6.308809280395508, "global_step": 11766, "epoch": 70} {"train_loss": -5.852205276489258, "global_step": 11767, "epoch": 70} {"train_loss": -6.082947731018066, "global_step": 11768, "epoch": 70} {"train_loss": -5.737268447875977, "global_step": 11769, "epoch": 70} {"train_loss": -6.122001647949219, "global_step": 11770, "epoch": 70} {"train_loss": -5.92287540435791, "global_step": 11771, "epoch": 70} {"train_loss": -5.872637748718262, "global_step": 11772, "epoch": 70} {"train_loss": -6.161868095397949, "global_step": 11773, "epoch": 70} {"train_loss": -5.904435157775879, "global_step": 11774, "epoch": 70} {"train_loss": -6.138667106628418, "global_step": 11775, "epoch": 70} {"train_loss": -6.186407566070557, "global_step": 11776, "epoch": 70} {"train_loss": -6.169659614562988, "global_step": 11777, "epoch": 70} {"train_loss": -6.142476558685303, "global_step": 11778, "epoch": 70} {"train_loss": -5.866660118103027, "global_step": 11779, "epoch": 70} {"train_loss": -6.092097282409668, "global_step": 11780, "epoch": 70} {"train_loss": -5.973080635070801, "global_step": 11781, "epoch": 70} {"train_loss": -6.248279571533203, "global_step": 11782, "epoch": 70} {"train_loss": -6.045888900756836, "global_step": 11783, "epoch": 70} {"train_loss": -6.231452465057373, "global_step": 11784, "epoch": 70} {"train_loss": -6.39535665512085, "global_step": 11785, "epoch": 70} {"train_loss": -6.050490379333496, "global_step": 11786, "epoch": 70} {"train_loss": -6.15524959564209, "global_step": 11787, "epoch": 70} {"train_loss": -5.940439224243164, "global_step": 11788, "epoch": 70} {"train_loss": -6.2934088706970215, "global_step": 11789, "epoch": 70} {"train_loss": -6.298877716064453, "global_step": 11790, "epoch": 70} {"train_loss": -6.1927385330200195, "global_step": 11791, "epoch": 70} {"train_loss": -5.939840316772461, "global_step": 11792, "epoch": 70} {"train_loss": -6.230515956878662, "global_step": 11793, "epoch": 70} {"train_loss": -5.7681121826171875, "global_step": 11794, "epoch": 70} {"train_loss": -5.6959099769592285, "global_step": 11795, "epoch": 70} {"train_loss": -5.771331310272217, "global_step": 11796, "epoch": 70} {"train_loss": -5.968420028686523, "global_step": 11797, "epoch": 70} {"train_loss": -5.905058860778809, "global_step": 11798, "epoch": 70} {"train_loss": -5.725322723388672, "global_step": 11799, "epoch": 70} {"train_loss": -5.508440017700195, "global_step": 11800, "epoch": 70} {"train_loss": -5.906209468841553, "global_step": 11801, "epoch": 70} {"train_loss": -5.987692356109619, "global_step": 11802, "epoch": 70} {"train_loss": -5.7610249519348145, "global_step": 11803, "epoch": 70} {"train_loss": -6.069835662841797, "global_step": 11804, "epoch": 70} {"train_loss": -6.108992576599121, "global_step": 11805, "epoch": 70} {"train_loss": -6.051451683044434, "global_step": 11806, "epoch": 70} {"train_loss": -6.051570892333984, "global_step": 11807, "epoch": 70} {"train_loss": -6.043179988861084, "global_step": 11808, "epoch": 70} {"train_loss": -5.739213943481445, "global_step": 11809, "epoch": 70} {"train_loss": -5.951757431030273, "global_step": 11810, "epoch": 70} {"train_loss": -5.756277084350586, "global_step": 11811, "epoch": 70} {"train_loss": -6.046761512756348, "global_step": 11812, "epoch": 70} {"train_loss": -5.953899383544922, "global_step": 11813, "epoch": 70} {"train_loss": -5.851614475250244, "global_step": 11814, "epoch": 70} {"train_loss": -5.7528862953186035, "global_step": 11815, "epoch": 70} {"train_loss": -5.920994758605957, "global_step": 11816, "epoch": 70} {"train_loss": -6.031708240509033, "global_step": 11817, "epoch": 70} {"train_loss": -6.009040832519531, "global_step": 11818, "epoch": 70} {"train_loss": -6.063440322875977, "global_step": 11819, "epoch": 70} {"train_loss": -6.0425872802734375, "global_step": 11820, "epoch": 70} {"train_loss": -6.024478435516357, "global_step": 11821, "epoch": 70} {"train_loss": -5.899322986602783, "global_step": 11822, "epoch": 70} {"train_loss": -6.265553951263428, "global_step": 11823, "epoch": 70} {"train_loss": -5.971986293792725, "global_step": 11824, "epoch": 70} {"train_loss": -5.989065170288086, "global_step": 11825, "epoch": 70} {"train_loss": -6.052687168121338, "global_step": 11826, "epoch": 70} {"train_loss": -6.151651859283447, "global_step": 11827, "epoch": 70} {"train_loss": -6.107266902923584, "global_step": 11828, "epoch": 70} {"train_loss": -6.267518997192383, "global_step": 11829, "epoch": 70} {"train_loss": -6.09816312789917, "global_step": 11830, "epoch": 70} {"train_loss": -5.980312347412109, "global_step": 11831, "epoch": 70} {"train_loss": -6.00118350982666, "global_step": 11832, "epoch": 70} {"train_loss": -6.209250450134277, "global_step": 11833, "epoch": 70} {"train_loss": -6.027808666229248, "global_step": 11834, "epoch": 70} {"train_loss": -6.162318229675293, "global_step": 11835, "epoch": 70} {"train_loss": -6.148687362670898, "global_step": 11836, "epoch": 70} {"train_loss": -6.033378601074219, "global_step": 11837, "epoch": 70} {"train_loss": -5.814825057983398, "global_step": 11838, "epoch": 70} {"train_loss": -5.841643333435059, "global_step": 11839, "epoch": 70} {"train_loss": -5.9126691818237305, "global_step": 11840, "epoch": 70} {"train_loss": -6.008768081665039, "global_step": 11841, "epoch": 70} {"train_loss": -6.105969429016113, "global_step": 11842, "epoch": 70} {"train_loss": -6.158860206604004, "global_step": 11843, "epoch": 70} {"train_loss": -6.100910186767578, "global_step": 11844, "epoch": 70} {"train_loss": -6.0006232261657715, "global_step": 11845, "epoch": 70} {"train_loss": -5.995091915130615, "global_step": 11846, "epoch": 70} {"train_loss": -5.9998016357421875, "global_step": 11847, "epoch": 70} {"train_loss": -6.10745906829834, "global_step": 11848, "epoch": 70} {"train_loss": -6.014523506164551, "global_step": 11849, "epoch": 70} {"train_loss": -5.801520347595215, "global_step": 11850, "epoch": 70} {"train_loss": -6.142531394958496, "global_step": 11851, "epoch": 70} {"train_loss": -6.261148452758789, "global_step": 11852, "epoch": 70} {"train_loss": -5.845859527587891, "global_step": 11853, "epoch": 70} {"train_loss": -6.147601127624512, "global_step": 11854, "epoch": 70} {"train_loss": -6.110446453094482, "global_step": 11855, "epoch": 70} {"train_loss": -5.984536647796631, "global_step": 11856, "epoch": 70} {"train_loss": -6.347529411315918, "global_step": 11857, "epoch": 70} {"train_loss": -6.134329319000244, "global_step": 11858, "epoch": 70} {"train_loss": -6.111011505126953, "global_step": 11859, "epoch": 70} {"train_loss": -5.9081339836120605, "global_step": 11860, "epoch": 70} {"train_loss": -6.224546432495117, "global_step": 11861, "epoch": 70} {"train_loss": -6.117828369140625, "global_step": 11862, "epoch": 70} {"train_loss": -6.031120300292969, "global_step": 11863, "epoch": 70} {"train_loss": -6.166774749755859, "global_step": 11864, "epoch": 70} {"train_loss": -6.015027046203613, "global_step": 11865, "epoch": 70} {"train_loss": -6.227709770202637, "global_step": 11866, "epoch": 70} {"train_loss": -5.713799476623535, "global_step": 11867, "epoch": 70} {"train_loss": -6.134482383728027, "global_step": 11868, "epoch": 70} {"train_loss": -6.034239292144775, "global_step": 11869, "epoch": 70} {"train_loss": -5.963789463043213, "global_step": 11870, "epoch": 70} {"train_loss": -5.959620952606201, "global_step": 11871, "epoch": 70} {"train_loss": -5.92938232421875, "global_step": 11872, "epoch": 70} {"train_loss": -5.86422872543335, "global_step": 11873, "epoch": 70} {"train_loss": -6.0308380126953125, "global_step": 11874, "epoch": 70} {"train_loss": -6.103641033172607, "global_step": 11875, "epoch": 70} {"train_loss": -6.1455888748168945, "global_step": 11876, "epoch": 70} {"train_loss": -5.885837554931641, "global_step": 11877, "epoch": 70} {"train_loss": -6.211104869842529, "global_step": 11878, "epoch": 70} {"train_loss": -6.0321550369262695, "global_step": 11879, "epoch": 70} {"train_loss": -5.994629383087158, "global_step": 11880, "epoch": 70} {"train_loss": -5.996011257171631, "global_step": 11881, "epoch": 70} {"train_loss": -5.902162075042725, "global_step": 11882, "epoch": 70} {"train_loss": -6.028995990753174, "global_step": 11883, "epoch": 70} {"train_loss": -5.826294898986816, "global_step": 11884, "epoch": 70} {"train_loss": -5.7552666664123535, "global_step": 11885, "epoch": 70} {"train_loss": -5.964256286621094, "global_step": 11886, "epoch": 70} {"train_loss": -5.5416460037231445, "global_step": 11887, "epoch": 70} {"train_loss": -6.03466272354126, "global_step": 11888, "epoch": 70} {"train_loss": -5.833512306213379, "global_step": 11889, "epoch": 70} {"train_loss": -6.180722236633301, "global_step": 11890, "epoch": 70} {"train_loss": -5.786776065826416, "global_step": 11891, "epoch": 70} {"train_loss": -5.996606349945068, "global_step": 11892, "epoch": 70} {"train_loss": -6.013409614562988, "global_step": 11893, "epoch": 70} {"train_loss": -6.08740234375, "global_step": 11894, "epoch": 70} {"train_loss": -6.034677982330322, "global_step": 11895, "epoch": 70} {"train_loss": -6.0551042556762695, "global_step": 11896, "epoch": 70} {"train_loss": -5.960753440856934, "global_step": 11897, "epoch": 70} {"train_loss": -5.892234802246094, "global_step": 11898, "epoch": 70} {"train_loss": -6.095522403717041, "global_step": 11899, "epoch": 70} {"train_loss": -6.090635299682617, "global_step": 11900, "epoch": 70} {"train_loss": -5.717004776000977, "global_step": 11901, "epoch": 70} {"train_loss": -6.0964579582214355, "global_step": 11902, "epoch": 70} {"train_loss": -5.728986740112305, "global_step": 11903, "epoch": 70} {"train_loss": -5.9227213859558105, "global_step": 11904, "epoch": 70} {"train_loss": -5.899762153625488, "global_step": 11905, "epoch": 70} {"train_loss": -6.051052570343018, "global_step": 11906, "epoch": 70} {"train_loss": -6.144869804382324, "global_step": 11907, "epoch": 70} {"train_loss": -5.946910858154297, "global_step": 11908, "epoch": 70} {"train_loss": -6.048422813415527, "global_step": 11909, "epoch": 70} {"train_loss": -5.941020965576172, "global_step": 11910, "epoch": 70} {"train_loss": -6.039254188537598, "global_step": 11911, "epoch": 70} {"train_loss": -6.089138031005859, "global_step": 11912, "epoch": 70} {"train_loss": -5.864825248718262, "global_step": 11913, "epoch": 70} {"train_loss": -6.155521392822266, "global_step": 11914, "epoch": 70} {"train_loss": -6.328154563903809, "global_step": 11915, "epoch": 70} {"train_loss": -5.76605749130249, "global_step": 11916, "epoch": 70} {"train_loss": -6.0984392166137695, "global_step": 11917, "epoch": 70} {"train_loss": -5.898510456085205, "global_step": 11918, "epoch": 70} {"train_loss": -6.118361473083496, "global_step": 11919, "epoch": 70} {"train_loss": -5.984294891357422, "global_step": 11920, "epoch": 70} {"train_loss": -5.771259307861328, "global_step": 11921, "epoch": 70} {"train_loss": -5.971431732177734, "global_step": 11922, "epoch": 70} {"train_loss": -6.018932342529297, "global_step": 11923, "epoch": 70} {"train_loss": -5.6221923828125, "global_step": 11924, "epoch": 70} {"train_loss": -6.189704418182373, "global_step": 11925, "epoch": 70} {"train_loss": -5.5925517082214355, "global_step": 11926, "epoch": 70} {"train_loss": -6.0100513100624084, "global_step": 11927, "epoch": 70, "val_loss": 266234.4375, "train_action_mse_error": 40.269859313964844} {"train_loss": -5.956801891326904, "global_step": 11928, "epoch": 71} {"train_loss": -5.87808895111084, "global_step": 11929, "epoch": 71} {"train_loss": -5.983962059020996, "global_step": 11930, "epoch": 71} {"train_loss": -5.573912620544434, "global_step": 11931, "epoch": 71} {"train_loss": -5.914754867553711, "global_step": 11932, "epoch": 71} {"train_loss": -5.920225143432617, "global_step": 11933, "epoch": 71} {"train_loss": -5.914117813110352, "global_step": 11934, "epoch": 71} {"train_loss": -5.924461841583252, "global_step": 11935, "epoch": 71} {"train_loss": -5.880335330963135, "global_step": 11936, "epoch": 71} {"train_loss": -6.047386169433594, "global_step": 11937, "epoch": 71} {"train_loss": -5.882986068725586, "global_step": 11938, "epoch": 71} {"train_loss": -5.524660110473633, "global_step": 11939, "epoch": 71} {"train_loss": -6.060144424438477, "global_step": 11940, "epoch": 71} {"train_loss": -5.893551826477051, "global_step": 11941, "epoch": 71} {"train_loss": -5.800951957702637, "global_step": 11942, "epoch": 71} {"train_loss": -6.101373672485352, "global_step": 11943, "epoch": 71} {"train_loss": -5.676407814025879, "global_step": 11944, "epoch": 71} {"train_loss": -6.104073524475098, "global_step": 11945, "epoch": 71} {"train_loss": -5.9471635818481445, "global_step": 11946, "epoch": 71} {"train_loss": -5.692961692810059, "global_step": 11947, "epoch": 71} {"train_loss": -5.790369033813477, "global_step": 11948, "epoch": 71} {"train_loss": -6.073097229003906, "global_step": 11949, "epoch": 71} {"train_loss": -6.00625467300415, "global_step": 11950, "epoch": 71} {"train_loss": -5.887920379638672, "global_step": 11951, "epoch": 71} {"train_loss": -6.015273571014404, "global_step": 11952, "epoch": 71} {"train_loss": -5.858086585998535, "global_step": 11953, "epoch": 71} {"train_loss": -5.8266448974609375, "global_step": 11954, "epoch": 71} {"train_loss": -6.014028549194336, "global_step": 11955, "epoch": 71} {"train_loss": -5.880853652954102, "global_step": 11956, "epoch": 71} {"train_loss": -6.078489780426025, "global_step": 11957, "epoch": 71} {"train_loss": -6.0141921043396, "global_step": 11958, "epoch": 71} {"train_loss": -6.209148406982422, "global_step": 11959, "epoch": 71} {"train_loss": -5.8081889152526855, "global_step": 11960, "epoch": 71} {"train_loss": -6.238515377044678, "global_step": 11961, "epoch": 71} {"train_loss": -6.168457984924316, "global_step": 11962, "epoch": 71} {"train_loss": -5.8913445472717285, "global_step": 11963, "epoch": 71} {"train_loss": -6.0376152992248535, "global_step": 11964, "epoch": 71} {"train_loss": -6.122694969177246, "global_step": 11965, "epoch": 71} {"train_loss": -5.974358558654785, "global_step": 11966, "epoch": 71} {"train_loss": -6.000880718231201, "global_step": 11967, "epoch": 71} {"train_loss": -6.053035736083984, "global_step": 11968, "epoch": 71} {"train_loss": -5.8426618576049805, "global_step": 11969, "epoch": 71} {"train_loss": -5.818042278289795, "global_step": 11970, "epoch": 71} {"train_loss": -5.716326713562012, "global_step": 11971, "epoch": 71} {"train_loss": -6.178623199462891, "global_step": 11972, "epoch": 71} {"train_loss": -5.994080543518066, "global_step": 11973, "epoch": 71} {"train_loss": -5.959214210510254, "global_step": 11974, "epoch": 71} {"train_loss": -5.951997756958008, "global_step": 11975, "epoch": 71} {"train_loss": -5.990079402923584, "global_step": 11976, "epoch": 71} {"train_loss": -5.8324689865112305, "global_step": 11977, "epoch": 71} {"train_loss": -5.9786882400512695, "global_step": 11978, "epoch": 71} {"train_loss": -5.924757480621338, "global_step": 11979, "epoch": 71} {"train_loss": -6.059360980987549, "global_step": 11980, "epoch": 71} {"train_loss": -5.656940460205078, "global_step": 11981, "epoch": 71} {"train_loss": -6.194037437438965, "global_step": 11982, "epoch": 71} {"train_loss": -5.9001898765563965, "global_step": 11983, "epoch": 71} {"train_loss": -5.929598808288574, "global_step": 11984, "epoch": 71} {"train_loss": -5.981719970703125, "global_step": 11985, "epoch": 71} {"train_loss": -6.173171043395996, "global_step": 11986, "epoch": 71} {"train_loss": -5.932605266571045, "global_step": 11987, "epoch": 71} {"train_loss": -6.213833808898926, "global_step": 11988, "epoch": 71} {"train_loss": -6.042492389678955, "global_step": 11989, "epoch": 71} {"train_loss": -6.183933258056641, "global_step": 11990, "epoch": 71} {"train_loss": -6.076113700866699, "global_step": 11991, "epoch": 71} {"train_loss": -6.214933395385742, "global_step": 11992, "epoch": 71} {"train_loss": -6.170976638793945, "global_step": 11993, "epoch": 71} {"train_loss": -5.967594146728516, "global_step": 11994, "epoch": 71} {"train_loss": -6.358867645263672, "global_step": 11995, "epoch": 71} {"train_loss": -5.946664333343506, "global_step": 11996, "epoch": 71} {"train_loss": -6.214071273803711, "global_step": 11997, "epoch": 71} {"train_loss": -6.163954734802246, "global_step": 11998, "epoch": 71} {"train_loss": -6.179801940917969, "global_step": 11999, "epoch": 71} {"train_loss": -6.477004051208496, "global_step": 12000, "epoch": 71} {"train_loss": -6.327113151550293, "global_step": 12001, "epoch": 71} {"train_loss": -6.112488746643066, "global_step": 12002, "epoch": 71} {"train_loss": -6.01846981048584, "global_step": 12003, "epoch": 71} {"train_loss": -6.265316009521484, "global_step": 12004, "epoch": 71} {"train_loss": -5.754732131958008, "global_step": 12005, "epoch": 71} {"train_loss": -5.909768104553223, "global_step": 12006, "epoch": 71} {"train_loss": -5.934712886810303, "global_step": 12007, "epoch": 71} {"train_loss": -6.157840251922607, "global_step": 12008, "epoch": 71} {"train_loss": -5.7913289070129395, "global_step": 12009, "epoch": 71} {"train_loss": -5.81303596496582, "global_step": 12010, "epoch": 71} {"train_loss": -6.031256675720215, "global_step": 12011, "epoch": 71} {"train_loss": -5.904145240783691, "global_step": 12012, "epoch": 71} {"train_loss": -6.019894599914551, "global_step": 12013, "epoch": 71} {"train_loss": -5.951489448547363, "global_step": 12014, "epoch": 71} {"train_loss": -6.020936965942383, "global_step": 12015, "epoch": 71} {"train_loss": -6.062535285949707, "global_step": 12016, "epoch": 71} {"train_loss": -5.739486217498779, "global_step": 12017, "epoch": 71} {"train_loss": -5.976067543029785, "global_step": 12018, "epoch": 71} {"train_loss": -6.20489501953125, "global_step": 12019, "epoch": 71} {"train_loss": -6.255647659301758, "global_step": 12020, "epoch": 71} {"train_loss": -6.032907485961914, "global_step": 12021, "epoch": 71} {"train_loss": -5.882630348205566, "global_step": 12022, "epoch": 71} {"train_loss": -5.8820319175720215, "global_step": 12023, "epoch": 71} {"train_loss": -6.121450901031494, "global_step": 12024, "epoch": 71} {"train_loss": -5.859486103057861, "global_step": 12025, "epoch": 71} {"train_loss": -6.090492248535156, "global_step": 12026, "epoch": 71} {"train_loss": -5.797245979309082, "global_step": 12027, "epoch": 71} {"train_loss": -6.252072334289551, "global_step": 12028, "epoch": 71} {"train_loss": -5.856389045715332, "global_step": 12029, "epoch": 71} {"train_loss": -6.222405433654785, "global_step": 12030, "epoch": 71} {"train_loss": -6.073236465454102, "global_step": 12031, "epoch": 71} {"train_loss": -6.058552265167236, "global_step": 12032, "epoch": 71} {"train_loss": -5.85896110534668, "global_step": 12033, "epoch": 71} {"train_loss": -5.819016456604004, "global_step": 12034, "epoch": 71} {"train_loss": -6.038510322570801, "global_step": 12035, "epoch": 71} {"train_loss": -6.009920597076416, "global_step": 12036, "epoch": 71} {"train_loss": -6.131715297698975, "global_step": 12037, "epoch": 71} {"train_loss": -5.9429707527160645, "global_step": 12038, "epoch": 71} {"train_loss": -6.130740642547607, "global_step": 12039, "epoch": 71} {"train_loss": -6.0440216064453125, "global_step": 12040, "epoch": 71} {"train_loss": -6.135525226593018, "global_step": 12041, "epoch": 71} {"train_loss": -6.112009048461914, "global_step": 12042, "epoch": 71} {"train_loss": -6.088871955871582, "global_step": 12043, "epoch": 71} {"train_loss": -5.698422431945801, "global_step": 12044, "epoch": 71} {"train_loss": -6.003056526184082, "global_step": 12045, "epoch": 71} {"train_loss": -5.787906646728516, "global_step": 12046, "epoch": 71} {"train_loss": -6.026239395141602, "global_step": 12047, "epoch": 71} {"train_loss": -6.086835861206055, "global_step": 12048, "epoch": 71} {"train_loss": -6.153430938720703, "global_step": 12049, "epoch": 71} {"train_loss": -5.886448860168457, "global_step": 12050, "epoch": 71} {"train_loss": -6.184229373931885, "global_step": 12051, "epoch": 71} {"train_loss": -5.957696914672852, "global_step": 12052, "epoch": 71} {"train_loss": -5.992364883422852, "global_step": 12053, "epoch": 71} {"train_loss": -6.179098129272461, "global_step": 12054, "epoch": 71} {"train_loss": -6.171731472015381, "global_step": 12055, "epoch": 71} {"train_loss": -5.924386978149414, "global_step": 12056, "epoch": 71} {"train_loss": -5.7640380859375, "global_step": 12057, "epoch": 71} {"train_loss": -6.0110578536987305, "global_step": 12058, "epoch": 71} {"train_loss": -5.893957138061523, "global_step": 12059, "epoch": 71} {"train_loss": -5.835790634155273, "global_step": 12060, "epoch": 71} {"train_loss": -6.008425235748291, "global_step": 12061, "epoch": 71} {"train_loss": -6.1782612800598145, "global_step": 12062, "epoch": 71} {"train_loss": -6.075481414794922, "global_step": 12063, "epoch": 71} {"train_loss": -6.158356666564941, "global_step": 12064, "epoch": 71} {"train_loss": -6.138334274291992, "global_step": 12065, "epoch": 71} {"train_loss": -6.083456993103027, "global_step": 12066, "epoch": 71} {"train_loss": -6.2170820236206055, "global_step": 12067, "epoch": 71} {"train_loss": -5.9895100593566895, "global_step": 12068, "epoch": 71} {"train_loss": -6.222206115722656, "global_step": 12069, "epoch": 71} {"train_loss": -6.01613712310791, "global_step": 12070, "epoch": 71} {"train_loss": -6.122037887573242, "global_step": 12071, "epoch": 71} {"train_loss": -6.072845935821533, "global_step": 12072, "epoch": 71} {"train_loss": -6.3925251960754395, "global_step": 12073, "epoch": 71} {"train_loss": -6.026975154876709, "global_step": 12074, "epoch": 71} {"train_loss": -6.115810871124268, "global_step": 12075, "epoch": 71} {"train_loss": -6.293123245239258, "global_step": 12076, "epoch": 71} {"train_loss": -6.0283589363098145, "global_step": 12077, "epoch": 71} {"train_loss": -6.227272987365723, "global_step": 12078, "epoch": 71} {"train_loss": -5.9994425773620605, "global_step": 12079, "epoch": 71} {"train_loss": -6.019168853759766, "global_step": 12080, "epoch": 71} {"train_loss": -6.041110515594482, "global_step": 12081, "epoch": 71} {"train_loss": -6.115297317504883, "global_step": 12082, "epoch": 71} {"train_loss": -6.083492279052734, "global_step": 12083, "epoch": 71} {"train_loss": -6.316359996795654, "global_step": 12084, "epoch": 71} {"train_loss": -5.87965726852417, "global_step": 12085, "epoch": 71} {"train_loss": -5.907422065734863, "global_step": 12086, "epoch": 71} {"train_loss": -5.983340263366699, "global_step": 12087, "epoch": 71} {"train_loss": -6.09389066696167, "global_step": 12088, "epoch": 71} {"train_loss": -5.869913101196289, "global_step": 12089, "epoch": 71} {"train_loss": -5.832060813903809, "global_step": 12090, "epoch": 71} {"train_loss": -6.214697360992432, "global_step": 12091, "epoch": 71} {"train_loss": -6.068477153778076, "global_step": 12092, "epoch": 71} {"train_loss": -5.569108009338379, "global_step": 12093, "epoch": 71} {"train_loss": -6.027182579040527, "global_step": 12094, "epoch": 71} {"train_loss": -6.0083930889765425, "global_step": 12095, "epoch": 71, "val_loss": 271303.28125} {"train_loss": -5.831231117248535, "global_step": 12096, "epoch": 72} {"train_loss": -5.876125335693359, "global_step": 12097, "epoch": 72} {"train_loss": -6.283267974853516, "global_step": 12098, "epoch": 72} {"train_loss": -5.821504592895508, "global_step": 12099, "epoch": 72} {"train_loss": -5.854663848876953, "global_step": 12100, "epoch": 72} {"train_loss": -5.902235507965088, "global_step": 12101, "epoch": 72} {"train_loss": -6.158848762512207, "global_step": 12102, "epoch": 72} {"train_loss": -5.869001388549805, "global_step": 12103, "epoch": 72} {"train_loss": -5.992138862609863, "global_step": 12104, "epoch": 72} {"train_loss": -5.931044101715088, "global_step": 12105, "epoch": 72} {"train_loss": -5.969869613647461, "global_step": 12106, "epoch": 72} {"train_loss": -5.977443218231201, "global_step": 12107, "epoch": 72} {"train_loss": -6.2236480712890625, "global_step": 12108, "epoch": 72} {"train_loss": -6.04006814956665, "global_step": 12109, "epoch": 72} {"train_loss": -6.049621105194092, "global_step": 12110, "epoch": 72} {"train_loss": -6.169034957885742, "global_step": 12111, "epoch": 72} {"train_loss": -6.238510608673096, "global_step": 12112, "epoch": 72} {"train_loss": -5.747170448303223, "global_step": 12113, "epoch": 72} {"train_loss": -6.00972843170166, "global_step": 12114, "epoch": 72} {"train_loss": -5.9796142578125, "global_step": 12115, "epoch": 72} {"train_loss": -6.213799476623535, "global_step": 12116, "epoch": 72} {"train_loss": -5.929983139038086, "global_step": 12117, "epoch": 72} {"train_loss": -6.1723222732543945, "global_step": 12118, "epoch": 72} {"train_loss": -6.041955947875977, "global_step": 12119, "epoch": 72} {"train_loss": -6.024396896362305, "global_step": 12120, "epoch": 72} {"train_loss": -6.13329553604126, "global_step": 12121, "epoch": 72} {"train_loss": -6.061205863952637, "global_step": 12122, "epoch": 72} {"train_loss": -5.9672393798828125, "global_step": 12123, "epoch": 72} {"train_loss": -5.97250509262085, "global_step": 12124, "epoch": 72} {"train_loss": -6.06347131729126, "global_step": 12125, "epoch": 72} {"train_loss": -6.276547431945801, "global_step": 12126, "epoch": 72} {"train_loss": -5.920522689819336, "global_step": 12127, "epoch": 72} {"train_loss": -5.958248615264893, "global_step": 12128, "epoch": 72} {"train_loss": -6.108182907104492, "global_step": 12129, "epoch": 72} {"train_loss": -5.999102592468262, "global_step": 12130, "epoch": 72} {"train_loss": -6.006634712219238, "global_step": 12131, "epoch": 72} {"train_loss": -5.932746887207031, "global_step": 12132, "epoch": 72} {"train_loss": -6.025470733642578, "global_step": 12133, "epoch": 72} {"train_loss": -6.125246047973633, "global_step": 12134, "epoch": 72} {"train_loss": -5.913393974304199, "global_step": 12135, "epoch": 72} {"train_loss": -6.092275619506836, "global_step": 12136, "epoch": 72} {"train_loss": -5.81163215637207, "global_step": 12137, "epoch": 72} {"train_loss": -6.21981954574585, "global_step": 12138, "epoch": 72} {"train_loss": -6.166542053222656, "global_step": 12139, "epoch": 72} {"train_loss": -6.087522983551025, "global_step": 12140, "epoch": 72} {"train_loss": -5.887214660644531, "global_step": 12141, "epoch": 72} {"train_loss": -6.010110378265381, "global_step": 12142, "epoch": 72} {"train_loss": -6.280673027038574, "global_step": 12143, "epoch": 72} {"train_loss": -5.914350509643555, "global_step": 12144, "epoch": 72} {"train_loss": -6.040475845336914, "global_step": 12145, "epoch": 72} {"train_loss": -5.8642897605896, "global_step": 12146, "epoch": 72} {"train_loss": -6.264890193939209, "global_step": 12147, "epoch": 72} {"train_loss": -6.135560035705566, "global_step": 12148, "epoch": 72} {"train_loss": -6.131602764129639, "global_step": 12149, "epoch": 72} {"train_loss": -6.200930595397949, "global_step": 12150, "epoch": 72} {"train_loss": -6.19644832611084, "global_step": 12151, "epoch": 72} {"train_loss": -6.20943021774292, "global_step": 12152, "epoch": 72} {"train_loss": -6.007271766662598, "global_step": 12153, "epoch": 72} {"train_loss": -6.225282669067383, "global_step": 12154, "epoch": 72} {"train_loss": -6.066153049468994, "global_step": 12155, "epoch": 72} {"train_loss": -5.96395206451416, "global_step": 12156, "epoch": 72} {"train_loss": -6.020757675170898, "global_step": 12157, "epoch": 72} {"train_loss": -6.1371002197265625, "global_step": 12158, "epoch": 72} {"train_loss": -6.1266679763793945, "global_step": 12159, "epoch": 72} {"train_loss": -5.90726900100708, "global_step": 12160, "epoch": 72} {"train_loss": -6.006202220916748, "global_step": 12161, "epoch": 72} {"train_loss": -6.042880058288574, "global_step": 12162, "epoch": 72} {"train_loss": -5.852709770202637, "global_step": 12163, "epoch": 72} {"train_loss": -6.104962348937988, "global_step": 12164, "epoch": 72} {"train_loss": -5.9912543296813965, "global_step": 12165, "epoch": 72} {"train_loss": -5.914050102233887, "global_step": 12166, "epoch": 72} {"train_loss": -6.190186023712158, "global_step": 12167, "epoch": 72} {"train_loss": -6.091840744018555, "global_step": 12168, "epoch": 72} {"train_loss": -5.982027053833008, "global_step": 12169, "epoch": 72} {"train_loss": -6.014185905456543, "global_step": 12170, "epoch": 72} {"train_loss": -6.058493614196777, "global_step": 12171, "epoch": 72} {"train_loss": -6.1683759689331055, "global_step": 12172, "epoch": 72} {"train_loss": -6.268684387207031, "global_step": 12173, "epoch": 72} {"train_loss": -6.221715927124023, "global_step": 12174, "epoch": 72} {"train_loss": -5.721230506896973, "global_step": 12175, "epoch": 72} {"train_loss": -5.856637001037598, "global_step": 12176, "epoch": 72} {"train_loss": -6.040099143981934, "global_step": 12177, "epoch": 72} {"train_loss": -6.039565086364746, "global_step": 12178, "epoch": 72} {"train_loss": -6.088006973266602, "global_step": 12179, "epoch": 72} {"train_loss": -5.9560980796813965, "global_step": 12180, "epoch": 72} {"train_loss": -5.555530548095703, "global_step": 12181, "epoch": 72} {"train_loss": -6.0136566162109375, "global_step": 12182, "epoch": 72} {"train_loss": -5.9359893798828125, "global_step": 12183, "epoch": 72} {"train_loss": -6.294883728027344, "global_step": 12184, "epoch": 72} {"train_loss": -6.142926216125488, "global_step": 12185, "epoch": 72} {"train_loss": -6.176555633544922, "global_step": 12186, "epoch": 72} {"train_loss": -5.972631454467773, "global_step": 12187, "epoch": 72} {"train_loss": -6.016618728637695, "global_step": 12188, "epoch": 72} {"train_loss": -6.260770320892334, "global_step": 12189, "epoch": 72} {"train_loss": -6.142376899719238, "global_step": 12190, "epoch": 72} {"train_loss": -6.267573356628418, "global_step": 12191, "epoch": 72} {"train_loss": -6.450824737548828, "global_step": 12192, "epoch": 72} {"train_loss": -6.134744167327881, "global_step": 12193, "epoch": 72} {"train_loss": -6.2819695472717285, "global_step": 12194, "epoch": 72} {"train_loss": -6.057524681091309, "global_step": 12195, "epoch": 72} {"train_loss": -6.049152851104736, "global_step": 12196, "epoch": 72} {"train_loss": -6.086270332336426, "global_step": 12197, "epoch": 72} {"train_loss": -6.105670928955078, "global_step": 12198, "epoch": 72} {"train_loss": -5.90403413772583, "global_step": 12199, "epoch": 72} {"train_loss": -6.2440643310546875, "global_step": 12200, "epoch": 72} {"train_loss": -5.622795104980469, "global_step": 12201, "epoch": 72} {"train_loss": -5.98509407043457, "global_step": 12202, "epoch": 72} {"train_loss": -5.8785400390625, "global_step": 12203, "epoch": 72} {"train_loss": -6.203221321105957, "global_step": 12204, "epoch": 72} {"train_loss": -6.140514850616455, "global_step": 12205, "epoch": 72} {"train_loss": -6.078954696655273, "global_step": 12206, "epoch": 72} {"train_loss": -6.0577392578125, "global_step": 12207, "epoch": 72} {"train_loss": -6.00257682800293, "global_step": 12208, "epoch": 72} {"train_loss": -6.261388778686523, "global_step": 12209, "epoch": 72} {"train_loss": -6.058231353759766, "global_step": 12210, "epoch": 72} {"train_loss": -6.0674848556518555, "global_step": 12211, "epoch": 72} {"train_loss": -5.9135637283325195, "global_step": 12212, "epoch": 72} {"train_loss": -6.150256633758545, "global_step": 12213, "epoch": 72} {"train_loss": -5.996361255645752, "global_step": 12214, "epoch": 72} {"train_loss": -6.150311470031738, "global_step": 12215, "epoch": 72} {"train_loss": -6.060293674468994, "global_step": 12216, "epoch": 72} {"train_loss": -5.904745101928711, "global_step": 12217, "epoch": 72} {"train_loss": -6.289818286895752, "global_step": 12218, "epoch": 72} {"train_loss": -5.709491729736328, "global_step": 12219, "epoch": 72} {"train_loss": -6.256825923919678, "global_step": 12220, "epoch": 72} {"train_loss": -6.043383598327637, "global_step": 12221, "epoch": 72} {"train_loss": -6.119162082672119, "global_step": 12222, "epoch": 72} {"train_loss": -6.111282825469971, "global_step": 12223, "epoch": 72} {"train_loss": -5.948817253112793, "global_step": 12224, "epoch": 72} {"train_loss": -6.005244255065918, "global_step": 12225, "epoch": 72} {"train_loss": -6.004972457885742, "global_step": 12226, "epoch": 72} {"train_loss": -6.390412330627441, "global_step": 12227, "epoch": 72} {"train_loss": -5.991987228393555, "global_step": 12228, "epoch": 72} {"train_loss": -6.229026794433594, "global_step": 12229, "epoch": 72} {"train_loss": -5.96975040435791, "global_step": 12230, "epoch": 72} {"train_loss": -6.273077964782715, "global_step": 12231, "epoch": 72} {"train_loss": -6.075018405914307, "global_step": 12232, "epoch": 72} {"train_loss": -5.91110897064209, "global_step": 12233, "epoch": 72} {"train_loss": -5.7970051765441895, "global_step": 12234, "epoch": 72} {"train_loss": -6.197077751159668, "global_step": 12235, "epoch": 72} {"train_loss": -6.151103973388672, "global_step": 12236, "epoch": 72} {"train_loss": -6.14694881439209, "global_step": 12237, "epoch": 72} {"train_loss": -5.869965553283691, "global_step": 12238, "epoch": 72} {"train_loss": -6.063632488250732, "global_step": 12239, "epoch": 72} {"train_loss": -5.888421535491943, "global_step": 12240, "epoch": 72} {"train_loss": -6.031038761138916, "global_step": 12241, "epoch": 72} {"train_loss": -5.781649589538574, "global_step": 12242, "epoch": 72} {"train_loss": -6.05153751373291, "global_step": 12243, "epoch": 72} {"train_loss": -6.093425750732422, "global_step": 12244, "epoch": 72} {"train_loss": -5.809262275695801, "global_step": 12245, "epoch": 72} {"train_loss": -5.8566789627075195, "global_step": 12246, "epoch": 72} {"train_loss": -6.169053077697754, "global_step": 12247, "epoch": 72} {"train_loss": -6.276422023773193, "global_step": 12248, "epoch": 72} {"train_loss": -6.091960906982422, "global_step": 12249, "epoch": 72} {"train_loss": -6.011470794677734, "global_step": 12250, "epoch": 72} {"train_loss": -5.827626705169678, "global_step": 12251, "epoch": 72} {"train_loss": -6.048279762268066, "global_step": 12252, "epoch": 72} {"train_loss": -6.2790937423706055, "global_step": 12253, "epoch": 72} {"train_loss": -6.203907012939453, "global_step": 12254, "epoch": 72} {"train_loss": -5.910248756408691, "global_step": 12255, "epoch": 72} {"train_loss": -6.159902572631836, "global_step": 12256, "epoch": 72} {"train_loss": -6.11265230178833, "global_step": 12257, "epoch": 72} {"train_loss": -5.838299751281738, "global_step": 12258, "epoch": 72} {"train_loss": -6.0174055099487305, "global_step": 12259, "epoch": 72} {"train_loss": -5.961697578430176, "global_step": 12260, "epoch": 72} {"train_loss": -6.11199951171875, "global_step": 12261, "epoch": 72} {"train_loss": -6.226509094238281, "global_step": 12262, "epoch": 72} {"train_loss": -6.049155521960485, "global_step": 12263, "epoch": 72, "val_loss": 255977.859375} {"train_loss": -6.086194038391113, "global_step": 12264, "epoch": 73} {"train_loss": -5.945298194885254, "global_step": 12265, "epoch": 73} {"train_loss": -6.126404762268066, "global_step": 12266, "epoch": 73} {"train_loss": -6.013983249664307, "global_step": 12267, "epoch": 73} {"train_loss": -6.153151988983154, "global_step": 12268, "epoch": 73} {"train_loss": -6.094531059265137, "global_step": 12269, "epoch": 73} {"train_loss": -6.302168369293213, "global_step": 12270, "epoch": 73} {"train_loss": -5.907659530639648, "global_step": 12271, "epoch": 73} {"train_loss": -5.980461120605469, "global_step": 12272, "epoch": 73} {"train_loss": -6.211301803588867, "global_step": 12273, "epoch": 73} {"train_loss": -5.916116237640381, "global_step": 12274, "epoch": 73} {"train_loss": -6.419950008392334, "global_step": 12275, "epoch": 73} {"train_loss": -5.966048240661621, "global_step": 12276, "epoch": 73} {"train_loss": -6.329943656921387, "global_step": 12277, "epoch": 73} {"train_loss": -5.906655788421631, "global_step": 12278, "epoch": 73} {"train_loss": -6.166428565979004, "global_step": 12279, "epoch": 73} {"train_loss": -6.146056652069092, "global_step": 12280, "epoch": 73} {"train_loss": -6.040168762207031, "global_step": 12281, "epoch": 73} {"train_loss": -6.205685615539551, "global_step": 12282, "epoch": 73} {"train_loss": -6.025986671447754, "global_step": 12283, "epoch": 73} {"train_loss": -6.184584617614746, "global_step": 12284, "epoch": 73} {"train_loss": -6.306997299194336, "global_step": 12285, "epoch": 73} {"train_loss": -6.245869159698486, "global_step": 12286, "epoch": 73} {"train_loss": -6.101351737976074, "global_step": 12287, "epoch": 73} {"train_loss": -6.212282180786133, "global_step": 12288, "epoch": 73} {"train_loss": -6.452500343322754, "global_step": 12289, "epoch": 73} {"train_loss": -6.343405246734619, "global_step": 12290, "epoch": 73} {"train_loss": -6.329807281494141, "global_step": 12291, "epoch": 73} {"train_loss": -5.9706196784973145, "global_step": 12292, "epoch": 73} {"train_loss": -6.034249305725098, "global_step": 12293, "epoch": 73} {"train_loss": -6.335300445556641, "global_step": 12294, "epoch": 73} {"train_loss": -6.074132442474365, "global_step": 12295, "epoch": 73} {"train_loss": -5.947099685668945, "global_step": 12296, "epoch": 73} {"train_loss": -6.384936332702637, "global_step": 12297, "epoch": 73} {"train_loss": -6.066392421722412, "global_step": 12298, "epoch": 73} {"train_loss": -6.33124303817749, "global_step": 12299, "epoch": 73} {"train_loss": -6.3513407707214355, "global_step": 12300, "epoch": 73} {"train_loss": -6.204777240753174, "global_step": 12301, "epoch": 73} {"train_loss": -5.856705665588379, "global_step": 12302, "epoch": 73} {"train_loss": -6.148187637329102, "global_step": 12303, "epoch": 73} {"train_loss": -6.014407634735107, "global_step": 12304, "epoch": 73} {"train_loss": -5.766475677490234, "global_step": 12305, "epoch": 73} {"train_loss": -6.160489559173584, "global_step": 12306, "epoch": 73} {"train_loss": -5.8550004959106445, "global_step": 12307, "epoch": 73} {"train_loss": -5.9871907234191895, "global_step": 12308, "epoch": 73} {"train_loss": -5.8940839767456055, "global_step": 12309, "epoch": 73} {"train_loss": -5.942591190338135, "global_step": 12310, "epoch": 73} {"train_loss": -5.813682556152344, "global_step": 12311, "epoch": 73} {"train_loss": -6.00462532043457, "global_step": 12312, "epoch": 73} {"train_loss": -6.102749824523926, "global_step": 12313, "epoch": 73} {"train_loss": -6.01852560043335, "global_step": 12314, "epoch": 73} {"train_loss": -5.8553009033203125, "global_step": 12315, "epoch": 73} {"train_loss": -6.1087141036987305, "global_step": 12316, "epoch": 73} {"train_loss": -6.00277042388916, "global_step": 12317, "epoch": 73} {"train_loss": -6.299691200256348, "global_step": 12318, "epoch": 73} {"train_loss": -5.8373212814331055, "global_step": 12319, "epoch": 73} {"train_loss": -6.064626693725586, "global_step": 12320, "epoch": 73} {"train_loss": -5.987438201904297, "global_step": 12321, "epoch": 73} {"train_loss": -6.0236406326293945, "global_step": 12322, "epoch": 73} {"train_loss": -6.083952903747559, "global_step": 12323, "epoch": 73} {"train_loss": -5.983660697937012, "global_step": 12324, "epoch": 73} {"train_loss": -5.858067989349365, "global_step": 12325, "epoch": 73} {"train_loss": -5.942978858947754, "global_step": 12326, "epoch": 73} {"train_loss": -6.247374534606934, "global_step": 12327, "epoch": 73} {"train_loss": -5.899703502655029, "global_step": 12328, "epoch": 73} {"train_loss": -5.979267597198486, "global_step": 12329, "epoch": 73} {"train_loss": -6.058727264404297, "global_step": 12330, "epoch": 73} {"train_loss": -6.187290191650391, "global_step": 12331, "epoch": 73} {"train_loss": -6.305569648742676, "global_step": 12332, "epoch": 73} {"train_loss": -5.991513252258301, "global_step": 12333, "epoch": 73} {"train_loss": -6.253749370574951, "global_step": 12334, "epoch": 73} {"train_loss": -6.126617431640625, "global_step": 12335, "epoch": 73} {"train_loss": -6.182314872741699, "global_step": 12336, "epoch": 73} {"train_loss": -5.900326728820801, "global_step": 12337, "epoch": 73} {"train_loss": -6.283759593963623, "global_step": 12338, "epoch": 73} {"train_loss": -5.963604927062988, "global_step": 12339, "epoch": 73} {"train_loss": -6.247187614440918, "global_step": 12340, "epoch": 73} {"train_loss": -6.274713516235352, "global_step": 12341, "epoch": 73} {"train_loss": -6.166643142700195, "global_step": 12342, "epoch": 73} {"train_loss": -6.20050573348999, "global_step": 12343, "epoch": 73} {"train_loss": -6.441190719604492, "global_step": 12344, "epoch": 73} {"train_loss": -6.044164657592773, "global_step": 12345, "epoch": 73} {"train_loss": -6.338860988616943, "global_step": 12346, "epoch": 73} {"train_loss": -5.828563690185547, "global_step": 12347, "epoch": 73} {"train_loss": -6.226227283477783, "global_step": 12348, "epoch": 73} {"train_loss": -5.81720495223999, "global_step": 12349, "epoch": 73} {"train_loss": -6.316267967224121, "global_step": 12350, "epoch": 73} {"train_loss": -6.261418342590332, "global_step": 12351, "epoch": 73} {"train_loss": -6.07879638671875, "global_step": 12352, "epoch": 73} {"train_loss": -5.9827446937561035, "global_step": 12353, "epoch": 73} {"train_loss": -6.221163749694824, "global_step": 12354, "epoch": 73} {"train_loss": -6.208812713623047, "global_step": 12355, "epoch": 73} {"train_loss": -6.037186145782471, "global_step": 12356, "epoch": 73} {"train_loss": -6.189531326293945, "global_step": 12357, "epoch": 73} {"train_loss": -6.271883010864258, "global_step": 12358, "epoch": 73} {"train_loss": -6.376286506652832, "global_step": 12359, "epoch": 73} {"train_loss": -6.0884246826171875, "global_step": 12360, "epoch": 73} {"train_loss": -6.253996849060059, "global_step": 12361, "epoch": 73} {"train_loss": -6.062282562255859, "global_step": 12362, "epoch": 73} {"train_loss": -6.339967727661133, "global_step": 12363, "epoch": 73} {"train_loss": -5.964832305908203, "global_step": 12364, "epoch": 73} {"train_loss": -6.330014705657959, "global_step": 12365, "epoch": 73} {"train_loss": -5.886090278625488, "global_step": 12366, "epoch": 73} {"train_loss": -6.003369331359863, "global_step": 12367, "epoch": 73} {"train_loss": -6.00394344329834, "global_step": 12368, "epoch": 73} {"train_loss": -6.246249198913574, "global_step": 12369, "epoch": 73} {"train_loss": -5.968033313751221, "global_step": 12370, "epoch": 73} {"train_loss": -6.221398830413818, "global_step": 12371, "epoch": 73} {"train_loss": -5.966324806213379, "global_step": 12372, "epoch": 73} {"train_loss": -5.909536838531494, "global_step": 12373, "epoch": 73} {"train_loss": -5.99549674987793, "global_step": 12374, "epoch": 73} {"train_loss": -5.9762773513793945, "global_step": 12375, "epoch": 73} {"train_loss": -5.947948455810547, "global_step": 12376, "epoch": 73} {"train_loss": -6.071896553039551, "global_step": 12377, "epoch": 73} {"train_loss": -5.935491561889648, "global_step": 12378, "epoch": 73} {"train_loss": -5.702956199645996, "global_step": 12379, "epoch": 73} {"train_loss": -6.018423080444336, "global_step": 12380, "epoch": 73} {"train_loss": -5.843435287475586, "global_step": 12381, "epoch": 73} {"train_loss": -5.841464996337891, "global_step": 12382, "epoch": 73} {"train_loss": -6.0250349044799805, "global_step": 12383, "epoch": 73} {"train_loss": -6.134347915649414, "global_step": 12384, "epoch": 73} {"train_loss": -6.0283098220825195, "global_step": 12385, "epoch": 73} {"train_loss": -5.996245384216309, "global_step": 12386, "epoch": 73} {"train_loss": -5.9163713455200195, "global_step": 12387, "epoch": 73} {"train_loss": -5.892919540405273, "global_step": 12388, "epoch": 73} {"train_loss": -5.998434066772461, "global_step": 12389, "epoch": 73} {"train_loss": -5.991932392120361, "global_step": 12390, "epoch": 73} {"train_loss": -5.744955062866211, "global_step": 12391, "epoch": 73} {"train_loss": -6.171436786651611, "global_step": 12392, "epoch": 73} {"train_loss": -6.088566303253174, "global_step": 12393, "epoch": 73} {"train_loss": -5.965807914733887, "global_step": 12394, "epoch": 73} {"train_loss": -5.967153549194336, "global_step": 12395, "epoch": 73} {"train_loss": -5.9710164070129395, "global_step": 12396, "epoch": 73} {"train_loss": -6.285458564758301, "global_step": 12397, "epoch": 73} {"train_loss": -6.061251640319824, "global_step": 12398, "epoch": 73} {"train_loss": -5.955436706542969, "global_step": 12399, "epoch": 73} {"train_loss": -6.168149471282959, "global_step": 12400, "epoch": 73} {"train_loss": -6.248872756958008, "global_step": 12401, "epoch": 73} {"train_loss": -5.957460403442383, "global_step": 12402, "epoch": 73} {"train_loss": -6.071041107177734, "global_step": 12403, "epoch": 73} {"train_loss": -6.17637825012207, "global_step": 12404, "epoch": 73} {"train_loss": -5.956242561340332, "global_step": 12405, "epoch": 73} {"train_loss": -5.98176383972168, "global_step": 12406, "epoch": 73} {"train_loss": -6.137702465057373, "global_step": 12407, "epoch": 73} {"train_loss": -5.790470600128174, "global_step": 12408, "epoch": 73} {"train_loss": -6.014593124389648, "global_step": 12409, "epoch": 73} {"train_loss": -5.912484645843506, "global_step": 12410, "epoch": 73} {"train_loss": -6.283311367034912, "global_step": 12411, "epoch": 73} {"train_loss": -6.046050548553467, "global_step": 12412, "epoch": 73} {"train_loss": -6.252301216125488, "global_step": 12413, "epoch": 73} {"train_loss": -6.146007537841797, "global_step": 12414, "epoch": 73} {"train_loss": -6.241344451904297, "global_step": 12415, "epoch": 73} {"train_loss": -6.077741622924805, "global_step": 12416, "epoch": 73} {"train_loss": -6.305337905883789, "global_step": 12417, "epoch": 73} {"train_loss": -6.356438636779785, "global_step": 12418, "epoch": 73} {"train_loss": -6.268327713012695, "global_step": 12419, "epoch": 73} {"train_loss": -6.1421661376953125, "global_step": 12420, "epoch": 73} {"train_loss": -5.897014617919922, "global_step": 12421, "epoch": 73} {"train_loss": -5.853748321533203, "global_step": 12422, "epoch": 73} {"train_loss": -6.00752067565918, "global_step": 12423, "epoch": 73} {"train_loss": -6.034766674041748, "global_step": 12424, "epoch": 73} {"train_loss": -6.051222801208496, "global_step": 12425, "epoch": 73} {"train_loss": -5.929801940917969, "global_step": 12426, "epoch": 73} {"train_loss": -5.837337493896484, "global_step": 12427, "epoch": 73} {"train_loss": -6.286721706390381, "global_step": 12428, "epoch": 73} {"train_loss": -5.946145534515381, "global_step": 12429, "epoch": 73} {"train_loss": -5.792156219482422, "global_step": 12430, "epoch": 73} {"train_loss": -6.078076297328586, "global_step": 12431, "epoch": 73, "val_loss": 256950.828125} {"train_loss": -5.830734729766846, "global_step": 12432, "epoch": 74} {"train_loss": -6.013399124145508, "global_step": 12433, "epoch": 74} {"train_loss": -5.968359470367432, "global_step": 12434, "epoch": 74} {"train_loss": -6.125908851623535, "global_step": 12435, "epoch": 74} {"train_loss": -6.060554504394531, "global_step": 12436, "epoch": 74} {"train_loss": -6.134369850158691, "global_step": 12437, "epoch": 74} {"train_loss": -6.1142578125, "global_step": 12438, "epoch": 74} {"train_loss": -6.017932891845703, "global_step": 12439, "epoch": 74} {"train_loss": -6.058663368225098, "global_step": 12440, "epoch": 74} {"train_loss": -6.272213459014893, "global_step": 12441, "epoch": 74} {"train_loss": -6.017661094665527, "global_step": 12442, "epoch": 74} {"train_loss": -6.007916450500488, "global_step": 12443, "epoch": 74} {"train_loss": -6.234643936157227, "global_step": 12444, "epoch": 74} {"train_loss": -6.304830551147461, "global_step": 12445, "epoch": 74} {"train_loss": -5.952555179595947, "global_step": 12446, "epoch": 74} {"train_loss": -6.129031181335449, "global_step": 12447, "epoch": 74} {"train_loss": -6.344767093658447, "global_step": 12448, "epoch": 74} {"train_loss": -6.0297932624816895, "global_step": 12449, "epoch": 74} {"train_loss": -6.071957588195801, "global_step": 12450, "epoch": 74} {"train_loss": -6.192929267883301, "global_step": 12451, "epoch": 74} {"train_loss": -5.97679328918457, "global_step": 12452, "epoch": 74} {"train_loss": -6.3024001121521, "global_step": 12453, "epoch": 74} {"train_loss": -6.175047397613525, "global_step": 12454, "epoch": 74} {"train_loss": -5.972064018249512, "global_step": 12455, "epoch": 74} {"train_loss": -6.165114402770996, "global_step": 12456, "epoch": 74} {"train_loss": -6.2561564445495605, "global_step": 12457, "epoch": 74} {"train_loss": -6.303804874420166, "global_step": 12458, "epoch": 74} {"train_loss": -6.3447265625, "global_step": 12459, "epoch": 74} {"train_loss": -6.5220947265625, "global_step": 12460, "epoch": 74} {"train_loss": -6.123722553253174, "global_step": 12461, "epoch": 74} {"train_loss": -6.167862415313721, "global_step": 12462, "epoch": 74} {"train_loss": -5.820505142211914, "global_step": 12463, "epoch": 74} {"train_loss": -6.2386627197265625, "global_step": 12464, "epoch": 74} {"train_loss": -6.10990047454834, "global_step": 12465, "epoch": 74} {"train_loss": -6.339117527008057, "global_step": 12466, "epoch": 74} {"train_loss": -6.18095588684082, "global_step": 12467, "epoch": 74} {"train_loss": -6.449247360229492, "global_step": 12468, "epoch": 74} {"train_loss": -6.265495300292969, "global_step": 12469, "epoch": 74} {"train_loss": -6.460796356201172, "global_step": 12470, "epoch": 74} {"train_loss": -6.074317932128906, "global_step": 12471, "epoch": 74} {"train_loss": -6.224754333496094, "global_step": 12472, "epoch": 74} {"train_loss": -5.778652667999268, "global_step": 12473, "epoch": 74} {"train_loss": -6.298818588256836, "global_step": 12474, "epoch": 74} {"train_loss": -5.949879169464111, "global_step": 12475, "epoch": 74} {"train_loss": -6.158546447753906, "global_step": 12476, "epoch": 74} {"train_loss": -6.183006286621094, "global_step": 12477, "epoch": 74} {"train_loss": -5.850110054016113, "global_step": 12478, "epoch": 74} {"train_loss": -5.836723327636719, "global_step": 12479, "epoch": 74} {"train_loss": -6.003101348876953, "global_step": 12480, "epoch": 74} {"train_loss": -6.147950172424316, "global_step": 12481, "epoch": 74} {"train_loss": -6.034738540649414, "global_step": 12482, "epoch": 74} {"train_loss": -6.171322822570801, "global_step": 12483, "epoch": 74} {"train_loss": -5.927216529846191, "global_step": 12484, "epoch": 74} {"train_loss": -6.085659503936768, "global_step": 12485, "epoch": 74} {"train_loss": -6.022925853729248, "global_step": 12486, "epoch": 74} {"train_loss": -6.232707977294922, "global_step": 12487, "epoch": 74} {"train_loss": -6.16005802154541, "global_step": 12488, "epoch": 74} {"train_loss": -5.987821578979492, "global_step": 12489, "epoch": 74} {"train_loss": -5.791348457336426, "global_step": 12490, "epoch": 74} {"train_loss": -6.046390056610107, "global_step": 12491, "epoch": 74} {"train_loss": -5.956542015075684, "global_step": 12492, "epoch": 74} {"train_loss": -6.002490997314453, "global_step": 12493, "epoch": 74} {"train_loss": -6.1815948486328125, "global_step": 12494, "epoch": 74} {"train_loss": -6.2367262840271, "global_step": 12495, "epoch": 74} {"train_loss": -6.103592872619629, "global_step": 12496, "epoch": 74} {"train_loss": -5.983288764953613, "global_step": 12497, "epoch": 74} {"train_loss": -5.928613662719727, "global_step": 12498, "epoch": 74} {"train_loss": -5.797384262084961, "global_step": 12499, "epoch": 74} {"train_loss": -5.982748031616211, "global_step": 12500, "epoch": 74} {"train_loss": -6.017082214355469, "global_step": 12501, "epoch": 74} {"train_loss": -5.879931449890137, "global_step": 12502, "epoch": 74} {"train_loss": -5.93520450592041, "global_step": 12503, "epoch": 74} {"train_loss": -6.140777587890625, "global_step": 12504, "epoch": 74} {"train_loss": -6.122114181518555, "global_step": 12505, "epoch": 74} {"train_loss": -6.0955610275268555, "global_step": 12506, "epoch": 74} {"train_loss": -6.148926734924316, "global_step": 12507, "epoch": 74} {"train_loss": -5.954936981201172, "global_step": 12508, "epoch": 74} {"train_loss": -5.975987434387207, "global_step": 12509, "epoch": 74} {"train_loss": -5.902342319488525, "global_step": 12510, "epoch": 74} {"train_loss": -6.030395030975342, "global_step": 12511, "epoch": 74} {"train_loss": -6.024682521820068, "global_step": 12512, "epoch": 74} {"train_loss": -6.168495178222656, "global_step": 12513, "epoch": 74} {"train_loss": -6.068397045135498, "global_step": 12514, "epoch": 74} {"train_loss": -6.087502956390381, "global_step": 12515, "epoch": 74} {"train_loss": -6.110079765319824, "global_step": 12516, "epoch": 74} {"train_loss": -6.046687602996826, "global_step": 12517, "epoch": 74} {"train_loss": -6.311405181884766, "global_step": 12518, "epoch": 74} {"train_loss": -6.264482498168945, "global_step": 12519, "epoch": 74} {"train_loss": -6.007925033569336, "global_step": 12520, "epoch": 74} {"train_loss": -6.141228675842285, "global_step": 12521, "epoch": 74} {"train_loss": -5.863067626953125, "global_step": 12522, "epoch": 74} {"train_loss": -6.105274200439453, "global_step": 12523, "epoch": 74} {"train_loss": -6.161197662353516, "global_step": 12524, "epoch": 74} {"train_loss": -5.989996910095215, "global_step": 12525, "epoch": 74} {"train_loss": -6.038604736328125, "global_step": 12526, "epoch": 74} {"train_loss": -6.201236724853516, "global_step": 12527, "epoch": 74} {"train_loss": -6.076160430908203, "global_step": 12528, "epoch": 74} {"train_loss": -6.186037540435791, "global_step": 12529, "epoch": 74} {"train_loss": -6.052716255187988, "global_step": 12530, "epoch": 74} {"train_loss": -6.130916595458984, "global_step": 12531, "epoch": 74} {"train_loss": -6.049981117248535, "global_step": 12532, "epoch": 74} {"train_loss": -5.998190879821777, "global_step": 12533, "epoch": 74} {"train_loss": -6.159937381744385, "global_step": 12534, "epoch": 74} {"train_loss": -6.270876884460449, "global_step": 12535, "epoch": 74} {"train_loss": -5.840277194976807, "global_step": 12536, "epoch": 74} {"train_loss": -6.005539417266846, "global_step": 12537, "epoch": 74} {"train_loss": -5.802453517913818, "global_step": 12538, "epoch": 74} {"train_loss": -6.011307716369629, "global_step": 12539, "epoch": 74} {"train_loss": -6.11332893371582, "global_step": 12540, "epoch": 74} {"train_loss": -5.7448859214782715, "global_step": 12541, "epoch": 74} {"train_loss": -6.091851234436035, "global_step": 12542, "epoch": 74} {"train_loss": -5.932096481323242, "global_step": 12543, "epoch": 74} {"train_loss": -5.9208879470825195, "global_step": 12544, "epoch": 74} {"train_loss": -6.012665748596191, "global_step": 12545, "epoch": 74} {"train_loss": -6.034510612487793, "global_step": 12546, "epoch": 74} {"train_loss": -6.028459548950195, "global_step": 12547, "epoch": 74} {"train_loss": -6.0642547607421875, "global_step": 12548, "epoch": 74} {"train_loss": -6.191197395324707, "global_step": 12549, "epoch": 74} {"train_loss": -6.2100419998168945, "global_step": 12550, "epoch": 74} {"train_loss": -6.167933464050293, "global_step": 12551, "epoch": 74} {"train_loss": -6.014900207519531, "global_step": 12552, "epoch": 74} {"train_loss": -6.1314544677734375, "global_step": 12553, "epoch": 74} {"train_loss": -5.883405685424805, "global_step": 12554, "epoch": 74} {"train_loss": -6.006007194519043, "global_step": 12555, "epoch": 74} {"train_loss": -6.006769180297852, "global_step": 12556, "epoch": 74} {"train_loss": -6.136207103729248, "global_step": 12557, "epoch": 74} {"train_loss": -6.146212577819824, "global_step": 12558, "epoch": 74} {"train_loss": -5.985679626464844, "global_step": 12559, "epoch": 74} {"train_loss": -6.04780387878418, "global_step": 12560, "epoch": 74} {"train_loss": -6.190947532653809, "global_step": 12561, "epoch": 74} {"train_loss": -6.088515281677246, "global_step": 12562, "epoch": 74} {"train_loss": -6.247020721435547, "global_step": 12563, "epoch": 74} {"train_loss": -5.836908340454102, "global_step": 12564, "epoch": 74} {"train_loss": -6.123716354370117, "global_step": 12565, "epoch": 74} {"train_loss": -5.862928867340088, "global_step": 12566, "epoch": 74} {"train_loss": -6.110818862915039, "global_step": 12567, "epoch": 74} {"train_loss": -6.201406478881836, "global_step": 12568, "epoch": 74} {"train_loss": -6.247570991516113, "global_step": 12569, "epoch": 74} {"train_loss": -6.068540096282959, "global_step": 12570, "epoch": 74} {"train_loss": -6.198781967163086, "global_step": 12571, "epoch": 74} {"train_loss": -5.973567008972168, "global_step": 12572, "epoch": 74} {"train_loss": -5.979335784912109, "global_step": 12573, "epoch": 74} {"train_loss": -6.216749668121338, "global_step": 12574, "epoch": 74} {"train_loss": -5.92371940612793, "global_step": 12575, "epoch": 74} {"train_loss": -6.223441123962402, "global_step": 12576, "epoch": 74} {"train_loss": -6.105934143066406, "global_step": 12577, "epoch": 74} {"train_loss": -5.990322113037109, "global_step": 12578, "epoch": 74} {"train_loss": -6.109760284423828, "global_step": 12579, "epoch": 74} {"train_loss": -5.744849681854248, "global_step": 12580, "epoch": 74} {"train_loss": -5.936373710632324, "global_step": 12581, "epoch": 74} {"train_loss": -5.880195140838623, "global_step": 12582, "epoch": 74} {"train_loss": -5.707222938537598, "global_step": 12583, "epoch": 74} {"train_loss": -5.843256950378418, "global_step": 12584, "epoch": 74} {"train_loss": -6.028697967529297, "global_step": 12585, "epoch": 74} {"train_loss": -6.174783706665039, "global_step": 12586, "epoch": 74} {"train_loss": -6.113773345947266, "global_step": 12587, "epoch": 74} {"train_loss": -6.052431106567383, "global_step": 12588, "epoch": 74} {"train_loss": -5.7279157638549805, "global_step": 12589, "epoch": 74} {"train_loss": -6.022895812988281, "global_step": 12590, "epoch": 74} {"train_loss": -5.641444683074951, "global_step": 12591, "epoch": 74} {"train_loss": -6.022017478942871, "global_step": 12592, "epoch": 74} {"train_loss": -6.030776023864746, "global_step": 12593, "epoch": 74} {"train_loss": -6.185040473937988, "global_step": 12594, "epoch": 74} {"train_loss": -6.129159450531006, "global_step": 12595, "epoch": 74} {"train_loss": -6.020992279052734, "global_step": 12596, "epoch": 74} {"train_loss": -5.928353309631348, "global_step": 12597, "epoch": 74} {"train_loss": -6.094099521636963, "global_step": 12598, "epoch": 74} {"train_loss": -6.069124939895811, "global_step": 12599, "epoch": 74, "val_loss": 262113.65625} {"train_loss": -5.645050048828125, "global_step": 12600, "epoch": 75} {"train_loss": -6.090381622314453, "global_step": 12601, "epoch": 75} {"train_loss": -5.7898054122924805, "global_step": 12602, "epoch": 75} {"train_loss": -6.145191669464111, "global_step": 12603, "epoch": 75} {"train_loss": -5.6722493171691895, "global_step": 12604, "epoch": 75} {"train_loss": -6.125619888305664, "global_step": 12605, "epoch": 75} {"train_loss": -5.942822456359863, "global_step": 12606, "epoch": 75} {"train_loss": -6.007589817047119, "global_step": 12607, "epoch": 75} {"train_loss": -5.822744369506836, "global_step": 12608, "epoch": 75} {"train_loss": -5.976006507873535, "global_step": 12609, "epoch": 75} {"train_loss": -5.980485916137695, "global_step": 12610, "epoch": 75} {"train_loss": -5.864796161651611, "global_step": 12611, "epoch": 75} {"train_loss": -5.878079891204834, "global_step": 12612, "epoch": 75} {"train_loss": -5.881875991821289, "global_step": 12613, "epoch": 75} {"train_loss": -6.034746170043945, "global_step": 12614, "epoch": 75} {"train_loss": -5.857349395751953, "global_step": 12615, "epoch": 75} {"train_loss": -5.978891372680664, "global_step": 12616, "epoch": 75} {"train_loss": -6.05256462097168, "global_step": 12617, "epoch": 75} {"train_loss": -5.969202995300293, "global_step": 12618, "epoch": 75} {"train_loss": -6.095266819000244, "global_step": 12619, "epoch": 75} {"train_loss": -6.192442417144775, "global_step": 12620, "epoch": 75} {"train_loss": -6.01866340637207, "global_step": 12621, "epoch": 75} {"train_loss": -6.429696559906006, "global_step": 12622, "epoch": 75} {"train_loss": -5.702208995819092, "global_step": 12623, "epoch": 75} {"train_loss": -6.08722448348999, "global_step": 12624, "epoch": 75} {"train_loss": -6.079989910125732, "global_step": 12625, "epoch": 75} {"train_loss": -6.064657211303711, "global_step": 12626, "epoch": 75} {"train_loss": -5.871392250061035, "global_step": 12627, "epoch": 75} {"train_loss": -6.106304168701172, "global_step": 12628, "epoch": 75} {"train_loss": -6.136224746704102, "global_step": 12629, "epoch": 75} {"train_loss": -6.051603317260742, "global_step": 12630, "epoch": 75} {"train_loss": -6.366092205047607, "global_step": 12631, "epoch": 75} {"train_loss": -5.984691619873047, "global_step": 12632, "epoch": 75} {"train_loss": -6.244555950164795, "global_step": 12633, "epoch": 75} {"train_loss": -6.160849571228027, "global_step": 12634, "epoch": 75} {"train_loss": -6.0488104820251465, "global_step": 12635, "epoch": 75} {"train_loss": -5.882716178894043, "global_step": 12636, "epoch": 75} {"train_loss": -6.207938194274902, "global_step": 12637, "epoch": 75} {"train_loss": -6.17426872253418, "global_step": 12638, "epoch": 75} {"train_loss": -5.971588611602783, "global_step": 12639, "epoch": 75} {"train_loss": -6.022146701812744, "global_step": 12640, "epoch": 75} {"train_loss": -6.115446090698242, "global_step": 12641, "epoch": 75} {"train_loss": -5.894240379333496, "global_step": 12642, "epoch": 75} {"train_loss": -6.370421409606934, "global_step": 12643, "epoch": 75} {"train_loss": -6.280160427093506, "global_step": 12644, "epoch": 75} {"train_loss": -6.416426658630371, "global_step": 12645, "epoch": 75} {"train_loss": -6.229519844055176, "global_step": 12646, "epoch": 75} {"train_loss": -6.1004180908203125, "global_step": 12647, "epoch": 75} {"train_loss": -6.207759857177734, "global_step": 12648, "epoch": 75} {"train_loss": -6.074300765991211, "global_step": 12649, "epoch": 75} {"train_loss": -6.080090522766113, "global_step": 12650, "epoch": 75} {"train_loss": -6.292352199554443, "global_step": 12651, "epoch": 75} {"train_loss": -6.005829811096191, "global_step": 12652, "epoch": 75} {"train_loss": -5.801323413848877, "global_step": 12653, "epoch": 75} {"train_loss": -6.18076229095459, "global_step": 12654, "epoch": 75} {"train_loss": -6.163220405578613, "global_step": 12655, "epoch": 75} {"train_loss": -6.092019081115723, "global_step": 12656, "epoch": 75} {"train_loss": -6.221183776855469, "global_step": 12657, "epoch": 75} {"train_loss": -6.181829929351807, "global_step": 12658, "epoch": 75} {"train_loss": -6.237706184387207, "global_step": 12659, "epoch": 75} {"train_loss": -6.150643348693848, "global_step": 12660, "epoch": 75} {"train_loss": -6.052518844604492, "global_step": 12661, "epoch": 75} {"train_loss": -6.000493049621582, "global_step": 12662, "epoch": 75} {"train_loss": -5.758669853210449, "global_step": 12663, "epoch": 75} {"train_loss": -6.071594715118408, "global_step": 12664, "epoch": 75} {"train_loss": -5.917002201080322, "global_step": 12665, "epoch": 75} {"train_loss": -6.019634246826172, "global_step": 12666, "epoch": 75} {"train_loss": -6.013046741485596, "global_step": 12667, "epoch": 75} {"train_loss": -6.2327446937561035, "global_step": 12668, "epoch": 75} {"train_loss": -5.687098026275635, "global_step": 12669, "epoch": 75} {"train_loss": -6.036351203918457, "global_step": 12670, "epoch": 75} {"train_loss": -6.290661811828613, "global_step": 12671, "epoch": 75} {"train_loss": -5.838903903961182, "global_step": 12672, "epoch": 75} {"train_loss": -6.364178657531738, "global_step": 12673, "epoch": 75} {"train_loss": -5.83045768737793, "global_step": 12674, "epoch": 75} {"train_loss": -6.341863632202148, "global_step": 12675, "epoch": 75} {"train_loss": -6.065417289733887, "global_step": 12676, "epoch": 75} {"train_loss": -6.274191379547119, "global_step": 12677, "epoch": 75} {"train_loss": -6.068413734436035, "global_step": 12678, "epoch": 75} {"train_loss": -6.103548049926758, "global_step": 12679, "epoch": 75} {"train_loss": -5.5315842628479, "global_step": 12680, "epoch": 75} {"train_loss": -5.959511756896973, "global_step": 12681, "epoch": 75} {"train_loss": -5.743204116821289, "global_step": 12682, "epoch": 75} {"train_loss": -5.980345726013184, "global_step": 12683, "epoch": 75} {"train_loss": -6.16093635559082, "global_step": 12684, "epoch": 75} {"train_loss": -5.948088645935059, "global_step": 12685, "epoch": 75} {"train_loss": -6.211268424987793, "global_step": 12686, "epoch": 75} {"train_loss": -6.252601623535156, "global_step": 12687, "epoch": 75} {"train_loss": -6.063506126403809, "global_step": 12688, "epoch": 75} {"train_loss": -6.133900165557861, "global_step": 12689, "epoch": 75} {"train_loss": -5.9994659423828125, "global_step": 12690, "epoch": 75} {"train_loss": -5.7972540855407715, "global_step": 12691, "epoch": 75} {"train_loss": -5.6934309005737305, "global_step": 12692, "epoch": 75} {"train_loss": -5.889270782470703, "global_step": 12693, "epoch": 75} {"train_loss": -5.943882942199707, "global_step": 12694, "epoch": 75} {"train_loss": -6.067739963531494, "global_step": 12695, "epoch": 75} {"train_loss": -5.766919136047363, "global_step": 12696, "epoch": 75} {"train_loss": -6.030294418334961, "global_step": 12697, "epoch": 75} {"train_loss": -6.140625, "global_step": 12698, "epoch": 75} {"train_loss": -5.82505989074707, "global_step": 12699, "epoch": 75} {"train_loss": -6.111549377441406, "global_step": 12700, "epoch": 75} {"train_loss": -5.763378143310547, "global_step": 12701, "epoch": 75} {"train_loss": -6.16316032409668, "global_step": 12702, "epoch": 75} {"train_loss": -6.049530029296875, "global_step": 12703, "epoch": 75} {"train_loss": -5.815561294555664, "global_step": 12704, "epoch": 75} {"train_loss": -6.107211589813232, "global_step": 12705, "epoch": 75} {"train_loss": -5.910183429718018, "global_step": 12706, "epoch": 75} {"train_loss": -6.07624626159668, "global_step": 12707, "epoch": 75} {"train_loss": -6.283973693847656, "global_step": 12708, "epoch": 75} {"train_loss": -5.768380641937256, "global_step": 12709, "epoch": 75} {"train_loss": -5.829074859619141, "global_step": 12710, "epoch": 75} {"train_loss": -5.595468521118164, "global_step": 12711, "epoch": 75} {"train_loss": -6.167577266693115, "global_step": 12712, "epoch": 75} {"train_loss": -6.186175346374512, "global_step": 12713, "epoch": 75} {"train_loss": -6.15566349029541, "global_step": 12714, "epoch": 75} {"train_loss": -6.14866828918457, "global_step": 12715, "epoch": 75} {"train_loss": -6.21916389465332, "global_step": 12716, "epoch": 75} {"train_loss": -6.080591201782227, "global_step": 12717, "epoch": 75} {"train_loss": -5.793308258056641, "global_step": 12718, "epoch": 75} {"train_loss": -5.91196346282959, "global_step": 12719, "epoch": 75} {"train_loss": -6.229503154754639, "global_step": 12720, "epoch": 75} {"train_loss": -6.178563594818115, "global_step": 12721, "epoch": 75} {"train_loss": -6.202019691467285, "global_step": 12722, "epoch": 75} {"train_loss": -5.812900066375732, "global_step": 12723, "epoch": 75} {"train_loss": -6.1525092124938965, "global_step": 12724, "epoch": 75} {"train_loss": -6.264549732208252, "global_step": 12725, "epoch": 75} {"train_loss": -6.239882946014404, "global_step": 12726, "epoch": 75} {"train_loss": -6.28317928314209, "global_step": 12727, "epoch": 75} {"train_loss": -6.3291544914245605, "global_step": 12728, "epoch": 75} {"train_loss": -6.130724906921387, "global_step": 12729, "epoch": 75} {"train_loss": -6.297914981842041, "global_step": 12730, "epoch": 75} {"train_loss": -6.209112167358398, "global_step": 12731, "epoch": 75} {"train_loss": -6.231215953826904, "global_step": 12732, "epoch": 75} {"train_loss": -6.226223945617676, "global_step": 12733, "epoch": 75} {"train_loss": -6.186676025390625, "global_step": 12734, "epoch": 75} {"train_loss": -6.411944389343262, "global_step": 12735, "epoch": 75} {"train_loss": -6.053696632385254, "global_step": 12736, "epoch": 75} {"train_loss": -6.106673240661621, "global_step": 12737, "epoch": 75} {"train_loss": -6.113018035888672, "global_step": 12738, "epoch": 75} {"train_loss": -5.8918609619140625, "global_step": 12739, "epoch": 75} {"train_loss": -6.220300674438477, "global_step": 12740, "epoch": 75} {"train_loss": -5.717978477478027, "global_step": 12741, "epoch": 75} {"train_loss": -6.33051872253418, "global_step": 12742, "epoch": 75} {"train_loss": -5.572272300720215, "global_step": 12743, "epoch": 75} {"train_loss": -6.121371269226074, "global_step": 12744, "epoch": 75} {"train_loss": -5.750588417053223, "global_step": 12745, "epoch": 75} {"train_loss": -6.010653495788574, "global_step": 12746, "epoch": 75} {"train_loss": -5.837271690368652, "global_step": 12747, "epoch": 75} {"train_loss": -6.04925012588501, "global_step": 12748, "epoch": 75} {"train_loss": -6.288354396820068, "global_step": 12749, "epoch": 75} {"train_loss": -6.014735698699951, "global_step": 12750, "epoch": 75} {"train_loss": -6.214699745178223, "global_step": 12751, "epoch": 75} {"train_loss": -6.336219787597656, "global_step": 12752, "epoch": 75} {"train_loss": -5.927797317504883, "global_step": 12753, "epoch": 75} {"train_loss": -6.2034759521484375, "global_step": 12754, "epoch": 75} {"train_loss": -5.97191858291626, "global_step": 12755, "epoch": 75} {"train_loss": -6.240581512451172, "global_step": 12756, "epoch": 75} {"train_loss": -6.049505233764648, "global_step": 12757, "epoch": 75} {"train_loss": -6.229536056518555, "global_step": 12758, "epoch": 75} {"train_loss": -6.145832538604736, "global_step": 12759, "epoch": 75} {"train_loss": -5.944649696350098, "global_step": 12760, "epoch": 75} {"train_loss": -6.070029258728027, "global_step": 12761, "epoch": 75} {"train_loss": -6.0983991622924805, "global_step": 12762, "epoch": 75} {"train_loss": -5.91491174697876, "global_step": 12763, "epoch": 75} {"train_loss": -6.219171047210693, "global_step": 12764, "epoch": 75} {"train_loss": -6.16971492767334, "global_step": 12765, "epoch": 75} {"train_loss": -5.995265960693359, "global_step": 12766, "epoch": 75} {"train_loss": -6.053850602535975, "global_step": 12767, "epoch": 75, "val_loss": 252281.5, "train_action_mse_error": 40.290565490722656} {"train_loss": -6.040983200073242, "global_step": 12768, "epoch": 76} {"train_loss": -5.731512069702148, "global_step": 12769, "epoch": 76} {"train_loss": -6.191524505615234, "global_step": 12770, "epoch": 76} {"train_loss": -6.158601760864258, "global_step": 12771, "epoch": 76} {"train_loss": -6.206865310668945, "global_step": 12772, "epoch": 76} {"train_loss": -6.190430164337158, "global_step": 12773, "epoch": 76} {"train_loss": -5.964574813842773, "global_step": 12774, "epoch": 76} {"train_loss": -6.135412216186523, "global_step": 12775, "epoch": 76} {"train_loss": -5.986363410949707, "global_step": 12776, "epoch": 76} {"train_loss": -6.041103839874268, "global_step": 12777, "epoch": 76} {"train_loss": -6.229918003082275, "global_step": 12778, "epoch": 76} {"train_loss": -6.161611557006836, "global_step": 12779, "epoch": 76} {"train_loss": -6.2611541748046875, "global_step": 12780, "epoch": 76} {"train_loss": -5.9899678230285645, "global_step": 12781, "epoch": 76} {"train_loss": -5.958682060241699, "global_step": 12782, "epoch": 76} {"train_loss": -6.061737060546875, "global_step": 12783, "epoch": 76} {"train_loss": -5.988831520080566, "global_step": 12784, "epoch": 76} {"train_loss": -6.319395542144775, "global_step": 12785, "epoch": 76} {"train_loss": -6.2159528732299805, "global_step": 12786, "epoch": 76} {"train_loss": -6.199007034301758, "global_step": 12787, "epoch": 76} {"train_loss": -6.13577127456665, "global_step": 12788, "epoch": 76} {"train_loss": -6.3302812576293945, "global_step": 12789, "epoch": 76} {"train_loss": -6.212899208068848, "global_step": 12790, "epoch": 76} {"train_loss": -6.14459753036499, "global_step": 12791, "epoch": 76} {"train_loss": -6.2978363037109375, "global_step": 12792, "epoch": 76} {"train_loss": -6.256657600402832, "global_step": 12793, "epoch": 76} {"train_loss": -6.481006622314453, "global_step": 12794, "epoch": 76} {"train_loss": -6.052168846130371, "global_step": 12795, "epoch": 76} {"train_loss": -6.241479873657227, "global_step": 12796, "epoch": 76} {"train_loss": -6.382611274719238, "global_step": 12797, "epoch": 76} {"train_loss": -6.453182697296143, "global_step": 12798, "epoch": 76} {"train_loss": -6.155561447143555, "global_step": 12799, "epoch": 76} {"train_loss": -6.163773536682129, "global_step": 12800, "epoch": 76} {"train_loss": -6.312865734100342, "global_step": 12801, "epoch": 76} {"train_loss": -6.192193984985352, "global_step": 12802, "epoch": 76} {"train_loss": -6.102212905883789, "global_step": 12803, "epoch": 76} {"train_loss": -5.916160583496094, "global_step": 12804, "epoch": 76} {"train_loss": -6.137938499450684, "global_step": 12805, "epoch": 76} {"train_loss": -5.857155799865723, "global_step": 12806, "epoch": 76} {"train_loss": -6.243473052978516, "global_step": 12807, "epoch": 76} {"train_loss": -5.970165729522705, "global_step": 12808, "epoch": 76} {"train_loss": -6.051851272583008, "global_step": 12809, "epoch": 76} {"train_loss": -5.993458271026611, "global_step": 12810, "epoch": 76} {"train_loss": -5.8526930809021, "global_step": 12811, "epoch": 76} {"train_loss": -6.288315296173096, "global_step": 12812, "epoch": 76} {"train_loss": -6.121358871459961, "global_step": 12813, "epoch": 76} {"train_loss": -6.060137748718262, "global_step": 12814, "epoch": 76} {"train_loss": -6.000515937805176, "global_step": 12815, "epoch": 76} {"train_loss": -6.0768632888793945, "global_step": 12816, "epoch": 76} {"train_loss": -6.192357063293457, "global_step": 12817, "epoch": 76} {"train_loss": -6.23342227935791, "global_step": 12818, "epoch": 76} {"train_loss": -6.118649482727051, "global_step": 12819, "epoch": 76} {"train_loss": -6.239863395690918, "global_step": 12820, "epoch": 76} {"train_loss": -6.117222309112549, "global_step": 12821, "epoch": 76} {"train_loss": -5.6927900314331055, "global_step": 12822, "epoch": 76} {"train_loss": -6.117257595062256, "global_step": 12823, "epoch": 76} {"train_loss": -6.141001224517822, "global_step": 12824, "epoch": 76} {"train_loss": -6.3123064041137695, "global_step": 12825, "epoch": 76} {"train_loss": -6.304640769958496, "global_step": 12826, "epoch": 76} {"train_loss": -6.21635103225708, "global_step": 12827, "epoch": 76} {"train_loss": -6.2102155685424805, "global_step": 12828, "epoch": 76} {"train_loss": -6.447261810302734, "global_step": 12829, "epoch": 76} {"train_loss": -6.238316535949707, "global_step": 12830, "epoch": 76} {"train_loss": -6.35577392578125, "global_step": 12831, "epoch": 76} {"train_loss": -5.970959663391113, "global_step": 12832, "epoch": 76} {"train_loss": -6.367495059967041, "global_step": 12833, "epoch": 76} {"train_loss": -5.996311187744141, "global_step": 12834, "epoch": 76} {"train_loss": -5.740633964538574, "global_step": 12835, "epoch": 76} {"train_loss": -6.145133972167969, "global_step": 12836, "epoch": 76} {"train_loss": -5.764378547668457, "global_step": 12837, "epoch": 76} {"train_loss": -6.045894622802734, "global_step": 12838, "epoch": 76} {"train_loss": -5.754214763641357, "global_step": 12839, "epoch": 76} {"train_loss": -5.64831018447876, "global_step": 12840, "epoch": 76} {"train_loss": -5.885128498077393, "global_step": 12841, "epoch": 76} {"train_loss": -6.143453121185303, "global_step": 12842, "epoch": 76} {"train_loss": -5.94035530090332, "global_step": 12843, "epoch": 76} {"train_loss": -6.138423442840576, "global_step": 12844, "epoch": 76} {"train_loss": -5.9431047439575195, "global_step": 12845, "epoch": 76} {"train_loss": -6.164412498474121, "global_step": 12846, "epoch": 76} {"train_loss": -5.886399745941162, "global_step": 12847, "epoch": 76} {"train_loss": -5.755651473999023, "global_step": 12848, "epoch": 76} {"train_loss": -5.992780685424805, "global_step": 12849, "epoch": 76} {"train_loss": -6.053424835205078, "global_step": 12850, "epoch": 76} {"train_loss": -6.028857707977295, "global_step": 12851, "epoch": 76} {"train_loss": -6.0977301597595215, "global_step": 12852, "epoch": 76} {"train_loss": -6.255321502685547, "global_step": 12853, "epoch": 76} {"train_loss": -6.076320648193359, "global_step": 12854, "epoch": 76} {"train_loss": -5.889359951019287, "global_step": 12855, "epoch": 76} {"train_loss": -6.113509178161621, "global_step": 12856, "epoch": 76} {"train_loss": -6.286750793457031, "global_step": 12857, "epoch": 76} {"train_loss": -6.1321611404418945, "global_step": 12858, "epoch": 76} {"train_loss": -5.927168846130371, "global_step": 12859, "epoch": 76} {"train_loss": -6.02794075012207, "global_step": 12860, "epoch": 76} {"train_loss": -6.22006893157959, "global_step": 12861, "epoch": 76} {"train_loss": -6.165360450744629, "global_step": 12862, "epoch": 76} {"train_loss": -6.267341613769531, "global_step": 12863, "epoch": 76} {"train_loss": -6.200210094451904, "global_step": 12864, "epoch": 76} {"train_loss": -6.310276031494141, "global_step": 12865, "epoch": 76} {"train_loss": -6.011835098266602, "global_step": 12866, "epoch": 76} {"train_loss": -6.031122207641602, "global_step": 12867, "epoch": 76} {"train_loss": -6.231691360473633, "global_step": 12868, "epoch": 76} {"train_loss": -6.138852119445801, "global_step": 12869, "epoch": 76} {"train_loss": -6.135060787200928, "global_step": 12870, "epoch": 76} {"train_loss": -6.410820007324219, "global_step": 12871, "epoch": 76} {"train_loss": -6.174559593200684, "global_step": 12872, "epoch": 76} {"train_loss": -6.296895980834961, "global_step": 12873, "epoch": 76} {"train_loss": -6.253162860870361, "global_step": 12874, "epoch": 76} {"train_loss": -5.952523231506348, "global_step": 12875, "epoch": 76} {"train_loss": -6.191239356994629, "global_step": 12876, "epoch": 76} {"train_loss": -5.965185165405273, "global_step": 12877, "epoch": 76} {"train_loss": -6.027553558349609, "global_step": 12878, "epoch": 76} {"train_loss": -6.072179794311523, "global_step": 12879, "epoch": 76} {"train_loss": -6.217716217041016, "global_step": 12880, "epoch": 76} {"train_loss": -5.981649398803711, "global_step": 12881, "epoch": 76} {"train_loss": -6.234913349151611, "global_step": 12882, "epoch": 76} {"train_loss": -6.078401565551758, "global_step": 12883, "epoch": 76} {"train_loss": -6.180204391479492, "global_step": 12884, "epoch": 76} {"train_loss": -6.000460624694824, "global_step": 12885, "epoch": 76} {"train_loss": -5.990983009338379, "global_step": 12886, "epoch": 76} {"train_loss": -6.1702189445495605, "global_step": 12887, "epoch": 76} {"train_loss": -6.110410690307617, "global_step": 12888, "epoch": 76} {"train_loss": -5.935619831085205, "global_step": 12889, "epoch": 76} {"train_loss": -6.03354549407959, "global_step": 12890, "epoch": 76} {"train_loss": -6.056064128875732, "global_step": 12891, "epoch": 76} {"train_loss": -6.1375932693481445, "global_step": 12892, "epoch": 76} {"train_loss": -6.323830604553223, "global_step": 12893, "epoch": 76} {"train_loss": -6.089621067047119, "global_step": 12894, "epoch": 76} {"train_loss": -6.109997749328613, "global_step": 12895, "epoch": 76} {"train_loss": -6.469016075134277, "global_step": 12896, "epoch": 76} {"train_loss": -6.151149272918701, "global_step": 12897, "epoch": 76} {"train_loss": -6.087350368499756, "global_step": 12898, "epoch": 76} {"train_loss": -5.982109546661377, "global_step": 12899, "epoch": 76} {"train_loss": -6.353594779968262, "global_step": 12900, "epoch": 76} {"train_loss": -6.287243366241455, "global_step": 12901, "epoch": 76} {"train_loss": -6.028692722320557, "global_step": 12902, "epoch": 76} {"train_loss": -6.256956100463867, "global_step": 12903, "epoch": 76} {"train_loss": -6.077491760253906, "global_step": 12904, "epoch": 76} {"train_loss": -6.235115051269531, "global_step": 12905, "epoch": 76} {"train_loss": -5.935845851898193, "global_step": 12906, "epoch": 76} {"train_loss": -6.163846015930176, "global_step": 12907, "epoch": 76} {"train_loss": -6.259246349334717, "global_step": 12908, "epoch": 76} {"train_loss": -6.23002815246582, "global_step": 12909, "epoch": 76} {"train_loss": -6.244283199310303, "global_step": 12910, "epoch": 76} {"train_loss": -6.239577770233154, "global_step": 12911, "epoch": 76} {"train_loss": -6.050817489624023, "global_step": 12912, "epoch": 76} {"train_loss": -6.189985275268555, "global_step": 12913, "epoch": 76} {"train_loss": -6.424116134643555, "global_step": 12914, "epoch": 76} {"train_loss": -6.015718460083008, "global_step": 12915, "epoch": 76} {"train_loss": -6.034013748168945, "global_step": 12916, "epoch": 76} {"train_loss": -5.9744486808776855, "global_step": 12917, "epoch": 76} {"train_loss": -6.158451080322266, "global_step": 12918, "epoch": 76} {"train_loss": -6.1322712898254395, "global_step": 12919, "epoch": 76} {"train_loss": -5.8832597732543945, "global_step": 12920, "epoch": 76} {"train_loss": -5.948709487915039, "global_step": 12921, "epoch": 76} {"train_loss": -6.040773391723633, "global_step": 12922, "epoch": 76} {"train_loss": -6.230598449707031, "global_step": 12923, "epoch": 76} {"train_loss": -6.25655460357666, "global_step": 12924, "epoch": 76} {"train_loss": -6.313129425048828, "global_step": 12925, "epoch": 76} {"train_loss": -6.170652866363525, "global_step": 12926, "epoch": 76} {"train_loss": -6.151519298553467, "global_step": 12927, "epoch": 76} {"train_loss": -6.169833660125732, "global_step": 12928, "epoch": 76} {"train_loss": -5.944447994232178, "global_step": 12929, "epoch": 76} {"train_loss": -5.862109661102295, "global_step": 12930, "epoch": 76} {"train_loss": -5.894200325012207, "global_step": 12931, "epoch": 76} {"train_loss": -5.8555803298950195, "global_step": 12932, "epoch": 76} {"train_loss": -5.941776275634766, "global_step": 12933, "epoch": 76} {"train_loss": -5.819854736328125, "global_step": 12934, "epoch": 76} {"train_loss": -6.11270611059098, "global_step": 12935, "epoch": 76, "val_loss": 250778.859375} {"train_loss": -6.295382499694824, "global_step": 12936, "epoch": 77} {"train_loss": -5.812446594238281, "global_step": 12937, "epoch": 77} {"train_loss": -5.99555778503418, "global_step": 12938, "epoch": 77} {"train_loss": -5.863640785217285, "global_step": 12939, "epoch": 77} {"train_loss": -6.023159027099609, "global_step": 12940, "epoch": 77} {"train_loss": -6.018177032470703, "global_step": 12941, "epoch": 77} {"train_loss": -5.916380882263184, "global_step": 12942, "epoch": 77} {"train_loss": -6.205175399780273, "global_step": 12943, "epoch": 77} {"train_loss": -5.748370170593262, "global_step": 12944, "epoch": 77} {"train_loss": -6.0915985107421875, "global_step": 12945, "epoch": 77} {"train_loss": -6.028688907623291, "global_step": 12946, "epoch": 77} {"train_loss": -5.839767932891846, "global_step": 12947, "epoch": 77} {"train_loss": -5.974584579467773, "global_step": 12948, "epoch": 77} {"train_loss": -6.112269401550293, "global_step": 12949, "epoch": 77} {"train_loss": -6.02166748046875, "global_step": 12950, "epoch": 77} {"train_loss": -5.988043785095215, "global_step": 12951, "epoch": 77} {"train_loss": -6.196950912475586, "global_step": 12952, "epoch": 77} {"train_loss": -6.190314769744873, "global_step": 12953, "epoch": 77} {"train_loss": -6.313414573669434, "global_step": 12954, "epoch": 77} {"train_loss": -6.276796340942383, "global_step": 12955, "epoch": 77} {"train_loss": -6.215758323669434, "global_step": 12956, "epoch": 77} {"train_loss": -6.159116744995117, "global_step": 12957, "epoch": 77} {"train_loss": -6.138039588928223, "global_step": 12958, "epoch": 77} {"train_loss": -6.306830883026123, "global_step": 12959, "epoch": 77} {"train_loss": -6.148401260375977, "global_step": 12960, "epoch": 77} {"train_loss": -6.14599609375, "global_step": 12961, "epoch": 77} {"train_loss": -6.199073314666748, "global_step": 12962, "epoch": 77} {"train_loss": -6.051535606384277, "global_step": 12963, "epoch": 77} {"train_loss": -6.081795692443848, "global_step": 12964, "epoch": 77} {"train_loss": -6.055095672607422, "global_step": 12965, "epoch": 77} {"train_loss": -6.208006858825684, "global_step": 12966, "epoch": 77} {"train_loss": -6.136327266693115, "global_step": 12967, "epoch": 77} {"train_loss": -6.363516807556152, "global_step": 12968, "epoch": 77} {"train_loss": -6.025298118591309, "global_step": 12969, "epoch": 77} {"train_loss": -6.137353897094727, "global_step": 12970, "epoch": 77} {"train_loss": -6.227960109710693, "global_step": 12971, "epoch": 77} {"train_loss": -6.122101783752441, "global_step": 12972, "epoch": 77} {"train_loss": -6.2232818603515625, "global_step": 12973, "epoch": 77} {"train_loss": -6.190441608428955, "global_step": 12974, "epoch": 77} {"train_loss": -6.330368995666504, "global_step": 12975, "epoch": 77} {"train_loss": -6.4592132568359375, "global_step": 12976, "epoch": 77} {"train_loss": -6.026076316833496, "global_step": 12977, "epoch": 77} {"train_loss": -5.864012718200684, "global_step": 12978, "epoch": 77} {"train_loss": -6.041290283203125, "global_step": 12979, "epoch": 77} {"train_loss": -5.997436046600342, "global_step": 12980, "epoch": 77} {"train_loss": -6.1571173667907715, "global_step": 12981, "epoch": 77} {"train_loss": -6.228203773498535, "global_step": 12982, "epoch": 77} {"train_loss": -6.029146671295166, "global_step": 12983, "epoch": 77} {"train_loss": -6.068000793457031, "global_step": 12984, "epoch": 77} {"train_loss": -5.986034870147705, "global_step": 12985, "epoch": 77} {"train_loss": -6.1139984130859375, "global_step": 12986, "epoch": 77} {"train_loss": -6.1595001220703125, "global_step": 12987, "epoch": 77} {"train_loss": -6.008569240570068, "global_step": 12988, "epoch": 77} {"train_loss": -6.065366268157959, "global_step": 12989, "epoch": 77} {"train_loss": -6.111771583557129, "global_step": 12990, "epoch": 77} {"train_loss": -6.035421848297119, "global_step": 12991, "epoch": 77} {"train_loss": -6.030028343200684, "global_step": 12992, "epoch": 77} {"train_loss": -6.17863130569458, "global_step": 12993, "epoch": 77} {"train_loss": -6.0287885665893555, "global_step": 12994, "epoch": 77} {"train_loss": -6.012631416320801, "global_step": 12995, "epoch": 77} {"train_loss": -6.003500461578369, "global_step": 12996, "epoch": 77} {"train_loss": -6.046801567077637, "global_step": 12997, "epoch": 77} {"train_loss": -6.117160797119141, "global_step": 12998, "epoch": 77} {"train_loss": -5.901619911193848, "global_step": 12999, "epoch": 77} {"train_loss": -6.268516540527344, "global_step": 13000, "epoch": 77} {"train_loss": -5.743752479553223, "global_step": 13001, "epoch": 77} {"train_loss": -6.362429618835449, "global_step": 13002, "epoch": 77} {"train_loss": -5.867957592010498, "global_step": 13003, "epoch": 77} {"train_loss": -6.222498893737793, "global_step": 13004, "epoch": 77} {"train_loss": -6.080548286437988, "global_step": 13005, "epoch": 77} {"train_loss": -5.913808822631836, "global_step": 13006, "epoch": 77} {"train_loss": -6.216493606567383, "global_step": 13007, "epoch": 77} {"train_loss": -6.189887523651123, "global_step": 13008, "epoch": 77} {"train_loss": -6.224280834197998, "global_step": 13009, "epoch": 77} {"train_loss": -6.1153483390808105, "global_step": 13010, "epoch": 77} {"train_loss": -6.110645294189453, "global_step": 13011, "epoch": 77} {"train_loss": -6.239162921905518, "global_step": 13012, "epoch": 77} {"train_loss": -6.3113250732421875, "global_step": 13013, "epoch": 77} {"train_loss": -5.962160110473633, "global_step": 13014, "epoch": 77} {"train_loss": -6.252072334289551, "global_step": 13015, "epoch": 77} {"train_loss": -6.309259414672852, "global_step": 13016, "epoch": 77} {"train_loss": -6.161798477172852, "global_step": 13017, "epoch": 77} {"train_loss": -6.233272552490234, "global_step": 13018, "epoch": 77} {"train_loss": -6.310256004333496, "global_step": 13019, "epoch": 77} {"train_loss": -6.120762825012207, "global_step": 13020, "epoch": 77} {"train_loss": -6.314786911010742, "global_step": 13021, "epoch": 77} {"train_loss": -6.16416597366333, "global_step": 13022, "epoch": 77} {"train_loss": -6.222233295440674, "global_step": 13023, "epoch": 77} {"train_loss": -6.343681335449219, "global_step": 13024, "epoch": 77} {"train_loss": -6.261651039123535, "global_step": 13025, "epoch": 77} {"train_loss": -6.374686241149902, "global_step": 13026, "epoch": 77} {"train_loss": -6.260359764099121, "global_step": 13027, "epoch": 77} {"train_loss": -6.106988906860352, "global_step": 13028, "epoch": 77} {"train_loss": -6.266059875488281, "global_step": 13029, "epoch": 77} {"train_loss": -5.979121208190918, "global_step": 13030, "epoch": 77} {"train_loss": -6.373435020446777, "global_step": 13031, "epoch": 77} {"train_loss": -6.054124355316162, "global_step": 13032, "epoch": 77} {"train_loss": -6.0729570388793945, "global_step": 13033, "epoch": 77} {"train_loss": -6.143051624298096, "global_step": 13034, "epoch": 77} {"train_loss": -6.127392292022705, "global_step": 13035, "epoch": 77} {"train_loss": -6.192415237426758, "global_step": 13036, "epoch": 77} {"train_loss": -6.156064987182617, "global_step": 13037, "epoch": 77} {"train_loss": -6.325773239135742, "global_step": 13038, "epoch": 77} {"train_loss": -6.172513961791992, "global_step": 13039, "epoch": 77} {"train_loss": -6.270829200744629, "global_step": 13040, "epoch": 77} {"train_loss": -6.247397422790527, "global_step": 13041, "epoch": 77} {"train_loss": -5.914209365844727, "global_step": 13042, "epoch": 77} {"train_loss": -6.056417465209961, "global_step": 13043, "epoch": 77} {"train_loss": -5.796398162841797, "global_step": 13044, "epoch": 77} {"train_loss": -6.12904167175293, "global_step": 13045, "epoch": 77} {"train_loss": -6.052674293518066, "global_step": 13046, "epoch": 77} {"train_loss": -6.22968053817749, "global_step": 13047, "epoch": 77} {"train_loss": -6.083898544311523, "global_step": 13048, "epoch": 77} {"train_loss": -6.155238151550293, "global_step": 13049, "epoch": 77} {"train_loss": -5.8279571533203125, "global_step": 13050, "epoch": 77} {"train_loss": -5.9630842208862305, "global_step": 13051, "epoch": 77} {"train_loss": -5.912724494934082, "global_step": 13052, "epoch": 77} {"train_loss": -6.060660362243652, "global_step": 13053, "epoch": 77} {"train_loss": -5.925429344177246, "global_step": 13054, "epoch": 77} {"train_loss": -6.2731475830078125, "global_step": 13055, "epoch": 77} {"train_loss": -5.837714672088623, "global_step": 13056, "epoch": 77} {"train_loss": -6.222445011138916, "global_step": 13057, "epoch": 77} {"train_loss": -6.134089946746826, "global_step": 13058, "epoch": 77} {"train_loss": -6.302109718322754, "global_step": 13059, "epoch": 77} {"train_loss": -6.259688377380371, "global_step": 13060, "epoch": 77} {"train_loss": -6.275769233703613, "global_step": 13061, "epoch": 77} {"train_loss": -6.410368919372559, "global_step": 13062, "epoch": 77} {"train_loss": -6.338639259338379, "global_step": 13063, "epoch": 77} {"train_loss": -6.2159576416015625, "global_step": 13064, "epoch": 77} {"train_loss": -6.289631366729736, "global_step": 13065, "epoch": 77} {"train_loss": -5.96000862121582, "global_step": 13066, "epoch": 77} {"train_loss": -6.246331214904785, "global_step": 13067, "epoch": 77} {"train_loss": -6.031459331512451, "global_step": 13068, "epoch": 77} {"train_loss": -6.0723371505737305, "global_step": 13069, "epoch": 77} {"train_loss": -6.273432731628418, "global_step": 13070, "epoch": 77} {"train_loss": -6.226059913635254, "global_step": 13071, "epoch": 77} {"train_loss": -6.114675521850586, "global_step": 13072, "epoch": 77} {"train_loss": -6.182106971740723, "global_step": 13073, "epoch": 77} {"train_loss": -6.042890548706055, "global_step": 13074, "epoch": 77} {"train_loss": -6.030605792999268, "global_step": 13075, "epoch": 77} {"train_loss": -6.232238292694092, "global_step": 13076, "epoch": 77} {"train_loss": -6.243588447570801, "global_step": 13077, "epoch": 77} {"train_loss": -5.751028060913086, "global_step": 13078, "epoch": 77} {"train_loss": -6.336044788360596, "global_step": 13079, "epoch": 77} {"train_loss": -6.075428485870361, "global_step": 13080, "epoch": 77} {"train_loss": -5.972152233123779, "global_step": 13081, "epoch": 77} {"train_loss": -6.08527946472168, "global_step": 13082, "epoch": 77} {"train_loss": -6.205496311187744, "global_step": 13083, "epoch": 77} {"train_loss": -6.087055206298828, "global_step": 13084, "epoch": 77} {"train_loss": -6.2828874588012695, "global_step": 13085, "epoch": 77} {"train_loss": -6.234781265258789, "global_step": 13086, "epoch": 77} {"train_loss": -6.413339614868164, "global_step": 13087, "epoch": 77} {"train_loss": -6.291298866271973, "global_step": 13088, "epoch": 77} {"train_loss": -6.258334636688232, "global_step": 13089, "epoch": 77} {"train_loss": -6.130953788757324, "global_step": 13090, "epoch": 77} {"train_loss": -6.132060527801514, "global_step": 13091, "epoch": 77} {"train_loss": -5.939267635345459, "global_step": 13092, "epoch": 77} {"train_loss": -6.281949043273926, "global_step": 13093, "epoch": 77} {"train_loss": -6.227314472198486, "global_step": 13094, "epoch": 77} {"train_loss": -6.111027717590332, "global_step": 13095, "epoch": 77} {"train_loss": -6.030858039855957, "global_step": 13096, "epoch": 77} {"train_loss": -6.111964225769043, "global_step": 13097, "epoch": 77} {"train_loss": -6.146134853363037, "global_step": 13098, "epoch": 77} {"train_loss": -6.038782596588135, "global_step": 13099, "epoch": 77} {"train_loss": -6.1665849685668945, "global_step": 13100, "epoch": 77} {"train_loss": -6.1409101486206055, "global_step": 13101, "epoch": 77} {"train_loss": -5.713287830352783, "global_step": 13102, "epoch": 77} {"train_loss": -6.125960625353313, "global_step": 13103, "epoch": 77, "val_loss": 263621.3125} {"train_loss": -5.987815856933594, "global_step": 13104, "epoch": 78} {"train_loss": -6.047206878662109, "global_step": 13105, "epoch": 78} {"train_loss": -6.015163421630859, "global_step": 13106, "epoch": 78} {"train_loss": -6.12678337097168, "global_step": 13107, "epoch": 78} {"train_loss": -5.97019100189209, "global_step": 13108, "epoch": 78} {"train_loss": -6.138920783996582, "global_step": 13109, "epoch": 78} {"train_loss": -6.168848991394043, "global_step": 13110, "epoch": 78} {"train_loss": -5.951008319854736, "global_step": 13111, "epoch": 78} {"train_loss": -6.307692527770996, "global_step": 13112, "epoch": 78} {"train_loss": -6.097032070159912, "global_step": 13113, "epoch": 78} {"train_loss": -6.456387042999268, "global_step": 13114, "epoch": 78} {"train_loss": -6.141882419586182, "global_step": 13115, "epoch": 78} {"train_loss": -6.53153657913208, "global_step": 13116, "epoch": 78} {"train_loss": -6.014437198638916, "global_step": 13117, "epoch": 78} {"train_loss": -6.026128768920898, "global_step": 13118, "epoch": 78} {"train_loss": -6.092508316040039, "global_step": 13119, "epoch": 78} {"train_loss": -6.323768615722656, "global_step": 13120, "epoch": 78} {"train_loss": -6.174849987030029, "global_step": 13121, "epoch": 78} {"train_loss": -6.045100212097168, "global_step": 13122, "epoch": 78} {"train_loss": -6.298959255218506, "global_step": 13123, "epoch": 78} {"train_loss": -6.080881118774414, "global_step": 13124, "epoch": 78} {"train_loss": -6.204946994781494, "global_step": 13125, "epoch": 78} {"train_loss": -5.881613731384277, "global_step": 13126, "epoch": 78} {"train_loss": -6.035303115844727, "global_step": 13127, "epoch": 78} {"train_loss": -5.729508399963379, "global_step": 13128, "epoch": 78} {"train_loss": -6.1531596183776855, "global_step": 13129, "epoch": 78} {"train_loss": -6.156469345092773, "global_step": 13130, "epoch": 78} {"train_loss": -6.166286468505859, "global_step": 13131, "epoch": 78} {"train_loss": -6.180083274841309, "global_step": 13132, "epoch": 78} {"train_loss": -6.205300807952881, "global_step": 13133, "epoch": 78} {"train_loss": -5.907989501953125, "global_step": 13134, "epoch": 78} {"train_loss": -6.182110786437988, "global_step": 13135, "epoch": 78} {"train_loss": -6.06402063369751, "global_step": 13136, "epoch": 78} {"train_loss": -6.199527740478516, "global_step": 13137, "epoch": 78} {"train_loss": -6.079999923706055, "global_step": 13138, "epoch": 78} {"train_loss": -6.380931377410889, "global_step": 13139, "epoch": 78} {"train_loss": -6.029784202575684, "global_step": 13140, "epoch": 78} {"train_loss": -6.136214256286621, "global_step": 13141, "epoch": 78} {"train_loss": -6.031465530395508, "global_step": 13142, "epoch": 78} {"train_loss": -6.043848037719727, "global_step": 13143, "epoch": 78} {"train_loss": -5.8899383544921875, "global_step": 13144, "epoch": 78} {"train_loss": -6.015991687774658, "global_step": 13145, "epoch": 78} {"train_loss": -6.274479866027832, "global_step": 13146, "epoch": 78} {"train_loss": -6.159083366394043, "global_step": 13147, "epoch": 78} {"train_loss": -6.070290565490723, "global_step": 13148, "epoch": 78} {"train_loss": -6.085087299346924, "global_step": 13149, "epoch": 78} {"train_loss": -6.159214019775391, "global_step": 13150, "epoch": 78} {"train_loss": -6.173511505126953, "global_step": 13151, "epoch": 78} {"train_loss": -5.81392765045166, "global_step": 13152, "epoch": 78} {"train_loss": -6.325804710388184, "global_step": 13153, "epoch": 78} {"train_loss": -6.020194053649902, "global_step": 13154, "epoch": 78} {"train_loss": -6.181075572967529, "global_step": 13155, "epoch": 78} {"train_loss": -6.057113170623779, "global_step": 13156, "epoch": 78} {"train_loss": -6.080660820007324, "global_step": 13157, "epoch": 78} {"train_loss": -5.97471809387207, "global_step": 13158, "epoch": 78} {"train_loss": -5.957032203674316, "global_step": 13159, "epoch": 78} {"train_loss": -5.930728912353516, "global_step": 13160, "epoch": 78} {"train_loss": -6.07976770401001, "global_step": 13161, "epoch": 78} {"train_loss": -6.225935459136963, "global_step": 13162, "epoch": 78} {"train_loss": -6.042491436004639, "global_step": 13163, "epoch": 78} {"train_loss": -6.24126672744751, "global_step": 13164, "epoch": 78} {"train_loss": -6.197235107421875, "global_step": 13165, "epoch": 78} {"train_loss": -6.217449188232422, "global_step": 13166, "epoch": 78} {"train_loss": -6.172604560852051, "global_step": 13167, "epoch": 78} {"train_loss": -5.8184685707092285, "global_step": 13168, "epoch": 78} {"train_loss": -5.885148525238037, "global_step": 13169, "epoch": 78} {"train_loss": -6.177221298217773, "global_step": 13170, "epoch": 78} {"train_loss": -5.980621337890625, "global_step": 13171, "epoch": 78} {"train_loss": -6.371103286743164, "global_step": 13172, "epoch": 78} {"train_loss": -5.939911365509033, "global_step": 13173, "epoch": 78} {"train_loss": -6.170867443084717, "global_step": 13174, "epoch": 78} {"train_loss": -6.02885103225708, "global_step": 13175, "epoch": 78} {"train_loss": -6.178150177001953, "global_step": 13176, "epoch": 78} {"train_loss": -6.129833221435547, "global_step": 13177, "epoch": 78} {"train_loss": -5.837043285369873, "global_step": 13178, "epoch": 78} {"train_loss": -6.035831451416016, "global_step": 13179, "epoch": 78} {"train_loss": -5.978407859802246, "global_step": 13180, "epoch": 78} {"train_loss": -6.275537490844727, "global_step": 13181, "epoch": 78} {"train_loss": -6.125782489776611, "global_step": 13182, "epoch": 78} {"train_loss": -6.321341514587402, "global_step": 13183, "epoch": 78} {"train_loss": -6.181127548217773, "global_step": 13184, "epoch": 78} {"train_loss": -5.9006829261779785, "global_step": 13185, "epoch": 78} {"train_loss": -6.122669219970703, "global_step": 13186, "epoch": 78} {"train_loss": -6.141895771026611, "global_step": 13187, "epoch": 78} {"train_loss": -6.01076078414917, "global_step": 13188, "epoch": 78} {"train_loss": -6.140443801879883, "global_step": 13189, "epoch": 78} {"train_loss": -6.191435813903809, "global_step": 13190, "epoch": 78} {"train_loss": -6.20522403717041, "global_step": 13191, "epoch": 78} {"train_loss": -5.91626501083374, "global_step": 13192, "epoch": 78} {"train_loss": -6.153528213500977, "global_step": 13193, "epoch": 78} {"train_loss": -6.3548078536987305, "global_step": 13194, "epoch": 78} {"train_loss": -6.185904502868652, "global_step": 13195, "epoch": 78} {"train_loss": -6.018935203552246, "global_step": 13196, "epoch": 78} {"train_loss": -6.275854587554932, "global_step": 13197, "epoch": 78} {"train_loss": -6.095854759216309, "global_step": 13198, "epoch": 78} {"train_loss": -5.918674945831299, "global_step": 13199, "epoch": 78} {"train_loss": -6.127570629119873, "global_step": 13200, "epoch": 78} {"train_loss": -6.097744941711426, "global_step": 13201, "epoch": 78} {"train_loss": -6.339681148529053, "global_step": 13202, "epoch": 78} {"train_loss": -6.234107971191406, "global_step": 13203, "epoch": 78} {"train_loss": -6.392258644104004, "global_step": 13204, "epoch": 78} {"train_loss": -5.945896625518799, "global_step": 13205, "epoch": 78} {"train_loss": -6.23970365524292, "global_step": 13206, "epoch": 78} {"train_loss": -6.050673484802246, "global_step": 13207, "epoch": 78} {"train_loss": -6.1368255615234375, "global_step": 13208, "epoch": 78} {"train_loss": -6.142489433288574, "global_step": 13209, "epoch": 78} {"train_loss": -6.281004905700684, "global_step": 13210, "epoch": 78} {"train_loss": -6.188419818878174, "global_step": 13211, "epoch": 78} {"train_loss": -6.281688690185547, "global_step": 13212, "epoch": 78} {"train_loss": -6.16433048248291, "global_step": 13213, "epoch": 78} {"train_loss": -6.244865417480469, "global_step": 13214, "epoch": 78} {"train_loss": -6.196796894073486, "global_step": 13215, "epoch": 78} {"train_loss": -6.0134806632995605, "global_step": 13216, "epoch": 78} {"train_loss": -6.252745151519775, "global_step": 13217, "epoch": 78} {"train_loss": -6.214296340942383, "global_step": 13218, "epoch": 78} {"train_loss": -6.130898952484131, "global_step": 13219, "epoch": 78} {"train_loss": -6.2336812019348145, "global_step": 13220, "epoch": 78} {"train_loss": -6.128477096557617, "global_step": 13221, "epoch": 78} {"train_loss": -6.263251304626465, "global_step": 13222, "epoch": 78} {"train_loss": -6.075639724731445, "global_step": 13223, "epoch": 78} {"train_loss": -6.16346549987793, "global_step": 13224, "epoch": 78} {"train_loss": -6.226353645324707, "global_step": 13225, "epoch": 78} {"train_loss": -6.3011155128479, "global_step": 13226, "epoch": 78} {"train_loss": -6.270150184631348, "global_step": 13227, "epoch": 78} {"train_loss": -6.310745716094971, "global_step": 13228, "epoch": 78} {"train_loss": -6.345286846160889, "global_step": 13229, "epoch": 78} {"train_loss": -6.437429428100586, "global_step": 13230, "epoch": 78} {"train_loss": -6.055550575256348, "global_step": 13231, "epoch": 78} {"train_loss": -6.212320327758789, "global_step": 13232, "epoch": 78} {"train_loss": -6.4589948654174805, "global_step": 13233, "epoch": 78} {"train_loss": -6.428826332092285, "global_step": 13234, "epoch": 78} {"train_loss": -6.391008377075195, "global_step": 13235, "epoch": 78} {"train_loss": -6.142237663269043, "global_step": 13236, "epoch": 78} {"train_loss": -5.963074684143066, "global_step": 13237, "epoch": 78} {"train_loss": -5.906842231750488, "global_step": 13238, "epoch": 78} {"train_loss": -6.12106990814209, "global_step": 13239, "epoch": 78} {"train_loss": -6.257328987121582, "global_step": 13240, "epoch": 78} {"train_loss": -6.308277130126953, "global_step": 13241, "epoch": 78} {"train_loss": -5.950311183929443, "global_step": 13242, "epoch": 78} {"train_loss": -6.172387599945068, "global_step": 13243, "epoch": 78} {"train_loss": -6.0153632164001465, "global_step": 13244, "epoch": 78} {"train_loss": -6.093823432922363, "global_step": 13245, "epoch": 78} {"train_loss": -5.965351581573486, "global_step": 13246, "epoch": 78} {"train_loss": -6.026787281036377, "global_step": 13247, "epoch": 78} {"train_loss": -6.00370979309082, "global_step": 13248, "epoch": 78} {"train_loss": -6.307595252990723, "global_step": 13249, "epoch": 78} {"train_loss": -6.1852264404296875, "global_step": 13250, "epoch": 78} {"train_loss": -6.275212287902832, "global_step": 13251, "epoch": 78} {"train_loss": -5.989130973815918, "global_step": 13252, "epoch": 78} {"train_loss": -6.291550636291504, "global_step": 13253, "epoch": 78} {"train_loss": -6.1732940673828125, "global_step": 13254, "epoch": 78} {"train_loss": -6.16657018661499, "global_step": 13255, "epoch": 78} {"train_loss": -6.246277809143066, "global_step": 13256, "epoch": 78} {"train_loss": -6.166757583618164, "global_step": 13257, "epoch": 78} {"train_loss": -6.059521675109863, "global_step": 13258, "epoch": 78} {"train_loss": -6.108097076416016, "global_step": 13259, "epoch": 78} {"train_loss": -6.500453948974609, "global_step": 13260, "epoch": 78} {"train_loss": -6.345163345336914, "global_step": 13261, "epoch": 78} {"train_loss": -6.44025993347168, "global_step": 13262, "epoch": 78} {"train_loss": -6.1454644203186035, "global_step": 13263, "epoch": 78} {"train_loss": -6.232862949371338, "global_step": 13264, "epoch": 78} {"train_loss": -6.246618270874023, "global_step": 13265, "epoch": 78} {"train_loss": -6.456273078918457, "global_step": 13266, "epoch": 78} {"train_loss": -6.335852146148682, "global_step": 13267, "epoch": 78} {"train_loss": -6.122383117675781, "global_step": 13268, "epoch": 78} {"train_loss": -6.169696807861328, "global_step": 13269, "epoch": 78} {"train_loss": -6.0677947998046875, "global_step": 13270, "epoch": 78} {"train_loss": -6.144137266136351, "global_step": 13271, "epoch": 78, "val_loss": 248228.875} {"train_loss": -6.157020092010498, "global_step": 13272, "epoch": 79} {"train_loss": -6.128767013549805, "global_step": 13273, "epoch": 79} {"train_loss": -6.121116638183594, "global_step": 13274, "epoch": 79} {"train_loss": -6.011641979217529, "global_step": 13275, "epoch": 79} {"train_loss": -6.170735836029053, "global_step": 13276, "epoch": 79} {"train_loss": -5.695855140686035, "global_step": 13277, "epoch": 79} {"train_loss": -6.084691047668457, "global_step": 13278, "epoch": 79} {"train_loss": -5.9802141189575195, "global_step": 13279, "epoch": 79} {"train_loss": -5.806308269500732, "global_step": 13280, "epoch": 79} {"train_loss": -6.11822509765625, "global_step": 13281, "epoch": 79} {"train_loss": -6.08458137512207, "global_step": 13282, "epoch": 79} {"train_loss": -6.138373374938965, "global_step": 13283, "epoch": 79} {"train_loss": -6.37113094329834, "global_step": 13284, "epoch": 79} {"train_loss": -6.18983268737793, "global_step": 13285, "epoch": 79} {"train_loss": -6.254446983337402, "global_step": 13286, "epoch": 79} {"train_loss": -6.163182258605957, "global_step": 13287, "epoch": 79} {"train_loss": -6.06972599029541, "global_step": 13288, "epoch": 79} {"train_loss": -6.173144340515137, "global_step": 13289, "epoch": 79} {"train_loss": -6.130092620849609, "global_step": 13290, "epoch": 79} {"train_loss": -6.180534362792969, "global_step": 13291, "epoch": 79} {"train_loss": -6.175792694091797, "global_step": 13292, "epoch": 79} {"train_loss": -6.228067398071289, "global_step": 13293, "epoch": 79} {"train_loss": -6.123511791229248, "global_step": 13294, "epoch": 79} {"train_loss": -6.101263999938965, "global_step": 13295, "epoch": 79} {"train_loss": -6.140518665313721, "global_step": 13296, "epoch": 79} {"train_loss": -6.14378547668457, "global_step": 13297, "epoch": 79} {"train_loss": -6.2314910888671875, "global_step": 13298, "epoch": 79} {"train_loss": -5.946235656738281, "global_step": 13299, "epoch": 79} {"train_loss": -5.971895217895508, "global_step": 13300, "epoch": 79} {"train_loss": -6.033115863800049, "global_step": 13301, "epoch": 79} {"train_loss": -6.029407501220703, "global_step": 13302, "epoch": 79} {"train_loss": -6.238673210144043, "global_step": 13303, "epoch": 79} {"train_loss": -6.252460479736328, "global_step": 13304, "epoch": 79} {"train_loss": -6.022369384765625, "global_step": 13305, "epoch": 79} {"train_loss": -6.3781023025512695, "global_step": 13306, "epoch": 79} {"train_loss": -6.0956926345825195, "global_step": 13307, "epoch": 79} {"train_loss": -6.3453593254089355, "global_step": 13308, "epoch": 79} {"train_loss": -6.167365550994873, "global_step": 13309, "epoch": 79} {"train_loss": -5.9741129875183105, "global_step": 13310, "epoch": 79} {"train_loss": -6.1608147621154785, "global_step": 13311, "epoch": 79} {"train_loss": -6.098495006561279, "global_step": 13312, "epoch": 79} {"train_loss": -5.8823981285095215, "global_step": 13313, "epoch": 79} {"train_loss": -6.114157199859619, "global_step": 13314, "epoch": 79} {"train_loss": -6.038887023925781, "global_step": 13315, "epoch": 79} {"train_loss": -6.213927268981934, "global_step": 13316, "epoch": 79} {"train_loss": -6.122464179992676, "global_step": 13317, "epoch": 79} {"train_loss": -5.832831382751465, "global_step": 13318, "epoch": 79} {"train_loss": -5.88845682144165, "global_step": 13319, "epoch": 79} {"train_loss": -6.192699432373047, "global_step": 13320, "epoch": 79} {"train_loss": -5.9601826667785645, "global_step": 13321, "epoch": 79} {"train_loss": -6.034989833831787, "global_step": 13322, "epoch": 79} {"train_loss": -6.080936908721924, "global_step": 13323, "epoch": 79} {"train_loss": -5.795119285583496, "global_step": 13324, "epoch": 79} {"train_loss": -6.124233245849609, "global_step": 13325, "epoch": 79} {"train_loss": -5.700714111328125, "global_step": 13326, "epoch": 79} {"train_loss": -5.9358038902282715, "global_step": 13327, "epoch": 79} {"train_loss": -6.105626583099365, "global_step": 13328, "epoch": 79} {"train_loss": -6.09385871887207, "global_step": 13329, "epoch": 79} {"train_loss": -6.08421516418457, "global_step": 13330, "epoch": 79} {"train_loss": -6.196492671966553, "global_step": 13331, "epoch": 79} {"train_loss": -5.598810195922852, "global_step": 13332, "epoch": 79} {"train_loss": -6.158066749572754, "global_step": 13333, "epoch": 79} {"train_loss": -5.977642059326172, "global_step": 13334, "epoch": 79} {"train_loss": -6.255948066711426, "global_step": 13335, "epoch": 79} {"train_loss": -6.046674728393555, "global_step": 13336, "epoch": 79} {"train_loss": -6.011248588562012, "global_step": 13337, "epoch": 79} {"train_loss": -6.184434413909912, "global_step": 13338, "epoch": 79} {"train_loss": -5.999619483947754, "global_step": 13339, "epoch": 79} {"train_loss": -6.249484062194824, "global_step": 13340, "epoch": 79} {"train_loss": -5.844813346862793, "global_step": 13341, "epoch": 79} {"train_loss": -6.177000045776367, "global_step": 13342, "epoch": 79} {"train_loss": -5.976682186126709, "global_step": 13343, "epoch": 79} {"train_loss": -6.021055221557617, "global_step": 13344, "epoch": 79} {"train_loss": -6.14723014831543, "global_step": 13345, "epoch": 79} {"train_loss": -6.14847469329834, "global_step": 13346, "epoch": 79} {"train_loss": -6.250575542449951, "global_step": 13347, "epoch": 79} {"train_loss": -6.004316329956055, "global_step": 13348, "epoch": 79} {"train_loss": -6.095925331115723, "global_step": 13349, "epoch": 79} {"train_loss": -6.111623764038086, "global_step": 13350, "epoch": 79} {"train_loss": -6.2367401123046875, "global_step": 13351, "epoch": 79} {"train_loss": -5.834535598754883, "global_step": 13352, "epoch": 79} {"train_loss": -6.383694648742676, "global_step": 13353, "epoch": 79} {"train_loss": -6.257352828979492, "global_step": 13354, "epoch": 79} {"train_loss": -6.118102550506592, "global_step": 13355, "epoch": 79} {"train_loss": -6.3702311515808105, "global_step": 13356, "epoch": 79} {"train_loss": -6.082428932189941, "global_step": 13357, "epoch": 79} {"train_loss": -6.162708759307861, "global_step": 13358, "epoch": 79} {"train_loss": -6.189532279968262, "global_step": 13359, "epoch": 79} {"train_loss": -6.290859699249268, "global_step": 13360, "epoch": 79} {"train_loss": -6.233186721801758, "global_step": 13361, "epoch": 79} {"train_loss": -6.365335464477539, "global_step": 13362, "epoch": 79} {"train_loss": -6.188144207000732, "global_step": 13363, "epoch": 79} {"train_loss": -6.067474365234375, "global_step": 13364, "epoch": 79} {"train_loss": -6.011723518371582, "global_step": 13365, "epoch": 79} {"train_loss": -5.870418548583984, "global_step": 13366, "epoch": 79} {"train_loss": -5.782867908477783, "global_step": 13367, "epoch": 79} {"train_loss": -6.135968208312988, "global_step": 13368, "epoch": 79} {"train_loss": -6.012716770172119, "global_step": 13369, "epoch": 79} {"train_loss": -6.061002731323242, "global_step": 13370, "epoch": 79} {"train_loss": -6.058157920837402, "global_step": 13371, "epoch": 79} {"train_loss": -6.166769027709961, "global_step": 13372, "epoch": 79} {"train_loss": -6.089417934417725, "global_step": 13373, "epoch": 79} {"train_loss": -5.961997032165527, "global_step": 13374, "epoch": 79} {"train_loss": -6.103004455566406, "global_step": 13375, "epoch": 79} {"train_loss": -5.802251815795898, "global_step": 13376, "epoch": 79} {"train_loss": -6.026185989379883, "global_step": 13377, "epoch": 79} {"train_loss": -6.1033101081848145, "global_step": 13378, "epoch": 79} {"train_loss": -5.680590629577637, "global_step": 13379, "epoch": 79} {"train_loss": -6.109729766845703, "global_step": 13380, "epoch": 79} {"train_loss": -6.049130916595459, "global_step": 13381, "epoch": 79} {"train_loss": -6.140251159667969, "global_step": 13382, "epoch": 79} {"train_loss": -6.1175537109375, "global_step": 13383, "epoch": 79} {"train_loss": -6.059645652770996, "global_step": 13384, "epoch": 79} {"train_loss": -5.987093925476074, "global_step": 13385, "epoch": 79} {"train_loss": -6.24223518371582, "global_step": 13386, "epoch": 79} {"train_loss": -5.964587211608887, "global_step": 13387, "epoch": 79} {"train_loss": -6.011326789855957, "global_step": 13388, "epoch": 79} {"train_loss": -6.251854419708252, "global_step": 13389, "epoch": 79} {"train_loss": -5.977127552032471, "global_step": 13390, "epoch": 79} {"train_loss": -6.161468029022217, "global_step": 13391, "epoch": 79} {"train_loss": -6.115578651428223, "global_step": 13392, "epoch": 79} {"train_loss": -6.281658172607422, "global_step": 13393, "epoch": 79} {"train_loss": -6.088131427764893, "global_step": 13394, "epoch": 79} {"train_loss": -5.739405632019043, "global_step": 13395, "epoch": 79} {"train_loss": -6.086061954498291, "global_step": 13396, "epoch": 79} {"train_loss": -6.234159469604492, "global_step": 13397, "epoch": 79} {"train_loss": -6.107878684997559, "global_step": 13398, "epoch": 79} {"train_loss": -6.1871795654296875, "global_step": 13399, "epoch": 79} {"train_loss": -6.125189781188965, "global_step": 13400, "epoch": 79} {"train_loss": -5.941867828369141, "global_step": 13401, "epoch": 79} {"train_loss": -6.2104692459106445, "global_step": 13402, "epoch": 79} {"train_loss": -5.873723983764648, "global_step": 13403, "epoch": 79} {"train_loss": -6.040094375610352, "global_step": 13404, "epoch": 79} {"train_loss": -6.257946014404297, "global_step": 13405, "epoch": 79} {"train_loss": -5.955433368682861, "global_step": 13406, "epoch": 79} {"train_loss": -6.235509872436523, "global_step": 13407, "epoch": 79} {"train_loss": -6.10870885848999, "global_step": 13408, "epoch": 79} {"train_loss": -5.896460056304932, "global_step": 13409, "epoch": 79} {"train_loss": -6.063127517700195, "global_step": 13410, "epoch": 79} {"train_loss": -6.219524383544922, "global_step": 13411, "epoch": 79} {"train_loss": -6.175917625427246, "global_step": 13412, "epoch": 79} {"train_loss": -6.101759910583496, "global_step": 13413, "epoch": 79} {"train_loss": -5.962779998779297, "global_step": 13414, "epoch": 79} {"train_loss": -6.292737007141113, "global_step": 13415, "epoch": 79} {"train_loss": -6.251076698303223, "global_step": 13416, "epoch": 79} {"train_loss": -6.264319896697998, "global_step": 13417, "epoch": 79} {"train_loss": -6.407753944396973, "global_step": 13418, "epoch": 79} {"train_loss": -6.329160690307617, "global_step": 13419, "epoch": 79} {"train_loss": -6.251362323760986, "global_step": 13420, "epoch": 79} {"train_loss": -6.173635005950928, "global_step": 13421, "epoch": 79} {"train_loss": -5.992329120635986, "global_step": 13422, "epoch": 79} {"train_loss": -6.252409934997559, "global_step": 13423, "epoch": 79} {"train_loss": -6.406384468078613, "global_step": 13424, "epoch": 79} {"train_loss": -6.121084213256836, "global_step": 13425, "epoch": 79} {"train_loss": -6.033260345458984, "global_step": 13426, "epoch": 79} {"train_loss": -6.349841117858887, "global_step": 13427, "epoch": 79} {"train_loss": -6.321361541748047, "global_step": 13428, "epoch": 79} {"train_loss": -6.198602199554443, "global_step": 13429, "epoch": 79} {"train_loss": -6.343743801116943, "global_step": 13430, "epoch": 79} {"train_loss": -6.51133918762207, "global_step": 13431, "epoch": 79} {"train_loss": -6.146417140960693, "global_step": 13432, "epoch": 79} {"train_loss": -6.487880706787109, "global_step": 13433, "epoch": 79} {"train_loss": -6.242321014404297, "global_step": 13434, "epoch": 79} {"train_loss": -6.29261589050293, "global_step": 13435, "epoch": 79} {"train_loss": -6.303133964538574, "global_step": 13436, "epoch": 79} {"train_loss": -6.2562103271484375, "global_step": 13437, "epoch": 79} {"train_loss": -6.395620346069336, "global_step": 13438, "epoch": 79} {"train_loss": -6.112988982881818, "global_step": 13439, "epoch": 79, "val_loss": 253610.578125} {"train_loss": -6.117807865142822, "global_step": 13440, "epoch": 80} {"train_loss": -6.311669826507568, "global_step": 13441, "epoch": 80} {"train_loss": -5.996903896331787, "global_step": 13442, "epoch": 80} {"train_loss": -6.296072959899902, "global_step": 13443, "epoch": 80} {"train_loss": -6.338878154754639, "global_step": 13444, "epoch": 80} {"train_loss": -6.191437721252441, "global_step": 13445, "epoch": 80} {"train_loss": -6.38438081741333, "global_step": 13446, "epoch": 80} {"train_loss": -6.134214401245117, "global_step": 13447, "epoch": 80} {"train_loss": -6.114173889160156, "global_step": 13448, "epoch": 80} {"train_loss": -5.859879493713379, "global_step": 13449, "epoch": 80} {"train_loss": -6.26938533782959, "global_step": 13450, "epoch": 80} {"train_loss": -6.0087785720825195, "global_step": 13451, "epoch": 80} {"train_loss": -6.116620063781738, "global_step": 13452, "epoch": 80} {"train_loss": -5.977600574493408, "global_step": 13453, "epoch": 80} {"train_loss": -6.272056579589844, "global_step": 13454, "epoch": 80} {"train_loss": -6.1392130851745605, "global_step": 13455, "epoch": 80} {"train_loss": -5.9138617515563965, "global_step": 13456, "epoch": 80} {"train_loss": -6.2991838455200195, "global_step": 13457, "epoch": 80} {"train_loss": -6.258630752563477, "global_step": 13458, "epoch": 80} {"train_loss": -5.987002372741699, "global_step": 13459, "epoch": 80} {"train_loss": -6.180296897888184, "global_step": 13460, "epoch": 80} {"train_loss": -6.076037883758545, "global_step": 13461, "epoch": 80} {"train_loss": -6.278321743011475, "global_step": 13462, "epoch": 80} {"train_loss": -6.319782733917236, "global_step": 13463, "epoch": 80} {"train_loss": -5.98931884765625, "global_step": 13464, "epoch": 80} {"train_loss": -6.080905437469482, "global_step": 13465, "epoch": 80} {"train_loss": -6.2794694900512695, "global_step": 13466, "epoch": 80} {"train_loss": -6.170652389526367, "global_step": 13467, "epoch": 80} {"train_loss": -6.1026997566223145, "global_step": 13468, "epoch": 80} {"train_loss": -6.247515678405762, "global_step": 13469, "epoch": 80} {"train_loss": -6.534228324890137, "global_step": 13470, "epoch": 80} {"train_loss": -5.803361892700195, "global_step": 13471, "epoch": 80} {"train_loss": -5.967329978942871, "global_step": 13472, "epoch": 80} {"train_loss": -5.926451683044434, "global_step": 13473, "epoch": 80} {"train_loss": -5.915493011474609, "global_step": 13474, "epoch": 80} {"train_loss": -5.943630218505859, "global_step": 13475, "epoch": 80} {"train_loss": -6.079596519470215, "global_step": 13476, "epoch": 80} {"train_loss": -6.164987564086914, "global_step": 13477, "epoch": 80} {"train_loss": -6.194664001464844, "global_step": 13478, "epoch": 80} {"train_loss": -5.982085704803467, "global_step": 13479, "epoch": 80} {"train_loss": -5.89932918548584, "global_step": 13480, "epoch": 80} {"train_loss": -6.090442657470703, "global_step": 13481, "epoch": 80} {"train_loss": -6.00632381439209, "global_step": 13482, "epoch": 80} {"train_loss": -6.432854175567627, "global_step": 13483, "epoch": 80} {"train_loss": -6.140707492828369, "global_step": 13484, "epoch": 80} {"train_loss": -6.035708427429199, "global_step": 13485, "epoch": 80} {"train_loss": -6.17673397064209, "global_step": 13486, "epoch": 80} {"train_loss": -6.137470722198486, "global_step": 13487, "epoch": 80} {"train_loss": -6.240512847900391, "global_step": 13488, "epoch": 80} {"train_loss": -5.799115180969238, "global_step": 13489, "epoch": 80} {"train_loss": -6.410499572753906, "global_step": 13490, "epoch": 80} {"train_loss": -6.045753479003906, "global_step": 13491, "epoch": 80} {"train_loss": -6.277892112731934, "global_step": 13492, "epoch": 80} {"train_loss": -6.356470584869385, "global_step": 13493, "epoch": 80} {"train_loss": -6.361325263977051, "global_step": 13494, "epoch": 80} {"train_loss": -6.179096221923828, "global_step": 13495, "epoch": 80} {"train_loss": -6.284989356994629, "global_step": 13496, "epoch": 80} {"train_loss": -6.368200302124023, "global_step": 13497, "epoch": 80} {"train_loss": -6.111627578735352, "global_step": 13498, "epoch": 80} {"train_loss": -6.268184661865234, "global_step": 13499, "epoch": 80} {"train_loss": -6.33115291595459, "global_step": 13500, "epoch": 80} {"train_loss": -6.010124206542969, "global_step": 13501, "epoch": 80} {"train_loss": -6.124266147613525, "global_step": 13502, "epoch": 80} {"train_loss": -6.210378646850586, "global_step": 13503, "epoch": 80} {"train_loss": -6.135608673095703, "global_step": 13504, "epoch": 80} {"train_loss": -5.941196441650391, "global_step": 13505, "epoch": 80} {"train_loss": -5.760519504547119, "global_step": 13506, "epoch": 80} {"train_loss": -6.10943603515625, "global_step": 13507, "epoch": 80} {"train_loss": -6.238920211791992, "global_step": 13508, "epoch": 80} {"train_loss": -6.031777858734131, "global_step": 13509, "epoch": 80} {"train_loss": -5.889008045196533, "global_step": 13510, "epoch": 80} {"train_loss": -5.941666603088379, "global_step": 13511, "epoch": 80} {"train_loss": -6.113320827484131, "global_step": 13512, "epoch": 80} {"train_loss": -6.1814374923706055, "global_step": 13513, "epoch": 80} {"train_loss": -5.912647724151611, "global_step": 13514, "epoch": 80} {"train_loss": -6.132956504821777, "global_step": 13515, "epoch": 80} {"train_loss": -5.801382064819336, "global_step": 13516, "epoch": 80} {"train_loss": -5.9781904220581055, "global_step": 13517, "epoch": 80} {"train_loss": -6.172610759735107, "global_step": 13518, "epoch": 80} {"train_loss": -5.8766374588012695, "global_step": 13519, "epoch": 80} {"train_loss": -6.069180011749268, "global_step": 13520, "epoch": 80} {"train_loss": -6.23142671585083, "global_step": 13521, "epoch": 80} {"train_loss": -6.156035423278809, "global_step": 13522, "epoch": 80} {"train_loss": -6.307957649230957, "global_step": 13523, "epoch": 80} {"train_loss": -6.388162612915039, "global_step": 13524, "epoch": 80} {"train_loss": -6.314860820770264, "global_step": 13525, "epoch": 80} {"train_loss": -6.327811241149902, "global_step": 13526, "epoch": 80} {"train_loss": -6.088884353637695, "global_step": 13527, "epoch": 80} {"train_loss": -6.298285961151123, "global_step": 13528, "epoch": 80} {"train_loss": -6.469315528869629, "global_step": 13529, "epoch": 80} {"train_loss": -6.227621555328369, "global_step": 13530, "epoch": 80} {"train_loss": -6.354523658752441, "global_step": 13531, "epoch": 80} {"train_loss": -6.146055221557617, "global_step": 13532, "epoch": 80} {"train_loss": -6.317612648010254, "global_step": 13533, "epoch": 80} {"train_loss": -6.256348609924316, "global_step": 13534, "epoch": 80} {"train_loss": -6.287760257720947, "global_step": 13535, "epoch": 80} {"train_loss": -6.240601539611816, "global_step": 13536, "epoch": 80} {"train_loss": -6.148038864135742, "global_step": 13537, "epoch": 80} {"train_loss": -6.137415885925293, "global_step": 13538, "epoch": 80} {"train_loss": -6.21347188949585, "global_step": 13539, "epoch": 80} {"train_loss": -5.971343040466309, "global_step": 13540, "epoch": 80} {"train_loss": -6.20796012878418, "global_step": 13541, "epoch": 80} {"train_loss": -5.917112350463867, "global_step": 13542, "epoch": 80} {"train_loss": -6.185946464538574, "global_step": 13543, "epoch": 80} {"train_loss": -6.029425621032715, "global_step": 13544, "epoch": 80} {"train_loss": -6.191091060638428, "global_step": 13545, "epoch": 80} {"train_loss": -5.963201999664307, "global_step": 13546, "epoch": 80} {"train_loss": -5.79538106918335, "global_step": 13547, "epoch": 80} {"train_loss": -6.084889888763428, "global_step": 13548, "epoch": 80} {"train_loss": -6.009026527404785, "global_step": 13549, "epoch": 80} {"train_loss": -5.9106950759887695, "global_step": 13550, "epoch": 80} {"train_loss": -6.269745826721191, "global_step": 13551, "epoch": 80} {"train_loss": -6.068888187408447, "global_step": 13552, "epoch": 80} {"train_loss": -5.977059364318848, "global_step": 13553, "epoch": 80} {"train_loss": -6.133970260620117, "global_step": 13554, "epoch": 80} {"train_loss": -5.929366111755371, "global_step": 13555, "epoch": 80} {"train_loss": -5.76621150970459, "global_step": 13556, "epoch": 80} {"train_loss": -5.957798957824707, "global_step": 13557, "epoch": 80} {"train_loss": -6.132967948913574, "global_step": 13558, "epoch": 80} {"train_loss": -6.092385292053223, "global_step": 13559, "epoch": 80} {"train_loss": -5.992271900177002, "global_step": 13560, "epoch": 80} {"train_loss": -5.920849800109863, "global_step": 13561, "epoch": 80} {"train_loss": -6.148344993591309, "global_step": 13562, "epoch": 80} {"train_loss": -6.074369430541992, "global_step": 13563, "epoch": 80} {"train_loss": -6.323184013366699, "global_step": 13564, "epoch": 80} {"train_loss": -6.0904541015625, "global_step": 13565, "epoch": 80} {"train_loss": -6.080728530883789, "global_step": 13566, "epoch": 80} {"train_loss": -5.957824230194092, "global_step": 13567, "epoch": 80} {"train_loss": -5.931388854980469, "global_step": 13568, "epoch": 80} {"train_loss": -6.397820472717285, "global_step": 13569, "epoch": 80} {"train_loss": -5.698654651641846, "global_step": 13570, "epoch": 80} {"train_loss": -6.347451210021973, "global_step": 13571, "epoch": 80} {"train_loss": -6.129321098327637, "global_step": 13572, "epoch": 80} {"train_loss": -6.207867622375488, "global_step": 13573, "epoch": 80} {"train_loss": -5.991368293762207, "global_step": 13574, "epoch": 80} {"train_loss": -6.128078937530518, "global_step": 13575, "epoch": 80} {"train_loss": -5.904627799987793, "global_step": 13576, "epoch": 80} {"train_loss": -6.0700531005859375, "global_step": 13577, "epoch": 80} {"train_loss": -6.104037284851074, "global_step": 13578, "epoch": 80} {"train_loss": -5.986398220062256, "global_step": 13579, "epoch": 80} {"train_loss": -6.3124284744262695, "global_step": 13580, "epoch": 80} {"train_loss": -6.191578388214111, "global_step": 13581, "epoch": 80} {"train_loss": -6.092367172241211, "global_step": 13582, "epoch": 80} {"train_loss": -6.039055824279785, "global_step": 13583, "epoch": 80} {"train_loss": -6.1224365234375, "global_step": 13584, "epoch": 80} {"train_loss": -5.952689170837402, "global_step": 13585, "epoch": 80} {"train_loss": -6.301961421966553, "global_step": 13586, "epoch": 80} {"train_loss": -6.385141372680664, "global_step": 13587, "epoch": 80} {"train_loss": -6.063983917236328, "global_step": 13588, "epoch": 80} {"train_loss": -6.418259143829346, "global_step": 13589, "epoch": 80} {"train_loss": -6.1822614669799805, "global_step": 13590, "epoch": 80} {"train_loss": -6.444088935852051, "global_step": 13591, "epoch": 80} {"train_loss": -6.491150856018066, "global_step": 13592, "epoch": 80} {"train_loss": -6.221894264221191, "global_step": 13593, "epoch": 80} {"train_loss": -6.402632713317871, "global_step": 13594, "epoch": 80} {"train_loss": -6.437039375305176, "global_step": 13595, "epoch": 80} {"train_loss": -6.251579284667969, "global_step": 13596, "epoch": 80} {"train_loss": -6.413789749145508, "global_step": 13597, "epoch": 80} {"train_loss": -6.252338409423828, "global_step": 13598, "epoch": 80} {"train_loss": -6.386954307556152, "global_step": 13599, "epoch": 80} {"train_loss": -6.184171676635742, "global_step": 13600, "epoch": 80} {"train_loss": -6.455934524536133, "global_step": 13601, "epoch": 80} {"train_loss": -5.919899940490723, "global_step": 13602, "epoch": 80} {"train_loss": -6.290007591247559, "global_step": 13603, "epoch": 80} {"train_loss": -6.318381309509277, "global_step": 13604, "epoch": 80} {"train_loss": -6.006260871887207, "global_step": 13605, "epoch": 80} {"train_loss": -6.148872375488281, "global_step": 13606, "epoch": 80} {"train_loss": -6.142066424801236, "global_step": 13607, "epoch": 80, "val_loss": 249615.5, "train_action_mse_error": 48.69568634033203} {"train_loss": -5.931225776672363, "global_step": 13608, "epoch": 81} {"train_loss": -6.0040178298950195, "global_step": 13609, "epoch": 81} {"train_loss": -5.924093246459961, "global_step": 13610, "epoch": 81} {"train_loss": -5.904940128326416, "global_step": 13611, "epoch": 81} {"train_loss": -6.013278961181641, "global_step": 13612, "epoch": 81} {"train_loss": -6.010776519775391, "global_step": 13613, "epoch": 81} {"train_loss": -6.158056259155273, "global_step": 13614, "epoch": 81} {"train_loss": -6.1403489112854, "global_step": 13615, "epoch": 81} {"train_loss": -6.293465614318848, "global_step": 13616, "epoch": 81} {"train_loss": -5.862616062164307, "global_step": 13617, "epoch": 81} {"train_loss": -6.098915100097656, "global_step": 13618, "epoch": 81} {"train_loss": -5.939556121826172, "global_step": 13619, "epoch": 81} {"train_loss": -6.208217620849609, "global_step": 13620, "epoch": 81} {"train_loss": -6.275145530700684, "global_step": 13621, "epoch": 81} {"train_loss": -6.022200107574463, "global_step": 13622, "epoch": 81} {"train_loss": -5.916698455810547, "global_step": 13623, "epoch": 81} {"train_loss": -5.869230270385742, "global_step": 13624, "epoch": 81} {"train_loss": -6.140618324279785, "global_step": 13625, "epoch": 81} {"train_loss": -6.116976737976074, "global_step": 13626, "epoch": 81} {"train_loss": -6.089350700378418, "global_step": 13627, "epoch": 81} {"train_loss": -6.430251121520996, "global_step": 13628, "epoch": 81} {"train_loss": -6.110213279724121, "global_step": 13629, "epoch": 81} {"train_loss": -6.21754789352417, "global_step": 13630, "epoch": 81} {"train_loss": -5.919283390045166, "global_step": 13631, "epoch": 81} {"train_loss": -6.263808727264404, "global_step": 13632, "epoch": 81} {"train_loss": -6.200394630432129, "global_step": 13633, "epoch": 81} {"train_loss": -6.194549560546875, "global_step": 13634, "epoch": 81} {"train_loss": -6.126166343688965, "global_step": 13635, "epoch": 81} {"train_loss": -6.406235694885254, "global_step": 13636, "epoch": 81} {"train_loss": -6.442566394805908, "global_step": 13637, "epoch": 81} {"train_loss": -6.297015190124512, "global_step": 13638, "epoch": 81} {"train_loss": -6.146878719329834, "global_step": 13639, "epoch": 81} {"train_loss": -6.348113059997559, "global_step": 13640, "epoch": 81} {"train_loss": -6.4820709228515625, "global_step": 13641, "epoch": 81} {"train_loss": -6.253014087677002, "global_step": 13642, "epoch": 81} {"train_loss": -6.409976005554199, "global_step": 13643, "epoch": 81} {"train_loss": -6.4816460609436035, "global_step": 13644, "epoch": 81} {"train_loss": -6.388607025146484, "global_step": 13645, "epoch": 81} {"train_loss": -6.481202125549316, "global_step": 13646, "epoch": 81} {"train_loss": -6.426994800567627, "global_step": 13647, "epoch": 81} {"train_loss": -6.356651306152344, "global_step": 13648, "epoch": 81} {"train_loss": -6.452840805053711, "global_step": 13649, "epoch": 81} {"train_loss": -6.120991230010986, "global_step": 13650, "epoch": 81} {"train_loss": -6.341639518737793, "global_step": 13651, "epoch": 81} {"train_loss": -6.21507453918457, "global_step": 13652, "epoch": 81} {"train_loss": -6.503187656402588, "global_step": 13653, "epoch": 81} {"train_loss": -6.090936660766602, "global_step": 13654, "epoch": 81} {"train_loss": -6.382538795471191, "global_step": 13655, "epoch": 81} {"train_loss": -6.032909393310547, "global_step": 13656, "epoch": 81} {"train_loss": -6.1042890548706055, "global_step": 13657, "epoch": 81} {"train_loss": -6.293326377868652, "global_step": 13658, "epoch": 81} {"train_loss": -6.238585948944092, "global_step": 13659, "epoch": 81} {"train_loss": -6.225665092468262, "global_step": 13660, "epoch": 81} {"train_loss": -6.262400150299072, "global_step": 13661, "epoch": 81} {"train_loss": -6.135016441345215, "global_step": 13662, "epoch": 81} {"train_loss": -5.953299045562744, "global_step": 13663, "epoch": 81} {"train_loss": -6.074891090393066, "global_step": 13664, "epoch": 81} {"train_loss": -6.022585391998291, "global_step": 13665, "epoch": 81} {"train_loss": -6.380000114440918, "global_step": 13666, "epoch": 81} {"train_loss": -6.30831241607666, "global_step": 13667, "epoch": 81} {"train_loss": -6.186017990112305, "global_step": 13668, "epoch": 81} {"train_loss": -5.987949371337891, "global_step": 13669, "epoch": 81} {"train_loss": -6.138863563537598, "global_step": 13670, "epoch": 81} {"train_loss": -6.134984970092773, "global_step": 13671, "epoch": 81} {"train_loss": -6.210186958312988, "global_step": 13672, "epoch": 81} {"train_loss": -6.350530624389648, "global_step": 13673, "epoch": 81} {"train_loss": -6.201228618621826, "global_step": 13674, "epoch": 81} {"train_loss": -6.161250114440918, "global_step": 13675, "epoch": 81} {"train_loss": -6.327302932739258, "global_step": 13676, "epoch": 81} {"train_loss": -6.217792510986328, "global_step": 13677, "epoch": 81} {"train_loss": -6.320310592651367, "global_step": 13678, "epoch": 81} {"train_loss": -5.791154861450195, "global_step": 13679, "epoch": 81} {"train_loss": -5.975030422210693, "global_step": 13680, "epoch": 81} {"train_loss": -6.106773376464844, "global_step": 13681, "epoch": 81} {"train_loss": -6.037784576416016, "global_step": 13682, "epoch": 81} {"train_loss": -5.767368793487549, "global_step": 13683, "epoch": 81} {"train_loss": -6.055339813232422, "global_step": 13684, "epoch": 81} {"train_loss": -6.251096248626709, "global_step": 13685, "epoch": 81} {"train_loss": -6.17754602432251, "global_step": 13686, "epoch": 81} {"train_loss": -6.080333709716797, "global_step": 13687, "epoch": 81} {"train_loss": -6.106620788574219, "global_step": 13688, "epoch": 81} {"train_loss": -6.086524963378906, "global_step": 13689, "epoch": 81} {"train_loss": -6.375293731689453, "global_step": 13690, "epoch": 81} {"train_loss": -6.305965900421143, "global_step": 13691, "epoch": 81} {"train_loss": -6.3483076095581055, "global_step": 13692, "epoch": 81} {"train_loss": -6.46938419342041, "global_step": 13693, "epoch": 81} {"train_loss": -6.368818283081055, "global_step": 13694, "epoch": 81} {"train_loss": -6.387540817260742, "global_step": 13695, "epoch": 81} {"train_loss": -6.2552361488342285, "global_step": 13696, "epoch": 81} {"train_loss": -6.386011123657227, "global_step": 13697, "epoch": 81} {"train_loss": -6.194149017333984, "global_step": 13698, "epoch": 81} {"train_loss": -6.369793891906738, "global_step": 13699, "epoch": 81} {"train_loss": -6.281927108764648, "global_step": 13700, "epoch": 81} {"train_loss": -6.3374528884887695, "global_step": 13701, "epoch": 81} {"train_loss": -6.00484561920166, "global_step": 13702, "epoch": 81} {"train_loss": -6.6353983879089355, "global_step": 13703, "epoch": 81} {"train_loss": -6.241696357727051, "global_step": 13704, "epoch": 81} {"train_loss": -6.346301078796387, "global_step": 13705, "epoch": 81} {"train_loss": -6.268181324005127, "global_step": 13706, "epoch": 81} {"train_loss": -6.157580375671387, "global_step": 13707, "epoch": 81} {"train_loss": -5.743795871734619, "global_step": 13708, "epoch": 81} {"train_loss": -6.168663024902344, "global_step": 13709, "epoch": 81} {"train_loss": -6.024590492248535, "global_step": 13710, "epoch": 81} {"train_loss": -6.3554887771606445, "global_step": 13711, "epoch": 81} {"train_loss": -6.005795478820801, "global_step": 13712, "epoch": 81} {"train_loss": -5.944188117980957, "global_step": 13713, "epoch": 81} {"train_loss": -6.209192752838135, "global_step": 13714, "epoch": 81} {"train_loss": -6.136999607086182, "global_step": 13715, "epoch": 81} {"train_loss": -6.054782390594482, "global_step": 13716, "epoch": 81} {"train_loss": -5.999291896820068, "global_step": 13717, "epoch": 81} {"train_loss": -6.1756439208984375, "global_step": 13718, "epoch": 81} {"train_loss": -6.223014831542969, "global_step": 13719, "epoch": 81} {"train_loss": -6.141203880310059, "global_step": 13720, "epoch": 81} {"train_loss": -5.799380302429199, "global_step": 13721, "epoch": 81} {"train_loss": -6.067800521850586, "global_step": 13722, "epoch": 81} {"train_loss": -6.379321575164795, "global_step": 13723, "epoch": 81} {"train_loss": -6.143194198608398, "global_step": 13724, "epoch": 81} {"train_loss": -6.201841354370117, "global_step": 13725, "epoch": 81} {"train_loss": -6.053049087524414, "global_step": 13726, "epoch": 81} {"train_loss": -5.8404741287231445, "global_step": 13727, "epoch": 81} {"train_loss": -6.276092529296875, "global_step": 13728, "epoch": 81} {"train_loss": -5.509940147399902, "global_step": 13729, "epoch": 81} {"train_loss": -6.018747329711914, "global_step": 13730, "epoch": 81} {"train_loss": -5.840198516845703, "global_step": 13731, "epoch": 81} {"train_loss": -6.278094291687012, "global_step": 13732, "epoch": 81} {"train_loss": -5.945955276489258, "global_step": 13733, "epoch": 81} {"train_loss": -6.020364761352539, "global_step": 13734, "epoch": 81} {"train_loss": -5.958005905151367, "global_step": 13735, "epoch": 81} {"train_loss": -6.2497639656066895, "global_step": 13736, "epoch": 81} {"train_loss": -6.056819915771484, "global_step": 13737, "epoch": 81} {"train_loss": -6.169401168823242, "global_step": 13738, "epoch": 81} {"train_loss": -6.231029510498047, "global_step": 13739, "epoch": 81} {"train_loss": -6.263844013214111, "global_step": 13740, "epoch": 81} {"train_loss": -6.377066612243652, "global_step": 13741, "epoch": 81} {"train_loss": -6.108361721038818, "global_step": 13742, "epoch": 81} {"train_loss": -6.369688987731934, "global_step": 13743, "epoch": 81} {"train_loss": -6.451096534729004, "global_step": 13744, "epoch": 81} {"train_loss": -6.153227806091309, "global_step": 13745, "epoch": 81} {"train_loss": -6.248759746551514, "global_step": 13746, "epoch": 81} {"train_loss": -6.367678642272949, "global_step": 13747, "epoch": 81} {"train_loss": -6.0693840980529785, "global_step": 13748, "epoch": 81} {"train_loss": -6.224034309387207, "global_step": 13749, "epoch": 81} {"train_loss": -6.181279182434082, "global_step": 13750, "epoch": 81} {"train_loss": -6.429470062255859, "global_step": 13751, "epoch": 81} {"train_loss": -6.220869541168213, "global_step": 13752, "epoch": 81} {"train_loss": -6.181293487548828, "global_step": 13753, "epoch": 81} {"train_loss": -6.3721160888671875, "global_step": 13754, "epoch": 81} {"train_loss": -6.238069534301758, "global_step": 13755, "epoch": 81} {"train_loss": -6.394312858581543, "global_step": 13756, "epoch": 81} {"train_loss": -6.10816764831543, "global_step": 13757, "epoch": 81} {"train_loss": -6.252742290496826, "global_step": 13758, "epoch": 81} {"train_loss": -6.0762481689453125, "global_step": 13759, "epoch": 81} {"train_loss": -6.281723976135254, "global_step": 13760, "epoch": 81} {"train_loss": -6.250995635986328, "global_step": 13761, "epoch": 81} {"train_loss": -6.199411392211914, "global_step": 13762, "epoch": 81} {"train_loss": -6.13139009475708, "global_step": 13763, "epoch": 81} {"train_loss": -6.242650985717773, "global_step": 13764, "epoch": 81} {"train_loss": -6.337305068969727, "global_step": 13765, "epoch": 81} {"train_loss": -6.2225446701049805, "global_step": 13766, "epoch": 81} {"train_loss": -6.339256286621094, "global_step": 13767, "epoch": 81} {"train_loss": -6.054797172546387, "global_step": 13768, "epoch": 81} {"train_loss": -6.01884126663208, "global_step": 13769, "epoch": 81} {"train_loss": -5.9350385665893555, "global_step": 13770, "epoch": 81} {"train_loss": -6.139222621917725, "global_step": 13771, "epoch": 81} {"train_loss": -6.030402183532715, "global_step": 13772, "epoch": 81} {"train_loss": -6.299536228179932, "global_step": 13773, "epoch": 81} {"train_loss": -6.243513107299805, "global_step": 13774, "epoch": 81} {"train_loss": -6.180749010472071, "global_step": 13775, "epoch": 81, "val_loss": 245897.53125} {"train_loss": -6.251537799835205, "global_step": 13776, "epoch": 82} {"train_loss": -6.248659610748291, "global_step": 13777, "epoch": 82} {"train_loss": -6.301765441894531, "global_step": 13778, "epoch": 82} {"train_loss": -6.273101806640625, "global_step": 13779, "epoch": 82} {"train_loss": -6.09629487991333, "global_step": 13780, "epoch": 82} {"train_loss": -6.272741317749023, "global_step": 13781, "epoch": 82} {"train_loss": -6.455006122589111, "global_step": 13782, "epoch": 82} {"train_loss": -6.191705703735352, "global_step": 13783, "epoch": 82} {"train_loss": -6.222637176513672, "global_step": 13784, "epoch": 82} {"train_loss": -6.329172134399414, "global_step": 13785, "epoch": 82} {"train_loss": -6.37204647064209, "global_step": 13786, "epoch": 82} {"train_loss": -6.142533302307129, "global_step": 13787, "epoch": 82} {"train_loss": -6.2320780754089355, "global_step": 13788, "epoch": 82} {"train_loss": -6.168680667877197, "global_step": 13789, "epoch": 82} {"train_loss": -6.256555557250977, "global_step": 13790, "epoch": 82} {"train_loss": -6.31343412399292, "global_step": 13791, "epoch": 82} {"train_loss": -6.146048545837402, "global_step": 13792, "epoch": 82} {"train_loss": -6.4112043380737305, "global_step": 13793, "epoch": 82} {"train_loss": -6.313904285430908, "global_step": 13794, "epoch": 82} {"train_loss": -6.478010177612305, "global_step": 13795, "epoch": 82} {"train_loss": -6.359292984008789, "global_step": 13796, "epoch": 82} {"train_loss": -6.408236503601074, "global_step": 13797, "epoch": 82} {"train_loss": -6.227705955505371, "global_step": 13798, "epoch": 82} {"train_loss": -6.21189022064209, "global_step": 13799, "epoch": 82} {"train_loss": -6.565242290496826, "global_step": 13800, "epoch": 82} {"train_loss": -6.320504665374756, "global_step": 13801, "epoch": 82} {"train_loss": -6.469927787780762, "global_step": 13802, "epoch": 82} {"train_loss": -6.227275371551514, "global_step": 13803, "epoch": 82} {"train_loss": -6.215660095214844, "global_step": 13804, "epoch": 82} {"train_loss": -6.377448081970215, "global_step": 13805, "epoch": 82} {"train_loss": -6.572744369506836, "global_step": 13806, "epoch": 82} {"train_loss": -6.110700607299805, "global_step": 13807, "epoch": 82} {"train_loss": -6.213684558868408, "global_step": 13808, "epoch": 82} {"train_loss": -6.425281047821045, "global_step": 13809, "epoch": 82} {"train_loss": -6.263461112976074, "global_step": 13810, "epoch": 82} {"train_loss": -6.322844505310059, "global_step": 13811, "epoch": 82} {"train_loss": -6.3079376220703125, "global_step": 13812, "epoch": 82} {"train_loss": -6.422121524810791, "global_step": 13813, "epoch": 82} {"train_loss": -6.461655616760254, "global_step": 13814, "epoch": 82} {"train_loss": -5.974781036376953, "global_step": 13815, "epoch": 82} {"train_loss": -6.158629894256592, "global_step": 13816, "epoch": 82} {"train_loss": -6.3231706619262695, "global_step": 13817, "epoch": 82} {"train_loss": -6.230084419250488, "global_step": 13818, "epoch": 82} {"train_loss": -6.2995805740356445, "global_step": 13819, "epoch": 82} {"train_loss": -6.164850234985352, "global_step": 13820, "epoch": 82} {"train_loss": -6.363547325134277, "global_step": 13821, "epoch": 82} {"train_loss": -6.53940486907959, "global_step": 13822, "epoch": 82} {"train_loss": -6.457416534423828, "global_step": 13823, "epoch": 82} {"train_loss": -6.509394645690918, "global_step": 13824, "epoch": 82} {"train_loss": -6.328606605529785, "global_step": 13825, "epoch": 82} {"train_loss": -6.309972286224365, "global_step": 13826, "epoch": 82} {"train_loss": -6.255849838256836, "global_step": 13827, "epoch": 82} {"train_loss": -6.346432685852051, "global_step": 13828, "epoch": 82} {"train_loss": -6.084739685058594, "global_step": 13829, "epoch": 82} {"train_loss": -6.272808074951172, "global_step": 13830, "epoch": 82} {"train_loss": -6.235324859619141, "global_step": 13831, "epoch": 82} {"train_loss": -6.17924690246582, "global_step": 13832, "epoch": 82} {"train_loss": -6.219749450683594, "global_step": 13833, "epoch": 82} {"train_loss": -6.280753135681152, "global_step": 13834, "epoch": 82} {"train_loss": -6.452253341674805, "global_step": 13835, "epoch": 82} {"train_loss": -6.1128950119018555, "global_step": 13836, "epoch": 82} {"train_loss": -6.250907897949219, "global_step": 13837, "epoch": 82} {"train_loss": -6.253413200378418, "global_step": 13838, "epoch": 82} {"train_loss": -6.341222763061523, "global_step": 13839, "epoch": 82} {"train_loss": -6.034510612487793, "global_step": 13840, "epoch": 82} {"train_loss": -6.0059309005737305, "global_step": 13841, "epoch": 82} {"train_loss": -6.08309268951416, "global_step": 13842, "epoch": 82} {"train_loss": -6.264560699462891, "global_step": 13843, "epoch": 82} {"train_loss": -6.294513702392578, "global_step": 13844, "epoch": 82} {"train_loss": -5.998831748962402, "global_step": 13845, "epoch": 82} {"train_loss": -6.255555152893066, "global_step": 13846, "epoch": 82} {"train_loss": -6.104714393615723, "global_step": 13847, "epoch": 82} {"train_loss": -6.316760063171387, "global_step": 13848, "epoch": 82} {"train_loss": -6.372730731964111, "global_step": 13849, "epoch": 82} {"train_loss": -6.419822692871094, "global_step": 13850, "epoch": 82} {"train_loss": -6.326387405395508, "global_step": 13851, "epoch": 82} {"train_loss": -6.280163764953613, "global_step": 13852, "epoch": 82} {"train_loss": -6.241754531860352, "global_step": 13853, "epoch": 82} {"train_loss": -6.06425666809082, "global_step": 13854, "epoch": 82} {"train_loss": -6.453006267547607, "global_step": 13855, "epoch": 82} {"train_loss": -6.222056865692139, "global_step": 13856, "epoch": 82} {"train_loss": -6.4921159744262695, "global_step": 13857, "epoch": 82} {"train_loss": -6.383944511413574, "global_step": 13858, "epoch": 82} {"train_loss": -6.134842395782471, "global_step": 13859, "epoch": 82} {"train_loss": -6.164839744567871, "global_step": 13860, "epoch": 82} {"train_loss": -6.414614200592041, "global_step": 13861, "epoch": 82} {"train_loss": -6.277191162109375, "global_step": 13862, "epoch": 82} {"train_loss": -6.123414039611816, "global_step": 13863, "epoch": 82} {"train_loss": -6.248572826385498, "global_step": 13864, "epoch": 82} {"train_loss": -6.032055854797363, "global_step": 13865, "epoch": 82} {"train_loss": -6.294255256652832, "global_step": 13866, "epoch": 82} {"train_loss": -6.349367141723633, "global_step": 13867, "epoch": 82} {"train_loss": -6.323009014129639, "global_step": 13868, "epoch": 82} {"train_loss": -6.353429794311523, "global_step": 13869, "epoch": 82} {"train_loss": -6.358962059020996, "global_step": 13870, "epoch": 82} {"train_loss": -6.346090316772461, "global_step": 13871, "epoch": 82} {"train_loss": -6.403906345367432, "global_step": 13872, "epoch": 82} {"train_loss": -6.275753021240234, "global_step": 13873, "epoch": 82} {"train_loss": -6.394225120544434, "global_step": 13874, "epoch": 82} {"train_loss": -6.064457893371582, "global_step": 13875, "epoch": 82} {"train_loss": -6.344987392425537, "global_step": 13876, "epoch": 82} {"train_loss": -6.264162063598633, "global_step": 13877, "epoch": 82} {"train_loss": -6.078478813171387, "global_step": 13878, "epoch": 82} {"train_loss": -6.3978095054626465, "global_step": 13879, "epoch": 82} {"train_loss": -5.8850579261779785, "global_step": 13880, "epoch": 82} {"train_loss": -6.330051898956299, "global_step": 13881, "epoch": 82} {"train_loss": -5.993327617645264, "global_step": 13882, "epoch": 82} {"train_loss": -6.200413227081299, "global_step": 13883, "epoch": 82} {"train_loss": -6.041690826416016, "global_step": 13884, "epoch": 82} {"train_loss": -6.180731296539307, "global_step": 13885, "epoch": 82} {"train_loss": -6.371535301208496, "global_step": 13886, "epoch": 82} {"train_loss": -6.163858413696289, "global_step": 13887, "epoch": 82} {"train_loss": -6.119294166564941, "global_step": 13888, "epoch": 82} {"train_loss": -6.167663097381592, "global_step": 13889, "epoch": 82} {"train_loss": -6.448436737060547, "global_step": 13890, "epoch": 82} {"train_loss": -6.060783386230469, "global_step": 13891, "epoch": 82} {"train_loss": -6.347905158996582, "global_step": 13892, "epoch": 82} {"train_loss": -6.25787878036499, "global_step": 13893, "epoch": 82} {"train_loss": -6.0879292488098145, "global_step": 13894, "epoch": 82} {"train_loss": -6.1865925788879395, "global_step": 13895, "epoch": 82} {"train_loss": -6.287057876586914, "global_step": 13896, "epoch": 82} {"train_loss": -6.243486404418945, "global_step": 13897, "epoch": 82} {"train_loss": -6.352689743041992, "global_step": 13898, "epoch": 82} {"train_loss": -6.3212080001831055, "global_step": 13899, "epoch": 82} {"train_loss": -6.2824859619140625, "global_step": 13900, "epoch": 82} {"train_loss": -6.551053524017334, "global_step": 13901, "epoch": 82} {"train_loss": -5.812056541442871, "global_step": 13902, "epoch": 82} {"train_loss": -6.428648948669434, "global_step": 13903, "epoch": 82} {"train_loss": -6.108552932739258, "global_step": 13904, "epoch": 82} {"train_loss": -6.310172080993652, "global_step": 13905, "epoch": 82} {"train_loss": -6.205334663391113, "global_step": 13906, "epoch": 82} {"train_loss": -6.220767021179199, "global_step": 13907, "epoch": 82} {"train_loss": -6.207851409912109, "global_step": 13908, "epoch": 82} {"train_loss": -5.884140968322754, "global_step": 13909, "epoch": 82} {"train_loss": -6.209779262542725, "global_step": 13910, "epoch": 82} {"train_loss": -6.127435207366943, "global_step": 13911, "epoch": 82} {"train_loss": -5.98378324508667, "global_step": 13912, "epoch": 82} {"train_loss": -6.1286773681640625, "global_step": 13913, "epoch": 82} {"train_loss": -6.273384094238281, "global_step": 13914, "epoch": 82} {"train_loss": -5.759916305541992, "global_step": 13915, "epoch": 82} {"train_loss": -6.2781572341918945, "global_step": 13916, "epoch": 82} {"train_loss": -6.316706657409668, "global_step": 13917, "epoch": 82} {"train_loss": -6.113739967346191, "global_step": 13918, "epoch": 82} {"train_loss": -6.073845863342285, "global_step": 13919, "epoch": 82} {"train_loss": -5.907406806945801, "global_step": 13920, "epoch": 82} {"train_loss": -6.27289342880249, "global_step": 13921, "epoch": 82} {"train_loss": -5.942416667938232, "global_step": 13922, "epoch": 82} {"train_loss": -6.28190279006958, "global_step": 13923, "epoch": 82} {"train_loss": -5.984320640563965, "global_step": 13924, "epoch": 82} {"train_loss": -6.1499457359313965, "global_step": 13925, "epoch": 82} {"train_loss": -6.104303359985352, "global_step": 13926, "epoch": 82} {"train_loss": -6.218069076538086, "global_step": 13927, "epoch": 82} {"train_loss": -6.157250881195068, "global_step": 13928, "epoch": 82} {"train_loss": -6.023005485534668, "global_step": 13929, "epoch": 82} {"train_loss": -6.30417537689209, "global_step": 13930, "epoch": 82} {"train_loss": -6.139886379241943, "global_step": 13931, "epoch": 82} {"train_loss": -6.216237545013428, "global_step": 13932, "epoch": 82} {"train_loss": -6.206210613250732, "global_step": 13933, "epoch": 82} {"train_loss": -6.253207206726074, "global_step": 13934, "epoch": 82} {"train_loss": -5.940485000610352, "global_step": 13935, "epoch": 82} {"train_loss": -6.194673538208008, "global_step": 13936, "epoch": 82} {"train_loss": -5.888808727264404, "global_step": 13937, "epoch": 82} {"train_loss": -5.949799537658691, "global_step": 13938, "epoch": 82} {"train_loss": -6.18243408203125, "global_step": 13939, "epoch": 82} {"train_loss": -6.123045921325684, "global_step": 13940, "epoch": 82} {"train_loss": -6.122246265411377, "global_step": 13941, "epoch": 82} {"train_loss": -6.058772087097168, "global_step": 13942, "epoch": 82} {"train_loss": -6.2348857919375105, "global_step": 13943, "epoch": 82, "val_loss": 246203.453125} {"train_loss": -6.261482238769531, "global_step": 13944, "epoch": 83} {"train_loss": -6.228855133056641, "global_step": 13945, "epoch": 83} {"train_loss": -5.889989852905273, "global_step": 13946, "epoch": 83} {"train_loss": -6.070209503173828, "global_step": 13947, "epoch": 83} {"train_loss": -6.128962993621826, "global_step": 13948, "epoch": 83} {"train_loss": -6.036844253540039, "global_step": 13949, "epoch": 83} {"train_loss": -6.308297634124756, "global_step": 13950, "epoch": 83} {"train_loss": -5.984822750091553, "global_step": 13951, "epoch": 83} {"train_loss": -6.167749404907227, "global_step": 13952, "epoch": 83} {"train_loss": -6.2737627029418945, "global_step": 13953, "epoch": 83} {"train_loss": -6.183122634887695, "global_step": 13954, "epoch": 83} {"train_loss": -6.256947994232178, "global_step": 13955, "epoch": 83} {"train_loss": -6.263880729675293, "global_step": 13956, "epoch": 83} {"train_loss": -6.311260223388672, "global_step": 13957, "epoch": 83} {"train_loss": -6.275981426239014, "global_step": 13958, "epoch": 83} {"train_loss": -6.122167587280273, "global_step": 13959, "epoch": 83} {"train_loss": -6.212474822998047, "global_step": 13960, "epoch": 83} {"train_loss": -6.459971904754639, "global_step": 13961, "epoch": 83} {"train_loss": -6.099732398986816, "global_step": 13962, "epoch": 83} {"train_loss": -6.178778648376465, "global_step": 13963, "epoch": 83} {"train_loss": -5.9654340744018555, "global_step": 13964, "epoch": 83} {"train_loss": -6.150536060333252, "global_step": 13965, "epoch": 83} {"train_loss": -6.162320137023926, "global_step": 13966, "epoch": 83} {"train_loss": -6.104866981506348, "global_step": 13967, "epoch": 83} {"train_loss": -6.056344032287598, "global_step": 13968, "epoch": 83} {"train_loss": -6.0583367347717285, "global_step": 13969, "epoch": 83} {"train_loss": -6.274142265319824, "global_step": 13970, "epoch": 83} {"train_loss": -6.124478816986084, "global_step": 13971, "epoch": 83} {"train_loss": -6.02876091003418, "global_step": 13972, "epoch": 83} {"train_loss": -6.17332124710083, "global_step": 13973, "epoch": 83} {"train_loss": -5.841843605041504, "global_step": 13974, "epoch": 83} {"train_loss": -6.265302658081055, "global_step": 13975, "epoch": 83} {"train_loss": -6.220727920532227, "global_step": 13976, "epoch": 83} {"train_loss": -6.1801652908325195, "global_step": 13977, "epoch": 83} {"train_loss": -5.790409564971924, "global_step": 13978, "epoch": 83} {"train_loss": -6.216949462890625, "global_step": 13979, "epoch": 83} {"train_loss": -6.073705673217773, "global_step": 13980, "epoch": 83} {"train_loss": -6.016258239746094, "global_step": 13981, "epoch": 83} {"train_loss": -6.193763732910156, "global_step": 13982, "epoch": 83} {"train_loss": -6.1935224533081055, "global_step": 13983, "epoch": 83} {"train_loss": -6.02016544342041, "global_step": 13984, "epoch": 83} {"train_loss": -6.496572971343994, "global_step": 13985, "epoch": 83} {"train_loss": -6.3659539222717285, "global_step": 13986, "epoch": 83} {"train_loss": -6.291680335998535, "global_step": 13987, "epoch": 83} {"train_loss": -6.236979007720947, "global_step": 13988, "epoch": 83} {"train_loss": -6.407159328460693, "global_step": 13989, "epoch": 83} {"train_loss": -6.355086326599121, "global_step": 13990, "epoch": 83} {"train_loss": -6.376558303833008, "global_step": 13991, "epoch": 83} {"train_loss": -6.414015293121338, "global_step": 13992, "epoch": 83} {"train_loss": -6.423009872436523, "global_step": 13993, "epoch": 83} {"train_loss": -6.272121906280518, "global_step": 13994, "epoch": 83} {"train_loss": -6.320921897888184, "global_step": 13995, "epoch": 83} {"train_loss": -6.278354167938232, "global_step": 13996, "epoch": 83} {"train_loss": -6.2352495193481445, "global_step": 13997, "epoch": 83} {"train_loss": -6.148722171783447, "global_step": 13998, "epoch": 83} {"train_loss": -6.314553737640381, "global_step": 13999, "epoch": 83} {"train_loss": -6.424551010131836, "global_step": 14000, "epoch": 83} {"train_loss": -6.243694305419922, "global_step": 14001, "epoch": 83} {"train_loss": -6.455597877502441, "global_step": 14002, "epoch": 83} {"train_loss": -6.535680770874023, "global_step": 14003, "epoch": 83} {"train_loss": -6.353826522827148, "global_step": 14004, "epoch": 83} {"train_loss": -6.230144500732422, "global_step": 14005, "epoch": 83} {"train_loss": -6.354691505432129, "global_step": 14006, "epoch": 83} {"train_loss": -6.588579177856445, "global_step": 14007, "epoch": 83} {"train_loss": -5.9048004150390625, "global_step": 14008, "epoch": 83} {"train_loss": -6.137179374694824, "global_step": 14009, "epoch": 83} {"train_loss": -6.390558242797852, "global_step": 14010, "epoch": 83} {"train_loss": -6.23365592956543, "global_step": 14011, "epoch": 83} {"train_loss": -6.11219596862793, "global_step": 14012, "epoch": 83} {"train_loss": -6.232416152954102, "global_step": 14013, "epoch": 83} {"train_loss": -6.307761192321777, "global_step": 14014, "epoch": 83} {"train_loss": -6.3873186111450195, "global_step": 14015, "epoch": 83} {"train_loss": -6.213848114013672, "global_step": 14016, "epoch": 83} {"train_loss": -6.220292091369629, "global_step": 14017, "epoch": 83} {"train_loss": -6.083992004394531, "global_step": 14018, "epoch": 83} {"train_loss": -6.2900238037109375, "global_step": 14019, "epoch": 83} {"train_loss": -6.302154541015625, "global_step": 14020, "epoch": 83} {"train_loss": -6.086785316467285, "global_step": 14021, "epoch": 83} {"train_loss": -6.239345550537109, "global_step": 14022, "epoch": 83} {"train_loss": -6.377928256988525, "global_step": 14023, "epoch": 83} {"train_loss": -6.231714248657227, "global_step": 14024, "epoch": 83} {"train_loss": -5.875127792358398, "global_step": 14025, "epoch": 83} {"train_loss": -5.842568397521973, "global_step": 14026, "epoch": 83} {"train_loss": -5.740816116333008, "global_step": 14027, "epoch": 83} {"train_loss": -6.014005661010742, "global_step": 14028, "epoch": 83} {"train_loss": -6.002685546875, "global_step": 14029, "epoch": 83} {"train_loss": -6.17266321182251, "global_step": 14030, "epoch": 83} {"train_loss": -6.257997989654541, "global_step": 14031, "epoch": 83} {"train_loss": -6.1233320236206055, "global_step": 14032, "epoch": 83} {"train_loss": -6.468274116516113, "global_step": 14033, "epoch": 83} {"train_loss": -6.058083534240723, "global_step": 14034, "epoch": 83} {"train_loss": -5.958824157714844, "global_step": 14035, "epoch": 83} {"train_loss": -5.997471809387207, "global_step": 14036, "epoch": 83} {"train_loss": -6.145350456237793, "global_step": 14037, "epoch": 83} {"train_loss": -6.058305263519287, "global_step": 14038, "epoch": 83} {"train_loss": -6.205569267272949, "global_step": 14039, "epoch": 83} {"train_loss": -6.334124565124512, "global_step": 14040, "epoch": 83} {"train_loss": -5.993804931640625, "global_step": 14041, "epoch": 83} {"train_loss": -6.057319164276123, "global_step": 14042, "epoch": 83} {"train_loss": -5.9010009765625, "global_step": 14043, "epoch": 83} {"train_loss": -6.0917816162109375, "global_step": 14044, "epoch": 83} {"train_loss": -5.9078569412231445, "global_step": 14045, "epoch": 83} {"train_loss": -5.920046806335449, "global_step": 14046, "epoch": 83} {"train_loss": -6.048573017120361, "global_step": 14047, "epoch": 83} {"train_loss": -6.230001449584961, "global_step": 14048, "epoch": 83} {"train_loss": -6.289419174194336, "global_step": 14049, "epoch": 83} {"train_loss": -6.257514953613281, "global_step": 14050, "epoch": 83} {"train_loss": -6.297574520111084, "global_step": 14051, "epoch": 83} {"train_loss": -6.290459632873535, "global_step": 14052, "epoch": 83} {"train_loss": -6.149299621582031, "global_step": 14053, "epoch": 83} {"train_loss": -6.188753128051758, "global_step": 14054, "epoch": 83} {"train_loss": -6.303564071655273, "global_step": 14055, "epoch": 83} {"train_loss": -6.303707122802734, "global_step": 14056, "epoch": 83} {"train_loss": -6.263971328735352, "global_step": 14057, "epoch": 83} {"train_loss": -6.459262371063232, "global_step": 14058, "epoch": 83} {"train_loss": -6.102427959442139, "global_step": 14059, "epoch": 83} {"train_loss": -6.441751480102539, "global_step": 14060, "epoch": 83} {"train_loss": -6.288730621337891, "global_step": 14061, "epoch": 83} {"train_loss": -6.383357048034668, "global_step": 14062, "epoch": 83} {"train_loss": -6.1225104331970215, "global_step": 14063, "epoch": 83} {"train_loss": -6.198881149291992, "global_step": 14064, "epoch": 83} {"train_loss": -6.098793029785156, "global_step": 14065, "epoch": 83} {"train_loss": -6.194382667541504, "global_step": 14066, "epoch": 83} {"train_loss": -6.254063129425049, "global_step": 14067, "epoch": 83} {"train_loss": -6.409197807312012, "global_step": 14068, "epoch": 83} {"train_loss": -6.551178932189941, "global_step": 14069, "epoch": 83} {"train_loss": -6.255368709564209, "global_step": 14070, "epoch": 83} {"train_loss": -6.530716896057129, "global_step": 14071, "epoch": 83} {"train_loss": -6.294908046722412, "global_step": 14072, "epoch": 83} {"train_loss": -6.456628799438477, "global_step": 14073, "epoch": 83} {"train_loss": -6.0663652420043945, "global_step": 14074, "epoch": 83} {"train_loss": -6.307967185974121, "global_step": 14075, "epoch": 83} {"train_loss": -6.245414733886719, "global_step": 14076, "epoch": 83} {"train_loss": -6.305215358734131, "global_step": 14077, "epoch": 83} {"train_loss": -6.181611061096191, "global_step": 14078, "epoch": 83} {"train_loss": -6.364206314086914, "global_step": 14079, "epoch": 83} {"train_loss": -6.384277820587158, "global_step": 14080, "epoch": 83} {"train_loss": -6.072612762451172, "global_step": 14081, "epoch": 83} {"train_loss": -6.412834167480469, "global_step": 14082, "epoch": 83} {"train_loss": -5.998405456542969, "global_step": 14083, "epoch": 83} {"train_loss": -6.27117919921875, "global_step": 14084, "epoch": 83} {"train_loss": -6.267751216888428, "global_step": 14085, "epoch": 83} {"train_loss": -6.3296709060668945, "global_step": 14086, "epoch": 83} {"train_loss": -5.874281883239746, "global_step": 14087, "epoch": 83} {"train_loss": -6.216231822967529, "global_step": 14088, "epoch": 83} {"train_loss": -6.012376308441162, "global_step": 14089, "epoch": 83} {"train_loss": -6.188055992126465, "global_step": 14090, "epoch": 83} {"train_loss": -6.079148292541504, "global_step": 14091, "epoch": 83} {"train_loss": -6.199300765991211, "global_step": 14092, "epoch": 83} {"train_loss": -6.105520725250244, "global_step": 14093, "epoch": 83} {"train_loss": -6.322772979736328, "global_step": 14094, "epoch": 83} {"train_loss": -5.896156311035156, "global_step": 14095, "epoch": 83} {"train_loss": -6.201323986053467, "global_step": 14096, "epoch": 83} {"train_loss": -6.128927230834961, "global_step": 14097, "epoch": 83} {"train_loss": -6.1371660232543945, "global_step": 14098, "epoch": 83} {"train_loss": -6.112889766693115, "global_step": 14099, "epoch": 83} {"train_loss": -6.356433868408203, "global_step": 14100, "epoch": 83} {"train_loss": -6.126495361328125, "global_step": 14101, "epoch": 83} {"train_loss": -6.120414733886719, "global_step": 14102, "epoch": 83} {"train_loss": -5.957284927368164, "global_step": 14103, "epoch": 83} {"train_loss": -6.113633632659912, "global_step": 14104, "epoch": 83} {"train_loss": -6.169103145599365, "global_step": 14105, "epoch": 83} {"train_loss": -5.94139289855957, "global_step": 14106, "epoch": 83} {"train_loss": -6.434071063995361, "global_step": 14107, "epoch": 83} {"train_loss": -5.982639789581299, "global_step": 14108, "epoch": 83} {"train_loss": -6.393922805786133, "global_step": 14109, "epoch": 83} {"train_loss": -6.379680633544922, "global_step": 14110, "epoch": 83} {"train_loss": -6.19894403219223, "global_step": 14111, "epoch": 83, "val_loss": 248628.25} {"train_loss": -6.551758766174316, "global_step": 14112, "epoch": 84} {"train_loss": -6.309256553649902, "global_step": 14113, "epoch": 84} {"train_loss": -6.527790069580078, "global_step": 14114, "epoch": 84} {"train_loss": -6.449667930603027, "global_step": 14115, "epoch": 84} {"train_loss": -6.308392524719238, "global_step": 14116, "epoch": 84} {"train_loss": -6.200711250305176, "global_step": 14117, "epoch": 84} {"train_loss": -6.392190456390381, "global_step": 14118, "epoch": 84} {"train_loss": -6.500250816345215, "global_step": 14119, "epoch": 84} {"train_loss": -6.049144744873047, "global_step": 14120, "epoch": 84} {"train_loss": -6.448611736297607, "global_step": 14121, "epoch": 84} {"train_loss": -6.296713829040527, "global_step": 14122, "epoch": 84} {"train_loss": -6.399651527404785, "global_step": 14123, "epoch": 84} {"train_loss": -6.0402936935424805, "global_step": 14124, "epoch": 84} {"train_loss": -6.333514213562012, "global_step": 14125, "epoch": 84} {"train_loss": -6.12175178527832, "global_step": 14126, "epoch": 84} {"train_loss": -6.128037452697754, "global_step": 14127, "epoch": 84} {"train_loss": -6.253528594970703, "global_step": 14128, "epoch": 84} {"train_loss": -6.349207878112793, "global_step": 14129, "epoch": 84} {"train_loss": -6.265896797180176, "global_step": 14130, "epoch": 84} {"train_loss": -6.439701080322266, "global_step": 14131, "epoch": 84} {"train_loss": -6.1201887130737305, "global_step": 14132, "epoch": 84} {"train_loss": -6.52309513092041, "global_step": 14133, "epoch": 84} {"train_loss": -6.463098526000977, "global_step": 14134, "epoch": 84} {"train_loss": -6.433810710906982, "global_step": 14135, "epoch": 84} {"train_loss": -5.974114894866943, "global_step": 14136, "epoch": 84} {"train_loss": -6.426008224487305, "global_step": 14137, "epoch": 84} {"train_loss": -6.146585464477539, "global_step": 14138, "epoch": 84} {"train_loss": -6.228938102722168, "global_step": 14139, "epoch": 84} {"train_loss": -6.18056583404541, "global_step": 14140, "epoch": 84} {"train_loss": -6.40684700012207, "global_step": 14141, "epoch": 84} {"train_loss": -6.170963764190674, "global_step": 14142, "epoch": 84} {"train_loss": -6.577695846557617, "global_step": 14143, "epoch": 84} {"train_loss": -6.385776996612549, "global_step": 14144, "epoch": 84} {"train_loss": -6.28525447845459, "global_step": 14145, "epoch": 84} {"train_loss": -6.317938804626465, "global_step": 14146, "epoch": 84} {"train_loss": -6.053561210632324, "global_step": 14147, "epoch": 84} {"train_loss": -6.471367835998535, "global_step": 14148, "epoch": 84} {"train_loss": -6.365997791290283, "global_step": 14149, "epoch": 84} {"train_loss": -6.36845064163208, "global_step": 14150, "epoch": 84} {"train_loss": -6.267621994018555, "global_step": 14151, "epoch": 84} {"train_loss": -6.363003730773926, "global_step": 14152, "epoch": 84} {"train_loss": -6.405688285827637, "global_step": 14153, "epoch": 84} {"train_loss": -6.468752861022949, "global_step": 14154, "epoch": 84} {"train_loss": -6.189150810241699, "global_step": 14155, "epoch": 84} {"train_loss": -6.408560276031494, "global_step": 14156, "epoch": 84} {"train_loss": -6.530099868774414, "global_step": 14157, "epoch": 84} {"train_loss": -6.291365623474121, "global_step": 14158, "epoch": 84} {"train_loss": -6.270105361938477, "global_step": 14159, "epoch": 84} {"train_loss": -6.566326141357422, "global_step": 14160, "epoch": 84} {"train_loss": -6.300448894500732, "global_step": 14161, "epoch": 84} {"train_loss": -6.344451427459717, "global_step": 14162, "epoch": 84} {"train_loss": -6.306232452392578, "global_step": 14163, "epoch": 84} {"train_loss": -6.383981704711914, "global_step": 14164, "epoch": 84} {"train_loss": -6.636687278747559, "global_step": 14165, "epoch": 84} {"train_loss": -6.44968318939209, "global_step": 14166, "epoch": 84} {"train_loss": -6.485495567321777, "global_step": 14167, "epoch": 84} {"train_loss": -6.250247001647949, "global_step": 14168, "epoch": 84} {"train_loss": -6.496616363525391, "global_step": 14169, "epoch": 84} {"train_loss": -6.130139350891113, "global_step": 14170, "epoch": 84} {"train_loss": -6.422179698944092, "global_step": 14171, "epoch": 84} {"train_loss": -6.079315185546875, "global_step": 14172, "epoch": 84} {"train_loss": -6.255293846130371, "global_step": 14173, "epoch": 84} {"train_loss": -6.239185333251953, "global_step": 14174, "epoch": 84} {"train_loss": -6.303154945373535, "global_step": 14175, "epoch": 84} {"train_loss": -6.375564098358154, "global_step": 14176, "epoch": 84} {"train_loss": -6.218652725219727, "global_step": 14177, "epoch": 84} {"train_loss": -6.315196990966797, "global_step": 14178, "epoch": 84} {"train_loss": -6.350670337677002, "global_step": 14179, "epoch": 84} {"train_loss": -6.165894508361816, "global_step": 14180, "epoch": 84} {"train_loss": -6.278937339782715, "global_step": 14181, "epoch": 84} {"train_loss": -5.9962158203125, "global_step": 14182, "epoch": 84} {"train_loss": -6.303793430328369, "global_step": 14183, "epoch": 84} {"train_loss": -5.905591011047363, "global_step": 14184, "epoch": 84} {"train_loss": -5.955522537231445, "global_step": 14185, "epoch": 84} {"train_loss": -6.420344352722168, "global_step": 14186, "epoch": 84} {"train_loss": -5.95844841003418, "global_step": 14187, "epoch": 84} {"train_loss": -6.304311752319336, "global_step": 14188, "epoch": 84} {"train_loss": -6.306401252746582, "global_step": 14189, "epoch": 84} {"train_loss": -6.330408573150635, "global_step": 14190, "epoch": 84} {"train_loss": -6.58156156539917, "global_step": 14191, "epoch": 84} {"train_loss": -6.371036529541016, "global_step": 14192, "epoch": 84} {"train_loss": -6.335983753204346, "global_step": 14193, "epoch": 84} {"train_loss": -6.202241897583008, "global_step": 14194, "epoch": 84} {"train_loss": -6.475198745727539, "global_step": 14195, "epoch": 84} {"train_loss": -6.163323879241943, "global_step": 14196, "epoch": 84} {"train_loss": -6.329593658447266, "global_step": 14197, "epoch": 84} {"train_loss": -6.030902862548828, "global_step": 14198, "epoch": 84} {"train_loss": -6.480154037475586, "global_step": 14199, "epoch": 84} {"train_loss": -6.418789386749268, "global_step": 14200, "epoch": 84} {"train_loss": -6.497158527374268, "global_step": 14201, "epoch": 84} {"train_loss": -6.423635482788086, "global_step": 14202, "epoch": 84} {"train_loss": -6.2349653244018555, "global_step": 14203, "epoch": 84} {"train_loss": -6.554487228393555, "global_step": 14204, "epoch": 84} {"train_loss": -6.231935977935791, "global_step": 14205, "epoch": 84} {"train_loss": -6.385397911071777, "global_step": 14206, "epoch": 84} {"train_loss": -6.064538955688477, "global_step": 14207, "epoch": 84} {"train_loss": -6.415289878845215, "global_step": 14208, "epoch": 84} {"train_loss": -6.334975242614746, "global_step": 14209, "epoch": 84} {"train_loss": -6.038341045379639, "global_step": 14210, "epoch": 84} {"train_loss": -6.368037223815918, "global_step": 14211, "epoch": 84} {"train_loss": -6.168416500091553, "global_step": 14212, "epoch": 84} {"train_loss": -6.156033992767334, "global_step": 14213, "epoch": 84} {"train_loss": -6.023177623748779, "global_step": 14214, "epoch": 84} {"train_loss": -6.169930934906006, "global_step": 14215, "epoch": 84} {"train_loss": -6.24602746963501, "global_step": 14216, "epoch": 84} {"train_loss": -6.465789794921875, "global_step": 14217, "epoch": 84} {"train_loss": -6.441407203674316, "global_step": 14218, "epoch": 84} {"train_loss": -6.256767272949219, "global_step": 14219, "epoch": 84} {"train_loss": -6.271642684936523, "global_step": 14220, "epoch": 84} {"train_loss": -6.301852226257324, "global_step": 14221, "epoch": 84} {"train_loss": -6.144515514373779, "global_step": 14222, "epoch": 84} {"train_loss": -6.3194379806518555, "global_step": 14223, "epoch": 84} {"train_loss": -6.078578472137451, "global_step": 14224, "epoch": 84} {"train_loss": -6.261463165283203, "global_step": 14225, "epoch": 84} {"train_loss": -6.029582977294922, "global_step": 14226, "epoch": 84} {"train_loss": -6.529917240142822, "global_step": 14227, "epoch": 84} {"train_loss": -6.078993797302246, "global_step": 14228, "epoch": 84} {"train_loss": -6.3088555335998535, "global_step": 14229, "epoch": 84} {"train_loss": -6.232934474945068, "global_step": 14230, "epoch": 84} {"train_loss": -6.204442024230957, "global_step": 14231, "epoch": 84} {"train_loss": -6.175415515899658, "global_step": 14232, "epoch": 84} {"train_loss": -6.364501476287842, "global_step": 14233, "epoch": 84} {"train_loss": -6.382689476013184, "global_step": 14234, "epoch": 84} {"train_loss": -6.337721824645996, "global_step": 14235, "epoch": 84} {"train_loss": -6.268871307373047, "global_step": 14236, "epoch": 84} {"train_loss": -6.560236930847168, "global_step": 14237, "epoch": 84} {"train_loss": -6.559927940368652, "global_step": 14238, "epoch": 84} {"train_loss": -6.094329833984375, "global_step": 14239, "epoch": 84} {"train_loss": -6.37189245223999, "global_step": 14240, "epoch": 84} {"train_loss": -6.534324645996094, "global_step": 14241, "epoch": 84} {"train_loss": -6.362602233886719, "global_step": 14242, "epoch": 84} {"train_loss": -6.192885398864746, "global_step": 14243, "epoch": 84} {"train_loss": -6.275696277618408, "global_step": 14244, "epoch": 84} {"train_loss": -6.2518415451049805, "global_step": 14245, "epoch": 84} {"train_loss": -6.107617378234863, "global_step": 14246, "epoch": 84} {"train_loss": -6.244627952575684, "global_step": 14247, "epoch": 84} {"train_loss": -6.287772178649902, "global_step": 14248, "epoch": 84} {"train_loss": -6.363167762756348, "global_step": 14249, "epoch": 84} {"train_loss": -6.328122138977051, "global_step": 14250, "epoch": 84} {"train_loss": -6.473739147186279, "global_step": 14251, "epoch": 84} {"train_loss": -6.39088249206543, "global_step": 14252, "epoch": 84} {"train_loss": -6.449723720550537, "global_step": 14253, "epoch": 84} {"train_loss": -6.383687973022461, "global_step": 14254, "epoch": 84} {"train_loss": -6.376491069793701, "global_step": 14255, "epoch": 84} {"train_loss": -6.252097129821777, "global_step": 14256, "epoch": 84} {"train_loss": -6.526614189147949, "global_step": 14257, "epoch": 84} {"train_loss": -6.254944324493408, "global_step": 14258, "epoch": 84} {"train_loss": -6.226439476013184, "global_step": 14259, "epoch": 84} {"train_loss": -6.472872734069824, "global_step": 14260, "epoch": 84} {"train_loss": -6.381263256072998, "global_step": 14261, "epoch": 84} {"train_loss": -6.159292221069336, "global_step": 14262, "epoch": 84} {"train_loss": -6.176011085510254, "global_step": 14263, "epoch": 84} {"train_loss": -6.215726375579834, "global_step": 14264, "epoch": 84} {"train_loss": -6.231724739074707, "global_step": 14265, "epoch": 84} {"train_loss": -6.3495774269104, "global_step": 14266, "epoch": 84} {"train_loss": -6.260815620422363, "global_step": 14267, "epoch": 84} {"train_loss": -6.225078582763672, "global_step": 14268, "epoch": 84} {"train_loss": -6.077585697174072, "global_step": 14269, "epoch": 84} {"train_loss": -6.166528701782227, "global_step": 14270, "epoch": 84} {"train_loss": -6.262326717376709, "global_step": 14271, "epoch": 84} {"train_loss": -6.455000877380371, "global_step": 14272, "epoch": 84} {"train_loss": -6.541086196899414, "global_step": 14273, "epoch": 84} {"train_loss": -6.228092670440674, "global_step": 14274, "epoch": 84} {"train_loss": -6.282474517822266, "global_step": 14275, "epoch": 84} {"train_loss": -6.218381881713867, "global_step": 14276, "epoch": 84} {"train_loss": -6.216465473175049, "global_step": 14277, "epoch": 84} {"train_loss": -6.182078838348389, "global_step": 14278, "epoch": 84} {"train_loss": -6.3013372250965665, "global_step": 14279, "epoch": 84, "val_loss": 245316.46875} {"train_loss": -6.307282447814941, "global_step": 14280, "epoch": 85} {"train_loss": -6.474089622497559, "global_step": 14281, "epoch": 85} {"train_loss": -6.08194637298584, "global_step": 14282, "epoch": 85} {"train_loss": -6.176901817321777, "global_step": 14283, "epoch": 85} {"train_loss": -6.330811500549316, "global_step": 14284, "epoch": 85} {"train_loss": -6.052618980407715, "global_step": 14285, "epoch": 85} {"train_loss": -6.260470390319824, "global_step": 14286, "epoch": 85} {"train_loss": -6.201330661773682, "global_step": 14287, "epoch": 85} {"train_loss": -6.33130407333374, "global_step": 14288, "epoch": 85} {"train_loss": -6.049655914306641, "global_step": 14289, "epoch": 85} {"train_loss": -6.223747730255127, "global_step": 14290, "epoch": 85} {"train_loss": -6.104164123535156, "global_step": 14291, "epoch": 85} {"train_loss": -6.390801429748535, "global_step": 14292, "epoch": 85} {"train_loss": -6.432644844055176, "global_step": 14293, "epoch": 85} {"train_loss": -6.158359050750732, "global_step": 14294, "epoch": 85} {"train_loss": -5.935970306396484, "global_step": 14295, "epoch": 85} {"train_loss": -6.185085773468018, "global_step": 14296, "epoch": 85} {"train_loss": -6.34516716003418, "global_step": 14297, "epoch": 85} {"train_loss": -6.150286674499512, "global_step": 14298, "epoch": 85} {"train_loss": -6.428910255432129, "global_step": 14299, "epoch": 85} {"train_loss": -6.336163520812988, "global_step": 14300, "epoch": 85} {"train_loss": -6.1209211349487305, "global_step": 14301, "epoch": 85} {"train_loss": -6.297555923461914, "global_step": 14302, "epoch": 85} {"train_loss": -6.209246635437012, "global_step": 14303, "epoch": 85} {"train_loss": -6.466497421264648, "global_step": 14304, "epoch": 85} {"train_loss": -6.205710411071777, "global_step": 14305, "epoch": 85} {"train_loss": -6.41948938369751, "global_step": 14306, "epoch": 85} {"train_loss": -6.1445536613464355, "global_step": 14307, "epoch": 85} {"train_loss": -6.286468982696533, "global_step": 14308, "epoch": 85} {"train_loss": -6.231060981750488, "global_step": 14309, "epoch": 85} {"train_loss": -6.275672912597656, "global_step": 14310, "epoch": 85} {"train_loss": -6.302066802978516, "global_step": 14311, "epoch": 85} {"train_loss": -6.1620378494262695, "global_step": 14312, "epoch": 85} {"train_loss": -6.043328285217285, "global_step": 14313, "epoch": 85} {"train_loss": -6.219597339630127, "global_step": 14314, "epoch": 85} {"train_loss": -6.134014129638672, "global_step": 14315, "epoch": 85} {"train_loss": -6.4959187507629395, "global_step": 14316, "epoch": 85} {"train_loss": -6.3836493492126465, "global_step": 14317, "epoch": 85} {"train_loss": -6.443526268005371, "global_step": 14318, "epoch": 85} {"train_loss": -6.143139839172363, "global_step": 14319, "epoch": 85} {"train_loss": -6.3976874351501465, "global_step": 14320, "epoch": 85} {"train_loss": -5.971672058105469, "global_step": 14321, "epoch": 85} {"train_loss": -6.211345195770264, "global_step": 14322, "epoch": 85} {"train_loss": -6.432713985443115, "global_step": 14323, "epoch": 85} {"train_loss": -5.982974529266357, "global_step": 14324, "epoch": 85} {"train_loss": -5.951430320739746, "global_step": 14325, "epoch": 85} {"train_loss": -6.115200519561768, "global_step": 14326, "epoch": 85} {"train_loss": -6.181163311004639, "global_step": 14327, "epoch": 85} {"train_loss": -6.300783157348633, "global_step": 14328, "epoch": 85} {"train_loss": -6.140907287597656, "global_step": 14329, "epoch": 85} {"train_loss": -6.003631114959717, "global_step": 14330, "epoch": 85} {"train_loss": -6.141138553619385, "global_step": 14331, "epoch": 85} {"train_loss": -6.368744373321533, "global_step": 14332, "epoch": 85} {"train_loss": -6.295220375061035, "global_step": 14333, "epoch": 85} {"train_loss": -6.287191867828369, "global_step": 14334, "epoch": 85} {"train_loss": -6.289738655090332, "global_step": 14335, "epoch": 85} {"train_loss": -5.853767395019531, "global_step": 14336, "epoch": 85} {"train_loss": -6.275187969207764, "global_step": 14337, "epoch": 85} {"train_loss": -6.290648937225342, "global_step": 14338, "epoch": 85} {"train_loss": -6.090571403503418, "global_step": 14339, "epoch": 85} {"train_loss": -6.244999408721924, "global_step": 14340, "epoch": 85} {"train_loss": -6.230343818664551, "global_step": 14341, "epoch": 85} {"train_loss": -6.540583610534668, "global_step": 14342, "epoch": 85} {"train_loss": -6.110358715057373, "global_step": 14343, "epoch": 85} {"train_loss": -6.448480606079102, "global_step": 14344, "epoch": 85} {"train_loss": -6.313155174255371, "global_step": 14345, "epoch": 85} {"train_loss": -5.958648204803467, "global_step": 14346, "epoch": 85} {"train_loss": -6.375487327575684, "global_step": 14347, "epoch": 85} {"train_loss": -5.854673385620117, "global_step": 14348, "epoch": 85} {"train_loss": -6.226874351501465, "global_step": 14349, "epoch": 85} {"train_loss": -5.813094139099121, "global_step": 14350, "epoch": 85} {"train_loss": -6.238909721374512, "global_step": 14351, "epoch": 85} {"train_loss": -5.864020824432373, "global_step": 14352, "epoch": 85} {"train_loss": -5.983980655670166, "global_step": 14353, "epoch": 85} {"train_loss": -6.218379497528076, "global_step": 14354, "epoch": 85} {"train_loss": -5.8302106857299805, "global_step": 14355, "epoch": 85} {"train_loss": -6.047024726867676, "global_step": 14356, "epoch": 85} {"train_loss": -6.322868347167969, "global_step": 14357, "epoch": 85} {"train_loss": -6.216591835021973, "global_step": 14358, "epoch": 85} {"train_loss": -6.486985206604004, "global_step": 14359, "epoch": 85} {"train_loss": -6.176945686340332, "global_step": 14360, "epoch": 85} {"train_loss": -6.213600158691406, "global_step": 14361, "epoch": 85} {"train_loss": -5.880570411682129, "global_step": 14362, "epoch": 85} {"train_loss": -6.346987724304199, "global_step": 14363, "epoch": 85} {"train_loss": -6.270476341247559, "global_step": 14364, "epoch": 85} {"train_loss": -6.2065019607543945, "global_step": 14365, "epoch": 85} {"train_loss": -6.236876010894775, "global_step": 14366, "epoch": 85} {"train_loss": -6.354981899261475, "global_step": 14367, "epoch": 85} {"train_loss": -6.462923526763916, "global_step": 14368, "epoch": 85} {"train_loss": -6.108066082000732, "global_step": 14369, "epoch": 85} {"train_loss": -6.23330020904541, "global_step": 14370, "epoch": 85} {"train_loss": -6.444299697875977, "global_step": 14371, "epoch": 85} {"train_loss": -6.148370742797852, "global_step": 14372, "epoch": 85} {"train_loss": -6.162904739379883, "global_step": 14373, "epoch": 85} {"train_loss": -6.303244113922119, "global_step": 14374, "epoch": 85} {"train_loss": -6.289548397064209, "global_step": 14375, "epoch": 85} {"train_loss": -6.0342535972595215, "global_step": 14376, "epoch": 85} {"train_loss": -6.290393829345703, "global_step": 14377, "epoch": 85} {"train_loss": -5.952956199645996, "global_step": 14378, "epoch": 85} {"train_loss": -6.0268120765686035, "global_step": 14379, "epoch": 85} {"train_loss": -6.2254838943481445, "global_step": 14380, "epoch": 85} {"train_loss": -5.952089309692383, "global_step": 14381, "epoch": 85} {"train_loss": -6.288178443908691, "global_step": 14382, "epoch": 85} {"train_loss": -6.158906936645508, "global_step": 14383, "epoch": 85} {"train_loss": -6.431964874267578, "global_step": 14384, "epoch": 85} {"train_loss": -6.422410011291504, "global_step": 14385, "epoch": 85} {"train_loss": -6.069064617156982, "global_step": 14386, "epoch": 85} {"train_loss": -6.416092872619629, "global_step": 14387, "epoch": 85} {"train_loss": -6.244072437286377, "global_step": 14388, "epoch": 85} {"train_loss": -6.437892913818359, "global_step": 14389, "epoch": 85} {"train_loss": -6.244812965393066, "global_step": 14390, "epoch": 85} {"train_loss": -6.419025421142578, "global_step": 14391, "epoch": 85} {"train_loss": -6.454383373260498, "global_step": 14392, "epoch": 85} {"train_loss": -6.408872604370117, "global_step": 14393, "epoch": 85} {"train_loss": -6.443696975708008, "global_step": 14394, "epoch": 85} {"train_loss": -6.335179805755615, "global_step": 14395, "epoch": 85} {"train_loss": -6.460538864135742, "global_step": 14396, "epoch": 85} {"train_loss": -6.577376842498779, "global_step": 14397, "epoch": 85} {"train_loss": -6.274537563323975, "global_step": 14398, "epoch": 85} {"train_loss": -6.381590843200684, "global_step": 14399, "epoch": 85} {"train_loss": -6.359142303466797, "global_step": 14400, "epoch": 85} {"train_loss": -6.4725213050842285, "global_step": 14401, "epoch": 85} {"train_loss": -6.312057971954346, "global_step": 14402, "epoch": 85} {"train_loss": -6.694243431091309, "global_step": 14403, "epoch": 85} {"train_loss": -6.18873405456543, "global_step": 14404, "epoch": 85} {"train_loss": -6.255889892578125, "global_step": 14405, "epoch": 85} {"train_loss": -6.540788173675537, "global_step": 14406, "epoch": 85} {"train_loss": -6.35820198059082, "global_step": 14407, "epoch": 85} {"train_loss": -6.339826583862305, "global_step": 14408, "epoch": 85} {"train_loss": -6.068094253540039, "global_step": 14409, "epoch": 85} {"train_loss": -6.582676887512207, "global_step": 14410, "epoch": 85} {"train_loss": -6.086553573608398, "global_step": 14411, "epoch": 85} {"train_loss": -6.346607208251953, "global_step": 14412, "epoch": 85} {"train_loss": -6.096106052398682, "global_step": 14413, "epoch": 85} {"train_loss": -6.20755672454834, "global_step": 14414, "epoch": 85} {"train_loss": -6.124973297119141, "global_step": 14415, "epoch": 85} {"train_loss": -6.2801289558410645, "global_step": 14416, "epoch": 85} {"train_loss": -6.266274452209473, "global_step": 14417, "epoch": 85} {"train_loss": -5.811210632324219, "global_step": 14418, "epoch": 85} {"train_loss": -6.281984329223633, "global_step": 14419, "epoch": 85} {"train_loss": -6.465165138244629, "global_step": 14420, "epoch": 85} {"train_loss": -6.139107704162598, "global_step": 14421, "epoch": 85} {"train_loss": -6.222803592681885, "global_step": 14422, "epoch": 85} {"train_loss": -5.905543327331543, "global_step": 14423, "epoch": 85} {"train_loss": -6.197061538696289, "global_step": 14424, "epoch": 85} {"train_loss": -6.3205718994140625, "global_step": 14425, "epoch": 85} {"train_loss": -6.088214874267578, "global_step": 14426, "epoch": 85} {"train_loss": -6.4711456298828125, "global_step": 14427, "epoch": 85} {"train_loss": -6.34431266784668, "global_step": 14428, "epoch": 85} {"train_loss": -6.371233940124512, "global_step": 14429, "epoch": 85} {"train_loss": -6.270110130310059, "global_step": 14430, "epoch": 85} {"train_loss": -6.163858413696289, "global_step": 14431, "epoch": 85} {"train_loss": -6.249307632446289, "global_step": 14432, "epoch": 85} {"train_loss": -6.265140533447266, "global_step": 14433, "epoch": 85} {"train_loss": -6.116987705230713, "global_step": 14434, "epoch": 85} {"train_loss": -6.08260440826416, "global_step": 14435, "epoch": 85} {"train_loss": -6.362221717834473, "global_step": 14436, "epoch": 85} {"train_loss": -6.1079182624816895, "global_step": 14437, "epoch": 85} {"train_loss": -6.272971153259277, "global_step": 14438, "epoch": 85} {"train_loss": -6.416481971740723, "global_step": 14439, "epoch": 85} {"train_loss": -6.314708709716797, "global_step": 14440, "epoch": 85} {"train_loss": -6.2268781661987305, "global_step": 14441, "epoch": 85} {"train_loss": -6.328482151031494, "global_step": 14442, "epoch": 85} {"train_loss": -6.224117755889893, "global_step": 14443, "epoch": 85} {"train_loss": -6.189475059509277, "global_step": 14444, "epoch": 85} {"train_loss": -6.193741321563721, "global_step": 14445, "epoch": 85} {"train_loss": -6.369673728942871, "global_step": 14446, "epoch": 85} {"train_loss": -6.239128978479476, "global_step": 14447, "epoch": 85, "val_loss": 256249.328125, "train_action_mse_error": 27.5047607421875} {"train_loss": -6.322422027587891, "global_step": 14448, "epoch": 86} {"train_loss": -6.403960704803467, "global_step": 14449, "epoch": 86} {"train_loss": -6.282648086547852, "global_step": 14450, "epoch": 86} {"train_loss": -6.1420416831970215, "global_step": 14451, "epoch": 86} {"train_loss": -6.351421356201172, "global_step": 14452, "epoch": 86} {"train_loss": -6.140775680541992, "global_step": 14453, "epoch": 86} {"train_loss": -5.994217872619629, "global_step": 14454, "epoch": 86} {"train_loss": -6.048630714416504, "global_step": 14455, "epoch": 86} {"train_loss": -6.142042636871338, "global_step": 14456, "epoch": 86} {"train_loss": -6.280853748321533, "global_step": 14457, "epoch": 86} {"train_loss": -6.238351821899414, "global_step": 14458, "epoch": 86} {"train_loss": -5.895135879516602, "global_step": 14459, "epoch": 86} {"train_loss": -6.385612487792969, "global_step": 14460, "epoch": 86} {"train_loss": -6.264155864715576, "global_step": 14461, "epoch": 86} {"train_loss": -6.100977897644043, "global_step": 14462, "epoch": 86} {"train_loss": -6.090887069702148, "global_step": 14463, "epoch": 86} {"train_loss": -5.985207557678223, "global_step": 14464, "epoch": 86} {"train_loss": -6.554642200469971, "global_step": 14465, "epoch": 86} {"train_loss": -6.308638095855713, "global_step": 14466, "epoch": 86} {"train_loss": -6.208820343017578, "global_step": 14467, "epoch": 86} {"train_loss": -6.368293762207031, "global_step": 14468, "epoch": 86} {"train_loss": -6.27471923828125, "global_step": 14469, "epoch": 86} {"train_loss": -6.217676639556885, "global_step": 14470, "epoch": 86} {"train_loss": -6.119490623474121, "global_step": 14471, "epoch": 86} {"train_loss": -6.2480878829956055, "global_step": 14472, "epoch": 86} {"train_loss": -6.192779541015625, "global_step": 14473, "epoch": 86} {"train_loss": -6.503632545471191, "global_step": 14474, "epoch": 86} {"train_loss": -6.220404624938965, "global_step": 14475, "epoch": 86} {"train_loss": -6.410463333129883, "global_step": 14476, "epoch": 86} {"train_loss": -6.152368545532227, "global_step": 14477, "epoch": 86} {"train_loss": -6.327055931091309, "global_step": 14478, "epoch": 86} {"train_loss": -6.4532389640808105, "global_step": 14479, "epoch": 86} {"train_loss": -6.555269241333008, "global_step": 14480, "epoch": 86} {"train_loss": -6.35129451751709, "global_step": 14481, "epoch": 86} {"train_loss": -6.162817001342773, "global_step": 14482, "epoch": 86} {"train_loss": -6.289386749267578, "global_step": 14483, "epoch": 86} {"train_loss": -6.2992377281188965, "global_step": 14484, "epoch": 86} {"train_loss": -6.438821792602539, "global_step": 14485, "epoch": 86} {"train_loss": -6.335622787475586, "global_step": 14486, "epoch": 86} {"train_loss": -6.306707382202148, "global_step": 14487, "epoch": 86} {"train_loss": -6.034116744995117, "global_step": 14488, "epoch": 86} {"train_loss": -6.395810127258301, "global_step": 14489, "epoch": 86} {"train_loss": -6.24957275390625, "global_step": 14490, "epoch": 86} {"train_loss": -6.351434230804443, "global_step": 14491, "epoch": 86} {"train_loss": -6.136314392089844, "global_step": 14492, "epoch": 86} {"train_loss": -6.486330986022949, "global_step": 14493, "epoch": 86} {"train_loss": -6.033142566680908, "global_step": 14494, "epoch": 86} {"train_loss": -6.316342353820801, "global_step": 14495, "epoch": 86} {"train_loss": -6.416399955749512, "global_step": 14496, "epoch": 86} {"train_loss": -6.180410861968994, "global_step": 14497, "epoch": 86} {"train_loss": -6.354917526245117, "global_step": 14498, "epoch": 86} {"train_loss": -6.266506671905518, "global_step": 14499, "epoch": 86} {"train_loss": -6.366750240325928, "global_step": 14500, "epoch": 86} {"train_loss": -6.450508117675781, "global_step": 14501, "epoch": 86} {"train_loss": -6.244148254394531, "global_step": 14502, "epoch": 86} {"train_loss": -6.156067371368408, "global_step": 14503, "epoch": 86} {"train_loss": -6.186805725097656, "global_step": 14504, "epoch": 86} {"train_loss": -6.313725471496582, "global_step": 14505, "epoch": 86} {"train_loss": -6.207511901855469, "global_step": 14506, "epoch": 86} {"train_loss": -6.112392425537109, "global_step": 14507, "epoch": 86} {"train_loss": -6.38551139831543, "global_step": 14508, "epoch": 86} {"train_loss": -6.19450569152832, "global_step": 14509, "epoch": 86} {"train_loss": -6.533241271972656, "global_step": 14510, "epoch": 86} {"train_loss": -6.045362949371338, "global_step": 14511, "epoch": 86} {"train_loss": -6.519130706787109, "global_step": 14512, "epoch": 86} {"train_loss": -6.533164024353027, "global_step": 14513, "epoch": 86} {"train_loss": -6.339580535888672, "global_step": 14514, "epoch": 86} {"train_loss": -6.420963764190674, "global_step": 14515, "epoch": 86} {"train_loss": -6.5149617195129395, "global_step": 14516, "epoch": 86} {"train_loss": -6.192148685455322, "global_step": 14517, "epoch": 86} {"train_loss": -6.235391139984131, "global_step": 14518, "epoch": 86} {"train_loss": -6.216989040374756, "global_step": 14519, "epoch": 86} {"train_loss": -6.457152366638184, "global_step": 14520, "epoch": 86} {"train_loss": -6.320117473602295, "global_step": 14521, "epoch": 86} {"train_loss": -6.473637104034424, "global_step": 14522, "epoch": 86} {"train_loss": -6.293325424194336, "global_step": 14523, "epoch": 86} {"train_loss": -6.535369396209717, "global_step": 14524, "epoch": 86} {"train_loss": -6.321148872375488, "global_step": 14525, "epoch": 86} {"train_loss": -6.261735916137695, "global_step": 14526, "epoch": 86} {"train_loss": -6.418310165405273, "global_step": 14527, "epoch": 86} {"train_loss": -6.500406265258789, "global_step": 14528, "epoch": 86} {"train_loss": -6.310115814208984, "global_step": 14529, "epoch": 86} {"train_loss": -5.9236226081848145, "global_step": 14530, "epoch": 86} {"train_loss": -6.2074384689331055, "global_step": 14531, "epoch": 86} {"train_loss": -6.217340469360352, "global_step": 14532, "epoch": 86} {"train_loss": -6.314781188964844, "global_step": 14533, "epoch": 86} {"train_loss": -6.310492515563965, "global_step": 14534, "epoch": 86} {"train_loss": -6.176750183105469, "global_step": 14535, "epoch": 86} {"train_loss": -6.245572566986084, "global_step": 14536, "epoch": 86} {"train_loss": -6.165048122406006, "global_step": 14537, "epoch": 86} {"train_loss": -6.061578750610352, "global_step": 14538, "epoch": 86} {"train_loss": -6.638160228729248, "global_step": 14539, "epoch": 86} {"train_loss": -6.384358882904053, "global_step": 14540, "epoch": 86} {"train_loss": -6.206378936767578, "global_step": 14541, "epoch": 86} {"train_loss": -6.13417911529541, "global_step": 14542, "epoch": 86} {"train_loss": -6.163949966430664, "global_step": 14543, "epoch": 86} {"train_loss": -5.993570804595947, "global_step": 14544, "epoch": 86} {"train_loss": -6.0507025718688965, "global_step": 14545, "epoch": 86} {"train_loss": -6.2639312744140625, "global_step": 14546, "epoch": 86} {"train_loss": -6.037737846374512, "global_step": 14547, "epoch": 86} {"train_loss": -6.319429874420166, "global_step": 14548, "epoch": 86} {"train_loss": -6.243915557861328, "global_step": 14549, "epoch": 86} {"train_loss": -6.431238651275635, "global_step": 14550, "epoch": 86} {"train_loss": -6.343095779418945, "global_step": 14551, "epoch": 86} {"train_loss": -6.1255903244018555, "global_step": 14552, "epoch": 86} {"train_loss": -6.437294006347656, "global_step": 14553, "epoch": 86} {"train_loss": -5.991060256958008, "global_step": 14554, "epoch": 86} {"train_loss": -6.229107856750488, "global_step": 14555, "epoch": 86} {"train_loss": -6.528728485107422, "global_step": 14556, "epoch": 86} {"train_loss": -6.2688398361206055, "global_step": 14557, "epoch": 86} {"train_loss": -6.153777122497559, "global_step": 14558, "epoch": 86} {"train_loss": -6.3274407386779785, "global_step": 14559, "epoch": 86} {"train_loss": -6.291244983673096, "global_step": 14560, "epoch": 86} {"train_loss": -6.136648178100586, "global_step": 14561, "epoch": 86} {"train_loss": -6.2818450927734375, "global_step": 14562, "epoch": 86} {"train_loss": -6.272968292236328, "global_step": 14563, "epoch": 86} {"train_loss": -6.445189952850342, "global_step": 14564, "epoch": 86} {"train_loss": -6.3305463790893555, "global_step": 14565, "epoch": 86} {"train_loss": -6.18710994720459, "global_step": 14566, "epoch": 86} {"train_loss": -6.253582954406738, "global_step": 14567, "epoch": 86} {"train_loss": -6.509842395782471, "global_step": 14568, "epoch": 86} {"train_loss": -6.0497941970825195, "global_step": 14569, "epoch": 86} {"train_loss": -6.368897438049316, "global_step": 14570, "epoch": 86} {"train_loss": -6.400564193725586, "global_step": 14571, "epoch": 86} {"train_loss": -6.505406379699707, "global_step": 14572, "epoch": 86} {"train_loss": -6.349655628204346, "global_step": 14573, "epoch": 86} {"train_loss": -6.408065319061279, "global_step": 14574, "epoch": 86} {"train_loss": -6.378151893615723, "global_step": 14575, "epoch": 86} {"train_loss": -6.370272636413574, "global_step": 14576, "epoch": 86} {"train_loss": -6.479151248931885, "global_step": 14577, "epoch": 86} {"train_loss": -6.1908979415893555, "global_step": 14578, "epoch": 86} {"train_loss": -6.263303756713867, "global_step": 14579, "epoch": 86} {"train_loss": -6.40122127532959, "global_step": 14580, "epoch": 86} {"train_loss": -6.111013889312744, "global_step": 14581, "epoch": 86} {"train_loss": -6.164999961853027, "global_step": 14582, "epoch": 86} {"train_loss": -6.1276140213012695, "global_step": 14583, "epoch": 86} {"train_loss": -6.057789325714111, "global_step": 14584, "epoch": 86} {"train_loss": -6.42222785949707, "global_step": 14585, "epoch": 86} {"train_loss": -6.265993118286133, "global_step": 14586, "epoch": 86} {"train_loss": -6.150448799133301, "global_step": 14587, "epoch": 86} {"train_loss": -6.118809700012207, "global_step": 14588, "epoch": 86} {"train_loss": -6.064294815063477, "global_step": 14589, "epoch": 86} {"train_loss": -6.270429611206055, "global_step": 14590, "epoch": 86} {"train_loss": -6.140787601470947, "global_step": 14591, "epoch": 86} {"train_loss": -6.183123588562012, "global_step": 14592, "epoch": 86} {"train_loss": -6.056365966796875, "global_step": 14593, "epoch": 86} {"train_loss": -5.805026054382324, "global_step": 14594, "epoch": 86} {"train_loss": -6.094635963439941, "global_step": 14595, "epoch": 86} {"train_loss": -6.340856552124023, "global_step": 14596, "epoch": 86} {"train_loss": -6.268503189086914, "global_step": 14597, "epoch": 86} {"train_loss": -6.25917387008667, "global_step": 14598, "epoch": 86} {"train_loss": -6.339740753173828, "global_step": 14599, "epoch": 86} {"train_loss": -5.896823883056641, "global_step": 14600, "epoch": 86} {"train_loss": -6.353236198425293, "global_step": 14601, "epoch": 86} {"train_loss": -5.983892440795898, "global_step": 14602, "epoch": 86} {"train_loss": -6.293207168579102, "global_step": 14603, "epoch": 86} {"train_loss": -6.154526710510254, "global_step": 14604, "epoch": 86} {"train_loss": -6.405885219573975, "global_step": 14605, "epoch": 86} {"train_loss": -6.363134860992432, "global_step": 14606, "epoch": 86} {"train_loss": -6.466891288757324, "global_step": 14607, "epoch": 86} {"train_loss": -6.489901542663574, "global_step": 14608, "epoch": 86} {"train_loss": -6.210829734802246, "global_step": 14609, "epoch": 86} {"train_loss": -6.397916316986084, "global_step": 14610, "epoch": 86} {"train_loss": -6.499387741088867, "global_step": 14611, "epoch": 86} {"train_loss": -6.302216529846191, "global_step": 14612, "epoch": 86} {"train_loss": -6.373268127441406, "global_step": 14613, "epoch": 86} {"train_loss": -6.4291582107543945, "global_step": 14614, "epoch": 86} {"train_loss": -6.268401665346963, "global_step": 14615, "epoch": 86, "val_loss": 248491.015625} {"train_loss": -6.308618545532227, "global_step": 14616, "epoch": 87} {"train_loss": -6.33766508102417, "global_step": 14617, "epoch": 87} {"train_loss": -6.1927618980407715, "global_step": 14618, "epoch": 87} {"train_loss": -6.230128288269043, "global_step": 14619, "epoch": 87} {"train_loss": -6.29311990737915, "global_step": 14620, "epoch": 87} {"train_loss": -6.304910659790039, "global_step": 14621, "epoch": 87} {"train_loss": -6.066980361938477, "global_step": 14622, "epoch": 87} {"train_loss": -6.581981658935547, "global_step": 14623, "epoch": 87} {"train_loss": -6.254365921020508, "global_step": 14624, "epoch": 87} {"train_loss": -6.236347198486328, "global_step": 14625, "epoch": 87} {"train_loss": -6.247530937194824, "global_step": 14626, "epoch": 87} {"train_loss": -6.297054767608643, "global_step": 14627, "epoch": 87} {"train_loss": -6.260424613952637, "global_step": 14628, "epoch": 87} {"train_loss": -6.1716718673706055, "global_step": 14629, "epoch": 87} {"train_loss": -6.261599540710449, "global_step": 14630, "epoch": 87} {"train_loss": -6.436278343200684, "global_step": 14631, "epoch": 87} {"train_loss": -6.016456127166748, "global_step": 14632, "epoch": 87} {"train_loss": -6.280886650085449, "global_step": 14633, "epoch": 87} {"train_loss": -6.29646635055542, "global_step": 14634, "epoch": 87} {"train_loss": -6.492305755615234, "global_step": 14635, "epoch": 87} {"train_loss": -6.241769790649414, "global_step": 14636, "epoch": 87} {"train_loss": -6.207520961761475, "global_step": 14637, "epoch": 87} {"train_loss": -6.4309844970703125, "global_step": 14638, "epoch": 87} {"train_loss": -6.3827033042907715, "global_step": 14639, "epoch": 87} {"train_loss": -6.343876838684082, "global_step": 14640, "epoch": 87} {"train_loss": -6.618679046630859, "global_step": 14641, "epoch": 87} {"train_loss": -6.290965557098389, "global_step": 14642, "epoch": 87} {"train_loss": -6.106204032897949, "global_step": 14643, "epoch": 87} {"train_loss": -6.6444292068481445, "global_step": 14644, "epoch": 87} {"train_loss": -6.304807186126709, "global_step": 14645, "epoch": 87} {"train_loss": -6.441193103790283, "global_step": 14646, "epoch": 87} {"train_loss": -6.4973039627075195, "global_step": 14647, "epoch": 87} {"train_loss": -6.383904933929443, "global_step": 14648, "epoch": 87} {"train_loss": -6.502740859985352, "global_step": 14649, "epoch": 87} {"train_loss": -6.377873420715332, "global_step": 14650, "epoch": 87} {"train_loss": -6.233020782470703, "global_step": 14651, "epoch": 87} {"train_loss": -6.294818878173828, "global_step": 14652, "epoch": 87} {"train_loss": -6.168069839477539, "global_step": 14653, "epoch": 87} {"train_loss": -6.469321250915527, "global_step": 14654, "epoch": 87} {"train_loss": -6.182293891906738, "global_step": 14655, "epoch": 87} {"train_loss": -6.010137557983398, "global_step": 14656, "epoch": 87} {"train_loss": -6.361161231994629, "global_step": 14657, "epoch": 87} {"train_loss": -6.155271530151367, "global_step": 14658, "epoch": 87} {"train_loss": -6.234502792358398, "global_step": 14659, "epoch": 87} {"train_loss": -6.300907135009766, "global_step": 14660, "epoch": 87} {"train_loss": -6.221443176269531, "global_step": 14661, "epoch": 87} {"train_loss": -6.2878265380859375, "global_step": 14662, "epoch": 87} {"train_loss": -6.2986063957214355, "global_step": 14663, "epoch": 87} {"train_loss": -6.22943115234375, "global_step": 14664, "epoch": 87} {"train_loss": -6.441234588623047, "global_step": 14665, "epoch": 87} {"train_loss": -6.441459655761719, "global_step": 14666, "epoch": 87} {"train_loss": -6.345720291137695, "global_step": 14667, "epoch": 87} {"train_loss": -6.503652572631836, "global_step": 14668, "epoch": 87} {"train_loss": -6.267541885375977, "global_step": 14669, "epoch": 87} {"train_loss": -6.565263748168945, "global_step": 14670, "epoch": 87} {"train_loss": -6.251275062561035, "global_step": 14671, "epoch": 87} {"train_loss": -6.4094367027282715, "global_step": 14672, "epoch": 87} {"train_loss": -6.261150360107422, "global_step": 14673, "epoch": 87} {"train_loss": -6.406314849853516, "global_step": 14674, "epoch": 87} {"train_loss": -6.212085247039795, "global_step": 14675, "epoch": 87} {"train_loss": -6.4932756423950195, "global_step": 14676, "epoch": 87} {"train_loss": -6.2927374839782715, "global_step": 14677, "epoch": 87} {"train_loss": -6.383560657501221, "global_step": 14678, "epoch": 87} {"train_loss": -6.136626720428467, "global_step": 14679, "epoch": 87} {"train_loss": -6.209221839904785, "global_step": 14680, "epoch": 87} {"train_loss": -6.28640079498291, "global_step": 14681, "epoch": 87} {"train_loss": -6.3017988204956055, "global_step": 14682, "epoch": 87} {"train_loss": -6.2054643630981445, "global_step": 14683, "epoch": 87} {"train_loss": -6.256192684173584, "global_step": 14684, "epoch": 87} {"train_loss": -6.299141883850098, "global_step": 14685, "epoch": 87} {"train_loss": -6.568202495574951, "global_step": 14686, "epoch": 87} {"train_loss": -6.253036022186279, "global_step": 14687, "epoch": 87} {"train_loss": -6.359900951385498, "global_step": 14688, "epoch": 87} {"train_loss": -6.241764545440674, "global_step": 14689, "epoch": 87} {"train_loss": -6.246748924255371, "global_step": 14690, "epoch": 87} {"train_loss": -6.249865531921387, "global_step": 14691, "epoch": 87} {"train_loss": -6.395180702209473, "global_step": 14692, "epoch": 87} {"train_loss": -6.456371307373047, "global_step": 14693, "epoch": 87} {"train_loss": -6.3731465339660645, "global_step": 14694, "epoch": 87} {"train_loss": -6.275240898132324, "global_step": 14695, "epoch": 87} {"train_loss": -6.3346476554870605, "global_step": 14696, "epoch": 87} {"train_loss": -6.481909275054932, "global_step": 14697, "epoch": 87} {"train_loss": -6.213631629943848, "global_step": 14698, "epoch": 87} {"train_loss": -6.42219877243042, "global_step": 14699, "epoch": 87} {"train_loss": -6.519815444946289, "global_step": 14700, "epoch": 87} {"train_loss": -6.5333428382873535, "global_step": 14701, "epoch": 87} {"train_loss": -6.427218914031982, "global_step": 14702, "epoch": 87} {"train_loss": -6.602292537689209, "global_step": 14703, "epoch": 87} {"train_loss": -6.65285062789917, "global_step": 14704, "epoch": 87} {"train_loss": -6.506221771240234, "global_step": 14705, "epoch": 87} {"train_loss": -6.4950432777404785, "global_step": 14706, "epoch": 87} {"train_loss": -6.475473403930664, "global_step": 14707, "epoch": 87} {"train_loss": -6.183239936828613, "global_step": 14708, "epoch": 87} {"train_loss": -6.610165596008301, "global_step": 14709, "epoch": 87} {"train_loss": -6.3716349601745605, "global_step": 14710, "epoch": 87} {"train_loss": -6.4848198890686035, "global_step": 14711, "epoch": 87} {"train_loss": -6.554174423217773, "global_step": 14712, "epoch": 87} {"train_loss": -6.272454738616943, "global_step": 14713, "epoch": 87} {"train_loss": -6.383868217468262, "global_step": 14714, "epoch": 87} {"train_loss": -6.493703842163086, "global_step": 14715, "epoch": 87} {"train_loss": -6.405489921569824, "global_step": 14716, "epoch": 87} {"train_loss": -6.492542266845703, "global_step": 14717, "epoch": 87} {"train_loss": -6.580748558044434, "global_step": 14718, "epoch": 87} {"train_loss": -6.368593692779541, "global_step": 14719, "epoch": 87} {"train_loss": -6.364696502685547, "global_step": 14720, "epoch": 87} {"train_loss": -6.294339656829834, "global_step": 14721, "epoch": 87} {"train_loss": -6.415398597717285, "global_step": 14722, "epoch": 87} {"train_loss": -6.060267448425293, "global_step": 14723, "epoch": 87} {"train_loss": -6.393771171569824, "global_step": 14724, "epoch": 87} {"train_loss": -6.2281107902526855, "global_step": 14725, "epoch": 87} {"train_loss": -6.219069957733154, "global_step": 14726, "epoch": 87} {"train_loss": -6.124725818634033, "global_step": 14727, "epoch": 87} {"train_loss": -6.014960289001465, "global_step": 14728, "epoch": 87} {"train_loss": -6.368646621704102, "global_step": 14729, "epoch": 87} {"train_loss": -5.976428031921387, "global_step": 14730, "epoch": 87} {"train_loss": -6.18955135345459, "global_step": 14731, "epoch": 87} {"train_loss": -5.941872596740723, "global_step": 14732, "epoch": 87} {"train_loss": -5.953573226928711, "global_step": 14733, "epoch": 87} {"train_loss": -6.022826671600342, "global_step": 14734, "epoch": 87} {"train_loss": -5.884914398193359, "global_step": 14735, "epoch": 87} {"train_loss": -6.194202899932861, "global_step": 14736, "epoch": 87} {"train_loss": -6.041600227355957, "global_step": 14737, "epoch": 87} {"train_loss": -6.078834533691406, "global_step": 14738, "epoch": 87} {"train_loss": -6.0742387771606445, "global_step": 14739, "epoch": 87} {"train_loss": -6.029640197753906, "global_step": 14740, "epoch": 87} {"train_loss": -5.97703742980957, "global_step": 14741, "epoch": 87} {"train_loss": -6.377079963684082, "global_step": 14742, "epoch": 87} {"train_loss": -5.993712902069092, "global_step": 14743, "epoch": 87} {"train_loss": -6.351753234863281, "global_step": 14744, "epoch": 87} {"train_loss": -6.051658630371094, "global_step": 14745, "epoch": 87} {"train_loss": -6.135890483856201, "global_step": 14746, "epoch": 87} {"train_loss": -6.348515033721924, "global_step": 14747, "epoch": 87} {"train_loss": -6.3042497634887695, "global_step": 14748, "epoch": 87} {"train_loss": -6.075760841369629, "global_step": 14749, "epoch": 87} {"train_loss": -6.322242736816406, "global_step": 14750, "epoch": 87} {"train_loss": -6.171316146850586, "global_step": 14751, "epoch": 87} {"train_loss": -6.427884101867676, "global_step": 14752, "epoch": 87} {"train_loss": -6.471522331237793, "global_step": 14753, "epoch": 87} {"train_loss": -6.393364429473877, "global_step": 14754, "epoch": 87} {"train_loss": -6.154078483581543, "global_step": 14755, "epoch": 87} {"train_loss": -6.234955787658691, "global_step": 14756, "epoch": 87} {"train_loss": -6.0709967613220215, "global_step": 14757, "epoch": 87} {"train_loss": -6.432126045227051, "global_step": 14758, "epoch": 87} {"train_loss": -6.505159378051758, "global_step": 14759, "epoch": 87} {"train_loss": -6.431707382202148, "global_step": 14760, "epoch": 87} {"train_loss": -6.426387786865234, "global_step": 14761, "epoch": 87} {"train_loss": -6.126622200012207, "global_step": 14762, "epoch": 87} {"train_loss": -5.9916911125183105, "global_step": 14763, "epoch": 87} {"train_loss": -6.487271308898926, "global_step": 14764, "epoch": 87} {"train_loss": -6.305407524108887, "global_step": 14765, "epoch": 87} {"train_loss": -6.316417694091797, "global_step": 14766, "epoch": 87} {"train_loss": -6.385199546813965, "global_step": 14767, "epoch": 87} {"train_loss": -6.501192092895508, "global_step": 14768, "epoch": 87} {"train_loss": -6.374691963195801, "global_step": 14769, "epoch": 87} {"train_loss": -6.329567909240723, "global_step": 14770, "epoch": 87} {"train_loss": -6.224766254425049, "global_step": 14771, "epoch": 87} {"train_loss": -6.374727249145508, "global_step": 14772, "epoch": 87} {"train_loss": -6.070135116577148, "global_step": 14773, "epoch": 87} {"train_loss": -6.0618205070495605, "global_step": 14774, "epoch": 87} {"train_loss": -6.1885085105896, "global_step": 14775, "epoch": 87} {"train_loss": -6.423159599304199, "global_step": 14776, "epoch": 87} {"train_loss": -6.351235389709473, "global_step": 14777, "epoch": 87} {"train_loss": -6.304486274719238, "global_step": 14778, "epoch": 87} {"train_loss": -6.431210517883301, "global_step": 14779, "epoch": 87} {"train_loss": -6.405368804931641, "global_step": 14780, "epoch": 87} {"train_loss": -6.671306610107422, "global_step": 14781, "epoch": 87} {"train_loss": -6.292677879333496, "global_step": 14782, "epoch": 87} {"train_loss": -6.305343457630703, "global_step": 14783, "epoch": 87, "val_loss": 251693.671875} {"train_loss": -6.3277716636657715, "global_step": 14784, "epoch": 88} {"train_loss": -6.498715400695801, "global_step": 14785, "epoch": 88} {"train_loss": -6.147947788238525, "global_step": 14786, "epoch": 88} {"train_loss": -6.46278190612793, "global_step": 14787, "epoch": 88} {"train_loss": -6.173895359039307, "global_step": 14788, "epoch": 88} {"train_loss": -6.4172492027282715, "global_step": 14789, "epoch": 88} {"train_loss": -6.3698835372924805, "global_step": 14790, "epoch": 88} {"train_loss": -5.926521301269531, "global_step": 14791, "epoch": 88} {"train_loss": -6.193807601928711, "global_step": 14792, "epoch": 88} {"train_loss": -6.050982475280762, "global_step": 14793, "epoch": 88} {"train_loss": -6.412580490112305, "global_step": 14794, "epoch": 88} {"train_loss": -6.00933837890625, "global_step": 14795, "epoch": 88} {"train_loss": -6.21706485748291, "global_step": 14796, "epoch": 88} {"train_loss": -6.470139980316162, "global_step": 14797, "epoch": 88} {"train_loss": -6.077081680297852, "global_step": 14798, "epoch": 88} {"train_loss": -6.291367530822754, "global_step": 14799, "epoch": 88} {"train_loss": -6.34755802154541, "global_step": 14800, "epoch": 88} {"train_loss": -6.412288665771484, "global_step": 14801, "epoch": 88} {"train_loss": -6.282055377960205, "global_step": 14802, "epoch": 88} {"train_loss": -6.418460845947266, "global_step": 14803, "epoch": 88} {"train_loss": -6.249938488006592, "global_step": 14804, "epoch": 88} {"train_loss": -6.405752658843994, "global_step": 14805, "epoch": 88} {"train_loss": -6.4165568351745605, "global_step": 14806, "epoch": 88} {"train_loss": -6.290726661682129, "global_step": 14807, "epoch": 88} {"train_loss": -6.392574310302734, "global_step": 14808, "epoch": 88} {"train_loss": -6.240445137023926, "global_step": 14809, "epoch": 88} {"train_loss": -6.609055519104004, "global_step": 14810, "epoch": 88} {"train_loss": -6.626690864562988, "global_step": 14811, "epoch": 88} {"train_loss": -6.616707801818848, "global_step": 14812, "epoch": 88} {"train_loss": -6.415410041809082, "global_step": 14813, "epoch": 88} {"train_loss": -6.384328842163086, "global_step": 14814, "epoch": 88} {"train_loss": -6.371294021606445, "global_step": 14815, "epoch": 88} {"train_loss": -6.538703441619873, "global_step": 14816, "epoch": 88} {"train_loss": -6.5366926193237305, "global_step": 14817, "epoch": 88} {"train_loss": -6.339763164520264, "global_step": 14818, "epoch": 88} {"train_loss": -6.370418071746826, "global_step": 14819, "epoch": 88} {"train_loss": -6.177569389343262, "global_step": 14820, "epoch": 88} {"train_loss": -5.874645233154297, "global_step": 14821, "epoch": 88} {"train_loss": -6.265604019165039, "global_step": 14822, "epoch": 88} {"train_loss": -6.397060394287109, "global_step": 14823, "epoch": 88} {"train_loss": -6.287471771240234, "global_step": 14824, "epoch": 88} {"train_loss": -6.01987361907959, "global_step": 14825, "epoch": 88} {"train_loss": -6.38944149017334, "global_step": 14826, "epoch": 88} {"train_loss": -6.170368194580078, "global_step": 14827, "epoch": 88} {"train_loss": -6.401241779327393, "global_step": 14828, "epoch": 88} {"train_loss": -6.050974369049072, "global_step": 14829, "epoch": 88} {"train_loss": -6.383419513702393, "global_step": 14830, "epoch": 88} {"train_loss": -6.225334167480469, "global_step": 14831, "epoch": 88} {"train_loss": -6.180965900421143, "global_step": 14832, "epoch": 88} {"train_loss": -6.172046661376953, "global_step": 14833, "epoch": 88} {"train_loss": -6.256938934326172, "global_step": 14834, "epoch": 88} {"train_loss": -6.1616010665893555, "global_step": 14835, "epoch": 88} {"train_loss": -6.145583152770996, "global_step": 14836, "epoch": 88} {"train_loss": -6.423037528991699, "global_step": 14837, "epoch": 88} {"train_loss": -6.127383708953857, "global_step": 14838, "epoch": 88} {"train_loss": -6.330648422241211, "global_step": 14839, "epoch": 88} {"train_loss": -6.244294166564941, "global_step": 14840, "epoch": 88} {"train_loss": -6.399914741516113, "global_step": 14841, "epoch": 88} {"train_loss": -6.517602920532227, "global_step": 14842, "epoch": 88} {"train_loss": -6.291032314300537, "global_step": 14843, "epoch": 88} {"train_loss": -6.494774341583252, "global_step": 14844, "epoch": 88} {"train_loss": -6.349982738494873, "global_step": 14845, "epoch": 88} {"train_loss": -6.604862213134766, "global_step": 14846, "epoch": 88} {"train_loss": -6.389671325683594, "global_step": 14847, "epoch": 88} {"train_loss": -6.171987533569336, "global_step": 14848, "epoch": 88} {"train_loss": -6.434037208557129, "global_step": 14849, "epoch": 88} {"train_loss": -6.252545356750488, "global_step": 14850, "epoch": 88} {"train_loss": -6.403866291046143, "global_step": 14851, "epoch": 88} {"train_loss": -6.204830646514893, "global_step": 14852, "epoch": 88} {"train_loss": -6.2948126792907715, "global_step": 14853, "epoch": 88} {"train_loss": -6.340291500091553, "global_step": 14854, "epoch": 88} {"train_loss": -6.282349586486816, "global_step": 14855, "epoch": 88} {"train_loss": -6.239742279052734, "global_step": 14856, "epoch": 88} {"train_loss": -6.075616836547852, "global_step": 14857, "epoch": 88} {"train_loss": -6.532472610473633, "global_step": 14858, "epoch": 88} {"train_loss": -6.444079399108887, "global_step": 14859, "epoch": 88} {"train_loss": -6.3889031410217285, "global_step": 14860, "epoch": 88} {"train_loss": -6.257673740386963, "global_step": 14861, "epoch": 88} {"train_loss": -5.9918060302734375, "global_step": 14862, "epoch": 88} {"train_loss": -6.491257667541504, "global_step": 14863, "epoch": 88} {"train_loss": -5.829799652099609, "global_step": 14864, "epoch": 88} {"train_loss": -6.18861198425293, "global_step": 14865, "epoch": 88} {"train_loss": -6.1911234855651855, "global_step": 14866, "epoch": 88} {"train_loss": -6.469437599182129, "global_step": 14867, "epoch": 88} {"train_loss": -6.545821189880371, "global_step": 14868, "epoch": 88} {"train_loss": -6.398275375366211, "global_step": 14869, "epoch": 88} {"train_loss": -6.354554653167725, "global_step": 14870, "epoch": 88} {"train_loss": -6.443115234375, "global_step": 14871, "epoch": 88} {"train_loss": -6.134198188781738, "global_step": 14872, "epoch": 88} {"train_loss": -6.307666778564453, "global_step": 14873, "epoch": 88} {"train_loss": -6.12226676940918, "global_step": 14874, "epoch": 88} {"train_loss": -6.188745498657227, "global_step": 14875, "epoch": 88} {"train_loss": -6.048192977905273, "global_step": 14876, "epoch": 88} {"train_loss": -6.234295845031738, "global_step": 14877, "epoch": 88} {"train_loss": -6.239401817321777, "global_step": 14878, "epoch": 88} {"train_loss": -6.424012660980225, "global_step": 14879, "epoch": 88} {"train_loss": -6.2718424797058105, "global_step": 14880, "epoch": 88} {"train_loss": -6.351648807525635, "global_step": 14881, "epoch": 88} {"train_loss": -6.24678897857666, "global_step": 14882, "epoch": 88} {"train_loss": -6.157644271850586, "global_step": 14883, "epoch": 88} {"train_loss": -6.18755578994751, "global_step": 14884, "epoch": 88} {"train_loss": -6.12100887298584, "global_step": 14885, "epoch": 88} {"train_loss": -6.239123344421387, "global_step": 14886, "epoch": 88} {"train_loss": -6.21712589263916, "global_step": 14887, "epoch": 88} {"train_loss": -5.819015026092529, "global_step": 14888, "epoch": 88} {"train_loss": -6.3098673820495605, "global_step": 14889, "epoch": 88} {"train_loss": -6.1194963455200195, "global_step": 14890, "epoch": 88} {"train_loss": -6.153172492980957, "global_step": 14891, "epoch": 88} {"train_loss": -6.292963981628418, "global_step": 14892, "epoch": 88} {"train_loss": -6.124591827392578, "global_step": 14893, "epoch": 88} {"train_loss": -6.252133369445801, "global_step": 14894, "epoch": 88} {"train_loss": -6.340991973876953, "global_step": 14895, "epoch": 88} {"train_loss": -6.059348106384277, "global_step": 14896, "epoch": 88} {"train_loss": -6.185052871704102, "global_step": 14897, "epoch": 88} {"train_loss": -6.15715217590332, "global_step": 14898, "epoch": 88} {"train_loss": -6.3766326904296875, "global_step": 14899, "epoch": 88} {"train_loss": -6.43245792388916, "global_step": 14900, "epoch": 88} {"train_loss": -6.182455539703369, "global_step": 14901, "epoch": 88} {"train_loss": -6.275506019592285, "global_step": 14902, "epoch": 88} {"train_loss": -6.306517124176025, "global_step": 14903, "epoch": 88} {"train_loss": -6.385293960571289, "global_step": 14904, "epoch": 88} {"train_loss": -6.292108535766602, "global_step": 14905, "epoch": 88} {"train_loss": -6.231808185577393, "global_step": 14906, "epoch": 88} {"train_loss": -5.996345043182373, "global_step": 14907, "epoch": 88} {"train_loss": -6.534234046936035, "global_step": 14908, "epoch": 88} {"train_loss": -6.4062089920043945, "global_step": 14909, "epoch": 88} {"train_loss": -6.284747123718262, "global_step": 14910, "epoch": 88} {"train_loss": -6.407144546508789, "global_step": 14911, "epoch": 88} {"train_loss": -6.314719200134277, "global_step": 14912, "epoch": 88} {"train_loss": -6.3264875411987305, "global_step": 14913, "epoch": 88} {"train_loss": -6.108941078186035, "global_step": 14914, "epoch": 88} {"train_loss": -6.487985610961914, "global_step": 14915, "epoch": 88} {"train_loss": -6.207596778869629, "global_step": 14916, "epoch": 88} {"train_loss": -6.395102500915527, "global_step": 14917, "epoch": 88} {"train_loss": -6.146714210510254, "global_step": 14918, "epoch": 88} {"train_loss": -6.311656951904297, "global_step": 14919, "epoch": 88} {"train_loss": -6.466670513153076, "global_step": 14920, "epoch": 88} {"train_loss": -6.2507734298706055, "global_step": 14921, "epoch": 88} {"train_loss": -6.2448272705078125, "global_step": 14922, "epoch": 88} {"train_loss": -5.9788312911987305, "global_step": 14923, "epoch": 88} {"train_loss": -6.6987481117248535, "global_step": 14924, "epoch": 88} {"train_loss": -6.341737747192383, "global_step": 14925, "epoch": 88} {"train_loss": -6.371002674102783, "global_step": 14926, "epoch": 88} {"train_loss": -6.13930606842041, "global_step": 14927, "epoch": 88} {"train_loss": -6.339975357055664, "global_step": 14928, "epoch": 88} {"train_loss": -6.057703971862793, "global_step": 14929, "epoch": 88} {"train_loss": -6.364866733551025, "global_step": 14930, "epoch": 88} {"train_loss": -6.368339538574219, "global_step": 14931, "epoch": 88} {"train_loss": -6.169233322143555, "global_step": 14932, "epoch": 88} {"train_loss": -6.545732498168945, "global_step": 14933, "epoch": 88} {"train_loss": -6.5317559242248535, "global_step": 14934, "epoch": 88} {"train_loss": -6.464825630187988, "global_step": 14935, "epoch": 88} {"train_loss": -6.451623916625977, "global_step": 14936, "epoch": 88} {"train_loss": -6.449369430541992, "global_step": 14937, "epoch": 88} {"train_loss": -6.543702125549316, "global_step": 14938, "epoch": 88} {"train_loss": -6.310041904449463, "global_step": 14939, "epoch": 88} {"train_loss": -6.3185529708862305, "global_step": 14940, "epoch": 88} {"train_loss": -6.410600662231445, "global_step": 14941, "epoch": 88} {"train_loss": -6.561419486999512, "global_step": 14942, "epoch": 88} {"train_loss": -6.6042938232421875, "global_step": 14943, "epoch": 88} {"train_loss": -6.515556335449219, "global_step": 14944, "epoch": 88} {"train_loss": -6.339323997497559, "global_step": 14945, "epoch": 88} {"train_loss": -6.307872772216797, "global_step": 14946, "epoch": 88} {"train_loss": -6.2566351890563965, "global_step": 14947, "epoch": 88} {"train_loss": -5.986176490783691, "global_step": 14948, "epoch": 88} {"train_loss": -6.175275802612305, "global_step": 14949, "epoch": 88} {"train_loss": -6.228455066680908, "global_step": 14950, "epoch": 88} {"train_loss": -6.298234942413512, "global_step": 14951, "epoch": 88, "val_loss": 241507.203125} {"train_loss": -6.365978240966797, "global_step": 14952, "epoch": 89} {"train_loss": -6.31178092956543, "global_step": 14953, "epoch": 89} {"train_loss": -6.297918319702148, "global_step": 14954, "epoch": 89} {"train_loss": -6.424233436584473, "global_step": 14955, "epoch": 89} {"train_loss": -5.934447288513184, "global_step": 14956, "epoch": 89} {"train_loss": -6.454361915588379, "global_step": 14957, "epoch": 89} {"train_loss": -6.448976516723633, "global_step": 14958, "epoch": 89} {"train_loss": -6.465341567993164, "global_step": 14959, "epoch": 89} {"train_loss": -6.355426788330078, "global_step": 14960, "epoch": 89} {"train_loss": -6.522195816040039, "global_step": 14961, "epoch": 89} {"train_loss": -6.142395973205566, "global_step": 14962, "epoch": 89} {"train_loss": -6.358573913574219, "global_step": 14963, "epoch": 89} {"train_loss": -6.16908073425293, "global_step": 14964, "epoch": 89} {"train_loss": -6.394017219543457, "global_step": 14965, "epoch": 89} {"train_loss": -6.217392921447754, "global_step": 14966, "epoch": 89} {"train_loss": -6.212407112121582, "global_step": 14967, "epoch": 89} {"train_loss": -6.270063400268555, "global_step": 14968, "epoch": 89} {"train_loss": -6.38259220123291, "global_step": 14969, "epoch": 89} {"train_loss": -5.912210464477539, "global_step": 14970, "epoch": 89} {"train_loss": -6.321521282196045, "global_step": 14971, "epoch": 89} {"train_loss": -6.2164835929870605, "global_step": 14972, "epoch": 89} {"train_loss": -6.25894021987915, "global_step": 14973, "epoch": 89} {"train_loss": -6.350049018859863, "global_step": 14974, "epoch": 89} {"train_loss": -6.134524345397949, "global_step": 14975, "epoch": 89} {"train_loss": -6.330235481262207, "global_step": 14976, "epoch": 89} {"train_loss": -6.358078956604004, "global_step": 14977, "epoch": 89} {"train_loss": -6.385311126708984, "global_step": 14978, "epoch": 89} {"train_loss": -6.156184673309326, "global_step": 14979, "epoch": 89} {"train_loss": -6.481238842010498, "global_step": 14980, "epoch": 89} {"train_loss": -6.453482151031494, "global_step": 14981, "epoch": 89} {"train_loss": -6.458518028259277, "global_step": 14982, "epoch": 89} {"train_loss": -6.367311477661133, "global_step": 14983, "epoch": 89} {"train_loss": -6.380454063415527, "global_step": 14984, "epoch": 89} {"train_loss": -6.685094356536865, "global_step": 14985, "epoch": 89} {"train_loss": -6.351871967315674, "global_step": 14986, "epoch": 89} {"train_loss": -6.002816677093506, "global_step": 14987, "epoch": 89} {"train_loss": -6.274336814880371, "global_step": 14988, "epoch": 89} {"train_loss": -6.214804649353027, "global_step": 14989, "epoch": 89} {"train_loss": -6.063069820404053, "global_step": 14990, "epoch": 89} {"train_loss": -6.241665840148926, "global_step": 14991, "epoch": 89} {"train_loss": -6.301841735839844, "global_step": 14992, "epoch": 89} {"train_loss": -6.5743727684021, "global_step": 14993, "epoch": 89} {"train_loss": -6.213793754577637, "global_step": 14994, "epoch": 89} {"train_loss": -6.2761054039001465, "global_step": 14995, "epoch": 89} {"train_loss": -6.259904861450195, "global_step": 14996, "epoch": 89} {"train_loss": -6.173135757446289, "global_step": 14997, "epoch": 89} {"train_loss": -6.490545272827148, "global_step": 14998, "epoch": 89} {"train_loss": -6.335453033447266, "global_step": 14999, "epoch": 89} {"train_loss": -6.101061820983887, "global_step": 15000, "epoch": 89} {"train_loss": -6.517310619354248, "global_step": 15001, "epoch": 89} {"train_loss": -6.446599960327148, "global_step": 15002, "epoch": 89} {"train_loss": -6.424592018127441, "global_step": 15003, "epoch": 89} {"train_loss": -6.117132663726807, "global_step": 15004, "epoch": 89} {"train_loss": -6.634791374206543, "global_step": 15005, "epoch": 89} {"train_loss": -6.180977821350098, "global_step": 15006, "epoch": 89} {"train_loss": -6.195854187011719, "global_step": 15007, "epoch": 89} {"train_loss": -6.486640930175781, "global_step": 15008, "epoch": 89} {"train_loss": -6.330503463745117, "global_step": 15009, "epoch": 89} {"train_loss": -6.374027729034424, "global_step": 15010, "epoch": 89} {"train_loss": -6.416572570800781, "global_step": 15011, "epoch": 89} {"train_loss": -6.367484092712402, "global_step": 15012, "epoch": 89} {"train_loss": -6.217244625091553, "global_step": 15013, "epoch": 89} {"train_loss": -6.524374961853027, "global_step": 15014, "epoch": 89} {"train_loss": -6.411123275756836, "global_step": 15015, "epoch": 89} {"train_loss": -6.3876752853393555, "global_step": 15016, "epoch": 89} {"train_loss": -6.303701400756836, "global_step": 15017, "epoch": 89} {"train_loss": -6.167904853820801, "global_step": 15018, "epoch": 89} {"train_loss": -6.556066036224365, "global_step": 15019, "epoch": 89} {"train_loss": -6.272810935974121, "global_step": 15020, "epoch": 89} {"train_loss": -6.049513816833496, "global_step": 15021, "epoch": 89} {"train_loss": -6.168999671936035, "global_step": 15022, "epoch": 89} {"train_loss": -6.342039108276367, "global_step": 15023, "epoch": 89} {"train_loss": -6.393906593322754, "global_step": 15024, "epoch": 89} {"train_loss": -6.1798834800720215, "global_step": 15025, "epoch": 89} {"train_loss": -6.368518829345703, "global_step": 15026, "epoch": 89} {"train_loss": -6.249357223510742, "global_step": 15027, "epoch": 89} {"train_loss": -6.190563201904297, "global_step": 15028, "epoch": 89} {"train_loss": -6.440291404724121, "global_step": 15029, "epoch": 89} {"train_loss": -6.310554504394531, "global_step": 15030, "epoch": 89} {"train_loss": -6.15537166595459, "global_step": 15031, "epoch": 89} {"train_loss": -6.360476493835449, "global_step": 15032, "epoch": 89} {"train_loss": -6.29550313949585, "global_step": 15033, "epoch": 89} {"train_loss": -6.247696876525879, "global_step": 15034, "epoch": 89} {"train_loss": -6.378491401672363, "global_step": 15035, "epoch": 89} {"train_loss": -6.658359527587891, "global_step": 15036, "epoch": 89} {"train_loss": -6.27895450592041, "global_step": 15037, "epoch": 89} {"train_loss": -6.000471115112305, "global_step": 15038, "epoch": 89} {"train_loss": -6.441922187805176, "global_step": 15039, "epoch": 89} {"train_loss": -6.462867736816406, "global_step": 15040, "epoch": 89} {"train_loss": -6.533904552459717, "global_step": 15041, "epoch": 89} {"train_loss": -6.215914726257324, "global_step": 15042, "epoch": 89} {"train_loss": -6.346729278564453, "global_step": 15043, "epoch": 89} {"train_loss": -6.369460105895996, "global_step": 15044, "epoch": 89} {"train_loss": -6.352461814880371, "global_step": 15045, "epoch": 89} {"train_loss": -6.194021224975586, "global_step": 15046, "epoch": 89} {"train_loss": -6.483066558837891, "global_step": 15047, "epoch": 89} {"train_loss": -6.07029914855957, "global_step": 15048, "epoch": 89} {"train_loss": -6.418910980224609, "global_step": 15049, "epoch": 89} {"train_loss": -6.282243251800537, "global_step": 15050, "epoch": 89} {"train_loss": -6.329526901245117, "global_step": 15051, "epoch": 89} {"train_loss": -6.610647678375244, "global_step": 15052, "epoch": 89} {"train_loss": -6.480049133300781, "global_step": 15053, "epoch": 89} {"train_loss": -6.428794860839844, "global_step": 15054, "epoch": 89} {"train_loss": -6.442928314208984, "global_step": 15055, "epoch": 89} {"train_loss": -6.323787689208984, "global_step": 15056, "epoch": 89} {"train_loss": -6.578015327453613, "global_step": 15057, "epoch": 89} {"train_loss": -6.186779499053955, "global_step": 15058, "epoch": 89} {"train_loss": -6.481593132019043, "global_step": 15059, "epoch": 89} {"train_loss": -6.411846160888672, "global_step": 15060, "epoch": 89} {"train_loss": -6.2074995040893555, "global_step": 15061, "epoch": 89} {"train_loss": -6.467569351196289, "global_step": 15062, "epoch": 89} {"train_loss": -6.204416751861572, "global_step": 15063, "epoch": 89} {"train_loss": -6.326482772827148, "global_step": 15064, "epoch": 89} {"train_loss": -6.285391807556152, "global_step": 15065, "epoch": 89} {"train_loss": -6.344581604003906, "global_step": 15066, "epoch": 89} {"train_loss": -6.281101226806641, "global_step": 15067, "epoch": 89} {"train_loss": -6.288450717926025, "global_step": 15068, "epoch": 89} {"train_loss": -6.233660697937012, "global_step": 15069, "epoch": 89} {"train_loss": -6.2456254959106445, "global_step": 15070, "epoch": 89} {"train_loss": -6.35125732421875, "global_step": 15071, "epoch": 89} {"train_loss": -6.327267646789551, "global_step": 15072, "epoch": 89} {"train_loss": -6.378325462341309, "global_step": 15073, "epoch": 89} {"train_loss": -6.27808952331543, "global_step": 15074, "epoch": 89} {"train_loss": -6.485610008239746, "global_step": 15075, "epoch": 89} {"train_loss": -6.274574279785156, "global_step": 15076, "epoch": 89} {"train_loss": -6.335502624511719, "global_step": 15077, "epoch": 89} {"train_loss": -6.193601131439209, "global_step": 15078, "epoch": 89} {"train_loss": -6.3617706298828125, "global_step": 15079, "epoch": 89} {"train_loss": -6.53642463684082, "global_step": 15080, "epoch": 89} {"train_loss": -6.06541633605957, "global_step": 15081, "epoch": 89} {"train_loss": -6.342685222625732, "global_step": 15082, "epoch": 89} {"train_loss": -6.449834823608398, "global_step": 15083, "epoch": 89} {"train_loss": -6.4666948318481445, "global_step": 15084, "epoch": 89} {"train_loss": -6.462032318115234, "global_step": 15085, "epoch": 89} {"train_loss": -6.510199069976807, "global_step": 15086, "epoch": 89} {"train_loss": -6.42910623550415, "global_step": 15087, "epoch": 89} {"train_loss": -6.441022872924805, "global_step": 15088, "epoch": 89} {"train_loss": -6.445855140686035, "global_step": 15089, "epoch": 89} {"train_loss": -6.355652809143066, "global_step": 15090, "epoch": 89} {"train_loss": -6.386232852935791, "global_step": 15091, "epoch": 89} {"train_loss": -6.653262138366699, "global_step": 15092, "epoch": 89} {"train_loss": -6.578795433044434, "global_step": 15093, "epoch": 89} {"train_loss": -6.435218811035156, "global_step": 15094, "epoch": 89} {"train_loss": -6.842243671417236, "global_step": 15095, "epoch": 89} {"train_loss": -6.387250900268555, "global_step": 15096, "epoch": 89} {"train_loss": -6.669135093688965, "global_step": 15097, "epoch": 89} {"train_loss": -6.646627426147461, "global_step": 15098, "epoch": 89} {"train_loss": -6.402646064758301, "global_step": 15099, "epoch": 89} {"train_loss": -6.092778205871582, "global_step": 15100, "epoch": 89} {"train_loss": -6.49234676361084, "global_step": 15101, "epoch": 89} {"train_loss": -6.440094947814941, "global_step": 15102, "epoch": 89} {"train_loss": -6.357853889465332, "global_step": 15103, "epoch": 89} {"train_loss": -6.317682266235352, "global_step": 15104, "epoch": 89} {"train_loss": -6.167191028594971, "global_step": 15105, "epoch": 89} {"train_loss": -6.213069915771484, "global_step": 15106, "epoch": 89} {"train_loss": -6.257983207702637, "global_step": 15107, "epoch": 89} {"train_loss": -6.244525909423828, "global_step": 15108, "epoch": 89} {"train_loss": -6.284924507141113, "global_step": 15109, "epoch": 89} {"train_loss": -6.2921600341796875, "global_step": 15110, "epoch": 89} {"train_loss": -6.226095199584961, "global_step": 15111, "epoch": 89} {"train_loss": -6.263743877410889, "global_step": 15112, "epoch": 89} {"train_loss": -6.239426612854004, "global_step": 15113, "epoch": 89} {"train_loss": -6.179380416870117, "global_step": 15114, "epoch": 89} {"train_loss": -6.351033687591553, "global_step": 15115, "epoch": 89} {"train_loss": -6.085679531097412, "global_step": 15116, "epoch": 89} {"train_loss": -6.271873950958252, "global_step": 15117, "epoch": 89} {"train_loss": -6.142288684844971, "global_step": 15118, "epoch": 89} {"train_loss": -6.334428344454084, "global_step": 15119, "epoch": 89, "val_loss": 240539.015625} {"train_loss": -6.2895708084106445, "global_step": 15120, "epoch": 90} {"train_loss": -6.380348205566406, "global_step": 15121, "epoch": 90} {"train_loss": -6.417794227600098, "global_step": 15122, "epoch": 90} {"train_loss": -6.431385517120361, "global_step": 15123, "epoch": 90} {"train_loss": -6.282121658325195, "global_step": 15124, "epoch": 90} {"train_loss": -6.497082710266113, "global_step": 15125, "epoch": 90} {"train_loss": -6.448963642120361, "global_step": 15126, "epoch": 90} {"train_loss": -6.424046993255615, "global_step": 15127, "epoch": 90} {"train_loss": -6.010552406311035, "global_step": 15128, "epoch": 90} {"train_loss": -6.459416389465332, "global_step": 15129, "epoch": 90} {"train_loss": -6.469686985015869, "global_step": 15130, "epoch": 90} {"train_loss": -6.447042465209961, "global_step": 15131, "epoch": 90} {"train_loss": -6.385040283203125, "global_step": 15132, "epoch": 90} {"train_loss": -6.323083877563477, "global_step": 15133, "epoch": 90} {"train_loss": -5.844626426696777, "global_step": 15134, "epoch": 90} {"train_loss": -6.239400386810303, "global_step": 15135, "epoch": 90} {"train_loss": -6.337786674499512, "global_step": 15136, "epoch": 90} {"train_loss": -6.369192123413086, "global_step": 15137, "epoch": 90} {"train_loss": -5.97382926940918, "global_step": 15138, "epoch": 90} {"train_loss": -6.103249549865723, "global_step": 15139, "epoch": 90} {"train_loss": -6.187392234802246, "global_step": 15140, "epoch": 90} {"train_loss": -6.041324615478516, "global_step": 15141, "epoch": 90} {"train_loss": -6.195058822631836, "global_step": 15142, "epoch": 90} {"train_loss": -6.192956924438477, "global_step": 15143, "epoch": 90} {"train_loss": -6.45546817779541, "global_step": 15144, "epoch": 90} {"train_loss": -6.391153335571289, "global_step": 15145, "epoch": 90} {"train_loss": -6.1337890625, "global_step": 15146, "epoch": 90} {"train_loss": -6.393486022949219, "global_step": 15147, "epoch": 90} {"train_loss": -6.422574996948242, "global_step": 15148, "epoch": 90} {"train_loss": -6.403203010559082, "global_step": 15149, "epoch": 90} {"train_loss": -6.298516273498535, "global_step": 15150, "epoch": 90} {"train_loss": -6.278543949127197, "global_step": 15151, "epoch": 90} {"train_loss": -6.409981727600098, "global_step": 15152, "epoch": 90} {"train_loss": -6.57680606842041, "global_step": 15153, "epoch": 90} {"train_loss": -6.095658302307129, "global_step": 15154, "epoch": 90} {"train_loss": -6.364358901977539, "global_step": 15155, "epoch": 90} {"train_loss": -6.335859298706055, "global_step": 15156, "epoch": 90} {"train_loss": -6.262423992156982, "global_step": 15157, "epoch": 90} {"train_loss": -6.3152923583984375, "global_step": 15158, "epoch": 90} {"train_loss": -6.522058010101318, "global_step": 15159, "epoch": 90} {"train_loss": -6.303413391113281, "global_step": 15160, "epoch": 90} {"train_loss": -6.112627983093262, "global_step": 15161, "epoch": 90} {"train_loss": -6.159407615661621, "global_step": 15162, "epoch": 90} {"train_loss": -6.2840728759765625, "global_step": 15163, "epoch": 90} {"train_loss": -6.212177753448486, "global_step": 15164, "epoch": 90} {"train_loss": -6.313515663146973, "global_step": 15165, "epoch": 90} {"train_loss": -6.119688034057617, "global_step": 15166, "epoch": 90} {"train_loss": -6.294521331787109, "global_step": 15167, "epoch": 90} {"train_loss": -5.9910359382629395, "global_step": 15168, "epoch": 90} {"train_loss": -6.225958347320557, "global_step": 15169, "epoch": 90} {"train_loss": -6.159280776977539, "global_step": 15170, "epoch": 90} {"train_loss": -5.962344169616699, "global_step": 15171, "epoch": 90} {"train_loss": -6.2774810791015625, "global_step": 15172, "epoch": 90} {"train_loss": -5.955567359924316, "global_step": 15173, "epoch": 90} {"train_loss": -6.165327072143555, "global_step": 15174, "epoch": 90} {"train_loss": -6.541800498962402, "global_step": 15175, "epoch": 90} {"train_loss": -6.237541198730469, "global_step": 15176, "epoch": 90} {"train_loss": -6.1881303787231445, "global_step": 15177, "epoch": 90} {"train_loss": -6.292607307434082, "global_step": 15178, "epoch": 90} {"train_loss": -6.310563564300537, "global_step": 15179, "epoch": 90} {"train_loss": -6.048019886016846, "global_step": 15180, "epoch": 90} {"train_loss": -6.200125694274902, "global_step": 15181, "epoch": 90} {"train_loss": -6.161226272583008, "global_step": 15182, "epoch": 90} {"train_loss": -6.192099571228027, "global_step": 15183, "epoch": 90} {"train_loss": -6.223073959350586, "global_step": 15184, "epoch": 90} {"train_loss": -6.09525728225708, "global_step": 15185, "epoch": 90} {"train_loss": -6.35476016998291, "global_step": 15186, "epoch": 90} {"train_loss": -6.166830062866211, "global_step": 15187, "epoch": 90} {"train_loss": -6.469926834106445, "global_step": 15188, "epoch": 90} {"train_loss": -6.213123321533203, "global_step": 15189, "epoch": 90} {"train_loss": -6.650400638580322, "global_step": 15190, "epoch": 90} {"train_loss": -6.681488990783691, "global_step": 15191, "epoch": 90} {"train_loss": -6.455234527587891, "global_step": 15192, "epoch": 90} {"train_loss": -6.3989152908325195, "global_step": 15193, "epoch": 90} {"train_loss": -6.444638252258301, "global_step": 15194, "epoch": 90} {"train_loss": -6.480280876159668, "global_step": 15195, "epoch": 90} {"train_loss": -6.297117233276367, "global_step": 15196, "epoch": 90} {"train_loss": -6.488498687744141, "global_step": 15197, "epoch": 90} {"train_loss": -6.353753089904785, "global_step": 15198, "epoch": 90} {"train_loss": -6.547641754150391, "global_step": 15199, "epoch": 90} {"train_loss": -6.420896053314209, "global_step": 15200, "epoch": 90} {"train_loss": -6.565018653869629, "global_step": 15201, "epoch": 90} {"train_loss": -6.530559539794922, "global_step": 15202, "epoch": 90} {"train_loss": -6.449338912963867, "global_step": 15203, "epoch": 90} {"train_loss": -6.14650297164917, "global_step": 15204, "epoch": 90} {"train_loss": -6.604122161865234, "global_step": 15205, "epoch": 90} {"train_loss": -6.320064544677734, "global_step": 15206, "epoch": 90} {"train_loss": -6.380948066711426, "global_step": 15207, "epoch": 90} {"train_loss": -6.364587783813477, "global_step": 15208, "epoch": 90} {"train_loss": -6.257181644439697, "global_step": 15209, "epoch": 90} {"train_loss": -6.144498825073242, "global_step": 15210, "epoch": 90} {"train_loss": -6.455803871154785, "global_step": 15211, "epoch": 90} {"train_loss": -6.377354621887207, "global_step": 15212, "epoch": 90} {"train_loss": -6.292078018188477, "global_step": 15213, "epoch": 90} {"train_loss": -6.44164514541626, "global_step": 15214, "epoch": 90} {"train_loss": -6.264471054077148, "global_step": 15215, "epoch": 90} {"train_loss": -6.410421371459961, "global_step": 15216, "epoch": 90} {"train_loss": -6.432365417480469, "global_step": 15217, "epoch": 90} {"train_loss": -6.513321876525879, "global_step": 15218, "epoch": 90} {"train_loss": -6.364985466003418, "global_step": 15219, "epoch": 90} {"train_loss": -6.186911582946777, "global_step": 15220, "epoch": 90} {"train_loss": -6.444947719573975, "global_step": 15221, "epoch": 90} {"train_loss": -6.323186874389648, "global_step": 15222, "epoch": 90} {"train_loss": -6.474050521850586, "global_step": 15223, "epoch": 90} {"train_loss": -6.336149215698242, "global_step": 15224, "epoch": 90} {"train_loss": -6.5035905838012695, "global_step": 15225, "epoch": 90} {"train_loss": -6.512500762939453, "global_step": 15226, "epoch": 90} {"train_loss": -6.338301658630371, "global_step": 15227, "epoch": 90} {"train_loss": -6.436785697937012, "global_step": 15228, "epoch": 90} {"train_loss": -6.411464691162109, "global_step": 15229, "epoch": 90} {"train_loss": -6.361396789550781, "global_step": 15230, "epoch": 90} {"train_loss": -6.466124534606934, "global_step": 15231, "epoch": 90} {"train_loss": -6.199655055999756, "global_step": 15232, "epoch": 90} {"train_loss": -6.023020267486572, "global_step": 15233, "epoch": 90} {"train_loss": -6.334109306335449, "global_step": 15234, "epoch": 90} {"train_loss": -6.2687177658081055, "global_step": 15235, "epoch": 90} {"train_loss": -6.35920524597168, "global_step": 15236, "epoch": 90} {"train_loss": -6.322281360626221, "global_step": 15237, "epoch": 90} {"train_loss": -6.306774139404297, "global_step": 15238, "epoch": 90} {"train_loss": -6.249916076660156, "global_step": 15239, "epoch": 90} {"train_loss": -6.3759002685546875, "global_step": 15240, "epoch": 90} {"train_loss": -6.321988582611084, "global_step": 15241, "epoch": 90} {"train_loss": -6.456508636474609, "global_step": 15242, "epoch": 90} {"train_loss": -6.279570579528809, "global_step": 15243, "epoch": 90} {"train_loss": -6.053282737731934, "global_step": 15244, "epoch": 90} {"train_loss": -6.5366973876953125, "global_step": 15245, "epoch": 90} {"train_loss": -6.455990314483643, "global_step": 15246, "epoch": 90} {"train_loss": -6.416035175323486, "global_step": 15247, "epoch": 90} {"train_loss": -6.495484352111816, "global_step": 15248, "epoch": 90} {"train_loss": -6.44944953918457, "global_step": 15249, "epoch": 90} {"train_loss": -6.331368446350098, "global_step": 15250, "epoch": 90} {"train_loss": -6.48637580871582, "global_step": 15251, "epoch": 90} {"train_loss": -6.595851898193359, "global_step": 15252, "epoch": 90} {"train_loss": -6.202615737915039, "global_step": 15253, "epoch": 90} {"train_loss": -6.372333526611328, "global_step": 15254, "epoch": 90} {"train_loss": -6.431130409240723, "global_step": 15255, "epoch": 90} {"train_loss": -6.549005508422852, "global_step": 15256, "epoch": 90} {"train_loss": -6.28177547454834, "global_step": 15257, "epoch": 90} {"train_loss": -6.559682369232178, "global_step": 15258, "epoch": 90} {"train_loss": -6.492821216583252, "global_step": 15259, "epoch": 90} {"train_loss": -6.496889591217041, "global_step": 15260, "epoch": 90} {"train_loss": -6.564935684204102, "global_step": 15261, "epoch": 90} {"train_loss": -6.4843244552612305, "global_step": 15262, "epoch": 90} {"train_loss": -6.435659408569336, "global_step": 15263, "epoch": 90} {"train_loss": -6.572068214416504, "global_step": 15264, "epoch": 90} {"train_loss": -6.5477776527404785, "global_step": 15265, "epoch": 90} {"train_loss": -6.362309455871582, "global_step": 15266, "epoch": 90} {"train_loss": -6.517965316772461, "global_step": 15267, "epoch": 90} {"train_loss": -6.424003601074219, "global_step": 15268, "epoch": 90} {"train_loss": -6.486954689025879, "global_step": 15269, "epoch": 90} {"train_loss": -6.360231399536133, "global_step": 15270, "epoch": 90} {"train_loss": -6.411874771118164, "global_step": 15271, "epoch": 90} {"train_loss": -6.376875877380371, "global_step": 15272, "epoch": 90} {"train_loss": -6.254506587982178, "global_step": 15273, "epoch": 90} {"train_loss": -5.97172737121582, "global_step": 15274, "epoch": 90} {"train_loss": -6.0204057693481445, "global_step": 15275, "epoch": 90} {"train_loss": -6.375671863555908, "global_step": 15276, "epoch": 90} {"train_loss": -6.304720878601074, "global_step": 15277, "epoch": 90} {"train_loss": -6.2498087882995605, "global_step": 15278, "epoch": 90} {"train_loss": -6.264625549316406, "global_step": 15279, "epoch": 90} {"train_loss": -6.211853981018066, "global_step": 15280, "epoch": 90} {"train_loss": -6.295188903808594, "global_step": 15281, "epoch": 90} {"train_loss": -6.238323211669922, "global_step": 15282, "epoch": 90} {"train_loss": -6.340428352355957, "global_step": 15283, "epoch": 90} {"train_loss": -6.268768787384033, "global_step": 15284, "epoch": 90} {"train_loss": -5.994194030761719, "global_step": 15285, "epoch": 90} {"train_loss": -6.292333602905273, "global_step": 15286, "epoch": 90} {"train_loss": -6.331581402392614, "global_step": 15287, "epoch": 90, "val_loss": 243570.671875, "train_action_mse_error": 30.17244529724121} {"train_loss": -6.458629608154297, "global_step": 15288, "epoch": 91} {"train_loss": -6.360706329345703, "global_step": 15289, "epoch": 91} {"train_loss": -6.399523735046387, "global_step": 15290, "epoch": 91} {"train_loss": -6.382494926452637, "global_step": 15291, "epoch": 91} {"train_loss": -6.171610355377197, "global_step": 15292, "epoch": 91} {"train_loss": -5.857336044311523, "global_step": 15293, "epoch": 91} {"train_loss": -6.47383975982666, "global_step": 15294, "epoch": 91} {"train_loss": -6.481966018676758, "global_step": 15295, "epoch": 91} {"train_loss": -6.212353229522705, "global_step": 15296, "epoch": 91} {"train_loss": -6.158357620239258, "global_step": 15297, "epoch": 91} {"train_loss": -6.479917049407959, "global_step": 15298, "epoch": 91} {"train_loss": -6.335726737976074, "global_step": 15299, "epoch": 91} {"train_loss": -6.324283599853516, "global_step": 15300, "epoch": 91} {"train_loss": -6.449631214141846, "global_step": 15301, "epoch": 91} {"train_loss": -6.300539016723633, "global_step": 15302, "epoch": 91} {"train_loss": -6.419886112213135, "global_step": 15303, "epoch": 91} {"train_loss": -6.517842769622803, "global_step": 15304, "epoch": 91} {"train_loss": -6.5514020919799805, "global_step": 15305, "epoch": 91} {"train_loss": -6.44825553894043, "global_step": 15306, "epoch": 91} {"train_loss": -6.527048587799072, "global_step": 15307, "epoch": 91} {"train_loss": -6.587246894836426, "global_step": 15308, "epoch": 91} {"train_loss": -6.533323287963867, "global_step": 15309, "epoch": 91} {"train_loss": -6.517315864562988, "global_step": 15310, "epoch": 91} {"train_loss": -6.611075401306152, "global_step": 15311, "epoch": 91} {"train_loss": -6.643972396850586, "global_step": 15312, "epoch": 91} {"train_loss": -6.30256462097168, "global_step": 15313, "epoch": 91} {"train_loss": -6.242516040802002, "global_step": 15314, "epoch": 91} {"train_loss": -6.3951945304870605, "global_step": 15315, "epoch": 91} {"train_loss": -6.3560614585876465, "global_step": 15316, "epoch": 91} {"train_loss": -6.353595733642578, "global_step": 15317, "epoch": 91} {"train_loss": -6.325372695922852, "global_step": 15318, "epoch": 91} {"train_loss": -6.56956672668457, "global_step": 15319, "epoch": 91} {"train_loss": -6.558742046356201, "global_step": 15320, "epoch": 91} {"train_loss": -6.481704235076904, "global_step": 15321, "epoch": 91} {"train_loss": -6.366482734680176, "global_step": 15322, "epoch": 91} {"train_loss": -6.4204020500183105, "global_step": 15323, "epoch": 91} {"train_loss": -6.344919681549072, "global_step": 15324, "epoch": 91} {"train_loss": -6.395315647125244, "global_step": 15325, "epoch": 91} {"train_loss": -6.208168029785156, "global_step": 15326, "epoch": 91} {"train_loss": -6.430530548095703, "global_step": 15327, "epoch": 91} {"train_loss": -6.5286641120910645, "global_step": 15328, "epoch": 91} {"train_loss": -6.509421348571777, "global_step": 15329, "epoch": 91} {"train_loss": -6.301326751708984, "global_step": 15330, "epoch": 91} {"train_loss": -6.437012195587158, "global_step": 15331, "epoch": 91} {"train_loss": -6.51283073425293, "global_step": 15332, "epoch": 91} {"train_loss": -6.408871173858643, "global_step": 15333, "epoch": 91} {"train_loss": -6.221210479736328, "global_step": 15334, "epoch": 91} {"train_loss": -6.532193183898926, "global_step": 15335, "epoch": 91} {"train_loss": -6.535323143005371, "global_step": 15336, "epoch": 91} {"train_loss": -6.428311347961426, "global_step": 15337, "epoch": 91} {"train_loss": -6.160888671875, "global_step": 15338, "epoch": 91} {"train_loss": -6.634771347045898, "global_step": 15339, "epoch": 91} {"train_loss": -6.497533798217773, "global_step": 15340, "epoch": 91} {"train_loss": -6.4874067306518555, "global_step": 15341, "epoch": 91} {"train_loss": -6.243699073791504, "global_step": 15342, "epoch": 91} {"train_loss": -6.333020210266113, "global_step": 15343, "epoch": 91} {"train_loss": -6.551424026489258, "global_step": 15344, "epoch": 91} {"train_loss": -6.425079345703125, "global_step": 15345, "epoch": 91} {"train_loss": -6.331655025482178, "global_step": 15346, "epoch": 91} {"train_loss": -6.3119893074035645, "global_step": 15347, "epoch": 91} {"train_loss": -6.2436981201171875, "global_step": 15348, "epoch": 91} {"train_loss": -6.2536163330078125, "global_step": 15349, "epoch": 91} {"train_loss": -6.435430526733398, "global_step": 15350, "epoch": 91} {"train_loss": -6.336530685424805, "global_step": 15351, "epoch": 91} {"train_loss": -6.27574348449707, "global_step": 15352, "epoch": 91} {"train_loss": -6.363390922546387, "global_step": 15353, "epoch": 91} {"train_loss": -6.360935688018799, "global_step": 15354, "epoch": 91} {"train_loss": -6.117249488830566, "global_step": 15355, "epoch": 91} {"train_loss": -6.244998931884766, "global_step": 15356, "epoch": 91} {"train_loss": -6.288288116455078, "global_step": 15357, "epoch": 91} {"train_loss": -6.060774803161621, "global_step": 15358, "epoch": 91} {"train_loss": -6.15559196472168, "global_step": 15359, "epoch": 91} {"train_loss": -6.156217098236084, "global_step": 15360, "epoch": 91} {"train_loss": -6.298980712890625, "global_step": 15361, "epoch": 91} {"train_loss": -6.196004867553711, "global_step": 15362, "epoch": 91} {"train_loss": -6.209966659545898, "global_step": 15363, "epoch": 91} {"train_loss": -6.253261089324951, "global_step": 15364, "epoch": 91} {"train_loss": -6.30025577545166, "global_step": 15365, "epoch": 91} {"train_loss": -6.185593128204346, "global_step": 15366, "epoch": 91} {"train_loss": -6.159830093383789, "global_step": 15367, "epoch": 91} {"train_loss": -6.137745380401611, "global_step": 15368, "epoch": 91} {"train_loss": -6.134541988372803, "global_step": 15369, "epoch": 91} {"train_loss": -6.430323600769043, "global_step": 15370, "epoch": 91} {"train_loss": -6.152451992034912, "global_step": 15371, "epoch": 91} {"train_loss": -6.249950408935547, "global_step": 15372, "epoch": 91} {"train_loss": -6.199027061462402, "global_step": 15373, "epoch": 91} {"train_loss": -6.430319309234619, "global_step": 15374, "epoch": 91} {"train_loss": -6.5497941970825195, "global_step": 15375, "epoch": 91} {"train_loss": -6.468721866607666, "global_step": 15376, "epoch": 91} {"train_loss": -6.193239212036133, "global_step": 15377, "epoch": 91} {"train_loss": -6.479562759399414, "global_step": 15378, "epoch": 91} {"train_loss": -6.427568435668945, "global_step": 15379, "epoch": 91} {"train_loss": -6.237362384796143, "global_step": 15380, "epoch": 91} {"train_loss": -6.410165786743164, "global_step": 15381, "epoch": 91} {"train_loss": -6.427029132843018, "global_step": 15382, "epoch": 91} {"train_loss": -6.546234130859375, "global_step": 15383, "epoch": 91} {"train_loss": -6.415961265563965, "global_step": 15384, "epoch": 91} {"train_loss": -6.513355255126953, "global_step": 15385, "epoch": 91} {"train_loss": -6.481780052185059, "global_step": 15386, "epoch": 91} {"train_loss": -6.622631072998047, "global_step": 15387, "epoch": 91} {"train_loss": -6.56513786315918, "global_step": 15388, "epoch": 91} {"train_loss": -6.6413726806640625, "global_step": 15389, "epoch": 91} {"train_loss": -6.353724479675293, "global_step": 15390, "epoch": 91} {"train_loss": -6.448886871337891, "global_step": 15391, "epoch": 91} {"train_loss": -6.546357154846191, "global_step": 15392, "epoch": 91} {"train_loss": -6.465884208679199, "global_step": 15393, "epoch": 91} {"train_loss": -6.5490312576293945, "global_step": 15394, "epoch": 91} {"train_loss": -6.353286266326904, "global_step": 15395, "epoch": 91} {"train_loss": -6.502313137054443, "global_step": 15396, "epoch": 91} {"train_loss": -6.4358367919921875, "global_step": 15397, "epoch": 91} {"train_loss": -6.499327659606934, "global_step": 15398, "epoch": 91} {"train_loss": -6.492142200469971, "global_step": 15399, "epoch": 91} {"train_loss": -6.241757392883301, "global_step": 15400, "epoch": 91} {"train_loss": -6.38026762008667, "global_step": 15401, "epoch": 91} {"train_loss": -6.437793254852295, "global_step": 15402, "epoch": 91} {"train_loss": -6.451800346374512, "global_step": 15403, "epoch": 91} {"train_loss": -6.300572872161865, "global_step": 15404, "epoch": 91} {"train_loss": -6.510438919067383, "global_step": 15405, "epoch": 91} {"train_loss": -6.375003337860107, "global_step": 15406, "epoch": 91} {"train_loss": -6.227695465087891, "global_step": 15407, "epoch": 91} {"train_loss": -6.37799072265625, "global_step": 15408, "epoch": 91} {"train_loss": -6.454643249511719, "global_step": 15409, "epoch": 91} {"train_loss": -6.495584964752197, "global_step": 15410, "epoch": 91} {"train_loss": -6.509219169616699, "global_step": 15411, "epoch": 91} {"train_loss": -6.422162055969238, "global_step": 15412, "epoch": 91} {"train_loss": -6.107577323913574, "global_step": 15413, "epoch": 91} {"train_loss": -6.07587194442749, "global_step": 15414, "epoch": 91} {"train_loss": -6.401294708251953, "global_step": 15415, "epoch": 91} {"train_loss": -6.310878753662109, "global_step": 15416, "epoch": 91} {"train_loss": -6.2200927734375, "global_step": 15417, "epoch": 91} {"train_loss": -6.672231674194336, "global_step": 15418, "epoch": 91} {"train_loss": -6.378891944885254, "global_step": 15419, "epoch": 91} {"train_loss": -6.65308952331543, "global_step": 15420, "epoch": 91} {"train_loss": -6.464998245239258, "global_step": 15421, "epoch": 91} {"train_loss": -6.623396873474121, "global_step": 15422, "epoch": 91} {"train_loss": -6.499873161315918, "global_step": 15423, "epoch": 91} {"train_loss": -6.256626129150391, "global_step": 15424, "epoch": 91} {"train_loss": -6.301774978637695, "global_step": 15425, "epoch": 91} {"train_loss": -6.428722858428955, "global_step": 15426, "epoch": 91} {"train_loss": -6.416839122772217, "global_step": 15427, "epoch": 91} {"train_loss": -6.418791770935059, "global_step": 15428, "epoch": 91} {"train_loss": -6.536122798919678, "global_step": 15429, "epoch": 91} {"train_loss": -6.427577972412109, "global_step": 15430, "epoch": 91} {"train_loss": -6.5825910568237305, "global_step": 15431, "epoch": 91} {"train_loss": -6.536901473999023, "global_step": 15432, "epoch": 91} {"train_loss": -6.561680316925049, "global_step": 15433, "epoch": 91} {"train_loss": -6.355399131774902, "global_step": 15434, "epoch": 91} {"train_loss": -6.500757694244385, "global_step": 15435, "epoch": 91} {"train_loss": -6.330817222595215, "global_step": 15436, "epoch": 91} {"train_loss": -6.423562049865723, "global_step": 15437, "epoch": 91} {"train_loss": -6.399871349334717, "global_step": 15438, "epoch": 91} {"train_loss": -6.36981201171875, "global_step": 15439, "epoch": 91} {"train_loss": -6.365902900695801, "global_step": 15440, "epoch": 91} {"train_loss": -6.270586013793945, "global_step": 15441, "epoch": 91} {"train_loss": -6.3219313621521, "global_step": 15442, "epoch": 91} {"train_loss": -6.496231555938721, "global_step": 15443, "epoch": 91} {"train_loss": -6.5898542404174805, "global_step": 15444, "epoch": 91} {"train_loss": -6.57867956161499, "global_step": 15445, "epoch": 91} {"train_loss": -6.369831085205078, "global_step": 15446, "epoch": 91} {"train_loss": -6.166461944580078, "global_step": 15447, "epoch": 91} {"train_loss": -6.356196403503418, "global_step": 15448, "epoch": 91} {"train_loss": -6.338434219360352, "global_step": 15449, "epoch": 91} {"train_loss": -6.250516891479492, "global_step": 15450, "epoch": 91} {"train_loss": -6.516435623168945, "global_step": 15451, "epoch": 91} {"train_loss": -6.470628261566162, "global_step": 15452, "epoch": 91} {"train_loss": -6.332789421081543, "global_step": 15453, "epoch": 91} {"train_loss": -6.35378360748291, "global_step": 15454, "epoch": 91} {"train_loss": -6.3879734220958895, "global_step": 15455, "epoch": 91, "val_loss": 248462.203125} {"train_loss": -6.279513359069824, "global_step": 15456, "epoch": 92} {"train_loss": -6.30477237701416, "global_step": 15457, "epoch": 92} {"train_loss": -6.314027786254883, "global_step": 15458, "epoch": 92} {"train_loss": -6.339001655578613, "global_step": 15459, "epoch": 92} {"train_loss": -6.214939117431641, "global_step": 15460, "epoch": 92} {"train_loss": -6.372593402862549, "global_step": 15461, "epoch": 92} {"train_loss": -6.279865264892578, "global_step": 15462, "epoch": 92} {"train_loss": -6.220432281494141, "global_step": 15463, "epoch": 92} {"train_loss": -6.67562198638916, "global_step": 15464, "epoch": 92} {"train_loss": -6.371859550476074, "global_step": 15465, "epoch": 92} {"train_loss": -6.4455084800720215, "global_step": 15466, "epoch": 92} {"train_loss": -6.479197978973389, "global_step": 15467, "epoch": 92} {"train_loss": -6.362297058105469, "global_step": 15468, "epoch": 92} {"train_loss": -6.664681911468506, "global_step": 15469, "epoch": 92} {"train_loss": -6.532382011413574, "global_step": 15470, "epoch": 92} {"train_loss": -6.563016891479492, "global_step": 15471, "epoch": 92} {"train_loss": -6.518305778503418, "global_step": 15472, "epoch": 92} {"train_loss": -6.463864326477051, "global_step": 15473, "epoch": 92} {"train_loss": -6.514256954193115, "global_step": 15474, "epoch": 92} {"train_loss": -6.413619518280029, "global_step": 15475, "epoch": 92} {"train_loss": -6.437579154968262, "global_step": 15476, "epoch": 92} {"train_loss": -6.423783779144287, "global_step": 15477, "epoch": 92} {"train_loss": -6.463434219360352, "global_step": 15478, "epoch": 92} {"train_loss": -6.683192253112793, "global_step": 15479, "epoch": 92} {"train_loss": -6.620928764343262, "global_step": 15480, "epoch": 92} {"train_loss": -6.623625755310059, "global_step": 15481, "epoch": 92} {"train_loss": -6.201654434204102, "global_step": 15482, "epoch": 92} {"train_loss": -6.400146007537842, "global_step": 15483, "epoch": 92} {"train_loss": -6.569684028625488, "global_step": 15484, "epoch": 92} {"train_loss": -6.442899703979492, "global_step": 15485, "epoch": 92} {"train_loss": -6.754861354827881, "global_step": 15486, "epoch": 92} {"train_loss": -6.435478210449219, "global_step": 15487, "epoch": 92} {"train_loss": -6.471103668212891, "global_step": 15488, "epoch": 92} {"train_loss": -6.078880310058594, "global_step": 15489, "epoch": 92} {"train_loss": -6.541324615478516, "global_step": 15490, "epoch": 92} {"train_loss": -6.674659729003906, "global_step": 15491, "epoch": 92} {"train_loss": -6.509082794189453, "global_step": 15492, "epoch": 92} {"train_loss": -6.5286455154418945, "global_step": 15493, "epoch": 92} {"train_loss": -6.496457099914551, "global_step": 15494, "epoch": 92} {"train_loss": -6.475860118865967, "global_step": 15495, "epoch": 92} {"train_loss": -6.4091644287109375, "global_step": 15496, "epoch": 92} {"train_loss": -6.495906829833984, "global_step": 15497, "epoch": 92} {"train_loss": -6.653160572052002, "global_step": 15498, "epoch": 92} {"train_loss": -6.354135513305664, "global_step": 15499, "epoch": 92} {"train_loss": -6.496308326721191, "global_step": 15500, "epoch": 92} {"train_loss": -6.503893852233887, "global_step": 15501, "epoch": 92} {"train_loss": -6.577985763549805, "global_step": 15502, "epoch": 92} {"train_loss": -6.41999626159668, "global_step": 15503, "epoch": 92} {"train_loss": -6.309848785400391, "global_step": 15504, "epoch": 92} {"train_loss": -6.416388988494873, "global_step": 15505, "epoch": 92} {"train_loss": -6.3787689208984375, "global_step": 15506, "epoch": 92} {"train_loss": -6.143030166625977, "global_step": 15507, "epoch": 92} {"train_loss": -6.484185218811035, "global_step": 15508, "epoch": 92} {"train_loss": -6.107890605926514, "global_step": 15509, "epoch": 92} {"train_loss": -6.6684041023254395, "global_step": 15510, "epoch": 92} {"train_loss": -5.787447929382324, "global_step": 15511, "epoch": 92} {"train_loss": -6.43113374710083, "global_step": 15512, "epoch": 92} {"train_loss": -6.1281585693359375, "global_step": 15513, "epoch": 92} {"train_loss": -6.365061283111572, "global_step": 15514, "epoch": 92} {"train_loss": -6.265847682952881, "global_step": 15515, "epoch": 92} {"train_loss": -6.2166924476623535, "global_step": 15516, "epoch": 92} {"train_loss": -6.543881416320801, "global_step": 15517, "epoch": 92} {"train_loss": -6.348950386047363, "global_step": 15518, "epoch": 92} {"train_loss": -6.39024543762207, "global_step": 15519, "epoch": 92} {"train_loss": -6.292686462402344, "global_step": 15520, "epoch": 92} {"train_loss": -6.378487586975098, "global_step": 15521, "epoch": 92} {"train_loss": -5.969581604003906, "global_step": 15522, "epoch": 92} {"train_loss": -6.449760437011719, "global_step": 15523, "epoch": 92} {"train_loss": -6.347140312194824, "global_step": 15524, "epoch": 92} {"train_loss": -6.52562141418457, "global_step": 15525, "epoch": 92} {"train_loss": -6.456398963928223, "global_step": 15526, "epoch": 92} {"train_loss": -6.3217082023620605, "global_step": 15527, "epoch": 92} {"train_loss": -6.450883865356445, "global_step": 15528, "epoch": 92} {"train_loss": -6.2773332595825195, "global_step": 15529, "epoch": 92} {"train_loss": -6.1521124839782715, "global_step": 15530, "epoch": 92} {"train_loss": -6.188814163208008, "global_step": 15531, "epoch": 92} {"train_loss": -6.394614219665527, "global_step": 15532, "epoch": 92} {"train_loss": -6.526864528656006, "global_step": 15533, "epoch": 92} {"train_loss": -6.530491352081299, "global_step": 15534, "epoch": 92} {"train_loss": -6.4760260581970215, "global_step": 15535, "epoch": 92} {"train_loss": -6.184867858886719, "global_step": 15536, "epoch": 92} {"train_loss": -6.351605415344238, "global_step": 15537, "epoch": 92} {"train_loss": -6.456279754638672, "global_step": 15538, "epoch": 92} {"train_loss": -6.330376148223877, "global_step": 15539, "epoch": 92} {"train_loss": -6.600094795227051, "global_step": 15540, "epoch": 92} {"train_loss": -6.643589019775391, "global_step": 15541, "epoch": 92} {"train_loss": -6.321877956390381, "global_step": 15542, "epoch": 92} {"train_loss": -6.328319549560547, "global_step": 15543, "epoch": 92} {"train_loss": -6.33458137512207, "global_step": 15544, "epoch": 92} {"train_loss": -6.278659343719482, "global_step": 15545, "epoch": 92} {"train_loss": -6.326101779937744, "global_step": 15546, "epoch": 92} {"train_loss": -6.361076354980469, "global_step": 15547, "epoch": 92} {"train_loss": -6.3501200675964355, "global_step": 15548, "epoch": 92} {"train_loss": -6.6058454513549805, "global_step": 15549, "epoch": 92} {"train_loss": -6.607805252075195, "global_step": 15550, "epoch": 92} {"train_loss": -6.414112091064453, "global_step": 15551, "epoch": 92} {"train_loss": -6.446841239929199, "global_step": 15552, "epoch": 92} {"train_loss": -6.454161643981934, "global_step": 15553, "epoch": 92} {"train_loss": -6.472125053405762, "global_step": 15554, "epoch": 92} {"train_loss": -6.245805740356445, "global_step": 15555, "epoch": 92} {"train_loss": -6.371114730834961, "global_step": 15556, "epoch": 92} {"train_loss": -6.2752838134765625, "global_step": 15557, "epoch": 92} {"train_loss": -6.561859130859375, "global_step": 15558, "epoch": 92} {"train_loss": -6.500646114349365, "global_step": 15559, "epoch": 92} {"train_loss": -6.392151832580566, "global_step": 15560, "epoch": 92} {"train_loss": -6.5661773681640625, "global_step": 15561, "epoch": 92} {"train_loss": -6.233862400054932, "global_step": 15562, "epoch": 92} {"train_loss": -6.352712631225586, "global_step": 15563, "epoch": 92} {"train_loss": -6.29581880569458, "global_step": 15564, "epoch": 92} {"train_loss": -6.522003173828125, "global_step": 15565, "epoch": 92} {"train_loss": -6.429150581359863, "global_step": 15566, "epoch": 92} {"train_loss": -6.400339126586914, "global_step": 15567, "epoch": 92} {"train_loss": -6.283900260925293, "global_step": 15568, "epoch": 92} {"train_loss": -6.28156852722168, "global_step": 15569, "epoch": 92} {"train_loss": -6.386113166809082, "global_step": 15570, "epoch": 92} {"train_loss": -6.294836044311523, "global_step": 15571, "epoch": 92} {"train_loss": -6.513014793395996, "global_step": 15572, "epoch": 92} {"train_loss": -6.2743353843688965, "global_step": 15573, "epoch": 92} {"train_loss": -6.299653053283691, "global_step": 15574, "epoch": 92} {"train_loss": -6.024573802947998, "global_step": 15575, "epoch": 92} {"train_loss": -6.374455451965332, "global_step": 15576, "epoch": 92} {"train_loss": -6.183073997497559, "global_step": 15577, "epoch": 92} {"train_loss": -6.22651481628418, "global_step": 15578, "epoch": 92} {"train_loss": -6.479371547698975, "global_step": 15579, "epoch": 92} {"train_loss": -6.0150628089904785, "global_step": 15580, "epoch": 92} {"train_loss": -6.283578872680664, "global_step": 15581, "epoch": 92} {"train_loss": -5.826157569885254, "global_step": 15582, "epoch": 92} {"train_loss": -5.9886040687561035, "global_step": 15583, "epoch": 92} {"train_loss": -6.232785224914551, "global_step": 15584, "epoch": 92} {"train_loss": -6.073479652404785, "global_step": 15585, "epoch": 92} {"train_loss": -6.356632709503174, "global_step": 15586, "epoch": 92} {"train_loss": -6.195607662200928, "global_step": 15587, "epoch": 92} {"train_loss": -6.197617530822754, "global_step": 15588, "epoch": 92} {"train_loss": -6.446250915527344, "global_step": 15589, "epoch": 92} {"train_loss": -6.187638282775879, "global_step": 15590, "epoch": 92} {"train_loss": -6.554366111755371, "global_step": 15591, "epoch": 92} {"train_loss": -6.250912189483643, "global_step": 15592, "epoch": 92} {"train_loss": -6.179978370666504, "global_step": 15593, "epoch": 92} {"train_loss": -6.3849992752075195, "global_step": 15594, "epoch": 92} {"train_loss": -6.186145305633545, "global_step": 15595, "epoch": 92} {"train_loss": -6.665266036987305, "global_step": 15596, "epoch": 92} {"train_loss": -6.12954044342041, "global_step": 15597, "epoch": 92} {"train_loss": -6.413818359375, "global_step": 15598, "epoch": 92} {"train_loss": -6.495814800262451, "global_step": 15599, "epoch": 92} {"train_loss": -6.518881797790527, "global_step": 15600, "epoch": 92} {"train_loss": -6.108701705932617, "global_step": 15601, "epoch": 92} {"train_loss": -6.624323844909668, "global_step": 15602, "epoch": 92} {"train_loss": -6.582761764526367, "global_step": 15603, "epoch": 92} {"train_loss": -6.380959510803223, "global_step": 15604, "epoch": 92} {"train_loss": -6.492029190063477, "global_step": 15605, "epoch": 92} {"train_loss": -6.554599761962891, "global_step": 15606, "epoch": 92} {"train_loss": -6.31778621673584, "global_step": 15607, "epoch": 92} {"train_loss": -6.057879447937012, "global_step": 15608, "epoch": 92} {"train_loss": -6.0903520584106445, "global_step": 15609, "epoch": 92} {"train_loss": -6.548943519592285, "global_step": 15610, "epoch": 92} {"train_loss": -6.422384262084961, "global_step": 15611, "epoch": 92} {"train_loss": -6.5392351150512695, "global_step": 15612, "epoch": 92} {"train_loss": -6.321828842163086, "global_step": 15613, "epoch": 92} {"train_loss": -6.256659030914307, "global_step": 15614, "epoch": 92} {"train_loss": -6.62108039855957, "global_step": 15615, "epoch": 92} {"train_loss": -6.321030616760254, "global_step": 15616, "epoch": 92} {"train_loss": -6.566071510314941, "global_step": 15617, "epoch": 92} {"train_loss": -6.212388038635254, "global_step": 15618, "epoch": 92} {"train_loss": -6.201763153076172, "global_step": 15619, "epoch": 92} {"train_loss": -6.325035572052002, "global_step": 15620, "epoch": 92} {"train_loss": -6.590640068054199, "global_step": 15621, "epoch": 92} {"train_loss": -6.206300735473633, "global_step": 15622, "epoch": 92} {"train_loss": -6.381853691169193, "global_step": 15623, "epoch": 92, "val_loss": 243874.46875} {"train_loss": -6.467731952667236, "global_step": 15624, "epoch": 93} {"train_loss": -6.462123870849609, "global_step": 15625, "epoch": 93} {"train_loss": -6.385189056396484, "global_step": 15626, "epoch": 93} {"train_loss": -6.437525272369385, "global_step": 15627, "epoch": 93} {"train_loss": -6.3460469245910645, "global_step": 15628, "epoch": 93} {"train_loss": -6.513278961181641, "global_step": 15629, "epoch": 93} {"train_loss": -6.693127632141113, "global_step": 15630, "epoch": 93} {"train_loss": -6.241620063781738, "global_step": 15631, "epoch": 93} {"train_loss": -6.547685623168945, "global_step": 15632, "epoch": 93} {"train_loss": -6.652125358581543, "global_step": 15633, "epoch": 93} {"train_loss": -6.339422702789307, "global_step": 15634, "epoch": 93} {"train_loss": -6.514233112335205, "global_step": 15635, "epoch": 93} {"train_loss": -6.525765895843506, "global_step": 15636, "epoch": 93} {"train_loss": -6.380716323852539, "global_step": 15637, "epoch": 93} {"train_loss": -6.502317905426025, "global_step": 15638, "epoch": 93} {"train_loss": -6.4138922691345215, "global_step": 15639, "epoch": 93} {"train_loss": -6.387842178344727, "global_step": 15640, "epoch": 93} {"train_loss": -6.30838680267334, "global_step": 15641, "epoch": 93} {"train_loss": -6.411532402038574, "global_step": 15642, "epoch": 93} {"train_loss": -6.3380303382873535, "global_step": 15643, "epoch": 93} {"train_loss": -6.496434211730957, "global_step": 15644, "epoch": 93} {"train_loss": -6.534359455108643, "global_step": 15645, "epoch": 93} {"train_loss": -6.567852020263672, "global_step": 15646, "epoch": 93} {"train_loss": -6.691341400146484, "global_step": 15647, "epoch": 93} {"train_loss": -6.351469993591309, "global_step": 15648, "epoch": 93} {"train_loss": -6.47027587890625, "global_step": 15649, "epoch": 93} {"train_loss": -6.659095287322998, "global_step": 15650, "epoch": 93} {"train_loss": -6.621065139770508, "global_step": 15651, "epoch": 93} {"train_loss": -6.493260383605957, "global_step": 15652, "epoch": 93} {"train_loss": -6.306979179382324, "global_step": 15653, "epoch": 93} {"train_loss": -6.791007995605469, "global_step": 15654, "epoch": 93} {"train_loss": -6.449741363525391, "global_step": 15655, "epoch": 93} {"train_loss": -6.580756187438965, "global_step": 15656, "epoch": 93} {"train_loss": -6.341777801513672, "global_step": 15657, "epoch": 93} {"train_loss": -6.6495161056518555, "global_step": 15658, "epoch": 93} {"train_loss": -6.532985687255859, "global_step": 15659, "epoch": 93} {"train_loss": -6.267948150634766, "global_step": 15660, "epoch": 93} {"train_loss": -6.3850297927856445, "global_step": 15661, "epoch": 93} {"train_loss": -6.303654670715332, "global_step": 15662, "epoch": 93} {"train_loss": -6.556998252868652, "global_step": 15663, "epoch": 93} {"train_loss": -6.21522331237793, "global_step": 15664, "epoch": 93} {"train_loss": -6.286987781524658, "global_step": 15665, "epoch": 93} {"train_loss": -6.314718723297119, "global_step": 15666, "epoch": 93} {"train_loss": -6.511202812194824, "global_step": 15667, "epoch": 93} {"train_loss": -6.296754837036133, "global_step": 15668, "epoch": 93} {"train_loss": -6.405721664428711, "global_step": 15669, "epoch": 93} {"train_loss": -6.525035858154297, "global_step": 15670, "epoch": 93} {"train_loss": -6.577179908752441, "global_step": 15671, "epoch": 93} {"train_loss": -6.607026100158691, "global_step": 15672, "epoch": 93} {"train_loss": -6.24188756942749, "global_step": 15673, "epoch": 93} {"train_loss": -6.408108711242676, "global_step": 15674, "epoch": 93} {"train_loss": -6.304708957672119, "global_step": 15675, "epoch": 93} {"train_loss": -6.650717735290527, "global_step": 15676, "epoch": 93} {"train_loss": -6.195356845855713, "global_step": 15677, "epoch": 93} {"train_loss": -6.5362548828125, "global_step": 15678, "epoch": 93} {"train_loss": -6.364614009857178, "global_step": 15679, "epoch": 93} {"train_loss": -6.298120975494385, "global_step": 15680, "epoch": 93} {"train_loss": -6.484297752380371, "global_step": 15681, "epoch": 93} {"train_loss": -6.457607746124268, "global_step": 15682, "epoch": 93} {"train_loss": -6.557117938995361, "global_step": 15683, "epoch": 93} {"train_loss": -6.5691351890563965, "global_step": 15684, "epoch": 93} {"train_loss": -6.469971656799316, "global_step": 15685, "epoch": 93} {"train_loss": -6.409015655517578, "global_step": 15686, "epoch": 93} {"train_loss": -6.527083396911621, "global_step": 15687, "epoch": 93} {"train_loss": -6.113473892211914, "global_step": 15688, "epoch": 93} {"train_loss": -6.300759315490723, "global_step": 15689, "epoch": 93} {"train_loss": -6.342043876647949, "global_step": 15690, "epoch": 93} {"train_loss": -6.50826358795166, "global_step": 15691, "epoch": 93} {"train_loss": -6.514987468719482, "global_step": 15692, "epoch": 93} {"train_loss": -6.34681510925293, "global_step": 15693, "epoch": 93} {"train_loss": -6.695382118225098, "global_step": 15694, "epoch": 93} {"train_loss": -6.325460910797119, "global_step": 15695, "epoch": 93} {"train_loss": -6.278887748718262, "global_step": 15696, "epoch": 93} {"train_loss": -6.416836738586426, "global_step": 15697, "epoch": 93} {"train_loss": -6.591567039489746, "global_step": 15698, "epoch": 93} {"train_loss": -6.484479904174805, "global_step": 15699, "epoch": 93} {"train_loss": -6.465044021606445, "global_step": 15700, "epoch": 93} {"train_loss": -6.560152053833008, "global_step": 15701, "epoch": 93} {"train_loss": -6.433170318603516, "global_step": 15702, "epoch": 93} {"train_loss": -6.54780387878418, "global_step": 15703, "epoch": 93} {"train_loss": -6.596096992492676, "global_step": 15704, "epoch": 93} {"train_loss": -6.7290449142456055, "global_step": 15705, "epoch": 93} {"train_loss": -6.432053565979004, "global_step": 15706, "epoch": 93} {"train_loss": -6.511539459228516, "global_step": 15707, "epoch": 93} {"train_loss": -6.5917463302612305, "global_step": 15708, "epoch": 93} {"train_loss": -6.546004295349121, "global_step": 15709, "epoch": 93} {"train_loss": -6.542724132537842, "global_step": 15710, "epoch": 93} {"train_loss": -6.4274420738220215, "global_step": 15711, "epoch": 93} {"train_loss": -6.474149703979492, "global_step": 15712, "epoch": 93} {"train_loss": -6.478639602661133, "global_step": 15713, "epoch": 93} {"train_loss": -6.477112770080566, "global_step": 15714, "epoch": 93} {"train_loss": -6.521559715270996, "global_step": 15715, "epoch": 93} {"train_loss": -6.587900161743164, "global_step": 15716, "epoch": 93} {"train_loss": -6.454113006591797, "global_step": 15717, "epoch": 93} {"train_loss": -6.396112442016602, "global_step": 15718, "epoch": 93} {"train_loss": -6.509823799133301, "global_step": 15719, "epoch": 93} {"train_loss": -6.490863800048828, "global_step": 15720, "epoch": 93} {"train_loss": -6.359524726867676, "global_step": 15721, "epoch": 93} {"train_loss": -6.5814666748046875, "global_step": 15722, "epoch": 93} {"train_loss": -6.465281963348389, "global_step": 15723, "epoch": 93} {"train_loss": -6.438126564025879, "global_step": 15724, "epoch": 93} {"train_loss": -6.431131839752197, "global_step": 15725, "epoch": 93} {"train_loss": -6.541609287261963, "global_step": 15726, "epoch": 93} {"train_loss": -6.622949600219727, "global_step": 15727, "epoch": 93} {"train_loss": -6.3981757164001465, "global_step": 15728, "epoch": 93} {"train_loss": -6.418825149536133, "global_step": 15729, "epoch": 93} {"train_loss": -6.509786128997803, "global_step": 15730, "epoch": 93} {"train_loss": -6.309239864349365, "global_step": 15731, "epoch": 93} {"train_loss": -6.404783725738525, "global_step": 15732, "epoch": 93} {"train_loss": -6.349451541900635, "global_step": 15733, "epoch": 93} {"train_loss": -6.452009201049805, "global_step": 15734, "epoch": 93} {"train_loss": -6.2254180908203125, "global_step": 15735, "epoch": 93} {"train_loss": -6.591308116912842, "global_step": 15736, "epoch": 93} {"train_loss": -6.40071964263916, "global_step": 15737, "epoch": 93} {"train_loss": -6.458926200866699, "global_step": 15738, "epoch": 93} {"train_loss": -6.5085673332214355, "global_step": 15739, "epoch": 93} {"train_loss": -6.46138334274292, "global_step": 15740, "epoch": 93} {"train_loss": -6.721262454986572, "global_step": 15741, "epoch": 93} {"train_loss": -6.667990684509277, "global_step": 15742, "epoch": 93} {"train_loss": -6.391826629638672, "global_step": 15743, "epoch": 93} {"train_loss": -6.188685417175293, "global_step": 15744, "epoch": 93} {"train_loss": -6.4705328941345215, "global_step": 15745, "epoch": 93} {"train_loss": -6.24847936630249, "global_step": 15746, "epoch": 93} {"train_loss": -6.4394121170043945, "global_step": 15747, "epoch": 93} {"train_loss": -6.426169395446777, "global_step": 15748, "epoch": 93} {"train_loss": -6.316413879394531, "global_step": 15749, "epoch": 93} {"train_loss": -6.348462104797363, "global_step": 15750, "epoch": 93} {"train_loss": -6.2784104347229, "global_step": 15751, "epoch": 93} {"train_loss": -6.503435134887695, "global_step": 15752, "epoch": 93} {"train_loss": -6.344292640686035, "global_step": 15753, "epoch": 93} {"train_loss": -6.374030113220215, "global_step": 15754, "epoch": 93} {"train_loss": -6.490265369415283, "global_step": 15755, "epoch": 93} {"train_loss": -6.134410858154297, "global_step": 15756, "epoch": 93} {"train_loss": -6.426092147827148, "global_step": 15757, "epoch": 93} {"train_loss": -6.227001190185547, "global_step": 15758, "epoch": 93} {"train_loss": -6.610089302062988, "global_step": 15759, "epoch": 93} {"train_loss": -6.529477119445801, "global_step": 15760, "epoch": 93} {"train_loss": -6.467540264129639, "global_step": 15761, "epoch": 93} {"train_loss": -6.618104934692383, "global_step": 15762, "epoch": 93} {"train_loss": -6.410109043121338, "global_step": 15763, "epoch": 93} {"train_loss": -6.452225208282471, "global_step": 15764, "epoch": 93} {"train_loss": -6.524965286254883, "global_step": 15765, "epoch": 93} {"train_loss": -6.4826765060424805, "global_step": 15766, "epoch": 93} {"train_loss": -6.527769088745117, "global_step": 15767, "epoch": 93} {"train_loss": -6.439538478851318, "global_step": 15768, "epoch": 93} {"train_loss": -6.411017417907715, "global_step": 15769, "epoch": 93} {"train_loss": -6.255258560180664, "global_step": 15770, "epoch": 93} {"train_loss": -6.20014762878418, "global_step": 15771, "epoch": 93} {"train_loss": -6.285573959350586, "global_step": 15772, "epoch": 93} {"train_loss": -6.2576704025268555, "global_step": 15773, "epoch": 93} {"train_loss": -6.500452995300293, "global_step": 15774, "epoch": 93} {"train_loss": -6.18730354309082, "global_step": 15775, "epoch": 93} {"train_loss": -6.278183937072754, "global_step": 15776, "epoch": 93} {"train_loss": -6.532285690307617, "global_step": 15777, "epoch": 93} {"train_loss": -6.47313117980957, "global_step": 15778, "epoch": 93} {"train_loss": -6.528233528137207, "global_step": 15779, "epoch": 93} {"train_loss": -6.3845534324646, "global_step": 15780, "epoch": 93} {"train_loss": -6.589465618133545, "global_step": 15781, "epoch": 93} {"train_loss": -6.284541606903076, "global_step": 15782, "epoch": 93} {"train_loss": -6.589297294616699, "global_step": 15783, "epoch": 93} {"train_loss": -6.191925525665283, "global_step": 15784, "epoch": 93} {"train_loss": -6.457547664642334, "global_step": 15785, "epoch": 93} {"train_loss": -6.445195198059082, "global_step": 15786, "epoch": 93} {"train_loss": -6.644286155700684, "global_step": 15787, "epoch": 93} {"train_loss": -6.6099958419799805, "global_step": 15788, "epoch": 93} {"train_loss": -6.410812854766846, "global_step": 15789, "epoch": 93} {"train_loss": -6.763044357299805, "global_step": 15790, "epoch": 93} {"train_loss": -6.44923031046277, "global_step": 15791, "epoch": 93, "val_loss": 246170.953125} {"train_loss": -6.349001884460449, "global_step": 15792, "epoch": 94} {"train_loss": -6.510241985321045, "global_step": 15793, "epoch": 94} {"train_loss": -6.230751037597656, "global_step": 15794, "epoch": 94} {"train_loss": -6.016995429992676, "global_step": 15795, "epoch": 94} {"train_loss": -6.084368705749512, "global_step": 15796, "epoch": 94} {"train_loss": -6.424139022827148, "global_step": 15797, "epoch": 94} {"train_loss": -6.246426105499268, "global_step": 15798, "epoch": 94} {"train_loss": -6.520786762237549, "global_step": 15799, "epoch": 94} {"train_loss": -6.139094352722168, "global_step": 15800, "epoch": 94} {"train_loss": -6.425965309143066, "global_step": 15801, "epoch": 94} {"train_loss": -6.384130477905273, "global_step": 15802, "epoch": 94} {"train_loss": -6.2108869552612305, "global_step": 15803, "epoch": 94} {"train_loss": -6.374931335449219, "global_step": 15804, "epoch": 94} {"train_loss": -6.658384323120117, "global_step": 15805, "epoch": 94} {"train_loss": -6.156498908996582, "global_step": 15806, "epoch": 94} {"train_loss": -6.36570930480957, "global_step": 15807, "epoch": 94} {"train_loss": -6.415455341339111, "global_step": 15808, "epoch": 94} {"train_loss": -6.319263458251953, "global_step": 15809, "epoch": 94} {"train_loss": -6.498504638671875, "global_step": 15810, "epoch": 94} {"train_loss": -6.568931579589844, "global_step": 15811, "epoch": 94} {"train_loss": -6.535968780517578, "global_step": 15812, "epoch": 94} {"train_loss": -6.626895904541016, "global_step": 15813, "epoch": 94} {"train_loss": -6.563860893249512, "global_step": 15814, "epoch": 94} {"train_loss": -6.590794563293457, "global_step": 15815, "epoch": 94} {"train_loss": -6.598728179931641, "global_step": 15816, "epoch": 94} {"train_loss": -6.526257514953613, "global_step": 15817, "epoch": 94} {"train_loss": -6.574103832244873, "global_step": 15818, "epoch": 94} {"train_loss": -6.494231224060059, "global_step": 15819, "epoch": 94} {"train_loss": -6.2442307472229, "global_step": 15820, "epoch": 94} {"train_loss": -6.612967491149902, "global_step": 15821, "epoch": 94} {"train_loss": -6.399078845977783, "global_step": 15822, "epoch": 94} {"train_loss": -6.583749771118164, "global_step": 15823, "epoch": 94} {"train_loss": -6.207882404327393, "global_step": 15824, "epoch": 94} {"train_loss": -6.492696285247803, "global_step": 15825, "epoch": 94} {"train_loss": -6.469313621520996, "global_step": 15826, "epoch": 94} {"train_loss": -6.64954948425293, "global_step": 15827, "epoch": 94} {"train_loss": -6.176505088806152, "global_step": 15828, "epoch": 94} {"train_loss": -6.567683696746826, "global_step": 15829, "epoch": 94} {"train_loss": -6.625580787658691, "global_step": 15830, "epoch": 94} {"train_loss": -6.6150007247924805, "global_step": 15831, "epoch": 94} {"train_loss": -6.287356376647949, "global_step": 15832, "epoch": 94} {"train_loss": -6.652128219604492, "global_step": 15833, "epoch": 94} {"train_loss": -6.127507209777832, "global_step": 15834, "epoch": 94} {"train_loss": -6.639025688171387, "global_step": 15835, "epoch": 94} {"train_loss": -6.430849075317383, "global_step": 15836, "epoch": 94} {"train_loss": -6.354789733886719, "global_step": 15837, "epoch": 94} {"train_loss": -6.257281303405762, "global_step": 15838, "epoch": 94} {"train_loss": -6.523241996765137, "global_step": 15839, "epoch": 94} {"train_loss": -6.28536319732666, "global_step": 15840, "epoch": 94} {"train_loss": -6.4781084060668945, "global_step": 15841, "epoch": 94} {"train_loss": -6.445465564727783, "global_step": 15842, "epoch": 94} {"train_loss": -6.6610636711120605, "global_step": 15843, "epoch": 94} {"train_loss": -6.371220588684082, "global_step": 15844, "epoch": 94} {"train_loss": -6.379980564117432, "global_step": 15845, "epoch": 94} {"train_loss": -6.618175506591797, "global_step": 15846, "epoch": 94} {"train_loss": -6.383370399475098, "global_step": 15847, "epoch": 94} {"train_loss": -6.476440906524658, "global_step": 15848, "epoch": 94} {"train_loss": -6.635302543640137, "global_step": 15849, "epoch": 94} {"train_loss": -6.143057823181152, "global_step": 15850, "epoch": 94} {"train_loss": -6.452238082885742, "global_step": 15851, "epoch": 94} {"train_loss": -6.417517185211182, "global_step": 15852, "epoch": 94} {"train_loss": -6.62425422668457, "global_step": 15853, "epoch": 94} {"train_loss": -6.401427268981934, "global_step": 15854, "epoch": 94} {"train_loss": -6.21958589553833, "global_step": 15855, "epoch": 94} {"train_loss": -6.250715732574463, "global_step": 15856, "epoch": 94} {"train_loss": -6.421306610107422, "global_step": 15857, "epoch": 94} {"train_loss": -6.430484771728516, "global_step": 15858, "epoch": 94} {"train_loss": -6.413185119628906, "global_step": 15859, "epoch": 94} {"train_loss": -6.484623432159424, "global_step": 15860, "epoch": 94} {"train_loss": -6.316473007202148, "global_step": 15861, "epoch": 94} {"train_loss": -6.352826118469238, "global_step": 15862, "epoch": 94} {"train_loss": -6.49349308013916, "global_step": 15863, "epoch": 94} {"train_loss": -6.39412784576416, "global_step": 15864, "epoch": 94} {"train_loss": -6.6006855964660645, "global_step": 15865, "epoch": 94} {"train_loss": -6.274988174438477, "global_step": 15866, "epoch": 94} {"train_loss": -6.459707260131836, "global_step": 15867, "epoch": 94} {"train_loss": -6.491627216339111, "global_step": 15868, "epoch": 94} {"train_loss": -6.3363871574401855, "global_step": 15869, "epoch": 94} {"train_loss": -6.601030349731445, "global_step": 15870, "epoch": 94} {"train_loss": -6.1616411209106445, "global_step": 15871, "epoch": 94} {"train_loss": -6.513240814208984, "global_step": 15872, "epoch": 94} {"train_loss": -6.17132043838501, "global_step": 15873, "epoch": 94} {"train_loss": -6.49420166015625, "global_step": 15874, "epoch": 94} {"train_loss": -6.418237686157227, "global_step": 15875, "epoch": 94} {"train_loss": -6.3935441970825195, "global_step": 15876, "epoch": 94} {"train_loss": -6.587259292602539, "global_step": 15877, "epoch": 94} {"train_loss": -6.603518486022949, "global_step": 15878, "epoch": 94} {"train_loss": -6.71151065826416, "global_step": 15879, "epoch": 94} {"train_loss": -6.651062965393066, "global_step": 15880, "epoch": 94} {"train_loss": -6.7021870613098145, "global_step": 15881, "epoch": 94} {"train_loss": -6.441834449768066, "global_step": 15882, "epoch": 94} {"train_loss": -6.484166145324707, "global_step": 15883, "epoch": 94} {"train_loss": -6.602272033691406, "global_step": 15884, "epoch": 94} {"train_loss": -6.2851152420043945, "global_step": 15885, "epoch": 94} {"train_loss": -6.534774303436279, "global_step": 15886, "epoch": 94} {"train_loss": -6.642158508300781, "global_step": 15887, "epoch": 94} {"train_loss": -6.382357597351074, "global_step": 15888, "epoch": 94} {"train_loss": -6.67623233795166, "global_step": 15889, "epoch": 94} {"train_loss": -6.275214672088623, "global_step": 15890, "epoch": 94} {"train_loss": -6.485301971435547, "global_step": 15891, "epoch": 94} {"train_loss": -6.683520317077637, "global_step": 15892, "epoch": 94} {"train_loss": -6.672425746917725, "global_step": 15893, "epoch": 94} {"train_loss": -6.567455291748047, "global_step": 15894, "epoch": 94} {"train_loss": -6.550141334533691, "global_step": 15895, "epoch": 94} {"train_loss": -6.740619659423828, "global_step": 15896, "epoch": 94} {"train_loss": -6.416012763977051, "global_step": 15897, "epoch": 94} {"train_loss": -6.60706901550293, "global_step": 15898, "epoch": 94} {"train_loss": -6.327228546142578, "global_step": 15899, "epoch": 94} {"train_loss": -6.443581581115723, "global_step": 15900, "epoch": 94} {"train_loss": -6.513612747192383, "global_step": 15901, "epoch": 94} {"train_loss": -6.387075901031494, "global_step": 15902, "epoch": 94} {"train_loss": -6.480976581573486, "global_step": 15903, "epoch": 94} {"train_loss": -6.464910507202148, "global_step": 15904, "epoch": 94} {"train_loss": -6.6021575927734375, "global_step": 15905, "epoch": 94} {"train_loss": -6.379995346069336, "global_step": 15906, "epoch": 94} {"train_loss": -6.144282817840576, "global_step": 15907, "epoch": 94} {"train_loss": -6.449952125549316, "global_step": 15908, "epoch": 94} {"train_loss": -6.580494403839111, "global_step": 15909, "epoch": 94} {"train_loss": -6.695059776306152, "global_step": 15910, "epoch": 94} {"train_loss": -6.707701683044434, "global_step": 15911, "epoch": 94} {"train_loss": -6.581703186035156, "global_step": 15912, "epoch": 94} {"train_loss": -6.581291198730469, "global_step": 15913, "epoch": 94} {"train_loss": -6.489779949188232, "global_step": 15914, "epoch": 94} {"train_loss": -6.533514976501465, "global_step": 15915, "epoch": 94} {"train_loss": -6.571903228759766, "global_step": 15916, "epoch": 94} {"train_loss": -6.517726898193359, "global_step": 15917, "epoch": 94} {"train_loss": -6.243379592895508, "global_step": 15918, "epoch": 94} {"train_loss": -6.533058166503906, "global_step": 15919, "epoch": 94} {"train_loss": -6.497817516326904, "global_step": 15920, "epoch": 94} {"train_loss": -6.225775718688965, "global_step": 15921, "epoch": 94} {"train_loss": -6.297067642211914, "global_step": 15922, "epoch": 94} {"train_loss": -6.638956069946289, "global_step": 15923, "epoch": 94} {"train_loss": -6.358313083648682, "global_step": 15924, "epoch": 94} {"train_loss": -6.268716812133789, "global_step": 15925, "epoch": 94} {"train_loss": -6.394381046295166, "global_step": 15926, "epoch": 94} {"train_loss": -6.66880989074707, "global_step": 15927, "epoch": 94} {"train_loss": -6.647003650665283, "global_step": 15928, "epoch": 94} {"train_loss": -6.515103816986084, "global_step": 15929, "epoch": 94} {"train_loss": -6.219808578491211, "global_step": 15930, "epoch": 94} {"train_loss": -6.413931369781494, "global_step": 15931, "epoch": 94} {"train_loss": -6.635732650756836, "global_step": 15932, "epoch": 94} {"train_loss": -6.556291580200195, "global_step": 15933, "epoch": 94} {"train_loss": -6.447077751159668, "global_step": 15934, "epoch": 94} {"train_loss": -6.543806552886963, "global_step": 15935, "epoch": 94} {"train_loss": -6.491404056549072, "global_step": 15936, "epoch": 94} {"train_loss": -6.523169040679932, "global_step": 15937, "epoch": 94} {"train_loss": -6.335625171661377, "global_step": 15938, "epoch": 94} {"train_loss": -6.5785322189331055, "global_step": 15939, "epoch": 94} {"train_loss": -6.454476356506348, "global_step": 15940, "epoch": 94} {"train_loss": -6.447666645050049, "global_step": 15941, "epoch": 94} {"train_loss": -6.342407703399658, "global_step": 15942, "epoch": 94} {"train_loss": -6.427341461181641, "global_step": 15943, "epoch": 94} {"train_loss": -6.5415568351745605, "global_step": 15944, "epoch": 94} {"train_loss": -6.187943458557129, "global_step": 15945, "epoch": 94} {"train_loss": -6.516068935394287, "global_step": 15946, "epoch": 94} {"train_loss": -6.63946533203125, "global_step": 15947, "epoch": 94} {"train_loss": -6.4459638595581055, "global_step": 15948, "epoch": 94} {"train_loss": -6.3013505935668945, "global_step": 15949, "epoch": 94} {"train_loss": -6.379404067993164, "global_step": 15950, "epoch": 94} {"train_loss": -6.453347682952881, "global_step": 15951, "epoch": 94} {"train_loss": -6.474174499511719, "global_step": 15952, "epoch": 94} {"train_loss": -6.574810981750488, "global_step": 15953, "epoch": 94} {"train_loss": -6.486526012420654, "global_step": 15954, "epoch": 94} {"train_loss": -6.487768173217773, "global_step": 15955, "epoch": 94} {"train_loss": -6.300294399261475, "global_step": 15956, "epoch": 94} {"train_loss": -6.430365562438965, "global_step": 15957, "epoch": 94} {"train_loss": -6.398370265960693, "global_step": 15958, "epoch": 94} {"train_loss": -6.453957001368205, "global_step": 15959, "epoch": 94, "val_loss": 244389.25} {"train_loss": -6.555444717407227, "global_step": 15960, "epoch": 95} {"train_loss": -6.3535051345825195, "global_step": 15961, "epoch": 95} {"train_loss": -6.505399703979492, "global_step": 15962, "epoch": 95} {"train_loss": -6.458076477050781, "global_step": 15963, "epoch": 95} {"train_loss": -6.646512031555176, "global_step": 15964, "epoch": 95} {"train_loss": -6.557210922241211, "global_step": 15965, "epoch": 95} {"train_loss": -6.355114936828613, "global_step": 15966, "epoch": 95} {"train_loss": -6.408672332763672, "global_step": 15967, "epoch": 95} {"train_loss": -6.479040145874023, "global_step": 15968, "epoch": 95} {"train_loss": -6.350252151489258, "global_step": 15969, "epoch": 95} {"train_loss": -6.733542442321777, "global_step": 15970, "epoch": 95} {"train_loss": -6.45847225189209, "global_step": 15971, "epoch": 95} {"train_loss": -6.354773998260498, "global_step": 15972, "epoch": 95} {"train_loss": -6.51037073135376, "global_step": 15973, "epoch": 95} {"train_loss": -6.4497833251953125, "global_step": 15974, "epoch": 95} {"train_loss": -6.487042427062988, "global_step": 15975, "epoch": 95} {"train_loss": -6.742791175842285, "global_step": 15976, "epoch": 95} {"train_loss": -6.5614471435546875, "global_step": 15977, "epoch": 95} {"train_loss": -6.550602912902832, "global_step": 15978, "epoch": 95} {"train_loss": -6.341501712799072, "global_step": 15979, "epoch": 95} {"train_loss": -6.594305992126465, "global_step": 15980, "epoch": 95} {"train_loss": -6.269754886627197, "global_step": 15981, "epoch": 95} {"train_loss": -6.550343990325928, "global_step": 15982, "epoch": 95} {"train_loss": -6.189990043640137, "global_step": 15983, "epoch": 95} {"train_loss": -6.490378379821777, "global_step": 15984, "epoch": 95} {"train_loss": -6.345981597900391, "global_step": 15985, "epoch": 95} {"train_loss": -6.288758277893066, "global_step": 15986, "epoch": 95} {"train_loss": -6.013200759887695, "global_step": 15987, "epoch": 95} {"train_loss": -6.448709487915039, "global_step": 15988, "epoch": 95} {"train_loss": -6.392016410827637, "global_step": 15989, "epoch": 95} {"train_loss": -6.20998477935791, "global_step": 15990, "epoch": 95} {"train_loss": -6.401954650878906, "global_step": 15991, "epoch": 95} {"train_loss": -6.220322132110596, "global_step": 15992, "epoch": 95} {"train_loss": -6.023013114929199, "global_step": 15993, "epoch": 95} {"train_loss": -6.1685791015625, "global_step": 15994, "epoch": 95} {"train_loss": -6.398494720458984, "global_step": 15995, "epoch": 95} {"train_loss": -6.103303909301758, "global_step": 15996, "epoch": 95} {"train_loss": -6.413269996643066, "global_step": 15997, "epoch": 95} {"train_loss": -6.266617774963379, "global_step": 15998, "epoch": 95} {"train_loss": -6.370877265930176, "global_step": 15999, "epoch": 95} {"train_loss": -6.298017978668213, "global_step": 16000, "epoch": 95} {"train_loss": -6.185169219970703, "global_step": 16001, "epoch": 95} {"train_loss": -6.448596477508545, "global_step": 16002, "epoch": 95} {"train_loss": -6.509832382202148, "global_step": 16003, "epoch": 95} {"train_loss": -6.432584285736084, "global_step": 16004, "epoch": 95} {"train_loss": -6.446512222290039, "global_step": 16005, "epoch": 95} {"train_loss": -6.5131072998046875, "global_step": 16006, "epoch": 95} {"train_loss": -6.359808921813965, "global_step": 16007, "epoch": 95} {"train_loss": -6.475551605224609, "global_step": 16008, "epoch": 95} {"train_loss": -6.282584190368652, "global_step": 16009, "epoch": 95} {"train_loss": -6.4212799072265625, "global_step": 16010, "epoch": 95} {"train_loss": -6.456533432006836, "global_step": 16011, "epoch": 95} {"train_loss": -6.319912433624268, "global_step": 16012, "epoch": 95} {"train_loss": -6.4334540367126465, "global_step": 16013, "epoch": 95} {"train_loss": -6.4723920822143555, "global_step": 16014, "epoch": 95} {"train_loss": -6.323644161224365, "global_step": 16015, "epoch": 95} {"train_loss": -6.4989519119262695, "global_step": 16016, "epoch": 95} {"train_loss": -6.435736656188965, "global_step": 16017, "epoch": 95} {"train_loss": -6.518420696258545, "global_step": 16018, "epoch": 95} {"train_loss": -6.596017837524414, "global_step": 16019, "epoch": 95} {"train_loss": -6.373291969299316, "global_step": 16020, "epoch": 95} {"train_loss": -6.452293395996094, "global_step": 16021, "epoch": 95} {"train_loss": -6.213004112243652, "global_step": 16022, "epoch": 95} {"train_loss": -6.241158485412598, "global_step": 16023, "epoch": 95} {"train_loss": -6.175383567810059, "global_step": 16024, "epoch": 95} {"train_loss": -6.548428535461426, "global_step": 16025, "epoch": 95} {"train_loss": -6.218069076538086, "global_step": 16026, "epoch": 95} {"train_loss": -6.594814777374268, "global_step": 16027, "epoch": 95} {"train_loss": -6.319295883178711, "global_step": 16028, "epoch": 95} {"train_loss": -6.244868278503418, "global_step": 16029, "epoch": 95} {"train_loss": -6.140138149261475, "global_step": 16030, "epoch": 95} {"train_loss": -6.389101505279541, "global_step": 16031, "epoch": 95} {"train_loss": -6.601119041442871, "global_step": 16032, "epoch": 95} {"train_loss": -6.340664863586426, "global_step": 16033, "epoch": 95} {"train_loss": -6.641544342041016, "global_step": 16034, "epoch": 95} {"train_loss": -6.46834659576416, "global_step": 16035, "epoch": 95} {"train_loss": -6.440335273742676, "global_step": 16036, "epoch": 95} {"train_loss": -6.419935703277588, "global_step": 16037, "epoch": 95} {"train_loss": -6.019260406494141, "global_step": 16038, "epoch": 95} {"train_loss": -6.3384294509887695, "global_step": 16039, "epoch": 95} {"train_loss": -6.399905681610107, "global_step": 16040, "epoch": 95} {"train_loss": -6.340248107910156, "global_step": 16041, "epoch": 95} {"train_loss": -6.512738227844238, "global_step": 16042, "epoch": 95} {"train_loss": -5.969979286193848, "global_step": 16043, "epoch": 95} {"train_loss": -6.124166965484619, "global_step": 16044, "epoch": 95} {"train_loss": -6.285861968994141, "global_step": 16045, "epoch": 95} {"train_loss": -6.238592147827148, "global_step": 16046, "epoch": 95} {"train_loss": -6.398654460906982, "global_step": 16047, "epoch": 95} {"train_loss": -6.1888275146484375, "global_step": 16048, "epoch": 95} {"train_loss": -6.44825553894043, "global_step": 16049, "epoch": 95} {"train_loss": -6.38075065612793, "global_step": 16050, "epoch": 95} {"train_loss": -6.590707778930664, "global_step": 16051, "epoch": 95} {"train_loss": -6.430887222290039, "global_step": 16052, "epoch": 95} {"train_loss": -6.457154750823975, "global_step": 16053, "epoch": 95} {"train_loss": -6.752978801727295, "global_step": 16054, "epoch": 95} {"train_loss": -6.332869529724121, "global_step": 16055, "epoch": 95} {"train_loss": -6.609769344329834, "global_step": 16056, "epoch": 95} {"train_loss": -6.370419502258301, "global_step": 16057, "epoch": 95} {"train_loss": -6.558343887329102, "global_step": 16058, "epoch": 95} {"train_loss": -6.629794120788574, "global_step": 16059, "epoch": 95} {"train_loss": -6.299251556396484, "global_step": 16060, "epoch": 95} {"train_loss": -6.605205535888672, "global_step": 16061, "epoch": 95} {"train_loss": -6.416434288024902, "global_step": 16062, "epoch": 95} {"train_loss": -6.560020446777344, "global_step": 16063, "epoch": 95} {"train_loss": -6.4586591720581055, "global_step": 16064, "epoch": 95} {"train_loss": -6.676264762878418, "global_step": 16065, "epoch": 95} {"train_loss": -6.449405193328857, "global_step": 16066, "epoch": 95} {"train_loss": -6.596640586853027, "global_step": 16067, "epoch": 95} {"train_loss": -6.51364278793335, "global_step": 16068, "epoch": 95} {"train_loss": -6.449899673461914, "global_step": 16069, "epoch": 95} {"train_loss": -6.406542778015137, "global_step": 16070, "epoch": 95} {"train_loss": -6.355643272399902, "global_step": 16071, "epoch": 95} {"train_loss": -6.553283214569092, "global_step": 16072, "epoch": 95} {"train_loss": -6.417176723480225, "global_step": 16073, "epoch": 95} {"train_loss": -6.631400108337402, "global_step": 16074, "epoch": 95} {"train_loss": -6.446599960327148, "global_step": 16075, "epoch": 95} {"train_loss": -6.509469985961914, "global_step": 16076, "epoch": 95} {"train_loss": -6.423413276672363, "global_step": 16077, "epoch": 95} {"train_loss": -6.480699062347412, "global_step": 16078, "epoch": 95} {"train_loss": -6.752007961273193, "global_step": 16079, "epoch": 95} {"train_loss": -6.211984634399414, "global_step": 16080, "epoch": 95} {"train_loss": -6.545689582824707, "global_step": 16081, "epoch": 95} {"train_loss": -6.317239284515381, "global_step": 16082, "epoch": 95} {"train_loss": -6.665462493896484, "global_step": 16083, "epoch": 95} {"train_loss": -6.517999649047852, "global_step": 16084, "epoch": 95} {"train_loss": -6.4120988845825195, "global_step": 16085, "epoch": 95} {"train_loss": -6.400393486022949, "global_step": 16086, "epoch": 95} {"train_loss": -6.480241775512695, "global_step": 16087, "epoch": 95} {"train_loss": -6.505279541015625, "global_step": 16088, "epoch": 95} {"train_loss": -6.593047142028809, "global_step": 16089, "epoch": 95} {"train_loss": -6.47093391418457, "global_step": 16090, "epoch": 95} {"train_loss": -6.450250148773193, "global_step": 16091, "epoch": 95} {"train_loss": -6.532125473022461, "global_step": 16092, "epoch": 95} {"train_loss": -6.394967555999756, "global_step": 16093, "epoch": 95} {"train_loss": -6.539279937744141, "global_step": 16094, "epoch": 95} {"train_loss": -6.389702796936035, "global_step": 16095, "epoch": 95} {"train_loss": -6.587732315063477, "global_step": 16096, "epoch": 95} {"train_loss": -6.335284233093262, "global_step": 16097, "epoch": 95} {"train_loss": -6.4588236808776855, "global_step": 16098, "epoch": 95} {"train_loss": -6.550477504730225, "global_step": 16099, "epoch": 95} {"train_loss": -6.815487861633301, "global_step": 16100, "epoch": 95} {"train_loss": -6.577093124389648, "global_step": 16101, "epoch": 95} {"train_loss": -6.352154731750488, "global_step": 16102, "epoch": 95} {"train_loss": -6.348678112030029, "global_step": 16103, "epoch": 95} {"train_loss": -6.5206499099731445, "global_step": 16104, "epoch": 95} {"train_loss": -6.450403690338135, "global_step": 16105, "epoch": 95} {"train_loss": -6.479683876037598, "global_step": 16106, "epoch": 95} {"train_loss": -6.699324607849121, "global_step": 16107, "epoch": 95} {"train_loss": -6.653131484985352, "global_step": 16108, "epoch": 95} {"train_loss": -6.169848442077637, "global_step": 16109, "epoch": 95} {"train_loss": -6.44288444519043, "global_step": 16110, "epoch": 95} {"train_loss": -6.407271385192871, "global_step": 16111, "epoch": 95} {"train_loss": -6.430500030517578, "global_step": 16112, "epoch": 95} {"train_loss": -6.583477973937988, "global_step": 16113, "epoch": 95} {"train_loss": -6.379567623138428, "global_step": 16114, "epoch": 95} {"train_loss": -6.553580284118652, "global_step": 16115, "epoch": 95} {"train_loss": -6.528571605682373, "global_step": 16116, "epoch": 95} {"train_loss": -6.563318252563477, "global_step": 16117, "epoch": 95} {"train_loss": -6.608148574829102, "global_step": 16118, "epoch": 95} {"train_loss": -6.511999130249023, "global_step": 16119, "epoch": 95} {"train_loss": -6.446902275085449, "global_step": 16120, "epoch": 95} {"train_loss": -6.578392028808594, "global_step": 16121, "epoch": 95} {"train_loss": -6.46908712387085, "global_step": 16122, "epoch": 95} {"train_loss": -6.489766597747803, "global_step": 16123, "epoch": 95} {"train_loss": -6.50924015045166, "global_step": 16124, "epoch": 95} {"train_loss": -6.525541305541992, "global_step": 16125, "epoch": 95} {"train_loss": -6.408106803894043, "global_step": 16126, "epoch": 95} {"train_loss": -6.434130677155086, "global_step": 16127, "epoch": 95, "val_loss": 240803.34375, "train_action_mse_error": 31.07269287109375} {"train_loss": -6.181670665740967, "global_step": 16128, "epoch": 96} {"train_loss": -6.555315971374512, "global_step": 16129, "epoch": 96} {"train_loss": -6.4388427734375, "global_step": 16130, "epoch": 96} {"train_loss": -6.646241664886475, "global_step": 16131, "epoch": 96} {"train_loss": -6.4522199630737305, "global_step": 16132, "epoch": 96} {"train_loss": -6.475734710693359, "global_step": 16133, "epoch": 96} {"train_loss": -6.525331020355225, "global_step": 16134, "epoch": 96} {"train_loss": -6.442057132720947, "global_step": 16135, "epoch": 96} {"train_loss": -6.603790283203125, "global_step": 16136, "epoch": 96} {"train_loss": -6.5505242347717285, "global_step": 16137, "epoch": 96} {"train_loss": -6.584900856018066, "global_step": 16138, "epoch": 96} {"train_loss": -6.4752702713012695, "global_step": 16139, "epoch": 96} {"train_loss": -6.478582382202148, "global_step": 16140, "epoch": 96} {"train_loss": -6.516335487365723, "global_step": 16141, "epoch": 96} {"train_loss": -6.828444480895996, "global_step": 16142, "epoch": 96} {"train_loss": -6.351012229919434, "global_step": 16143, "epoch": 96} {"train_loss": -6.56483793258667, "global_step": 16144, "epoch": 96} {"train_loss": -6.497021675109863, "global_step": 16145, "epoch": 96} {"train_loss": -6.352044582366943, "global_step": 16146, "epoch": 96} {"train_loss": -6.494945526123047, "global_step": 16147, "epoch": 96} {"train_loss": -6.435577869415283, "global_step": 16148, "epoch": 96} {"train_loss": -6.616525650024414, "global_step": 16149, "epoch": 96} {"train_loss": -6.4280195236206055, "global_step": 16150, "epoch": 96} {"train_loss": -6.572221755981445, "global_step": 16151, "epoch": 96} {"train_loss": -6.613255500793457, "global_step": 16152, "epoch": 96} {"train_loss": -6.334228515625, "global_step": 16153, "epoch": 96} {"train_loss": -6.6483001708984375, "global_step": 16154, "epoch": 96} {"train_loss": -6.520763397216797, "global_step": 16155, "epoch": 96} {"train_loss": -6.375702857971191, "global_step": 16156, "epoch": 96} {"train_loss": -6.140018463134766, "global_step": 16157, "epoch": 96} {"train_loss": -6.344148635864258, "global_step": 16158, "epoch": 96} {"train_loss": -6.59105110168457, "global_step": 16159, "epoch": 96} {"train_loss": -6.331141471862793, "global_step": 16160, "epoch": 96} {"train_loss": -6.314506530761719, "global_step": 16161, "epoch": 96} {"train_loss": -6.280091285705566, "global_step": 16162, "epoch": 96} {"train_loss": -6.46186637878418, "global_step": 16163, "epoch": 96} {"train_loss": -6.408102989196777, "global_step": 16164, "epoch": 96} {"train_loss": -6.535924911499023, "global_step": 16165, "epoch": 96} {"train_loss": -6.636514186859131, "global_step": 16166, "epoch": 96} {"train_loss": -6.5734148025512695, "global_step": 16167, "epoch": 96} {"train_loss": -6.503437519073486, "global_step": 16168, "epoch": 96} {"train_loss": -6.634951591491699, "global_step": 16169, "epoch": 96} {"train_loss": -6.609590530395508, "global_step": 16170, "epoch": 96} {"train_loss": -6.3997087478637695, "global_step": 16171, "epoch": 96} {"train_loss": -6.1894378662109375, "global_step": 16172, "epoch": 96} {"train_loss": -6.491476058959961, "global_step": 16173, "epoch": 96} {"train_loss": -6.206530570983887, "global_step": 16174, "epoch": 96} {"train_loss": -6.485696792602539, "global_step": 16175, "epoch": 96} {"train_loss": -6.4154157638549805, "global_step": 16176, "epoch": 96} {"train_loss": -6.439871788024902, "global_step": 16177, "epoch": 96} {"train_loss": -6.490907192230225, "global_step": 16178, "epoch": 96} {"train_loss": -6.427655220031738, "global_step": 16179, "epoch": 96} {"train_loss": -6.640922546386719, "global_step": 16180, "epoch": 96} {"train_loss": -6.337212562561035, "global_step": 16181, "epoch": 96} {"train_loss": -6.329535484313965, "global_step": 16182, "epoch": 96} {"train_loss": -6.3504133224487305, "global_step": 16183, "epoch": 96} {"train_loss": -6.423976898193359, "global_step": 16184, "epoch": 96} {"train_loss": -6.313162803649902, "global_step": 16185, "epoch": 96} {"train_loss": -6.51900577545166, "global_step": 16186, "epoch": 96} {"train_loss": -6.305037498474121, "global_step": 16187, "epoch": 96} {"train_loss": -6.769634246826172, "global_step": 16188, "epoch": 96} {"train_loss": -6.288618087768555, "global_step": 16189, "epoch": 96} {"train_loss": -6.181153297424316, "global_step": 16190, "epoch": 96} {"train_loss": -6.514537334442139, "global_step": 16191, "epoch": 96} {"train_loss": -6.6132049560546875, "global_step": 16192, "epoch": 96} {"train_loss": -6.507025718688965, "global_step": 16193, "epoch": 96} {"train_loss": -6.410048484802246, "global_step": 16194, "epoch": 96} {"train_loss": -6.655677318572998, "global_step": 16195, "epoch": 96} {"train_loss": -6.033422946929932, "global_step": 16196, "epoch": 96} {"train_loss": -6.49088191986084, "global_step": 16197, "epoch": 96} {"train_loss": -6.101055145263672, "global_step": 16198, "epoch": 96} {"train_loss": -6.4750542640686035, "global_step": 16199, "epoch": 96} {"train_loss": -6.287248611450195, "global_step": 16200, "epoch": 96} {"train_loss": -6.043946266174316, "global_step": 16201, "epoch": 96} {"train_loss": -6.434355735778809, "global_step": 16202, "epoch": 96} {"train_loss": -6.416815757751465, "global_step": 16203, "epoch": 96} {"train_loss": -6.59685754776001, "global_step": 16204, "epoch": 96} {"train_loss": -6.2760910987854, "global_step": 16205, "epoch": 96} {"train_loss": -6.31656551361084, "global_step": 16206, "epoch": 96} {"train_loss": -6.385287761688232, "global_step": 16207, "epoch": 96} {"train_loss": -6.46097469329834, "global_step": 16208, "epoch": 96} {"train_loss": -6.449267387390137, "global_step": 16209, "epoch": 96} {"train_loss": -6.378390312194824, "global_step": 16210, "epoch": 96} {"train_loss": -6.4660258293151855, "global_step": 16211, "epoch": 96} {"train_loss": -6.478198528289795, "global_step": 16212, "epoch": 96} {"train_loss": -6.548344612121582, "global_step": 16213, "epoch": 96} {"train_loss": -6.441714763641357, "global_step": 16214, "epoch": 96} {"train_loss": -6.461758136749268, "global_step": 16215, "epoch": 96} {"train_loss": -6.452531814575195, "global_step": 16216, "epoch": 96} {"train_loss": -6.5688958168029785, "global_step": 16217, "epoch": 96} {"train_loss": -6.503129959106445, "global_step": 16218, "epoch": 96} {"train_loss": -6.432806491851807, "global_step": 16219, "epoch": 96} {"train_loss": -6.431432723999023, "global_step": 16220, "epoch": 96} {"train_loss": -6.371490478515625, "global_step": 16221, "epoch": 96} {"train_loss": -6.6775407791137695, "global_step": 16222, "epoch": 96} {"train_loss": -6.384974002838135, "global_step": 16223, "epoch": 96} {"train_loss": -6.501147747039795, "global_step": 16224, "epoch": 96} {"train_loss": -6.328090190887451, "global_step": 16225, "epoch": 96} {"train_loss": -6.314971446990967, "global_step": 16226, "epoch": 96} {"train_loss": -6.406635761260986, "global_step": 16227, "epoch": 96} {"train_loss": -6.520561218261719, "global_step": 16228, "epoch": 96} {"train_loss": -6.681694507598877, "global_step": 16229, "epoch": 96} {"train_loss": -6.3736467361450195, "global_step": 16230, "epoch": 96} {"train_loss": -6.500371932983398, "global_step": 16231, "epoch": 96} {"train_loss": -6.694519996643066, "global_step": 16232, "epoch": 96} {"train_loss": -6.574278354644775, "global_step": 16233, "epoch": 96} {"train_loss": -6.372427940368652, "global_step": 16234, "epoch": 96} {"train_loss": -6.682618141174316, "global_step": 16235, "epoch": 96} {"train_loss": -6.3587188720703125, "global_step": 16236, "epoch": 96} {"train_loss": -6.547804832458496, "global_step": 16237, "epoch": 96} {"train_loss": -6.4957194328308105, "global_step": 16238, "epoch": 96} {"train_loss": -6.336980819702148, "global_step": 16239, "epoch": 96} {"train_loss": -6.530416488647461, "global_step": 16240, "epoch": 96} {"train_loss": -6.616487503051758, "global_step": 16241, "epoch": 96} {"train_loss": -6.370196342468262, "global_step": 16242, "epoch": 96} {"train_loss": -6.4996795654296875, "global_step": 16243, "epoch": 96} {"train_loss": -6.592944145202637, "global_step": 16244, "epoch": 96} {"train_loss": -6.70337438583374, "global_step": 16245, "epoch": 96} {"train_loss": -6.54799747467041, "global_step": 16246, "epoch": 96} {"train_loss": -6.525276184082031, "global_step": 16247, "epoch": 96} {"train_loss": -6.749016761779785, "global_step": 16248, "epoch": 96} {"train_loss": -6.389015197753906, "global_step": 16249, "epoch": 96} {"train_loss": -6.952660083770752, "global_step": 16250, "epoch": 96} {"train_loss": -6.533709526062012, "global_step": 16251, "epoch": 96} {"train_loss": -6.488153457641602, "global_step": 16252, "epoch": 96} {"train_loss": -6.555062294006348, "global_step": 16253, "epoch": 96} {"train_loss": -6.541182518005371, "global_step": 16254, "epoch": 96} {"train_loss": -6.552157402038574, "global_step": 16255, "epoch": 96} {"train_loss": -6.265867233276367, "global_step": 16256, "epoch": 96} {"train_loss": -6.509483337402344, "global_step": 16257, "epoch": 96} {"train_loss": -6.454733848571777, "global_step": 16258, "epoch": 96} {"train_loss": -6.3670454025268555, "global_step": 16259, "epoch": 96} {"train_loss": -6.65275239944458, "global_step": 16260, "epoch": 96} {"train_loss": -6.7636542320251465, "global_step": 16261, "epoch": 96} {"train_loss": -6.411684989929199, "global_step": 16262, "epoch": 96} {"train_loss": -6.594201564788818, "global_step": 16263, "epoch": 96} {"train_loss": -6.619358062744141, "global_step": 16264, "epoch": 96} {"train_loss": -6.499439239501953, "global_step": 16265, "epoch": 96} {"train_loss": -6.435215950012207, "global_step": 16266, "epoch": 96} {"train_loss": -6.502534866333008, "global_step": 16267, "epoch": 96} {"train_loss": -6.750292778015137, "global_step": 16268, "epoch": 96} {"train_loss": -6.353000640869141, "global_step": 16269, "epoch": 96} {"train_loss": -6.643677711486816, "global_step": 16270, "epoch": 96} {"train_loss": -6.425063610076904, "global_step": 16271, "epoch": 96} {"train_loss": -6.380449295043945, "global_step": 16272, "epoch": 96} {"train_loss": -6.551007270812988, "global_step": 16273, "epoch": 96} {"train_loss": -6.513726711273193, "global_step": 16274, "epoch": 96} {"train_loss": -6.284358024597168, "global_step": 16275, "epoch": 96} {"train_loss": -6.425504207611084, "global_step": 16276, "epoch": 96} {"train_loss": -6.564913749694824, "global_step": 16277, "epoch": 96} {"train_loss": -6.245207786560059, "global_step": 16278, "epoch": 96} {"train_loss": -6.327639102935791, "global_step": 16279, "epoch": 96} {"train_loss": -6.465076446533203, "global_step": 16280, "epoch": 96} {"train_loss": -6.164907455444336, "global_step": 16281, "epoch": 96} {"train_loss": -6.603363990783691, "global_step": 16282, "epoch": 96} {"train_loss": -6.430572032928467, "global_step": 16283, "epoch": 96} {"train_loss": -6.479766845703125, "global_step": 16284, "epoch": 96} {"train_loss": -6.297296047210693, "global_step": 16285, "epoch": 96} {"train_loss": -6.599417686462402, "global_step": 16286, "epoch": 96} {"train_loss": -6.414645195007324, "global_step": 16287, "epoch": 96} {"train_loss": -6.307485103607178, "global_step": 16288, "epoch": 96} {"train_loss": -6.6501288414001465, "global_step": 16289, "epoch": 96} {"train_loss": -6.466192245483398, "global_step": 16290, "epoch": 96} {"train_loss": -6.375509262084961, "global_step": 16291, "epoch": 96} {"train_loss": -6.398089408874512, "global_step": 16292, "epoch": 96} {"train_loss": -6.533616542816162, "global_step": 16293, "epoch": 96} {"train_loss": -6.364328384399414, "global_step": 16294, "epoch": 96} {"train_loss": -6.464806846209934, "global_step": 16295, "epoch": 96, "val_loss": 232072.109375} {"train_loss": -6.674365043640137, "global_step": 16296, "epoch": 97} {"train_loss": -6.208865165710449, "global_step": 16297, "epoch": 97} {"train_loss": -6.787659645080566, "global_step": 16298, "epoch": 97} {"train_loss": -6.566197395324707, "global_step": 16299, "epoch": 97} {"train_loss": -6.734418869018555, "global_step": 16300, "epoch": 97} {"train_loss": -6.629302978515625, "global_step": 16301, "epoch": 97} {"train_loss": -6.554904460906982, "global_step": 16302, "epoch": 97} {"train_loss": -6.798975944519043, "global_step": 16303, "epoch": 97} {"train_loss": -6.765024662017822, "global_step": 16304, "epoch": 97} {"train_loss": -6.544554710388184, "global_step": 16305, "epoch": 97} {"train_loss": -6.580955982208252, "global_step": 16306, "epoch": 97} {"train_loss": -6.607649326324463, "global_step": 16307, "epoch": 97} {"train_loss": -6.750189781188965, "global_step": 16308, "epoch": 97} {"train_loss": -6.215265274047852, "global_step": 16309, "epoch": 97} {"train_loss": -6.4404296875, "global_step": 16310, "epoch": 97} {"train_loss": -6.309065818786621, "global_step": 16311, "epoch": 97} {"train_loss": -6.082370758056641, "global_step": 16312, "epoch": 97} {"train_loss": -6.417631149291992, "global_step": 16313, "epoch": 97} {"train_loss": -6.497305870056152, "global_step": 16314, "epoch": 97} {"train_loss": -6.615175247192383, "global_step": 16315, "epoch": 97} {"train_loss": -6.5817461013793945, "global_step": 16316, "epoch": 97} {"train_loss": -6.748668193817139, "global_step": 16317, "epoch": 97} {"train_loss": -6.575741767883301, "global_step": 16318, "epoch": 97} {"train_loss": -6.694777965545654, "global_step": 16319, "epoch": 97} {"train_loss": -6.623081207275391, "global_step": 16320, "epoch": 97} {"train_loss": -6.464611053466797, "global_step": 16321, "epoch": 97} {"train_loss": -6.7557854652404785, "global_step": 16322, "epoch": 97} {"train_loss": -6.465726375579834, "global_step": 16323, "epoch": 97} {"train_loss": -6.544660568237305, "global_step": 16324, "epoch": 97} {"train_loss": -6.297120094299316, "global_step": 16325, "epoch": 97} {"train_loss": -6.649827003479004, "global_step": 16326, "epoch": 97} {"train_loss": -6.415838241577148, "global_step": 16327, "epoch": 97} {"train_loss": -6.570048809051514, "global_step": 16328, "epoch": 97} {"train_loss": -6.306493282318115, "global_step": 16329, "epoch": 97} {"train_loss": -6.603923797607422, "global_step": 16330, "epoch": 97} {"train_loss": -6.35239315032959, "global_step": 16331, "epoch": 97} {"train_loss": -6.633056640625, "global_step": 16332, "epoch": 97} {"train_loss": -6.507544040679932, "global_step": 16333, "epoch": 97} {"train_loss": -6.729488372802734, "global_step": 16334, "epoch": 97} {"train_loss": -6.447253227233887, "global_step": 16335, "epoch": 97} {"train_loss": -6.691347122192383, "global_step": 16336, "epoch": 97} {"train_loss": -6.555755615234375, "global_step": 16337, "epoch": 97} {"train_loss": -6.472848892211914, "global_step": 16338, "epoch": 97} {"train_loss": -6.476350784301758, "global_step": 16339, "epoch": 97} {"train_loss": -6.3718414306640625, "global_step": 16340, "epoch": 97} {"train_loss": -6.146727561950684, "global_step": 16341, "epoch": 97} {"train_loss": -6.519585609436035, "global_step": 16342, "epoch": 97} {"train_loss": -6.560451507568359, "global_step": 16343, "epoch": 97} {"train_loss": -6.6719970703125, "global_step": 16344, "epoch": 97} {"train_loss": -6.5880584716796875, "global_step": 16345, "epoch": 97} {"train_loss": -6.584773063659668, "global_step": 16346, "epoch": 97} {"train_loss": -6.422369956970215, "global_step": 16347, "epoch": 97} {"train_loss": -6.44376802444458, "global_step": 16348, "epoch": 97} {"train_loss": -6.671291351318359, "global_step": 16349, "epoch": 97} {"train_loss": -6.132654666900635, "global_step": 16350, "epoch": 97} {"train_loss": -6.6707329750061035, "global_step": 16351, "epoch": 97} {"train_loss": -6.400947093963623, "global_step": 16352, "epoch": 97} {"train_loss": -6.482616424560547, "global_step": 16353, "epoch": 97} {"train_loss": -6.3056640625, "global_step": 16354, "epoch": 97} {"train_loss": -6.422940731048584, "global_step": 16355, "epoch": 97} {"train_loss": -6.717629432678223, "global_step": 16356, "epoch": 97} {"train_loss": -6.387751579284668, "global_step": 16357, "epoch": 97} {"train_loss": -6.644286155700684, "global_step": 16358, "epoch": 97} {"train_loss": -6.4455366134643555, "global_step": 16359, "epoch": 97} {"train_loss": -6.484196186065674, "global_step": 16360, "epoch": 97} {"train_loss": -6.50065803527832, "global_step": 16361, "epoch": 97} {"train_loss": -6.398701190948486, "global_step": 16362, "epoch": 97} {"train_loss": -6.73294734954834, "global_step": 16363, "epoch": 97} {"train_loss": -6.162874221801758, "global_step": 16364, "epoch": 97} {"train_loss": -6.6629204750061035, "global_step": 16365, "epoch": 97} {"train_loss": -6.253241539001465, "global_step": 16366, "epoch": 97} {"train_loss": -6.627605438232422, "global_step": 16367, "epoch": 97} {"train_loss": -6.49923038482666, "global_step": 16368, "epoch": 97} {"train_loss": -6.7096734046936035, "global_step": 16369, "epoch": 97} {"train_loss": -6.442852020263672, "global_step": 16370, "epoch": 97} {"train_loss": -6.796735763549805, "global_step": 16371, "epoch": 97} {"train_loss": -6.451360702514648, "global_step": 16372, "epoch": 97} {"train_loss": -6.451868534088135, "global_step": 16373, "epoch": 97} {"train_loss": -6.426255226135254, "global_step": 16374, "epoch": 97} {"train_loss": -6.499423027038574, "global_step": 16375, "epoch": 97} {"train_loss": -6.487070560455322, "global_step": 16376, "epoch": 97} {"train_loss": -6.334300994873047, "global_step": 16377, "epoch": 97} {"train_loss": -6.404536724090576, "global_step": 16378, "epoch": 97} {"train_loss": -6.549567699432373, "global_step": 16379, "epoch": 97} {"train_loss": -6.829682350158691, "global_step": 16380, "epoch": 97} {"train_loss": -6.449626922607422, "global_step": 16381, "epoch": 97} {"train_loss": -6.389094352722168, "global_step": 16382, "epoch": 97} {"train_loss": -6.639298439025879, "global_step": 16383, "epoch": 97} {"train_loss": -6.758530139923096, "global_step": 16384, "epoch": 97} {"train_loss": -6.4095563888549805, "global_step": 16385, "epoch": 97} {"train_loss": -6.553319931030273, "global_step": 16386, "epoch": 97} {"train_loss": -6.39023494720459, "global_step": 16387, "epoch": 97} {"train_loss": -6.518911838531494, "global_step": 16388, "epoch": 97} {"train_loss": -6.483857154846191, "global_step": 16389, "epoch": 97} {"train_loss": -6.347140312194824, "global_step": 16390, "epoch": 97} {"train_loss": -6.555050849914551, "global_step": 16391, "epoch": 97} {"train_loss": -6.2713518142700195, "global_step": 16392, "epoch": 97} {"train_loss": -6.611489295959473, "global_step": 16393, "epoch": 97} {"train_loss": -6.366748332977295, "global_step": 16394, "epoch": 97} {"train_loss": -6.916545867919922, "global_step": 16395, "epoch": 97} {"train_loss": -6.477298736572266, "global_step": 16396, "epoch": 97} {"train_loss": -6.390414714813232, "global_step": 16397, "epoch": 97} {"train_loss": -6.343704700469971, "global_step": 16398, "epoch": 97} {"train_loss": -6.241763114929199, "global_step": 16399, "epoch": 97} {"train_loss": -6.401497840881348, "global_step": 16400, "epoch": 97} {"train_loss": -6.5660858154296875, "global_step": 16401, "epoch": 97} {"train_loss": -6.38677978515625, "global_step": 16402, "epoch": 97} {"train_loss": -6.384185314178467, "global_step": 16403, "epoch": 97} {"train_loss": -6.568551063537598, "global_step": 16404, "epoch": 97} {"train_loss": -6.555747985839844, "global_step": 16405, "epoch": 97} {"train_loss": -6.511053085327148, "global_step": 16406, "epoch": 97} {"train_loss": -6.6171159744262695, "global_step": 16407, "epoch": 97} {"train_loss": -6.384369373321533, "global_step": 16408, "epoch": 97} {"train_loss": -6.3448333740234375, "global_step": 16409, "epoch": 97} {"train_loss": -6.233630180358887, "global_step": 16410, "epoch": 97} {"train_loss": -6.294505596160889, "global_step": 16411, "epoch": 97} {"train_loss": -6.7450337409973145, "global_step": 16412, "epoch": 97} {"train_loss": -6.369638442993164, "global_step": 16413, "epoch": 97} {"train_loss": -6.454042434692383, "global_step": 16414, "epoch": 97} {"train_loss": -6.356561183929443, "global_step": 16415, "epoch": 97} {"train_loss": -6.551552772521973, "global_step": 16416, "epoch": 97} {"train_loss": -6.557351112365723, "global_step": 16417, "epoch": 97} {"train_loss": -6.304566860198975, "global_step": 16418, "epoch": 97} {"train_loss": -6.483213424682617, "global_step": 16419, "epoch": 97} {"train_loss": -6.329693794250488, "global_step": 16420, "epoch": 97} {"train_loss": -6.3227410316467285, "global_step": 16421, "epoch": 97} {"train_loss": -6.655474662780762, "global_step": 16422, "epoch": 97} {"train_loss": -5.966585159301758, "global_step": 16423, "epoch": 97} {"train_loss": -6.494030952453613, "global_step": 16424, "epoch": 97} {"train_loss": -6.446126937866211, "global_step": 16425, "epoch": 97} {"train_loss": -6.189067840576172, "global_step": 16426, "epoch": 97} {"train_loss": -6.6248345375061035, "global_step": 16427, "epoch": 97} {"train_loss": -6.1636857986450195, "global_step": 16428, "epoch": 97} {"train_loss": -6.318121433258057, "global_step": 16429, "epoch": 97} {"train_loss": -6.4607343673706055, "global_step": 16430, "epoch": 97} {"train_loss": -6.232551097869873, "global_step": 16431, "epoch": 97} {"train_loss": -6.428660869598389, "global_step": 16432, "epoch": 97} {"train_loss": -6.511618614196777, "global_step": 16433, "epoch": 97} {"train_loss": -6.450568199157715, "global_step": 16434, "epoch": 97} {"train_loss": -6.618415832519531, "global_step": 16435, "epoch": 97} {"train_loss": -6.488051891326904, "global_step": 16436, "epoch": 97} {"train_loss": -6.6885881423950195, "global_step": 16437, "epoch": 97} {"train_loss": -6.508956432342529, "global_step": 16438, "epoch": 97} {"train_loss": -6.5642499923706055, "global_step": 16439, "epoch": 97} {"train_loss": -6.325874328613281, "global_step": 16440, "epoch": 97} {"train_loss": -6.532070159912109, "global_step": 16441, "epoch": 97} {"train_loss": -6.612090110778809, "global_step": 16442, "epoch": 97} {"train_loss": -6.388208389282227, "global_step": 16443, "epoch": 97} {"train_loss": -6.573359966278076, "global_step": 16444, "epoch": 97} {"train_loss": -6.626574516296387, "global_step": 16445, "epoch": 97} {"train_loss": -6.489772796630859, "global_step": 16446, "epoch": 97} {"train_loss": -6.346120834350586, "global_step": 16447, "epoch": 97} {"train_loss": -6.185564041137695, "global_step": 16448, "epoch": 97} {"train_loss": -6.40211296081543, "global_step": 16449, "epoch": 97} {"train_loss": -6.288351535797119, "global_step": 16450, "epoch": 97} {"train_loss": -6.737908363342285, "global_step": 16451, "epoch": 97} {"train_loss": -6.512861251831055, "global_step": 16452, "epoch": 97} {"train_loss": -6.514173984527588, "global_step": 16453, "epoch": 97} {"train_loss": -6.620765209197998, "global_step": 16454, "epoch": 97} {"train_loss": -6.653339385986328, "global_step": 16455, "epoch": 97} {"train_loss": -6.480574607849121, "global_step": 16456, "epoch": 97} {"train_loss": -6.614778995513916, "global_step": 16457, "epoch": 97} {"train_loss": -6.289263725280762, "global_step": 16458, "epoch": 97} {"train_loss": -6.606111526489258, "global_step": 16459, "epoch": 97} {"train_loss": -6.5182294845581055, "global_step": 16460, "epoch": 97} {"train_loss": -6.442281246185303, "global_step": 16461, "epoch": 97} {"train_loss": -6.624504089355469, "global_step": 16462, "epoch": 97} {"train_loss": -6.490394007591974, "global_step": 16463, "epoch": 97, "val_loss": 238392.609375} {"train_loss": -6.429375171661377, "global_step": 16464, "epoch": 98} {"train_loss": -6.396268844604492, "global_step": 16465, "epoch": 98} {"train_loss": -6.43428373336792, "global_step": 16466, "epoch": 98} {"train_loss": -6.496738910675049, "global_step": 16467, "epoch": 98} {"train_loss": -6.020209312438965, "global_step": 16468, "epoch": 98} {"train_loss": -6.325244426727295, "global_step": 16469, "epoch": 98} {"train_loss": -6.576428413391113, "global_step": 16470, "epoch": 98} {"train_loss": -6.492681503295898, "global_step": 16471, "epoch": 98} {"train_loss": -6.132887363433838, "global_step": 16472, "epoch": 98} {"train_loss": -6.3889288902282715, "global_step": 16473, "epoch": 98} {"train_loss": -6.1661272048950195, "global_step": 16474, "epoch": 98} {"train_loss": -6.404821395874023, "global_step": 16475, "epoch": 98} {"train_loss": -6.407162189483643, "global_step": 16476, "epoch": 98} {"train_loss": -6.372175216674805, "global_step": 16477, "epoch": 98} {"train_loss": -6.617400646209717, "global_step": 16478, "epoch": 98} {"train_loss": -6.277667045593262, "global_step": 16479, "epoch": 98} {"train_loss": -6.394546985626221, "global_step": 16480, "epoch": 98} {"train_loss": -6.524913787841797, "global_step": 16481, "epoch": 98} {"train_loss": -6.084033966064453, "global_step": 16482, "epoch": 98} {"train_loss": -6.770356178283691, "global_step": 16483, "epoch": 98} {"train_loss": -6.446493148803711, "global_step": 16484, "epoch": 98} {"train_loss": -6.57375955581665, "global_step": 16485, "epoch": 98} {"train_loss": -6.418412208557129, "global_step": 16486, "epoch": 98} {"train_loss": -6.092949867248535, "global_step": 16487, "epoch": 98} {"train_loss": -6.559675216674805, "global_step": 16488, "epoch": 98} {"train_loss": -6.406493663787842, "global_step": 16489, "epoch": 98} {"train_loss": -6.482278823852539, "global_step": 16490, "epoch": 98} {"train_loss": -6.307220458984375, "global_step": 16491, "epoch": 98} {"train_loss": -6.263327598571777, "global_step": 16492, "epoch": 98} {"train_loss": -6.437528610229492, "global_step": 16493, "epoch": 98} {"train_loss": -6.455465316772461, "global_step": 16494, "epoch": 98} {"train_loss": -6.308880805969238, "global_step": 16495, "epoch": 98} {"train_loss": -6.640947341918945, "global_step": 16496, "epoch": 98} {"train_loss": -6.242763519287109, "global_step": 16497, "epoch": 98} {"train_loss": -6.540145397186279, "global_step": 16498, "epoch": 98} {"train_loss": -6.391354560852051, "global_step": 16499, "epoch": 98} {"train_loss": -6.318140983581543, "global_step": 16500, "epoch": 98} {"train_loss": -6.487129211425781, "global_step": 16501, "epoch": 98} {"train_loss": -6.533124923706055, "global_step": 16502, "epoch": 98} {"train_loss": -6.508552551269531, "global_step": 16503, "epoch": 98} {"train_loss": -6.398796558380127, "global_step": 16504, "epoch": 98} {"train_loss": -6.356988906860352, "global_step": 16505, "epoch": 98} {"train_loss": -6.389732360839844, "global_step": 16506, "epoch": 98} {"train_loss": -6.341351509094238, "global_step": 16507, "epoch": 98} {"train_loss": -6.373895645141602, "global_step": 16508, "epoch": 98} {"train_loss": -6.42557430267334, "global_step": 16509, "epoch": 98} {"train_loss": -6.463737487792969, "global_step": 16510, "epoch": 98} {"train_loss": -6.438665390014648, "global_step": 16511, "epoch": 98} {"train_loss": -6.384479522705078, "global_step": 16512, "epoch": 98} {"train_loss": -6.34810733795166, "global_step": 16513, "epoch": 98} {"train_loss": -6.5197649002075195, "global_step": 16514, "epoch": 98} {"train_loss": -6.5461931228637695, "global_step": 16515, "epoch": 98} {"train_loss": -6.3496479988098145, "global_step": 16516, "epoch": 98} {"train_loss": -6.556110858917236, "global_step": 16517, "epoch": 98} {"train_loss": -6.534069061279297, "global_step": 16518, "epoch": 98} {"train_loss": -6.494940757751465, "global_step": 16519, "epoch": 98} {"train_loss": -6.400808811187744, "global_step": 16520, "epoch": 98} {"train_loss": -6.7429609298706055, "global_step": 16521, "epoch": 98} {"train_loss": -6.398393630981445, "global_step": 16522, "epoch": 98} {"train_loss": -6.4667277336120605, "global_step": 16523, "epoch": 98} {"train_loss": -6.569611072540283, "global_step": 16524, "epoch": 98} {"train_loss": -6.524033546447754, "global_step": 16525, "epoch": 98} {"train_loss": -6.358473300933838, "global_step": 16526, "epoch": 98} {"train_loss": -6.584608554840088, "global_step": 16527, "epoch": 98} {"train_loss": -6.5484700202941895, "global_step": 16528, "epoch": 98} {"train_loss": -6.54218864440918, "global_step": 16529, "epoch": 98} {"train_loss": -6.542900085449219, "global_step": 16530, "epoch": 98} {"train_loss": -6.614912033081055, "global_step": 16531, "epoch": 98} {"train_loss": -6.829080581665039, "global_step": 16532, "epoch": 98} {"train_loss": -6.597258567810059, "global_step": 16533, "epoch": 98} {"train_loss": -6.611964702606201, "global_step": 16534, "epoch": 98} {"train_loss": -6.671441078186035, "global_step": 16535, "epoch": 98} {"train_loss": -6.380197525024414, "global_step": 16536, "epoch": 98} {"train_loss": -6.586203575134277, "global_step": 16537, "epoch": 98} {"train_loss": -6.593317985534668, "global_step": 16538, "epoch": 98} {"train_loss": -6.782846450805664, "global_step": 16539, "epoch": 98} {"train_loss": -6.596607685089111, "global_step": 16540, "epoch": 98} {"train_loss": -6.459393501281738, "global_step": 16541, "epoch": 98} {"train_loss": -6.675872802734375, "global_step": 16542, "epoch": 98} {"train_loss": -6.535517692565918, "global_step": 16543, "epoch": 98} {"train_loss": -6.527005195617676, "global_step": 16544, "epoch": 98} {"train_loss": -6.708623886108398, "global_step": 16545, "epoch": 98} {"train_loss": -6.618094444274902, "global_step": 16546, "epoch": 98} {"train_loss": -6.604783535003662, "global_step": 16547, "epoch": 98} {"train_loss": -6.742107391357422, "global_step": 16548, "epoch": 98} {"train_loss": -6.732317924499512, "global_step": 16549, "epoch": 98} {"train_loss": -6.524043083190918, "global_step": 16550, "epoch": 98} {"train_loss": -6.606781482696533, "global_step": 16551, "epoch": 98} {"train_loss": -6.233621597290039, "global_step": 16552, "epoch": 98} {"train_loss": -6.812372207641602, "global_step": 16553, "epoch": 98} {"train_loss": -6.420379638671875, "global_step": 16554, "epoch": 98} {"train_loss": -6.4531474113464355, "global_step": 16555, "epoch": 98} {"train_loss": -6.473545074462891, "global_step": 16556, "epoch": 98} {"train_loss": -6.551075458526611, "global_step": 16557, "epoch": 98} {"train_loss": -6.684922218322754, "global_step": 16558, "epoch": 98} {"train_loss": -6.352406978607178, "global_step": 16559, "epoch": 98} {"train_loss": -6.573712348937988, "global_step": 16560, "epoch": 98} {"train_loss": -6.384550094604492, "global_step": 16561, "epoch": 98} {"train_loss": -6.460433006286621, "global_step": 16562, "epoch": 98} {"train_loss": -6.621474266052246, "global_step": 16563, "epoch": 98} {"train_loss": -6.558284759521484, "global_step": 16564, "epoch": 98} {"train_loss": -6.579807758331299, "global_step": 16565, "epoch": 98} {"train_loss": -6.60501766204834, "global_step": 16566, "epoch": 98} {"train_loss": -6.447476387023926, "global_step": 16567, "epoch": 98} {"train_loss": -6.441038608551025, "global_step": 16568, "epoch": 98} {"train_loss": -6.3170318603515625, "global_step": 16569, "epoch": 98} {"train_loss": -6.428540229797363, "global_step": 16570, "epoch": 98} {"train_loss": -6.625640869140625, "global_step": 16571, "epoch": 98} {"train_loss": -6.513785362243652, "global_step": 16572, "epoch": 98} {"train_loss": -6.427913665771484, "global_step": 16573, "epoch": 98} {"train_loss": -6.572497844696045, "global_step": 16574, "epoch": 98} {"train_loss": -6.308113098144531, "global_step": 16575, "epoch": 98} {"train_loss": -6.684243202209473, "global_step": 16576, "epoch": 98} {"train_loss": -6.591053009033203, "global_step": 16577, "epoch": 98} {"train_loss": -6.407628059387207, "global_step": 16578, "epoch": 98} {"train_loss": -6.640578746795654, "global_step": 16579, "epoch": 98} {"train_loss": -6.360347747802734, "global_step": 16580, "epoch": 98} {"train_loss": -6.455431938171387, "global_step": 16581, "epoch": 98} {"train_loss": -6.432518482208252, "global_step": 16582, "epoch": 98} {"train_loss": -6.57354736328125, "global_step": 16583, "epoch": 98} {"train_loss": -6.497335910797119, "global_step": 16584, "epoch": 98} {"train_loss": -6.670175075531006, "global_step": 16585, "epoch": 98} {"train_loss": -6.366344928741455, "global_step": 16586, "epoch": 98} {"train_loss": -6.596869945526123, "global_step": 16587, "epoch": 98} {"train_loss": -6.692239284515381, "global_step": 16588, "epoch": 98} {"train_loss": -6.364353179931641, "global_step": 16589, "epoch": 98} {"train_loss": -6.595355033874512, "global_step": 16590, "epoch": 98} {"train_loss": -6.605621337890625, "global_step": 16591, "epoch": 98} {"train_loss": -6.584075450897217, "global_step": 16592, "epoch": 98} {"train_loss": -6.307704925537109, "global_step": 16593, "epoch": 98} {"train_loss": -6.6791582107543945, "global_step": 16594, "epoch": 98} {"train_loss": -6.590548515319824, "global_step": 16595, "epoch": 98} {"train_loss": -6.688537120819092, "global_step": 16596, "epoch": 98} {"train_loss": -6.623743534088135, "global_step": 16597, "epoch": 98} {"train_loss": -6.643320083618164, "global_step": 16598, "epoch": 98} {"train_loss": -6.697874069213867, "global_step": 16599, "epoch": 98} {"train_loss": -6.736114978790283, "global_step": 16600, "epoch": 98} {"train_loss": -6.571843147277832, "global_step": 16601, "epoch": 98} {"train_loss": -6.432653427124023, "global_step": 16602, "epoch": 98} {"train_loss": -6.546459197998047, "global_step": 16603, "epoch": 98} {"train_loss": -6.605635643005371, "global_step": 16604, "epoch": 98} {"train_loss": -6.7253570556640625, "global_step": 16605, "epoch": 98} {"train_loss": -6.580239772796631, "global_step": 16606, "epoch": 98} {"train_loss": -6.8023681640625, "global_step": 16607, "epoch": 98} {"train_loss": -6.751482009887695, "global_step": 16608, "epoch": 98} {"train_loss": -6.325248718261719, "global_step": 16609, "epoch": 98} {"train_loss": -6.6412153244018555, "global_step": 16610, "epoch": 98} {"train_loss": -6.755657196044922, "global_step": 16611, "epoch": 98} {"train_loss": -6.580986976623535, "global_step": 16612, "epoch": 98} {"train_loss": -6.640720844268799, "global_step": 16613, "epoch": 98} {"train_loss": -6.438666820526123, "global_step": 16614, "epoch": 98} {"train_loss": -6.477373123168945, "global_step": 16615, "epoch": 98} {"train_loss": -6.526247978210449, "global_step": 16616, "epoch": 98} {"train_loss": -6.447068214416504, "global_step": 16617, "epoch": 98} {"train_loss": -6.503043174743652, "global_step": 16618, "epoch": 98} {"train_loss": -6.192341327667236, "global_step": 16619, "epoch": 98} {"train_loss": -6.6750078201293945, "global_step": 16620, "epoch": 98} {"train_loss": -6.534714221954346, "global_step": 16621, "epoch": 98} {"train_loss": -6.62630558013916, "global_step": 16622, "epoch": 98} {"train_loss": -6.687758445739746, "global_step": 16623, "epoch": 98} {"train_loss": -6.836452484130859, "global_step": 16624, "epoch": 98} {"train_loss": -6.485831260681152, "global_step": 16625, "epoch": 98} {"train_loss": -6.660001754760742, "global_step": 16626, "epoch": 98} {"train_loss": -6.689064979553223, "global_step": 16627, "epoch": 98} {"train_loss": -6.5022053718566895, "global_step": 16628, "epoch": 98} {"train_loss": -6.479251861572266, "global_step": 16629, "epoch": 98} {"train_loss": -6.637833118438721, "global_step": 16630, "epoch": 98} {"train_loss": -6.507862227303641, "global_step": 16631, "epoch": 98, "val_loss": 237745.4375} {"train_loss": -6.507542610168457, "global_step": 16632, "epoch": 99} {"train_loss": -6.380522727966309, "global_step": 16633, "epoch": 99} {"train_loss": -6.265374660491943, "global_step": 16634, "epoch": 99} {"train_loss": -6.520825386047363, "global_step": 16635, "epoch": 99} {"train_loss": -6.387840270996094, "global_step": 16636, "epoch": 99} {"train_loss": -6.351458549499512, "global_step": 16637, "epoch": 99} {"train_loss": -6.553558349609375, "global_step": 16638, "epoch": 99} {"train_loss": -6.476120471954346, "global_step": 16639, "epoch": 99} {"train_loss": -6.51212215423584, "global_step": 16640, "epoch": 99} {"train_loss": -6.4553351402282715, "global_step": 16641, "epoch": 99} {"train_loss": -6.625638961791992, "global_step": 16642, "epoch": 99} {"train_loss": -6.396289348602295, "global_step": 16643, "epoch": 99} {"train_loss": -6.61229133605957, "global_step": 16644, "epoch": 99} {"train_loss": -6.778857707977295, "global_step": 16645, "epoch": 99} {"train_loss": -6.601614952087402, "global_step": 16646, "epoch": 99} {"train_loss": -6.567659854888916, "global_step": 16647, "epoch": 99} {"train_loss": -6.521064758300781, "global_step": 16648, "epoch": 99} {"train_loss": -6.300264835357666, "global_step": 16649, "epoch": 99} {"train_loss": -6.66931676864624, "global_step": 16650, "epoch": 99} {"train_loss": -6.5515851974487305, "global_step": 16651, "epoch": 99} {"train_loss": -6.818110466003418, "global_step": 16652, "epoch": 99} {"train_loss": -6.836592197418213, "global_step": 16653, "epoch": 99} {"train_loss": -6.533316135406494, "global_step": 16654, "epoch": 99} {"train_loss": -6.4132795333862305, "global_step": 16655, "epoch": 99} {"train_loss": -6.548642158508301, "global_step": 16656, "epoch": 99} {"train_loss": -6.535520553588867, "global_step": 16657, "epoch": 99} {"train_loss": -6.654145240783691, "global_step": 16658, "epoch": 99} {"train_loss": -6.471039772033691, "global_step": 16659, "epoch": 99} {"train_loss": -6.322477340698242, "global_step": 16660, "epoch": 99} {"train_loss": -6.5877532958984375, "global_step": 16661, "epoch": 99} {"train_loss": -6.324775218963623, "global_step": 16662, "epoch": 99} {"train_loss": -6.557814598083496, "global_step": 16663, "epoch": 99} {"train_loss": -6.418196201324463, "global_step": 16664, "epoch": 99} {"train_loss": -6.590937614440918, "global_step": 16665, "epoch": 99} {"train_loss": -6.617875576019287, "global_step": 16666, "epoch": 99} {"train_loss": -6.636384963989258, "global_step": 16667, "epoch": 99} {"train_loss": -6.509112358093262, "global_step": 16668, "epoch": 99} {"train_loss": -6.675210952758789, "global_step": 16669, "epoch": 99} {"train_loss": -6.728302001953125, "global_step": 16670, "epoch": 99} {"train_loss": -6.8608479499816895, "global_step": 16671, "epoch": 99} {"train_loss": -6.6117024421691895, "global_step": 16672, "epoch": 99} {"train_loss": -6.511394500732422, "global_step": 16673, "epoch": 99} {"train_loss": -6.527520179748535, "global_step": 16674, "epoch": 99} {"train_loss": -6.768880844116211, "global_step": 16675, "epoch": 99} {"train_loss": -6.566999435424805, "global_step": 16676, "epoch": 99} {"train_loss": -6.489064693450928, "global_step": 16677, "epoch": 99} {"train_loss": -6.5124945640563965, "global_step": 16678, "epoch": 99} {"train_loss": -6.246561050415039, "global_step": 16679, "epoch": 99} {"train_loss": -6.232982635498047, "global_step": 16680, "epoch": 99} {"train_loss": -6.626654624938965, "global_step": 16681, "epoch": 99} {"train_loss": -6.388718605041504, "global_step": 16682, "epoch": 99} {"train_loss": -6.5107927322387695, "global_step": 16683, "epoch": 99} {"train_loss": -6.492915630340576, "global_step": 16684, "epoch": 99} {"train_loss": -6.114116668701172, "global_step": 16685, "epoch": 99} {"train_loss": -6.717026233673096, "global_step": 16686, "epoch": 99} {"train_loss": -6.564114570617676, "global_step": 16687, "epoch": 99} {"train_loss": -6.463080883026123, "global_step": 16688, "epoch": 99} {"train_loss": -6.716156005859375, "global_step": 16689, "epoch": 99} {"train_loss": -6.514442443847656, "global_step": 16690, "epoch": 99} {"train_loss": -6.143681049346924, "global_step": 16691, "epoch": 99} {"train_loss": -6.343080520629883, "global_step": 16692, "epoch": 99} {"train_loss": -6.534819602966309, "global_step": 16693, "epoch": 99} {"train_loss": -6.43928337097168, "global_step": 16694, "epoch": 99} {"train_loss": -6.358683109283447, "global_step": 16695, "epoch": 99} {"train_loss": -6.523007392883301, "global_step": 16696, "epoch": 99} {"train_loss": -6.692412376403809, "global_step": 16697, "epoch": 99} {"train_loss": -6.395267963409424, "global_step": 16698, "epoch": 99} {"train_loss": -6.188693523406982, "global_step": 16699, "epoch": 99} {"train_loss": -6.219744682312012, "global_step": 16700, "epoch": 99} {"train_loss": -6.357517719268799, "global_step": 16701, "epoch": 99} {"train_loss": -6.31461238861084, "global_step": 16702, "epoch": 99} {"train_loss": -6.255747318267822, "global_step": 16703, "epoch": 99} {"train_loss": -6.520430564880371, "global_step": 16704, "epoch": 99} {"train_loss": -6.238659858703613, "global_step": 16705, "epoch": 99} {"train_loss": -6.063058376312256, "global_step": 16706, "epoch": 99} {"train_loss": -6.418543338775635, "global_step": 16707, "epoch": 99} {"train_loss": -6.199563980102539, "global_step": 16708, "epoch": 99} {"train_loss": -6.219013690948486, "global_step": 16709, "epoch": 99} {"train_loss": -6.159303188323975, "global_step": 16710, "epoch": 99} {"train_loss": -6.156425476074219, "global_step": 16711, "epoch": 99} {"train_loss": -6.309185981750488, "global_step": 16712, "epoch": 99} {"train_loss": -6.387285232543945, "global_step": 16713, "epoch": 99} {"train_loss": -6.348188400268555, "global_step": 16714, "epoch": 99} {"train_loss": -6.442173004150391, "global_step": 16715, "epoch": 99} {"train_loss": -6.654641628265381, "global_step": 16716, "epoch": 99} {"train_loss": -6.390558242797852, "global_step": 16717, "epoch": 99} {"train_loss": -6.5472636222839355, "global_step": 16718, "epoch": 99} {"train_loss": -6.45890998840332, "global_step": 16719, "epoch": 99} {"train_loss": -6.145598888397217, "global_step": 16720, "epoch": 99} {"train_loss": -6.573241233825684, "global_step": 16721, "epoch": 99} {"train_loss": -6.555861473083496, "global_step": 16722, "epoch": 99} {"train_loss": -6.595667839050293, "global_step": 16723, "epoch": 99} {"train_loss": -6.673312187194824, "global_step": 16724, "epoch": 99} {"train_loss": -6.546656608581543, "global_step": 16725, "epoch": 99} {"train_loss": -6.542453765869141, "global_step": 16726, "epoch": 99} {"train_loss": -6.496508598327637, "global_step": 16727, "epoch": 99} {"train_loss": -6.553606033325195, "global_step": 16728, "epoch": 99} {"train_loss": -6.321677207946777, "global_step": 16729, "epoch": 99} {"train_loss": -6.512451171875, "global_step": 16730, "epoch": 99} {"train_loss": -6.684365272521973, "global_step": 16731, "epoch": 99} {"train_loss": -6.598944664001465, "global_step": 16732, "epoch": 99} {"train_loss": -6.5394439697265625, "global_step": 16733, "epoch": 99} {"train_loss": -6.567720890045166, "global_step": 16734, "epoch": 99} {"train_loss": -6.602099418640137, "global_step": 16735, "epoch": 99} {"train_loss": -6.763199806213379, "global_step": 16736, "epoch": 99} {"train_loss": -6.711574554443359, "global_step": 16737, "epoch": 99} {"train_loss": -6.610119819641113, "global_step": 16738, "epoch": 99} {"train_loss": -6.863422393798828, "global_step": 16739, "epoch": 99} {"train_loss": -6.43230676651001, "global_step": 16740, "epoch": 99} {"train_loss": -6.506716728210449, "global_step": 16741, "epoch": 99} {"train_loss": -6.455470085144043, "global_step": 16742, "epoch": 99} {"train_loss": -6.642765998840332, "global_step": 16743, "epoch": 99} {"train_loss": -6.374301910400391, "global_step": 16744, "epoch": 99} {"train_loss": -6.51010274887085, "global_step": 16745, "epoch": 99} {"train_loss": -6.4282402992248535, "global_step": 16746, "epoch": 99} {"train_loss": -6.585309028625488, "global_step": 16747, "epoch": 99} {"train_loss": -6.389549732208252, "global_step": 16748, "epoch": 99} {"train_loss": -6.451291084289551, "global_step": 16749, "epoch": 99} {"train_loss": -6.6208295822143555, "global_step": 16750, "epoch": 99} {"train_loss": -6.645547866821289, "global_step": 16751, "epoch": 99} {"train_loss": -6.573390007019043, "global_step": 16752, "epoch": 99} {"train_loss": -6.523476600646973, "global_step": 16753, "epoch": 99} {"train_loss": -6.554779052734375, "global_step": 16754, "epoch": 99} {"train_loss": -6.525004863739014, "global_step": 16755, "epoch": 99} {"train_loss": -6.490325927734375, "global_step": 16756, "epoch": 99} {"train_loss": -6.501873970031738, "global_step": 16757, "epoch": 99} {"train_loss": -6.49998664855957, "global_step": 16758, "epoch": 99} {"train_loss": -6.6282267570495605, "global_step": 16759, "epoch": 99} {"train_loss": -6.416779518127441, "global_step": 16760, "epoch": 99} {"train_loss": -6.641997337341309, "global_step": 16761, "epoch": 99} {"train_loss": -6.402169704437256, "global_step": 16762, "epoch": 99} {"train_loss": -6.626946449279785, "global_step": 16763, "epoch": 99} {"train_loss": -6.470894813537598, "global_step": 16764, "epoch": 99} {"train_loss": -6.529575347900391, "global_step": 16765, "epoch": 99} {"train_loss": -6.4804840087890625, "global_step": 16766, "epoch": 99} {"train_loss": -6.426441192626953, "global_step": 16767, "epoch": 99} {"train_loss": -6.782451152801514, "global_step": 16768, "epoch": 99} {"train_loss": -6.700427055358887, "global_step": 16769, "epoch": 99} {"train_loss": -6.416109561920166, "global_step": 16770, "epoch": 99} {"train_loss": -6.504025459289551, "global_step": 16771, "epoch": 99} {"train_loss": -6.146048545837402, "global_step": 16772, "epoch": 99} {"train_loss": -6.513556480407715, "global_step": 16773, "epoch": 99} {"train_loss": -6.409762382507324, "global_step": 16774, "epoch": 99} {"train_loss": -6.531806945800781, "global_step": 16775, "epoch": 99} {"train_loss": -6.493325233459473, "global_step": 16776, "epoch": 99} {"train_loss": -6.379177570343018, "global_step": 16777, "epoch": 99} {"train_loss": -6.4843430519104, "global_step": 16778, "epoch": 99} {"train_loss": -6.566605567932129, "global_step": 16779, "epoch": 99} {"train_loss": -6.635481834411621, "global_step": 16780, "epoch": 99} {"train_loss": -6.415871620178223, "global_step": 16781, "epoch": 99} {"train_loss": -6.636381149291992, "global_step": 16782, "epoch": 99} {"train_loss": -6.531972885131836, "global_step": 16783, "epoch": 99} {"train_loss": -6.438384056091309, "global_step": 16784, "epoch": 99} {"train_loss": -6.230414390563965, "global_step": 16785, "epoch": 99} {"train_loss": -6.639293670654297, "global_step": 16786, "epoch": 99} {"train_loss": -6.690373420715332, "global_step": 16787, "epoch": 99} {"train_loss": -6.603747367858887, "global_step": 16788, "epoch": 99} {"train_loss": -6.495052337646484, "global_step": 16789, "epoch": 99} {"train_loss": -6.335186004638672, "global_step": 16790, "epoch": 99} {"train_loss": -6.511300086975098, "global_step": 16791, "epoch": 99} {"train_loss": -6.485785484313965, "global_step": 16792, "epoch": 99} {"train_loss": -6.599698066711426, "global_step": 16793, "epoch": 99} {"train_loss": -6.626874923706055, "global_step": 16794, "epoch": 99} {"train_loss": -6.773236274719238, "global_step": 16795, "epoch": 99} {"train_loss": -6.726502895355225, "global_step": 16796, "epoch": 99} {"train_loss": -6.061669826507568, "global_step": 16797, "epoch": 99} {"train_loss": -6.71033239364624, "global_step": 16798, "epoch": 99} {"train_loss": -6.499603050095694, "global_step": 16799, "epoch": 99, "val_loss": 233236.515625} {"train_loss": -6.464791297912598, "global_step": 16800, "epoch": 100} {"train_loss": -6.662145137786865, "global_step": 16801, "epoch": 100} {"train_loss": -6.470248699188232, "global_step": 16802, "epoch": 100} {"train_loss": -6.769452095031738, "global_step": 16803, "epoch": 100} {"train_loss": -6.283234596252441, "global_step": 16804, "epoch": 100} {"train_loss": -6.554482460021973, "global_step": 16805, "epoch": 100} {"train_loss": -6.360553741455078, "global_step": 16806, "epoch": 100} {"train_loss": -6.626540660858154, "global_step": 16807, "epoch": 100} {"train_loss": -6.761560440063477, "global_step": 16808, "epoch": 100} {"train_loss": -6.686319351196289, "global_step": 16809, "epoch": 100} {"train_loss": -6.706593990325928, "global_step": 16810, "epoch": 100} {"train_loss": -6.624798774719238, "global_step": 16811, "epoch": 100} {"train_loss": -6.606390953063965, "global_step": 16812, "epoch": 100} {"train_loss": -6.672314643859863, "global_step": 16813, "epoch": 100} {"train_loss": -6.7529168128967285, "global_step": 16814, "epoch": 100} {"train_loss": -6.633853912353516, "global_step": 16815, "epoch": 100} {"train_loss": -6.535355567932129, "global_step": 16816, "epoch": 100} {"train_loss": -6.3072614669799805, "global_step": 16817, "epoch": 100} {"train_loss": -6.632911682128906, "global_step": 16818, "epoch": 100} {"train_loss": -6.423012733459473, "global_step": 16819, "epoch": 100} {"train_loss": -6.661272048950195, "global_step": 16820, "epoch": 100} {"train_loss": -6.337141513824463, "global_step": 16821, "epoch": 100} {"train_loss": -6.564589023590088, "global_step": 16822, "epoch": 100} {"train_loss": -6.513452529907227, "global_step": 16823, "epoch": 100} {"train_loss": -6.574862480163574, "global_step": 16824, "epoch": 100} {"train_loss": -6.818982124328613, "global_step": 16825, "epoch": 100} {"train_loss": -6.681779861450195, "global_step": 16826, "epoch": 100} {"train_loss": -6.556460857391357, "global_step": 16827, "epoch": 100} {"train_loss": -6.5386176109313965, "global_step": 16828, "epoch": 100} {"train_loss": -6.4553351402282715, "global_step": 16829, "epoch": 100} {"train_loss": -6.5063886642456055, "global_step": 16830, "epoch": 100} {"train_loss": -6.649940490722656, "global_step": 16831, "epoch": 100} {"train_loss": -6.39249324798584, "global_step": 16832, "epoch": 100} {"train_loss": -6.727700233459473, "global_step": 16833, "epoch": 100} {"train_loss": -6.164867401123047, "global_step": 16834, "epoch": 100} {"train_loss": -6.508810997009277, "global_step": 16835, "epoch": 100} {"train_loss": -6.477900505065918, "global_step": 16836, "epoch": 100} {"train_loss": -6.754388809204102, "global_step": 16837, "epoch": 100} {"train_loss": -6.182106971740723, "global_step": 16838, "epoch": 100} {"train_loss": -6.472545623779297, "global_step": 16839, "epoch": 100} {"train_loss": -6.28560209274292, "global_step": 16840, "epoch": 100} {"train_loss": -6.502367973327637, "global_step": 16841, "epoch": 100} {"train_loss": -6.440760612487793, "global_step": 16842, "epoch": 100} {"train_loss": -6.348234176635742, "global_step": 16843, "epoch": 100} {"train_loss": -6.486063480377197, "global_step": 16844, "epoch": 100} {"train_loss": -6.447988986968994, "global_step": 16845, "epoch": 100} {"train_loss": -6.603542804718018, "global_step": 16846, "epoch": 100} {"train_loss": -6.412046909332275, "global_step": 16847, "epoch": 100} {"train_loss": -6.416048049926758, "global_step": 16848, "epoch": 100} {"train_loss": -6.783418655395508, "global_step": 16849, "epoch": 100} {"train_loss": -6.449455261230469, "global_step": 16850, "epoch": 100} {"train_loss": -6.702254295349121, "global_step": 16851, "epoch": 100} {"train_loss": -6.552066802978516, "global_step": 16852, "epoch": 100} {"train_loss": -6.751547336578369, "global_step": 16853, "epoch": 100} {"train_loss": -6.729747772216797, "global_step": 16854, "epoch": 100} {"train_loss": -6.717288017272949, "global_step": 16855, "epoch": 100} {"train_loss": -6.7211761474609375, "global_step": 16856, "epoch": 100} {"train_loss": -6.502353668212891, "global_step": 16857, "epoch": 100} {"train_loss": -6.440090179443359, "global_step": 16858, "epoch": 100} {"train_loss": -6.658083915710449, "global_step": 16859, "epoch": 100} {"train_loss": -6.763723373413086, "global_step": 16860, "epoch": 100} {"train_loss": -6.6443376541137695, "global_step": 16861, "epoch": 100} {"train_loss": -6.681106090545654, "global_step": 16862, "epoch": 100} {"train_loss": -6.595032215118408, "global_step": 16863, "epoch": 100} {"train_loss": -6.7800092697143555, "global_step": 16864, "epoch": 100} {"train_loss": -6.533783912658691, "global_step": 16865, "epoch": 100} {"train_loss": -6.792324542999268, "global_step": 16866, "epoch": 100} {"train_loss": -6.616059303283691, "global_step": 16867, "epoch": 100} {"train_loss": -6.763922691345215, "global_step": 16868, "epoch": 100} {"train_loss": -6.623212814331055, "global_step": 16869, "epoch": 100} {"train_loss": -6.444446563720703, "global_step": 16870, "epoch": 100} {"train_loss": -6.549810409545898, "global_step": 16871, "epoch": 100} {"train_loss": -6.334805011749268, "global_step": 16872, "epoch": 100} {"train_loss": -6.581630706787109, "global_step": 16873, "epoch": 100} {"train_loss": -6.4631805419921875, "global_step": 16874, "epoch": 100} {"train_loss": -6.323338508605957, "global_step": 16875, "epoch": 100} {"train_loss": -6.33510684967041, "global_step": 16876, "epoch": 100} {"train_loss": -6.391175270080566, "global_step": 16877, "epoch": 100} {"train_loss": -6.496875762939453, "global_step": 16878, "epoch": 100} {"train_loss": -6.1830902099609375, "global_step": 16879, "epoch": 100} {"train_loss": -6.3930253982543945, "global_step": 16880, "epoch": 100} {"train_loss": -6.463312149047852, "global_step": 16881, "epoch": 100} {"train_loss": -6.531722068786621, "global_step": 16882, "epoch": 100} {"train_loss": -6.495209217071533, "global_step": 16883, "epoch": 100} {"train_loss": -6.378835201263428, "global_step": 16884, "epoch": 100} {"train_loss": -6.56949520111084, "global_step": 16885, "epoch": 100} {"train_loss": -6.566793918609619, "global_step": 16886, "epoch": 100} {"train_loss": -6.465116500854492, "global_step": 16887, "epoch": 100} {"train_loss": -6.4467267990112305, "global_step": 16888, "epoch": 100} {"train_loss": -6.570339202880859, "global_step": 16889, "epoch": 100} {"train_loss": -6.612010955810547, "global_step": 16890, "epoch": 100} {"train_loss": -6.476195812225342, "global_step": 16891, "epoch": 100} {"train_loss": -6.817481994628906, "global_step": 16892, "epoch": 100} {"train_loss": -6.6851654052734375, "global_step": 16893, "epoch": 100} {"train_loss": -6.877566337585449, "global_step": 16894, "epoch": 100} {"train_loss": -6.734900951385498, "global_step": 16895, "epoch": 100} {"train_loss": -6.87453556060791, "global_step": 16896, "epoch": 100} {"train_loss": -6.5475263595581055, "global_step": 16897, "epoch": 100} {"train_loss": -6.520983695983887, "global_step": 16898, "epoch": 100} {"train_loss": -6.842166423797607, "global_step": 16899, "epoch": 100} {"train_loss": -6.751466751098633, "global_step": 16900, "epoch": 100} {"train_loss": -6.402480125427246, "global_step": 16901, "epoch": 100} {"train_loss": -6.631138801574707, "global_step": 16902, "epoch": 100} {"train_loss": -6.674551010131836, "global_step": 16903, "epoch": 100} {"train_loss": -6.595853805541992, "global_step": 16904, "epoch": 100} {"train_loss": -6.603140354156494, "global_step": 16905, "epoch": 100} {"train_loss": -6.583036422729492, "global_step": 16906, "epoch": 100} {"train_loss": -6.461062431335449, "global_step": 16907, "epoch": 100} {"train_loss": -6.485002517700195, "global_step": 16908, "epoch": 100} {"train_loss": -6.266841411590576, "global_step": 16909, "epoch": 100} {"train_loss": -6.4088029861450195, "global_step": 16910, "epoch": 100} {"train_loss": -6.431488037109375, "global_step": 16911, "epoch": 100} {"train_loss": -6.161996841430664, "global_step": 16912, "epoch": 100} {"train_loss": -6.772851467132568, "global_step": 16913, "epoch": 100} {"train_loss": -6.394386291503906, "global_step": 16914, "epoch": 100} {"train_loss": -6.437864303588867, "global_step": 16915, "epoch": 100} {"train_loss": -6.558877468109131, "global_step": 16916, "epoch": 100} {"train_loss": -6.4359941482543945, "global_step": 16917, "epoch": 100} {"train_loss": -6.739034652709961, "global_step": 16918, "epoch": 100} {"train_loss": -6.633201599121094, "global_step": 16919, "epoch": 100} {"train_loss": -6.675925254821777, "global_step": 16920, "epoch": 100} {"train_loss": -6.720913887023926, "global_step": 16921, "epoch": 100} {"train_loss": -6.394340515136719, "global_step": 16922, "epoch": 100} {"train_loss": -6.424010276794434, "global_step": 16923, "epoch": 100} {"train_loss": -6.606825351715088, "global_step": 16924, "epoch": 100} {"train_loss": -6.7271504402160645, "global_step": 16925, "epoch": 100} {"train_loss": -6.563484191894531, "global_step": 16926, "epoch": 100} {"train_loss": -6.719804286956787, "global_step": 16927, "epoch": 100} {"train_loss": -6.713819980621338, "global_step": 16928, "epoch": 100} {"train_loss": -6.56588077545166, "global_step": 16929, "epoch": 100} {"train_loss": -6.634310245513916, "global_step": 16930, "epoch": 100} {"train_loss": -6.736065864562988, "global_step": 16931, "epoch": 100} {"train_loss": -6.628950119018555, "global_step": 16932, "epoch": 100} {"train_loss": -6.669943332672119, "global_step": 16933, "epoch": 100} {"train_loss": -6.696231842041016, "global_step": 16934, "epoch": 100} {"train_loss": -6.635778903961182, "global_step": 16935, "epoch": 100} {"train_loss": -6.525815963745117, "global_step": 16936, "epoch": 100} {"train_loss": -6.425924301147461, "global_step": 16937, "epoch": 100} {"train_loss": -6.653873443603516, "global_step": 16938, "epoch": 100} {"train_loss": -6.548701286315918, "global_step": 16939, "epoch": 100} {"train_loss": -6.572330474853516, "global_step": 16940, "epoch": 100} {"train_loss": -6.495776653289795, "global_step": 16941, "epoch": 100} {"train_loss": -6.473688125610352, "global_step": 16942, "epoch": 100} {"train_loss": -6.338338851928711, "global_step": 16943, "epoch": 100} {"train_loss": -6.291849136352539, "global_step": 16944, "epoch": 100} {"train_loss": -6.546521186828613, "global_step": 16945, "epoch": 100} {"train_loss": -6.523127555847168, "global_step": 16946, "epoch": 100} {"train_loss": -6.3731231689453125, "global_step": 16947, "epoch": 100} {"train_loss": -6.280253887176514, "global_step": 16948, "epoch": 100} {"train_loss": -6.3421783447265625, "global_step": 16949, "epoch": 100} {"train_loss": -6.408979415893555, "global_step": 16950, "epoch": 100} {"train_loss": -6.401835918426514, "global_step": 16951, "epoch": 100} {"train_loss": -6.312316417694092, "global_step": 16952, "epoch": 100} {"train_loss": -6.482386112213135, "global_step": 16953, "epoch": 100} {"train_loss": -6.476960182189941, "global_step": 16954, "epoch": 100} {"train_loss": -6.512858867645264, "global_step": 16955, "epoch": 100} {"train_loss": -6.6552958488464355, "global_step": 16956, "epoch": 100} {"train_loss": -6.482113838195801, "global_step": 16957, "epoch": 100} {"train_loss": -6.480666637420654, "global_step": 16958, "epoch": 100} {"train_loss": -6.305865287780762, "global_step": 16959, "epoch": 100} {"train_loss": -6.66107177734375, "global_step": 16960, "epoch": 100} {"train_loss": -6.578574180603027, "global_step": 16961, "epoch": 100} {"train_loss": -6.611309051513672, "global_step": 16962, "epoch": 100} {"train_loss": -6.471342086791992, "global_step": 16963, "epoch": 100} {"train_loss": -6.7796173095703125, "global_step": 16964, "epoch": 100} {"train_loss": -6.55355167388916, "global_step": 16965, "epoch": 100} {"train_loss": -6.311591148376465, "global_step": 16966, "epoch": 100} {"train_loss": -6.544959065460024, "global_step": 16967, "epoch": 100, "train/sim_max_reward_0": 0.9014813612399079, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.9687948603151705, "train/sim_max_reward_3": 0.6638690974962294, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.5614940199580066, "test/sim_max_reward_4400000": 0.9737333889287515, "test/sim_max_reward_4400001": 0.9409259356587647, "test/sim_max_reward_4400002": 0.9663587521790115, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.4238486153503816, "test/sim_max_reward_4400005": 0.8902571359764189, "test/sim_max_reward_4400006": 0.02296499692509576, "test/sim_max_reward_4400007": 0.6679328165209544, "test/sim_max_reward_4400008": 0.5886040163513789, "test/sim_max_reward_4400009": 0.44105283134367007, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.5746755114354053, "test/sim_max_reward_4400012": 0.9990235327287853, "test/sim_max_reward_4400013": 0.9902224411319711, "test/sim_max_reward_4400014": 0.9537142348673316, "test/sim_max_reward_4400015": 0.38652351024533943, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9481061633686021, "test/sim_max_reward_4400019": 0.7166591630871447, "test/sim_max_reward_4400020": 1.4768089205654875e-05, "test/sim_max_reward_4400021": 0.5396439535245564, "test/sim_max_reward_4400022": 0.9588619400381959, "test/sim_max_reward_4400023": 0.15263797236258975, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6610345876808571, "test/sim_max_reward_4400026": 0.912149628183726, "test/sim_max_reward_4400027": 0.7430506982088435, "test/sim_max_reward_4400028": 0.7123475515047445, "test/sim_max_reward_4400029": 0.49099911514206673, "test/sim_max_reward_4400030": 0.9954527333444333, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.07453473220067336, "test/sim_max_reward_4400033": 0.15895591870090875, "test/sim_max_reward_4400034": 0.9938313808992622, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.37176302275357714, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.0, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.41682524437379403, "test/sim_max_reward_4400041": 0.37632511866127377, "test/sim_max_reward_4400042": 0.9864228401341059, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.9804139704759094, "test/sim_max_reward_4400045": 0.3563026148811053, "test/sim_max_reward_4400046": 0.9555627180259586, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.8492732231682191, "test/mean_score": 0.5645066867229326, "val_loss": 231163.53125, "train_action_mse_error": 27.859560012817383} {"train_loss": -6.331469535827637, "global_step": 16968, "epoch": 101} {"train_loss": -6.546533107757568, "global_step": 16969, "epoch": 101} {"train_loss": -6.329906940460205, "global_step": 16970, "epoch": 101} {"train_loss": -6.408241271972656, "global_step": 16971, "epoch": 101} {"train_loss": -6.411578178405762, "global_step": 16972, "epoch": 101} {"train_loss": -6.25166654586792, "global_step": 16973, "epoch": 101} {"train_loss": -6.554713249206543, "global_step": 16974, "epoch": 101} {"train_loss": -6.4365339279174805, "global_step": 16975, "epoch": 101} {"train_loss": -6.412658214569092, "global_step": 16976, "epoch": 101} {"train_loss": -6.587810516357422, "global_step": 16977, "epoch": 101} {"train_loss": -6.391112327575684, "global_step": 16978, "epoch": 101} {"train_loss": -6.42138671875, "global_step": 16979, "epoch": 101} {"train_loss": -6.7367262840271, "global_step": 16980, "epoch": 101} {"train_loss": -6.748480796813965, "global_step": 16981, "epoch": 101} {"train_loss": -6.56003475189209, "global_step": 16982, "epoch": 101} {"train_loss": -6.296871185302734, "global_step": 16983, "epoch": 101} {"train_loss": -6.66810417175293, "global_step": 16984, "epoch": 101} {"train_loss": -6.439043045043945, "global_step": 16985, "epoch": 101} {"train_loss": -6.511109352111816, "global_step": 16986, "epoch": 101} {"train_loss": -6.472195148468018, "global_step": 16987, "epoch": 101} {"train_loss": -6.559883117675781, "global_step": 16988, "epoch": 101} {"train_loss": -6.5132880210876465, "global_step": 16989, "epoch": 101} {"train_loss": -6.519249439239502, "global_step": 16990, "epoch": 101} {"train_loss": -6.675999641418457, "global_step": 16991, "epoch": 101} {"train_loss": -6.097167015075684, "global_step": 16992, "epoch": 101} {"train_loss": -6.686487197875977, "global_step": 16993, "epoch": 101} {"train_loss": -6.574466705322266, "global_step": 16994, "epoch": 101} {"train_loss": -6.653805732727051, "global_step": 16995, "epoch": 101} {"train_loss": -6.294988632202148, "global_step": 16996, "epoch": 101} {"train_loss": -6.538268089294434, "global_step": 16997, "epoch": 101} {"train_loss": -6.568708419799805, "global_step": 16998, "epoch": 101} {"train_loss": -6.559844970703125, "global_step": 16999, "epoch": 101} {"train_loss": -6.395698547363281, "global_step": 17000, "epoch": 101} {"train_loss": -6.622844219207764, "global_step": 17001, "epoch": 101} {"train_loss": -6.25902795791626, "global_step": 17002, "epoch": 101} {"train_loss": -6.568062782287598, "global_step": 17003, "epoch": 101} {"train_loss": -6.390771865844727, "global_step": 17004, "epoch": 101} {"train_loss": -6.448829650878906, "global_step": 17005, "epoch": 101} {"train_loss": -6.387330055236816, "global_step": 17006, "epoch": 101} {"train_loss": -6.268000602722168, "global_step": 17007, "epoch": 101} {"train_loss": -6.470950126647949, "global_step": 17008, "epoch": 101} {"train_loss": -6.52928352355957, "global_step": 17009, "epoch": 101} {"train_loss": -6.6042985916137695, "global_step": 17010, "epoch": 101} {"train_loss": -6.737282752990723, "global_step": 17011, "epoch": 101} {"train_loss": -6.605495452880859, "global_step": 17012, "epoch": 101} {"train_loss": -6.755387783050537, "global_step": 17013, "epoch": 101} {"train_loss": -6.544474124908447, "global_step": 17014, "epoch": 101} {"train_loss": -6.559599876403809, "global_step": 17015, "epoch": 101} {"train_loss": -6.5194010734558105, "global_step": 17016, "epoch": 101} {"train_loss": -6.577263355255127, "global_step": 17017, "epoch": 101} {"train_loss": -6.683592796325684, "global_step": 17018, "epoch": 101} {"train_loss": -6.653324604034424, "global_step": 17019, "epoch": 101} {"train_loss": -6.771958351135254, "global_step": 17020, "epoch": 101} {"train_loss": -6.510912895202637, "global_step": 17021, "epoch": 101} {"train_loss": -6.821589469909668, "global_step": 17022, "epoch": 101} {"train_loss": -6.38587760925293, "global_step": 17023, "epoch": 101} {"train_loss": -6.508538246154785, "global_step": 17024, "epoch": 101} {"train_loss": -6.412738800048828, "global_step": 17025, "epoch": 101} {"train_loss": -6.545462608337402, "global_step": 17026, "epoch": 101} {"train_loss": -6.590339183807373, "global_step": 17027, "epoch": 101} {"train_loss": -6.614838600158691, "global_step": 17028, "epoch": 101} {"train_loss": -6.124757766723633, "global_step": 17029, "epoch": 101} {"train_loss": -6.57895040512085, "global_step": 17030, "epoch": 101} {"train_loss": -6.42950439453125, "global_step": 17031, "epoch": 101} {"train_loss": -6.4821953773498535, "global_step": 17032, "epoch": 101} {"train_loss": -6.406560897827148, "global_step": 17033, "epoch": 101} {"train_loss": -6.556709289550781, "global_step": 17034, "epoch": 101} {"train_loss": -6.348476409912109, "global_step": 17035, "epoch": 101} {"train_loss": -6.419473648071289, "global_step": 17036, "epoch": 101} {"train_loss": -6.265407562255859, "global_step": 17037, "epoch": 101} {"train_loss": -6.5612897872924805, "global_step": 17038, "epoch": 101} {"train_loss": -6.315707206726074, "global_step": 17039, "epoch": 101} {"train_loss": -6.7088189125061035, "global_step": 17040, "epoch": 101} {"train_loss": -6.651627540588379, "global_step": 17041, "epoch": 101} {"train_loss": -6.320830821990967, "global_step": 17042, "epoch": 101} {"train_loss": -6.478672027587891, "global_step": 17043, "epoch": 101} {"train_loss": -6.388996124267578, "global_step": 17044, "epoch": 101} {"train_loss": -6.541220664978027, "global_step": 17045, "epoch": 101} {"train_loss": -6.427521705627441, "global_step": 17046, "epoch": 101} {"train_loss": -6.710202693939209, "global_step": 17047, "epoch": 101} {"train_loss": -6.324884414672852, "global_step": 17048, "epoch": 101} {"train_loss": -6.626910209655762, "global_step": 17049, "epoch": 101} {"train_loss": -6.47170352935791, "global_step": 17050, "epoch": 101} {"train_loss": -6.511744976043701, "global_step": 17051, "epoch": 101} {"train_loss": -6.430224418640137, "global_step": 17052, "epoch": 101} {"train_loss": -6.32158088684082, "global_step": 17053, "epoch": 101} {"train_loss": -6.685332298278809, "global_step": 17054, "epoch": 101} {"train_loss": -5.924775123596191, "global_step": 17055, "epoch": 101} {"train_loss": -6.643267631530762, "global_step": 17056, "epoch": 101} {"train_loss": -6.0593366622924805, "global_step": 17057, "epoch": 101} {"train_loss": -6.511878967285156, "global_step": 17058, "epoch": 101} {"train_loss": -6.221895217895508, "global_step": 17059, "epoch": 101} {"train_loss": -6.269956111907959, "global_step": 17060, "epoch": 101} {"train_loss": -6.497599124908447, "global_step": 17061, "epoch": 101} {"train_loss": -6.323554992675781, "global_step": 17062, "epoch": 101} {"train_loss": -6.293079376220703, "global_step": 17063, "epoch": 101} {"train_loss": -6.336523532867432, "global_step": 17064, "epoch": 101} {"train_loss": -6.610306739807129, "global_step": 17065, "epoch": 101} {"train_loss": -6.143518447875977, "global_step": 17066, "epoch": 101} {"train_loss": -6.408603668212891, "global_step": 17067, "epoch": 101} {"train_loss": -6.546573638916016, "global_step": 17068, "epoch": 101} {"train_loss": -6.331679821014404, "global_step": 17069, "epoch": 101} {"train_loss": -6.60767936706543, "global_step": 17070, "epoch": 101} {"train_loss": -6.637742519378662, "global_step": 17071, "epoch": 101} {"train_loss": -6.533604621887207, "global_step": 17072, "epoch": 101} {"train_loss": -6.683894634246826, "global_step": 17073, "epoch": 101} {"train_loss": -6.515698432922363, "global_step": 17074, "epoch": 101} {"train_loss": -6.559000015258789, "global_step": 17075, "epoch": 101} {"train_loss": -6.458873748779297, "global_step": 17076, "epoch": 101} {"train_loss": -6.508749961853027, "global_step": 17077, "epoch": 101} {"train_loss": -6.522188186645508, "global_step": 17078, "epoch": 101} {"train_loss": -6.435659885406494, "global_step": 17079, "epoch": 101} {"train_loss": -6.557674407958984, "global_step": 17080, "epoch": 101} {"train_loss": -6.452282905578613, "global_step": 17081, "epoch": 101} {"train_loss": -6.385469436645508, "global_step": 17082, "epoch": 101} {"train_loss": -6.4810380935668945, "global_step": 17083, "epoch": 101} {"train_loss": -6.360544204711914, "global_step": 17084, "epoch": 101} {"train_loss": -6.470556735992432, "global_step": 17085, "epoch": 101} {"train_loss": -6.41084098815918, "global_step": 17086, "epoch": 101} {"train_loss": -6.677432060241699, "global_step": 17087, "epoch": 101} {"train_loss": -6.333621978759766, "global_step": 17088, "epoch": 101} {"train_loss": -6.654193878173828, "global_step": 17089, "epoch": 101} {"train_loss": -6.360822677612305, "global_step": 17090, "epoch": 101} {"train_loss": -6.497648239135742, "global_step": 17091, "epoch": 101} {"train_loss": -6.363346099853516, "global_step": 17092, "epoch": 101} {"train_loss": -6.407263278961182, "global_step": 17093, "epoch": 101} {"train_loss": -6.516242504119873, "global_step": 17094, "epoch": 101} {"train_loss": -6.41718864440918, "global_step": 17095, "epoch": 101} {"train_loss": -6.451664924621582, "global_step": 17096, "epoch": 101} {"train_loss": -6.364969253540039, "global_step": 17097, "epoch": 101} {"train_loss": -6.283953666687012, "global_step": 17098, "epoch": 101} {"train_loss": -6.469025135040283, "global_step": 17099, "epoch": 101} {"train_loss": -6.558055877685547, "global_step": 17100, "epoch": 101} {"train_loss": -6.595256805419922, "global_step": 17101, "epoch": 101} {"train_loss": -6.717879295349121, "global_step": 17102, "epoch": 101} {"train_loss": -6.462679386138916, "global_step": 17103, "epoch": 101} {"train_loss": -6.481988906860352, "global_step": 17104, "epoch": 101} {"train_loss": -6.491433143615723, "global_step": 17105, "epoch": 101} {"train_loss": -6.499455451965332, "global_step": 17106, "epoch": 101} {"train_loss": -6.439947605133057, "global_step": 17107, "epoch": 101} {"train_loss": -6.661134719848633, "global_step": 17108, "epoch": 101} {"train_loss": -6.641851902008057, "global_step": 17109, "epoch": 101} {"train_loss": -6.792684078216553, "global_step": 17110, "epoch": 101} {"train_loss": -6.527473449707031, "global_step": 17111, "epoch": 101} {"train_loss": -6.5480451583862305, "global_step": 17112, "epoch": 101} {"train_loss": -6.363166809082031, "global_step": 17113, "epoch": 101} {"train_loss": -6.651671886444092, "global_step": 17114, "epoch": 101} {"train_loss": -6.384043216705322, "global_step": 17115, "epoch": 101} {"train_loss": -6.502735137939453, "global_step": 17116, "epoch": 101} {"train_loss": -6.291760444641113, "global_step": 17117, "epoch": 101} {"train_loss": -6.551741600036621, "global_step": 17118, "epoch": 101} {"train_loss": -6.537228584289551, "global_step": 17119, "epoch": 101} {"train_loss": -6.885067939758301, "global_step": 17120, "epoch": 101} {"train_loss": -6.105987548828125, "global_step": 17121, "epoch": 101} {"train_loss": -6.384706497192383, "global_step": 17122, "epoch": 101} {"train_loss": -6.463688373565674, "global_step": 17123, "epoch": 101} {"train_loss": -6.779962539672852, "global_step": 17124, "epoch": 101} {"train_loss": -6.52348518371582, "global_step": 17125, "epoch": 101} {"train_loss": -6.492568016052246, "global_step": 17126, "epoch": 101} {"train_loss": -6.409000396728516, "global_step": 17127, "epoch": 101} {"train_loss": -6.735183238983154, "global_step": 17128, "epoch": 101} {"train_loss": -6.591041564941406, "global_step": 17129, "epoch": 101} {"train_loss": -6.708749294281006, "global_step": 17130, "epoch": 101} {"train_loss": -6.53157377243042, "global_step": 17131, "epoch": 101} {"train_loss": -6.605269432067871, "global_step": 17132, "epoch": 101} {"train_loss": -6.761410713195801, "global_step": 17133, "epoch": 101} {"train_loss": -6.451715469360352, "global_step": 17134, "epoch": 101} {"train_loss": -6.4919721853165395, "global_step": 17135, "epoch": 101, "val_loss": 232162.34375} {"train_loss": -6.117295742034912, "global_step": 17136, "epoch": 102} {"train_loss": -6.590253829956055, "global_step": 17137, "epoch": 102} {"train_loss": -6.460200786590576, "global_step": 17138, "epoch": 102} {"train_loss": -6.666680335998535, "global_step": 17139, "epoch": 102} {"train_loss": -6.724556922912598, "global_step": 17140, "epoch": 102} {"train_loss": -6.602241516113281, "global_step": 17141, "epoch": 102} {"train_loss": -6.634259223937988, "global_step": 17142, "epoch": 102} {"train_loss": -6.421406269073486, "global_step": 17143, "epoch": 102} {"train_loss": -6.498419284820557, "global_step": 17144, "epoch": 102} {"train_loss": -6.846942901611328, "global_step": 17145, "epoch": 102} {"train_loss": -6.909446716308594, "global_step": 17146, "epoch": 102} {"train_loss": -6.5372090339660645, "global_step": 17147, "epoch": 102} {"train_loss": -6.718774795532227, "global_step": 17148, "epoch": 102} {"train_loss": -6.787579536437988, "global_step": 17149, "epoch": 102} {"train_loss": -6.518383026123047, "global_step": 17150, "epoch": 102} {"train_loss": -6.482669353485107, "global_step": 17151, "epoch": 102} {"train_loss": -6.5966877937316895, "global_step": 17152, "epoch": 102} {"train_loss": -6.645569324493408, "global_step": 17153, "epoch": 102} {"train_loss": -6.688294410705566, "global_step": 17154, "epoch": 102} {"train_loss": -6.8768510818481445, "global_step": 17155, "epoch": 102} {"train_loss": -6.758885383605957, "global_step": 17156, "epoch": 102} {"train_loss": -6.859436988830566, "global_step": 17157, "epoch": 102} {"train_loss": -6.5226545333862305, "global_step": 17158, "epoch": 102} {"train_loss": -6.820794105529785, "global_step": 17159, "epoch": 102} {"train_loss": -6.338108539581299, "global_step": 17160, "epoch": 102} {"train_loss": -6.805941581726074, "global_step": 17161, "epoch": 102} {"train_loss": -6.65945291519165, "global_step": 17162, "epoch": 102} {"train_loss": -6.7644195556640625, "global_step": 17163, "epoch": 102} {"train_loss": -6.517736911773682, "global_step": 17164, "epoch": 102} {"train_loss": -6.554612636566162, "global_step": 17165, "epoch": 102} {"train_loss": -6.709432125091553, "global_step": 17166, "epoch": 102} {"train_loss": -6.744809150695801, "global_step": 17167, "epoch": 102} {"train_loss": -6.682950019836426, "global_step": 17168, "epoch": 102} {"train_loss": -6.414149284362793, "global_step": 17169, "epoch": 102} {"train_loss": -6.636260032653809, "global_step": 17170, "epoch": 102} {"train_loss": -6.510170936584473, "global_step": 17171, "epoch": 102} {"train_loss": -6.4719133377075195, "global_step": 17172, "epoch": 102} {"train_loss": -6.346630096435547, "global_step": 17173, "epoch": 102} {"train_loss": -6.742103576660156, "global_step": 17174, "epoch": 102} {"train_loss": -6.284843444824219, "global_step": 17175, "epoch": 102} {"train_loss": -6.407048225402832, "global_step": 17176, "epoch": 102} {"train_loss": -6.535910129547119, "global_step": 17177, "epoch": 102} {"train_loss": -6.653926849365234, "global_step": 17178, "epoch": 102} {"train_loss": -6.568085670471191, "global_step": 17179, "epoch": 102} {"train_loss": -6.430058479309082, "global_step": 17180, "epoch": 102} {"train_loss": -6.658293724060059, "global_step": 17181, "epoch": 102} {"train_loss": -6.5304036140441895, "global_step": 17182, "epoch": 102} {"train_loss": -6.613763809204102, "global_step": 17183, "epoch": 102} {"train_loss": -6.786452293395996, "global_step": 17184, "epoch": 102} {"train_loss": -6.423303604125977, "global_step": 17185, "epoch": 102} {"train_loss": -6.7282819747924805, "global_step": 17186, "epoch": 102} {"train_loss": -6.705394268035889, "global_step": 17187, "epoch": 102} {"train_loss": -6.717251777648926, "global_step": 17188, "epoch": 102} {"train_loss": -6.335564136505127, "global_step": 17189, "epoch": 102} {"train_loss": -6.589351177215576, "global_step": 17190, "epoch": 102} {"train_loss": -6.710643291473389, "global_step": 17191, "epoch": 102} {"train_loss": -6.68408203125, "global_step": 17192, "epoch": 102} {"train_loss": -6.451746940612793, "global_step": 17193, "epoch": 102} {"train_loss": -6.643712043762207, "global_step": 17194, "epoch": 102} {"train_loss": -6.578282356262207, "global_step": 17195, "epoch": 102} {"train_loss": -6.679311752319336, "global_step": 17196, "epoch": 102} {"train_loss": -6.686392307281494, "global_step": 17197, "epoch": 102} {"train_loss": -6.559231758117676, "global_step": 17198, "epoch": 102} {"train_loss": -6.929980278015137, "global_step": 17199, "epoch": 102} {"train_loss": -6.446381568908691, "global_step": 17200, "epoch": 102} {"train_loss": -6.668844223022461, "global_step": 17201, "epoch": 102} {"train_loss": -6.721686363220215, "global_step": 17202, "epoch": 102} {"train_loss": -6.980849742889404, "global_step": 17203, "epoch": 102} {"train_loss": -6.63946008682251, "global_step": 17204, "epoch": 102} {"train_loss": -6.536012649536133, "global_step": 17205, "epoch": 102} {"train_loss": -6.335273742675781, "global_step": 17206, "epoch": 102} {"train_loss": -6.770260810852051, "global_step": 17207, "epoch": 102} {"train_loss": -6.395936012268066, "global_step": 17208, "epoch": 102} {"train_loss": -6.57855224609375, "global_step": 17209, "epoch": 102} {"train_loss": -6.590038776397705, "global_step": 17210, "epoch": 102} {"train_loss": -6.524970531463623, "global_step": 17211, "epoch": 102} {"train_loss": -6.720490455627441, "global_step": 17212, "epoch": 102} {"train_loss": -6.660094261169434, "global_step": 17213, "epoch": 102} {"train_loss": -6.59946870803833, "global_step": 17214, "epoch": 102} {"train_loss": -6.629995346069336, "global_step": 17215, "epoch": 102} {"train_loss": -6.579036235809326, "global_step": 17216, "epoch": 102} {"train_loss": -6.710842132568359, "global_step": 17217, "epoch": 102} {"train_loss": -6.964668273925781, "global_step": 17218, "epoch": 102} {"train_loss": -6.980363845825195, "global_step": 17219, "epoch": 102} {"train_loss": -6.847499370574951, "global_step": 17220, "epoch": 102} {"train_loss": -6.67704963684082, "global_step": 17221, "epoch": 102} {"train_loss": -6.745181560516357, "global_step": 17222, "epoch": 102} {"train_loss": -6.7122015953063965, "global_step": 17223, "epoch": 102} {"train_loss": -6.596158027648926, "global_step": 17224, "epoch": 102} {"train_loss": -6.599768161773682, "global_step": 17225, "epoch": 102} {"train_loss": -6.534564018249512, "global_step": 17226, "epoch": 102} {"train_loss": -6.501280307769775, "global_step": 17227, "epoch": 102} {"train_loss": -6.799842357635498, "global_step": 17228, "epoch": 102} {"train_loss": -6.5956621170043945, "global_step": 17229, "epoch": 102} {"train_loss": -6.620454788208008, "global_step": 17230, "epoch": 102} {"train_loss": -6.939243316650391, "global_step": 17231, "epoch": 102} {"train_loss": -6.791232585906982, "global_step": 17232, "epoch": 102} {"train_loss": -6.384057521820068, "global_step": 17233, "epoch": 102} {"train_loss": -6.47835111618042, "global_step": 17234, "epoch": 102} {"train_loss": -6.734271049499512, "global_step": 17235, "epoch": 102} {"train_loss": -6.442991256713867, "global_step": 17236, "epoch": 102} {"train_loss": -6.384860038757324, "global_step": 17237, "epoch": 102} {"train_loss": -6.714930057525635, "global_step": 17238, "epoch": 102} {"train_loss": -6.249061584472656, "global_step": 17239, "epoch": 102} {"train_loss": -6.409307956695557, "global_step": 17240, "epoch": 102} {"train_loss": -6.563168525695801, "global_step": 17241, "epoch": 102} {"train_loss": -6.1381025314331055, "global_step": 17242, "epoch": 102} {"train_loss": -6.811161041259766, "global_step": 17243, "epoch": 102} {"train_loss": -6.427492141723633, "global_step": 17244, "epoch": 102} {"train_loss": -6.444241523742676, "global_step": 17245, "epoch": 102} {"train_loss": -6.285195350646973, "global_step": 17246, "epoch": 102} {"train_loss": -6.165677070617676, "global_step": 17247, "epoch": 102} {"train_loss": -6.3857526779174805, "global_step": 17248, "epoch": 102} {"train_loss": -6.359194755554199, "global_step": 17249, "epoch": 102} {"train_loss": -6.453078746795654, "global_step": 17250, "epoch": 102} {"train_loss": -6.448707103729248, "global_step": 17251, "epoch": 102} {"train_loss": -6.457386493682861, "global_step": 17252, "epoch": 102} {"train_loss": -6.526595592498779, "global_step": 17253, "epoch": 102} {"train_loss": -6.425699710845947, "global_step": 17254, "epoch": 102} {"train_loss": -6.559338092803955, "global_step": 17255, "epoch": 102} {"train_loss": -6.343911170959473, "global_step": 17256, "epoch": 102} {"train_loss": -6.516910552978516, "global_step": 17257, "epoch": 102} {"train_loss": -6.383092880249023, "global_step": 17258, "epoch": 102} {"train_loss": -6.701625823974609, "global_step": 17259, "epoch": 102} {"train_loss": -6.75775671005249, "global_step": 17260, "epoch": 102} {"train_loss": -6.652441501617432, "global_step": 17261, "epoch": 102} {"train_loss": -6.437022686004639, "global_step": 17262, "epoch": 102} {"train_loss": -6.536063194274902, "global_step": 17263, "epoch": 102} {"train_loss": -6.627139568328857, "global_step": 17264, "epoch": 102} {"train_loss": -6.490407943725586, "global_step": 17265, "epoch": 102} {"train_loss": -6.721468448638916, "global_step": 17266, "epoch": 102} {"train_loss": -6.793880462646484, "global_step": 17267, "epoch": 102} {"train_loss": -6.867780685424805, "global_step": 17268, "epoch": 102} {"train_loss": -6.797669410705566, "global_step": 17269, "epoch": 102} {"train_loss": -6.59977388381958, "global_step": 17270, "epoch": 102} {"train_loss": -6.918503761291504, "global_step": 17271, "epoch": 102} {"train_loss": -6.794620513916016, "global_step": 17272, "epoch": 102} {"train_loss": -6.751564025878906, "global_step": 17273, "epoch": 102} {"train_loss": -6.607610702514648, "global_step": 17274, "epoch": 102} {"train_loss": -6.4414215087890625, "global_step": 17275, "epoch": 102} {"train_loss": -6.435563564300537, "global_step": 17276, "epoch": 102} {"train_loss": -6.543938636779785, "global_step": 17277, "epoch": 102} {"train_loss": -6.477582931518555, "global_step": 17278, "epoch": 102} {"train_loss": -6.261117458343506, "global_step": 17279, "epoch": 102} {"train_loss": -6.3444414138793945, "global_step": 17280, "epoch": 102} {"train_loss": -6.641368865966797, "global_step": 17281, "epoch": 102} {"train_loss": -6.340810775756836, "global_step": 17282, "epoch": 102} {"train_loss": -6.323033809661865, "global_step": 17283, "epoch": 102} {"train_loss": -6.571262359619141, "global_step": 17284, "epoch": 102} {"train_loss": -6.455277919769287, "global_step": 17285, "epoch": 102} {"train_loss": -6.464265823364258, "global_step": 17286, "epoch": 102} {"train_loss": -6.431056976318359, "global_step": 17287, "epoch": 102} {"train_loss": -6.484153747558594, "global_step": 17288, "epoch": 102} {"train_loss": -6.300879955291748, "global_step": 17289, "epoch": 102} {"train_loss": -6.407361030578613, "global_step": 17290, "epoch": 102} {"train_loss": -6.396446228027344, "global_step": 17291, "epoch": 102} {"train_loss": -6.674965858459473, "global_step": 17292, "epoch": 102} {"train_loss": -6.602924346923828, "global_step": 17293, "epoch": 102} {"train_loss": -6.706319808959961, "global_step": 17294, "epoch": 102} {"train_loss": -6.5904622077941895, "global_step": 17295, "epoch": 102} {"train_loss": -6.5744404792785645, "global_step": 17296, "epoch": 102} {"train_loss": -6.572890281677246, "global_step": 17297, "epoch": 102} {"train_loss": -6.7039408683776855, "global_step": 17298, "epoch": 102} {"train_loss": -6.614197254180908, "global_step": 17299, "epoch": 102} {"train_loss": -6.649101257324219, "global_step": 17300, "epoch": 102} {"train_loss": -6.467841625213623, "global_step": 17301, "epoch": 102} {"train_loss": -6.649083137512207, "global_step": 17302, "epoch": 102} {"train_loss": -6.584595370860327, "global_step": 17303, "epoch": 102, "val_loss": 231723.828125} {"train_loss": -6.550579071044922, "global_step": 17304, "epoch": 103} {"train_loss": -6.556704521179199, "global_step": 17305, "epoch": 103} {"train_loss": -6.377772331237793, "global_step": 17306, "epoch": 103} {"train_loss": -6.691619873046875, "global_step": 17307, "epoch": 103} {"train_loss": -6.318485260009766, "global_step": 17308, "epoch": 103} {"train_loss": -6.496586322784424, "global_step": 17309, "epoch": 103} {"train_loss": -6.331978797912598, "global_step": 17310, "epoch": 103} {"train_loss": -6.496172904968262, "global_step": 17311, "epoch": 103} {"train_loss": -6.348381519317627, "global_step": 17312, "epoch": 103} {"train_loss": -6.445661544799805, "global_step": 17313, "epoch": 103} {"train_loss": -6.079501152038574, "global_step": 17314, "epoch": 103} {"train_loss": -6.475711345672607, "global_step": 17315, "epoch": 103} {"train_loss": -6.360817909240723, "global_step": 17316, "epoch": 103} {"train_loss": -6.649042129516602, "global_step": 17317, "epoch": 103} {"train_loss": -6.451231002807617, "global_step": 17318, "epoch": 103} {"train_loss": -6.565303325653076, "global_step": 17319, "epoch": 103} {"train_loss": -6.566840171813965, "global_step": 17320, "epoch": 103} {"train_loss": -6.010397911071777, "global_step": 17321, "epoch": 103} {"train_loss": -6.557618618011475, "global_step": 17322, "epoch": 103} {"train_loss": -6.340590476989746, "global_step": 17323, "epoch": 103} {"train_loss": -6.478618621826172, "global_step": 17324, "epoch": 103} {"train_loss": -6.342658519744873, "global_step": 17325, "epoch": 103} {"train_loss": -6.439704895019531, "global_step": 17326, "epoch": 103} {"train_loss": -6.669686794281006, "global_step": 17327, "epoch": 103} {"train_loss": -6.559653282165527, "global_step": 17328, "epoch": 103} {"train_loss": -6.403846740722656, "global_step": 17329, "epoch": 103} {"train_loss": -6.3499040603637695, "global_step": 17330, "epoch": 103} {"train_loss": -6.526820659637451, "global_step": 17331, "epoch": 103} {"train_loss": -6.6126604080200195, "global_step": 17332, "epoch": 103} {"train_loss": -6.645043849945068, "global_step": 17333, "epoch": 103} {"train_loss": -6.568892478942871, "global_step": 17334, "epoch": 103} {"train_loss": -6.492297649383545, "global_step": 17335, "epoch": 103} {"train_loss": -6.516606330871582, "global_step": 17336, "epoch": 103} {"train_loss": -6.714449405670166, "global_step": 17337, "epoch": 103} {"train_loss": -6.623164176940918, "global_step": 17338, "epoch": 103} {"train_loss": -6.307114601135254, "global_step": 17339, "epoch": 103} {"train_loss": -6.6927900314331055, "global_step": 17340, "epoch": 103} {"train_loss": -6.516756534576416, "global_step": 17341, "epoch": 103} {"train_loss": -5.847066879272461, "global_step": 17342, "epoch": 103} {"train_loss": -6.523953437805176, "global_step": 17343, "epoch": 103} {"train_loss": -6.214962005615234, "global_step": 17344, "epoch": 103} {"train_loss": -6.463057994842529, "global_step": 17345, "epoch": 103} {"train_loss": -6.554958343505859, "global_step": 17346, "epoch": 103} {"train_loss": -6.169921875, "global_step": 17347, "epoch": 103} {"train_loss": -6.307040214538574, "global_step": 17348, "epoch": 103} {"train_loss": -6.627043724060059, "global_step": 17349, "epoch": 103} {"train_loss": -6.5523834228515625, "global_step": 17350, "epoch": 103} {"train_loss": -6.318234443664551, "global_step": 17351, "epoch": 103} {"train_loss": -6.331015110015869, "global_step": 17352, "epoch": 103} {"train_loss": -6.3619842529296875, "global_step": 17353, "epoch": 103} {"train_loss": -6.782279968261719, "global_step": 17354, "epoch": 103} {"train_loss": -6.396553039550781, "global_step": 17355, "epoch": 103} {"train_loss": -6.605562210083008, "global_step": 17356, "epoch": 103} {"train_loss": -6.454559326171875, "global_step": 17357, "epoch": 103} {"train_loss": -6.557738304138184, "global_step": 17358, "epoch": 103} {"train_loss": -6.576345920562744, "global_step": 17359, "epoch": 103} {"train_loss": -6.523359775543213, "global_step": 17360, "epoch": 103} {"train_loss": -6.441661357879639, "global_step": 17361, "epoch": 103} {"train_loss": -6.549590587615967, "global_step": 17362, "epoch": 103} {"train_loss": -6.538888931274414, "global_step": 17363, "epoch": 103} {"train_loss": -6.336081504821777, "global_step": 17364, "epoch": 103} {"train_loss": -6.260653972625732, "global_step": 17365, "epoch": 103} {"train_loss": -6.285774230957031, "global_step": 17366, "epoch": 103} {"train_loss": -6.276181697845459, "global_step": 17367, "epoch": 103} {"train_loss": -6.113473892211914, "global_step": 17368, "epoch": 103} {"train_loss": -6.31129264831543, "global_step": 17369, "epoch": 103} {"train_loss": -6.216857433319092, "global_step": 17370, "epoch": 103} {"train_loss": -6.543129920959473, "global_step": 17371, "epoch": 103} {"train_loss": -6.209782600402832, "global_step": 17372, "epoch": 103} {"train_loss": -6.229592323303223, "global_step": 17373, "epoch": 103} {"train_loss": -6.452755928039551, "global_step": 17374, "epoch": 103} {"train_loss": -6.353571891784668, "global_step": 17375, "epoch": 103} {"train_loss": -6.417324066162109, "global_step": 17376, "epoch": 103} {"train_loss": -6.383380889892578, "global_step": 17377, "epoch": 103} {"train_loss": -6.458371162414551, "global_step": 17378, "epoch": 103} {"train_loss": -6.699361801147461, "global_step": 17379, "epoch": 103} {"train_loss": -6.6260294914245605, "global_step": 17380, "epoch": 103} {"train_loss": -6.551856994628906, "global_step": 17381, "epoch": 103} {"train_loss": -6.830862045288086, "global_step": 17382, "epoch": 103} {"train_loss": -6.418585777282715, "global_step": 17383, "epoch": 103} {"train_loss": -6.8182501792907715, "global_step": 17384, "epoch": 103} {"train_loss": -6.647570610046387, "global_step": 17385, "epoch": 103} {"train_loss": -6.800578594207764, "global_step": 17386, "epoch": 103} {"train_loss": -6.700546741485596, "global_step": 17387, "epoch": 103} {"train_loss": -6.566839218139648, "global_step": 17388, "epoch": 103} {"train_loss": -6.578910827636719, "global_step": 17389, "epoch": 103} {"train_loss": -6.713283538818359, "global_step": 17390, "epoch": 103} {"train_loss": -6.757992744445801, "global_step": 17391, "epoch": 103} {"train_loss": -6.6188249588012695, "global_step": 17392, "epoch": 103} {"train_loss": -6.88842248916626, "global_step": 17393, "epoch": 103} {"train_loss": -6.705889701843262, "global_step": 17394, "epoch": 103} {"train_loss": -6.533720016479492, "global_step": 17395, "epoch": 103} {"train_loss": -6.650167942047119, "global_step": 17396, "epoch": 103} {"train_loss": -6.6737284660339355, "global_step": 17397, "epoch": 103} {"train_loss": -6.677602291107178, "global_step": 17398, "epoch": 103} {"train_loss": -6.511363506317139, "global_step": 17399, "epoch": 103} {"train_loss": -6.146513938903809, "global_step": 17400, "epoch": 103} {"train_loss": -6.686103820800781, "global_step": 17401, "epoch": 103} {"train_loss": -6.474015712738037, "global_step": 17402, "epoch": 103} {"train_loss": -6.658361434936523, "global_step": 17403, "epoch": 103} {"train_loss": -6.42912483215332, "global_step": 17404, "epoch": 103} {"train_loss": -6.619017601013184, "global_step": 17405, "epoch": 103} {"train_loss": -6.624227046966553, "global_step": 17406, "epoch": 103} {"train_loss": -6.512655258178711, "global_step": 17407, "epoch": 103} {"train_loss": -6.509092330932617, "global_step": 17408, "epoch": 103} {"train_loss": -6.537874221801758, "global_step": 17409, "epoch": 103} {"train_loss": -6.589937210083008, "global_step": 17410, "epoch": 103} {"train_loss": -6.463229179382324, "global_step": 17411, "epoch": 103} {"train_loss": -6.772028923034668, "global_step": 17412, "epoch": 103} {"train_loss": -6.50942325592041, "global_step": 17413, "epoch": 103} {"train_loss": -6.550965309143066, "global_step": 17414, "epoch": 103} {"train_loss": -6.440881729125977, "global_step": 17415, "epoch": 103} {"train_loss": -6.634293556213379, "global_step": 17416, "epoch": 103} {"train_loss": -6.50665283203125, "global_step": 17417, "epoch": 103} {"train_loss": -6.61814022064209, "global_step": 17418, "epoch": 103} {"train_loss": -6.640727519989014, "global_step": 17419, "epoch": 103} {"train_loss": -6.584514141082764, "global_step": 17420, "epoch": 103} {"train_loss": -6.641894340515137, "global_step": 17421, "epoch": 103} {"train_loss": -6.644470691680908, "global_step": 17422, "epoch": 103} {"train_loss": -6.768344402313232, "global_step": 17423, "epoch": 103} {"train_loss": -6.631077289581299, "global_step": 17424, "epoch": 103} {"train_loss": -6.805399417877197, "global_step": 17425, "epoch": 103} {"train_loss": -6.788269996643066, "global_step": 17426, "epoch": 103} {"train_loss": -6.6866607666015625, "global_step": 17427, "epoch": 103} {"train_loss": -6.483366966247559, "global_step": 17428, "epoch": 103} {"train_loss": -6.600487232208252, "global_step": 17429, "epoch": 103} {"train_loss": -6.516363143920898, "global_step": 17430, "epoch": 103} {"train_loss": -6.487480640411377, "global_step": 17431, "epoch": 103} {"train_loss": -6.768941402435303, "global_step": 17432, "epoch": 103} {"train_loss": -6.705265522003174, "global_step": 17433, "epoch": 103} {"train_loss": -6.672843933105469, "global_step": 17434, "epoch": 103} {"train_loss": -6.408102035522461, "global_step": 17435, "epoch": 103} {"train_loss": -6.654555320739746, "global_step": 17436, "epoch": 103} {"train_loss": -6.673402786254883, "global_step": 17437, "epoch": 103} {"train_loss": -6.383206367492676, "global_step": 17438, "epoch": 103} {"train_loss": -6.831801414489746, "global_step": 17439, "epoch": 103} {"train_loss": -6.497005939483643, "global_step": 17440, "epoch": 103} {"train_loss": -6.7009806632995605, "global_step": 17441, "epoch": 103} {"train_loss": -6.186349868774414, "global_step": 17442, "epoch": 103} {"train_loss": -6.654989242553711, "global_step": 17443, "epoch": 103} {"train_loss": -6.455461502075195, "global_step": 17444, "epoch": 103} {"train_loss": -6.497275352478027, "global_step": 17445, "epoch": 103} {"train_loss": -6.517022609710693, "global_step": 17446, "epoch": 103} {"train_loss": -6.489734649658203, "global_step": 17447, "epoch": 103} {"train_loss": -6.688622951507568, "global_step": 17448, "epoch": 103} {"train_loss": -6.470232009887695, "global_step": 17449, "epoch": 103} {"train_loss": -6.509683609008789, "global_step": 17450, "epoch": 103} {"train_loss": -6.360841751098633, "global_step": 17451, "epoch": 103} {"train_loss": -6.493297576904297, "global_step": 17452, "epoch": 103} {"train_loss": -6.536922454833984, "global_step": 17453, "epoch": 103} {"train_loss": -6.620230674743652, "global_step": 17454, "epoch": 103} {"train_loss": -6.5239973068237305, "global_step": 17455, "epoch": 103} {"train_loss": -6.627218246459961, "global_step": 17456, "epoch": 103} {"train_loss": -6.770814895629883, "global_step": 17457, "epoch": 103} {"train_loss": -6.490134239196777, "global_step": 17458, "epoch": 103} {"train_loss": -6.757158279418945, "global_step": 17459, "epoch": 103} {"train_loss": -6.357828140258789, "global_step": 17460, "epoch": 103} {"train_loss": -6.639690399169922, "global_step": 17461, "epoch": 103} {"train_loss": -6.500997066497803, "global_step": 17462, "epoch": 103} {"train_loss": -6.796911239624023, "global_step": 17463, "epoch": 103} {"train_loss": -6.103843688964844, "global_step": 17464, "epoch": 103} {"train_loss": -6.730171203613281, "global_step": 17465, "epoch": 103} {"train_loss": -6.323837757110596, "global_step": 17466, "epoch": 103} {"train_loss": -6.503276348114014, "global_step": 17467, "epoch": 103} {"train_loss": -6.4564032554626465, "global_step": 17468, "epoch": 103} {"train_loss": -6.683516502380371, "global_step": 17469, "epoch": 103} {"train_loss": -6.8140387535095215, "global_step": 17470, "epoch": 103} {"train_loss": -6.5218413557325094, "global_step": 17471, "epoch": 103, "val_loss": 228025.0} {"train_loss": -6.761808395385742, "global_step": 17472, "epoch": 104} {"train_loss": -6.661426544189453, "global_step": 17473, "epoch": 104} {"train_loss": -6.616125106811523, "global_step": 17474, "epoch": 104} {"train_loss": -6.47315788269043, "global_step": 17475, "epoch": 104} {"train_loss": -6.70602560043335, "global_step": 17476, "epoch": 104} {"train_loss": -6.547615051269531, "global_step": 17477, "epoch": 104} {"train_loss": -6.714745044708252, "global_step": 17478, "epoch": 104} {"train_loss": -6.655926704406738, "global_step": 17479, "epoch": 104} {"train_loss": -6.558636665344238, "global_step": 17480, "epoch": 104} {"train_loss": -6.73293399810791, "global_step": 17481, "epoch": 104} {"train_loss": -6.612119674682617, "global_step": 17482, "epoch": 104} {"train_loss": -6.640143394470215, "global_step": 17483, "epoch": 104} {"train_loss": -6.629177570343018, "global_step": 17484, "epoch": 104} {"train_loss": -6.673645496368408, "global_step": 17485, "epoch": 104} {"train_loss": -6.6456522941589355, "global_step": 17486, "epoch": 104} {"train_loss": -6.788092136383057, "global_step": 17487, "epoch": 104} {"train_loss": -6.436023712158203, "global_step": 17488, "epoch": 104} {"train_loss": -6.887020111083984, "global_step": 17489, "epoch": 104} {"train_loss": -6.800922393798828, "global_step": 17490, "epoch": 104} {"train_loss": -6.808566570281982, "global_step": 17491, "epoch": 104} {"train_loss": -6.7508320808410645, "global_step": 17492, "epoch": 104} {"train_loss": -6.6632866859436035, "global_step": 17493, "epoch": 104} {"train_loss": -6.458745002746582, "global_step": 17494, "epoch": 104} {"train_loss": -6.553004741668701, "global_step": 17495, "epoch": 104} {"train_loss": -6.734586238861084, "global_step": 17496, "epoch": 104} {"train_loss": -6.784914970397949, "global_step": 17497, "epoch": 104} {"train_loss": -6.6247453689575195, "global_step": 17498, "epoch": 104} {"train_loss": -6.329524993896484, "global_step": 17499, "epoch": 104} {"train_loss": -6.359992980957031, "global_step": 17500, "epoch": 104} {"train_loss": -6.111728668212891, "global_step": 17501, "epoch": 104} {"train_loss": -6.503584384918213, "global_step": 17502, "epoch": 104} {"train_loss": -6.180883884429932, "global_step": 17503, "epoch": 104} {"train_loss": -6.451498985290527, "global_step": 17504, "epoch": 104} {"train_loss": -6.72122049331665, "global_step": 17505, "epoch": 104} {"train_loss": -6.232717514038086, "global_step": 17506, "epoch": 104} {"train_loss": -6.298084259033203, "global_step": 17507, "epoch": 104} {"train_loss": -6.458565711975098, "global_step": 17508, "epoch": 104} {"train_loss": -6.607488632202148, "global_step": 17509, "epoch": 104} {"train_loss": -6.485317230224609, "global_step": 17510, "epoch": 104} {"train_loss": -6.626804351806641, "global_step": 17511, "epoch": 104} {"train_loss": -6.534903526306152, "global_step": 17512, "epoch": 104} {"train_loss": -6.398373603820801, "global_step": 17513, "epoch": 104} {"train_loss": -6.717460632324219, "global_step": 17514, "epoch": 104} {"train_loss": -6.4170098304748535, "global_step": 17515, "epoch": 104} {"train_loss": -6.760190010070801, "global_step": 17516, "epoch": 104} {"train_loss": -6.523385047912598, "global_step": 17517, "epoch": 104} {"train_loss": -6.605733394622803, "global_step": 17518, "epoch": 104} {"train_loss": -6.514245986938477, "global_step": 17519, "epoch": 104} {"train_loss": -6.523829460144043, "global_step": 17520, "epoch": 104} {"train_loss": -6.779921054840088, "global_step": 17521, "epoch": 104} {"train_loss": -6.695300102233887, "global_step": 17522, "epoch": 104} {"train_loss": -6.396853446960449, "global_step": 17523, "epoch": 104} {"train_loss": -6.699476718902588, "global_step": 17524, "epoch": 104} {"train_loss": -6.397366523742676, "global_step": 17525, "epoch": 104} {"train_loss": -6.669094562530518, "global_step": 17526, "epoch": 104} {"train_loss": -6.612862586975098, "global_step": 17527, "epoch": 104} {"train_loss": -6.777491569519043, "global_step": 17528, "epoch": 104} {"train_loss": -6.542972564697266, "global_step": 17529, "epoch": 104} {"train_loss": -6.580101013183594, "global_step": 17530, "epoch": 104} {"train_loss": -6.583699703216553, "global_step": 17531, "epoch": 104} {"train_loss": -6.253658294677734, "global_step": 17532, "epoch": 104} {"train_loss": -6.385833263397217, "global_step": 17533, "epoch": 104} {"train_loss": -6.686459541320801, "global_step": 17534, "epoch": 104} {"train_loss": -6.4667205810546875, "global_step": 17535, "epoch": 104} {"train_loss": -6.317473411560059, "global_step": 17536, "epoch": 104} {"train_loss": -6.558966636657715, "global_step": 17537, "epoch": 104} {"train_loss": -6.511897563934326, "global_step": 17538, "epoch": 104} {"train_loss": -6.282351493835449, "global_step": 17539, "epoch": 104} {"train_loss": -6.6510515213012695, "global_step": 17540, "epoch": 104} {"train_loss": -6.3950090408325195, "global_step": 17541, "epoch": 104} {"train_loss": -6.200031280517578, "global_step": 17542, "epoch": 104} {"train_loss": -6.676582336425781, "global_step": 17543, "epoch": 104} {"train_loss": -6.521419525146484, "global_step": 17544, "epoch": 104} {"train_loss": -6.672876358032227, "global_step": 17545, "epoch": 104} {"train_loss": -6.627716541290283, "global_step": 17546, "epoch": 104} {"train_loss": -6.662755966186523, "global_step": 17547, "epoch": 104} {"train_loss": -6.450643539428711, "global_step": 17548, "epoch": 104} {"train_loss": -6.730863571166992, "global_step": 17549, "epoch": 104} {"train_loss": -6.596333026885986, "global_step": 17550, "epoch": 104} {"train_loss": -6.80444860458374, "global_step": 17551, "epoch": 104} {"train_loss": -6.688127517700195, "global_step": 17552, "epoch": 104} {"train_loss": -6.531004905700684, "global_step": 17553, "epoch": 104} {"train_loss": -6.498149871826172, "global_step": 17554, "epoch": 104} {"train_loss": -6.775245666503906, "global_step": 17555, "epoch": 104} {"train_loss": -6.69893741607666, "global_step": 17556, "epoch": 104} {"train_loss": -6.824275970458984, "global_step": 17557, "epoch": 104} {"train_loss": -6.671672821044922, "global_step": 17558, "epoch": 104} {"train_loss": -6.476573944091797, "global_step": 17559, "epoch": 104} {"train_loss": -6.616393089294434, "global_step": 17560, "epoch": 104} {"train_loss": -6.523153305053711, "global_step": 17561, "epoch": 104} {"train_loss": -6.527891159057617, "global_step": 17562, "epoch": 104} {"train_loss": -6.542075157165527, "global_step": 17563, "epoch": 104} {"train_loss": -6.402578353881836, "global_step": 17564, "epoch": 104} {"train_loss": -6.494217395782471, "global_step": 17565, "epoch": 104} {"train_loss": -6.755767822265625, "global_step": 17566, "epoch": 104} {"train_loss": -6.644065856933594, "global_step": 17567, "epoch": 104} {"train_loss": -6.4483256340026855, "global_step": 17568, "epoch": 104} {"train_loss": -6.489044189453125, "global_step": 17569, "epoch": 104} {"train_loss": -6.425874710083008, "global_step": 17570, "epoch": 104} {"train_loss": -6.3978271484375, "global_step": 17571, "epoch": 104} {"train_loss": -6.347430229187012, "global_step": 17572, "epoch": 104} {"train_loss": -6.6261887550354, "global_step": 17573, "epoch": 104} {"train_loss": -6.732240676879883, "global_step": 17574, "epoch": 104} {"train_loss": -6.612559795379639, "global_step": 17575, "epoch": 104} {"train_loss": -6.585665702819824, "global_step": 17576, "epoch": 104} {"train_loss": -6.609050750732422, "global_step": 17577, "epoch": 104} {"train_loss": -6.757333278656006, "global_step": 17578, "epoch": 104} {"train_loss": -6.5301313400268555, "global_step": 17579, "epoch": 104} {"train_loss": -6.7489013671875, "global_step": 17580, "epoch": 104} {"train_loss": -6.681520462036133, "global_step": 17581, "epoch": 104} {"train_loss": -6.849948406219482, "global_step": 17582, "epoch": 104} {"train_loss": -6.385890007019043, "global_step": 17583, "epoch": 104} {"train_loss": -6.446709632873535, "global_step": 17584, "epoch": 104} {"train_loss": -6.429356575012207, "global_step": 17585, "epoch": 104} {"train_loss": -6.769708633422852, "global_step": 17586, "epoch": 104} {"train_loss": -6.801216125488281, "global_step": 17587, "epoch": 104} {"train_loss": -6.533401012420654, "global_step": 17588, "epoch": 104} {"train_loss": -6.73280668258667, "global_step": 17589, "epoch": 104} {"train_loss": -6.585912704467773, "global_step": 17590, "epoch": 104} {"train_loss": -6.6473493576049805, "global_step": 17591, "epoch": 104} {"train_loss": -6.680485725402832, "global_step": 17592, "epoch": 104} {"train_loss": -6.558633804321289, "global_step": 17593, "epoch": 104} {"train_loss": -6.561952590942383, "global_step": 17594, "epoch": 104} {"train_loss": -6.3477630615234375, "global_step": 17595, "epoch": 104} {"train_loss": -6.498420715332031, "global_step": 17596, "epoch": 104} {"train_loss": -6.44277286529541, "global_step": 17597, "epoch": 104} {"train_loss": -6.66969108581543, "global_step": 17598, "epoch": 104} {"train_loss": -6.540007591247559, "global_step": 17599, "epoch": 104} {"train_loss": -6.536810874938965, "global_step": 17600, "epoch": 104} {"train_loss": -6.644975662231445, "global_step": 17601, "epoch": 104} {"train_loss": -6.533880233764648, "global_step": 17602, "epoch": 104} {"train_loss": -6.438769340515137, "global_step": 17603, "epoch": 104} {"train_loss": -6.55770206451416, "global_step": 17604, "epoch": 104} {"train_loss": -6.449936866760254, "global_step": 17605, "epoch": 104} {"train_loss": -6.608431339263916, "global_step": 17606, "epoch": 104} {"train_loss": -6.4837965965271, "global_step": 17607, "epoch": 104} {"train_loss": -6.603711128234863, "global_step": 17608, "epoch": 104} {"train_loss": -6.580636024475098, "global_step": 17609, "epoch": 104} {"train_loss": -6.40463924407959, "global_step": 17610, "epoch": 104} {"train_loss": -6.545836448669434, "global_step": 17611, "epoch": 104} {"train_loss": -6.515902519226074, "global_step": 17612, "epoch": 104} {"train_loss": -6.76108980178833, "global_step": 17613, "epoch": 104} {"train_loss": -6.371592998504639, "global_step": 17614, "epoch": 104} {"train_loss": -6.429459571838379, "global_step": 17615, "epoch": 104} {"train_loss": -6.671231746673584, "global_step": 17616, "epoch": 104} {"train_loss": -6.601153373718262, "global_step": 17617, "epoch": 104} {"train_loss": -6.566822528839111, "global_step": 17618, "epoch": 104} {"train_loss": -6.319785118103027, "global_step": 17619, "epoch": 104} {"train_loss": -6.418102264404297, "global_step": 17620, "epoch": 104} {"train_loss": -6.384274959564209, "global_step": 17621, "epoch": 104} {"train_loss": -6.694029808044434, "global_step": 17622, "epoch": 104} {"train_loss": -6.549096584320068, "global_step": 17623, "epoch": 104} {"train_loss": -6.650559425354004, "global_step": 17624, "epoch": 104} {"train_loss": -6.620868682861328, "global_step": 17625, "epoch": 104} {"train_loss": -6.5695953369140625, "global_step": 17626, "epoch": 104} {"train_loss": -6.423195838928223, "global_step": 17627, "epoch": 104} {"train_loss": -6.562832832336426, "global_step": 17628, "epoch": 104} {"train_loss": -6.662308692932129, "global_step": 17629, "epoch": 104} {"train_loss": -6.554676055908203, "global_step": 17630, "epoch": 104} {"train_loss": -6.426285743713379, "global_step": 17631, "epoch": 104} {"train_loss": -6.680074214935303, "global_step": 17632, "epoch": 104} {"train_loss": -6.616620063781738, "global_step": 17633, "epoch": 104} {"train_loss": -6.629049301147461, "global_step": 17634, "epoch": 104} {"train_loss": -6.591281890869141, "global_step": 17635, "epoch": 104} {"train_loss": -6.562950611114502, "global_step": 17636, "epoch": 104} {"train_loss": -6.7642083168029785, "global_step": 17637, "epoch": 104} {"train_loss": -6.399570465087891, "global_step": 17638, "epoch": 104} {"train_loss": -6.568905867281414, "global_step": 17639, "epoch": 104, "val_loss": 230390.296875} {"train_loss": -6.249894142150879, "global_step": 17640, "epoch": 105} {"train_loss": -6.632662773132324, "global_step": 17641, "epoch": 105} {"train_loss": -6.679727077484131, "global_step": 17642, "epoch": 105} {"train_loss": -6.291476249694824, "global_step": 17643, "epoch": 105} {"train_loss": -6.564101696014404, "global_step": 17644, "epoch": 105} {"train_loss": -6.182816982269287, "global_step": 17645, "epoch": 105} {"train_loss": -6.4099225997924805, "global_step": 17646, "epoch": 105} {"train_loss": -6.612445831298828, "global_step": 17647, "epoch": 105} {"train_loss": -6.190345287322998, "global_step": 17648, "epoch": 105} {"train_loss": -6.02375602722168, "global_step": 17649, "epoch": 105} {"train_loss": -6.60657262802124, "global_step": 17650, "epoch": 105} {"train_loss": -6.192252159118652, "global_step": 17651, "epoch": 105} {"train_loss": -6.379271507263184, "global_step": 17652, "epoch": 105} {"train_loss": -6.447789192199707, "global_step": 17653, "epoch": 105} {"train_loss": -6.324944496154785, "global_step": 17654, "epoch": 105} {"train_loss": -6.516692161560059, "global_step": 17655, "epoch": 105} {"train_loss": -6.385195732116699, "global_step": 17656, "epoch": 105} {"train_loss": -6.458155155181885, "global_step": 17657, "epoch": 105} {"train_loss": -6.4188103675842285, "global_step": 17658, "epoch": 105} {"train_loss": -6.584567070007324, "global_step": 17659, "epoch": 105} {"train_loss": -6.395358085632324, "global_step": 17660, "epoch": 105} {"train_loss": -6.543195724487305, "global_step": 17661, "epoch": 105} {"train_loss": -6.4759521484375, "global_step": 17662, "epoch": 105} {"train_loss": -6.574440956115723, "global_step": 17663, "epoch": 105} {"train_loss": -6.398661136627197, "global_step": 17664, "epoch": 105} {"train_loss": -6.416542053222656, "global_step": 17665, "epoch": 105} {"train_loss": -6.597025394439697, "global_step": 17666, "epoch": 105} {"train_loss": -6.595019340515137, "global_step": 17667, "epoch": 105} {"train_loss": -6.490041732788086, "global_step": 17668, "epoch": 105} {"train_loss": -6.634933948516846, "global_step": 17669, "epoch": 105} {"train_loss": -6.483182907104492, "global_step": 17670, "epoch": 105} {"train_loss": -6.859332084655762, "global_step": 17671, "epoch": 105} {"train_loss": -6.413917541503906, "global_step": 17672, "epoch": 105} {"train_loss": -6.50714111328125, "global_step": 17673, "epoch": 105} {"train_loss": -6.53925085067749, "global_step": 17674, "epoch": 105} {"train_loss": -6.7313008308410645, "global_step": 17675, "epoch": 105} {"train_loss": -6.716785430908203, "global_step": 17676, "epoch": 105} {"train_loss": -6.543768405914307, "global_step": 17677, "epoch": 105} {"train_loss": -6.762285232543945, "global_step": 17678, "epoch": 105} {"train_loss": -6.581774711608887, "global_step": 17679, "epoch": 105} {"train_loss": -6.452875137329102, "global_step": 17680, "epoch": 105} {"train_loss": -6.712120056152344, "global_step": 17681, "epoch": 105} {"train_loss": -6.822599411010742, "global_step": 17682, "epoch": 105} {"train_loss": -6.545065879821777, "global_step": 17683, "epoch": 105} {"train_loss": -6.409296989440918, "global_step": 17684, "epoch": 105} {"train_loss": -6.709902286529541, "global_step": 17685, "epoch": 105} {"train_loss": -6.755007743835449, "global_step": 17686, "epoch": 105} {"train_loss": -6.864192008972168, "global_step": 17687, "epoch": 105} {"train_loss": -6.761754035949707, "global_step": 17688, "epoch": 105} {"train_loss": -6.723630905151367, "global_step": 17689, "epoch": 105} {"train_loss": -6.592550277709961, "global_step": 17690, "epoch": 105} {"train_loss": -6.475011825561523, "global_step": 17691, "epoch": 105} {"train_loss": -6.7482523918151855, "global_step": 17692, "epoch": 105} {"train_loss": -6.888330459594727, "global_step": 17693, "epoch": 105} {"train_loss": -6.776684761047363, "global_step": 17694, "epoch": 105} {"train_loss": -6.652047157287598, "global_step": 17695, "epoch": 105} {"train_loss": -6.774532318115234, "global_step": 17696, "epoch": 105} {"train_loss": -6.767467498779297, "global_step": 17697, "epoch": 105} {"train_loss": -6.614432334899902, "global_step": 17698, "epoch": 105} {"train_loss": -6.450323104858398, "global_step": 17699, "epoch": 105} {"train_loss": -6.353933334350586, "global_step": 17700, "epoch": 105} {"train_loss": -6.8104047775268555, "global_step": 17701, "epoch": 105} {"train_loss": -6.839611053466797, "global_step": 17702, "epoch": 105} {"train_loss": -6.479253768920898, "global_step": 17703, "epoch": 105} {"train_loss": -6.624699592590332, "global_step": 17704, "epoch": 105} {"train_loss": -6.653332710266113, "global_step": 17705, "epoch": 105} {"train_loss": -6.582003116607666, "global_step": 17706, "epoch": 105} {"train_loss": -6.624521255493164, "global_step": 17707, "epoch": 105} {"train_loss": -6.418545722961426, "global_step": 17708, "epoch": 105} {"train_loss": -6.670558929443359, "global_step": 17709, "epoch": 105} {"train_loss": -6.437353134155273, "global_step": 17710, "epoch": 105} {"train_loss": -6.665066719055176, "global_step": 17711, "epoch": 105} {"train_loss": -6.656187534332275, "global_step": 17712, "epoch": 105} {"train_loss": -6.369452476501465, "global_step": 17713, "epoch": 105} {"train_loss": -6.674357891082764, "global_step": 17714, "epoch": 105} {"train_loss": -6.458636283874512, "global_step": 17715, "epoch": 105} {"train_loss": -6.635897636413574, "global_step": 17716, "epoch": 105} {"train_loss": -6.806171417236328, "global_step": 17717, "epoch": 105} {"train_loss": -6.913137435913086, "global_step": 17718, "epoch": 105} {"train_loss": -6.3863348960876465, "global_step": 17719, "epoch": 105} {"train_loss": -6.502931594848633, "global_step": 17720, "epoch": 105} {"train_loss": -6.390045642852783, "global_step": 17721, "epoch": 105} {"train_loss": -6.82574987411499, "global_step": 17722, "epoch": 105} {"train_loss": -6.462460517883301, "global_step": 17723, "epoch": 105} {"train_loss": -6.830418586730957, "global_step": 17724, "epoch": 105} {"train_loss": -6.5919189453125, "global_step": 17725, "epoch": 105} {"train_loss": -6.554800033569336, "global_step": 17726, "epoch": 105} {"train_loss": -6.334352493286133, "global_step": 17727, "epoch": 105} {"train_loss": -6.681051254272461, "global_step": 17728, "epoch": 105} {"train_loss": -6.873164176940918, "global_step": 17729, "epoch": 105} {"train_loss": -6.3613386154174805, "global_step": 17730, "epoch": 105} {"train_loss": -6.638979911804199, "global_step": 17731, "epoch": 105} {"train_loss": -6.597177505493164, "global_step": 17732, "epoch": 105} {"train_loss": -6.748454570770264, "global_step": 17733, "epoch": 105} {"train_loss": -6.609248161315918, "global_step": 17734, "epoch": 105} {"train_loss": -6.738924503326416, "global_step": 17735, "epoch": 105} {"train_loss": -6.767475128173828, "global_step": 17736, "epoch": 105} {"train_loss": -6.548507213592529, "global_step": 17737, "epoch": 105} {"train_loss": -6.74997091293335, "global_step": 17738, "epoch": 105} {"train_loss": -6.851437568664551, "global_step": 17739, "epoch": 105} {"train_loss": -6.590236663818359, "global_step": 17740, "epoch": 105} {"train_loss": -6.7611403465271, "global_step": 17741, "epoch": 105} {"train_loss": -6.579056739807129, "global_step": 17742, "epoch": 105} {"train_loss": -6.821205139160156, "global_step": 17743, "epoch": 105} {"train_loss": -6.4314422607421875, "global_step": 17744, "epoch": 105} {"train_loss": -6.689925193786621, "global_step": 17745, "epoch": 105} {"train_loss": -6.615797519683838, "global_step": 17746, "epoch": 105} {"train_loss": -6.629731178283691, "global_step": 17747, "epoch": 105} {"train_loss": -6.692222595214844, "global_step": 17748, "epoch": 105} {"train_loss": -6.797579765319824, "global_step": 17749, "epoch": 105} {"train_loss": -6.706157684326172, "global_step": 17750, "epoch": 105} {"train_loss": -6.684149742126465, "global_step": 17751, "epoch": 105} {"train_loss": -6.680390357971191, "global_step": 17752, "epoch": 105} {"train_loss": -6.76641845703125, "global_step": 17753, "epoch": 105} {"train_loss": -6.591979026794434, "global_step": 17754, "epoch": 105} {"train_loss": -6.655633926391602, "global_step": 17755, "epoch": 105} {"train_loss": -6.789441108703613, "global_step": 17756, "epoch": 105} {"train_loss": -6.853633403778076, "global_step": 17757, "epoch": 105} {"train_loss": -6.636684417724609, "global_step": 17758, "epoch": 105} {"train_loss": -6.797024726867676, "global_step": 17759, "epoch": 105} {"train_loss": -6.266683578491211, "global_step": 17760, "epoch": 105} {"train_loss": -6.647969722747803, "global_step": 17761, "epoch": 105} {"train_loss": -6.478468418121338, "global_step": 17762, "epoch": 105} {"train_loss": -6.484807968139648, "global_step": 17763, "epoch": 105} {"train_loss": -6.519360065460205, "global_step": 17764, "epoch": 105} {"train_loss": -6.580370903015137, "global_step": 17765, "epoch": 105} {"train_loss": -6.693523406982422, "global_step": 17766, "epoch": 105} {"train_loss": -6.427073955535889, "global_step": 17767, "epoch": 105} {"train_loss": -6.661806106567383, "global_step": 17768, "epoch": 105} {"train_loss": -6.461357116699219, "global_step": 17769, "epoch": 105} {"train_loss": -6.5142436027526855, "global_step": 17770, "epoch": 105} {"train_loss": -6.132051944732666, "global_step": 17771, "epoch": 105} {"train_loss": -6.431140899658203, "global_step": 17772, "epoch": 105} {"train_loss": -6.531164169311523, "global_step": 17773, "epoch": 105} {"train_loss": -6.614405155181885, "global_step": 17774, "epoch": 105} {"train_loss": -6.326940536499023, "global_step": 17775, "epoch": 105} {"train_loss": -6.205502510070801, "global_step": 17776, "epoch": 105} {"train_loss": -6.401268005371094, "global_step": 17777, "epoch": 105} {"train_loss": -6.614023208618164, "global_step": 17778, "epoch": 105} {"train_loss": -6.533145427703857, "global_step": 17779, "epoch": 105} {"train_loss": -6.550398826599121, "global_step": 17780, "epoch": 105} {"train_loss": -6.702879905700684, "global_step": 17781, "epoch": 105} {"train_loss": -6.672924041748047, "global_step": 17782, "epoch": 105} {"train_loss": -6.319115161895752, "global_step": 17783, "epoch": 105} {"train_loss": -6.408021926879883, "global_step": 17784, "epoch": 105} {"train_loss": -6.610845565795898, "global_step": 17785, "epoch": 105} {"train_loss": -6.53355598449707, "global_step": 17786, "epoch": 105} {"train_loss": -6.434086799621582, "global_step": 17787, "epoch": 105} {"train_loss": -6.554139137268066, "global_step": 17788, "epoch": 105} {"train_loss": -6.493896484375, "global_step": 17789, "epoch": 105} {"train_loss": -6.362706661224365, "global_step": 17790, "epoch": 105} {"train_loss": -6.426006317138672, "global_step": 17791, "epoch": 105} {"train_loss": -6.489406585693359, "global_step": 17792, "epoch": 105} {"train_loss": -6.564679145812988, "global_step": 17793, "epoch": 105} {"train_loss": -6.607320785522461, "global_step": 17794, "epoch": 105} {"train_loss": -6.6087446212768555, "global_step": 17795, "epoch": 105} {"train_loss": -6.690842628479004, "global_step": 17796, "epoch": 105} {"train_loss": -6.67329740524292, "global_step": 17797, "epoch": 105} {"train_loss": -6.607283115386963, "global_step": 17798, "epoch": 105} {"train_loss": -6.596445083618164, "global_step": 17799, "epoch": 105} {"train_loss": -6.758472442626953, "global_step": 17800, "epoch": 105} {"train_loss": -6.604925632476807, "global_step": 17801, "epoch": 105} {"train_loss": -6.774370193481445, "global_step": 17802, "epoch": 105} {"train_loss": -6.5441813468933105, "global_step": 17803, "epoch": 105} {"train_loss": -6.702685356140137, "global_step": 17804, "epoch": 105} {"train_loss": -6.807586669921875, "global_step": 17805, "epoch": 105} {"train_loss": -6.775444030761719, "global_step": 17806, "epoch": 105} {"train_loss": -6.579382172652653, "global_step": 17807, "epoch": 105, "val_loss": 235998.421875, "train_action_mse_error": 23.473846435546875} {"train_loss": -6.437741756439209, "global_step": 17808, "epoch": 106} {"train_loss": -6.9831109046936035, "global_step": 17809, "epoch": 106} {"train_loss": -6.50797176361084, "global_step": 17810, "epoch": 106} {"train_loss": -6.652935028076172, "global_step": 17811, "epoch": 106} {"train_loss": -6.714135646820068, "global_step": 17812, "epoch": 106} {"train_loss": -6.716796875, "global_step": 17813, "epoch": 106} {"train_loss": -6.6876935958862305, "global_step": 17814, "epoch": 106} {"train_loss": -6.653546333312988, "global_step": 17815, "epoch": 106} {"train_loss": -6.65369176864624, "global_step": 17816, "epoch": 106} {"train_loss": -6.375639915466309, "global_step": 17817, "epoch": 106} {"train_loss": -6.7360005378723145, "global_step": 17818, "epoch": 106} {"train_loss": -6.47354793548584, "global_step": 17819, "epoch": 106} {"train_loss": -6.597598075866699, "global_step": 17820, "epoch": 106} {"train_loss": -6.652386665344238, "global_step": 17821, "epoch": 106} {"train_loss": -6.7525787353515625, "global_step": 17822, "epoch": 106} {"train_loss": -6.643628120422363, "global_step": 17823, "epoch": 106} {"train_loss": -6.709402084350586, "global_step": 17824, "epoch": 106} {"train_loss": -6.5708770751953125, "global_step": 17825, "epoch": 106} {"train_loss": -6.36022424697876, "global_step": 17826, "epoch": 106} {"train_loss": -6.759452819824219, "global_step": 17827, "epoch": 106} {"train_loss": -6.396918296813965, "global_step": 17828, "epoch": 106} {"train_loss": -6.86680793762207, "global_step": 17829, "epoch": 106} {"train_loss": -6.558022499084473, "global_step": 17830, "epoch": 106} {"train_loss": -6.455085754394531, "global_step": 17831, "epoch": 106} {"train_loss": -6.587434768676758, "global_step": 17832, "epoch": 106} {"train_loss": -6.46791410446167, "global_step": 17833, "epoch": 106} {"train_loss": -6.670308589935303, "global_step": 17834, "epoch": 106} {"train_loss": -6.524232864379883, "global_step": 17835, "epoch": 106} {"train_loss": -6.472174644470215, "global_step": 17836, "epoch": 106} {"train_loss": -6.763596534729004, "global_step": 17837, "epoch": 106} {"train_loss": -6.317299842834473, "global_step": 17838, "epoch": 106} {"train_loss": -6.560187339782715, "global_step": 17839, "epoch": 106} {"train_loss": -6.5708513259887695, "global_step": 17840, "epoch": 106} {"train_loss": -6.512398719787598, "global_step": 17841, "epoch": 106} {"train_loss": -6.486196517944336, "global_step": 17842, "epoch": 106} {"train_loss": -6.648996353149414, "global_step": 17843, "epoch": 106} {"train_loss": -6.670953750610352, "global_step": 17844, "epoch": 106} {"train_loss": -6.1760735511779785, "global_step": 17845, "epoch": 106} {"train_loss": -6.486698150634766, "global_step": 17846, "epoch": 106} {"train_loss": -6.26948356628418, "global_step": 17847, "epoch": 106} {"train_loss": -6.417514801025391, "global_step": 17848, "epoch": 106} {"train_loss": -6.570330619812012, "global_step": 17849, "epoch": 106} {"train_loss": -6.398654460906982, "global_step": 17850, "epoch": 106} {"train_loss": -6.436481475830078, "global_step": 17851, "epoch": 106} {"train_loss": -6.583885192871094, "global_step": 17852, "epoch": 106} {"train_loss": -6.498636722564697, "global_step": 17853, "epoch": 106} {"train_loss": -6.40559196472168, "global_step": 17854, "epoch": 106} {"train_loss": -6.538816452026367, "global_step": 17855, "epoch": 106} {"train_loss": -6.574075698852539, "global_step": 17856, "epoch": 106} {"train_loss": -6.442115783691406, "global_step": 17857, "epoch": 106} {"train_loss": -6.557361602783203, "global_step": 17858, "epoch": 106} {"train_loss": -6.4354472160339355, "global_step": 17859, "epoch": 106} {"train_loss": -6.674839496612549, "global_step": 17860, "epoch": 106} {"train_loss": -6.62196159362793, "global_step": 17861, "epoch": 106} {"train_loss": -6.832918167114258, "global_step": 17862, "epoch": 106} {"train_loss": -6.6094794273376465, "global_step": 17863, "epoch": 106} {"train_loss": -6.6922454833984375, "global_step": 17864, "epoch": 106} {"train_loss": -6.534183502197266, "global_step": 17865, "epoch": 106} {"train_loss": -6.721826553344727, "global_step": 17866, "epoch": 106} {"train_loss": -6.607610702514648, "global_step": 17867, "epoch": 106} {"train_loss": -6.677017688751221, "global_step": 17868, "epoch": 106} {"train_loss": -6.708118915557861, "global_step": 17869, "epoch": 106} {"train_loss": -6.655050754547119, "global_step": 17870, "epoch": 106} {"train_loss": -6.802845001220703, "global_step": 17871, "epoch": 106} {"train_loss": -6.549111843109131, "global_step": 17872, "epoch": 106} {"train_loss": -6.577016353607178, "global_step": 17873, "epoch": 106} {"train_loss": -6.721583366394043, "global_step": 17874, "epoch": 106} {"train_loss": -6.379395484924316, "global_step": 17875, "epoch": 106} {"train_loss": -6.722115516662598, "global_step": 17876, "epoch": 106} {"train_loss": -6.6303911209106445, "global_step": 17877, "epoch": 106} {"train_loss": -6.75662899017334, "global_step": 17878, "epoch": 106} {"train_loss": -6.7717132568359375, "global_step": 17879, "epoch": 106} {"train_loss": -6.925978660583496, "global_step": 17880, "epoch": 106} {"train_loss": -6.260225296020508, "global_step": 17881, "epoch": 106} {"train_loss": -6.67064905166626, "global_step": 17882, "epoch": 106} {"train_loss": -6.634884834289551, "global_step": 17883, "epoch": 106} {"train_loss": -6.867142200469971, "global_step": 17884, "epoch": 106} {"train_loss": -6.591815948486328, "global_step": 17885, "epoch": 106} {"train_loss": -6.963351249694824, "global_step": 17886, "epoch": 106} {"train_loss": -6.5397186279296875, "global_step": 17887, "epoch": 106} {"train_loss": -6.296762466430664, "global_step": 17888, "epoch": 106} {"train_loss": -6.785795211791992, "global_step": 17889, "epoch": 106} {"train_loss": -6.590576648712158, "global_step": 17890, "epoch": 106} {"train_loss": -6.662903785705566, "global_step": 17891, "epoch": 106} {"train_loss": -6.196969509124756, "global_step": 17892, "epoch": 106} {"train_loss": -6.347021102905273, "global_step": 17893, "epoch": 106} {"train_loss": -6.616692543029785, "global_step": 17894, "epoch": 106} {"train_loss": -6.737278461456299, "global_step": 17895, "epoch": 106} {"train_loss": -6.596596717834473, "global_step": 17896, "epoch": 106} {"train_loss": -6.612256050109863, "global_step": 17897, "epoch": 106} {"train_loss": -6.577587604522705, "global_step": 17898, "epoch": 106} {"train_loss": -6.746403217315674, "global_step": 17899, "epoch": 106} {"train_loss": -6.615292549133301, "global_step": 17900, "epoch": 106} {"train_loss": -6.616604804992676, "global_step": 17901, "epoch": 106} {"train_loss": -6.888577461242676, "global_step": 17902, "epoch": 106} {"train_loss": -6.479888916015625, "global_step": 17903, "epoch": 106} {"train_loss": -6.371335506439209, "global_step": 17904, "epoch": 106} {"train_loss": -6.449254989624023, "global_step": 17905, "epoch": 106} {"train_loss": -6.674837589263916, "global_step": 17906, "epoch": 106} {"train_loss": -6.513616561889648, "global_step": 17907, "epoch": 106} {"train_loss": -6.442909240722656, "global_step": 17908, "epoch": 106} {"train_loss": -6.433279514312744, "global_step": 17909, "epoch": 106} {"train_loss": -6.5051188468933105, "global_step": 17910, "epoch": 106} {"train_loss": -6.59307861328125, "global_step": 17911, "epoch": 106} {"train_loss": -6.770328521728516, "global_step": 17912, "epoch": 106} {"train_loss": -6.527931213378906, "global_step": 17913, "epoch": 106} {"train_loss": -6.719229221343994, "global_step": 17914, "epoch": 106} {"train_loss": -6.633339881896973, "global_step": 17915, "epoch": 106} {"train_loss": -6.605979919433594, "global_step": 17916, "epoch": 106} {"train_loss": -6.694863319396973, "global_step": 17917, "epoch": 106} {"train_loss": -6.671327590942383, "global_step": 17918, "epoch": 106} {"train_loss": -6.557134628295898, "global_step": 17919, "epoch": 106} {"train_loss": -6.4842448234558105, "global_step": 17920, "epoch": 106} {"train_loss": -6.7505083084106445, "global_step": 17921, "epoch": 106} {"train_loss": -6.785386562347412, "global_step": 17922, "epoch": 106} {"train_loss": -6.786514759063721, "global_step": 17923, "epoch": 106} {"train_loss": -6.44051456451416, "global_step": 17924, "epoch": 106} {"train_loss": -6.650505542755127, "global_step": 17925, "epoch": 106} {"train_loss": -6.233088970184326, "global_step": 17926, "epoch": 106} {"train_loss": -6.72233772277832, "global_step": 17927, "epoch": 106} {"train_loss": -6.47719144821167, "global_step": 17928, "epoch": 106} {"train_loss": -6.530234336853027, "global_step": 17929, "epoch": 106} {"train_loss": -6.525422096252441, "global_step": 17930, "epoch": 106} {"train_loss": -6.640450954437256, "global_step": 17931, "epoch": 106} {"train_loss": -6.8607635498046875, "global_step": 17932, "epoch": 106} {"train_loss": -6.632542610168457, "global_step": 17933, "epoch": 106} {"train_loss": -6.824014663696289, "global_step": 17934, "epoch": 106} {"train_loss": -6.746999263763428, "global_step": 17935, "epoch": 106} {"train_loss": -6.778435707092285, "global_step": 17936, "epoch": 106} {"train_loss": -6.403785705566406, "global_step": 17937, "epoch": 106} {"train_loss": -6.6002607345581055, "global_step": 17938, "epoch": 106} {"train_loss": -6.552183151245117, "global_step": 17939, "epoch": 106} {"train_loss": -6.808249473571777, "global_step": 17940, "epoch": 106} {"train_loss": -6.770055294036865, "global_step": 17941, "epoch": 106} {"train_loss": -6.852928638458252, "global_step": 17942, "epoch": 106} {"train_loss": -6.7069549560546875, "global_step": 17943, "epoch": 106} {"train_loss": -6.702205657958984, "global_step": 17944, "epoch": 106} {"train_loss": -6.6429595947265625, "global_step": 17945, "epoch": 106} {"train_loss": -6.714015007019043, "global_step": 17946, "epoch": 106} {"train_loss": -6.615265846252441, "global_step": 17947, "epoch": 106} {"train_loss": -6.7765021324157715, "global_step": 17948, "epoch": 106} {"train_loss": -6.677242755889893, "global_step": 17949, "epoch": 106} {"train_loss": -6.659754276275635, "global_step": 17950, "epoch": 106} {"train_loss": -6.588759899139404, "global_step": 17951, "epoch": 106} {"train_loss": -6.873106956481934, "global_step": 17952, "epoch": 106} {"train_loss": -6.8659563064575195, "global_step": 17953, "epoch": 106} {"train_loss": -6.798132419586182, "global_step": 17954, "epoch": 106} {"train_loss": -6.7362542152404785, "global_step": 17955, "epoch": 106} {"train_loss": -6.798323631286621, "global_step": 17956, "epoch": 106} {"train_loss": -6.619260787963867, "global_step": 17957, "epoch": 106} {"train_loss": -6.752843856811523, "global_step": 17958, "epoch": 106} {"train_loss": -6.532423973083496, "global_step": 17959, "epoch": 106} {"train_loss": -6.700362205505371, "global_step": 17960, "epoch": 106} {"train_loss": -6.693270683288574, "global_step": 17961, "epoch": 106} {"train_loss": -6.529850959777832, "global_step": 17962, "epoch": 106} {"train_loss": -6.508866310119629, "global_step": 17963, "epoch": 106} {"train_loss": -6.606639862060547, "global_step": 17964, "epoch": 106} {"train_loss": -6.452446937561035, "global_step": 17965, "epoch": 106} {"train_loss": -6.728137493133545, "global_step": 17966, "epoch": 106} {"train_loss": -6.564229965209961, "global_step": 17967, "epoch": 106} {"train_loss": -6.704555511474609, "global_step": 17968, "epoch": 106} {"train_loss": -6.362151145935059, "global_step": 17969, "epoch": 106} {"train_loss": -6.710229873657227, "global_step": 17970, "epoch": 106} {"train_loss": -6.441666603088379, "global_step": 17971, "epoch": 106} {"train_loss": -6.76003885269165, "global_step": 17972, "epoch": 106} {"train_loss": -6.471292018890381, "global_step": 17973, "epoch": 106} {"train_loss": -6.665148735046387, "global_step": 17974, "epoch": 106} {"train_loss": -6.608703389054253, "global_step": 17975, "epoch": 106, "val_loss": 220899.359375} {"train_loss": -6.321876525878906, "global_step": 17976, "epoch": 107} {"train_loss": -6.510231018066406, "global_step": 17977, "epoch": 107} {"train_loss": -6.345974445343018, "global_step": 17978, "epoch": 107} {"train_loss": -6.462010860443115, "global_step": 17979, "epoch": 107} {"train_loss": -6.131442070007324, "global_step": 17980, "epoch": 107} {"train_loss": -6.468592166900635, "global_step": 17981, "epoch": 107} {"train_loss": -6.4583740234375, "global_step": 17982, "epoch": 107} {"train_loss": -6.263816833496094, "global_step": 17983, "epoch": 107} {"train_loss": -6.582080364227295, "global_step": 17984, "epoch": 107} {"train_loss": -6.550412178039551, "global_step": 17985, "epoch": 107} {"train_loss": -6.339730262756348, "global_step": 17986, "epoch": 107} {"train_loss": -6.440264701843262, "global_step": 17987, "epoch": 107} {"train_loss": -6.499048709869385, "global_step": 17988, "epoch": 107} {"train_loss": -6.693734169006348, "global_step": 17989, "epoch": 107} {"train_loss": -6.366156101226807, "global_step": 17990, "epoch": 107} {"train_loss": -6.4870147705078125, "global_step": 17991, "epoch": 107} {"train_loss": -6.721034049987793, "global_step": 17992, "epoch": 107} {"train_loss": -6.536690711975098, "global_step": 17993, "epoch": 107} {"train_loss": -6.638206481933594, "global_step": 17994, "epoch": 107} {"train_loss": -6.571756839752197, "global_step": 17995, "epoch": 107} {"train_loss": -6.536863327026367, "global_step": 17996, "epoch": 107} {"train_loss": -6.732933044433594, "global_step": 17997, "epoch": 107} {"train_loss": -6.721148490905762, "global_step": 17998, "epoch": 107} {"train_loss": -6.704604148864746, "global_step": 17999, "epoch": 107} {"train_loss": -6.8018798828125, "global_step": 18000, "epoch": 107} {"train_loss": -6.360395431518555, "global_step": 18001, "epoch": 107} {"train_loss": -6.6378560066223145, "global_step": 18002, "epoch": 107} {"train_loss": -6.5847930908203125, "global_step": 18003, "epoch": 107} {"train_loss": -6.63185453414917, "global_step": 18004, "epoch": 107} {"train_loss": -6.487915992736816, "global_step": 18005, "epoch": 107} {"train_loss": -6.199950218200684, "global_step": 18006, "epoch": 107} {"train_loss": -6.830012321472168, "global_step": 18007, "epoch": 107} {"train_loss": -6.457162857055664, "global_step": 18008, "epoch": 107} {"train_loss": -6.710690498352051, "global_step": 18009, "epoch": 107} {"train_loss": -6.607513427734375, "global_step": 18010, "epoch": 107} {"train_loss": -6.4919281005859375, "global_step": 18011, "epoch": 107} {"train_loss": -6.787059783935547, "global_step": 18012, "epoch": 107} {"train_loss": -6.594554901123047, "global_step": 18013, "epoch": 107} {"train_loss": -6.527779579162598, "global_step": 18014, "epoch": 107} {"train_loss": -6.458461284637451, "global_step": 18015, "epoch": 107} {"train_loss": -6.620553970336914, "global_step": 18016, "epoch": 107} {"train_loss": -6.337564468383789, "global_step": 18017, "epoch": 107} {"train_loss": -6.6716694831848145, "global_step": 18018, "epoch": 107} {"train_loss": -6.551261901855469, "global_step": 18019, "epoch": 107} {"train_loss": -6.790769577026367, "global_step": 18020, "epoch": 107} {"train_loss": -6.520957946777344, "global_step": 18021, "epoch": 107} {"train_loss": -6.65341854095459, "global_step": 18022, "epoch": 107} {"train_loss": -6.522225379943848, "global_step": 18023, "epoch": 107} {"train_loss": -6.597509384155273, "global_step": 18024, "epoch": 107} {"train_loss": -6.889883995056152, "global_step": 18025, "epoch": 107} {"train_loss": -6.299722671508789, "global_step": 18026, "epoch": 107} {"train_loss": -6.604593276977539, "global_step": 18027, "epoch": 107} {"train_loss": -6.636206150054932, "global_step": 18028, "epoch": 107} {"train_loss": -6.656954765319824, "global_step": 18029, "epoch": 107} {"train_loss": -6.411842346191406, "global_step": 18030, "epoch": 107} {"train_loss": -6.609291076660156, "global_step": 18031, "epoch": 107} {"train_loss": -6.600505828857422, "global_step": 18032, "epoch": 107} {"train_loss": -6.582561492919922, "global_step": 18033, "epoch": 107} {"train_loss": -6.590323448181152, "global_step": 18034, "epoch": 107} {"train_loss": -6.44989538192749, "global_step": 18035, "epoch": 107} {"train_loss": -6.668095588684082, "global_step": 18036, "epoch": 107} {"train_loss": -6.667507171630859, "global_step": 18037, "epoch": 107} {"train_loss": -6.716860771179199, "global_step": 18038, "epoch": 107} {"train_loss": -6.662890434265137, "global_step": 18039, "epoch": 107} {"train_loss": -6.248603820800781, "global_step": 18040, "epoch": 107} {"train_loss": -6.552206993103027, "global_step": 18041, "epoch": 107} {"train_loss": -6.3404412269592285, "global_step": 18042, "epoch": 107} {"train_loss": -6.382008075714111, "global_step": 18043, "epoch": 107} {"train_loss": -6.388245582580566, "global_step": 18044, "epoch": 107} {"train_loss": -6.371040344238281, "global_step": 18045, "epoch": 107} {"train_loss": -6.549606800079346, "global_step": 18046, "epoch": 107} {"train_loss": -6.191989898681641, "global_step": 18047, "epoch": 107} {"train_loss": -6.672271251678467, "global_step": 18048, "epoch": 107} {"train_loss": -6.759963035583496, "global_step": 18049, "epoch": 107} {"train_loss": -6.393477439880371, "global_step": 18050, "epoch": 107} {"train_loss": -6.280043125152588, "global_step": 18051, "epoch": 107} {"train_loss": -6.571768760681152, "global_step": 18052, "epoch": 107} {"train_loss": -6.42179012298584, "global_step": 18053, "epoch": 107} {"train_loss": -6.6357316970825195, "global_step": 18054, "epoch": 107} {"train_loss": -6.626771926879883, "global_step": 18055, "epoch": 107} {"train_loss": -6.613280773162842, "global_step": 18056, "epoch": 107} {"train_loss": -6.602245807647705, "global_step": 18057, "epoch": 107} {"train_loss": -6.75405216217041, "global_step": 18058, "epoch": 107} {"train_loss": -6.6912455558776855, "global_step": 18059, "epoch": 107} {"train_loss": -6.644606590270996, "global_step": 18060, "epoch": 107} {"train_loss": -6.462806701660156, "global_step": 18061, "epoch": 107} {"train_loss": -6.94367790222168, "global_step": 18062, "epoch": 107} {"train_loss": -6.917982578277588, "global_step": 18063, "epoch": 107} {"train_loss": -6.738132476806641, "global_step": 18064, "epoch": 107} {"train_loss": -6.8968892097473145, "global_step": 18065, "epoch": 107} {"train_loss": -6.425719261169434, "global_step": 18066, "epoch": 107} {"train_loss": -6.627039909362793, "global_step": 18067, "epoch": 107} {"train_loss": -6.491398334503174, "global_step": 18068, "epoch": 107} {"train_loss": -6.574919700622559, "global_step": 18069, "epoch": 107} {"train_loss": -6.469597816467285, "global_step": 18070, "epoch": 107} {"train_loss": -6.671623229980469, "global_step": 18071, "epoch": 107} {"train_loss": -6.457921981811523, "global_step": 18072, "epoch": 107} {"train_loss": -6.283108711242676, "global_step": 18073, "epoch": 107} {"train_loss": -6.519996643066406, "global_step": 18074, "epoch": 107} {"train_loss": -6.585000038146973, "global_step": 18075, "epoch": 107} {"train_loss": -6.4837236404418945, "global_step": 18076, "epoch": 107} {"train_loss": -6.781621932983398, "global_step": 18077, "epoch": 107} {"train_loss": -6.905010223388672, "global_step": 18078, "epoch": 107} {"train_loss": -6.574019432067871, "global_step": 18079, "epoch": 107} {"train_loss": -6.834025859832764, "global_step": 18080, "epoch": 107} {"train_loss": -6.610593318939209, "global_step": 18081, "epoch": 107} {"train_loss": -6.806602478027344, "global_step": 18082, "epoch": 107} {"train_loss": -6.585419654846191, "global_step": 18083, "epoch": 107} {"train_loss": -6.521127223968506, "global_step": 18084, "epoch": 107} {"train_loss": -6.562530040740967, "global_step": 18085, "epoch": 107} {"train_loss": -6.540146827697754, "global_step": 18086, "epoch": 107} {"train_loss": -6.5128397941589355, "global_step": 18087, "epoch": 107} {"train_loss": -6.67262077331543, "global_step": 18088, "epoch": 107} {"train_loss": -6.746710777282715, "global_step": 18089, "epoch": 107} {"train_loss": -6.862215995788574, "global_step": 18090, "epoch": 107} {"train_loss": -6.470989227294922, "global_step": 18091, "epoch": 107} {"train_loss": -6.610620021820068, "global_step": 18092, "epoch": 107} {"train_loss": -6.392569541931152, "global_step": 18093, "epoch": 107} {"train_loss": -6.762213706970215, "global_step": 18094, "epoch": 107} {"train_loss": -6.578534126281738, "global_step": 18095, "epoch": 107} {"train_loss": -6.799189567565918, "global_step": 18096, "epoch": 107} {"train_loss": -6.723626613616943, "global_step": 18097, "epoch": 107} {"train_loss": -6.5608062744140625, "global_step": 18098, "epoch": 107} {"train_loss": -6.620633125305176, "global_step": 18099, "epoch": 107} {"train_loss": -6.7832417488098145, "global_step": 18100, "epoch": 107} {"train_loss": -6.757753372192383, "global_step": 18101, "epoch": 107} {"train_loss": -6.756657600402832, "global_step": 18102, "epoch": 107} {"train_loss": -6.548751354217529, "global_step": 18103, "epoch": 107} {"train_loss": -6.786466121673584, "global_step": 18104, "epoch": 107} {"train_loss": -6.834310531616211, "global_step": 18105, "epoch": 107} {"train_loss": -6.997929573059082, "global_step": 18106, "epoch": 107} {"train_loss": -6.716444492340088, "global_step": 18107, "epoch": 107} {"train_loss": -6.653506278991699, "global_step": 18108, "epoch": 107} {"train_loss": -6.814382076263428, "global_step": 18109, "epoch": 107} {"train_loss": -6.644797325134277, "global_step": 18110, "epoch": 107} {"train_loss": -6.698995590209961, "global_step": 18111, "epoch": 107} {"train_loss": -6.779526710510254, "global_step": 18112, "epoch": 107} {"train_loss": -6.781093120574951, "global_step": 18113, "epoch": 107} {"train_loss": -6.984469413757324, "global_step": 18114, "epoch": 107} {"train_loss": -6.712522029876709, "global_step": 18115, "epoch": 107} {"train_loss": -6.726593971252441, "global_step": 18116, "epoch": 107} {"train_loss": -6.823897838592529, "global_step": 18117, "epoch": 107} {"train_loss": -6.626412868499756, "global_step": 18118, "epoch": 107} {"train_loss": -6.778545379638672, "global_step": 18119, "epoch": 107} {"train_loss": -6.472765922546387, "global_step": 18120, "epoch": 107} {"train_loss": -6.855225086212158, "global_step": 18121, "epoch": 107} {"train_loss": -6.474750995635986, "global_step": 18122, "epoch": 107} {"train_loss": -6.442525386810303, "global_step": 18123, "epoch": 107} {"train_loss": -6.722052097320557, "global_step": 18124, "epoch": 107} {"train_loss": -6.71015739440918, "global_step": 18125, "epoch": 107} {"train_loss": -6.6751604080200195, "global_step": 18126, "epoch": 107} {"train_loss": -6.522871971130371, "global_step": 18127, "epoch": 107} {"train_loss": -6.849812984466553, "global_step": 18128, "epoch": 107} {"train_loss": -6.66315221786499, "global_step": 18129, "epoch": 107} {"train_loss": -6.364239692687988, "global_step": 18130, "epoch": 107} {"train_loss": -6.8635711669921875, "global_step": 18131, "epoch": 107} {"train_loss": -6.389226913452148, "global_step": 18132, "epoch": 107} {"train_loss": -6.528780937194824, "global_step": 18133, "epoch": 107} {"train_loss": -6.52879524230957, "global_step": 18134, "epoch": 107} {"train_loss": -6.549750804901123, "global_step": 18135, "epoch": 107} {"train_loss": -6.793302536010742, "global_step": 18136, "epoch": 107} {"train_loss": -6.442890644073486, "global_step": 18137, "epoch": 107} {"train_loss": -6.669497966766357, "global_step": 18138, "epoch": 107} {"train_loss": -6.586978435516357, "global_step": 18139, "epoch": 107} {"train_loss": -6.665467262268066, "global_step": 18140, "epoch": 107} {"train_loss": -6.627719879150391, "global_step": 18141, "epoch": 107} {"train_loss": -6.486446380615234, "global_step": 18142, "epoch": 107} {"train_loss": -6.596503709043775, "global_step": 18143, "epoch": 107, "val_loss": 228050.8125} {"train_loss": -6.511710166931152, "global_step": 18144, "epoch": 108} {"train_loss": -6.264235973358154, "global_step": 18145, "epoch": 108} {"train_loss": -6.7100348472595215, "global_step": 18146, "epoch": 108} {"train_loss": -6.437460899353027, "global_step": 18147, "epoch": 108} {"train_loss": -6.732270240783691, "global_step": 18148, "epoch": 108} {"train_loss": -6.721397399902344, "global_step": 18149, "epoch": 108} {"train_loss": -6.563999176025391, "global_step": 18150, "epoch": 108} {"train_loss": -6.685129165649414, "global_step": 18151, "epoch": 108} {"train_loss": -6.763017654418945, "global_step": 18152, "epoch": 108} {"train_loss": -6.514893531799316, "global_step": 18153, "epoch": 108} {"train_loss": -6.668432712554932, "global_step": 18154, "epoch": 108} {"train_loss": -6.956439971923828, "global_step": 18155, "epoch": 108} {"train_loss": -6.420426368713379, "global_step": 18156, "epoch": 108} {"train_loss": -6.747566223144531, "global_step": 18157, "epoch": 108} {"train_loss": -6.702879905700684, "global_step": 18158, "epoch": 108} {"train_loss": -6.721643447875977, "global_step": 18159, "epoch": 108} {"train_loss": -6.771572113037109, "global_step": 18160, "epoch": 108} {"train_loss": -6.684009552001953, "global_step": 18161, "epoch": 108} {"train_loss": -6.9554619789123535, "global_step": 18162, "epoch": 108} {"train_loss": -6.714511871337891, "global_step": 18163, "epoch": 108} {"train_loss": -6.663957595825195, "global_step": 18164, "epoch": 108} {"train_loss": -6.8272809982299805, "global_step": 18165, "epoch": 108} {"train_loss": -6.825446605682373, "global_step": 18166, "epoch": 108} {"train_loss": -6.753815174102783, "global_step": 18167, "epoch": 108} {"train_loss": -6.7595624923706055, "global_step": 18168, "epoch": 108} {"train_loss": -6.679429054260254, "global_step": 18169, "epoch": 108} {"train_loss": -6.31494140625, "global_step": 18170, "epoch": 108} {"train_loss": -6.658537864685059, "global_step": 18171, "epoch": 108} {"train_loss": -6.545136451721191, "global_step": 18172, "epoch": 108} {"train_loss": -6.421730041503906, "global_step": 18173, "epoch": 108} {"train_loss": -6.607885360717773, "global_step": 18174, "epoch": 108} {"train_loss": -6.4341535568237305, "global_step": 18175, "epoch": 108} {"train_loss": -6.409125328063965, "global_step": 18176, "epoch": 108} {"train_loss": -6.413775444030762, "global_step": 18177, "epoch": 108} {"train_loss": -6.320714950561523, "global_step": 18178, "epoch": 108} {"train_loss": -6.408024787902832, "global_step": 18179, "epoch": 108} {"train_loss": -6.427372932434082, "global_step": 18180, "epoch": 108} {"train_loss": -6.520620346069336, "global_step": 18181, "epoch": 108} {"train_loss": -6.2862772941589355, "global_step": 18182, "epoch": 108} {"train_loss": -6.600337028503418, "global_step": 18183, "epoch": 108} {"train_loss": -6.285140037536621, "global_step": 18184, "epoch": 108} {"train_loss": -6.532889366149902, "global_step": 18185, "epoch": 108} {"train_loss": -6.690219879150391, "global_step": 18186, "epoch": 108} {"train_loss": -6.600237846374512, "global_step": 18187, "epoch": 108} {"train_loss": -6.453492164611816, "global_step": 18188, "epoch": 108} {"train_loss": -6.571510314941406, "global_step": 18189, "epoch": 108} {"train_loss": -6.531435966491699, "global_step": 18190, "epoch": 108} {"train_loss": -6.694736480712891, "global_step": 18191, "epoch": 108} {"train_loss": -6.559896469116211, "global_step": 18192, "epoch": 108} {"train_loss": -6.734521865844727, "global_step": 18193, "epoch": 108} {"train_loss": -6.452922821044922, "global_step": 18194, "epoch": 108} {"train_loss": -6.567334175109863, "global_step": 18195, "epoch": 108} {"train_loss": -6.646579742431641, "global_step": 18196, "epoch": 108} {"train_loss": -6.676630973815918, "global_step": 18197, "epoch": 108} {"train_loss": -6.396339416503906, "global_step": 18198, "epoch": 108} {"train_loss": -6.640454292297363, "global_step": 18199, "epoch": 108} {"train_loss": -6.64670467376709, "global_step": 18200, "epoch": 108} {"train_loss": -6.743045806884766, "global_step": 18201, "epoch": 108} {"train_loss": -6.782650947570801, "global_step": 18202, "epoch": 108} {"train_loss": -6.718053817749023, "global_step": 18203, "epoch": 108} {"train_loss": -6.854957103729248, "global_step": 18204, "epoch": 108} {"train_loss": -6.607725143432617, "global_step": 18205, "epoch": 108} {"train_loss": -6.834923267364502, "global_step": 18206, "epoch": 108} {"train_loss": -6.787073612213135, "global_step": 18207, "epoch": 108} {"train_loss": -6.897028923034668, "global_step": 18208, "epoch": 108} {"train_loss": -6.7459330558776855, "global_step": 18209, "epoch": 108} {"train_loss": -6.764057159423828, "global_step": 18210, "epoch": 108} {"train_loss": -6.895517349243164, "global_step": 18211, "epoch": 108} {"train_loss": -6.664357662200928, "global_step": 18212, "epoch": 108} {"train_loss": -6.550996780395508, "global_step": 18213, "epoch": 108} {"train_loss": -6.598696231842041, "global_step": 18214, "epoch": 108} {"train_loss": -6.743533134460449, "global_step": 18215, "epoch": 108} {"train_loss": -6.769444465637207, "global_step": 18216, "epoch": 108} {"train_loss": -6.693920612335205, "global_step": 18217, "epoch": 108} {"train_loss": -6.652666091918945, "global_step": 18218, "epoch": 108} {"train_loss": -6.750182151794434, "global_step": 18219, "epoch": 108} {"train_loss": -6.68274450302124, "global_step": 18220, "epoch": 108} {"train_loss": -6.694498538970947, "global_step": 18221, "epoch": 108} {"train_loss": -6.699106216430664, "global_step": 18222, "epoch": 108} {"train_loss": -6.849837779998779, "global_step": 18223, "epoch": 108} {"train_loss": -6.5276007652282715, "global_step": 18224, "epoch": 108} {"train_loss": -6.593429088592529, "global_step": 18225, "epoch": 108} {"train_loss": -6.578350067138672, "global_step": 18226, "epoch": 108} {"train_loss": -6.794187545776367, "global_step": 18227, "epoch": 108} {"train_loss": -6.871357440948486, "global_step": 18228, "epoch": 108} {"train_loss": -6.681361198425293, "global_step": 18229, "epoch": 108} {"train_loss": -6.622068405151367, "global_step": 18230, "epoch": 108} {"train_loss": -6.3810224533081055, "global_step": 18231, "epoch": 108} {"train_loss": -6.870280742645264, "global_step": 18232, "epoch": 108} {"train_loss": -6.634657382965088, "global_step": 18233, "epoch": 108} {"train_loss": -6.480154037475586, "global_step": 18234, "epoch": 108} {"train_loss": -6.745566368103027, "global_step": 18235, "epoch": 108} {"train_loss": -6.895144462585449, "global_step": 18236, "epoch": 108} {"train_loss": -6.806859016418457, "global_step": 18237, "epoch": 108} {"train_loss": -6.735459327697754, "global_step": 18238, "epoch": 108} {"train_loss": -6.294278144836426, "global_step": 18239, "epoch": 108} {"train_loss": -6.760890960693359, "global_step": 18240, "epoch": 108} {"train_loss": -6.439592361450195, "global_step": 18241, "epoch": 108} {"train_loss": -6.522181510925293, "global_step": 18242, "epoch": 108} {"train_loss": -6.575871467590332, "global_step": 18243, "epoch": 108} {"train_loss": -6.455384254455566, "global_step": 18244, "epoch": 108} {"train_loss": -6.873860836029053, "global_step": 18245, "epoch": 108} {"train_loss": -6.350320816040039, "global_step": 18246, "epoch": 108} {"train_loss": -6.646988868713379, "global_step": 18247, "epoch": 108} {"train_loss": -6.708003997802734, "global_step": 18248, "epoch": 108} {"train_loss": -6.028059959411621, "global_step": 18249, "epoch": 108} {"train_loss": -6.715948104858398, "global_step": 18250, "epoch": 108} {"train_loss": -6.4131269454956055, "global_step": 18251, "epoch": 108} {"train_loss": -6.537713527679443, "global_step": 18252, "epoch": 108} {"train_loss": -6.436767578125, "global_step": 18253, "epoch": 108} {"train_loss": -6.299690246582031, "global_step": 18254, "epoch": 108} {"train_loss": -6.869577407836914, "global_step": 18255, "epoch": 108} {"train_loss": -6.9450483322143555, "global_step": 18256, "epoch": 108} {"train_loss": -6.586772918701172, "global_step": 18257, "epoch": 108} {"train_loss": -6.4879655838012695, "global_step": 18258, "epoch": 108} {"train_loss": -6.759160995483398, "global_step": 18259, "epoch": 108} {"train_loss": -6.658764839172363, "global_step": 18260, "epoch": 108} {"train_loss": -6.867841720581055, "global_step": 18261, "epoch": 108} {"train_loss": -6.865500450134277, "global_step": 18262, "epoch": 108} {"train_loss": -6.8229827880859375, "global_step": 18263, "epoch": 108} {"train_loss": -6.765824317932129, "global_step": 18264, "epoch": 108} {"train_loss": -6.727427959442139, "global_step": 18265, "epoch": 108} {"train_loss": -6.580082893371582, "global_step": 18266, "epoch": 108} {"train_loss": -6.722302436828613, "global_step": 18267, "epoch": 108} {"train_loss": -6.688932418823242, "global_step": 18268, "epoch": 108} {"train_loss": -6.593280792236328, "global_step": 18269, "epoch": 108} {"train_loss": -6.440536022186279, "global_step": 18270, "epoch": 108} {"train_loss": -6.929093360900879, "global_step": 18271, "epoch": 108} {"train_loss": -6.5418548583984375, "global_step": 18272, "epoch": 108} {"train_loss": -6.9165825843811035, "global_step": 18273, "epoch": 108} {"train_loss": -6.637598037719727, "global_step": 18274, "epoch": 108} {"train_loss": -6.676324844360352, "global_step": 18275, "epoch": 108} {"train_loss": -6.734746932983398, "global_step": 18276, "epoch": 108} {"train_loss": -6.477606296539307, "global_step": 18277, "epoch": 108} {"train_loss": -6.830238342285156, "global_step": 18278, "epoch": 108} {"train_loss": -6.315815448760986, "global_step": 18279, "epoch": 108} {"train_loss": -6.685610771179199, "global_step": 18280, "epoch": 108} {"train_loss": -6.744121551513672, "global_step": 18281, "epoch": 108} {"train_loss": -6.555074691772461, "global_step": 18282, "epoch": 108} {"train_loss": -6.678470611572266, "global_step": 18283, "epoch": 108} {"train_loss": -6.368074417114258, "global_step": 18284, "epoch": 108} {"train_loss": -6.726925373077393, "global_step": 18285, "epoch": 108} {"train_loss": -6.45857048034668, "global_step": 18286, "epoch": 108} {"train_loss": -6.594856262207031, "global_step": 18287, "epoch": 108} {"train_loss": -6.676461219787598, "global_step": 18288, "epoch": 108} {"train_loss": -6.619080066680908, "global_step": 18289, "epoch": 108} {"train_loss": -6.669749736785889, "global_step": 18290, "epoch": 108} {"train_loss": -6.612250328063965, "global_step": 18291, "epoch": 108} {"train_loss": -6.697404384613037, "global_step": 18292, "epoch": 108} {"train_loss": -6.712112903594971, "global_step": 18293, "epoch": 108} {"train_loss": -6.524375915527344, "global_step": 18294, "epoch": 108} {"train_loss": -6.613481521606445, "global_step": 18295, "epoch": 108} {"train_loss": -6.71353006362915, "global_step": 18296, "epoch": 108} {"train_loss": -6.886630058288574, "global_step": 18297, "epoch": 108} {"train_loss": -6.611889362335205, "global_step": 18298, "epoch": 108} {"train_loss": -6.697602272033691, "global_step": 18299, "epoch": 108} {"train_loss": -6.713558673858643, "global_step": 18300, "epoch": 108} {"train_loss": -6.977032661437988, "global_step": 18301, "epoch": 108} {"train_loss": -6.61799430847168, "global_step": 18302, "epoch": 108} {"train_loss": -6.764312744140625, "global_step": 18303, "epoch": 108} {"train_loss": -6.802749156951904, "global_step": 18304, "epoch": 108} {"train_loss": -6.799818992614746, "global_step": 18305, "epoch": 108} {"train_loss": -6.578669548034668, "global_step": 18306, "epoch": 108} {"train_loss": -6.829949378967285, "global_step": 18307, "epoch": 108} {"train_loss": -6.795263290405273, "global_step": 18308, "epoch": 108} {"train_loss": -6.996397972106934, "global_step": 18309, "epoch": 108} {"train_loss": -6.594246864318848, "global_step": 18310, "epoch": 108} {"train_loss": -6.64521743002392, "global_step": 18311, "epoch": 108, "val_loss": 224276.765625} {"train_loss": -6.571238040924072, "global_step": 18312, "epoch": 109} {"train_loss": -6.616937637329102, "global_step": 18313, "epoch": 109} {"train_loss": -6.65013313293457, "global_step": 18314, "epoch": 109} {"train_loss": -6.7643537521362305, "global_step": 18315, "epoch": 109} {"train_loss": -6.556743621826172, "global_step": 18316, "epoch": 109} {"train_loss": -6.778628349304199, "global_step": 18317, "epoch": 109} {"train_loss": -6.587101936340332, "global_step": 18318, "epoch": 109} {"train_loss": -6.663779258728027, "global_step": 18319, "epoch": 109} {"train_loss": -6.7347564697265625, "global_step": 18320, "epoch": 109} {"train_loss": -6.830783843994141, "global_step": 18321, "epoch": 109} {"train_loss": -6.50925350189209, "global_step": 18322, "epoch": 109} {"train_loss": -6.72618293762207, "global_step": 18323, "epoch": 109} {"train_loss": -6.7912211418151855, "global_step": 18324, "epoch": 109} {"train_loss": -6.673925399780273, "global_step": 18325, "epoch": 109} {"train_loss": -6.534339904785156, "global_step": 18326, "epoch": 109} {"train_loss": -6.773500442504883, "global_step": 18327, "epoch": 109} {"train_loss": -6.601900100708008, "global_step": 18328, "epoch": 109} {"train_loss": -6.767534255981445, "global_step": 18329, "epoch": 109} {"train_loss": -6.674215793609619, "global_step": 18330, "epoch": 109} {"train_loss": -6.676229953765869, "global_step": 18331, "epoch": 109} {"train_loss": -6.849514961242676, "global_step": 18332, "epoch": 109} {"train_loss": -6.5130720138549805, "global_step": 18333, "epoch": 109} {"train_loss": -6.774961471557617, "global_step": 18334, "epoch": 109} {"train_loss": -6.903348922729492, "global_step": 18335, "epoch": 109} {"train_loss": -6.690749168395996, "global_step": 18336, "epoch": 109} {"train_loss": -6.690469741821289, "global_step": 18337, "epoch": 109} {"train_loss": -6.706664562225342, "global_step": 18338, "epoch": 109} {"train_loss": -6.727277755737305, "global_step": 18339, "epoch": 109} {"train_loss": -6.748015403747559, "global_step": 18340, "epoch": 109} {"train_loss": -6.704273223876953, "global_step": 18341, "epoch": 109} {"train_loss": -6.804815292358398, "global_step": 18342, "epoch": 109} {"train_loss": -6.863921165466309, "global_step": 18343, "epoch": 109} {"train_loss": -6.822378635406494, "global_step": 18344, "epoch": 109} {"train_loss": -6.977841377258301, "global_step": 18345, "epoch": 109} {"train_loss": -6.633912086486816, "global_step": 18346, "epoch": 109} {"train_loss": -6.833739280700684, "global_step": 18347, "epoch": 109} {"train_loss": -6.570565700531006, "global_step": 18348, "epoch": 109} {"train_loss": -6.296222686767578, "global_step": 18349, "epoch": 109} {"train_loss": -6.760400772094727, "global_step": 18350, "epoch": 109} {"train_loss": -6.235900402069092, "global_step": 18351, "epoch": 109} {"train_loss": -6.117883682250977, "global_step": 18352, "epoch": 109} {"train_loss": -6.591728210449219, "global_step": 18353, "epoch": 109} {"train_loss": -6.606497764587402, "global_step": 18354, "epoch": 109} {"train_loss": -6.473842620849609, "global_step": 18355, "epoch": 109} {"train_loss": -6.46344518661499, "global_step": 18356, "epoch": 109} {"train_loss": -6.581553936004639, "global_step": 18357, "epoch": 109} {"train_loss": -6.401360988616943, "global_step": 18358, "epoch": 109} {"train_loss": -6.539405822753906, "global_step": 18359, "epoch": 109} {"train_loss": -6.542133331298828, "global_step": 18360, "epoch": 109} {"train_loss": -6.4752197265625, "global_step": 18361, "epoch": 109} {"train_loss": -6.4995856285095215, "global_step": 18362, "epoch": 109} {"train_loss": -6.785284042358398, "global_step": 18363, "epoch": 109} {"train_loss": -6.582729339599609, "global_step": 18364, "epoch": 109} {"train_loss": -6.579266548156738, "global_step": 18365, "epoch": 109} {"train_loss": -6.535798072814941, "global_step": 18366, "epoch": 109} {"train_loss": -6.67970085144043, "global_step": 18367, "epoch": 109} {"train_loss": -6.705814838409424, "global_step": 18368, "epoch": 109} {"train_loss": -6.669942855834961, "global_step": 18369, "epoch": 109} {"train_loss": -6.795017719268799, "global_step": 18370, "epoch": 109} {"train_loss": -6.829635143280029, "global_step": 18371, "epoch": 109} {"train_loss": -6.8051958084106445, "global_step": 18372, "epoch": 109} {"train_loss": -6.648130416870117, "global_step": 18373, "epoch": 109} {"train_loss": -6.628203392028809, "global_step": 18374, "epoch": 109} {"train_loss": -6.680906772613525, "global_step": 18375, "epoch": 109} {"train_loss": -6.648063659667969, "global_step": 18376, "epoch": 109} {"train_loss": -6.622998237609863, "global_step": 18377, "epoch": 109} {"train_loss": -6.685482025146484, "global_step": 18378, "epoch": 109} {"train_loss": -6.747824668884277, "global_step": 18379, "epoch": 109} {"train_loss": -6.79742431640625, "global_step": 18380, "epoch": 109} {"train_loss": -6.728001117706299, "global_step": 18381, "epoch": 109} {"train_loss": -6.58421516418457, "global_step": 18382, "epoch": 109} {"train_loss": -6.6744303703308105, "global_step": 18383, "epoch": 109} {"train_loss": -6.787750244140625, "global_step": 18384, "epoch": 109} {"train_loss": -6.90479850769043, "global_step": 18385, "epoch": 109} {"train_loss": -6.807197570800781, "global_step": 18386, "epoch": 109} {"train_loss": -6.757791519165039, "global_step": 18387, "epoch": 109} {"train_loss": -6.728144645690918, "global_step": 18388, "epoch": 109} {"train_loss": -6.896417617797852, "global_step": 18389, "epoch": 109} {"train_loss": -6.595670223236084, "global_step": 18390, "epoch": 109} {"train_loss": -6.661260604858398, "global_step": 18391, "epoch": 109} {"train_loss": -6.71776008605957, "global_step": 18392, "epoch": 109} {"train_loss": -6.582625389099121, "global_step": 18393, "epoch": 109} {"train_loss": -6.7001142501831055, "global_step": 18394, "epoch": 109} {"train_loss": -6.522853851318359, "global_step": 18395, "epoch": 109} {"train_loss": -6.864671230316162, "global_step": 18396, "epoch": 109} {"train_loss": -7.07100772857666, "global_step": 18397, "epoch": 109} {"train_loss": -6.73651123046875, "global_step": 18398, "epoch": 109} {"train_loss": -6.895547866821289, "global_step": 18399, "epoch": 109} {"train_loss": -6.8077392578125, "global_step": 18400, "epoch": 109} {"train_loss": -6.845211029052734, "global_step": 18401, "epoch": 109} {"train_loss": -6.577261447906494, "global_step": 18402, "epoch": 109} {"train_loss": -6.618721008300781, "global_step": 18403, "epoch": 109} {"train_loss": -6.578046798706055, "global_step": 18404, "epoch": 109} {"train_loss": -6.682671546936035, "global_step": 18405, "epoch": 109} {"train_loss": -6.833552360534668, "global_step": 18406, "epoch": 109} {"train_loss": -6.666525363922119, "global_step": 18407, "epoch": 109} {"train_loss": -6.697076320648193, "global_step": 18408, "epoch": 109} {"train_loss": -6.712800025939941, "global_step": 18409, "epoch": 109} {"train_loss": -6.71265983581543, "global_step": 18410, "epoch": 109} {"train_loss": -6.664225101470947, "global_step": 18411, "epoch": 109} {"train_loss": -6.763212203979492, "global_step": 18412, "epoch": 109} {"train_loss": -6.51579475402832, "global_step": 18413, "epoch": 109} {"train_loss": -6.559471607208252, "global_step": 18414, "epoch": 109} {"train_loss": -6.672905921936035, "global_step": 18415, "epoch": 109} {"train_loss": -6.720887184143066, "global_step": 18416, "epoch": 109} {"train_loss": -6.72243595123291, "global_step": 18417, "epoch": 109} {"train_loss": -6.382753849029541, "global_step": 18418, "epoch": 109} {"train_loss": -6.658395767211914, "global_step": 18419, "epoch": 109} {"train_loss": -6.766546726226807, "global_step": 18420, "epoch": 109} {"train_loss": -6.786291122436523, "global_step": 18421, "epoch": 109} {"train_loss": -6.610304832458496, "global_step": 18422, "epoch": 109} {"train_loss": -6.480616092681885, "global_step": 18423, "epoch": 109} {"train_loss": -6.686612129211426, "global_step": 18424, "epoch": 109} {"train_loss": -6.482622146606445, "global_step": 18425, "epoch": 109} {"train_loss": -6.60668420791626, "global_step": 18426, "epoch": 109} {"train_loss": -6.665959358215332, "global_step": 18427, "epoch": 109} {"train_loss": -6.681354999542236, "global_step": 18428, "epoch": 109} {"train_loss": -6.774995803833008, "global_step": 18429, "epoch": 109} {"train_loss": -6.820256233215332, "global_step": 18430, "epoch": 109} {"train_loss": -6.72846794128418, "global_step": 18431, "epoch": 109} {"train_loss": -6.7816386222839355, "global_step": 18432, "epoch": 109} {"train_loss": -6.582048416137695, "global_step": 18433, "epoch": 109} {"train_loss": -6.831420421600342, "global_step": 18434, "epoch": 109} {"train_loss": -6.8396759033203125, "global_step": 18435, "epoch": 109} {"train_loss": -6.910970687866211, "global_step": 18436, "epoch": 109} {"train_loss": -6.805781841278076, "global_step": 18437, "epoch": 109} {"train_loss": -6.669281959533691, "global_step": 18438, "epoch": 109} {"train_loss": -6.693443298339844, "global_step": 18439, "epoch": 109} {"train_loss": -6.670025825500488, "global_step": 18440, "epoch": 109} {"train_loss": -6.827259063720703, "global_step": 18441, "epoch": 109} {"train_loss": -6.677522659301758, "global_step": 18442, "epoch": 109} {"train_loss": -6.666836261749268, "global_step": 18443, "epoch": 109} {"train_loss": -6.672969818115234, "global_step": 18444, "epoch": 109} {"train_loss": -6.6859130859375, "global_step": 18445, "epoch": 109} {"train_loss": -6.574347972869873, "global_step": 18446, "epoch": 109} {"train_loss": -6.432077407836914, "global_step": 18447, "epoch": 109} {"train_loss": -6.73362922668457, "global_step": 18448, "epoch": 109} {"train_loss": -6.607860565185547, "global_step": 18449, "epoch": 109} {"train_loss": -6.570999622344971, "global_step": 18450, "epoch": 109} {"train_loss": -6.690526962280273, "global_step": 18451, "epoch": 109} {"train_loss": -6.1376471519470215, "global_step": 18452, "epoch": 109} {"train_loss": -6.663725852966309, "global_step": 18453, "epoch": 109} {"train_loss": -6.391438961029053, "global_step": 18454, "epoch": 109} {"train_loss": -6.732006072998047, "global_step": 18455, "epoch": 109} {"train_loss": -6.725486755371094, "global_step": 18456, "epoch": 109} {"train_loss": -6.422724723815918, "global_step": 18457, "epoch": 109} {"train_loss": -6.706530570983887, "global_step": 18458, "epoch": 109} {"train_loss": -6.446592807769775, "global_step": 18459, "epoch": 109} {"train_loss": -6.56625509262085, "global_step": 18460, "epoch": 109} {"train_loss": -6.664405822753906, "global_step": 18461, "epoch": 109} {"train_loss": -6.8652448654174805, "global_step": 18462, "epoch": 109} {"train_loss": -6.631753444671631, "global_step": 18463, "epoch": 109} {"train_loss": -6.681149005889893, "global_step": 18464, "epoch": 109} {"train_loss": -6.589870452880859, "global_step": 18465, "epoch": 109} {"train_loss": -6.649636268615723, "global_step": 18466, "epoch": 109} {"train_loss": -6.622033596038818, "global_step": 18467, "epoch": 109} {"train_loss": -6.702879905700684, "global_step": 18468, "epoch": 109} {"train_loss": -6.7437896728515625, "global_step": 18469, "epoch": 109} {"train_loss": -6.635746002197266, "global_step": 18470, "epoch": 109} {"train_loss": -6.781394004821777, "global_step": 18471, "epoch": 109} {"train_loss": -6.888247489929199, "global_step": 18472, "epoch": 109} {"train_loss": -6.781613349914551, "global_step": 18473, "epoch": 109} {"train_loss": -6.939000129699707, "global_step": 18474, "epoch": 109} {"train_loss": -6.752510070800781, "global_step": 18475, "epoch": 109} {"train_loss": -6.615915298461914, "global_step": 18476, "epoch": 109} {"train_loss": -6.593935012817383, "global_step": 18477, "epoch": 109} {"train_loss": -6.847324371337891, "global_step": 18478, "epoch": 109} {"train_loss": -6.675109318324497, "global_step": 18479, "epoch": 109, "val_loss": 222475.875} {"train_loss": -6.790358066558838, "global_step": 18480, "epoch": 110} {"train_loss": -6.946463108062744, "global_step": 18481, "epoch": 110} {"train_loss": -6.849516868591309, "global_step": 18482, "epoch": 110} {"train_loss": -6.521712779998779, "global_step": 18483, "epoch": 110} {"train_loss": -6.518889427185059, "global_step": 18484, "epoch": 110} {"train_loss": -6.535615921020508, "global_step": 18485, "epoch": 110} {"train_loss": -6.6444091796875, "global_step": 18486, "epoch": 110} {"train_loss": -6.597757339477539, "global_step": 18487, "epoch": 110} {"train_loss": -6.616263389587402, "global_step": 18488, "epoch": 110} {"train_loss": -6.637093544006348, "global_step": 18489, "epoch": 110} {"train_loss": -6.793868064880371, "global_step": 18490, "epoch": 110} {"train_loss": -6.622353553771973, "global_step": 18491, "epoch": 110} {"train_loss": -6.675070762634277, "global_step": 18492, "epoch": 110} {"train_loss": -6.700475215911865, "global_step": 18493, "epoch": 110} {"train_loss": -6.650620460510254, "global_step": 18494, "epoch": 110} {"train_loss": -6.457511901855469, "global_step": 18495, "epoch": 110} {"train_loss": -6.486761569976807, "global_step": 18496, "epoch": 110} {"train_loss": -6.6305952072143555, "global_step": 18497, "epoch": 110} {"train_loss": -6.611843109130859, "global_step": 18498, "epoch": 110} {"train_loss": -6.536666393280029, "global_step": 18499, "epoch": 110} {"train_loss": -6.537303924560547, "global_step": 18500, "epoch": 110} {"train_loss": -6.652203559875488, "global_step": 18501, "epoch": 110} {"train_loss": -6.665460586547852, "global_step": 18502, "epoch": 110} {"train_loss": -6.708311080932617, "global_step": 18503, "epoch": 110} {"train_loss": -6.704811096191406, "global_step": 18504, "epoch": 110} {"train_loss": -6.79848575592041, "global_step": 18505, "epoch": 110} {"train_loss": -6.697205066680908, "global_step": 18506, "epoch": 110} {"train_loss": -6.58749532699585, "global_step": 18507, "epoch": 110} {"train_loss": -6.778132438659668, "global_step": 18508, "epoch": 110} {"train_loss": -6.680859565734863, "global_step": 18509, "epoch": 110} {"train_loss": -6.629547595977783, "global_step": 18510, "epoch": 110} {"train_loss": -6.544089317321777, "global_step": 18511, "epoch": 110} {"train_loss": -6.839269638061523, "global_step": 18512, "epoch": 110} {"train_loss": -6.614668846130371, "global_step": 18513, "epoch": 110} {"train_loss": -6.640829563140869, "global_step": 18514, "epoch": 110} {"train_loss": -6.936638355255127, "global_step": 18515, "epoch": 110} {"train_loss": -6.632617473602295, "global_step": 18516, "epoch": 110} {"train_loss": -6.633069038391113, "global_step": 18517, "epoch": 110} {"train_loss": -6.644049644470215, "global_step": 18518, "epoch": 110} {"train_loss": -6.610709190368652, "global_step": 18519, "epoch": 110} {"train_loss": -6.529206275939941, "global_step": 18520, "epoch": 110} {"train_loss": -6.815098762512207, "global_step": 18521, "epoch": 110} {"train_loss": -6.810237884521484, "global_step": 18522, "epoch": 110} {"train_loss": -6.652311325073242, "global_step": 18523, "epoch": 110} {"train_loss": -7.017848014831543, "global_step": 18524, "epoch": 110} {"train_loss": -6.8250885009765625, "global_step": 18525, "epoch": 110} {"train_loss": -6.767089366912842, "global_step": 18526, "epoch": 110} {"train_loss": -6.679542064666748, "global_step": 18527, "epoch": 110} {"train_loss": -6.8633952140808105, "global_step": 18528, "epoch": 110} {"train_loss": -6.920845985412598, "global_step": 18529, "epoch": 110} {"train_loss": -6.715463638305664, "global_step": 18530, "epoch": 110} {"train_loss": -6.721892356872559, "global_step": 18531, "epoch": 110} {"train_loss": -6.640532970428467, "global_step": 18532, "epoch": 110} {"train_loss": -6.836068153381348, "global_step": 18533, "epoch": 110} {"train_loss": -6.81569766998291, "global_step": 18534, "epoch": 110} {"train_loss": -6.700374126434326, "global_step": 18535, "epoch": 110} {"train_loss": -6.898177623748779, "global_step": 18536, "epoch": 110} {"train_loss": -6.87563419342041, "global_step": 18537, "epoch": 110} {"train_loss": -6.647914886474609, "global_step": 18538, "epoch": 110} {"train_loss": -6.791792869567871, "global_step": 18539, "epoch": 110} {"train_loss": -6.975213050842285, "global_step": 18540, "epoch": 110} {"train_loss": -6.868387222290039, "global_step": 18541, "epoch": 110} {"train_loss": -6.791396141052246, "global_step": 18542, "epoch": 110} {"train_loss": -6.88999605178833, "global_step": 18543, "epoch": 110} {"train_loss": -6.770634174346924, "global_step": 18544, "epoch": 110} {"train_loss": -6.803701400756836, "global_step": 18545, "epoch": 110} {"train_loss": -6.719246864318848, "global_step": 18546, "epoch": 110} {"train_loss": -6.761981010437012, "global_step": 18547, "epoch": 110} {"train_loss": -6.604691505432129, "global_step": 18548, "epoch": 110} {"train_loss": -6.645909786224365, "global_step": 18549, "epoch": 110} {"train_loss": -6.730749130249023, "global_step": 18550, "epoch": 110} {"train_loss": -6.96929931640625, "global_step": 18551, "epoch": 110} {"train_loss": -6.89962100982666, "global_step": 18552, "epoch": 110} {"train_loss": -6.854673385620117, "global_step": 18553, "epoch": 110} {"train_loss": -6.861084938049316, "global_step": 18554, "epoch": 110} {"train_loss": -6.834372520446777, "global_step": 18555, "epoch": 110} {"train_loss": -6.970102310180664, "global_step": 18556, "epoch": 110} {"train_loss": -6.618745803833008, "global_step": 18557, "epoch": 110} {"train_loss": -6.782301425933838, "global_step": 18558, "epoch": 110} {"train_loss": -6.708670616149902, "global_step": 18559, "epoch": 110} {"train_loss": -6.682832717895508, "global_step": 18560, "epoch": 110} {"train_loss": -6.918040752410889, "global_step": 18561, "epoch": 110} {"train_loss": -6.660582542419434, "global_step": 18562, "epoch": 110} {"train_loss": -6.815211296081543, "global_step": 18563, "epoch": 110} {"train_loss": -6.297781944274902, "global_step": 18564, "epoch": 110} {"train_loss": -6.832360744476318, "global_step": 18565, "epoch": 110} {"train_loss": -6.791005611419678, "global_step": 18566, "epoch": 110} {"train_loss": -6.55808162689209, "global_step": 18567, "epoch": 110} {"train_loss": -6.592653274536133, "global_step": 18568, "epoch": 110} {"train_loss": -6.882856845855713, "global_step": 18569, "epoch": 110} {"train_loss": -6.4021406173706055, "global_step": 18570, "epoch": 110} {"train_loss": -6.569448947906494, "global_step": 18571, "epoch": 110} {"train_loss": -6.579279899597168, "global_step": 18572, "epoch": 110} {"train_loss": -6.730082035064697, "global_step": 18573, "epoch": 110} {"train_loss": -6.506148338317871, "global_step": 18574, "epoch": 110} {"train_loss": -6.636599063873291, "global_step": 18575, "epoch": 110} {"train_loss": -6.644099235534668, "global_step": 18576, "epoch": 110} {"train_loss": -6.367232322692871, "global_step": 18577, "epoch": 110} {"train_loss": -6.578928470611572, "global_step": 18578, "epoch": 110} {"train_loss": -6.29496955871582, "global_step": 18579, "epoch": 110} {"train_loss": -6.674014091491699, "global_step": 18580, "epoch": 110} {"train_loss": -6.624139308929443, "global_step": 18581, "epoch": 110} {"train_loss": -6.6538405418396, "global_step": 18582, "epoch": 110} {"train_loss": -6.519308090209961, "global_step": 18583, "epoch": 110} {"train_loss": -6.711481094360352, "global_step": 18584, "epoch": 110} {"train_loss": -6.694850921630859, "global_step": 18585, "epoch": 110} {"train_loss": -6.537734508514404, "global_step": 18586, "epoch": 110} {"train_loss": -6.6578049659729, "global_step": 18587, "epoch": 110} {"train_loss": -6.641758918762207, "global_step": 18588, "epoch": 110} {"train_loss": -6.514307975769043, "global_step": 18589, "epoch": 110} {"train_loss": -6.551739692687988, "global_step": 18590, "epoch": 110} {"train_loss": -6.583907604217529, "global_step": 18591, "epoch": 110} {"train_loss": -6.639952182769775, "global_step": 18592, "epoch": 110} {"train_loss": -6.485751152038574, "global_step": 18593, "epoch": 110} {"train_loss": -6.642167568206787, "global_step": 18594, "epoch": 110} {"train_loss": -6.783571243286133, "global_step": 18595, "epoch": 110} {"train_loss": -6.472614765167236, "global_step": 18596, "epoch": 110} {"train_loss": -6.706694602966309, "global_step": 18597, "epoch": 110} {"train_loss": -6.480930328369141, "global_step": 18598, "epoch": 110} {"train_loss": -6.420814514160156, "global_step": 18599, "epoch": 110} {"train_loss": -6.623987197875977, "global_step": 18600, "epoch": 110} {"train_loss": -6.566717147827148, "global_step": 18601, "epoch": 110} {"train_loss": -6.625615119934082, "global_step": 18602, "epoch": 110} {"train_loss": -6.582201957702637, "global_step": 18603, "epoch": 110} {"train_loss": -6.52254581451416, "global_step": 18604, "epoch": 110} {"train_loss": -6.509578704833984, "global_step": 18605, "epoch": 110} {"train_loss": -6.595986843109131, "global_step": 18606, "epoch": 110} {"train_loss": -6.68891716003418, "global_step": 18607, "epoch": 110} {"train_loss": -6.29601526260376, "global_step": 18608, "epoch": 110} {"train_loss": -6.311380386352539, "global_step": 18609, "epoch": 110} {"train_loss": -6.617321968078613, "global_step": 18610, "epoch": 110} {"train_loss": -6.676449775695801, "global_step": 18611, "epoch": 110} {"train_loss": -6.356775283813477, "global_step": 18612, "epoch": 110} {"train_loss": -6.507713317871094, "global_step": 18613, "epoch": 110} {"train_loss": -6.626075267791748, "global_step": 18614, "epoch": 110} {"train_loss": -6.402214050292969, "global_step": 18615, "epoch": 110} {"train_loss": -6.6092681884765625, "global_step": 18616, "epoch": 110} {"train_loss": -6.474055290222168, "global_step": 18617, "epoch": 110} {"train_loss": -6.463499069213867, "global_step": 18618, "epoch": 110} {"train_loss": -6.098799705505371, "global_step": 18619, "epoch": 110} {"train_loss": -6.291460037231445, "global_step": 18620, "epoch": 110} {"train_loss": -6.519678115844727, "global_step": 18621, "epoch": 110} {"train_loss": -6.544081211090088, "global_step": 18622, "epoch": 110} {"train_loss": -6.624551773071289, "global_step": 18623, "epoch": 110} {"train_loss": -6.513401985168457, "global_step": 18624, "epoch": 110} {"train_loss": -6.5353899002075195, "global_step": 18625, "epoch": 110} {"train_loss": -6.6922149658203125, "global_step": 18626, "epoch": 110} {"train_loss": -6.468021869659424, "global_step": 18627, "epoch": 110} {"train_loss": -6.62878942489624, "global_step": 18628, "epoch": 110} {"train_loss": -6.525639057159424, "global_step": 18629, "epoch": 110} {"train_loss": -6.687239646911621, "global_step": 18630, "epoch": 110} {"train_loss": -6.710770606994629, "global_step": 18631, "epoch": 110} {"train_loss": -6.605012893676758, "global_step": 18632, "epoch": 110} {"train_loss": -6.808177947998047, "global_step": 18633, "epoch": 110} {"train_loss": -6.538496017456055, "global_step": 18634, "epoch": 110} {"train_loss": -6.644138336181641, "global_step": 18635, "epoch": 110} {"train_loss": -6.66942024230957, "global_step": 18636, "epoch": 110} {"train_loss": -6.724644660949707, "global_step": 18637, "epoch": 110} {"train_loss": -6.6868815422058105, "global_step": 18638, "epoch": 110} {"train_loss": -6.62320613861084, "global_step": 18639, "epoch": 110} {"train_loss": -6.625744819641113, "global_step": 18640, "epoch": 110} {"train_loss": -6.72586727142334, "global_step": 18641, "epoch": 110} {"train_loss": -6.78668737411499, "global_step": 18642, "epoch": 110} {"train_loss": -6.668673515319824, "global_step": 18643, "epoch": 110} {"train_loss": -6.4574689865112305, "global_step": 18644, "epoch": 110} {"train_loss": -6.609050750732422, "global_step": 18645, "epoch": 110} {"train_loss": -6.4155426025390625, "global_step": 18646, "epoch": 110} {"train_loss": -6.65222309033076, "global_step": 18647, "epoch": 110, "val_loss": 228123.015625, "train_action_mse_error": 25.18844985961914} {"train_loss": -6.694845676422119, "global_step": 18648, "epoch": 111} {"train_loss": -6.783902645111084, "global_step": 18649, "epoch": 111} {"train_loss": -6.637740135192871, "global_step": 18650, "epoch": 111} {"train_loss": -6.461261749267578, "global_step": 18651, "epoch": 111} {"train_loss": -6.744998931884766, "global_step": 18652, "epoch": 111} {"train_loss": -6.570896625518799, "global_step": 18653, "epoch": 111} {"train_loss": -6.585868835449219, "global_step": 18654, "epoch": 111} {"train_loss": -6.762993812561035, "global_step": 18655, "epoch": 111} {"train_loss": -6.6846160888671875, "global_step": 18656, "epoch": 111} {"train_loss": -6.659663200378418, "global_step": 18657, "epoch": 111} {"train_loss": -6.380558967590332, "global_step": 18658, "epoch": 111} {"train_loss": -6.494718551635742, "global_step": 18659, "epoch": 111} {"train_loss": -6.411982536315918, "global_step": 18660, "epoch": 111} {"train_loss": -6.820294380187988, "global_step": 18661, "epoch": 111} {"train_loss": -6.725852012634277, "global_step": 18662, "epoch": 111} {"train_loss": -6.720846176147461, "global_step": 18663, "epoch": 111} {"train_loss": -6.362942695617676, "global_step": 18664, "epoch": 111} {"train_loss": -6.68424654006958, "global_step": 18665, "epoch": 111} {"train_loss": -6.742376327514648, "global_step": 18666, "epoch": 111} {"train_loss": -6.709599494934082, "global_step": 18667, "epoch": 111} {"train_loss": -6.56545352935791, "global_step": 18668, "epoch": 111} {"train_loss": -6.776945114135742, "global_step": 18669, "epoch": 111} {"train_loss": -6.560403823852539, "global_step": 18670, "epoch": 111} {"train_loss": -6.432974338531494, "global_step": 18671, "epoch": 111} {"train_loss": -6.733513832092285, "global_step": 18672, "epoch": 111} {"train_loss": -6.607254505157471, "global_step": 18673, "epoch": 111} {"train_loss": -6.763676643371582, "global_step": 18674, "epoch": 111} {"train_loss": -6.412475109100342, "global_step": 18675, "epoch": 111} {"train_loss": -6.541341781616211, "global_step": 18676, "epoch": 111} {"train_loss": -6.751784801483154, "global_step": 18677, "epoch": 111} {"train_loss": -6.639651775360107, "global_step": 18678, "epoch": 111} {"train_loss": -6.487970352172852, "global_step": 18679, "epoch": 111} {"train_loss": -6.703927040100098, "global_step": 18680, "epoch": 111} {"train_loss": -6.588029384613037, "global_step": 18681, "epoch": 111} {"train_loss": -6.673300743103027, "global_step": 18682, "epoch": 111} {"train_loss": -6.666807174682617, "global_step": 18683, "epoch": 111} {"train_loss": -6.631359100341797, "global_step": 18684, "epoch": 111} {"train_loss": -6.753734111785889, "global_step": 18685, "epoch": 111} {"train_loss": -6.558440208435059, "global_step": 18686, "epoch": 111} {"train_loss": -6.511005401611328, "global_step": 18687, "epoch": 111} {"train_loss": -6.530416488647461, "global_step": 18688, "epoch": 111} {"train_loss": -6.68863582611084, "global_step": 18689, "epoch": 111} {"train_loss": -6.724113941192627, "global_step": 18690, "epoch": 111} {"train_loss": -6.8009033203125, "global_step": 18691, "epoch": 111} {"train_loss": -6.5296735763549805, "global_step": 18692, "epoch": 111} {"train_loss": -6.808941841125488, "global_step": 18693, "epoch": 111} {"train_loss": -6.686374187469482, "global_step": 18694, "epoch": 111} {"train_loss": -6.750633716583252, "global_step": 18695, "epoch": 111} {"train_loss": -6.887435436248779, "global_step": 18696, "epoch": 111} {"train_loss": -6.631305694580078, "global_step": 18697, "epoch": 111} {"train_loss": -6.5812273025512695, "global_step": 18698, "epoch": 111} {"train_loss": -6.5593647956848145, "global_step": 18699, "epoch": 111} {"train_loss": -6.7784600257873535, "global_step": 18700, "epoch": 111} {"train_loss": -6.719653129577637, "global_step": 18701, "epoch": 111} {"train_loss": -6.754398345947266, "global_step": 18702, "epoch": 111} {"train_loss": -6.75403356552124, "global_step": 18703, "epoch": 111} {"train_loss": -6.744327545166016, "global_step": 18704, "epoch": 111} {"train_loss": -6.487383842468262, "global_step": 18705, "epoch": 111} {"train_loss": -6.7824554443359375, "global_step": 18706, "epoch": 111} {"train_loss": -6.607603073120117, "global_step": 18707, "epoch": 111} {"train_loss": -6.508282661437988, "global_step": 18708, "epoch": 111} {"train_loss": -6.767478942871094, "global_step": 18709, "epoch": 111} {"train_loss": -6.920060157775879, "global_step": 18710, "epoch": 111} {"train_loss": -6.621501922607422, "global_step": 18711, "epoch": 111} {"train_loss": -6.5981950759887695, "global_step": 18712, "epoch": 111} {"train_loss": -6.868008613586426, "global_step": 18713, "epoch": 111} {"train_loss": -6.387362003326416, "global_step": 18714, "epoch": 111} {"train_loss": -6.886059761047363, "global_step": 18715, "epoch": 111} {"train_loss": -6.6736907958984375, "global_step": 18716, "epoch": 111} {"train_loss": -6.938230037689209, "global_step": 18717, "epoch": 111} {"train_loss": -6.679780960083008, "global_step": 18718, "epoch": 111} {"train_loss": -6.7470173835754395, "global_step": 18719, "epoch": 111} {"train_loss": -7.036323547363281, "global_step": 18720, "epoch": 111} {"train_loss": -6.878215789794922, "global_step": 18721, "epoch": 111} {"train_loss": -6.557790756225586, "global_step": 18722, "epoch": 111} {"train_loss": -6.754281044006348, "global_step": 18723, "epoch": 111} {"train_loss": -6.687530994415283, "global_step": 18724, "epoch": 111} {"train_loss": -7.052750587463379, "global_step": 18725, "epoch": 111} {"train_loss": -6.796354293823242, "global_step": 18726, "epoch": 111} {"train_loss": -6.61480712890625, "global_step": 18727, "epoch": 111} {"train_loss": -6.941123008728027, "global_step": 18728, "epoch": 111} {"train_loss": -6.623130798339844, "global_step": 18729, "epoch": 111} {"train_loss": -6.5757951736450195, "global_step": 18730, "epoch": 111} {"train_loss": -6.765473365783691, "global_step": 18731, "epoch": 111} {"train_loss": -6.904109954833984, "global_step": 18732, "epoch": 111} {"train_loss": -6.778519630432129, "global_step": 18733, "epoch": 111} {"train_loss": -6.549372673034668, "global_step": 18734, "epoch": 111} {"train_loss": -6.7212700843811035, "global_step": 18735, "epoch": 111} {"train_loss": -6.748955726623535, "global_step": 18736, "epoch": 111} {"train_loss": -6.824265956878662, "global_step": 18737, "epoch": 111} {"train_loss": -6.499568939208984, "global_step": 18738, "epoch": 111} {"train_loss": -6.754877090454102, "global_step": 18739, "epoch": 111} {"train_loss": -6.639616966247559, "global_step": 18740, "epoch": 111} {"train_loss": -6.640438556671143, "global_step": 18741, "epoch": 111} {"train_loss": -6.7336344718933105, "global_step": 18742, "epoch": 111} {"train_loss": -6.862576484680176, "global_step": 18743, "epoch": 111} {"train_loss": -6.773068904876709, "global_step": 18744, "epoch": 111} {"train_loss": -6.645910263061523, "global_step": 18745, "epoch": 111} {"train_loss": -6.711843490600586, "global_step": 18746, "epoch": 111} {"train_loss": -6.828839302062988, "global_step": 18747, "epoch": 111} {"train_loss": -6.651142120361328, "global_step": 18748, "epoch": 111} {"train_loss": -6.761214733123779, "global_step": 18749, "epoch": 111} {"train_loss": -6.645847320556641, "global_step": 18750, "epoch": 111} {"train_loss": -6.520829200744629, "global_step": 18751, "epoch": 111} {"train_loss": -6.783048152923584, "global_step": 18752, "epoch": 111} {"train_loss": -6.713868141174316, "global_step": 18753, "epoch": 111} {"train_loss": -6.677288055419922, "global_step": 18754, "epoch": 111} {"train_loss": -6.503028869628906, "global_step": 18755, "epoch": 111} {"train_loss": -6.642702102661133, "global_step": 18756, "epoch": 111} {"train_loss": -6.585644721984863, "global_step": 18757, "epoch": 111} {"train_loss": -6.420769214630127, "global_step": 18758, "epoch": 111} {"train_loss": -6.448738098144531, "global_step": 18759, "epoch": 111} {"train_loss": -6.519326210021973, "global_step": 18760, "epoch": 111} {"train_loss": -6.329201698303223, "global_step": 18761, "epoch": 111} {"train_loss": -6.8111090660095215, "global_step": 18762, "epoch": 111} {"train_loss": -6.536121368408203, "global_step": 18763, "epoch": 111} {"train_loss": -6.524294853210449, "global_step": 18764, "epoch": 111} {"train_loss": -6.6825337409973145, "global_step": 18765, "epoch": 111} {"train_loss": -6.568063735961914, "global_step": 18766, "epoch": 111} {"train_loss": -6.4055023193359375, "global_step": 18767, "epoch": 111} {"train_loss": -6.806422233581543, "global_step": 18768, "epoch": 111} {"train_loss": -6.848196983337402, "global_step": 18769, "epoch": 111} {"train_loss": -6.864006042480469, "global_step": 18770, "epoch": 111} {"train_loss": -6.629594802856445, "global_step": 18771, "epoch": 111} {"train_loss": -6.690501689910889, "global_step": 18772, "epoch": 111} {"train_loss": -6.90470552444458, "global_step": 18773, "epoch": 111} {"train_loss": -6.776734828948975, "global_step": 18774, "epoch": 111} {"train_loss": -6.573861122131348, "global_step": 18775, "epoch": 111} {"train_loss": -6.574235916137695, "global_step": 18776, "epoch": 111} {"train_loss": -6.717022895812988, "global_step": 18777, "epoch": 111} {"train_loss": -6.492346286773682, "global_step": 18778, "epoch": 111} {"train_loss": -6.577589988708496, "global_step": 18779, "epoch": 111} {"train_loss": -6.737176418304443, "global_step": 18780, "epoch": 111} {"train_loss": -6.24707555770874, "global_step": 18781, "epoch": 111} {"train_loss": -6.606341361999512, "global_step": 18782, "epoch": 111} {"train_loss": -6.474177837371826, "global_step": 18783, "epoch": 111} {"train_loss": -6.752460479736328, "global_step": 18784, "epoch": 111} {"train_loss": -6.72956657409668, "global_step": 18785, "epoch": 111} {"train_loss": -6.699614524841309, "global_step": 18786, "epoch": 111} {"train_loss": -6.854089736938477, "global_step": 18787, "epoch": 111} {"train_loss": -6.675868988037109, "global_step": 18788, "epoch": 111} {"train_loss": -6.494770050048828, "global_step": 18789, "epoch": 111} {"train_loss": -6.663476467132568, "global_step": 18790, "epoch": 111} {"train_loss": -6.620441913604736, "global_step": 18791, "epoch": 111} {"train_loss": -6.709344387054443, "global_step": 18792, "epoch": 111} {"train_loss": -6.584163665771484, "global_step": 18793, "epoch": 111} {"train_loss": -6.7195000648498535, "global_step": 18794, "epoch": 111} {"train_loss": -6.581246852874756, "global_step": 18795, "epoch": 111} {"train_loss": -6.848838806152344, "global_step": 18796, "epoch": 111} {"train_loss": -6.735646724700928, "global_step": 18797, "epoch": 111} {"train_loss": -7.0178422927856445, "global_step": 18798, "epoch": 111} {"train_loss": -6.7931718826293945, "global_step": 18799, "epoch": 111} {"train_loss": -6.772026538848877, "global_step": 18800, "epoch": 111} {"train_loss": -6.750904560089111, "global_step": 18801, "epoch": 111} {"train_loss": -6.543249607086182, "global_step": 18802, "epoch": 111} {"train_loss": -6.803282737731934, "global_step": 18803, "epoch": 111} {"train_loss": -6.8709211349487305, "global_step": 18804, "epoch": 111} {"train_loss": -6.9352521896362305, "global_step": 18805, "epoch": 111} {"train_loss": -6.864065170288086, "global_step": 18806, "epoch": 111} {"train_loss": -6.904994964599609, "global_step": 18807, "epoch": 111} {"train_loss": -6.91925048828125, "global_step": 18808, "epoch": 111} {"train_loss": -6.818780899047852, "global_step": 18809, "epoch": 111} {"train_loss": -6.816481590270996, "global_step": 18810, "epoch": 111} {"train_loss": -6.84001350402832, "global_step": 18811, "epoch": 111} {"train_loss": -6.914310455322266, "global_step": 18812, "epoch": 111} {"train_loss": -6.874664306640625, "global_step": 18813, "epoch": 111} {"train_loss": -6.870964050292969, "global_step": 18814, "epoch": 111} {"train_loss": -6.684523795332227, "global_step": 18815, "epoch": 111, "val_loss": 222685.875} {"train_loss": -6.621391296386719, "global_step": 18816, "epoch": 112} {"train_loss": -6.7017974853515625, "global_step": 18817, "epoch": 112} {"train_loss": -6.544071197509766, "global_step": 18818, "epoch": 112} {"train_loss": -6.852428436279297, "global_step": 18819, "epoch": 112} {"train_loss": -6.650853157043457, "global_step": 18820, "epoch": 112} {"train_loss": -6.613097190856934, "global_step": 18821, "epoch": 112} {"train_loss": -7.041379928588867, "global_step": 18822, "epoch": 112} {"train_loss": -6.702461242675781, "global_step": 18823, "epoch": 112} {"train_loss": -6.795222759246826, "global_step": 18824, "epoch": 112} {"train_loss": -6.4213714599609375, "global_step": 18825, "epoch": 112} {"train_loss": -6.643898963928223, "global_step": 18826, "epoch": 112} {"train_loss": -6.482176780700684, "global_step": 18827, "epoch": 112} {"train_loss": -6.515839576721191, "global_step": 18828, "epoch": 112} {"train_loss": -6.3928985595703125, "global_step": 18829, "epoch": 112} {"train_loss": -6.689258575439453, "global_step": 18830, "epoch": 112} {"train_loss": -6.595774173736572, "global_step": 18831, "epoch": 112} {"train_loss": -6.762679100036621, "global_step": 18832, "epoch": 112} {"train_loss": -6.399646759033203, "global_step": 18833, "epoch": 112} {"train_loss": -6.446315765380859, "global_step": 18834, "epoch": 112} {"train_loss": -6.556739807128906, "global_step": 18835, "epoch": 112} {"train_loss": -6.377772808074951, "global_step": 18836, "epoch": 112} {"train_loss": -6.51405143737793, "global_step": 18837, "epoch": 112} {"train_loss": -6.696748733520508, "global_step": 18838, "epoch": 112} {"train_loss": -6.582764625549316, "global_step": 18839, "epoch": 112} {"train_loss": -6.838950157165527, "global_step": 18840, "epoch": 112} {"train_loss": -6.608396530151367, "global_step": 18841, "epoch": 112} {"train_loss": -6.545731067657471, "global_step": 18842, "epoch": 112} {"train_loss": -6.708617210388184, "global_step": 18843, "epoch": 112} {"train_loss": -6.374356746673584, "global_step": 18844, "epoch": 112} {"train_loss": -6.708357810974121, "global_step": 18845, "epoch": 112} {"train_loss": -6.578056812286377, "global_step": 18846, "epoch": 112} {"train_loss": -6.6655964851379395, "global_step": 18847, "epoch": 112} {"train_loss": -6.716938495635986, "global_step": 18848, "epoch": 112} {"train_loss": -6.760391712188721, "global_step": 18849, "epoch": 112} {"train_loss": -6.938528060913086, "global_step": 18850, "epoch": 112} {"train_loss": -6.837893486022949, "global_step": 18851, "epoch": 112} {"train_loss": -6.9372172355651855, "global_step": 18852, "epoch": 112} {"train_loss": -6.760339260101318, "global_step": 18853, "epoch": 112} {"train_loss": -6.6976776123046875, "global_step": 18854, "epoch": 112} {"train_loss": -7.02114725112915, "global_step": 18855, "epoch": 112} {"train_loss": -6.890317916870117, "global_step": 18856, "epoch": 112} {"train_loss": -6.862866401672363, "global_step": 18857, "epoch": 112} {"train_loss": -6.710590362548828, "global_step": 18858, "epoch": 112} {"train_loss": -6.835696697235107, "global_step": 18859, "epoch": 112} {"train_loss": -6.838911056518555, "global_step": 18860, "epoch": 112} {"train_loss": -6.618982315063477, "global_step": 18861, "epoch": 112} {"train_loss": -6.763184547424316, "global_step": 18862, "epoch": 112} {"train_loss": -6.712281227111816, "global_step": 18863, "epoch": 112} {"train_loss": -6.8966569900512695, "global_step": 18864, "epoch": 112} {"train_loss": -6.942206859588623, "global_step": 18865, "epoch": 112} {"train_loss": -6.9505767822265625, "global_step": 18866, "epoch": 112} {"train_loss": -6.774147987365723, "global_step": 18867, "epoch": 112} {"train_loss": -6.850612640380859, "global_step": 18868, "epoch": 112} {"train_loss": -6.8452959060668945, "global_step": 18869, "epoch": 112} {"train_loss": -6.873542785644531, "global_step": 18870, "epoch": 112} {"train_loss": -6.200740337371826, "global_step": 18871, "epoch": 112} {"train_loss": -6.649966239929199, "global_step": 18872, "epoch": 112} {"train_loss": -6.681971073150635, "global_step": 18873, "epoch": 112} {"train_loss": -6.801059722900391, "global_step": 18874, "epoch": 112} {"train_loss": -6.607809066772461, "global_step": 18875, "epoch": 112} {"train_loss": -6.941450119018555, "global_step": 18876, "epoch": 112} {"train_loss": -6.629119873046875, "global_step": 18877, "epoch": 112} {"train_loss": -6.68552827835083, "global_step": 18878, "epoch": 112} {"train_loss": -6.781519889831543, "global_step": 18879, "epoch": 112} {"train_loss": -6.822564125061035, "global_step": 18880, "epoch": 112} {"train_loss": -6.586271286010742, "global_step": 18881, "epoch": 112} {"train_loss": -6.709687232971191, "global_step": 18882, "epoch": 112} {"train_loss": -6.704736709594727, "global_step": 18883, "epoch": 112} {"train_loss": -6.709723472595215, "global_step": 18884, "epoch": 112} {"train_loss": -6.732253074645996, "global_step": 18885, "epoch": 112} {"train_loss": -6.974827766418457, "global_step": 18886, "epoch": 112} {"train_loss": -6.615224838256836, "global_step": 18887, "epoch": 112} {"train_loss": -6.807622909545898, "global_step": 18888, "epoch": 112} {"train_loss": -6.523632049560547, "global_step": 18889, "epoch": 112} {"train_loss": -6.8915629386901855, "global_step": 18890, "epoch": 112} {"train_loss": -6.435736656188965, "global_step": 18891, "epoch": 112} {"train_loss": -6.944203853607178, "global_step": 18892, "epoch": 112} {"train_loss": -6.823094367980957, "global_step": 18893, "epoch": 112} {"train_loss": -6.84207010269165, "global_step": 18894, "epoch": 112} {"train_loss": -6.711254596710205, "global_step": 18895, "epoch": 112} {"train_loss": -6.695713996887207, "global_step": 18896, "epoch": 112} {"train_loss": -6.783752918243408, "global_step": 18897, "epoch": 112} {"train_loss": -6.678223609924316, "global_step": 18898, "epoch": 112} {"train_loss": -7.123387336730957, "global_step": 18899, "epoch": 112} {"train_loss": -6.965504169464111, "global_step": 18900, "epoch": 112} {"train_loss": -6.741724014282227, "global_step": 18901, "epoch": 112} {"train_loss": -6.714580535888672, "global_step": 18902, "epoch": 112} {"train_loss": -6.652472496032715, "global_step": 18903, "epoch": 112} {"train_loss": -6.774218559265137, "global_step": 18904, "epoch": 112} {"train_loss": -6.792407035827637, "global_step": 18905, "epoch": 112} {"train_loss": -6.888696670532227, "global_step": 18906, "epoch": 112} {"train_loss": -6.838863849639893, "global_step": 18907, "epoch": 112} {"train_loss": -6.5832719802856445, "global_step": 18908, "epoch": 112} {"train_loss": -6.912454605102539, "global_step": 18909, "epoch": 112} {"train_loss": -6.832911491394043, "global_step": 18910, "epoch": 112} {"train_loss": -6.8207550048828125, "global_step": 18911, "epoch": 112} {"train_loss": -6.480255603790283, "global_step": 18912, "epoch": 112} {"train_loss": -6.724979877471924, "global_step": 18913, "epoch": 112} {"train_loss": -6.837924480438232, "global_step": 18914, "epoch": 112} {"train_loss": -6.821148872375488, "global_step": 18915, "epoch": 112} {"train_loss": -6.5649189949035645, "global_step": 18916, "epoch": 112} {"train_loss": -6.678476333618164, "global_step": 18917, "epoch": 112} {"train_loss": -6.840325355529785, "global_step": 18918, "epoch": 112} {"train_loss": -7.024501800537109, "global_step": 18919, "epoch": 112} {"train_loss": -6.743776321411133, "global_step": 18920, "epoch": 112} {"train_loss": -6.846976280212402, "global_step": 18921, "epoch": 112} {"train_loss": -7.132167816162109, "global_step": 18922, "epoch": 112} {"train_loss": -6.663012504577637, "global_step": 18923, "epoch": 112} {"train_loss": -6.941444396972656, "global_step": 18924, "epoch": 112} {"train_loss": -6.733997344970703, "global_step": 18925, "epoch": 112} {"train_loss": -6.775880813598633, "global_step": 18926, "epoch": 112} {"train_loss": -6.720067977905273, "global_step": 18927, "epoch": 112} {"train_loss": -6.833123683929443, "global_step": 18928, "epoch": 112} {"train_loss": -6.760376453399658, "global_step": 18929, "epoch": 112} {"train_loss": -6.8371663093566895, "global_step": 18930, "epoch": 112} {"train_loss": -6.579351425170898, "global_step": 18931, "epoch": 112} {"train_loss": -6.700254440307617, "global_step": 18932, "epoch": 112} {"train_loss": -6.680438995361328, "global_step": 18933, "epoch": 112} {"train_loss": -6.701798915863037, "global_step": 18934, "epoch": 112} {"train_loss": -6.68303108215332, "global_step": 18935, "epoch": 112} {"train_loss": -6.4977707862854, "global_step": 18936, "epoch": 112} {"train_loss": -6.800153732299805, "global_step": 18937, "epoch": 112} {"train_loss": -6.566263198852539, "global_step": 18938, "epoch": 112} {"train_loss": -6.901638507843018, "global_step": 18939, "epoch": 112} {"train_loss": -6.6343159675598145, "global_step": 18940, "epoch": 112} {"train_loss": -6.5386552810668945, "global_step": 18941, "epoch": 112} {"train_loss": -6.975459098815918, "global_step": 18942, "epoch": 112} {"train_loss": -6.9953765869140625, "global_step": 18943, "epoch": 112} {"train_loss": -6.725933074951172, "global_step": 18944, "epoch": 112} {"train_loss": -6.885626792907715, "global_step": 18945, "epoch": 112} {"train_loss": -6.877479553222656, "global_step": 18946, "epoch": 112} {"train_loss": -6.903860092163086, "global_step": 18947, "epoch": 112} {"train_loss": -6.910643577575684, "global_step": 18948, "epoch": 112} {"train_loss": -6.805348873138428, "global_step": 18949, "epoch": 112} {"train_loss": -6.833916664123535, "global_step": 18950, "epoch": 112} {"train_loss": -6.706252574920654, "global_step": 18951, "epoch": 112} {"train_loss": -6.816659927368164, "global_step": 18952, "epoch": 112} {"train_loss": -6.81126070022583, "global_step": 18953, "epoch": 112} {"train_loss": -6.582198143005371, "global_step": 18954, "epoch": 112} {"train_loss": -6.3508782386779785, "global_step": 18955, "epoch": 112} {"train_loss": -6.605352401733398, "global_step": 18956, "epoch": 112} {"train_loss": -6.544781684875488, "global_step": 18957, "epoch": 112} {"train_loss": -6.452874660491943, "global_step": 18958, "epoch": 112} {"train_loss": -6.495983123779297, "global_step": 18959, "epoch": 112} {"train_loss": -6.560665607452393, "global_step": 18960, "epoch": 112} {"train_loss": -6.778146266937256, "global_step": 18961, "epoch": 112} {"train_loss": -6.874354362487793, "global_step": 18962, "epoch": 112} {"train_loss": -6.663850784301758, "global_step": 18963, "epoch": 112} {"train_loss": -7.022670269012451, "global_step": 18964, "epoch": 112} {"train_loss": -6.623125076293945, "global_step": 18965, "epoch": 112} {"train_loss": -6.722683906555176, "global_step": 18966, "epoch": 112} {"train_loss": -6.471865177154541, "global_step": 18967, "epoch": 112} {"train_loss": -6.4154253005981445, "global_step": 18968, "epoch": 112} {"train_loss": -6.705582618713379, "global_step": 18969, "epoch": 112} {"train_loss": -6.541007041931152, "global_step": 18970, "epoch": 112} {"train_loss": -6.555149078369141, "global_step": 18971, "epoch": 112} {"train_loss": -6.572934150695801, "global_step": 18972, "epoch": 112} {"train_loss": -6.906172752380371, "global_step": 18973, "epoch": 112} {"train_loss": -6.542510986328125, "global_step": 18974, "epoch": 112} {"train_loss": -6.518101215362549, "global_step": 18975, "epoch": 112} {"train_loss": -6.600627422332764, "global_step": 18976, "epoch": 112} {"train_loss": -6.722338676452637, "global_step": 18977, "epoch": 112} {"train_loss": -6.661064147949219, "global_step": 18978, "epoch": 112} {"train_loss": -6.651415824890137, "global_step": 18979, "epoch": 112} {"train_loss": -6.7287797927856445, "global_step": 18980, "epoch": 112} {"train_loss": -7.02902889251709, "global_step": 18981, "epoch": 112} {"train_loss": -6.776336193084717, "global_step": 18982, "epoch": 112} {"train_loss": -6.721950011593955, "global_step": 18983, "epoch": 112, "val_loss": 220863.9375} {"train_loss": -6.893180847167969, "global_step": 18984, "epoch": 113} {"train_loss": -6.48477840423584, "global_step": 18985, "epoch": 113} {"train_loss": -6.710254192352295, "global_step": 18986, "epoch": 113} {"train_loss": -6.919095993041992, "global_step": 18987, "epoch": 113} {"train_loss": -6.729504108428955, "global_step": 18988, "epoch": 113} {"train_loss": -6.651508331298828, "global_step": 18989, "epoch": 113} {"train_loss": -6.730095863342285, "global_step": 18990, "epoch": 113} {"train_loss": -6.4902496337890625, "global_step": 18991, "epoch": 113} {"train_loss": -6.535686492919922, "global_step": 18992, "epoch": 113} {"train_loss": -6.432564735412598, "global_step": 18993, "epoch": 113} {"train_loss": -6.522318363189697, "global_step": 18994, "epoch": 113} {"train_loss": -6.540101051330566, "global_step": 18995, "epoch": 113} {"train_loss": -6.816704750061035, "global_step": 18996, "epoch": 113} {"train_loss": -6.691951751708984, "global_step": 18997, "epoch": 113} {"train_loss": -6.739864349365234, "global_step": 18998, "epoch": 113} {"train_loss": -6.784381866455078, "global_step": 18999, "epoch": 113} {"train_loss": -6.884425163269043, "global_step": 19000, "epoch": 113} {"train_loss": -6.751466751098633, "global_step": 19001, "epoch": 113} {"train_loss": -6.888911247253418, "global_step": 19002, "epoch": 113} {"train_loss": -6.531416416168213, "global_step": 19003, "epoch": 113} {"train_loss": -6.844215393066406, "global_step": 19004, "epoch": 113} {"train_loss": -6.656038284301758, "global_step": 19005, "epoch": 113} {"train_loss": -6.8991498947143555, "global_step": 19006, "epoch": 113} {"train_loss": -6.546464920043945, "global_step": 19007, "epoch": 113} {"train_loss": -6.908073902130127, "global_step": 19008, "epoch": 113} {"train_loss": -6.329215049743652, "global_step": 19009, "epoch": 113} {"train_loss": -6.779888153076172, "global_step": 19010, "epoch": 113} {"train_loss": -6.534060955047607, "global_step": 19011, "epoch": 113} {"train_loss": -6.528487205505371, "global_step": 19012, "epoch": 113} {"train_loss": -6.4277496337890625, "global_step": 19013, "epoch": 113} {"train_loss": -6.3524370193481445, "global_step": 19014, "epoch": 113} {"train_loss": -6.46087646484375, "global_step": 19015, "epoch": 113} {"train_loss": -6.3650712966918945, "global_step": 19016, "epoch": 113} {"train_loss": -6.604582786560059, "global_step": 19017, "epoch": 113} {"train_loss": -6.088386535644531, "global_step": 19018, "epoch": 113} {"train_loss": -6.324120998382568, "global_step": 19019, "epoch": 113} {"train_loss": -6.397072792053223, "global_step": 19020, "epoch": 113} {"train_loss": -6.220830917358398, "global_step": 19021, "epoch": 113} {"train_loss": -6.264762878417969, "global_step": 19022, "epoch": 113} {"train_loss": -6.634815216064453, "global_step": 19023, "epoch": 113} {"train_loss": -6.616384983062744, "global_step": 19024, "epoch": 113} {"train_loss": -6.594277858734131, "global_step": 19025, "epoch": 113} {"train_loss": -6.529071807861328, "global_step": 19026, "epoch": 113} {"train_loss": -6.480331897735596, "global_step": 19027, "epoch": 113} {"train_loss": -6.583019733428955, "global_step": 19028, "epoch": 113} {"train_loss": -6.60452938079834, "global_step": 19029, "epoch": 113} {"train_loss": -6.704888343811035, "global_step": 19030, "epoch": 113} {"train_loss": -6.540639877319336, "global_step": 19031, "epoch": 113} {"train_loss": -6.492537498474121, "global_step": 19032, "epoch": 113} {"train_loss": -6.90969181060791, "global_step": 19033, "epoch": 113} {"train_loss": -6.710020542144775, "global_step": 19034, "epoch": 113} {"train_loss": -6.78627872467041, "global_step": 19035, "epoch": 113} {"train_loss": -6.866767406463623, "global_step": 19036, "epoch": 113} {"train_loss": -6.645174980163574, "global_step": 19037, "epoch": 113} {"train_loss": -6.888799667358398, "global_step": 19038, "epoch": 113} {"train_loss": -6.709573268890381, "global_step": 19039, "epoch": 113} {"train_loss": -6.775286674499512, "global_step": 19040, "epoch": 113} {"train_loss": -6.718272686004639, "global_step": 19041, "epoch": 113} {"train_loss": -6.745231628417969, "global_step": 19042, "epoch": 113} {"train_loss": -6.7753705978393555, "global_step": 19043, "epoch": 113} {"train_loss": -6.763256072998047, "global_step": 19044, "epoch": 113} {"train_loss": -6.779444217681885, "global_step": 19045, "epoch": 113} {"train_loss": -6.971444129943848, "global_step": 19046, "epoch": 113} {"train_loss": -6.980621337890625, "global_step": 19047, "epoch": 113} {"train_loss": -6.629572868347168, "global_step": 19048, "epoch": 113} {"train_loss": -6.923032760620117, "global_step": 19049, "epoch": 113} {"train_loss": -6.811095714569092, "global_step": 19050, "epoch": 113} {"train_loss": -6.760169506072998, "global_step": 19051, "epoch": 113} {"train_loss": -6.8727264404296875, "global_step": 19052, "epoch": 113} {"train_loss": -6.715653896331787, "global_step": 19053, "epoch": 113} {"train_loss": -6.881233215332031, "global_step": 19054, "epoch": 113} {"train_loss": -6.706853866577148, "global_step": 19055, "epoch": 113} {"train_loss": -6.766380786895752, "global_step": 19056, "epoch": 113} {"train_loss": -6.737063407897949, "global_step": 19057, "epoch": 113} {"train_loss": -6.670565605163574, "global_step": 19058, "epoch": 113} {"train_loss": -6.764208793640137, "global_step": 19059, "epoch": 113} {"train_loss": -6.66248893737793, "global_step": 19060, "epoch": 113} {"train_loss": -6.945223331451416, "global_step": 19061, "epoch": 113} {"train_loss": -6.199079513549805, "global_step": 19062, "epoch": 113} {"train_loss": -6.937660217285156, "global_step": 19063, "epoch": 113} {"train_loss": -6.442543983459473, "global_step": 19064, "epoch": 113} {"train_loss": -6.574110984802246, "global_step": 19065, "epoch": 113} {"train_loss": -6.4442315101623535, "global_step": 19066, "epoch": 113} {"train_loss": -6.400394439697266, "global_step": 19067, "epoch": 113} {"train_loss": -6.668280124664307, "global_step": 19068, "epoch": 113} {"train_loss": -6.543305397033691, "global_step": 19069, "epoch": 113} {"train_loss": -6.469363689422607, "global_step": 19070, "epoch": 113} {"train_loss": -6.435088157653809, "global_step": 19071, "epoch": 113} {"train_loss": -6.381129264831543, "global_step": 19072, "epoch": 113} {"train_loss": -6.272470474243164, "global_step": 19073, "epoch": 113} {"train_loss": -6.460758209228516, "global_step": 19074, "epoch": 113} {"train_loss": -6.741466045379639, "global_step": 19075, "epoch": 113} {"train_loss": -6.83554744720459, "global_step": 19076, "epoch": 113} {"train_loss": -6.640295505523682, "global_step": 19077, "epoch": 113} {"train_loss": -6.669680595397949, "global_step": 19078, "epoch": 113} {"train_loss": -6.590482234954834, "global_step": 19079, "epoch": 113} {"train_loss": -6.530229568481445, "global_step": 19080, "epoch": 113} {"train_loss": -6.888308525085449, "global_step": 19081, "epoch": 113} {"train_loss": -6.602168560028076, "global_step": 19082, "epoch": 113} {"train_loss": -7.038246154785156, "global_step": 19083, "epoch": 113} {"train_loss": -6.625555038452148, "global_step": 19084, "epoch": 113} {"train_loss": -6.526390075683594, "global_step": 19085, "epoch": 113} {"train_loss": -6.691880702972412, "global_step": 19086, "epoch": 113} {"train_loss": -6.7292070388793945, "global_step": 19087, "epoch": 113} {"train_loss": -6.748796463012695, "global_step": 19088, "epoch": 113} {"train_loss": -6.555051803588867, "global_step": 19089, "epoch": 113} {"train_loss": -6.614575386047363, "global_step": 19090, "epoch": 113} {"train_loss": -6.787360191345215, "global_step": 19091, "epoch": 113} {"train_loss": -6.758028030395508, "global_step": 19092, "epoch": 113} {"train_loss": -6.55171537399292, "global_step": 19093, "epoch": 113} {"train_loss": -6.419198036193848, "global_step": 19094, "epoch": 113} {"train_loss": -6.619562149047852, "global_step": 19095, "epoch": 113} {"train_loss": -6.366498947143555, "global_step": 19096, "epoch": 113} {"train_loss": -6.479227066040039, "global_step": 19097, "epoch": 113} {"train_loss": -6.448490142822266, "global_step": 19098, "epoch": 113} {"train_loss": -6.801058769226074, "global_step": 19099, "epoch": 113} {"train_loss": -6.559938907623291, "global_step": 19100, "epoch": 113} {"train_loss": -6.6506547927856445, "global_step": 19101, "epoch": 113} {"train_loss": -6.8348588943481445, "global_step": 19102, "epoch": 113} {"train_loss": -6.568475723266602, "global_step": 19103, "epoch": 113} {"train_loss": -6.493093490600586, "global_step": 19104, "epoch": 113} {"train_loss": -6.671231269836426, "global_step": 19105, "epoch": 113} {"train_loss": -6.75400447845459, "global_step": 19106, "epoch": 113} {"train_loss": -6.4785261154174805, "global_step": 19107, "epoch": 113} {"train_loss": -6.826205730438232, "global_step": 19108, "epoch": 113} {"train_loss": -6.713657855987549, "global_step": 19109, "epoch": 113} {"train_loss": -6.462098121643066, "global_step": 19110, "epoch": 113} {"train_loss": -6.721097946166992, "global_step": 19111, "epoch": 113} {"train_loss": -6.584005355834961, "global_step": 19112, "epoch": 113} {"train_loss": -6.752605438232422, "global_step": 19113, "epoch": 113} {"train_loss": -6.7738447189331055, "global_step": 19114, "epoch": 113} {"train_loss": -7.016555309295654, "global_step": 19115, "epoch": 113} {"train_loss": -6.911450386047363, "global_step": 19116, "epoch": 113} {"train_loss": -7.022698402404785, "global_step": 19117, "epoch": 113} {"train_loss": -6.714969635009766, "global_step": 19118, "epoch": 113} {"train_loss": -6.838294982910156, "global_step": 19119, "epoch": 113} {"train_loss": -6.5788187980651855, "global_step": 19120, "epoch": 113} {"train_loss": -6.898850917816162, "global_step": 19121, "epoch": 113} {"train_loss": -6.90296745300293, "global_step": 19122, "epoch": 113} {"train_loss": -6.780418872833252, "global_step": 19123, "epoch": 113} {"train_loss": -6.8659868240356445, "global_step": 19124, "epoch": 113} {"train_loss": -6.725313186645508, "global_step": 19125, "epoch": 113} {"train_loss": -6.75327205657959, "global_step": 19126, "epoch": 113} {"train_loss": -6.668618202209473, "global_step": 19127, "epoch": 113} {"train_loss": -6.778230667114258, "global_step": 19128, "epoch": 113} {"train_loss": -6.830014228820801, "global_step": 19129, "epoch": 113} {"train_loss": -6.941991806030273, "global_step": 19130, "epoch": 113} {"train_loss": -6.744776725769043, "global_step": 19131, "epoch": 113} {"train_loss": -6.918267250061035, "global_step": 19132, "epoch": 113} {"train_loss": -6.881624221801758, "global_step": 19133, "epoch": 113} {"train_loss": -6.551454067230225, "global_step": 19134, "epoch": 113} {"train_loss": -6.666220188140869, "global_step": 19135, "epoch": 113} {"train_loss": -6.728558540344238, "global_step": 19136, "epoch": 113} {"train_loss": -6.993768215179443, "global_step": 19137, "epoch": 113} {"train_loss": -6.642648220062256, "global_step": 19138, "epoch": 113} {"train_loss": -7.027220726013184, "global_step": 19139, "epoch": 113} {"train_loss": -6.703771591186523, "global_step": 19140, "epoch": 113} {"train_loss": -6.49996280670166, "global_step": 19141, "epoch": 113} {"train_loss": -6.8011064529418945, "global_step": 19142, "epoch": 113} {"train_loss": -6.721124649047852, "global_step": 19143, "epoch": 113} {"train_loss": -6.751266002655029, "global_step": 19144, "epoch": 113} {"train_loss": -6.966498374938965, "global_step": 19145, "epoch": 113} {"train_loss": -6.7427849769592285, "global_step": 19146, "epoch": 113} {"train_loss": -6.991428375244141, "global_step": 19147, "epoch": 113} {"train_loss": -6.816290855407715, "global_step": 19148, "epoch": 113} {"train_loss": -6.594230651855469, "global_step": 19149, "epoch": 113} {"train_loss": -6.362473487854004, "global_step": 19150, "epoch": 113} {"train_loss": -6.675761344886961, "global_step": 19151, "epoch": 113, "val_loss": 220933.078125} {"train_loss": -6.507460594177246, "global_step": 19152, "epoch": 114} {"train_loss": -6.772359848022461, "global_step": 19153, "epoch": 114} {"train_loss": -6.560122489929199, "global_step": 19154, "epoch": 114} {"train_loss": -6.723768711090088, "global_step": 19155, "epoch": 114} {"train_loss": -6.640207767486572, "global_step": 19156, "epoch": 114} {"train_loss": -6.554275989532471, "global_step": 19157, "epoch": 114} {"train_loss": -6.628125190734863, "global_step": 19158, "epoch": 114} {"train_loss": -6.66411018371582, "global_step": 19159, "epoch": 114} {"train_loss": -6.684560775756836, "global_step": 19160, "epoch": 114} {"train_loss": -6.435111999511719, "global_step": 19161, "epoch": 114} {"train_loss": -6.311291694641113, "global_step": 19162, "epoch": 114} {"train_loss": -6.5334696769714355, "global_step": 19163, "epoch": 114} {"train_loss": -6.615579605102539, "global_step": 19164, "epoch": 114} {"train_loss": -6.567972183227539, "global_step": 19165, "epoch": 114} {"train_loss": -6.810284614562988, "global_step": 19166, "epoch": 114} {"train_loss": -6.642548561096191, "global_step": 19167, "epoch": 114} {"train_loss": -6.517594337463379, "global_step": 19168, "epoch": 114} {"train_loss": -6.266395092010498, "global_step": 19169, "epoch": 114} {"train_loss": -6.641798496246338, "global_step": 19170, "epoch": 114} {"train_loss": -6.672070503234863, "global_step": 19171, "epoch": 114} {"train_loss": -6.546951770782471, "global_step": 19172, "epoch": 114} {"train_loss": -6.394990921020508, "global_step": 19173, "epoch": 114} {"train_loss": -6.701977252960205, "global_step": 19174, "epoch": 114} {"train_loss": -6.811128616333008, "global_step": 19175, "epoch": 114} {"train_loss": -6.696481704711914, "global_step": 19176, "epoch": 114} {"train_loss": -6.784853935241699, "global_step": 19177, "epoch": 114} {"train_loss": -6.864538192749023, "global_step": 19178, "epoch": 114} {"train_loss": -6.60435676574707, "global_step": 19179, "epoch": 114} {"train_loss": -6.574365615844727, "global_step": 19180, "epoch": 114} {"train_loss": -6.844333648681641, "global_step": 19181, "epoch": 114} {"train_loss": -6.736883163452148, "global_step": 19182, "epoch": 114} {"train_loss": -6.765797138214111, "global_step": 19183, "epoch": 114} {"train_loss": -6.663302421569824, "global_step": 19184, "epoch": 114} {"train_loss": -6.633051872253418, "global_step": 19185, "epoch": 114} {"train_loss": -6.988915920257568, "global_step": 19186, "epoch": 114} {"train_loss": -6.809212684631348, "global_step": 19187, "epoch": 114} {"train_loss": -6.80354642868042, "global_step": 19188, "epoch": 114} {"train_loss": -6.662657737731934, "global_step": 19189, "epoch": 114} {"train_loss": -6.563447952270508, "global_step": 19190, "epoch": 114} {"train_loss": -6.462939739227295, "global_step": 19191, "epoch": 114} {"train_loss": -6.570492744445801, "global_step": 19192, "epoch": 114} {"train_loss": -6.532123565673828, "global_step": 19193, "epoch": 114} {"train_loss": -6.637385368347168, "global_step": 19194, "epoch": 114} {"train_loss": -6.670266151428223, "global_step": 19195, "epoch": 114} {"train_loss": -6.565023422241211, "global_step": 19196, "epoch": 114} {"train_loss": -6.448240756988525, "global_step": 19197, "epoch": 114} {"train_loss": -6.537027359008789, "global_step": 19198, "epoch": 114} {"train_loss": -6.784544467926025, "global_step": 19199, "epoch": 114} {"train_loss": -6.313920021057129, "global_step": 19200, "epoch": 114} {"train_loss": -6.4997944831848145, "global_step": 19201, "epoch": 114} {"train_loss": -6.693835258483887, "global_step": 19202, "epoch": 114} {"train_loss": -6.614563941955566, "global_step": 19203, "epoch": 114} {"train_loss": -6.556937217712402, "global_step": 19204, "epoch": 114} {"train_loss": -6.476734161376953, "global_step": 19205, "epoch": 114} {"train_loss": -6.576117038726807, "global_step": 19206, "epoch": 114} {"train_loss": -6.708856582641602, "global_step": 19207, "epoch": 114} {"train_loss": -6.746750831604004, "global_step": 19208, "epoch": 114} {"train_loss": -6.479061603546143, "global_step": 19209, "epoch": 114} {"train_loss": -6.809301376342773, "global_step": 19210, "epoch": 114} {"train_loss": -6.407291412353516, "global_step": 19211, "epoch": 114} {"train_loss": -6.455933570861816, "global_step": 19212, "epoch": 114} {"train_loss": -6.775413513183594, "global_step": 19213, "epoch": 114} {"train_loss": -6.886147499084473, "global_step": 19214, "epoch": 114} {"train_loss": -6.789283275604248, "global_step": 19215, "epoch": 114} {"train_loss": -6.834451675415039, "global_step": 19216, "epoch": 114} {"train_loss": -6.685443878173828, "global_step": 19217, "epoch": 114} {"train_loss": -6.801764965057373, "global_step": 19218, "epoch": 114} {"train_loss": -6.660528182983398, "global_step": 19219, "epoch": 114} {"train_loss": -6.6754560470581055, "global_step": 19220, "epoch": 114} {"train_loss": -6.528690338134766, "global_step": 19221, "epoch": 114} {"train_loss": -6.4387006759643555, "global_step": 19222, "epoch": 114} {"train_loss": -6.740809440612793, "global_step": 19223, "epoch": 114} {"train_loss": -6.636410236358643, "global_step": 19224, "epoch": 114} {"train_loss": -6.530816555023193, "global_step": 19225, "epoch": 114} {"train_loss": -6.627025604248047, "global_step": 19226, "epoch": 114} {"train_loss": -6.45613956451416, "global_step": 19227, "epoch": 114} {"train_loss": -6.528716087341309, "global_step": 19228, "epoch": 114} {"train_loss": -6.586385726928711, "global_step": 19229, "epoch": 114} {"train_loss": -6.668169975280762, "global_step": 19230, "epoch": 114} {"train_loss": -6.518946647644043, "global_step": 19231, "epoch": 114} {"train_loss": -6.3388142585754395, "global_step": 19232, "epoch": 114} {"train_loss": -6.458282470703125, "global_step": 19233, "epoch": 114} {"train_loss": -6.628126621246338, "global_step": 19234, "epoch": 114} {"train_loss": -6.585020065307617, "global_step": 19235, "epoch": 114} {"train_loss": -6.660454750061035, "global_step": 19236, "epoch": 114} {"train_loss": -6.592604637145996, "global_step": 19237, "epoch": 114} {"train_loss": -6.6304168701171875, "global_step": 19238, "epoch": 114} {"train_loss": -6.679080963134766, "global_step": 19239, "epoch": 114} {"train_loss": -6.258740425109863, "global_step": 19240, "epoch": 114} {"train_loss": -6.556689739227295, "global_step": 19241, "epoch": 114} {"train_loss": -6.5960235595703125, "global_step": 19242, "epoch": 114} {"train_loss": -6.660001754760742, "global_step": 19243, "epoch": 114} {"train_loss": -6.901761531829834, "global_step": 19244, "epoch": 114} {"train_loss": -6.635221481323242, "global_step": 19245, "epoch": 114} {"train_loss": -6.8041887283325195, "global_step": 19246, "epoch": 114} {"train_loss": -6.851963043212891, "global_step": 19247, "epoch": 114} {"train_loss": -6.659079074859619, "global_step": 19248, "epoch": 114} {"train_loss": -6.473233222961426, "global_step": 19249, "epoch": 114} {"train_loss": -6.6481733322143555, "global_step": 19250, "epoch": 114} {"train_loss": -6.701719760894775, "global_step": 19251, "epoch": 114} {"train_loss": -6.6234283447265625, "global_step": 19252, "epoch": 114} {"train_loss": -6.697951793670654, "global_step": 19253, "epoch": 114} {"train_loss": -6.846121788024902, "global_step": 19254, "epoch": 114} {"train_loss": -6.971253395080566, "global_step": 19255, "epoch": 114} {"train_loss": -6.887881278991699, "global_step": 19256, "epoch": 114} {"train_loss": -6.829416275024414, "global_step": 19257, "epoch": 114} {"train_loss": -6.833185195922852, "global_step": 19258, "epoch": 114} {"train_loss": -6.998525619506836, "global_step": 19259, "epoch": 114} {"train_loss": -6.839777946472168, "global_step": 19260, "epoch": 114} {"train_loss": -6.7111616134643555, "global_step": 19261, "epoch": 114} {"train_loss": -6.93760871887207, "global_step": 19262, "epoch": 114} {"train_loss": -6.662251949310303, "global_step": 19263, "epoch": 114} {"train_loss": -6.659556865692139, "global_step": 19264, "epoch": 114} {"train_loss": -6.69796895980835, "global_step": 19265, "epoch": 114} {"train_loss": -6.546261310577393, "global_step": 19266, "epoch": 114} {"train_loss": -6.793963432312012, "global_step": 19267, "epoch": 114} {"train_loss": -6.632329940795898, "global_step": 19268, "epoch": 114} {"train_loss": -6.747632026672363, "global_step": 19269, "epoch": 114} {"train_loss": -6.507136344909668, "global_step": 19270, "epoch": 114} {"train_loss": -6.713388442993164, "global_step": 19271, "epoch": 114} {"train_loss": -6.86777400970459, "global_step": 19272, "epoch": 114} {"train_loss": -6.9026780128479, "global_step": 19273, "epoch": 114} {"train_loss": -6.7807464599609375, "global_step": 19274, "epoch": 114} {"train_loss": -6.758396148681641, "global_step": 19275, "epoch": 114} {"train_loss": -6.805749416351318, "global_step": 19276, "epoch": 114} {"train_loss": -6.862470626831055, "global_step": 19277, "epoch": 114} {"train_loss": -6.597653388977051, "global_step": 19278, "epoch": 114} {"train_loss": -6.628972053527832, "global_step": 19279, "epoch": 114} {"train_loss": -6.830513954162598, "global_step": 19280, "epoch": 114} {"train_loss": -7.000419616699219, "global_step": 19281, "epoch": 114} {"train_loss": -6.694826602935791, "global_step": 19282, "epoch": 114} {"train_loss": -6.652037143707275, "global_step": 19283, "epoch": 114} {"train_loss": -6.625706672668457, "global_step": 19284, "epoch": 114} {"train_loss": -6.830872535705566, "global_step": 19285, "epoch": 114} {"train_loss": -6.761083126068115, "global_step": 19286, "epoch": 114} {"train_loss": -6.912941932678223, "global_step": 19287, "epoch": 114} {"train_loss": -6.46357536315918, "global_step": 19288, "epoch": 114} {"train_loss": -6.620025634765625, "global_step": 19289, "epoch": 114} {"train_loss": -6.696149826049805, "global_step": 19290, "epoch": 114} {"train_loss": -7.0072712898254395, "global_step": 19291, "epoch": 114} {"train_loss": -6.86954927444458, "global_step": 19292, "epoch": 114} {"train_loss": -6.848252296447754, "global_step": 19293, "epoch": 114} {"train_loss": -6.420903205871582, "global_step": 19294, "epoch": 114} {"train_loss": -6.929877281188965, "global_step": 19295, "epoch": 114} {"train_loss": -6.592545509338379, "global_step": 19296, "epoch": 114} {"train_loss": -6.61539363861084, "global_step": 19297, "epoch": 114} {"train_loss": -6.929367542266846, "global_step": 19298, "epoch": 114} {"train_loss": -6.533919811248779, "global_step": 19299, "epoch": 114} {"train_loss": -6.9273552894592285, "global_step": 19300, "epoch": 114} {"train_loss": -6.676595687866211, "global_step": 19301, "epoch": 114} {"train_loss": -6.744369983673096, "global_step": 19302, "epoch": 114} {"train_loss": -6.680555820465088, "global_step": 19303, "epoch": 114} {"train_loss": -6.845088958740234, "global_step": 19304, "epoch": 114} {"train_loss": -6.9223432540893555, "global_step": 19305, "epoch": 114} {"train_loss": -6.660588264465332, "global_step": 19306, "epoch": 114} {"train_loss": -6.797155857086182, "global_step": 19307, "epoch": 114} {"train_loss": -6.617863655090332, "global_step": 19308, "epoch": 114} {"train_loss": -6.855044841766357, "global_step": 19309, "epoch": 114} {"train_loss": -6.757272720336914, "global_step": 19310, "epoch": 114} {"train_loss": -6.742607116699219, "global_step": 19311, "epoch": 114} {"train_loss": -6.9615888595581055, "global_step": 19312, "epoch": 114} {"train_loss": -6.8301005363464355, "global_step": 19313, "epoch": 114} {"train_loss": -6.707199573516846, "global_step": 19314, "epoch": 114} {"train_loss": -6.993554592132568, "global_step": 19315, "epoch": 114} {"train_loss": -6.761068344116211, "global_step": 19316, "epoch": 114} {"train_loss": -6.443510055541992, "global_step": 19317, "epoch": 114} {"train_loss": -6.9730305671691895, "global_step": 19318, "epoch": 114} {"train_loss": -6.680342495441437, "global_step": 19319, "epoch": 114, "val_loss": 223014.15625} {"train_loss": -7.098371505737305, "global_step": 19320, "epoch": 115} {"train_loss": -6.774521827697754, "global_step": 19321, "epoch": 115} {"train_loss": -6.558358192443848, "global_step": 19322, "epoch": 115} {"train_loss": -6.94528865814209, "global_step": 19323, "epoch": 115} {"train_loss": -6.772453308105469, "global_step": 19324, "epoch": 115} {"train_loss": -6.863056182861328, "global_step": 19325, "epoch": 115} {"train_loss": -6.826090335845947, "global_step": 19326, "epoch": 115} {"train_loss": -6.931756019592285, "global_step": 19327, "epoch": 115} {"train_loss": -6.547720432281494, "global_step": 19328, "epoch": 115} {"train_loss": -6.8151984214782715, "global_step": 19329, "epoch": 115} {"train_loss": -6.666905403137207, "global_step": 19330, "epoch": 115} {"train_loss": -6.702093124389648, "global_step": 19331, "epoch": 115} {"train_loss": -6.5836968421936035, "global_step": 19332, "epoch": 115} {"train_loss": -6.736612319946289, "global_step": 19333, "epoch": 115} {"train_loss": -6.674372673034668, "global_step": 19334, "epoch": 115} {"train_loss": -6.482141494750977, "global_step": 19335, "epoch": 115} {"train_loss": -6.779321193695068, "global_step": 19336, "epoch": 115} {"train_loss": -6.592232704162598, "global_step": 19337, "epoch": 115} {"train_loss": -6.721362113952637, "global_step": 19338, "epoch": 115} {"train_loss": -6.656008720397949, "global_step": 19339, "epoch": 115} {"train_loss": -6.705596446990967, "global_step": 19340, "epoch": 115} {"train_loss": -6.732479095458984, "global_step": 19341, "epoch": 115} {"train_loss": -6.746679306030273, "global_step": 19342, "epoch": 115} {"train_loss": -6.667625427246094, "global_step": 19343, "epoch": 115} {"train_loss": -6.442869186401367, "global_step": 19344, "epoch": 115} {"train_loss": -6.666755676269531, "global_step": 19345, "epoch": 115} {"train_loss": -6.809391498565674, "global_step": 19346, "epoch": 115} {"train_loss": -6.5415239334106445, "global_step": 19347, "epoch": 115} {"train_loss": -6.676447868347168, "global_step": 19348, "epoch": 115} {"train_loss": -6.691115379333496, "global_step": 19349, "epoch": 115} {"train_loss": -6.6149821281433105, "global_step": 19350, "epoch": 115} {"train_loss": -6.840663909912109, "global_step": 19351, "epoch": 115} {"train_loss": -6.751567840576172, "global_step": 19352, "epoch": 115} {"train_loss": -6.698274612426758, "global_step": 19353, "epoch": 115} {"train_loss": -7.046316146850586, "global_step": 19354, "epoch": 115} {"train_loss": -6.870918273925781, "global_step": 19355, "epoch": 115} {"train_loss": -6.475114822387695, "global_step": 19356, "epoch": 115} {"train_loss": -6.84193229675293, "global_step": 19357, "epoch": 115} {"train_loss": -6.633518218994141, "global_step": 19358, "epoch": 115} {"train_loss": -6.890534400939941, "global_step": 19359, "epoch": 115} {"train_loss": -6.790195465087891, "global_step": 19360, "epoch": 115} {"train_loss": -6.699209213256836, "global_step": 19361, "epoch": 115} {"train_loss": -6.921814918518066, "global_step": 19362, "epoch": 115} {"train_loss": -6.72776460647583, "global_step": 19363, "epoch": 115} {"train_loss": -7.067293643951416, "global_step": 19364, "epoch": 115} {"train_loss": -6.578372955322266, "global_step": 19365, "epoch": 115} {"train_loss": -6.822457313537598, "global_step": 19366, "epoch": 115} {"train_loss": -6.774820327758789, "global_step": 19367, "epoch": 115} {"train_loss": -6.802408695220947, "global_step": 19368, "epoch": 115} {"train_loss": -6.884208679199219, "global_step": 19369, "epoch": 115} {"train_loss": -6.734151363372803, "global_step": 19370, "epoch": 115} {"train_loss": -6.787505149841309, "global_step": 19371, "epoch": 115} {"train_loss": -6.704680442810059, "global_step": 19372, "epoch": 115} {"train_loss": -6.810174942016602, "global_step": 19373, "epoch": 115} {"train_loss": -6.587580680847168, "global_step": 19374, "epoch": 115} {"train_loss": -6.7890238761901855, "global_step": 19375, "epoch": 115} {"train_loss": -6.439533233642578, "global_step": 19376, "epoch": 115} {"train_loss": -6.701992034912109, "global_step": 19377, "epoch": 115} {"train_loss": -6.5031352043151855, "global_step": 19378, "epoch": 115} {"train_loss": -6.744457244873047, "global_step": 19379, "epoch": 115} {"train_loss": -6.519692420959473, "global_step": 19380, "epoch": 115} {"train_loss": -6.906669616699219, "global_step": 19381, "epoch": 115} {"train_loss": -6.926191329956055, "global_step": 19382, "epoch": 115} {"train_loss": -6.812671184539795, "global_step": 19383, "epoch": 115} {"train_loss": -6.741261959075928, "global_step": 19384, "epoch": 115} {"train_loss": -6.588674068450928, "global_step": 19385, "epoch": 115} {"train_loss": -6.738112926483154, "global_step": 19386, "epoch": 115} {"train_loss": -6.873963356018066, "global_step": 19387, "epoch": 115} {"train_loss": -6.781044960021973, "global_step": 19388, "epoch": 115} {"train_loss": -6.654638767242432, "global_step": 19389, "epoch": 115} {"train_loss": -6.742513656616211, "global_step": 19390, "epoch": 115} {"train_loss": -6.587033748626709, "global_step": 19391, "epoch": 115} {"train_loss": -6.610060214996338, "global_step": 19392, "epoch": 115} {"train_loss": -6.688194274902344, "global_step": 19393, "epoch": 115} {"train_loss": -6.209225654602051, "global_step": 19394, "epoch": 115} {"train_loss": -6.772867202758789, "global_step": 19395, "epoch": 115} {"train_loss": -6.631056308746338, "global_step": 19396, "epoch": 115} {"train_loss": -6.640091896057129, "global_step": 19397, "epoch": 115} {"train_loss": -6.6053667068481445, "global_step": 19398, "epoch": 115} {"train_loss": -6.759458541870117, "global_step": 19399, "epoch": 115} {"train_loss": -6.756575584411621, "global_step": 19400, "epoch": 115} {"train_loss": -6.538632869720459, "global_step": 19401, "epoch": 115} {"train_loss": -6.666938304901123, "global_step": 19402, "epoch": 115} {"train_loss": -6.667189121246338, "global_step": 19403, "epoch": 115} {"train_loss": -6.584245204925537, "global_step": 19404, "epoch": 115} {"train_loss": -6.681035041809082, "global_step": 19405, "epoch": 115} {"train_loss": -6.473746299743652, "global_step": 19406, "epoch": 115} {"train_loss": -6.9812726974487305, "global_step": 19407, "epoch": 115} {"train_loss": -6.414753437042236, "global_step": 19408, "epoch": 115} {"train_loss": -6.316054344177246, "global_step": 19409, "epoch": 115} {"train_loss": -6.65079402923584, "global_step": 19410, "epoch": 115} {"train_loss": -6.593527793884277, "global_step": 19411, "epoch": 115} {"train_loss": -6.4479169845581055, "global_step": 19412, "epoch": 115} {"train_loss": -6.381716728210449, "global_step": 19413, "epoch": 115} {"train_loss": -6.772838115692139, "global_step": 19414, "epoch": 115} {"train_loss": -6.582415580749512, "global_step": 19415, "epoch": 115} {"train_loss": -6.743535995483398, "global_step": 19416, "epoch": 115} {"train_loss": -6.740556716918945, "global_step": 19417, "epoch": 115} {"train_loss": -6.561016082763672, "global_step": 19418, "epoch": 115} {"train_loss": -6.862675666809082, "global_step": 19419, "epoch": 115} {"train_loss": -6.789772033691406, "global_step": 19420, "epoch": 115} {"train_loss": -6.744545936584473, "global_step": 19421, "epoch": 115} {"train_loss": -6.599549770355225, "global_step": 19422, "epoch": 115} {"train_loss": -6.667980670928955, "global_step": 19423, "epoch": 115} {"train_loss": -6.742641448974609, "global_step": 19424, "epoch": 115} {"train_loss": -6.872898101806641, "global_step": 19425, "epoch": 115} {"train_loss": -6.613738059997559, "global_step": 19426, "epoch": 115} {"train_loss": -6.770005226135254, "global_step": 19427, "epoch": 115} {"train_loss": -6.782096862792969, "global_step": 19428, "epoch": 115} {"train_loss": -6.818652629852295, "global_step": 19429, "epoch": 115} {"train_loss": -6.915367126464844, "global_step": 19430, "epoch": 115} {"train_loss": -6.874603271484375, "global_step": 19431, "epoch": 115} {"train_loss": -6.883535861968994, "global_step": 19432, "epoch": 115} {"train_loss": -6.780484676361084, "global_step": 19433, "epoch": 115} {"train_loss": -6.931886672973633, "global_step": 19434, "epoch": 115} {"train_loss": -6.501520156860352, "global_step": 19435, "epoch": 115} {"train_loss": -6.915738105773926, "global_step": 19436, "epoch": 115} {"train_loss": -6.872026443481445, "global_step": 19437, "epoch": 115} {"train_loss": -7.068208694458008, "global_step": 19438, "epoch": 115} {"train_loss": -6.985723972320557, "global_step": 19439, "epoch": 115} {"train_loss": -6.844633102416992, "global_step": 19440, "epoch": 115} {"train_loss": -6.782125473022461, "global_step": 19441, "epoch": 115} {"train_loss": -6.7342987060546875, "global_step": 19442, "epoch": 115} {"train_loss": -6.815892696380615, "global_step": 19443, "epoch": 115} {"train_loss": -6.875494003295898, "global_step": 19444, "epoch": 115} {"train_loss": -6.846674919128418, "global_step": 19445, "epoch": 115} {"train_loss": -6.931037902832031, "global_step": 19446, "epoch": 115} {"train_loss": -6.680743217468262, "global_step": 19447, "epoch": 115} {"train_loss": -6.829460144042969, "global_step": 19448, "epoch": 115} {"train_loss": -6.750591278076172, "global_step": 19449, "epoch": 115} {"train_loss": -6.786563873291016, "global_step": 19450, "epoch": 115} {"train_loss": -6.700571060180664, "global_step": 19451, "epoch": 115} {"train_loss": -6.989893913269043, "global_step": 19452, "epoch": 115} {"train_loss": -6.720729827880859, "global_step": 19453, "epoch": 115} {"train_loss": -6.769352912902832, "global_step": 19454, "epoch": 115} {"train_loss": -6.695126056671143, "global_step": 19455, "epoch": 115} {"train_loss": -6.7885355949401855, "global_step": 19456, "epoch": 115} {"train_loss": -6.563527584075928, "global_step": 19457, "epoch": 115} {"train_loss": -6.671753406524658, "global_step": 19458, "epoch": 115} {"train_loss": -6.736737251281738, "global_step": 19459, "epoch": 115} {"train_loss": -6.769703388214111, "global_step": 19460, "epoch": 115} {"train_loss": -6.828563690185547, "global_step": 19461, "epoch": 115} {"train_loss": -6.6259050369262695, "global_step": 19462, "epoch": 115} {"train_loss": -6.698892593383789, "global_step": 19463, "epoch": 115} {"train_loss": -6.7733001708984375, "global_step": 19464, "epoch": 115} {"train_loss": -6.888097763061523, "global_step": 19465, "epoch": 115} {"train_loss": -6.676636695861816, "global_step": 19466, "epoch": 115} {"train_loss": -6.853407382965088, "global_step": 19467, "epoch": 115} {"train_loss": -6.818033218383789, "global_step": 19468, "epoch": 115} {"train_loss": -6.369306564331055, "global_step": 19469, "epoch": 115} {"train_loss": -6.755571365356445, "global_step": 19470, "epoch": 115} {"train_loss": -6.8266730308532715, "global_step": 19471, "epoch": 115} {"train_loss": -6.67966890335083, "global_step": 19472, "epoch": 115} {"train_loss": -6.32523250579834, "global_step": 19473, "epoch": 115} {"train_loss": -7.023867607116699, "global_step": 19474, "epoch": 115} {"train_loss": -6.95782470703125, "global_step": 19475, "epoch": 115} {"train_loss": -6.572535037994385, "global_step": 19476, "epoch": 115} {"train_loss": -6.653285980224609, "global_step": 19477, "epoch": 115} {"train_loss": -7.0391764640808105, "global_step": 19478, "epoch": 115} {"train_loss": -6.710799694061279, "global_step": 19479, "epoch": 115} {"train_loss": -6.759137153625488, "global_step": 19480, "epoch": 115} {"train_loss": -7.005366325378418, "global_step": 19481, "epoch": 115} {"train_loss": -6.675766944885254, "global_step": 19482, "epoch": 115} {"train_loss": -6.934320449829102, "global_step": 19483, "epoch": 115} {"train_loss": -6.865795135498047, "global_step": 19484, "epoch": 115} {"train_loss": -6.7830023765563965, "global_step": 19485, "epoch": 115} {"train_loss": -6.673435211181641, "global_step": 19486, "epoch": 115} {"train_loss": -6.7324356607028415, "global_step": 19487, "epoch": 115, "val_loss": 215465.171875, "train_action_mse_error": 21.615243911743164} {"train_loss": -6.522468566894531, "global_step": 19488, "epoch": 116} {"train_loss": -6.777706146240234, "global_step": 19489, "epoch": 116} {"train_loss": -6.87949275970459, "global_step": 19490, "epoch": 116} {"train_loss": -6.641966819763184, "global_step": 19491, "epoch": 116} {"train_loss": -6.878836631774902, "global_step": 19492, "epoch": 116} {"train_loss": -6.959424018859863, "global_step": 19493, "epoch": 116} {"train_loss": -6.760272979736328, "global_step": 19494, "epoch": 116} {"train_loss": -6.863295078277588, "global_step": 19495, "epoch": 116} {"train_loss": -6.634486198425293, "global_step": 19496, "epoch": 116} {"train_loss": -6.8264994621276855, "global_step": 19497, "epoch": 116} {"train_loss": -6.8087158203125, "global_step": 19498, "epoch": 116} {"train_loss": -7.171882629394531, "global_step": 19499, "epoch": 116} {"train_loss": -6.739716529846191, "global_step": 19500, "epoch": 116} {"train_loss": -6.942560195922852, "global_step": 19501, "epoch": 116} {"train_loss": -6.697517395019531, "global_step": 19502, "epoch": 116} {"train_loss": -6.771839141845703, "global_step": 19503, "epoch": 116} {"train_loss": -6.553740978240967, "global_step": 19504, "epoch": 116} {"train_loss": -6.757829666137695, "global_step": 19505, "epoch": 116} {"train_loss": -6.68256950378418, "global_step": 19506, "epoch": 116} {"train_loss": -6.913265228271484, "global_step": 19507, "epoch": 116} {"train_loss": -6.777629852294922, "global_step": 19508, "epoch": 116} {"train_loss": -6.911895275115967, "global_step": 19509, "epoch": 116} {"train_loss": -6.650261878967285, "global_step": 19510, "epoch": 116} {"train_loss": -6.6051025390625, "global_step": 19511, "epoch": 116} {"train_loss": -6.696926116943359, "global_step": 19512, "epoch": 116} {"train_loss": -6.745038986206055, "global_step": 19513, "epoch": 116} {"train_loss": -6.723187446594238, "global_step": 19514, "epoch": 116} {"train_loss": -6.772902488708496, "global_step": 19515, "epoch": 116} {"train_loss": -6.694053649902344, "global_step": 19516, "epoch": 116} {"train_loss": -6.888426780700684, "global_step": 19517, "epoch": 116} {"train_loss": -6.873313903808594, "global_step": 19518, "epoch": 116} {"train_loss": -6.832453727722168, "global_step": 19519, "epoch": 116} {"train_loss": -6.872000694274902, "global_step": 19520, "epoch": 116} {"train_loss": -6.439921855926514, "global_step": 19521, "epoch": 116} {"train_loss": -6.711203098297119, "global_step": 19522, "epoch": 116} {"train_loss": -6.809439659118652, "global_step": 19523, "epoch": 116} {"train_loss": -6.751991271972656, "global_step": 19524, "epoch": 116} {"train_loss": -6.833138465881348, "global_step": 19525, "epoch": 116} {"train_loss": -6.787609577178955, "global_step": 19526, "epoch": 116} {"train_loss": -6.632154941558838, "global_step": 19527, "epoch": 116} {"train_loss": -6.842574119567871, "global_step": 19528, "epoch": 116} {"train_loss": -6.881927490234375, "global_step": 19529, "epoch": 116} {"train_loss": -6.729321479797363, "global_step": 19530, "epoch": 116} {"train_loss": -6.7634782791137695, "global_step": 19531, "epoch": 116} {"train_loss": -6.6375932693481445, "global_step": 19532, "epoch": 116} {"train_loss": -6.812471866607666, "global_step": 19533, "epoch": 116} {"train_loss": -7.008552551269531, "global_step": 19534, "epoch": 116} {"train_loss": -6.7037577629089355, "global_step": 19535, "epoch": 116} {"train_loss": -6.730144500732422, "global_step": 19536, "epoch": 116} {"train_loss": -6.840091705322266, "global_step": 19537, "epoch": 116} {"train_loss": -6.801356315612793, "global_step": 19538, "epoch": 116} {"train_loss": -6.822941780090332, "global_step": 19539, "epoch": 116} {"train_loss": -6.568302154541016, "global_step": 19540, "epoch": 116} {"train_loss": -6.499565601348877, "global_step": 19541, "epoch": 116} {"train_loss": -6.448248386383057, "global_step": 19542, "epoch": 116} {"train_loss": -6.781852722167969, "global_step": 19543, "epoch": 116} {"train_loss": -6.7818217277526855, "global_step": 19544, "epoch": 116} {"train_loss": -6.699493885040283, "global_step": 19545, "epoch": 116} {"train_loss": -6.640910625457764, "global_step": 19546, "epoch": 116} {"train_loss": -6.753152847290039, "global_step": 19547, "epoch": 116} {"train_loss": -6.726271629333496, "global_step": 19548, "epoch": 116} {"train_loss": -6.639534950256348, "global_step": 19549, "epoch": 116} {"train_loss": -6.942354679107666, "global_step": 19550, "epoch": 116} {"train_loss": -7.038243770599365, "global_step": 19551, "epoch": 116} {"train_loss": -6.735934257507324, "global_step": 19552, "epoch": 116} {"train_loss": -6.793153762817383, "global_step": 19553, "epoch": 116} {"train_loss": -6.634016036987305, "global_step": 19554, "epoch": 116} {"train_loss": -6.9033331871032715, "global_step": 19555, "epoch": 116} {"train_loss": -6.760313987731934, "global_step": 19556, "epoch": 116} {"train_loss": -6.551787853240967, "global_step": 19557, "epoch": 116} {"train_loss": -6.664569854736328, "global_step": 19558, "epoch": 116} {"train_loss": -6.741271018981934, "global_step": 19559, "epoch": 116} {"train_loss": -6.612586975097656, "global_step": 19560, "epoch": 116} {"train_loss": -6.558467864990234, "global_step": 19561, "epoch": 116} {"train_loss": -6.5920491218566895, "global_step": 19562, "epoch": 116} {"train_loss": -6.529163837432861, "global_step": 19563, "epoch": 116} {"train_loss": -6.77349853515625, "global_step": 19564, "epoch": 116} {"train_loss": -6.726792335510254, "global_step": 19565, "epoch": 116} {"train_loss": -6.571073055267334, "global_step": 19566, "epoch": 116} {"train_loss": -6.757480621337891, "global_step": 19567, "epoch": 116} {"train_loss": -6.68733024597168, "global_step": 19568, "epoch": 116} {"train_loss": -6.72637939453125, "global_step": 19569, "epoch": 116} {"train_loss": -6.503924369812012, "global_step": 19570, "epoch": 116} {"train_loss": -6.589186191558838, "global_step": 19571, "epoch": 116} {"train_loss": -6.9086527824401855, "global_step": 19572, "epoch": 116} {"train_loss": -6.907475471496582, "global_step": 19573, "epoch": 116} {"train_loss": -6.996773719787598, "global_step": 19574, "epoch": 116} {"train_loss": -6.947257041931152, "global_step": 19575, "epoch": 116} {"train_loss": -6.933128356933594, "global_step": 19576, "epoch": 116} {"train_loss": -6.858660697937012, "global_step": 19577, "epoch": 116} {"train_loss": -6.539460182189941, "global_step": 19578, "epoch": 116} {"train_loss": -6.752354621887207, "global_step": 19579, "epoch": 116} {"train_loss": -6.806285858154297, "global_step": 19580, "epoch": 116} {"train_loss": -6.737296104431152, "global_step": 19581, "epoch": 116} {"train_loss": -6.854663848876953, "global_step": 19582, "epoch": 116} {"train_loss": -6.455537796020508, "global_step": 19583, "epoch": 116} {"train_loss": -6.771268844604492, "global_step": 19584, "epoch": 116} {"train_loss": -6.7561540603637695, "global_step": 19585, "epoch": 116} {"train_loss": -6.709770202636719, "global_step": 19586, "epoch": 116} {"train_loss": -6.530365467071533, "global_step": 19587, "epoch": 116} {"train_loss": -6.720231056213379, "global_step": 19588, "epoch": 116} {"train_loss": -6.865365028381348, "global_step": 19589, "epoch": 116} {"train_loss": -6.56902551651001, "global_step": 19590, "epoch": 116} {"train_loss": -6.755943298339844, "global_step": 19591, "epoch": 116} {"train_loss": -7.012879848480225, "global_step": 19592, "epoch": 116} {"train_loss": -6.858124732971191, "global_step": 19593, "epoch": 116} {"train_loss": -6.7516770362854, "global_step": 19594, "epoch": 116} {"train_loss": -7.008245468139648, "global_step": 19595, "epoch": 116} {"train_loss": -6.734368801116943, "global_step": 19596, "epoch": 116} {"train_loss": -6.838047027587891, "global_step": 19597, "epoch": 116} {"train_loss": -6.924617290496826, "global_step": 19598, "epoch": 116} {"train_loss": -6.886080741882324, "global_step": 19599, "epoch": 116} {"train_loss": -6.744736671447754, "global_step": 19600, "epoch": 116} {"train_loss": -6.802655220031738, "global_step": 19601, "epoch": 116} {"train_loss": -6.7845563888549805, "global_step": 19602, "epoch": 116} {"train_loss": -6.903208255767822, "global_step": 19603, "epoch": 116} {"train_loss": -6.489021301269531, "global_step": 19604, "epoch": 116} {"train_loss": -6.614119052886963, "global_step": 19605, "epoch": 116} {"train_loss": -6.870748996734619, "global_step": 19606, "epoch": 116} {"train_loss": -6.78082275390625, "global_step": 19607, "epoch": 116} {"train_loss": -6.7175750732421875, "global_step": 19608, "epoch": 116} {"train_loss": -6.663248062133789, "global_step": 19609, "epoch": 116} {"train_loss": -6.566033363342285, "global_step": 19610, "epoch": 116} {"train_loss": -7.034010887145996, "global_step": 19611, "epoch": 116} {"train_loss": -6.947155952453613, "global_step": 19612, "epoch": 116} {"train_loss": -6.968987464904785, "global_step": 19613, "epoch": 116} {"train_loss": -6.8723649978637695, "global_step": 19614, "epoch": 116} {"train_loss": -6.9509477615356445, "global_step": 19615, "epoch": 116} {"train_loss": -6.791354656219482, "global_step": 19616, "epoch": 116} {"train_loss": -6.639744758605957, "global_step": 19617, "epoch": 116} {"train_loss": -6.96600341796875, "global_step": 19618, "epoch": 116} {"train_loss": -6.832388877868652, "global_step": 19619, "epoch": 116} {"train_loss": -6.896947860717773, "global_step": 19620, "epoch": 116} {"train_loss": -6.492986679077148, "global_step": 19621, "epoch": 116} {"train_loss": -6.70632791519165, "global_step": 19622, "epoch": 116} {"train_loss": -6.6460065841674805, "global_step": 19623, "epoch": 116} {"train_loss": -6.648656845092773, "global_step": 19624, "epoch": 116} {"train_loss": -6.8205108642578125, "global_step": 19625, "epoch": 116} {"train_loss": -6.763998031616211, "global_step": 19626, "epoch": 116} {"train_loss": -6.968714237213135, "global_step": 19627, "epoch": 116} {"train_loss": -6.896852970123291, "global_step": 19628, "epoch": 116} {"train_loss": -6.8508453369140625, "global_step": 19629, "epoch": 116} {"train_loss": -6.951282501220703, "global_step": 19630, "epoch": 116} {"train_loss": -7.07113790512085, "global_step": 19631, "epoch": 116} {"train_loss": -6.7151947021484375, "global_step": 19632, "epoch": 116} {"train_loss": -6.831070899963379, "global_step": 19633, "epoch": 116} {"train_loss": -6.798415660858154, "global_step": 19634, "epoch": 116} {"train_loss": -6.721155166625977, "global_step": 19635, "epoch": 116} {"train_loss": -6.765550136566162, "global_step": 19636, "epoch": 116} {"train_loss": -6.6087141036987305, "global_step": 19637, "epoch": 116} {"train_loss": -7.006959438323975, "global_step": 19638, "epoch": 116} {"train_loss": -6.783731460571289, "global_step": 19639, "epoch": 116} {"train_loss": -6.9305419921875, "global_step": 19640, "epoch": 116} {"train_loss": -6.738121032714844, "global_step": 19641, "epoch": 116} {"train_loss": -6.8752241134643555, "global_step": 19642, "epoch": 116} {"train_loss": -7.156789302825928, "global_step": 19643, "epoch": 116} {"train_loss": -7.08792781829834, "global_step": 19644, "epoch": 116} {"train_loss": -6.868927955627441, "global_step": 19645, "epoch": 116} {"train_loss": -6.865049362182617, "global_step": 19646, "epoch": 116} {"train_loss": -6.838322639465332, "global_step": 19647, "epoch": 116} {"train_loss": -6.792725086212158, "global_step": 19648, "epoch": 116} {"train_loss": -6.911172389984131, "global_step": 19649, "epoch": 116} {"train_loss": -6.969112873077393, "global_step": 19650, "epoch": 116} {"train_loss": -6.813198089599609, "global_step": 19651, "epoch": 116} {"train_loss": -6.937585830688477, "global_step": 19652, "epoch": 116} {"train_loss": -6.654016494750977, "global_step": 19653, "epoch": 116} {"train_loss": -6.834290504455566, "global_step": 19654, "epoch": 116} {"train_loss": -6.779546828497024, "global_step": 19655, "epoch": 116, "val_loss": 220403.453125} {"train_loss": -6.991687774658203, "global_step": 19656, "epoch": 117} {"train_loss": -6.629214763641357, "global_step": 19657, "epoch": 117} {"train_loss": -6.7468342781066895, "global_step": 19658, "epoch": 117} {"train_loss": -6.909640312194824, "global_step": 19659, "epoch": 117} {"train_loss": -6.809966087341309, "global_step": 19660, "epoch": 117} {"train_loss": -6.734126091003418, "global_step": 19661, "epoch": 117} {"train_loss": -6.852245330810547, "global_step": 19662, "epoch": 117} {"train_loss": -7.07964563369751, "global_step": 19663, "epoch": 117} {"train_loss": -6.962435722351074, "global_step": 19664, "epoch": 117} {"train_loss": -6.886343002319336, "global_step": 19665, "epoch": 117} {"train_loss": -6.472966194152832, "global_step": 19666, "epoch": 117} {"train_loss": -6.753060817718506, "global_step": 19667, "epoch": 117} {"train_loss": -6.832932949066162, "global_step": 19668, "epoch": 117} {"train_loss": -6.689726829528809, "global_step": 19669, "epoch": 117} {"train_loss": -6.716282844543457, "global_step": 19670, "epoch": 117} {"train_loss": -6.665637016296387, "global_step": 19671, "epoch": 117} {"train_loss": -6.5637969970703125, "global_step": 19672, "epoch": 117} {"train_loss": -6.616932392120361, "global_step": 19673, "epoch": 117} {"train_loss": -6.565377235412598, "global_step": 19674, "epoch": 117} {"train_loss": -6.760631561279297, "global_step": 19675, "epoch": 117} {"train_loss": -6.641822814941406, "global_step": 19676, "epoch": 117} {"train_loss": -6.775129795074463, "global_step": 19677, "epoch": 117} {"train_loss": -6.789863109588623, "global_step": 19678, "epoch": 117} {"train_loss": -6.666938304901123, "global_step": 19679, "epoch": 117} {"train_loss": -6.6788177490234375, "global_step": 19680, "epoch": 117} {"train_loss": -6.983987808227539, "global_step": 19681, "epoch": 117} {"train_loss": -6.8297929763793945, "global_step": 19682, "epoch": 117} {"train_loss": -6.727090358734131, "global_step": 19683, "epoch": 117} {"train_loss": -6.822011470794678, "global_step": 19684, "epoch": 117} {"train_loss": -6.825516700744629, "global_step": 19685, "epoch": 117} {"train_loss": -6.582679748535156, "global_step": 19686, "epoch": 117} {"train_loss": -6.718108177185059, "global_step": 19687, "epoch": 117} {"train_loss": -7.098142623901367, "global_step": 19688, "epoch": 117} {"train_loss": -6.599400997161865, "global_step": 19689, "epoch": 117} {"train_loss": -6.9023895263671875, "global_step": 19690, "epoch": 117} {"train_loss": -6.661467552185059, "global_step": 19691, "epoch": 117} {"train_loss": -6.687103748321533, "global_step": 19692, "epoch": 117} {"train_loss": -6.720985412597656, "global_step": 19693, "epoch": 117} {"train_loss": -6.731832981109619, "global_step": 19694, "epoch": 117} {"train_loss": -6.5960564613342285, "global_step": 19695, "epoch": 117} {"train_loss": -6.9900617599487305, "global_step": 19696, "epoch": 117} {"train_loss": -6.881917953491211, "global_step": 19697, "epoch": 117} {"train_loss": -6.655452728271484, "global_step": 19698, "epoch": 117} {"train_loss": -7.09998893737793, "global_step": 19699, "epoch": 117} {"train_loss": -6.975325107574463, "global_step": 19700, "epoch": 117} {"train_loss": -6.961373805999756, "global_step": 19701, "epoch": 117} {"train_loss": -6.869405269622803, "global_step": 19702, "epoch": 117} {"train_loss": -6.864681243896484, "global_step": 19703, "epoch": 117} {"train_loss": -6.93721342086792, "global_step": 19704, "epoch": 117} {"train_loss": -6.665388584136963, "global_step": 19705, "epoch": 117} {"train_loss": -7.069772243499756, "global_step": 19706, "epoch": 117} {"train_loss": -6.652149200439453, "global_step": 19707, "epoch": 117} {"train_loss": -6.740426063537598, "global_step": 19708, "epoch": 117} {"train_loss": -6.97269344329834, "global_step": 19709, "epoch": 117} {"train_loss": -6.834040641784668, "global_step": 19710, "epoch": 117} {"train_loss": -6.743400573730469, "global_step": 19711, "epoch": 117} {"train_loss": -7.043213367462158, "global_step": 19712, "epoch": 117} {"train_loss": -6.831788539886475, "global_step": 19713, "epoch": 117} {"train_loss": -6.756887435913086, "global_step": 19714, "epoch": 117} {"train_loss": -6.944748878479004, "global_step": 19715, "epoch": 117} {"train_loss": -6.940315246582031, "global_step": 19716, "epoch": 117} {"train_loss": -6.769410610198975, "global_step": 19717, "epoch": 117} {"train_loss": -6.907130241394043, "global_step": 19718, "epoch": 117} {"train_loss": -6.834697723388672, "global_step": 19719, "epoch": 117} {"train_loss": -6.7488484382629395, "global_step": 19720, "epoch": 117} {"train_loss": -6.885133743286133, "global_step": 19721, "epoch": 117} {"train_loss": -6.849425315856934, "global_step": 19722, "epoch": 117} {"train_loss": -6.733312129974365, "global_step": 19723, "epoch": 117} {"train_loss": -6.715878486633301, "global_step": 19724, "epoch": 117} {"train_loss": -6.832775115966797, "global_step": 19725, "epoch": 117} {"train_loss": -6.9195942878723145, "global_step": 19726, "epoch": 117} {"train_loss": -6.593408584594727, "global_step": 19727, "epoch": 117} {"train_loss": -6.525430679321289, "global_step": 19728, "epoch": 117} {"train_loss": -7.097261905670166, "global_step": 19729, "epoch": 117} {"train_loss": -6.864898681640625, "global_step": 19730, "epoch": 117} {"train_loss": -6.747988224029541, "global_step": 19731, "epoch": 117} {"train_loss": -6.75008487701416, "global_step": 19732, "epoch": 117} {"train_loss": -6.921398162841797, "global_step": 19733, "epoch": 117} {"train_loss": -6.754374027252197, "global_step": 19734, "epoch": 117} {"train_loss": -6.542396068572998, "global_step": 19735, "epoch": 117} {"train_loss": -6.775526523590088, "global_step": 19736, "epoch": 117} {"train_loss": -6.625300407409668, "global_step": 19737, "epoch": 117} {"train_loss": -7.013384819030762, "global_step": 19738, "epoch": 117} {"train_loss": -6.836390495300293, "global_step": 19739, "epoch": 117} {"train_loss": -6.638706684112549, "global_step": 19740, "epoch": 117} {"train_loss": -6.738141059875488, "global_step": 19741, "epoch": 117} {"train_loss": -6.933257579803467, "global_step": 19742, "epoch": 117} {"train_loss": -6.779499053955078, "global_step": 19743, "epoch": 117} {"train_loss": -6.793947219848633, "global_step": 19744, "epoch": 117} {"train_loss": -6.800004482269287, "global_step": 19745, "epoch": 117} {"train_loss": -6.9618682861328125, "global_step": 19746, "epoch": 117} {"train_loss": -6.638071537017822, "global_step": 19747, "epoch": 117} {"train_loss": -6.578385353088379, "global_step": 19748, "epoch": 117} {"train_loss": -6.50042200088501, "global_step": 19749, "epoch": 117} {"train_loss": -6.550257205963135, "global_step": 19750, "epoch": 117} {"train_loss": -6.605193138122559, "global_step": 19751, "epoch": 117} {"train_loss": -6.522557258605957, "global_step": 19752, "epoch": 117} {"train_loss": -6.889797687530518, "global_step": 19753, "epoch": 117} {"train_loss": -6.391091346740723, "global_step": 19754, "epoch": 117} {"train_loss": -6.624063968658447, "global_step": 19755, "epoch": 117} {"train_loss": -6.796770095825195, "global_step": 19756, "epoch": 117} {"train_loss": -6.599658012390137, "global_step": 19757, "epoch": 117} {"train_loss": -6.5962066650390625, "global_step": 19758, "epoch": 117} {"train_loss": -6.478540420532227, "global_step": 19759, "epoch": 117} {"train_loss": -6.616036415100098, "global_step": 19760, "epoch": 117} {"train_loss": -6.834637641906738, "global_step": 19761, "epoch": 117} {"train_loss": -6.815420150756836, "global_step": 19762, "epoch": 117} {"train_loss": -6.764265060424805, "global_step": 19763, "epoch": 117} {"train_loss": -6.531041622161865, "global_step": 19764, "epoch": 117} {"train_loss": -6.596574783325195, "global_step": 19765, "epoch": 117} {"train_loss": -6.818968772888184, "global_step": 19766, "epoch": 117} {"train_loss": -6.565958023071289, "global_step": 19767, "epoch": 117} {"train_loss": -6.692849636077881, "global_step": 19768, "epoch": 117} {"train_loss": -6.745990753173828, "global_step": 19769, "epoch": 117} {"train_loss": -6.735759258270264, "global_step": 19770, "epoch": 117} {"train_loss": -6.695343971252441, "global_step": 19771, "epoch": 117} {"train_loss": -6.728145122528076, "global_step": 19772, "epoch": 117} {"train_loss": -6.849511623382568, "global_step": 19773, "epoch": 117} {"train_loss": -6.860879898071289, "global_step": 19774, "epoch": 117} {"train_loss": -6.7781548500061035, "global_step": 19775, "epoch": 117} {"train_loss": -6.912102222442627, "global_step": 19776, "epoch": 117} {"train_loss": -6.79445219039917, "global_step": 19777, "epoch": 117} {"train_loss": -6.8483686447143555, "global_step": 19778, "epoch": 117} {"train_loss": -6.800974369049072, "global_step": 19779, "epoch": 117} {"train_loss": -6.964593887329102, "global_step": 19780, "epoch": 117} {"train_loss": -6.978911399841309, "global_step": 19781, "epoch": 117} {"train_loss": -6.687162399291992, "global_step": 19782, "epoch": 117} {"train_loss": -6.892132759094238, "global_step": 19783, "epoch": 117} {"train_loss": -6.58185338973999, "global_step": 19784, "epoch": 117} {"train_loss": -6.901988983154297, "global_step": 19785, "epoch": 117} {"train_loss": -6.696218967437744, "global_step": 19786, "epoch": 117} {"train_loss": -6.857041835784912, "global_step": 19787, "epoch": 117} {"train_loss": -6.380682945251465, "global_step": 19788, "epoch": 117} {"train_loss": -6.8855390548706055, "global_step": 19789, "epoch": 117} {"train_loss": -6.69972038269043, "global_step": 19790, "epoch": 117} {"train_loss": -6.470884323120117, "global_step": 19791, "epoch": 117} {"train_loss": -6.508801460266113, "global_step": 19792, "epoch": 117} {"train_loss": -6.139704704284668, "global_step": 19793, "epoch": 117} {"train_loss": -6.876062393188477, "global_step": 19794, "epoch": 117} {"train_loss": -6.735544204711914, "global_step": 19795, "epoch": 117} {"train_loss": -6.709073543548584, "global_step": 19796, "epoch": 117} {"train_loss": -6.62364387512207, "global_step": 19797, "epoch": 117} {"train_loss": -6.309473991394043, "global_step": 19798, "epoch": 117} {"train_loss": -6.77679443359375, "global_step": 19799, "epoch": 117} {"train_loss": -6.737088203430176, "global_step": 19800, "epoch": 117} {"train_loss": -6.2854766845703125, "global_step": 19801, "epoch": 117} {"train_loss": -6.559603214263916, "global_step": 19802, "epoch": 117} {"train_loss": -6.628328323364258, "global_step": 19803, "epoch": 117} {"train_loss": -6.456112861633301, "global_step": 19804, "epoch": 117} {"train_loss": -6.452446937561035, "global_step": 19805, "epoch": 117} {"train_loss": -6.760403156280518, "global_step": 19806, "epoch": 117} {"train_loss": -6.605574131011963, "global_step": 19807, "epoch": 117} {"train_loss": -6.583939552307129, "global_step": 19808, "epoch": 117} {"train_loss": -6.497506141662598, "global_step": 19809, "epoch": 117} {"train_loss": -6.610223293304443, "global_step": 19810, "epoch": 117} {"train_loss": -6.671831130981445, "global_step": 19811, "epoch": 117} {"train_loss": -6.589951515197754, "global_step": 19812, "epoch": 117} {"train_loss": -6.9544172286987305, "global_step": 19813, "epoch": 117} {"train_loss": -7.041939735412598, "global_step": 19814, "epoch": 117} {"train_loss": -6.666730880737305, "global_step": 19815, "epoch": 117} {"train_loss": -6.83564567565918, "global_step": 19816, "epoch": 117} {"train_loss": -6.649361610412598, "global_step": 19817, "epoch": 117} {"train_loss": -6.718578815460205, "global_step": 19818, "epoch": 117} {"train_loss": -6.845447063446045, "global_step": 19819, "epoch": 117} {"train_loss": -6.803539752960205, "global_step": 19820, "epoch": 117} {"train_loss": -6.868450164794922, "global_step": 19821, "epoch": 117} {"train_loss": -6.576537132263184, "global_step": 19822, "epoch": 117} {"train_loss": -6.746211886405945, "global_step": 19823, "epoch": 117, "val_loss": 218335.171875} {"train_loss": -6.882905006408691, "global_step": 19824, "epoch": 118} {"train_loss": -6.871631145477295, "global_step": 19825, "epoch": 118} {"train_loss": -6.935583114624023, "global_step": 19826, "epoch": 118} {"train_loss": -6.787588119506836, "global_step": 19827, "epoch": 118} {"train_loss": -6.794907569885254, "global_step": 19828, "epoch": 118} {"train_loss": -6.675408363342285, "global_step": 19829, "epoch": 118} {"train_loss": -6.829839706420898, "global_step": 19830, "epoch": 118} {"train_loss": -6.554293632507324, "global_step": 19831, "epoch": 118} {"train_loss": -6.512625694274902, "global_step": 19832, "epoch": 118} {"train_loss": -6.444367408752441, "global_step": 19833, "epoch": 118} {"train_loss": -6.566269397735596, "global_step": 19834, "epoch": 118} {"train_loss": -6.407851219177246, "global_step": 19835, "epoch": 118} {"train_loss": -6.684725761413574, "global_step": 19836, "epoch": 118} {"train_loss": -6.495748519897461, "global_step": 19837, "epoch": 118} {"train_loss": -6.5165557861328125, "global_step": 19838, "epoch": 118} {"train_loss": -6.580949783325195, "global_step": 19839, "epoch": 118} {"train_loss": -6.520931243896484, "global_step": 19840, "epoch": 118} {"train_loss": -6.519488334655762, "global_step": 19841, "epoch": 118} {"train_loss": -6.732181549072266, "global_step": 19842, "epoch": 118} {"train_loss": -6.4999237060546875, "global_step": 19843, "epoch": 118} {"train_loss": -6.935986518859863, "global_step": 19844, "epoch": 118} {"train_loss": -6.7552385330200195, "global_step": 19845, "epoch": 118} {"train_loss": -6.752865791320801, "global_step": 19846, "epoch": 118} {"train_loss": -6.9977707862854, "global_step": 19847, "epoch": 118} {"train_loss": -6.800397872924805, "global_step": 19848, "epoch": 118} {"train_loss": -6.862954139709473, "global_step": 19849, "epoch": 118} {"train_loss": -6.845395088195801, "global_step": 19850, "epoch": 118} {"train_loss": -6.754735946655273, "global_step": 19851, "epoch": 118} {"train_loss": -6.8609819412231445, "global_step": 19852, "epoch": 118} {"train_loss": -6.87898063659668, "global_step": 19853, "epoch": 118} {"train_loss": -6.881833076477051, "global_step": 19854, "epoch": 118} {"train_loss": -6.769742012023926, "global_step": 19855, "epoch": 118} {"train_loss": -6.816961288452148, "global_step": 19856, "epoch": 118} {"train_loss": -6.629226207733154, "global_step": 19857, "epoch": 118} {"train_loss": -6.850245475769043, "global_step": 19858, "epoch": 118} {"train_loss": -6.803210735321045, "global_step": 19859, "epoch": 118} {"train_loss": -6.862020015716553, "global_step": 19860, "epoch": 118} {"train_loss": -6.631379127502441, "global_step": 19861, "epoch": 118} {"train_loss": -6.804438591003418, "global_step": 19862, "epoch": 118} {"train_loss": -7.035761833190918, "global_step": 19863, "epoch": 118} {"train_loss": -6.627805709838867, "global_step": 19864, "epoch": 118} {"train_loss": -6.877169132232666, "global_step": 19865, "epoch": 118} {"train_loss": -6.515040397644043, "global_step": 19866, "epoch": 118} {"train_loss": -6.796786308288574, "global_step": 19867, "epoch": 118} {"train_loss": -6.914979934692383, "global_step": 19868, "epoch": 118} {"train_loss": -6.7835164070129395, "global_step": 19869, "epoch": 118} {"train_loss": -6.763715744018555, "global_step": 19870, "epoch": 118} {"train_loss": -6.791240692138672, "global_step": 19871, "epoch": 118} {"train_loss": -7.0885820388793945, "global_step": 19872, "epoch": 118} {"train_loss": -7.064854145050049, "global_step": 19873, "epoch": 118} {"train_loss": -6.520921230316162, "global_step": 19874, "epoch": 118} {"train_loss": -6.823531150817871, "global_step": 19875, "epoch": 118} {"train_loss": -6.829136848449707, "global_step": 19876, "epoch": 118} {"train_loss": -6.928893089294434, "global_step": 19877, "epoch": 118} {"train_loss": -6.934228897094727, "global_step": 19878, "epoch": 118} {"train_loss": -6.780912399291992, "global_step": 19879, "epoch": 118} {"train_loss": -6.737099647521973, "global_step": 19880, "epoch": 118} {"train_loss": -6.6443328857421875, "global_step": 19881, "epoch": 118} {"train_loss": -6.830679893493652, "global_step": 19882, "epoch": 118} {"train_loss": -6.737944602966309, "global_step": 19883, "epoch": 118} {"train_loss": -6.711514949798584, "global_step": 19884, "epoch": 118} {"train_loss": -6.845235347747803, "global_step": 19885, "epoch": 118} {"train_loss": -6.7324934005737305, "global_step": 19886, "epoch": 118} {"train_loss": -6.692408561706543, "global_step": 19887, "epoch": 118} {"train_loss": -6.799221515655518, "global_step": 19888, "epoch": 118} {"train_loss": -6.69992208480835, "global_step": 19889, "epoch": 118} {"train_loss": -6.632364273071289, "global_step": 19890, "epoch": 118} {"train_loss": -6.544832229614258, "global_step": 19891, "epoch": 118} {"train_loss": -6.655455589294434, "global_step": 19892, "epoch": 118} {"train_loss": -6.757635116577148, "global_step": 19893, "epoch": 118} {"train_loss": -6.719621181488037, "global_step": 19894, "epoch": 118} {"train_loss": -6.595798492431641, "global_step": 19895, "epoch": 118} {"train_loss": -6.671586990356445, "global_step": 19896, "epoch": 118} {"train_loss": -6.7524261474609375, "global_step": 19897, "epoch": 118} {"train_loss": -6.728676795959473, "global_step": 19898, "epoch": 118} {"train_loss": -6.481305122375488, "global_step": 19899, "epoch": 118} {"train_loss": -6.6399383544921875, "global_step": 19900, "epoch": 118} {"train_loss": -6.851614952087402, "global_step": 19901, "epoch": 118} {"train_loss": -6.640784740447998, "global_step": 19902, "epoch": 118} {"train_loss": -6.75045108795166, "global_step": 19903, "epoch": 118} {"train_loss": -6.653694152832031, "global_step": 19904, "epoch": 118} {"train_loss": -6.559510231018066, "global_step": 19905, "epoch": 118} {"train_loss": -6.739384651184082, "global_step": 19906, "epoch": 118} {"train_loss": -6.697663307189941, "global_step": 19907, "epoch": 118} {"train_loss": -6.8184309005737305, "global_step": 19908, "epoch": 118} {"train_loss": -6.776833534240723, "global_step": 19909, "epoch": 118} {"train_loss": -6.801084518432617, "global_step": 19910, "epoch": 118} {"train_loss": -6.8772172927856445, "global_step": 19911, "epoch": 118} {"train_loss": -6.875988006591797, "global_step": 19912, "epoch": 118} {"train_loss": -6.949569225311279, "global_step": 19913, "epoch": 118} {"train_loss": -6.5221405029296875, "global_step": 19914, "epoch": 118} {"train_loss": -6.959883213043213, "global_step": 19915, "epoch": 118} {"train_loss": -6.641374588012695, "global_step": 19916, "epoch": 118} {"train_loss": -6.926836013793945, "global_step": 19917, "epoch": 118} {"train_loss": -6.801651954650879, "global_step": 19918, "epoch": 118} {"train_loss": -6.62020206451416, "global_step": 19919, "epoch": 118} {"train_loss": -6.717869281768799, "global_step": 19920, "epoch": 118} {"train_loss": -6.577469825744629, "global_step": 19921, "epoch": 118} {"train_loss": -6.893313884735107, "global_step": 19922, "epoch": 118} {"train_loss": -7.0187177658081055, "global_step": 19923, "epoch": 118} {"train_loss": -6.781622409820557, "global_step": 19924, "epoch": 118} {"train_loss": -6.853996276855469, "global_step": 19925, "epoch": 118} {"train_loss": -6.713731288909912, "global_step": 19926, "epoch": 118} {"train_loss": -6.8570709228515625, "global_step": 19927, "epoch": 118} {"train_loss": -6.691199779510498, "global_step": 19928, "epoch": 118} {"train_loss": -6.936103820800781, "global_step": 19929, "epoch": 118} {"train_loss": -7.052748680114746, "global_step": 19930, "epoch": 118} {"train_loss": -7.040119171142578, "global_step": 19931, "epoch": 118} {"train_loss": -6.732661247253418, "global_step": 19932, "epoch": 118} {"train_loss": -7.0830841064453125, "global_step": 19933, "epoch": 118} {"train_loss": -6.493991851806641, "global_step": 19934, "epoch": 118} {"train_loss": -6.9007768630981445, "global_step": 19935, "epoch": 118} {"train_loss": -6.79481315612793, "global_step": 19936, "epoch": 118} {"train_loss": -6.876134872436523, "global_step": 19937, "epoch": 118} {"train_loss": -6.923282623291016, "global_step": 19938, "epoch": 118} {"train_loss": -6.710237503051758, "global_step": 19939, "epoch": 118} {"train_loss": -6.740052700042725, "global_step": 19940, "epoch": 118} {"train_loss": -6.847752571105957, "global_step": 19941, "epoch": 118} {"train_loss": -6.725223541259766, "global_step": 19942, "epoch": 118} {"train_loss": -6.888667106628418, "global_step": 19943, "epoch": 118} {"train_loss": -6.9445037841796875, "global_step": 19944, "epoch": 118} {"train_loss": -6.885651111602783, "global_step": 19945, "epoch": 118} {"train_loss": -6.766087532043457, "global_step": 19946, "epoch": 118} {"train_loss": -6.878927230834961, "global_step": 19947, "epoch": 118} {"train_loss": -6.840221405029297, "global_step": 19948, "epoch": 118} {"train_loss": -6.908929824829102, "global_step": 19949, "epoch": 118} {"train_loss": -6.855836868286133, "global_step": 19950, "epoch": 118} {"train_loss": -7.047079563140869, "global_step": 19951, "epoch": 118} {"train_loss": -7.071814060211182, "global_step": 19952, "epoch": 118} {"train_loss": -7.058967113494873, "global_step": 19953, "epoch": 118} {"train_loss": -6.8987274169921875, "global_step": 19954, "epoch": 118} {"train_loss": -7.044104099273682, "global_step": 19955, "epoch": 118} {"train_loss": -7.099075794219971, "global_step": 19956, "epoch": 118} {"train_loss": -6.867740631103516, "global_step": 19957, "epoch": 118} {"train_loss": -6.948298931121826, "global_step": 19958, "epoch": 118} {"train_loss": -6.7024030685424805, "global_step": 19959, "epoch": 118} {"train_loss": -7.020151615142822, "global_step": 19960, "epoch": 118} {"train_loss": -6.641459941864014, "global_step": 19961, "epoch": 118} {"train_loss": -7.173101425170898, "global_step": 19962, "epoch": 118} {"train_loss": -7.025933265686035, "global_step": 19963, "epoch": 118} {"train_loss": -7.040023326873779, "global_step": 19964, "epoch": 118} {"train_loss": -6.889735221862793, "global_step": 19965, "epoch": 118} {"train_loss": -6.650297164916992, "global_step": 19966, "epoch": 118} {"train_loss": -6.890132427215576, "global_step": 19967, "epoch": 118} {"train_loss": -7.073142051696777, "global_step": 19968, "epoch": 118} {"train_loss": -6.914619445800781, "global_step": 19969, "epoch": 118} {"train_loss": -6.900346279144287, "global_step": 19970, "epoch": 118} {"train_loss": -6.639713764190674, "global_step": 19971, "epoch": 118} {"train_loss": -6.885835647583008, "global_step": 19972, "epoch": 118} {"train_loss": -6.879749298095703, "global_step": 19973, "epoch": 118} {"train_loss": -6.856717109680176, "global_step": 19974, "epoch": 118} {"train_loss": -6.4321722984313965, "global_step": 19975, "epoch": 118} {"train_loss": -6.992159843444824, "global_step": 19976, "epoch": 118} {"train_loss": -6.301014423370361, "global_step": 19977, "epoch": 118} {"train_loss": -6.638467788696289, "global_step": 19978, "epoch": 118} {"train_loss": -6.8854827880859375, "global_step": 19979, "epoch": 118} {"train_loss": -6.743615627288818, "global_step": 19980, "epoch": 118} {"train_loss": -6.731233596801758, "global_step": 19981, "epoch": 118} {"train_loss": -6.416799545288086, "global_step": 19982, "epoch": 118} {"train_loss": -6.805383682250977, "global_step": 19983, "epoch": 118} {"train_loss": -6.35307502746582, "global_step": 19984, "epoch": 118} {"train_loss": -6.619952201843262, "global_step": 19985, "epoch": 118} {"train_loss": -6.849505424499512, "global_step": 19986, "epoch": 118} {"train_loss": -6.722872257232666, "global_step": 19987, "epoch": 118} {"train_loss": -6.82254695892334, "global_step": 19988, "epoch": 118} {"train_loss": -6.534435272216797, "global_step": 19989, "epoch": 118} {"train_loss": -6.804598808288574, "global_step": 19990, "epoch": 118} {"train_loss": -6.77997624874115, "global_step": 19991, "epoch": 118, "val_loss": 216317.625} {"train_loss": -6.794987201690674, "global_step": 19992, "epoch": 119} {"train_loss": -6.94869327545166, "global_step": 19993, "epoch": 119} {"train_loss": -6.872130393981934, "global_step": 19994, "epoch": 119} {"train_loss": -6.6650872230529785, "global_step": 19995, "epoch": 119} {"train_loss": -6.747378349304199, "global_step": 19996, "epoch": 119} {"train_loss": -6.804610252380371, "global_step": 19997, "epoch": 119} {"train_loss": -6.086949348449707, "global_step": 19998, "epoch": 119} {"train_loss": -6.683264255523682, "global_step": 19999, "epoch": 119} {"train_loss": -6.696620941162109, "global_step": 20000, "epoch": 119} {"train_loss": -6.636549472808838, "global_step": 20001, "epoch": 119} {"train_loss": -6.529250621795654, "global_step": 20002, "epoch": 119} {"train_loss": -6.365532875061035, "global_step": 20003, "epoch": 119} {"train_loss": -7.1038055419921875, "global_step": 20004, "epoch": 119} {"train_loss": -6.632122039794922, "global_step": 20005, "epoch": 119} {"train_loss": -6.463732719421387, "global_step": 20006, "epoch": 119} {"train_loss": -6.70587158203125, "global_step": 20007, "epoch": 119} {"train_loss": -6.678997993469238, "global_step": 20008, "epoch": 119} {"train_loss": -6.73048210144043, "global_step": 20009, "epoch": 119} {"train_loss": -6.71978759765625, "global_step": 20010, "epoch": 119} {"train_loss": -6.849740028381348, "global_step": 20011, "epoch": 119} {"train_loss": -6.872533321380615, "global_step": 20012, "epoch": 119} {"train_loss": -6.724506378173828, "global_step": 20013, "epoch": 119} {"train_loss": -6.5973405838012695, "global_step": 20014, "epoch": 119} {"train_loss": -6.929256439208984, "global_step": 20015, "epoch": 119} {"train_loss": -6.646026611328125, "global_step": 20016, "epoch": 119} {"train_loss": -6.843690872192383, "global_step": 20017, "epoch": 119} {"train_loss": -6.952602863311768, "global_step": 20018, "epoch": 119} {"train_loss": -6.851019859313965, "global_step": 20019, "epoch": 119} {"train_loss": -6.912845611572266, "global_step": 20020, "epoch": 119} {"train_loss": -6.960699558258057, "global_step": 20021, "epoch": 119} {"train_loss": -6.838976860046387, "global_step": 20022, "epoch": 119} {"train_loss": -7.12508487701416, "global_step": 20023, "epoch": 119} {"train_loss": -7.036213397979736, "global_step": 20024, "epoch": 119} {"train_loss": -6.6010212898254395, "global_step": 20025, "epoch": 119} {"train_loss": -6.943730354309082, "global_step": 20026, "epoch": 119} {"train_loss": -6.9598164558410645, "global_step": 20027, "epoch": 119} {"train_loss": -7.07009220123291, "global_step": 20028, "epoch": 119} {"train_loss": -7.05107307434082, "global_step": 20029, "epoch": 119} {"train_loss": -6.942138671875, "global_step": 20030, "epoch": 119} {"train_loss": -6.8699259757995605, "global_step": 20031, "epoch": 119} {"train_loss": -6.8195624351501465, "global_step": 20032, "epoch": 119} {"train_loss": -7.004875659942627, "global_step": 20033, "epoch": 119} {"train_loss": -7.127788066864014, "global_step": 20034, "epoch": 119} {"train_loss": -6.938874244689941, "global_step": 20035, "epoch": 119} {"train_loss": -6.922904014587402, "global_step": 20036, "epoch": 119} {"train_loss": -6.776297569274902, "global_step": 20037, "epoch": 119} {"train_loss": -6.924290657043457, "global_step": 20038, "epoch": 119} {"train_loss": -6.994988918304443, "global_step": 20039, "epoch": 119} {"train_loss": -6.911772727966309, "global_step": 20040, "epoch": 119} {"train_loss": -7.054123878479004, "global_step": 20041, "epoch": 119} {"train_loss": -6.778317928314209, "global_step": 20042, "epoch": 119} {"train_loss": -6.9460835456848145, "global_step": 20043, "epoch": 119} {"train_loss": -6.946244716644287, "global_step": 20044, "epoch": 119} {"train_loss": -7.014501571655273, "global_step": 20045, "epoch": 119} {"train_loss": -6.8788251876831055, "global_step": 20046, "epoch": 119} {"train_loss": -6.745518684387207, "global_step": 20047, "epoch": 119} {"train_loss": -6.838095664978027, "global_step": 20048, "epoch": 119} {"train_loss": -6.690883636474609, "global_step": 20049, "epoch": 119} {"train_loss": -6.705367565155029, "global_step": 20050, "epoch": 119} {"train_loss": -6.628538608551025, "global_step": 20051, "epoch": 119} {"train_loss": -6.744172096252441, "global_step": 20052, "epoch": 119} {"train_loss": -6.431892395019531, "global_step": 20053, "epoch": 119} {"train_loss": -6.765366554260254, "global_step": 20054, "epoch": 119} {"train_loss": -6.596683502197266, "global_step": 20055, "epoch": 119} {"train_loss": -6.68632698059082, "global_step": 20056, "epoch": 119} {"train_loss": -6.4665069580078125, "global_step": 20057, "epoch": 119} {"train_loss": -6.819530010223389, "global_step": 20058, "epoch": 119} {"train_loss": -6.611091136932373, "global_step": 20059, "epoch": 119} {"train_loss": -6.726165771484375, "global_step": 20060, "epoch": 119} {"train_loss": -6.560577392578125, "global_step": 20061, "epoch": 119} {"train_loss": -6.627997398376465, "global_step": 20062, "epoch": 119} {"train_loss": -7.00654935836792, "global_step": 20063, "epoch": 119} {"train_loss": -6.704564094543457, "global_step": 20064, "epoch": 119} {"train_loss": -6.488332271575928, "global_step": 20065, "epoch": 119} {"train_loss": -6.5919342041015625, "global_step": 20066, "epoch": 119} {"train_loss": -6.449851989746094, "global_step": 20067, "epoch": 119} {"train_loss": -6.683494567871094, "global_step": 20068, "epoch": 119} {"train_loss": -6.704647064208984, "global_step": 20069, "epoch": 119} {"train_loss": -6.873335838317871, "global_step": 20070, "epoch": 119} {"train_loss": -6.681205749511719, "global_step": 20071, "epoch": 119} {"train_loss": -6.853128910064697, "global_step": 20072, "epoch": 119} {"train_loss": -6.965366840362549, "global_step": 20073, "epoch": 119} {"train_loss": -7.049317359924316, "global_step": 20074, "epoch": 119} {"train_loss": -6.705306529998779, "global_step": 20075, "epoch": 119} {"train_loss": -6.84480619430542, "global_step": 20076, "epoch": 119} {"train_loss": -7.007319450378418, "global_step": 20077, "epoch": 119} {"train_loss": -6.908613204956055, "global_step": 20078, "epoch": 119} {"train_loss": -7.224090576171875, "global_step": 20079, "epoch": 119} {"train_loss": -7.068795204162598, "global_step": 20080, "epoch": 119} {"train_loss": -6.843086242675781, "global_step": 20081, "epoch": 119} {"train_loss": -6.967134475708008, "global_step": 20082, "epoch": 119} {"train_loss": -6.969901084899902, "global_step": 20083, "epoch": 119} {"train_loss": -6.874782562255859, "global_step": 20084, "epoch": 119} {"train_loss": -6.894576072692871, "global_step": 20085, "epoch": 119} {"train_loss": -6.580543518066406, "global_step": 20086, "epoch": 119} {"train_loss": -6.971320152282715, "global_step": 20087, "epoch": 119} {"train_loss": -6.832842826843262, "global_step": 20088, "epoch": 119} {"train_loss": -6.6577887535095215, "global_step": 20089, "epoch": 119} {"train_loss": -6.884974956512451, "global_step": 20090, "epoch": 119} {"train_loss": -6.844164848327637, "global_step": 20091, "epoch": 119} {"train_loss": -6.6635589599609375, "global_step": 20092, "epoch": 119} {"train_loss": -6.544447898864746, "global_step": 20093, "epoch": 119} {"train_loss": -6.729247093200684, "global_step": 20094, "epoch": 119} {"train_loss": -6.524043560028076, "global_step": 20095, "epoch": 119} {"train_loss": -6.517453193664551, "global_step": 20096, "epoch": 119} {"train_loss": -6.476137638092041, "global_step": 20097, "epoch": 119} {"train_loss": -6.503654479980469, "global_step": 20098, "epoch": 119} {"train_loss": -6.667690753936768, "global_step": 20099, "epoch": 119} {"train_loss": -6.460827350616455, "global_step": 20100, "epoch": 119} {"train_loss": -6.5902605056762695, "global_step": 20101, "epoch": 119} {"train_loss": -6.6014628410339355, "global_step": 20102, "epoch": 119} {"train_loss": -6.672785758972168, "global_step": 20103, "epoch": 119} {"train_loss": -6.5675554275512695, "global_step": 20104, "epoch": 119} {"train_loss": -6.649864196777344, "global_step": 20105, "epoch": 119} {"train_loss": -6.742281436920166, "global_step": 20106, "epoch": 119} {"train_loss": -6.668465614318848, "global_step": 20107, "epoch": 119} {"train_loss": -6.73262357711792, "global_step": 20108, "epoch": 119} {"train_loss": -6.589801788330078, "global_step": 20109, "epoch": 119} {"train_loss": -6.827301025390625, "global_step": 20110, "epoch": 119} {"train_loss": -6.7547407150268555, "global_step": 20111, "epoch": 119} {"train_loss": -6.860149383544922, "global_step": 20112, "epoch": 119} {"train_loss": -6.830508232116699, "global_step": 20113, "epoch": 119} {"train_loss": -6.768722057342529, "global_step": 20114, "epoch": 119} {"train_loss": -6.756838798522949, "global_step": 20115, "epoch": 119} {"train_loss": -6.772211074829102, "global_step": 20116, "epoch": 119} {"train_loss": -6.8515167236328125, "global_step": 20117, "epoch": 119} {"train_loss": -6.601142883300781, "global_step": 20118, "epoch": 119} {"train_loss": -6.993494987487793, "global_step": 20119, "epoch": 119} {"train_loss": -6.862881660461426, "global_step": 20120, "epoch": 119} {"train_loss": -6.7867889404296875, "global_step": 20121, "epoch": 119} {"train_loss": -6.881626129150391, "global_step": 20122, "epoch": 119} {"train_loss": -6.900165557861328, "global_step": 20123, "epoch": 119} {"train_loss": -6.960299968719482, "global_step": 20124, "epoch": 119} {"train_loss": -6.65136194229126, "global_step": 20125, "epoch": 119} {"train_loss": -6.767561912536621, "global_step": 20126, "epoch": 119} {"train_loss": -6.800152778625488, "global_step": 20127, "epoch": 119} {"train_loss": -6.850407600402832, "global_step": 20128, "epoch": 119} {"train_loss": -6.898550033569336, "global_step": 20129, "epoch": 119} {"train_loss": -6.441840648651123, "global_step": 20130, "epoch": 119} {"train_loss": -6.788028240203857, "global_step": 20131, "epoch": 119} {"train_loss": -6.94858455657959, "global_step": 20132, "epoch": 119} {"train_loss": -6.647093772888184, "global_step": 20133, "epoch": 119} {"train_loss": -6.645604133605957, "global_step": 20134, "epoch": 119} {"train_loss": -6.956602096557617, "global_step": 20135, "epoch": 119} {"train_loss": -6.714832782745361, "global_step": 20136, "epoch": 119} {"train_loss": -6.548320770263672, "global_step": 20137, "epoch": 119} {"train_loss": -7.058945655822754, "global_step": 20138, "epoch": 119} {"train_loss": -6.827061653137207, "global_step": 20139, "epoch": 119} {"train_loss": -7.049901485443115, "global_step": 20140, "epoch": 119} {"train_loss": -6.79436731338501, "global_step": 20141, "epoch": 119} {"train_loss": -6.843941688537598, "global_step": 20142, "epoch": 119} {"train_loss": -6.903057098388672, "global_step": 20143, "epoch": 119} {"train_loss": -6.981779098510742, "global_step": 20144, "epoch": 119} {"train_loss": -6.82962703704834, "global_step": 20145, "epoch": 119} {"train_loss": -6.964715003967285, "global_step": 20146, "epoch": 119} {"train_loss": -6.7139458656311035, "global_step": 20147, "epoch": 119} {"train_loss": -7.004144668579102, "global_step": 20148, "epoch": 119} {"train_loss": -6.612129211425781, "global_step": 20149, "epoch": 119} {"train_loss": -7.116605758666992, "global_step": 20150, "epoch": 119} {"train_loss": -6.885796546936035, "global_step": 20151, "epoch": 119} {"train_loss": -6.853498935699463, "global_step": 20152, "epoch": 119} {"train_loss": -6.793968200683594, "global_step": 20153, "epoch": 119} {"train_loss": -6.875823497772217, "global_step": 20154, "epoch": 119} {"train_loss": -6.915900230407715, "global_step": 20155, "epoch": 119} {"train_loss": -7.040525436401367, "global_step": 20156, "epoch": 119} {"train_loss": -7.291051864624023, "global_step": 20157, "epoch": 119} {"train_loss": -6.839963912963867, "global_step": 20158, "epoch": 119} {"train_loss": -6.793706207048325, "global_step": 20159, "epoch": 119, "val_loss": 216056.65625} {"train_loss": -7.0025634765625, "global_step": 20160, "epoch": 120} {"train_loss": -7.12367582321167, "global_step": 20161, "epoch": 120} {"train_loss": -6.98970365524292, "global_step": 20162, "epoch": 120} {"train_loss": -7.06223201751709, "global_step": 20163, "epoch": 120} {"train_loss": -6.8821563720703125, "global_step": 20164, "epoch": 120} {"train_loss": -6.7696733474731445, "global_step": 20165, "epoch": 120} {"train_loss": -6.576077938079834, "global_step": 20166, "epoch": 120} {"train_loss": -7.019864082336426, "global_step": 20167, "epoch": 120} {"train_loss": -7.03698205947876, "global_step": 20168, "epoch": 120} {"train_loss": -6.726256370544434, "global_step": 20169, "epoch": 120} {"train_loss": -6.957203388214111, "global_step": 20170, "epoch": 120} {"train_loss": -6.8176398277282715, "global_step": 20171, "epoch": 120} {"train_loss": -7.0313568115234375, "global_step": 20172, "epoch": 120} {"train_loss": -6.813836097717285, "global_step": 20173, "epoch": 120} {"train_loss": -6.710756778717041, "global_step": 20174, "epoch": 120} {"train_loss": -6.940397262573242, "global_step": 20175, "epoch": 120} {"train_loss": -6.634526252746582, "global_step": 20176, "epoch": 120} {"train_loss": -6.907535552978516, "global_step": 20177, "epoch": 120} {"train_loss": -6.620478630065918, "global_step": 20178, "epoch": 120} {"train_loss": -6.764649868011475, "global_step": 20179, "epoch": 120} {"train_loss": -6.566418647766113, "global_step": 20180, "epoch": 120} {"train_loss": -6.785730361938477, "global_step": 20181, "epoch": 120} {"train_loss": -6.7316179275512695, "global_step": 20182, "epoch": 120} {"train_loss": -6.964686393737793, "global_step": 20183, "epoch": 120} {"train_loss": -6.940603733062744, "global_step": 20184, "epoch": 120} {"train_loss": -6.796075820922852, "global_step": 20185, "epoch": 120} {"train_loss": -6.773385047912598, "global_step": 20186, "epoch": 120} {"train_loss": -6.850194931030273, "global_step": 20187, "epoch": 120} {"train_loss": -6.9149370193481445, "global_step": 20188, "epoch": 120} {"train_loss": -6.790780067443848, "global_step": 20189, "epoch": 120} {"train_loss": -6.973687648773193, "global_step": 20190, "epoch": 120} {"train_loss": -6.834907054901123, "global_step": 20191, "epoch": 120} {"train_loss": -6.9936628341674805, "global_step": 20192, "epoch": 120} {"train_loss": -6.8511152267456055, "global_step": 20193, "epoch": 120} {"train_loss": -6.928894519805908, "global_step": 20194, "epoch": 120} {"train_loss": -6.8409905433654785, "global_step": 20195, "epoch": 120} {"train_loss": -6.936034202575684, "global_step": 20196, "epoch": 120} {"train_loss": -6.913359642028809, "global_step": 20197, "epoch": 120} {"train_loss": -7.11992073059082, "global_step": 20198, "epoch": 120} {"train_loss": -6.750507831573486, "global_step": 20199, "epoch": 120} {"train_loss": -6.890962600708008, "global_step": 20200, "epoch": 120} {"train_loss": -6.754308700561523, "global_step": 20201, "epoch": 120} {"train_loss": -7.004996299743652, "global_step": 20202, "epoch": 120} {"train_loss": -6.719233512878418, "global_step": 20203, "epoch": 120} {"train_loss": -6.808497428894043, "global_step": 20204, "epoch": 120} {"train_loss": -6.670499801635742, "global_step": 20205, "epoch": 120} {"train_loss": -6.809426307678223, "global_step": 20206, "epoch": 120} {"train_loss": -6.614113807678223, "global_step": 20207, "epoch": 120} {"train_loss": -6.688087463378906, "global_step": 20208, "epoch": 120} {"train_loss": -6.876988410949707, "global_step": 20209, "epoch": 120} {"train_loss": -6.698017597198486, "global_step": 20210, "epoch": 120} {"train_loss": -6.879575252532959, "global_step": 20211, "epoch": 120} {"train_loss": -7.017683982849121, "global_step": 20212, "epoch": 120} {"train_loss": -6.8813982009887695, "global_step": 20213, "epoch": 120} {"train_loss": -6.6145477294921875, "global_step": 20214, "epoch": 120} {"train_loss": -6.7179412841796875, "global_step": 20215, "epoch": 120} {"train_loss": -6.713343620300293, "global_step": 20216, "epoch": 120} {"train_loss": -6.592791557312012, "global_step": 20217, "epoch": 120} {"train_loss": -6.846947193145752, "global_step": 20218, "epoch": 120} {"train_loss": -6.756246566772461, "global_step": 20219, "epoch": 120} {"train_loss": -6.840025424957275, "global_step": 20220, "epoch": 120} {"train_loss": -6.753378391265869, "global_step": 20221, "epoch": 120} {"train_loss": -6.806131362915039, "global_step": 20222, "epoch": 120} {"train_loss": -6.74995231628418, "global_step": 20223, "epoch": 120} {"train_loss": -7.042680740356445, "global_step": 20224, "epoch": 120} {"train_loss": -6.771844863891602, "global_step": 20225, "epoch": 120} {"train_loss": -6.943234920501709, "global_step": 20226, "epoch": 120} {"train_loss": -6.672359943389893, "global_step": 20227, "epoch": 120} {"train_loss": -6.519791126251221, "global_step": 20228, "epoch": 120} {"train_loss": -6.860411167144775, "global_step": 20229, "epoch": 120} {"train_loss": -6.621488571166992, "global_step": 20230, "epoch": 120} {"train_loss": -6.9147233963012695, "global_step": 20231, "epoch": 120} {"train_loss": -6.758070945739746, "global_step": 20232, "epoch": 120} {"train_loss": -6.807854175567627, "global_step": 20233, "epoch": 120} {"train_loss": -6.817020416259766, "global_step": 20234, "epoch": 120} {"train_loss": -6.507399559020996, "global_step": 20235, "epoch": 120} {"train_loss": -6.609508514404297, "global_step": 20236, "epoch": 120} {"train_loss": -6.701348304748535, "global_step": 20237, "epoch": 120} {"train_loss": -6.822996616363525, "global_step": 20238, "epoch": 120} {"train_loss": -6.734651565551758, "global_step": 20239, "epoch": 120} {"train_loss": -6.685521125793457, "global_step": 20240, "epoch": 120} {"train_loss": -6.825044631958008, "global_step": 20241, "epoch": 120} {"train_loss": -6.728351593017578, "global_step": 20242, "epoch": 120} {"train_loss": -6.695472240447998, "global_step": 20243, "epoch": 120} {"train_loss": -6.85118293762207, "global_step": 20244, "epoch": 120} {"train_loss": -6.98077392578125, "global_step": 20245, "epoch": 120} {"train_loss": -6.917410373687744, "global_step": 20246, "epoch": 120} {"train_loss": -6.96733283996582, "global_step": 20247, "epoch": 120} {"train_loss": -6.56083869934082, "global_step": 20248, "epoch": 120} {"train_loss": -6.910665035247803, "global_step": 20249, "epoch": 120} {"train_loss": -6.559902191162109, "global_step": 20250, "epoch": 120} {"train_loss": -6.653751373291016, "global_step": 20251, "epoch": 120} {"train_loss": -6.755883693695068, "global_step": 20252, "epoch": 120} {"train_loss": -6.760481357574463, "global_step": 20253, "epoch": 120} {"train_loss": -6.816612243652344, "global_step": 20254, "epoch": 120} {"train_loss": -6.582046031951904, "global_step": 20255, "epoch": 120} {"train_loss": -6.823025703430176, "global_step": 20256, "epoch": 120} {"train_loss": -7.011990070343018, "global_step": 20257, "epoch": 120} {"train_loss": -6.669673919677734, "global_step": 20258, "epoch": 120} {"train_loss": -6.898586273193359, "global_step": 20259, "epoch": 120} {"train_loss": -7.0123443603515625, "global_step": 20260, "epoch": 120} {"train_loss": -6.836164474487305, "global_step": 20261, "epoch": 120} {"train_loss": -6.9533185958862305, "global_step": 20262, "epoch": 120} {"train_loss": -6.644591331481934, "global_step": 20263, "epoch": 120} {"train_loss": -6.862676620483398, "global_step": 20264, "epoch": 120} {"train_loss": -6.908699989318848, "global_step": 20265, "epoch": 120} {"train_loss": -6.966306686401367, "global_step": 20266, "epoch": 120} {"train_loss": -6.836933135986328, "global_step": 20267, "epoch": 120} {"train_loss": -6.881389617919922, "global_step": 20268, "epoch": 120} {"train_loss": -6.85609245300293, "global_step": 20269, "epoch": 120} {"train_loss": -6.833902835845947, "global_step": 20270, "epoch": 120} {"train_loss": -6.820271968841553, "global_step": 20271, "epoch": 120} {"train_loss": -6.961321830749512, "global_step": 20272, "epoch": 120} {"train_loss": -7.082693099975586, "global_step": 20273, "epoch": 120} {"train_loss": -6.913288116455078, "global_step": 20274, "epoch": 120} {"train_loss": -7.0421953201293945, "global_step": 20275, "epoch": 120} {"train_loss": -6.6054158210754395, "global_step": 20276, "epoch": 120} {"train_loss": -7.009402275085449, "global_step": 20277, "epoch": 120} {"train_loss": -6.30430793762207, "global_step": 20278, "epoch": 120} {"train_loss": -6.88758659362793, "global_step": 20279, "epoch": 120} {"train_loss": -6.437558650970459, "global_step": 20280, "epoch": 120} {"train_loss": -6.572858810424805, "global_step": 20281, "epoch": 120} {"train_loss": -6.585182189941406, "global_step": 20282, "epoch": 120} {"train_loss": -6.45161247253418, "global_step": 20283, "epoch": 120} {"train_loss": -6.325399875640869, "global_step": 20284, "epoch": 120} {"train_loss": -6.74766731262207, "global_step": 20285, "epoch": 120} {"train_loss": -6.593564033508301, "global_step": 20286, "epoch": 120} {"train_loss": -7.013472080230713, "global_step": 20287, "epoch": 120} {"train_loss": -6.716619491577148, "global_step": 20288, "epoch": 120} {"train_loss": -6.676003932952881, "global_step": 20289, "epoch": 120} {"train_loss": -6.781425476074219, "global_step": 20290, "epoch": 120} {"train_loss": -6.748159408569336, "global_step": 20291, "epoch": 120} {"train_loss": -6.733027458190918, "global_step": 20292, "epoch": 120} {"train_loss": -6.899572849273682, "global_step": 20293, "epoch": 120} {"train_loss": -6.616273403167725, "global_step": 20294, "epoch": 120} {"train_loss": -6.840015411376953, "global_step": 20295, "epoch": 120} {"train_loss": -6.827540874481201, "global_step": 20296, "epoch": 120} {"train_loss": -6.84025239944458, "global_step": 20297, "epoch": 120} {"train_loss": -6.8882293701171875, "global_step": 20298, "epoch": 120} {"train_loss": -6.8162431716918945, "global_step": 20299, "epoch": 120} {"train_loss": -6.988221645355225, "global_step": 20300, "epoch": 120} {"train_loss": -6.999041557312012, "global_step": 20301, "epoch": 120} {"train_loss": -6.935148239135742, "global_step": 20302, "epoch": 120} {"train_loss": -6.910728454589844, "global_step": 20303, "epoch": 120} {"train_loss": -7.092076301574707, "global_step": 20304, "epoch": 120} {"train_loss": -6.841087341308594, "global_step": 20305, "epoch": 120} {"train_loss": -6.918522834777832, "global_step": 20306, "epoch": 120} {"train_loss": -6.938965797424316, "global_step": 20307, "epoch": 120} {"train_loss": -6.989279747009277, "global_step": 20308, "epoch": 120} {"train_loss": -6.992191314697266, "global_step": 20309, "epoch": 120} {"train_loss": -7.086656093597412, "global_step": 20310, "epoch": 120} {"train_loss": -6.948746681213379, "global_step": 20311, "epoch": 120} {"train_loss": -6.877614498138428, "global_step": 20312, "epoch": 120} {"train_loss": -7.1771087646484375, "global_step": 20313, "epoch": 120} {"train_loss": -6.771540641784668, "global_step": 20314, "epoch": 120} {"train_loss": -6.9317779541015625, "global_step": 20315, "epoch": 120} {"train_loss": -6.7733988761901855, "global_step": 20316, "epoch": 120} {"train_loss": -6.868383407592773, "global_step": 20317, "epoch": 120} {"train_loss": -6.994166374206543, "global_step": 20318, "epoch": 120} {"train_loss": -6.699892520904541, "global_step": 20319, "epoch": 120} {"train_loss": -7.053235054016113, "global_step": 20320, "epoch": 120} {"train_loss": -6.761690139770508, "global_step": 20321, "epoch": 120} {"train_loss": -6.994289398193359, "global_step": 20322, "epoch": 120} {"train_loss": -6.645627021789551, "global_step": 20323, "epoch": 120} {"train_loss": -6.870605945587158, "global_step": 20324, "epoch": 120} {"train_loss": -6.908487319946289, "global_step": 20325, "epoch": 120} {"train_loss": -6.897497177124023, "global_step": 20326, "epoch": 120} {"train_loss": -6.8232701278868175, "global_step": 20327, "epoch": 120, "val_loss": 209661.59375, "train_action_mse_error": 20.377803802490234} {"train_loss": -6.9219160079956055, "global_step": 20328, "epoch": 121} {"train_loss": -6.709592819213867, "global_step": 20329, "epoch": 121} {"train_loss": -6.896526336669922, "global_step": 20330, "epoch": 121} {"train_loss": -6.83665657043457, "global_step": 20331, "epoch": 121} {"train_loss": -6.9133806228637695, "global_step": 20332, "epoch": 121} {"train_loss": -6.78373908996582, "global_step": 20333, "epoch": 121} {"train_loss": -6.875073432922363, "global_step": 20334, "epoch": 121} {"train_loss": -7.244611740112305, "global_step": 20335, "epoch": 121} {"train_loss": -6.580626487731934, "global_step": 20336, "epoch": 121} {"train_loss": -6.918396472930908, "global_step": 20337, "epoch": 121} {"train_loss": -6.5823469161987305, "global_step": 20338, "epoch": 121} {"train_loss": -6.683198928833008, "global_step": 20339, "epoch": 121} {"train_loss": -6.60354471206665, "global_step": 20340, "epoch": 121} {"train_loss": -6.58515739440918, "global_step": 20341, "epoch": 121} {"train_loss": -6.728365898132324, "global_step": 20342, "epoch": 121} {"train_loss": -6.857634544372559, "global_step": 20343, "epoch": 121} {"train_loss": -6.6470184326171875, "global_step": 20344, "epoch": 121} {"train_loss": -6.875768661499023, "global_step": 20345, "epoch": 121} {"train_loss": -6.550838470458984, "global_step": 20346, "epoch": 121} {"train_loss": -6.98017692565918, "global_step": 20347, "epoch": 121} {"train_loss": -6.622351169586182, "global_step": 20348, "epoch": 121} {"train_loss": -6.628222465515137, "global_step": 20349, "epoch": 121} {"train_loss": -6.750574111938477, "global_step": 20350, "epoch": 121} {"train_loss": -6.7711639404296875, "global_step": 20351, "epoch": 121} {"train_loss": -6.767358303070068, "global_step": 20352, "epoch": 121} {"train_loss": -6.674894332885742, "global_step": 20353, "epoch": 121} {"train_loss": -7.008051872253418, "global_step": 20354, "epoch": 121} {"train_loss": -6.727588653564453, "global_step": 20355, "epoch": 121} {"train_loss": -7.016722679138184, "global_step": 20356, "epoch": 121} {"train_loss": -6.742318153381348, "global_step": 20357, "epoch": 121} {"train_loss": -7.004063606262207, "global_step": 20358, "epoch": 121} {"train_loss": -6.663502216339111, "global_step": 20359, "epoch": 121} {"train_loss": -6.846060276031494, "global_step": 20360, "epoch": 121} {"train_loss": -7.105867385864258, "global_step": 20361, "epoch": 121} {"train_loss": -6.919615745544434, "global_step": 20362, "epoch": 121} {"train_loss": -6.751626968383789, "global_step": 20363, "epoch": 121} {"train_loss": -6.93369197845459, "global_step": 20364, "epoch": 121} {"train_loss": -6.838040828704834, "global_step": 20365, "epoch": 121} {"train_loss": -6.876187801361084, "global_step": 20366, "epoch": 121} {"train_loss": -6.709136486053467, "global_step": 20367, "epoch": 121} {"train_loss": -6.8710222244262695, "global_step": 20368, "epoch": 121} {"train_loss": -6.962890625, "global_step": 20369, "epoch": 121} {"train_loss": -6.846456050872803, "global_step": 20370, "epoch": 121} {"train_loss": -6.989480972290039, "global_step": 20371, "epoch": 121} {"train_loss": -6.8067827224731445, "global_step": 20372, "epoch": 121} {"train_loss": -6.565620422363281, "global_step": 20373, "epoch": 121} {"train_loss": -6.904146671295166, "global_step": 20374, "epoch": 121} {"train_loss": -6.737985134124756, "global_step": 20375, "epoch": 121} {"train_loss": -6.717452526092529, "global_step": 20376, "epoch": 121} {"train_loss": -6.7433648109436035, "global_step": 20377, "epoch": 121} {"train_loss": -6.935330867767334, "global_step": 20378, "epoch": 121} {"train_loss": -6.865816116333008, "global_step": 20379, "epoch": 121} {"train_loss": -6.863537788391113, "global_step": 20380, "epoch": 121} {"train_loss": -6.701824188232422, "global_step": 20381, "epoch": 121} {"train_loss": -6.991774559020996, "global_step": 20382, "epoch": 121} {"train_loss": -6.821044921875, "global_step": 20383, "epoch": 121} {"train_loss": -6.968554973602295, "global_step": 20384, "epoch": 121} {"train_loss": -6.997472763061523, "global_step": 20385, "epoch": 121} {"train_loss": -6.926865100860596, "global_step": 20386, "epoch": 121} {"train_loss": -6.777483940124512, "global_step": 20387, "epoch": 121} {"train_loss": -7.089139461517334, "global_step": 20388, "epoch": 121} {"train_loss": -6.961386203765869, "global_step": 20389, "epoch": 121} {"train_loss": -6.931026935577393, "global_step": 20390, "epoch": 121} {"train_loss": -6.835973739624023, "global_step": 20391, "epoch": 121} {"train_loss": -6.878787040710449, "global_step": 20392, "epoch": 121} {"train_loss": -6.765066146850586, "global_step": 20393, "epoch": 121} {"train_loss": -6.83318567276001, "global_step": 20394, "epoch": 121} {"train_loss": -6.656425476074219, "global_step": 20395, "epoch": 121} {"train_loss": -6.709206581115723, "global_step": 20396, "epoch": 121} {"train_loss": -6.5499372482299805, "global_step": 20397, "epoch": 121} {"train_loss": -6.904742240905762, "global_step": 20398, "epoch": 121} {"train_loss": -6.736132621765137, "global_step": 20399, "epoch": 121} {"train_loss": -6.675609111785889, "global_step": 20400, "epoch": 121} {"train_loss": -6.576571941375732, "global_step": 20401, "epoch": 121} {"train_loss": -6.527438163757324, "global_step": 20402, "epoch": 121} {"train_loss": -6.6652421951293945, "global_step": 20403, "epoch": 121} {"train_loss": -6.663721084594727, "global_step": 20404, "epoch": 121} {"train_loss": -6.79743766784668, "global_step": 20405, "epoch": 121} {"train_loss": -6.7988691329956055, "global_step": 20406, "epoch": 121} {"train_loss": -6.8162970542907715, "global_step": 20407, "epoch": 121} {"train_loss": -6.902999401092529, "global_step": 20408, "epoch": 121} {"train_loss": -6.5992937088012695, "global_step": 20409, "epoch": 121} {"train_loss": -6.739959239959717, "global_step": 20410, "epoch": 121} {"train_loss": -6.765967845916748, "global_step": 20411, "epoch": 121} {"train_loss": -6.675644397735596, "global_step": 20412, "epoch": 121} {"train_loss": -6.701937675476074, "global_step": 20413, "epoch": 121} {"train_loss": -6.890259742736816, "global_step": 20414, "epoch": 121} {"train_loss": -6.8607683181762695, "global_step": 20415, "epoch": 121} {"train_loss": -6.6424455642700195, "global_step": 20416, "epoch": 121} {"train_loss": -6.714824676513672, "global_step": 20417, "epoch": 121} {"train_loss": -7.150250434875488, "global_step": 20418, "epoch": 121} {"train_loss": -7.056014537811279, "global_step": 20419, "epoch": 121} {"train_loss": -6.758517742156982, "global_step": 20420, "epoch": 121} {"train_loss": -6.705869674682617, "global_step": 20421, "epoch": 121} {"train_loss": -6.87100887298584, "global_step": 20422, "epoch": 121} {"train_loss": -7.013747215270996, "global_step": 20423, "epoch": 121} {"train_loss": -6.919528961181641, "global_step": 20424, "epoch": 121} {"train_loss": -6.90497350692749, "global_step": 20425, "epoch": 121} {"train_loss": -6.939689636230469, "global_step": 20426, "epoch": 121} {"train_loss": -6.905562400817871, "global_step": 20427, "epoch": 121} {"train_loss": -7.110837459564209, "global_step": 20428, "epoch": 121} {"train_loss": -7.149816513061523, "global_step": 20429, "epoch": 121} {"train_loss": -7.004825592041016, "global_step": 20430, "epoch": 121} {"train_loss": -7.025254249572754, "global_step": 20431, "epoch": 121} {"train_loss": -7.0635905265808105, "global_step": 20432, "epoch": 121} {"train_loss": -6.9290876388549805, "global_step": 20433, "epoch": 121} {"train_loss": -6.716744899749756, "global_step": 20434, "epoch": 121} {"train_loss": -6.963935852050781, "global_step": 20435, "epoch": 121} {"train_loss": -6.745480537414551, "global_step": 20436, "epoch": 121} {"train_loss": -6.91220760345459, "global_step": 20437, "epoch": 121} {"train_loss": -6.757790565490723, "global_step": 20438, "epoch": 121} {"train_loss": -6.8074870109558105, "global_step": 20439, "epoch": 121} {"train_loss": -6.846630096435547, "global_step": 20440, "epoch": 121} {"train_loss": -6.855133056640625, "global_step": 20441, "epoch": 121} {"train_loss": -6.942073822021484, "global_step": 20442, "epoch": 121} {"train_loss": -6.792056083679199, "global_step": 20443, "epoch": 121} {"train_loss": -6.806204795837402, "global_step": 20444, "epoch": 121} {"train_loss": -6.804065704345703, "global_step": 20445, "epoch": 121} {"train_loss": -6.828208923339844, "global_step": 20446, "epoch": 121} {"train_loss": -6.848538875579834, "global_step": 20447, "epoch": 121} {"train_loss": -6.917261123657227, "global_step": 20448, "epoch": 121} {"train_loss": -6.951650142669678, "global_step": 20449, "epoch": 121} {"train_loss": -6.713810443878174, "global_step": 20450, "epoch": 121} {"train_loss": -6.903909683227539, "global_step": 20451, "epoch": 121} {"train_loss": -7.043179035186768, "global_step": 20452, "epoch": 121} {"train_loss": -6.991626739501953, "global_step": 20453, "epoch": 121} {"train_loss": -6.647088050842285, "global_step": 20454, "epoch": 121} {"train_loss": -6.624014854431152, "global_step": 20455, "epoch": 121} {"train_loss": -6.981240272521973, "global_step": 20456, "epoch": 121} {"train_loss": -6.9014387130737305, "global_step": 20457, "epoch": 121} {"train_loss": -7.025940895080566, "global_step": 20458, "epoch": 121} {"train_loss": -7.017953395843506, "global_step": 20459, "epoch": 121} {"train_loss": -6.986179351806641, "global_step": 20460, "epoch": 121} {"train_loss": -6.991283416748047, "global_step": 20461, "epoch": 121} {"train_loss": -6.873349189758301, "global_step": 20462, "epoch": 121} {"train_loss": -6.890798568725586, "global_step": 20463, "epoch": 121} {"train_loss": -6.898469924926758, "global_step": 20464, "epoch": 121} {"train_loss": -6.989327907562256, "global_step": 20465, "epoch": 121} {"train_loss": -6.950225353240967, "global_step": 20466, "epoch": 121} {"train_loss": -7.070913314819336, "global_step": 20467, "epoch": 121} {"train_loss": -7.083930015563965, "global_step": 20468, "epoch": 121} {"train_loss": -6.942487716674805, "global_step": 20469, "epoch": 121} {"train_loss": -7.016658782958984, "global_step": 20470, "epoch": 121} {"train_loss": -6.8062896728515625, "global_step": 20471, "epoch": 121} {"train_loss": -6.815312385559082, "global_step": 20472, "epoch": 121} {"train_loss": -7.01507568359375, "global_step": 20473, "epoch": 121} {"train_loss": -6.805994033813477, "global_step": 20474, "epoch": 121} {"train_loss": -6.97605037689209, "global_step": 20475, "epoch": 121} {"train_loss": -6.629029750823975, "global_step": 20476, "epoch": 121} {"train_loss": -6.909201622009277, "global_step": 20477, "epoch": 121} {"train_loss": -6.826670169830322, "global_step": 20478, "epoch": 121} {"train_loss": -7.173691272735596, "global_step": 20479, "epoch": 121} {"train_loss": -6.912326812744141, "global_step": 20480, "epoch": 121} {"train_loss": -7.04994010925293, "global_step": 20481, "epoch": 121} {"train_loss": -6.867000579833984, "global_step": 20482, "epoch": 121} {"train_loss": -6.936861991882324, "global_step": 20483, "epoch": 121} {"train_loss": -6.854830741882324, "global_step": 20484, "epoch": 121} {"train_loss": -7.07223653793335, "global_step": 20485, "epoch": 121} {"train_loss": -6.793800354003906, "global_step": 20486, "epoch": 121} {"train_loss": -6.835968971252441, "global_step": 20487, "epoch": 121} {"train_loss": -6.470725059509277, "global_step": 20488, "epoch": 121} {"train_loss": -6.591858863830566, "global_step": 20489, "epoch": 121} {"train_loss": -6.752084732055664, "global_step": 20490, "epoch": 121} {"train_loss": -6.638875961303711, "global_step": 20491, "epoch": 121} {"train_loss": -6.665596961975098, "global_step": 20492, "epoch": 121} {"train_loss": -6.599890232086182, "global_step": 20493, "epoch": 121} {"train_loss": -6.554311275482178, "global_step": 20494, "epoch": 121} {"train_loss": -6.837869190034413, "global_step": 20495, "epoch": 121, "val_loss": 216642.25} {"train_loss": -6.692181587219238, "global_step": 20496, "epoch": 122} {"train_loss": -6.7701616287231445, "global_step": 20497, "epoch": 122} {"train_loss": -6.773083686828613, "global_step": 20498, "epoch": 122} {"train_loss": -6.7152204513549805, "global_step": 20499, "epoch": 122} {"train_loss": -6.775712013244629, "global_step": 20500, "epoch": 122} {"train_loss": -6.651252269744873, "global_step": 20501, "epoch": 122} {"train_loss": -6.495192050933838, "global_step": 20502, "epoch": 122} {"train_loss": -6.698170185089111, "global_step": 20503, "epoch": 122} {"train_loss": -6.627497673034668, "global_step": 20504, "epoch": 122} {"train_loss": -6.785037994384766, "global_step": 20505, "epoch": 122} {"train_loss": -6.852382183074951, "global_step": 20506, "epoch": 122} {"train_loss": -6.570104598999023, "global_step": 20507, "epoch": 122} {"train_loss": -6.807735443115234, "global_step": 20508, "epoch": 122} {"train_loss": -6.917722702026367, "global_step": 20509, "epoch": 122} {"train_loss": -7.004575729370117, "global_step": 20510, "epoch": 122} {"train_loss": -6.723193168640137, "global_step": 20511, "epoch": 122} {"train_loss": -6.870200157165527, "global_step": 20512, "epoch": 122} {"train_loss": -6.828361511230469, "global_step": 20513, "epoch": 122} {"train_loss": -6.93690299987793, "global_step": 20514, "epoch": 122} {"train_loss": -6.880665302276611, "global_step": 20515, "epoch": 122} {"train_loss": -6.651078701019287, "global_step": 20516, "epoch": 122} {"train_loss": -6.795702934265137, "global_step": 20517, "epoch": 122} {"train_loss": -6.932461261749268, "global_step": 20518, "epoch": 122} {"train_loss": -6.879497528076172, "global_step": 20519, "epoch": 122} {"train_loss": -6.749590873718262, "global_step": 20520, "epoch": 122} {"train_loss": -6.860579490661621, "global_step": 20521, "epoch": 122} {"train_loss": -6.968579292297363, "global_step": 20522, "epoch": 122} {"train_loss": -6.859692573547363, "global_step": 20523, "epoch": 122} {"train_loss": -6.985592842102051, "global_step": 20524, "epoch": 122} {"train_loss": -6.9315185546875, "global_step": 20525, "epoch": 122} {"train_loss": -6.944523811340332, "global_step": 20526, "epoch": 122} {"train_loss": -6.973969459533691, "global_step": 20527, "epoch": 122} {"train_loss": -6.921299934387207, "global_step": 20528, "epoch": 122} {"train_loss": -6.863297462463379, "global_step": 20529, "epoch": 122} {"train_loss": -7.019112586975098, "global_step": 20530, "epoch": 122} {"train_loss": -6.90863037109375, "global_step": 20531, "epoch": 122} {"train_loss": -6.896450996398926, "global_step": 20532, "epoch": 122} {"train_loss": -6.9230637550354, "global_step": 20533, "epoch": 122} {"train_loss": -6.9051055908203125, "global_step": 20534, "epoch": 122} {"train_loss": -7.114599227905273, "global_step": 20535, "epoch": 122} {"train_loss": -7.020905017852783, "global_step": 20536, "epoch": 122} {"train_loss": -6.840848922729492, "global_step": 20537, "epoch": 122} {"train_loss": -6.862131118774414, "global_step": 20538, "epoch": 122} {"train_loss": -6.846057891845703, "global_step": 20539, "epoch": 122} {"train_loss": -6.740179538726807, "global_step": 20540, "epoch": 122} {"train_loss": -6.750973224639893, "global_step": 20541, "epoch": 122} {"train_loss": -6.878233909606934, "global_step": 20542, "epoch": 122} {"train_loss": -6.809101581573486, "global_step": 20543, "epoch": 122} {"train_loss": -6.947155952453613, "global_step": 20544, "epoch": 122} {"train_loss": -7.0861310958862305, "global_step": 20545, "epoch": 122} {"train_loss": -6.81173038482666, "global_step": 20546, "epoch": 122} {"train_loss": -6.907557487487793, "global_step": 20547, "epoch": 122} {"train_loss": -6.997681140899658, "global_step": 20548, "epoch": 122} {"train_loss": -7.160660743713379, "global_step": 20549, "epoch": 122} {"train_loss": -6.807882785797119, "global_step": 20550, "epoch": 122} {"train_loss": -6.922938346862793, "global_step": 20551, "epoch": 122} {"train_loss": -7.04640007019043, "global_step": 20552, "epoch": 122} {"train_loss": -6.694025993347168, "global_step": 20553, "epoch": 122} {"train_loss": -6.810688495635986, "global_step": 20554, "epoch": 122} {"train_loss": -6.73793888092041, "global_step": 20555, "epoch": 122} {"train_loss": -6.799342155456543, "global_step": 20556, "epoch": 122} {"train_loss": -6.8712968826293945, "global_step": 20557, "epoch": 122} {"train_loss": -6.9662580490112305, "global_step": 20558, "epoch": 122} {"train_loss": -6.606184959411621, "global_step": 20559, "epoch": 122} {"train_loss": -6.990267753601074, "global_step": 20560, "epoch": 122} {"train_loss": -6.6908464431762695, "global_step": 20561, "epoch": 122} {"train_loss": -7.0534234046936035, "global_step": 20562, "epoch": 122} {"train_loss": -6.839288711547852, "global_step": 20563, "epoch": 122} {"train_loss": -6.819890975952148, "global_step": 20564, "epoch": 122} {"train_loss": -6.8551025390625, "global_step": 20565, "epoch": 122} {"train_loss": -7.1150288581848145, "global_step": 20566, "epoch": 122} {"train_loss": -6.825554370880127, "global_step": 20567, "epoch": 122} {"train_loss": -6.933197498321533, "global_step": 20568, "epoch": 122} {"train_loss": -6.797920227050781, "global_step": 20569, "epoch": 122} {"train_loss": -6.948982238769531, "global_step": 20570, "epoch": 122} {"train_loss": -6.932700157165527, "global_step": 20571, "epoch": 122} {"train_loss": -6.614587783813477, "global_step": 20572, "epoch": 122} {"train_loss": -6.744381427764893, "global_step": 20573, "epoch": 122} {"train_loss": -6.958527565002441, "global_step": 20574, "epoch": 122} {"train_loss": -6.86521053314209, "global_step": 20575, "epoch": 122} {"train_loss": -6.842231750488281, "global_step": 20576, "epoch": 122} {"train_loss": -6.9227190017700195, "global_step": 20577, "epoch": 122} {"train_loss": -7.0235161781311035, "global_step": 20578, "epoch": 122} {"train_loss": -6.911102294921875, "global_step": 20579, "epoch": 122} {"train_loss": -6.968320846557617, "global_step": 20580, "epoch": 122} {"train_loss": -7.067939758300781, "global_step": 20581, "epoch": 122} {"train_loss": -6.9017839431762695, "global_step": 20582, "epoch": 122} {"train_loss": -7.006383895874023, "global_step": 20583, "epoch": 122} {"train_loss": -7.019013404846191, "global_step": 20584, "epoch": 122} {"train_loss": -6.852147102355957, "global_step": 20585, "epoch": 122} {"train_loss": -6.930505752563477, "global_step": 20586, "epoch": 122} {"train_loss": -6.8829545974731445, "global_step": 20587, "epoch": 122} {"train_loss": -7.088822364807129, "global_step": 20588, "epoch": 122} {"train_loss": -6.484540939331055, "global_step": 20589, "epoch": 122} {"train_loss": -6.829148292541504, "global_step": 20590, "epoch": 122} {"train_loss": -6.753149032592773, "global_step": 20591, "epoch": 122} {"train_loss": -6.823468208312988, "global_step": 20592, "epoch": 122} {"train_loss": -6.946145057678223, "global_step": 20593, "epoch": 122} {"train_loss": -6.795648574829102, "global_step": 20594, "epoch": 122} {"train_loss": -6.654365539550781, "global_step": 20595, "epoch": 122} {"train_loss": -6.849092483520508, "global_step": 20596, "epoch": 122} {"train_loss": -6.698339939117432, "global_step": 20597, "epoch": 122} {"train_loss": -7.039165496826172, "global_step": 20598, "epoch": 122} {"train_loss": -6.740573883056641, "global_step": 20599, "epoch": 122} {"train_loss": -6.912569046020508, "global_step": 20600, "epoch": 122} {"train_loss": -6.60897970199585, "global_step": 20601, "epoch": 122} {"train_loss": -6.868908882141113, "global_step": 20602, "epoch": 122} {"train_loss": -6.851898670196533, "global_step": 20603, "epoch": 122} {"train_loss": -6.758342266082764, "global_step": 20604, "epoch": 122} {"train_loss": -6.748163223266602, "global_step": 20605, "epoch": 122} {"train_loss": -6.890769004821777, "global_step": 20606, "epoch": 122} {"train_loss": -6.839078426361084, "global_step": 20607, "epoch": 122} {"train_loss": -6.873635292053223, "global_step": 20608, "epoch": 122} {"train_loss": -6.480451583862305, "global_step": 20609, "epoch": 122} {"train_loss": -6.812941074371338, "global_step": 20610, "epoch": 122} {"train_loss": -6.795796871185303, "global_step": 20611, "epoch": 122} {"train_loss": -7.008884429931641, "global_step": 20612, "epoch": 122} {"train_loss": -6.879576683044434, "global_step": 20613, "epoch": 122} {"train_loss": -7.001410484313965, "global_step": 20614, "epoch": 122} {"train_loss": -6.846731185913086, "global_step": 20615, "epoch": 122} {"train_loss": -6.877121925354004, "global_step": 20616, "epoch": 122} {"train_loss": -6.794529914855957, "global_step": 20617, "epoch": 122} {"train_loss": -6.665781021118164, "global_step": 20618, "epoch": 122} {"train_loss": -7.00757360458374, "global_step": 20619, "epoch": 122} {"train_loss": -6.675534248352051, "global_step": 20620, "epoch": 122} {"train_loss": -7.094124794006348, "global_step": 20621, "epoch": 122} {"train_loss": -6.7612128257751465, "global_step": 20622, "epoch": 122} {"train_loss": -7.049431324005127, "global_step": 20623, "epoch": 122} {"train_loss": -6.824056625366211, "global_step": 20624, "epoch": 122} {"train_loss": -6.77952766418457, "global_step": 20625, "epoch": 122} {"train_loss": -6.91853141784668, "global_step": 20626, "epoch": 122} {"train_loss": -6.755105972290039, "global_step": 20627, "epoch": 122} {"train_loss": -7.061654090881348, "global_step": 20628, "epoch": 122} {"train_loss": -6.854978561401367, "global_step": 20629, "epoch": 122} {"train_loss": -7.007595062255859, "global_step": 20630, "epoch": 122} {"train_loss": -6.981182098388672, "global_step": 20631, "epoch": 122} {"train_loss": -6.86166524887085, "global_step": 20632, "epoch": 122} {"train_loss": -6.909458160400391, "global_step": 20633, "epoch": 122} {"train_loss": -6.933213710784912, "global_step": 20634, "epoch": 122} {"train_loss": -6.761596202850342, "global_step": 20635, "epoch": 122} {"train_loss": -6.736196994781494, "global_step": 20636, "epoch": 122} {"train_loss": -6.890218257904053, "global_step": 20637, "epoch": 122} {"train_loss": -7.083391189575195, "global_step": 20638, "epoch": 122} {"train_loss": -6.938414096832275, "global_step": 20639, "epoch": 122} {"train_loss": -6.726186752319336, "global_step": 20640, "epoch": 122} {"train_loss": -6.85389518737793, "global_step": 20641, "epoch": 122} {"train_loss": -6.881579399108887, "global_step": 20642, "epoch": 122} {"train_loss": -6.816364288330078, "global_step": 20643, "epoch": 122} {"train_loss": -6.715015888214111, "global_step": 20644, "epoch": 122} {"train_loss": -6.9030656814575195, "global_step": 20645, "epoch": 122} {"train_loss": -6.927488327026367, "global_step": 20646, "epoch": 122} {"train_loss": -6.80807638168335, "global_step": 20647, "epoch": 122} {"train_loss": -6.7500457763671875, "global_step": 20648, "epoch": 122} {"train_loss": -6.698136329650879, "global_step": 20649, "epoch": 122} {"train_loss": -6.982087135314941, "global_step": 20650, "epoch": 122} {"train_loss": -7.03443717956543, "global_step": 20651, "epoch": 122} {"train_loss": -6.882755756378174, "global_step": 20652, "epoch": 122} {"train_loss": -6.788575172424316, "global_step": 20653, "epoch": 122} {"train_loss": -6.8704376220703125, "global_step": 20654, "epoch": 122} {"train_loss": -6.990145683288574, "global_step": 20655, "epoch": 122} {"train_loss": -6.832032203674316, "global_step": 20656, "epoch": 122} {"train_loss": -6.906604290008545, "global_step": 20657, "epoch": 122} {"train_loss": -7.00044584274292, "global_step": 20658, "epoch": 122} {"train_loss": -6.943700313568115, "global_step": 20659, "epoch": 122} {"train_loss": -6.958988189697266, "global_step": 20660, "epoch": 122} {"train_loss": -7.1424641609191895, "global_step": 20661, "epoch": 122} {"train_loss": -6.690910339355469, "global_step": 20662, "epoch": 122} {"train_loss": -6.862597369012379, "global_step": 20663, "epoch": 122, "val_loss": 212985.21875} {"train_loss": -6.936679363250732, "global_step": 20664, "epoch": 123} {"train_loss": -6.831979751586914, "global_step": 20665, "epoch": 123} {"train_loss": -6.7948079109191895, "global_step": 20666, "epoch": 123} {"train_loss": -6.617740631103516, "global_step": 20667, "epoch": 123} {"train_loss": -6.783641815185547, "global_step": 20668, "epoch": 123} {"train_loss": -6.547309875488281, "global_step": 20669, "epoch": 123} {"train_loss": -6.756686210632324, "global_step": 20670, "epoch": 123} {"train_loss": -6.574489593505859, "global_step": 20671, "epoch": 123} {"train_loss": -6.847040176391602, "global_step": 20672, "epoch": 123} {"train_loss": -6.990839958190918, "global_step": 20673, "epoch": 123} {"train_loss": -6.732309341430664, "global_step": 20674, "epoch": 123} {"train_loss": -6.88889217376709, "global_step": 20675, "epoch": 123} {"train_loss": -6.709989070892334, "global_step": 20676, "epoch": 123} {"train_loss": -6.640686988830566, "global_step": 20677, "epoch": 123} {"train_loss": -6.708729267120361, "global_step": 20678, "epoch": 123} {"train_loss": -6.699481964111328, "global_step": 20679, "epoch": 123} {"train_loss": -6.703645706176758, "global_step": 20680, "epoch": 123} {"train_loss": -6.9180073738098145, "global_step": 20681, "epoch": 123} {"train_loss": -6.755058288574219, "global_step": 20682, "epoch": 123} {"train_loss": -6.620176315307617, "global_step": 20683, "epoch": 123} {"train_loss": -7.054569244384766, "global_step": 20684, "epoch": 123} {"train_loss": -6.912479877471924, "global_step": 20685, "epoch": 123} {"train_loss": -6.891904830932617, "global_step": 20686, "epoch": 123} {"train_loss": -6.737456321716309, "global_step": 20687, "epoch": 123} {"train_loss": -6.826253890991211, "global_step": 20688, "epoch": 123} {"train_loss": -6.929758071899414, "global_step": 20689, "epoch": 123} {"train_loss": -6.521634101867676, "global_step": 20690, "epoch": 123} {"train_loss": -7.035175800323486, "global_step": 20691, "epoch": 123} {"train_loss": -6.776387691497803, "global_step": 20692, "epoch": 123} {"train_loss": -6.98612642288208, "global_step": 20693, "epoch": 123} {"train_loss": -6.901921272277832, "global_step": 20694, "epoch": 123} {"train_loss": -6.85536527633667, "global_step": 20695, "epoch": 123} {"train_loss": -6.624898910522461, "global_step": 20696, "epoch": 123} {"train_loss": -7.124073505401611, "global_step": 20697, "epoch": 123} {"train_loss": -6.676295280456543, "global_step": 20698, "epoch": 123} {"train_loss": -6.839242935180664, "global_step": 20699, "epoch": 123} {"train_loss": -6.6890459060668945, "global_step": 20700, "epoch": 123} {"train_loss": -6.95442533493042, "global_step": 20701, "epoch": 123} {"train_loss": -6.584561347961426, "global_step": 20702, "epoch": 123} {"train_loss": -7.00840425491333, "global_step": 20703, "epoch": 123} {"train_loss": -6.655865669250488, "global_step": 20704, "epoch": 123} {"train_loss": -6.731396675109863, "global_step": 20705, "epoch": 123} {"train_loss": -6.573551177978516, "global_step": 20706, "epoch": 123} {"train_loss": -6.904065132141113, "global_step": 20707, "epoch": 123} {"train_loss": -6.780298233032227, "global_step": 20708, "epoch": 123} {"train_loss": -6.849896430969238, "global_step": 20709, "epoch": 123} {"train_loss": -6.933265686035156, "global_step": 20710, "epoch": 123} {"train_loss": -7.008790969848633, "global_step": 20711, "epoch": 123} {"train_loss": -6.819387912750244, "global_step": 20712, "epoch": 123} {"train_loss": -6.884562969207764, "global_step": 20713, "epoch": 123} {"train_loss": -6.617941379547119, "global_step": 20714, "epoch": 123} {"train_loss": -7.011112213134766, "global_step": 20715, "epoch": 123} {"train_loss": -6.790537357330322, "global_step": 20716, "epoch": 123} {"train_loss": -7.090393543243408, "global_step": 20717, "epoch": 123} {"train_loss": -6.739760398864746, "global_step": 20718, "epoch": 123} {"train_loss": -6.7905592918396, "global_step": 20719, "epoch": 123} {"train_loss": -7.0052900314331055, "global_step": 20720, "epoch": 123} {"train_loss": -6.75503396987915, "global_step": 20721, "epoch": 123} {"train_loss": -6.723133563995361, "global_step": 20722, "epoch": 123} {"train_loss": -6.938924789428711, "global_step": 20723, "epoch": 123} {"train_loss": -6.980280876159668, "global_step": 20724, "epoch": 123} {"train_loss": -6.928305625915527, "global_step": 20725, "epoch": 123} {"train_loss": -6.7696919441223145, "global_step": 20726, "epoch": 123} {"train_loss": -6.8438920974731445, "global_step": 20727, "epoch": 123} {"train_loss": -6.743223190307617, "global_step": 20728, "epoch": 123} {"train_loss": -6.929624080657959, "global_step": 20729, "epoch": 123} {"train_loss": -6.813311576843262, "global_step": 20730, "epoch": 123} {"train_loss": -6.96287727355957, "global_step": 20731, "epoch": 123} {"train_loss": -6.539572715759277, "global_step": 20732, "epoch": 123} {"train_loss": -6.879168510437012, "global_step": 20733, "epoch": 123} {"train_loss": -6.999951362609863, "global_step": 20734, "epoch": 123} {"train_loss": -6.839613914489746, "global_step": 20735, "epoch": 123} {"train_loss": -6.894888877868652, "global_step": 20736, "epoch": 123} {"train_loss": -6.973419666290283, "global_step": 20737, "epoch": 123} {"train_loss": -6.90509033203125, "global_step": 20738, "epoch": 123} {"train_loss": -6.881679534912109, "global_step": 20739, "epoch": 123} {"train_loss": -6.824704170227051, "global_step": 20740, "epoch": 123} {"train_loss": -6.688665866851807, "global_step": 20741, "epoch": 123} {"train_loss": -6.759903907775879, "global_step": 20742, "epoch": 123} {"train_loss": -6.936395168304443, "global_step": 20743, "epoch": 123} {"train_loss": -7.048325061798096, "global_step": 20744, "epoch": 123} {"train_loss": -7.083120346069336, "global_step": 20745, "epoch": 123} {"train_loss": -6.87908935546875, "global_step": 20746, "epoch": 123} {"train_loss": -6.847487449645996, "global_step": 20747, "epoch": 123} {"train_loss": -7.042989730834961, "global_step": 20748, "epoch": 123} {"train_loss": -6.995401382446289, "global_step": 20749, "epoch": 123} {"train_loss": -6.695817947387695, "global_step": 20750, "epoch": 123} {"train_loss": -6.858345985412598, "global_step": 20751, "epoch": 123} {"train_loss": -6.680593490600586, "global_step": 20752, "epoch": 123} {"train_loss": -6.928391933441162, "global_step": 20753, "epoch": 123} {"train_loss": -6.824917793273926, "global_step": 20754, "epoch": 123} {"train_loss": -6.985030174255371, "global_step": 20755, "epoch": 123} {"train_loss": -7.1233320236206055, "global_step": 20756, "epoch": 123} {"train_loss": -6.965312957763672, "global_step": 20757, "epoch": 123} {"train_loss": -6.9266252517700195, "global_step": 20758, "epoch": 123} {"train_loss": -6.975203990936279, "global_step": 20759, "epoch": 123} {"train_loss": -7.035475730895996, "global_step": 20760, "epoch": 123} {"train_loss": -6.890141010284424, "global_step": 20761, "epoch": 123} {"train_loss": -7.054243564605713, "global_step": 20762, "epoch": 123} {"train_loss": -7.031155586242676, "global_step": 20763, "epoch": 123} {"train_loss": -6.679483413696289, "global_step": 20764, "epoch": 123} {"train_loss": -7.030494213104248, "global_step": 20765, "epoch": 123} {"train_loss": -7.108590126037598, "global_step": 20766, "epoch": 123} {"train_loss": -6.892078399658203, "global_step": 20767, "epoch": 123} {"train_loss": -7.1498188972473145, "global_step": 20768, "epoch": 123} {"train_loss": -6.849487781524658, "global_step": 20769, "epoch": 123} {"train_loss": -6.841352462768555, "global_step": 20770, "epoch": 123} {"train_loss": -6.923056602478027, "global_step": 20771, "epoch": 123} {"train_loss": -6.881856918334961, "global_step": 20772, "epoch": 123} {"train_loss": -6.853869438171387, "global_step": 20773, "epoch": 123} {"train_loss": -7.120941162109375, "global_step": 20774, "epoch": 123} {"train_loss": -6.503669261932373, "global_step": 20775, "epoch": 123} {"train_loss": -6.82566499710083, "global_step": 20776, "epoch": 123} {"train_loss": -6.754443168640137, "global_step": 20777, "epoch": 123} {"train_loss": -6.9519147872924805, "global_step": 20778, "epoch": 123} {"train_loss": -6.799017429351807, "global_step": 20779, "epoch": 123} {"train_loss": -6.937902450561523, "global_step": 20780, "epoch": 123} {"train_loss": -6.651267051696777, "global_step": 20781, "epoch": 123} {"train_loss": -6.990622043609619, "global_step": 20782, "epoch": 123} {"train_loss": -6.794862747192383, "global_step": 20783, "epoch": 123} {"train_loss": -6.674403190612793, "global_step": 20784, "epoch": 123} {"train_loss": -6.761392593383789, "global_step": 20785, "epoch": 123} {"train_loss": -6.750575542449951, "global_step": 20786, "epoch": 123} {"train_loss": -6.815242767333984, "global_step": 20787, "epoch": 123} {"train_loss": -6.808376312255859, "global_step": 20788, "epoch": 123} {"train_loss": -6.907806396484375, "global_step": 20789, "epoch": 123} {"train_loss": -6.862423419952393, "global_step": 20790, "epoch": 123} {"train_loss": -6.684881210327148, "global_step": 20791, "epoch": 123} {"train_loss": -6.775907516479492, "global_step": 20792, "epoch": 123} {"train_loss": -6.726305961608887, "global_step": 20793, "epoch": 123} {"train_loss": -6.884769439697266, "global_step": 20794, "epoch": 123} {"train_loss": -6.4202375411987305, "global_step": 20795, "epoch": 123} {"train_loss": -6.777262210845947, "global_step": 20796, "epoch": 123} {"train_loss": -6.683713912963867, "global_step": 20797, "epoch": 123} {"train_loss": -6.557753562927246, "global_step": 20798, "epoch": 123} {"train_loss": -6.797816753387451, "global_step": 20799, "epoch": 123} {"train_loss": -6.680540084838867, "global_step": 20800, "epoch": 123} {"train_loss": -6.6963210105896, "global_step": 20801, "epoch": 123} {"train_loss": -6.641242027282715, "global_step": 20802, "epoch": 123} {"train_loss": -6.750454902648926, "global_step": 20803, "epoch": 123} {"train_loss": -6.888001441955566, "global_step": 20804, "epoch": 123} {"train_loss": -6.885235786437988, "global_step": 20805, "epoch": 123} {"train_loss": -6.6533050537109375, "global_step": 20806, "epoch": 123} {"train_loss": -6.985276699066162, "global_step": 20807, "epoch": 123} {"train_loss": -6.856401443481445, "global_step": 20808, "epoch": 123} {"train_loss": -6.924599647521973, "global_step": 20809, "epoch": 123} {"train_loss": -6.935782432556152, "global_step": 20810, "epoch": 123} {"train_loss": -6.981932640075684, "global_step": 20811, "epoch": 123} {"train_loss": -6.983057975769043, "global_step": 20812, "epoch": 123} {"train_loss": -6.846830368041992, "global_step": 20813, "epoch": 123} {"train_loss": -6.902772903442383, "global_step": 20814, "epoch": 123} {"train_loss": -6.928436279296875, "global_step": 20815, "epoch": 123} {"train_loss": -6.900918960571289, "global_step": 20816, "epoch": 123} {"train_loss": -7.219475269317627, "global_step": 20817, "epoch": 123} {"train_loss": -7.300079345703125, "global_step": 20818, "epoch": 123} {"train_loss": -7.1237945556640625, "global_step": 20819, "epoch": 123} {"train_loss": -7.2614641189575195, "global_step": 20820, "epoch": 123} {"train_loss": -7.162424087524414, "global_step": 20821, "epoch": 123} {"train_loss": -7.045746326446533, "global_step": 20822, "epoch": 123} {"train_loss": -6.891449451446533, "global_step": 20823, "epoch": 123} {"train_loss": -6.895808219909668, "global_step": 20824, "epoch": 123} {"train_loss": -6.73237419128418, "global_step": 20825, "epoch": 123} {"train_loss": -6.899588584899902, "global_step": 20826, "epoch": 123} {"train_loss": -6.899041175842285, "global_step": 20827, "epoch": 123} {"train_loss": -6.736917495727539, "global_step": 20828, "epoch": 123} {"train_loss": -6.835880279541016, "global_step": 20829, "epoch": 123} {"train_loss": -6.771761894226074, "global_step": 20830, "epoch": 123} {"train_loss": -6.851055494376591, "global_step": 20831, "epoch": 123, "val_loss": 210330.84375} {"train_loss": -7.001544952392578, "global_step": 20832, "epoch": 124} {"train_loss": -6.830904006958008, "global_step": 20833, "epoch": 124} {"train_loss": -6.794573783874512, "global_step": 20834, "epoch": 124} {"train_loss": -6.791747570037842, "global_step": 20835, "epoch": 124} {"train_loss": -7.006356239318848, "global_step": 20836, "epoch": 124} {"train_loss": -6.844295501708984, "global_step": 20837, "epoch": 124} {"train_loss": -6.52225399017334, "global_step": 20838, "epoch": 124} {"train_loss": -6.874018669128418, "global_step": 20839, "epoch": 124} {"train_loss": -6.758588790893555, "global_step": 20840, "epoch": 124} {"train_loss": -7.042745113372803, "global_step": 20841, "epoch": 124} {"train_loss": -6.7383341789245605, "global_step": 20842, "epoch": 124} {"train_loss": -6.694516181945801, "global_step": 20843, "epoch": 124} {"train_loss": -6.8835649490356445, "global_step": 20844, "epoch": 124} {"train_loss": -6.6668500900268555, "global_step": 20845, "epoch": 124} {"train_loss": -6.969651222229004, "global_step": 20846, "epoch": 124} {"train_loss": -6.735901832580566, "global_step": 20847, "epoch": 124} {"train_loss": -6.772756576538086, "global_step": 20848, "epoch": 124} {"train_loss": -6.982269287109375, "global_step": 20849, "epoch": 124} {"train_loss": -6.697295188903809, "global_step": 20850, "epoch": 124} {"train_loss": -6.820071697235107, "global_step": 20851, "epoch": 124} {"train_loss": -6.905689239501953, "global_step": 20852, "epoch": 124} {"train_loss": -6.818828105926514, "global_step": 20853, "epoch": 124} {"train_loss": -6.91886568069458, "global_step": 20854, "epoch": 124} {"train_loss": -6.998808860778809, "global_step": 20855, "epoch": 124} {"train_loss": -6.956042766571045, "global_step": 20856, "epoch": 124} {"train_loss": -6.874176979064941, "global_step": 20857, "epoch": 124} {"train_loss": -6.992313385009766, "global_step": 20858, "epoch": 124} {"train_loss": -6.967506408691406, "global_step": 20859, "epoch": 124} {"train_loss": -7.128416538238525, "global_step": 20860, "epoch": 124} {"train_loss": -6.8985114097595215, "global_step": 20861, "epoch": 124} {"train_loss": -6.905050754547119, "global_step": 20862, "epoch": 124} {"train_loss": -6.787518501281738, "global_step": 20863, "epoch": 124} {"train_loss": -7.061655044555664, "global_step": 20864, "epoch": 124} {"train_loss": -7.039705276489258, "global_step": 20865, "epoch": 124} {"train_loss": -6.905594825744629, "global_step": 20866, "epoch": 124} {"train_loss": -6.986645698547363, "global_step": 20867, "epoch": 124} {"train_loss": -7.051614761352539, "global_step": 20868, "epoch": 124} {"train_loss": -6.8275251388549805, "global_step": 20869, "epoch": 124} {"train_loss": -7.2010602951049805, "global_step": 20870, "epoch": 124} {"train_loss": -6.868490219116211, "global_step": 20871, "epoch": 124} {"train_loss": -6.954203128814697, "global_step": 20872, "epoch": 124} {"train_loss": -6.9384894371032715, "global_step": 20873, "epoch": 124} {"train_loss": -6.854342937469482, "global_step": 20874, "epoch": 124} {"train_loss": -7.091130256652832, "global_step": 20875, "epoch": 124} {"train_loss": -6.622357368469238, "global_step": 20876, "epoch": 124} {"train_loss": -6.870150089263916, "global_step": 20877, "epoch": 124} {"train_loss": -7.091168403625488, "global_step": 20878, "epoch": 124} {"train_loss": -6.891137599945068, "global_step": 20879, "epoch": 124} {"train_loss": -6.806482315063477, "global_step": 20880, "epoch": 124} {"train_loss": -6.942981243133545, "global_step": 20881, "epoch": 124} {"train_loss": -7.053568363189697, "global_step": 20882, "epoch": 124} {"train_loss": -6.841620922088623, "global_step": 20883, "epoch": 124} {"train_loss": -6.927797317504883, "global_step": 20884, "epoch": 124} {"train_loss": -7.153071880340576, "global_step": 20885, "epoch": 124} {"train_loss": -6.881097793579102, "global_step": 20886, "epoch": 124} {"train_loss": -6.89272403717041, "global_step": 20887, "epoch": 124} {"train_loss": -7.10123872756958, "global_step": 20888, "epoch": 124} {"train_loss": -6.918643474578857, "global_step": 20889, "epoch": 124} {"train_loss": -6.782387733459473, "global_step": 20890, "epoch": 124} {"train_loss": -6.758908271789551, "global_step": 20891, "epoch": 124} {"train_loss": -6.942304611206055, "global_step": 20892, "epoch": 124} {"train_loss": -6.927493095397949, "global_step": 20893, "epoch": 124} {"train_loss": -6.85203218460083, "global_step": 20894, "epoch": 124} {"train_loss": -6.81050968170166, "global_step": 20895, "epoch": 124} {"train_loss": -6.8124494552612305, "global_step": 20896, "epoch": 124} {"train_loss": -7.26357889175415, "global_step": 20897, "epoch": 124} {"train_loss": -6.821177959442139, "global_step": 20898, "epoch": 124} {"train_loss": -6.989815711975098, "global_step": 20899, "epoch": 124} {"train_loss": -6.985023021697998, "global_step": 20900, "epoch": 124} {"train_loss": -7.101531028747559, "global_step": 20901, "epoch": 124} {"train_loss": -6.8685712814331055, "global_step": 20902, "epoch": 124} {"train_loss": -6.874996662139893, "global_step": 20903, "epoch": 124} {"train_loss": -6.706323623657227, "global_step": 20904, "epoch": 124} {"train_loss": -7.147604942321777, "global_step": 20905, "epoch": 124} {"train_loss": -6.6292805671691895, "global_step": 20906, "epoch": 124} {"train_loss": -7.091383934020996, "global_step": 20907, "epoch": 124} {"train_loss": -6.621681213378906, "global_step": 20908, "epoch": 124} {"train_loss": -6.587800979614258, "global_step": 20909, "epoch": 124} {"train_loss": -6.890416145324707, "global_step": 20910, "epoch": 124} {"train_loss": -6.672324180603027, "global_step": 20911, "epoch": 124} {"train_loss": -6.820708274841309, "global_step": 20912, "epoch": 124} {"train_loss": -6.860489845275879, "global_step": 20913, "epoch": 124} {"train_loss": -7.102095603942871, "global_step": 20914, "epoch": 124} {"train_loss": -6.84720516204834, "global_step": 20915, "epoch": 124} {"train_loss": -6.858266830444336, "global_step": 20916, "epoch": 124} {"train_loss": -6.685860633850098, "global_step": 20917, "epoch": 124} {"train_loss": -6.759424209594727, "global_step": 20918, "epoch": 124} {"train_loss": -6.859683990478516, "global_step": 20919, "epoch": 124} {"train_loss": -6.792346000671387, "global_step": 20920, "epoch": 124} {"train_loss": -6.643955230712891, "global_step": 20921, "epoch": 124} {"train_loss": -6.73849630355835, "global_step": 20922, "epoch": 124} {"train_loss": -6.740364074707031, "global_step": 20923, "epoch": 124} {"train_loss": -6.776696681976318, "global_step": 20924, "epoch": 124} {"train_loss": -6.689866065979004, "global_step": 20925, "epoch": 124} {"train_loss": -7.030850887298584, "global_step": 20926, "epoch": 124} {"train_loss": -6.7393269538879395, "global_step": 20927, "epoch": 124} {"train_loss": -6.880014419555664, "global_step": 20928, "epoch": 124} {"train_loss": -6.894313812255859, "global_step": 20929, "epoch": 124} {"train_loss": -6.771622657775879, "global_step": 20930, "epoch": 124} {"train_loss": -7.100399971008301, "global_step": 20931, "epoch": 124} {"train_loss": -6.819690704345703, "global_step": 20932, "epoch": 124} {"train_loss": -7.005565643310547, "global_step": 20933, "epoch": 124} {"train_loss": -7.068748474121094, "global_step": 20934, "epoch": 124} {"train_loss": -6.877487659454346, "global_step": 20935, "epoch": 124} {"train_loss": -6.703033447265625, "global_step": 20936, "epoch": 124} {"train_loss": -6.975208282470703, "global_step": 20937, "epoch": 124} {"train_loss": -6.537986755371094, "global_step": 20938, "epoch": 124} {"train_loss": -7.0741729736328125, "global_step": 20939, "epoch": 124} {"train_loss": -6.832135200500488, "global_step": 20940, "epoch": 124} {"train_loss": -6.809269905090332, "global_step": 20941, "epoch": 124} {"train_loss": -7.103224754333496, "global_step": 20942, "epoch": 124} {"train_loss": -6.957324981689453, "global_step": 20943, "epoch": 124} {"train_loss": -7.024614334106445, "global_step": 20944, "epoch": 124} {"train_loss": -6.977789402008057, "global_step": 20945, "epoch": 124} {"train_loss": -7.00714111328125, "global_step": 20946, "epoch": 124} {"train_loss": -7.009428977966309, "global_step": 20947, "epoch": 124} {"train_loss": -7.040064334869385, "global_step": 20948, "epoch": 124} {"train_loss": -7.127068519592285, "global_step": 20949, "epoch": 124} {"train_loss": -6.944441795349121, "global_step": 20950, "epoch": 124} {"train_loss": -7.026317596435547, "global_step": 20951, "epoch": 124} {"train_loss": -6.831098556518555, "global_step": 20952, "epoch": 124} {"train_loss": -6.7959794998168945, "global_step": 20953, "epoch": 124} {"train_loss": -6.842591762542725, "global_step": 20954, "epoch": 124} {"train_loss": -7.102240562438965, "global_step": 20955, "epoch": 124} {"train_loss": -6.892393112182617, "global_step": 20956, "epoch": 124} {"train_loss": -6.670963287353516, "global_step": 20957, "epoch": 124} {"train_loss": -6.7163615226745605, "global_step": 20958, "epoch": 124} {"train_loss": -6.915719985961914, "global_step": 20959, "epoch": 124} {"train_loss": -6.977593898773193, "global_step": 20960, "epoch": 124} {"train_loss": -6.7154083251953125, "global_step": 20961, "epoch": 124} {"train_loss": -6.911826133728027, "global_step": 20962, "epoch": 124} {"train_loss": -7.035714149475098, "global_step": 20963, "epoch": 124} {"train_loss": -7.071006774902344, "global_step": 20964, "epoch": 124} {"train_loss": -6.629667282104492, "global_step": 20965, "epoch": 124} {"train_loss": -6.973028182983398, "global_step": 20966, "epoch": 124} {"train_loss": -7.0148210525512695, "global_step": 20967, "epoch": 124} {"train_loss": -6.763912677764893, "global_step": 20968, "epoch": 124} {"train_loss": -6.566051006317139, "global_step": 20969, "epoch": 124} {"train_loss": -6.922009468078613, "global_step": 20970, "epoch": 124} {"train_loss": -6.896143913269043, "global_step": 20971, "epoch": 124} {"train_loss": -6.965349197387695, "global_step": 20972, "epoch": 124} {"train_loss": -6.921226501464844, "global_step": 20973, "epoch": 124} {"train_loss": -6.81364107131958, "global_step": 20974, "epoch": 124} {"train_loss": -6.852720260620117, "global_step": 20975, "epoch": 124} {"train_loss": -6.797987937927246, "global_step": 20976, "epoch": 124} {"train_loss": -7.055451393127441, "global_step": 20977, "epoch": 124} {"train_loss": -6.994521141052246, "global_step": 20978, "epoch": 124} {"train_loss": -7.016175746917725, "global_step": 20979, "epoch": 124} {"train_loss": -6.886136054992676, "global_step": 20980, "epoch": 124} {"train_loss": -6.937565803527832, "global_step": 20981, "epoch": 124} {"train_loss": -6.967655181884766, "global_step": 20982, "epoch": 124} {"train_loss": -6.646116256713867, "global_step": 20983, "epoch": 124} {"train_loss": -6.799007415771484, "global_step": 20984, "epoch": 124} {"train_loss": -6.793700218200684, "global_step": 20985, "epoch": 124} {"train_loss": -6.678732872009277, "global_step": 20986, "epoch": 124} {"train_loss": -6.702052116394043, "global_step": 20987, "epoch": 124} {"train_loss": -6.840899467468262, "global_step": 20988, "epoch": 124} {"train_loss": -6.775074005126953, "global_step": 20989, "epoch": 124} {"train_loss": -6.782359600067139, "global_step": 20990, "epoch": 124} {"train_loss": -6.928189277648926, "global_step": 20991, "epoch": 124} {"train_loss": -6.709056377410889, "global_step": 20992, "epoch": 124} {"train_loss": -7.034762859344482, "global_step": 20993, "epoch": 124} {"train_loss": -6.700169086456299, "global_step": 20994, "epoch": 124} {"train_loss": -6.840966701507568, "global_step": 20995, "epoch": 124} {"train_loss": -6.93550443649292, "global_step": 20996, "epoch": 124} {"train_loss": -7.0694169998168945, "global_step": 20997, "epoch": 124} {"train_loss": -7.0125579833984375, "global_step": 20998, "epoch": 124} {"train_loss": -6.885197602567219, "global_step": 20999, "epoch": 124, "val_loss": 209880.8125} {"train_loss": -7.061739444732666, "global_step": 21000, "epoch": 125} {"train_loss": -7.0720930099487305, "global_step": 21001, "epoch": 125} {"train_loss": -7.0438923835754395, "global_step": 21002, "epoch": 125} {"train_loss": -6.956618785858154, "global_step": 21003, "epoch": 125} {"train_loss": -6.908202171325684, "global_step": 21004, "epoch": 125} {"train_loss": -6.6523542404174805, "global_step": 21005, "epoch": 125} {"train_loss": -6.748444557189941, "global_step": 21006, "epoch": 125} {"train_loss": -7.006272315979004, "global_step": 21007, "epoch": 125} {"train_loss": -6.63180685043335, "global_step": 21008, "epoch": 125} {"train_loss": -7.054873943328857, "global_step": 21009, "epoch": 125} {"train_loss": -7.007644176483154, "global_step": 21010, "epoch": 125} {"train_loss": -6.758065223693848, "global_step": 21011, "epoch": 125} {"train_loss": -7.098499774932861, "global_step": 21012, "epoch": 125} {"train_loss": -6.722718715667725, "global_step": 21013, "epoch": 125} {"train_loss": -6.8103532791137695, "global_step": 21014, "epoch": 125} {"train_loss": -6.8191914558410645, "global_step": 21015, "epoch": 125} {"train_loss": -6.8889641761779785, "global_step": 21016, "epoch": 125} {"train_loss": -6.688999176025391, "global_step": 21017, "epoch": 125} {"train_loss": -7.028802871704102, "global_step": 21018, "epoch": 125} {"train_loss": -6.629356384277344, "global_step": 21019, "epoch": 125} {"train_loss": -7.051653861999512, "global_step": 21020, "epoch": 125} {"train_loss": -6.709079265594482, "global_step": 21021, "epoch": 125} {"train_loss": -6.855449676513672, "global_step": 21022, "epoch": 125} {"train_loss": -6.777321815490723, "global_step": 21023, "epoch": 125} {"train_loss": -6.69600772857666, "global_step": 21024, "epoch": 125} {"train_loss": -6.806532859802246, "global_step": 21025, "epoch": 125} {"train_loss": -7.00759220123291, "global_step": 21026, "epoch": 125} {"train_loss": -6.733337879180908, "global_step": 21027, "epoch": 125} {"train_loss": -6.687838554382324, "global_step": 21028, "epoch": 125} {"train_loss": -6.758179664611816, "global_step": 21029, "epoch": 125} {"train_loss": -6.875213623046875, "global_step": 21030, "epoch": 125} {"train_loss": -6.749560356140137, "global_step": 21031, "epoch": 125} {"train_loss": -6.470929145812988, "global_step": 21032, "epoch": 125} {"train_loss": -6.5337395668029785, "global_step": 21033, "epoch": 125} {"train_loss": -6.91974401473999, "global_step": 21034, "epoch": 125} {"train_loss": -6.565284729003906, "global_step": 21035, "epoch": 125} {"train_loss": -6.700355052947998, "global_step": 21036, "epoch": 125} {"train_loss": -6.868244171142578, "global_step": 21037, "epoch": 125} {"train_loss": -6.491146564483643, "global_step": 21038, "epoch": 125} {"train_loss": -6.768697261810303, "global_step": 21039, "epoch": 125} {"train_loss": -6.721230983734131, "global_step": 21040, "epoch": 125} {"train_loss": -6.634791374206543, "global_step": 21041, "epoch": 125} {"train_loss": -6.728255271911621, "global_step": 21042, "epoch": 125} {"train_loss": -6.6102752685546875, "global_step": 21043, "epoch": 125} {"train_loss": -6.897923469543457, "global_step": 21044, "epoch": 125} {"train_loss": -6.763571262359619, "global_step": 21045, "epoch": 125} {"train_loss": -6.780611038208008, "global_step": 21046, "epoch": 125} {"train_loss": -6.996556282043457, "global_step": 21047, "epoch": 125} {"train_loss": -6.563285827636719, "global_step": 21048, "epoch": 125} {"train_loss": -6.685373783111572, "global_step": 21049, "epoch": 125} {"train_loss": -7.024876594543457, "global_step": 21050, "epoch": 125} {"train_loss": -6.788006782531738, "global_step": 21051, "epoch": 125} {"train_loss": -7.053367614746094, "global_step": 21052, "epoch": 125} {"train_loss": -6.7934675216674805, "global_step": 21053, "epoch": 125} {"train_loss": -6.674350738525391, "global_step": 21054, "epoch": 125} {"train_loss": -6.966339111328125, "global_step": 21055, "epoch": 125} {"train_loss": -6.868514060974121, "global_step": 21056, "epoch": 125} {"train_loss": -6.927730560302734, "global_step": 21057, "epoch": 125} {"train_loss": -6.871735095977783, "global_step": 21058, "epoch": 125} {"train_loss": -7.195213317871094, "global_step": 21059, "epoch": 125} {"train_loss": -7.094263076782227, "global_step": 21060, "epoch": 125} {"train_loss": -6.556209087371826, "global_step": 21061, "epoch": 125} {"train_loss": -6.910651206970215, "global_step": 21062, "epoch": 125} {"train_loss": -6.702271461486816, "global_step": 21063, "epoch": 125} {"train_loss": -6.889922142028809, "global_step": 21064, "epoch": 125} {"train_loss": -6.73454475402832, "global_step": 21065, "epoch": 125} {"train_loss": -6.723168849945068, "global_step": 21066, "epoch": 125} {"train_loss": -7.032406806945801, "global_step": 21067, "epoch": 125} {"train_loss": -6.886480331420898, "global_step": 21068, "epoch": 125} {"train_loss": -6.882596015930176, "global_step": 21069, "epoch": 125} {"train_loss": -6.811404705047607, "global_step": 21070, "epoch": 125} {"train_loss": -6.764181137084961, "global_step": 21071, "epoch": 125} {"train_loss": -6.901026725769043, "global_step": 21072, "epoch": 125} {"train_loss": -6.743622779846191, "global_step": 21073, "epoch": 125} {"train_loss": -7.083446502685547, "global_step": 21074, "epoch": 125} {"train_loss": -6.837418556213379, "global_step": 21075, "epoch": 125} {"train_loss": -7.014467239379883, "global_step": 21076, "epoch": 125} {"train_loss": -6.894108772277832, "global_step": 21077, "epoch": 125} {"train_loss": -6.859185695648193, "global_step": 21078, "epoch": 125} {"train_loss": -6.683450698852539, "global_step": 21079, "epoch": 125} {"train_loss": -6.792703628540039, "global_step": 21080, "epoch": 125} {"train_loss": -6.860048770904541, "global_step": 21081, "epoch": 125} {"train_loss": -6.962027549743652, "global_step": 21082, "epoch": 125} {"train_loss": -6.886771202087402, "global_step": 21083, "epoch": 125} {"train_loss": -6.939957618713379, "global_step": 21084, "epoch": 125} {"train_loss": -6.759488105773926, "global_step": 21085, "epoch": 125} {"train_loss": -6.978758811950684, "global_step": 21086, "epoch": 125} {"train_loss": -6.889318466186523, "global_step": 21087, "epoch": 125} {"train_loss": -7.087738037109375, "global_step": 21088, "epoch": 125} {"train_loss": -6.883683681488037, "global_step": 21089, "epoch": 125} {"train_loss": -6.721290588378906, "global_step": 21090, "epoch": 125} {"train_loss": -7.019469738006592, "global_step": 21091, "epoch": 125} {"train_loss": -7.00340461730957, "global_step": 21092, "epoch": 125} {"train_loss": -6.735705375671387, "global_step": 21093, "epoch": 125} {"train_loss": -6.740450859069824, "global_step": 21094, "epoch": 125} {"train_loss": -6.913358211517334, "global_step": 21095, "epoch": 125} {"train_loss": -6.738288879394531, "global_step": 21096, "epoch": 125} {"train_loss": -7.021405220031738, "global_step": 21097, "epoch": 125} {"train_loss": -6.717129707336426, "global_step": 21098, "epoch": 125} {"train_loss": -7.000115394592285, "global_step": 21099, "epoch": 125} {"train_loss": -6.973521709442139, "global_step": 21100, "epoch": 125} {"train_loss": -6.765059947967529, "global_step": 21101, "epoch": 125} {"train_loss": -6.665652275085449, "global_step": 21102, "epoch": 125} {"train_loss": -6.845755577087402, "global_step": 21103, "epoch": 125} {"train_loss": -6.700648307800293, "global_step": 21104, "epoch": 125} {"train_loss": -6.789613246917725, "global_step": 21105, "epoch": 125} {"train_loss": -6.9290924072265625, "global_step": 21106, "epoch": 125} {"train_loss": -6.881627082824707, "global_step": 21107, "epoch": 125} {"train_loss": -7.0394697189331055, "global_step": 21108, "epoch": 125} {"train_loss": -6.920982360839844, "global_step": 21109, "epoch": 125} {"train_loss": -6.844131946563721, "global_step": 21110, "epoch": 125} {"train_loss": -6.976588249206543, "global_step": 21111, "epoch": 125} {"train_loss": -6.990102767944336, "global_step": 21112, "epoch": 125} {"train_loss": -6.682458400726318, "global_step": 21113, "epoch": 125} {"train_loss": -7.189336776733398, "global_step": 21114, "epoch": 125} {"train_loss": -7.0790252685546875, "global_step": 21115, "epoch": 125} {"train_loss": -6.987982749938965, "global_step": 21116, "epoch": 125} {"train_loss": -6.898444652557373, "global_step": 21117, "epoch": 125} {"train_loss": -6.723076820373535, "global_step": 21118, "epoch": 125} {"train_loss": -6.997816562652588, "global_step": 21119, "epoch": 125} {"train_loss": -6.75974702835083, "global_step": 21120, "epoch": 125} {"train_loss": -6.812411308288574, "global_step": 21121, "epoch": 125} {"train_loss": -6.945801734924316, "global_step": 21122, "epoch": 125} {"train_loss": -6.91652774810791, "global_step": 21123, "epoch": 125} {"train_loss": -6.943837642669678, "global_step": 21124, "epoch": 125} {"train_loss": -6.754516124725342, "global_step": 21125, "epoch": 125} {"train_loss": -7.016909599304199, "global_step": 21126, "epoch": 125} {"train_loss": -6.802753925323486, "global_step": 21127, "epoch": 125} {"train_loss": -6.916913986206055, "global_step": 21128, "epoch": 125} {"train_loss": -6.651324272155762, "global_step": 21129, "epoch": 125} {"train_loss": -6.744292736053467, "global_step": 21130, "epoch": 125} {"train_loss": -6.851137161254883, "global_step": 21131, "epoch": 125} {"train_loss": -7.15218448638916, "global_step": 21132, "epoch": 125} {"train_loss": -6.717399597167969, "global_step": 21133, "epoch": 125} {"train_loss": -6.729700565338135, "global_step": 21134, "epoch": 125} {"train_loss": -6.880364418029785, "global_step": 21135, "epoch": 125} {"train_loss": -6.662945747375488, "global_step": 21136, "epoch": 125} {"train_loss": -6.895563125610352, "global_step": 21137, "epoch": 125} {"train_loss": -6.58966064453125, "global_step": 21138, "epoch": 125} {"train_loss": -6.958259582519531, "global_step": 21139, "epoch": 125} {"train_loss": -6.810891151428223, "global_step": 21140, "epoch": 125} {"train_loss": -6.638818740844727, "global_step": 21141, "epoch": 125} {"train_loss": -7.113872528076172, "global_step": 21142, "epoch": 125} {"train_loss": -6.950417518615723, "global_step": 21143, "epoch": 125} {"train_loss": -7.017662525177002, "global_step": 21144, "epoch": 125} {"train_loss": -6.683625221252441, "global_step": 21145, "epoch": 125} {"train_loss": -6.937385559082031, "global_step": 21146, "epoch": 125} {"train_loss": -6.873666763305664, "global_step": 21147, "epoch": 125} {"train_loss": -6.668025016784668, "global_step": 21148, "epoch": 125} {"train_loss": -7.064477920532227, "global_step": 21149, "epoch": 125} {"train_loss": -7.003293991088867, "global_step": 21150, "epoch": 125} {"train_loss": -6.942481994628906, "global_step": 21151, "epoch": 125} {"train_loss": -6.944333076477051, "global_step": 21152, "epoch": 125} {"train_loss": -6.9419965744018555, "global_step": 21153, "epoch": 125} {"train_loss": -6.885641098022461, "global_step": 21154, "epoch": 125} {"train_loss": -6.840948581695557, "global_step": 21155, "epoch": 125} {"train_loss": -7.006710052490234, "global_step": 21156, "epoch": 125} {"train_loss": -7.105706214904785, "global_step": 21157, "epoch": 125} {"train_loss": -6.986583709716797, "global_step": 21158, "epoch": 125} {"train_loss": -7.0361528396606445, "global_step": 21159, "epoch": 125} {"train_loss": -6.989255905151367, "global_step": 21160, "epoch": 125} {"train_loss": -6.715274333953857, "global_step": 21161, "epoch": 125} {"train_loss": -6.8161492347717285, "global_step": 21162, "epoch": 125} {"train_loss": -6.886364936828613, "global_step": 21163, "epoch": 125} {"train_loss": -6.98355770111084, "global_step": 21164, "epoch": 125} {"train_loss": -6.92600679397583, "global_step": 21165, "epoch": 125} {"train_loss": -6.888771057128906, "global_step": 21166, "epoch": 125} {"train_loss": -6.856995273204077, "global_step": 21167, "epoch": 125, "val_loss": 212488.125, "train_action_mse_error": 19.68688201904297} {"train_loss": -6.954009056091309, "global_step": 21168, "epoch": 126} {"train_loss": -6.988325119018555, "global_step": 21169, "epoch": 126} {"train_loss": -6.934626579284668, "global_step": 21170, "epoch": 126} {"train_loss": -7.183027744293213, "global_step": 21171, "epoch": 126} {"train_loss": -6.778107643127441, "global_step": 21172, "epoch": 126} {"train_loss": -6.867230415344238, "global_step": 21173, "epoch": 126} {"train_loss": -6.922420978546143, "global_step": 21174, "epoch": 126} {"train_loss": -7.003222942352295, "global_step": 21175, "epoch": 126} {"train_loss": -6.810205459594727, "global_step": 21176, "epoch": 126} {"train_loss": -6.841880798339844, "global_step": 21177, "epoch": 126} {"train_loss": -6.831604957580566, "global_step": 21178, "epoch": 126} {"train_loss": -6.986715316772461, "global_step": 21179, "epoch": 126} {"train_loss": -6.939004898071289, "global_step": 21180, "epoch": 126} {"train_loss": -6.929499626159668, "global_step": 21181, "epoch": 126} {"train_loss": -6.8846540451049805, "global_step": 21182, "epoch": 126} {"train_loss": -6.860653877258301, "global_step": 21183, "epoch": 126} {"train_loss": -6.675901889801025, "global_step": 21184, "epoch": 126} {"train_loss": -6.792572021484375, "global_step": 21185, "epoch": 126} {"train_loss": -6.745709419250488, "global_step": 21186, "epoch": 126} {"train_loss": -7.093959808349609, "global_step": 21187, "epoch": 126} {"train_loss": -6.732780456542969, "global_step": 21188, "epoch": 126} {"train_loss": -6.752973556518555, "global_step": 21189, "epoch": 126} {"train_loss": -6.744582176208496, "global_step": 21190, "epoch": 126} {"train_loss": -7.081314563751221, "global_step": 21191, "epoch": 126} {"train_loss": -6.94866943359375, "global_step": 21192, "epoch": 126} {"train_loss": -6.722787857055664, "global_step": 21193, "epoch": 126} {"train_loss": -7.039117813110352, "global_step": 21194, "epoch": 126} {"train_loss": -6.740108966827393, "global_step": 21195, "epoch": 126} {"train_loss": -7.108431816101074, "global_step": 21196, "epoch": 126} {"train_loss": -6.895852088928223, "global_step": 21197, "epoch": 126} {"train_loss": -6.81243371963501, "global_step": 21198, "epoch": 126} {"train_loss": -7.184655666351318, "global_step": 21199, "epoch": 126} {"train_loss": -6.66227388381958, "global_step": 21200, "epoch": 126} {"train_loss": -6.9599480628967285, "global_step": 21201, "epoch": 126} {"train_loss": -6.907763957977295, "global_step": 21202, "epoch": 126} {"train_loss": -6.968352317810059, "global_step": 21203, "epoch": 126} {"train_loss": -6.734950065612793, "global_step": 21204, "epoch": 126} {"train_loss": -6.972481727600098, "global_step": 21205, "epoch": 126} {"train_loss": -6.823163986206055, "global_step": 21206, "epoch": 126} {"train_loss": -6.937267303466797, "global_step": 21207, "epoch": 126} {"train_loss": -7.129717826843262, "global_step": 21208, "epoch": 126} {"train_loss": -6.638400077819824, "global_step": 21209, "epoch": 126} {"train_loss": -6.937627792358398, "global_step": 21210, "epoch": 126} {"train_loss": -6.744065284729004, "global_step": 21211, "epoch": 126} {"train_loss": -6.903380393981934, "global_step": 21212, "epoch": 126} {"train_loss": -6.604152679443359, "global_step": 21213, "epoch": 126} {"train_loss": -6.922369956970215, "global_step": 21214, "epoch": 126} {"train_loss": -6.762875556945801, "global_step": 21215, "epoch": 126} {"train_loss": -6.697670936584473, "global_step": 21216, "epoch": 126} {"train_loss": -6.87144136428833, "global_step": 21217, "epoch": 126} {"train_loss": -6.801927089691162, "global_step": 21218, "epoch": 126} {"train_loss": -6.854863166809082, "global_step": 21219, "epoch": 126} {"train_loss": -7.258382797241211, "global_step": 21220, "epoch": 126} {"train_loss": -6.968984603881836, "global_step": 21221, "epoch": 126} {"train_loss": -6.921168804168701, "global_step": 21222, "epoch": 126} {"train_loss": -7.07326602935791, "global_step": 21223, "epoch": 126} {"train_loss": -7.115753650665283, "global_step": 21224, "epoch": 126} {"train_loss": -6.898140907287598, "global_step": 21225, "epoch": 126} {"train_loss": -7.077585697174072, "global_step": 21226, "epoch": 126} {"train_loss": -6.803720474243164, "global_step": 21227, "epoch": 126} {"train_loss": -7.063369274139404, "global_step": 21228, "epoch": 126} {"train_loss": -6.977039337158203, "global_step": 21229, "epoch": 126} {"train_loss": -7.030196189880371, "global_step": 21230, "epoch": 126} {"train_loss": -6.5766096115112305, "global_step": 21231, "epoch": 126} {"train_loss": -6.67647647857666, "global_step": 21232, "epoch": 126} {"train_loss": -6.744745254516602, "global_step": 21233, "epoch": 126} {"train_loss": -6.8092451095581055, "global_step": 21234, "epoch": 126} {"train_loss": -6.741240501403809, "global_step": 21235, "epoch": 126} {"train_loss": -6.744029521942139, "global_step": 21236, "epoch": 126} {"train_loss": -6.893841743469238, "global_step": 21237, "epoch": 126} {"train_loss": -6.709993362426758, "global_step": 21238, "epoch": 126} {"train_loss": -6.770414352416992, "global_step": 21239, "epoch": 126} {"train_loss": -6.780892372131348, "global_step": 21240, "epoch": 126} {"train_loss": -6.925458908081055, "global_step": 21241, "epoch": 126} {"train_loss": -7.0267863273620605, "global_step": 21242, "epoch": 126} {"train_loss": -6.739867210388184, "global_step": 21243, "epoch": 126} {"train_loss": -6.715287208557129, "global_step": 21244, "epoch": 126} {"train_loss": -6.894981861114502, "global_step": 21245, "epoch": 126} {"train_loss": -7.09178352355957, "global_step": 21246, "epoch": 126} {"train_loss": -7.071403503417969, "global_step": 21247, "epoch": 126} {"train_loss": -6.872941017150879, "global_step": 21248, "epoch": 126} {"train_loss": -6.738816738128662, "global_step": 21249, "epoch": 126} {"train_loss": -6.927717685699463, "global_step": 21250, "epoch": 126} {"train_loss": -6.522356033325195, "global_step": 21251, "epoch": 126} {"train_loss": -6.758363723754883, "global_step": 21252, "epoch": 126} {"train_loss": -6.860757827758789, "global_step": 21253, "epoch": 126} {"train_loss": -6.947963714599609, "global_step": 21254, "epoch": 126} {"train_loss": -6.784239292144775, "global_step": 21255, "epoch": 126} {"train_loss": -6.833264350891113, "global_step": 21256, "epoch": 126} {"train_loss": -7.168834686279297, "global_step": 21257, "epoch": 126} {"train_loss": -6.891298294067383, "global_step": 21258, "epoch": 126} {"train_loss": -6.960712432861328, "global_step": 21259, "epoch": 126} {"train_loss": -7.089951515197754, "global_step": 21260, "epoch": 126} {"train_loss": -6.724483489990234, "global_step": 21261, "epoch": 126} {"train_loss": -7.020404815673828, "global_step": 21262, "epoch": 126} {"train_loss": -7.028110980987549, "global_step": 21263, "epoch": 126} {"train_loss": -6.864853858947754, "global_step": 21264, "epoch": 126} {"train_loss": -6.823945045471191, "global_step": 21265, "epoch": 126} {"train_loss": -6.973848342895508, "global_step": 21266, "epoch": 126} {"train_loss": -6.702727794647217, "global_step": 21267, "epoch": 126} {"train_loss": -6.823016166687012, "global_step": 21268, "epoch": 126} {"train_loss": -6.951696395874023, "global_step": 21269, "epoch": 126} {"train_loss": -6.806422233581543, "global_step": 21270, "epoch": 126} {"train_loss": -7.115355491638184, "global_step": 21271, "epoch": 126} {"train_loss": -7.05855655670166, "global_step": 21272, "epoch": 126} {"train_loss": -6.928053379058838, "global_step": 21273, "epoch": 126} {"train_loss": -6.898217678070068, "global_step": 21274, "epoch": 126} {"train_loss": -7.050436019897461, "global_step": 21275, "epoch": 126} {"train_loss": -6.899444580078125, "global_step": 21276, "epoch": 126} {"train_loss": -7.131222248077393, "global_step": 21277, "epoch": 126} {"train_loss": -7.061077117919922, "global_step": 21278, "epoch": 126} {"train_loss": -6.80302095413208, "global_step": 21279, "epoch": 126} {"train_loss": -6.966241836547852, "global_step": 21280, "epoch": 126} {"train_loss": -7.050844669342041, "global_step": 21281, "epoch": 126} {"train_loss": -6.974127769470215, "global_step": 21282, "epoch": 126} {"train_loss": -7.169137954711914, "global_step": 21283, "epoch": 126} {"train_loss": -7.033530235290527, "global_step": 21284, "epoch": 126} {"train_loss": -7.150634288787842, "global_step": 21285, "epoch": 126} {"train_loss": -6.951396942138672, "global_step": 21286, "epoch": 126} {"train_loss": -6.980322360992432, "global_step": 21287, "epoch": 126} {"train_loss": -6.812294960021973, "global_step": 21288, "epoch": 126} {"train_loss": -7.110627174377441, "global_step": 21289, "epoch": 126} {"train_loss": -6.726261615753174, "global_step": 21290, "epoch": 126} {"train_loss": -7.030519485473633, "global_step": 21291, "epoch": 126} {"train_loss": -7.111401557922363, "global_step": 21292, "epoch": 126} {"train_loss": -6.718985557556152, "global_step": 21293, "epoch": 126} {"train_loss": -7.160797595977783, "global_step": 21294, "epoch": 126} {"train_loss": -6.675604343414307, "global_step": 21295, "epoch": 126} {"train_loss": -7.061450481414795, "global_step": 21296, "epoch": 126} {"train_loss": -6.786105155944824, "global_step": 21297, "epoch": 126} {"train_loss": -7.076658248901367, "global_step": 21298, "epoch": 126} {"train_loss": -7.150402069091797, "global_step": 21299, "epoch": 126} {"train_loss": -6.96093225479126, "global_step": 21300, "epoch": 126} {"train_loss": -6.819671154022217, "global_step": 21301, "epoch": 126} {"train_loss": -7.131898880004883, "global_step": 21302, "epoch": 126} {"train_loss": -6.920734405517578, "global_step": 21303, "epoch": 126} {"train_loss": -6.747420310974121, "global_step": 21304, "epoch": 126} {"train_loss": -7.179814338684082, "global_step": 21305, "epoch": 126} {"train_loss": -7.00541353225708, "global_step": 21306, "epoch": 126} {"train_loss": -6.82023811340332, "global_step": 21307, "epoch": 126} {"train_loss": -6.985185623168945, "global_step": 21308, "epoch": 126} {"train_loss": -7.1788434982299805, "global_step": 21309, "epoch": 126} {"train_loss": -7.183884620666504, "global_step": 21310, "epoch": 126} {"train_loss": -6.876033782958984, "global_step": 21311, "epoch": 126} {"train_loss": -7.16139030456543, "global_step": 21312, "epoch": 126} {"train_loss": -7.123899459838867, "global_step": 21313, "epoch": 126} {"train_loss": -6.9852142333984375, "global_step": 21314, "epoch": 126} {"train_loss": -6.967690467834473, "global_step": 21315, "epoch": 126} {"train_loss": -6.749338150024414, "global_step": 21316, "epoch": 126} {"train_loss": -7.2342119216918945, "global_step": 21317, "epoch": 126} {"train_loss": -6.688628673553467, "global_step": 21318, "epoch": 126} {"train_loss": -6.710618019104004, "global_step": 21319, "epoch": 126} {"train_loss": -7.1141252517700195, "global_step": 21320, "epoch": 126} {"train_loss": -6.9953718185424805, "global_step": 21321, "epoch": 126} {"train_loss": -6.930645942687988, "global_step": 21322, "epoch": 126} {"train_loss": -7.0832719802856445, "global_step": 21323, "epoch": 126} {"train_loss": -7.232109069824219, "global_step": 21324, "epoch": 126} {"train_loss": -7.128185749053955, "global_step": 21325, "epoch": 126} {"train_loss": -7.1387810707092285, "global_step": 21326, "epoch": 126} {"train_loss": -6.993902683258057, "global_step": 21327, "epoch": 126} {"train_loss": -6.972810745239258, "global_step": 21328, "epoch": 126} {"train_loss": -6.907787322998047, "global_step": 21329, "epoch": 126} {"train_loss": -7.071380615234375, "global_step": 21330, "epoch": 126} {"train_loss": -6.7752909660339355, "global_step": 21331, "epoch": 126} {"train_loss": -6.86318302154541, "global_step": 21332, "epoch": 126} {"train_loss": -7.045015811920166, "global_step": 21333, "epoch": 126} {"train_loss": -6.829804420471191, "global_step": 21334, "epoch": 126} {"train_loss": -6.921182666506086, "global_step": 21335, "epoch": 126, "val_loss": 212527.078125} {"train_loss": -6.994752407073975, "global_step": 21336, "epoch": 127} {"train_loss": -6.985062122344971, "global_step": 21337, "epoch": 127} {"train_loss": -7.064087867736816, "global_step": 21338, "epoch": 127} {"train_loss": -6.890140533447266, "global_step": 21339, "epoch": 127} {"train_loss": -7.028964996337891, "global_step": 21340, "epoch": 127} {"train_loss": -6.961148738861084, "global_step": 21341, "epoch": 127} {"train_loss": -6.794981956481934, "global_step": 21342, "epoch": 127} {"train_loss": -6.55186653137207, "global_step": 21343, "epoch": 127} {"train_loss": -6.85939884185791, "global_step": 21344, "epoch": 127} {"train_loss": -6.664477348327637, "global_step": 21345, "epoch": 127} {"train_loss": -6.915652751922607, "global_step": 21346, "epoch": 127} {"train_loss": -6.848463535308838, "global_step": 21347, "epoch": 127} {"train_loss": -6.790154457092285, "global_step": 21348, "epoch": 127} {"train_loss": -6.890067100524902, "global_step": 21349, "epoch": 127} {"train_loss": -6.933295249938965, "global_step": 21350, "epoch": 127} {"train_loss": -7.0043745040893555, "global_step": 21351, "epoch": 127} {"train_loss": -6.989545822143555, "global_step": 21352, "epoch": 127} {"train_loss": -6.906477928161621, "global_step": 21353, "epoch": 127} {"train_loss": -6.831830978393555, "global_step": 21354, "epoch": 127} {"train_loss": -6.772071361541748, "global_step": 21355, "epoch": 127} {"train_loss": -7.137869834899902, "global_step": 21356, "epoch": 127} {"train_loss": -7.1976494789123535, "global_step": 21357, "epoch": 127} {"train_loss": -6.871036529541016, "global_step": 21358, "epoch": 127} {"train_loss": -7.2116007804870605, "global_step": 21359, "epoch": 127} {"train_loss": -6.785656452178955, "global_step": 21360, "epoch": 127} {"train_loss": -6.991178512573242, "global_step": 21361, "epoch": 127} {"train_loss": -7.220339775085449, "global_step": 21362, "epoch": 127} {"train_loss": -6.965945720672607, "global_step": 21363, "epoch": 127} {"train_loss": -7.102677822113037, "global_step": 21364, "epoch": 127} {"train_loss": -6.870248794555664, "global_step": 21365, "epoch": 127} {"train_loss": -6.773850917816162, "global_step": 21366, "epoch": 127} {"train_loss": -6.82008171081543, "global_step": 21367, "epoch": 127} {"train_loss": -6.7159857749938965, "global_step": 21368, "epoch": 127} {"train_loss": -6.881131172180176, "global_step": 21369, "epoch": 127} {"train_loss": -7.080380439758301, "global_step": 21370, "epoch": 127} {"train_loss": -6.882763385772705, "global_step": 21371, "epoch": 127} {"train_loss": -6.819285869598389, "global_step": 21372, "epoch": 127} {"train_loss": -6.942290782928467, "global_step": 21373, "epoch": 127} {"train_loss": -6.803150653839111, "global_step": 21374, "epoch": 127} {"train_loss": -7.0281572341918945, "global_step": 21375, "epoch": 127} {"train_loss": -6.705021858215332, "global_step": 21376, "epoch": 127} {"train_loss": -6.878685474395752, "global_step": 21377, "epoch": 127} {"train_loss": -6.657807350158691, "global_step": 21378, "epoch": 127} {"train_loss": -6.92140007019043, "global_step": 21379, "epoch": 127} {"train_loss": -6.804184913635254, "global_step": 21380, "epoch": 127} {"train_loss": -6.954587936401367, "global_step": 21381, "epoch": 127} {"train_loss": -6.851839065551758, "global_step": 21382, "epoch": 127} {"train_loss": -7.065141677856445, "global_step": 21383, "epoch": 127} {"train_loss": -6.8047285079956055, "global_step": 21384, "epoch": 127} {"train_loss": -6.903704643249512, "global_step": 21385, "epoch": 127} {"train_loss": -7.111710548400879, "global_step": 21386, "epoch": 127} {"train_loss": -6.713612079620361, "global_step": 21387, "epoch": 127} {"train_loss": -6.925834655761719, "global_step": 21388, "epoch": 127} {"train_loss": -6.732168197631836, "global_step": 21389, "epoch": 127} {"train_loss": -7.003792762756348, "global_step": 21390, "epoch": 127} {"train_loss": -6.907230854034424, "global_step": 21391, "epoch": 127} {"train_loss": -6.798257827758789, "global_step": 21392, "epoch": 127} {"train_loss": -7.010140419006348, "global_step": 21393, "epoch": 127} {"train_loss": -7.0120086669921875, "global_step": 21394, "epoch": 127} {"train_loss": -6.921515464782715, "global_step": 21395, "epoch": 127} {"train_loss": -7.0216569900512695, "global_step": 21396, "epoch": 127} {"train_loss": -6.867283344268799, "global_step": 21397, "epoch": 127} {"train_loss": -6.698395729064941, "global_step": 21398, "epoch": 127} {"train_loss": -7.00240421295166, "global_step": 21399, "epoch": 127} {"train_loss": -7.21650505065918, "global_step": 21400, "epoch": 127} {"train_loss": -6.999114036560059, "global_step": 21401, "epoch": 127} {"train_loss": -7.046264171600342, "global_step": 21402, "epoch": 127} {"train_loss": -7.0721025466918945, "global_step": 21403, "epoch": 127} {"train_loss": -7.135509967803955, "global_step": 21404, "epoch": 127} {"train_loss": -7.049740791320801, "global_step": 21405, "epoch": 127} {"train_loss": -7.189605712890625, "global_step": 21406, "epoch": 127} {"train_loss": -6.957948207855225, "global_step": 21407, "epoch": 127} {"train_loss": -6.8275146484375, "global_step": 21408, "epoch": 127} {"train_loss": -6.908970355987549, "global_step": 21409, "epoch": 127} {"train_loss": -6.85080623626709, "global_step": 21410, "epoch": 127} {"train_loss": -6.579987525939941, "global_step": 21411, "epoch": 127} {"train_loss": -7.029208660125732, "global_step": 21412, "epoch": 127} {"train_loss": -6.932154655456543, "global_step": 21413, "epoch": 127} {"train_loss": -6.999285697937012, "global_step": 21414, "epoch": 127} {"train_loss": -6.960594654083252, "global_step": 21415, "epoch": 127} {"train_loss": -7.033468723297119, "global_step": 21416, "epoch": 127} {"train_loss": -6.829288482666016, "global_step": 21417, "epoch": 127} {"train_loss": -7.023125648498535, "global_step": 21418, "epoch": 127} {"train_loss": -7.130834579467773, "global_step": 21419, "epoch": 127} {"train_loss": -6.846429824829102, "global_step": 21420, "epoch": 127} {"train_loss": -6.789401054382324, "global_step": 21421, "epoch": 127} {"train_loss": -7.050314426422119, "global_step": 21422, "epoch": 127} {"train_loss": -6.814977169036865, "global_step": 21423, "epoch": 127} {"train_loss": -6.990180015563965, "global_step": 21424, "epoch": 127} {"train_loss": -6.929619789123535, "global_step": 21425, "epoch": 127} {"train_loss": -6.936644554138184, "global_step": 21426, "epoch": 127} {"train_loss": -7.078527450561523, "global_step": 21427, "epoch": 127} {"train_loss": -6.819820404052734, "global_step": 21428, "epoch": 127} {"train_loss": -6.999971389770508, "global_step": 21429, "epoch": 127} {"train_loss": -6.985909938812256, "global_step": 21430, "epoch": 127} {"train_loss": -7.071127414703369, "global_step": 21431, "epoch": 127} {"train_loss": -7.055328845977783, "global_step": 21432, "epoch": 127} {"train_loss": -6.988867282867432, "global_step": 21433, "epoch": 127} {"train_loss": -6.7485833168029785, "global_step": 21434, "epoch": 127} {"train_loss": -6.806765556335449, "global_step": 21435, "epoch": 127} {"train_loss": -6.526584625244141, "global_step": 21436, "epoch": 127} {"train_loss": -7.019876956939697, "global_step": 21437, "epoch": 127} {"train_loss": -6.93629789352417, "global_step": 21438, "epoch": 127} {"train_loss": -6.997134208679199, "global_step": 21439, "epoch": 127} {"train_loss": -7.0888285636901855, "global_step": 21440, "epoch": 127} {"train_loss": -6.92646598815918, "global_step": 21441, "epoch": 127} {"train_loss": -6.880002021789551, "global_step": 21442, "epoch": 127} {"train_loss": -6.782673358917236, "global_step": 21443, "epoch": 127} {"train_loss": -7.169365882873535, "global_step": 21444, "epoch": 127} {"train_loss": -7.121018409729004, "global_step": 21445, "epoch": 127} {"train_loss": -7.1005024909973145, "global_step": 21446, "epoch": 127} {"train_loss": -7.012094497680664, "global_step": 21447, "epoch": 127} {"train_loss": -6.733899116516113, "global_step": 21448, "epoch": 127} {"train_loss": -6.944784164428711, "global_step": 21449, "epoch": 127} {"train_loss": -6.78371000289917, "global_step": 21450, "epoch": 127} {"train_loss": -7.110902309417725, "global_step": 21451, "epoch": 127} {"train_loss": -6.948451042175293, "global_step": 21452, "epoch": 127} {"train_loss": -7.178958415985107, "global_step": 21453, "epoch": 127} {"train_loss": -6.808485984802246, "global_step": 21454, "epoch": 127} {"train_loss": -7.042438983917236, "global_step": 21455, "epoch": 127} {"train_loss": -6.965407371520996, "global_step": 21456, "epoch": 127} {"train_loss": -6.946649074554443, "global_step": 21457, "epoch": 127} {"train_loss": -7.215854644775391, "global_step": 21458, "epoch": 127} {"train_loss": -6.978139400482178, "global_step": 21459, "epoch": 127} {"train_loss": -6.910869121551514, "global_step": 21460, "epoch": 127} {"train_loss": -6.9733686447143555, "global_step": 21461, "epoch": 127} {"train_loss": -6.998945236206055, "global_step": 21462, "epoch": 127} {"train_loss": -7.012124538421631, "global_step": 21463, "epoch": 127} {"train_loss": -6.875007629394531, "global_step": 21464, "epoch": 127} {"train_loss": -7.11885929107666, "global_step": 21465, "epoch": 127} {"train_loss": -6.978761672973633, "global_step": 21466, "epoch": 127} {"train_loss": -7.00167179107666, "global_step": 21467, "epoch": 127} {"train_loss": -7.030936241149902, "global_step": 21468, "epoch": 127} {"train_loss": -6.947118282318115, "global_step": 21469, "epoch": 127} {"train_loss": -6.790401935577393, "global_step": 21470, "epoch": 127} {"train_loss": -7.036920547485352, "global_step": 21471, "epoch": 127} {"train_loss": -6.884886741638184, "global_step": 21472, "epoch": 127} {"train_loss": -6.870550155639648, "global_step": 21473, "epoch": 127} {"train_loss": -7.0327558517456055, "global_step": 21474, "epoch": 127} {"train_loss": -6.741411209106445, "global_step": 21475, "epoch": 127} {"train_loss": -6.878077507019043, "global_step": 21476, "epoch": 127} {"train_loss": -6.860408306121826, "global_step": 21477, "epoch": 127} {"train_loss": -6.921477317810059, "global_step": 21478, "epoch": 127} {"train_loss": -6.827097415924072, "global_step": 21479, "epoch": 127} {"train_loss": -6.875511169433594, "global_step": 21480, "epoch": 127} {"train_loss": -7.02334451675415, "global_step": 21481, "epoch": 127} {"train_loss": -6.952192306518555, "global_step": 21482, "epoch": 127} {"train_loss": -7.108809471130371, "global_step": 21483, "epoch": 127} {"train_loss": -6.907243728637695, "global_step": 21484, "epoch": 127} {"train_loss": -7.114707946777344, "global_step": 21485, "epoch": 127} {"train_loss": -6.860172748565674, "global_step": 21486, "epoch": 127} {"train_loss": -6.906431198120117, "global_step": 21487, "epoch": 127} {"train_loss": -6.9276885986328125, "global_step": 21488, "epoch": 127} {"train_loss": -6.736504077911377, "global_step": 21489, "epoch": 127} {"train_loss": -6.845315933227539, "global_step": 21490, "epoch": 127} {"train_loss": -7.082792282104492, "global_step": 21491, "epoch": 127} {"train_loss": -6.837429046630859, "global_step": 21492, "epoch": 127} {"train_loss": -6.927474021911621, "global_step": 21493, "epoch": 127} {"train_loss": -7.054042339324951, "global_step": 21494, "epoch": 127} {"train_loss": -6.638166427612305, "global_step": 21495, "epoch": 127} {"train_loss": -6.9192681312561035, "global_step": 21496, "epoch": 127} {"train_loss": -6.581646919250488, "global_step": 21497, "epoch": 127} {"train_loss": -6.668994426727295, "global_step": 21498, "epoch": 127} {"train_loss": -6.498395919799805, "global_step": 21499, "epoch": 127} {"train_loss": -6.641583442687988, "global_step": 21500, "epoch": 127} {"train_loss": -6.986328125, "global_step": 21501, "epoch": 127} {"train_loss": -6.638361930847168, "global_step": 21502, "epoch": 127} {"train_loss": -6.924549224830809, "global_step": 21503, "epoch": 127, "val_loss": 208191.796875} {"train_loss": -6.912308692932129, "global_step": 21504, "epoch": 128} {"train_loss": -6.851051330566406, "global_step": 21505, "epoch": 128} {"train_loss": -6.930116653442383, "global_step": 21506, "epoch": 128} {"train_loss": -6.893135070800781, "global_step": 21507, "epoch": 128} {"train_loss": -7.040068626403809, "global_step": 21508, "epoch": 128} {"train_loss": -6.946482181549072, "global_step": 21509, "epoch": 128} {"train_loss": -6.944554328918457, "global_step": 21510, "epoch": 128} {"train_loss": -7.179581165313721, "global_step": 21511, "epoch": 128} {"train_loss": -6.812654495239258, "global_step": 21512, "epoch": 128} {"train_loss": -6.797898292541504, "global_step": 21513, "epoch": 128} {"train_loss": -7.000738143920898, "global_step": 21514, "epoch": 128} {"train_loss": -6.841885089874268, "global_step": 21515, "epoch": 128} {"train_loss": -7.00541877746582, "global_step": 21516, "epoch": 128} {"train_loss": -6.946758270263672, "global_step": 21517, "epoch": 128} {"train_loss": -6.890036582946777, "global_step": 21518, "epoch": 128} {"train_loss": -7.01707649230957, "global_step": 21519, "epoch": 128} {"train_loss": -6.847001075744629, "global_step": 21520, "epoch": 128} {"train_loss": -6.762924671173096, "global_step": 21521, "epoch": 128} {"train_loss": -7.103211402893066, "global_step": 21522, "epoch": 128} {"train_loss": -6.828947067260742, "global_step": 21523, "epoch": 128} {"train_loss": -7.020416736602783, "global_step": 21524, "epoch": 128} {"train_loss": -6.766463279724121, "global_step": 21525, "epoch": 128} {"train_loss": -6.9508748054504395, "global_step": 21526, "epoch": 128} {"train_loss": -6.770266056060791, "global_step": 21527, "epoch": 128} {"train_loss": -6.844630241394043, "global_step": 21528, "epoch": 128} {"train_loss": -6.801987171173096, "global_step": 21529, "epoch": 128} {"train_loss": -6.85422945022583, "global_step": 21530, "epoch": 128} {"train_loss": -6.914633274078369, "global_step": 21531, "epoch": 128} {"train_loss": -6.957437515258789, "global_step": 21532, "epoch": 128} {"train_loss": -6.793773651123047, "global_step": 21533, "epoch": 128} {"train_loss": -6.929831504821777, "global_step": 21534, "epoch": 128} {"train_loss": -7.059909820556641, "global_step": 21535, "epoch": 128} {"train_loss": -7.011969566345215, "global_step": 21536, "epoch": 128} {"train_loss": -7.0886430740356445, "global_step": 21537, "epoch": 128} {"train_loss": -7.055574417114258, "global_step": 21538, "epoch": 128} {"train_loss": -6.932103157043457, "global_step": 21539, "epoch": 128} {"train_loss": -6.920823097229004, "global_step": 21540, "epoch": 128} {"train_loss": -7.130428314208984, "global_step": 21541, "epoch": 128} {"train_loss": -6.9556684494018555, "global_step": 21542, "epoch": 128} {"train_loss": -6.717886924743652, "global_step": 21543, "epoch": 128} {"train_loss": -6.900954723358154, "global_step": 21544, "epoch": 128} {"train_loss": -7.009120464324951, "global_step": 21545, "epoch": 128} {"train_loss": -7.172730445861816, "global_step": 21546, "epoch": 128} {"train_loss": -6.96806526184082, "global_step": 21547, "epoch": 128} {"train_loss": -7.0218658447265625, "global_step": 21548, "epoch": 128} {"train_loss": -7.124477386474609, "global_step": 21549, "epoch": 128} {"train_loss": -6.973273277282715, "global_step": 21550, "epoch": 128} {"train_loss": -7.073647499084473, "global_step": 21551, "epoch": 128} {"train_loss": -7.017158031463623, "global_step": 21552, "epoch": 128} {"train_loss": -6.9928436279296875, "global_step": 21553, "epoch": 128} {"train_loss": -6.8233489990234375, "global_step": 21554, "epoch": 128} {"train_loss": -7.365800380706787, "global_step": 21555, "epoch": 128} {"train_loss": -6.952332973480225, "global_step": 21556, "epoch": 128} {"train_loss": -7.06425666809082, "global_step": 21557, "epoch": 128} {"train_loss": -6.885706901550293, "global_step": 21558, "epoch": 128} {"train_loss": -6.965096473693848, "global_step": 21559, "epoch": 128} {"train_loss": -6.972869396209717, "global_step": 21560, "epoch": 128} {"train_loss": -6.799003601074219, "global_step": 21561, "epoch": 128} {"train_loss": -6.88552188873291, "global_step": 21562, "epoch": 128} {"train_loss": -6.923834323883057, "global_step": 21563, "epoch": 128} {"train_loss": -7.132377624511719, "global_step": 21564, "epoch": 128} {"train_loss": -7.0991668701171875, "global_step": 21565, "epoch": 128} {"train_loss": -7.044184684753418, "global_step": 21566, "epoch": 128} {"train_loss": -7.204163074493408, "global_step": 21567, "epoch": 128} {"train_loss": -6.780348777770996, "global_step": 21568, "epoch": 128} {"train_loss": -6.997668743133545, "global_step": 21569, "epoch": 128} {"train_loss": -6.836531639099121, "global_step": 21570, "epoch": 128} {"train_loss": -6.913066387176514, "global_step": 21571, "epoch": 128} {"train_loss": -6.9251885414123535, "global_step": 21572, "epoch": 128} {"train_loss": -6.580696105957031, "global_step": 21573, "epoch": 128} {"train_loss": -6.927762985229492, "global_step": 21574, "epoch": 128} {"train_loss": -6.879256248474121, "global_step": 21575, "epoch": 128} {"train_loss": -6.855943202972412, "global_step": 21576, "epoch": 128} {"train_loss": -6.7879533767700195, "global_step": 21577, "epoch": 128} {"train_loss": -6.731870651245117, "global_step": 21578, "epoch": 128} {"train_loss": -6.906285285949707, "global_step": 21579, "epoch": 128} {"train_loss": -6.465334415435791, "global_step": 21580, "epoch": 128} {"train_loss": -6.920828819274902, "global_step": 21581, "epoch": 128} {"train_loss": -6.855959892272949, "global_step": 21582, "epoch": 128} {"train_loss": -7.001185894012451, "global_step": 21583, "epoch": 128} {"train_loss": -6.94484806060791, "global_step": 21584, "epoch": 128} {"train_loss": -7.018401145935059, "global_step": 21585, "epoch": 128} {"train_loss": -6.943838119506836, "global_step": 21586, "epoch": 128} {"train_loss": -7.025144577026367, "global_step": 21587, "epoch": 128} {"train_loss": -7.160772323608398, "global_step": 21588, "epoch": 128} {"train_loss": -6.937239170074463, "global_step": 21589, "epoch": 128} {"train_loss": -7.143854141235352, "global_step": 21590, "epoch": 128} {"train_loss": -6.748928070068359, "global_step": 21591, "epoch": 128} {"train_loss": -6.969006061553955, "global_step": 21592, "epoch": 128} {"train_loss": -7.029620170593262, "global_step": 21593, "epoch": 128} {"train_loss": -6.970831394195557, "global_step": 21594, "epoch": 128} {"train_loss": -6.916990280151367, "global_step": 21595, "epoch": 128} {"train_loss": -6.860684394836426, "global_step": 21596, "epoch": 128} {"train_loss": -7.027072906494141, "global_step": 21597, "epoch": 128} {"train_loss": -6.676604270935059, "global_step": 21598, "epoch": 128} {"train_loss": -6.915223121643066, "global_step": 21599, "epoch": 128} {"train_loss": -6.88123083114624, "global_step": 21600, "epoch": 128} {"train_loss": -7.005834579467773, "global_step": 21601, "epoch": 128} {"train_loss": -7.009106636047363, "global_step": 21602, "epoch": 128} {"train_loss": -6.997652053833008, "global_step": 21603, "epoch": 128} {"train_loss": -6.935199737548828, "global_step": 21604, "epoch": 128} {"train_loss": -7.0046844482421875, "global_step": 21605, "epoch": 128} {"train_loss": -6.864171504974365, "global_step": 21606, "epoch": 128} {"train_loss": -6.799233436584473, "global_step": 21607, "epoch": 128} {"train_loss": -7.184285640716553, "global_step": 21608, "epoch": 128} {"train_loss": -6.795947074890137, "global_step": 21609, "epoch": 128} {"train_loss": -7.155422210693359, "global_step": 21610, "epoch": 128} {"train_loss": -6.892414093017578, "global_step": 21611, "epoch": 128} {"train_loss": -6.901686668395996, "global_step": 21612, "epoch": 128} {"train_loss": -6.730475425720215, "global_step": 21613, "epoch": 128} {"train_loss": -6.839259624481201, "global_step": 21614, "epoch": 128} {"train_loss": -6.620927810668945, "global_step": 21615, "epoch": 128} {"train_loss": -6.763744354248047, "global_step": 21616, "epoch": 128} {"train_loss": -6.7999162673950195, "global_step": 21617, "epoch": 128} {"train_loss": -6.718758583068848, "global_step": 21618, "epoch": 128} {"train_loss": -6.60885763168335, "global_step": 21619, "epoch": 128} {"train_loss": -6.603201866149902, "global_step": 21620, "epoch": 128} {"train_loss": -6.831079483032227, "global_step": 21621, "epoch": 128} {"train_loss": -6.731334686279297, "global_step": 21622, "epoch": 128} {"train_loss": -6.622928619384766, "global_step": 21623, "epoch": 128} {"train_loss": -6.893281936645508, "global_step": 21624, "epoch": 128} {"train_loss": -6.821476936340332, "global_step": 21625, "epoch": 128} {"train_loss": -6.858386039733887, "global_step": 21626, "epoch": 128} {"train_loss": -6.881980895996094, "global_step": 21627, "epoch": 128} {"train_loss": -6.837182998657227, "global_step": 21628, "epoch": 128} {"train_loss": -6.6125311851501465, "global_step": 21629, "epoch": 128} {"train_loss": -6.799964904785156, "global_step": 21630, "epoch": 128} {"train_loss": -6.889351844787598, "global_step": 21631, "epoch": 128} {"train_loss": -6.748818874359131, "global_step": 21632, "epoch": 128} {"train_loss": -6.580706596374512, "global_step": 21633, "epoch": 128} {"train_loss": -6.764994144439697, "global_step": 21634, "epoch": 128} {"train_loss": -7.05278205871582, "global_step": 21635, "epoch": 128} {"train_loss": -6.594142913818359, "global_step": 21636, "epoch": 128} {"train_loss": -6.7098388671875, "global_step": 21637, "epoch": 128} {"train_loss": -7.105197429656982, "global_step": 21638, "epoch": 128} {"train_loss": -6.953207969665527, "global_step": 21639, "epoch": 128} {"train_loss": -6.9428815841674805, "global_step": 21640, "epoch": 128} {"train_loss": -6.682173728942871, "global_step": 21641, "epoch": 128} {"train_loss": -7.062212944030762, "global_step": 21642, "epoch": 128} {"train_loss": -6.821136951446533, "global_step": 21643, "epoch": 128} {"train_loss": -6.779138565063477, "global_step": 21644, "epoch": 128} {"train_loss": -7.0845136642456055, "global_step": 21645, "epoch": 128} {"train_loss": -6.932743549346924, "global_step": 21646, "epoch": 128} {"train_loss": -6.956480026245117, "global_step": 21647, "epoch": 128} {"train_loss": -7.029875755310059, "global_step": 21648, "epoch": 128} {"train_loss": -6.853692531585693, "global_step": 21649, "epoch": 128} {"train_loss": -6.84439754486084, "global_step": 21650, "epoch": 128} {"train_loss": -6.9110002517700195, "global_step": 21651, "epoch": 128} {"train_loss": -6.938731670379639, "global_step": 21652, "epoch": 128} {"train_loss": -7.045167922973633, "global_step": 21653, "epoch": 128} {"train_loss": -7.077700138092041, "global_step": 21654, "epoch": 128} {"train_loss": -7.0179643630981445, "global_step": 21655, "epoch": 128} {"train_loss": -6.942198753356934, "global_step": 21656, "epoch": 128} {"train_loss": -7.1334381103515625, "global_step": 21657, "epoch": 128} {"train_loss": -7.060135841369629, "global_step": 21658, "epoch": 128} {"train_loss": -7.194675922393799, "global_step": 21659, "epoch": 128} {"train_loss": -7.1005859375, "global_step": 21660, "epoch": 128} {"train_loss": -7.182909965515137, "global_step": 21661, "epoch": 128} {"train_loss": -6.765178203582764, "global_step": 21662, "epoch": 128} {"train_loss": -6.900483131408691, "global_step": 21663, "epoch": 128} {"train_loss": -7.0515947341918945, "global_step": 21664, "epoch": 128} {"train_loss": -7.069883346557617, "global_step": 21665, "epoch": 128} {"train_loss": -7.0460004806518555, "global_step": 21666, "epoch": 128} {"train_loss": -6.891860485076904, "global_step": 21667, "epoch": 128} {"train_loss": -7.0580339431762695, "global_step": 21668, "epoch": 128} {"train_loss": -6.866514205932617, "global_step": 21669, "epoch": 128} {"train_loss": -7.058632850646973, "global_step": 21670, "epoch": 128} {"train_loss": -6.920563902173724, "global_step": 21671, "epoch": 128, "val_loss": 208592.296875} {"train_loss": -7.001150608062744, "global_step": 21672, "epoch": 129} {"train_loss": -6.9274396896362305, "global_step": 21673, "epoch": 129} {"train_loss": -6.842032432556152, "global_step": 21674, "epoch": 129} {"train_loss": -6.923695087432861, "global_step": 21675, "epoch": 129} {"train_loss": -7.0235700607299805, "global_step": 21676, "epoch": 129} {"train_loss": -6.992351531982422, "global_step": 21677, "epoch": 129} {"train_loss": -6.75175666809082, "global_step": 21678, "epoch": 129} {"train_loss": -6.8116936683654785, "global_step": 21679, "epoch": 129} {"train_loss": -6.91762113571167, "global_step": 21680, "epoch": 129} {"train_loss": -6.893328666687012, "global_step": 21681, "epoch": 129} {"train_loss": -6.821467399597168, "global_step": 21682, "epoch": 129} {"train_loss": -6.995052337646484, "global_step": 21683, "epoch": 129} {"train_loss": -6.791123867034912, "global_step": 21684, "epoch": 129} {"train_loss": -7.017080307006836, "global_step": 21685, "epoch": 129} {"train_loss": -6.965175628662109, "global_step": 21686, "epoch": 129} {"train_loss": -6.5613322257995605, "global_step": 21687, "epoch": 129} {"train_loss": -6.857610702514648, "global_step": 21688, "epoch": 129} {"train_loss": -6.883541107177734, "global_step": 21689, "epoch": 129} {"train_loss": -6.926238536834717, "global_step": 21690, "epoch": 129} {"train_loss": -6.856623649597168, "global_step": 21691, "epoch": 129} {"train_loss": -6.992642402648926, "global_step": 21692, "epoch": 129} {"train_loss": -6.996055603027344, "global_step": 21693, "epoch": 129} {"train_loss": -7.218873023986816, "global_step": 21694, "epoch": 129} {"train_loss": -7.061641693115234, "global_step": 21695, "epoch": 129} {"train_loss": -7.215816497802734, "global_step": 21696, "epoch": 129} {"train_loss": -6.945700645446777, "global_step": 21697, "epoch": 129} {"train_loss": -6.990416526794434, "global_step": 21698, "epoch": 129} {"train_loss": -7.162966251373291, "global_step": 21699, "epoch": 129} {"train_loss": -7.170948028564453, "global_step": 21700, "epoch": 129} {"train_loss": -6.9976806640625, "global_step": 21701, "epoch": 129} {"train_loss": -7.192356109619141, "global_step": 21702, "epoch": 129} {"train_loss": -7.1866536140441895, "global_step": 21703, "epoch": 129} {"train_loss": -6.8946123123168945, "global_step": 21704, "epoch": 129} {"train_loss": -6.72802734375, "global_step": 21705, "epoch": 129} {"train_loss": -6.830642223358154, "global_step": 21706, "epoch": 129} {"train_loss": -6.856613636016846, "global_step": 21707, "epoch": 129} {"train_loss": -7.135663032531738, "global_step": 21708, "epoch": 129} {"train_loss": -7.030093669891357, "global_step": 21709, "epoch": 129} {"train_loss": -6.895703315734863, "global_step": 21710, "epoch": 129} {"train_loss": -7.142170429229736, "global_step": 21711, "epoch": 129} {"train_loss": -7.131382942199707, "global_step": 21712, "epoch": 129} {"train_loss": -6.801396369934082, "global_step": 21713, "epoch": 129} {"train_loss": -7.195539951324463, "global_step": 21714, "epoch": 129} {"train_loss": -6.9949259757995605, "global_step": 21715, "epoch": 129} {"train_loss": -6.506045341491699, "global_step": 21716, "epoch": 129} {"train_loss": -7.053605556488037, "global_step": 21717, "epoch": 129} {"train_loss": -6.934935569763184, "global_step": 21718, "epoch": 129} {"train_loss": -6.92067289352417, "global_step": 21719, "epoch": 129} {"train_loss": -6.785292625427246, "global_step": 21720, "epoch": 129} {"train_loss": -6.842231273651123, "global_step": 21721, "epoch": 129} {"train_loss": -6.870927333831787, "global_step": 21722, "epoch": 129} {"train_loss": -7.042917251586914, "global_step": 21723, "epoch": 129} {"train_loss": -6.970798492431641, "global_step": 21724, "epoch": 129} {"train_loss": -7.040032386779785, "global_step": 21725, "epoch": 129} {"train_loss": -6.852138519287109, "global_step": 21726, "epoch": 129} {"train_loss": -6.928617477416992, "global_step": 21727, "epoch": 129} {"train_loss": -6.861550331115723, "global_step": 21728, "epoch": 129} {"train_loss": -6.917308807373047, "global_step": 21729, "epoch": 129} {"train_loss": -6.848589897155762, "global_step": 21730, "epoch": 129} {"train_loss": -6.935766696929932, "global_step": 21731, "epoch": 129} {"train_loss": -6.971113204956055, "global_step": 21732, "epoch": 129} {"train_loss": -6.913871765136719, "global_step": 21733, "epoch": 129} {"train_loss": -6.815292835235596, "global_step": 21734, "epoch": 129} {"train_loss": -7.12268590927124, "global_step": 21735, "epoch": 129} {"train_loss": -6.912421703338623, "global_step": 21736, "epoch": 129} {"train_loss": -6.895951747894287, "global_step": 21737, "epoch": 129} {"train_loss": -7.097105503082275, "global_step": 21738, "epoch": 129} {"train_loss": -6.969680309295654, "global_step": 21739, "epoch": 129} {"train_loss": -6.820173263549805, "global_step": 21740, "epoch": 129} {"train_loss": -7.099163055419922, "global_step": 21741, "epoch": 129} {"train_loss": -6.986732482910156, "global_step": 21742, "epoch": 129} {"train_loss": -7.086055755615234, "global_step": 21743, "epoch": 129} {"train_loss": -6.829510688781738, "global_step": 21744, "epoch": 129} {"train_loss": -7.121502876281738, "global_step": 21745, "epoch": 129} {"train_loss": -6.895183563232422, "global_step": 21746, "epoch": 129} {"train_loss": -6.917455673217773, "global_step": 21747, "epoch": 129} {"train_loss": -6.982711315155029, "global_step": 21748, "epoch": 129} {"train_loss": -6.937321662902832, "global_step": 21749, "epoch": 129} {"train_loss": -6.959817409515381, "global_step": 21750, "epoch": 129} {"train_loss": -7.05997371673584, "global_step": 21751, "epoch": 129} {"train_loss": -7.0639495849609375, "global_step": 21752, "epoch": 129} {"train_loss": -6.92792272567749, "global_step": 21753, "epoch": 129} {"train_loss": -7.067356109619141, "global_step": 21754, "epoch": 129} {"train_loss": -7.017661094665527, "global_step": 21755, "epoch": 129} {"train_loss": -7.038309097290039, "global_step": 21756, "epoch": 129} {"train_loss": -7.097578525543213, "global_step": 21757, "epoch": 129} {"train_loss": -6.7629899978637695, "global_step": 21758, "epoch": 129} {"train_loss": -7.2268171310424805, "global_step": 21759, "epoch": 129} {"train_loss": -6.786214828491211, "global_step": 21760, "epoch": 129} {"train_loss": -6.996063709259033, "global_step": 21761, "epoch": 129} {"train_loss": -6.701411247253418, "global_step": 21762, "epoch": 129} {"train_loss": -6.815948009490967, "global_step": 21763, "epoch": 129} {"train_loss": -6.858707427978516, "global_step": 21764, "epoch": 129} {"train_loss": -6.631677627563477, "global_step": 21765, "epoch": 129} {"train_loss": -6.994154930114746, "global_step": 21766, "epoch": 129} {"train_loss": -6.860987186431885, "global_step": 21767, "epoch": 129} {"train_loss": -6.67383337020874, "global_step": 21768, "epoch": 129} {"train_loss": -6.828376770019531, "global_step": 21769, "epoch": 129} {"train_loss": -6.977092742919922, "global_step": 21770, "epoch": 129} {"train_loss": -7.074218273162842, "global_step": 21771, "epoch": 129} {"train_loss": -6.907752990722656, "global_step": 21772, "epoch": 129} {"train_loss": -6.887537002563477, "global_step": 21773, "epoch": 129} {"train_loss": -6.8495330810546875, "global_step": 21774, "epoch": 129} {"train_loss": -6.648812294006348, "global_step": 21775, "epoch": 129} {"train_loss": -6.720157623291016, "global_step": 21776, "epoch": 129} {"train_loss": -6.682864665985107, "global_step": 21777, "epoch": 129} {"train_loss": -7.074687957763672, "global_step": 21778, "epoch": 129} {"train_loss": -6.6251220703125, "global_step": 21779, "epoch": 129} {"train_loss": -6.77072811126709, "global_step": 21780, "epoch": 129} {"train_loss": -6.889365196228027, "global_step": 21781, "epoch": 129} {"train_loss": -7.008536338806152, "global_step": 21782, "epoch": 129} {"train_loss": -6.716091156005859, "global_step": 21783, "epoch": 129} {"train_loss": -6.9988508224487305, "global_step": 21784, "epoch": 129} {"train_loss": -6.960287094116211, "global_step": 21785, "epoch": 129} {"train_loss": -7.157927989959717, "global_step": 21786, "epoch": 129} {"train_loss": -6.919614791870117, "global_step": 21787, "epoch": 129} {"train_loss": -6.935276031494141, "global_step": 21788, "epoch": 129} {"train_loss": -6.975283622741699, "global_step": 21789, "epoch": 129} {"train_loss": -6.912380218505859, "global_step": 21790, "epoch": 129} {"train_loss": -6.868727207183838, "global_step": 21791, "epoch": 129} {"train_loss": -7.122182846069336, "global_step": 21792, "epoch": 129} {"train_loss": -6.881913661956787, "global_step": 21793, "epoch": 129} {"train_loss": -7.018313407897949, "global_step": 21794, "epoch": 129} {"train_loss": -6.980963706970215, "global_step": 21795, "epoch": 129} {"train_loss": -7.186766147613525, "global_step": 21796, "epoch": 129} {"train_loss": -7.155925750732422, "global_step": 21797, "epoch": 129} {"train_loss": -7.034375190734863, "global_step": 21798, "epoch": 129} {"train_loss": -7.212100982666016, "global_step": 21799, "epoch": 129} {"train_loss": -7.0934858322143555, "global_step": 21800, "epoch": 129} {"train_loss": -7.173820495605469, "global_step": 21801, "epoch": 129} {"train_loss": -7.1533708572387695, "global_step": 21802, "epoch": 129} {"train_loss": -6.868755340576172, "global_step": 21803, "epoch": 129} {"train_loss": -7.108139991760254, "global_step": 21804, "epoch": 129} {"train_loss": -7.114559173583984, "global_step": 21805, "epoch": 129} {"train_loss": -6.860793113708496, "global_step": 21806, "epoch": 129} {"train_loss": -6.978104591369629, "global_step": 21807, "epoch": 129} {"train_loss": -6.958857536315918, "global_step": 21808, "epoch": 129} {"train_loss": -7.114768028259277, "global_step": 21809, "epoch": 129} {"train_loss": -6.940009117126465, "global_step": 21810, "epoch": 129} {"train_loss": -6.961034297943115, "global_step": 21811, "epoch": 129} {"train_loss": -6.930665016174316, "global_step": 21812, "epoch": 129} {"train_loss": -7.109001159667969, "global_step": 21813, "epoch": 129} {"train_loss": -6.920956611633301, "global_step": 21814, "epoch": 129} {"train_loss": -6.999301910400391, "global_step": 21815, "epoch": 129} {"train_loss": -7.142060279846191, "global_step": 21816, "epoch": 129} {"train_loss": -6.9012861251831055, "global_step": 21817, "epoch": 129} {"train_loss": -6.929804801940918, "global_step": 21818, "epoch": 129} {"train_loss": -6.8559064865112305, "global_step": 21819, "epoch": 129} {"train_loss": -6.958584785461426, "global_step": 21820, "epoch": 129} {"train_loss": -6.9978837966918945, "global_step": 21821, "epoch": 129} {"train_loss": -7.051425933837891, "global_step": 21822, "epoch": 129} {"train_loss": -6.957158088684082, "global_step": 21823, "epoch": 129} {"train_loss": -6.657832145690918, "global_step": 21824, "epoch": 129} {"train_loss": -7.007410049438477, "global_step": 21825, "epoch": 129} {"train_loss": -6.7736592292785645, "global_step": 21826, "epoch": 129} {"train_loss": -6.778100490570068, "global_step": 21827, "epoch": 129} {"train_loss": -6.880489349365234, "global_step": 21828, "epoch": 129} {"train_loss": -6.840923309326172, "global_step": 21829, "epoch": 129} {"train_loss": -6.574396133422852, "global_step": 21830, "epoch": 129} {"train_loss": -6.80612850189209, "global_step": 21831, "epoch": 129} {"train_loss": -6.824762344360352, "global_step": 21832, "epoch": 129} {"train_loss": -6.7404632568359375, "global_step": 21833, "epoch": 129} {"train_loss": -6.90595006942749, "global_step": 21834, "epoch": 129} {"train_loss": -6.626697540283203, "global_step": 21835, "epoch": 129} {"train_loss": -6.62446403503418, "global_step": 21836, "epoch": 129} {"train_loss": -6.7904205322265625, "global_step": 21837, "epoch": 129} {"train_loss": -6.7031989097595215, "global_step": 21838, "epoch": 129} {"train_loss": -6.935020364466167, "global_step": 21839, "epoch": 129, "val_loss": 210287.875} {"train_loss": -6.7321882247924805, "global_step": 21840, "epoch": 130} {"train_loss": -6.8397932052612305, "global_step": 21841, "epoch": 130} {"train_loss": -6.9744873046875, "global_step": 21842, "epoch": 130} {"train_loss": -6.726431846618652, "global_step": 21843, "epoch": 130} {"train_loss": -6.7198805809021, "global_step": 21844, "epoch": 130} {"train_loss": -6.700438499450684, "global_step": 21845, "epoch": 130} {"train_loss": -6.998562812805176, "global_step": 21846, "epoch": 130} {"train_loss": -6.6814751625061035, "global_step": 21847, "epoch": 130} {"train_loss": -6.932156085968018, "global_step": 21848, "epoch": 130} {"train_loss": -6.938176155090332, "global_step": 21849, "epoch": 130} {"train_loss": -6.967369079589844, "global_step": 21850, "epoch": 130} {"train_loss": -6.849113464355469, "global_step": 21851, "epoch": 130} {"train_loss": -6.773709297180176, "global_step": 21852, "epoch": 130} {"train_loss": -6.929675102233887, "global_step": 21853, "epoch": 130} {"train_loss": -7.019254684448242, "global_step": 21854, "epoch": 130} {"train_loss": -7.067425727844238, "global_step": 21855, "epoch": 130} {"train_loss": -7.150016784667969, "global_step": 21856, "epoch": 130} {"train_loss": -7.193049430847168, "global_step": 21857, "epoch": 130} {"train_loss": -7.045701026916504, "global_step": 21858, "epoch": 130} {"train_loss": -6.9965410232543945, "global_step": 21859, "epoch": 130} {"train_loss": -7.16777229309082, "global_step": 21860, "epoch": 130} {"train_loss": -7.020800590515137, "global_step": 21861, "epoch": 130} {"train_loss": -6.9064764976501465, "global_step": 21862, "epoch": 130} {"train_loss": -7.154160976409912, "global_step": 21863, "epoch": 130} {"train_loss": -7.221428871154785, "global_step": 21864, "epoch": 130} {"train_loss": -7.11952018737793, "global_step": 21865, "epoch": 130} {"train_loss": -6.9623122215271, "global_step": 21866, "epoch": 130} {"train_loss": -7.107683181762695, "global_step": 21867, "epoch": 130} {"train_loss": -6.921974182128906, "global_step": 21868, "epoch": 130} {"train_loss": -7.116620063781738, "global_step": 21869, "epoch": 130} {"train_loss": -6.814836502075195, "global_step": 21870, "epoch": 130} {"train_loss": -6.994080543518066, "global_step": 21871, "epoch": 130} {"train_loss": -6.816625595092773, "global_step": 21872, "epoch": 130} {"train_loss": -6.920034408569336, "global_step": 21873, "epoch": 130} {"train_loss": -6.695590019226074, "global_step": 21874, "epoch": 130} {"train_loss": -6.936643600463867, "global_step": 21875, "epoch": 130} {"train_loss": -6.939029216766357, "global_step": 21876, "epoch": 130} {"train_loss": -6.974637031555176, "global_step": 21877, "epoch": 130} {"train_loss": -6.841099739074707, "global_step": 21878, "epoch": 130} {"train_loss": -7.008536338806152, "global_step": 21879, "epoch": 130} {"train_loss": -6.935215473175049, "global_step": 21880, "epoch": 130} {"train_loss": -7.197457790374756, "global_step": 21881, "epoch": 130} {"train_loss": -7.220252990722656, "global_step": 21882, "epoch": 130} {"train_loss": -6.814332962036133, "global_step": 21883, "epoch": 130} {"train_loss": -6.72432804107666, "global_step": 21884, "epoch": 130} {"train_loss": -7.157979965209961, "global_step": 21885, "epoch": 130} {"train_loss": -6.999630928039551, "global_step": 21886, "epoch": 130} {"train_loss": -7.043882369995117, "global_step": 21887, "epoch": 130} {"train_loss": -7.031020641326904, "global_step": 21888, "epoch": 130} {"train_loss": -7.0514421463012695, "global_step": 21889, "epoch": 130} {"train_loss": -6.778853416442871, "global_step": 21890, "epoch": 130} {"train_loss": -6.887743949890137, "global_step": 21891, "epoch": 130} {"train_loss": -6.794920921325684, "global_step": 21892, "epoch": 130} {"train_loss": -6.754575729370117, "global_step": 21893, "epoch": 130} {"train_loss": -6.902976989746094, "global_step": 21894, "epoch": 130} {"train_loss": -6.793817043304443, "global_step": 21895, "epoch": 130} {"train_loss": -6.8335957527160645, "global_step": 21896, "epoch": 130} {"train_loss": -6.561603546142578, "global_step": 21897, "epoch": 130} {"train_loss": -6.925999164581299, "global_step": 21898, "epoch": 130} {"train_loss": -6.681699752807617, "global_step": 21899, "epoch": 130} {"train_loss": -6.722472190856934, "global_step": 21900, "epoch": 130} {"train_loss": -7.034168243408203, "global_step": 21901, "epoch": 130} {"train_loss": -6.812751770019531, "global_step": 21902, "epoch": 130} {"train_loss": -6.951570510864258, "global_step": 21903, "epoch": 130} {"train_loss": -6.970498085021973, "global_step": 21904, "epoch": 130} {"train_loss": -6.691037178039551, "global_step": 21905, "epoch": 130} {"train_loss": -6.876296043395996, "global_step": 21906, "epoch": 130} {"train_loss": -6.659316062927246, "global_step": 21907, "epoch": 130} {"train_loss": -6.9360127449035645, "global_step": 21908, "epoch": 130} {"train_loss": -6.818751335144043, "global_step": 21909, "epoch": 130} {"train_loss": -6.695926189422607, "global_step": 21910, "epoch": 130} {"train_loss": -6.955605506896973, "global_step": 21911, "epoch": 130} {"train_loss": -6.771696090698242, "global_step": 21912, "epoch": 130} {"train_loss": -6.945273399353027, "global_step": 21913, "epoch": 130} {"train_loss": -6.935889720916748, "global_step": 21914, "epoch": 130} {"train_loss": -6.93405818939209, "global_step": 21915, "epoch": 130} {"train_loss": -6.990764617919922, "global_step": 21916, "epoch": 130} {"train_loss": -7.081914901733398, "global_step": 21917, "epoch": 130} {"train_loss": -7.0254974365234375, "global_step": 21918, "epoch": 130} {"train_loss": -6.917935371398926, "global_step": 21919, "epoch": 130} {"train_loss": -7.029082298278809, "global_step": 21920, "epoch": 130} {"train_loss": -7.004536151885986, "global_step": 21921, "epoch": 130} {"train_loss": -6.804490089416504, "global_step": 21922, "epoch": 130} {"train_loss": -7.2214250564575195, "global_step": 21923, "epoch": 130} {"train_loss": -6.871434688568115, "global_step": 21924, "epoch": 130} {"train_loss": -6.998451232910156, "global_step": 21925, "epoch": 130} {"train_loss": -6.9013190269470215, "global_step": 21926, "epoch": 130} {"train_loss": -7.059730529785156, "global_step": 21927, "epoch": 130} {"train_loss": -7.037361145019531, "global_step": 21928, "epoch": 130} {"train_loss": -6.987837314605713, "global_step": 21929, "epoch": 130} {"train_loss": -7.009506702423096, "global_step": 21930, "epoch": 130} {"train_loss": -6.891414165496826, "global_step": 21931, "epoch": 130} {"train_loss": -6.925312519073486, "global_step": 21932, "epoch": 130} {"train_loss": -6.841131687164307, "global_step": 21933, "epoch": 130} {"train_loss": -6.996382236480713, "global_step": 21934, "epoch": 130} {"train_loss": -7.108030319213867, "global_step": 21935, "epoch": 130} {"train_loss": -7.1505446434021, "global_step": 21936, "epoch": 130} {"train_loss": -6.996002674102783, "global_step": 21937, "epoch": 130} {"train_loss": -6.871297359466553, "global_step": 21938, "epoch": 130} {"train_loss": -6.711091995239258, "global_step": 21939, "epoch": 130} {"train_loss": -7.093274116516113, "global_step": 21940, "epoch": 130} {"train_loss": -6.996332168579102, "global_step": 21941, "epoch": 130} {"train_loss": -6.934534549713135, "global_step": 21942, "epoch": 130} {"train_loss": -6.987705230712891, "global_step": 21943, "epoch": 130} {"train_loss": -7.137243270874023, "global_step": 21944, "epoch": 130} {"train_loss": -6.883440017700195, "global_step": 21945, "epoch": 130} {"train_loss": -6.750565528869629, "global_step": 21946, "epoch": 130} {"train_loss": -6.863198280334473, "global_step": 21947, "epoch": 130} {"train_loss": -7.221290588378906, "global_step": 21948, "epoch": 130} {"train_loss": -7.170105934143066, "global_step": 21949, "epoch": 130} {"train_loss": -6.980765342712402, "global_step": 21950, "epoch": 130} {"train_loss": -7.073655605316162, "global_step": 21951, "epoch": 130} {"train_loss": -6.9643025398254395, "global_step": 21952, "epoch": 130} {"train_loss": -6.770122528076172, "global_step": 21953, "epoch": 130} {"train_loss": -7.058296203613281, "global_step": 21954, "epoch": 130} {"train_loss": -7.130556106567383, "global_step": 21955, "epoch": 130} {"train_loss": -7.00726842880249, "global_step": 21956, "epoch": 130} {"train_loss": -6.967990398406982, "global_step": 21957, "epoch": 130} {"train_loss": -7.09824275970459, "global_step": 21958, "epoch": 130} {"train_loss": -6.68740701675415, "global_step": 21959, "epoch": 130} {"train_loss": -7.024299621582031, "global_step": 21960, "epoch": 130} {"train_loss": -6.801968574523926, "global_step": 21961, "epoch": 130} {"train_loss": -6.915675163269043, "global_step": 21962, "epoch": 130} {"train_loss": -6.93150520324707, "global_step": 21963, "epoch": 130} {"train_loss": -7.021866798400879, "global_step": 21964, "epoch": 130} {"train_loss": -6.776699542999268, "global_step": 21965, "epoch": 130} {"train_loss": -6.847969055175781, "global_step": 21966, "epoch": 130} {"train_loss": -6.965633869171143, "global_step": 21967, "epoch": 130} {"train_loss": -6.948809623718262, "global_step": 21968, "epoch": 130} {"train_loss": -6.914922714233398, "global_step": 21969, "epoch": 130} {"train_loss": -7.1185808181762695, "global_step": 21970, "epoch": 130} {"train_loss": -7.082196235656738, "global_step": 21971, "epoch": 130} {"train_loss": -7.065296173095703, "global_step": 21972, "epoch": 130} {"train_loss": -6.8140153884887695, "global_step": 21973, "epoch": 130} {"train_loss": -7.056823253631592, "global_step": 21974, "epoch": 130} {"train_loss": -6.949646472930908, "global_step": 21975, "epoch": 130} {"train_loss": -7.025528907775879, "global_step": 21976, "epoch": 130} {"train_loss": -6.896020889282227, "global_step": 21977, "epoch": 130} {"train_loss": -7.094235420227051, "global_step": 21978, "epoch": 130} {"train_loss": -7.200686454772949, "global_step": 21979, "epoch": 130} {"train_loss": -6.978299140930176, "global_step": 21980, "epoch": 130} {"train_loss": -7.1290693283081055, "global_step": 21981, "epoch": 130} {"train_loss": -6.974374294281006, "global_step": 21982, "epoch": 130} {"train_loss": -7.121030330657959, "global_step": 21983, "epoch": 130} {"train_loss": -7.246002197265625, "global_step": 21984, "epoch": 130} {"train_loss": -7.119811534881592, "global_step": 21985, "epoch": 130} {"train_loss": -7.190686225891113, "global_step": 21986, "epoch": 130} {"train_loss": -6.815866470336914, "global_step": 21987, "epoch": 130} {"train_loss": -7.0768232345581055, "global_step": 21988, "epoch": 130} {"train_loss": -6.947844982147217, "global_step": 21989, "epoch": 130} {"train_loss": -7.0495452880859375, "global_step": 21990, "epoch": 130} {"train_loss": -7.19447135925293, "global_step": 21991, "epoch": 130} {"train_loss": -6.810568809509277, "global_step": 21992, "epoch": 130} {"train_loss": -6.80232048034668, "global_step": 21993, "epoch": 130} {"train_loss": -6.819248199462891, "global_step": 21994, "epoch": 130} {"train_loss": -7.161534309387207, "global_step": 21995, "epoch": 130} {"train_loss": -6.781925201416016, "global_step": 21996, "epoch": 130} {"train_loss": -7.068119525909424, "global_step": 21997, "epoch": 130} {"train_loss": -7.092535972595215, "global_step": 21998, "epoch": 130} {"train_loss": -7.11099910736084, "global_step": 21999, "epoch": 130} {"train_loss": -7.157916069030762, "global_step": 22000, "epoch": 130} {"train_loss": -7.163501739501953, "global_step": 22001, "epoch": 130} {"train_loss": -7.022015571594238, "global_step": 22002, "epoch": 130} {"train_loss": -7.014057159423828, "global_step": 22003, "epoch": 130} {"train_loss": -7.135174751281738, "global_step": 22004, "epoch": 130} {"train_loss": -6.9239501953125, "global_step": 22005, "epoch": 130} {"train_loss": -7.22717809677124, "global_step": 22006, "epoch": 130} {"train_loss": -6.960322899477823, "global_step": 22007, "epoch": 130, "val_loss": 207191.609375, "train_action_mse_error": 17.236934661865234} {"train_loss": -6.90673303604126, "global_step": 22008, "epoch": 131} {"train_loss": -7.096652030944824, "global_step": 22009, "epoch": 131} {"train_loss": -7.238639831542969, "global_step": 22010, "epoch": 131} {"train_loss": -7.066357135772705, "global_step": 22011, "epoch": 131} {"train_loss": -7.044203758239746, "global_step": 22012, "epoch": 131} {"train_loss": -6.794123649597168, "global_step": 22013, "epoch": 131} {"train_loss": -6.82984733581543, "global_step": 22014, "epoch": 131} {"train_loss": -6.841920852661133, "global_step": 22015, "epoch": 131} {"train_loss": -7.069462776184082, "global_step": 22016, "epoch": 131} {"train_loss": -6.994170188903809, "global_step": 22017, "epoch": 131} {"train_loss": -7.051924705505371, "global_step": 22018, "epoch": 131} {"train_loss": -6.817123889923096, "global_step": 22019, "epoch": 131} {"train_loss": -6.786097526550293, "global_step": 22020, "epoch": 131} {"train_loss": -6.934542179107666, "global_step": 22021, "epoch": 131} {"train_loss": -6.79513692855835, "global_step": 22022, "epoch": 131} {"train_loss": -7.123311996459961, "global_step": 22023, "epoch": 131} {"train_loss": -6.932342529296875, "global_step": 22024, "epoch": 131} {"train_loss": -6.9322509765625, "global_step": 22025, "epoch": 131} {"train_loss": -7.0462446212768555, "global_step": 22026, "epoch": 131} {"train_loss": -6.9260053634643555, "global_step": 22027, "epoch": 131} {"train_loss": -6.96653413772583, "global_step": 22028, "epoch": 131} {"train_loss": -6.927772521972656, "global_step": 22029, "epoch": 131} {"train_loss": -7.017329216003418, "global_step": 22030, "epoch": 131} {"train_loss": -6.502623081207275, "global_step": 22031, "epoch": 131} {"train_loss": -6.926706314086914, "global_step": 22032, "epoch": 131} {"train_loss": -6.876953125, "global_step": 22033, "epoch": 131} {"train_loss": -7.09827184677124, "global_step": 22034, "epoch": 131} {"train_loss": -6.825016021728516, "global_step": 22035, "epoch": 131} {"train_loss": -6.940952777862549, "global_step": 22036, "epoch": 131} {"train_loss": -7.037489891052246, "global_step": 22037, "epoch": 131} {"train_loss": -7.04908561706543, "global_step": 22038, "epoch": 131} {"train_loss": -7.106014728546143, "global_step": 22039, "epoch": 131} {"train_loss": -7.104905128479004, "global_step": 22040, "epoch": 131} {"train_loss": -6.803240776062012, "global_step": 22041, "epoch": 131} {"train_loss": -7.037042617797852, "global_step": 22042, "epoch": 131} {"train_loss": -6.919747352600098, "global_step": 22043, "epoch": 131} {"train_loss": -7.182928085327148, "global_step": 22044, "epoch": 131} {"train_loss": -7.060041427612305, "global_step": 22045, "epoch": 131} {"train_loss": -6.987335681915283, "global_step": 22046, "epoch": 131} {"train_loss": -6.959400177001953, "global_step": 22047, "epoch": 131} {"train_loss": -7.0268235206604, "global_step": 22048, "epoch": 131} {"train_loss": -6.784083366394043, "global_step": 22049, "epoch": 131} {"train_loss": -6.79847526550293, "global_step": 22050, "epoch": 131} {"train_loss": -6.828060150146484, "global_step": 22051, "epoch": 131} {"train_loss": -6.80309534072876, "global_step": 22052, "epoch": 131} {"train_loss": -6.662580490112305, "global_step": 22053, "epoch": 131} {"train_loss": -6.753469944000244, "global_step": 22054, "epoch": 131} {"train_loss": -6.602216720581055, "global_step": 22055, "epoch": 131} {"train_loss": -6.9637556076049805, "global_step": 22056, "epoch": 131} {"train_loss": -6.647538185119629, "global_step": 22057, "epoch": 131} {"train_loss": -7.0376081466674805, "global_step": 22058, "epoch": 131} {"train_loss": -6.870494842529297, "global_step": 22059, "epoch": 131} {"train_loss": -6.531192779541016, "global_step": 22060, "epoch": 131} {"train_loss": -6.94361686706543, "global_step": 22061, "epoch": 131} {"train_loss": -6.609895706176758, "global_step": 22062, "epoch": 131} {"train_loss": -6.610291004180908, "global_step": 22063, "epoch": 131} {"train_loss": -6.501697063446045, "global_step": 22064, "epoch": 131} {"train_loss": -6.964914321899414, "global_step": 22065, "epoch": 131} {"train_loss": -6.841293811798096, "global_step": 22066, "epoch": 131} {"train_loss": -6.90313720703125, "global_step": 22067, "epoch": 131} {"train_loss": -6.728829383850098, "global_step": 22068, "epoch": 131} {"train_loss": -6.71173095703125, "global_step": 22069, "epoch": 131} {"train_loss": -6.807980537414551, "global_step": 22070, "epoch": 131} {"train_loss": -6.707957744598389, "global_step": 22071, "epoch": 131} {"train_loss": -6.847530364990234, "global_step": 22072, "epoch": 131} {"train_loss": -6.940808296203613, "global_step": 22073, "epoch": 131} {"train_loss": -6.612013816833496, "global_step": 22074, "epoch": 131} {"train_loss": -6.8763556480407715, "global_step": 22075, "epoch": 131} {"train_loss": -6.871766090393066, "global_step": 22076, "epoch": 131} {"train_loss": -6.946394920349121, "global_step": 22077, "epoch": 131} {"train_loss": -6.782292366027832, "global_step": 22078, "epoch": 131} {"train_loss": -7.093816757202148, "global_step": 22079, "epoch": 131} {"train_loss": -7.169771194458008, "global_step": 22080, "epoch": 131} {"train_loss": -6.933791160583496, "global_step": 22081, "epoch": 131} {"train_loss": -6.98946475982666, "global_step": 22082, "epoch": 131} {"train_loss": -6.928896903991699, "global_step": 22083, "epoch": 131} {"train_loss": -7.064782619476318, "global_step": 22084, "epoch": 131} {"train_loss": -7.156330585479736, "global_step": 22085, "epoch": 131} {"train_loss": -7.143258571624756, "global_step": 22086, "epoch": 131} {"train_loss": -6.982405185699463, "global_step": 22087, "epoch": 131} {"train_loss": -6.980473518371582, "global_step": 22088, "epoch": 131} {"train_loss": -7.134078025817871, "global_step": 22089, "epoch": 131} {"train_loss": -6.99668550491333, "global_step": 22090, "epoch": 131} {"train_loss": -7.209151744842529, "global_step": 22091, "epoch": 131} {"train_loss": -7.090691566467285, "global_step": 22092, "epoch": 131} {"train_loss": -7.055787086486816, "global_step": 22093, "epoch": 131} {"train_loss": -7.1066083908081055, "global_step": 22094, "epoch": 131} {"train_loss": -6.796125411987305, "global_step": 22095, "epoch": 131} {"train_loss": -6.936283588409424, "global_step": 22096, "epoch": 131} {"train_loss": -7.148019790649414, "global_step": 22097, "epoch": 131} {"train_loss": -7.082886695861816, "global_step": 22098, "epoch": 131} {"train_loss": -7.033565521240234, "global_step": 22099, "epoch": 131} {"train_loss": -7.142024040222168, "global_step": 22100, "epoch": 131} {"train_loss": -6.968722343444824, "global_step": 22101, "epoch": 131} {"train_loss": -7.071866989135742, "global_step": 22102, "epoch": 131} {"train_loss": -6.915803909301758, "global_step": 22103, "epoch": 131} {"train_loss": -6.984040260314941, "global_step": 22104, "epoch": 131} {"train_loss": -6.874269962310791, "global_step": 22105, "epoch": 131} {"train_loss": -6.938204765319824, "global_step": 22106, "epoch": 131} {"train_loss": -6.7919769287109375, "global_step": 22107, "epoch": 131} {"train_loss": -7.082331657409668, "global_step": 22108, "epoch": 131} {"train_loss": -6.948474884033203, "global_step": 22109, "epoch": 131} {"train_loss": -6.849113464355469, "global_step": 22110, "epoch": 131} {"train_loss": -6.78225040435791, "global_step": 22111, "epoch": 131} {"train_loss": -7.087491989135742, "global_step": 22112, "epoch": 131} {"train_loss": -7.038423538208008, "global_step": 22113, "epoch": 131} {"train_loss": -7.006484031677246, "global_step": 22114, "epoch": 131} {"train_loss": -6.847560882568359, "global_step": 22115, "epoch": 131} {"train_loss": -6.879046440124512, "global_step": 22116, "epoch": 131} {"train_loss": -6.992620944976807, "global_step": 22117, "epoch": 131} {"train_loss": -7.140254020690918, "global_step": 22118, "epoch": 131} {"train_loss": -7.069374084472656, "global_step": 22119, "epoch": 131} {"train_loss": -6.967476844787598, "global_step": 22120, "epoch": 131} {"train_loss": -6.969130039215088, "global_step": 22121, "epoch": 131} {"train_loss": -6.961658477783203, "global_step": 22122, "epoch": 131} {"train_loss": -7.264391899108887, "global_step": 22123, "epoch": 131} {"train_loss": -6.7983903884887695, "global_step": 22124, "epoch": 131} {"train_loss": -6.833826541900635, "global_step": 22125, "epoch": 131} {"train_loss": -7.078490257263184, "global_step": 22126, "epoch": 131} {"train_loss": -6.683382511138916, "global_step": 22127, "epoch": 131} {"train_loss": -6.862591743469238, "global_step": 22128, "epoch": 131} {"train_loss": -7.0584540367126465, "global_step": 22129, "epoch": 131} {"train_loss": -7.013801574707031, "global_step": 22130, "epoch": 131} {"train_loss": -7.125561714172363, "global_step": 22131, "epoch": 131} {"train_loss": -6.943048477172852, "global_step": 22132, "epoch": 131} {"train_loss": -6.754092216491699, "global_step": 22133, "epoch": 131} {"train_loss": -6.98887825012207, "global_step": 22134, "epoch": 131} {"train_loss": -6.679834842681885, "global_step": 22135, "epoch": 131} {"train_loss": -6.928171157836914, "global_step": 22136, "epoch": 131} {"train_loss": -6.577291011810303, "global_step": 22137, "epoch": 131} {"train_loss": -6.582220077514648, "global_step": 22138, "epoch": 131} {"train_loss": -6.534077167510986, "global_step": 22139, "epoch": 131} {"train_loss": -6.897165298461914, "global_step": 22140, "epoch": 131} {"train_loss": -6.810133934020996, "global_step": 22141, "epoch": 131} {"train_loss": -6.675116539001465, "global_step": 22142, "epoch": 131} {"train_loss": -6.919890880584717, "global_step": 22143, "epoch": 131} {"train_loss": -6.833497047424316, "global_step": 22144, "epoch": 131} {"train_loss": -7.070282936096191, "global_step": 22145, "epoch": 131} {"train_loss": -7.036518573760986, "global_step": 22146, "epoch": 131} {"train_loss": -6.995494365692139, "global_step": 22147, "epoch": 131} {"train_loss": -7.038479804992676, "global_step": 22148, "epoch": 131} {"train_loss": -6.763734817504883, "global_step": 22149, "epoch": 131} {"train_loss": -6.922671318054199, "global_step": 22150, "epoch": 131} {"train_loss": -6.860188961029053, "global_step": 22151, "epoch": 131} {"train_loss": -6.882350921630859, "global_step": 22152, "epoch": 131} {"train_loss": -6.9197797775268555, "global_step": 22153, "epoch": 131} {"train_loss": -6.83590030670166, "global_step": 22154, "epoch": 131} {"train_loss": -7.1324872970581055, "global_step": 22155, "epoch": 131} {"train_loss": -6.926321029663086, "global_step": 22156, "epoch": 131} {"train_loss": -7.092185974121094, "global_step": 22157, "epoch": 131} {"train_loss": -7.217272758483887, "global_step": 22158, "epoch": 131} {"train_loss": -6.9288530349731445, "global_step": 22159, "epoch": 131} {"train_loss": -7.12042236328125, "global_step": 22160, "epoch": 131} {"train_loss": -6.797892093658447, "global_step": 22161, "epoch": 131} {"train_loss": -6.959191799163818, "global_step": 22162, "epoch": 131} {"train_loss": -6.782773494720459, "global_step": 22163, "epoch": 131} {"train_loss": -6.8406596183776855, "global_step": 22164, "epoch": 131} {"train_loss": -6.889956474304199, "global_step": 22165, "epoch": 131} {"train_loss": -6.904594421386719, "global_step": 22166, "epoch": 131} {"train_loss": -6.85122013092041, "global_step": 22167, "epoch": 131} {"train_loss": -6.747477054595947, "global_step": 22168, "epoch": 131} {"train_loss": -6.923206329345703, "global_step": 22169, "epoch": 131} {"train_loss": -6.7893805503845215, "global_step": 22170, "epoch": 131} {"train_loss": -6.977499008178711, "global_step": 22171, "epoch": 131} {"train_loss": -6.526590347290039, "global_step": 22172, "epoch": 131} {"train_loss": -6.875906467437744, "global_step": 22173, "epoch": 131} {"train_loss": -6.965798377990723, "global_step": 22174, "epoch": 131} {"train_loss": -6.921293028763363, "global_step": 22175, "epoch": 131, "val_loss": 207243.84375} {"train_loss": -6.898859977722168, "global_step": 22176, "epoch": 132} {"train_loss": -6.7433624267578125, "global_step": 22177, "epoch": 132} {"train_loss": -6.745782852172852, "global_step": 22178, "epoch": 132} {"train_loss": -6.876806735992432, "global_step": 22179, "epoch": 132} {"train_loss": -6.925373077392578, "global_step": 22180, "epoch": 132} {"train_loss": -6.694868087768555, "global_step": 22181, "epoch": 132} {"train_loss": -6.8846540451049805, "global_step": 22182, "epoch": 132} {"train_loss": -6.873700141906738, "global_step": 22183, "epoch": 132} {"train_loss": -6.995187759399414, "global_step": 22184, "epoch": 132} {"train_loss": -7.040082931518555, "global_step": 22185, "epoch": 132} {"train_loss": -6.885132789611816, "global_step": 22186, "epoch": 132} {"train_loss": -6.956789016723633, "global_step": 22187, "epoch": 132} {"train_loss": -7.04397439956665, "global_step": 22188, "epoch": 132} {"train_loss": -7.093428134918213, "global_step": 22189, "epoch": 132} {"train_loss": -6.961523056030273, "global_step": 22190, "epoch": 132} {"train_loss": -7.033324718475342, "global_step": 22191, "epoch": 132} {"train_loss": -6.980032920837402, "global_step": 22192, "epoch": 132} {"train_loss": -7.07596492767334, "global_step": 22193, "epoch": 132} {"train_loss": -6.943723678588867, "global_step": 22194, "epoch": 132} {"train_loss": -6.940978527069092, "global_step": 22195, "epoch": 132} {"train_loss": -7.1265411376953125, "global_step": 22196, "epoch": 132} {"train_loss": -7.140244960784912, "global_step": 22197, "epoch": 132} {"train_loss": -6.668646812438965, "global_step": 22198, "epoch": 132} {"train_loss": -6.983621597290039, "global_step": 22199, "epoch": 132} {"train_loss": -6.791711807250977, "global_step": 22200, "epoch": 132} {"train_loss": -7.1531982421875, "global_step": 22201, "epoch": 132} {"train_loss": -6.629644393920898, "global_step": 22202, "epoch": 132} {"train_loss": -6.725191116333008, "global_step": 22203, "epoch": 132} {"train_loss": -6.822696685791016, "global_step": 22204, "epoch": 132} {"train_loss": -6.845211029052734, "global_step": 22205, "epoch": 132} {"train_loss": -6.757414817810059, "global_step": 22206, "epoch": 132} {"train_loss": -7.083517551422119, "global_step": 22207, "epoch": 132} {"train_loss": -7.001829624176025, "global_step": 22208, "epoch": 132} {"train_loss": -6.922999382019043, "global_step": 22209, "epoch": 132} {"train_loss": -6.88039493560791, "global_step": 22210, "epoch": 132} {"train_loss": -6.902031898498535, "global_step": 22211, "epoch": 132} {"train_loss": -6.74335241317749, "global_step": 22212, "epoch": 132} {"train_loss": -6.888479232788086, "global_step": 22213, "epoch": 132} {"train_loss": -6.785023212432861, "global_step": 22214, "epoch": 132} {"train_loss": -6.979957103729248, "global_step": 22215, "epoch": 132} {"train_loss": -6.777552604675293, "global_step": 22216, "epoch": 132} {"train_loss": -7.054896831512451, "global_step": 22217, "epoch": 132} {"train_loss": -6.742439270019531, "global_step": 22218, "epoch": 132} {"train_loss": -6.9847412109375, "global_step": 22219, "epoch": 132} {"train_loss": -7.128004550933838, "global_step": 22220, "epoch": 132} {"train_loss": -6.9720072746276855, "global_step": 22221, "epoch": 132} {"train_loss": -6.920400619506836, "global_step": 22222, "epoch": 132} {"train_loss": -7.204432487487793, "global_step": 22223, "epoch": 132} {"train_loss": -6.905993938446045, "global_step": 22224, "epoch": 132} {"train_loss": -6.993098258972168, "global_step": 22225, "epoch": 132} {"train_loss": -7.115176200866699, "global_step": 22226, "epoch": 132} {"train_loss": -7.184627056121826, "global_step": 22227, "epoch": 132} {"train_loss": -7.098178863525391, "global_step": 22228, "epoch": 132} {"train_loss": -7.041059970855713, "global_step": 22229, "epoch": 132} {"train_loss": -7.039809703826904, "global_step": 22230, "epoch": 132} {"train_loss": -7.0887346267700195, "global_step": 22231, "epoch": 132} {"train_loss": -7.055340766906738, "global_step": 22232, "epoch": 132} {"train_loss": -7.172880172729492, "global_step": 22233, "epoch": 132} {"train_loss": -7.193179130554199, "global_step": 22234, "epoch": 132} {"train_loss": -7.052732467651367, "global_step": 22235, "epoch": 132} {"train_loss": -7.163824081420898, "global_step": 22236, "epoch": 132} {"train_loss": -6.999558448791504, "global_step": 22237, "epoch": 132} {"train_loss": -7.200189590454102, "global_step": 22238, "epoch": 132} {"train_loss": -6.812497138977051, "global_step": 22239, "epoch": 132} {"train_loss": -6.777166366577148, "global_step": 22240, "epoch": 132} {"train_loss": -6.994578838348389, "global_step": 22241, "epoch": 132} {"train_loss": -7.201688289642334, "global_step": 22242, "epoch": 132} {"train_loss": -7.08035135269165, "global_step": 22243, "epoch": 132} {"train_loss": -6.961248397827148, "global_step": 22244, "epoch": 132} {"train_loss": -7.163885116577148, "global_step": 22245, "epoch": 132} {"train_loss": -7.051461219787598, "global_step": 22246, "epoch": 132} {"train_loss": -6.794900894165039, "global_step": 22247, "epoch": 132} {"train_loss": -6.831573486328125, "global_step": 22248, "epoch": 132} {"train_loss": -7.075262546539307, "global_step": 22249, "epoch": 132} {"train_loss": -6.824636936187744, "global_step": 22250, "epoch": 132} {"train_loss": -7.026515960693359, "global_step": 22251, "epoch": 132} {"train_loss": -6.956231117248535, "global_step": 22252, "epoch": 132} {"train_loss": -6.939431190490723, "global_step": 22253, "epoch": 132} {"train_loss": -6.965952396392822, "global_step": 22254, "epoch": 132} {"train_loss": -7.003849506378174, "global_step": 22255, "epoch": 132} {"train_loss": -7.036820411682129, "global_step": 22256, "epoch": 132} {"train_loss": -6.939640998840332, "global_step": 22257, "epoch": 132} {"train_loss": -7.011518955230713, "global_step": 22258, "epoch": 132} {"train_loss": -6.934511184692383, "global_step": 22259, "epoch": 132} {"train_loss": -7.0296173095703125, "global_step": 22260, "epoch": 132} {"train_loss": -7.01658821105957, "global_step": 22261, "epoch": 132} {"train_loss": -7.151484489440918, "global_step": 22262, "epoch": 132} {"train_loss": -6.9853644371032715, "global_step": 22263, "epoch": 132} {"train_loss": -7.076116561889648, "global_step": 22264, "epoch": 132} {"train_loss": -6.8970465660095215, "global_step": 22265, "epoch": 132} {"train_loss": -6.855007648468018, "global_step": 22266, "epoch": 132} {"train_loss": -6.871880531311035, "global_step": 22267, "epoch": 132} {"train_loss": -6.935279846191406, "global_step": 22268, "epoch": 132} {"train_loss": -6.856489181518555, "global_step": 22269, "epoch": 132} {"train_loss": -6.9505615234375, "global_step": 22270, "epoch": 132} {"train_loss": -7.124706745147705, "global_step": 22271, "epoch": 132} {"train_loss": -6.755205154418945, "global_step": 22272, "epoch": 132} {"train_loss": -7.17525577545166, "global_step": 22273, "epoch": 132} {"train_loss": -7.090317726135254, "global_step": 22274, "epoch": 132} {"train_loss": -6.8254499435424805, "global_step": 22275, "epoch": 132} {"train_loss": -6.79998254776001, "global_step": 22276, "epoch": 132} {"train_loss": -6.744168281555176, "global_step": 22277, "epoch": 132} {"train_loss": -7.247797012329102, "global_step": 22278, "epoch": 132} {"train_loss": -6.851245880126953, "global_step": 22279, "epoch": 132} {"train_loss": -6.978287696838379, "global_step": 22280, "epoch": 132} {"train_loss": -7.125782012939453, "global_step": 22281, "epoch": 132} {"train_loss": -7.012531280517578, "global_step": 22282, "epoch": 132} {"train_loss": -6.867495536804199, "global_step": 22283, "epoch": 132} {"train_loss": -7.104551792144775, "global_step": 22284, "epoch": 132} {"train_loss": -7.067077159881592, "global_step": 22285, "epoch": 132} {"train_loss": -6.8778533935546875, "global_step": 22286, "epoch": 132} {"train_loss": -6.910028457641602, "global_step": 22287, "epoch": 132} {"train_loss": -7.013744831085205, "global_step": 22288, "epoch": 132} {"train_loss": -6.831342697143555, "global_step": 22289, "epoch": 132} {"train_loss": -6.836198329925537, "global_step": 22290, "epoch": 132} {"train_loss": -6.971294403076172, "global_step": 22291, "epoch": 132} {"train_loss": -7.129824638366699, "global_step": 22292, "epoch": 132} {"train_loss": -7.082737445831299, "global_step": 22293, "epoch": 132} {"train_loss": -7.02003288269043, "global_step": 22294, "epoch": 132} {"train_loss": -7.337608337402344, "global_step": 22295, "epoch": 132} {"train_loss": -7.037679672241211, "global_step": 22296, "epoch": 132} {"train_loss": -7.026383399963379, "global_step": 22297, "epoch": 132} {"train_loss": -7.104118824005127, "global_step": 22298, "epoch": 132} {"train_loss": -6.92745304107666, "global_step": 22299, "epoch": 132} {"train_loss": -7.04551887512207, "global_step": 22300, "epoch": 132} {"train_loss": -7.115909576416016, "global_step": 22301, "epoch": 132} {"train_loss": -7.08786678314209, "global_step": 22302, "epoch": 132} {"train_loss": -7.226931095123291, "global_step": 22303, "epoch": 132} {"train_loss": -7.25684928894043, "global_step": 22304, "epoch": 132} {"train_loss": -7.027724266052246, "global_step": 22305, "epoch": 132} {"train_loss": -7.107426643371582, "global_step": 22306, "epoch": 132} {"train_loss": -7.0821733474731445, "global_step": 22307, "epoch": 132} {"train_loss": -7.11196756362915, "global_step": 22308, "epoch": 132} {"train_loss": -7.224088668823242, "global_step": 22309, "epoch": 132} {"train_loss": -6.864279747009277, "global_step": 22310, "epoch": 132} {"train_loss": -7.178610324859619, "global_step": 22311, "epoch": 132} {"train_loss": -7.075860500335693, "global_step": 22312, "epoch": 132} {"train_loss": -7.084423065185547, "global_step": 22313, "epoch": 132} {"train_loss": -7.139124393463135, "global_step": 22314, "epoch": 132} {"train_loss": -6.851487159729004, "global_step": 22315, "epoch": 132} {"train_loss": -7.0190277099609375, "global_step": 22316, "epoch": 132} {"train_loss": -7.0508856773376465, "global_step": 22317, "epoch": 132} {"train_loss": -6.818602561950684, "global_step": 22318, "epoch": 132} {"train_loss": -6.885122299194336, "global_step": 22319, "epoch": 132} {"train_loss": -7.040999412536621, "global_step": 22320, "epoch": 132} {"train_loss": -6.8018388748168945, "global_step": 22321, "epoch": 132} {"train_loss": -6.927611827850342, "global_step": 22322, "epoch": 132} {"train_loss": -6.895593643188477, "global_step": 22323, "epoch": 132} {"train_loss": -7.039754390716553, "global_step": 22324, "epoch": 132} {"train_loss": -6.996820449829102, "global_step": 22325, "epoch": 132} {"train_loss": -7.011063575744629, "global_step": 22326, "epoch": 132} {"train_loss": -7.004669189453125, "global_step": 22327, "epoch": 132} {"train_loss": -7.024343490600586, "global_step": 22328, "epoch": 132} {"train_loss": -7.09378719329834, "global_step": 22329, "epoch": 132} {"train_loss": -7.028736114501953, "global_step": 22330, "epoch": 132} {"train_loss": -6.960788726806641, "global_step": 22331, "epoch": 132} {"train_loss": -6.987358570098877, "global_step": 22332, "epoch": 132} {"train_loss": -6.745439529418945, "global_step": 22333, "epoch": 132} {"train_loss": -7.124261856079102, "global_step": 22334, "epoch": 132} {"train_loss": -6.72130823135376, "global_step": 22335, "epoch": 132} {"train_loss": -6.971319198608398, "global_step": 22336, "epoch": 132} {"train_loss": -6.9358720779418945, "global_step": 22337, "epoch": 132} {"train_loss": -7.0944600105285645, "global_step": 22338, "epoch": 132} {"train_loss": -7.16292667388916, "global_step": 22339, "epoch": 132} {"train_loss": -7.06580114364624, "global_step": 22340, "epoch": 132} {"train_loss": -7.141518592834473, "global_step": 22341, "epoch": 132} {"train_loss": -7.260998725891113, "global_step": 22342, "epoch": 132} {"train_loss": -6.986513486930302, "global_step": 22343, "epoch": 132, "val_loss": 205617.171875} {"train_loss": -7.014651298522949, "global_step": 22344, "epoch": 133} {"train_loss": -7.307533264160156, "global_step": 22345, "epoch": 133} {"train_loss": -6.973302364349365, "global_step": 22346, "epoch": 133} {"train_loss": -6.99202823638916, "global_step": 22347, "epoch": 133} {"train_loss": -7.024227142333984, "global_step": 22348, "epoch": 133} {"train_loss": -7.091529846191406, "global_step": 22349, "epoch": 133} {"train_loss": -7.190514087677002, "global_step": 22350, "epoch": 133} {"train_loss": -6.806424140930176, "global_step": 22351, "epoch": 133} {"train_loss": -7.062933444976807, "global_step": 22352, "epoch": 133} {"train_loss": -7.083495616912842, "global_step": 22353, "epoch": 133} {"train_loss": -6.822759628295898, "global_step": 22354, "epoch": 133} {"train_loss": -6.945779323577881, "global_step": 22355, "epoch": 133} {"train_loss": -6.753595352172852, "global_step": 22356, "epoch": 133} {"train_loss": -7.031598091125488, "global_step": 22357, "epoch": 133} {"train_loss": -7.00455379486084, "global_step": 22358, "epoch": 133} {"train_loss": -7.153372764587402, "global_step": 22359, "epoch": 133} {"train_loss": -7.128264904022217, "global_step": 22360, "epoch": 133} {"train_loss": -6.554891586303711, "global_step": 22361, "epoch": 133} {"train_loss": -6.948960304260254, "global_step": 22362, "epoch": 133} {"train_loss": -7.215381622314453, "global_step": 22363, "epoch": 133} {"train_loss": -7.042322158813477, "global_step": 22364, "epoch": 133} {"train_loss": -6.942015647888184, "global_step": 22365, "epoch": 133} {"train_loss": -6.72263240814209, "global_step": 22366, "epoch": 133} {"train_loss": -6.933913230895996, "global_step": 22367, "epoch": 133} {"train_loss": -7.143438339233398, "global_step": 22368, "epoch": 133} {"train_loss": -7.005306720733643, "global_step": 22369, "epoch": 133} {"train_loss": -6.8992085456848145, "global_step": 22370, "epoch": 133} {"train_loss": -6.950127601623535, "global_step": 22371, "epoch": 133} {"train_loss": -6.987343788146973, "global_step": 22372, "epoch": 133} {"train_loss": -6.692285537719727, "global_step": 22373, "epoch": 133} {"train_loss": -6.707162857055664, "global_step": 22374, "epoch": 133} {"train_loss": -6.445404052734375, "global_step": 22375, "epoch": 133} {"train_loss": -6.966452598571777, "global_step": 22376, "epoch": 133} {"train_loss": -6.399370193481445, "global_step": 22377, "epoch": 133} {"train_loss": -6.9191365242004395, "global_step": 22378, "epoch": 133} {"train_loss": -6.727151870727539, "global_step": 22379, "epoch": 133} {"train_loss": -6.582062721252441, "global_step": 22380, "epoch": 133} {"train_loss": -6.9445624351501465, "global_step": 22381, "epoch": 133} {"train_loss": -6.8291916847229, "global_step": 22382, "epoch": 133} {"train_loss": -6.773068428039551, "global_step": 22383, "epoch": 133} {"train_loss": -6.939571380615234, "global_step": 22384, "epoch": 133} {"train_loss": -6.624320983886719, "global_step": 22385, "epoch": 133} {"train_loss": -6.747286796569824, "global_step": 22386, "epoch": 133} {"train_loss": -7.12702751159668, "global_step": 22387, "epoch": 133} {"train_loss": -6.780684471130371, "global_step": 22388, "epoch": 133} {"train_loss": -6.823774337768555, "global_step": 22389, "epoch": 133} {"train_loss": -6.800863265991211, "global_step": 22390, "epoch": 133} {"train_loss": -6.862130165100098, "global_step": 22391, "epoch": 133} {"train_loss": -7.110705375671387, "global_step": 22392, "epoch": 133} {"train_loss": -6.746434211730957, "global_step": 22393, "epoch": 133} {"train_loss": -6.904336929321289, "global_step": 22394, "epoch": 133} {"train_loss": -6.93411922454834, "global_step": 22395, "epoch": 133} {"train_loss": -7.089507102966309, "global_step": 22396, "epoch": 133} {"train_loss": -6.777707099914551, "global_step": 22397, "epoch": 133} {"train_loss": -7.123295307159424, "global_step": 22398, "epoch": 133} {"train_loss": -6.780191898345947, "global_step": 22399, "epoch": 133} {"train_loss": -7.2577619552612305, "global_step": 22400, "epoch": 133} {"train_loss": -7.039434432983398, "global_step": 22401, "epoch": 133} {"train_loss": -7.1377339363098145, "global_step": 22402, "epoch": 133} {"train_loss": -7.052175521850586, "global_step": 22403, "epoch": 133} {"train_loss": -6.624917984008789, "global_step": 22404, "epoch": 133} {"train_loss": -6.869654655456543, "global_step": 22405, "epoch": 133} {"train_loss": -6.5884904861450195, "global_step": 22406, "epoch": 133} {"train_loss": -6.953909397125244, "global_step": 22407, "epoch": 133} {"train_loss": -6.77938985824585, "global_step": 22408, "epoch": 133} {"train_loss": -6.94680118560791, "global_step": 22409, "epoch": 133} {"train_loss": -6.84299373626709, "global_step": 22410, "epoch": 133} {"train_loss": -6.751931190490723, "global_step": 22411, "epoch": 133} {"train_loss": -6.832592010498047, "global_step": 22412, "epoch": 133} {"train_loss": -6.853001594543457, "global_step": 22413, "epoch": 133} {"train_loss": -6.822253227233887, "global_step": 22414, "epoch": 133} {"train_loss": -6.9902777671813965, "global_step": 22415, "epoch": 133} {"train_loss": -7.030043125152588, "global_step": 22416, "epoch": 133} {"train_loss": -6.881633758544922, "global_step": 22417, "epoch": 133} {"train_loss": -6.995553016662598, "global_step": 22418, "epoch": 133} {"train_loss": -6.630354881286621, "global_step": 22419, "epoch": 133} {"train_loss": -6.997156143188477, "global_step": 22420, "epoch": 133} {"train_loss": -6.819048881530762, "global_step": 22421, "epoch": 133} {"train_loss": -6.919261932373047, "global_step": 22422, "epoch": 133} {"train_loss": -6.725809097290039, "global_step": 22423, "epoch": 133} {"train_loss": -6.923548698425293, "global_step": 22424, "epoch": 133} {"train_loss": -7.003579139709473, "global_step": 22425, "epoch": 133} {"train_loss": -7.0893707275390625, "global_step": 22426, "epoch": 133} {"train_loss": -6.90776252746582, "global_step": 22427, "epoch": 133} {"train_loss": -7.144613265991211, "global_step": 22428, "epoch": 133} {"train_loss": -6.97104549407959, "global_step": 22429, "epoch": 133} {"train_loss": -6.9722089767456055, "global_step": 22430, "epoch": 133} {"train_loss": -6.74950647354126, "global_step": 22431, "epoch": 133} {"train_loss": -6.952381134033203, "global_step": 22432, "epoch": 133} {"train_loss": -6.858132362365723, "global_step": 22433, "epoch": 133} {"train_loss": -7.314919471740723, "global_step": 22434, "epoch": 133} {"train_loss": -7.150346755981445, "global_step": 22435, "epoch": 133} {"train_loss": -6.945371627807617, "global_step": 22436, "epoch": 133} {"train_loss": -7.167886734008789, "global_step": 22437, "epoch": 133} {"train_loss": -7.074307918548584, "global_step": 22438, "epoch": 133} {"train_loss": -6.953226566314697, "global_step": 22439, "epoch": 133} {"train_loss": -6.982088088989258, "global_step": 22440, "epoch": 133} {"train_loss": -7.009942054748535, "global_step": 22441, "epoch": 133} {"train_loss": -7.140332221984863, "global_step": 22442, "epoch": 133} {"train_loss": -7.015979766845703, "global_step": 22443, "epoch": 133} {"train_loss": -7.072865009307861, "global_step": 22444, "epoch": 133} {"train_loss": -7.151124477386475, "global_step": 22445, "epoch": 133} {"train_loss": -7.165892601013184, "global_step": 22446, "epoch": 133} {"train_loss": -7.226064205169678, "global_step": 22447, "epoch": 133} {"train_loss": -6.993432998657227, "global_step": 22448, "epoch": 133} {"train_loss": -7.132219314575195, "global_step": 22449, "epoch": 133} {"train_loss": -7.092031955718994, "global_step": 22450, "epoch": 133} {"train_loss": -7.011872291564941, "global_step": 22451, "epoch": 133} {"train_loss": -7.1349053382873535, "global_step": 22452, "epoch": 133} {"train_loss": -7.114806175231934, "global_step": 22453, "epoch": 133} {"train_loss": -7.145739555358887, "global_step": 22454, "epoch": 133} {"train_loss": -7.132641792297363, "global_step": 22455, "epoch": 133} {"train_loss": -7.091362953186035, "global_step": 22456, "epoch": 133} {"train_loss": -7.15775728225708, "global_step": 22457, "epoch": 133} {"train_loss": -6.85760498046875, "global_step": 22458, "epoch": 133} {"train_loss": -6.8467559814453125, "global_step": 22459, "epoch": 133} {"train_loss": -6.7598876953125, "global_step": 22460, "epoch": 133} {"train_loss": -6.96909761428833, "global_step": 22461, "epoch": 133} {"train_loss": -6.630267143249512, "global_step": 22462, "epoch": 133} {"train_loss": -6.87103271484375, "global_step": 22463, "epoch": 133} {"train_loss": -7.069182395935059, "global_step": 22464, "epoch": 133} {"train_loss": -6.495760440826416, "global_step": 22465, "epoch": 133} {"train_loss": -6.8415374755859375, "global_step": 22466, "epoch": 133} {"train_loss": -6.838940143585205, "global_step": 22467, "epoch": 133} {"train_loss": -6.733960151672363, "global_step": 22468, "epoch": 133} {"train_loss": -6.914312362670898, "global_step": 22469, "epoch": 133} {"train_loss": -7.037265777587891, "global_step": 22470, "epoch": 133} {"train_loss": -6.68319034576416, "global_step": 22471, "epoch": 133} {"train_loss": -6.850774765014648, "global_step": 22472, "epoch": 133} {"train_loss": -6.867520332336426, "global_step": 22473, "epoch": 133} {"train_loss": -7.065696716308594, "global_step": 22474, "epoch": 133} {"train_loss": -7.01005744934082, "global_step": 22475, "epoch": 133} {"train_loss": -6.971482276916504, "global_step": 22476, "epoch": 133} {"train_loss": -7.04319953918457, "global_step": 22477, "epoch": 133} {"train_loss": -7.04473876953125, "global_step": 22478, "epoch": 133} {"train_loss": -6.86445426940918, "global_step": 22479, "epoch": 133} {"train_loss": -7.2033538818359375, "global_step": 22480, "epoch": 133} {"train_loss": -7.07310676574707, "global_step": 22481, "epoch": 133} {"train_loss": -7.000367641448975, "global_step": 22482, "epoch": 133} {"train_loss": -7.287763595581055, "global_step": 22483, "epoch": 133} {"train_loss": -7.075395584106445, "global_step": 22484, "epoch": 133} {"train_loss": -6.9902143478393555, "global_step": 22485, "epoch": 133} {"train_loss": -6.870469570159912, "global_step": 22486, "epoch": 133} {"train_loss": -7.19391393661499, "global_step": 22487, "epoch": 133} {"train_loss": -7.0702056884765625, "global_step": 22488, "epoch": 133} {"train_loss": -7.00697135925293, "global_step": 22489, "epoch": 133} {"train_loss": -6.848484516143799, "global_step": 22490, "epoch": 133} {"train_loss": -7.008900165557861, "global_step": 22491, "epoch": 133} {"train_loss": -7.00686502456665, "global_step": 22492, "epoch": 133} {"train_loss": -7.01649284362793, "global_step": 22493, "epoch": 133} {"train_loss": -7.012853145599365, "global_step": 22494, "epoch": 133} {"train_loss": -6.947963237762451, "global_step": 22495, "epoch": 133} {"train_loss": -6.99831485748291, "global_step": 22496, "epoch": 133} {"train_loss": -7.130277156829834, "global_step": 22497, "epoch": 133} {"train_loss": -6.864941120147705, "global_step": 22498, "epoch": 133} {"train_loss": -6.735148906707764, "global_step": 22499, "epoch": 133} {"train_loss": -6.988051414489746, "global_step": 22500, "epoch": 133} {"train_loss": -6.867276668548584, "global_step": 22501, "epoch": 133} {"train_loss": -6.774236679077148, "global_step": 22502, "epoch": 133} {"train_loss": -6.810527801513672, "global_step": 22503, "epoch": 133} {"train_loss": -6.825375080108643, "global_step": 22504, "epoch": 133} {"train_loss": -6.703237533569336, "global_step": 22505, "epoch": 133} {"train_loss": -6.947220802307129, "global_step": 22506, "epoch": 133} {"train_loss": -6.608641624450684, "global_step": 22507, "epoch": 133} {"train_loss": -6.873016357421875, "global_step": 22508, "epoch": 133} {"train_loss": -6.656948566436768, "global_step": 22509, "epoch": 133} {"train_loss": -6.900574684143066, "global_step": 22510, "epoch": 133} {"train_loss": -6.936848969686599, "global_step": 22511, "epoch": 133, "val_loss": 206253.453125} {"train_loss": -6.853684425354004, "global_step": 22512, "epoch": 134} {"train_loss": -6.955327033996582, "global_step": 22513, "epoch": 134} {"train_loss": -6.745546817779541, "global_step": 22514, "epoch": 134} {"train_loss": -6.6757283210754395, "global_step": 22515, "epoch": 134} {"train_loss": -7.126089096069336, "global_step": 22516, "epoch": 134} {"train_loss": -7.046717643737793, "global_step": 22517, "epoch": 134} {"train_loss": -6.752305507659912, "global_step": 22518, "epoch": 134} {"train_loss": -6.840630531311035, "global_step": 22519, "epoch": 134} {"train_loss": -6.684828758239746, "global_step": 22520, "epoch": 134} {"train_loss": -6.872011184692383, "global_step": 22521, "epoch": 134} {"train_loss": -6.533987522125244, "global_step": 22522, "epoch": 134} {"train_loss": -6.696634769439697, "global_step": 22523, "epoch": 134} {"train_loss": -6.999616622924805, "global_step": 22524, "epoch": 134} {"train_loss": -6.761174201965332, "global_step": 22525, "epoch": 134} {"train_loss": -6.579771041870117, "global_step": 22526, "epoch": 134} {"train_loss": -6.934660911560059, "global_step": 22527, "epoch": 134} {"train_loss": -6.9029035568237305, "global_step": 22528, "epoch": 134} {"train_loss": -6.9454145431518555, "global_step": 22529, "epoch": 134} {"train_loss": -6.919164657592773, "global_step": 22530, "epoch": 134} {"train_loss": -7.21701717376709, "global_step": 22531, "epoch": 134} {"train_loss": -6.842461585998535, "global_step": 22532, "epoch": 134} {"train_loss": -6.929075717926025, "global_step": 22533, "epoch": 134} {"train_loss": -7.091158866882324, "global_step": 22534, "epoch": 134} {"train_loss": -6.9822235107421875, "global_step": 22535, "epoch": 134} {"train_loss": -7.0562310218811035, "global_step": 22536, "epoch": 134} {"train_loss": -7.275712013244629, "global_step": 22537, "epoch": 134} {"train_loss": -7.202505111694336, "global_step": 22538, "epoch": 134} {"train_loss": -7.229404926300049, "global_step": 22539, "epoch": 134} {"train_loss": -7.032123565673828, "global_step": 22540, "epoch": 134} {"train_loss": -7.195128917694092, "global_step": 22541, "epoch": 134} {"train_loss": -7.181234836578369, "global_step": 22542, "epoch": 134} {"train_loss": -6.998207092285156, "global_step": 22543, "epoch": 134} {"train_loss": -7.158599376678467, "global_step": 22544, "epoch": 134} {"train_loss": -7.116983890533447, "global_step": 22545, "epoch": 134} {"train_loss": -6.880645275115967, "global_step": 22546, "epoch": 134} {"train_loss": -7.1829633712768555, "global_step": 22547, "epoch": 134} {"train_loss": -6.827198028564453, "global_step": 22548, "epoch": 134} {"train_loss": -7.258545398712158, "global_step": 22549, "epoch": 134} {"train_loss": -6.885464668273926, "global_step": 22550, "epoch": 134} {"train_loss": -7.083685874938965, "global_step": 22551, "epoch": 134} {"train_loss": -6.8977460861206055, "global_step": 22552, "epoch": 134} {"train_loss": -6.930632591247559, "global_step": 22553, "epoch": 134} {"train_loss": -7.137274742126465, "global_step": 22554, "epoch": 134} {"train_loss": -7.172581672668457, "global_step": 22555, "epoch": 134} {"train_loss": -6.828065872192383, "global_step": 22556, "epoch": 134} {"train_loss": -7.016476154327393, "global_step": 22557, "epoch": 134} {"train_loss": -7.016361236572266, "global_step": 22558, "epoch": 134} {"train_loss": -6.956874847412109, "global_step": 22559, "epoch": 134} {"train_loss": -6.967773914337158, "global_step": 22560, "epoch": 134} {"train_loss": -6.881494045257568, "global_step": 22561, "epoch": 134} {"train_loss": -6.880882263183594, "global_step": 22562, "epoch": 134} {"train_loss": -6.925112247467041, "global_step": 22563, "epoch": 134} {"train_loss": -7.0371904373168945, "global_step": 22564, "epoch": 134} {"train_loss": -6.965115547180176, "global_step": 22565, "epoch": 134} {"train_loss": -7.01181697845459, "global_step": 22566, "epoch": 134} {"train_loss": -7.165029525756836, "global_step": 22567, "epoch": 134} {"train_loss": -6.91281795501709, "global_step": 22568, "epoch": 134} {"train_loss": -7.068855285644531, "global_step": 22569, "epoch": 134} {"train_loss": -6.9975481033325195, "global_step": 22570, "epoch": 134} {"train_loss": -7.148972511291504, "global_step": 22571, "epoch": 134} {"train_loss": -6.989307880401611, "global_step": 22572, "epoch": 134} {"train_loss": -6.994081497192383, "global_step": 22573, "epoch": 134} {"train_loss": -6.989426612854004, "global_step": 22574, "epoch": 134} {"train_loss": -6.848127841949463, "global_step": 22575, "epoch": 134} {"train_loss": -7.185102462768555, "global_step": 22576, "epoch": 134} {"train_loss": -7.058752059936523, "global_step": 22577, "epoch": 134} {"train_loss": -6.889993190765381, "global_step": 22578, "epoch": 134} {"train_loss": -7.274487495422363, "global_step": 22579, "epoch": 134} {"train_loss": -7.004919052124023, "global_step": 22580, "epoch": 134} {"train_loss": -7.28074836730957, "global_step": 22581, "epoch": 134} {"train_loss": -7.258009910583496, "global_step": 22582, "epoch": 134} {"train_loss": -7.033851146697998, "global_step": 22583, "epoch": 134} {"train_loss": -7.037124156951904, "global_step": 22584, "epoch": 134} {"train_loss": -7.073879718780518, "global_step": 22585, "epoch": 134} {"train_loss": -7.109199523925781, "global_step": 22586, "epoch": 134} {"train_loss": -7.1059465408325195, "global_step": 22587, "epoch": 134} {"train_loss": -7.203364849090576, "global_step": 22588, "epoch": 134} {"train_loss": -6.903107166290283, "global_step": 22589, "epoch": 134} {"train_loss": -7.1540093421936035, "global_step": 22590, "epoch": 134} {"train_loss": -6.553493976593018, "global_step": 22591, "epoch": 134} {"train_loss": -6.971573829650879, "global_step": 22592, "epoch": 134} {"train_loss": -6.7297043800354, "global_step": 22593, "epoch": 134} {"train_loss": -6.588671684265137, "global_step": 22594, "epoch": 134} {"train_loss": -6.786769390106201, "global_step": 22595, "epoch": 134} {"train_loss": -6.754311561584473, "global_step": 22596, "epoch": 134} {"train_loss": -7.093781471252441, "global_step": 22597, "epoch": 134} {"train_loss": -6.886405944824219, "global_step": 22598, "epoch": 134} {"train_loss": -6.973325729370117, "global_step": 22599, "epoch": 134} {"train_loss": -6.853798866271973, "global_step": 22600, "epoch": 134} {"train_loss": -6.980220317840576, "global_step": 22601, "epoch": 134} {"train_loss": -6.9663591384887695, "global_step": 22602, "epoch": 134} {"train_loss": -6.886812686920166, "global_step": 22603, "epoch": 134} {"train_loss": -6.996892929077148, "global_step": 22604, "epoch": 134} {"train_loss": -6.8844099044799805, "global_step": 22605, "epoch": 134} {"train_loss": -7.021788120269775, "global_step": 22606, "epoch": 134} {"train_loss": -6.948758602142334, "global_step": 22607, "epoch": 134} {"train_loss": -7.123135566711426, "global_step": 22608, "epoch": 134} {"train_loss": -7.174331188201904, "global_step": 22609, "epoch": 134} {"train_loss": -6.956240653991699, "global_step": 22610, "epoch": 134} {"train_loss": -7.156054496765137, "global_step": 22611, "epoch": 134} {"train_loss": -6.908915996551514, "global_step": 22612, "epoch": 134} {"train_loss": -6.891533374786377, "global_step": 22613, "epoch": 134} {"train_loss": -6.998430252075195, "global_step": 22614, "epoch": 134} {"train_loss": -7.086031913757324, "global_step": 22615, "epoch": 134} {"train_loss": -7.171931743621826, "global_step": 22616, "epoch": 134} {"train_loss": -7.217161655426025, "global_step": 22617, "epoch": 134} {"train_loss": -7.2172369956970215, "global_step": 22618, "epoch": 134} {"train_loss": -6.874074935913086, "global_step": 22619, "epoch": 134} {"train_loss": -6.915706634521484, "global_step": 22620, "epoch": 134} {"train_loss": -7.257318496704102, "global_step": 22621, "epoch": 134} {"train_loss": -7.069279193878174, "global_step": 22622, "epoch": 134} {"train_loss": -7.074360370635986, "global_step": 22623, "epoch": 134} {"train_loss": -7.197709083557129, "global_step": 22624, "epoch": 134} {"train_loss": -7.204311847686768, "global_step": 22625, "epoch": 134} {"train_loss": -7.151185512542725, "global_step": 22626, "epoch": 134} {"train_loss": -6.957755088806152, "global_step": 22627, "epoch": 134} {"train_loss": -7.157069683074951, "global_step": 22628, "epoch": 134} {"train_loss": -7.051663398742676, "global_step": 22629, "epoch": 134} {"train_loss": -7.063802719116211, "global_step": 22630, "epoch": 134} {"train_loss": -6.795999526977539, "global_step": 22631, "epoch": 134} {"train_loss": -6.892705917358398, "global_step": 22632, "epoch": 134} {"train_loss": -6.473537445068359, "global_step": 22633, "epoch": 134} {"train_loss": -6.835505962371826, "global_step": 22634, "epoch": 134} {"train_loss": -6.804598808288574, "global_step": 22635, "epoch": 134} {"train_loss": -6.411045074462891, "global_step": 22636, "epoch": 134} {"train_loss": -6.8462138175964355, "global_step": 22637, "epoch": 134} {"train_loss": -6.638495445251465, "global_step": 22638, "epoch": 134} {"train_loss": -6.652953147888184, "global_step": 22639, "epoch": 134} {"train_loss": -6.7986369132995605, "global_step": 22640, "epoch": 134} {"train_loss": -6.494874000549316, "global_step": 22641, "epoch": 134} {"train_loss": -6.739251613616943, "global_step": 22642, "epoch": 134} {"train_loss": -6.355030059814453, "global_step": 22643, "epoch": 134} {"train_loss": -6.722455978393555, "global_step": 22644, "epoch": 134} {"train_loss": -6.619408130645752, "global_step": 22645, "epoch": 134} {"train_loss": -6.534670352935791, "global_step": 22646, "epoch": 134} {"train_loss": -6.589978218078613, "global_step": 22647, "epoch": 134} {"train_loss": -6.671111106872559, "global_step": 22648, "epoch": 134} {"train_loss": -6.547107219696045, "global_step": 22649, "epoch": 134} {"train_loss": -6.864588737487793, "global_step": 22650, "epoch": 134} {"train_loss": -6.58825159072876, "global_step": 22651, "epoch": 134} {"train_loss": -6.66133975982666, "global_step": 22652, "epoch": 134} {"train_loss": -6.7766618728637695, "global_step": 22653, "epoch": 134} {"train_loss": -6.894191741943359, "global_step": 22654, "epoch": 134} {"train_loss": -6.81350040435791, "global_step": 22655, "epoch": 134} {"train_loss": -6.9180588722229, "global_step": 22656, "epoch": 134} {"train_loss": -7.0149126052856445, "global_step": 22657, "epoch": 134} {"train_loss": -6.946369171142578, "global_step": 22658, "epoch": 134} {"train_loss": -6.804255962371826, "global_step": 22659, "epoch": 134} {"train_loss": -7.195529937744141, "global_step": 22660, "epoch": 134} {"train_loss": -6.936530113220215, "global_step": 22661, "epoch": 134} {"train_loss": -7.021199703216553, "global_step": 22662, "epoch": 134} {"train_loss": -7.1082258224487305, "global_step": 22663, "epoch": 134} {"train_loss": -7.144299507141113, "global_step": 22664, "epoch": 134} {"train_loss": -7.082645416259766, "global_step": 22665, "epoch": 134} {"train_loss": -7.019476890563965, "global_step": 22666, "epoch": 134} {"train_loss": -7.114073276519775, "global_step": 22667, "epoch": 134} {"train_loss": -6.790361404418945, "global_step": 22668, "epoch": 134} {"train_loss": -7.060122489929199, "global_step": 22669, "epoch": 134} {"train_loss": -6.717309474945068, "global_step": 22670, "epoch": 134} {"train_loss": -6.870370388031006, "global_step": 22671, "epoch": 134} {"train_loss": -6.819238662719727, "global_step": 22672, "epoch": 134} {"train_loss": -7.187314033508301, "global_step": 22673, "epoch": 134} {"train_loss": -6.675868034362793, "global_step": 22674, "epoch": 134} {"train_loss": -6.787749290466309, "global_step": 22675, "epoch": 134} {"train_loss": -6.550561904907227, "global_step": 22676, "epoch": 134} {"train_loss": -6.884734153747559, "global_step": 22677, "epoch": 134} {"train_loss": -6.5389204025268555, "global_step": 22678, "epoch": 134} {"train_loss": -6.936039694717953, "global_step": 22679, "epoch": 134, "val_loss": 205485.390625} {"train_loss": -6.658273696899414, "global_step": 22680, "epoch": 135} {"train_loss": -6.622434616088867, "global_step": 22681, "epoch": 135} {"train_loss": -6.746838569641113, "global_step": 22682, "epoch": 135} {"train_loss": -7.106075286865234, "global_step": 22683, "epoch": 135} {"train_loss": -6.789546012878418, "global_step": 22684, "epoch": 135} {"train_loss": -6.959187030792236, "global_step": 22685, "epoch": 135} {"train_loss": -6.828880310058594, "global_step": 22686, "epoch": 135} {"train_loss": -6.748476505279541, "global_step": 22687, "epoch": 135} {"train_loss": -6.923674583435059, "global_step": 22688, "epoch": 135} {"train_loss": -6.70047664642334, "global_step": 22689, "epoch": 135} {"train_loss": -6.968007564544678, "global_step": 22690, "epoch": 135} {"train_loss": -7.05251932144165, "global_step": 22691, "epoch": 135} {"train_loss": -6.763646602630615, "global_step": 22692, "epoch": 135} {"train_loss": -7.026350975036621, "global_step": 22693, "epoch": 135} {"train_loss": -6.850523471832275, "global_step": 22694, "epoch": 135} {"train_loss": -6.790182113647461, "global_step": 22695, "epoch": 135} {"train_loss": -6.832211494445801, "global_step": 22696, "epoch": 135} {"train_loss": -7.0079193115234375, "global_step": 22697, "epoch": 135} {"train_loss": -7.042140960693359, "global_step": 22698, "epoch": 135} {"train_loss": -6.739202499389648, "global_step": 22699, "epoch": 135} {"train_loss": -7.103880405426025, "global_step": 22700, "epoch": 135} {"train_loss": -6.817429542541504, "global_step": 22701, "epoch": 135} {"train_loss": -6.980508804321289, "global_step": 22702, "epoch": 135} {"train_loss": -6.924736022949219, "global_step": 22703, "epoch": 135} {"train_loss": -6.909382343292236, "global_step": 22704, "epoch": 135} {"train_loss": -7.181442737579346, "global_step": 22705, "epoch": 135} {"train_loss": -7.028003692626953, "global_step": 22706, "epoch": 135} {"train_loss": -7.079415321350098, "global_step": 22707, "epoch": 135} {"train_loss": -6.95982551574707, "global_step": 22708, "epoch": 135} {"train_loss": -7.190866470336914, "global_step": 22709, "epoch": 135} {"train_loss": -7.135490894317627, "global_step": 22710, "epoch": 135} {"train_loss": -7.053881645202637, "global_step": 22711, "epoch": 135} {"train_loss": -7.212940692901611, "global_step": 22712, "epoch": 135} {"train_loss": -7.0297956466674805, "global_step": 22713, "epoch": 135} {"train_loss": -7.084515571594238, "global_step": 22714, "epoch": 135} {"train_loss": -7.1723432540893555, "global_step": 22715, "epoch": 135} {"train_loss": -7.21427059173584, "global_step": 22716, "epoch": 135} {"train_loss": -7.121971130371094, "global_step": 22717, "epoch": 135} {"train_loss": -6.874796390533447, "global_step": 22718, "epoch": 135} {"train_loss": -6.97416877746582, "global_step": 22719, "epoch": 135} {"train_loss": -7.144913673400879, "global_step": 22720, "epoch": 135} {"train_loss": -7.03128719329834, "global_step": 22721, "epoch": 135} {"train_loss": -6.880918502807617, "global_step": 22722, "epoch": 135} {"train_loss": -7.00053596496582, "global_step": 22723, "epoch": 135} {"train_loss": -6.750739097595215, "global_step": 22724, "epoch": 135} {"train_loss": -7.021666049957275, "global_step": 22725, "epoch": 135} {"train_loss": -6.534510612487793, "global_step": 22726, "epoch": 135} {"train_loss": -6.591659069061279, "global_step": 22727, "epoch": 135} {"train_loss": -6.93077278137207, "global_step": 22728, "epoch": 135} {"train_loss": -6.6947479248046875, "global_step": 22729, "epoch": 135} {"train_loss": -6.8847246170043945, "global_step": 22730, "epoch": 135} {"train_loss": -6.68010139465332, "global_step": 22731, "epoch": 135} {"train_loss": -6.74189567565918, "global_step": 22732, "epoch": 135} {"train_loss": -6.835363388061523, "global_step": 22733, "epoch": 135} {"train_loss": -6.444211006164551, "global_step": 22734, "epoch": 135} {"train_loss": -6.961071968078613, "global_step": 22735, "epoch": 135} {"train_loss": -6.727025985717773, "global_step": 22736, "epoch": 135} {"train_loss": -6.535680294036865, "global_step": 22737, "epoch": 135} {"train_loss": -6.911035537719727, "global_step": 22738, "epoch": 135} {"train_loss": -6.710108757019043, "global_step": 22739, "epoch": 135} {"train_loss": -6.782917499542236, "global_step": 22740, "epoch": 135} {"train_loss": -6.847354888916016, "global_step": 22741, "epoch": 135} {"train_loss": -6.725366592407227, "global_step": 22742, "epoch": 135} {"train_loss": -6.782426834106445, "global_step": 22743, "epoch": 135} {"train_loss": -6.991644859313965, "global_step": 22744, "epoch": 135} {"train_loss": -6.8422112464904785, "global_step": 22745, "epoch": 135} {"train_loss": -6.700361251831055, "global_step": 22746, "epoch": 135} {"train_loss": -6.871612071990967, "global_step": 22747, "epoch": 135} {"train_loss": -6.898105621337891, "global_step": 22748, "epoch": 135} {"train_loss": -7.207052230834961, "global_step": 22749, "epoch": 135} {"train_loss": -6.983598709106445, "global_step": 22750, "epoch": 135} {"train_loss": -7.084061145782471, "global_step": 22751, "epoch": 135} {"train_loss": -7.1202592849731445, "global_step": 22752, "epoch": 135} {"train_loss": -6.971343994140625, "global_step": 22753, "epoch": 135} {"train_loss": -7.053489685058594, "global_step": 22754, "epoch": 135} {"train_loss": -7.009300708770752, "global_step": 22755, "epoch": 135} {"train_loss": -7.002613067626953, "global_step": 22756, "epoch": 135} {"train_loss": -7.102651119232178, "global_step": 22757, "epoch": 135} {"train_loss": -7.045836448669434, "global_step": 22758, "epoch": 135} {"train_loss": -6.996608734130859, "global_step": 22759, "epoch": 135} {"train_loss": -6.950319290161133, "global_step": 22760, "epoch": 135} {"train_loss": -7.019815921783447, "global_step": 22761, "epoch": 135} {"train_loss": -6.96230411529541, "global_step": 22762, "epoch": 135} {"train_loss": -7.020367622375488, "global_step": 22763, "epoch": 135} {"train_loss": -7.183445930480957, "global_step": 22764, "epoch": 135} {"train_loss": -7.111756324768066, "global_step": 22765, "epoch": 135} {"train_loss": -7.117029190063477, "global_step": 22766, "epoch": 135} {"train_loss": -7.323777198791504, "global_step": 22767, "epoch": 135} {"train_loss": -7.137908935546875, "global_step": 22768, "epoch": 135} {"train_loss": -6.896107196807861, "global_step": 22769, "epoch": 135} {"train_loss": -6.734894752502441, "global_step": 22770, "epoch": 135} {"train_loss": -7.124920845031738, "global_step": 22771, "epoch": 135} {"train_loss": -7.1239542961120605, "global_step": 22772, "epoch": 135} {"train_loss": -6.979095458984375, "global_step": 22773, "epoch": 135} {"train_loss": -6.803349018096924, "global_step": 22774, "epoch": 135} {"train_loss": -6.971162796020508, "global_step": 22775, "epoch": 135} {"train_loss": -6.693891525268555, "global_step": 22776, "epoch": 135} {"train_loss": -6.924310684204102, "global_step": 22777, "epoch": 135} {"train_loss": -6.939273834228516, "global_step": 22778, "epoch": 135} {"train_loss": -6.716335773468018, "global_step": 22779, "epoch": 135} {"train_loss": -6.886693000793457, "global_step": 22780, "epoch": 135} {"train_loss": -6.754447937011719, "global_step": 22781, "epoch": 135} {"train_loss": -6.813695907592773, "global_step": 22782, "epoch": 135} {"train_loss": -6.824881553649902, "global_step": 22783, "epoch": 135} {"train_loss": -6.89349365234375, "global_step": 22784, "epoch": 135} {"train_loss": -6.821199417114258, "global_step": 22785, "epoch": 135} {"train_loss": -7.068384170532227, "global_step": 22786, "epoch": 135} {"train_loss": -6.910623550415039, "global_step": 22787, "epoch": 135} {"train_loss": -7.131796360015869, "global_step": 22788, "epoch": 135} {"train_loss": -7.141056060791016, "global_step": 22789, "epoch": 135} {"train_loss": -7.220817565917969, "global_step": 22790, "epoch": 135} {"train_loss": -6.699321746826172, "global_step": 22791, "epoch": 135} {"train_loss": -6.87432861328125, "global_step": 22792, "epoch": 135} {"train_loss": -6.954263687133789, "global_step": 22793, "epoch": 135} {"train_loss": -7.064558982849121, "global_step": 22794, "epoch": 135} {"train_loss": -6.960775852203369, "global_step": 22795, "epoch": 135} {"train_loss": -7.21334171295166, "global_step": 22796, "epoch": 135} {"train_loss": -6.772414684295654, "global_step": 22797, "epoch": 135} {"train_loss": -6.872653961181641, "global_step": 22798, "epoch": 135} {"train_loss": -7.088349342346191, "global_step": 22799, "epoch": 135} {"train_loss": -6.789005279541016, "global_step": 22800, "epoch": 135} {"train_loss": -7.100128173828125, "global_step": 22801, "epoch": 135} {"train_loss": -6.841888904571533, "global_step": 22802, "epoch": 135} {"train_loss": -6.9978132247924805, "global_step": 22803, "epoch": 135} {"train_loss": -6.8418145179748535, "global_step": 22804, "epoch": 135} {"train_loss": -6.914638519287109, "global_step": 22805, "epoch": 135} {"train_loss": -6.822048187255859, "global_step": 22806, "epoch": 135} {"train_loss": -6.788536071777344, "global_step": 22807, "epoch": 135} {"train_loss": -6.908188819885254, "global_step": 22808, "epoch": 135} {"train_loss": -6.8888678550720215, "global_step": 22809, "epoch": 135} {"train_loss": -7.111553192138672, "global_step": 22810, "epoch": 135} {"train_loss": -6.803267955780029, "global_step": 22811, "epoch": 135} {"train_loss": -7.138929843902588, "global_step": 22812, "epoch": 135} {"train_loss": -7.1869659423828125, "global_step": 22813, "epoch": 135} {"train_loss": -7.131588935852051, "global_step": 22814, "epoch": 135} {"train_loss": -7.118353366851807, "global_step": 22815, "epoch": 135} {"train_loss": -6.906031608581543, "global_step": 22816, "epoch": 135} {"train_loss": -7.003025054931641, "global_step": 22817, "epoch": 135} {"train_loss": -7.148845672607422, "global_step": 22818, "epoch": 135} {"train_loss": -6.921511650085449, "global_step": 22819, "epoch": 135} {"train_loss": -6.98922872543335, "global_step": 22820, "epoch": 135} {"train_loss": -6.932045936584473, "global_step": 22821, "epoch": 135} {"train_loss": -7.142762184143066, "global_step": 22822, "epoch": 135} {"train_loss": -7.092267036437988, "global_step": 22823, "epoch": 135} {"train_loss": -7.159921169281006, "global_step": 22824, "epoch": 135} {"train_loss": -6.827458381652832, "global_step": 22825, "epoch": 135} {"train_loss": -7.0873284339904785, "global_step": 22826, "epoch": 135} {"train_loss": -7.02114200592041, "global_step": 22827, "epoch": 135} {"train_loss": -7.026393413543701, "global_step": 22828, "epoch": 135} {"train_loss": -7.076223373413086, "global_step": 22829, "epoch": 135} {"train_loss": -7.194973945617676, "global_step": 22830, "epoch": 135} {"train_loss": -7.070766925811768, "global_step": 22831, "epoch": 135} {"train_loss": -6.730339527130127, "global_step": 22832, "epoch": 135} {"train_loss": -7.063161849975586, "global_step": 22833, "epoch": 135} {"train_loss": -7.1065826416015625, "global_step": 22834, "epoch": 135} {"train_loss": -6.98374080657959, "global_step": 22835, "epoch": 135} {"train_loss": -7.007290363311768, "global_step": 22836, "epoch": 135} {"train_loss": -6.824087619781494, "global_step": 22837, "epoch": 135} {"train_loss": -7.097838878631592, "global_step": 22838, "epoch": 135} {"train_loss": -7.027157306671143, "global_step": 22839, "epoch": 135} {"train_loss": -6.986003398895264, "global_step": 22840, "epoch": 135} {"train_loss": -6.949519634246826, "global_step": 22841, "epoch": 135} {"train_loss": -7.130830764770508, "global_step": 22842, "epoch": 135} {"train_loss": -7.041803359985352, "global_step": 22843, "epoch": 135} {"train_loss": -6.924957275390625, "global_step": 22844, "epoch": 135} {"train_loss": -6.777046203613281, "global_step": 22845, "epoch": 135} {"train_loss": -6.949761867523193, "global_step": 22846, "epoch": 135} {"train_loss": -6.948565065860748, "global_step": 22847, "epoch": 135, "val_loss": 204369.796875, "train_action_mse_error": 14.408960342407227} {"train_loss": -6.966876983642578, "global_step": 22848, "epoch": 136} {"train_loss": -6.936758041381836, "global_step": 22849, "epoch": 136} {"train_loss": -7.144536018371582, "global_step": 22850, "epoch": 136} {"train_loss": -7.067506790161133, "global_step": 22851, "epoch": 136} {"train_loss": -7.182987213134766, "global_step": 22852, "epoch": 136} {"train_loss": -6.887925624847412, "global_step": 22853, "epoch": 136} {"train_loss": -7.21064567565918, "global_step": 22854, "epoch": 136} {"train_loss": -7.146883964538574, "global_step": 22855, "epoch": 136} {"train_loss": -7.046142578125, "global_step": 22856, "epoch": 136} {"train_loss": -6.7955427169799805, "global_step": 22857, "epoch": 136} {"train_loss": -7.013833999633789, "global_step": 22858, "epoch": 136} {"train_loss": -7.033409118652344, "global_step": 22859, "epoch": 136} {"train_loss": -6.927577018737793, "global_step": 22860, "epoch": 136} {"train_loss": -6.9902849197387695, "global_step": 22861, "epoch": 136} {"train_loss": -7.073280334472656, "global_step": 22862, "epoch": 136} {"train_loss": -6.887968063354492, "global_step": 22863, "epoch": 136} {"train_loss": -7.258281230926514, "global_step": 22864, "epoch": 136} {"train_loss": -6.868014812469482, "global_step": 22865, "epoch": 136} {"train_loss": -6.785004615783691, "global_step": 22866, "epoch": 136} {"train_loss": -6.881813049316406, "global_step": 22867, "epoch": 136} {"train_loss": -6.689680576324463, "global_step": 22868, "epoch": 136} {"train_loss": -6.859204292297363, "global_step": 22869, "epoch": 136} {"train_loss": -6.839678764343262, "global_step": 22870, "epoch": 136} {"train_loss": -6.901583671569824, "global_step": 22871, "epoch": 136} {"train_loss": -7.211090087890625, "global_step": 22872, "epoch": 136} {"train_loss": -6.937158107757568, "global_step": 22873, "epoch": 136} {"train_loss": -6.948468208312988, "global_step": 22874, "epoch": 136} {"train_loss": -6.971138000488281, "global_step": 22875, "epoch": 136} {"train_loss": -7.055516242980957, "global_step": 22876, "epoch": 136} {"train_loss": -7.189338207244873, "global_step": 22877, "epoch": 136} {"train_loss": -6.873386383056641, "global_step": 22878, "epoch": 136} {"train_loss": -7.207573890686035, "global_step": 22879, "epoch": 136} {"train_loss": -7.123186111450195, "global_step": 22880, "epoch": 136} {"train_loss": -7.046078681945801, "global_step": 22881, "epoch": 136} {"train_loss": -7.022643566131592, "global_step": 22882, "epoch": 136} {"train_loss": -7.171895980834961, "global_step": 22883, "epoch": 136} {"train_loss": -7.103024959564209, "global_step": 22884, "epoch": 136} {"train_loss": -7.091100692749023, "global_step": 22885, "epoch": 136} {"train_loss": -7.068314552307129, "global_step": 22886, "epoch": 136} {"train_loss": -7.088614463806152, "global_step": 22887, "epoch": 136} {"train_loss": -7.0206685066223145, "global_step": 22888, "epoch": 136} {"train_loss": -7.0696516036987305, "global_step": 22889, "epoch": 136} {"train_loss": -7.463198661804199, "global_step": 22890, "epoch": 136} {"train_loss": -7.251589298248291, "global_step": 22891, "epoch": 136} {"train_loss": -7.172928810119629, "global_step": 22892, "epoch": 136} {"train_loss": -7.248269081115723, "global_step": 22893, "epoch": 136} {"train_loss": -7.12618350982666, "global_step": 22894, "epoch": 136} {"train_loss": -7.031583309173584, "global_step": 22895, "epoch": 136} {"train_loss": -6.793967247009277, "global_step": 22896, "epoch": 136} {"train_loss": -6.677619457244873, "global_step": 22897, "epoch": 136} {"train_loss": -6.934545993804932, "global_step": 22898, "epoch": 136} {"train_loss": -6.947725296020508, "global_step": 22899, "epoch": 136} {"train_loss": -6.927605628967285, "global_step": 22900, "epoch": 136} {"train_loss": -6.684647560119629, "global_step": 22901, "epoch": 136} {"train_loss": -6.322900295257568, "global_step": 22902, "epoch": 136} {"train_loss": -6.821122169494629, "global_step": 22903, "epoch": 136} {"train_loss": -6.684281349182129, "global_step": 22904, "epoch": 136} {"train_loss": -6.757556915283203, "global_step": 22905, "epoch": 136} {"train_loss": -6.800113677978516, "global_step": 22906, "epoch": 136} {"train_loss": -6.718896865844727, "global_step": 22907, "epoch": 136} {"train_loss": -6.780416488647461, "global_step": 22908, "epoch": 136} {"train_loss": -6.448745250701904, "global_step": 22909, "epoch": 136} {"train_loss": -6.898731708526611, "global_step": 22910, "epoch": 136} {"train_loss": -6.820255279541016, "global_step": 22911, "epoch": 136} {"train_loss": -6.647050857543945, "global_step": 22912, "epoch": 136} {"train_loss": -6.677629470825195, "global_step": 22913, "epoch": 136} {"train_loss": -6.716464519500732, "global_step": 22914, "epoch": 136} {"train_loss": -6.608377456665039, "global_step": 22915, "epoch": 136} {"train_loss": -7.078824043273926, "global_step": 22916, "epoch": 136} {"train_loss": -6.876859664916992, "global_step": 22917, "epoch": 136} {"train_loss": -6.662039756774902, "global_step": 22918, "epoch": 136} {"train_loss": -6.822576522827148, "global_step": 22919, "epoch": 136} {"train_loss": -6.827407360076904, "global_step": 22920, "epoch": 136} {"train_loss": -6.833038330078125, "global_step": 22921, "epoch": 136} {"train_loss": -6.7915568351745605, "global_step": 22922, "epoch": 136} {"train_loss": -6.920258045196533, "global_step": 22923, "epoch": 136} {"train_loss": -7.036755084991455, "global_step": 22924, "epoch": 136} {"train_loss": -7.15341329574585, "global_step": 22925, "epoch": 136} {"train_loss": -6.962040901184082, "global_step": 22926, "epoch": 136} {"train_loss": -6.889081954956055, "global_step": 22927, "epoch": 136} {"train_loss": -6.966940879821777, "global_step": 22928, "epoch": 136} {"train_loss": -7.098938941955566, "global_step": 22929, "epoch": 136} {"train_loss": -6.91506814956665, "global_step": 22930, "epoch": 136} {"train_loss": -7.018019676208496, "global_step": 22931, "epoch": 136} {"train_loss": -7.261252403259277, "global_step": 22932, "epoch": 136} {"train_loss": -6.9023332595825195, "global_step": 22933, "epoch": 136} {"train_loss": -6.9904375076293945, "global_step": 22934, "epoch": 136} {"train_loss": -6.836824893951416, "global_step": 22935, "epoch": 136} {"train_loss": -7.251253604888916, "global_step": 22936, "epoch": 136} {"train_loss": -7.18678617477417, "global_step": 22937, "epoch": 136} {"train_loss": -7.053529739379883, "global_step": 22938, "epoch": 136} {"train_loss": -7.052580833435059, "global_step": 22939, "epoch": 136} {"train_loss": -7.263293266296387, "global_step": 22940, "epoch": 136} {"train_loss": -7.125194072723389, "global_step": 22941, "epoch": 136} {"train_loss": -7.042344093322754, "global_step": 22942, "epoch": 136} {"train_loss": -7.031857490539551, "global_step": 22943, "epoch": 136} {"train_loss": -6.977745056152344, "global_step": 22944, "epoch": 136} {"train_loss": -6.651965141296387, "global_step": 22945, "epoch": 136} {"train_loss": -7.119834899902344, "global_step": 22946, "epoch": 136} {"train_loss": -6.938960552215576, "global_step": 22947, "epoch": 136} {"train_loss": -7.155474662780762, "global_step": 22948, "epoch": 136} {"train_loss": -6.7701568603515625, "global_step": 22949, "epoch": 136} {"train_loss": -6.967134475708008, "global_step": 22950, "epoch": 136} {"train_loss": -6.707950115203857, "global_step": 22951, "epoch": 136} {"train_loss": -7.110404014587402, "global_step": 22952, "epoch": 136} {"train_loss": -6.946044921875, "global_step": 22953, "epoch": 136} {"train_loss": -7.055093288421631, "global_step": 22954, "epoch": 136} {"train_loss": -6.9501729011535645, "global_step": 22955, "epoch": 136} {"train_loss": -6.864864826202393, "global_step": 22956, "epoch": 136} {"train_loss": -6.986708641052246, "global_step": 22957, "epoch": 136} {"train_loss": -7.060297966003418, "global_step": 22958, "epoch": 136} {"train_loss": -7.168679237365723, "global_step": 22959, "epoch": 136} {"train_loss": -6.992282867431641, "global_step": 22960, "epoch": 136} {"train_loss": -7.26784610748291, "global_step": 22961, "epoch": 136} {"train_loss": -7.015613079071045, "global_step": 22962, "epoch": 136} {"train_loss": -7.084164619445801, "global_step": 22963, "epoch": 136} {"train_loss": -7.085977554321289, "global_step": 22964, "epoch": 136} {"train_loss": -7.116249084472656, "global_step": 22965, "epoch": 136} {"train_loss": -7.066205024719238, "global_step": 22966, "epoch": 136} {"train_loss": -7.031888484954834, "global_step": 22967, "epoch": 136} {"train_loss": -7.122504711151123, "global_step": 22968, "epoch": 136} {"train_loss": -7.02767276763916, "global_step": 22969, "epoch": 136} {"train_loss": -7.218206405639648, "global_step": 22970, "epoch": 136} {"train_loss": -7.198781967163086, "global_step": 22971, "epoch": 136} {"train_loss": -6.864206314086914, "global_step": 22972, "epoch": 136} {"train_loss": -6.880647659301758, "global_step": 22973, "epoch": 136} {"train_loss": -7.194648742675781, "global_step": 22974, "epoch": 136} {"train_loss": -7.0509934425354, "global_step": 22975, "epoch": 136} {"train_loss": -7.133658409118652, "global_step": 22976, "epoch": 136} {"train_loss": -7.25831413269043, "global_step": 22977, "epoch": 136} {"train_loss": -7.209942817687988, "global_step": 22978, "epoch": 136} {"train_loss": -6.886785507202148, "global_step": 22979, "epoch": 136} {"train_loss": -7.289953708648682, "global_step": 22980, "epoch": 136} {"train_loss": -7.069793224334717, "global_step": 22981, "epoch": 136} {"train_loss": -7.077847480773926, "global_step": 22982, "epoch": 136} {"train_loss": -7.1148200035095215, "global_step": 22983, "epoch": 136} {"train_loss": -6.92161750793457, "global_step": 22984, "epoch": 136} {"train_loss": -7.131028652191162, "global_step": 22985, "epoch": 136} {"train_loss": -7.161877155303955, "global_step": 22986, "epoch": 136} {"train_loss": -7.259289741516113, "global_step": 22987, "epoch": 136} {"train_loss": -7.299385070800781, "global_step": 22988, "epoch": 136} {"train_loss": -7.251073837280273, "global_step": 22989, "epoch": 136} {"train_loss": -7.05307674407959, "global_step": 22990, "epoch": 136} {"train_loss": -6.968777656555176, "global_step": 22991, "epoch": 136} {"train_loss": -7.276114463806152, "global_step": 22992, "epoch": 136} {"train_loss": -7.160394191741943, "global_step": 22993, "epoch": 136} {"train_loss": -7.17288875579834, "global_step": 22994, "epoch": 136} {"train_loss": -7.105404853820801, "global_step": 22995, "epoch": 136} {"train_loss": -7.023265838623047, "global_step": 22996, "epoch": 136} {"train_loss": -7.184451580047607, "global_step": 22997, "epoch": 136} {"train_loss": -7.415729522705078, "global_step": 22998, "epoch": 136} {"train_loss": -6.963210582733154, "global_step": 22999, "epoch": 136} {"train_loss": -7.058858394622803, "global_step": 23000, "epoch": 136} {"train_loss": -7.026424407958984, "global_step": 23001, "epoch": 136} {"train_loss": -7.013416290283203, "global_step": 23002, "epoch": 136} {"train_loss": -6.972215175628662, "global_step": 23003, "epoch": 136} {"train_loss": -7.312976837158203, "global_step": 23004, "epoch": 136} {"train_loss": -6.943295478820801, "global_step": 23005, "epoch": 136} {"train_loss": -6.841859340667725, "global_step": 23006, "epoch": 136} {"train_loss": -7.185074806213379, "global_step": 23007, "epoch": 136} {"train_loss": -6.89088773727417, "global_step": 23008, "epoch": 136} {"train_loss": -7.081026077270508, "global_step": 23009, "epoch": 136} {"train_loss": -7.185596466064453, "global_step": 23010, "epoch": 136} {"train_loss": -7.080172538757324, "global_step": 23011, "epoch": 136} {"train_loss": -6.9482574462890625, "global_step": 23012, "epoch": 136} {"train_loss": -7.030011177062988, "global_step": 23013, "epoch": 136} {"train_loss": -7.038625717163086, "global_step": 23014, "epoch": 136} {"train_loss": -7.004811491285052, "global_step": 23015, "epoch": 136, "val_loss": 206641.1875} {"train_loss": -6.605517387390137, "global_step": 23016, "epoch": 137} {"train_loss": -7.176212787628174, "global_step": 23017, "epoch": 137} {"train_loss": -7.270705223083496, "global_step": 23018, "epoch": 137} {"train_loss": -6.924063682556152, "global_step": 23019, "epoch": 137} {"train_loss": -7.026650905609131, "global_step": 23020, "epoch": 137} {"train_loss": -6.867258071899414, "global_step": 23021, "epoch": 137} {"train_loss": -7.112117767333984, "global_step": 23022, "epoch": 137} {"train_loss": -7.060956954956055, "global_step": 23023, "epoch": 137} {"train_loss": -6.876005172729492, "global_step": 23024, "epoch": 137} {"train_loss": -6.957305908203125, "global_step": 23025, "epoch": 137} {"train_loss": -7.234636306762695, "global_step": 23026, "epoch": 137} {"train_loss": -7.076229095458984, "global_step": 23027, "epoch": 137} {"train_loss": -7.022713661193848, "global_step": 23028, "epoch": 137} {"train_loss": -7.1494269371032715, "global_step": 23029, "epoch": 137} {"train_loss": -7.040850639343262, "global_step": 23030, "epoch": 137} {"train_loss": -6.995709419250488, "global_step": 23031, "epoch": 137} {"train_loss": -7.217822074890137, "global_step": 23032, "epoch": 137} {"train_loss": -6.83685827255249, "global_step": 23033, "epoch": 137} {"train_loss": -7.180816650390625, "global_step": 23034, "epoch": 137} {"train_loss": -6.96311092376709, "global_step": 23035, "epoch": 137} {"train_loss": -6.9654083251953125, "global_step": 23036, "epoch": 137} {"train_loss": -6.487709999084473, "global_step": 23037, "epoch": 137} {"train_loss": -7.009631156921387, "global_step": 23038, "epoch": 137} {"train_loss": -6.8139801025390625, "global_step": 23039, "epoch": 137} {"train_loss": -6.933535575866699, "global_step": 23040, "epoch": 137} {"train_loss": -6.820531845092773, "global_step": 23041, "epoch": 137} {"train_loss": -7.155125617980957, "global_step": 23042, "epoch": 137} {"train_loss": -6.782806396484375, "global_step": 23043, "epoch": 137} {"train_loss": -6.802227973937988, "global_step": 23044, "epoch": 137} {"train_loss": -7.209391117095947, "global_step": 23045, "epoch": 137} {"train_loss": -7.019508361816406, "global_step": 23046, "epoch": 137} {"train_loss": -6.913696765899658, "global_step": 23047, "epoch": 137} {"train_loss": -6.8495330810546875, "global_step": 23048, "epoch": 137} {"train_loss": -7.120874404907227, "global_step": 23049, "epoch": 137} {"train_loss": -6.749433517456055, "global_step": 23050, "epoch": 137} {"train_loss": -7.108365058898926, "global_step": 23051, "epoch": 137} {"train_loss": -6.977190017700195, "global_step": 23052, "epoch": 137} {"train_loss": -6.917043685913086, "global_step": 23053, "epoch": 137} {"train_loss": -7.092181205749512, "global_step": 23054, "epoch": 137} {"train_loss": -6.910021781921387, "global_step": 23055, "epoch": 137} {"train_loss": -7.018845558166504, "global_step": 23056, "epoch": 137} {"train_loss": -7.003366947174072, "global_step": 23057, "epoch": 137} {"train_loss": -6.728505611419678, "global_step": 23058, "epoch": 137} {"train_loss": -6.899123191833496, "global_step": 23059, "epoch": 137} {"train_loss": -6.56799840927124, "global_step": 23060, "epoch": 137} {"train_loss": -6.923279762268066, "global_step": 23061, "epoch": 137} {"train_loss": -7.033951759338379, "global_step": 23062, "epoch": 137} {"train_loss": -7.01373291015625, "global_step": 23063, "epoch": 137} {"train_loss": -7.014699459075928, "global_step": 23064, "epoch": 137} {"train_loss": -7.069126605987549, "global_step": 23065, "epoch": 137} {"train_loss": -6.93818473815918, "global_step": 23066, "epoch": 137} {"train_loss": -7.161584377288818, "global_step": 23067, "epoch": 137} {"train_loss": -7.012063026428223, "global_step": 23068, "epoch": 137} {"train_loss": -7.25031852722168, "global_step": 23069, "epoch": 137} {"train_loss": -7.312370777130127, "global_step": 23070, "epoch": 137} {"train_loss": -7.1616716384887695, "global_step": 23071, "epoch": 137} {"train_loss": -7.162316799163818, "global_step": 23072, "epoch": 137} {"train_loss": -7.160796165466309, "global_step": 23073, "epoch": 137} {"train_loss": -7.166223049163818, "global_step": 23074, "epoch": 137} {"train_loss": -7.161887168884277, "global_step": 23075, "epoch": 137} {"train_loss": -7.061978340148926, "global_step": 23076, "epoch": 137} {"train_loss": -7.130603790283203, "global_step": 23077, "epoch": 137} {"train_loss": -7.163780212402344, "global_step": 23078, "epoch": 137} {"train_loss": -6.812356472015381, "global_step": 23079, "epoch": 137} {"train_loss": -7.1157026290893555, "global_step": 23080, "epoch": 137} {"train_loss": -6.990602493286133, "global_step": 23081, "epoch": 137} {"train_loss": -7.023633003234863, "global_step": 23082, "epoch": 137} {"train_loss": -6.999174118041992, "global_step": 23083, "epoch": 137} {"train_loss": -6.8928327560424805, "global_step": 23084, "epoch": 137} {"train_loss": -6.960202217102051, "global_step": 23085, "epoch": 137} {"train_loss": -6.855564594268799, "global_step": 23086, "epoch": 137} {"train_loss": -7.087740898132324, "global_step": 23087, "epoch": 137} {"train_loss": -7.0526227951049805, "global_step": 23088, "epoch": 137} {"train_loss": -6.963291645050049, "global_step": 23089, "epoch": 137} {"train_loss": -7.139897346496582, "global_step": 23090, "epoch": 137} {"train_loss": -7.072955131530762, "global_step": 23091, "epoch": 137} {"train_loss": -7.226445198059082, "global_step": 23092, "epoch": 137} {"train_loss": -7.225017070770264, "global_step": 23093, "epoch": 137} {"train_loss": -6.971523761749268, "global_step": 23094, "epoch": 137} {"train_loss": -7.062934398651123, "global_step": 23095, "epoch": 137} {"train_loss": -7.127923965454102, "global_step": 23096, "epoch": 137} {"train_loss": -7.425393104553223, "global_step": 23097, "epoch": 137} {"train_loss": -7.244901180267334, "global_step": 23098, "epoch": 137} {"train_loss": -7.139383316040039, "global_step": 23099, "epoch": 137} {"train_loss": -7.161545753479004, "global_step": 23100, "epoch": 137} {"train_loss": -7.1447625160217285, "global_step": 23101, "epoch": 137} {"train_loss": -7.230525493621826, "global_step": 23102, "epoch": 137} {"train_loss": -6.98384428024292, "global_step": 23103, "epoch": 137} {"train_loss": -7.145709037780762, "global_step": 23104, "epoch": 137} {"train_loss": -6.895364761352539, "global_step": 23105, "epoch": 137} {"train_loss": -7.234728813171387, "global_step": 23106, "epoch": 137} {"train_loss": -6.976490020751953, "global_step": 23107, "epoch": 137} {"train_loss": -7.401647567749023, "global_step": 23108, "epoch": 137} {"train_loss": -7.225343704223633, "global_step": 23109, "epoch": 137} {"train_loss": -7.242391109466553, "global_step": 23110, "epoch": 137} {"train_loss": -7.1590576171875, "global_step": 23111, "epoch": 137} {"train_loss": -7.066814422607422, "global_step": 23112, "epoch": 137} {"train_loss": -7.094388008117676, "global_step": 23113, "epoch": 137} {"train_loss": -7.003257751464844, "global_step": 23114, "epoch": 137} {"train_loss": -7.137483596801758, "global_step": 23115, "epoch": 137} {"train_loss": -7.191921710968018, "global_step": 23116, "epoch": 137} {"train_loss": -7.117663383483887, "global_step": 23117, "epoch": 137} {"train_loss": -7.168369293212891, "global_step": 23118, "epoch": 137} {"train_loss": -6.929854869842529, "global_step": 23119, "epoch": 137} {"train_loss": -7.156318664550781, "global_step": 23120, "epoch": 137} {"train_loss": -6.968581199645996, "global_step": 23121, "epoch": 137} {"train_loss": -7.047509670257568, "global_step": 23122, "epoch": 137} {"train_loss": -7.211024284362793, "global_step": 23123, "epoch": 137} {"train_loss": -7.047801971435547, "global_step": 23124, "epoch": 137} {"train_loss": -6.963422775268555, "global_step": 23125, "epoch": 137} {"train_loss": -7.039733409881592, "global_step": 23126, "epoch": 137} {"train_loss": -7.141862392425537, "global_step": 23127, "epoch": 137} {"train_loss": -7.1254754066467285, "global_step": 23128, "epoch": 137} {"train_loss": -7.031240463256836, "global_step": 23129, "epoch": 137} {"train_loss": -7.017192840576172, "global_step": 23130, "epoch": 137} {"train_loss": -6.928618431091309, "global_step": 23131, "epoch": 137} {"train_loss": -7.113641262054443, "global_step": 23132, "epoch": 137} {"train_loss": -6.985950469970703, "global_step": 23133, "epoch": 137} {"train_loss": -7.221125602722168, "global_step": 23134, "epoch": 137} {"train_loss": -7.034702301025391, "global_step": 23135, "epoch": 137} {"train_loss": -7.135327339172363, "global_step": 23136, "epoch": 137} {"train_loss": -7.108205795288086, "global_step": 23137, "epoch": 137} {"train_loss": -6.895617485046387, "global_step": 23138, "epoch": 137} {"train_loss": -7.043020248413086, "global_step": 23139, "epoch": 137} {"train_loss": -7.090735912322998, "global_step": 23140, "epoch": 137} {"train_loss": -7.072796821594238, "global_step": 23141, "epoch": 137} {"train_loss": -7.079242706298828, "global_step": 23142, "epoch": 137} {"train_loss": -7.116793155670166, "global_step": 23143, "epoch": 137} {"train_loss": -7.168161392211914, "global_step": 23144, "epoch": 137} {"train_loss": -7.125357627868652, "global_step": 23145, "epoch": 137} {"train_loss": -7.054657459259033, "global_step": 23146, "epoch": 137} {"train_loss": -6.9860334396362305, "global_step": 23147, "epoch": 137} {"train_loss": -7.170973300933838, "global_step": 23148, "epoch": 137} {"train_loss": -7.077001094818115, "global_step": 23149, "epoch": 137} {"train_loss": -7.167943000793457, "global_step": 23150, "epoch": 137} {"train_loss": -7.236705780029297, "global_step": 23151, "epoch": 137} {"train_loss": -7.2015485763549805, "global_step": 23152, "epoch": 137} {"train_loss": -7.082683563232422, "global_step": 23153, "epoch": 137} {"train_loss": -6.88420295715332, "global_step": 23154, "epoch": 137} {"train_loss": -7.101327896118164, "global_step": 23155, "epoch": 137} {"train_loss": -6.920960426330566, "global_step": 23156, "epoch": 137} {"train_loss": -7.152588844299316, "global_step": 23157, "epoch": 137} {"train_loss": -7.025562286376953, "global_step": 23158, "epoch": 137} {"train_loss": -7.002725601196289, "global_step": 23159, "epoch": 137} {"train_loss": -7.193951606750488, "global_step": 23160, "epoch": 137} {"train_loss": -6.8900837898254395, "global_step": 23161, "epoch": 137} {"train_loss": -7.022995471954346, "global_step": 23162, "epoch": 137} {"train_loss": -7.095965385437012, "global_step": 23163, "epoch": 137} {"train_loss": -7.20847225189209, "global_step": 23164, "epoch": 137} {"train_loss": -6.9202752113342285, "global_step": 23165, "epoch": 137} {"train_loss": -7.152678489685059, "global_step": 23166, "epoch": 137} {"train_loss": -7.04069709777832, "global_step": 23167, "epoch": 137} {"train_loss": -6.950658798217773, "global_step": 23168, "epoch": 137} {"train_loss": -7.0015788078308105, "global_step": 23169, "epoch": 137} {"train_loss": -6.951136589050293, "global_step": 23170, "epoch": 137} {"train_loss": -6.909430980682373, "global_step": 23171, "epoch": 137} {"train_loss": -6.888759136199951, "global_step": 23172, "epoch": 137} {"train_loss": -7.104057312011719, "global_step": 23173, "epoch": 137} {"train_loss": -7.050249099731445, "global_step": 23174, "epoch": 137} {"train_loss": -6.967652797698975, "global_step": 23175, "epoch": 137} {"train_loss": -6.985786437988281, "global_step": 23176, "epoch": 137} {"train_loss": -6.981264114379883, "global_step": 23177, "epoch": 137} {"train_loss": -6.92022705078125, "global_step": 23178, "epoch": 137} {"train_loss": -6.947362899780273, "global_step": 23179, "epoch": 137} {"train_loss": -6.853064060211182, "global_step": 23180, "epoch": 137} {"train_loss": -6.9111223220825195, "global_step": 23181, "epoch": 137} {"train_loss": -6.779021739959717, "global_step": 23182, "epoch": 137} {"train_loss": -7.039750167301723, "global_step": 23183, "epoch": 137, "val_loss": 201376.640625} {"train_loss": -6.970358848571777, "global_step": 23184, "epoch": 138} {"train_loss": -6.783148765563965, "global_step": 23185, "epoch": 138} {"train_loss": -7.065326690673828, "global_step": 23186, "epoch": 138} {"train_loss": -7.004117488861084, "global_step": 23187, "epoch": 138} {"train_loss": -6.810506820678711, "global_step": 23188, "epoch": 138} {"train_loss": -6.9142279624938965, "global_step": 23189, "epoch": 138} {"train_loss": -7.0545783042907715, "global_step": 23190, "epoch": 138} {"train_loss": -6.930980205535889, "global_step": 23191, "epoch": 138} {"train_loss": -6.734316825866699, "global_step": 23192, "epoch": 138} {"train_loss": -7.0732526779174805, "global_step": 23193, "epoch": 138} {"train_loss": -6.79725980758667, "global_step": 23194, "epoch": 138} {"train_loss": -7.132794380187988, "global_step": 23195, "epoch": 138} {"train_loss": -6.901233196258545, "global_step": 23196, "epoch": 138} {"train_loss": -7.154661178588867, "global_step": 23197, "epoch": 138} {"train_loss": -7.054538249969482, "global_step": 23198, "epoch": 138} {"train_loss": -6.932869911193848, "global_step": 23199, "epoch": 138} {"train_loss": -7.11899471282959, "global_step": 23200, "epoch": 138} {"train_loss": -7.3103346824646, "global_step": 23201, "epoch": 138} {"train_loss": -6.941508769989014, "global_step": 23202, "epoch": 138} {"train_loss": -7.0597944259643555, "global_step": 23203, "epoch": 138} {"train_loss": -7.089882850646973, "global_step": 23204, "epoch": 138} {"train_loss": -7.107085704803467, "global_step": 23205, "epoch": 138} {"train_loss": -6.958769798278809, "global_step": 23206, "epoch": 138} {"train_loss": -7.104433059692383, "global_step": 23207, "epoch": 138} {"train_loss": -7.08089542388916, "global_step": 23208, "epoch": 138} {"train_loss": -7.09184455871582, "global_step": 23209, "epoch": 138} {"train_loss": -7.074281215667725, "global_step": 23210, "epoch": 138} {"train_loss": -7.176381587982178, "global_step": 23211, "epoch": 138} {"train_loss": -7.260661602020264, "global_step": 23212, "epoch": 138} {"train_loss": -7.068028450012207, "global_step": 23213, "epoch": 138} {"train_loss": -6.818196773529053, "global_step": 23214, "epoch": 138} {"train_loss": -6.915843963623047, "global_step": 23215, "epoch": 138} {"train_loss": -6.9547271728515625, "global_step": 23216, "epoch": 138} {"train_loss": -7.301568031311035, "global_step": 23217, "epoch": 138} {"train_loss": -7.145307540893555, "global_step": 23218, "epoch": 138} {"train_loss": -7.176604270935059, "global_step": 23219, "epoch": 138} {"train_loss": -7.096278667449951, "global_step": 23220, "epoch": 138} {"train_loss": -7.202397346496582, "global_step": 23221, "epoch": 138} {"train_loss": -7.104886531829834, "global_step": 23222, "epoch": 138} {"train_loss": -7.288968086242676, "global_step": 23223, "epoch": 138} {"train_loss": -7.204357147216797, "global_step": 23224, "epoch": 138} {"train_loss": -7.129486560821533, "global_step": 23225, "epoch": 138} {"train_loss": -6.973600387573242, "global_step": 23226, "epoch": 138} {"train_loss": -7.232544898986816, "global_step": 23227, "epoch": 138} {"train_loss": -7.019954681396484, "global_step": 23228, "epoch": 138} {"train_loss": -7.054996967315674, "global_step": 23229, "epoch": 138} {"train_loss": -7.259323596954346, "global_step": 23230, "epoch": 138} {"train_loss": -7.294750690460205, "global_step": 23231, "epoch": 138} {"train_loss": -6.910400390625, "global_step": 23232, "epoch": 138} {"train_loss": -7.097604751586914, "global_step": 23233, "epoch": 138} {"train_loss": -7.032718181610107, "global_step": 23234, "epoch": 138} {"train_loss": -7.1856842041015625, "global_step": 23235, "epoch": 138} {"train_loss": -7.027186393737793, "global_step": 23236, "epoch": 138} {"train_loss": -7.215210914611816, "global_step": 23237, "epoch": 138} {"train_loss": -6.978850841522217, "global_step": 23238, "epoch": 138} {"train_loss": -7.265523433685303, "global_step": 23239, "epoch": 138} {"train_loss": -6.721069812774658, "global_step": 23240, "epoch": 138} {"train_loss": -7.2312750816345215, "global_step": 23241, "epoch": 138} {"train_loss": -6.701325416564941, "global_step": 23242, "epoch": 138} {"train_loss": -7.129561424255371, "global_step": 23243, "epoch": 138} {"train_loss": -7.045402526855469, "global_step": 23244, "epoch": 138} {"train_loss": -6.791545391082764, "global_step": 23245, "epoch": 138} {"train_loss": -6.881716728210449, "global_step": 23246, "epoch": 138} {"train_loss": -6.691451072692871, "global_step": 23247, "epoch": 138} {"train_loss": -6.922473430633545, "global_step": 23248, "epoch": 138} {"train_loss": -6.935020446777344, "global_step": 23249, "epoch": 138} {"train_loss": -7.024335861206055, "global_step": 23250, "epoch": 138} {"train_loss": -7.017061233520508, "global_step": 23251, "epoch": 138} {"train_loss": -7.038886070251465, "global_step": 23252, "epoch": 138} {"train_loss": -6.946529388427734, "global_step": 23253, "epoch": 138} {"train_loss": -6.768184185028076, "global_step": 23254, "epoch": 138} {"train_loss": -7.033101558685303, "global_step": 23255, "epoch": 138} {"train_loss": -7.044835090637207, "global_step": 23256, "epoch": 138} {"train_loss": -6.81801700592041, "global_step": 23257, "epoch": 138} {"train_loss": -7.251273155212402, "global_step": 23258, "epoch": 138} {"train_loss": -6.977198123931885, "global_step": 23259, "epoch": 138} {"train_loss": -6.763139724731445, "global_step": 23260, "epoch": 138} {"train_loss": -7.20826530456543, "global_step": 23261, "epoch": 138} {"train_loss": -7.008683681488037, "global_step": 23262, "epoch": 138} {"train_loss": -6.98198938369751, "global_step": 23263, "epoch": 138} {"train_loss": -7.065277099609375, "global_step": 23264, "epoch": 138} {"train_loss": -7.171141624450684, "global_step": 23265, "epoch": 138} {"train_loss": -6.85988187789917, "global_step": 23266, "epoch": 138} {"train_loss": -7.106554985046387, "global_step": 23267, "epoch": 138} {"train_loss": -7.115758895874023, "global_step": 23268, "epoch": 138} {"train_loss": -6.751217365264893, "global_step": 23269, "epoch": 138} {"train_loss": -7.116477012634277, "global_step": 23270, "epoch": 138} {"train_loss": -6.938468933105469, "global_step": 23271, "epoch": 138} {"train_loss": -7.010103225708008, "global_step": 23272, "epoch": 138} {"train_loss": -7.140977382659912, "global_step": 23273, "epoch": 138} {"train_loss": -7.161965370178223, "global_step": 23274, "epoch": 138} {"train_loss": -6.93681526184082, "global_step": 23275, "epoch": 138} {"train_loss": -7.022184371948242, "global_step": 23276, "epoch": 138} {"train_loss": -7.122373580932617, "global_step": 23277, "epoch": 138} {"train_loss": -7.081145286560059, "global_step": 23278, "epoch": 138} {"train_loss": -6.924142360687256, "global_step": 23279, "epoch": 138} {"train_loss": -7.188209533691406, "global_step": 23280, "epoch": 138} {"train_loss": -6.879088878631592, "global_step": 23281, "epoch": 138} {"train_loss": -7.008209228515625, "global_step": 23282, "epoch": 138} {"train_loss": -6.935166835784912, "global_step": 23283, "epoch": 138} {"train_loss": -6.914420127868652, "global_step": 23284, "epoch": 138} {"train_loss": -6.989140510559082, "global_step": 23285, "epoch": 138} {"train_loss": -7.032297134399414, "global_step": 23286, "epoch": 138} {"train_loss": -7.225543022155762, "global_step": 23287, "epoch": 138} {"train_loss": -6.996298313140869, "global_step": 23288, "epoch": 138} {"train_loss": -7.009145736694336, "global_step": 23289, "epoch": 138} {"train_loss": -6.7963948249816895, "global_step": 23290, "epoch": 138} {"train_loss": -7.080558776855469, "global_step": 23291, "epoch": 138} {"train_loss": -7.254089832305908, "global_step": 23292, "epoch": 138} {"train_loss": -7.037475109100342, "global_step": 23293, "epoch": 138} {"train_loss": -7.183163166046143, "global_step": 23294, "epoch": 138} {"train_loss": -7.415713310241699, "global_step": 23295, "epoch": 138} {"train_loss": -7.259348392486572, "global_step": 23296, "epoch": 138} {"train_loss": -7.247171401977539, "global_step": 23297, "epoch": 138} {"train_loss": -7.036517143249512, "global_step": 23298, "epoch": 138} {"train_loss": -7.08756160736084, "global_step": 23299, "epoch": 138} {"train_loss": -7.121888160705566, "global_step": 23300, "epoch": 138} {"train_loss": -7.335289478302002, "global_step": 23301, "epoch": 138} {"train_loss": -7.149622917175293, "global_step": 23302, "epoch": 138} {"train_loss": -7.103653907775879, "global_step": 23303, "epoch": 138} {"train_loss": -7.3444366455078125, "global_step": 23304, "epoch": 138} {"train_loss": -7.145747661590576, "global_step": 23305, "epoch": 138} {"train_loss": -7.062651634216309, "global_step": 23306, "epoch": 138} {"train_loss": -7.119688987731934, "global_step": 23307, "epoch": 138} {"train_loss": -7.285701751708984, "global_step": 23308, "epoch": 138} {"train_loss": -7.185554504394531, "global_step": 23309, "epoch": 138} {"train_loss": -7.09013557434082, "global_step": 23310, "epoch": 138} {"train_loss": -6.976974964141846, "global_step": 23311, "epoch": 138} {"train_loss": -6.699124336242676, "global_step": 23312, "epoch": 138} {"train_loss": -7.1716227531433105, "global_step": 23313, "epoch": 138} {"train_loss": -7.126381874084473, "global_step": 23314, "epoch": 138} {"train_loss": -7.112460136413574, "global_step": 23315, "epoch": 138} {"train_loss": -7.084755897521973, "global_step": 23316, "epoch": 138} {"train_loss": -7.296303749084473, "global_step": 23317, "epoch": 138} {"train_loss": -7.190267562866211, "global_step": 23318, "epoch": 138} {"train_loss": -7.158154487609863, "global_step": 23319, "epoch": 138} {"train_loss": -6.984596252441406, "global_step": 23320, "epoch": 138} {"train_loss": -7.353967666625977, "global_step": 23321, "epoch": 138} {"train_loss": -7.196354866027832, "global_step": 23322, "epoch": 138} {"train_loss": -7.13538932800293, "global_step": 23323, "epoch": 138} {"train_loss": -7.005805492401123, "global_step": 23324, "epoch": 138} {"train_loss": -7.014721870422363, "global_step": 23325, "epoch": 138} {"train_loss": -6.949077129364014, "global_step": 23326, "epoch": 138} {"train_loss": -7.1708455085754395, "global_step": 23327, "epoch": 138} {"train_loss": -7.090206146240234, "global_step": 23328, "epoch": 138} {"train_loss": -6.9633636474609375, "global_step": 23329, "epoch": 138} {"train_loss": -7.032423973083496, "global_step": 23330, "epoch": 138} {"train_loss": -7.247520923614502, "global_step": 23331, "epoch": 138} {"train_loss": -6.962512969970703, "global_step": 23332, "epoch": 138} {"train_loss": -7.099310874938965, "global_step": 23333, "epoch": 138} {"train_loss": -7.368109703063965, "global_step": 23334, "epoch": 138} {"train_loss": -7.141173362731934, "global_step": 23335, "epoch": 138} {"train_loss": -7.408465385437012, "global_step": 23336, "epoch": 138} {"train_loss": -7.08631706237793, "global_step": 23337, "epoch": 138} {"train_loss": -7.1269731521606445, "global_step": 23338, "epoch": 138} {"train_loss": -7.149493217468262, "global_step": 23339, "epoch": 138} {"train_loss": -6.840686321258545, "global_step": 23340, "epoch": 138} {"train_loss": -7.273979187011719, "global_step": 23341, "epoch": 138} {"train_loss": -7.185380935668945, "global_step": 23342, "epoch": 138} {"train_loss": -7.184021949768066, "global_step": 23343, "epoch": 138} {"train_loss": -7.045989990234375, "global_step": 23344, "epoch": 138} {"train_loss": -7.089768409729004, "global_step": 23345, "epoch": 138} {"train_loss": -6.98323917388916, "global_step": 23346, "epoch": 138} {"train_loss": -7.153694152832031, "global_step": 23347, "epoch": 138} {"train_loss": -6.9152727127075195, "global_step": 23348, "epoch": 138} {"train_loss": -7.092123985290527, "global_step": 23349, "epoch": 138} {"train_loss": -6.956452369689941, "global_step": 23350, "epoch": 138} {"train_loss": -7.064522209621611, "global_step": 23351, "epoch": 138, "val_loss": 205957.34375} {"train_loss": -6.783066749572754, "global_step": 23352, "epoch": 139} {"train_loss": -7.1306352615356445, "global_step": 23353, "epoch": 139} {"train_loss": -6.759749889373779, "global_step": 23354, "epoch": 139} {"train_loss": -7.019132614135742, "global_step": 23355, "epoch": 139} {"train_loss": -6.963949680328369, "global_step": 23356, "epoch": 139} {"train_loss": -7.0323805809021, "global_step": 23357, "epoch": 139} {"train_loss": -7.091946125030518, "global_step": 23358, "epoch": 139} {"train_loss": -6.922062397003174, "global_step": 23359, "epoch": 139} {"train_loss": -6.9190850257873535, "global_step": 23360, "epoch": 139} {"train_loss": -7.065576076507568, "global_step": 23361, "epoch": 139} {"train_loss": -6.895441055297852, "global_step": 23362, "epoch": 139} {"train_loss": -6.980935096740723, "global_step": 23363, "epoch": 139} {"train_loss": -7.00042724609375, "global_step": 23364, "epoch": 139} {"train_loss": -6.967864036560059, "global_step": 23365, "epoch": 139} {"train_loss": -7.007184028625488, "global_step": 23366, "epoch": 139} {"train_loss": -6.706242561340332, "global_step": 23367, "epoch": 139} {"train_loss": -7.118572235107422, "global_step": 23368, "epoch": 139} {"train_loss": -6.568582534790039, "global_step": 23369, "epoch": 139} {"train_loss": -6.894513130187988, "global_step": 23370, "epoch": 139} {"train_loss": -7.034610748291016, "global_step": 23371, "epoch": 139} {"train_loss": -6.812324523925781, "global_step": 23372, "epoch": 139} {"train_loss": -7.020442485809326, "global_step": 23373, "epoch": 139} {"train_loss": -6.7386016845703125, "global_step": 23374, "epoch": 139} {"train_loss": -6.698180198669434, "global_step": 23375, "epoch": 139} {"train_loss": -6.69101095199585, "global_step": 23376, "epoch": 139} {"train_loss": -6.906504154205322, "global_step": 23377, "epoch": 139} {"train_loss": -6.963223457336426, "global_step": 23378, "epoch": 139} {"train_loss": -6.699041366577148, "global_step": 23379, "epoch": 139} {"train_loss": -6.897411346435547, "global_step": 23380, "epoch": 139} {"train_loss": -7.000147819519043, "global_step": 23381, "epoch": 139} {"train_loss": -7.042964935302734, "global_step": 23382, "epoch": 139} {"train_loss": -6.910323143005371, "global_step": 23383, "epoch": 139} {"train_loss": -7.126409530639648, "global_step": 23384, "epoch": 139} {"train_loss": -6.808689117431641, "global_step": 23385, "epoch": 139} {"train_loss": -6.943474769592285, "global_step": 23386, "epoch": 139} {"train_loss": -7.023481369018555, "global_step": 23387, "epoch": 139} {"train_loss": -6.924454689025879, "global_step": 23388, "epoch": 139} {"train_loss": -7.044795989990234, "global_step": 23389, "epoch": 139} {"train_loss": -7.105429649353027, "global_step": 23390, "epoch": 139} {"train_loss": -7.224587440490723, "global_step": 23391, "epoch": 139} {"train_loss": -7.089478015899658, "global_step": 23392, "epoch": 139} {"train_loss": -7.283637523651123, "global_step": 23393, "epoch": 139} {"train_loss": -7.069450378417969, "global_step": 23394, "epoch": 139} {"train_loss": -7.0956854820251465, "global_step": 23395, "epoch": 139} {"train_loss": -6.88192081451416, "global_step": 23396, "epoch": 139} {"train_loss": -7.176777362823486, "global_step": 23397, "epoch": 139} {"train_loss": -6.712560653686523, "global_step": 23398, "epoch": 139} {"train_loss": -6.936254024505615, "global_step": 23399, "epoch": 139} {"train_loss": -6.863097190856934, "global_step": 23400, "epoch": 139} {"train_loss": -6.769510269165039, "global_step": 23401, "epoch": 139} {"train_loss": -6.889245510101318, "global_step": 23402, "epoch": 139} {"train_loss": -7.00594425201416, "global_step": 23403, "epoch": 139} {"train_loss": -6.977408409118652, "global_step": 23404, "epoch": 139} {"train_loss": -6.906279563903809, "global_step": 23405, "epoch": 139} {"train_loss": -6.939081192016602, "global_step": 23406, "epoch": 139} {"train_loss": -6.820987701416016, "global_step": 23407, "epoch": 139} {"train_loss": -6.898368835449219, "global_step": 23408, "epoch": 139} {"train_loss": -6.948482990264893, "global_step": 23409, "epoch": 139} {"train_loss": -6.850690841674805, "global_step": 23410, "epoch": 139} {"train_loss": -6.935000419616699, "global_step": 23411, "epoch": 139} {"train_loss": -6.950099945068359, "global_step": 23412, "epoch": 139} {"train_loss": -7.143954277038574, "global_step": 23413, "epoch": 139} {"train_loss": -6.938632011413574, "global_step": 23414, "epoch": 139} {"train_loss": -7.123899459838867, "global_step": 23415, "epoch": 139} {"train_loss": -6.982362747192383, "global_step": 23416, "epoch": 139} {"train_loss": -6.980762481689453, "global_step": 23417, "epoch": 139} {"train_loss": -6.978442192077637, "global_step": 23418, "epoch": 139} {"train_loss": -6.784178256988525, "global_step": 23419, "epoch": 139} {"train_loss": -7.100661277770996, "global_step": 23420, "epoch": 139} {"train_loss": -6.9546732902526855, "global_step": 23421, "epoch": 139} {"train_loss": -6.963988304138184, "global_step": 23422, "epoch": 139} {"train_loss": -6.958400726318359, "global_step": 23423, "epoch": 139} {"train_loss": -7.132918834686279, "global_step": 23424, "epoch": 139} {"train_loss": -6.8895440101623535, "global_step": 23425, "epoch": 139} {"train_loss": -6.912039279937744, "global_step": 23426, "epoch": 139} {"train_loss": -7.113199234008789, "global_step": 23427, "epoch": 139} {"train_loss": -7.140997886657715, "global_step": 23428, "epoch": 139} {"train_loss": -7.009666442871094, "global_step": 23429, "epoch": 139} {"train_loss": -7.251349925994873, "global_step": 23430, "epoch": 139} {"train_loss": -7.068886756896973, "global_step": 23431, "epoch": 139} {"train_loss": -6.873315811157227, "global_step": 23432, "epoch": 139} {"train_loss": -6.999715805053711, "global_step": 23433, "epoch": 139} {"train_loss": -6.9540791511535645, "global_step": 23434, "epoch": 139} {"train_loss": -7.240732192993164, "global_step": 23435, "epoch": 139} {"train_loss": -6.759587287902832, "global_step": 23436, "epoch": 139} {"train_loss": -7.2506232261657715, "global_step": 23437, "epoch": 139} {"train_loss": -6.72271728515625, "global_step": 23438, "epoch": 139} {"train_loss": -7.147176265716553, "global_step": 23439, "epoch": 139} {"train_loss": -6.861060619354248, "global_step": 23440, "epoch": 139} {"train_loss": -6.9261579513549805, "global_step": 23441, "epoch": 139} {"train_loss": -7.052725791931152, "global_step": 23442, "epoch": 139} {"train_loss": -6.729006767272949, "global_step": 23443, "epoch": 139} {"train_loss": -6.961337566375732, "global_step": 23444, "epoch": 139} {"train_loss": -6.780566692352295, "global_step": 23445, "epoch": 139} {"train_loss": -6.816016674041748, "global_step": 23446, "epoch": 139} {"train_loss": -6.937929630279541, "global_step": 23447, "epoch": 139} {"train_loss": -7.154409408569336, "global_step": 23448, "epoch": 139} {"train_loss": -6.861346244812012, "global_step": 23449, "epoch": 139} {"train_loss": -7.170553207397461, "global_step": 23450, "epoch": 139} {"train_loss": -7.0443315505981445, "global_step": 23451, "epoch": 139} {"train_loss": -6.845930099487305, "global_step": 23452, "epoch": 139} {"train_loss": -6.872828960418701, "global_step": 23453, "epoch": 139} {"train_loss": -7.088411808013916, "global_step": 23454, "epoch": 139} {"train_loss": -7.125195503234863, "global_step": 23455, "epoch": 139} {"train_loss": -7.079351902008057, "global_step": 23456, "epoch": 139} {"train_loss": -7.146203994750977, "global_step": 23457, "epoch": 139} {"train_loss": -7.334347248077393, "global_step": 23458, "epoch": 139} {"train_loss": -7.1013970375061035, "global_step": 23459, "epoch": 139} {"train_loss": -7.152968406677246, "global_step": 23460, "epoch": 139} {"train_loss": -7.139312744140625, "global_step": 23461, "epoch": 139} {"train_loss": -7.222142219543457, "global_step": 23462, "epoch": 139} {"train_loss": -7.051547050476074, "global_step": 23463, "epoch": 139} {"train_loss": -7.156673431396484, "global_step": 23464, "epoch": 139} {"train_loss": -7.053203582763672, "global_step": 23465, "epoch": 139} {"train_loss": -7.091451644897461, "global_step": 23466, "epoch": 139} {"train_loss": -7.255348205566406, "global_step": 23467, "epoch": 139} {"train_loss": -7.190267562866211, "global_step": 23468, "epoch": 139} {"train_loss": -6.98379373550415, "global_step": 23469, "epoch": 139} {"train_loss": -7.151097297668457, "global_step": 23470, "epoch": 139} {"train_loss": -7.026871204376221, "global_step": 23471, "epoch": 139} {"train_loss": -7.093686103820801, "global_step": 23472, "epoch": 139} {"train_loss": -7.318544864654541, "global_step": 23473, "epoch": 139} {"train_loss": -6.924442291259766, "global_step": 23474, "epoch": 139} {"train_loss": -7.178803443908691, "global_step": 23475, "epoch": 139} {"train_loss": -6.904707431793213, "global_step": 23476, "epoch": 139} {"train_loss": -7.023321628570557, "global_step": 23477, "epoch": 139} {"train_loss": -7.228182315826416, "global_step": 23478, "epoch": 139} {"train_loss": -7.041165351867676, "global_step": 23479, "epoch": 139} {"train_loss": -7.317347526550293, "global_step": 23480, "epoch": 139} {"train_loss": -7.223638534545898, "global_step": 23481, "epoch": 139} {"train_loss": -7.027956962585449, "global_step": 23482, "epoch": 139} {"train_loss": -6.947269439697266, "global_step": 23483, "epoch": 139} {"train_loss": -6.849807262420654, "global_step": 23484, "epoch": 139} {"train_loss": -6.868047714233398, "global_step": 23485, "epoch": 139} {"train_loss": -7.175508499145508, "global_step": 23486, "epoch": 139} {"train_loss": -6.578780174255371, "global_step": 23487, "epoch": 139} {"train_loss": -6.853981971740723, "global_step": 23488, "epoch": 139} {"train_loss": -6.82232666015625, "global_step": 23489, "epoch": 139} {"train_loss": -6.984128475189209, "global_step": 23490, "epoch": 139} {"train_loss": -7.155064582824707, "global_step": 23491, "epoch": 139} {"train_loss": -6.968099117279053, "global_step": 23492, "epoch": 139} {"train_loss": -6.975667476654053, "global_step": 23493, "epoch": 139} {"train_loss": -6.7629714012146, "global_step": 23494, "epoch": 139} {"train_loss": -7.01296854019165, "global_step": 23495, "epoch": 139} {"train_loss": -6.834794521331787, "global_step": 23496, "epoch": 139} {"train_loss": -6.92234992980957, "global_step": 23497, "epoch": 139} {"train_loss": -6.926268577575684, "global_step": 23498, "epoch": 139} {"train_loss": -7.063015937805176, "global_step": 23499, "epoch": 139} {"train_loss": -7.027550220489502, "global_step": 23500, "epoch": 139} {"train_loss": -6.757652282714844, "global_step": 23501, "epoch": 139} {"train_loss": -7.009313106536865, "global_step": 23502, "epoch": 139} {"train_loss": -6.921992301940918, "global_step": 23503, "epoch": 139} {"train_loss": -6.99366569519043, "global_step": 23504, "epoch": 139} {"train_loss": -6.803119659423828, "global_step": 23505, "epoch": 139} {"train_loss": -7.184191703796387, "global_step": 23506, "epoch": 139} {"train_loss": -7.169037818908691, "global_step": 23507, "epoch": 139} {"train_loss": -7.1524810791015625, "global_step": 23508, "epoch": 139} {"train_loss": -7.0943098068237305, "global_step": 23509, "epoch": 139} {"train_loss": -6.8952202796936035, "global_step": 23510, "epoch": 139} {"train_loss": -7.207253456115723, "global_step": 23511, "epoch": 139} {"train_loss": -7.255437850952148, "global_step": 23512, "epoch": 139} {"train_loss": -7.351646423339844, "global_step": 23513, "epoch": 139} {"train_loss": -6.84259033203125, "global_step": 23514, "epoch": 139} {"train_loss": -6.911044120788574, "global_step": 23515, "epoch": 139} {"train_loss": -7.1064772605896, "global_step": 23516, "epoch": 139} {"train_loss": -7.0229997634887695, "global_step": 23517, "epoch": 139} {"train_loss": -7.269286155700684, "global_step": 23518, "epoch": 139} {"train_loss": -6.995686982359205, "global_step": 23519, "epoch": 139, "val_loss": 203543.390625} {"train_loss": -6.919339656829834, "global_step": 23520, "epoch": 140} {"train_loss": -7.265804290771484, "global_step": 23521, "epoch": 140} {"train_loss": -6.889955520629883, "global_step": 23522, "epoch": 140} {"train_loss": -7.140859603881836, "global_step": 23523, "epoch": 140} {"train_loss": -6.912093162536621, "global_step": 23524, "epoch": 140} {"train_loss": -7.073380470275879, "global_step": 23525, "epoch": 140} {"train_loss": -7.05071496963501, "global_step": 23526, "epoch": 140} {"train_loss": -6.9322404861450195, "global_step": 23527, "epoch": 140} {"train_loss": -6.878601551055908, "global_step": 23528, "epoch": 140} {"train_loss": -6.924614429473877, "global_step": 23529, "epoch": 140} {"train_loss": -6.995304107666016, "global_step": 23530, "epoch": 140} {"train_loss": -6.796897888183594, "global_step": 23531, "epoch": 140} {"train_loss": -7.074074745178223, "global_step": 23532, "epoch": 140} {"train_loss": -6.9477691650390625, "global_step": 23533, "epoch": 140} {"train_loss": -7.021846771240234, "global_step": 23534, "epoch": 140} {"train_loss": -7.14113712310791, "global_step": 23535, "epoch": 140} {"train_loss": -6.99280309677124, "global_step": 23536, "epoch": 140} {"train_loss": -7.139081954956055, "global_step": 23537, "epoch": 140} {"train_loss": -7.161588191986084, "global_step": 23538, "epoch": 140} {"train_loss": -6.779197692871094, "global_step": 23539, "epoch": 140} {"train_loss": -7.157985687255859, "global_step": 23540, "epoch": 140} {"train_loss": -7.101822376251221, "global_step": 23541, "epoch": 140} {"train_loss": -7.274839878082275, "global_step": 23542, "epoch": 140} {"train_loss": -7.041602611541748, "global_step": 23543, "epoch": 140} {"train_loss": -7.104329586029053, "global_step": 23544, "epoch": 140} {"train_loss": -7.224852561950684, "global_step": 23545, "epoch": 140} {"train_loss": -7.160658836364746, "global_step": 23546, "epoch": 140} {"train_loss": -7.124605178833008, "global_step": 23547, "epoch": 140} {"train_loss": -7.130321502685547, "global_step": 23548, "epoch": 140} {"train_loss": -7.342703819274902, "global_step": 23549, "epoch": 140} {"train_loss": -7.089925289154053, "global_step": 23550, "epoch": 140} {"train_loss": -7.108055114746094, "global_step": 23551, "epoch": 140} {"train_loss": -6.939702033996582, "global_step": 23552, "epoch": 140} {"train_loss": -6.957907676696777, "global_step": 23553, "epoch": 140} {"train_loss": -7.00285530090332, "global_step": 23554, "epoch": 140} {"train_loss": -7.100518226623535, "global_step": 23555, "epoch": 140} {"train_loss": -6.995173454284668, "global_step": 23556, "epoch": 140} {"train_loss": -6.807751178741455, "global_step": 23557, "epoch": 140} {"train_loss": -7.048298358917236, "global_step": 23558, "epoch": 140} {"train_loss": -7.1729631423950195, "global_step": 23559, "epoch": 140} {"train_loss": -7.173990726470947, "global_step": 23560, "epoch": 140} {"train_loss": -7.208126068115234, "global_step": 23561, "epoch": 140} {"train_loss": -6.9647111892700195, "global_step": 23562, "epoch": 140} {"train_loss": -7.189658164978027, "global_step": 23563, "epoch": 140} {"train_loss": -7.037619113922119, "global_step": 23564, "epoch": 140} {"train_loss": -7.043105125427246, "global_step": 23565, "epoch": 140} {"train_loss": -7.165340423583984, "global_step": 23566, "epoch": 140} {"train_loss": -7.317747592926025, "global_step": 23567, "epoch": 140} {"train_loss": -6.879512786865234, "global_step": 23568, "epoch": 140} {"train_loss": -7.078244209289551, "global_step": 23569, "epoch": 140} {"train_loss": -7.034440040588379, "global_step": 23570, "epoch": 140} {"train_loss": -7.225016117095947, "global_step": 23571, "epoch": 140} {"train_loss": -7.1282501220703125, "global_step": 23572, "epoch": 140} {"train_loss": -7.088741779327393, "global_step": 23573, "epoch": 140} {"train_loss": -7.035444259643555, "global_step": 23574, "epoch": 140} {"train_loss": -6.880563735961914, "global_step": 23575, "epoch": 140} {"train_loss": -6.843876361846924, "global_step": 23576, "epoch": 140} {"train_loss": -7.263615131378174, "global_step": 23577, "epoch": 140} {"train_loss": -6.98856258392334, "global_step": 23578, "epoch": 140} {"train_loss": -6.9621782302856445, "global_step": 23579, "epoch": 140} {"train_loss": -6.930936813354492, "global_step": 23580, "epoch": 140} {"train_loss": -6.961418151855469, "global_step": 23581, "epoch": 140} {"train_loss": -7.026512145996094, "global_step": 23582, "epoch": 140} {"train_loss": -6.965178489685059, "global_step": 23583, "epoch": 140} {"train_loss": -7.194829940795898, "global_step": 23584, "epoch": 140} {"train_loss": -7.301767349243164, "global_step": 23585, "epoch": 140} {"train_loss": -6.995884895324707, "global_step": 23586, "epoch": 140} {"train_loss": -7.141807556152344, "global_step": 23587, "epoch": 140} {"train_loss": -7.05449914932251, "global_step": 23588, "epoch": 140} {"train_loss": -7.029026985168457, "global_step": 23589, "epoch": 140} {"train_loss": -7.060290813446045, "global_step": 23590, "epoch": 140} {"train_loss": -7.07352876663208, "global_step": 23591, "epoch": 140} {"train_loss": -7.27252197265625, "global_step": 23592, "epoch": 140} {"train_loss": -7.177211761474609, "global_step": 23593, "epoch": 140} {"train_loss": -7.118283271789551, "global_step": 23594, "epoch": 140} {"train_loss": -7.087031364440918, "global_step": 23595, "epoch": 140} {"train_loss": -7.078301429748535, "global_step": 23596, "epoch": 140} {"train_loss": -7.0540289878845215, "global_step": 23597, "epoch": 140} {"train_loss": -7.13144063949585, "global_step": 23598, "epoch": 140} {"train_loss": -7.150120735168457, "global_step": 23599, "epoch": 140} {"train_loss": -6.923783302307129, "global_step": 23600, "epoch": 140} {"train_loss": -7.061491966247559, "global_step": 23601, "epoch": 140} {"train_loss": -7.134072780609131, "global_step": 23602, "epoch": 140} {"train_loss": -7.173120498657227, "global_step": 23603, "epoch": 140} {"train_loss": -7.098125457763672, "global_step": 23604, "epoch": 140} {"train_loss": -7.046707630157471, "global_step": 23605, "epoch": 140} {"train_loss": -7.0980706214904785, "global_step": 23606, "epoch": 140} {"train_loss": -6.885256767272949, "global_step": 23607, "epoch": 140} {"train_loss": -7.197366237640381, "global_step": 23608, "epoch": 140} {"train_loss": -7.094705104827881, "global_step": 23609, "epoch": 140} {"train_loss": -7.171988487243652, "global_step": 23610, "epoch": 140} {"train_loss": -7.048003196716309, "global_step": 23611, "epoch": 140} {"train_loss": -7.177150726318359, "global_step": 23612, "epoch": 140} {"train_loss": -7.363891124725342, "global_step": 23613, "epoch": 140} {"train_loss": -6.814704895019531, "global_step": 23614, "epoch": 140} {"train_loss": -7.248547554016113, "global_step": 23615, "epoch": 140} {"train_loss": -7.037972927093506, "global_step": 23616, "epoch": 140} {"train_loss": -7.2313995361328125, "global_step": 23617, "epoch": 140} {"train_loss": -6.999544143676758, "global_step": 23618, "epoch": 140} {"train_loss": -7.282985687255859, "global_step": 23619, "epoch": 140} {"train_loss": -7.214359283447266, "global_step": 23620, "epoch": 140} {"train_loss": -7.161276817321777, "global_step": 23621, "epoch": 140} {"train_loss": -7.141003131866455, "global_step": 23622, "epoch": 140} {"train_loss": -6.940528392791748, "global_step": 23623, "epoch": 140} {"train_loss": -7.198213577270508, "global_step": 23624, "epoch": 140} {"train_loss": -7.368241786956787, "global_step": 23625, "epoch": 140} {"train_loss": -7.105010986328125, "global_step": 23626, "epoch": 140} {"train_loss": -7.196723937988281, "global_step": 23627, "epoch": 140} {"train_loss": -7.465811729431152, "global_step": 23628, "epoch": 140} {"train_loss": -7.211629867553711, "global_step": 23629, "epoch": 140} {"train_loss": -7.287538051605225, "global_step": 23630, "epoch": 140} {"train_loss": -7.318193435668945, "global_step": 23631, "epoch": 140} {"train_loss": -7.009528160095215, "global_step": 23632, "epoch": 140} {"train_loss": -7.272690296173096, "global_step": 23633, "epoch": 140} {"train_loss": -6.951346397399902, "global_step": 23634, "epoch": 140} {"train_loss": -7.238022327423096, "global_step": 23635, "epoch": 140} {"train_loss": -6.881399154663086, "global_step": 23636, "epoch": 140} {"train_loss": -7.173811912536621, "global_step": 23637, "epoch": 140} {"train_loss": -6.970659255981445, "global_step": 23638, "epoch": 140} {"train_loss": -7.009617805480957, "global_step": 23639, "epoch": 140} {"train_loss": -7.091861724853516, "global_step": 23640, "epoch": 140} {"train_loss": -6.919900417327881, "global_step": 23641, "epoch": 140} {"train_loss": -6.895573616027832, "global_step": 23642, "epoch": 140} {"train_loss": -6.7919745445251465, "global_step": 23643, "epoch": 140} {"train_loss": -7.026601791381836, "global_step": 23644, "epoch": 140} {"train_loss": -6.9686598777771, "global_step": 23645, "epoch": 140} {"train_loss": -6.947111129760742, "global_step": 23646, "epoch": 140} {"train_loss": -6.933778762817383, "global_step": 23647, "epoch": 140} {"train_loss": -6.979856014251709, "global_step": 23648, "epoch": 140} {"train_loss": -6.6678924560546875, "global_step": 23649, "epoch": 140} {"train_loss": -6.718695640563965, "global_step": 23650, "epoch": 140} {"train_loss": -7.015490531921387, "global_step": 23651, "epoch": 140} {"train_loss": -6.874643325805664, "global_step": 23652, "epoch": 140} {"train_loss": -7.2095842361450195, "global_step": 23653, "epoch": 140} {"train_loss": -6.96424674987793, "global_step": 23654, "epoch": 140} {"train_loss": -7.095139980316162, "global_step": 23655, "epoch": 140} {"train_loss": -7.176266670227051, "global_step": 23656, "epoch": 140} {"train_loss": -6.933724403381348, "global_step": 23657, "epoch": 140} {"train_loss": -7.0223388671875, "global_step": 23658, "epoch": 140} {"train_loss": -7.153393745422363, "global_step": 23659, "epoch": 140} {"train_loss": -7.211084365844727, "global_step": 23660, "epoch": 140} {"train_loss": -7.1445441246032715, "global_step": 23661, "epoch": 140} {"train_loss": -7.026325702667236, "global_step": 23662, "epoch": 140} {"train_loss": -7.236670017242432, "global_step": 23663, "epoch": 140} {"train_loss": -6.995697021484375, "global_step": 23664, "epoch": 140} {"train_loss": -7.1343302726745605, "global_step": 23665, "epoch": 140} {"train_loss": -7.22067403793335, "global_step": 23666, "epoch": 140} {"train_loss": -7.230225563049316, "global_step": 23667, "epoch": 140} {"train_loss": -7.083563804626465, "global_step": 23668, "epoch": 140} {"train_loss": -6.967720985412598, "global_step": 23669, "epoch": 140} {"train_loss": -6.95829439163208, "global_step": 23670, "epoch": 140} {"train_loss": -6.970341682434082, "global_step": 23671, "epoch": 140} {"train_loss": -6.955404281616211, "global_step": 23672, "epoch": 140} {"train_loss": -6.898867607116699, "global_step": 23673, "epoch": 140} {"train_loss": -7.115163803100586, "global_step": 23674, "epoch": 140} {"train_loss": -6.797204971313477, "global_step": 23675, "epoch": 140} {"train_loss": -7.221658706665039, "global_step": 23676, "epoch": 140} {"train_loss": -6.887665748596191, "global_step": 23677, "epoch": 140} {"train_loss": -7.059025764465332, "global_step": 23678, "epoch": 140} {"train_loss": -7.084592819213867, "global_step": 23679, "epoch": 140} {"train_loss": -7.1277055740356445, "global_step": 23680, "epoch": 140} {"train_loss": -7.038114547729492, "global_step": 23681, "epoch": 140} {"train_loss": -6.860378742218018, "global_step": 23682, "epoch": 140} {"train_loss": -6.926031112670898, "global_step": 23683, "epoch": 140} {"train_loss": -7.1947760581970215, "global_step": 23684, "epoch": 140} {"train_loss": -6.784770965576172, "global_step": 23685, "epoch": 140} {"train_loss": -7.004865646362305, "global_step": 23686, "epoch": 140} {"train_loss": -7.0644573512531466, "global_step": 23687, "epoch": 140, "val_loss": 204238.109375, "train_action_mse_error": 17.77992057800293} {"train_loss": -6.93431282043457, "global_step": 23688, "epoch": 141} {"train_loss": -6.60821533203125, "global_step": 23689, "epoch": 141} {"train_loss": -6.9408464431762695, "global_step": 23690, "epoch": 141} {"train_loss": -6.831232070922852, "global_step": 23691, "epoch": 141} {"train_loss": -6.522538185119629, "global_step": 23692, "epoch": 141} {"train_loss": -7.146257400512695, "global_step": 23693, "epoch": 141} {"train_loss": -6.580810546875, "global_step": 23694, "epoch": 141} {"train_loss": -7.004956245422363, "global_step": 23695, "epoch": 141} {"train_loss": -6.6428303718566895, "global_step": 23696, "epoch": 141} {"train_loss": -6.710050582885742, "global_step": 23697, "epoch": 141} {"train_loss": -6.9850358963012695, "global_step": 23698, "epoch": 141} {"train_loss": -6.899280548095703, "global_step": 23699, "epoch": 141} {"train_loss": -6.939597129821777, "global_step": 23700, "epoch": 141} {"train_loss": -6.9700446128845215, "global_step": 23701, "epoch": 141} {"train_loss": -6.787487983703613, "global_step": 23702, "epoch": 141} {"train_loss": -7.108616828918457, "global_step": 23703, "epoch": 141} {"train_loss": -6.8480682373046875, "global_step": 23704, "epoch": 141} {"train_loss": -6.971117973327637, "global_step": 23705, "epoch": 141} {"train_loss": -7.196001052856445, "global_step": 23706, "epoch": 141} {"train_loss": -6.772594928741455, "global_step": 23707, "epoch": 141} {"train_loss": -7.014132499694824, "global_step": 23708, "epoch": 141} {"train_loss": -6.907894134521484, "global_step": 23709, "epoch": 141} {"train_loss": -7.026537895202637, "global_step": 23710, "epoch": 141} {"train_loss": -7.021102428436279, "global_step": 23711, "epoch": 141} {"train_loss": -6.765931129455566, "global_step": 23712, "epoch": 141} {"train_loss": -6.918771266937256, "global_step": 23713, "epoch": 141} {"train_loss": -6.993854522705078, "global_step": 23714, "epoch": 141} {"train_loss": -6.85709285736084, "global_step": 23715, "epoch": 141} {"train_loss": -7.098156929016113, "global_step": 23716, "epoch": 141} {"train_loss": -7.092276573181152, "global_step": 23717, "epoch": 141} {"train_loss": -7.093606948852539, "global_step": 23718, "epoch": 141} {"train_loss": -7.078656196594238, "global_step": 23719, "epoch": 141} {"train_loss": -7.0353899002075195, "global_step": 23720, "epoch": 141} {"train_loss": -6.873812675476074, "global_step": 23721, "epoch": 141} {"train_loss": -7.162328243255615, "global_step": 23722, "epoch": 141} {"train_loss": -7.081352710723877, "global_step": 23723, "epoch": 141} {"train_loss": -6.890671253204346, "global_step": 23724, "epoch": 141} {"train_loss": -7.262325763702393, "global_step": 23725, "epoch": 141} {"train_loss": -6.875514030456543, "global_step": 23726, "epoch": 141} {"train_loss": -7.19476318359375, "global_step": 23727, "epoch": 141} {"train_loss": -6.9777140617370605, "global_step": 23728, "epoch": 141} {"train_loss": -6.9958391189575195, "global_step": 23729, "epoch": 141} {"train_loss": -7.021204471588135, "global_step": 23730, "epoch": 141} {"train_loss": -6.96644926071167, "global_step": 23731, "epoch": 141} {"train_loss": -7.240998268127441, "global_step": 23732, "epoch": 141} {"train_loss": -7.013216972351074, "global_step": 23733, "epoch": 141} {"train_loss": -6.671463966369629, "global_step": 23734, "epoch": 141} {"train_loss": -6.872788429260254, "global_step": 23735, "epoch": 141} {"train_loss": -7.112066268920898, "global_step": 23736, "epoch": 141} {"train_loss": -7.108391284942627, "global_step": 23737, "epoch": 141} {"train_loss": -6.612102508544922, "global_step": 23738, "epoch": 141} {"train_loss": -6.936590194702148, "global_step": 23739, "epoch": 141} {"train_loss": -6.829626083374023, "global_step": 23740, "epoch": 141} {"train_loss": -7.078092098236084, "global_step": 23741, "epoch": 141} {"train_loss": -7.098024368286133, "global_step": 23742, "epoch": 141} {"train_loss": -7.0964813232421875, "global_step": 23743, "epoch": 141} {"train_loss": -7.184759140014648, "global_step": 23744, "epoch": 141} {"train_loss": -6.977137565612793, "global_step": 23745, "epoch": 141} {"train_loss": -6.9118266105651855, "global_step": 23746, "epoch": 141} {"train_loss": -7.078039169311523, "global_step": 23747, "epoch": 141} {"train_loss": -7.182003021240234, "global_step": 23748, "epoch": 141} {"train_loss": -7.12740421295166, "global_step": 23749, "epoch": 141} {"train_loss": -7.239510536193848, "global_step": 23750, "epoch": 141} {"train_loss": -7.02509880065918, "global_step": 23751, "epoch": 141} {"train_loss": -7.292335510253906, "global_step": 23752, "epoch": 141} {"train_loss": -6.9918012619018555, "global_step": 23753, "epoch": 141} {"train_loss": -7.019684791564941, "global_step": 23754, "epoch": 141} {"train_loss": -7.110449314117432, "global_step": 23755, "epoch": 141} {"train_loss": -7.088871002197266, "global_step": 23756, "epoch": 141} {"train_loss": -7.043495178222656, "global_step": 23757, "epoch": 141} {"train_loss": -7.199134349822998, "global_step": 23758, "epoch": 141} {"train_loss": -7.160405158996582, "global_step": 23759, "epoch": 141} {"train_loss": -7.212122917175293, "global_step": 23760, "epoch": 141} {"train_loss": -6.919929504394531, "global_step": 23761, "epoch": 141} {"train_loss": -7.093116283416748, "global_step": 23762, "epoch": 141} {"train_loss": -7.097431182861328, "global_step": 23763, "epoch": 141} {"train_loss": -7.0826544761657715, "global_step": 23764, "epoch": 141} {"train_loss": -7.184789657592773, "global_step": 23765, "epoch": 141} {"train_loss": -6.834705829620361, "global_step": 23766, "epoch": 141} {"train_loss": -7.082803249359131, "global_step": 23767, "epoch": 141} {"train_loss": -7.110712051391602, "global_step": 23768, "epoch": 141} {"train_loss": -7.045130252838135, "global_step": 23769, "epoch": 141} {"train_loss": -7.248109340667725, "global_step": 23770, "epoch": 141} {"train_loss": -7.248892307281494, "global_step": 23771, "epoch": 141} {"train_loss": -7.1587419509887695, "global_step": 23772, "epoch": 141} {"train_loss": -7.104440212249756, "global_step": 23773, "epoch": 141} {"train_loss": -7.176333427429199, "global_step": 23774, "epoch": 141} {"train_loss": -7.116206645965576, "global_step": 23775, "epoch": 141} {"train_loss": -7.134893894195557, "global_step": 23776, "epoch": 141} {"train_loss": -6.970648765563965, "global_step": 23777, "epoch": 141} {"train_loss": -7.123690605163574, "global_step": 23778, "epoch": 141} {"train_loss": -7.156908988952637, "global_step": 23779, "epoch": 141} {"train_loss": -7.196020126342773, "global_step": 23780, "epoch": 141} {"train_loss": -7.206620693206787, "global_step": 23781, "epoch": 141} {"train_loss": -7.158700942993164, "global_step": 23782, "epoch": 141} {"train_loss": -7.144140243530273, "global_step": 23783, "epoch": 141} {"train_loss": -6.967301845550537, "global_step": 23784, "epoch": 141} {"train_loss": -7.224819660186768, "global_step": 23785, "epoch": 141} {"train_loss": -7.158264636993408, "global_step": 23786, "epoch": 141} {"train_loss": -7.287074565887451, "global_step": 23787, "epoch": 141} {"train_loss": -7.140341281890869, "global_step": 23788, "epoch": 141} {"train_loss": -7.184138774871826, "global_step": 23789, "epoch": 141} {"train_loss": -7.132046699523926, "global_step": 23790, "epoch": 141} {"train_loss": -7.0487494468688965, "global_step": 23791, "epoch": 141} {"train_loss": -6.9952850341796875, "global_step": 23792, "epoch": 141} {"train_loss": -7.117332935333252, "global_step": 23793, "epoch": 141} {"train_loss": -7.074519157409668, "global_step": 23794, "epoch": 141} {"train_loss": -7.104307651519775, "global_step": 23795, "epoch": 141} {"train_loss": -7.020218849182129, "global_step": 23796, "epoch": 141} {"train_loss": -6.972655773162842, "global_step": 23797, "epoch": 141} {"train_loss": -7.132422924041748, "global_step": 23798, "epoch": 141} {"train_loss": -7.036245346069336, "global_step": 23799, "epoch": 141} {"train_loss": -7.024798393249512, "global_step": 23800, "epoch": 141} {"train_loss": -7.0392045974731445, "global_step": 23801, "epoch": 141} {"train_loss": -7.091494560241699, "global_step": 23802, "epoch": 141} {"train_loss": -7.190800666809082, "global_step": 23803, "epoch": 141} {"train_loss": -7.254306793212891, "global_step": 23804, "epoch": 141} {"train_loss": -7.2767510414123535, "global_step": 23805, "epoch": 141} {"train_loss": -6.874903678894043, "global_step": 23806, "epoch": 141} {"train_loss": -7.0241899490356445, "global_step": 23807, "epoch": 141} {"train_loss": -7.012668609619141, "global_step": 23808, "epoch": 141} {"train_loss": -7.209327697753906, "global_step": 23809, "epoch": 141} {"train_loss": -6.812443256378174, "global_step": 23810, "epoch": 141} {"train_loss": -7.042543411254883, "global_step": 23811, "epoch": 141} {"train_loss": -6.917244911193848, "global_step": 23812, "epoch": 141} {"train_loss": -6.964715480804443, "global_step": 23813, "epoch": 141} {"train_loss": -6.980103015899658, "global_step": 23814, "epoch": 141} {"train_loss": -7.013303756713867, "global_step": 23815, "epoch": 141} {"train_loss": -7.236618518829346, "global_step": 23816, "epoch": 141} {"train_loss": -6.971327781677246, "global_step": 23817, "epoch": 141} {"train_loss": -7.166659355163574, "global_step": 23818, "epoch": 141} {"train_loss": -7.15036678314209, "global_step": 23819, "epoch": 141} {"train_loss": -7.18789529800415, "global_step": 23820, "epoch": 141} {"train_loss": -7.008478164672852, "global_step": 23821, "epoch": 141} {"train_loss": -7.168387413024902, "global_step": 23822, "epoch": 141} {"train_loss": -7.310277938842773, "global_step": 23823, "epoch": 141} {"train_loss": -7.068238258361816, "global_step": 23824, "epoch": 141} {"train_loss": -7.3496832847595215, "global_step": 23825, "epoch": 141} {"train_loss": -7.339655876159668, "global_step": 23826, "epoch": 141} {"train_loss": -7.167659759521484, "global_step": 23827, "epoch": 141} {"train_loss": -7.130645751953125, "global_step": 23828, "epoch": 141} {"train_loss": -7.281513214111328, "global_step": 23829, "epoch": 141} {"train_loss": -7.181605339050293, "global_step": 23830, "epoch": 141} {"train_loss": -6.706129550933838, "global_step": 23831, "epoch": 141} {"train_loss": -7.003854751586914, "global_step": 23832, "epoch": 141} {"train_loss": -6.840866565704346, "global_step": 23833, "epoch": 141} {"train_loss": -7.228423118591309, "global_step": 23834, "epoch": 141} {"train_loss": -6.996603012084961, "global_step": 23835, "epoch": 141} {"train_loss": -6.805842399597168, "global_step": 23836, "epoch": 141} {"train_loss": -6.996227264404297, "global_step": 23837, "epoch": 141} {"train_loss": -6.911151885986328, "global_step": 23838, "epoch": 141} {"train_loss": -7.161046504974365, "global_step": 23839, "epoch": 141} {"train_loss": -7.11673641204834, "global_step": 23840, "epoch": 141} {"train_loss": -6.939785957336426, "global_step": 23841, "epoch": 141} {"train_loss": -6.713568687438965, "global_step": 23842, "epoch": 141} {"train_loss": -6.731522560119629, "global_step": 23843, "epoch": 141} {"train_loss": -6.856173038482666, "global_step": 23844, "epoch": 141} {"train_loss": -7.048072814941406, "global_step": 23845, "epoch": 141} {"train_loss": -6.719666481018066, "global_step": 23846, "epoch": 141} {"train_loss": -6.796053886413574, "global_step": 23847, "epoch": 141} {"train_loss": -6.784214973449707, "global_step": 23848, "epoch": 141} {"train_loss": -6.403817653656006, "global_step": 23849, "epoch": 141} {"train_loss": -6.920622825622559, "global_step": 23850, "epoch": 141} {"train_loss": -6.820436000823975, "global_step": 23851, "epoch": 141} {"train_loss": -6.862759113311768, "global_step": 23852, "epoch": 141} {"train_loss": -7.0235185623168945, "global_step": 23853, "epoch": 141} {"train_loss": -7.0681352615356445, "global_step": 23854, "epoch": 141} {"train_loss": -7.023117738110678, "global_step": 23855, "epoch": 141, "val_loss": 203763.5} {"train_loss": -6.887012481689453, "global_step": 23856, "epoch": 142} {"train_loss": -6.7762651443481445, "global_step": 23857, "epoch": 142} {"train_loss": -6.873291969299316, "global_step": 23858, "epoch": 142} {"train_loss": -7.119864463806152, "global_step": 23859, "epoch": 142} {"train_loss": -7.18140983581543, "global_step": 23860, "epoch": 142} {"train_loss": -7.007754802703857, "global_step": 23861, "epoch": 142} {"train_loss": -7.213936805725098, "global_step": 23862, "epoch": 142} {"train_loss": -7.067849159240723, "global_step": 23863, "epoch": 142} {"train_loss": -7.142642021179199, "global_step": 23864, "epoch": 142} {"train_loss": -7.2686591148376465, "global_step": 23865, "epoch": 142} {"train_loss": -7.209975242614746, "global_step": 23866, "epoch": 142} {"train_loss": -7.213191032409668, "global_step": 23867, "epoch": 142} {"train_loss": -7.266839027404785, "global_step": 23868, "epoch": 142} {"train_loss": -7.227909088134766, "global_step": 23869, "epoch": 142} {"train_loss": -7.19677734375, "global_step": 23870, "epoch": 142} {"train_loss": -7.138241767883301, "global_step": 23871, "epoch": 142} {"train_loss": -7.263110160827637, "global_step": 23872, "epoch": 142} {"train_loss": -7.228678226470947, "global_step": 23873, "epoch": 142} {"train_loss": -7.154462814331055, "global_step": 23874, "epoch": 142} {"train_loss": -7.272064208984375, "global_step": 23875, "epoch": 142} {"train_loss": -6.757650375366211, "global_step": 23876, "epoch": 142} {"train_loss": -7.146709442138672, "global_step": 23877, "epoch": 142} {"train_loss": -6.920102119445801, "global_step": 23878, "epoch": 142} {"train_loss": -6.818436622619629, "global_step": 23879, "epoch": 142} {"train_loss": -6.801644325256348, "global_step": 23880, "epoch": 142} {"train_loss": -6.852619171142578, "global_step": 23881, "epoch": 142} {"train_loss": -6.756597518920898, "global_step": 23882, "epoch": 142} {"train_loss": -6.786559581756592, "global_step": 23883, "epoch": 142} {"train_loss": -7.013291358947754, "global_step": 23884, "epoch": 142} {"train_loss": -7.045525550842285, "global_step": 23885, "epoch": 142} {"train_loss": -6.740447998046875, "global_step": 23886, "epoch": 142} {"train_loss": -6.976178169250488, "global_step": 23887, "epoch": 142} {"train_loss": -6.91391658782959, "global_step": 23888, "epoch": 142} {"train_loss": -7.0411834716796875, "global_step": 23889, "epoch": 142} {"train_loss": -6.945882797241211, "global_step": 23890, "epoch": 142} {"train_loss": -7.083234786987305, "global_step": 23891, "epoch": 142} {"train_loss": -7.036840915679932, "global_step": 23892, "epoch": 142} {"train_loss": -7.117041110992432, "global_step": 23893, "epoch": 142} {"train_loss": -7.110263347625732, "global_step": 23894, "epoch": 142} {"train_loss": -6.885819435119629, "global_step": 23895, "epoch": 142} {"train_loss": -7.0439958572387695, "global_step": 23896, "epoch": 142} {"train_loss": -7.028962135314941, "global_step": 23897, "epoch": 142} {"train_loss": -7.135197162628174, "global_step": 23898, "epoch": 142} {"train_loss": -7.090637683868408, "global_step": 23899, "epoch": 142} {"train_loss": -7.148172855377197, "global_step": 23900, "epoch": 142} {"train_loss": -7.067281723022461, "global_step": 23901, "epoch": 142} {"train_loss": -7.239875793457031, "global_step": 23902, "epoch": 142} {"train_loss": -7.300816535949707, "global_step": 23903, "epoch": 142} {"train_loss": -7.199613094329834, "global_step": 23904, "epoch": 142} {"train_loss": -7.287369728088379, "global_step": 23905, "epoch": 142} {"train_loss": -7.281766414642334, "global_step": 23906, "epoch": 142} {"train_loss": -7.14691686630249, "global_step": 23907, "epoch": 142} {"train_loss": -7.314643859863281, "global_step": 23908, "epoch": 142} {"train_loss": -7.064579486846924, "global_step": 23909, "epoch": 142} {"train_loss": -7.2827467918396, "global_step": 23910, "epoch": 142} {"train_loss": -7.321616172790527, "global_step": 23911, "epoch": 142} {"train_loss": -7.304806709289551, "global_step": 23912, "epoch": 142} {"train_loss": -7.171136856079102, "global_step": 23913, "epoch": 142} {"train_loss": -7.186583995819092, "global_step": 23914, "epoch": 142} {"train_loss": -7.215447425842285, "global_step": 23915, "epoch": 142} {"train_loss": -7.055111408233643, "global_step": 23916, "epoch": 142} {"train_loss": -7.198803901672363, "global_step": 23917, "epoch": 142} {"train_loss": -7.319965362548828, "global_step": 23918, "epoch": 142} {"train_loss": -6.852356433868408, "global_step": 23919, "epoch": 142} {"train_loss": -6.907536506652832, "global_step": 23920, "epoch": 142} {"train_loss": -6.838731288909912, "global_step": 23921, "epoch": 142} {"train_loss": -7.015323162078857, "global_step": 23922, "epoch": 142} {"train_loss": -6.879952430725098, "global_step": 23923, "epoch": 142} {"train_loss": -7.047055244445801, "global_step": 23924, "epoch": 142} {"train_loss": -6.878702640533447, "global_step": 23925, "epoch": 142} {"train_loss": -7.148849964141846, "global_step": 23926, "epoch": 142} {"train_loss": -7.059839725494385, "global_step": 23927, "epoch": 142} {"train_loss": -7.3375043869018555, "global_step": 23928, "epoch": 142} {"train_loss": -7.151086807250977, "global_step": 23929, "epoch": 142} {"train_loss": -6.887475490570068, "global_step": 23930, "epoch": 142} {"train_loss": -7.200534343719482, "global_step": 23931, "epoch": 142} {"train_loss": -6.981651306152344, "global_step": 23932, "epoch": 142} {"train_loss": -7.315445899963379, "global_step": 23933, "epoch": 142} {"train_loss": -6.833315372467041, "global_step": 23934, "epoch": 142} {"train_loss": -7.243906497955322, "global_step": 23935, "epoch": 142} {"train_loss": -7.013132572174072, "global_step": 23936, "epoch": 142} {"train_loss": -7.182714462280273, "global_step": 23937, "epoch": 142} {"train_loss": -7.280113220214844, "global_step": 23938, "epoch": 142} {"train_loss": -6.908019065856934, "global_step": 23939, "epoch": 142} {"train_loss": -7.083255290985107, "global_step": 23940, "epoch": 142} {"train_loss": -7.029513835906982, "global_step": 23941, "epoch": 142} {"train_loss": -7.146092414855957, "global_step": 23942, "epoch": 142} {"train_loss": -6.836193084716797, "global_step": 23943, "epoch": 142} {"train_loss": -7.193790912628174, "global_step": 23944, "epoch": 142} {"train_loss": -6.959115505218506, "global_step": 23945, "epoch": 142} {"train_loss": -7.177933692932129, "global_step": 23946, "epoch": 142} {"train_loss": -7.13864803314209, "global_step": 23947, "epoch": 142} {"train_loss": -7.105531215667725, "global_step": 23948, "epoch": 142} {"train_loss": -6.969823837280273, "global_step": 23949, "epoch": 142} {"train_loss": -7.141858100891113, "global_step": 23950, "epoch": 142} {"train_loss": -7.1145172119140625, "global_step": 23951, "epoch": 142} {"train_loss": -7.1567487716674805, "global_step": 23952, "epoch": 142} {"train_loss": -6.930111885070801, "global_step": 23953, "epoch": 142} {"train_loss": -6.909627914428711, "global_step": 23954, "epoch": 142} {"train_loss": -6.953710079193115, "global_step": 23955, "epoch": 142} {"train_loss": -6.741414546966553, "global_step": 23956, "epoch": 142} {"train_loss": -6.790958404541016, "global_step": 23957, "epoch": 142} {"train_loss": -6.941702842712402, "global_step": 23958, "epoch": 142} {"train_loss": -6.955634117126465, "global_step": 23959, "epoch": 142} {"train_loss": -6.891994476318359, "global_step": 23960, "epoch": 142} {"train_loss": -7.008133411407471, "global_step": 23961, "epoch": 142} {"train_loss": -7.132983207702637, "global_step": 23962, "epoch": 142} {"train_loss": -7.131529808044434, "global_step": 23963, "epoch": 142} {"train_loss": -7.072512626647949, "global_step": 23964, "epoch": 142} {"train_loss": -7.117086410522461, "global_step": 23965, "epoch": 142} {"train_loss": -7.337027549743652, "global_step": 23966, "epoch": 142} {"train_loss": -6.946876525878906, "global_step": 23967, "epoch": 142} {"train_loss": -7.220648288726807, "global_step": 23968, "epoch": 142} {"train_loss": -7.059560775756836, "global_step": 23969, "epoch": 142} {"train_loss": -7.216824531555176, "global_step": 23970, "epoch": 142} {"train_loss": -7.1221394538879395, "global_step": 23971, "epoch": 142} {"train_loss": -7.194384574890137, "global_step": 23972, "epoch": 142} {"train_loss": -7.0418477058410645, "global_step": 23973, "epoch": 142} {"train_loss": -7.150923728942871, "global_step": 23974, "epoch": 142} {"train_loss": -7.124776363372803, "global_step": 23975, "epoch": 142} {"train_loss": -7.056020736694336, "global_step": 23976, "epoch": 142} {"train_loss": -7.2104902267456055, "global_step": 23977, "epoch": 142} {"train_loss": -6.872194290161133, "global_step": 23978, "epoch": 142} {"train_loss": -7.2430853843688965, "global_step": 23979, "epoch": 142} {"train_loss": -7.177645683288574, "global_step": 23980, "epoch": 142} {"train_loss": -7.323416233062744, "global_step": 23981, "epoch": 142} {"train_loss": -7.028907299041748, "global_step": 23982, "epoch": 142} {"train_loss": -6.895879745483398, "global_step": 23983, "epoch": 142} {"train_loss": -6.991558074951172, "global_step": 23984, "epoch": 142} {"train_loss": -6.946883201599121, "global_step": 23985, "epoch": 142} {"train_loss": -7.0155839920043945, "global_step": 23986, "epoch": 142} {"train_loss": -7.007394790649414, "global_step": 23987, "epoch": 142} {"train_loss": -7.02356481552124, "global_step": 23988, "epoch": 142} {"train_loss": -7.097816467285156, "global_step": 23989, "epoch": 142} {"train_loss": -6.777118682861328, "global_step": 23990, "epoch": 142} {"train_loss": -7.1302809715271, "global_step": 23991, "epoch": 142} {"train_loss": -6.993397235870361, "global_step": 23992, "epoch": 142} {"train_loss": -6.9921793937683105, "global_step": 23993, "epoch": 142} {"train_loss": -6.994491100311279, "global_step": 23994, "epoch": 142} {"train_loss": -7.206911087036133, "global_step": 23995, "epoch": 142} {"train_loss": -7.173488140106201, "global_step": 23996, "epoch": 142} {"train_loss": -6.854887962341309, "global_step": 23997, "epoch": 142} {"train_loss": -7.0090789794921875, "global_step": 23998, "epoch": 142} {"train_loss": -7.236251354217529, "global_step": 23999, "epoch": 142} {"train_loss": -7.273136615753174, "global_step": 24000, "epoch": 142} {"train_loss": -7.114444255828857, "global_step": 24001, "epoch": 142} {"train_loss": -7.083310127258301, "global_step": 24002, "epoch": 142} {"train_loss": -7.19069242477417, "global_step": 24003, "epoch": 142} {"train_loss": -7.065978527069092, "global_step": 24004, "epoch": 142} {"train_loss": -6.991736888885498, "global_step": 24005, "epoch": 142} {"train_loss": -7.1726179122924805, "global_step": 24006, "epoch": 142} {"train_loss": -7.208024978637695, "global_step": 24007, "epoch": 142} {"train_loss": -7.187220096588135, "global_step": 24008, "epoch": 142} {"train_loss": -7.220489978790283, "global_step": 24009, "epoch": 142} {"train_loss": -7.285017967224121, "global_step": 24010, "epoch": 142} {"train_loss": -7.1681599617004395, "global_step": 24011, "epoch": 142} {"train_loss": -7.209682464599609, "global_step": 24012, "epoch": 142} {"train_loss": -6.955483913421631, "global_step": 24013, "epoch": 142} {"train_loss": -7.288229942321777, "global_step": 24014, "epoch": 142} {"train_loss": -7.291831970214844, "global_step": 24015, "epoch": 142} {"train_loss": -7.139185428619385, "global_step": 24016, "epoch": 142} {"train_loss": -7.0475616455078125, "global_step": 24017, "epoch": 142} {"train_loss": -7.373546600341797, "global_step": 24018, "epoch": 142} {"train_loss": -7.205317497253418, "global_step": 24019, "epoch": 142} {"train_loss": -7.203902244567871, "global_step": 24020, "epoch": 142} {"train_loss": -7.17329740524292, "global_step": 24021, "epoch": 142} {"train_loss": -7.167787551879883, "global_step": 24022, "epoch": 142} {"train_loss": -7.085454060917809, "global_step": 24023, "epoch": 142, "val_loss": 201803.5625} {"train_loss": -7.020180702209473, "global_step": 24024, "epoch": 143} {"train_loss": -7.285857200622559, "global_step": 24025, "epoch": 143} {"train_loss": -7.032954692840576, "global_step": 24026, "epoch": 143} {"train_loss": -7.054365158081055, "global_step": 24027, "epoch": 143} {"train_loss": -6.947970390319824, "global_step": 24028, "epoch": 143} {"train_loss": -7.068353652954102, "global_step": 24029, "epoch": 143} {"train_loss": -6.706073760986328, "global_step": 24030, "epoch": 143} {"train_loss": -6.876579284667969, "global_step": 24031, "epoch": 143} {"train_loss": -6.950050354003906, "global_step": 24032, "epoch": 143} {"train_loss": -7.084789276123047, "global_step": 24033, "epoch": 143} {"train_loss": -6.827858924865723, "global_step": 24034, "epoch": 143} {"train_loss": -6.945088863372803, "global_step": 24035, "epoch": 143} {"train_loss": -7.069664478302002, "global_step": 24036, "epoch": 143} {"train_loss": -7.113914489746094, "global_step": 24037, "epoch": 143} {"train_loss": -6.819415092468262, "global_step": 24038, "epoch": 143} {"train_loss": -6.773802280426025, "global_step": 24039, "epoch": 143} {"train_loss": -7.120938301086426, "global_step": 24040, "epoch": 143} {"train_loss": -7.0000786781311035, "global_step": 24041, "epoch": 143} {"train_loss": -7.067183494567871, "global_step": 24042, "epoch": 143} {"train_loss": -7.0626220703125, "global_step": 24043, "epoch": 143} {"train_loss": -7.07283878326416, "global_step": 24044, "epoch": 143} {"train_loss": -6.874702453613281, "global_step": 24045, "epoch": 143} {"train_loss": -7.0260820388793945, "global_step": 24046, "epoch": 143} {"train_loss": -7.13349723815918, "global_step": 24047, "epoch": 143} {"train_loss": -7.085198879241943, "global_step": 24048, "epoch": 143} {"train_loss": -7.116724967956543, "global_step": 24049, "epoch": 143} {"train_loss": -6.91049861907959, "global_step": 24050, "epoch": 143} {"train_loss": -7.0517191886901855, "global_step": 24051, "epoch": 143} {"train_loss": -7.117262363433838, "global_step": 24052, "epoch": 143} {"train_loss": -7.23982048034668, "global_step": 24053, "epoch": 143} {"train_loss": -6.9136576652526855, "global_step": 24054, "epoch": 143} {"train_loss": -7.159273147583008, "global_step": 24055, "epoch": 143} {"train_loss": -7.245292663574219, "global_step": 24056, "epoch": 143} {"train_loss": -6.988096237182617, "global_step": 24057, "epoch": 143} {"train_loss": -6.958986282348633, "global_step": 24058, "epoch": 143} {"train_loss": -7.228470802307129, "global_step": 24059, "epoch": 143} {"train_loss": -7.061756134033203, "global_step": 24060, "epoch": 143} {"train_loss": -7.036270618438721, "global_step": 24061, "epoch": 143} {"train_loss": -7.173816204071045, "global_step": 24062, "epoch": 143} {"train_loss": -7.0767340660095215, "global_step": 24063, "epoch": 143} {"train_loss": -7.241152763366699, "global_step": 24064, "epoch": 143} {"train_loss": -6.762864112854004, "global_step": 24065, "epoch": 143} {"train_loss": -6.844729423522949, "global_step": 24066, "epoch": 143} {"train_loss": -6.769707679748535, "global_step": 24067, "epoch": 143} {"train_loss": -6.789107799530029, "global_step": 24068, "epoch": 143} {"train_loss": -7.123466491699219, "global_step": 24069, "epoch": 143} {"train_loss": -6.905855178833008, "global_step": 24070, "epoch": 143} {"train_loss": -7.130058288574219, "global_step": 24071, "epoch": 143} {"train_loss": -6.990482807159424, "global_step": 24072, "epoch": 143} {"train_loss": -6.8572998046875, "global_step": 24073, "epoch": 143} {"train_loss": -7.164364337921143, "global_step": 24074, "epoch": 143} {"train_loss": -6.907784461975098, "global_step": 24075, "epoch": 143} {"train_loss": -7.120059967041016, "global_step": 24076, "epoch": 143} {"train_loss": -6.963161468505859, "global_step": 24077, "epoch": 143} {"train_loss": -7.264667510986328, "global_step": 24078, "epoch": 143} {"train_loss": -7.110611438751221, "global_step": 24079, "epoch": 143} {"train_loss": -7.01885461807251, "global_step": 24080, "epoch": 143} {"train_loss": -7.075583457946777, "global_step": 24081, "epoch": 143} {"train_loss": -7.1724042892456055, "global_step": 24082, "epoch": 143} {"train_loss": -7.1909589767456055, "global_step": 24083, "epoch": 143} {"train_loss": -6.975625514984131, "global_step": 24084, "epoch": 143} {"train_loss": -7.169114589691162, "global_step": 24085, "epoch": 143} {"train_loss": -7.090768814086914, "global_step": 24086, "epoch": 143} {"train_loss": -7.191215515136719, "global_step": 24087, "epoch": 143} {"train_loss": -7.044093132019043, "global_step": 24088, "epoch": 143} {"train_loss": -7.0571699142456055, "global_step": 24089, "epoch": 143} {"train_loss": -6.913521766662598, "global_step": 24090, "epoch": 143} {"train_loss": -7.145354747772217, "global_step": 24091, "epoch": 143} {"train_loss": -7.038488388061523, "global_step": 24092, "epoch": 143} {"train_loss": -7.118233680725098, "global_step": 24093, "epoch": 143} {"train_loss": -7.343603610992432, "global_step": 24094, "epoch": 143} {"train_loss": -7.118570327758789, "global_step": 24095, "epoch": 143} {"train_loss": -7.206362247467041, "global_step": 24096, "epoch": 143} {"train_loss": -7.113470077514648, "global_step": 24097, "epoch": 143} {"train_loss": -6.971306324005127, "global_step": 24098, "epoch": 143} {"train_loss": -7.152030944824219, "global_step": 24099, "epoch": 143} {"train_loss": -7.20079231262207, "global_step": 24100, "epoch": 143} {"train_loss": -7.192270278930664, "global_step": 24101, "epoch": 143} {"train_loss": -7.029942035675049, "global_step": 24102, "epoch": 143} {"train_loss": -7.011665344238281, "global_step": 24103, "epoch": 143} {"train_loss": -7.312934398651123, "global_step": 24104, "epoch": 143} {"train_loss": -6.8674163818359375, "global_step": 24105, "epoch": 143} {"train_loss": -7.38681173324585, "global_step": 24106, "epoch": 143} {"train_loss": -7.141181945800781, "global_step": 24107, "epoch": 143} {"train_loss": -7.210261344909668, "global_step": 24108, "epoch": 143} {"train_loss": -7.165588855743408, "global_step": 24109, "epoch": 143} {"train_loss": -7.243273735046387, "global_step": 24110, "epoch": 143} {"train_loss": -7.0335187911987305, "global_step": 24111, "epoch": 143} {"train_loss": -7.160315036773682, "global_step": 24112, "epoch": 143} {"train_loss": -7.069817543029785, "global_step": 24113, "epoch": 143} {"train_loss": -7.01206111907959, "global_step": 24114, "epoch": 143} {"train_loss": -7.039974212646484, "global_step": 24115, "epoch": 143} {"train_loss": -7.067684173583984, "global_step": 24116, "epoch": 143} {"train_loss": -6.968609809875488, "global_step": 24117, "epoch": 143} {"train_loss": -7.322515964508057, "global_step": 24118, "epoch": 143} {"train_loss": -7.097796440124512, "global_step": 24119, "epoch": 143} {"train_loss": -7.11912727355957, "global_step": 24120, "epoch": 143} {"train_loss": -7.134889602661133, "global_step": 24121, "epoch": 143} {"train_loss": -7.167637825012207, "global_step": 24122, "epoch": 143} {"train_loss": -7.34773063659668, "global_step": 24123, "epoch": 143} {"train_loss": -7.157623291015625, "global_step": 24124, "epoch": 143} {"train_loss": -7.097522735595703, "global_step": 24125, "epoch": 143} {"train_loss": -7.134702682495117, "global_step": 24126, "epoch": 143} {"train_loss": -7.312233924865723, "global_step": 24127, "epoch": 143} {"train_loss": -7.25883674621582, "global_step": 24128, "epoch": 143} {"train_loss": -7.055957794189453, "global_step": 24129, "epoch": 143} {"train_loss": -7.138526439666748, "global_step": 24130, "epoch": 143} {"train_loss": -6.940696716308594, "global_step": 24131, "epoch": 143} {"train_loss": -7.362791061401367, "global_step": 24132, "epoch": 143} {"train_loss": -7.3008503913879395, "global_step": 24133, "epoch": 143} {"train_loss": -7.166576385498047, "global_step": 24134, "epoch": 143} {"train_loss": -7.176823616027832, "global_step": 24135, "epoch": 143} {"train_loss": -7.069265842437744, "global_step": 24136, "epoch": 143} {"train_loss": -7.188199520111084, "global_step": 24137, "epoch": 143} {"train_loss": -7.079266548156738, "global_step": 24138, "epoch": 143} {"train_loss": -7.403730392456055, "global_step": 24139, "epoch": 143} {"train_loss": -7.076187610626221, "global_step": 24140, "epoch": 143} {"train_loss": -6.956387519836426, "global_step": 24141, "epoch": 143} {"train_loss": -7.067384719848633, "global_step": 24142, "epoch": 143} {"train_loss": -7.23923397064209, "global_step": 24143, "epoch": 143} {"train_loss": -7.006167411804199, "global_step": 24144, "epoch": 143} {"train_loss": -7.129288196563721, "global_step": 24145, "epoch": 143} {"train_loss": -6.9932146072387695, "global_step": 24146, "epoch": 143} {"train_loss": -7.1287946701049805, "global_step": 24147, "epoch": 143} {"train_loss": -7.075405120849609, "global_step": 24148, "epoch": 143} {"train_loss": -7.134824752807617, "global_step": 24149, "epoch": 143} {"train_loss": -6.978508949279785, "global_step": 24150, "epoch": 143} {"train_loss": -7.072745323181152, "global_step": 24151, "epoch": 143} {"train_loss": -7.289112091064453, "global_step": 24152, "epoch": 143} {"train_loss": -6.752720832824707, "global_step": 24153, "epoch": 143} {"train_loss": -7.210533142089844, "global_step": 24154, "epoch": 143} {"train_loss": -6.863299369812012, "global_step": 24155, "epoch": 143} {"train_loss": -7.110340595245361, "global_step": 24156, "epoch": 143} {"train_loss": -6.80763053894043, "global_step": 24157, "epoch": 143} {"train_loss": -6.8937273025512695, "global_step": 24158, "epoch": 143} {"train_loss": -6.878292560577393, "global_step": 24159, "epoch": 143} {"train_loss": -6.894228935241699, "global_step": 24160, "epoch": 143} {"train_loss": -6.953444480895996, "global_step": 24161, "epoch": 143} {"train_loss": -7.161172866821289, "global_step": 24162, "epoch": 143} {"train_loss": -6.9103264808654785, "global_step": 24163, "epoch": 143} {"train_loss": -7.23552131652832, "global_step": 24164, "epoch": 143} {"train_loss": -7.103198528289795, "global_step": 24165, "epoch": 143} {"train_loss": -7.124420166015625, "global_step": 24166, "epoch": 143} {"train_loss": -6.920268535614014, "global_step": 24167, "epoch": 143} {"train_loss": -6.901236534118652, "global_step": 24168, "epoch": 143} {"train_loss": -7.089493751525879, "global_step": 24169, "epoch": 143} {"train_loss": -7.080588340759277, "global_step": 24170, "epoch": 143} {"train_loss": -7.329735279083252, "global_step": 24171, "epoch": 143} {"train_loss": -7.021142959594727, "global_step": 24172, "epoch": 143} {"train_loss": -7.268526554107666, "global_step": 24173, "epoch": 143} {"train_loss": -7.276035308837891, "global_step": 24174, "epoch": 143} {"train_loss": -7.007381439208984, "global_step": 24175, "epoch": 143} {"train_loss": -7.200037479400635, "global_step": 24176, "epoch": 143} {"train_loss": -7.237896919250488, "global_step": 24177, "epoch": 143} {"train_loss": -7.248018264770508, "global_step": 24178, "epoch": 143} {"train_loss": -7.38145637512207, "global_step": 24179, "epoch": 143} {"train_loss": -7.218466758728027, "global_step": 24180, "epoch": 143} {"train_loss": -7.347947120666504, "global_step": 24181, "epoch": 143} {"train_loss": -7.161373138427734, "global_step": 24182, "epoch": 143} {"train_loss": -7.283108711242676, "global_step": 24183, "epoch": 143} {"train_loss": -7.368354797363281, "global_step": 24184, "epoch": 143} {"train_loss": -7.082942962646484, "global_step": 24185, "epoch": 143} {"train_loss": -7.160390853881836, "global_step": 24186, "epoch": 143} {"train_loss": -7.34202241897583, "global_step": 24187, "epoch": 143} {"train_loss": -7.133944511413574, "global_step": 24188, "epoch": 143} {"train_loss": -7.284457206726074, "global_step": 24189, "epoch": 143} {"train_loss": -7.208388328552246, "global_step": 24190, "epoch": 143} {"train_loss": -7.091547239394415, "global_step": 24191, "epoch": 143, "val_loss": 202561.421875} {"train_loss": -7.218387603759766, "global_step": 24192, "epoch": 144} {"train_loss": -7.161896705627441, "global_step": 24193, "epoch": 144} {"train_loss": -7.1948561668396, "global_step": 24194, "epoch": 144} {"train_loss": -7.287519454956055, "global_step": 24195, "epoch": 144} {"train_loss": -7.071032524108887, "global_step": 24196, "epoch": 144} {"train_loss": -7.247420310974121, "global_step": 24197, "epoch": 144} {"train_loss": -7.2265238761901855, "global_step": 24198, "epoch": 144} {"train_loss": -7.224590301513672, "global_step": 24199, "epoch": 144} {"train_loss": -7.3161725997924805, "global_step": 24200, "epoch": 144} {"train_loss": -7.377704620361328, "global_step": 24201, "epoch": 144} {"train_loss": -7.144903659820557, "global_step": 24202, "epoch": 144} {"train_loss": -7.229108810424805, "global_step": 24203, "epoch": 144} {"train_loss": -7.322197437286377, "global_step": 24204, "epoch": 144} {"train_loss": -7.27055025100708, "global_step": 24205, "epoch": 144} {"train_loss": -7.064846992492676, "global_step": 24206, "epoch": 144} {"train_loss": -7.233485221862793, "global_step": 24207, "epoch": 144} {"train_loss": -7.142117977142334, "global_step": 24208, "epoch": 144} {"train_loss": -7.207448482513428, "global_step": 24209, "epoch": 144} {"train_loss": -7.192698955535889, "global_step": 24210, "epoch": 144} {"train_loss": -7.158346176147461, "global_step": 24211, "epoch": 144} {"train_loss": -7.523199081420898, "global_step": 24212, "epoch": 144} {"train_loss": -7.400824546813965, "global_step": 24213, "epoch": 144} {"train_loss": -7.130107879638672, "global_step": 24214, "epoch": 144} {"train_loss": -7.328691482543945, "global_step": 24215, "epoch": 144} {"train_loss": -7.072400093078613, "global_step": 24216, "epoch": 144} {"train_loss": -7.336489677429199, "global_step": 24217, "epoch": 144} {"train_loss": -7.249783992767334, "global_step": 24218, "epoch": 144} {"train_loss": -7.136618137359619, "global_step": 24219, "epoch": 144} {"train_loss": -7.257872581481934, "global_step": 24220, "epoch": 144} {"train_loss": -7.2740631103515625, "global_step": 24221, "epoch": 144} {"train_loss": -7.178463935852051, "global_step": 24222, "epoch": 144} {"train_loss": -7.201909065246582, "global_step": 24223, "epoch": 144} {"train_loss": -6.97976541519165, "global_step": 24224, "epoch": 144} {"train_loss": -7.2251996994018555, "global_step": 24225, "epoch": 144} {"train_loss": -7.008461952209473, "global_step": 24226, "epoch": 144} {"train_loss": -7.265194892883301, "global_step": 24227, "epoch": 144} {"train_loss": -7.250329971313477, "global_step": 24228, "epoch": 144} {"train_loss": -7.213976860046387, "global_step": 24229, "epoch": 144} {"train_loss": -7.2899580001831055, "global_step": 24230, "epoch": 144} {"train_loss": -7.151193141937256, "global_step": 24231, "epoch": 144} {"train_loss": -7.228253364562988, "global_step": 24232, "epoch": 144} {"train_loss": -7.40708065032959, "global_step": 24233, "epoch": 144} {"train_loss": -7.316110610961914, "global_step": 24234, "epoch": 144} {"train_loss": -7.160979747772217, "global_step": 24235, "epoch": 144} {"train_loss": -7.119335174560547, "global_step": 24236, "epoch": 144} {"train_loss": -7.061013221740723, "global_step": 24237, "epoch": 144} {"train_loss": -7.158695220947266, "global_step": 24238, "epoch": 144} {"train_loss": -7.104347229003906, "global_step": 24239, "epoch": 144} {"train_loss": -6.628903388977051, "global_step": 24240, "epoch": 144} {"train_loss": -7.025644302368164, "global_step": 24241, "epoch": 144} {"train_loss": -6.880167484283447, "global_step": 24242, "epoch": 144} {"train_loss": -7.222231864929199, "global_step": 24243, "epoch": 144} {"train_loss": -6.84171199798584, "global_step": 24244, "epoch": 144} {"train_loss": -6.914972305297852, "global_step": 24245, "epoch": 144} {"train_loss": -6.909541606903076, "global_step": 24246, "epoch": 144} {"train_loss": -7.181081771850586, "global_step": 24247, "epoch": 144} {"train_loss": -7.0839948654174805, "global_step": 24248, "epoch": 144} {"train_loss": -7.12888765335083, "global_step": 24249, "epoch": 144} {"train_loss": -7.181480884552002, "global_step": 24250, "epoch": 144} {"train_loss": -7.1915388107299805, "global_step": 24251, "epoch": 144} {"train_loss": -7.307975769042969, "global_step": 24252, "epoch": 144} {"train_loss": -6.950356483459473, "global_step": 24253, "epoch": 144} {"train_loss": -7.26637077331543, "global_step": 24254, "epoch": 144} {"train_loss": -6.930020332336426, "global_step": 24255, "epoch": 144} {"train_loss": -7.277412414550781, "global_step": 24256, "epoch": 144} {"train_loss": -7.092219352722168, "global_step": 24257, "epoch": 144} {"train_loss": -7.204290390014648, "global_step": 24258, "epoch": 144} {"train_loss": -7.035619735717773, "global_step": 24259, "epoch": 144} {"train_loss": -7.114246368408203, "global_step": 24260, "epoch": 144} {"train_loss": -7.198815822601318, "global_step": 24261, "epoch": 144} {"train_loss": -7.042619705200195, "global_step": 24262, "epoch": 144} {"train_loss": -7.176095008850098, "global_step": 24263, "epoch": 144} {"train_loss": -7.167531967163086, "global_step": 24264, "epoch": 144} {"train_loss": -7.1313066482543945, "global_step": 24265, "epoch": 144} {"train_loss": -7.251885414123535, "global_step": 24266, "epoch": 144} {"train_loss": -7.169200897216797, "global_step": 24267, "epoch": 144} {"train_loss": -7.107793807983398, "global_step": 24268, "epoch": 144} {"train_loss": -7.125327110290527, "global_step": 24269, "epoch": 144} {"train_loss": -7.152858257293701, "global_step": 24270, "epoch": 144} {"train_loss": -6.826357841491699, "global_step": 24271, "epoch": 144} {"train_loss": -7.176420211791992, "global_step": 24272, "epoch": 144} {"train_loss": -7.288702487945557, "global_step": 24273, "epoch": 144} {"train_loss": -7.208734512329102, "global_step": 24274, "epoch": 144} {"train_loss": -7.2339396476745605, "global_step": 24275, "epoch": 144} {"train_loss": -7.3449859619140625, "global_step": 24276, "epoch": 144} {"train_loss": -7.146267414093018, "global_step": 24277, "epoch": 144} {"train_loss": -6.925343990325928, "global_step": 24278, "epoch": 144} {"train_loss": -7.42676305770874, "global_step": 24279, "epoch": 144} {"train_loss": -6.848575115203857, "global_step": 24280, "epoch": 144} {"train_loss": -7.083669662475586, "global_step": 24281, "epoch": 144} {"train_loss": -7.110528469085693, "global_step": 24282, "epoch": 144} {"train_loss": -7.112943649291992, "global_step": 24283, "epoch": 144} {"train_loss": -7.131882667541504, "global_step": 24284, "epoch": 144} {"train_loss": -6.854869842529297, "global_step": 24285, "epoch": 144} {"train_loss": -6.942582130432129, "global_step": 24286, "epoch": 144} {"train_loss": -6.7736711502075195, "global_step": 24287, "epoch": 144} {"train_loss": -6.942263126373291, "global_step": 24288, "epoch": 144} {"train_loss": -7.071179389953613, "global_step": 24289, "epoch": 144} {"train_loss": -7.116697788238525, "global_step": 24290, "epoch": 144} {"train_loss": -7.018477916717529, "global_step": 24291, "epoch": 144} {"train_loss": -6.87902307510376, "global_step": 24292, "epoch": 144} {"train_loss": -7.199822902679443, "global_step": 24293, "epoch": 144} {"train_loss": -7.124170303344727, "global_step": 24294, "epoch": 144} {"train_loss": -7.263449192047119, "global_step": 24295, "epoch": 144} {"train_loss": -7.1914567947387695, "global_step": 24296, "epoch": 144} {"train_loss": -7.301059722900391, "global_step": 24297, "epoch": 144} {"train_loss": -7.146745204925537, "global_step": 24298, "epoch": 144} {"train_loss": -7.031691074371338, "global_step": 24299, "epoch": 144} {"train_loss": -7.147948741912842, "global_step": 24300, "epoch": 144} {"train_loss": -7.131750106811523, "global_step": 24301, "epoch": 144} {"train_loss": -7.119851589202881, "global_step": 24302, "epoch": 144} {"train_loss": -7.072002410888672, "global_step": 24303, "epoch": 144} {"train_loss": -6.998983860015869, "global_step": 24304, "epoch": 144} {"train_loss": -7.427047252655029, "global_step": 24305, "epoch": 144} {"train_loss": -7.250173568725586, "global_step": 24306, "epoch": 144} {"train_loss": -7.33680534362793, "global_step": 24307, "epoch": 144} {"train_loss": -7.1038408279418945, "global_step": 24308, "epoch": 144} {"train_loss": -7.308459281921387, "global_step": 24309, "epoch": 144} {"train_loss": -7.045698642730713, "global_step": 24310, "epoch": 144} {"train_loss": -7.356373310089111, "global_step": 24311, "epoch": 144} {"train_loss": -7.1319732666015625, "global_step": 24312, "epoch": 144} {"train_loss": -7.339672565460205, "global_step": 24313, "epoch": 144} {"train_loss": -6.812064170837402, "global_step": 24314, "epoch": 144} {"train_loss": -7.224435806274414, "global_step": 24315, "epoch": 144} {"train_loss": -7.408294677734375, "global_step": 24316, "epoch": 144} {"train_loss": -6.962846279144287, "global_step": 24317, "epoch": 144} {"train_loss": -7.106306076049805, "global_step": 24318, "epoch": 144} {"train_loss": -7.07351541519165, "global_step": 24319, "epoch": 144} {"train_loss": -7.087893486022949, "global_step": 24320, "epoch": 144} {"train_loss": -7.1528143882751465, "global_step": 24321, "epoch": 144} {"train_loss": -6.950614929199219, "global_step": 24322, "epoch": 144} {"train_loss": -6.913954734802246, "global_step": 24323, "epoch": 144} {"train_loss": -6.979467868804932, "global_step": 24324, "epoch": 144} {"train_loss": -7.1193013191223145, "global_step": 24325, "epoch": 144} {"train_loss": -6.780070781707764, "global_step": 24326, "epoch": 144} {"train_loss": -6.957019805908203, "global_step": 24327, "epoch": 144} {"train_loss": -6.999876976013184, "global_step": 24328, "epoch": 144} {"train_loss": -7.135756015777588, "global_step": 24329, "epoch": 144} {"train_loss": -7.223257064819336, "global_step": 24330, "epoch": 144} {"train_loss": -6.875555038452148, "global_step": 24331, "epoch": 144} {"train_loss": -6.846502780914307, "global_step": 24332, "epoch": 144} {"train_loss": -6.797910690307617, "global_step": 24333, "epoch": 144} {"train_loss": -7.037491798400879, "global_step": 24334, "epoch": 144} {"train_loss": -7.158030033111572, "global_step": 24335, "epoch": 144} {"train_loss": -7.123453140258789, "global_step": 24336, "epoch": 144} {"train_loss": -7.032319068908691, "global_step": 24337, "epoch": 144} {"train_loss": -7.063191890716553, "global_step": 24338, "epoch": 144} {"train_loss": -7.29105806350708, "global_step": 24339, "epoch": 144} {"train_loss": -7.268185138702393, "global_step": 24340, "epoch": 144} {"train_loss": -7.187509059906006, "global_step": 24341, "epoch": 144} {"train_loss": -7.24445104598999, "global_step": 24342, "epoch": 144} {"train_loss": -7.100529670715332, "global_step": 24343, "epoch": 144} {"train_loss": -6.952011585235596, "global_step": 24344, "epoch": 144} {"train_loss": -7.247762680053711, "global_step": 24345, "epoch": 144} {"train_loss": -7.098053932189941, "global_step": 24346, "epoch": 144} {"train_loss": -7.1502180099487305, "global_step": 24347, "epoch": 144} {"train_loss": -7.278417587280273, "global_step": 24348, "epoch": 144} {"train_loss": -7.3523478507995605, "global_step": 24349, "epoch": 144} {"train_loss": -7.137105464935303, "global_step": 24350, "epoch": 144} {"train_loss": -7.229626178741455, "global_step": 24351, "epoch": 144} {"train_loss": -7.11264181137085, "global_step": 24352, "epoch": 144} {"train_loss": -7.167473793029785, "global_step": 24353, "epoch": 144} {"train_loss": -7.317640781402588, "global_step": 24354, "epoch": 144} {"train_loss": -7.300938606262207, "global_step": 24355, "epoch": 144} {"train_loss": -7.017317771911621, "global_step": 24356, "epoch": 144} {"train_loss": -7.037016868591309, "global_step": 24357, "epoch": 144} {"train_loss": -7.375186920166016, "global_step": 24358, "epoch": 144} {"train_loss": -7.140182963439396, "global_step": 24359, "epoch": 144, "val_loss": 203478.859375} {"train_loss": -7.21223258972168, "global_step": 24360, "epoch": 145} {"train_loss": -7.065478801727295, "global_step": 24361, "epoch": 145} {"train_loss": -7.093376159667969, "global_step": 24362, "epoch": 145} {"train_loss": -7.461489677429199, "global_step": 24363, "epoch": 145} {"train_loss": -7.376828670501709, "global_step": 24364, "epoch": 145} {"train_loss": -7.413958549499512, "global_step": 24365, "epoch": 145} {"train_loss": -7.254623889923096, "global_step": 24366, "epoch": 145} {"train_loss": -7.076067924499512, "global_step": 24367, "epoch": 145} {"train_loss": -7.474721908569336, "global_step": 24368, "epoch": 145} {"train_loss": -7.358150005340576, "global_step": 24369, "epoch": 145} {"train_loss": -7.225946426391602, "global_step": 24370, "epoch": 145} {"train_loss": -7.156478404998779, "global_step": 24371, "epoch": 145} {"train_loss": -7.330171585083008, "global_step": 24372, "epoch": 145} {"train_loss": -7.126370906829834, "global_step": 24373, "epoch": 145} {"train_loss": -7.016529083251953, "global_step": 24374, "epoch": 145} {"train_loss": -7.208065986633301, "global_step": 24375, "epoch": 145} {"train_loss": -7.208410263061523, "global_step": 24376, "epoch": 145} {"train_loss": -7.089197158813477, "global_step": 24377, "epoch": 145} {"train_loss": -7.15483283996582, "global_step": 24378, "epoch": 145} {"train_loss": -7.232269763946533, "global_step": 24379, "epoch": 145} {"train_loss": -7.204631328582764, "global_step": 24380, "epoch": 145} {"train_loss": -7.114774227142334, "global_step": 24381, "epoch": 145} {"train_loss": -6.993434429168701, "global_step": 24382, "epoch": 145} {"train_loss": -7.026692867279053, "global_step": 24383, "epoch": 145} {"train_loss": -7.2565717697143555, "global_step": 24384, "epoch": 145} {"train_loss": -7.301965236663818, "global_step": 24385, "epoch": 145} {"train_loss": -7.092246055603027, "global_step": 24386, "epoch": 145} {"train_loss": -7.137930870056152, "global_step": 24387, "epoch": 145} {"train_loss": -7.181819915771484, "global_step": 24388, "epoch": 145} {"train_loss": -7.16963005065918, "global_step": 24389, "epoch": 145} {"train_loss": -6.634515762329102, "global_step": 24390, "epoch": 145} {"train_loss": -7.120631217956543, "global_step": 24391, "epoch": 145} {"train_loss": -6.897045135498047, "global_step": 24392, "epoch": 145} {"train_loss": -6.879713535308838, "global_step": 24393, "epoch": 145} {"train_loss": -6.945716857910156, "global_step": 24394, "epoch": 145} {"train_loss": -6.979011535644531, "global_step": 24395, "epoch": 145} {"train_loss": -7.121638298034668, "global_step": 24396, "epoch": 145} {"train_loss": -7.0761590003967285, "global_step": 24397, "epoch": 145} {"train_loss": -7.203551292419434, "global_step": 24398, "epoch": 145} {"train_loss": -6.918428421020508, "global_step": 24399, "epoch": 145} {"train_loss": -6.904171466827393, "global_step": 24400, "epoch": 145} {"train_loss": -6.958868026733398, "global_step": 24401, "epoch": 145} {"train_loss": -7.132624626159668, "global_step": 24402, "epoch": 145} {"train_loss": -7.132153034210205, "global_step": 24403, "epoch": 145} {"train_loss": -7.219789505004883, "global_step": 24404, "epoch": 145} {"train_loss": -7.219391822814941, "global_step": 24405, "epoch": 145} {"train_loss": -7.075713157653809, "global_step": 24406, "epoch": 145} {"train_loss": -7.108704090118408, "global_step": 24407, "epoch": 145} {"train_loss": -7.270961761474609, "global_step": 24408, "epoch": 145} {"train_loss": -7.203258991241455, "global_step": 24409, "epoch": 145} {"train_loss": -7.105194091796875, "global_step": 24410, "epoch": 145} {"train_loss": -7.137197017669678, "global_step": 24411, "epoch": 145} {"train_loss": -7.335558891296387, "global_step": 24412, "epoch": 145} {"train_loss": -7.0959954261779785, "global_step": 24413, "epoch": 145} {"train_loss": -6.982807636260986, "global_step": 24414, "epoch": 145} {"train_loss": -7.260431289672852, "global_step": 24415, "epoch": 145} {"train_loss": -7.352232456207275, "global_step": 24416, "epoch": 145} {"train_loss": -7.16590690612793, "global_step": 24417, "epoch": 145} {"train_loss": -7.2138566970825195, "global_step": 24418, "epoch": 145} {"train_loss": -7.230140686035156, "global_step": 24419, "epoch": 145} {"train_loss": -7.0546770095825195, "global_step": 24420, "epoch": 145} {"train_loss": -7.348143577575684, "global_step": 24421, "epoch": 145} {"train_loss": -7.339875221252441, "global_step": 24422, "epoch": 145} {"train_loss": -6.952899932861328, "global_step": 24423, "epoch": 145} {"train_loss": -7.180829048156738, "global_step": 24424, "epoch": 145} {"train_loss": -7.13960075378418, "global_step": 24425, "epoch": 145} {"train_loss": -7.197544097900391, "global_step": 24426, "epoch": 145} {"train_loss": -7.096360206604004, "global_step": 24427, "epoch": 145} {"train_loss": -7.244449615478516, "global_step": 24428, "epoch": 145} {"train_loss": -6.690162658691406, "global_step": 24429, "epoch": 145} {"train_loss": -7.011800765991211, "global_step": 24430, "epoch": 145} {"train_loss": -7.174061298370361, "global_step": 24431, "epoch": 145} {"train_loss": -7.043078422546387, "global_step": 24432, "epoch": 145} {"train_loss": -7.005678653717041, "global_step": 24433, "epoch": 145} {"train_loss": -7.0802507400512695, "global_step": 24434, "epoch": 145} {"train_loss": -7.212962627410889, "global_step": 24435, "epoch": 145} {"train_loss": -7.203418731689453, "global_step": 24436, "epoch": 145} {"train_loss": -7.166059494018555, "global_step": 24437, "epoch": 145} {"train_loss": -6.945621490478516, "global_step": 24438, "epoch": 145} {"train_loss": -7.055778980255127, "global_step": 24439, "epoch": 145} {"train_loss": -7.029372692108154, "global_step": 24440, "epoch": 145} {"train_loss": -7.042539596557617, "global_step": 24441, "epoch": 145} {"train_loss": -7.142522811889648, "global_step": 24442, "epoch": 145} {"train_loss": -6.885855674743652, "global_step": 24443, "epoch": 145} {"train_loss": -7.016220569610596, "global_step": 24444, "epoch": 145} {"train_loss": -7.157718181610107, "global_step": 24445, "epoch": 145} {"train_loss": -7.04571533203125, "global_step": 24446, "epoch": 145} {"train_loss": -7.034858703613281, "global_step": 24447, "epoch": 145} {"train_loss": -7.301050186157227, "global_step": 24448, "epoch": 145} {"train_loss": -6.975588798522949, "global_step": 24449, "epoch": 145} {"train_loss": -7.146355628967285, "global_step": 24450, "epoch": 145} {"train_loss": -7.096277713775635, "global_step": 24451, "epoch": 145} {"train_loss": -7.129620552062988, "global_step": 24452, "epoch": 145} {"train_loss": -7.144589900970459, "global_step": 24453, "epoch": 145} {"train_loss": -7.07401180267334, "global_step": 24454, "epoch": 145} {"train_loss": -7.070125579833984, "global_step": 24455, "epoch": 145} {"train_loss": -6.96854305267334, "global_step": 24456, "epoch": 145} {"train_loss": -7.095467567443848, "global_step": 24457, "epoch": 145} {"train_loss": -7.155940055847168, "global_step": 24458, "epoch": 145} {"train_loss": -6.979434967041016, "global_step": 24459, "epoch": 145} {"train_loss": -7.092440128326416, "global_step": 24460, "epoch": 145} {"train_loss": -6.979867935180664, "global_step": 24461, "epoch": 145} {"train_loss": -7.278051376342773, "global_step": 24462, "epoch": 145} {"train_loss": -6.976097106933594, "global_step": 24463, "epoch": 145} {"train_loss": -7.223339080810547, "global_step": 24464, "epoch": 145} {"train_loss": -7.081204414367676, "global_step": 24465, "epoch": 145} {"train_loss": -7.217413425445557, "global_step": 24466, "epoch": 145} {"train_loss": -7.118181228637695, "global_step": 24467, "epoch": 145} {"train_loss": -7.31158447265625, "global_step": 24468, "epoch": 145} {"train_loss": -7.092933654785156, "global_step": 24469, "epoch": 145} {"train_loss": -7.29484748840332, "global_step": 24470, "epoch": 145} {"train_loss": -7.370259761810303, "global_step": 24471, "epoch": 145} {"train_loss": -7.341759204864502, "global_step": 24472, "epoch": 145} {"train_loss": -7.197748184204102, "global_step": 24473, "epoch": 145} {"train_loss": -7.235811233520508, "global_step": 24474, "epoch": 145} {"train_loss": -7.264771461486816, "global_step": 24475, "epoch": 145} {"train_loss": -6.997215270996094, "global_step": 24476, "epoch": 145} {"train_loss": -7.321831226348877, "global_step": 24477, "epoch": 145} {"train_loss": -7.031898498535156, "global_step": 24478, "epoch": 145} {"train_loss": -7.168041229248047, "global_step": 24479, "epoch": 145} {"train_loss": -6.958022117614746, "global_step": 24480, "epoch": 145} {"train_loss": -7.161147117614746, "global_step": 24481, "epoch": 145} {"train_loss": -7.082437515258789, "global_step": 24482, "epoch": 145} {"train_loss": -6.949418067932129, "global_step": 24483, "epoch": 145} {"train_loss": -6.949174880981445, "global_step": 24484, "epoch": 145} {"train_loss": -6.872544288635254, "global_step": 24485, "epoch": 145} {"train_loss": -7.149386405944824, "global_step": 24486, "epoch": 145} {"train_loss": -6.973599433898926, "global_step": 24487, "epoch": 145} {"train_loss": -6.922669410705566, "global_step": 24488, "epoch": 145} {"train_loss": -7.187631130218506, "global_step": 24489, "epoch": 145} {"train_loss": -6.892816543579102, "global_step": 24490, "epoch": 145} {"train_loss": -7.027990341186523, "global_step": 24491, "epoch": 145} {"train_loss": -7.079588413238525, "global_step": 24492, "epoch": 145} {"train_loss": -7.059678077697754, "global_step": 24493, "epoch": 145} {"train_loss": -7.162378311157227, "global_step": 24494, "epoch": 145} {"train_loss": -6.887333869934082, "global_step": 24495, "epoch": 145} {"train_loss": -7.173091888427734, "global_step": 24496, "epoch": 145} {"train_loss": -6.840221405029297, "global_step": 24497, "epoch": 145} {"train_loss": -7.022524833679199, "global_step": 24498, "epoch": 145} {"train_loss": -6.945376396179199, "global_step": 24499, "epoch": 145} {"train_loss": -7.027947425842285, "global_step": 24500, "epoch": 145} {"train_loss": -6.826021194458008, "global_step": 24501, "epoch": 145} {"train_loss": -6.64564323425293, "global_step": 24502, "epoch": 145} {"train_loss": -7.10169792175293, "global_step": 24503, "epoch": 145} {"train_loss": -6.913027763366699, "global_step": 24504, "epoch": 145} {"train_loss": -7.193688869476318, "global_step": 24505, "epoch": 145} {"train_loss": -6.936455726623535, "global_step": 24506, "epoch": 145} {"train_loss": -6.797618865966797, "global_step": 24507, "epoch": 145} {"train_loss": -7.129486083984375, "global_step": 24508, "epoch": 145} {"train_loss": -6.814756393432617, "global_step": 24509, "epoch": 145} {"train_loss": -7.20517110824585, "global_step": 24510, "epoch": 145} {"train_loss": -6.919556617736816, "global_step": 24511, "epoch": 145} {"train_loss": -7.032573699951172, "global_step": 24512, "epoch": 145} {"train_loss": -7.144631385803223, "global_step": 24513, "epoch": 145} {"train_loss": -6.886902809143066, "global_step": 24514, "epoch": 145} {"train_loss": -7.137923717498779, "global_step": 24515, "epoch": 145} {"train_loss": -7.029079914093018, "global_step": 24516, "epoch": 145} {"train_loss": -6.920637130737305, "global_step": 24517, "epoch": 145} {"train_loss": -6.8339643478393555, "global_step": 24518, "epoch": 145} {"train_loss": -6.9183502197265625, "global_step": 24519, "epoch": 145} {"train_loss": -6.944547653198242, "global_step": 24520, "epoch": 145} {"train_loss": -6.741019248962402, "global_step": 24521, "epoch": 145} {"train_loss": -7.160757064819336, "global_step": 24522, "epoch": 145} {"train_loss": -6.773253917694092, "global_step": 24523, "epoch": 145} {"train_loss": -6.873745441436768, "global_step": 24524, "epoch": 145} {"train_loss": -6.8788275718688965, "global_step": 24525, "epoch": 145} {"train_loss": -7.007995128631592, "global_step": 24526, "epoch": 145} {"train_loss": -7.089205239500318, "global_step": 24527, "epoch": 145, "val_loss": 209331.96875, "train_action_mse_error": 13.110509872436523} {"train_loss": -6.638376235961914, "global_step": 24528, "epoch": 146} {"train_loss": -6.842922210693359, "global_step": 24529, "epoch": 146} {"train_loss": -6.892876625061035, "global_step": 24530, "epoch": 146} {"train_loss": -6.961352348327637, "global_step": 24531, "epoch": 146} {"train_loss": -6.9223198890686035, "global_step": 24532, "epoch": 146} {"train_loss": -6.8885908126831055, "global_step": 24533, "epoch": 146} {"train_loss": -7.021764755249023, "global_step": 24534, "epoch": 146} {"train_loss": -7.119421482086182, "global_step": 24535, "epoch": 146} {"train_loss": -6.9806108474731445, "global_step": 24536, "epoch": 146} {"train_loss": -6.873465538024902, "global_step": 24537, "epoch": 146} {"train_loss": -6.852748394012451, "global_step": 24538, "epoch": 146} {"train_loss": -7.153878211975098, "global_step": 24539, "epoch": 146} {"train_loss": -7.382585525512695, "global_step": 24540, "epoch": 146} {"train_loss": -7.002266883850098, "global_step": 24541, "epoch": 146} {"train_loss": -7.240522384643555, "global_step": 24542, "epoch": 146} {"train_loss": -7.148497581481934, "global_step": 24543, "epoch": 146} {"train_loss": -7.093871116638184, "global_step": 24544, "epoch": 146} {"train_loss": -7.2128071784973145, "global_step": 24545, "epoch": 146} {"train_loss": -7.2831292152404785, "global_step": 24546, "epoch": 146} {"train_loss": -7.2021989822387695, "global_step": 24547, "epoch": 146} {"train_loss": -7.082898139953613, "global_step": 24548, "epoch": 146} {"train_loss": -7.191701889038086, "global_step": 24549, "epoch": 146} {"train_loss": -7.002678394317627, "global_step": 24550, "epoch": 146} {"train_loss": -7.206159591674805, "global_step": 24551, "epoch": 146} {"train_loss": -7.422484397888184, "global_step": 24552, "epoch": 146} {"train_loss": -7.1003923416137695, "global_step": 24553, "epoch": 146} {"train_loss": -7.125679969787598, "global_step": 24554, "epoch": 146} {"train_loss": -7.343099594116211, "global_step": 24555, "epoch": 146} {"train_loss": -7.069762706756592, "global_step": 24556, "epoch": 146} {"train_loss": -7.204806327819824, "global_step": 24557, "epoch": 146} {"train_loss": -7.225889205932617, "global_step": 24558, "epoch": 146} {"train_loss": -7.0785298347473145, "global_step": 24559, "epoch": 146} {"train_loss": -7.079929828643799, "global_step": 24560, "epoch": 146} {"train_loss": -7.364885330200195, "global_step": 24561, "epoch": 146} {"train_loss": -6.995116233825684, "global_step": 24562, "epoch": 146} {"train_loss": -7.243188858032227, "global_step": 24563, "epoch": 146} {"train_loss": -7.368931293487549, "global_step": 24564, "epoch": 146} {"train_loss": -7.137508869171143, "global_step": 24565, "epoch": 146} {"train_loss": -7.254118919372559, "global_step": 24566, "epoch": 146} {"train_loss": -7.195276260375977, "global_step": 24567, "epoch": 146} {"train_loss": -6.952462673187256, "global_step": 24568, "epoch": 146} {"train_loss": -7.327054500579834, "global_step": 24569, "epoch": 146} {"train_loss": -7.009552001953125, "global_step": 24570, "epoch": 146} {"train_loss": -7.324154376983643, "global_step": 24571, "epoch": 146} {"train_loss": -7.047092437744141, "global_step": 24572, "epoch": 146} {"train_loss": -6.991265296936035, "global_step": 24573, "epoch": 146} {"train_loss": -7.142551422119141, "global_step": 24574, "epoch": 146} {"train_loss": -7.136222839355469, "global_step": 24575, "epoch": 146} {"train_loss": -7.271300315856934, "global_step": 24576, "epoch": 146} {"train_loss": -6.969758987426758, "global_step": 24577, "epoch": 146} {"train_loss": -7.223717212677002, "global_step": 24578, "epoch": 146} {"train_loss": -7.011228561401367, "global_step": 24579, "epoch": 146} {"train_loss": -7.343920707702637, "global_step": 24580, "epoch": 146} {"train_loss": -7.238694190979004, "global_step": 24581, "epoch": 146} {"train_loss": -7.024186134338379, "global_step": 24582, "epoch": 146} {"train_loss": -7.348109245300293, "global_step": 24583, "epoch": 146} {"train_loss": -7.041048526763916, "global_step": 24584, "epoch": 146} {"train_loss": -7.382655143737793, "global_step": 24585, "epoch": 146} {"train_loss": -7.288787364959717, "global_step": 24586, "epoch": 146} {"train_loss": -7.157118797302246, "global_step": 24587, "epoch": 146} {"train_loss": -7.454204559326172, "global_step": 24588, "epoch": 146} {"train_loss": -7.188619136810303, "global_step": 24589, "epoch": 146} {"train_loss": -7.0825347900390625, "global_step": 24590, "epoch": 146} {"train_loss": -7.319473743438721, "global_step": 24591, "epoch": 146} {"train_loss": -7.009664535522461, "global_step": 24592, "epoch": 146} {"train_loss": -7.168582439422607, "global_step": 24593, "epoch": 146} {"train_loss": -7.033563613891602, "global_step": 24594, "epoch": 146} {"train_loss": -7.155707359313965, "global_step": 24595, "epoch": 146} {"train_loss": -6.868592739105225, "global_step": 24596, "epoch": 146} {"train_loss": -7.225854873657227, "global_step": 24597, "epoch": 146} {"train_loss": -7.085024833679199, "global_step": 24598, "epoch": 146} {"train_loss": -7.073884010314941, "global_step": 24599, "epoch": 146} {"train_loss": -7.078577995300293, "global_step": 24600, "epoch": 146} {"train_loss": -7.005949020385742, "global_step": 24601, "epoch": 146} {"train_loss": -7.038529396057129, "global_step": 24602, "epoch": 146} {"train_loss": -7.315711975097656, "global_step": 24603, "epoch": 146} {"train_loss": -7.020049095153809, "global_step": 24604, "epoch": 146} {"train_loss": -7.098817825317383, "global_step": 24605, "epoch": 146} {"train_loss": -7.018617630004883, "global_step": 24606, "epoch": 146} {"train_loss": -7.169810771942139, "global_step": 24607, "epoch": 146} {"train_loss": -7.108293056488037, "global_step": 24608, "epoch": 146} {"train_loss": -7.316742897033691, "global_step": 24609, "epoch": 146} {"train_loss": -7.233439922332764, "global_step": 24610, "epoch": 146} {"train_loss": -7.377234935760498, "global_step": 24611, "epoch": 146} {"train_loss": -7.210912227630615, "global_step": 24612, "epoch": 146} {"train_loss": -7.0528564453125, "global_step": 24613, "epoch": 146} {"train_loss": -7.146921634674072, "global_step": 24614, "epoch": 146} {"train_loss": -7.127285480499268, "global_step": 24615, "epoch": 146} {"train_loss": -7.33372688293457, "global_step": 24616, "epoch": 146} {"train_loss": -7.328325271606445, "global_step": 24617, "epoch": 146} {"train_loss": -7.153406143188477, "global_step": 24618, "epoch": 146} {"train_loss": -7.016748905181885, "global_step": 24619, "epoch": 146} {"train_loss": -7.083104133605957, "global_step": 24620, "epoch": 146} {"train_loss": -7.376810550689697, "global_step": 24621, "epoch": 146} {"train_loss": -6.966846466064453, "global_step": 24622, "epoch": 146} {"train_loss": -7.16171932220459, "global_step": 24623, "epoch": 146} {"train_loss": -6.878700256347656, "global_step": 24624, "epoch": 146} {"train_loss": -7.250948429107666, "global_step": 24625, "epoch": 146} {"train_loss": -7.069780349731445, "global_step": 24626, "epoch": 146} {"train_loss": -7.0179643630981445, "global_step": 24627, "epoch": 146} {"train_loss": -6.879904270172119, "global_step": 24628, "epoch": 146} {"train_loss": -6.963366985321045, "global_step": 24629, "epoch": 146} {"train_loss": -7.158192157745361, "global_step": 24630, "epoch": 146} {"train_loss": -6.7725372314453125, "global_step": 24631, "epoch": 146} {"train_loss": -7.24642276763916, "global_step": 24632, "epoch": 146} {"train_loss": -7.165463924407959, "global_step": 24633, "epoch": 146} {"train_loss": -7.411012649536133, "global_step": 24634, "epoch": 146} {"train_loss": -7.28131103515625, "global_step": 24635, "epoch": 146} {"train_loss": -7.143301486968994, "global_step": 24636, "epoch": 146} {"train_loss": -7.485742568969727, "global_step": 24637, "epoch": 146} {"train_loss": -7.2833476066589355, "global_step": 24638, "epoch": 146} {"train_loss": -7.0570478439331055, "global_step": 24639, "epoch": 146} {"train_loss": -7.2968220710754395, "global_step": 24640, "epoch": 146} {"train_loss": -7.135527610778809, "global_step": 24641, "epoch": 146} {"train_loss": -7.226268291473389, "global_step": 24642, "epoch": 146} {"train_loss": -7.189059257507324, "global_step": 24643, "epoch": 146} {"train_loss": -7.300663948059082, "global_step": 24644, "epoch": 146} {"train_loss": -7.203391075134277, "global_step": 24645, "epoch": 146} {"train_loss": -7.206604480743408, "global_step": 24646, "epoch": 146} {"train_loss": -7.067389965057373, "global_step": 24647, "epoch": 146} {"train_loss": -7.294099807739258, "global_step": 24648, "epoch": 146} {"train_loss": -6.8775787353515625, "global_step": 24649, "epoch": 146} {"train_loss": -7.318482398986816, "global_step": 24650, "epoch": 146} {"train_loss": -7.016025066375732, "global_step": 24651, "epoch": 146} {"train_loss": -7.187290191650391, "global_step": 24652, "epoch": 146} {"train_loss": -7.225743293762207, "global_step": 24653, "epoch": 146} {"train_loss": -7.374405860900879, "global_step": 24654, "epoch": 146} {"train_loss": -7.183284282684326, "global_step": 24655, "epoch": 146} {"train_loss": -7.416027545928955, "global_step": 24656, "epoch": 146} {"train_loss": -7.061404228210449, "global_step": 24657, "epoch": 146} {"train_loss": -7.231102466583252, "global_step": 24658, "epoch": 146} {"train_loss": -7.232461929321289, "global_step": 24659, "epoch": 146} {"train_loss": -7.292344570159912, "global_step": 24660, "epoch": 146} {"train_loss": -6.9463114738464355, "global_step": 24661, "epoch": 146} {"train_loss": -7.002444267272949, "global_step": 24662, "epoch": 146} {"train_loss": -6.952217102050781, "global_step": 24663, "epoch": 146} {"train_loss": -6.939770698547363, "global_step": 24664, "epoch": 146} {"train_loss": -7.028554916381836, "global_step": 24665, "epoch": 146} {"train_loss": -7.0578389167785645, "global_step": 24666, "epoch": 146} {"train_loss": -7.023556709289551, "global_step": 24667, "epoch": 146} {"train_loss": -6.886610984802246, "global_step": 24668, "epoch": 146} {"train_loss": -6.878370761871338, "global_step": 24669, "epoch": 146} {"train_loss": -6.9972381591796875, "global_step": 24670, "epoch": 146} {"train_loss": -7.076262950897217, "global_step": 24671, "epoch": 146} {"train_loss": -7.272643566131592, "global_step": 24672, "epoch": 146} {"train_loss": -6.805916786193848, "global_step": 24673, "epoch": 146} {"train_loss": -6.989904403686523, "global_step": 24674, "epoch": 146} {"train_loss": -7.100686550140381, "global_step": 24675, "epoch": 146} {"train_loss": -6.8907999992370605, "global_step": 24676, "epoch": 146} {"train_loss": -6.984580993652344, "global_step": 24677, "epoch": 146} {"train_loss": -6.896442413330078, "global_step": 24678, "epoch": 146} {"train_loss": -7.202312469482422, "global_step": 24679, "epoch": 146} {"train_loss": -7.104496002197266, "global_step": 24680, "epoch": 146} {"train_loss": -6.954412937164307, "global_step": 24681, "epoch": 146} {"train_loss": -7.240259647369385, "global_step": 24682, "epoch": 146} {"train_loss": -6.909898281097412, "global_step": 24683, "epoch": 146} {"train_loss": -7.278295040130615, "global_step": 24684, "epoch": 146} {"train_loss": -6.908324718475342, "global_step": 24685, "epoch": 146} {"train_loss": -7.076371192932129, "global_step": 24686, "epoch": 146} {"train_loss": -7.185778617858887, "global_step": 24687, "epoch": 146} {"train_loss": -6.970761775970459, "global_step": 24688, "epoch": 146} {"train_loss": -7.1506452560424805, "global_step": 24689, "epoch": 146} {"train_loss": -7.084236145019531, "global_step": 24690, "epoch": 146} {"train_loss": -7.141480445861816, "global_step": 24691, "epoch": 146} {"train_loss": -7.325399875640869, "global_step": 24692, "epoch": 146} {"train_loss": -7.115983486175537, "global_step": 24693, "epoch": 146} {"train_loss": -7.197204113006592, "global_step": 24694, "epoch": 146} {"train_loss": -7.127445547353654, "global_step": 24695, "epoch": 146, "val_loss": 200626.40625} {"train_loss": -7.1176581382751465, "global_step": 24696, "epoch": 147} {"train_loss": -7.1992669105529785, "global_step": 24697, "epoch": 147} {"train_loss": -7.303503513336182, "global_step": 24698, "epoch": 147} {"train_loss": -7.05806827545166, "global_step": 24699, "epoch": 147} {"train_loss": -7.100845813751221, "global_step": 24700, "epoch": 147} {"train_loss": -7.124368667602539, "global_step": 24701, "epoch": 147} {"train_loss": -7.200523376464844, "global_step": 24702, "epoch": 147} {"train_loss": -7.131531715393066, "global_step": 24703, "epoch": 147} {"train_loss": -6.990483283996582, "global_step": 24704, "epoch": 147} {"train_loss": -7.139413833618164, "global_step": 24705, "epoch": 147} {"train_loss": -6.993798732757568, "global_step": 24706, "epoch": 147} {"train_loss": -7.301982879638672, "global_step": 24707, "epoch": 147} {"train_loss": -7.514869689941406, "global_step": 24708, "epoch": 147} {"train_loss": -7.116089820861816, "global_step": 24709, "epoch": 147} {"train_loss": -7.304706573486328, "global_step": 24710, "epoch": 147} {"train_loss": -6.924582481384277, "global_step": 24711, "epoch": 147} {"train_loss": -6.9723405838012695, "global_step": 24712, "epoch": 147} {"train_loss": -7.368175983428955, "global_step": 24713, "epoch": 147} {"train_loss": -7.192403793334961, "global_step": 24714, "epoch": 147} {"train_loss": -7.004775524139404, "global_step": 24715, "epoch": 147} {"train_loss": -7.187536239624023, "global_step": 24716, "epoch": 147} {"train_loss": -7.080018997192383, "global_step": 24717, "epoch": 147} {"train_loss": -7.131028175354004, "global_step": 24718, "epoch": 147} {"train_loss": -7.161637783050537, "global_step": 24719, "epoch": 147} {"train_loss": -7.0887861251831055, "global_step": 24720, "epoch": 147} {"train_loss": -7.215633392333984, "global_step": 24721, "epoch": 147} {"train_loss": -7.173947334289551, "global_step": 24722, "epoch": 147} {"train_loss": -7.13893461227417, "global_step": 24723, "epoch": 147} {"train_loss": -6.960111618041992, "global_step": 24724, "epoch": 147} {"train_loss": -7.07154655456543, "global_step": 24725, "epoch": 147} {"train_loss": -7.296286582946777, "global_step": 24726, "epoch": 147} {"train_loss": -7.081376075744629, "global_step": 24727, "epoch": 147} {"train_loss": -7.277238368988037, "global_step": 24728, "epoch": 147} {"train_loss": -7.195402145385742, "global_step": 24729, "epoch": 147} {"train_loss": -7.0838751792907715, "global_step": 24730, "epoch": 147} {"train_loss": -7.437068939208984, "global_step": 24731, "epoch": 147} {"train_loss": -7.208364486694336, "global_step": 24732, "epoch": 147} {"train_loss": -7.172783851623535, "global_step": 24733, "epoch": 147} {"train_loss": -7.1089982986450195, "global_step": 24734, "epoch": 147} {"train_loss": -7.167471885681152, "global_step": 24735, "epoch": 147} {"train_loss": -7.336289405822754, "global_step": 24736, "epoch": 147} {"train_loss": -7.2064409255981445, "global_step": 24737, "epoch": 147} {"train_loss": -7.0427656173706055, "global_step": 24738, "epoch": 147} {"train_loss": -7.349365711212158, "global_step": 24739, "epoch": 147} {"train_loss": -7.24964714050293, "global_step": 24740, "epoch": 147} {"train_loss": -7.242222785949707, "global_step": 24741, "epoch": 147} {"train_loss": -7.469479084014893, "global_step": 24742, "epoch": 147} {"train_loss": -7.026977062225342, "global_step": 24743, "epoch": 147} {"train_loss": -7.030991077423096, "global_step": 24744, "epoch": 147} {"train_loss": -6.993380546569824, "global_step": 24745, "epoch": 147} {"train_loss": -6.976329803466797, "global_step": 24746, "epoch": 147} {"train_loss": -7.214849472045898, "global_step": 24747, "epoch": 147} {"train_loss": -7.089095115661621, "global_step": 24748, "epoch": 147} {"train_loss": -6.871436595916748, "global_step": 24749, "epoch": 147} {"train_loss": -7.148868560791016, "global_step": 24750, "epoch": 147} {"train_loss": -7.060225963592529, "global_step": 24751, "epoch": 147} {"train_loss": -7.052347660064697, "global_step": 24752, "epoch": 147} {"train_loss": -7.009685516357422, "global_step": 24753, "epoch": 147} {"train_loss": -7.102540969848633, "global_step": 24754, "epoch": 147} {"train_loss": -6.980696678161621, "global_step": 24755, "epoch": 147} {"train_loss": -7.258631706237793, "global_step": 24756, "epoch": 147} {"train_loss": -6.781769275665283, "global_step": 24757, "epoch": 147} {"train_loss": -6.997825622558594, "global_step": 24758, "epoch": 147} {"train_loss": -6.820472717285156, "global_step": 24759, "epoch": 147} {"train_loss": -7.027839183807373, "global_step": 24760, "epoch": 147} {"train_loss": -7.193750381469727, "global_step": 24761, "epoch": 147} {"train_loss": -7.010840892791748, "global_step": 24762, "epoch": 147} {"train_loss": -7.011743545532227, "global_step": 24763, "epoch": 147} {"train_loss": -6.9170918464660645, "global_step": 24764, "epoch": 147} {"train_loss": -7.1361870765686035, "global_step": 24765, "epoch": 147} {"train_loss": -7.124207019805908, "global_step": 24766, "epoch": 147} {"train_loss": -7.034626007080078, "global_step": 24767, "epoch": 147} {"train_loss": -7.061493873596191, "global_step": 24768, "epoch": 147} {"train_loss": -7.200480937957764, "global_step": 24769, "epoch": 147} {"train_loss": -7.035923004150391, "global_step": 24770, "epoch": 147} {"train_loss": -7.111284255981445, "global_step": 24771, "epoch": 147} {"train_loss": -6.694841384887695, "global_step": 24772, "epoch": 147} {"train_loss": -7.044100284576416, "global_step": 24773, "epoch": 147} {"train_loss": -6.992153167724609, "global_step": 24774, "epoch": 147} {"train_loss": -6.985813140869141, "global_step": 24775, "epoch": 147} {"train_loss": -7.220403671264648, "global_step": 24776, "epoch": 147} {"train_loss": -6.835927486419678, "global_step": 24777, "epoch": 147} {"train_loss": -6.947798728942871, "global_step": 24778, "epoch": 147} {"train_loss": -7.012641906738281, "global_step": 24779, "epoch": 147} {"train_loss": -6.877649307250977, "global_step": 24780, "epoch": 147} {"train_loss": -7.033891677856445, "global_step": 24781, "epoch": 147} {"train_loss": -7.025529861450195, "global_step": 24782, "epoch": 147} {"train_loss": -6.9667134284973145, "global_step": 24783, "epoch": 147} {"train_loss": -7.151357173919678, "global_step": 24784, "epoch": 147} {"train_loss": -7.014655590057373, "global_step": 24785, "epoch": 147} {"train_loss": -7.240045547485352, "global_step": 24786, "epoch": 147} {"train_loss": -7.184072017669678, "global_step": 24787, "epoch": 147} {"train_loss": -6.936470031738281, "global_step": 24788, "epoch": 147} {"train_loss": -7.213327884674072, "global_step": 24789, "epoch": 147} {"train_loss": -7.179167747497559, "global_step": 24790, "epoch": 147} {"train_loss": -7.058069229125977, "global_step": 24791, "epoch": 147} {"train_loss": -7.1453657150268555, "global_step": 24792, "epoch": 147} {"train_loss": -6.865666389465332, "global_step": 24793, "epoch": 147} {"train_loss": -6.977163314819336, "global_step": 24794, "epoch": 147} {"train_loss": -6.8873724937438965, "global_step": 24795, "epoch": 147} {"train_loss": -6.993013381958008, "global_step": 24796, "epoch": 147} {"train_loss": -7.288392543792725, "global_step": 24797, "epoch": 147} {"train_loss": -7.100275039672852, "global_step": 24798, "epoch": 147} {"train_loss": -7.258579254150391, "global_step": 24799, "epoch": 147} {"train_loss": -6.6771345138549805, "global_step": 24800, "epoch": 147} {"train_loss": -6.94727897644043, "global_step": 24801, "epoch": 147} {"train_loss": -7.250742435455322, "global_step": 24802, "epoch": 147} {"train_loss": -7.053524971008301, "global_step": 24803, "epoch": 147} {"train_loss": -7.151061058044434, "global_step": 24804, "epoch": 147} {"train_loss": -7.175861358642578, "global_step": 24805, "epoch": 147} {"train_loss": -7.248390197753906, "global_step": 24806, "epoch": 147} {"train_loss": -7.0870161056518555, "global_step": 24807, "epoch": 147} {"train_loss": -7.171676158905029, "global_step": 24808, "epoch": 147} {"train_loss": -7.20390510559082, "global_step": 24809, "epoch": 147} {"train_loss": -7.213155746459961, "global_step": 24810, "epoch": 147} {"train_loss": -7.1835222244262695, "global_step": 24811, "epoch": 147} {"train_loss": -7.388795375823975, "global_step": 24812, "epoch": 147} {"train_loss": -7.272170543670654, "global_step": 24813, "epoch": 147} {"train_loss": -7.168911933898926, "global_step": 24814, "epoch": 147} {"train_loss": -7.260931015014648, "global_step": 24815, "epoch": 147} {"train_loss": -7.153715133666992, "global_step": 24816, "epoch": 147} {"train_loss": -7.322043418884277, "global_step": 24817, "epoch": 147} {"train_loss": -7.1471357345581055, "global_step": 24818, "epoch": 147} {"train_loss": -7.1788787841796875, "global_step": 24819, "epoch": 147} {"train_loss": -7.157893180847168, "global_step": 24820, "epoch": 147} {"train_loss": -7.262368679046631, "global_step": 24821, "epoch": 147} {"train_loss": -7.052411079406738, "global_step": 24822, "epoch": 147} {"train_loss": -7.277387619018555, "global_step": 24823, "epoch": 147} {"train_loss": -7.154667377471924, "global_step": 24824, "epoch": 147} {"train_loss": -7.02449893951416, "global_step": 24825, "epoch": 147} {"train_loss": -7.307005405426025, "global_step": 24826, "epoch": 147} {"train_loss": -7.2418951988220215, "global_step": 24827, "epoch": 147} {"train_loss": -7.261620998382568, "global_step": 24828, "epoch": 147} {"train_loss": -7.498716354370117, "global_step": 24829, "epoch": 147} {"train_loss": -7.002635478973389, "global_step": 24830, "epoch": 147} {"train_loss": -7.1723432540893555, "global_step": 24831, "epoch": 147} {"train_loss": -7.1788835525512695, "global_step": 24832, "epoch": 147} {"train_loss": -7.21005392074585, "global_step": 24833, "epoch": 147} {"train_loss": -7.021913528442383, "global_step": 24834, "epoch": 147} {"train_loss": -7.256880283355713, "global_step": 24835, "epoch": 147} {"train_loss": -7.257794380187988, "global_step": 24836, "epoch": 147} {"train_loss": -7.229077339172363, "global_step": 24837, "epoch": 147} {"train_loss": -7.063337802886963, "global_step": 24838, "epoch": 147} {"train_loss": -7.2682600021362305, "global_step": 24839, "epoch": 147} {"train_loss": -7.171459674835205, "global_step": 24840, "epoch": 147} {"train_loss": -7.171286106109619, "global_step": 24841, "epoch": 147} {"train_loss": -7.21073055267334, "global_step": 24842, "epoch": 147} {"train_loss": -7.100895881652832, "global_step": 24843, "epoch": 147} {"train_loss": -7.10221529006958, "global_step": 24844, "epoch": 147} {"train_loss": -7.376813888549805, "global_step": 24845, "epoch": 147} {"train_loss": -7.182718276977539, "global_step": 24846, "epoch": 147} {"train_loss": -7.139578342437744, "global_step": 24847, "epoch": 147} {"train_loss": -7.245500087738037, "global_step": 24848, "epoch": 147} {"train_loss": -7.107240676879883, "global_step": 24849, "epoch": 147} {"train_loss": -7.04407262802124, "global_step": 24850, "epoch": 147} {"train_loss": -7.188458442687988, "global_step": 24851, "epoch": 147} {"train_loss": -7.2916059494018555, "global_step": 24852, "epoch": 147} {"train_loss": -7.105375289916992, "global_step": 24853, "epoch": 147} {"train_loss": -7.120441436767578, "global_step": 24854, "epoch": 147} {"train_loss": -7.287631034851074, "global_step": 24855, "epoch": 147} {"train_loss": -7.273445129394531, "global_step": 24856, "epoch": 147} {"train_loss": -7.2935638427734375, "global_step": 24857, "epoch": 147} {"train_loss": -7.299258232116699, "global_step": 24858, "epoch": 147} {"train_loss": -7.138898849487305, "global_step": 24859, "epoch": 147} {"train_loss": -7.103195667266846, "global_step": 24860, "epoch": 147} {"train_loss": -7.024815559387207, "global_step": 24861, "epoch": 147} {"train_loss": -7.235362529754639, "global_step": 24862, "epoch": 147} {"train_loss": -7.1314893166224165, "global_step": 24863, "epoch": 147, "val_loss": 199045.1875} {"train_loss": -7.079684257507324, "global_step": 24864, "epoch": 148} {"train_loss": -7.247984886169434, "global_step": 24865, "epoch": 148} {"train_loss": -7.033242702484131, "global_step": 24866, "epoch": 148} {"train_loss": -7.001699447631836, "global_step": 24867, "epoch": 148} {"train_loss": -7.036291599273682, "global_step": 24868, "epoch": 148} {"train_loss": -7.319552898406982, "global_step": 24869, "epoch": 148} {"train_loss": -7.050139427185059, "global_step": 24870, "epoch": 148} {"train_loss": -7.191535472869873, "global_step": 24871, "epoch": 148} {"train_loss": -6.902776718139648, "global_step": 24872, "epoch": 148} {"train_loss": -6.960996627807617, "global_step": 24873, "epoch": 148} {"train_loss": -6.801933765411377, "global_step": 24874, "epoch": 148} {"train_loss": -7.082066535949707, "global_step": 24875, "epoch": 148} {"train_loss": -6.83220100402832, "global_step": 24876, "epoch": 148} {"train_loss": -7.059608459472656, "global_step": 24877, "epoch": 148} {"train_loss": -6.928008556365967, "global_step": 24878, "epoch": 148} {"train_loss": -6.911520957946777, "global_step": 24879, "epoch": 148} {"train_loss": -7.01982307434082, "global_step": 24880, "epoch": 148} {"train_loss": -6.90025520324707, "global_step": 24881, "epoch": 148} {"train_loss": -7.18966007232666, "global_step": 24882, "epoch": 148} {"train_loss": -7.0890960693359375, "global_step": 24883, "epoch": 148} {"train_loss": -7.257735252380371, "global_step": 24884, "epoch": 148} {"train_loss": -7.044168472290039, "global_step": 24885, "epoch": 148} {"train_loss": -7.207344055175781, "global_step": 24886, "epoch": 148} {"train_loss": -6.9810709953308105, "global_step": 24887, "epoch": 148} {"train_loss": -6.972253799438477, "global_step": 24888, "epoch": 148} {"train_loss": -6.957202434539795, "global_step": 24889, "epoch": 148} {"train_loss": -7.027565002441406, "global_step": 24890, "epoch": 148} {"train_loss": -7.341521739959717, "global_step": 24891, "epoch": 148} {"train_loss": -6.90289831161499, "global_step": 24892, "epoch": 148} {"train_loss": -7.0609283447265625, "global_step": 24893, "epoch": 148} {"train_loss": -7.193629264831543, "global_step": 24894, "epoch": 148} {"train_loss": -7.245617389678955, "global_step": 24895, "epoch": 148} {"train_loss": -7.284983158111572, "global_step": 24896, "epoch": 148} {"train_loss": -7.021437644958496, "global_step": 24897, "epoch": 148} {"train_loss": -7.40052604675293, "global_step": 24898, "epoch": 148} {"train_loss": -7.360583305358887, "global_step": 24899, "epoch": 148} {"train_loss": -7.202338695526123, "global_step": 24900, "epoch": 148} {"train_loss": -7.176504611968994, "global_step": 24901, "epoch": 148} {"train_loss": -7.156134605407715, "global_step": 24902, "epoch": 148} {"train_loss": -7.2967023849487305, "global_step": 24903, "epoch": 148} {"train_loss": -7.088916778564453, "global_step": 24904, "epoch": 148} {"train_loss": -7.057819843292236, "global_step": 24905, "epoch": 148} {"train_loss": -7.004155158996582, "global_step": 24906, "epoch": 148} {"train_loss": -7.216869354248047, "global_step": 24907, "epoch": 148} {"train_loss": -7.032299041748047, "global_step": 24908, "epoch": 148} {"train_loss": -7.376132965087891, "global_step": 24909, "epoch": 148} {"train_loss": -6.989912033081055, "global_step": 24910, "epoch": 148} {"train_loss": -7.242923736572266, "global_step": 24911, "epoch": 148} {"train_loss": -7.0671467781066895, "global_step": 24912, "epoch": 148} {"train_loss": -6.982505798339844, "global_step": 24913, "epoch": 148} {"train_loss": -6.9816131591796875, "global_step": 24914, "epoch": 148} {"train_loss": -6.907292366027832, "global_step": 24915, "epoch": 148} {"train_loss": -6.770443439483643, "global_step": 24916, "epoch": 148} {"train_loss": -6.885372161865234, "global_step": 24917, "epoch": 148} {"train_loss": -6.697262287139893, "global_step": 24918, "epoch": 148} {"train_loss": -7.089678764343262, "global_step": 24919, "epoch": 148} {"train_loss": -7.099889755249023, "global_step": 24920, "epoch": 148} {"train_loss": -6.997003078460693, "global_step": 24921, "epoch": 148} {"train_loss": -7.126861095428467, "global_step": 24922, "epoch": 148} {"train_loss": -6.8978729248046875, "global_step": 24923, "epoch": 148} {"train_loss": -6.886969566345215, "global_step": 24924, "epoch": 148} {"train_loss": -7.108456611633301, "global_step": 24925, "epoch": 148} {"train_loss": -6.8110809326171875, "global_step": 24926, "epoch": 148} {"train_loss": -6.853758335113525, "global_step": 24927, "epoch": 148} {"train_loss": -7.069514751434326, "global_step": 24928, "epoch": 148} {"train_loss": -7.182241439819336, "global_step": 24929, "epoch": 148} {"train_loss": -6.896823883056641, "global_step": 24930, "epoch": 148} {"train_loss": -7.120760440826416, "global_step": 24931, "epoch": 148} {"train_loss": -6.986921787261963, "global_step": 24932, "epoch": 148} {"train_loss": -6.918122291564941, "global_step": 24933, "epoch": 148} {"train_loss": -7.124425888061523, "global_step": 24934, "epoch": 148} {"train_loss": -7.06342887878418, "global_step": 24935, "epoch": 148} {"train_loss": -7.116559982299805, "global_step": 24936, "epoch": 148} {"train_loss": -6.875246047973633, "global_step": 24937, "epoch": 148} {"train_loss": -6.986430644989014, "global_step": 24938, "epoch": 148} {"train_loss": -7.20216178894043, "global_step": 24939, "epoch": 148} {"train_loss": -7.0980610847473145, "global_step": 24940, "epoch": 148} {"train_loss": -7.333719730377197, "global_step": 24941, "epoch": 148} {"train_loss": -7.242001533508301, "global_step": 24942, "epoch": 148} {"train_loss": -7.115033149719238, "global_step": 24943, "epoch": 148} {"train_loss": -6.904977798461914, "global_step": 24944, "epoch": 148} {"train_loss": -7.008367538452148, "global_step": 24945, "epoch": 148} {"train_loss": -7.203683853149414, "global_step": 24946, "epoch": 148} {"train_loss": -7.25818395614624, "global_step": 24947, "epoch": 148} {"train_loss": -7.138694763183594, "global_step": 24948, "epoch": 148} {"train_loss": -7.279522895812988, "global_step": 24949, "epoch": 148} {"train_loss": -7.22731876373291, "global_step": 24950, "epoch": 148} {"train_loss": -7.287713050842285, "global_step": 24951, "epoch": 148} {"train_loss": -7.079893112182617, "global_step": 24952, "epoch": 148} {"train_loss": -7.3658223152160645, "global_step": 24953, "epoch": 148} {"train_loss": -6.882222652435303, "global_step": 24954, "epoch": 148} {"train_loss": -7.148680210113525, "global_step": 24955, "epoch": 148} {"train_loss": -7.242652416229248, "global_step": 24956, "epoch": 148} {"train_loss": -7.2302656173706055, "global_step": 24957, "epoch": 148} {"train_loss": -7.087590217590332, "global_step": 24958, "epoch": 148} {"train_loss": -7.414973735809326, "global_step": 24959, "epoch": 148} {"train_loss": -6.83921480178833, "global_step": 24960, "epoch": 148} {"train_loss": -7.209104061126709, "global_step": 24961, "epoch": 148} {"train_loss": -7.137529373168945, "global_step": 24962, "epoch": 148} {"train_loss": -7.030508518218994, "global_step": 24963, "epoch": 148} {"train_loss": -7.0985307693481445, "global_step": 24964, "epoch": 148} {"train_loss": -7.243687629699707, "global_step": 24965, "epoch": 148} {"train_loss": -7.129039764404297, "global_step": 24966, "epoch": 148} {"train_loss": -6.991578102111816, "global_step": 24967, "epoch": 148} {"train_loss": -7.308743476867676, "global_step": 24968, "epoch": 148} {"train_loss": -7.014463424682617, "global_step": 24969, "epoch": 148} {"train_loss": -7.422136306762695, "global_step": 24970, "epoch": 148} {"train_loss": -7.062067031860352, "global_step": 24971, "epoch": 148} {"train_loss": -7.011345386505127, "global_step": 24972, "epoch": 148} {"train_loss": -7.252313613891602, "global_step": 24973, "epoch": 148} {"train_loss": -7.1459245681762695, "global_step": 24974, "epoch": 148} {"train_loss": -7.282338619232178, "global_step": 24975, "epoch": 148} {"train_loss": -7.237942695617676, "global_step": 24976, "epoch": 148} {"train_loss": -7.201905250549316, "global_step": 24977, "epoch": 148} {"train_loss": -6.9836955070495605, "global_step": 24978, "epoch": 148} {"train_loss": -7.064465522766113, "global_step": 24979, "epoch": 148} {"train_loss": -6.888045310974121, "global_step": 24980, "epoch": 148} {"train_loss": -7.353147029876709, "global_step": 24981, "epoch": 148} {"train_loss": -6.987506866455078, "global_step": 24982, "epoch": 148} {"train_loss": -7.250655174255371, "global_step": 24983, "epoch": 148} {"train_loss": -7.009496688842773, "global_step": 24984, "epoch": 148} {"train_loss": -7.118922710418701, "global_step": 24985, "epoch": 148} {"train_loss": -7.427376747131348, "global_step": 24986, "epoch": 148} {"train_loss": -6.932648658752441, "global_step": 24987, "epoch": 148} {"train_loss": -7.212189674377441, "global_step": 24988, "epoch": 148} {"train_loss": -7.239129066467285, "global_step": 24989, "epoch": 148} {"train_loss": -7.254206657409668, "global_step": 24990, "epoch": 148} {"train_loss": -7.256594181060791, "global_step": 24991, "epoch": 148} {"train_loss": -7.163405418395996, "global_step": 24992, "epoch": 148} {"train_loss": -7.290961265563965, "global_step": 24993, "epoch": 148} {"train_loss": -7.23370361328125, "global_step": 24994, "epoch": 148} {"train_loss": -7.360435485839844, "global_step": 24995, "epoch": 148} {"train_loss": -6.952341556549072, "global_step": 24996, "epoch": 148} {"train_loss": -7.321077346801758, "global_step": 24997, "epoch": 148} {"train_loss": -7.205615043640137, "global_step": 24998, "epoch": 148} {"train_loss": -7.192106246948242, "global_step": 24999, "epoch": 148} {"train_loss": -6.949863433837891, "global_step": 25000, "epoch": 148} {"train_loss": -7.3046088218688965, "global_step": 25001, "epoch": 148} {"train_loss": -6.784046649932861, "global_step": 25002, "epoch": 148} {"train_loss": -7.309009552001953, "global_step": 25003, "epoch": 148} {"train_loss": -7.070898056030273, "global_step": 25004, "epoch": 148} {"train_loss": -6.901702880859375, "global_step": 25005, "epoch": 148} {"train_loss": -7.324535846710205, "global_step": 25006, "epoch": 148} {"train_loss": -6.841213703155518, "global_step": 25007, "epoch": 148} {"train_loss": -7.1988525390625, "global_step": 25008, "epoch": 148} {"train_loss": -7.00621223449707, "global_step": 25009, "epoch": 148} {"train_loss": -7.134097576141357, "global_step": 25010, "epoch": 148} {"train_loss": -7.001408576965332, "global_step": 25011, "epoch": 148} {"train_loss": -7.0032501220703125, "global_step": 25012, "epoch": 148} {"train_loss": -7.056103706359863, "global_step": 25013, "epoch": 148} {"train_loss": -7.111546516418457, "global_step": 25014, "epoch": 148} {"train_loss": -7.080009460449219, "global_step": 25015, "epoch": 148} {"train_loss": -7.3113813400268555, "global_step": 25016, "epoch": 148} {"train_loss": -6.98674201965332, "global_step": 25017, "epoch": 148} {"train_loss": -7.203056335449219, "global_step": 25018, "epoch": 148} {"train_loss": -7.030373573303223, "global_step": 25019, "epoch": 148} {"train_loss": -7.288351058959961, "global_step": 25020, "epoch": 148} {"train_loss": -6.837791442871094, "global_step": 25021, "epoch": 148} {"train_loss": -7.298072814941406, "global_step": 25022, "epoch": 148} {"train_loss": -7.094320297241211, "global_step": 25023, "epoch": 148} {"train_loss": -7.297322750091553, "global_step": 25024, "epoch": 148} {"train_loss": -7.15198278427124, "global_step": 25025, "epoch": 148} {"train_loss": -7.3154473304748535, "global_step": 25026, "epoch": 148} {"train_loss": -7.240026950836182, "global_step": 25027, "epoch": 148} {"train_loss": -7.323667526245117, "global_step": 25028, "epoch": 148} {"train_loss": -7.333984375, "global_step": 25029, "epoch": 148} {"train_loss": -7.308809280395508, "global_step": 25030, "epoch": 148} {"train_loss": -7.10927383956455, "global_step": 25031, "epoch": 148, "val_loss": 199632.421875} {"train_loss": -7.151378631591797, "global_step": 25032, "epoch": 149} {"train_loss": -6.788734436035156, "global_step": 25033, "epoch": 149} {"train_loss": -7.022830009460449, "global_step": 25034, "epoch": 149} {"train_loss": -7.031254768371582, "global_step": 25035, "epoch": 149} {"train_loss": -7.008003234863281, "global_step": 25036, "epoch": 149} {"train_loss": -7.3109211921691895, "global_step": 25037, "epoch": 149} {"train_loss": -7.121199131011963, "global_step": 25038, "epoch": 149} {"train_loss": -7.061502933502197, "global_step": 25039, "epoch": 149} {"train_loss": -7.155233383178711, "global_step": 25040, "epoch": 149} {"train_loss": -7.022250175476074, "global_step": 25041, "epoch": 149} {"train_loss": -7.211570739746094, "global_step": 25042, "epoch": 149} {"train_loss": -7.223772048950195, "global_step": 25043, "epoch": 149} {"train_loss": -7.209449291229248, "global_step": 25044, "epoch": 149} {"train_loss": -7.392675399780273, "global_step": 25045, "epoch": 149} {"train_loss": -7.140827178955078, "global_step": 25046, "epoch": 149} {"train_loss": -7.319048881530762, "global_step": 25047, "epoch": 149} {"train_loss": -7.321774005889893, "global_step": 25048, "epoch": 149} {"train_loss": -7.3256683349609375, "global_step": 25049, "epoch": 149} {"train_loss": -7.186596393585205, "global_step": 25050, "epoch": 149} {"train_loss": -7.223502159118652, "global_step": 25051, "epoch": 149} {"train_loss": -7.084498882293701, "global_step": 25052, "epoch": 149} {"train_loss": -7.05381965637207, "global_step": 25053, "epoch": 149} {"train_loss": -7.454022407531738, "global_step": 25054, "epoch": 149} {"train_loss": -7.302141189575195, "global_step": 25055, "epoch": 149} {"train_loss": -7.017838478088379, "global_step": 25056, "epoch": 149} {"train_loss": -7.221257209777832, "global_step": 25057, "epoch": 149} {"train_loss": -7.103928565979004, "global_step": 25058, "epoch": 149} {"train_loss": -7.123266220092773, "global_step": 25059, "epoch": 149} {"train_loss": -7.141188621520996, "global_step": 25060, "epoch": 149} {"train_loss": -7.188192844390869, "global_step": 25061, "epoch": 149} {"train_loss": -7.297632217407227, "global_step": 25062, "epoch": 149} {"train_loss": -7.060756206512451, "global_step": 25063, "epoch": 149} {"train_loss": -7.018294334411621, "global_step": 25064, "epoch": 149} {"train_loss": -7.163226127624512, "global_step": 25065, "epoch": 149} {"train_loss": -7.107097148895264, "global_step": 25066, "epoch": 149} {"train_loss": -7.071948051452637, "global_step": 25067, "epoch": 149} {"train_loss": -7.394536018371582, "global_step": 25068, "epoch": 149} {"train_loss": -6.904191970825195, "global_step": 25069, "epoch": 149} {"train_loss": -7.378841400146484, "global_step": 25070, "epoch": 149} {"train_loss": -6.932071685791016, "global_step": 25071, "epoch": 149} {"train_loss": -7.255184173583984, "global_step": 25072, "epoch": 149} {"train_loss": -7.156350135803223, "global_step": 25073, "epoch": 149} {"train_loss": -7.284246444702148, "global_step": 25074, "epoch": 149} {"train_loss": -7.3953166007995605, "global_step": 25075, "epoch": 149} {"train_loss": -7.383664131164551, "global_step": 25076, "epoch": 149} {"train_loss": -7.346692085266113, "global_step": 25077, "epoch": 149} {"train_loss": -7.199867248535156, "global_step": 25078, "epoch": 149} {"train_loss": -7.274615287780762, "global_step": 25079, "epoch": 149} {"train_loss": -7.249467849731445, "global_step": 25080, "epoch": 149} {"train_loss": -7.4150896072387695, "global_step": 25081, "epoch": 149} {"train_loss": -6.957395553588867, "global_step": 25082, "epoch": 149} {"train_loss": -7.314723491668701, "global_step": 25083, "epoch": 149} {"train_loss": -7.190672874450684, "global_step": 25084, "epoch": 149} {"train_loss": -7.237732887268066, "global_step": 25085, "epoch": 149} {"train_loss": -7.254508972167969, "global_step": 25086, "epoch": 149} {"train_loss": -7.094130039215088, "global_step": 25087, "epoch": 149} {"train_loss": -6.799498558044434, "global_step": 25088, "epoch": 149} {"train_loss": -7.091474533081055, "global_step": 25089, "epoch": 149} {"train_loss": -7.0561981201171875, "global_step": 25090, "epoch": 149} {"train_loss": -7.282891750335693, "global_step": 25091, "epoch": 149} {"train_loss": -6.978160858154297, "global_step": 25092, "epoch": 149} {"train_loss": -7.14257287979126, "global_step": 25093, "epoch": 149} {"train_loss": -6.984783172607422, "global_step": 25094, "epoch": 149} {"train_loss": -7.289938926696777, "global_step": 25095, "epoch": 149} {"train_loss": -7.236713409423828, "global_step": 25096, "epoch": 149} {"train_loss": -7.137584686279297, "global_step": 25097, "epoch": 149} {"train_loss": -7.180940628051758, "global_step": 25098, "epoch": 149} {"train_loss": -6.945730686187744, "global_step": 25099, "epoch": 149} {"train_loss": -7.5224480628967285, "global_step": 25100, "epoch": 149} {"train_loss": -7.157135009765625, "global_step": 25101, "epoch": 149} {"train_loss": -6.914878845214844, "global_step": 25102, "epoch": 149} {"train_loss": -7.071816921234131, "global_step": 25103, "epoch": 149} {"train_loss": -7.350381851196289, "global_step": 25104, "epoch": 149} {"train_loss": -7.266976833343506, "global_step": 25105, "epoch": 149} {"train_loss": -7.395382881164551, "global_step": 25106, "epoch": 149} {"train_loss": -7.346591949462891, "global_step": 25107, "epoch": 149} {"train_loss": -7.174081802368164, "global_step": 25108, "epoch": 149} {"train_loss": -7.063282489776611, "global_step": 25109, "epoch": 149} {"train_loss": -7.138942718505859, "global_step": 25110, "epoch": 149} {"train_loss": -7.10280179977417, "global_step": 25111, "epoch": 149} {"train_loss": -7.353575229644775, "global_step": 25112, "epoch": 149} {"train_loss": -7.253323554992676, "global_step": 25113, "epoch": 149} {"train_loss": -7.157682418823242, "global_step": 25114, "epoch": 149} {"train_loss": -7.3252458572387695, "global_step": 25115, "epoch": 149} {"train_loss": -7.3070831298828125, "global_step": 25116, "epoch": 149} {"train_loss": -7.1744184494018555, "global_step": 25117, "epoch": 149} {"train_loss": -7.129213333129883, "global_step": 25118, "epoch": 149} {"train_loss": -7.393284797668457, "global_step": 25119, "epoch": 149} {"train_loss": -7.270072937011719, "global_step": 25120, "epoch": 149} {"train_loss": -7.269740104675293, "global_step": 25121, "epoch": 149} {"train_loss": -6.934451103210449, "global_step": 25122, "epoch": 149} {"train_loss": -7.043842315673828, "global_step": 25123, "epoch": 149} {"train_loss": -7.021623611450195, "global_step": 25124, "epoch": 149} {"train_loss": -6.93936824798584, "global_step": 25125, "epoch": 149} {"train_loss": -7.103665828704834, "global_step": 25126, "epoch": 149} {"train_loss": -7.001076698303223, "global_step": 25127, "epoch": 149} {"train_loss": -7.263771057128906, "global_step": 25128, "epoch": 149} {"train_loss": -7.3008575439453125, "global_step": 25129, "epoch": 149} {"train_loss": -7.220235347747803, "global_step": 25130, "epoch": 149} {"train_loss": -7.3379645347595215, "global_step": 25131, "epoch": 149} {"train_loss": -7.1361799240112305, "global_step": 25132, "epoch": 149} {"train_loss": -7.174726486206055, "global_step": 25133, "epoch": 149} {"train_loss": -7.2545928955078125, "global_step": 25134, "epoch": 149} {"train_loss": -7.325891494750977, "global_step": 25135, "epoch": 149} {"train_loss": -7.343804359436035, "global_step": 25136, "epoch": 149} {"train_loss": -7.392681121826172, "global_step": 25137, "epoch": 149} {"train_loss": -7.393498420715332, "global_step": 25138, "epoch": 149} {"train_loss": -7.190534591674805, "global_step": 25139, "epoch": 149} {"train_loss": -7.20240592956543, "global_step": 25140, "epoch": 149} {"train_loss": -7.151541709899902, "global_step": 25141, "epoch": 149} {"train_loss": -7.37330436706543, "global_step": 25142, "epoch": 149} {"train_loss": -7.407015323638916, "global_step": 25143, "epoch": 149} {"train_loss": -7.1841583251953125, "global_step": 25144, "epoch": 149} {"train_loss": -7.297984600067139, "global_step": 25145, "epoch": 149} {"train_loss": -6.915747165679932, "global_step": 25146, "epoch": 149} {"train_loss": -7.114971160888672, "global_step": 25147, "epoch": 149} {"train_loss": -6.8230085372924805, "global_step": 25148, "epoch": 149} {"train_loss": -7.188104629516602, "global_step": 25149, "epoch": 149} {"train_loss": -6.871989727020264, "global_step": 25150, "epoch": 149} {"train_loss": -7.239912986755371, "global_step": 25151, "epoch": 149} {"train_loss": -7.0878448486328125, "global_step": 25152, "epoch": 149} {"train_loss": -7.048283100128174, "global_step": 25153, "epoch": 149} {"train_loss": -7.105769157409668, "global_step": 25154, "epoch": 149} {"train_loss": -7.057133674621582, "global_step": 25155, "epoch": 149} {"train_loss": -7.274233341217041, "global_step": 25156, "epoch": 149} {"train_loss": -6.873226165771484, "global_step": 25157, "epoch": 149} {"train_loss": -7.143789291381836, "global_step": 25158, "epoch": 149} {"train_loss": -7.206168174743652, "global_step": 25159, "epoch": 149} {"train_loss": -7.2167816162109375, "global_step": 25160, "epoch": 149} {"train_loss": -7.083887100219727, "global_step": 25161, "epoch": 149} {"train_loss": -7.153800964355469, "global_step": 25162, "epoch": 149} {"train_loss": -7.27801513671875, "global_step": 25163, "epoch": 149} {"train_loss": -7.223169326782227, "global_step": 25164, "epoch": 149} {"train_loss": -7.228521347045898, "global_step": 25165, "epoch": 149} {"train_loss": -7.360965728759766, "global_step": 25166, "epoch": 149} {"train_loss": -7.369840621948242, "global_step": 25167, "epoch": 149} {"train_loss": -7.067012786865234, "global_step": 25168, "epoch": 149} {"train_loss": -7.16756534576416, "global_step": 25169, "epoch": 149} {"train_loss": -6.896203994750977, "global_step": 25170, "epoch": 149} {"train_loss": -7.32118558883667, "global_step": 25171, "epoch": 149} {"train_loss": -7.27274227142334, "global_step": 25172, "epoch": 149} {"train_loss": -7.194718360900879, "global_step": 25173, "epoch": 149} {"train_loss": -7.173845291137695, "global_step": 25174, "epoch": 149} {"train_loss": -7.125282287597656, "global_step": 25175, "epoch": 149} {"train_loss": -6.984529972076416, "global_step": 25176, "epoch": 149} {"train_loss": -7.150134086608887, "global_step": 25177, "epoch": 149} {"train_loss": -7.165595531463623, "global_step": 25178, "epoch": 149} {"train_loss": -7.009071350097656, "global_step": 25179, "epoch": 149} {"train_loss": -7.446026802062988, "global_step": 25180, "epoch": 149} {"train_loss": -7.127897262573242, "global_step": 25181, "epoch": 149} {"train_loss": -7.17777681350708, "global_step": 25182, "epoch": 149} {"train_loss": -7.038106918334961, "global_step": 25183, "epoch": 149} {"train_loss": -7.367370128631592, "global_step": 25184, "epoch": 149} {"train_loss": -7.326706886291504, "global_step": 25185, "epoch": 149} {"train_loss": -7.296874523162842, "global_step": 25186, "epoch": 149} {"train_loss": -7.252552032470703, "global_step": 25187, "epoch": 149} {"train_loss": -7.07961368560791, "global_step": 25188, "epoch": 149} {"train_loss": -7.132626533508301, "global_step": 25189, "epoch": 149} {"train_loss": -7.16817045211792, "global_step": 25190, "epoch": 149} {"train_loss": -7.154144287109375, "global_step": 25191, "epoch": 149} {"train_loss": -7.3061676025390625, "global_step": 25192, "epoch": 149} {"train_loss": -6.9995574951171875, "global_step": 25193, "epoch": 149} {"train_loss": -7.258729934692383, "global_step": 25194, "epoch": 149} {"train_loss": -7.239594459533691, "global_step": 25195, "epoch": 149} {"train_loss": -7.178037166595459, "global_step": 25196, "epoch": 149} {"train_loss": -7.391583442687988, "global_step": 25197, "epoch": 149} {"train_loss": -7.295018196105957, "global_step": 25198, "epoch": 149} {"train_loss": -7.179603735605876, "global_step": 25199, "epoch": 149, "val_loss": 202674.046875} {"train_loss": -7.169445991516113, "global_step": 25200, "epoch": 150} {"train_loss": -7.267484664916992, "global_step": 25201, "epoch": 150} {"train_loss": -7.307092666625977, "global_step": 25202, "epoch": 150} {"train_loss": -7.3247528076171875, "global_step": 25203, "epoch": 150} {"train_loss": -7.1558685302734375, "global_step": 25204, "epoch": 150} {"train_loss": -7.161741256713867, "global_step": 25205, "epoch": 150} {"train_loss": -6.999528408050537, "global_step": 25206, "epoch": 150} {"train_loss": -6.8572187423706055, "global_step": 25207, "epoch": 150} {"train_loss": -7.05705451965332, "global_step": 25208, "epoch": 150} {"train_loss": -6.901609420776367, "global_step": 25209, "epoch": 150} {"train_loss": -7.106525421142578, "global_step": 25210, "epoch": 150} {"train_loss": -6.965973377227783, "global_step": 25211, "epoch": 150} {"train_loss": -7.00547456741333, "global_step": 25212, "epoch": 150} {"train_loss": -7.1726789474487305, "global_step": 25213, "epoch": 150} {"train_loss": -7.041570663452148, "global_step": 25214, "epoch": 150} {"train_loss": -7.097214221954346, "global_step": 25215, "epoch": 150} {"train_loss": -7.253265380859375, "global_step": 25216, "epoch": 150} {"train_loss": -6.620359420776367, "global_step": 25217, "epoch": 150} {"train_loss": -7.004756450653076, "global_step": 25218, "epoch": 150} {"train_loss": -7.093055725097656, "global_step": 25219, "epoch": 150} {"train_loss": -7.127740859985352, "global_step": 25220, "epoch": 150} {"train_loss": -6.960316181182861, "global_step": 25221, "epoch": 150} {"train_loss": -7.018950939178467, "global_step": 25222, "epoch": 150} {"train_loss": -7.234239101409912, "global_step": 25223, "epoch": 150} {"train_loss": -7.281253814697266, "global_step": 25224, "epoch": 150} {"train_loss": -7.122997283935547, "global_step": 25225, "epoch": 150} {"train_loss": -7.155394077301025, "global_step": 25226, "epoch": 150} {"train_loss": -7.048345565795898, "global_step": 25227, "epoch": 150} {"train_loss": -7.395349502563477, "global_step": 25228, "epoch": 150} {"train_loss": -7.008570671081543, "global_step": 25229, "epoch": 150} {"train_loss": -7.292060852050781, "global_step": 25230, "epoch": 150} {"train_loss": -6.927854537963867, "global_step": 25231, "epoch": 150} {"train_loss": -7.310833930969238, "global_step": 25232, "epoch": 150} {"train_loss": -7.076998710632324, "global_step": 25233, "epoch": 150} {"train_loss": -7.193977355957031, "global_step": 25234, "epoch": 150} {"train_loss": -7.085251808166504, "global_step": 25235, "epoch": 150} {"train_loss": -7.277626037597656, "global_step": 25236, "epoch": 150} {"train_loss": -7.029928207397461, "global_step": 25237, "epoch": 150} {"train_loss": -7.449462890625, "global_step": 25238, "epoch": 150} {"train_loss": -7.357928276062012, "global_step": 25239, "epoch": 150} {"train_loss": -7.258374214172363, "global_step": 25240, "epoch": 150} {"train_loss": -7.3251953125, "global_step": 25241, "epoch": 150} {"train_loss": -7.309330463409424, "global_step": 25242, "epoch": 150} {"train_loss": -7.345690727233887, "global_step": 25243, "epoch": 150} {"train_loss": -7.199944496154785, "global_step": 25244, "epoch": 150} {"train_loss": -7.520685195922852, "global_step": 25245, "epoch": 150} {"train_loss": -7.316812515258789, "global_step": 25246, "epoch": 150} {"train_loss": -7.244635581970215, "global_step": 25247, "epoch": 150} {"train_loss": -7.012538909912109, "global_step": 25248, "epoch": 150} {"train_loss": -7.049713611602783, "global_step": 25249, "epoch": 150} {"train_loss": -7.121476173400879, "global_step": 25250, "epoch": 150} {"train_loss": -7.303452491760254, "global_step": 25251, "epoch": 150} {"train_loss": -7.317452430725098, "global_step": 25252, "epoch": 150} {"train_loss": -7.163620948791504, "global_step": 25253, "epoch": 150} {"train_loss": -7.091088771820068, "global_step": 25254, "epoch": 150} {"train_loss": -7.099820137023926, "global_step": 25255, "epoch": 150} {"train_loss": -7.2056427001953125, "global_step": 25256, "epoch": 150} {"train_loss": -7.2472028732299805, "global_step": 25257, "epoch": 150} {"train_loss": -7.129494667053223, "global_step": 25258, "epoch": 150} {"train_loss": -6.901437759399414, "global_step": 25259, "epoch": 150} {"train_loss": -7.218501091003418, "global_step": 25260, "epoch": 150} {"train_loss": -6.993024826049805, "global_step": 25261, "epoch": 150} {"train_loss": -6.938419342041016, "global_step": 25262, "epoch": 150} {"train_loss": -7.151126861572266, "global_step": 25263, "epoch": 150} {"train_loss": -7.008686065673828, "global_step": 25264, "epoch": 150} {"train_loss": -7.218799591064453, "global_step": 25265, "epoch": 150} {"train_loss": -7.288025856018066, "global_step": 25266, "epoch": 150} {"train_loss": -7.096471786499023, "global_step": 25267, "epoch": 150} {"train_loss": -7.173158645629883, "global_step": 25268, "epoch": 150} {"train_loss": -7.21652364730835, "global_step": 25269, "epoch": 150} {"train_loss": -7.252270698547363, "global_step": 25270, "epoch": 150} {"train_loss": -7.238813400268555, "global_step": 25271, "epoch": 150} {"train_loss": -6.9687933921813965, "global_step": 25272, "epoch": 150} {"train_loss": -7.5051350593566895, "global_step": 25273, "epoch": 150} {"train_loss": -7.25449800491333, "global_step": 25274, "epoch": 150} {"train_loss": -7.30217170715332, "global_step": 25275, "epoch": 150} {"train_loss": -7.354567050933838, "global_step": 25276, "epoch": 150} {"train_loss": -7.154932022094727, "global_step": 25277, "epoch": 150} {"train_loss": -7.226839542388916, "global_step": 25278, "epoch": 150} {"train_loss": -7.339047431945801, "global_step": 25279, "epoch": 150} {"train_loss": -7.3825507164001465, "global_step": 25280, "epoch": 150} {"train_loss": -7.268994331359863, "global_step": 25281, "epoch": 150} {"train_loss": -6.9841108322143555, "global_step": 25282, "epoch": 150} {"train_loss": -7.282044410705566, "global_step": 25283, "epoch": 150} {"train_loss": -7.030816078186035, "global_step": 25284, "epoch": 150} {"train_loss": -7.061882972717285, "global_step": 25285, "epoch": 150} {"train_loss": -7.308747291564941, "global_step": 25286, "epoch": 150} {"train_loss": -7.066594123840332, "global_step": 25287, "epoch": 150} {"train_loss": -7.126694202423096, "global_step": 25288, "epoch": 150} {"train_loss": -7.2413225173950195, "global_step": 25289, "epoch": 150} {"train_loss": -7.08285665512085, "global_step": 25290, "epoch": 150} {"train_loss": -7.157374382019043, "global_step": 25291, "epoch": 150} {"train_loss": -7.255502700805664, "global_step": 25292, "epoch": 150} {"train_loss": -7.304441452026367, "global_step": 25293, "epoch": 150} {"train_loss": -7.082054138183594, "global_step": 25294, "epoch": 150} {"train_loss": -7.27854061126709, "global_step": 25295, "epoch": 150} {"train_loss": -7.219410419464111, "global_step": 25296, "epoch": 150} {"train_loss": -7.241133689880371, "global_step": 25297, "epoch": 150} {"train_loss": -7.031024932861328, "global_step": 25298, "epoch": 150} {"train_loss": -7.157024383544922, "global_step": 25299, "epoch": 150} {"train_loss": -7.356633186340332, "global_step": 25300, "epoch": 150} {"train_loss": -7.162755966186523, "global_step": 25301, "epoch": 150} {"train_loss": -7.201193809509277, "global_step": 25302, "epoch": 150} {"train_loss": -7.062571048736572, "global_step": 25303, "epoch": 150} {"train_loss": -7.294424057006836, "global_step": 25304, "epoch": 150} {"train_loss": -7.383788585662842, "global_step": 25305, "epoch": 150} {"train_loss": -7.441323280334473, "global_step": 25306, "epoch": 150} {"train_loss": -7.183490753173828, "global_step": 25307, "epoch": 150} {"train_loss": -7.537664413452148, "global_step": 25308, "epoch": 150} {"train_loss": -7.177896499633789, "global_step": 25309, "epoch": 150} {"train_loss": -7.220155715942383, "global_step": 25310, "epoch": 150} {"train_loss": -7.129565238952637, "global_step": 25311, "epoch": 150} {"train_loss": -7.351872444152832, "global_step": 25312, "epoch": 150} {"train_loss": -6.968252182006836, "global_step": 25313, "epoch": 150} {"train_loss": -7.195274353027344, "global_step": 25314, "epoch": 150} {"train_loss": -7.031031131744385, "global_step": 25315, "epoch": 150} {"train_loss": -7.021960258483887, "global_step": 25316, "epoch": 150} {"train_loss": -7.115513801574707, "global_step": 25317, "epoch": 150} {"train_loss": -7.148327827453613, "global_step": 25318, "epoch": 150} {"train_loss": -6.720362663269043, "global_step": 25319, "epoch": 150} {"train_loss": -7.075085639953613, "global_step": 25320, "epoch": 150} {"train_loss": -7.200622081756592, "global_step": 25321, "epoch": 150} {"train_loss": -7.12592887878418, "global_step": 25322, "epoch": 150} {"train_loss": -7.143265247344971, "global_step": 25323, "epoch": 150} {"train_loss": -7.008587837219238, "global_step": 25324, "epoch": 150} {"train_loss": -7.069281578063965, "global_step": 25325, "epoch": 150} {"train_loss": -6.839241981506348, "global_step": 25326, "epoch": 150} {"train_loss": -7.260629177093506, "global_step": 25327, "epoch": 150} {"train_loss": -7.057428359985352, "global_step": 25328, "epoch": 150} {"train_loss": -7.121859550476074, "global_step": 25329, "epoch": 150} {"train_loss": -6.98938512802124, "global_step": 25330, "epoch": 150} {"train_loss": -6.839472770690918, "global_step": 25331, "epoch": 150} {"train_loss": -7.069094657897949, "global_step": 25332, "epoch": 150} {"train_loss": -7.076788902282715, "global_step": 25333, "epoch": 150} {"train_loss": -7.105520248413086, "global_step": 25334, "epoch": 150} {"train_loss": -7.029262065887451, "global_step": 25335, "epoch": 150} {"train_loss": -7.368768215179443, "global_step": 25336, "epoch": 150} {"train_loss": -7.161464691162109, "global_step": 25337, "epoch": 150} {"train_loss": -7.337644100189209, "global_step": 25338, "epoch": 150} {"train_loss": -7.2332634925842285, "global_step": 25339, "epoch": 150} {"train_loss": -7.207846641540527, "global_step": 25340, "epoch": 150} {"train_loss": -7.283403396606445, "global_step": 25341, "epoch": 150} {"train_loss": -7.309808731079102, "global_step": 25342, "epoch": 150} {"train_loss": -7.214444160461426, "global_step": 25343, "epoch": 150} {"train_loss": -7.162864685058594, "global_step": 25344, "epoch": 150} {"train_loss": -7.421525001525879, "global_step": 25345, "epoch": 150} {"train_loss": -7.153892517089844, "global_step": 25346, "epoch": 150} {"train_loss": -7.289690971374512, "global_step": 25347, "epoch": 150} {"train_loss": -7.329883575439453, "global_step": 25348, "epoch": 150} {"train_loss": -7.240530014038086, "global_step": 25349, "epoch": 150} {"train_loss": -7.309124946594238, "global_step": 25350, "epoch": 150} {"train_loss": -7.461191177368164, "global_step": 25351, "epoch": 150} {"train_loss": -7.345619201660156, "global_step": 25352, "epoch": 150} {"train_loss": -7.252429962158203, "global_step": 25353, "epoch": 150} {"train_loss": -7.435715675354004, "global_step": 25354, "epoch": 150} {"train_loss": -7.543355941772461, "global_step": 25355, "epoch": 150} {"train_loss": -7.320219993591309, "global_step": 25356, "epoch": 150} {"train_loss": -7.615511417388916, "global_step": 25357, "epoch": 150} {"train_loss": -7.315657615661621, "global_step": 25358, "epoch": 150} {"train_loss": -7.344978332519531, "global_step": 25359, "epoch": 150} {"train_loss": -7.278857707977295, "global_step": 25360, "epoch": 150} {"train_loss": -7.483993053436279, "global_step": 25361, "epoch": 150} {"train_loss": -7.269504547119141, "global_step": 25362, "epoch": 150} {"train_loss": -7.5208258628845215, "global_step": 25363, "epoch": 150} {"train_loss": -7.348644733428955, "global_step": 25364, "epoch": 150} {"train_loss": -7.40211296081543, "global_step": 25365, "epoch": 150} {"train_loss": -7.19803524017334, "global_step": 25366, "epoch": 150} {"train_loss": -7.188692050320761, "global_step": 25367, "epoch": 150, "train/sim_max_reward_0": 0.9736111534934153, "train/sim_max_reward_1": 0.8399936722243704, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.9520185194274823, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.945507591117466, "test/sim_max_reward_4400000": 0.23073082109120602, "test/sim_max_reward_4400001": 0.9897650532021446, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.44219582221894543, "test/sim_max_reward_4400004": 0.9833266879656793, "test/sim_max_reward_4400005": 0.9632581944627643, "test/sim_max_reward_4400006": 0.8616326144131428, "test/sim_max_reward_4400007": 0.617089040841796, "test/sim_max_reward_4400008": 0.6130920196658207, "test/sim_max_reward_4400009": 0.5086112459321617, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 0.8118339131994011, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9037260350555916, "test/sim_max_reward_4400019": 0.9979603635979074, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.6517348096447447, "test/sim_max_reward_4400022": 0.9770838574521732, "test/sim_max_reward_4400023": 0.7757262258055123, "test/sim_max_reward_4400024": 0.428831840950386, "test/sim_max_reward_4400025": 0.7043078669140835, "test/sim_max_reward_4400026": 1.0, "test/sim_max_reward_4400027": 0.4773045765487776, "test/sim_max_reward_4400028": 0.7196103653626522, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9506594265773132, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.5848325039306513, "test/sim_max_reward_4400033": 0.4506498215798975, "test/sim_max_reward_4400034": 0.959984833059059, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.8089681058703849, "test/sim_max_reward_4400037": 0.9947963403708501, "test/sim_max_reward_4400038": 0.0, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.07130473668859068, "test/sim_max_reward_4400042": 0.01279519710182538, "test/sim_max_reward_4400043": 0.9194181881533032, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.9812789449160825, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 1.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.951855156043789, "test/mean_score": 0.673540909251024, "val_loss": 199152.734375, "train_action_mse_error": 17.34143829345703} {"train_loss": -7.452920913696289, "global_step": 25368, "epoch": 151} {"train_loss": -7.316361427307129, "global_step": 25369, "epoch": 151} {"train_loss": -7.326409816741943, "global_step": 25370, "epoch": 151} {"train_loss": -7.087673187255859, "global_step": 25371, "epoch": 151} {"train_loss": -7.231081008911133, "global_step": 25372, "epoch": 151} {"train_loss": -7.2628021240234375, "global_step": 25373, "epoch": 151} {"train_loss": -7.098443984985352, "global_step": 25374, "epoch": 151} {"train_loss": -7.116293907165527, "global_step": 25375, "epoch": 151} {"train_loss": -7.250086307525635, "global_step": 25376, "epoch": 151} {"train_loss": -7.0698771476745605, "global_step": 25377, "epoch": 151} {"train_loss": -7.1985368728637695, "global_step": 25378, "epoch": 151} {"train_loss": -7.15047550201416, "global_step": 25379, "epoch": 151} {"train_loss": -6.846401214599609, "global_step": 25380, "epoch": 151} {"train_loss": -7.099181652069092, "global_step": 25381, "epoch": 151} {"train_loss": -7.07127571105957, "global_step": 25382, "epoch": 151} {"train_loss": -7.040741920471191, "global_step": 25383, "epoch": 151} {"train_loss": -6.887015342712402, "global_step": 25384, "epoch": 151} {"train_loss": -7.065802574157715, "global_step": 25385, "epoch": 151} {"train_loss": -7.191615104675293, "global_step": 25386, "epoch": 151} {"train_loss": -7.019199371337891, "global_step": 25387, "epoch": 151} {"train_loss": -7.044905662536621, "global_step": 25388, "epoch": 151} {"train_loss": -6.923453330993652, "global_step": 25389, "epoch": 151} {"train_loss": -6.8991241455078125, "global_step": 25390, "epoch": 151} {"train_loss": -6.972500801086426, "global_step": 25391, "epoch": 151} {"train_loss": -7.093255519866943, "global_step": 25392, "epoch": 151} {"train_loss": -7.0969343185424805, "global_step": 25393, "epoch": 151} {"train_loss": -7.108724594116211, "global_step": 25394, "epoch": 151} {"train_loss": -7.165700912475586, "global_step": 25395, "epoch": 151} {"train_loss": -7.101998329162598, "global_step": 25396, "epoch": 151} {"train_loss": -7.260485649108887, "global_step": 25397, "epoch": 151} {"train_loss": -7.154256820678711, "global_step": 25398, "epoch": 151} {"train_loss": -7.141393661499023, "global_step": 25399, "epoch": 151} {"train_loss": -7.272758483886719, "global_step": 25400, "epoch": 151} {"train_loss": -7.3109283447265625, "global_step": 25401, "epoch": 151} {"train_loss": -7.339442729949951, "global_step": 25402, "epoch": 151} {"train_loss": -7.1264142990112305, "global_step": 25403, "epoch": 151} {"train_loss": -7.218317031860352, "global_step": 25404, "epoch": 151} {"train_loss": -7.101840972900391, "global_step": 25405, "epoch": 151} {"train_loss": -7.1746344566345215, "global_step": 25406, "epoch": 151} {"train_loss": -7.450631141662598, "global_step": 25407, "epoch": 151} {"train_loss": -7.285168647766113, "global_step": 25408, "epoch": 151} {"train_loss": -7.2992987632751465, "global_step": 25409, "epoch": 151} {"train_loss": -7.29569149017334, "global_step": 25410, "epoch": 151} {"train_loss": -7.0693840980529785, "global_step": 25411, "epoch": 151} {"train_loss": -7.273159503936768, "global_step": 25412, "epoch": 151} {"train_loss": -7.154409408569336, "global_step": 25413, "epoch": 151} {"train_loss": -7.292843341827393, "global_step": 25414, "epoch": 151} {"train_loss": -7.122325897216797, "global_step": 25415, "epoch": 151} {"train_loss": -7.2674760818481445, "global_step": 25416, "epoch": 151} {"train_loss": -7.063850402832031, "global_step": 25417, "epoch": 151} {"train_loss": -7.229134559631348, "global_step": 25418, "epoch": 151} {"train_loss": -6.951171875, "global_step": 25419, "epoch": 151} {"train_loss": -6.749506950378418, "global_step": 25420, "epoch": 151} {"train_loss": -7.131803512573242, "global_step": 25421, "epoch": 151} {"train_loss": -6.8054890632629395, "global_step": 25422, "epoch": 151} {"train_loss": -6.851121425628662, "global_step": 25423, "epoch": 151} {"train_loss": -7.167209148406982, "global_step": 25424, "epoch": 151} {"train_loss": -7.343916893005371, "global_step": 25425, "epoch": 151} {"train_loss": -7.08129358291626, "global_step": 25426, "epoch": 151} {"train_loss": -7.029830455780029, "global_step": 25427, "epoch": 151} {"train_loss": -7.2809648513793945, "global_step": 25428, "epoch": 151} {"train_loss": -7.16414737701416, "global_step": 25429, "epoch": 151} {"train_loss": -6.966372489929199, "global_step": 25430, "epoch": 151} {"train_loss": -7.148268699645996, "global_step": 25431, "epoch": 151} {"train_loss": -7.253399848937988, "global_step": 25432, "epoch": 151} {"train_loss": -7.177556991577148, "global_step": 25433, "epoch": 151} {"train_loss": -7.084665775299072, "global_step": 25434, "epoch": 151} {"train_loss": -7.219147682189941, "global_step": 25435, "epoch": 151} {"train_loss": -6.959221839904785, "global_step": 25436, "epoch": 151} {"train_loss": -7.148431301116943, "global_step": 25437, "epoch": 151} {"train_loss": -7.157076835632324, "global_step": 25438, "epoch": 151} {"train_loss": -7.094269752502441, "global_step": 25439, "epoch": 151} {"train_loss": -6.876874923706055, "global_step": 25440, "epoch": 151} {"train_loss": -7.19541597366333, "global_step": 25441, "epoch": 151} {"train_loss": -7.200103282928467, "global_step": 25442, "epoch": 151} {"train_loss": -7.302089691162109, "global_step": 25443, "epoch": 151} {"train_loss": -7.100275039672852, "global_step": 25444, "epoch": 151} {"train_loss": -7.53176212310791, "global_step": 25445, "epoch": 151} {"train_loss": -7.314270973205566, "global_step": 25446, "epoch": 151} {"train_loss": -7.418896675109863, "global_step": 25447, "epoch": 151} {"train_loss": -7.156895637512207, "global_step": 25448, "epoch": 151} {"train_loss": -7.419642448425293, "global_step": 25449, "epoch": 151} {"train_loss": -6.971926689147949, "global_step": 25450, "epoch": 151} {"train_loss": -7.367298603057861, "global_step": 25451, "epoch": 151} {"train_loss": -7.2750654220581055, "global_step": 25452, "epoch": 151} {"train_loss": -7.207526683807373, "global_step": 25453, "epoch": 151} {"train_loss": -7.354404926300049, "global_step": 25454, "epoch": 151} {"train_loss": -7.282758712768555, "global_step": 25455, "epoch": 151} {"train_loss": -7.267075061798096, "global_step": 25456, "epoch": 151} {"train_loss": -6.970660209655762, "global_step": 25457, "epoch": 151} {"train_loss": -7.44487190246582, "global_step": 25458, "epoch": 151} {"train_loss": -7.139788627624512, "global_step": 25459, "epoch": 151} {"train_loss": -7.212553977966309, "global_step": 25460, "epoch": 151} {"train_loss": -7.069433212280273, "global_step": 25461, "epoch": 151} {"train_loss": -7.131598472595215, "global_step": 25462, "epoch": 151} {"train_loss": -7.078677177429199, "global_step": 25463, "epoch": 151} {"train_loss": -7.007111072540283, "global_step": 25464, "epoch": 151} {"train_loss": -6.910700798034668, "global_step": 25465, "epoch": 151} {"train_loss": -7.007534027099609, "global_step": 25466, "epoch": 151} {"train_loss": -6.565192222595215, "global_step": 25467, "epoch": 151} {"train_loss": -6.831068992614746, "global_step": 25468, "epoch": 151} {"train_loss": -6.955480575561523, "global_step": 25469, "epoch": 151} {"train_loss": -6.579856872558594, "global_step": 25470, "epoch": 151} {"train_loss": -6.924158096313477, "global_step": 25471, "epoch": 151} {"train_loss": -7.273860931396484, "global_step": 25472, "epoch": 151} {"train_loss": -6.741203308105469, "global_step": 25473, "epoch": 151} {"train_loss": -6.871007919311523, "global_step": 25474, "epoch": 151} {"train_loss": -6.893049716949463, "global_step": 25475, "epoch": 151} {"train_loss": -6.931279182434082, "global_step": 25476, "epoch": 151} {"train_loss": -7.049830436706543, "global_step": 25477, "epoch": 151} {"train_loss": -6.888097763061523, "global_step": 25478, "epoch": 151} {"train_loss": -7.042142868041992, "global_step": 25479, "epoch": 151} {"train_loss": -7.2838592529296875, "global_step": 25480, "epoch": 151} {"train_loss": -7.248190879821777, "global_step": 25481, "epoch": 151} {"train_loss": -7.269343376159668, "global_step": 25482, "epoch": 151} {"train_loss": -7.2333149909973145, "global_step": 25483, "epoch": 151} {"train_loss": -7.103142738342285, "global_step": 25484, "epoch": 151} {"train_loss": -7.2156500816345215, "global_step": 25485, "epoch": 151} {"train_loss": -7.115451812744141, "global_step": 25486, "epoch": 151} {"train_loss": -7.526042938232422, "global_step": 25487, "epoch": 151} {"train_loss": -7.285489082336426, "global_step": 25488, "epoch": 151} {"train_loss": -7.257037162780762, "global_step": 25489, "epoch": 151} {"train_loss": -7.052372932434082, "global_step": 25490, "epoch": 151} {"train_loss": -7.119168281555176, "global_step": 25491, "epoch": 151} {"train_loss": -7.244420528411865, "global_step": 25492, "epoch": 151} {"train_loss": -7.261868476867676, "global_step": 25493, "epoch": 151} {"train_loss": -7.341451644897461, "global_step": 25494, "epoch": 151} {"train_loss": -7.291602611541748, "global_step": 25495, "epoch": 151} {"train_loss": -7.329831123352051, "global_step": 25496, "epoch": 151} {"train_loss": -7.605327606201172, "global_step": 25497, "epoch": 151} {"train_loss": -7.241363525390625, "global_step": 25498, "epoch": 151} {"train_loss": -7.300707817077637, "global_step": 25499, "epoch": 151} {"train_loss": -7.133173942565918, "global_step": 25500, "epoch": 151} {"train_loss": -7.06387996673584, "global_step": 25501, "epoch": 151} {"train_loss": -7.604256629943848, "global_step": 25502, "epoch": 151} {"train_loss": -7.326706409454346, "global_step": 25503, "epoch": 151} {"train_loss": -7.1620564460754395, "global_step": 25504, "epoch": 151} {"train_loss": -7.263465881347656, "global_step": 25505, "epoch": 151} {"train_loss": -6.954283237457275, "global_step": 25506, "epoch": 151} {"train_loss": -6.838709354400635, "global_step": 25507, "epoch": 151} {"train_loss": -7.170792579650879, "global_step": 25508, "epoch": 151} {"train_loss": -7.135857582092285, "global_step": 25509, "epoch": 151} {"train_loss": -6.911358833312988, "global_step": 25510, "epoch": 151} {"train_loss": -7.145379543304443, "global_step": 25511, "epoch": 151} {"train_loss": -6.829945087432861, "global_step": 25512, "epoch": 151} {"train_loss": -7.116662502288818, "global_step": 25513, "epoch": 151} {"train_loss": -7.033806800842285, "global_step": 25514, "epoch": 151} {"train_loss": -7.208036422729492, "global_step": 25515, "epoch": 151} {"train_loss": -7.275821685791016, "global_step": 25516, "epoch": 151} {"train_loss": -7.07484245300293, "global_step": 25517, "epoch": 151} {"train_loss": -7.167868614196777, "global_step": 25518, "epoch": 151} {"train_loss": -7.255983829498291, "global_step": 25519, "epoch": 151} {"train_loss": -7.345510482788086, "global_step": 25520, "epoch": 151} {"train_loss": -7.055584907531738, "global_step": 25521, "epoch": 151} {"train_loss": -7.151554107666016, "global_step": 25522, "epoch": 151} {"train_loss": -7.274443626403809, "global_step": 25523, "epoch": 151} {"train_loss": -7.2561140060424805, "global_step": 25524, "epoch": 151} {"train_loss": -7.362934112548828, "global_step": 25525, "epoch": 151} {"train_loss": -7.238064289093018, "global_step": 25526, "epoch": 151} {"train_loss": -6.938917636871338, "global_step": 25527, "epoch": 151} {"train_loss": -7.101997375488281, "global_step": 25528, "epoch": 151} {"train_loss": -7.106035232543945, "global_step": 25529, "epoch": 151} {"train_loss": -7.283685207366943, "global_step": 25530, "epoch": 151} {"train_loss": -6.934706687927246, "global_step": 25531, "epoch": 151} {"train_loss": -7.072000503540039, "global_step": 25532, "epoch": 151} {"train_loss": -7.387193202972412, "global_step": 25533, "epoch": 151} {"train_loss": -7.101970195770264, "global_step": 25534, "epoch": 151} {"train_loss": -7.1456654497555325, "global_step": 25535, "epoch": 151, "val_loss": 200572.734375} {"train_loss": -7.232532978057861, "global_step": 25536, "epoch": 152} {"train_loss": -6.892032146453857, "global_step": 25537, "epoch": 152} {"train_loss": -7.265575408935547, "global_step": 25538, "epoch": 152} {"train_loss": -7.19545841217041, "global_step": 25539, "epoch": 152} {"train_loss": -7.164093971252441, "global_step": 25540, "epoch": 152} {"train_loss": -7.04929256439209, "global_step": 25541, "epoch": 152} {"train_loss": -7.14615535736084, "global_step": 25542, "epoch": 152} {"train_loss": -7.139382362365723, "global_step": 25543, "epoch": 152} {"train_loss": -6.9593610763549805, "global_step": 25544, "epoch": 152} {"train_loss": -7.057918548583984, "global_step": 25545, "epoch": 152} {"train_loss": -7.2113542556762695, "global_step": 25546, "epoch": 152} {"train_loss": -6.978662014007568, "global_step": 25547, "epoch": 152} {"train_loss": -7.159576416015625, "global_step": 25548, "epoch": 152} {"train_loss": -7.011482238769531, "global_step": 25549, "epoch": 152} {"train_loss": -7.07294225692749, "global_step": 25550, "epoch": 152} {"train_loss": -7.244131565093994, "global_step": 25551, "epoch": 152} {"train_loss": -6.939743995666504, "global_step": 25552, "epoch": 152} {"train_loss": -7.0112080574035645, "global_step": 25553, "epoch": 152} {"train_loss": -7.163281440734863, "global_step": 25554, "epoch": 152} {"train_loss": -7.1390275955200195, "global_step": 25555, "epoch": 152} {"train_loss": -7.077703475952148, "global_step": 25556, "epoch": 152} {"train_loss": -7.001875877380371, "global_step": 25557, "epoch": 152} {"train_loss": -7.106050968170166, "global_step": 25558, "epoch": 152} {"train_loss": -7.284060955047607, "global_step": 25559, "epoch": 152} {"train_loss": -7.313088417053223, "global_step": 25560, "epoch": 152} {"train_loss": -7.2055559158325195, "global_step": 25561, "epoch": 152} {"train_loss": -6.910610198974609, "global_step": 25562, "epoch": 152} {"train_loss": -7.101655006408691, "global_step": 25563, "epoch": 152} {"train_loss": -7.008349895477295, "global_step": 25564, "epoch": 152} {"train_loss": -6.905352592468262, "global_step": 25565, "epoch": 152} {"train_loss": -7.320300102233887, "global_step": 25566, "epoch": 152} {"train_loss": -7.026203632354736, "global_step": 25567, "epoch": 152} {"train_loss": -7.29086971282959, "global_step": 25568, "epoch": 152} {"train_loss": -7.2549052238464355, "global_step": 25569, "epoch": 152} {"train_loss": -7.24220085144043, "global_step": 25570, "epoch": 152} {"train_loss": -7.131106853485107, "global_step": 25571, "epoch": 152} {"train_loss": -7.394491195678711, "global_step": 25572, "epoch": 152} {"train_loss": -7.348941326141357, "global_step": 25573, "epoch": 152} {"train_loss": -7.143512725830078, "global_step": 25574, "epoch": 152} {"train_loss": -7.397568225860596, "global_step": 25575, "epoch": 152} {"train_loss": -7.081239700317383, "global_step": 25576, "epoch": 152} {"train_loss": -7.1848554611206055, "global_step": 25577, "epoch": 152} {"train_loss": -7.2054243087768555, "global_step": 25578, "epoch": 152} {"train_loss": -7.288944244384766, "global_step": 25579, "epoch": 152} {"train_loss": -7.046028137207031, "global_step": 25580, "epoch": 152} {"train_loss": -7.23583984375, "global_step": 25581, "epoch": 152} {"train_loss": -6.922390937805176, "global_step": 25582, "epoch": 152} {"train_loss": -7.3727827072143555, "global_step": 25583, "epoch": 152} {"train_loss": -7.015736103057861, "global_step": 25584, "epoch": 152} {"train_loss": -7.240260601043701, "global_step": 25585, "epoch": 152} {"train_loss": -7.173299312591553, "global_step": 25586, "epoch": 152} {"train_loss": -7.044633865356445, "global_step": 25587, "epoch": 152} {"train_loss": -7.194550514221191, "global_step": 25588, "epoch": 152} {"train_loss": -7.003120422363281, "global_step": 25589, "epoch": 152} {"train_loss": -7.138772487640381, "global_step": 25590, "epoch": 152} {"train_loss": -7.2438225746154785, "global_step": 25591, "epoch": 152} {"train_loss": -7.074737548828125, "global_step": 25592, "epoch": 152} {"train_loss": -7.050532341003418, "global_step": 25593, "epoch": 152} {"train_loss": -7.187525749206543, "global_step": 25594, "epoch": 152} {"train_loss": -6.92421817779541, "global_step": 25595, "epoch": 152} {"train_loss": -7.198584079742432, "global_step": 25596, "epoch": 152} {"train_loss": -7.140202522277832, "global_step": 25597, "epoch": 152} {"train_loss": -7.223789215087891, "global_step": 25598, "epoch": 152} {"train_loss": -7.144443988800049, "global_step": 25599, "epoch": 152} {"train_loss": -6.907862186431885, "global_step": 25600, "epoch": 152} {"train_loss": -7.1117401123046875, "global_step": 25601, "epoch": 152} {"train_loss": -7.221804618835449, "global_step": 25602, "epoch": 152} {"train_loss": -7.057059288024902, "global_step": 25603, "epoch": 152} {"train_loss": -7.20521879196167, "global_step": 25604, "epoch": 152} {"train_loss": -7.162022590637207, "global_step": 25605, "epoch": 152} {"train_loss": -7.254693031311035, "global_step": 25606, "epoch": 152} {"train_loss": -7.323459148406982, "global_step": 25607, "epoch": 152} {"train_loss": -6.939031600952148, "global_step": 25608, "epoch": 152} {"train_loss": -7.025842189788818, "global_step": 25609, "epoch": 152} {"train_loss": -7.1889238357543945, "global_step": 25610, "epoch": 152} {"train_loss": -7.4741387367248535, "global_step": 25611, "epoch": 152} {"train_loss": -7.15760612487793, "global_step": 25612, "epoch": 152} {"train_loss": -7.177751541137695, "global_step": 25613, "epoch": 152} {"train_loss": -7.326475143432617, "global_step": 25614, "epoch": 152} {"train_loss": -7.266772747039795, "global_step": 25615, "epoch": 152} {"train_loss": -7.204633712768555, "global_step": 25616, "epoch": 152} {"train_loss": -7.184098243713379, "global_step": 25617, "epoch": 152} {"train_loss": -7.3134307861328125, "global_step": 25618, "epoch": 152} {"train_loss": -7.373211860656738, "global_step": 25619, "epoch": 152} {"train_loss": -7.193722724914551, "global_step": 25620, "epoch": 152} {"train_loss": -7.237048625946045, "global_step": 25621, "epoch": 152} {"train_loss": -7.608064651489258, "global_step": 25622, "epoch": 152} {"train_loss": -7.314364433288574, "global_step": 25623, "epoch": 152} {"train_loss": -7.013627529144287, "global_step": 25624, "epoch": 152} {"train_loss": -7.343897819519043, "global_step": 25625, "epoch": 152} {"train_loss": -7.2928290367126465, "global_step": 25626, "epoch": 152} {"train_loss": -7.4308342933654785, "global_step": 25627, "epoch": 152} {"train_loss": -7.309628009796143, "global_step": 25628, "epoch": 152} {"train_loss": -7.532244682312012, "global_step": 25629, "epoch": 152} {"train_loss": -7.305089950561523, "global_step": 25630, "epoch": 152} {"train_loss": -7.375152587890625, "global_step": 25631, "epoch": 152} {"train_loss": -7.497077465057373, "global_step": 25632, "epoch": 152} {"train_loss": -6.855032444000244, "global_step": 25633, "epoch": 152} {"train_loss": -7.264128684997559, "global_step": 25634, "epoch": 152} {"train_loss": -6.685070037841797, "global_step": 25635, "epoch": 152} {"train_loss": -7.330857276916504, "global_step": 25636, "epoch": 152} {"train_loss": -6.597073554992676, "global_step": 25637, "epoch": 152} {"train_loss": -7.304715156555176, "global_step": 25638, "epoch": 152} {"train_loss": -6.8299736976623535, "global_step": 25639, "epoch": 152} {"train_loss": -7.25671911239624, "global_step": 25640, "epoch": 152} {"train_loss": -6.906816482543945, "global_step": 25641, "epoch": 152} {"train_loss": -7.341297149658203, "global_step": 25642, "epoch": 152} {"train_loss": -7.255411148071289, "global_step": 25643, "epoch": 152} {"train_loss": -6.8819475173950195, "global_step": 25644, "epoch": 152} {"train_loss": -7.219151973724365, "global_step": 25645, "epoch": 152} {"train_loss": -7.122952938079834, "global_step": 25646, "epoch": 152} {"train_loss": -7.171830177307129, "global_step": 25647, "epoch": 152} {"train_loss": -7.235312461853027, "global_step": 25648, "epoch": 152} {"train_loss": -7.139368534088135, "global_step": 25649, "epoch": 152} {"train_loss": -7.2262115478515625, "global_step": 25650, "epoch": 152} {"train_loss": -7.06378173828125, "global_step": 25651, "epoch": 152} {"train_loss": -7.22318172454834, "global_step": 25652, "epoch": 152} {"train_loss": -6.8587751388549805, "global_step": 25653, "epoch": 152} {"train_loss": -7.264684677124023, "global_step": 25654, "epoch": 152} {"train_loss": -7.1026153564453125, "global_step": 25655, "epoch": 152} {"train_loss": -7.227328300476074, "global_step": 25656, "epoch": 152} {"train_loss": -7.347018241882324, "global_step": 25657, "epoch": 152} {"train_loss": -7.116189956665039, "global_step": 25658, "epoch": 152} {"train_loss": -7.27095890045166, "global_step": 25659, "epoch": 152} {"train_loss": -7.642107009887695, "global_step": 25660, "epoch": 152} {"train_loss": -7.265749931335449, "global_step": 25661, "epoch": 152} {"train_loss": -7.124699592590332, "global_step": 25662, "epoch": 152} {"train_loss": -7.27617883682251, "global_step": 25663, "epoch": 152} {"train_loss": -6.999650955200195, "global_step": 25664, "epoch": 152} {"train_loss": -6.913448333740234, "global_step": 25665, "epoch": 152} {"train_loss": -6.918012619018555, "global_step": 25666, "epoch": 152} {"train_loss": -7.134706497192383, "global_step": 25667, "epoch": 152} {"train_loss": -7.000514984130859, "global_step": 25668, "epoch": 152} {"train_loss": -7.293205261230469, "global_step": 25669, "epoch": 152} {"train_loss": -7.39476203918457, "global_step": 25670, "epoch": 152} {"train_loss": -6.888122081756592, "global_step": 25671, "epoch": 152} {"train_loss": -7.131474494934082, "global_step": 25672, "epoch": 152} {"train_loss": -6.901134014129639, "global_step": 25673, "epoch": 152} {"train_loss": -7.154059410095215, "global_step": 25674, "epoch": 152} {"train_loss": -6.942018508911133, "global_step": 25675, "epoch": 152} {"train_loss": -7.137556552886963, "global_step": 25676, "epoch": 152} {"train_loss": -7.119232177734375, "global_step": 25677, "epoch": 152} {"train_loss": -6.914746284484863, "global_step": 25678, "epoch": 152} {"train_loss": -7.187591075897217, "global_step": 25679, "epoch": 152} {"train_loss": -7.178339958190918, "global_step": 25680, "epoch": 152} {"train_loss": -7.047147750854492, "global_step": 25681, "epoch": 152} {"train_loss": -7.2481794357299805, "global_step": 25682, "epoch": 152} {"train_loss": -6.855480670928955, "global_step": 25683, "epoch": 152} {"train_loss": -7.175547122955322, "global_step": 25684, "epoch": 152} {"train_loss": -6.654539108276367, "global_step": 25685, "epoch": 152} {"train_loss": -7.142792224884033, "global_step": 25686, "epoch": 152} {"train_loss": -7.06110954284668, "global_step": 25687, "epoch": 152} {"train_loss": -7.161431312561035, "global_step": 25688, "epoch": 152} {"train_loss": -7.200658798217773, "global_step": 25689, "epoch": 152} {"train_loss": -7.112598419189453, "global_step": 25690, "epoch": 152} {"train_loss": -7.179888725280762, "global_step": 25691, "epoch": 152} {"train_loss": -7.313042163848877, "global_step": 25692, "epoch": 152} {"train_loss": -7.106599807739258, "global_step": 25693, "epoch": 152} {"train_loss": -7.182767868041992, "global_step": 25694, "epoch": 152} {"train_loss": -7.144472122192383, "global_step": 25695, "epoch": 152} {"train_loss": -7.317654609680176, "global_step": 25696, "epoch": 152} {"train_loss": -7.299013614654541, "global_step": 25697, "epoch": 152} {"train_loss": -7.392453193664551, "global_step": 25698, "epoch": 152} {"train_loss": -7.28549861907959, "global_step": 25699, "epoch": 152} {"train_loss": -7.315465450286865, "global_step": 25700, "epoch": 152} {"train_loss": -7.361408710479736, "global_step": 25701, "epoch": 152} {"train_loss": -7.209074020385742, "global_step": 25702, "epoch": 152} {"train_loss": -7.159591686157953, "global_step": 25703, "epoch": 152, "val_loss": 196878.234375} {"train_loss": -7.207841873168945, "global_step": 25704, "epoch": 153} {"train_loss": -7.195796012878418, "global_step": 25705, "epoch": 153} {"train_loss": -7.185703277587891, "global_step": 25706, "epoch": 153} {"train_loss": -7.410251617431641, "global_step": 25707, "epoch": 153} {"train_loss": -6.906293869018555, "global_step": 25708, "epoch": 153} {"train_loss": -7.117148399353027, "global_step": 25709, "epoch": 153} {"train_loss": -7.2364325523376465, "global_step": 25710, "epoch": 153} {"train_loss": -7.39113712310791, "global_step": 25711, "epoch": 153} {"train_loss": -7.092783451080322, "global_step": 25712, "epoch": 153} {"train_loss": -7.207096099853516, "global_step": 25713, "epoch": 153} {"train_loss": -7.266925811767578, "global_step": 25714, "epoch": 153} {"train_loss": -7.252188682556152, "global_step": 25715, "epoch": 153} {"train_loss": -7.188366889953613, "global_step": 25716, "epoch": 153} {"train_loss": -7.3218817710876465, "global_step": 25717, "epoch": 153} {"train_loss": -7.231779098510742, "global_step": 25718, "epoch": 153} {"train_loss": -6.847009658813477, "global_step": 25719, "epoch": 153} {"train_loss": -7.23675537109375, "global_step": 25720, "epoch": 153} {"train_loss": -6.968029975891113, "global_step": 25721, "epoch": 153} {"train_loss": -7.083063125610352, "global_step": 25722, "epoch": 153} {"train_loss": -6.952750205993652, "global_step": 25723, "epoch": 153} {"train_loss": -7.111243724822998, "global_step": 25724, "epoch": 153} {"train_loss": -7.138273239135742, "global_step": 25725, "epoch": 153} {"train_loss": -6.935303688049316, "global_step": 25726, "epoch": 153} {"train_loss": -7.036967754364014, "global_step": 25727, "epoch": 153} {"train_loss": -7.262772083282471, "global_step": 25728, "epoch": 153} {"train_loss": -7.178321838378906, "global_step": 25729, "epoch": 153} {"train_loss": -7.202561855316162, "global_step": 25730, "epoch": 153} {"train_loss": -7.328342437744141, "global_step": 25731, "epoch": 153} {"train_loss": -7.240124702453613, "global_step": 25732, "epoch": 153} {"train_loss": -7.160648345947266, "global_step": 25733, "epoch": 153} {"train_loss": -7.170966625213623, "global_step": 25734, "epoch": 153} {"train_loss": -7.156522750854492, "global_step": 25735, "epoch": 153} {"train_loss": -7.181841850280762, "global_step": 25736, "epoch": 153} {"train_loss": -7.314910411834717, "global_step": 25737, "epoch": 153} {"train_loss": -6.986742973327637, "global_step": 25738, "epoch": 153} {"train_loss": -7.2572712898254395, "global_step": 25739, "epoch": 153} {"train_loss": -6.967055797576904, "global_step": 25740, "epoch": 153} {"train_loss": -7.296975135803223, "global_step": 25741, "epoch": 153} {"train_loss": -7.310380458831787, "global_step": 25742, "epoch": 153} {"train_loss": -7.298203468322754, "global_step": 25743, "epoch": 153} {"train_loss": -7.128668785095215, "global_step": 25744, "epoch": 153} {"train_loss": -7.283916473388672, "global_step": 25745, "epoch": 153} {"train_loss": -7.430549621582031, "global_step": 25746, "epoch": 153} {"train_loss": -7.331029891967773, "global_step": 25747, "epoch": 153} {"train_loss": -7.365099906921387, "global_step": 25748, "epoch": 153} {"train_loss": -7.364875316619873, "global_step": 25749, "epoch": 153} {"train_loss": -7.405023097991943, "global_step": 25750, "epoch": 153} {"train_loss": -7.063718795776367, "global_step": 25751, "epoch": 153} {"train_loss": -7.331211090087891, "global_step": 25752, "epoch": 153} {"train_loss": -7.329952239990234, "global_step": 25753, "epoch": 153} {"train_loss": -7.230942726135254, "global_step": 25754, "epoch": 153} {"train_loss": -7.185792922973633, "global_step": 25755, "epoch": 153} {"train_loss": -7.117483139038086, "global_step": 25756, "epoch": 153} {"train_loss": -7.357152462005615, "global_step": 25757, "epoch": 153} {"train_loss": -7.4017438888549805, "global_step": 25758, "epoch": 153} {"train_loss": -7.293625831604004, "global_step": 25759, "epoch": 153} {"train_loss": -7.39061164855957, "global_step": 25760, "epoch": 153} {"train_loss": -7.262141227722168, "global_step": 25761, "epoch": 153} {"train_loss": -7.38428258895874, "global_step": 25762, "epoch": 153} {"train_loss": -7.0482378005981445, "global_step": 25763, "epoch": 153} {"train_loss": -7.1916680335998535, "global_step": 25764, "epoch": 153} {"train_loss": -6.910348892211914, "global_step": 25765, "epoch": 153} {"train_loss": -7.482224464416504, "global_step": 25766, "epoch": 153} {"train_loss": -7.215753555297852, "global_step": 25767, "epoch": 153} {"train_loss": -7.166412353515625, "global_step": 25768, "epoch": 153} {"train_loss": -7.026191711425781, "global_step": 25769, "epoch": 153} {"train_loss": -7.060441493988037, "global_step": 25770, "epoch": 153} {"train_loss": -6.916991233825684, "global_step": 25771, "epoch": 153} {"train_loss": -7.212344169616699, "global_step": 25772, "epoch": 153} {"train_loss": -7.011061191558838, "global_step": 25773, "epoch": 153} {"train_loss": -7.209351539611816, "global_step": 25774, "epoch": 153} {"train_loss": -6.916929721832275, "global_step": 25775, "epoch": 153} {"train_loss": -7.191787242889404, "global_step": 25776, "epoch": 153} {"train_loss": -7.17105770111084, "global_step": 25777, "epoch": 153} {"train_loss": -6.924277305603027, "global_step": 25778, "epoch": 153} {"train_loss": -6.960052967071533, "global_step": 25779, "epoch": 153} {"train_loss": -7.161108016967773, "global_step": 25780, "epoch": 153} {"train_loss": -6.87780237197876, "global_step": 25781, "epoch": 153} {"train_loss": -7.268407344818115, "global_step": 25782, "epoch": 153} {"train_loss": -7.147893905639648, "global_step": 25783, "epoch": 153} {"train_loss": -7.297018527984619, "global_step": 25784, "epoch": 153} {"train_loss": -7.0133957862854, "global_step": 25785, "epoch": 153} {"train_loss": -7.146567344665527, "global_step": 25786, "epoch": 153} {"train_loss": -7.090620994567871, "global_step": 25787, "epoch": 153} {"train_loss": -7.12955379486084, "global_step": 25788, "epoch": 153} {"train_loss": -7.138440132141113, "global_step": 25789, "epoch": 153} {"train_loss": -7.037968635559082, "global_step": 25790, "epoch": 153} {"train_loss": -7.318546295166016, "global_step": 25791, "epoch": 153} {"train_loss": -7.148674964904785, "global_step": 25792, "epoch": 153} {"train_loss": -7.113652229309082, "global_step": 25793, "epoch": 153} {"train_loss": -7.320575714111328, "global_step": 25794, "epoch": 153} {"train_loss": -7.282210826873779, "global_step": 25795, "epoch": 153} {"train_loss": -7.014919281005859, "global_step": 25796, "epoch": 153} {"train_loss": -7.192654609680176, "global_step": 25797, "epoch": 153} {"train_loss": -6.912540912628174, "global_step": 25798, "epoch": 153} {"train_loss": -7.176624298095703, "global_step": 25799, "epoch": 153} {"train_loss": -7.183115005493164, "global_step": 25800, "epoch": 153} {"train_loss": -7.042692184448242, "global_step": 25801, "epoch": 153} {"train_loss": -7.1873674392700195, "global_step": 25802, "epoch": 153} {"train_loss": -7.146157264709473, "global_step": 25803, "epoch": 153} {"train_loss": -7.193179130554199, "global_step": 25804, "epoch": 153} {"train_loss": -7.281829833984375, "global_step": 25805, "epoch": 153} {"train_loss": -7.165711402893066, "global_step": 25806, "epoch": 153} {"train_loss": -7.179823875427246, "global_step": 25807, "epoch": 153} {"train_loss": -7.11953592300415, "global_step": 25808, "epoch": 153} {"train_loss": -7.045160293579102, "global_step": 25809, "epoch": 153} {"train_loss": -7.098206520080566, "global_step": 25810, "epoch": 153} {"train_loss": -7.244585037231445, "global_step": 25811, "epoch": 153} {"train_loss": -7.228766441345215, "global_step": 25812, "epoch": 153} {"train_loss": -7.260711669921875, "global_step": 25813, "epoch": 153} {"train_loss": -7.367196083068848, "global_step": 25814, "epoch": 153} {"train_loss": -7.249807834625244, "global_step": 25815, "epoch": 153} {"train_loss": -7.453423500061035, "global_step": 25816, "epoch": 153} {"train_loss": -7.222019672393799, "global_step": 25817, "epoch": 153} {"train_loss": -7.250907897949219, "global_step": 25818, "epoch": 153} {"train_loss": -7.376873016357422, "global_step": 25819, "epoch": 153} {"train_loss": -7.45499849319458, "global_step": 25820, "epoch": 153} {"train_loss": -7.317309856414795, "global_step": 25821, "epoch": 153} {"train_loss": -7.084132194519043, "global_step": 25822, "epoch": 153} {"train_loss": -7.187890529632568, "global_step": 25823, "epoch": 153} {"train_loss": -7.19543981552124, "global_step": 25824, "epoch": 153} {"train_loss": -7.2521867752075195, "global_step": 25825, "epoch": 153} {"train_loss": -7.01228141784668, "global_step": 25826, "epoch": 153} {"train_loss": -7.3085174560546875, "global_step": 25827, "epoch": 153} {"train_loss": -7.257662296295166, "global_step": 25828, "epoch": 153} {"train_loss": -7.31954288482666, "global_step": 25829, "epoch": 153} {"train_loss": -7.167588233947754, "global_step": 25830, "epoch": 153} {"train_loss": -7.130739688873291, "global_step": 25831, "epoch": 153} {"train_loss": -7.062263488769531, "global_step": 25832, "epoch": 153} {"train_loss": -7.376740455627441, "global_step": 25833, "epoch": 153} {"train_loss": -7.189205169677734, "global_step": 25834, "epoch": 153} {"train_loss": -7.1948442459106445, "global_step": 25835, "epoch": 153} {"train_loss": -7.409768104553223, "global_step": 25836, "epoch": 153} {"train_loss": -7.069301605224609, "global_step": 25837, "epoch": 153} {"train_loss": -7.302717208862305, "global_step": 25838, "epoch": 153} {"train_loss": -7.13322639465332, "global_step": 25839, "epoch": 153} {"train_loss": -7.227031230926514, "global_step": 25840, "epoch": 153} {"train_loss": -7.4357709884643555, "global_step": 25841, "epoch": 153} {"train_loss": -7.397242069244385, "global_step": 25842, "epoch": 153} {"train_loss": -7.337968826293945, "global_step": 25843, "epoch": 153} {"train_loss": -7.18554162979126, "global_step": 25844, "epoch": 153} {"train_loss": -7.543338775634766, "global_step": 25845, "epoch": 153} {"train_loss": -7.184447288513184, "global_step": 25846, "epoch": 153} {"train_loss": -7.513956546783447, "global_step": 25847, "epoch": 153} {"train_loss": -7.368001937866211, "global_step": 25848, "epoch": 153} {"train_loss": -7.119877815246582, "global_step": 25849, "epoch": 153} {"train_loss": -7.251110553741455, "global_step": 25850, "epoch": 153} {"train_loss": -7.235090255737305, "global_step": 25851, "epoch": 153} {"train_loss": -7.317601680755615, "global_step": 25852, "epoch": 153} {"train_loss": -7.505257606506348, "global_step": 25853, "epoch": 153} {"train_loss": -7.226722240447998, "global_step": 25854, "epoch": 153} {"train_loss": -7.248152732849121, "global_step": 25855, "epoch": 153} {"train_loss": -7.3103532791137695, "global_step": 25856, "epoch": 153} {"train_loss": -7.370672225952148, "global_step": 25857, "epoch": 153} {"train_loss": -7.273983001708984, "global_step": 25858, "epoch": 153} {"train_loss": -7.568477630615234, "global_step": 25859, "epoch": 153} {"train_loss": -7.343174934387207, "global_step": 25860, "epoch": 153} {"train_loss": -7.296934127807617, "global_step": 25861, "epoch": 153} {"train_loss": -6.927143096923828, "global_step": 25862, "epoch": 153} {"train_loss": -7.055217266082764, "global_step": 25863, "epoch": 153} {"train_loss": -6.884597301483154, "global_step": 25864, "epoch": 153} {"train_loss": -7.087786674499512, "global_step": 25865, "epoch": 153} {"train_loss": -7.341058731079102, "global_step": 25866, "epoch": 153} {"train_loss": -7.261520862579346, "global_step": 25867, "epoch": 153} {"train_loss": -7.070672035217285, "global_step": 25868, "epoch": 153} {"train_loss": -7.374625205993652, "global_step": 25869, "epoch": 153} {"train_loss": -7.053620338439941, "global_step": 25870, "epoch": 153} {"train_loss": -7.204072083745684, "global_step": 25871, "epoch": 153, "val_loss": 197248.09375} {"train_loss": -7.228403091430664, "global_step": 25872, "epoch": 154} {"train_loss": -6.989928245544434, "global_step": 25873, "epoch": 154} {"train_loss": -7.092073440551758, "global_step": 25874, "epoch": 154} {"train_loss": -7.06346321105957, "global_step": 25875, "epoch": 154} {"train_loss": -7.038862705230713, "global_step": 25876, "epoch": 154} {"train_loss": -7.135396957397461, "global_step": 25877, "epoch": 154} {"train_loss": -7.1157708168029785, "global_step": 25878, "epoch": 154} {"train_loss": -7.070791721343994, "global_step": 25879, "epoch": 154} {"train_loss": -7.026968479156494, "global_step": 25880, "epoch": 154} {"train_loss": -7.192394256591797, "global_step": 25881, "epoch": 154} {"train_loss": -7.179011344909668, "global_step": 25882, "epoch": 154} {"train_loss": -7.240250587463379, "global_step": 25883, "epoch": 154} {"train_loss": -6.798232078552246, "global_step": 25884, "epoch": 154} {"train_loss": -6.9099016189575195, "global_step": 25885, "epoch": 154} {"train_loss": -6.896507263183594, "global_step": 25886, "epoch": 154} {"train_loss": -7.049105644226074, "global_step": 25887, "epoch": 154} {"train_loss": -7.226445198059082, "global_step": 25888, "epoch": 154} {"train_loss": -7.062772750854492, "global_step": 25889, "epoch": 154} {"train_loss": -7.190982818603516, "global_step": 25890, "epoch": 154} {"train_loss": -7.301498889923096, "global_step": 25891, "epoch": 154} {"train_loss": -7.196313858032227, "global_step": 25892, "epoch": 154} {"train_loss": -7.390743732452393, "global_step": 25893, "epoch": 154} {"train_loss": -7.157588481903076, "global_step": 25894, "epoch": 154} {"train_loss": -7.400494575500488, "global_step": 25895, "epoch": 154} {"train_loss": -7.397071838378906, "global_step": 25896, "epoch": 154} {"train_loss": -7.196257591247559, "global_step": 25897, "epoch": 154} {"train_loss": -7.0834574699401855, "global_step": 25898, "epoch": 154} {"train_loss": -7.155665397644043, "global_step": 25899, "epoch": 154} {"train_loss": -7.166102409362793, "global_step": 25900, "epoch": 154} {"train_loss": -7.184162139892578, "global_step": 25901, "epoch": 154} {"train_loss": -7.476746559143066, "global_step": 25902, "epoch": 154} {"train_loss": -7.265052795410156, "global_step": 25903, "epoch": 154} {"train_loss": -6.993623733520508, "global_step": 25904, "epoch": 154} {"train_loss": -7.200356483459473, "global_step": 25905, "epoch": 154} {"train_loss": -7.35465145111084, "global_step": 25906, "epoch": 154} {"train_loss": -7.291443824768066, "global_step": 25907, "epoch": 154} {"train_loss": -7.361056327819824, "global_step": 25908, "epoch": 154} {"train_loss": -7.141269683837891, "global_step": 25909, "epoch": 154} {"train_loss": -7.217473030090332, "global_step": 25910, "epoch": 154} {"train_loss": -7.014523506164551, "global_step": 25911, "epoch": 154} {"train_loss": -7.374430179595947, "global_step": 25912, "epoch": 154} {"train_loss": -7.256561279296875, "global_step": 25913, "epoch": 154} {"train_loss": -7.49708366394043, "global_step": 25914, "epoch": 154} {"train_loss": -7.173979759216309, "global_step": 25915, "epoch": 154} {"train_loss": -7.228677749633789, "global_step": 25916, "epoch": 154} {"train_loss": -7.310300827026367, "global_step": 25917, "epoch": 154} {"train_loss": -7.40036153793335, "global_step": 25918, "epoch": 154} {"train_loss": -7.305580139160156, "global_step": 25919, "epoch": 154} {"train_loss": -7.381443977355957, "global_step": 25920, "epoch": 154} {"train_loss": -7.263018608093262, "global_step": 25921, "epoch": 154} {"train_loss": -7.228843688964844, "global_step": 25922, "epoch": 154} {"train_loss": -7.331088542938232, "global_step": 25923, "epoch": 154} {"train_loss": -7.351164817810059, "global_step": 25924, "epoch": 154} {"train_loss": -7.202559471130371, "global_step": 25925, "epoch": 154} {"train_loss": -7.245722770690918, "global_step": 25926, "epoch": 154} {"train_loss": -7.273548603057861, "global_step": 25927, "epoch": 154} {"train_loss": -7.134373188018799, "global_step": 25928, "epoch": 154} {"train_loss": -7.345049858093262, "global_step": 25929, "epoch": 154} {"train_loss": -7.2368974685668945, "global_step": 25930, "epoch": 154} {"train_loss": -7.317052841186523, "global_step": 25931, "epoch": 154} {"train_loss": -7.182302951812744, "global_step": 25932, "epoch": 154} {"train_loss": -7.261271953582764, "global_step": 25933, "epoch": 154} {"train_loss": -7.1916937828063965, "global_step": 25934, "epoch": 154} {"train_loss": -7.268325328826904, "global_step": 25935, "epoch": 154} {"train_loss": -7.105502605438232, "global_step": 25936, "epoch": 154} {"train_loss": -7.251309871673584, "global_step": 25937, "epoch": 154} {"train_loss": -7.091615200042725, "global_step": 25938, "epoch": 154} {"train_loss": -7.177665710449219, "global_step": 25939, "epoch": 154} {"train_loss": -7.157591819763184, "global_step": 25940, "epoch": 154} {"train_loss": -7.034280300140381, "global_step": 25941, "epoch": 154} {"train_loss": -7.214400291442871, "global_step": 25942, "epoch": 154} {"train_loss": -7.146381855010986, "global_step": 25943, "epoch": 154} {"train_loss": -7.045382499694824, "global_step": 25944, "epoch": 154} {"train_loss": -7.105357646942139, "global_step": 25945, "epoch": 154} {"train_loss": -6.913193702697754, "global_step": 25946, "epoch": 154} {"train_loss": -7.189313888549805, "global_step": 25947, "epoch": 154} {"train_loss": -7.2260003089904785, "global_step": 25948, "epoch": 154} {"train_loss": -7.237414360046387, "global_step": 25949, "epoch": 154} {"train_loss": -7.30744743347168, "global_step": 25950, "epoch": 154} {"train_loss": -7.092462062835693, "global_step": 25951, "epoch": 154} {"train_loss": -7.137086868286133, "global_step": 25952, "epoch": 154} {"train_loss": -7.264604091644287, "global_step": 25953, "epoch": 154} {"train_loss": -7.317131996154785, "global_step": 25954, "epoch": 154} {"train_loss": -7.326594829559326, "global_step": 25955, "epoch": 154} {"train_loss": -7.12391996383667, "global_step": 25956, "epoch": 154} {"train_loss": -7.159086227416992, "global_step": 25957, "epoch": 154} {"train_loss": -7.054106712341309, "global_step": 25958, "epoch": 154} {"train_loss": -7.32216215133667, "global_step": 25959, "epoch": 154} {"train_loss": -7.353339195251465, "global_step": 25960, "epoch": 154} {"train_loss": -7.082835674285889, "global_step": 25961, "epoch": 154} {"train_loss": -7.050084114074707, "global_step": 25962, "epoch": 154} {"train_loss": -7.152401924133301, "global_step": 25963, "epoch": 154} {"train_loss": -7.338257789611816, "global_step": 25964, "epoch": 154} {"train_loss": -7.409966468811035, "global_step": 25965, "epoch": 154} {"train_loss": -7.304814338684082, "global_step": 25966, "epoch": 154} {"train_loss": -6.9382219314575195, "global_step": 25967, "epoch": 154} {"train_loss": -7.225113868713379, "global_step": 25968, "epoch": 154} {"train_loss": -7.107190132141113, "global_step": 25969, "epoch": 154} {"train_loss": -7.251621246337891, "global_step": 25970, "epoch": 154} {"train_loss": -7.193387031555176, "global_step": 25971, "epoch": 154} {"train_loss": -6.887416839599609, "global_step": 25972, "epoch": 154} {"train_loss": -7.0829572677612305, "global_step": 25973, "epoch": 154} {"train_loss": -7.175761699676514, "global_step": 25974, "epoch": 154} {"train_loss": -7.192202568054199, "global_step": 25975, "epoch": 154} {"train_loss": -7.209630966186523, "global_step": 25976, "epoch": 154} {"train_loss": -7.039821147918701, "global_step": 25977, "epoch": 154} {"train_loss": -7.200689315795898, "global_step": 25978, "epoch": 154} {"train_loss": -7.064183235168457, "global_step": 25979, "epoch": 154} {"train_loss": -6.950072288513184, "global_step": 25980, "epoch": 154} {"train_loss": -7.012420654296875, "global_step": 25981, "epoch": 154} {"train_loss": -7.329507827758789, "global_step": 25982, "epoch": 154} {"train_loss": -6.880807399749756, "global_step": 25983, "epoch": 154} {"train_loss": -7.116833209991455, "global_step": 25984, "epoch": 154} {"train_loss": -7.08659553527832, "global_step": 25985, "epoch": 154} {"train_loss": -7.228856086730957, "global_step": 25986, "epoch": 154} {"train_loss": -7.342498779296875, "global_step": 25987, "epoch": 154} {"train_loss": -7.165345191955566, "global_step": 25988, "epoch": 154} {"train_loss": -7.520390510559082, "global_step": 25989, "epoch": 154} {"train_loss": -7.292630195617676, "global_step": 25990, "epoch": 154} {"train_loss": -7.265410423278809, "global_step": 25991, "epoch": 154} {"train_loss": -7.309778213500977, "global_step": 25992, "epoch": 154} {"train_loss": -7.51348352432251, "global_step": 25993, "epoch": 154} {"train_loss": -7.420168876647949, "global_step": 25994, "epoch": 154} {"train_loss": -7.376721382141113, "global_step": 25995, "epoch": 154} {"train_loss": -7.490649700164795, "global_step": 25996, "epoch": 154} {"train_loss": -7.260799407958984, "global_step": 25997, "epoch": 154} {"train_loss": -6.991628170013428, "global_step": 25998, "epoch": 154} {"train_loss": -7.100384712219238, "global_step": 25999, "epoch": 154} {"train_loss": -7.100056171417236, "global_step": 26000, "epoch": 154} {"train_loss": -6.930911064147949, "global_step": 26001, "epoch": 154} {"train_loss": -6.855997562408447, "global_step": 26002, "epoch": 154} {"train_loss": -6.951051712036133, "global_step": 26003, "epoch": 154} {"train_loss": -7.165184020996094, "global_step": 26004, "epoch": 154} {"train_loss": -7.04481315612793, "global_step": 26005, "epoch": 154} {"train_loss": -6.91568660736084, "global_step": 26006, "epoch": 154} {"train_loss": -7.047501087188721, "global_step": 26007, "epoch": 154} {"train_loss": -7.10529899597168, "global_step": 26008, "epoch": 154} {"train_loss": -7.150417327880859, "global_step": 26009, "epoch": 154} {"train_loss": -7.093900680541992, "global_step": 26010, "epoch": 154} {"train_loss": -7.13025426864624, "global_step": 26011, "epoch": 154} {"train_loss": -7.075536727905273, "global_step": 26012, "epoch": 154} {"train_loss": -7.076102256774902, "global_step": 26013, "epoch": 154} {"train_loss": -7.246039390563965, "global_step": 26014, "epoch": 154} {"train_loss": -7.283379077911377, "global_step": 26015, "epoch": 154} {"train_loss": -7.363271713256836, "global_step": 26016, "epoch": 154} {"train_loss": -7.280994415283203, "global_step": 26017, "epoch": 154} {"train_loss": -7.199314594268799, "global_step": 26018, "epoch": 154} {"train_loss": -7.051853179931641, "global_step": 26019, "epoch": 154} {"train_loss": -7.252305030822754, "global_step": 26020, "epoch": 154} {"train_loss": -7.3418731689453125, "global_step": 26021, "epoch": 154} {"train_loss": -7.252424240112305, "global_step": 26022, "epoch": 154} {"train_loss": -7.246955394744873, "global_step": 26023, "epoch": 154} {"train_loss": -7.418424129486084, "global_step": 26024, "epoch": 154} {"train_loss": -7.351327896118164, "global_step": 26025, "epoch": 154} {"train_loss": -7.217902183532715, "global_step": 26026, "epoch": 154} {"train_loss": -7.568833827972412, "global_step": 26027, "epoch": 154} {"train_loss": -7.1352081298828125, "global_step": 26028, "epoch": 154} {"train_loss": -7.079038619995117, "global_step": 26029, "epoch": 154} {"train_loss": -7.246811866760254, "global_step": 26030, "epoch": 154} {"train_loss": -7.449377059936523, "global_step": 26031, "epoch": 154} {"train_loss": -7.381956577301025, "global_step": 26032, "epoch": 154} {"train_loss": -7.359073162078857, "global_step": 26033, "epoch": 154} {"train_loss": -7.214015960693359, "global_step": 26034, "epoch": 154} {"train_loss": -7.181344509124756, "global_step": 26035, "epoch": 154} {"train_loss": -7.342567443847656, "global_step": 26036, "epoch": 154} {"train_loss": -7.4375715255737305, "global_step": 26037, "epoch": 154} {"train_loss": -7.34030818939209, "global_step": 26038, "epoch": 154} {"train_loss": -7.200972381092253, "global_step": 26039, "epoch": 154, "val_loss": 198385.578125} {"train_loss": -7.2769927978515625, "global_step": 26040, "epoch": 155} {"train_loss": -7.312847137451172, "global_step": 26041, "epoch": 155} {"train_loss": -7.268575191497803, "global_step": 26042, "epoch": 155} {"train_loss": -7.328948020935059, "global_step": 26043, "epoch": 155} {"train_loss": -7.584561347961426, "global_step": 26044, "epoch": 155} {"train_loss": -7.476324081420898, "global_step": 26045, "epoch": 155} {"train_loss": -7.346095085144043, "global_step": 26046, "epoch": 155} {"train_loss": -7.268460273742676, "global_step": 26047, "epoch": 155} {"train_loss": -7.335500240325928, "global_step": 26048, "epoch": 155} {"train_loss": -7.244588375091553, "global_step": 26049, "epoch": 155} {"train_loss": -7.135978698730469, "global_step": 26050, "epoch": 155} {"train_loss": -7.467960834503174, "global_step": 26051, "epoch": 155} {"train_loss": -7.467156410217285, "global_step": 26052, "epoch": 155} {"train_loss": -7.223675727844238, "global_step": 26053, "epoch": 155} {"train_loss": -7.267983436584473, "global_step": 26054, "epoch": 155} {"train_loss": -7.122560501098633, "global_step": 26055, "epoch": 155} {"train_loss": -7.30872106552124, "global_step": 26056, "epoch": 155} {"train_loss": -7.174726486206055, "global_step": 26057, "epoch": 155} {"train_loss": -7.286680698394775, "global_step": 26058, "epoch": 155} {"train_loss": -7.305173397064209, "global_step": 26059, "epoch": 155} {"train_loss": -7.1408843994140625, "global_step": 26060, "epoch": 155} {"train_loss": -7.30494499206543, "global_step": 26061, "epoch": 155} {"train_loss": -7.46018648147583, "global_step": 26062, "epoch": 155} {"train_loss": -7.164637565612793, "global_step": 26063, "epoch": 155} {"train_loss": -7.351753234863281, "global_step": 26064, "epoch": 155} {"train_loss": -7.468387126922607, "global_step": 26065, "epoch": 155} {"train_loss": -7.441479682922363, "global_step": 26066, "epoch": 155} {"train_loss": -7.336295127868652, "global_step": 26067, "epoch": 155} {"train_loss": -7.397064685821533, "global_step": 26068, "epoch": 155} {"train_loss": -7.1596479415893555, "global_step": 26069, "epoch": 155} {"train_loss": -7.285891532897949, "global_step": 26070, "epoch": 155} {"train_loss": -7.518977165222168, "global_step": 26071, "epoch": 155} {"train_loss": -7.157607078552246, "global_step": 26072, "epoch": 155} {"train_loss": -7.3274712562561035, "global_step": 26073, "epoch": 155} {"train_loss": -7.301469802856445, "global_step": 26074, "epoch": 155} {"train_loss": -7.356082916259766, "global_step": 26075, "epoch": 155} {"train_loss": -7.139468669891357, "global_step": 26076, "epoch": 155} {"train_loss": -7.387811660766602, "global_step": 26077, "epoch": 155} {"train_loss": -7.211040496826172, "global_step": 26078, "epoch": 155} {"train_loss": -7.1568403244018555, "global_step": 26079, "epoch": 155} {"train_loss": -7.309822082519531, "global_step": 26080, "epoch": 155} {"train_loss": -6.968514919281006, "global_step": 26081, "epoch": 155} {"train_loss": -7.105190277099609, "global_step": 26082, "epoch": 155} {"train_loss": -6.641717910766602, "global_step": 26083, "epoch": 155} {"train_loss": -6.9401350021362305, "global_step": 26084, "epoch": 155} {"train_loss": -6.8559651374816895, "global_step": 26085, "epoch": 155} {"train_loss": -7.193071365356445, "global_step": 26086, "epoch": 155} {"train_loss": -7.120091438293457, "global_step": 26087, "epoch": 155} {"train_loss": -7.308967113494873, "global_step": 26088, "epoch": 155} {"train_loss": -7.252082824707031, "global_step": 26089, "epoch": 155} {"train_loss": -7.032349586486816, "global_step": 26090, "epoch": 155} {"train_loss": -7.103151321411133, "global_step": 26091, "epoch": 155} {"train_loss": -7.032859802246094, "global_step": 26092, "epoch": 155} {"train_loss": -7.124980926513672, "global_step": 26093, "epoch": 155} {"train_loss": -7.1515913009643555, "global_step": 26094, "epoch": 155} {"train_loss": -7.056231498718262, "global_step": 26095, "epoch": 155} {"train_loss": -7.203344821929932, "global_step": 26096, "epoch": 155} {"train_loss": -7.0381903648376465, "global_step": 26097, "epoch": 155} {"train_loss": -7.2220354080200195, "global_step": 26098, "epoch": 155} {"train_loss": -7.338393211364746, "global_step": 26099, "epoch": 155} {"train_loss": -7.216006755828857, "global_step": 26100, "epoch": 155} {"train_loss": -7.223176002502441, "global_step": 26101, "epoch": 155} {"train_loss": -7.191987037658691, "global_step": 26102, "epoch": 155} {"train_loss": -7.321359634399414, "global_step": 26103, "epoch": 155} {"train_loss": -7.187858581542969, "global_step": 26104, "epoch": 155} {"train_loss": -7.395652770996094, "global_step": 26105, "epoch": 155} {"train_loss": -7.285978317260742, "global_step": 26106, "epoch": 155} {"train_loss": -7.134149074554443, "global_step": 26107, "epoch": 155} {"train_loss": -7.359323024749756, "global_step": 26108, "epoch": 155} {"train_loss": -7.19635009765625, "global_step": 26109, "epoch": 155} {"train_loss": -7.1897430419921875, "global_step": 26110, "epoch": 155} {"train_loss": -7.34152889251709, "global_step": 26111, "epoch": 155} {"train_loss": -7.211429595947266, "global_step": 26112, "epoch": 155} {"train_loss": -7.3458147048950195, "global_step": 26113, "epoch": 155} {"train_loss": -7.415593147277832, "global_step": 26114, "epoch": 155} {"train_loss": -7.195874214172363, "global_step": 26115, "epoch": 155} {"train_loss": -7.273014068603516, "global_step": 26116, "epoch": 155} {"train_loss": -7.349959373474121, "global_step": 26117, "epoch": 155} {"train_loss": -7.157764434814453, "global_step": 26118, "epoch": 155} {"train_loss": -7.0286149978637695, "global_step": 26119, "epoch": 155} {"train_loss": -6.974152088165283, "global_step": 26120, "epoch": 155} {"train_loss": -7.196840763092041, "global_step": 26121, "epoch": 155} {"train_loss": -7.296237945556641, "global_step": 26122, "epoch": 155} {"train_loss": -7.277509689331055, "global_step": 26123, "epoch": 155} {"train_loss": -6.947068214416504, "global_step": 26124, "epoch": 155} {"train_loss": -7.131258010864258, "global_step": 26125, "epoch": 155} {"train_loss": -7.221094131469727, "global_step": 26126, "epoch": 155} {"train_loss": -7.1418843269348145, "global_step": 26127, "epoch": 155} {"train_loss": -7.020844459533691, "global_step": 26128, "epoch": 155} {"train_loss": -7.258163928985596, "global_step": 26129, "epoch": 155} {"train_loss": -7.219769477844238, "global_step": 26130, "epoch": 155} {"train_loss": -6.864932537078857, "global_step": 26131, "epoch": 155} {"train_loss": -7.1439208984375, "global_step": 26132, "epoch": 155} {"train_loss": -6.954954147338867, "global_step": 26133, "epoch": 155} {"train_loss": -6.91298246383667, "global_step": 26134, "epoch": 155} {"train_loss": -7.008902072906494, "global_step": 26135, "epoch": 155} {"train_loss": -7.0706377029418945, "global_step": 26136, "epoch": 155} {"train_loss": -7.078980922698975, "global_step": 26137, "epoch": 155} {"train_loss": -7.246914863586426, "global_step": 26138, "epoch": 155} {"train_loss": -7.147253036499023, "global_step": 26139, "epoch": 155} {"train_loss": -7.194772243499756, "global_step": 26140, "epoch": 155} {"train_loss": -7.053555488586426, "global_step": 26141, "epoch": 155} {"train_loss": -7.244644641876221, "global_step": 26142, "epoch": 155} {"train_loss": -7.074084281921387, "global_step": 26143, "epoch": 155} {"train_loss": -6.780879020690918, "global_step": 26144, "epoch": 155} {"train_loss": -7.131720066070557, "global_step": 26145, "epoch": 155} {"train_loss": -7.206361770629883, "global_step": 26146, "epoch": 155} {"train_loss": -7.214435577392578, "global_step": 26147, "epoch": 155} {"train_loss": -7.209089279174805, "global_step": 26148, "epoch": 155} {"train_loss": -7.307936191558838, "global_step": 26149, "epoch": 155} {"train_loss": -7.287346363067627, "global_step": 26150, "epoch": 155} {"train_loss": -7.288185119628906, "global_step": 26151, "epoch": 155} {"train_loss": -7.444027423858643, "global_step": 26152, "epoch": 155} {"train_loss": -7.119086742401123, "global_step": 26153, "epoch": 155} {"train_loss": -7.400218963623047, "global_step": 26154, "epoch": 155} {"train_loss": -7.192017555236816, "global_step": 26155, "epoch": 155} {"train_loss": -7.269284725189209, "global_step": 26156, "epoch": 155} {"train_loss": -7.215949058532715, "global_step": 26157, "epoch": 155} {"train_loss": -7.4124040603637695, "global_step": 26158, "epoch": 155} {"train_loss": -6.952022552490234, "global_step": 26159, "epoch": 155} {"train_loss": -7.530762672424316, "global_step": 26160, "epoch": 155} {"train_loss": -7.107666969299316, "global_step": 26161, "epoch": 155} {"train_loss": -7.144436836242676, "global_step": 26162, "epoch": 155} {"train_loss": -7.18520975112915, "global_step": 26163, "epoch": 155} {"train_loss": -7.16710090637207, "global_step": 26164, "epoch": 155} {"train_loss": -7.181315898895264, "global_step": 26165, "epoch": 155} {"train_loss": -7.324951171875, "global_step": 26166, "epoch": 155} {"train_loss": -7.349861145019531, "global_step": 26167, "epoch": 155} {"train_loss": -7.168497085571289, "global_step": 26168, "epoch": 155} {"train_loss": -7.394136428833008, "global_step": 26169, "epoch": 155} {"train_loss": -7.475997447967529, "global_step": 26170, "epoch": 155} {"train_loss": -7.053616046905518, "global_step": 26171, "epoch": 155} {"train_loss": -7.106381416320801, "global_step": 26172, "epoch": 155} {"train_loss": -7.343791961669922, "global_step": 26173, "epoch": 155} {"train_loss": -7.134267807006836, "global_step": 26174, "epoch": 155} {"train_loss": -7.381721496582031, "global_step": 26175, "epoch": 155} {"train_loss": -7.37993860244751, "global_step": 26176, "epoch": 155} {"train_loss": -7.135329723358154, "global_step": 26177, "epoch": 155} {"train_loss": -7.473398208618164, "global_step": 26178, "epoch": 155} {"train_loss": -6.93954610824585, "global_step": 26179, "epoch": 155} {"train_loss": -7.280270576477051, "global_step": 26180, "epoch": 155} {"train_loss": -6.9932451248168945, "global_step": 26181, "epoch": 155} {"train_loss": -7.070236682891846, "global_step": 26182, "epoch": 155} {"train_loss": -7.2261834144592285, "global_step": 26183, "epoch": 155} {"train_loss": -7.33012056350708, "global_step": 26184, "epoch": 155} {"train_loss": -7.180957794189453, "global_step": 26185, "epoch": 155} {"train_loss": -6.850574493408203, "global_step": 26186, "epoch": 155} {"train_loss": -6.948718070983887, "global_step": 26187, "epoch": 155} {"train_loss": -7.168216228485107, "global_step": 26188, "epoch": 155} {"train_loss": -7.298750877380371, "global_step": 26189, "epoch": 155} {"train_loss": -7.080044746398926, "global_step": 26190, "epoch": 155} {"train_loss": -7.206147193908691, "global_step": 26191, "epoch": 155} {"train_loss": -7.188615798950195, "global_step": 26192, "epoch": 155} {"train_loss": -7.23622989654541, "global_step": 26193, "epoch": 155} {"train_loss": -7.282561302185059, "global_step": 26194, "epoch": 155} {"train_loss": -7.042241096496582, "global_step": 26195, "epoch": 155} {"train_loss": -7.132861137390137, "global_step": 26196, "epoch": 155} {"train_loss": -6.887256622314453, "global_step": 26197, "epoch": 155} {"train_loss": -7.167738437652588, "global_step": 26198, "epoch": 155} {"train_loss": -7.126330375671387, "global_step": 26199, "epoch": 155} {"train_loss": -7.340181350708008, "global_step": 26200, "epoch": 155} {"train_loss": -6.982682228088379, "global_step": 26201, "epoch": 155} {"train_loss": -7.095999717712402, "global_step": 26202, "epoch": 155} {"train_loss": -7.022317886352539, "global_step": 26203, "epoch": 155} {"train_loss": -7.061105251312256, "global_step": 26204, "epoch": 155} {"train_loss": -6.988422870635986, "global_step": 26205, "epoch": 155} {"train_loss": -7.264532089233398, "global_step": 26206, "epoch": 155} {"train_loss": -7.2033105691274, "global_step": 26207, "epoch": 155, "val_loss": 195922.96875, "train_action_mse_error": 20.656375885009766} {"train_loss": -7.060744285583496, "global_step": 26208, "epoch": 156} {"train_loss": -7.308219909667969, "global_step": 26209, "epoch": 156} {"train_loss": -7.314172744750977, "global_step": 26210, "epoch": 156} {"train_loss": -7.266503810882568, "global_step": 26211, "epoch": 156} {"train_loss": -7.198459148406982, "global_step": 26212, "epoch": 156} {"train_loss": -7.391221046447754, "global_step": 26213, "epoch": 156} {"train_loss": -7.321658134460449, "global_step": 26214, "epoch": 156} {"train_loss": -7.072764873504639, "global_step": 26215, "epoch": 156} {"train_loss": -6.891414165496826, "global_step": 26216, "epoch": 156} {"train_loss": -7.444642066955566, "global_step": 26217, "epoch": 156} {"train_loss": -7.035330772399902, "global_step": 26218, "epoch": 156} {"train_loss": -7.179628372192383, "global_step": 26219, "epoch": 156} {"train_loss": -7.1627044677734375, "global_step": 26220, "epoch": 156} {"train_loss": -7.172629356384277, "global_step": 26221, "epoch": 156} {"train_loss": -7.456238746643066, "global_step": 26222, "epoch": 156} {"train_loss": -7.384528160095215, "global_step": 26223, "epoch": 156} {"train_loss": -7.425787925720215, "global_step": 26224, "epoch": 156} {"train_loss": -7.315336227416992, "global_step": 26225, "epoch": 156} {"train_loss": -7.266945838928223, "global_step": 26226, "epoch": 156} {"train_loss": -7.351539611816406, "global_step": 26227, "epoch": 156} {"train_loss": -7.231686592102051, "global_step": 26228, "epoch": 156} {"train_loss": -7.255692481994629, "global_step": 26229, "epoch": 156} {"train_loss": -7.336773872375488, "global_step": 26230, "epoch": 156} {"train_loss": -7.247329235076904, "global_step": 26231, "epoch": 156} {"train_loss": -7.320530891418457, "global_step": 26232, "epoch": 156} {"train_loss": -7.523188591003418, "global_step": 26233, "epoch": 156} {"train_loss": -7.235097408294678, "global_step": 26234, "epoch": 156} {"train_loss": -7.50353479385376, "global_step": 26235, "epoch": 156} {"train_loss": -7.547924995422363, "global_step": 26236, "epoch": 156} {"train_loss": -7.1747026443481445, "global_step": 26237, "epoch": 156} {"train_loss": -7.394796371459961, "global_step": 26238, "epoch": 156} {"train_loss": -7.154812335968018, "global_step": 26239, "epoch": 156} {"train_loss": -7.366812229156494, "global_step": 26240, "epoch": 156} {"train_loss": -7.156666278839111, "global_step": 26241, "epoch": 156} {"train_loss": -7.512129306793213, "global_step": 26242, "epoch": 156} {"train_loss": -7.245146751403809, "global_step": 26243, "epoch": 156} {"train_loss": -7.516781806945801, "global_step": 26244, "epoch": 156} {"train_loss": -7.252669334411621, "global_step": 26245, "epoch": 156} {"train_loss": -6.8967084884643555, "global_step": 26246, "epoch": 156} {"train_loss": -7.154261589050293, "global_step": 26247, "epoch": 156} {"train_loss": -7.102940082550049, "global_step": 26248, "epoch": 156} {"train_loss": -7.26414680480957, "global_step": 26249, "epoch": 156} {"train_loss": -7.117298126220703, "global_step": 26250, "epoch": 156} {"train_loss": -7.088640213012695, "global_step": 26251, "epoch": 156} {"train_loss": -7.298862934112549, "global_step": 26252, "epoch": 156} {"train_loss": -7.237349510192871, "global_step": 26253, "epoch": 156} {"train_loss": -7.2692155838012695, "global_step": 26254, "epoch": 156} {"train_loss": -7.391181468963623, "global_step": 26255, "epoch": 156} {"train_loss": -7.315489292144775, "global_step": 26256, "epoch": 156} {"train_loss": -7.349993705749512, "global_step": 26257, "epoch": 156} {"train_loss": -7.4486002922058105, "global_step": 26258, "epoch": 156} {"train_loss": -7.213615894317627, "global_step": 26259, "epoch": 156} {"train_loss": -7.13358211517334, "global_step": 26260, "epoch": 156} {"train_loss": -7.061225891113281, "global_step": 26261, "epoch": 156} {"train_loss": -7.255687236785889, "global_step": 26262, "epoch": 156} {"train_loss": -7.014045715332031, "global_step": 26263, "epoch": 156} {"train_loss": -7.226614952087402, "global_step": 26264, "epoch": 156} {"train_loss": -7.106107711791992, "global_step": 26265, "epoch": 156} {"train_loss": -7.133687973022461, "global_step": 26266, "epoch": 156} {"train_loss": -7.205238342285156, "global_step": 26267, "epoch": 156} {"train_loss": -7.4682207107543945, "global_step": 26268, "epoch": 156} {"train_loss": -7.240318298339844, "global_step": 26269, "epoch": 156} {"train_loss": -6.995927810668945, "global_step": 26270, "epoch": 156} {"train_loss": -7.364434242248535, "global_step": 26271, "epoch": 156} {"train_loss": -7.3717546463012695, "global_step": 26272, "epoch": 156} {"train_loss": -7.1510090827941895, "global_step": 26273, "epoch": 156} {"train_loss": -7.3030219078063965, "global_step": 26274, "epoch": 156} {"train_loss": -7.2533979415893555, "global_step": 26275, "epoch": 156} {"train_loss": -7.0687761306762695, "global_step": 26276, "epoch": 156} {"train_loss": -7.410741806030273, "global_step": 26277, "epoch": 156} {"train_loss": -7.131494998931885, "global_step": 26278, "epoch": 156} {"train_loss": -7.326162338256836, "global_step": 26279, "epoch": 156} {"train_loss": -7.1786699295043945, "global_step": 26280, "epoch": 156} {"train_loss": -7.43754243850708, "global_step": 26281, "epoch": 156} {"train_loss": -7.373568534851074, "global_step": 26282, "epoch": 156} {"train_loss": -7.335412979125977, "global_step": 26283, "epoch": 156} {"train_loss": -7.350963115692139, "global_step": 26284, "epoch": 156} {"train_loss": -7.450571060180664, "global_step": 26285, "epoch": 156} {"train_loss": -7.0296630859375, "global_step": 26286, "epoch": 156} {"train_loss": -7.023310661315918, "global_step": 26287, "epoch": 156} {"train_loss": -7.056110858917236, "global_step": 26288, "epoch": 156} {"train_loss": -7.364112854003906, "global_step": 26289, "epoch": 156} {"train_loss": -7.182304382324219, "global_step": 26290, "epoch": 156} {"train_loss": -7.359865188598633, "global_step": 26291, "epoch": 156} {"train_loss": -7.2403483390808105, "global_step": 26292, "epoch": 156} {"train_loss": -7.402037143707275, "global_step": 26293, "epoch": 156} {"train_loss": -7.098746299743652, "global_step": 26294, "epoch": 156} {"train_loss": -7.307668685913086, "global_step": 26295, "epoch": 156} {"train_loss": -6.947517395019531, "global_step": 26296, "epoch": 156} {"train_loss": -7.367291450500488, "global_step": 26297, "epoch": 156} {"train_loss": -7.0921807289123535, "global_step": 26298, "epoch": 156} {"train_loss": -7.066335678100586, "global_step": 26299, "epoch": 156} {"train_loss": -6.991793632507324, "global_step": 26300, "epoch": 156} {"train_loss": -6.816625595092773, "global_step": 26301, "epoch": 156} {"train_loss": -6.9509172439575195, "global_step": 26302, "epoch": 156} {"train_loss": -6.558032035827637, "global_step": 26303, "epoch": 156} {"train_loss": -7.121513366699219, "global_step": 26304, "epoch": 156} {"train_loss": -6.978690147399902, "global_step": 26305, "epoch": 156} {"train_loss": -7.104550361633301, "global_step": 26306, "epoch": 156} {"train_loss": -7.175807476043701, "global_step": 26307, "epoch": 156} {"train_loss": -7.209395885467529, "global_step": 26308, "epoch": 156} {"train_loss": -6.988061428070068, "global_step": 26309, "epoch": 156} {"train_loss": -7.3292999267578125, "global_step": 26310, "epoch": 156} {"train_loss": -7.088922500610352, "global_step": 26311, "epoch": 156} {"train_loss": -7.215485572814941, "global_step": 26312, "epoch": 156} {"train_loss": -7.1594085693359375, "global_step": 26313, "epoch": 156} {"train_loss": -7.081422805786133, "global_step": 26314, "epoch": 156} {"train_loss": -7.110108375549316, "global_step": 26315, "epoch": 156} {"train_loss": -7.175641059875488, "global_step": 26316, "epoch": 156} {"train_loss": -7.4477386474609375, "global_step": 26317, "epoch": 156} {"train_loss": -7.261706352233887, "global_step": 26318, "epoch": 156} {"train_loss": -7.475164890289307, "global_step": 26319, "epoch": 156} {"train_loss": -7.120970249176025, "global_step": 26320, "epoch": 156} {"train_loss": -7.134304046630859, "global_step": 26321, "epoch": 156} {"train_loss": -7.280540466308594, "global_step": 26322, "epoch": 156} {"train_loss": -7.211461067199707, "global_step": 26323, "epoch": 156} {"train_loss": -7.518054962158203, "global_step": 26324, "epoch": 156} {"train_loss": -7.377185344696045, "global_step": 26325, "epoch": 156} {"train_loss": -7.201985836029053, "global_step": 26326, "epoch": 156} {"train_loss": -7.147975921630859, "global_step": 26327, "epoch": 156} {"train_loss": -7.369247913360596, "global_step": 26328, "epoch": 156} {"train_loss": -7.458658218383789, "global_step": 26329, "epoch": 156} {"train_loss": -7.384333610534668, "global_step": 26330, "epoch": 156} {"train_loss": -7.395810604095459, "global_step": 26331, "epoch": 156} {"train_loss": -7.3057026863098145, "global_step": 26332, "epoch": 156} {"train_loss": -7.543135643005371, "global_step": 26333, "epoch": 156} {"train_loss": -7.309475421905518, "global_step": 26334, "epoch": 156} {"train_loss": -7.4521965980529785, "global_step": 26335, "epoch": 156} {"train_loss": -7.401531219482422, "global_step": 26336, "epoch": 156} {"train_loss": -7.266714096069336, "global_step": 26337, "epoch": 156} {"train_loss": -7.196799278259277, "global_step": 26338, "epoch": 156} {"train_loss": -7.288205146789551, "global_step": 26339, "epoch": 156} {"train_loss": -7.061598300933838, "global_step": 26340, "epoch": 156} {"train_loss": -7.063189506530762, "global_step": 26341, "epoch": 156} {"train_loss": -6.68022346496582, "global_step": 26342, "epoch": 156} {"train_loss": -7.245845317840576, "global_step": 26343, "epoch": 156} {"train_loss": -6.952857494354248, "global_step": 26344, "epoch": 156} {"train_loss": -7.273580551147461, "global_step": 26345, "epoch": 156} {"train_loss": -7.208499908447266, "global_step": 26346, "epoch": 156} {"train_loss": -7.108112335205078, "global_step": 26347, "epoch": 156} {"train_loss": -7.077156066894531, "global_step": 26348, "epoch": 156} {"train_loss": -7.195000648498535, "global_step": 26349, "epoch": 156} {"train_loss": -7.041014671325684, "global_step": 26350, "epoch": 156} {"train_loss": -6.919122695922852, "global_step": 26351, "epoch": 156} {"train_loss": -7.119010925292969, "global_step": 26352, "epoch": 156} {"train_loss": -7.033040523529053, "global_step": 26353, "epoch": 156} {"train_loss": -7.066829681396484, "global_step": 26354, "epoch": 156} {"train_loss": -7.040616512298584, "global_step": 26355, "epoch": 156} {"train_loss": -7.160616874694824, "global_step": 26356, "epoch": 156} {"train_loss": -7.0900373458862305, "global_step": 26357, "epoch": 156} {"train_loss": -7.092038154602051, "global_step": 26358, "epoch": 156} {"train_loss": -7.1690521240234375, "global_step": 26359, "epoch": 156} {"train_loss": -7.214987754821777, "global_step": 26360, "epoch": 156} {"train_loss": -7.324854850769043, "global_step": 26361, "epoch": 156} {"train_loss": -7.214718818664551, "global_step": 26362, "epoch": 156} {"train_loss": -6.949853897094727, "global_step": 26363, "epoch": 156} {"train_loss": -6.960254669189453, "global_step": 26364, "epoch": 156} {"train_loss": -7.261941909790039, "global_step": 26365, "epoch": 156} {"train_loss": -7.333695411682129, "global_step": 26366, "epoch": 156} {"train_loss": -7.129133701324463, "global_step": 26367, "epoch": 156} {"train_loss": -7.413366317749023, "global_step": 26368, "epoch": 156} {"train_loss": -7.192554473876953, "global_step": 26369, "epoch": 156} {"train_loss": -7.297509670257568, "global_step": 26370, "epoch": 156} {"train_loss": -7.36388635635376, "global_step": 26371, "epoch": 156} {"train_loss": -7.393680095672607, "global_step": 26372, "epoch": 156} {"train_loss": -7.251848220825195, "global_step": 26373, "epoch": 156} {"train_loss": -7.497093200683594, "global_step": 26374, "epoch": 156} {"train_loss": -7.2235027097520375, "global_step": 26375, "epoch": 156, "val_loss": 194124.984375} {"train_loss": -7.2047271728515625, "global_step": 26376, "epoch": 157} {"train_loss": -7.312961578369141, "global_step": 26377, "epoch": 157} {"train_loss": -7.395627975463867, "global_step": 26378, "epoch": 157} {"train_loss": -7.433244228363037, "global_step": 26379, "epoch": 157} {"train_loss": -7.430731773376465, "global_step": 26380, "epoch": 157} {"train_loss": -7.472660064697266, "global_step": 26381, "epoch": 157} {"train_loss": -7.327469348907471, "global_step": 26382, "epoch": 157} {"train_loss": -7.299802303314209, "global_step": 26383, "epoch": 157} {"train_loss": -7.365355491638184, "global_step": 26384, "epoch": 157} {"train_loss": -6.63936710357666, "global_step": 26385, "epoch": 157} {"train_loss": -7.323538303375244, "global_step": 26386, "epoch": 157} {"train_loss": -7.208817481994629, "global_step": 26387, "epoch": 157} {"train_loss": -7.009812831878662, "global_step": 26388, "epoch": 157} {"train_loss": -7.157660484313965, "global_step": 26389, "epoch": 157} {"train_loss": -6.927188396453857, "global_step": 26390, "epoch": 157} {"train_loss": -7.309438705444336, "global_step": 26391, "epoch": 157} {"train_loss": -6.815296173095703, "global_step": 26392, "epoch": 157} {"train_loss": -6.884616851806641, "global_step": 26393, "epoch": 157} {"train_loss": -7.069878101348877, "global_step": 26394, "epoch": 157} {"train_loss": -7.309537887573242, "global_step": 26395, "epoch": 157} {"train_loss": -6.94294548034668, "global_step": 26396, "epoch": 157} {"train_loss": -7.020031929016113, "global_step": 26397, "epoch": 157} {"train_loss": -7.139564514160156, "global_step": 26398, "epoch": 157} {"train_loss": -6.974637031555176, "global_step": 26399, "epoch": 157} {"train_loss": -7.199389457702637, "global_step": 26400, "epoch": 157} {"train_loss": -7.117137432098389, "global_step": 26401, "epoch": 157} {"train_loss": -7.330415725708008, "global_step": 26402, "epoch": 157} {"train_loss": -7.250262260437012, "global_step": 26403, "epoch": 157} {"train_loss": -6.834801197052002, "global_step": 26404, "epoch": 157} {"train_loss": -7.27949857711792, "global_step": 26405, "epoch": 157} {"train_loss": -7.236933708190918, "global_step": 26406, "epoch": 157} {"train_loss": -7.057708740234375, "global_step": 26407, "epoch": 157} {"train_loss": -7.005898475646973, "global_step": 26408, "epoch": 157} {"train_loss": -7.299803733825684, "global_step": 26409, "epoch": 157} {"train_loss": -7.318052768707275, "global_step": 26410, "epoch": 157} {"train_loss": -7.210211277008057, "global_step": 26411, "epoch": 157} {"train_loss": -7.419281005859375, "global_step": 26412, "epoch": 157} {"train_loss": -7.369871139526367, "global_step": 26413, "epoch": 157} {"train_loss": -7.3347487449646, "global_step": 26414, "epoch": 157} {"train_loss": -7.422901630401611, "global_step": 26415, "epoch": 157} {"train_loss": -7.408074378967285, "global_step": 26416, "epoch": 157} {"train_loss": -7.287563800811768, "global_step": 26417, "epoch": 157} {"train_loss": -7.410700798034668, "global_step": 26418, "epoch": 157} {"train_loss": -7.256583213806152, "global_step": 26419, "epoch": 157} {"train_loss": -7.41972541809082, "global_step": 26420, "epoch": 157} {"train_loss": -7.354418754577637, "global_step": 26421, "epoch": 157} {"train_loss": -7.199383735656738, "global_step": 26422, "epoch": 157} {"train_loss": -6.8722758293151855, "global_step": 26423, "epoch": 157} {"train_loss": -7.140462875366211, "global_step": 26424, "epoch": 157} {"train_loss": -7.375360488891602, "global_step": 26425, "epoch": 157} {"train_loss": -7.281362056732178, "global_step": 26426, "epoch": 157} {"train_loss": -7.175447940826416, "global_step": 26427, "epoch": 157} {"train_loss": -7.024336338043213, "global_step": 26428, "epoch": 157} {"train_loss": -7.218873023986816, "global_step": 26429, "epoch": 157} {"train_loss": -7.189871311187744, "global_step": 26430, "epoch": 157} {"train_loss": -7.026440620422363, "global_step": 26431, "epoch": 157} {"train_loss": -7.119726181030273, "global_step": 26432, "epoch": 157} {"train_loss": -6.788029670715332, "global_step": 26433, "epoch": 157} {"train_loss": -7.192409515380859, "global_step": 26434, "epoch": 157} {"train_loss": -6.672466278076172, "global_step": 26435, "epoch": 157} {"train_loss": -7.159708499908447, "global_step": 26436, "epoch": 157} {"train_loss": -7.051548957824707, "global_step": 26437, "epoch": 157} {"train_loss": -6.896492004394531, "global_step": 26438, "epoch": 157} {"train_loss": -7.202169418334961, "global_step": 26439, "epoch": 157} {"train_loss": -7.034969329833984, "global_step": 26440, "epoch": 157} {"train_loss": -7.111057281494141, "global_step": 26441, "epoch": 157} {"train_loss": -7.269109725952148, "global_step": 26442, "epoch": 157} {"train_loss": -7.101857662200928, "global_step": 26443, "epoch": 157} {"train_loss": -7.1819257736206055, "global_step": 26444, "epoch": 157} {"train_loss": -7.208808898925781, "global_step": 26445, "epoch": 157} {"train_loss": -7.294156074523926, "global_step": 26446, "epoch": 157} {"train_loss": -7.152039527893066, "global_step": 26447, "epoch": 157} {"train_loss": -7.0643534660339355, "global_step": 26448, "epoch": 157} {"train_loss": -7.251276016235352, "global_step": 26449, "epoch": 157} {"train_loss": -7.2655415534973145, "global_step": 26450, "epoch": 157} {"train_loss": -7.2991743087768555, "global_step": 26451, "epoch": 157} {"train_loss": -7.389917373657227, "global_step": 26452, "epoch": 157} {"train_loss": -7.164022445678711, "global_step": 26453, "epoch": 157} {"train_loss": -7.293743133544922, "global_step": 26454, "epoch": 157} {"train_loss": -7.111838340759277, "global_step": 26455, "epoch": 157} {"train_loss": -7.417863368988037, "global_step": 26456, "epoch": 157} {"train_loss": -7.133880615234375, "global_step": 26457, "epoch": 157} {"train_loss": -7.43281364440918, "global_step": 26458, "epoch": 157} {"train_loss": -7.4244279861450195, "global_step": 26459, "epoch": 157} {"train_loss": -7.410564422607422, "global_step": 26460, "epoch": 157} {"train_loss": -7.504701137542725, "global_step": 26461, "epoch": 157} {"train_loss": -7.493668556213379, "global_step": 26462, "epoch": 157} {"train_loss": -7.561211109161377, "global_step": 26463, "epoch": 157} {"train_loss": -7.339864730834961, "global_step": 26464, "epoch": 157} {"train_loss": -7.461036682128906, "global_step": 26465, "epoch": 157} {"train_loss": -7.406430721282959, "global_step": 26466, "epoch": 157} {"train_loss": -7.720063209533691, "global_step": 26467, "epoch": 157} {"train_loss": -7.451513290405273, "global_step": 26468, "epoch": 157} {"train_loss": -7.612083911895752, "global_step": 26469, "epoch": 157} {"train_loss": -7.203232288360596, "global_step": 26470, "epoch": 157} {"train_loss": -7.079305171966553, "global_step": 26471, "epoch": 157} {"train_loss": -7.301692008972168, "global_step": 26472, "epoch": 157} {"train_loss": -7.243609428405762, "global_step": 26473, "epoch": 157} {"train_loss": -7.174510955810547, "global_step": 26474, "epoch": 157} {"train_loss": -7.2770795822143555, "global_step": 26475, "epoch": 157} {"train_loss": -7.06507682800293, "global_step": 26476, "epoch": 157} {"train_loss": -7.305774211883545, "global_step": 26477, "epoch": 157} {"train_loss": -7.390121936798096, "global_step": 26478, "epoch": 157} {"train_loss": -7.378411293029785, "global_step": 26479, "epoch": 157} {"train_loss": -6.996257781982422, "global_step": 26480, "epoch": 157} {"train_loss": -7.122976303100586, "global_step": 26481, "epoch": 157} {"train_loss": -7.054008483886719, "global_step": 26482, "epoch": 157} {"train_loss": -6.974074363708496, "global_step": 26483, "epoch": 157} {"train_loss": -7.167325019836426, "global_step": 26484, "epoch": 157} {"train_loss": -7.260248184204102, "global_step": 26485, "epoch": 157} {"train_loss": -7.365049362182617, "global_step": 26486, "epoch": 157} {"train_loss": -7.1598310470581055, "global_step": 26487, "epoch": 157} {"train_loss": -7.338380813598633, "global_step": 26488, "epoch": 157} {"train_loss": -7.353775978088379, "global_step": 26489, "epoch": 157} {"train_loss": -7.213396072387695, "global_step": 26490, "epoch": 157} {"train_loss": -7.355192184448242, "global_step": 26491, "epoch": 157} {"train_loss": -7.239029884338379, "global_step": 26492, "epoch": 157} {"train_loss": -7.186470031738281, "global_step": 26493, "epoch": 157} {"train_loss": -6.851658821105957, "global_step": 26494, "epoch": 157} {"train_loss": -7.290262699127197, "global_step": 26495, "epoch": 157} {"train_loss": -7.151383399963379, "global_step": 26496, "epoch": 157} {"train_loss": -6.957126617431641, "global_step": 26497, "epoch": 157} {"train_loss": -7.336615085601807, "global_step": 26498, "epoch": 157} {"train_loss": -6.93803596496582, "global_step": 26499, "epoch": 157} {"train_loss": -7.161721706390381, "global_step": 26500, "epoch": 157} {"train_loss": -7.177398204803467, "global_step": 26501, "epoch": 157} {"train_loss": -7.207313060760498, "global_step": 26502, "epoch": 157} {"train_loss": -7.049044132232666, "global_step": 26503, "epoch": 157} {"train_loss": -7.262622833251953, "global_step": 26504, "epoch": 157} {"train_loss": -7.367371559143066, "global_step": 26505, "epoch": 157} {"train_loss": -7.1967854499816895, "global_step": 26506, "epoch": 157} {"train_loss": -7.246352672576904, "global_step": 26507, "epoch": 157} {"train_loss": -7.357147216796875, "global_step": 26508, "epoch": 157} {"train_loss": -7.308438777923584, "global_step": 26509, "epoch": 157} {"train_loss": -7.354063987731934, "global_step": 26510, "epoch": 157} {"train_loss": -7.301448822021484, "global_step": 26511, "epoch": 157} {"train_loss": -7.396204471588135, "global_step": 26512, "epoch": 157} {"train_loss": -7.520090103149414, "global_step": 26513, "epoch": 157} {"train_loss": -7.53432559967041, "global_step": 26514, "epoch": 157} {"train_loss": -7.212489128112793, "global_step": 26515, "epoch": 157} {"train_loss": -7.118363857269287, "global_step": 26516, "epoch": 157} {"train_loss": -7.118902206420898, "global_step": 26517, "epoch": 157} {"train_loss": -7.403565406799316, "global_step": 26518, "epoch": 157} {"train_loss": -6.808083534240723, "global_step": 26519, "epoch": 157} {"train_loss": -7.292815208435059, "global_step": 26520, "epoch": 157} {"train_loss": -6.714141368865967, "global_step": 26521, "epoch": 157} {"train_loss": -7.134650230407715, "global_step": 26522, "epoch": 157} {"train_loss": -6.842984199523926, "global_step": 26523, "epoch": 157} {"train_loss": -7.038647651672363, "global_step": 26524, "epoch": 157} {"train_loss": -7.084056854248047, "global_step": 26525, "epoch": 157} {"train_loss": -6.84091854095459, "global_step": 26526, "epoch": 157} {"train_loss": -7.019644737243652, "global_step": 26527, "epoch": 157} {"train_loss": -7.104534149169922, "global_step": 26528, "epoch": 157} {"train_loss": -7.0409040451049805, "global_step": 26529, "epoch": 157} {"train_loss": -7.150044918060303, "global_step": 26530, "epoch": 157} {"train_loss": -7.196267127990723, "global_step": 26531, "epoch": 157} {"train_loss": -6.990337371826172, "global_step": 26532, "epoch": 157} {"train_loss": -7.201230049133301, "global_step": 26533, "epoch": 157} {"train_loss": -7.093778610229492, "global_step": 26534, "epoch": 157} {"train_loss": -7.010916233062744, "global_step": 26535, "epoch": 157} {"train_loss": -7.165727615356445, "global_step": 26536, "epoch": 157} {"train_loss": -7.30183219909668, "global_step": 26537, "epoch": 157} {"train_loss": -7.206637382507324, "global_step": 26538, "epoch": 157} {"train_loss": -7.237941741943359, "global_step": 26539, "epoch": 157} {"train_loss": -7.153215408325195, "global_step": 26540, "epoch": 157} {"train_loss": -7.464385032653809, "global_step": 26541, "epoch": 157} {"train_loss": -7.245697498321533, "global_step": 26542, "epoch": 157} {"train_loss": -7.204354936168308, "global_step": 26543, "epoch": 157, "val_loss": 195736.90625} {"train_loss": -7.296651840209961, "global_step": 26544, "epoch": 158} {"train_loss": -7.161296844482422, "global_step": 26545, "epoch": 158} {"train_loss": -7.300217628479004, "global_step": 26546, "epoch": 158} {"train_loss": -7.268446445465088, "global_step": 26547, "epoch": 158} {"train_loss": -7.315445899963379, "global_step": 26548, "epoch": 158} {"train_loss": -7.2970685958862305, "global_step": 26549, "epoch": 158} {"train_loss": -7.317152976989746, "global_step": 26550, "epoch": 158} {"train_loss": -7.299062728881836, "global_step": 26551, "epoch": 158} {"train_loss": -7.06206750869751, "global_step": 26552, "epoch": 158} {"train_loss": -7.614712715148926, "global_step": 26553, "epoch": 158} {"train_loss": -7.235389709472656, "global_step": 26554, "epoch": 158} {"train_loss": -7.239412307739258, "global_step": 26555, "epoch": 158} {"train_loss": -7.259352207183838, "global_step": 26556, "epoch": 158} {"train_loss": -7.240224361419678, "global_step": 26557, "epoch": 158} {"train_loss": -7.236773490905762, "global_step": 26558, "epoch": 158} {"train_loss": -7.186867713928223, "global_step": 26559, "epoch": 158} {"train_loss": -7.335671901702881, "global_step": 26560, "epoch": 158} {"train_loss": -7.220944881439209, "global_step": 26561, "epoch": 158} {"train_loss": -7.412877082824707, "global_step": 26562, "epoch": 158} {"train_loss": -7.407442092895508, "global_step": 26563, "epoch": 158} {"train_loss": -7.202476501464844, "global_step": 26564, "epoch": 158} {"train_loss": -7.219307899475098, "global_step": 26565, "epoch": 158} {"train_loss": -7.249917030334473, "global_step": 26566, "epoch": 158} {"train_loss": -7.095264434814453, "global_step": 26567, "epoch": 158} {"train_loss": -7.262547492980957, "global_step": 26568, "epoch": 158} {"train_loss": -7.373318672180176, "global_step": 26569, "epoch": 158} {"train_loss": -7.290879249572754, "global_step": 26570, "epoch": 158} {"train_loss": -7.19148063659668, "global_step": 26571, "epoch": 158} {"train_loss": -7.090390205383301, "global_step": 26572, "epoch": 158} {"train_loss": -7.275731563568115, "global_step": 26573, "epoch": 158} {"train_loss": -7.229124546051025, "global_step": 26574, "epoch": 158} {"train_loss": -7.109728813171387, "global_step": 26575, "epoch": 158} {"train_loss": -7.246832847595215, "global_step": 26576, "epoch": 158} {"train_loss": -7.43928337097168, "global_step": 26577, "epoch": 158} {"train_loss": -7.059402942657471, "global_step": 26578, "epoch": 158} {"train_loss": -7.390708923339844, "global_step": 26579, "epoch": 158} {"train_loss": -7.146088600158691, "global_step": 26580, "epoch": 158} {"train_loss": -7.418713569641113, "global_step": 26581, "epoch": 158} {"train_loss": -7.129297256469727, "global_step": 26582, "epoch": 158} {"train_loss": -7.319361209869385, "global_step": 26583, "epoch": 158} {"train_loss": -7.164402484893799, "global_step": 26584, "epoch": 158} {"train_loss": -7.247504234313965, "global_step": 26585, "epoch": 158} {"train_loss": -7.308486461639404, "global_step": 26586, "epoch": 158} {"train_loss": -7.261468410491943, "global_step": 26587, "epoch": 158} {"train_loss": -7.362040996551514, "global_step": 26588, "epoch": 158} {"train_loss": -7.475289821624756, "global_step": 26589, "epoch": 158} {"train_loss": -7.269125938415527, "global_step": 26590, "epoch": 158} {"train_loss": -7.260077476501465, "global_step": 26591, "epoch": 158} {"train_loss": -7.304007530212402, "global_step": 26592, "epoch": 158} {"train_loss": -7.240715980529785, "global_step": 26593, "epoch": 158} {"train_loss": -7.376113414764404, "global_step": 26594, "epoch": 158} {"train_loss": -7.451352119445801, "global_step": 26595, "epoch": 158} {"train_loss": -7.424964904785156, "global_step": 26596, "epoch": 158} {"train_loss": -7.6087141036987305, "global_step": 26597, "epoch": 158} {"train_loss": -7.464014053344727, "global_step": 26598, "epoch": 158} {"train_loss": -7.098953723907471, "global_step": 26599, "epoch": 158} {"train_loss": -7.187932014465332, "global_step": 26600, "epoch": 158} {"train_loss": -7.31663703918457, "global_step": 26601, "epoch": 158} {"train_loss": -7.418537616729736, "global_step": 26602, "epoch": 158} {"train_loss": -7.369309425354004, "global_step": 26603, "epoch": 158} {"train_loss": -7.352034568786621, "global_step": 26604, "epoch": 158} {"train_loss": -7.214112281799316, "global_step": 26605, "epoch": 158} {"train_loss": -7.225971221923828, "global_step": 26606, "epoch": 158} {"train_loss": -7.104605674743652, "global_step": 26607, "epoch": 158} {"train_loss": -7.2507829666137695, "global_step": 26608, "epoch": 158} {"train_loss": -7.051612854003906, "global_step": 26609, "epoch": 158} {"train_loss": -7.042176246643066, "global_step": 26610, "epoch": 158} {"train_loss": -7.079159736633301, "global_step": 26611, "epoch": 158} {"train_loss": -7.219245910644531, "global_step": 26612, "epoch": 158} {"train_loss": -7.4831671714782715, "global_step": 26613, "epoch": 158} {"train_loss": -7.319218635559082, "global_step": 26614, "epoch": 158} {"train_loss": -7.047311782836914, "global_step": 26615, "epoch": 158} {"train_loss": -6.88370418548584, "global_step": 26616, "epoch": 158} {"train_loss": -7.273212432861328, "global_step": 26617, "epoch": 158} {"train_loss": -7.166929244995117, "global_step": 26618, "epoch": 158} {"train_loss": -7.192933082580566, "global_step": 26619, "epoch": 158} {"train_loss": -7.224087715148926, "global_step": 26620, "epoch": 158} {"train_loss": -7.048127174377441, "global_step": 26621, "epoch": 158} {"train_loss": -7.279299736022949, "global_step": 26622, "epoch": 158} {"train_loss": -7.102778434753418, "global_step": 26623, "epoch": 158} {"train_loss": -7.432593822479248, "global_step": 26624, "epoch": 158} {"train_loss": -7.289688587188721, "global_step": 26625, "epoch": 158} {"train_loss": -7.216706275939941, "global_step": 26626, "epoch": 158} {"train_loss": -7.404826641082764, "global_step": 26627, "epoch": 158} {"train_loss": -7.279658317565918, "global_step": 26628, "epoch": 158} {"train_loss": -7.313244819641113, "global_step": 26629, "epoch": 158} {"train_loss": -7.263212203979492, "global_step": 26630, "epoch": 158} {"train_loss": -7.2368316650390625, "global_step": 26631, "epoch": 158} {"train_loss": -7.512048244476318, "global_step": 26632, "epoch": 158} {"train_loss": -7.207664489746094, "global_step": 26633, "epoch": 158} {"train_loss": -7.26979398727417, "global_step": 26634, "epoch": 158} {"train_loss": -7.456009864807129, "global_step": 26635, "epoch": 158} {"train_loss": -7.161608695983887, "global_step": 26636, "epoch": 158} {"train_loss": -7.459573745727539, "global_step": 26637, "epoch": 158} {"train_loss": -7.2054009437561035, "global_step": 26638, "epoch": 158} {"train_loss": -7.3002166748046875, "global_step": 26639, "epoch": 158} {"train_loss": -7.060435771942139, "global_step": 26640, "epoch": 158} {"train_loss": -7.358913421630859, "global_step": 26641, "epoch": 158} {"train_loss": -7.248823642730713, "global_step": 26642, "epoch": 158} {"train_loss": -7.142034530639648, "global_step": 26643, "epoch": 158} {"train_loss": -7.368862628936768, "global_step": 26644, "epoch": 158} {"train_loss": -7.291142463684082, "global_step": 26645, "epoch": 158} {"train_loss": -7.450125694274902, "global_step": 26646, "epoch": 158} {"train_loss": -7.2135820388793945, "global_step": 26647, "epoch": 158} {"train_loss": -7.206325531005859, "global_step": 26648, "epoch": 158} {"train_loss": -7.325874328613281, "global_step": 26649, "epoch": 158} {"train_loss": -7.459235668182373, "global_step": 26650, "epoch": 158} {"train_loss": -7.207256317138672, "global_step": 26651, "epoch": 158} {"train_loss": -7.435675621032715, "global_step": 26652, "epoch": 158} {"train_loss": -7.262064456939697, "global_step": 26653, "epoch": 158} {"train_loss": -7.295373916625977, "global_step": 26654, "epoch": 158} {"train_loss": -7.166258811950684, "global_step": 26655, "epoch": 158} {"train_loss": -7.3876447677612305, "global_step": 26656, "epoch": 158} {"train_loss": -7.202754020690918, "global_step": 26657, "epoch": 158} {"train_loss": -7.401157855987549, "global_step": 26658, "epoch": 158} {"train_loss": -7.388937473297119, "global_step": 26659, "epoch": 158} {"train_loss": -7.296384811401367, "global_step": 26660, "epoch": 158} {"train_loss": -7.494028091430664, "global_step": 26661, "epoch": 158} {"train_loss": -7.2978901863098145, "global_step": 26662, "epoch": 158} {"train_loss": -7.115239143371582, "global_step": 26663, "epoch": 158} {"train_loss": -7.366331100463867, "global_step": 26664, "epoch": 158} {"train_loss": -7.343473434448242, "global_step": 26665, "epoch": 158} {"train_loss": -7.447728157043457, "global_step": 26666, "epoch": 158} {"train_loss": -7.271191596984863, "global_step": 26667, "epoch": 158} {"train_loss": -7.367501735687256, "global_step": 26668, "epoch": 158} {"train_loss": -7.435741424560547, "global_step": 26669, "epoch": 158} {"train_loss": -7.178173065185547, "global_step": 26670, "epoch": 158} {"train_loss": -7.378037452697754, "global_step": 26671, "epoch": 158} {"train_loss": -7.539712905883789, "global_step": 26672, "epoch": 158} {"train_loss": -7.373629570007324, "global_step": 26673, "epoch": 158} {"train_loss": -7.269252300262451, "global_step": 26674, "epoch": 158} {"train_loss": -7.227362632751465, "global_step": 26675, "epoch": 158} {"train_loss": -7.301116943359375, "global_step": 26676, "epoch": 158} {"train_loss": -7.300004959106445, "global_step": 26677, "epoch": 158} {"train_loss": -7.404946327209473, "global_step": 26678, "epoch": 158} {"train_loss": -7.33918571472168, "global_step": 26679, "epoch": 158} {"train_loss": -7.584590911865234, "global_step": 26680, "epoch": 158} {"train_loss": -7.496195316314697, "global_step": 26681, "epoch": 158} {"train_loss": -7.299368858337402, "global_step": 26682, "epoch": 158} {"train_loss": -7.046425819396973, "global_step": 26683, "epoch": 158} {"train_loss": -7.367680549621582, "global_step": 26684, "epoch": 158} {"train_loss": -7.452325820922852, "global_step": 26685, "epoch": 158} {"train_loss": -7.21074914932251, "global_step": 26686, "epoch": 158} {"train_loss": -7.527132034301758, "global_step": 26687, "epoch": 158} {"train_loss": -7.269369125366211, "global_step": 26688, "epoch": 158} {"train_loss": -7.3531599044799805, "global_step": 26689, "epoch": 158} {"train_loss": -7.168994426727295, "global_step": 26690, "epoch": 158} {"train_loss": -7.281351089477539, "global_step": 26691, "epoch": 158} {"train_loss": -7.360553741455078, "global_step": 26692, "epoch": 158} {"train_loss": -7.157724380493164, "global_step": 26693, "epoch": 158} {"train_loss": -7.3293609619140625, "global_step": 26694, "epoch": 158} {"train_loss": -7.47561502456665, "global_step": 26695, "epoch": 158} {"train_loss": -7.340271949768066, "global_step": 26696, "epoch": 158} {"train_loss": -7.278990268707275, "global_step": 26697, "epoch": 158} {"train_loss": -7.389737129211426, "global_step": 26698, "epoch": 158} {"train_loss": -6.99569845199585, "global_step": 26699, "epoch": 158} {"train_loss": -7.377765655517578, "global_step": 26700, "epoch": 158} {"train_loss": -7.256834030151367, "global_step": 26701, "epoch": 158} {"train_loss": -7.256261825561523, "global_step": 26702, "epoch": 158} {"train_loss": -7.343687534332275, "global_step": 26703, "epoch": 158} {"train_loss": -7.395021438598633, "global_step": 26704, "epoch": 158} {"train_loss": -7.137484550476074, "global_step": 26705, "epoch": 158} {"train_loss": -7.278077602386475, "global_step": 26706, "epoch": 158} {"train_loss": -7.318173885345459, "global_step": 26707, "epoch": 158} {"train_loss": -7.399354934692383, "global_step": 26708, "epoch": 158} {"train_loss": -7.169088840484619, "global_step": 26709, "epoch": 158} {"train_loss": -7.370782852172852, "global_step": 26710, "epoch": 158} {"train_loss": -7.287959521725064, "global_step": 26711, "epoch": 158, "val_loss": 192327.671875} {"train_loss": -7.369466781616211, "global_step": 26712, "epoch": 159} {"train_loss": -7.473052978515625, "global_step": 26713, "epoch": 159} {"train_loss": -7.223891735076904, "global_step": 26714, "epoch": 159} {"train_loss": -7.37861442565918, "global_step": 26715, "epoch": 159} {"train_loss": -7.291297912597656, "global_step": 26716, "epoch": 159} {"train_loss": -7.273890018463135, "global_step": 26717, "epoch": 159} {"train_loss": -7.354007720947266, "global_step": 26718, "epoch": 159} {"train_loss": -7.180414199829102, "global_step": 26719, "epoch": 159} {"train_loss": -7.348589897155762, "global_step": 26720, "epoch": 159} {"train_loss": -7.427052021026611, "global_step": 26721, "epoch": 159} {"train_loss": -7.20902156829834, "global_step": 26722, "epoch": 159} {"train_loss": -7.553690433502197, "global_step": 26723, "epoch": 159} {"train_loss": -7.1465654373168945, "global_step": 26724, "epoch": 159} {"train_loss": -7.2488112449646, "global_step": 26725, "epoch": 159} {"train_loss": -7.471869468688965, "global_step": 26726, "epoch": 159} {"train_loss": -7.397320747375488, "global_step": 26727, "epoch": 159} {"train_loss": -7.309971809387207, "global_step": 26728, "epoch": 159} {"train_loss": -6.942314147949219, "global_step": 26729, "epoch": 159} {"train_loss": -7.275905132293701, "global_step": 26730, "epoch": 159} {"train_loss": -7.463961601257324, "global_step": 26731, "epoch": 159} {"train_loss": -7.010457992553711, "global_step": 26732, "epoch": 159} {"train_loss": -7.50504207611084, "global_step": 26733, "epoch": 159} {"train_loss": -7.217850685119629, "global_step": 26734, "epoch": 159} {"train_loss": -7.383606910705566, "global_step": 26735, "epoch": 159} {"train_loss": -7.145120620727539, "global_step": 26736, "epoch": 159} {"train_loss": -7.351737976074219, "global_step": 26737, "epoch": 159} {"train_loss": -7.021761894226074, "global_step": 26738, "epoch": 159} {"train_loss": -7.393472671508789, "global_step": 26739, "epoch": 159} {"train_loss": -7.1951446533203125, "global_step": 26740, "epoch": 159} {"train_loss": -7.401602745056152, "global_step": 26741, "epoch": 159} {"train_loss": -7.252366542816162, "global_step": 26742, "epoch": 159} {"train_loss": -7.242922782897949, "global_step": 26743, "epoch": 159} {"train_loss": -7.085002899169922, "global_step": 26744, "epoch": 159} {"train_loss": -7.299412727355957, "global_step": 26745, "epoch": 159} {"train_loss": -7.179290771484375, "global_step": 26746, "epoch": 159} {"train_loss": -7.135988235473633, "global_step": 26747, "epoch": 159} {"train_loss": -7.152071475982666, "global_step": 26748, "epoch": 159} {"train_loss": -7.118490219116211, "global_step": 26749, "epoch": 159} {"train_loss": -7.208020210266113, "global_step": 26750, "epoch": 159} {"train_loss": -7.009400844573975, "global_step": 26751, "epoch": 159} {"train_loss": -7.356006145477295, "global_step": 26752, "epoch": 159} {"train_loss": -7.373667240142822, "global_step": 26753, "epoch": 159} {"train_loss": -7.183887481689453, "global_step": 26754, "epoch": 159} {"train_loss": -7.222184181213379, "global_step": 26755, "epoch": 159} {"train_loss": -7.297512054443359, "global_step": 26756, "epoch": 159} {"train_loss": -7.083197593688965, "global_step": 26757, "epoch": 159} {"train_loss": -7.36143684387207, "global_step": 26758, "epoch": 159} {"train_loss": -7.089387893676758, "global_step": 26759, "epoch": 159} {"train_loss": -7.461648941040039, "global_step": 26760, "epoch": 159} {"train_loss": -7.079395294189453, "global_step": 26761, "epoch": 159} {"train_loss": -7.487149238586426, "global_step": 26762, "epoch": 159} {"train_loss": -7.363354682922363, "global_step": 26763, "epoch": 159} {"train_loss": -7.33891487121582, "global_step": 26764, "epoch": 159} {"train_loss": -7.086735725402832, "global_step": 26765, "epoch": 159} {"train_loss": -7.173723220825195, "global_step": 26766, "epoch": 159} {"train_loss": -7.3031229972839355, "global_step": 26767, "epoch": 159} {"train_loss": -7.284117698669434, "global_step": 26768, "epoch": 159} {"train_loss": -7.3971147537231445, "global_step": 26769, "epoch": 159} {"train_loss": -7.237611770629883, "global_step": 26770, "epoch": 159} {"train_loss": -7.251656532287598, "global_step": 26771, "epoch": 159} {"train_loss": -7.237578392028809, "global_step": 26772, "epoch": 159} {"train_loss": -7.018580436706543, "global_step": 26773, "epoch": 159} {"train_loss": -7.012147426605225, "global_step": 26774, "epoch": 159} {"train_loss": -7.217339515686035, "global_step": 26775, "epoch": 159} {"train_loss": -7.0666584968566895, "global_step": 26776, "epoch": 159} {"train_loss": -7.5220627784729, "global_step": 26777, "epoch": 159} {"train_loss": -7.272199630737305, "global_step": 26778, "epoch": 159} {"train_loss": -7.131315231323242, "global_step": 26779, "epoch": 159} {"train_loss": -6.935427665710449, "global_step": 26780, "epoch": 159} {"train_loss": -7.246634483337402, "global_step": 26781, "epoch": 159} {"train_loss": -7.353255748748779, "global_step": 26782, "epoch": 159} {"train_loss": -7.148730278015137, "global_step": 26783, "epoch": 159} {"train_loss": -7.293719291687012, "global_step": 26784, "epoch": 159} {"train_loss": -7.151812553405762, "global_step": 26785, "epoch": 159} {"train_loss": -7.222080230712891, "global_step": 26786, "epoch": 159} {"train_loss": -7.388016700744629, "global_step": 26787, "epoch": 159} {"train_loss": -7.105714797973633, "global_step": 26788, "epoch": 159} {"train_loss": -7.403740882873535, "global_step": 26789, "epoch": 159} {"train_loss": -7.270902156829834, "global_step": 26790, "epoch": 159} {"train_loss": -7.230831146240234, "global_step": 26791, "epoch": 159} {"train_loss": -7.339221000671387, "global_step": 26792, "epoch": 159} {"train_loss": -7.279590129852295, "global_step": 26793, "epoch": 159} {"train_loss": -7.065181732177734, "global_step": 26794, "epoch": 159} {"train_loss": -7.451522350311279, "global_step": 26795, "epoch": 159} {"train_loss": -7.4020233154296875, "global_step": 26796, "epoch": 159} {"train_loss": -7.309148788452148, "global_step": 26797, "epoch": 159} {"train_loss": -7.410345077514648, "global_step": 26798, "epoch": 159} {"train_loss": -7.364648342132568, "global_step": 26799, "epoch": 159} {"train_loss": -7.336905002593994, "global_step": 26800, "epoch": 159} {"train_loss": -7.221045017242432, "global_step": 26801, "epoch": 159} {"train_loss": -7.387472152709961, "global_step": 26802, "epoch": 159} {"train_loss": -7.227770805358887, "global_step": 26803, "epoch": 159} {"train_loss": -7.206606864929199, "global_step": 26804, "epoch": 159} {"train_loss": -7.547215938568115, "global_step": 26805, "epoch": 159} {"train_loss": -7.23350715637207, "global_step": 26806, "epoch": 159} {"train_loss": -7.25726842880249, "global_step": 26807, "epoch": 159} {"train_loss": -7.191192626953125, "global_step": 26808, "epoch": 159} {"train_loss": -7.244461536407471, "global_step": 26809, "epoch": 159} {"train_loss": -7.26825475692749, "global_step": 26810, "epoch": 159} {"train_loss": -7.102224349975586, "global_step": 26811, "epoch": 159} {"train_loss": -7.236459255218506, "global_step": 26812, "epoch": 159} {"train_loss": -7.307094573974609, "global_step": 26813, "epoch": 159} {"train_loss": -7.191595077514648, "global_step": 26814, "epoch": 159} {"train_loss": -7.294721603393555, "global_step": 26815, "epoch": 159} {"train_loss": -7.233789443969727, "global_step": 26816, "epoch": 159} {"train_loss": -7.580646514892578, "global_step": 26817, "epoch": 159} {"train_loss": -7.3235368728637695, "global_step": 26818, "epoch": 159} {"train_loss": -7.342321872711182, "global_step": 26819, "epoch": 159} {"train_loss": -7.440779685974121, "global_step": 26820, "epoch": 159} {"train_loss": -7.059426784515381, "global_step": 26821, "epoch": 159} {"train_loss": -6.929924011230469, "global_step": 26822, "epoch": 159} {"train_loss": -7.4397687911987305, "global_step": 26823, "epoch": 159} {"train_loss": -6.861584663391113, "global_step": 26824, "epoch": 159} {"train_loss": -6.996054172515869, "global_step": 26825, "epoch": 159} {"train_loss": -7.046581268310547, "global_step": 26826, "epoch": 159} {"train_loss": -6.8950958251953125, "global_step": 26827, "epoch": 159} {"train_loss": -7.034717082977295, "global_step": 26828, "epoch": 159} {"train_loss": -6.8997297286987305, "global_step": 26829, "epoch": 159} {"train_loss": -6.968974590301514, "global_step": 26830, "epoch": 159} {"train_loss": -7.042799472808838, "global_step": 26831, "epoch": 159} {"train_loss": -7.073978424072266, "global_step": 26832, "epoch": 159} {"train_loss": -7.412207126617432, "global_step": 26833, "epoch": 159} {"train_loss": -7.142201900482178, "global_step": 26834, "epoch": 159} {"train_loss": -7.14181661605835, "global_step": 26835, "epoch": 159} {"train_loss": -7.244472980499268, "global_step": 26836, "epoch": 159} {"train_loss": -7.001768112182617, "global_step": 26837, "epoch": 159} {"train_loss": -7.113850116729736, "global_step": 26838, "epoch": 159} {"train_loss": -7.063464164733887, "global_step": 26839, "epoch": 159} {"train_loss": -7.450044631958008, "global_step": 26840, "epoch": 159} {"train_loss": -7.242944717407227, "global_step": 26841, "epoch": 159} {"train_loss": -7.135043144226074, "global_step": 26842, "epoch": 159} {"train_loss": -7.30410623550415, "global_step": 26843, "epoch": 159} {"train_loss": -7.280699729919434, "global_step": 26844, "epoch": 159} {"train_loss": -7.364167213439941, "global_step": 26845, "epoch": 159} {"train_loss": -7.359381675720215, "global_step": 26846, "epoch": 159} {"train_loss": -7.4646406173706055, "global_step": 26847, "epoch": 159} {"train_loss": -7.466528415679932, "global_step": 26848, "epoch": 159} {"train_loss": -7.390369415283203, "global_step": 26849, "epoch": 159} {"train_loss": -7.443619728088379, "global_step": 26850, "epoch": 159} {"train_loss": -7.320588111877441, "global_step": 26851, "epoch": 159} {"train_loss": -7.318176746368408, "global_step": 26852, "epoch": 159} {"train_loss": -7.612188339233398, "global_step": 26853, "epoch": 159} {"train_loss": -7.4322829246521, "global_step": 26854, "epoch": 159} {"train_loss": -7.424731731414795, "global_step": 26855, "epoch": 159} {"train_loss": -7.623507499694824, "global_step": 26856, "epoch": 159} {"train_loss": -7.200691223144531, "global_step": 26857, "epoch": 159} {"train_loss": -7.060789108276367, "global_step": 26858, "epoch": 159} {"train_loss": -7.184640884399414, "global_step": 26859, "epoch": 159} {"train_loss": -7.313016414642334, "global_step": 26860, "epoch": 159} {"train_loss": -7.558788299560547, "global_step": 26861, "epoch": 159} {"train_loss": -7.247440338134766, "global_step": 26862, "epoch": 159} {"train_loss": -7.336071968078613, "global_step": 26863, "epoch": 159} {"train_loss": -7.385648250579834, "global_step": 26864, "epoch": 159} {"train_loss": -7.467911243438721, "global_step": 26865, "epoch": 159} {"train_loss": -7.259186267852783, "global_step": 26866, "epoch": 159} {"train_loss": -7.34721565246582, "global_step": 26867, "epoch": 159} {"train_loss": -6.975489616394043, "global_step": 26868, "epoch": 159} {"train_loss": -7.480259895324707, "global_step": 26869, "epoch": 159} {"train_loss": -7.402159690856934, "global_step": 26870, "epoch": 159} {"train_loss": -7.40482234954834, "global_step": 26871, "epoch": 159} {"train_loss": -7.297139644622803, "global_step": 26872, "epoch": 159} {"train_loss": -7.465091705322266, "global_step": 26873, "epoch": 159} {"train_loss": -7.268088340759277, "global_step": 26874, "epoch": 159} {"train_loss": -7.498798370361328, "global_step": 26875, "epoch": 159} {"train_loss": -7.113258361816406, "global_step": 26876, "epoch": 159} {"train_loss": -7.393291473388672, "global_step": 26877, "epoch": 159} {"train_loss": -7.3204665184021, "global_step": 26878, "epoch": 159} {"train_loss": -7.265194200334095, "global_step": 26879, "epoch": 159, "val_loss": 193586.0625} {"train_loss": -7.330280303955078, "global_step": 26880, "epoch": 160} {"train_loss": -7.470505714416504, "global_step": 26881, "epoch": 160} {"train_loss": -7.159607887268066, "global_step": 26882, "epoch": 160} {"train_loss": -7.292407035827637, "global_step": 26883, "epoch": 160} {"train_loss": -7.122242450714111, "global_step": 26884, "epoch": 160} {"train_loss": -7.272975921630859, "global_step": 26885, "epoch": 160} {"train_loss": -7.401577949523926, "global_step": 26886, "epoch": 160} {"train_loss": -7.305751800537109, "global_step": 26887, "epoch": 160} {"train_loss": -7.39686393737793, "global_step": 26888, "epoch": 160} {"train_loss": -7.152656555175781, "global_step": 26889, "epoch": 160} {"train_loss": -7.318330764770508, "global_step": 26890, "epoch": 160} {"train_loss": -7.327861309051514, "global_step": 26891, "epoch": 160} {"train_loss": -7.4418721199035645, "global_step": 26892, "epoch": 160} {"train_loss": -7.214099407196045, "global_step": 26893, "epoch": 160} {"train_loss": -7.4552202224731445, "global_step": 26894, "epoch": 160} {"train_loss": -7.155196189880371, "global_step": 26895, "epoch": 160} {"train_loss": -7.46275520324707, "global_step": 26896, "epoch": 160} {"train_loss": -7.293953895568848, "global_step": 26897, "epoch": 160} {"train_loss": -7.559054374694824, "global_step": 26898, "epoch": 160} {"train_loss": -7.374449253082275, "global_step": 26899, "epoch": 160} {"train_loss": -7.364381790161133, "global_step": 26900, "epoch": 160} {"train_loss": -7.411724090576172, "global_step": 26901, "epoch": 160} {"train_loss": -7.558616638183594, "global_step": 26902, "epoch": 160} {"train_loss": -7.303703784942627, "global_step": 26903, "epoch": 160} {"train_loss": -7.408567905426025, "global_step": 26904, "epoch": 160} {"train_loss": -7.426125526428223, "global_step": 26905, "epoch": 160} {"train_loss": -7.385190963745117, "global_step": 26906, "epoch": 160} {"train_loss": -7.5779523849487305, "global_step": 26907, "epoch": 160} {"train_loss": -7.406500339508057, "global_step": 26908, "epoch": 160} {"train_loss": -7.415944576263428, "global_step": 26909, "epoch": 160} {"train_loss": -7.313868522644043, "global_step": 26910, "epoch": 160} {"train_loss": -7.422429084777832, "global_step": 26911, "epoch": 160} {"train_loss": -7.614816665649414, "global_step": 26912, "epoch": 160} {"train_loss": -7.366543769836426, "global_step": 26913, "epoch": 160} {"train_loss": -7.476245880126953, "global_step": 26914, "epoch": 160} {"train_loss": -7.251436233520508, "global_step": 26915, "epoch": 160} {"train_loss": -7.3749518394470215, "global_step": 26916, "epoch": 160} {"train_loss": -7.378533363342285, "global_step": 26917, "epoch": 160} {"train_loss": -7.444614887237549, "global_step": 26918, "epoch": 160} {"train_loss": -7.514838218688965, "global_step": 26919, "epoch": 160} {"train_loss": -7.5099334716796875, "global_step": 26920, "epoch": 160} {"train_loss": -7.278056621551514, "global_step": 26921, "epoch": 160} {"train_loss": -7.274731159210205, "global_step": 26922, "epoch": 160} {"train_loss": -7.069914817810059, "global_step": 26923, "epoch": 160} {"train_loss": -6.993983268737793, "global_step": 26924, "epoch": 160} {"train_loss": -7.033103942871094, "global_step": 26925, "epoch": 160} {"train_loss": -6.730169773101807, "global_step": 26926, "epoch": 160} {"train_loss": -6.939487457275391, "global_step": 26927, "epoch": 160} {"train_loss": -7.1141791343688965, "global_step": 26928, "epoch": 160} {"train_loss": -7.058259963989258, "global_step": 26929, "epoch": 160} {"train_loss": -7.109968185424805, "global_step": 26930, "epoch": 160} {"train_loss": -6.967947006225586, "global_step": 26931, "epoch": 160} {"train_loss": -7.128813743591309, "global_step": 26932, "epoch": 160} {"train_loss": -7.036551475524902, "global_step": 26933, "epoch": 160} {"train_loss": -6.984787464141846, "global_step": 26934, "epoch": 160} {"train_loss": -7.032313346862793, "global_step": 26935, "epoch": 160} {"train_loss": -7.205984115600586, "global_step": 26936, "epoch": 160} {"train_loss": -7.106556415557861, "global_step": 26937, "epoch": 160} {"train_loss": -7.202698707580566, "global_step": 26938, "epoch": 160} {"train_loss": -7.162294387817383, "global_step": 26939, "epoch": 160} {"train_loss": -7.220993995666504, "global_step": 26940, "epoch": 160} {"train_loss": -7.437716484069824, "global_step": 26941, "epoch": 160} {"train_loss": -7.351696968078613, "global_step": 26942, "epoch": 160} {"train_loss": -7.257138252258301, "global_step": 26943, "epoch": 160} {"train_loss": -7.061957359313965, "global_step": 26944, "epoch": 160} {"train_loss": -7.174685955047607, "global_step": 26945, "epoch": 160} {"train_loss": -7.428678512573242, "global_step": 26946, "epoch": 160} {"train_loss": -7.116366386413574, "global_step": 26947, "epoch": 160} {"train_loss": -7.300975799560547, "global_step": 26948, "epoch": 160} {"train_loss": -7.307477951049805, "global_step": 26949, "epoch": 160} {"train_loss": -7.297170639038086, "global_step": 26950, "epoch": 160} {"train_loss": -7.533511161804199, "global_step": 26951, "epoch": 160} {"train_loss": -7.0469818115234375, "global_step": 26952, "epoch": 160} {"train_loss": -7.357479095458984, "global_step": 26953, "epoch": 160} {"train_loss": -7.373541355133057, "global_step": 26954, "epoch": 160} {"train_loss": -7.4038615226745605, "global_step": 26955, "epoch": 160} {"train_loss": -7.3891682624816895, "global_step": 26956, "epoch": 160} {"train_loss": -7.317099571228027, "global_step": 26957, "epoch": 160} {"train_loss": -7.305630683898926, "global_step": 26958, "epoch": 160} {"train_loss": -7.125574111938477, "global_step": 26959, "epoch": 160} {"train_loss": -7.328877925872803, "global_step": 26960, "epoch": 160} {"train_loss": -7.175480365753174, "global_step": 26961, "epoch": 160} {"train_loss": -7.101937294006348, "global_step": 26962, "epoch": 160} {"train_loss": -7.251291275024414, "global_step": 26963, "epoch": 160} {"train_loss": -7.301620960235596, "global_step": 26964, "epoch": 160} {"train_loss": -7.060625076293945, "global_step": 26965, "epoch": 160} {"train_loss": -7.040983200073242, "global_step": 26966, "epoch": 160} {"train_loss": -7.229002952575684, "global_step": 26967, "epoch": 160} {"train_loss": -7.47402286529541, "global_step": 26968, "epoch": 160} {"train_loss": -7.199128150939941, "global_step": 26969, "epoch": 160} {"train_loss": -7.214779853820801, "global_step": 26970, "epoch": 160} {"train_loss": -6.9323930740356445, "global_step": 26971, "epoch": 160} {"train_loss": -7.196913242340088, "global_step": 26972, "epoch": 160} {"train_loss": -7.307432651519775, "global_step": 26973, "epoch": 160} {"train_loss": -6.84058952331543, "global_step": 26974, "epoch": 160} {"train_loss": -7.366602420806885, "global_step": 26975, "epoch": 160} {"train_loss": -7.123357772827148, "global_step": 26976, "epoch": 160} {"train_loss": -7.204140663146973, "global_step": 26977, "epoch": 160} {"train_loss": -7.132406711578369, "global_step": 26978, "epoch": 160} {"train_loss": -7.112850189208984, "global_step": 26979, "epoch": 160} {"train_loss": -6.90864896774292, "global_step": 26980, "epoch": 160} {"train_loss": -7.045716762542725, "global_step": 26981, "epoch": 160} {"train_loss": -7.317933559417725, "global_step": 26982, "epoch": 160} {"train_loss": -7.152155876159668, "global_step": 26983, "epoch": 160} {"train_loss": -6.86061429977417, "global_step": 26984, "epoch": 160} {"train_loss": -7.214631080627441, "global_step": 26985, "epoch": 160} {"train_loss": -7.068474292755127, "global_step": 26986, "epoch": 160} {"train_loss": -7.080358982086182, "global_step": 26987, "epoch": 160} {"train_loss": -7.118777275085449, "global_step": 26988, "epoch": 160} {"train_loss": -7.357275009155273, "global_step": 26989, "epoch": 160} {"train_loss": -7.051187038421631, "global_step": 26990, "epoch": 160} {"train_loss": -7.221652030944824, "global_step": 26991, "epoch": 160} {"train_loss": -7.131599426269531, "global_step": 26992, "epoch": 160} {"train_loss": -7.192261695861816, "global_step": 26993, "epoch": 160} {"train_loss": -7.314952850341797, "global_step": 26994, "epoch": 160} {"train_loss": -7.376368522644043, "global_step": 26995, "epoch": 160} {"train_loss": -7.619499206542969, "global_step": 26996, "epoch": 160} {"train_loss": -7.399420738220215, "global_step": 26997, "epoch": 160} {"train_loss": -7.326600074768066, "global_step": 26998, "epoch": 160} {"train_loss": -7.300239562988281, "global_step": 26999, "epoch": 160} {"train_loss": -7.206210136413574, "global_step": 27000, "epoch": 160} {"train_loss": -6.947283744812012, "global_step": 27001, "epoch": 160} {"train_loss": -7.30758810043335, "global_step": 27002, "epoch": 160} {"train_loss": -7.194892883300781, "global_step": 27003, "epoch": 160} {"train_loss": -7.049472808837891, "global_step": 27004, "epoch": 160} {"train_loss": -7.194551467895508, "global_step": 27005, "epoch": 160} {"train_loss": -7.019911766052246, "global_step": 27006, "epoch": 160} {"train_loss": -7.025206089019775, "global_step": 27007, "epoch": 160} {"train_loss": -7.058909893035889, "global_step": 27008, "epoch": 160} {"train_loss": -6.979545593261719, "global_step": 27009, "epoch": 160} {"train_loss": -7.401426792144775, "global_step": 27010, "epoch": 160} {"train_loss": -7.16053581237793, "global_step": 27011, "epoch": 160} {"train_loss": -7.27224063873291, "global_step": 27012, "epoch": 160} {"train_loss": -7.22928524017334, "global_step": 27013, "epoch": 160} {"train_loss": -7.054614067077637, "global_step": 27014, "epoch": 160} {"train_loss": -7.216456413269043, "global_step": 27015, "epoch": 160} {"train_loss": -7.4324493408203125, "global_step": 27016, "epoch": 160} {"train_loss": -7.192627906799316, "global_step": 27017, "epoch": 160} {"train_loss": -7.2380690574646, "global_step": 27018, "epoch": 160} {"train_loss": -7.286734580993652, "global_step": 27019, "epoch": 160} {"train_loss": -7.271664142608643, "global_step": 27020, "epoch": 160} {"train_loss": -7.208261966705322, "global_step": 27021, "epoch": 160} {"train_loss": -7.458568096160889, "global_step": 27022, "epoch": 160} {"train_loss": -7.4466376304626465, "global_step": 27023, "epoch": 160} {"train_loss": -7.14047384262085, "global_step": 27024, "epoch": 160} {"train_loss": -7.47125244140625, "global_step": 27025, "epoch": 160} {"train_loss": -7.275844573974609, "global_step": 27026, "epoch": 160} {"train_loss": -7.183590412139893, "global_step": 27027, "epoch": 160} {"train_loss": -7.353375434875488, "global_step": 27028, "epoch": 160} {"train_loss": -7.292109489440918, "global_step": 27029, "epoch": 160} {"train_loss": -7.670480251312256, "global_step": 27030, "epoch": 160} {"train_loss": -7.360180377960205, "global_step": 27031, "epoch": 160} {"train_loss": -7.662274360656738, "global_step": 27032, "epoch": 160} {"train_loss": -7.205445289611816, "global_step": 27033, "epoch": 160} {"train_loss": -7.3990373611450195, "global_step": 27034, "epoch": 160} {"train_loss": -7.146731376647949, "global_step": 27035, "epoch": 160} {"train_loss": -7.361286163330078, "global_step": 27036, "epoch": 160} {"train_loss": -7.371901035308838, "global_step": 27037, "epoch": 160} {"train_loss": -7.390020370483398, "global_step": 27038, "epoch": 160} {"train_loss": -7.247786521911621, "global_step": 27039, "epoch": 160} {"train_loss": -7.358100891113281, "global_step": 27040, "epoch": 160} {"train_loss": -7.110170364379883, "global_step": 27041, "epoch": 160} {"train_loss": -7.394961357116699, "global_step": 27042, "epoch": 160} {"train_loss": -7.2878875732421875, "global_step": 27043, "epoch": 160} {"train_loss": -7.495038032531738, "global_step": 27044, "epoch": 160} {"train_loss": -7.056790828704834, "global_step": 27045, "epoch": 160} {"train_loss": -7.477447986602783, "global_step": 27046, "epoch": 160} {"train_loss": -7.254078558513096, "global_step": 27047, "epoch": 160, "val_loss": 194149.078125, "train_action_mse_error": 12.08714485168457} {"train_loss": -7.239636421203613, "global_step": 27048, "epoch": 161} {"train_loss": -7.267924785614014, "global_step": 27049, "epoch": 161} {"train_loss": -6.936211109161377, "global_step": 27050, "epoch": 161} {"train_loss": -7.240510940551758, "global_step": 27051, "epoch": 161} {"train_loss": -7.082084655761719, "global_step": 27052, "epoch": 161} {"train_loss": -7.353806495666504, "global_step": 27053, "epoch": 161} {"train_loss": -7.24732780456543, "global_step": 27054, "epoch": 161} {"train_loss": -7.094913005828857, "global_step": 27055, "epoch": 161} {"train_loss": -7.152714252471924, "global_step": 27056, "epoch": 161} {"train_loss": -6.978396892547607, "global_step": 27057, "epoch": 161} {"train_loss": -7.056781768798828, "global_step": 27058, "epoch": 161} {"train_loss": -7.026361465454102, "global_step": 27059, "epoch": 161} {"train_loss": -7.251947402954102, "global_step": 27060, "epoch": 161} {"train_loss": -7.214426040649414, "global_step": 27061, "epoch": 161} {"train_loss": -7.073663711547852, "global_step": 27062, "epoch": 161} {"train_loss": -6.968395233154297, "global_step": 27063, "epoch": 161} {"train_loss": -7.361960411071777, "global_step": 27064, "epoch": 161} {"train_loss": -7.126780986785889, "global_step": 27065, "epoch": 161} {"train_loss": -7.278143882751465, "global_step": 27066, "epoch": 161} {"train_loss": -7.263575553894043, "global_step": 27067, "epoch": 161} {"train_loss": -7.30607795715332, "global_step": 27068, "epoch": 161} {"train_loss": -7.319278240203857, "global_step": 27069, "epoch": 161} {"train_loss": -7.249181747436523, "global_step": 27070, "epoch": 161} {"train_loss": -7.352512359619141, "global_step": 27071, "epoch": 161} {"train_loss": -7.3990373611450195, "global_step": 27072, "epoch": 161} {"train_loss": -7.452902793884277, "global_step": 27073, "epoch": 161} {"train_loss": -7.362942695617676, "global_step": 27074, "epoch": 161} {"train_loss": -7.426126480102539, "global_step": 27075, "epoch": 161} {"train_loss": -7.422834396362305, "global_step": 27076, "epoch": 161} {"train_loss": -7.388156414031982, "global_step": 27077, "epoch": 161} {"train_loss": -7.347198486328125, "global_step": 27078, "epoch": 161} {"train_loss": -7.205937385559082, "global_step": 27079, "epoch": 161} {"train_loss": -7.715827465057373, "global_step": 27080, "epoch": 161} {"train_loss": -7.348916053771973, "global_step": 27081, "epoch": 161} {"train_loss": -7.284657001495361, "global_step": 27082, "epoch": 161} {"train_loss": -7.363762855529785, "global_step": 27083, "epoch": 161} {"train_loss": -7.399035453796387, "global_step": 27084, "epoch": 161} {"train_loss": -7.148595809936523, "global_step": 27085, "epoch": 161} {"train_loss": -7.647095680236816, "global_step": 27086, "epoch": 161} {"train_loss": -7.532540321350098, "global_step": 27087, "epoch": 161} {"train_loss": -7.344912052154541, "global_step": 27088, "epoch": 161} {"train_loss": -7.49349308013916, "global_step": 27089, "epoch": 161} {"train_loss": -7.342705726623535, "global_step": 27090, "epoch": 161} {"train_loss": -7.197516441345215, "global_step": 27091, "epoch": 161} {"train_loss": -7.55148458480835, "global_step": 27092, "epoch": 161} {"train_loss": -7.142405033111572, "global_step": 27093, "epoch": 161} {"train_loss": -7.278433322906494, "global_step": 27094, "epoch": 161} {"train_loss": -7.4606781005859375, "global_step": 27095, "epoch": 161} {"train_loss": -7.221609115600586, "global_step": 27096, "epoch": 161} {"train_loss": -7.1258721351623535, "global_step": 27097, "epoch": 161} {"train_loss": -7.307010650634766, "global_step": 27098, "epoch": 161} {"train_loss": -6.884572505950928, "global_step": 27099, "epoch": 161} {"train_loss": -7.113003730773926, "global_step": 27100, "epoch": 161} {"train_loss": -7.032144546508789, "global_step": 27101, "epoch": 161} {"train_loss": -7.362973690032959, "global_step": 27102, "epoch": 161} {"train_loss": -7.191166400909424, "global_step": 27103, "epoch": 161} {"train_loss": -7.352142810821533, "global_step": 27104, "epoch": 161} {"train_loss": -7.354560852050781, "global_step": 27105, "epoch": 161} {"train_loss": -6.906318187713623, "global_step": 27106, "epoch": 161} {"train_loss": -7.195854187011719, "global_step": 27107, "epoch": 161} {"train_loss": -7.242896556854248, "global_step": 27108, "epoch": 161} {"train_loss": -6.995063304901123, "global_step": 27109, "epoch": 161} {"train_loss": -7.329676628112793, "global_step": 27110, "epoch": 161} {"train_loss": -7.008279800415039, "global_step": 27111, "epoch": 161} {"train_loss": -7.276537895202637, "global_step": 27112, "epoch": 161} {"train_loss": -7.017976760864258, "global_step": 27113, "epoch": 161} {"train_loss": -7.297763824462891, "global_step": 27114, "epoch": 161} {"train_loss": -7.275634288787842, "global_step": 27115, "epoch": 161} {"train_loss": -6.813725471496582, "global_step": 27116, "epoch": 161} {"train_loss": -7.418929100036621, "global_step": 27117, "epoch": 161} {"train_loss": -7.184632301330566, "global_step": 27118, "epoch": 161} {"train_loss": -7.1971893310546875, "global_step": 27119, "epoch": 161} {"train_loss": -7.404740810394287, "global_step": 27120, "epoch": 161} {"train_loss": -7.269558906555176, "global_step": 27121, "epoch": 161} {"train_loss": -7.248255729675293, "global_step": 27122, "epoch": 161} {"train_loss": -7.221895694732666, "global_step": 27123, "epoch": 161} {"train_loss": -7.493344306945801, "global_step": 27124, "epoch": 161} {"train_loss": -7.2962422370910645, "global_step": 27125, "epoch": 161} {"train_loss": -7.541477203369141, "global_step": 27126, "epoch": 161} {"train_loss": -7.3036627769470215, "global_step": 27127, "epoch": 161} {"train_loss": -7.212045192718506, "global_step": 27128, "epoch": 161} {"train_loss": -7.324090003967285, "global_step": 27129, "epoch": 161} {"train_loss": -7.290237903594971, "global_step": 27130, "epoch": 161} {"train_loss": -7.333539962768555, "global_step": 27131, "epoch": 161} {"train_loss": -7.0785064697265625, "global_step": 27132, "epoch": 161} {"train_loss": -7.255217552185059, "global_step": 27133, "epoch": 161} {"train_loss": -7.33521842956543, "global_step": 27134, "epoch": 161} {"train_loss": -7.389693737030029, "global_step": 27135, "epoch": 161} {"train_loss": -7.293635368347168, "global_step": 27136, "epoch": 161} {"train_loss": -7.2366790771484375, "global_step": 27137, "epoch": 161} {"train_loss": -7.331185340881348, "global_step": 27138, "epoch": 161} {"train_loss": -7.313926696777344, "global_step": 27139, "epoch": 161} {"train_loss": -7.253949165344238, "global_step": 27140, "epoch": 161} {"train_loss": -7.308187007904053, "global_step": 27141, "epoch": 161} {"train_loss": -7.27325439453125, "global_step": 27142, "epoch": 161} {"train_loss": -7.538748741149902, "global_step": 27143, "epoch": 161} {"train_loss": -7.219477653503418, "global_step": 27144, "epoch": 161} {"train_loss": -7.444746971130371, "global_step": 27145, "epoch": 161} {"train_loss": -7.426558494567871, "global_step": 27146, "epoch": 161} {"train_loss": -7.456800937652588, "global_step": 27147, "epoch": 161} {"train_loss": -7.376937389373779, "global_step": 27148, "epoch": 161} {"train_loss": -7.395771503448486, "global_step": 27149, "epoch": 161} {"train_loss": -7.152061462402344, "global_step": 27150, "epoch": 161} {"train_loss": -7.468343734741211, "global_step": 27151, "epoch": 161} {"train_loss": -7.214088439941406, "global_step": 27152, "epoch": 161} {"train_loss": -7.379517078399658, "global_step": 27153, "epoch": 161} {"train_loss": -7.025713920593262, "global_step": 27154, "epoch": 161} {"train_loss": -7.090655326843262, "global_step": 27155, "epoch": 161} {"train_loss": -7.448594093322754, "global_step": 27156, "epoch": 161} {"train_loss": -7.338480472564697, "global_step": 27157, "epoch": 161} {"train_loss": -7.3751630783081055, "global_step": 27158, "epoch": 161} {"train_loss": -7.324020862579346, "global_step": 27159, "epoch": 161} {"train_loss": -7.2068071365356445, "global_step": 27160, "epoch": 161} {"train_loss": -7.5810112953186035, "global_step": 27161, "epoch": 161} {"train_loss": -7.391934394836426, "global_step": 27162, "epoch": 161} {"train_loss": -7.527866363525391, "global_step": 27163, "epoch": 161} {"train_loss": -7.288814067840576, "global_step": 27164, "epoch": 161} {"train_loss": -7.260660171508789, "global_step": 27165, "epoch": 161} {"train_loss": -7.159353256225586, "global_step": 27166, "epoch": 161} {"train_loss": -7.354642391204834, "global_step": 27167, "epoch": 161} {"train_loss": -7.265021324157715, "global_step": 27168, "epoch": 161} {"train_loss": -7.4280595779418945, "global_step": 27169, "epoch": 161} {"train_loss": -7.217065334320068, "global_step": 27170, "epoch": 161} {"train_loss": -7.362421035766602, "global_step": 27171, "epoch": 161} {"train_loss": -7.302501678466797, "global_step": 27172, "epoch": 161} {"train_loss": -7.382120132446289, "global_step": 27173, "epoch": 161} {"train_loss": -6.647320747375488, "global_step": 27174, "epoch": 161} {"train_loss": -7.211241722106934, "global_step": 27175, "epoch": 161} {"train_loss": -7.366076469421387, "global_step": 27176, "epoch": 161} {"train_loss": -7.193607807159424, "global_step": 27177, "epoch": 161} {"train_loss": -7.098655700683594, "global_step": 27178, "epoch": 161} {"train_loss": -7.471972465515137, "global_step": 27179, "epoch": 161} {"train_loss": -7.342968940734863, "global_step": 27180, "epoch": 161} {"train_loss": -7.208989143371582, "global_step": 27181, "epoch": 161} {"train_loss": -7.221090793609619, "global_step": 27182, "epoch": 161} {"train_loss": -7.4559855461120605, "global_step": 27183, "epoch": 161} {"train_loss": -7.378711700439453, "global_step": 27184, "epoch": 161} {"train_loss": -7.065840244293213, "global_step": 27185, "epoch": 161} {"train_loss": -7.1331787109375, "global_step": 27186, "epoch": 161} {"train_loss": -7.498871326446533, "global_step": 27187, "epoch": 161} {"train_loss": -7.301029682159424, "global_step": 27188, "epoch": 161} {"train_loss": -7.407312870025635, "global_step": 27189, "epoch": 161} {"train_loss": -7.308553695678711, "global_step": 27190, "epoch": 161} {"train_loss": -7.255168914794922, "global_step": 27191, "epoch": 161} {"train_loss": -7.260125160217285, "global_step": 27192, "epoch": 161} {"train_loss": -7.498691558837891, "global_step": 27193, "epoch": 161} {"train_loss": -7.358855247497559, "global_step": 27194, "epoch": 161} {"train_loss": -7.297077178955078, "global_step": 27195, "epoch": 161} {"train_loss": -7.0713300704956055, "global_step": 27196, "epoch": 161} {"train_loss": -7.672540187835693, "global_step": 27197, "epoch": 161} {"train_loss": -7.201197624206543, "global_step": 27198, "epoch": 161} {"train_loss": -7.34724235534668, "global_step": 27199, "epoch": 161} {"train_loss": -7.165685176849365, "global_step": 27200, "epoch": 161} {"train_loss": -7.191741466522217, "global_step": 27201, "epoch": 161} {"train_loss": -7.031623363494873, "global_step": 27202, "epoch": 161} {"train_loss": -7.293656349182129, "global_step": 27203, "epoch": 161} {"train_loss": -7.165590286254883, "global_step": 27204, "epoch": 161} {"train_loss": -6.98107385635376, "global_step": 27205, "epoch": 161} {"train_loss": -6.85923433303833, "global_step": 27206, "epoch": 161} {"train_loss": -7.268828868865967, "global_step": 27207, "epoch": 161} {"train_loss": -7.044057846069336, "global_step": 27208, "epoch": 161} {"train_loss": -7.180689811706543, "global_step": 27209, "epoch": 161} {"train_loss": -7.370585918426514, "global_step": 27210, "epoch": 161} {"train_loss": -7.268491744995117, "global_step": 27211, "epoch": 161} {"train_loss": -7.314842224121094, "global_step": 27212, "epoch": 161} {"train_loss": -7.348325729370117, "global_step": 27213, "epoch": 161} {"train_loss": -7.313117027282715, "global_step": 27214, "epoch": 161} {"train_loss": -7.270180421216147, "global_step": 27215, "epoch": 161, "val_loss": 194883.078125} {"train_loss": -7.480969429016113, "global_step": 27216, "epoch": 162} {"train_loss": -7.228163719177246, "global_step": 27217, "epoch": 162} {"train_loss": -7.293159008026123, "global_step": 27218, "epoch": 162} {"train_loss": -7.094450950622559, "global_step": 27219, "epoch": 162} {"train_loss": -7.365128517150879, "global_step": 27220, "epoch": 162} {"train_loss": -7.323505878448486, "global_step": 27221, "epoch": 162} {"train_loss": -7.080102920532227, "global_step": 27222, "epoch": 162} {"train_loss": -7.18762731552124, "global_step": 27223, "epoch": 162} {"train_loss": -7.341361045837402, "global_step": 27224, "epoch": 162} {"train_loss": -7.204632759094238, "global_step": 27225, "epoch": 162} {"train_loss": -7.138486862182617, "global_step": 27226, "epoch": 162} {"train_loss": -7.218581199645996, "global_step": 27227, "epoch": 162} {"train_loss": -7.354216575622559, "global_step": 27228, "epoch": 162} {"train_loss": -7.284048080444336, "global_step": 27229, "epoch": 162} {"train_loss": -6.945003509521484, "global_step": 27230, "epoch": 162} {"train_loss": -7.322310447692871, "global_step": 27231, "epoch": 162} {"train_loss": -7.216076850891113, "global_step": 27232, "epoch": 162} {"train_loss": -7.403879642486572, "global_step": 27233, "epoch": 162} {"train_loss": -7.3176069259643555, "global_step": 27234, "epoch": 162} {"train_loss": -7.274765968322754, "global_step": 27235, "epoch": 162} {"train_loss": -7.495143890380859, "global_step": 27236, "epoch": 162} {"train_loss": -7.394990921020508, "global_step": 27237, "epoch": 162} {"train_loss": -7.192522048950195, "global_step": 27238, "epoch": 162} {"train_loss": -7.381744384765625, "global_step": 27239, "epoch": 162} {"train_loss": -7.375997066497803, "global_step": 27240, "epoch": 162} {"train_loss": -7.464278221130371, "global_step": 27241, "epoch": 162} {"train_loss": -7.4611310958862305, "global_step": 27242, "epoch": 162} {"train_loss": -7.552968978881836, "global_step": 27243, "epoch": 162} {"train_loss": -7.56585693359375, "global_step": 27244, "epoch": 162} {"train_loss": -7.384305000305176, "global_step": 27245, "epoch": 162} {"train_loss": -7.418708801269531, "global_step": 27246, "epoch": 162} {"train_loss": -7.305067539215088, "global_step": 27247, "epoch": 162} {"train_loss": -7.195690155029297, "global_step": 27248, "epoch": 162} {"train_loss": -7.382345199584961, "global_step": 27249, "epoch": 162} {"train_loss": -7.092803001403809, "global_step": 27250, "epoch": 162} {"train_loss": -7.131368637084961, "global_step": 27251, "epoch": 162} {"train_loss": -7.153008460998535, "global_step": 27252, "epoch": 162} {"train_loss": -7.279969215393066, "global_step": 27253, "epoch": 162} {"train_loss": -7.333439826965332, "global_step": 27254, "epoch": 162} {"train_loss": -7.419719219207764, "global_step": 27255, "epoch": 162} {"train_loss": -7.150739669799805, "global_step": 27256, "epoch": 162} {"train_loss": -7.184263229370117, "global_step": 27257, "epoch": 162} {"train_loss": -7.157842636108398, "global_step": 27258, "epoch": 162} {"train_loss": -7.4729766845703125, "global_step": 27259, "epoch": 162} {"train_loss": -7.553380966186523, "global_step": 27260, "epoch": 162} {"train_loss": -7.219854831695557, "global_step": 27261, "epoch": 162} {"train_loss": -7.2320237159729, "global_step": 27262, "epoch": 162} {"train_loss": -7.209554672241211, "global_step": 27263, "epoch": 162} {"train_loss": -7.331579208374023, "global_step": 27264, "epoch": 162} {"train_loss": -7.354543685913086, "global_step": 27265, "epoch": 162} {"train_loss": -7.171465873718262, "global_step": 27266, "epoch": 162} {"train_loss": -7.26154899597168, "global_step": 27267, "epoch": 162} {"train_loss": -7.177547454833984, "global_step": 27268, "epoch": 162} {"train_loss": -7.251108169555664, "global_step": 27269, "epoch": 162} {"train_loss": -7.3434224128723145, "global_step": 27270, "epoch": 162} {"train_loss": -7.1074604988098145, "global_step": 27271, "epoch": 162} {"train_loss": -7.134488105773926, "global_step": 27272, "epoch": 162} {"train_loss": -7.191648006439209, "global_step": 27273, "epoch": 162} {"train_loss": -6.817854881286621, "global_step": 27274, "epoch": 162} {"train_loss": -7.38516902923584, "global_step": 27275, "epoch": 162} {"train_loss": -6.924000263214111, "global_step": 27276, "epoch": 162} {"train_loss": -7.17013692855835, "global_step": 27277, "epoch": 162} {"train_loss": -7.537016868591309, "global_step": 27278, "epoch": 162} {"train_loss": -7.203000068664551, "global_step": 27279, "epoch": 162} {"train_loss": -7.310635089874268, "global_step": 27280, "epoch": 162} {"train_loss": -7.35135555267334, "global_step": 27281, "epoch": 162} {"train_loss": -7.305479526519775, "global_step": 27282, "epoch": 162} {"train_loss": -7.246792793273926, "global_step": 27283, "epoch": 162} {"train_loss": -7.393489360809326, "global_step": 27284, "epoch": 162} {"train_loss": -7.172991752624512, "global_step": 27285, "epoch": 162} {"train_loss": -7.351031303405762, "global_step": 27286, "epoch": 162} {"train_loss": -7.47335147857666, "global_step": 27287, "epoch": 162} {"train_loss": -7.579592227935791, "global_step": 27288, "epoch": 162} {"train_loss": -7.250119209289551, "global_step": 27289, "epoch": 162} {"train_loss": -7.205783367156982, "global_step": 27290, "epoch": 162} {"train_loss": -7.704445838928223, "global_step": 27291, "epoch": 162} {"train_loss": -6.8836565017700195, "global_step": 27292, "epoch": 162} {"train_loss": -7.146757125854492, "global_step": 27293, "epoch": 162} {"train_loss": -7.038614749908447, "global_step": 27294, "epoch": 162} {"train_loss": -7.249750137329102, "global_step": 27295, "epoch": 162} {"train_loss": -7.09615421295166, "global_step": 27296, "epoch": 162} {"train_loss": -7.516003608703613, "global_step": 27297, "epoch": 162} {"train_loss": -7.086728096008301, "global_step": 27298, "epoch": 162} {"train_loss": -7.046923637390137, "global_step": 27299, "epoch": 162} {"train_loss": -7.109570503234863, "global_step": 27300, "epoch": 162} {"train_loss": -7.163074493408203, "global_step": 27301, "epoch": 162} {"train_loss": -7.0887250900268555, "global_step": 27302, "epoch": 162} {"train_loss": -7.116452217102051, "global_step": 27303, "epoch": 162} {"train_loss": -7.103628635406494, "global_step": 27304, "epoch": 162} {"train_loss": -6.938567161560059, "global_step": 27305, "epoch": 162} {"train_loss": -7.411100387573242, "global_step": 27306, "epoch": 162} {"train_loss": -7.163815975189209, "global_step": 27307, "epoch": 162} {"train_loss": -7.311219215393066, "global_step": 27308, "epoch": 162} {"train_loss": -7.179569721221924, "global_step": 27309, "epoch": 162} {"train_loss": -7.297321796417236, "global_step": 27310, "epoch": 162} {"train_loss": -7.225879192352295, "global_step": 27311, "epoch": 162} {"train_loss": -7.3912553787231445, "global_step": 27312, "epoch": 162} {"train_loss": -7.074855804443359, "global_step": 27313, "epoch": 162} {"train_loss": -7.30047082901001, "global_step": 27314, "epoch": 162} {"train_loss": -7.20906925201416, "global_step": 27315, "epoch": 162} {"train_loss": -7.187268257141113, "global_step": 27316, "epoch": 162} {"train_loss": -7.299800872802734, "global_step": 27317, "epoch": 162} {"train_loss": -7.27321195602417, "global_step": 27318, "epoch": 162} {"train_loss": -7.308258056640625, "global_step": 27319, "epoch": 162} {"train_loss": -7.504171371459961, "global_step": 27320, "epoch": 162} {"train_loss": -7.294201850891113, "global_step": 27321, "epoch": 162} {"train_loss": -7.433109283447266, "global_step": 27322, "epoch": 162} {"train_loss": -7.399173259735107, "global_step": 27323, "epoch": 162} {"train_loss": -7.320491313934326, "global_step": 27324, "epoch": 162} {"train_loss": -7.250370025634766, "global_step": 27325, "epoch": 162} {"train_loss": -7.394148826599121, "global_step": 27326, "epoch": 162} {"train_loss": -7.562623023986816, "global_step": 27327, "epoch": 162} {"train_loss": -7.253391742706299, "global_step": 27328, "epoch": 162} {"train_loss": -7.221386432647705, "global_step": 27329, "epoch": 162} {"train_loss": -7.472867012023926, "global_step": 27330, "epoch": 162} {"train_loss": -7.261404991149902, "global_step": 27331, "epoch": 162} {"train_loss": -7.422909736633301, "global_step": 27332, "epoch": 162} {"train_loss": -7.311113357543945, "global_step": 27333, "epoch": 162} {"train_loss": -7.402620315551758, "global_step": 27334, "epoch": 162} {"train_loss": -7.341257572174072, "global_step": 27335, "epoch": 162} {"train_loss": -7.328518390655518, "global_step": 27336, "epoch": 162} {"train_loss": -7.355802536010742, "global_step": 27337, "epoch": 162} {"train_loss": -7.32900857925415, "global_step": 27338, "epoch": 162} {"train_loss": -7.3613433837890625, "global_step": 27339, "epoch": 162} {"train_loss": -7.327432632446289, "global_step": 27340, "epoch": 162} {"train_loss": -7.333970069885254, "global_step": 27341, "epoch": 162} {"train_loss": -7.464572906494141, "global_step": 27342, "epoch": 162} {"train_loss": -7.34651517868042, "global_step": 27343, "epoch": 162} {"train_loss": -7.077530860900879, "global_step": 27344, "epoch": 162} {"train_loss": -7.244637489318848, "global_step": 27345, "epoch": 162} {"train_loss": -7.411981582641602, "global_step": 27346, "epoch": 162} {"train_loss": -7.187858581542969, "global_step": 27347, "epoch": 162} {"train_loss": -7.051125526428223, "global_step": 27348, "epoch": 162} {"train_loss": -7.040465354919434, "global_step": 27349, "epoch": 162} {"train_loss": -7.331148147583008, "global_step": 27350, "epoch": 162} {"train_loss": -7.063604354858398, "global_step": 27351, "epoch": 162} {"train_loss": -7.0523834228515625, "global_step": 27352, "epoch": 162} {"train_loss": -7.224761486053467, "global_step": 27353, "epoch": 162} {"train_loss": -7.267088890075684, "global_step": 27354, "epoch": 162} {"train_loss": -7.289898872375488, "global_step": 27355, "epoch": 162} {"train_loss": -7.081106185913086, "global_step": 27356, "epoch": 162} {"train_loss": -7.211301803588867, "global_step": 27357, "epoch": 162} {"train_loss": -7.248586177825928, "global_step": 27358, "epoch": 162} {"train_loss": -7.108360290527344, "global_step": 27359, "epoch": 162} {"train_loss": -7.270584583282471, "global_step": 27360, "epoch": 162} {"train_loss": -7.250654220581055, "global_step": 27361, "epoch": 162} {"train_loss": -7.0882134437561035, "global_step": 27362, "epoch": 162} {"train_loss": -7.27687931060791, "global_step": 27363, "epoch": 162} {"train_loss": -7.554098129272461, "global_step": 27364, "epoch": 162} {"train_loss": -7.240176677703857, "global_step": 27365, "epoch": 162} {"train_loss": -7.3714141845703125, "global_step": 27366, "epoch": 162} {"train_loss": -7.156557083129883, "global_step": 27367, "epoch": 162} {"train_loss": -7.300571441650391, "global_step": 27368, "epoch": 162} {"train_loss": -7.166093349456787, "global_step": 27369, "epoch": 162} {"train_loss": -7.253259181976318, "global_step": 27370, "epoch": 162} {"train_loss": -7.361835956573486, "global_step": 27371, "epoch": 162} {"train_loss": -7.147647380828857, "global_step": 27372, "epoch": 162} {"train_loss": -7.228297233581543, "global_step": 27373, "epoch": 162} {"train_loss": -7.027966499328613, "global_step": 27374, "epoch": 162} {"train_loss": -7.230660438537598, "global_step": 27375, "epoch": 162} {"train_loss": -7.266354560852051, "global_step": 27376, "epoch": 162} {"train_loss": -7.390195369720459, "global_step": 27377, "epoch": 162} {"train_loss": -7.241923809051514, "global_step": 27378, "epoch": 162} {"train_loss": -7.344962120056152, "global_step": 27379, "epoch": 162} {"train_loss": -7.485033988952637, "global_step": 27380, "epoch": 162} {"train_loss": -7.270874500274658, "global_step": 27381, "epoch": 162} {"train_loss": -7.370297431945801, "global_step": 27382, "epoch": 162} {"train_loss": -7.269745449225108, "global_step": 27383, "epoch": 162, "val_loss": 197102.453125} {"train_loss": -7.506952285766602, "global_step": 27384, "epoch": 163} {"train_loss": -7.5327558517456055, "global_step": 27385, "epoch": 163} {"train_loss": -7.270411491394043, "global_step": 27386, "epoch": 163} {"train_loss": -7.317080497741699, "global_step": 27387, "epoch": 163} {"train_loss": -7.338615417480469, "global_step": 27388, "epoch": 163} {"train_loss": -7.36247444152832, "global_step": 27389, "epoch": 163} {"train_loss": -7.093862533569336, "global_step": 27390, "epoch": 163} {"train_loss": -7.512035369873047, "global_step": 27391, "epoch": 163} {"train_loss": -7.309350967407227, "global_step": 27392, "epoch": 163} {"train_loss": -7.310606479644775, "global_step": 27393, "epoch": 163} {"train_loss": -7.550207138061523, "global_step": 27394, "epoch": 163} {"train_loss": -7.195141792297363, "global_step": 27395, "epoch": 163} {"train_loss": -7.5238871574401855, "global_step": 27396, "epoch": 163} {"train_loss": -7.538033485412598, "global_step": 27397, "epoch": 163} {"train_loss": -7.227559566497803, "global_step": 27398, "epoch": 163} {"train_loss": -7.409880638122559, "global_step": 27399, "epoch": 163} {"train_loss": -7.364916801452637, "global_step": 27400, "epoch": 163} {"train_loss": -7.270920753479004, "global_step": 27401, "epoch": 163} {"train_loss": -7.448674201965332, "global_step": 27402, "epoch": 163} {"train_loss": -6.78317928314209, "global_step": 27403, "epoch": 163} {"train_loss": -7.270270347595215, "global_step": 27404, "epoch": 163} {"train_loss": -7.143946647644043, "global_step": 27405, "epoch": 163} {"train_loss": -7.30180549621582, "global_step": 27406, "epoch": 163} {"train_loss": -7.41465425491333, "global_step": 27407, "epoch": 163} {"train_loss": -7.3944292068481445, "global_step": 27408, "epoch": 163} {"train_loss": -7.328367233276367, "global_step": 27409, "epoch": 163} {"train_loss": -7.204384803771973, "global_step": 27410, "epoch": 163} {"train_loss": -7.41729736328125, "global_step": 27411, "epoch": 163} {"train_loss": -7.319878578186035, "global_step": 27412, "epoch": 163} {"train_loss": -7.255208492279053, "global_step": 27413, "epoch": 163} {"train_loss": -7.338635444641113, "global_step": 27414, "epoch": 163} {"train_loss": -7.349423885345459, "global_step": 27415, "epoch": 163} {"train_loss": -7.458808898925781, "global_step": 27416, "epoch": 163} {"train_loss": -7.456087112426758, "global_step": 27417, "epoch": 163} {"train_loss": -7.388144493103027, "global_step": 27418, "epoch": 163} {"train_loss": -7.142936706542969, "global_step": 27419, "epoch": 163} {"train_loss": -7.296049118041992, "global_step": 27420, "epoch": 163} {"train_loss": -7.1884565353393555, "global_step": 27421, "epoch": 163} {"train_loss": -7.374687194824219, "global_step": 27422, "epoch": 163} {"train_loss": -7.07119607925415, "global_step": 27423, "epoch": 163} {"train_loss": -7.3310675621032715, "global_step": 27424, "epoch": 163} {"train_loss": -7.241186141967773, "global_step": 27425, "epoch": 163} {"train_loss": -7.212437152862549, "global_step": 27426, "epoch": 163} {"train_loss": -7.052289009094238, "global_step": 27427, "epoch": 163} {"train_loss": -7.125617504119873, "global_step": 27428, "epoch": 163} {"train_loss": -6.8724589347839355, "global_step": 27429, "epoch": 163} {"train_loss": -7.244635105133057, "global_step": 27430, "epoch": 163} {"train_loss": -7.167584419250488, "global_step": 27431, "epoch": 163} {"train_loss": -7.263503551483154, "global_step": 27432, "epoch": 163} {"train_loss": -7.380378246307373, "global_step": 27433, "epoch": 163} {"train_loss": -7.150881767272949, "global_step": 27434, "epoch": 163} {"train_loss": -7.173521041870117, "global_step": 27435, "epoch": 163} {"train_loss": -7.407573699951172, "global_step": 27436, "epoch": 163} {"train_loss": -7.231939315795898, "global_step": 27437, "epoch": 163} {"train_loss": -7.302264213562012, "global_step": 27438, "epoch": 163} {"train_loss": -7.187238693237305, "global_step": 27439, "epoch": 163} {"train_loss": -7.364935874938965, "global_step": 27440, "epoch": 163} {"train_loss": -7.26527738571167, "global_step": 27441, "epoch": 163} {"train_loss": -7.188610553741455, "global_step": 27442, "epoch": 163} {"train_loss": -7.306029319763184, "global_step": 27443, "epoch": 163} {"train_loss": -7.356698989868164, "global_step": 27444, "epoch": 163} {"train_loss": -7.176626205444336, "global_step": 27445, "epoch": 163} {"train_loss": -7.231595993041992, "global_step": 27446, "epoch": 163} {"train_loss": -7.400264263153076, "global_step": 27447, "epoch": 163} {"train_loss": -7.270726203918457, "global_step": 27448, "epoch": 163} {"train_loss": -7.309605598449707, "global_step": 27449, "epoch": 163} {"train_loss": -7.288918495178223, "global_step": 27450, "epoch": 163} {"train_loss": -7.339897155761719, "global_step": 27451, "epoch": 163} {"train_loss": -7.329204559326172, "global_step": 27452, "epoch": 163} {"train_loss": -7.266947269439697, "global_step": 27453, "epoch": 163} {"train_loss": -7.167530059814453, "global_step": 27454, "epoch": 163} {"train_loss": -7.256441116333008, "global_step": 27455, "epoch": 163} {"train_loss": -7.389017105102539, "global_step": 27456, "epoch": 163} {"train_loss": -7.18263578414917, "global_step": 27457, "epoch": 163} {"train_loss": -7.215115070343018, "global_step": 27458, "epoch": 163} {"train_loss": -7.239163398742676, "global_step": 27459, "epoch": 163} {"train_loss": -7.428621292114258, "global_step": 27460, "epoch": 163} {"train_loss": -6.983409881591797, "global_step": 27461, "epoch": 163} {"train_loss": -7.277440071105957, "global_step": 27462, "epoch": 163} {"train_loss": -7.22053337097168, "global_step": 27463, "epoch": 163} {"train_loss": -7.106076240539551, "global_step": 27464, "epoch": 163} {"train_loss": -7.110334396362305, "global_step": 27465, "epoch": 163} {"train_loss": -7.055712699890137, "global_step": 27466, "epoch": 163} {"train_loss": -7.37424373626709, "global_step": 27467, "epoch": 163} {"train_loss": -7.290976047515869, "global_step": 27468, "epoch": 163} {"train_loss": -7.299468040466309, "global_step": 27469, "epoch": 163} {"train_loss": -7.246453285217285, "global_step": 27470, "epoch": 163} {"train_loss": -7.158389091491699, "global_step": 27471, "epoch": 163} {"train_loss": -7.47347354888916, "global_step": 27472, "epoch": 163} {"train_loss": -7.1601786613464355, "global_step": 27473, "epoch": 163} {"train_loss": -7.3378190994262695, "global_step": 27474, "epoch": 163} {"train_loss": -7.285589218139648, "global_step": 27475, "epoch": 163} {"train_loss": -7.5101318359375, "global_step": 27476, "epoch": 163} {"train_loss": -7.156428337097168, "global_step": 27477, "epoch": 163} {"train_loss": -7.1319580078125, "global_step": 27478, "epoch": 163} {"train_loss": -7.495902061462402, "global_step": 27479, "epoch": 163} {"train_loss": -7.172185897827148, "global_step": 27480, "epoch": 163} {"train_loss": -7.194119453430176, "global_step": 27481, "epoch": 163} {"train_loss": -7.5366973876953125, "global_step": 27482, "epoch": 163} {"train_loss": -7.342421531677246, "global_step": 27483, "epoch": 163} {"train_loss": -7.530648231506348, "global_step": 27484, "epoch": 163} {"train_loss": -7.461668968200684, "global_step": 27485, "epoch": 163} {"train_loss": -7.209540367126465, "global_step": 27486, "epoch": 163} {"train_loss": -7.300220966339111, "global_step": 27487, "epoch": 163} {"train_loss": -7.312950134277344, "global_step": 27488, "epoch": 163} {"train_loss": -7.354254722595215, "global_step": 27489, "epoch": 163} {"train_loss": -7.501139163970947, "global_step": 27490, "epoch": 163} {"train_loss": -7.3864641189575195, "global_step": 27491, "epoch": 163} {"train_loss": -7.340836524963379, "global_step": 27492, "epoch": 163} {"train_loss": -7.147414684295654, "global_step": 27493, "epoch": 163} {"train_loss": -7.582622528076172, "global_step": 27494, "epoch": 163} {"train_loss": -7.208894729614258, "global_step": 27495, "epoch": 163} {"train_loss": -7.395261764526367, "global_step": 27496, "epoch": 163} {"train_loss": -7.4523725509643555, "global_step": 27497, "epoch": 163} {"train_loss": -7.408946990966797, "global_step": 27498, "epoch": 163} {"train_loss": -7.4891276359558105, "global_step": 27499, "epoch": 163} {"train_loss": -7.436581134796143, "global_step": 27500, "epoch": 163} {"train_loss": -7.28983211517334, "global_step": 27501, "epoch": 163} {"train_loss": -7.359745979309082, "global_step": 27502, "epoch": 163} {"train_loss": -7.553761959075928, "global_step": 27503, "epoch": 163} {"train_loss": -7.554807662963867, "global_step": 27504, "epoch": 163} {"train_loss": -7.493826866149902, "global_step": 27505, "epoch": 163} {"train_loss": -7.417718887329102, "global_step": 27506, "epoch": 163} {"train_loss": -7.17515754699707, "global_step": 27507, "epoch": 163} {"train_loss": -7.418920516967773, "global_step": 27508, "epoch": 163} {"train_loss": -7.301265716552734, "global_step": 27509, "epoch": 163} {"train_loss": -7.207270622253418, "global_step": 27510, "epoch": 163} {"train_loss": -7.3189496994018555, "global_step": 27511, "epoch": 163} {"train_loss": -7.405123710632324, "global_step": 27512, "epoch": 163} {"train_loss": -7.406396865844727, "global_step": 27513, "epoch": 163} {"train_loss": -7.331487655639648, "global_step": 27514, "epoch": 163} {"train_loss": -7.210111141204834, "global_step": 27515, "epoch": 163} {"train_loss": -7.232978343963623, "global_step": 27516, "epoch": 163} {"train_loss": -7.280372619628906, "global_step": 27517, "epoch": 163} {"train_loss": -7.290953159332275, "global_step": 27518, "epoch": 163} {"train_loss": -7.271842002868652, "global_step": 27519, "epoch": 163} {"train_loss": -7.302618980407715, "global_step": 27520, "epoch": 163} {"train_loss": -7.306527137756348, "global_step": 27521, "epoch": 163} {"train_loss": -7.159481525421143, "global_step": 27522, "epoch": 163} {"train_loss": -7.166224956512451, "global_step": 27523, "epoch": 163} {"train_loss": -7.329471588134766, "global_step": 27524, "epoch": 163} {"train_loss": -7.380445957183838, "global_step": 27525, "epoch": 163} {"train_loss": -7.215085983276367, "global_step": 27526, "epoch": 163} {"train_loss": -7.329216480255127, "global_step": 27527, "epoch": 163} {"train_loss": -7.302760124206543, "global_step": 27528, "epoch": 163} {"train_loss": -7.297662734985352, "global_step": 27529, "epoch": 163} {"train_loss": -6.959737777709961, "global_step": 27530, "epoch": 163} {"train_loss": -7.485220909118652, "global_step": 27531, "epoch": 163} {"train_loss": -7.090692520141602, "global_step": 27532, "epoch": 163} {"train_loss": -7.253737449645996, "global_step": 27533, "epoch": 163} {"train_loss": -7.05635929107666, "global_step": 27534, "epoch": 163} {"train_loss": -7.108575820922852, "global_step": 27535, "epoch": 163} {"train_loss": -7.346525192260742, "global_step": 27536, "epoch": 163} {"train_loss": -7.133952617645264, "global_step": 27537, "epoch": 163} {"train_loss": -7.3608269691467285, "global_step": 27538, "epoch": 163} {"train_loss": -7.16804313659668, "global_step": 27539, "epoch": 163} {"train_loss": -7.03001070022583, "global_step": 27540, "epoch": 163} {"train_loss": -7.371427536010742, "global_step": 27541, "epoch": 163} {"train_loss": -6.824960708618164, "global_step": 27542, "epoch": 163} {"train_loss": -7.129489898681641, "global_step": 27543, "epoch": 163} {"train_loss": -6.7830705642700195, "global_step": 27544, "epoch": 163} {"train_loss": -7.000270843505859, "global_step": 27545, "epoch": 163} {"train_loss": -7.404977798461914, "global_step": 27546, "epoch": 163} {"train_loss": -7.198328495025635, "global_step": 27547, "epoch": 163} {"train_loss": -7.213810920715332, "global_step": 27548, "epoch": 163} {"train_loss": -6.916443347930908, "global_step": 27549, "epoch": 163} {"train_loss": -7.361363410949707, "global_step": 27550, "epoch": 163} {"train_loss": -7.2813163711911155, "global_step": 27551, "epoch": 163, "val_loss": 193447.84375} {"train_loss": -6.968145370483398, "global_step": 27552, "epoch": 164} {"train_loss": -7.214942932128906, "global_step": 27553, "epoch": 164} {"train_loss": -7.247866630554199, "global_step": 27554, "epoch": 164} {"train_loss": -7.11391544342041, "global_step": 27555, "epoch": 164} {"train_loss": -7.0698394775390625, "global_step": 27556, "epoch": 164} {"train_loss": -7.138644218444824, "global_step": 27557, "epoch": 164} {"train_loss": -7.213988780975342, "global_step": 27558, "epoch": 164} {"train_loss": -7.226243495941162, "global_step": 27559, "epoch": 164} {"train_loss": -7.180435657501221, "global_step": 27560, "epoch": 164} {"train_loss": -7.145265579223633, "global_step": 27561, "epoch": 164} {"train_loss": -7.1283416748046875, "global_step": 27562, "epoch": 164} {"train_loss": -7.347804069519043, "global_step": 27563, "epoch": 164} {"train_loss": -7.451021194458008, "global_step": 27564, "epoch": 164} {"train_loss": -7.331067085266113, "global_step": 27565, "epoch": 164} {"train_loss": -7.2559003829956055, "global_step": 27566, "epoch": 164} {"train_loss": -7.42267370223999, "global_step": 27567, "epoch": 164} {"train_loss": -7.324639320373535, "global_step": 27568, "epoch": 164} {"train_loss": -7.302347183227539, "global_step": 27569, "epoch": 164} {"train_loss": -7.275318145751953, "global_step": 27570, "epoch": 164} {"train_loss": -7.2725982666015625, "global_step": 27571, "epoch": 164} {"train_loss": -7.226885795593262, "global_step": 27572, "epoch": 164} {"train_loss": -7.1096391677856445, "global_step": 27573, "epoch": 164} {"train_loss": -7.338422775268555, "global_step": 27574, "epoch": 164} {"train_loss": -7.4638848304748535, "global_step": 27575, "epoch": 164} {"train_loss": -7.375566005706787, "global_step": 27576, "epoch": 164} {"train_loss": -7.6022047996521, "global_step": 27577, "epoch": 164} {"train_loss": -7.415652751922607, "global_step": 27578, "epoch": 164} {"train_loss": -7.434815406799316, "global_step": 27579, "epoch": 164} {"train_loss": -7.564302444458008, "global_step": 27580, "epoch": 164} {"train_loss": -7.478187561035156, "global_step": 27581, "epoch": 164} {"train_loss": -7.447823524475098, "global_step": 27582, "epoch": 164} {"train_loss": -7.250786781311035, "global_step": 27583, "epoch": 164} {"train_loss": -7.536941051483154, "global_step": 27584, "epoch": 164} {"train_loss": -7.332150459289551, "global_step": 27585, "epoch": 164} {"train_loss": -7.318014144897461, "global_step": 27586, "epoch": 164} {"train_loss": -7.378500461578369, "global_step": 27587, "epoch": 164} {"train_loss": -7.402289390563965, "global_step": 27588, "epoch": 164} {"train_loss": -7.455289840698242, "global_step": 27589, "epoch": 164} {"train_loss": -7.360572338104248, "global_step": 27590, "epoch": 164} {"train_loss": -7.433944225311279, "global_step": 27591, "epoch": 164} {"train_loss": -7.566910743713379, "global_step": 27592, "epoch": 164} {"train_loss": -7.31203556060791, "global_step": 27593, "epoch": 164} {"train_loss": -7.422698020935059, "global_step": 27594, "epoch": 164} {"train_loss": -7.28452205657959, "global_step": 27595, "epoch": 164} {"train_loss": -7.558771133422852, "global_step": 27596, "epoch": 164} {"train_loss": -7.18147087097168, "global_step": 27597, "epoch": 164} {"train_loss": -7.327445983886719, "global_step": 27598, "epoch": 164} {"train_loss": -7.034144878387451, "global_step": 27599, "epoch": 164} {"train_loss": -7.068170547485352, "global_step": 27600, "epoch": 164} {"train_loss": -7.13741397857666, "global_step": 27601, "epoch": 164} {"train_loss": -7.210302352905273, "global_step": 27602, "epoch": 164} {"train_loss": -7.417778968811035, "global_step": 27603, "epoch": 164} {"train_loss": -7.348156452178955, "global_step": 27604, "epoch": 164} {"train_loss": -7.331594467163086, "global_step": 27605, "epoch": 164} {"train_loss": -7.3488922119140625, "global_step": 27606, "epoch": 164} {"train_loss": -7.257324695587158, "global_step": 27607, "epoch": 164} {"train_loss": -7.338403701782227, "global_step": 27608, "epoch": 164} {"train_loss": -7.3918914794921875, "global_step": 27609, "epoch": 164} {"train_loss": -7.430556774139404, "global_step": 27610, "epoch": 164} {"train_loss": -7.4615478515625, "global_step": 27611, "epoch": 164} {"train_loss": -7.304742813110352, "global_step": 27612, "epoch": 164} {"train_loss": -7.379567623138428, "global_step": 27613, "epoch": 164} {"train_loss": -7.520168304443359, "global_step": 27614, "epoch": 164} {"train_loss": -7.4530439376831055, "global_step": 27615, "epoch": 164} {"train_loss": -7.077375888824463, "global_step": 27616, "epoch": 164} {"train_loss": -7.577629566192627, "global_step": 27617, "epoch": 164} {"train_loss": -7.077422142028809, "global_step": 27618, "epoch": 164} {"train_loss": -7.228848934173584, "global_step": 27619, "epoch": 164} {"train_loss": -7.088813304901123, "global_step": 27620, "epoch": 164} {"train_loss": -7.537668228149414, "global_step": 27621, "epoch": 164} {"train_loss": -7.032763481140137, "global_step": 27622, "epoch": 164} {"train_loss": -7.019524574279785, "global_step": 27623, "epoch": 164} {"train_loss": -7.553818225860596, "global_step": 27624, "epoch": 164} {"train_loss": -7.085006237030029, "global_step": 27625, "epoch": 164} {"train_loss": -6.969402313232422, "global_step": 27626, "epoch": 164} {"train_loss": -6.946045398712158, "global_step": 27627, "epoch": 164} {"train_loss": -7.404130935668945, "global_step": 27628, "epoch": 164} {"train_loss": -7.15806770324707, "global_step": 27629, "epoch": 164} {"train_loss": -7.028587341308594, "global_step": 27630, "epoch": 164} {"train_loss": -7.376954078674316, "global_step": 27631, "epoch": 164} {"train_loss": -7.393415451049805, "global_step": 27632, "epoch": 164} {"train_loss": -7.120753288269043, "global_step": 27633, "epoch": 164} {"train_loss": -7.358757019042969, "global_step": 27634, "epoch": 164} {"train_loss": -7.395650863647461, "global_step": 27635, "epoch": 164} {"train_loss": -7.366771697998047, "global_step": 27636, "epoch": 164} {"train_loss": -7.1783552169799805, "global_step": 27637, "epoch": 164} {"train_loss": -7.34471321105957, "global_step": 27638, "epoch": 164} {"train_loss": -7.541679859161377, "global_step": 27639, "epoch": 164} {"train_loss": -7.535762786865234, "global_step": 27640, "epoch": 164} {"train_loss": -7.251608848571777, "global_step": 27641, "epoch": 164} {"train_loss": -7.402768135070801, "global_step": 27642, "epoch": 164} {"train_loss": -7.424382209777832, "global_step": 27643, "epoch": 164} {"train_loss": -7.465339660644531, "global_step": 27644, "epoch": 164} {"train_loss": -7.437523365020752, "global_step": 27645, "epoch": 164} {"train_loss": -7.440648078918457, "global_step": 27646, "epoch": 164} {"train_loss": -7.296121597290039, "global_step": 27647, "epoch": 164} {"train_loss": -7.3182573318481445, "global_step": 27648, "epoch": 164} {"train_loss": -7.105312347412109, "global_step": 27649, "epoch": 164} {"train_loss": -7.436153411865234, "global_step": 27650, "epoch": 164} {"train_loss": -7.504726409912109, "global_step": 27651, "epoch": 164} {"train_loss": -7.413752555847168, "global_step": 27652, "epoch": 164} {"train_loss": -7.252531051635742, "global_step": 27653, "epoch": 164} {"train_loss": -7.157808780670166, "global_step": 27654, "epoch": 164} {"train_loss": -7.346290588378906, "global_step": 27655, "epoch": 164} {"train_loss": -7.357818603515625, "global_step": 27656, "epoch": 164} {"train_loss": -7.314521312713623, "global_step": 27657, "epoch": 164} {"train_loss": -7.203813552856445, "global_step": 27658, "epoch": 164} {"train_loss": -7.281110763549805, "global_step": 27659, "epoch": 164} {"train_loss": -7.233174800872803, "global_step": 27660, "epoch": 164} {"train_loss": -7.139023303985596, "global_step": 27661, "epoch": 164} {"train_loss": -7.122758388519287, "global_step": 27662, "epoch": 164} {"train_loss": -7.345990180969238, "global_step": 27663, "epoch": 164} {"train_loss": -7.0924882888793945, "global_step": 27664, "epoch": 164} {"train_loss": -7.081857681274414, "global_step": 27665, "epoch": 164} {"train_loss": -7.252198219299316, "global_step": 27666, "epoch": 164} {"train_loss": -7.143975257873535, "global_step": 27667, "epoch": 164} {"train_loss": -7.0827789306640625, "global_step": 27668, "epoch": 164} {"train_loss": -7.206205368041992, "global_step": 27669, "epoch": 164} {"train_loss": -6.834440231323242, "global_step": 27670, "epoch": 164} {"train_loss": -7.311077117919922, "global_step": 27671, "epoch": 164} {"train_loss": -7.225470542907715, "global_step": 27672, "epoch": 164} {"train_loss": -6.924643516540527, "global_step": 27673, "epoch": 164} {"train_loss": -6.820026874542236, "global_step": 27674, "epoch": 164} {"train_loss": -6.996883392333984, "global_step": 27675, "epoch": 164} {"train_loss": -7.016552448272705, "global_step": 27676, "epoch": 164} {"train_loss": -7.10847806930542, "global_step": 27677, "epoch": 164} {"train_loss": -7.015670299530029, "global_step": 27678, "epoch": 164} {"train_loss": -7.375914573669434, "global_step": 27679, "epoch": 164} {"train_loss": -7.008522987365723, "global_step": 27680, "epoch": 164} {"train_loss": -7.094919204711914, "global_step": 27681, "epoch": 164} {"train_loss": -7.337452411651611, "global_step": 27682, "epoch": 164} {"train_loss": -6.976499557495117, "global_step": 27683, "epoch": 164} {"train_loss": -7.148222923278809, "global_step": 27684, "epoch": 164} {"train_loss": -7.076852798461914, "global_step": 27685, "epoch": 164} {"train_loss": -6.809837341308594, "global_step": 27686, "epoch": 164} {"train_loss": -7.344908714294434, "global_step": 27687, "epoch": 164} {"train_loss": -7.36276912689209, "global_step": 27688, "epoch": 164} {"train_loss": -7.1561689376831055, "global_step": 27689, "epoch": 164} {"train_loss": -7.243036270141602, "global_step": 27690, "epoch": 164} {"train_loss": -7.21268367767334, "global_step": 27691, "epoch": 164} {"train_loss": -7.211770534515381, "global_step": 27692, "epoch": 164} {"train_loss": -7.4200639724731445, "global_step": 27693, "epoch": 164} {"train_loss": -7.158958911895752, "global_step": 27694, "epoch": 164} {"train_loss": -7.42216682434082, "global_step": 27695, "epoch": 164} {"train_loss": -7.490365982055664, "global_step": 27696, "epoch": 164} {"train_loss": -7.410675525665283, "global_step": 27697, "epoch": 164} {"train_loss": -7.481897354125977, "global_step": 27698, "epoch": 164} {"train_loss": -7.248091220855713, "global_step": 27699, "epoch": 164} {"train_loss": -7.468148231506348, "global_step": 27700, "epoch": 164} {"train_loss": -7.432371616363525, "global_step": 27701, "epoch": 164} {"train_loss": -7.40531063079834, "global_step": 27702, "epoch": 164} {"train_loss": -7.359102249145508, "global_step": 27703, "epoch": 164} {"train_loss": -7.610560417175293, "global_step": 27704, "epoch": 164} {"train_loss": -7.496522903442383, "global_step": 27705, "epoch": 164} {"train_loss": -7.480513572692871, "global_step": 27706, "epoch": 164} {"train_loss": -7.531960964202881, "global_step": 27707, "epoch": 164} {"train_loss": -7.44619083404541, "global_step": 27708, "epoch": 164} {"train_loss": -7.606624603271484, "global_step": 27709, "epoch": 164} {"train_loss": -7.62229061126709, "global_step": 27710, "epoch": 164} {"train_loss": -7.589150428771973, "global_step": 27711, "epoch": 164} {"train_loss": -7.139135360717773, "global_step": 27712, "epoch": 164} {"train_loss": -7.451369285583496, "global_step": 27713, "epoch": 164} {"train_loss": -7.494725227355957, "global_step": 27714, "epoch": 164} {"train_loss": -7.286930084228516, "global_step": 27715, "epoch": 164} {"train_loss": -7.515052318572998, "global_step": 27716, "epoch": 164} {"train_loss": -7.311036109924316, "global_step": 27717, "epoch": 164} {"train_loss": -7.545658111572266, "global_step": 27718, "epoch": 164} {"train_loss": -7.295128325621287, "global_step": 27719, "epoch": 164, "val_loss": 191606.921875} {"train_loss": -7.495179176330566, "global_step": 27720, "epoch": 165} {"train_loss": -7.642229080200195, "global_step": 27721, "epoch": 165} {"train_loss": -7.0350213050842285, "global_step": 27722, "epoch": 165} {"train_loss": -7.415800094604492, "global_step": 27723, "epoch": 165} {"train_loss": -7.328932285308838, "global_step": 27724, "epoch": 165} {"train_loss": -7.182246208190918, "global_step": 27725, "epoch": 165} {"train_loss": -7.2653350830078125, "global_step": 27726, "epoch": 165} {"train_loss": -7.3815741539001465, "global_step": 27727, "epoch": 165} {"train_loss": -7.428844451904297, "global_step": 27728, "epoch": 165} {"train_loss": -7.37006950378418, "global_step": 27729, "epoch": 165} {"train_loss": -7.310742378234863, "global_step": 27730, "epoch": 165} {"train_loss": -7.385571002960205, "global_step": 27731, "epoch": 165} {"train_loss": -7.3902363777160645, "global_step": 27732, "epoch": 165} {"train_loss": -7.104228496551514, "global_step": 27733, "epoch": 165} {"train_loss": -7.467965126037598, "global_step": 27734, "epoch": 165} {"train_loss": -7.460102081298828, "global_step": 27735, "epoch": 165} {"train_loss": -7.462307453155518, "global_step": 27736, "epoch": 165} {"train_loss": -6.995580673217773, "global_step": 27737, "epoch": 165} {"train_loss": -7.356014728546143, "global_step": 27738, "epoch": 165} {"train_loss": -7.575605392456055, "global_step": 27739, "epoch": 165} {"train_loss": -7.423061370849609, "global_step": 27740, "epoch": 165} {"train_loss": -7.559326171875, "global_step": 27741, "epoch": 165} {"train_loss": -7.272804260253906, "global_step": 27742, "epoch": 165} {"train_loss": -7.1685638427734375, "global_step": 27743, "epoch": 165} {"train_loss": -7.115564346313477, "global_step": 27744, "epoch": 165} {"train_loss": -7.279294013977051, "global_step": 27745, "epoch": 165} {"train_loss": -7.42031192779541, "global_step": 27746, "epoch": 165} {"train_loss": -7.321140289306641, "global_step": 27747, "epoch": 165} {"train_loss": -7.426756858825684, "global_step": 27748, "epoch": 165} {"train_loss": -7.2642645835876465, "global_step": 27749, "epoch": 165} {"train_loss": -7.16549015045166, "global_step": 27750, "epoch": 165} {"train_loss": -7.604687213897705, "global_step": 27751, "epoch": 165} {"train_loss": -7.679312705993652, "global_step": 27752, "epoch": 165} {"train_loss": -7.449687480926514, "global_step": 27753, "epoch": 165} {"train_loss": -7.256716728210449, "global_step": 27754, "epoch": 165} {"train_loss": -7.369895935058594, "global_step": 27755, "epoch": 165} {"train_loss": -7.453080654144287, "global_step": 27756, "epoch": 165} {"train_loss": -7.574629783630371, "global_step": 27757, "epoch": 165} {"train_loss": -7.395896911621094, "global_step": 27758, "epoch": 165} {"train_loss": -7.516565322875977, "global_step": 27759, "epoch": 165} {"train_loss": -7.420223236083984, "global_step": 27760, "epoch": 165} {"train_loss": -7.426613807678223, "global_step": 27761, "epoch": 165} {"train_loss": -7.435636043548584, "global_step": 27762, "epoch": 165} {"train_loss": -7.422584533691406, "global_step": 27763, "epoch": 165} {"train_loss": -7.344670295715332, "global_step": 27764, "epoch": 165} {"train_loss": -7.473829746246338, "global_step": 27765, "epoch": 165} {"train_loss": -7.286454200744629, "global_step": 27766, "epoch": 165} {"train_loss": -7.134902000427246, "global_step": 27767, "epoch": 165} {"train_loss": -7.415299892425537, "global_step": 27768, "epoch": 165} {"train_loss": -7.38723087310791, "global_step": 27769, "epoch": 165} {"train_loss": -7.37929105758667, "global_step": 27770, "epoch": 165} {"train_loss": -7.387545585632324, "global_step": 27771, "epoch": 165} {"train_loss": -7.184440612792969, "global_step": 27772, "epoch": 165} {"train_loss": -7.200751304626465, "global_step": 27773, "epoch": 165} {"train_loss": -7.15504264831543, "global_step": 27774, "epoch": 165} {"train_loss": -7.3013715744018555, "global_step": 27775, "epoch": 165} {"train_loss": -7.263927459716797, "global_step": 27776, "epoch": 165} {"train_loss": -7.2676777839660645, "global_step": 27777, "epoch": 165} {"train_loss": -7.3177361488342285, "global_step": 27778, "epoch": 165} {"train_loss": -7.236943244934082, "global_step": 27779, "epoch": 165} {"train_loss": -7.408080101013184, "global_step": 27780, "epoch": 165} {"train_loss": -7.391184329986572, "global_step": 27781, "epoch": 165} {"train_loss": -7.208347797393799, "global_step": 27782, "epoch": 165} {"train_loss": -7.159771919250488, "global_step": 27783, "epoch": 165} {"train_loss": -7.351093292236328, "global_step": 27784, "epoch": 165} {"train_loss": -7.381218910217285, "global_step": 27785, "epoch": 165} {"train_loss": -7.289433479309082, "global_step": 27786, "epoch": 165} {"train_loss": -7.173200607299805, "global_step": 27787, "epoch": 165} {"train_loss": -7.436567783355713, "global_step": 27788, "epoch": 165} {"train_loss": -7.184654235839844, "global_step": 27789, "epoch": 165} {"train_loss": -7.203038215637207, "global_step": 27790, "epoch": 165} {"train_loss": -7.388925552368164, "global_step": 27791, "epoch": 165} {"train_loss": -7.550173759460449, "global_step": 27792, "epoch": 165} {"train_loss": -7.411069869995117, "global_step": 27793, "epoch": 165} {"train_loss": -7.399025917053223, "global_step": 27794, "epoch": 165} {"train_loss": -7.396383285522461, "global_step": 27795, "epoch": 165} {"train_loss": -7.722633361816406, "global_step": 27796, "epoch": 165} {"train_loss": -7.466360569000244, "global_step": 27797, "epoch": 165} {"train_loss": -7.339348793029785, "global_step": 27798, "epoch": 165} {"train_loss": -7.40998649597168, "global_step": 27799, "epoch": 165} {"train_loss": -7.405298709869385, "global_step": 27800, "epoch": 165} {"train_loss": -7.68038272857666, "global_step": 27801, "epoch": 165} {"train_loss": -7.550868988037109, "global_step": 27802, "epoch": 165} {"train_loss": -7.326485633850098, "global_step": 27803, "epoch": 165} {"train_loss": -7.399164199829102, "global_step": 27804, "epoch": 165} {"train_loss": -7.378537178039551, "global_step": 27805, "epoch": 165} {"train_loss": -7.521300315856934, "global_step": 27806, "epoch": 165} {"train_loss": -7.355788230895996, "global_step": 27807, "epoch": 165} {"train_loss": -7.465826034545898, "global_step": 27808, "epoch": 165} {"train_loss": -7.2445068359375, "global_step": 27809, "epoch": 165} {"train_loss": -7.4149885177612305, "global_step": 27810, "epoch": 165} {"train_loss": -7.373017311096191, "global_step": 27811, "epoch": 165} {"train_loss": -7.088438987731934, "global_step": 27812, "epoch": 165} {"train_loss": -7.404963493347168, "global_step": 27813, "epoch": 165} {"train_loss": -7.206103324890137, "global_step": 27814, "epoch": 165} {"train_loss": -7.606680870056152, "global_step": 27815, "epoch": 165} {"train_loss": -7.328460693359375, "global_step": 27816, "epoch": 165} {"train_loss": -7.435953140258789, "global_step": 27817, "epoch": 165} {"train_loss": -7.263711452484131, "global_step": 27818, "epoch": 165} {"train_loss": -7.445888996124268, "global_step": 27819, "epoch": 165} {"train_loss": -7.097020149230957, "global_step": 27820, "epoch": 165} {"train_loss": -6.9333176612854, "global_step": 27821, "epoch": 165} {"train_loss": -7.338801383972168, "global_step": 27822, "epoch": 165} {"train_loss": -7.225625038146973, "global_step": 27823, "epoch": 165} {"train_loss": -7.284506797790527, "global_step": 27824, "epoch": 165} {"train_loss": -7.00197696685791, "global_step": 27825, "epoch": 165} {"train_loss": -7.4257493019104, "global_step": 27826, "epoch": 165} {"train_loss": -7.0350236892700195, "global_step": 27827, "epoch": 165} {"train_loss": -7.162881851196289, "global_step": 27828, "epoch": 165} {"train_loss": -7.378757476806641, "global_step": 27829, "epoch": 165} {"train_loss": -7.188967704772949, "global_step": 27830, "epoch": 165} {"train_loss": -7.256911277770996, "global_step": 27831, "epoch": 165} {"train_loss": -7.121208190917969, "global_step": 27832, "epoch": 165} {"train_loss": -7.080516338348389, "global_step": 27833, "epoch": 165} {"train_loss": -7.2432990074157715, "global_step": 27834, "epoch": 165} {"train_loss": -7.497317314147949, "global_step": 27835, "epoch": 165} {"train_loss": -7.150964736938477, "global_step": 27836, "epoch": 165} {"train_loss": -7.375614643096924, "global_step": 27837, "epoch": 165} {"train_loss": -7.4606451988220215, "global_step": 27838, "epoch": 165} {"train_loss": -7.3593854904174805, "global_step": 27839, "epoch": 165} {"train_loss": -7.478426456451416, "global_step": 27840, "epoch": 165} {"train_loss": -7.306360244750977, "global_step": 27841, "epoch": 165} {"train_loss": -7.352059841156006, "global_step": 27842, "epoch": 165} {"train_loss": -7.385555267333984, "global_step": 27843, "epoch": 165} {"train_loss": -7.2357587814331055, "global_step": 27844, "epoch": 165} {"train_loss": -7.218114376068115, "global_step": 27845, "epoch": 165} {"train_loss": -7.349710941314697, "global_step": 27846, "epoch": 165} {"train_loss": -6.871706962585449, "global_step": 27847, "epoch": 165} {"train_loss": -7.265255928039551, "global_step": 27848, "epoch": 165} {"train_loss": -7.029352188110352, "global_step": 27849, "epoch": 165} {"train_loss": -7.330990791320801, "global_step": 27850, "epoch": 165} {"train_loss": -7.335907936096191, "global_step": 27851, "epoch": 165} {"train_loss": -7.308435440063477, "global_step": 27852, "epoch": 165} {"train_loss": -7.19724178314209, "global_step": 27853, "epoch": 165} {"train_loss": -7.16325044631958, "global_step": 27854, "epoch": 165} {"train_loss": -7.39835786819458, "global_step": 27855, "epoch": 165} {"train_loss": -7.450736999511719, "global_step": 27856, "epoch": 165} {"train_loss": -7.43150520324707, "global_step": 27857, "epoch": 165} {"train_loss": -7.28591251373291, "global_step": 27858, "epoch": 165} {"train_loss": -7.28175687789917, "global_step": 27859, "epoch": 165} {"train_loss": -7.25573205947876, "global_step": 27860, "epoch": 165} {"train_loss": -7.104025840759277, "global_step": 27861, "epoch": 165} {"train_loss": -7.269881248474121, "global_step": 27862, "epoch": 165} {"train_loss": -7.219944953918457, "global_step": 27863, "epoch": 165} {"train_loss": -7.101932048797607, "global_step": 27864, "epoch": 165} {"train_loss": -6.991939544677734, "global_step": 27865, "epoch": 165} {"train_loss": -7.276159286499023, "global_step": 27866, "epoch": 165} {"train_loss": -7.085081577301025, "global_step": 27867, "epoch": 165} {"train_loss": -7.203248977661133, "global_step": 27868, "epoch": 165} {"train_loss": -7.067934036254883, "global_step": 27869, "epoch": 165} {"train_loss": -7.240209102630615, "global_step": 27870, "epoch": 165} {"train_loss": -7.255976676940918, "global_step": 27871, "epoch": 165} {"train_loss": -7.155841827392578, "global_step": 27872, "epoch": 165} {"train_loss": -7.343958377838135, "global_step": 27873, "epoch": 165} {"train_loss": -7.307076454162598, "global_step": 27874, "epoch": 165} {"train_loss": -7.31624174118042, "global_step": 27875, "epoch": 165} {"train_loss": -7.3930206298828125, "global_step": 27876, "epoch": 165} {"train_loss": -7.178937911987305, "global_step": 27877, "epoch": 165} {"train_loss": -7.319052696228027, "global_step": 27878, "epoch": 165} {"train_loss": -7.302045822143555, "global_step": 27879, "epoch": 165} {"train_loss": -7.225061416625977, "global_step": 27880, "epoch": 165} {"train_loss": -7.170836448669434, "global_step": 27881, "epoch": 165} {"train_loss": -7.196900367736816, "global_step": 27882, "epoch": 165} {"train_loss": -7.048106670379639, "global_step": 27883, "epoch": 165} {"train_loss": -7.281509876251221, "global_step": 27884, "epoch": 165} {"train_loss": -7.179991722106934, "global_step": 27885, "epoch": 165} {"train_loss": -7.353229999542236, "global_step": 27886, "epoch": 165} {"train_loss": -7.313367477485111, "global_step": 27887, "epoch": 165, "val_loss": 194836.765625, "train_action_mse_error": 12.344679832458496} {"train_loss": -7.136401176452637, "global_step": 27888, "epoch": 166} {"train_loss": -7.057376861572266, "global_step": 27889, "epoch": 166} {"train_loss": -7.20067834854126, "global_step": 27890, "epoch": 166} {"train_loss": -6.9758710861206055, "global_step": 27891, "epoch": 166} {"train_loss": -7.222052574157715, "global_step": 27892, "epoch": 166} {"train_loss": -7.023780822753906, "global_step": 27893, "epoch": 166} {"train_loss": -7.156650066375732, "global_step": 27894, "epoch": 166} {"train_loss": -7.229346752166748, "global_step": 27895, "epoch": 166} {"train_loss": -7.094396591186523, "global_step": 27896, "epoch": 166} {"train_loss": -7.260907173156738, "global_step": 27897, "epoch": 166} {"train_loss": -7.3016180992126465, "global_step": 27898, "epoch": 166} {"train_loss": -7.3548736572265625, "global_step": 27899, "epoch": 166} {"train_loss": -7.203392028808594, "global_step": 27900, "epoch": 166} {"train_loss": -7.190011978149414, "global_step": 27901, "epoch": 166} {"train_loss": -7.273923397064209, "global_step": 27902, "epoch": 166} {"train_loss": -7.29508113861084, "global_step": 27903, "epoch": 166} {"train_loss": -7.160240650177002, "global_step": 27904, "epoch": 166} {"train_loss": -7.378954887390137, "global_step": 27905, "epoch": 166} {"train_loss": -7.2342352867126465, "global_step": 27906, "epoch": 166} {"train_loss": -7.396463394165039, "global_step": 27907, "epoch": 166} {"train_loss": -7.345331192016602, "global_step": 27908, "epoch": 166} {"train_loss": -7.3128557205200195, "global_step": 27909, "epoch": 166} {"train_loss": -7.105031967163086, "global_step": 27910, "epoch": 166} {"train_loss": -7.2440080642700195, "global_step": 27911, "epoch": 166} {"train_loss": -7.353569984436035, "global_step": 27912, "epoch": 166} {"train_loss": -7.366610527038574, "global_step": 27913, "epoch": 166} {"train_loss": -7.169917106628418, "global_step": 27914, "epoch": 166} {"train_loss": -7.282993316650391, "global_step": 27915, "epoch": 166} {"train_loss": -7.518209457397461, "global_step": 27916, "epoch": 166} {"train_loss": -7.069619655609131, "global_step": 27917, "epoch": 166} {"train_loss": -7.374139308929443, "global_step": 27918, "epoch": 166} {"train_loss": -7.424775123596191, "global_step": 27919, "epoch": 166} {"train_loss": -7.272843360900879, "global_step": 27920, "epoch": 166} {"train_loss": -7.505545139312744, "global_step": 27921, "epoch": 166} {"train_loss": -7.54530143737793, "global_step": 27922, "epoch": 166} {"train_loss": -7.591448783874512, "global_step": 27923, "epoch": 166} {"train_loss": -7.306879997253418, "global_step": 27924, "epoch": 166} {"train_loss": -7.060772895812988, "global_step": 27925, "epoch": 166} {"train_loss": -7.401679992675781, "global_step": 27926, "epoch": 166} {"train_loss": -7.362418174743652, "global_step": 27927, "epoch": 166} {"train_loss": -7.267108917236328, "global_step": 27928, "epoch": 166} {"train_loss": -7.662961006164551, "global_step": 27929, "epoch": 166} {"train_loss": -7.321244239807129, "global_step": 27930, "epoch": 166} {"train_loss": -7.450704574584961, "global_step": 27931, "epoch": 166} {"train_loss": -7.436426162719727, "global_step": 27932, "epoch": 166} {"train_loss": -7.122024059295654, "global_step": 27933, "epoch": 166} {"train_loss": -7.4758830070495605, "global_step": 27934, "epoch": 166} {"train_loss": -7.540879726409912, "global_step": 27935, "epoch": 166} {"train_loss": -7.551907539367676, "global_step": 27936, "epoch": 166} {"train_loss": -7.369982719421387, "global_step": 27937, "epoch": 166} {"train_loss": -7.442938804626465, "global_step": 27938, "epoch": 166} {"train_loss": -7.582441806793213, "global_step": 27939, "epoch": 166} {"train_loss": -7.521944999694824, "global_step": 27940, "epoch": 166} {"train_loss": -7.646414756774902, "global_step": 27941, "epoch": 166} {"train_loss": -7.460014343261719, "global_step": 27942, "epoch": 166} {"train_loss": -7.727445602416992, "global_step": 27943, "epoch": 166} {"train_loss": -7.513186454772949, "global_step": 27944, "epoch": 166} {"train_loss": -7.7145538330078125, "global_step": 27945, "epoch": 166} {"train_loss": -7.248023986816406, "global_step": 27946, "epoch": 166} {"train_loss": -7.662348747253418, "global_step": 27947, "epoch": 166} {"train_loss": -7.3438215255737305, "global_step": 27948, "epoch": 166} {"train_loss": -7.155486106872559, "global_step": 27949, "epoch": 166} {"train_loss": -7.190958023071289, "global_step": 27950, "epoch": 166} {"train_loss": -7.313100337982178, "global_step": 27951, "epoch": 166} {"train_loss": -7.2321038246154785, "global_step": 27952, "epoch": 166} {"train_loss": -7.168210029602051, "global_step": 27953, "epoch": 166} {"train_loss": -7.477865695953369, "global_step": 27954, "epoch": 166} {"train_loss": -7.440090656280518, "global_step": 27955, "epoch": 166} {"train_loss": -7.408262729644775, "global_step": 27956, "epoch": 166} {"train_loss": -7.466551780700684, "global_step": 27957, "epoch": 166} {"train_loss": -7.264971733093262, "global_step": 27958, "epoch": 166} {"train_loss": -7.478041172027588, "global_step": 27959, "epoch": 166} {"train_loss": -7.418041706085205, "global_step": 27960, "epoch": 166} {"train_loss": -7.139678001403809, "global_step": 27961, "epoch": 166} {"train_loss": -7.411718845367432, "global_step": 27962, "epoch": 166} {"train_loss": -7.020479202270508, "global_step": 27963, "epoch": 166} {"train_loss": -7.240891456604004, "global_step": 27964, "epoch": 166} {"train_loss": -7.068365097045898, "global_step": 27965, "epoch": 166} {"train_loss": -7.1877336502075195, "global_step": 27966, "epoch": 166} {"train_loss": -7.35992431640625, "global_step": 27967, "epoch": 166} {"train_loss": -7.091896057128906, "global_step": 27968, "epoch": 166} {"train_loss": -7.556430339813232, "global_step": 27969, "epoch": 166} {"train_loss": -7.205389022827148, "global_step": 27970, "epoch": 166} {"train_loss": -7.249356269836426, "global_step": 27971, "epoch": 166} {"train_loss": -7.318363189697266, "global_step": 27972, "epoch": 166} {"train_loss": -7.196469783782959, "global_step": 27973, "epoch": 166} {"train_loss": -7.265741348266602, "global_step": 27974, "epoch": 166} {"train_loss": -7.065195560455322, "global_step": 27975, "epoch": 166} {"train_loss": -7.217392921447754, "global_step": 27976, "epoch": 166} {"train_loss": -7.344723701477051, "global_step": 27977, "epoch": 166} {"train_loss": -7.170265197753906, "global_step": 27978, "epoch": 166} {"train_loss": -7.263498306274414, "global_step": 27979, "epoch": 166} {"train_loss": -7.070284843444824, "global_step": 27980, "epoch": 166} {"train_loss": -7.091085433959961, "global_step": 27981, "epoch": 166} {"train_loss": -7.342372894287109, "global_step": 27982, "epoch": 166} {"train_loss": -7.028866291046143, "global_step": 27983, "epoch": 166} {"train_loss": -7.332421779632568, "global_step": 27984, "epoch": 166} {"train_loss": -7.061051368713379, "global_step": 27985, "epoch": 166} {"train_loss": -7.328634738922119, "global_step": 27986, "epoch": 166} {"train_loss": -7.128332138061523, "global_step": 27987, "epoch": 166} {"train_loss": -7.409714698791504, "global_step": 27988, "epoch": 166} {"train_loss": -7.333331108093262, "global_step": 27989, "epoch": 166} {"train_loss": -7.180728912353516, "global_step": 27990, "epoch": 166} {"train_loss": -7.380636215209961, "global_step": 27991, "epoch": 166} {"train_loss": -7.364773750305176, "global_step": 27992, "epoch": 166} {"train_loss": -7.4090166091918945, "global_step": 27993, "epoch": 166} {"train_loss": -7.440690040588379, "global_step": 27994, "epoch": 166} {"train_loss": -7.4359002113342285, "global_step": 27995, "epoch": 166} {"train_loss": -7.488415718078613, "global_step": 27996, "epoch": 166} {"train_loss": -7.328974723815918, "global_step": 27997, "epoch": 166} {"train_loss": -7.209877014160156, "global_step": 27998, "epoch": 166} {"train_loss": -7.109129905700684, "global_step": 27999, "epoch": 166} {"train_loss": -7.3641743659973145, "global_step": 28000, "epoch": 166} {"train_loss": -7.242004871368408, "global_step": 28001, "epoch": 166} {"train_loss": -7.544895172119141, "global_step": 28002, "epoch": 166} {"train_loss": -7.322711944580078, "global_step": 28003, "epoch": 166} {"train_loss": -7.495492458343506, "global_step": 28004, "epoch": 166} {"train_loss": -7.135138988494873, "global_step": 28005, "epoch": 166} {"train_loss": -7.385386943817139, "global_step": 28006, "epoch": 166} {"train_loss": -7.019794464111328, "global_step": 28007, "epoch": 166} {"train_loss": -7.369232177734375, "global_step": 28008, "epoch": 166} {"train_loss": -7.337343692779541, "global_step": 28009, "epoch": 166} {"train_loss": -7.422516822814941, "global_step": 28010, "epoch": 166} {"train_loss": -7.216617584228516, "global_step": 28011, "epoch": 166} {"train_loss": -7.486751079559326, "global_step": 28012, "epoch": 166} {"train_loss": -7.343015193939209, "global_step": 28013, "epoch": 166} {"train_loss": -7.3273162841796875, "global_step": 28014, "epoch": 166} {"train_loss": -7.385235786437988, "global_step": 28015, "epoch": 166} {"train_loss": -7.392043113708496, "global_step": 28016, "epoch": 166} {"train_loss": -7.352154731750488, "global_step": 28017, "epoch": 166} {"train_loss": -7.529955863952637, "global_step": 28018, "epoch": 166} {"train_loss": -7.612453937530518, "global_step": 28019, "epoch": 166} {"train_loss": -7.45413875579834, "global_step": 28020, "epoch": 166} {"train_loss": -7.4742431640625, "global_step": 28021, "epoch": 166} {"train_loss": -7.489072322845459, "global_step": 28022, "epoch": 166} {"train_loss": -7.256050109863281, "global_step": 28023, "epoch": 166} {"train_loss": -7.426625728607178, "global_step": 28024, "epoch": 166} {"train_loss": -7.50614070892334, "global_step": 28025, "epoch": 166} {"train_loss": -7.326682090759277, "global_step": 28026, "epoch": 166} {"train_loss": -7.312400817871094, "global_step": 28027, "epoch": 166} {"train_loss": -7.361659049987793, "global_step": 28028, "epoch": 166} {"train_loss": -7.3556809425354, "global_step": 28029, "epoch": 166} {"train_loss": -7.385080814361572, "global_step": 28030, "epoch": 166} {"train_loss": -7.398125648498535, "global_step": 28031, "epoch": 166} {"train_loss": -7.320644378662109, "global_step": 28032, "epoch": 166} {"train_loss": -7.39210319519043, "global_step": 28033, "epoch": 166} {"train_loss": -7.558562278747559, "global_step": 28034, "epoch": 166} {"train_loss": -7.399802207946777, "global_step": 28035, "epoch": 166} {"train_loss": -7.192873001098633, "global_step": 28036, "epoch": 166} {"train_loss": -7.387341022491455, "global_step": 28037, "epoch": 166} {"train_loss": -7.3431901931762695, "global_step": 28038, "epoch": 166} {"train_loss": -7.5608720779418945, "global_step": 28039, "epoch": 166} {"train_loss": -7.422360420227051, "global_step": 28040, "epoch": 166} {"train_loss": -7.404534339904785, "global_step": 28041, "epoch": 166} {"train_loss": -7.297558784484863, "global_step": 28042, "epoch": 166} {"train_loss": -7.400402069091797, "global_step": 28043, "epoch": 166} {"train_loss": -7.572354316711426, "global_step": 28044, "epoch": 166} {"train_loss": -7.391430377960205, "global_step": 28045, "epoch": 166} {"train_loss": -7.438810348510742, "global_step": 28046, "epoch": 166} {"train_loss": -7.3787922859191895, "global_step": 28047, "epoch": 166} {"train_loss": -7.190410614013672, "global_step": 28048, "epoch": 166} {"train_loss": -7.388273239135742, "global_step": 28049, "epoch": 166} {"train_loss": -7.31083869934082, "global_step": 28050, "epoch": 166} {"train_loss": -7.344963073730469, "global_step": 28051, "epoch": 166} {"train_loss": -7.365476131439209, "global_step": 28052, "epoch": 166} {"train_loss": -7.179422378540039, "global_step": 28053, "epoch": 166} {"train_loss": -7.211178779602051, "global_step": 28054, "epoch": 166} {"train_loss": -7.329240373202732, "global_step": 28055, "epoch": 166, "val_loss": 191235.671875} {"train_loss": -7.452728271484375, "global_step": 28056, "epoch": 167} {"train_loss": -7.11713171005249, "global_step": 28057, "epoch": 167} {"train_loss": -7.220349311828613, "global_step": 28058, "epoch": 167} {"train_loss": -7.313565254211426, "global_step": 28059, "epoch": 167} {"train_loss": -7.281065940856934, "global_step": 28060, "epoch": 167} {"train_loss": -7.319492816925049, "global_step": 28061, "epoch": 167} {"train_loss": -7.320030212402344, "global_step": 28062, "epoch": 167} {"train_loss": -7.4194536209106445, "global_step": 28063, "epoch": 167} {"train_loss": -7.20352840423584, "global_step": 28064, "epoch": 167} {"train_loss": -7.4476542472839355, "global_step": 28065, "epoch": 167} {"train_loss": -7.129897117614746, "global_step": 28066, "epoch": 167} {"train_loss": -7.439043045043945, "global_step": 28067, "epoch": 167} {"train_loss": -7.54404354095459, "global_step": 28068, "epoch": 167} {"train_loss": -7.201314449310303, "global_step": 28069, "epoch": 167} {"train_loss": -7.018744468688965, "global_step": 28070, "epoch": 167} {"train_loss": -7.280083656311035, "global_step": 28071, "epoch": 167} {"train_loss": -7.323735237121582, "global_step": 28072, "epoch": 167} {"train_loss": -7.547060489654541, "global_step": 28073, "epoch": 167} {"train_loss": -7.255906105041504, "global_step": 28074, "epoch": 167} {"train_loss": -7.445487976074219, "global_step": 28075, "epoch": 167} {"train_loss": -7.476127624511719, "global_step": 28076, "epoch": 167} {"train_loss": -7.600793838500977, "global_step": 28077, "epoch": 167} {"train_loss": -7.382303714752197, "global_step": 28078, "epoch": 167} {"train_loss": -7.417886734008789, "global_step": 28079, "epoch": 167} {"train_loss": -7.3724446296691895, "global_step": 28080, "epoch": 167} {"train_loss": -7.557518005371094, "global_step": 28081, "epoch": 167} {"train_loss": -7.234927654266357, "global_step": 28082, "epoch": 167} {"train_loss": -7.473532676696777, "global_step": 28083, "epoch": 167} {"train_loss": -7.301113605499268, "global_step": 28084, "epoch": 167} {"train_loss": -7.452846527099609, "global_step": 28085, "epoch": 167} {"train_loss": -7.1451005935668945, "global_step": 28086, "epoch": 167} {"train_loss": -7.358112335205078, "global_step": 28087, "epoch": 167} {"train_loss": -7.403314590454102, "global_step": 28088, "epoch": 167} {"train_loss": -7.441496849060059, "global_step": 28089, "epoch": 167} {"train_loss": -7.227422714233398, "global_step": 28090, "epoch": 167} {"train_loss": -7.430529594421387, "global_step": 28091, "epoch": 167} {"train_loss": -7.288043022155762, "global_step": 28092, "epoch": 167} {"train_loss": -7.260334014892578, "global_step": 28093, "epoch": 167} {"train_loss": -7.290410041809082, "global_step": 28094, "epoch": 167} {"train_loss": -7.235857009887695, "global_step": 28095, "epoch": 167} {"train_loss": -7.525707244873047, "global_step": 28096, "epoch": 167} {"train_loss": -7.357304573059082, "global_step": 28097, "epoch": 167} {"train_loss": -7.334033966064453, "global_step": 28098, "epoch": 167} {"train_loss": -7.536368370056152, "global_step": 28099, "epoch": 167} {"train_loss": -7.606232643127441, "global_step": 28100, "epoch": 167} {"train_loss": -7.5566229820251465, "global_step": 28101, "epoch": 167} {"train_loss": -7.112009525299072, "global_step": 28102, "epoch": 167} {"train_loss": -7.188899040222168, "global_step": 28103, "epoch": 167} {"train_loss": -7.339311599731445, "global_step": 28104, "epoch": 167} {"train_loss": -7.375700950622559, "global_step": 28105, "epoch": 167} {"train_loss": -7.187648773193359, "global_step": 28106, "epoch": 167} {"train_loss": -7.4502434730529785, "global_step": 28107, "epoch": 167} {"train_loss": -7.2159624099731445, "global_step": 28108, "epoch": 167} {"train_loss": -7.431055068969727, "global_step": 28109, "epoch": 167} {"train_loss": -7.337996006011963, "global_step": 28110, "epoch": 167} {"train_loss": -7.400783538818359, "global_step": 28111, "epoch": 167} {"train_loss": -7.357626914978027, "global_step": 28112, "epoch": 167} {"train_loss": -7.171841144561768, "global_step": 28113, "epoch": 167} {"train_loss": -7.4106903076171875, "global_step": 28114, "epoch": 167} {"train_loss": -6.927006721496582, "global_step": 28115, "epoch": 167} {"train_loss": -7.254589080810547, "global_step": 28116, "epoch": 167} {"train_loss": -7.0100812911987305, "global_step": 28117, "epoch": 167} {"train_loss": -7.09202766418457, "global_step": 28118, "epoch": 167} {"train_loss": -7.297934055328369, "global_step": 28119, "epoch": 167} {"train_loss": -7.158985137939453, "global_step": 28120, "epoch": 167} {"train_loss": -7.190518379211426, "global_step": 28121, "epoch": 167} {"train_loss": -7.132596015930176, "global_step": 28122, "epoch": 167} {"train_loss": -7.283022880554199, "global_step": 28123, "epoch": 167} {"train_loss": -7.38162899017334, "global_step": 28124, "epoch": 167} {"train_loss": -7.177983283996582, "global_step": 28125, "epoch": 167} {"train_loss": -7.2355732917785645, "global_step": 28126, "epoch": 167} {"train_loss": -7.317746162414551, "global_step": 28127, "epoch": 167} {"train_loss": -7.407530307769775, "global_step": 28128, "epoch": 167} {"train_loss": -7.209568977355957, "global_step": 28129, "epoch": 167} {"train_loss": -7.136336326599121, "global_step": 28130, "epoch": 167} {"train_loss": -7.376404762268066, "global_step": 28131, "epoch": 167} {"train_loss": -7.306509494781494, "global_step": 28132, "epoch": 167} {"train_loss": -7.108901023864746, "global_step": 28133, "epoch": 167} {"train_loss": -7.196011066436768, "global_step": 28134, "epoch": 167} {"train_loss": -7.571763038635254, "global_step": 28135, "epoch": 167} {"train_loss": -7.198695182800293, "global_step": 28136, "epoch": 167} {"train_loss": -7.335057258605957, "global_step": 28137, "epoch": 167} {"train_loss": -7.400379180908203, "global_step": 28138, "epoch": 167} {"train_loss": -7.08651065826416, "global_step": 28139, "epoch": 167} {"train_loss": -7.411219596862793, "global_step": 28140, "epoch": 167} {"train_loss": -7.612308502197266, "global_step": 28141, "epoch": 167} {"train_loss": -7.610470771789551, "global_step": 28142, "epoch": 167} {"train_loss": -7.445622444152832, "global_step": 28143, "epoch": 167} {"train_loss": -7.435670852661133, "global_step": 28144, "epoch": 167} {"train_loss": -7.439681053161621, "global_step": 28145, "epoch": 167} {"train_loss": -7.5347137451171875, "global_step": 28146, "epoch": 167} {"train_loss": -7.403036117553711, "global_step": 28147, "epoch": 167} {"train_loss": -7.4617600440979, "global_step": 28148, "epoch": 167} {"train_loss": -7.4056878089904785, "global_step": 28149, "epoch": 167} {"train_loss": -7.364565849304199, "global_step": 28150, "epoch": 167} {"train_loss": -7.258710861206055, "global_step": 28151, "epoch": 167} {"train_loss": -7.552553176879883, "global_step": 28152, "epoch": 167} {"train_loss": -7.564093589782715, "global_step": 28153, "epoch": 167} {"train_loss": -7.4056267738342285, "global_step": 28154, "epoch": 167} {"train_loss": -7.434118270874023, "global_step": 28155, "epoch": 167} {"train_loss": -7.659392356872559, "global_step": 28156, "epoch": 167} {"train_loss": -7.196789741516113, "global_step": 28157, "epoch": 167} {"train_loss": -7.529577732086182, "global_step": 28158, "epoch": 167} {"train_loss": -7.375418186187744, "global_step": 28159, "epoch": 167} {"train_loss": -7.483814239501953, "global_step": 28160, "epoch": 167} {"train_loss": -7.4793243408203125, "global_step": 28161, "epoch": 167} {"train_loss": -7.284211158752441, "global_step": 28162, "epoch": 167} {"train_loss": -7.493802070617676, "global_step": 28163, "epoch": 167} {"train_loss": -7.1817216873168945, "global_step": 28164, "epoch": 167} {"train_loss": -7.494607925415039, "global_step": 28165, "epoch": 167} {"train_loss": -7.551477432250977, "global_step": 28166, "epoch": 167} {"train_loss": -7.57268762588501, "global_step": 28167, "epoch": 167} {"train_loss": -7.369955062866211, "global_step": 28168, "epoch": 167} {"train_loss": -7.436159133911133, "global_step": 28169, "epoch": 167} {"train_loss": -7.36065673828125, "global_step": 28170, "epoch": 167} {"train_loss": -7.523305416107178, "global_step": 28171, "epoch": 167} {"train_loss": -7.633050441741943, "global_step": 28172, "epoch": 167} {"train_loss": -7.410411357879639, "global_step": 28173, "epoch": 167} {"train_loss": -7.357645034790039, "global_step": 28174, "epoch": 167} {"train_loss": -7.524935722351074, "global_step": 28175, "epoch": 167} {"train_loss": -7.205214500427246, "global_step": 28176, "epoch": 167} {"train_loss": -7.6034135818481445, "global_step": 28177, "epoch": 167} {"train_loss": -7.2301506996154785, "global_step": 28178, "epoch": 167} {"train_loss": -7.476069450378418, "global_step": 28179, "epoch": 167} {"train_loss": -7.478838920593262, "global_step": 28180, "epoch": 167} {"train_loss": -7.381501197814941, "global_step": 28181, "epoch": 167} {"train_loss": -7.352437973022461, "global_step": 28182, "epoch": 167} {"train_loss": -7.572809219360352, "global_step": 28183, "epoch": 167} {"train_loss": -7.374122619628906, "global_step": 28184, "epoch": 167} {"train_loss": -7.349959373474121, "global_step": 28185, "epoch": 167} {"train_loss": -7.394952297210693, "global_step": 28186, "epoch": 167} {"train_loss": -7.514977931976318, "global_step": 28187, "epoch": 167} {"train_loss": -7.340860366821289, "global_step": 28188, "epoch": 167} {"train_loss": -7.456676483154297, "global_step": 28189, "epoch": 167} {"train_loss": -7.548729419708252, "global_step": 28190, "epoch": 167} {"train_loss": -7.440443992614746, "global_step": 28191, "epoch": 167} {"train_loss": -7.640955924987793, "global_step": 28192, "epoch": 167} {"train_loss": -7.844388961791992, "global_step": 28193, "epoch": 167} {"train_loss": -7.498576641082764, "global_step": 28194, "epoch": 167} {"train_loss": -7.378802299499512, "global_step": 28195, "epoch": 167} {"train_loss": -7.7187910079956055, "global_step": 28196, "epoch": 167} {"train_loss": -7.448885440826416, "global_step": 28197, "epoch": 167} {"train_loss": -7.411617279052734, "global_step": 28198, "epoch": 167} {"train_loss": -7.257844924926758, "global_step": 28199, "epoch": 167} {"train_loss": -7.434175491333008, "global_step": 28200, "epoch": 167} {"train_loss": -7.5637407302856445, "global_step": 28201, "epoch": 167} {"train_loss": -7.418598175048828, "global_step": 28202, "epoch": 167} {"train_loss": -7.573188781738281, "global_step": 28203, "epoch": 167} {"train_loss": -7.2986249923706055, "global_step": 28204, "epoch": 167} {"train_loss": -7.3329973220825195, "global_step": 28205, "epoch": 167} {"train_loss": -7.272279739379883, "global_step": 28206, "epoch": 167} {"train_loss": -7.541136741638184, "global_step": 28207, "epoch": 167} {"train_loss": -7.532083511352539, "global_step": 28208, "epoch": 167} {"train_loss": -7.216132640838623, "global_step": 28209, "epoch": 167} {"train_loss": -7.334214687347412, "global_step": 28210, "epoch": 167} {"train_loss": -7.284625053405762, "global_step": 28211, "epoch": 167} {"train_loss": -7.121598243713379, "global_step": 28212, "epoch": 167} {"train_loss": -7.3486223220825195, "global_step": 28213, "epoch": 167} {"train_loss": -7.368535995483398, "global_step": 28214, "epoch": 167} {"train_loss": -7.244673728942871, "global_step": 28215, "epoch": 167} {"train_loss": -7.206659317016602, "global_step": 28216, "epoch": 167} {"train_loss": -7.206097602844238, "global_step": 28217, "epoch": 167} {"train_loss": -7.318565368652344, "global_step": 28218, "epoch": 167} {"train_loss": -7.215848445892334, "global_step": 28219, "epoch": 167} {"train_loss": -7.332714557647705, "global_step": 28220, "epoch": 167} {"train_loss": -7.309952735900879, "global_step": 28221, "epoch": 167} {"train_loss": -7.3271989822387695, "global_step": 28222, "epoch": 167} {"train_loss": -7.367877710433233, "global_step": 28223, "epoch": 167, "val_loss": 193177.21875} {"train_loss": -7.311556339263916, "global_step": 28224, "epoch": 168} {"train_loss": -7.522614002227783, "global_step": 28225, "epoch": 168} {"train_loss": -6.906994342803955, "global_step": 28226, "epoch": 168} {"train_loss": -7.647481918334961, "global_step": 28227, "epoch": 168} {"train_loss": -7.393042087554932, "global_step": 28228, "epoch": 168} {"train_loss": -7.499772548675537, "global_step": 28229, "epoch": 168} {"train_loss": -7.467213153839111, "global_step": 28230, "epoch": 168} {"train_loss": -7.287786483764648, "global_step": 28231, "epoch": 168} {"train_loss": -7.3783979415893555, "global_step": 28232, "epoch": 168} {"train_loss": -7.233598709106445, "global_step": 28233, "epoch": 168} {"train_loss": -7.274055480957031, "global_step": 28234, "epoch": 168} {"train_loss": -7.222898960113525, "global_step": 28235, "epoch": 168} {"train_loss": -7.455910682678223, "global_step": 28236, "epoch": 168} {"train_loss": -7.196111679077148, "global_step": 28237, "epoch": 168} {"train_loss": -7.0864973068237305, "global_step": 28238, "epoch": 168} {"train_loss": -7.042914390563965, "global_step": 28239, "epoch": 168} {"train_loss": -7.3611249923706055, "global_step": 28240, "epoch": 168} {"train_loss": -7.146866798400879, "global_step": 28241, "epoch": 168} {"train_loss": -7.229152679443359, "global_step": 28242, "epoch": 168} {"train_loss": -7.264060020446777, "global_step": 28243, "epoch": 168} {"train_loss": -7.532049655914307, "global_step": 28244, "epoch": 168} {"train_loss": -7.287233352661133, "global_step": 28245, "epoch": 168} {"train_loss": -7.486150741577148, "global_step": 28246, "epoch": 168} {"train_loss": -7.3588643074035645, "global_step": 28247, "epoch": 168} {"train_loss": -7.255307197570801, "global_step": 28248, "epoch": 168} {"train_loss": -7.244448184967041, "global_step": 28249, "epoch": 168} {"train_loss": -7.07481575012207, "global_step": 28250, "epoch": 168} {"train_loss": -7.356295585632324, "global_step": 28251, "epoch": 168} {"train_loss": -7.131560325622559, "global_step": 28252, "epoch": 168} {"train_loss": -7.447634696960449, "global_step": 28253, "epoch": 168} {"train_loss": -7.305082321166992, "global_step": 28254, "epoch": 168} {"train_loss": -7.394420623779297, "global_step": 28255, "epoch": 168} {"train_loss": -7.473755359649658, "global_step": 28256, "epoch": 168} {"train_loss": -7.237677574157715, "global_step": 28257, "epoch": 168} {"train_loss": -7.702203750610352, "global_step": 28258, "epoch": 168} {"train_loss": -7.13593053817749, "global_step": 28259, "epoch": 168} {"train_loss": -7.359388828277588, "global_step": 28260, "epoch": 168} {"train_loss": -7.341777801513672, "global_step": 28261, "epoch": 168} {"train_loss": -7.325815200805664, "global_step": 28262, "epoch": 168} {"train_loss": -7.250478744506836, "global_step": 28263, "epoch": 168} {"train_loss": -7.385284423828125, "global_step": 28264, "epoch": 168} {"train_loss": -7.425423622131348, "global_step": 28265, "epoch": 168} {"train_loss": -7.380815505981445, "global_step": 28266, "epoch": 168} {"train_loss": -7.471812725067139, "global_step": 28267, "epoch": 168} {"train_loss": -7.36870002746582, "global_step": 28268, "epoch": 168} {"train_loss": -7.534804821014404, "global_step": 28269, "epoch": 168} {"train_loss": -7.204898834228516, "global_step": 28270, "epoch": 168} {"train_loss": -7.52405309677124, "global_step": 28271, "epoch": 168} {"train_loss": -7.438654899597168, "global_step": 28272, "epoch": 168} {"train_loss": -7.318117141723633, "global_step": 28273, "epoch": 168} {"train_loss": -7.175917625427246, "global_step": 28274, "epoch": 168} {"train_loss": -7.375105857849121, "global_step": 28275, "epoch": 168} {"train_loss": -7.521203994750977, "global_step": 28276, "epoch": 168} {"train_loss": -7.27807092666626, "global_step": 28277, "epoch": 168} {"train_loss": -7.4328155517578125, "global_step": 28278, "epoch": 168} {"train_loss": -7.504877090454102, "global_step": 28279, "epoch": 168} {"train_loss": -7.428380012512207, "global_step": 28280, "epoch": 168} {"train_loss": -7.47653865814209, "global_step": 28281, "epoch": 168} {"train_loss": -7.350070476531982, "global_step": 28282, "epoch": 168} {"train_loss": -7.504376411437988, "global_step": 28283, "epoch": 168} {"train_loss": -7.4269866943359375, "global_step": 28284, "epoch": 168} {"train_loss": -7.216887474060059, "global_step": 28285, "epoch": 168} {"train_loss": -6.856548309326172, "global_step": 28286, "epoch": 168} {"train_loss": -7.662850379943848, "global_step": 28287, "epoch": 168} {"train_loss": -7.140293121337891, "global_step": 28288, "epoch": 168} {"train_loss": -7.132270812988281, "global_step": 28289, "epoch": 168} {"train_loss": -7.2277631759643555, "global_step": 28290, "epoch": 168} {"train_loss": -6.9986371994018555, "global_step": 28291, "epoch": 168} {"train_loss": -7.304059982299805, "global_step": 28292, "epoch": 168} {"train_loss": -7.304683208465576, "global_step": 28293, "epoch": 168} {"train_loss": -7.3192033767700195, "global_step": 28294, "epoch": 168} {"train_loss": -7.446972370147705, "global_step": 28295, "epoch": 168} {"train_loss": -7.272420406341553, "global_step": 28296, "epoch": 168} {"train_loss": -7.591673851013184, "global_step": 28297, "epoch": 168} {"train_loss": -7.487384796142578, "global_step": 28298, "epoch": 168} {"train_loss": -7.237112998962402, "global_step": 28299, "epoch": 168} {"train_loss": -7.556384086608887, "global_step": 28300, "epoch": 168} {"train_loss": -7.636457920074463, "global_step": 28301, "epoch": 168} {"train_loss": -7.415951728820801, "global_step": 28302, "epoch": 168} {"train_loss": -7.490112781524658, "global_step": 28303, "epoch": 168} {"train_loss": -7.565739631652832, "global_step": 28304, "epoch": 168} {"train_loss": -7.40622615814209, "global_step": 28305, "epoch": 168} {"train_loss": -7.5106048583984375, "global_step": 28306, "epoch": 168} {"train_loss": -7.479149341583252, "global_step": 28307, "epoch": 168} {"train_loss": -7.40543270111084, "global_step": 28308, "epoch": 168} {"train_loss": -7.585432529449463, "global_step": 28309, "epoch": 168} {"train_loss": -7.457887649536133, "global_step": 28310, "epoch": 168} {"train_loss": -7.525929927825928, "global_step": 28311, "epoch": 168} {"train_loss": -7.543360233306885, "global_step": 28312, "epoch": 168} {"train_loss": -7.554904937744141, "global_step": 28313, "epoch": 168} {"train_loss": -7.693064212799072, "global_step": 28314, "epoch": 168} {"train_loss": -7.553537368774414, "global_step": 28315, "epoch": 168} {"train_loss": -7.561769008636475, "global_step": 28316, "epoch": 168} {"train_loss": -7.555259704589844, "global_step": 28317, "epoch": 168} {"train_loss": -7.843484878540039, "global_step": 28318, "epoch": 168} {"train_loss": -7.626288890838623, "global_step": 28319, "epoch": 168} {"train_loss": -7.137206077575684, "global_step": 28320, "epoch": 168} {"train_loss": -7.040717124938965, "global_step": 28321, "epoch": 168} {"train_loss": -7.4302544593811035, "global_step": 28322, "epoch": 168} {"train_loss": -7.376517295837402, "global_step": 28323, "epoch": 168} {"train_loss": -7.458592891693115, "global_step": 28324, "epoch": 168} {"train_loss": -7.048058032989502, "global_step": 28325, "epoch": 168} {"train_loss": -7.089259147644043, "global_step": 28326, "epoch": 168} {"train_loss": -7.243040084838867, "global_step": 28327, "epoch": 168} {"train_loss": -7.197902679443359, "global_step": 28328, "epoch": 168} {"train_loss": -7.417584419250488, "global_step": 28329, "epoch": 168} {"train_loss": -7.192028999328613, "global_step": 28330, "epoch": 168} {"train_loss": -6.905636787414551, "global_step": 28331, "epoch": 168} {"train_loss": -7.303747177124023, "global_step": 28332, "epoch": 168} {"train_loss": -7.169328212738037, "global_step": 28333, "epoch": 168} {"train_loss": -7.491464614868164, "global_step": 28334, "epoch": 168} {"train_loss": -6.754547119140625, "global_step": 28335, "epoch": 168} {"train_loss": -7.505046844482422, "global_step": 28336, "epoch": 168} {"train_loss": -7.256455421447754, "global_step": 28337, "epoch": 168} {"train_loss": -7.306421279907227, "global_step": 28338, "epoch": 168} {"train_loss": -7.313320159912109, "global_step": 28339, "epoch": 168} {"train_loss": -7.215827465057373, "global_step": 28340, "epoch": 168} {"train_loss": -7.284938812255859, "global_step": 28341, "epoch": 168} {"train_loss": -7.224921703338623, "global_step": 28342, "epoch": 168} {"train_loss": -7.157349586486816, "global_step": 28343, "epoch": 168} {"train_loss": -7.187909126281738, "global_step": 28344, "epoch": 168} {"train_loss": -7.407736301422119, "global_step": 28345, "epoch": 168} {"train_loss": -7.092539310455322, "global_step": 28346, "epoch": 168} {"train_loss": -7.360043048858643, "global_step": 28347, "epoch": 168} {"train_loss": -7.134942531585693, "global_step": 28348, "epoch": 168} {"train_loss": -7.198936939239502, "global_step": 28349, "epoch": 168} {"train_loss": -7.3805460929870605, "global_step": 28350, "epoch": 168} {"train_loss": -7.169473648071289, "global_step": 28351, "epoch": 168} {"train_loss": -7.559242248535156, "global_step": 28352, "epoch": 168} {"train_loss": -7.395169734954834, "global_step": 28353, "epoch": 168} {"train_loss": -7.5274834632873535, "global_step": 28354, "epoch": 168} {"train_loss": -7.262698173522949, "global_step": 28355, "epoch": 168} {"train_loss": -7.481093406677246, "global_step": 28356, "epoch": 168} {"train_loss": -7.306873321533203, "global_step": 28357, "epoch": 168} {"train_loss": -7.498048782348633, "global_step": 28358, "epoch": 168} {"train_loss": -7.3036017417907715, "global_step": 28359, "epoch": 168} {"train_loss": -7.541858673095703, "global_step": 28360, "epoch": 168} {"train_loss": -7.374110221862793, "global_step": 28361, "epoch": 168} {"train_loss": -7.342367172241211, "global_step": 28362, "epoch": 168} {"train_loss": -7.220787048339844, "global_step": 28363, "epoch": 168} {"train_loss": -7.425307273864746, "global_step": 28364, "epoch": 168} {"train_loss": -7.529343605041504, "global_step": 28365, "epoch": 168} {"train_loss": -7.455483913421631, "global_step": 28366, "epoch": 168} {"train_loss": -7.361153602600098, "global_step": 28367, "epoch": 168} {"train_loss": -7.4229583740234375, "global_step": 28368, "epoch": 168} {"train_loss": -7.254623889923096, "global_step": 28369, "epoch": 168} {"train_loss": -7.282126426696777, "global_step": 28370, "epoch": 168} {"train_loss": -7.49759578704834, "global_step": 28371, "epoch": 168} {"train_loss": -7.319737911224365, "global_step": 28372, "epoch": 168} {"train_loss": -7.428491115570068, "global_step": 28373, "epoch": 168} {"train_loss": -7.435070037841797, "global_step": 28374, "epoch": 168} {"train_loss": -7.42009162902832, "global_step": 28375, "epoch": 168} {"train_loss": -7.429496765136719, "global_step": 28376, "epoch": 168} {"train_loss": -7.430444717407227, "global_step": 28377, "epoch": 168} {"train_loss": -7.35793399810791, "global_step": 28378, "epoch": 168} {"train_loss": -7.226767539978027, "global_step": 28379, "epoch": 168} {"train_loss": -7.314517021179199, "global_step": 28380, "epoch": 168} {"train_loss": -7.293849468231201, "global_step": 28381, "epoch": 168} {"train_loss": -7.663213729858398, "global_step": 28382, "epoch": 168} {"train_loss": -7.46588659286499, "global_step": 28383, "epoch": 168} {"train_loss": -7.479045867919922, "global_step": 28384, "epoch": 168} {"train_loss": -7.502224922180176, "global_step": 28385, "epoch": 168} {"train_loss": -7.5851664543151855, "global_step": 28386, "epoch": 168} {"train_loss": -7.1607770919799805, "global_step": 28387, "epoch": 168} {"train_loss": -7.397697448730469, "global_step": 28388, "epoch": 168} {"train_loss": -7.468318939208984, "global_step": 28389, "epoch": 168} {"train_loss": -7.519741535186768, "global_step": 28390, "epoch": 168} {"train_loss": -7.357167678219931, "global_step": 28391, "epoch": 168, "val_loss": 192640.875} {"train_loss": -7.440720558166504, "global_step": 28392, "epoch": 169} {"train_loss": -7.386985778808594, "global_step": 28393, "epoch": 169} {"train_loss": -7.521899223327637, "global_step": 28394, "epoch": 169} {"train_loss": -7.607217788696289, "global_step": 28395, "epoch": 169} {"train_loss": -7.167155742645264, "global_step": 28396, "epoch": 169} {"train_loss": -7.253091812133789, "global_step": 28397, "epoch": 169} {"train_loss": -7.435642242431641, "global_step": 28398, "epoch": 169} {"train_loss": -6.851329803466797, "global_step": 28399, "epoch": 169} {"train_loss": -7.37281608581543, "global_step": 28400, "epoch": 169} {"train_loss": -7.353799819946289, "global_step": 28401, "epoch": 169} {"train_loss": -7.158685684204102, "global_step": 28402, "epoch": 169} {"train_loss": -7.156949996948242, "global_step": 28403, "epoch": 169} {"train_loss": -7.0414934158325195, "global_step": 28404, "epoch": 169} {"train_loss": -7.07835578918457, "global_step": 28405, "epoch": 169} {"train_loss": -6.826620101928711, "global_step": 28406, "epoch": 169} {"train_loss": -7.216595649719238, "global_step": 28407, "epoch": 169} {"train_loss": -6.992058277130127, "global_step": 28408, "epoch": 169} {"train_loss": -6.890894889831543, "global_step": 28409, "epoch": 169} {"train_loss": -7.1089019775390625, "global_step": 28410, "epoch": 169} {"train_loss": -7.002569198608398, "global_step": 28411, "epoch": 169} {"train_loss": -7.1391448974609375, "global_step": 28412, "epoch": 169} {"train_loss": -7.217189788818359, "global_step": 28413, "epoch": 169} {"train_loss": -7.195530891418457, "global_step": 28414, "epoch": 169} {"train_loss": -7.099143981933594, "global_step": 28415, "epoch": 169} {"train_loss": -7.261849403381348, "global_step": 28416, "epoch": 169} {"train_loss": -7.239452362060547, "global_step": 28417, "epoch": 169} {"train_loss": -7.224691390991211, "global_step": 28418, "epoch": 169} {"train_loss": -7.2627949714660645, "global_step": 28419, "epoch": 169} {"train_loss": -7.478699684143066, "global_step": 28420, "epoch": 169} {"train_loss": -7.3109540939331055, "global_step": 28421, "epoch": 169} {"train_loss": -7.126555442810059, "global_step": 28422, "epoch": 169} {"train_loss": -7.350162506103516, "global_step": 28423, "epoch": 169} {"train_loss": -7.4243669509887695, "global_step": 28424, "epoch": 169} {"train_loss": -7.345705032348633, "global_step": 28425, "epoch": 169} {"train_loss": -7.311890602111816, "global_step": 28426, "epoch": 169} {"train_loss": -7.361978530883789, "global_step": 28427, "epoch": 169} {"train_loss": -7.524219989776611, "global_step": 28428, "epoch": 169} {"train_loss": -7.530575752258301, "global_step": 28429, "epoch": 169} {"train_loss": -7.491428375244141, "global_step": 28430, "epoch": 169} {"train_loss": -7.246527194976807, "global_step": 28431, "epoch": 169} {"train_loss": -7.384975433349609, "global_step": 28432, "epoch": 169} {"train_loss": -7.354569911956787, "global_step": 28433, "epoch": 169} {"train_loss": -7.563167095184326, "global_step": 28434, "epoch": 169} {"train_loss": -7.371834754943848, "global_step": 28435, "epoch": 169} {"train_loss": -7.346816062927246, "global_step": 28436, "epoch": 169} {"train_loss": -7.364199638366699, "global_step": 28437, "epoch": 169} {"train_loss": -7.319438457489014, "global_step": 28438, "epoch": 169} {"train_loss": -7.201479911804199, "global_step": 28439, "epoch": 169} {"train_loss": -7.271554946899414, "global_step": 28440, "epoch": 169} {"train_loss": -7.6288580894470215, "global_step": 28441, "epoch": 169} {"train_loss": -7.3004913330078125, "global_step": 28442, "epoch": 169} {"train_loss": -7.549576759338379, "global_step": 28443, "epoch": 169} {"train_loss": -7.499295711517334, "global_step": 28444, "epoch": 169} {"train_loss": -7.340573787689209, "global_step": 28445, "epoch": 169} {"train_loss": -7.356416702270508, "global_step": 28446, "epoch": 169} {"train_loss": -7.463226318359375, "global_step": 28447, "epoch": 169} {"train_loss": -7.316518783569336, "global_step": 28448, "epoch": 169} {"train_loss": -7.375082969665527, "global_step": 28449, "epoch": 169} {"train_loss": -7.610247611999512, "global_step": 28450, "epoch": 169} {"train_loss": -7.551383018493652, "global_step": 28451, "epoch": 169} {"train_loss": -7.355902671813965, "global_step": 28452, "epoch": 169} {"train_loss": -7.450750350952148, "global_step": 28453, "epoch": 169} {"train_loss": -7.703121185302734, "global_step": 28454, "epoch": 169} {"train_loss": -7.495485305786133, "global_step": 28455, "epoch": 169} {"train_loss": -7.52840518951416, "global_step": 28456, "epoch": 169} {"train_loss": -7.512956619262695, "global_step": 28457, "epoch": 169} {"train_loss": -7.63407039642334, "global_step": 28458, "epoch": 169} {"train_loss": -7.51432991027832, "global_step": 28459, "epoch": 169} {"train_loss": -7.554948806762695, "global_step": 28460, "epoch": 169} {"train_loss": -7.542784690856934, "global_step": 28461, "epoch": 169} {"train_loss": -7.418028831481934, "global_step": 28462, "epoch": 169} {"train_loss": -7.399028778076172, "global_step": 28463, "epoch": 169} {"train_loss": -7.576316833496094, "global_step": 28464, "epoch": 169} {"train_loss": -7.438807487487793, "global_step": 28465, "epoch": 169} {"train_loss": -7.616946220397949, "global_step": 28466, "epoch": 169} {"train_loss": -7.574395656585693, "global_step": 28467, "epoch": 169} {"train_loss": -7.521120071411133, "global_step": 28468, "epoch": 169} {"train_loss": -7.525678634643555, "global_step": 28469, "epoch": 169} {"train_loss": -7.620540618896484, "global_step": 28470, "epoch": 169} {"train_loss": -7.476665496826172, "global_step": 28471, "epoch": 169} {"train_loss": -7.599403381347656, "global_step": 28472, "epoch": 169} {"train_loss": -7.264599800109863, "global_step": 28473, "epoch": 169} {"train_loss": -7.470189571380615, "global_step": 28474, "epoch": 169} {"train_loss": -7.506511688232422, "global_step": 28475, "epoch": 169} {"train_loss": -7.369885444641113, "global_step": 28476, "epoch": 169} {"train_loss": -7.228500843048096, "global_step": 28477, "epoch": 169} {"train_loss": -7.503688812255859, "global_step": 28478, "epoch": 169} {"train_loss": -7.441266059875488, "global_step": 28479, "epoch": 169} {"train_loss": -7.604511260986328, "global_step": 28480, "epoch": 169} {"train_loss": -7.472428321838379, "global_step": 28481, "epoch": 169} {"train_loss": -7.210157871246338, "global_step": 28482, "epoch": 169} {"train_loss": -7.014103412628174, "global_step": 28483, "epoch": 169} {"train_loss": -7.330223560333252, "global_step": 28484, "epoch": 169} {"train_loss": -7.340239524841309, "global_step": 28485, "epoch": 169} {"train_loss": -7.602776527404785, "global_step": 28486, "epoch": 169} {"train_loss": -7.553230285644531, "global_step": 28487, "epoch": 169} {"train_loss": -7.486177921295166, "global_step": 28488, "epoch": 169} {"train_loss": -7.488313674926758, "global_step": 28489, "epoch": 169} {"train_loss": -7.167545318603516, "global_step": 28490, "epoch": 169} {"train_loss": -7.5799360275268555, "global_step": 28491, "epoch": 169} {"train_loss": -7.266787528991699, "global_step": 28492, "epoch": 169} {"train_loss": -7.450788497924805, "global_step": 28493, "epoch": 169} {"train_loss": -7.1932759284973145, "global_step": 28494, "epoch": 169} {"train_loss": -7.300425052642822, "global_step": 28495, "epoch": 169} {"train_loss": -7.365962028503418, "global_step": 28496, "epoch": 169} {"train_loss": -7.384662628173828, "global_step": 28497, "epoch": 169} {"train_loss": -7.551182270050049, "global_step": 28498, "epoch": 169} {"train_loss": -7.139017105102539, "global_step": 28499, "epoch": 169} {"train_loss": -7.020583629608154, "global_step": 28500, "epoch": 169} {"train_loss": -7.258293151855469, "global_step": 28501, "epoch": 169} {"train_loss": -7.374261379241943, "global_step": 28502, "epoch": 169} {"train_loss": -7.4801411628723145, "global_step": 28503, "epoch": 169} {"train_loss": -7.397207260131836, "global_step": 28504, "epoch": 169} {"train_loss": -7.472970008850098, "global_step": 28505, "epoch": 169} {"train_loss": -7.374788284301758, "global_step": 28506, "epoch": 169} {"train_loss": -7.544070720672607, "global_step": 28507, "epoch": 169} {"train_loss": -7.41970682144165, "global_step": 28508, "epoch": 169} {"train_loss": -7.438539505004883, "global_step": 28509, "epoch": 169} {"train_loss": -7.425885200500488, "global_step": 28510, "epoch": 169} {"train_loss": -7.418670177459717, "global_step": 28511, "epoch": 169} {"train_loss": -7.277523517608643, "global_step": 28512, "epoch": 169} {"train_loss": -7.365511894226074, "global_step": 28513, "epoch": 169} {"train_loss": -7.264659881591797, "global_step": 28514, "epoch": 169} {"train_loss": -7.543551445007324, "global_step": 28515, "epoch": 169} {"train_loss": -7.347653388977051, "global_step": 28516, "epoch": 169} {"train_loss": -7.24897575378418, "global_step": 28517, "epoch": 169} {"train_loss": -7.301420211791992, "global_step": 28518, "epoch": 169} {"train_loss": -7.203062057495117, "global_step": 28519, "epoch": 169} {"train_loss": -7.436153411865234, "global_step": 28520, "epoch": 169} {"train_loss": -7.229425430297852, "global_step": 28521, "epoch": 169} {"train_loss": -7.288533687591553, "global_step": 28522, "epoch": 169} {"train_loss": -7.527078628540039, "global_step": 28523, "epoch": 169} {"train_loss": -7.44489860534668, "global_step": 28524, "epoch": 169} {"train_loss": -7.422458171844482, "global_step": 28525, "epoch": 169} {"train_loss": -7.1625823974609375, "global_step": 28526, "epoch": 169} {"train_loss": -7.270235061645508, "global_step": 28527, "epoch": 169} {"train_loss": -7.185713768005371, "global_step": 28528, "epoch": 169} {"train_loss": -7.53764533996582, "global_step": 28529, "epoch": 169} {"train_loss": -7.547483444213867, "global_step": 28530, "epoch": 169} {"train_loss": -7.519317626953125, "global_step": 28531, "epoch": 169} {"train_loss": -7.413703918457031, "global_step": 28532, "epoch": 169} {"train_loss": -7.5351762771606445, "global_step": 28533, "epoch": 169} {"train_loss": -7.402560234069824, "global_step": 28534, "epoch": 169} {"train_loss": -7.506268501281738, "global_step": 28535, "epoch": 169} {"train_loss": -7.273705959320068, "global_step": 28536, "epoch": 169} {"train_loss": -7.417842864990234, "global_step": 28537, "epoch": 169} {"train_loss": -7.540627479553223, "global_step": 28538, "epoch": 169} {"train_loss": -7.59050178527832, "global_step": 28539, "epoch": 169} {"train_loss": -7.394395351409912, "global_step": 28540, "epoch": 169} {"train_loss": -7.397554874420166, "global_step": 28541, "epoch": 169} {"train_loss": -7.373475074768066, "global_step": 28542, "epoch": 169} {"train_loss": -7.525877952575684, "global_step": 28543, "epoch": 169} {"train_loss": -7.522668838500977, "global_step": 28544, "epoch": 169} {"train_loss": -7.636885643005371, "global_step": 28545, "epoch": 169} {"train_loss": -7.6592206954956055, "global_step": 28546, "epoch": 169} {"train_loss": -7.489606857299805, "global_step": 28547, "epoch": 169} {"train_loss": -7.383031845092773, "global_step": 28548, "epoch": 169} {"train_loss": -7.732868194580078, "global_step": 28549, "epoch": 169} {"train_loss": -7.5481438636779785, "global_step": 28550, "epoch": 169} {"train_loss": -7.459231376647949, "global_step": 28551, "epoch": 169} {"train_loss": -7.484315395355225, "global_step": 28552, "epoch": 169} {"train_loss": -7.642755508422852, "global_step": 28553, "epoch": 169} {"train_loss": -7.421606063842773, "global_step": 28554, "epoch": 169} {"train_loss": -7.3469414710998535, "global_step": 28555, "epoch": 169} {"train_loss": -7.13142204284668, "global_step": 28556, "epoch": 169} {"train_loss": -7.554308891296387, "global_step": 28557, "epoch": 169} {"train_loss": -7.367175579071045, "global_step": 28558, "epoch": 169} {"train_loss": -7.383750129313696, "global_step": 28559, "epoch": 169, "val_loss": 190810.015625} {"train_loss": -7.042492866516113, "global_step": 28560, "epoch": 170} {"train_loss": -7.604293346405029, "global_step": 28561, "epoch": 170} {"train_loss": -6.7531843185424805, "global_step": 28562, "epoch": 170} {"train_loss": -7.208810329437256, "global_step": 28563, "epoch": 170} {"train_loss": -6.887660026550293, "global_step": 28564, "epoch": 170} {"train_loss": -7.097895622253418, "global_step": 28565, "epoch": 170} {"train_loss": -7.168334007263184, "global_step": 28566, "epoch": 170} {"train_loss": -7.170022964477539, "global_step": 28567, "epoch": 170} {"train_loss": -7.4792585372924805, "global_step": 28568, "epoch": 170} {"train_loss": -7.253704071044922, "global_step": 28569, "epoch": 170} {"train_loss": -7.2606658935546875, "global_step": 28570, "epoch": 170} {"train_loss": -7.2045722007751465, "global_step": 28571, "epoch": 170} {"train_loss": -7.128541946411133, "global_step": 28572, "epoch": 170} {"train_loss": -7.426297187805176, "global_step": 28573, "epoch": 170} {"train_loss": -7.040910720825195, "global_step": 28574, "epoch": 170} {"train_loss": -7.033629894256592, "global_step": 28575, "epoch": 170} {"train_loss": -7.203277111053467, "global_step": 28576, "epoch": 170} {"train_loss": -7.154247283935547, "global_step": 28577, "epoch": 170} {"train_loss": -7.234816074371338, "global_step": 28578, "epoch": 170} {"train_loss": -7.116472244262695, "global_step": 28579, "epoch": 170} {"train_loss": -7.138678073883057, "global_step": 28580, "epoch": 170} {"train_loss": -7.179683685302734, "global_step": 28581, "epoch": 170} {"train_loss": -7.302868843078613, "global_step": 28582, "epoch": 170} {"train_loss": -7.252570629119873, "global_step": 28583, "epoch": 170} {"train_loss": -7.448716163635254, "global_step": 28584, "epoch": 170} {"train_loss": -7.305270195007324, "global_step": 28585, "epoch": 170} {"train_loss": -7.284489154815674, "global_step": 28586, "epoch": 170} {"train_loss": -7.39609956741333, "global_step": 28587, "epoch": 170} {"train_loss": -7.3871965408325195, "global_step": 28588, "epoch": 170} {"train_loss": -7.3346171379089355, "global_step": 28589, "epoch": 170} {"train_loss": -7.5550408363342285, "global_step": 28590, "epoch": 170} {"train_loss": -7.522878646850586, "global_step": 28591, "epoch": 170} {"train_loss": -7.482555389404297, "global_step": 28592, "epoch": 170} {"train_loss": -7.430352210998535, "global_step": 28593, "epoch": 170} {"train_loss": -7.36643123626709, "global_step": 28594, "epoch": 170} {"train_loss": -7.899860382080078, "global_step": 28595, "epoch": 170} {"train_loss": -7.5113959312438965, "global_step": 28596, "epoch": 170} {"train_loss": -7.37083101272583, "global_step": 28597, "epoch": 170} {"train_loss": -7.462496757507324, "global_step": 28598, "epoch": 170} {"train_loss": -7.453115463256836, "global_step": 28599, "epoch": 170} {"train_loss": -7.585536003112793, "global_step": 28600, "epoch": 170} {"train_loss": -7.85935640335083, "global_step": 28601, "epoch": 170} {"train_loss": -7.354662895202637, "global_step": 28602, "epoch": 170} {"train_loss": -7.5491132736206055, "global_step": 28603, "epoch": 170} {"train_loss": -7.355687141418457, "global_step": 28604, "epoch": 170} {"train_loss": -7.353549003601074, "global_step": 28605, "epoch": 170} {"train_loss": -7.565723419189453, "global_step": 28606, "epoch": 170} {"train_loss": -7.523367881774902, "global_step": 28607, "epoch": 170} {"train_loss": -7.428511142730713, "global_step": 28608, "epoch": 170} {"train_loss": -7.23039436340332, "global_step": 28609, "epoch": 170} {"train_loss": -7.339261531829834, "global_step": 28610, "epoch": 170} {"train_loss": -7.219989776611328, "global_step": 28611, "epoch": 170} {"train_loss": -7.585949897766113, "global_step": 28612, "epoch": 170} {"train_loss": -7.320910453796387, "global_step": 28613, "epoch": 170} {"train_loss": -7.585869789123535, "global_step": 28614, "epoch": 170} {"train_loss": -7.546424865722656, "global_step": 28615, "epoch": 170} {"train_loss": -7.502128601074219, "global_step": 28616, "epoch": 170} {"train_loss": -7.246344566345215, "global_step": 28617, "epoch": 170} {"train_loss": -7.5142502784729, "global_step": 28618, "epoch": 170} {"train_loss": -7.44145393371582, "global_step": 28619, "epoch": 170} {"train_loss": -7.206669807434082, "global_step": 28620, "epoch": 170} {"train_loss": -7.314792633056641, "global_step": 28621, "epoch": 170} {"train_loss": -7.102574348449707, "global_step": 28622, "epoch": 170} {"train_loss": -7.292994499206543, "global_step": 28623, "epoch": 170} {"train_loss": -7.04097843170166, "global_step": 28624, "epoch": 170} {"train_loss": -6.981551170349121, "global_step": 28625, "epoch": 170} {"train_loss": -7.4146928787231445, "global_step": 28626, "epoch": 170} {"train_loss": -7.011789798736572, "global_step": 28627, "epoch": 170} {"train_loss": -7.064405918121338, "global_step": 28628, "epoch": 170} {"train_loss": -7.142544746398926, "global_step": 28629, "epoch": 170} {"train_loss": -7.310935020446777, "global_step": 28630, "epoch": 170} {"train_loss": -7.366822242736816, "global_step": 28631, "epoch": 170} {"train_loss": -7.147826194763184, "global_step": 28632, "epoch": 170} {"train_loss": -7.353924751281738, "global_step": 28633, "epoch": 170} {"train_loss": -7.4218430519104, "global_step": 28634, "epoch": 170} {"train_loss": -7.06956672668457, "global_step": 28635, "epoch": 170} {"train_loss": -7.321686744689941, "global_step": 28636, "epoch": 170} {"train_loss": -7.158547878265381, "global_step": 28637, "epoch": 170} {"train_loss": -7.230823516845703, "global_step": 28638, "epoch": 170} {"train_loss": -7.263989448547363, "global_step": 28639, "epoch": 170} {"train_loss": -7.365622520446777, "global_step": 28640, "epoch": 170} {"train_loss": -7.428885459899902, "global_step": 28641, "epoch": 170} {"train_loss": -7.285754680633545, "global_step": 28642, "epoch": 170} {"train_loss": -7.511940002441406, "global_step": 28643, "epoch": 170} {"train_loss": -7.216680526733398, "global_step": 28644, "epoch": 170} {"train_loss": -7.5982232093811035, "global_step": 28645, "epoch": 170} {"train_loss": -7.3646392822265625, "global_step": 28646, "epoch": 170} {"train_loss": -7.3955078125, "global_step": 28647, "epoch": 170} {"train_loss": -7.3771162033081055, "global_step": 28648, "epoch": 170} {"train_loss": -7.445690155029297, "global_step": 28649, "epoch": 170} {"train_loss": -7.299564361572266, "global_step": 28650, "epoch": 170} {"train_loss": -7.536508083343506, "global_step": 28651, "epoch": 170} {"train_loss": -7.460570812225342, "global_step": 28652, "epoch": 170} {"train_loss": -7.537953853607178, "global_step": 28653, "epoch": 170} {"train_loss": -7.39046573638916, "global_step": 28654, "epoch": 170} {"train_loss": -7.3146538734436035, "global_step": 28655, "epoch": 170} {"train_loss": -7.428230285644531, "global_step": 28656, "epoch": 170} {"train_loss": -7.56588077545166, "global_step": 28657, "epoch": 170} {"train_loss": -7.380914688110352, "global_step": 28658, "epoch": 170} {"train_loss": -7.401758670806885, "global_step": 28659, "epoch": 170} {"train_loss": -7.5198259353637695, "global_step": 28660, "epoch": 170} {"train_loss": -7.377490043640137, "global_step": 28661, "epoch": 170} {"train_loss": -7.150272369384766, "global_step": 28662, "epoch": 170} {"train_loss": -7.530008792877197, "global_step": 28663, "epoch": 170} {"train_loss": -7.293168067932129, "global_step": 28664, "epoch": 170} {"train_loss": -7.32070255279541, "global_step": 28665, "epoch": 170} {"train_loss": -7.3551025390625, "global_step": 28666, "epoch": 170} {"train_loss": -7.485528945922852, "global_step": 28667, "epoch": 170} {"train_loss": -7.387334823608398, "global_step": 28668, "epoch": 170} {"train_loss": -7.530692100524902, "global_step": 28669, "epoch": 170} {"train_loss": -7.187570095062256, "global_step": 28670, "epoch": 170} {"train_loss": -7.362850189208984, "global_step": 28671, "epoch": 170} {"train_loss": -7.238432884216309, "global_step": 28672, "epoch": 170} {"train_loss": -7.323268890380859, "global_step": 28673, "epoch": 170} {"train_loss": -7.371013164520264, "global_step": 28674, "epoch": 170} {"train_loss": -7.432120323181152, "global_step": 28675, "epoch": 170} {"train_loss": -7.429476261138916, "global_step": 28676, "epoch": 170} {"train_loss": -6.945822715759277, "global_step": 28677, "epoch": 170} {"train_loss": -7.205175876617432, "global_step": 28678, "epoch": 170} {"train_loss": -7.084745407104492, "global_step": 28679, "epoch": 170} {"train_loss": -7.344479084014893, "global_step": 28680, "epoch": 170} {"train_loss": -7.184855937957764, "global_step": 28681, "epoch": 170} {"train_loss": -7.126936912536621, "global_step": 28682, "epoch": 170} {"train_loss": -7.102001667022705, "global_step": 28683, "epoch": 170} {"train_loss": -7.284156799316406, "global_step": 28684, "epoch": 170} {"train_loss": -7.174442291259766, "global_step": 28685, "epoch": 170} {"train_loss": -7.249398231506348, "global_step": 28686, "epoch": 170} {"train_loss": -7.280012607574463, "global_step": 28687, "epoch": 170} {"train_loss": -7.244241714477539, "global_step": 28688, "epoch": 170} {"train_loss": -7.212319374084473, "global_step": 28689, "epoch": 170} {"train_loss": -7.145590782165527, "global_step": 28690, "epoch": 170} {"train_loss": -7.28852653503418, "global_step": 28691, "epoch": 170} {"train_loss": -7.339079856872559, "global_step": 28692, "epoch": 170} {"train_loss": -7.10756778717041, "global_step": 28693, "epoch": 170} {"train_loss": -7.380559921264648, "global_step": 28694, "epoch": 170} {"train_loss": -7.199419975280762, "global_step": 28695, "epoch": 170} {"train_loss": -7.406782150268555, "global_step": 28696, "epoch": 170} {"train_loss": -7.400914192199707, "global_step": 28697, "epoch": 170} {"train_loss": -7.531139373779297, "global_step": 28698, "epoch": 170} {"train_loss": -7.4180803298950195, "global_step": 28699, "epoch": 170} {"train_loss": -7.482451438903809, "global_step": 28700, "epoch": 170} {"train_loss": -7.217763900756836, "global_step": 28701, "epoch": 170} {"train_loss": -7.383902549743652, "global_step": 28702, "epoch": 170} {"train_loss": -7.522263526916504, "global_step": 28703, "epoch": 170} {"train_loss": -7.6083984375, "global_step": 28704, "epoch": 170} {"train_loss": -7.68654203414917, "global_step": 28705, "epoch": 170} {"train_loss": -7.549720287322998, "global_step": 28706, "epoch": 170} {"train_loss": -7.685667514801025, "global_step": 28707, "epoch": 170} {"train_loss": -7.468398571014404, "global_step": 28708, "epoch": 170} {"train_loss": -7.593768119812012, "global_step": 28709, "epoch": 170} {"train_loss": -7.558595180511475, "global_step": 28710, "epoch": 170} {"train_loss": -7.518106460571289, "global_step": 28711, "epoch": 170} {"train_loss": -7.408212184906006, "global_step": 28712, "epoch": 170} {"train_loss": -7.333253860473633, "global_step": 28713, "epoch": 170} {"train_loss": -7.586410045623779, "global_step": 28714, "epoch": 170} {"train_loss": -7.376923084259033, "global_step": 28715, "epoch": 170} {"train_loss": -7.4275336265563965, "global_step": 28716, "epoch": 170} {"train_loss": -7.242349624633789, "global_step": 28717, "epoch": 170} {"train_loss": -7.372922897338867, "global_step": 28718, "epoch": 170} {"train_loss": -7.207755088806152, "global_step": 28719, "epoch": 170} {"train_loss": -7.077172756195068, "global_step": 28720, "epoch": 170} {"train_loss": -7.191235542297363, "global_step": 28721, "epoch": 170} {"train_loss": -7.325421333312988, "global_step": 28722, "epoch": 170} {"train_loss": -7.248401641845703, "global_step": 28723, "epoch": 170} {"train_loss": -7.316997528076172, "global_step": 28724, "epoch": 170} {"train_loss": -7.397778511047363, "global_step": 28725, "epoch": 170} {"train_loss": -7.16884708404541, "global_step": 28726, "epoch": 170} {"train_loss": -7.33586292323612, "global_step": 28727, "epoch": 170, "val_loss": 191635.546875, "train_action_mse_error": 18.46111488342285} {"train_loss": -7.335842609405518, "global_step": 28728, "epoch": 171} {"train_loss": -7.525591850280762, "global_step": 28729, "epoch": 171} {"train_loss": -7.246850490570068, "global_step": 28730, "epoch": 171} {"train_loss": -7.4333295822143555, "global_step": 28731, "epoch": 171} {"train_loss": -7.501169681549072, "global_step": 28732, "epoch": 171} {"train_loss": -7.5542449951171875, "global_step": 28733, "epoch": 171} {"train_loss": -7.299528121948242, "global_step": 28734, "epoch": 171} {"train_loss": -7.480060577392578, "global_step": 28735, "epoch": 171} {"train_loss": -7.563072681427002, "global_step": 28736, "epoch": 171} {"train_loss": -7.3372955322265625, "global_step": 28737, "epoch": 171} {"train_loss": -7.428005695343018, "global_step": 28738, "epoch": 171} {"train_loss": -7.536555767059326, "global_step": 28739, "epoch": 171} {"train_loss": -7.2795820236206055, "global_step": 28740, "epoch": 171} {"train_loss": -7.659996509552002, "global_step": 28741, "epoch": 171} {"train_loss": -7.317014694213867, "global_step": 28742, "epoch": 171} {"train_loss": -7.586726665496826, "global_step": 28743, "epoch": 171} {"train_loss": -7.526388168334961, "global_step": 28744, "epoch": 171} {"train_loss": -7.477967262268066, "global_step": 28745, "epoch": 171} {"train_loss": -7.287293434143066, "global_step": 28746, "epoch": 171} {"train_loss": -7.6281890869140625, "global_step": 28747, "epoch": 171} {"train_loss": -7.304887771606445, "global_step": 28748, "epoch": 171} {"train_loss": -7.535547256469727, "global_step": 28749, "epoch": 171} {"train_loss": -7.351191520690918, "global_step": 28750, "epoch": 171} {"train_loss": -7.402878761291504, "global_step": 28751, "epoch": 171} {"train_loss": -7.279292106628418, "global_step": 28752, "epoch": 171} {"train_loss": -7.576250076293945, "global_step": 28753, "epoch": 171} {"train_loss": -7.540164947509766, "global_step": 28754, "epoch": 171} {"train_loss": -7.606463432312012, "global_step": 28755, "epoch": 171} {"train_loss": -7.472329616546631, "global_step": 28756, "epoch": 171} {"train_loss": -7.364810466766357, "global_step": 28757, "epoch": 171} {"train_loss": -7.206381797790527, "global_step": 28758, "epoch": 171} {"train_loss": -7.487519264221191, "global_step": 28759, "epoch": 171} {"train_loss": -7.6516571044921875, "global_step": 28760, "epoch": 171} {"train_loss": -7.500909805297852, "global_step": 28761, "epoch": 171} {"train_loss": -7.452502250671387, "global_step": 28762, "epoch": 171} {"train_loss": -7.362653732299805, "global_step": 28763, "epoch": 171} {"train_loss": -7.520797252655029, "global_step": 28764, "epoch": 171} {"train_loss": -7.260288238525391, "global_step": 28765, "epoch": 171} {"train_loss": -7.293961524963379, "global_step": 28766, "epoch": 171} {"train_loss": -7.1067633628845215, "global_step": 28767, "epoch": 171} {"train_loss": -7.549454689025879, "global_step": 28768, "epoch": 171} {"train_loss": -7.351289749145508, "global_step": 28769, "epoch": 171} {"train_loss": -7.281196594238281, "global_step": 28770, "epoch": 171} {"train_loss": -7.384345054626465, "global_step": 28771, "epoch": 171} {"train_loss": -7.381290435791016, "global_step": 28772, "epoch": 171} {"train_loss": -7.283646583557129, "global_step": 28773, "epoch": 171} {"train_loss": -7.35975980758667, "global_step": 28774, "epoch": 171} {"train_loss": -7.409102439880371, "global_step": 28775, "epoch": 171} {"train_loss": -7.416912078857422, "global_step": 28776, "epoch": 171} {"train_loss": -7.477962970733643, "global_step": 28777, "epoch": 171} {"train_loss": -7.422688007354736, "global_step": 28778, "epoch": 171} {"train_loss": -7.625714302062988, "global_step": 28779, "epoch": 171} {"train_loss": -7.605226039886475, "global_step": 28780, "epoch": 171} {"train_loss": -7.594480037689209, "global_step": 28781, "epoch": 171} {"train_loss": -7.434519290924072, "global_step": 28782, "epoch": 171} {"train_loss": -7.735538482666016, "global_step": 28783, "epoch": 171} {"train_loss": -7.472719192504883, "global_step": 28784, "epoch": 171} {"train_loss": -7.733221054077148, "global_step": 28785, "epoch": 171} {"train_loss": -7.610363960266113, "global_step": 28786, "epoch": 171} {"train_loss": -7.58351469039917, "global_step": 28787, "epoch": 171} {"train_loss": -7.400309085845947, "global_step": 28788, "epoch": 171} {"train_loss": -7.435739517211914, "global_step": 28789, "epoch": 171} {"train_loss": -7.295408248901367, "global_step": 28790, "epoch": 171} {"train_loss": -7.416442394256592, "global_step": 28791, "epoch": 171} {"train_loss": -7.629825592041016, "global_step": 28792, "epoch": 171} {"train_loss": -7.2958478927612305, "global_step": 28793, "epoch": 171} {"train_loss": -7.561389446258545, "global_step": 28794, "epoch": 171} {"train_loss": -7.48764181137085, "global_step": 28795, "epoch": 171} {"train_loss": -7.375488758087158, "global_step": 28796, "epoch": 171} {"train_loss": -7.280306816101074, "global_step": 28797, "epoch": 171} {"train_loss": -7.402568817138672, "global_step": 28798, "epoch": 171} {"train_loss": -7.338461399078369, "global_step": 28799, "epoch": 171} {"train_loss": -7.598982810974121, "global_step": 28800, "epoch": 171} {"train_loss": -7.358415126800537, "global_step": 28801, "epoch": 171} {"train_loss": -7.454697608947754, "global_step": 28802, "epoch": 171} {"train_loss": -7.268310070037842, "global_step": 28803, "epoch": 171} {"train_loss": -7.248027801513672, "global_step": 28804, "epoch": 171} {"train_loss": -7.104763031005859, "global_step": 28805, "epoch": 171} {"train_loss": -7.180120468139648, "global_step": 28806, "epoch": 171} {"train_loss": -7.133566379547119, "global_step": 28807, "epoch": 171} {"train_loss": -7.070631980895996, "global_step": 28808, "epoch": 171} {"train_loss": -7.293972015380859, "global_step": 28809, "epoch": 171} {"train_loss": -7.103736877441406, "global_step": 28810, "epoch": 171} {"train_loss": -7.225849151611328, "global_step": 28811, "epoch": 171} {"train_loss": -7.323932647705078, "global_step": 28812, "epoch": 171} {"train_loss": -7.016070365905762, "global_step": 28813, "epoch": 171} {"train_loss": -7.147589683532715, "global_step": 28814, "epoch": 171} {"train_loss": -7.23866605758667, "global_step": 28815, "epoch": 171} {"train_loss": -7.258338928222656, "global_step": 28816, "epoch": 171} {"train_loss": -7.3714423179626465, "global_step": 28817, "epoch": 171} {"train_loss": -6.99930477142334, "global_step": 28818, "epoch": 171} {"train_loss": -7.330633163452148, "global_step": 28819, "epoch": 171} {"train_loss": -7.343270301818848, "global_step": 28820, "epoch": 171} {"train_loss": -7.327924728393555, "global_step": 28821, "epoch": 171} {"train_loss": -7.36562442779541, "global_step": 28822, "epoch": 171} {"train_loss": -7.599100112915039, "global_step": 28823, "epoch": 171} {"train_loss": -7.437695503234863, "global_step": 28824, "epoch": 171} {"train_loss": -7.419549942016602, "global_step": 28825, "epoch": 171} {"train_loss": -7.315253257751465, "global_step": 28826, "epoch": 171} {"train_loss": -7.609199047088623, "global_step": 28827, "epoch": 171} {"train_loss": -7.442256927490234, "global_step": 28828, "epoch": 171} {"train_loss": -7.45824670791626, "global_step": 28829, "epoch": 171} {"train_loss": -7.3662519454956055, "global_step": 28830, "epoch": 171} {"train_loss": -7.43675422668457, "global_step": 28831, "epoch": 171} {"train_loss": -7.530484676361084, "global_step": 28832, "epoch": 171} {"train_loss": -7.546404838562012, "global_step": 28833, "epoch": 171} {"train_loss": -7.245420455932617, "global_step": 28834, "epoch": 171} {"train_loss": -7.492565631866455, "global_step": 28835, "epoch": 171} {"train_loss": -7.397593975067139, "global_step": 28836, "epoch": 171} {"train_loss": -7.406493186950684, "global_step": 28837, "epoch": 171} {"train_loss": -7.348212242126465, "global_step": 28838, "epoch": 171} {"train_loss": -7.574406623840332, "global_step": 28839, "epoch": 171} {"train_loss": -7.449209213256836, "global_step": 28840, "epoch": 171} {"train_loss": -7.297178268432617, "global_step": 28841, "epoch": 171} {"train_loss": -7.381293296813965, "global_step": 28842, "epoch": 171} {"train_loss": -7.289274215698242, "global_step": 28843, "epoch": 171} {"train_loss": -7.564034461975098, "global_step": 28844, "epoch": 171} {"train_loss": -7.34669303894043, "global_step": 28845, "epoch": 171} {"train_loss": -7.460951328277588, "global_step": 28846, "epoch": 171} {"train_loss": -7.227704048156738, "global_step": 28847, "epoch": 171} {"train_loss": -7.431816101074219, "global_step": 28848, "epoch": 171} {"train_loss": -7.404888153076172, "global_step": 28849, "epoch": 171} {"train_loss": -7.413175582885742, "global_step": 28850, "epoch": 171} {"train_loss": -7.393502235412598, "global_step": 28851, "epoch": 171} {"train_loss": -7.419745445251465, "global_step": 28852, "epoch": 171} {"train_loss": -7.391442775726318, "global_step": 28853, "epoch": 171} {"train_loss": -7.370615005493164, "global_step": 28854, "epoch": 171} {"train_loss": -7.341081619262695, "global_step": 28855, "epoch": 171} {"train_loss": -7.440701961517334, "global_step": 28856, "epoch": 171} {"train_loss": -7.295829772949219, "global_step": 28857, "epoch": 171} {"train_loss": -7.424452781677246, "global_step": 28858, "epoch": 171} {"train_loss": -7.478903293609619, "global_step": 28859, "epoch": 171} {"train_loss": -7.416970252990723, "global_step": 28860, "epoch": 171} {"train_loss": -7.144773483276367, "global_step": 28861, "epoch": 171} {"train_loss": -7.606026649475098, "global_step": 28862, "epoch": 171} {"train_loss": -7.166884899139404, "global_step": 28863, "epoch": 171} {"train_loss": -7.539904594421387, "global_step": 28864, "epoch": 171} {"train_loss": -7.215910911560059, "global_step": 28865, "epoch": 171} {"train_loss": -7.326108932495117, "global_step": 28866, "epoch": 171} {"train_loss": -7.484647274017334, "global_step": 28867, "epoch": 171} {"train_loss": -7.195151329040527, "global_step": 28868, "epoch": 171} {"train_loss": -7.59282112121582, "global_step": 28869, "epoch": 171} {"train_loss": -7.136923313140869, "global_step": 28870, "epoch": 171} {"train_loss": -7.531161308288574, "global_step": 28871, "epoch": 171} {"train_loss": -7.533023357391357, "global_step": 28872, "epoch": 171} {"train_loss": -7.263798713684082, "global_step": 28873, "epoch": 171} {"train_loss": -7.266507148742676, "global_step": 28874, "epoch": 171} {"train_loss": -7.490355491638184, "global_step": 28875, "epoch": 171} {"train_loss": -7.412614822387695, "global_step": 28876, "epoch": 171} {"train_loss": -7.307679176330566, "global_step": 28877, "epoch": 171} {"train_loss": -7.310493469238281, "global_step": 28878, "epoch": 171} {"train_loss": -7.3199872970581055, "global_step": 28879, "epoch": 171} {"train_loss": -7.446499824523926, "global_step": 28880, "epoch": 171} {"train_loss": -7.481144428253174, "global_step": 28881, "epoch": 171} {"train_loss": -7.464098930358887, "global_step": 28882, "epoch": 171} {"train_loss": -7.393055438995361, "global_step": 28883, "epoch": 171} {"train_loss": -7.48281192779541, "global_step": 28884, "epoch": 171} {"train_loss": -7.315349578857422, "global_step": 28885, "epoch": 171} {"train_loss": -7.565074443817139, "global_step": 28886, "epoch": 171} {"train_loss": -7.525049209594727, "global_step": 28887, "epoch": 171} {"train_loss": -7.632730484008789, "global_step": 28888, "epoch": 171} {"train_loss": -7.575102806091309, "global_step": 28889, "epoch": 171} {"train_loss": -7.693345546722412, "global_step": 28890, "epoch": 171} {"train_loss": -7.6311492919921875, "global_step": 28891, "epoch": 171} {"train_loss": -7.495998859405518, "global_step": 28892, "epoch": 171} {"train_loss": -7.366287708282471, "global_step": 28893, "epoch": 171} {"train_loss": -7.5532636642456055, "global_step": 28894, "epoch": 171} {"train_loss": -7.40739996944155, "global_step": 28895, "epoch": 171, "val_loss": 191354.828125} {"train_loss": -7.478264808654785, "global_step": 28896, "epoch": 172} {"train_loss": -7.43411922454834, "global_step": 28897, "epoch": 172} {"train_loss": -7.6111860275268555, "global_step": 28898, "epoch": 172} {"train_loss": -7.351678371429443, "global_step": 28899, "epoch": 172} {"train_loss": -7.433776378631592, "global_step": 28900, "epoch": 172} {"train_loss": -7.526889324188232, "global_step": 28901, "epoch": 172} {"train_loss": -7.332154750823975, "global_step": 28902, "epoch": 172} {"train_loss": -7.369563102722168, "global_step": 28903, "epoch": 172} {"train_loss": -7.377772808074951, "global_step": 28904, "epoch": 172} {"train_loss": -7.153727054595947, "global_step": 28905, "epoch": 172} {"train_loss": -7.3811798095703125, "global_step": 28906, "epoch": 172} {"train_loss": -7.339366912841797, "global_step": 28907, "epoch": 172} {"train_loss": -7.340636253356934, "global_step": 28908, "epoch": 172} {"train_loss": -7.430736064910889, "global_step": 28909, "epoch": 172} {"train_loss": -7.217039108276367, "global_step": 28910, "epoch": 172} {"train_loss": -7.380157470703125, "global_step": 28911, "epoch": 172} {"train_loss": -7.317020416259766, "global_step": 28912, "epoch": 172} {"train_loss": -7.15982723236084, "global_step": 28913, "epoch": 172} {"train_loss": -7.417827129364014, "global_step": 28914, "epoch": 172} {"train_loss": -7.330794334411621, "global_step": 28915, "epoch": 172} {"train_loss": -7.327469825744629, "global_step": 28916, "epoch": 172} {"train_loss": -7.436000823974609, "global_step": 28917, "epoch": 172} {"train_loss": -7.365970134735107, "global_step": 28918, "epoch": 172} {"train_loss": -7.364781379699707, "global_step": 28919, "epoch": 172} {"train_loss": -7.300763130187988, "global_step": 28920, "epoch": 172} {"train_loss": -7.533039093017578, "global_step": 28921, "epoch": 172} {"train_loss": -7.699524879455566, "global_step": 28922, "epoch": 172} {"train_loss": -7.447615623474121, "global_step": 28923, "epoch": 172} {"train_loss": -7.359339714050293, "global_step": 28924, "epoch": 172} {"train_loss": -7.209660053253174, "global_step": 28925, "epoch": 172} {"train_loss": -7.285778999328613, "global_step": 28926, "epoch": 172} {"train_loss": -7.455008506774902, "global_step": 28927, "epoch": 172} {"train_loss": -7.411166667938232, "global_step": 28928, "epoch": 172} {"train_loss": -7.547638416290283, "global_step": 28929, "epoch": 172} {"train_loss": -7.5798234939575195, "global_step": 28930, "epoch": 172} {"train_loss": -7.464770317077637, "global_step": 28931, "epoch": 172} {"train_loss": -7.363491058349609, "global_step": 28932, "epoch": 172} {"train_loss": -7.459968566894531, "global_step": 28933, "epoch": 172} {"train_loss": -7.43668270111084, "global_step": 28934, "epoch": 172} {"train_loss": -7.295568466186523, "global_step": 28935, "epoch": 172} {"train_loss": -7.3235626220703125, "global_step": 28936, "epoch": 172} {"train_loss": -7.439082622528076, "global_step": 28937, "epoch": 172} {"train_loss": -7.499356746673584, "global_step": 28938, "epoch": 172} {"train_loss": -7.142595291137695, "global_step": 28939, "epoch": 172} {"train_loss": -7.5672926902771, "global_step": 28940, "epoch": 172} {"train_loss": -7.263596057891846, "global_step": 28941, "epoch": 172} {"train_loss": -7.797629356384277, "global_step": 28942, "epoch": 172} {"train_loss": -7.480072975158691, "global_step": 28943, "epoch": 172} {"train_loss": -7.2436370849609375, "global_step": 28944, "epoch": 172} {"train_loss": -7.790806770324707, "global_step": 28945, "epoch": 172} {"train_loss": -7.525979042053223, "global_step": 28946, "epoch": 172} {"train_loss": -7.651264190673828, "global_step": 28947, "epoch": 172} {"train_loss": -7.3860650062561035, "global_step": 28948, "epoch": 172} {"train_loss": -7.452435493469238, "global_step": 28949, "epoch": 172} {"train_loss": -7.256196022033691, "global_step": 28950, "epoch": 172} {"train_loss": -7.493633270263672, "global_step": 28951, "epoch": 172} {"train_loss": -7.110630035400391, "global_step": 28952, "epoch": 172} {"train_loss": -7.37487268447876, "global_step": 28953, "epoch": 172} {"train_loss": -7.202863693237305, "global_step": 28954, "epoch": 172} {"train_loss": -7.528464317321777, "global_step": 28955, "epoch": 172} {"train_loss": -7.280336380004883, "global_step": 28956, "epoch": 172} {"train_loss": -7.278253555297852, "global_step": 28957, "epoch": 172} {"train_loss": -7.127835750579834, "global_step": 28958, "epoch": 172} {"train_loss": -7.2981133460998535, "global_step": 28959, "epoch": 172} {"train_loss": -7.282133102416992, "global_step": 28960, "epoch": 172} {"train_loss": -7.225302219390869, "global_step": 28961, "epoch": 172} {"train_loss": -7.053542137145996, "global_step": 28962, "epoch": 172} {"train_loss": -7.3322367668151855, "global_step": 28963, "epoch": 172} {"train_loss": -7.080789089202881, "global_step": 28964, "epoch": 172} {"train_loss": -6.856986999511719, "global_step": 28965, "epoch": 172} {"train_loss": -7.189840316772461, "global_step": 28966, "epoch": 172} {"train_loss": -7.331887245178223, "global_step": 28967, "epoch": 172} {"train_loss": -7.419259071350098, "global_step": 28968, "epoch": 172} {"train_loss": -7.232671737670898, "global_step": 28969, "epoch": 172} {"train_loss": -7.35728645324707, "global_step": 28970, "epoch": 172} {"train_loss": -7.371140003204346, "global_step": 28971, "epoch": 172} {"train_loss": -7.54602575302124, "global_step": 28972, "epoch": 172} {"train_loss": -7.071315765380859, "global_step": 28973, "epoch": 172} {"train_loss": -7.3929338455200195, "global_step": 28974, "epoch": 172} {"train_loss": -7.410679817199707, "global_step": 28975, "epoch": 172} {"train_loss": -7.651485443115234, "global_step": 28976, "epoch": 172} {"train_loss": -7.2476606369018555, "global_step": 28977, "epoch": 172} {"train_loss": -7.567370414733887, "global_step": 28978, "epoch": 172} {"train_loss": -7.536870956420898, "global_step": 28979, "epoch": 172} {"train_loss": -7.540286064147949, "global_step": 28980, "epoch": 172} {"train_loss": -7.216707229614258, "global_step": 28981, "epoch": 172} {"train_loss": -7.387628555297852, "global_step": 28982, "epoch": 172} {"train_loss": -7.641353607177734, "global_step": 28983, "epoch": 172} {"train_loss": -7.427929878234863, "global_step": 28984, "epoch": 172} {"train_loss": -7.187086582183838, "global_step": 28985, "epoch": 172} {"train_loss": -7.543728351593018, "global_step": 28986, "epoch": 172} {"train_loss": -7.357346534729004, "global_step": 28987, "epoch": 172} {"train_loss": -7.3402509689331055, "global_step": 28988, "epoch": 172} {"train_loss": -7.392718315124512, "global_step": 28989, "epoch": 172} {"train_loss": -7.474634170532227, "global_step": 28990, "epoch": 172} {"train_loss": -7.343000888824463, "global_step": 28991, "epoch": 172} {"train_loss": -7.756474018096924, "global_step": 28992, "epoch": 172} {"train_loss": -7.505856037139893, "global_step": 28993, "epoch": 172} {"train_loss": -7.33591365814209, "global_step": 28994, "epoch": 172} {"train_loss": -7.393921852111816, "global_step": 28995, "epoch": 172} {"train_loss": -7.485660552978516, "global_step": 28996, "epoch": 172} {"train_loss": -7.47036075592041, "global_step": 28997, "epoch": 172} {"train_loss": -7.104094505310059, "global_step": 28998, "epoch": 172} {"train_loss": -7.4141411781311035, "global_step": 28999, "epoch": 172} {"train_loss": -7.405340671539307, "global_step": 29000, "epoch": 172} {"train_loss": -7.1667399406433105, "global_step": 29001, "epoch": 172} {"train_loss": -7.190319061279297, "global_step": 29002, "epoch": 172} {"train_loss": -7.43663215637207, "global_step": 29003, "epoch": 172} {"train_loss": -7.013568878173828, "global_step": 29004, "epoch": 172} {"train_loss": -7.302579879760742, "global_step": 29005, "epoch": 172} {"train_loss": -7.265317440032959, "global_step": 29006, "epoch": 172} {"train_loss": -7.40950345993042, "global_step": 29007, "epoch": 172} {"train_loss": -7.301540374755859, "global_step": 29008, "epoch": 172} {"train_loss": -7.374720573425293, "global_step": 29009, "epoch": 172} {"train_loss": -7.156280040740967, "global_step": 29010, "epoch": 172} {"train_loss": -6.67038631439209, "global_step": 29011, "epoch": 172} {"train_loss": -7.209733486175537, "global_step": 29012, "epoch": 172} {"train_loss": -7.2127461433410645, "global_step": 29013, "epoch": 172} {"train_loss": -7.105630874633789, "global_step": 29014, "epoch": 172} {"train_loss": -7.205380439758301, "global_step": 29015, "epoch": 172} {"train_loss": -7.265046119689941, "global_step": 29016, "epoch": 172} {"train_loss": -7.216236591339111, "global_step": 29017, "epoch": 172} {"train_loss": -7.325498104095459, "global_step": 29018, "epoch": 172} {"train_loss": -7.21502161026001, "global_step": 29019, "epoch": 172} {"train_loss": -7.308045864105225, "global_step": 29020, "epoch": 172} {"train_loss": -7.2438530921936035, "global_step": 29021, "epoch": 172} {"train_loss": -7.29767370223999, "global_step": 29022, "epoch": 172} {"train_loss": -7.563063144683838, "global_step": 29023, "epoch": 172} {"train_loss": -7.577382564544678, "global_step": 29024, "epoch": 172} {"train_loss": -7.4365620613098145, "global_step": 29025, "epoch": 172} {"train_loss": -7.361996650695801, "global_step": 29026, "epoch": 172} {"train_loss": -7.554398536682129, "global_step": 29027, "epoch": 172} {"train_loss": -7.307892799377441, "global_step": 29028, "epoch": 172} {"train_loss": -7.583438873291016, "global_step": 29029, "epoch": 172} {"train_loss": -7.421029567718506, "global_step": 29030, "epoch": 172} {"train_loss": -7.516399383544922, "global_step": 29031, "epoch": 172} {"train_loss": -7.529204368591309, "global_step": 29032, "epoch": 172} {"train_loss": -7.342861175537109, "global_step": 29033, "epoch": 172} {"train_loss": -7.471713542938232, "global_step": 29034, "epoch": 172} {"train_loss": -7.228824615478516, "global_step": 29035, "epoch": 172} {"train_loss": -7.581483840942383, "global_step": 29036, "epoch": 172} {"train_loss": -7.321903228759766, "global_step": 29037, "epoch": 172} {"train_loss": -7.389373779296875, "global_step": 29038, "epoch": 172} {"train_loss": -7.568586826324463, "global_step": 29039, "epoch": 172} {"train_loss": -7.439620494842529, "global_step": 29040, "epoch": 172} {"train_loss": -7.35004997253418, "global_step": 29041, "epoch": 172} {"train_loss": -6.621279716491699, "global_step": 29042, "epoch": 172} {"train_loss": -7.511164665222168, "global_step": 29043, "epoch": 172} {"train_loss": -6.947159767150879, "global_step": 29044, "epoch": 172} {"train_loss": -7.30385684967041, "global_step": 29045, "epoch": 172} {"train_loss": -7.3060760498046875, "global_step": 29046, "epoch": 172} {"train_loss": -7.379040718078613, "global_step": 29047, "epoch": 172} {"train_loss": -7.195518493652344, "global_step": 29048, "epoch": 172} {"train_loss": -7.340005397796631, "global_step": 29049, "epoch": 172} {"train_loss": -7.34696102142334, "global_step": 29050, "epoch": 172} {"train_loss": -7.3272199630737305, "global_step": 29051, "epoch": 172} {"train_loss": -7.199674606323242, "global_step": 29052, "epoch": 172} {"train_loss": -7.430227756500244, "global_step": 29053, "epoch": 172} {"train_loss": -7.559969902038574, "global_step": 29054, "epoch": 172} {"train_loss": -7.108402252197266, "global_step": 29055, "epoch": 172} {"train_loss": -7.332886695861816, "global_step": 29056, "epoch": 172} {"train_loss": -7.414478302001953, "global_step": 29057, "epoch": 172} {"train_loss": -7.149187088012695, "global_step": 29058, "epoch": 172} {"train_loss": -7.326131343841553, "global_step": 29059, "epoch": 172} {"train_loss": -7.347213268280029, "global_step": 29060, "epoch": 172} {"train_loss": -7.401362895965576, "global_step": 29061, "epoch": 172} {"train_loss": -7.369198322296143, "global_step": 29062, "epoch": 172} {"train_loss": -7.356268527961912, "global_step": 29063, "epoch": 172, "val_loss": 191730.671875} {"train_loss": -7.419449806213379, "global_step": 29064, "epoch": 173} {"train_loss": -7.539193153381348, "global_step": 29065, "epoch": 173} {"train_loss": -7.212397575378418, "global_step": 29066, "epoch": 173} {"train_loss": -7.308789253234863, "global_step": 29067, "epoch": 173} {"train_loss": -7.454803466796875, "global_step": 29068, "epoch": 173} {"train_loss": -7.3294758796691895, "global_step": 29069, "epoch": 173} {"train_loss": -7.557242393493652, "global_step": 29070, "epoch": 173} {"train_loss": -7.618049144744873, "global_step": 29071, "epoch": 173} {"train_loss": -7.39219856262207, "global_step": 29072, "epoch": 173} {"train_loss": -7.528770446777344, "global_step": 29073, "epoch": 173} {"train_loss": -7.557503700256348, "global_step": 29074, "epoch": 173} {"train_loss": -7.411191940307617, "global_step": 29075, "epoch": 173} {"train_loss": -7.674251079559326, "global_step": 29076, "epoch": 173} {"train_loss": -7.2157206535339355, "global_step": 29077, "epoch": 173} {"train_loss": -7.512674331665039, "global_step": 29078, "epoch": 173} {"train_loss": -7.032859802246094, "global_step": 29079, "epoch": 173} {"train_loss": -7.557119369506836, "global_step": 29080, "epoch": 173} {"train_loss": -7.221065998077393, "global_step": 29081, "epoch": 173} {"train_loss": -7.243062496185303, "global_step": 29082, "epoch": 173} {"train_loss": -7.40987491607666, "global_step": 29083, "epoch": 173} {"train_loss": -7.297976493835449, "global_step": 29084, "epoch": 173} {"train_loss": -7.25091552734375, "global_step": 29085, "epoch": 173} {"train_loss": -7.314219951629639, "global_step": 29086, "epoch": 173} {"train_loss": -7.352536201477051, "global_step": 29087, "epoch": 173} {"train_loss": -7.501469135284424, "global_step": 29088, "epoch": 173} {"train_loss": -7.451787948608398, "global_step": 29089, "epoch": 173} {"train_loss": -7.435771465301514, "global_step": 29090, "epoch": 173} {"train_loss": -7.32025146484375, "global_step": 29091, "epoch": 173} {"train_loss": -7.273908615112305, "global_step": 29092, "epoch": 173} {"train_loss": -7.445490837097168, "global_step": 29093, "epoch": 173} {"train_loss": -7.211536884307861, "global_step": 29094, "epoch": 173} {"train_loss": -7.294981956481934, "global_step": 29095, "epoch": 173} {"train_loss": -7.150041580200195, "global_step": 29096, "epoch": 173} {"train_loss": -6.990136623382568, "global_step": 29097, "epoch": 173} {"train_loss": -7.15742826461792, "global_step": 29098, "epoch": 173} {"train_loss": -7.35756778717041, "global_step": 29099, "epoch": 173} {"train_loss": -7.228593349456787, "global_step": 29100, "epoch": 173} {"train_loss": -7.316531181335449, "global_step": 29101, "epoch": 173} {"train_loss": -7.369981288909912, "global_step": 29102, "epoch": 173} {"train_loss": -7.242251396179199, "global_step": 29103, "epoch": 173} {"train_loss": -7.128222942352295, "global_step": 29104, "epoch": 173} {"train_loss": -7.285347938537598, "global_step": 29105, "epoch": 173} {"train_loss": -7.3129167556762695, "global_step": 29106, "epoch": 173} {"train_loss": -7.419826507568359, "global_step": 29107, "epoch": 173} {"train_loss": -7.344019889831543, "global_step": 29108, "epoch": 173} {"train_loss": -7.301544189453125, "global_step": 29109, "epoch": 173} {"train_loss": -7.351311683654785, "global_step": 29110, "epoch": 173} {"train_loss": -7.388073444366455, "global_step": 29111, "epoch": 173} {"train_loss": -7.395653247833252, "global_step": 29112, "epoch": 173} {"train_loss": -7.482857704162598, "global_step": 29113, "epoch": 173} {"train_loss": -7.266396522521973, "global_step": 29114, "epoch": 173} {"train_loss": -7.609055519104004, "global_step": 29115, "epoch": 173} {"train_loss": -7.411606788635254, "global_step": 29116, "epoch": 173} {"train_loss": -7.4242753982543945, "global_step": 29117, "epoch": 173} {"train_loss": -7.432778358459473, "global_step": 29118, "epoch": 173} {"train_loss": -7.498640537261963, "global_step": 29119, "epoch": 173} {"train_loss": -7.197778701782227, "global_step": 29120, "epoch": 173} {"train_loss": -7.373485565185547, "global_step": 29121, "epoch": 173} {"train_loss": -7.597898006439209, "global_step": 29122, "epoch": 173} {"train_loss": -7.408528804779053, "global_step": 29123, "epoch": 173} {"train_loss": -7.310914039611816, "global_step": 29124, "epoch": 173} {"train_loss": -7.534892559051514, "global_step": 29125, "epoch": 173} {"train_loss": -7.556583881378174, "global_step": 29126, "epoch": 173} {"train_loss": -7.728299140930176, "global_step": 29127, "epoch": 173} {"train_loss": -7.539974212646484, "global_step": 29128, "epoch": 173} {"train_loss": -7.633711814880371, "global_step": 29129, "epoch": 173} {"train_loss": -7.506416320800781, "global_step": 29130, "epoch": 173} {"train_loss": -7.746297836303711, "global_step": 29131, "epoch": 173} {"train_loss": -7.510260581970215, "global_step": 29132, "epoch": 173} {"train_loss": -7.33890438079834, "global_step": 29133, "epoch": 173} {"train_loss": -7.628725051879883, "global_step": 29134, "epoch": 173} {"train_loss": -7.647083282470703, "global_step": 29135, "epoch": 173} {"train_loss": -7.51317024230957, "global_step": 29136, "epoch": 173} {"train_loss": -7.402743339538574, "global_step": 29137, "epoch": 173} {"train_loss": -7.197096824645996, "global_step": 29138, "epoch": 173} {"train_loss": -7.597200393676758, "global_step": 29139, "epoch": 173} {"train_loss": -7.445711135864258, "global_step": 29140, "epoch": 173} {"train_loss": -7.474143981933594, "global_step": 29141, "epoch": 173} {"train_loss": -7.37467098236084, "global_step": 29142, "epoch": 173} {"train_loss": -7.187865734100342, "global_step": 29143, "epoch": 173} {"train_loss": -7.37747049331665, "global_step": 29144, "epoch": 173} {"train_loss": -7.339786052703857, "global_step": 29145, "epoch": 173} {"train_loss": -7.4211626052856445, "global_step": 29146, "epoch": 173} {"train_loss": -7.396428108215332, "global_step": 29147, "epoch": 173} {"train_loss": -7.244382381439209, "global_step": 29148, "epoch": 173} {"train_loss": -7.239116668701172, "global_step": 29149, "epoch": 173} {"train_loss": -7.362191200256348, "global_step": 29150, "epoch": 173} {"train_loss": -7.326938629150391, "global_step": 29151, "epoch": 173} {"train_loss": -7.316141128540039, "global_step": 29152, "epoch": 173} {"train_loss": -7.581076145172119, "global_step": 29153, "epoch": 173} {"train_loss": -7.357671737670898, "global_step": 29154, "epoch": 173} {"train_loss": -7.468828201293945, "global_step": 29155, "epoch": 173} {"train_loss": -7.518703460693359, "global_step": 29156, "epoch": 173} {"train_loss": -7.423328399658203, "global_step": 29157, "epoch": 173} {"train_loss": -7.561490535736084, "global_step": 29158, "epoch": 173} {"train_loss": -7.393438816070557, "global_step": 29159, "epoch": 173} {"train_loss": -7.437504291534424, "global_step": 29160, "epoch": 173} {"train_loss": -7.371089935302734, "global_step": 29161, "epoch": 173} {"train_loss": -7.703393936157227, "global_step": 29162, "epoch": 173} {"train_loss": -7.576176643371582, "global_step": 29163, "epoch": 173} {"train_loss": -7.455632209777832, "global_step": 29164, "epoch": 173} {"train_loss": -7.4545183181762695, "global_step": 29165, "epoch": 173} {"train_loss": -7.379928112030029, "global_step": 29166, "epoch": 173} {"train_loss": -7.362454414367676, "global_step": 29167, "epoch": 173} {"train_loss": -7.577400207519531, "global_step": 29168, "epoch": 173} {"train_loss": -7.64945650100708, "global_step": 29169, "epoch": 173} {"train_loss": -7.541385173797607, "global_step": 29170, "epoch": 173} {"train_loss": -7.267343521118164, "global_step": 29171, "epoch": 173} {"train_loss": -7.599964141845703, "global_step": 29172, "epoch": 173} {"train_loss": -7.510798454284668, "global_step": 29173, "epoch": 173} {"train_loss": -7.495593070983887, "global_step": 29174, "epoch": 173} {"train_loss": -7.600372314453125, "global_step": 29175, "epoch": 173} {"train_loss": -7.5713958740234375, "global_step": 29176, "epoch": 173} {"train_loss": -7.568328857421875, "global_step": 29177, "epoch": 173} {"train_loss": -7.601934432983398, "global_step": 29178, "epoch": 173} {"train_loss": -7.566348075866699, "global_step": 29179, "epoch": 173} {"train_loss": -7.775205612182617, "global_step": 29180, "epoch": 173} {"train_loss": -7.686546325683594, "global_step": 29181, "epoch": 173} {"train_loss": -7.509616851806641, "global_step": 29182, "epoch": 173} {"train_loss": -7.402651786804199, "global_step": 29183, "epoch": 173} {"train_loss": -7.709918022155762, "global_step": 29184, "epoch": 173} {"train_loss": -7.57267951965332, "global_step": 29185, "epoch": 173} {"train_loss": -7.213312149047852, "global_step": 29186, "epoch": 173} {"train_loss": -7.455235481262207, "global_step": 29187, "epoch": 173} {"train_loss": -7.634960174560547, "global_step": 29188, "epoch": 173} {"train_loss": -7.734233856201172, "global_step": 29189, "epoch": 173} {"train_loss": -7.6283721923828125, "global_step": 29190, "epoch": 173} {"train_loss": -7.321948051452637, "global_step": 29191, "epoch": 173} {"train_loss": -7.341418743133545, "global_step": 29192, "epoch": 173} {"train_loss": -7.492376804351807, "global_step": 29193, "epoch": 173} {"train_loss": -7.551688194274902, "global_step": 29194, "epoch": 173} {"train_loss": -7.392033576965332, "global_step": 29195, "epoch": 173} {"train_loss": -7.3593950271606445, "global_step": 29196, "epoch": 173} {"train_loss": -7.432610511779785, "global_step": 29197, "epoch": 173} {"train_loss": -7.340327262878418, "global_step": 29198, "epoch": 173} {"train_loss": -7.222304344177246, "global_step": 29199, "epoch": 173} {"train_loss": -7.328305244445801, "global_step": 29200, "epoch": 173} {"train_loss": -7.422826766967773, "global_step": 29201, "epoch": 173} {"train_loss": -7.2815446853637695, "global_step": 29202, "epoch": 173} {"train_loss": -7.352154731750488, "global_step": 29203, "epoch": 173} {"train_loss": -7.299507141113281, "global_step": 29204, "epoch": 173} {"train_loss": -7.508508682250977, "global_step": 29205, "epoch": 173} {"train_loss": -7.344172954559326, "global_step": 29206, "epoch": 173} {"train_loss": -7.385944366455078, "global_step": 29207, "epoch": 173} {"train_loss": -7.400291442871094, "global_step": 29208, "epoch": 173} {"train_loss": -7.2702789306640625, "global_step": 29209, "epoch": 173} {"train_loss": -7.407530784606934, "global_step": 29210, "epoch": 173} {"train_loss": -7.123746871948242, "global_step": 29211, "epoch": 173} {"train_loss": -7.457457542419434, "global_step": 29212, "epoch": 173} {"train_loss": -7.266376495361328, "global_step": 29213, "epoch": 173} {"train_loss": -7.579959869384766, "global_step": 29214, "epoch": 173} {"train_loss": -7.134612083435059, "global_step": 29215, "epoch": 173} {"train_loss": -7.325625419616699, "global_step": 29216, "epoch": 173} {"train_loss": -7.489027500152588, "global_step": 29217, "epoch": 173} {"train_loss": -7.266888618469238, "global_step": 29218, "epoch": 173} {"train_loss": -7.411370277404785, "global_step": 29219, "epoch": 173} {"train_loss": -7.240612983703613, "global_step": 29220, "epoch": 173} {"train_loss": -7.391668319702148, "global_step": 29221, "epoch": 173} {"train_loss": -7.4700093269348145, "global_step": 29222, "epoch": 173} {"train_loss": -7.397235870361328, "global_step": 29223, "epoch": 173} {"train_loss": -7.341965675354004, "global_step": 29224, "epoch": 173} {"train_loss": -7.109945297241211, "global_step": 29225, "epoch": 173} {"train_loss": -7.466280937194824, "global_step": 29226, "epoch": 173} {"train_loss": -7.211123466491699, "global_step": 29227, "epoch": 173} {"train_loss": -7.567795753479004, "global_step": 29228, "epoch": 173} {"train_loss": -7.3141984939575195, "global_step": 29229, "epoch": 173} {"train_loss": -7.254566192626953, "global_step": 29230, "epoch": 173} {"train_loss": -7.413647010212853, "global_step": 29231, "epoch": 173, "val_loss": 188897.4375} {"train_loss": -7.393669128417969, "global_step": 29232, "epoch": 174} {"train_loss": -7.357971668243408, "global_step": 29233, "epoch": 174} {"train_loss": -7.559081077575684, "global_step": 29234, "epoch": 174} {"train_loss": -7.367251873016357, "global_step": 29235, "epoch": 174} {"train_loss": -7.433087348937988, "global_step": 29236, "epoch": 174} {"train_loss": -7.477074146270752, "global_step": 29237, "epoch": 174} {"train_loss": -7.160818099975586, "global_step": 29238, "epoch": 174} {"train_loss": -7.309584617614746, "global_step": 29239, "epoch": 174} {"train_loss": -7.283166885375977, "global_step": 29240, "epoch": 174} {"train_loss": -7.328313827514648, "global_step": 29241, "epoch": 174} {"train_loss": -7.67678165435791, "global_step": 29242, "epoch": 174} {"train_loss": -7.469878673553467, "global_step": 29243, "epoch": 174} {"train_loss": -7.4053144454956055, "global_step": 29244, "epoch": 174} {"train_loss": -7.423275947570801, "global_step": 29245, "epoch": 174} {"train_loss": -7.584280967712402, "global_step": 29246, "epoch": 174} {"train_loss": -7.527190208435059, "global_step": 29247, "epoch": 174} {"train_loss": -7.641867160797119, "global_step": 29248, "epoch": 174} {"train_loss": -7.329431056976318, "global_step": 29249, "epoch": 174} {"train_loss": -7.766736030578613, "global_step": 29250, "epoch": 174} {"train_loss": -7.432703971862793, "global_step": 29251, "epoch": 174} {"train_loss": -7.629251480102539, "global_step": 29252, "epoch": 174} {"train_loss": -7.643180847167969, "global_step": 29253, "epoch": 174} {"train_loss": -7.539422988891602, "global_step": 29254, "epoch": 174} {"train_loss": -7.488764762878418, "global_step": 29255, "epoch": 174} {"train_loss": -7.574006080627441, "global_step": 29256, "epoch": 174} {"train_loss": -7.407578945159912, "global_step": 29257, "epoch": 174} {"train_loss": -7.505080699920654, "global_step": 29258, "epoch": 174} {"train_loss": -7.674544811248779, "global_step": 29259, "epoch": 174} {"train_loss": -7.621854305267334, "global_step": 29260, "epoch": 174} {"train_loss": -7.572096824645996, "global_step": 29261, "epoch": 174} {"train_loss": -7.664983749389648, "global_step": 29262, "epoch": 174} {"train_loss": -7.608280181884766, "global_step": 29263, "epoch": 174} {"train_loss": -7.56007719039917, "global_step": 29264, "epoch": 174} {"train_loss": -7.808803081512451, "global_step": 29265, "epoch": 174} {"train_loss": -7.366199493408203, "global_step": 29266, "epoch": 174} {"train_loss": -7.582339763641357, "global_step": 29267, "epoch": 174} {"train_loss": -7.004785537719727, "global_step": 29268, "epoch": 174} {"train_loss": -7.37669563293457, "global_step": 29269, "epoch": 174} {"train_loss": -7.60936164855957, "global_step": 29270, "epoch": 174} {"train_loss": -7.472150802612305, "global_step": 29271, "epoch": 174} {"train_loss": -7.373473167419434, "global_step": 29272, "epoch": 174} {"train_loss": -7.448113441467285, "global_step": 29273, "epoch": 174} {"train_loss": -7.390096187591553, "global_step": 29274, "epoch": 174} {"train_loss": -7.199479103088379, "global_step": 29275, "epoch": 174} {"train_loss": -7.510845184326172, "global_step": 29276, "epoch": 174} {"train_loss": -7.451132774353027, "global_step": 29277, "epoch": 174} {"train_loss": -7.294281005859375, "global_step": 29278, "epoch": 174} {"train_loss": -7.5276899337768555, "global_step": 29279, "epoch": 174} {"train_loss": -7.599789619445801, "global_step": 29280, "epoch": 174} {"train_loss": -7.395355701446533, "global_step": 29281, "epoch": 174} {"train_loss": -7.436351299285889, "global_step": 29282, "epoch": 174} {"train_loss": -7.323957443237305, "global_step": 29283, "epoch": 174} {"train_loss": -7.181681156158447, "global_step": 29284, "epoch": 174} {"train_loss": -7.432993412017822, "global_step": 29285, "epoch": 174} {"train_loss": -7.404187202453613, "global_step": 29286, "epoch": 174} {"train_loss": -7.1202497482299805, "global_step": 29287, "epoch": 174} {"train_loss": -7.2617902755737305, "global_step": 29288, "epoch": 174} {"train_loss": -7.347588539123535, "global_step": 29289, "epoch": 174} {"train_loss": -7.36160945892334, "global_step": 29290, "epoch": 174} {"train_loss": -7.5248942375183105, "global_step": 29291, "epoch": 174} {"train_loss": -7.3423004150390625, "global_step": 29292, "epoch": 174} {"train_loss": -7.493368148803711, "global_step": 29293, "epoch": 174} {"train_loss": -7.37158203125, "global_step": 29294, "epoch": 174} {"train_loss": -7.454959869384766, "global_step": 29295, "epoch": 174} {"train_loss": -7.547852039337158, "global_step": 29296, "epoch": 174} {"train_loss": -7.527340888977051, "global_step": 29297, "epoch": 174} {"train_loss": -7.442455291748047, "global_step": 29298, "epoch": 174} {"train_loss": -7.4038920402526855, "global_step": 29299, "epoch": 174} {"train_loss": -7.721917629241943, "global_step": 29300, "epoch": 174} {"train_loss": -7.486627578735352, "global_step": 29301, "epoch": 174} {"train_loss": -7.538753509521484, "global_step": 29302, "epoch": 174} {"train_loss": -7.521087646484375, "global_step": 29303, "epoch": 174} {"train_loss": -7.407925605773926, "global_step": 29304, "epoch": 174} {"train_loss": -7.333294868469238, "global_step": 29305, "epoch": 174} {"train_loss": -7.600472927093506, "global_step": 29306, "epoch": 174} {"train_loss": -7.362281799316406, "global_step": 29307, "epoch": 174} {"train_loss": -7.291735649108887, "global_step": 29308, "epoch": 174} {"train_loss": -7.372389316558838, "global_step": 29309, "epoch": 174} {"train_loss": -7.535635948181152, "global_step": 29310, "epoch": 174} {"train_loss": -7.5487565994262695, "global_step": 29311, "epoch": 174} {"train_loss": -7.433055877685547, "global_step": 29312, "epoch": 174} {"train_loss": -7.401169776916504, "global_step": 29313, "epoch": 174} {"train_loss": -7.3626275062561035, "global_step": 29314, "epoch": 174} {"train_loss": -7.5050530433654785, "global_step": 29315, "epoch": 174} {"train_loss": -7.676844596862793, "global_step": 29316, "epoch": 174} {"train_loss": -7.406630516052246, "global_step": 29317, "epoch": 174} {"train_loss": -7.3370232582092285, "global_step": 29318, "epoch": 174} {"train_loss": -7.602048397064209, "global_step": 29319, "epoch": 174} {"train_loss": -7.703745365142822, "global_step": 29320, "epoch": 174} {"train_loss": -7.500908851623535, "global_step": 29321, "epoch": 174} {"train_loss": -7.600336074829102, "global_step": 29322, "epoch": 174} {"train_loss": -7.426979064941406, "global_step": 29323, "epoch": 174} {"train_loss": -7.556482791900635, "global_step": 29324, "epoch": 174} {"train_loss": -7.619514465332031, "global_step": 29325, "epoch": 174} {"train_loss": -7.446983337402344, "global_step": 29326, "epoch": 174} {"train_loss": -7.622068405151367, "global_step": 29327, "epoch": 174} {"train_loss": -7.5299296379089355, "global_step": 29328, "epoch": 174} {"train_loss": -7.558423042297363, "global_step": 29329, "epoch": 174} {"train_loss": -7.553194999694824, "global_step": 29330, "epoch": 174} {"train_loss": -7.349712371826172, "global_step": 29331, "epoch": 174} {"train_loss": -7.51790714263916, "global_step": 29332, "epoch": 174} {"train_loss": -7.442379951477051, "global_step": 29333, "epoch": 174} {"train_loss": -7.391946792602539, "global_step": 29334, "epoch": 174} {"train_loss": -7.087245464324951, "global_step": 29335, "epoch": 174} {"train_loss": -7.278682231903076, "global_step": 29336, "epoch": 174} {"train_loss": -7.472245693206787, "global_step": 29337, "epoch": 174} {"train_loss": -7.536947250366211, "global_step": 29338, "epoch": 174} {"train_loss": -7.135509014129639, "global_step": 29339, "epoch": 174} {"train_loss": -7.401119232177734, "global_step": 29340, "epoch": 174} {"train_loss": -7.450927734375, "global_step": 29341, "epoch": 174} {"train_loss": -7.4905900955200195, "global_step": 29342, "epoch": 174} {"train_loss": -7.329672813415527, "global_step": 29343, "epoch": 174} {"train_loss": -7.619098663330078, "global_step": 29344, "epoch": 174} {"train_loss": -7.171156883239746, "global_step": 29345, "epoch": 174} {"train_loss": -7.5418009757995605, "global_step": 29346, "epoch": 174} {"train_loss": -7.4590654373168945, "global_step": 29347, "epoch": 174} {"train_loss": -7.3856096267700195, "global_step": 29348, "epoch": 174} {"train_loss": -7.3489580154418945, "global_step": 29349, "epoch": 174} {"train_loss": -7.3460893630981445, "global_step": 29350, "epoch": 174} {"train_loss": -7.5909318923950195, "global_step": 29351, "epoch": 174} {"train_loss": -7.250811576843262, "global_step": 29352, "epoch": 174} {"train_loss": -7.424807548522949, "global_step": 29353, "epoch": 174} {"train_loss": -7.594749927520752, "global_step": 29354, "epoch": 174} {"train_loss": -7.279029846191406, "global_step": 29355, "epoch": 174} {"train_loss": -7.627375602722168, "global_step": 29356, "epoch": 174} {"train_loss": -7.508449554443359, "global_step": 29357, "epoch": 174} {"train_loss": -7.608513832092285, "global_step": 29358, "epoch": 174} {"train_loss": -7.216815948486328, "global_step": 29359, "epoch": 174} {"train_loss": -7.571379661560059, "global_step": 29360, "epoch": 174} {"train_loss": -7.08975887298584, "global_step": 29361, "epoch": 174} {"train_loss": -7.534869194030762, "global_step": 29362, "epoch": 174} {"train_loss": -7.304375648498535, "global_step": 29363, "epoch": 174} {"train_loss": -7.225431442260742, "global_step": 29364, "epoch": 174} {"train_loss": -7.318641662597656, "global_step": 29365, "epoch": 174} {"train_loss": -7.454627990722656, "global_step": 29366, "epoch": 174} {"train_loss": -7.213467597961426, "global_step": 29367, "epoch": 174} {"train_loss": -7.540688514709473, "global_step": 29368, "epoch": 174} {"train_loss": -7.463063716888428, "global_step": 29369, "epoch": 174} {"train_loss": -7.293788909912109, "global_step": 29370, "epoch": 174} {"train_loss": -7.552374839782715, "global_step": 29371, "epoch": 174} {"train_loss": -7.416518211364746, "global_step": 29372, "epoch": 174} {"train_loss": -7.574855327606201, "global_step": 29373, "epoch": 174} {"train_loss": -7.365307807922363, "global_step": 29374, "epoch": 174} {"train_loss": -7.281097888946533, "global_step": 29375, "epoch": 174} {"train_loss": -7.277723789215088, "global_step": 29376, "epoch": 174} {"train_loss": -7.493985176086426, "global_step": 29377, "epoch": 174} {"train_loss": -7.2371110916137695, "global_step": 29378, "epoch": 174} {"train_loss": -7.461825370788574, "global_step": 29379, "epoch": 174} {"train_loss": -7.543368339538574, "global_step": 29380, "epoch": 174} {"train_loss": -7.284055709838867, "global_step": 29381, "epoch": 174} {"train_loss": -7.564182281494141, "global_step": 29382, "epoch": 174} {"train_loss": -7.524370193481445, "global_step": 29383, "epoch": 174} {"train_loss": -7.421088695526123, "global_step": 29384, "epoch": 174} {"train_loss": -7.516263961791992, "global_step": 29385, "epoch": 174} {"train_loss": -7.238282203674316, "global_step": 29386, "epoch": 174} {"train_loss": -7.432835578918457, "global_step": 29387, "epoch": 174} {"train_loss": -7.317376136779785, "global_step": 29388, "epoch": 174} {"train_loss": -7.42349910736084, "global_step": 29389, "epoch": 174} {"train_loss": -7.02400541305542, "global_step": 29390, "epoch": 174} {"train_loss": -7.385147571563721, "global_step": 29391, "epoch": 174} {"train_loss": -7.5569257736206055, "global_step": 29392, "epoch": 174} {"train_loss": -7.4982008934021, "global_step": 29393, "epoch": 174} {"train_loss": -7.4603986740112305, "global_step": 29394, "epoch": 174} {"train_loss": -7.49960994720459, "global_step": 29395, "epoch": 174} {"train_loss": -7.638791084289551, "global_step": 29396, "epoch": 174} {"train_loss": -7.327634811401367, "global_step": 29397, "epoch": 174} {"train_loss": -7.394719123840332, "global_step": 29398, "epoch": 174} {"train_loss": -7.441613759313311, "global_step": 29399, "epoch": 174, "val_loss": 189115.0} {"train_loss": -7.2534074783325195, "global_step": 29400, "epoch": 175} {"train_loss": -7.282106399536133, "global_step": 29401, "epoch": 175} {"train_loss": -7.42452335357666, "global_step": 29402, "epoch": 175} {"train_loss": -7.192712783813477, "global_step": 29403, "epoch": 175} {"train_loss": -7.036293983459473, "global_step": 29404, "epoch": 175} {"train_loss": -7.200414657592773, "global_step": 29405, "epoch": 175} {"train_loss": -7.369657039642334, "global_step": 29406, "epoch": 175} {"train_loss": -7.205959320068359, "global_step": 29407, "epoch": 175} {"train_loss": -7.406931400299072, "global_step": 29408, "epoch": 175} {"train_loss": -7.14069938659668, "global_step": 29409, "epoch": 175} {"train_loss": -7.287976264953613, "global_step": 29410, "epoch": 175} {"train_loss": -7.134693145751953, "global_step": 29411, "epoch": 175} {"train_loss": -7.362426280975342, "global_step": 29412, "epoch": 175} {"train_loss": -7.350297927856445, "global_step": 29413, "epoch": 175} {"train_loss": -7.305899620056152, "global_step": 29414, "epoch": 175} {"train_loss": -7.264688491821289, "global_step": 29415, "epoch": 175} {"train_loss": -7.137447834014893, "global_step": 29416, "epoch": 175} {"train_loss": -7.326835632324219, "global_step": 29417, "epoch": 175} {"train_loss": -7.114089012145996, "global_step": 29418, "epoch": 175} {"train_loss": -7.296232223510742, "global_step": 29419, "epoch": 175} {"train_loss": -7.180613994598389, "global_step": 29420, "epoch": 175} {"train_loss": -7.154600620269775, "global_step": 29421, "epoch": 175} {"train_loss": -6.8611602783203125, "global_step": 29422, "epoch": 175} {"train_loss": -7.152828216552734, "global_step": 29423, "epoch": 175} {"train_loss": -7.253652572631836, "global_step": 29424, "epoch": 175} {"train_loss": -7.21791410446167, "global_step": 29425, "epoch": 175} {"train_loss": -7.062309265136719, "global_step": 29426, "epoch": 175} {"train_loss": -7.314589500427246, "global_step": 29427, "epoch": 175} {"train_loss": -7.360818862915039, "global_step": 29428, "epoch": 175} {"train_loss": -7.202319622039795, "global_step": 29429, "epoch": 175} {"train_loss": -7.497533798217773, "global_step": 29430, "epoch": 175} {"train_loss": -7.374729633331299, "global_step": 29431, "epoch": 175} {"train_loss": -7.318401336669922, "global_step": 29432, "epoch": 175} {"train_loss": -7.3890790939331055, "global_step": 29433, "epoch": 175} {"train_loss": -7.329954147338867, "global_step": 29434, "epoch": 175} {"train_loss": -7.265576362609863, "global_step": 29435, "epoch": 175} {"train_loss": -7.39419412612915, "global_step": 29436, "epoch": 175} {"train_loss": -7.437185287475586, "global_step": 29437, "epoch": 175} {"train_loss": -7.285714149475098, "global_step": 29438, "epoch": 175} {"train_loss": -7.380113124847412, "global_step": 29439, "epoch": 175} {"train_loss": -7.540692329406738, "global_step": 29440, "epoch": 175} {"train_loss": -7.310601234436035, "global_step": 29441, "epoch": 175} {"train_loss": -7.441741466522217, "global_step": 29442, "epoch": 175} {"train_loss": -7.659296035766602, "global_step": 29443, "epoch": 175} {"train_loss": -7.4661359786987305, "global_step": 29444, "epoch": 175} {"train_loss": -7.56529426574707, "global_step": 29445, "epoch": 175} {"train_loss": -7.4929046630859375, "global_step": 29446, "epoch": 175} {"train_loss": -7.524425506591797, "global_step": 29447, "epoch": 175} {"train_loss": -7.484799385070801, "global_step": 29448, "epoch": 175} {"train_loss": -7.590514659881592, "global_step": 29449, "epoch": 175} {"train_loss": -7.752384185791016, "global_step": 29450, "epoch": 175} {"train_loss": -7.488175868988037, "global_step": 29451, "epoch": 175} {"train_loss": -7.85009241104126, "global_step": 29452, "epoch": 175} {"train_loss": -7.545047760009766, "global_step": 29453, "epoch": 175} {"train_loss": -7.474856853485107, "global_step": 29454, "epoch": 175} {"train_loss": -7.534079551696777, "global_step": 29455, "epoch": 175} {"train_loss": -7.808523178100586, "global_step": 29456, "epoch": 175} {"train_loss": -7.516533851623535, "global_step": 29457, "epoch": 175} {"train_loss": -7.653717994689941, "global_step": 29458, "epoch": 175} {"train_loss": -7.619631290435791, "global_step": 29459, "epoch": 175} {"train_loss": -7.628817558288574, "global_step": 29460, "epoch": 175} {"train_loss": -7.541565895080566, "global_step": 29461, "epoch": 175} {"train_loss": -7.533472061157227, "global_step": 29462, "epoch": 175} {"train_loss": -7.28635311126709, "global_step": 29463, "epoch": 175} {"train_loss": -7.612566947937012, "global_step": 29464, "epoch": 175} {"train_loss": -7.177541255950928, "global_step": 29465, "epoch": 175} {"train_loss": -7.263130187988281, "global_step": 29466, "epoch": 175} {"train_loss": -7.443619251251221, "global_step": 29467, "epoch": 175} {"train_loss": -7.263547897338867, "global_step": 29468, "epoch": 175} {"train_loss": -7.195271015167236, "global_step": 29469, "epoch": 175} {"train_loss": -7.253452301025391, "global_step": 29470, "epoch": 175} {"train_loss": -7.375544548034668, "global_step": 29471, "epoch": 175} {"train_loss": -7.3597846031188965, "global_step": 29472, "epoch": 175} {"train_loss": -7.2418975830078125, "global_step": 29473, "epoch": 175} {"train_loss": -7.442915439605713, "global_step": 29474, "epoch": 175} {"train_loss": -7.343741416931152, "global_step": 29475, "epoch": 175} {"train_loss": -7.396448135375977, "global_step": 29476, "epoch": 175} {"train_loss": -7.125371932983398, "global_step": 29477, "epoch": 175} {"train_loss": -7.2440385818481445, "global_step": 29478, "epoch": 175} {"train_loss": -7.193531036376953, "global_step": 29479, "epoch": 175} {"train_loss": -7.4973955154418945, "global_step": 29480, "epoch": 175} {"train_loss": -7.237397193908691, "global_step": 29481, "epoch": 175} {"train_loss": -7.286094665527344, "global_step": 29482, "epoch": 175} {"train_loss": -7.225358963012695, "global_step": 29483, "epoch": 175} {"train_loss": -7.20143985748291, "global_step": 29484, "epoch": 175} {"train_loss": -7.280368804931641, "global_step": 29485, "epoch": 175} {"train_loss": -7.598113059997559, "global_step": 29486, "epoch": 175} {"train_loss": -7.324521541595459, "global_step": 29487, "epoch": 175} {"train_loss": -7.417061805725098, "global_step": 29488, "epoch": 175} {"train_loss": -7.408389091491699, "global_step": 29489, "epoch": 175} {"train_loss": -7.432229995727539, "global_step": 29490, "epoch": 175} {"train_loss": -7.540894508361816, "global_step": 29491, "epoch": 175} {"train_loss": -7.598243713378906, "global_step": 29492, "epoch": 175} {"train_loss": -7.472004413604736, "global_step": 29493, "epoch": 175} {"train_loss": -7.394278526306152, "global_step": 29494, "epoch": 175} {"train_loss": -7.6290364265441895, "global_step": 29495, "epoch": 175} {"train_loss": -7.667361736297607, "global_step": 29496, "epoch": 175} {"train_loss": -7.5418877601623535, "global_step": 29497, "epoch": 175} {"train_loss": -7.501224994659424, "global_step": 29498, "epoch": 175} {"train_loss": -7.542927265167236, "global_step": 29499, "epoch": 175} {"train_loss": -7.326202869415283, "global_step": 29500, "epoch": 175} {"train_loss": -7.47429084777832, "global_step": 29501, "epoch": 175} {"train_loss": -7.355823516845703, "global_step": 29502, "epoch": 175} {"train_loss": -7.6066179275512695, "global_step": 29503, "epoch": 175} {"train_loss": -7.5418901443481445, "global_step": 29504, "epoch": 175} {"train_loss": -7.378787994384766, "global_step": 29505, "epoch": 175} {"train_loss": -7.509077072143555, "global_step": 29506, "epoch": 175} {"train_loss": -7.347395896911621, "global_step": 29507, "epoch": 175} {"train_loss": -7.480084419250488, "global_step": 29508, "epoch": 175} {"train_loss": -7.639406204223633, "global_step": 29509, "epoch": 175} {"train_loss": -7.431003570556641, "global_step": 29510, "epoch": 175} {"train_loss": -7.377993106842041, "global_step": 29511, "epoch": 175} {"train_loss": -7.4636030197143555, "global_step": 29512, "epoch": 175} {"train_loss": -7.451737403869629, "global_step": 29513, "epoch": 175} {"train_loss": -7.6480817794799805, "global_step": 29514, "epoch": 175} {"train_loss": -7.639314651489258, "global_step": 29515, "epoch": 175} {"train_loss": -7.657041072845459, "global_step": 29516, "epoch": 175} {"train_loss": -7.407155513763428, "global_step": 29517, "epoch": 175} {"train_loss": -7.547816276550293, "global_step": 29518, "epoch": 175} {"train_loss": -7.621349334716797, "global_step": 29519, "epoch": 175} {"train_loss": -7.4949188232421875, "global_step": 29520, "epoch": 175} {"train_loss": -7.418088912963867, "global_step": 29521, "epoch": 175} {"train_loss": -7.526721954345703, "global_step": 29522, "epoch": 175} {"train_loss": -7.398719310760498, "global_step": 29523, "epoch": 175} {"train_loss": -7.435011863708496, "global_step": 29524, "epoch": 175} {"train_loss": -7.665555000305176, "global_step": 29525, "epoch": 175} {"train_loss": -7.44536018371582, "global_step": 29526, "epoch": 175} {"train_loss": -7.440752029418945, "global_step": 29527, "epoch": 175} {"train_loss": -7.525548934936523, "global_step": 29528, "epoch": 175} {"train_loss": -7.522568702697754, "global_step": 29529, "epoch": 175} {"train_loss": -7.696600914001465, "global_step": 29530, "epoch": 175} {"train_loss": -7.425165176391602, "global_step": 29531, "epoch": 175} {"train_loss": -7.547512531280518, "global_step": 29532, "epoch": 175} {"train_loss": -7.507302284240723, "global_step": 29533, "epoch": 175} {"train_loss": -7.597161293029785, "global_step": 29534, "epoch": 175} {"train_loss": -7.5233235359191895, "global_step": 29535, "epoch": 175} {"train_loss": -7.344768524169922, "global_step": 29536, "epoch": 175} {"train_loss": -7.299411773681641, "global_step": 29537, "epoch": 175} {"train_loss": -7.642709732055664, "global_step": 29538, "epoch": 175} {"train_loss": -7.347358703613281, "global_step": 29539, "epoch": 175} {"train_loss": -7.4996657371521, "global_step": 29540, "epoch": 175} {"train_loss": -7.295907974243164, "global_step": 29541, "epoch": 175} {"train_loss": -7.497214317321777, "global_step": 29542, "epoch": 175} {"train_loss": -7.606090545654297, "global_step": 29543, "epoch": 175} {"train_loss": -7.608170509338379, "global_step": 29544, "epoch": 175} {"train_loss": -7.455636024475098, "global_step": 29545, "epoch": 175} {"train_loss": -7.317577362060547, "global_step": 29546, "epoch": 175} {"train_loss": -7.530976295471191, "global_step": 29547, "epoch": 175} {"train_loss": -7.363576412200928, "global_step": 29548, "epoch": 175} {"train_loss": -7.565730094909668, "global_step": 29549, "epoch": 175} {"train_loss": -7.549910068511963, "global_step": 29550, "epoch": 175} {"train_loss": -7.372653961181641, "global_step": 29551, "epoch": 175} {"train_loss": -7.75434684753418, "global_step": 29552, "epoch": 175} {"train_loss": -7.629175186157227, "global_step": 29553, "epoch": 175} {"train_loss": -7.54880428314209, "global_step": 29554, "epoch": 175} {"train_loss": -7.490163803100586, "global_step": 29555, "epoch": 175} {"train_loss": -7.471278190612793, "global_step": 29556, "epoch": 175} {"train_loss": -7.430196762084961, "global_step": 29557, "epoch": 175} {"train_loss": -7.418712615966797, "global_step": 29558, "epoch": 175} {"train_loss": -7.631339073181152, "global_step": 29559, "epoch": 175} {"train_loss": -7.564496994018555, "global_step": 29560, "epoch": 175} {"train_loss": -7.360908031463623, "global_step": 29561, "epoch": 175} {"train_loss": -7.396597862243652, "global_step": 29562, "epoch": 175} {"train_loss": -7.468809604644775, "global_step": 29563, "epoch": 175} {"train_loss": -7.561966896057129, "global_step": 29564, "epoch": 175} {"train_loss": -7.501476287841797, "global_step": 29565, "epoch": 175} {"train_loss": -7.394599914550781, "global_step": 29566, "epoch": 175} {"train_loss": -7.423114603474026, "global_step": 29567, "epoch": 175, "val_loss": 192858.03125, "train_action_mse_error": 8.657953262329102} {"train_loss": -7.507262706756592, "global_step": 29568, "epoch": 176} {"train_loss": -7.653730392456055, "global_step": 29569, "epoch": 176} {"train_loss": -7.172770977020264, "global_step": 29570, "epoch": 176} {"train_loss": -7.513894081115723, "global_step": 29571, "epoch": 176} {"train_loss": -7.642441749572754, "global_step": 29572, "epoch": 176} {"train_loss": -7.301092624664307, "global_step": 29573, "epoch": 176} {"train_loss": -7.124948978424072, "global_step": 29574, "epoch": 176} {"train_loss": -7.253572463989258, "global_step": 29575, "epoch": 176} {"train_loss": -7.375316143035889, "global_step": 29576, "epoch": 176} {"train_loss": -7.384138584136963, "global_step": 29577, "epoch": 176} {"train_loss": -7.431587219238281, "global_step": 29578, "epoch": 176} {"train_loss": -7.1280083656311035, "global_step": 29579, "epoch": 176} {"train_loss": -7.345941543579102, "global_step": 29580, "epoch": 176} {"train_loss": -7.521998405456543, "global_step": 29581, "epoch": 176} {"train_loss": -7.5078020095825195, "global_step": 29582, "epoch": 176} {"train_loss": -7.378596782684326, "global_step": 29583, "epoch": 176} {"train_loss": -7.176926612854004, "global_step": 29584, "epoch": 176} {"train_loss": -7.415568828582764, "global_step": 29585, "epoch": 176} {"train_loss": -7.204949378967285, "global_step": 29586, "epoch": 176} {"train_loss": -7.441525459289551, "global_step": 29587, "epoch": 176} {"train_loss": -7.261635780334473, "global_step": 29588, "epoch": 176} {"train_loss": -7.387534141540527, "global_step": 29589, "epoch": 176} {"train_loss": -7.267141342163086, "global_step": 29590, "epoch": 176} {"train_loss": -7.2622151374816895, "global_step": 29591, "epoch": 176} {"train_loss": -7.432617664337158, "global_step": 29592, "epoch": 176} {"train_loss": -7.248872756958008, "global_step": 29593, "epoch": 176} {"train_loss": -7.417361259460449, "global_step": 29594, "epoch": 176} {"train_loss": -7.669927597045898, "global_step": 29595, "epoch": 176} {"train_loss": -7.490705490112305, "global_step": 29596, "epoch": 176} {"train_loss": -7.578531265258789, "global_step": 29597, "epoch": 176} {"train_loss": -7.387576103210449, "global_step": 29598, "epoch": 176} {"train_loss": -7.43726921081543, "global_step": 29599, "epoch": 176} {"train_loss": -7.527745723724365, "global_step": 29600, "epoch": 176} {"train_loss": -7.387509822845459, "global_step": 29601, "epoch": 176} {"train_loss": -7.526622295379639, "global_step": 29602, "epoch": 176} {"train_loss": -7.468820095062256, "global_step": 29603, "epoch": 176} {"train_loss": -7.602181434631348, "global_step": 29604, "epoch": 176} {"train_loss": -7.617417335510254, "global_step": 29605, "epoch": 176} {"train_loss": -7.583747863769531, "global_step": 29606, "epoch": 176} {"train_loss": -7.472280502319336, "global_step": 29607, "epoch": 176} {"train_loss": -7.63266658782959, "global_step": 29608, "epoch": 176} {"train_loss": -7.4668989181518555, "global_step": 29609, "epoch": 176} {"train_loss": -7.481546878814697, "global_step": 29610, "epoch": 176} {"train_loss": -7.366382122039795, "global_step": 29611, "epoch": 176} {"train_loss": -7.474332332611084, "global_step": 29612, "epoch": 176} {"train_loss": -7.197437286376953, "global_step": 29613, "epoch": 176} {"train_loss": -7.40833044052124, "global_step": 29614, "epoch": 176} {"train_loss": -7.134449005126953, "global_step": 29615, "epoch": 176} {"train_loss": -7.554947376251221, "global_step": 29616, "epoch": 176} {"train_loss": -7.207904815673828, "global_step": 29617, "epoch": 176} {"train_loss": -7.607928276062012, "global_step": 29618, "epoch": 176} {"train_loss": -7.210560321807861, "global_step": 29619, "epoch": 176} {"train_loss": -7.246563911437988, "global_step": 29620, "epoch": 176} {"train_loss": -7.257285118103027, "global_step": 29621, "epoch": 176} {"train_loss": -7.303682327270508, "global_step": 29622, "epoch": 176} {"train_loss": -7.400350570678711, "global_step": 29623, "epoch": 176} {"train_loss": -7.706444263458252, "global_step": 29624, "epoch": 176} {"train_loss": -7.465428352355957, "global_step": 29625, "epoch": 176} {"train_loss": -7.441524505615234, "global_step": 29626, "epoch": 176} {"train_loss": -7.488338470458984, "global_step": 29627, "epoch": 176} {"train_loss": -7.580018043518066, "global_step": 29628, "epoch": 176} {"train_loss": -7.606141090393066, "global_step": 29629, "epoch": 176} {"train_loss": -7.510559558868408, "global_step": 29630, "epoch": 176} {"train_loss": -7.414645195007324, "global_step": 29631, "epoch": 176} {"train_loss": -7.447028160095215, "global_step": 29632, "epoch": 176} {"train_loss": -7.487067222595215, "global_step": 29633, "epoch": 176} {"train_loss": -7.495287895202637, "global_step": 29634, "epoch": 176} {"train_loss": -7.654940605163574, "global_step": 29635, "epoch": 176} {"train_loss": -7.530825138092041, "global_step": 29636, "epoch": 176} {"train_loss": -7.77542781829834, "global_step": 29637, "epoch": 176} {"train_loss": -7.537572383880615, "global_step": 29638, "epoch": 176} {"train_loss": -7.396533012390137, "global_step": 29639, "epoch": 176} {"train_loss": -7.569134712219238, "global_step": 29640, "epoch": 176} {"train_loss": -7.509891510009766, "global_step": 29641, "epoch": 176} {"train_loss": -7.379223346710205, "global_step": 29642, "epoch": 176} {"train_loss": -7.355897903442383, "global_step": 29643, "epoch": 176} {"train_loss": -7.534067153930664, "global_step": 29644, "epoch": 176} {"train_loss": -7.621971130371094, "global_step": 29645, "epoch": 176} {"train_loss": -7.159000873565674, "global_step": 29646, "epoch": 176} {"train_loss": -7.415853500366211, "global_step": 29647, "epoch": 176} {"train_loss": -7.4201788902282715, "global_step": 29648, "epoch": 176} {"train_loss": -7.427967071533203, "global_step": 29649, "epoch": 176} {"train_loss": -7.398151397705078, "global_step": 29650, "epoch": 176} {"train_loss": -7.555139541625977, "global_step": 29651, "epoch": 176} {"train_loss": -7.608004093170166, "global_step": 29652, "epoch": 176} {"train_loss": -7.603984832763672, "global_step": 29653, "epoch": 176} {"train_loss": -7.485655307769775, "global_step": 29654, "epoch": 176} {"train_loss": -7.140946388244629, "global_step": 29655, "epoch": 176} {"train_loss": -7.484305381774902, "global_step": 29656, "epoch": 176} {"train_loss": -7.664636611938477, "global_step": 29657, "epoch": 176} {"train_loss": -7.537222385406494, "global_step": 29658, "epoch": 176} {"train_loss": -7.692779541015625, "global_step": 29659, "epoch": 176} {"train_loss": -7.537328720092773, "global_step": 29660, "epoch": 176} {"train_loss": -7.56971549987793, "global_step": 29661, "epoch": 176} {"train_loss": -7.556900978088379, "global_step": 29662, "epoch": 176} {"train_loss": -7.548336029052734, "global_step": 29663, "epoch": 176} {"train_loss": -7.669801235198975, "global_step": 29664, "epoch": 176} {"train_loss": -7.683809280395508, "global_step": 29665, "epoch": 176} {"train_loss": -7.148142337799072, "global_step": 29666, "epoch": 176} {"train_loss": -7.5538225173950195, "global_step": 29667, "epoch": 176} {"train_loss": -7.311448097229004, "global_step": 29668, "epoch": 176} {"train_loss": -7.504855632781982, "global_step": 29669, "epoch": 176} {"train_loss": -7.579543113708496, "global_step": 29670, "epoch": 176} {"train_loss": -7.709184646606445, "global_step": 29671, "epoch": 176} {"train_loss": -7.153860092163086, "global_step": 29672, "epoch": 176} {"train_loss": -7.428990840911865, "global_step": 29673, "epoch": 176} {"train_loss": -7.430325031280518, "global_step": 29674, "epoch": 176} {"train_loss": -7.549103260040283, "global_step": 29675, "epoch": 176} {"train_loss": -7.481425762176514, "global_step": 29676, "epoch": 176} {"train_loss": -7.294320583343506, "global_step": 29677, "epoch": 176} {"train_loss": -7.463841438293457, "global_step": 29678, "epoch": 176} {"train_loss": -7.301405906677246, "global_step": 29679, "epoch": 176} {"train_loss": -7.409757137298584, "global_step": 29680, "epoch": 176} {"train_loss": -7.342303276062012, "global_step": 29681, "epoch": 176} {"train_loss": -7.532588005065918, "global_step": 29682, "epoch": 176} {"train_loss": -7.218827724456787, "global_step": 29683, "epoch": 176} {"train_loss": -7.170358180999756, "global_step": 29684, "epoch": 176} {"train_loss": -7.651869297027588, "global_step": 29685, "epoch": 176} {"train_loss": -7.5236310958862305, "global_step": 29686, "epoch": 176} {"train_loss": -7.662352561950684, "global_step": 29687, "epoch": 176} {"train_loss": -7.298779487609863, "global_step": 29688, "epoch": 176} {"train_loss": -7.573023319244385, "global_step": 29689, "epoch": 176} {"train_loss": -7.393585205078125, "global_step": 29690, "epoch": 176} {"train_loss": -7.281551837921143, "global_step": 29691, "epoch": 176} {"train_loss": -7.496358871459961, "global_step": 29692, "epoch": 176} {"train_loss": -7.326583385467529, "global_step": 29693, "epoch": 176} {"train_loss": -7.387618541717529, "global_step": 29694, "epoch": 176} {"train_loss": -7.418809413909912, "global_step": 29695, "epoch": 176} {"train_loss": -7.584228992462158, "global_step": 29696, "epoch": 176} {"train_loss": -7.394291877746582, "global_step": 29697, "epoch": 176} {"train_loss": -7.399795055389404, "global_step": 29698, "epoch": 176} {"train_loss": -7.336875915527344, "global_step": 29699, "epoch": 176} {"train_loss": -7.622512340545654, "global_step": 29700, "epoch": 176} {"train_loss": -7.341408729553223, "global_step": 29701, "epoch": 176} {"train_loss": -7.510286808013916, "global_step": 29702, "epoch": 176} {"train_loss": -7.362523078918457, "global_step": 29703, "epoch": 176} {"train_loss": -7.449810981750488, "global_step": 29704, "epoch": 176} {"train_loss": -7.280248641967773, "global_step": 29705, "epoch": 176} {"train_loss": -7.502089500427246, "global_step": 29706, "epoch": 176} {"train_loss": -7.303183555603027, "global_step": 29707, "epoch": 176} {"train_loss": -7.448535919189453, "global_step": 29708, "epoch": 176} {"train_loss": -7.289449214935303, "global_step": 29709, "epoch": 176} {"train_loss": -7.274001121520996, "global_step": 29710, "epoch": 176} {"train_loss": -7.299369812011719, "global_step": 29711, "epoch": 176} {"train_loss": -7.60205602645874, "global_step": 29712, "epoch": 176} {"train_loss": -7.564789295196533, "global_step": 29713, "epoch": 176} {"train_loss": -7.331792831420898, "global_step": 29714, "epoch": 176} {"train_loss": -7.560384750366211, "global_step": 29715, "epoch": 176} {"train_loss": -7.368444919586182, "global_step": 29716, "epoch": 176} {"train_loss": -7.254478931427002, "global_step": 29717, "epoch": 176} {"train_loss": -7.382940292358398, "global_step": 29718, "epoch": 176} {"train_loss": -7.399572372436523, "global_step": 29719, "epoch": 176} {"train_loss": -7.421387672424316, "global_step": 29720, "epoch": 176} {"train_loss": -7.262551307678223, "global_step": 29721, "epoch": 176} {"train_loss": -7.343661308288574, "global_step": 29722, "epoch": 176} {"train_loss": -7.3378777503967285, "global_step": 29723, "epoch": 176} {"train_loss": -7.604918479919434, "global_step": 29724, "epoch": 176} {"train_loss": -7.288086891174316, "global_step": 29725, "epoch": 176} {"train_loss": -7.516105651855469, "global_step": 29726, "epoch": 176} {"train_loss": -7.491295337677002, "global_step": 29727, "epoch": 176} {"train_loss": -7.431089401245117, "global_step": 29728, "epoch": 176} {"train_loss": -7.301642894744873, "global_step": 29729, "epoch": 176} {"train_loss": -7.586515426635742, "global_step": 29730, "epoch": 176} {"train_loss": -7.604376792907715, "global_step": 29731, "epoch": 176} {"train_loss": -7.304080009460449, "global_step": 29732, "epoch": 176} {"train_loss": -7.455682277679443, "global_step": 29733, "epoch": 176} {"train_loss": -7.387190818786621, "global_step": 29734, "epoch": 176} {"train_loss": -7.435924544220879, "global_step": 29735, "epoch": 176, "val_loss": 188102.3125} {"train_loss": -7.451650619506836, "global_step": 29736, "epoch": 177} {"train_loss": -7.111915588378906, "global_step": 29737, "epoch": 177} {"train_loss": -7.048666477203369, "global_step": 29738, "epoch": 177} {"train_loss": -7.416349411010742, "global_step": 29739, "epoch": 177} {"train_loss": -7.6126933097839355, "global_step": 29740, "epoch": 177} {"train_loss": -7.276519775390625, "global_step": 29741, "epoch": 177} {"train_loss": -7.450543403625488, "global_step": 29742, "epoch": 177} {"train_loss": -7.552614688873291, "global_step": 29743, "epoch": 177} {"train_loss": -7.595121383666992, "global_step": 29744, "epoch": 177} {"train_loss": -7.284761428833008, "global_step": 29745, "epoch": 177} {"train_loss": -7.408271312713623, "global_step": 29746, "epoch": 177} {"train_loss": -7.472527980804443, "global_step": 29747, "epoch": 177} {"train_loss": -7.4395294189453125, "global_step": 29748, "epoch": 177} {"train_loss": -7.5355329513549805, "global_step": 29749, "epoch": 177} {"train_loss": -7.487089157104492, "global_step": 29750, "epoch": 177} {"train_loss": -7.3299689292907715, "global_step": 29751, "epoch": 177} {"train_loss": -7.532418251037598, "global_step": 29752, "epoch": 177} {"train_loss": -7.434549808502197, "global_step": 29753, "epoch": 177} {"train_loss": -7.610177040100098, "global_step": 29754, "epoch": 177} {"train_loss": -7.282838821411133, "global_step": 29755, "epoch": 177} {"train_loss": -7.420745849609375, "global_step": 29756, "epoch": 177} {"train_loss": -7.441642761230469, "global_step": 29757, "epoch": 177} {"train_loss": -7.648104667663574, "global_step": 29758, "epoch": 177} {"train_loss": -7.416239261627197, "global_step": 29759, "epoch": 177} {"train_loss": -7.562439918518066, "global_step": 29760, "epoch": 177} {"train_loss": -7.361706256866455, "global_step": 29761, "epoch": 177} {"train_loss": -7.471960067749023, "global_step": 29762, "epoch": 177} {"train_loss": -7.403356552124023, "global_step": 29763, "epoch": 177} {"train_loss": -7.567197799682617, "global_step": 29764, "epoch": 177} {"train_loss": -7.789086818695068, "global_step": 29765, "epoch": 177} {"train_loss": -7.505398273468018, "global_step": 29766, "epoch": 177} {"train_loss": -7.576303482055664, "global_step": 29767, "epoch": 177} {"train_loss": -7.360469818115234, "global_step": 29768, "epoch": 177} {"train_loss": -7.788884162902832, "global_step": 29769, "epoch": 177} {"train_loss": -7.504134178161621, "global_step": 29770, "epoch": 177} {"train_loss": -7.681922912597656, "global_step": 29771, "epoch": 177} {"train_loss": -7.19249963760376, "global_step": 29772, "epoch": 177} {"train_loss": -7.509244441986084, "global_step": 29773, "epoch": 177} {"train_loss": -7.553343772888184, "global_step": 29774, "epoch": 177} {"train_loss": -7.440605163574219, "global_step": 29775, "epoch": 177} {"train_loss": -7.747339248657227, "global_step": 29776, "epoch": 177} {"train_loss": -7.256728172302246, "global_step": 29777, "epoch": 177} {"train_loss": -7.246870994567871, "global_step": 29778, "epoch": 177} {"train_loss": -7.386109828948975, "global_step": 29779, "epoch": 177} {"train_loss": -7.569225311279297, "global_step": 29780, "epoch": 177} {"train_loss": -7.4345703125, "global_step": 29781, "epoch": 177} {"train_loss": -7.378746032714844, "global_step": 29782, "epoch": 177} {"train_loss": -7.551326751708984, "global_step": 29783, "epoch": 177} {"train_loss": -7.506914138793945, "global_step": 29784, "epoch": 177} {"train_loss": -7.472872257232666, "global_step": 29785, "epoch": 177} {"train_loss": -7.494015216827393, "global_step": 29786, "epoch": 177} {"train_loss": -7.559709548950195, "global_step": 29787, "epoch": 177} {"train_loss": -7.588982105255127, "global_step": 29788, "epoch": 177} {"train_loss": -7.726874351501465, "global_step": 29789, "epoch": 177} {"train_loss": -7.526663303375244, "global_step": 29790, "epoch": 177} {"train_loss": -7.560800552368164, "global_step": 29791, "epoch": 177} {"train_loss": -7.180305480957031, "global_step": 29792, "epoch": 177} {"train_loss": -7.47272253036499, "global_step": 29793, "epoch": 177} {"train_loss": -7.370641708374023, "global_step": 29794, "epoch": 177} {"train_loss": -7.088484764099121, "global_step": 29795, "epoch": 177} {"train_loss": -7.488035202026367, "global_step": 29796, "epoch": 177} {"train_loss": -7.328697681427002, "global_step": 29797, "epoch": 177} {"train_loss": -7.418435096740723, "global_step": 29798, "epoch": 177} {"train_loss": -7.310065269470215, "global_step": 29799, "epoch": 177} {"train_loss": -7.493901252746582, "global_step": 29800, "epoch": 177} {"train_loss": -7.435858726501465, "global_step": 29801, "epoch": 177} {"train_loss": -7.399325370788574, "global_step": 29802, "epoch": 177} {"train_loss": -7.2867112159729, "global_step": 29803, "epoch": 177} {"train_loss": -7.449196815490723, "global_step": 29804, "epoch": 177} {"train_loss": -7.3173089027404785, "global_step": 29805, "epoch": 177} {"train_loss": -7.187245845794678, "global_step": 29806, "epoch": 177} {"train_loss": -7.309377670288086, "global_step": 29807, "epoch": 177} {"train_loss": -7.379932403564453, "global_step": 29808, "epoch": 177} {"train_loss": -7.390782833099365, "global_step": 29809, "epoch": 177} {"train_loss": -7.530385494232178, "global_step": 29810, "epoch": 177} {"train_loss": -7.636277675628662, "global_step": 29811, "epoch": 177} {"train_loss": -7.351743221282959, "global_step": 29812, "epoch": 177} {"train_loss": -7.501142501831055, "global_step": 29813, "epoch": 177} {"train_loss": -7.345444202423096, "global_step": 29814, "epoch": 177} {"train_loss": -7.429234981536865, "global_step": 29815, "epoch": 177} {"train_loss": -7.469915390014648, "global_step": 29816, "epoch": 177} {"train_loss": -7.445441722869873, "global_step": 29817, "epoch": 177} {"train_loss": -7.514413833618164, "global_step": 29818, "epoch": 177} {"train_loss": -7.398800849914551, "global_step": 29819, "epoch": 177} {"train_loss": -7.420328140258789, "global_step": 29820, "epoch": 177} {"train_loss": -7.626028060913086, "global_step": 29821, "epoch": 177} {"train_loss": -7.4054036140441895, "global_step": 29822, "epoch": 177} {"train_loss": -7.452815055847168, "global_step": 29823, "epoch": 177} {"train_loss": -7.777146339416504, "global_step": 29824, "epoch": 177} {"train_loss": -7.756237030029297, "global_step": 29825, "epoch": 177} {"train_loss": -7.597631454467773, "global_step": 29826, "epoch": 177} {"train_loss": -7.764634132385254, "global_step": 29827, "epoch": 177} {"train_loss": -7.4238996505737305, "global_step": 29828, "epoch": 177} {"train_loss": -7.266922950744629, "global_step": 29829, "epoch": 177} {"train_loss": -7.215334892272949, "global_step": 29830, "epoch": 177} {"train_loss": -7.483731269836426, "global_step": 29831, "epoch": 177} {"train_loss": -6.763617515563965, "global_step": 29832, "epoch": 177} {"train_loss": -7.395298957824707, "global_step": 29833, "epoch": 177} {"train_loss": -7.101857662200928, "global_step": 29834, "epoch": 177} {"train_loss": -7.2552876472473145, "global_step": 29835, "epoch": 177} {"train_loss": -7.095758438110352, "global_step": 29836, "epoch": 177} {"train_loss": -7.440668106079102, "global_step": 29837, "epoch": 177} {"train_loss": -7.072656631469727, "global_step": 29838, "epoch": 177} {"train_loss": -7.077528476715088, "global_step": 29839, "epoch": 177} {"train_loss": -7.205853462219238, "global_step": 29840, "epoch": 177} {"train_loss": -7.148490905761719, "global_step": 29841, "epoch": 177} {"train_loss": -7.490381240844727, "global_step": 29842, "epoch": 177} {"train_loss": -7.072441101074219, "global_step": 29843, "epoch": 177} {"train_loss": -7.045733451843262, "global_step": 29844, "epoch": 177} {"train_loss": -7.42917013168335, "global_step": 29845, "epoch": 177} {"train_loss": -7.207371711730957, "global_step": 29846, "epoch": 177} {"train_loss": -7.252023696899414, "global_step": 29847, "epoch": 177} {"train_loss": -7.276273250579834, "global_step": 29848, "epoch": 177} {"train_loss": -7.373388290405273, "global_step": 29849, "epoch": 177} {"train_loss": -7.232643127441406, "global_step": 29850, "epoch": 177} {"train_loss": -7.427209854125977, "global_step": 29851, "epoch": 177} {"train_loss": -7.507804870605469, "global_step": 29852, "epoch": 177} {"train_loss": -7.470863342285156, "global_step": 29853, "epoch": 177} {"train_loss": -7.448772430419922, "global_step": 29854, "epoch": 177} {"train_loss": -7.5110368728637695, "global_step": 29855, "epoch": 177} {"train_loss": -7.401586055755615, "global_step": 29856, "epoch": 177} {"train_loss": -7.380926132202148, "global_step": 29857, "epoch": 177} {"train_loss": -7.56654167175293, "global_step": 29858, "epoch": 177} {"train_loss": -7.211718559265137, "global_step": 29859, "epoch": 177} {"train_loss": -7.447960376739502, "global_step": 29860, "epoch": 177} {"train_loss": -7.663850784301758, "global_step": 29861, "epoch": 177} {"train_loss": -7.534687042236328, "global_step": 29862, "epoch": 177} {"train_loss": -7.391287803649902, "global_step": 29863, "epoch": 177} {"train_loss": -7.511725902557373, "global_step": 29864, "epoch": 177} {"train_loss": -7.6181840896606445, "global_step": 29865, "epoch": 177} {"train_loss": -7.401815414428711, "global_step": 29866, "epoch": 177} {"train_loss": -7.567030429840088, "global_step": 29867, "epoch": 177} {"train_loss": -7.354364395141602, "global_step": 29868, "epoch": 177} {"train_loss": -7.545557975769043, "global_step": 29869, "epoch": 177} {"train_loss": -7.3767194747924805, "global_step": 29870, "epoch": 177} {"train_loss": -7.120743751525879, "global_step": 29871, "epoch": 177} {"train_loss": -7.4322428703308105, "global_step": 29872, "epoch": 177} {"train_loss": -7.204809188842773, "global_step": 29873, "epoch": 177} {"train_loss": -7.446377277374268, "global_step": 29874, "epoch": 177} {"train_loss": -7.376606464385986, "global_step": 29875, "epoch": 177} {"train_loss": -7.3994646072387695, "global_step": 29876, "epoch": 177} {"train_loss": -7.006189823150635, "global_step": 29877, "epoch": 177} {"train_loss": -7.538429260253906, "global_step": 29878, "epoch": 177} {"train_loss": -7.378421783447266, "global_step": 29879, "epoch": 177} {"train_loss": -7.254673957824707, "global_step": 29880, "epoch": 177} {"train_loss": -7.296425819396973, "global_step": 29881, "epoch": 177} {"train_loss": -7.119287014007568, "global_step": 29882, "epoch": 177} {"train_loss": -7.524030685424805, "global_step": 29883, "epoch": 177} {"train_loss": -7.2610344886779785, "global_step": 29884, "epoch": 177} {"train_loss": -7.408602714538574, "global_step": 29885, "epoch": 177} {"train_loss": -7.4438018798828125, "global_step": 29886, "epoch": 177} {"train_loss": -7.295504093170166, "global_step": 29887, "epoch": 177} {"train_loss": -7.433669090270996, "global_step": 29888, "epoch": 177} {"train_loss": -7.3338727951049805, "global_step": 29889, "epoch": 177} {"train_loss": -7.003300666809082, "global_step": 29890, "epoch": 177} {"train_loss": -7.191746711730957, "global_step": 29891, "epoch": 177} {"train_loss": -7.423192024230957, "global_step": 29892, "epoch": 177} {"train_loss": -7.090751647949219, "global_step": 29893, "epoch": 177} {"train_loss": -7.256112098693848, "global_step": 29894, "epoch": 177} {"train_loss": -7.6033782958984375, "global_step": 29895, "epoch": 177} {"train_loss": -7.520075798034668, "global_step": 29896, "epoch": 177} {"train_loss": -7.4136152267456055, "global_step": 29897, "epoch": 177} {"train_loss": -7.298480987548828, "global_step": 29898, "epoch": 177} {"train_loss": -7.5291290283203125, "global_step": 29899, "epoch": 177} {"train_loss": -7.301115036010742, "global_step": 29900, "epoch": 177} {"train_loss": -7.313665390014648, "global_step": 29901, "epoch": 177} {"train_loss": -7.520301818847656, "global_step": 29902, "epoch": 177} {"train_loss": -7.405718823273976, "global_step": 29903, "epoch": 177, "val_loss": 190466.546875} {"train_loss": -7.437129497528076, "global_step": 29904, "epoch": 178} {"train_loss": -7.462597370147705, "global_step": 29905, "epoch": 178} {"train_loss": -7.208115577697754, "global_step": 29906, "epoch": 178} {"train_loss": -7.459395408630371, "global_step": 29907, "epoch": 178} {"train_loss": -7.093951225280762, "global_step": 29908, "epoch": 178} {"train_loss": -6.9713287353515625, "global_step": 29909, "epoch": 178} {"train_loss": -7.367106914520264, "global_step": 29910, "epoch": 178} {"train_loss": -6.8835673332214355, "global_step": 29911, "epoch": 178} {"train_loss": -7.0037384033203125, "global_step": 29912, "epoch": 178} {"train_loss": -7.087221145629883, "global_step": 29913, "epoch": 178} {"train_loss": -7.145780563354492, "global_step": 29914, "epoch": 178} {"train_loss": -7.0836310386657715, "global_step": 29915, "epoch": 178} {"train_loss": -7.181085586547852, "global_step": 29916, "epoch": 178} {"train_loss": -7.324924468994141, "global_step": 29917, "epoch": 178} {"train_loss": -7.334200859069824, "global_step": 29918, "epoch": 178} {"train_loss": -7.107178211212158, "global_step": 29919, "epoch": 178} {"train_loss": -7.1184916496276855, "global_step": 29920, "epoch": 178} {"train_loss": -7.377922058105469, "global_step": 29921, "epoch": 178} {"train_loss": -6.994982719421387, "global_step": 29922, "epoch": 178} {"train_loss": -7.327234745025635, "global_step": 29923, "epoch": 178} {"train_loss": -7.140220642089844, "global_step": 29924, "epoch": 178} {"train_loss": -7.2252326011657715, "global_step": 29925, "epoch": 178} {"train_loss": -7.424417495727539, "global_step": 29926, "epoch": 178} {"train_loss": -7.119285583496094, "global_step": 29927, "epoch": 178} {"train_loss": -7.218843460083008, "global_step": 29928, "epoch": 178} {"train_loss": -7.459753036499023, "global_step": 29929, "epoch": 178} {"train_loss": -7.402525424957275, "global_step": 29930, "epoch": 178} {"train_loss": -7.063357353210449, "global_step": 29931, "epoch": 178} {"train_loss": -7.414852619171143, "global_step": 29932, "epoch": 178} {"train_loss": -7.108076572418213, "global_step": 29933, "epoch": 178} {"train_loss": -7.015096664428711, "global_step": 29934, "epoch": 178} {"train_loss": -7.38770055770874, "global_step": 29935, "epoch": 178} {"train_loss": -7.490026473999023, "global_step": 29936, "epoch": 178} {"train_loss": -7.4465203285217285, "global_step": 29937, "epoch": 178} {"train_loss": -7.203483581542969, "global_step": 29938, "epoch": 178} {"train_loss": -7.37442684173584, "global_step": 29939, "epoch": 178} {"train_loss": -7.3771586418151855, "global_step": 29940, "epoch": 178} {"train_loss": -7.033626079559326, "global_step": 29941, "epoch": 178} {"train_loss": -7.288970947265625, "global_step": 29942, "epoch": 178} {"train_loss": -7.417436599731445, "global_step": 29943, "epoch": 178} {"train_loss": -7.239482879638672, "global_step": 29944, "epoch": 178} {"train_loss": -7.214670181274414, "global_step": 29945, "epoch": 178} {"train_loss": -7.264406204223633, "global_step": 29946, "epoch": 178} {"train_loss": -7.3760600090026855, "global_step": 29947, "epoch": 178} {"train_loss": -7.199207305908203, "global_step": 29948, "epoch": 178} {"train_loss": -7.333952903747559, "global_step": 29949, "epoch": 178} {"train_loss": -7.400204181671143, "global_step": 29950, "epoch": 178} {"train_loss": -7.467569351196289, "global_step": 29951, "epoch": 178} {"train_loss": -7.500201225280762, "global_step": 29952, "epoch": 178} {"train_loss": -7.422117233276367, "global_step": 29953, "epoch": 178} {"train_loss": -7.202066421508789, "global_step": 29954, "epoch": 178} {"train_loss": -7.405930519104004, "global_step": 29955, "epoch": 178} {"train_loss": -7.405743598937988, "global_step": 29956, "epoch": 178} {"train_loss": -7.611672401428223, "global_step": 29957, "epoch": 178} {"train_loss": -7.333553791046143, "global_step": 29958, "epoch": 178} {"train_loss": -7.49824857711792, "global_step": 29959, "epoch": 178} {"train_loss": -7.450160980224609, "global_step": 29960, "epoch": 178} {"train_loss": -7.291449069976807, "global_step": 29961, "epoch": 178} {"train_loss": -7.41574239730835, "global_step": 29962, "epoch": 178} {"train_loss": -7.6466264724731445, "global_step": 29963, "epoch": 178} {"train_loss": -7.335347652435303, "global_step": 29964, "epoch": 178} {"train_loss": -7.4637556076049805, "global_step": 29965, "epoch": 178} {"train_loss": -7.602364540100098, "global_step": 29966, "epoch": 178} {"train_loss": -7.5578718185424805, "global_step": 29967, "epoch": 178} {"train_loss": -7.554081916809082, "global_step": 29968, "epoch": 178} {"train_loss": -7.376347064971924, "global_step": 29969, "epoch": 178} {"train_loss": -7.6827497482299805, "global_step": 29970, "epoch": 178} {"train_loss": -7.325243949890137, "global_step": 29971, "epoch": 178} {"train_loss": -7.442354679107666, "global_step": 29972, "epoch": 178} {"train_loss": -7.696470737457275, "global_step": 29973, "epoch": 178} {"train_loss": -7.508444786071777, "global_step": 29974, "epoch": 178} {"train_loss": -7.478825092315674, "global_step": 29975, "epoch": 178} {"train_loss": -7.344845294952393, "global_step": 29976, "epoch": 178} {"train_loss": -7.709634780883789, "global_step": 29977, "epoch": 178} {"train_loss": -7.5168962478637695, "global_step": 29978, "epoch": 178} {"train_loss": -7.771150588989258, "global_step": 29979, "epoch": 178} {"train_loss": -7.4819536209106445, "global_step": 29980, "epoch": 178} {"train_loss": -7.610074996948242, "global_step": 29981, "epoch": 178} {"train_loss": -7.500199317932129, "global_step": 29982, "epoch": 178} {"train_loss": -7.746114730834961, "global_step": 29983, "epoch": 178} {"train_loss": -7.388246059417725, "global_step": 29984, "epoch": 178} {"train_loss": -7.502192497253418, "global_step": 29985, "epoch": 178} {"train_loss": -7.613757133483887, "global_step": 29986, "epoch": 178} {"train_loss": -7.406683921813965, "global_step": 29987, "epoch": 178} {"train_loss": -7.185809135437012, "global_step": 29988, "epoch": 178} {"train_loss": -7.558864593505859, "global_step": 29989, "epoch": 178} {"train_loss": -7.520053386688232, "global_step": 29990, "epoch": 178} {"train_loss": -7.782387733459473, "global_step": 29991, "epoch": 178} {"train_loss": -7.535486698150635, "global_step": 29992, "epoch": 178} {"train_loss": -7.469233512878418, "global_step": 29993, "epoch": 178} {"train_loss": -7.287375450134277, "global_step": 29994, "epoch": 178} {"train_loss": -7.472448348999023, "global_step": 29995, "epoch": 178} {"train_loss": -7.340169906616211, "global_step": 29996, "epoch": 178} {"train_loss": -7.645895957946777, "global_step": 29997, "epoch": 178} {"train_loss": -7.541374206542969, "global_step": 29998, "epoch": 178} {"train_loss": -7.349488735198975, "global_step": 29999, "epoch": 178} {"train_loss": -7.342230319976807, "global_step": 30000, "epoch": 178} {"train_loss": -7.409212589263916, "global_step": 30001, "epoch": 178} {"train_loss": -7.341495513916016, "global_step": 30002, "epoch": 178} {"train_loss": -7.628289222717285, "global_step": 30003, "epoch": 178} {"train_loss": -7.491940975189209, "global_step": 30004, "epoch": 178} {"train_loss": -7.59945011138916, "global_step": 30005, "epoch": 178} {"train_loss": -7.365811347961426, "global_step": 30006, "epoch": 178} {"train_loss": -7.588204860687256, "global_step": 30007, "epoch": 178} {"train_loss": -7.530479431152344, "global_step": 30008, "epoch": 178} {"train_loss": -7.330575942993164, "global_step": 30009, "epoch": 178} {"train_loss": -7.5960917472839355, "global_step": 30010, "epoch": 178} {"train_loss": -7.405189514160156, "global_step": 30011, "epoch": 178} {"train_loss": -7.659759521484375, "global_step": 30012, "epoch": 178} {"train_loss": -7.331223011016846, "global_step": 30013, "epoch": 178} {"train_loss": -7.505257606506348, "global_step": 30014, "epoch": 178} {"train_loss": -7.6984663009643555, "global_step": 30015, "epoch": 178} {"train_loss": -7.612264633178711, "global_step": 30016, "epoch": 178} {"train_loss": -7.5322723388671875, "global_step": 30017, "epoch": 178} {"train_loss": -7.57172966003418, "global_step": 30018, "epoch": 178} {"train_loss": -7.538812637329102, "global_step": 30019, "epoch": 178} {"train_loss": -7.53780460357666, "global_step": 30020, "epoch": 178} {"train_loss": -7.587581634521484, "global_step": 30021, "epoch": 178} {"train_loss": -7.540637969970703, "global_step": 30022, "epoch": 178} {"train_loss": -7.557556629180908, "global_step": 30023, "epoch": 178} {"train_loss": -7.538148403167725, "global_step": 30024, "epoch": 178} {"train_loss": -7.284444808959961, "global_step": 30025, "epoch": 178} {"train_loss": -7.388772964477539, "global_step": 30026, "epoch": 178} {"train_loss": -7.2461442947387695, "global_step": 30027, "epoch": 178} {"train_loss": -7.537856101989746, "global_step": 30028, "epoch": 178} {"train_loss": -7.32443904876709, "global_step": 30029, "epoch": 178} {"train_loss": -6.9805731773376465, "global_step": 30030, "epoch": 178} {"train_loss": -7.440598011016846, "global_step": 30031, "epoch": 178} {"train_loss": -7.48869514465332, "global_step": 30032, "epoch": 178} {"train_loss": -7.7409772872924805, "global_step": 30033, "epoch": 178} {"train_loss": -7.461106777191162, "global_step": 30034, "epoch": 178} {"train_loss": -7.4390974044799805, "global_step": 30035, "epoch": 178} {"train_loss": -7.549531936645508, "global_step": 30036, "epoch": 178} {"train_loss": -7.45279598236084, "global_step": 30037, "epoch": 178} {"train_loss": -7.236567497253418, "global_step": 30038, "epoch": 178} {"train_loss": -7.4841718673706055, "global_step": 30039, "epoch": 178} {"train_loss": -7.42195987701416, "global_step": 30040, "epoch": 178} {"train_loss": -7.458846092224121, "global_step": 30041, "epoch": 178} {"train_loss": -7.630645751953125, "global_step": 30042, "epoch": 178} {"train_loss": -7.529924392700195, "global_step": 30043, "epoch": 178} {"train_loss": -7.490300178527832, "global_step": 30044, "epoch": 178} {"train_loss": -7.5297698974609375, "global_step": 30045, "epoch": 178} {"train_loss": -7.258792877197266, "global_step": 30046, "epoch": 178} {"train_loss": -7.47675895690918, "global_step": 30047, "epoch": 178} {"train_loss": -7.6632304191589355, "global_step": 30048, "epoch": 178} {"train_loss": -7.547913074493408, "global_step": 30049, "epoch": 178} {"train_loss": -7.404585361480713, "global_step": 30050, "epoch": 178} {"train_loss": -7.553275108337402, "global_step": 30051, "epoch": 178} {"train_loss": -7.572869300842285, "global_step": 30052, "epoch": 178} {"train_loss": -7.425498008728027, "global_step": 30053, "epoch": 178} {"train_loss": -7.6278533935546875, "global_step": 30054, "epoch": 178} {"train_loss": -7.334743022918701, "global_step": 30055, "epoch": 178} {"train_loss": -7.53375244140625, "global_step": 30056, "epoch": 178} {"train_loss": -7.238424777984619, "global_step": 30057, "epoch": 178} {"train_loss": -7.593910217285156, "global_step": 30058, "epoch": 178} {"train_loss": -7.612642288208008, "global_step": 30059, "epoch": 178} {"train_loss": -7.5857744216918945, "global_step": 30060, "epoch": 178} {"train_loss": -7.5548248291015625, "global_step": 30061, "epoch": 178} {"train_loss": -7.536373138427734, "global_step": 30062, "epoch": 178} {"train_loss": -7.333282470703125, "global_step": 30063, "epoch": 178} {"train_loss": -7.231663703918457, "global_step": 30064, "epoch": 178} {"train_loss": -7.401866912841797, "global_step": 30065, "epoch": 178} {"train_loss": -7.162253379821777, "global_step": 30066, "epoch": 178} {"train_loss": -7.3659892082214355, "global_step": 30067, "epoch": 178} {"train_loss": -7.396210670471191, "global_step": 30068, "epoch": 178} {"train_loss": -7.386160373687744, "global_step": 30069, "epoch": 178} {"train_loss": -7.385103225708008, "global_step": 30070, "epoch": 178} {"train_loss": -7.410043424084073, "global_step": 30071, "epoch": 178, "val_loss": 187813.046875} {"train_loss": -7.4495038986206055, "global_step": 30072, "epoch": 179} {"train_loss": -7.3996171951293945, "global_step": 30073, "epoch": 179} {"train_loss": -7.3824872970581055, "global_step": 30074, "epoch": 179} {"train_loss": -7.454643249511719, "global_step": 30075, "epoch": 179} {"train_loss": -7.449730396270752, "global_step": 30076, "epoch": 179} {"train_loss": -7.460598468780518, "global_step": 30077, "epoch": 179} {"train_loss": -7.235019683837891, "global_step": 30078, "epoch": 179} {"train_loss": -7.539018154144287, "global_step": 30079, "epoch": 179} {"train_loss": -7.509804725646973, "global_step": 30080, "epoch": 179} {"train_loss": -7.327025890350342, "global_step": 30081, "epoch": 179} {"train_loss": -7.23482608795166, "global_step": 30082, "epoch": 179} {"train_loss": -7.545310020446777, "global_step": 30083, "epoch": 179} {"train_loss": -7.23400354385376, "global_step": 30084, "epoch": 179} {"train_loss": -7.612345218658447, "global_step": 30085, "epoch": 179} {"train_loss": -7.489336967468262, "global_step": 30086, "epoch": 179} {"train_loss": -7.396453857421875, "global_step": 30087, "epoch": 179} {"train_loss": -7.433088302612305, "global_step": 30088, "epoch": 179} {"train_loss": -7.465143203735352, "global_step": 30089, "epoch": 179} {"train_loss": -7.331607818603516, "global_step": 30090, "epoch": 179} {"train_loss": -7.443131446838379, "global_step": 30091, "epoch": 179} {"train_loss": -7.583249568939209, "global_step": 30092, "epoch": 179} {"train_loss": -7.308638572692871, "global_step": 30093, "epoch": 179} {"train_loss": -7.48994255065918, "global_step": 30094, "epoch": 179} {"train_loss": -7.252215385437012, "global_step": 30095, "epoch": 179} {"train_loss": -7.5473480224609375, "global_step": 30096, "epoch": 179} {"train_loss": -7.592905044555664, "global_step": 30097, "epoch": 179} {"train_loss": -7.64515495300293, "global_step": 30098, "epoch": 179} {"train_loss": -7.4845709800720215, "global_step": 30099, "epoch": 179} {"train_loss": -7.470798492431641, "global_step": 30100, "epoch": 179} {"train_loss": -7.262660980224609, "global_step": 30101, "epoch": 179} {"train_loss": -7.448182106018066, "global_step": 30102, "epoch": 179} {"train_loss": -7.407313823699951, "global_step": 30103, "epoch": 179} {"train_loss": -7.498229503631592, "global_step": 30104, "epoch": 179} {"train_loss": -7.298189163208008, "global_step": 30105, "epoch": 179} {"train_loss": -7.587244987487793, "global_step": 30106, "epoch": 179} {"train_loss": -7.750169277191162, "global_step": 30107, "epoch": 179} {"train_loss": -7.508337020874023, "global_step": 30108, "epoch": 179} {"train_loss": -7.5057477951049805, "global_step": 30109, "epoch": 179} {"train_loss": -7.513223648071289, "global_step": 30110, "epoch": 179} {"train_loss": -7.509006023406982, "global_step": 30111, "epoch": 179} {"train_loss": -7.37545108795166, "global_step": 30112, "epoch": 179} {"train_loss": -7.500042915344238, "global_step": 30113, "epoch": 179} {"train_loss": -7.492659568786621, "global_step": 30114, "epoch": 179} {"train_loss": -7.478814601898193, "global_step": 30115, "epoch": 179} {"train_loss": -7.138093948364258, "global_step": 30116, "epoch": 179} {"train_loss": -7.617745399475098, "global_step": 30117, "epoch": 179} {"train_loss": -7.564544677734375, "global_step": 30118, "epoch": 179} {"train_loss": -7.638849258422852, "global_step": 30119, "epoch": 179} {"train_loss": -7.580156326293945, "global_step": 30120, "epoch": 179} {"train_loss": -7.488309860229492, "global_step": 30121, "epoch": 179} {"train_loss": -7.344429969787598, "global_step": 30122, "epoch": 179} {"train_loss": -7.50471830368042, "global_step": 30123, "epoch": 179} {"train_loss": -7.529116630554199, "global_step": 30124, "epoch": 179} {"train_loss": -7.35493278503418, "global_step": 30125, "epoch": 179} {"train_loss": -7.462548732757568, "global_step": 30126, "epoch": 179} {"train_loss": -7.4973344802856445, "global_step": 30127, "epoch": 179} {"train_loss": -7.676689624786377, "global_step": 30128, "epoch": 179} {"train_loss": -7.335711479187012, "global_step": 30129, "epoch": 179} {"train_loss": -7.4563188552856445, "global_step": 30130, "epoch": 179} {"train_loss": -7.45590877532959, "global_step": 30131, "epoch": 179} {"train_loss": -7.422471523284912, "global_step": 30132, "epoch": 179} {"train_loss": -7.240597248077393, "global_step": 30133, "epoch": 179} {"train_loss": -7.394388198852539, "global_step": 30134, "epoch": 179} {"train_loss": -7.2704057693481445, "global_step": 30135, "epoch": 179} {"train_loss": -7.3947858810424805, "global_step": 30136, "epoch": 179} {"train_loss": -7.389660835266113, "global_step": 30137, "epoch": 179} {"train_loss": -7.144413471221924, "global_step": 30138, "epoch": 179} {"train_loss": -7.510757923126221, "global_step": 30139, "epoch": 179} {"train_loss": -7.165809154510498, "global_step": 30140, "epoch": 179} {"train_loss": -7.453814506530762, "global_step": 30141, "epoch": 179} {"train_loss": -7.344194412231445, "global_step": 30142, "epoch": 179} {"train_loss": -7.542225360870361, "global_step": 30143, "epoch": 179} {"train_loss": -7.416867256164551, "global_step": 30144, "epoch": 179} {"train_loss": -7.208090782165527, "global_step": 30145, "epoch": 179} {"train_loss": -7.485136032104492, "global_step": 30146, "epoch": 179} {"train_loss": -7.336746692657471, "global_step": 30147, "epoch": 179} {"train_loss": -7.4051618576049805, "global_step": 30148, "epoch": 179} {"train_loss": -7.559709072113037, "global_step": 30149, "epoch": 179} {"train_loss": -7.545874118804932, "global_step": 30150, "epoch": 179} {"train_loss": -7.528043270111084, "global_step": 30151, "epoch": 179} {"train_loss": -7.516373157501221, "global_step": 30152, "epoch": 179} {"train_loss": -7.468227386474609, "global_step": 30153, "epoch": 179} {"train_loss": -7.299114227294922, "global_step": 30154, "epoch": 179} {"train_loss": -7.45436954498291, "global_step": 30155, "epoch": 179} {"train_loss": -7.433751583099365, "global_step": 30156, "epoch": 179} {"train_loss": -7.462953567504883, "global_step": 30157, "epoch": 179} {"train_loss": -7.37063455581665, "global_step": 30158, "epoch": 179} {"train_loss": -7.609076499938965, "global_step": 30159, "epoch": 179} {"train_loss": -7.440545082092285, "global_step": 30160, "epoch": 179} {"train_loss": -7.604242324829102, "global_step": 30161, "epoch": 179} {"train_loss": -7.4607672691345215, "global_step": 30162, "epoch": 179} {"train_loss": -7.47041130065918, "global_step": 30163, "epoch": 179} {"train_loss": -7.463705062866211, "global_step": 30164, "epoch": 179} {"train_loss": -7.349377155303955, "global_step": 30165, "epoch": 179} {"train_loss": -7.50221061706543, "global_step": 30166, "epoch": 179} {"train_loss": -7.567710876464844, "global_step": 30167, "epoch": 179} {"train_loss": -7.561609268188477, "global_step": 30168, "epoch": 179} {"train_loss": -7.577768325805664, "global_step": 30169, "epoch": 179} {"train_loss": -7.239776611328125, "global_step": 30170, "epoch": 179} {"train_loss": -7.4410600662231445, "global_step": 30171, "epoch": 179} {"train_loss": -7.370029449462891, "global_step": 30172, "epoch": 179} {"train_loss": -7.453444957733154, "global_step": 30173, "epoch": 179} {"train_loss": -7.188978672027588, "global_step": 30174, "epoch": 179} {"train_loss": -7.603316307067871, "global_step": 30175, "epoch": 179} {"train_loss": -7.394251346588135, "global_step": 30176, "epoch": 179} {"train_loss": -7.353567123413086, "global_step": 30177, "epoch": 179} {"train_loss": -7.328259468078613, "global_step": 30178, "epoch": 179} {"train_loss": -7.150973320007324, "global_step": 30179, "epoch": 179} {"train_loss": -7.399880409240723, "global_step": 30180, "epoch": 179} {"train_loss": -7.518130302429199, "global_step": 30181, "epoch": 179} {"train_loss": -7.470040321350098, "global_step": 30182, "epoch": 179} {"train_loss": -7.346681118011475, "global_step": 30183, "epoch": 179} {"train_loss": -7.5725603103637695, "global_step": 30184, "epoch": 179} {"train_loss": -7.416346549987793, "global_step": 30185, "epoch": 179} {"train_loss": -7.571013927459717, "global_step": 30186, "epoch": 179} {"train_loss": -7.500517845153809, "global_step": 30187, "epoch": 179} {"train_loss": -7.393557548522949, "global_step": 30188, "epoch": 179} {"train_loss": -7.628666877746582, "global_step": 30189, "epoch": 179} {"train_loss": -7.404630184173584, "global_step": 30190, "epoch": 179} {"train_loss": -7.730257511138916, "global_step": 30191, "epoch": 179} {"train_loss": -7.499048233032227, "global_step": 30192, "epoch": 179} {"train_loss": -7.4364166259765625, "global_step": 30193, "epoch": 179} {"train_loss": -7.450868606567383, "global_step": 30194, "epoch": 179} {"train_loss": -7.545846939086914, "global_step": 30195, "epoch": 179} {"train_loss": -7.283405780792236, "global_step": 30196, "epoch": 179} {"train_loss": -7.632094383239746, "global_step": 30197, "epoch": 179} {"train_loss": -7.700617790222168, "global_step": 30198, "epoch": 179} {"train_loss": -7.524602890014648, "global_step": 30199, "epoch": 179} {"train_loss": -7.596136093139648, "global_step": 30200, "epoch": 179} {"train_loss": -7.627852916717529, "global_step": 30201, "epoch": 179} {"train_loss": -7.618846893310547, "global_step": 30202, "epoch": 179} {"train_loss": -7.464913368225098, "global_step": 30203, "epoch": 179} {"train_loss": -7.786707401275635, "global_step": 30204, "epoch": 179} {"train_loss": -7.315359115600586, "global_step": 30205, "epoch": 179} {"train_loss": -7.44101619720459, "global_step": 30206, "epoch": 179} {"train_loss": -7.740747928619385, "global_step": 30207, "epoch": 179} {"train_loss": -7.681051254272461, "global_step": 30208, "epoch": 179} {"train_loss": -7.581080436706543, "global_step": 30209, "epoch": 179} {"train_loss": -7.362771987915039, "global_step": 30210, "epoch": 179} {"train_loss": -7.665125370025635, "global_step": 30211, "epoch": 179} {"train_loss": -7.412120342254639, "global_step": 30212, "epoch": 179} {"train_loss": -7.397355079650879, "global_step": 30213, "epoch": 179} {"train_loss": -7.490860939025879, "global_step": 30214, "epoch": 179} {"train_loss": -7.531513690948486, "global_step": 30215, "epoch": 179} {"train_loss": -7.315907001495361, "global_step": 30216, "epoch": 179} {"train_loss": -7.74329948425293, "global_step": 30217, "epoch": 179} {"train_loss": -7.379518508911133, "global_step": 30218, "epoch": 179} {"train_loss": -7.311906337738037, "global_step": 30219, "epoch": 179} {"train_loss": -7.460709571838379, "global_step": 30220, "epoch": 179} {"train_loss": -7.227134704589844, "global_step": 30221, "epoch": 179} {"train_loss": -7.643387317657471, "global_step": 30222, "epoch": 179} {"train_loss": -7.2803544998168945, "global_step": 30223, "epoch": 179} {"train_loss": -7.452942371368408, "global_step": 30224, "epoch": 179} {"train_loss": -7.47346305847168, "global_step": 30225, "epoch": 179} {"train_loss": -7.1268205642700195, "global_step": 30226, "epoch": 179} {"train_loss": -7.538919448852539, "global_step": 30227, "epoch": 179} {"train_loss": -7.406498432159424, "global_step": 30228, "epoch": 179} {"train_loss": -7.562409400939941, "global_step": 30229, "epoch": 179} {"train_loss": -7.680114269256592, "global_step": 30230, "epoch": 179} {"train_loss": -7.459339141845703, "global_step": 30231, "epoch": 179} {"train_loss": -7.518426895141602, "global_step": 30232, "epoch": 179} {"train_loss": -7.500576972961426, "global_step": 30233, "epoch": 179} {"train_loss": -7.460630893707275, "global_step": 30234, "epoch": 179} {"train_loss": -7.396322250366211, "global_step": 30235, "epoch": 179} {"train_loss": -7.4738616943359375, "global_step": 30236, "epoch": 179} {"train_loss": -7.1469879150390625, "global_step": 30237, "epoch": 179} {"train_loss": -7.3394622802734375, "global_step": 30238, "epoch": 179} {"train_loss": -7.456700254054296, "global_step": 30239, "epoch": 179, "val_loss": 190330.953125} {"train_loss": -7.293188095092773, "global_step": 30240, "epoch": 180} {"train_loss": -7.669945240020752, "global_step": 30241, "epoch": 180} {"train_loss": -7.368810653686523, "global_step": 30242, "epoch": 180} {"train_loss": -7.530359268188477, "global_step": 30243, "epoch": 180} {"train_loss": -7.32561731338501, "global_step": 30244, "epoch": 180} {"train_loss": -7.232232093811035, "global_step": 30245, "epoch": 180} {"train_loss": -7.499683856964111, "global_step": 30246, "epoch": 180} {"train_loss": -7.386863708496094, "global_step": 30247, "epoch": 180} {"train_loss": -7.470035552978516, "global_step": 30248, "epoch": 180} {"train_loss": -7.291146755218506, "global_step": 30249, "epoch": 180} {"train_loss": -7.425576686859131, "global_step": 30250, "epoch": 180} {"train_loss": -7.459208011627197, "global_step": 30251, "epoch": 180} {"train_loss": -7.3826494216918945, "global_step": 30252, "epoch": 180} {"train_loss": -7.448456764221191, "global_step": 30253, "epoch": 180} {"train_loss": -7.446054458618164, "global_step": 30254, "epoch": 180} {"train_loss": -7.5806379318237305, "global_step": 30255, "epoch": 180} {"train_loss": -7.460816383361816, "global_step": 30256, "epoch": 180} {"train_loss": -7.625509262084961, "global_step": 30257, "epoch": 180} {"train_loss": -7.433180332183838, "global_step": 30258, "epoch": 180} {"train_loss": -7.174183368682861, "global_step": 30259, "epoch": 180} {"train_loss": -7.449375629425049, "global_step": 30260, "epoch": 180} {"train_loss": -7.571029186248779, "global_step": 30261, "epoch": 180} {"train_loss": -7.568365097045898, "global_step": 30262, "epoch": 180} {"train_loss": -7.546932220458984, "global_step": 30263, "epoch": 180} {"train_loss": -7.440701484680176, "global_step": 30264, "epoch": 180} {"train_loss": -7.618716239929199, "global_step": 30265, "epoch": 180} {"train_loss": -7.583010673522949, "global_step": 30266, "epoch": 180} {"train_loss": -7.747935771942139, "global_step": 30267, "epoch": 180} {"train_loss": -7.593193054199219, "global_step": 30268, "epoch": 180} {"train_loss": -7.466269016265869, "global_step": 30269, "epoch": 180} {"train_loss": -7.730963230133057, "global_step": 30270, "epoch": 180} {"train_loss": -7.686334133148193, "global_step": 30271, "epoch": 180} {"train_loss": -7.691849231719971, "global_step": 30272, "epoch": 180} {"train_loss": -7.583739757537842, "global_step": 30273, "epoch": 180} {"train_loss": -7.618808746337891, "global_step": 30274, "epoch": 180} {"train_loss": -7.594965934753418, "global_step": 30275, "epoch": 180} {"train_loss": -7.577718257904053, "global_step": 30276, "epoch": 180} {"train_loss": -7.533839225769043, "global_step": 30277, "epoch": 180} {"train_loss": -7.624303817749023, "global_step": 30278, "epoch": 180} {"train_loss": -7.313192844390869, "global_step": 30279, "epoch": 180} {"train_loss": -7.558545112609863, "global_step": 30280, "epoch": 180} {"train_loss": -7.473024368286133, "global_step": 30281, "epoch": 180} {"train_loss": -7.453535079956055, "global_step": 30282, "epoch": 180} {"train_loss": -7.426575660705566, "global_step": 30283, "epoch": 180} {"train_loss": -7.422999382019043, "global_step": 30284, "epoch": 180} {"train_loss": -7.331576347351074, "global_step": 30285, "epoch": 180} {"train_loss": -7.4301252365112305, "global_step": 30286, "epoch": 180} {"train_loss": -7.439214706420898, "global_step": 30287, "epoch": 180} {"train_loss": -7.427346229553223, "global_step": 30288, "epoch": 180} {"train_loss": -7.271207809448242, "global_step": 30289, "epoch": 180} {"train_loss": -7.56981086730957, "global_step": 30290, "epoch": 180} {"train_loss": -7.540401458740234, "global_step": 30291, "epoch": 180} {"train_loss": -7.719512939453125, "global_step": 30292, "epoch": 180} {"train_loss": -7.365663051605225, "global_step": 30293, "epoch": 180} {"train_loss": -7.677003860473633, "global_step": 30294, "epoch": 180} {"train_loss": -7.487517356872559, "global_step": 30295, "epoch": 180} {"train_loss": -7.655874252319336, "global_step": 30296, "epoch": 180} {"train_loss": -7.626945495605469, "global_step": 30297, "epoch": 180} {"train_loss": -7.526140213012695, "global_step": 30298, "epoch": 180} {"train_loss": -7.420645713806152, "global_step": 30299, "epoch": 180} {"train_loss": -7.533754825592041, "global_step": 30300, "epoch": 180} {"train_loss": -7.486552715301514, "global_step": 30301, "epoch": 180} {"train_loss": -7.56798791885376, "global_step": 30302, "epoch": 180} {"train_loss": -7.512452125549316, "global_step": 30303, "epoch": 180} {"train_loss": -7.551398277282715, "global_step": 30304, "epoch": 180} {"train_loss": -7.429502487182617, "global_step": 30305, "epoch": 180} {"train_loss": -7.1135759353637695, "global_step": 30306, "epoch": 180} {"train_loss": -7.44484806060791, "global_step": 30307, "epoch": 180} {"train_loss": -7.290775299072266, "global_step": 30308, "epoch": 180} {"train_loss": -7.334193229675293, "global_step": 30309, "epoch": 180} {"train_loss": -7.455345153808594, "global_step": 30310, "epoch": 180} {"train_loss": -7.456447601318359, "global_step": 30311, "epoch": 180} {"train_loss": -7.3752899169921875, "global_step": 30312, "epoch": 180} {"train_loss": -7.358276844024658, "global_step": 30313, "epoch": 180} {"train_loss": -7.523480415344238, "global_step": 30314, "epoch": 180} {"train_loss": -7.463329315185547, "global_step": 30315, "epoch": 180} {"train_loss": -7.412888526916504, "global_step": 30316, "epoch": 180} {"train_loss": -7.280913352966309, "global_step": 30317, "epoch": 180} {"train_loss": -7.411432266235352, "global_step": 30318, "epoch": 180} {"train_loss": -7.472517967224121, "global_step": 30319, "epoch": 180} {"train_loss": -7.506032943725586, "global_step": 30320, "epoch": 180} {"train_loss": -7.545151710510254, "global_step": 30321, "epoch": 180} {"train_loss": -7.379705429077148, "global_step": 30322, "epoch": 180} {"train_loss": -7.41873836517334, "global_step": 30323, "epoch": 180} {"train_loss": -7.640722274780273, "global_step": 30324, "epoch": 180} {"train_loss": -7.6991400718688965, "global_step": 30325, "epoch": 180} {"train_loss": -7.274270057678223, "global_step": 30326, "epoch": 180} {"train_loss": -7.598130702972412, "global_step": 30327, "epoch": 180} {"train_loss": -7.465100288391113, "global_step": 30328, "epoch": 180} {"train_loss": -7.354657173156738, "global_step": 30329, "epoch": 180} {"train_loss": -7.6288042068481445, "global_step": 30330, "epoch": 180} {"train_loss": -7.4761223793029785, "global_step": 30331, "epoch": 180} {"train_loss": -7.5160322189331055, "global_step": 30332, "epoch": 180} {"train_loss": -7.6914567947387695, "global_step": 30333, "epoch": 180} {"train_loss": -7.569482803344727, "global_step": 30334, "epoch": 180} {"train_loss": -7.449662208557129, "global_step": 30335, "epoch": 180} {"train_loss": -7.455587863922119, "global_step": 30336, "epoch": 180} {"train_loss": -7.4348626136779785, "global_step": 30337, "epoch": 180} {"train_loss": -7.444212436676025, "global_step": 30338, "epoch": 180} {"train_loss": -7.395597457885742, "global_step": 30339, "epoch": 180} {"train_loss": -7.322914123535156, "global_step": 30340, "epoch": 180} {"train_loss": -7.591105937957764, "global_step": 30341, "epoch": 180} {"train_loss": -7.0654296875, "global_step": 30342, "epoch": 180} {"train_loss": -7.3561692237854, "global_step": 30343, "epoch": 180} {"train_loss": -7.311046600341797, "global_step": 30344, "epoch": 180} {"train_loss": -7.225852966308594, "global_step": 30345, "epoch": 180} {"train_loss": -7.331226348876953, "global_step": 30346, "epoch": 180} {"train_loss": -7.391411304473877, "global_step": 30347, "epoch": 180} {"train_loss": -7.553122043609619, "global_step": 30348, "epoch": 180} {"train_loss": -7.505383491516113, "global_step": 30349, "epoch": 180} {"train_loss": -7.389792442321777, "global_step": 30350, "epoch": 180} {"train_loss": -7.684412956237793, "global_step": 30351, "epoch": 180} {"train_loss": -7.670853614807129, "global_step": 30352, "epoch": 180} {"train_loss": -7.429328918457031, "global_step": 30353, "epoch": 180} {"train_loss": -7.6114091873168945, "global_step": 30354, "epoch": 180} {"train_loss": -7.386867046356201, "global_step": 30355, "epoch": 180} {"train_loss": -7.3217363357543945, "global_step": 30356, "epoch": 180} {"train_loss": -7.489105224609375, "global_step": 30357, "epoch": 180} {"train_loss": -7.371316909790039, "global_step": 30358, "epoch": 180} {"train_loss": -7.762902736663818, "global_step": 30359, "epoch": 180} {"train_loss": -7.537630081176758, "global_step": 30360, "epoch": 180} {"train_loss": -7.525816917419434, "global_step": 30361, "epoch": 180} {"train_loss": -7.499228000640869, "global_step": 30362, "epoch": 180} {"train_loss": -7.480717658996582, "global_step": 30363, "epoch": 180} {"train_loss": -7.563825607299805, "global_step": 30364, "epoch": 180} {"train_loss": -7.60581636428833, "global_step": 30365, "epoch": 180} {"train_loss": -7.509190559387207, "global_step": 30366, "epoch": 180} {"train_loss": -7.636892318725586, "global_step": 30367, "epoch": 180} {"train_loss": -7.4061384201049805, "global_step": 30368, "epoch": 180} {"train_loss": -7.6447553634643555, "global_step": 30369, "epoch": 180} {"train_loss": -7.614900588989258, "global_step": 30370, "epoch": 180} {"train_loss": -7.6612138748168945, "global_step": 30371, "epoch": 180} {"train_loss": -7.5746355056762695, "global_step": 30372, "epoch": 180} {"train_loss": -7.102278709411621, "global_step": 30373, "epoch": 180} {"train_loss": -7.559417724609375, "global_step": 30374, "epoch": 180} {"train_loss": -7.407528877258301, "global_step": 30375, "epoch": 180} {"train_loss": -7.549350738525391, "global_step": 30376, "epoch": 180} {"train_loss": -7.320937156677246, "global_step": 30377, "epoch": 180} {"train_loss": -7.700790882110596, "global_step": 30378, "epoch": 180} {"train_loss": -7.50825309753418, "global_step": 30379, "epoch": 180} {"train_loss": -7.611575603485107, "global_step": 30380, "epoch": 180} {"train_loss": -7.509771347045898, "global_step": 30381, "epoch": 180} {"train_loss": -7.637809753417969, "global_step": 30382, "epoch": 180} {"train_loss": -7.340682029724121, "global_step": 30383, "epoch": 180} {"train_loss": -7.513291358947754, "global_step": 30384, "epoch": 180} {"train_loss": -7.258953094482422, "global_step": 30385, "epoch": 180} {"train_loss": -7.583588600158691, "global_step": 30386, "epoch": 180} {"train_loss": -7.537286758422852, "global_step": 30387, "epoch": 180} {"train_loss": -7.547220706939697, "global_step": 30388, "epoch": 180} {"train_loss": -7.439306259155273, "global_step": 30389, "epoch": 180} {"train_loss": -7.551302909851074, "global_step": 30390, "epoch": 180} {"train_loss": -7.409268856048584, "global_step": 30391, "epoch": 180} {"train_loss": -7.425158500671387, "global_step": 30392, "epoch": 180} {"train_loss": -7.56553316116333, "global_step": 30393, "epoch": 180} {"train_loss": -7.33837890625, "global_step": 30394, "epoch": 180} {"train_loss": -7.738101005554199, "global_step": 30395, "epoch": 180} {"train_loss": -7.559701919555664, "global_step": 30396, "epoch": 180} {"train_loss": -7.697466850280762, "global_step": 30397, "epoch": 180} {"train_loss": -7.7363505363464355, "global_step": 30398, "epoch": 180} {"train_loss": -7.632665157318115, "global_step": 30399, "epoch": 180} {"train_loss": -7.655425071716309, "global_step": 30400, "epoch": 180} {"train_loss": -7.340609550476074, "global_step": 30401, "epoch": 180} {"train_loss": -7.842462062835693, "global_step": 30402, "epoch": 180} {"train_loss": -7.647191524505615, "global_step": 30403, "epoch": 180} {"train_loss": -7.730792045593262, "global_step": 30404, "epoch": 180} {"train_loss": -7.771421909332275, "global_step": 30405, "epoch": 180} {"train_loss": -7.581783294677734, "global_step": 30406, "epoch": 180} {"train_loss": -7.495040428070795, "global_step": 30407, "epoch": 180, "val_loss": 188638.671875, "train_action_mse_error": 9.91887092590332} {"train_loss": -7.677008152008057, "global_step": 30408, "epoch": 181} {"train_loss": -7.664821624755859, "global_step": 30409, "epoch": 181} {"train_loss": -7.78226375579834, "global_step": 30410, "epoch": 181} {"train_loss": -7.587505340576172, "global_step": 30411, "epoch": 181} {"train_loss": -7.607732772827148, "global_step": 30412, "epoch": 181} {"train_loss": -7.612161636352539, "global_step": 30413, "epoch": 181} {"train_loss": -7.4825029373168945, "global_step": 30414, "epoch": 181} {"train_loss": -7.519065856933594, "global_step": 30415, "epoch": 181} {"train_loss": -7.480169296264648, "global_step": 30416, "epoch": 181} {"train_loss": -7.454867839813232, "global_step": 30417, "epoch": 181} {"train_loss": -7.43951416015625, "global_step": 30418, "epoch": 181} {"train_loss": -7.389862060546875, "global_step": 30419, "epoch": 181} {"train_loss": -7.412757873535156, "global_step": 30420, "epoch": 181} {"train_loss": -7.528182029724121, "global_step": 30421, "epoch": 181} {"train_loss": -7.508306503295898, "global_step": 30422, "epoch": 181} {"train_loss": -7.683406829833984, "global_step": 30423, "epoch": 181} {"train_loss": -7.352282524108887, "global_step": 30424, "epoch": 181} {"train_loss": -7.399425983428955, "global_step": 30425, "epoch": 181} {"train_loss": -7.298643112182617, "global_step": 30426, "epoch": 181} {"train_loss": -7.580768585205078, "global_step": 30427, "epoch": 181} {"train_loss": -7.315203666687012, "global_step": 30428, "epoch": 181} {"train_loss": -7.554941654205322, "global_step": 30429, "epoch": 181} {"train_loss": -7.355386734008789, "global_step": 30430, "epoch": 181} {"train_loss": -7.640798568725586, "global_step": 30431, "epoch": 181} {"train_loss": -7.383704662322998, "global_step": 30432, "epoch": 181} {"train_loss": -7.4853410720825195, "global_step": 30433, "epoch": 181} {"train_loss": -7.407695770263672, "global_step": 30434, "epoch": 181} {"train_loss": -7.533630847930908, "global_step": 30435, "epoch": 181} {"train_loss": -7.3765974044799805, "global_step": 30436, "epoch": 181} {"train_loss": -7.273406982421875, "global_step": 30437, "epoch": 181} {"train_loss": -7.464735984802246, "global_step": 30438, "epoch": 181} {"train_loss": -7.30405855178833, "global_step": 30439, "epoch": 181} {"train_loss": -7.480094909667969, "global_step": 30440, "epoch": 181} {"train_loss": -7.316570281982422, "global_step": 30441, "epoch": 181} {"train_loss": -7.450039386749268, "global_step": 30442, "epoch": 181} {"train_loss": -7.57540225982666, "global_step": 30443, "epoch": 181} {"train_loss": -7.451899528503418, "global_step": 30444, "epoch": 181} {"train_loss": -7.523990631103516, "global_step": 30445, "epoch": 181} {"train_loss": -7.562982559204102, "global_step": 30446, "epoch": 181} {"train_loss": -7.376219272613525, "global_step": 30447, "epoch": 181} {"train_loss": -7.731576919555664, "global_step": 30448, "epoch": 181} {"train_loss": -7.570296287536621, "global_step": 30449, "epoch": 181} {"train_loss": -7.629149436950684, "global_step": 30450, "epoch": 181} {"train_loss": -7.654506683349609, "global_step": 30451, "epoch": 181} {"train_loss": -7.839642524719238, "global_step": 30452, "epoch": 181} {"train_loss": -7.479345798492432, "global_step": 30453, "epoch": 181} {"train_loss": -7.619424819946289, "global_step": 30454, "epoch": 181} {"train_loss": -7.702014446258545, "global_step": 30455, "epoch": 181} {"train_loss": -7.389549255371094, "global_step": 30456, "epoch": 181} {"train_loss": -7.564317226409912, "global_step": 30457, "epoch": 181} {"train_loss": -7.495318412780762, "global_step": 30458, "epoch": 181} {"train_loss": -7.4341535568237305, "global_step": 30459, "epoch": 181} {"train_loss": -7.658717155456543, "global_step": 30460, "epoch": 181} {"train_loss": -7.503243446350098, "global_step": 30461, "epoch": 181} {"train_loss": -7.37017297744751, "global_step": 30462, "epoch": 181} {"train_loss": -7.333469867706299, "global_step": 30463, "epoch": 181} {"train_loss": -7.414338111877441, "global_step": 30464, "epoch": 181} {"train_loss": -7.689458847045898, "global_step": 30465, "epoch": 181} {"train_loss": -7.392930030822754, "global_step": 30466, "epoch": 181} {"train_loss": -7.445198059082031, "global_step": 30467, "epoch": 181} {"train_loss": -7.751023292541504, "global_step": 30468, "epoch": 181} {"train_loss": -7.590179443359375, "global_step": 30469, "epoch": 181} {"train_loss": -7.329111576080322, "global_step": 30470, "epoch": 181} {"train_loss": -7.668827056884766, "global_step": 30471, "epoch": 181} {"train_loss": -7.1855621337890625, "global_step": 30472, "epoch": 181} {"train_loss": -7.5135650634765625, "global_step": 30473, "epoch": 181} {"train_loss": -7.245782852172852, "global_step": 30474, "epoch": 181} {"train_loss": -7.5520124435424805, "global_step": 30475, "epoch": 181} {"train_loss": -7.328366279602051, "global_step": 30476, "epoch": 181} {"train_loss": -7.505915641784668, "global_step": 30477, "epoch": 181} {"train_loss": -7.722325325012207, "global_step": 30478, "epoch": 181} {"train_loss": -7.586160182952881, "global_step": 30479, "epoch": 181} {"train_loss": -7.54813289642334, "global_step": 30480, "epoch": 181} {"train_loss": -7.386404991149902, "global_step": 30481, "epoch": 181} {"train_loss": -7.541910171508789, "global_step": 30482, "epoch": 181} {"train_loss": -7.430539608001709, "global_step": 30483, "epoch": 181} {"train_loss": -7.426759243011475, "global_step": 30484, "epoch": 181} {"train_loss": -7.497237205505371, "global_step": 30485, "epoch": 181} {"train_loss": -7.687996864318848, "global_step": 30486, "epoch": 181} {"train_loss": -7.364999771118164, "global_step": 30487, "epoch": 181} {"train_loss": -7.528656005859375, "global_step": 30488, "epoch": 181} {"train_loss": -7.687820911407471, "global_step": 30489, "epoch": 181} {"train_loss": -7.578500270843506, "global_step": 30490, "epoch": 181} {"train_loss": -7.351546287536621, "global_step": 30491, "epoch": 181} {"train_loss": -7.438543796539307, "global_step": 30492, "epoch": 181} {"train_loss": -7.463787078857422, "global_step": 30493, "epoch": 181} {"train_loss": -7.435159683227539, "global_step": 30494, "epoch": 181} {"train_loss": -7.58685302734375, "global_step": 30495, "epoch": 181} {"train_loss": -7.459331035614014, "global_step": 30496, "epoch": 181} {"train_loss": -7.6941938400268555, "global_step": 30497, "epoch": 181} {"train_loss": -7.635866165161133, "global_step": 30498, "epoch": 181} {"train_loss": -7.598146438598633, "global_step": 30499, "epoch": 181} {"train_loss": -7.6187238693237305, "global_step": 30500, "epoch": 181} {"train_loss": -7.297788619995117, "global_step": 30501, "epoch": 181} {"train_loss": -7.615638732910156, "global_step": 30502, "epoch": 181} {"train_loss": -7.515706539154053, "global_step": 30503, "epoch": 181} {"train_loss": -7.589259147644043, "global_step": 30504, "epoch": 181} {"train_loss": -7.387602806091309, "global_step": 30505, "epoch": 181} {"train_loss": -7.5658721923828125, "global_step": 30506, "epoch": 181} {"train_loss": -7.7225022315979, "global_step": 30507, "epoch": 181} {"train_loss": -7.507927417755127, "global_step": 30508, "epoch": 181} {"train_loss": -7.334135055541992, "global_step": 30509, "epoch": 181} {"train_loss": -7.625871181488037, "global_step": 30510, "epoch": 181} {"train_loss": -7.795953750610352, "global_step": 30511, "epoch": 181} {"train_loss": -7.554899215698242, "global_step": 30512, "epoch": 181} {"train_loss": -7.701723098754883, "global_step": 30513, "epoch": 181} {"train_loss": -7.471640586853027, "global_step": 30514, "epoch": 181} {"train_loss": -7.138993740081787, "global_step": 30515, "epoch": 181} {"train_loss": -7.5982770919799805, "global_step": 30516, "epoch": 181} {"train_loss": -6.816868305206299, "global_step": 30517, "epoch": 181} {"train_loss": -7.348373889923096, "global_step": 30518, "epoch": 181} {"train_loss": -7.089759826660156, "global_step": 30519, "epoch": 181} {"train_loss": -7.4167351722717285, "global_step": 30520, "epoch": 181} {"train_loss": -7.2011308670043945, "global_step": 30521, "epoch": 181} {"train_loss": -7.21653938293457, "global_step": 30522, "epoch": 181} {"train_loss": -7.427550315856934, "global_step": 30523, "epoch": 181} {"train_loss": -7.3896260261535645, "global_step": 30524, "epoch": 181} {"train_loss": -7.335502624511719, "global_step": 30525, "epoch": 181} {"train_loss": -7.257590293884277, "global_step": 30526, "epoch": 181} {"train_loss": -7.324469566345215, "global_step": 30527, "epoch": 181} {"train_loss": -7.37171745300293, "global_step": 30528, "epoch": 181} {"train_loss": -7.401461601257324, "global_step": 30529, "epoch": 181} {"train_loss": -7.380336761474609, "global_step": 30530, "epoch": 181} {"train_loss": -7.410510063171387, "global_step": 30531, "epoch": 181} {"train_loss": -7.416858673095703, "global_step": 30532, "epoch": 181} {"train_loss": -7.177927017211914, "global_step": 30533, "epoch": 181} {"train_loss": -7.6482157707214355, "global_step": 30534, "epoch": 181} {"train_loss": -7.288934707641602, "global_step": 30535, "epoch": 181} {"train_loss": -7.43858003616333, "global_step": 30536, "epoch": 181} {"train_loss": -7.427446365356445, "global_step": 30537, "epoch": 181} {"train_loss": -7.368945121765137, "global_step": 30538, "epoch": 181} {"train_loss": -7.37032413482666, "global_step": 30539, "epoch": 181} {"train_loss": -7.573492527008057, "global_step": 30540, "epoch": 181} {"train_loss": -7.410294532775879, "global_step": 30541, "epoch": 181} {"train_loss": -7.398685932159424, "global_step": 30542, "epoch": 181} {"train_loss": -7.327698707580566, "global_step": 30543, "epoch": 181} {"train_loss": -7.398211479187012, "global_step": 30544, "epoch": 181} {"train_loss": -7.448673248291016, "global_step": 30545, "epoch": 181} {"train_loss": -7.393381595611572, "global_step": 30546, "epoch": 181} {"train_loss": -7.6710638999938965, "global_step": 30547, "epoch": 181} {"train_loss": -7.407382488250732, "global_step": 30548, "epoch": 181} {"train_loss": -7.631293773651123, "global_step": 30549, "epoch": 181} {"train_loss": -7.5146636962890625, "global_step": 30550, "epoch": 181} {"train_loss": -7.545600891113281, "global_step": 30551, "epoch": 181} {"train_loss": -7.412960529327393, "global_step": 30552, "epoch": 181} {"train_loss": -7.654324531555176, "global_step": 30553, "epoch": 181} {"train_loss": -7.352731227874756, "global_step": 30554, "epoch": 181} {"train_loss": -7.409855842590332, "global_step": 30555, "epoch": 181} {"train_loss": -7.618955612182617, "global_step": 30556, "epoch": 181} {"train_loss": -7.607606887817383, "global_step": 30557, "epoch": 181} {"train_loss": -7.464322566986084, "global_step": 30558, "epoch": 181} {"train_loss": -7.604866981506348, "global_step": 30559, "epoch": 181} {"train_loss": -7.662449836730957, "global_step": 30560, "epoch": 181} {"train_loss": -7.369794845581055, "global_step": 30561, "epoch": 181} {"train_loss": -7.41154670715332, "global_step": 30562, "epoch": 181} {"train_loss": -7.6175031661987305, "global_step": 30563, "epoch": 181} {"train_loss": -7.722818374633789, "global_step": 30564, "epoch": 181} {"train_loss": -7.377012729644775, "global_step": 30565, "epoch": 181} {"train_loss": -7.4325385093688965, "global_step": 30566, "epoch": 181} {"train_loss": -7.462552547454834, "global_step": 30567, "epoch": 181} {"train_loss": -7.5724101066589355, "global_step": 30568, "epoch": 181} {"train_loss": -7.657050132751465, "global_step": 30569, "epoch": 181} {"train_loss": -7.46431827545166, "global_step": 30570, "epoch": 181} {"train_loss": -7.45515775680542, "global_step": 30571, "epoch": 181} {"train_loss": -7.558139324188232, "global_step": 30572, "epoch": 181} {"train_loss": -7.507040023803711, "global_step": 30573, "epoch": 181} {"train_loss": -7.594008445739746, "global_step": 30574, "epoch": 181} {"train_loss": -7.484205183528719, "global_step": 30575, "epoch": 181, "val_loss": 191477.8125} {"train_loss": -7.2548136711120605, "global_step": 30576, "epoch": 182} {"train_loss": -7.34466552734375, "global_step": 30577, "epoch": 182} {"train_loss": -7.529974460601807, "global_step": 30578, "epoch": 182} {"train_loss": -7.375811576843262, "global_step": 30579, "epoch": 182} {"train_loss": -7.475006103515625, "global_step": 30580, "epoch": 182} {"train_loss": -7.177776336669922, "global_step": 30581, "epoch": 182} {"train_loss": -7.541900634765625, "global_step": 30582, "epoch": 182} {"train_loss": -7.32804012298584, "global_step": 30583, "epoch": 182} {"train_loss": -7.5495805740356445, "global_step": 30584, "epoch": 182} {"train_loss": -7.303513526916504, "global_step": 30585, "epoch": 182} {"train_loss": -7.230066299438477, "global_step": 30586, "epoch": 182} {"train_loss": -7.566727638244629, "global_step": 30587, "epoch": 182} {"train_loss": -7.246819496154785, "global_step": 30588, "epoch": 182} {"train_loss": -7.649692535400391, "global_step": 30589, "epoch": 182} {"train_loss": -7.267539978027344, "global_step": 30590, "epoch": 182} {"train_loss": -7.299909591674805, "global_step": 30591, "epoch": 182} {"train_loss": -7.361946105957031, "global_step": 30592, "epoch": 182} {"train_loss": -7.408511638641357, "global_step": 30593, "epoch": 182} {"train_loss": -7.467315673828125, "global_step": 30594, "epoch": 182} {"train_loss": -7.330780982971191, "global_step": 30595, "epoch": 182} {"train_loss": -7.388375282287598, "global_step": 30596, "epoch": 182} {"train_loss": -7.462926864624023, "global_step": 30597, "epoch": 182} {"train_loss": -7.426274299621582, "global_step": 30598, "epoch": 182} {"train_loss": -7.44842529296875, "global_step": 30599, "epoch": 182} {"train_loss": -7.6581926345825195, "global_step": 30600, "epoch": 182} {"train_loss": -7.734510898590088, "global_step": 30601, "epoch": 182} {"train_loss": -7.661847114562988, "global_step": 30602, "epoch": 182} {"train_loss": -7.480507850646973, "global_step": 30603, "epoch": 182} {"train_loss": -7.507580280303955, "global_step": 30604, "epoch": 182} {"train_loss": -7.559388160705566, "global_step": 30605, "epoch": 182} {"train_loss": -7.526944637298584, "global_step": 30606, "epoch": 182} {"train_loss": -7.502588272094727, "global_step": 30607, "epoch": 182} {"train_loss": -7.484798431396484, "global_step": 30608, "epoch": 182} {"train_loss": -7.19838809967041, "global_step": 30609, "epoch": 182} {"train_loss": -7.652371406555176, "global_step": 30610, "epoch": 182} {"train_loss": -7.384550094604492, "global_step": 30611, "epoch": 182} {"train_loss": -7.432330131530762, "global_step": 30612, "epoch": 182} {"train_loss": -7.295392990112305, "global_step": 30613, "epoch": 182} {"train_loss": -7.5428786277771, "global_step": 30614, "epoch": 182} {"train_loss": -7.44944953918457, "global_step": 30615, "epoch": 182} {"train_loss": -7.4098100662231445, "global_step": 30616, "epoch": 182} {"train_loss": -7.615694999694824, "global_step": 30617, "epoch": 182} {"train_loss": -7.43277645111084, "global_step": 30618, "epoch": 182} {"train_loss": -7.55009651184082, "global_step": 30619, "epoch": 182} {"train_loss": -7.719601631164551, "global_step": 30620, "epoch": 182} {"train_loss": -7.414443492889404, "global_step": 30621, "epoch": 182} {"train_loss": -7.789017677307129, "global_step": 30622, "epoch": 182} {"train_loss": -7.348512172698975, "global_step": 30623, "epoch": 182} {"train_loss": -7.553183555603027, "global_step": 30624, "epoch": 182} {"train_loss": -7.393350601196289, "global_step": 30625, "epoch": 182} {"train_loss": -7.762825965881348, "global_step": 30626, "epoch": 182} {"train_loss": -7.531694412231445, "global_step": 30627, "epoch": 182} {"train_loss": -7.601288795471191, "global_step": 30628, "epoch": 182} {"train_loss": -7.57704496383667, "global_step": 30629, "epoch": 182} {"train_loss": -7.607823371887207, "global_step": 30630, "epoch": 182} {"train_loss": -7.601640224456787, "global_step": 30631, "epoch": 182} {"train_loss": -7.551204681396484, "global_step": 30632, "epoch": 182} {"train_loss": -7.337592124938965, "global_step": 30633, "epoch": 182} {"train_loss": -7.457459449768066, "global_step": 30634, "epoch": 182} {"train_loss": -7.5572381019592285, "global_step": 30635, "epoch": 182} {"train_loss": -7.665136814117432, "global_step": 30636, "epoch": 182} {"train_loss": -7.707073211669922, "global_step": 30637, "epoch": 182} {"train_loss": -7.565895080566406, "global_step": 30638, "epoch": 182} {"train_loss": -7.684010028839111, "global_step": 30639, "epoch": 182} {"train_loss": -7.477384567260742, "global_step": 30640, "epoch": 182} {"train_loss": -7.589953422546387, "global_step": 30641, "epoch": 182} {"train_loss": -7.705650806427002, "global_step": 30642, "epoch": 182} {"train_loss": -7.392881393432617, "global_step": 30643, "epoch": 182} {"train_loss": -7.593101978302002, "global_step": 30644, "epoch": 182} {"train_loss": -7.5689377784729, "global_step": 30645, "epoch": 182} {"train_loss": -7.681571006774902, "global_step": 30646, "epoch": 182} {"train_loss": -7.773530006408691, "global_step": 30647, "epoch": 182} {"train_loss": -7.658003807067871, "global_step": 30648, "epoch": 182} {"train_loss": -7.486201286315918, "global_step": 30649, "epoch": 182} {"train_loss": -7.692049503326416, "global_step": 30650, "epoch": 182} {"train_loss": -7.473819732666016, "global_step": 30651, "epoch": 182} {"train_loss": -7.478877067565918, "global_step": 30652, "epoch": 182} {"train_loss": -7.687787055969238, "global_step": 30653, "epoch": 182} {"train_loss": -7.598814010620117, "global_step": 30654, "epoch": 182} {"train_loss": -7.3957133293151855, "global_step": 30655, "epoch": 182} {"train_loss": -7.706268310546875, "global_step": 30656, "epoch": 182} {"train_loss": -7.504741191864014, "global_step": 30657, "epoch": 182} {"train_loss": -7.291840553283691, "global_step": 30658, "epoch": 182} {"train_loss": -7.372179985046387, "global_step": 30659, "epoch": 182} {"train_loss": -7.433881759643555, "global_step": 30660, "epoch": 182} {"train_loss": -7.428213119506836, "global_step": 30661, "epoch": 182} {"train_loss": -7.397707939147949, "global_step": 30662, "epoch": 182} {"train_loss": -7.268256187438965, "global_step": 30663, "epoch": 182} {"train_loss": -7.497803688049316, "global_step": 30664, "epoch": 182} {"train_loss": -7.39035701751709, "global_step": 30665, "epoch": 182} {"train_loss": -7.521816253662109, "global_step": 30666, "epoch": 182} {"train_loss": -7.393057823181152, "global_step": 30667, "epoch": 182} {"train_loss": -7.377532005310059, "global_step": 30668, "epoch": 182} {"train_loss": -7.515807151794434, "global_step": 30669, "epoch": 182} {"train_loss": -7.436841011047363, "global_step": 30670, "epoch": 182} {"train_loss": -7.466250896453857, "global_step": 30671, "epoch": 182} {"train_loss": -7.72268009185791, "global_step": 30672, "epoch": 182} {"train_loss": -7.651430130004883, "global_step": 30673, "epoch": 182} {"train_loss": -7.557511329650879, "global_step": 30674, "epoch": 182} {"train_loss": -7.471370220184326, "global_step": 30675, "epoch": 182} {"train_loss": -7.526516914367676, "global_step": 30676, "epoch": 182} {"train_loss": -7.503523826599121, "global_step": 30677, "epoch": 182} {"train_loss": -7.394414901733398, "global_step": 30678, "epoch": 182} {"train_loss": -7.507512092590332, "global_step": 30679, "epoch": 182} {"train_loss": -7.567827224731445, "global_step": 30680, "epoch": 182} {"train_loss": -7.634915351867676, "global_step": 30681, "epoch": 182} {"train_loss": -7.415769577026367, "global_step": 30682, "epoch": 182} {"train_loss": -7.492768287658691, "global_step": 30683, "epoch": 182} {"train_loss": -7.661759376525879, "global_step": 30684, "epoch": 182} {"train_loss": -7.571897029876709, "global_step": 30685, "epoch": 182} {"train_loss": -7.563647747039795, "global_step": 30686, "epoch": 182} {"train_loss": -7.597672462463379, "global_step": 30687, "epoch": 182} {"train_loss": -7.468952655792236, "global_step": 30688, "epoch": 182} {"train_loss": -7.691634178161621, "global_step": 30689, "epoch": 182} {"train_loss": -7.438612937927246, "global_step": 30690, "epoch": 182} {"train_loss": -7.557421684265137, "global_step": 30691, "epoch": 182} {"train_loss": -7.489085674285889, "global_step": 30692, "epoch": 182} {"train_loss": -7.459312438964844, "global_step": 30693, "epoch": 182} {"train_loss": -7.313259124755859, "global_step": 30694, "epoch": 182} {"train_loss": -7.45738410949707, "global_step": 30695, "epoch": 182} {"train_loss": -7.503958702087402, "global_step": 30696, "epoch": 182} {"train_loss": -7.446749210357666, "global_step": 30697, "epoch": 182} {"train_loss": -7.3133649826049805, "global_step": 30698, "epoch": 182} {"train_loss": -7.047579765319824, "global_step": 30699, "epoch": 182} {"train_loss": -7.525406837463379, "global_step": 30700, "epoch": 182} {"train_loss": -7.2671966552734375, "global_step": 30701, "epoch": 182} {"train_loss": -7.713127613067627, "global_step": 30702, "epoch": 182} {"train_loss": -7.496122360229492, "global_step": 30703, "epoch": 182} {"train_loss": -7.36301326751709, "global_step": 30704, "epoch": 182} {"train_loss": -7.44715690612793, "global_step": 30705, "epoch": 182} {"train_loss": -7.422032356262207, "global_step": 30706, "epoch": 182} {"train_loss": -7.734990119934082, "global_step": 30707, "epoch": 182} {"train_loss": -7.452484607696533, "global_step": 30708, "epoch": 182} {"train_loss": -7.540654182434082, "global_step": 30709, "epoch": 182} {"train_loss": -7.611960411071777, "global_step": 30710, "epoch": 182} {"train_loss": -7.618312835693359, "global_step": 30711, "epoch": 182} {"train_loss": -7.580790042877197, "global_step": 30712, "epoch": 182} {"train_loss": -7.438023567199707, "global_step": 30713, "epoch": 182} {"train_loss": -7.513714790344238, "global_step": 30714, "epoch": 182} {"train_loss": -7.635550022125244, "global_step": 30715, "epoch": 182} {"train_loss": -7.41843843460083, "global_step": 30716, "epoch": 182} {"train_loss": -7.338265895843506, "global_step": 30717, "epoch": 182} {"train_loss": -7.521760940551758, "global_step": 30718, "epoch": 182} {"train_loss": -7.621220588684082, "global_step": 30719, "epoch": 182} {"train_loss": -7.688043594360352, "global_step": 30720, "epoch": 182} {"train_loss": -7.664409160614014, "global_step": 30721, "epoch": 182} {"train_loss": -7.381336688995361, "global_step": 30722, "epoch": 182} {"train_loss": -7.507958889007568, "global_step": 30723, "epoch": 182} {"train_loss": -7.347484111785889, "global_step": 30724, "epoch": 182} {"train_loss": -7.51597785949707, "global_step": 30725, "epoch": 182} {"train_loss": -7.453910827636719, "global_step": 30726, "epoch": 182} {"train_loss": -7.508200168609619, "global_step": 30727, "epoch": 182} {"train_loss": -7.590437889099121, "global_step": 30728, "epoch": 182} {"train_loss": -7.6496686935424805, "global_step": 30729, "epoch": 182} {"train_loss": -7.411674976348877, "global_step": 30730, "epoch": 182} {"train_loss": -7.711724281311035, "global_step": 30731, "epoch": 182} {"train_loss": -7.478560447692871, "global_step": 30732, "epoch": 182} {"train_loss": -7.53842830657959, "global_step": 30733, "epoch": 182} {"train_loss": -7.597829818725586, "global_step": 30734, "epoch": 182} {"train_loss": -7.500958442687988, "global_step": 30735, "epoch": 182} {"train_loss": -7.551907539367676, "global_step": 30736, "epoch": 182} {"train_loss": -7.512402534484863, "global_step": 30737, "epoch": 182} {"train_loss": -7.339361190795898, "global_step": 30738, "epoch": 182} {"train_loss": -7.558758735656738, "global_step": 30739, "epoch": 182} {"train_loss": -7.41827917098999, "global_step": 30740, "epoch": 182} {"train_loss": -7.324544906616211, "global_step": 30741, "epoch": 182} {"train_loss": -7.451504707336426, "global_step": 30742, "epoch": 182} {"train_loss": -7.49990055106935, "global_step": 30743, "epoch": 182, "val_loss": 190254.234375} {"train_loss": -6.990877151489258, "global_step": 30744, "epoch": 183} {"train_loss": -7.430051326751709, "global_step": 30745, "epoch": 183} {"train_loss": -7.282619476318359, "global_step": 30746, "epoch": 183} {"train_loss": -7.376899242401123, "global_step": 30747, "epoch": 183} {"train_loss": -7.193136692047119, "global_step": 30748, "epoch": 183} {"train_loss": -7.141801834106445, "global_step": 30749, "epoch": 183} {"train_loss": -7.325878143310547, "global_step": 30750, "epoch": 183} {"train_loss": -6.873147487640381, "global_step": 30751, "epoch": 183} {"train_loss": -7.2239532470703125, "global_step": 30752, "epoch": 183} {"train_loss": -7.299264907836914, "global_step": 30753, "epoch": 183} {"train_loss": -7.431155204772949, "global_step": 30754, "epoch": 183} {"train_loss": -7.097045421600342, "global_step": 30755, "epoch": 183} {"train_loss": -7.088163375854492, "global_step": 30756, "epoch": 183} {"train_loss": -7.391755104064941, "global_step": 30757, "epoch": 183} {"train_loss": -7.294541358947754, "global_step": 30758, "epoch": 183} {"train_loss": -7.289148330688477, "global_step": 30759, "epoch": 183} {"train_loss": -7.343493938446045, "global_step": 30760, "epoch": 183} {"train_loss": -7.390330791473389, "global_step": 30761, "epoch": 183} {"train_loss": -7.478277683258057, "global_step": 30762, "epoch": 183} {"train_loss": -7.301081657409668, "global_step": 30763, "epoch": 183} {"train_loss": -7.388635635375977, "global_step": 30764, "epoch": 183} {"train_loss": -7.1800994873046875, "global_step": 30765, "epoch": 183} {"train_loss": -7.460681915283203, "global_step": 30766, "epoch": 183} {"train_loss": -7.249669075012207, "global_step": 30767, "epoch": 183} {"train_loss": -7.388434410095215, "global_step": 30768, "epoch": 183} {"train_loss": -7.345759391784668, "global_step": 30769, "epoch": 183} {"train_loss": -7.385658264160156, "global_step": 30770, "epoch": 183} {"train_loss": -7.452813148498535, "global_step": 30771, "epoch": 183} {"train_loss": -7.267674446105957, "global_step": 30772, "epoch": 183} {"train_loss": -7.704828262329102, "global_step": 30773, "epoch": 183} {"train_loss": -7.1678786277771, "global_step": 30774, "epoch": 183} {"train_loss": -7.515762805938721, "global_step": 30775, "epoch": 183} {"train_loss": -7.549676895141602, "global_step": 30776, "epoch": 183} {"train_loss": -7.798099040985107, "global_step": 30777, "epoch": 183} {"train_loss": -7.368287086486816, "global_step": 30778, "epoch": 183} {"train_loss": -7.656646728515625, "global_step": 30779, "epoch": 183} {"train_loss": -7.356393814086914, "global_step": 30780, "epoch": 183} {"train_loss": -7.228816032409668, "global_step": 30781, "epoch": 183} {"train_loss": -7.4137163162231445, "global_step": 30782, "epoch": 183} {"train_loss": -7.5058274269104, "global_step": 30783, "epoch": 183} {"train_loss": -7.440224647521973, "global_step": 30784, "epoch": 183} {"train_loss": -7.525806427001953, "global_step": 30785, "epoch": 183} {"train_loss": -7.556611061096191, "global_step": 30786, "epoch": 183} {"train_loss": -7.479680061340332, "global_step": 30787, "epoch": 183} {"train_loss": -7.62010383605957, "global_step": 30788, "epoch": 183} {"train_loss": -7.505364418029785, "global_step": 30789, "epoch": 183} {"train_loss": -7.748693943023682, "global_step": 30790, "epoch": 183} {"train_loss": -7.577212333679199, "global_step": 30791, "epoch": 183} {"train_loss": -7.712812423706055, "global_step": 30792, "epoch": 183} {"train_loss": -7.59591817855835, "global_step": 30793, "epoch": 183} {"train_loss": -7.491852760314941, "global_step": 30794, "epoch": 183} {"train_loss": -7.6886749267578125, "global_step": 30795, "epoch": 183} {"train_loss": -7.620269775390625, "global_step": 30796, "epoch": 183} {"train_loss": -7.5949225425720215, "global_step": 30797, "epoch": 183} {"train_loss": -7.5769805908203125, "global_step": 30798, "epoch": 183} {"train_loss": -7.626483917236328, "global_step": 30799, "epoch": 183} {"train_loss": -7.7618727684021, "global_step": 30800, "epoch": 183} {"train_loss": -7.401975154876709, "global_step": 30801, "epoch": 183} {"train_loss": -7.381945610046387, "global_step": 30802, "epoch": 183} {"train_loss": -7.602110385894775, "global_step": 30803, "epoch": 183} {"train_loss": -7.555615425109863, "global_step": 30804, "epoch": 183} {"train_loss": -7.677920341491699, "global_step": 30805, "epoch": 183} {"train_loss": -7.509289741516113, "global_step": 30806, "epoch": 183} {"train_loss": -7.582026481628418, "global_step": 30807, "epoch": 183} {"train_loss": -7.491631507873535, "global_step": 30808, "epoch": 183} {"train_loss": -7.615553855895996, "global_step": 30809, "epoch": 183} {"train_loss": -7.393217086791992, "global_step": 30810, "epoch": 183} {"train_loss": -7.724335193634033, "global_step": 30811, "epoch": 183} {"train_loss": -7.303703784942627, "global_step": 30812, "epoch": 183} {"train_loss": -7.388214111328125, "global_step": 30813, "epoch": 183} {"train_loss": -7.4065141677856445, "global_step": 30814, "epoch": 183} {"train_loss": -7.566169261932373, "global_step": 30815, "epoch": 183} {"train_loss": -7.528790473937988, "global_step": 30816, "epoch": 183} {"train_loss": -7.576935768127441, "global_step": 30817, "epoch": 183} {"train_loss": -7.543583869934082, "global_step": 30818, "epoch": 183} {"train_loss": -7.614048004150391, "global_step": 30819, "epoch": 183} {"train_loss": -7.701272487640381, "global_step": 30820, "epoch": 183} {"train_loss": -7.429486274719238, "global_step": 30821, "epoch": 183} {"train_loss": -7.370241641998291, "global_step": 30822, "epoch": 183} {"train_loss": -7.380988597869873, "global_step": 30823, "epoch": 183} {"train_loss": -7.432371139526367, "global_step": 30824, "epoch": 183} {"train_loss": -7.57635498046875, "global_step": 30825, "epoch": 183} {"train_loss": -7.670344352722168, "global_step": 30826, "epoch": 183} {"train_loss": -7.590341091156006, "global_step": 30827, "epoch": 183} {"train_loss": -7.262243270874023, "global_step": 30828, "epoch": 183} {"train_loss": -7.599100112915039, "global_step": 30829, "epoch": 183} {"train_loss": -7.636680603027344, "global_step": 30830, "epoch": 183} {"train_loss": -7.64333963394165, "global_step": 30831, "epoch": 183} {"train_loss": -7.495369911193848, "global_step": 30832, "epoch": 183} {"train_loss": -7.493906497955322, "global_step": 30833, "epoch": 183} {"train_loss": -7.3345136642456055, "global_step": 30834, "epoch": 183} {"train_loss": -7.443194389343262, "global_step": 30835, "epoch": 183} {"train_loss": -7.514756202697754, "global_step": 30836, "epoch": 183} {"train_loss": -7.447288990020752, "global_step": 30837, "epoch": 183} {"train_loss": -7.315019130706787, "global_step": 30838, "epoch": 183} {"train_loss": -7.350075721740723, "global_step": 30839, "epoch": 183} {"train_loss": -7.639118671417236, "global_step": 30840, "epoch": 183} {"train_loss": -7.303159236907959, "global_step": 30841, "epoch": 183} {"train_loss": -7.376727104187012, "global_step": 30842, "epoch": 183} {"train_loss": -7.468584060668945, "global_step": 30843, "epoch": 183} {"train_loss": -7.327369689941406, "global_step": 30844, "epoch": 183} {"train_loss": -7.473056793212891, "global_step": 30845, "epoch": 183} {"train_loss": -7.45546817779541, "global_step": 30846, "epoch": 183} {"train_loss": -7.564141750335693, "global_step": 30847, "epoch": 183} {"train_loss": -7.491293430328369, "global_step": 30848, "epoch": 183} {"train_loss": -7.30364990234375, "global_step": 30849, "epoch": 183} {"train_loss": -7.393539905548096, "global_step": 30850, "epoch": 183} {"train_loss": -7.551312446594238, "global_step": 30851, "epoch": 183} {"train_loss": -7.452301502227783, "global_step": 30852, "epoch": 183} {"train_loss": -7.2657880783081055, "global_step": 30853, "epoch": 183} {"train_loss": -7.283857345581055, "global_step": 30854, "epoch": 183} {"train_loss": -7.465489387512207, "global_step": 30855, "epoch": 183} {"train_loss": -7.620168209075928, "global_step": 30856, "epoch": 183} {"train_loss": -7.251985549926758, "global_step": 30857, "epoch": 183} {"train_loss": -7.459956645965576, "global_step": 30858, "epoch": 183} {"train_loss": -7.39776611328125, "global_step": 30859, "epoch": 183} {"train_loss": -7.581093788146973, "global_step": 30860, "epoch": 183} {"train_loss": -7.422030448913574, "global_step": 30861, "epoch": 183} {"train_loss": -7.413289546966553, "global_step": 30862, "epoch": 183} {"train_loss": -7.5664753913879395, "global_step": 30863, "epoch": 183} {"train_loss": -7.561610221862793, "global_step": 30864, "epoch": 183} {"train_loss": -7.3479228019714355, "global_step": 30865, "epoch": 183} {"train_loss": -7.483632564544678, "global_step": 30866, "epoch": 183} {"train_loss": -7.527096748352051, "global_step": 30867, "epoch": 183} {"train_loss": -7.61473274230957, "global_step": 30868, "epoch": 183} {"train_loss": -7.648723602294922, "global_step": 30869, "epoch": 183} {"train_loss": -7.6261887550354, "global_step": 30870, "epoch": 183} {"train_loss": -7.529504776000977, "global_step": 30871, "epoch": 183} {"train_loss": -7.664126396179199, "global_step": 30872, "epoch": 183} {"train_loss": -7.503594398498535, "global_step": 30873, "epoch": 183} {"train_loss": -7.666555881500244, "global_step": 30874, "epoch": 183} {"train_loss": -7.436555862426758, "global_step": 30875, "epoch": 183} {"train_loss": -7.555245876312256, "global_step": 30876, "epoch": 183} {"train_loss": -7.478618621826172, "global_step": 30877, "epoch": 183} {"train_loss": -7.663910865783691, "global_step": 30878, "epoch": 183} {"train_loss": -7.586357116699219, "global_step": 30879, "epoch": 183} {"train_loss": -7.329334259033203, "global_step": 30880, "epoch": 183} {"train_loss": -7.464532852172852, "global_step": 30881, "epoch": 183} {"train_loss": -7.537189960479736, "global_step": 30882, "epoch": 183} {"train_loss": -7.495865345001221, "global_step": 30883, "epoch": 183} {"train_loss": -7.413088798522949, "global_step": 30884, "epoch": 183} {"train_loss": -7.793346405029297, "global_step": 30885, "epoch": 183} {"train_loss": -7.356212615966797, "global_step": 30886, "epoch": 183} {"train_loss": -7.448594093322754, "global_step": 30887, "epoch": 183} {"train_loss": -7.593111038208008, "global_step": 30888, "epoch": 183} {"train_loss": -7.386757850646973, "global_step": 30889, "epoch": 183} {"train_loss": -7.384324073791504, "global_step": 30890, "epoch": 183} {"train_loss": -7.560305595397949, "global_step": 30891, "epoch": 183} {"train_loss": -7.31348991394043, "global_step": 30892, "epoch": 183} {"train_loss": -7.681335926055908, "global_step": 30893, "epoch": 183} {"train_loss": -7.431668758392334, "global_step": 30894, "epoch": 183} {"train_loss": -7.560551166534424, "global_step": 30895, "epoch": 183} {"train_loss": -7.475155830383301, "global_step": 30896, "epoch": 183} {"train_loss": -7.62445592880249, "global_step": 30897, "epoch": 183} {"train_loss": -7.436943531036377, "global_step": 30898, "epoch": 183} {"train_loss": -7.423623561859131, "global_step": 30899, "epoch": 183} {"train_loss": -7.422807216644287, "global_step": 30900, "epoch": 183} {"train_loss": -7.234879970550537, "global_step": 30901, "epoch": 183} {"train_loss": -7.432379722595215, "global_step": 30902, "epoch": 183} {"train_loss": -7.35392951965332, "global_step": 30903, "epoch": 183} {"train_loss": -7.618499279022217, "global_step": 30904, "epoch": 183} {"train_loss": -7.260838031768799, "global_step": 30905, "epoch": 183} {"train_loss": -7.423445701599121, "global_step": 30906, "epoch": 183} {"train_loss": -7.338921546936035, "global_step": 30907, "epoch": 183} {"train_loss": -7.2873334884643555, "global_step": 30908, "epoch": 183} {"train_loss": -7.359813690185547, "global_step": 30909, "epoch": 183} {"train_loss": -7.611800193786621, "global_step": 30910, "epoch": 183} {"train_loss": -7.460248643443698, "global_step": 30911, "epoch": 183, "val_loss": 189355.171875} {"train_loss": -7.393685340881348, "global_step": 30912, "epoch": 184} {"train_loss": -7.6434550285339355, "global_step": 30913, "epoch": 184} {"train_loss": -7.314903259277344, "global_step": 30914, "epoch": 184} {"train_loss": -7.597604274749756, "global_step": 30915, "epoch": 184} {"train_loss": -7.415712356567383, "global_step": 30916, "epoch": 184} {"train_loss": -7.681343078613281, "global_step": 30917, "epoch": 184} {"train_loss": -7.2358503341674805, "global_step": 30918, "epoch": 184} {"train_loss": -7.346061706542969, "global_step": 30919, "epoch": 184} {"train_loss": -7.414253234863281, "global_step": 30920, "epoch": 184} {"train_loss": -7.289846420288086, "global_step": 30921, "epoch": 184} {"train_loss": -7.721386909484863, "global_step": 30922, "epoch": 184} {"train_loss": -7.574061393737793, "global_step": 30923, "epoch": 184} {"train_loss": -7.419381141662598, "global_step": 30924, "epoch": 184} {"train_loss": -7.6173529624938965, "global_step": 30925, "epoch": 184} {"train_loss": -7.445058345794678, "global_step": 30926, "epoch": 184} {"train_loss": -7.5814337730407715, "global_step": 30927, "epoch": 184} {"train_loss": -7.65709114074707, "global_step": 30928, "epoch": 184} {"train_loss": -7.393081188201904, "global_step": 30929, "epoch": 184} {"train_loss": -7.595223426818848, "global_step": 30930, "epoch": 184} {"train_loss": -7.600893497467041, "global_step": 30931, "epoch": 184} {"train_loss": -7.614038467407227, "global_step": 30932, "epoch": 184} {"train_loss": -7.714900016784668, "global_step": 30933, "epoch": 184} {"train_loss": -7.542919158935547, "global_step": 30934, "epoch": 184} {"train_loss": -7.610024929046631, "global_step": 30935, "epoch": 184} {"train_loss": -7.399582862854004, "global_step": 30936, "epoch": 184} {"train_loss": -7.483484268188477, "global_step": 30937, "epoch": 184} {"train_loss": -7.254173278808594, "global_step": 30938, "epoch": 184} {"train_loss": -7.367300033569336, "global_step": 30939, "epoch": 184} {"train_loss": -7.611194133758545, "global_step": 30940, "epoch": 184} {"train_loss": -7.495568752288818, "global_step": 30941, "epoch": 184} {"train_loss": -7.674790382385254, "global_step": 30942, "epoch": 184} {"train_loss": -7.5514726638793945, "global_step": 30943, "epoch": 184} {"train_loss": -7.543709754943848, "global_step": 30944, "epoch": 184} {"train_loss": -7.76230001449585, "global_step": 30945, "epoch": 184} {"train_loss": -7.401089668273926, "global_step": 30946, "epoch": 184} {"train_loss": -7.476629257202148, "global_step": 30947, "epoch": 184} {"train_loss": -7.709404468536377, "global_step": 30948, "epoch": 184} {"train_loss": -7.702212810516357, "global_step": 30949, "epoch": 184} {"train_loss": -7.350840091705322, "global_step": 30950, "epoch": 184} {"train_loss": -7.485245704650879, "global_step": 30951, "epoch": 184} {"train_loss": -7.553165435791016, "global_step": 30952, "epoch": 184} {"train_loss": -7.707710266113281, "global_step": 30953, "epoch": 184} {"train_loss": -7.537275314331055, "global_step": 30954, "epoch": 184} {"train_loss": -7.318096160888672, "global_step": 30955, "epoch": 184} {"train_loss": -7.55569314956665, "global_step": 30956, "epoch": 184} {"train_loss": -7.478050231933594, "global_step": 30957, "epoch": 184} {"train_loss": -7.368399620056152, "global_step": 30958, "epoch": 184} {"train_loss": -7.539423942565918, "global_step": 30959, "epoch": 184} {"train_loss": -7.360496997833252, "global_step": 30960, "epoch": 184} {"train_loss": -7.645949363708496, "global_step": 30961, "epoch": 184} {"train_loss": -7.340202808380127, "global_step": 30962, "epoch": 184} {"train_loss": -7.496190071105957, "global_step": 30963, "epoch": 184} {"train_loss": -7.547426223754883, "global_step": 30964, "epoch": 184} {"train_loss": -7.24008846282959, "global_step": 30965, "epoch": 184} {"train_loss": -7.485339164733887, "global_step": 30966, "epoch": 184} {"train_loss": -7.534301280975342, "global_step": 30967, "epoch": 184} {"train_loss": -7.220851898193359, "global_step": 30968, "epoch": 184} {"train_loss": -7.608607292175293, "global_step": 30969, "epoch": 184} {"train_loss": -7.374515533447266, "global_step": 30970, "epoch": 184} {"train_loss": -7.507987022399902, "global_step": 30971, "epoch": 184} {"train_loss": -7.506330490112305, "global_step": 30972, "epoch": 184} {"train_loss": -7.651069164276123, "global_step": 30973, "epoch": 184} {"train_loss": -7.584493637084961, "global_step": 30974, "epoch": 184} {"train_loss": -7.717368125915527, "global_step": 30975, "epoch": 184} {"train_loss": -7.388116836547852, "global_step": 30976, "epoch": 184} {"train_loss": -7.439964294433594, "global_step": 30977, "epoch": 184} {"train_loss": -7.346099376678467, "global_step": 30978, "epoch": 184} {"train_loss": -7.419342517852783, "global_step": 30979, "epoch": 184} {"train_loss": -7.433128833770752, "global_step": 30980, "epoch": 184} {"train_loss": -7.436835289001465, "global_step": 30981, "epoch": 184} {"train_loss": -7.370970249176025, "global_step": 30982, "epoch": 184} {"train_loss": -7.242889404296875, "global_step": 30983, "epoch": 184} {"train_loss": -7.37941312789917, "global_step": 30984, "epoch": 184} {"train_loss": -7.545948028564453, "global_step": 30985, "epoch": 184} {"train_loss": -7.399677753448486, "global_step": 30986, "epoch": 184} {"train_loss": -7.385251045227051, "global_step": 30987, "epoch": 184} {"train_loss": -7.620166778564453, "global_step": 30988, "epoch": 184} {"train_loss": -7.619918346405029, "global_step": 30989, "epoch": 184} {"train_loss": -7.429169654846191, "global_step": 30990, "epoch": 184} {"train_loss": -7.400518894195557, "global_step": 30991, "epoch": 184} {"train_loss": -7.440771102905273, "global_step": 30992, "epoch": 184} {"train_loss": -7.492082118988037, "global_step": 30993, "epoch": 184} {"train_loss": -7.372128009796143, "global_step": 30994, "epoch": 184} {"train_loss": -7.270845413208008, "global_step": 30995, "epoch": 184} {"train_loss": -7.40492582321167, "global_step": 30996, "epoch": 184} {"train_loss": -7.286866188049316, "global_step": 30997, "epoch": 184} {"train_loss": -7.479602813720703, "global_step": 30998, "epoch": 184} {"train_loss": -7.280585289001465, "global_step": 30999, "epoch": 184} {"train_loss": -7.403402805328369, "global_step": 31000, "epoch": 184} {"train_loss": -7.628886699676514, "global_step": 31001, "epoch": 184} {"train_loss": -7.284972190856934, "global_step": 31002, "epoch": 184} {"train_loss": -7.567190170288086, "global_step": 31003, "epoch": 184} {"train_loss": -7.211299896240234, "global_step": 31004, "epoch": 184} {"train_loss": -7.68607234954834, "global_step": 31005, "epoch": 184} {"train_loss": -7.519295692443848, "global_step": 31006, "epoch": 184} {"train_loss": -7.579802513122559, "global_step": 31007, "epoch": 184} {"train_loss": -7.5396270751953125, "global_step": 31008, "epoch": 184} {"train_loss": -7.569815158843994, "global_step": 31009, "epoch": 184} {"train_loss": -7.590036392211914, "global_step": 31010, "epoch": 184} {"train_loss": -7.299784183502197, "global_step": 31011, "epoch": 184} {"train_loss": -7.559939861297607, "global_step": 31012, "epoch": 184} {"train_loss": -7.458981990814209, "global_step": 31013, "epoch": 184} {"train_loss": -7.665489673614502, "global_step": 31014, "epoch": 184} {"train_loss": -7.604835510253906, "global_step": 31015, "epoch": 184} {"train_loss": -7.431665897369385, "global_step": 31016, "epoch": 184} {"train_loss": -7.485719680786133, "global_step": 31017, "epoch": 184} {"train_loss": -7.381605625152588, "global_step": 31018, "epoch": 184} {"train_loss": -7.5821852684021, "global_step": 31019, "epoch": 184} {"train_loss": -7.194439888000488, "global_step": 31020, "epoch": 184} {"train_loss": -7.614457607269287, "global_step": 31021, "epoch": 184} {"train_loss": -7.289389610290527, "global_step": 31022, "epoch": 184} {"train_loss": -7.450314998626709, "global_step": 31023, "epoch": 184} {"train_loss": -7.427403450012207, "global_step": 31024, "epoch": 184} {"train_loss": -7.581964015960693, "global_step": 31025, "epoch": 184} {"train_loss": -7.48593807220459, "global_step": 31026, "epoch": 184} {"train_loss": -7.588422775268555, "global_step": 31027, "epoch": 184} {"train_loss": -7.52025842666626, "global_step": 31028, "epoch": 184} {"train_loss": -7.57131290435791, "global_step": 31029, "epoch": 184} {"train_loss": -7.588405132293701, "global_step": 31030, "epoch": 184} {"train_loss": -7.661791801452637, "global_step": 31031, "epoch": 184} {"train_loss": -7.33317756652832, "global_step": 31032, "epoch": 184} {"train_loss": -7.507615566253662, "global_step": 31033, "epoch": 184} {"train_loss": -7.605330467224121, "global_step": 31034, "epoch": 184} {"train_loss": -7.485889434814453, "global_step": 31035, "epoch": 184} {"train_loss": -7.377986907958984, "global_step": 31036, "epoch": 184} {"train_loss": -7.698088645935059, "global_step": 31037, "epoch": 184} {"train_loss": -7.644448280334473, "global_step": 31038, "epoch": 184} {"train_loss": -7.488735198974609, "global_step": 31039, "epoch": 184} {"train_loss": -7.523774147033691, "global_step": 31040, "epoch": 184} {"train_loss": -7.6973981857299805, "global_step": 31041, "epoch": 184} {"train_loss": -7.600500106811523, "global_step": 31042, "epoch": 184} {"train_loss": -7.6060004234313965, "global_step": 31043, "epoch": 184} {"train_loss": -7.438889980316162, "global_step": 31044, "epoch": 184} {"train_loss": -7.698350429534912, "global_step": 31045, "epoch": 184} {"train_loss": -7.4400315284729, "global_step": 31046, "epoch": 184} {"train_loss": -7.627969741821289, "global_step": 31047, "epoch": 184} {"train_loss": -7.649141311645508, "global_step": 31048, "epoch": 184} {"train_loss": -7.594174385070801, "global_step": 31049, "epoch": 184} {"train_loss": -7.570879936218262, "global_step": 31050, "epoch": 184} {"train_loss": -7.550014019012451, "global_step": 31051, "epoch": 184} {"train_loss": -7.336342811584473, "global_step": 31052, "epoch": 184} {"train_loss": -7.34608268737793, "global_step": 31053, "epoch": 184} {"train_loss": -7.409483909606934, "global_step": 31054, "epoch": 184} {"train_loss": -7.3736042976379395, "global_step": 31055, "epoch": 184} {"train_loss": -7.7177581787109375, "global_step": 31056, "epoch": 184} {"train_loss": -7.532732963562012, "global_step": 31057, "epoch": 184} {"train_loss": -7.684365272521973, "global_step": 31058, "epoch": 184} {"train_loss": -7.448645114898682, "global_step": 31059, "epoch": 184} {"train_loss": -7.767649173736572, "global_step": 31060, "epoch": 184} {"train_loss": -7.413565635681152, "global_step": 31061, "epoch": 184} {"train_loss": -7.655447959899902, "global_step": 31062, "epoch": 184} {"train_loss": -7.377187728881836, "global_step": 31063, "epoch": 184} {"train_loss": -7.675365447998047, "global_step": 31064, "epoch": 184} {"train_loss": -7.74190616607666, "global_step": 31065, "epoch": 184} {"train_loss": -7.422730445861816, "global_step": 31066, "epoch": 184} {"train_loss": -7.630580902099609, "global_step": 31067, "epoch": 184} {"train_loss": -7.635376453399658, "global_step": 31068, "epoch": 184} {"train_loss": -7.561676979064941, "global_step": 31069, "epoch": 184} {"train_loss": -7.7689337730407715, "global_step": 31070, "epoch": 184} {"train_loss": -7.521421432495117, "global_step": 31071, "epoch": 184} {"train_loss": -7.461267471313477, "global_step": 31072, "epoch": 184} {"train_loss": -7.473576068878174, "global_step": 31073, "epoch": 184} {"train_loss": -7.272557735443115, "global_step": 31074, "epoch": 184} {"train_loss": -7.549020767211914, "global_step": 31075, "epoch": 184} {"train_loss": -7.37693977355957, "global_step": 31076, "epoch": 184} {"train_loss": -7.402411460876465, "global_step": 31077, "epoch": 184} {"train_loss": -7.384988784790039, "global_step": 31078, "epoch": 184} {"train_loss": -7.500041456449599, "global_step": 31079, "epoch": 184, "val_loss": 188248.953125} {"train_loss": -7.494984149932861, "global_step": 31080, "epoch": 185} {"train_loss": -7.392858982086182, "global_step": 31081, "epoch": 185} {"train_loss": -7.560647010803223, "global_step": 31082, "epoch": 185} {"train_loss": -7.381217956542969, "global_step": 31083, "epoch": 185} {"train_loss": -7.505525588989258, "global_step": 31084, "epoch": 185} {"train_loss": -7.602217674255371, "global_step": 31085, "epoch": 185} {"train_loss": -7.312912940979004, "global_step": 31086, "epoch": 185} {"train_loss": -7.673551082611084, "global_step": 31087, "epoch": 185} {"train_loss": -7.50001335144043, "global_step": 31088, "epoch": 185} {"train_loss": -7.5657958984375, "global_step": 31089, "epoch": 185} {"train_loss": -7.408441543579102, "global_step": 31090, "epoch": 185} {"train_loss": -7.411664009094238, "global_step": 31091, "epoch": 185} {"train_loss": -7.469150543212891, "global_step": 31092, "epoch": 185} {"train_loss": -7.4402875900268555, "global_step": 31093, "epoch": 185} {"train_loss": -7.545303821563721, "global_step": 31094, "epoch": 185} {"train_loss": -7.522745609283447, "global_step": 31095, "epoch": 185} {"train_loss": -7.560189247131348, "global_step": 31096, "epoch": 185} {"train_loss": -7.447165489196777, "global_step": 31097, "epoch": 185} {"train_loss": -7.606636047363281, "global_step": 31098, "epoch": 185} {"train_loss": -7.24948787689209, "global_step": 31099, "epoch": 185} {"train_loss": -7.8258466720581055, "global_step": 31100, "epoch": 185} {"train_loss": -7.346068382263184, "global_step": 31101, "epoch": 185} {"train_loss": -7.510937690734863, "global_step": 31102, "epoch": 185} {"train_loss": -6.952267646789551, "global_step": 31103, "epoch": 185} {"train_loss": -7.643416404724121, "global_step": 31104, "epoch": 185} {"train_loss": -7.522319793701172, "global_step": 31105, "epoch": 185} {"train_loss": -7.65156364440918, "global_step": 31106, "epoch": 185} {"train_loss": -7.398688793182373, "global_step": 31107, "epoch": 185} {"train_loss": -7.712741374969482, "global_step": 31108, "epoch": 185} {"train_loss": -7.717696666717529, "global_step": 31109, "epoch": 185} {"train_loss": -7.473369598388672, "global_step": 31110, "epoch": 185} {"train_loss": -7.639491081237793, "global_step": 31111, "epoch": 185} {"train_loss": -7.425907135009766, "global_step": 31112, "epoch": 185} {"train_loss": -7.247613906860352, "global_step": 31113, "epoch": 185} {"train_loss": -7.792827606201172, "global_step": 31114, "epoch": 185} {"train_loss": -7.548151969909668, "global_step": 31115, "epoch": 185} {"train_loss": -7.640270233154297, "global_step": 31116, "epoch": 185} {"train_loss": -7.376293182373047, "global_step": 31117, "epoch": 185} {"train_loss": -7.230733871459961, "global_step": 31118, "epoch": 185} {"train_loss": -7.450521945953369, "global_step": 31119, "epoch": 185} {"train_loss": -7.497580528259277, "global_step": 31120, "epoch": 185} {"train_loss": -7.37091064453125, "global_step": 31121, "epoch": 185} {"train_loss": -7.510292053222656, "global_step": 31122, "epoch": 185} {"train_loss": -7.424553871154785, "global_step": 31123, "epoch": 185} {"train_loss": -7.515610694885254, "global_step": 31124, "epoch": 185} {"train_loss": -7.52877140045166, "global_step": 31125, "epoch": 185} {"train_loss": -7.7559356689453125, "global_step": 31126, "epoch": 185} {"train_loss": -7.707803249359131, "global_step": 31127, "epoch": 185} {"train_loss": -7.7705864906311035, "global_step": 31128, "epoch": 185} {"train_loss": -7.286661148071289, "global_step": 31129, "epoch": 185} {"train_loss": -7.464320182800293, "global_step": 31130, "epoch": 185} {"train_loss": -7.482572555541992, "global_step": 31131, "epoch": 185} {"train_loss": -7.5831756591796875, "global_step": 31132, "epoch": 185} {"train_loss": -7.7217302322387695, "global_step": 31133, "epoch": 185} {"train_loss": -7.470003604888916, "global_step": 31134, "epoch": 185} {"train_loss": -7.680461406707764, "global_step": 31135, "epoch": 185} {"train_loss": -7.414373397827148, "global_step": 31136, "epoch": 185} {"train_loss": -7.5221710205078125, "global_step": 31137, "epoch": 185} {"train_loss": -7.722655296325684, "global_step": 31138, "epoch": 185} {"train_loss": -7.51075553894043, "global_step": 31139, "epoch": 185} {"train_loss": -7.257952690124512, "global_step": 31140, "epoch": 185} {"train_loss": -7.6831254959106445, "global_step": 31141, "epoch": 185} {"train_loss": -7.480956077575684, "global_step": 31142, "epoch": 185} {"train_loss": -7.603578567504883, "global_step": 31143, "epoch": 185} {"train_loss": -7.678164005279541, "global_step": 31144, "epoch": 185} {"train_loss": -7.782684326171875, "global_step": 31145, "epoch": 185} {"train_loss": -7.574772834777832, "global_step": 31146, "epoch": 185} {"train_loss": -7.625803470611572, "global_step": 31147, "epoch": 185} {"train_loss": -7.471218109130859, "global_step": 31148, "epoch": 185} {"train_loss": -7.6955485343933105, "global_step": 31149, "epoch": 185} {"train_loss": -7.376229286193848, "global_step": 31150, "epoch": 185} {"train_loss": -7.628018379211426, "global_step": 31151, "epoch": 185} {"train_loss": -7.458712100982666, "global_step": 31152, "epoch": 185} {"train_loss": -7.842846393585205, "global_step": 31153, "epoch": 185} {"train_loss": -7.393095970153809, "global_step": 31154, "epoch": 185} {"train_loss": -7.402457237243652, "global_step": 31155, "epoch": 185} {"train_loss": -7.618365287780762, "global_step": 31156, "epoch": 185} {"train_loss": -7.556471824645996, "global_step": 31157, "epoch": 185} {"train_loss": -7.582152843475342, "global_step": 31158, "epoch": 185} {"train_loss": -7.370145320892334, "global_step": 31159, "epoch": 185} {"train_loss": -7.440664768218994, "global_step": 31160, "epoch": 185} {"train_loss": -7.4205827713012695, "global_step": 31161, "epoch": 185} {"train_loss": -7.656862735748291, "global_step": 31162, "epoch": 185} {"train_loss": -7.399275779724121, "global_step": 31163, "epoch": 185} {"train_loss": -7.393980026245117, "global_step": 31164, "epoch": 185} {"train_loss": -7.49029541015625, "global_step": 31165, "epoch": 185} {"train_loss": -7.397202968597412, "global_step": 31166, "epoch": 185} {"train_loss": -7.448281288146973, "global_step": 31167, "epoch": 185} {"train_loss": -7.517927169799805, "global_step": 31168, "epoch": 185} {"train_loss": -7.360287666320801, "global_step": 31169, "epoch": 185} {"train_loss": -7.441884517669678, "global_step": 31170, "epoch": 185} {"train_loss": -7.277820587158203, "global_step": 31171, "epoch": 185} {"train_loss": -7.445345878601074, "global_step": 31172, "epoch": 185} {"train_loss": -7.46429967880249, "global_step": 31173, "epoch": 185} {"train_loss": -7.413043022155762, "global_step": 31174, "epoch": 185} {"train_loss": -7.532444000244141, "global_step": 31175, "epoch": 185} {"train_loss": -7.369184970855713, "global_step": 31176, "epoch": 185} {"train_loss": -7.512481689453125, "global_step": 31177, "epoch": 185} {"train_loss": -7.480254173278809, "global_step": 31178, "epoch": 185} {"train_loss": -7.529770851135254, "global_step": 31179, "epoch": 185} {"train_loss": -7.631216049194336, "global_step": 31180, "epoch": 185} {"train_loss": -7.4931745529174805, "global_step": 31181, "epoch": 185} {"train_loss": -7.559147834777832, "global_step": 31182, "epoch": 185} {"train_loss": -7.674267768859863, "global_step": 31183, "epoch": 185} {"train_loss": -7.641134738922119, "global_step": 31184, "epoch": 185} {"train_loss": -7.471689224243164, "global_step": 31185, "epoch": 185} {"train_loss": -7.6607985496521, "global_step": 31186, "epoch": 185} {"train_loss": -7.368029594421387, "global_step": 31187, "epoch": 185} {"train_loss": -7.44434928894043, "global_step": 31188, "epoch": 185} {"train_loss": -7.567242622375488, "global_step": 31189, "epoch": 185} {"train_loss": -7.423303604125977, "global_step": 31190, "epoch": 185} {"train_loss": -7.463647842407227, "global_step": 31191, "epoch": 185} {"train_loss": -7.571979522705078, "global_step": 31192, "epoch": 185} {"train_loss": -7.5338134765625, "global_step": 31193, "epoch": 185} {"train_loss": -7.513158798217773, "global_step": 31194, "epoch": 185} {"train_loss": -7.54252815246582, "global_step": 31195, "epoch": 185} {"train_loss": -7.462775230407715, "global_step": 31196, "epoch": 185} {"train_loss": -7.60029411315918, "global_step": 31197, "epoch": 185} {"train_loss": -7.340939521789551, "global_step": 31198, "epoch": 185} {"train_loss": -7.608711242675781, "global_step": 31199, "epoch": 185} {"train_loss": -7.606570243835449, "global_step": 31200, "epoch": 185} {"train_loss": -7.656794548034668, "global_step": 31201, "epoch": 185} {"train_loss": -7.499911308288574, "global_step": 31202, "epoch": 185} {"train_loss": -7.671605587005615, "global_step": 31203, "epoch": 185} {"train_loss": -7.649242401123047, "global_step": 31204, "epoch": 185} {"train_loss": -7.542235374450684, "global_step": 31205, "epoch": 185} {"train_loss": -7.559798240661621, "global_step": 31206, "epoch": 185} {"train_loss": -7.570111274719238, "global_step": 31207, "epoch": 185} {"train_loss": -7.480587005615234, "global_step": 31208, "epoch": 185} {"train_loss": -7.448185443878174, "global_step": 31209, "epoch": 185} {"train_loss": -7.4354658126831055, "global_step": 31210, "epoch": 185} {"train_loss": -7.707125186920166, "global_step": 31211, "epoch": 185} {"train_loss": -7.830314636230469, "global_step": 31212, "epoch": 185} {"train_loss": -7.553834915161133, "global_step": 31213, "epoch": 185} {"train_loss": -7.892914772033691, "global_step": 31214, "epoch": 185} {"train_loss": -7.454828262329102, "global_step": 31215, "epoch": 185} {"train_loss": -7.5629119873046875, "global_step": 31216, "epoch": 185} {"train_loss": -7.721327781677246, "global_step": 31217, "epoch": 185} {"train_loss": -7.830107688903809, "global_step": 31218, "epoch": 185} {"train_loss": -7.801892280578613, "global_step": 31219, "epoch": 185} {"train_loss": -7.786630630493164, "global_step": 31220, "epoch": 185} {"train_loss": -7.700211524963379, "global_step": 31221, "epoch": 185} {"train_loss": -7.735000133514404, "global_step": 31222, "epoch": 185} {"train_loss": -7.493760108947754, "global_step": 31223, "epoch": 185} {"train_loss": -7.289487838745117, "global_step": 31224, "epoch": 185} {"train_loss": -7.520190715789795, "global_step": 31225, "epoch": 185} {"train_loss": -7.37473201751709, "global_step": 31226, "epoch": 185} {"train_loss": -7.30291748046875, "global_step": 31227, "epoch": 185} {"train_loss": -7.450238227844238, "global_step": 31228, "epoch": 185} {"train_loss": -7.4033002853393555, "global_step": 31229, "epoch": 185} {"train_loss": -7.432534694671631, "global_step": 31230, "epoch": 185} {"train_loss": -7.371100902557373, "global_step": 31231, "epoch": 185} {"train_loss": -7.356451988220215, "global_step": 31232, "epoch": 185} {"train_loss": -7.385759353637695, "global_step": 31233, "epoch": 185} {"train_loss": -7.529750823974609, "global_step": 31234, "epoch": 185} {"train_loss": -7.584822654724121, "global_step": 31235, "epoch": 185} {"train_loss": -7.485466480255127, "global_step": 31236, "epoch": 185} {"train_loss": -7.41948938369751, "global_step": 31237, "epoch": 185} {"train_loss": -7.574114799499512, "global_step": 31238, "epoch": 185} {"train_loss": -7.575369834899902, "global_step": 31239, "epoch": 185} {"train_loss": -7.647050857543945, "global_step": 31240, "epoch": 185} {"train_loss": -7.463247299194336, "global_step": 31241, "epoch": 185} {"train_loss": -7.618498802185059, "global_step": 31242, "epoch": 185} {"train_loss": -7.4462995529174805, "global_step": 31243, "epoch": 185} {"train_loss": -7.729640483856201, "global_step": 31244, "epoch": 185} {"train_loss": -7.519759178161621, "global_step": 31245, "epoch": 185} {"train_loss": -7.2728776931762695, "global_step": 31246, "epoch": 185} {"train_loss": -7.519867332208724, "global_step": 31247, "epoch": 185, "val_loss": 190050.078125, "train_action_mse_error": 11.468997955322266} {"train_loss": -7.853036880493164, "global_step": 31248, "epoch": 186} {"train_loss": -7.434317111968994, "global_step": 31249, "epoch": 186} {"train_loss": -7.235868453979492, "global_step": 31250, "epoch": 186} {"train_loss": -7.615477561950684, "global_step": 31251, "epoch": 186} {"train_loss": -7.4908952713012695, "global_step": 31252, "epoch": 186} {"train_loss": -7.589713096618652, "global_step": 31253, "epoch": 186} {"train_loss": -7.182821273803711, "global_step": 31254, "epoch": 186} {"train_loss": -7.343494415283203, "global_step": 31255, "epoch": 186} {"train_loss": -7.5450897216796875, "global_step": 31256, "epoch": 186} {"train_loss": -7.44347620010376, "global_step": 31257, "epoch": 186} {"train_loss": -7.66409969329834, "global_step": 31258, "epoch": 186} {"train_loss": -7.320748329162598, "global_step": 31259, "epoch": 186} {"train_loss": -7.651900291442871, "global_step": 31260, "epoch": 186} {"train_loss": -7.344708442687988, "global_step": 31261, "epoch": 186} {"train_loss": -7.483010292053223, "global_step": 31262, "epoch": 186} {"train_loss": -7.498839855194092, "global_step": 31263, "epoch": 186} {"train_loss": -7.1785173416137695, "global_step": 31264, "epoch": 186} {"train_loss": -7.561014175415039, "global_step": 31265, "epoch": 186} {"train_loss": -7.276658535003662, "global_step": 31266, "epoch": 186} {"train_loss": -7.50344705581665, "global_step": 31267, "epoch": 186} {"train_loss": -7.608695030212402, "global_step": 31268, "epoch": 186} {"train_loss": -7.386904716491699, "global_step": 31269, "epoch": 186} {"train_loss": -7.41829252243042, "global_step": 31270, "epoch": 186} {"train_loss": -7.322644233703613, "global_step": 31271, "epoch": 186} {"train_loss": -7.294754505157471, "global_step": 31272, "epoch": 186} {"train_loss": -7.179291248321533, "global_step": 31273, "epoch": 186} {"train_loss": -7.400087356567383, "global_step": 31274, "epoch": 186} {"train_loss": -7.355389595031738, "global_step": 31275, "epoch": 186} {"train_loss": -7.421468734741211, "global_step": 31276, "epoch": 186} {"train_loss": -7.557485103607178, "global_step": 31277, "epoch": 186} {"train_loss": -7.476650714874268, "global_step": 31278, "epoch": 186} {"train_loss": -7.645878314971924, "global_step": 31279, "epoch": 186} {"train_loss": -7.599188804626465, "global_step": 31280, "epoch": 186} {"train_loss": -7.580038070678711, "global_step": 31281, "epoch": 186} {"train_loss": -7.580090522766113, "global_step": 31282, "epoch": 186} {"train_loss": -7.233054161071777, "global_step": 31283, "epoch": 186} {"train_loss": -7.282386302947998, "global_step": 31284, "epoch": 186} {"train_loss": -7.449932098388672, "global_step": 31285, "epoch": 186} {"train_loss": -7.701643943786621, "global_step": 31286, "epoch": 186} {"train_loss": -7.520058631896973, "global_step": 31287, "epoch": 186} {"train_loss": -7.4892401695251465, "global_step": 31288, "epoch": 186} {"train_loss": -7.341817855834961, "global_step": 31289, "epoch": 186} {"train_loss": -7.608033180236816, "global_step": 31290, "epoch": 186} {"train_loss": -7.682759761810303, "global_step": 31291, "epoch": 186} {"train_loss": -7.64985990524292, "global_step": 31292, "epoch": 186} {"train_loss": -7.519045829772949, "global_step": 31293, "epoch": 186} {"train_loss": -7.501796722412109, "global_step": 31294, "epoch": 186} {"train_loss": -7.536745548248291, "global_step": 31295, "epoch": 186} {"train_loss": -7.464922904968262, "global_step": 31296, "epoch": 186} {"train_loss": -7.547661781311035, "global_step": 31297, "epoch": 186} {"train_loss": -7.635923862457275, "global_step": 31298, "epoch": 186} {"train_loss": -7.450891494750977, "global_step": 31299, "epoch": 186} {"train_loss": -7.5070648193359375, "global_step": 31300, "epoch": 186} {"train_loss": -7.701780319213867, "global_step": 31301, "epoch": 186} {"train_loss": -7.333030700683594, "global_step": 31302, "epoch": 186} {"train_loss": -7.490612030029297, "global_step": 31303, "epoch": 186} {"train_loss": -7.486496925354004, "global_step": 31304, "epoch": 186} {"train_loss": -7.367201805114746, "global_step": 31305, "epoch": 186} {"train_loss": -7.631267547607422, "global_step": 31306, "epoch": 186} {"train_loss": -7.508376121520996, "global_step": 31307, "epoch": 186} {"train_loss": -7.385859966278076, "global_step": 31308, "epoch": 186} {"train_loss": -7.378301620483398, "global_step": 31309, "epoch": 186} {"train_loss": -7.488885879516602, "global_step": 31310, "epoch": 186} {"train_loss": -7.430517673492432, "global_step": 31311, "epoch": 186} {"train_loss": -7.580576419830322, "global_step": 31312, "epoch": 186} {"train_loss": -7.639686584472656, "global_step": 31313, "epoch": 186} {"train_loss": -7.629316329956055, "global_step": 31314, "epoch": 186} {"train_loss": -7.531390190124512, "global_step": 31315, "epoch": 186} {"train_loss": -7.622596740722656, "global_step": 31316, "epoch": 186} {"train_loss": -7.391623497009277, "global_step": 31317, "epoch": 186} {"train_loss": -7.517636299133301, "global_step": 31318, "epoch": 186} {"train_loss": -7.575963497161865, "global_step": 31319, "epoch": 186} {"train_loss": -7.733684539794922, "global_step": 31320, "epoch": 186} {"train_loss": -7.555438995361328, "global_step": 31321, "epoch": 186} {"train_loss": -7.363489151000977, "global_step": 31322, "epoch": 186} {"train_loss": -7.56793737411499, "global_step": 31323, "epoch": 186} {"train_loss": -7.616725921630859, "global_step": 31324, "epoch": 186} {"train_loss": -7.439918041229248, "global_step": 31325, "epoch": 186} {"train_loss": -7.685951232910156, "global_step": 31326, "epoch": 186} {"train_loss": -7.758723258972168, "global_step": 31327, "epoch": 186} {"train_loss": -7.511349678039551, "global_step": 31328, "epoch": 186} {"train_loss": -7.4469828605651855, "global_step": 31329, "epoch": 186} {"train_loss": -7.795112133026123, "global_step": 31330, "epoch": 186} {"train_loss": -7.558342456817627, "global_step": 31331, "epoch": 186} {"train_loss": -7.641804218292236, "global_step": 31332, "epoch": 186} {"train_loss": -7.55185604095459, "global_step": 31333, "epoch": 186} {"train_loss": -7.415340423583984, "global_step": 31334, "epoch": 186} {"train_loss": -7.376956462860107, "global_step": 31335, "epoch": 186} {"train_loss": -7.508184909820557, "global_step": 31336, "epoch": 186} {"train_loss": -7.56856107711792, "global_step": 31337, "epoch": 186} {"train_loss": -7.609770774841309, "global_step": 31338, "epoch": 186} {"train_loss": -7.45856237411499, "global_step": 31339, "epoch": 186} {"train_loss": -7.564531326293945, "global_step": 31340, "epoch": 186} {"train_loss": -7.561130523681641, "global_step": 31341, "epoch": 186} {"train_loss": -7.1922149658203125, "global_step": 31342, "epoch": 186} {"train_loss": -7.297774314880371, "global_step": 31343, "epoch": 186} {"train_loss": -7.708400726318359, "global_step": 31344, "epoch": 186} {"train_loss": -7.206543445587158, "global_step": 31345, "epoch": 186} {"train_loss": -7.442215919494629, "global_step": 31346, "epoch": 186} {"train_loss": -7.456556797027588, "global_step": 31347, "epoch": 186} {"train_loss": -7.625622749328613, "global_step": 31348, "epoch": 186} {"train_loss": -7.495164394378662, "global_step": 31349, "epoch": 186} {"train_loss": -7.424598693847656, "global_step": 31350, "epoch": 186} {"train_loss": -7.484714508056641, "global_step": 31351, "epoch": 186} {"train_loss": -7.3643574714660645, "global_step": 31352, "epoch": 186} {"train_loss": -7.651731491088867, "global_step": 31353, "epoch": 186} {"train_loss": -7.521337509155273, "global_step": 31354, "epoch": 186} {"train_loss": -7.648808479309082, "global_step": 31355, "epoch": 186} {"train_loss": -7.685891151428223, "global_step": 31356, "epoch": 186} {"train_loss": -7.437926292419434, "global_step": 31357, "epoch": 186} {"train_loss": -7.606603145599365, "global_step": 31358, "epoch": 186} {"train_loss": -7.624591827392578, "global_step": 31359, "epoch": 186} {"train_loss": -7.705501556396484, "global_step": 31360, "epoch": 186} {"train_loss": -7.718521595001221, "global_step": 31361, "epoch": 186} {"train_loss": -7.669907093048096, "global_step": 31362, "epoch": 186} {"train_loss": -7.548259735107422, "global_step": 31363, "epoch": 186} {"train_loss": -7.663735389709473, "global_step": 31364, "epoch": 186} {"train_loss": -7.614238739013672, "global_step": 31365, "epoch": 186} {"train_loss": -7.537070274353027, "global_step": 31366, "epoch": 186} {"train_loss": -7.768646717071533, "global_step": 31367, "epoch": 186} {"train_loss": -7.758217811584473, "global_step": 31368, "epoch": 186} {"train_loss": -7.59465217590332, "global_step": 31369, "epoch": 186} {"train_loss": -7.521184921264648, "global_step": 31370, "epoch": 186} {"train_loss": -7.571702003479004, "global_step": 31371, "epoch": 186} {"train_loss": -7.542687892913818, "global_step": 31372, "epoch": 186} {"train_loss": -7.117420673370361, "global_step": 31373, "epoch": 186} {"train_loss": -7.36074686050415, "global_step": 31374, "epoch": 186} {"train_loss": -7.361846923828125, "global_step": 31375, "epoch": 186} {"train_loss": -7.606778144836426, "global_step": 31376, "epoch": 186} {"train_loss": -7.643007278442383, "global_step": 31377, "epoch": 186} {"train_loss": -7.413573265075684, "global_step": 31378, "epoch": 186} {"train_loss": -7.729172706604004, "global_step": 31379, "epoch": 186} {"train_loss": -7.419159412384033, "global_step": 31380, "epoch": 186} {"train_loss": -7.5437140464782715, "global_step": 31381, "epoch": 186} {"train_loss": -7.452531337738037, "global_step": 31382, "epoch": 186} {"train_loss": -7.475478172302246, "global_step": 31383, "epoch": 186} {"train_loss": -7.639664649963379, "global_step": 31384, "epoch": 186} {"train_loss": -7.419335842132568, "global_step": 31385, "epoch": 186} {"train_loss": -7.493249893188477, "global_step": 31386, "epoch": 186} {"train_loss": -7.490086555480957, "global_step": 31387, "epoch": 186} {"train_loss": -7.663256645202637, "global_step": 31388, "epoch": 186} {"train_loss": -7.636695384979248, "global_step": 31389, "epoch": 186} {"train_loss": -7.680285453796387, "global_step": 31390, "epoch": 186} {"train_loss": -7.67484188079834, "global_step": 31391, "epoch": 186} {"train_loss": -7.359405517578125, "global_step": 31392, "epoch": 186} {"train_loss": -7.519536018371582, "global_step": 31393, "epoch": 186} {"train_loss": -7.605478763580322, "global_step": 31394, "epoch": 186} {"train_loss": -7.585541725158691, "global_step": 31395, "epoch": 186} {"train_loss": -7.6202898025512695, "global_step": 31396, "epoch": 186} {"train_loss": -7.746157646179199, "global_step": 31397, "epoch": 186} {"train_loss": -7.672955513000488, "global_step": 31398, "epoch": 186} {"train_loss": -7.612910270690918, "global_step": 31399, "epoch": 186} {"train_loss": -7.701234817504883, "global_step": 31400, "epoch": 186} {"train_loss": -7.302048683166504, "global_step": 31401, "epoch": 186} {"train_loss": -7.539112091064453, "global_step": 31402, "epoch": 186} {"train_loss": -7.678549766540527, "global_step": 31403, "epoch": 186} {"train_loss": -7.570124626159668, "global_step": 31404, "epoch": 186} {"train_loss": -7.599813461303711, "global_step": 31405, "epoch": 186} {"train_loss": -7.363157272338867, "global_step": 31406, "epoch": 186} {"train_loss": -7.476979732513428, "global_step": 31407, "epoch": 186} {"train_loss": -7.213532447814941, "global_step": 31408, "epoch": 186} {"train_loss": -7.418723106384277, "global_step": 31409, "epoch": 186} {"train_loss": -7.294985771179199, "global_step": 31410, "epoch": 186} {"train_loss": -7.3816046714782715, "global_step": 31411, "epoch": 186} {"train_loss": -7.426623344421387, "global_step": 31412, "epoch": 186} {"train_loss": -7.409073352813721, "global_step": 31413, "epoch": 186} {"train_loss": -7.542745113372803, "global_step": 31414, "epoch": 186} {"train_loss": -7.512774544102805, "global_step": 31415, "epoch": 186, "val_loss": 189215.390625} {"train_loss": -7.663357257843018, "global_step": 31416, "epoch": 187} {"train_loss": -7.270928382873535, "global_step": 31417, "epoch": 187} {"train_loss": -7.486140727996826, "global_step": 31418, "epoch": 187} {"train_loss": -7.231990337371826, "global_step": 31419, "epoch": 187} {"train_loss": -7.5243024826049805, "global_step": 31420, "epoch": 187} {"train_loss": -7.486231803894043, "global_step": 31421, "epoch": 187} {"train_loss": -7.206589221954346, "global_step": 31422, "epoch": 187} {"train_loss": -7.44933557510376, "global_step": 31423, "epoch": 187} {"train_loss": -7.455621719360352, "global_step": 31424, "epoch": 187} {"train_loss": -7.468105792999268, "global_step": 31425, "epoch": 187} {"train_loss": -7.43400764465332, "global_step": 31426, "epoch": 187} {"train_loss": -7.275950908660889, "global_step": 31427, "epoch": 187} {"train_loss": -7.224371910095215, "global_step": 31428, "epoch": 187} {"train_loss": -7.257857322692871, "global_step": 31429, "epoch": 187} {"train_loss": -7.517759323120117, "global_step": 31430, "epoch": 187} {"train_loss": -7.337228775024414, "global_step": 31431, "epoch": 187} {"train_loss": -7.46671724319458, "global_step": 31432, "epoch": 187} {"train_loss": -7.494350433349609, "global_step": 31433, "epoch": 187} {"train_loss": -7.693982124328613, "global_step": 31434, "epoch": 187} {"train_loss": -7.516406536102295, "global_step": 31435, "epoch": 187} {"train_loss": -7.5225510597229, "global_step": 31436, "epoch": 187} {"train_loss": -7.688990592956543, "global_step": 31437, "epoch": 187} {"train_loss": -7.772162914276123, "global_step": 31438, "epoch": 187} {"train_loss": -7.6937031745910645, "global_step": 31439, "epoch": 187} {"train_loss": -7.724205017089844, "global_step": 31440, "epoch": 187} {"train_loss": -7.5258026123046875, "global_step": 31441, "epoch": 187} {"train_loss": -7.573329925537109, "global_step": 31442, "epoch": 187} {"train_loss": -7.7317891120910645, "global_step": 31443, "epoch": 187} {"train_loss": -7.439244747161865, "global_step": 31444, "epoch": 187} {"train_loss": -7.811970233917236, "global_step": 31445, "epoch": 187} {"train_loss": -7.762938022613525, "global_step": 31446, "epoch": 187} {"train_loss": -7.814003944396973, "global_step": 31447, "epoch": 187} {"train_loss": -7.732007026672363, "global_step": 31448, "epoch": 187} {"train_loss": -7.4921722412109375, "global_step": 31449, "epoch": 187} {"train_loss": -7.531990051269531, "global_step": 31450, "epoch": 187} {"train_loss": -7.4672932624816895, "global_step": 31451, "epoch": 187} {"train_loss": -7.837285995483398, "global_step": 31452, "epoch": 187} {"train_loss": -7.6593451499938965, "global_step": 31453, "epoch": 187} {"train_loss": -7.868720054626465, "global_step": 31454, "epoch": 187} {"train_loss": -7.44840669631958, "global_step": 31455, "epoch": 187} {"train_loss": -7.739903450012207, "global_step": 31456, "epoch": 187} {"train_loss": -7.469008922576904, "global_step": 31457, "epoch": 187} {"train_loss": -7.487321853637695, "global_step": 31458, "epoch": 187} {"train_loss": -7.626276016235352, "global_step": 31459, "epoch": 187} {"train_loss": -7.425177574157715, "global_step": 31460, "epoch": 187} {"train_loss": -7.770810604095459, "global_step": 31461, "epoch": 187} {"train_loss": -7.564775466918945, "global_step": 31462, "epoch": 187} {"train_loss": -7.526821613311768, "global_step": 31463, "epoch": 187} {"train_loss": -7.581354141235352, "global_step": 31464, "epoch": 187} {"train_loss": -7.555023193359375, "global_step": 31465, "epoch": 187} {"train_loss": -7.426548004150391, "global_step": 31466, "epoch": 187} {"train_loss": -7.642514705657959, "global_step": 31467, "epoch": 187} {"train_loss": -7.3425445556640625, "global_step": 31468, "epoch": 187} {"train_loss": -7.693841934204102, "global_step": 31469, "epoch": 187} {"train_loss": -7.367836952209473, "global_step": 31470, "epoch": 187} {"train_loss": -7.598328590393066, "global_step": 31471, "epoch": 187} {"train_loss": -7.512044906616211, "global_step": 31472, "epoch": 187} {"train_loss": -7.705261707305908, "global_step": 31473, "epoch": 187} {"train_loss": -7.728114128112793, "global_step": 31474, "epoch": 187} {"train_loss": -7.513283729553223, "global_step": 31475, "epoch": 187} {"train_loss": -7.620938301086426, "global_step": 31476, "epoch": 187} {"train_loss": -7.2072062492370605, "global_step": 31477, "epoch": 187} {"train_loss": -7.574559211730957, "global_step": 31478, "epoch": 187} {"train_loss": -7.496175765991211, "global_step": 31479, "epoch": 187} {"train_loss": -7.476751327514648, "global_step": 31480, "epoch": 187} {"train_loss": -7.589262008666992, "global_step": 31481, "epoch": 187} {"train_loss": -7.473505973815918, "global_step": 31482, "epoch": 187} {"train_loss": -7.4669508934021, "global_step": 31483, "epoch": 187} {"train_loss": -7.670415878295898, "global_step": 31484, "epoch": 187} {"train_loss": -7.459900379180908, "global_step": 31485, "epoch": 187} {"train_loss": -7.594058513641357, "global_step": 31486, "epoch": 187} {"train_loss": -7.615044593811035, "global_step": 31487, "epoch": 187} {"train_loss": -7.27020263671875, "global_step": 31488, "epoch": 187} {"train_loss": -7.326476097106934, "global_step": 31489, "epoch": 187} {"train_loss": -7.578652858734131, "global_step": 31490, "epoch": 187} {"train_loss": -7.375216484069824, "global_step": 31491, "epoch": 187} {"train_loss": -7.409239768981934, "global_step": 31492, "epoch": 187} {"train_loss": -7.682497024536133, "global_step": 31493, "epoch": 187} {"train_loss": -7.5193376541137695, "global_step": 31494, "epoch": 187} {"train_loss": -7.418896675109863, "global_step": 31495, "epoch": 187} {"train_loss": -7.3253703117370605, "global_step": 31496, "epoch": 187} {"train_loss": -7.370943069458008, "global_step": 31497, "epoch": 187} {"train_loss": -7.661873817443848, "global_step": 31498, "epoch": 187} {"train_loss": -7.517107963562012, "global_step": 31499, "epoch": 187} {"train_loss": -7.351617336273193, "global_step": 31500, "epoch": 187} {"train_loss": -7.235689163208008, "global_step": 31501, "epoch": 187} {"train_loss": -7.553309440612793, "global_step": 31502, "epoch": 187} {"train_loss": -7.063661575317383, "global_step": 31503, "epoch": 187} {"train_loss": -7.463864326477051, "global_step": 31504, "epoch": 187} {"train_loss": -7.326056957244873, "global_step": 31505, "epoch": 187} {"train_loss": -7.39405632019043, "global_step": 31506, "epoch": 187} {"train_loss": -7.357868194580078, "global_step": 31507, "epoch": 187} {"train_loss": -7.3816633224487305, "global_step": 31508, "epoch": 187} {"train_loss": -7.626247406005859, "global_step": 31509, "epoch": 187} {"train_loss": -7.587431907653809, "global_step": 31510, "epoch": 187} {"train_loss": -7.667278289794922, "global_step": 31511, "epoch": 187} {"train_loss": -7.722873210906982, "global_step": 31512, "epoch": 187} {"train_loss": -7.582433700561523, "global_step": 31513, "epoch": 187} {"train_loss": -7.434597492218018, "global_step": 31514, "epoch": 187} {"train_loss": -7.574097633361816, "global_step": 31515, "epoch": 187} {"train_loss": -7.5794219970703125, "global_step": 31516, "epoch": 187} {"train_loss": -7.708660125732422, "global_step": 31517, "epoch": 187} {"train_loss": -7.528395652770996, "global_step": 31518, "epoch": 187} {"train_loss": -7.644725799560547, "global_step": 31519, "epoch": 187} {"train_loss": -7.50497579574585, "global_step": 31520, "epoch": 187} {"train_loss": -7.6561784744262695, "global_step": 31521, "epoch": 187} {"train_loss": -7.714008331298828, "global_step": 31522, "epoch": 187} {"train_loss": -7.3605637550354, "global_step": 31523, "epoch": 187} {"train_loss": -7.668407440185547, "global_step": 31524, "epoch": 187} {"train_loss": -7.327610969543457, "global_step": 31525, "epoch": 187} {"train_loss": -7.758593559265137, "global_step": 31526, "epoch": 187} {"train_loss": -7.432321548461914, "global_step": 31527, "epoch": 187} {"train_loss": -7.520877838134766, "global_step": 31528, "epoch": 187} {"train_loss": -7.461296558380127, "global_step": 31529, "epoch": 187} {"train_loss": -7.528158187866211, "global_step": 31530, "epoch": 187} {"train_loss": -7.833795547485352, "global_step": 31531, "epoch": 187} {"train_loss": -7.158976078033447, "global_step": 31532, "epoch": 187} {"train_loss": -7.424226760864258, "global_step": 31533, "epoch": 187} {"train_loss": -7.186267375946045, "global_step": 31534, "epoch": 187} {"train_loss": -7.165365695953369, "global_step": 31535, "epoch": 187} {"train_loss": -7.555906772613525, "global_step": 31536, "epoch": 187} {"train_loss": -6.968423843383789, "global_step": 31537, "epoch": 187} {"train_loss": -7.553213119506836, "global_step": 31538, "epoch": 187} {"train_loss": -7.291658401489258, "global_step": 31539, "epoch": 187} {"train_loss": -7.101123809814453, "global_step": 31540, "epoch": 187} {"train_loss": -7.494001388549805, "global_step": 31541, "epoch": 187} {"train_loss": -7.088418006896973, "global_step": 31542, "epoch": 187} {"train_loss": -7.110492706298828, "global_step": 31543, "epoch": 187} {"train_loss": -7.608346939086914, "global_step": 31544, "epoch": 187} {"train_loss": -7.260183811187744, "global_step": 31545, "epoch": 187} {"train_loss": -7.469902038574219, "global_step": 31546, "epoch": 187} {"train_loss": -7.498716354370117, "global_step": 31547, "epoch": 187} {"train_loss": -7.199976921081543, "global_step": 31548, "epoch": 187} {"train_loss": -7.35120964050293, "global_step": 31549, "epoch": 187} {"train_loss": -7.5402116775512695, "global_step": 31550, "epoch": 187} {"train_loss": -7.427166938781738, "global_step": 31551, "epoch": 187} {"train_loss": -7.470834732055664, "global_step": 31552, "epoch": 187} {"train_loss": -7.363170146942139, "global_step": 31553, "epoch": 187} {"train_loss": -7.456804275512695, "global_step": 31554, "epoch": 187} {"train_loss": -7.364058971405029, "global_step": 31555, "epoch": 187} {"train_loss": -7.383292198181152, "global_step": 31556, "epoch": 187} {"train_loss": -7.4748430252075195, "global_step": 31557, "epoch": 187} {"train_loss": -7.539393901824951, "global_step": 31558, "epoch": 187} {"train_loss": -7.2908477783203125, "global_step": 31559, "epoch": 187} {"train_loss": -7.453167915344238, "global_step": 31560, "epoch": 187} {"train_loss": -7.463520050048828, "global_step": 31561, "epoch": 187} {"train_loss": -7.434220314025879, "global_step": 31562, "epoch": 187} {"train_loss": -7.429708480834961, "global_step": 31563, "epoch": 187} {"train_loss": -7.316641807556152, "global_step": 31564, "epoch": 187} {"train_loss": -7.514023780822754, "global_step": 31565, "epoch": 187} {"train_loss": -7.488225936889648, "global_step": 31566, "epoch": 187} {"train_loss": -7.612674713134766, "global_step": 31567, "epoch": 187} {"train_loss": -7.490367889404297, "global_step": 31568, "epoch": 187} {"train_loss": -7.783375263214111, "global_step": 31569, "epoch": 187} {"train_loss": -7.415931701660156, "global_step": 31570, "epoch": 187} {"train_loss": -7.724614143371582, "global_step": 31571, "epoch": 187} {"train_loss": -7.767359256744385, "global_step": 31572, "epoch": 187} {"train_loss": -7.540142059326172, "global_step": 31573, "epoch": 187} {"train_loss": -7.672264099121094, "global_step": 31574, "epoch": 187} {"train_loss": -7.524257183074951, "global_step": 31575, "epoch": 187} {"train_loss": -7.766664505004883, "global_step": 31576, "epoch": 187} {"train_loss": -7.655845642089844, "global_step": 31577, "epoch": 187} {"train_loss": -7.777698993682861, "global_step": 31578, "epoch": 187} {"train_loss": -7.564796447753906, "global_step": 31579, "epoch": 187} {"train_loss": -7.574288845062256, "global_step": 31580, "epoch": 187} {"train_loss": -7.609651565551758, "global_step": 31581, "epoch": 187} {"train_loss": -7.814185619354248, "global_step": 31582, "epoch": 187} {"train_loss": -7.50671344711667, "global_step": 31583, "epoch": 187, "val_loss": 187630.109375} {"train_loss": -7.410229682922363, "global_step": 31584, "epoch": 188} {"train_loss": -7.402597427368164, "global_step": 31585, "epoch": 188} {"train_loss": -7.577988147735596, "global_step": 31586, "epoch": 188} {"train_loss": -7.667109489440918, "global_step": 31587, "epoch": 188} {"train_loss": -7.334244251251221, "global_step": 31588, "epoch": 188} {"train_loss": -7.749798774719238, "global_step": 31589, "epoch": 188} {"train_loss": -7.519340991973877, "global_step": 31590, "epoch": 188} {"train_loss": -7.252778053283691, "global_step": 31591, "epoch": 188} {"train_loss": -7.450346946716309, "global_step": 31592, "epoch": 188} {"train_loss": -7.693291664123535, "global_step": 31593, "epoch": 188} {"train_loss": -7.4588494300842285, "global_step": 31594, "epoch": 188} {"train_loss": -7.546355247497559, "global_step": 31595, "epoch": 188} {"train_loss": -7.555418014526367, "global_step": 31596, "epoch": 188} {"train_loss": -7.400030136108398, "global_step": 31597, "epoch": 188} {"train_loss": -7.376468181610107, "global_step": 31598, "epoch": 188} {"train_loss": -7.635452747344971, "global_step": 31599, "epoch": 188} {"train_loss": -7.595792770385742, "global_step": 31600, "epoch": 188} {"train_loss": -7.67896842956543, "global_step": 31601, "epoch": 188} {"train_loss": -7.62626314163208, "global_step": 31602, "epoch": 188} {"train_loss": -7.530742168426514, "global_step": 31603, "epoch": 188} {"train_loss": -7.648055076599121, "global_step": 31604, "epoch": 188} {"train_loss": -7.599058151245117, "global_step": 31605, "epoch": 188} {"train_loss": -7.542712211608887, "global_step": 31606, "epoch": 188} {"train_loss": -7.502833366394043, "global_step": 31607, "epoch": 188} {"train_loss": -7.347743034362793, "global_step": 31608, "epoch": 188} {"train_loss": -7.519404411315918, "global_step": 31609, "epoch": 188} {"train_loss": -7.90354061126709, "global_step": 31610, "epoch": 188} {"train_loss": -7.6345720291137695, "global_step": 31611, "epoch": 188} {"train_loss": -7.625166893005371, "global_step": 31612, "epoch": 188} {"train_loss": -7.756166458129883, "global_step": 31613, "epoch": 188} {"train_loss": -7.58232307434082, "global_step": 31614, "epoch": 188} {"train_loss": -7.716711044311523, "global_step": 31615, "epoch": 188} {"train_loss": -7.701992511749268, "global_step": 31616, "epoch": 188} {"train_loss": -7.295052528381348, "global_step": 31617, "epoch": 188} {"train_loss": -7.618697643280029, "global_step": 31618, "epoch": 188} {"train_loss": -7.380582332611084, "global_step": 31619, "epoch": 188} {"train_loss": -7.4913787841796875, "global_step": 31620, "epoch": 188} {"train_loss": -6.956511497497559, "global_step": 31621, "epoch": 188} {"train_loss": -7.426758289337158, "global_step": 31622, "epoch": 188} {"train_loss": -7.4905524253845215, "global_step": 31623, "epoch": 188} {"train_loss": -7.010469436645508, "global_step": 31624, "epoch": 188} {"train_loss": -7.505660057067871, "global_step": 31625, "epoch": 188} {"train_loss": -7.47463321685791, "global_step": 31626, "epoch": 188} {"train_loss": -7.228721618652344, "global_step": 31627, "epoch": 188} {"train_loss": -7.3629961013793945, "global_step": 31628, "epoch": 188} {"train_loss": -7.375182151794434, "global_step": 31629, "epoch": 188} {"train_loss": -7.219878196716309, "global_step": 31630, "epoch": 188} {"train_loss": -7.555506706237793, "global_step": 31631, "epoch": 188} {"train_loss": -7.415310859680176, "global_step": 31632, "epoch": 188} {"train_loss": -7.242894172668457, "global_step": 31633, "epoch": 188} {"train_loss": -7.418334007263184, "global_step": 31634, "epoch": 188} {"train_loss": -7.284049987792969, "global_step": 31635, "epoch": 188} {"train_loss": -7.562098979949951, "global_step": 31636, "epoch": 188} {"train_loss": -7.3794941902160645, "global_step": 31637, "epoch": 188} {"train_loss": -7.419516086578369, "global_step": 31638, "epoch": 188} {"train_loss": -7.459556579589844, "global_step": 31639, "epoch": 188} {"train_loss": -7.532791614532471, "global_step": 31640, "epoch": 188} {"train_loss": -7.582270622253418, "global_step": 31641, "epoch": 188} {"train_loss": -7.59058952331543, "global_step": 31642, "epoch": 188} {"train_loss": -7.5587158203125, "global_step": 31643, "epoch": 188} {"train_loss": -7.476687431335449, "global_step": 31644, "epoch": 188} {"train_loss": -7.644531726837158, "global_step": 31645, "epoch": 188} {"train_loss": -7.608997344970703, "global_step": 31646, "epoch": 188} {"train_loss": -7.542247772216797, "global_step": 31647, "epoch": 188} {"train_loss": -7.7587432861328125, "global_step": 31648, "epoch": 188} {"train_loss": -7.614253520965576, "global_step": 31649, "epoch": 188} {"train_loss": -7.313113212585449, "global_step": 31650, "epoch": 188} {"train_loss": -7.559156894683838, "global_step": 31651, "epoch": 188} {"train_loss": -7.647002220153809, "global_step": 31652, "epoch": 188} {"train_loss": -7.588052749633789, "global_step": 31653, "epoch": 188} {"train_loss": -7.607420444488525, "global_step": 31654, "epoch": 188} {"train_loss": -7.673008441925049, "global_step": 31655, "epoch": 188} {"train_loss": -7.769890308380127, "global_step": 31656, "epoch": 188} {"train_loss": -7.496908187866211, "global_step": 31657, "epoch": 188} {"train_loss": -7.388741493225098, "global_step": 31658, "epoch": 188} {"train_loss": -7.514355659484863, "global_step": 31659, "epoch": 188} {"train_loss": -7.719570159912109, "global_step": 31660, "epoch": 188} {"train_loss": -7.785900115966797, "global_step": 31661, "epoch": 188} {"train_loss": -7.739992141723633, "global_step": 31662, "epoch": 188} {"train_loss": -7.355669975280762, "global_step": 31663, "epoch": 188} {"train_loss": -7.590712070465088, "global_step": 31664, "epoch": 188} {"train_loss": -7.468878746032715, "global_step": 31665, "epoch": 188} {"train_loss": -7.665876388549805, "global_step": 31666, "epoch": 188} {"train_loss": -7.41038703918457, "global_step": 31667, "epoch": 188} {"train_loss": -7.4778008460998535, "global_step": 31668, "epoch": 188} {"train_loss": -7.656864643096924, "global_step": 31669, "epoch": 188} {"train_loss": -7.4951982498168945, "global_step": 31670, "epoch": 188} {"train_loss": -7.4906415939331055, "global_step": 31671, "epoch": 188} {"train_loss": -7.590917587280273, "global_step": 31672, "epoch": 188} {"train_loss": -7.518056869506836, "global_step": 31673, "epoch": 188} {"train_loss": -7.476517677307129, "global_step": 31674, "epoch": 188} {"train_loss": -7.376230239868164, "global_step": 31675, "epoch": 188} {"train_loss": -7.553678512573242, "global_step": 31676, "epoch": 188} {"train_loss": -7.731568336486816, "global_step": 31677, "epoch": 188} {"train_loss": -7.473910331726074, "global_step": 31678, "epoch": 188} {"train_loss": -7.571203231811523, "global_step": 31679, "epoch": 188} {"train_loss": -7.250216007232666, "global_step": 31680, "epoch": 188} {"train_loss": -7.5053606033325195, "global_step": 31681, "epoch": 188} {"train_loss": -7.309771537780762, "global_step": 31682, "epoch": 188} {"train_loss": -7.531757831573486, "global_step": 31683, "epoch": 188} {"train_loss": -7.479134559631348, "global_step": 31684, "epoch": 188} {"train_loss": -7.587224006652832, "global_step": 31685, "epoch": 188} {"train_loss": -7.617453575134277, "global_step": 31686, "epoch": 188} {"train_loss": -7.608198165893555, "global_step": 31687, "epoch": 188} {"train_loss": -7.478090763092041, "global_step": 31688, "epoch": 188} {"train_loss": -7.571277618408203, "global_step": 31689, "epoch": 188} {"train_loss": -7.226504325866699, "global_step": 31690, "epoch": 188} {"train_loss": -7.539977550506592, "global_step": 31691, "epoch": 188} {"train_loss": -7.625163555145264, "global_step": 31692, "epoch": 188} {"train_loss": -7.586877346038818, "global_step": 31693, "epoch": 188} {"train_loss": -7.3854570388793945, "global_step": 31694, "epoch": 188} {"train_loss": -7.72441291809082, "global_step": 31695, "epoch": 188} {"train_loss": -7.617427349090576, "global_step": 31696, "epoch": 188} {"train_loss": -7.769468307495117, "global_step": 31697, "epoch": 188} {"train_loss": -7.571404457092285, "global_step": 31698, "epoch": 188} {"train_loss": -7.606955051422119, "global_step": 31699, "epoch": 188} {"train_loss": -7.651540756225586, "global_step": 31700, "epoch": 188} {"train_loss": -7.735738754272461, "global_step": 31701, "epoch": 188} {"train_loss": -7.631951332092285, "global_step": 31702, "epoch": 188} {"train_loss": -7.48193883895874, "global_step": 31703, "epoch": 188} {"train_loss": -7.5142951011657715, "global_step": 31704, "epoch": 188} {"train_loss": -6.9649858474731445, "global_step": 31705, "epoch": 188} {"train_loss": -7.525698661804199, "global_step": 31706, "epoch": 188} {"train_loss": -7.078474998474121, "global_step": 31707, "epoch": 188} {"train_loss": -7.4066009521484375, "global_step": 31708, "epoch": 188} {"train_loss": -7.408483505249023, "global_step": 31709, "epoch": 188} {"train_loss": -7.5623884201049805, "global_step": 31710, "epoch": 188} {"train_loss": -7.627355098724365, "global_step": 31711, "epoch": 188} {"train_loss": -7.4632673263549805, "global_step": 31712, "epoch": 188} {"train_loss": -7.608588695526123, "global_step": 31713, "epoch": 188} {"train_loss": -7.551457405090332, "global_step": 31714, "epoch": 188} {"train_loss": -7.200933456420898, "global_step": 31715, "epoch": 188} {"train_loss": -7.465458869934082, "global_step": 31716, "epoch": 188} {"train_loss": -7.6785736083984375, "global_step": 31717, "epoch": 188} {"train_loss": -7.493393898010254, "global_step": 31718, "epoch": 188} {"train_loss": -7.514781951904297, "global_step": 31719, "epoch": 188} {"train_loss": -7.367481231689453, "global_step": 31720, "epoch": 188} {"train_loss": -7.650424957275391, "global_step": 31721, "epoch": 188} {"train_loss": -7.4295806884765625, "global_step": 31722, "epoch": 188} {"train_loss": -7.401474952697754, "global_step": 31723, "epoch": 188} {"train_loss": -7.222424507141113, "global_step": 31724, "epoch": 188} {"train_loss": -7.524010181427002, "global_step": 31725, "epoch": 188} {"train_loss": -7.491641044616699, "global_step": 31726, "epoch": 188} {"train_loss": -7.409087657928467, "global_step": 31727, "epoch": 188} {"train_loss": -7.716795921325684, "global_step": 31728, "epoch": 188} {"train_loss": -7.3667521476745605, "global_step": 31729, "epoch": 188} {"train_loss": -7.653809547424316, "global_step": 31730, "epoch": 188} {"train_loss": -7.564922332763672, "global_step": 31731, "epoch": 188} {"train_loss": -7.519141674041748, "global_step": 31732, "epoch": 188} {"train_loss": -7.6133599281311035, "global_step": 31733, "epoch": 188} {"train_loss": -7.567657470703125, "global_step": 31734, "epoch": 188} {"train_loss": -7.6843719482421875, "global_step": 31735, "epoch": 188} {"train_loss": -7.436315536499023, "global_step": 31736, "epoch": 188} {"train_loss": -7.5484795570373535, "global_step": 31737, "epoch": 188} {"train_loss": -7.613205432891846, "global_step": 31738, "epoch": 188} {"train_loss": -7.876483917236328, "global_step": 31739, "epoch": 188} {"train_loss": -7.709453582763672, "global_step": 31740, "epoch": 188} {"train_loss": -7.288107872009277, "global_step": 31741, "epoch": 188} {"train_loss": -7.446927547454834, "global_step": 31742, "epoch": 188} {"train_loss": -7.576342582702637, "global_step": 31743, "epoch": 188} {"train_loss": -7.467729568481445, "global_step": 31744, "epoch": 188} {"train_loss": -7.570962905883789, "global_step": 31745, "epoch": 188} {"train_loss": -7.242434501647949, "global_step": 31746, "epoch": 188} {"train_loss": -7.520450592041016, "global_step": 31747, "epoch": 188} {"train_loss": -7.420708656311035, "global_step": 31748, "epoch": 188} {"train_loss": -7.4095072746276855, "global_step": 31749, "epoch": 188} {"train_loss": -7.6607584953308105, "global_step": 31750, "epoch": 188} {"train_loss": -7.512526353200276, "global_step": 31751, "epoch": 188, "val_loss": 187484.515625} {"train_loss": -7.448194980621338, "global_step": 31752, "epoch": 189} {"train_loss": -7.561862945556641, "global_step": 31753, "epoch": 189} {"train_loss": -7.245337963104248, "global_step": 31754, "epoch": 189} {"train_loss": -7.519046783447266, "global_step": 31755, "epoch": 189} {"train_loss": -7.439803600311279, "global_step": 31756, "epoch": 189} {"train_loss": -7.741053581237793, "global_step": 31757, "epoch": 189} {"train_loss": -7.493283271789551, "global_step": 31758, "epoch": 189} {"train_loss": -7.444145202636719, "global_step": 31759, "epoch": 189} {"train_loss": -7.471957683563232, "global_step": 31760, "epoch": 189} {"train_loss": -7.329776763916016, "global_step": 31761, "epoch": 189} {"train_loss": -7.506535530090332, "global_step": 31762, "epoch": 189} {"train_loss": -7.544681549072266, "global_step": 31763, "epoch": 189} {"train_loss": -7.6397552490234375, "global_step": 31764, "epoch": 189} {"train_loss": -7.613544464111328, "global_step": 31765, "epoch": 189} {"train_loss": -7.668079376220703, "global_step": 31766, "epoch": 189} {"train_loss": -7.59528923034668, "global_step": 31767, "epoch": 189} {"train_loss": -7.371789932250977, "global_step": 31768, "epoch": 189} {"train_loss": -7.412373065948486, "global_step": 31769, "epoch": 189} {"train_loss": -7.630552291870117, "global_step": 31770, "epoch": 189} {"train_loss": -7.685475826263428, "global_step": 31771, "epoch": 189} {"train_loss": -7.654693603515625, "global_step": 31772, "epoch": 189} {"train_loss": -7.366542816162109, "global_step": 31773, "epoch": 189} {"train_loss": -7.77021598815918, "global_step": 31774, "epoch": 189} {"train_loss": -7.348902702331543, "global_step": 31775, "epoch": 189} {"train_loss": -7.629299163818359, "global_step": 31776, "epoch": 189} {"train_loss": -7.407407283782959, "global_step": 31777, "epoch": 189} {"train_loss": -7.514535903930664, "global_step": 31778, "epoch": 189} {"train_loss": -7.701776504516602, "global_step": 31779, "epoch": 189} {"train_loss": -7.4827880859375, "global_step": 31780, "epoch": 189} {"train_loss": -7.529707908630371, "global_step": 31781, "epoch": 189} {"train_loss": -7.566032886505127, "global_step": 31782, "epoch": 189} {"train_loss": -7.711688995361328, "global_step": 31783, "epoch": 189} {"train_loss": -7.259373664855957, "global_step": 31784, "epoch": 189} {"train_loss": -7.409923076629639, "global_step": 31785, "epoch": 189} {"train_loss": -7.436306476593018, "global_step": 31786, "epoch": 189} {"train_loss": -7.670811653137207, "global_step": 31787, "epoch": 189} {"train_loss": -7.574526786804199, "global_step": 31788, "epoch": 189} {"train_loss": -7.70781135559082, "global_step": 31789, "epoch": 189} {"train_loss": -7.511411190032959, "global_step": 31790, "epoch": 189} {"train_loss": -7.549548625946045, "global_step": 31791, "epoch": 189} {"train_loss": -7.5913262367248535, "global_step": 31792, "epoch": 189} {"train_loss": -7.67756462097168, "global_step": 31793, "epoch": 189} {"train_loss": -7.657290458679199, "global_step": 31794, "epoch": 189} {"train_loss": -7.772733211517334, "global_step": 31795, "epoch": 189} {"train_loss": -7.46297550201416, "global_step": 31796, "epoch": 189} {"train_loss": -7.669765472412109, "global_step": 31797, "epoch": 189} {"train_loss": -7.712345600128174, "global_step": 31798, "epoch": 189} {"train_loss": -7.707768440246582, "global_step": 31799, "epoch": 189} {"train_loss": -7.693042755126953, "global_step": 31800, "epoch": 189} {"train_loss": -7.7476277351379395, "global_step": 31801, "epoch": 189} {"train_loss": -7.491070747375488, "global_step": 31802, "epoch": 189} {"train_loss": -7.554091453552246, "global_step": 31803, "epoch": 189} {"train_loss": -7.6867356300354, "global_step": 31804, "epoch": 189} {"train_loss": -7.5732102394104, "global_step": 31805, "epoch": 189} {"train_loss": -7.640929222106934, "global_step": 31806, "epoch": 189} {"train_loss": -7.565225601196289, "global_step": 31807, "epoch": 189} {"train_loss": -7.623574256896973, "global_step": 31808, "epoch": 189} {"train_loss": -7.619270324707031, "global_step": 31809, "epoch": 189} {"train_loss": -7.492103099822998, "global_step": 31810, "epoch": 189} {"train_loss": -7.677879333496094, "global_step": 31811, "epoch": 189} {"train_loss": -7.599364757537842, "global_step": 31812, "epoch": 189} {"train_loss": -7.706339359283447, "global_step": 31813, "epoch": 189} {"train_loss": -7.5962066650390625, "global_step": 31814, "epoch": 189} {"train_loss": -7.753767967224121, "global_step": 31815, "epoch": 189} {"train_loss": -7.581825256347656, "global_step": 31816, "epoch": 189} {"train_loss": -7.605746269226074, "global_step": 31817, "epoch": 189} {"train_loss": -7.436046123504639, "global_step": 31818, "epoch": 189} {"train_loss": -7.782981872558594, "global_step": 31819, "epoch": 189} {"train_loss": -7.374852180480957, "global_step": 31820, "epoch": 189} {"train_loss": -7.725790977478027, "global_step": 31821, "epoch": 189} {"train_loss": -7.400821685791016, "global_step": 31822, "epoch": 189} {"train_loss": -7.373025417327881, "global_step": 31823, "epoch": 189} {"train_loss": -7.492351055145264, "global_step": 31824, "epoch": 189} {"train_loss": -7.606378078460693, "global_step": 31825, "epoch": 189} {"train_loss": -7.447816371917725, "global_step": 31826, "epoch": 189} {"train_loss": -7.762146949768066, "global_step": 31827, "epoch": 189} {"train_loss": -7.58206033706665, "global_step": 31828, "epoch": 189} {"train_loss": -7.670654773712158, "global_step": 31829, "epoch": 189} {"train_loss": -7.520530700683594, "global_step": 31830, "epoch": 189} {"train_loss": -7.5606608390808105, "global_step": 31831, "epoch": 189} {"train_loss": -7.428023338317871, "global_step": 31832, "epoch": 189} {"train_loss": -7.602381229400635, "global_step": 31833, "epoch": 189} {"train_loss": -7.850480079650879, "global_step": 31834, "epoch": 189} {"train_loss": -7.3817338943481445, "global_step": 31835, "epoch": 189} {"train_loss": -7.743685722351074, "global_step": 31836, "epoch": 189} {"train_loss": -7.405513763427734, "global_step": 31837, "epoch": 189} {"train_loss": -7.717353820800781, "global_step": 31838, "epoch": 189} {"train_loss": -7.382731914520264, "global_step": 31839, "epoch": 189} {"train_loss": -7.686236381530762, "global_step": 31840, "epoch": 189} {"train_loss": -7.549441337585449, "global_step": 31841, "epoch": 189} {"train_loss": -7.466470718383789, "global_step": 31842, "epoch": 189} {"train_loss": -7.499661922454834, "global_step": 31843, "epoch": 189} {"train_loss": -7.461637020111084, "global_step": 31844, "epoch": 189} {"train_loss": -7.672369956970215, "global_step": 31845, "epoch": 189} {"train_loss": -7.527170181274414, "global_step": 31846, "epoch": 189} {"train_loss": -7.464217662811279, "global_step": 31847, "epoch": 189} {"train_loss": -7.135645389556885, "global_step": 31848, "epoch": 189} {"train_loss": -7.519665241241455, "global_step": 31849, "epoch": 189} {"train_loss": -7.490152835845947, "global_step": 31850, "epoch": 189} {"train_loss": -7.11663818359375, "global_step": 31851, "epoch": 189} {"train_loss": -7.217546463012695, "global_step": 31852, "epoch": 189} {"train_loss": -6.932126045227051, "global_step": 31853, "epoch": 189} {"train_loss": -7.245866298675537, "global_step": 31854, "epoch": 189} {"train_loss": -7.153481483459473, "global_step": 31855, "epoch": 189} {"train_loss": -7.264651775360107, "global_step": 31856, "epoch": 189} {"train_loss": -7.458324432373047, "global_step": 31857, "epoch": 189} {"train_loss": -7.402988433837891, "global_step": 31858, "epoch": 189} {"train_loss": -7.32805061340332, "global_step": 31859, "epoch": 189} {"train_loss": -7.342957973480225, "global_step": 31860, "epoch": 189} {"train_loss": -7.314319610595703, "global_step": 31861, "epoch": 189} {"train_loss": -7.316650390625, "global_step": 31862, "epoch": 189} {"train_loss": -7.377926349639893, "global_step": 31863, "epoch": 189} {"train_loss": -7.426965713500977, "global_step": 31864, "epoch": 189} {"train_loss": -7.585659027099609, "global_step": 31865, "epoch": 189} {"train_loss": -7.415694713592529, "global_step": 31866, "epoch": 189} {"train_loss": -7.45497989654541, "global_step": 31867, "epoch": 189} {"train_loss": -7.613900661468506, "global_step": 31868, "epoch": 189} {"train_loss": -7.560791492462158, "global_step": 31869, "epoch": 189} {"train_loss": -7.435290813446045, "global_step": 31870, "epoch": 189} {"train_loss": -7.465277671813965, "global_step": 31871, "epoch": 189} {"train_loss": -7.504438400268555, "global_step": 31872, "epoch": 189} {"train_loss": -7.794095516204834, "global_step": 31873, "epoch": 189} {"train_loss": -7.632176876068115, "global_step": 31874, "epoch": 189} {"train_loss": -7.670494079589844, "global_step": 31875, "epoch": 189} {"train_loss": -7.645064353942871, "global_step": 31876, "epoch": 189} {"train_loss": -7.509936809539795, "global_step": 31877, "epoch": 189} {"train_loss": -7.382754325866699, "global_step": 31878, "epoch": 189} {"train_loss": -7.710541725158691, "global_step": 31879, "epoch": 189} {"train_loss": -7.583558082580566, "global_step": 31880, "epoch": 189} {"train_loss": -7.775518417358398, "global_step": 31881, "epoch": 189} {"train_loss": -7.7511725425720215, "global_step": 31882, "epoch": 189} {"train_loss": -7.697881698608398, "global_step": 31883, "epoch": 189} {"train_loss": -7.385982513427734, "global_step": 31884, "epoch": 189} {"train_loss": -7.8044538497924805, "global_step": 31885, "epoch": 189} {"train_loss": -7.773812770843506, "global_step": 31886, "epoch": 189} {"train_loss": -7.875680923461914, "global_step": 31887, "epoch": 189} {"train_loss": -7.735964775085449, "global_step": 31888, "epoch": 189} {"train_loss": -7.674991607666016, "global_step": 31889, "epoch": 189} {"train_loss": -7.499805450439453, "global_step": 31890, "epoch": 189} {"train_loss": -7.544761657714844, "global_step": 31891, "epoch": 189} {"train_loss": -7.508604526519775, "global_step": 31892, "epoch": 189} {"train_loss": -7.631547451019287, "global_step": 31893, "epoch": 189} {"train_loss": -7.164661407470703, "global_step": 31894, "epoch": 189} {"train_loss": -7.343788146972656, "global_step": 31895, "epoch": 189} {"train_loss": -7.523698806762695, "global_step": 31896, "epoch": 189} {"train_loss": -7.171058654785156, "global_step": 31897, "epoch": 189} {"train_loss": -7.328965187072754, "global_step": 31898, "epoch": 189} {"train_loss": -7.401218414306641, "global_step": 31899, "epoch": 189} {"train_loss": -7.217767715454102, "global_step": 31900, "epoch": 189} {"train_loss": -7.245108604431152, "global_step": 31901, "epoch": 189} {"train_loss": -7.555662155151367, "global_step": 31902, "epoch": 189} {"train_loss": -7.614660263061523, "global_step": 31903, "epoch": 189} {"train_loss": -7.458975315093994, "global_step": 31904, "epoch": 189} {"train_loss": -7.462392330169678, "global_step": 31905, "epoch": 189} {"train_loss": -7.530693054199219, "global_step": 31906, "epoch": 189} {"train_loss": -7.577630996704102, "global_step": 31907, "epoch": 189} {"train_loss": -7.4171528816223145, "global_step": 31908, "epoch": 189} {"train_loss": -7.51995325088501, "global_step": 31909, "epoch": 189} {"train_loss": -7.5272111892700195, "global_step": 31910, "epoch": 189} {"train_loss": -7.764797210693359, "global_step": 31911, "epoch": 189} {"train_loss": -7.416680812835693, "global_step": 31912, "epoch": 189} {"train_loss": -7.512384414672852, "global_step": 31913, "epoch": 189} {"train_loss": -7.641322135925293, "global_step": 31914, "epoch": 189} {"train_loss": -7.714976787567139, "global_step": 31915, "epoch": 189} {"train_loss": -7.47797966003418, "global_step": 31916, "epoch": 189} {"train_loss": -7.596104145050049, "global_step": 31917, "epoch": 189} {"train_loss": -7.6729631423950195, "global_step": 31918, "epoch": 189} {"train_loss": -7.532795715899694, "global_step": 31919, "epoch": 189, "val_loss": 188543.140625} {"train_loss": -7.489182472229004, "global_step": 31920, "epoch": 190} {"train_loss": -7.555655479431152, "global_step": 31921, "epoch": 190} {"train_loss": -7.650100231170654, "global_step": 31922, "epoch": 190} {"train_loss": -7.474802017211914, "global_step": 31923, "epoch": 190} {"train_loss": -7.383330345153809, "global_step": 31924, "epoch": 190} {"train_loss": -7.353976249694824, "global_step": 31925, "epoch": 190} {"train_loss": -7.641873359680176, "global_step": 31926, "epoch": 190} {"train_loss": -7.347873687744141, "global_step": 31927, "epoch": 190} {"train_loss": -7.792564392089844, "global_step": 31928, "epoch": 190} {"train_loss": -7.6887102127075195, "global_step": 31929, "epoch": 190} {"train_loss": -7.3226728439331055, "global_step": 31930, "epoch": 190} {"train_loss": -7.786728858947754, "global_step": 31931, "epoch": 190} {"train_loss": -7.6787638664245605, "global_step": 31932, "epoch": 190} {"train_loss": -7.427132606506348, "global_step": 31933, "epoch": 190} {"train_loss": -7.5432000160217285, "global_step": 31934, "epoch": 190} {"train_loss": -7.546089172363281, "global_step": 31935, "epoch": 190} {"train_loss": -7.37824821472168, "global_step": 31936, "epoch": 190} {"train_loss": -7.674083709716797, "global_step": 31937, "epoch": 190} {"train_loss": -7.471066951751709, "global_step": 31938, "epoch": 190} {"train_loss": -7.437109470367432, "global_step": 31939, "epoch": 190} {"train_loss": -7.432798385620117, "global_step": 31940, "epoch": 190} {"train_loss": -7.688371658325195, "global_step": 31941, "epoch": 190} {"train_loss": -7.482924461364746, "global_step": 31942, "epoch": 190} {"train_loss": -7.763876914978027, "global_step": 31943, "epoch": 190} {"train_loss": -7.359074592590332, "global_step": 31944, "epoch": 190} {"train_loss": -7.546966075897217, "global_step": 31945, "epoch": 190} {"train_loss": -7.508371829986572, "global_step": 31946, "epoch": 190} {"train_loss": -7.737624168395996, "global_step": 31947, "epoch": 190} {"train_loss": -7.278039932250977, "global_step": 31948, "epoch": 190} {"train_loss": -7.545145034790039, "global_step": 31949, "epoch": 190} {"train_loss": -7.558324337005615, "global_step": 31950, "epoch": 190} {"train_loss": -7.658307075500488, "global_step": 31951, "epoch": 190} {"train_loss": -7.659842491149902, "global_step": 31952, "epoch": 190} {"train_loss": -7.51893424987793, "global_step": 31953, "epoch": 190} {"train_loss": -7.737813472747803, "global_step": 31954, "epoch": 190} {"train_loss": -7.632500171661377, "global_step": 31955, "epoch": 190} {"train_loss": -7.600184440612793, "global_step": 31956, "epoch": 190} {"train_loss": -7.684318542480469, "global_step": 31957, "epoch": 190} {"train_loss": -7.469498634338379, "global_step": 31958, "epoch": 190} {"train_loss": -7.576233386993408, "global_step": 31959, "epoch": 190} {"train_loss": -7.542601585388184, "global_step": 31960, "epoch": 190} {"train_loss": -7.541679382324219, "global_step": 31961, "epoch": 190} {"train_loss": -7.90122127532959, "global_step": 31962, "epoch": 190} {"train_loss": -7.429820537567139, "global_step": 31963, "epoch": 190} {"train_loss": -7.691937446594238, "global_step": 31964, "epoch": 190} {"train_loss": -7.60440731048584, "global_step": 31965, "epoch": 190} {"train_loss": -7.564420700073242, "global_step": 31966, "epoch": 190} {"train_loss": -7.76097297668457, "global_step": 31967, "epoch": 190} {"train_loss": -7.566689491271973, "global_step": 31968, "epoch": 190} {"train_loss": -7.778281211853027, "global_step": 31969, "epoch": 190} {"train_loss": -7.675173282623291, "global_step": 31970, "epoch": 190} {"train_loss": -7.585102081298828, "global_step": 31971, "epoch": 190} {"train_loss": -7.530792236328125, "global_step": 31972, "epoch": 190} {"train_loss": -7.664080619812012, "global_step": 31973, "epoch": 190} {"train_loss": -7.592000484466553, "global_step": 31974, "epoch": 190} {"train_loss": -7.697275161743164, "global_step": 31975, "epoch": 190} {"train_loss": -7.710567474365234, "global_step": 31976, "epoch": 190} {"train_loss": -7.661794185638428, "global_step": 31977, "epoch": 190} {"train_loss": -7.66874885559082, "global_step": 31978, "epoch": 190} {"train_loss": -7.612796783447266, "global_step": 31979, "epoch": 190} {"train_loss": -7.556540012359619, "global_step": 31980, "epoch": 190} {"train_loss": -7.511987686157227, "global_step": 31981, "epoch": 190} {"train_loss": -7.4332170486450195, "global_step": 31982, "epoch": 190} {"train_loss": -7.567725658416748, "global_step": 31983, "epoch": 190} {"train_loss": -7.628929138183594, "global_step": 31984, "epoch": 190} {"train_loss": -7.567965984344482, "global_step": 31985, "epoch": 190} {"train_loss": -7.760669708251953, "global_step": 31986, "epoch": 190} {"train_loss": -7.666609764099121, "global_step": 31987, "epoch": 190} {"train_loss": -7.645974159240723, "global_step": 31988, "epoch": 190} {"train_loss": -7.367337226867676, "global_step": 31989, "epoch": 190} {"train_loss": -7.811919212341309, "global_step": 31990, "epoch": 190} {"train_loss": -7.281386852264404, "global_step": 31991, "epoch": 190} {"train_loss": -7.751363754272461, "global_step": 31992, "epoch": 190} {"train_loss": -7.577966690063477, "global_step": 31993, "epoch": 190} {"train_loss": -7.279490947723389, "global_step": 31994, "epoch": 190} {"train_loss": -7.407172203063965, "global_step": 31995, "epoch": 190} {"train_loss": -7.5580244064331055, "global_step": 31996, "epoch": 190} {"train_loss": -7.494173049926758, "global_step": 31997, "epoch": 190} {"train_loss": -7.57041597366333, "global_step": 31998, "epoch": 190} {"train_loss": -7.593870162963867, "global_step": 31999, "epoch": 190} {"train_loss": -7.494244575500488, "global_step": 32000, "epoch": 190} {"train_loss": -7.534761428833008, "global_step": 32001, "epoch": 190} {"train_loss": -7.504036903381348, "global_step": 32002, "epoch": 190} {"train_loss": -7.730461120605469, "global_step": 32003, "epoch": 190} {"train_loss": -7.669068336486816, "global_step": 32004, "epoch": 190} {"train_loss": -7.756598472595215, "global_step": 32005, "epoch": 190} {"train_loss": -7.575217247009277, "global_step": 32006, "epoch": 190} {"train_loss": -7.461893081665039, "global_step": 32007, "epoch": 190} {"train_loss": -7.7491559982299805, "global_step": 32008, "epoch": 190} {"train_loss": -7.504055023193359, "global_step": 32009, "epoch": 190} {"train_loss": -7.76542854309082, "global_step": 32010, "epoch": 190} {"train_loss": -7.617328643798828, "global_step": 32011, "epoch": 190} {"train_loss": -7.613931655883789, "global_step": 32012, "epoch": 190} {"train_loss": -7.688802719116211, "global_step": 32013, "epoch": 190} {"train_loss": -7.334290504455566, "global_step": 32014, "epoch": 190} {"train_loss": -7.243645668029785, "global_step": 32015, "epoch": 190} {"train_loss": -7.3369951248168945, "global_step": 32016, "epoch": 190} {"train_loss": -7.516970634460449, "global_step": 32017, "epoch": 190} {"train_loss": -7.365434169769287, "global_step": 32018, "epoch": 190} {"train_loss": -7.522904396057129, "global_step": 32019, "epoch": 190} {"train_loss": -7.484400272369385, "global_step": 32020, "epoch": 190} {"train_loss": -7.500889301300049, "global_step": 32021, "epoch": 190} {"train_loss": -7.399365425109863, "global_step": 32022, "epoch": 190} {"train_loss": -7.587789535522461, "global_step": 32023, "epoch": 190} {"train_loss": -7.642617225646973, "global_step": 32024, "epoch": 190} {"train_loss": -7.484061241149902, "global_step": 32025, "epoch": 190} {"train_loss": -7.530330657958984, "global_step": 32026, "epoch": 190} {"train_loss": -7.378809928894043, "global_step": 32027, "epoch": 190} {"train_loss": -7.50250768661499, "global_step": 32028, "epoch": 190} {"train_loss": -7.455818176269531, "global_step": 32029, "epoch": 190} {"train_loss": -7.628922462463379, "global_step": 32030, "epoch": 190} {"train_loss": -7.551519393920898, "global_step": 32031, "epoch": 190} {"train_loss": -7.521522521972656, "global_step": 32032, "epoch": 190} {"train_loss": -7.475907325744629, "global_step": 32033, "epoch": 190} {"train_loss": -7.628159999847412, "global_step": 32034, "epoch": 190} {"train_loss": -7.732237339019775, "global_step": 32035, "epoch": 190} {"train_loss": -7.526987075805664, "global_step": 32036, "epoch": 190} {"train_loss": -7.313012599945068, "global_step": 32037, "epoch": 190} {"train_loss": -7.528441429138184, "global_step": 32038, "epoch": 190} {"train_loss": -7.849641799926758, "global_step": 32039, "epoch": 190} {"train_loss": -7.54931640625, "global_step": 32040, "epoch": 190} {"train_loss": -7.632293224334717, "global_step": 32041, "epoch": 190} {"train_loss": -7.577598571777344, "global_step": 32042, "epoch": 190} {"train_loss": -7.620637893676758, "global_step": 32043, "epoch": 190} {"train_loss": -7.799371719360352, "global_step": 32044, "epoch": 190} {"train_loss": -7.646561145782471, "global_step": 32045, "epoch": 190} {"train_loss": -7.587766647338867, "global_step": 32046, "epoch": 190} {"train_loss": -7.525053024291992, "global_step": 32047, "epoch": 190} {"train_loss": -7.655267715454102, "global_step": 32048, "epoch": 190} {"train_loss": -7.897635459899902, "global_step": 32049, "epoch": 190} {"train_loss": -7.50831937789917, "global_step": 32050, "epoch": 190} {"train_loss": -7.438018798828125, "global_step": 32051, "epoch": 190} {"train_loss": -7.94434928894043, "global_step": 32052, "epoch": 190} {"train_loss": -7.6460394859313965, "global_step": 32053, "epoch": 190} {"train_loss": -7.821308612823486, "global_step": 32054, "epoch": 190} {"train_loss": -7.285962104797363, "global_step": 32055, "epoch": 190} {"train_loss": -7.486693382263184, "global_step": 32056, "epoch": 190} {"train_loss": -7.3802337646484375, "global_step": 32057, "epoch": 190} {"train_loss": -7.704000473022461, "global_step": 32058, "epoch": 190} {"train_loss": -7.698760032653809, "global_step": 32059, "epoch": 190} {"train_loss": -7.673669815063477, "global_step": 32060, "epoch": 190} {"train_loss": -7.477896690368652, "global_step": 32061, "epoch": 190} {"train_loss": -7.39901065826416, "global_step": 32062, "epoch": 190} {"train_loss": -7.750622749328613, "global_step": 32063, "epoch": 190} {"train_loss": -7.473772048950195, "global_step": 32064, "epoch": 190} {"train_loss": -7.709038734436035, "global_step": 32065, "epoch": 190} {"train_loss": -7.527714252471924, "global_step": 32066, "epoch": 190} {"train_loss": -7.466262340545654, "global_step": 32067, "epoch": 190} {"train_loss": -7.483188629150391, "global_step": 32068, "epoch": 190} {"train_loss": -7.459431171417236, "global_step": 32069, "epoch": 190} {"train_loss": -7.710559844970703, "global_step": 32070, "epoch": 190} {"train_loss": -7.852396011352539, "global_step": 32071, "epoch": 190} {"train_loss": -7.716623783111572, "global_step": 32072, "epoch": 190} {"train_loss": -7.588641166687012, "global_step": 32073, "epoch": 190} {"train_loss": -7.665076732635498, "global_step": 32074, "epoch": 190} {"train_loss": -7.757080078125, "global_step": 32075, "epoch": 190} {"train_loss": -7.621791839599609, "global_step": 32076, "epoch": 190} {"train_loss": -7.676517009735107, "global_step": 32077, "epoch": 190} {"train_loss": -7.567980766296387, "global_step": 32078, "epoch": 190} {"train_loss": -7.768392562866211, "global_step": 32079, "epoch": 190} {"train_loss": -7.557291507720947, "global_step": 32080, "epoch": 190} {"train_loss": -7.532112121582031, "global_step": 32081, "epoch": 190} {"train_loss": -7.79580545425415, "global_step": 32082, "epoch": 190} {"train_loss": -7.60886287689209, "global_step": 32083, "epoch": 190} {"train_loss": -7.65980339050293, "global_step": 32084, "epoch": 190} {"train_loss": -7.712301254272461, "global_step": 32085, "epoch": 190} {"train_loss": -7.64339542388916, "global_step": 32086, "epoch": 190} {"train_loss": -7.579766631126404, "global_step": 32087, "epoch": 190, "val_loss": 187913.3125, "train_action_mse_error": 12.631060600280762} {"train_loss": -7.831527233123779, "global_step": 32088, "epoch": 191} {"train_loss": -7.543510437011719, "global_step": 32089, "epoch": 191} {"train_loss": -7.639487266540527, "global_step": 32090, "epoch": 191} {"train_loss": -7.6006855964660645, "global_step": 32091, "epoch": 191} {"train_loss": -7.86805534362793, "global_step": 32092, "epoch": 191} {"train_loss": -7.548997402191162, "global_step": 32093, "epoch": 191} {"train_loss": -7.575971603393555, "global_step": 32094, "epoch": 191} {"train_loss": -7.667850494384766, "global_step": 32095, "epoch": 191} {"train_loss": -7.590525150299072, "global_step": 32096, "epoch": 191} {"train_loss": -7.739811420440674, "global_step": 32097, "epoch": 191} {"train_loss": -7.7673516273498535, "global_step": 32098, "epoch": 191} {"train_loss": -7.627096176147461, "global_step": 32099, "epoch": 191} {"train_loss": -7.855246543884277, "global_step": 32100, "epoch": 191} {"train_loss": -7.128708839416504, "global_step": 32101, "epoch": 191} {"train_loss": -7.659099102020264, "global_step": 32102, "epoch": 191} {"train_loss": -7.485039710998535, "global_step": 32103, "epoch": 191} {"train_loss": -7.717799663543701, "global_step": 32104, "epoch": 191} {"train_loss": -7.594580173492432, "global_step": 32105, "epoch": 191} {"train_loss": -7.750353813171387, "global_step": 32106, "epoch": 191} {"train_loss": -7.467231273651123, "global_step": 32107, "epoch": 191} {"train_loss": -7.739921569824219, "global_step": 32108, "epoch": 191} {"train_loss": -7.431146621704102, "global_step": 32109, "epoch": 191} {"train_loss": -7.645541191101074, "global_step": 32110, "epoch": 191} {"train_loss": -7.337332725524902, "global_step": 32111, "epoch": 191} {"train_loss": -7.644190788269043, "global_step": 32112, "epoch": 191} {"train_loss": -7.6325225830078125, "global_step": 32113, "epoch": 191} {"train_loss": -7.508459568023682, "global_step": 32114, "epoch": 191} {"train_loss": -7.661982536315918, "global_step": 32115, "epoch": 191} {"train_loss": -7.493756294250488, "global_step": 32116, "epoch": 191} {"train_loss": -7.582616806030273, "global_step": 32117, "epoch": 191} {"train_loss": -7.130695819854736, "global_step": 32118, "epoch": 191} {"train_loss": -7.450860977172852, "global_step": 32119, "epoch": 191} {"train_loss": -7.486354827880859, "global_step": 32120, "epoch": 191} {"train_loss": -7.669831275939941, "global_step": 32121, "epoch": 191} {"train_loss": -7.408463478088379, "global_step": 32122, "epoch": 191} {"train_loss": -7.738870620727539, "global_step": 32123, "epoch": 191} {"train_loss": -7.238966941833496, "global_step": 32124, "epoch": 191} {"train_loss": -7.716221809387207, "global_step": 32125, "epoch": 191} {"train_loss": -7.273540496826172, "global_step": 32126, "epoch": 191} {"train_loss": -7.585110664367676, "global_step": 32127, "epoch": 191} {"train_loss": -7.554812431335449, "global_step": 32128, "epoch": 191} {"train_loss": -7.375462532043457, "global_step": 32129, "epoch": 191} {"train_loss": -7.358076095581055, "global_step": 32130, "epoch": 191} {"train_loss": -7.714354515075684, "global_step": 32131, "epoch": 191} {"train_loss": -7.361301422119141, "global_step": 32132, "epoch": 191} {"train_loss": -7.26286506652832, "global_step": 32133, "epoch": 191} {"train_loss": -7.620880126953125, "global_step": 32134, "epoch": 191} {"train_loss": -7.700984954833984, "global_step": 32135, "epoch": 191} {"train_loss": -7.480317115783691, "global_step": 32136, "epoch": 191} {"train_loss": -7.395246982574463, "global_step": 32137, "epoch": 191} {"train_loss": -7.389410972595215, "global_step": 32138, "epoch": 191} {"train_loss": -7.481317520141602, "global_step": 32139, "epoch": 191} {"train_loss": -7.505843162536621, "global_step": 32140, "epoch": 191} {"train_loss": -7.563860893249512, "global_step": 32141, "epoch": 191} {"train_loss": -7.5255842208862305, "global_step": 32142, "epoch": 191} {"train_loss": -7.23930025100708, "global_step": 32143, "epoch": 191} {"train_loss": -7.605020999908447, "global_step": 32144, "epoch": 191} {"train_loss": -7.675528526306152, "global_step": 32145, "epoch": 191} {"train_loss": -7.592079162597656, "global_step": 32146, "epoch": 191} {"train_loss": -7.5951714515686035, "global_step": 32147, "epoch": 191} {"train_loss": -7.608798027038574, "global_step": 32148, "epoch": 191} {"train_loss": -7.479613780975342, "global_step": 32149, "epoch": 191} {"train_loss": -7.572373867034912, "global_step": 32150, "epoch": 191} {"train_loss": -7.415721893310547, "global_step": 32151, "epoch": 191} {"train_loss": -7.622251987457275, "global_step": 32152, "epoch": 191} {"train_loss": -7.579968452453613, "global_step": 32153, "epoch": 191} {"train_loss": -7.674742221832275, "global_step": 32154, "epoch": 191} {"train_loss": -7.628965377807617, "global_step": 32155, "epoch": 191} {"train_loss": -7.49746036529541, "global_step": 32156, "epoch": 191} {"train_loss": -7.606050491333008, "global_step": 32157, "epoch": 191} {"train_loss": -7.549572467803955, "global_step": 32158, "epoch": 191} {"train_loss": -7.5875244140625, "global_step": 32159, "epoch": 191} {"train_loss": -7.430292129516602, "global_step": 32160, "epoch": 191} {"train_loss": -7.740171432495117, "global_step": 32161, "epoch": 191} {"train_loss": -7.595369338989258, "global_step": 32162, "epoch": 191} {"train_loss": -7.72511100769043, "global_step": 32163, "epoch": 191} {"train_loss": -7.753911972045898, "global_step": 32164, "epoch": 191} {"train_loss": -7.660004615783691, "global_step": 32165, "epoch": 191} {"train_loss": -7.737051486968994, "global_step": 32166, "epoch": 191} {"train_loss": -7.461780548095703, "global_step": 32167, "epoch": 191} {"train_loss": -7.547871112823486, "global_step": 32168, "epoch": 191} {"train_loss": -7.67403507232666, "global_step": 32169, "epoch": 191} {"train_loss": -7.686483860015869, "global_step": 32170, "epoch": 191} {"train_loss": -7.515124320983887, "global_step": 32171, "epoch": 191} {"train_loss": -7.825863838195801, "global_step": 32172, "epoch": 191} {"train_loss": -7.606298923492432, "global_step": 32173, "epoch": 191} {"train_loss": -7.655578136444092, "global_step": 32174, "epoch": 191} {"train_loss": -7.782476425170898, "global_step": 32175, "epoch": 191} {"train_loss": -7.628923416137695, "global_step": 32176, "epoch": 191} {"train_loss": -7.670965194702148, "global_step": 32177, "epoch": 191} {"train_loss": -7.740346908569336, "global_step": 32178, "epoch": 191} {"train_loss": -7.569572448730469, "global_step": 32179, "epoch": 191} {"train_loss": -7.724952220916748, "global_step": 32180, "epoch": 191} {"train_loss": -7.821627140045166, "global_step": 32181, "epoch": 191} {"train_loss": -7.504737377166748, "global_step": 32182, "epoch": 191} {"train_loss": -7.318833827972412, "global_step": 32183, "epoch": 191} {"train_loss": -7.6337890625, "global_step": 32184, "epoch": 191} {"train_loss": -7.277245044708252, "global_step": 32185, "epoch": 191} {"train_loss": -7.686638832092285, "global_step": 32186, "epoch": 191} {"train_loss": -7.2202324867248535, "global_step": 32187, "epoch": 191} {"train_loss": -7.635442733764648, "global_step": 32188, "epoch": 191} {"train_loss": -7.337156295776367, "global_step": 32189, "epoch": 191} {"train_loss": -7.548382759094238, "global_step": 32190, "epoch": 191} {"train_loss": -7.408374786376953, "global_step": 32191, "epoch": 191} {"train_loss": -7.593928337097168, "global_step": 32192, "epoch": 191} {"train_loss": -7.601971626281738, "global_step": 32193, "epoch": 191} {"train_loss": -7.5244140625, "global_step": 32194, "epoch": 191} {"train_loss": -7.86840295791626, "global_step": 32195, "epoch": 191} {"train_loss": -7.54591178894043, "global_step": 32196, "epoch": 191} {"train_loss": -7.700461387634277, "global_step": 32197, "epoch": 191} {"train_loss": -7.658125877380371, "global_step": 32198, "epoch": 191} {"train_loss": -7.622100353240967, "global_step": 32199, "epoch": 191} {"train_loss": -7.676817417144775, "global_step": 32200, "epoch": 191} {"train_loss": -7.728745460510254, "global_step": 32201, "epoch": 191} {"train_loss": -7.709650039672852, "global_step": 32202, "epoch": 191} {"train_loss": -7.674987316131592, "global_step": 32203, "epoch": 191} {"train_loss": -7.673649787902832, "global_step": 32204, "epoch": 191} {"train_loss": -7.550601959228516, "global_step": 32205, "epoch": 191} {"train_loss": -7.474209308624268, "global_step": 32206, "epoch": 191} {"train_loss": -7.458713531494141, "global_step": 32207, "epoch": 191} {"train_loss": -7.306166172027588, "global_step": 32208, "epoch": 191} {"train_loss": -7.586583137512207, "global_step": 32209, "epoch": 191} {"train_loss": -7.147838592529297, "global_step": 32210, "epoch": 191} {"train_loss": -7.737468719482422, "global_step": 32211, "epoch": 191} {"train_loss": -7.165287971496582, "global_step": 32212, "epoch": 191} {"train_loss": -7.597355365753174, "global_step": 32213, "epoch": 191} {"train_loss": -7.480483055114746, "global_step": 32214, "epoch": 191} {"train_loss": -7.569720268249512, "global_step": 32215, "epoch": 191} {"train_loss": -7.758113861083984, "global_step": 32216, "epoch": 191} {"train_loss": -7.442421913146973, "global_step": 32217, "epoch": 191} {"train_loss": -7.726503849029541, "global_step": 32218, "epoch": 191} {"train_loss": -7.512276649475098, "global_step": 32219, "epoch": 191} {"train_loss": -7.680662155151367, "global_step": 32220, "epoch": 191} {"train_loss": -7.339974403381348, "global_step": 32221, "epoch": 191} {"train_loss": -7.443138122558594, "global_step": 32222, "epoch": 191} {"train_loss": -7.772043228149414, "global_step": 32223, "epoch": 191} {"train_loss": -7.341465950012207, "global_step": 32224, "epoch": 191} {"train_loss": -7.33266544342041, "global_step": 32225, "epoch": 191} {"train_loss": -7.670506477355957, "global_step": 32226, "epoch": 191} {"train_loss": -7.636970043182373, "global_step": 32227, "epoch": 191} {"train_loss": -7.662021636962891, "global_step": 32228, "epoch": 191} {"train_loss": -7.599303722381592, "global_step": 32229, "epoch": 191} {"train_loss": -7.443676471710205, "global_step": 32230, "epoch": 191} {"train_loss": -7.544656753540039, "global_step": 32231, "epoch": 191} {"train_loss": -7.742619037628174, "global_step": 32232, "epoch": 191} {"train_loss": -7.724459648132324, "global_step": 32233, "epoch": 191} {"train_loss": -7.715795993804932, "global_step": 32234, "epoch": 191} {"train_loss": -7.746126651763916, "global_step": 32235, "epoch": 191} {"train_loss": -7.617138862609863, "global_step": 32236, "epoch": 191} {"train_loss": -7.618335723876953, "global_step": 32237, "epoch": 191} {"train_loss": -7.429853439331055, "global_step": 32238, "epoch": 191} {"train_loss": -7.9501471519470215, "global_step": 32239, "epoch": 191} {"train_loss": -7.605998992919922, "global_step": 32240, "epoch": 191} {"train_loss": -7.601428031921387, "global_step": 32241, "epoch": 191} {"train_loss": -7.606114864349365, "global_step": 32242, "epoch": 191} {"train_loss": -7.571786880493164, "global_step": 32243, "epoch": 191} {"train_loss": -7.430995941162109, "global_step": 32244, "epoch": 191} {"train_loss": -7.717203140258789, "global_step": 32245, "epoch": 191} {"train_loss": -7.845119476318359, "global_step": 32246, "epoch": 191} {"train_loss": -7.656286716461182, "global_step": 32247, "epoch": 191} {"train_loss": -7.43814754486084, "global_step": 32248, "epoch": 191} {"train_loss": -7.379629611968994, "global_step": 32249, "epoch": 191} {"train_loss": -7.593903064727783, "global_step": 32250, "epoch": 191} {"train_loss": -7.662778854370117, "global_step": 32251, "epoch": 191} {"train_loss": -7.764331817626953, "global_step": 32252, "epoch": 191} {"train_loss": -7.856866359710693, "global_step": 32253, "epoch": 191} {"train_loss": -7.6677937507629395, "global_step": 32254, "epoch": 191} {"train_loss": -7.5796083978244235, "global_step": 32255, "epoch": 191, "val_loss": 186203.84375} {"train_loss": -7.705078125, "global_step": 32256, "epoch": 192} {"train_loss": -7.588223457336426, "global_step": 32257, "epoch": 192} {"train_loss": -7.423198223114014, "global_step": 32258, "epoch": 192} {"train_loss": -7.677459716796875, "global_step": 32259, "epoch": 192} {"train_loss": -7.541676998138428, "global_step": 32260, "epoch": 192} {"train_loss": -7.5914626121521, "global_step": 32261, "epoch": 192} {"train_loss": -7.610137939453125, "global_step": 32262, "epoch": 192} {"train_loss": -7.603211402893066, "global_step": 32263, "epoch": 192} {"train_loss": -7.571885108947754, "global_step": 32264, "epoch": 192} {"train_loss": -7.4271321296691895, "global_step": 32265, "epoch": 192} {"train_loss": -7.711507797241211, "global_step": 32266, "epoch": 192} {"train_loss": -7.3120012283325195, "global_step": 32267, "epoch": 192} {"train_loss": -7.441320419311523, "global_step": 32268, "epoch": 192} {"train_loss": -7.568437576293945, "global_step": 32269, "epoch": 192} {"train_loss": -7.540324687957764, "global_step": 32270, "epoch": 192} {"train_loss": -7.369650840759277, "global_step": 32271, "epoch": 192} {"train_loss": -7.714164733886719, "global_step": 32272, "epoch": 192} {"train_loss": -7.7596564292907715, "global_step": 32273, "epoch": 192} {"train_loss": -7.722109317779541, "global_step": 32274, "epoch": 192} {"train_loss": -7.557934761047363, "global_step": 32275, "epoch": 192} {"train_loss": -7.572020053863525, "global_step": 32276, "epoch": 192} {"train_loss": -7.714686393737793, "global_step": 32277, "epoch": 192} {"train_loss": -7.6067914962768555, "global_step": 32278, "epoch": 192} {"train_loss": -7.522274017333984, "global_step": 32279, "epoch": 192} {"train_loss": -7.745924949645996, "global_step": 32280, "epoch": 192} {"train_loss": -7.404020309448242, "global_step": 32281, "epoch": 192} {"train_loss": -7.786436557769775, "global_step": 32282, "epoch": 192} {"train_loss": -7.674256324768066, "global_step": 32283, "epoch": 192} {"train_loss": -7.52021598815918, "global_step": 32284, "epoch": 192} {"train_loss": -7.635561943054199, "global_step": 32285, "epoch": 192} {"train_loss": -7.649222373962402, "global_step": 32286, "epoch": 192} {"train_loss": -7.8169708251953125, "global_step": 32287, "epoch": 192} {"train_loss": -7.674385070800781, "global_step": 32288, "epoch": 192} {"train_loss": -7.753355979919434, "global_step": 32289, "epoch": 192} {"train_loss": -7.963254928588867, "global_step": 32290, "epoch": 192} {"train_loss": -7.898344993591309, "global_step": 32291, "epoch": 192} {"train_loss": -7.769583702087402, "global_step": 32292, "epoch": 192} {"train_loss": -7.655933856964111, "global_step": 32293, "epoch": 192} {"train_loss": -7.919008255004883, "global_step": 32294, "epoch": 192} {"train_loss": -7.71132755279541, "global_step": 32295, "epoch": 192} {"train_loss": -7.622824668884277, "global_step": 32296, "epoch": 192} {"train_loss": -7.899343490600586, "global_step": 32297, "epoch": 192} {"train_loss": -7.75022554397583, "global_step": 32298, "epoch": 192} {"train_loss": -7.632242202758789, "global_step": 32299, "epoch": 192} {"train_loss": -7.764126777648926, "global_step": 32300, "epoch": 192} {"train_loss": -7.479186534881592, "global_step": 32301, "epoch": 192} {"train_loss": -7.82967472076416, "global_step": 32302, "epoch": 192} {"train_loss": -7.763075828552246, "global_step": 32303, "epoch": 192} {"train_loss": -7.594548225402832, "global_step": 32304, "epoch": 192} {"train_loss": -7.471904754638672, "global_step": 32305, "epoch": 192} {"train_loss": -7.169844627380371, "global_step": 32306, "epoch": 192} {"train_loss": -7.463335990905762, "global_step": 32307, "epoch": 192} {"train_loss": -7.133599281311035, "global_step": 32308, "epoch": 192} {"train_loss": -7.4040937423706055, "global_step": 32309, "epoch": 192} {"train_loss": -7.176370620727539, "global_step": 32310, "epoch": 192} {"train_loss": -7.242048263549805, "global_step": 32311, "epoch": 192} {"train_loss": -7.336673259735107, "global_step": 32312, "epoch": 192} {"train_loss": -7.097506046295166, "global_step": 32313, "epoch": 192} {"train_loss": -6.994452476501465, "global_step": 32314, "epoch": 192} {"train_loss": -7.072986602783203, "global_step": 32315, "epoch": 192} {"train_loss": -7.132336616516113, "global_step": 32316, "epoch": 192} {"train_loss": -7.177896976470947, "global_step": 32317, "epoch": 192} {"train_loss": -7.133999824523926, "global_step": 32318, "epoch": 192} {"train_loss": -7.398375511169434, "global_step": 32319, "epoch": 192} {"train_loss": -7.207423210144043, "global_step": 32320, "epoch": 192} {"train_loss": -7.0767364501953125, "global_step": 32321, "epoch": 192} {"train_loss": -7.392364501953125, "global_step": 32322, "epoch": 192} {"train_loss": -7.193076133728027, "global_step": 32323, "epoch": 192} {"train_loss": -7.17585563659668, "global_step": 32324, "epoch": 192} {"train_loss": -7.2982025146484375, "global_step": 32325, "epoch": 192} {"train_loss": -7.3460307121276855, "global_step": 32326, "epoch": 192} {"train_loss": -7.454084396362305, "global_step": 32327, "epoch": 192} {"train_loss": -7.578982830047607, "global_step": 32328, "epoch": 192} {"train_loss": -7.541855335235596, "global_step": 32329, "epoch": 192} {"train_loss": -7.547877788543701, "global_step": 32330, "epoch": 192} {"train_loss": -7.584955215454102, "global_step": 32331, "epoch": 192} {"train_loss": -7.573666572570801, "global_step": 32332, "epoch": 192} {"train_loss": -7.399662971496582, "global_step": 32333, "epoch": 192} {"train_loss": -7.569706916809082, "global_step": 32334, "epoch": 192} {"train_loss": -7.509494781494141, "global_step": 32335, "epoch": 192} {"train_loss": -7.614080905914307, "global_step": 32336, "epoch": 192} {"train_loss": -7.5613932609558105, "global_step": 32337, "epoch": 192} {"train_loss": -7.759303569793701, "global_step": 32338, "epoch": 192} {"train_loss": -7.668241024017334, "global_step": 32339, "epoch": 192} {"train_loss": -7.540270805358887, "global_step": 32340, "epoch": 192} {"train_loss": -7.551850318908691, "global_step": 32341, "epoch": 192} {"train_loss": -7.846722602844238, "global_step": 32342, "epoch": 192} {"train_loss": -7.679586887359619, "global_step": 32343, "epoch": 192} {"train_loss": -7.7659196853637695, "global_step": 32344, "epoch": 192} {"train_loss": -7.638847351074219, "global_step": 32345, "epoch": 192} {"train_loss": -7.578702926635742, "global_step": 32346, "epoch": 192} {"train_loss": -7.543704986572266, "global_step": 32347, "epoch": 192} {"train_loss": -7.650832176208496, "global_step": 32348, "epoch": 192} {"train_loss": -7.656369209289551, "global_step": 32349, "epoch": 192} {"train_loss": -7.701759338378906, "global_step": 32350, "epoch": 192} {"train_loss": -7.52360200881958, "global_step": 32351, "epoch": 192} {"train_loss": -7.453899383544922, "global_step": 32352, "epoch": 192} {"train_loss": -7.612311363220215, "global_step": 32353, "epoch": 192} {"train_loss": -7.54160737991333, "global_step": 32354, "epoch": 192} {"train_loss": -7.819272041320801, "global_step": 32355, "epoch": 192} {"train_loss": -7.593339443206787, "global_step": 32356, "epoch": 192} {"train_loss": -7.678257465362549, "global_step": 32357, "epoch": 192} {"train_loss": -7.6475067138671875, "global_step": 32358, "epoch": 192} {"train_loss": -7.551369667053223, "global_step": 32359, "epoch": 192} {"train_loss": -7.680672645568848, "global_step": 32360, "epoch": 192} {"train_loss": -7.628680229187012, "global_step": 32361, "epoch": 192} {"train_loss": -7.6172990798950195, "global_step": 32362, "epoch": 192} {"train_loss": -7.312373638153076, "global_step": 32363, "epoch": 192} {"train_loss": -7.565324306488037, "global_step": 32364, "epoch": 192} {"train_loss": -7.499394416809082, "global_step": 32365, "epoch": 192} {"train_loss": -7.468401908874512, "global_step": 32366, "epoch": 192} {"train_loss": -7.437646865844727, "global_step": 32367, "epoch": 192} {"train_loss": -7.731971740722656, "global_step": 32368, "epoch": 192} {"train_loss": -7.472316741943359, "global_step": 32369, "epoch": 192} {"train_loss": -7.327256202697754, "global_step": 32370, "epoch": 192} {"train_loss": -7.680084228515625, "global_step": 32371, "epoch": 192} {"train_loss": -7.392406463623047, "global_step": 32372, "epoch": 192} {"train_loss": -7.824638843536377, "global_step": 32373, "epoch": 192} {"train_loss": -7.566132068634033, "global_step": 32374, "epoch": 192} {"train_loss": -7.383664608001709, "global_step": 32375, "epoch": 192} {"train_loss": -7.442142963409424, "global_step": 32376, "epoch": 192} {"train_loss": -7.485815048217773, "global_step": 32377, "epoch": 192} {"train_loss": -7.81049919128418, "global_step": 32378, "epoch": 192} {"train_loss": -7.378589630126953, "global_step": 32379, "epoch": 192} {"train_loss": -7.519522190093994, "global_step": 32380, "epoch": 192} {"train_loss": -7.595229625701904, "global_step": 32381, "epoch": 192} {"train_loss": -7.347150802612305, "global_step": 32382, "epoch": 192} {"train_loss": -7.408967971801758, "global_step": 32383, "epoch": 192} {"train_loss": -7.722007751464844, "global_step": 32384, "epoch": 192} {"train_loss": -7.494060516357422, "global_step": 32385, "epoch": 192} {"train_loss": -7.55204963684082, "global_step": 32386, "epoch": 192} {"train_loss": -7.4388041496276855, "global_step": 32387, "epoch": 192} {"train_loss": -7.3438005447387695, "global_step": 32388, "epoch": 192} {"train_loss": -7.541115760803223, "global_step": 32389, "epoch": 192} {"train_loss": -7.24747371673584, "global_step": 32390, "epoch": 192} {"train_loss": -7.629024505615234, "global_step": 32391, "epoch": 192} {"train_loss": -7.537148475646973, "global_step": 32392, "epoch": 192} {"train_loss": -7.475087642669678, "global_step": 32393, "epoch": 192} {"train_loss": -7.226596355438232, "global_step": 32394, "epoch": 192} {"train_loss": -7.4096479415893555, "global_step": 32395, "epoch": 192} {"train_loss": -7.627148628234863, "global_step": 32396, "epoch": 192} {"train_loss": -7.3467817306518555, "global_step": 32397, "epoch": 192} {"train_loss": -7.597622871398926, "global_step": 32398, "epoch": 192} {"train_loss": -7.584749221801758, "global_step": 32399, "epoch": 192} {"train_loss": -7.699583053588867, "global_step": 32400, "epoch": 192} {"train_loss": -7.445708274841309, "global_step": 32401, "epoch": 192} {"train_loss": -7.83261251449585, "global_step": 32402, "epoch": 192} {"train_loss": -7.63936710357666, "global_step": 32403, "epoch": 192} {"train_loss": -7.67841100692749, "global_step": 32404, "epoch": 192} {"train_loss": -7.545079231262207, "global_step": 32405, "epoch": 192} {"train_loss": -7.672617435455322, "global_step": 32406, "epoch": 192} {"train_loss": -7.52862548828125, "global_step": 32407, "epoch": 192} {"train_loss": -7.797596454620361, "global_step": 32408, "epoch": 192} {"train_loss": -7.48809814453125, "global_step": 32409, "epoch": 192} {"train_loss": -7.383100509643555, "global_step": 32410, "epoch": 192} {"train_loss": -7.361172676086426, "global_step": 32411, "epoch": 192} {"train_loss": -7.228736877441406, "global_step": 32412, "epoch": 192} {"train_loss": -7.560276508331299, "global_step": 32413, "epoch": 192} {"train_loss": -7.578714847564697, "global_step": 32414, "epoch": 192} {"train_loss": -7.72044563293457, "global_step": 32415, "epoch": 192} {"train_loss": -7.420234680175781, "global_step": 32416, "epoch": 192} {"train_loss": -7.588620185852051, "global_step": 32417, "epoch": 192} {"train_loss": -7.305396556854248, "global_step": 32418, "epoch": 192} {"train_loss": -7.320181846618652, "global_step": 32419, "epoch": 192} {"train_loss": -7.296422004699707, "global_step": 32420, "epoch": 192} {"train_loss": -7.492841720581055, "global_step": 32421, "epoch": 192} {"train_loss": -7.160144805908203, "global_step": 32422, "epoch": 192} {"train_loss": -7.531040736607143, "global_step": 32423, "epoch": 192, "val_loss": 187761.3125} {"train_loss": -7.717104434967041, "global_step": 32424, "epoch": 193} {"train_loss": -7.365148544311523, "global_step": 32425, "epoch": 193} {"train_loss": -7.627538204193115, "global_step": 32426, "epoch": 193} {"train_loss": -7.4219818115234375, "global_step": 32427, "epoch": 193} {"train_loss": -7.354802131652832, "global_step": 32428, "epoch": 193} {"train_loss": -7.494884014129639, "global_step": 32429, "epoch": 193} {"train_loss": -7.437532424926758, "global_step": 32430, "epoch": 193} {"train_loss": -7.532438278198242, "global_step": 32431, "epoch": 193} {"train_loss": -7.442625045776367, "global_step": 32432, "epoch": 193} {"train_loss": -7.4926652908325195, "global_step": 32433, "epoch": 193} {"train_loss": -7.511503219604492, "global_step": 32434, "epoch": 193} {"train_loss": -7.579672813415527, "global_step": 32435, "epoch": 193} {"train_loss": -7.577925682067871, "global_step": 32436, "epoch": 193} {"train_loss": -7.551468372344971, "global_step": 32437, "epoch": 193} {"train_loss": -7.5287909507751465, "global_step": 32438, "epoch": 193} {"train_loss": -7.7487077713012695, "global_step": 32439, "epoch": 193} {"train_loss": -7.751774787902832, "global_step": 32440, "epoch": 193} {"train_loss": -7.660390377044678, "global_step": 32441, "epoch": 193} {"train_loss": -7.705233573913574, "global_step": 32442, "epoch": 193} {"train_loss": -7.784342288970947, "global_step": 32443, "epoch": 193} {"train_loss": -7.941086769104004, "global_step": 32444, "epoch": 193} {"train_loss": -7.776702880859375, "global_step": 32445, "epoch": 193} {"train_loss": -8.003092765808105, "global_step": 32446, "epoch": 193} {"train_loss": -8.11038589477539, "global_step": 32447, "epoch": 193} {"train_loss": -7.576457500457764, "global_step": 32448, "epoch": 193} {"train_loss": -7.776314735412598, "global_step": 32449, "epoch": 193} {"train_loss": -7.457156181335449, "global_step": 32450, "epoch": 193} {"train_loss": -7.6359686851501465, "global_step": 32451, "epoch": 193} {"train_loss": -7.658321857452393, "global_step": 32452, "epoch": 193} {"train_loss": -6.946964263916016, "global_step": 32453, "epoch": 193} {"train_loss": -7.632038593292236, "global_step": 32454, "epoch": 193} {"train_loss": -7.3195600509643555, "global_step": 32455, "epoch": 193} {"train_loss": -7.391168594360352, "global_step": 32456, "epoch": 193} {"train_loss": -7.530858039855957, "global_step": 32457, "epoch": 193} {"train_loss": -7.276548385620117, "global_step": 32458, "epoch": 193} {"train_loss": -7.615888595581055, "global_step": 32459, "epoch": 193} {"train_loss": -7.302507400512695, "global_step": 32460, "epoch": 193} {"train_loss": -7.662190914154053, "global_step": 32461, "epoch": 193} {"train_loss": -7.4619293212890625, "global_step": 32462, "epoch": 193} {"train_loss": -7.470965385437012, "global_step": 32463, "epoch": 193} {"train_loss": -7.2561235427856445, "global_step": 32464, "epoch": 193} {"train_loss": -7.586180686950684, "global_step": 32465, "epoch": 193} {"train_loss": -7.497925758361816, "global_step": 32466, "epoch": 193} {"train_loss": -7.517496109008789, "global_step": 32467, "epoch": 193} {"train_loss": -7.386784076690674, "global_step": 32468, "epoch": 193} {"train_loss": -7.582772254943848, "global_step": 32469, "epoch": 193} {"train_loss": -7.722152233123779, "global_step": 32470, "epoch": 193} {"train_loss": -7.386392593383789, "global_step": 32471, "epoch": 193} {"train_loss": -7.406546115875244, "global_step": 32472, "epoch": 193} {"train_loss": -7.406289100646973, "global_step": 32473, "epoch": 193} {"train_loss": -7.239459991455078, "global_step": 32474, "epoch": 193} {"train_loss": -7.664219856262207, "global_step": 32475, "epoch": 193} {"train_loss": -7.473325252532959, "global_step": 32476, "epoch": 193} {"train_loss": -7.352900981903076, "global_step": 32477, "epoch": 193} {"train_loss": -7.553443431854248, "global_step": 32478, "epoch": 193} {"train_loss": -7.548801898956299, "global_step": 32479, "epoch": 193} {"train_loss": -7.711103439331055, "global_step": 32480, "epoch": 193} {"train_loss": -7.716330528259277, "global_step": 32481, "epoch": 193} {"train_loss": -7.4562201499938965, "global_step": 32482, "epoch": 193} {"train_loss": -7.682645320892334, "global_step": 32483, "epoch": 193} {"train_loss": -7.601192951202393, "global_step": 32484, "epoch": 193} {"train_loss": -7.675534248352051, "global_step": 32485, "epoch": 193} {"train_loss": -7.749958515167236, "global_step": 32486, "epoch": 193} {"train_loss": -7.706833839416504, "global_step": 32487, "epoch": 193} {"train_loss": -7.664428234100342, "global_step": 32488, "epoch": 193} {"train_loss": -7.560331344604492, "global_step": 32489, "epoch": 193} {"train_loss": -7.627569198608398, "global_step": 32490, "epoch": 193} {"train_loss": -7.536853790283203, "global_step": 32491, "epoch": 193} {"train_loss": -7.61423921585083, "global_step": 32492, "epoch": 193} {"train_loss": -7.277299880981445, "global_step": 32493, "epoch": 193} {"train_loss": -7.311393737792969, "global_step": 32494, "epoch": 193} {"train_loss": -7.907903671264648, "global_step": 32495, "epoch": 193} {"train_loss": -7.266772747039795, "global_step": 32496, "epoch": 193} {"train_loss": -7.627779006958008, "global_step": 32497, "epoch": 193} {"train_loss": -7.349454879760742, "global_step": 32498, "epoch": 193} {"train_loss": -7.573360919952393, "global_step": 32499, "epoch": 193} {"train_loss": -7.109133720397949, "global_step": 32500, "epoch": 193} {"train_loss": -7.584774971008301, "global_step": 32501, "epoch": 193} {"train_loss": -7.628230094909668, "global_step": 32502, "epoch": 193} {"train_loss": -7.2150702476501465, "global_step": 32503, "epoch": 193} {"train_loss": -7.588892936706543, "global_step": 32504, "epoch": 193} {"train_loss": -7.3231964111328125, "global_step": 32505, "epoch": 193} {"train_loss": -7.617947578430176, "global_step": 32506, "epoch": 193} {"train_loss": -7.365066051483154, "global_step": 32507, "epoch": 193} {"train_loss": -7.445969104766846, "global_step": 32508, "epoch": 193} {"train_loss": -7.616759300231934, "global_step": 32509, "epoch": 193} {"train_loss": -7.380677700042725, "global_step": 32510, "epoch": 193} {"train_loss": -7.582217216491699, "global_step": 32511, "epoch": 193} {"train_loss": -7.421877861022949, "global_step": 32512, "epoch": 193} {"train_loss": -7.392697811126709, "global_step": 32513, "epoch": 193} {"train_loss": -7.493634223937988, "global_step": 32514, "epoch": 193} {"train_loss": -7.42177677154541, "global_step": 32515, "epoch": 193} {"train_loss": -7.586005210876465, "global_step": 32516, "epoch": 193} {"train_loss": -7.5008039474487305, "global_step": 32517, "epoch": 193} {"train_loss": -7.455356121063232, "global_step": 32518, "epoch": 193} {"train_loss": -7.312431335449219, "global_step": 32519, "epoch": 193} {"train_loss": -7.502573490142822, "global_step": 32520, "epoch": 193} {"train_loss": -6.908198356628418, "global_step": 32521, "epoch": 193} {"train_loss": -7.508954048156738, "global_step": 32522, "epoch": 193} {"train_loss": -7.529524803161621, "global_step": 32523, "epoch": 193} {"train_loss": -7.287023544311523, "global_step": 32524, "epoch": 193} {"train_loss": -7.439971923828125, "global_step": 32525, "epoch": 193} {"train_loss": -7.611412048339844, "global_step": 32526, "epoch": 193} {"train_loss": -7.638413429260254, "global_step": 32527, "epoch": 193} {"train_loss": -7.598539352416992, "global_step": 32528, "epoch": 193} {"train_loss": -7.425461292266846, "global_step": 32529, "epoch": 193} {"train_loss": -7.578556060791016, "global_step": 32530, "epoch": 193} {"train_loss": -7.557978630065918, "global_step": 32531, "epoch": 193} {"train_loss": -7.408143043518066, "global_step": 32532, "epoch": 193} {"train_loss": -7.473638534545898, "global_step": 32533, "epoch": 193} {"train_loss": -7.798496246337891, "global_step": 32534, "epoch": 193} {"train_loss": -7.709403038024902, "global_step": 32535, "epoch": 193} {"train_loss": -7.572257995605469, "global_step": 32536, "epoch": 193} {"train_loss": -7.806875228881836, "global_step": 32537, "epoch": 193} {"train_loss": -7.814254283905029, "global_step": 32538, "epoch": 193} {"train_loss": -7.510274887084961, "global_step": 32539, "epoch": 193} {"train_loss": -7.597472190856934, "global_step": 32540, "epoch": 193} {"train_loss": -7.771892547607422, "global_step": 32541, "epoch": 193} {"train_loss": -7.764877796173096, "global_step": 32542, "epoch": 193} {"train_loss": -7.494214057922363, "global_step": 32543, "epoch": 193} {"train_loss": -7.928647041320801, "global_step": 32544, "epoch": 193} {"train_loss": -7.445075035095215, "global_step": 32545, "epoch": 193} {"train_loss": -7.7919464111328125, "global_step": 32546, "epoch": 193} {"train_loss": -7.423558235168457, "global_step": 32547, "epoch": 193} {"train_loss": -7.777498245239258, "global_step": 32548, "epoch": 193} {"train_loss": -7.660861968994141, "global_step": 32549, "epoch": 193} {"train_loss": -7.364509582519531, "global_step": 32550, "epoch": 193} {"train_loss": -7.626646041870117, "global_step": 32551, "epoch": 193} {"train_loss": -7.826669216156006, "global_step": 32552, "epoch": 193} {"train_loss": -7.553654670715332, "global_step": 32553, "epoch": 193} {"train_loss": -7.344101428985596, "global_step": 32554, "epoch": 193} {"train_loss": -7.4079461097717285, "global_step": 32555, "epoch": 193} {"train_loss": -7.567399024963379, "global_step": 32556, "epoch": 193} {"train_loss": -7.467140197753906, "global_step": 32557, "epoch": 193} {"train_loss": -7.390718936920166, "global_step": 32558, "epoch": 193} {"train_loss": -7.657432556152344, "global_step": 32559, "epoch": 193} {"train_loss": -7.486637115478516, "global_step": 32560, "epoch": 193} {"train_loss": -7.408143043518066, "global_step": 32561, "epoch": 193} {"train_loss": -7.4226555824279785, "global_step": 32562, "epoch": 193} {"train_loss": -7.342758655548096, "global_step": 32563, "epoch": 193} {"train_loss": -7.454934597015381, "global_step": 32564, "epoch": 193} {"train_loss": -7.567419052124023, "global_step": 32565, "epoch": 193} {"train_loss": -7.591847896575928, "global_step": 32566, "epoch": 193} {"train_loss": -7.618386268615723, "global_step": 32567, "epoch": 193} {"train_loss": -7.866733551025391, "global_step": 32568, "epoch": 193} {"train_loss": -7.565154552459717, "global_step": 32569, "epoch": 193} {"train_loss": -7.568675518035889, "global_step": 32570, "epoch": 193} {"train_loss": -7.724052429199219, "global_step": 32571, "epoch": 193} {"train_loss": -7.671889781951904, "global_step": 32572, "epoch": 193} {"train_loss": -7.430605888366699, "global_step": 32573, "epoch": 193} {"train_loss": -7.811264991760254, "global_step": 32574, "epoch": 193} {"train_loss": -7.450249671936035, "global_step": 32575, "epoch": 193} {"train_loss": -7.887804985046387, "global_step": 32576, "epoch": 193} {"train_loss": -7.79290771484375, "global_step": 32577, "epoch": 193} {"train_loss": -7.7370405197143555, "global_step": 32578, "epoch": 193} {"train_loss": -7.695489883422852, "global_step": 32579, "epoch": 193} {"train_loss": -7.781293869018555, "global_step": 32580, "epoch": 193} {"train_loss": -7.728033065795898, "global_step": 32581, "epoch": 193} {"train_loss": -7.355400562286377, "global_step": 32582, "epoch": 193} {"train_loss": -7.454925537109375, "global_step": 32583, "epoch": 193} {"train_loss": -7.328939914703369, "global_step": 32584, "epoch": 193} {"train_loss": -7.635040283203125, "global_step": 32585, "epoch": 193} {"train_loss": -7.505075931549072, "global_step": 32586, "epoch": 193} {"train_loss": -7.791781425476074, "global_step": 32587, "epoch": 193} {"train_loss": -7.475330352783203, "global_step": 32588, "epoch": 193} {"train_loss": -7.776102066040039, "global_step": 32589, "epoch": 193} {"train_loss": -7.628305435180664, "global_step": 32590, "epoch": 193} {"train_loss": -7.551385402679443, "global_step": 32591, "epoch": 193, "val_loss": 186654.328125} {"train_loss": -7.401946067810059, "global_step": 32592, "epoch": 194} {"train_loss": -7.857489109039307, "global_step": 32593, "epoch": 194} {"train_loss": -7.424550533294678, "global_step": 32594, "epoch": 194} {"train_loss": -7.631401062011719, "global_step": 32595, "epoch": 194} {"train_loss": -7.569985866546631, "global_step": 32596, "epoch": 194} {"train_loss": -7.547905445098877, "global_step": 32597, "epoch": 194} {"train_loss": -7.531081676483154, "global_step": 32598, "epoch": 194} {"train_loss": -7.424853801727295, "global_step": 32599, "epoch": 194} {"train_loss": -7.607913017272949, "global_step": 32600, "epoch": 194} {"train_loss": -7.270641326904297, "global_step": 32601, "epoch": 194} {"train_loss": -7.214781284332275, "global_step": 32602, "epoch": 194} {"train_loss": -7.5831451416015625, "global_step": 32603, "epoch": 194} {"train_loss": -7.291932106018066, "global_step": 32604, "epoch": 194} {"train_loss": -7.583403587341309, "global_step": 32605, "epoch": 194} {"train_loss": -7.4204206466674805, "global_step": 32606, "epoch": 194} {"train_loss": -7.447845458984375, "global_step": 32607, "epoch": 194} {"train_loss": -7.429348945617676, "global_step": 32608, "epoch": 194} {"train_loss": -7.450650215148926, "global_step": 32609, "epoch": 194} {"train_loss": -7.721606254577637, "global_step": 32610, "epoch": 194} {"train_loss": -7.606971740722656, "global_step": 32611, "epoch": 194} {"train_loss": -7.62445592880249, "global_step": 32612, "epoch": 194} {"train_loss": -7.4975762367248535, "global_step": 32613, "epoch": 194} {"train_loss": -7.584101676940918, "global_step": 32614, "epoch": 194} {"train_loss": -7.498517990112305, "global_step": 32615, "epoch": 194} {"train_loss": -7.389724254608154, "global_step": 32616, "epoch": 194} {"train_loss": -7.546743869781494, "global_step": 32617, "epoch": 194} {"train_loss": -7.794103622436523, "global_step": 32618, "epoch": 194} {"train_loss": -7.823486804962158, "global_step": 32619, "epoch": 194} {"train_loss": -7.4881181716918945, "global_step": 32620, "epoch": 194} {"train_loss": -7.564145565032959, "global_step": 32621, "epoch": 194} {"train_loss": -7.705409049987793, "global_step": 32622, "epoch": 194} {"train_loss": -7.756609916687012, "global_step": 32623, "epoch": 194} {"train_loss": -7.555037498474121, "global_step": 32624, "epoch": 194} {"train_loss": -7.717404842376709, "global_step": 32625, "epoch": 194} {"train_loss": -7.5899977684021, "global_step": 32626, "epoch": 194} {"train_loss": -7.719760894775391, "global_step": 32627, "epoch": 194} {"train_loss": -7.542572975158691, "global_step": 32628, "epoch": 194} {"train_loss": -7.574387073516846, "global_step": 32629, "epoch": 194} {"train_loss": -7.533921718597412, "global_step": 32630, "epoch": 194} {"train_loss": -7.603845596313477, "global_step": 32631, "epoch": 194} {"train_loss": -7.631003379821777, "global_step": 32632, "epoch": 194} {"train_loss": -7.858104705810547, "global_step": 32633, "epoch": 194} {"train_loss": -7.377277374267578, "global_step": 32634, "epoch": 194} {"train_loss": -7.557046890258789, "global_step": 32635, "epoch": 194} {"train_loss": -7.470305442810059, "global_step": 32636, "epoch": 194} {"train_loss": -7.627947807312012, "global_step": 32637, "epoch": 194} {"train_loss": -7.66279935836792, "global_step": 32638, "epoch": 194} {"train_loss": -7.823240280151367, "global_step": 32639, "epoch": 194} {"train_loss": -7.79504919052124, "global_step": 32640, "epoch": 194} {"train_loss": -7.753635883331299, "global_step": 32641, "epoch": 194} {"train_loss": -7.663754463195801, "global_step": 32642, "epoch": 194} {"train_loss": -7.766894817352295, "global_step": 32643, "epoch": 194} {"train_loss": -7.6860127449035645, "global_step": 32644, "epoch": 194} {"train_loss": -7.622176647186279, "global_step": 32645, "epoch": 194} {"train_loss": -7.5335187911987305, "global_step": 32646, "epoch": 194} {"train_loss": -7.690030097961426, "global_step": 32647, "epoch": 194} {"train_loss": -7.721243381500244, "global_step": 32648, "epoch": 194} {"train_loss": -7.541107177734375, "global_step": 32649, "epoch": 194} {"train_loss": -7.6598944664001465, "global_step": 32650, "epoch": 194} {"train_loss": -7.7325639724731445, "global_step": 32651, "epoch": 194} {"train_loss": -7.745957374572754, "global_step": 32652, "epoch": 194} {"train_loss": -7.705304145812988, "global_step": 32653, "epoch": 194} {"train_loss": -7.657226085662842, "global_step": 32654, "epoch": 194} {"train_loss": -7.628299713134766, "global_step": 32655, "epoch": 194} {"train_loss": -7.624456405639648, "global_step": 32656, "epoch": 194} {"train_loss": -7.770662307739258, "global_step": 32657, "epoch": 194} {"train_loss": -7.691542625427246, "global_step": 32658, "epoch": 194} {"train_loss": -7.503689289093018, "global_step": 32659, "epoch": 194} {"train_loss": -7.691927909851074, "global_step": 32660, "epoch": 194} {"train_loss": -7.7010498046875, "global_step": 32661, "epoch": 194} {"train_loss": -7.424961090087891, "global_step": 32662, "epoch": 194} {"train_loss": -7.373388290405273, "global_step": 32663, "epoch": 194} {"train_loss": -7.521298408508301, "global_step": 32664, "epoch": 194} {"train_loss": -7.696290969848633, "global_step": 32665, "epoch": 194} {"train_loss": -7.517663955688477, "global_step": 32666, "epoch": 194} {"train_loss": -7.368338584899902, "global_step": 32667, "epoch": 194} {"train_loss": -7.342218399047852, "global_step": 32668, "epoch": 194} {"train_loss": -7.550446510314941, "global_step": 32669, "epoch": 194} {"train_loss": -7.55246639251709, "global_step": 32670, "epoch": 194} {"train_loss": -7.499078273773193, "global_step": 32671, "epoch": 194} {"train_loss": -7.564973831176758, "global_step": 32672, "epoch": 194} {"train_loss": -7.6360063552856445, "global_step": 32673, "epoch": 194} {"train_loss": -7.486063003540039, "global_step": 32674, "epoch": 194} {"train_loss": -7.379964828491211, "global_step": 32675, "epoch": 194} {"train_loss": -7.468324661254883, "global_step": 32676, "epoch": 194} {"train_loss": -7.342312812805176, "global_step": 32677, "epoch": 194} {"train_loss": -7.4449615478515625, "global_step": 32678, "epoch": 194} {"train_loss": -7.255396366119385, "global_step": 32679, "epoch": 194} {"train_loss": -7.481515884399414, "global_step": 32680, "epoch": 194} {"train_loss": -7.271409034729004, "global_step": 32681, "epoch": 194} {"train_loss": -7.322822570800781, "global_step": 32682, "epoch": 194} {"train_loss": -7.499673366546631, "global_step": 32683, "epoch": 194} {"train_loss": -7.524467468261719, "global_step": 32684, "epoch": 194} {"train_loss": -7.684797763824463, "global_step": 32685, "epoch": 194} {"train_loss": -7.411384105682373, "global_step": 32686, "epoch": 194} {"train_loss": -7.563600540161133, "global_step": 32687, "epoch": 194} {"train_loss": -7.31640625, "global_step": 32688, "epoch": 194} {"train_loss": -7.615410327911377, "global_step": 32689, "epoch": 194} {"train_loss": -7.596997261047363, "global_step": 32690, "epoch": 194} {"train_loss": -7.613645553588867, "global_step": 32691, "epoch": 194} {"train_loss": -7.532559394836426, "global_step": 32692, "epoch": 194} {"train_loss": -7.577422142028809, "global_step": 32693, "epoch": 194} {"train_loss": -7.688318252563477, "global_step": 32694, "epoch": 194} {"train_loss": -7.831807613372803, "global_step": 32695, "epoch": 194} {"train_loss": -7.620389938354492, "global_step": 32696, "epoch": 194} {"train_loss": -7.661482810974121, "global_step": 32697, "epoch": 194} {"train_loss": -7.727228164672852, "global_step": 32698, "epoch": 194} {"train_loss": -7.75046968460083, "global_step": 32699, "epoch": 194} {"train_loss": -7.367690086364746, "global_step": 32700, "epoch": 194} {"train_loss": -7.542291164398193, "global_step": 32701, "epoch": 194} {"train_loss": -7.683687210083008, "global_step": 32702, "epoch": 194} {"train_loss": -7.78428316116333, "global_step": 32703, "epoch": 194} {"train_loss": -7.881628513336182, "global_step": 32704, "epoch": 194} {"train_loss": -7.692455291748047, "global_step": 32705, "epoch": 194} {"train_loss": -7.6705756187438965, "global_step": 32706, "epoch": 194} {"train_loss": -7.578390121459961, "global_step": 32707, "epoch": 194} {"train_loss": -7.640953540802002, "global_step": 32708, "epoch": 194} {"train_loss": -7.673122406005859, "global_step": 32709, "epoch": 194} {"train_loss": -7.85045051574707, "global_step": 32710, "epoch": 194} {"train_loss": -7.425021171569824, "global_step": 32711, "epoch": 194} {"train_loss": -7.527467727661133, "global_step": 32712, "epoch": 194} {"train_loss": -7.626090049743652, "global_step": 32713, "epoch": 194} {"train_loss": -7.587462425231934, "global_step": 32714, "epoch": 194} {"train_loss": -7.684908866882324, "global_step": 32715, "epoch": 194} {"train_loss": -7.670652389526367, "global_step": 32716, "epoch": 194} {"train_loss": -7.799701690673828, "global_step": 32717, "epoch": 194} {"train_loss": -7.883675575256348, "global_step": 32718, "epoch": 194} {"train_loss": -7.7261962890625, "global_step": 32719, "epoch": 194} {"train_loss": -7.692325592041016, "global_step": 32720, "epoch": 194} {"train_loss": -7.71483039855957, "global_step": 32721, "epoch": 194} {"train_loss": -7.6111016273498535, "global_step": 32722, "epoch": 194} {"train_loss": -7.627409934997559, "global_step": 32723, "epoch": 194} {"train_loss": -7.659948348999023, "global_step": 32724, "epoch": 194} {"train_loss": -7.85507345199585, "global_step": 32725, "epoch": 194} {"train_loss": -7.541367053985596, "global_step": 32726, "epoch": 194} {"train_loss": -7.789492130279541, "global_step": 32727, "epoch": 194} {"train_loss": -7.6279191970825195, "global_step": 32728, "epoch": 194} {"train_loss": -7.381582736968994, "global_step": 32729, "epoch": 194} {"train_loss": -7.783079624176025, "global_step": 32730, "epoch": 194} {"train_loss": -7.6252851486206055, "global_step": 32731, "epoch": 194} {"train_loss": -7.7983551025390625, "global_step": 32732, "epoch": 194} {"train_loss": -7.490190505981445, "global_step": 32733, "epoch": 194} {"train_loss": -7.891307830810547, "global_step": 32734, "epoch": 194} {"train_loss": -7.716020584106445, "global_step": 32735, "epoch": 194} {"train_loss": -7.716684341430664, "global_step": 32736, "epoch": 194} {"train_loss": -7.627435207366943, "global_step": 32737, "epoch": 194} {"train_loss": -7.635199546813965, "global_step": 32738, "epoch": 194} {"train_loss": -7.694796562194824, "global_step": 32739, "epoch": 194} {"train_loss": -7.621325969696045, "global_step": 32740, "epoch": 194} {"train_loss": -7.5337934494018555, "global_step": 32741, "epoch": 194} {"train_loss": -7.773035526275635, "global_step": 32742, "epoch": 194} {"train_loss": -7.363048553466797, "global_step": 32743, "epoch": 194} {"train_loss": -7.674036979675293, "global_step": 32744, "epoch": 194} {"train_loss": -7.3334856033325195, "global_step": 32745, "epoch": 194} {"train_loss": -7.550062656402588, "global_step": 32746, "epoch": 194} {"train_loss": -7.509252548217773, "global_step": 32747, "epoch": 194} {"train_loss": -7.5427327156066895, "global_step": 32748, "epoch": 194} {"train_loss": -7.399392127990723, "global_step": 32749, "epoch": 194} {"train_loss": -7.493339538574219, "global_step": 32750, "epoch": 194} {"train_loss": -7.641587257385254, "global_step": 32751, "epoch": 194} {"train_loss": -7.577564239501953, "global_step": 32752, "epoch": 194} {"train_loss": -7.4502692222595215, "global_step": 32753, "epoch": 194} {"train_loss": -7.496596813201904, "global_step": 32754, "epoch": 194} {"train_loss": -7.4664812088012695, "global_step": 32755, "epoch": 194} {"train_loss": -7.460987091064453, "global_step": 32756, "epoch": 194} {"train_loss": -7.746660232543945, "global_step": 32757, "epoch": 194} {"train_loss": -7.559219837188721, "global_step": 32758, "epoch": 194} {"train_loss": -7.592163270428067, "global_step": 32759, "epoch": 194, "val_loss": 185123.34375} {"train_loss": -7.825188636779785, "global_step": 32760, "epoch": 195} {"train_loss": -7.522719860076904, "global_step": 32761, "epoch": 195} {"train_loss": -7.565845489501953, "global_step": 32762, "epoch": 195} {"train_loss": -7.632814407348633, "global_step": 32763, "epoch": 195} {"train_loss": -7.4883012771606445, "global_step": 32764, "epoch": 195} {"train_loss": -7.828604698181152, "global_step": 32765, "epoch": 195} {"train_loss": -7.702722549438477, "global_step": 32766, "epoch": 195} {"train_loss": -7.645114421844482, "global_step": 32767, "epoch": 195} {"train_loss": -7.631078720092773, "global_step": 32768, "epoch": 195} {"train_loss": -7.8114333152771, "global_step": 32769, "epoch": 195} {"train_loss": -7.4860053062438965, "global_step": 32770, "epoch": 195} {"train_loss": -7.593216896057129, "global_step": 32771, "epoch": 195} {"train_loss": -7.615913391113281, "global_step": 32772, "epoch": 195} {"train_loss": -7.579827308654785, "global_step": 32773, "epoch": 195} {"train_loss": -7.476832389831543, "global_step": 32774, "epoch": 195} {"train_loss": -7.755128860473633, "global_step": 32775, "epoch": 195} {"train_loss": -7.425223350524902, "global_step": 32776, "epoch": 195} {"train_loss": -7.468952178955078, "global_step": 32777, "epoch": 195} {"train_loss": -7.637923717498779, "global_step": 32778, "epoch": 195} {"train_loss": -7.6052985191345215, "global_step": 32779, "epoch": 195} {"train_loss": -7.464317321777344, "global_step": 32780, "epoch": 195} {"train_loss": -7.578782081604004, "global_step": 32781, "epoch": 195} {"train_loss": -7.570676803588867, "global_step": 32782, "epoch": 195} {"train_loss": -7.568517208099365, "global_step": 32783, "epoch": 195} {"train_loss": -7.747938632965088, "global_step": 32784, "epoch": 195} {"train_loss": -7.272739410400391, "global_step": 32785, "epoch": 195} {"train_loss": -7.607041358947754, "global_step": 32786, "epoch": 195} {"train_loss": -7.684831619262695, "global_step": 32787, "epoch": 195} {"train_loss": -7.363406181335449, "global_step": 32788, "epoch": 195} {"train_loss": -7.551821708679199, "global_step": 32789, "epoch": 195} {"train_loss": -7.621639728546143, "global_step": 32790, "epoch": 195} {"train_loss": -7.526749134063721, "global_step": 32791, "epoch": 195} {"train_loss": -7.860743045806885, "global_step": 32792, "epoch": 195} {"train_loss": -7.639132499694824, "global_step": 32793, "epoch": 195} {"train_loss": -7.687702655792236, "global_step": 32794, "epoch": 195} {"train_loss": -7.50145149230957, "global_step": 32795, "epoch": 195} {"train_loss": -7.747450828552246, "global_step": 32796, "epoch": 195} {"train_loss": -7.711544990539551, "global_step": 32797, "epoch": 195} {"train_loss": -7.563319206237793, "global_step": 32798, "epoch": 195} {"train_loss": -7.123634338378906, "global_step": 32799, "epoch": 195} {"train_loss": -7.604529857635498, "global_step": 32800, "epoch": 195} {"train_loss": -7.557723045349121, "global_step": 32801, "epoch": 195} {"train_loss": -7.682018280029297, "global_step": 32802, "epoch": 195} {"train_loss": -7.703645706176758, "global_step": 32803, "epoch": 195} {"train_loss": -7.67858362197876, "global_step": 32804, "epoch": 195} {"train_loss": -7.563651084899902, "global_step": 32805, "epoch": 195} {"train_loss": -7.769810676574707, "global_step": 32806, "epoch": 195} {"train_loss": -7.800636291503906, "global_step": 32807, "epoch": 195} {"train_loss": -7.71511173248291, "global_step": 32808, "epoch": 195} {"train_loss": -7.645264148712158, "global_step": 32809, "epoch": 195} {"train_loss": -7.587117671966553, "global_step": 32810, "epoch": 195} {"train_loss": -7.7223052978515625, "global_step": 32811, "epoch": 195} {"train_loss": -7.6186394691467285, "global_step": 32812, "epoch": 195} {"train_loss": -7.426987171173096, "global_step": 32813, "epoch": 195} {"train_loss": -7.696816921234131, "global_step": 32814, "epoch": 195} {"train_loss": -7.512016296386719, "global_step": 32815, "epoch": 195} {"train_loss": -7.4590959548950195, "global_step": 32816, "epoch": 195} {"train_loss": -7.67381477355957, "global_step": 32817, "epoch": 195} {"train_loss": -7.6245436668396, "global_step": 32818, "epoch": 195} {"train_loss": -7.597438335418701, "global_step": 32819, "epoch": 195} {"train_loss": -7.733797550201416, "global_step": 32820, "epoch": 195} {"train_loss": -7.595710754394531, "global_step": 32821, "epoch": 195} {"train_loss": -7.473845958709717, "global_step": 32822, "epoch": 195} {"train_loss": -7.647769451141357, "global_step": 32823, "epoch": 195} {"train_loss": -7.748963356018066, "global_step": 32824, "epoch": 195} {"train_loss": -7.6276726722717285, "global_step": 32825, "epoch": 195} {"train_loss": -7.494665145874023, "global_step": 32826, "epoch": 195} {"train_loss": -7.581076145172119, "global_step": 32827, "epoch": 195} {"train_loss": -7.504510402679443, "global_step": 32828, "epoch": 195} {"train_loss": -7.626531600952148, "global_step": 32829, "epoch": 195} {"train_loss": -7.643664836883545, "global_step": 32830, "epoch": 195} {"train_loss": -7.516709327697754, "global_step": 32831, "epoch": 195} {"train_loss": -7.439713478088379, "global_step": 32832, "epoch": 195} {"train_loss": -7.56522274017334, "global_step": 32833, "epoch": 195} {"train_loss": -7.645356178283691, "global_step": 32834, "epoch": 195} {"train_loss": -7.664212703704834, "global_step": 32835, "epoch": 195} {"train_loss": -7.604340076446533, "global_step": 32836, "epoch": 195} {"train_loss": -7.7987961769104, "global_step": 32837, "epoch": 195} {"train_loss": -7.688766002655029, "global_step": 32838, "epoch": 195} {"train_loss": -7.61696195602417, "global_step": 32839, "epoch": 195} {"train_loss": -7.614870071411133, "global_step": 32840, "epoch": 195} {"train_loss": -7.656396865844727, "global_step": 32841, "epoch": 195} {"train_loss": -7.652769088745117, "global_step": 32842, "epoch": 195} {"train_loss": -7.713476181030273, "global_step": 32843, "epoch": 195} {"train_loss": -7.670833587646484, "global_step": 32844, "epoch": 195} {"train_loss": -7.890604019165039, "global_step": 32845, "epoch": 195} {"train_loss": -7.679860591888428, "global_step": 32846, "epoch": 195} {"train_loss": -7.544999122619629, "global_step": 32847, "epoch": 195} {"train_loss": -7.85203742980957, "global_step": 32848, "epoch": 195} {"train_loss": -7.769968509674072, "global_step": 32849, "epoch": 195} {"train_loss": -7.6530327796936035, "global_step": 32850, "epoch": 195} {"train_loss": -7.483176231384277, "global_step": 32851, "epoch": 195} {"train_loss": -7.541223049163818, "global_step": 32852, "epoch": 195} {"train_loss": -7.565498352050781, "global_step": 32853, "epoch": 195} {"train_loss": -7.72689151763916, "global_step": 32854, "epoch": 195} {"train_loss": -7.426763534545898, "global_step": 32855, "epoch": 195} {"train_loss": -7.664620399475098, "global_step": 32856, "epoch": 195} {"train_loss": -7.559874057769775, "global_step": 32857, "epoch": 195} {"train_loss": -7.883960723876953, "global_step": 32858, "epoch": 195} {"train_loss": -7.57135534286499, "global_step": 32859, "epoch": 195} {"train_loss": -7.621673583984375, "global_step": 32860, "epoch": 195} {"train_loss": -7.641947269439697, "global_step": 32861, "epoch": 195} {"train_loss": -7.790948867797852, "global_step": 32862, "epoch": 195} {"train_loss": -7.370006561279297, "global_step": 32863, "epoch": 195} {"train_loss": -7.698294639587402, "global_step": 32864, "epoch": 195} {"train_loss": -7.523322582244873, "global_step": 32865, "epoch": 195} {"train_loss": -7.884153366088867, "global_step": 32866, "epoch": 195} {"train_loss": -7.341994285583496, "global_step": 32867, "epoch": 195} {"train_loss": -7.457911491394043, "global_step": 32868, "epoch": 195} {"train_loss": -7.526860237121582, "global_step": 32869, "epoch": 195} {"train_loss": -7.528768539428711, "global_step": 32870, "epoch": 195} {"train_loss": -7.277718544006348, "global_step": 32871, "epoch": 195} {"train_loss": -7.435626029968262, "global_step": 32872, "epoch": 195} {"train_loss": -7.523596286773682, "global_step": 32873, "epoch": 195} {"train_loss": -7.397989273071289, "global_step": 32874, "epoch": 195} {"train_loss": -7.619078636169434, "global_step": 32875, "epoch": 195} {"train_loss": -7.600032329559326, "global_step": 32876, "epoch": 195} {"train_loss": -7.506227493286133, "global_step": 32877, "epoch": 195} {"train_loss": -7.660463333129883, "global_step": 32878, "epoch": 195} {"train_loss": -7.558150291442871, "global_step": 32879, "epoch": 195} {"train_loss": -7.607517719268799, "global_step": 32880, "epoch": 195} {"train_loss": -7.529847145080566, "global_step": 32881, "epoch": 195} {"train_loss": -7.447281837463379, "global_step": 32882, "epoch": 195} {"train_loss": -7.61433744430542, "global_step": 32883, "epoch": 195} {"train_loss": -7.532987594604492, "global_step": 32884, "epoch": 195} {"train_loss": -7.522497177124023, "global_step": 32885, "epoch": 195} {"train_loss": -7.489562034606934, "global_step": 32886, "epoch": 195} {"train_loss": -7.270528793334961, "global_step": 32887, "epoch": 195} {"train_loss": -7.4120869636535645, "global_step": 32888, "epoch": 195} {"train_loss": -7.91343879699707, "global_step": 32889, "epoch": 195} {"train_loss": -7.723572254180908, "global_step": 32890, "epoch": 195} {"train_loss": -7.656122207641602, "global_step": 32891, "epoch": 195} {"train_loss": -7.562880516052246, "global_step": 32892, "epoch": 195} {"train_loss": -7.6146721839904785, "global_step": 32893, "epoch": 195} {"train_loss": -7.68143367767334, "global_step": 32894, "epoch": 195} {"train_loss": -7.397728443145752, "global_step": 32895, "epoch": 195} {"train_loss": -7.710911750793457, "global_step": 32896, "epoch": 195} {"train_loss": -7.429411888122559, "global_step": 32897, "epoch": 195} {"train_loss": -7.750896453857422, "global_step": 32898, "epoch": 195} {"train_loss": -7.750067710876465, "global_step": 32899, "epoch": 195} {"train_loss": -7.5912628173828125, "global_step": 32900, "epoch": 195} {"train_loss": -7.703593730926514, "global_step": 32901, "epoch": 195} {"train_loss": -7.71913480758667, "global_step": 32902, "epoch": 195} {"train_loss": -7.642258167266846, "global_step": 32903, "epoch": 195} {"train_loss": -7.712226390838623, "global_step": 32904, "epoch": 195} {"train_loss": -7.794325828552246, "global_step": 32905, "epoch": 195} {"train_loss": -7.778426647186279, "global_step": 32906, "epoch": 195} {"train_loss": -7.597023010253906, "global_step": 32907, "epoch": 195} {"train_loss": -7.80613374710083, "global_step": 32908, "epoch": 195} {"train_loss": -7.499544143676758, "global_step": 32909, "epoch": 195} {"train_loss": -7.361103057861328, "global_step": 32910, "epoch": 195} {"train_loss": -7.7649455070495605, "global_step": 32911, "epoch": 195} {"train_loss": -7.649961471557617, "global_step": 32912, "epoch": 195} {"train_loss": -7.317822456359863, "global_step": 32913, "epoch": 195} {"train_loss": -7.615302085876465, "global_step": 32914, "epoch": 195} {"train_loss": -7.690460205078125, "global_step": 32915, "epoch": 195} {"train_loss": -7.3988847732543945, "global_step": 32916, "epoch": 195} {"train_loss": -7.452998161315918, "global_step": 32917, "epoch": 195} {"train_loss": -7.648614406585693, "global_step": 32918, "epoch": 195} {"train_loss": -7.612818717956543, "global_step": 32919, "epoch": 195} {"train_loss": -7.5338335037231445, "global_step": 32920, "epoch": 195} {"train_loss": -7.446719169616699, "global_step": 32921, "epoch": 195} {"train_loss": -7.505859375, "global_step": 32922, "epoch": 195} {"train_loss": -7.767168998718262, "global_step": 32923, "epoch": 195} {"train_loss": -7.73323917388916, "global_step": 32924, "epoch": 195} {"train_loss": -7.601483345031738, "global_step": 32925, "epoch": 195} {"train_loss": -7.546133518218994, "global_step": 32926, "epoch": 195} {"train_loss": -7.602726385706947, "global_step": 32927, "epoch": 195, "val_loss": 187872.65625, "train_action_mse_error": 15.389421463012695} {"train_loss": -7.678696632385254, "global_step": 32928, "epoch": 196} {"train_loss": -7.684815406799316, "global_step": 32929, "epoch": 196} {"train_loss": -7.680203437805176, "global_step": 32930, "epoch": 196} {"train_loss": -7.585467338562012, "global_step": 32931, "epoch": 196} {"train_loss": -7.621884346008301, "global_step": 32932, "epoch": 196} {"train_loss": -7.598203659057617, "global_step": 32933, "epoch": 196} {"train_loss": -7.5050835609436035, "global_step": 32934, "epoch": 196} {"train_loss": -7.817989349365234, "global_step": 32935, "epoch": 196} {"train_loss": -7.583962917327881, "global_step": 32936, "epoch": 196} {"train_loss": -7.723984241485596, "global_step": 32937, "epoch": 196} {"train_loss": -7.268796920776367, "global_step": 32938, "epoch": 196} {"train_loss": -7.732368469238281, "global_step": 32939, "epoch": 196} {"train_loss": -7.755305290222168, "global_step": 32940, "epoch": 196} {"train_loss": -7.589115142822266, "global_step": 32941, "epoch": 196} {"train_loss": -7.7715888023376465, "global_step": 32942, "epoch": 196} {"train_loss": -7.354556083679199, "global_step": 32943, "epoch": 196} {"train_loss": -7.681246757507324, "global_step": 32944, "epoch": 196} {"train_loss": -7.554229736328125, "global_step": 32945, "epoch": 196} {"train_loss": -7.670828819274902, "global_step": 32946, "epoch": 196} {"train_loss": -7.526389122009277, "global_step": 32947, "epoch": 196} {"train_loss": -7.361476898193359, "global_step": 32948, "epoch": 196} {"train_loss": -7.662296295166016, "global_step": 32949, "epoch": 196} {"train_loss": -7.5204973220825195, "global_step": 32950, "epoch": 196} {"train_loss": -7.726504325866699, "global_step": 32951, "epoch": 196} {"train_loss": -7.690626621246338, "global_step": 32952, "epoch": 196} {"train_loss": -7.720319747924805, "global_step": 32953, "epoch": 196} {"train_loss": -7.6663665771484375, "global_step": 32954, "epoch": 196} {"train_loss": -7.63001823425293, "global_step": 32955, "epoch": 196} {"train_loss": -7.829660892486572, "global_step": 32956, "epoch": 196} {"train_loss": -7.515952110290527, "global_step": 32957, "epoch": 196} {"train_loss": -7.568807125091553, "global_step": 32958, "epoch": 196} {"train_loss": -7.597251892089844, "global_step": 32959, "epoch": 196} {"train_loss": -7.547840595245361, "global_step": 32960, "epoch": 196} {"train_loss": -7.522274017333984, "global_step": 32961, "epoch": 196} {"train_loss": -7.572040557861328, "global_step": 32962, "epoch": 196} {"train_loss": -7.061122417449951, "global_step": 32963, "epoch": 196} {"train_loss": -7.424619674682617, "global_step": 32964, "epoch": 196} {"train_loss": -7.3981122970581055, "global_step": 32965, "epoch": 196} {"train_loss": -7.63193941116333, "global_step": 32966, "epoch": 196} {"train_loss": -7.367475509643555, "global_step": 32967, "epoch": 196} {"train_loss": -7.500353813171387, "global_step": 32968, "epoch": 196} {"train_loss": -7.375533580780029, "global_step": 32969, "epoch": 196} {"train_loss": -7.506962299346924, "global_step": 32970, "epoch": 196} {"train_loss": -7.60128116607666, "global_step": 32971, "epoch": 196} {"train_loss": -7.4017229080200195, "global_step": 32972, "epoch": 196} {"train_loss": -7.621452331542969, "global_step": 32973, "epoch": 196} {"train_loss": -7.319049835205078, "global_step": 32974, "epoch": 196} {"train_loss": -7.6265363693237305, "global_step": 32975, "epoch": 196} {"train_loss": -7.575957298278809, "global_step": 32976, "epoch": 196} {"train_loss": -7.6047258377075195, "global_step": 32977, "epoch": 196} {"train_loss": -7.603602886199951, "global_step": 32978, "epoch": 196} {"train_loss": -7.684727668762207, "global_step": 32979, "epoch": 196} {"train_loss": -7.5178728103637695, "global_step": 32980, "epoch": 196} {"train_loss": -7.61920690536499, "global_step": 32981, "epoch": 196} {"train_loss": -7.688918590545654, "global_step": 32982, "epoch": 196} {"train_loss": -7.583099365234375, "global_step": 32983, "epoch": 196} {"train_loss": -7.48497200012207, "global_step": 32984, "epoch": 196} {"train_loss": -7.655653953552246, "global_step": 32985, "epoch": 196} {"train_loss": -7.6919264793396, "global_step": 32986, "epoch": 196} {"train_loss": -7.78850793838501, "global_step": 32987, "epoch": 196} {"train_loss": -7.640726089477539, "global_step": 32988, "epoch": 196} {"train_loss": -7.875732421875, "global_step": 32989, "epoch": 196} {"train_loss": -7.4952392578125, "global_step": 32990, "epoch": 196} {"train_loss": -7.566370487213135, "global_step": 32991, "epoch": 196} {"train_loss": -7.509399890899658, "global_step": 32992, "epoch": 196} {"train_loss": -7.5892839431762695, "global_step": 32993, "epoch": 196} {"train_loss": -7.8251495361328125, "global_step": 32994, "epoch": 196} {"train_loss": -7.374242305755615, "global_step": 32995, "epoch": 196} {"train_loss": -7.813239097595215, "global_step": 32996, "epoch": 196} {"train_loss": -7.790754318237305, "global_step": 32997, "epoch": 196} {"train_loss": -7.444063663482666, "global_step": 32998, "epoch": 196} {"train_loss": -7.653285980224609, "global_step": 32999, "epoch": 196} {"train_loss": -7.420902252197266, "global_step": 33000, "epoch": 196} {"train_loss": -7.7328715324401855, "global_step": 33001, "epoch": 196} {"train_loss": -7.481527328491211, "global_step": 33002, "epoch": 196} {"train_loss": -7.53989315032959, "global_step": 33003, "epoch": 196} {"train_loss": -7.6068878173828125, "global_step": 33004, "epoch": 196} {"train_loss": -7.515222549438477, "global_step": 33005, "epoch": 196} {"train_loss": -7.633569717407227, "global_step": 33006, "epoch": 196} {"train_loss": -7.449428558349609, "global_step": 33007, "epoch": 196} {"train_loss": -7.7499189376831055, "global_step": 33008, "epoch": 196} {"train_loss": -7.570035934448242, "global_step": 33009, "epoch": 196} {"train_loss": -7.517226219177246, "global_step": 33010, "epoch": 196} {"train_loss": -7.434089660644531, "global_step": 33011, "epoch": 196} {"train_loss": -7.816220283508301, "global_step": 33012, "epoch": 196} {"train_loss": -7.406380653381348, "global_step": 33013, "epoch": 196} {"train_loss": -7.491867542266846, "global_step": 33014, "epoch": 196} {"train_loss": -7.862709999084473, "global_step": 33015, "epoch": 196} {"train_loss": -7.69492244720459, "global_step": 33016, "epoch": 196} {"train_loss": -7.583840847015381, "global_step": 33017, "epoch": 196} {"train_loss": -7.539031505584717, "global_step": 33018, "epoch": 196} {"train_loss": -7.460763931274414, "global_step": 33019, "epoch": 196} {"train_loss": -7.64223575592041, "global_step": 33020, "epoch": 196} {"train_loss": -7.56545877456665, "global_step": 33021, "epoch": 196} {"train_loss": -7.683825492858887, "global_step": 33022, "epoch": 196} {"train_loss": -7.522774696350098, "global_step": 33023, "epoch": 196} {"train_loss": -7.4755425453186035, "global_step": 33024, "epoch": 196} {"train_loss": -7.540510177612305, "global_step": 33025, "epoch": 196} {"train_loss": -7.618012428283691, "global_step": 33026, "epoch": 196} {"train_loss": -7.603653907775879, "global_step": 33027, "epoch": 196} {"train_loss": -7.617219924926758, "global_step": 33028, "epoch": 196} {"train_loss": -7.752283096313477, "global_step": 33029, "epoch": 196} {"train_loss": -7.4014129638671875, "global_step": 33030, "epoch": 196} {"train_loss": -7.605663299560547, "global_step": 33031, "epoch": 196} {"train_loss": -7.695537567138672, "global_step": 33032, "epoch": 196} {"train_loss": -7.74089241027832, "global_step": 33033, "epoch": 196} {"train_loss": -7.662603378295898, "global_step": 33034, "epoch": 196} {"train_loss": -7.592008590698242, "global_step": 33035, "epoch": 196} {"train_loss": -7.546136856079102, "global_step": 33036, "epoch": 196} {"train_loss": -7.6317524909973145, "global_step": 33037, "epoch": 196} {"train_loss": -7.734354019165039, "global_step": 33038, "epoch": 196} {"train_loss": -7.59578800201416, "global_step": 33039, "epoch": 196} {"train_loss": -7.689291000366211, "global_step": 33040, "epoch": 196} {"train_loss": -7.677549362182617, "global_step": 33041, "epoch": 196} {"train_loss": -7.929416656494141, "global_step": 33042, "epoch": 196} {"train_loss": -7.845198631286621, "global_step": 33043, "epoch": 196} {"train_loss": -7.682867050170898, "global_step": 33044, "epoch": 196} {"train_loss": -7.4953155517578125, "global_step": 33045, "epoch": 196} {"train_loss": -7.563967704772949, "global_step": 33046, "epoch": 196} {"train_loss": -7.592623233795166, "global_step": 33047, "epoch": 196} {"train_loss": -7.582100868225098, "global_step": 33048, "epoch": 196} {"train_loss": -7.670754432678223, "global_step": 33049, "epoch": 196} {"train_loss": -7.526825428009033, "global_step": 33050, "epoch": 196} {"train_loss": -7.600891590118408, "global_step": 33051, "epoch": 196} {"train_loss": -7.59628963470459, "global_step": 33052, "epoch": 196} {"train_loss": -7.7908453941345215, "global_step": 33053, "epoch": 196} {"train_loss": -7.516603946685791, "global_step": 33054, "epoch": 196} {"train_loss": -7.669999122619629, "global_step": 33055, "epoch": 196} {"train_loss": -7.77495002746582, "global_step": 33056, "epoch": 196} {"train_loss": -7.660174369812012, "global_step": 33057, "epoch": 196} {"train_loss": -7.457651615142822, "global_step": 33058, "epoch": 196} {"train_loss": -7.664705276489258, "global_step": 33059, "epoch": 196} {"train_loss": -7.504279613494873, "global_step": 33060, "epoch": 196} {"train_loss": -7.581609725952148, "global_step": 33061, "epoch": 196} {"train_loss": -7.462029457092285, "global_step": 33062, "epoch": 196} {"train_loss": -7.683908462524414, "global_step": 33063, "epoch": 196} {"train_loss": -7.5151143074035645, "global_step": 33064, "epoch": 196} {"train_loss": -7.777166366577148, "global_step": 33065, "epoch": 196} {"train_loss": -7.471404075622559, "global_step": 33066, "epoch": 196} {"train_loss": -7.774311542510986, "global_step": 33067, "epoch": 196} {"train_loss": -7.408297538757324, "global_step": 33068, "epoch": 196} {"train_loss": -7.5933027267456055, "global_step": 33069, "epoch": 196} {"train_loss": -7.4143853187561035, "global_step": 33070, "epoch": 196} {"train_loss": -7.828266143798828, "global_step": 33071, "epoch": 196} {"train_loss": -7.283454895019531, "global_step": 33072, "epoch": 196} {"train_loss": -7.789720058441162, "global_step": 33073, "epoch": 196} {"train_loss": -7.7496867179870605, "global_step": 33074, "epoch": 196} {"train_loss": -7.646924018859863, "global_step": 33075, "epoch": 196} {"train_loss": -7.753328800201416, "global_step": 33076, "epoch": 196} {"train_loss": -7.881096839904785, "global_step": 33077, "epoch": 196} {"train_loss": -7.70612907409668, "global_step": 33078, "epoch": 196} {"train_loss": -7.753353595733643, "global_step": 33079, "epoch": 196} {"train_loss": -7.572040557861328, "global_step": 33080, "epoch": 196} {"train_loss": -7.849903106689453, "global_step": 33081, "epoch": 196} {"train_loss": -7.85847282409668, "global_step": 33082, "epoch": 196} {"train_loss": -7.753180503845215, "global_step": 33083, "epoch": 196} {"train_loss": -7.864102363586426, "global_step": 33084, "epoch": 196} {"train_loss": -7.810985565185547, "global_step": 33085, "epoch": 196} {"train_loss": -7.817616939544678, "global_step": 33086, "epoch": 196} {"train_loss": -7.685585021972656, "global_step": 33087, "epoch": 196} {"train_loss": -7.659827709197998, "global_step": 33088, "epoch": 196} {"train_loss": -7.333010196685791, "global_step": 33089, "epoch": 196} {"train_loss": -7.676479816436768, "global_step": 33090, "epoch": 196} {"train_loss": -7.698425769805908, "global_step": 33091, "epoch": 196} {"train_loss": -7.501260757446289, "global_step": 33092, "epoch": 196} {"train_loss": -7.362974643707275, "global_step": 33093, "epoch": 196} {"train_loss": -7.623527526855469, "global_step": 33094, "epoch": 196} {"train_loss": -7.608803258055732, "global_step": 33095, "epoch": 196, "val_loss": 187938.734375} {"train_loss": -7.673925399780273, "global_step": 33096, "epoch": 197} {"train_loss": -7.9514360427856445, "global_step": 33097, "epoch": 197} {"train_loss": -7.669651985168457, "global_step": 33098, "epoch": 197} {"train_loss": -7.579520225524902, "global_step": 33099, "epoch": 197} {"train_loss": -7.6936235427856445, "global_step": 33100, "epoch": 197} {"train_loss": -7.6920671463012695, "global_step": 33101, "epoch": 197} {"train_loss": -7.538873672485352, "global_step": 33102, "epoch": 197} {"train_loss": -7.635857105255127, "global_step": 33103, "epoch": 197} {"train_loss": -7.6510467529296875, "global_step": 33104, "epoch": 197} {"train_loss": -7.52201509475708, "global_step": 33105, "epoch": 197} {"train_loss": -7.67551326751709, "global_step": 33106, "epoch": 197} {"train_loss": -7.599653244018555, "global_step": 33107, "epoch": 197} {"train_loss": -7.586188793182373, "global_step": 33108, "epoch": 197} {"train_loss": -7.588493824005127, "global_step": 33109, "epoch": 197} {"train_loss": -7.700442314147949, "global_step": 33110, "epoch": 197} {"train_loss": -7.623247146606445, "global_step": 33111, "epoch": 197} {"train_loss": -7.344975471496582, "global_step": 33112, "epoch": 197} {"train_loss": -7.651760101318359, "global_step": 33113, "epoch": 197} {"train_loss": -7.606754302978516, "global_step": 33114, "epoch": 197} {"train_loss": -7.561767101287842, "global_step": 33115, "epoch": 197} {"train_loss": -7.669371128082275, "global_step": 33116, "epoch": 197} {"train_loss": -7.624779224395752, "global_step": 33117, "epoch": 197} {"train_loss": -7.588657379150391, "global_step": 33118, "epoch": 197} {"train_loss": -7.571601390838623, "global_step": 33119, "epoch": 197} {"train_loss": -7.587021827697754, "global_step": 33120, "epoch": 197} {"train_loss": -7.456539154052734, "global_step": 33121, "epoch": 197} {"train_loss": -7.349907875061035, "global_step": 33122, "epoch": 197} {"train_loss": -7.561069488525391, "global_step": 33123, "epoch": 197} {"train_loss": -7.771955490112305, "global_step": 33124, "epoch": 197} {"train_loss": -7.263706207275391, "global_step": 33125, "epoch": 197} {"train_loss": -7.694906234741211, "global_step": 33126, "epoch": 197} {"train_loss": -7.702213287353516, "global_step": 33127, "epoch": 197} {"train_loss": -7.520503520965576, "global_step": 33128, "epoch": 197} {"train_loss": -7.636260032653809, "global_step": 33129, "epoch": 197} {"train_loss": -7.605076789855957, "global_step": 33130, "epoch": 197} {"train_loss": -7.524023056030273, "global_step": 33131, "epoch": 197} {"train_loss": -7.523111343383789, "global_step": 33132, "epoch": 197} {"train_loss": -7.533987522125244, "global_step": 33133, "epoch": 197} {"train_loss": -7.582511901855469, "global_step": 33134, "epoch": 197} {"train_loss": -7.363131046295166, "global_step": 33135, "epoch": 197} {"train_loss": -7.568876266479492, "global_step": 33136, "epoch": 197} {"train_loss": -7.748167991638184, "global_step": 33137, "epoch": 197} {"train_loss": -7.588576316833496, "global_step": 33138, "epoch": 197} {"train_loss": -7.394080638885498, "global_step": 33139, "epoch": 197} {"train_loss": -7.606942176818848, "global_step": 33140, "epoch": 197} {"train_loss": -7.468174934387207, "global_step": 33141, "epoch": 197} {"train_loss": -7.488001823425293, "global_step": 33142, "epoch": 197} {"train_loss": -7.578773021697998, "global_step": 33143, "epoch": 197} {"train_loss": -7.626059532165527, "global_step": 33144, "epoch": 197} {"train_loss": -7.455957412719727, "global_step": 33145, "epoch": 197} {"train_loss": -7.436648368835449, "global_step": 33146, "epoch": 197} {"train_loss": -7.6926093101501465, "global_step": 33147, "epoch": 197} {"train_loss": -7.731998443603516, "global_step": 33148, "epoch": 197} {"train_loss": -7.674083709716797, "global_step": 33149, "epoch": 197} {"train_loss": -7.6202569007873535, "global_step": 33150, "epoch": 197} {"train_loss": -7.598343849182129, "global_step": 33151, "epoch": 197} {"train_loss": -7.771706581115723, "global_step": 33152, "epoch": 197} {"train_loss": -7.530342102050781, "global_step": 33153, "epoch": 197} {"train_loss": -7.555593490600586, "global_step": 33154, "epoch": 197} {"train_loss": -7.661624908447266, "global_step": 33155, "epoch": 197} {"train_loss": -7.548125267028809, "global_step": 33156, "epoch": 197} {"train_loss": -7.426231861114502, "global_step": 33157, "epoch": 197} {"train_loss": -7.237520217895508, "global_step": 33158, "epoch": 197} {"train_loss": -7.4150238037109375, "global_step": 33159, "epoch": 197} {"train_loss": -7.433391571044922, "global_step": 33160, "epoch": 197} {"train_loss": -7.503594398498535, "global_step": 33161, "epoch": 197} {"train_loss": -7.587884426116943, "global_step": 33162, "epoch": 197} {"train_loss": -7.426612854003906, "global_step": 33163, "epoch": 197} {"train_loss": -7.502406120300293, "global_step": 33164, "epoch": 197} {"train_loss": -7.335624694824219, "global_step": 33165, "epoch": 197} {"train_loss": -7.71592903137207, "global_step": 33166, "epoch": 197} {"train_loss": -7.443846702575684, "global_step": 33167, "epoch": 197} {"train_loss": -7.326319217681885, "global_step": 33168, "epoch": 197} {"train_loss": -7.7875752449035645, "global_step": 33169, "epoch": 197} {"train_loss": -7.352439880371094, "global_step": 33170, "epoch": 197} {"train_loss": -7.490964412689209, "global_step": 33171, "epoch": 197} {"train_loss": -7.509111404418945, "global_step": 33172, "epoch": 197} {"train_loss": -7.547144889831543, "global_step": 33173, "epoch": 197} {"train_loss": -7.576728820800781, "global_step": 33174, "epoch": 197} {"train_loss": -7.27900505065918, "global_step": 33175, "epoch": 197} {"train_loss": -7.6103739738464355, "global_step": 33176, "epoch": 197} {"train_loss": -7.585091590881348, "global_step": 33177, "epoch": 197} {"train_loss": -7.555294990539551, "global_step": 33178, "epoch": 197} {"train_loss": -7.287334442138672, "global_step": 33179, "epoch": 197} {"train_loss": -7.598602294921875, "global_step": 33180, "epoch": 197} {"train_loss": -7.498927116394043, "global_step": 33181, "epoch": 197} {"train_loss": -7.543684959411621, "global_step": 33182, "epoch": 197} {"train_loss": -7.769540786743164, "global_step": 33183, "epoch": 197} {"train_loss": -7.396471977233887, "global_step": 33184, "epoch": 197} {"train_loss": -7.451958656311035, "global_step": 33185, "epoch": 197} {"train_loss": -7.462245464324951, "global_step": 33186, "epoch": 197} {"train_loss": -7.800255298614502, "global_step": 33187, "epoch": 197} {"train_loss": -7.629693508148193, "global_step": 33188, "epoch": 197} {"train_loss": -7.372105598449707, "global_step": 33189, "epoch": 197} {"train_loss": -7.56722354888916, "global_step": 33190, "epoch": 197} {"train_loss": -7.592009544372559, "global_step": 33191, "epoch": 197} {"train_loss": -7.58597469329834, "global_step": 33192, "epoch": 197} {"train_loss": -7.563510894775391, "global_step": 33193, "epoch": 197} {"train_loss": -7.607551097869873, "global_step": 33194, "epoch": 197} {"train_loss": -7.481527328491211, "global_step": 33195, "epoch": 197} {"train_loss": -7.535255432128906, "global_step": 33196, "epoch": 197} {"train_loss": -7.705593585968018, "global_step": 33197, "epoch": 197} {"train_loss": -7.879056930541992, "global_step": 33198, "epoch": 197} {"train_loss": -7.624263763427734, "global_step": 33199, "epoch": 197} {"train_loss": -7.659482955932617, "global_step": 33200, "epoch": 197} {"train_loss": -7.620932102203369, "global_step": 33201, "epoch": 197} {"train_loss": -7.675119876861572, "global_step": 33202, "epoch": 197} {"train_loss": -7.498554229736328, "global_step": 33203, "epoch": 197} {"train_loss": -7.709244728088379, "global_step": 33204, "epoch": 197} {"train_loss": -7.296918869018555, "global_step": 33205, "epoch": 197} {"train_loss": -7.689443588256836, "global_step": 33206, "epoch": 197} {"train_loss": -7.6216230392456055, "global_step": 33207, "epoch": 197} {"train_loss": -7.543894290924072, "global_step": 33208, "epoch": 197} {"train_loss": -7.767560005187988, "global_step": 33209, "epoch": 197} {"train_loss": -7.695910930633545, "global_step": 33210, "epoch": 197} {"train_loss": -7.740677356719971, "global_step": 33211, "epoch": 197} {"train_loss": -7.695394992828369, "global_step": 33212, "epoch": 197} {"train_loss": -7.594437599182129, "global_step": 33213, "epoch": 197} {"train_loss": -7.8538899421691895, "global_step": 33214, "epoch": 197} {"train_loss": -7.759356498718262, "global_step": 33215, "epoch": 197} {"train_loss": -7.509305953979492, "global_step": 33216, "epoch": 197} {"train_loss": -7.834986686706543, "global_step": 33217, "epoch": 197} {"train_loss": -7.765298366546631, "global_step": 33218, "epoch": 197} {"train_loss": -7.730987548828125, "global_step": 33219, "epoch": 197} {"train_loss": -7.675446510314941, "global_step": 33220, "epoch": 197} {"train_loss": -7.597101211547852, "global_step": 33221, "epoch": 197} {"train_loss": -7.927969932556152, "global_step": 33222, "epoch": 197} {"train_loss": -7.734019756317139, "global_step": 33223, "epoch": 197} {"train_loss": -7.754398345947266, "global_step": 33224, "epoch": 197} {"train_loss": -7.853939056396484, "global_step": 33225, "epoch": 197} {"train_loss": -7.754841327667236, "global_step": 33226, "epoch": 197} {"train_loss": -7.749879360198975, "global_step": 33227, "epoch": 197} {"train_loss": -7.652539253234863, "global_step": 33228, "epoch": 197} {"train_loss": -7.761351108551025, "global_step": 33229, "epoch": 197} {"train_loss": -7.836462497711182, "global_step": 33230, "epoch": 197} {"train_loss": -7.547938823699951, "global_step": 33231, "epoch": 197} {"train_loss": -7.925616264343262, "global_step": 33232, "epoch": 197} {"train_loss": -7.656195640563965, "global_step": 33233, "epoch": 197} {"train_loss": -7.762216567993164, "global_step": 33234, "epoch": 197} {"train_loss": -7.659308433532715, "global_step": 33235, "epoch": 197} {"train_loss": -7.657200813293457, "global_step": 33236, "epoch": 197} {"train_loss": -7.4215989112854, "global_step": 33237, "epoch": 197} {"train_loss": -7.691651344299316, "global_step": 33238, "epoch": 197} {"train_loss": -7.646154403686523, "global_step": 33239, "epoch": 197} {"train_loss": -7.143031120300293, "global_step": 33240, "epoch": 197} {"train_loss": -7.633288383483887, "global_step": 33241, "epoch": 197} {"train_loss": -7.587466239929199, "global_step": 33242, "epoch": 197} {"train_loss": -7.362981796264648, "global_step": 33243, "epoch": 197} {"train_loss": -7.485494136810303, "global_step": 33244, "epoch": 197} {"train_loss": -7.461381912231445, "global_step": 33245, "epoch": 197} {"train_loss": -7.61918830871582, "global_step": 33246, "epoch": 197} {"train_loss": -7.397919654846191, "global_step": 33247, "epoch": 197} {"train_loss": -7.334290504455566, "global_step": 33248, "epoch": 197} {"train_loss": -7.638613700866699, "global_step": 33249, "epoch": 197} {"train_loss": -7.66721248626709, "global_step": 33250, "epoch": 197} {"train_loss": -7.408536434173584, "global_step": 33251, "epoch": 197} {"train_loss": -7.353879928588867, "global_step": 33252, "epoch": 197} {"train_loss": -7.367433547973633, "global_step": 33253, "epoch": 197} {"train_loss": -7.524325370788574, "global_step": 33254, "epoch": 197} {"train_loss": -7.458788871765137, "global_step": 33255, "epoch": 197} {"train_loss": -7.449417591094971, "global_step": 33256, "epoch": 197} {"train_loss": -7.388525009155273, "global_step": 33257, "epoch": 197} {"train_loss": -7.467378616333008, "global_step": 33258, "epoch": 197} {"train_loss": -7.690584659576416, "global_step": 33259, "epoch": 197} {"train_loss": -7.598573207855225, "global_step": 33260, "epoch": 197} {"train_loss": -7.6906418800354, "global_step": 33261, "epoch": 197} {"train_loss": -7.576724052429199, "global_step": 33262, "epoch": 197} {"train_loss": -7.582136934711819, "global_step": 33263, "epoch": 197, "val_loss": 189217.3125} {"train_loss": -7.680905342102051, "global_step": 33264, "epoch": 198} {"train_loss": -7.517963409423828, "global_step": 33265, "epoch": 198} {"train_loss": -7.695944786071777, "global_step": 33266, "epoch": 198} {"train_loss": -7.778037071228027, "global_step": 33267, "epoch": 198} {"train_loss": -7.610956192016602, "global_step": 33268, "epoch": 198} {"train_loss": -7.83612585067749, "global_step": 33269, "epoch": 198} {"train_loss": -7.398118495941162, "global_step": 33270, "epoch": 198} {"train_loss": -7.76790714263916, "global_step": 33271, "epoch": 198} {"train_loss": -7.63584566116333, "global_step": 33272, "epoch": 198} {"train_loss": -7.8392133712768555, "global_step": 33273, "epoch": 198} {"train_loss": -7.58473014831543, "global_step": 33274, "epoch": 198} {"train_loss": -7.772137641906738, "global_step": 33275, "epoch": 198} {"train_loss": -7.701210975646973, "global_step": 33276, "epoch": 198} {"train_loss": -7.837038040161133, "global_step": 33277, "epoch": 198} {"train_loss": -7.416907787322998, "global_step": 33278, "epoch": 198} {"train_loss": -7.551609516143799, "global_step": 33279, "epoch": 198} {"train_loss": -7.820265769958496, "global_step": 33280, "epoch": 198} {"train_loss": -7.594204902648926, "global_step": 33281, "epoch": 198} {"train_loss": -7.696898460388184, "global_step": 33282, "epoch": 198} {"train_loss": -7.63163423538208, "global_step": 33283, "epoch": 198} {"train_loss": -7.628406047821045, "global_step": 33284, "epoch": 198} {"train_loss": -7.702810287475586, "global_step": 33285, "epoch": 198} {"train_loss": -7.789801597595215, "global_step": 33286, "epoch": 198} {"train_loss": -7.628746032714844, "global_step": 33287, "epoch": 198} {"train_loss": -7.616918563842773, "global_step": 33288, "epoch": 198} {"train_loss": -7.646378517150879, "global_step": 33289, "epoch": 198} {"train_loss": -7.661448955535889, "global_step": 33290, "epoch": 198} {"train_loss": -7.4979047775268555, "global_step": 33291, "epoch": 198} {"train_loss": -7.6636457443237305, "global_step": 33292, "epoch": 198} {"train_loss": -7.581869125366211, "global_step": 33293, "epoch": 198} {"train_loss": -7.817386627197266, "global_step": 33294, "epoch": 198} {"train_loss": -7.453293800354004, "global_step": 33295, "epoch": 198} {"train_loss": -7.673208713531494, "global_step": 33296, "epoch": 198} {"train_loss": -7.423288345336914, "global_step": 33297, "epoch": 198} {"train_loss": -7.553771018981934, "global_step": 33298, "epoch": 198} {"train_loss": -7.2578558921813965, "global_step": 33299, "epoch": 198} {"train_loss": -7.433333396911621, "global_step": 33300, "epoch": 198} {"train_loss": -7.180267333984375, "global_step": 33301, "epoch": 198} {"train_loss": -7.547204971313477, "global_step": 33302, "epoch": 198} {"train_loss": -7.263840198516846, "global_step": 33303, "epoch": 198} {"train_loss": -7.486087799072266, "global_step": 33304, "epoch": 198} {"train_loss": -6.9466142654418945, "global_step": 33305, "epoch": 198} {"train_loss": -7.308605670928955, "global_step": 33306, "epoch": 198} {"train_loss": -7.400732040405273, "global_step": 33307, "epoch": 198} {"train_loss": -6.9711432456970215, "global_step": 33308, "epoch": 198} {"train_loss": -7.555445671081543, "global_step": 33309, "epoch": 198} {"train_loss": -7.39234733581543, "global_step": 33310, "epoch": 198} {"train_loss": -7.504495143890381, "global_step": 33311, "epoch": 198} {"train_loss": -7.579519271850586, "global_step": 33312, "epoch": 198} {"train_loss": -7.276090621948242, "global_step": 33313, "epoch": 198} {"train_loss": -7.392888069152832, "global_step": 33314, "epoch": 198} {"train_loss": -7.55178689956665, "global_step": 33315, "epoch": 198} {"train_loss": -7.196896553039551, "global_step": 33316, "epoch": 198} {"train_loss": -7.381784439086914, "global_step": 33317, "epoch": 198} {"train_loss": -7.658478736877441, "global_step": 33318, "epoch": 198} {"train_loss": -7.572835445404053, "global_step": 33319, "epoch": 198} {"train_loss": -7.601032257080078, "global_step": 33320, "epoch": 198} {"train_loss": -7.563155651092529, "global_step": 33321, "epoch": 198} {"train_loss": -7.679420471191406, "global_step": 33322, "epoch": 198} {"train_loss": -7.835109710693359, "global_step": 33323, "epoch": 198} {"train_loss": -7.593477725982666, "global_step": 33324, "epoch": 198} {"train_loss": -7.705307483673096, "global_step": 33325, "epoch": 198} {"train_loss": -7.561809062957764, "global_step": 33326, "epoch": 198} {"train_loss": -7.691656112670898, "global_step": 33327, "epoch": 198} {"train_loss": -7.719253063201904, "global_step": 33328, "epoch": 198} {"train_loss": -7.936789035797119, "global_step": 33329, "epoch": 198} {"train_loss": -7.810151100158691, "global_step": 33330, "epoch": 198} {"train_loss": -7.810857772827148, "global_step": 33331, "epoch": 198} {"train_loss": -7.664080619812012, "global_step": 33332, "epoch": 198} {"train_loss": -7.7935943603515625, "global_step": 33333, "epoch": 198} {"train_loss": -7.588829040527344, "global_step": 33334, "epoch": 198} {"train_loss": -7.593319892883301, "global_step": 33335, "epoch": 198} {"train_loss": -7.6677422523498535, "global_step": 33336, "epoch": 198} {"train_loss": -7.488325119018555, "global_step": 33337, "epoch": 198} {"train_loss": -7.613130569458008, "global_step": 33338, "epoch": 198} {"train_loss": -7.665480613708496, "global_step": 33339, "epoch": 198} {"train_loss": -7.3389482498168945, "global_step": 33340, "epoch": 198} {"train_loss": -7.329425811767578, "global_step": 33341, "epoch": 198} {"train_loss": -7.699313163757324, "global_step": 33342, "epoch": 198} {"train_loss": -7.696866989135742, "global_step": 33343, "epoch": 198} {"train_loss": -7.468134880065918, "global_step": 33344, "epoch": 198} {"train_loss": -7.28629732131958, "global_step": 33345, "epoch": 198} {"train_loss": -7.676450729370117, "global_step": 33346, "epoch": 198} {"train_loss": -7.349254608154297, "global_step": 33347, "epoch": 198} {"train_loss": -7.493899345397949, "global_step": 33348, "epoch": 198} {"train_loss": -7.362115859985352, "global_step": 33349, "epoch": 198} {"train_loss": -7.797364234924316, "global_step": 33350, "epoch": 198} {"train_loss": -7.218234062194824, "global_step": 33351, "epoch": 198} {"train_loss": -7.615107536315918, "global_step": 33352, "epoch": 198} {"train_loss": -7.378056526184082, "global_step": 33353, "epoch": 198} {"train_loss": -7.5901641845703125, "global_step": 33354, "epoch": 198} {"train_loss": -7.600706577301025, "global_step": 33355, "epoch": 198} {"train_loss": -7.528423309326172, "global_step": 33356, "epoch": 198} {"train_loss": -7.403634071350098, "global_step": 33357, "epoch": 198} {"train_loss": -7.5558929443359375, "global_step": 33358, "epoch": 198} {"train_loss": -7.578792572021484, "global_step": 33359, "epoch": 198} {"train_loss": -7.421905517578125, "global_step": 33360, "epoch": 198} {"train_loss": -7.600367069244385, "global_step": 33361, "epoch": 198} {"train_loss": -7.5708723068237305, "global_step": 33362, "epoch": 198} {"train_loss": -7.5711541175842285, "global_step": 33363, "epoch": 198} {"train_loss": -7.529349327087402, "global_step": 33364, "epoch": 198} {"train_loss": -7.535351753234863, "global_step": 33365, "epoch": 198} {"train_loss": -7.631237983703613, "global_step": 33366, "epoch": 198} {"train_loss": -7.731772422790527, "global_step": 33367, "epoch": 198} {"train_loss": -7.6780266761779785, "global_step": 33368, "epoch": 198} {"train_loss": -7.6710052490234375, "global_step": 33369, "epoch": 198} {"train_loss": -7.634894371032715, "global_step": 33370, "epoch": 198} {"train_loss": -7.677938461303711, "global_step": 33371, "epoch": 198} {"train_loss": -7.595073699951172, "global_step": 33372, "epoch": 198} {"train_loss": -7.679434776306152, "global_step": 33373, "epoch": 198} {"train_loss": -7.615887641906738, "global_step": 33374, "epoch": 198} {"train_loss": -7.7699360847473145, "global_step": 33375, "epoch": 198} {"train_loss": -7.431807518005371, "global_step": 33376, "epoch": 198} {"train_loss": -7.923835277557373, "global_step": 33377, "epoch": 198} {"train_loss": -7.638909816741943, "global_step": 33378, "epoch": 198} {"train_loss": -7.741909980773926, "global_step": 33379, "epoch": 198} {"train_loss": -7.531688690185547, "global_step": 33380, "epoch": 198} {"train_loss": -7.738651275634766, "global_step": 33381, "epoch": 198} {"train_loss": -7.360831260681152, "global_step": 33382, "epoch": 198} {"train_loss": -7.609493255615234, "global_step": 33383, "epoch": 198} {"train_loss": -7.542019844055176, "global_step": 33384, "epoch": 198} {"train_loss": -7.754344463348389, "global_step": 33385, "epoch": 198} {"train_loss": -7.580959320068359, "global_step": 33386, "epoch": 198} {"train_loss": -7.464588165283203, "global_step": 33387, "epoch": 198} {"train_loss": -7.653514862060547, "global_step": 33388, "epoch": 198} {"train_loss": -7.601349830627441, "global_step": 33389, "epoch": 198} {"train_loss": -7.714045524597168, "global_step": 33390, "epoch": 198} {"train_loss": -7.52003288269043, "global_step": 33391, "epoch": 198} {"train_loss": -7.907477378845215, "global_step": 33392, "epoch": 198} {"train_loss": -7.235316276550293, "global_step": 33393, "epoch": 198} {"train_loss": -7.847556114196777, "global_step": 33394, "epoch": 198} {"train_loss": -7.49741268157959, "global_step": 33395, "epoch": 198} {"train_loss": -7.7490620613098145, "global_step": 33396, "epoch": 198} {"train_loss": -7.712034225463867, "global_step": 33397, "epoch": 198} {"train_loss": -7.924183368682861, "global_step": 33398, "epoch": 198} {"train_loss": -7.705369472503662, "global_step": 33399, "epoch": 198} {"train_loss": -7.7403035163879395, "global_step": 33400, "epoch": 198} {"train_loss": -7.623014450073242, "global_step": 33401, "epoch": 198} {"train_loss": -7.646564483642578, "global_step": 33402, "epoch": 198} {"train_loss": -7.748146057128906, "global_step": 33403, "epoch": 198} {"train_loss": -7.736586093902588, "global_step": 33404, "epoch": 198} {"train_loss": -7.72824764251709, "global_step": 33405, "epoch": 198} {"train_loss": -7.698780536651611, "global_step": 33406, "epoch": 198} {"train_loss": -7.622330665588379, "global_step": 33407, "epoch": 198} {"train_loss": -7.670024871826172, "global_step": 33408, "epoch": 198} {"train_loss": -7.756591320037842, "global_step": 33409, "epoch": 198} {"train_loss": -7.38873291015625, "global_step": 33410, "epoch": 198} {"train_loss": -7.836276054382324, "global_step": 33411, "epoch": 198} {"train_loss": -7.363326549530029, "global_step": 33412, "epoch": 198} {"train_loss": -7.775079727172852, "global_step": 33413, "epoch": 198} {"train_loss": -7.2390241622924805, "global_step": 33414, "epoch": 198} {"train_loss": -7.701394081115723, "global_step": 33415, "epoch": 198} {"train_loss": -7.3129119873046875, "global_step": 33416, "epoch": 198} {"train_loss": -7.370896816253662, "global_step": 33417, "epoch": 198} {"train_loss": -7.440325736999512, "global_step": 33418, "epoch": 198} {"train_loss": -7.58028507232666, "global_step": 33419, "epoch": 198} {"train_loss": -7.394028663635254, "global_step": 33420, "epoch": 198} {"train_loss": -7.619524002075195, "global_step": 33421, "epoch": 198} {"train_loss": -7.378724098205566, "global_step": 33422, "epoch": 198} {"train_loss": -7.308131694793701, "global_step": 33423, "epoch": 198} {"train_loss": -7.638579368591309, "global_step": 33424, "epoch": 198} {"train_loss": -7.37956428527832, "global_step": 33425, "epoch": 198} {"train_loss": -7.464111328125, "global_step": 33426, "epoch": 198} {"train_loss": -7.509092330932617, "global_step": 33427, "epoch": 198} {"train_loss": -7.507678031921387, "global_step": 33428, "epoch": 198} {"train_loss": -7.5790934562683105, "global_step": 33429, "epoch": 198} {"train_loss": -7.443936347961426, "global_step": 33430, "epoch": 198} {"train_loss": -7.579206475189754, "global_step": 33431, "epoch": 198, "val_loss": 185060.5} {"train_loss": -7.606606483459473, "global_step": 33432, "epoch": 199} {"train_loss": -7.563158988952637, "global_step": 33433, "epoch": 199} {"train_loss": -7.755043029785156, "global_step": 33434, "epoch": 199} {"train_loss": -7.787965774536133, "global_step": 33435, "epoch": 199} {"train_loss": -7.58696985244751, "global_step": 33436, "epoch": 199} {"train_loss": -7.683139801025391, "global_step": 33437, "epoch": 199} {"train_loss": -7.630127429962158, "global_step": 33438, "epoch": 199} {"train_loss": -7.522702217102051, "global_step": 33439, "epoch": 199} {"train_loss": -7.520630836486816, "global_step": 33440, "epoch": 199} {"train_loss": -7.761164665222168, "global_step": 33441, "epoch": 199} {"train_loss": -7.351376533508301, "global_step": 33442, "epoch": 199} {"train_loss": -7.551234245300293, "global_step": 33443, "epoch": 199} {"train_loss": -7.722248077392578, "global_step": 33444, "epoch": 199} {"train_loss": -7.529993057250977, "global_step": 33445, "epoch": 199} {"train_loss": -7.7077789306640625, "global_step": 33446, "epoch": 199} {"train_loss": -7.640206336975098, "global_step": 33447, "epoch": 199} {"train_loss": -7.563787460327148, "global_step": 33448, "epoch": 199} {"train_loss": -7.715117454528809, "global_step": 33449, "epoch": 199} {"train_loss": -7.707427978515625, "global_step": 33450, "epoch": 199} {"train_loss": -7.733054161071777, "global_step": 33451, "epoch": 199} {"train_loss": -7.837164878845215, "global_step": 33452, "epoch": 199} {"train_loss": -7.482907772064209, "global_step": 33453, "epoch": 199} {"train_loss": -7.738009452819824, "global_step": 33454, "epoch": 199} {"train_loss": -7.761974811553955, "global_step": 33455, "epoch": 199} {"train_loss": -7.786525726318359, "global_step": 33456, "epoch": 199} {"train_loss": -7.618349552154541, "global_step": 33457, "epoch": 199} {"train_loss": -7.71452522277832, "global_step": 33458, "epoch": 199} {"train_loss": -7.484493255615234, "global_step": 33459, "epoch": 199} {"train_loss": -7.614462852478027, "global_step": 33460, "epoch": 199} {"train_loss": -7.66593074798584, "global_step": 33461, "epoch": 199} {"train_loss": -7.649838447570801, "global_step": 33462, "epoch": 199} {"train_loss": -7.558756351470947, "global_step": 33463, "epoch": 199} {"train_loss": -7.853538990020752, "global_step": 33464, "epoch": 199} {"train_loss": -7.5035786628723145, "global_step": 33465, "epoch": 199} {"train_loss": -7.5745954513549805, "global_step": 33466, "epoch": 199} {"train_loss": -7.702008247375488, "global_step": 33467, "epoch": 199} {"train_loss": -7.792087554931641, "global_step": 33468, "epoch": 199} {"train_loss": -7.601465225219727, "global_step": 33469, "epoch": 199} {"train_loss": -7.69254732131958, "global_step": 33470, "epoch": 199} {"train_loss": -7.606675148010254, "global_step": 33471, "epoch": 199} {"train_loss": -7.638252258300781, "global_step": 33472, "epoch": 199} {"train_loss": -7.709160804748535, "global_step": 33473, "epoch": 199} {"train_loss": -7.490635871887207, "global_step": 33474, "epoch": 199} {"train_loss": -7.582272529602051, "global_step": 33475, "epoch": 199} {"train_loss": -7.757837295532227, "global_step": 33476, "epoch": 199} {"train_loss": -7.427214622497559, "global_step": 33477, "epoch": 199} {"train_loss": -7.365849018096924, "global_step": 33478, "epoch": 199} {"train_loss": -7.511943817138672, "global_step": 33479, "epoch": 199} {"train_loss": -7.822353363037109, "global_step": 33480, "epoch": 199} {"train_loss": -7.6228132247924805, "global_step": 33481, "epoch": 199} {"train_loss": -7.527218818664551, "global_step": 33482, "epoch": 199} {"train_loss": -7.511043548583984, "global_step": 33483, "epoch": 199} {"train_loss": -7.667729377746582, "global_step": 33484, "epoch": 199} {"train_loss": -7.811032295227051, "global_step": 33485, "epoch": 199} {"train_loss": -7.5072150230407715, "global_step": 33486, "epoch": 199} {"train_loss": -7.631024360656738, "global_step": 33487, "epoch": 199} {"train_loss": -7.48067569732666, "global_step": 33488, "epoch": 199} {"train_loss": -7.419611930847168, "global_step": 33489, "epoch": 199} {"train_loss": -7.574398040771484, "global_step": 33490, "epoch": 199} {"train_loss": -7.57952356338501, "global_step": 33491, "epoch": 199} {"train_loss": -7.738521575927734, "global_step": 33492, "epoch": 199} {"train_loss": -7.3559064865112305, "global_step": 33493, "epoch": 199} {"train_loss": -7.751044273376465, "global_step": 33494, "epoch": 199} {"train_loss": -7.589860439300537, "global_step": 33495, "epoch": 199} {"train_loss": -7.608897686004639, "global_step": 33496, "epoch": 199} {"train_loss": -7.59429931640625, "global_step": 33497, "epoch": 199} {"train_loss": -7.720488548278809, "global_step": 33498, "epoch": 199} {"train_loss": -7.724584579467773, "global_step": 33499, "epoch": 199} {"train_loss": -7.558170795440674, "global_step": 33500, "epoch": 199} {"train_loss": -7.786409854888916, "global_step": 33501, "epoch": 199} {"train_loss": -7.689460754394531, "global_step": 33502, "epoch": 199} {"train_loss": -7.700437545776367, "global_step": 33503, "epoch": 199} {"train_loss": -7.549990177154541, "global_step": 33504, "epoch": 199} {"train_loss": -7.460023880004883, "global_step": 33505, "epoch": 199} {"train_loss": -7.803017616271973, "global_step": 33506, "epoch": 199} {"train_loss": -7.142491340637207, "global_step": 33507, "epoch": 199} {"train_loss": -7.631399154663086, "global_step": 33508, "epoch": 199} {"train_loss": -7.82669734954834, "global_step": 33509, "epoch": 199} {"train_loss": -7.412839889526367, "global_step": 33510, "epoch": 199} {"train_loss": -7.696881294250488, "global_step": 33511, "epoch": 199} {"train_loss": -7.548246383666992, "global_step": 33512, "epoch": 199} {"train_loss": -7.621509075164795, "global_step": 33513, "epoch": 199} {"train_loss": -7.638759613037109, "global_step": 33514, "epoch": 199} {"train_loss": -7.454038619995117, "global_step": 33515, "epoch": 199} {"train_loss": -7.747657299041748, "global_step": 33516, "epoch": 199} {"train_loss": -7.289400100708008, "global_step": 33517, "epoch": 199} {"train_loss": -7.453534126281738, "global_step": 33518, "epoch": 199} {"train_loss": -7.426600933074951, "global_step": 33519, "epoch": 199} {"train_loss": -7.367098808288574, "global_step": 33520, "epoch": 199} {"train_loss": -7.4246625900268555, "global_step": 33521, "epoch": 199} {"train_loss": -7.344789028167725, "global_step": 33522, "epoch": 199} {"train_loss": -7.253107070922852, "global_step": 33523, "epoch": 199} {"train_loss": -7.515138626098633, "global_step": 33524, "epoch": 199} {"train_loss": -7.555206775665283, "global_step": 33525, "epoch": 199} {"train_loss": -7.404379367828369, "global_step": 33526, "epoch": 199} {"train_loss": -7.434864521026611, "global_step": 33527, "epoch": 199} {"train_loss": -7.530601501464844, "global_step": 33528, "epoch": 199} {"train_loss": -7.4511613845825195, "global_step": 33529, "epoch": 199} {"train_loss": -7.336181640625, "global_step": 33530, "epoch": 199} {"train_loss": -7.640171051025391, "global_step": 33531, "epoch": 199} {"train_loss": -7.72542667388916, "global_step": 33532, "epoch": 199} {"train_loss": -7.550884246826172, "global_step": 33533, "epoch": 199} {"train_loss": -7.437979698181152, "global_step": 33534, "epoch": 199} {"train_loss": -7.4495530128479, "global_step": 33535, "epoch": 199} {"train_loss": -7.487205505371094, "global_step": 33536, "epoch": 199} {"train_loss": -7.671394348144531, "global_step": 33537, "epoch": 199} {"train_loss": -7.512013912200928, "global_step": 33538, "epoch": 199} {"train_loss": -7.368191719055176, "global_step": 33539, "epoch": 199} {"train_loss": -7.602471351623535, "global_step": 33540, "epoch": 199} {"train_loss": -7.311574935913086, "global_step": 33541, "epoch": 199} {"train_loss": -7.696264266967773, "global_step": 33542, "epoch": 199} {"train_loss": -7.26344108581543, "global_step": 33543, "epoch": 199} {"train_loss": -7.6633758544921875, "global_step": 33544, "epoch": 199} {"train_loss": -7.432877540588379, "global_step": 33545, "epoch": 199} {"train_loss": -7.646940231323242, "global_step": 33546, "epoch": 199} {"train_loss": -7.356572151184082, "global_step": 33547, "epoch": 199} {"train_loss": -7.737859725952148, "global_step": 33548, "epoch": 199} {"train_loss": -7.600927829742432, "global_step": 33549, "epoch": 199} {"train_loss": -7.594583988189697, "global_step": 33550, "epoch": 199} {"train_loss": -7.489475250244141, "global_step": 33551, "epoch": 199} {"train_loss": -7.317044734954834, "global_step": 33552, "epoch": 199} {"train_loss": -7.664318084716797, "global_step": 33553, "epoch": 199} {"train_loss": -7.211833477020264, "global_step": 33554, "epoch": 199} {"train_loss": -7.5690717697143555, "global_step": 33555, "epoch": 199} {"train_loss": -7.319586753845215, "global_step": 33556, "epoch": 199} {"train_loss": -7.394321918487549, "global_step": 33557, "epoch": 199} {"train_loss": -7.53083610534668, "global_step": 33558, "epoch": 199} {"train_loss": -7.263550758361816, "global_step": 33559, "epoch": 199} {"train_loss": -7.442458152770996, "global_step": 33560, "epoch": 199} {"train_loss": -7.357824325561523, "global_step": 33561, "epoch": 199} {"train_loss": -7.259542465209961, "global_step": 33562, "epoch": 199} {"train_loss": -7.548735618591309, "global_step": 33563, "epoch": 199} {"train_loss": -7.560831546783447, "global_step": 33564, "epoch": 199} {"train_loss": -7.483253479003906, "global_step": 33565, "epoch": 199} {"train_loss": -7.317487716674805, "global_step": 33566, "epoch": 199} {"train_loss": -7.616673946380615, "global_step": 33567, "epoch": 199} {"train_loss": -7.606674671173096, "global_step": 33568, "epoch": 199} {"train_loss": -7.3074493408203125, "global_step": 33569, "epoch": 199} {"train_loss": -7.140162467956543, "global_step": 33570, "epoch": 199} {"train_loss": -7.678889274597168, "global_step": 33571, "epoch": 199} {"train_loss": -7.325033187866211, "global_step": 33572, "epoch": 199} {"train_loss": -7.203116416931152, "global_step": 33573, "epoch": 199} {"train_loss": -7.688876628875732, "global_step": 33574, "epoch": 199} {"train_loss": -7.508315086364746, "global_step": 33575, "epoch": 199} {"train_loss": -7.474371910095215, "global_step": 33576, "epoch": 199} {"train_loss": -7.425509452819824, "global_step": 33577, "epoch": 199} {"train_loss": -7.468356132507324, "global_step": 33578, "epoch": 199} {"train_loss": -7.728743553161621, "global_step": 33579, "epoch": 199} {"train_loss": -7.694793224334717, "global_step": 33580, "epoch": 199} {"train_loss": -7.6182427406311035, "global_step": 33581, "epoch": 199} {"train_loss": -7.5980024337768555, "global_step": 33582, "epoch": 199} {"train_loss": -7.606950283050537, "global_step": 33583, "epoch": 199} {"train_loss": -7.630913257598877, "global_step": 33584, "epoch": 199} {"train_loss": -7.626876354217529, "global_step": 33585, "epoch": 199} {"train_loss": -7.577669143676758, "global_step": 33586, "epoch": 199} {"train_loss": -7.68388557434082, "global_step": 33587, "epoch": 199} {"train_loss": -7.554409980773926, "global_step": 33588, "epoch": 199} {"train_loss": -7.699374198913574, "global_step": 33589, "epoch": 199} {"train_loss": -7.478630065917969, "global_step": 33590, "epoch": 199} {"train_loss": -7.688629627227783, "global_step": 33591, "epoch": 199} {"train_loss": -7.507939338684082, "global_step": 33592, "epoch": 199} {"train_loss": -7.6396026611328125, "global_step": 33593, "epoch": 199} {"train_loss": -7.496584892272949, "global_step": 33594, "epoch": 199} {"train_loss": -7.9331512451171875, "global_step": 33595, "epoch": 199} {"train_loss": -7.658401012420654, "global_step": 33596, "epoch": 199} {"train_loss": -7.71950626373291, "global_step": 33597, "epoch": 199} {"train_loss": -7.630311489105225, "global_step": 33598, "epoch": 199} {"train_loss": -7.565767662865775, "global_step": 33599, "epoch": 199, "val_loss": 185333.125} {"train_loss": -7.546998023986816, "global_step": 33600, "epoch": 200} {"train_loss": -7.786830902099609, "global_step": 33601, "epoch": 200} {"train_loss": -7.763011932373047, "global_step": 33602, "epoch": 200} {"train_loss": -7.756699562072754, "global_step": 33603, "epoch": 200} {"train_loss": -7.604426860809326, "global_step": 33604, "epoch": 200} {"train_loss": -7.854744911193848, "global_step": 33605, "epoch": 200} {"train_loss": -7.489034175872803, "global_step": 33606, "epoch": 200} {"train_loss": -7.697297096252441, "global_step": 33607, "epoch": 200} {"train_loss": -7.706587791442871, "global_step": 33608, "epoch": 200} {"train_loss": -7.6847429275512695, "global_step": 33609, "epoch": 200} {"train_loss": -7.60318660736084, "global_step": 33610, "epoch": 200} {"train_loss": -7.6642632484436035, "global_step": 33611, "epoch": 200} {"train_loss": -7.7422637939453125, "global_step": 33612, "epoch": 200} {"train_loss": -7.65058708190918, "global_step": 33613, "epoch": 200} {"train_loss": -7.495934009552002, "global_step": 33614, "epoch": 200} {"train_loss": -7.775954723358154, "global_step": 33615, "epoch": 200} {"train_loss": -7.390241622924805, "global_step": 33616, "epoch": 200} {"train_loss": -7.400574684143066, "global_step": 33617, "epoch": 200} {"train_loss": -7.5595927238464355, "global_step": 33618, "epoch": 200} {"train_loss": -7.823363304138184, "global_step": 33619, "epoch": 200} {"train_loss": -7.573016166687012, "global_step": 33620, "epoch": 200} {"train_loss": -7.730471611022949, "global_step": 33621, "epoch": 200} {"train_loss": -7.552570343017578, "global_step": 33622, "epoch": 200} {"train_loss": -7.547900199890137, "global_step": 33623, "epoch": 200} {"train_loss": -7.751856803894043, "global_step": 33624, "epoch": 200} {"train_loss": -7.680876731872559, "global_step": 33625, "epoch": 200} {"train_loss": -7.330434799194336, "global_step": 33626, "epoch": 200} {"train_loss": -7.517018795013428, "global_step": 33627, "epoch": 200} {"train_loss": -7.495419502258301, "global_step": 33628, "epoch": 200} {"train_loss": -7.4553351402282715, "global_step": 33629, "epoch": 200} {"train_loss": -7.58073616027832, "global_step": 33630, "epoch": 200} {"train_loss": -7.380908012390137, "global_step": 33631, "epoch": 200} {"train_loss": -7.600800514221191, "global_step": 33632, "epoch": 200} {"train_loss": -7.503972053527832, "global_step": 33633, "epoch": 200} {"train_loss": -7.664917469024658, "global_step": 33634, "epoch": 200} {"train_loss": -7.7386884689331055, "global_step": 33635, "epoch": 200} {"train_loss": -7.783602237701416, "global_step": 33636, "epoch": 200} {"train_loss": -7.688717365264893, "global_step": 33637, "epoch": 200} {"train_loss": -7.482579231262207, "global_step": 33638, "epoch": 200} {"train_loss": -7.717194557189941, "global_step": 33639, "epoch": 200} {"train_loss": -7.517645835876465, "global_step": 33640, "epoch": 200} {"train_loss": -7.626235485076904, "global_step": 33641, "epoch": 200} {"train_loss": -7.662527084350586, "global_step": 33642, "epoch": 200} {"train_loss": -7.629773139953613, "global_step": 33643, "epoch": 200} {"train_loss": -7.600941181182861, "global_step": 33644, "epoch": 200} {"train_loss": -7.7109880447387695, "global_step": 33645, "epoch": 200} {"train_loss": -7.683854103088379, "global_step": 33646, "epoch": 200} {"train_loss": -7.6504950523376465, "global_step": 33647, "epoch": 200} {"train_loss": -7.609768867492676, "global_step": 33648, "epoch": 200} {"train_loss": -7.673191070556641, "global_step": 33649, "epoch": 200} {"train_loss": -7.512969970703125, "global_step": 33650, "epoch": 200} {"train_loss": -7.495601654052734, "global_step": 33651, "epoch": 200} {"train_loss": -7.535073280334473, "global_step": 33652, "epoch": 200} {"train_loss": -7.595098495483398, "global_step": 33653, "epoch": 200} {"train_loss": -7.508944511413574, "global_step": 33654, "epoch": 200} {"train_loss": -7.594215393066406, "global_step": 33655, "epoch": 200} {"train_loss": -7.543521404266357, "global_step": 33656, "epoch": 200} {"train_loss": -7.732600212097168, "global_step": 33657, "epoch": 200} {"train_loss": -7.530186176300049, "global_step": 33658, "epoch": 200} {"train_loss": -7.804379463195801, "global_step": 33659, "epoch": 200} {"train_loss": -7.291082382202148, "global_step": 33660, "epoch": 200} {"train_loss": -7.595266819000244, "global_step": 33661, "epoch": 200} {"train_loss": -7.597386360168457, "global_step": 33662, "epoch": 200} {"train_loss": -7.7967987060546875, "global_step": 33663, "epoch": 200} {"train_loss": -7.640822410583496, "global_step": 33664, "epoch": 200} {"train_loss": -7.618879795074463, "global_step": 33665, "epoch": 200} {"train_loss": -7.52176570892334, "global_step": 33666, "epoch": 200} {"train_loss": -7.706105709075928, "global_step": 33667, "epoch": 200} {"train_loss": -7.687835693359375, "global_step": 33668, "epoch": 200} {"train_loss": -7.607606887817383, "global_step": 33669, "epoch": 200} {"train_loss": -7.593971252441406, "global_step": 33670, "epoch": 200} {"train_loss": -7.717558860778809, "global_step": 33671, "epoch": 200} {"train_loss": -7.739938735961914, "global_step": 33672, "epoch": 200} {"train_loss": -7.893526554107666, "global_step": 33673, "epoch": 200} {"train_loss": -7.690578460693359, "global_step": 33674, "epoch": 200} {"train_loss": -7.856158256530762, "global_step": 33675, "epoch": 200} {"train_loss": -7.588942527770996, "global_step": 33676, "epoch": 200} {"train_loss": -7.438110828399658, "global_step": 33677, "epoch": 200} {"train_loss": -7.712067127227783, "global_step": 33678, "epoch": 200} {"train_loss": -7.41225528717041, "global_step": 33679, "epoch": 200} {"train_loss": -7.468918800354004, "global_step": 33680, "epoch": 200} {"train_loss": -7.771450042724609, "global_step": 33681, "epoch": 200} {"train_loss": -7.855078220367432, "global_step": 33682, "epoch": 200} {"train_loss": -7.588488578796387, "global_step": 33683, "epoch": 200} {"train_loss": -7.740501880645752, "global_step": 33684, "epoch": 200} {"train_loss": -7.601490020751953, "global_step": 33685, "epoch": 200} {"train_loss": -7.935067176818848, "global_step": 33686, "epoch": 200} {"train_loss": -7.686024188995361, "global_step": 33687, "epoch": 200} {"train_loss": -7.70206356048584, "global_step": 33688, "epoch": 200} {"train_loss": -7.621630668640137, "global_step": 33689, "epoch": 200} {"train_loss": -7.5660529136657715, "global_step": 33690, "epoch": 200} {"train_loss": -7.486944198608398, "global_step": 33691, "epoch": 200} {"train_loss": -7.791149139404297, "global_step": 33692, "epoch": 200} {"train_loss": -7.595628261566162, "global_step": 33693, "epoch": 200} {"train_loss": -7.776167392730713, "global_step": 33694, "epoch": 200} {"train_loss": -7.925049781799316, "global_step": 33695, "epoch": 200} {"train_loss": -7.624134063720703, "global_step": 33696, "epoch": 200} {"train_loss": -7.7118024826049805, "global_step": 33697, "epoch": 200} {"train_loss": -7.602452754974365, "global_step": 33698, "epoch": 200} {"train_loss": -7.708486557006836, "global_step": 33699, "epoch": 200} {"train_loss": -7.55815315246582, "global_step": 33700, "epoch": 200} {"train_loss": -7.7584967613220215, "global_step": 33701, "epoch": 200} {"train_loss": -7.646902561187744, "global_step": 33702, "epoch": 200} {"train_loss": -7.6807661056518555, "global_step": 33703, "epoch": 200} {"train_loss": -7.497962951660156, "global_step": 33704, "epoch": 200} {"train_loss": -7.450484275817871, "global_step": 33705, "epoch": 200} {"train_loss": -7.476787567138672, "global_step": 33706, "epoch": 200} {"train_loss": -7.490597724914551, "global_step": 33707, "epoch": 200} {"train_loss": -7.46322774887085, "global_step": 33708, "epoch": 200} {"train_loss": -7.579483985900879, "global_step": 33709, "epoch": 200} {"train_loss": -7.628211498260498, "global_step": 33710, "epoch": 200} {"train_loss": -7.692682266235352, "global_step": 33711, "epoch": 200} {"train_loss": -7.471022129058838, "global_step": 33712, "epoch": 200} {"train_loss": -7.53447961807251, "global_step": 33713, "epoch": 200} {"train_loss": -7.5055928230285645, "global_step": 33714, "epoch": 200} {"train_loss": -7.609708786010742, "global_step": 33715, "epoch": 200} {"train_loss": -7.44661283493042, "global_step": 33716, "epoch": 200} {"train_loss": -7.530303001403809, "global_step": 33717, "epoch": 200} {"train_loss": -7.422026634216309, "global_step": 33718, "epoch": 200} {"train_loss": -7.622158050537109, "global_step": 33719, "epoch": 200} {"train_loss": -7.646703243255615, "global_step": 33720, "epoch": 200} {"train_loss": -7.75093936920166, "global_step": 33721, "epoch": 200} {"train_loss": -7.742836952209473, "global_step": 33722, "epoch": 200} {"train_loss": -7.740424156188965, "global_step": 33723, "epoch": 200} {"train_loss": -7.610309600830078, "global_step": 33724, "epoch": 200} {"train_loss": -7.716369152069092, "global_step": 33725, "epoch": 200} {"train_loss": -7.950179100036621, "global_step": 33726, "epoch": 200} {"train_loss": -7.470746994018555, "global_step": 33727, "epoch": 200} {"train_loss": -7.791282653808594, "global_step": 33728, "epoch": 200} {"train_loss": -7.531696319580078, "global_step": 33729, "epoch": 200} {"train_loss": -7.641143321990967, "global_step": 33730, "epoch": 200} {"train_loss": -7.692421913146973, "global_step": 33731, "epoch": 200} {"train_loss": -7.339123725891113, "global_step": 33732, "epoch": 200} {"train_loss": -7.288278102874756, "global_step": 33733, "epoch": 200} {"train_loss": -7.725371360778809, "global_step": 33734, "epoch": 200} {"train_loss": -7.364951133728027, "global_step": 33735, "epoch": 200} {"train_loss": -7.334766864776611, "global_step": 33736, "epoch": 200} {"train_loss": -7.316343307495117, "global_step": 33737, "epoch": 200} {"train_loss": -7.462662220001221, "global_step": 33738, "epoch": 200} {"train_loss": -7.522619247436523, "global_step": 33739, "epoch": 200} {"train_loss": -7.5236616134643555, "global_step": 33740, "epoch": 200} {"train_loss": -7.588315963745117, "global_step": 33741, "epoch": 200} {"train_loss": -7.40419864654541, "global_step": 33742, "epoch": 200} {"train_loss": -7.334317207336426, "global_step": 33743, "epoch": 200} {"train_loss": -7.1963114738464355, "global_step": 33744, "epoch": 200} {"train_loss": -7.681529998779297, "global_step": 33745, "epoch": 200} {"train_loss": -7.450411796569824, "global_step": 33746, "epoch": 200} {"train_loss": -7.610908508300781, "global_step": 33747, "epoch": 200} {"train_loss": -7.502891540527344, "global_step": 33748, "epoch": 200} {"train_loss": -7.414216995239258, "global_step": 33749, "epoch": 200} {"train_loss": -7.543416976928711, "global_step": 33750, "epoch": 200} {"train_loss": -7.636664390563965, "global_step": 33751, "epoch": 200} {"train_loss": -7.578542709350586, "global_step": 33752, "epoch": 200} {"train_loss": -7.4364776611328125, "global_step": 33753, "epoch": 200} {"train_loss": -7.396803379058838, "global_step": 33754, "epoch": 200} {"train_loss": -7.792793273925781, "global_step": 33755, "epoch": 200} {"train_loss": -7.669094085693359, "global_step": 33756, "epoch": 200} {"train_loss": -7.599818229675293, "global_step": 33757, "epoch": 200} {"train_loss": -7.5687971115112305, "global_step": 33758, "epoch": 200} {"train_loss": -7.618407249450684, "global_step": 33759, "epoch": 200} {"train_loss": -7.551513195037842, "global_step": 33760, "epoch": 200} {"train_loss": -7.5555524826049805, "global_step": 33761, "epoch": 200} {"train_loss": -7.863138198852539, "global_step": 33762, "epoch": 200} {"train_loss": -7.793916702270508, "global_step": 33763, "epoch": 200} {"train_loss": -7.840611457824707, "global_step": 33764, "epoch": 200} {"train_loss": -7.8182244300842285, "global_step": 33765, "epoch": 200} {"train_loss": -7.606999397277832, "global_step": 33766, "epoch": 200} {"train_loss": -7.61193908680053, "global_step": 33767, "epoch": 200, "train/sim_max_reward_0": 0.9873675868438904, "train/sim_max_reward_1": 0.9260117542867171, "train/sim_max_reward_2": 0.9514630487293456, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.9123705798096317, "test/sim_max_reward_4400000": 0.23028124423412982, "test/sim_max_reward_4400001": 0.9752157852634742, "test/sim_max_reward_4400002": 0.9963718676957137, "test/sim_max_reward_4400003": 0.9604883012848409, "test/sim_max_reward_4400004": 0.404075080123535, "test/sim_max_reward_4400005": 0.9915120566561901, "test/sim_max_reward_4400006": 0.3465918664641273, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 0.7133903241926283, "test/sim_max_reward_4400009": 0.4710123474740464, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 0.9522185429753444, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.9464918864227816, "test/sim_max_reward_4400014": 0.49975633845303735, "test/sim_max_reward_4400015": 0.3707687633761744, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.8909381254553502, "test/sim_max_reward_4400019": 0.17744672948481055, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 0.7084755503982102, "test/sim_max_reward_4400022": 0.9278797217283201, "test/sim_max_reward_4400023": 0.14877709299418007, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6645646088848599, "test/sim_max_reward_4400026": 0.9871654145506251, "test/sim_max_reward_4400027": 0.4936146409316106, "test/sim_max_reward_4400028": 0.7270495386550458, "test/sim_max_reward_4400029": 0.4784733706338728, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.14133278492055978, "test/sim_max_reward_4400033": 0.16434811850867614, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.37910623013117734, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.40161529809194135, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.17590247886542426, "test/sim_max_reward_4400042": 0.008170911192914649, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.9475660928571992, "test/sim_max_reward_4400045": 0.7646628139175156, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 0.9925620442409171, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.9628688282782641, "test/mean_score": 0.5966400488100126, "val_loss": 187399.828125, "train_action_mse_error": 11.756834030151367} {"train_loss": -7.850240707397461, "global_step": 33768, "epoch": 201} {"train_loss": -7.756580829620361, "global_step": 33769, "epoch": 201} {"train_loss": -7.631640911102295, "global_step": 33770, "epoch": 201} {"train_loss": -7.774369239807129, "global_step": 33771, "epoch": 201} {"train_loss": -7.958287239074707, "global_step": 33772, "epoch": 201} {"train_loss": -7.568106651306152, "global_step": 33773, "epoch": 201} {"train_loss": -7.660264015197754, "global_step": 33774, "epoch": 201} {"train_loss": -7.553447723388672, "global_step": 33775, "epoch": 201} {"train_loss": -7.8339128494262695, "global_step": 33776, "epoch": 201} {"train_loss": -7.656871795654297, "global_step": 33777, "epoch": 201} {"train_loss": -7.63074254989624, "global_step": 33778, "epoch": 201} {"train_loss": -7.446225166320801, "global_step": 33779, "epoch": 201} {"train_loss": -7.564537048339844, "global_step": 33780, "epoch": 201} {"train_loss": -7.476212978363037, "global_step": 33781, "epoch": 201} {"train_loss": -7.521409511566162, "global_step": 33782, "epoch": 201} {"train_loss": -7.46199893951416, "global_step": 33783, "epoch": 201} {"train_loss": -7.605029106140137, "global_step": 33784, "epoch": 201} {"train_loss": -7.643789291381836, "global_step": 33785, "epoch": 201} {"train_loss": -7.341177940368652, "global_step": 33786, "epoch": 201} {"train_loss": -7.701776504516602, "global_step": 33787, "epoch": 201} {"train_loss": -7.740753650665283, "global_step": 33788, "epoch": 201} {"train_loss": -7.402779579162598, "global_step": 33789, "epoch": 201} {"train_loss": -7.488960266113281, "global_step": 33790, "epoch": 201} {"train_loss": -7.412328243255615, "global_step": 33791, "epoch": 201} {"train_loss": -7.474687576293945, "global_step": 33792, "epoch": 201} {"train_loss": -7.4171905517578125, "global_step": 33793, "epoch": 201} {"train_loss": -7.3855390548706055, "global_step": 33794, "epoch": 201} {"train_loss": -7.656801223754883, "global_step": 33795, "epoch": 201} {"train_loss": -7.571106910705566, "global_step": 33796, "epoch": 201} {"train_loss": -7.262217998504639, "global_step": 33797, "epoch": 201} {"train_loss": -7.7603840827941895, "global_step": 33798, "epoch": 201} {"train_loss": -7.706040382385254, "global_step": 33799, "epoch": 201} {"train_loss": -7.553241729736328, "global_step": 33800, "epoch": 201} {"train_loss": -7.762953758239746, "global_step": 33801, "epoch": 201} {"train_loss": -7.911046028137207, "global_step": 33802, "epoch": 201} {"train_loss": -7.80784273147583, "global_step": 33803, "epoch": 201} {"train_loss": -7.795021057128906, "global_step": 33804, "epoch": 201} {"train_loss": -7.653175354003906, "global_step": 33805, "epoch": 201} {"train_loss": -7.770424842834473, "global_step": 33806, "epoch": 201} {"train_loss": -7.728874206542969, "global_step": 33807, "epoch": 201} {"train_loss": -7.799962043762207, "global_step": 33808, "epoch": 201} {"train_loss": -7.645764350891113, "global_step": 33809, "epoch": 201} {"train_loss": -7.892678737640381, "global_step": 33810, "epoch": 201} {"train_loss": -7.818551540374756, "global_step": 33811, "epoch": 201} {"train_loss": -7.541805267333984, "global_step": 33812, "epoch": 201} {"train_loss": -7.622283935546875, "global_step": 33813, "epoch": 201} {"train_loss": -7.507475852966309, "global_step": 33814, "epoch": 201} {"train_loss": -7.508090019226074, "global_step": 33815, "epoch": 201} {"train_loss": -7.472530841827393, "global_step": 33816, "epoch": 201} {"train_loss": -7.826582908630371, "global_step": 33817, "epoch": 201} {"train_loss": -7.771478652954102, "global_step": 33818, "epoch": 201} {"train_loss": -7.585403919219971, "global_step": 33819, "epoch": 201} {"train_loss": -7.543817520141602, "global_step": 33820, "epoch": 201} {"train_loss": -7.596922874450684, "global_step": 33821, "epoch": 201} {"train_loss": -7.781867027282715, "global_step": 33822, "epoch": 201} {"train_loss": -7.536957740783691, "global_step": 33823, "epoch": 201} {"train_loss": -7.832546234130859, "global_step": 33824, "epoch": 201} {"train_loss": -7.798428058624268, "global_step": 33825, "epoch": 201} {"train_loss": -7.715148448944092, "global_step": 33826, "epoch": 201} {"train_loss": -7.825437545776367, "global_step": 33827, "epoch": 201} {"train_loss": -7.422139644622803, "global_step": 33828, "epoch": 201} {"train_loss": -7.7321014404296875, "global_step": 33829, "epoch": 201} {"train_loss": -7.458958148956299, "global_step": 33830, "epoch": 201} {"train_loss": -7.5724897384643555, "global_step": 33831, "epoch": 201} {"train_loss": -7.796262264251709, "global_step": 33832, "epoch": 201} {"train_loss": -7.551151275634766, "global_step": 33833, "epoch": 201} {"train_loss": -7.64902400970459, "global_step": 33834, "epoch": 201} {"train_loss": -7.521053791046143, "global_step": 33835, "epoch": 201} {"train_loss": -7.628575325012207, "global_step": 33836, "epoch": 201} {"train_loss": -7.457029342651367, "global_step": 33837, "epoch": 201} {"train_loss": -7.47006893157959, "global_step": 33838, "epoch": 201} {"train_loss": -7.744253158569336, "global_step": 33839, "epoch": 201} {"train_loss": -7.3011980056762695, "global_step": 33840, "epoch": 201} {"train_loss": -7.889184951782227, "global_step": 33841, "epoch": 201} {"train_loss": -7.576711177825928, "global_step": 33842, "epoch": 201} {"train_loss": -7.713558197021484, "global_step": 33843, "epoch": 201} {"train_loss": -7.419041633605957, "global_step": 33844, "epoch": 201} {"train_loss": -7.570347785949707, "global_step": 33845, "epoch": 201} {"train_loss": -7.5680084228515625, "global_step": 33846, "epoch": 201} {"train_loss": -7.449997425079346, "global_step": 33847, "epoch": 201} {"train_loss": -7.6358232498168945, "global_step": 33848, "epoch": 201} {"train_loss": -7.390159606933594, "global_step": 33849, "epoch": 201} {"train_loss": -7.844842910766602, "global_step": 33850, "epoch": 201} {"train_loss": -7.641132354736328, "global_step": 33851, "epoch": 201} {"train_loss": -7.764310836791992, "global_step": 33852, "epoch": 201} {"train_loss": -7.385818004608154, "global_step": 33853, "epoch": 201} {"train_loss": -7.633384704589844, "global_step": 33854, "epoch": 201} {"train_loss": -7.598135948181152, "global_step": 33855, "epoch": 201} {"train_loss": -7.594015121459961, "global_step": 33856, "epoch": 201} {"train_loss": -7.624693870544434, "global_step": 33857, "epoch": 201} {"train_loss": -7.604345321655273, "global_step": 33858, "epoch": 201} {"train_loss": -7.65626859664917, "global_step": 33859, "epoch": 201} {"train_loss": -7.58657169342041, "global_step": 33860, "epoch": 201} {"train_loss": -7.513991355895996, "global_step": 33861, "epoch": 201} {"train_loss": -7.35569429397583, "global_step": 33862, "epoch": 201} {"train_loss": -7.683023929595947, "global_step": 33863, "epoch": 201} {"train_loss": -7.5341033935546875, "global_step": 33864, "epoch": 201} {"train_loss": -7.390582084655762, "global_step": 33865, "epoch": 201} {"train_loss": -7.547406196594238, "global_step": 33866, "epoch": 201} {"train_loss": -7.451514720916748, "global_step": 33867, "epoch": 201} {"train_loss": -7.307879447937012, "global_step": 33868, "epoch": 201} {"train_loss": -7.464111804962158, "global_step": 33869, "epoch": 201} {"train_loss": -7.438889503479004, "global_step": 33870, "epoch": 201} {"train_loss": -7.611557960510254, "global_step": 33871, "epoch": 201} {"train_loss": -7.2493085861206055, "global_step": 33872, "epoch": 201} {"train_loss": -7.4602861404418945, "global_step": 33873, "epoch": 201} {"train_loss": -7.692971229553223, "global_step": 33874, "epoch": 201} {"train_loss": -7.481081008911133, "global_step": 33875, "epoch": 201} {"train_loss": -7.6221699714660645, "global_step": 33876, "epoch": 201} {"train_loss": -7.3609209060668945, "global_step": 33877, "epoch": 201} {"train_loss": -7.246857643127441, "global_step": 33878, "epoch": 201} {"train_loss": -7.736888885498047, "global_step": 33879, "epoch": 201} {"train_loss": -7.209868431091309, "global_step": 33880, "epoch": 201} {"train_loss": -7.7079267501831055, "global_step": 33881, "epoch": 201} {"train_loss": -7.571962356567383, "global_step": 33882, "epoch": 201} {"train_loss": -7.494927406311035, "global_step": 33883, "epoch": 201} {"train_loss": -7.747765064239502, "global_step": 33884, "epoch": 201} {"train_loss": -7.15660285949707, "global_step": 33885, "epoch": 201} {"train_loss": -7.647075653076172, "global_step": 33886, "epoch": 201} {"train_loss": -7.587521553039551, "global_step": 33887, "epoch": 201} {"train_loss": -7.420413494110107, "global_step": 33888, "epoch": 201} {"train_loss": -7.484635353088379, "global_step": 33889, "epoch": 201} {"train_loss": -7.409264087677002, "global_step": 33890, "epoch": 201} {"train_loss": -7.632861137390137, "global_step": 33891, "epoch": 201} {"train_loss": -7.52355432510376, "global_step": 33892, "epoch": 201} {"train_loss": -7.606207847595215, "global_step": 33893, "epoch": 201} {"train_loss": -7.728679180145264, "global_step": 33894, "epoch": 201} {"train_loss": -7.5839362144470215, "global_step": 33895, "epoch": 201} {"train_loss": -7.674136638641357, "global_step": 33896, "epoch": 201} {"train_loss": -7.460134506225586, "global_step": 33897, "epoch": 201} {"train_loss": -7.649388313293457, "global_step": 33898, "epoch": 201} {"train_loss": -7.4718546867370605, "global_step": 33899, "epoch": 201} {"train_loss": -7.523533821105957, "global_step": 33900, "epoch": 201} {"train_loss": -7.484198570251465, "global_step": 33901, "epoch": 201} {"train_loss": -7.619406700134277, "global_step": 33902, "epoch": 201} {"train_loss": -7.521975994110107, "global_step": 33903, "epoch": 201} {"train_loss": -7.512843132019043, "global_step": 33904, "epoch": 201} {"train_loss": -7.446206092834473, "global_step": 33905, "epoch": 201} {"train_loss": -7.475497245788574, "global_step": 33906, "epoch": 201} {"train_loss": -7.841373443603516, "global_step": 33907, "epoch": 201} {"train_loss": -7.433601379394531, "global_step": 33908, "epoch": 201} {"train_loss": -7.7146759033203125, "global_step": 33909, "epoch": 201} {"train_loss": -7.482759475708008, "global_step": 33910, "epoch": 201} {"train_loss": -7.855761528015137, "global_step": 33911, "epoch": 201} {"train_loss": -7.450193881988525, "global_step": 33912, "epoch": 201} {"train_loss": -7.615861892700195, "global_step": 33913, "epoch": 201} {"train_loss": -7.615575313568115, "global_step": 33914, "epoch": 201} {"train_loss": -7.58798360824585, "global_step": 33915, "epoch": 201} {"train_loss": -7.574709892272949, "global_step": 33916, "epoch": 201} {"train_loss": -7.401045322418213, "global_step": 33917, "epoch": 201} {"train_loss": -7.630162715911865, "global_step": 33918, "epoch": 201} {"train_loss": -7.823687553405762, "global_step": 33919, "epoch": 201} {"train_loss": -7.616432189941406, "global_step": 33920, "epoch": 201} {"train_loss": -7.687274932861328, "global_step": 33921, "epoch": 201} {"train_loss": -7.537619590759277, "global_step": 33922, "epoch": 201} {"train_loss": -7.759130477905273, "global_step": 33923, "epoch": 201} {"train_loss": -7.9142255783081055, "global_step": 33924, "epoch": 201} {"train_loss": -7.811196804046631, "global_step": 33925, "epoch": 201} {"train_loss": -7.7942657470703125, "global_step": 33926, "epoch": 201} {"train_loss": -7.674014091491699, "global_step": 33927, "epoch": 201} {"train_loss": -7.484460353851318, "global_step": 33928, "epoch": 201} {"train_loss": -7.78538703918457, "global_step": 33929, "epoch": 201} {"train_loss": -7.79144287109375, "global_step": 33930, "epoch": 201} {"train_loss": -7.974040985107422, "global_step": 33931, "epoch": 201} {"train_loss": -7.537047386169434, "global_step": 33932, "epoch": 201} {"train_loss": -7.681182861328125, "global_step": 33933, "epoch": 201} {"train_loss": -7.85888147354126, "global_step": 33934, "epoch": 201} {"train_loss": -7.602831993784223, "global_step": 33935, "epoch": 201, "val_loss": 186209.703125} {"train_loss": -7.791738510131836, "global_step": 33936, "epoch": 202} {"train_loss": -7.787853240966797, "global_step": 33937, "epoch": 202} {"train_loss": -7.7530646324157715, "global_step": 33938, "epoch": 202} {"train_loss": -7.603046894073486, "global_step": 33939, "epoch": 202} {"train_loss": -7.638148307800293, "global_step": 33940, "epoch": 202} {"train_loss": -7.796530723571777, "global_step": 33941, "epoch": 202} {"train_loss": -7.655649662017822, "global_step": 33942, "epoch": 202} {"train_loss": -7.482212543487549, "global_step": 33943, "epoch": 202} {"train_loss": -7.456056594848633, "global_step": 33944, "epoch": 202} {"train_loss": -7.591271877288818, "global_step": 33945, "epoch": 202} {"train_loss": -7.28151798248291, "global_step": 33946, "epoch": 202} {"train_loss": -7.689087867736816, "global_step": 33947, "epoch": 202} {"train_loss": -7.417758941650391, "global_step": 33948, "epoch": 202} {"train_loss": -7.77394962310791, "global_step": 33949, "epoch": 202} {"train_loss": -7.473730564117432, "global_step": 33950, "epoch": 202} {"train_loss": -7.553440570831299, "global_step": 33951, "epoch": 202} {"train_loss": -7.476864814758301, "global_step": 33952, "epoch": 202} {"train_loss": -7.397956848144531, "global_step": 33953, "epoch": 202} {"train_loss": -7.639123916625977, "global_step": 33954, "epoch": 202} {"train_loss": -7.584343910217285, "global_step": 33955, "epoch": 202} {"train_loss": -7.355747222900391, "global_step": 33956, "epoch": 202} {"train_loss": -7.512274265289307, "global_step": 33957, "epoch": 202} {"train_loss": -7.713637351989746, "global_step": 33958, "epoch": 202} {"train_loss": -7.6117353439331055, "global_step": 33959, "epoch": 202} {"train_loss": -7.324788570404053, "global_step": 33960, "epoch": 202} {"train_loss": -7.505097389221191, "global_step": 33961, "epoch": 202} {"train_loss": -7.591461181640625, "global_step": 33962, "epoch": 202} {"train_loss": -7.5499982833862305, "global_step": 33963, "epoch": 202} {"train_loss": -7.5324296951293945, "global_step": 33964, "epoch": 202} {"train_loss": -7.725069522857666, "global_step": 33965, "epoch": 202} {"train_loss": -7.653336524963379, "global_step": 33966, "epoch": 202} {"train_loss": -7.714822769165039, "global_step": 33967, "epoch": 202} {"train_loss": -7.586450576782227, "global_step": 33968, "epoch": 202} {"train_loss": -7.820005416870117, "global_step": 33969, "epoch": 202} {"train_loss": -7.840249061584473, "global_step": 33970, "epoch": 202} {"train_loss": -7.694961071014404, "global_step": 33971, "epoch": 202} {"train_loss": -7.513252258300781, "global_step": 33972, "epoch": 202} {"train_loss": -7.576891899108887, "global_step": 33973, "epoch": 202} {"train_loss": -7.46157169342041, "global_step": 33974, "epoch": 202} {"train_loss": -7.357949256896973, "global_step": 33975, "epoch": 202} {"train_loss": -7.58843469619751, "global_step": 33976, "epoch": 202} {"train_loss": -7.777774810791016, "global_step": 33977, "epoch": 202} {"train_loss": -7.519601821899414, "global_step": 33978, "epoch": 202} {"train_loss": -7.3831868171691895, "global_step": 33979, "epoch": 202} {"train_loss": -7.602790832519531, "global_step": 33980, "epoch": 202} {"train_loss": -7.626327991485596, "global_step": 33981, "epoch": 202} {"train_loss": -7.441482067108154, "global_step": 33982, "epoch": 202} {"train_loss": -7.5551958084106445, "global_step": 33983, "epoch": 202} {"train_loss": -7.858109474182129, "global_step": 33984, "epoch": 202} {"train_loss": -7.621641635894775, "global_step": 33985, "epoch": 202} {"train_loss": -7.701213836669922, "global_step": 33986, "epoch": 202} {"train_loss": -7.785635948181152, "global_step": 33987, "epoch": 202} {"train_loss": -7.596419334411621, "global_step": 33988, "epoch": 202} {"train_loss": -7.618695259094238, "global_step": 33989, "epoch": 202} {"train_loss": -7.443371772766113, "global_step": 33990, "epoch": 202} {"train_loss": -7.506293773651123, "global_step": 33991, "epoch": 202} {"train_loss": -7.443788528442383, "global_step": 33992, "epoch": 202} {"train_loss": -7.330381393432617, "global_step": 33993, "epoch": 202} {"train_loss": -7.701526165008545, "global_step": 33994, "epoch": 202} {"train_loss": -7.434242248535156, "global_step": 33995, "epoch": 202} {"train_loss": -7.651665210723877, "global_step": 33996, "epoch": 202} {"train_loss": -7.530590057373047, "global_step": 33997, "epoch": 202} {"train_loss": -7.6447343826293945, "global_step": 33998, "epoch": 202} {"train_loss": -7.515833377838135, "global_step": 33999, "epoch": 202} {"train_loss": -7.570484161376953, "global_step": 34000, "epoch": 202} {"train_loss": -7.740106582641602, "global_step": 34001, "epoch": 202} {"train_loss": -7.445585250854492, "global_step": 34002, "epoch": 202} {"train_loss": -7.504165172576904, "global_step": 34003, "epoch": 202} {"train_loss": -7.668770790100098, "global_step": 34004, "epoch": 202} {"train_loss": -7.623215198516846, "global_step": 34005, "epoch": 202} {"train_loss": -7.313321590423584, "global_step": 34006, "epoch": 202} {"train_loss": -7.588076591491699, "global_step": 34007, "epoch": 202} {"train_loss": -7.660216808319092, "global_step": 34008, "epoch": 202} {"train_loss": -7.529691219329834, "global_step": 34009, "epoch": 202} {"train_loss": -7.733636856079102, "global_step": 34010, "epoch": 202} {"train_loss": -7.719444274902344, "global_step": 34011, "epoch": 202} {"train_loss": -7.289724349975586, "global_step": 34012, "epoch": 202} {"train_loss": -7.775802135467529, "global_step": 34013, "epoch": 202} {"train_loss": -7.5196919441223145, "global_step": 34014, "epoch": 202} {"train_loss": -7.774753093719482, "global_step": 34015, "epoch": 202} {"train_loss": -7.516174793243408, "global_step": 34016, "epoch": 202} {"train_loss": -7.7560014724731445, "global_step": 34017, "epoch": 202} {"train_loss": -7.833850860595703, "global_step": 34018, "epoch": 202} {"train_loss": -7.782143592834473, "global_step": 34019, "epoch": 202} {"train_loss": -7.498756408691406, "global_step": 34020, "epoch": 202} {"train_loss": -7.383954048156738, "global_step": 34021, "epoch": 202} {"train_loss": -7.679364204406738, "global_step": 34022, "epoch": 202} {"train_loss": -7.613146781921387, "global_step": 34023, "epoch": 202} {"train_loss": -7.649470329284668, "global_step": 34024, "epoch": 202} {"train_loss": -7.7488298416137695, "global_step": 34025, "epoch": 202} {"train_loss": -7.525225639343262, "global_step": 34026, "epoch": 202} {"train_loss": -7.5224103927612305, "global_step": 34027, "epoch": 202} {"train_loss": -7.447307109832764, "global_step": 34028, "epoch": 202} {"train_loss": -7.415502548217773, "global_step": 34029, "epoch": 202} {"train_loss": -7.551936149597168, "global_step": 34030, "epoch": 202} {"train_loss": -7.480057716369629, "global_step": 34031, "epoch": 202} {"train_loss": -7.519099235534668, "global_step": 34032, "epoch": 202} {"train_loss": -7.631765842437744, "global_step": 34033, "epoch": 202} {"train_loss": -7.654248237609863, "global_step": 34034, "epoch": 202} {"train_loss": -7.6430158615112305, "global_step": 34035, "epoch": 202} {"train_loss": -7.679352283477783, "global_step": 34036, "epoch": 202} {"train_loss": -7.639774322509766, "global_step": 34037, "epoch": 202} {"train_loss": -7.520856857299805, "global_step": 34038, "epoch": 202} {"train_loss": -7.596203327178955, "global_step": 34039, "epoch": 202} {"train_loss": -7.533505439758301, "global_step": 34040, "epoch": 202} {"train_loss": -7.608841896057129, "global_step": 34041, "epoch": 202} {"train_loss": -7.543173789978027, "global_step": 34042, "epoch": 202} {"train_loss": -7.568055152893066, "global_step": 34043, "epoch": 202} {"train_loss": -7.746578693389893, "global_step": 34044, "epoch": 202} {"train_loss": -7.792719841003418, "global_step": 34045, "epoch": 202} {"train_loss": -7.659612655639648, "global_step": 34046, "epoch": 202} {"train_loss": -7.739127159118652, "global_step": 34047, "epoch": 202} {"train_loss": -7.711239814758301, "global_step": 34048, "epoch": 202} {"train_loss": -7.4830217361450195, "global_step": 34049, "epoch": 202} {"train_loss": -7.564639568328857, "global_step": 34050, "epoch": 202} {"train_loss": -7.5784783363342285, "global_step": 34051, "epoch": 202} {"train_loss": -7.7346038818359375, "global_step": 34052, "epoch": 202} {"train_loss": -7.690349578857422, "global_step": 34053, "epoch": 202} {"train_loss": -7.589240074157715, "global_step": 34054, "epoch": 202} {"train_loss": -7.591839790344238, "global_step": 34055, "epoch": 202} {"train_loss": -7.846834182739258, "global_step": 34056, "epoch": 202} {"train_loss": -7.7295684814453125, "global_step": 34057, "epoch": 202} {"train_loss": -7.686130523681641, "global_step": 34058, "epoch": 202} {"train_loss": -7.457970142364502, "global_step": 34059, "epoch": 202} {"train_loss": -7.6983842849731445, "global_step": 34060, "epoch": 202} {"train_loss": -7.792360782623291, "global_step": 34061, "epoch": 202} {"train_loss": -7.516345500946045, "global_step": 34062, "epoch": 202} {"train_loss": -7.778202056884766, "global_step": 34063, "epoch": 202} {"train_loss": -7.505236625671387, "global_step": 34064, "epoch": 202} {"train_loss": -7.539515018463135, "global_step": 34065, "epoch": 202} {"train_loss": -7.642602443695068, "global_step": 34066, "epoch": 202} {"train_loss": -7.592967987060547, "global_step": 34067, "epoch": 202} {"train_loss": -7.862600326538086, "global_step": 34068, "epoch": 202} {"train_loss": -7.709433555603027, "global_step": 34069, "epoch": 202} {"train_loss": -7.427378177642822, "global_step": 34070, "epoch": 202} {"train_loss": -7.815150737762451, "global_step": 34071, "epoch": 202} {"train_loss": -7.464607238769531, "global_step": 34072, "epoch": 202} {"train_loss": -7.720431804656982, "global_step": 34073, "epoch": 202} {"train_loss": -7.534633636474609, "global_step": 34074, "epoch": 202} {"train_loss": -7.73892879486084, "global_step": 34075, "epoch": 202} {"train_loss": -7.721735954284668, "global_step": 34076, "epoch": 202} {"train_loss": -7.647336483001709, "global_step": 34077, "epoch": 202} {"train_loss": -7.60304069519043, "global_step": 34078, "epoch": 202} {"train_loss": -7.35301399230957, "global_step": 34079, "epoch": 202} {"train_loss": -7.612693786621094, "global_step": 34080, "epoch": 202} {"train_loss": -7.648872375488281, "global_step": 34081, "epoch": 202} {"train_loss": -7.824796676635742, "global_step": 34082, "epoch": 202} {"train_loss": -7.532587051391602, "global_step": 34083, "epoch": 202} {"train_loss": -7.645176887512207, "global_step": 34084, "epoch": 202} {"train_loss": -7.7365312576293945, "global_step": 34085, "epoch": 202} {"train_loss": -7.704005241394043, "global_step": 34086, "epoch": 202} {"train_loss": -7.60408878326416, "global_step": 34087, "epoch": 202} {"train_loss": -7.671046257019043, "global_step": 34088, "epoch": 202} {"train_loss": -7.947960376739502, "global_step": 34089, "epoch": 202} {"train_loss": -7.781611442565918, "global_step": 34090, "epoch": 202} {"train_loss": -7.761205673217773, "global_step": 34091, "epoch": 202} {"train_loss": -7.852105140686035, "global_step": 34092, "epoch": 202} {"train_loss": -7.5890703201293945, "global_step": 34093, "epoch": 202} {"train_loss": -7.840672016143799, "global_step": 34094, "epoch": 202} {"train_loss": -7.749554634094238, "global_step": 34095, "epoch": 202} {"train_loss": -7.864346504211426, "global_step": 34096, "epoch": 202} {"train_loss": -7.662508010864258, "global_step": 34097, "epoch": 202} {"train_loss": -7.77817964553833, "global_step": 34098, "epoch": 202} {"train_loss": -7.7295637130737305, "global_step": 34099, "epoch": 202} {"train_loss": -7.9776835441589355, "global_step": 34100, "epoch": 202} {"train_loss": -7.904333591461182, "global_step": 34101, "epoch": 202} {"train_loss": -7.913510799407959, "global_step": 34102, "epoch": 202} {"train_loss": -7.62352914185751, "global_step": 34103, "epoch": 202, "val_loss": 188500.515625} {"train_loss": -7.8110198974609375, "global_step": 34104, "epoch": 203} {"train_loss": -7.811199188232422, "global_step": 34105, "epoch": 203} {"train_loss": -7.723242282867432, "global_step": 34106, "epoch": 203} {"train_loss": -7.811428070068359, "global_step": 34107, "epoch": 203} {"train_loss": -7.565838813781738, "global_step": 34108, "epoch": 203} {"train_loss": -7.710031509399414, "global_step": 34109, "epoch": 203} {"train_loss": -7.516537189483643, "global_step": 34110, "epoch": 203} {"train_loss": -7.481095314025879, "global_step": 34111, "epoch": 203} {"train_loss": -7.677862644195557, "global_step": 34112, "epoch": 203} {"train_loss": -7.532304763793945, "global_step": 34113, "epoch": 203} {"train_loss": -7.749573707580566, "global_step": 34114, "epoch": 203} {"train_loss": -7.5952253341674805, "global_step": 34115, "epoch": 203} {"train_loss": -7.847120761871338, "global_step": 34116, "epoch": 203} {"train_loss": -7.8346662521362305, "global_step": 34117, "epoch": 203} {"train_loss": -7.625763893127441, "global_step": 34118, "epoch": 203} {"train_loss": -7.619681358337402, "global_step": 34119, "epoch": 203} {"train_loss": -7.564144134521484, "global_step": 34120, "epoch": 203} {"train_loss": -7.533962249755859, "global_step": 34121, "epoch": 203} {"train_loss": -7.484766006469727, "global_step": 34122, "epoch": 203} {"train_loss": -7.424896240234375, "global_step": 34123, "epoch": 203} {"train_loss": -7.566247940063477, "global_step": 34124, "epoch": 203} {"train_loss": -7.607109546661377, "global_step": 34125, "epoch": 203} {"train_loss": -7.438665390014648, "global_step": 34126, "epoch": 203} {"train_loss": -7.553638935089111, "global_step": 34127, "epoch": 203} {"train_loss": -7.654088973999023, "global_step": 34128, "epoch": 203} {"train_loss": -7.703539848327637, "global_step": 34129, "epoch": 203} {"train_loss": -7.690563201904297, "global_step": 34130, "epoch": 203} {"train_loss": -7.7486467361450195, "global_step": 34131, "epoch": 203} {"train_loss": -7.713177680969238, "global_step": 34132, "epoch": 203} {"train_loss": -7.509507179260254, "global_step": 34133, "epoch": 203} {"train_loss": -7.78579568862915, "global_step": 34134, "epoch": 203} {"train_loss": -7.774848937988281, "global_step": 34135, "epoch": 203} {"train_loss": -7.7173027992248535, "global_step": 34136, "epoch": 203} {"train_loss": -7.739208221435547, "global_step": 34137, "epoch": 203} {"train_loss": -7.588467597961426, "global_step": 34138, "epoch": 203} {"train_loss": -7.96948766708374, "global_step": 34139, "epoch": 203} {"train_loss": -7.675495147705078, "global_step": 34140, "epoch": 203} {"train_loss": -7.821035385131836, "global_step": 34141, "epoch": 203} {"train_loss": -7.978523254394531, "global_step": 34142, "epoch": 203} {"train_loss": -7.540401458740234, "global_step": 34143, "epoch": 203} {"train_loss": -7.573099136352539, "global_step": 34144, "epoch": 203} {"train_loss": -7.866827487945557, "global_step": 34145, "epoch": 203} {"train_loss": -7.94996452331543, "global_step": 34146, "epoch": 203} {"train_loss": -7.671197414398193, "global_step": 34147, "epoch": 203} {"train_loss": -7.574451446533203, "global_step": 34148, "epoch": 203} {"train_loss": -7.534847736358643, "global_step": 34149, "epoch": 203} {"train_loss": -7.589689254760742, "global_step": 34150, "epoch": 203} {"train_loss": -7.653541564941406, "global_step": 34151, "epoch": 203} {"train_loss": -7.330242156982422, "global_step": 34152, "epoch": 203} {"train_loss": -7.816362380981445, "global_step": 34153, "epoch": 203} {"train_loss": -7.3634819984436035, "global_step": 34154, "epoch": 203} {"train_loss": -7.532993316650391, "global_step": 34155, "epoch": 203} {"train_loss": -7.514822959899902, "global_step": 34156, "epoch": 203} {"train_loss": -7.535180568695068, "global_step": 34157, "epoch": 203} {"train_loss": -7.400773525238037, "global_step": 34158, "epoch": 203} {"train_loss": -7.489518642425537, "global_step": 34159, "epoch": 203} {"train_loss": -7.585205078125, "global_step": 34160, "epoch": 203} {"train_loss": -7.55416202545166, "global_step": 34161, "epoch": 203} {"train_loss": -7.704005241394043, "global_step": 34162, "epoch": 203} {"train_loss": -7.632651329040527, "global_step": 34163, "epoch": 203} {"train_loss": -7.493206024169922, "global_step": 34164, "epoch": 203} {"train_loss": -7.582335472106934, "global_step": 34165, "epoch": 203} {"train_loss": -7.5987467765808105, "global_step": 34166, "epoch": 203} {"train_loss": -7.728035926818848, "global_step": 34167, "epoch": 203} {"train_loss": -7.71393346786499, "global_step": 34168, "epoch": 203} {"train_loss": -7.641908645629883, "global_step": 34169, "epoch": 203} {"train_loss": -7.876387596130371, "global_step": 34170, "epoch": 203} {"train_loss": -7.747833251953125, "global_step": 34171, "epoch": 203} {"train_loss": -7.6855010986328125, "global_step": 34172, "epoch": 203} {"train_loss": -7.773931503295898, "global_step": 34173, "epoch": 203} {"train_loss": -7.570947647094727, "global_step": 34174, "epoch": 203} {"train_loss": -7.7437005043029785, "global_step": 34175, "epoch": 203} {"train_loss": -7.790647506713867, "global_step": 34176, "epoch": 203} {"train_loss": -7.658803939819336, "global_step": 34177, "epoch": 203} {"train_loss": -7.83354377746582, "global_step": 34178, "epoch": 203} {"train_loss": -7.9464111328125, "global_step": 34179, "epoch": 203} {"train_loss": -7.604647636413574, "global_step": 34180, "epoch": 203} {"train_loss": -7.8065996170043945, "global_step": 34181, "epoch": 203} {"train_loss": -7.567239284515381, "global_step": 34182, "epoch": 203} {"train_loss": -8.02541732788086, "global_step": 34183, "epoch": 203} {"train_loss": -7.804992198944092, "global_step": 34184, "epoch": 203} {"train_loss": -7.740762710571289, "global_step": 34185, "epoch": 203} {"train_loss": -7.591156005859375, "global_step": 34186, "epoch": 203} {"train_loss": -7.532703399658203, "global_step": 34187, "epoch": 203} {"train_loss": -7.828473091125488, "global_step": 34188, "epoch": 203} {"train_loss": -7.604963302612305, "global_step": 34189, "epoch": 203} {"train_loss": -7.773807525634766, "global_step": 34190, "epoch": 203} {"train_loss": -7.503079891204834, "global_step": 34191, "epoch": 203} {"train_loss": -7.507830619812012, "global_step": 34192, "epoch": 203} {"train_loss": -7.627872467041016, "global_step": 34193, "epoch": 203} {"train_loss": -7.402135848999023, "global_step": 34194, "epoch": 203} {"train_loss": -7.619091987609863, "global_step": 34195, "epoch": 203} {"train_loss": -7.591038703918457, "global_step": 34196, "epoch": 203} {"train_loss": -7.659708023071289, "global_step": 34197, "epoch": 203} {"train_loss": -7.67938756942749, "global_step": 34198, "epoch": 203} {"train_loss": -7.460628509521484, "global_step": 34199, "epoch": 203} {"train_loss": -7.708228588104248, "global_step": 34200, "epoch": 203} {"train_loss": -7.6207427978515625, "global_step": 34201, "epoch": 203} {"train_loss": -7.670009613037109, "global_step": 34202, "epoch": 203} {"train_loss": -7.518846035003662, "global_step": 34203, "epoch": 203} {"train_loss": -7.598714351654053, "global_step": 34204, "epoch": 203} {"train_loss": -7.6265153884887695, "global_step": 34205, "epoch": 203} {"train_loss": -7.833559036254883, "global_step": 34206, "epoch": 203} {"train_loss": -7.57916784286499, "global_step": 34207, "epoch": 203} {"train_loss": -7.566174030303955, "global_step": 34208, "epoch": 203} {"train_loss": -7.511458396911621, "global_step": 34209, "epoch": 203} {"train_loss": -7.69526481628418, "global_step": 34210, "epoch": 203} {"train_loss": -7.665196418762207, "global_step": 34211, "epoch": 203} {"train_loss": -7.637325286865234, "global_step": 34212, "epoch": 203} {"train_loss": -7.393448352813721, "global_step": 34213, "epoch": 203} {"train_loss": -7.581006050109863, "global_step": 34214, "epoch": 203} {"train_loss": -7.569778919219971, "global_step": 34215, "epoch": 203} {"train_loss": -7.7201433181762695, "global_step": 34216, "epoch": 203} {"train_loss": -7.509485244750977, "global_step": 34217, "epoch": 203} {"train_loss": -7.310840129852295, "global_step": 34218, "epoch": 203} {"train_loss": -7.488059997558594, "global_step": 34219, "epoch": 203} {"train_loss": -7.379020690917969, "global_step": 34220, "epoch": 203} {"train_loss": -7.6905107498168945, "global_step": 34221, "epoch": 203} {"train_loss": -7.447258949279785, "global_step": 34222, "epoch": 203} {"train_loss": -7.42141056060791, "global_step": 34223, "epoch": 203} {"train_loss": -7.560333251953125, "global_step": 34224, "epoch": 203} {"train_loss": -7.511639595031738, "global_step": 34225, "epoch": 203} {"train_loss": -7.584771633148193, "global_step": 34226, "epoch": 203} {"train_loss": -7.617402076721191, "global_step": 34227, "epoch": 203} {"train_loss": -7.559745788574219, "global_step": 34228, "epoch": 203} {"train_loss": -7.580801010131836, "global_step": 34229, "epoch": 203} {"train_loss": -7.305640697479248, "global_step": 34230, "epoch": 203} {"train_loss": -7.339545249938965, "global_step": 34231, "epoch": 203} {"train_loss": -7.8101067543029785, "global_step": 34232, "epoch": 203} {"train_loss": -7.5484724044799805, "global_step": 34233, "epoch": 203} {"train_loss": -7.5021491050720215, "global_step": 34234, "epoch": 203} {"train_loss": -7.56351375579834, "global_step": 34235, "epoch": 203} {"train_loss": -7.760990142822266, "global_step": 34236, "epoch": 203} {"train_loss": -7.524805068969727, "global_step": 34237, "epoch": 203} {"train_loss": -7.643805503845215, "global_step": 34238, "epoch": 203} {"train_loss": -7.649314880371094, "global_step": 34239, "epoch": 203} {"train_loss": -7.67349100112915, "global_step": 34240, "epoch": 203} {"train_loss": -7.463925361633301, "global_step": 34241, "epoch": 203} {"train_loss": -7.700543403625488, "global_step": 34242, "epoch": 203} {"train_loss": -7.899611949920654, "global_step": 34243, "epoch": 203} {"train_loss": -7.755890846252441, "global_step": 34244, "epoch": 203} {"train_loss": -7.840886116027832, "global_step": 34245, "epoch": 203} {"train_loss": -7.8482770919799805, "global_step": 34246, "epoch": 203} {"train_loss": -7.900383472442627, "global_step": 34247, "epoch": 203} {"train_loss": -7.7304487228393555, "global_step": 34248, "epoch": 203} {"train_loss": -7.544854164123535, "global_step": 34249, "epoch": 203} {"train_loss": -7.707932472229004, "global_step": 34250, "epoch": 203} {"train_loss": -7.471010684967041, "global_step": 34251, "epoch": 203} {"train_loss": -7.530117034912109, "global_step": 34252, "epoch": 203} {"train_loss": -7.782012939453125, "global_step": 34253, "epoch": 203} {"train_loss": -7.570845127105713, "global_step": 34254, "epoch": 203} {"train_loss": -7.573912143707275, "global_step": 34255, "epoch": 203} {"train_loss": -7.651299953460693, "global_step": 34256, "epoch": 203} {"train_loss": -7.553976535797119, "global_step": 34257, "epoch": 203} {"train_loss": -7.446075439453125, "global_step": 34258, "epoch": 203} {"train_loss": -7.665214538574219, "global_step": 34259, "epoch": 203} {"train_loss": -7.698781967163086, "global_step": 34260, "epoch": 203} {"train_loss": -7.7360615730285645, "global_step": 34261, "epoch": 203} {"train_loss": -7.396592140197754, "global_step": 34262, "epoch": 203} {"train_loss": -7.8178815841674805, "global_step": 34263, "epoch": 203} {"train_loss": -7.691614151000977, "global_step": 34264, "epoch": 203} {"train_loss": -7.498228549957275, "global_step": 34265, "epoch": 203} {"train_loss": -7.547820091247559, "global_step": 34266, "epoch": 203} {"train_loss": -7.868310928344727, "global_step": 34267, "epoch": 203} {"train_loss": -8.129621505737305, "global_step": 34268, "epoch": 203} {"train_loss": -7.697815895080566, "global_step": 34269, "epoch": 203} {"train_loss": -7.5927863121032715, "global_step": 34270, "epoch": 203} {"train_loss": -7.640265368279957, "global_step": 34271, "epoch": 203, "val_loss": 187445.984375} {"train_loss": -7.758810997009277, "global_step": 34272, "epoch": 204} {"train_loss": -7.718349456787109, "global_step": 34273, "epoch": 204} {"train_loss": -7.454278469085693, "global_step": 34274, "epoch": 204} {"train_loss": -7.6514153480529785, "global_step": 34275, "epoch": 204} {"train_loss": -7.606264591217041, "global_step": 34276, "epoch": 204} {"train_loss": -7.685087203979492, "global_step": 34277, "epoch": 204} {"train_loss": -7.844604015350342, "global_step": 34278, "epoch": 204} {"train_loss": -7.676516532897949, "global_step": 34279, "epoch": 204} {"train_loss": -7.653552532196045, "global_step": 34280, "epoch": 204} {"train_loss": -7.717629432678223, "global_step": 34281, "epoch": 204} {"train_loss": -7.846118927001953, "global_step": 34282, "epoch": 204} {"train_loss": -7.814377307891846, "global_step": 34283, "epoch": 204} {"train_loss": -7.832484245300293, "global_step": 34284, "epoch": 204} {"train_loss": -7.950105667114258, "global_step": 34285, "epoch": 204} {"train_loss": -7.957145690917969, "global_step": 34286, "epoch": 204} {"train_loss": -7.716299533843994, "global_step": 34287, "epoch": 204} {"train_loss": -7.944293022155762, "global_step": 34288, "epoch": 204} {"train_loss": -7.775763511657715, "global_step": 34289, "epoch": 204} {"train_loss": -7.775548934936523, "global_step": 34290, "epoch": 204} {"train_loss": -7.907744884490967, "global_step": 34291, "epoch": 204} {"train_loss": -7.863524913787842, "global_step": 34292, "epoch": 204} {"train_loss": -7.632061004638672, "global_step": 34293, "epoch": 204} {"train_loss": -7.81648063659668, "global_step": 34294, "epoch": 204} {"train_loss": -7.995011806488037, "global_step": 34295, "epoch": 204} {"train_loss": -7.713877201080322, "global_step": 34296, "epoch": 204} {"train_loss": -7.786495685577393, "global_step": 34297, "epoch": 204} {"train_loss": -7.753200531005859, "global_step": 34298, "epoch": 204} {"train_loss": -7.892080307006836, "global_step": 34299, "epoch": 204} {"train_loss": -7.832676887512207, "global_step": 34300, "epoch": 204} {"train_loss": -7.486546993255615, "global_step": 34301, "epoch": 204} {"train_loss": -7.678082466125488, "global_step": 34302, "epoch": 204} {"train_loss": -7.641594886779785, "global_step": 34303, "epoch": 204} {"train_loss": -7.6942548751831055, "global_step": 34304, "epoch": 204} {"train_loss": -7.7830891609191895, "global_step": 34305, "epoch": 204} {"train_loss": -7.882112979888916, "global_step": 34306, "epoch": 204} {"train_loss": -7.87369441986084, "global_step": 34307, "epoch": 204} {"train_loss": -7.739200592041016, "global_step": 34308, "epoch": 204} {"train_loss": -7.6680426597595215, "global_step": 34309, "epoch": 204} {"train_loss": -7.677554607391357, "global_step": 34310, "epoch": 204} {"train_loss": -7.552171230316162, "global_step": 34311, "epoch": 204} {"train_loss": -7.793131351470947, "global_step": 34312, "epoch": 204} {"train_loss": -7.567925453186035, "global_step": 34313, "epoch": 204} {"train_loss": -7.526839256286621, "global_step": 34314, "epoch": 204} {"train_loss": -7.62031364440918, "global_step": 34315, "epoch": 204} {"train_loss": -7.59245491027832, "global_step": 34316, "epoch": 204} {"train_loss": -7.575798988342285, "global_step": 34317, "epoch": 204} {"train_loss": -7.669168472290039, "global_step": 34318, "epoch": 204} {"train_loss": -7.836491584777832, "global_step": 34319, "epoch": 204} {"train_loss": -7.623885154724121, "global_step": 34320, "epoch": 204} {"train_loss": -7.731399059295654, "global_step": 34321, "epoch": 204} {"train_loss": -7.298964500427246, "global_step": 34322, "epoch": 204} {"train_loss": -7.5527448654174805, "global_step": 34323, "epoch": 204} {"train_loss": -7.575754642486572, "global_step": 34324, "epoch": 204} {"train_loss": -7.73432731628418, "global_step": 34325, "epoch": 204} {"train_loss": -7.757868766784668, "global_step": 34326, "epoch": 204} {"train_loss": -7.645155906677246, "global_step": 34327, "epoch": 204} {"train_loss": -7.866985321044922, "global_step": 34328, "epoch": 204} {"train_loss": -7.482124328613281, "global_step": 34329, "epoch": 204} {"train_loss": -7.721290111541748, "global_step": 34330, "epoch": 204} {"train_loss": -7.940042495727539, "global_step": 34331, "epoch": 204} {"train_loss": -7.750454902648926, "global_step": 34332, "epoch": 204} {"train_loss": -7.435641288757324, "global_step": 34333, "epoch": 204} {"train_loss": -7.895014762878418, "global_step": 34334, "epoch": 204} {"train_loss": -7.7201080322265625, "global_step": 34335, "epoch": 204} {"train_loss": -7.732931137084961, "global_step": 34336, "epoch": 204} {"train_loss": -7.565178871154785, "global_step": 34337, "epoch": 204} {"train_loss": -7.805088043212891, "global_step": 34338, "epoch": 204} {"train_loss": -7.730190277099609, "global_step": 34339, "epoch": 204} {"train_loss": -7.857839584350586, "global_step": 34340, "epoch": 204} {"train_loss": -7.7365336418151855, "global_step": 34341, "epoch": 204} {"train_loss": -7.661625385284424, "global_step": 34342, "epoch": 204} {"train_loss": -7.721449851989746, "global_step": 34343, "epoch": 204} {"train_loss": -7.833911418914795, "global_step": 34344, "epoch": 204} {"train_loss": -7.972155570983887, "global_step": 34345, "epoch": 204} {"train_loss": -7.504451751708984, "global_step": 34346, "epoch": 204} {"train_loss": -7.913538455963135, "global_step": 34347, "epoch": 204} {"train_loss": -7.23004674911499, "global_step": 34348, "epoch": 204} {"train_loss": -7.592211723327637, "global_step": 34349, "epoch": 204} {"train_loss": -7.066570281982422, "global_step": 34350, "epoch": 204} {"train_loss": -7.543020248413086, "global_step": 34351, "epoch": 204} {"train_loss": -7.369915008544922, "global_step": 34352, "epoch": 204} {"train_loss": -7.715770244598389, "global_step": 34353, "epoch": 204} {"train_loss": -7.720536231994629, "global_step": 34354, "epoch": 204} {"train_loss": -7.741954326629639, "global_step": 34355, "epoch": 204} {"train_loss": -7.384940147399902, "global_step": 34356, "epoch": 204} {"train_loss": -7.695363998413086, "global_step": 34357, "epoch": 204} {"train_loss": -7.728857040405273, "global_step": 34358, "epoch": 204} {"train_loss": -7.645064830780029, "global_step": 34359, "epoch": 204} {"train_loss": -7.710178375244141, "global_step": 34360, "epoch": 204} {"train_loss": -7.541919708251953, "global_step": 34361, "epoch": 204} {"train_loss": -7.877466201782227, "global_step": 34362, "epoch": 204} {"train_loss": -7.221096038818359, "global_step": 34363, "epoch": 204} {"train_loss": -7.876208305358887, "global_step": 34364, "epoch": 204} {"train_loss": -7.51392936706543, "global_step": 34365, "epoch": 204} {"train_loss": -7.558419704437256, "global_step": 34366, "epoch": 204} {"train_loss": -7.444009780883789, "global_step": 34367, "epoch": 204} {"train_loss": -7.448728084564209, "global_step": 34368, "epoch": 204} {"train_loss": -7.42500638961792, "global_step": 34369, "epoch": 204} {"train_loss": -7.5663323402404785, "global_step": 34370, "epoch": 204} {"train_loss": -7.487215042114258, "global_step": 34371, "epoch": 204} {"train_loss": -7.599631309509277, "global_step": 34372, "epoch": 204} {"train_loss": -7.075558185577393, "global_step": 34373, "epoch": 204} {"train_loss": -7.569201946258545, "global_step": 34374, "epoch": 204} {"train_loss": -7.4355878829956055, "global_step": 34375, "epoch": 204} {"train_loss": -7.326118469238281, "global_step": 34376, "epoch": 204} {"train_loss": -7.595789909362793, "global_step": 34377, "epoch": 204} {"train_loss": -7.423780918121338, "global_step": 34378, "epoch": 204} {"train_loss": -7.838288307189941, "global_step": 34379, "epoch": 204} {"train_loss": -7.59981632232666, "global_step": 34380, "epoch": 204} {"train_loss": -7.569185256958008, "global_step": 34381, "epoch": 204} {"train_loss": -7.4565629959106445, "global_step": 34382, "epoch": 204} {"train_loss": -7.479577541351318, "global_step": 34383, "epoch": 204} {"train_loss": -7.727898597717285, "global_step": 34384, "epoch": 204} {"train_loss": -7.653892993927002, "global_step": 34385, "epoch": 204} {"train_loss": -7.7783660888671875, "global_step": 34386, "epoch": 204} {"train_loss": -7.423311710357666, "global_step": 34387, "epoch": 204} {"train_loss": -7.540816307067871, "global_step": 34388, "epoch": 204} {"train_loss": -7.510623931884766, "global_step": 34389, "epoch": 204} {"train_loss": -7.5247955322265625, "global_step": 34390, "epoch": 204} {"train_loss": -7.700020790100098, "global_step": 34391, "epoch": 204} {"train_loss": -7.154335021972656, "global_step": 34392, "epoch": 204} {"train_loss": -7.660209655761719, "global_step": 34393, "epoch": 204} {"train_loss": -7.360450744628906, "global_step": 34394, "epoch": 204} {"train_loss": -7.57802152633667, "global_step": 34395, "epoch": 204} {"train_loss": -7.65932559967041, "global_step": 34396, "epoch": 204} {"train_loss": -7.411924362182617, "global_step": 34397, "epoch": 204} {"train_loss": -7.652770042419434, "global_step": 34398, "epoch": 204} {"train_loss": -7.576602935791016, "global_step": 34399, "epoch": 204} {"train_loss": -7.88670015335083, "global_step": 34400, "epoch": 204} {"train_loss": -7.691082954406738, "global_step": 34401, "epoch": 204} {"train_loss": -7.671051979064941, "global_step": 34402, "epoch": 204} {"train_loss": -7.868193626403809, "global_step": 34403, "epoch": 204} {"train_loss": -7.531282424926758, "global_step": 34404, "epoch": 204} {"train_loss": -7.488678932189941, "global_step": 34405, "epoch": 204} {"train_loss": -7.500030517578125, "global_step": 34406, "epoch": 204} {"train_loss": -7.881319046020508, "global_step": 34407, "epoch": 204} {"train_loss": -7.713459014892578, "global_step": 34408, "epoch": 204} {"train_loss": -7.743921279907227, "global_step": 34409, "epoch": 204} {"train_loss": -7.462768077850342, "global_step": 34410, "epoch": 204} {"train_loss": -7.8183722496032715, "global_step": 34411, "epoch": 204} {"train_loss": -7.812234878540039, "global_step": 34412, "epoch": 204} {"train_loss": -7.58344841003418, "global_step": 34413, "epoch": 204} {"train_loss": -7.570080280303955, "global_step": 34414, "epoch": 204} {"train_loss": -7.732999801635742, "global_step": 34415, "epoch": 204} {"train_loss": -7.619602680206299, "global_step": 34416, "epoch": 204} {"train_loss": -7.687211990356445, "global_step": 34417, "epoch": 204} {"train_loss": -7.772636413574219, "global_step": 34418, "epoch": 204} {"train_loss": -7.553378105163574, "global_step": 34419, "epoch": 204} {"train_loss": -7.580406665802002, "global_step": 34420, "epoch": 204} {"train_loss": -7.857149124145508, "global_step": 34421, "epoch": 204} {"train_loss": -7.747018814086914, "global_step": 34422, "epoch": 204} {"train_loss": -7.859706401824951, "global_step": 34423, "epoch": 204} {"train_loss": -7.704488754272461, "global_step": 34424, "epoch": 204} {"train_loss": -7.698890209197998, "global_step": 34425, "epoch": 204} {"train_loss": -7.961150646209717, "global_step": 34426, "epoch": 204} {"train_loss": -7.861197471618652, "global_step": 34427, "epoch": 204} {"train_loss": -7.703997611999512, "global_step": 34428, "epoch": 204} {"train_loss": -7.778160095214844, "global_step": 34429, "epoch": 204} {"train_loss": -8.086308479309082, "global_step": 34430, "epoch": 204} {"train_loss": -7.915595054626465, "global_step": 34431, "epoch": 204} {"train_loss": -7.736706733703613, "global_step": 34432, "epoch": 204} {"train_loss": -7.797590255737305, "global_step": 34433, "epoch": 204} {"train_loss": -7.640996932983398, "global_step": 34434, "epoch": 204} {"train_loss": -7.460349082946777, "global_step": 34435, "epoch": 204} {"train_loss": -7.826848983764648, "global_step": 34436, "epoch": 204} {"train_loss": -7.682674407958984, "global_step": 34437, "epoch": 204} {"train_loss": -7.977535247802734, "global_step": 34438, "epoch": 204} {"train_loss": -7.669677751404898, "global_step": 34439, "epoch": 204, "val_loss": 186693.609375} {"train_loss": -7.572447776794434, "global_step": 34440, "epoch": 205} {"train_loss": -7.798405647277832, "global_step": 34441, "epoch": 205} {"train_loss": -7.656062126159668, "global_step": 34442, "epoch": 205} {"train_loss": -7.966471195220947, "global_step": 34443, "epoch": 205} {"train_loss": -7.741008758544922, "global_step": 34444, "epoch": 205} {"train_loss": -7.658364295959473, "global_step": 34445, "epoch": 205} {"train_loss": -7.2489166259765625, "global_step": 34446, "epoch": 205} {"train_loss": -7.506546497344971, "global_step": 34447, "epoch": 205} {"train_loss": -7.584660053253174, "global_step": 34448, "epoch": 205} {"train_loss": -7.459291458129883, "global_step": 34449, "epoch": 205} {"train_loss": -7.479094505310059, "global_step": 34450, "epoch": 205} {"train_loss": -7.514364242553711, "global_step": 34451, "epoch": 205} {"train_loss": -7.818851470947266, "global_step": 34452, "epoch": 205} {"train_loss": -7.547182083129883, "global_step": 34453, "epoch": 205} {"train_loss": -7.666611671447754, "global_step": 34454, "epoch": 205} {"train_loss": -7.650127410888672, "global_step": 34455, "epoch": 205} {"train_loss": -7.490991592407227, "global_step": 34456, "epoch": 205} {"train_loss": -7.763481140136719, "global_step": 34457, "epoch": 205} {"train_loss": -7.436575889587402, "global_step": 34458, "epoch": 205} {"train_loss": -7.500179290771484, "global_step": 34459, "epoch": 205} {"train_loss": -7.665114402770996, "global_step": 34460, "epoch": 205} {"train_loss": -7.631784915924072, "global_step": 34461, "epoch": 205} {"train_loss": -7.490923881530762, "global_step": 34462, "epoch": 205} {"train_loss": -7.683847904205322, "global_step": 34463, "epoch": 205} {"train_loss": -7.637977600097656, "global_step": 34464, "epoch": 205} {"train_loss": -7.671135902404785, "global_step": 34465, "epoch": 205} {"train_loss": -7.564148426055908, "global_step": 34466, "epoch": 205} {"train_loss": -7.873685836791992, "global_step": 34467, "epoch": 205} {"train_loss": -7.83395528793335, "global_step": 34468, "epoch": 205} {"train_loss": -7.607261657714844, "global_step": 34469, "epoch": 205} {"train_loss": -7.918694496154785, "global_step": 34470, "epoch": 205} {"train_loss": -7.785711288452148, "global_step": 34471, "epoch": 205} {"train_loss": -7.682844161987305, "global_step": 34472, "epoch": 205} {"train_loss": -7.748032093048096, "global_step": 34473, "epoch": 205} {"train_loss": -7.883746147155762, "global_step": 34474, "epoch": 205} {"train_loss": -7.834323406219482, "global_step": 34475, "epoch": 205} {"train_loss": -7.770698070526123, "global_step": 34476, "epoch": 205} {"train_loss": -7.436747074127197, "global_step": 34477, "epoch": 205} {"train_loss": -7.780084609985352, "global_step": 34478, "epoch": 205} {"train_loss": -7.489295482635498, "global_step": 34479, "epoch": 205} {"train_loss": -7.674779415130615, "global_step": 34480, "epoch": 205} {"train_loss": -7.640035629272461, "global_step": 34481, "epoch": 205} {"train_loss": -7.990199089050293, "global_step": 34482, "epoch": 205} {"train_loss": -7.727158069610596, "global_step": 34483, "epoch": 205} {"train_loss": -7.73935079574585, "global_step": 34484, "epoch": 205} {"train_loss": -7.736796855926514, "global_step": 34485, "epoch": 205} {"train_loss": -7.786769866943359, "global_step": 34486, "epoch": 205} {"train_loss": -7.600565433502197, "global_step": 34487, "epoch": 205} {"train_loss": -7.899250507354736, "global_step": 34488, "epoch": 205} {"train_loss": -7.7968058586120605, "global_step": 34489, "epoch": 205} {"train_loss": -7.839569091796875, "global_step": 34490, "epoch": 205} {"train_loss": -7.7091169357299805, "global_step": 34491, "epoch": 205} {"train_loss": -7.755580425262451, "global_step": 34492, "epoch": 205} {"train_loss": -7.889593124389648, "global_step": 34493, "epoch": 205} {"train_loss": -7.7166290283203125, "global_step": 34494, "epoch": 205} {"train_loss": -7.744663715362549, "global_step": 34495, "epoch": 205} {"train_loss": -7.718466758728027, "global_step": 34496, "epoch": 205} {"train_loss": -7.574418067932129, "global_step": 34497, "epoch": 205} {"train_loss": -7.476472854614258, "global_step": 34498, "epoch": 205} {"train_loss": -7.6127519607543945, "global_step": 34499, "epoch": 205} {"train_loss": -7.486104965209961, "global_step": 34500, "epoch": 205} {"train_loss": -7.679206371307373, "global_step": 34501, "epoch": 205} {"train_loss": -7.775577068328857, "global_step": 34502, "epoch": 205} {"train_loss": -7.771272659301758, "global_step": 34503, "epoch": 205} {"train_loss": -7.69080114364624, "global_step": 34504, "epoch": 205} {"train_loss": -7.379297256469727, "global_step": 34505, "epoch": 205} {"train_loss": -7.570951461791992, "global_step": 34506, "epoch": 205} {"train_loss": -7.661797523498535, "global_step": 34507, "epoch": 205} {"train_loss": -7.844424724578857, "global_step": 34508, "epoch": 205} {"train_loss": -7.865983009338379, "global_step": 34509, "epoch": 205} {"train_loss": -7.460378646850586, "global_step": 34510, "epoch": 205} {"train_loss": -7.400275707244873, "global_step": 34511, "epoch": 205} {"train_loss": -7.720044136047363, "global_step": 34512, "epoch": 205} {"train_loss": -7.40916633605957, "global_step": 34513, "epoch": 205} {"train_loss": -7.649267673492432, "global_step": 34514, "epoch": 205} {"train_loss": -7.736489295959473, "global_step": 34515, "epoch": 205} {"train_loss": -7.795869827270508, "global_step": 34516, "epoch": 205} {"train_loss": -7.663002967834473, "global_step": 34517, "epoch": 205} {"train_loss": -7.620716571807861, "global_step": 34518, "epoch": 205} {"train_loss": -7.7115020751953125, "global_step": 34519, "epoch": 205} {"train_loss": -7.408749580383301, "global_step": 34520, "epoch": 205} {"train_loss": -7.790657043457031, "global_step": 34521, "epoch": 205} {"train_loss": -7.918366432189941, "global_step": 34522, "epoch": 205} {"train_loss": -7.643258094787598, "global_step": 34523, "epoch": 205} {"train_loss": -7.624755859375, "global_step": 34524, "epoch": 205} {"train_loss": -7.766702651977539, "global_step": 34525, "epoch": 205} {"train_loss": -7.665040969848633, "global_step": 34526, "epoch": 205} {"train_loss": -7.59282112121582, "global_step": 34527, "epoch": 205} {"train_loss": -7.71194314956665, "global_step": 34528, "epoch": 205} {"train_loss": -7.9213361740112305, "global_step": 34529, "epoch": 205} {"train_loss": -7.605072021484375, "global_step": 34530, "epoch": 205} {"train_loss": -7.4115777015686035, "global_step": 34531, "epoch": 205} {"train_loss": -7.732596397399902, "global_step": 34532, "epoch": 205} {"train_loss": -7.576281547546387, "global_step": 34533, "epoch": 205} {"train_loss": -7.522465705871582, "global_step": 34534, "epoch": 205} {"train_loss": -7.6631879806518555, "global_step": 34535, "epoch": 205} {"train_loss": -7.405364036560059, "global_step": 34536, "epoch": 205} {"train_loss": -7.486815452575684, "global_step": 34537, "epoch": 205} {"train_loss": -7.404656410217285, "global_step": 34538, "epoch": 205} {"train_loss": -7.6101274490356445, "global_step": 34539, "epoch": 205} {"train_loss": -7.599490165710449, "global_step": 34540, "epoch": 205} {"train_loss": -7.247705459594727, "global_step": 34541, "epoch": 205} {"train_loss": -7.707335948944092, "global_step": 34542, "epoch": 205} {"train_loss": -7.164541244506836, "global_step": 34543, "epoch": 205} {"train_loss": -7.652626037597656, "global_step": 34544, "epoch": 205} {"train_loss": -7.536739349365234, "global_step": 34545, "epoch": 205} {"train_loss": -7.079248905181885, "global_step": 34546, "epoch": 205} {"train_loss": -7.734910011291504, "global_step": 34547, "epoch": 205} {"train_loss": -7.135920524597168, "global_step": 34548, "epoch": 205} {"train_loss": -7.364142894744873, "global_step": 34549, "epoch": 205} {"train_loss": -7.551889419555664, "global_step": 34550, "epoch": 205} {"train_loss": -7.327579021453857, "global_step": 34551, "epoch": 205} {"train_loss": -7.63651180267334, "global_step": 34552, "epoch": 205} {"train_loss": -7.406452655792236, "global_step": 34553, "epoch": 205} {"train_loss": -7.5501484870910645, "global_step": 34554, "epoch": 205} {"train_loss": -7.629812717437744, "global_step": 34555, "epoch": 205} {"train_loss": -7.631011009216309, "global_step": 34556, "epoch": 205} {"train_loss": -7.278960227966309, "global_step": 34557, "epoch": 205} {"train_loss": -7.68812370300293, "global_step": 34558, "epoch": 205} {"train_loss": -7.621601581573486, "global_step": 34559, "epoch": 205} {"train_loss": -7.630431652069092, "global_step": 34560, "epoch": 205} {"train_loss": -7.547014236450195, "global_step": 34561, "epoch": 205} {"train_loss": -7.621224403381348, "global_step": 34562, "epoch": 205} {"train_loss": -7.657968521118164, "global_step": 34563, "epoch": 205} {"train_loss": -7.689959526062012, "global_step": 34564, "epoch": 205} {"train_loss": -7.470149517059326, "global_step": 34565, "epoch": 205} {"train_loss": -7.580428123474121, "global_step": 34566, "epoch": 205} {"train_loss": -7.602251052856445, "global_step": 34567, "epoch": 205} {"train_loss": -7.892080783843994, "global_step": 34568, "epoch": 205} {"train_loss": -7.678346633911133, "global_step": 34569, "epoch": 205} {"train_loss": -7.55380392074585, "global_step": 34570, "epoch": 205} {"train_loss": -7.636603355407715, "global_step": 34571, "epoch": 205} {"train_loss": -7.5093183517456055, "global_step": 34572, "epoch": 205} {"train_loss": -7.766878128051758, "global_step": 34573, "epoch": 205} {"train_loss": -7.5544023513793945, "global_step": 34574, "epoch": 205} {"train_loss": -7.595858573913574, "global_step": 34575, "epoch": 205} {"train_loss": -7.477456569671631, "global_step": 34576, "epoch": 205} {"train_loss": -7.633140563964844, "global_step": 34577, "epoch": 205} {"train_loss": -7.52811336517334, "global_step": 34578, "epoch": 205} {"train_loss": -7.812182426452637, "global_step": 34579, "epoch": 205} {"train_loss": -7.670889854431152, "global_step": 34580, "epoch": 205} {"train_loss": -7.510123252868652, "global_step": 34581, "epoch": 205} {"train_loss": -7.466958045959473, "global_step": 34582, "epoch": 205} {"train_loss": -7.727145195007324, "global_step": 34583, "epoch": 205} {"train_loss": -7.503355979919434, "global_step": 34584, "epoch": 205} {"train_loss": -7.332314491271973, "global_step": 34585, "epoch": 205} {"train_loss": -7.8444929122924805, "global_step": 34586, "epoch": 205} {"train_loss": -7.360841751098633, "global_step": 34587, "epoch": 205} {"train_loss": -7.387937545776367, "global_step": 34588, "epoch": 205} {"train_loss": -7.450557708740234, "global_step": 34589, "epoch": 205} {"train_loss": -7.52653694152832, "global_step": 34590, "epoch": 205} {"train_loss": -7.242149829864502, "global_step": 34591, "epoch": 205} {"train_loss": -7.686534881591797, "global_step": 34592, "epoch": 205} {"train_loss": -7.6207475662231445, "global_step": 34593, "epoch": 205} {"train_loss": -7.786103248596191, "global_step": 34594, "epoch": 205} {"train_loss": -7.550344467163086, "global_step": 34595, "epoch": 205} {"train_loss": -7.6186723709106445, "global_step": 34596, "epoch": 205} {"train_loss": -7.554055690765381, "global_step": 34597, "epoch": 205} {"train_loss": -7.5819244384765625, "global_step": 34598, "epoch": 205} {"train_loss": -7.686735153198242, "global_step": 34599, "epoch": 205} {"train_loss": -7.750739574432373, "global_step": 34600, "epoch": 205} {"train_loss": -7.77836799621582, "global_step": 34601, "epoch": 205} {"train_loss": -7.714181900024414, "global_step": 34602, "epoch": 205} {"train_loss": -7.663516044616699, "global_step": 34603, "epoch": 205} {"train_loss": -7.44322395324707, "global_step": 34604, "epoch": 205} {"train_loss": -7.631035804748535, "global_step": 34605, "epoch": 205} {"train_loss": -7.62249755859375, "global_step": 34606, "epoch": 205} {"train_loss": -7.6229227383931475, "global_step": 34607, "epoch": 205, "val_loss": 186672.734375, "train_action_mse_error": 13.187006950378418} {"train_loss": -7.655713081359863, "global_step": 34608, "epoch": 206} {"train_loss": -7.721066474914551, "global_step": 34609, "epoch": 206} {"train_loss": -7.551959037780762, "global_step": 34610, "epoch": 206} {"train_loss": -7.822825908660889, "global_step": 34611, "epoch": 206} {"train_loss": -7.52985954284668, "global_step": 34612, "epoch": 206} {"train_loss": -7.858754634857178, "global_step": 34613, "epoch": 206} {"train_loss": -7.595136642456055, "global_step": 34614, "epoch": 206} {"train_loss": -7.984437942504883, "global_step": 34615, "epoch": 206} {"train_loss": -7.692877292633057, "global_step": 34616, "epoch": 206} {"train_loss": -7.631366729736328, "global_step": 34617, "epoch": 206} {"train_loss": -7.833089828491211, "global_step": 34618, "epoch": 206} {"train_loss": -7.838346481323242, "global_step": 34619, "epoch": 206} {"train_loss": -7.584283351898193, "global_step": 34620, "epoch": 206} {"train_loss": -7.853809356689453, "global_step": 34621, "epoch": 206} {"train_loss": -7.911135196685791, "global_step": 34622, "epoch": 206} {"train_loss": -7.780953407287598, "global_step": 34623, "epoch": 206} {"train_loss": -7.8636274337768555, "global_step": 34624, "epoch": 206} {"train_loss": -7.967164993286133, "global_step": 34625, "epoch": 206} {"train_loss": -7.987069606781006, "global_step": 34626, "epoch": 206} {"train_loss": -7.750583648681641, "global_step": 34627, "epoch": 206} {"train_loss": -7.8372626304626465, "global_step": 34628, "epoch": 206} {"train_loss": -8.066452980041504, "global_step": 34629, "epoch": 206} {"train_loss": -7.86602258682251, "global_step": 34630, "epoch": 206} {"train_loss": -7.883550643920898, "global_step": 34631, "epoch": 206} {"train_loss": -7.869905471801758, "global_step": 34632, "epoch": 206} {"train_loss": -7.954591751098633, "global_step": 34633, "epoch": 206} {"train_loss": -7.862689018249512, "global_step": 34634, "epoch": 206} {"train_loss": -7.856753349304199, "global_step": 34635, "epoch": 206} {"train_loss": -7.7412590980529785, "global_step": 34636, "epoch": 206} {"train_loss": -7.742496013641357, "global_step": 34637, "epoch": 206} {"train_loss": -7.766456604003906, "global_step": 34638, "epoch": 206} {"train_loss": -7.755513668060303, "global_step": 34639, "epoch": 206} {"train_loss": -7.616359710693359, "global_step": 34640, "epoch": 206} {"train_loss": -7.89508056640625, "global_step": 34641, "epoch": 206} {"train_loss": -7.693325996398926, "global_step": 34642, "epoch": 206} {"train_loss": -7.711752891540527, "global_step": 34643, "epoch": 206} {"train_loss": -7.6801276206970215, "global_step": 34644, "epoch": 206} {"train_loss": -7.61344575881958, "global_step": 34645, "epoch": 206} {"train_loss": -7.7180938720703125, "global_step": 34646, "epoch": 206} {"train_loss": -7.59536075592041, "global_step": 34647, "epoch": 206} {"train_loss": -7.5524139404296875, "global_step": 34648, "epoch": 206} {"train_loss": -7.815978527069092, "global_step": 34649, "epoch": 206} {"train_loss": -7.426774024963379, "global_step": 34650, "epoch": 206} {"train_loss": -7.55225944519043, "global_step": 34651, "epoch": 206} {"train_loss": -7.5333476066589355, "global_step": 34652, "epoch": 206} {"train_loss": -7.507954120635986, "global_step": 34653, "epoch": 206} {"train_loss": -7.6736555099487305, "global_step": 34654, "epoch": 206} {"train_loss": -7.761557579040527, "global_step": 34655, "epoch": 206} {"train_loss": -7.618896007537842, "global_step": 34656, "epoch": 206} {"train_loss": -7.634252548217773, "global_step": 34657, "epoch": 206} {"train_loss": -7.728837966918945, "global_step": 34658, "epoch": 206} {"train_loss": -7.785386562347412, "global_step": 34659, "epoch": 206} {"train_loss": -7.637556076049805, "global_step": 34660, "epoch": 206} {"train_loss": -7.761915683746338, "global_step": 34661, "epoch": 206} {"train_loss": -7.565115928649902, "global_step": 34662, "epoch": 206} {"train_loss": -7.870291709899902, "global_step": 34663, "epoch": 206} {"train_loss": -7.486875534057617, "global_step": 34664, "epoch": 206} {"train_loss": -7.866294860839844, "global_step": 34665, "epoch": 206} {"train_loss": -7.609877586364746, "global_step": 34666, "epoch": 206} {"train_loss": -7.786539077758789, "global_step": 34667, "epoch": 206} {"train_loss": -7.805811882019043, "global_step": 34668, "epoch": 206} {"train_loss": -7.578835964202881, "global_step": 34669, "epoch": 206} {"train_loss": -7.673224925994873, "global_step": 34670, "epoch": 206} {"train_loss": -7.74968147277832, "global_step": 34671, "epoch": 206} {"train_loss": -7.645534992218018, "global_step": 34672, "epoch": 206} {"train_loss": -7.807844638824463, "global_step": 34673, "epoch": 206} {"train_loss": -7.450445175170898, "global_step": 34674, "epoch": 206} {"train_loss": -7.94584321975708, "global_step": 34675, "epoch": 206} {"train_loss": -7.625549793243408, "global_step": 34676, "epoch": 206} {"train_loss": -7.939616680145264, "global_step": 34677, "epoch": 206} {"train_loss": -7.79594087600708, "global_step": 34678, "epoch": 206} {"train_loss": -7.770781517028809, "global_step": 34679, "epoch": 206} {"train_loss": -7.9195451736450195, "global_step": 34680, "epoch": 206} {"train_loss": -7.986579895019531, "global_step": 34681, "epoch": 206} {"train_loss": -7.752495288848877, "global_step": 34682, "epoch": 206} {"train_loss": -7.737354278564453, "global_step": 34683, "epoch": 206} {"train_loss": -7.787084579467773, "global_step": 34684, "epoch": 206} {"train_loss": -7.616393089294434, "global_step": 34685, "epoch": 206} {"train_loss": -7.701798439025879, "global_step": 34686, "epoch": 206} {"train_loss": -7.605934143066406, "global_step": 34687, "epoch": 206} {"train_loss": -7.717710494995117, "global_step": 34688, "epoch": 206} {"train_loss": -7.708726406097412, "global_step": 34689, "epoch": 206} {"train_loss": -7.741927146911621, "global_step": 34690, "epoch": 206} {"train_loss": -7.565990447998047, "global_step": 34691, "epoch": 206} {"train_loss": -7.695120334625244, "global_step": 34692, "epoch": 206} {"train_loss": -7.7297682762146, "global_step": 34693, "epoch": 206} {"train_loss": -7.692262649536133, "global_step": 34694, "epoch": 206} {"train_loss": -8.043610572814941, "global_step": 34695, "epoch": 206} {"train_loss": -7.491809844970703, "global_step": 34696, "epoch": 206} {"train_loss": -7.758028984069824, "global_step": 34697, "epoch": 206} {"train_loss": -7.6307830810546875, "global_step": 34698, "epoch": 206} {"train_loss": -7.8016252517700195, "global_step": 34699, "epoch": 206} {"train_loss": -7.8467817306518555, "global_step": 34700, "epoch": 206} {"train_loss": -7.772967338562012, "global_step": 34701, "epoch": 206} {"train_loss": -7.533714294433594, "global_step": 34702, "epoch": 206} {"train_loss": -7.575439453125, "global_step": 34703, "epoch": 206} {"train_loss": -7.593608856201172, "global_step": 34704, "epoch": 206} {"train_loss": -7.541326522827148, "global_step": 34705, "epoch": 206} {"train_loss": -7.738276481628418, "global_step": 34706, "epoch": 206} {"train_loss": -7.86735725402832, "global_step": 34707, "epoch": 206} {"train_loss": -7.458675384521484, "global_step": 34708, "epoch": 206} {"train_loss": -7.763213157653809, "global_step": 34709, "epoch": 206} {"train_loss": -7.723670482635498, "global_step": 34710, "epoch": 206} {"train_loss": -7.786297798156738, "global_step": 34711, "epoch": 206} {"train_loss": -7.773028373718262, "global_step": 34712, "epoch": 206} {"train_loss": -7.506349563598633, "global_step": 34713, "epoch": 206} {"train_loss": -7.804821014404297, "global_step": 34714, "epoch": 206} {"train_loss": -7.529674530029297, "global_step": 34715, "epoch": 206} {"train_loss": -7.7077436447143555, "global_step": 34716, "epoch": 206} {"train_loss": -7.480245590209961, "global_step": 34717, "epoch": 206} {"train_loss": -7.845239639282227, "global_step": 34718, "epoch": 206} {"train_loss": -7.742434024810791, "global_step": 34719, "epoch": 206} {"train_loss": -7.904053211212158, "global_step": 34720, "epoch": 206} {"train_loss": -7.715213775634766, "global_step": 34721, "epoch": 206} {"train_loss": -7.583839416503906, "global_step": 34722, "epoch": 206} {"train_loss": -7.432275295257568, "global_step": 34723, "epoch": 206} {"train_loss": -7.877374172210693, "global_step": 34724, "epoch": 206} {"train_loss": -7.6906867027282715, "global_step": 34725, "epoch": 206} {"train_loss": -7.760411262512207, "global_step": 34726, "epoch": 206} {"train_loss": -7.722629070281982, "global_step": 34727, "epoch": 206} {"train_loss": -7.621278762817383, "global_step": 34728, "epoch": 206} {"train_loss": -7.568902969360352, "global_step": 34729, "epoch": 206} {"train_loss": -7.88931941986084, "global_step": 34730, "epoch": 206} {"train_loss": -7.912607192993164, "global_step": 34731, "epoch": 206} {"train_loss": -7.588813781738281, "global_step": 34732, "epoch": 206} {"train_loss": -7.716682434082031, "global_step": 34733, "epoch": 206} {"train_loss": -7.650027275085449, "global_step": 34734, "epoch": 206} {"train_loss": -7.756717681884766, "global_step": 34735, "epoch": 206} {"train_loss": -7.6176300048828125, "global_step": 34736, "epoch": 206} {"train_loss": -7.670875549316406, "global_step": 34737, "epoch": 206} {"train_loss": -7.744266033172607, "global_step": 34738, "epoch": 206} {"train_loss": -7.734977722167969, "global_step": 34739, "epoch": 206} {"train_loss": -7.629857540130615, "global_step": 34740, "epoch": 206} {"train_loss": -7.725317001342773, "global_step": 34741, "epoch": 206} {"train_loss": -7.578577995300293, "global_step": 34742, "epoch": 206} {"train_loss": -7.481897830963135, "global_step": 34743, "epoch": 206} {"train_loss": -7.568253993988037, "global_step": 34744, "epoch": 206} {"train_loss": -7.379118919372559, "global_step": 34745, "epoch": 206} {"train_loss": -7.598196506500244, "global_step": 34746, "epoch": 206} {"train_loss": -7.454166412353516, "global_step": 34747, "epoch": 206} {"train_loss": -7.554774761199951, "global_step": 34748, "epoch": 206} {"train_loss": -7.485855579376221, "global_step": 34749, "epoch": 206} {"train_loss": -7.497808456420898, "global_step": 34750, "epoch": 206} {"train_loss": -7.630940914154053, "global_step": 34751, "epoch": 206} {"train_loss": -7.2285566329956055, "global_step": 34752, "epoch": 206} {"train_loss": -7.614536285400391, "global_step": 34753, "epoch": 206} {"train_loss": -7.451233863830566, "global_step": 34754, "epoch": 206} {"train_loss": -7.710912704467773, "global_step": 34755, "epoch": 206} {"train_loss": -7.574608325958252, "global_step": 34756, "epoch": 206} {"train_loss": -7.314257621765137, "global_step": 34757, "epoch": 206} {"train_loss": -7.5860185623168945, "global_step": 34758, "epoch": 206} {"train_loss": -7.70045280456543, "global_step": 34759, "epoch": 206} {"train_loss": -7.652819633483887, "global_step": 34760, "epoch": 206} {"train_loss": -7.60295295715332, "global_step": 34761, "epoch": 206} {"train_loss": -7.654160022735596, "global_step": 34762, "epoch": 206} {"train_loss": -7.589197635650635, "global_step": 34763, "epoch": 206} {"train_loss": -7.619161605834961, "global_step": 34764, "epoch": 206} {"train_loss": -7.766180038452148, "global_step": 34765, "epoch": 206} {"train_loss": -7.802126884460449, "global_step": 34766, "epoch": 206} {"train_loss": -7.7529144287109375, "global_step": 34767, "epoch": 206} {"train_loss": -7.900744915008545, "global_step": 34768, "epoch": 206} {"train_loss": -7.785484790802002, "global_step": 34769, "epoch": 206} {"train_loss": -7.574138641357422, "global_step": 34770, "epoch": 206} {"train_loss": -7.674535274505615, "global_step": 34771, "epoch": 206} {"train_loss": -7.851335048675537, "global_step": 34772, "epoch": 206} {"train_loss": -7.801361083984375, "global_step": 34773, "epoch": 206} {"train_loss": -7.909258842468262, "global_step": 34774, "epoch": 206} {"train_loss": -7.700999515397208, "global_step": 34775, "epoch": 206, "val_loss": 185222.03125} {"train_loss": -7.716137886047363, "global_step": 34776, "epoch": 207} {"train_loss": -7.7990922927856445, "global_step": 34777, "epoch": 207} {"train_loss": -7.8310394287109375, "global_step": 34778, "epoch": 207} {"train_loss": -7.805378437042236, "global_step": 34779, "epoch": 207} {"train_loss": -7.573300361633301, "global_step": 34780, "epoch": 207} {"train_loss": -7.929750919342041, "global_step": 34781, "epoch": 207} {"train_loss": -7.946333408355713, "global_step": 34782, "epoch": 207} {"train_loss": -7.76485013961792, "global_step": 34783, "epoch": 207} {"train_loss": -7.680761337280273, "global_step": 34784, "epoch": 207} {"train_loss": -7.6936492919921875, "global_step": 34785, "epoch": 207} {"train_loss": -7.4407758712768555, "global_step": 34786, "epoch": 207} {"train_loss": -7.949312686920166, "global_step": 34787, "epoch": 207} {"train_loss": -7.5862579345703125, "global_step": 34788, "epoch": 207} {"train_loss": -7.717671871185303, "global_step": 34789, "epoch": 207} {"train_loss": -7.4598846435546875, "global_step": 34790, "epoch": 207} {"train_loss": -7.5264997482299805, "global_step": 34791, "epoch": 207} {"train_loss": -7.3662872314453125, "global_step": 34792, "epoch": 207} {"train_loss": -7.886623859405518, "global_step": 34793, "epoch": 207} {"train_loss": -7.495794296264648, "global_step": 34794, "epoch": 207} {"train_loss": -7.505559921264648, "global_step": 34795, "epoch": 207} {"train_loss": -7.459296226501465, "global_step": 34796, "epoch": 207} {"train_loss": -7.6683526039123535, "global_step": 34797, "epoch": 207} {"train_loss": -7.352328300476074, "global_step": 34798, "epoch": 207} {"train_loss": -7.2206573486328125, "global_step": 34799, "epoch": 207} {"train_loss": -7.579314231872559, "global_step": 34800, "epoch": 207} {"train_loss": -7.5470781326293945, "global_step": 34801, "epoch": 207} {"train_loss": -7.399299621582031, "global_step": 34802, "epoch": 207} {"train_loss": -7.615649223327637, "global_step": 34803, "epoch": 207} {"train_loss": -7.492649078369141, "global_step": 34804, "epoch": 207} {"train_loss": -7.753120422363281, "global_step": 34805, "epoch": 207} {"train_loss": -7.533237457275391, "global_step": 34806, "epoch": 207} {"train_loss": -7.5152740478515625, "global_step": 34807, "epoch": 207} {"train_loss": -7.518430709838867, "global_step": 34808, "epoch": 207} {"train_loss": -7.459953784942627, "global_step": 34809, "epoch": 207} {"train_loss": -7.524776458740234, "global_step": 34810, "epoch": 207} {"train_loss": -7.518011093139648, "global_step": 34811, "epoch": 207} {"train_loss": -7.450878620147705, "global_step": 34812, "epoch": 207} {"train_loss": -7.6993913650512695, "global_step": 34813, "epoch": 207} {"train_loss": -7.5012078285217285, "global_step": 34814, "epoch": 207} {"train_loss": -7.561529636383057, "global_step": 34815, "epoch": 207} {"train_loss": -7.687278747558594, "global_step": 34816, "epoch": 207} {"train_loss": -7.677103519439697, "global_step": 34817, "epoch": 207} {"train_loss": -7.719006538391113, "global_step": 34818, "epoch": 207} {"train_loss": -7.566737174987793, "global_step": 34819, "epoch": 207} {"train_loss": -7.625153064727783, "global_step": 34820, "epoch": 207} {"train_loss": -7.805130481719971, "global_step": 34821, "epoch": 207} {"train_loss": -7.751513481140137, "global_step": 34822, "epoch": 207} {"train_loss": -7.698264122009277, "global_step": 34823, "epoch": 207} {"train_loss": -7.756354331970215, "global_step": 34824, "epoch": 207} {"train_loss": -7.625392913818359, "global_step": 34825, "epoch": 207} {"train_loss": -7.731199264526367, "global_step": 34826, "epoch": 207} {"train_loss": -7.740739822387695, "global_step": 34827, "epoch": 207} {"train_loss": -7.589142322540283, "global_step": 34828, "epoch": 207} {"train_loss": -7.749351501464844, "global_step": 34829, "epoch": 207} {"train_loss": -7.596737861633301, "global_step": 34830, "epoch": 207} {"train_loss": -7.614247798919678, "global_step": 34831, "epoch": 207} {"train_loss": -7.737015724182129, "global_step": 34832, "epoch": 207} {"train_loss": -7.513517379760742, "global_step": 34833, "epoch": 207} {"train_loss": -7.534249305725098, "global_step": 34834, "epoch": 207} {"train_loss": -7.692349910736084, "global_step": 34835, "epoch": 207} {"train_loss": -7.748824596405029, "global_step": 34836, "epoch": 207} {"train_loss": -7.505038738250732, "global_step": 34837, "epoch": 207} {"train_loss": -7.803814888000488, "global_step": 34838, "epoch": 207} {"train_loss": -7.607410430908203, "global_step": 34839, "epoch": 207} {"train_loss": -7.839032173156738, "global_step": 34840, "epoch": 207} {"train_loss": -7.889540195465088, "global_step": 34841, "epoch": 207} {"train_loss": -7.743043899536133, "global_step": 34842, "epoch": 207} {"train_loss": -7.684764385223389, "global_step": 34843, "epoch": 207} {"train_loss": -7.798942565917969, "global_step": 34844, "epoch": 207} {"train_loss": -7.7938714027404785, "global_step": 34845, "epoch": 207} {"train_loss": -7.587626934051514, "global_step": 34846, "epoch": 207} {"train_loss": -7.562806606292725, "global_step": 34847, "epoch": 207} {"train_loss": -7.500067710876465, "global_step": 34848, "epoch": 207} {"train_loss": -7.639009475708008, "global_step": 34849, "epoch": 207} {"train_loss": -7.637426376342773, "global_step": 34850, "epoch": 207} {"train_loss": -7.430850982666016, "global_step": 34851, "epoch": 207} {"train_loss": -7.627311706542969, "global_step": 34852, "epoch": 207} {"train_loss": -7.248218536376953, "global_step": 34853, "epoch": 207} {"train_loss": -7.711784839630127, "global_step": 34854, "epoch": 207} {"train_loss": -7.626895904541016, "global_step": 34855, "epoch": 207} {"train_loss": -7.501221656799316, "global_step": 34856, "epoch": 207} {"train_loss": -7.477242469787598, "global_step": 34857, "epoch": 207} {"train_loss": -7.591806411743164, "global_step": 34858, "epoch": 207} {"train_loss": -7.49156379699707, "global_step": 34859, "epoch": 207} {"train_loss": -7.421008110046387, "global_step": 34860, "epoch": 207} {"train_loss": -7.6310625076293945, "global_step": 34861, "epoch": 207} {"train_loss": -7.50726318359375, "global_step": 34862, "epoch": 207} {"train_loss": -7.619655132293701, "global_step": 34863, "epoch": 207} {"train_loss": -7.458296775817871, "global_step": 34864, "epoch": 207} {"train_loss": -7.637880802154541, "global_step": 34865, "epoch": 207} {"train_loss": -7.666991710662842, "global_step": 34866, "epoch": 207} {"train_loss": -7.580157279968262, "global_step": 34867, "epoch": 207} {"train_loss": -7.768893241882324, "global_step": 34868, "epoch": 207} {"train_loss": -7.770186901092529, "global_step": 34869, "epoch": 207} {"train_loss": -7.653054237365723, "global_step": 34870, "epoch": 207} {"train_loss": -7.85003662109375, "global_step": 34871, "epoch": 207} {"train_loss": -7.6208086013793945, "global_step": 34872, "epoch": 207} {"train_loss": -7.749273777008057, "global_step": 34873, "epoch": 207} {"train_loss": -7.613004684448242, "global_step": 34874, "epoch": 207} {"train_loss": -7.925201416015625, "global_step": 34875, "epoch": 207} {"train_loss": -7.87076997756958, "global_step": 34876, "epoch": 207} {"train_loss": -7.736196994781494, "global_step": 34877, "epoch": 207} {"train_loss": -7.650723457336426, "global_step": 34878, "epoch": 207} {"train_loss": -7.784451961517334, "global_step": 34879, "epoch": 207} {"train_loss": -7.871835231781006, "global_step": 34880, "epoch": 207} {"train_loss": -7.7481794357299805, "global_step": 34881, "epoch": 207} {"train_loss": -7.785905838012695, "global_step": 34882, "epoch": 207} {"train_loss": -7.8146562576293945, "global_step": 34883, "epoch": 207} {"train_loss": -7.856306076049805, "global_step": 34884, "epoch": 207} {"train_loss": -7.789783000946045, "global_step": 34885, "epoch": 207} {"train_loss": -7.738489627838135, "global_step": 34886, "epoch": 207} {"train_loss": -7.5984930992126465, "global_step": 34887, "epoch": 207} {"train_loss": -7.912502288818359, "global_step": 34888, "epoch": 207} {"train_loss": -7.773111820220947, "global_step": 34889, "epoch": 207} {"train_loss": -7.936925411224365, "global_step": 34890, "epoch": 207} {"train_loss": -7.822117805480957, "global_step": 34891, "epoch": 207} {"train_loss": -7.922054767608643, "global_step": 34892, "epoch": 207} {"train_loss": -7.5428924560546875, "global_step": 34893, "epoch": 207} {"train_loss": -7.662285327911377, "global_step": 34894, "epoch": 207} {"train_loss": -7.645542144775391, "global_step": 34895, "epoch": 207} {"train_loss": -7.8549017906188965, "global_step": 34896, "epoch": 207} {"train_loss": -7.619992256164551, "global_step": 34897, "epoch": 207} {"train_loss": -7.766469955444336, "global_step": 34898, "epoch": 207} {"train_loss": -7.573225975036621, "global_step": 34899, "epoch": 207} {"train_loss": -7.805167198181152, "global_step": 34900, "epoch": 207} {"train_loss": -7.568599700927734, "global_step": 34901, "epoch": 207} {"train_loss": -7.755544662475586, "global_step": 34902, "epoch": 207} {"train_loss": -7.652576923370361, "global_step": 34903, "epoch": 207} {"train_loss": -7.716892242431641, "global_step": 34904, "epoch": 207} {"train_loss": -7.6051554679870605, "global_step": 34905, "epoch": 207} {"train_loss": -7.689762115478516, "global_step": 34906, "epoch": 207} {"train_loss": -7.587650775909424, "global_step": 34907, "epoch": 207} {"train_loss": -7.633011817932129, "global_step": 34908, "epoch": 207} {"train_loss": -7.70732307434082, "global_step": 34909, "epoch": 207} {"train_loss": -7.819220542907715, "global_step": 34910, "epoch": 207} {"train_loss": -7.715915679931641, "global_step": 34911, "epoch": 207} {"train_loss": -7.750452041625977, "global_step": 34912, "epoch": 207} {"train_loss": -7.830461502075195, "global_step": 34913, "epoch": 207} {"train_loss": -7.757370948791504, "global_step": 34914, "epoch": 207} {"train_loss": -7.889183044433594, "global_step": 34915, "epoch": 207} {"train_loss": -7.930131912231445, "global_step": 34916, "epoch": 207} {"train_loss": -7.844208717346191, "global_step": 34917, "epoch": 207} {"train_loss": -7.721195220947266, "global_step": 34918, "epoch": 207} {"train_loss": -7.716697692871094, "global_step": 34919, "epoch": 207} {"train_loss": -7.991125583648682, "global_step": 34920, "epoch": 207} {"train_loss": -7.874467849731445, "global_step": 34921, "epoch": 207} {"train_loss": -7.658730506896973, "global_step": 34922, "epoch": 207} {"train_loss": -8.039581298828125, "global_step": 34923, "epoch": 207} {"train_loss": -7.838019371032715, "global_step": 34924, "epoch": 207} {"train_loss": -7.940752029418945, "global_step": 34925, "epoch": 207} {"train_loss": -7.751086235046387, "global_step": 34926, "epoch": 207} {"train_loss": -7.98079776763916, "global_step": 34927, "epoch": 207} {"train_loss": -7.9786505699157715, "global_step": 34928, "epoch": 207} {"train_loss": -7.749269485473633, "global_step": 34929, "epoch": 207} {"train_loss": -7.726902961730957, "global_step": 34930, "epoch": 207} {"train_loss": -7.974509239196777, "global_step": 34931, "epoch": 207} {"train_loss": -7.436851501464844, "global_step": 34932, "epoch": 207} {"train_loss": -8.01344108581543, "global_step": 34933, "epoch": 207} {"train_loss": -7.788765907287598, "global_step": 34934, "epoch": 207} {"train_loss": -8.024833679199219, "global_step": 34935, "epoch": 207} {"train_loss": -7.685835838317871, "global_step": 34936, "epoch": 207} {"train_loss": -7.782998085021973, "global_step": 34937, "epoch": 207} {"train_loss": -7.66661262512207, "global_step": 34938, "epoch": 207} {"train_loss": -7.81411075592041, "global_step": 34939, "epoch": 207} {"train_loss": -7.778965950012207, "global_step": 34940, "epoch": 207} {"train_loss": -7.764985084533691, "global_step": 34941, "epoch": 207} {"train_loss": -7.851343154907227, "global_step": 34942, "epoch": 207} {"train_loss": -7.690493461631593, "global_step": 34943, "epoch": 207, "val_loss": 182864.0625} {"train_loss": -7.832051753997803, "global_step": 34944, "epoch": 208} {"train_loss": -7.58793830871582, "global_step": 34945, "epoch": 208} {"train_loss": -7.686781406402588, "global_step": 34946, "epoch": 208} {"train_loss": -7.669654846191406, "global_step": 34947, "epoch": 208} {"train_loss": -7.417300224304199, "global_step": 34948, "epoch": 208} {"train_loss": -7.586835861206055, "global_step": 34949, "epoch": 208} {"train_loss": -7.246532917022705, "global_step": 34950, "epoch": 208} {"train_loss": -7.863161087036133, "global_step": 34951, "epoch": 208} {"train_loss": -7.5856804847717285, "global_step": 34952, "epoch": 208} {"train_loss": -7.575010776519775, "global_step": 34953, "epoch": 208} {"train_loss": -7.559047698974609, "global_step": 34954, "epoch": 208} {"train_loss": -7.8173017501831055, "global_step": 34955, "epoch": 208} {"train_loss": -7.848486423492432, "global_step": 34956, "epoch": 208} {"train_loss": -7.473568916320801, "global_step": 34957, "epoch": 208} {"train_loss": -7.70855712890625, "global_step": 34958, "epoch": 208} {"train_loss": -7.686338901519775, "global_step": 34959, "epoch": 208} {"train_loss": -7.549516677856445, "global_step": 34960, "epoch": 208} {"train_loss": -7.720893859863281, "global_step": 34961, "epoch": 208} {"train_loss": -7.33428955078125, "global_step": 34962, "epoch": 208} {"train_loss": -7.529820442199707, "global_step": 34963, "epoch": 208} {"train_loss": -7.646476745605469, "global_step": 34964, "epoch": 208} {"train_loss": -7.664125442504883, "global_step": 34965, "epoch": 208} {"train_loss": -7.627962112426758, "global_step": 34966, "epoch": 208} {"train_loss": -7.649576187133789, "global_step": 34967, "epoch": 208} {"train_loss": -7.694818496704102, "global_step": 34968, "epoch": 208} {"train_loss": -7.606725215911865, "global_step": 34969, "epoch": 208} {"train_loss": -7.654300212860107, "global_step": 34970, "epoch": 208} {"train_loss": -7.745760917663574, "global_step": 34971, "epoch": 208} {"train_loss": -7.722715377807617, "global_step": 34972, "epoch": 208} {"train_loss": -7.698882579803467, "global_step": 34973, "epoch": 208} {"train_loss": -7.722654342651367, "global_step": 34974, "epoch": 208} {"train_loss": -7.765883445739746, "global_step": 34975, "epoch": 208} {"train_loss": -7.759038925170898, "global_step": 34976, "epoch": 208} {"train_loss": -7.798393249511719, "global_step": 34977, "epoch": 208} {"train_loss": -7.612966060638428, "global_step": 34978, "epoch": 208} {"train_loss": -7.86534309387207, "global_step": 34979, "epoch": 208} {"train_loss": -7.860249042510986, "global_step": 34980, "epoch": 208} {"train_loss": -7.842710494995117, "global_step": 34981, "epoch": 208} {"train_loss": -7.960339069366455, "global_step": 34982, "epoch": 208} {"train_loss": -7.753854751586914, "global_step": 34983, "epoch": 208} {"train_loss": -7.763821601867676, "global_step": 34984, "epoch": 208} {"train_loss": -7.568863868713379, "global_step": 34985, "epoch": 208} {"train_loss": -7.9305806159973145, "global_step": 34986, "epoch": 208} {"train_loss": -7.844351768493652, "global_step": 34987, "epoch": 208} {"train_loss": -7.933850288391113, "global_step": 34988, "epoch": 208} {"train_loss": -7.521573543548584, "global_step": 34989, "epoch": 208} {"train_loss": -7.79737663269043, "global_step": 34990, "epoch": 208} {"train_loss": -7.473150730133057, "global_step": 34991, "epoch": 208} {"train_loss": -7.978490829467773, "global_step": 34992, "epoch": 208} {"train_loss": -7.452017784118652, "global_step": 34993, "epoch": 208} {"train_loss": -7.759254455566406, "global_step": 34994, "epoch": 208} {"train_loss": -7.554403781890869, "global_step": 34995, "epoch": 208} {"train_loss": -7.656190872192383, "global_step": 34996, "epoch": 208} {"train_loss": -7.745183944702148, "global_step": 34997, "epoch": 208} {"train_loss": -7.531163215637207, "global_step": 34998, "epoch": 208} {"train_loss": -7.916123390197754, "global_step": 34999, "epoch": 208} {"train_loss": -7.679872989654541, "global_step": 35000, "epoch": 208} {"train_loss": -7.488718032836914, "global_step": 35001, "epoch": 208} {"train_loss": -7.5003485679626465, "global_step": 35002, "epoch": 208} {"train_loss": -7.835203170776367, "global_step": 35003, "epoch": 208} {"train_loss": -7.371012210845947, "global_step": 35004, "epoch": 208} {"train_loss": -7.706360816955566, "global_step": 35005, "epoch": 208} {"train_loss": -7.509257793426514, "global_step": 35006, "epoch": 208} {"train_loss": -7.602071762084961, "global_step": 35007, "epoch": 208} {"train_loss": -7.782767295837402, "global_step": 35008, "epoch": 208} {"train_loss": -7.741885185241699, "global_step": 35009, "epoch": 208} {"train_loss": -7.720486640930176, "global_step": 35010, "epoch": 208} {"train_loss": -7.504457950592041, "global_step": 35011, "epoch": 208} {"train_loss": -7.804208755493164, "global_step": 35012, "epoch": 208} {"train_loss": -7.7458086013793945, "global_step": 35013, "epoch": 208} {"train_loss": -7.74476432800293, "global_step": 35014, "epoch": 208} {"train_loss": -7.730372428894043, "global_step": 35015, "epoch": 208} {"train_loss": -7.86277437210083, "global_step": 35016, "epoch": 208} {"train_loss": -7.740438461303711, "global_step": 35017, "epoch": 208} {"train_loss": -7.8017072677612305, "global_step": 35018, "epoch": 208} {"train_loss": -7.777182579040527, "global_step": 35019, "epoch": 208} {"train_loss": -7.722560882568359, "global_step": 35020, "epoch": 208} {"train_loss": -7.6532158851623535, "global_step": 35021, "epoch": 208} {"train_loss": -7.695888042449951, "global_step": 35022, "epoch": 208} {"train_loss": -7.753192901611328, "global_step": 35023, "epoch": 208} {"train_loss": -7.6500444412231445, "global_step": 35024, "epoch": 208} {"train_loss": -7.662594795227051, "global_step": 35025, "epoch": 208} {"train_loss": -7.519648551940918, "global_step": 35026, "epoch": 208} {"train_loss": -7.73961067199707, "global_step": 35027, "epoch": 208} {"train_loss": -7.628069877624512, "global_step": 35028, "epoch": 208} {"train_loss": -7.67041015625, "global_step": 35029, "epoch": 208} {"train_loss": -7.374277591705322, "global_step": 35030, "epoch": 208} {"train_loss": -7.759658336639404, "global_step": 35031, "epoch": 208} {"train_loss": -7.409533977508545, "global_step": 35032, "epoch": 208} {"train_loss": -7.471257209777832, "global_step": 35033, "epoch": 208} {"train_loss": -7.632197856903076, "global_step": 35034, "epoch": 208} {"train_loss": -7.742325782775879, "global_step": 35035, "epoch": 208} {"train_loss": -7.356940746307373, "global_step": 35036, "epoch": 208} {"train_loss": -7.68021297454834, "global_step": 35037, "epoch": 208} {"train_loss": -7.574650287628174, "global_step": 35038, "epoch": 208} {"train_loss": -7.719099521636963, "global_step": 35039, "epoch": 208} {"train_loss": -7.737246513366699, "global_step": 35040, "epoch": 208} {"train_loss": -7.717700004577637, "global_step": 35041, "epoch": 208} {"train_loss": -7.783427715301514, "global_step": 35042, "epoch": 208} {"train_loss": -7.949934482574463, "global_step": 35043, "epoch": 208} {"train_loss": -7.710278034210205, "global_step": 35044, "epoch": 208} {"train_loss": -7.693665027618408, "global_step": 35045, "epoch": 208} {"train_loss": -7.805413722991943, "global_step": 35046, "epoch": 208} {"train_loss": -7.774291038513184, "global_step": 35047, "epoch": 208} {"train_loss": -7.7850751876831055, "global_step": 35048, "epoch": 208} {"train_loss": -7.736115455627441, "global_step": 35049, "epoch": 208} {"train_loss": -7.827541351318359, "global_step": 35050, "epoch": 208} {"train_loss": -8.056325912475586, "global_step": 35051, "epoch": 208} {"train_loss": -7.790241241455078, "global_step": 35052, "epoch": 208} {"train_loss": -8.113511085510254, "global_step": 35053, "epoch": 208} {"train_loss": -7.725165367126465, "global_step": 35054, "epoch": 208} {"train_loss": -7.667013645172119, "global_step": 35055, "epoch": 208} {"train_loss": -7.749190807342529, "global_step": 35056, "epoch": 208} {"train_loss": -7.810868263244629, "global_step": 35057, "epoch": 208} {"train_loss": -7.636472225189209, "global_step": 35058, "epoch": 208} {"train_loss": -7.809125900268555, "global_step": 35059, "epoch": 208} {"train_loss": -7.563641548156738, "global_step": 35060, "epoch": 208} {"train_loss": -7.849440097808838, "global_step": 35061, "epoch": 208} {"train_loss": -7.807502746582031, "global_step": 35062, "epoch": 208} {"train_loss": -7.90801477432251, "global_step": 35063, "epoch": 208} {"train_loss": -7.66831636428833, "global_step": 35064, "epoch": 208} {"train_loss": -7.902660846710205, "global_step": 35065, "epoch": 208} {"train_loss": -7.77446174621582, "global_step": 35066, "epoch": 208} {"train_loss": -7.722112655639648, "global_step": 35067, "epoch": 208} {"train_loss": -7.891512393951416, "global_step": 35068, "epoch": 208} {"train_loss": -7.615623950958252, "global_step": 35069, "epoch": 208} {"train_loss": -7.482680320739746, "global_step": 35070, "epoch": 208} {"train_loss": -7.106602668762207, "global_step": 35071, "epoch": 208} {"train_loss": -7.328648567199707, "global_step": 35072, "epoch": 208} {"train_loss": -7.395990371704102, "global_step": 35073, "epoch": 208} {"train_loss": -7.276520252227783, "global_step": 35074, "epoch": 208} {"train_loss": -7.43420934677124, "global_step": 35075, "epoch": 208} {"train_loss": -7.5103759765625, "global_step": 35076, "epoch": 208} {"train_loss": -7.552889823913574, "global_step": 35077, "epoch": 208} {"train_loss": -7.46452522277832, "global_step": 35078, "epoch": 208} {"train_loss": -7.615335941314697, "global_step": 35079, "epoch": 208} {"train_loss": -7.674612045288086, "global_step": 35080, "epoch": 208} {"train_loss": -7.332651615142822, "global_step": 35081, "epoch": 208} {"train_loss": -7.611556529998779, "global_step": 35082, "epoch": 208} {"train_loss": -7.686569690704346, "global_step": 35083, "epoch": 208} {"train_loss": -7.635561943054199, "global_step": 35084, "epoch": 208} {"train_loss": -7.613051414489746, "global_step": 35085, "epoch": 208} {"train_loss": -7.720390796661377, "global_step": 35086, "epoch": 208} {"train_loss": -7.438191890716553, "global_step": 35087, "epoch": 208} {"train_loss": -7.598158836364746, "global_step": 35088, "epoch": 208} {"train_loss": -7.595880031585693, "global_step": 35089, "epoch": 208} {"train_loss": -7.695352554321289, "global_step": 35090, "epoch": 208} {"train_loss": -7.751911163330078, "global_step": 35091, "epoch": 208} {"train_loss": -7.69097900390625, "global_step": 35092, "epoch": 208} {"train_loss": -7.790655136108398, "global_step": 35093, "epoch": 208} {"train_loss": -7.803197383880615, "global_step": 35094, "epoch": 208} {"train_loss": -7.961887359619141, "global_step": 35095, "epoch": 208} {"train_loss": -7.641840934753418, "global_step": 35096, "epoch": 208} {"train_loss": -7.723723411560059, "global_step": 35097, "epoch": 208} {"train_loss": -7.823799133300781, "global_step": 35098, "epoch": 208} {"train_loss": -8.0392427444458, "global_step": 35099, "epoch": 208} {"train_loss": -7.795622825622559, "global_step": 35100, "epoch": 208} {"train_loss": -7.77186393737793, "global_step": 35101, "epoch": 208} {"train_loss": -7.898301124572754, "global_step": 35102, "epoch": 208} {"train_loss": -7.941688060760498, "global_step": 35103, "epoch": 208} {"train_loss": -7.911224365234375, "global_step": 35104, "epoch": 208} {"train_loss": -7.730086326599121, "global_step": 35105, "epoch": 208} {"train_loss": -7.805962562561035, "global_step": 35106, "epoch": 208} {"train_loss": -7.866835594177246, "global_step": 35107, "epoch": 208} {"train_loss": -7.771998405456543, "global_step": 35108, "epoch": 208} {"train_loss": -7.706396102905273, "global_step": 35109, "epoch": 208} {"train_loss": -7.599728584289551, "global_step": 35110, "epoch": 208} {"train_loss": -7.686820592199053, "global_step": 35111, "epoch": 208, "val_loss": 187316.984375} {"train_loss": -7.7769060134887695, "global_step": 35112, "epoch": 209} {"train_loss": -7.798118591308594, "global_step": 35113, "epoch": 209} {"train_loss": -7.864748001098633, "global_step": 35114, "epoch": 209} {"train_loss": -7.710572242736816, "global_step": 35115, "epoch": 209} {"train_loss": -7.663510322570801, "global_step": 35116, "epoch": 209} {"train_loss": -7.747908592224121, "global_step": 35117, "epoch": 209} {"train_loss": -7.580516815185547, "global_step": 35118, "epoch": 209} {"train_loss": -7.800784111022949, "global_step": 35119, "epoch": 209} {"train_loss": -7.683181285858154, "global_step": 35120, "epoch": 209} {"train_loss": -7.5856475830078125, "global_step": 35121, "epoch": 209} {"train_loss": -7.400832653045654, "global_step": 35122, "epoch": 209} {"train_loss": -7.800177097320557, "global_step": 35123, "epoch": 209} {"train_loss": -7.616220474243164, "global_step": 35124, "epoch": 209} {"train_loss": -7.627910614013672, "global_step": 35125, "epoch": 209} {"train_loss": -7.854439735412598, "global_step": 35126, "epoch": 209} {"train_loss": -7.750624656677246, "global_step": 35127, "epoch": 209} {"train_loss": -7.6037092208862305, "global_step": 35128, "epoch": 209} {"train_loss": -7.64829158782959, "global_step": 35129, "epoch": 209} {"train_loss": -7.587152481079102, "global_step": 35130, "epoch": 209} {"train_loss": -7.836743354797363, "global_step": 35131, "epoch": 209} {"train_loss": -7.552984237670898, "global_step": 35132, "epoch": 209} {"train_loss": -7.831932067871094, "global_step": 35133, "epoch": 209} {"train_loss": -7.835348606109619, "global_step": 35134, "epoch": 209} {"train_loss": -7.781984329223633, "global_step": 35135, "epoch": 209} {"train_loss": -7.660000801086426, "global_step": 35136, "epoch": 209} {"train_loss": -7.644954681396484, "global_step": 35137, "epoch": 209} {"train_loss": -7.845346450805664, "global_step": 35138, "epoch": 209} {"train_loss": -7.426124572753906, "global_step": 35139, "epoch": 209} {"train_loss": -7.728156089782715, "global_step": 35140, "epoch": 209} {"train_loss": -7.7871856689453125, "global_step": 35141, "epoch": 209} {"train_loss": -7.728598594665527, "global_step": 35142, "epoch": 209} {"train_loss": -7.601434230804443, "global_step": 35143, "epoch": 209} {"train_loss": -7.799149513244629, "global_step": 35144, "epoch": 209} {"train_loss": -7.631761074066162, "global_step": 35145, "epoch": 209} {"train_loss": -7.62520170211792, "global_step": 35146, "epoch": 209} {"train_loss": -7.6230244636535645, "global_step": 35147, "epoch": 209} {"train_loss": -7.58848762512207, "global_step": 35148, "epoch": 209} {"train_loss": -7.818545341491699, "global_step": 35149, "epoch": 209} {"train_loss": -7.4105048179626465, "global_step": 35150, "epoch": 209} {"train_loss": -7.849648952484131, "global_step": 35151, "epoch": 209} {"train_loss": -7.877296447753906, "global_step": 35152, "epoch": 209} {"train_loss": -7.901581764221191, "global_step": 35153, "epoch": 209} {"train_loss": -7.631318092346191, "global_step": 35154, "epoch": 209} {"train_loss": -7.709155082702637, "global_step": 35155, "epoch": 209} {"train_loss": -7.782628059387207, "global_step": 35156, "epoch": 209} {"train_loss": -7.6712799072265625, "global_step": 35157, "epoch": 209} {"train_loss": -7.674281597137451, "global_step": 35158, "epoch": 209} {"train_loss": -7.538558006286621, "global_step": 35159, "epoch": 209} {"train_loss": -7.697112083435059, "global_step": 35160, "epoch": 209} {"train_loss": -7.783581256866455, "global_step": 35161, "epoch": 209} {"train_loss": -7.603847980499268, "global_step": 35162, "epoch": 209} {"train_loss": -7.783421516418457, "global_step": 35163, "epoch": 209} {"train_loss": -7.428092956542969, "global_step": 35164, "epoch": 209} {"train_loss": -7.719977378845215, "global_step": 35165, "epoch": 209} {"train_loss": -7.286694526672363, "global_step": 35166, "epoch": 209} {"train_loss": -7.79706335067749, "global_step": 35167, "epoch": 209} {"train_loss": -7.547213077545166, "global_step": 35168, "epoch": 209} {"train_loss": -7.589792251586914, "global_step": 35169, "epoch": 209} {"train_loss": -7.546177864074707, "global_step": 35170, "epoch": 209} {"train_loss": -7.9112677574157715, "global_step": 35171, "epoch": 209} {"train_loss": -7.493660926818848, "global_step": 35172, "epoch": 209} {"train_loss": -7.517317295074463, "global_step": 35173, "epoch": 209} {"train_loss": -7.458819389343262, "global_step": 35174, "epoch": 209} {"train_loss": -7.549752235412598, "global_step": 35175, "epoch": 209} {"train_loss": -7.717925548553467, "global_step": 35176, "epoch": 209} {"train_loss": -7.641165733337402, "global_step": 35177, "epoch": 209} {"train_loss": -7.894474029541016, "global_step": 35178, "epoch": 209} {"train_loss": -7.848862648010254, "global_step": 35179, "epoch": 209} {"train_loss": -7.7643723487854, "global_step": 35180, "epoch": 209} {"train_loss": -7.753025531768799, "global_step": 35181, "epoch": 209} {"train_loss": -7.615235328674316, "global_step": 35182, "epoch": 209} {"train_loss": -7.967323303222656, "global_step": 35183, "epoch": 209} {"train_loss": -7.5737457275390625, "global_step": 35184, "epoch": 209} {"train_loss": -7.668505668640137, "global_step": 35185, "epoch": 209} {"train_loss": -7.655901908874512, "global_step": 35186, "epoch": 209} {"train_loss": -7.577638626098633, "global_step": 35187, "epoch": 209} {"train_loss": -7.664230823516846, "global_step": 35188, "epoch": 209} {"train_loss": -7.610284805297852, "global_step": 35189, "epoch": 209} {"train_loss": -7.486565113067627, "global_step": 35190, "epoch": 209} {"train_loss": -7.8552398681640625, "global_step": 35191, "epoch": 209} {"train_loss": -7.5294318199157715, "global_step": 35192, "epoch": 209} {"train_loss": -7.636845588684082, "global_step": 35193, "epoch": 209} {"train_loss": -7.750941276550293, "global_step": 35194, "epoch": 209} {"train_loss": -7.620024681091309, "global_step": 35195, "epoch": 209} {"train_loss": -7.5785698890686035, "global_step": 35196, "epoch": 209} {"train_loss": -7.593568801879883, "global_step": 35197, "epoch": 209} {"train_loss": -7.466477394104004, "global_step": 35198, "epoch": 209} {"train_loss": -7.724064826965332, "global_step": 35199, "epoch": 209} {"train_loss": -7.821920871734619, "global_step": 35200, "epoch": 209} {"train_loss": -7.694698333740234, "global_step": 35201, "epoch": 209} {"train_loss": -7.595606803894043, "global_step": 35202, "epoch": 209} {"train_loss": -7.729609966278076, "global_step": 35203, "epoch": 209} {"train_loss": -7.6270952224731445, "global_step": 35204, "epoch": 209} {"train_loss": -7.911998271942139, "global_step": 35205, "epoch": 209} {"train_loss": -7.827937126159668, "global_step": 35206, "epoch": 209} {"train_loss": -7.844918251037598, "global_step": 35207, "epoch": 209} {"train_loss": -7.652985572814941, "global_step": 35208, "epoch": 209} {"train_loss": -7.675148010253906, "global_step": 35209, "epoch": 209} {"train_loss": -7.795738697052002, "global_step": 35210, "epoch": 209} {"train_loss": -7.716402530670166, "global_step": 35211, "epoch": 209} {"train_loss": -7.909263610839844, "global_step": 35212, "epoch": 209} {"train_loss": -7.7723822593688965, "global_step": 35213, "epoch": 209} {"train_loss": -7.79901123046875, "global_step": 35214, "epoch": 209} {"train_loss": -7.812802314758301, "global_step": 35215, "epoch": 209} {"train_loss": -7.768407821655273, "global_step": 35216, "epoch": 209} {"train_loss": -7.479854583740234, "global_step": 35217, "epoch": 209} {"train_loss": -7.440058708190918, "global_step": 35218, "epoch": 209} {"train_loss": -7.6863932609558105, "global_step": 35219, "epoch": 209} {"train_loss": -7.50080680847168, "global_step": 35220, "epoch": 209} {"train_loss": -7.620423316955566, "global_step": 35221, "epoch": 209} {"train_loss": -7.561959266662598, "global_step": 35222, "epoch": 209} {"train_loss": -7.559625625610352, "global_step": 35223, "epoch": 209} {"train_loss": -7.675087928771973, "global_step": 35224, "epoch": 209} {"train_loss": -7.585718154907227, "global_step": 35225, "epoch": 209} {"train_loss": -7.777107238769531, "global_step": 35226, "epoch": 209} {"train_loss": -7.889143943786621, "global_step": 35227, "epoch": 209} {"train_loss": -7.676009178161621, "global_step": 35228, "epoch": 209} {"train_loss": -7.853424072265625, "global_step": 35229, "epoch": 209} {"train_loss": -7.875053882598877, "global_step": 35230, "epoch": 209} {"train_loss": -7.609482288360596, "global_step": 35231, "epoch": 209} {"train_loss": -7.741390228271484, "global_step": 35232, "epoch": 209} {"train_loss": -7.694256782531738, "global_step": 35233, "epoch": 209} {"train_loss": -7.979152679443359, "global_step": 35234, "epoch": 209} {"train_loss": -7.820708274841309, "global_step": 35235, "epoch": 209} {"train_loss": -7.797758102416992, "global_step": 35236, "epoch": 209} {"train_loss": -7.703118801116943, "global_step": 35237, "epoch": 209} {"train_loss": -7.925930976867676, "global_step": 35238, "epoch": 209} {"train_loss": -7.74523401260376, "global_step": 35239, "epoch": 209} {"train_loss": -7.772481918334961, "global_step": 35240, "epoch": 209} {"train_loss": -7.862730026245117, "global_step": 35241, "epoch": 209} {"train_loss": -8.043872833251953, "global_step": 35242, "epoch": 209} {"train_loss": -7.748791694641113, "global_step": 35243, "epoch": 209} {"train_loss": -7.8648481369018555, "global_step": 35244, "epoch": 209} {"train_loss": -7.7801194190979, "global_step": 35245, "epoch": 209} {"train_loss": -7.830966949462891, "global_step": 35246, "epoch": 209} {"train_loss": -7.3520588874816895, "global_step": 35247, "epoch": 209} {"train_loss": -7.806696891784668, "global_step": 35248, "epoch": 209} {"train_loss": -7.829935073852539, "global_step": 35249, "epoch": 209} {"train_loss": -7.805931091308594, "global_step": 35250, "epoch": 209} {"train_loss": -7.877832412719727, "global_step": 35251, "epoch": 209} {"train_loss": -7.814009666442871, "global_step": 35252, "epoch": 209} {"train_loss": -7.698741436004639, "global_step": 35253, "epoch": 209} {"train_loss": -7.893707275390625, "global_step": 35254, "epoch": 209} {"train_loss": -7.721810817718506, "global_step": 35255, "epoch": 209} {"train_loss": -7.6502461433410645, "global_step": 35256, "epoch": 209} {"train_loss": -7.51079797744751, "global_step": 35257, "epoch": 209} {"train_loss": -7.842370986938477, "global_step": 35258, "epoch": 209} {"train_loss": -7.463705062866211, "global_step": 35259, "epoch": 209} {"train_loss": -7.563327789306641, "global_step": 35260, "epoch": 209} {"train_loss": -7.3043928146362305, "global_step": 35261, "epoch": 209} {"train_loss": -7.529462814331055, "global_step": 35262, "epoch": 209} {"train_loss": -7.538266658782959, "global_step": 35263, "epoch": 209} {"train_loss": -7.469521522521973, "global_step": 35264, "epoch": 209} {"train_loss": -7.786659240722656, "global_step": 35265, "epoch": 209} {"train_loss": -7.6453752517700195, "global_step": 35266, "epoch": 209} {"train_loss": -7.598891258239746, "global_step": 35267, "epoch": 209} {"train_loss": -7.652178764343262, "global_step": 35268, "epoch": 209} {"train_loss": -7.671267509460449, "global_step": 35269, "epoch": 209} {"train_loss": -7.773525238037109, "global_step": 35270, "epoch": 209} {"train_loss": -7.712728500366211, "global_step": 35271, "epoch": 209} {"train_loss": -7.482151985168457, "global_step": 35272, "epoch": 209} {"train_loss": -7.820062637329102, "global_step": 35273, "epoch": 209} {"train_loss": -7.8966522216796875, "global_step": 35274, "epoch": 209} {"train_loss": -7.5884881019592285, "global_step": 35275, "epoch": 209} {"train_loss": -7.587462425231934, "global_step": 35276, "epoch": 209} {"train_loss": -7.720339298248291, "global_step": 35277, "epoch": 209} {"train_loss": -7.637745380401611, "global_step": 35278, "epoch": 209} {"train_loss": -7.691387852032979, "global_step": 35279, "epoch": 209, "val_loss": 183250.1875} {"train_loss": -7.624682426452637, "global_step": 35280, "epoch": 210} {"train_loss": -7.485849380493164, "global_step": 35281, "epoch": 210} {"train_loss": -7.527182102203369, "global_step": 35282, "epoch": 210} {"train_loss": -7.648287773132324, "global_step": 35283, "epoch": 210} {"train_loss": -7.563590049743652, "global_step": 35284, "epoch": 210} {"train_loss": -7.344625473022461, "global_step": 35285, "epoch": 210} {"train_loss": -7.624856948852539, "global_step": 35286, "epoch": 210} {"train_loss": -7.602584362030029, "global_step": 35287, "epoch": 210} {"train_loss": -7.5410871505737305, "global_step": 35288, "epoch": 210} {"train_loss": -7.662665843963623, "global_step": 35289, "epoch": 210} {"train_loss": -7.470898628234863, "global_step": 35290, "epoch": 210} {"train_loss": -7.801348686218262, "global_step": 35291, "epoch": 210} {"train_loss": -7.712850570678711, "global_step": 35292, "epoch": 210} {"train_loss": -7.810110092163086, "global_step": 35293, "epoch": 210} {"train_loss": -7.4721360206604, "global_step": 35294, "epoch": 210} {"train_loss": -7.743175506591797, "global_step": 35295, "epoch": 210} {"train_loss": -7.376749515533447, "global_step": 35296, "epoch": 210} {"train_loss": -7.530759334564209, "global_step": 35297, "epoch": 210} {"train_loss": -7.826292037963867, "global_step": 35298, "epoch": 210} {"train_loss": -7.385202407836914, "global_step": 35299, "epoch": 210} {"train_loss": -7.332766532897949, "global_step": 35300, "epoch": 210} {"train_loss": -7.636014938354492, "global_step": 35301, "epoch": 210} {"train_loss": -7.2910261154174805, "global_step": 35302, "epoch": 210} {"train_loss": -7.6822075843811035, "global_step": 35303, "epoch": 210} {"train_loss": -7.209495544433594, "global_step": 35304, "epoch": 210} {"train_loss": -7.473904132843018, "global_step": 35305, "epoch": 210} {"train_loss": -7.620940208435059, "global_step": 35306, "epoch": 210} {"train_loss": -7.4285359382629395, "global_step": 35307, "epoch": 210} {"train_loss": -7.55063009262085, "global_step": 35308, "epoch": 210} {"train_loss": -7.378586292266846, "global_step": 35309, "epoch": 210} {"train_loss": -7.406436920166016, "global_step": 35310, "epoch": 210} {"train_loss": -7.595606803894043, "global_step": 35311, "epoch": 210} {"train_loss": -7.484635353088379, "global_step": 35312, "epoch": 210} {"train_loss": -7.688708782196045, "global_step": 35313, "epoch": 210} {"train_loss": -7.65926456451416, "global_step": 35314, "epoch": 210} {"train_loss": -7.581254005432129, "global_step": 35315, "epoch": 210} {"train_loss": -7.608060836791992, "global_step": 35316, "epoch": 210} {"train_loss": -7.5821380615234375, "global_step": 35317, "epoch": 210} {"train_loss": -7.70521879196167, "global_step": 35318, "epoch": 210} {"train_loss": -7.740546226501465, "global_step": 35319, "epoch": 210} {"train_loss": -7.6884355545043945, "global_step": 35320, "epoch": 210} {"train_loss": -7.870635509490967, "global_step": 35321, "epoch": 210} {"train_loss": -7.733694553375244, "global_step": 35322, "epoch": 210} {"train_loss": -7.739441394805908, "global_step": 35323, "epoch": 210} {"train_loss": -7.707406997680664, "global_step": 35324, "epoch": 210} {"train_loss": -7.726223945617676, "global_step": 35325, "epoch": 210} {"train_loss": -7.880135536193848, "global_step": 35326, "epoch": 210} {"train_loss": -7.622527122497559, "global_step": 35327, "epoch": 210} {"train_loss": -7.783334732055664, "global_step": 35328, "epoch": 210} {"train_loss": -7.907892227172852, "global_step": 35329, "epoch": 210} {"train_loss": -7.977072715759277, "global_step": 35330, "epoch": 210} {"train_loss": -7.819095611572266, "global_step": 35331, "epoch": 210} {"train_loss": -7.709983825683594, "global_step": 35332, "epoch": 210} {"train_loss": -7.767644882202148, "global_step": 35333, "epoch": 210} {"train_loss": -7.804130554199219, "global_step": 35334, "epoch": 210} {"train_loss": -7.676997661590576, "global_step": 35335, "epoch": 210} {"train_loss": -7.798154830932617, "global_step": 35336, "epoch": 210} {"train_loss": -7.750229358673096, "global_step": 35337, "epoch": 210} {"train_loss": -7.8038105964660645, "global_step": 35338, "epoch": 210} {"train_loss": -8.024847030639648, "global_step": 35339, "epoch": 210} {"train_loss": -7.863461494445801, "global_step": 35340, "epoch": 210} {"train_loss": -7.861133575439453, "global_step": 35341, "epoch": 210} {"train_loss": -7.886434078216553, "global_step": 35342, "epoch": 210} {"train_loss": -7.66565465927124, "global_step": 35343, "epoch": 210} {"train_loss": -7.578816890716553, "global_step": 35344, "epoch": 210} {"train_loss": -7.822359085083008, "global_step": 35345, "epoch": 210} {"train_loss": -7.777246475219727, "global_step": 35346, "epoch": 210} {"train_loss": -7.626313209533691, "global_step": 35347, "epoch": 210} {"train_loss": -7.912870407104492, "global_step": 35348, "epoch": 210} {"train_loss": -7.593130111694336, "global_step": 35349, "epoch": 210} {"train_loss": -7.675541877746582, "global_step": 35350, "epoch": 210} {"train_loss": -7.723773002624512, "global_step": 35351, "epoch": 210} {"train_loss": -7.55002498626709, "global_step": 35352, "epoch": 210} {"train_loss": -7.695578575134277, "global_step": 35353, "epoch": 210} {"train_loss": -7.754147529602051, "global_step": 35354, "epoch": 210} {"train_loss": -7.365780830383301, "global_step": 35355, "epoch": 210} {"train_loss": -7.610414505004883, "global_step": 35356, "epoch": 210} {"train_loss": -7.291437149047852, "global_step": 35357, "epoch": 210} {"train_loss": -7.422701835632324, "global_step": 35358, "epoch": 210} {"train_loss": -7.377810478210449, "global_step": 35359, "epoch": 210} {"train_loss": -7.4816155433654785, "global_step": 35360, "epoch": 210} {"train_loss": -7.232988357543945, "global_step": 35361, "epoch": 210} {"train_loss": -7.219453811645508, "global_step": 35362, "epoch": 210} {"train_loss": -7.331228733062744, "global_step": 35363, "epoch": 210} {"train_loss": -7.378924369812012, "global_step": 35364, "epoch": 210} {"train_loss": -7.28689432144165, "global_step": 35365, "epoch": 210} {"train_loss": -7.261151313781738, "global_step": 35366, "epoch": 210} {"train_loss": -7.379797458648682, "global_step": 35367, "epoch": 210} {"train_loss": -7.519565582275391, "global_step": 35368, "epoch": 210} {"train_loss": -7.31242036819458, "global_step": 35369, "epoch": 210} {"train_loss": -7.381320953369141, "global_step": 35370, "epoch": 210} {"train_loss": -7.6322221755981445, "global_step": 35371, "epoch": 210} {"train_loss": -7.597652435302734, "global_step": 35372, "epoch": 210} {"train_loss": -7.508108139038086, "global_step": 35373, "epoch": 210} {"train_loss": -7.675925254821777, "global_step": 35374, "epoch": 210} {"train_loss": -7.629117012023926, "global_step": 35375, "epoch": 210} {"train_loss": -7.713200569152832, "global_step": 35376, "epoch": 210} {"train_loss": -7.669787883758545, "global_step": 35377, "epoch": 210} {"train_loss": -7.722254753112793, "global_step": 35378, "epoch": 210} {"train_loss": -7.962294101715088, "global_step": 35379, "epoch": 210} {"train_loss": -7.690417289733887, "global_step": 35380, "epoch": 210} {"train_loss": -7.943783760070801, "global_step": 35381, "epoch": 210} {"train_loss": -7.660094261169434, "global_step": 35382, "epoch": 210} {"train_loss": -7.717674255371094, "global_step": 35383, "epoch": 210} {"train_loss": -7.708573341369629, "global_step": 35384, "epoch": 210} {"train_loss": -7.529604911804199, "global_step": 35385, "epoch": 210} {"train_loss": -7.828453063964844, "global_step": 35386, "epoch": 210} {"train_loss": -7.568049430847168, "global_step": 35387, "epoch": 210} {"train_loss": -7.6622724533081055, "global_step": 35388, "epoch": 210} {"train_loss": -7.650099754333496, "global_step": 35389, "epoch": 210} {"train_loss": -7.819495677947998, "global_step": 35390, "epoch": 210} {"train_loss": -7.723835468292236, "global_step": 35391, "epoch": 210} {"train_loss": -7.782637596130371, "global_step": 35392, "epoch": 210} {"train_loss": -7.922540664672852, "global_step": 35393, "epoch": 210} {"train_loss": -7.497056007385254, "global_step": 35394, "epoch": 210} {"train_loss": -7.684562683105469, "global_step": 35395, "epoch": 210} {"train_loss": -7.50982141494751, "global_step": 35396, "epoch": 210} {"train_loss": -8.027591705322266, "global_step": 35397, "epoch": 210} {"train_loss": -7.607064247131348, "global_step": 35398, "epoch": 210} {"train_loss": -7.782003402709961, "global_step": 35399, "epoch": 210} {"train_loss": -7.617215156555176, "global_step": 35400, "epoch": 210} {"train_loss": -7.684108257293701, "global_step": 35401, "epoch": 210} {"train_loss": -7.67995548248291, "global_step": 35402, "epoch": 210} {"train_loss": -7.834597587585449, "global_step": 35403, "epoch": 210} {"train_loss": -7.595653533935547, "global_step": 35404, "epoch": 210} {"train_loss": -7.8985595703125, "global_step": 35405, "epoch": 210} {"train_loss": -7.702539920806885, "global_step": 35406, "epoch": 210} {"train_loss": -7.851579666137695, "global_step": 35407, "epoch": 210} {"train_loss": -7.854071617126465, "global_step": 35408, "epoch": 210} {"train_loss": -7.772416114807129, "global_step": 35409, "epoch": 210} {"train_loss": -7.839881896972656, "global_step": 35410, "epoch": 210} {"train_loss": -7.971567153930664, "global_step": 35411, "epoch": 210} {"train_loss": -7.707711219787598, "global_step": 35412, "epoch": 210} {"train_loss": -7.673215866088867, "global_step": 35413, "epoch": 210} {"train_loss": -7.869179725646973, "global_step": 35414, "epoch": 210} {"train_loss": -7.784736633300781, "global_step": 35415, "epoch": 210} {"train_loss": -7.712124824523926, "global_step": 35416, "epoch": 210} {"train_loss": -7.781442642211914, "global_step": 35417, "epoch": 210} {"train_loss": -7.970707893371582, "global_step": 35418, "epoch": 210} {"train_loss": -7.755936622619629, "global_step": 35419, "epoch": 210} {"train_loss": -7.971016883850098, "global_step": 35420, "epoch": 210} {"train_loss": -7.938849449157715, "global_step": 35421, "epoch": 210} {"train_loss": -7.829316139221191, "global_step": 35422, "epoch": 210} {"train_loss": -7.642261505126953, "global_step": 35423, "epoch": 210} {"train_loss": -7.623889923095703, "global_step": 35424, "epoch": 210} {"train_loss": -7.817652702331543, "global_step": 35425, "epoch": 210} {"train_loss": -7.685060501098633, "global_step": 35426, "epoch": 210} {"train_loss": -7.63527774810791, "global_step": 35427, "epoch": 210} {"train_loss": -7.860337734222412, "global_step": 35428, "epoch": 210} {"train_loss": -7.705410957336426, "global_step": 35429, "epoch": 210} {"train_loss": -7.799432277679443, "global_step": 35430, "epoch": 210} {"train_loss": -7.842309951782227, "global_step": 35431, "epoch": 210} {"train_loss": -7.997204303741455, "global_step": 35432, "epoch": 210} {"train_loss": -7.638567924499512, "global_step": 35433, "epoch": 210} {"train_loss": -7.906665325164795, "global_step": 35434, "epoch": 210} {"train_loss": -7.787448883056641, "global_step": 35435, "epoch": 210} {"train_loss": -7.800990104675293, "global_step": 35436, "epoch": 210} {"train_loss": -7.722794532775879, "global_step": 35437, "epoch": 210} {"train_loss": -7.8890533447265625, "global_step": 35438, "epoch": 210} {"train_loss": -7.592050552368164, "global_step": 35439, "epoch": 210} {"train_loss": -7.790650367736816, "global_step": 35440, "epoch": 210} {"train_loss": -7.882607936859131, "global_step": 35441, "epoch": 210} {"train_loss": -7.791450023651123, "global_step": 35442, "epoch": 210} {"train_loss": -7.805567741394043, "global_step": 35443, "epoch": 210} {"train_loss": -7.994812965393066, "global_step": 35444, "epoch": 210} {"train_loss": -7.660538673400879, "global_step": 35445, "epoch": 210} {"train_loss": -7.695528507232666, "global_step": 35446, "epoch": 210} {"train_loss": -7.673113462470827, "global_step": 35447, "epoch": 210, "val_loss": 185991.5, "train_action_mse_error": 17.716062545776367} {"train_loss": -7.88804817199707, "global_step": 35448, "epoch": 211} {"train_loss": -7.593776702880859, "global_step": 35449, "epoch": 211} {"train_loss": -7.758399963378906, "global_step": 35450, "epoch": 211} {"train_loss": -7.516116142272949, "global_step": 35451, "epoch": 211} {"train_loss": -7.709284782409668, "global_step": 35452, "epoch": 211} {"train_loss": -7.494162559509277, "global_step": 35453, "epoch": 211} {"train_loss": -7.704362392425537, "global_step": 35454, "epoch": 211} {"train_loss": -7.410924911499023, "global_step": 35455, "epoch": 211} {"train_loss": -7.904540538787842, "global_step": 35456, "epoch": 211} {"train_loss": -7.431546211242676, "global_step": 35457, "epoch": 211} {"train_loss": -7.728872299194336, "global_step": 35458, "epoch": 211} {"train_loss": -7.7429609298706055, "global_step": 35459, "epoch": 211} {"train_loss": -7.162565231323242, "global_step": 35460, "epoch": 211} {"train_loss": -7.754020690917969, "global_step": 35461, "epoch": 211} {"train_loss": -7.526233673095703, "global_step": 35462, "epoch": 211} {"train_loss": -7.433258533477783, "global_step": 35463, "epoch": 211} {"train_loss": -7.597694396972656, "global_step": 35464, "epoch": 211} {"train_loss": -7.414231777191162, "global_step": 35465, "epoch": 211} {"train_loss": -7.713170051574707, "global_step": 35466, "epoch": 211} {"train_loss": -7.595363140106201, "global_step": 35467, "epoch": 211} {"train_loss": -7.542503833770752, "global_step": 35468, "epoch": 211} {"train_loss": -7.539851665496826, "global_step": 35469, "epoch": 211} {"train_loss": -7.533858776092529, "global_step": 35470, "epoch": 211} {"train_loss": -7.758672714233398, "global_step": 35471, "epoch": 211} {"train_loss": -7.377443313598633, "global_step": 35472, "epoch": 211} {"train_loss": -7.649481296539307, "global_step": 35473, "epoch": 211} {"train_loss": -7.762103080749512, "global_step": 35474, "epoch": 211} {"train_loss": -7.557600975036621, "global_step": 35475, "epoch": 211} {"train_loss": -7.8049702644348145, "global_step": 35476, "epoch": 211} {"train_loss": -7.468911170959473, "global_step": 35477, "epoch": 211} {"train_loss": -7.662351131439209, "global_step": 35478, "epoch": 211} {"train_loss": -7.4542999267578125, "global_step": 35479, "epoch": 211} {"train_loss": -7.61752986907959, "global_step": 35480, "epoch": 211} {"train_loss": -7.319027423858643, "global_step": 35481, "epoch": 211} {"train_loss": -7.530740261077881, "global_step": 35482, "epoch": 211} {"train_loss": -7.247207164764404, "global_step": 35483, "epoch": 211} {"train_loss": -7.529874324798584, "global_step": 35484, "epoch": 211} {"train_loss": -7.564048767089844, "global_step": 35485, "epoch": 211} {"train_loss": -7.535309791564941, "global_step": 35486, "epoch": 211} {"train_loss": -7.6043195724487305, "global_step": 35487, "epoch": 211} {"train_loss": -7.533940315246582, "global_step": 35488, "epoch": 211} {"train_loss": -7.629380226135254, "global_step": 35489, "epoch": 211} {"train_loss": -7.614173412322998, "global_step": 35490, "epoch": 211} {"train_loss": -7.759609699249268, "global_step": 35491, "epoch": 211} {"train_loss": -7.615194320678711, "global_step": 35492, "epoch": 211} {"train_loss": -7.638723373413086, "global_step": 35493, "epoch": 211} {"train_loss": -7.642581939697266, "global_step": 35494, "epoch": 211} {"train_loss": -7.856457710266113, "global_step": 35495, "epoch": 211} {"train_loss": -7.679883003234863, "global_step": 35496, "epoch": 211} {"train_loss": -7.599163055419922, "global_step": 35497, "epoch": 211} {"train_loss": -7.318940162658691, "global_step": 35498, "epoch": 211} {"train_loss": -7.653142929077148, "global_step": 35499, "epoch": 211} {"train_loss": -7.376657485961914, "global_step": 35500, "epoch": 211} {"train_loss": -7.518332004547119, "global_step": 35501, "epoch": 211} {"train_loss": -7.718621253967285, "global_step": 35502, "epoch": 211} {"train_loss": -7.571922779083252, "global_step": 35503, "epoch": 211} {"train_loss": -7.6244893074035645, "global_step": 35504, "epoch": 211} {"train_loss": -7.703517436981201, "global_step": 35505, "epoch": 211} {"train_loss": -7.653266429901123, "global_step": 35506, "epoch": 211} {"train_loss": -7.830264568328857, "global_step": 35507, "epoch": 211} {"train_loss": -7.932960510253906, "global_step": 35508, "epoch": 211} {"train_loss": -7.948509216308594, "global_step": 35509, "epoch": 211} {"train_loss": -7.70413875579834, "global_step": 35510, "epoch": 211} {"train_loss": -7.790015697479248, "global_step": 35511, "epoch": 211} {"train_loss": -7.906396865844727, "global_step": 35512, "epoch": 211} {"train_loss": -7.82135009765625, "global_step": 35513, "epoch": 211} {"train_loss": -7.791118144989014, "global_step": 35514, "epoch": 211} {"train_loss": -7.81859016418457, "global_step": 35515, "epoch": 211} {"train_loss": -7.626338958740234, "global_step": 35516, "epoch": 211} {"train_loss": -8.013505935668945, "global_step": 35517, "epoch": 211} {"train_loss": -7.80961275100708, "global_step": 35518, "epoch": 211} {"train_loss": -7.956664562225342, "global_step": 35519, "epoch": 211} {"train_loss": -7.96141242980957, "global_step": 35520, "epoch": 211} {"train_loss": -7.983263969421387, "global_step": 35521, "epoch": 211} {"train_loss": -7.8907060623168945, "global_step": 35522, "epoch": 211} {"train_loss": -7.616332054138184, "global_step": 35523, "epoch": 211} {"train_loss": -7.78339958190918, "global_step": 35524, "epoch": 211} {"train_loss": -7.880070686340332, "global_step": 35525, "epoch": 211} {"train_loss": -7.964655876159668, "global_step": 35526, "epoch": 211} {"train_loss": -7.950041770935059, "global_step": 35527, "epoch": 211} {"train_loss": -7.86700439453125, "global_step": 35528, "epoch": 211} {"train_loss": -7.707657337188721, "global_step": 35529, "epoch": 211} {"train_loss": -7.861977577209473, "global_step": 35530, "epoch": 211} {"train_loss": -7.626864433288574, "global_step": 35531, "epoch": 211} {"train_loss": -7.896329402923584, "global_step": 35532, "epoch": 211} {"train_loss": -7.784765243530273, "global_step": 35533, "epoch": 211} {"train_loss": -7.833209991455078, "global_step": 35534, "epoch": 211} {"train_loss": -7.706199645996094, "global_step": 35535, "epoch": 211} {"train_loss": -7.819498062133789, "global_step": 35536, "epoch": 211} {"train_loss": -7.8684539794921875, "global_step": 35537, "epoch": 211} {"train_loss": -7.724617004394531, "global_step": 35538, "epoch": 211} {"train_loss": -7.781232833862305, "global_step": 35539, "epoch": 211} {"train_loss": -7.516199111938477, "global_step": 35540, "epoch": 211} {"train_loss": -7.785022735595703, "global_step": 35541, "epoch": 211} {"train_loss": -7.60156774520874, "global_step": 35542, "epoch": 211} {"train_loss": -7.794066905975342, "global_step": 35543, "epoch": 211} {"train_loss": -7.493978500366211, "global_step": 35544, "epoch": 211} {"train_loss": -7.828885078430176, "global_step": 35545, "epoch": 211} {"train_loss": -7.740995407104492, "global_step": 35546, "epoch": 211} {"train_loss": -7.8591108322143555, "global_step": 35547, "epoch": 211} {"train_loss": -7.861250400543213, "global_step": 35548, "epoch": 211} {"train_loss": -7.790250778198242, "global_step": 35549, "epoch": 211} {"train_loss": -7.9426655769348145, "global_step": 35550, "epoch": 211} {"train_loss": -7.657259941101074, "global_step": 35551, "epoch": 211} {"train_loss": -7.982714653015137, "global_step": 35552, "epoch": 211} {"train_loss": -7.767428398132324, "global_step": 35553, "epoch": 211} {"train_loss": -7.813575744628906, "global_step": 35554, "epoch": 211} {"train_loss": -7.610484600067139, "global_step": 35555, "epoch": 211} {"train_loss": -7.950968265533447, "global_step": 35556, "epoch": 211} {"train_loss": -7.75961446762085, "global_step": 35557, "epoch": 211} {"train_loss": -7.695666313171387, "global_step": 35558, "epoch": 211} {"train_loss": -7.732208728790283, "global_step": 35559, "epoch": 211} {"train_loss": -7.790648460388184, "global_step": 35560, "epoch": 211} {"train_loss": -7.576321601867676, "global_step": 35561, "epoch": 211} {"train_loss": -7.767766952514648, "global_step": 35562, "epoch": 211} {"train_loss": -7.495367050170898, "global_step": 35563, "epoch": 211} {"train_loss": -7.815440654754639, "global_step": 35564, "epoch": 211} {"train_loss": -7.688376426696777, "global_step": 35565, "epoch": 211} {"train_loss": -8.030496597290039, "global_step": 35566, "epoch": 211} {"train_loss": -7.841190338134766, "global_step": 35567, "epoch": 211} {"train_loss": -7.891737937927246, "global_step": 35568, "epoch": 211} {"train_loss": -7.651827812194824, "global_step": 35569, "epoch": 211} {"train_loss": -7.955807685852051, "global_step": 35570, "epoch": 211} {"train_loss": -7.632969856262207, "global_step": 35571, "epoch": 211} {"train_loss": -7.898154258728027, "global_step": 35572, "epoch": 211} {"train_loss": -7.230539321899414, "global_step": 35573, "epoch": 211} {"train_loss": -7.772315979003906, "global_step": 35574, "epoch": 211} {"train_loss": -7.670754432678223, "global_step": 35575, "epoch": 211} {"train_loss": -7.8110198974609375, "global_step": 35576, "epoch": 211} {"train_loss": -7.744988441467285, "global_step": 35577, "epoch": 211} {"train_loss": -7.923956394195557, "global_step": 35578, "epoch": 211} {"train_loss": -7.876384735107422, "global_step": 35579, "epoch": 211} {"train_loss": -7.953549385070801, "global_step": 35580, "epoch": 211} {"train_loss": -7.892313003540039, "global_step": 35581, "epoch": 211} {"train_loss": -7.770116329193115, "global_step": 35582, "epoch": 211} {"train_loss": -7.675166130065918, "global_step": 35583, "epoch": 211} {"train_loss": -7.938216209411621, "global_step": 35584, "epoch": 211} {"train_loss": -7.8035783767700195, "global_step": 35585, "epoch": 211} {"train_loss": -7.865966796875, "global_step": 35586, "epoch": 211} {"train_loss": -7.679058074951172, "global_step": 35587, "epoch": 211} {"train_loss": -7.6569976806640625, "global_step": 35588, "epoch": 211} {"train_loss": -7.573494911193848, "global_step": 35589, "epoch": 211} {"train_loss": -7.5574750900268555, "global_step": 35590, "epoch": 211} {"train_loss": -7.62298583984375, "global_step": 35591, "epoch": 211} {"train_loss": -7.761538505554199, "global_step": 35592, "epoch": 211} {"train_loss": -7.683494567871094, "global_step": 35593, "epoch": 211} {"train_loss": -7.873185634613037, "global_step": 35594, "epoch": 211} {"train_loss": -7.803738594055176, "global_step": 35595, "epoch": 211} {"train_loss": -7.718964576721191, "global_step": 35596, "epoch": 211} {"train_loss": -7.780221939086914, "global_step": 35597, "epoch": 211} {"train_loss": -7.591398239135742, "global_step": 35598, "epoch": 211} {"train_loss": -7.831496715545654, "global_step": 35599, "epoch": 211} {"train_loss": -7.748709201812744, "global_step": 35600, "epoch": 211} {"train_loss": -7.740461349487305, "global_step": 35601, "epoch": 211} {"train_loss": -7.764562606811523, "global_step": 35602, "epoch": 211} {"train_loss": -7.9194488525390625, "global_step": 35603, "epoch": 211} {"train_loss": -7.743121147155762, "global_step": 35604, "epoch": 211} {"train_loss": -7.445074081420898, "global_step": 35605, "epoch": 211} {"train_loss": -7.741096496582031, "global_step": 35606, "epoch": 211} {"train_loss": -7.932498455047607, "global_step": 35607, "epoch": 211} {"train_loss": -7.53134822845459, "global_step": 35608, "epoch": 211} {"train_loss": -7.682624816894531, "global_step": 35609, "epoch": 211} {"train_loss": -7.842841148376465, "global_step": 35610, "epoch": 211} {"train_loss": -7.632019996643066, "global_step": 35611, "epoch": 211} {"train_loss": -7.752469062805176, "global_step": 35612, "epoch": 211} {"train_loss": -7.740586280822754, "global_step": 35613, "epoch": 211} {"train_loss": -7.509066581726074, "global_step": 35614, "epoch": 211} {"train_loss": -7.70905693939754, "global_step": 35615, "epoch": 211, "val_loss": 185899.84375} {"train_loss": -7.7526726722717285, "global_step": 35616, "epoch": 212} {"train_loss": -7.736151218414307, "global_step": 35617, "epoch": 212} {"train_loss": -8.048534393310547, "global_step": 35618, "epoch": 212} {"train_loss": -7.943866729736328, "global_step": 35619, "epoch": 212} {"train_loss": -7.838552951812744, "global_step": 35620, "epoch": 212} {"train_loss": -8.093360900878906, "global_step": 35621, "epoch": 212} {"train_loss": -7.465500831604004, "global_step": 35622, "epoch": 212} {"train_loss": -7.677281856536865, "global_step": 35623, "epoch": 212} {"train_loss": -7.876639366149902, "global_step": 35624, "epoch": 212} {"train_loss": -7.543586254119873, "global_step": 35625, "epoch": 212} {"train_loss": -7.895907402038574, "global_step": 35626, "epoch": 212} {"train_loss": -7.782672882080078, "global_step": 35627, "epoch": 212} {"train_loss": -7.534219741821289, "global_step": 35628, "epoch": 212} {"train_loss": -7.930453777313232, "global_step": 35629, "epoch": 212} {"train_loss": -7.908980369567871, "global_step": 35630, "epoch": 212} {"train_loss": -7.786050796508789, "global_step": 35631, "epoch": 212} {"train_loss": -7.367374897003174, "global_step": 35632, "epoch": 212} {"train_loss": -7.7187933921813965, "global_step": 35633, "epoch": 212} {"train_loss": -7.534071922302246, "global_step": 35634, "epoch": 212} {"train_loss": -7.740486145019531, "global_step": 35635, "epoch": 212} {"train_loss": -7.686301231384277, "global_step": 35636, "epoch": 212} {"train_loss": -7.719542503356934, "global_step": 35637, "epoch": 212} {"train_loss": -7.709148406982422, "global_step": 35638, "epoch": 212} {"train_loss": -7.713252067565918, "global_step": 35639, "epoch": 212} {"train_loss": -7.734626770019531, "global_step": 35640, "epoch": 212} {"train_loss": -7.232934951782227, "global_step": 35641, "epoch": 212} {"train_loss": -7.734899997711182, "global_step": 35642, "epoch": 212} {"train_loss": -7.702029705047607, "global_step": 35643, "epoch": 212} {"train_loss": -7.662895202636719, "global_step": 35644, "epoch": 212} {"train_loss": -7.786600112915039, "global_step": 35645, "epoch": 212} {"train_loss": -7.482760906219482, "global_step": 35646, "epoch": 212} {"train_loss": -7.746659755706787, "global_step": 35647, "epoch": 212} {"train_loss": -7.872738838195801, "global_step": 35648, "epoch": 212} {"train_loss": -7.804659843444824, "global_step": 35649, "epoch": 212} {"train_loss": -7.662509918212891, "global_step": 35650, "epoch": 212} {"train_loss": -7.601070404052734, "global_step": 35651, "epoch": 212} {"train_loss": -7.570461273193359, "global_step": 35652, "epoch": 212} {"train_loss": -7.805253982543945, "global_step": 35653, "epoch": 212} {"train_loss": -7.696214199066162, "global_step": 35654, "epoch": 212} {"train_loss": -7.765845775604248, "global_step": 35655, "epoch": 212} {"train_loss": -7.971478462219238, "global_step": 35656, "epoch": 212} {"train_loss": -7.817910671234131, "global_step": 35657, "epoch": 212} {"train_loss": -7.862400531768799, "global_step": 35658, "epoch": 212} {"train_loss": -7.958531379699707, "global_step": 35659, "epoch": 212} {"train_loss": -7.8030686378479, "global_step": 35660, "epoch": 212} {"train_loss": -7.605660438537598, "global_step": 35661, "epoch": 212} {"train_loss": -7.834816932678223, "global_step": 35662, "epoch": 212} {"train_loss": -7.852883815765381, "global_step": 35663, "epoch": 212} {"train_loss": -7.963694095611572, "global_step": 35664, "epoch": 212} {"train_loss": -7.96583366394043, "global_step": 35665, "epoch": 212} {"train_loss": -7.641800880432129, "global_step": 35666, "epoch": 212} {"train_loss": -7.572188377380371, "global_step": 35667, "epoch": 212} {"train_loss": -7.809778690338135, "global_step": 35668, "epoch": 212} {"train_loss": -7.631091594696045, "global_step": 35669, "epoch": 212} {"train_loss": -7.880969047546387, "global_step": 35670, "epoch": 212} {"train_loss": -7.933654308319092, "global_step": 35671, "epoch": 212} {"train_loss": -7.792062759399414, "global_step": 35672, "epoch": 212} {"train_loss": -7.903108596801758, "global_step": 35673, "epoch": 212} {"train_loss": -7.518965244293213, "global_step": 35674, "epoch": 212} {"train_loss": -7.645648002624512, "global_step": 35675, "epoch": 212} {"train_loss": -7.7676286697387695, "global_step": 35676, "epoch": 212} {"train_loss": -7.396211624145508, "global_step": 35677, "epoch": 212} {"train_loss": -7.925802230834961, "global_step": 35678, "epoch": 212} {"train_loss": -7.420561790466309, "global_step": 35679, "epoch": 212} {"train_loss": -7.586420059204102, "global_step": 35680, "epoch": 212} {"train_loss": -7.6370649337768555, "global_step": 35681, "epoch": 212} {"train_loss": -7.681604385375977, "global_step": 35682, "epoch": 212} {"train_loss": -7.6017866134643555, "global_step": 35683, "epoch": 212} {"train_loss": -7.748722076416016, "global_step": 35684, "epoch": 212} {"train_loss": -7.640841960906982, "global_step": 35685, "epoch": 212} {"train_loss": -7.656588077545166, "global_step": 35686, "epoch": 212} {"train_loss": -7.651081085205078, "global_step": 35687, "epoch": 212} {"train_loss": -7.655671119689941, "global_step": 35688, "epoch": 212} {"train_loss": -7.662435054779053, "global_step": 35689, "epoch": 212} {"train_loss": -7.726573944091797, "global_step": 35690, "epoch": 212} {"train_loss": -7.62522029876709, "global_step": 35691, "epoch": 212} {"train_loss": -7.880898475646973, "global_step": 35692, "epoch": 212} {"train_loss": -7.621858596801758, "global_step": 35693, "epoch": 212} {"train_loss": -7.79909086227417, "global_step": 35694, "epoch": 212} {"train_loss": -7.832057952880859, "global_step": 35695, "epoch": 212} {"train_loss": -7.768711090087891, "global_step": 35696, "epoch": 212} {"train_loss": -7.603443145751953, "global_step": 35697, "epoch": 212} {"train_loss": -7.709118843078613, "global_step": 35698, "epoch": 212} {"train_loss": -7.656177520751953, "global_step": 35699, "epoch": 212} {"train_loss": -7.812241077423096, "global_step": 35700, "epoch": 212} {"train_loss": -7.844861030578613, "global_step": 35701, "epoch": 212} {"train_loss": -7.930906295776367, "global_step": 35702, "epoch": 212} {"train_loss": -7.742319107055664, "global_step": 35703, "epoch": 212} {"train_loss": -7.894705772399902, "global_step": 35704, "epoch": 212} {"train_loss": -7.692107200622559, "global_step": 35705, "epoch": 212} {"train_loss": -7.8802995681762695, "global_step": 35706, "epoch": 212} {"train_loss": -7.769662857055664, "global_step": 35707, "epoch": 212} {"train_loss": -7.708348751068115, "global_step": 35708, "epoch": 212} {"train_loss": -7.974570274353027, "global_step": 35709, "epoch": 212} {"train_loss": -7.992213249206543, "global_step": 35710, "epoch": 212} {"train_loss": -7.871303558349609, "global_step": 35711, "epoch": 212} {"train_loss": -7.916247844696045, "global_step": 35712, "epoch": 212} {"train_loss": -7.775832653045654, "global_step": 35713, "epoch": 212} {"train_loss": -7.675143241882324, "global_step": 35714, "epoch": 212} {"train_loss": -7.855390548706055, "global_step": 35715, "epoch": 212} {"train_loss": -7.855881214141846, "global_step": 35716, "epoch": 212} {"train_loss": -7.947359561920166, "global_step": 35717, "epoch": 212} {"train_loss": -7.948082447052002, "global_step": 35718, "epoch": 212} {"train_loss": -7.75468111038208, "global_step": 35719, "epoch": 212} {"train_loss": -7.796594142913818, "global_step": 35720, "epoch": 212} {"train_loss": -7.754560470581055, "global_step": 35721, "epoch": 212} {"train_loss": -7.8827714920043945, "global_step": 35722, "epoch": 212} {"train_loss": -7.86676549911499, "global_step": 35723, "epoch": 212} {"train_loss": -7.834988117218018, "global_step": 35724, "epoch": 212} {"train_loss": -7.846357822418213, "global_step": 35725, "epoch": 212} {"train_loss": -7.7121686935424805, "global_step": 35726, "epoch": 212} {"train_loss": -7.856652736663818, "global_step": 35727, "epoch": 212} {"train_loss": -7.735940933227539, "global_step": 35728, "epoch": 212} {"train_loss": -7.751981258392334, "global_step": 35729, "epoch": 212} {"train_loss": -7.700948715209961, "global_step": 35730, "epoch": 212} {"train_loss": -7.916428565979004, "global_step": 35731, "epoch": 212} {"train_loss": -7.887604713439941, "global_step": 35732, "epoch": 212} {"train_loss": -7.826475143432617, "global_step": 35733, "epoch": 212} {"train_loss": -7.839545249938965, "global_step": 35734, "epoch": 212} {"train_loss": -7.7789530754089355, "global_step": 35735, "epoch": 212} {"train_loss": -7.789515495300293, "global_step": 35736, "epoch": 212} {"train_loss": -7.739326477050781, "global_step": 35737, "epoch": 212} {"train_loss": -7.6714911460876465, "global_step": 35738, "epoch": 212} {"train_loss": -7.787569999694824, "global_step": 35739, "epoch": 212} {"train_loss": -7.699368476867676, "global_step": 35740, "epoch": 212} {"train_loss": -7.940596103668213, "global_step": 35741, "epoch": 212} {"train_loss": -7.805080890655518, "global_step": 35742, "epoch": 212} {"train_loss": -7.822495937347412, "global_step": 35743, "epoch": 212} {"train_loss": -7.836129188537598, "global_step": 35744, "epoch": 212} {"train_loss": -7.8323750495910645, "global_step": 35745, "epoch": 212} {"train_loss": -7.648252964019775, "global_step": 35746, "epoch": 212} {"train_loss": -7.701198577880859, "global_step": 35747, "epoch": 212} {"train_loss": -7.826162338256836, "global_step": 35748, "epoch": 212} {"train_loss": -7.616039752960205, "global_step": 35749, "epoch": 212} {"train_loss": -7.737353324890137, "global_step": 35750, "epoch": 212} {"train_loss": -7.536302089691162, "global_step": 35751, "epoch": 212} {"train_loss": -7.582959175109863, "global_step": 35752, "epoch": 212} {"train_loss": -7.893646240234375, "global_step": 35753, "epoch": 212} {"train_loss": -7.848136901855469, "global_step": 35754, "epoch": 212} {"train_loss": -7.673013210296631, "global_step": 35755, "epoch": 212} {"train_loss": -7.823893070220947, "global_step": 35756, "epoch": 212} {"train_loss": -7.816259384155273, "global_step": 35757, "epoch": 212} {"train_loss": -7.793323040008545, "global_step": 35758, "epoch": 212} {"train_loss": -7.66789436340332, "global_step": 35759, "epoch": 212} {"train_loss": -7.949460983276367, "global_step": 35760, "epoch": 212} {"train_loss": -7.744943141937256, "global_step": 35761, "epoch": 212} {"train_loss": -7.893203258514404, "global_step": 35762, "epoch": 212} {"train_loss": -7.830658912658691, "global_step": 35763, "epoch": 212} {"train_loss": -8.010505676269531, "global_step": 35764, "epoch": 212} {"train_loss": -7.891789436340332, "global_step": 35765, "epoch": 212} {"train_loss": -7.901937484741211, "global_step": 35766, "epoch": 212} {"train_loss": -8.14225959777832, "global_step": 35767, "epoch": 212} {"train_loss": -7.811282157897949, "global_step": 35768, "epoch": 212} {"train_loss": -7.842438697814941, "global_step": 35769, "epoch": 212} {"train_loss": -7.788277626037598, "global_step": 35770, "epoch": 212} {"train_loss": -7.627573490142822, "global_step": 35771, "epoch": 212} {"train_loss": -8.010865211486816, "global_step": 35772, "epoch": 212} {"train_loss": -7.7849321365356445, "global_step": 35773, "epoch": 212} {"train_loss": -7.924914360046387, "global_step": 35774, "epoch": 212} {"train_loss": -8.112735748291016, "global_step": 35775, "epoch": 212} {"train_loss": -7.717221260070801, "global_step": 35776, "epoch": 212} {"train_loss": -7.72103214263916, "global_step": 35777, "epoch": 212} {"train_loss": -7.658533573150635, "global_step": 35778, "epoch": 212} {"train_loss": -7.580598831176758, "global_step": 35779, "epoch": 212} {"train_loss": -7.662604808807373, "global_step": 35780, "epoch": 212} {"train_loss": -7.42857027053833, "global_step": 35781, "epoch": 212} {"train_loss": -7.446652412414551, "global_step": 35782, "epoch": 212} {"train_loss": -7.762726116748083, "global_step": 35783, "epoch": 212, "val_loss": 186168.125} {"train_loss": -7.94313907623291, "global_step": 35784, "epoch": 213} {"train_loss": -7.700198173522949, "global_step": 35785, "epoch": 213} {"train_loss": -7.753595352172852, "global_step": 35786, "epoch": 213} {"train_loss": -7.561432838439941, "global_step": 35787, "epoch": 213} {"train_loss": -7.727025985717773, "global_step": 35788, "epoch": 213} {"train_loss": -7.811870098114014, "global_step": 35789, "epoch": 213} {"train_loss": -7.566089630126953, "global_step": 35790, "epoch": 213} {"train_loss": -7.720499515533447, "global_step": 35791, "epoch": 213} {"train_loss": -7.603837966918945, "global_step": 35792, "epoch": 213} {"train_loss": -7.7798380851745605, "global_step": 35793, "epoch": 213} {"train_loss": -7.522590637207031, "global_step": 35794, "epoch": 213} {"train_loss": -8.027862548828125, "global_step": 35795, "epoch": 213} {"train_loss": -7.78816556930542, "global_step": 35796, "epoch": 213} {"train_loss": -7.796910762786865, "global_step": 35797, "epoch": 213} {"train_loss": -7.605320453643799, "global_step": 35798, "epoch": 213} {"train_loss": -7.857844352722168, "global_step": 35799, "epoch": 213} {"train_loss": -7.573019981384277, "global_step": 35800, "epoch": 213} {"train_loss": -7.747010231018066, "global_step": 35801, "epoch": 213} {"train_loss": -7.547339916229248, "global_step": 35802, "epoch": 213} {"train_loss": -7.808971881866455, "global_step": 35803, "epoch": 213} {"train_loss": -7.655384063720703, "global_step": 35804, "epoch": 213} {"train_loss": -7.78964900970459, "global_step": 35805, "epoch": 213} {"train_loss": -7.529908180236816, "global_step": 35806, "epoch": 213} {"train_loss": -7.8941826820373535, "global_step": 35807, "epoch": 213} {"train_loss": -7.682357311248779, "global_step": 35808, "epoch": 213} {"train_loss": -7.721495151519775, "global_step": 35809, "epoch": 213} {"train_loss": -7.994368076324463, "global_step": 35810, "epoch": 213} {"train_loss": -7.490082740783691, "global_step": 35811, "epoch": 213} {"train_loss": -7.95065975189209, "global_step": 35812, "epoch": 213} {"train_loss": -7.961843013763428, "global_step": 35813, "epoch": 213} {"train_loss": -7.797560691833496, "global_step": 35814, "epoch": 213} {"train_loss": -7.840723037719727, "global_step": 35815, "epoch": 213} {"train_loss": -8.023394584655762, "global_step": 35816, "epoch": 213} {"train_loss": -7.6942548751831055, "global_step": 35817, "epoch": 213} {"train_loss": -8.04783821105957, "global_step": 35818, "epoch": 213} {"train_loss": -7.806661605834961, "global_step": 35819, "epoch": 213} {"train_loss": -8.143671989440918, "global_step": 35820, "epoch": 213} {"train_loss": -7.6277899742126465, "global_step": 35821, "epoch": 213} {"train_loss": -7.942230224609375, "global_step": 35822, "epoch": 213} {"train_loss": -7.615747451782227, "global_step": 35823, "epoch": 213} {"train_loss": -7.530366897583008, "global_step": 35824, "epoch": 213} {"train_loss": -7.888801574707031, "global_step": 35825, "epoch": 213} {"train_loss": -7.7396559715271, "global_step": 35826, "epoch": 213} {"train_loss": -7.681840419769287, "global_step": 35827, "epoch": 213} {"train_loss": -7.530364036560059, "global_step": 35828, "epoch": 213} {"train_loss": -7.78143310546875, "global_step": 35829, "epoch": 213} {"train_loss": -7.81660270690918, "global_step": 35830, "epoch": 213} {"train_loss": -7.899900436401367, "global_step": 35831, "epoch": 213} {"train_loss": -7.763004302978516, "global_step": 35832, "epoch": 213} {"train_loss": -7.516613960266113, "global_step": 35833, "epoch": 213} {"train_loss": -7.975295066833496, "global_step": 35834, "epoch": 213} {"train_loss": -7.949026584625244, "global_step": 35835, "epoch": 213} {"train_loss": -7.68479061126709, "global_step": 35836, "epoch": 213} {"train_loss": -7.8273468017578125, "global_step": 35837, "epoch": 213} {"train_loss": -7.926520347595215, "global_step": 35838, "epoch": 213} {"train_loss": -7.640568256378174, "global_step": 35839, "epoch": 213} {"train_loss": -7.673612594604492, "global_step": 35840, "epoch": 213} {"train_loss": -7.785098075866699, "global_step": 35841, "epoch": 213} {"train_loss": -7.779754638671875, "global_step": 35842, "epoch": 213} {"train_loss": -7.400916576385498, "global_step": 35843, "epoch": 213} {"train_loss": -7.769056797027588, "global_step": 35844, "epoch": 213} {"train_loss": -7.485785961151123, "global_step": 35845, "epoch": 213} {"train_loss": -7.845615386962891, "global_step": 35846, "epoch": 213} {"train_loss": -7.508955955505371, "global_step": 35847, "epoch": 213} {"train_loss": -7.851686000823975, "global_step": 35848, "epoch": 213} {"train_loss": -7.65704345703125, "global_step": 35849, "epoch": 213} {"train_loss": -7.449554443359375, "global_step": 35850, "epoch": 213} {"train_loss": -7.598420143127441, "global_step": 35851, "epoch": 213} {"train_loss": -7.175820350646973, "global_step": 35852, "epoch": 213} {"train_loss": -7.7022385597229, "global_step": 35853, "epoch": 213} {"train_loss": -7.428655624389648, "global_step": 35854, "epoch": 213} {"train_loss": -7.831307888031006, "global_step": 35855, "epoch": 213} {"train_loss": -7.557175636291504, "global_step": 35856, "epoch": 213} {"train_loss": -7.239901542663574, "global_step": 35857, "epoch": 213} {"train_loss": -7.765013694763184, "global_step": 35858, "epoch": 213} {"train_loss": -7.375347137451172, "global_step": 35859, "epoch": 213} {"train_loss": -7.318813323974609, "global_step": 35860, "epoch": 213} {"train_loss": -7.523924350738525, "global_step": 35861, "epoch": 213} {"train_loss": -7.3718671798706055, "global_step": 35862, "epoch": 213} {"train_loss": -7.634413242340088, "global_step": 35863, "epoch": 213} {"train_loss": -7.820575714111328, "global_step": 35864, "epoch": 213} {"train_loss": -7.483524322509766, "global_step": 35865, "epoch": 213} {"train_loss": -7.759426116943359, "global_step": 35866, "epoch": 213} {"train_loss": -7.522198677062988, "global_step": 35867, "epoch": 213} {"train_loss": -7.704712390899658, "global_step": 35868, "epoch": 213} {"train_loss": -7.4269795417785645, "global_step": 35869, "epoch": 213} {"train_loss": -7.421948432922363, "global_step": 35870, "epoch": 213} {"train_loss": -7.70984411239624, "global_step": 35871, "epoch": 213} {"train_loss": -7.468413829803467, "global_step": 35872, "epoch": 213} {"train_loss": -7.69054651260376, "global_step": 35873, "epoch": 213} {"train_loss": -7.850632667541504, "global_step": 35874, "epoch": 213} {"train_loss": -7.720559120178223, "global_step": 35875, "epoch": 213} {"train_loss": -7.589836120605469, "global_step": 35876, "epoch": 213} {"train_loss": -7.9015984535217285, "global_step": 35877, "epoch": 213} {"train_loss": -7.6840410232543945, "global_step": 35878, "epoch": 213} {"train_loss": -7.698917388916016, "global_step": 35879, "epoch": 213} {"train_loss": -7.8431830406188965, "global_step": 35880, "epoch": 213} {"train_loss": -7.917513847351074, "global_step": 35881, "epoch": 213} {"train_loss": -7.614781379699707, "global_step": 35882, "epoch": 213} {"train_loss": -7.836676120758057, "global_step": 35883, "epoch": 213} {"train_loss": -7.977871894836426, "global_step": 35884, "epoch": 213} {"train_loss": -7.780252456665039, "global_step": 35885, "epoch": 213} {"train_loss": -7.863563537597656, "global_step": 35886, "epoch": 213} {"train_loss": -7.8118696212768555, "global_step": 35887, "epoch": 213} {"train_loss": -7.8465986251831055, "global_step": 35888, "epoch": 213} {"train_loss": -7.860565662384033, "global_step": 35889, "epoch": 213} {"train_loss": -7.744418621063232, "global_step": 35890, "epoch": 213} {"train_loss": -7.745300769805908, "global_step": 35891, "epoch": 213} {"train_loss": -7.841052055358887, "global_step": 35892, "epoch": 213} {"train_loss": -7.646218299865723, "global_step": 35893, "epoch": 213} {"train_loss": -7.7735185623168945, "global_step": 35894, "epoch": 213} {"train_loss": -7.823832035064697, "global_step": 35895, "epoch": 213} {"train_loss": -7.829410552978516, "global_step": 35896, "epoch": 213} {"train_loss": -7.981098175048828, "global_step": 35897, "epoch": 213} {"train_loss": -7.742502212524414, "global_step": 35898, "epoch": 213} {"train_loss": -7.833749294281006, "global_step": 35899, "epoch": 213} {"train_loss": -7.9985456466674805, "global_step": 35900, "epoch": 213} {"train_loss": -7.9221343994140625, "global_step": 35901, "epoch": 213} {"train_loss": -7.614522933959961, "global_step": 35902, "epoch": 213} {"train_loss": -7.749428749084473, "global_step": 35903, "epoch": 213} {"train_loss": -7.9123029708862305, "global_step": 35904, "epoch": 213} {"train_loss": -7.849159240722656, "global_step": 35905, "epoch": 213} {"train_loss": -7.59138822555542, "global_step": 35906, "epoch": 213} {"train_loss": -7.738544464111328, "global_step": 35907, "epoch": 213} {"train_loss": -7.750196933746338, "global_step": 35908, "epoch": 213} {"train_loss": -7.739588737487793, "global_step": 35909, "epoch": 213} {"train_loss": -7.907863140106201, "global_step": 35910, "epoch": 213} {"train_loss": -7.819216728210449, "global_step": 35911, "epoch": 213} {"train_loss": -7.754363059997559, "global_step": 35912, "epoch": 213} {"train_loss": -7.845318794250488, "global_step": 35913, "epoch": 213} {"train_loss": -7.715803146362305, "global_step": 35914, "epoch": 213} {"train_loss": -7.84946346282959, "global_step": 35915, "epoch": 213} {"train_loss": -7.705072402954102, "global_step": 35916, "epoch": 213} {"train_loss": -7.755133628845215, "global_step": 35917, "epoch": 213} {"train_loss": -7.686911582946777, "global_step": 35918, "epoch": 213} {"train_loss": -7.735418796539307, "global_step": 35919, "epoch": 213} {"train_loss": -7.729531288146973, "global_step": 35920, "epoch": 213} {"train_loss": -7.702132225036621, "global_step": 35921, "epoch": 213} {"train_loss": -7.774538993835449, "global_step": 35922, "epoch": 213} {"train_loss": -7.870938301086426, "global_step": 35923, "epoch": 213} {"train_loss": -8.098569869995117, "global_step": 35924, "epoch": 213} {"train_loss": -7.746360778808594, "global_step": 35925, "epoch": 213} {"train_loss": -7.952961444854736, "global_step": 35926, "epoch": 213} {"train_loss": -7.947005748748779, "global_step": 35927, "epoch": 213} {"train_loss": -7.829206943511963, "global_step": 35928, "epoch": 213} {"train_loss": -7.926034450531006, "global_step": 35929, "epoch": 213} {"train_loss": -7.89704704284668, "global_step": 35930, "epoch": 213} {"train_loss": -7.8064422607421875, "global_step": 35931, "epoch": 213} {"train_loss": -7.777659893035889, "global_step": 35932, "epoch": 213} {"train_loss": -7.827044486999512, "global_step": 35933, "epoch": 213} {"train_loss": -7.808518409729004, "global_step": 35934, "epoch": 213} {"train_loss": -7.790726661682129, "global_step": 35935, "epoch": 213} {"train_loss": -7.913678169250488, "global_step": 35936, "epoch": 213} {"train_loss": -8.073116302490234, "global_step": 35937, "epoch": 213} {"train_loss": -7.7806220054626465, "global_step": 35938, "epoch": 213} {"train_loss": -7.8655290603637695, "global_step": 35939, "epoch": 213} {"train_loss": -8.011966705322266, "global_step": 35940, "epoch": 213} {"train_loss": -7.748631000518799, "global_step": 35941, "epoch": 213} {"train_loss": -7.688251972198486, "global_step": 35942, "epoch": 213} {"train_loss": -7.731438636779785, "global_step": 35943, "epoch": 213} {"train_loss": -7.776247978210449, "global_step": 35944, "epoch": 213} {"train_loss": -7.962087154388428, "global_step": 35945, "epoch": 213} {"train_loss": -7.827975273132324, "global_step": 35946, "epoch": 213} {"train_loss": -7.668412685394287, "global_step": 35947, "epoch": 213} {"train_loss": -7.663080215454102, "global_step": 35948, "epoch": 213} {"train_loss": -7.923505783081055, "global_step": 35949, "epoch": 213} {"train_loss": -7.233353614807129, "global_step": 35950, "epoch": 213} {"train_loss": -7.744940320650737, "global_step": 35951, "epoch": 213, "val_loss": 187404.984375} {"train_loss": -7.477118968963623, "global_step": 35952, "epoch": 214} {"train_loss": -7.691633224487305, "global_step": 35953, "epoch": 214} {"train_loss": -7.375140190124512, "global_step": 35954, "epoch": 214} {"train_loss": -7.627555847167969, "global_step": 35955, "epoch": 214} {"train_loss": -7.376747131347656, "global_step": 35956, "epoch": 214} {"train_loss": -7.888683795928955, "global_step": 35957, "epoch": 214} {"train_loss": -7.571291446685791, "global_step": 35958, "epoch": 214} {"train_loss": -7.5511980056762695, "global_step": 35959, "epoch": 214} {"train_loss": -7.591397762298584, "global_step": 35960, "epoch": 214} {"train_loss": -7.392108917236328, "global_step": 35961, "epoch": 214} {"train_loss": -7.457056999206543, "global_step": 35962, "epoch": 214} {"train_loss": -7.508121490478516, "global_step": 35963, "epoch": 214} {"train_loss": -7.598144054412842, "global_step": 35964, "epoch": 214} {"train_loss": -7.619079113006592, "global_step": 35965, "epoch": 214} {"train_loss": -7.512456893920898, "global_step": 35966, "epoch": 214} {"train_loss": -7.663564682006836, "global_step": 35967, "epoch": 214} {"train_loss": -7.686948299407959, "global_step": 35968, "epoch": 214} {"train_loss": -7.6745171546936035, "global_step": 35969, "epoch": 214} {"train_loss": -7.684337615966797, "global_step": 35970, "epoch": 214} {"train_loss": -7.654257297515869, "global_step": 35971, "epoch": 214} {"train_loss": -7.748351097106934, "global_step": 35972, "epoch": 214} {"train_loss": -7.5085296630859375, "global_step": 35973, "epoch": 214} {"train_loss": -7.70688009262085, "global_step": 35974, "epoch": 214} {"train_loss": -7.779549598693848, "global_step": 35975, "epoch": 214} {"train_loss": -7.786799430847168, "global_step": 35976, "epoch": 214} {"train_loss": -7.7398529052734375, "global_step": 35977, "epoch": 214} {"train_loss": -7.74567985534668, "global_step": 35978, "epoch": 214} {"train_loss": -7.929142951965332, "global_step": 35979, "epoch": 214} {"train_loss": -7.813488960266113, "global_step": 35980, "epoch": 214} {"train_loss": -7.873661994934082, "global_step": 35981, "epoch": 214} {"train_loss": -7.586376190185547, "global_step": 35982, "epoch": 214} {"train_loss": -7.8218841552734375, "global_step": 35983, "epoch": 214} {"train_loss": -7.656745910644531, "global_step": 35984, "epoch": 214} {"train_loss": -7.684370517730713, "global_step": 35985, "epoch": 214} {"train_loss": -7.461562156677246, "global_step": 35986, "epoch": 214} {"train_loss": -7.556288719177246, "global_step": 35987, "epoch": 214} {"train_loss": -7.796279430389404, "global_step": 35988, "epoch": 214} {"train_loss": -7.415252685546875, "global_step": 35989, "epoch": 214} {"train_loss": -7.773237228393555, "global_step": 35990, "epoch": 214} {"train_loss": -7.891330718994141, "global_step": 35991, "epoch": 214} {"train_loss": -7.808990955352783, "global_step": 35992, "epoch": 214} {"train_loss": -7.640242576599121, "global_step": 35993, "epoch": 214} {"train_loss": -7.65467643737793, "global_step": 35994, "epoch": 214} {"train_loss": -7.7710466384887695, "global_step": 35995, "epoch": 214} {"train_loss": -7.398265838623047, "global_step": 35996, "epoch": 214} {"train_loss": -7.93519401550293, "global_step": 35997, "epoch": 214} {"train_loss": -7.6168646812438965, "global_step": 35998, "epoch": 214} {"train_loss": -7.5623931884765625, "global_step": 35999, "epoch": 214} {"train_loss": -7.931153774261475, "global_step": 36000, "epoch": 214} {"train_loss": -7.708621025085449, "global_step": 36001, "epoch": 214} {"train_loss": -7.359292984008789, "global_step": 36002, "epoch": 214} {"train_loss": -7.8809003829956055, "global_step": 36003, "epoch": 214} {"train_loss": -7.816975116729736, "global_step": 36004, "epoch": 214} {"train_loss": -7.7510881423950195, "global_step": 36005, "epoch": 214} {"train_loss": -7.677381992340088, "global_step": 36006, "epoch": 214} {"train_loss": -7.7675580978393555, "global_step": 36007, "epoch": 214} {"train_loss": -7.880099296569824, "global_step": 36008, "epoch": 214} {"train_loss": -7.89547061920166, "global_step": 36009, "epoch": 214} {"train_loss": -7.692696571350098, "global_step": 36010, "epoch": 214} {"train_loss": -7.889383792877197, "global_step": 36011, "epoch": 214} {"train_loss": -7.522819519042969, "global_step": 36012, "epoch": 214} {"train_loss": -7.608863830566406, "global_step": 36013, "epoch": 214} {"train_loss": -8.022369384765625, "global_step": 36014, "epoch": 214} {"train_loss": -7.7174859046936035, "global_step": 36015, "epoch": 214} {"train_loss": -7.392705917358398, "global_step": 36016, "epoch": 214} {"train_loss": -7.642302513122559, "global_step": 36017, "epoch": 214} {"train_loss": -7.445895195007324, "global_step": 36018, "epoch": 214} {"train_loss": -7.684497356414795, "global_step": 36019, "epoch": 214} {"train_loss": -7.867125511169434, "global_step": 36020, "epoch": 214} {"train_loss": -7.564627647399902, "global_step": 36021, "epoch": 214} {"train_loss": -7.57211446762085, "global_step": 36022, "epoch": 214} {"train_loss": -7.6308913230896, "global_step": 36023, "epoch": 214} {"train_loss": -7.795418739318848, "global_step": 36024, "epoch": 214} {"train_loss": -7.569850921630859, "global_step": 36025, "epoch": 214} {"train_loss": -7.727965831756592, "global_step": 36026, "epoch": 214} {"train_loss": -7.65201473236084, "global_step": 36027, "epoch": 214} {"train_loss": -7.564929485321045, "global_step": 36028, "epoch": 214} {"train_loss": -7.5090532302856445, "global_step": 36029, "epoch": 214} {"train_loss": -7.674562454223633, "global_step": 36030, "epoch": 214} {"train_loss": -7.756923675537109, "global_step": 36031, "epoch": 214} {"train_loss": -7.676641941070557, "global_step": 36032, "epoch": 214} {"train_loss": -7.689806938171387, "global_step": 36033, "epoch": 214} {"train_loss": -7.672810077667236, "global_step": 36034, "epoch": 214} {"train_loss": -7.73746395111084, "global_step": 36035, "epoch": 214} {"train_loss": -7.858266353607178, "global_step": 36036, "epoch": 214} {"train_loss": -7.926080703735352, "global_step": 36037, "epoch": 214} {"train_loss": -7.843512058258057, "global_step": 36038, "epoch": 214} {"train_loss": -7.764525413513184, "global_step": 36039, "epoch": 214} {"train_loss": -7.747393608093262, "global_step": 36040, "epoch": 214} {"train_loss": -7.634982109069824, "global_step": 36041, "epoch": 214} {"train_loss": -7.629141330718994, "global_step": 36042, "epoch": 214} {"train_loss": -7.764866352081299, "global_step": 36043, "epoch": 214} {"train_loss": -7.81425666809082, "global_step": 36044, "epoch": 214} {"train_loss": -7.969178199768066, "global_step": 36045, "epoch": 214} {"train_loss": -7.8153181076049805, "global_step": 36046, "epoch": 214} {"train_loss": -7.840231895446777, "global_step": 36047, "epoch": 214} {"train_loss": -7.913591384887695, "global_step": 36048, "epoch": 214} {"train_loss": -7.752219200134277, "global_step": 36049, "epoch": 214} {"train_loss": -7.762244701385498, "global_step": 36050, "epoch": 214} {"train_loss": -7.909032344818115, "global_step": 36051, "epoch": 214} {"train_loss": -7.793920516967773, "global_step": 36052, "epoch": 214} {"train_loss": -7.899033546447754, "global_step": 36053, "epoch": 214} {"train_loss": -7.906067848205566, "global_step": 36054, "epoch": 214} {"train_loss": -7.889284133911133, "global_step": 36055, "epoch": 214} {"train_loss": -7.892735481262207, "global_step": 36056, "epoch": 214} {"train_loss": -7.850709438323975, "global_step": 36057, "epoch": 214} {"train_loss": -7.904511451721191, "global_step": 36058, "epoch": 214} {"train_loss": -7.933547019958496, "global_step": 36059, "epoch": 214} {"train_loss": -7.814618110656738, "global_step": 36060, "epoch": 214} {"train_loss": -7.883902549743652, "global_step": 36061, "epoch": 214} {"train_loss": -7.48825740814209, "global_step": 36062, "epoch": 214} {"train_loss": -7.473083019256592, "global_step": 36063, "epoch": 214} {"train_loss": -7.677764415740967, "global_step": 36064, "epoch": 214} {"train_loss": -7.615026950836182, "global_step": 36065, "epoch": 214} {"train_loss": -7.712271690368652, "global_step": 36066, "epoch": 214} {"train_loss": -7.509764671325684, "global_step": 36067, "epoch": 214} {"train_loss": -7.626923561096191, "global_step": 36068, "epoch": 214} {"train_loss": -7.62238883972168, "global_step": 36069, "epoch": 214} {"train_loss": -7.8378753662109375, "global_step": 36070, "epoch": 214} {"train_loss": -7.81425666809082, "global_step": 36071, "epoch": 214} {"train_loss": -7.454873085021973, "global_step": 36072, "epoch": 214} {"train_loss": -7.692710876464844, "global_step": 36073, "epoch": 214} {"train_loss": -7.515405654907227, "global_step": 36074, "epoch": 214} {"train_loss": -7.747982501983643, "global_step": 36075, "epoch": 214} {"train_loss": -7.673642158508301, "global_step": 36076, "epoch": 214} {"train_loss": -7.64774751663208, "global_step": 36077, "epoch": 214} {"train_loss": -7.764752388000488, "global_step": 36078, "epoch": 214} {"train_loss": -7.862215042114258, "global_step": 36079, "epoch": 214} {"train_loss": -7.69118595123291, "global_step": 36080, "epoch": 214} {"train_loss": -7.820588111877441, "global_step": 36081, "epoch": 214} {"train_loss": -7.726559638977051, "global_step": 36082, "epoch": 214} {"train_loss": -7.7887139320373535, "global_step": 36083, "epoch": 214} {"train_loss": -7.723989486694336, "global_step": 36084, "epoch": 214} {"train_loss": -7.83234977722168, "global_step": 36085, "epoch": 214} {"train_loss": -7.735441207885742, "global_step": 36086, "epoch": 214} {"train_loss": -7.664638996124268, "global_step": 36087, "epoch": 214} {"train_loss": -7.855302810668945, "global_step": 36088, "epoch": 214} {"train_loss": -7.834040641784668, "global_step": 36089, "epoch": 214} {"train_loss": -7.8775787353515625, "global_step": 36090, "epoch": 214} {"train_loss": -7.807597637176514, "global_step": 36091, "epoch": 214} {"train_loss": -7.777082443237305, "global_step": 36092, "epoch": 214} {"train_loss": -7.649504661560059, "global_step": 36093, "epoch": 214} {"train_loss": -7.971203804016113, "global_step": 36094, "epoch": 214} {"train_loss": -7.976406097412109, "global_step": 36095, "epoch": 214} {"train_loss": -7.951922416687012, "global_step": 36096, "epoch": 214} {"train_loss": -7.785923004150391, "global_step": 36097, "epoch": 214} {"train_loss": -7.381499290466309, "global_step": 36098, "epoch": 214} {"train_loss": -7.744300842285156, "global_step": 36099, "epoch": 214} {"train_loss": -7.891876697540283, "global_step": 36100, "epoch": 214} {"train_loss": -7.728697776794434, "global_step": 36101, "epoch": 214} {"train_loss": -7.478869438171387, "global_step": 36102, "epoch": 214} {"train_loss": -7.903601169586182, "global_step": 36103, "epoch": 214} {"train_loss": -7.87741756439209, "global_step": 36104, "epoch": 214} {"train_loss": -7.481328964233398, "global_step": 36105, "epoch": 214} {"train_loss": -7.70140266418457, "global_step": 36106, "epoch": 214} {"train_loss": -7.502264976501465, "global_step": 36107, "epoch": 214} {"train_loss": -7.739535331726074, "global_step": 36108, "epoch": 214} {"train_loss": -7.228734016418457, "global_step": 36109, "epoch": 214} {"train_loss": -7.802728652954102, "global_step": 36110, "epoch": 214} {"train_loss": -7.344826698303223, "global_step": 36111, "epoch": 214} {"train_loss": -7.86915397644043, "global_step": 36112, "epoch": 214} {"train_loss": -7.709482192993164, "global_step": 36113, "epoch": 214} {"train_loss": -7.621015548706055, "global_step": 36114, "epoch": 214} {"train_loss": -7.544539451599121, "global_step": 36115, "epoch": 214} {"train_loss": -7.6429290771484375, "global_step": 36116, "epoch": 214} {"train_loss": -7.781655311584473, "global_step": 36117, "epoch": 214} {"train_loss": -7.647515296936035, "global_step": 36118, "epoch": 214} {"train_loss": -7.704886549995059, "global_step": 36119, "epoch": 214, "val_loss": 185711.609375} {"train_loss": -7.642365455627441, "global_step": 36120, "epoch": 215} {"train_loss": -7.9454193115234375, "global_step": 36121, "epoch": 215} {"train_loss": -7.842353820800781, "global_step": 36122, "epoch": 215} {"train_loss": -7.755350112915039, "global_step": 36123, "epoch": 215} {"train_loss": -7.7965922355651855, "global_step": 36124, "epoch": 215} {"train_loss": -7.606759071350098, "global_step": 36125, "epoch": 215} {"train_loss": -7.878625869750977, "global_step": 36126, "epoch": 215} {"train_loss": -7.880329132080078, "global_step": 36127, "epoch": 215} {"train_loss": -7.782883644104004, "global_step": 36128, "epoch": 215} {"train_loss": -7.847780227661133, "global_step": 36129, "epoch": 215} {"train_loss": -7.88767147064209, "global_step": 36130, "epoch": 215} {"train_loss": -7.796352386474609, "global_step": 36131, "epoch": 215} {"train_loss": -7.641237735748291, "global_step": 36132, "epoch": 215} {"train_loss": -7.628259658813477, "global_step": 36133, "epoch": 215} {"train_loss": -7.85261344909668, "global_step": 36134, "epoch": 215} {"train_loss": -7.76702356338501, "global_step": 36135, "epoch": 215} {"train_loss": -7.822781085968018, "global_step": 36136, "epoch": 215} {"train_loss": -7.9155192375183105, "global_step": 36137, "epoch": 215} {"train_loss": -7.794747829437256, "global_step": 36138, "epoch": 215} {"train_loss": -7.818040370941162, "global_step": 36139, "epoch": 215} {"train_loss": -7.931957721710205, "global_step": 36140, "epoch": 215} {"train_loss": -7.596691131591797, "global_step": 36141, "epoch": 215} {"train_loss": -7.765409469604492, "global_step": 36142, "epoch": 215} {"train_loss": -7.87686824798584, "global_step": 36143, "epoch": 215} {"train_loss": -7.578607559204102, "global_step": 36144, "epoch": 215} {"train_loss": -8.03805160522461, "global_step": 36145, "epoch": 215} {"train_loss": -8.012893676757812, "global_step": 36146, "epoch": 215} {"train_loss": -7.9702348709106445, "global_step": 36147, "epoch": 215} {"train_loss": -7.840227127075195, "global_step": 36148, "epoch": 215} {"train_loss": -7.999986171722412, "global_step": 36149, "epoch": 215} {"train_loss": -7.846645355224609, "global_step": 36150, "epoch": 215} {"train_loss": -7.774043083190918, "global_step": 36151, "epoch": 215} {"train_loss": -7.74034309387207, "global_step": 36152, "epoch": 215} {"train_loss": -7.822051048278809, "global_step": 36153, "epoch": 215} {"train_loss": -7.885668754577637, "global_step": 36154, "epoch": 215} {"train_loss": -7.833650588989258, "global_step": 36155, "epoch": 215} {"train_loss": -7.6661152839660645, "global_step": 36156, "epoch": 215} {"train_loss": -7.878744125366211, "global_step": 36157, "epoch": 215} {"train_loss": -7.634479522705078, "global_step": 36158, "epoch": 215} {"train_loss": -7.9650726318359375, "global_step": 36159, "epoch": 215} {"train_loss": -7.9398579597473145, "global_step": 36160, "epoch": 215} {"train_loss": -7.740849494934082, "global_step": 36161, "epoch": 215} {"train_loss": -7.852035045623779, "global_step": 36162, "epoch": 215} {"train_loss": -7.839541435241699, "global_step": 36163, "epoch": 215} {"train_loss": -7.853637218475342, "global_step": 36164, "epoch": 215} {"train_loss": -7.872278690338135, "global_step": 36165, "epoch": 215} {"train_loss": -7.652764320373535, "global_step": 36166, "epoch": 215} {"train_loss": -7.625749588012695, "global_step": 36167, "epoch": 215} {"train_loss": -7.896736145019531, "global_step": 36168, "epoch": 215} {"train_loss": -7.7205915451049805, "global_step": 36169, "epoch": 215} {"train_loss": -7.65594482421875, "global_step": 36170, "epoch": 215} {"train_loss": -7.750699520111084, "global_step": 36171, "epoch": 215} {"train_loss": -7.928106307983398, "global_step": 36172, "epoch": 215} {"train_loss": -7.514311790466309, "global_step": 36173, "epoch": 215} {"train_loss": -7.8152055740356445, "global_step": 36174, "epoch": 215} {"train_loss": -7.667834281921387, "global_step": 36175, "epoch": 215} {"train_loss": -7.616587162017822, "global_step": 36176, "epoch": 215} {"train_loss": -7.70196533203125, "global_step": 36177, "epoch": 215} {"train_loss": -7.797388076782227, "global_step": 36178, "epoch": 215} {"train_loss": -7.389904975891113, "global_step": 36179, "epoch": 215} {"train_loss": -7.80535888671875, "global_step": 36180, "epoch": 215} {"train_loss": -7.610383033752441, "global_step": 36181, "epoch": 215} {"train_loss": -7.7821855545043945, "global_step": 36182, "epoch": 215} {"train_loss": -7.891283988952637, "global_step": 36183, "epoch": 215} {"train_loss": -7.871113300323486, "global_step": 36184, "epoch": 215} {"train_loss": -7.825301647186279, "global_step": 36185, "epoch": 215} {"train_loss": -7.732940196990967, "global_step": 36186, "epoch": 215} {"train_loss": -7.738832473754883, "global_step": 36187, "epoch": 215} {"train_loss": -7.628207206726074, "global_step": 36188, "epoch": 215} {"train_loss": -7.598300933837891, "global_step": 36189, "epoch": 215} {"train_loss": -7.705638408660889, "global_step": 36190, "epoch": 215} {"train_loss": -7.888207912445068, "global_step": 36191, "epoch": 215} {"train_loss": -7.743140697479248, "global_step": 36192, "epoch": 215} {"train_loss": -7.668426990509033, "global_step": 36193, "epoch": 215} {"train_loss": -7.940731048583984, "global_step": 36194, "epoch": 215} {"train_loss": -7.7430853843688965, "global_step": 36195, "epoch": 215} {"train_loss": -7.71154260635376, "global_step": 36196, "epoch": 215} {"train_loss": -7.725960731506348, "global_step": 36197, "epoch": 215} {"train_loss": -7.676135063171387, "global_step": 36198, "epoch": 215} {"train_loss": -7.99550724029541, "global_step": 36199, "epoch": 215} {"train_loss": -7.794424057006836, "global_step": 36200, "epoch": 215} {"train_loss": -7.8558878898620605, "global_step": 36201, "epoch": 215} {"train_loss": -7.678579330444336, "global_step": 36202, "epoch": 215} {"train_loss": -7.919909477233887, "global_step": 36203, "epoch": 215} {"train_loss": -7.678230285644531, "global_step": 36204, "epoch": 215} {"train_loss": -7.805269718170166, "global_step": 36205, "epoch": 215} {"train_loss": -7.8882551193237305, "global_step": 36206, "epoch": 215} {"train_loss": -7.930625915527344, "global_step": 36207, "epoch": 215} {"train_loss": -7.617079734802246, "global_step": 36208, "epoch": 215} {"train_loss": -7.776986598968506, "global_step": 36209, "epoch": 215} {"train_loss": -7.719641208648682, "global_step": 36210, "epoch": 215} {"train_loss": -7.908009052276611, "global_step": 36211, "epoch": 215} {"train_loss": -7.942264080047607, "global_step": 36212, "epoch": 215} {"train_loss": -7.8624653816223145, "global_step": 36213, "epoch": 215} {"train_loss": -7.426715850830078, "global_step": 36214, "epoch": 215} {"train_loss": -7.867980480194092, "global_step": 36215, "epoch": 215} {"train_loss": -7.621049404144287, "global_step": 36216, "epoch": 215} {"train_loss": -7.2903032302856445, "global_step": 36217, "epoch": 215} {"train_loss": -7.754846096038818, "global_step": 36218, "epoch": 215} {"train_loss": -7.558032989501953, "global_step": 36219, "epoch": 215} {"train_loss": -7.367807388305664, "global_step": 36220, "epoch": 215} {"train_loss": -7.553551197052002, "global_step": 36221, "epoch": 215} {"train_loss": -7.6204962730407715, "global_step": 36222, "epoch": 215} {"train_loss": -7.381440162658691, "global_step": 36223, "epoch": 215} {"train_loss": -7.648087978363037, "global_step": 36224, "epoch": 215} {"train_loss": -7.611648082733154, "global_step": 36225, "epoch": 215} {"train_loss": -7.4959917068481445, "global_step": 36226, "epoch": 215} {"train_loss": -7.635986328125, "global_step": 36227, "epoch": 215} {"train_loss": -7.7531657218933105, "global_step": 36228, "epoch": 215} {"train_loss": -7.334112167358398, "global_step": 36229, "epoch": 215} {"train_loss": -7.498849868774414, "global_step": 36230, "epoch": 215} {"train_loss": -7.775474548339844, "global_step": 36231, "epoch": 215} {"train_loss": -7.576502799987793, "global_step": 36232, "epoch": 215} {"train_loss": -7.838671684265137, "global_step": 36233, "epoch": 215} {"train_loss": -7.58942174911499, "global_step": 36234, "epoch": 215} {"train_loss": -7.767099380493164, "global_step": 36235, "epoch": 215} {"train_loss": -7.508692741394043, "global_step": 36236, "epoch": 215} {"train_loss": -7.7534942626953125, "global_step": 36237, "epoch": 215} {"train_loss": -7.988943099975586, "global_step": 36238, "epoch": 215} {"train_loss": -7.828072547912598, "global_step": 36239, "epoch": 215} {"train_loss": -7.6850786209106445, "global_step": 36240, "epoch": 215} {"train_loss": -7.8017144203186035, "global_step": 36241, "epoch": 215} {"train_loss": -7.891448020935059, "global_step": 36242, "epoch": 215} {"train_loss": -7.571478843688965, "global_step": 36243, "epoch": 215} {"train_loss": -8.03453254699707, "global_step": 36244, "epoch": 215} {"train_loss": -7.752946853637695, "global_step": 36245, "epoch": 215} {"train_loss": -8.032812118530273, "global_step": 36246, "epoch": 215} {"train_loss": -7.639554977416992, "global_step": 36247, "epoch": 215} {"train_loss": -7.959219932556152, "global_step": 36248, "epoch": 215} {"train_loss": -8.071381568908691, "global_step": 36249, "epoch": 215} {"train_loss": -7.742278575897217, "global_step": 36250, "epoch": 215} {"train_loss": -8.074593544006348, "global_step": 36251, "epoch": 215} {"train_loss": -7.952231407165527, "global_step": 36252, "epoch": 215} {"train_loss": -8.03231430053711, "global_step": 36253, "epoch": 215} {"train_loss": -7.912101745605469, "global_step": 36254, "epoch": 215} {"train_loss": -7.931180477142334, "global_step": 36255, "epoch": 215} {"train_loss": -8.020163536071777, "global_step": 36256, "epoch": 215} {"train_loss": -8.094897270202637, "global_step": 36257, "epoch": 215} {"train_loss": -7.872689247131348, "global_step": 36258, "epoch": 215} {"train_loss": -7.731454849243164, "global_step": 36259, "epoch": 215} {"train_loss": -7.885472297668457, "global_step": 36260, "epoch": 215} {"train_loss": -7.858484745025635, "global_step": 36261, "epoch": 215} {"train_loss": -7.742197036743164, "global_step": 36262, "epoch": 215} {"train_loss": -7.951052665710449, "global_step": 36263, "epoch": 215} {"train_loss": -7.735864639282227, "global_step": 36264, "epoch": 215} {"train_loss": -7.927921295166016, "global_step": 36265, "epoch": 215} {"train_loss": -7.866395950317383, "global_step": 36266, "epoch": 215} {"train_loss": -7.646048545837402, "global_step": 36267, "epoch": 215} {"train_loss": -7.782122611999512, "global_step": 36268, "epoch": 215} {"train_loss": -7.795660018920898, "global_step": 36269, "epoch": 215} {"train_loss": -7.971196174621582, "global_step": 36270, "epoch": 215} {"train_loss": -7.634484767913818, "global_step": 36271, "epoch": 215} {"train_loss": -7.913654327392578, "global_step": 36272, "epoch": 215} {"train_loss": -7.5305376052856445, "global_step": 36273, "epoch": 215} {"train_loss": -7.615373611450195, "global_step": 36274, "epoch": 215} {"train_loss": -7.6622114181518555, "global_step": 36275, "epoch": 215} {"train_loss": -7.8532280921936035, "global_step": 36276, "epoch": 215} {"train_loss": -7.724339008331299, "global_step": 36277, "epoch": 215} {"train_loss": -7.77821683883667, "global_step": 36278, "epoch": 215} {"train_loss": -7.506257057189941, "global_step": 36279, "epoch": 215} {"train_loss": -7.482484340667725, "global_step": 36280, "epoch": 215} {"train_loss": -7.629815101623535, "global_step": 36281, "epoch": 215} {"train_loss": -7.745096206665039, "global_step": 36282, "epoch": 215} {"train_loss": -7.786198616027832, "global_step": 36283, "epoch": 215} {"train_loss": -7.639303207397461, "global_step": 36284, "epoch": 215} {"train_loss": -7.575592517852783, "global_step": 36285, "epoch": 215} {"train_loss": -7.615140914916992, "global_step": 36286, "epoch": 215} {"train_loss": -7.763981106735411, "global_step": 36287, "epoch": 215, "val_loss": 186525.765625, "train_action_mse_error": 9.46711540222168} {"train_loss": -7.4738993644714355, "global_step": 36288, "epoch": 216} {"train_loss": -7.567434787750244, "global_step": 36289, "epoch": 216} {"train_loss": -7.624846458435059, "global_step": 36290, "epoch": 216} {"train_loss": -7.7593183517456055, "global_step": 36291, "epoch": 216} {"train_loss": -7.731945037841797, "global_step": 36292, "epoch": 216} {"train_loss": -7.945234298706055, "global_step": 36293, "epoch": 216} {"train_loss": -7.848258972167969, "global_step": 36294, "epoch": 216} {"train_loss": -7.93703556060791, "global_step": 36295, "epoch": 216} {"train_loss": -7.823712348937988, "global_step": 36296, "epoch": 216} {"train_loss": -7.977878570556641, "global_step": 36297, "epoch": 216} {"train_loss": -7.794677734375, "global_step": 36298, "epoch": 216} {"train_loss": -7.80696964263916, "global_step": 36299, "epoch": 216} {"train_loss": -7.891848564147949, "global_step": 36300, "epoch": 216} {"train_loss": -7.726613998413086, "global_step": 36301, "epoch": 216} {"train_loss": -7.976874828338623, "global_step": 36302, "epoch": 216} {"train_loss": -7.8192291259765625, "global_step": 36303, "epoch": 216} {"train_loss": -7.9948883056640625, "global_step": 36304, "epoch": 216} {"train_loss": -7.599835395812988, "global_step": 36305, "epoch": 216} {"train_loss": -7.679032325744629, "global_step": 36306, "epoch": 216} {"train_loss": -7.663494110107422, "global_step": 36307, "epoch": 216} {"train_loss": -7.797065258026123, "global_step": 36308, "epoch": 216} {"train_loss": -7.907118797302246, "global_step": 36309, "epoch": 216} {"train_loss": -7.761906147003174, "global_step": 36310, "epoch": 216} {"train_loss": -7.883127689361572, "global_step": 36311, "epoch": 216} {"train_loss": -7.608636856079102, "global_step": 36312, "epoch": 216} {"train_loss": -7.644496917724609, "global_step": 36313, "epoch": 216} {"train_loss": -7.816819190979004, "global_step": 36314, "epoch": 216} {"train_loss": -7.724427223205566, "global_step": 36315, "epoch": 216} {"train_loss": -7.939937591552734, "global_step": 36316, "epoch": 216} {"train_loss": -7.8748459815979, "global_step": 36317, "epoch": 216} {"train_loss": -7.609506607055664, "global_step": 36318, "epoch": 216} {"train_loss": -7.692370891571045, "global_step": 36319, "epoch": 216} {"train_loss": -7.764093399047852, "global_step": 36320, "epoch": 216} {"train_loss": -7.664397239685059, "global_step": 36321, "epoch": 216} {"train_loss": -7.72014856338501, "global_step": 36322, "epoch": 216} {"train_loss": -7.761987209320068, "global_step": 36323, "epoch": 216} {"train_loss": -7.79611349105835, "global_step": 36324, "epoch": 216} {"train_loss": -7.837701320648193, "global_step": 36325, "epoch": 216} {"train_loss": -7.884725570678711, "global_step": 36326, "epoch": 216} {"train_loss": -7.683315277099609, "global_step": 36327, "epoch": 216} {"train_loss": -7.63064432144165, "global_step": 36328, "epoch": 216} {"train_loss": -7.814873695373535, "global_step": 36329, "epoch": 216} {"train_loss": -7.90708589553833, "global_step": 36330, "epoch": 216} {"train_loss": -7.739386558532715, "global_step": 36331, "epoch": 216} {"train_loss": -7.689430236816406, "global_step": 36332, "epoch": 216} {"train_loss": -7.628717422485352, "global_step": 36333, "epoch": 216} {"train_loss": -7.810918807983398, "global_step": 36334, "epoch": 216} {"train_loss": -7.417605400085449, "global_step": 36335, "epoch": 216} {"train_loss": -7.812031269073486, "global_step": 36336, "epoch": 216} {"train_loss": -7.696664810180664, "global_step": 36337, "epoch": 216} {"train_loss": -7.637117385864258, "global_step": 36338, "epoch": 216} {"train_loss": -7.452019691467285, "global_step": 36339, "epoch": 216} {"train_loss": -7.744011878967285, "global_step": 36340, "epoch": 216} {"train_loss": -7.780933380126953, "global_step": 36341, "epoch": 216} {"train_loss": -7.625779151916504, "global_step": 36342, "epoch": 216} {"train_loss": -7.908811092376709, "global_step": 36343, "epoch": 216} {"train_loss": -7.87769889831543, "global_step": 36344, "epoch": 216} {"train_loss": -7.745760917663574, "global_step": 36345, "epoch": 216} {"train_loss": -7.998875617980957, "global_step": 36346, "epoch": 216} {"train_loss": -7.916318893432617, "global_step": 36347, "epoch": 216} {"train_loss": -7.792723178863525, "global_step": 36348, "epoch": 216} {"train_loss": -7.7113847732543945, "global_step": 36349, "epoch": 216} {"train_loss": -7.620941162109375, "global_step": 36350, "epoch": 216} {"train_loss": -7.449991226196289, "global_step": 36351, "epoch": 216} {"train_loss": -7.893777370452881, "global_step": 36352, "epoch": 216} {"train_loss": -7.737215995788574, "global_step": 36353, "epoch": 216} {"train_loss": -7.843147277832031, "global_step": 36354, "epoch": 216} {"train_loss": -7.66843318939209, "global_step": 36355, "epoch": 216} {"train_loss": -7.704139709472656, "global_step": 36356, "epoch": 216} {"train_loss": -7.720527648925781, "global_step": 36357, "epoch": 216} {"train_loss": -7.840372562408447, "global_step": 36358, "epoch": 216} {"train_loss": -7.632083892822266, "global_step": 36359, "epoch": 216} {"train_loss": -7.7689433097839355, "global_step": 36360, "epoch": 216} {"train_loss": -7.924459934234619, "global_step": 36361, "epoch": 216} {"train_loss": -7.780545234680176, "global_step": 36362, "epoch": 216} {"train_loss": -7.787843227386475, "global_step": 36363, "epoch": 216} {"train_loss": -7.977208137512207, "global_step": 36364, "epoch": 216} {"train_loss": -7.975621700286865, "global_step": 36365, "epoch": 216} {"train_loss": -7.5221757888793945, "global_step": 36366, "epoch": 216} {"train_loss": -7.717255592346191, "global_step": 36367, "epoch": 216} {"train_loss": -8.010480880737305, "global_step": 36368, "epoch": 216} {"train_loss": -7.725396156311035, "global_step": 36369, "epoch": 216} {"train_loss": -7.782406806945801, "global_step": 36370, "epoch": 216} {"train_loss": -7.971814155578613, "global_step": 36371, "epoch": 216} {"train_loss": -7.927788257598877, "global_step": 36372, "epoch": 216} {"train_loss": -7.845847129821777, "global_step": 36373, "epoch": 216} {"train_loss": -7.756110191345215, "global_step": 36374, "epoch": 216} {"train_loss": -7.754206657409668, "global_step": 36375, "epoch": 216} {"train_loss": -7.735779285430908, "global_step": 36376, "epoch": 216} {"train_loss": -7.511533737182617, "global_step": 36377, "epoch": 216} {"train_loss": -7.669252395629883, "global_step": 36378, "epoch": 216} {"train_loss": -7.560659885406494, "global_step": 36379, "epoch": 216} {"train_loss": -7.528112411499023, "global_step": 36380, "epoch": 216} {"train_loss": -7.521686553955078, "global_step": 36381, "epoch": 216} {"train_loss": -7.797542572021484, "global_step": 36382, "epoch": 216} {"train_loss": -7.644078254699707, "global_step": 36383, "epoch": 216} {"train_loss": -7.877587795257568, "global_step": 36384, "epoch": 216} {"train_loss": -7.937454700469971, "global_step": 36385, "epoch": 216} {"train_loss": -7.796897888183594, "global_step": 36386, "epoch": 216} {"train_loss": -7.841874599456787, "global_step": 36387, "epoch": 216} {"train_loss": -7.84235143661499, "global_step": 36388, "epoch": 216} {"train_loss": -7.795893669128418, "global_step": 36389, "epoch": 216} {"train_loss": -7.899899005889893, "global_step": 36390, "epoch": 216} {"train_loss": -7.555146217346191, "global_step": 36391, "epoch": 216} {"train_loss": -7.832548141479492, "global_step": 36392, "epoch": 216} {"train_loss": -7.372271537780762, "global_step": 36393, "epoch": 216} {"train_loss": -7.625887393951416, "global_step": 36394, "epoch": 216} {"train_loss": -7.564998626708984, "global_step": 36395, "epoch": 216} {"train_loss": -7.560727119445801, "global_step": 36396, "epoch": 216} {"train_loss": -7.649953842163086, "global_step": 36397, "epoch": 216} {"train_loss": -7.510210037231445, "global_step": 36398, "epoch": 216} {"train_loss": -7.877704620361328, "global_step": 36399, "epoch": 216} {"train_loss": -7.585244178771973, "global_step": 36400, "epoch": 216} {"train_loss": -7.723755359649658, "global_step": 36401, "epoch": 216} {"train_loss": -7.70905065536499, "global_step": 36402, "epoch": 216} {"train_loss": -7.6524810791015625, "global_step": 36403, "epoch": 216} {"train_loss": -7.661153316497803, "global_step": 36404, "epoch": 216} {"train_loss": -7.795000076293945, "global_step": 36405, "epoch": 216} {"train_loss": -7.787359237670898, "global_step": 36406, "epoch": 216} {"train_loss": -7.855319023132324, "global_step": 36407, "epoch": 216} {"train_loss": -7.607885837554932, "global_step": 36408, "epoch": 216} {"train_loss": -7.875846862792969, "global_step": 36409, "epoch": 216} {"train_loss": -7.642531394958496, "global_step": 36410, "epoch": 216} {"train_loss": -7.517469882965088, "global_step": 36411, "epoch": 216} {"train_loss": -7.726359844207764, "global_step": 36412, "epoch": 216} {"train_loss": -7.581916809082031, "global_step": 36413, "epoch": 216} {"train_loss": -7.408759117126465, "global_step": 36414, "epoch": 216} {"train_loss": -7.738304615020752, "global_step": 36415, "epoch": 216} {"train_loss": -7.727438926696777, "global_step": 36416, "epoch": 216} {"train_loss": -7.5651679039001465, "global_step": 36417, "epoch": 216} {"train_loss": -7.792880535125732, "global_step": 36418, "epoch": 216} {"train_loss": -7.9447126388549805, "global_step": 36419, "epoch": 216} {"train_loss": -7.633989334106445, "global_step": 36420, "epoch": 216} {"train_loss": -7.589860916137695, "global_step": 36421, "epoch": 216} {"train_loss": -7.868697643280029, "global_step": 36422, "epoch": 216} {"train_loss": -7.855504512786865, "global_step": 36423, "epoch": 216} {"train_loss": -7.6804399490356445, "global_step": 36424, "epoch": 216} {"train_loss": -7.950109958648682, "global_step": 36425, "epoch": 216} {"train_loss": -8.023711204528809, "global_step": 36426, "epoch": 216} {"train_loss": -7.8283843994140625, "global_step": 36427, "epoch": 216} {"train_loss": -7.845979690551758, "global_step": 36428, "epoch": 216} {"train_loss": -8.09323501586914, "global_step": 36429, "epoch": 216} {"train_loss": -8.0382080078125, "global_step": 36430, "epoch": 216} {"train_loss": -7.95436954498291, "global_step": 36431, "epoch": 216} {"train_loss": -8.01685905456543, "global_step": 36432, "epoch": 216} {"train_loss": -8.044139862060547, "global_step": 36433, "epoch": 216} {"train_loss": -8.005399703979492, "global_step": 36434, "epoch": 216} {"train_loss": -7.934067726135254, "global_step": 36435, "epoch": 216} {"train_loss": -7.7560858726501465, "global_step": 36436, "epoch": 216} {"train_loss": -7.701089859008789, "global_step": 36437, "epoch": 216} {"train_loss": -7.96673583984375, "global_step": 36438, "epoch": 216} {"train_loss": -7.285392761230469, "global_step": 36439, "epoch": 216} {"train_loss": -8.006396293640137, "global_step": 36440, "epoch": 216} {"train_loss": -7.523510932922363, "global_step": 36441, "epoch": 216} {"train_loss": -7.969898223876953, "global_step": 36442, "epoch": 216} {"train_loss": -7.754091739654541, "global_step": 36443, "epoch": 216} {"train_loss": -8.079694747924805, "global_step": 36444, "epoch": 216} {"train_loss": -7.858088493347168, "global_step": 36445, "epoch": 216} {"train_loss": -7.678442001342773, "global_step": 36446, "epoch": 216} {"train_loss": -7.69180965423584, "global_step": 36447, "epoch": 216} {"train_loss": -7.743391990661621, "global_step": 36448, "epoch": 216} {"train_loss": -7.744043350219727, "global_step": 36449, "epoch": 216} {"train_loss": -7.959049224853516, "global_step": 36450, "epoch": 216} {"train_loss": -7.591423511505127, "global_step": 36451, "epoch": 216} {"train_loss": -7.851816177368164, "global_step": 36452, "epoch": 216} {"train_loss": -7.811150550842285, "global_step": 36453, "epoch": 216} {"train_loss": -7.713239669799805, "global_step": 36454, "epoch": 216} {"train_loss": -7.761531687918163, "global_step": 36455, "epoch": 216, "val_loss": 183437.0625} {"train_loss": -7.779479026794434, "global_step": 36456, "epoch": 217} {"train_loss": -8.23173999786377, "global_step": 36457, "epoch": 217} {"train_loss": -8.038509368896484, "global_step": 36458, "epoch": 217} {"train_loss": -7.891678810119629, "global_step": 36459, "epoch": 217} {"train_loss": -7.636828422546387, "global_step": 36460, "epoch": 217} {"train_loss": -7.916422367095947, "global_step": 36461, "epoch": 217} {"train_loss": -7.998307704925537, "global_step": 36462, "epoch": 217} {"train_loss": -7.900474548339844, "global_step": 36463, "epoch": 217} {"train_loss": -8.034968376159668, "global_step": 36464, "epoch": 217} {"train_loss": -7.963647842407227, "global_step": 36465, "epoch": 217} {"train_loss": -7.755702495574951, "global_step": 36466, "epoch": 217} {"train_loss": -7.969356536865234, "global_step": 36467, "epoch": 217} {"train_loss": -7.9860944747924805, "global_step": 36468, "epoch": 217} {"train_loss": -7.9144134521484375, "global_step": 36469, "epoch": 217} {"train_loss": -7.746777534484863, "global_step": 36470, "epoch": 217} {"train_loss": -7.716376304626465, "global_step": 36471, "epoch": 217} {"train_loss": -7.6671342849731445, "global_step": 36472, "epoch": 217} {"train_loss": -7.9826436042785645, "global_step": 36473, "epoch": 217} {"train_loss": -7.087602138519287, "global_step": 36474, "epoch": 217} {"train_loss": -7.135185241699219, "global_step": 36475, "epoch": 217} {"train_loss": -7.495694637298584, "global_step": 36476, "epoch": 217} {"train_loss": -7.330190658569336, "global_step": 36477, "epoch": 217} {"train_loss": -7.481210708618164, "global_step": 36478, "epoch": 217} {"train_loss": -7.151131629943848, "global_step": 36479, "epoch": 217} {"train_loss": -7.751817226409912, "global_step": 36480, "epoch": 217} {"train_loss": -7.100881576538086, "global_step": 36481, "epoch": 217} {"train_loss": -7.456730842590332, "global_step": 36482, "epoch": 217} {"train_loss": -7.546958923339844, "global_step": 36483, "epoch": 217} {"train_loss": -7.389996528625488, "global_step": 36484, "epoch": 217} {"train_loss": -7.265515327453613, "global_step": 36485, "epoch": 217} {"train_loss": -7.313749313354492, "global_step": 36486, "epoch": 217} {"train_loss": -7.6612629890441895, "global_step": 36487, "epoch": 217} {"train_loss": -7.3405351638793945, "global_step": 36488, "epoch": 217} {"train_loss": -7.351268768310547, "global_step": 36489, "epoch": 217} {"train_loss": -7.601778984069824, "global_step": 36490, "epoch": 217} {"train_loss": -7.790299415588379, "global_step": 36491, "epoch": 217} {"train_loss": -7.3213396072387695, "global_step": 36492, "epoch": 217} {"train_loss": -7.768764019012451, "global_step": 36493, "epoch": 217} {"train_loss": -7.634875297546387, "global_step": 36494, "epoch": 217} {"train_loss": -7.673579216003418, "global_step": 36495, "epoch": 217} {"train_loss": -7.548549175262451, "global_step": 36496, "epoch": 217} {"train_loss": -7.863413333892822, "global_step": 36497, "epoch": 217} {"train_loss": -7.857188701629639, "global_step": 36498, "epoch": 217} {"train_loss": -7.719351291656494, "global_step": 36499, "epoch": 217} {"train_loss": -7.789823055267334, "global_step": 36500, "epoch": 217} {"train_loss": -7.712503433227539, "global_step": 36501, "epoch": 217} {"train_loss": -7.668464183807373, "global_step": 36502, "epoch": 217} {"train_loss": -7.937873363494873, "global_step": 36503, "epoch": 217} {"train_loss": -7.876628875732422, "global_step": 36504, "epoch": 217} {"train_loss": -7.662755012512207, "global_step": 36505, "epoch": 217} {"train_loss": -7.941991806030273, "global_step": 36506, "epoch": 217} {"train_loss": -7.718992710113525, "global_step": 36507, "epoch": 217} {"train_loss": -7.784219264984131, "global_step": 36508, "epoch": 217} {"train_loss": -7.879108905792236, "global_step": 36509, "epoch": 217} {"train_loss": -7.934441566467285, "global_step": 36510, "epoch": 217} {"train_loss": -8.078861236572266, "global_step": 36511, "epoch": 217} {"train_loss": -7.608809471130371, "global_step": 36512, "epoch": 217} {"train_loss": -8.220061302185059, "global_step": 36513, "epoch": 217} {"train_loss": -7.656230926513672, "global_step": 36514, "epoch": 217} {"train_loss": -8.028244018554688, "global_step": 36515, "epoch": 217} {"train_loss": -7.8037872314453125, "global_step": 36516, "epoch": 217} {"train_loss": -8.012219429016113, "global_step": 36517, "epoch": 217} {"train_loss": -7.796380043029785, "global_step": 36518, "epoch": 217} {"train_loss": -7.952218055725098, "global_step": 36519, "epoch": 217} {"train_loss": -7.8459672927856445, "global_step": 36520, "epoch": 217} {"train_loss": -7.900384426116943, "global_step": 36521, "epoch": 217} {"train_loss": -7.924766540527344, "global_step": 36522, "epoch": 217} {"train_loss": -7.798490524291992, "global_step": 36523, "epoch": 217} {"train_loss": -7.880187034606934, "global_step": 36524, "epoch": 217} {"train_loss": -7.875343322753906, "global_step": 36525, "epoch": 217} {"train_loss": -7.69731330871582, "global_step": 36526, "epoch": 217} {"train_loss": -7.857744216918945, "global_step": 36527, "epoch": 217} {"train_loss": -7.652151107788086, "global_step": 36528, "epoch": 217} {"train_loss": -7.739405632019043, "global_step": 36529, "epoch": 217} {"train_loss": -7.320091247558594, "global_step": 36530, "epoch": 217} {"train_loss": -7.774365425109863, "global_step": 36531, "epoch": 217} {"train_loss": -7.681385040283203, "global_step": 36532, "epoch": 217} {"train_loss": -7.788464546203613, "global_step": 36533, "epoch": 217} {"train_loss": -7.5063958168029785, "global_step": 36534, "epoch": 217} {"train_loss": -7.699029922485352, "global_step": 36535, "epoch": 217} {"train_loss": -7.70192813873291, "global_step": 36536, "epoch": 217} {"train_loss": -8.076663970947266, "global_step": 36537, "epoch": 217} {"train_loss": -7.884345054626465, "global_step": 36538, "epoch": 217} {"train_loss": -7.78177547454834, "global_step": 36539, "epoch": 217} {"train_loss": -7.850078582763672, "global_step": 36540, "epoch": 217} {"train_loss": -7.83416748046875, "global_step": 36541, "epoch": 217} {"train_loss": -8.05852222442627, "global_step": 36542, "epoch": 217} {"train_loss": -7.908933639526367, "global_step": 36543, "epoch": 217} {"train_loss": -7.822247505187988, "global_step": 36544, "epoch": 217} {"train_loss": -7.908092498779297, "global_step": 36545, "epoch": 217} {"train_loss": -7.962594032287598, "global_step": 36546, "epoch": 217} {"train_loss": -7.808746337890625, "global_step": 36547, "epoch": 217} {"train_loss": -7.847670555114746, "global_step": 36548, "epoch": 217} {"train_loss": -7.810681343078613, "global_step": 36549, "epoch": 217} {"train_loss": -7.968358993530273, "global_step": 36550, "epoch": 217} {"train_loss": -7.875249862670898, "global_step": 36551, "epoch": 217} {"train_loss": -8.027863502502441, "global_step": 36552, "epoch": 217} {"train_loss": -7.928595542907715, "global_step": 36553, "epoch": 217} {"train_loss": -8.009283065795898, "global_step": 36554, "epoch": 217} {"train_loss": -7.7847514152526855, "global_step": 36555, "epoch": 217} {"train_loss": -7.797728538513184, "global_step": 36556, "epoch": 217} {"train_loss": -7.980720520019531, "global_step": 36557, "epoch": 217} {"train_loss": -7.626151084899902, "global_step": 36558, "epoch": 217} {"train_loss": -8.026092529296875, "global_step": 36559, "epoch": 217} {"train_loss": -7.597799301147461, "global_step": 36560, "epoch": 217} {"train_loss": -7.870518684387207, "global_step": 36561, "epoch": 217} {"train_loss": -7.723299026489258, "global_step": 36562, "epoch": 217} {"train_loss": -8.010248184204102, "global_step": 36563, "epoch": 217} {"train_loss": -7.66765022277832, "global_step": 36564, "epoch": 217} {"train_loss": -7.864999771118164, "global_step": 36565, "epoch": 217} {"train_loss": -7.90447998046875, "global_step": 36566, "epoch": 217} {"train_loss": -7.901787757873535, "global_step": 36567, "epoch": 217} {"train_loss": -7.81506872177124, "global_step": 36568, "epoch": 217} {"train_loss": -8.017436981201172, "global_step": 36569, "epoch": 217} {"train_loss": -7.799636363983154, "global_step": 36570, "epoch": 217} {"train_loss": -7.766808986663818, "global_step": 36571, "epoch": 217} {"train_loss": -7.8247761726379395, "global_step": 36572, "epoch": 217} {"train_loss": -7.883295059204102, "global_step": 36573, "epoch": 217} {"train_loss": -7.873987197875977, "global_step": 36574, "epoch": 217} {"train_loss": -7.675039291381836, "global_step": 36575, "epoch": 217} {"train_loss": -7.7889556884765625, "global_step": 36576, "epoch": 217} {"train_loss": -7.758344650268555, "global_step": 36577, "epoch": 217} {"train_loss": -7.831739902496338, "global_step": 36578, "epoch": 217} {"train_loss": -7.66895055770874, "global_step": 36579, "epoch": 217} {"train_loss": -7.701339244842529, "global_step": 36580, "epoch": 217} {"train_loss": -7.958873748779297, "global_step": 36581, "epoch": 217} {"train_loss": -7.510295391082764, "global_step": 36582, "epoch": 217} {"train_loss": -7.676948547363281, "global_step": 36583, "epoch": 217} {"train_loss": -7.663369178771973, "global_step": 36584, "epoch": 217} {"train_loss": -8.074335098266602, "global_step": 36585, "epoch": 217} {"train_loss": -7.753993988037109, "global_step": 36586, "epoch": 217} {"train_loss": -7.864224433898926, "global_step": 36587, "epoch": 217} {"train_loss": -7.8230743408203125, "global_step": 36588, "epoch": 217} {"train_loss": -7.752932071685791, "global_step": 36589, "epoch": 217} {"train_loss": -7.6835479736328125, "global_step": 36590, "epoch": 217} {"train_loss": -7.962669372558594, "global_step": 36591, "epoch": 217} {"train_loss": -7.885056018829346, "global_step": 36592, "epoch": 217} {"train_loss": -7.909373760223389, "global_step": 36593, "epoch": 217} {"train_loss": -7.791622161865234, "global_step": 36594, "epoch": 217} {"train_loss": -7.527961254119873, "global_step": 36595, "epoch": 217} {"train_loss": -7.635690689086914, "global_step": 36596, "epoch": 217} {"train_loss": -7.678356647491455, "global_step": 36597, "epoch": 217} {"train_loss": -7.756340980529785, "global_step": 36598, "epoch": 217} {"train_loss": -7.531418800354004, "global_step": 36599, "epoch": 217} {"train_loss": -7.93903112411499, "global_step": 36600, "epoch": 217} {"train_loss": -7.730828285217285, "global_step": 36601, "epoch": 217} {"train_loss": -7.7194647789001465, "global_step": 36602, "epoch": 217} {"train_loss": -7.970257759094238, "global_step": 36603, "epoch": 217} {"train_loss": -7.917232513427734, "global_step": 36604, "epoch": 217} {"train_loss": -7.820363521575928, "global_step": 36605, "epoch": 217} {"train_loss": -8.068887710571289, "global_step": 36606, "epoch": 217} {"train_loss": -7.772428035736084, "global_step": 36607, "epoch": 217} {"train_loss": -7.831042289733887, "global_step": 36608, "epoch": 217} {"train_loss": -7.767068862915039, "global_step": 36609, "epoch": 217} {"train_loss": -7.887505054473877, "global_step": 36610, "epoch": 217} {"train_loss": -7.820674419403076, "global_step": 36611, "epoch": 217} {"train_loss": -7.916791915893555, "global_step": 36612, "epoch": 217} {"train_loss": -7.914752006530762, "global_step": 36613, "epoch": 217} {"train_loss": -7.4033331871032715, "global_step": 36614, "epoch": 217} {"train_loss": -8.011903762817383, "global_step": 36615, "epoch": 217} {"train_loss": -7.602222442626953, "global_step": 36616, "epoch": 217} {"train_loss": -7.820468902587891, "global_step": 36617, "epoch": 217} {"train_loss": -7.6686811447143555, "global_step": 36618, "epoch": 217} {"train_loss": -7.605488300323486, "global_step": 36619, "epoch": 217} {"train_loss": -7.612483978271484, "global_step": 36620, "epoch": 217} {"train_loss": -7.426805019378662, "global_step": 36621, "epoch": 217} {"train_loss": -7.9206953048706055, "global_step": 36622, "epoch": 217} {"train_loss": -7.768559478578114, "global_step": 36623, "epoch": 217, "val_loss": 185140.78125} {"train_loss": -7.667832374572754, "global_step": 36624, "epoch": 218} {"train_loss": -7.604554653167725, "global_step": 36625, "epoch": 218} {"train_loss": -7.433953285217285, "global_step": 36626, "epoch": 218} {"train_loss": -7.840635299682617, "global_step": 36627, "epoch": 218} {"train_loss": -7.554172992706299, "global_step": 36628, "epoch": 218} {"train_loss": -7.665422439575195, "global_step": 36629, "epoch": 218} {"train_loss": -7.7602338790893555, "global_step": 36630, "epoch": 218} {"train_loss": -7.669321537017822, "global_step": 36631, "epoch": 218} {"train_loss": -7.754097938537598, "global_step": 36632, "epoch": 218} {"train_loss": -7.7167253494262695, "global_step": 36633, "epoch": 218} {"train_loss": -7.935042858123779, "global_step": 36634, "epoch": 218} {"train_loss": -7.873361587524414, "global_step": 36635, "epoch": 218} {"train_loss": -7.6244611740112305, "global_step": 36636, "epoch": 218} {"train_loss": -7.868419647216797, "global_step": 36637, "epoch": 218} {"train_loss": -7.736680030822754, "global_step": 36638, "epoch": 218} {"train_loss": -7.722112655639648, "global_step": 36639, "epoch": 218} {"train_loss": -7.668893337249756, "global_step": 36640, "epoch": 218} {"train_loss": -7.904024124145508, "global_step": 36641, "epoch": 218} {"train_loss": -7.9074506759643555, "global_step": 36642, "epoch": 218} {"train_loss": -7.749373435974121, "global_step": 36643, "epoch": 218} {"train_loss": -7.620937824249268, "global_step": 36644, "epoch": 218} {"train_loss": -7.876889228820801, "global_step": 36645, "epoch": 218} {"train_loss": -7.5700364112854, "global_step": 36646, "epoch": 218} {"train_loss": -7.754581451416016, "global_step": 36647, "epoch": 218} {"train_loss": -7.892012119293213, "global_step": 36648, "epoch": 218} {"train_loss": -8.02604866027832, "global_step": 36649, "epoch": 218} {"train_loss": -7.761482238769531, "global_step": 36650, "epoch": 218} {"train_loss": -8.043973922729492, "global_step": 36651, "epoch": 218} {"train_loss": -7.9124298095703125, "global_step": 36652, "epoch": 218} {"train_loss": -7.820981025695801, "global_step": 36653, "epoch": 218} {"train_loss": -7.921752452850342, "global_step": 36654, "epoch": 218} {"train_loss": -7.575459957122803, "global_step": 36655, "epoch": 218} {"train_loss": -7.7949323654174805, "global_step": 36656, "epoch": 218} {"train_loss": -7.862936973571777, "global_step": 36657, "epoch": 218} {"train_loss": -7.904621124267578, "global_step": 36658, "epoch": 218} {"train_loss": -7.769050121307373, "global_step": 36659, "epoch": 218} {"train_loss": -8.063774108886719, "global_step": 36660, "epoch": 218} {"train_loss": -8.054632186889648, "global_step": 36661, "epoch": 218} {"train_loss": -7.963479995727539, "global_step": 36662, "epoch": 218} {"train_loss": -7.9480977058410645, "global_step": 36663, "epoch": 218} {"train_loss": -8.010577201843262, "global_step": 36664, "epoch": 218} {"train_loss": -7.786853790283203, "global_step": 36665, "epoch": 218} {"train_loss": -7.900115013122559, "global_step": 36666, "epoch": 218} {"train_loss": -7.757220268249512, "global_step": 36667, "epoch": 218} {"train_loss": -7.772285461425781, "global_step": 36668, "epoch": 218} {"train_loss": -7.517355918884277, "global_step": 36669, "epoch": 218} {"train_loss": -7.704370975494385, "global_step": 36670, "epoch": 218} {"train_loss": -7.758715629577637, "global_step": 36671, "epoch": 218} {"train_loss": -7.687633514404297, "global_step": 36672, "epoch": 218} {"train_loss": -7.743088722229004, "global_step": 36673, "epoch": 218} {"train_loss": -7.493093490600586, "global_step": 36674, "epoch": 218} {"train_loss": -7.516355991363525, "global_step": 36675, "epoch": 218} {"train_loss": -7.923457145690918, "global_step": 36676, "epoch": 218} {"train_loss": -7.539119720458984, "global_step": 36677, "epoch": 218} {"train_loss": -7.362124919891357, "global_step": 36678, "epoch": 218} {"train_loss": -7.822787284851074, "global_step": 36679, "epoch": 218} {"train_loss": -7.6609416007995605, "global_step": 36680, "epoch": 218} {"train_loss": -7.77277946472168, "global_step": 36681, "epoch": 218} {"train_loss": -7.240281581878662, "global_step": 36682, "epoch": 218} {"train_loss": -7.651401519775391, "global_step": 36683, "epoch": 218} {"train_loss": -7.579547882080078, "global_step": 36684, "epoch": 218} {"train_loss": -7.713463306427002, "global_step": 36685, "epoch": 218} {"train_loss": -7.818165302276611, "global_step": 36686, "epoch": 218} {"train_loss": -7.726390361785889, "global_step": 36687, "epoch": 218} {"train_loss": -7.882710933685303, "global_step": 36688, "epoch": 218} {"train_loss": -7.714139938354492, "global_step": 36689, "epoch": 218} {"train_loss": -7.664282321929932, "global_step": 36690, "epoch": 218} {"train_loss": -7.6663103103637695, "global_step": 36691, "epoch": 218} {"train_loss": -7.690196514129639, "global_step": 36692, "epoch": 218} {"train_loss": -7.653837203979492, "global_step": 36693, "epoch": 218} {"train_loss": -7.801835060119629, "global_step": 36694, "epoch": 218} {"train_loss": -7.8750410079956055, "global_step": 36695, "epoch": 218} {"train_loss": -7.681312084197998, "global_step": 36696, "epoch": 218} {"train_loss": -7.97132682800293, "global_step": 36697, "epoch": 218} {"train_loss": -7.713327407836914, "global_step": 36698, "epoch": 218} {"train_loss": -7.721839904785156, "global_step": 36699, "epoch": 218} {"train_loss": -7.907620429992676, "global_step": 36700, "epoch": 218} {"train_loss": -7.714743614196777, "global_step": 36701, "epoch": 218} {"train_loss": -7.6588640213012695, "global_step": 36702, "epoch": 218} {"train_loss": -7.690032482147217, "global_step": 36703, "epoch": 218} {"train_loss": -7.936931610107422, "global_step": 36704, "epoch": 218} {"train_loss": -7.915900707244873, "global_step": 36705, "epoch": 218} {"train_loss": -7.728687286376953, "global_step": 36706, "epoch": 218} {"train_loss": -7.936549186706543, "global_step": 36707, "epoch": 218} {"train_loss": -7.740011215209961, "global_step": 36708, "epoch": 218} {"train_loss": -7.809715270996094, "global_step": 36709, "epoch": 218} {"train_loss": -7.69907283782959, "global_step": 36710, "epoch": 218} {"train_loss": -7.791640281677246, "global_step": 36711, "epoch": 218} {"train_loss": -7.8874616622924805, "global_step": 36712, "epoch": 218} {"train_loss": -8.044678688049316, "global_step": 36713, "epoch": 218} {"train_loss": -7.846948623657227, "global_step": 36714, "epoch": 218} {"train_loss": -7.900934219360352, "global_step": 36715, "epoch": 218} {"train_loss": -7.849713325500488, "global_step": 36716, "epoch": 218} {"train_loss": -7.864253044128418, "global_step": 36717, "epoch": 218} {"train_loss": -7.9126691818237305, "global_step": 36718, "epoch": 218} {"train_loss": -7.602900505065918, "global_step": 36719, "epoch": 218} {"train_loss": -7.863152503967285, "global_step": 36720, "epoch": 218} {"train_loss": -7.846048355102539, "global_step": 36721, "epoch": 218} {"train_loss": -7.902994155883789, "global_step": 36722, "epoch": 218} {"train_loss": -7.902373313903809, "global_step": 36723, "epoch": 218} {"train_loss": -8.063453674316406, "global_step": 36724, "epoch": 218} {"train_loss": -7.820558071136475, "global_step": 36725, "epoch": 218} {"train_loss": -7.8027472496032715, "global_step": 36726, "epoch": 218} {"train_loss": -7.67572021484375, "global_step": 36727, "epoch": 218} {"train_loss": -7.831274509429932, "global_step": 36728, "epoch": 218} {"train_loss": -7.724653244018555, "global_step": 36729, "epoch": 218} {"train_loss": -7.850106716156006, "global_step": 36730, "epoch": 218} {"train_loss": -8.014503479003906, "global_step": 36731, "epoch": 218} {"train_loss": -7.703585147857666, "global_step": 36732, "epoch": 218} {"train_loss": -7.798885345458984, "global_step": 36733, "epoch": 218} {"train_loss": -7.715485572814941, "global_step": 36734, "epoch": 218} {"train_loss": -7.738874912261963, "global_step": 36735, "epoch": 218} {"train_loss": -7.998829364776611, "global_step": 36736, "epoch": 218} {"train_loss": -7.7692365646362305, "global_step": 36737, "epoch": 218} {"train_loss": -7.780417442321777, "global_step": 36738, "epoch": 218} {"train_loss": -7.715653419494629, "global_step": 36739, "epoch": 218} {"train_loss": -7.834778785705566, "global_step": 36740, "epoch": 218} {"train_loss": -7.690793991088867, "global_step": 36741, "epoch": 218} {"train_loss": -7.681192398071289, "global_step": 36742, "epoch": 218} {"train_loss": -7.826251983642578, "global_step": 36743, "epoch": 218} {"train_loss": -7.976739406585693, "global_step": 36744, "epoch": 218} {"train_loss": -7.76561164855957, "global_step": 36745, "epoch": 218} {"train_loss": -7.71060848236084, "global_step": 36746, "epoch": 218} {"train_loss": -7.52392053604126, "global_step": 36747, "epoch": 218} {"train_loss": -7.815779685974121, "global_step": 36748, "epoch": 218} {"train_loss": -7.8247270584106445, "global_step": 36749, "epoch": 218} {"train_loss": -7.7591142654418945, "global_step": 36750, "epoch": 218} {"train_loss": -7.99031925201416, "global_step": 36751, "epoch": 218} {"train_loss": -7.815314292907715, "global_step": 36752, "epoch": 218} {"train_loss": -7.918178558349609, "global_step": 36753, "epoch": 218} {"train_loss": -7.606661796569824, "global_step": 36754, "epoch": 218} {"train_loss": -7.779363632202148, "global_step": 36755, "epoch": 218} {"train_loss": -7.422354221343994, "global_step": 36756, "epoch": 218} {"train_loss": -7.876297950744629, "global_step": 36757, "epoch": 218} {"train_loss": -7.422837257385254, "global_step": 36758, "epoch": 218} {"train_loss": -7.590114593505859, "global_step": 36759, "epoch": 218} {"train_loss": -7.5622334480285645, "global_step": 36760, "epoch": 218} {"train_loss": -7.55963659286499, "global_step": 36761, "epoch": 218} {"train_loss": -7.7058515548706055, "global_step": 36762, "epoch": 218} {"train_loss": -7.450241565704346, "global_step": 36763, "epoch": 218} {"train_loss": -7.672879219055176, "global_step": 36764, "epoch": 218} {"train_loss": -7.364622592926025, "global_step": 36765, "epoch": 218} {"train_loss": -7.758666515350342, "global_step": 36766, "epoch": 218} {"train_loss": -7.5693583488464355, "global_step": 36767, "epoch": 218} {"train_loss": -7.485359191894531, "global_step": 36768, "epoch": 218} {"train_loss": -7.91865348815918, "global_step": 36769, "epoch": 218} {"train_loss": -7.4791388511657715, "global_step": 36770, "epoch": 218} {"train_loss": -7.864518165588379, "global_step": 36771, "epoch": 218} {"train_loss": -7.636312007904053, "global_step": 36772, "epoch": 218} {"train_loss": -7.783729553222656, "global_step": 36773, "epoch": 218} {"train_loss": -7.84346342086792, "global_step": 36774, "epoch": 218} {"train_loss": -7.793505668640137, "global_step": 36775, "epoch": 218} {"train_loss": -7.6342644691467285, "global_step": 36776, "epoch": 218} {"train_loss": -7.803205490112305, "global_step": 36777, "epoch": 218} {"train_loss": -7.933754920959473, "global_step": 36778, "epoch": 218} {"train_loss": -7.582252025604248, "global_step": 36779, "epoch": 218} {"train_loss": -7.813290596008301, "global_step": 36780, "epoch": 218} {"train_loss": -7.8141608238220215, "global_step": 36781, "epoch": 218} {"train_loss": -7.980471611022949, "global_step": 36782, "epoch": 218} {"train_loss": -7.97843074798584, "global_step": 36783, "epoch": 218} {"train_loss": -8.022658348083496, "global_step": 36784, "epoch": 218} {"train_loss": -8.10025405883789, "global_step": 36785, "epoch": 218} {"train_loss": -8.027292251586914, "global_step": 36786, "epoch": 218} {"train_loss": -7.77315616607666, "global_step": 36787, "epoch": 218} {"train_loss": -7.843781471252441, "global_step": 36788, "epoch": 218} {"train_loss": -8.08735466003418, "global_step": 36789, "epoch": 218} {"train_loss": -7.961868762969971, "global_step": 36790, "epoch": 218} {"train_loss": -7.771904880092258, "global_step": 36791, "epoch": 218, "val_loss": 184544.46875} {"train_loss": -7.891690254211426, "global_step": 36792, "epoch": 219} {"train_loss": -7.682713508605957, "global_step": 36793, "epoch": 219} {"train_loss": -7.815540790557861, "global_step": 36794, "epoch": 219} {"train_loss": -7.814038276672363, "global_step": 36795, "epoch": 219} {"train_loss": -7.610674858093262, "global_step": 36796, "epoch": 219} {"train_loss": -7.4633307456970215, "global_step": 36797, "epoch": 219} {"train_loss": -7.740213394165039, "global_step": 36798, "epoch": 219} {"train_loss": -7.682977199554443, "global_step": 36799, "epoch": 219} {"train_loss": -7.610030174255371, "global_step": 36800, "epoch": 219} {"train_loss": -7.659401893615723, "global_step": 36801, "epoch": 219} {"train_loss": -7.7740044593811035, "global_step": 36802, "epoch": 219} {"train_loss": -7.651587963104248, "global_step": 36803, "epoch": 219} {"train_loss": -7.601626396179199, "global_step": 36804, "epoch": 219} {"train_loss": -7.733376502990723, "global_step": 36805, "epoch": 219} {"train_loss": -7.7911224365234375, "global_step": 36806, "epoch": 219} {"train_loss": -7.659567832946777, "global_step": 36807, "epoch": 219} {"train_loss": -7.835052490234375, "global_step": 36808, "epoch": 219} {"train_loss": -7.796258449554443, "global_step": 36809, "epoch": 219} {"train_loss": -7.713314056396484, "global_step": 36810, "epoch": 219} {"train_loss": -7.744048118591309, "global_step": 36811, "epoch": 219} {"train_loss": -7.7157087326049805, "global_step": 36812, "epoch": 219} {"train_loss": -7.633504867553711, "global_step": 36813, "epoch": 219} {"train_loss": -7.970531463623047, "global_step": 36814, "epoch": 219} {"train_loss": -7.980461597442627, "global_step": 36815, "epoch": 219} {"train_loss": -7.979391098022461, "global_step": 36816, "epoch": 219} {"train_loss": -7.807005882263184, "global_step": 36817, "epoch": 219} {"train_loss": -7.799228191375732, "global_step": 36818, "epoch": 219} {"train_loss": -7.7855987548828125, "global_step": 36819, "epoch": 219} {"train_loss": -8.09852409362793, "global_step": 36820, "epoch": 219} {"train_loss": -7.715684413909912, "global_step": 36821, "epoch": 219} {"train_loss": -7.868034362792969, "global_step": 36822, "epoch": 219} {"train_loss": -7.5908708572387695, "global_step": 36823, "epoch": 219} {"train_loss": -7.9209794998168945, "global_step": 36824, "epoch": 219} {"train_loss": -7.699078559875488, "global_step": 36825, "epoch": 219} {"train_loss": -7.93857479095459, "global_step": 36826, "epoch": 219} {"train_loss": -8.05463981628418, "global_step": 36827, "epoch": 219} {"train_loss": -7.844575881958008, "global_step": 36828, "epoch": 219} {"train_loss": -7.851933479309082, "global_step": 36829, "epoch": 219} {"train_loss": -7.892850875854492, "global_step": 36830, "epoch": 219} {"train_loss": -7.751230239868164, "global_step": 36831, "epoch": 219} {"train_loss": -7.88838529586792, "global_step": 36832, "epoch": 219} {"train_loss": -7.777577877044678, "global_step": 36833, "epoch": 219} {"train_loss": -7.641618728637695, "global_step": 36834, "epoch": 219} {"train_loss": -7.898777961730957, "global_step": 36835, "epoch": 219} {"train_loss": -7.894702434539795, "global_step": 36836, "epoch": 219} {"train_loss": -7.89508056640625, "global_step": 36837, "epoch": 219} {"train_loss": -8.052135467529297, "global_step": 36838, "epoch": 219} {"train_loss": -7.83893346786499, "global_step": 36839, "epoch": 219} {"train_loss": -7.8915581703186035, "global_step": 36840, "epoch": 219} {"train_loss": -8.004168510437012, "global_step": 36841, "epoch": 219} {"train_loss": -7.802367210388184, "global_step": 36842, "epoch": 219} {"train_loss": -7.941827297210693, "global_step": 36843, "epoch": 219} {"train_loss": -7.928859233856201, "global_step": 36844, "epoch": 219} {"train_loss": -8.021238327026367, "global_step": 36845, "epoch": 219} {"train_loss": -7.907757759094238, "global_step": 36846, "epoch": 219} {"train_loss": -7.786876678466797, "global_step": 36847, "epoch": 219} {"train_loss": -7.948248863220215, "global_step": 36848, "epoch": 219} {"train_loss": -7.904385089874268, "global_step": 36849, "epoch": 219} {"train_loss": -8.044172286987305, "global_step": 36850, "epoch": 219} {"train_loss": -8.088644027709961, "global_step": 36851, "epoch": 219} {"train_loss": -7.758971214294434, "global_step": 36852, "epoch": 219} {"train_loss": -7.7541046142578125, "global_step": 36853, "epoch": 219} {"train_loss": -7.62031888961792, "global_step": 36854, "epoch": 219} {"train_loss": -7.8323140144348145, "global_step": 36855, "epoch": 219} {"train_loss": -7.565654754638672, "global_step": 36856, "epoch": 219} {"train_loss": -7.923891067504883, "global_step": 36857, "epoch": 219} {"train_loss": -7.644743919372559, "global_step": 36858, "epoch": 219} {"train_loss": -7.738620281219482, "global_step": 36859, "epoch": 219} {"train_loss": -7.526534080505371, "global_step": 36860, "epoch": 219} {"train_loss": -7.772333145141602, "global_step": 36861, "epoch": 219} {"train_loss": -7.252575874328613, "global_step": 36862, "epoch": 219} {"train_loss": -7.705643653869629, "global_step": 36863, "epoch": 219} {"train_loss": -7.546416282653809, "global_step": 36864, "epoch": 219} {"train_loss": -7.348901271820068, "global_step": 36865, "epoch": 219} {"train_loss": -7.999991416931152, "global_step": 36866, "epoch": 219} {"train_loss": -7.4229536056518555, "global_step": 36867, "epoch": 219} {"train_loss": -7.704253196716309, "global_step": 36868, "epoch": 219} {"train_loss": -7.671960830688477, "global_step": 36869, "epoch": 219} {"train_loss": -7.842063903808594, "global_step": 36870, "epoch": 219} {"train_loss": -7.682246208190918, "global_step": 36871, "epoch": 219} {"train_loss": -7.801140785217285, "global_step": 36872, "epoch": 219} {"train_loss": -7.747104167938232, "global_step": 36873, "epoch": 219} {"train_loss": -7.9483842849731445, "global_step": 36874, "epoch": 219} {"train_loss": -7.819409370422363, "global_step": 36875, "epoch": 219} {"train_loss": -7.756972312927246, "global_step": 36876, "epoch": 219} {"train_loss": -7.732770919799805, "global_step": 36877, "epoch": 219} {"train_loss": -7.818783760070801, "global_step": 36878, "epoch": 219} {"train_loss": -7.893228054046631, "global_step": 36879, "epoch": 219} {"train_loss": -7.9774580001831055, "global_step": 36880, "epoch": 219} {"train_loss": -7.994452953338623, "global_step": 36881, "epoch": 219} {"train_loss": -7.773423194885254, "global_step": 36882, "epoch": 219} {"train_loss": -7.679714202880859, "global_step": 36883, "epoch": 219} {"train_loss": -7.9006500244140625, "global_step": 36884, "epoch": 219} {"train_loss": -7.835218906402588, "global_step": 36885, "epoch": 219} {"train_loss": -7.812936305999756, "global_step": 36886, "epoch": 219} {"train_loss": -7.6534881591796875, "global_step": 36887, "epoch": 219} {"train_loss": -7.818359851837158, "global_step": 36888, "epoch": 219} {"train_loss": -7.182883262634277, "global_step": 36889, "epoch": 219} {"train_loss": -7.803208351135254, "global_step": 36890, "epoch": 219} {"train_loss": -7.623401641845703, "global_step": 36891, "epoch": 219} {"train_loss": -7.700832843780518, "global_step": 36892, "epoch": 219} {"train_loss": -7.738345623016357, "global_step": 36893, "epoch": 219} {"train_loss": -7.723062992095947, "global_step": 36894, "epoch": 219} {"train_loss": -7.897017955780029, "global_step": 36895, "epoch": 219} {"train_loss": -7.835275650024414, "global_step": 36896, "epoch": 219} {"train_loss": -7.7450103759765625, "global_step": 36897, "epoch": 219} {"train_loss": -7.708011627197266, "global_step": 36898, "epoch": 219} {"train_loss": -7.79421854019165, "global_step": 36899, "epoch": 219} {"train_loss": -8.038461685180664, "global_step": 36900, "epoch": 219} {"train_loss": -7.7746992111206055, "global_step": 36901, "epoch": 219} {"train_loss": -7.862468242645264, "global_step": 36902, "epoch": 219} {"train_loss": -7.663928985595703, "global_step": 36903, "epoch": 219} {"train_loss": -7.860459327697754, "global_step": 36904, "epoch": 219} {"train_loss": -7.695987701416016, "global_step": 36905, "epoch": 219} {"train_loss": -7.858598709106445, "global_step": 36906, "epoch": 219} {"train_loss": -7.8695526123046875, "global_step": 36907, "epoch": 219} {"train_loss": -7.796722412109375, "global_step": 36908, "epoch": 219} {"train_loss": -7.864586353302002, "global_step": 36909, "epoch": 219} {"train_loss": -7.878986358642578, "global_step": 36910, "epoch": 219} {"train_loss": -7.9133758544921875, "global_step": 36911, "epoch": 219} {"train_loss": -7.907473564147949, "global_step": 36912, "epoch": 219} {"train_loss": -7.833423137664795, "global_step": 36913, "epoch": 219} {"train_loss": -7.750410079956055, "global_step": 36914, "epoch": 219} {"train_loss": -7.692736625671387, "global_step": 36915, "epoch": 219} {"train_loss": -7.863458633422852, "global_step": 36916, "epoch": 219} {"train_loss": -7.965885162353516, "global_step": 36917, "epoch": 219} {"train_loss": -8.06617546081543, "global_step": 36918, "epoch": 219} {"train_loss": -8.053271293640137, "global_step": 36919, "epoch": 219} {"train_loss": -7.871315002441406, "global_step": 36920, "epoch": 219} {"train_loss": -8.012899398803711, "global_step": 36921, "epoch": 219} {"train_loss": -7.677588939666748, "global_step": 36922, "epoch": 219} {"train_loss": -7.722775459289551, "global_step": 36923, "epoch": 219} {"train_loss": -7.956645488739014, "global_step": 36924, "epoch": 219} {"train_loss": -7.88372278213501, "global_step": 36925, "epoch": 219} {"train_loss": -7.842350959777832, "global_step": 36926, "epoch": 219} {"train_loss": -8.001349449157715, "global_step": 36927, "epoch": 219} {"train_loss": -7.777374267578125, "global_step": 36928, "epoch": 219} {"train_loss": -7.887679576873779, "global_step": 36929, "epoch": 219} {"train_loss": -7.648203372955322, "global_step": 36930, "epoch": 219} {"train_loss": -7.956499099731445, "global_step": 36931, "epoch": 219} {"train_loss": -7.73128604888916, "global_step": 36932, "epoch": 219} {"train_loss": -7.878841400146484, "global_step": 36933, "epoch": 219} {"train_loss": -7.9104461669921875, "global_step": 36934, "epoch": 219} {"train_loss": -7.946216106414795, "global_step": 36935, "epoch": 219} {"train_loss": -7.803012847900391, "global_step": 36936, "epoch": 219} {"train_loss": -8.00876522064209, "global_step": 36937, "epoch": 219} {"train_loss": -7.76569938659668, "global_step": 36938, "epoch": 219} {"train_loss": -8.0713472366333, "global_step": 36939, "epoch": 219} {"train_loss": -7.914032936096191, "global_step": 36940, "epoch": 219} {"train_loss": -8.03411865234375, "global_step": 36941, "epoch": 219} {"train_loss": -7.930169582366943, "global_step": 36942, "epoch": 219} {"train_loss": -7.809072971343994, "global_step": 36943, "epoch": 219} {"train_loss": -7.894827365875244, "global_step": 36944, "epoch": 219} {"train_loss": -7.846148490905762, "global_step": 36945, "epoch": 219} {"train_loss": -7.805919170379639, "global_step": 36946, "epoch": 219} {"train_loss": -7.917120456695557, "global_step": 36947, "epoch": 219} {"train_loss": -7.941193103790283, "global_step": 36948, "epoch": 219} {"train_loss": -7.78557014465332, "global_step": 36949, "epoch": 219} {"train_loss": -7.960496425628662, "global_step": 36950, "epoch": 219} {"train_loss": -7.682389259338379, "global_step": 36951, "epoch": 219} {"train_loss": -7.881102561950684, "global_step": 36952, "epoch": 219} {"train_loss": -7.612797737121582, "global_step": 36953, "epoch": 219} {"train_loss": -7.879449367523193, "global_step": 36954, "epoch": 219} {"train_loss": -7.843451499938965, "global_step": 36955, "epoch": 219} {"train_loss": -7.8304548263549805, "global_step": 36956, "epoch": 219} {"train_loss": -7.766539573669434, "global_step": 36957, "epoch": 219} {"train_loss": -7.505109786987305, "global_step": 36958, "epoch": 219} {"train_loss": -7.804221607389904, "global_step": 36959, "epoch": 219, "val_loss": 185593.25} {"train_loss": -7.5650315284729, "global_step": 36960, "epoch": 220} {"train_loss": -7.782059669494629, "global_step": 36961, "epoch": 220} {"train_loss": -7.610405921936035, "global_step": 36962, "epoch": 220} {"train_loss": -7.529975891113281, "global_step": 36963, "epoch": 220} {"train_loss": -7.51544189453125, "global_step": 36964, "epoch": 220} {"train_loss": -7.760605812072754, "global_step": 36965, "epoch": 220} {"train_loss": -7.665331840515137, "global_step": 36966, "epoch": 220} {"train_loss": -7.888947486877441, "global_step": 36967, "epoch": 220} {"train_loss": -7.673556327819824, "global_step": 36968, "epoch": 220} {"train_loss": -7.754514217376709, "global_step": 36969, "epoch": 220} {"train_loss": -7.652576446533203, "global_step": 36970, "epoch": 220} {"train_loss": -7.7614593505859375, "global_step": 36971, "epoch": 220} {"train_loss": -7.9430012702941895, "global_step": 36972, "epoch": 220} {"train_loss": -7.627829074859619, "global_step": 36973, "epoch": 220} {"train_loss": -7.506603240966797, "global_step": 36974, "epoch": 220} {"train_loss": -7.619600296020508, "global_step": 36975, "epoch": 220} {"train_loss": -7.8775529861450195, "global_step": 36976, "epoch": 220} {"train_loss": -7.585084915161133, "global_step": 36977, "epoch": 220} {"train_loss": -7.907696723937988, "global_step": 36978, "epoch": 220} {"train_loss": -7.638240814208984, "global_step": 36979, "epoch": 220} {"train_loss": -7.816934108734131, "global_step": 36980, "epoch": 220} {"train_loss": -7.907052993774414, "global_step": 36981, "epoch": 220} {"train_loss": -7.54805850982666, "global_step": 36982, "epoch": 220} {"train_loss": -7.775773048400879, "global_step": 36983, "epoch": 220} {"train_loss": -7.893643379211426, "global_step": 36984, "epoch": 220} {"train_loss": -8.055313110351562, "global_step": 36985, "epoch": 220} {"train_loss": -7.685007572174072, "global_step": 36986, "epoch": 220} {"train_loss": -7.795116424560547, "global_step": 36987, "epoch": 220} {"train_loss": -7.790886878967285, "global_step": 36988, "epoch": 220} {"train_loss": -7.758055686950684, "global_step": 36989, "epoch": 220} {"train_loss": -7.7207231521606445, "global_step": 36990, "epoch": 220} {"train_loss": -7.702035903930664, "global_step": 36991, "epoch": 220} {"train_loss": -7.822328090667725, "global_step": 36992, "epoch": 220} {"train_loss": -7.548407554626465, "global_step": 36993, "epoch": 220} {"train_loss": -7.816349029541016, "global_step": 36994, "epoch": 220} {"train_loss": -7.752170085906982, "global_step": 36995, "epoch": 220} {"train_loss": -7.807961463928223, "global_step": 36996, "epoch": 220} {"train_loss": -7.630269527435303, "global_step": 36997, "epoch": 220} {"train_loss": -7.668697357177734, "global_step": 36998, "epoch": 220} {"train_loss": -7.875751495361328, "global_step": 36999, "epoch": 220} {"train_loss": -7.795351982116699, "global_step": 37000, "epoch": 220} {"train_loss": -7.80374813079834, "global_step": 37001, "epoch": 220} {"train_loss": -7.828340530395508, "global_step": 37002, "epoch": 220} {"train_loss": -7.637073516845703, "global_step": 37003, "epoch": 220} {"train_loss": -7.7330427169799805, "global_step": 37004, "epoch": 220} {"train_loss": -7.797971248626709, "global_step": 37005, "epoch": 220} {"train_loss": -7.778255462646484, "global_step": 37006, "epoch": 220} {"train_loss": -7.69421911239624, "global_step": 37007, "epoch": 220} {"train_loss": -7.887126445770264, "global_step": 37008, "epoch": 220} {"train_loss": -7.762485027313232, "global_step": 37009, "epoch": 220} {"train_loss": -7.738832950592041, "global_step": 37010, "epoch": 220} {"train_loss": -7.6723833084106445, "global_step": 37011, "epoch": 220} {"train_loss": -7.842955589294434, "global_step": 37012, "epoch": 220} {"train_loss": -7.677090644836426, "global_step": 37013, "epoch": 220} {"train_loss": -8.153701782226562, "global_step": 37014, "epoch": 220} {"train_loss": -7.843546390533447, "global_step": 37015, "epoch": 220} {"train_loss": -7.520646095275879, "global_step": 37016, "epoch": 220} {"train_loss": -7.8197174072265625, "global_step": 37017, "epoch": 220} {"train_loss": -7.929468154907227, "global_step": 37018, "epoch": 220} {"train_loss": -7.796008110046387, "global_step": 37019, "epoch": 220} {"train_loss": -7.709647178649902, "global_step": 37020, "epoch": 220} {"train_loss": -7.844186782836914, "global_step": 37021, "epoch": 220} {"train_loss": -7.727180004119873, "global_step": 37022, "epoch": 220} {"train_loss": -7.747152328491211, "global_step": 37023, "epoch": 220} {"train_loss": -7.916904449462891, "global_step": 37024, "epoch": 220} {"train_loss": -8.036002159118652, "global_step": 37025, "epoch": 220} {"train_loss": -7.737480163574219, "global_step": 37026, "epoch": 220} {"train_loss": -7.9220428466796875, "global_step": 37027, "epoch": 220} {"train_loss": -7.864569664001465, "global_step": 37028, "epoch": 220} {"train_loss": -8.078431129455566, "global_step": 37029, "epoch": 220} {"train_loss": -7.975650787353516, "global_step": 37030, "epoch": 220} {"train_loss": -7.904024124145508, "global_step": 37031, "epoch": 220} {"train_loss": -7.665605545043945, "global_step": 37032, "epoch": 220} {"train_loss": -7.786479949951172, "global_step": 37033, "epoch": 220} {"train_loss": -8.025961875915527, "global_step": 37034, "epoch": 220} {"train_loss": -8.062726020812988, "global_step": 37035, "epoch": 220} {"train_loss": -7.940271377563477, "global_step": 37036, "epoch": 220} {"train_loss": -8.131288528442383, "global_step": 37037, "epoch": 220} {"train_loss": -7.865554332733154, "global_step": 37038, "epoch": 220} {"train_loss": -8.063315391540527, "global_step": 37039, "epoch": 220} {"train_loss": -7.916980743408203, "global_step": 37040, "epoch": 220} {"train_loss": -8.07093620300293, "global_step": 37041, "epoch": 220} {"train_loss": -7.9313249588012695, "global_step": 37042, "epoch": 220} {"train_loss": -7.904881477355957, "global_step": 37043, "epoch": 220} {"train_loss": -7.845188617706299, "global_step": 37044, "epoch": 220} {"train_loss": -7.793404579162598, "global_step": 37045, "epoch": 220} {"train_loss": -7.911725044250488, "global_step": 37046, "epoch": 220} {"train_loss": -7.7832112312316895, "global_step": 37047, "epoch": 220} {"train_loss": -7.750548362731934, "global_step": 37048, "epoch": 220} {"train_loss": -7.751519203186035, "global_step": 37049, "epoch": 220} {"train_loss": -7.993305206298828, "global_step": 37050, "epoch": 220} {"train_loss": -7.651731967926025, "global_step": 37051, "epoch": 220} {"train_loss": -8.008358001708984, "global_step": 37052, "epoch": 220} {"train_loss": -7.92078971862793, "global_step": 37053, "epoch": 220} {"train_loss": -8.010177612304688, "global_step": 37054, "epoch": 220} {"train_loss": -7.9287309646606445, "global_step": 37055, "epoch": 220} {"train_loss": -8.013794898986816, "global_step": 37056, "epoch": 220} {"train_loss": -7.797555923461914, "global_step": 37057, "epoch": 220} {"train_loss": -7.971541881561279, "global_step": 37058, "epoch": 220} {"train_loss": -7.590609550476074, "global_step": 37059, "epoch": 220} {"train_loss": -7.561885833740234, "global_step": 37060, "epoch": 220} {"train_loss": -7.506312370300293, "global_step": 37061, "epoch": 220} {"train_loss": -7.996769905090332, "global_step": 37062, "epoch": 220} {"train_loss": -7.624509811401367, "global_step": 37063, "epoch": 220} {"train_loss": -8.013922691345215, "global_step": 37064, "epoch": 220} {"train_loss": -7.657016754150391, "global_step": 37065, "epoch": 220} {"train_loss": -7.783604145050049, "global_step": 37066, "epoch": 220} {"train_loss": -7.539409637451172, "global_step": 37067, "epoch": 220} {"train_loss": -7.798402786254883, "global_step": 37068, "epoch": 220} {"train_loss": -7.713747024536133, "global_step": 37069, "epoch": 220} {"train_loss": -7.770671367645264, "global_step": 37070, "epoch": 220} {"train_loss": -7.681058883666992, "global_step": 37071, "epoch": 220} {"train_loss": -7.715204238891602, "global_step": 37072, "epoch": 220} {"train_loss": -7.798112869262695, "global_step": 37073, "epoch": 220} {"train_loss": -7.747931957244873, "global_step": 37074, "epoch": 220} {"train_loss": -7.884218215942383, "global_step": 37075, "epoch": 220} {"train_loss": -7.684541702270508, "global_step": 37076, "epoch": 220} {"train_loss": -7.826283931732178, "global_step": 37077, "epoch": 220} {"train_loss": -7.731627941131592, "global_step": 37078, "epoch": 220} {"train_loss": -7.6838836669921875, "global_step": 37079, "epoch": 220} {"train_loss": -7.938358783721924, "global_step": 37080, "epoch": 220} {"train_loss": -7.492094993591309, "global_step": 37081, "epoch": 220} {"train_loss": -7.924734115600586, "global_step": 37082, "epoch": 220} {"train_loss": -7.885492324829102, "global_step": 37083, "epoch": 220} {"train_loss": -7.807568073272705, "global_step": 37084, "epoch": 220} {"train_loss": -7.766898155212402, "global_step": 37085, "epoch": 220} {"train_loss": -7.595998764038086, "global_step": 37086, "epoch": 220} {"train_loss": -7.646326065063477, "global_step": 37087, "epoch": 220} {"train_loss": -7.937121868133545, "global_step": 37088, "epoch": 220} {"train_loss": -7.689700603485107, "global_step": 37089, "epoch": 220} {"train_loss": -7.706663131713867, "global_step": 37090, "epoch": 220} {"train_loss": -8.011588096618652, "global_step": 37091, "epoch": 220} {"train_loss": -7.72238826751709, "global_step": 37092, "epoch": 220} {"train_loss": -7.608388423919678, "global_step": 37093, "epoch": 220} {"train_loss": -7.939840316772461, "global_step": 37094, "epoch": 220} {"train_loss": -7.804572105407715, "global_step": 37095, "epoch": 220} {"train_loss": -7.910594940185547, "global_step": 37096, "epoch": 220} {"train_loss": -7.840550422668457, "global_step": 37097, "epoch": 220} {"train_loss": -7.758361339569092, "global_step": 37098, "epoch": 220} {"train_loss": -8.066271781921387, "global_step": 37099, "epoch": 220} {"train_loss": -8.108430862426758, "global_step": 37100, "epoch": 220} {"train_loss": -7.7035441398620605, "global_step": 37101, "epoch": 220} {"train_loss": -7.946221351623535, "global_step": 37102, "epoch": 220} {"train_loss": -7.785311698913574, "global_step": 37103, "epoch": 220} {"train_loss": -7.726411819458008, "global_step": 37104, "epoch": 220} {"train_loss": -7.799189567565918, "global_step": 37105, "epoch": 220} {"train_loss": -7.958917617797852, "global_step": 37106, "epoch": 220} {"train_loss": -7.62799072265625, "global_step": 37107, "epoch": 220} {"train_loss": -7.915809154510498, "global_step": 37108, "epoch": 220} {"train_loss": -7.818860054016113, "global_step": 37109, "epoch": 220} {"train_loss": -7.936491966247559, "global_step": 37110, "epoch": 220} {"train_loss": -7.784898281097412, "global_step": 37111, "epoch": 220} {"train_loss": -8.088861465454102, "global_step": 37112, "epoch": 220} {"train_loss": -8.084086418151855, "global_step": 37113, "epoch": 220} {"train_loss": -7.828366279602051, "global_step": 37114, "epoch": 220} {"train_loss": -7.763347625732422, "global_step": 37115, "epoch": 220} {"train_loss": -7.757307052612305, "global_step": 37116, "epoch": 220} {"train_loss": -7.5723676681518555, "global_step": 37117, "epoch": 220} {"train_loss": -7.496356010437012, "global_step": 37118, "epoch": 220} {"train_loss": -7.589761257171631, "global_step": 37119, "epoch": 220} {"train_loss": -7.754447937011719, "global_step": 37120, "epoch": 220} {"train_loss": -7.738447666168213, "global_step": 37121, "epoch": 220} {"train_loss": -7.815340042114258, "global_step": 37122, "epoch": 220} {"train_loss": -7.61666202545166, "global_step": 37123, "epoch": 220} {"train_loss": -7.746140480041504, "global_step": 37124, "epoch": 220} {"train_loss": -7.88397216796875, "global_step": 37125, "epoch": 220} {"train_loss": -7.85543966293335, "global_step": 37126, "epoch": 220} {"train_loss": -7.795653360230582, "global_step": 37127, "epoch": 220, "val_loss": 187844.4375, "train_action_mse_error": 15.189342498779297} {"train_loss": -7.915261268615723, "global_step": 37128, "epoch": 221} {"train_loss": -7.833708763122559, "global_step": 37129, "epoch": 221} {"train_loss": -7.77281379699707, "global_step": 37130, "epoch": 221} {"train_loss": -8.033369064331055, "global_step": 37131, "epoch": 221} {"train_loss": -7.964189052581787, "global_step": 37132, "epoch": 221} {"train_loss": -7.710066318511963, "global_step": 37133, "epoch": 221} {"train_loss": -7.848834991455078, "global_step": 37134, "epoch": 221} {"train_loss": -7.910562038421631, "global_step": 37135, "epoch": 221} {"train_loss": -7.835768699645996, "global_step": 37136, "epoch": 221} {"train_loss": -7.891366004943848, "global_step": 37137, "epoch": 221} {"train_loss": -8.033870697021484, "global_step": 37138, "epoch": 221} {"train_loss": -8.102306365966797, "global_step": 37139, "epoch": 221} {"train_loss": -8.086868286132812, "global_step": 37140, "epoch": 221} {"train_loss": -7.997537612915039, "global_step": 37141, "epoch": 221} {"train_loss": -7.752014636993408, "global_step": 37142, "epoch": 221} {"train_loss": -7.999792575836182, "global_step": 37143, "epoch": 221} {"train_loss": -7.908872604370117, "global_step": 37144, "epoch": 221} {"train_loss": -7.995808124542236, "global_step": 37145, "epoch": 221} {"train_loss": -8.311237335205078, "global_step": 37146, "epoch": 221} {"train_loss": -8.188257217407227, "global_step": 37147, "epoch": 221} {"train_loss": -7.929525375366211, "global_step": 37148, "epoch": 221} {"train_loss": -7.918168067932129, "global_step": 37149, "epoch": 221} {"train_loss": -8.066129684448242, "global_step": 37150, "epoch": 221} {"train_loss": -7.954087257385254, "global_step": 37151, "epoch": 221} {"train_loss": -7.815625190734863, "global_step": 37152, "epoch": 221} {"train_loss": -7.9984893798828125, "global_step": 37153, "epoch": 221} {"train_loss": -7.959304332733154, "global_step": 37154, "epoch": 221} {"train_loss": -8.17391300201416, "global_step": 37155, "epoch": 221} {"train_loss": -7.970077991485596, "global_step": 37156, "epoch": 221} {"train_loss": -8.064583778381348, "global_step": 37157, "epoch": 221} {"train_loss": -7.7439985275268555, "global_step": 37158, "epoch": 221} {"train_loss": -7.9704694747924805, "global_step": 37159, "epoch": 221} {"train_loss": -7.8273115158081055, "global_step": 37160, "epoch": 221} {"train_loss": -7.823904037475586, "global_step": 37161, "epoch": 221} {"train_loss": -7.974720001220703, "global_step": 37162, "epoch": 221} {"train_loss": -8.046321868896484, "global_step": 37163, "epoch": 221} {"train_loss": -7.943743705749512, "global_step": 37164, "epoch": 221} {"train_loss": -7.948369026184082, "global_step": 37165, "epoch": 221} {"train_loss": -7.945671558380127, "global_step": 37166, "epoch": 221} {"train_loss": -7.949003219604492, "global_step": 37167, "epoch": 221} {"train_loss": -7.798274040222168, "global_step": 37168, "epoch": 221} {"train_loss": -7.77878999710083, "global_step": 37169, "epoch": 221} {"train_loss": -7.787099361419678, "global_step": 37170, "epoch": 221} {"train_loss": -7.898255348205566, "global_step": 37171, "epoch": 221} {"train_loss": -7.845607280731201, "global_step": 37172, "epoch": 221} {"train_loss": -7.984786033630371, "global_step": 37173, "epoch": 221} {"train_loss": -7.885416507720947, "global_step": 37174, "epoch": 221} {"train_loss": -7.734131336212158, "global_step": 37175, "epoch": 221} {"train_loss": -7.78485107421875, "global_step": 37176, "epoch": 221} {"train_loss": -7.944203853607178, "global_step": 37177, "epoch": 221} {"train_loss": -7.773146629333496, "global_step": 37178, "epoch": 221} {"train_loss": -7.928664207458496, "global_step": 37179, "epoch": 221} {"train_loss": -7.892753601074219, "global_step": 37180, "epoch": 221} {"train_loss": -8.051984786987305, "global_step": 37181, "epoch": 221} {"train_loss": -7.993815898895264, "global_step": 37182, "epoch": 221} {"train_loss": -8.111759185791016, "global_step": 37183, "epoch": 221} {"train_loss": -7.859279632568359, "global_step": 37184, "epoch": 221} {"train_loss": -8.090544700622559, "global_step": 37185, "epoch": 221} {"train_loss": -7.809202194213867, "global_step": 37186, "epoch": 221} {"train_loss": -7.4822587966918945, "global_step": 37187, "epoch": 221} {"train_loss": -7.93554162979126, "global_step": 37188, "epoch": 221} {"train_loss": -7.723601341247559, "global_step": 37189, "epoch": 221} {"train_loss": -7.586343765258789, "global_step": 37190, "epoch": 221} {"train_loss": -7.661011695861816, "global_step": 37191, "epoch": 221} {"train_loss": -7.432030200958252, "global_step": 37192, "epoch": 221} {"train_loss": -7.833246231079102, "global_step": 37193, "epoch": 221} {"train_loss": -7.730517864227295, "global_step": 37194, "epoch": 221} {"train_loss": -7.782173156738281, "global_step": 37195, "epoch": 221} {"train_loss": -7.774758338928223, "global_step": 37196, "epoch": 221} {"train_loss": -7.42165470123291, "global_step": 37197, "epoch": 221} {"train_loss": -7.790220260620117, "global_step": 37198, "epoch": 221} {"train_loss": -7.794602394104004, "global_step": 37199, "epoch": 221} {"train_loss": -7.5815229415893555, "global_step": 37200, "epoch": 221} {"train_loss": -7.604092121124268, "global_step": 37201, "epoch": 221} {"train_loss": -7.977042198181152, "global_step": 37202, "epoch": 221} {"train_loss": -7.78525447845459, "global_step": 37203, "epoch": 221} {"train_loss": -7.714537620544434, "global_step": 37204, "epoch": 221} {"train_loss": -7.540436744689941, "global_step": 37205, "epoch": 221} {"train_loss": -7.828606605529785, "global_step": 37206, "epoch": 221} {"train_loss": -7.703652381896973, "global_step": 37207, "epoch": 221} {"train_loss": -7.7796549797058105, "global_step": 37208, "epoch": 221} {"train_loss": -7.863358974456787, "global_step": 37209, "epoch": 221} {"train_loss": -7.6368536949157715, "global_step": 37210, "epoch": 221} {"train_loss": -8.100812911987305, "global_step": 37211, "epoch": 221} {"train_loss": -7.715799331665039, "global_step": 37212, "epoch": 221} {"train_loss": -7.780359745025635, "global_step": 37213, "epoch": 221} {"train_loss": -7.589178562164307, "global_step": 37214, "epoch": 221} {"train_loss": -7.83140754699707, "global_step": 37215, "epoch": 221} {"train_loss": -7.641119956970215, "global_step": 37216, "epoch": 221} {"train_loss": -7.7046613693237305, "global_step": 37217, "epoch": 221} {"train_loss": -7.926858901977539, "global_step": 37218, "epoch": 221} {"train_loss": -7.828240394592285, "global_step": 37219, "epoch": 221} {"train_loss": -7.582170009613037, "global_step": 37220, "epoch": 221} {"train_loss": -7.9196295738220215, "global_step": 37221, "epoch": 221} {"train_loss": -7.711798667907715, "global_step": 37222, "epoch": 221} {"train_loss": -7.901365280151367, "global_step": 37223, "epoch": 221} {"train_loss": -7.8064680099487305, "global_step": 37224, "epoch": 221} {"train_loss": -7.971711158752441, "global_step": 37225, "epoch": 221} {"train_loss": -7.930098533630371, "global_step": 37226, "epoch": 221} {"train_loss": -7.948006629943848, "global_step": 37227, "epoch": 221} {"train_loss": -7.764749050140381, "global_step": 37228, "epoch": 221} {"train_loss": -7.861915588378906, "global_step": 37229, "epoch": 221} {"train_loss": -7.981644630432129, "global_step": 37230, "epoch": 221} {"train_loss": -8.022472381591797, "global_step": 37231, "epoch": 221} {"train_loss": -8.033347129821777, "global_step": 37232, "epoch": 221} {"train_loss": -7.961312294006348, "global_step": 37233, "epoch": 221} {"train_loss": -7.731401443481445, "global_step": 37234, "epoch": 221} {"train_loss": -7.956570625305176, "global_step": 37235, "epoch": 221} {"train_loss": -7.777785301208496, "global_step": 37236, "epoch": 221} {"train_loss": -8.061964988708496, "global_step": 37237, "epoch": 221} {"train_loss": -7.637655258178711, "global_step": 37238, "epoch": 221} {"train_loss": -8.007384300231934, "global_step": 37239, "epoch": 221} {"train_loss": -8.077154159545898, "global_step": 37240, "epoch": 221} {"train_loss": -7.703174591064453, "global_step": 37241, "epoch": 221} {"train_loss": -7.85613489151001, "global_step": 37242, "epoch": 221} {"train_loss": -7.440930366516113, "global_step": 37243, "epoch": 221} {"train_loss": -7.7994842529296875, "global_step": 37244, "epoch": 221} {"train_loss": -7.574009418487549, "global_step": 37245, "epoch": 221} {"train_loss": -7.851832389831543, "global_step": 37246, "epoch": 221} {"train_loss": -7.387609004974365, "global_step": 37247, "epoch": 221} {"train_loss": -7.833071708679199, "global_step": 37248, "epoch": 221} {"train_loss": -7.577624320983887, "global_step": 37249, "epoch": 221} {"train_loss": -7.634660243988037, "global_step": 37250, "epoch": 221} {"train_loss": -7.766861438751221, "global_step": 37251, "epoch": 221} {"train_loss": -7.677700996398926, "global_step": 37252, "epoch": 221} {"train_loss": -7.90904426574707, "global_step": 37253, "epoch": 221} {"train_loss": -7.74662971496582, "global_step": 37254, "epoch": 221} {"train_loss": -7.7767791748046875, "global_step": 37255, "epoch": 221} {"train_loss": -7.840036392211914, "global_step": 37256, "epoch": 221} {"train_loss": -7.8756608963012695, "global_step": 37257, "epoch": 221} {"train_loss": -7.8374528884887695, "global_step": 37258, "epoch": 221} {"train_loss": -7.668961524963379, "global_step": 37259, "epoch": 221} {"train_loss": -7.76844596862793, "global_step": 37260, "epoch": 221} {"train_loss": -7.696713447570801, "global_step": 37261, "epoch": 221} {"train_loss": -7.907969951629639, "global_step": 37262, "epoch": 221} {"train_loss": -7.602466106414795, "global_step": 37263, "epoch": 221} {"train_loss": -7.79327392578125, "global_step": 37264, "epoch": 221} {"train_loss": -7.63906717300415, "global_step": 37265, "epoch": 221} {"train_loss": -7.731454849243164, "global_step": 37266, "epoch": 221} {"train_loss": -7.61304235458374, "global_step": 37267, "epoch": 221} {"train_loss": -7.688365936279297, "global_step": 37268, "epoch": 221} {"train_loss": -7.529820442199707, "global_step": 37269, "epoch": 221} {"train_loss": -7.7341814041137695, "global_step": 37270, "epoch": 221} {"train_loss": -7.83503532409668, "global_step": 37271, "epoch": 221} {"train_loss": -7.941952705383301, "global_step": 37272, "epoch": 221} {"train_loss": -7.886502742767334, "global_step": 37273, "epoch": 221} {"train_loss": -7.750521659851074, "global_step": 37274, "epoch": 221} {"train_loss": -7.97762393951416, "global_step": 37275, "epoch": 221} {"train_loss": -7.9593729972839355, "global_step": 37276, "epoch": 221} {"train_loss": -7.9041290283203125, "global_step": 37277, "epoch": 221} {"train_loss": -7.696929931640625, "global_step": 37278, "epoch": 221} {"train_loss": -7.897035121917725, "global_step": 37279, "epoch": 221} {"train_loss": -7.7166428565979, "global_step": 37280, "epoch": 221} {"train_loss": -7.705934524536133, "global_step": 37281, "epoch": 221} {"train_loss": -7.747278213500977, "global_step": 37282, "epoch": 221} {"train_loss": -7.629673480987549, "global_step": 37283, "epoch": 221} {"train_loss": -7.967273712158203, "global_step": 37284, "epoch": 221} {"train_loss": -7.870146751403809, "global_step": 37285, "epoch": 221} {"train_loss": -7.992622375488281, "global_step": 37286, "epoch": 221} {"train_loss": -8.021427154541016, "global_step": 37287, "epoch": 221} {"train_loss": -7.884077072143555, "global_step": 37288, "epoch": 221} {"train_loss": -7.846386909484863, "global_step": 37289, "epoch": 221} {"train_loss": -7.974837303161621, "global_step": 37290, "epoch": 221} {"train_loss": -8.118013381958008, "global_step": 37291, "epoch": 221} {"train_loss": -7.872323989868164, "global_step": 37292, "epoch": 221} {"train_loss": -7.887203693389893, "global_step": 37293, "epoch": 221} {"train_loss": -7.910709857940674, "global_step": 37294, "epoch": 221} {"train_loss": -7.840674718221028, "global_step": 37295, "epoch": 221, "val_loss": 185332.125} {"train_loss": -7.611515998840332, "global_step": 37296, "epoch": 222} {"train_loss": -7.985809803009033, "global_step": 37297, "epoch": 222} {"train_loss": -7.533720016479492, "global_step": 37298, "epoch": 222} {"train_loss": -7.797751426696777, "global_step": 37299, "epoch": 222} {"train_loss": -7.937249660491943, "global_step": 37300, "epoch": 222} {"train_loss": -7.586094379425049, "global_step": 37301, "epoch": 222} {"train_loss": -7.830479621887207, "global_step": 37302, "epoch": 222} {"train_loss": -7.787481307983398, "global_step": 37303, "epoch": 222} {"train_loss": -7.809055328369141, "global_step": 37304, "epoch": 222} {"train_loss": -7.584909915924072, "global_step": 37305, "epoch": 222} {"train_loss": -7.829699993133545, "global_step": 37306, "epoch": 222} {"train_loss": -7.712491035461426, "global_step": 37307, "epoch": 222} {"train_loss": -7.78248405456543, "global_step": 37308, "epoch": 222} {"train_loss": -7.854761123657227, "global_step": 37309, "epoch": 222} {"train_loss": -7.7751312255859375, "global_step": 37310, "epoch": 222} {"train_loss": -7.51357364654541, "global_step": 37311, "epoch": 222} {"train_loss": -7.645059108734131, "global_step": 37312, "epoch": 222} {"train_loss": -7.555537700653076, "global_step": 37313, "epoch": 222} {"train_loss": -7.501460075378418, "global_step": 37314, "epoch": 222} {"train_loss": -7.525575637817383, "global_step": 37315, "epoch": 222} {"train_loss": -7.803995132446289, "global_step": 37316, "epoch": 222} {"train_loss": -7.748332500457764, "global_step": 37317, "epoch": 222} {"train_loss": -7.451930999755859, "global_step": 37318, "epoch": 222} {"train_loss": -7.755916595458984, "global_step": 37319, "epoch": 222} {"train_loss": -7.858388900756836, "global_step": 37320, "epoch": 222} {"train_loss": -7.653604507446289, "global_step": 37321, "epoch": 222} {"train_loss": -7.649787902832031, "global_step": 37322, "epoch": 222} {"train_loss": -7.4416046142578125, "global_step": 37323, "epoch": 222} {"train_loss": -7.8534674644470215, "global_step": 37324, "epoch": 222} {"train_loss": -7.466283321380615, "global_step": 37325, "epoch": 222} {"train_loss": -7.723660945892334, "global_step": 37326, "epoch": 222} {"train_loss": -7.77682638168335, "global_step": 37327, "epoch": 222} {"train_loss": -7.919036865234375, "global_step": 37328, "epoch": 222} {"train_loss": -7.828863143920898, "global_step": 37329, "epoch": 222} {"train_loss": -7.844359874725342, "global_step": 37330, "epoch": 222} {"train_loss": -7.847987174987793, "global_step": 37331, "epoch": 222} {"train_loss": -7.779603481292725, "global_step": 37332, "epoch": 222} {"train_loss": -7.78745174407959, "global_step": 37333, "epoch": 222} {"train_loss": -7.991970539093018, "global_step": 37334, "epoch": 222} {"train_loss": -7.868778705596924, "global_step": 37335, "epoch": 222} {"train_loss": -7.579514503479004, "global_step": 37336, "epoch": 222} {"train_loss": -7.472812652587891, "global_step": 37337, "epoch": 222} {"train_loss": -7.891084671020508, "global_step": 37338, "epoch": 222} {"train_loss": -7.73030948638916, "global_step": 37339, "epoch": 222} {"train_loss": -7.767658233642578, "global_step": 37340, "epoch": 222} {"train_loss": -7.8281779289245605, "global_step": 37341, "epoch": 222} {"train_loss": -7.926150321960449, "global_step": 37342, "epoch": 222} {"train_loss": -8.102715492248535, "global_step": 37343, "epoch": 222} {"train_loss": -7.877250671386719, "global_step": 37344, "epoch": 222} {"train_loss": -7.709321975708008, "global_step": 37345, "epoch": 222} {"train_loss": -7.7884721755981445, "global_step": 37346, "epoch": 222} {"train_loss": -7.64202880859375, "global_step": 37347, "epoch": 222} {"train_loss": -7.9252095222473145, "global_step": 37348, "epoch": 222} {"train_loss": -7.491997718811035, "global_step": 37349, "epoch": 222} {"train_loss": -7.867062091827393, "global_step": 37350, "epoch": 222} {"train_loss": -7.8618245124816895, "global_step": 37351, "epoch": 222} {"train_loss": -7.714703559875488, "global_step": 37352, "epoch": 222} {"train_loss": -7.846211910247803, "global_step": 37353, "epoch": 222} {"train_loss": -7.773009300231934, "global_step": 37354, "epoch": 222} {"train_loss": -7.908327102661133, "global_step": 37355, "epoch": 222} {"train_loss": -7.901388168334961, "global_step": 37356, "epoch": 222} {"train_loss": -7.724072456359863, "global_step": 37357, "epoch": 222} {"train_loss": -7.96173095703125, "global_step": 37358, "epoch": 222} {"train_loss": -7.639121055603027, "global_step": 37359, "epoch": 222} {"train_loss": -7.467649459838867, "global_step": 37360, "epoch": 222} {"train_loss": -7.661333084106445, "global_step": 37361, "epoch": 222} {"train_loss": -7.6469597816467285, "global_step": 37362, "epoch": 222} {"train_loss": -7.60347843170166, "global_step": 37363, "epoch": 222} {"train_loss": -7.841434478759766, "global_step": 37364, "epoch": 222} {"train_loss": -7.922910690307617, "global_step": 37365, "epoch": 222} {"train_loss": -7.765388011932373, "global_step": 37366, "epoch": 222} {"train_loss": -7.951634883880615, "global_step": 37367, "epoch": 222} {"train_loss": -7.9036030769348145, "global_step": 37368, "epoch": 222} {"train_loss": -7.745229721069336, "global_step": 37369, "epoch": 222} {"train_loss": -7.962337017059326, "global_step": 37370, "epoch": 222} {"train_loss": -7.72654390335083, "global_step": 37371, "epoch": 222} {"train_loss": -7.850869178771973, "global_step": 37372, "epoch": 222} {"train_loss": -7.854954719543457, "global_step": 37373, "epoch": 222} {"train_loss": -7.923912048339844, "global_step": 37374, "epoch": 222} {"train_loss": -7.973899841308594, "global_step": 37375, "epoch": 222} {"train_loss": -7.820634841918945, "global_step": 37376, "epoch": 222} {"train_loss": -7.691954612731934, "global_step": 37377, "epoch": 222} {"train_loss": -7.939944267272949, "global_step": 37378, "epoch": 222} {"train_loss": -7.633508682250977, "global_step": 37379, "epoch": 222} {"train_loss": -7.755373954772949, "global_step": 37380, "epoch": 222} {"train_loss": -7.718534469604492, "global_step": 37381, "epoch": 222} {"train_loss": -7.6242570877075195, "global_step": 37382, "epoch": 222} {"train_loss": -7.82217264175415, "global_step": 37383, "epoch": 222} {"train_loss": -7.66993522644043, "global_step": 37384, "epoch": 222} {"train_loss": -7.712102890014648, "global_step": 37385, "epoch": 222} {"train_loss": -7.8158183097839355, "global_step": 37386, "epoch": 222} {"train_loss": -7.810888290405273, "global_step": 37387, "epoch": 222} {"train_loss": -7.810030937194824, "global_step": 37388, "epoch": 222} {"train_loss": -7.7574381828308105, "global_step": 37389, "epoch": 222} {"train_loss": -7.7566447257995605, "global_step": 37390, "epoch": 222} {"train_loss": -7.687677383422852, "global_step": 37391, "epoch": 222} {"train_loss": -7.781364440917969, "global_step": 37392, "epoch": 222} {"train_loss": -7.806303977966309, "global_step": 37393, "epoch": 222} {"train_loss": -8.003963470458984, "global_step": 37394, "epoch": 222} {"train_loss": -7.655864715576172, "global_step": 37395, "epoch": 222} {"train_loss": -7.715150356292725, "global_step": 37396, "epoch": 222} {"train_loss": -7.73475456237793, "global_step": 37397, "epoch": 222} {"train_loss": -7.961669445037842, "global_step": 37398, "epoch": 222} {"train_loss": -7.667322635650635, "global_step": 37399, "epoch": 222} {"train_loss": -7.711421966552734, "global_step": 37400, "epoch": 222} {"train_loss": -7.726075172424316, "global_step": 37401, "epoch": 222} {"train_loss": -7.946066856384277, "global_step": 37402, "epoch": 222} {"train_loss": -7.595650672912598, "global_step": 37403, "epoch": 222} {"train_loss": -8.107053756713867, "global_step": 37404, "epoch": 222} {"train_loss": -7.734993934631348, "global_step": 37405, "epoch": 222} {"train_loss": -8.070213317871094, "global_step": 37406, "epoch": 222} {"train_loss": -7.876064777374268, "global_step": 37407, "epoch": 222} {"train_loss": -7.74497127532959, "global_step": 37408, "epoch": 222} {"train_loss": -7.817033767700195, "global_step": 37409, "epoch": 222} {"train_loss": -7.819372177124023, "global_step": 37410, "epoch": 222} {"train_loss": -7.855301856994629, "global_step": 37411, "epoch": 222} {"train_loss": -7.652558326721191, "global_step": 37412, "epoch": 222} {"train_loss": -7.625109672546387, "global_step": 37413, "epoch": 222} {"train_loss": -7.6254472732543945, "global_step": 37414, "epoch": 222} {"train_loss": -7.951037883758545, "global_step": 37415, "epoch": 222} {"train_loss": -7.626162052154541, "global_step": 37416, "epoch": 222} {"train_loss": -7.8058366775512695, "global_step": 37417, "epoch": 222} {"train_loss": -7.7321929931640625, "global_step": 37418, "epoch": 222} {"train_loss": -7.919751167297363, "global_step": 37419, "epoch": 222} {"train_loss": -7.475833892822266, "global_step": 37420, "epoch": 222} {"train_loss": -7.933143138885498, "global_step": 37421, "epoch": 222} {"train_loss": -7.9283857345581055, "global_step": 37422, "epoch": 222} {"train_loss": -7.650782585144043, "global_step": 37423, "epoch": 222} {"train_loss": -7.757583141326904, "global_step": 37424, "epoch": 222} {"train_loss": -8.074236869812012, "global_step": 37425, "epoch": 222} {"train_loss": -7.907529830932617, "global_step": 37426, "epoch": 222} {"train_loss": -7.807504653930664, "global_step": 37427, "epoch": 222} {"train_loss": -7.882580757141113, "global_step": 37428, "epoch": 222} {"train_loss": -7.676543712615967, "global_step": 37429, "epoch": 222} {"train_loss": -7.7814741134643555, "global_step": 37430, "epoch": 222} {"train_loss": -7.602354049682617, "global_step": 37431, "epoch": 222} {"train_loss": -7.828273773193359, "global_step": 37432, "epoch": 222} {"train_loss": -7.853858947753906, "global_step": 37433, "epoch": 222} {"train_loss": -7.76378870010376, "global_step": 37434, "epoch": 222} {"train_loss": -7.865424156188965, "global_step": 37435, "epoch": 222} {"train_loss": -7.536133289337158, "global_step": 37436, "epoch": 222} {"train_loss": -7.982501983642578, "global_step": 37437, "epoch": 222} {"train_loss": -7.562995910644531, "global_step": 37438, "epoch": 222} {"train_loss": -7.7980570793151855, "global_step": 37439, "epoch": 222} {"train_loss": -7.778995990753174, "global_step": 37440, "epoch": 222} {"train_loss": -7.805917263031006, "global_step": 37441, "epoch": 222} {"train_loss": -7.657498359680176, "global_step": 37442, "epoch": 222} {"train_loss": -7.873578071594238, "global_step": 37443, "epoch": 222} {"train_loss": -7.478403091430664, "global_step": 37444, "epoch": 222} {"train_loss": -7.890256404876709, "global_step": 37445, "epoch": 222} {"train_loss": -7.5913543701171875, "global_step": 37446, "epoch": 222} {"train_loss": -7.943849563598633, "global_step": 37447, "epoch": 222} {"train_loss": -7.885490417480469, "global_step": 37448, "epoch": 222} {"train_loss": -7.759068489074707, "global_step": 37449, "epoch": 222} {"train_loss": -7.696313381195068, "global_step": 37450, "epoch": 222} {"train_loss": -7.668389320373535, "global_step": 37451, "epoch": 222} {"train_loss": -7.979854583740234, "global_step": 37452, "epoch": 222} {"train_loss": -7.843750953674316, "global_step": 37453, "epoch": 222} {"train_loss": -7.593707084655762, "global_step": 37454, "epoch": 222} {"train_loss": -7.892925262451172, "global_step": 37455, "epoch": 222} {"train_loss": -7.896294116973877, "global_step": 37456, "epoch": 222} {"train_loss": -7.818004608154297, "global_step": 37457, "epoch": 222} {"train_loss": -7.960358619689941, "global_step": 37458, "epoch": 222} {"train_loss": -7.762662887573242, "global_step": 37459, "epoch": 222} {"train_loss": -7.657042503356934, "global_step": 37460, "epoch": 222} {"train_loss": -7.621700286865234, "global_step": 37461, "epoch": 222} {"train_loss": -7.864366054534912, "global_step": 37462, "epoch": 222} {"train_loss": -7.771577335539318, "global_step": 37463, "epoch": 222, "val_loss": 184460.0625} {"train_loss": -7.781498908996582, "global_step": 37464, "epoch": 223} {"train_loss": -7.811515808105469, "global_step": 37465, "epoch": 223} {"train_loss": -7.741305828094482, "global_step": 37466, "epoch": 223} {"train_loss": -7.695611000061035, "global_step": 37467, "epoch": 223} {"train_loss": -7.511028289794922, "global_step": 37468, "epoch": 223} {"train_loss": -7.5681986808776855, "global_step": 37469, "epoch": 223} {"train_loss": -7.818878650665283, "global_step": 37470, "epoch": 223} {"train_loss": -7.836949348449707, "global_step": 37471, "epoch": 223} {"train_loss": -7.6556396484375, "global_step": 37472, "epoch": 223} {"train_loss": -7.612730026245117, "global_step": 37473, "epoch": 223} {"train_loss": -7.7741498947143555, "global_step": 37474, "epoch": 223} {"train_loss": -7.832888603210449, "global_step": 37475, "epoch": 223} {"train_loss": -7.947707176208496, "global_step": 37476, "epoch": 223} {"train_loss": -7.709190368652344, "global_step": 37477, "epoch": 223} {"train_loss": -7.770775318145752, "global_step": 37478, "epoch": 223} {"train_loss": -8.017928123474121, "global_step": 37479, "epoch": 223} {"train_loss": -7.987128734588623, "global_step": 37480, "epoch": 223} {"train_loss": -7.702911376953125, "global_step": 37481, "epoch": 223} {"train_loss": -7.9735822677612305, "global_step": 37482, "epoch": 223} {"train_loss": -7.942418098449707, "global_step": 37483, "epoch": 223} {"train_loss": -7.913384437561035, "global_step": 37484, "epoch": 223} {"train_loss": -7.86451530456543, "global_step": 37485, "epoch": 223} {"train_loss": -7.882116317749023, "global_step": 37486, "epoch": 223} {"train_loss": -7.99812126159668, "global_step": 37487, "epoch": 223} {"train_loss": -7.896938800811768, "global_step": 37488, "epoch": 223} {"train_loss": -8.094083786010742, "global_step": 37489, "epoch": 223} {"train_loss": -7.908977031707764, "global_step": 37490, "epoch": 223} {"train_loss": -8.042991638183594, "global_step": 37491, "epoch": 223} {"train_loss": -8.034345626831055, "global_step": 37492, "epoch": 223} {"train_loss": -8.082159042358398, "global_step": 37493, "epoch": 223} {"train_loss": -7.750309944152832, "global_step": 37494, "epoch": 223} {"train_loss": -8.038031578063965, "global_step": 37495, "epoch": 223} {"train_loss": -7.8884172439575195, "global_step": 37496, "epoch": 223} {"train_loss": -7.981429100036621, "global_step": 37497, "epoch": 223} {"train_loss": -7.812889099121094, "global_step": 37498, "epoch": 223} {"train_loss": -7.614993572235107, "global_step": 37499, "epoch": 223} {"train_loss": -7.881475448608398, "global_step": 37500, "epoch": 223} {"train_loss": -7.5413665771484375, "global_step": 37501, "epoch": 223} {"train_loss": -7.8327860832214355, "global_step": 37502, "epoch": 223} {"train_loss": -7.735834121704102, "global_step": 37503, "epoch": 223} {"train_loss": -7.541942596435547, "global_step": 37504, "epoch": 223} {"train_loss": -7.738491535186768, "global_step": 37505, "epoch": 223} {"train_loss": -7.841078758239746, "global_step": 37506, "epoch": 223} {"train_loss": -7.494691848754883, "global_step": 37507, "epoch": 223} {"train_loss": -7.727991104125977, "global_step": 37508, "epoch": 223} {"train_loss": -7.671703338623047, "global_step": 37509, "epoch": 223} {"train_loss": -7.671961784362793, "global_step": 37510, "epoch": 223} {"train_loss": -7.339148044586182, "global_step": 37511, "epoch": 223} {"train_loss": -7.6883745193481445, "global_step": 37512, "epoch": 223} {"train_loss": -7.553363800048828, "global_step": 37513, "epoch": 223} {"train_loss": -7.676959991455078, "global_step": 37514, "epoch": 223} {"train_loss": -7.639646053314209, "global_step": 37515, "epoch": 223} {"train_loss": -7.655160903930664, "global_step": 37516, "epoch": 223} {"train_loss": -7.670294761657715, "global_step": 37517, "epoch": 223} {"train_loss": -7.60954475402832, "global_step": 37518, "epoch": 223} {"train_loss": -7.863574504852295, "global_step": 37519, "epoch": 223} {"train_loss": -7.631831169128418, "global_step": 37520, "epoch": 223} {"train_loss": -7.395210266113281, "global_step": 37521, "epoch": 223} {"train_loss": -7.833662033081055, "global_step": 37522, "epoch": 223} {"train_loss": -7.826176166534424, "global_step": 37523, "epoch": 223} {"train_loss": -7.789462089538574, "global_step": 37524, "epoch": 223} {"train_loss": -7.583641052246094, "global_step": 37525, "epoch": 223} {"train_loss": -7.802918910980225, "global_step": 37526, "epoch": 223} {"train_loss": -7.540812015533447, "global_step": 37527, "epoch": 223} {"train_loss": -7.684792995452881, "global_step": 37528, "epoch": 223} {"train_loss": -7.706334590911865, "global_step": 37529, "epoch": 223} {"train_loss": -7.8020172119140625, "global_step": 37530, "epoch": 223} {"train_loss": -7.858997344970703, "global_step": 37531, "epoch": 223} {"train_loss": -7.353984832763672, "global_step": 37532, "epoch": 223} {"train_loss": -7.784987449645996, "global_step": 37533, "epoch": 223} {"train_loss": -7.629401206970215, "global_step": 37534, "epoch": 223} {"train_loss": -7.799610137939453, "global_step": 37535, "epoch": 223} {"train_loss": -7.649167060852051, "global_step": 37536, "epoch": 223} {"train_loss": -7.758343696594238, "global_step": 37537, "epoch": 223} {"train_loss": -7.77766227722168, "global_step": 37538, "epoch": 223} {"train_loss": -7.628608703613281, "global_step": 37539, "epoch": 223} {"train_loss": -7.693567752838135, "global_step": 37540, "epoch": 223} {"train_loss": -7.667765140533447, "global_step": 37541, "epoch": 223} {"train_loss": -7.644265174865723, "global_step": 37542, "epoch": 223} {"train_loss": -7.617000579833984, "global_step": 37543, "epoch": 223} {"train_loss": -7.708529472351074, "global_step": 37544, "epoch": 223} {"train_loss": -7.902072906494141, "global_step": 37545, "epoch": 223} {"train_loss": -7.821451187133789, "global_step": 37546, "epoch": 223} {"train_loss": -7.767045974731445, "global_step": 37547, "epoch": 223} {"train_loss": -7.830255508422852, "global_step": 37548, "epoch": 223} {"train_loss": -7.818891525268555, "global_step": 37549, "epoch": 223} {"train_loss": -7.82525634765625, "global_step": 37550, "epoch": 223} {"train_loss": -7.779556751251221, "global_step": 37551, "epoch": 223} {"train_loss": -7.583456039428711, "global_step": 37552, "epoch": 223} {"train_loss": -7.892367362976074, "global_step": 37553, "epoch": 223} {"train_loss": -7.862338066101074, "global_step": 37554, "epoch": 223} {"train_loss": -7.8119001388549805, "global_step": 37555, "epoch": 223} {"train_loss": -7.859549522399902, "global_step": 37556, "epoch": 223} {"train_loss": -7.84685754776001, "global_step": 37557, "epoch": 223} {"train_loss": -7.899881362915039, "global_step": 37558, "epoch": 223} {"train_loss": -7.769919395446777, "global_step": 37559, "epoch": 223} {"train_loss": -7.833216667175293, "global_step": 37560, "epoch": 223} {"train_loss": -7.835580825805664, "global_step": 37561, "epoch": 223} {"train_loss": -7.742034912109375, "global_step": 37562, "epoch": 223} {"train_loss": -7.871874809265137, "global_step": 37563, "epoch": 223} {"train_loss": -7.978785991668701, "global_step": 37564, "epoch": 223} {"train_loss": -7.764294624328613, "global_step": 37565, "epoch": 223} {"train_loss": -7.791865825653076, "global_step": 37566, "epoch": 223} {"train_loss": -8.039266586303711, "global_step": 37567, "epoch": 223} {"train_loss": -7.401691436767578, "global_step": 37568, "epoch": 223} {"train_loss": -7.714433193206787, "global_step": 37569, "epoch": 223} {"train_loss": -7.50485897064209, "global_step": 37570, "epoch": 223} {"train_loss": -7.949832916259766, "global_step": 37571, "epoch": 223} {"train_loss": -7.64710807800293, "global_step": 37572, "epoch": 223} {"train_loss": -7.918172836303711, "global_step": 37573, "epoch": 223} {"train_loss": -7.734546184539795, "global_step": 37574, "epoch": 223} {"train_loss": -7.858914375305176, "global_step": 37575, "epoch": 223} {"train_loss": -7.800682544708252, "global_step": 37576, "epoch": 223} {"train_loss": -7.81038761138916, "global_step": 37577, "epoch": 223} {"train_loss": -7.930233955383301, "global_step": 37578, "epoch": 223} {"train_loss": -7.784197807312012, "global_step": 37579, "epoch": 223} {"train_loss": -7.819736480712891, "global_step": 37580, "epoch": 223} {"train_loss": -7.704045295715332, "global_step": 37581, "epoch": 223} {"train_loss": -7.76158332824707, "global_step": 37582, "epoch": 223} {"train_loss": -7.841591835021973, "global_step": 37583, "epoch": 223} {"train_loss": -7.862199783325195, "global_step": 37584, "epoch": 223} {"train_loss": -8.034546852111816, "global_step": 37585, "epoch": 223} {"train_loss": -7.898881912231445, "global_step": 37586, "epoch": 223} {"train_loss": -7.8934149742126465, "global_step": 37587, "epoch": 223} {"train_loss": -7.971437454223633, "global_step": 37588, "epoch": 223} {"train_loss": -7.963345527648926, "global_step": 37589, "epoch": 223} {"train_loss": -7.919363975524902, "global_step": 37590, "epoch": 223} {"train_loss": -8.075090408325195, "global_step": 37591, "epoch": 223} {"train_loss": -7.856180191040039, "global_step": 37592, "epoch": 223} {"train_loss": -7.844550132751465, "global_step": 37593, "epoch": 223} {"train_loss": -7.894709587097168, "global_step": 37594, "epoch": 223} {"train_loss": -7.906744003295898, "global_step": 37595, "epoch": 223} {"train_loss": -7.840978622436523, "global_step": 37596, "epoch": 223} {"train_loss": -7.761936664581299, "global_step": 37597, "epoch": 223} {"train_loss": -8.009206771850586, "global_step": 37598, "epoch": 223} {"train_loss": -7.9560041427612305, "global_step": 37599, "epoch": 223} {"train_loss": -8.014107704162598, "global_step": 37600, "epoch": 223} {"train_loss": -7.8516845703125, "global_step": 37601, "epoch": 223} {"train_loss": -7.823854446411133, "global_step": 37602, "epoch": 223} {"train_loss": -7.770759582519531, "global_step": 37603, "epoch": 223} {"train_loss": -7.730093002319336, "global_step": 37604, "epoch": 223} {"train_loss": -7.802580833435059, "global_step": 37605, "epoch": 223} {"train_loss": -7.818835258483887, "global_step": 37606, "epoch": 223} {"train_loss": -7.705089569091797, "global_step": 37607, "epoch": 223} {"train_loss": -7.742969989776611, "global_step": 37608, "epoch": 223} {"train_loss": -7.575674533843994, "global_step": 37609, "epoch": 223} {"train_loss": -7.892322540283203, "global_step": 37610, "epoch": 223} {"train_loss": -7.566450119018555, "global_step": 37611, "epoch": 223} {"train_loss": -7.262418746948242, "global_step": 37612, "epoch": 223} {"train_loss": -7.648425102233887, "global_step": 37613, "epoch": 223} {"train_loss": -7.4239044189453125, "global_step": 37614, "epoch": 223} {"train_loss": -7.792953968048096, "global_step": 37615, "epoch": 223} {"train_loss": -7.636893272399902, "global_step": 37616, "epoch": 223} {"train_loss": -7.595155239105225, "global_step": 37617, "epoch": 223} {"train_loss": -8.072080612182617, "global_step": 37618, "epoch": 223} {"train_loss": -7.72064733505249, "global_step": 37619, "epoch": 223} {"train_loss": -7.655731201171875, "global_step": 37620, "epoch": 223} {"train_loss": -7.559134483337402, "global_step": 37621, "epoch": 223} {"train_loss": -7.839476108551025, "global_step": 37622, "epoch": 223} {"train_loss": -7.703367233276367, "global_step": 37623, "epoch": 223} {"train_loss": -7.691969871520996, "global_step": 37624, "epoch": 223} {"train_loss": -7.947089672088623, "global_step": 37625, "epoch": 223} {"train_loss": -7.655421733856201, "global_step": 37626, "epoch": 223} {"train_loss": -7.730022430419922, "global_step": 37627, "epoch": 223} {"train_loss": -7.8058695793151855, "global_step": 37628, "epoch": 223} {"train_loss": -7.764960289001465, "global_step": 37629, "epoch": 223} {"train_loss": -7.903194427490234, "global_step": 37630, "epoch": 223} {"train_loss": -7.777236262957255, "global_step": 37631, "epoch": 223, "val_loss": 186756.984375} {"train_loss": -7.722975254058838, "global_step": 37632, "epoch": 224} {"train_loss": -7.90589714050293, "global_step": 37633, "epoch": 224} {"train_loss": -7.869463920593262, "global_step": 37634, "epoch": 224} {"train_loss": -7.965641021728516, "global_step": 37635, "epoch": 224} {"train_loss": -7.910400390625, "global_step": 37636, "epoch": 224} {"train_loss": -7.939598083496094, "global_step": 37637, "epoch": 224} {"train_loss": -7.812394618988037, "global_step": 37638, "epoch": 224} {"train_loss": -7.724303245544434, "global_step": 37639, "epoch": 224} {"train_loss": -7.874672889709473, "global_step": 37640, "epoch": 224} {"train_loss": -7.839632987976074, "global_step": 37641, "epoch": 224} {"train_loss": -7.952598571777344, "global_step": 37642, "epoch": 224} {"train_loss": -7.752188205718994, "global_step": 37643, "epoch": 224} {"train_loss": -7.924081325531006, "global_step": 37644, "epoch": 224} {"train_loss": -7.7392802238464355, "global_step": 37645, "epoch": 224} {"train_loss": -8.053133010864258, "global_step": 37646, "epoch": 224} {"train_loss": -8.049201011657715, "global_step": 37647, "epoch": 224} {"train_loss": -8.141443252563477, "global_step": 37648, "epoch": 224} {"train_loss": -8.073310852050781, "global_step": 37649, "epoch": 224} {"train_loss": -7.9585394859313965, "global_step": 37650, "epoch": 224} {"train_loss": -7.848757743835449, "global_step": 37651, "epoch": 224} {"train_loss": -7.781803131103516, "global_step": 37652, "epoch": 224} {"train_loss": -7.833280563354492, "global_step": 37653, "epoch": 224} {"train_loss": -7.901263236999512, "global_step": 37654, "epoch": 224} {"train_loss": -7.875310897827148, "global_step": 37655, "epoch": 224} {"train_loss": -7.841695785522461, "global_step": 37656, "epoch": 224} {"train_loss": -7.663076400756836, "global_step": 37657, "epoch": 224} {"train_loss": -7.942552089691162, "global_step": 37658, "epoch": 224} {"train_loss": -7.9704179763793945, "global_step": 37659, "epoch": 224} {"train_loss": -7.882193565368652, "global_step": 37660, "epoch": 224} {"train_loss": -8.065449714660645, "global_step": 37661, "epoch": 224} {"train_loss": -8.083629608154297, "global_step": 37662, "epoch": 224} {"train_loss": -7.965058326721191, "global_step": 37663, "epoch": 224} {"train_loss": -7.933289527893066, "global_step": 37664, "epoch": 224} {"train_loss": -7.989745616912842, "global_step": 37665, "epoch": 224} {"train_loss": -7.729615211486816, "global_step": 37666, "epoch": 224} {"train_loss": -7.826894283294678, "global_step": 37667, "epoch": 224} {"train_loss": -7.741692543029785, "global_step": 37668, "epoch": 224} {"train_loss": -7.692193031311035, "global_step": 37669, "epoch": 224} {"train_loss": -7.72216796875, "global_step": 37670, "epoch": 224} {"train_loss": -7.801627159118652, "global_step": 37671, "epoch": 224} {"train_loss": -7.726717948913574, "global_step": 37672, "epoch": 224} {"train_loss": -7.750699996948242, "global_step": 37673, "epoch": 224} {"train_loss": -7.723150253295898, "global_step": 37674, "epoch": 224} {"train_loss": -7.759739875793457, "global_step": 37675, "epoch": 224} {"train_loss": -7.858962535858154, "global_step": 37676, "epoch": 224} {"train_loss": -7.8130598068237305, "global_step": 37677, "epoch": 224} {"train_loss": -7.795475006103516, "global_step": 37678, "epoch": 224} {"train_loss": -7.773058891296387, "global_step": 37679, "epoch": 224} {"train_loss": -7.935455799102783, "global_step": 37680, "epoch": 224} {"train_loss": -7.620362758636475, "global_step": 37681, "epoch": 224} {"train_loss": -7.702946662902832, "global_step": 37682, "epoch": 224} {"train_loss": -7.576694488525391, "global_step": 37683, "epoch": 224} {"train_loss": -7.859328269958496, "global_step": 37684, "epoch": 224} {"train_loss": -7.7309770584106445, "global_step": 37685, "epoch": 224} {"train_loss": -7.734716415405273, "global_step": 37686, "epoch": 224} {"train_loss": -7.734654426574707, "global_step": 37687, "epoch": 224} {"train_loss": -7.568869590759277, "global_step": 37688, "epoch": 224} {"train_loss": -7.861746311187744, "global_step": 37689, "epoch": 224} {"train_loss": -7.489975929260254, "global_step": 37690, "epoch": 224} {"train_loss": -7.778253555297852, "global_step": 37691, "epoch": 224} {"train_loss": -7.5073771476745605, "global_step": 37692, "epoch": 224} {"train_loss": -7.718657493591309, "global_step": 37693, "epoch": 224} {"train_loss": -7.652843475341797, "global_step": 37694, "epoch": 224} {"train_loss": -7.520369529724121, "global_step": 37695, "epoch": 224} {"train_loss": -7.703008651733398, "global_step": 37696, "epoch": 224} {"train_loss": -7.820918083190918, "global_step": 37697, "epoch": 224} {"train_loss": -7.454128742218018, "global_step": 37698, "epoch": 224} {"train_loss": -7.8917036056518555, "global_step": 37699, "epoch": 224} {"train_loss": -7.657060623168945, "global_step": 37700, "epoch": 224} {"train_loss": -7.801283836364746, "global_step": 37701, "epoch": 224} {"train_loss": -8.00015640258789, "global_step": 37702, "epoch": 224} {"train_loss": -7.763082504272461, "global_step": 37703, "epoch": 224} {"train_loss": -7.878734588623047, "global_step": 37704, "epoch": 224} {"train_loss": -7.964624404907227, "global_step": 37705, "epoch": 224} {"train_loss": -8.096936225891113, "global_step": 37706, "epoch": 224} {"train_loss": -7.861766815185547, "global_step": 37707, "epoch": 224} {"train_loss": -7.96043586730957, "global_step": 37708, "epoch": 224} {"train_loss": -7.847416877746582, "global_step": 37709, "epoch": 224} {"train_loss": -7.814506530761719, "global_step": 37710, "epoch": 224} {"train_loss": -7.99894380569458, "global_step": 37711, "epoch": 224} {"train_loss": -7.740041732788086, "global_step": 37712, "epoch": 224} {"train_loss": -7.932013988494873, "global_step": 37713, "epoch": 224} {"train_loss": -7.793741226196289, "global_step": 37714, "epoch": 224} {"train_loss": -8.017000198364258, "global_step": 37715, "epoch": 224} {"train_loss": -7.747204780578613, "global_step": 37716, "epoch": 224} {"train_loss": -7.953896522521973, "global_step": 37717, "epoch": 224} {"train_loss": -7.847404479980469, "global_step": 37718, "epoch": 224} {"train_loss": -8.13610553741455, "global_step": 37719, "epoch": 224} {"train_loss": -7.875492095947266, "global_step": 37720, "epoch": 224} {"train_loss": -8.255424499511719, "global_step": 37721, "epoch": 224} {"train_loss": -7.998303413391113, "global_step": 37722, "epoch": 224} {"train_loss": -7.962857723236084, "global_step": 37723, "epoch": 224} {"train_loss": -7.740396499633789, "global_step": 37724, "epoch": 224} {"train_loss": -7.849451065063477, "global_step": 37725, "epoch": 224} {"train_loss": -7.9049296379089355, "global_step": 37726, "epoch": 224} {"train_loss": -8.11154556274414, "global_step": 37727, "epoch": 224} {"train_loss": -7.902379035949707, "global_step": 37728, "epoch": 224} {"train_loss": -8.030370712280273, "global_step": 37729, "epoch": 224} {"train_loss": -7.845272064208984, "global_step": 37730, "epoch": 224} {"train_loss": -7.903695106506348, "global_step": 37731, "epoch": 224} {"train_loss": -8.028142929077148, "global_step": 37732, "epoch": 224} {"train_loss": -7.841033458709717, "global_step": 37733, "epoch": 224} {"train_loss": -7.814483642578125, "global_step": 37734, "epoch": 224} {"train_loss": -7.943084239959717, "global_step": 37735, "epoch": 224} {"train_loss": -7.835859775543213, "global_step": 37736, "epoch": 224} {"train_loss": -7.70211124420166, "global_step": 37737, "epoch": 224} {"train_loss": -7.618722438812256, "global_step": 37738, "epoch": 224} {"train_loss": -7.932827949523926, "global_step": 37739, "epoch": 224} {"train_loss": -7.7540130615234375, "global_step": 37740, "epoch": 224} {"train_loss": -7.602683067321777, "global_step": 37741, "epoch": 224} {"train_loss": -7.803197383880615, "global_step": 37742, "epoch": 224} {"train_loss": -7.79600715637207, "global_step": 37743, "epoch": 224} {"train_loss": -7.521307468414307, "global_step": 37744, "epoch": 224} {"train_loss": -7.720727920532227, "global_step": 37745, "epoch": 224} {"train_loss": -7.824793338775635, "global_step": 37746, "epoch": 224} {"train_loss": -7.768487930297852, "global_step": 37747, "epoch": 224} {"train_loss": -7.805684566497803, "global_step": 37748, "epoch": 224} {"train_loss": -7.9384660720825195, "global_step": 37749, "epoch": 224} {"train_loss": -7.684282302856445, "global_step": 37750, "epoch": 224} {"train_loss": -8.128402709960938, "global_step": 37751, "epoch": 224} {"train_loss": -7.721548557281494, "global_step": 37752, "epoch": 224} {"train_loss": -8.047698020935059, "global_step": 37753, "epoch": 224} {"train_loss": -8.019355773925781, "global_step": 37754, "epoch": 224} {"train_loss": -7.682082176208496, "global_step": 37755, "epoch": 224} {"train_loss": -7.724186420440674, "global_step": 37756, "epoch": 224} {"train_loss": -8.066619873046875, "global_step": 37757, "epoch": 224} {"train_loss": -7.62897253036499, "global_step": 37758, "epoch": 224} {"train_loss": -7.9636640548706055, "global_step": 37759, "epoch": 224} {"train_loss": -8.054842948913574, "global_step": 37760, "epoch": 224} {"train_loss": -7.807772636413574, "global_step": 37761, "epoch": 224} {"train_loss": -7.933041095733643, "global_step": 37762, "epoch": 224} {"train_loss": -7.872335433959961, "global_step": 37763, "epoch": 224} {"train_loss": -7.893031597137451, "global_step": 37764, "epoch": 224} {"train_loss": -7.806249618530273, "global_step": 37765, "epoch": 224} {"train_loss": -7.637971878051758, "global_step": 37766, "epoch": 224} {"train_loss": -7.715252876281738, "global_step": 37767, "epoch": 224} {"train_loss": -8.187108039855957, "global_step": 37768, "epoch": 224} {"train_loss": -7.933038234710693, "global_step": 37769, "epoch": 224} {"train_loss": -7.78846549987793, "global_step": 37770, "epoch": 224} {"train_loss": -7.941859245300293, "global_step": 37771, "epoch": 224} {"train_loss": -7.93955135345459, "global_step": 37772, "epoch": 224} {"train_loss": -7.702822685241699, "global_step": 37773, "epoch": 224} {"train_loss": -7.981409072875977, "global_step": 37774, "epoch": 224} {"train_loss": -7.7076005935668945, "global_step": 37775, "epoch": 224} {"train_loss": -7.808290958404541, "global_step": 37776, "epoch": 224} {"train_loss": -7.4550909996032715, "global_step": 37777, "epoch": 224} {"train_loss": -7.731207847595215, "global_step": 37778, "epoch": 224} {"train_loss": -7.713499069213867, "global_step": 37779, "epoch": 224} {"train_loss": -7.875221252441406, "global_step": 37780, "epoch": 224} {"train_loss": -7.980307579040527, "global_step": 37781, "epoch": 224} {"train_loss": -7.614194393157959, "global_step": 37782, "epoch": 224} {"train_loss": -7.640957832336426, "global_step": 37783, "epoch": 224} {"train_loss": -7.862030506134033, "global_step": 37784, "epoch": 224} {"train_loss": -7.688442230224609, "global_step": 37785, "epoch": 224} {"train_loss": -7.829397201538086, "global_step": 37786, "epoch": 224} {"train_loss": -7.911261081695557, "global_step": 37787, "epoch": 224} {"train_loss": -7.891479969024658, "global_step": 37788, "epoch": 224} {"train_loss": -8.167543411254883, "global_step": 37789, "epoch": 224} {"train_loss": -7.897046089172363, "global_step": 37790, "epoch": 224} {"train_loss": -7.847533226013184, "global_step": 37791, "epoch": 224} {"train_loss": -7.956700801849365, "global_step": 37792, "epoch": 224} {"train_loss": -7.9380784034729, "global_step": 37793, "epoch": 224} {"train_loss": -7.946342468261719, "global_step": 37794, "epoch": 224} {"train_loss": -7.735555648803711, "global_step": 37795, "epoch": 224} {"train_loss": -7.910408973693848, "global_step": 37796, "epoch": 224} {"train_loss": -7.693212509155273, "global_step": 37797, "epoch": 224} {"train_loss": -8.044238090515137, "global_step": 37798, "epoch": 224} {"train_loss": -7.843120935417357, "global_step": 37799, "epoch": 224, "val_loss": 184790.578125} {"train_loss": -7.89998197555542, "global_step": 37800, "epoch": 225} {"train_loss": -7.709959983825684, "global_step": 37801, "epoch": 225} {"train_loss": -8.019688606262207, "global_step": 37802, "epoch": 225} {"train_loss": -7.7141008377075195, "global_step": 37803, "epoch": 225} {"train_loss": -7.71783447265625, "global_step": 37804, "epoch": 225} {"train_loss": -7.790790557861328, "global_step": 37805, "epoch": 225} {"train_loss": -7.723361015319824, "global_step": 37806, "epoch": 225} {"train_loss": -7.88116979598999, "global_step": 37807, "epoch": 225} {"train_loss": -7.864351272583008, "global_step": 37808, "epoch": 225} {"train_loss": -7.864928245544434, "global_step": 37809, "epoch": 225} {"train_loss": -7.734747886657715, "global_step": 37810, "epoch": 225} {"train_loss": -7.675342082977295, "global_step": 37811, "epoch": 225} {"train_loss": -7.695330619812012, "global_step": 37812, "epoch": 225} {"train_loss": -8.099383354187012, "global_step": 37813, "epoch": 225} {"train_loss": -7.839406490325928, "global_step": 37814, "epoch": 225} {"train_loss": -7.748342990875244, "global_step": 37815, "epoch": 225} {"train_loss": -7.767608642578125, "global_step": 37816, "epoch": 225} {"train_loss": -7.7776384353637695, "global_step": 37817, "epoch": 225} {"train_loss": -7.711236953735352, "global_step": 37818, "epoch": 225} {"train_loss": -7.614798545837402, "global_step": 37819, "epoch": 225} {"train_loss": -7.9747419357299805, "global_step": 37820, "epoch": 225} {"train_loss": -7.917401313781738, "global_step": 37821, "epoch": 225} {"train_loss": -8.016454696655273, "global_step": 37822, "epoch": 225} {"train_loss": -7.650200366973877, "global_step": 37823, "epoch": 225} {"train_loss": -7.868030071258545, "global_step": 37824, "epoch": 225} {"train_loss": -7.871568202972412, "global_step": 37825, "epoch": 225} {"train_loss": -7.882358074188232, "global_step": 37826, "epoch": 225} {"train_loss": -7.7127580642700195, "global_step": 37827, "epoch": 225} {"train_loss": -7.819948673248291, "global_step": 37828, "epoch": 225} {"train_loss": -8.083077430725098, "global_step": 37829, "epoch": 225} {"train_loss": -7.886413097381592, "global_step": 37830, "epoch": 225} {"train_loss": -7.949509620666504, "global_step": 37831, "epoch": 225} {"train_loss": -7.8239922523498535, "global_step": 37832, "epoch": 225} {"train_loss": -7.91177225112915, "global_step": 37833, "epoch": 225} {"train_loss": -7.910905838012695, "global_step": 37834, "epoch": 225} {"train_loss": -8.168148040771484, "global_step": 37835, "epoch": 225} {"train_loss": -7.576715469360352, "global_step": 37836, "epoch": 225} {"train_loss": -7.815877437591553, "global_step": 37837, "epoch": 225} {"train_loss": -7.8467512130737305, "global_step": 37838, "epoch": 225} {"train_loss": -7.767218589782715, "global_step": 37839, "epoch": 225} {"train_loss": -7.64636754989624, "global_step": 37840, "epoch": 225} {"train_loss": -7.809003829956055, "global_step": 37841, "epoch": 225} {"train_loss": -7.912447929382324, "global_step": 37842, "epoch": 225} {"train_loss": -7.673139572143555, "global_step": 37843, "epoch": 225} {"train_loss": -7.960790634155273, "global_step": 37844, "epoch": 225} {"train_loss": -8.020833969116211, "global_step": 37845, "epoch": 225} {"train_loss": -8.0811128616333, "global_step": 37846, "epoch": 225} {"train_loss": -7.962193012237549, "global_step": 37847, "epoch": 225} {"train_loss": -7.902885913848877, "global_step": 37848, "epoch": 225} {"train_loss": -7.956562042236328, "global_step": 37849, "epoch": 225} {"train_loss": -7.746698379516602, "global_step": 37850, "epoch": 225} {"train_loss": -8.00304889678955, "global_step": 37851, "epoch": 225} {"train_loss": -7.822120666503906, "global_step": 37852, "epoch": 225} {"train_loss": -7.805929660797119, "global_step": 37853, "epoch": 225} {"train_loss": -7.654270172119141, "global_step": 37854, "epoch": 225} {"train_loss": -7.935826301574707, "global_step": 37855, "epoch": 225} {"train_loss": -7.745234966278076, "global_step": 37856, "epoch": 225} {"train_loss": -7.949653625488281, "global_step": 37857, "epoch": 225} {"train_loss": -7.84285306930542, "global_step": 37858, "epoch": 225} {"train_loss": -7.992101192474365, "global_step": 37859, "epoch": 225} {"train_loss": -8.037246704101562, "global_step": 37860, "epoch": 225} {"train_loss": -7.669983863830566, "global_step": 37861, "epoch": 225} {"train_loss": -7.699673652648926, "global_step": 37862, "epoch": 225} {"train_loss": -7.8279218673706055, "global_step": 37863, "epoch": 225} {"train_loss": -7.571133613586426, "global_step": 37864, "epoch": 225} {"train_loss": -7.850040435791016, "global_step": 37865, "epoch": 225} {"train_loss": -7.89935302734375, "global_step": 37866, "epoch": 225} {"train_loss": -7.851019859313965, "global_step": 37867, "epoch": 225} {"train_loss": -7.782587051391602, "global_step": 37868, "epoch": 225} {"train_loss": -7.791068077087402, "global_step": 37869, "epoch": 225} {"train_loss": -7.649301052093506, "global_step": 37870, "epoch": 225} {"train_loss": -7.785667419433594, "global_step": 37871, "epoch": 225} {"train_loss": -7.771658420562744, "global_step": 37872, "epoch": 225} {"train_loss": -7.55442476272583, "global_step": 37873, "epoch": 225} {"train_loss": -7.6184539794921875, "global_step": 37874, "epoch": 225} {"train_loss": -7.924727439880371, "global_step": 37875, "epoch": 225} {"train_loss": -7.601194381713867, "global_step": 37876, "epoch": 225} {"train_loss": -7.4003448486328125, "global_step": 37877, "epoch": 225} {"train_loss": -7.620491027832031, "global_step": 37878, "epoch": 225} {"train_loss": -7.548343181610107, "global_step": 37879, "epoch": 225} {"train_loss": -7.481855392456055, "global_step": 37880, "epoch": 225} {"train_loss": -7.510817527770996, "global_step": 37881, "epoch": 225} {"train_loss": -7.834433078765869, "global_step": 37882, "epoch": 225} {"train_loss": -7.499473571777344, "global_step": 37883, "epoch": 225} {"train_loss": -7.8680524826049805, "global_step": 37884, "epoch": 225} {"train_loss": -7.705621719360352, "global_step": 37885, "epoch": 225} {"train_loss": -7.894901275634766, "global_step": 37886, "epoch": 225} {"train_loss": -7.8098602294921875, "global_step": 37887, "epoch": 225} {"train_loss": -7.716255187988281, "global_step": 37888, "epoch": 225} {"train_loss": -7.4643120765686035, "global_step": 37889, "epoch": 225} {"train_loss": -7.7231292724609375, "global_step": 37890, "epoch": 225} {"train_loss": -7.781805038452148, "global_step": 37891, "epoch": 225} {"train_loss": -7.829192161560059, "global_step": 37892, "epoch": 225} {"train_loss": -7.661584377288818, "global_step": 37893, "epoch": 225} {"train_loss": -7.8003644943237305, "global_step": 37894, "epoch": 225} {"train_loss": -8.021141052246094, "global_step": 37895, "epoch": 225} {"train_loss": -7.76357364654541, "global_step": 37896, "epoch": 225} {"train_loss": -7.861964225769043, "global_step": 37897, "epoch": 225} {"train_loss": -7.88275146484375, "global_step": 37898, "epoch": 225} {"train_loss": -7.886470317840576, "global_step": 37899, "epoch": 225} {"train_loss": -7.866351127624512, "global_step": 37900, "epoch": 225} {"train_loss": -7.965957164764404, "global_step": 37901, "epoch": 225} {"train_loss": -8.083542823791504, "global_step": 37902, "epoch": 225} {"train_loss": -8.015702247619629, "global_step": 37903, "epoch": 225} {"train_loss": -7.953760623931885, "global_step": 37904, "epoch": 225} {"train_loss": -8.081453323364258, "global_step": 37905, "epoch": 225} {"train_loss": -7.916742324829102, "global_step": 37906, "epoch": 225} {"train_loss": -7.820979595184326, "global_step": 37907, "epoch": 225} {"train_loss": -7.914618015289307, "global_step": 37908, "epoch": 225} {"train_loss": -8.000003814697266, "global_step": 37909, "epoch": 225} {"train_loss": -7.687892913818359, "global_step": 37910, "epoch": 225} {"train_loss": -7.844669342041016, "global_step": 37911, "epoch": 225} {"train_loss": -7.946935176849365, "global_step": 37912, "epoch": 225} {"train_loss": -7.957470893859863, "global_step": 37913, "epoch": 225} {"train_loss": -7.853658199310303, "global_step": 37914, "epoch": 225} {"train_loss": -7.334407806396484, "global_step": 37915, "epoch": 225} {"train_loss": -7.886247634887695, "global_step": 37916, "epoch": 225} {"train_loss": -7.7693352699279785, "global_step": 37917, "epoch": 225} {"train_loss": -7.86739444732666, "global_step": 37918, "epoch": 225} {"train_loss": -8.01081371307373, "global_step": 37919, "epoch": 225} {"train_loss": -7.81362247467041, "global_step": 37920, "epoch": 225} {"train_loss": -7.825185775756836, "global_step": 37921, "epoch": 225} {"train_loss": -7.798658847808838, "global_step": 37922, "epoch": 225} {"train_loss": -7.878857135772705, "global_step": 37923, "epoch": 225} {"train_loss": -8.003690719604492, "global_step": 37924, "epoch": 225} {"train_loss": -7.611435890197754, "global_step": 37925, "epoch": 225} {"train_loss": -7.557094097137451, "global_step": 37926, "epoch": 225} {"train_loss": -7.652735233306885, "global_step": 37927, "epoch": 225} {"train_loss": -7.653253555297852, "global_step": 37928, "epoch": 225} {"train_loss": -7.841431617736816, "global_step": 37929, "epoch": 225} {"train_loss": -7.558048725128174, "global_step": 37930, "epoch": 225} {"train_loss": -7.811863899230957, "global_step": 37931, "epoch": 225} {"train_loss": -7.76705265045166, "global_step": 37932, "epoch": 225} {"train_loss": -7.605303764343262, "global_step": 37933, "epoch": 225} {"train_loss": -7.621678352355957, "global_step": 37934, "epoch": 225} {"train_loss": -7.858750343322754, "global_step": 37935, "epoch": 225} {"train_loss": -7.756446838378906, "global_step": 37936, "epoch": 225} {"train_loss": -7.6421308517456055, "global_step": 37937, "epoch": 225} {"train_loss": -7.623705863952637, "global_step": 37938, "epoch": 225} {"train_loss": -7.4226908683776855, "global_step": 37939, "epoch": 225} {"train_loss": -7.806000232696533, "global_step": 37940, "epoch": 225} {"train_loss": -7.688850402832031, "global_step": 37941, "epoch": 225} {"train_loss": -7.696468353271484, "global_step": 37942, "epoch": 225} {"train_loss": -7.749303340911865, "global_step": 37943, "epoch": 225} {"train_loss": -7.784902572631836, "global_step": 37944, "epoch": 225} {"train_loss": -7.9568634033203125, "global_step": 37945, "epoch": 225} {"train_loss": -7.611145973205566, "global_step": 37946, "epoch": 225} {"train_loss": -7.723857879638672, "global_step": 37947, "epoch": 225} {"train_loss": -7.754697799682617, "global_step": 37948, "epoch": 225} {"train_loss": -7.6830925941467285, "global_step": 37949, "epoch": 225} {"train_loss": -7.820347785949707, "global_step": 37950, "epoch": 225} {"train_loss": -7.81597900390625, "global_step": 37951, "epoch": 225} {"train_loss": -7.66798210144043, "global_step": 37952, "epoch": 225} {"train_loss": -7.6494951248168945, "global_step": 37953, "epoch": 225} {"train_loss": -7.998812675476074, "global_step": 37954, "epoch": 225} {"train_loss": -7.90421199798584, "global_step": 37955, "epoch": 225} {"train_loss": -7.958061218261719, "global_step": 37956, "epoch": 225} {"train_loss": -7.690423011779785, "global_step": 37957, "epoch": 225} {"train_loss": -7.544275283813477, "global_step": 37958, "epoch": 225} {"train_loss": -7.7632856369018555, "global_step": 37959, "epoch": 225} {"train_loss": -7.493442058563232, "global_step": 37960, "epoch": 225} {"train_loss": -7.637984275817871, "global_step": 37961, "epoch": 225} {"train_loss": -7.94862174987793, "global_step": 37962, "epoch": 225} {"train_loss": -7.687418460845947, "global_step": 37963, "epoch": 225} {"train_loss": -7.754709720611572, "global_step": 37964, "epoch": 225} {"train_loss": -7.829843521118164, "global_step": 37965, "epoch": 225} {"train_loss": -7.794844627380371, "global_step": 37966, "epoch": 225} {"train_loss": -7.795115641185215, "global_step": 37967, "epoch": 225, "val_loss": 187330.96875, "train_action_mse_error": 9.693204879760742} {"train_loss": -7.751469612121582, "global_step": 37968, "epoch": 226} {"train_loss": -7.83963680267334, "global_step": 37969, "epoch": 226} {"train_loss": -7.777737140655518, "global_step": 37970, "epoch": 226} {"train_loss": -7.865507125854492, "global_step": 37971, "epoch": 226} {"train_loss": -7.647621154785156, "global_step": 37972, "epoch": 226} {"train_loss": -7.748278617858887, "global_step": 37973, "epoch": 226} {"train_loss": -7.67741584777832, "global_step": 37974, "epoch": 226} {"train_loss": -8.061309814453125, "global_step": 37975, "epoch": 226} {"train_loss": -7.8410468101501465, "global_step": 37976, "epoch": 226} {"train_loss": -7.993083953857422, "global_step": 37977, "epoch": 226} {"train_loss": -7.78029203414917, "global_step": 37978, "epoch": 226} {"train_loss": -7.897250175476074, "global_step": 37979, "epoch": 226} {"train_loss": -7.891606330871582, "global_step": 37980, "epoch": 226} {"train_loss": -7.7607879638671875, "global_step": 37981, "epoch": 226} {"train_loss": -7.955672740936279, "global_step": 37982, "epoch": 226} {"train_loss": -7.7153730392456055, "global_step": 37983, "epoch": 226} {"train_loss": -7.994220733642578, "global_step": 37984, "epoch": 226} {"train_loss": -7.7464799880981445, "global_step": 37985, "epoch": 226} {"train_loss": -7.853170394897461, "global_step": 37986, "epoch": 226} {"train_loss": -7.862103462219238, "global_step": 37987, "epoch": 226} {"train_loss": -7.689672470092773, "global_step": 37988, "epoch": 226} {"train_loss": -7.8346452713012695, "global_step": 37989, "epoch": 226} {"train_loss": -7.922384262084961, "global_step": 37990, "epoch": 226} {"train_loss": -7.8238935470581055, "global_step": 37991, "epoch": 226} {"train_loss": -7.735484600067139, "global_step": 37992, "epoch": 226} {"train_loss": -7.899548053741455, "global_step": 37993, "epoch": 226} {"train_loss": -7.769518852233887, "global_step": 37994, "epoch": 226} {"train_loss": -7.741865158081055, "global_step": 37995, "epoch": 226} {"train_loss": -7.960082054138184, "global_step": 37996, "epoch": 226} {"train_loss": -7.956305503845215, "global_step": 37997, "epoch": 226} {"train_loss": -7.721057415008545, "global_step": 37998, "epoch": 226} {"train_loss": -7.932155132293701, "global_step": 37999, "epoch": 226} {"train_loss": -7.80925178527832, "global_step": 38000, "epoch": 226} {"train_loss": -7.639856338500977, "global_step": 38001, "epoch": 226} {"train_loss": -7.8081207275390625, "global_step": 38002, "epoch": 226} {"train_loss": -7.797173023223877, "global_step": 38003, "epoch": 226} {"train_loss": -7.77869176864624, "global_step": 38004, "epoch": 226} {"train_loss": -7.932084083557129, "global_step": 38005, "epoch": 226} {"train_loss": -7.878690719604492, "global_step": 38006, "epoch": 226} {"train_loss": -8.068487167358398, "global_step": 38007, "epoch": 226} {"train_loss": -7.692330837249756, "global_step": 38008, "epoch": 226} {"train_loss": -7.9980950355529785, "global_step": 38009, "epoch": 226} {"train_loss": -7.788156986236572, "global_step": 38010, "epoch": 226} {"train_loss": -8.02446174621582, "global_step": 38011, "epoch": 226} {"train_loss": -8.010271072387695, "global_step": 38012, "epoch": 226} {"train_loss": -7.886720657348633, "global_step": 38013, "epoch": 226} {"train_loss": -7.904055595397949, "global_step": 38014, "epoch": 226} {"train_loss": -7.786256790161133, "global_step": 38015, "epoch": 226} {"train_loss": -7.897139549255371, "global_step": 38016, "epoch": 226} {"train_loss": -7.975466728210449, "global_step": 38017, "epoch": 226} {"train_loss": -7.989603042602539, "global_step": 38018, "epoch": 226} {"train_loss": -7.891700744628906, "global_step": 38019, "epoch": 226} {"train_loss": -8.008089065551758, "global_step": 38020, "epoch": 226} {"train_loss": -8.03600788116455, "global_step": 38021, "epoch": 226} {"train_loss": -7.901571273803711, "global_step": 38022, "epoch": 226} {"train_loss": -7.958120346069336, "global_step": 38023, "epoch": 226} {"train_loss": -7.740438938140869, "global_step": 38024, "epoch": 226} {"train_loss": -8.128706932067871, "global_step": 38025, "epoch": 226} {"train_loss": -7.790656089782715, "global_step": 38026, "epoch": 226} {"train_loss": -7.952500343322754, "global_step": 38027, "epoch": 226} {"train_loss": -8.017709732055664, "global_step": 38028, "epoch": 226} {"train_loss": -7.766167640686035, "global_step": 38029, "epoch": 226} {"train_loss": -7.857954978942871, "global_step": 38030, "epoch": 226} {"train_loss": -7.851787090301514, "global_step": 38031, "epoch": 226} {"train_loss": -7.660662651062012, "global_step": 38032, "epoch": 226} {"train_loss": -7.825323581695557, "global_step": 38033, "epoch": 226} {"train_loss": -7.755171298980713, "global_step": 38034, "epoch": 226} {"train_loss": -7.627723693847656, "global_step": 38035, "epoch": 226} {"train_loss": -7.6472578048706055, "global_step": 38036, "epoch": 226} {"train_loss": -7.641165733337402, "global_step": 38037, "epoch": 226} {"train_loss": -7.526239395141602, "global_step": 38038, "epoch": 226} {"train_loss": -7.670644760131836, "global_step": 38039, "epoch": 226} {"train_loss": -7.794586181640625, "global_step": 38040, "epoch": 226} {"train_loss": -7.7374725341796875, "global_step": 38041, "epoch": 226} {"train_loss": -7.641568183898926, "global_step": 38042, "epoch": 226} {"train_loss": -7.969118595123291, "global_step": 38043, "epoch": 226} {"train_loss": -7.626147747039795, "global_step": 38044, "epoch": 226} {"train_loss": -7.791834354400635, "global_step": 38045, "epoch": 226} {"train_loss": -7.829074859619141, "global_step": 38046, "epoch": 226} {"train_loss": -7.644486904144287, "global_step": 38047, "epoch": 226} {"train_loss": -7.6783928871154785, "global_step": 38048, "epoch": 226} {"train_loss": -7.721170902252197, "global_step": 38049, "epoch": 226} {"train_loss": -7.62912654876709, "global_step": 38050, "epoch": 226} {"train_loss": -7.711082935333252, "global_step": 38051, "epoch": 226} {"train_loss": -7.5847578048706055, "global_step": 38052, "epoch": 226} {"train_loss": -7.889314651489258, "global_step": 38053, "epoch": 226} {"train_loss": -7.847620010375977, "global_step": 38054, "epoch": 226} {"train_loss": -7.886585235595703, "global_step": 38055, "epoch": 226} {"train_loss": -7.852827548980713, "global_step": 38056, "epoch": 226} {"train_loss": -7.84329891204834, "global_step": 38057, "epoch": 226} {"train_loss": -7.943689346313477, "global_step": 38058, "epoch": 226} {"train_loss": -7.864912986755371, "global_step": 38059, "epoch": 226} {"train_loss": -7.864941596984863, "global_step": 38060, "epoch": 226} {"train_loss": -7.84290885925293, "global_step": 38061, "epoch": 226} {"train_loss": -7.684999465942383, "global_step": 38062, "epoch": 226} {"train_loss": -8.04704475402832, "global_step": 38063, "epoch": 226} {"train_loss": -7.842735290527344, "global_step": 38064, "epoch": 226} {"train_loss": -7.905359745025635, "global_step": 38065, "epoch": 226} {"train_loss": -7.933929443359375, "global_step": 38066, "epoch": 226} {"train_loss": -8.067216873168945, "global_step": 38067, "epoch": 226} {"train_loss": -7.7411932945251465, "global_step": 38068, "epoch": 226} {"train_loss": -7.719204902648926, "global_step": 38069, "epoch": 226} {"train_loss": -7.394257545471191, "global_step": 38070, "epoch": 226} {"train_loss": -7.773233413696289, "global_step": 38071, "epoch": 226} {"train_loss": -7.4198760986328125, "global_step": 38072, "epoch": 226} {"train_loss": -7.66646671295166, "global_step": 38073, "epoch": 226} {"train_loss": -7.778843402862549, "global_step": 38074, "epoch": 226} {"train_loss": -7.795015335083008, "global_step": 38075, "epoch": 226} {"train_loss": -7.652842044830322, "global_step": 38076, "epoch": 226} {"train_loss": -7.725922107696533, "global_step": 38077, "epoch": 226} {"train_loss": -7.2563018798828125, "global_step": 38078, "epoch": 226} {"train_loss": -7.703308582305908, "global_step": 38079, "epoch": 226} {"train_loss": -7.527624607086182, "global_step": 38080, "epoch": 226} {"train_loss": -7.878562927246094, "global_step": 38081, "epoch": 226} {"train_loss": -7.6758294105529785, "global_step": 38082, "epoch": 226} {"train_loss": -7.662563800811768, "global_step": 38083, "epoch": 226} {"train_loss": -7.699954986572266, "global_step": 38084, "epoch": 226} {"train_loss": -7.533502578735352, "global_step": 38085, "epoch": 226} {"train_loss": -7.788327217102051, "global_step": 38086, "epoch": 226} {"train_loss": -7.8374528884887695, "global_step": 38087, "epoch": 226} {"train_loss": -7.94382905960083, "global_step": 38088, "epoch": 226} {"train_loss": -7.681292533874512, "global_step": 38089, "epoch": 226} {"train_loss": -7.8942179679870605, "global_step": 38090, "epoch": 226} {"train_loss": -7.731599807739258, "global_step": 38091, "epoch": 226} {"train_loss": -8.05046272277832, "global_step": 38092, "epoch": 226} {"train_loss": -7.607593536376953, "global_step": 38093, "epoch": 226} {"train_loss": -7.942124366760254, "global_step": 38094, "epoch": 226} {"train_loss": -7.756927013397217, "global_step": 38095, "epoch": 226} {"train_loss": -7.98936653137207, "global_step": 38096, "epoch": 226} {"train_loss": -7.863554954528809, "global_step": 38097, "epoch": 226} {"train_loss": -7.855202674865723, "global_step": 38098, "epoch": 226} {"train_loss": -7.901442527770996, "global_step": 38099, "epoch": 226} {"train_loss": -7.838756561279297, "global_step": 38100, "epoch": 226} {"train_loss": -8.025579452514648, "global_step": 38101, "epoch": 226} {"train_loss": -7.966160774230957, "global_step": 38102, "epoch": 226} {"train_loss": -7.8874664306640625, "global_step": 38103, "epoch": 226} {"train_loss": -7.873090744018555, "global_step": 38104, "epoch": 226} {"train_loss": -7.85842752456665, "global_step": 38105, "epoch": 226} {"train_loss": -7.661519527435303, "global_step": 38106, "epoch": 226} {"train_loss": -7.7293500900268555, "global_step": 38107, "epoch": 226} {"train_loss": -8.071237564086914, "global_step": 38108, "epoch": 226} {"train_loss": -7.83120059967041, "global_step": 38109, "epoch": 226} {"train_loss": -7.97750997543335, "global_step": 38110, "epoch": 226} {"train_loss": -7.821235656738281, "global_step": 38111, "epoch": 226} {"train_loss": -7.988861083984375, "global_step": 38112, "epoch": 226} {"train_loss": -7.963354110717773, "global_step": 38113, "epoch": 226} {"train_loss": -8.03506088256836, "global_step": 38114, "epoch": 226} {"train_loss": -8.117944717407227, "global_step": 38115, "epoch": 226} {"train_loss": -8.024843215942383, "global_step": 38116, "epoch": 226} {"train_loss": -8.04222297668457, "global_step": 38117, "epoch": 226} {"train_loss": -7.741394519805908, "global_step": 38118, "epoch": 226} {"train_loss": -8.16618824005127, "global_step": 38119, "epoch": 226} {"train_loss": -7.7290544509887695, "global_step": 38120, "epoch": 226} {"train_loss": -7.989829063415527, "global_step": 38121, "epoch": 226} {"train_loss": -8.04619312286377, "global_step": 38122, "epoch": 226} {"train_loss": -7.858244895935059, "global_step": 38123, "epoch": 226} {"train_loss": -8.03207778930664, "global_step": 38124, "epoch": 226} {"train_loss": -7.746767997741699, "global_step": 38125, "epoch": 226} {"train_loss": -8.051399230957031, "global_step": 38126, "epoch": 226} {"train_loss": -7.848492622375488, "global_step": 38127, "epoch": 226} {"train_loss": -8.000255584716797, "global_step": 38128, "epoch": 226} {"train_loss": -7.901509761810303, "global_step": 38129, "epoch": 226} {"train_loss": -7.8499531745910645, "global_step": 38130, "epoch": 226} {"train_loss": -7.638564109802246, "global_step": 38131, "epoch": 226} {"train_loss": -8.004415512084961, "global_step": 38132, "epoch": 226} {"train_loss": -7.65440559387207, "global_step": 38133, "epoch": 226} {"train_loss": -7.87969970703125, "global_step": 38134, "epoch": 226} {"train_loss": -7.829281792754219, "global_step": 38135, "epoch": 226, "val_loss": 184743.921875} {"train_loss": -7.631237030029297, "global_step": 38136, "epoch": 227} {"train_loss": -7.523454666137695, "global_step": 38137, "epoch": 227} {"train_loss": -7.972060680389404, "global_step": 38138, "epoch": 227} {"train_loss": -7.65074348449707, "global_step": 38139, "epoch": 227} {"train_loss": -7.8589019775390625, "global_step": 38140, "epoch": 227} {"train_loss": -7.524883270263672, "global_step": 38141, "epoch": 227} {"train_loss": -7.61265754699707, "global_step": 38142, "epoch": 227} {"train_loss": -7.6921305656433105, "global_step": 38143, "epoch": 227} {"train_loss": -7.623899459838867, "global_step": 38144, "epoch": 227} {"train_loss": -7.954122543334961, "global_step": 38145, "epoch": 227} {"train_loss": -7.494098663330078, "global_step": 38146, "epoch": 227} {"train_loss": -7.627640724182129, "global_step": 38147, "epoch": 227} {"train_loss": -7.616291046142578, "global_step": 38148, "epoch": 227} {"train_loss": -7.753313064575195, "global_step": 38149, "epoch": 227} {"train_loss": -7.693904876708984, "global_step": 38150, "epoch": 227} {"train_loss": -7.793472766876221, "global_step": 38151, "epoch": 227} {"train_loss": -7.724931716918945, "global_step": 38152, "epoch": 227} {"train_loss": -7.771105766296387, "global_step": 38153, "epoch": 227} {"train_loss": -7.739812850952148, "global_step": 38154, "epoch": 227} {"train_loss": -7.755271911621094, "global_step": 38155, "epoch": 227} {"train_loss": -7.889259338378906, "global_step": 38156, "epoch": 227} {"train_loss": -7.861905097961426, "global_step": 38157, "epoch": 227} {"train_loss": -7.827663898468018, "global_step": 38158, "epoch": 227} {"train_loss": -7.954630374908447, "global_step": 38159, "epoch": 227} {"train_loss": -8.068674087524414, "global_step": 38160, "epoch": 227} {"train_loss": -8.039499282836914, "global_step": 38161, "epoch": 227} {"train_loss": -8.07082748413086, "global_step": 38162, "epoch": 227} {"train_loss": -7.760120391845703, "global_step": 38163, "epoch": 227} {"train_loss": -7.945802688598633, "global_step": 38164, "epoch": 227} {"train_loss": -7.674046516418457, "global_step": 38165, "epoch": 227} {"train_loss": -7.994848251342773, "global_step": 38166, "epoch": 227} {"train_loss": -7.880551338195801, "global_step": 38167, "epoch": 227} {"train_loss": -7.7104902267456055, "global_step": 38168, "epoch": 227} {"train_loss": -7.888551712036133, "global_step": 38169, "epoch": 227} {"train_loss": -7.796941757202148, "global_step": 38170, "epoch": 227} {"train_loss": -7.596002101898193, "global_step": 38171, "epoch": 227} {"train_loss": -7.678514003753662, "global_step": 38172, "epoch": 227} {"train_loss": -7.882746696472168, "global_step": 38173, "epoch": 227} {"train_loss": -7.809991836547852, "global_step": 38174, "epoch": 227} {"train_loss": -7.763434410095215, "global_step": 38175, "epoch": 227} {"train_loss": -8.121942520141602, "global_step": 38176, "epoch": 227} {"train_loss": -7.831793785095215, "global_step": 38177, "epoch": 227} {"train_loss": -7.764853000640869, "global_step": 38178, "epoch": 227} {"train_loss": -7.9976043701171875, "global_step": 38179, "epoch": 227} {"train_loss": -7.7410736083984375, "global_step": 38180, "epoch": 227} {"train_loss": -7.993871688842773, "global_step": 38181, "epoch": 227} {"train_loss": -7.848579406738281, "global_step": 38182, "epoch": 227} {"train_loss": -8.016586303710938, "global_step": 38183, "epoch": 227} {"train_loss": -8.052648544311523, "global_step": 38184, "epoch": 227} {"train_loss": -8.226884841918945, "global_step": 38185, "epoch": 227} {"train_loss": -7.7477827072143555, "global_step": 38186, "epoch": 227} {"train_loss": -7.8168134689331055, "global_step": 38187, "epoch": 227} {"train_loss": -7.788626670837402, "global_step": 38188, "epoch": 227} {"train_loss": -7.550640106201172, "global_step": 38189, "epoch": 227} {"train_loss": -7.9727349281311035, "global_step": 38190, "epoch": 227} {"train_loss": -7.835537910461426, "global_step": 38191, "epoch": 227} {"train_loss": -7.766378402709961, "global_step": 38192, "epoch": 227} {"train_loss": -7.979548931121826, "global_step": 38193, "epoch": 227} {"train_loss": -7.914376258850098, "global_step": 38194, "epoch": 227} {"train_loss": -7.8194580078125, "global_step": 38195, "epoch": 227} {"train_loss": -7.713094234466553, "global_step": 38196, "epoch": 227} {"train_loss": -7.94765043258667, "global_step": 38197, "epoch": 227} {"train_loss": -7.8046488761901855, "global_step": 38198, "epoch": 227} {"train_loss": -7.866682052612305, "global_step": 38199, "epoch": 227} {"train_loss": -7.670254707336426, "global_step": 38200, "epoch": 227} {"train_loss": -7.752180099487305, "global_step": 38201, "epoch": 227} {"train_loss": -7.809791564941406, "global_step": 38202, "epoch": 227} {"train_loss": -7.868908405303955, "global_step": 38203, "epoch": 227} {"train_loss": -7.704204559326172, "global_step": 38204, "epoch": 227} {"train_loss": -7.665158748626709, "global_step": 38205, "epoch": 227} {"train_loss": -7.516355037689209, "global_step": 38206, "epoch": 227} {"train_loss": -7.797982215881348, "global_step": 38207, "epoch": 227} {"train_loss": -7.490753173828125, "global_step": 38208, "epoch": 227} {"train_loss": -7.682352542877197, "global_step": 38209, "epoch": 227} {"train_loss": -7.646662712097168, "global_step": 38210, "epoch": 227} {"train_loss": -7.6119279861450195, "global_step": 38211, "epoch": 227} {"train_loss": -7.492730140686035, "global_step": 38212, "epoch": 227} {"train_loss": -7.677868843078613, "global_step": 38213, "epoch": 227} {"train_loss": -7.821952819824219, "global_step": 38214, "epoch": 227} {"train_loss": -7.688360691070557, "global_step": 38215, "epoch": 227} {"train_loss": -7.581640243530273, "global_step": 38216, "epoch": 227} {"train_loss": -7.787199974060059, "global_step": 38217, "epoch": 227} {"train_loss": -7.961092948913574, "global_step": 38218, "epoch": 227} {"train_loss": -7.7725396156311035, "global_step": 38219, "epoch": 227} {"train_loss": -7.808653831481934, "global_step": 38220, "epoch": 227} {"train_loss": -7.501964092254639, "global_step": 38221, "epoch": 227} {"train_loss": -7.899527549743652, "global_step": 38222, "epoch": 227} {"train_loss": -7.538913249969482, "global_step": 38223, "epoch": 227} {"train_loss": -7.90459680557251, "global_step": 38224, "epoch": 227} {"train_loss": -7.8400702476501465, "global_step": 38225, "epoch": 227} {"train_loss": -7.912350654602051, "global_step": 38226, "epoch": 227} {"train_loss": -7.648024082183838, "global_step": 38227, "epoch": 227} {"train_loss": -7.700559139251709, "global_step": 38228, "epoch": 227} {"train_loss": -7.863008975982666, "global_step": 38229, "epoch": 227} {"train_loss": -7.863749027252197, "global_step": 38230, "epoch": 227} {"train_loss": -8.136833190917969, "global_step": 38231, "epoch": 227} {"train_loss": -7.949149131774902, "global_step": 38232, "epoch": 227} {"train_loss": -8.031097412109375, "global_step": 38233, "epoch": 227} {"train_loss": -7.997679710388184, "global_step": 38234, "epoch": 227} {"train_loss": -7.990273952484131, "global_step": 38235, "epoch": 227} {"train_loss": -7.923276901245117, "global_step": 38236, "epoch": 227} {"train_loss": -7.6423659324646, "global_step": 38237, "epoch": 227} {"train_loss": -8.103675842285156, "global_step": 38238, "epoch": 227} {"train_loss": -7.741446495056152, "global_step": 38239, "epoch": 227} {"train_loss": -7.898631572723389, "global_step": 38240, "epoch": 227} {"train_loss": -8.001643180847168, "global_step": 38241, "epoch": 227} {"train_loss": -7.851361274719238, "global_step": 38242, "epoch": 227} {"train_loss": -7.894909858703613, "global_step": 38243, "epoch": 227} {"train_loss": -7.691286087036133, "global_step": 38244, "epoch": 227} {"train_loss": -7.780544757843018, "global_step": 38245, "epoch": 227} {"train_loss": -7.9109649658203125, "global_step": 38246, "epoch": 227} {"train_loss": -8.015823364257812, "global_step": 38247, "epoch": 227} {"train_loss": -7.835369110107422, "global_step": 38248, "epoch": 227} {"train_loss": -7.845331192016602, "global_step": 38249, "epoch": 227} {"train_loss": -7.768550395965576, "global_step": 38250, "epoch": 227} {"train_loss": -7.904129505157471, "global_step": 38251, "epoch": 227} {"train_loss": -7.771007061004639, "global_step": 38252, "epoch": 227} {"train_loss": -7.8914031982421875, "global_step": 38253, "epoch": 227} {"train_loss": -7.636750221252441, "global_step": 38254, "epoch": 227} {"train_loss": -7.60048770904541, "global_step": 38255, "epoch": 227} {"train_loss": -7.607883930206299, "global_step": 38256, "epoch": 227} {"train_loss": -8.013851165771484, "global_step": 38257, "epoch": 227} {"train_loss": -7.677996635437012, "global_step": 38258, "epoch": 227} {"train_loss": -7.768450736999512, "global_step": 38259, "epoch": 227} {"train_loss": -7.433274269104004, "global_step": 38260, "epoch": 227} {"train_loss": -7.909761428833008, "global_step": 38261, "epoch": 227} {"train_loss": -7.832117080688477, "global_step": 38262, "epoch": 227} {"train_loss": -7.48822021484375, "global_step": 38263, "epoch": 227} {"train_loss": -7.830149173736572, "global_step": 38264, "epoch": 227} {"train_loss": -7.854401111602783, "global_step": 38265, "epoch": 227} {"train_loss": -7.833961486816406, "global_step": 38266, "epoch": 227} {"train_loss": -7.839776992797852, "global_step": 38267, "epoch": 227} {"train_loss": -7.7576093673706055, "global_step": 38268, "epoch": 227} {"train_loss": -7.8673810958862305, "global_step": 38269, "epoch": 227} {"train_loss": -7.8190388679504395, "global_step": 38270, "epoch": 227} {"train_loss": -7.810501575469971, "global_step": 38271, "epoch": 227} {"train_loss": -7.976552486419678, "global_step": 38272, "epoch": 227} {"train_loss": -7.955511569976807, "global_step": 38273, "epoch": 227} {"train_loss": -8.07746696472168, "global_step": 38274, "epoch": 227} {"train_loss": -7.862483978271484, "global_step": 38275, "epoch": 227} {"train_loss": -8.047159194946289, "global_step": 38276, "epoch": 227} {"train_loss": -8.082746505737305, "global_step": 38277, "epoch": 227} {"train_loss": -7.852173805236816, "global_step": 38278, "epoch": 227} {"train_loss": -8.067643165588379, "global_step": 38279, "epoch": 227} {"train_loss": -7.958765983581543, "global_step": 38280, "epoch": 227} {"train_loss": -7.973109245300293, "global_step": 38281, "epoch": 227} {"train_loss": -7.939829349517822, "global_step": 38282, "epoch": 227} {"train_loss": -8.01718521118164, "global_step": 38283, "epoch": 227} {"train_loss": -8.06397819519043, "global_step": 38284, "epoch": 227} {"train_loss": -8.20235824584961, "global_step": 38285, "epoch": 227} {"train_loss": -8.083148956298828, "global_step": 38286, "epoch": 227} {"train_loss": -8.10529899597168, "global_step": 38287, "epoch": 227} {"train_loss": -7.922622203826904, "global_step": 38288, "epoch": 227} {"train_loss": -8.143148422241211, "global_step": 38289, "epoch": 227} {"train_loss": -8.00376033782959, "global_step": 38290, "epoch": 227} {"train_loss": -8.078520774841309, "global_step": 38291, "epoch": 227} {"train_loss": -8.008922576904297, "global_step": 38292, "epoch": 227} {"train_loss": -8.001704216003418, "global_step": 38293, "epoch": 227} {"train_loss": -7.941093444824219, "global_step": 38294, "epoch": 227} {"train_loss": -7.901426315307617, "global_step": 38295, "epoch": 227} {"train_loss": -7.947290420532227, "global_step": 38296, "epoch": 227} {"train_loss": -8.129894256591797, "global_step": 38297, "epoch": 227} {"train_loss": -8.19207763671875, "global_step": 38298, "epoch": 227} {"train_loss": -7.708774089813232, "global_step": 38299, "epoch": 227} {"train_loss": -7.993807315826416, "global_step": 38300, "epoch": 227} {"train_loss": -7.7816901206970215, "global_step": 38301, "epoch": 227} {"train_loss": -7.96392297744751, "global_step": 38302, "epoch": 227} {"train_loss": -7.834169132368905, "global_step": 38303, "epoch": 227, "val_loss": 187667.84375} {"train_loss": -7.482182502746582, "global_step": 38304, "epoch": 228} {"train_loss": -7.7374372482299805, "global_step": 38305, "epoch": 228} {"train_loss": -7.636945724487305, "global_step": 38306, "epoch": 228} {"train_loss": -7.791621208190918, "global_step": 38307, "epoch": 228} {"train_loss": -7.82400369644165, "global_step": 38308, "epoch": 228} {"train_loss": -7.802976608276367, "global_step": 38309, "epoch": 228} {"train_loss": -7.6229095458984375, "global_step": 38310, "epoch": 228} {"train_loss": -7.832035541534424, "global_step": 38311, "epoch": 228} {"train_loss": -7.857222557067871, "global_step": 38312, "epoch": 228} {"train_loss": -7.623353004455566, "global_step": 38313, "epoch": 228} {"train_loss": -7.970293045043945, "global_step": 38314, "epoch": 228} {"train_loss": -7.492801666259766, "global_step": 38315, "epoch": 228} {"train_loss": -7.74107551574707, "global_step": 38316, "epoch": 228} {"train_loss": -7.64448881149292, "global_step": 38317, "epoch": 228} {"train_loss": -7.98429536819458, "global_step": 38318, "epoch": 228} {"train_loss": -7.865720748901367, "global_step": 38319, "epoch": 228} {"train_loss": -8.000835418701172, "global_step": 38320, "epoch": 228} {"train_loss": -7.783657073974609, "global_step": 38321, "epoch": 228} {"train_loss": -7.752730369567871, "global_step": 38322, "epoch": 228} {"train_loss": -7.84287166595459, "global_step": 38323, "epoch": 228} {"train_loss": -7.778224945068359, "global_step": 38324, "epoch": 228} {"train_loss": -7.454283714294434, "global_step": 38325, "epoch": 228} {"train_loss": -7.74138879776001, "global_step": 38326, "epoch": 228} {"train_loss": -7.909951210021973, "global_step": 38327, "epoch": 228} {"train_loss": -7.615720748901367, "global_step": 38328, "epoch": 228} {"train_loss": -7.864768981933594, "global_step": 38329, "epoch": 228} {"train_loss": -7.764590740203857, "global_step": 38330, "epoch": 228} {"train_loss": -7.999094486236572, "global_step": 38331, "epoch": 228} {"train_loss": -8.042997360229492, "global_step": 38332, "epoch": 228} {"train_loss": -7.939104080200195, "global_step": 38333, "epoch": 228} {"train_loss": -7.876389503479004, "global_step": 38334, "epoch": 228} {"train_loss": -7.812139987945557, "global_step": 38335, "epoch": 228} {"train_loss": -7.5450639724731445, "global_step": 38336, "epoch": 228} {"train_loss": -7.71242094039917, "global_step": 38337, "epoch": 228} {"train_loss": -7.8735246658325195, "global_step": 38338, "epoch": 228} {"train_loss": -7.993330955505371, "global_step": 38339, "epoch": 228} {"train_loss": -7.905719757080078, "global_step": 38340, "epoch": 228} {"train_loss": -7.8881425857543945, "global_step": 38341, "epoch": 228} {"train_loss": -7.782999038696289, "global_step": 38342, "epoch": 228} {"train_loss": -7.646934509277344, "global_step": 38343, "epoch": 228} {"train_loss": -7.9247307777404785, "global_step": 38344, "epoch": 228} {"train_loss": -7.865757942199707, "global_step": 38345, "epoch": 228} {"train_loss": -7.969573974609375, "global_step": 38346, "epoch": 228} {"train_loss": -7.629016399383545, "global_step": 38347, "epoch": 228} {"train_loss": -7.708958625793457, "global_step": 38348, "epoch": 228} {"train_loss": -7.874720573425293, "global_step": 38349, "epoch": 228} {"train_loss": -8.076940536499023, "global_step": 38350, "epoch": 228} {"train_loss": -7.8308563232421875, "global_step": 38351, "epoch": 228} {"train_loss": -8.110387802124023, "global_step": 38352, "epoch": 228} {"train_loss": -7.851820468902588, "global_step": 38353, "epoch": 228} {"train_loss": -7.927221298217773, "global_step": 38354, "epoch": 228} {"train_loss": -7.804309368133545, "global_step": 38355, "epoch": 228} {"train_loss": -7.892791748046875, "global_step": 38356, "epoch": 228} {"train_loss": -7.710376739501953, "global_step": 38357, "epoch": 228} {"train_loss": -8.034364700317383, "global_step": 38358, "epoch": 228} {"train_loss": -7.730506896972656, "global_step": 38359, "epoch": 228} {"train_loss": -7.934687614440918, "global_step": 38360, "epoch": 228} {"train_loss": -7.99770450592041, "global_step": 38361, "epoch": 228} {"train_loss": -8.003830909729004, "global_step": 38362, "epoch": 228} {"train_loss": -7.828744411468506, "global_step": 38363, "epoch": 228} {"train_loss": -7.974224090576172, "global_step": 38364, "epoch": 228} {"train_loss": -7.9981560707092285, "global_step": 38365, "epoch": 228} {"train_loss": -7.611296653747559, "global_step": 38366, "epoch": 228} {"train_loss": -7.820367336273193, "global_step": 38367, "epoch": 228} {"train_loss": -7.8086442947387695, "global_step": 38368, "epoch": 228} {"train_loss": -7.754481315612793, "global_step": 38369, "epoch": 228} {"train_loss": -7.7002692222595215, "global_step": 38370, "epoch": 228} {"train_loss": -7.795801162719727, "global_step": 38371, "epoch": 228} {"train_loss": -7.8235764503479, "global_step": 38372, "epoch": 228} {"train_loss": -7.8523101806640625, "global_step": 38373, "epoch": 228} {"train_loss": -7.932188987731934, "global_step": 38374, "epoch": 228} {"train_loss": -7.914941787719727, "global_step": 38375, "epoch": 228} {"train_loss": -7.655185699462891, "global_step": 38376, "epoch": 228} {"train_loss": -7.994400501251221, "global_step": 38377, "epoch": 228} {"train_loss": -7.836267471313477, "global_step": 38378, "epoch": 228} {"train_loss": -8.008415222167969, "global_step": 38379, "epoch": 228} {"train_loss": -7.846935272216797, "global_step": 38380, "epoch": 228} {"train_loss": -7.612929344177246, "global_step": 38381, "epoch": 228} {"train_loss": -7.772383689880371, "global_step": 38382, "epoch": 228} {"train_loss": -7.972273826599121, "global_step": 38383, "epoch": 228} {"train_loss": -7.663069725036621, "global_step": 38384, "epoch": 228} {"train_loss": -7.714334487915039, "global_step": 38385, "epoch": 228} {"train_loss": -8.061909675598145, "global_step": 38386, "epoch": 228} {"train_loss": -7.769238471984863, "global_step": 38387, "epoch": 228} {"train_loss": -7.873649597167969, "global_step": 38388, "epoch": 228} {"train_loss": -7.903656959533691, "global_step": 38389, "epoch": 228} {"train_loss": -7.746640205383301, "global_step": 38390, "epoch": 228} {"train_loss": -7.461981773376465, "global_step": 38391, "epoch": 228} {"train_loss": -7.739097595214844, "global_step": 38392, "epoch": 228} {"train_loss": -7.531689167022705, "global_step": 38393, "epoch": 228} {"train_loss": -7.764255046844482, "global_step": 38394, "epoch": 228} {"train_loss": -7.933352947235107, "global_step": 38395, "epoch": 228} {"train_loss": -7.269526958465576, "global_step": 38396, "epoch": 228} {"train_loss": -7.878547668457031, "global_step": 38397, "epoch": 228} {"train_loss": -7.701988220214844, "global_step": 38398, "epoch": 228} {"train_loss": -7.5458526611328125, "global_step": 38399, "epoch": 228} {"train_loss": -7.594428539276123, "global_step": 38400, "epoch": 228} {"train_loss": -7.99171257019043, "global_step": 38401, "epoch": 228} {"train_loss": -7.650850296020508, "global_step": 38402, "epoch": 228} {"train_loss": -7.602062702178955, "global_step": 38403, "epoch": 228} {"train_loss": -7.728692054748535, "global_step": 38404, "epoch": 228} {"train_loss": -7.935375213623047, "global_step": 38405, "epoch": 228} {"train_loss": -8.001359939575195, "global_step": 38406, "epoch": 228} {"train_loss": -7.922159194946289, "global_step": 38407, "epoch": 228} {"train_loss": -7.835704803466797, "global_step": 38408, "epoch": 228} {"train_loss": -7.814419746398926, "global_step": 38409, "epoch": 228} {"train_loss": -7.829891681671143, "global_step": 38410, "epoch": 228} {"train_loss": -7.844844341278076, "global_step": 38411, "epoch": 228} {"train_loss": -7.866878509521484, "global_step": 38412, "epoch": 228} {"train_loss": -7.804405212402344, "global_step": 38413, "epoch": 228} {"train_loss": -7.850471496582031, "global_step": 38414, "epoch": 228} {"train_loss": -7.844670295715332, "global_step": 38415, "epoch": 228} {"train_loss": -7.857503890991211, "global_step": 38416, "epoch": 228} {"train_loss": -8.072663307189941, "global_step": 38417, "epoch": 228} {"train_loss": -7.996818542480469, "global_step": 38418, "epoch": 228} {"train_loss": -7.657244682312012, "global_step": 38419, "epoch": 228} {"train_loss": -7.882448196411133, "global_step": 38420, "epoch": 228} {"train_loss": -7.762657165527344, "global_step": 38421, "epoch": 228} {"train_loss": -7.73805046081543, "global_step": 38422, "epoch": 228} {"train_loss": -7.869856834411621, "global_step": 38423, "epoch": 228} {"train_loss": -7.941781044006348, "global_step": 38424, "epoch": 228} {"train_loss": -7.733300685882568, "global_step": 38425, "epoch": 228} {"train_loss": -8.014039993286133, "global_step": 38426, "epoch": 228} {"train_loss": -7.88301420211792, "global_step": 38427, "epoch": 228} {"train_loss": -7.637160301208496, "global_step": 38428, "epoch": 228} {"train_loss": -7.816037178039551, "global_step": 38429, "epoch": 228} {"train_loss": -7.7437214851379395, "global_step": 38430, "epoch": 228} {"train_loss": -7.690068244934082, "global_step": 38431, "epoch": 228} {"train_loss": -7.834808349609375, "global_step": 38432, "epoch": 228} {"train_loss": -7.925936222076416, "global_step": 38433, "epoch": 228} {"train_loss": -7.987097263336182, "global_step": 38434, "epoch": 228} {"train_loss": -7.8885040283203125, "global_step": 38435, "epoch": 228} {"train_loss": -7.6150126457214355, "global_step": 38436, "epoch": 228} {"train_loss": -7.939671039581299, "global_step": 38437, "epoch": 228} {"train_loss": -7.87285041809082, "global_step": 38438, "epoch": 228} {"train_loss": -7.75803279876709, "global_step": 38439, "epoch": 228} {"train_loss": -7.902912139892578, "global_step": 38440, "epoch": 228} {"train_loss": -7.887211799621582, "global_step": 38441, "epoch": 228} {"train_loss": -7.982851982116699, "global_step": 38442, "epoch": 228} {"train_loss": -8.012838363647461, "global_step": 38443, "epoch": 228} {"train_loss": -7.775639057159424, "global_step": 38444, "epoch": 228} {"train_loss": -7.938206672668457, "global_step": 38445, "epoch": 228} {"train_loss": -7.930400848388672, "global_step": 38446, "epoch": 228} {"train_loss": -7.912437438964844, "global_step": 38447, "epoch": 228} {"train_loss": -8.1272611618042, "global_step": 38448, "epoch": 228} {"train_loss": -7.613402366638184, "global_step": 38449, "epoch": 228} {"train_loss": -8.098493576049805, "global_step": 38450, "epoch": 228} {"train_loss": -7.862946510314941, "global_step": 38451, "epoch": 228} {"train_loss": -7.688455581665039, "global_step": 38452, "epoch": 228} {"train_loss": -7.838898181915283, "global_step": 38453, "epoch": 228} {"train_loss": -7.817355155944824, "global_step": 38454, "epoch": 228} {"train_loss": -7.887276649475098, "global_step": 38455, "epoch": 228} {"train_loss": -7.954873085021973, "global_step": 38456, "epoch": 228} {"train_loss": -7.980033874511719, "global_step": 38457, "epoch": 228} {"train_loss": -7.909206390380859, "global_step": 38458, "epoch": 228} {"train_loss": -7.979793548583984, "global_step": 38459, "epoch": 228} {"train_loss": -7.865757465362549, "global_step": 38460, "epoch": 228} {"train_loss": -7.99733304977417, "global_step": 38461, "epoch": 228} {"train_loss": -7.6928911209106445, "global_step": 38462, "epoch": 228} {"train_loss": -7.76951789855957, "global_step": 38463, "epoch": 228} {"train_loss": -7.63677453994751, "global_step": 38464, "epoch": 228} {"train_loss": -7.689355850219727, "global_step": 38465, "epoch": 228} {"train_loss": -7.88507604598999, "global_step": 38466, "epoch": 228} {"train_loss": -7.478996276855469, "global_step": 38467, "epoch": 228} {"train_loss": -7.841723442077637, "global_step": 38468, "epoch": 228} {"train_loss": -7.683082580566406, "global_step": 38469, "epoch": 228} {"train_loss": -7.946042060852051, "global_step": 38470, "epoch": 228} {"train_loss": -7.819798631327493, "global_step": 38471, "epoch": 228, "val_loss": 186991.265625} {"train_loss": -7.606352806091309, "global_step": 38472, "epoch": 229} {"train_loss": -7.842972278594971, "global_step": 38473, "epoch": 229} {"train_loss": -7.743618965148926, "global_step": 38474, "epoch": 229} {"train_loss": -7.6770148277282715, "global_step": 38475, "epoch": 229} {"train_loss": -7.9669880867004395, "global_step": 38476, "epoch": 229} {"train_loss": -7.726058006286621, "global_step": 38477, "epoch": 229} {"train_loss": -7.990660667419434, "global_step": 38478, "epoch": 229} {"train_loss": -7.8894195556640625, "global_step": 38479, "epoch": 229} {"train_loss": -7.9701032638549805, "global_step": 38480, "epoch": 229} {"train_loss": -7.974123001098633, "global_step": 38481, "epoch": 229} {"train_loss": -7.972326278686523, "global_step": 38482, "epoch": 229} {"train_loss": -7.766473770141602, "global_step": 38483, "epoch": 229} {"train_loss": -7.866873741149902, "global_step": 38484, "epoch": 229} {"train_loss": -7.962904930114746, "global_step": 38485, "epoch": 229} {"train_loss": -7.807876110076904, "global_step": 38486, "epoch": 229} {"train_loss": -7.877474784851074, "global_step": 38487, "epoch": 229} {"train_loss": -7.913058757781982, "global_step": 38488, "epoch": 229} {"train_loss": -7.729448318481445, "global_step": 38489, "epoch": 229} {"train_loss": -8.123661994934082, "global_step": 38490, "epoch": 229} {"train_loss": -7.864059925079346, "global_step": 38491, "epoch": 229} {"train_loss": -7.934074401855469, "global_step": 38492, "epoch": 229} {"train_loss": -8.041399955749512, "global_step": 38493, "epoch": 229} {"train_loss": -7.992598533630371, "global_step": 38494, "epoch": 229} {"train_loss": -8.09703254699707, "global_step": 38495, "epoch": 229} {"train_loss": -7.8116559982299805, "global_step": 38496, "epoch": 229} {"train_loss": -8.109546661376953, "global_step": 38497, "epoch": 229} {"train_loss": -7.8338775634765625, "global_step": 38498, "epoch": 229} {"train_loss": -7.8085432052612305, "global_step": 38499, "epoch": 229} {"train_loss": -7.84050178527832, "global_step": 38500, "epoch": 229} {"train_loss": -7.574509620666504, "global_step": 38501, "epoch": 229} {"train_loss": -8.023581504821777, "global_step": 38502, "epoch": 229} {"train_loss": -7.772862911224365, "global_step": 38503, "epoch": 229} {"train_loss": -7.852652549743652, "global_step": 38504, "epoch": 229} {"train_loss": -7.905674457550049, "global_step": 38505, "epoch": 229} {"train_loss": -7.635954856872559, "global_step": 38506, "epoch": 229} {"train_loss": -8.04580307006836, "global_step": 38507, "epoch": 229} {"train_loss": -7.727397441864014, "global_step": 38508, "epoch": 229} {"train_loss": -7.903467655181885, "global_step": 38509, "epoch": 229} {"train_loss": -7.650276184082031, "global_step": 38510, "epoch": 229} {"train_loss": -7.733865737915039, "global_step": 38511, "epoch": 229} {"train_loss": -7.964466094970703, "global_step": 38512, "epoch": 229} {"train_loss": -7.829680442810059, "global_step": 38513, "epoch": 229} {"train_loss": -7.844411849975586, "global_step": 38514, "epoch": 229} {"train_loss": -7.610989570617676, "global_step": 38515, "epoch": 229} {"train_loss": -7.926839828491211, "global_step": 38516, "epoch": 229} {"train_loss": -7.714762210845947, "global_step": 38517, "epoch": 229} {"train_loss": -7.686332702636719, "global_step": 38518, "epoch": 229} {"train_loss": -7.797607421875, "global_step": 38519, "epoch": 229} {"train_loss": -7.630977630615234, "global_step": 38520, "epoch": 229} {"train_loss": -8.016188621520996, "global_step": 38521, "epoch": 229} {"train_loss": -7.872920036315918, "global_step": 38522, "epoch": 229} {"train_loss": -7.700652122497559, "global_step": 38523, "epoch": 229} {"train_loss": -7.869889259338379, "global_step": 38524, "epoch": 229} {"train_loss": -7.792336463928223, "global_step": 38525, "epoch": 229} {"train_loss": -7.598442077636719, "global_step": 38526, "epoch": 229} {"train_loss": -7.984649658203125, "global_step": 38527, "epoch": 229} {"train_loss": -7.290854454040527, "global_step": 38528, "epoch": 229} {"train_loss": -7.8666229248046875, "global_step": 38529, "epoch": 229} {"train_loss": -7.624612331390381, "global_step": 38530, "epoch": 229} {"train_loss": -7.793056488037109, "global_step": 38531, "epoch": 229} {"train_loss": -7.719579696655273, "global_step": 38532, "epoch": 229} {"train_loss": -7.728964805603027, "global_step": 38533, "epoch": 229} {"train_loss": -7.590695381164551, "global_step": 38534, "epoch": 229} {"train_loss": -7.499927520751953, "global_step": 38535, "epoch": 229} {"train_loss": -7.706132888793945, "global_step": 38536, "epoch": 229} {"train_loss": -7.552023887634277, "global_step": 38537, "epoch": 229} {"train_loss": -7.689990997314453, "global_step": 38538, "epoch": 229} {"train_loss": -7.630406379699707, "global_step": 38539, "epoch": 229} {"train_loss": -7.9137282371521, "global_step": 38540, "epoch": 229} {"train_loss": -7.7494940757751465, "global_step": 38541, "epoch": 229} {"train_loss": -7.6152143478393555, "global_step": 38542, "epoch": 229} {"train_loss": -7.8211164474487305, "global_step": 38543, "epoch": 229} {"train_loss": -7.543951034545898, "global_step": 38544, "epoch": 229} {"train_loss": -7.82004451751709, "global_step": 38545, "epoch": 229} {"train_loss": -7.961750507354736, "global_step": 38546, "epoch": 229} {"train_loss": -7.705521583557129, "global_step": 38547, "epoch": 229} {"train_loss": -7.872047424316406, "global_step": 38548, "epoch": 229} {"train_loss": -7.712266445159912, "global_step": 38549, "epoch": 229} {"train_loss": -7.942418098449707, "global_step": 38550, "epoch": 229} {"train_loss": -7.737880706787109, "global_step": 38551, "epoch": 229} {"train_loss": -7.8444671630859375, "global_step": 38552, "epoch": 229} {"train_loss": -7.94941520690918, "global_step": 38553, "epoch": 229} {"train_loss": -7.79144811630249, "global_step": 38554, "epoch": 229} {"train_loss": -7.8750081062316895, "global_step": 38555, "epoch": 229} {"train_loss": -7.707355499267578, "global_step": 38556, "epoch": 229} {"train_loss": -8.02985954284668, "global_step": 38557, "epoch": 229} {"train_loss": -7.857801914215088, "global_step": 38558, "epoch": 229} {"train_loss": -8.068025588989258, "global_step": 38559, "epoch": 229} {"train_loss": -8.194722175598145, "global_step": 38560, "epoch": 229} {"train_loss": -7.657687664031982, "global_step": 38561, "epoch": 229} {"train_loss": -7.9019598960876465, "global_step": 38562, "epoch": 229} {"train_loss": -7.894533634185791, "global_step": 38563, "epoch": 229} {"train_loss": -7.948685169219971, "global_step": 38564, "epoch": 229} {"train_loss": -7.892491340637207, "global_step": 38565, "epoch": 229} {"train_loss": -7.810303211212158, "global_step": 38566, "epoch": 229} {"train_loss": -7.965452671051025, "global_step": 38567, "epoch": 229} {"train_loss": -7.880021572113037, "global_step": 38568, "epoch": 229} {"train_loss": -7.9665985107421875, "global_step": 38569, "epoch": 229} {"train_loss": -8.018856048583984, "global_step": 38570, "epoch": 229} {"train_loss": -7.95816707611084, "global_step": 38571, "epoch": 229} {"train_loss": -7.994673252105713, "global_step": 38572, "epoch": 229} {"train_loss": -8.008577346801758, "global_step": 38573, "epoch": 229} {"train_loss": -7.734868049621582, "global_step": 38574, "epoch": 229} {"train_loss": -8.13991928100586, "global_step": 38575, "epoch": 229} {"train_loss": -8.066089630126953, "global_step": 38576, "epoch": 229} {"train_loss": -7.919577121734619, "global_step": 38577, "epoch": 229} {"train_loss": -8.110107421875, "global_step": 38578, "epoch": 229} {"train_loss": -7.9600348472595215, "global_step": 38579, "epoch": 229} {"train_loss": -7.938058376312256, "global_step": 38580, "epoch": 229} {"train_loss": -7.919013023376465, "global_step": 38581, "epoch": 229} {"train_loss": -8.203392028808594, "global_step": 38582, "epoch": 229} {"train_loss": -7.880774974822998, "global_step": 38583, "epoch": 229} {"train_loss": -7.9941301345825195, "global_step": 38584, "epoch": 229} {"train_loss": -7.944105625152588, "global_step": 38585, "epoch": 229} {"train_loss": -7.873424530029297, "global_step": 38586, "epoch": 229} {"train_loss": -8.105936050415039, "global_step": 38587, "epoch": 229} {"train_loss": -8.009382247924805, "global_step": 38588, "epoch": 229} {"train_loss": -7.7908172607421875, "global_step": 38589, "epoch": 229} {"train_loss": -8.021839141845703, "global_step": 38590, "epoch": 229} {"train_loss": -8.121329307556152, "global_step": 38591, "epoch": 229} {"train_loss": -7.978788375854492, "global_step": 38592, "epoch": 229} {"train_loss": -8.026205062866211, "global_step": 38593, "epoch": 229} {"train_loss": -8.234127044677734, "global_step": 38594, "epoch": 229} {"train_loss": -7.969639778137207, "global_step": 38595, "epoch": 229} {"train_loss": -8.002887725830078, "global_step": 38596, "epoch": 229} {"train_loss": -7.684779644012451, "global_step": 38597, "epoch": 229} {"train_loss": -7.898465156555176, "global_step": 38598, "epoch": 229} {"train_loss": -7.879889488220215, "global_step": 38599, "epoch": 229} {"train_loss": -7.644159317016602, "global_step": 38600, "epoch": 229} {"train_loss": -7.871058464050293, "global_step": 38601, "epoch": 229} {"train_loss": -7.597239017486572, "global_step": 38602, "epoch": 229} {"train_loss": -7.842174053192139, "global_step": 38603, "epoch": 229} {"train_loss": -7.894186496734619, "global_step": 38604, "epoch": 229} {"train_loss": -7.694453716278076, "global_step": 38605, "epoch": 229} {"train_loss": -7.97612190246582, "global_step": 38606, "epoch": 229} {"train_loss": -7.835960388183594, "global_step": 38607, "epoch": 229} {"train_loss": -7.846072196960449, "global_step": 38608, "epoch": 229} {"train_loss": -7.9311676025390625, "global_step": 38609, "epoch": 229} {"train_loss": -7.892425537109375, "global_step": 38610, "epoch": 229} {"train_loss": -7.936296463012695, "global_step": 38611, "epoch": 229} {"train_loss": -7.851037979125977, "global_step": 38612, "epoch": 229} {"train_loss": -7.8880205154418945, "global_step": 38613, "epoch": 229} {"train_loss": -7.905510902404785, "global_step": 38614, "epoch": 229} {"train_loss": -7.855636119842529, "global_step": 38615, "epoch": 229} {"train_loss": -8.052658081054688, "global_step": 38616, "epoch": 229} {"train_loss": -7.718012809753418, "global_step": 38617, "epoch": 229} {"train_loss": -7.8899641036987305, "global_step": 38618, "epoch": 229} {"train_loss": -8.207714080810547, "global_step": 38619, "epoch": 229} {"train_loss": -7.873046875, "global_step": 38620, "epoch": 229} {"train_loss": -7.932976245880127, "global_step": 38621, "epoch": 229} {"train_loss": -7.862889289855957, "global_step": 38622, "epoch": 229} {"train_loss": -8.004850387573242, "global_step": 38623, "epoch": 229} {"train_loss": -7.856114864349365, "global_step": 38624, "epoch": 229} {"train_loss": -7.802790641784668, "global_step": 38625, "epoch": 229} {"train_loss": -7.799373149871826, "global_step": 38626, "epoch": 229} {"train_loss": -7.849013328552246, "global_step": 38627, "epoch": 229} {"train_loss": -7.802450180053711, "global_step": 38628, "epoch": 229} {"train_loss": -7.855726718902588, "global_step": 38629, "epoch": 229} {"train_loss": -7.823369979858398, "global_step": 38630, "epoch": 229} {"train_loss": -7.916739463806152, "global_step": 38631, "epoch": 229} {"train_loss": -7.636364936828613, "global_step": 38632, "epoch": 229} {"train_loss": -7.7568488121032715, "global_step": 38633, "epoch": 229} {"train_loss": -7.8414506912231445, "global_step": 38634, "epoch": 229} {"train_loss": -7.651639938354492, "global_step": 38635, "epoch": 229} {"train_loss": -8.015722274780273, "global_step": 38636, "epoch": 229} {"train_loss": -8.13383960723877, "global_step": 38637, "epoch": 229} {"train_loss": -7.998557090759277, "global_step": 38638, "epoch": 229} {"train_loss": -7.860902879919324, "global_step": 38639, "epoch": 229, "val_loss": 186754.8125} {"train_loss": -7.897643089294434, "global_step": 38640, "epoch": 230} {"train_loss": -7.81507682800293, "global_step": 38641, "epoch": 230} {"train_loss": -7.942588806152344, "global_step": 38642, "epoch": 230} {"train_loss": -7.805413722991943, "global_step": 38643, "epoch": 230} {"train_loss": -8.077542304992676, "global_step": 38644, "epoch": 230} {"train_loss": -7.852088928222656, "global_step": 38645, "epoch": 230} {"train_loss": -7.896485328674316, "global_step": 38646, "epoch": 230} {"train_loss": -7.881587505340576, "global_step": 38647, "epoch": 230} {"train_loss": -7.901151180267334, "global_step": 38648, "epoch": 230} {"train_loss": -7.77457332611084, "global_step": 38649, "epoch": 230} {"train_loss": -8.018209457397461, "global_step": 38650, "epoch": 230} {"train_loss": -7.856839656829834, "global_step": 38651, "epoch": 230} {"train_loss": -7.856531143188477, "global_step": 38652, "epoch": 230} {"train_loss": -7.896629333496094, "global_step": 38653, "epoch": 230} {"train_loss": -7.879122734069824, "global_step": 38654, "epoch": 230} {"train_loss": -7.511707782745361, "global_step": 38655, "epoch": 230} {"train_loss": -7.943301200866699, "global_step": 38656, "epoch": 230} {"train_loss": -7.653254508972168, "global_step": 38657, "epoch": 230} {"train_loss": -7.489364147186279, "global_step": 38658, "epoch": 230} {"train_loss": -7.898262023925781, "global_step": 38659, "epoch": 230} {"train_loss": -7.7699995040893555, "global_step": 38660, "epoch": 230} {"train_loss": -7.963410377502441, "global_step": 38661, "epoch": 230} {"train_loss": -7.573050498962402, "global_step": 38662, "epoch": 230} {"train_loss": -7.858530044555664, "global_step": 38663, "epoch": 230} {"train_loss": -7.938084602355957, "global_step": 38664, "epoch": 230} {"train_loss": -7.656066417694092, "global_step": 38665, "epoch": 230} {"train_loss": -8.07821273803711, "global_step": 38666, "epoch": 230} {"train_loss": -7.642175197601318, "global_step": 38667, "epoch": 230} {"train_loss": -7.798766136169434, "global_step": 38668, "epoch": 230} {"train_loss": -7.968620300292969, "global_step": 38669, "epoch": 230} {"train_loss": -7.805163860321045, "global_step": 38670, "epoch": 230} {"train_loss": -7.892007827758789, "global_step": 38671, "epoch": 230} {"train_loss": -7.937521457672119, "global_step": 38672, "epoch": 230} {"train_loss": -7.892722129821777, "global_step": 38673, "epoch": 230} {"train_loss": -7.766572952270508, "global_step": 38674, "epoch": 230} {"train_loss": -7.770659446716309, "global_step": 38675, "epoch": 230} {"train_loss": -8.015676498413086, "global_step": 38676, "epoch": 230} {"train_loss": -7.819248199462891, "global_step": 38677, "epoch": 230} {"train_loss": -7.855862617492676, "global_step": 38678, "epoch": 230} {"train_loss": -7.797540664672852, "global_step": 38679, "epoch": 230} {"train_loss": -7.8418192863464355, "global_step": 38680, "epoch": 230} {"train_loss": -8.024948120117188, "global_step": 38681, "epoch": 230} {"train_loss": -7.942676544189453, "global_step": 38682, "epoch": 230} {"train_loss": -7.959027290344238, "global_step": 38683, "epoch": 230} {"train_loss": -7.894984245300293, "global_step": 38684, "epoch": 230} {"train_loss": -7.983554363250732, "global_step": 38685, "epoch": 230} {"train_loss": -7.649428844451904, "global_step": 38686, "epoch": 230} {"train_loss": -8.006620407104492, "global_step": 38687, "epoch": 230} {"train_loss": -8.112174034118652, "global_step": 38688, "epoch": 230} {"train_loss": -7.902480125427246, "global_step": 38689, "epoch": 230} {"train_loss": -7.946897983551025, "global_step": 38690, "epoch": 230} {"train_loss": -7.997691631317139, "global_step": 38691, "epoch": 230} {"train_loss": -7.879612922668457, "global_step": 38692, "epoch": 230} {"train_loss": -7.772715091705322, "global_step": 38693, "epoch": 230} {"train_loss": -8.063679695129395, "global_step": 38694, "epoch": 230} {"train_loss": -7.9883317947387695, "global_step": 38695, "epoch": 230} {"train_loss": -7.742123603820801, "global_step": 38696, "epoch": 230} {"train_loss": -7.922128677368164, "global_step": 38697, "epoch": 230} {"train_loss": -7.840889930725098, "global_step": 38698, "epoch": 230} {"train_loss": -7.76574182510376, "global_step": 38699, "epoch": 230} {"train_loss": -7.898467063903809, "global_step": 38700, "epoch": 230} {"train_loss": -8.011195182800293, "global_step": 38701, "epoch": 230} {"train_loss": -8.076092720031738, "global_step": 38702, "epoch": 230} {"train_loss": -7.718221664428711, "global_step": 38703, "epoch": 230} {"train_loss": -7.811049461364746, "global_step": 38704, "epoch": 230} {"train_loss": -7.960588455200195, "global_step": 38705, "epoch": 230} {"train_loss": -7.736620903015137, "global_step": 38706, "epoch": 230} {"train_loss": -7.878072261810303, "global_step": 38707, "epoch": 230} {"train_loss": -7.930026054382324, "global_step": 38708, "epoch": 230} {"train_loss": -7.766404151916504, "global_step": 38709, "epoch": 230} {"train_loss": -7.900644302368164, "global_step": 38710, "epoch": 230} {"train_loss": -7.848094940185547, "global_step": 38711, "epoch": 230} {"train_loss": -7.587961673736572, "global_step": 38712, "epoch": 230} {"train_loss": -7.87448263168335, "global_step": 38713, "epoch": 230} {"train_loss": -7.951949119567871, "global_step": 38714, "epoch": 230} {"train_loss": -7.7633280754089355, "global_step": 38715, "epoch": 230} {"train_loss": -7.817074775695801, "global_step": 38716, "epoch": 230} {"train_loss": -7.941616058349609, "global_step": 38717, "epoch": 230} {"train_loss": -7.798087120056152, "global_step": 38718, "epoch": 230} {"train_loss": -7.716002464294434, "global_step": 38719, "epoch": 230} {"train_loss": -7.854876518249512, "global_step": 38720, "epoch": 230} {"train_loss": -7.796904563903809, "global_step": 38721, "epoch": 230} {"train_loss": -7.637857913970947, "global_step": 38722, "epoch": 230} {"train_loss": -7.903955936431885, "global_step": 38723, "epoch": 230} {"train_loss": -7.66777229309082, "global_step": 38724, "epoch": 230} {"train_loss": -7.699197769165039, "global_step": 38725, "epoch": 230} {"train_loss": -7.729769229888916, "global_step": 38726, "epoch": 230} {"train_loss": -7.858590126037598, "global_step": 38727, "epoch": 230} {"train_loss": -7.5787763595581055, "global_step": 38728, "epoch": 230} {"train_loss": -7.672391891479492, "global_step": 38729, "epoch": 230} {"train_loss": -7.812427520751953, "global_step": 38730, "epoch": 230} {"train_loss": -7.8338942527771, "global_step": 38731, "epoch": 230} {"train_loss": -7.719760417938232, "global_step": 38732, "epoch": 230} {"train_loss": -7.916020393371582, "global_step": 38733, "epoch": 230} {"train_loss": -7.782854080200195, "global_step": 38734, "epoch": 230} {"train_loss": -7.808817386627197, "global_step": 38735, "epoch": 230} {"train_loss": -7.879383087158203, "global_step": 38736, "epoch": 230} {"train_loss": -7.8755903244018555, "global_step": 38737, "epoch": 230} {"train_loss": -7.695528984069824, "global_step": 38738, "epoch": 230} {"train_loss": -7.721030235290527, "global_step": 38739, "epoch": 230} {"train_loss": -7.911366939544678, "global_step": 38740, "epoch": 230} {"train_loss": -7.899850845336914, "global_step": 38741, "epoch": 230} {"train_loss": -7.582057952880859, "global_step": 38742, "epoch": 230} {"train_loss": -7.874474048614502, "global_step": 38743, "epoch": 230} {"train_loss": -7.631696701049805, "global_step": 38744, "epoch": 230} {"train_loss": -7.8423309326171875, "global_step": 38745, "epoch": 230} {"train_loss": -7.674750804901123, "global_step": 38746, "epoch": 230} {"train_loss": -7.970250606536865, "global_step": 38747, "epoch": 230} {"train_loss": -8.06900405883789, "global_step": 38748, "epoch": 230} {"train_loss": -7.769442081451416, "global_step": 38749, "epoch": 230} {"train_loss": -7.7818450927734375, "global_step": 38750, "epoch": 230} {"train_loss": -7.841078758239746, "global_step": 38751, "epoch": 230} {"train_loss": -7.732212066650391, "global_step": 38752, "epoch": 230} {"train_loss": -7.923635005950928, "global_step": 38753, "epoch": 230} {"train_loss": -7.793149948120117, "global_step": 38754, "epoch": 230} {"train_loss": -8.17271614074707, "global_step": 38755, "epoch": 230} {"train_loss": -7.7547831535339355, "global_step": 38756, "epoch": 230} {"train_loss": -7.907061576843262, "global_step": 38757, "epoch": 230} {"train_loss": -8.070494651794434, "global_step": 38758, "epoch": 230} {"train_loss": -8.040353775024414, "global_step": 38759, "epoch": 230} {"train_loss": -7.92799711227417, "global_step": 38760, "epoch": 230} {"train_loss": -7.8997802734375, "global_step": 38761, "epoch": 230} {"train_loss": -8.044639587402344, "global_step": 38762, "epoch": 230} {"train_loss": -7.892514228820801, "global_step": 38763, "epoch": 230} {"train_loss": -7.891542434692383, "global_step": 38764, "epoch": 230} {"train_loss": -7.798323631286621, "global_step": 38765, "epoch": 230} {"train_loss": -8.014034271240234, "global_step": 38766, "epoch": 230} {"train_loss": -7.840818405151367, "global_step": 38767, "epoch": 230} {"train_loss": -8.136661529541016, "global_step": 38768, "epoch": 230} {"train_loss": -8.039799690246582, "global_step": 38769, "epoch": 230} {"train_loss": -7.95369291305542, "global_step": 38770, "epoch": 230} {"train_loss": -7.929838180541992, "global_step": 38771, "epoch": 230} {"train_loss": -8.056814193725586, "global_step": 38772, "epoch": 230} {"train_loss": -8.057771682739258, "global_step": 38773, "epoch": 230} {"train_loss": -7.831301689147949, "global_step": 38774, "epoch": 230} {"train_loss": -7.902585506439209, "global_step": 38775, "epoch": 230} {"train_loss": -7.8321380615234375, "global_step": 38776, "epoch": 230} {"train_loss": -8.102819442749023, "global_step": 38777, "epoch": 230} {"train_loss": -7.577056884765625, "global_step": 38778, "epoch": 230} {"train_loss": -7.976409435272217, "global_step": 38779, "epoch": 230} {"train_loss": -7.779720306396484, "global_step": 38780, "epoch": 230} {"train_loss": -8.023937225341797, "global_step": 38781, "epoch": 230} {"train_loss": -8.079519271850586, "global_step": 38782, "epoch": 230} {"train_loss": -7.784014701843262, "global_step": 38783, "epoch": 230} {"train_loss": -8.01048755645752, "global_step": 38784, "epoch": 230} {"train_loss": -7.831172943115234, "global_step": 38785, "epoch": 230} {"train_loss": -7.842982769012451, "global_step": 38786, "epoch": 230} {"train_loss": -7.810690879821777, "global_step": 38787, "epoch": 230} {"train_loss": -7.346435546875, "global_step": 38788, "epoch": 230} {"train_loss": -7.883260250091553, "global_step": 38789, "epoch": 230} {"train_loss": -7.563925743103027, "global_step": 38790, "epoch": 230} {"train_loss": -7.643177032470703, "global_step": 38791, "epoch": 230} {"train_loss": -7.972115516662598, "global_step": 38792, "epoch": 230} {"train_loss": -7.860692501068115, "global_step": 38793, "epoch": 230} {"train_loss": -7.734858989715576, "global_step": 38794, "epoch": 230} {"train_loss": -7.701343536376953, "global_step": 38795, "epoch": 230} {"train_loss": -8.035213470458984, "global_step": 38796, "epoch": 230} {"train_loss": -7.383022785186768, "global_step": 38797, "epoch": 230} {"train_loss": -7.664763927459717, "global_step": 38798, "epoch": 230} {"train_loss": -7.574371337890625, "global_step": 38799, "epoch": 230} {"train_loss": -7.965575695037842, "global_step": 38800, "epoch": 230} {"train_loss": -7.606036186218262, "global_step": 38801, "epoch": 230} {"train_loss": -7.699001312255859, "global_step": 38802, "epoch": 230} {"train_loss": -7.7947306632995605, "global_step": 38803, "epoch": 230} {"train_loss": -7.656938076019287, "global_step": 38804, "epoch": 230} {"train_loss": -7.612410068511963, "global_step": 38805, "epoch": 230} {"train_loss": -7.725480079650879, "global_step": 38806, "epoch": 230} {"train_loss": -7.841448849155789, "global_step": 38807, "epoch": 230, "val_loss": 185786.65625, "train_action_mse_error": 16.486595153808594} {"train_loss": -7.802035808563232, "global_step": 38808, "epoch": 231} {"train_loss": -7.452105522155762, "global_step": 38809, "epoch": 231} {"train_loss": -7.861289024353027, "global_step": 38810, "epoch": 231} {"train_loss": -7.864589214324951, "global_step": 38811, "epoch": 231} {"train_loss": -7.829724311828613, "global_step": 38812, "epoch": 231} {"train_loss": -7.889277935028076, "global_step": 38813, "epoch": 231} {"train_loss": -8.11960220336914, "global_step": 38814, "epoch": 231} {"train_loss": -7.742606163024902, "global_step": 38815, "epoch": 231} {"train_loss": -7.5474748611450195, "global_step": 38816, "epoch": 231} {"train_loss": -7.815115928649902, "global_step": 38817, "epoch": 231} {"train_loss": -7.940047740936279, "global_step": 38818, "epoch": 231} {"train_loss": -7.916957378387451, "global_step": 38819, "epoch": 231} {"train_loss": -7.952532768249512, "global_step": 38820, "epoch": 231} {"train_loss": -7.691099643707275, "global_step": 38821, "epoch": 231} {"train_loss": -7.895235061645508, "global_step": 38822, "epoch": 231} {"train_loss": -7.903998374938965, "global_step": 38823, "epoch": 231} {"train_loss": -7.944392204284668, "global_step": 38824, "epoch": 231} {"train_loss": -7.885861873626709, "global_step": 38825, "epoch": 231} {"train_loss": -7.722265243530273, "global_step": 38826, "epoch": 231} {"train_loss": -7.991033554077148, "global_step": 38827, "epoch": 231} {"train_loss": -7.739253997802734, "global_step": 38828, "epoch": 231} {"train_loss": -7.863950252532959, "global_step": 38829, "epoch": 231} {"train_loss": -8.035126686096191, "global_step": 38830, "epoch": 231} {"train_loss": -7.843168258666992, "global_step": 38831, "epoch": 231} {"train_loss": -7.937700271606445, "global_step": 38832, "epoch": 231} {"train_loss": -7.896150588989258, "global_step": 38833, "epoch": 231} {"train_loss": -7.824166774749756, "global_step": 38834, "epoch": 231} {"train_loss": -7.655967712402344, "global_step": 38835, "epoch": 231} {"train_loss": -8.015998840332031, "global_step": 38836, "epoch": 231} {"train_loss": -7.635420322418213, "global_step": 38837, "epoch": 231} {"train_loss": -7.867865085601807, "global_step": 38838, "epoch": 231} {"train_loss": -7.787142276763916, "global_step": 38839, "epoch": 231} {"train_loss": -7.82065486907959, "global_step": 38840, "epoch": 231} {"train_loss": -7.7765960693359375, "global_step": 38841, "epoch": 231} {"train_loss": -7.806955337524414, "global_step": 38842, "epoch": 231} {"train_loss": -7.937585353851318, "global_step": 38843, "epoch": 231} {"train_loss": -7.509885787963867, "global_step": 38844, "epoch": 231} {"train_loss": -7.9566545486450195, "global_step": 38845, "epoch": 231} {"train_loss": -7.815428733825684, "global_step": 38846, "epoch": 231} {"train_loss": -7.879965782165527, "global_step": 38847, "epoch": 231} {"train_loss": -7.906335830688477, "global_step": 38848, "epoch": 231} {"train_loss": -7.990799903869629, "global_step": 38849, "epoch": 231} {"train_loss": -7.672097206115723, "global_step": 38850, "epoch": 231} {"train_loss": -8.094099998474121, "global_step": 38851, "epoch": 231} {"train_loss": -8.024845123291016, "global_step": 38852, "epoch": 231} {"train_loss": -7.880308151245117, "global_step": 38853, "epoch": 231} {"train_loss": -8.133722305297852, "global_step": 38854, "epoch": 231} {"train_loss": -8.054115295410156, "global_step": 38855, "epoch": 231} {"train_loss": -8.000459671020508, "global_step": 38856, "epoch": 231} {"train_loss": -8.086320877075195, "global_step": 38857, "epoch": 231} {"train_loss": -8.089383125305176, "global_step": 38858, "epoch": 231} {"train_loss": -7.940102577209473, "global_step": 38859, "epoch": 231} {"train_loss": -8.017364501953125, "global_step": 38860, "epoch": 231} {"train_loss": -7.851264953613281, "global_step": 38861, "epoch": 231} {"train_loss": -7.84503698348999, "global_step": 38862, "epoch": 231} {"train_loss": -7.914181232452393, "global_step": 38863, "epoch": 231} {"train_loss": -7.709214210510254, "global_step": 38864, "epoch": 231} {"train_loss": -8.025964736938477, "global_step": 38865, "epoch": 231} {"train_loss": -8.048433303833008, "global_step": 38866, "epoch": 231} {"train_loss": -7.894078731536865, "global_step": 38867, "epoch": 231} {"train_loss": -7.873201370239258, "global_step": 38868, "epoch": 231} {"train_loss": -7.915432929992676, "global_step": 38869, "epoch": 231} {"train_loss": -7.749427795410156, "global_step": 38870, "epoch": 231} {"train_loss": -7.627035140991211, "global_step": 38871, "epoch": 231} {"train_loss": -8.001602172851562, "global_step": 38872, "epoch": 231} {"train_loss": -7.664013385772705, "global_step": 38873, "epoch": 231} {"train_loss": -8.003045082092285, "global_step": 38874, "epoch": 231} {"train_loss": -7.937819957733154, "global_step": 38875, "epoch": 231} {"train_loss": -7.772050857543945, "global_step": 38876, "epoch": 231} {"train_loss": -7.735558986663818, "global_step": 38877, "epoch": 231} {"train_loss": -8.047372817993164, "global_step": 38878, "epoch": 231} {"train_loss": -7.6145830154418945, "global_step": 38879, "epoch": 231} {"train_loss": -8.00475025177002, "global_step": 38880, "epoch": 231} {"train_loss": -7.705056190490723, "global_step": 38881, "epoch": 231} {"train_loss": -7.833693504333496, "global_step": 38882, "epoch": 231} {"train_loss": -7.881516933441162, "global_step": 38883, "epoch": 231} {"train_loss": -7.686539173126221, "global_step": 38884, "epoch": 231} {"train_loss": -7.8858113288879395, "global_step": 38885, "epoch": 231} {"train_loss": -7.754635810852051, "global_step": 38886, "epoch": 231} {"train_loss": -7.8797831535339355, "global_step": 38887, "epoch": 231} {"train_loss": -7.743721008300781, "global_step": 38888, "epoch": 231} {"train_loss": -7.911823272705078, "global_step": 38889, "epoch": 231} {"train_loss": -7.887765884399414, "global_step": 38890, "epoch": 231} {"train_loss": -7.744298934936523, "global_step": 38891, "epoch": 231} {"train_loss": -7.902285575866699, "global_step": 38892, "epoch": 231} {"train_loss": -7.703272819519043, "global_step": 38893, "epoch": 231} {"train_loss": -7.525919437408447, "global_step": 38894, "epoch": 231} {"train_loss": -7.900771617889404, "global_step": 38895, "epoch": 231} {"train_loss": -7.764121055603027, "global_step": 38896, "epoch": 231} {"train_loss": -7.901780605316162, "global_step": 38897, "epoch": 231} {"train_loss": -7.694337368011475, "global_step": 38898, "epoch": 231} {"train_loss": -7.916572570800781, "global_step": 38899, "epoch": 231} {"train_loss": -7.811139106750488, "global_step": 38900, "epoch": 231} {"train_loss": -7.889553070068359, "global_step": 38901, "epoch": 231} {"train_loss": -7.942544937133789, "global_step": 38902, "epoch": 231} {"train_loss": -7.6141486167907715, "global_step": 38903, "epoch": 231} {"train_loss": -7.889361381530762, "global_step": 38904, "epoch": 231} {"train_loss": -7.846333980560303, "global_step": 38905, "epoch": 231} {"train_loss": -8.009881019592285, "global_step": 38906, "epoch": 231} {"train_loss": -7.693811416625977, "global_step": 38907, "epoch": 231} {"train_loss": -8.06401252746582, "global_step": 38908, "epoch": 231} {"train_loss": -8.10084342956543, "global_step": 38909, "epoch": 231} {"train_loss": -7.721540927886963, "global_step": 38910, "epoch": 231} {"train_loss": -7.845520973205566, "global_step": 38911, "epoch": 231} {"train_loss": -7.9287896156311035, "global_step": 38912, "epoch": 231} {"train_loss": -7.837665557861328, "global_step": 38913, "epoch": 231} {"train_loss": -8.031366348266602, "global_step": 38914, "epoch": 231} {"train_loss": -7.885420799255371, "global_step": 38915, "epoch": 231} {"train_loss": -7.899863243103027, "global_step": 38916, "epoch": 231} {"train_loss": -7.955841541290283, "global_step": 38917, "epoch": 231} {"train_loss": -7.911525249481201, "global_step": 38918, "epoch": 231} {"train_loss": -8.07858657836914, "global_step": 38919, "epoch": 231} {"train_loss": -8.03786849975586, "global_step": 38920, "epoch": 231} {"train_loss": -7.793100833892822, "global_step": 38921, "epoch": 231} {"train_loss": -7.961464881896973, "global_step": 38922, "epoch": 231} {"train_loss": -7.930881023406982, "global_step": 38923, "epoch": 231} {"train_loss": -8.083585739135742, "global_step": 38924, "epoch": 231} {"train_loss": -7.796281337738037, "global_step": 38925, "epoch": 231} {"train_loss": -7.934189319610596, "global_step": 38926, "epoch": 231} {"train_loss": -7.983978271484375, "global_step": 38927, "epoch": 231} {"train_loss": -8.019740104675293, "global_step": 38928, "epoch": 231} {"train_loss": -8.056916236877441, "global_step": 38929, "epoch": 231} {"train_loss": -8.004518508911133, "global_step": 38930, "epoch": 231} {"train_loss": -7.894428730010986, "global_step": 38931, "epoch": 231} {"train_loss": -7.921932220458984, "global_step": 38932, "epoch": 231} {"train_loss": -7.834439754486084, "global_step": 38933, "epoch": 231} {"train_loss": -7.845426082611084, "global_step": 38934, "epoch": 231} {"train_loss": -7.866013526916504, "global_step": 38935, "epoch": 231} {"train_loss": -8.036877632141113, "global_step": 38936, "epoch": 231} {"train_loss": -7.990541458129883, "global_step": 38937, "epoch": 231} {"train_loss": -7.909356117248535, "global_step": 38938, "epoch": 231} {"train_loss": -7.845551490783691, "global_step": 38939, "epoch": 231} {"train_loss": -7.5926055908203125, "global_step": 38940, "epoch": 231} {"train_loss": -7.863532066345215, "global_step": 38941, "epoch": 231} {"train_loss": -7.838456153869629, "global_step": 38942, "epoch": 231} {"train_loss": -8.006019592285156, "global_step": 38943, "epoch": 231} {"train_loss": -7.951211929321289, "global_step": 38944, "epoch": 231} {"train_loss": -7.741565704345703, "global_step": 38945, "epoch": 231} {"train_loss": -7.839868068695068, "global_step": 38946, "epoch": 231} {"train_loss": -7.909013748168945, "global_step": 38947, "epoch": 231} {"train_loss": -8.085420608520508, "global_step": 38948, "epoch": 231} {"train_loss": -7.809056758880615, "global_step": 38949, "epoch": 231} {"train_loss": -8.032713890075684, "global_step": 38950, "epoch": 231} {"train_loss": -7.797567844390869, "global_step": 38951, "epoch": 231} {"train_loss": -7.949378490447998, "global_step": 38952, "epoch": 231} {"train_loss": -7.861762523651123, "global_step": 38953, "epoch": 231} {"train_loss": -8.020284652709961, "global_step": 38954, "epoch": 231} {"train_loss": -7.904860496520996, "global_step": 38955, "epoch": 231} {"train_loss": -7.9591827392578125, "global_step": 38956, "epoch": 231} {"train_loss": -7.908766746520996, "global_step": 38957, "epoch": 231} {"train_loss": -8.057781219482422, "global_step": 38958, "epoch": 231} {"train_loss": -7.856805801391602, "global_step": 38959, "epoch": 231} {"train_loss": -7.909255027770996, "global_step": 38960, "epoch": 231} {"train_loss": -7.589128494262695, "global_step": 38961, "epoch": 231} {"train_loss": -7.7294464111328125, "global_step": 38962, "epoch": 231} {"train_loss": -7.8153204917907715, "global_step": 38963, "epoch": 231} {"train_loss": -8.039809226989746, "global_step": 38964, "epoch": 231} {"train_loss": -7.9469313621521, "global_step": 38965, "epoch": 231} {"train_loss": -8.100030899047852, "global_step": 38966, "epoch": 231} {"train_loss": -8.101722717285156, "global_step": 38967, "epoch": 231} {"train_loss": -8.062015533447266, "global_step": 38968, "epoch": 231} {"train_loss": -7.837273120880127, "global_step": 38969, "epoch": 231} {"train_loss": -8.09559440612793, "global_step": 38970, "epoch": 231} {"train_loss": -7.920714378356934, "global_step": 38971, "epoch": 231} {"train_loss": -7.806371688842773, "global_step": 38972, "epoch": 231} {"train_loss": -7.890993595123291, "global_step": 38973, "epoch": 231} {"train_loss": -8.047455787658691, "global_step": 38974, "epoch": 231} {"train_loss": -7.8830807861827665, "global_step": 38975, "epoch": 231, "val_loss": 186975.265625} {"train_loss": -7.952773094177246, "global_step": 38976, "epoch": 232} {"train_loss": -7.83226203918457, "global_step": 38977, "epoch": 232} {"train_loss": -7.941163063049316, "global_step": 38978, "epoch": 232} {"train_loss": -7.565801620483398, "global_step": 38979, "epoch": 232} {"train_loss": -7.8954386711120605, "global_step": 38980, "epoch": 232} {"train_loss": -7.922069072723389, "global_step": 38981, "epoch": 232} {"train_loss": -8.14060115814209, "global_step": 38982, "epoch": 232} {"train_loss": -7.849210739135742, "global_step": 38983, "epoch": 232} {"train_loss": -7.910365104675293, "global_step": 38984, "epoch": 232} {"train_loss": -7.579547882080078, "global_step": 38985, "epoch": 232} {"train_loss": -7.999436378479004, "global_step": 38986, "epoch": 232} {"train_loss": -7.880781173706055, "global_step": 38987, "epoch": 232} {"train_loss": -7.885002613067627, "global_step": 38988, "epoch": 232} {"train_loss": -8.003519058227539, "global_step": 38989, "epoch": 232} {"train_loss": -8.008593559265137, "global_step": 38990, "epoch": 232} {"train_loss": -7.8288726806640625, "global_step": 38991, "epoch": 232} {"train_loss": -8.10737133026123, "global_step": 38992, "epoch": 232} {"train_loss": -7.966240406036377, "global_step": 38993, "epoch": 232} {"train_loss": -7.977584362030029, "global_step": 38994, "epoch": 232} {"train_loss": -7.979246139526367, "global_step": 38995, "epoch": 232} {"train_loss": -7.889180660247803, "global_step": 38996, "epoch": 232} {"train_loss": -7.94765567779541, "global_step": 38997, "epoch": 232} {"train_loss": -7.995023727416992, "global_step": 38998, "epoch": 232} {"train_loss": -8.007709503173828, "global_step": 38999, "epoch": 232} {"train_loss": -8.060577392578125, "global_step": 39000, "epoch": 232} {"train_loss": -8.096173286437988, "global_step": 39001, "epoch": 232} {"train_loss": -7.642324924468994, "global_step": 39002, "epoch": 232} {"train_loss": -7.924991130828857, "global_step": 39003, "epoch": 232} {"train_loss": -7.882781982421875, "global_step": 39004, "epoch": 232} {"train_loss": -8.011392593383789, "global_step": 39005, "epoch": 232} {"train_loss": -8.18400764465332, "global_step": 39006, "epoch": 232} {"train_loss": -8.108687400817871, "global_step": 39007, "epoch": 232} {"train_loss": -7.761498928070068, "global_step": 39008, "epoch": 232} {"train_loss": -7.882843017578125, "global_step": 39009, "epoch": 232} {"train_loss": -8.047175407409668, "global_step": 39010, "epoch": 232} {"train_loss": -7.928086757659912, "global_step": 39011, "epoch": 232} {"train_loss": -7.810744285583496, "global_step": 39012, "epoch": 232} {"train_loss": -8.257461547851562, "global_step": 39013, "epoch": 232} {"train_loss": -8.099225044250488, "global_step": 39014, "epoch": 232} {"train_loss": -8.09366226196289, "global_step": 39015, "epoch": 232} {"train_loss": -8.02331829071045, "global_step": 39016, "epoch": 232} {"train_loss": -7.991608619689941, "global_step": 39017, "epoch": 232} {"train_loss": -8.127412796020508, "global_step": 39018, "epoch": 232} {"train_loss": -7.870242118835449, "global_step": 39019, "epoch": 232} {"train_loss": -8.075834274291992, "global_step": 39020, "epoch": 232} {"train_loss": -7.883539199829102, "global_step": 39021, "epoch": 232} {"train_loss": -8.122980117797852, "global_step": 39022, "epoch": 232} {"train_loss": -7.96188497543335, "global_step": 39023, "epoch": 232} {"train_loss": -8.002582550048828, "global_step": 39024, "epoch": 232} {"train_loss": -7.854804515838623, "global_step": 39025, "epoch": 232} {"train_loss": -7.94337797164917, "global_step": 39026, "epoch": 232} {"train_loss": -8.033641815185547, "global_step": 39027, "epoch": 232} {"train_loss": -7.9773478507995605, "global_step": 39028, "epoch": 232} {"train_loss": -7.926412582397461, "global_step": 39029, "epoch": 232} {"train_loss": -7.649763107299805, "global_step": 39030, "epoch": 232} {"train_loss": -7.800570487976074, "global_step": 39031, "epoch": 232} {"train_loss": -8.082053184509277, "global_step": 39032, "epoch": 232} {"train_loss": -7.625069618225098, "global_step": 39033, "epoch": 232} {"train_loss": -8.031024932861328, "global_step": 39034, "epoch": 232} {"train_loss": -7.904453277587891, "global_step": 39035, "epoch": 232} {"train_loss": -7.9605817794799805, "global_step": 39036, "epoch": 232} {"train_loss": -8.01246166229248, "global_step": 39037, "epoch": 232} {"train_loss": -7.913614273071289, "global_step": 39038, "epoch": 232} {"train_loss": -8.032718658447266, "global_step": 39039, "epoch": 232} {"train_loss": -7.888742446899414, "global_step": 39040, "epoch": 232} {"train_loss": -7.688516139984131, "global_step": 39041, "epoch": 232} {"train_loss": -7.948144912719727, "global_step": 39042, "epoch": 232} {"train_loss": -7.760743141174316, "global_step": 39043, "epoch": 232} {"train_loss": -7.899824142456055, "global_step": 39044, "epoch": 232} {"train_loss": -7.685132026672363, "global_step": 39045, "epoch": 232} {"train_loss": -8.080366134643555, "global_step": 39046, "epoch": 232} {"train_loss": -7.758877754211426, "global_step": 39047, "epoch": 232} {"train_loss": -7.702051162719727, "global_step": 39048, "epoch": 232} {"train_loss": -7.821867942810059, "global_step": 39049, "epoch": 232} {"train_loss": -7.861482620239258, "global_step": 39050, "epoch": 232} {"train_loss": -7.744147300720215, "global_step": 39051, "epoch": 232} {"train_loss": -7.748995780944824, "global_step": 39052, "epoch": 232} {"train_loss": -7.937841415405273, "global_step": 39053, "epoch": 232} {"train_loss": -7.794531345367432, "global_step": 39054, "epoch": 232} {"train_loss": -7.900398254394531, "global_step": 39055, "epoch": 232} {"train_loss": -7.894434928894043, "global_step": 39056, "epoch": 232} {"train_loss": -7.816626071929932, "global_step": 39057, "epoch": 232} {"train_loss": -7.6560797691345215, "global_step": 39058, "epoch": 232} {"train_loss": -7.705807685852051, "global_step": 39059, "epoch": 232} {"train_loss": -7.831387519836426, "global_step": 39060, "epoch": 232} {"train_loss": -8.065170288085938, "global_step": 39061, "epoch": 232} {"train_loss": -7.972961902618408, "global_step": 39062, "epoch": 232} {"train_loss": -7.933108329772949, "global_step": 39063, "epoch": 232} {"train_loss": -7.971764087677002, "global_step": 39064, "epoch": 232} {"train_loss": -7.782602310180664, "global_step": 39065, "epoch": 232} {"train_loss": -7.915018558502197, "global_step": 39066, "epoch": 232} {"train_loss": -7.864323616027832, "global_step": 39067, "epoch": 232} {"train_loss": -8.03044319152832, "global_step": 39068, "epoch": 232} {"train_loss": -7.988246440887451, "global_step": 39069, "epoch": 232} {"train_loss": -7.803865909576416, "global_step": 39070, "epoch": 232} {"train_loss": -8.006444931030273, "global_step": 39071, "epoch": 232} {"train_loss": -8.077329635620117, "global_step": 39072, "epoch": 232} {"train_loss": -7.983938217163086, "global_step": 39073, "epoch": 232} {"train_loss": -7.938035488128662, "global_step": 39074, "epoch": 232} {"train_loss": -8.103019714355469, "global_step": 39075, "epoch": 232} {"train_loss": -7.966804504394531, "global_step": 39076, "epoch": 232} {"train_loss": -8.10639762878418, "global_step": 39077, "epoch": 232} {"train_loss": -7.927846908569336, "global_step": 39078, "epoch": 232} {"train_loss": -8.170794486999512, "global_step": 39079, "epoch": 232} {"train_loss": -8.088062286376953, "global_step": 39080, "epoch": 232} {"train_loss": -7.982020854949951, "global_step": 39081, "epoch": 232} {"train_loss": -7.9170732498168945, "global_step": 39082, "epoch": 232} {"train_loss": -7.979777812957764, "global_step": 39083, "epoch": 232} {"train_loss": -7.809296607971191, "global_step": 39084, "epoch": 232} {"train_loss": -7.770008563995361, "global_step": 39085, "epoch": 232} {"train_loss": -7.78388786315918, "global_step": 39086, "epoch": 232} {"train_loss": -8.022960662841797, "global_step": 39087, "epoch": 232} {"train_loss": -7.7865777015686035, "global_step": 39088, "epoch": 232} {"train_loss": -7.733558654785156, "global_step": 39089, "epoch": 232} {"train_loss": -7.9103851318359375, "global_step": 39090, "epoch": 232} {"train_loss": -7.945054054260254, "global_step": 39091, "epoch": 232} {"train_loss": -7.9454450607299805, "global_step": 39092, "epoch": 232} {"train_loss": -7.881495952606201, "global_step": 39093, "epoch": 232} {"train_loss": -7.929027080535889, "global_step": 39094, "epoch": 232} {"train_loss": -7.821893692016602, "global_step": 39095, "epoch": 232} {"train_loss": -7.796960353851318, "global_step": 39096, "epoch": 232} {"train_loss": -8.07791519165039, "global_step": 39097, "epoch": 232} {"train_loss": -7.90910530090332, "global_step": 39098, "epoch": 232} {"train_loss": -7.929269790649414, "global_step": 39099, "epoch": 232} {"train_loss": -7.778563976287842, "global_step": 39100, "epoch": 232} {"train_loss": -7.829198360443115, "global_step": 39101, "epoch": 232} {"train_loss": -7.892127990722656, "global_step": 39102, "epoch": 232} {"train_loss": -7.956650733947754, "global_step": 39103, "epoch": 232} {"train_loss": -7.865346908569336, "global_step": 39104, "epoch": 232} {"train_loss": -7.910251617431641, "global_step": 39105, "epoch": 232} {"train_loss": -7.890555381774902, "global_step": 39106, "epoch": 232} {"train_loss": -8.072793960571289, "global_step": 39107, "epoch": 232} {"train_loss": -7.812065124511719, "global_step": 39108, "epoch": 232} {"train_loss": -7.772510528564453, "global_step": 39109, "epoch": 232} {"train_loss": -7.800042629241943, "global_step": 39110, "epoch": 232} {"train_loss": -7.66885232925415, "global_step": 39111, "epoch": 232} {"train_loss": -8.026002883911133, "global_step": 39112, "epoch": 232} {"train_loss": -7.827073097229004, "global_step": 39113, "epoch": 232} {"train_loss": -8.101669311523438, "global_step": 39114, "epoch": 232} {"train_loss": -7.70783805847168, "global_step": 39115, "epoch": 232} {"train_loss": -7.961493492126465, "global_step": 39116, "epoch": 232} {"train_loss": -7.913863182067871, "global_step": 39117, "epoch": 232} {"train_loss": -8.02132797241211, "global_step": 39118, "epoch": 232} {"train_loss": -7.995511531829834, "global_step": 39119, "epoch": 232} {"train_loss": -7.90246057510376, "global_step": 39120, "epoch": 232} {"train_loss": -7.8754472732543945, "global_step": 39121, "epoch": 232} {"train_loss": -8.039113998413086, "global_step": 39122, "epoch": 232} {"train_loss": -7.868832588195801, "global_step": 39123, "epoch": 232} {"train_loss": -7.712434768676758, "global_step": 39124, "epoch": 232} {"train_loss": -8.005636215209961, "global_step": 39125, "epoch": 232} {"train_loss": -7.9162678718566895, "global_step": 39126, "epoch": 232} {"train_loss": -7.890499591827393, "global_step": 39127, "epoch": 232} {"train_loss": -8.025046348571777, "global_step": 39128, "epoch": 232} {"train_loss": -7.906389236450195, "global_step": 39129, "epoch": 232} {"train_loss": -7.992315292358398, "global_step": 39130, "epoch": 232} {"train_loss": -7.8405890464782715, "global_step": 39131, "epoch": 232} {"train_loss": -8.084916114807129, "global_step": 39132, "epoch": 232} {"train_loss": -7.6213531494140625, "global_step": 39133, "epoch": 232} {"train_loss": -8.003718376159668, "global_step": 39134, "epoch": 232} {"train_loss": -7.569665908813477, "global_step": 39135, "epoch": 232} {"train_loss": -7.737429141998291, "global_step": 39136, "epoch": 232} {"train_loss": -7.696703910827637, "global_step": 39137, "epoch": 232} {"train_loss": -7.895758152008057, "global_step": 39138, "epoch": 232} {"train_loss": -7.615881443023682, "global_step": 39139, "epoch": 232} {"train_loss": -7.956118583679199, "global_step": 39140, "epoch": 232} {"train_loss": -7.723803997039795, "global_step": 39141, "epoch": 232} {"train_loss": -7.847011566162109, "global_step": 39142, "epoch": 232} {"train_loss": -7.909598239830562, "global_step": 39143, "epoch": 232, "val_loss": 187841.296875} {"train_loss": -8.002772331237793, "global_step": 39144, "epoch": 233} {"train_loss": -7.816366672515869, "global_step": 39145, "epoch": 233} {"train_loss": -7.82413387298584, "global_step": 39146, "epoch": 233} {"train_loss": -7.664175033569336, "global_step": 39147, "epoch": 233} {"train_loss": -7.622994422912598, "global_step": 39148, "epoch": 233} {"train_loss": -7.465699195861816, "global_step": 39149, "epoch": 233} {"train_loss": -7.611456871032715, "global_step": 39150, "epoch": 233} {"train_loss": -8.013175964355469, "global_step": 39151, "epoch": 233} {"train_loss": -7.384063243865967, "global_step": 39152, "epoch": 233} {"train_loss": -7.4962029457092285, "global_step": 39153, "epoch": 233} {"train_loss": -7.627684116363525, "global_step": 39154, "epoch": 233} {"train_loss": -7.806517124176025, "global_step": 39155, "epoch": 233} {"train_loss": -7.700366973876953, "global_step": 39156, "epoch": 233} {"train_loss": -7.899840831756592, "global_step": 39157, "epoch": 233} {"train_loss": -7.736937522888184, "global_step": 39158, "epoch": 233} {"train_loss": -7.752771377563477, "global_step": 39159, "epoch": 233} {"train_loss": -7.902904987335205, "global_step": 39160, "epoch": 233} {"train_loss": -7.700957298278809, "global_step": 39161, "epoch": 233} {"train_loss": -7.881122589111328, "global_step": 39162, "epoch": 233} {"train_loss": -7.902796745300293, "global_step": 39163, "epoch": 233} {"train_loss": -7.9506072998046875, "global_step": 39164, "epoch": 233} {"train_loss": -7.733363628387451, "global_step": 39165, "epoch": 233} {"train_loss": -7.660414695739746, "global_step": 39166, "epoch": 233} {"train_loss": -7.677319526672363, "global_step": 39167, "epoch": 233} {"train_loss": -7.879215240478516, "global_step": 39168, "epoch": 233} {"train_loss": -7.679900169372559, "global_step": 39169, "epoch": 233} {"train_loss": -7.5969367027282715, "global_step": 39170, "epoch": 233} {"train_loss": -7.712564468383789, "global_step": 39171, "epoch": 233} {"train_loss": -7.756566047668457, "global_step": 39172, "epoch": 233} {"train_loss": -7.853409767150879, "global_step": 39173, "epoch": 233} {"train_loss": -7.70552921295166, "global_step": 39174, "epoch": 233} {"train_loss": -7.900689125061035, "global_step": 39175, "epoch": 233} {"train_loss": -7.787441253662109, "global_step": 39176, "epoch": 233} {"train_loss": -7.878330230712891, "global_step": 39177, "epoch": 233} {"train_loss": -8.035688400268555, "global_step": 39178, "epoch": 233} {"train_loss": -7.844608306884766, "global_step": 39179, "epoch": 233} {"train_loss": -7.784954071044922, "global_step": 39180, "epoch": 233} {"train_loss": -7.938211441040039, "global_step": 39181, "epoch": 233} {"train_loss": -8.034357070922852, "global_step": 39182, "epoch": 233} {"train_loss": -8.012447357177734, "global_step": 39183, "epoch": 233} {"train_loss": -8.048628807067871, "global_step": 39184, "epoch": 233} {"train_loss": -7.662904739379883, "global_step": 39185, "epoch": 233} {"train_loss": -7.881299018859863, "global_step": 39186, "epoch": 233} {"train_loss": -8.04123592376709, "global_step": 39187, "epoch": 233} {"train_loss": -7.985726833343506, "global_step": 39188, "epoch": 233} {"train_loss": -8.014039993286133, "global_step": 39189, "epoch": 233} {"train_loss": -7.812666893005371, "global_step": 39190, "epoch": 233} {"train_loss": -7.8697381019592285, "global_step": 39191, "epoch": 233} {"train_loss": -7.853979587554932, "global_step": 39192, "epoch": 233} {"train_loss": -7.934622287750244, "global_step": 39193, "epoch": 233} {"train_loss": -7.781550407409668, "global_step": 39194, "epoch": 233} {"train_loss": -7.944857120513916, "global_step": 39195, "epoch": 233} {"train_loss": -8.009535789489746, "global_step": 39196, "epoch": 233} {"train_loss": -7.733399868011475, "global_step": 39197, "epoch": 233} {"train_loss": -7.881991863250732, "global_step": 39198, "epoch": 233} {"train_loss": -7.697103500366211, "global_step": 39199, "epoch": 233} {"train_loss": -7.927994251251221, "global_step": 39200, "epoch": 233} {"train_loss": -7.882543563842773, "global_step": 39201, "epoch": 233} {"train_loss": -7.847048759460449, "global_step": 39202, "epoch": 233} {"train_loss": -7.920652866363525, "global_step": 39203, "epoch": 233} {"train_loss": -7.988321304321289, "global_step": 39204, "epoch": 233} {"train_loss": -8.018285751342773, "global_step": 39205, "epoch": 233} {"train_loss": -7.855835437774658, "global_step": 39206, "epoch": 233} {"train_loss": -7.808804512023926, "global_step": 39207, "epoch": 233} {"train_loss": -7.845678806304932, "global_step": 39208, "epoch": 233} {"train_loss": -7.854918479919434, "global_step": 39209, "epoch": 233} {"train_loss": -7.891051292419434, "global_step": 39210, "epoch": 233} {"train_loss": -7.736478328704834, "global_step": 39211, "epoch": 233} {"train_loss": -7.911064624786377, "global_step": 39212, "epoch": 233} {"train_loss": -7.964177131652832, "global_step": 39213, "epoch": 233} {"train_loss": -7.669524192810059, "global_step": 39214, "epoch": 233} {"train_loss": -7.7820258140563965, "global_step": 39215, "epoch": 233} {"train_loss": -7.59757661819458, "global_step": 39216, "epoch": 233} {"train_loss": -7.708130836486816, "global_step": 39217, "epoch": 233} {"train_loss": -7.6100053787231445, "global_step": 39218, "epoch": 233} {"train_loss": -7.751543998718262, "global_step": 39219, "epoch": 233} {"train_loss": -7.901342868804932, "global_step": 39220, "epoch": 233} {"train_loss": -7.652233123779297, "global_step": 39221, "epoch": 233} {"train_loss": -7.719084739685059, "global_step": 39222, "epoch": 233} {"train_loss": -7.7223052978515625, "global_step": 39223, "epoch": 233} {"train_loss": -7.882762908935547, "global_step": 39224, "epoch": 233} {"train_loss": -7.680805206298828, "global_step": 39225, "epoch": 233} {"train_loss": -7.931575775146484, "global_step": 39226, "epoch": 233} {"train_loss": -7.857304096221924, "global_step": 39227, "epoch": 233} {"train_loss": -7.811402320861816, "global_step": 39228, "epoch": 233} {"train_loss": -8.170011520385742, "global_step": 39229, "epoch": 233} {"train_loss": -7.822241306304932, "global_step": 39230, "epoch": 233} {"train_loss": -7.943944454193115, "global_step": 39231, "epoch": 233} {"train_loss": -7.87473201751709, "global_step": 39232, "epoch": 233} {"train_loss": -8.124028205871582, "global_step": 39233, "epoch": 233} {"train_loss": -8.112598419189453, "global_step": 39234, "epoch": 233} {"train_loss": -8.059530258178711, "global_step": 39235, "epoch": 233} {"train_loss": -7.836435317993164, "global_step": 39236, "epoch": 233} {"train_loss": -8.061286926269531, "global_step": 39237, "epoch": 233} {"train_loss": -7.908990383148193, "global_step": 39238, "epoch": 233} {"train_loss": -8.024118423461914, "global_step": 39239, "epoch": 233} {"train_loss": -8.154607772827148, "global_step": 39240, "epoch": 233} {"train_loss": -8.02761459350586, "global_step": 39241, "epoch": 233} {"train_loss": -8.140645980834961, "global_step": 39242, "epoch": 233} {"train_loss": -8.014936447143555, "global_step": 39243, "epoch": 233} {"train_loss": -8.069690704345703, "global_step": 39244, "epoch": 233} {"train_loss": -8.025489807128906, "global_step": 39245, "epoch": 233} {"train_loss": -8.174386978149414, "global_step": 39246, "epoch": 233} {"train_loss": -7.870674133300781, "global_step": 39247, "epoch": 233} {"train_loss": -7.7956342697143555, "global_step": 39248, "epoch": 233} {"train_loss": -8.1429443359375, "global_step": 39249, "epoch": 233} {"train_loss": -8.107301712036133, "global_step": 39250, "epoch": 233} {"train_loss": -8.03524398803711, "global_step": 39251, "epoch": 233} {"train_loss": -8.0513277053833, "global_step": 39252, "epoch": 233} {"train_loss": -7.9309468269348145, "global_step": 39253, "epoch": 233} {"train_loss": -7.770026206970215, "global_step": 39254, "epoch": 233} {"train_loss": -8.222431182861328, "global_step": 39255, "epoch": 233} {"train_loss": -7.762601852416992, "global_step": 39256, "epoch": 233} {"train_loss": -7.911924362182617, "global_step": 39257, "epoch": 233} {"train_loss": -8.015679359436035, "global_step": 39258, "epoch": 233} {"train_loss": -7.525307655334473, "global_step": 39259, "epoch": 233} {"train_loss": -7.709515571594238, "global_step": 39260, "epoch": 233} {"train_loss": -7.719488143920898, "global_step": 39261, "epoch": 233} {"train_loss": -7.4275078773498535, "global_step": 39262, "epoch": 233} {"train_loss": -7.874745845794678, "global_step": 39263, "epoch": 233} {"train_loss": -7.795012950897217, "global_step": 39264, "epoch": 233} {"train_loss": -7.670597076416016, "global_step": 39265, "epoch": 233} {"train_loss": -7.771707534790039, "global_step": 39266, "epoch": 233} {"train_loss": -7.938576698303223, "global_step": 39267, "epoch": 233} {"train_loss": -7.854750633239746, "global_step": 39268, "epoch": 233} {"train_loss": -7.64361572265625, "global_step": 39269, "epoch": 233} {"train_loss": -7.908099174499512, "global_step": 39270, "epoch": 233} {"train_loss": -7.953583717346191, "global_step": 39271, "epoch": 233} {"train_loss": -7.627575397491455, "global_step": 39272, "epoch": 233} {"train_loss": -7.965723991394043, "global_step": 39273, "epoch": 233} {"train_loss": -7.822970390319824, "global_step": 39274, "epoch": 233} {"train_loss": -7.905714988708496, "global_step": 39275, "epoch": 233} {"train_loss": -7.879228591918945, "global_step": 39276, "epoch": 233} {"train_loss": -8.134008407592773, "global_step": 39277, "epoch": 233} {"train_loss": -7.946078300476074, "global_step": 39278, "epoch": 233} {"train_loss": -7.964167594909668, "global_step": 39279, "epoch": 233} {"train_loss": -7.966019153594971, "global_step": 39280, "epoch": 233} {"train_loss": -7.963026523590088, "global_step": 39281, "epoch": 233} {"train_loss": -7.740899562835693, "global_step": 39282, "epoch": 233} {"train_loss": -8.11473274230957, "global_step": 39283, "epoch": 233} {"train_loss": -7.921302795410156, "global_step": 39284, "epoch": 233} {"train_loss": -7.9534711837768555, "global_step": 39285, "epoch": 233} {"train_loss": -7.706212043762207, "global_step": 39286, "epoch": 233} {"train_loss": -7.907474517822266, "global_step": 39287, "epoch": 233} {"train_loss": -8.058870315551758, "global_step": 39288, "epoch": 233} {"train_loss": -7.9283366203308105, "global_step": 39289, "epoch": 233} {"train_loss": -8.081911087036133, "global_step": 39290, "epoch": 233} {"train_loss": -7.901065826416016, "global_step": 39291, "epoch": 233} {"train_loss": -8.03388786315918, "global_step": 39292, "epoch": 233} {"train_loss": -7.75444221496582, "global_step": 39293, "epoch": 233} {"train_loss": -7.559669494628906, "global_step": 39294, "epoch": 233} {"train_loss": -8.021024703979492, "global_step": 39295, "epoch": 233} {"train_loss": -7.857146263122559, "global_step": 39296, "epoch": 233} {"train_loss": -7.864788055419922, "global_step": 39297, "epoch": 233} {"train_loss": -7.590151786804199, "global_step": 39298, "epoch": 233} {"train_loss": -7.919301986694336, "global_step": 39299, "epoch": 233} {"train_loss": -7.910830974578857, "global_step": 39300, "epoch": 233} {"train_loss": -7.710230827331543, "global_step": 39301, "epoch": 233} {"train_loss": -7.8919477462768555, "global_step": 39302, "epoch": 233} {"train_loss": -7.802017688751221, "global_step": 39303, "epoch": 233} {"train_loss": -7.976409912109375, "global_step": 39304, "epoch": 233} {"train_loss": -7.440521240234375, "global_step": 39305, "epoch": 233} {"train_loss": -7.909355163574219, "global_step": 39306, "epoch": 233} {"train_loss": -7.921531677246094, "global_step": 39307, "epoch": 233} {"train_loss": -7.9491071701049805, "global_step": 39308, "epoch": 233} {"train_loss": -7.77976131439209, "global_step": 39309, "epoch": 233} {"train_loss": -7.972991943359375, "global_step": 39310, "epoch": 233} {"train_loss": -7.858030427069891, "global_step": 39311, "epoch": 233, "val_loss": 188050.875} {"train_loss": -7.57327938079834, "global_step": 39312, "epoch": 234} {"train_loss": -8.043619155883789, "global_step": 39313, "epoch": 234} {"train_loss": -7.705137252807617, "global_step": 39314, "epoch": 234} {"train_loss": -7.928905487060547, "global_step": 39315, "epoch": 234} {"train_loss": -7.880675792694092, "global_step": 39316, "epoch": 234} {"train_loss": -7.880265712738037, "global_step": 39317, "epoch": 234} {"train_loss": -7.937780857086182, "global_step": 39318, "epoch": 234} {"train_loss": -8.082291603088379, "global_step": 39319, "epoch": 234} {"train_loss": -7.769296646118164, "global_step": 39320, "epoch": 234} {"train_loss": -7.806047439575195, "global_step": 39321, "epoch": 234} {"train_loss": -7.9537553787231445, "global_step": 39322, "epoch": 234} {"train_loss": -7.707033157348633, "global_step": 39323, "epoch": 234} {"train_loss": -7.873972415924072, "global_step": 39324, "epoch": 234} {"train_loss": -7.577754974365234, "global_step": 39325, "epoch": 234} {"train_loss": -8.090927124023438, "global_step": 39326, "epoch": 234} {"train_loss": -7.915585041046143, "global_step": 39327, "epoch": 234} {"train_loss": -7.668736934661865, "global_step": 39328, "epoch": 234} {"train_loss": -7.807710647583008, "global_step": 39329, "epoch": 234} {"train_loss": -7.914738178253174, "global_step": 39330, "epoch": 234} {"train_loss": -7.883333206176758, "global_step": 39331, "epoch": 234} {"train_loss": -7.972884178161621, "global_step": 39332, "epoch": 234} {"train_loss": -7.8860578536987305, "global_step": 39333, "epoch": 234} {"train_loss": -7.8459930419921875, "global_step": 39334, "epoch": 234} {"train_loss": -7.798815727233887, "global_step": 39335, "epoch": 234} {"train_loss": -8.060224533081055, "global_step": 39336, "epoch": 234} {"train_loss": -7.796561241149902, "global_step": 39337, "epoch": 234} {"train_loss": -7.671151161193848, "global_step": 39338, "epoch": 234} {"train_loss": -8.165316581726074, "global_step": 39339, "epoch": 234} {"train_loss": -7.944545269012451, "global_step": 39340, "epoch": 234} {"train_loss": -7.8523030281066895, "global_step": 39341, "epoch": 234} {"train_loss": -7.9658122062683105, "global_step": 39342, "epoch": 234} {"train_loss": -8.048686981201172, "global_step": 39343, "epoch": 234} {"train_loss": -8.072129249572754, "global_step": 39344, "epoch": 234} {"train_loss": -7.937227249145508, "global_step": 39345, "epoch": 234} {"train_loss": -8.035961151123047, "global_step": 39346, "epoch": 234} {"train_loss": -8.090311050415039, "global_step": 39347, "epoch": 234} {"train_loss": -7.950511932373047, "global_step": 39348, "epoch": 234} {"train_loss": -8.10982894897461, "global_step": 39349, "epoch": 234} {"train_loss": -8.12074089050293, "global_step": 39350, "epoch": 234} {"train_loss": -8.10319709777832, "global_step": 39351, "epoch": 234} {"train_loss": -8.150252342224121, "global_step": 39352, "epoch": 234} {"train_loss": -7.744762897491455, "global_step": 39353, "epoch": 234} {"train_loss": -7.930949687957764, "global_step": 39354, "epoch": 234} {"train_loss": -7.805952548980713, "global_step": 39355, "epoch": 234} {"train_loss": -8.001714706420898, "global_step": 39356, "epoch": 234} {"train_loss": -7.806509494781494, "global_step": 39357, "epoch": 234} {"train_loss": -7.594963550567627, "global_step": 39358, "epoch": 234} {"train_loss": -7.9618072509765625, "global_step": 39359, "epoch": 234} {"train_loss": -8.028550148010254, "global_step": 39360, "epoch": 234} {"train_loss": -7.887032985687256, "global_step": 39361, "epoch": 234} {"train_loss": -7.923147678375244, "global_step": 39362, "epoch": 234} {"train_loss": -7.813929557800293, "global_step": 39363, "epoch": 234} {"train_loss": -7.671407699584961, "global_step": 39364, "epoch": 234} {"train_loss": -7.843259811401367, "global_step": 39365, "epoch": 234} {"train_loss": -7.776391983032227, "global_step": 39366, "epoch": 234} {"train_loss": -7.788360595703125, "global_step": 39367, "epoch": 234} {"train_loss": -8.050643920898438, "global_step": 39368, "epoch": 234} {"train_loss": -7.696563720703125, "global_step": 39369, "epoch": 234} {"train_loss": -7.8712029457092285, "global_step": 39370, "epoch": 234} {"train_loss": -7.795161247253418, "global_step": 39371, "epoch": 234} {"train_loss": -7.872587203979492, "global_step": 39372, "epoch": 234} {"train_loss": -7.6922078132629395, "global_step": 39373, "epoch": 234} {"train_loss": -7.913261413574219, "global_step": 39374, "epoch": 234} {"train_loss": -7.667221546173096, "global_step": 39375, "epoch": 234} {"train_loss": -8.073759078979492, "global_step": 39376, "epoch": 234} {"train_loss": -7.967564105987549, "global_step": 39377, "epoch": 234} {"train_loss": -7.936010360717773, "global_step": 39378, "epoch": 234} {"train_loss": -7.649171829223633, "global_step": 39379, "epoch": 234} {"train_loss": -8.055554389953613, "global_step": 39380, "epoch": 234} {"train_loss": -7.883289337158203, "global_step": 39381, "epoch": 234} {"train_loss": -7.564362525939941, "global_step": 39382, "epoch": 234} {"train_loss": -7.707763195037842, "global_step": 39383, "epoch": 234} {"train_loss": -7.809028148651123, "global_step": 39384, "epoch": 234} {"train_loss": -7.848812103271484, "global_step": 39385, "epoch": 234} {"train_loss": -7.748687744140625, "global_step": 39386, "epoch": 234} {"train_loss": -7.849451065063477, "global_step": 39387, "epoch": 234} {"train_loss": -7.91577672958374, "global_step": 39388, "epoch": 234} {"train_loss": -8.067000389099121, "global_step": 39389, "epoch": 234} {"train_loss": -8.142095565795898, "global_step": 39390, "epoch": 234} {"train_loss": -8.000240325927734, "global_step": 39391, "epoch": 234} {"train_loss": -7.933950424194336, "global_step": 39392, "epoch": 234} {"train_loss": -7.789176940917969, "global_step": 39393, "epoch": 234} {"train_loss": -8.076193809509277, "global_step": 39394, "epoch": 234} {"train_loss": -7.966129302978516, "global_step": 39395, "epoch": 234} {"train_loss": -7.719448089599609, "global_step": 39396, "epoch": 234} {"train_loss": -8.067069053649902, "global_step": 39397, "epoch": 234} {"train_loss": -7.678199291229248, "global_step": 39398, "epoch": 234} {"train_loss": -7.968094348907471, "global_step": 39399, "epoch": 234} {"train_loss": -7.81904935836792, "global_step": 39400, "epoch": 234} {"train_loss": -8.015948295593262, "global_step": 39401, "epoch": 234} {"train_loss": -7.950555801391602, "global_step": 39402, "epoch": 234} {"train_loss": -8.007821083068848, "global_step": 39403, "epoch": 234} {"train_loss": -7.630234241485596, "global_step": 39404, "epoch": 234} {"train_loss": -7.753490447998047, "global_step": 39405, "epoch": 234} {"train_loss": -7.786283493041992, "global_step": 39406, "epoch": 234} {"train_loss": -7.8761887550354, "global_step": 39407, "epoch": 234} {"train_loss": -7.880915641784668, "global_step": 39408, "epoch": 234} {"train_loss": -7.818667888641357, "global_step": 39409, "epoch": 234} {"train_loss": -7.754344940185547, "global_step": 39410, "epoch": 234} {"train_loss": -7.903570175170898, "global_step": 39411, "epoch": 234} {"train_loss": -7.703358173370361, "global_step": 39412, "epoch": 234} {"train_loss": -7.9336700439453125, "global_step": 39413, "epoch": 234} {"train_loss": -7.8830766677856445, "global_step": 39414, "epoch": 234} {"train_loss": -7.861854553222656, "global_step": 39415, "epoch": 234} {"train_loss": -7.9035162925720215, "global_step": 39416, "epoch": 234} {"train_loss": -7.752618789672852, "global_step": 39417, "epoch": 234} {"train_loss": -7.7860918045043945, "global_step": 39418, "epoch": 234} {"train_loss": -7.678990364074707, "global_step": 39419, "epoch": 234} {"train_loss": -7.830672264099121, "global_step": 39420, "epoch": 234} {"train_loss": -7.957343578338623, "global_step": 39421, "epoch": 234} {"train_loss": -7.765878677368164, "global_step": 39422, "epoch": 234} {"train_loss": -7.637395858764648, "global_step": 39423, "epoch": 234} {"train_loss": -7.898813247680664, "global_step": 39424, "epoch": 234} {"train_loss": -7.976691246032715, "global_step": 39425, "epoch": 234} {"train_loss": -7.830942153930664, "global_step": 39426, "epoch": 234} {"train_loss": -7.762802600860596, "global_step": 39427, "epoch": 234} {"train_loss": -7.697970390319824, "global_step": 39428, "epoch": 234} {"train_loss": -8.037759780883789, "global_step": 39429, "epoch": 234} {"train_loss": -7.93312931060791, "global_step": 39430, "epoch": 234} {"train_loss": -7.85176420211792, "global_step": 39431, "epoch": 234} {"train_loss": -8.013771057128906, "global_step": 39432, "epoch": 234} {"train_loss": -7.913241386413574, "global_step": 39433, "epoch": 234} {"train_loss": -8.018636703491211, "global_step": 39434, "epoch": 234} {"train_loss": -8.029496192932129, "global_step": 39435, "epoch": 234} {"train_loss": -7.90910530090332, "global_step": 39436, "epoch": 234} {"train_loss": -8.034786224365234, "global_step": 39437, "epoch": 234} {"train_loss": -7.845256328582764, "global_step": 39438, "epoch": 234} {"train_loss": -7.7995147705078125, "global_step": 39439, "epoch": 234} {"train_loss": -7.951915740966797, "global_step": 39440, "epoch": 234} {"train_loss": -8.019994735717773, "global_step": 39441, "epoch": 234} {"train_loss": -8.027414321899414, "global_step": 39442, "epoch": 234} {"train_loss": -8.007341384887695, "global_step": 39443, "epoch": 234} {"train_loss": -8.02613353729248, "global_step": 39444, "epoch": 234} {"train_loss": -7.9410319328308105, "global_step": 39445, "epoch": 234} {"train_loss": -8.029555320739746, "global_step": 39446, "epoch": 234} {"train_loss": -7.998781681060791, "global_step": 39447, "epoch": 234} {"train_loss": -7.996236801147461, "global_step": 39448, "epoch": 234} {"train_loss": -8.000625610351562, "global_step": 39449, "epoch": 234} {"train_loss": -7.93996000289917, "global_step": 39450, "epoch": 234} {"train_loss": -8.097259521484375, "global_step": 39451, "epoch": 234} {"train_loss": -8.163025856018066, "global_step": 39452, "epoch": 234} {"train_loss": -8.05840015411377, "global_step": 39453, "epoch": 234} {"train_loss": -8.021217346191406, "global_step": 39454, "epoch": 234} {"train_loss": -8.146284103393555, "global_step": 39455, "epoch": 234} {"train_loss": -7.986555099487305, "global_step": 39456, "epoch": 234} {"train_loss": -7.990968704223633, "global_step": 39457, "epoch": 234} {"train_loss": -8.105226516723633, "global_step": 39458, "epoch": 234} {"train_loss": -8.014015197753906, "global_step": 39459, "epoch": 234} {"train_loss": -8.05633544921875, "global_step": 39460, "epoch": 234} {"train_loss": -8.102507591247559, "global_step": 39461, "epoch": 234} {"train_loss": -8.134817123413086, "global_step": 39462, "epoch": 234} {"train_loss": -7.923605918884277, "global_step": 39463, "epoch": 234} {"train_loss": -8.100956916809082, "global_step": 39464, "epoch": 234} {"train_loss": -8.0610933303833, "global_step": 39465, "epoch": 234} {"train_loss": -7.967012405395508, "global_step": 39466, "epoch": 234} {"train_loss": -8.074943542480469, "global_step": 39467, "epoch": 234} {"train_loss": -7.884047508239746, "global_step": 39468, "epoch": 234} {"train_loss": -8.160993576049805, "global_step": 39469, "epoch": 234} {"train_loss": -8.005359649658203, "global_step": 39470, "epoch": 234} {"train_loss": -7.535236835479736, "global_step": 39471, "epoch": 234} {"train_loss": -7.996944904327393, "global_step": 39472, "epoch": 234} {"train_loss": -7.725840091705322, "global_step": 39473, "epoch": 234} {"train_loss": -7.917593002319336, "global_step": 39474, "epoch": 234} {"train_loss": -8.084114074707031, "global_step": 39475, "epoch": 234} {"train_loss": -7.848641395568848, "global_step": 39476, "epoch": 234} {"train_loss": -7.609116554260254, "global_step": 39477, "epoch": 234} {"train_loss": -7.867003440856934, "global_step": 39478, "epoch": 234} {"train_loss": -7.9046008955864675, "global_step": 39479, "epoch": 234, "val_loss": 192505.03125} {"train_loss": -8.14148998260498, "global_step": 39480, "epoch": 235} {"train_loss": -7.940638065338135, "global_step": 39481, "epoch": 235} {"train_loss": -7.975125789642334, "global_step": 39482, "epoch": 235} {"train_loss": -8.012389183044434, "global_step": 39483, "epoch": 235} {"train_loss": -8.002665519714355, "global_step": 39484, "epoch": 235} {"train_loss": -7.929755210876465, "global_step": 39485, "epoch": 235} {"train_loss": -7.773975372314453, "global_step": 39486, "epoch": 235} {"train_loss": -7.97425651550293, "global_step": 39487, "epoch": 235} {"train_loss": -8.016249656677246, "global_step": 39488, "epoch": 235} {"train_loss": -7.904232978820801, "global_step": 39489, "epoch": 235} {"train_loss": -7.939125061035156, "global_step": 39490, "epoch": 235} {"train_loss": -7.861235618591309, "global_step": 39491, "epoch": 235} {"train_loss": -7.800380229949951, "global_step": 39492, "epoch": 235} {"train_loss": -7.8216400146484375, "global_step": 39493, "epoch": 235} {"train_loss": -8.025940895080566, "global_step": 39494, "epoch": 235} {"train_loss": -7.7087249755859375, "global_step": 39495, "epoch": 235} {"train_loss": -8.019948959350586, "global_step": 39496, "epoch": 235} {"train_loss": -7.558355331420898, "global_step": 39497, "epoch": 235} {"train_loss": -7.879205703735352, "global_step": 39498, "epoch": 235} {"train_loss": -7.518670082092285, "global_step": 39499, "epoch": 235} {"train_loss": -7.9873151779174805, "global_step": 39500, "epoch": 235} {"train_loss": -7.937043190002441, "global_step": 39501, "epoch": 235} {"train_loss": -7.8884992599487305, "global_step": 39502, "epoch": 235} {"train_loss": -7.5916571617126465, "global_step": 39503, "epoch": 235} {"train_loss": -7.49893856048584, "global_step": 39504, "epoch": 235} {"train_loss": -7.942006587982178, "global_step": 39505, "epoch": 235} {"train_loss": -7.9053053855896, "global_step": 39506, "epoch": 235} {"train_loss": -7.7694172859191895, "global_step": 39507, "epoch": 235} {"train_loss": -7.746844291687012, "global_step": 39508, "epoch": 235} {"train_loss": -7.886172771453857, "global_step": 39509, "epoch": 235} {"train_loss": -7.79201078414917, "global_step": 39510, "epoch": 235} {"train_loss": -7.579079627990723, "global_step": 39511, "epoch": 235} {"train_loss": -7.683894157409668, "global_step": 39512, "epoch": 235} {"train_loss": -7.901020050048828, "global_step": 39513, "epoch": 235} {"train_loss": -7.897229194641113, "global_step": 39514, "epoch": 235} {"train_loss": -7.680027961730957, "global_step": 39515, "epoch": 235} {"train_loss": -7.765641212463379, "global_step": 39516, "epoch": 235} {"train_loss": -8.090539932250977, "global_step": 39517, "epoch": 235} {"train_loss": -7.75700044631958, "global_step": 39518, "epoch": 235} {"train_loss": -7.8236188888549805, "global_step": 39519, "epoch": 235} {"train_loss": -7.807051181793213, "global_step": 39520, "epoch": 235} {"train_loss": -8.130239486694336, "global_step": 39521, "epoch": 235} {"train_loss": -7.817112922668457, "global_step": 39522, "epoch": 235} {"train_loss": -8.020880699157715, "global_step": 39523, "epoch": 235} {"train_loss": -8.002628326416016, "global_step": 39524, "epoch": 235} {"train_loss": -8.042717933654785, "global_step": 39525, "epoch": 235} {"train_loss": -7.931483745574951, "global_step": 39526, "epoch": 235} {"train_loss": -7.845876216888428, "global_step": 39527, "epoch": 235} {"train_loss": -7.854645252227783, "global_step": 39528, "epoch": 235} {"train_loss": -7.881381988525391, "global_step": 39529, "epoch": 235} {"train_loss": -7.9976701736450195, "global_step": 39530, "epoch": 235} {"train_loss": -7.986853122711182, "global_step": 39531, "epoch": 235} {"train_loss": -7.802374839782715, "global_step": 39532, "epoch": 235} {"train_loss": -7.892677307128906, "global_step": 39533, "epoch": 235} {"train_loss": -7.872326850891113, "global_step": 39534, "epoch": 235} {"train_loss": -7.773163795471191, "global_step": 39535, "epoch": 235} {"train_loss": -8.052682876586914, "global_step": 39536, "epoch": 235} {"train_loss": -7.8577880859375, "global_step": 39537, "epoch": 235} {"train_loss": -7.952281951904297, "global_step": 39538, "epoch": 235} {"train_loss": -7.886775970458984, "global_step": 39539, "epoch": 235} {"train_loss": -7.72514533996582, "global_step": 39540, "epoch": 235} {"train_loss": -7.913151264190674, "global_step": 39541, "epoch": 235} {"train_loss": -8.002398490905762, "global_step": 39542, "epoch": 235} {"train_loss": -7.853248596191406, "global_step": 39543, "epoch": 235} {"train_loss": -7.994744300842285, "global_step": 39544, "epoch": 235} {"train_loss": -7.949800968170166, "global_step": 39545, "epoch": 235} {"train_loss": -7.9432854652404785, "global_step": 39546, "epoch": 235} {"train_loss": -7.810632705688477, "global_step": 39547, "epoch": 235} {"train_loss": -7.90708589553833, "global_step": 39548, "epoch": 235} {"train_loss": -7.75180721282959, "global_step": 39549, "epoch": 235} {"train_loss": -8.007448196411133, "global_step": 39550, "epoch": 235} {"train_loss": -7.861649513244629, "global_step": 39551, "epoch": 235} {"train_loss": -7.920086860656738, "global_step": 39552, "epoch": 235} {"train_loss": -7.918170928955078, "global_step": 39553, "epoch": 235} {"train_loss": -8.299808502197266, "global_step": 39554, "epoch": 235} {"train_loss": -7.934728622436523, "global_step": 39555, "epoch": 235} {"train_loss": -8.021160125732422, "global_step": 39556, "epoch": 235} {"train_loss": -8.004718780517578, "global_step": 39557, "epoch": 235} {"train_loss": -8.040250778198242, "global_step": 39558, "epoch": 235} {"train_loss": -7.885171890258789, "global_step": 39559, "epoch": 235} {"train_loss": -8.035343170166016, "global_step": 39560, "epoch": 235} {"train_loss": -8.036182403564453, "global_step": 39561, "epoch": 235} {"train_loss": -7.929940223693848, "global_step": 39562, "epoch": 235} {"train_loss": -7.647201061248779, "global_step": 39563, "epoch": 235} {"train_loss": -8.053998947143555, "global_step": 39564, "epoch": 235} {"train_loss": -7.9103899002075195, "global_step": 39565, "epoch": 235} {"train_loss": -7.924630641937256, "global_step": 39566, "epoch": 235} {"train_loss": -8.091796875, "global_step": 39567, "epoch": 235} {"train_loss": -8.06981086730957, "global_step": 39568, "epoch": 235} {"train_loss": -8.353815078735352, "global_step": 39569, "epoch": 235} {"train_loss": -8.30732536315918, "global_step": 39570, "epoch": 235} {"train_loss": -8.016145706176758, "global_step": 39571, "epoch": 235} {"train_loss": -8.043991088867188, "global_step": 39572, "epoch": 235} {"train_loss": -7.875055313110352, "global_step": 39573, "epoch": 235} {"train_loss": -7.87172794342041, "global_step": 39574, "epoch": 235} {"train_loss": -8.090265274047852, "global_step": 39575, "epoch": 235} {"train_loss": -7.969538688659668, "global_step": 39576, "epoch": 235} {"train_loss": -7.6710052490234375, "global_step": 39577, "epoch": 235} {"train_loss": -7.926422595977783, "global_step": 39578, "epoch": 235} {"train_loss": -8.076696395874023, "global_step": 39579, "epoch": 235} {"train_loss": -7.907015800476074, "global_step": 39580, "epoch": 235} {"train_loss": -7.949485778808594, "global_step": 39581, "epoch": 235} {"train_loss": -8.125202178955078, "global_step": 39582, "epoch": 235} {"train_loss": -7.9917144775390625, "global_step": 39583, "epoch": 235} {"train_loss": -7.728302478790283, "global_step": 39584, "epoch": 235} {"train_loss": -8.048152923583984, "global_step": 39585, "epoch": 235} {"train_loss": -7.774482727050781, "global_step": 39586, "epoch": 235} {"train_loss": -7.978421211242676, "global_step": 39587, "epoch": 235} {"train_loss": -8.067638397216797, "global_step": 39588, "epoch": 235} {"train_loss": -8.012004852294922, "global_step": 39589, "epoch": 235} {"train_loss": -7.636223793029785, "global_step": 39590, "epoch": 235} {"train_loss": -7.941309452056885, "global_step": 39591, "epoch": 235} {"train_loss": -8.095682144165039, "global_step": 39592, "epoch": 235} {"train_loss": -8.092964172363281, "global_step": 39593, "epoch": 235} {"train_loss": -7.8024444580078125, "global_step": 39594, "epoch": 235} {"train_loss": -8.182001113891602, "global_step": 39595, "epoch": 235} {"train_loss": -7.902856826782227, "global_step": 39596, "epoch": 235} {"train_loss": -7.9256134033203125, "global_step": 39597, "epoch": 235} {"train_loss": -8.010551452636719, "global_step": 39598, "epoch": 235} {"train_loss": -7.854639053344727, "global_step": 39599, "epoch": 235} {"train_loss": -7.974410533905029, "global_step": 39600, "epoch": 235} {"train_loss": -7.902799606323242, "global_step": 39601, "epoch": 235} {"train_loss": -7.830577850341797, "global_step": 39602, "epoch": 235} {"train_loss": -7.88424015045166, "global_step": 39603, "epoch": 235} {"train_loss": -8.074902534484863, "global_step": 39604, "epoch": 235} {"train_loss": -7.653267860412598, "global_step": 39605, "epoch": 235} {"train_loss": -8.098861694335938, "global_step": 39606, "epoch": 235} {"train_loss": -7.75889253616333, "global_step": 39607, "epoch": 235} {"train_loss": -7.960616111755371, "global_step": 39608, "epoch": 235} {"train_loss": -7.696136474609375, "global_step": 39609, "epoch": 235} {"train_loss": -8.071349143981934, "global_step": 39610, "epoch": 235} {"train_loss": -7.962716102600098, "global_step": 39611, "epoch": 235} {"train_loss": -7.6724348068237305, "global_step": 39612, "epoch": 235} {"train_loss": -7.8025407791137695, "global_step": 39613, "epoch": 235} {"train_loss": -7.9218950271606445, "global_step": 39614, "epoch": 235} {"train_loss": -7.901831150054932, "global_step": 39615, "epoch": 235} {"train_loss": -7.636795997619629, "global_step": 39616, "epoch": 235} {"train_loss": -7.89262056350708, "global_step": 39617, "epoch": 235} {"train_loss": -7.940000534057617, "global_step": 39618, "epoch": 235} {"train_loss": -7.9526567459106445, "global_step": 39619, "epoch": 235} {"train_loss": -7.819726943969727, "global_step": 39620, "epoch": 235} {"train_loss": -7.853930473327637, "global_step": 39621, "epoch": 235} {"train_loss": -7.864145278930664, "global_step": 39622, "epoch": 235} {"train_loss": -8.03874397277832, "global_step": 39623, "epoch": 235} {"train_loss": -7.816237449645996, "global_step": 39624, "epoch": 235} {"train_loss": -7.654414653778076, "global_step": 39625, "epoch": 235} {"train_loss": -7.938078880310059, "global_step": 39626, "epoch": 235} {"train_loss": -7.620945930480957, "global_step": 39627, "epoch": 235} {"train_loss": -7.888387680053711, "global_step": 39628, "epoch": 235} {"train_loss": -7.940016746520996, "global_step": 39629, "epoch": 235} {"train_loss": -7.826732635498047, "global_step": 39630, "epoch": 235} {"train_loss": -7.872743606567383, "global_step": 39631, "epoch": 235} {"train_loss": -7.722516059875488, "global_step": 39632, "epoch": 235} {"train_loss": -7.988578796386719, "global_step": 39633, "epoch": 235} {"train_loss": -7.659209728240967, "global_step": 39634, "epoch": 235} {"train_loss": -7.992388725280762, "global_step": 39635, "epoch": 235} {"train_loss": -7.9405341148376465, "global_step": 39636, "epoch": 235} {"train_loss": -7.850411415100098, "global_step": 39637, "epoch": 235} {"train_loss": -7.766866207122803, "global_step": 39638, "epoch": 235} {"train_loss": -8.13074779510498, "global_step": 39639, "epoch": 235} {"train_loss": -7.730330467224121, "global_step": 39640, "epoch": 235} {"train_loss": -7.743896484375, "global_step": 39641, "epoch": 235} {"train_loss": -7.7693586349487305, "global_step": 39642, "epoch": 235} {"train_loss": -7.8132405281066895, "global_step": 39643, "epoch": 235} {"train_loss": -7.849647521972656, "global_step": 39644, "epoch": 235} {"train_loss": -8.030922889709473, "global_step": 39645, "epoch": 235} {"train_loss": -7.983574867248535, "global_step": 39646, "epoch": 235} {"train_loss": -7.901445999031975, "global_step": 39647, "epoch": 235, "val_loss": 183782.90625, "train_action_mse_error": 11.64102840423584} {"train_loss": -7.823999881744385, "global_step": 39648, "epoch": 236} {"train_loss": -8.059490203857422, "global_step": 39649, "epoch": 236} {"train_loss": -7.781113624572754, "global_step": 39650, "epoch": 236} {"train_loss": -7.898286819458008, "global_step": 39651, "epoch": 236} {"train_loss": -7.7750139236450195, "global_step": 39652, "epoch": 236} {"train_loss": -7.784641742706299, "global_step": 39653, "epoch": 236} {"train_loss": -7.6857452392578125, "global_step": 39654, "epoch": 236} {"train_loss": -7.9031548500061035, "global_step": 39655, "epoch": 236} {"train_loss": -7.719935417175293, "global_step": 39656, "epoch": 236} {"train_loss": -7.889628887176514, "global_step": 39657, "epoch": 236} {"train_loss": -7.854640483856201, "global_step": 39658, "epoch": 236} {"train_loss": -7.952866077423096, "global_step": 39659, "epoch": 236} {"train_loss": -7.689085483551025, "global_step": 39660, "epoch": 236} {"train_loss": -7.793124198913574, "global_step": 39661, "epoch": 236} {"train_loss": -7.997797966003418, "global_step": 39662, "epoch": 236} {"train_loss": -7.894808292388916, "global_step": 39663, "epoch": 236} {"train_loss": -8.017538070678711, "global_step": 39664, "epoch": 236} {"train_loss": -7.801774978637695, "global_step": 39665, "epoch": 236} {"train_loss": -8.05191707611084, "global_step": 39666, "epoch": 236} {"train_loss": -8.081592559814453, "global_step": 39667, "epoch": 236} {"train_loss": -7.825228691101074, "global_step": 39668, "epoch": 236} {"train_loss": -8.142210006713867, "global_step": 39669, "epoch": 236} {"train_loss": -7.862929821014404, "global_step": 39670, "epoch": 236} {"train_loss": -7.8977179527282715, "global_step": 39671, "epoch": 236} {"train_loss": -7.917651176452637, "global_step": 39672, "epoch": 236} {"train_loss": -7.836831092834473, "global_step": 39673, "epoch": 236} {"train_loss": -8.063177108764648, "global_step": 39674, "epoch": 236} {"train_loss": -8.001693725585938, "global_step": 39675, "epoch": 236} {"train_loss": -7.915489673614502, "global_step": 39676, "epoch": 236} {"train_loss": -7.865209579467773, "global_step": 39677, "epoch": 236} {"train_loss": -7.848247051239014, "global_step": 39678, "epoch": 236} {"train_loss": -7.994060039520264, "global_step": 39679, "epoch": 236} {"train_loss": -7.908925533294678, "global_step": 39680, "epoch": 236} {"train_loss": -7.888880252838135, "global_step": 39681, "epoch": 236} {"train_loss": -7.643764019012451, "global_step": 39682, "epoch": 236} {"train_loss": -7.880280494689941, "global_step": 39683, "epoch": 236} {"train_loss": -8.007508277893066, "global_step": 39684, "epoch": 236} {"train_loss": -7.800544261932373, "global_step": 39685, "epoch": 236} {"train_loss": -7.999710559844971, "global_step": 39686, "epoch": 236} {"train_loss": -7.905167102813721, "global_step": 39687, "epoch": 236} {"train_loss": -8.069108009338379, "global_step": 39688, "epoch": 236} {"train_loss": -7.8358612060546875, "global_step": 39689, "epoch": 236} {"train_loss": -7.752641677856445, "global_step": 39690, "epoch": 236} {"train_loss": -7.848371505737305, "global_step": 39691, "epoch": 236} {"train_loss": -7.771319389343262, "global_step": 39692, "epoch": 236} {"train_loss": -7.874341011047363, "global_step": 39693, "epoch": 236} {"train_loss": -7.830924987792969, "global_step": 39694, "epoch": 236} {"train_loss": -7.691596031188965, "global_step": 39695, "epoch": 236} {"train_loss": -7.847522735595703, "global_step": 39696, "epoch": 236} {"train_loss": -7.837872505187988, "global_step": 39697, "epoch": 236} {"train_loss": -8.052116394042969, "global_step": 39698, "epoch": 236} {"train_loss": -7.887910842895508, "global_step": 39699, "epoch": 236} {"train_loss": -7.730301380157471, "global_step": 39700, "epoch": 236} {"train_loss": -7.601165771484375, "global_step": 39701, "epoch": 236} {"train_loss": -8.091625213623047, "global_step": 39702, "epoch": 236} {"train_loss": -7.711277961730957, "global_step": 39703, "epoch": 236} {"train_loss": -7.928483486175537, "global_step": 39704, "epoch": 236} {"train_loss": -7.888053894042969, "global_step": 39705, "epoch": 236} {"train_loss": -8.081075668334961, "global_step": 39706, "epoch": 236} {"train_loss": -7.698348045349121, "global_step": 39707, "epoch": 236} {"train_loss": -7.966525077819824, "global_step": 39708, "epoch": 236} {"train_loss": -7.8084259033203125, "global_step": 39709, "epoch": 236} {"train_loss": -7.668550491333008, "global_step": 39710, "epoch": 236} {"train_loss": -7.888257026672363, "global_step": 39711, "epoch": 236} {"train_loss": -7.719344139099121, "global_step": 39712, "epoch": 236} {"train_loss": -8.041656494140625, "global_step": 39713, "epoch": 236} {"train_loss": -7.951051712036133, "global_step": 39714, "epoch": 236} {"train_loss": -7.995059967041016, "global_step": 39715, "epoch": 236} {"train_loss": -7.75916862487793, "global_step": 39716, "epoch": 236} {"train_loss": -7.987679958343506, "global_step": 39717, "epoch": 236} {"train_loss": -7.934335231781006, "global_step": 39718, "epoch": 236} {"train_loss": -7.898979187011719, "global_step": 39719, "epoch": 236} {"train_loss": -8.23614501953125, "global_step": 39720, "epoch": 236} {"train_loss": -8.123103141784668, "global_step": 39721, "epoch": 236} {"train_loss": -7.8857741355896, "global_step": 39722, "epoch": 236} {"train_loss": -7.869420051574707, "global_step": 39723, "epoch": 236} {"train_loss": -7.86691427230835, "global_step": 39724, "epoch": 236} {"train_loss": -7.76569938659668, "global_step": 39725, "epoch": 236} {"train_loss": -7.921728134155273, "global_step": 39726, "epoch": 236} {"train_loss": -8.031033515930176, "global_step": 39727, "epoch": 236} {"train_loss": -7.924079418182373, "global_step": 39728, "epoch": 236} {"train_loss": -8.020780563354492, "global_step": 39729, "epoch": 236} {"train_loss": -7.851477146148682, "global_step": 39730, "epoch": 236} {"train_loss": -8.18096923828125, "global_step": 39731, "epoch": 236} {"train_loss": -7.866347312927246, "global_step": 39732, "epoch": 236} {"train_loss": -8.008856773376465, "global_step": 39733, "epoch": 236} {"train_loss": -7.921971321105957, "global_step": 39734, "epoch": 236} {"train_loss": -7.7984619140625, "global_step": 39735, "epoch": 236} {"train_loss": -7.902284622192383, "global_step": 39736, "epoch": 236} {"train_loss": -8.220062255859375, "global_step": 39737, "epoch": 236} {"train_loss": -8.012537956237793, "global_step": 39738, "epoch": 236} {"train_loss": -7.95147180557251, "global_step": 39739, "epoch": 236} {"train_loss": -8.120485305786133, "global_step": 39740, "epoch": 236} {"train_loss": -8.079599380493164, "global_step": 39741, "epoch": 236} {"train_loss": -8.029491424560547, "global_step": 39742, "epoch": 236} {"train_loss": -8.042497634887695, "global_step": 39743, "epoch": 236} {"train_loss": -7.990077972412109, "global_step": 39744, "epoch": 236} {"train_loss": -7.7816362380981445, "global_step": 39745, "epoch": 236} {"train_loss": -8.088805198669434, "global_step": 39746, "epoch": 236} {"train_loss": -7.873403549194336, "global_step": 39747, "epoch": 236} {"train_loss": -7.957541465759277, "global_step": 39748, "epoch": 236} {"train_loss": -7.764047622680664, "global_step": 39749, "epoch": 236} {"train_loss": -7.629976272583008, "global_step": 39750, "epoch": 236} {"train_loss": -7.724964141845703, "global_step": 39751, "epoch": 236} {"train_loss": -7.837224006652832, "global_step": 39752, "epoch": 236} {"train_loss": -7.6054182052612305, "global_step": 39753, "epoch": 236} {"train_loss": -7.916654586791992, "global_step": 39754, "epoch": 236} {"train_loss": -7.863986015319824, "global_step": 39755, "epoch": 236} {"train_loss": -7.965559005737305, "global_step": 39756, "epoch": 236} {"train_loss": -7.816375732421875, "global_step": 39757, "epoch": 236} {"train_loss": -8.078967094421387, "global_step": 39758, "epoch": 236} {"train_loss": -7.935557842254639, "global_step": 39759, "epoch": 236} {"train_loss": -7.929626941680908, "global_step": 39760, "epoch": 236} {"train_loss": -7.953567028045654, "global_step": 39761, "epoch": 236} {"train_loss": -7.768889427185059, "global_step": 39762, "epoch": 236} {"train_loss": -7.588817119598389, "global_step": 39763, "epoch": 236} {"train_loss": -7.703587532043457, "global_step": 39764, "epoch": 236} {"train_loss": -7.822694778442383, "global_step": 39765, "epoch": 236} {"train_loss": -7.856917858123779, "global_step": 39766, "epoch": 236} {"train_loss": -7.894937515258789, "global_step": 39767, "epoch": 236} {"train_loss": -7.890035152435303, "global_step": 39768, "epoch": 236} {"train_loss": -7.882955551147461, "global_step": 39769, "epoch": 236} {"train_loss": -7.6404948234558105, "global_step": 39770, "epoch": 236} {"train_loss": -8.049219131469727, "global_step": 39771, "epoch": 236} {"train_loss": -8.020647048950195, "global_step": 39772, "epoch": 236} {"train_loss": -7.896628379821777, "global_step": 39773, "epoch": 236} {"train_loss": -7.649105548858643, "global_step": 39774, "epoch": 236} {"train_loss": -7.913380146026611, "global_step": 39775, "epoch": 236} {"train_loss": -7.7928266525268555, "global_step": 39776, "epoch": 236} {"train_loss": -7.6870646476745605, "global_step": 39777, "epoch": 236} {"train_loss": -8.044240951538086, "global_step": 39778, "epoch": 236} {"train_loss": -7.800360679626465, "global_step": 39779, "epoch": 236} {"train_loss": -7.709308624267578, "global_step": 39780, "epoch": 236} {"train_loss": -7.761143684387207, "global_step": 39781, "epoch": 236} {"train_loss": -7.958585262298584, "global_step": 39782, "epoch": 236} {"train_loss": -7.831034183502197, "global_step": 39783, "epoch": 236} {"train_loss": -7.843811511993408, "global_step": 39784, "epoch": 236} {"train_loss": -7.890345573425293, "global_step": 39785, "epoch": 236} {"train_loss": -7.977728366851807, "global_step": 39786, "epoch": 236} {"train_loss": -7.909160614013672, "global_step": 39787, "epoch": 236} {"train_loss": -7.878537178039551, "global_step": 39788, "epoch": 236} {"train_loss": -7.91252326965332, "global_step": 39789, "epoch": 236} {"train_loss": -7.789873123168945, "global_step": 39790, "epoch": 236} {"train_loss": -8.008944511413574, "global_step": 39791, "epoch": 236} {"train_loss": -7.9131927490234375, "global_step": 39792, "epoch": 236} {"train_loss": -7.908951759338379, "global_step": 39793, "epoch": 236} {"train_loss": -8.01728343963623, "global_step": 39794, "epoch": 236} {"train_loss": -7.8800811767578125, "global_step": 39795, "epoch": 236} {"train_loss": -7.7704267501831055, "global_step": 39796, "epoch": 236} {"train_loss": -8.015894889831543, "global_step": 39797, "epoch": 236} {"train_loss": -7.7720441818237305, "global_step": 39798, "epoch": 236} {"train_loss": -8.004847526550293, "global_step": 39799, "epoch": 236} {"train_loss": -7.702234268188477, "global_step": 39800, "epoch": 236} {"train_loss": -8.206395149230957, "global_step": 39801, "epoch": 236} {"train_loss": -7.752569198608398, "global_step": 39802, "epoch": 236} {"train_loss": -8.141630172729492, "global_step": 39803, "epoch": 236} {"train_loss": -7.678978443145752, "global_step": 39804, "epoch": 236} {"train_loss": -7.927807807922363, "global_step": 39805, "epoch": 236} {"train_loss": -8.182369232177734, "global_step": 39806, "epoch": 236} {"train_loss": -7.865268707275391, "global_step": 39807, "epoch": 236} {"train_loss": -7.822449684143066, "global_step": 39808, "epoch": 236} {"train_loss": -7.8046464920043945, "global_step": 39809, "epoch": 236} {"train_loss": -7.827581405639648, "global_step": 39810, "epoch": 236} {"train_loss": -7.878668785095215, "global_step": 39811, "epoch": 236} {"train_loss": -7.813323974609375, "global_step": 39812, "epoch": 236} {"train_loss": -7.660042762756348, "global_step": 39813, "epoch": 236} {"train_loss": -7.877378463745117, "global_step": 39814, "epoch": 236} {"train_loss": -7.8904435606229875, "global_step": 39815, "epoch": 236, "val_loss": 185413.34375} {"train_loss": -7.850518226623535, "global_step": 39816, "epoch": 237} {"train_loss": -7.942941665649414, "global_step": 39817, "epoch": 237} {"train_loss": -7.955665588378906, "global_step": 39818, "epoch": 237} {"train_loss": -8.016944885253906, "global_step": 39819, "epoch": 237} {"train_loss": -7.942817687988281, "global_step": 39820, "epoch": 237} {"train_loss": -7.715811252593994, "global_step": 39821, "epoch": 237} {"train_loss": -7.832857608795166, "global_step": 39822, "epoch": 237} {"train_loss": -7.943587303161621, "global_step": 39823, "epoch": 237} {"train_loss": -7.93489408493042, "global_step": 39824, "epoch": 237} {"train_loss": -7.485047340393066, "global_step": 39825, "epoch": 237} {"train_loss": -8.075236320495605, "global_step": 39826, "epoch": 237} {"train_loss": -7.6713337898254395, "global_step": 39827, "epoch": 237} {"train_loss": -7.9929704666137695, "global_step": 39828, "epoch": 237} {"train_loss": -7.505082130432129, "global_step": 39829, "epoch": 237} {"train_loss": -7.941810607910156, "global_step": 39830, "epoch": 237} {"train_loss": -7.719357967376709, "global_step": 39831, "epoch": 237} {"train_loss": -8.020339965820312, "global_step": 39832, "epoch": 237} {"train_loss": -8.047857284545898, "global_step": 39833, "epoch": 237} {"train_loss": -7.819695949554443, "global_step": 39834, "epoch": 237} {"train_loss": -7.927618980407715, "global_step": 39835, "epoch": 237} {"train_loss": -7.966219425201416, "global_step": 39836, "epoch": 237} {"train_loss": -7.736610412597656, "global_step": 39837, "epoch": 237} {"train_loss": -7.920668601989746, "global_step": 39838, "epoch": 237} {"train_loss": -7.884214401245117, "global_step": 39839, "epoch": 237} {"train_loss": -7.5684404373168945, "global_step": 39840, "epoch": 237} {"train_loss": -7.953399181365967, "global_step": 39841, "epoch": 237} {"train_loss": -7.834775447845459, "global_step": 39842, "epoch": 237} {"train_loss": -7.981682777404785, "global_step": 39843, "epoch": 237} {"train_loss": -7.984698295593262, "global_step": 39844, "epoch": 237} {"train_loss": -7.905271530151367, "global_step": 39845, "epoch": 237} {"train_loss": -7.884745121002197, "global_step": 39846, "epoch": 237} {"train_loss": -7.9254150390625, "global_step": 39847, "epoch": 237} {"train_loss": -7.81558895111084, "global_step": 39848, "epoch": 237} {"train_loss": -7.8717217445373535, "global_step": 39849, "epoch": 237} {"train_loss": -7.925326347351074, "global_step": 39850, "epoch": 237} {"train_loss": -7.574548721313477, "global_step": 39851, "epoch": 237} {"train_loss": -7.856939315795898, "global_step": 39852, "epoch": 237} {"train_loss": -7.958288192749023, "global_step": 39853, "epoch": 237} {"train_loss": -7.949049949645996, "global_step": 39854, "epoch": 237} {"train_loss": -7.728737831115723, "global_step": 39855, "epoch": 237} {"train_loss": -8.057394981384277, "global_step": 39856, "epoch": 237} {"train_loss": -8.021044731140137, "global_step": 39857, "epoch": 237} {"train_loss": -7.628684997558594, "global_step": 39858, "epoch": 237} {"train_loss": -8.155519485473633, "global_step": 39859, "epoch": 237} {"train_loss": -7.9837212562561035, "global_step": 39860, "epoch": 237} {"train_loss": -7.933276653289795, "global_step": 39861, "epoch": 237} {"train_loss": -7.981661796569824, "global_step": 39862, "epoch": 237} {"train_loss": -8.001900672912598, "global_step": 39863, "epoch": 237} {"train_loss": -7.860266208648682, "global_step": 39864, "epoch": 237} {"train_loss": -7.88471794128418, "global_step": 39865, "epoch": 237} {"train_loss": -8.133050918579102, "global_step": 39866, "epoch": 237} {"train_loss": -8.089083671569824, "global_step": 39867, "epoch": 237} {"train_loss": -8.131403923034668, "global_step": 39868, "epoch": 237} {"train_loss": -8.200603485107422, "global_step": 39869, "epoch": 237} {"train_loss": -8.070249557495117, "global_step": 39870, "epoch": 237} {"train_loss": -8.097280502319336, "global_step": 39871, "epoch": 237} {"train_loss": -8.17572021484375, "global_step": 39872, "epoch": 237} {"train_loss": -7.9233198165893555, "global_step": 39873, "epoch": 237} {"train_loss": -7.821713447570801, "global_step": 39874, "epoch": 237} {"train_loss": -7.85542106628418, "global_step": 39875, "epoch": 237} {"train_loss": -7.843628406524658, "global_step": 39876, "epoch": 237} {"train_loss": -8.147491455078125, "global_step": 39877, "epoch": 237} {"train_loss": -7.983369827270508, "global_step": 39878, "epoch": 237} {"train_loss": -7.823944568634033, "global_step": 39879, "epoch": 237} {"train_loss": -7.9796552658081055, "global_step": 39880, "epoch": 237} {"train_loss": -8.057191848754883, "global_step": 39881, "epoch": 237} {"train_loss": -8.15523910522461, "global_step": 39882, "epoch": 237} {"train_loss": -7.9198455810546875, "global_step": 39883, "epoch": 237} {"train_loss": -7.72087287902832, "global_step": 39884, "epoch": 237} {"train_loss": -8.031822204589844, "global_step": 39885, "epoch": 237} {"train_loss": -7.871644973754883, "global_step": 39886, "epoch": 237} {"train_loss": -7.926548957824707, "global_step": 39887, "epoch": 237} {"train_loss": -7.948068618774414, "global_step": 39888, "epoch": 237} {"train_loss": -7.622488021850586, "global_step": 39889, "epoch": 237} {"train_loss": -8.076763153076172, "global_step": 39890, "epoch": 237} {"train_loss": -7.850749969482422, "global_step": 39891, "epoch": 237} {"train_loss": -7.642180919647217, "global_step": 39892, "epoch": 237} {"train_loss": -7.411115646362305, "global_step": 39893, "epoch": 237} {"train_loss": -7.654125213623047, "global_step": 39894, "epoch": 237} {"train_loss": -7.65983772277832, "global_step": 39895, "epoch": 237} {"train_loss": -7.3762030601501465, "global_step": 39896, "epoch": 237} {"train_loss": -7.638772487640381, "global_step": 39897, "epoch": 237} {"train_loss": -7.581360816955566, "global_step": 39898, "epoch": 237} {"train_loss": -7.789094924926758, "global_step": 39899, "epoch": 237} {"train_loss": -7.660219192504883, "global_step": 39900, "epoch": 237} {"train_loss": -7.831755638122559, "global_step": 39901, "epoch": 237} {"train_loss": -7.793262958526611, "global_step": 39902, "epoch": 237} {"train_loss": -7.804368019104004, "global_step": 39903, "epoch": 237} {"train_loss": -7.635348320007324, "global_step": 39904, "epoch": 237} {"train_loss": -7.866569519042969, "global_step": 39905, "epoch": 237} {"train_loss": -7.732924461364746, "global_step": 39906, "epoch": 237} {"train_loss": -7.742546081542969, "global_step": 39907, "epoch": 237} {"train_loss": -7.834444046020508, "global_step": 39908, "epoch": 237} {"train_loss": -7.926490783691406, "global_step": 39909, "epoch": 237} {"train_loss": -7.885937690734863, "global_step": 39910, "epoch": 237} {"train_loss": -7.992118835449219, "global_step": 39911, "epoch": 237} {"train_loss": -7.880688667297363, "global_step": 39912, "epoch": 237} {"train_loss": -8.015464782714844, "global_step": 39913, "epoch": 237} {"train_loss": -7.7607927322387695, "global_step": 39914, "epoch": 237} {"train_loss": -8.02937126159668, "global_step": 39915, "epoch": 237} {"train_loss": -7.974935054779053, "global_step": 39916, "epoch": 237} {"train_loss": -7.8777055740356445, "global_step": 39917, "epoch": 237} {"train_loss": -7.9225053787231445, "global_step": 39918, "epoch": 237} {"train_loss": -7.718714714050293, "global_step": 39919, "epoch": 237} {"train_loss": -7.876440048217773, "global_step": 39920, "epoch": 237} {"train_loss": -7.867715835571289, "global_step": 39921, "epoch": 237} {"train_loss": -8.002798080444336, "global_step": 39922, "epoch": 237} {"train_loss": -7.772960662841797, "global_step": 39923, "epoch": 237} {"train_loss": -7.908010959625244, "global_step": 39924, "epoch": 237} {"train_loss": -7.839410781860352, "global_step": 39925, "epoch": 237} {"train_loss": -7.8610029220581055, "global_step": 39926, "epoch": 237} {"train_loss": -7.560091018676758, "global_step": 39927, "epoch": 237} {"train_loss": -7.8304290771484375, "global_step": 39928, "epoch": 237} {"train_loss": -7.575244903564453, "global_step": 39929, "epoch": 237} {"train_loss": -7.860655307769775, "global_step": 39930, "epoch": 237} {"train_loss": -7.73576545715332, "global_step": 39931, "epoch": 237} {"train_loss": -7.682927131652832, "global_step": 39932, "epoch": 237} {"train_loss": -7.701255798339844, "global_step": 39933, "epoch": 237} {"train_loss": -7.852375030517578, "global_step": 39934, "epoch": 237} {"train_loss": -7.674940586090088, "global_step": 39935, "epoch": 237} {"train_loss": -7.909244537353516, "global_step": 39936, "epoch": 237} {"train_loss": -7.788885116577148, "global_step": 39937, "epoch": 237} {"train_loss": -7.80947732925415, "global_step": 39938, "epoch": 237} {"train_loss": -7.878565788269043, "global_step": 39939, "epoch": 237} {"train_loss": -7.760168075561523, "global_step": 39940, "epoch": 237} {"train_loss": -7.990237236022949, "global_step": 39941, "epoch": 237} {"train_loss": -7.734265327453613, "global_step": 39942, "epoch": 237} {"train_loss": -8.014996528625488, "global_step": 39943, "epoch": 237} {"train_loss": -7.650338649749756, "global_step": 39944, "epoch": 237} {"train_loss": -7.9769721031188965, "global_step": 39945, "epoch": 237} {"train_loss": -7.8732709884643555, "global_step": 39946, "epoch": 237} {"train_loss": -7.964229583740234, "global_step": 39947, "epoch": 237} {"train_loss": -7.734580039978027, "global_step": 39948, "epoch": 237} {"train_loss": -7.831723213195801, "global_step": 39949, "epoch": 237} {"train_loss": -7.87493896484375, "global_step": 39950, "epoch": 237} {"train_loss": -7.741428852081299, "global_step": 39951, "epoch": 237} {"train_loss": -8.105899810791016, "global_step": 39952, "epoch": 237} {"train_loss": -7.859144687652588, "global_step": 39953, "epoch": 237} {"train_loss": -8.071374893188477, "global_step": 39954, "epoch": 237} {"train_loss": -7.915086269378662, "global_step": 39955, "epoch": 237} {"train_loss": -8.127154350280762, "global_step": 39956, "epoch": 237} {"train_loss": -7.771805763244629, "global_step": 39957, "epoch": 237} {"train_loss": -8.079155921936035, "global_step": 39958, "epoch": 237} {"train_loss": -7.806173324584961, "global_step": 39959, "epoch": 237} {"train_loss": -7.8748779296875, "global_step": 39960, "epoch": 237} {"train_loss": -7.726241111755371, "global_step": 39961, "epoch": 237} {"train_loss": -7.926490306854248, "global_step": 39962, "epoch": 237} {"train_loss": -8.060807228088379, "global_step": 39963, "epoch": 237} {"train_loss": -7.898818492889404, "global_step": 39964, "epoch": 237} {"train_loss": -7.831625938415527, "global_step": 39965, "epoch": 237} {"train_loss": -8.158186912536621, "global_step": 39966, "epoch": 237} {"train_loss": -8.010649681091309, "global_step": 39967, "epoch": 237} {"train_loss": -7.924311637878418, "global_step": 39968, "epoch": 237} {"train_loss": -7.947649955749512, "global_step": 39969, "epoch": 237} {"train_loss": -8.065526962280273, "global_step": 39970, "epoch": 237} {"train_loss": -7.9623236656188965, "global_step": 39971, "epoch": 237} {"train_loss": -7.997501373291016, "global_step": 39972, "epoch": 237} {"train_loss": -7.9124627113342285, "global_step": 39973, "epoch": 237} {"train_loss": -7.895944595336914, "global_step": 39974, "epoch": 237} {"train_loss": -7.849703311920166, "global_step": 39975, "epoch": 237} {"train_loss": -8.286839485168457, "global_step": 39976, "epoch": 237} {"train_loss": -7.887988090515137, "global_step": 39977, "epoch": 237} {"train_loss": -8.025384902954102, "global_step": 39978, "epoch": 237} {"train_loss": -7.932890892028809, "global_step": 39979, "epoch": 237} {"train_loss": -7.954563140869141, "global_step": 39980, "epoch": 237} {"train_loss": -7.936470031738281, "global_step": 39981, "epoch": 237} {"train_loss": -7.811777114868164, "global_step": 39982, "epoch": 237} {"train_loss": -7.880125809283483, "global_step": 39983, "epoch": 237, "val_loss": 187233.609375} {"train_loss": -7.726677894592285, "global_step": 39984, "epoch": 238} {"train_loss": -7.878742218017578, "global_step": 39985, "epoch": 238} {"train_loss": -7.802916526794434, "global_step": 39986, "epoch": 238} {"train_loss": -8.121635437011719, "global_step": 39987, "epoch": 238} {"train_loss": -7.837867736816406, "global_step": 39988, "epoch": 238} {"train_loss": -7.927063941955566, "global_step": 39989, "epoch": 238} {"train_loss": -7.788843154907227, "global_step": 39990, "epoch": 238} {"train_loss": -7.938381195068359, "global_step": 39991, "epoch": 238} {"train_loss": -7.808571815490723, "global_step": 39992, "epoch": 238} {"train_loss": -8.07490348815918, "global_step": 39993, "epoch": 238} {"train_loss": -7.683234691619873, "global_step": 39994, "epoch": 238} {"train_loss": -7.821680068969727, "global_step": 39995, "epoch": 238} {"train_loss": -7.862556457519531, "global_step": 39996, "epoch": 238} {"train_loss": -7.874672889709473, "global_step": 39997, "epoch": 238} {"train_loss": -8.04751205444336, "global_step": 39998, "epoch": 238} {"train_loss": -7.956208229064941, "global_step": 39999, "epoch": 238} {"train_loss": -8.178301811218262, "global_step": 40000, "epoch": 238} {"train_loss": -8.163382530212402, "global_step": 40001, "epoch": 238} {"train_loss": -8.043636322021484, "global_step": 40002, "epoch": 238} {"train_loss": -8.086935043334961, "global_step": 40003, "epoch": 238} {"train_loss": -7.84557580947876, "global_step": 40004, "epoch": 238} {"train_loss": -7.716734886169434, "global_step": 40005, "epoch": 238} {"train_loss": -8.09780502319336, "global_step": 40006, "epoch": 238} {"train_loss": -8.1744966506958, "global_step": 40007, "epoch": 238} {"train_loss": -7.9732770919799805, "global_step": 40008, "epoch": 238} {"train_loss": -7.984654426574707, "global_step": 40009, "epoch": 238} {"train_loss": -7.989816188812256, "global_step": 40010, "epoch": 238} {"train_loss": -8.064521789550781, "global_step": 40011, "epoch": 238} {"train_loss": -8.070423126220703, "global_step": 40012, "epoch": 238} {"train_loss": -8.140702247619629, "global_step": 40013, "epoch": 238} {"train_loss": -7.873666763305664, "global_step": 40014, "epoch": 238} {"train_loss": -8.15440559387207, "global_step": 40015, "epoch": 238} {"train_loss": -7.748290061950684, "global_step": 40016, "epoch": 238} {"train_loss": -7.933340072631836, "global_step": 40017, "epoch": 238} {"train_loss": -7.858890533447266, "global_step": 40018, "epoch": 238} {"train_loss": -8.292940139770508, "global_step": 40019, "epoch": 238} {"train_loss": -7.81184720993042, "global_step": 40020, "epoch": 238} {"train_loss": -8.070867538452148, "global_step": 40021, "epoch": 238} {"train_loss": -7.874207019805908, "global_step": 40022, "epoch": 238} {"train_loss": -8.141908645629883, "global_step": 40023, "epoch": 238} {"train_loss": -7.893672943115234, "global_step": 40024, "epoch": 238} {"train_loss": -7.9353742599487305, "global_step": 40025, "epoch": 238} {"train_loss": -7.871161460876465, "global_step": 40026, "epoch": 238} {"train_loss": -7.641086101531982, "global_step": 40027, "epoch": 238} {"train_loss": -8.016051292419434, "global_step": 40028, "epoch": 238} {"train_loss": -7.95035457611084, "global_step": 40029, "epoch": 238} {"train_loss": -7.951877593994141, "global_step": 40030, "epoch": 238} {"train_loss": -8.093894004821777, "global_step": 40031, "epoch": 238} {"train_loss": -7.768977165222168, "global_step": 40032, "epoch": 238} {"train_loss": -8.082383155822754, "global_step": 40033, "epoch": 238} {"train_loss": -8.11112117767334, "global_step": 40034, "epoch": 238} {"train_loss": -8.150287628173828, "global_step": 40035, "epoch": 238} {"train_loss": -7.980507850646973, "global_step": 40036, "epoch": 238} {"train_loss": -7.688566207885742, "global_step": 40037, "epoch": 238} {"train_loss": -7.892290115356445, "global_step": 40038, "epoch": 238} {"train_loss": -8.039985656738281, "global_step": 40039, "epoch": 238} {"train_loss": -7.771889686584473, "global_step": 40040, "epoch": 238} {"train_loss": -7.7614030838012695, "global_step": 40041, "epoch": 238} {"train_loss": -7.923009872436523, "global_step": 40042, "epoch": 238} {"train_loss": -7.811130523681641, "global_step": 40043, "epoch": 238} {"train_loss": -7.84733772277832, "global_step": 40044, "epoch": 238} {"train_loss": -8.102352142333984, "global_step": 40045, "epoch": 238} {"train_loss": -7.977345943450928, "global_step": 40046, "epoch": 238} {"train_loss": -7.787234306335449, "global_step": 40047, "epoch": 238} {"train_loss": -7.971334457397461, "global_step": 40048, "epoch": 238} {"train_loss": -8.034566879272461, "global_step": 40049, "epoch": 238} {"train_loss": -8.1239013671875, "global_step": 40050, "epoch": 238} {"train_loss": -7.941720962524414, "global_step": 40051, "epoch": 238} {"train_loss": -8.177148818969727, "global_step": 40052, "epoch": 238} {"train_loss": -7.734600067138672, "global_step": 40053, "epoch": 238} {"train_loss": -8.249441146850586, "global_step": 40054, "epoch": 238} {"train_loss": -7.926662445068359, "global_step": 40055, "epoch": 238} {"train_loss": -7.668656349182129, "global_step": 40056, "epoch": 238} {"train_loss": -7.968549728393555, "global_step": 40057, "epoch": 238} {"train_loss": -7.86680793762207, "global_step": 40058, "epoch": 238} {"train_loss": -8.083732604980469, "global_step": 40059, "epoch": 238} {"train_loss": -7.855915069580078, "global_step": 40060, "epoch": 238} {"train_loss": -7.918461322784424, "global_step": 40061, "epoch": 238} {"train_loss": -7.784758567810059, "global_step": 40062, "epoch": 238} {"train_loss": -7.990215301513672, "global_step": 40063, "epoch": 238} {"train_loss": -7.666823863983154, "global_step": 40064, "epoch": 238} {"train_loss": -7.980813503265381, "global_step": 40065, "epoch": 238} {"train_loss": -7.839826583862305, "global_step": 40066, "epoch": 238} {"train_loss": -7.809877872467041, "global_step": 40067, "epoch": 238} {"train_loss": -8.05337142944336, "global_step": 40068, "epoch": 238} {"train_loss": -8.081114768981934, "global_step": 40069, "epoch": 238} {"train_loss": -8.074507713317871, "global_step": 40070, "epoch": 238} {"train_loss": -8.0225830078125, "global_step": 40071, "epoch": 238} {"train_loss": -7.976779937744141, "global_step": 40072, "epoch": 238} {"train_loss": -8.161962509155273, "global_step": 40073, "epoch": 238} {"train_loss": -7.806604385375977, "global_step": 40074, "epoch": 238} {"train_loss": -7.778735160827637, "global_step": 40075, "epoch": 238} {"train_loss": -8.13076400756836, "global_step": 40076, "epoch": 238} {"train_loss": -7.760912895202637, "global_step": 40077, "epoch": 238} {"train_loss": -8.000972747802734, "global_step": 40078, "epoch": 238} {"train_loss": -7.769780158996582, "global_step": 40079, "epoch": 238} {"train_loss": -7.981875419616699, "global_step": 40080, "epoch": 238} {"train_loss": -7.839561462402344, "global_step": 40081, "epoch": 238} {"train_loss": -7.810628890991211, "global_step": 40082, "epoch": 238} {"train_loss": -7.925130367279053, "global_step": 40083, "epoch": 238} {"train_loss": -7.931297779083252, "global_step": 40084, "epoch": 238} {"train_loss": -7.862845420837402, "global_step": 40085, "epoch": 238} {"train_loss": -8.013474464416504, "global_step": 40086, "epoch": 238} {"train_loss": -7.990466117858887, "global_step": 40087, "epoch": 238} {"train_loss": -8.076408386230469, "global_step": 40088, "epoch": 238} {"train_loss": -7.77493953704834, "global_step": 40089, "epoch": 238} {"train_loss": -7.7153825759887695, "global_step": 40090, "epoch": 238} {"train_loss": -7.834897994995117, "global_step": 40091, "epoch": 238} {"train_loss": -7.983945846557617, "global_step": 40092, "epoch": 238} {"train_loss": -7.793829917907715, "global_step": 40093, "epoch": 238} {"train_loss": -7.9410905838012695, "global_step": 40094, "epoch": 238} {"train_loss": -8.028690338134766, "global_step": 40095, "epoch": 238} {"train_loss": -7.969785690307617, "global_step": 40096, "epoch": 238} {"train_loss": -8.146427154541016, "global_step": 40097, "epoch": 238} {"train_loss": -7.822164535522461, "global_step": 40098, "epoch": 238} {"train_loss": -7.950798988342285, "global_step": 40099, "epoch": 238} {"train_loss": -8.08839225769043, "global_step": 40100, "epoch": 238} {"train_loss": -8.20784854888916, "global_step": 40101, "epoch": 238} {"train_loss": -8.260974884033203, "global_step": 40102, "epoch": 238} {"train_loss": -8.219240188598633, "global_step": 40103, "epoch": 238} {"train_loss": -8.054335594177246, "global_step": 40104, "epoch": 238} {"train_loss": -7.987628936767578, "global_step": 40105, "epoch": 238} {"train_loss": -7.967859268188477, "global_step": 40106, "epoch": 238} {"train_loss": -8.008304595947266, "global_step": 40107, "epoch": 238} {"train_loss": -8.0740327835083, "global_step": 40108, "epoch": 238} {"train_loss": -8.161478996276855, "global_step": 40109, "epoch": 238} {"train_loss": -7.878293991088867, "global_step": 40110, "epoch": 238} {"train_loss": -8.065448760986328, "global_step": 40111, "epoch": 238} {"train_loss": -8.111204147338867, "global_step": 40112, "epoch": 238} {"train_loss": -8.023585319519043, "global_step": 40113, "epoch": 238} {"train_loss": -8.228550910949707, "global_step": 40114, "epoch": 238} {"train_loss": -7.803030967712402, "global_step": 40115, "epoch": 238} {"train_loss": -7.792182445526123, "global_step": 40116, "epoch": 238} {"train_loss": -7.919577598571777, "global_step": 40117, "epoch": 238} {"train_loss": -7.998269081115723, "global_step": 40118, "epoch": 238} {"train_loss": -7.855721950531006, "global_step": 40119, "epoch": 238} {"train_loss": -7.784438133239746, "global_step": 40120, "epoch": 238} {"train_loss": -8.183058738708496, "global_step": 40121, "epoch": 238} {"train_loss": -8.047249794006348, "global_step": 40122, "epoch": 238} {"train_loss": -8.059187889099121, "global_step": 40123, "epoch": 238} {"train_loss": -7.873961448669434, "global_step": 40124, "epoch": 238} {"train_loss": -8.164946556091309, "global_step": 40125, "epoch": 238} {"train_loss": -7.765603065490723, "global_step": 40126, "epoch": 238} {"train_loss": -7.940996170043945, "global_step": 40127, "epoch": 238} {"train_loss": -7.682586669921875, "global_step": 40128, "epoch": 238} {"train_loss": -7.920805931091309, "global_step": 40129, "epoch": 238} {"train_loss": -7.805205821990967, "global_step": 40130, "epoch": 238} {"train_loss": -7.966205596923828, "global_step": 40131, "epoch": 238} {"train_loss": -7.777345657348633, "global_step": 40132, "epoch": 238} {"train_loss": -8.103277206420898, "global_step": 40133, "epoch": 238} {"train_loss": -7.918632984161377, "global_step": 40134, "epoch": 238} {"train_loss": -7.959181785583496, "global_step": 40135, "epoch": 238} {"train_loss": -7.823045253753662, "global_step": 40136, "epoch": 238} {"train_loss": -7.834343910217285, "global_step": 40137, "epoch": 238} {"train_loss": -7.9491777420043945, "global_step": 40138, "epoch": 238} {"train_loss": -7.887844562530518, "global_step": 40139, "epoch": 238} {"train_loss": -7.990146160125732, "global_step": 40140, "epoch": 238} {"train_loss": -7.941129684448242, "global_step": 40141, "epoch": 238} {"train_loss": -7.692632675170898, "global_step": 40142, "epoch": 238} {"train_loss": -7.928843975067139, "global_step": 40143, "epoch": 238} {"train_loss": -7.663937091827393, "global_step": 40144, "epoch": 238} {"train_loss": -7.740792274475098, "global_step": 40145, "epoch": 238} {"train_loss": -7.888403415679932, "global_step": 40146, "epoch": 238} {"train_loss": -7.861458778381348, "global_step": 40147, "epoch": 238} {"train_loss": -7.989525318145752, "global_step": 40148, "epoch": 238} {"train_loss": -7.960266590118408, "global_step": 40149, "epoch": 238} {"train_loss": -7.982203483581543, "global_step": 40150, "epoch": 238} {"train_loss": -7.945252435547965, "global_step": 40151, "epoch": 238, "val_loss": 187476.8125} {"train_loss": -7.881770610809326, "global_step": 40152, "epoch": 239} {"train_loss": -7.802786827087402, "global_step": 40153, "epoch": 239} {"train_loss": -7.937549591064453, "global_step": 40154, "epoch": 239} {"train_loss": -7.878757476806641, "global_step": 40155, "epoch": 239} {"train_loss": -7.794585227966309, "global_step": 40156, "epoch": 239} {"train_loss": -8.0128173828125, "global_step": 40157, "epoch": 239} {"train_loss": -7.9202117919921875, "global_step": 40158, "epoch": 239} {"train_loss": -8.071348190307617, "global_step": 40159, "epoch": 239} {"train_loss": -8.100529670715332, "global_step": 40160, "epoch": 239} {"train_loss": -7.963708877563477, "global_step": 40161, "epoch": 239} {"train_loss": -7.724600315093994, "global_step": 40162, "epoch": 239} {"train_loss": -7.975137233734131, "global_step": 40163, "epoch": 239} {"train_loss": -7.6928300857543945, "global_step": 40164, "epoch": 239} {"train_loss": -8.125999450683594, "global_step": 40165, "epoch": 239} {"train_loss": -7.880516529083252, "global_step": 40166, "epoch": 239} {"train_loss": -7.9555535316467285, "global_step": 40167, "epoch": 239} {"train_loss": -7.925212860107422, "global_step": 40168, "epoch": 239} {"train_loss": -7.862727165222168, "global_step": 40169, "epoch": 239} {"train_loss": -7.742558479309082, "global_step": 40170, "epoch": 239} {"train_loss": -7.820252418518066, "global_step": 40171, "epoch": 239} {"train_loss": -7.860169410705566, "global_step": 40172, "epoch": 239} {"train_loss": -8.100870132446289, "global_step": 40173, "epoch": 239} {"train_loss": -8.14126205444336, "global_step": 40174, "epoch": 239} {"train_loss": -7.945224761962891, "global_step": 40175, "epoch": 239} {"train_loss": -8.020801544189453, "global_step": 40176, "epoch": 239} {"train_loss": -8.06346607208252, "global_step": 40177, "epoch": 239} {"train_loss": -7.985228061676025, "global_step": 40178, "epoch": 239} {"train_loss": -8.027511596679688, "global_step": 40179, "epoch": 239} {"train_loss": -7.837433338165283, "global_step": 40180, "epoch": 239} {"train_loss": -7.848684310913086, "global_step": 40181, "epoch": 239} {"train_loss": -7.455842971801758, "global_step": 40182, "epoch": 239} {"train_loss": -7.815395355224609, "global_step": 40183, "epoch": 239} {"train_loss": -7.499213218688965, "global_step": 40184, "epoch": 239} {"train_loss": -7.970656394958496, "global_step": 40185, "epoch": 239} {"train_loss": -7.960412502288818, "global_step": 40186, "epoch": 239} {"train_loss": -7.942582130432129, "global_step": 40187, "epoch": 239} {"train_loss": -7.8885321617126465, "global_step": 40188, "epoch": 239} {"train_loss": -7.933242321014404, "global_step": 40189, "epoch": 239} {"train_loss": -7.905668258666992, "global_step": 40190, "epoch": 239} {"train_loss": -7.886546611785889, "global_step": 40191, "epoch": 239} {"train_loss": -7.837134838104248, "global_step": 40192, "epoch": 239} {"train_loss": -8.067634582519531, "global_step": 40193, "epoch": 239} {"train_loss": -7.852686882019043, "global_step": 40194, "epoch": 239} {"train_loss": -7.763621807098389, "global_step": 40195, "epoch": 239} {"train_loss": -7.6884026527404785, "global_step": 40196, "epoch": 239} {"train_loss": -7.905755996704102, "global_step": 40197, "epoch": 239} {"train_loss": -7.788551330566406, "global_step": 40198, "epoch": 239} {"train_loss": -8.115768432617188, "global_step": 40199, "epoch": 239} {"train_loss": -8.171417236328125, "global_step": 40200, "epoch": 239} {"train_loss": -8.140050888061523, "global_step": 40201, "epoch": 239} {"train_loss": -8.1200590133667, "global_step": 40202, "epoch": 239} {"train_loss": -7.753125190734863, "global_step": 40203, "epoch": 239} {"train_loss": -7.880659580230713, "global_step": 40204, "epoch": 239} {"train_loss": -7.841010093688965, "global_step": 40205, "epoch": 239} {"train_loss": -7.766183376312256, "global_step": 40206, "epoch": 239} {"train_loss": -8.042194366455078, "global_step": 40207, "epoch": 239} {"train_loss": -7.559966087341309, "global_step": 40208, "epoch": 239} {"train_loss": -7.713675498962402, "global_step": 40209, "epoch": 239} {"train_loss": -7.593011856079102, "global_step": 40210, "epoch": 239} {"train_loss": -7.852003574371338, "global_step": 40211, "epoch": 239} {"train_loss": -7.513509273529053, "global_step": 40212, "epoch": 239} {"train_loss": -7.778918743133545, "global_step": 40213, "epoch": 239} {"train_loss": -7.836949348449707, "global_step": 40214, "epoch": 239} {"train_loss": -7.745851039886475, "global_step": 40215, "epoch": 239} {"train_loss": -7.578450679779053, "global_step": 40216, "epoch": 239} {"train_loss": -7.820943355560303, "global_step": 40217, "epoch": 239} {"train_loss": -8.128637313842773, "global_step": 40218, "epoch": 239} {"train_loss": -7.730725288391113, "global_step": 40219, "epoch": 239} {"train_loss": -7.7981157302856445, "global_step": 40220, "epoch": 239} {"train_loss": -7.868485450744629, "global_step": 40221, "epoch": 239} {"train_loss": -8.00473403930664, "global_step": 40222, "epoch": 239} {"train_loss": -7.801750659942627, "global_step": 40223, "epoch": 239} {"train_loss": -8.026857376098633, "global_step": 40224, "epoch": 239} {"train_loss": -7.949485778808594, "global_step": 40225, "epoch": 239} {"train_loss": -7.913114070892334, "global_step": 40226, "epoch": 239} {"train_loss": -7.946032524108887, "global_step": 40227, "epoch": 239} {"train_loss": -8.240278244018555, "global_step": 40228, "epoch": 239} {"train_loss": -8.016458511352539, "global_step": 40229, "epoch": 239} {"train_loss": -7.788654804229736, "global_step": 40230, "epoch": 239} {"train_loss": -7.883591175079346, "global_step": 40231, "epoch": 239} {"train_loss": -7.995638847351074, "global_step": 40232, "epoch": 239} {"train_loss": -8.092395782470703, "global_step": 40233, "epoch": 239} {"train_loss": -7.788220405578613, "global_step": 40234, "epoch": 239} {"train_loss": -8.186872482299805, "global_step": 40235, "epoch": 239} {"train_loss": -8.057920455932617, "global_step": 40236, "epoch": 239} {"train_loss": -8.023323059082031, "global_step": 40237, "epoch": 239} {"train_loss": -8.09887409210205, "global_step": 40238, "epoch": 239} {"train_loss": -7.807185649871826, "global_step": 40239, "epoch": 239} {"train_loss": -7.865823745727539, "global_step": 40240, "epoch": 239} {"train_loss": -7.820910453796387, "global_step": 40241, "epoch": 239} {"train_loss": -7.8387250900268555, "global_step": 40242, "epoch": 239} {"train_loss": -7.914161682128906, "global_step": 40243, "epoch": 239} {"train_loss": -7.779574871063232, "global_step": 40244, "epoch": 239} {"train_loss": -7.890723705291748, "global_step": 40245, "epoch": 239} {"train_loss": -8.096647262573242, "global_step": 40246, "epoch": 239} {"train_loss": -7.73813533782959, "global_step": 40247, "epoch": 239} {"train_loss": -7.88796854019165, "global_step": 40248, "epoch": 239} {"train_loss": -8.045836448669434, "global_step": 40249, "epoch": 239} {"train_loss": -7.840492248535156, "global_step": 40250, "epoch": 239} {"train_loss": -7.978966236114502, "global_step": 40251, "epoch": 239} {"train_loss": -8.071434020996094, "global_step": 40252, "epoch": 239} {"train_loss": -7.985486030578613, "global_step": 40253, "epoch": 239} {"train_loss": -7.993377685546875, "global_step": 40254, "epoch": 239} {"train_loss": -7.9778642654418945, "global_step": 40255, "epoch": 239} {"train_loss": -7.845996856689453, "global_step": 40256, "epoch": 239} {"train_loss": -8.005904197692871, "global_step": 40257, "epoch": 239} {"train_loss": -7.986189842224121, "global_step": 40258, "epoch": 239} {"train_loss": -8.134340286254883, "global_step": 40259, "epoch": 239} {"train_loss": -7.923521518707275, "global_step": 40260, "epoch": 239} {"train_loss": -8.093215942382812, "global_step": 40261, "epoch": 239} {"train_loss": -7.9706573486328125, "global_step": 40262, "epoch": 239} {"train_loss": -8.134061813354492, "global_step": 40263, "epoch": 239} {"train_loss": -7.927199363708496, "global_step": 40264, "epoch": 239} {"train_loss": -8.024723052978516, "global_step": 40265, "epoch": 239} {"train_loss": -8.07474136352539, "global_step": 40266, "epoch": 239} {"train_loss": -8.059917449951172, "global_step": 40267, "epoch": 239} {"train_loss": -8.295882225036621, "global_step": 40268, "epoch": 239} {"train_loss": -7.837555885314941, "global_step": 40269, "epoch": 239} {"train_loss": -8.190082550048828, "global_step": 40270, "epoch": 239} {"train_loss": -8.051552772521973, "global_step": 40271, "epoch": 239} {"train_loss": -8.026622772216797, "global_step": 40272, "epoch": 239} {"train_loss": -7.800003528594971, "global_step": 40273, "epoch": 239} {"train_loss": -8.301921844482422, "global_step": 40274, "epoch": 239} {"train_loss": -7.725050926208496, "global_step": 40275, "epoch": 239} {"train_loss": -8.115785598754883, "global_step": 40276, "epoch": 239} {"train_loss": -7.711910724639893, "global_step": 40277, "epoch": 239} {"train_loss": -7.840961456298828, "global_step": 40278, "epoch": 239} {"train_loss": -7.936985492706299, "global_step": 40279, "epoch": 239} {"train_loss": -7.809819221496582, "global_step": 40280, "epoch": 239} {"train_loss": -7.975314140319824, "global_step": 40281, "epoch": 239} {"train_loss": -7.650687217712402, "global_step": 40282, "epoch": 239} {"train_loss": -8.062692642211914, "global_step": 40283, "epoch": 239} {"train_loss": -7.59819221496582, "global_step": 40284, "epoch": 239} {"train_loss": -7.719809055328369, "global_step": 40285, "epoch": 239} {"train_loss": -7.9731831550598145, "global_step": 40286, "epoch": 239} {"train_loss": -7.608312129974365, "global_step": 40287, "epoch": 239} {"train_loss": -7.794661521911621, "global_step": 40288, "epoch": 239} {"train_loss": -7.998812675476074, "global_step": 40289, "epoch": 239} {"train_loss": -7.5909953117370605, "global_step": 40290, "epoch": 239} {"train_loss": -7.753121376037598, "global_step": 40291, "epoch": 239} {"train_loss": -7.688884735107422, "global_step": 40292, "epoch": 239} {"train_loss": -7.868366241455078, "global_step": 40293, "epoch": 239} {"train_loss": -7.687228202819824, "global_step": 40294, "epoch": 239} {"train_loss": -8.167919158935547, "global_step": 40295, "epoch": 239} {"train_loss": -7.59660530090332, "global_step": 40296, "epoch": 239} {"train_loss": -7.754044532775879, "global_step": 40297, "epoch": 239} {"train_loss": -7.767056941986084, "global_step": 40298, "epoch": 239} {"train_loss": -8.088712692260742, "global_step": 40299, "epoch": 239} {"train_loss": -7.8227386474609375, "global_step": 40300, "epoch": 239} {"train_loss": -7.9559431076049805, "global_step": 40301, "epoch": 239} {"train_loss": -7.807106971740723, "global_step": 40302, "epoch": 239} {"train_loss": -7.928398609161377, "global_step": 40303, "epoch": 239} {"train_loss": -7.977904319763184, "global_step": 40304, "epoch": 239} {"train_loss": -7.652217388153076, "global_step": 40305, "epoch": 239} {"train_loss": -8.255016326904297, "global_step": 40306, "epoch": 239} {"train_loss": -7.941687107086182, "global_step": 40307, "epoch": 239} {"train_loss": -7.6006083488464355, "global_step": 40308, "epoch": 239} {"train_loss": -7.82858943939209, "global_step": 40309, "epoch": 239} {"train_loss": -7.865285873413086, "global_step": 40310, "epoch": 239} {"train_loss": -8.00335693359375, "global_step": 40311, "epoch": 239} {"train_loss": -7.961727142333984, "global_step": 40312, "epoch": 239} {"train_loss": -7.767009735107422, "global_step": 40313, "epoch": 239} {"train_loss": -8.102989196777344, "global_step": 40314, "epoch": 239} {"train_loss": -7.997833251953125, "global_step": 40315, "epoch": 239} {"train_loss": -7.77694034576416, "global_step": 40316, "epoch": 239} {"train_loss": -8.003765106201172, "global_step": 40317, "epoch": 239} {"train_loss": -8.03414535522461, "global_step": 40318, "epoch": 239} {"train_loss": -7.905132231258211, "global_step": 40319, "epoch": 239, "val_loss": 188731.546875} {"train_loss": -7.781290054321289, "global_step": 40320, "epoch": 240} {"train_loss": -7.780482292175293, "global_step": 40321, "epoch": 240} {"train_loss": -7.679665565490723, "global_step": 40322, "epoch": 240} {"train_loss": -7.738595008850098, "global_step": 40323, "epoch": 240} {"train_loss": -7.867281913757324, "global_step": 40324, "epoch": 240} {"train_loss": -7.645960807800293, "global_step": 40325, "epoch": 240} {"train_loss": -7.904080867767334, "global_step": 40326, "epoch": 240} {"train_loss": -7.670772075653076, "global_step": 40327, "epoch": 240} {"train_loss": -7.768660068511963, "global_step": 40328, "epoch": 240} {"train_loss": -7.8419880867004395, "global_step": 40329, "epoch": 240} {"train_loss": -7.578505516052246, "global_step": 40330, "epoch": 240} {"train_loss": -8.071529388427734, "global_step": 40331, "epoch": 240} {"train_loss": -7.81915283203125, "global_step": 40332, "epoch": 240} {"train_loss": -7.845491886138916, "global_step": 40333, "epoch": 240} {"train_loss": -7.96165657043457, "global_step": 40334, "epoch": 240} {"train_loss": -7.826423645019531, "global_step": 40335, "epoch": 240} {"train_loss": -7.921228885650635, "global_step": 40336, "epoch": 240} {"train_loss": -7.802870273590088, "global_step": 40337, "epoch": 240} {"train_loss": -7.920322418212891, "global_step": 40338, "epoch": 240} {"train_loss": -7.9123101234436035, "global_step": 40339, "epoch": 240} {"train_loss": -7.959564685821533, "global_step": 40340, "epoch": 240} {"train_loss": -8.004980087280273, "global_step": 40341, "epoch": 240} {"train_loss": -7.775659561157227, "global_step": 40342, "epoch": 240} {"train_loss": -8.065709114074707, "global_step": 40343, "epoch": 240} {"train_loss": -7.917586326599121, "global_step": 40344, "epoch": 240} {"train_loss": -8.046172142028809, "global_step": 40345, "epoch": 240} {"train_loss": -7.772367000579834, "global_step": 40346, "epoch": 240} {"train_loss": -7.9983367919921875, "global_step": 40347, "epoch": 240} {"train_loss": -7.792026042938232, "global_step": 40348, "epoch": 240} {"train_loss": -7.946972370147705, "global_step": 40349, "epoch": 240} {"train_loss": -7.9783525466918945, "global_step": 40350, "epoch": 240} {"train_loss": -8.054194450378418, "global_step": 40351, "epoch": 240} {"train_loss": -7.752625465393066, "global_step": 40352, "epoch": 240} {"train_loss": -7.939655303955078, "global_step": 40353, "epoch": 240} {"train_loss": -8.168888092041016, "global_step": 40354, "epoch": 240} {"train_loss": -7.642010688781738, "global_step": 40355, "epoch": 240} {"train_loss": -7.90431022644043, "global_step": 40356, "epoch": 240} {"train_loss": -8.052129745483398, "global_step": 40357, "epoch": 240} {"train_loss": -8.048099517822266, "global_step": 40358, "epoch": 240} {"train_loss": -7.784394264221191, "global_step": 40359, "epoch": 240} {"train_loss": -8.257879257202148, "global_step": 40360, "epoch": 240} {"train_loss": -8.120059967041016, "global_step": 40361, "epoch": 240} {"train_loss": -8.084613800048828, "global_step": 40362, "epoch": 240} {"train_loss": -7.998828887939453, "global_step": 40363, "epoch": 240} {"train_loss": -8.115777969360352, "global_step": 40364, "epoch": 240} {"train_loss": -7.903883934020996, "global_step": 40365, "epoch": 240} {"train_loss": -7.9599127769470215, "global_step": 40366, "epoch": 240} {"train_loss": -8.156381607055664, "global_step": 40367, "epoch": 240} {"train_loss": -8.025285720825195, "global_step": 40368, "epoch": 240} {"train_loss": -8.03277587890625, "global_step": 40369, "epoch": 240} {"train_loss": -7.806882381439209, "global_step": 40370, "epoch": 240} {"train_loss": -8.003318786621094, "global_step": 40371, "epoch": 240} {"train_loss": -7.942726135253906, "global_step": 40372, "epoch": 240} {"train_loss": -7.914918899536133, "global_step": 40373, "epoch": 240} {"train_loss": -8.041425704956055, "global_step": 40374, "epoch": 240} {"train_loss": -8.06978988647461, "global_step": 40375, "epoch": 240} {"train_loss": -8.224884033203125, "global_step": 40376, "epoch": 240} {"train_loss": -8.07539176940918, "global_step": 40377, "epoch": 240} {"train_loss": -7.80714225769043, "global_step": 40378, "epoch": 240} {"train_loss": -8.077535629272461, "global_step": 40379, "epoch": 240} {"train_loss": -7.824554920196533, "global_step": 40380, "epoch": 240} {"train_loss": -7.876320838928223, "global_step": 40381, "epoch": 240} {"train_loss": -7.8520917892456055, "global_step": 40382, "epoch": 240} {"train_loss": -7.957942485809326, "global_step": 40383, "epoch": 240} {"train_loss": -8.19851303100586, "global_step": 40384, "epoch": 240} {"train_loss": -8.072028160095215, "global_step": 40385, "epoch": 240} {"train_loss": -8.029300689697266, "global_step": 40386, "epoch": 240} {"train_loss": -8.019418716430664, "global_step": 40387, "epoch": 240} {"train_loss": -7.968759059906006, "global_step": 40388, "epoch": 240} {"train_loss": -8.008913040161133, "global_step": 40389, "epoch": 240} {"train_loss": -7.863372802734375, "global_step": 40390, "epoch": 240} {"train_loss": -7.709939002990723, "global_step": 40391, "epoch": 240} {"train_loss": -7.9523420333862305, "global_step": 40392, "epoch": 240} {"train_loss": -8.093517303466797, "global_step": 40393, "epoch": 240} {"train_loss": -7.821094989776611, "global_step": 40394, "epoch": 240} {"train_loss": -7.681937217712402, "global_step": 40395, "epoch": 240} {"train_loss": -8.004066467285156, "global_step": 40396, "epoch": 240} {"train_loss": -7.843513488769531, "global_step": 40397, "epoch": 240} {"train_loss": -7.624955177307129, "global_step": 40398, "epoch": 240} {"train_loss": -7.924688339233398, "global_step": 40399, "epoch": 240} {"train_loss": -7.881239891052246, "global_step": 40400, "epoch": 240} {"train_loss": -7.943507671356201, "global_step": 40401, "epoch": 240} {"train_loss": -7.850917339324951, "global_step": 40402, "epoch": 240} {"train_loss": -7.8412933349609375, "global_step": 40403, "epoch": 240} {"train_loss": -7.922316074371338, "global_step": 40404, "epoch": 240} {"train_loss": -7.976918697357178, "global_step": 40405, "epoch": 240} {"train_loss": -7.844162940979004, "global_step": 40406, "epoch": 240} {"train_loss": -8.007177352905273, "global_step": 40407, "epoch": 240} {"train_loss": -8.043057441711426, "global_step": 40408, "epoch": 240} {"train_loss": -8.10251235961914, "global_step": 40409, "epoch": 240} {"train_loss": -7.753955841064453, "global_step": 40410, "epoch": 240} {"train_loss": -7.879016876220703, "global_step": 40411, "epoch": 240} {"train_loss": -7.937915802001953, "global_step": 40412, "epoch": 240} {"train_loss": -7.9647650718688965, "global_step": 40413, "epoch": 240} {"train_loss": -7.918268203735352, "global_step": 40414, "epoch": 240} {"train_loss": -8.053610801696777, "global_step": 40415, "epoch": 240} {"train_loss": -7.906450271606445, "global_step": 40416, "epoch": 240} {"train_loss": -7.970704555511475, "global_step": 40417, "epoch": 240} {"train_loss": -7.929503440856934, "global_step": 40418, "epoch": 240} {"train_loss": -8.128271102905273, "global_step": 40419, "epoch": 240} {"train_loss": -8.03579330444336, "global_step": 40420, "epoch": 240} {"train_loss": -7.819194793701172, "global_step": 40421, "epoch": 240} {"train_loss": -7.916934967041016, "global_step": 40422, "epoch": 240} {"train_loss": -7.663825511932373, "global_step": 40423, "epoch": 240} {"train_loss": -7.83154296875, "global_step": 40424, "epoch": 240} {"train_loss": -7.9098944664001465, "global_step": 40425, "epoch": 240} {"train_loss": -7.910984992980957, "global_step": 40426, "epoch": 240} {"train_loss": -7.871946334838867, "global_step": 40427, "epoch": 240} {"train_loss": -8.062323570251465, "global_step": 40428, "epoch": 240} {"train_loss": -7.754701137542725, "global_step": 40429, "epoch": 240} {"train_loss": -7.807106018066406, "global_step": 40430, "epoch": 240} {"train_loss": -7.791457653045654, "global_step": 40431, "epoch": 240} {"train_loss": -7.798587799072266, "global_step": 40432, "epoch": 240} {"train_loss": -7.960108757019043, "global_step": 40433, "epoch": 240} {"train_loss": -7.816949844360352, "global_step": 40434, "epoch": 240} {"train_loss": -7.861135959625244, "global_step": 40435, "epoch": 240} {"train_loss": -7.8965559005737305, "global_step": 40436, "epoch": 240} {"train_loss": -7.925837516784668, "global_step": 40437, "epoch": 240} {"train_loss": -7.650157928466797, "global_step": 40438, "epoch": 240} {"train_loss": -7.965440273284912, "global_step": 40439, "epoch": 240} {"train_loss": -7.632696151733398, "global_step": 40440, "epoch": 240} {"train_loss": -7.865542411804199, "global_step": 40441, "epoch": 240} {"train_loss": -7.985551357269287, "global_step": 40442, "epoch": 240} {"train_loss": -7.998369216918945, "global_step": 40443, "epoch": 240} {"train_loss": -7.754509925842285, "global_step": 40444, "epoch": 240} {"train_loss": -8.043262481689453, "global_step": 40445, "epoch": 240} {"train_loss": -8.049105644226074, "global_step": 40446, "epoch": 240} {"train_loss": -7.861473560333252, "global_step": 40447, "epoch": 240} {"train_loss": -8.001297950744629, "global_step": 40448, "epoch": 240} {"train_loss": -7.899987697601318, "global_step": 40449, "epoch": 240} {"train_loss": -7.619365692138672, "global_step": 40450, "epoch": 240} {"train_loss": -7.636050224304199, "global_step": 40451, "epoch": 240} {"train_loss": -8.08166217803955, "global_step": 40452, "epoch": 240} {"train_loss": -7.771061897277832, "global_step": 40453, "epoch": 240} {"train_loss": -7.631617546081543, "global_step": 40454, "epoch": 240} {"train_loss": -7.71624755859375, "global_step": 40455, "epoch": 240} {"train_loss": -7.853235244750977, "global_step": 40456, "epoch": 240} {"train_loss": -7.823687553405762, "global_step": 40457, "epoch": 240} {"train_loss": -8.06750202178955, "global_step": 40458, "epoch": 240} {"train_loss": -7.761652946472168, "global_step": 40459, "epoch": 240} {"train_loss": -7.949193954467773, "global_step": 40460, "epoch": 240} {"train_loss": -7.65943717956543, "global_step": 40461, "epoch": 240} {"train_loss": -7.7973833084106445, "global_step": 40462, "epoch": 240} {"train_loss": -7.820423126220703, "global_step": 40463, "epoch": 240} {"train_loss": -7.957604885101318, "global_step": 40464, "epoch": 240} {"train_loss": -7.849602222442627, "global_step": 40465, "epoch": 240} {"train_loss": -7.83012580871582, "global_step": 40466, "epoch": 240} {"train_loss": -7.579451560974121, "global_step": 40467, "epoch": 240} {"train_loss": -7.666938781738281, "global_step": 40468, "epoch": 240} {"train_loss": -7.939669609069824, "global_step": 40469, "epoch": 240} {"train_loss": -7.721292972564697, "global_step": 40470, "epoch": 240} {"train_loss": -8.011100769042969, "global_step": 40471, "epoch": 240} {"train_loss": -7.671767711639404, "global_step": 40472, "epoch": 240} {"train_loss": -7.974292278289795, "global_step": 40473, "epoch": 240} {"train_loss": -7.718291759490967, "global_step": 40474, "epoch": 240} {"train_loss": -7.965472221374512, "global_step": 40475, "epoch": 240} {"train_loss": -7.583104133605957, "global_step": 40476, "epoch": 240} {"train_loss": -7.906766891479492, "global_step": 40477, "epoch": 240} {"train_loss": -7.839458465576172, "global_step": 40478, "epoch": 240} {"train_loss": -8.022157669067383, "global_step": 40479, "epoch": 240} {"train_loss": -7.718679904937744, "global_step": 40480, "epoch": 240} {"train_loss": -7.904864311218262, "global_step": 40481, "epoch": 240} {"train_loss": -7.767005920410156, "global_step": 40482, "epoch": 240} {"train_loss": -7.809023857116699, "global_step": 40483, "epoch": 240} {"train_loss": -7.8989577293396, "global_step": 40484, "epoch": 240} {"train_loss": -7.578478813171387, "global_step": 40485, "epoch": 240} {"train_loss": -7.910754203796387, "global_step": 40486, "epoch": 240} {"train_loss": -7.893025290398371, "global_step": 40487, "epoch": 240, "val_loss": 189373.703125, "train_action_mse_error": 11.159969329833984} {"train_loss": -7.644116401672363, "global_step": 40488, "epoch": 241} {"train_loss": -8.00125789642334, "global_step": 40489, "epoch": 241} {"train_loss": -8.129897117614746, "global_step": 40490, "epoch": 241} {"train_loss": -7.724143981933594, "global_step": 40491, "epoch": 241} {"train_loss": -7.793337345123291, "global_step": 40492, "epoch": 241} {"train_loss": -8.092323303222656, "global_step": 40493, "epoch": 241} {"train_loss": -7.843240737915039, "global_step": 40494, "epoch": 241} {"train_loss": -7.912764549255371, "global_step": 40495, "epoch": 241} {"train_loss": -8.03457260131836, "global_step": 40496, "epoch": 241} {"train_loss": -7.893760681152344, "global_step": 40497, "epoch": 241} {"train_loss": -8.023541450500488, "global_step": 40498, "epoch": 241} {"train_loss": -7.953673362731934, "global_step": 40499, "epoch": 241} {"train_loss": -7.996337890625, "global_step": 40500, "epoch": 241} {"train_loss": -8.1641206741333, "global_step": 40501, "epoch": 241} {"train_loss": -7.89933967590332, "global_step": 40502, "epoch": 241} {"train_loss": -8.00659465789795, "global_step": 40503, "epoch": 241} {"train_loss": -8.042506217956543, "global_step": 40504, "epoch": 241} {"train_loss": -8.080536842346191, "global_step": 40505, "epoch": 241} {"train_loss": -7.975224018096924, "global_step": 40506, "epoch": 241} {"train_loss": -7.975910186767578, "global_step": 40507, "epoch": 241} {"train_loss": -8.151585578918457, "global_step": 40508, "epoch": 241} {"train_loss": -7.753520965576172, "global_step": 40509, "epoch": 241} {"train_loss": -7.850875377655029, "global_step": 40510, "epoch": 241} {"train_loss": -7.812421798706055, "global_step": 40511, "epoch": 241} {"train_loss": -7.899768352508545, "global_step": 40512, "epoch": 241} {"train_loss": -7.919756889343262, "global_step": 40513, "epoch": 241} {"train_loss": -7.929547309875488, "global_step": 40514, "epoch": 241} {"train_loss": -8.062148094177246, "global_step": 40515, "epoch": 241} {"train_loss": -7.7044219970703125, "global_step": 40516, "epoch": 241} {"train_loss": -7.871294975280762, "global_step": 40517, "epoch": 241} {"train_loss": -7.816223621368408, "global_step": 40518, "epoch": 241} {"train_loss": -7.792869567871094, "global_step": 40519, "epoch": 241} {"train_loss": -7.983151912689209, "global_step": 40520, "epoch": 241} {"train_loss": -7.6595611572265625, "global_step": 40521, "epoch": 241} {"train_loss": -7.673343658447266, "global_step": 40522, "epoch": 241} {"train_loss": -7.939266204833984, "global_step": 40523, "epoch": 241} {"train_loss": -7.760820388793945, "global_step": 40524, "epoch": 241} {"train_loss": -7.729341506958008, "global_step": 40525, "epoch": 241} {"train_loss": -7.556283950805664, "global_step": 40526, "epoch": 241} {"train_loss": -7.7275261878967285, "global_step": 40527, "epoch": 241} {"train_loss": -7.737672805786133, "global_step": 40528, "epoch": 241} {"train_loss": -7.704557418823242, "global_step": 40529, "epoch": 241} {"train_loss": -7.452620506286621, "global_step": 40530, "epoch": 241} {"train_loss": -7.783909320831299, "global_step": 40531, "epoch": 241} {"train_loss": -7.629303932189941, "global_step": 40532, "epoch": 241} {"train_loss": -7.602757930755615, "global_step": 40533, "epoch": 241} {"train_loss": -7.832091331481934, "global_step": 40534, "epoch": 241} {"train_loss": -7.635499000549316, "global_step": 40535, "epoch": 241} {"train_loss": -7.760364532470703, "global_step": 40536, "epoch": 241} {"train_loss": -7.880735874176025, "global_step": 40537, "epoch": 241} {"train_loss": -7.753719329833984, "global_step": 40538, "epoch": 241} {"train_loss": -7.981606483459473, "global_step": 40539, "epoch": 241} {"train_loss": -7.972689628601074, "global_step": 40540, "epoch": 241} {"train_loss": -8.077388763427734, "global_step": 40541, "epoch": 241} {"train_loss": -7.84072208404541, "global_step": 40542, "epoch": 241} {"train_loss": -7.763411045074463, "global_step": 40543, "epoch": 241} {"train_loss": -7.703700542449951, "global_step": 40544, "epoch": 241} {"train_loss": -7.931233882904053, "global_step": 40545, "epoch": 241} {"train_loss": -7.922384262084961, "global_step": 40546, "epoch": 241} {"train_loss": -8.005145072937012, "global_step": 40547, "epoch": 241} {"train_loss": -8.14714241027832, "global_step": 40548, "epoch": 241} {"train_loss": -8.085992813110352, "global_step": 40549, "epoch": 241} {"train_loss": -8.004708290100098, "global_step": 40550, "epoch": 241} {"train_loss": -8.126574516296387, "global_step": 40551, "epoch": 241} {"train_loss": -8.007795333862305, "global_step": 40552, "epoch": 241} {"train_loss": -8.00650405883789, "global_step": 40553, "epoch": 241} {"train_loss": -7.9150567054748535, "global_step": 40554, "epoch": 241} {"train_loss": -8.050033569335938, "global_step": 40555, "epoch": 241} {"train_loss": -8.139286041259766, "global_step": 40556, "epoch": 241} {"train_loss": -7.997785568237305, "global_step": 40557, "epoch": 241} {"train_loss": -7.936967372894287, "global_step": 40558, "epoch": 241} {"train_loss": -7.860389709472656, "global_step": 40559, "epoch": 241} {"train_loss": -8.37124252319336, "global_step": 40560, "epoch": 241} {"train_loss": -7.948859214782715, "global_step": 40561, "epoch": 241} {"train_loss": -8.13549518585205, "global_step": 40562, "epoch": 241} {"train_loss": -7.89419412612915, "global_step": 40563, "epoch": 241} {"train_loss": -8.034273147583008, "global_step": 40564, "epoch": 241} {"train_loss": -7.738238334655762, "global_step": 40565, "epoch": 241} {"train_loss": -8.077861785888672, "global_step": 40566, "epoch": 241} {"train_loss": -7.8445024490356445, "global_step": 40567, "epoch": 241} {"train_loss": -8.17585563659668, "global_step": 40568, "epoch": 241} {"train_loss": -7.885509014129639, "global_step": 40569, "epoch": 241} {"train_loss": -7.738007545471191, "global_step": 40570, "epoch": 241} {"train_loss": -7.918267250061035, "global_step": 40571, "epoch": 241} {"train_loss": -7.925841331481934, "global_step": 40572, "epoch": 241} {"train_loss": -8.089203834533691, "global_step": 40573, "epoch": 241} {"train_loss": -8.065067291259766, "global_step": 40574, "epoch": 241} {"train_loss": -7.73902702331543, "global_step": 40575, "epoch": 241} {"train_loss": -7.871903419494629, "global_step": 40576, "epoch": 241} {"train_loss": -7.996481895446777, "global_step": 40577, "epoch": 241} {"train_loss": -7.972832679748535, "global_step": 40578, "epoch": 241} {"train_loss": -7.92993688583374, "global_step": 40579, "epoch": 241} {"train_loss": -7.8033342361450195, "global_step": 40580, "epoch": 241} {"train_loss": -7.890748977661133, "global_step": 40581, "epoch": 241} {"train_loss": -8.063657760620117, "global_step": 40582, "epoch": 241} {"train_loss": -7.90399169921875, "global_step": 40583, "epoch": 241} {"train_loss": -7.9676337242126465, "global_step": 40584, "epoch": 241} {"train_loss": -7.923283576965332, "global_step": 40585, "epoch": 241} {"train_loss": -7.9363250732421875, "global_step": 40586, "epoch": 241} {"train_loss": -7.734402179718018, "global_step": 40587, "epoch": 241} {"train_loss": -8.03791618347168, "global_step": 40588, "epoch": 241} {"train_loss": -7.961371898651123, "global_step": 40589, "epoch": 241} {"train_loss": -7.864852428436279, "global_step": 40590, "epoch": 241} {"train_loss": -7.991907596588135, "global_step": 40591, "epoch": 241} {"train_loss": -8.056022644042969, "global_step": 40592, "epoch": 241} {"train_loss": -7.85638427734375, "global_step": 40593, "epoch": 241} {"train_loss": -7.876733779907227, "global_step": 40594, "epoch": 241} {"train_loss": -7.846360683441162, "global_step": 40595, "epoch": 241} {"train_loss": -8.029458999633789, "global_step": 40596, "epoch": 241} {"train_loss": -7.779297828674316, "global_step": 40597, "epoch": 241} {"train_loss": -7.904377460479736, "global_step": 40598, "epoch": 241} {"train_loss": -8.14434814453125, "global_step": 40599, "epoch": 241} {"train_loss": -7.93376350402832, "global_step": 40600, "epoch": 241} {"train_loss": -8.237360000610352, "global_step": 40601, "epoch": 241} {"train_loss": -8.006990432739258, "global_step": 40602, "epoch": 241} {"train_loss": -8.046101570129395, "global_step": 40603, "epoch": 241} {"train_loss": -8.068486213684082, "global_step": 40604, "epoch": 241} {"train_loss": -8.109405517578125, "global_step": 40605, "epoch": 241} {"train_loss": -8.17945671081543, "global_step": 40606, "epoch": 241} {"train_loss": -7.673638820648193, "global_step": 40607, "epoch": 241} {"train_loss": -8.107389450073242, "global_step": 40608, "epoch": 241} {"train_loss": -8.146924018859863, "global_step": 40609, "epoch": 241} {"train_loss": -7.9418158531188965, "global_step": 40610, "epoch": 241} {"train_loss": -7.725326061248779, "global_step": 40611, "epoch": 241} {"train_loss": -8.13711166381836, "global_step": 40612, "epoch": 241} {"train_loss": -7.9247918128967285, "global_step": 40613, "epoch": 241} {"train_loss": -8.081626892089844, "global_step": 40614, "epoch": 241} {"train_loss": -8.040067672729492, "global_step": 40615, "epoch": 241} {"train_loss": -7.966464519500732, "global_step": 40616, "epoch": 241} {"train_loss": -7.893311977386475, "global_step": 40617, "epoch": 241} {"train_loss": -7.9448089599609375, "global_step": 40618, "epoch": 241} {"train_loss": -7.914351463317871, "global_step": 40619, "epoch": 241} {"train_loss": -7.781818389892578, "global_step": 40620, "epoch": 241} {"train_loss": -7.657034873962402, "global_step": 40621, "epoch": 241} {"train_loss": -7.719320774078369, "global_step": 40622, "epoch": 241} {"train_loss": -7.718905448913574, "global_step": 40623, "epoch": 241} {"train_loss": -7.7968950271606445, "global_step": 40624, "epoch": 241} {"train_loss": -7.641573429107666, "global_step": 40625, "epoch": 241} {"train_loss": -7.832706451416016, "global_step": 40626, "epoch": 241} {"train_loss": -8.035202026367188, "global_step": 40627, "epoch": 241} {"train_loss": -7.710460662841797, "global_step": 40628, "epoch": 241} {"train_loss": -7.924041748046875, "global_step": 40629, "epoch": 241} {"train_loss": -7.9166789054870605, "global_step": 40630, "epoch": 241} {"train_loss": -7.971854209899902, "global_step": 40631, "epoch": 241} {"train_loss": -7.864678382873535, "global_step": 40632, "epoch": 241} {"train_loss": -8.058984756469727, "global_step": 40633, "epoch": 241} {"train_loss": -7.9397077560424805, "global_step": 40634, "epoch": 241} {"train_loss": -8.214393615722656, "global_step": 40635, "epoch": 241} {"train_loss": -7.957950592041016, "global_step": 40636, "epoch": 241} {"train_loss": -8.119473457336426, "global_step": 40637, "epoch": 241} {"train_loss": -7.638068199157715, "global_step": 40638, "epoch": 241} {"train_loss": -8.075724601745605, "global_step": 40639, "epoch": 241} {"train_loss": -8.1015625, "global_step": 40640, "epoch": 241} {"train_loss": -7.7295331954956055, "global_step": 40641, "epoch": 241} {"train_loss": -7.92022705078125, "global_step": 40642, "epoch": 241} {"train_loss": -8.054641723632812, "global_step": 40643, "epoch": 241} {"train_loss": -7.767012596130371, "global_step": 40644, "epoch": 241} {"train_loss": -7.835719108581543, "global_step": 40645, "epoch": 241} {"train_loss": -7.797390937805176, "global_step": 40646, "epoch": 241} {"train_loss": -8.033905982971191, "global_step": 40647, "epoch": 241} {"train_loss": -8.059240341186523, "global_step": 40648, "epoch": 241} {"train_loss": -7.749353885650635, "global_step": 40649, "epoch": 241} {"train_loss": -8.02245044708252, "global_step": 40650, "epoch": 241} {"train_loss": -8.02006721496582, "global_step": 40651, "epoch": 241} {"train_loss": -8.186507225036621, "global_step": 40652, "epoch": 241} {"train_loss": -8.094202995300293, "global_step": 40653, "epoch": 241} {"train_loss": -7.968794822692871, "global_step": 40654, "epoch": 241} {"train_loss": -7.920864721139272, "global_step": 40655, "epoch": 241, "val_loss": 183401.328125} {"train_loss": -8.022944450378418, "global_step": 40656, "epoch": 242} {"train_loss": -7.99960994720459, "global_step": 40657, "epoch": 242} {"train_loss": -8.087982177734375, "global_step": 40658, "epoch": 242} {"train_loss": -7.914507865905762, "global_step": 40659, "epoch": 242} {"train_loss": -8.121515274047852, "global_step": 40660, "epoch": 242} {"train_loss": -8.130755424499512, "global_step": 40661, "epoch": 242} {"train_loss": -7.923222064971924, "global_step": 40662, "epoch": 242} {"train_loss": -7.84787654876709, "global_step": 40663, "epoch": 242} {"train_loss": -8.140066146850586, "global_step": 40664, "epoch": 242} {"train_loss": -7.64880895614624, "global_step": 40665, "epoch": 242} {"train_loss": -7.706177711486816, "global_step": 40666, "epoch": 242} {"train_loss": -7.9463677406311035, "global_step": 40667, "epoch": 242} {"train_loss": -7.90770149230957, "global_step": 40668, "epoch": 242} {"train_loss": -7.8375749588012695, "global_step": 40669, "epoch": 242} {"train_loss": -7.804455757141113, "global_step": 40670, "epoch": 242} {"train_loss": -7.971592426300049, "global_step": 40671, "epoch": 242} {"train_loss": -7.81723165512085, "global_step": 40672, "epoch": 242} {"train_loss": -8.242198944091797, "global_step": 40673, "epoch": 242} {"train_loss": -8.110326766967773, "global_step": 40674, "epoch": 242} {"train_loss": -7.974549293518066, "global_step": 40675, "epoch": 242} {"train_loss": -7.939950942993164, "global_step": 40676, "epoch": 242} {"train_loss": -7.555035591125488, "global_step": 40677, "epoch": 242} {"train_loss": -7.63128662109375, "global_step": 40678, "epoch": 242} {"train_loss": -7.857564926147461, "global_step": 40679, "epoch": 242} {"train_loss": -7.880439758300781, "global_step": 40680, "epoch": 242} {"train_loss": -7.756309986114502, "global_step": 40681, "epoch": 242} {"train_loss": -7.8930253982543945, "global_step": 40682, "epoch": 242} {"train_loss": -7.705357551574707, "global_step": 40683, "epoch": 242} {"train_loss": -8.062621116638184, "global_step": 40684, "epoch": 242} {"train_loss": -7.891315460205078, "global_step": 40685, "epoch": 242} {"train_loss": -7.870327949523926, "global_step": 40686, "epoch": 242} {"train_loss": -7.99003267288208, "global_step": 40687, "epoch": 242} {"train_loss": -7.730867385864258, "global_step": 40688, "epoch": 242} {"train_loss": -7.785968780517578, "global_step": 40689, "epoch": 242} {"train_loss": -7.791090488433838, "global_step": 40690, "epoch": 242} {"train_loss": -8.18240737915039, "global_step": 40691, "epoch": 242} {"train_loss": -7.636423110961914, "global_step": 40692, "epoch": 242} {"train_loss": -8.043522834777832, "global_step": 40693, "epoch": 242} {"train_loss": -7.77099084854126, "global_step": 40694, "epoch": 242} {"train_loss": -8.034235000610352, "global_step": 40695, "epoch": 242} {"train_loss": -7.952786445617676, "global_step": 40696, "epoch": 242} {"train_loss": -7.858982563018799, "global_step": 40697, "epoch": 242} {"train_loss": -8.004899978637695, "global_step": 40698, "epoch": 242} {"train_loss": -7.723818778991699, "global_step": 40699, "epoch": 242} {"train_loss": -8.090581893920898, "global_step": 40700, "epoch": 242} {"train_loss": -7.492420196533203, "global_step": 40701, "epoch": 242} {"train_loss": -8.094239234924316, "global_step": 40702, "epoch": 242} {"train_loss": -7.8633222579956055, "global_step": 40703, "epoch": 242} {"train_loss": -7.86534309387207, "global_step": 40704, "epoch": 242} {"train_loss": -8.03498649597168, "global_step": 40705, "epoch": 242} {"train_loss": -8.164510726928711, "global_step": 40706, "epoch": 242} {"train_loss": -8.024711608886719, "global_step": 40707, "epoch": 242} {"train_loss": -7.93670129776001, "global_step": 40708, "epoch": 242} {"train_loss": -8.067387580871582, "global_step": 40709, "epoch": 242} {"train_loss": -7.949059963226318, "global_step": 40710, "epoch": 242} {"train_loss": -7.875957489013672, "global_step": 40711, "epoch": 242} {"train_loss": -8.122931480407715, "global_step": 40712, "epoch": 242} {"train_loss": -7.94374418258667, "global_step": 40713, "epoch": 242} {"train_loss": -8.207000732421875, "global_step": 40714, "epoch": 242} {"train_loss": -8.006047248840332, "global_step": 40715, "epoch": 242} {"train_loss": -8.150457382202148, "global_step": 40716, "epoch": 242} {"train_loss": -8.085108757019043, "global_step": 40717, "epoch": 242} {"train_loss": -8.008455276489258, "global_step": 40718, "epoch": 242} {"train_loss": -7.913887977600098, "global_step": 40719, "epoch": 242} {"train_loss": -8.068262100219727, "global_step": 40720, "epoch": 242} {"train_loss": -8.129983901977539, "global_step": 40721, "epoch": 242} {"train_loss": -8.210662841796875, "global_step": 40722, "epoch": 242} {"train_loss": -7.882833480834961, "global_step": 40723, "epoch": 242} {"train_loss": -8.12035083770752, "global_step": 40724, "epoch": 242} {"train_loss": -8.21589183807373, "global_step": 40725, "epoch": 242} {"train_loss": -8.038357734680176, "global_step": 40726, "epoch": 242} {"train_loss": -8.016075134277344, "global_step": 40727, "epoch": 242} {"train_loss": -7.92353630065918, "global_step": 40728, "epoch": 242} {"train_loss": -8.341038703918457, "global_step": 40729, "epoch": 242} {"train_loss": -8.096939086914062, "global_step": 40730, "epoch": 242} {"train_loss": -7.955758094787598, "global_step": 40731, "epoch": 242} {"train_loss": -8.210762023925781, "global_step": 40732, "epoch": 242} {"train_loss": -7.966073513031006, "global_step": 40733, "epoch": 242} {"train_loss": -8.133265495300293, "global_step": 40734, "epoch": 242} {"train_loss": -7.821633338928223, "global_step": 40735, "epoch": 242} {"train_loss": -7.752835273742676, "global_step": 40736, "epoch": 242} {"train_loss": -7.9072065353393555, "global_step": 40737, "epoch": 242} {"train_loss": -8.118881225585938, "global_step": 40738, "epoch": 242} {"train_loss": -7.97150993347168, "global_step": 40739, "epoch": 242} {"train_loss": -7.8262224197387695, "global_step": 40740, "epoch": 242} {"train_loss": -8.229546546936035, "global_step": 40741, "epoch": 242} {"train_loss": -7.843366622924805, "global_step": 40742, "epoch": 242} {"train_loss": -8.04024600982666, "global_step": 40743, "epoch": 242} {"train_loss": -7.797787666320801, "global_step": 40744, "epoch": 242} {"train_loss": -8.048826217651367, "global_step": 40745, "epoch": 242} {"train_loss": -7.910667896270752, "global_step": 40746, "epoch": 242} {"train_loss": -7.8762969970703125, "global_step": 40747, "epoch": 242} {"train_loss": -7.900030136108398, "global_step": 40748, "epoch": 242} {"train_loss": -7.746338844299316, "global_step": 40749, "epoch": 242} {"train_loss": -7.98752498626709, "global_step": 40750, "epoch": 242} {"train_loss": -7.605730056762695, "global_step": 40751, "epoch": 242} {"train_loss": -7.942959308624268, "global_step": 40752, "epoch": 242} {"train_loss": -7.581204414367676, "global_step": 40753, "epoch": 242} {"train_loss": -7.760957717895508, "global_step": 40754, "epoch": 242} {"train_loss": -7.972170829772949, "global_step": 40755, "epoch": 242} {"train_loss": -7.830936431884766, "global_step": 40756, "epoch": 242} {"train_loss": -7.948437690734863, "global_step": 40757, "epoch": 242} {"train_loss": -8.094620704650879, "global_step": 40758, "epoch": 242} {"train_loss": -8.190940856933594, "global_step": 40759, "epoch": 242} {"train_loss": -8.095314025878906, "global_step": 40760, "epoch": 242} {"train_loss": -7.984978675842285, "global_step": 40761, "epoch": 242} {"train_loss": -8.006352424621582, "global_step": 40762, "epoch": 242} {"train_loss": -8.06690788269043, "global_step": 40763, "epoch": 242} {"train_loss": -8.108758926391602, "global_step": 40764, "epoch": 242} {"train_loss": -7.9957170486450195, "global_step": 40765, "epoch": 242} {"train_loss": -7.9877214431762695, "global_step": 40766, "epoch": 242} {"train_loss": -8.244222640991211, "global_step": 40767, "epoch": 242} {"train_loss": -8.165367126464844, "global_step": 40768, "epoch": 242} {"train_loss": -8.014934539794922, "global_step": 40769, "epoch": 242} {"train_loss": -8.130684852600098, "global_step": 40770, "epoch": 242} {"train_loss": -8.147392272949219, "global_step": 40771, "epoch": 242} {"train_loss": -7.617507457733154, "global_step": 40772, "epoch": 242} {"train_loss": -7.789022922515869, "global_step": 40773, "epoch": 242} {"train_loss": -7.984626293182373, "global_step": 40774, "epoch": 242} {"train_loss": -7.9840922355651855, "global_step": 40775, "epoch": 242} {"train_loss": -7.943798065185547, "global_step": 40776, "epoch": 242} {"train_loss": -7.923092842102051, "global_step": 40777, "epoch": 242} {"train_loss": -7.79801082611084, "global_step": 40778, "epoch": 242} {"train_loss": -8.023218154907227, "global_step": 40779, "epoch": 242} {"train_loss": -7.942221164703369, "global_step": 40780, "epoch": 242} {"train_loss": -7.657417297363281, "global_step": 40781, "epoch": 242} {"train_loss": -7.85249137878418, "global_step": 40782, "epoch": 242} {"train_loss": -7.856420516967773, "global_step": 40783, "epoch": 242} {"train_loss": -7.908812999725342, "global_step": 40784, "epoch": 242} {"train_loss": -7.753952980041504, "global_step": 40785, "epoch": 242} {"train_loss": -7.879256248474121, "global_step": 40786, "epoch": 242} {"train_loss": -7.976406097412109, "global_step": 40787, "epoch": 242} {"train_loss": -7.396107196807861, "global_step": 40788, "epoch": 242} {"train_loss": -7.9468817710876465, "global_step": 40789, "epoch": 242} {"train_loss": -7.927080154418945, "global_step": 40790, "epoch": 242} {"train_loss": -7.782201766967773, "global_step": 40791, "epoch": 242} {"train_loss": -7.536159038543701, "global_step": 40792, "epoch": 242} {"train_loss": -7.868093490600586, "global_step": 40793, "epoch": 242} {"train_loss": -7.829343795776367, "global_step": 40794, "epoch": 242} {"train_loss": -7.7011613845825195, "global_step": 40795, "epoch": 242} {"train_loss": -7.935216903686523, "global_step": 40796, "epoch": 242} {"train_loss": -7.792356967926025, "global_step": 40797, "epoch": 242} {"train_loss": -7.804567337036133, "global_step": 40798, "epoch": 242} {"train_loss": -7.899028301239014, "global_step": 40799, "epoch": 242} {"train_loss": -7.6032609939575195, "global_step": 40800, "epoch": 242} {"train_loss": -7.823248863220215, "global_step": 40801, "epoch": 242} {"train_loss": -7.787446975708008, "global_step": 40802, "epoch": 242} {"train_loss": -7.87022590637207, "global_step": 40803, "epoch": 242} {"train_loss": -7.995116710662842, "global_step": 40804, "epoch": 242} {"train_loss": -7.7886528968811035, "global_step": 40805, "epoch": 242} {"train_loss": -8.046652793884277, "global_step": 40806, "epoch": 242} {"train_loss": -7.791177272796631, "global_step": 40807, "epoch": 242} {"train_loss": -7.696627616882324, "global_step": 40808, "epoch": 242} {"train_loss": -7.925173759460449, "global_step": 40809, "epoch": 242} {"train_loss": -7.87362003326416, "global_step": 40810, "epoch": 242} {"train_loss": -7.849611282348633, "global_step": 40811, "epoch": 242} {"train_loss": -7.954070568084717, "global_step": 40812, "epoch": 242} {"train_loss": -7.821146011352539, "global_step": 40813, "epoch": 242} {"train_loss": -8.060606956481934, "global_step": 40814, "epoch": 242} {"train_loss": -8.072524070739746, "global_step": 40815, "epoch": 242} {"train_loss": -8.145184516906738, "global_step": 40816, "epoch": 242} {"train_loss": -7.941625595092773, "global_step": 40817, "epoch": 242} {"train_loss": -8.165143013000488, "global_step": 40818, "epoch": 242} {"train_loss": -7.977136611938477, "global_step": 40819, "epoch": 242} {"train_loss": -8.115042686462402, "global_step": 40820, "epoch": 242} {"train_loss": -7.974878787994385, "global_step": 40821, "epoch": 242} {"train_loss": -8.05813980102539, "global_step": 40822, "epoch": 242} {"train_loss": -7.935277496065412, "global_step": 40823, "epoch": 242, "val_loss": 185077.578125} {"train_loss": -8.123533248901367, "global_step": 40824, "epoch": 243} {"train_loss": -7.758968830108643, "global_step": 40825, "epoch": 243} {"train_loss": -8.028959274291992, "global_step": 40826, "epoch": 243} {"train_loss": -8.018796920776367, "global_step": 40827, "epoch": 243} {"train_loss": -7.7171502113342285, "global_step": 40828, "epoch": 243} {"train_loss": -7.917917251586914, "global_step": 40829, "epoch": 243} {"train_loss": -7.747776985168457, "global_step": 40830, "epoch": 243} {"train_loss": -8.015487670898438, "global_step": 40831, "epoch": 243} {"train_loss": -8.080791473388672, "global_step": 40832, "epoch": 243} {"train_loss": -7.863040924072266, "global_step": 40833, "epoch": 243} {"train_loss": -8.021185874938965, "global_step": 40834, "epoch": 243} {"train_loss": -7.961965084075928, "global_step": 40835, "epoch": 243} {"train_loss": -8.007804870605469, "global_step": 40836, "epoch": 243} {"train_loss": -8.038997650146484, "global_step": 40837, "epoch": 243} {"train_loss": -7.920377254486084, "global_step": 40838, "epoch": 243} {"train_loss": -7.986467361450195, "global_step": 40839, "epoch": 243} {"train_loss": -7.78165864944458, "global_step": 40840, "epoch": 243} {"train_loss": -7.96442985534668, "global_step": 40841, "epoch": 243} {"train_loss": -7.742702960968018, "global_step": 40842, "epoch": 243} {"train_loss": -8.019566535949707, "global_step": 40843, "epoch": 243} {"train_loss": -7.908431529998779, "global_step": 40844, "epoch": 243} {"train_loss": -8.135141372680664, "global_step": 40845, "epoch": 243} {"train_loss": -8.00056266784668, "global_step": 40846, "epoch": 243} {"train_loss": -7.953831672668457, "global_step": 40847, "epoch": 243} {"train_loss": -8.105171203613281, "global_step": 40848, "epoch": 243} {"train_loss": -7.640995502471924, "global_step": 40849, "epoch": 243} {"train_loss": -8.151022911071777, "global_step": 40850, "epoch": 243} {"train_loss": -8.116083145141602, "global_step": 40851, "epoch": 243} {"train_loss": -8.05009651184082, "global_step": 40852, "epoch": 243} {"train_loss": -8.066276550292969, "global_step": 40853, "epoch": 243} {"train_loss": -8.154936790466309, "global_step": 40854, "epoch": 243} {"train_loss": -8.12801456451416, "global_step": 40855, "epoch": 243} {"train_loss": -8.150978088378906, "global_step": 40856, "epoch": 243} {"train_loss": -8.147502899169922, "global_step": 40857, "epoch": 243} {"train_loss": -8.232337951660156, "global_step": 40858, "epoch": 243} {"train_loss": -8.239385604858398, "global_step": 40859, "epoch": 243} {"train_loss": -8.104448318481445, "global_step": 40860, "epoch": 243} {"train_loss": -8.065991401672363, "global_step": 40861, "epoch": 243} {"train_loss": -7.97158670425415, "global_step": 40862, "epoch": 243} {"train_loss": -7.918554306030273, "global_step": 40863, "epoch": 243} {"train_loss": -8.008530616760254, "global_step": 40864, "epoch": 243} {"train_loss": -8.191210746765137, "global_step": 40865, "epoch": 243} {"train_loss": -8.140830993652344, "global_step": 40866, "epoch": 243} {"train_loss": -8.051551818847656, "global_step": 40867, "epoch": 243} {"train_loss": -8.199409484863281, "global_step": 40868, "epoch": 243} {"train_loss": -7.942469596862793, "global_step": 40869, "epoch": 243} {"train_loss": -7.917570114135742, "global_step": 40870, "epoch": 243} {"train_loss": -8.00358772277832, "global_step": 40871, "epoch": 243} {"train_loss": -7.6013031005859375, "global_step": 40872, "epoch": 243} {"train_loss": -8.010337829589844, "global_step": 40873, "epoch": 243} {"train_loss": -7.383788108825684, "global_step": 40874, "epoch": 243} {"train_loss": -7.841022491455078, "global_step": 40875, "epoch": 243} {"train_loss": -7.427006244659424, "global_step": 40876, "epoch": 243} {"train_loss": -7.673848628997803, "global_step": 40877, "epoch": 243} {"train_loss": -7.726805686950684, "global_step": 40878, "epoch": 243} {"train_loss": -7.9332098960876465, "global_step": 40879, "epoch": 243} {"train_loss": -7.7583465576171875, "global_step": 40880, "epoch": 243} {"train_loss": -7.838508605957031, "global_step": 40881, "epoch": 243} {"train_loss": -7.994579315185547, "global_step": 40882, "epoch": 243} {"train_loss": -7.775850296020508, "global_step": 40883, "epoch": 243} {"train_loss": -7.861382484436035, "global_step": 40884, "epoch": 243} {"train_loss": -7.775973320007324, "global_step": 40885, "epoch": 243} {"train_loss": -7.950093746185303, "global_step": 40886, "epoch": 243} {"train_loss": -7.819191932678223, "global_step": 40887, "epoch": 243} {"train_loss": -7.892764091491699, "global_step": 40888, "epoch": 243} {"train_loss": -7.716708183288574, "global_step": 40889, "epoch": 243} {"train_loss": -7.944830894470215, "global_step": 40890, "epoch": 243} {"train_loss": -8.03093147277832, "global_step": 40891, "epoch": 243} {"train_loss": -8.0278959274292, "global_step": 40892, "epoch": 243} {"train_loss": -8.007568359375, "global_step": 40893, "epoch": 243} {"train_loss": -8.02202033996582, "global_step": 40894, "epoch": 243} {"train_loss": -7.86453914642334, "global_step": 40895, "epoch": 243} {"train_loss": -7.932865142822266, "global_step": 40896, "epoch": 243} {"train_loss": -7.870456695556641, "global_step": 40897, "epoch": 243} {"train_loss": -7.925943851470947, "global_step": 40898, "epoch": 243} {"train_loss": -7.969968795776367, "global_step": 40899, "epoch": 243} {"train_loss": -7.830667018890381, "global_step": 40900, "epoch": 243} {"train_loss": -8.093696594238281, "global_step": 40901, "epoch": 243} {"train_loss": -7.706799507141113, "global_step": 40902, "epoch": 243} {"train_loss": -8.047218322753906, "global_step": 40903, "epoch": 243} {"train_loss": -7.887179851531982, "global_step": 40904, "epoch": 243} {"train_loss": -7.972805500030518, "global_step": 40905, "epoch": 243} {"train_loss": -7.755390167236328, "global_step": 40906, "epoch": 243} {"train_loss": -8.100854873657227, "global_step": 40907, "epoch": 243} {"train_loss": -8.132811546325684, "global_step": 40908, "epoch": 243} {"train_loss": -7.946152210235596, "global_step": 40909, "epoch": 243} {"train_loss": -8.074469566345215, "global_step": 40910, "epoch": 243} {"train_loss": -7.975471496582031, "global_step": 40911, "epoch": 243} {"train_loss": -7.940284252166748, "global_step": 40912, "epoch": 243} {"train_loss": -7.787932395935059, "global_step": 40913, "epoch": 243} {"train_loss": -8.066520690917969, "global_step": 40914, "epoch": 243} {"train_loss": -8.00925064086914, "global_step": 40915, "epoch": 243} {"train_loss": -8.14428997039795, "global_step": 40916, "epoch": 243} {"train_loss": -7.9826340675354, "global_step": 40917, "epoch": 243} {"train_loss": -8.069602966308594, "global_step": 40918, "epoch": 243} {"train_loss": -8.219408988952637, "global_step": 40919, "epoch": 243} {"train_loss": -7.793757438659668, "global_step": 40920, "epoch": 243} {"train_loss": -7.967465877532959, "global_step": 40921, "epoch": 243} {"train_loss": -7.774916648864746, "global_step": 40922, "epoch": 243} {"train_loss": -8.13349723815918, "global_step": 40923, "epoch": 243} {"train_loss": -7.917168617248535, "global_step": 40924, "epoch": 243} {"train_loss": -8.159991264343262, "global_step": 40925, "epoch": 243} {"train_loss": -7.886924743652344, "global_step": 40926, "epoch": 243} {"train_loss": -7.960926532745361, "global_step": 40927, "epoch": 243} {"train_loss": -7.901817798614502, "global_step": 40928, "epoch": 243} {"train_loss": -7.915763854980469, "global_step": 40929, "epoch": 243} {"train_loss": -7.870757102966309, "global_step": 40930, "epoch": 243} {"train_loss": -8.063825607299805, "global_step": 40931, "epoch": 243} {"train_loss": -8.109359741210938, "global_step": 40932, "epoch": 243} {"train_loss": -7.799881458282471, "global_step": 40933, "epoch": 243} {"train_loss": -7.909907341003418, "global_step": 40934, "epoch": 243} {"train_loss": -8.022054672241211, "global_step": 40935, "epoch": 243} {"train_loss": -7.926183700561523, "global_step": 40936, "epoch": 243} {"train_loss": -7.911468029022217, "global_step": 40937, "epoch": 243} {"train_loss": -7.870322227478027, "global_step": 40938, "epoch": 243} {"train_loss": -8.01537036895752, "global_step": 40939, "epoch": 243} {"train_loss": -7.990050315856934, "global_step": 40940, "epoch": 243} {"train_loss": -7.719557762145996, "global_step": 40941, "epoch": 243} {"train_loss": -7.786574363708496, "global_step": 40942, "epoch": 243} {"train_loss": -7.929666519165039, "global_step": 40943, "epoch": 243} {"train_loss": -7.634336471557617, "global_step": 40944, "epoch": 243} {"train_loss": -8.108034133911133, "global_step": 40945, "epoch": 243} {"train_loss": -7.903461456298828, "global_step": 40946, "epoch": 243} {"train_loss": -8.093996047973633, "global_step": 40947, "epoch": 243} {"train_loss": -7.962135314941406, "global_step": 40948, "epoch": 243} {"train_loss": -7.913315296173096, "global_step": 40949, "epoch": 243} {"train_loss": -7.8592305183410645, "global_step": 40950, "epoch": 243} {"train_loss": -7.663492202758789, "global_step": 40951, "epoch": 243} {"train_loss": -7.913103103637695, "global_step": 40952, "epoch": 243} {"train_loss": -7.731679916381836, "global_step": 40953, "epoch": 243} {"train_loss": -7.860510349273682, "global_step": 40954, "epoch": 243} {"train_loss": -7.732344627380371, "global_step": 40955, "epoch": 243} {"train_loss": -7.905731201171875, "global_step": 40956, "epoch": 243} {"train_loss": -7.986910820007324, "global_step": 40957, "epoch": 243} {"train_loss": -8.04520320892334, "global_step": 40958, "epoch": 243} {"train_loss": -8.012673377990723, "global_step": 40959, "epoch": 243} {"train_loss": -7.874073028564453, "global_step": 40960, "epoch": 243} {"train_loss": -8.094223022460938, "global_step": 40961, "epoch": 243} {"train_loss": -7.920723915100098, "global_step": 40962, "epoch": 243} {"train_loss": -7.943389892578125, "global_step": 40963, "epoch": 243} {"train_loss": -7.965303421020508, "global_step": 40964, "epoch": 243} {"train_loss": -7.774527072906494, "global_step": 40965, "epoch": 243} {"train_loss": -7.996926307678223, "global_step": 40966, "epoch": 243} {"train_loss": -7.657725811004639, "global_step": 40967, "epoch": 243} {"train_loss": -7.815806865692139, "global_step": 40968, "epoch": 243} {"train_loss": -7.792849540710449, "global_step": 40969, "epoch": 243} {"train_loss": -7.919710159301758, "global_step": 40970, "epoch": 243} {"train_loss": -8.134730339050293, "global_step": 40971, "epoch": 243} {"train_loss": -7.824871063232422, "global_step": 40972, "epoch": 243} {"train_loss": -8.1100492477417, "global_step": 40973, "epoch": 243} {"train_loss": -8.042445182800293, "global_step": 40974, "epoch": 243} {"train_loss": -8.146547317504883, "global_step": 40975, "epoch": 243} {"train_loss": -7.908167839050293, "global_step": 40976, "epoch": 243} {"train_loss": -7.756229400634766, "global_step": 40977, "epoch": 243} {"train_loss": -7.868428707122803, "global_step": 40978, "epoch": 243} {"train_loss": -7.9247307777404785, "global_step": 40979, "epoch": 243} {"train_loss": -8.20777702331543, "global_step": 40980, "epoch": 243} {"train_loss": -8.067334175109863, "global_step": 40981, "epoch": 243} {"train_loss": -8.079852104187012, "global_step": 40982, "epoch": 243} {"train_loss": -7.547102928161621, "global_step": 40983, "epoch": 243} {"train_loss": -8.086721420288086, "global_step": 40984, "epoch": 243} {"train_loss": -7.624104976654053, "global_step": 40985, "epoch": 243} {"train_loss": -7.924528121948242, "global_step": 40986, "epoch": 243} {"train_loss": -8.015069961547852, "global_step": 40987, "epoch": 243} {"train_loss": -7.843317985534668, "global_step": 40988, "epoch": 243} {"train_loss": -7.67463493347168, "global_step": 40989, "epoch": 243} {"train_loss": -7.897346496582031, "global_step": 40990, "epoch": 243} {"train_loss": -7.937766293684642, "global_step": 40991, "epoch": 243, "val_loss": 188080.46875} {"train_loss": -7.988940715789795, "global_step": 40992, "epoch": 244} {"train_loss": -8.037044525146484, "global_step": 40993, "epoch": 244} {"train_loss": -7.8508100509643555, "global_step": 40994, "epoch": 244} {"train_loss": -7.718520164489746, "global_step": 40995, "epoch": 244} {"train_loss": -7.908522605895996, "global_step": 40996, "epoch": 244} {"train_loss": -7.683565139770508, "global_step": 40997, "epoch": 244} {"train_loss": -7.734777927398682, "global_step": 40998, "epoch": 244} {"train_loss": -7.934680938720703, "global_step": 40999, "epoch": 244} {"train_loss": -7.487110137939453, "global_step": 41000, "epoch": 244} {"train_loss": -7.851889133453369, "global_step": 41001, "epoch": 244} {"train_loss": -7.6877970695495605, "global_step": 41002, "epoch": 244} {"train_loss": -7.605184555053711, "global_step": 41003, "epoch": 244} {"train_loss": -7.6729607582092285, "global_step": 41004, "epoch": 244} {"train_loss": -7.960272789001465, "global_step": 41005, "epoch": 244} {"train_loss": -7.4853515625, "global_step": 41006, "epoch": 244} {"train_loss": -8.072543144226074, "global_step": 41007, "epoch": 244} {"train_loss": -7.769401550292969, "global_step": 41008, "epoch": 244} {"train_loss": -7.942644119262695, "global_step": 41009, "epoch": 244} {"train_loss": -7.967323303222656, "global_step": 41010, "epoch": 244} {"train_loss": -7.960970878601074, "global_step": 41011, "epoch": 244} {"train_loss": -8.02795696258545, "global_step": 41012, "epoch": 244} {"train_loss": -8.011130332946777, "global_step": 41013, "epoch": 244} {"train_loss": -7.876452445983887, "global_step": 41014, "epoch": 244} {"train_loss": -7.968536376953125, "global_step": 41015, "epoch": 244} {"train_loss": -8.016302108764648, "global_step": 41016, "epoch": 244} {"train_loss": -7.894172668457031, "global_step": 41017, "epoch": 244} {"train_loss": -7.790585041046143, "global_step": 41018, "epoch": 244} {"train_loss": -8.071825981140137, "global_step": 41019, "epoch": 244} {"train_loss": -8.043416023254395, "global_step": 41020, "epoch": 244} {"train_loss": -8.105130195617676, "global_step": 41021, "epoch": 244} {"train_loss": -7.900310039520264, "global_step": 41022, "epoch": 244} {"train_loss": -8.039865493774414, "global_step": 41023, "epoch": 244} {"train_loss": -8.090612411499023, "global_step": 41024, "epoch": 244} {"train_loss": -8.116485595703125, "global_step": 41025, "epoch": 244} {"train_loss": -8.249007225036621, "global_step": 41026, "epoch": 244} {"train_loss": -7.967209815979004, "global_step": 41027, "epoch": 244} {"train_loss": -7.986390113830566, "global_step": 41028, "epoch": 244} {"train_loss": -8.065080642700195, "global_step": 41029, "epoch": 244} {"train_loss": -8.195131301879883, "global_step": 41030, "epoch": 244} {"train_loss": -8.066452026367188, "global_step": 41031, "epoch": 244} {"train_loss": -8.000650405883789, "global_step": 41032, "epoch": 244} {"train_loss": -7.992312908172607, "global_step": 41033, "epoch": 244} {"train_loss": -8.063920974731445, "global_step": 41034, "epoch": 244} {"train_loss": -7.753711223602295, "global_step": 41035, "epoch": 244} {"train_loss": -7.8690667152404785, "global_step": 41036, "epoch": 244} {"train_loss": -8.229042053222656, "global_step": 41037, "epoch": 244} {"train_loss": -8.025253295898438, "global_step": 41038, "epoch": 244} {"train_loss": -8.091390609741211, "global_step": 41039, "epoch": 244} {"train_loss": -8.087423324584961, "global_step": 41040, "epoch": 244} {"train_loss": -7.958981513977051, "global_step": 41041, "epoch": 244} {"train_loss": -8.008885383605957, "global_step": 41042, "epoch": 244} {"train_loss": -8.034367561340332, "global_step": 41043, "epoch": 244} {"train_loss": -7.724974632263184, "global_step": 41044, "epoch": 244} {"train_loss": -7.6743974685668945, "global_step": 41045, "epoch": 244} {"train_loss": -7.885426044464111, "global_step": 41046, "epoch": 244} {"train_loss": -7.941847801208496, "global_step": 41047, "epoch": 244} {"train_loss": -7.977902412414551, "global_step": 41048, "epoch": 244} {"train_loss": -7.802138328552246, "global_step": 41049, "epoch": 244} {"train_loss": -8.010257720947266, "global_step": 41050, "epoch": 244} {"train_loss": -7.826459884643555, "global_step": 41051, "epoch": 244} {"train_loss": -8.15721321105957, "global_step": 41052, "epoch": 244} {"train_loss": -8.020212173461914, "global_step": 41053, "epoch": 244} {"train_loss": -7.956849098205566, "global_step": 41054, "epoch": 244} {"train_loss": -8.006850242614746, "global_step": 41055, "epoch": 244} {"train_loss": -7.9217119216918945, "global_step": 41056, "epoch": 244} {"train_loss": -7.816102981567383, "global_step": 41057, "epoch": 244} {"train_loss": -7.862520217895508, "global_step": 41058, "epoch": 244} {"train_loss": -7.900302886962891, "global_step": 41059, "epoch": 244} {"train_loss": -7.912432670593262, "global_step": 41060, "epoch": 244} {"train_loss": -7.901391506195068, "global_step": 41061, "epoch": 244} {"train_loss": -8.137458801269531, "global_step": 41062, "epoch": 244} {"train_loss": -7.872972011566162, "global_step": 41063, "epoch": 244} {"train_loss": -7.905470848083496, "global_step": 41064, "epoch": 244} {"train_loss": -7.890280723571777, "global_step": 41065, "epoch": 244} {"train_loss": -7.796022415161133, "global_step": 41066, "epoch": 244} {"train_loss": -7.924355506896973, "global_step": 41067, "epoch": 244} {"train_loss": -7.935785293579102, "global_step": 41068, "epoch": 244} {"train_loss": -7.885115623474121, "global_step": 41069, "epoch": 244} {"train_loss": -7.96736478805542, "global_step": 41070, "epoch": 244} {"train_loss": -7.884468078613281, "global_step": 41071, "epoch": 244} {"train_loss": -7.503688812255859, "global_step": 41072, "epoch": 244} {"train_loss": -8.0204496383667, "global_step": 41073, "epoch": 244} {"train_loss": -7.737827777862549, "global_step": 41074, "epoch": 244} {"train_loss": -7.976091384887695, "global_step": 41075, "epoch": 244} {"train_loss": -7.915904521942139, "global_step": 41076, "epoch": 244} {"train_loss": -8.063331604003906, "global_step": 41077, "epoch": 244} {"train_loss": -7.842884063720703, "global_step": 41078, "epoch": 244} {"train_loss": -8.020683288574219, "global_step": 41079, "epoch": 244} {"train_loss": -7.964939117431641, "global_step": 41080, "epoch": 244} {"train_loss": -7.986636638641357, "global_step": 41081, "epoch": 244} {"train_loss": -7.693539619445801, "global_step": 41082, "epoch": 244} {"train_loss": -7.81752872467041, "global_step": 41083, "epoch": 244} {"train_loss": -7.887806415557861, "global_step": 41084, "epoch": 244} {"train_loss": -7.993887901306152, "global_step": 41085, "epoch": 244} {"train_loss": -8.030494689941406, "global_step": 41086, "epoch": 244} {"train_loss": -7.926284313201904, "global_step": 41087, "epoch": 244} {"train_loss": -8.133573532104492, "global_step": 41088, "epoch": 244} {"train_loss": -8.157447814941406, "global_step": 41089, "epoch": 244} {"train_loss": -8.218311309814453, "global_step": 41090, "epoch": 244} {"train_loss": -8.031530380249023, "global_step": 41091, "epoch": 244} {"train_loss": -7.977813243865967, "global_step": 41092, "epoch": 244} {"train_loss": -8.149054527282715, "global_step": 41093, "epoch": 244} {"train_loss": -8.276623725891113, "global_step": 41094, "epoch": 244} {"train_loss": -8.049485206604004, "global_step": 41095, "epoch": 244} {"train_loss": -8.270570755004883, "global_step": 41096, "epoch": 244} {"train_loss": -8.026740074157715, "global_step": 41097, "epoch": 244} {"train_loss": -8.25067138671875, "global_step": 41098, "epoch": 244} {"train_loss": -8.251714706420898, "global_step": 41099, "epoch": 244} {"train_loss": -7.932610988616943, "global_step": 41100, "epoch": 244} {"train_loss": -7.958178997039795, "global_step": 41101, "epoch": 244} {"train_loss": -7.88570499420166, "global_step": 41102, "epoch": 244} {"train_loss": -7.998269081115723, "global_step": 41103, "epoch": 244} {"train_loss": -8.100914001464844, "global_step": 41104, "epoch": 244} {"train_loss": -7.7946929931640625, "global_step": 41105, "epoch": 244} {"train_loss": -7.922224044799805, "global_step": 41106, "epoch": 244} {"train_loss": -8.251770973205566, "global_step": 41107, "epoch": 244} {"train_loss": -7.413125038146973, "global_step": 41108, "epoch": 244} {"train_loss": -7.792166709899902, "global_step": 41109, "epoch": 244} {"train_loss": -7.5795369148254395, "global_step": 41110, "epoch": 244} {"train_loss": -7.924582481384277, "global_step": 41111, "epoch": 244} {"train_loss": -7.344551086425781, "global_step": 41112, "epoch": 244} {"train_loss": -7.536164283752441, "global_step": 41113, "epoch": 244} {"train_loss": -7.492232799530029, "global_step": 41114, "epoch": 244} {"train_loss": -7.620846271514893, "global_step": 41115, "epoch": 244} {"train_loss": -7.609528541564941, "global_step": 41116, "epoch": 244} {"train_loss": -7.783895492553711, "global_step": 41117, "epoch": 244} {"train_loss": -7.481531143188477, "global_step": 41118, "epoch": 244} {"train_loss": -7.815959930419922, "global_step": 41119, "epoch": 244} {"train_loss": -7.667234420776367, "global_step": 41120, "epoch": 244} {"train_loss": -7.364112854003906, "global_step": 41121, "epoch": 244} {"train_loss": -7.650866985321045, "global_step": 41122, "epoch": 244} {"train_loss": -7.634827136993408, "global_step": 41123, "epoch": 244} {"train_loss": -7.555186748504639, "global_step": 41124, "epoch": 244} {"train_loss": -7.823263168334961, "global_step": 41125, "epoch": 244} {"train_loss": -7.859638690948486, "global_step": 41126, "epoch": 244} {"train_loss": -7.574067115783691, "global_step": 41127, "epoch": 244} {"train_loss": -7.763069152832031, "global_step": 41128, "epoch": 244} {"train_loss": -7.8204193115234375, "global_step": 41129, "epoch": 244} {"train_loss": -7.8353471755981445, "global_step": 41130, "epoch": 244} {"train_loss": -7.779886722564697, "global_step": 41131, "epoch": 244} {"train_loss": -7.7218451499938965, "global_step": 41132, "epoch": 244} {"train_loss": -8.084165573120117, "global_step": 41133, "epoch": 244} {"train_loss": -7.982161521911621, "global_step": 41134, "epoch": 244} {"train_loss": -7.978826522827148, "global_step": 41135, "epoch": 244} {"train_loss": -8.107450485229492, "global_step": 41136, "epoch": 244} {"train_loss": -8.113578796386719, "global_step": 41137, "epoch": 244} {"train_loss": -7.970757007598877, "global_step": 41138, "epoch": 244} {"train_loss": -8.025642395019531, "global_step": 41139, "epoch": 244} {"train_loss": -8.111852645874023, "global_step": 41140, "epoch": 244} {"train_loss": -8.046186447143555, "global_step": 41141, "epoch": 244} {"train_loss": -7.915616035461426, "global_step": 41142, "epoch": 244} {"train_loss": -8.08951473236084, "global_step": 41143, "epoch": 244} {"train_loss": -8.185111999511719, "global_step": 41144, "epoch": 244} {"train_loss": -8.197420120239258, "global_step": 41145, "epoch": 244} {"train_loss": -8.183347702026367, "global_step": 41146, "epoch": 244} {"train_loss": -8.305232048034668, "global_step": 41147, "epoch": 244} {"train_loss": -8.17036247253418, "global_step": 41148, "epoch": 244} {"train_loss": -8.304420471191406, "global_step": 41149, "epoch": 244} {"train_loss": -8.119516372680664, "global_step": 41150, "epoch": 244} {"train_loss": -8.27168083190918, "global_step": 41151, "epoch": 244} {"train_loss": -8.294707298278809, "global_step": 41152, "epoch": 244} {"train_loss": -8.096752166748047, "global_step": 41153, "epoch": 244} {"train_loss": -8.064098358154297, "global_step": 41154, "epoch": 244} {"train_loss": -7.716119766235352, "global_step": 41155, "epoch": 244} {"train_loss": -7.911520004272461, "global_step": 41156, "epoch": 244} {"train_loss": -7.949736595153809, "global_step": 41157, "epoch": 244} {"train_loss": -7.98567008972168, "global_step": 41158, "epoch": 244} {"train_loss": -7.930332178161258, "global_step": 41159, "epoch": 244, "val_loss": 185686.6875} {"train_loss": -8.17719841003418, "global_step": 41160, "epoch": 245} {"train_loss": -7.879090309143066, "global_step": 41161, "epoch": 245} {"train_loss": -7.748760223388672, "global_step": 41162, "epoch": 245} {"train_loss": -7.968562602996826, "global_step": 41163, "epoch": 245} {"train_loss": -7.66972541809082, "global_step": 41164, "epoch": 245} {"train_loss": -7.935691833496094, "global_step": 41165, "epoch": 245} {"train_loss": -7.691247463226318, "global_step": 41166, "epoch": 245} {"train_loss": -7.953916549682617, "global_step": 41167, "epoch": 245} {"train_loss": -7.815732002258301, "global_step": 41168, "epoch": 245} {"train_loss": -7.870239734649658, "global_step": 41169, "epoch": 245} {"train_loss": -7.501959800720215, "global_step": 41170, "epoch": 245} {"train_loss": -7.841592788696289, "global_step": 41171, "epoch": 245} {"train_loss": -7.854720115661621, "global_step": 41172, "epoch": 245} {"train_loss": -7.773689270019531, "global_step": 41173, "epoch": 245} {"train_loss": -7.639254570007324, "global_step": 41174, "epoch": 245} {"train_loss": -7.694554328918457, "global_step": 41175, "epoch": 245} {"train_loss": -7.727924823760986, "global_step": 41176, "epoch": 245} {"train_loss": -7.717381477355957, "global_step": 41177, "epoch": 245} {"train_loss": -7.856925010681152, "global_step": 41178, "epoch": 245} {"train_loss": -8.0198974609375, "global_step": 41179, "epoch": 245} {"train_loss": -7.703136920928955, "global_step": 41180, "epoch": 245} {"train_loss": -7.9960832595825195, "global_step": 41181, "epoch": 245} {"train_loss": -8.07150650024414, "global_step": 41182, "epoch": 245} {"train_loss": -7.984823703765869, "global_step": 41183, "epoch": 245} {"train_loss": -8.035696029663086, "global_step": 41184, "epoch": 245} {"train_loss": -7.800277233123779, "global_step": 41185, "epoch": 245} {"train_loss": -7.946697235107422, "global_step": 41186, "epoch": 245} {"train_loss": -8.076332092285156, "global_step": 41187, "epoch": 245} {"train_loss": -8.030923843383789, "global_step": 41188, "epoch": 245} {"train_loss": -7.980999946594238, "global_step": 41189, "epoch": 245} {"train_loss": -8.113612174987793, "global_step": 41190, "epoch": 245} {"train_loss": -8.017210006713867, "global_step": 41191, "epoch": 245} {"train_loss": -8.161112785339355, "global_step": 41192, "epoch": 245} {"train_loss": -8.196599960327148, "global_step": 41193, "epoch": 245} {"train_loss": -8.163055419921875, "global_step": 41194, "epoch": 245} {"train_loss": -8.030363082885742, "global_step": 41195, "epoch": 245} {"train_loss": -7.951273441314697, "global_step": 41196, "epoch": 245} {"train_loss": -7.807304382324219, "global_step": 41197, "epoch": 245} {"train_loss": -8.03158950805664, "global_step": 41198, "epoch": 245} {"train_loss": -7.896482944488525, "global_step": 41199, "epoch": 245} {"train_loss": -7.995630264282227, "global_step": 41200, "epoch": 245} {"train_loss": -7.885016441345215, "global_step": 41201, "epoch": 245} {"train_loss": -8.352022171020508, "global_step": 41202, "epoch": 245} {"train_loss": -7.974577903747559, "global_step": 41203, "epoch": 245} {"train_loss": -7.587926864624023, "global_step": 41204, "epoch": 245} {"train_loss": -8.256233215332031, "global_step": 41205, "epoch": 245} {"train_loss": -7.855405330657959, "global_step": 41206, "epoch": 245} {"train_loss": -7.875838756561279, "global_step": 41207, "epoch": 245} {"train_loss": -8.007918357849121, "global_step": 41208, "epoch": 245} {"train_loss": -8.264888763427734, "global_step": 41209, "epoch": 245} {"train_loss": -7.5748701095581055, "global_step": 41210, "epoch": 245} {"train_loss": -8.25776481628418, "global_step": 41211, "epoch": 245} {"train_loss": -7.471879959106445, "global_step": 41212, "epoch": 245} {"train_loss": -7.914804458618164, "global_step": 41213, "epoch": 245} {"train_loss": -7.821222305297852, "global_step": 41214, "epoch": 245} {"train_loss": -7.985940933227539, "global_step": 41215, "epoch": 245} {"train_loss": -7.671948432922363, "global_step": 41216, "epoch": 245} {"train_loss": -7.905439376831055, "global_step": 41217, "epoch": 245} {"train_loss": -7.878323078155518, "global_step": 41218, "epoch": 245} {"train_loss": -7.927182197570801, "global_step": 41219, "epoch": 245} {"train_loss": -8.07994270324707, "global_step": 41220, "epoch": 245} {"train_loss": -7.974343299865723, "global_step": 41221, "epoch": 245} {"train_loss": -8.042242050170898, "global_step": 41222, "epoch": 245} {"train_loss": -8.138509750366211, "global_step": 41223, "epoch": 245} {"train_loss": -7.877110481262207, "global_step": 41224, "epoch": 245} {"train_loss": -8.218465805053711, "global_step": 41225, "epoch": 245} {"train_loss": -8.077832221984863, "global_step": 41226, "epoch": 245} {"train_loss": -8.262186050415039, "global_step": 41227, "epoch": 245} {"train_loss": -7.752712249755859, "global_step": 41228, "epoch": 245} {"train_loss": -7.773625373840332, "global_step": 41229, "epoch": 245} {"train_loss": -7.655722141265869, "global_step": 41230, "epoch": 245} {"train_loss": -8.031913757324219, "global_step": 41231, "epoch": 245} {"train_loss": -7.983508586883545, "global_step": 41232, "epoch": 245} {"train_loss": -7.517364501953125, "global_step": 41233, "epoch": 245} {"train_loss": -7.311803817749023, "global_step": 41234, "epoch": 245} {"train_loss": -7.864195823669434, "global_step": 41235, "epoch": 245} {"train_loss": -7.3652262687683105, "global_step": 41236, "epoch": 245} {"train_loss": -7.518876552581787, "global_step": 41237, "epoch": 245} {"train_loss": -7.875758647918701, "global_step": 41238, "epoch": 245} {"train_loss": -7.684015274047852, "global_step": 41239, "epoch": 245} {"train_loss": -7.627906322479248, "global_step": 41240, "epoch": 245} {"train_loss": -7.760646820068359, "global_step": 41241, "epoch": 245} {"train_loss": -7.809248447418213, "global_step": 41242, "epoch": 245} {"train_loss": -7.794708728790283, "global_step": 41243, "epoch": 245} {"train_loss": -7.786219596862793, "global_step": 41244, "epoch": 245} {"train_loss": -7.969510078430176, "global_step": 41245, "epoch": 245} {"train_loss": -7.978994846343994, "global_step": 41246, "epoch": 245} {"train_loss": -7.902780532836914, "global_step": 41247, "epoch": 245} {"train_loss": -7.926738739013672, "global_step": 41248, "epoch": 245} {"train_loss": -7.920197010040283, "global_step": 41249, "epoch": 245} {"train_loss": -8.050419807434082, "global_step": 41250, "epoch": 245} {"train_loss": -7.730750560760498, "global_step": 41251, "epoch": 245} {"train_loss": -8.011589050292969, "global_step": 41252, "epoch": 245} {"train_loss": -7.869433403015137, "global_step": 41253, "epoch": 245} {"train_loss": -8.039655685424805, "global_step": 41254, "epoch": 245} {"train_loss": -7.777550220489502, "global_step": 41255, "epoch": 245} {"train_loss": -7.936607360839844, "global_step": 41256, "epoch": 245} {"train_loss": -8.133530616760254, "global_step": 41257, "epoch": 245} {"train_loss": -8.078874588012695, "global_step": 41258, "epoch": 245} {"train_loss": -7.980515956878662, "global_step": 41259, "epoch": 245} {"train_loss": -7.995423316955566, "global_step": 41260, "epoch": 245} {"train_loss": -8.108891487121582, "global_step": 41261, "epoch": 245} {"train_loss": -8.014745712280273, "global_step": 41262, "epoch": 245} {"train_loss": -7.978810787200928, "global_step": 41263, "epoch": 245} {"train_loss": -8.278084754943848, "global_step": 41264, "epoch": 245} {"train_loss": -8.01850414276123, "global_step": 41265, "epoch": 245} {"train_loss": -8.219978332519531, "global_step": 41266, "epoch": 245} {"train_loss": -7.826308250427246, "global_step": 41267, "epoch": 245} {"train_loss": -8.014188766479492, "global_step": 41268, "epoch": 245} {"train_loss": -8.261636734008789, "global_step": 41269, "epoch": 245} {"train_loss": -8.067495346069336, "global_step": 41270, "epoch": 245} {"train_loss": -8.015817642211914, "global_step": 41271, "epoch": 245} {"train_loss": -8.124731063842773, "global_step": 41272, "epoch": 245} {"train_loss": -8.145342826843262, "global_step": 41273, "epoch": 245} {"train_loss": -7.854554176330566, "global_step": 41274, "epoch": 245} {"train_loss": -7.909233093261719, "global_step": 41275, "epoch": 245} {"train_loss": -7.96812629699707, "global_step": 41276, "epoch": 245} {"train_loss": -7.9289655685424805, "global_step": 41277, "epoch": 245} {"train_loss": -8.252832412719727, "global_step": 41278, "epoch": 245} {"train_loss": -7.822763919830322, "global_step": 41279, "epoch": 245} {"train_loss": -8.208187103271484, "global_step": 41280, "epoch": 245} {"train_loss": -8.027623176574707, "global_step": 41281, "epoch": 245} {"train_loss": -8.002594947814941, "global_step": 41282, "epoch": 245} {"train_loss": -7.974361419677734, "global_step": 41283, "epoch": 245} {"train_loss": -8.03398609161377, "global_step": 41284, "epoch": 245} {"train_loss": -8.122011184692383, "global_step": 41285, "epoch": 245} {"train_loss": -8.198570251464844, "global_step": 41286, "epoch": 245} {"train_loss": -7.955105781555176, "global_step": 41287, "epoch": 245} {"train_loss": -8.078817367553711, "global_step": 41288, "epoch": 245} {"train_loss": -7.9546122550964355, "global_step": 41289, "epoch": 245} {"train_loss": -7.8700947761535645, "global_step": 41290, "epoch": 245} {"train_loss": -7.980914115905762, "global_step": 41291, "epoch": 245} {"train_loss": -7.734777927398682, "global_step": 41292, "epoch": 245} {"train_loss": -7.693392276763916, "global_step": 41293, "epoch": 245} {"train_loss": -7.978658199310303, "global_step": 41294, "epoch": 245} {"train_loss": -7.892280578613281, "global_step": 41295, "epoch": 245} {"train_loss": -8.129046440124512, "global_step": 41296, "epoch": 245} {"train_loss": -8.024709701538086, "global_step": 41297, "epoch": 245} {"train_loss": -8.037904739379883, "global_step": 41298, "epoch": 245} {"train_loss": -7.807260513305664, "global_step": 41299, "epoch": 245} {"train_loss": -8.043547630310059, "global_step": 41300, "epoch": 245} {"train_loss": -8.072032928466797, "global_step": 41301, "epoch": 245} {"train_loss": -8.04318904876709, "global_step": 41302, "epoch": 245} {"train_loss": -7.965680122375488, "global_step": 41303, "epoch": 245} {"train_loss": -7.949444770812988, "global_step": 41304, "epoch": 245} {"train_loss": -7.775268077850342, "global_step": 41305, "epoch": 245} {"train_loss": -7.852752208709717, "global_step": 41306, "epoch": 245} {"train_loss": -7.689084529876709, "global_step": 41307, "epoch": 245} {"train_loss": -7.738409519195557, "global_step": 41308, "epoch": 245} {"train_loss": -8.001631736755371, "global_step": 41309, "epoch": 245} {"train_loss": -8.04858112335205, "global_step": 41310, "epoch": 245} {"train_loss": -7.947646617889404, "global_step": 41311, "epoch": 245} {"train_loss": -7.844658851623535, "global_step": 41312, "epoch": 245} {"train_loss": -8.052499771118164, "global_step": 41313, "epoch": 245} {"train_loss": -7.931513786315918, "global_step": 41314, "epoch": 245} {"train_loss": -7.882171154022217, "global_step": 41315, "epoch": 245} {"train_loss": -7.998890399932861, "global_step": 41316, "epoch": 245} {"train_loss": -8.074527740478516, "global_step": 41317, "epoch": 245} {"train_loss": -8.018339157104492, "global_step": 41318, "epoch": 245} {"train_loss": -7.894081115722656, "global_step": 41319, "epoch": 245} {"train_loss": -7.882798194885254, "global_step": 41320, "epoch": 245} {"train_loss": -7.886431694030762, "global_step": 41321, "epoch": 245} {"train_loss": -8.010746002197266, "global_step": 41322, "epoch": 245} {"train_loss": -7.93461275100708, "global_step": 41323, "epoch": 245} {"train_loss": -7.861163139343262, "global_step": 41324, "epoch": 245} {"train_loss": -8.027458190917969, "global_step": 41325, "epoch": 245} {"train_loss": -8.2474365234375, "global_step": 41326, "epoch": 245} {"train_loss": -7.935975364276341, "global_step": 41327, "epoch": 245, "val_loss": 184955.65625, "train_action_mse_error": 11.9750394821167} {"train_loss": -7.941349983215332, "global_step": 41328, "epoch": 246} {"train_loss": -8.153400421142578, "global_step": 41329, "epoch": 246} {"train_loss": -8.121580123901367, "global_step": 41330, "epoch": 246} {"train_loss": -8.075298309326172, "global_step": 41331, "epoch": 246} {"train_loss": -7.943607330322266, "global_step": 41332, "epoch": 246} {"train_loss": -8.085443496704102, "global_step": 41333, "epoch": 246} {"train_loss": -8.20212459564209, "global_step": 41334, "epoch": 246} {"train_loss": -8.08041763305664, "global_step": 41335, "epoch": 246} {"train_loss": -7.964115619659424, "global_step": 41336, "epoch": 246} {"train_loss": -7.849666595458984, "global_step": 41337, "epoch": 246} {"train_loss": -7.969155788421631, "global_step": 41338, "epoch": 246} {"train_loss": -7.897290229797363, "global_step": 41339, "epoch": 246} {"train_loss": -7.969614505767822, "global_step": 41340, "epoch": 246} {"train_loss": -7.985397815704346, "global_step": 41341, "epoch": 246} {"train_loss": -8.086377143859863, "global_step": 41342, "epoch": 246} {"train_loss": -8.117757797241211, "global_step": 41343, "epoch": 246} {"train_loss": -7.842076301574707, "global_step": 41344, "epoch": 246} {"train_loss": -8.06084156036377, "global_step": 41345, "epoch": 246} {"train_loss": -7.943596363067627, "global_step": 41346, "epoch": 246} {"train_loss": -8.224531173706055, "global_step": 41347, "epoch": 246} {"train_loss": -7.926410675048828, "global_step": 41348, "epoch": 246} {"train_loss": -7.906808853149414, "global_step": 41349, "epoch": 246} {"train_loss": -7.9884538650512695, "global_step": 41350, "epoch": 246} {"train_loss": -8.177082061767578, "global_step": 41351, "epoch": 246} {"train_loss": -7.898530960083008, "global_step": 41352, "epoch": 246} {"train_loss": -7.87620735168457, "global_step": 41353, "epoch": 246} {"train_loss": -7.969181537628174, "global_step": 41354, "epoch": 246} {"train_loss": -7.904923915863037, "global_step": 41355, "epoch": 246} {"train_loss": -7.970138072967529, "global_step": 41356, "epoch": 246} {"train_loss": -8.00993537902832, "global_step": 41357, "epoch": 246} {"train_loss": -8.005287170410156, "global_step": 41358, "epoch": 246} {"train_loss": -8.06057357788086, "global_step": 41359, "epoch": 246} {"train_loss": -7.931491851806641, "global_step": 41360, "epoch": 246} {"train_loss": -8.06109619140625, "global_step": 41361, "epoch": 246} {"train_loss": -8.063105583190918, "global_step": 41362, "epoch": 246} {"train_loss": -7.860144138336182, "global_step": 41363, "epoch": 246} {"train_loss": -8.091439247131348, "global_step": 41364, "epoch": 246} {"train_loss": -7.931763648986816, "global_step": 41365, "epoch": 246} {"train_loss": -8.247650146484375, "global_step": 41366, "epoch": 246} {"train_loss": -7.915709495544434, "global_step": 41367, "epoch": 246} {"train_loss": -8.021310806274414, "global_step": 41368, "epoch": 246} {"train_loss": -7.958734512329102, "global_step": 41369, "epoch": 246} {"train_loss": -8.167865753173828, "global_step": 41370, "epoch": 246} {"train_loss": -7.8143229484558105, "global_step": 41371, "epoch": 246} {"train_loss": -7.973771572113037, "global_step": 41372, "epoch": 246} {"train_loss": -7.760030269622803, "global_step": 41373, "epoch": 246} {"train_loss": -7.969941139221191, "global_step": 41374, "epoch": 246} {"train_loss": -7.970699310302734, "global_step": 41375, "epoch": 246} {"train_loss": -7.717477798461914, "global_step": 41376, "epoch": 246} {"train_loss": -7.875176906585693, "global_step": 41377, "epoch": 246} {"train_loss": -7.836766719818115, "global_step": 41378, "epoch": 246} {"train_loss": -7.946460247039795, "global_step": 41379, "epoch": 246} {"train_loss": -8.012939453125, "global_step": 41380, "epoch": 246} {"train_loss": -7.832358360290527, "global_step": 41381, "epoch": 246} {"train_loss": -7.896106719970703, "global_step": 41382, "epoch": 246} {"train_loss": -7.847722053527832, "global_step": 41383, "epoch": 246} {"train_loss": -8.277898788452148, "global_step": 41384, "epoch": 246} {"train_loss": -7.82883358001709, "global_step": 41385, "epoch": 246} {"train_loss": -8.017577171325684, "global_step": 41386, "epoch": 246} {"train_loss": -8.094108581542969, "global_step": 41387, "epoch": 246} {"train_loss": -8.209112167358398, "global_step": 41388, "epoch": 246} {"train_loss": -7.963156700134277, "global_step": 41389, "epoch": 246} {"train_loss": -8.14133071899414, "global_step": 41390, "epoch": 246} {"train_loss": -8.104530334472656, "global_step": 41391, "epoch": 246} {"train_loss": -8.125486373901367, "global_step": 41392, "epoch": 246} {"train_loss": -8.16226577758789, "global_step": 41393, "epoch": 246} {"train_loss": -8.068536758422852, "global_step": 41394, "epoch": 246} {"train_loss": -7.9760942459106445, "global_step": 41395, "epoch": 246} {"train_loss": -7.873719215393066, "global_step": 41396, "epoch": 246} {"train_loss": -7.967528343200684, "global_step": 41397, "epoch": 246} {"train_loss": -8.36291217803955, "global_step": 41398, "epoch": 246} {"train_loss": -8.039979934692383, "global_step": 41399, "epoch": 246} {"train_loss": -7.879857063293457, "global_step": 41400, "epoch": 246} {"train_loss": -8.046775817871094, "global_step": 41401, "epoch": 246} {"train_loss": -8.264078140258789, "global_step": 41402, "epoch": 246} {"train_loss": -8.150882720947266, "global_step": 41403, "epoch": 246} {"train_loss": -8.253556251525879, "global_step": 41404, "epoch": 246} {"train_loss": -8.259653091430664, "global_step": 41405, "epoch": 246} {"train_loss": -8.134721755981445, "global_step": 41406, "epoch": 246} {"train_loss": -8.137432098388672, "global_step": 41407, "epoch": 246} {"train_loss": -8.316673278808594, "global_step": 41408, "epoch": 246} {"train_loss": -8.319591522216797, "global_step": 41409, "epoch": 246} {"train_loss": -8.052734375, "global_step": 41410, "epoch": 246} {"train_loss": -8.02347183227539, "global_step": 41411, "epoch": 246} {"train_loss": -8.215503692626953, "global_step": 41412, "epoch": 246} {"train_loss": -8.078744888305664, "global_step": 41413, "epoch": 246} {"train_loss": -8.23624038696289, "global_step": 41414, "epoch": 246} {"train_loss": -8.251903533935547, "global_step": 41415, "epoch": 246} {"train_loss": -7.899115085601807, "global_step": 41416, "epoch": 246} {"train_loss": -8.077594757080078, "global_step": 41417, "epoch": 246} {"train_loss": -8.04210090637207, "global_step": 41418, "epoch": 246} {"train_loss": -7.510804176330566, "global_step": 41419, "epoch": 246} {"train_loss": -8.02564811706543, "global_step": 41420, "epoch": 246} {"train_loss": -7.788455009460449, "global_step": 41421, "epoch": 246} {"train_loss": -7.719481945037842, "global_step": 41422, "epoch": 246} {"train_loss": -7.615518093109131, "global_step": 41423, "epoch": 246} {"train_loss": -7.776637077331543, "global_step": 41424, "epoch": 246} {"train_loss": -7.851895809173584, "global_step": 41425, "epoch": 246} {"train_loss": -7.894530296325684, "global_step": 41426, "epoch": 246} {"train_loss": -7.473883628845215, "global_step": 41427, "epoch": 246} {"train_loss": -7.633052825927734, "global_step": 41428, "epoch": 246} {"train_loss": -7.767848491668701, "global_step": 41429, "epoch": 246} {"train_loss": -7.6349639892578125, "global_step": 41430, "epoch": 246} {"train_loss": -7.764675140380859, "global_step": 41431, "epoch": 246} {"train_loss": -7.9522905349731445, "global_step": 41432, "epoch": 246} {"train_loss": -7.945430278778076, "global_step": 41433, "epoch": 246} {"train_loss": -7.775241374969482, "global_step": 41434, "epoch": 246} {"train_loss": -7.846790790557861, "global_step": 41435, "epoch": 246} {"train_loss": -8.004880905151367, "global_step": 41436, "epoch": 246} {"train_loss": -7.939013481140137, "global_step": 41437, "epoch": 246} {"train_loss": -7.836469650268555, "global_step": 41438, "epoch": 246} {"train_loss": -7.9167585372924805, "global_step": 41439, "epoch": 246} {"train_loss": -7.899127006530762, "global_step": 41440, "epoch": 246} {"train_loss": -7.611688613891602, "global_step": 41441, "epoch": 246} {"train_loss": -7.795957565307617, "global_step": 41442, "epoch": 246} {"train_loss": -7.87827205657959, "global_step": 41443, "epoch": 246} {"train_loss": -7.860065460205078, "global_step": 41444, "epoch": 246} {"train_loss": -8.012127876281738, "global_step": 41445, "epoch": 246} {"train_loss": -7.747119903564453, "global_step": 41446, "epoch": 246} {"train_loss": -8.040435791015625, "global_step": 41447, "epoch": 246} {"train_loss": -7.670246124267578, "global_step": 41448, "epoch": 246} {"train_loss": -7.862998008728027, "global_step": 41449, "epoch": 246} {"train_loss": -7.826475143432617, "global_step": 41450, "epoch": 246} {"train_loss": -7.652036666870117, "global_step": 41451, "epoch": 246} {"train_loss": -8.110895156860352, "global_step": 41452, "epoch": 246} {"train_loss": -7.784460067749023, "global_step": 41453, "epoch": 246} {"train_loss": -8.027259826660156, "global_step": 41454, "epoch": 246} {"train_loss": -7.814587116241455, "global_step": 41455, "epoch": 246} {"train_loss": -8.077792167663574, "global_step": 41456, "epoch": 246} {"train_loss": -7.8194427490234375, "global_step": 41457, "epoch": 246} {"train_loss": -8.299527168273926, "global_step": 41458, "epoch": 246} {"train_loss": -7.897054672241211, "global_step": 41459, "epoch": 246} {"train_loss": -8.026728630065918, "global_step": 41460, "epoch": 246} {"train_loss": -8.072792053222656, "global_step": 41461, "epoch": 246} {"train_loss": -7.954871654510498, "global_step": 41462, "epoch": 246} {"train_loss": -8.047134399414062, "global_step": 41463, "epoch": 246} {"train_loss": -8.226787567138672, "global_step": 41464, "epoch": 246} {"train_loss": -7.93814754486084, "global_step": 41465, "epoch": 246} {"train_loss": -8.023065567016602, "global_step": 41466, "epoch": 246} {"train_loss": -8.057629585266113, "global_step": 41467, "epoch": 246} {"train_loss": -8.11358642578125, "global_step": 41468, "epoch": 246} {"train_loss": -7.840325355529785, "global_step": 41469, "epoch": 246} {"train_loss": -8.058185577392578, "global_step": 41470, "epoch": 246} {"train_loss": -7.937300682067871, "global_step": 41471, "epoch": 246} {"train_loss": -7.907665252685547, "global_step": 41472, "epoch": 246} {"train_loss": -7.954197883605957, "global_step": 41473, "epoch": 246} {"train_loss": -8.182689666748047, "global_step": 41474, "epoch": 246} {"train_loss": -8.096266746520996, "global_step": 41475, "epoch": 246} {"train_loss": -7.876081466674805, "global_step": 41476, "epoch": 246} {"train_loss": -7.851103782653809, "global_step": 41477, "epoch": 246} {"train_loss": -8.021795272827148, "global_step": 41478, "epoch": 246} {"train_loss": -8.106698036193848, "global_step": 41479, "epoch": 246} {"train_loss": -7.747170925140381, "global_step": 41480, "epoch": 246} {"train_loss": -7.9871368408203125, "global_step": 41481, "epoch": 246} {"train_loss": -7.821184158325195, "global_step": 41482, "epoch": 246} {"train_loss": -8.259089469909668, "global_step": 41483, "epoch": 246} {"train_loss": -8.089101791381836, "global_step": 41484, "epoch": 246} {"train_loss": -7.835892677307129, "global_step": 41485, "epoch": 246} {"train_loss": -7.857641220092773, "global_step": 41486, "epoch": 246} {"train_loss": -7.927165985107422, "global_step": 41487, "epoch": 246} {"train_loss": -7.935745716094971, "global_step": 41488, "epoch": 246} {"train_loss": -8.083407402038574, "global_step": 41489, "epoch": 246} {"train_loss": -8.07861328125, "global_step": 41490, "epoch": 246} {"train_loss": -7.970771312713623, "global_step": 41491, "epoch": 246} {"train_loss": -8.099069595336914, "global_step": 41492, "epoch": 246} {"train_loss": -7.937814712524414, "global_step": 41493, "epoch": 246} {"train_loss": -7.86674690246582, "global_step": 41494, "epoch": 246} {"train_loss": -7.975366339797065, "global_step": 41495, "epoch": 246, "val_loss": 184736.03125} {"train_loss": -7.983422756195068, "global_step": 41496, "epoch": 247} {"train_loss": -7.8002238273620605, "global_step": 41497, "epoch": 247} {"train_loss": -8.233622550964355, "global_step": 41498, "epoch": 247} {"train_loss": -7.906685829162598, "global_step": 41499, "epoch": 247} {"train_loss": -7.882503032684326, "global_step": 41500, "epoch": 247} {"train_loss": -7.781105995178223, "global_step": 41501, "epoch": 247} {"train_loss": -7.751216411590576, "global_step": 41502, "epoch": 247} {"train_loss": -7.854053497314453, "global_step": 41503, "epoch": 247} {"train_loss": -7.995636940002441, "global_step": 41504, "epoch": 247} {"train_loss": -7.792629241943359, "global_step": 41505, "epoch": 247} {"train_loss": -7.984560012817383, "global_step": 41506, "epoch": 247} {"train_loss": -7.830635070800781, "global_step": 41507, "epoch": 247} {"train_loss": -7.71870756149292, "global_step": 41508, "epoch": 247} {"train_loss": -7.905978679656982, "global_step": 41509, "epoch": 247} {"train_loss": -7.878591537475586, "global_step": 41510, "epoch": 247} {"train_loss": -7.889259338378906, "global_step": 41511, "epoch": 247} {"train_loss": -7.873333930969238, "global_step": 41512, "epoch": 247} {"train_loss": -7.937507629394531, "global_step": 41513, "epoch": 247} {"train_loss": -8.091278076171875, "global_step": 41514, "epoch": 247} {"train_loss": -8.125310897827148, "global_step": 41515, "epoch": 247} {"train_loss": -8.121044158935547, "global_step": 41516, "epoch": 247} {"train_loss": -8.279526710510254, "global_step": 41517, "epoch": 247} {"train_loss": -8.208670616149902, "global_step": 41518, "epoch": 247} {"train_loss": -8.134918212890625, "global_step": 41519, "epoch": 247} {"train_loss": -8.050539016723633, "global_step": 41520, "epoch": 247} {"train_loss": -7.976365089416504, "global_step": 41521, "epoch": 247} {"train_loss": -8.24815845489502, "global_step": 41522, "epoch": 247} {"train_loss": -8.263214111328125, "global_step": 41523, "epoch": 247} {"train_loss": -8.169312477111816, "global_step": 41524, "epoch": 247} {"train_loss": -7.909665584564209, "global_step": 41525, "epoch": 247} {"train_loss": -8.156837463378906, "global_step": 41526, "epoch": 247} {"train_loss": -7.946063041687012, "global_step": 41527, "epoch": 247} {"train_loss": -8.221031188964844, "global_step": 41528, "epoch": 247} {"train_loss": -7.821457862854004, "global_step": 41529, "epoch": 247} {"train_loss": -8.243955612182617, "global_step": 41530, "epoch": 247} {"train_loss": -7.543149948120117, "global_step": 41531, "epoch": 247} {"train_loss": -8.042597770690918, "global_step": 41532, "epoch": 247} {"train_loss": -7.822576999664307, "global_step": 41533, "epoch": 247} {"train_loss": -7.884586334228516, "global_step": 41534, "epoch": 247} {"train_loss": -8.04937744140625, "global_step": 41535, "epoch": 247} {"train_loss": -8.103981018066406, "global_step": 41536, "epoch": 247} {"train_loss": -7.911008358001709, "global_step": 41537, "epoch": 247} {"train_loss": -7.991210460662842, "global_step": 41538, "epoch": 247} {"train_loss": -8.146448135375977, "global_step": 41539, "epoch": 247} {"train_loss": -7.962632179260254, "global_step": 41540, "epoch": 247} {"train_loss": -7.7482500076293945, "global_step": 41541, "epoch": 247} {"train_loss": -8.173455238342285, "global_step": 41542, "epoch": 247} {"train_loss": -7.7844014167785645, "global_step": 41543, "epoch": 247} {"train_loss": -7.870391845703125, "global_step": 41544, "epoch": 247} {"train_loss": -8.110631942749023, "global_step": 41545, "epoch": 247} {"train_loss": -7.770581245422363, "global_step": 41546, "epoch": 247} {"train_loss": -8.036710739135742, "global_step": 41547, "epoch": 247} {"train_loss": -7.734971523284912, "global_step": 41548, "epoch": 247} {"train_loss": -7.752612113952637, "global_step": 41549, "epoch": 247} {"train_loss": -7.709974765777588, "global_step": 41550, "epoch": 247} {"train_loss": -7.937417984008789, "global_step": 41551, "epoch": 247} {"train_loss": -7.910888195037842, "global_step": 41552, "epoch": 247} {"train_loss": -8.088147163391113, "global_step": 41553, "epoch": 247} {"train_loss": -7.6353302001953125, "global_step": 41554, "epoch": 247} {"train_loss": -7.759134769439697, "global_step": 41555, "epoch": 247} {"train_loss": -7.905447959899902, "global_step": 41556, "epoch": 247} {"train_loss": -7.494695663452148, "global_step": 41557, "epoch": 247} {"train_loss": -7.86189079284668, "global_step": 41558, "epoch": 247} {"train_loss": -8.143030166625977, "global_step": 41559, "epoch": 247} {"train_loss": -7.833075046539307, "global_step": 41560, "epoch": 247} {"train_loss": -7.74013614654541, "global_step": 41561, "epoch": 247} {"train_loss": -8.179729461669922, "global_step": 41562, "epoch": 247} {"train_loss": -7.816223621368408, "global_step": 41563, "epoch": 247} {"train_loss": -7.911829948425293, "global_step": 41564, "epoch": 247} {"train_loss": -7.80217170715332, "global_step": 41565, "epoch": 247} {"train_loss": -8.101614952087402, "global_step": 41566, "epoch": 247} {"train_loss": -7.91700553894043, "global_step": 41567, "epoch": 247} {"train_loss": -8.159379959106445, "global_step": 41568, "epoch": 247} {"train_loss": -8.162020683288574, "global_step": 41569, "epoch": 247} {"train_loss": -8.162668228149414, "global_step": 41570, "epoch": 247} {"train_loss": -8.125014305114746, "global_step": 41571, "epoch": 247} {"train_loss": -8.060285568237305, "global_step": 41572, "epoch": 247} {"train_loss": -8.25625228881836, "global_step": 41573, "epoch": 247} {"train_loss": -7.867074012756348, "global_step": 41574, "epoch": 247} {"train_loss": -7.988561153411865, "global_step": 41575, "epoch": 247} {"train_loss": -7.9201436042785645, "global_step": 41576, "epoch": 247} {"train_loss": -8.078039169311523, "global_step": 41577, "epoch": 247} {"train_loss": -7.960336685180664, "global_step": 41578, "epoch": 247} {"train_loss": -8.128665924072266, "global_step": 41579, "epoch": 247} {"train_loss": -8.07247543334961, "global_step": 41580, "epoch": 247} {"train_loss": -8.007364273071289, "global_step": 41581, "epoch": 247} {"train_loss": -7.865808486938477, "global_step": 41582, "epoch": 247} {"train_loss": -8.083455085754395, "global_step": 41583, "epoch": 247} {"train_loss": -8.126497268676758, "global_step": 41584, "epoch": 247} {"train_loss": -8.16756820678711, "global_step": 41585, "epoch": 247} {"train_loss": -8.063254356384277, "global_step": 41586, "epoch": 247} {"train_loss": -8.355599403381348, "global_step": 41587, "epoch": 247} {"train_loss": -8.10209846496582, "global_step": 41588, "epoch": 247} {"train_loss": -8.051987648010254, "global_step": 41589, "epoch": 247} {"train_loss": -8.056295394897461, "global_step": 41590, "epoch": 247} {"train_loss": -8.078777313232422, "global_step": 41591, "epoch": 247} {"train_loss": -8.0635347366333, "global_step": 41592, "epoch": 247} {"train_loss": -7.92123556137085, "global_step": 41593, "epoch": 247} {"train_loss": -7.7728800773620605, "global_step": 41594, "epoch": 247} {"train_loss": -8.152327537536621, "global_step": 41595, "epoch": 247} {"train_loss": -7.994582176208496, "global_step": 41596, "epoch": 247} {"train_loss": -7.85996150970459, "global_step": 41597, "epoch": 247} {"train_loss": -8.048370361328125, "global_step": 41598, "epoch": 247} {"train_loss": -8.191971778869629, "global_step": 41599, "epoch": 247} {"train_loss": -7.925966262817383, "global_step": 41600, "epoch": 247} {"train_loss": -8.082930564880371, "global_step": 41601, "epoch": 247} {"train_loss": -7.862405300140381, "global_step": 41602, "epoch": 247} {"train_loss": -8.062480926513672, "global_step": 41603, "epoch": 247} {"train_loss": -8.03510856628418, "global_step": 41604, "epoch": 247} {"train_loss": -8.007461547851562, "global_step": 41605, "epoch": 247} {"train_loss": -7.839519500732422, "global_step": 41606, "epoch": 247} {"train_loss": -7.965839862823486, "global_step": 41607, "epoch": 247} {"train_loss": -7.99860954284668, "global_step": 41608, "epoch": 247} {"train_loss": -8.155816078186035, "global_step": 41609, "epoch": 247} {"train_loss": -7.82395076751709, "global_step": 41610, "epoch": 247} {"train_loss": -8.100648880004883, "global_step": 41611, "epoch": 247} {"train_loss": -8.083686828613281, "global_step": 41612, "epoch": 247} {"train_loss": -8.043128967285156, "global_step": 41613, "epoch": 247} {"train_loss": -7.712949752807617, "global_step": 41614, "epoch": 247} {"train_loss": -7.841854572296143, "global_step": 41615, "epoch": 247} {"train_loss": -7.948349475860596, "global_step": 41616, "epoch": 247} {"train_loss": -7.759409427642822, "global_step": 41617, "epoch": 247} {"train_loss": -8.175735473632812, "global_step": 41618, "epoch": 247} {"train_loss": -7.904557228088379, "global_step": 41619, "epoch": 247} {"train_loss": -7.947245121002197, "global_step": 41620, "epoch": 247} {"train_loss": -7.789442539215088, "global_step": 41621, "epoch": 247} {"train_loss": -7.987844944000244, "global_step": 41622, "epoch": 247} {"train_loss": -7.739856719970703, "global_step": 41623, "epoch": 247} {"train_loss": -8.064311981201172, "global_step": 41624, "epoch": 247} {"train_loss": -7.996374130249023, "global_step": 41625, "epoch": 247} {"train_loss": -8.210055351257324, "global_step": 41626, "epoch": 247} {"train_loss": -8.003089904785156, "global_step": 41627, "epoch": 247} {"train_loss": -8.155182838439941, "global_step": 41628, "epoch": 247} {"train_loss": -7.756213665008545, "global_step": 41629, "epoch": 247} {"train_loss": -7.9773054122924805, "global_step": 41630, "epoch": 247} {"train_loss": -8.146217346191406, "global_step": 41631, "epoch": 247} {"train_loss": -7.942404747009277, "global_step": 41632, "epoch": 247} {"train_loss": -8.13758373260498, "global_step": 41633, "epoch": 247} {"train_loss": -8.306100845336914, "global_step": 41634, "epoch": 247} {"train_loss": -8.153039932250977, "global_step": 41635, "epoch": 247} {"train_loss": -8.090511322021484, "global_step": 41636, "epoch": 247} {"train_loss": -8.245282173156738, "global_step": 41637, "epoch": 247} {"train_loss": -8.023600578308105, "global_step": 41638, "epoch": 247} {"train_loss": -8.30390739440918, "global_step": 41639, "epoch": 247} {"train_loss": -8.339879989624023, "global_step": 41640, "epoch": 247} {"train_loss": -8.23063850402832, "global_step": 41641, "epoch": 247} {"train_loss": -7.96144437789917, "global_step": 41642, "epoch": 247} {"train_loss": -8.24398422241211, "global_step": 41643, "epoch": 247} {"train_loss": -8.13101863861084, "global_step": 41644, "epoch": 247} {"train_loss": -8.146442413330078, "global_step": 41645, "epoch": 247} {"train_loss": -7.997132301330566, "global_step": 41646, "epoch": 247} {"train_loss": -8.001015663146973, "global_step": 41647, "epoch": 247} {"train_loss": -7.996510982513428, "global_step": 41648, "epoch": 247} {"train_loss": -8.141766548156738, "global_step": 41649, "epoch": 247} {"train_loss": -7.990494728088379, "global_step": 41650, "epoch": 247} {"train_loss": -7.841007232666016, "global_step": 41651, "epoch": 247} {"train_loss": -7.851067543029785, "global_step": 41652, "epoch": 247} {"train_loss": -8.024441719055176, "global_step": 41653, "epoch": 247} {"train_loss": -8.04574203491211, "global_step": 41654, "epoch": 247} {"train_loss": -7.828159809112549, "global_step": 41655, "epoch": 247} {"train_loss": -8.181640625, "global_step": 41656, "epoch": 247} {"train_loss": -7.845885276794434, "global_step": 41657, "epoch": 247} {"train_loss": -7.942161560058594, "global_step": 41658, "epoch": 247} {"train_loss": -7.837188243865967, "global_step": 41659, "epoch": 247} {"train_loss": -8.256256103515625, "global_step": 41660, "epoch": 247} {"train_loss": -8.122159957885742, "global_step": 41661, "epoch": 247} {"train_loss": -7.925241947174072, "global_step": 41662, "epoch": 247} {"train_loss": -7.99394336768559, "global_step": 41663, "epoch": 247, "val_loss": 184564.171875} {"train_loss": -8.017019271850586, "global_step": 41664, "epoch": 248} {"train_loss": -7.68985652923584, "global_step": 41665, "epoch": 248} {"train_loss": -8.126477241516113, "global_step": 41666, "epoch": 248} {"train_loss": -8.03104019165039, "global_step": 41667, "epoch": 248} {"train_loss": -7.84907341003418, "global_step": 41668, "epoch": 248} {"train_loss": -7.752647399902344, "global_step": 41669, "epoch": 248} {"train_loss": -7.7560930252075195, "global_step": 41670, "epoch": 248} {"train_loss": -7.61345100402832, "global_step": 41671, "epoch": 248} {"train_loss": -7.742830276489258, "global_step": 41672, "epoch": 248} {"train_loss": -8.083266258239746, "global_step": 41673, "epoch": 248} {"train_loss": -8.02862548828125, "global_step": 41674, "epoch": 248} {"train_loss": -8.0462646484375, "global_step": 41675, "epoch": 248} {"train_loss": -7.771200180053711, "global_step": 41676, "epoch": 248} {"train_loss": -7.823853969573975, "global_step": 41677, "epoch": 248} {"train_loss": -7.896592140197754, "global_step": 41678, "epoch": 248} {"train_loss": -8.154597282409668, "global_step": 41679, "epoch": 248} {"train_loss": -7.973024368286133, "global_step": 41680, "epoch": 248} {"train_loss": -8.101959228515625, "global_step": 41681, "epoch": 248} {"train_loss": -8.037371635437012, "global_step": 41682, "epoch": 248} {"train_loss": -7.96480131149292, "global_step": 41683, "epoch": 248} {"train_loss": -7.692167282104492, "global_step": 41684, "epoch": 248} {"train_loss": -7.842006683349609, "global_step": 41685, "epoch": 248} {"train_loss": -8.035581588745117, "global_step": 41686, "epoch": 248} {"train_loss": -7.781701564788818, "global_step": 41687, "epoch": 248} {"train_loss": -7.875317573547363, "global_step": 41688, "epoch": 248} {"train_loss": -7.486958026885986, "global_step": 41689, "epoch": 248} {"train_loss": -7.844884872436523, "global_step": 41690, "epoch": 248} {"train_loss": -7.810276031494141, "global_step": 41691, "epoch": 248} {"train_loss": -7.953287124633789, "global_step": 41692, "epoch": 248} {"train_loss": -8.0892915725708, "global_step": 41693, "epoch": 248} {"train_loss": -7.855166912078857, "global_step": 41694, "epoch": 248} {"train_loss": -7.733310699462891, "global_step": 41695, "epoch": 248} {"train_loss": -8.10263729095459, "global_step": 41696, "epoch": 248} {"train_loss": -8.027837753295898, "global_step": 41697, "epoch": 248} {"train_loss": -8.04074764251709, "global_step": 41698, "epoch": 248} {"train_loss": -7.9799065589904785, "global_step": 41699, "epoch": 248} {"train_loss": -7.97168493270874, "global_step": 41700, "epoch": 248} {"train_loss": -8.106138229370117, "global_step": 41701, "epoch": 248} {"train_loss": -8.182345390319824, "global_step": 41702, "epoch": 248} {"train_loss": -8.070202827453613, "global_step": 41703, "epoch": 248} {"train_loss": -8.021644592285156, "global_step": 41704, "epoch": 248} {"train_loss": -7.988828659057617, "global_step": 41705, "epoch": 248} {"train_loss": -7.753214359283447, "global_step": 41706, "epoch": 248} {"train_loss": -8.143045425415039, "global_step": 41707, "epoch": 248} {"train_loss": -8.075889587402344, "global_step": 41708, "epoch": 248} {"train_loss": -8.109890937805176, "global_step": 41709, "epoch": 248} {"train_loss": -8.083282470703125, "global_step": 41710, "epoch": 248} {"train_loss": -8.016314506530762, "global_step": 41711, "epoch": 248} {"train_loss": -8.243526458740234, "global_step": 41712, "epoch": 248} {"train_loss": -8.170608520507812, "global_step": 41713, "epoch": 248} {"train_loss": -8.101106643676758, "global_step": 41714, "epoch": 248} {"train_loss": -8.098898887634277, "global_step": 41715, "epoch": 248} {"train_loss": -8.01099967956543, "global_step": 41716, "epoch": 248} {"train_loss": -8.07868766784668, "global_step": 41717, "epoch": 248} {"train_loss": -8.213578224182129, "global_step": 41718, "epoch": 248} {"train_loss": -8.09231185913086, "global_step": 41719, "epoch": 248} {"train_loss": -8.308455467224121, "global_step": 41720, "epoch": 248} {"train_loss": -8.08999252319336, "global_step": 41721, "epoch": 248} {"train_loss": -8.003615379333496, "global_step": 41722, "epoch": 248} {"train_loss": -8.117082595825195, "global_step": 41723, "epoch": 248} {"train_loss": -8.161022186279297, "global_step": 41724, "epoch": 248} {"train_loss": -8.043193817138672, "global_step": 41725, "epoch": 248} {"train_loss": -8.206670761108398, "global_step": 41726, "epoch": 248} {"train_loss": -8.094039916992188, "global_step": 41727, "epoch": 248} {"train_loss": -7.8919525146484375, "global_step": 41728, "epoch": 248} {"train_loss": -7.855685234069824, "global_step": 41729, "epoch": 248} {"train_loss": -7.925365447998047, "global_step": 41730, "epoch": 248} {"train_loss": -7.702822685241699, "global_step": 41731, "epoch": 248} {"train_loss": -7.901712894439697, "global_step": 41732, "epoch": 248} {"train_loss": -7.553784370422363, "global_step": 41733, "epoch": 248} {"train_loss": -8.090497970581055, "global_step": 41734, "epoch": 248} {"train_loss": -7.822697639465332, "global_step": 41735, "epoch": 248} {"train_loss": -7.829087257385254, "global_step": 41736, "epoch": 248} {"train_loss": -7.723658561706543, "global_step": 41737, "epoch": 248} {"train_loss": -7.662883758544922, "global_step": 41738, "epoch": 248} {"train_loss": -8.021514892578125, "global_step": 41739, "epoch": 248} {"train_loss": -7.804019927978516, "global_step": 41740, "epoch": 248} {"train_loss": -7.905086040496826, "global_step": 41741, "epoch": 248} {"train_loss": -7.784876823425293, "global_step": 41742, "epoch": 248} {"train_loss": -7.911618709564209, "global_step": 41743, "epoch": 248} {"train_loss": -7.488955020904541, "global_step": 41744, "epoch": 248} {"train_loss": -7.902987003326416, "global_step": 41745, "epoch": 248} {"train_loss": -8.003683090209961, "global_step": 41746, "epoch": 248} {"train_loss": -7.8040313720703125, "global_step": 41747, "epoch": 248} {"train_loss": -8.088274955749512, "global_step": 41748, "epoch": 248} {"train_loss": -7.992009162902832, "global_step": 41749, "epoch": 248} {"train_loss": -7.639157295227051, "global_step": 41750, "epoch": 248} {"train_loss": -8.014932632446289, "global_step": 41751, "epoch": 248} {"train_loss": -7.91572380065918, "global_step": 41752, "epoch": 248} {"train_loss": -7.7078633308410645, "global_step": 41753, "epoch": 248} {"train_loss": -7.866819381713867, "global_step": 41754, "epoch": 248} {"train_loss": -7.924612998962402, "global_step": 41755, "epoch": 248} {"train_loss": -7.887214183807373, "global_step": 41756, "epoch": 248} {"train_loss": -7.969249725341797, "global_step": 41757, "epoch": 248} {"train_loss": -8.078371047973633, "global_step": 41758, "epoch": 248} {"train_loss": -7.944803714752197, "global_step": 41759, "epoch": 248} {"train_loss": -8.069741249084473, "global_step": 41760, "epoch": 248} {"train_loss": -7.904715061187744, "global_step": 41761, "epoch": 248} {"train_loss": -7.941492080688477, "global_step": 41762, "epoch": 248} {"train_loss": -7.86450719833374, "global_step": 41763, "epoch": 248} {"train_loss": -8.035831451416016, "global_step": 41764, "epoch": 248} {"train_loss": -7.915600776672363, "global_step": 41765, "epoch": 248} {"train_loss": -7.901694297790527, "global_step": 41766, "epoch": 248} {"train_loss": -7.728816986083984, "global_step": 41767, "epoch": 248} {"train_loss": -8.031890869140625, "global_step": 41768, "epoch": 248} {"train_loss": -7.49615478515625, "global_step": 41769, "epoch": 248} {"train_loss": -7.8730316162109375, "global_step": 41770, "epoch": 248} {"train_loss": -7.656375885009766, "global_step": 41771, "epoch": 248} {"train_loss": -7.853543281555176, "global_step": 41772, "epoch": 248} {"train_loss": -7.939384460449219, "global_step": 41773, "epoch": 248} {"train_loss": -7.678602695465088, "global_step": 41774, "epoch": 248} {"train_loss": -8.008062362670898, "global_step": 41775, "epoch": 248} {"train_loss": -7.854868412017822, "global_step": 41776, "epoch": 248} {"train_loss": -8.089790344238281, "global_step": 41777, "epoch": 248} {"train_loss": -7.977784156799316, "global_step": 41778, "epoch": 248} {"train_loss": -7.8926849365234375, "global_step": 41779, "epoch": 248} {"train_loss": -7.731821537017822, "global_step": 41780, "epoch": 248} {"train_loss": -7.796226978302002, "global_step": 41781, "epoch": 248} {"train_loss": -7.973791599273682, "global_step": 41782, "epoch": 248} {"train_loss": -7.935288906097412, "global_step": 41783, "epoch": 248} {"train_loss": -7.890194416046143, "global_step": 41784, "epoch": 248} {"train_loss": -8.033946990966797, "global_step": 41785, "epoch": 248} {"train_loss": -8.030648231506348, "global_step": 41786, "epoch": 248} {"train_loss": -8.001381874084473, "global_step": 41787, "epoch": 248} {"train_loss": -8.01266860961914, "global_step": 41788, "epoch": 248} {"train_loss": -7.7984619140625, "global_step": 41789, "epoch": 248} {"train_loss": -8.061328887939453, "global_step": 41790, "epoch": 248} {"train_loss": -8.236621856689453, "global_step": 41791, "epoch": 248} {"train_loss": -7.901212692260742, "global_step": 41792, "epoch": 248} {"train_loss": -8.044398307800293, "global_step": 41793, "epoch": 248} {"train_loss": -7.875850677490234, "global_step": 41794, "epoch": 248} {"train_loss": -8.016752243041992, "global_step": 41795, "epoch": 248} {"train_loss": -7.962772369384766, "global_step": 41796, "epoch": 248} {"train_loss": -8.2631196975708, "global_step": 41797, "epoch": 248} {"train_loss": -8.109491348266602, "global_step": 41798, "epoch": 248} {"train_loss": -8.007930755615234, "global_step": 41799, "epoch": 248} {"train_loss": -7.960877418518066, "global_step": 41800, "epoch": 248} {"train_loss": -8.091255187988281, "global_step": 41801, "epoch": 248} {"train_loss": -7.718267440795898, "global_step": 41802, "epoch": 248} {"train_loss": -8.116945266723633, "global_step": 41803, "epoch": 248} {"train_loss": -7.879681587219238, "global_step": 41804, "epoch": 248} {"train_loss": -7.9238996505737305, "global_step": 41805, "epoch": 248} {"train_loss": -8.19041633605957, "global_step": 41806, "epoch": 248} {"train_loss": -8.023494720458984, "global_step": 41807, "epoch": 248} {"train_loss": -7.974749565124512, "global_step": 41808, "epoch": 248} {"train_loss": -8.157114028930664, "global_step": 41809, "epoch": 248} {"train_loss": -7.954273223876953, "global_step": 41810, "epoch": 248} {"train_loss": -8.446959495544434, "global_step": 41811, "epoch": 248} {"train_loss": -7.998006343841553, "global_step": 41812, "epoch": 248} {"train_loss": -8.099730491638184, "global_step": 41813, "epoch": 248} {"train_loss": -8.140785217285156, "global_step": 41814, "epoch": 248} {"train_loss": -7.932534217834473, "global_step": 41815, "epoch": 248} {"train_loss": -8.072543144226074, "global_step": 41816, "epoch": 248} {"train_loss": -8.197714805603027, "global_step": 41817, "epoch": 248} {"train_loss": -7.8550615310668945, "global_step": 41818, "epoch": 248} {"train_loss": -7.885466575622559, "global_step": 41819, "epoch": 248} {"train_loss": -8.01367473602295, "global_step": 41820, "epoch": 248} {"train_loss": -7.804941177368164, "global_step": 41821, "epoch": 248} {"train_loss": -7.965699195861816, "global_step": 41822, "epoch": 248} {"train_loss": -7.992510795593262, "global_step": 41823, "epoch": 248} {"train_loss": -8.209653854370117, "global_step": 41824, "epoch": 248} {"train_loss": -8.012274742126465, "global_step": 41825, "epoch": 248} {"train_loss": -8.105240821838379, "global_step": 41826, "epoch": 248} {"train_loss": -7.826127529144287, "global_step": 41827, "epoch": 248} {"train_loss": -7.902092933654785, "global_step": 41828, "epoch": 248} {"train_loss": -8.057722091674805, "global_step": 41829, "epoch": 248} {"train_loss": -8.137410163879395, "global_step": 41830, "epoch": 248} {"train_loss": -7.9568905262720016, "global_step": 41831, "epoch": 248, "val_loss": 182844.46875} {"train_loss": -7.973743438720703, "global_step": 41832, "epoch": 249} {"train_loss": -7.877828598022461, "global_step": 41833, "epoch": 249} {"train_loss": -7.914683818817139, "global_step": 41834, "epoch": 249} {"train_loss": -8.00942325592041, "global_step": 41835, "epoch": 249} {"train_loss": -8.14700984954834, "global_step": 41836, "epoch": 249} {"train_loss": -8.122283935546875, "global_step": 41837, "epoch": 249} {"train_loss": -8.044172286987305, "global_step": 41838, "epoch": 249} {"train_loss": -8.11895751953125, "global_step": 41839, "epoch": 249} {"train_loss": -7.873598575592041, "global_step": 41840, "epoch": 249} {"train_loss": -8.092496871948242, "global_step": 41841, "epoch": 249} {"train_loss": -7.638517379760742, "global_step": 41842, "epoch": 249} {"train_loss": -8.156097412109375, "global_step": 41843, "epoch": 249} {"train_loss": -8.177172660827637, "global_step": 41844, "epoch": 249} {"train_loss": -8.161279678344727, "global_step": 41845, "epoch": 249} {"train_loss": -8.098085403442383, "global_step": 41846, "epoch": 249} {"train_loss": -7.932476997375488, "global_step": 41847, "epoch": 249} {"train_loss": -8.153493881225586, "global_step": 41848, "epoch": 249} {"train_loss": -8.080360412597656, "global_step": 41849, "epoch": 249} {"train_loss": -8.196660041809082, "global_step": 41850, "epoch": 249} {"train_loss": -8.140572547912598, "global_step": 41851, "epoch": 249} {"train_loss": -8.23214340209961, "global_step": 41852, "epoch": 249} {"train_loss": -7.9865522384643555, "global_step": 41853, "epoch": 249} {"train_loss": -8.07927131652832, "global_step": 41854, "epoch": 249} {"train_loss": -8.156600952148438, "global_step": 41855, "epoch": 249} {"train_loss": -8.072416305541992, "global_step": 41856, "epoch": 249} {"train_loss": -8.018104553222656, "global_step": 41857, "epoch": 249} {"train_loss": -7.7296881675720215, "global_step": 41858, "epoch": 249} {"train_loss": -8.413877487182617, "global_step": 41859, "epoch": 249} {"train_loss": -7.994102478027344, "global_step": 41860, "epoch": 249} {"train_loss": -7.878866195678711, "global_step": 41861, "epoch": 249} {"train_loss": -7.870001316070557, "global_step": 41862, "epoch": 249} {"train_loss": -8.106714248657227, "global_step": 41863, "epoch": 249} {"train_loss": -7.946400165557861, "global_step": 41864, "epoch": 249} {"train_loss": -7.904329299926758, "global_step": 41865, "epoch": 249} {"train_loss": -8.056245803833008, "global_step": 41866, "epoch": 249} {"train_loss": -8.156341552734375, "global_step": 41867, "epoch": 249} {"train_loss": -8.048450469970703, "global_step": 41868, "epoch": 249} {"train_loss": -8.035802841186523, "global_step": 41869, "epoch": 249} {"train_loss": -7.93928337097168, "global_step": 41870, "epoch": 249} {"train_loss": -8.043469429016113, "global_step": 41871, "epoch": 249} {"train_loss": -7.856082916259766, "global_step": 41872, "epoch": 249} {"train_loss": -7.888101100921631, "global_step": 41873, "epoch": 249} {"train_loss": -7.853710651397705, "global_step": 41874, "epoch": 249} {"train_loss": -8.08049488067627, "global_step": 41875, "epoch": 249} {"train_loss": -7.633918762207031, "global_step": 41876, "epoch": 249} {"train_loss": -8.013100624084473, "global_step": 41877, "epoch": 249} {"train_loss": -7.91593599319458, "global_step": 41878, "epoch": 249} {"train_loss": -8.136970520019531, "global_step": 41879, "epoch": 249} {"train_loss": -8.095878601074219, "global_step": 41880, "epoch": 249} {"train_loss": -8.359508514404297, "global_step": 41881, "epoch": 249} {"train_loss": -8.203364372253418, "global_step": 41882, "epoch": 249} {"train_loss": -8.026130676269531, "global_step": 41883, "epoch": 249} {"train_loss": -7.987207412719727, "global_step": 41884, "epoch": 249} {"train_loss": -7.945126533508301, "global_step": 41885, "epoch": 249} {"train_loss": -8.018342018127441, "global_step": 41886, "epoch": 249} {"train_loss": -7.954009532928467, "global_step": 41887, "epoch": 249} {"train_loss": -8.03464126586914, "global_step": 41888, "epoch": 249} {"train_loss": -7.800686836242676, "global_step": 41889, "epoch": 249} {"train_loss": -8.018917083740234, "global_step": 41890, "epoch": 249} {"train_loss": -7.667468070983887, "global_step": 41891, "epoch": 249} {"train_loss": -7.924646377563477, "global_step": 41892, "epoch": 249} {"train_loss": -8.098823547363281, "global_step": 41893, "epoch": 249} {"train_loss": -7.865602016448975, "global_step": 41894, "epoch": 249} {"train_loss": -7.647310733795166, "global_step": 41895, "epoch": 249} {"train_loss": -7.948553085327148, "global_step": 41896, "epoch": 249} {"train_loss": -7.8257832527160645, "global_step": 41897, "epoch": 249} {"train_loss": -7.796327114105225, "global_step": 41898, "epoch": 249} {"train_loss": -8.11256217956543, "global_step": 41899, "epoch": 249} {"train_loss": -8.03439712524414, "global_step": 41900, "epoch": 249} {"train_loss": -8.020458221435547, "global_step": 41901, "epoch": 249} {"train_loss": -8.025039672851562, "global_step": 41902, "epoch": 249} {"train_loss": -7.947815895080566, "global_step": 41903, "epoch": 249} {"train_loss": -8.132743835449219, "global_step": 41904, "epoch": 249} {"train_loss": -8.008893966674805, "global_step": 41905, "epoch": 249} {"train_loss": -7.997382164001465, "global_step": 41906, "epoch": 249} {"train_loss": -7.964234352111816, "global_step": 41907, "epoch": 249} {"train_loss": -8.078451156616211, "global_step": 41908, "epoch": 249} {"train_loss": -7.949214458465576, "global_step": 41909, "epoch": 249} {"train_loss": -8.030696868896484, "global_step": 41910, "epoch": 249} {"train_loss": -7.948276519775391, "global_step": 41911, "epoch": 249} {"train_loss": -8.111971855163574, "global_step": 41912, "epoch": 249} {"train_loss": -7.838031768798828, "global_step": 41913, "epoch": 249} {"train_loss": -8.036699295043945, "global_step": 41914, "epoch": 249} {"train_loss": -8.023747444152832, "global_step": 41915, "epoch": 249} {"train_loss": -8.175294876098633, "global_step": 41916, "epoch": 249} {"train_loss": -7.978140354156494, "global_step": 41917, "epoch": 249} {"train_loss": -8.122758865356445, "global_step": 41918, "epoch": 249} {"train_loss": -8.163138389587402, "global_step": 41919, "epoch": 249} {"train_loss": -8.131036758422852, "global_step": 41920, "epoch": 249} {"train_loss": -8.0704984664917, "global_step": 41921, "epoch": 249} {"train_loss": -8.1993408203125, "global_step": 41922, "epoch": 249} {"train_loss": -8.237885475158691, "global_step": 41923, "epoch": 249} {"train_loss": -8.039438247680664, "global_step": 41924, "epoch": 249} {"train_loss": -8.325098037719727, "global_step": 41925, "epoch": 249} {"train_loss": -8.097382545471191, "global_step": 41926, "epoch": 249} {"train_loss": -8.355106353759766, "global_step": 41927, "epoch": 249} {"train_loss": -8.036718368530273, "global_step": 41928, "epoch": 249} {"train_loss": -8.108806610107422, "global_step": 41929, "epoch": 249} {"train_loss": -8.015457153320312, "global_step": 41930, "epoch": 249} {"train_loss": -8.298531532287598, "global_step": 41931, "epoch": 249} {"train_loss": -8.196731567382812, "global_step": 41932, "epoch": 249} {"train_loss": -8.021318435668945, "global_step": 41933, "epoch": 249} {"train_loss": -8.20628547668457, "global_step": 41934, "epoch": 249} {"train_loss": -8.262164115905762, "global_step": 41935, "epoch": 249} {"train_loss": -7.8550801277160645, "global_step": 41936, "epoch": 249} {"train_loss": -8.091079711914062, "global_step": 41937, "epoch": 249} {"train_loss": -8.166213989257812, "global_step": 41938, "epoch": 249} {"train_loss": -8.117729187011719, "global_step": 41939, "epoch": 249} {"train_loss": -8.291668891906738, "global_step": 41940, "epoch": 249} {"train_loss": -7.960836410522461, "global_step": 41941, "epoch": 249} {"train_loss": -7.956439018249512, "global_step": 41942, "epoch": 249} {"train_loss": -7.982205390930176, "global_step": 41943, "epoch": 249} {"train_loss": -7.956691741943359, "global_step": 41944, "epoch": 249} {"train_loss": -8.125974655151367, "global_step": 41945, "epoch": 249} {"train_loss": -8.087554931640625, "global_step": 41946, "epoch": 249} {"train_loss": -7.900540351867676, "global_step": 41947, "epoch": 249} {"train_loss": -7.914028167724609, "global_step": 41948, "epoch": 249} {"train_loss": -7.988260269165039, "global_step": 41949, "epoch": 249} {"train_loss": -7.961627960205078, "global_step": 41950, "epoch": 249} {"train_loss": -7.832433223724365, "global_step": 41951, "epoch": 249} {"train_loss": -8.080709457397461, "global_step": 41952, "epoch": 249} {"train_loss": -7.625826358795166, "global_step": 41953, "epoch": 249} {"train_loss": -7.825546741485596, "global_step": 41954, "epoch": 249} {"train_loss": -7.985883712768555, "global_step": 41955, "epoch": 249} {"train_loss": -7.978149890899658, "global_step": 41956, "epoch": 249} {"train_loss": -8.038457870483398, "global_step": 41957, "epoch": 249} {"train_loss": -7.700911521911621, "global_step": 41958, "epoch": 249} {"train_loss": -7.9236297607421875, "global_step": 41959, "epoch": 249} {"train_loss": -7.789022922515869, "global_step": 41960, "epoch": 249} {"train_loss": -7.786626815795898, "global_step": 41961, "epoch": 249} {"train_loss": -7.859282493591309, "global_step": 41962, "epoch": 249} {"train_loss": -7.960716247558594, "global_step": 41963, "epoch": 249} {"train_loss": -8.261148452758789, "global_step": 41964, "epoch": 249} {"train_loss": -7.857786178588867, "global_step": 41965, "epoch": 249} {"train_loss": -8.000740051269531, "global_step": 41966, "epoch": 249} {"train_loss": -8.042130470275879, "global_step": 41967, "epoch": 249} {"train_loss": -7.931880474090576, "global_step": 41968, "epoch": 249} {"train_loss": -7.895601272583008, "global_step": 41969, "epoch": 249} {"train_loss": -7.930643558502197, "global_step": 41970, "epoch": 249} {"train_loss": -7.888569355010986, "global_step": 41971, "epoch": 249} {"train_loss": -8.01141357421875, "global_step": 41972, "epoch": 249} {"train_loss": -8.187705039978027, "global_step": 41973, "epoch": 249} {"train_loss": -7.714066505432129, "global_step": 41974, "epoch": 249} {"train_loss": -8.015636444091797, "global_step": 41975, "epoch": 249} {"train_loss": -7.890734672546387, "global_step": 41976, "epoch": 249} {"train_loss": -8.077441215515137, "global_step": 41977, "epoch": 249} {"train_loss": -7.693544387817383, "global_step": 41978, "epoch": 249} {"train_loss": -8.061248779296875, "global_step": 41979, "epoch": 249} {"train_loss": -8.023656845092773, "global_step": 41980, "epoch": 249} {"train_loss": -7.98838472366333, "global_step": 41981, "epoch": 249} {"train_loss": -8.094048500061035, "global_step": 41982, "epoch": 249} {"train_loss": -8.027606964111328, "global_step": 41983, "epoch": 249} {"train_loss": -8.030314445495605, "global_step": 41984, "epoch": 249} {"train_loss": -7.785755634307861, "global_step": 41985, "epoch": 249} {"train_loss": -8.093318939208984, "global_step": 41986, "epoch": 249} {"train_loss": -8.189676284790039, "global_step": 41987, "epoch": 249} {"train_loss": -8.141456604003906, "global_step": 41988, "epoch": 249} {"train_loss": -8.087509155273438, "global_step": 41989, "epoch": 249} {"train_loss": -8.147974014282227, "global_step": 41990, "epoch": 249} {"train_loss": -8.05749225616455, "global_step": 41991, "epoch": 249} {"train_loss": -8.148950576782227, "global_step": 41992, "epoch": 249} {"train_loss": -7.988210678100586, "global_step": 41993, "epoch": 249} {"train_loss": -7.944209098815918, "global_step": 41994, "epoch": 249} {"train_loss": -8.16126537322998, "global_step": 41995, "epoch": 249} {"train_loss": -8.174966812133789, "global_step": 41996, "epoch": 249} {"train_loss": -8.088059425354004, "global_step": 41997, "epoch": 249} {"train_loss": -8.131604194641113, "global_step": 41998, "epoch": 249} {"train_loss": -8.01895100729806, "global_step": 41999, "epoch": 249, "val_loss": 182993.59375} {"train_loss": -8.275917053222656, "global_step": 42000, "epoch": 250} {"train_loss": -8.029215812683105, "global_step": 42001, "epoch": 250} {"train_loss": -8.244951248168945, "global_step": 42002, "epoch": 250} {"train_loss": -8.014070510864258, "global_step": 42003, "epoch": 250} {"train_loss": -8.479645729064941, "global_step": 42004, "epoch": 250} {"train_loss": -8.152288436889648, "global_step": 42005, "epoch": 250} {"train_loss": -8.059029579162598, "global_step": 42006, "epoch": 250} {"train_loss": -7.928412437438965, "global_step": 42007, "epoch": 250} {"train_loss": -8.077912330627441, "global_step": 42008, "epoch": 250} {"train_loss": -8.09976863861084, "global_step": 42009, "epoch": 250} {"train_loss": -8.046469688415527, "global_step": 42010, "epoch": 250} {"train_loss": -8.19252872467041, "global_step": 42011, "epoch": 250} {"train_loss": -8.10793685913086, "global_step": 42012, "epoch": 250} {"train_loss": -7.8993659019470215, "global_step": 42013, "epoch": 250} {"train_loss": -7.9838151931762695, "global_step": 42014, "epoch": 250} {"train_loss": -8.08802318572998, "global_step": 42015, "epoch": 250} {"train_loss": -8.080684661865234, "global_step": 42016, "epoch": 250} {"train_loss": -8.068059921264648, "global_step": 42017, "epoch": 250} {"train_loss": -8.119491577148438, "global_step": 42018, "epoch": 250} {"train_loss": -8.147157669067383, "global_step": 42019, "epoch": 250} {"train_loss": -7.973862648010254, "global_step": 42020, "epoch": 250} {"train_loss": -7.960418701171875, "global_step": 42021, "epoch": 250} {"train_loss": -8.106149673461914, "global_step": 42022, "epoch": 250} {"train_loss": -7.772916316986084, "global_step": 42023, "epoch": 250} {"train_loss": -8.18222713470459, "global_step": 42024, "epoch": 250} {"train_loss": -8.103919982910156, "global_step": 42025, "epoch": 250} {"train_loss": -7.921002388000488, "global_step": 42026, "epoch": 250} {"train_loss": -7.950638771057129, "global_step": 42027, "epoch": 250} {"train_loss": -7.9601569175720215, "global_step": 42028, "epoch": 250} {"train_loss": -8.095802307128906, "global_step": 42029, "epoch": 250} {"train_loss": -7.841998100280762, "global_step": 42030, "epoch": 250} {"train_loss": -8.105436325073242, "global_step": 42031, "epoch": 250} {"train_loss": -7.816291809082031, "global_step": 42032, "epoch": 250} {"train_loss": -7.9541826248168945, "global_step": 42033, "epoch": 250} {"train_loss": -8.204381942749023, "global_step": 42034, "epoch": 250} {"train_loss": -7.799612045288086, "global_step": 42035, "epoch": 250} {"train_loss": -8.101167678833008, "global_step": 42036, "epoch": 250} {"train_loss": -7.867341995239258, "global_step": 42037, "epoch": 250} {"train_loss": -8.086236953735352, "global_step": 42038, "epoch": 250} {"train_loss": -8.009498596191406, "global_step": 42039, "epoch": 250} {"train_loss": -8.191930770874023, "global_step": 42040, "epoch": 250} {"train_loss": -7.853479385375977, "global_step": 42041, "epoch": 250} {"train_loss": -8.144031524658203, "global_step": 42042, "epoch": 250} {"train_loss": -8.12397575378418, "global_step": 42043, "epoch": 250} {"train_loss": -8.053115844726562, "global_step": 42044, "epoch": 250} {"train_loss": -8.207099914550781, "global_step": 42045, "epoch": 250} {"train_loss": -8.004019737243652, "global_step": 42046, "epoch": 250} {"train_loss": -8.042830467224121, "global_step": 42047, "epoch": 250} {"train_loss": -8.09192180633545, "global_step": 42048, "epoch": 250} {"train_loss": -7.916082382202148, "global_step": 42049, "epoch": 250} {"train_loss": -8.258073806762695, "global_step": 42050, "epoch": 250} {"train_loss": -8.118961334228516, "global_step": 42051, "epoch": 250} {"train_loss": -8.106664657592773, "global_step": 42052, "epoch": 250} {"train_loss": -8.062044143676758, "global_step": 42053, "epoch": 250} {"train_loss": -7.960160255432129, "global_step": 42054, "epoch": 250} {"train_loss": -8.196929931640625, "global_step": 42055, "epoch": 250} {"train_loss": -8.169784545898438, "global_step": 42056, "epoch": 250} {"train_loss": -8.033255577087402, "global_step": 42057, "epoch": 250} {"train_loss": -8.001832962036133, "global_step": 42058, "epoch": 250} {"train_loss": -7.8299407958984375, "global_step": 42059, "epoch": 250} {"train_loss": -7.961145877838135, "global_step": 42060, "epoch": 250} {"train_loss": -7.85752534866333, "global_step": 42061, "epoch": 250} {"train_loss": -8.329151153564453, "global_step": 42062, "epoch": 250} {"train_loss": -7.948184490203857, "global_step": 42063, "epoch": 250} {"train_loss": -8.064425468444824, "global_step": 42064, "epoch": 250} {"train_loss": -8.30868148803711, "global_step": 42065, "epoch": 250} {"train_loss": -8.249669075012207, "global_step": 42066, "epoch": 250} {"train_loss": -7.944239616394043, "global_step": 42067, "epoch": 250} {"train_loss": -8.022053718566895, "global_step": 42068, "epoch": 250} {"train_loss": -8.182805061340332, "global_step": 42069, "epoch": 250} {"train_loss": -8.129350662231445, "global_step": 42070, "epoch": 250} {"train_loss": -7.992528915405273, "global_step": 42071, "epoch": 250} {"train_loss": -8.113946914672852, "global_step": 42072, "epoch": 250} {"train_loss": -8.074323654174805, "global_step": 42073, "epoch": 250} {"train_loss": -8.019064903259277, "global_step": 42074, "epoch": 250} {"train_loss": -7.99117374420166, "global_step": 42075, "epoch": 250} {"train_loss": -7.688330173492432, "global_step": 42076, "epoch": 250} {"train_loss": -7.922338485717773, "global_step": 42077, "epoch": 250} {"train_loss": -7.549120903015137, "global_step": 42078, "epoch": 250} {"train_loss": -7.612415790557861, "global_step": 42079, "epoch": 250} {"train_loss": -7.618841648101807, "global_step": 42080, "epoch": 250} {"train_loss": -7.570815086364746, "global_step": 42081, "epoch": 250} {"train_loss": -7.616641044616699, "global_step": 42082, "epoch": 250} {"train_loss": -7.489401817321777, "global_step": 42083, "epoch": 250} {"train_loss": -7.843686103820801, "global_step": 42084, "epoch": 250} {"train_loss": -7.495204925537109, "global_step": 42085, "epoch": 250} {"train_loss": -7.783107280731201, "global_step": 42086, "epoch": 250} {"train_loss": -7.955660343170166, "global_step": 42087, "epoch": 250} {"train_loss": -7.750953674316406, "global_step": 42088, "epoch": 250} {"train_loss": -7.794409275054932, "global_step": 42089, "epoch": 250} {"train_loss": -7.337429046630859, "global_step": 42090, "epoch": 250} {"train_loss": -7.780572891235352, "global_step": 42091, "epoch": 250} {"train_loss": -7.812685012817383, "global_step": 42092, "epoch": 250} {"train_loss": -7.422642707824707, "global_step": 42093, "epoch": 250} {"train_loss": -7.913228988647461, "global_step": 42094, "epoch": 250} {"train_loss": -7.776250839233398, "global_step": 42095, "epoch": 250} {"train_loss": -7.6555891036987305, "global_step": 42096, "epoch": 250} {"train_loss": -7.756330490112305, "global_step": 42097, "epoch": 250} {"train_loss": -7.859855651855469, "global_step": 42098, "epoch": 250} {"train_loss": -7.832145690917969, "global_step": 42099, "epoch": 250} {"train_loss": -7.952119827270508, "global_step": 42100, "epoch": 250} {"train_loss": -7.687426567077637, "global_step": 42101, "epoch": 250} {"train_loss": -7.941719055175781, "global_step": 42102, "epoch": 250} {"train_loss": -7.942859172821045, "global_step": 42103, "epoch": 250} {"train_loss": -8.05172348022461, "global_step": 42104, "epoch": 250} {"train_loss": -7.888505458831787, "global_step": 42105, "epoch": 250} {"train_loss": -8.078824996948242, "global_step": 42106, "epoch": 250} {"train_loss": -8.087987899780273, "global_step": 42107, "epoch": 250} {"train_loss": -7.973318099975586, "global_step": 42108, "epoch": 250} {"train_loss": -8.019449234008789, "global_step": 42109, "epoch": 250} {"train_loss": -8.192490577697754, "global_step": 42110, "epoch": 250} {"train_loss": -8.258247375488281, "global_step": 42111, "epoch": 250} {"train_loss": -7.884688377380371, "global_step": 42112, "epoch": 250} {"train_loss": -8.01933765411377, "global_step": 42113, "epoch": 250} {"train_loss": -8.272390365600586, "global_step": 42114, "epoch": 250} {"train_loss": -8.21123218536377, "global_step": 42115, "epoch": 250} {"train_loss": -8.196329116821289, "global_step": 42116, "epoch": 250} {"train_loss": -8.403461456298828, "global_step": 42117, "epoch": 250} {"train_loss": -8.10457706451416, "global_step": 42118, "epoch": 250} {"train_loss": -8.389047622680664, "global_step": 42119, "epoch": 250} {"train_loss": -8.228062629699707, "global_step": 42120, "epoch": 250} {"train_loss": -7.934670448303223, "global_step": 42121, "epoch": 250} {"train_loss": -8.175616264343262, "global_step": 42122, "epoch": 250} {"train_loss": -8.15416431427002, "global_step": 42123, "epoch": 250} {"train_loss": -8.301161766052246, "global_step": 42124, "epoch": 250} {"train_loss": -8.09520149230957, "global_step": 42125, "epoch": 250} {"train_loss": -8.131414413452148, "global_step": 42126, "epoch": 250} {"train_loss": -8.052326202392578, "global_step": 42127, "epoch": 250} {"train_loss": -7.963777542114258, "global_step": 42128, "epoch": 250} {"train_loss": -8.396659851074219, "global_step": 42129, "epoch": 250} {"train_loss": -8.04125690460205, "global_step": 42130, "epoch": 250} {"train_loss": -8.099908828735352, "global_step": 42131, "epoch": 250} {"train_loss": -7.561835289001465, "global_step": 42132, "epoch": 250} {"train_loss": -8.197571754455566, "global_step": 42133, "epoch": 250} {"train_loss": -7.58709192276001, "global_step": 42134, "epoch": 250} {"train_loss": -8.078959465026855, "global_step": 42135, "epoch": 250} {"train_loss": -7.910526275634766, "global_step": 42136, "epoch": 250} {"train_loss": -8.13140869140625, "global_step": 42137, "epoch": 250} {"train_loss": -7.715838432312012, "global_step": 42138, "epoch": 250} {"train_loss": -7.8528151512146, "global_step": 42139, "epoch": 250} {"train_loss": -7.985102653503418, "global_step": 42140, "epoch": 250} {"train_loss": -8.109964370727539, "global_step": 42141, "epoch": 250} {"train_loss": -7.725636005401611, "global_step": 42142, "epoch": 250} {"train_loss": -7.782251358032227, "global_step": 42143, "epoch": 250} {"train_loss": -7.939948081970215, "global_step": 42144, "epoch": 250} {"train_loss": -7.915582656860352, "global_step": 42145, "epoch": 250} {"train_loss": -8.061195373535156, "global_step": 42146, "epoch": 250} {"train_loss": -7.7427825927734375, "global_step": 42147, "epoch": 250} {"train_loss": -7.842977046966553, "global_step": 42148, "epoch": 250} {"train_loss": -7.75748348236084, "global_step": 42149, "epoch": 250} {"train_loss": -7.854503154754639, "global_step": 42150, "epoch": 250} {"train_loss": -8.054933547973633, "global_step": 42151, "epoch": 250} {"train_loss": -7.887044429779053, "global_step": 42152, "epoch": 250} {"train_loss": -8.058710098266602, "global_step": 42153, "epoch": 250} {"train_loss": -7.976025581359863, "global_step": 42154, "epoch": 250} {"train_loss": -8.092259407043457, "global_step": 42155, "epoch": 250} {"train_loss": -8.056316375732422, "global_step": 42156, "epoch": 250} {"train_loss": -7.778039455413818, "global_step": 42157, "epoch": 250} {"train_loss": -7.954410552978516, "global_step": 42158, "epoch": 250} {"train_loss": -7.90216588973999, "global_step": 42159, "epoch": 250} {"train_loss": -7.690672874450684, "global_step": 42160, "epoch": 250} {"train_loss": -8.094038009643555, "global_step": 42161, "epoch": 250} {"train_loss": -7.58000373840332, "global_step": 42162, "epoch": 250} {"train_loss": -8.068062782287598, "global_step": 42163, "epoch": 250} {"train_loss": -7.940622329711914, "global_step": 42164, "epoch": 250} {"train_loss": -7.9829840660095215, "global_step": 42165, "epoch": 250} {"train_loss": -7.906462669372559, "global_step": 42166, "epoch": 250} {"train_loss": -7.983416480677469, "global_step": 42167, "epoch": 250, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 0.9776028724813114, "train/sim_max_reward_2": 0.02296448517409193, "train/sim_max_reward_3": 0.7269137183985329, "train/sim_max_reward_4": 0.977014089938771, "train/sim_max_reward_5": 0.5448056790500082, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.34719767640830357, "test/sim_max_reward_4400002": 0.09305221582783174, "test/sim_max_reward_4400003": 0.6289019149394426, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 0.997877552978339, "test/sim_max_reward_4400006": 0.9988691282664363, "test/sim_max_reward_4400007": 0.9661414099806965, "test/sim_max_reward_4400008": 0.5990390770183126, "test/sim_max_reward_4400009": 0.5052438648907281, "test/sim_max_reward_4400010": 0.23079087970235812, "test/sim_max_reward_4400011": 0.2847211899237442, "test/sim_max_reward_4400012": 0.800621373452157, "test/sim_max_reward_4400013": 0.970439890209186, "test/sim_max_reward_4400014": 0.7807664239295631, "test/sim_max_reward_4400015": 0.4078932796822962, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.8753542199530222, "test/sim_max_reward_4400019": 0.16061051822202446, "test/sim_max_reward_4400020": 0.0013656102227512402, "test/sim_max_reward_4400021": 0.9653398725085701, "test/sim_max_reward_4400022": 0.9958927535777244, "test/sim_max_reward_4400023": 1.0, "test/sim_max_reward_4400024": 0.9910447496004603, "test/sim_max_reward_4400025": 0.6163211920123155, "test/sim_max_reward_4400026": 1.0, "test/sim_max_reward_4400027": 0.4880680123936909, "test/sim_max_reward_4400028": 0.7150704698440046, "test/sim_max_reward_4400029": 0.6205023702006853, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.99293221528843, "test/sim_max_reward_4400032": 0.057907996251265546, "test/sim_max_reward_4400033": 1.0, "test/sim_max_reward_4400034": 0.7250807465937574, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 1.0, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.637750972073781, "test/sim_max_reward_4400039": 0.973702717967276, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.2041005744336994, "test/sim_max_reward_4400042": 0.9326178204433713, "test/sim_max_reward_4400043": 0.9656657529629318, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.9550228480529007, "test/sim_max_reward_4400046": 0.9713862907241464, "test/sim_max_reward_4400047": 0.9797220946679658, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.7082168075071192, "test/mean_score": 0.6544268251915238, "val_loss": 185950.046875, "train_action_mse_error": 12.947421073913574} {"train_loss": -8.059913635253906, "global_step": 42168, "epoch": 251} {"train_loss": -8.225732803344727, "global_step": 42169, "epoch": 251} {"train_loss": -8.05838394165039, "global_step": 42170, "epoch": 251} {"train_loss": -8.05912971496582, "global_step": 42171, "epoch": 251} {"train_loss": -8.019804000854492, "global_step": 42172, "epoch": 251} {"train_loss": -8.304492950439453, "global_step": 42173, "epoch": 251} {"train_loss": -7.92091703414917, "global_step": 42174, "epoch": 251} {"train_loss": -8.233856201171875, "global_step": 42175, "epoch": 251} {"train_loss": -8.140165328979492, "global_step": 42176, "epoch": 251} {"train_loss": -8.151697158813477, "global_step": 42177, "epoch": 251} {"train_loss": -8.051279067993164, "global_step": 42178, "epoch": 251} {"train_loss": -7.961974143981934, "global_step": 42179, "epoch": 251} {"train_loss": -8.027185440063477, "global_step": 42180, "epoch": 251} {"train_loss": -8.188928604125977, "global_step": 42181, "epoch": 251} {"train_loss": -8.194150924682617, "global_step": 42182, "epoch": 251} {"train_loss": -7.868892192840576, "global_step": 42183, "epoch": 251} {"train_loss": -8.023361206054688, "global_step": 42184, "epoch": 251} {"train_loss": -8.085881233215332, "global_step": 42185, "epoch": 251} {"train_loss": -8.114921569824219, "global_step": 42186, "epoch": 251} {"train_loss": -8.065923690795898, "global_step": 42187, "epoch": 251} {"train_loss": -7.860577583312988, "global_step": 42188, "epoch": 251} {"train_loss": -8.017638206481934, "global_step": 42189, "epoch": 251} {"train_loss": -7.877833366394043, "global_step": 42190, "epoch": 251} {"train_loss": -8.070343017578125, "global_step": 42191, "epoch": 251} {"train_loss": -8.013014793395996, "global_step": 42192, "epoch": 251} {"train_loss": -8.221403121948242, "global_step": 42193, "epoch": 251} {"train_loss": -8.104910850524902, "global_step": 42194, "epoch": 251} {"train_loss": -8.11585807800293, "global_step": 42195, "epoch": 251} {"train_loss": -8.152339935302734, "global_step": 42196, "epoch": 251} {"train_loss": -7.863476276397705, "global_step": 42197, "epoch": 251} {"train_loss": -8.296024322509766, "global_step": 42198, "epoch": 251} {"train_loss": -8.236554145812988, "global_step": 42199, "epoch": 251} {"train_loss": -8.089273452758789, "global_step": 42200, "epoch": 251} {"train_loss": -8.051773071289062, "global_step": 42201, "epoch": 251} {"train_loss": -8.02448558807373, "global_step": 42202, "epoch": 251} {"train_loss": -7.857441425323486, "global_step": 42203, "epoch": 251} {"train_loss": -7.881897926330566, "global_step": 42204, "epoch": 251} {"train_loss": -7.77193021774292, "global_step": 42205, "epoch": 251} {"train_loss": -7.928860187530518, "global_step": 42206, "epoch": 251} {"train_loss": -8.086091995239258, "global_step": 42207, "epoch": 251} {"train_loss": -7.958381175994873, "global_step": 42208, "epoch": 251} {"train_loss": -8.01530647277832, "global_step": 42209, "epoch": 251} {"train_loss": -8.137422561645508, "global_step": 42210, "epoch": 251} {"train_loss": -8.035375595092773, "global_step": 42211, "epoch": 251} {"train_loss": -8.061945915222168, "global_step": 42212, "epoch": 251} {"train_loss": -7.817448616027832, "global_step": 42213, "epoch": 251} {"train_loss": -8.064075469970703, "global_step": 42214, "epoch": 251} {"train_loss": -8.121650695800781, "global_step": 42215, "epoch": 251} {"train_loss": -8.087970733642578, "global_step": 42216, "epoch": 251} {"train_loss": -8.139649391174316, "global_step": 42217, "epoch": 251} {"train_loss": -7.972892761230469, "global_step": 42218, "epoch": 251} {"train_loss": -8.115053176879883, "global_step": 42219, "epoch": 251} {"train_loss": -8.05827522277832, "global_step": 42220, "epoch": 251} {"train_loss": -7.908969879150391, "global_step": 42221, "epoch": 251} {"train_loss": -8.255821228027344, "global_step": 42222, "epoch": 251} {"train_loss": -8.163850784301758, "global_step": 42223, "epoch": 251} {"train_loss": -8.063997268676758, "global_step": 42224, "epoch": 251} {"train_loss": -8.16547966003418, "global_step": 42225, "epoch": 251} {"train_loss": -7.878984451293945, "global_step": 42226, "epoch": 251} {"train_loss": -8.244020462036133, "global_step": 42227, "epoch": 251} {"train_loss": -7.965821266174316, "global_step": 42228, "epoch": 251} {"train_loss": -8.069792747497559, "global_step": 42229, "epoch": 251} {"train_loss": -7.80915641784668, "global_step": 42230, "epoch": 251} {"train_loss": -7.959416389465332, "global_step": 42231, "epoch": 251} {"train_loss": -7.794329643249512, "global_step": 42232, "epoch": 251} {"train_loss": -8.096757888793945, "global_step": 42233, "epoch": 251} {"train_loss": -8.109273910522461, "global_step": 42234, "epoch": 251} {"train_loss": -8.117712020874023, "global_step": 42235, "epoch": 251} {"train_loss": -8.07691478729248, "global_step": 42236, "epoch": 251} {"train_loss": -7.881565093994141, "global_step": 42237, "epoch": 251} {"train_loss": -7.835918426513672, "global_step": 42238, "epoch": 251} {"train_loss": -8.086603164672852, "global_step": 42239, "epoch": 251} {"train_loss": -7.841960430145264, "global_step": 42240, "epoch": 251} {"train_loss": -8.103716850280762, "global_step": 42241, "epoch": 251} {"train_loss": -8.166101455688477, "global_step": 42242, "epoch": 251} {"train_loss": -7.946057319641113, "global_step": 42243, "epoch": 251} {"train_loss": -7.847722053527832, "global_step": 42244, "epoch": 251} {"train_loss": -7.992043972015381, "global_step": 42245, "epoch": 251} {"train_loss": -8.150408744812012, "global_step": 42246, "epoch": 251} {"train_loss": -8.384247779846191, "global_step": 42247, "epoch": 251} {"train_loss": -8.078969955444336, "global_step": 42248, "epoch": 251} {"train_loss": -8.001205444335938, "global_step": 42249, "epoch": 251} {"train_loss": -7.917620658874512, "global_step": 42250, "epoch": 251} {"train_loss": -7.983672618865967, "global_step": 42251, "epoch": 251} {"train_loss": -7.775132179260254, "global_step": 42252, "epoch": 251} {"train_loss": -8.040348052978516, "global_step": 42253, "epoch": 251} {"train_loss": -8.085151672363281, "global_step": 42254, "epoch": 251} {"train_loss": -8.05773639678955, "global_step": 42255, "epoch": 251} {"train_loss": -7.9992265701293945, "global_step": 42256, "epoch": 251} {"train_loss": -7.975496292114258, "global_step": 42257, "epoch": 251} {"train_loss": -8.216972351074219, "global_step": 42258, "epoch": 251} {"train_loss": -8.027742385864258, "global_step": 42259, "epoch": 251} {"train_loss": -8.313751220703125, "global_step": 42260, "epoch": 251} {"train_loss": -8.205013275146484, "global_step": 42261, "epoch": 251} {"train_loss": -8.159625053405762, "global_step": 42262, "epoch": 251} {"train_loss": -8.049676895141602, "global_step": 42263, "epoch": 251} {"train_loss": -8.045166015625, "global_step": 42264, "epoch": 251} {"train_loss": -8.110816955566406, "global_step": 42265, "epoch": 251} {"train_loss": -7.985992908477783, "global_step": 42266, "epoch": 251} {"train_loss": -8.231520652770996, "global_step": 42267, "epoch": 251} {"train_loss": -8.178296089172363, "global_step": 42268, "epoch": 251} {"train_loss": -7.793635368347168, "global_step": 42269, "epoch": 251} {"train_loss": -7.843687057495117, "global_step": 42270, "epoch": 251} {"train_loss": -8.229217529296875, "global_step": 42271, "epoch": 251} {"train_loss": -7.770840167999268, "global_step": 42272, "epoch": 251} {"train_loss": -7.906963348388672, "global_step": 42273, "epoch": 251} {"train_loss": -8.052871704101562, "global_step": 42274, "epoch": 251} {"train_loss": -7.9373250007629395, "global_step": 42275, "epoch": 251} {"train_loss": -7.9433913230896, "global_step": 42276, "epoch": 251} {"train_loss": -7.885791778564453, "global_step": 42277, "epoch": 251} {"train_loss": -8.12790298461914, "global_step": 42278, "epoch": 251} {"train_loss": -7.941799640655518, "global_step": 42279, "epoch": 251} {"train_loss": -7.7584004402160645, "global_step": 42280, "epoch": 251} {"train_loss": -8.025262832641602, "global_step": 42281, "epoch": 251} {"train_loss": -7.792101860046387, "global_step": 42282, "epoch": 251} {"train_loss": -7.942859649658203, "global_step": 42283, "epoch": 251} {"train_loss": -7.831084728240967, "global_step": 42284, "epoch": 251} {"train_loss": -8.04444408416748, "global_step": 42285, "epoch": 251} {"train_loss": -7.796448707580566, "global_step": 42286, "epoch": 251} {"train_loss": -7.73701286315918, "global_step": 42287, "epoch": 251} {"train_loss": -7.826558589935303, "global_step": 42288, "epoch": 251} {"train_loss": -8.154623031616211, "global_step": 42289, "epoch": 251} {"train_loss": -7.981943130493164, "global_step": 42290, "epoch": 251} {"train_loss": -8.110684394836426, "global_step": 42291, "epoch": 251} {"train_loss": -7.866312026977539, "global_step": 42292, "epoch": 251} {"train_loss": -8.07570743560791, "global_step": 42293, "epoch": 251} {"train_loss": -7.842655658721924, "global_step": 42294, "epoch": 251} {"train_loss": -8.026325225830078, "global_step": 42295, "epoch": 251} {"train_loss": -7.801889419555664, "global_step": 42296, "epoch": 251} {"train_loss": -7.8692121505737305, "global_step": 42297, "epoch": 251} {"train_loss": -7.925712585449219, "global_step": 42298, "epoch": 251} {"train_loss": -7.9993085861206055, "global_step": 42299, "epoch": 251} {"train_loss": -8.181143760681152, "global_step": 42300, "epoch": 251} {"train_loss": -7.927506446838379, "global_step": 42301, "epoch": 251} {"train_loss": -7.857021331787109, "global_step": 42302, "epoch": 251} {"train_loss": -7.926548004150391, "global_step": 42303, "epoch": 251} {"train_loss": -7.981173515319824, "global_step": 42304, "epoch": 251} {"train_loss": -7.980549335479736, "global_step": 42305, "epoch": 251} {"train_loss": -8.041471481323242, "global_step": 42306, "epoch": 251} {"train_loss": -8.198649406433105, "global_step": 42307, "epoch": 251} {"train_loss": -8.120161056518555, "global_step": 42308, "epoch": 251} {"train_loss": -7.923455238342285, "global_step": 42309, "epoch": 251} {"train_loss": -8.070656776428223, "global_step": 42310, "epoch": 251} {"train_loss": -8.232019424438477, "global_step": 42311, "epoch": 251} {"train_loss": -8.003868103027344, "global_step": 42312, "epoch": 251} {"train_loss": -8.07702922821045, "global_step": 42313, "epoch": 251} {"train_loss": -8.138343811035156, "global_step": 42314, "epoch": 251} {"train_loss": -7.950270652770996, "global_step": 42315, "epoch": 251} {"train_loss": -7.946307182312012, "global_step": 42316, "epoch": 251} {"train_loss": -7.879577159881592, "global_step": 42317, "epoch": 251} {"train_loss": -8.185604095458984, "global_step": 42318, "epoch": 251} {"train_loss": -8.025917053222656, "global_step": 42319, "epoch": 251} {"train_loss": -7.939242362976074, "global_step": 42320, "epoch": 251} {"train_loss": -8.004037857055664, "global_step": 42321, "epoch": 251} {"train_loss": -8.05747127532959, "global_step": 42322, "epoch": 251} {"train_loss": -8.18661117553711, "global_step": 42323, "epoch": 251} {"train_loss": -8.22314167022705, "global_step": 42324, "epoch": 251} {"train_loss": -8.352399826049805, "global_step": 42325, "epoch": 251} {"train_loss": -8.097650527954102, "global_step": 42326, "epoch": 251} {"train_loss": -8.159574508666992, "global_step": 42327, "epoch": 251} {"train_loss": -8.196075439453125, "global_step": 42328, "epoch": 251} {"train_loss": -8.075648307800293, "global_step": 42329, "epoch": 251} {"train_loss": -8.219319343566895, "global_step": 42330, "epoch": 251} {"train_loss": -8.056138038635254, "global_step": 42331, "epoch": 251} {"train_loss": -7.957439422607422, "global_step": 42332, "epoch": 251} {"train_loss": -7.972646236419678, "global_step": 42333, "epoch": 251} {"train_loss": -7.895196914672852, "global_step": 42334, "epoch": 251} {"train_loss": -8.030448924927484, "global_step": 42335, "epoch": 251, "val_loss": 187005.234375} {"train_loss": -8.217954635620117, "global_step": 42336, "epoch": 252} {"train_loss": -7.728133201599121, "global_step": 42337, "epoch": 252} {"train_loss": -7.897640705108643, "global_step": 42338, "epoch": 252} {"train_loss": -7.965755462646484, "global_step": 42339, "epoch": 252} {"train_loss": -8.273160934448242, "global_step": 42340, "epoch": 252} {"train_loss": -7.899251937866211, "global_step": 42341, "epoch": 252} {"train_loss": -7.943086624145508, "global_step": 42342, "epoch": 252} {"train_loss": -7.899674415588379, "global_step": 42343, "epoch": 252} {"train_loss": -7.9595513343811035, "global_step": 42344, "epoch": 252} {"train_loss": -7.930881977081299, "global_step": 42345, "epoch": 252} {"train_loss": -7.8234453201293945, "global_step": 42346, "epoch": 252} {"train_loss": -8.021939277648926, "global_step": 42347, "epoch": 252} {"train_loss": -8.092401504516602, "global_step": 42348, "epoch": 252} {"train_loss": -7.862771987915039, "global_step": 42349, "epoch": 252} {"train_loss": -7.790657043457031, "global_step": 42350, "epoch": 252} {"train_loss": -7.741400241851807, "global_step": 42351, "epoch": 252} {"train_loss": -8.264961242675781, "global_step": 42352, "epoch": 252} {"train_loss": -7.951335906982422, "global_step": 42353, "epoch": 252} {"train_loss": -8.087530136108398, "global_step": 42354, "epoch": 252} {"train_loss": -7.771340370178223, "global_step": 42355, "epoch": 252} {"train_loss": -8.078896522521973, "global_step": 42356, "epoch": 252} {"train_loss": -7.890547752380371, "global_step": 42357, "epoch": 252} {"train_loss": -7.849081039428711, "global_step": 42358, "epoch": 252} {"train_loss": -8.004450798034668, "global_step": 42359, "epoch": 252} {"train_loss": -8.021032333374023, "global_step": 42360, "epoch": 252} {"train_loss": -7.893533706665039, "global_step": 42361, "epoch": 252} {"train_loss": -7.965278625488281, "global_step": 42362, "epoch": 252} {"train_loss": -7.9991455078125, "global_step": 42363, "epoch": 252} {"train_loss": -8.023577690124512, "global_step": 42364, "epoch": 252} {"train_loss": -7.871020317077637, "global_step": 42365, "epoch": 252} {"train_loss": -8.108552932739258, "global_step": 42366, "epoch": 252} {"train_loss": -7.8161773681640625, "global_step": 42367, "epoch": 252} {"train_loss": -8.28542709350586, "global_step": 42368, "epoch": 252} {"train_loss": -8.299745559692383, "global_step": 42369, "epoch": 252} {"train_loss": -8.143863677978516, "global_step": 42370, "epoch": 252} {"train_loss": -8.078645706176758, "global_step": 42371, "epoch": 252} {"train_loss": -7.959506988525391, "global_step": 42372, "epoch": 252} {"train_loss": -7.983564376831055, "global_step": 42373, "epoch": 252} {"train_loss": -8.098581314086914, "global_step": 42374, "epoch": 252} {"train_loss": -8.181567192077637, "global_step": 42375, "epoch": 252} {"train_loss": -7.973630428314209, "global_step": 42376, "epoch": 252} {"train_loss": -8.131473541259766, "global_step": 42377, "epoch": 252} {"train_loss": -7.8734283447265625, "global_step": 42378, "epoch": 252} {"train_loss": -8.210704803466797, "global_step": 42379, "epoch": 252} {"train_loss": -8.048439025878906, "global_step": 42380, "epoch": 252} {"train_loss": -8.083526611328125, "global_step": 42381, "epoch": 252} {"train_loss": -7.96798038482666, "global_step": 42382, "epoch": 252} {"train_loss": -7.841609954833984, "global_step": 42383, "epoch": 252} {"train_loss": -8.415494918823242, "global_step": 42384, "epoch": 252} {"train_loss": -8.340753555297852, "global_step": 42385, "epoch": 252} {"train_loss": -8.058045387268066, "global_step": 42386, "epoch": 252} {"train_loss": -8.164701461791992, "global_step": 42387, "epoch": 252} {"train_loss": -8.09119987487793, "global_step": 42388, "epoch": 252} {"train_loss": -8.18366527557373, "global_step": 42389, "epoch": 252} {"train_loss": -8.347142219543457, "global_step": 42390, "epoch": 252} {"train_loss": -8.173471450805664, "global_step": 42391, "epoch": 252} {"train_loss": -7.931753158569336, "global_step": 42392, "epoch": 252} {"train_loss": -7.789332866668701, "global_step": 42393, "epoch": 252} {"train_loss": -8.194963455200195, "global_step": 42394, "epoch": 252} {"train_loss": -7.903353214263916, "global_step": 42395, "epoch": 252} {"train_loss": -8.037961959838867, "global_step": 42396, "epoch": 252} {"train_loss": -7.905117511749268, "global_step": 42397, "epoch": 252} {"train_loss": -7.848534107208252, "global_step": 42398, "epoch": 252} {"train_loss": -7.844564437866211, "global_step": 42399, "epoch": 252} {"train_loss": -8.150535583496094, "global_step": 42400, "epoch": 252} {"train_loss": -7.809171676635742, "global_step": 42401, "epoch": 252} {"train_loss": -7.748856544494629, "global_step": 42402, "epoch": 252} {"train_loss": -7.577066421508789, "global_step": 42403, "epoch": 252} {"train_loss": -7.8645405769348145, "global_step": 42404, "epoch": 252} {"train_loss": -7.806200981140137, "global_step": 42405, "epoch": 252} {"train_loss": -7.744890213012695, "global_step": 42406, "epoch": 252} {"train_loss": -8.03497314453125, "global_step": 42407, "epoch": 252} {"train_loss": -7.782958507537842, "global_step": 42408, "epoch": 252} {"train_loss": -7.873579978942871, "global_step": 42409, "epoch": 252} {"train_loss": -7.9154558181762695, "global_step": 42410, "epoch": 252} {"train_loss": -7.612903594970703, "global_step": 42411, "epoch": 252} {"train_loss": -8.06249713897705, "global_step": 42412, "epoch": 252} {"train_loss": -8.11472225189209, "global_step": 42413, "epoch": 252} {"train_loss": -8.080677032470703, "global_step": 42414, "epoch": 252} {"train_loss": -8.28818130493164, "global_step": 42415, "epoch": 252} {"train_loss": -8.041650772094727, "global_step": 42416, "epoch": 252} {"train_loss": -8.0111083984375, "global_step": 42417, "epoch": 252} {"train_loss": -8.17678451538086, "global_step": 42418, "epoch": 252} {"train_loss": -8.047558784484863, "global_step": 42419, "epoch": 252} {"train_loss": -8.044069290161133, "global_step": 42420, "epoch": 252} {"train_loss": -8.087355613708496, "global_step": 42421, "epoch": 252} {"train_loss": -8.027627944946289, "global_step": 42422, "epoch": 252} {"train_loss": -8.148179054260254, "global_step": 42423, "epoch": 252} {"train_loss": -7.999735355377197, "global_step": 42424, "epoch": 252} {"train_loss": -8.027216911315918, "global_step": 42425, "epoch": 252} {"train_loss": -8.049446105957031, "global_step": 42426, "epoch": 252} {"train_loss": -8.194783210754395, "global_step": 42427, "epoch": 252} {"train_loss": -7.999022006988525, "global_step": 42428, "epoch": 252} {"train_loss": -8.029973983764648, "global_step": 42429, "epoch": 252} {"train_loss": -8.08132553100586, "global_step": 42430, "epoch": 252} {"train_loss": -8.11337661743164, "global_step": 42431, "epoch": 252} {"train_loss": -8.13669490814209, "global_step": 42432, "epoch": 252} {"train_loss": -8.372098922729492, "global_step": 42433, "epoch": 252} {"train_loss": -8.274044036865234, "global_step": 42434, "epoch": 252} {"train_loss": -8.12812614440918, "global_step": 42435, "epoch": 252} {"train_loss": -8.00346565246582, "global_step": 42436, "epoch": 252} {"train_loss": -8.328866958618164, "global_step": 42437, "epoch": 252} {"train_loss": -7.976376533508301, "global_step": 42438, "epoch": 252} {"train_loss": -8.141338348388672, "global_step": 42439, "epoch": 252} {"train_loss": -7.884278297424316, "global_step": 42440, "epoch": 252} {"train_loss": -8.00816535949707, "global_step": 42441, "epoch": 252} {"train_loss": -8.067611694335938, "global_step": 42442, "epoch": 252} {"train_loss": -7.858635902404785, "global_step": 42443, "epoch": 252} {"train_loss": -7.919516563415527, "global_step": 42444, "epoch": 252} {"train_loss": -7.957931041717529, "global_step": 42445, "epoch": 252} {"train_loss": -7.899382591247559, "global_step": 42446, "epoch": 252} {"train_loss": -7.603806018829346, "global_step": 42447, "epoch": 252} {"train_loss": -8.058708190917969, "global_step": 42448, "epoch": 252} {"train_loss": -7.380039215087891, "global_step": 42449, "epoch": 252} {"train_loss": -7.991364002227783, "global_step": 42450, "epoch": 252} {"train_loss": -7.785643577575684, "global_step": 42451, "epoch": 252} {"train_loss": -7.784956455230713, "global_step": 42452, "epoch": 252} {"train_loss": -7.7423930168151855, "global_step": 42453, "epoch": 252} {"train_loss": -7.673382759094238, "global_step": 42454, "epoch": 252} {"train_loss": -8.143604278564453, "global_step": 42455, "epoch": 252} {"train_loss": -7.680163383483887, "global_step": 42456, "epoch": 252} {"train_loss": -7.921041488647461, "global_step": 42457, "epoch": 252} {"train_loss": -7.610761642456055, "global_step": 42458, "epoch": 252} {"train_loss": -7.7172956466674805, "global_step": 42459, "epoch": 252} {"train_loss": -7.959836959838867, "global_step": 42460, "epoch": 252} {"train_loss": -8.001672744750977, "global_step": 42461, "epoch": 252} {"train_loss": -8.145530700683594, "global_step": 42462, "epoch": 252} {"train_loss": -8.04995346069336, "global_step": 42463, "epoch": 252} {"train_loss": -7.93898344039917, "global_step": 42464, "epoch": 252} {"train_loss": -8.051050186157227, "global_step": 42465, "epoch": 252} {"train_loss": -7.93288516998291, "global_step": 42466, "epoch": 252} {"train_loss": -7.833306312561035, "global_step": 42467, "epoch": 252} {"train_loss": -8.027521133422852, "global_step": 42468, "epoch": 252} {"train_loss": -7.902958869934082, "global_step": 42469, "epoch": 252} {"train_loss": -7.667984962463379, "global_step": 42470, "epoch": 252} {"train_loss": -8.115568161010742, "global_step": 42471, "epoch": 252} {"train_loss": -7.913271903991699, "global_step": 42472, "epoch": 252} {"train_loss": -8.12490463256836, "global_step": 42473, "epoch": 252} {"train_loss": -8.116825103759766, "global_step": 42474, "epoch": 252} {"train_loss": -8.087321281433105, "global_step": 42475, "epoch": 252} {"train_loss": -8.045918464660645, "global_step": 42476, "epoch": 252} {"train_loss": -8.209507942199707, "global_step": 42477, "epoch": 252} {"train_loss": -8.232488632202148, "global_step": 42478, "epoch": 252} {"train_loss": -8.132923126220703, "global_step": 42479, "epoch": 252} {"train_loss": -8.01569938659668, "global_step": 42480, "epoch": 252} {"train_loss": -8.057844161987305, "global_step": 42481, "epoch": 252} {"train_loss": -8.076064109802246, "global_step": 42482, "epoch": 252} {"train_loss": -8.092279434204102, "global_step": 42483, "epoch": 252} {"train_loss": -8.031585693359375, "global_step": 42484, "epoch": 252} {"train_loss": -8.226181030273438, "global_step": 42485, "epoch": 252} {"train_loss": -7.875154495239258, "global_step": 42486, "epoch": 252} {"train_loss": -8.021202087402344, "global_step": 42487, "epoch": 252} {"train_loss": -7.98042631149292, "global_step": 42488, "epoch": 252} {"train_loss": -7.919379234313965, "global_step": 42489, "epoch": 252} {"train_loss": -7.927881240844727, "global_step": 42490, "epoch": 252} {"train_loss": -7.781277656555176, "global_step": 42491, "epoch": 252} {"train_loss": -7.937438488006592, "global_step": 42492, "epoch": 252} {"train_loss": -7.84942626953125, "global_step": 42493, "epoch": 252} {"train_loss": -7.846240997314453, "global_step": 42494, "epoch": 252} {"train_loss": -8.076078414916992, "global_step": 42495, "epoch": 252} {"train_loss": -7.829135894775391, "global_step": 42496, "epoch": 252} {"train_loss": -7.81696081161499, "global_step": 42497, "epoch": 252} {"train_loss": -8.05622673034668, "global_step": 42498, "epoch": 252} {"train_loss": -7.8696088790893555, "global_step": 42499, "epoch": 252} {"train_loss": -7.612245082855225, "global_step": 42500, "epoch": 252} {"train_loss": -7.8629841804504395, "global_step": 42501, "epoch": 252} {"train_loss": -7.631019592285156, "global_step": 42502, "epoch": 252} {"train_loss": -7.983580050014314, "global_step": 42503, "epoch": 252, "val_loss": 185296.90625} {"train_loss": -7.844018459320068, "global_step": 42504, "epoch": 253} {"train_loss": -7.953686237335205, "global_step": 42505, "epoch": 253} {"train_loss": -8.09576416015625, "global_step": 42506, "epoch": 253} {"train_loss": -7.793488502502441, "global_step": 42507, "epoch": 253} {"train_loss": -7.909765243530273, "global_step": 42508, "epoch": 253} {"train_loss": -7.8168182373046875, "global_step": 42509, "epoch": 253} {"train_loss": -7.906991958618164, "global_step": 42510, "epoch": 253} {"train_loss": -7.904444694519043, "global_step": 42511, "epoch": 253} {"train_loss": -7.980615615844727, "global_step": 42512, "epoch": 253} {"train_loss": -8.19870376586914, "global_step": 42513, "epoch": 253} {"train_loss": -8.020904541015625, "global_step": 42514, "epoch": 253} {"train_loss": -8.0491304397583, "global_step": 42515, "epoch": 253} {"train_loss": -8.050413131713867, "global_step": 42516, "epoch": 253} {"train_loss": -8.024646759033203, "global_step": 42517, "epoch": 253} {"train_loss": -8.00987434387207, "global_step": 42518, "epoch": 253} {"train_loss": -8.176164627075195, "global_step": 42519, "epoch": 253} {"train_loss": -8.075971603393555, "global_step": 42520, "epoch": 253} {"train_loss": -8.0970458984375, "global_step": 42521, "epoch": 253} {"train_loss": -8.054424285888672, "global_step": 42522, "epoch": 253} {"train_loss": -8.080345153808594, "global_step": 42523, "epoch": 253} {"train_loss": -7.814030170440674, "global_step": 42524, "epoch": 253} {"train_loss": -8.360173225402832, "global_step": 42525, "epoch": 253} {"train_loss": -7.965792655944824, "global_step": 42526, "epoch": 253} {"train_loss": -8.240401268005371, "global_step": 42527, "epoch": 253} {"train_loss": -7.965173721313477, "global_step": 42528, "epoch": 253} {"train_loss": -7.956698417663574, "global_step": 42529, "epoch": 253} {"train_loss": -8.008773803710938, "global_step": 42530, "epoch": 253} {"train_loss": -7.979303359985352, "global_step": 42531, "epoch": 253} {"train_loss": -8.126608848571777, "global_step": 42532, "epoch": 253} {"train_loss": -8.014851570129395, "global_step": 42533, "epoch": 253} {"train_loss": -8.193822860717773, "global_step": 42534, "epoch": 253} {"train_loss": -7.921483516693115, "global_step": 42535, "epoch": 253} {"train_loss": -8.329742431640625, "global_step": 42536, "epoch": 253} {"train_loss": -7.997224807739258, "global_step": 42537, "epoch": 253} {"train_loss": -7.997913360595703, "global_step": 42538, "epoch": 253} {"train_loss": -7.942400932312012, "global_step": 42539, "epoch": 253} {"train_loss": -7.882165431976318, "global_step": 42540, "epoch": 253} {"train_loss": -8.08608341217041, "global_step": 42541, "epoch": 253} {"train_loss": -8.014102935791016, "global_step": 42542, "epoch": 253} {"train_loss": -8.000253677368164, "global_step": 42543, "epoch": 253} {"train_loss": -7.816252708435059, "global_step": 42544, "epoch": 253} {"train_loss": -7.980598449707031, "global_step": 42545, "epoch": 253} {"train_loss": -7.789813041687012, "global_step": 42546, "epoch": 253} {"train_loss": -7.8583855628967285, "global_step": 42547, "epoch": 253} {"train_loss": -7.682403564453125, "global_step": 42548, "epoch": 253} {"train_loss": -7.227258682250977, "global_step": 42549, "epoch": 253} {"train_loss": -7.733865261077881, "global_step": 42550, "epoch": 253} {"train_loss": -7.6464667320251465, "global_step": 42551, "epoch": 253} {"train_loss": -7.729127883911133, "global_step": 42552, "epoch": 253} {"train_loss": -8.036309242248535, "global_step": 42553, "epoch": 253} {"train_loss": -7.652679443359375, "global_step": 42554, "epoch": 253} {"train_loss": -8.073369026184082, "global_step": 42555, "epoch": 253} {"train_loss": -7.83436393737793, "global_step": 42556, "epoch": 253} {"train_loss": -7.651962757110596, "global_step": 42557, "epoch": 253} {"train_loss": -7.756290435791016, "global_step": 42558, "epoch": 253} {"train_loss": -7.727741241455078, "global_step": 42559, "epoch": 253} {"train_loss": -7.896862030029297, "global_step": 42560, "epoch": 253} {"train_loss": -8.084178924560547, "global_step": 42561, "epoch": 253} {"train_loss": -7.9337992668151855, "global_step": 42562, "epoch": 253} {"train_loss": -8.113421440124512, "global_step": 42563, "epoch": 253} {"train_loss": -8.099935531616211, "global_step": 42564, "epoch": 253} {"train_loss": -8.092262268066406, "global_step": 42565, "epoch": 253} {"train_loss": -8.11225700378418, "global_step": 42566, "epoch": 253} {"train_loss": -8.064302444458008, "global_step": 42567, "epoch": 253} {"train_loss": -8.219276428222656, "global_step": 42568, "epoch": 253} {"train_loss": -8.133333206176758, "global_step": 42569, "epoch": 253} {"train_loss": -8.005019187927246, "global_step": 42570, "epoch": 253} {"train_loss": -8.108932495117188, "global_step": 42571, "epoch": 253} {"train_loss": -8.020415306091309, "global_step": 42572, "epoch": 253} {"train_loss": -8.086586952209473, "global_step": 42573, "epoch": 253} {"train_loss": -7.903501510620117, "global_step": 42574, "epoch": 253} {"train_loss": -8.14635181427002, "global_step": 42575, "epoch": 253} {"train_loss": -8.259787559509277, "global_step": 42576, "epoch": 253} {"train_loss": -7.919797897338867, "global_step": 42577, "epoch": 253} {"train_loss": -8.160021781921387, "global_step": 42578, "epoch": 253} {"train_loss": -8.109862327575684, "global_step": 42579, "epoch": 253} {"train_loss": -8.065473556518555, "global_step": 42580, "epoch": 253} {"train_loss": -7.977969169616699, "global_step": 42581, "epoch": 253} {"train_loss": -8.177698135375977, "global_step": 42582, "epoch": 253} {"train_loss": -8.041672706604004, "global_step": 42583, "epoch": 253} {"train_loss": -8.150264739990234, "global_step": 42584, "epoch": 253} {"train_loss": -8.079137802124023, "global_step": 42585, "epoch": 253} {"train_loss": -8.125123977661133, "global_step": 42586, "epoch": 253} {"train_loss": -7.79092264175415, "global_step": 42587, "epoch": 253} {"train_loss": -7.841897487640381, "global_step": 42588, "epoch": 253} {"train_loss": -7.769051551818848, "global_step": 42589, "epoch": 253} {"train_loss": -7.912593841552734, "global_step": 42590, "epoch": 253} {"train_loss": -7.797555923461914, "global_step": 42591, "epoch": 253} {"train_loss": -8.112308502197266, "global_step": 42592, "epoch": 253} {"train_loss": -7.714910507202148, "global_step": 42593, "epoch": 253} {"train_loss": -7.943295478820801, "global_step": 42594, "epoch": 253} {"train_loss": -7.8719611167907715, "global_step": 42595, "epoch": 253} {"train_loss": -8.035957336425781, "global_step": 42596, "epoch": 253} {"train_loss": -7.8340325355529785, "global_step": 42597, "epoch": 253} {"train_loss": -7.707065582275391, "global_step": 42598, "epoch": 253} {"train_loss": -7.936962127685547, "global_step": 42599, "epoch": 253} {"train_loss": -8.02573013305664, "global_step": 42600, "epoch": 253} {"train_loss": -7.978630065917969, "global_step": 42601, "epoch": 253} {"train_loss": -7.886127948760986, "global_step": 42602, "epoch": 253} {"train_loss": -7.939062118530273, "global_step": 42603, "epoch": 253} {"train_loss": -7.756231307983398, "global_step": 42604, "epoch": 253} {"train_loss": -8.00728988647461, "global_step": 42605, "epoch": 253} {"train_loss": -7.810842037200928, "global_step": 42606, "epoch": 253} {"train_loss": -8.072774887084961, "global_step": 42607, "epoch": 253} {"train_loss": -7.9664459228515625, "global_step": 42608, "epoch": 253} {"train_loss": -7.862110137939453, "global_step": 42609, "epoch": 253} {"train_loss": -8.080835342407227, "global_step": 42610, "epoch": 253} {"train_loss": -7.996288776397705, "global_step": 42611, "epoch": 253} {"train_loss": -8.042510032653809, "global_step": 42612, "epoch": 253} {"train_loss": -8.162449836730957, "global_step": 42613, "epoch": 253} {"train_loss": -8.139302253723145, "global_step": 42614, "epoch": 253} {"train_loss": -7.925654411315918, "global_step": 42615, "epoch": 253} {"train_loss": -8.033601760864258, "global_step": 42616, "epoch": 253} {"train_loss": -7.764491081237793, "global_step": 42617, "epoch": 253} {"train_loss": -7.964474678039551, "global_step": 42618, "epoch": 253} {"train_loss": -7.650341033935547, "global_step": 42619, "epoch": 253} {"train_loss": -8.096750259399414, "global_step": 42620, "epoch": 253} {"train_loss": -7.831899642944336, "global_step": 42621, "epoch": 253} {"train_loss": -7.761457443237305, "global_step": 42622, "epoch": 253} {"train_loss": -7.73642110824585, "global_step": 42623, "epoch": 253} {"train_loss": -8.101394653320312, "global_step": 42624, "epoch": 253} {"train_loss": -7.660266876220703, "global_step": 42625, "epoch": 253} {"train_loss": -7.844977378845215, "global_step": 42626, "epoch": 253} {"train_loss": -7.812668800354004, "global_step": 42627, "epoch": 253} {"train_loss": -7.820431232452393, "global_step": 42628, "epoch": 253} {"train_loss": -7.866442680358887, "global_step": 42629, "epoch": 253} {"train_loss": -7.98915958404541, "global_step": 42630, "epoch": 253} {"train_loss": -7.8907694816589355, "global_step": 42631, "epoch": 253} {"train_loss": -7.915871620178223, "global_step": 42632, "epoch": 253} {"train_loss": -7.900803565979004, "global_step": 42633, "epoch": 253} {"train_loss": -7.789538383483887, "global_step": 42634, "epoch": 253} {"train_loss": -8.00534439086914, "global_step": 42635, "epoch": 253} {"train_loss": -8.060632705688477, "global_step": 42636, "epoch": 253} {"train_loss": -7.909028053283691, "global_step": 42637, "epoch": 253} {"train_loss": -7.9166412353515625, "global_step": 42638, "epoch": 253} {"train_loss": -7.793207168579102, "global_step": 42639, "epoch": 253} {"train_loss": -8.007652282714844, "global_step": 42640, "epoch": 253} {"train_loss": -7.999759197235107, "global_step": 42641, "epoch": 253} {"train_loss": -8.21249008178711, "global_step": 42642, "epoch": 253} {"train_loss": -7.963428497314453, "global_step": 42643, "epoch": 253} {"train_loss": -8.158439636230469, "global_step": 42644, "epoch": 253} {"train_loss": -8.241655349731445, "global_step": 42645, "epoch": 253} {"train_loss": -8.275827407836914, "global_step": 42646, "epoch": 253} {"train_loss": -8.144166946411133, "global_step": 42647, "epoch": 253} {"train_loss": -8.436279296875, "global_step": 42648, "epoch": 253} {"train_loss": -8.169107437133789, "global_step": 42649, "epoch": 253} {"train_loss": -8.245813369750977, "global_step": 42650, "epoch": 253} {"train_loss": -8.255528450012207, "global_step": 42651, "epoch": 253} {"train_loss": -8.208797454833984, "global_step": 42652, "epoch": 253} {"train_loss": -8.167749404907227, "global_step": 42653, "epoch": 253} {"train_loss": -8.207425117492676, "global_step": 42654, "epoch": 253} {"train_loss": -8.236961364746094, "global_step": 42655, "epoch": 253} {"train_loss": -8.262319564819336, "global_step": 42656, "epoch": 253} {"train_loss": -8.207792282104492, "global_step": 42657, "epoch": 253} {"train_loss": -8.268455505371094, "global_step": 42658, "epoch": 253} {"train_loss": -8.153980255126953, "global_step": 42659, "epoch": 253} {"train_loss": -8.075300216674805, "global_step": 42660, "epoch": 253} {"train_loss": -8.035391807556152, "global_step": 42661, "epoch": 253} {"train_loss": -8.080865859985352, "global_step": 42662, "epoch": 253} {"train_loss": -7.975392818450928, "global_step": 42663, "epoch": 253} {"train_loss": -7.94969367980957, "global_step": 42664, "epoch": 253} {"train_loss": -7.963115692138672, "global_step": 42665, "epoch": 253} {"train_loss": -8.15019416809082, "global_step": 42666, "epoch": 253} {"train_loss": -8.18247127532959, "global_step": 42667, "epoch": 253} {"train_loss": -8.05311393737793, "global_step": 42668, "epoch": 253} {"train_loss": -8.111810684204102, "global_step": 42669, "epoch": 253} {"train_loss": -7.784990310668945, "global_step": 42670, "epoch": 253} {"train_loss": -7.9896331911995295, "global_step": 42671, "epoch": 253, "val_loss": 186486.703125} {"train_loss": -7.782743453979492, "global_step": 42672, "epoch": 254} {"train_loss": -7.98845911026001, "global_step": 42673, "epoch": 254} {"train_loss": -8.121395111083984, "global_step": 42674, "epoch": 254} {"train_loss": -7.999646186828613, "global_step": 42675, "epoch": 254} {"train_loss": -7.93434476852417, "global_step": 42676, "epoch": 254} {"train_loss": -7.980297565460205, "global_step": 42677, "epoch": 254} {"train_loss": -8.1226806640625, "global_step": 42678, "epoch": 254} {"train_loss": -7.855630874633789, "global_step": 42679, "epoch": 254} {"train_loss": -7.787757873535156, "global_step": 42680, "epoch": 254} {"train_loss": -8.114269256591797, "global_step": 42681, "epoch": 254} {"train_loss": -8.05853271484375, "global_step": 42682, "epoch": 254} {"train_loss": -7.897669315338135, "global_step": 42683, "epoch": 254} {"train_loss": -8.021738052368164, "global_step": 42684, "epoch": 254} {"train_loss": -7.963010311126709, "global_step": 42685, "epoch": 254} {"train_loss": -8.192386627197266, "global_step": 42686, "epoch": 254} {"train_loss": -7.9741716384887695, "global_step": 42687, "epoch": 254} {"train_loss": -8.114340782165527, "global_step": 42688, "epoch": 254} {"train_loss": -8.221412658691406, "global_step": 42689, "epoch": 254} {"train_loss": -8.271987915039062, "global_step": 42690, "epoch": 254} {"train_loss": -8.115240097045898, "global_step": 42691, "epoch": 254} {"train_loss": -8.035934448242188, "global_step": 42692, "epoch": 254} {"train_loss": -8.166211128234863, "global_step": 42693, "epoch": 254} {"train_loss": -8.190910339355469, "global_step": 42694, "epoch": 254} {"train_loss": -8.155837059020996, "global_step": 42695, "epoch": 254} {"train_loss": -7.928500652313232, "global_step": 42696, "epoch": 254} {"train_loss": -8.282083511352539, "global_step": 42697, "epoch": 254} {"train_loss": -8.312051773071289, "global_step": 42698, "epoch": 254} {"train_loss": -7.892364501953125, "global_step": 42699, "epoch": 254} {"train_loss": -8.245317459106445, "global_step": 42700, "epoch": 254} {"train_loss": -8.151583671569824, "global_step": 42701, "epoch": 254} {"train_loss": -8.137556076049805, "global_step": 42702, "epoch": 254} {"train_loss": -8.265596389770508, "global_step": 42703, "epoch": 254} {"train_loss": -8.105790138244629, "global_step": 42704, "epoch": 254} {"train_loss": -8.374492645263672, "global_step": 42705, "epoch": 254} {"train_loss": -7.924189567565918, "global_step": 42706, "epoch": 254} {"train_loss": -8.260185241699219, "global_step": 42707, "epoch": 254} {"train_loss": -8.14116382598877, "global_step": 42708, "epoch": 254} {"train_loss": -8.367403984069824, "global_step": 42709, "epoch": 254} {"train_loss": -8.022367477416992, "global_step": 42710, "epoch": 254} {"train_loss": -8.345514297485352, "global_step": 42711, "epoch": 254} {"train_loss": -8.314435958862305, "global_step": 42712, "epoch": 254} {"train_loss": -8.076074600219727, "global_step": 42713, "epoch": 254} {"train_loss": -8.162271499633789, "global_step": 42714, "epoch": 254} {"train_loss": -8.343582153320312, "global_step": 42715, "epoch": 254} {"train_loss": -8.252961158752441, "global_step": 42716, "epoch": 254} {"train_loss": -7.890633583068848, "global_step": 42717, "epoch": 254} {"train_loss": -7.968976020812988, "global_step": 42718, "epoch": 254} {"train_loss": -8.204782485961914, "global_step": 42719, "epoch": 254} {"train_loss": -8.124199867248535, "global_step": 42720, "epoch": 254} {"train_loss": -8.035962104797363, "global_step": 42721, "epoch": 254} {"train_loss": -8.033317565917969, "global_step": 42722, "epoch": 254} {"train_loss": -8.231809616088867, "global_step": 42723, "epoch": 254} {"train_loss": -8.074505805969238, "global_step": 42724, "epoch": 254} {"train_loss": -8.170854568481445, "global_step": 42725, "epoch": 254} {"train_loss": -8.04027271270752, "global_step": 42726, "epoch": 254} {"train_loss": -8.127842903137207, "global_step": 42727, "epoch": 254} {"train_loss": -8.281665802001953, "global_step": 42728, "epoch": 254} {"train_loss": -8.053728103637695, "global_step": 42729, "epoch": 254} {"train_loss": -7.950087547302246, "global_step": 42730, "epoch": 254} {"train_loss": -8.08220100402832, "global_step": 42731, "epoch": 254} {"train_loss": -8.119518280029297, "global_step": 42732, "epoch": 254} {"train_loss": -7.966862201690674, "global_step": 42733, "epoch": 254} {"train_loss": -7.9425859451293945, "global_step": 42734, "epoch": 254} {"train_loss": -7.8693156242370605, "global_step": 42735, "epoch": 254} {"train_loss": -7.77452278137207, "global_step": 42736, "epoch": 254} {"train_loss": -7.888835906982422, "global_step": 42737, "epoch": 254} {"train_loss": -8.077054977416992, "global_step": 42738, "epoch": 254} {"train_loss": -7.702626705169678, "global_step": 42739, "epoch": 254} {"train_loss": -7.951421737670898, "global_step": 42740, "epoch": 254} {"train_loss": -7.9761176109313965, "global_step": 42741, "epoch": 254} {"train_loss": -7.674851417541504, "global_step": 42742, "epoch": 254} {"train_loss": -8.023519515991211, "global_step": 42743, "epoch": 254} {"train_loss": -7.98781156539917, "global_step": 42744, "epoch": 254} {"train_loss": -7.959142684936523, "global_step": 42745, "epoch": 254} {"train_loss": -8.060659408569336, "global_step": 42746, "epoch": 254} {"train_loss": -7.967313766479492, "global_step": 42747, "epoch": 254} {"train_loss": -7.737822532653809, "global_step": 42748, "epoch": 254} {"train_loss": -7.971902370452881, "global_step": 42749, "epoch": 254} {"train_loss": -8.011693000793457, "global_step": 42750, "epoch": 254} {"train_loss": -8.035781860351562, "global_step": 42751, "epoch": 254} {"train_loss": -7.879342079162598, "global_step": 42752, "epoch": 254} {"train_loss": -7.882796287536621, "global_step": 42753, "epoch": 254} {"train_loss": -7.731769561767578, "global_step": 42754, "epoch": 254} {"train_loss": -8.029448509216309, "global_step": 42755, "epoch": 254} {"train_loss": -7.808099269866943, "global_step": 42756, "epoch": 254} {"train_loss": -7.866143226623535, "global_step": 42757, "epoch": 254} {"train_loss": -7.956724166870117, "global_step": 42758, "epoch": 254} {"train_loss": -7.882523536682129, "global_step": 42759, "epoch": 254} {"train_loss": -7.750914573669434, "global_step": 42760, "epoch": 254} {"train_loss": -8.146568298339844, "global_step": 42761, "epoch": 254} {"train_loss": -8.043634414672852, "global_step": 42762, "epoch": 254} {"train_loss": -7.949180603027344, "global_step": 42763, "epoch": 254} {"train_loss": -7.816536903381348, "global_step": 42764, "epoch": 254} {"train_loss": -7.884659767150879, "global_step": 42765, "epoch": 254} {"train_loss": -7.992660045623779, "global_step": 42766, "epoch": 254} {"train_loss": -8.104047775268555, "global_step": 42767, "epoch": 254} {"train_loss": -7.958856582641602, "global_step": 42768, "epoch": 254} {"train_loss": -8.139737129211426, "global_step": 42769, "epoch": 254} {"train_loss": -8.273504257202148, "global_step": 42770, "epoch": 254} {"train_loss": -8.097843170166016, "global_step": 42771, "epoch": 254} {"train_loss": -8.108882904052734, "global_step": 42772, "epoch": 254} {"train_loss": -7.786942481994629, "global_step": 42773, "epoch": 254} {"train_loss": -7.965048313140869, "global_step": 42774, "epoch": 254} {"train_loss": -7.766345977783203, "global_step": 42775, "epoch": 254} {"train_loss": -7.832069396972656, "global_step": 42776, "epoch": 254} {"train_loss": -8.205286026000977, "global_step": 42777, "epoch": 254} {"train_loss": -7.950689315795898, "global_step": 42778, "epoch": 254} {"train_loss": -8.213547706604004, "global_step": 42779, "epoch": 254} {"train_loss": -8.12783432006836, "global_step": 42780, "epoch": 254} {"train_loss": -7.909996032714844, "global_step": 42781, "epoch": 254} {"train_loss": -8.096759796142578, "global_step": 42782, "epoch": 254} {"train_loss": -8.129531860351562, "global_step": 42783, "epoch": 254} {"train_loss": -8.205678939819336, "global_step": 42784, "epoch": 254} {"train_loss": -8.266073226928711, "global_step": 42785, "epoch": 254} {"train_loss": -8.083052635192871, "global_step": 42786, "epoch": 254} {"train_loss": -8.141767501831055, "global_step": 42787, "epoch": 254} {"train_loss": -7.802822589874268, "global_step": 42788, "epoch": 254} {"train_loss": -8.000547409057617, "global_step": 42789, "epoch": 254} {"train_loss": -8.067865371704102, "global_step": 42790, "epoch": 254} {"train_loss": -8.114513397216797, "global_step": 42791, "epoch": 254} {"train_loss": -8.044540405273438, "global_step": 42792, "epoch": 254} {"train_loss": -8.112039566040039, "global_step": 42793, "epoch": 254} {"train_loss": -7.798691749572754, "global_step": 42794, "epoch": 254} {"train_loss": -8.114179611206055, "global_step": 42795, "epoch": 254} {"train_loss": -8.264509201049805, "global_step": 42796, "epoch": 254} {"train_loss": -8.091673851013184, "global_step": 42797, "epoch": 254} {"train_loss": -7.9455108642578125, "global_step": 42798, "epoch": 254} {"train_loss": -8.162651062011719, "global_step": 42799, "epoch": 254} {"train_loss": -8.095428466796875, "global_step": 42800, "epoch": 254} {"train_loss": -7.9901933670043945, "global_step": 42801, "epoch": 254} {"train_loss": -8.051875114440918, "global_step": 42802, "epoch": 254} {"train_loss": -7.882024765014648, "global_step": 42803, "epoch": 254} {"train_loss": -8.251546859741211, "global_step": 42804, "epoch": 254} {"train_loss": -8.33493709564209, "global_step": 42805, "epoch": 254} {"train_loss": -8.172680854797363, "global_step": 42806, "epoch": 254} {"train_loss": -7.965593338012695, "global_step": 42807, "epoch": 254} {"train_loss": -8.073572158813477, "global_step": 42808, "epoch": 254} {"train_loss": -8.102850914001465, "global_step": 42809, "epoch": 254} {"train_loss": -8.162012100219727, "global_step": 42810, "epoch": 254} {"train_loss": -8.164408683776855, "global_step": 42811, "epoch": 254} {"train_loss": -8.12757396697998, "global_step": 42812, "epoch": 254} {"train_loss": -7.943760871887207, "global_step": 42813, "epoch": 254} {"train_loss": -8.099761009216309, "global_step": 42814, "epoch": 254} {"train_loss": -7.84575080871582, "global_step": 42815, "epoch": 254} {"train_loss": -8.170707702636719, "global_step": 42816, "epoch": 254} {"train_loss": -8.208568572998047, "global_step": 42817, "epoch": 254} {"train_loss": -7.965920448303223, "global_step": 42818, "epoch": 254} {"train_loss": -7.880135536193848, "global_step": 42819, "epoch": 254} {"train_loss": -8.102263450622559, "global_step": 42820, "epoch": 254} {"train_loss": -7.862260341644287, "global_step": 42821, "epoch": 254} {"train_loss": -8.228280067443848, "global_step": 42822, "epoch": 254} {"train_loss": -7.994455337524414, "global_step": 42823, "epoch": 254} {"train_loss": -7.867616176605225, "global_step": 42824, "epoch": 254} {"train_loss": -8.234731674194336, "global_step": 42825, "epoch": 254} {"train_loss": -7.984255790710449, "global_step": 42826, "epoch": 254} {"train_loss": -8.031060218811035, "global_step": 42827, "epoch": 254} {"train_loss": -8.04056453704834, "global_step": 42828, "epoch": 254} {"train_loss": -7.970556259155273, "global_step": 42829, "epoch": 254} {"train_loss": -7.916793346405029, "global_step": 42830, "epoch": 254} {"train_loss": -8.102100372314453, "global_step": 42831, "epoch": 254} {"train_loss": -8.053154945373535, "global_step": 42832, "epoch": 254} {"train_loss": -7.927128791809082, "global_step": 42833, "epoch": 254} {"train_loss": -7.991968631744385, "global_step": 42834, "epoch": 254} {"train_loss": -8.185196876525879, "global_step": 42835, "epoch": 254} {"train_loss": -8.025758743286133, "global_step": 42836, "epoch": 254} {"train_loss": -8.139204978942871, "global_step": 42837, "epoch": 254} {"train_loss": -8.166244506835938, "global_step": 42838, "epoch": 254} {"train_loss": -8.046323532149906, "global_step": 42839, "epoch": 254, "val_loss": 185857.96875} {"train_loss": -8.1303071975708, "global_step": 42840, "epoch": 255} {"train_loss": -7.917172431945801, "global_step": 42841, "epoch": 255} {"train_loss": -8.106395721435547, "global_step": 42842, "epoch": 255} {"train_loss": -8.030734062194824, "global_step": 42843, "epoch": 255} {"train_loss": -8.117916107177734, "global_step": 42844, "epoch": 255} {"train_loss": -7.950915813446045, "global_step": 42845, "epoch": 255} {"train_loss": -8.160438537597656, "global_step": 42846, "epoch": 255} {"train_loss": -8.243402481079102, "global_step": 42847, "epoch": 255} {"train_loss": -8.07715892791748, "global_step": 42848, "epoch": 255} {"train_loss": -8.025547981262207, "global_step": 42849, "epoch": 255} {"train_loss": -8.275882720947266, "global_step": 42850, "epoch": 255} {"train_loss": -8.088171005249023, "global_step": 42851, "epoch": 255} {"train_loss": -7.975888252258301, "global_step": 42852, "epoch": 255} {"train_loss": -8.10623550415039, "global_step": 42853, "epoch": 255} {"train_loss": -8.061090469360352, "global_step": 42854, "epoch": 255} {"train_loss": -8.034322738647461, "global_step": 42855, "epoch": 255} {"train_loss": -8.086807250976562, "global_step": 42856, "epoch": 255} {"train_loss": -8.044670104980469, "global_step": 42857, "epoch": 255} {"train_loss": -7.99758243560791, "global_step": 42858, "epoch": 255} {"train_loss": -8.000194549560547, "global_step": 42859, "epoch": 255} {"train_loss": -8.072904586791992, "global_step": 42860, "epoch": 255} {"train_loss": -8.156030654907227, "global_step": 42861, "epoch": 255} {"train_loss": -8.047496795654297, "global_step": 42862, "epoch": 255} {"train_loss": -7.662217140197754, "global_step": 42863, "epoch": 255} {"train_loss": -7.998150825500488, "global_step": 42864, "epoch": 255} {"train_loss": -7.912724018096924, "global_step": 42865, "epoch": 255} {"train_loss": -8.136022567749023, "global_step": 42866, "epoch": 255} {"train_loss": -7.935107231140137, "global_step": 42867, "epoch": 255} {"train_loss": -8.034595489501953, "global_step": 42868, "epoch": 255} {"train_loss": -7.981067180633545, "global_step": 42869, "epoch": 255} {"train_loss": -7.701523303985596, "global_step": 42870, "epoch": 255} {"train_loss": -7.887211799621582, "global_step": 42871, "epoch": 255} {"train_loss": -7.9673590660095215, "global_step": 42872, "epoch": 255} {"train_loss": -7.794356822967529, "global_step": 42873, "epoch": 255} {"train_loss": -7.991302490234375, "global_step": 42874, "epoch": 255} {"train_loss": -7.480025768280029, "global_step": 42875, "epoch": 255} {"train_loss": -8.234943389892578, "global_step": 42876, "epoch": 255} {"train_loss": -7.5622711181640625, "global_step": 42877, "epoch": 255} {"train_loss": -8.19013500213623, "global_step": 42878, "epoch": 255} {"train_loss": -7.82856559753418, "global_step": 42879, "epoch": 255} {"train_loss": -7.750471115112305, "global_step": 42880, "epoch": 255} {"train_loss": -7.946935653686523, "global_step": 42881, "epoch": 255} {"train_loss": -7.919808387756348, "global_step": 42882, "epoch": 255} {"train_loss": -7.856884956359863, "global_step": 42883, "epoch": 255} {"train_loss": -8.016497611999512, "global_step": 42884, "epoch": 255} {"train_loss": -7.997119426727295, "global_step": 42885, "epoch": 255} {"train_loss": -7.8824968338012695, "global_step": 42886, "epoch": 255} {"train_loss": -7.769830703735352, "global_step": 42887, "epoch": 255} {"train_loss": -7.924957275390625, "global_step": 42888, "epoch": 255} {"train_loss": -8.233946800231934, "global_step": 42889, "epoch": 255} {"train_loss": -8.061979293823242, "global_step": 42890, "epoch": 255} {"train_loss": -7.9992570877075195, "global_step": 42891, "epoch": 255} {"train_loss": -7.927084922790527, "global_step": 42892, "epoch": 255} {"train_loss": -8.010851860046387, "global_step": 42893, "epoch": 255} {"train_loss": -8.14834213256836, "global_step": 42894, "epoch": 255} {"train_loss": -8.091962814331055, "global_step": 42895, "epoch": 255} {"train_loss": -8.06553840637207, "global_step": 42896, "epoch": 255} {"train_loss": -8.147623062133789, "global_step": 42897, "epoch": 255} {"train_loss": -8.083166122436523, "global_step": 42898, "epoch": 255} {"train_loss": -7.95616340637207, "global_step": 42899, "epoch": 255} {"train_loss": -8.099837303161621, "global_step": 42900, "epoch": 255} {"train_loss": -8.136215209960938, "global_step": 42901, "epoch": 255} {"train_loss": -8.19218635559082, "global_step": 42902, "epoch": 255} {"train_loss": -8.043989181518555, "global_step": 42903, "epoch": 255} {"train_loss": -8.173097610473633, "global_step": 42904, "epoch": 255} {"train_loss": -8.106775283813477, "global_step": 42905, "epoch": 255} {"train_loss": -8.177217483520508, "global_step": 42906, "epoch": 255} {"train_loss": -8.207425117492676, "global_step": 42907, "epoch": 255} {"train_loss": -7.909650802612305, "global_step": 42908, "epoch": 255} {"train_loss": -8.282463073730469, "global_step": 42909, "epoch": 255} {"train_loss": -8.138839721679688, "global_step": 42910, "epoch": 255} {"train_loss": -8.07852554321289, "global_step": 42911, "epoch": 255} {"train_loss": -8.10093879699707, "global_step": 42912, "epoch": 255} {"train_loss": -7.996216297149658, "global_step": 42913, "epoch": 255} {"train_loss": -7.9212775230407715, "global_step": 42914, "epoch": 255} {"train_loss": -8.321969985961914, "global_step": 42915, "epoch": 255} {"train_loss": -7.995914459228516, "global_step": 42916, "epoch": 255} {"train_loss": -8.025800704956055, "global_step": 42917, "epoch": 255} {"train_loss": -7.807308197021484, "global_step": 42918, "epoch": 255} {"train_loss": -7.855217933654785, "global_step": 42919, "epoch": 255} {"train_loss": -7.835273265838623, "global_step": 42920, "epoch": 255} {"train_loss": -8.038015365600586, "global_step": 42921, "epoch": 255} {"train_loss": -7.903134822845459, "global_step": 42922, "epoch": 255} {"train_loss": -8.082012176513672, "global_step": 42923, "epoch": 255} {"train_loss": -8.038421630859375, "global_step": 42924, "epoch": 255} {"train_loss": -7.9280829429626465, "global_step": 42925, "epoch": 255} {"train_loss": -7.888873100280762, "global_step": 42926, "epoch": 255} {"train_loss": -8.016324996948242, "global_step": 42927, "epoch": 255} {"train_loss": -7.8173370361328125, "global_step": 42928, "epoch": 255} {"train_loss": -7.678834915161133, "global_step": 42929, "epoch": 255} {"train_loss": -7.9829511642456055, "global_step": 42930, "epoch": 255} {"train_loss": -8.033203125, "global_step": 42931, "epoch": 255} {"train_loss": -7.923375129699707, "global_step": 42932, "epoch": 255} {"train_loss": -8.085472106933594, "global_step": 42933, "epoch": 255} {"train_loss": -7.991071701049805, "global_step": 42934, "epoch": 255} {"train_loss": -8.000743865966797, "global_step": 42935, "epoch": 255} {"train_loss": -7.961958885192871, "global_step": 42936, "epoch": 255} {"train_loss": -8.124091148376465, "global_step": 42937, "epoch": 255} {"train_loss": -8.008804321289062, "global_step": 42938, "epoch": 255} {"train_loss": -8.055078506469727, "global_step": 42939, "epoch": 255} {"train_loss": -7.8887481689453125, "global_step": 42940, "epoch": 255} {"train_loss": -8.069347381591797, "global_step": 42941, "epoch": 255} {"train_loss": -7.848402976989746, "global_step": 42942, "epoch": 255} {"train_loss": -8.233360290527344, "global_step": 42943, "epoch": 255} {"train_loss": -8.076480865478516, "global_step": 42944, "epoch": 255} {"train_loss": -8.025932312011719, "global_step": 42945, "epoch": 255} {"train_loss": -8.122695922851562, "global_step": 42946, "epoch": 255} {"train_loss": -8.356924057006836, "global_step": 42947, "epoch": 255} {"train_loss": -8.286705017089844, "global_step": 42948, "epoch": 255} {"train_loss": -8.090164184570312, "global_step": 42949, "epoch": 255} {"train_loss": -8.270787239074707, "global_step": 42950, "epoch": 255} {"train_loss": -8.385432243347168, "global_step": 42951, "epoch": 255} {"train_loss": -8.305095672607422, "global_step": 42952, "epoch": 255} {"train_loss": -8.134839057922363, "global_step": 42953, "epoch": 255} {"train_loss": -8.228466033935547, "global_step": 42954, "epoch": 255} {"train_loss": -8.207316398620605, "global_step": 42955, "epoch": 255} {"train_loss": -8.263147354125977, "global_step": 42956, "epoch": 255} {"train_loss": -7.8484296798706055, "global_step": 42957, "epoch": 255} {"train_loss": -8.414854049682617, "global_step": 42958, "epoch": 255} {"train_loss": -8.006097793579102, "global_step": 42959, "epoch": 255} {"train_loss": -8.114715576171875, "global_step": 42960, "epoch": 255} {"train_loss": -8.365921020507812, "global_step": 42961, "epoch": 255} {"train_loss": -8.27114486694336, "global_step": 42962, "epoch": 255} {"train_loss": -8.026778221130371, "global_step": 42963, "epoch": 255} {"train_loss": -8.036575317382812, "global_step": 42964, "epoch": 255} {"train_loss": -8.136509895324707, "global_step": 42965, "epoch": 255} {"train_loss": -8.18197250366211, "global_step": 42966, "epoch": 255} {"train_loss": -8.149255752563477, "global_step": 42967, "epoch": 255} {"train_loss": -7.9778947830200195, "global_step": 42968, "epoch": 255} {"train_loss": -8.14664363861084, "global_step": 42969, "epoch": 255} {"train_loss": -8.085280418395996, "global_step": 42970, "epoch": 255} {"train_loss": -8.202495574951172, "global_step": 42971, "epoch": 255} {"train_loss": -8.166975021362305, "global_step": 42972, "epoch": 255} {"train_loss": -8.238838195800781, "global_step": 42973, "epoch": 255} {"train_loss": -8.13300609588623, "global_step": 42974, "epoch": 255} {"train_loss": -8.098155975341797, "global_step": 42975, "epoch": 255} {"train_loss": -8.089399337768555, "global_step": 42976, "epoch": 255} {"train_loss": -8.168030738830566, "global_step": 42977, "epoch": 255} {"train_loss": -8.163627624511719, "global_step": 42978, "epoch": 255} {"train_loss": -8.12509536743164, "global_step": 42979, "epoch": 255} {"train_loss": -8.186266899108887, "global_step": 42980, "epoch": 255} {"train_loss": -8.147539138793945, "global_step": 42981, "epoch": 255} {"train_loss": -8.00655460357666, "global_step": 42982, "epoch": 255} {"train_loss": -7.971562385559082, "global_step": 42983, "epoch": 255} {"train_loss": -7.810666084289551, "global_step": 42984, "epoch": 255} {"train_loss": -8.082653999328613, "global_step": 42985, "epoch": 255} {"train_loss": -8.069245338439941, "global_step": 42986, "epoch": 255} {"train_loss": -8.142839431762695, "global_step": 42987, "epoch": 255} {"train_loss": -7.845945835113525, "global_step": 42988, "epoch": 255} {"train_loss": -7.861865997314453, "global_step": 42989, "epoch": 255} {"train_loss": -8.060709953308105, "global_step": 42990, "epoch": 255} {"train_loss": -7.980227470397949, "global_step": 42991, "epoch": 255} {"train_loss": -7.840398788452148, "global_step": 42992, "epoch": 255} {"train_loss": -8.00412368774414, "global_step": 42993, "epoch": 255} {"train_loss": -7.858757495880127, "global_step": 42994, "epoch": 255} {"train_loss": -7.446102142333984, "global_step": 42995, "epoch": 255} {"train_loss": -7.588488578796387, "global_step": 42996, "epoch": 255} {"train_loss": -8.137200355529785, "global_step": 42997, "epoch": 255} {"train_loss": -7.877906799316406, "global_step": 42998, "epoch": 255} {"train_loss": -7.990097999572754, "global_step": 42999, "epoch": 255} {"train_loss": -7.7068376541137695, "global_step": 43000, "epoch": 255} {"train_loss": -7.609400749206543, "global_step": 43001, "epoch": 255} {"train_loss": -7.764174461364746, "global_step": 43002, "epoch": 255} {"train_loss": -7.737622261047363, "global_step": 43003, "epoch": 255} {"train_loss": -7.913094997406006, "global_step": 43004, "epoch": 255} {"train_loss": -7.912731170654297, "global_step": 43005, "epoch": 255} {"train_loss": -8.088924407958984, "global_step": 43006, "epoch": 255} {"train_loss": -8.024078723930177, "global_step": 43007, "epoch": 255, "val_loss": 185828.515625, "train_action_mse_error": 7.131828784942627} {"train_loss": -7.9112372398376465, "global_step": 43008, "epoch": 256} {"train_loss": -7.810842037200928, "global_step": 43009, "epoch": 256} {"train_loss": -7.800811290740967, "global_step": 43010, "epoch": 256} {"train_loss": -7.753668785095215, "global_step": 43011, "epoch": 256} {"train_loss": -8.066893577575684, "global_step": 43012, "epoch": 256} {"train_loss": -7.64800500869751, "global_step": 43013, "epoch": 256} {"train_loss": -8.025832176208496, "global_step": 43014, "epoch": 256} {"train_loss": -8.039894104003906, "global_step": 43015, "epoch": 256} {"train_loss": -7.775361061096191, "global_step": 43016, "epoch": 256} {"train_loss": -7.786410331726074, "global_step": 43017, "epoch": 256} {"train_loss": -7.777805328369141, "global_step": 43018, "epoch": 256} {"train_loss": -7.8117547035217285, "global_step": 43019, "epoch": 256} {"train_loss": -7.978711128234863, "global_step": 43020, "epoch": 256} {"train_loss": -7.761229515075684, "global_step": 43021, "epoch": 256} {"train_loss": -7.784786224365234, "global_step": 43022, "epoch": 256} {"train_loss": -8.221148490905762, "global_step": 43023, "epoch": 256} {"train_loss": -8.160806655883789, "global_step": 43024, "epoch": 256} {"train_loss": -7.976052284240723, "global_step": 43025, "epoch": 256} {"train_loss": -7.990381240844727, "global_step": 43026, "epoch": 256} {"train_loss": -8.01914119720459, "global_step": 43027, "epoch": 256} {"train_loss": -7.941072463989258, "global_step": 43028, "epoch": 256} {"train_loss": -8.039888381958008, "global_step": 43029, "epoch": 256} {"train_loss": -7.672369480133057, "global_step": 43030, "epoch": 256} {"train_loss": -8.039283752441406, "global_step": 43031, "epoch": 256} {"train_loss": -7.854886054992676, "global_step": 43032, "epoch": 256} {"train_loss": -8.105667114257812, "global_step": 43033, "epoch": 256} {"train_loss": -7.963813304901123, "global_step": 43034, "epoch": 256} {"train_loss": -7.907017707824707, "global_step": 43035, "epoch": 256} {"train_loss": -7.942556381225586, "global_step": 43036, "epoch": 256} {"train_loss": -7.9447126388549805, "global_step": 43037, "epoch": 256} {"train_loss": -8.153512954711914, "global_step": 43038, "epoch": 256} {"train_loss": -8.02981948852539, "global_step": 43039, "epoch": 256} {"train_loss": -7.83611536026001, "global_step": 43040, "epoch": 256} {"train_loss": -8.117044448852539, "global_step": 43041, "epoch": 256} {"train_loss": -7.832801342010498, "global_step": 43042, "epoch": 256} {"train_loss": -8.005395889282227, "global_step": 43043, "epoch": 256} {"train_loss": -7.783207893371582, "global_step": 43044, "epoch": 256} {"train_loss": -8.12480640411377, "global_step": 43045, "epoch": 256} {"train_loss": -8.111948013305664, "global_step": 43046, "epoch": 256} {"train_loss": -7.941015243530273, "global_step": 43047, "epoch": 256} {"train_loss": -8.136547088623047, "global_step": 43048, "epoch": 256} {"train_loss": -8.153532028198242, "global_step": 43049, "epoch": 256} {"train_loss": -7.8867292404174805, "global_step": 43050, "epoch": 256} {"train_loss": -8.133727073669434, "global_step": 43051, "epoch": 256} {"train_loss": -8.125330924987793, "global_step": 43052, "epoch": 256} {"train_loss": -7.878629207611084, "global_step": 43053, "epoch": 256} {"train_loss": -8.018243789672852, "global_step": 43054, "epoch": 256} {"train_loss": -8.074224472045898, "global_step": 43055, "epoch": 256} {"train_loss": -7.922353744506836, "global_step": 43056, "epoch": 256} {"train_loss": -7.989188194274902, "global_step": 43057, "epoch": 256} {"train_loss": -7.918757438659668, "global_step": 43058, "epoch": 256} {"train_loss": -8.126411437988281, "global_step": 43059, "epoch": 256} {"train_loss": -8.09715747833252, "global_step": 43060, "epoch": 256} {"train_loss": -8.104074478149414, "global_step": 43061, "epoch": 256} {"train_loss": -7.9908576011657715, "global_step": 43062, "epoch": 256} {"train_loss": -7.961610317230225, "global_step": 43063, "epoch": 256} {"train_loss": -7.965044021606445, "global_step": 43064, "epoch": 256} {"train_loss": -8.091630935668945, "global_step": 43065, "epoch": 256} {"train_loss": -8.021221160888672, "global_step": 43066, "epoch": 256} {"train_loss": -7.908808708190918, "global_step": 43067, "epoch": 256} {"train_loss": -8.067399024963379, "global_step": 43068, "epoch": 256} {"train_loss": -8.049100875854492, "global_step": 43069, "epoch": 256} {"train_loss": -8.074827194213867, "global_step": 43070, "epoch": 256} {"train_loss": -8.01150131225586, "global_step": 43071, "epoch": 256} {"train_loss": -8.07293701171875, "global_step": 43072, "epoch": 256} {"train_loss": -8.218022346496582, "global_step": 43073, "epoch": 256} {"train_loss": -8.036369323730469, "global_step": 43074, "epoch": 256} {"train_loss": -8.126049041748047, "global_step": 43075, "epoch": 256} {"train_loss": -8.050284385681152, "global_step": 43076, "epoch": 256} {"train_loss": -8.070751190185547, "global_step": 43077, "epoch": 256} {"train_loss": -8.319668769836426, "global_step": 43078, "epoch": 256} {"train_loss": -8.411121368408203, "global_step": 43079, "epoch": 256} {"train_loss": -8.358131408691406, "global_step": 43080, "epoch": 256} {"train_loss": -8.16840648651123, "global_step": 43081, "epoch": 256} {"train_loss": -8.136716842651367, "global_step": 43082, "epoch": 256} {"train_loss": -8.180841445922852, "global_step": 43083, "epoch": 256} {"train_loss": -8.217628479003906, "global_step": 43084, "epoch": 256} {"train_loss": -8.229507446289062, "global_step": 43085, "epoch": 256} {"train_loss": -8.383678436279297, "global_step": 43086, "epoch": 256} {"train_loss": -8.255148887634277, "global_step": 43087, "epoch": 256} {"train_loss": -8.00990104675293, "global_step": 43088, "epoch": 256} {"train_loss": -8.003325462341309, "global_step": 43089, "epoch": 256} {"train_loss": -8.244794845581055, "global_step": 43090, "epoch": 256} {"train_loss": -8.154817581176758, "global_step": 43091, "epoch": 256} {"train_loss": -7.995354175567627, "global_step": 43092, "epoch": 256} {"train_loss": -8.246072769165039, "global_step": 43093, "epoch": 256} {"train_loss": -7.870978355407715, "global_step": 43094, "epoch": 256} {"train_loss": -8.111806869506836, "global_step": 43095, "epoch": 256} {"train_loss": -7.960968971252441, "global_step": 43096, "epoch": 256} {"train_loss": -7.883299827575684, "global_step": 43097, "epoch": 256} {"train_loss": -7.987899303436279, "global_step": 43098, "epoch": 256} {"train_loss": -7.9411234855651855, "global_step": 43099, "epoch": 256} {"train_loss": -7.779794692993164, "global_step": 43100, "epoch": 256} {"train_loss": -7.600852966308594, "global_step": 43101, "epoch": 256} {"train_loss": -8.017963409423828, "global_step": 43102, "epoch": 256} {"train_loss": -8.0064697265625, "global_step": 43103, "epoch": 256} {"train_loss": -8.129745483398438, "global_step": 43104, "epoch": 256} {"train_loss": -7.937178611755371, "global_step": 43105, "epoch": 256} {"train_loss": -7.9598307609558105, "global_step": 43106, "epoch": 256} {"train_loss": -7.975601673126221, "global_step": 43107, "epoch": 256} {"train_loss": -7.970612049102783, "global_step": 43108, "epoch": 256} {"train_loss": -8.097461700439453, "global_step": 43109, "epoch": 256} {"train_loss": -7.703413009643555, "global_step": 43110, "epoch": 256} {"train_loss": -8.023407936096191, "global_step": 43111, "epoch": 256} {"train_loss": -7.761563301086426, "global_step": 43112, "epoch": 256} {"train_loss": -7.816194534301758, "global_step": 43113, "epoch": 256} {"train_loss": -8.173397064208984, "global_step": 43114, "epoch": 256} {"train_loss": -7.891659736633301, "global_step": 43115, "epoch": 256} {"train_loss": -8.058725357055664, "global_step": 43116, "epoch": 256} {"train_loss": -8.043309211730957, "global_step": 43117, "epoch": 256} {"train_loss": -8.055733680725098, "global_step": 43118, "epoch": 256} {"train_loss": -8.208148002624512, "global_step": 43119, "epoch": 256} {"train_loss": -8.032483100891113, "global_step": 43120, "epoch": 256} {"train_loss": -8.300642013549805, "global_step": 43121, "epoch": 256} {"train_loss": -7.962634563446045, "global_step": 43122, "epoch": 256} {"train_loss": -8.145055770874023, "global_step": 43123, "epoch": 256} {"train_loss": -8.042036056518555, "global_step": 43124, "epoch": 256} {"train_loss": -8.237714767456055, "global_step": 43125, "epoch": 256} {"train_loss": -7.818774700164795, "global_step": 43126, "epoch": 256} {"train_loss": -8.024290084838867, "global_step": 43127, "epoch": 256} {"train_loss": -8.02285385131836, "global_step": 43128, "epoch": 256} {"train_loss": -8.04664421081543, "global_step": 43129, "epoch": 256} {"train_loss": -8.35232925415039, "global_step": 43130, "epoch": 256} {"train_loss": -8.258329391479492, "global_step": 43131, "epoch": 256} {"train_loss": -8.317532539367676, "global_step": 43132, "epoch": 256} {"train_loss": -8.108478546142578, "global_step": 43133, "epoch": 256} {"train_loss": -8.48190689086914, "global_step": 43134, "epoch": 256} {"train_loss": -8.359285354614258, "global_step": 43135, "epoch": 256} {"train_loss": -8.335409164428711, "global_step": 43136, "epoch": 256} {"train_loss": -7.962190628051758, "global_step": 43137, "epoch": 256} {"train_loss": -8.181013107299805, "global_step": 43138, "epoch": 256} {"train_loss": -8.149113655090332, "global_step": 43139, "epoch": 256} {"train_loss": -8.289396286010742, "global_step": 43140, "epoch": 256} {"train_loss": -8.022639274597168, "global_step": 43141, "epoch": 256} {"train_loss": -8.301764488220215, "global_step": 43142, "epoch": 256} {"train_loss": -8.130088806152344, "global_step": 43143, "epoch": 256} {"train_loss": -8.185851097106934, "global_step": 43144, "epoch": 256} {"train_loss": -8.271784782409668, "global_step": 43145, "epoch": 256} {"train_loss": -8.174661636352539, "global_step": 43146, "epoch": 256} {"train_loss": -8.217767715454102, "global_step": 43147, "epoch": 256} {"train_loss": -8.181459426879883, "global_step": 43148, "epoch": 256} {"train_loss": -8.035213470458984, "global_step": 43149, "epoch": 256} {"train_loss": -7.919837474822998, "global_step": 43150, "epoch": 256} {"train_loss": -8.016890525817871, "global_step": 43151, "epoch": 256} {"train_loss": -7.998481750488281, "global_step": 43152, "epoch": 256} {"train_loss": -7.871868133544922, "global_step": 43153, "epoch": 256} {"train_loss": -7.92584228515625, "global_step": 43154, "epoch": 256} {"train_loss": -7.716796875, "global_step": 43155, "epoch": 256} {"train_loss": -7.956180095672607, "global_step": 43156, "epoch": 256} {"train_loss": -7.658018589019775, "global_step": 43157, "epoch": 256} {"train_loss": -8.210826873779297, "global_step": 43158, "epoch": 256} {"train_loss": -8.03531265258789, "global_step": 43159, "epoch": 256} {"train_loss": -7.988541603088379, "global_step": 43160, "epoch": 256} {"train_loss": -8.041366577148438, "global_step": 43161, "epoch": 256} {"train_loss": -8.068717002868652, "global_step": 43162, "epoch": 256} {"train_loss": -7.891555309295654, "global_step": 43163, "epoch": 256} {"train_loss": -7.987465858459473, "global_step": 43164, "epoch": 256} {"train_loss": -7.897919654846191, "global_step": 43165, "epoch": 256} {"train_loss": -7.9146409034729, "global_step": 43166, "epoch": 256} {"train_loss": -7.98600959777832, "global_step": 43167, "epoch": 256} {"train_loss": -7.947719573974609, "global_step": 43168, "epoch": 256} {"train_loss": -7.893374443054199, "global_step": 43169, "epoch": 256} {"train_loss": -8.084636688232422, "global_step": 43170, "epoch": 256} {"train_loss": -8.096614837646484, "global_step": 43171, "epoch": 256} {"train_loss": -8.086484909057617, "global_step": 43172, "epoch": 256} {"train_loss": -8.085112571716309, "global_step": 43173, "epoch": 256} {"train_loss": -8.019947052001953, "global_step": 43174, "epoch": 256} {"train_loss": -8.031851152578989, "global_step": 43175, "epoch": 256, "val_loss": 188991.5625} {"train_loss": -8.063044548034668, "global_step": 43176, "epoch": 257} {"train_loss": -8.037744522094727, "global_step": 43177, "epoch": 257} {"train_loss": -7.974836826324463, "global_step": 43178, "epoch": 257} {"train_loss": -8.139689445495605, "global_step": 43179, "epoch": 257} {"train_loss": -8.134683609008789, "global_step": 43180, "epoch": 257} {"train_loss": -8.25407886505127, "global_step": 43181, "epoch": 257} {"train_loss": -8.190865516662598, "global_step": 43182, "epoch": 257} {"train_loss": -8.107677459716797, "global_step": 43183, "epoch": 257} {"train_loss": -8.021982192993164, "global_step": 43184, "epoch": 257} {"train_loss": -8.170902252197266, "global_step": 43185, "epoch": 257} {"train_loss": -8.084030151367188, "global_step": 43186, "epoch": 257} {"train_loss": -8.019691467285156, "global_step": 43187, "epoch": 257} {"train_loss": -7.910806179046631, "global_step": 43188, "epoch": 257} {"train_loss": -8.062381744384766, "global_step": 43189, "epoch": 257} {"train_loss": -7.9261794090271, "global_step": 43190, "epoch": 257} {"train_loss": -7.998950958251953, "global_step": 43191, "epoch": 257} {"train_loss": -7.678764343261719, "global_step": 43192, "epoch": 257} {"train_loss": -8.0425443649292, "global_step": 43193, "epoch": 257} {"train_loss": -7.779373645782471, "global_step": 43194, "epoch": 257} {"train_loss": -8.082786560058594, "global_step": 43195, "epoch": 257} {"train_loss": -7.750884056091309, "global_step": 43196, "epoch": 257} {"train_loss": -8.1729736328125, "global_step": 43197, "epoch": 257} {"train_loss": -7.782064437866211, "global_step": 43198, "epoch": 257} {"train_loss": -7.965023517608643, "global_step": 43199, "epoch": 257} {"train_loss": -8.016738891601562, "global_step": 43200, "epoch": 257} {"train_loss": -8.215389251708984, "global_step": 43201, "epoch": 257} {"train_loss": -8.008871078491211, "global_step": 43202, "epoch": 257} {"train_loss": -7.982673645019531, "global_step": 43203, "epoch": 257} {"train_loss": -7.856882095336914, "global_step": 43204, "epoch": 257} {"train_loss": -8.131155967712402, "global_step": 43205, "epoch": 257} {"train_loss": -8.034423828125, "global_step": 43206, "epoch": 257} {"train_loss": -8.063238143920898, "global_step": 43207, "epoch": 257} {"train_loss": -7.8424787521362305, "global_step": 43208, "epoch": 257} {"train_loss": -8.015931129455566, "global_step": 43209, "epoch": 257} {"train_loss": -8.0358247756958, "global_step": 43210, "epoch": 257} {"train_loss": -8.063268661499023, "global_step": 43211, "epoch": 257} {"train_loss": -7.774646282196045, "global_step": 43212, "epoch": 257} {"train_loss": -8.100540161132812, "global_step": 43213, "epoch": 257} {"train_loss": -8.005111694335938, "global_step": 43214, "epoch": 257} {"train_loss": -7.819860458374023, "global_step": 43215, "epoch": 257} {"train_loss": -8.05203914642334, "global_step": 43216, "epoch": 257} {"train_loss": -7.782964706420898, "global_step": 43217, "epoch": 257} {"train_loss": -8.179085731506348, "global_step": 43218, "epoch": 257} {"train_loss": -7.673799514770508, "global_step": 43219, "epoch": 257} {"train_loss": -8.011634826660156, "global_step": 43220, "epoch": 257} {"train_loss": -7.887584686279297, "global_step": 43221, "epoch": 257} {"train_loss": -7.9096479415893555, "global_step": 43222, "epoch": 257} {"train_loss": -7.9991912841796875, "global_step": 43223, "epoch": 257} {"train_loss": -7.87052583694458, "global_step": 43224, "epoch": 257} {"train_loss": -7.894081115722656, "global_step": 43225, "epoch": 257} {"train_loss": -7.915931701660156, "global_step": 43226, "epoch": 257} {"train_loss": -8.042458534240723, "global_step": 43227, "epoch": 257} {"train_loss": -8.000741958618164, "global_step": 43228, "epoch": 257} {"train_loss": -8.023191452026367, "global_step": 43229, "epoch": 257} {"train_loss": -8.085317611694336, "global_step": 43230, "epoch": 257} {"train_loss": -7.916847229003906, "global_step": 43231, "epoch": 257} {"train_loss": -8.06463623046875, "global_step": 43232, "epoch": 257} {"train_loss": -8.066572189331055, "global_step": 43233, "epoch": 257} {"train_loss": -8.040619850158691, "global_step": 43234, "epoch": 257} {"train_loss": -8.10722827911377, "global_step": 43235, "epoch": 257} {"train_loss": -7.890959739685059, "global_step": 43236, "epoch": 257} {"train_loss": -7.970623016357422, "global_step": 43237, "epoch": 257} {"train_loss": -8.132026672363281, "global_step": 43238, "epoch": 257} {"train_loss": -7.706618785858154, "global_step": 43239, "epoch": 257} {"train_loss": -8.167659759521484, "global_step": 43240, "epoch": 257} {"train_loss": -7.926825523376465, "global_step": 43241, "epoch": 257} {"train_loss": -8.060389518737793, "global_step": 43242, "epoch": 257} {"train_loss": -7.933669090270996, "global_step": 43243, "epoch": 257} {"train_loss": -8.060227394104004, "global_step": 43244, "epoch": 257} {"train_loss": -7.883199691772461, "global_step": 43245, "epoch": 257} {"train_loss": -7.873584747314453, "global_step": 43246, "epoch": 257} {"train_loss": -8.076692581176758, "global_step": 43247, "epoch": 257} {"train_loss": -8.072824478149414, "global_step": 43248, "epoch": 257} {"train_loss": -7.88252592086792, "global_step": 43249, "epoch": 257} {"train_loss": -8.075157165527344, "global_step": 43250, "epoch": 257} {"train_loss": -8.101114273071289, "global_step": 43251, "epoch": 257} {"train_loss": -7.999345302581787, "global_step": 43252, "epoch": 257} {"train_loss": -7.901012897491455, "global_step": 43253, "epoch": 257} {"train_loss": -8.170645713806152, "global_step": 43254, "epoch": 257} {"train_loss": -7.786015033721924, "global_step": 43255, "epoch": 257} {"train_loss": -8.217053413391113, "global_step": 43256, "epoch": 257} {"train_loss": -7.993515968322754, "global_step": 43257, "epoch": 257} {"train_loss": -8.126124382019043, "global_step": 43258, "epoch": 257} {"train_loss": -7.825936794281006, "global_step": 43259, "epoch": 257} {"train_loss": -8.109155654907227, "global_step": 43260, "epoch": 257} {"train_loss": -8.064773559570312, "global_step": 43261, "epoch": 257} {"train_loss": -8.28890609741211, "global_step": 43262, "epoch": 257} {"train_loss": -7.82291316986084, "global_step": 43263, "epoch": 257} {"train_loss": -8.234138488769531, "global_step": 43264, "epoch": 257} {"train_loss": -7.942794322967529, "global_step": 43265, "epoch": 257} {"train_loss": -8.272955894470215, "global_step": 43266, "epoch": 257} {"train_loss": -7.742181777954102, "global_step": 43267, "epoch": 257} {"train_loss": -8.042495727539062, "global_step": 43268, "epoch": 257} {"train_loss": -7.934133529663086, "global_step": 43269, "epoch": 257} {"train_loss": -8.046671867370605, "global_step": 43270, "epoch": 257} {"train_loss": -7.83821964263916, "global_step": 43271, "epoch": 257} {"train_loss": -7.879600524902344, "global_step": 43272, "epoch": 257} {"train_loss": -8.046914100646973, "global_step": 43273, "epoch": 257} {"train_loss": -7.989280700683594, "global_step": 43274, "epoch": 257} {"train_loss": -7.87089729309082, "global_step": 43275, "epoch": 257} {"train_loss": -7.934706687927246, "global_step": 43276, "epoch": 257} {"train_loss": -7.681077480316162, "global_step": 43277, "epoch": 257} {"train_loss": -7.993870735168457, "global_step": 43278, "epoch": 257} {"train_loss": -7.893650054931641, "global_step": 43279, "epoch": 257} {"train_loss": -7.85903787612915, "global_step": 43280, "epoch": 257} {"train_loss": -7.918722629547119, "global_step": 43281, "epoch": 257} {"train_loss": -8.048528671264648, "global_step": 43282, "epoch": 257} {"train_loss": -7.955591678619385, "global_step": 43283, "epoch": 257} {"train_loss": -7.981135368347168, "global_step": 43284, "epoch": 257} {"train_loss": -7.87314510345459, "global_step": 43285, "epoch": 257} {"train_loss": -8.07956314086914, "global_step": 43286, "epoch": 257} {"train_loss": -8.014711380004883, "global_step": 43287, "epoch": 257} {"train_loss": -8.245439529418945, "global_step": 43288, "epoch": 257} {"train_loss": -7.68222713470459, "global_step": 43289, "epoch": 257} {"train_loss": -8.078872680664062, "global_step": 43290, "epoch": 257} {"train_loss": -8.173255920410156, "global_step": 43291, "epoch": 257} {"train_loss": -8.02273941040039, "global_step": 43292, "epoch": 257} {"train_loss": -8.14728832244873, "global_step": 43293, "epoch": 257} {"train_loss": -8.060403823852539, "global_step": 43294, "epoch": 257} {"train_loss": -8.219449043273926, "global_step": 43295, "epoch": 257} {"train_loss": -8.14228343963623, "global_step": 43296, "epoch": 257} {"train_loss": -8.263660430908203, "global_step": 43297, "epoch": 257} {"train_loss": -8.169649124145508, "global_step": 43298, "epoch": 257} {"train_loss": -8.155139923095703, "global_step": 43299, "epoch": 257} {"train_loss": -8.060029983520508, "global_step": 43300, "epoch": 257} {"train_loss": -8.160661697387695, "global_step": 43301, "epoch": 257} {"train_loss": -7.982434272766113, "global_step": 43302, "epoch": 257} {"train_loss": -8.120931625366211, "global_step": 43303, "epoch": 257} {"train_loss": -8.031806945800781, "global_step": 43304, "epoch": 257} {"train_loss": -7.96518087387085, "global_step": 43305, "epoch": 257} {"train_loss": -8.037532806396484, "global_step": 43306, "epoch": 257} {"train_loss": -8.202102661132812, "global_step": 43307, "epoch": 257} {"train_loss": -7.775541305541992, "global_step": 43308, "epoch": 257} {"train_loss": -7.968430519104004, "global_step": 43309, "epoch": 257} {"train_loss": -8.111594200134277, "global_step": 43310, "epoch": 257} {"train_loss": -7.986415386199951, "global_step": 43311, "epoch": 257} {"train_loss": -8.103466033935547, "global_step": 43312, "epoch": 257} {"train_loss": -8.163698196411133, "global_step": 43313, "epoch": 257} {"train_loss": -7.935347557067871, "global_step": 43314, "epoch": 257} {"train_loss": -8.129365921020508, "global_step": 43315, "epoch": 257} {"train_loss": -8.13653564453125, "global_step": 43316, "epoch": 257} {"train_loss": -8.142566680908203, "global_step": 43317, "epoch": 257} {"train_loss": -8.140026092529297, "global_step": 43318, "epoch": 257} {"train_loss": -8.172708511352539, "global_step": 43319, "epoch": 257} {"train_loss": -8.20074462890625, "global_step": 43320, "epoch": 257} {"train_loss": -8.018437385559082, "global_step": 43321, "epoch": 257} {"train_loss": -8.022382736206055, "global_step": 43322, "epoch": 257} {"train_loss": -8.189265251159668, "global_step": 43323, "epoch": 257} {"train_loss": -8.167908668518066, "global_step": 43324, "epoch": 257} {"train_loss": -7.772156715393066, "global_step": 43325, "epoch": 257} {"train_loss": -7.975561618804932, "global_step": 43326, "epoch": 257} {"train_loss": -8.051475524902344, "global_step": 43327, "epoch": 257} {"train_loss": -7.893808364868164, "global_step": 43328, "epoch": 257} {"train_loss": -8.07401180267334, "global_step": 43329, "epoch": 257} {"train_loss": -7.8396100997924805, "global_step": 43330, "epoch": 257} {"train_loss": -8.040507316589355, "global_step": 43331, "epoch": 257} {"train_loss": -7.90161657333374, "global_step": 43332, "epoch": 257} {"train_loss": -8.151086807250977, "global_step": 43333, "epoch": 257} {"train_loss": -7.935262680053711, "global_step": 43334, "epoch": 257} {"train_loss": -8.045191764831543, "global_step": 43335, "epoch": 257} {"train_loss": -8.129810333251953, "global_step": 43336, "epoch": 257} {"train_loss": -8.109993934631348, "global_step": 43337, "epoch": 257} {"train_loss": -8.173739433288574, "global_step": 43338, "epoch": 257} {"train_loss": -8.128867149353027, "global_step": 43339, "epoch": 257} {"train_loss": -7.9709906578063965, "global_step": 43340, "epoch": 257} {"train_loss": -8.038257598876953, "global_step": 43341, "epoch": 257} {"train_loss": -8.20565414428711, "global_step": 43342, "epoch": 257} {"train_loss": -8.017386507420312, "global_step": 43343, "epoch": 257, "val_loss": 187433.859375} {"train_loss": -8.190220832824707, "global_step": 43344, "epoch": 258} {"train_loss": -8.136544227600098, "global_step": 43345, "epoch": 258} {"train_loss": -8.088055610656738, "global_step": 43346, "epoch": 258} {"train_loss": -8.330179214477539, "global_step": 43347, "epoch": 258} {"train_loss": -8.276590347290039, "global_step": 43348, "epoch": 258} {"train_loss": -7.860550880432129, "global_step": 43349, "epoch": 258} {"train_loss": -8.114641189575195, "global_step": 43350, "epoch": 258} {"train_loss": -8.33549976348877, "global_step": 43351, "epoch": 258} {"train_loss": -8.23878288269043, "global_step": 43352, "epoch": 258} {"train_loss": -8.098869323730469, "global_step": 43353, "epoch": 258} {"train_loss": -8.304988861083984, "global_step": 43354, "epoch": 258} {"train_loss": -8.083489418029785, "global_step": 43355, "epoch": 258} {"train_loss": -8.17294979095459, "global_step": 43356, "epoch": 258} {"train_loss": -8.055564880371094, "global_step": 43357, "epoch": 258} {"train_loss": -8.061826705932617, "global_step": 43358, "epoch": 258} {"train_loss": -7.957485198974609, "global_step": 43359, "epoch": 258} {"train_loss": -8.07107925415039, "global_step": 43360, "epoch": 258} {"train_loss": -7.810879707336426, "global_step": 43361, "epoch": 258} {"train_loss": -8.34136962890625, "global_step": 43362, "epoch": 258} {"train_loss": -8.081975936889648, "global_step": 43363, "epoch": 258} {"train_loss": -8.040031433105469, "global_step": 43364, "epoch": 258} {"train_loss": -8.21445369720459, "global_step": 43365, "epoch": 258} {"train_loss": -8.227191925048828, "global_step": 43366, "epoch": 258} {"train_loss": -8.320581436157227, "global_step": 43367, "epoch": 258} {"train_loss": -7.926596641540527, "global_step": 43368, "epoch": 258} {"train_loss": -7.977232933044434, "global_step": 43369, "epoch": 258} {"train_loss": -7.908473968505859, "global_step": 43370, "epoch": 258} {"train_loss": -7.9834747314453125, "global_step": 43371, "epoch": 258} {"train_loss": -7.785739898681641, "global_step": 43372, "epoch": 258} {"train_loss": -8.01620101928711, "global_step": 43373, "epoch": 258} {"train_loss": -7.80678129196167, "global_step": 43374, "epoch": 258} {"train_loss": -8.05905532836914, "global_step": 43375, "epoch": 258} {"train_loss": -7.7823486328125, "global_step": 43376, "epoch": 258} {"train_loss": -8.031760215759277, "global_step": 43377, "epoch": 258} {"train_loss": -7.6714582443237305, "global_step": 43378, "epoch": 258} {"train_loss": -7.84114933013916, "global_step": 43379, "epoch": 258} {"train_loss": -7.907403945922852, "global_step": 43380, "epoch": 258} {"train_loss": -7.9587178230285645, "global_step": 43381, "epoch": 258} {"train_loss": -7.758772850036621, "global_step": 43382, "epoch": 258} {"train_loss": -7.867079734802246, "global_step": 43383, "epoch": 258} {"train_loss": -7.991003513336182, "global_step": 43384, "epoch": 258} {"train_loss": -7.877333641052246, "global_step": 43385, "epoch": 258} {"train_loss": -7.712172508239746, "global_step": 43386, "epoch": 258} {"train_loss": -8.019229888916016, "global_step": 43387, "epoch": 258} {"train_loss": -7.662069797515869, "global_step": 43388, "epoch": 258} {"train_loss": -7.852341651916504, "global_step": 43389, "epoch": 258} {"train_loss": -7.876599311828613, "global_step": 43390, "epoch": 258} {"train_loss": -8.11802864074707, "global_step": 43391, "epoch": 258} {"train_loss": -7.821312427520752, "global_step": 43392, "epoch": 258} {"train_loss": -8.096420288085938, "global_step": 43393, "epoch": 258} {"train_loss": -7.985588073730469, "global_step": 43394, "epoch": 258} {"train_loss": -8.157593727111816, "global_step": 43395, "epoch": 258} {"train_loss": -8.061002731323242, "global_step": 43396, "epoch": 258} {"train_loss": -7.983673572540283, "global_step": 43397, "epoch": 258} {"train_loss": -7.915066242218018, "global_step": 43398, "epoch": 258} {"train_loss": -8.133861541748047, "global_step": 43399, "epoch": 258} {"train_loss": -8.380316734313965, "global_step": 43400, "epoch": 258} {"train_loss": -8.269516944885254, "global_step": 43401, "epoch": 258} {"train_loss": -8.205150604248047, "global_step": 43402, "epoch": 258} {"train_loss": -7.966362953186035, "global_step": 43403, "epoch": 258} {"train_loss": -8.324010848999023, "global_step": 43404, "epoch": 258} {"train_loss": -8.273760795593262, "global_step": 43405, "epoch": 258} {"train_loss": -8.248043060302734, "global_step": 43406, "epoch": 258} {"train_loss": -8.167384147644043, "global_step": 43407, "epoch": 258} {"train_loss": -8.32719612121582, "global_step": 43408, "epoch": 258} {"train_loss": -8.312007904052734, "global_step": 43409, "epoch": 258} {"train_loss": -7.957909107208252, "global_step": 43410, "epoch": 258} {"train_loss": -8.026069641113281, "global_step": 43411, "epoch": 258} {"train_loss": -8.133037567138672, "global_step": 43412, "epoch": 258} {"train_loss": -7.786301612854004, "global_step": 43413, "epoch": 258} {"train_loss": -8.196310043334961, "global_step": 43414, "epoch": 258} {"train_loss": -7.889695644378662, "global_step": 43415, "epoch": 258} {"train_loss": -8.15040111541748, "global_step": 43416, "epoch": 258} {"train_loss": -8.136818885803223, "global_step": 43417, "epoch": 258} {"train_loss": -8.17934513092041, "global_step": 43418, "epoch": 258} {"train_loss": -7.933664321899414, "global_step": 43419, "epoch": 258} {"train_loss": -8.061161994934082, "global_step": 43420, "epoch": 258} {"train_loss": -7.848784446716309, "global_step": 43421, "epoch": 258} {"train_loss": -8.080342292785645, "global_step": 43422, "epoch": 258} {"train_loss": -7.7610883712768555, "global_step": 43423, "epoch": 258} {"train_loss": -8.062195777893066, "global_step": 43424, "epoch": 258} {"train_loss": -7.9240312576293945, "global_step": 43425, "epoch": 258} {"train_loss": -7.772933006286621, "global_step": 43426, "epoch": 258} {"train_loss": -8.071817398071289, "global_step": 43427, "epoch": 258} {"train_loss": -8.332847595214844, "global_step": 43428, "epoch": 258} {"train_loss": -8.217620849609375, "global_step": 43429, "epoch": 258} {"train_loss": -7.982967376708984, "global_step": 43430, "epoch": 258} {"train_loss": -8.026066780090332, "global_step": 43431, "epoch": 258} {"train_loss": -7.809179782867432, "global_step": 43432, "epoch": 258} {"train_loss": -8.00326156616211, "global_step": 43433, "epoch": 258} {"train_loss": -7.904974937438965, "global_step": 43434, "epoch": 258} {"train_loss": -7.8627471923828125, "global_step": 43435, "epoch": 258} {"train_loss": -8.001627922058105, "global_step": 43436, "epoch": 258} {"train_loss": -8.064159393310547, "global_step": 43437, "epoch": 258} {"train_loss": -8.02348518371582, "global_step": 43438, "epoch": 258} {"train_loss": -8.033297538757324, "global_step": 43439, "epoch": 258} {"train_loss": -8.010393142700195, "global_step": 43440, "epoch": 258} {"train_loss": -7.677824974060059, "global_step": 43441, "epoch": 258} {"train_loss": -7.573320388793945, "global_step": 43442, "epoch": 258} {"train_loss": -8.134105682373047, "global_step": 43443, "epoch": 258} {"train_loss": -7.764407634735107, "global_step": 43444, "epoch": 258} {"train_loss": -7.9060468673706055, "global_step": 43445, "epoch": 258} {"train_loss": -8.18365478515625, "global_step": 43446, "epoch": 258} {"train_loss": -7.826223373413086, "global_step": 43447, "epoch": 258} {"train_loss": -7.965172290802002, "global_step": 43448, "epoch": 258} {"train_loss": -8.050789833068848, "global_step": 43449, "epoch": 258} {"train_loss": -7.9077959060668945, "global_step": 43450, "epoch": 258} {"train_loss": -8.013493537902832, "global_step": 43451, "epoch": 258} {"train_loss": -8.181048393249512, "global_step": 43452, "epoch": 258} {"train_loss": -8.074041366577148, "global_step": 43453, "epoch": 258} {"train_loss": -7.771652698516846, "global_step": 43454, "epoch": 258} {"train_loss": -8.311973571777344, "global_step": 43455, "epoch": 258} {"train_loss": -8.011518478393555, "global_step": 43456, "epoch": 258} {"train_loss": -8.020231246948242, "global_step": 43457, "epoch": 258} {"train_loss": -7.932059288024902, "global_step": 43458, "epoch": 258} {"train_loss": -8.132139205932617, "global_step": 43459, "epoch": 258} {"train_loss": -7.961590766906738, "global_step": 43460, "epoch": 258} {"train_loss": -8.063072204589844, "global_step": 43461, "epoch": 258} {"train_loss": -8.02302074432373, "global_step": 43462, "epoch": 258} {"train_loss": -7.773902893066406, "global_step": 43463, "epoch": 258} {"train_loss": -8.108185768127441, "global_step": 43464, "epoch": 258} {"train_loss": -7.503241539001465, "global_step": 43465, "epoch": 258} {"train_loss": -8.021958351135254, "global_step": 43466, "epoch": 258} {"train_loss": -7.7732696533203125, "global_step": 43467, "epoch": 258} {"train_loss": -7.758998870849609, "global_step": 43468, "epoch": 258} {"train_loss": -7.972862243652344, "global_step": 43469, "epoch": 258} {"train_loss": -7.848287582397461, "global_step": 43470, "epoch": 258} {"train_loss": -7.791969299316406, "global_step": 43471, "epoch": 258} {"train_loss": -8.019895553588867, "global_step": 43472, "epoch": 258} {"train_loss": -7.566647052764893, "global_step": 43473, "epoch": 258} {"train_loss": -8.156113624572754, "global_step": 43474, "epoch": 258} {"train_loss": -7.871616363525391, "global_step": 43475, "epoch": 258} {"train_loss": -7.7946085929870605, "global_step": 43476, "epoch": 258} {"train_loss": -7.944947242736816, "global_step": 43477, "epoch": 258} {"train_loss": -7.843674659729004, "global_step": 43478, "epoch": 258} {"train_loss": -7.99468469619751, "global_step": 43479, "epoch": 258} {"train_loss": -7.861261367797852, "global_step": 43480, "epoch": 258} {"train_loss": -7.860023021697998, "global_step": 43481, "epoch": 258} {"train_loss": -7.798346519470215, "global_step": 43482, "epoch": 258} {"train_loss": -7.794776916503906, "global_step": 43483, "epoch": 258} {"train_loss": -7.748228073120117, "global_step": 43484, "epoch": 258} {"train_loss": -7.859537124633789, "global_step": 43485, "epoch": 258} {"train_loss": -7.752857208251953, "global_step": 43486, "epoch": 258} {"train_loss": -7.888922214508057, "global_step": 43487, "epoch": 258} {"train_loss": -7.879175186157227, "global_step": 43488, "epoch": 258} {"train_loss": -7.792795181274414, "global_step": 43489, "epoch": 258} {"train_loss": -7.902976036071777, "global_step": 43490, "epoch": 258} {"train_loss": -7.864706039428711, "global_step": 43491, "epoch": 258} {"train_loss": -7.987179756164551, "global_step": 43492, "epoch": 258} {"train_loss": -7.893917083740234, "global_step": 43493, "epoch": 258} {"train_loss": -8.027877807617188, "global_step": 43494, "epoch": 258} {"train_loss": -7.884257793426514, "global_step": 43495, "epoch": 258} {"train_loss": -8.0848388671875, "global_step": 43496, "epoch": 258} {"train_loss": -7.463038444519043, "global_step": 43497, "epoch": 258} {"train_loss": -8.029221534729004, "global_step": 43498, "epoch": 258} {"train_loss": -8.0414400100708, "global_step": 43499, "epoch": 258} {"train_loss": -8.058197975158691, "global_step": 43500, "epoch": 258} {"train_loss": -7.943692207336426, "global_step": 43501, "epoch": 258} {"train_loss": -7.961347579956055, "global_step": 43502, "epoch": 258} {"train_loss": -7.920190811157227, "global_step": 43503, "epoch": 258} {"train_loss": -8.14323616027832, "global_step": 43504, "epoch": 258} {"train_loss": -7.92912483215332, "global_step": 43505, "epoch": 258} {"train_loss": -8.154176712036133, "global_step": 43506, "epoch": 258} {"train_loss": -7.889983654022217, "global_step": 43507, "epoch": 258} {"train_loss": -7.898420810699463, "global_step": 43508, "epoch": 258} {"train_loss": -8.046442031860352, "global_step": 43509, "epoch": 258} {"train_loss": -7.966249942779541, "global_step": 43510, "epoch": 258} {"train_loss": -7.989839729808626, "global_step": 43511, "epoch": 258, "val_loss": 184715.96875} {"train_loss": -7.722678184509277, "global_step": 43512, "epoch": 259} {"train_loss": -8.18691635131836, "global_step": 43513, "epoch": 259} {"train_loss": -7.8226318359375, "global_step": 43514, "epoch": 259} {"train_loss": -8.091202735900879, "global_step": 43515, "epoch": 259} {"train_loss": -7.839824676513672, "global_step": 43516, "epoch": 259} {"train_loss": -7.877805709838867, "global_step": 43517, "epoch": 259} {"train_loss": -8.059471130371094, "global_step": 43518, "epoch": 259} {"train_loss": -7.989316463470459, "global_step": 43519, "epoch": 259} {"train_loss": -8.054377555847168, "global_step": 43520, "epoch": 259} {"train_loss": -7.824085235595703, "global_step": 43521, "epoch": 259} {"train_loss": -7.980852127075195, "global_step": 43522, "epoch": 259} {"train_loss": -7.836195945739746, "global_step": 43523, "epoch": 259} {"train_loss": -8.149234771728516, "global_step": 43524, "epoch": 259} {"train_loss": -8.239107131958008, "global_step": 43525, "epoch": 259} {"train_loss": -8.152268409729004, "global_step": 43526, "epoch": 259} {"train_loss": -8.175994873046875, "global_step": 43527, "epoch": 259} {"train_loss": -8.159052848815918, "global_step": 43528, "epoch": 259} {"train_loss": -8.214656829833984, "global_step": 43529, "epoch": 259} {"train_loss": -8.172112464904785, "global_step": 43530, "epoch": 259} {"train_loss": -8.107420921325684, "global_step": 43531, "epoch": 259} {"train_loss": -8.138675689697266, "global_step": 43532, "epoch": 259} {"train_loss": -7.866254806518555, "global_step": 43533, "epoch": 259} {"train_loss": -8.1692476272583, "global_step": 43534, "epoch": 259} {"train_loss": -8.238607406616211, "global_step": 43535, "epoch": 259} {"train_loss": -8.152729034423828, "global_step": 43536, "epoch": 259} {"train_loss": -8.209829330444336, "global_step": 43537, "epoch": 259} {"train_loss": -7.80925178527832, "global_step": 43538, "epoch": 259} {"train_loss": -8.069402694702148, "global_step": 43539, "epoch": 259} {"train_loss": -7.963567733764648, "global_step": 43540, "epoch": 259} {"train_loss": -7.9833879470825195, "global_step": 43541, "epoch": 259} {"train_loss": -8.154661178588867, "global_step": 43542, "epoch": 259} {"train_loss": -8.046754837036133, "global_step": 43543, "epoch": 259} {"train_loss": -8.1378173828125, "global_step": 43544, "epoch": 259} {"train_loss": -8.199979782104492, "global_step": 43545, "epoch": 259} {"train_loss": -8.035112380981445, "global_step": 43546, "epoch": 259} {"train_loss": -8.041200637817383, "global_step": 43547, "epoch": 259} {"train_loss": -8.03812313079834, "global_step": 43548, "epoch": 259} {"train_loss": -8.10498332977295, "global_step": 43549, "epoch": 259} {"train_loss": -8.041915893554688, "global_step": 43550, "epoch": 259} {"train_loss": -8.295101165771484, "global_step": 43551, "epoch": 259} {"train_loss": -8.341469764709473, "global_step": 43552, "epoch": 259} {"train_loss": -8.152806282043457, "global_step": 43553, "epoch": 259} {"train_loss": -7.988831520080566, "global_step": 43554, "epoch": 259} {"train_loss": -8.27316665649414, "global_step": 43555, "epoch": 259} {"train_loss": -8.194043159484863, "global_step": 43556, "epoch": 259} {"train_loss": -8.079776763916016, "global_step": 43557, "epoch": 259} {"train_loss": -8.089567184448242, "global_step": 43558, "epoch": 259} {"train_loss": -8.094256401062012, "global_step": 43559, "epoch": 259} {"train_loss": -8.065767288208008, "global_step": 43560, "epoch": 259} {"train_loss": -8.220279693603516, "global_step": 43561, "epoch": 259} {"train_loss": -8.143753051757812, "global_step": 43562, "epoch": 259} {"train_loss": -8.280767440795898, "global_step": 43563, "epoch": 259} {"train_loss": -7.983497142791748, "global_step": 43564, "epoch": 259} {"train_loss": -7.906525135040283, "global_step": 43565, "epoch": 259} {"train_loss": -8.335023880004883, "global_step": 43566, "epoch": 259} {"train_loss": -8.078746795654297, "global_step": 43567, "epoch": 259} {"train_loss": -7.973085880279541, "global_step": 43568, "epoch": 259} {"train_loss": -8.152896881103516, "global_step": 43569, "epoch": 259} {"train_loss": -8.090017318725586, "global_step": 43570, "epoch": 259} {"train_loss": -7.992271423339844, "global_step": 43571, "epoch": 259} {"train_loss": -8.153846740722656, "global_step": 43572, "epoch": 259} {"train_loss": -8.230826377868652, "global_step": 43573, "epoch": 259} {"train_loss": -7.891660690307617, "global_step": 43574, "epoch": 259} {"train_loss": -7.950156211853027, "global_step": 43575, "epoch": 259} {"train_loss": -8.178314208984375, "global_step": 43576, "epoch": 259} {"train_loss": -8.2781343460083, "global_step": 43577, "epoch": 259} {"train_loss": -8.089887619018555, "global_step": 43578, "epoch": 259} {"train_loss": -8.098888397216797, "global_step": 43579, "epoch": 259} {"train_loss": -7.939358711242676, "global_step": 43580, "epoch": 259} {"train_loss": -8.272947311401367, "global_step": 43581, "epoch": 259} {"train_loss": -8.058335304260254, "global_step": 43582, "epoch": 259} {"train_loss": -8.213534355163574, "global_step": 43583, "epoch": 259} {"train_loss": -8.132335662841797, "global_step": 43584, "epoch": 259} {"train_loss": -8.129792213439941, "global_step": 43585, "epoch": 259} {"train_loss": -8.11191463470459, "global_step": 43586, "epoch": 259} {"train_loss": -8.085631370544434, "global_step": 43587, "epoch": 259} {"train_loss": -8.113283157348633, "global_step": 43588, "epoch": 259} {"train_loss": -8.36667251586914, "global_step": 43589, "epoch": 259} {"train_loss": -8.247294425964355, "global_step": 43590, "epoch": 259} {"train_loss": -8.332497596740723, "global_step": 43591, "epoch": 259} {"train_loss": -8.306992530822754, "global_step": 43592, "epoch": 259} {"train_loss": -8.232463836669922, "global_step": 43593, "epoch": 259} {"train_loss": -8.029247283935547, "global_step": 43594, "epoch": 259} {"train_loss": -8.152490615844727, "global_step": 43595, "epoch": 259} {"train_loss": -8.088382720947266, "global_step": 43596, "epoch": 259} {"train_loss": -8.323938369750977, "global_step": 43597, "epoch": 259} {"train_loss": -8.121726989746094, "global_step": 43598, "epoch": 259} {"train_loss": -8.308372497558594, "global_step": 43599, "epoch": 259} {"train_loss": -7.97519063949585, "global_step": 43600, "epoch": 259} {"train_loss": -8.195395469665527, "global_step": 43601, "epoch": 259} {"train_loss": -7.885951995849609, "global_step": 43602, "epoch": 259} {"train_loss": -8.168594360351562, "global_step": 43603, "epoch": 259} {"train_loss": -7.976188659667969, "global_step": 43604, "epoch": 259} {"train_loss": -8.088957786560059, "global_step": 43605, "epoch": 259} {"train_loss": -8.269683837890625, "global_step": 43606, "epoch": 259} {"train_loss": -8.1644287109375, "global_step": 43607, "epoch": 259} {"train_loss": -8.154375076293945, "global_step": 43608, "epoch": 259} {"train_loss": -8.17405891418457, "global_step": 43609, "epoch": 259} {"train_loss": -7.9831085205078125, "global_step": 43610, "epoch": 259} {"train_loss": -7.785912990570068, "global_step": 43611, "epoch": 259} {"train_loss": -7.919430255889893, "global_step": 43612, "epoch": 259} {"train_loss": -8.167228698730469, "global_step": 43613, "epoch": 259} {"train_loss": -8.109102249145508, "global_step": 43614, "epoch": 259} {"train_loss": -8.182937622070312, "global_step": 43615, "epoch": 259} {"train_loss": -8.171294212341309, "global_step": 43616, "epoch": 259} {"train_loss": -8.002655029296875, "global_step": 43617, "epoch": 259} {"train_loss": -8.218561172485352, "global_step": 43618, "epoch": 259} {"train_loss": -7.995532989501953, "global_step": 43619, "epoch": 259} {"train_loss": -7.998685359954834, "global_step": 43620, "epoch": 259} {"train_loss": -7.85880184173584, "global_step": 43621, "epoch": 259} {"train_loss": -8.100536346435547, "global_step": 43622, "epoch": 259} {"train_loss": -7.736900329589844, "global_step": 43623, "epoch": 259} {"train_loss": -7.893998622894287, "global_step": 43624, "epoch": 259} {"train_loss": -7.774661540985107, "global_step": 43625, "epoch": 259} {"train_loss": -8.134984016418457, "global_step": 43626, "epoch": 259} {"train_loss": -8.088475227355957, "global_step": 43627, "epoch": 259} {"train_loss": -7.934902191162109, "global_step": 43628, "epoch": 259} {"train_loss": -8.013481140136719, "global_step": 43629, "epoch": 259} {"train_loss": -7.916415214538574, "global_step": 43630, "epoch": 259} {"train_loss": -8.024999618530273, "global_step": 43631, "epoch": 259} {"train_loss": -8.152085304260254, "global_step": 43632, "epoch": 259} {"train_loss": -8.077163696289062, "global_step": 43633, "epoch": 259} {"train_loss": -7.9521589279174805, "global_step": 43634, "epoch": 259} {"train_loss": -7.949477195739746, "global_step": 43635, "epoch": 259} {"train_loss": -8.13564682006836, "global_step": 43636, "epoch": 259} {"train_loss": -8.231032371520996, "global_step": 43637, "epoch": 259} {"train_loss": -7.944210529327393, "global_step": 43638, "epoch": 259} {"train_loss": -8.238310813903809, "global_step": 43639, "epoch": 259} {"train_loss": -8.148900985717773, "global_step": 43640, "epoch": 259} {"train_loss": -7.963872909545898, "global_step": 43641, "epoch": 259} {"train_loss": -8.00786304473877, "global_step": 43642, "epoch": 259} {"train_loss": -8.156560897827148, "global_step": 43643, "epoch": 259} {"train_loss": -8.186622619628906, "global_step": 43644, "epoch": 259} {"train_loss": -7.974164962768555, "global_step": 43645, "epoch": 259} {"train_loss": -7.916555404663086, "global_step": 43646, "epoch": 259} {"train_loss": -8.251361846923828, "global_step": 43647, "epoch": 259} {"train_loss": -8.179641723632812, "global_step": 43648, "epoch": 259} {"train_loss": -8.39142894744873, "global_step": 43649, "epoch": 259} {"train_loss": -8.028742790222168, "global_step": 43650, "epoch": 259} {"train_loss": -8.171577453613281, "global_step": 43651, "epoch": 259} {"train_loss": -8.220852851867676, "global_step": 43652, "epoch": 259} {"train_loss": -8.060291290283203, "global_step": 43653, "epoch": 259} {"train_loss": -8.115309715270996, "global_step": 43654, "epoch": 259} {"train_loss": -7.896439075469971, "global_step": 43655, "epoch": 259} {"train_loss": -8.059433937072754, "global_step": 43656, "epoch": 259} {"train_loss": -8.206512451171875, "global_step": 43657, "epoch": 259} {"train_loss": -8.107361793518066, "global_step": 43658, "epoch": 259} {"train_loss": -8.013517379760742, "global_step": 43659, "epoch": 259} {"train_loss": -7.972347259521484, "global_step": 43660, "epoch": 259} {"train_loss": -8.125272750854492, "global_step": 43661, "epoch": 259} {"train_loss": -8.058334350585938, "global_step": 43662, "epoch": 259} {"train_loss": -8.180068969726562, "global_step": 43663, "epoch": 259} {"train_loss": -7.941948890686035, "global_step": 43664, "epoch": 259} {"train_loss": -8.10141658782959, "global_step": 43665, "epoch": 259} {"train_loss": -7.517329216003418, "global_step": 43666, "epoch": 259} {"train_loss": -8.245524406433105, "global_step": 43667, "epoch": 259} {"train_loss": -7.918794631958008, "global_step": 43668, "epoch": 259} {"train_loss": -7.972320556640625, "global_step": 43669, "epoch": 259} {"train_loss": -8.005756378173828, "global_step": 43670, "epoch": 259} {"train_loss": -8.227909088134766, "global_step": 43671, "epoch": 259} {"train_loss": -7.85503625869751, "global_step": 43672, "epoch": 259} {"train_loss": -7.632908821105957, "global_step": 43673, "epoch": 259} {"train_loss": -7.934909343719482, "global_step": 43674, "epoch": 259} {"train_loss": -7.906589984893799, "global_step": 43675, "epoch": 259} {"train_loss": -8.052035331726074, "global_step": 43676, "epoch": 259} {"train_loss": -8.03367805480957, "global_step": 43677, "epoch": 259} {"train_loss": -8.051008224487305, "global_step": 43678, "epoch": 259} {"train_loss": -8.078080884047917, "global_step": 43679, "epoch": 259, "val_loss": 185664.78125} {"train_loss": -8.091753005981445, "global_step": 43680, "epoch": 260} {"train_loss": -8.238042831420898, "global_step": 43681, "epoch": 260} {"train_loss": -8.123977661132812, "global_step": 43682, "epoch": 260} {"train_loss": -7.893618106842041, "global_step": 43683, "epoch": 260} {"train_loss": -8.157491683959961, "global_step": 43684, "epoch": 260} {"train_loss": -7.97999906539917, "global_step": 43685, "epoch": 260} {"train_loss": -7.975859642028809, "global_step": 43686, "epoch": 260} {"train_loss": -7.884753704071045, "global_step": 43687, "epoch": 260} {"train_loss": -8.092838287353516, "global_step": 43688, "epoch": 260} {"train_loss": -8.219470977783203, "global_step": 43689, "epoch": 260} {"train_loss": -8.16519546508789, "global_step": 43690, "epoch": 260} {"train_loss": -8.022689819335938, "global_step": 43691, "epoch": 260} {"train_loss": -8.185161590576172, "global_step": 43692, "epoch": 260} {"train_loss": -7.838980197906494, "global_step": 43693, "epoch": 260} {"train_loss": -8.112009048461914, "global_step": 43694, "epoch": 260} {"train_loss": -8.199631690979004, "global_step": 43695, "epoch": 260} {"train_loss": -8.057443618774414, "global_step": 43696, "epoch": 260} {"train_loss": -8.35373306274414, "global_step": 43697, "epoch": 260} {"train_loss": -8.299954414367676, "global_step": 43698, "epoch": 260} {"train_loss": -8.197833061218262, "global_step": 43699, "epoch": 260} {"train_loss": -8.023927688598633, "global_step": 43700, "epoch": 260} {"train_loss": -8.088977813720703, "global_step": 43701, "epoch": 260} {"train_loss": -8.315607070922852, "global_step": 43702, "epoch": 260} {"train_loss": -8.352121353149414, "global_step": 43703, "epoch": 260} {"train_loss": -8.313701629638672, "global_step": 43704, "epoch": 260} {"train_loss": -8.122042655944824, "global_step": 43705, "epoch": 260} {"train_loss": -8.155689239501953, "global_step": 43706, "epoch": 260} {"train_loss": -8.36740493774414, "global_step": 43707, "epoch": 260} {"train_loss": -8.234428405761719, "global_step": 43708, "epoch": 260} {"train_loss": -8.016664505004883, "global_step": 43709, "epoch": 260} {"train_loss": -8.095972061157227, "global_step": 43710, "epoch": 260} {"train_loss": -8.243902206420898, "global_step": 43711, "epoch": 260} {"train_loss": -8.485950469970703, "global_step": 43712, "epoch": 260} {"train_loss": -8.321884155273438, "global_step": 43713, "epoch": 260} {"train_loss": -8.186979293823242, "global_step": 43714, "epoch": 260} {"train_loss": -8.270683288574219, "global_step": 43715, "epoch": 260} {"train_loss": -8.10317611694336, "global_step": 43716, "epoch": 260} {"train_loss": -7.967379570007324, "global_step": 43717, "epoch": 260} {"train_loss": -8.295973777770996, "global_step": 43718, "epoch": 260} {"train_loss": -8.0506591796875, "global_step": 43719, "epoch": 260} {"train_loss": -8.031167984008789, "global_step": 43720, "epoch": 260} {"train_loss": -8.154643058776855, "global_step": 43721, "epoch": 260} {"train_loss": -8.171602249145508, "global_step": 43722, "epoch": 260} {"train_loss": -7.846240043640137, "global_step": 43723, "epoch": 260} {"train_loss": -7.552063465118408, "global_step": 43724, "epoch": 260} {"train_loss": -7.994816780090332, "global_step": 43725, "epoch": 260} {"train_loss": -7.96764612197876, "global_step": 43726, "epoch": 260} {"train_loss": -7.838526725769043, "global_step": 43727, "epoch": 260} {"train_loss": -7.7812042236328125, "global_step": 43728, "epoch": 260} {"train_loss": -7.691642761230469, "global_step": 43729, "epoch": 260} {"train_loss": -7.781524181365967, "global_step": 43730, "epoch": 260} {"train_loss": -7.906890869140625, "global_step": 43731, "epoch": 260} {"train_loss": -7.877310752868652, "global_step": 43732, "epoch": 260} {"train_loss": -7.882556915283203, "global_step": 43733, "epoch": 260} {"train_loss": -7.789512634277344, "global_step": 43734, "epoch": 260} {"train_loss": -8.053936004638672, "global_step": 43735, "epoch": 260} {"train_loss": -8.02913761138916, "global_step": 43736, "epoch": 260} {"train_loss": -7.880980968475342, "global_step": 43737, "epoch": 260} {"train_loss": -7.835442543029785, "global_step": 43738, "epoch": 260} {"train_loss": -8.16617202758789, "global_step": 43739, "epoch": 260} {"train_loss": -7.664556503295898, "global_step": 43740, "epoch": 260} {"train_loss": -8.091278076171875, "global_step": 43741, "epoch": 260} {"train_loss": -7.8871564865112305, "global_step": 43742, "epoch": 260} {"train_loss": -8.188638687133789, "global_step": 43743, "epoch": 260} {"train_loss": -8.043764114379883, "global_step": 43744, "epoch": 260} {"train_loss": -7.817739486694336, "global_step": 43745, "epoch": 260} {"train_loss": -7.810915946960449, "global_step": 43746, "epoch": 260} {"train_loss": -8.163885116577148, "global_step": 43747, "epoch": 260} {"train_loss": -7.925575256347656, "global_step": 43748, "epoch": 260} {"train_loss": -8.27476692199707, "global_step": 43749, "epoch": 260} {"train_loss": -8.162149429321289, "global_step": 43750, "epoch": 260} {"train_loss": -7.955790996551514, "global_step": 43751, "epoch": 260} {"train_loss": -8.04216194152832, "global_step": 43752, "epoch": 260} {"train_loss": -8.219009399414062, "global_step": 43753, "epoch": 260} {"train_loss": -8.328544616699219, "global_step": 43754, "epoch": 260} {"train_loss": -8.410699844360352, "global_step": 43755, "epoch": 260} {"train_loss": -7.935595512390137, "global_step": 43756, "epoch": 260} {"train_loss": -8.270624160766602, "global_step": 43757, "epoch": 260} {"train_loss": -8.11876106262207, "global_step": 43758, "epoch": 260} {"train_loss": -8.163158416748047, "global_step": 43759, "epoch": 260} {"train_loss": -8.06224250793457, "global_step": 43760, "epoch": 260} {"train_loss": -7.950948238372803, "global_step": 43761, "epoch": 260} {"train_loss": -8.091360092163086, "global_step": 43762, "epoch": 260} {"train_loss": -8.119491577148438, "global_step": 43763, "epoch": 260} {"train_loss": -8.07876968383789, "global_step": 43764, "epoch": 260} {"train_loss": -7.759926795959473, "global_step": 43765, "epoch": 260} {"train_loss": -8.041635513305664, "global_step": 43766, "epoch": 260} {"train_loss": -7.507761001586914, "global_step": 43767, "epoch": 260} {"train_loss": -7.803400993347168, "global_step": 43768, "epoch": 260} {"train_loss": -7.472243309020996, "global_step": 43769, "epoch": 260} {"train_loss": -7.933225154876709, "global_step": 43770, "epoch": 260} {"train_loss": -7.499310493469238, "global_step": 43771, "epoch": 260} {"train_loss": -7.73110294342041, "global_step": 43772, "epoch": 260} {"train_loss": -7.545070648193359, "global_step": 43773, "epoch": 260} {"train_loss": -7.7485761642456055, "global_step": 43774, "epoch": 260} {"train_loss": -7.890803813934326, "global_step": 43775, "epoch": 260} {"train_loss": -7.960633754730225, "global_step": 43776, "epoch": 260} {"train_loss": -7.600276947021484, "global_step": 43777, "epoch": 260} {"train_loss": -7.832140922546387, "global_step": 43778, "epoch": 260} {"train_loss": -7.815272331237793, "global_step": 43779, "epoch": 260} {"train_loss": -7.841473579406738, "global_step": 43780, "epoch": 260} {"train_loss": -7.6613240242004395, "global_step": 43781, "epoch": 260} {"train_loss": -7.76935338973999, "global_step": 43782, "epoch": 260} {"train_loss": -7.7872209548950195, "global_step": 43783, "epoch": 260} {"train_loss": -7.942286014556885, "global_step": 43784, "epoch": 260} {"train_loss": -7.9394731521606445, "global_step": 43785, "epoch": 260} {"train_loss": -7.870187759399414, "global_step": 43786, "epoch": 260} {"train_loss": -7.901894569396973, "global_step": 43787, "epoch": 260} {"train_loss": -8.189820289611816, "global_step": 43788, "epoch": 260} {"train_loss": -8.044461250305176, "global_step": 43789, "epoch": 260} {"train_loss": -8.10130500793457, "global_step": 43790, "epoch": 260} {"train_loss": -8.02684497833252, "global_step": 43791, "epoch": 260} {"train_loss": -7.975083827972412, "global_step": 43792, "epoch": 260} {"train_loss": -8.188009262084961, "global_step": 43793, "epoch": 260} {"train_loss": -7.884897232055664, "global_step": 43794, "epoch": 260} {"train_loss": -8.153764724731445, "global_step": 43795, "epoch": 260} {"train_loss": -7.755967140197754, "global_step": 43796, "epoch": 260} {"train_loss": -8.210607528686523, "global_step": 43797, "epoch": 260} {"train_loss": -8.021270751953125, "global_step": 43798, "epoch": 260} {"train_loss": -8.05831241607666, "global_step": 43799, "epoch": 260} {"train_loss": -8.220361709594727, "global_step": 43800, "epoch": 260} {"train_loss": -8.029707908630371, "global_step": 43801, "epoch": 260} {"train_loss": -8.204734802246094, "global_step": 43802, "epoch": 260} {"train_loss": -8.08218002319336, "global_step": 43803, "epoch": 260} {"train_loss": -8.260866165161133, "global_step": 43804, "epoch": 260} {"train_loss": -8.278106689453125, "global_step": 43805, "epoch": 260} {"train_loss": -8.41297721862793, "global_step": 43806, "epoch": 260} {"train_loss": -8.409197807312012, "global_step": 43807, "epoch": 260} {"train_loss": -8.112144470214844, "global_step": 43808, "epoch": 260} {"train_loss": -8.247690200805664, "global_step": 43809, "epoch": 260} {"train_loss": -7.737879753112793, "global_step": 43810, "epoch": 260} {"train_loss": -8.251094818115234, "global_step": 43811, "epoch": 260} {"train_loss": -7.961697578430176, "global_step": 43812, "epoch": 260} {"train_loss": -7.961371421813965, "global_step": 43813, "epoch": 260} {"train_loss": -8.066794395446777, "global_step": 43814, "epoch": 260} {"train_loss": -8.064149856567383, "global_step": 43815, "epoch": 260} {"train_loss": -7.762927055358887, "global_step": 43816, "epoch": 260} {"train_loss": -8.46331787109375, "global_step": 43817, "epoch": 260} {"train_loss": -7.830622673034668, "global_step": 43818, "epoch": 260} {"train_loss": -7.906892776489258, "global_step": 43819, "epoch": 260} {"train_loss": -8.212143898010254, "global_step": 43820, "epoch": 260} {"train_loss": -7.968838691711426, "global_step": 43821, "epoch": 260} {"train_loss": -8.123659133911133, "global_step": 43822, "epoch": 260} {"train_loss": -8.066649436950684, "global_step": 43823, "epoch": 260} {"train_loss": -7.875302791595459, "global_step": 43824, "epoch": 260} {"train_loss": -7.867374420166016, "global_step": 43825, "epoch": 260} {"train_loss": -7.899527549743652, "global_step": 43826, "epoch": 260} {"train_loss": -7.912471771240234, "global_step": 43827, "epoch": 260} {"train_loss": -7.877061367034912, "global_step": 43828, "epoch": 260} {"train_loss": -7.967996120452881, "global_step": 43829, "epoch": 260} {"train_loss": -7.810412406921387, "global_step": 43830, "epoch": 260} {"train_loss": -7.683259963989258, "global_step": 43831, "epoch": 260} {"train_loss": -7.830266952514648, "global_step": 43832, "epoch": 260} {"train_loss": -7.87739372253418, "global_step": 43833, "epoch": 260} {"train_loss": -7.933081150054932, "global_step": 43834, "epoch": 260} {"train_loss": -7.95806884765625, "global_step": 43835, "epoch": 260} {"train_loss": -8.014457702636719, "global_step": 43836, "epoch": 260} {"train_loss": -7.8576555252075195, "global_step": 43837, "epoch": 260} {"train_loss": -7.72797966003418, "global_step": 43838, "epoch": 260} {"train_loss": -8.020209312438965, "global_step": 43839, "epoch": 260} {"train_loss": -7.982722282409668, "global_step": 43840, "epoch": 260} {"train_loss": -7.920499324798584, "global_step": 43841, "epoch": 260} {"train_loss": -7.762194633483887, "global_step": 43842, "epoch": 260} {"train_loss": -8.105009078979492, "global_step": 43843, "epoch": 260} {"train_loss": -7.953815460205078, "global_step": 43844, "epoch": 260} {"train_loss": -7.898935317993164, "global_step": 43845, "epoch": 260} {"train_loss": -7.763498306274414, "global_step": 43846, "epoch": 260} {"train_loss": -8.010265333311898, "global_step": 43847, "epoch": 260, "val_loss": 185422.421875, "train_action_mse_error": 9.773441314697266} {"train_loss": -7.905378341674805, "global_step": 43848, "epoch": 261} {"train_loss": -7.767218589782715, "global_step": 43849, "epoch": 261} {"train_loss": -7.982969760894775, "global_step": 43850, "epoch": 261} {"train_loss": -7.994142532348633, "global_step": 43851, "epoch": 261} {"train_loss": -7.762114524841309, "global_step": 43852, "epoch": 261} {"train_loss": -7.86293363571167, "global_step": 43853, "epoch": 261} {"train_loss": -7.936878681182861, "global_step": 43854, "epoch": 261} {"train_loss": -8.035309791564941, "global_step": 43855, "epoch": 261} {"train_loss": -8.043146133422852, "global_step": 43856, "epoch": 261} {"train_loss": -7.947208404541016, "global_step": 43857, "epoch": 261} {"train_loss": -8.109429359436035, "global_step": 43858, "epoch": 261} {"train_loss": -8.161627769470215, "global_step": 43859, "epoch": 261} {"train_loss": -7.872134208679199, "global_step": 43860, "epoch": 261} {"train_loss": -7.931671142578125, "global_step": 43861, "epoch": 261} {"train_loss": -8.070199966430664, "global_step": 43862, "epoch": 261} {"train_loss": -8.04924488067627, "global_step": 43863, "epoch": 261} {"train_loss": -7.988988876342773, "global_step": 43864, "epoch": 261} {"train_loss": -7.884209632873535, "global_step": 43865, "epoch": 261} {"train_loss": -8.118840217590332, "global_step": 43866, "epoch": 261} {"train_loss": -7.950507640838623, "global_step": 43867, "epoch": 261} {"train_loss": -8.140593528747559, "global_step": 43868, "epoch": 261} {"train_loss": -8.086336135864258, "global_step": 43869, "epoch": 261} {"train_loss": -8.309185028076172, "global_step": 43870, "epoch": 261} {"train_loss": -8.058475494384766, "global_step": 43871, "epoch": 261} {"train_loss": -8.077899932861328, "global_step": 43872, "epoch": 261} {"train_loss": -8.263484954833984, "global_step": 43873, "epoch": 261} {"train_loss": -8.217024803161621, "global_step": 43874, "epoch": 261} {"train_loss": -8.039878845214844, "global_step": 43875, "epoch": 261} {"train_loss": -8.023982048034668, "global_step": 43876, "epoch": 261} {"train_loss": -8.069185256958008, "global_step": 43877, "epoch": 261} {"train_loss": -8.02151870727539, "global_step": 43878, "epoch": 261} {"train_loss": -7.821343421936035, "global_step": 43879, "epoch": 261} {"train_loss": -8.162480354309082, "global_step": 43880, "epoch": 261} {"train_loss": -8.072417259216309, "global_step": 43881, "epoch": 261} {"train_loss": -8.127744674682617, "global_step": 43882, "epoch": 261} {"train_loss": -8.267932891845703, "global_step": 43883, "epoch": 261} {"train_loss": -8.012382507324219, "global_step": 43884, "epoch": 261} {"train_loss": -8.16905403137207, "global_step": 43885, "epoch": 261} {"train_loss": -8.145920753479004, "global_step": 43886, "epoch": 261} {"train_loss": -8.054947853088379, "global_step": 43887, "epoch": 261} {"train_loss": -8.003820419311523, "global_step": 43888, "epoch": 261} {"train_loss": -8.281698226928711, "global_step": 43889, "epoch": 261} {"train_loss": -8.186141014099121, "global_step": 43890, "epoch": 261} {"train_loss": -7.997636795043945, "global_step": 43891, "epoch": 261} {"train_loss": -8.184459686279297, "global_step": 43892, "epoch": 261} {"train_loss": -8.212762832641602, "global_step": 43893, "epoch": 261} {"train_loss": -8.243011474609375, "global_step": 43894, "epoch": 261} {"train_loss": -8.130586624145508, "global_step": 43895, "epoch": 261} {"train_loss": -8.193143844604492, "global_step": 43896, "epoch": 261} {"train_loss": -8.011955261230469, "global_step": 43897, "epoch": 261} {"train_loss": -7.878937721252441, "global_step": 43898, "epoch": 261} {"train_loss": -8.215462684631348, "global_step": 43899, "epoch": 261} {"train_loss": -8.186671257019043, "global_step": 43900, "epoch": 261} {"train_loss": -8.123726844787598, "global_step": 43901, "epoch": 261} {"train_loss": -8.282261848449707, "global_step": 43902, "epoch": 261} {"train_loss": -8.159549713134766, "global_step": 43903, "epoch": 261} {"train_loss": -7.9920172691345215, "global_step": 43904, "epoch": 261} {"train_loss": -8.275925636291504, "global_step": 43905, "epoch": 261} {"train_loss": -8.244132995605469, "global_step": 43906, "epoch": 261} {"train_loss": -8.258363723754883, "global_step": 43907, "epoch": 261} {"train_loss": -8.385655403137207, "global_step": 43908, "epoch": 261} {"train_loss": -8.226523399353027, "global_step": 43909, "epoch": 261} {"train_loss": -8.101158142089844, "global_step": 43910, "epoch": 261} {"train_loss": -8.179756164550781, "global_step": 43911, "epoch": 261} {"train_loss": -8.078191757202148, "global_step": 43912, "epoch": 261} {"train_loss": -8.174270629882812, "global_step": 43913, "epoch": 261} {"train_loss": -8.250994682312012, "global_step": 43914, "epoch": 261} {"train_loss": -8.244024276733398, "global_step": 43915, "epoch": 261} {"train_loss": -8.237403869628906, "global_step": 43916, "epoch": 261} {"train_loss": -8.081351280212402, "global_step": 43917, "epoch": 261} {"train_loss": -8.444631576538086, "global_step": 43918, "epoch": 261} {"train_loss": -8.3359956741333, "global_step": 43919, "epoch": 261} {"train_loss": -7.948643207550049, "global_step": 43920, "epoch": 261} {"train_loss": -8.279927253723145, "global_step": 43921, "epoch": 261} {"train_loss": -7.941923141479492, "global_step": 43922, "epoch": 261} {"train_loss": -8.100774765014648, "global_step": 43923, "epoch": 261} {"train_loss": -8.005970001220703, "global_step": 43924, "epoch": 261} {"train_loss": -8.151273727416992, "global_step": 43925, "epoch": 261} {"train_loss": -8.032661437988281, "global_step": 43926, "epoch": 261} {"train_loss": -7.879039764404297, "global_step": 43927, "epoch": 261} {"train_loss": -8.151456832885742, "global_step": 43928, "epoch": 261} {"train_loss": -8.340188980102539, "global_step": 43929, "epoch": 261} {"train_loss": -8.061960220336914, "global_step": 43930, "epoch": 261} {"train_loss": -8.302553176879883, "global_step": 43931, "epoch": 261} {"train_loss": -7.991764068603516, "global_step": 43932, "epoch": 261} {"train_loss": -7.993136882781982, "global_step": 43933, "epoch": 261} {"train_loss": -7.9856672286987305, "global_step": 43934, "epoch": 261} {"train_loss": -8.028022766113281, "global_step": 43935, "epoch": 261} {"train_loss": -8.042522430419922, "global_step": 43936, "epoch": 261} {"train_loss": -8.006010055541992, "global_step": 43937, "epoch": 261} {"train_loss": -7.922102451324463, "global_step": 43938, "epoch": 261} {"train_loss": -7.988701343536377, "global_step": 43939, "epoch": 261} {"train_loss": -7.957491397857666, "global_step": 43940, "epoch": 261} {"train_loss": -7.8370256423950195, "global_step": 43941, "epoch": 261} {"train_loss": -7.993439197540283, "global_step": 43942, "epoch": 261} {"train_loss": -7.742176532745361, "global_step": 43943, "epoch": 261} {"train_loss": -8.227883338928223, "global_step": 43944, "epoch": 261} {"train_loss": -8.063650131225586, "global_step": 43945, "epoch": 261} {"train_loss": -8.04562759399414, "global_step": 43946, "epoch": 261} {"train_loss": -7.902168273925781, "global_step": 43947, "epoch": 261} {"train_loss": -7.857624530792236, "global_step": 43948, "epoch": 261} {"train_loss": -8.017017364501953, "global_step": 43949, "epoch": 261} {"train_loss": -8.113776206970215, "global_step": 43950, "epoch": 261} {"train_loss": -7.9987945556640625, "global_step": 43951, "epoch": 261} {"train_loss": -8.237736701965332, "global_step": 43952, "epoch": 261} {"train_loss": -8.259317398071289, "global_step": 43953, "epoch": 261} {"train_loss": -7.982874393463135, "global_step": 43954, "epoch": 261} {"train_loss": -7.817784309387207, "global_step": 43955, "epoch": 261} {"train_loss": -8.226268768310547, "global_step": 43956, "epoch": 261} {"train_loss": -8.014026641845703, "global_step": 43957, "epoch": 261} {"train_loss": -8.295235633850098, "global_step": 43958, "epoch": 261} {"train_loss": -7.929417610168457, "global_step": 43959, "epoch": 261} {"train_loss": -8.320697784423828, "global_step": 43960, "epoch": 261} {"train_loss": -7.936778545379639, "global_step": 43961, "epoch": 261} {"train_loss": -8.030418395996094, "global_step": 43962, "epoch": 261} {"train_loss": -7.922946453094482, "global_step": 43963, "epoch": 261} {"train_loss": -7.998246192932129, "global_step": 43964, "epoch": 261} {"train_loss": -7.914737701416016, "global_step": 43965, "epoch": 261} {"train_loss": -8.014289855957031, "global_step": 43966, "epoch": 261} {"train_loss": -8.120190620422363, "global_step": 43967, "epoch": 261} {"train_loss": -8.205649375915527, "global_step": 43968, "epoch": 261} {"train_loss": -8.052600860595703, "global_step": 43969, "epoch": 261} {"train_loss": -8.18138313293457, "global_step": 43970, "epoch": 261} {"train_loss": -8.186389923095703, "global_step": 43971, "epoch": 261} {"train_loss": -8.15470027923584, "global_step": 43972, "epoch": 261} {"train_loss": -8.165834426879883, "global_step": 43973, "epoch": 261} {"train_loss": -8.159607887268066, "global_step": 43974, "epoch": 261} {"train_loss": -8.07715129852295, "global_step": 43975, "epoch": 261} {"train_loss": -7.998010635375977, "global_step": 43976, "epoch": 261} {"train_loss": -8.152420043945312, "global_step": 43977, "epoch": 261} {"train_loss": -8.168106079101562, "global_step": 43978, "epoch": 261} {"train_loss": -7.985579490661621, "global_step": 43979, "epoch": 261} {"train_loss": -8.080482482910156, "global_step": 43980, "epoch": 261} {"train_loss": -8.227161407470703, "global_step": 43981, "epoch": 261} {"train_loss": -8.11815071105957, "global_step": 43982, "epoch": 261} {"train_loss": -8.158350944519043, "global_step": 43983, "epoch": 261} {"train_loss": -8.201323509216309, "global_step": 43984, "epoch": 261} {"train_loss": -8.077805519104004, "global_step": 43985, "epoch": 261} {"train_loss": -8.093402862548828, "global_step": 43986, "epoch": 261} {"train_loss": -8.231114387512207, "global_step": 43987, "epoch": 261} {"train_loss": -8.262203216552734, "global_step": 43988, "epoch": 261} {"train_loss": -8.029726028442383, "global_step": 43989, "epoch": 261} {"train_loss": -8.37997817993164, "global_step": 43990, "epoch": 261} {"train_loss": -8.160758972167969, "global_step": 43991, "epoch": 261} {"train_loss": -8.116132736206055, "global_step": 43992, "epoch": 261} {"train_loss": -8.270325660705566, "global_step": 43993, "epoch": 261} {"train_loss": -8.047575950622559, "global_step": 43994, "epoch": 261} {"train_loss": -8.317344665527344, "global_step": 43995, "epoch": 261} {"train_loss": -7.8310933113098145, "global_step": 43996, "epoch": 261} {"train_loss": -8.000319480895996, "global_step": 43997, "epoch": 261} {"train_loss": -8.141714096069336, "global_step": 43998, "epoch": 261} {"train_loss": -8.187508583068848, "global_step": 43999, "epoch": 261} {"train_loss": -8.022419929504395, "global_step": 44000, "epoch": 261} {"train_loss": -8.17629623413086, "global_step": 44001, "epoch": 261} {"train_loss": -7.9440016746521, "global_step": 44002, "epoch": 261} {"train_loss": -8.170455932617188, "global_step": 44003, "epoch": 261} {"train_loss": -8.099014282226562, "global_step": 44004, "epoch": 261} {"train_loss": -8.002671241760254, "global_step": 44005, "epoch": 261} {"train_loss": -8.071866989135742, "global_step": 44006, "epoch": 261} {"train_loss": -8.240251541137695, "global_step": 44007, "epoch": 261} {"train_loss": -8.062012672424316, "global_step": 44008, "epoch": 261} {"train_loss": -8.315282821655273, "global_step": 44009, "epoch": 261} {"train_loss": -8.056720733642578, "global_step": 44010, "epoch": 261} {"train_loss": -8.191999435424805, "global_step": 44011, "epoch": 261} {"train_loss": -8.07590103149414, "global_step": 44012, "epoch": 261} {"train_loss": -8.28615951538086, "global_step": 44013, "epoch": 261} {"train_loss": -7.841395378112793, "global_step": 44014, "epoch": 261} {"train_loss": -8.091215718360175, "global_step": 44015, "epoch": 261, "val_loss": 189190.9375} {"train_loss": -8.178455352783203, "global_step": 44016, "epoch": 262} {"train_loss": -8.209470748901367, "global_step": 44017, "epoch": 262} {"train_loss": -8.059671401977539, "global_step": 44018, "epoch": 262} {"train_loss": -7.696371078491211, "global_step": 44019, "epoch": 262} {"train_loss": -8.060227394104004, "global_step": 44020, "epoch": 262} {"train_loss": -8.083185195922852, "global_step": 44021, "epoch": 262} {"train_loss": -8.212076187133789, "global_step": 44022, "epoch": 262} {"train_loss": -8.219599723815918, "global_step": 44023, "epoch": 262} {"train_loss": -8.276415824890137, "global_step": 44024, "epoch": 262} {"train_loss": -8.140445709228516, "global_step": 44025, "epoch": 262} {"train_loss": -8.043306350708008, "global_step": 44026, "epoch": 262} {"train_loss": -8.299915313720703, "global_step": 44027, "epoch": 262} {"train_loss": -8.078239440917969, "global_step": 44028, "epoch": 262} {"train_loss": -8.21207046508789, "global_step": 44029, "epoch": 262} {"train_loss": -8.199712753295898, "global_step": 44030, "epoch": 262} {"train_loss": -8.012131690979004, "global_step": 44031, "epoch": 262} {"train_loss": -7.960273265838623, "global_step": 44032, "epoch": 262} {"train_loss": -8.098138809204102, "global_step": 44033, "epoch": 262} {"train_loss": -8.148730278015137, "global_step": 44034, "epoch": 262} {"train_loss": -8.23355484008789, "global_step": 44035, "epoch": 262} {"train_loss": -8.109498977661133, "global_step": 44036, "epoch": 262} {"train_loss": -8.003158569335938, "global_step": 44037, "epoch": 262} {"train_loss": -8.119853019714355, "global_step": 44038, "epoch": 262} {"train_loss": -8.120553016662598, "global_step": 44039, "epoch": 262} {"train_loss": -8.158628463745117, "global_step": 44040, "epoch": 262} {"train_loss": -8.074483871459961, "global_step": 44041, "epoch": 262} {"train_loss": -8.19028091430664, "global_step": 44042, "epoch": 262} {"train_loss": -8.186681747436523, "global_step": 44043, "epoch": 262} {"train_loss": -8.03380298614502, "global_step": 44044, "epoch": 262} {"train_loss": -8.175477981567383, "global_step": 44045, "epoch": 262} {"train_loss": -7.93352746963501, "global_step": 44046, "epoch": 262} {"train_loss": -8.070266723632812, "global_step": 44047, "epoch": 262} {"train_loss": -7.90374231338501, "global_step": 44048, "epoch": 262} {"train_loss": -8.02157974243164, "global_step": 44049, "epoch": 262} {"train_loss": -8.090287208557129, "global_step": 44050, "epoch": 262} {"train_loss": -7.8615617752075195, "global_step": 44051, "epoch": 262} {"train_loss": -8.034188270568848, "global_step": 44052, "epoch": 262} {"train_loss": -7.960501670837402, "global_step": 44053, "epoch": 262} {"train_loss": -8.046632766723633, "global_step": 44054, "epoch": 262} {"train_loss": -8.046187400817871, "global_step": 44055, "epoch": 262} {"train_loss": -8.045571327209473, "global_step": 44056, "epoch": 262} {"train_loss": -8.043495178222656, "global_step": 44057, "epoch": 262} {"train_loss": -7.72224235534668, "global_step": 44058, "epoch": 262} {"train_loss": -7.968620300292969, "global_step": 44059, "epoch": 262} {"train_loss": -7.842646598815918, "global_step": 44060, "epoch": 262} {"train_loss": -7.992417335510254, "global_step": 44061, "epoch": 262} {"train_loss": -7.801649570465088, "global_step": 44062, "epoch": 262} {"train_loss": -7.914633750915527, "global_step": 44063, "epoch": 262} {"train_loss": -7.384570121765137, "global_step": 44064, "epoch": 262} {"train_loss": -7.817868709564209, "global_step": 44065, "epoch": 262} {"train_loss": -7.639032363891602, "global_step": 44066, "epoch": 262} {"train_loss": -7.84354305267334, "global_step": 44067, "epoch": 262} {"train_loss": -7.736108779907227, "global_step": 44068, "epoch": 262} {"train_loss": -7.75711727142334, "global_step": 44069, "epoch": 262} {"train_loss": -7.975461959838867, "global_step": 44070, "epoch": 262} {"train_loss": -8.062276840209961, "global_step": 44071, "epoch": 262} {"train_loss": -7.789043426513672, "global_step": 44072, "epoch": 262} {"train_loss": -7.846035957336426, "global_step": 44073, "epoch": 262} {"train_loss": -8.04275131225586, "global_step": 44074, "epoch": 262} {"train_loss": -7.989063739776611, "global_step": 44075, "epoch": 262} {"train_loss": -8.061266899108887, "global_step": 44076, "epoch": 262} {"train_loss": -8.063543319702148, "global_step": 44077, "epoch": 262} {"train_loss": -7.999936103820801, "global_step": 44078, "epoch": 262} {"train_loss": -7.92609977722168, "global_step": 44079, "epoch": 262} {"train_loss": -8.099660873413086, "global_step": 44080, "epoch": 262} {"train_loss": -8.135611534118652, "global_step": 44081, "epoch": 262} {"train_loss": -7.817262649536133, "global_step": 44082, "epoch": 262} {"train_loss": -8.329574584960938, "global_step": 44083, "epoch": 262} {"train_loss": -7.995181083679199, "global_step": 44084, "epoch": 262} {"train_loss": -8.176456451416016, "global_step": 44085, "epoch": 262} {"train_loss": -8.090161323547363, "global_step": 44086, "epoch": 262} {"train_loss": -8.134374618530273, "global_step": 44087, "epoch": 262} {"train_loss": -8.068376541137695, "global_step": 44088, "epoch": 262} {"train_loss": -8.012598991394043, "global_step": 44089, "epoch": 262} {"train_loss": -8.040546417236328, "global_step": 44090, "epoch": 262} {"train_loss": -8.262413024902344, "global_step": 44091, "epoch": 262} {"train_loss": -8.186418533325195, "global_step": 44092, "epoch": 262} {"train_loss": -8.305390357971191, "global_step": 44093, "epoch": 262} {"train_loss": -8.213607788085938, "global_step": 44094, "epoch": 262} {"train_loss": -8.228081703186035, "global_step": 44095, "epoch": 262} {"train_loss": -7.951040267944336, "global_step": 44096, "epoch": 262} {"train_loss": -8.403909683227539, "global_step": 44097, "epoch": 262} {"train_loss": -8.316730499267578, "global_step": 44098, "epoch": 262} {"train_loss": -8.259291648864746, "global_step": 44099, "epoch": 262} {"train_loss": -8.409690856933594, "global_step": 44100, "epoch": 262} {"train_loss": -8.470625877380371, "global_step": 44101, "epoch": 262} {"train_loss": -7.935903549194336, "global_step": 44102, "epoch": 262} {"train_loss": -8.357126235961914, "global_step": 44103, "epoch": 262} {"train_loss": -8.041601181030273, "global_step": 44104, "epoch": 262} {"train_loss": -8.266559600830078, "global_step": 44105, "epoch": 262} {"train_loss": -8.267570495605469, "global_step": 44106, "epoch": 262} {"train_loss": -8.327924728393555, "global_step": 44107, "epoch": 262} {"train_loss": -8.156457901000977, "global_step": 44108, "epoch": 262} {"train_loss": -8.106922149658203, "global_step": 44109, "epoch": 262} {"train_loss": -8.198936462402344, "global_step": 44110, "epoch": 262} {"train_loss": -7.869690418243408, "global_step": 44111, "epoch": 262} {"train_loss": -8.234063148498535, "global_step": 44112, "epoch": 262} {"train_loss": -8.138635635375977, "global_step": 44113, "epoch": 262} {"train_loss": -8.000408172607422, "global_step": 44114, "epoch": 262} {"train_loss": -8.215202331542969, "global_step": 44115, "epoch": 262} {"train_loss": -8.414627075195312, "global_step": 44116, "epoch": 262} {"train_loss": -8.124247550964355, "global_step": 44117, "epoch": 262} {"train_loss": -8.215206146240234, "global_step": 44118, "epoch": 262} {"train_loss": -8.331087112426758, "global_step": 44119, "epoch": 262} {"train_loss": -7.856292724609375, "global_step": 44120, "epoch": 262} {"train_loss": -8.054903030395508, "global_step": 44121, "epoch": 262} {"train_loss": -8.170694351196289, "global_step": 44122, "epoch": 262} {"train_loss": -8.285530090332031, "global_step": 44123, "epoch": 262} {"train_loss": -8.081677436828613, "global_step": 44124, "epoch": 262} {"train_loss": -8.169746398925781, "global_step": 44125, "epoch": 262} {"train_loss": -8.088566780090332, "global_step": 44126, "epoch": 262} {"train_loss": -7.907935619354248, "global_step": 44127, "epoch": 262} {"train_loss": -7.958976745605469, "global_step": 44128, "epoch": 262} {"train_loss": -8.237940788269043, "global_step": 44129, "epoch": 262} {"train_loss": -8.063714027404785, "global_step": 44130, "epoch": 262} {"train_loss": -8.202049255371094, "global_step": 44131, "epoch": 262} {"train_loss": -8.172308921813965, "global_step": 44132, "epoch": 262} {"train_loss": -8.192327499389648, "global_step": 44133, "epoch": 262} {"train_loss": -8.131612777709961, "global_step": 44134, "epoch": 262} {"train_loss": -8.12496566772461, "global_step": 44135, "epoch": 262} {"train_loss": -7.891515731811523, "global_step": 44136, "epoch": 262} {"train_loss": -8.138521194458008, "global_step": 44137, "epoch": 262} {"train_loss": -8.302727699279785, "global_step": 44138, "epoch": 262} {"train_loss": -8.055776596069336, "global_step": 44139, "epoch": 262} {"train_loss": -8.115043640136719, "global_step": 44140, "epoch": 262} {"train_loss": -8.253320693969727, "global_step": 44141, "epoch": 262} {"train_loss": -8.136494636535645, "global_step": 44142, "epoch": 262} {"train_loss": -8.122383117675781, "global_step": 44143, "epoch": 262} {"train_loss": -8.144256591796875, "global_step": 44144, "epoch": 262} {"train_loss": -8.18375015258789, "global_step": 44145, "epoch": 262} {"train_loss": -8.040470123291016, "global_step": 44146, "epoch": 262} {"train_loss": -8.216463088989258, "global_step": 44147, "epoch": 262} {"train_loss": -8.060480117797852, "global_step": 44148, "epoch": 262} {"train_loss": -8.05455207824707, "global_step": 44149, "epoch": 262} {"train_loss": -8.254914283752441, "global_step": 44150, "epoch": 262} {"train_loss": -8.074990272521973, "global_step": 44151, "epoch": 262} {"train_loss": -7.991405487060547, "global_step": 44152, "epoch": 262} {"train_loss": -8.068644523620605, "global_step": 44153, "epoch": 262} {"train_loss": -8.2124662399292, "global_step": 44154, "epoch": 262} {"train_loss": -7.985347270965576, "global_step": 44155, "epoch": 262} {"train_loss": -7.849894046783447, "global_step": 44156, "epoch": 262} {"train_loss": -8.141743659973145, "global_step": 44157, "epoch": 262} {"train_loss": -8.054214477539062, "global_step": 44158, "epoch": 262} {"train_loss": -7.893463134765625, "global_step": 44159, "epoch": 262} {"train_loss": -8.036754608154297, "global_step": 44160, "epoch": 262} {"train_loss": -7.77601957321167, "global_step": 44161, "epoch": 262} {"train_loss": -7.907900333404541, "global_step": 44162, "epoch": 262} {"train_loss": -7.963803291320801, "global_step": 44163, "epoch": 262} {"train_loss": -7.908093452453613, "global_step": 44164, "epoch": 262} {"train_loss": -7.9023332595825195, "global_step": 44165, "epoch": 262} {"train_loss": -7.979406356811523, "global_step": 44166, "epoch": 262} {"train_loss": -7.863463401794434, "global_step": 44167, "epoch": 262} {"train_loss": -8.034965515136719, "global_step": 44168, "epoch": 262} {"train_loss": -8.094550132751465, "global_step": 44169, "epoch": 262} {"train_loss": -8.010784149169922, "global_step": 44170, "epoch": 262} {"train_loss": -8.173245429992676, "global_step": 44171, "epoch": 262} {"train_loss": -8.090034484863281, "global_step": 44172, "epoch": 262} {"train_loss": -8.357458114624023, "global_step": 44173, "epoch": 262} {"train_loss": -7.915376663208008, "global_step": 44174, "epoch": 262} {"train_loss": -8.071405410766602, "global_step": 44175, "epoch": 262} {"train_loss": -7.802505016326904, "global_step": 44176, "epoch": 262} {"train_loss": -8.106452941894531, "global_step": 44177, "epoch": 262} {"train_loss": -8.189441680908203, "global_step": 44178, "epoch": 262} {"train_loss": -8.021692276000977, "global_step": 44179, "epoch": 262} {"train_loss": -8.048521041870117, "global_step": 44180, "epoch": 262} {"train_loss": -8.439416885375977, "global_step": 44181, "epoch": 262} {"train_loss": -8.221445083618164, "global_step": 44182, "epoch": 262} {"train_loss": -8.077686102617355, "global_step": 44183, "epoch": 262, "val_loss": 185344.859375} {"train_loss": -8.057860374450684, "global_step": 44184, "epoch": 263} {"train_loss": -8.196405410766602, "global_step": 44185, "epoch": 263} {"train_loss": -8.075199127197266, "global_step": 44186, "epoch": 263} {"train_loss": -8.12337589263916, "global_step": 44187, "epoch": 263} {"train_loss": -8.264945983886719, "global_step": 44188, "epoch": 263} {"train_loss": -8.263784408569336, "global_step": 44189, "epoch": 263} {"train_loss": -7.947192192077637, "global_step": 44190, "epoch": 263} {"train_loss": -8.185215950012207, "global_step": 44191, "epoch": 263} {"train_loss": -8.115046501159668, "global_step": 44192, "epoch": 263} {"train_loss": -8.143027305603027, "global_step": 44193, "epoch": 263} {"train_loss": -7.925255298614502, "global_step": 44194, "epoch": 263} {"train_loss": -8.091955184936523, "global_step": 44195, "epoch": 263} {"train_loss": -8.229561805725098, "global_step": 44196, "epoch": 263} {"train_loss": -8.079782485961914, "global_step": 44197, "epoch": 263} {"train_loss": -8.222916603088379, "global_step": 44198, "epoch": 263} {"train_loss": -7.9352593421936035, "global_step": 44199, "epoch": 263} {"train_loss": -8.127670288085938, "global_step": 44200, "epoch": 263} {"train_loss": -8.210559844970703, "global_step": 44201, "epoch": 263} {"train_loss": -8.156597137451172, "global_step": 44202, "epoch": 263} {"train_loss": -8.341290473937988, "global_step": 44203, "epoch": 263} {"train_loss": -8.423675537109375, "global_step": 44204, "epoch": 263} {"train_loss": -8.342555046081543, "global_step": 44205, "epoch": 263} {"train_loss": -8.300762176513672, "global_step": 44206, "epoch": 263} {"train_loss": -8.198205947875977, "global_step": 44207, "epoch": 263} {"train_loss": -8.166749954223633, "global_step": 44208, "epoch": 263} {"train_loss": -8.130722045898438, "global_step": 44209, "epoch": 263} {"train_loss": -8.217992782592773, "global_step": 44210, "epoch": 263} {"train_loss": -8.198970794677734, "global_step": 44211, "epoch": 263} {"train_loss": -8.12209701538086, "global_step": 44212, "epoch": 263} {"train_loss": -8.100282669067383, "global_step": 44213, "epoch": 263} {"train_loss": -8.299885749816895, "global_step": 44214, "epoch": 263} {"train_loss": -8.255426406860352, "global_step": 44215, "epoch": 263} {"train_loss": -8.152626037597656, "global_step": 44216, "epoch": 263} {"train_loss": -8.152166366577148, "global_step": 44217, "epoch": 263} {"train_loss": -8.074942588806152, "global_step": 44218, "epoch": 263} {"train_loss": -8.205694198608398, "global_step": 44219, "epoch": 263} {"train_loss": -8.182376861572266, "global_step": 44220, "epoch": 263} {"train_loss": -7.965737342834473, "global_step": 44221, "epoch": 263} {"train_loss": -8.310114860534668, "global_step": 44222, "epoch": 263} {"train_loss": -8.039340019226074, "global_step": 44223, "epoch": 263} {"train_loss": -8.302056312561035, "global_step": 44224, "epoch": 263} {"train_loss": -8.094472885131836, "global_step": 44225, "epoch": 263} {"train_loss": -7.787813186645508, "global_step": 44226, "epoch": 263} {"train_loss": -8.195218086242676, "global_step": 44227, "epoch": 263} {"train_loss": -8.210342407226562, "global_step": 44228, "epoch": 263} {"train_loss": -8.138409614562988, "global_step": 44229, "epoch": 263} {"train_loss": -7.982619285583496, "global_step": 44230, "epoch": 263} {"train_loss": -8.236837387084961, "global_step": 44231, "epoch": 263} {"train_loss": -8.122140884399414, "global_step": 44232, "epoch": 263} {"train_loss": -8.330076217651367, "global_step": 44233, "epoch": 263} {"train_loss": -8.031216621398926, "global_step": 44234, "epoch": 263} {"train_loss": -8.016033172607422, "global_step": 44235, "epoch": 263} {"train_loss": -8.098175048828125, "global_step": 44236, "epoch": 263} {"train_loss": -8.268224716186523, "global_step": 44237, "epoch": 263} {"train_loss": -8.121232032775879, "global_step": 44238, "epoch": 263} {"train_loss": -8.29298210144043, "global_step": 44239, "epoch": 263} {"train_loss": -7.996922969818115, "global_step": 44240, "epoch": 263} {"train_loss": -8.282207489013672, "global_step": 44241, "epoch": 263} {"train_loss": -8.054168701171875, "global_step": 44242, "epoch": 263} {"train_loss": -8.311324119567871, "global_step": 44243, "epoch": 263} {"train_loss": -8.10060977935791, "global_step": 44244, "epoch": 263} {"train_loss": -8.32294750213623, "global_step": 44245, "epoch": 263} {"train_loss": -7.964055061340332, "global_step": 44246, "epoch": 263} {"train_loss": -8.159215927124023, "global_step": 44247, "epoch": 263} {"train_loss": -7.88417911529541, "global_step": 44248, "epoch": 263} {"train_loss": -7.968333721160889, "global_step": 44249, "epoch": 263} {"train_loss": -8.18824577331543, "global_step": 44250, "epoch": 263} {"train_loss": -8.25838851928711, "global_step": 44251, "epoch": 263} {"train_loss": -8.30569839477539, "global_step": 44252, "epoch": 263} {"train_loss": -8.311415672302246, "global_step": 44253, "epoch": 263} {"train_loss": -8.096010208129883, "global_step": 44254, "epoch": 263} {"train_loss": -8.326604843139648, "global_step": 44255, "epoch": 263} {"train_loss": -7.9256672859191895, "global_step": 44256, "epoch": 263} {"train_loss": -8.094087600708008, "global_step": 44257, "epoch": 263} {"train_loss": -7.965257167816162, "global_step": 44258, "epoch": 263} {"train_loss": -8.14405345916748, "global_step": 44259, "epoch": 263} {"train_loss": -7.992981910705566, "global_step": 44260, "epoch": 263} {"train_loss": -8.169189453125, "global_step": 44261, "epoch": 263} {"train_loss": -8.060089111328125, "global_step": 44262, "epoch": 263} {"train_loss": -7.969634532928467, "global_step": 44263, "epoch": 263} {"train_loss": -7.952276229858398, "global_step": 44264, "epoch": 263} {"train_loss": -7.927099227905273, "global_step": 44265, "epoch": 263} {"train_loss": -8.162683486938477, "global_step": 44266, "epoch": 263} {"train_loss": -7.914702415466309, "global_step": 44267, "epoch": 263} {"train_loss": -8.065122604370117, "global_step": 44268, "epoch": 263} {"train_loss": -7.918482780456543, "global_step": 44269, "epoch": 263} {"train_loss": -7.89651346206665, "global_step": 44270, "epoch": 263} {"train_loss": -7.910595417022705, "global_step": 44271, "epoch": 263} {"train_loss": -8.205055236816406, "global_step": 44272, "epoch": 263} {"train_loss": -8.173711776733398, "global_step": 44273, "epoch": 263} {"train_loss": -8.083284378051758, "global_step": 44274, "epoch": 263} {"train_loss": -7.949289798736572, "global_step": 44275, "epoch": 263} {"train_loss": -7.95817756652832, "global_step": 44276, "epoch": 263} {"train_loss": -8.096181869506836, "global_step": 44277, "epoch": 263} {"train_loss": -8.261678695678711, "global_step": 44278, "epoch": 263} {"train_loss": -8.171802520751953, "global_step": 44279, "epoch": 263} {"train_loss": -7.843700408935547, "global_step": 44280, "epoch": 263} {"train_loss": -8.14743423461914, "global_step": 44281, "epoch": 263} {"train_loss": -7.969002723693848, "global_step": 44282, "epoch": 263} {"train_loss": -8.375870704650879, "global_step": 44283, "epoch": 263} {"train_loss": -8.087271690368652, "global_step": 44284, "epoch": 263} {"train_loss": -8.232564926147461, "global_step": 44285, "epoch": 263} {"train_loss": -8.123076438903809, "global_step": 44286, "epoch": 263} {"train_loss": -8.133405685424805, "global_step": 44287, "epoch": 263} {"train_loss": -8.272563934326172, "global_step": 44288, "epoch": 263} {"train_loss": -8.392953872680664, "global_step": 44289, "epoch": 263} {"train_loss": -7.946549415588379, "global_step": 44290, "epoch": 263} {"train_loss": -8.316402435302734, "global_step": 44291, "epoch": 263} {"train_loss": -8.083602905273438, "global_step": 44292, "epoch": 263} {"train_loss": -8.132627487182617, "global_step": 44293, "epoch": 263} {"train_loss": -8.127131462097168, "global_step": 44294, "epoch": 263} {"train_loss": -8.216732025146484, "global_step": 44295, "epoch": 263} {"train_loss": -7.928877830505371, "global_step": 44296, "epoch": 263} {"train_loss": -7.9614715576171875, "global_step": 44297, "epoch": 263} {"train_loss": -7.829767227172852, "global_step": 44298, "epoch": 263} {"train_loss": -7.949798107147217, "global_step": 44299, "epoch": 263} {"train_loss": -8.064835548400879, "global_step": 44300, "epoch": 263} {"train_loss": -8.0518217086792, "global_step": 44301, "epoch": 263} {"train_loss": -7.991720676422119, "global_step": 44302, "epoch": 263} {"train_loss": -8.131745338439941, "global_step": 44303, "epoch": 263} {"train_loss": -8.055999755859375, "global_step": 44304, "epoch": 263} {"train_loss": -8.000287055969238, "global_step": 44305, "epoch": 263} {"train_loss": -7.922520637512207, "global_step": 44306, "epoch": 263} {"train_loss": -8.198898315429688, "global_step": 44307, "epoch": 263} {"train_loss": -7.914312839508057, "global_step": 44308, "epoch": 263} {"train_loss": -8.175046920776367, "global_step": 44309, "epoch": 263} {"train_loss": -7.834547996520996, "global_step": 44310, "epoch": 263} {"train_loss": -8.084172248840332, "global_step": 44311, "epoch": 263} {"train_loss": -7.967790126800537, "global_step": 44312, "epoch": 263} {"train_loss": -8.080554962158203, "global_step": 44313, "epoch": 263} {"train_loss": -7.899846076965332, "global_step": 44314, "epoch": 263} {"train_loss": -8.284133911132812, "global_step": 44315, "epoch": 263} {"train_loss": -8.002677917480469, "global_step": 44316, "epoch": 263} {"train_loss": -8.050219535827637, "global_step": 44317, "epoch": 263} {"train_loss": -8.202388763427734, "global_step": 44318, "epoch": 263} {"train_loss": -8.126946449279785, "global_step": 44319, "epoch": 263} {"train_loss": -8.155954360961914, "global_step": 44320, "epoch": 263} {"train_loss": -8.255172729492188, "global_step": 44321, "epoch": 263} {"train_loss": -8.332189559936523, "global_step": 44322, "epoch": 263} {"train_loss": -8.089287757873535, "global_step": 44323, "epoch": 263} {"train_loss": -8.228797912597656, "global_step": 44324, "epoch": 263} {"train_loss": -8.244548797607422, "global_step": 44325, "epoch": 263} {"train_loss": -8.21811294555664, "global_step": 44326, "epoch": 263} {"train_loss": -7.874358177185059, "global_step": 44327, "epoch": 263} {"train_loss": -8.097465515136719, "global_step": 44328, "epoch": 263} {"train_loss": -8.227692604064941, "global_step": 44329, "epoch": 263} {"train_loss": -8.318155288696289, "global_step": 44330, "epoch": 263} {"train_loss": -8.098938941955566, "global_step": 44331, "epoch": 263} {"train_loss": -8.124272346496582, "global_step": 44332, "epoch": 263} {"train_loss": -8.435477256774902, "global_step": 44333, "epoch": 263} {"train_loss": -8.301192283630371, "global_step": 44334, "epoch": 263} {"train_loss": -8.267574310302734, "global_step": 44335, "epoch": 263} {"train_loss": -8.15115737915039, "global_step": 44336, "epoch": 263} {"train_loss": -8.203543663024902, "global_step": 44337, "epoch": 263} {"train_loss": -7.888379096984863, "global_step": 44338, "epoch": 263} {"train_loss": -8.160306930541992, "global_step": 44339, "epoch": 263} {"train_loss": -8.095017433166504, "global_step": 44340, "epoch": 263} {"train_loss": -8.102266311645508, "global_step": 44341, "epoch": 263} {"train_loss": -7.953129768371582, "global_step": 44342, "epoch": 263} {"train_loss": -8.028005599975586, "global_step": 44343, "epoch": 263} {"train_loss": -7.987371444702148, "global_step": 44344, "epoch": 263} {"train_loss": -7.9699506759643555, "global_step": 44345, "epoch": 263} {"train_loss": -8.159113883972168, "global_step": 44346, "epoch": 263} {"train_loss": -7.83500862121582, "global_step": 44347, "epoch": 263} {"train_loss": -7.764285087585449, "global_step": 44348, "epoch": 263} {"train_loss": -7.951928615570068, "global_step": 44349, "epoch": 263} {"train_loss": -7.613804817199707, "global_step": 44350, "epoch": 263} {"train_loss": -8.110738371099744, "global_step": 44351, "epoch": 263, "val_loss": 185974.125} {"train_loss": -7.613639831542969, "global_step": 44352, "epoch": 264} {"train_loss": -8.090194702148438, "global_step": 44353, "epoch": 264} {"train_loss": -7.907436847686768, "global_step": 44354, "epoch": 264} {"train_loss": -8.044504165649414, "global_step": 44355, "epoch": 264} {"train_loss": -7.967806816101074, "global_step": 44356, "epoch": 264} {"train_loss": -7.953000545501709, "global_step": 44357, "epoch": 264} {"train_loss": -8.10476303100586, "global_step": 44358, "epoch": 264} {"train_loss": -8.02341365814209, "global_step": 44359, "epoch": 264} {"train_loss": -8.15740966796875, "global_step": 44360, "epoch": 264} {"train_loss": -7.954964637756348, "global_step": 44361, "epoch": 264} {"train_loss": -8.029718399047852, "global_step": 44362, "epoch": 264} {"train_loss": -7.938540935516357, "global_step": 44363, "epoch": 264} {"train_loss": -8.093748092651367, "global_step": 44364, "epoch": 264} {"train_loss": -8.124540328979492, "global_step": 44365, "epoch": 264} {"train_loss": -8.266956329345703, "global_step": 44366, "epoch": 264} {"train_loss": -8.034768104553223, "global_step": 44367, "epoch": 264} {"train_loss": -8.304930686950684, "global_step": 44368, "epoch": 264} {"train_loss": -8.133995056152344, "global_step": 44369, "epoch": 264} {"train_loss": -8.329644203186035, "global_step": 44370, "epoch": 264} {"train_loss": -8.26156997680664, "global_step": 44371, "epoch": 264} {"train_loss": -8.240612030029297, "global_step": 44372, "epoch": 264} {"train_loss": -8.123244285583496, "global_step": 44373, "epoch": 264} {"train_loss": -8.046443939208984, "global_step": 44374, "epoch": 264} {"train_loss": -8.170347213745117, "global_step": 44375, "epoch": 264} {"train_loss": -8.118904113769531, "global_step": 44376, "epoch": 264} {"train_loss": -8.022783279418945, "global_step": 44377, "epoch": 264} {"train_loss": -8.094958305358887, "global_step": 44378, "epoch": 264} {"train_loss": -7.92741584777832, "global_step": 44379, "epoch": 264} {"train_loss": -7.9875054359436035, "global_step": 44380, "epoch": 264} {"train_loss": -8.149393081665039, "global_step": 44381, "epoch": 264} {"train_loss": -8.123397827148438, "global_step": 44382, "epoch": 264} {"train_loss": -8.167943954467773, "global_step": 44383, "epoch": 264} {"train_loss": -8.026251792907715, "global_step": 44384, "epoch": 264} {"train_loss": -8.041421890258789, "global_step": 44385, "epoch": 264} {"train_loss": -7.839439392089844, "global_step": 44386, "epoch": 264} {"train_loss": -8.05418872833252, "global_step": 44387, "epoch": 264} {"train_loss": -8.171730995178223, "global_step": 44388, "epoch": 264} {"train_loss": -7.899374008178711, "global_step": 44389, "epoch": 264} {"train_loss": -7.980898380279541, "global_step": 44390, "epoch": 264} {"train_loss": -7.90778923034668, "global_step": 44391, "epoch": 264} {"train_loss": -8.099265098571777, "global_step": 44392, "epoch": 264} {"train_loss": -8.021963119506836, "global_step": 44393, "epoch": 264} {"train_loss": -8.04730224609375, "global_step": 44394, "epoch": 264} {"train_loss": -8.045366287231445, "global_step": 44395, "epoch": 264} {"train_loss": -8.12584114074707, "global_step": 44396, "epoch": 264} {"train_loss": -8.16668701171875, "global_step": 44397, "epoch": 264} {"train_loss": -8.20345687866211, "global_step": 44398, "epoch": 264} {"train_loss": -8.066421508789062, "global_step": 44399, "epoch": 264} {"train_loss": -8.190824508666992, "global_step": 44400, "epoch": 264} {"train_loss": -8.232365608215332, "global_step": 44401, "epoch": 264} {"train_loss": -8.021080017089844, "global_step": 44402, "epoch": 264} {"train_loss": -7.922578811645508, "global_step": 44403, "epoch": 264} {"train_loss": -8.064552307128906, "global_step": 44404, "epoch": 264} {"train_loss": -8.05637264251709, "global_step": 44405, "epoch": 264} {"train_loss": -8.23800277709961, "global_step": 44406, "epoch": 264} {"train_loss": -8.098912239074707, "global_step": 44407, "epoch": 264} {"train_loss": -8.122808456420898, "global_step": 44408, "epoch": 264} {"train_loss": -8.16395092010498, "global_step": 44409, "epoch": 264} {"train_loss": -8.275081634521484, "global_step": 44410, "epoch": 264} {"train_loss": -8.170127868652344, "global_step": 44411, "epoch": 264} {"train_loss": -8.225445747375488, "global_step": 44412, "epoch": 264} {"train_loss": -8.111759185791016, "global_step": 44413, "epoch": 264} {"train_loss": -7.98526668548584, "global_step": 44414, "epoch": 264} {"train_loss": -8.225359916687012, "global_step": 44415, "epoch": 264} {"train_loss": -7.933108329772949, "global_step": 44416, "epoch": 264} {"train_loss": -8.109317779541016, "global_step": 44417, "epoch": 264} {"train_loss": -8.137986183166504, "global_step": 44418, "epoch": 264} {"train_loss": -8.347454071044922, "global_step": 44419, "epoch": 264} {"train_loss": -8.12239933013916, "global_step": 44420, "epoch": 264} {"train_loss": -8.225473403930664, "global_step": 44421, "epoch": 264} {"train_loss": -8.171926498413086, "global_step": 44422, "epoch": 264} {"train_loss": -8.183728218078613, "global_step": 44423, "epoch": 264} {"train_loss": -8.27842903137207, "global_step": 44424, "epoch": 264} {"train_loss": -8.05224609375, "global_step": 44425, "epoch": 264} {"train_loss": -8.123018264770508, "global_step": 44426, "epoch": 264} {"train_loss": -7.967369556427002, "global_step": 44427, "epoch": 264} {"train_loss": -8.192455291748047, "global_step": 44428, "epoch": 264} {"train_loss": -8.222183227539062, "global_step": 44429, "epoch": 264} {"train_loss": -8.126943588256836, "global_step": 44430, "epoch": 264} {"train_loss": -8.006189346313477, "global_step": 44431, "epoch": 264} {"train_loss": -8.070283889770508, "global_step": 44432, "epoch": 264} {"train_loss": -8.123151779174805, "global_step": 44433, "epoch": 264} {"train_loss": -8.053529739379883, "global_step": 44434, "epoch": 264} {"train_loss": -8.201818466186523, "global_step": 44435, "epoch": 264} {"train_loss": -8.268006324768066, "global_step": 44436, "epoch": 264} {"train_loss": -8.001176834106445, "global_step": 44437, "epoch": 264} {"train_loss": -7.849810600280762, "global_step": 44438, "epoch": 264} {"train_loss": -8.078064918518066, "global_step": 44439, "epoch": 264} {"train_loss": -7.969003677368164, "global_step": 44440, "epoch": 264} {"train_loss": -8.072843551635742, "global_step": 44441, "epoch": 264} {"train_loss": -7.875925064086914, "global_step": 44442, "epoch": 264} {"train_loss": -7.902697563171387, "global_step": 44443, "epoch": 264} {"train_loss": -7.827953338623047, "global_step": 44444, "epoch": 264} {"train_loss": -8.06760025024414, "global_step": 44445, "epoch": 264} {"train_loss": -8.152767181396484, "global_step": 44446, "epoch": 264} {"train_loss": -7.840599060058594, "global_step": 44447, "epoch": 264} {"train_loss": -8.180282592773438, "global_step": 44448, "epoch": 264} {"train_loss": -8.088233947753906, "global_step": 44449, "epoch": 264} {"train_loss": -8.127965927124023, "global_step": 44450, "epoch": 264} {"train_loss": -8.13458251953125, "global_step": 44451, "epoch": 264} {"train_loss": -7.985370635986328, "global_step": 44452, "epoch": 264} {"train_loss": -8.19126033782959, "global_step": 44453, "epoch": 264} {"train_loss": -8.31668472290039, "global_step": 44454, "epoch": 264} {"train_loss": -8.043390274047852, "global_step": 44455, "epoch": 264} {"train_loss": -8.022945404052734, "global_step": 44456, "epoch": 264} {"train_loss": -8.25381088256836, "global_step": 44457, "epoch": 264} {"train_loss": -7.963188171386719, "global_step": 44458, "epoch": 264} {"train_loss": -8.122108459472656, "global_step": 44459, "epoch": 264} {"train_loss": -8.217488288879395, "global_step": 44460, "epoch": 264} {"train_loss": -7.952042579650879, "global_step": 44461, "epoch": 264} {"train_loss": -7.945855617523193, "global_step": 44462, "epoch": 264} {"train_loss": -8.176856994628906, "global_step": 44463, "epoch": 264} {"train_loss": -8.077369689941406, "global_step": 44464, "epoch": 264} {"train_loss": -8.33454704284668, "global_step": 44465, "epoch": 264} {"train_loss": -7.878256797790527, "global_step": 44466, "epoch": 264} {"train_loss": -7.960556507110596, "global_step": 44467, "epoch": 264} {"train_loss": -8.268637657165527, "global_step": 44468, "epoch": 264} {"train_loss": -7.878482818603516, "global_step": 44469, "epoch": 264} {"train_loss": -7.886637210845947, "global_step": 44470, "epoch": 264} {"train_loss": -7.792716026306152, "global_step": 44471, "epoch": 264} {"train_loss": -7.623857498168945, "global_step": 44472, "epoch": 264} {"train_loss": -7.74321985244751, "global_step": 44473, "epoch": 264} {"train_loss": -7.914338111877441, "global_step": 44474, "epoch": 264} {"train_loss": -7.7970781326293945, "global_step": 44475, "epoch": 264} {"train_loss": -7.875808238983154, "global_step": 44476, "epoch": 264} {"train_loss": -8.078200340270996, "global_step": 44477, "epoch": 264} {"train_loss": -8.124496459960938, "global_step": 44478, "epoch": 264} {"train_loss": -7.863275051116943, "global_step": 44479, "epoch": 264} {"train_loss": -8.089394569396973, "global_step": 44480, "epoch": 264} {"train_loss": -8.295934677124023, "global_step": 44481, "epoch": 264} {"train_loss": -8.162683486938477, "global_step": 44482, "epoch": 264} {"train_loss": -8.152329444885254, "global_step": 44483, "epoch": 264} {"train_loss": -8.07352066040039, "global_step": 44484, "epoch": 264} {"train_loss": -8.187682151794434, "global_step": 44485, "epoch": 264} {"train_loss": -8.085909843444824, "global_step": 44486, "epoch": 264} {"train_loss": -7.968480110168457, "global_step": 44487, "epoch": 264} {"train_loss": -8.278718948364258, "global_step": 44488, "epoch": 264} {"train_loss": -8.099135398864746, "global_step": 44489, "epoch": 264} {"train_loss": -8.024599075317383, "global_step": 44490, "epoch": 264} {"train_loss": -7.848630905151367, "global_step": 44491, "epoch": 264} {"train_loss": -8.140613555908203, "global_step": 44492, "epoch": 264} {"train_loss": -8.174747467041016, "global_step": 44493, "epoch": 264} {"train_loss": -8.055933952331543, "global_step": 44494, "epoch": 264} {"train_loss": -8.19752311706543, "global_step": 44495, "epoch": 264} {"train_loss": -8.321357727050781, "global_step": 44496, "epoch": 264} {"train_loss": -7.938769340515137, "global_step": 44497, "epoch": 264} {"train_loss": -8.052729606628418, "global_step": 44498, "epoch": 264} {"train_loss": -8.362759590148926, "global_step": 44499, "epoch": 264} {"train_loss": -8.121810913085938, "global_step": 44500, "epoch": 264} {"train_loss": -8.034133911132812, "global_step": 44501, "epoch": 264} {"train_loss": -8.287327766418457, "global_step": 44502, "epoch": 264} {"train_loss": -8.07322883605957, "global_step": 44503, "epoch": 264} {"train_loss": -8.216960906982422, "global_step": 44504, "epoch": 264} {"train_loss": -8.00281047821045, "global_step": 44505, "epoch": 264} {"train_loss": -8.28399658203125, "global_step": 44506, "epoch": 264} {"train_loss": -8.007335662841797, "global_step": 44507, "epoch": 264} {"train_loss": -7.973329544067383, "global_step": 44508, "epoch": 264} {"train_loss": -8.336271286010742, "global_step": 44509, "epoch": 264} {"train_loss": -8.142661094665527, "global_step": 44510, "epoch": 264} {"train_loss": -8.175496101379395, "global_step": 44511, "epoch": 264} {"train_loss": -8.302372932434082, "global_step": 44512, "epoch": 264} {"train_loss": -8.19089412689209, "global_step": 44513, "epoch": 264} {"train_loss": -8.148534774780273, "global_step": 44514, "epoch": 264} {"train_loss": -8.138790130615234, "global_step": 44515, "epoch": 264} {"train_loss": -8.344717025756836, "global_step": 44516, "epoch": 264} {"train_loss": -8.177082061767578, "global_step": 44517, "epoch": 264} {"train_loss": -8.141510009765625, "global_step": 44518, "epoch": 264} {"train_loss": -8.086775285857064, "global_step": 44519, "epoch": 264, "val_loss": 183990.21875} {"train_loss": -8.171333312988281, "global_step": 44520, "epoch": 265} {"train_loss": -8.272270202636719, "global_step": 44521, "epoch": 265} {"train_loss": -8.206682205200195, "global_step": 44522, "epoch": 265} {"train_loss": -8.27197551727295, "global_step": 44523, "epoch": 265} {"train_loss": -8.11332893371582, "global_step": 44524, "epoch": 265} {"train_loss": -7.762585163116455, "global_step": 44525, "epoch": 265} {"train_loss": -8.210558891296387, "global_step": 44526, "epoch": 265} {"train_loss": -7.598480224609375, "global_step": 44527, "epoch": 265} {"train_loss": -8.10794448852539, "global_step": 44528, "epoch": 265} {"train_loss": -7.9289960861206055, "global_step": 44529, "epoch": 265} {"train_loss": -8.009544372558594, "global_step": 44530, "epoch": 265} {"train_loss": -7.843365669250488, "global_step": 44531, "epoch": 265} {"train_loss": -7.95830774307251, "global_step": 44532, "epoch": 265} {"train_loss": -7.850252151489258, "global_step": 44533, "epoch": 265} {"train_loss": -7.667588233947754, "global_step": 44534, "epoch": 265} {"train_loss": -7.909183502197266, "global_step": 44535, "epoch": 265} {"train_loss": -7.863785743713379, "global_step": 44536, "epoch": 265} {"train_loss": -7.8455047607421875, "global_step": 44537, "epoch": 265} {"train_loss": -7.83564567565918, "global_step": 44538, "epoch": 265} {"train_loss": -7.590078353881836, "global_step": 44539, "epoch": 265} {"train_loss": -7.774975776672363, "global_step": 44540, "epoch": 265} {"train_loss": -7.922590255737305, "global_step": 44541, "epoch": 265} {"train_loss": -7.7703752517700195, "global_step": 44542, "epoch": 265} {"train_loss": -7.891007900238037, "global_step": 44543, "epoch": 265} {"train_loss": -7.886870384216309, "global_step": 44544, "epoch": 265} {"train_loss": -7.9673991203308105, "global_step": 44545, "epoch": 265} {"train_loss": -7.888473987579346, "global_step": 44546, "epoch": 265} {"train_loss": -7.772652626037598, "global_step": 44547, "epoch": 265} {"train_loss": -7.981781005859375, "global_step": 44548, "epoch": 265} {"train_loss": -7.825205326080322, "global_step": 44549, "epoch": 265} {"train_loss": -8.005857467651367, "global_step": 44550, "epoch": 265} {"train_loss": -7.903035640716553, "global_step": 44551, "epoch": 265} {"train_loss": -7.648831844329834, "global_step": 44552, "epoch": 265} {"train_loss": -8.12588882446289, "global_step": 44553, "epoch": 265} {"train_loss": -8.056509971618652, "global_step": 44554, "epoch": 265} {"train_loss": -8.09055233001709, "global_step": 44555, "epoch": 265} {"train_loss": -8.045366287231445, "global_step": 44556, "epoch": 265} {"train_loss": -8.277276992797852, "global_step": 44557, "epoch": 265} {"train_loss": -8.00345516204834, "global_step": 44558, "epoch": 265} {"train_loss": -8.236272811889648, "global_step": 44559, "epoch": 265} {"train_loss": -8.043313026428223, "global_step": 44560, "epoch": 265} {"train_loss": -8.293123245239258, "global_step": 44561, "epoch": 265} {"train_loss": -8.038166999816895, "global_step": 44562, "epoch": 265} {"train_loss": -8.111125946044922, "global_step": 44563, "epoch": 265} {"train_loss": -7.707438945770264, "global_step": 44564, "epoch": 265} {"train_loss": -8.287454605102539, "global_step": 44565, "epoch": 265} {"train_loss": -8.04385757446289, "global_step": 44566, "epoch": 265} {"train_loss": -8.160243034362793, "global_step": 44567, "epoch": 265} {"train_loss": -7.962422847747803, "global_step": 44568, "epoch": 265} {"train_loss": -8.023948669433594, "global_step": 44569, "epoch": 265} {"train_loss": -8.116619110107422, "global_step": 44570, "epoch": 265} {"train_loss": -7.982946872711182, "global_step": 44571, "epoch": 265} {"train_loss": -8.199971199035645, "global_step": 44572, "epoch": 265} {"train_loss": -8.148529052734375, "global_step": 44573, "epoch": 265} {"train_loss": -8.29635238647461, "global_step": 44574, "epoch": 265} {"train_loss": -8.30974006652832, "global_step": 44575, "epoch": 265} {"train_loss": -8.196687698364258, "global_step": 44576, "epoch": 265} {"train_loss": -8.237957954406738, "global_step": 44577, "epoch": 265} {"train_loss": -8.079964637756348, "global_step": 44578, "epoch": 265} {"train_loss": -8.36938762664795, "global_step": 44579, "epoch": 265} {"train_loss": -8.408889770507812, "global_step": 44580, "epoch": 265} {"train_loss": -8.511211395263672, "global_step": 44581, "epoch": 265} {"train_loss": -8.3504638671875, "global_step": 44582, "epoch": 265} {"train_loss": -8.000543594360352, "global_step": 44583, "epoch": 265} {"train_loss": -8.232024192810059, "global_step": 44584, "epoch": 265} {"train_loss": -8.12621021270752, "global_step": 44585, "epoch": 265} {"train_loss": -8.058809280395508, "global_step": 44586, "epoch": 265} {"train_loss": -8.497110366821289, "global_step": 44587, "epoch": 265} {"train_loss": -8.392033576965332, "global_step": 44588, "epoch": 265} {"train_loss": -8.209480285644531, "global_step": 44589, "epoch": 265} {"train_loss": -8.273451805114746, "global_step": 44590, "epoch": 265} {"train_loss": -8.210746765136719, "global_step": 44591, "epoch": 265} {"train_loss": -8.180961608886719, "global_step": 44592, "epoch": 265} {"train_loss": -8.014007568359375, "global_step": 44593, "epoch": 265} {"train_loss": -7.754979610443115, "global_step": 44594, "epoch": 265} {"train_loss": -7.863245010375977, "global_step": 44595, "epoch": 265} {"train_loss": -8.193245887756348, "global_step": 44596, "epoch": 265} {"train_loss": -7.952510833740234, "global_step": 44597, "epoch": 265} {"train_loss": -8.041280746459961, "global_step": 44598, "epoch": 265} {"train_loss": -7.779473304748535, "global_step": 44599, "epoch": 265} {"train_loss": -8.112760543823242, "global_step": 44600, "epoch": 265} {"train_loss": -8.068016052246094, "global_step": 44601, "epoch": 265} {"train_loss": -8.109219551086426, "global_step": 44602, "epoch": 265} {"train_loss": -7.775803565979004, "global_step": 44603, "epoch": 265} {"train_loss": -8.197735786437988, "global_step": 44604, "epoch": 265} {"train_loss": -8.062243461608887, "global_step": 44605, "epoch": 265} {"train_loss": -8.15147876739502, "global_step": 44606, "epoch": 265} {"train_loss": -7.941749095916748, "global_step": 44607, "epoch": 265} {"train_loss": -8.28773307800293, "global_step": 44608, "epoch": 265} {"train_loss": -8.007689476013184, "global_step": 44609, "epoch": 265} {"train_loss": -7.756726264953613, "global_step": 44610, "epoch": 265} {"train_loss": -8.071327209472656, "global_step": 44611, "epoch": 265} {"train_loss": -8.170433044433594, "global_step": 44612, "epoch": 265} {"train_loss": -7.912256240844727, "global_step": 44613, "epoch": 265} {"train_loss": -8.066169738769531, "global_step": 44614, "epoch": 265} {"train_loss": -8.005754470825195, "global_step": 44615, "epoch": 265} {"train_loss": -7.845348834991455, "global_step": 44616, "epoch": 265} {"train_loss": -8.28523063659668, "global_step": 44617, "epoch": 265} {"train_loss": -7.942171096801758, "global_step": 44618, "epoch": 265} {"train_loss": -8.192197799682617, "global_step": 44619, "epoch": 265} {"train_loss": -7.838676929473877, "global_step": 44620, "epoch": 265} {"train_loss": -8.035072326660156, "global_step": 44621, "epoch": 265} {"train_loss": -8.085387229919434, "global_step": 44622, "epoch": 265} {"train_loss": -7.996454238891602, "global_step": 44623, "epoch": 265} {"train_loss": -8.299796104431152, "global_step": 44624, "epoch": 265} {"train_loss": -8.033370971679688, "global_step": 44625, "epoch": 265} {"train_loss": -8.065674781799316, "global_step": 44626, "epoch": 265} {"train_loss": -7.901422500610352, "global_step": 44627, "epoch": 265} {"train_loss": -8.168252944946289, "global_step": 44628, "epoch": 265} {"train_loss": -8.031171798706055, "global_step": 44629, "epoch": 265} {"train_loss": -7.99652099609375, "global_step": 44630, "epoch": 265} {"train_loss": -7.8913421630859375, "global_step": 44631, "epoch": 265} {"train_loss": -8.1487398147583, "global_step": 44632, "epoch": 265} {"train_loss": -8.127952575683594, "global_step": 44633, "epoch": 265} {"train_loss": -8.059000968933105, "global_step": 44634, "epoch": 265} {"train_loss": -8.119274139404297, "global_step": 44635, "epoch": 265} {"train_loss": -8.325987815856934, "global_step": 44636, "epoch": 265} {"train_loss": -8.062217712402344, "global_step": 44637, "epoch": 265} {"train_loss": -8.235101699829102, "global_step": 44638, "epoch": 265} {"train_loss": -8.342353820800781, "global_step": 44639, "epoch": 265} {"train_loss": -8.15518569946289, "global_step": 44640, "epoch": 265} {"train_loss": -8.121301651000977, "global_step": 44641, "epoch": 265} {"train_loss": -7.969170093536377, "global_step": 44642, "epoch": 265} {"train_loss": -8.09414005279541, "global_step": 44643, "epoch": 265} {"train_loss": -8.207841873168945, "global_step": 44644, "epoch": 265} {"train_loss": -8.238500595092773, "global_step": 44645, "epoch": 265} {"train_loss": -8.220565795898438, "global_step": 44646, "epoch": 265} {"train_loss": -8.068561553955078, "global_step": 44647, "epoch": 265} {"train_loss": -8.217951774597168, "global_step": 44648, "epoch": 265} {"train_loss": -8.263328552246094, "global_step": 44649, "epoch": 265} {"train_loss": -8.296401977539062, "global_step": 44650, "epoch": 265} {"train_loss": -8.373538970947266, "global_step": 44651, "epoch": 265} {"train_loss": -8.10700798034668, "global_step": 44652, "epoch": 265} {"train_loss": -7.929367542266846, "global_step": 44653, "epoch": 265} {"train_loss": -8.088281631469727, "global_step": 44654, "epoch": 265} {"train_loss": -8.224907875061035, "global_step": 44655, "epoch": 265} {"train_loss": -7.642429351806641, "global_step": 44656, "epoch": 265} {"train_loss": -7.807839393615723, "global_step": 44657, "epoch": 265} {"train_loss": -7.842878341674805, "global_step": 44658, "epoch": 265} {"train_loss": -8.029351234436035, "global_step": 44659, "epoch": 265} {"train_loss": -7.6869611740112305, "global_step": 44660, "epoch": 265} {"train_loss": -7.951534271240234, "global_step": 44661, "epoch": 265} {"train_loss": -8.005970001220703, "global_step": 44662, "epoch": 265} {"train_loss": -7.927759170532227, "global_step": 44663, "epoch": 265} {"train_loss": -7.836606979370117, "global_step": 44664, "epoch": 265} {"train_loss": -8.084014892578125, "global_step": 44665, "epoch": 265} {"train_loss": -7.776553630828857, "global_step": 44666, "epoch": 265} {"train_loss": -7.949520111083984, "global_step": 44667, "epoch": 265} {"train_loss": -8.062929153442383, "global_step": 44668, "epoch": 265} {"train_loss": -7.764982223510742, "global_step": 44669, "epoch": 265} {"train_loss": -7.706668853759766, "global_step": 44670, "epoch": 265} {"train_loss": -7.9287261962890625, "global_step": 44671, "epoch": 265} {"train_loss": -8.047314643859863, "global_step": 44672, "epoch": 265} {"train_loss": -7.610637664794922, "global_step": 44673, "epoch": 265} {"train_loss": -8.330551147460938, "global_step": 44674, "epoch": 265} {"train_loss": -7.660722255706787, "global_step": 44675, "epoch": 265} {"train_loss": -8.251514434814453, "global_step": 44676, "epoch": 265} {"train_loss": -8.037595748901367, "global_step": 44677, "epoch": 265} {"train_loss": -7.907228469848633, "global_step": 44678, "epoch": 265} {"train_loss": -8.058695793151855, "global_step": 44679, "epoch": 265} {"train_loss": -7.944468021392822, "global_step": 44680, "epoch": 265} {"train_loss": -8.272139549255371, "global_step": 44681, "epoch": 265} {"train_loss": -7.949413299560547, "global_step": 44682, "epoch": 265} {"train_loss": -8.19365119934082, "global_step": 44683, "epoch": 265} {"train_loss": -7.849898338317871, "global_step": 44684, "epoch": 265} {"train_loss": -8.148480415344238, "global_step": 44685, "epoch": 265} {"train_loss": -8.212264060974121, "global_step": 44686, "epoch": 265} {"train_loss": -8.044290934290204, "global_step": 44687, "epoch": 265, "val_loss": 186223.390625, "train_action_mse_error": 8.471281051635742} {"train_loss": -8.008010864257812, "global_step": 44688, "epoch": 266} {"train_loss": -8.110925674438477, "global_step": 44689, "epoch": 266} {"train_loss": -8.018270492553711, "global_step": 44690, "epoch": 266} {"train_loss": -8.054102897644043, "global_step": 44691, "epoch": 266} {"train_loss": -8.042810440063477, "global_step": 44692, "epoch": 266} {"train_loss": -7.8288421630859375, "global_step": 44693, "epoch": 266} {"train_loss": -8.175929069519043, "global_step": 44694, "epoch": 266} {"train_loss": -7.810431480407715, "global_step": 44695, "epoch": 266} {"train_loss": -8.151422500610352, "global_step": 44696, "epoch": 266} {"train_loss": -7.955313682556152, "global_step": 44697, "epoch": 266} {"train_loss": -7.940415382385254, "global_step": 44698, "epoch": 266} {"train_loss": -8.263267517089844, "global_step": 44699, "epoch": 266} {"train_loss": -8.145635604858398, "global_step": 44700, "epoch": 266} {"train_loss": -8.21227741241455, "global_step": 44701, "epoch": 266} {"train_loss": -8.156597137451172, "global_step": 44702, "epoch": 266} {"train_loss": -8.284381866455078, "global_step": 44703, "epoch": 266} {"train_loss": -8.058854103088379, "global_step": 44704, "epoch": 266} {"train_loss": -8.104475975036621, "global_step": 44705, "epoch": 266} {"train_loss": -8.0531005859375, "global_step": 44706, "epoch": 266} {"train_loss": -8.112791061401367, "global_step": 44707, "epoch": 266} {"train_loss": -8.109628677368164, "global_step": 44708, "epoch": 266} {"train_loss": -8.06741714477539, "global_step": 44709, "epoch": 266} {"train_loss": -8.047176361083984, "global_step": 44710, "epoch": 266} {"train_loss": -8.179740905761719, "global_step": 44711, "epoch": 266} {"train_loss": -8.1874418258667, "global_step": 44712, "epoch": 266} {"train_loss": -8.156310081481934, "global_step": 44713, "epoch": 266} {"train_loss": -8.26978874206543, "global_step": 44714, "epoch": 266} {"train_loss": -8.124073028564453, "global_step": 44715, "epoch": 266} {"train_loss": -7.987008094787598, "global_step": 44716, "epoch": 266} {"train_loss": -8.123270034790039, "global_step": 44717, "epoch": 266} {"train_loss": -7.897956848144531, "global_step": 44718, "epoch": 266} {"train_loss": -8.215051651000977, "global_step": 44719, "epoch": 266} {"train_loss": -7.645075798034668, "global_step": 44720, "epoch": 266} {"train_loss": -8.254742622375488, "global_step": 44721, "epoch": 266} {"train_loss": -7.761479377746582, "global_step": 44722, "epoch": 266} {"train_loss": -7.849703788757324, "global_step": 44723, "epoch": 266} {"train_loss": -8.009631156921387, "global_step": 44724, "epoch": 266} {"train_loss": -7.857187747955322, "global_step": 44725, "epoch": 266} {"train_loss": -8.164674758911133, "global_step": 44726, "epoch": 266} {"train_loss": -7.876111030578613, "global_step": 44727, "epoch": 266} {"train_loss": -7.87541389465332, "global_step": 44728, "epoch": 266} {"train_loss": -8.117761611938477, "global_step": 44729, "epoch": 266} {"train_loss": -7.79263973236084, "global_step": 44730, "epoch": 266} {"train_loss": -7.820730209350586, "global_step": 44731, "epoch": 266} {"train_loss": -8.004636764526367, "global_step": 44732, "epoch": 266} {"train_loss": -8.070169448852539, "global_step": 44733, "epoch": 266} {"train_loss": -7.820720672607422, "global_step": 44734, "epoch": 266} {"train_loss": -7.985945701599121, "global_step": 44735, "epoch": 266} {"train_loss": -8.126033782958984, "global_step": 44736, "epoch": 266} {"train_loss": -8.319635391235352, "global_step": 44737, "epoch": 266} {"train_loss": -7.89666223526001, "global_step": 44738, "epoch": 266} {"train_loss": -8.364398002624512, "global_step": 44739, "epoch": 266} {"train_loss": -8.139156341552734, "global_step": 44740, "epoch": 266} {"train_loss": -8.226217269897461, "global_step": 44741, "epoch": 266} {"train_loss": -7.951169013977051, "global_step": 44742, "epoch": 266} {"train_loss": -8.175809860229492, "global_step": 44743, "epoch": 266} {"train_loss": -7.990450382232666, "global_step": 44744, "epoch": 266} {"train_loss": -8.057332992553711, "global_step": 44745, "epoch": 266} {"train_loss": -8.141558647155762, "global_step": 44746, "epoch": 266} {"train_loss": -8.211616516113281, "global_step": 44747, "epoch": 266} {"train_loss": -8.175950050354004, "global_step": 44748, "epoch": 266} {"train_loss": -8.035398483276367, "global_step": 44749, "epoch": 266} {"train_loss": -8.138537406921387, "global_step": 44750, "epoch": 266} {"train_loss": -8.02859115600586, "global_step": 44751, "epoch": 266} {"train_loss": -8.214903831481934, "global_step": 44752, "epoch": 266} {"train_loss": -7.872343063354492, "global_step": 44753, "epoch": 266} {"train_loss": -8.329888343811035, "global_step": 44754, "epoch": 266} {"train_loss": -8.19740104675293, "global_step": 44755, "epoch": 266} {"train_loss": -8.121562957763672, "global_step": 44756, "epoch": 266} {"train_loss": -8.107732772827148, "global_step": 44757, "epoch": 266} {"train_loss": -8.343826293945312, "global_step": 44758, "epoch": 266} {"train_loss": -7.995913505554199, "global_step": 44759, "epoch": 266} {"train_loss": -8.381288528442383, "global_step": 44760, "epoch": 266} {"train_loss": -8.157463073730469, "global_step": 44761, "epoch": 266} {"train_loss": -8.207803726196289, "global_step": 44762, "epoch": 266} {"train_loss": -8.205472946166992, "global_step": 44763, "epoch": 266} {"train_loss": -7.936802864074707, "global_step": 44764, "epoch": 266} {"train_loss": -8.245158195495605, "global_step": 44765, "epoch": 266} {"train_loss": -8.117332458496094, "global_step": 44766, "epoch": 266} {"train_loss": -8.126483917236328, "global_step": 44767, "epoch": 266} {"train_loss": -8.08378791809082, "global_step": 44768, "epoch": 266} {"train_loss": -8.081663131713867, "global_step": 44769, "epoch": 266} {"train_loss": -8.168903350830078, "global_step": 44770, "epoch": 266} {"train_loss": -8.103646278381348, "global_step": 44771, "epoch": 266} {"train_loss": -8.093639373779297, "global_step": 44772, "epoch": 266} {"train_loss": -7.837045192718506, "global_step": 44773, "epoch": 266} {"train_loss": -7.985905170440674, "global_step": 44774, "epoch": 266} {"train_loss": -8.024260520935059, "global_step": 44775, "epoch": 266} {"train_loss": -7.87064266204834, "global_step": 44776, "epoch": 266} {"train_loss": -7.917386054992676, "global_step": 44777, "epoch": 266} {"train_loss": -8.040508270263672, "global_step": 44778, "epoch": 266} {"train_loss": -8.01396369934082, "global_step": 44779, "epoch": 266} {"train_loss": -8.104572296142578, "global_step": 44780, "epoch": 266} {"train_loss": -7.678962707519531, "global_step": 44781, "epoch": 266} {"train_loss": -8.081727027893066, "global_step": 44782, "epoch": 266} {"train_loss": -7.711960792541504, "global_step": 44783, "epoch": 266} {"train_loss": -7.959372520446777, "global_step": 44784, "epoch": 266} {"train_loss": -7.728571891784668, "global_step": 44785, "epoch": 266} {"train_loss": -8.131805419921875, "global_step": 44786, "epoch": 266} {"train_loss": -7.855562686920166, "global_step": 44787, "epoch": 266} {"train_loss": -8.043764114379883, "global_step": 44788, "epoch": 266} {"train_loss": -8.028804779052734, "global_step": 44789, "epoch": 266} {"train_loss": -8.161299705505371, "global_step": 44790, "epoch": 266} {"train_loss": -8.018074035644531, "global_step": 44791, "epoch": 266} {"train_loss": -8.041043281555176, "global_step": 44792, "epoch": 266} {"train_loss": -8.042656898498535, "global_step": 44793, "epoch": 266} {"train_loss": -8.131253242492676, "global_step": 44794, "epoch": 266} {"train_loss": -8.261688232421875, "global_step": 44795, "epoch": 266} {"train_loss": -8.34056568145752, "global_step": 44796, "epoch": 266} {"train_loss": -8.118059158325195, "global_step": 44797, "epoch": 266} {"train_loss": -8.221745491027832, "global_step": 44798, "epoch": 266} {"train_loss": -8.0435152053833, "global_step": 44799, "epoch": 266} {"train_loss": -8.235872268676758, "global_step": 44800, "epoch": 266} {"train_loss": -8.306190490722656, "global_step": 44801, "epoch": 266} {"train_loss": -8.132997512817383, "global_step": 44802, "epoch": 266} {"train_loss": -8.236475944519043, "global_step": 44803, "epoch": 266} {"train_loss": -8.19157600402832, "global_step": 44804, "epoch": 266} {"train_loss": -8.388591766357422, "global_step": 44805, "epoch": 266} {"train_loss": -8.3442964553833, "global_step": 44806, "epoch": 266} {"train_loss": -8.227712631225586, "global_step": 44807, "epoch": 266} {"train_loss": -8.062137603759766, "global_step": 44808, "epoch": 266} {"train_loss": -8.400224685668945, "global_step": 44809, "epoch": 266} {"train_loss": -7.850554466247559, "global_step": 44810, "epoch": 266} {"train_loss": -7.986294746398926, "global_step": 44811, "epoch": 266} {"train_loss": -8.020355224609375, "global_step": 44812, "epoch": 266} {"train_loss": -8.161266326904297, "global_step": 44813, "epoch": 266} {"train_loss": -8.005542755126953, "global_step": 44814, "epoch": 266} {"train_loss": -7.773930549621582, "global_step": 44815, "epoch": 266} {"train_loss": -7.852982044219971, "global_step": 44816, "epoch": 266} {"train_loss": -7.9728684425354, "global_step": 44817, "epoch": 266} {"train_loss": -8.123764991760254, "global_step": 44818, "epoch": 266} {"train_loss": -7.902976036071777, "global_step": 44819, "epoch": 266} {"train_loss": -7.720066070556641, "global_step": 44820, "epoch": 266} {"train_loss": -7.9650750160217285, "global_step": 44821, "epoch": 266} {"train_loss": -8.216897964477539, "global_step": 44822, "epoch": 266} {"train_loss": -7.999759674072266, "global_step": 44823, "epoch": 266} {"train_loss": -7.926117897033691, "global_step": 44824, "epoch": 266} {"train_loss": -8.037019729614258, "global_step": 44825, "epoch": 266} {"train_loss": -7.8481011390686035, "global_step": 44826, "epoch": 266} {"train_loss": -8.016814231872559, "global_step": 44827, "epoch": 266} {"train_loss": -7.9393310546875, "global_step": 44828, "epoch": 266} {"train_loss": -7.947893142700195, "global_step": 44829, "epoch": 266} {"train_loss": -8.031309127807617, "global_step": 44830, "epoch": 266} {"train_loss": -8.025697708129883, "global_step": 44831, "epoch": 266} {"train_loss": -8.227415084838867, "global_step": 44832, "epoch": 266} {"train_loss": -8.062726974487305, "global_step": 44833, "epoch": 266} {"train_loss": -8.197492599487305, "global_step": 44834, "epoch": 266} {"train_loss": -8.024866104125977, "global_step": 44835, "epoch": 266} {"train_loss": -8.03233528137207, "global_step": 44836, "epoch": 266} {"train_loss": -7.954068660736084, "global_step": 44837, "epoch": 266} {"train_loss": -8.02841854095459, "global_step": 44838, "epoch": 266} {"train_loss": -8.03082275390625, "global_step": 44839, "epoch": 266} {"train_loss": -8.12777042388916, "global_step": 44840, "epoch": 266} {"train_loss": -8.349149703979492, "global_step": 44841, "epoch": 266} {"train_loss": -8.027196884155273, "global_step": 44842, "epoch": 266} {"train_loss": -8.253942489624023, "global_step": 44843, "epoch": 266} {"train_loss": -8.237662315368652, "global_step": 44844, "epoch": 266} {"train_loss": -7.915778160095215, "global_step": 44845, "epoch": 266} {"train_loss": -8.198683738708496, "global_step": 44846, "epoch": 266} {"train_loss": -8.050246238708496, "global_step": 44847, "epoch": 266} {"train_loss": -8.227924346923828, "global_step": 44848, "epoch": 266} {"train_loss": -8.062501907348633, "global_step": 44849, "epoch": 266} {"train_loss": -8.113700866699219, "global_step": 44850, "epoch": 266} {"train_loss": -7.938824653625488, "global_step": 44851, "epoch": 266} {"train_loss": -8.283611297607422, "global_step": 44852, "epoch": 266} {"train_loss": -8.143476486206055, "global_step": 44853, "epoch": 266} {"train_loss": -8.170852661132812, "global_step": 44854, "epoch": 266} {"train_loss": -8.071599577154432, "global_step": 44855, "epoch": 266, "val_loss": 184740.703125} {"train_loss": -8.167703628540039, "global_step": 44856, "epoch": 267} {"train_loss": -8.184889793395996, "global_step": 44857, "epoch": 267} {"train_loss": -8.204883575439453, "global_step": 44858, "epoch": 267} {"train_loss": -8.205448150634766, "global_step": 44859, "epoch": 267} {"train_loss": -8.241036415100098, "global_step": 44860, "epoch": 267} {"train_loss": -8.311994552612305, "global_step": 44861, "epoch": 267} {"train_loss": -7.975918769836426, "global_step": 44862, "epoch": 267} {"train_loss": -8.18923568725586, "global_step": 44863, "epoch": 267} {"train_loss": -8.161291122436523, "global_step": 44864, "epoch": 267} {"train_loss": -8.383750915527344, "global_step": 44865, "epoch": 267} {"train_loss": -8.235407829284668, "global_step": 44866, "epoch": 267} {"train_loss": -8.225041389465332, "global_step": 44867, "epoch": 267} {"train_loss": -8.154829025268555, "global_step": 44868, "epoch": 267} {"train_loss": -8.421892166137695, "global_step": 44869, "epoch": 267} {"train_loss": -8.304634094238281, "global_step": 44870, "epoch": 267} {"train_loss": -8.368191719055176, "global_step": 44871, "epoch": 267} {"train_loss": -8.248248100280762, "global_step": 44872, "epoch": 267} {"train_loss": -8.449705123901367, "global_step": 44873, "epoch": 267} {"train_loss": -8.268420219421387, "global_step": 44874, "epoch": 267} {"train_loss": -8.122831344604492, "global_step": 44875, "epoch": 267} {"train_loss": -8.252693176269531, "global_step": 44876, "epoch": 267} {"train_loss": -8.140640258789062, "global_step": 44877, "epoch": 267} {"train_loss": -8.158931732177734, "global_step": 44878, "epoch": 267} {"train_loss": -8.20689582824707, "global_step": 44879, "epoch": 267} {"train_loss": -7.934819221496582, "global_step": 44880, "epoch": 267} {"train_loss": -7.872590065002441, "global_step": 44881, "epoch": 267} {"train_loss": -8.074531555175781, "global_step": 44882, "epoch": 267} {"train_loss": -8.18073844909668, "global_step": 44883, "epoch": 267} {"train_loss": -8.092571258544922, "global_step": 44884, "epoch": 267} {"train_loss": -8.07380485534668, "global_step": 44885, "epoch": 267} {"train_loss": -8.307806968688965, "global_step": 44886, "epoch": 267} {"train_loss": -7.9624924659729, "global_step": 44887, "epoch": 267} {"train_loss": -8.243387222290039, "global_step": 44888, "epoch": 267} {"train_loss": -7.980188846588135, "global_step": 44889, "epoch": 267} {"train_loss": -7.932797908782959, "global_step": 44890, "epoch": 267} {"train_loss": -8.177652359008789, "global_step": 44891, "epoch": 267} {"train_loss": -7.999544620513916, "global_step": 44892, "epoch": 267} {"train_loss": -8.14245319366455, "global_step": 44893, "epoch": 267} {"train_loss": -7.940789222717285, "global_step": 44894, "epoch": 267} {"train_loss": -7.892231464385986, "global_step": 44895, "epoch": 267} {"train_loss": -8.111153602600098, "global_step": 44896, "epoch": 267} {"train_loss": -8.000654220581055, "global_step": 44897, "epoch": 267} {"train_loss": -7.926494598388672, "global_step": 44898, "epoch": 267} {"train_loss": -8.087495803833008, "global_step": 44899, "epoch": 267} {"train_loss": -8.266769409179688, "global_step": 44900, "epoch": 267} {"train_loss": -8.173343658447266, "global_step": 44901, "epoch": 267} {"train_loss": -7.971722602844238, "global_step": 44902, "epoch": 267} {"train_loss": -8.159668922424316, "global_step": 44903, "epoch": 267} {"train_loss": -8.072025299072266, "global_step": 44904, "epoch": 267} {"train_loss": -8.139141082763672, "global_step": 44905, "epoch": 267} {"train_loss": -8.353863716125488, "global_step": 44906, "epoch": 267} {"train_loss": -8.024148941040039, "global_step": 44907, "epoch": 267} {"train_loss": -8.231689453125, "global_step": 44908, "epoch": 267} {"train_loss": -8.180131912231445, "global_step": 44909, "epoch": 267} {"train_loss": -8.33561897277832, "global_step": 44910, "epoch": 267} {"train_loss": -8.26186752319336, "global_step": 44911, "epoch": 267} {"train_loss": -8.44437313079834, "global_step": 44912, "epoch": 267} {"train_loss": -8.309503555297852, "global_step": 44913, "epoch": 267} {"train_loss": -8.351764678955078, "global_step": 44914, "epoch": 267} {"train_loss": -8.054808616638184, "global_step": 44915, "epoch": 267} {"train_loss": -8.375753402709961, "global_step": 44916, "epoch": 267} {"train_loss": -8.110513687133789, "global_step": 44917, "epoch": 267} {"train_loss": -8.177679061889648, "global_step": 44918, "epoch": 267} {"train_loss": -8.029059410095215, "global_step": 44919, "epoch": 267} {"train_loss": -8.198068618774414, "global_step": 44920, "epoch": 267} {"train_loss": -7.838964939117432, "global_step": 44921, "epoch": 267} {"train_loss": -8.220056533813477, "global_step": 44922, "epoch": 267} {"train_loss": -8.06679630279541, "global_step": 44923, "epoch": 267} {"train_loss": -7.810230731964111, "global_step": 44924, "epoch": 267} {"train_loss": -8.24679946899414, "global_step": 44925, "epoch": 267} {"train_loss": -7.7807769775390625, "global_step": 44926, "epoch": 267} {"train_loss": -7.740030288696289, "global_step": 44927, "epoch": 267} {"train_loss": -8.016653060913086, "global_step": 44928, "epoch": 267} {"train_loss": -7.884622573852539, "global_step": 44929, "epoch": 267} {"train_loss": -8.144431114196777, "global_step": 44930, "epoch": 267} {"train_loss": -7.919614315032959, "global_step": 44931, "epoch": 267} {"train_loss": -7.978451251983643, "global_step": 44932, "epoch": 267} {"train_loss": -8.019013404846191, "global_step": 44933, "epoch": 267} {"train_loss": -7.997886657714844, "global_step": 44934, "epoch": 267} {"train_loss": -8.190409660339355, "global_step": 44935, "epoch": 267} {"train_loss": -8.001335144042969, "global_step": 44936, "epoch": 267} {"train_loss": -7.938291072845459, "global_step": 44937, "epoch": 267} {"train_loss": -7.966230392456055, "global_step": 44938, "epoch": 267} {"train_loss": -8.091716766357422, "global_step": 44939, "epoch": 267} {"train_loss": -7.8223652839660645, "global_step": 44940, "epoch": 267} {"train_loss": -8.135099411010742, "global_step": 44941, "epoch": 267} {"train_loss": -7.958682060241699, "global_step": 44942, "epoch": 267} {"train_loss": -8.136188507080078, "global_step": 44943, "epoch": 267} {"train_loss": -8.143503189086914, "global_step": 44944, "epoch": 267} {"train_loss": -7.970371246337891, "global_step": 44945, "epoch": 267} {"train_loss": -8.086992263793945, "global_step": 44946, "epoch": 267} {"train_loss": -7.816066741943359, "global_step": 44947, "epoch": 267} {"train_loss": -8.050981521606445, "global_step": 44948, "epoch": 267} {"train_loss": -7.915238857269287, "global_step": 44949, "epoch": 267} {"train_loss": -8.309765815734863, "global_step": 44950, "epoch": 267} {"train_loss": -7.9390177726745605, "global_step": 44951, "epoch": 267} {"train_loss": -8.182815551757812, "global_step": 44952, "epoch": 267} {"train_loss": -8.167619705200195, "global_step": 44953, "epoch": 267} {"train_loss": -7.928255081176758, "global_step": 44954, "epoch": 267} {"train_loss": -8.082500457763672, "global_step": 44955, "epoch": 267} {"train_loss": -8.08199691772461, "global_step": 44956, "epoch": 267} {"train_loss": -8.185327529907227, "global_step": 44957, "epoch": 267} {"train_loss": -8.056114196777344, "global_step": 44958, "epoch": 267} {"train_loss": -8.365730285644531, "global_step": 44959, "epoch": 267} {"train_loss": -8.106424331665039, "global_step": 44960, "epoch": 267} {"train_loss": -8.195245742797852, "global_step": 44961, "epoch": 267} {"train_loss": -8.060043334960938, "global_step": 44962, "epoch": 267} {"train_loss": -8.090726852416992, "global_step": 44963, "epoch": 267} {"train_loss": -8.169286727905273, "global_step": 44964, "epoch": 267} {"train_loss": -8.163129806518555, "global_step": 44965, "epoch": 267} {"train_loss": -7.887116432189941, "global_step": 44966, "epoch": 267} {"train_loss": -8.084171295166016, "global_step": 44967, "epoch": 267} {"train_loss": -8.30532169342041, "global_step": 44968, "epoch": 267} {"train_loss": -8.277880668640137, "global_step": 44969, "epoch": 267} {"train_loss": -7.994741439819336, "global_step": 44970, "epoch": 267} {"train_loss": -8.015619277954102, "global_step": 44971, "epoch": 267} {"train_loss": -7.964755535125732, "global_step": 44972, "epoch": 267} {"train_loss": -7.794803619384766, "global_step": 44973, "epoch": 267} {"train_loss": -7.9866943359375, "global_step": 44974, "epoch": 267} {"train_loss": -8.12812328338623, "global_step": 44975, "epoch": 267} {"train_loss": -8.198287963867188, "global_step": 44976, "epoch": 267} {"train_loss": -8.17037582397461, "global_step": 44977, "epoch": 267} {"train_loss": -8.068718910217285, "global_step": 44978, "epoch": 267} {"train_loss": -7.894375801086426, "global_step": 44979, "epoch": 267} {"train_loss": -7.8637824058532715, "global_step": 44980, "epoch": 267} {"train_loss": -8.065865516662598, "global_step": 44981, "epoch": 267} {"train_loss": -7.971545219421387, "global_step": 44982, "epoch": 267} {"train_loss": -8.202871322631836, "global_step": 44983, "epoch": 267} {"train_loss": -8.21125602722168, "global_step": 44984, "epoch": 267} {"train_loss": -8.25709342956543, "global_step": 44985, "epoch": 267} {"train_loss": -8.029731750488281, "global_step": 44986, "epoch": 267} {"train_loss": -8.032282829284668, "global_step": 44987, "epoch": 267} {"train_loss": -8.168931007385254, "global_step": 44988, "epoch": 267} {"train_loss": -8.212644577026367, "global_step": 44989, "epoch": 267} {"train_loss": -7.942342281341553, "global_step": 44990, "epoch": 267} {"train_loss": -8.080202102661133, "global_step": 44991, "epoch": 267} {"train_loss": -8.373998641967773, "global_step": 44992, "epoch": 267} {"train_loss": -8.08393669128418, "global_step": 44993, "epoch": 267} {"train_loss": -8.2479248046875, "global_step": 44994, "epoch": 267} {"train_loss": -7.958986282348633, "global_step": 44995, "epoch": 267} {"train_loss": -8.179037094116211, "global_step": 44996, "epoch": 267} {"train_loss": -8.14869499206543, "global_step": 44997, "epoch": 267} {"train_loss": -8.521520614624023, "global_step": 44998, "epoch": 267} {"train_loss": -8.09036636352539, "global_step": 44999, "epoch": 267} {"train_loss": -8.09581470489502, "global_step": 45000, "epoch": 267} {"train_loss": -8.217500686645508, "global_step": 45001, "epoch": 267} {"train_loss": -7.998327255249023, "global_step": 45002, "epoch": 267} {"train_loss": -8.058206558227539, "global_step": 45003, "epoch": 267} {"train_loss": -7.868980407714844, "global_step": 45004, "epoch": 267} {"train_loss": -8.214010238647461, "global_step": 45005, "epoch": 267} {"train_loss": -8.105512619018555, "global_step": 45006, "epoch": 267} {"train_loss": -8.236345291137695, "global_step": 45007, "epoch": 267} {"train_loss": -8.082416534423828, "global_step": 45008, "epoch": 267} {"train_loss": -8.235641479492188, "global_step": 45009, "epoch": 267} {"train_loss": -8.268049240112305, "global_step": 45010, "epoch": 267} {"train_loss": -8.236242294311523, "global_step": 45011, "epoch": 267} {"train_loss": -8.24970817565918, "global_step": 45012, "epoch": 267} {"train_loss": -7.973559379577637, "global_step": 45013, "epoch": 267} {"train_loss": -8.26656723022461, "global_step": 45014, "epoch": 267} {"train_loss": -8.056184768676758, "global_step": 45015, "epoch": 267} {"train_loss": -8.024470329284668, "global_step": 45016, "epoch": 267} {"train_loss": -8.207479476928711, "global_step": 45017, "epoch": 267} {"train_loss": -8.375555038452148, "global_step": 45018, "epoch": 267} {"train_loss": -8.132369995117188, "global_step": 45019, "epoch": 267} {"train_loss": -8.191217422485352, "global_step": 45020, "epoch": 267} {"train_loss": -8.122400283813477, "global_step": 45021, "epoch": 267} {"train_loss": -7.9368977546691895, "global_step": 45022, "epoch": 267} {"train_loss": -8.113610903422037, "global_step": 45023, "epoch": 267, "val_loss": 187224.03125} {"train_loss": -8.169732093811035, "global_step": 45024, "epoch": 268} {"train_loss": -8.105031967163086, "global_step": 45025, "epoch": 268} {"train_loss": -8.01961898803711, "global_step": 45026, "epoch": 268} {"train_loss": -7.641574859619141, "global_step": 45027, "epoch": 268} {"train_loss": -7.690134048461914, "global_step": 45028, "epoch": 268} {"train_loss": -8.068439483642578, "global_step": 45029, "epoch": 268} {"train_loss": -7.8360185623168945, "global_step": 45030, "epoch": 268} {"train_loss": -8.158438682556152, "global_step": 45031, "epoch": 268} {"train_loss": -8.065713882446289, "global_step": 45032, "epoch": 268} {"train_loss": -8.114243507385254, "global_step": 45033, "epoch": 268} {"train_loss": -8.023445129394531, "global_step": 45034, "epoch": 268} {"train_loss": -8.046382904052734, "global_step": 45035, "epoch": 268} {"train_loss": -7.835158824920654, "global_step": 45036, "epoch": 268} {"train_loss": -8.156111717224121, "global_step": 45037, "epoch": 268} {"train_loss": -7.883023262023926, "global_step": 45038, "epoch": 268} {"train_loss": -8.072877883911133, "global_step": 45039, "epoch": 268} {"train_loss": -7.873468399047852, "global_step": 45040, "epoch": 268} {"train_loss": -8.073532104492188, "global_step": 45041, "epoch": 268} {"train_loss": -7.952813625335693, "global_step": 45042, "epoch": 268} {"train_loss": -7.886725425720215, "global_step": 45043, "epoch": 268} {"train_loss": -8.224710464477539, "global_step": 45044, "epoch": 268} {"train_loss": -7.849868297576904, "global_step": 45045, "epoch": 268} {"train_loss": -8.157432556152344, "global_step": 45046, "epoch": 268} {"train_loss": -8.007369041442871, "global_step": 45047, "epoch": 268} {"train_loss": -7.959988117218018, "global_step": 45048, "epoch": 268} {"train_loss": -8.126449584960938, "global_step": 45049, "epoch": 268} {"train_loss": -7.815947532653809, "global_step": 45050, "epoch": 268} {"train_loss": -7.8625383377075195, "global_step": 45051, "epoch": 268} {"train_loss": -8.070043563842773, "global_step": 45052, "epoch": 268} {"train_loss": -7.9978790283203125, "global_step": 45053, "epoch": 268} {"train_loss": -8.026851654052734, "global_step": 45054, "epoch": 268} {"train_loss": -8.163799285888672, "global_step": 45055, "epoch": 268} {"train_loss": -7.880246162414551, "global_step": 45056, "epoch": 268} {"train_loss": -8.071464538574219, "global_step": 45057, "epoch": 268} {"train_loss": -8.031808853149414, "global_step": 45058, "epoch": 268} {"train_loss": -7.783977508544922, "global_step": 45059, "epoch": 268} {"train_loss": -7.779759407043457, "global_step": 45060, "epoch": 268} {"train_loss": -8.028160095214844, "global_step": 45061, "epoch": 268} {"train_loss": -7.748835563659668, "global_step": 45062, "epoch": 268} {"train_loss": -7.993326187133789, "global_step": 45063, "epoch": 268} {"train_loss": -7.909733772277832, "global_step": 45064, "epoch": 268} {"train_loss": -7.836021900177002, "global_step": 45065, "epoch": 268} {"train_loss": -7.86962366104126, "global_step": 45066, "epoch": 268} {"train_loss": -7.808238506317139, "global_step": 45067, "epoch": 268} {"train_loss": -7.808654308319092, "global_step": 45068, "epoch": 268} {"train_loss": -8.065253257751465, "global_step": 45069, "epoch": 268} {"train_loss": -7.9264116287231445, "global_step": 45070, "epoch": 268} {"train_loss": -7.93016242980957, "global_step": 45071, "epoch": 268} {"train_loss": -7.95368766784668, "global_step": 45072, "epoch": 268} {"train_loss": -7.9578046798706055, "global_step": 45073, "epoch": 268} {"train_loss": -7.944370269775391, "global_step": 45074, "epoch": 268} {"train_loss": -8.008605003356934, "global_step": 45075, "epoch": 268} {"train_loss": -7.9915361404418945, "global_step": 45076, "epoch": 268} {"train_loss": -7.980783462524414, "global_step": 45077, "epoch": 268} {"train_loss": -8.124691009521484, "global_step": 45078, "epoch": 268} {"train_loss": -7.904210567474365, "global_step": 45079, "epoch": 268} {"train_loss": -8.24148178100586, "global_step": 45080, "epoch": 268} {"train_loss": -8.096702575683594, "global_step": 45081, "epoch": 268} {"train_loss": -8.117264747619629, "global_step": 45082, "epoch": 268} {"train_loss": -8.174327850341797, "global_step": 45083, "epoch": 268} {"train_loss": -7.826354503631592, "global_step": 45084, "epoch": 268} {"train_loss": -8.062559127807617, "global_step": 45085, "epoch": 268} {"train_loss": -8.10814094543457, "global_step": 45086, "epoch": 268} {"train_loss": -8.04847526550293, "global_step": 45087, "epoch": 268} {"train_loss": -8.158257484436035, "global_step": 45088, "epoch": 268} {"train_loss": -8.057804107666016, "global_step": 45089, "epoch": 268} {"train_loss": -7.715313911437988, "global_step": 45090, "epoch": 268} {"train_loss": -8.31666088104248, "global_step": 45091, "epoch": 268} {"train_loss": -7.714584827423096, "global_step": 45092, "epoch": 268} {"train_loss": -8.088706970214844, "global_step": 45093, "epoch": 268} {"train_loss": -8.002077102661133, "global_step": 45094, "epoch": 268} {"train_loss": -8.132068634033203, "global_step": 45095, "epoch": 268} {"train_loss": -7.918122291564941, "global_step": 45096, "epoch": 268} {"train_loss": -8.221719741821289, "global_step": 45097, "epoch": 268} {"train_loss": -8.068755149841309, "global_step": 45098, "epoch": 268} {"train_loss": -8.097651481628418, "global_step": 45099, "epoch": 268} {"train_loss": -8.007802963256836, "global_step": 45100, "epoch": 268} {"train_loss": -8.059381484985352, "global_step": 45101, "epoch": 268} {"train_loss": -8.116445541381836, "global_step": 45102, "epoch": 268} {"train_loss": -8.213117599487305, "global_step": 45103, "epoch": 268} {"train_loss": -7.76469087600708, "global_step": 45104, "epoch": 268} {"train_loss": -8.25769329071045, "global_step": 45105, "epoch": 268} {"train_loss": -7.93381404876709, "global_step": 45106, "epoch": 268} {"train_loss": -7.959043979644775, "global_step": 45107, "epoch": 268} {"train_loss": -8.170075416564941, "global_step": 45108, "epoch": 268} {"train_loss": -8.146936416625977, "global_step": 45109, "epoch": 268} {"train_loss": -8.103233337402344, "global_step": 45110, "epoch": 268} {"train_loss": -8.043670654296875, "global_step": 45111, "epoch": 268} {"train_loss": -8.022733688354492, "global_step": 45112, "epoch": 268} {"train_loss": -8.271159172058105, "global_step": 45113, "epoch": 268} {"train_loss": -7.926294326782227, "global_step": 45114, "epoch": 268} {"train_loss": -8.218826293945312, "global_step": 45115, "epoch": 268} {"train_loss": -8.135358810424805, "global_step": 45116, "epoch": 268} {"train_loss": -8.075691223144531, "global_step": 45117, "epoch": 268} {"train_loss": -8.034032821655273, "global_step": 45118, "epoch": 268} {"train_loss": -8.059249877929688, "global_step": 45119, "epoch": 268} {"train_loss": -8.066125869750977, "global_step": 45120, "epoch": 268} {"train_loss": -8.083569526672363, "global_step": 45121, "epoch": 268} {"train_loss": -7.974042892456055, "global_step": 45122, "epoch": 268} {"train_loss": -8.185340881347656, "global_step": 45123, "epoch": 268} {"train_loss": -8.239917755126953, "global_step": 45124, "epoch": 268} {"train_loss": -8.046961784362793, "global_step": 45125, "epoch": 268} {"train_loss": -7.913775444030762, "global_step": 45126, "epoch": 268} {"train_loss": -8.282721519470215, "global_step": 45127, "epoch": 268} {"train_loss": -8.064346313476562, "global_step": 45128, "epoch": 268} {"train_loss": -8.147706985473633, "global_step": 45129, "epoch": 268} {"train_loss": -8.320449829101562, "global_step": 45130, "epoch": 268} {"train_loss": -8.121158599853516, "global_step": 45131, "epoch": 268} {"train_loss": -8.133655548095703, "global_step": 45132, "epoch": 268} {"train_loss": -8.199806213378906, "global_step": 45133, "epoch": 268} {"train_loss": -8.126585960388184, "global_step": 45134, "epoch": 268} {"train_loss": -8.52049732208252, "global_step": 45135, "epoch": 268} {"train_loss": -8.237527847290039, "global_step": 45136, "epoch": 268} {"train_loss": -8.156272888183594, "global_step": 45137, "epoch": 268} {"train_loss": -7.926982879638672, "global_step": 45138, "epoch": 268} {"train_loss": -8.128803253173828, "global_step": 45139, "epoch": 268} {"train_loss": -8.121212005615234, "global_step": 45140, "epoch": 268} {"train_loss": -7.836948394775391, "global_step": 45141, "epoch": 268} {"train_loss": -8.169193267822266, "global_step": 45142, "epoch": 268} {"train_loss": -8.038488388061523, "global_step": 45143, "epoch": 268} {"train_loss": -7.991790771484375, "global_step": 45144, "epoch": 268} {"train_loss": -8.158337593078613, "global_step": 45145, "epoch": 268} {"train_loss": -8.307876586914062, "global_step": 45146, "epoch": 268} {"train_loss": -7.959897518157959, "global_step": 45147, "epoch": 268} {"train_loss": -8.21047592163086, "global_step": 45148, "epoch": 268} {"train_loss": -7.8587751388549805, "global_step": 45149, "epoch": 268} {"train_loss": -8.142709732055664, "global_step": 45150, "epoch": 268} {"train_loss": -8.167024612426758, "global_step": 45151, "epoch": 268} {"train_loss": -8.237595558166504, "global_step": 45152, "epoch": 268} {"train_loss": -8.253225326538086, "global_step": 45153, "epoch": 268} {"train_loss": -8.155550003051758, "global_step": 45154, "epoch": 268} {"train_loss": -8.073317527770996, "global_step": 45155, "epoch": 268} {"train_loss": -8.125741958618164, "global_step": 45156, "epoch": 268} {"train_loss": -7.930803298950195, "global_step": 45157, "epoch": 268} {"train_loss": -8.001782417297363, "global_step": 45158, "epoch": 268} {"train_loss": -8.341191291809082, "global_step": 45159, "epoch": 268} {"train_loss": -7.9809417724609375, "global_step": 45160, "epoch": 268} {"train_loss": -8.39511489868164, "global_step": 45161, "epoch": 268} {"train_loss": -8.064629554748535, "global_step": 45162, "epoch": 268} {"train_loss": -8.115137100219727, "global_step": 45163, "epoch": 268} {"train_loss": -8.186829566955566, "global_step": 45164, "epoch": 268} {"train_loss": -8.186887741088867, "global_step": 45165, "epoch": 268} {"train_loss": -8.035511016845703, "global_step": 45166, "epoch": 268} {"train_loss": -7.884322643280029, "global_step": 45167, "epoch": 268} {"train_loss": -8.063104629516602, "global_step": 45168, "epoch": 268} {"train_loss": -7.848763942718506, "global_step": 45169, "epoch": 268} {"train_loss": -7.957150459289551, "global_step": 45170, "epoch": 268} {"train_loss": -8.310088157653809, "global_step": 45171, "epoch": 268} {"train_loss": -8.121212005615234, "global_step": 45172, "epoch": 268} {"train_loss": -8.012106895446777, "global_step": 45173, "epoch": 268} {"train_loss": -8.073960304260254, "global_step": 45174, "epoch": 268} {"train_loss": -8.184524536132812, "global_step": 45175, "epoch": 268} {"train_loss": -8.220783233642578, "global_step": 45176, "epoch": 268} {"train_loss": -8.292136192321777, "global_step": 45177, "epoch": 268} {"train_loss": -8.209680557250977, "global_step": 45178, "epoch": 268} {"train_loss": -8.190482139587402, "global_step": 45179, "epoch": 268} {"train_loss": -8.234949111938477, "global_step": 45180, "epoch": 268} {"train_loss": -8.147481918334961, "global_step": 45181, "epoch": 268} {"train_loss": -7.887112617492676, "global_step": 45182, "epoch": 268} {"train_loss": -8.192548751831055, "global_step": 45183, "epoch": 268} {"train_loss": -7.915173530578613, "global_step": 45184, "epoch": 268} {"train_loss": -8.347211837768555, "global_step": 45185, "epoch": 268} {"train_loss": -7.953073024749756, "global_step": 45186, "epoch": 268} {"train_loss": -8.232497215270996, "global_step": 45187, "epoch": 268} {"train_loss": -8.155228614807129, "global_step": 45188, "epoch": 268} {"train_loss": -8.245797157287598, "global_step": 45189, "epoch": 268} {"train_loss": -8.228338241577148, "global_step": 45190, "epoch": 268} {"train_loss": -8.058994551499685, "global_step": 45191, "epoch": 268, "val_loss": 185949.125} {"train_loss": -7.96529483795166, "global_step": 45192, "epoch": 269} {"train_loss": -8.108524322509766, "global_step": 45193, "epoch": 269} {"train_loss": -8.202947616577148, "global_step": 45194, "epoch": 269} {"train_loss": -7.972568511962891, "global_step": 45195, "epoch": 269} {"train_loss": -8.248041152954102, "global_step": 45196, "epoch": 269} {"train_loss": -7.961098670959473, "global_step": 45197, "epoch": 269} {"train_loss": -7.959595203399658, "global_step": 45198, "epoch": 269} {"train_loss": -7.960544586181641, "global_step": 45199, "epoch": 269} {"train_loss": -7.935517311096191, "global_step": 45200, "epoch": 269} {"train_loss": -8.051673889160156, "global_step": 45201, "epoch": 269} {"train_loss": -7.865890026092529, "global_step": 45202, "epoch": 269} {"train_loss": -8.143604278564453, "global_step": 45203, "epoch": 269} {"train_loss": -8.158405303955078, "global_step": 45204, "epoch": 269} {"train_loss": -8.056818008422852, "global_step": 45205, "epoch": 269} {"train_loss": -8.315604209899902, "global_step": 45206, "epoch": 269} {"train_loss": -8.190396308898926, "global_step": 45207, "epoch": 269} {"train_loss": -8.205574035644531, "global_step": 45208, "epoch": 269} {"train_loss": -8.284461975097656, "global_step": 45209, "epoch": 269} {"train_loss": -8.17243766784668, "global_step": 45210, "epoch": 269} {"train_loss": -8.483824729919434, "global_step": 45211, "epoch": 269} {"train_loss": -8.246244430541992, "global_step": 45212, "epoch": 269} {"train_loss": -8.438846588134766, "global_step": 45213, "epoch": 269} {"train_loss": -8.130111694335938, "global_step": 45214, "epoch": 269} {"train_loss": -8.005240440368652, "global_step": 45215, "epoch": 269} {"train_loss": -8.140716552734375, "global_step": 45216, "epoch": 269} {"train_loss": -8.22251033782959, "global_step": 45217, "epoch": 269} {"train_loss": -8.091075897216797, "global_step": 45218, "epoch": 269} {"train_loss": -7.994448661804199, "global_step": 45219, "epoch": 269} {"train_loss": -7.9244585037231445, "global_step": 45220, "epoch": 269} {"train_loss": -7.984188556671143, "global_step": 45221, "epoch": 269} {"train_loss": -8.212202072143555, "global_step": 45222, "epoch": 269} {"train_loss": -7.902754783630371, "global_step": 45223, "epoch": 269} {"train_loss": -7.9290971755981445, "global_step": 45224, "epoch": 269} {"train_loss": -8.000292778015137, "global_step": 45225, "epoch": 269} {"train_loss": -7.890312194824219, "global_step": 45226, "epoch": 269} {"train_loss": -7.961174011230469, "global_step": 45227, "epoch": 269} {"train_loss": -7.791838645935059, "global_step": 45228, "epoch": 269} {"train_loss": -7.733603000640869, "global_step": 45229, "epoch": 269} {"train_loss": -8.181661605834961, "global_step": 45230, "epoch": 269} {"train_loss": -8.158384323120117, "global_step": 45231, "epoch": 269} {"train_loss": -8.032358169555664, "global_step": 45232, "epoch": 269} {"train_loss": -8.104557991027832, "global_step": 45233, "epoch": 269} {"train_loss": -8.239434242248535, "global_step": 45234, "epoch": 269} {"train_loss": -8.042215347290039, "global_step": 45235, "epoch": 269} {"train_loss": -8.119483947753906, "global_step": 45236, "epoch": 269} {"train_loss": -8.274126052856445, "global_step": 45237, "epoch": 269} {"train_loss": -8.091394424438477, "global_step": 45238, "epoch": 269} {"train_loss": -8.142618179321289, "global_step": 45239, "epoch": 269} {"train_loss": -8.147075653076172, "global_step": 45240, "epoch": 269} {"train_loss": -8.047124862670898, "global_step": 45241, "epoch": 269} {"train_loss": -7.967520713806152, "global_step": 45242, "epoch": 269} {"train_loss": -8.0589599609375, "global_step": 45243, "epoch": 269} {"train_loss": -8.139708518981934, "global_step": 45244, "epoch": 269} {"train_loss": -8.110218048095703, "global_step": 45245, "epoch": 269} {"train_loss": -8.233837127685547, "global_step": 45246, "epoch": 269} {"train_loss": -7.973916053771973, "global_step": 45247, "epoch": 269} {"train_loss": -8.216854095458984, "global_step": 45248, "epoch": 269} {"train_loss": -8.122489929199219, "global_step": 45249, "epoch": 269} {"train_loss": -8.009525299072266, "global_step": 45250, "epoch": 269} {"train_loss": -8.192357063293457, "global_step": 45251, "epoch": 269} {"train_loss": -8.184537887573242, "global_step": 45252, "epoch": 269} {"train_loss": -8.39633560180664, "global_step": 45253, "epoch": 269} {"train_loss": -8.205236434936523, "global_step": 45254, "epoch": 269} {"train_loss": -8.299922943115234, "global_step": 45255, "epoch": 269} {"train_loss": -8.06323528289795, "global_step": 45256, "epoch": 269} {"train_loss": -8.075565338134766, "global_step": 45257, "epoch": 269} {"train_loss": -8.321001052856445, "global_step": 45258, "epoch": 269} {"train_loss": -8.559100151062012, "global_step": 45259, "epoch": 269} {"train_loss": -8.21397590637207, "global_step": 45260, "epoch": 269} {"train_loss": -8.241678237915039, "global_step": 45261, "epoch": 269} {"train_loss": -8.24327564239502, "global_step": 45262, "epoch": 269} {"train_loss": -8.072687149047852, "global_step": 45263, "epoch": 269} {"train_loss": -8.011215209960938, "global_step": 45264, "epoch": 269} {"train_loss": -7.885620594024658, "global_step": 45265, "epoch": 269} {"train_loss": -8.088048934936523, "global_step": 45266, "epoch": 269} {"train_loss": -8.06893539428711, "global_step": 45267, "epoch": 269} {"train_loss": -8.092239379882812, "global_step": 45268, "epoch": 269} {"train_loss": -8.184638977050781, "global_step": 45269, "epoch": 269} {"train_loss": -8.185394287109375, "global_step": 45270, "epoch": 269} {"train_loss": -8.096309661865234, "global_step": 45271, "epoch": 269} {"train_loss": -8.061220169067383, "global_step": 45272, "epoch": 269} {"train_loss": -8.123278617858887, "global_step": 45273, "epoch": 269} {"train_loss": -8.109092712402344, "global_step": 45274, "epoch": 269} {"train_loss": -8.108649253845215, "global_step": 45275, "epoch": 269} {"train_loss": -8.517223358154297, "global_step": 45276, "epoch": 269} {"train_loss": -7.979339122772217, "global_step": 45277, "epoch": 269} {"train_loss": -8.216682434082031, "global_step": 45278, "epoch": 269} {"train_loss": -8.201257705688477, "global_step": 45279, "epoch": 269} {"train_loss": -8.003782272338867, "global_step": 45280, "epoch": 269} {"train_loss": -7.976780891418457, "global_step": 45281, "epoch": 269} {"train_loss": -8.053594589233398, "global_step": 45282, "epoch": 269} {"train_loss": -7.986050605773926, "global_step": 45283, "epoch": 269} {"train_loss": -7.837703704833984, "global_step": 45284, "epoch": 269} {"train_loss": -8.174022674560547, "global_step": 45285, "epoch": 269} {"train_loss": -8.17790412902832, "global_step": 45286, "epoch": 269} {"train_loss": -7.772757530212402, "global_step": 45287, "epoch": 269} {"train_loss": -7.906573295593262, "global_step": 45288, "epoch": 269} {"train_loss": -8.028472900390625, "global_step": 45289, "epoch": 269} {"train_loss": -8.17219352722168, "global_step": 45290, "epoch": 269} {"train_loss": -8.277215957641602, "global_step": 45291, "epoch": 269} {"train_loss": -8.304010391235352, "global_step": 45292, "epoch": 269} {"train_loss": -8.02314567565918, "global_step": 45293, "epoch": 269} {"train_loss": -8.121481895446777, "global_step": 45294, "epoch": 269} {"train_loss": -7.959589958190918, "global_step": 45295, "epoch": 269} {"train_loss": -8.013999938964844, "global_step": 45296, "epoch": 269} {"train_loss": -7.844363212585449, "global_step": 45297, "epoch": 269} {"train_loss": -8.15916633605957, "global_step": 45298, "epoch": 269} {"train_loss": -7.9202117919921875, "global_step": 45299, "epoch": 269} {"train_loss": -8.084813117980957, "global_step": 45300, "epoch": 269} {"train_loss": -8.023232460021973, "global_step": 45301, "epoch": 269} {"train_loss": -7.869632720947266, "global_step": 45302, "epoch": 269} {"train_loss": -8.08052921295166, "global_step": 45303, "epoch": 269} {"train_loss": -7.907835483551025, "global_step": 45304, "epoch": 269} {"train_loss": -8.101634979248047, "global_step": 45305, "epoch": 269} {"train_loss": -7.895855903625488, "global_step": 45306, "epoch": 269} {"train_loss": -8.047493934631348, "global_step": 45307, "epoch": 269} {"train_loss": -8.001703262329102, "global_step": 45308, "epoch": 269} {"train_loss": -8.026834487915039, "global_step": 45309, "epoch": 269} {"train_loss": -8.147281646728516, "global_step": 45310, "epoch": 269} {"train_loss": -8.043107986450195, "global_step": 45311, "epoch": 269} {"train_loss": -8.17451286315918, "global_step": 45312, "epoch": 269} {"train_loss": -8.36968994140625, "global_step": 45313, "epoch": 269} {"train_loss": -8.137351989746094, "global_step": 45314, "epoch": 269} {"train_loss": -8.033467292785645, "global_step": 45315, "epoch": 269} {"train_loss": -8.077370643615723, "global_step": 45316, "epoch": 269} {"train_loss": -8.10062313079834, "global_step": 45317, "epoch": 269} {"train_loss": -8.122758865356445, "global_step": 45318, "epoch": 269} {"train_loss": -8.1635103225708, "global_step": 45319, "epoch": 269} {"train_loss": -8.112258911132812, "global_step": 45320, "epoch": 269} {"train_loss": -8.289886474609375, "global_step": 45321, "epoch": 269} {"train_loss": -8.058433532714844, "global_step": 45322, "epoch": 269} {"train_loss": -8.123358726501465, "global_step": 45323, "epoch": 269} {"train_loss": -8.021717071533203, "global_step": 45324, "epoch": 269} {"train_loss": -8.036361694335938, "global_step": 45325, "epoch": 269} {"train_loss": -8.27164077758789, "global_step": 45326, "epoch": 269} {"train_loss": -8.197196006774902, "global_step": 45327, "epoch": 269} {"train_loss": -8.095069885253906, "global_step": 45328, "epoch": 269} {"train_loss": -8.290287971496582, "global_step": 45329, "epoch": 269} {"train_loss": -8.372650146484375, "global_step": 45330, "epoch": 269} {"train_loss": -8.04460620880127, "global_step": 45331, "epoch": 269} {"train_loss": -8.317646026611328, "global_step": 45332, "epoch": 269} {"train_loss": -8.387310981750488, "global_step": 45333, "epoch": 269} {"train_loss": -8.120721817016602, "global_step": 45334, "epoch": 269} {"train_loss": -8.306963920593262, "global_step": 45335, "epoch": 269} {"train_loss": -8.213946342468262, "global_step": 45336, "epoch": 269} {"train_loss": -8.204560279846191, "global_step": 45337, "epoch": 269} {"train_loss": -8.107275009155273, "global_step": 45338, "epoch": 269} {"train_loss": -8.123964309692383, "global_step": 45339, "epoch": 269} {"train_loss": -8.451892852783203, "global_step": 45340, "epoch": 269} {"train_loss": -8.281686782836914, "global_step": 45341, "epoch": 269} {"train_loss": -8.373138427734375, "global_step": 45342, "epoch": 269} {"train_loss": -8.368719100952148, "global_step": 45343, "epoch": 269} {"train_loss": -8.334280014038086, "global_step": 45344, "epoch": 269} {"train_loss": -8.249105453491211, "global_step": 45345, "epoch": 269} {"train_loss": -8.237771987915039, "global_step": 45346, "epoch": 269} {"train_loss": -8.139406204223633, "global_step": 45347, "epoch": 269} {"train_loss": -8.031917572021484, "global_step": 45348, "epoch": 269} {"train_loss": -8.037651062011719, "global_step": 45349, "epoch": 269} {"train_loss": -7.929351329803467, "global_step": 45350, "epoch": 269} {"train_loss": -7.868101596832275, "global_step": 45351, "epoch": 269} {"train_loss": -7.45664119720459, "global_step": 45352, "epoch": 269} {"train_loss": -8.157639503479004, "global_step": 45353, "epoch": 269} {"train_loss": -8.099825859069824, "global_step": 45354, "epoch": 269} {"train_loss": -8.035257339477539, "global_step": 45355, "epoch": 269} {"train_loss": -8.002477645874023, "global_step": 45356, "epoch": 269} {"train_loss": -7.910172462463379, "global_step": 45357, "epoch": 269} {"train_loss": -7.931704521179199, "global_step": 45358, "epoch": 269} {"train_loss": -8.10718891450337, "global_step": 45359, "epoch": 269, "val_loss": 186210.90625} {"train_loss": -7.959600448608398, "global_step": 45360, "epoch": 270} {"train_loss": -7.920831680297852, "global_step": 45361, "epoch": 270} {"train_loss": -8.18006706237793, "global_step": 45362, "epoch": 270} {"train_loss": -7.822975158691406, "global_step": 45363, "epoch": 270} {"train_loss": -8.049760818481445, "global_step": 45364, "epoch": 270} {"train_loss": -8.105384826660156, "global_step": 45365, "epoch": 270} {"train_loss": -8.082212448120117, "global_step": 45366, "epoch": 270} {"train_loss": -8.184410095214844, "global_step": 45367, "epoch": 270} {"train_loss": -7.8041276931762695, "global_step": 45368, "epoch": 270} {"train_loss": -8.035707473754883, "global_step": 45369, "epoch": 270} {"train_loss": -7.763671875, "global_step": 45370, "epoch": 270} {"train_loss": -8.06584358215332, "global_step": 45371, "epoch": 270} {"train_loss": -8.013039588928223, "global_step": 45372, "epoch": 270} {"train_loss": -7.746129989624023, "global_step": 45373, "epoch": 270} {"train_loss": -8.103019714355469, "global_step": 45374, "epoch": 270} {"train_loss": -8.16818618774414, "global_step": 45375, "epoch": 270} {"train_loss": -8.022130966186523, "global_step": 45376, "epoch": 270} {"train_loss": -8.189773559570312, "global_step": 45377, "epoch": 270} {"train_loss": -7.958493232727051, "global_step": 45378, "epoch": 270} {"train_loss": -7.993524074554443, "global_step": 45379, "epoch": 270} {"train_loss": -8.248626708984375, "global_step": 45380, "epoch": 270} {"train_loss": -8.307795524597168, "global_step": 45381, "epoch": 270} {"train_loss": -8.204198837280273, "global_step": 45382, "epoch": 270} {"train_loss": -8.261067390441895, "global_step": 45383, "epoch": 270} {"train_loss": -8.279991149902344, "global_step": 45384, "epoch": 270} {"train_loss": -8.18492603302002, "global_step": 45385, "epoch": 270} {"train_loss": -8.393985748291016, "global_step": 45386, "epoch": 270} {"train_loss": -8.223756790161133, "global_step": 45387, "epoch": 270} {"train_loss": -8.363260269165039, "global_step": 45388, "epoch": 270} {"train_loss": -8.086114883422852, "global_step": 45389, "epoch": 270} {"train_loss": -8.403002738952637, "global_step": 45390, "epoch": 270} {"train_loss": -8.50916862487793, "global_step": 45391, "epoch": 270} {"train_loss": -8.328280448913574, "global_step": 45392, "epoch": 270} {"train_loss": -8.300317764282227, "global_step": 45393, "epoch": 270} {"train_loss": -8.19228744506836, "global_step": 45394, "epoch": 270} {"train_loss": -8.407434463500977, "global_step": 45395, "epoch": 270} {"train_loss": -8.256145477294922, "global_step": 45396, "epoch": 270} {"train_loss": -8.001097679138184, "global_step": 45397, "epoch": 270} {"train_loss": -8.308395385742188, "global_step": 45398, "epoch": 270} {"train_loss": -8.077451705932617, "global_step": 45399, "epoch": 270} {"train_loss": -8.177481651306152, "global_step": 45400, "epoch": 270} {"train_loss": -8.374154090881348, "global_step": 45401, "epoch": 270} {"train_loss": -7.87220573425293, "global_step": 45402, "epoch": 270} {"train_loss": -8.053435325622559, "global_step": 45403, "epoch": 270} {"train_loss": -8.183149337768555, "global_step": 45404, "epoch": 270} {"train_loss": -8.31353759765625, "global_step": 45405, "epoch": 270} {"train_loss": -8.04768180847168, "global_step": 45406, "epoch": 270} {"train_loss": -8.274894714355469, "global_step": 45407, "epoch": 270} {"train_loss": -8.032126426696777, "global_step": 45408, "epoch": 270} {"train_loss": -8.293466567993164, "global_step": 45409, "epoch": 270} {"train_loss": -8.109273910522461, "global_step": 45410, "epoch": 270} {"train_loss": -8.257097244262695, "global_step": 45411, "epoch": 270} {"train_loss": -7.926680564880371, "global_step": 45412, "epoch": 270} {"train_loss": -8.157809257507324, "global_step": 45413, "epoch": 270} {"train_loss": -7.999980449676514, "global_step": 45414, "epoch": 270} {"train_loss": -7.881994724273682, "global_step": 45415, "epoch": 270} {"train_loss": -8.247291564941406, "global_step": 45416, "epoch": 270} {"train_loss": -8.381050109863281, "global_step": 45417, "epoch": 270} {"train_loss": -8.163825988769531, "global_step": 45418, "epoch": 270} {"train_loss": -8.169279098510742, "global_step": 45419, "epoch": 270} {"train_loss": -8.180782318115234, "global_step": 45420, "epoch": 270} {"train_loss": -8.17855167388916, "global_step": 45421, "epoch": 270} {"train_loss": -8.194659233093262, "global_step": 45422, "epoch": 270} {"train_loss": -8.363170623779297, "global_step": 45423, "epoch": 270} {"train_loss": -8.27066421508789, "global_step": 45424, "epoch": 270} {"train_loss": -8.113266944885254, "global_step": 45425, "epoch": 270} {"train_loss": -8.257441520690918, "global_step": 45426, "epoch": 270} {"train_loss": -8.055997848510742, "global_step": 45427, "epoch": 270} {"train_loss": -8.336843490600586, "global_step": 45428, "epoch": 270} {"train_loss": -8.27188777923584, "global_step": 45429, "epoch": 270} {"train_loss": -8.086051940917969, "global_step": 45430, "epoch": 270} {"train_loss": -8.083202362060547, "global_step": 45431, "epoch": 270} {"train_loss": -8.343192100524902, "global_step": 45432, "epoch": 270} {"train_loss": -7.982712745666504, "global_step": 45433, "epoch": 270} {"train_loss": -8.107673645019531, "global_step": 45434, "epoch": 270} {"train_loss": -8.160412788391113, "global_step": 45435, "epoch": 270} {"train_loss": -8.28094482421875, "global_step": 45436, "epoch": 270} {"train_loss": -8.161005020141602, "global_step": 45437, "epoch": 270} {"train_loss": -8.318603515625, "global_step": 45438, "epoch": 270} {"train_loss": -8.091400146484375, "global_step": 45439, "epoch": 270} {"train_loss": -8.265225410461426, "global_step": 45440, "epoch": 270} {"train_loss": -8.222670555114746, "global_step": 45441, "epoch": 270} {"train_loss": -8.037826538085938, "global_step": 45442, "epoch": 270} {"train_loss": -8.251420021057129, "global_step": 45443, "epoch": 270} {"train_loss": -8.153676986694336, "global_step": 45444, "epoch": 270} {"train_loss": -8.269632339477539, "global_step": 45445, "epoch": 270} {"train_loss": -8.0771484375, "global_step": 45446, "epoch": 270} {"train_loss": -8.159917831420898, "global_step": 45447, "epoch": 270} {"train_loss": -8.187493324279785, "global_step": 45448, "epoch": 270} {"train_loss": -8.181051254272461, "global_step": 45449, "epoch": 270} {"train_loss": -8.235940933227539, "global_step": 45450, "epoch": 270} {"train_loss": -7.981992721557617, "global_step": 45451, "epoch": 270} {"train_loss": -8.203977584838867, "global_step": 45452, "epoch": 270} {"train_loss": -8.077465057373047, "global_step": 45453, "epoch": 270} {"train_loss": -8.058561325073242, "global_step": 45454, "epoch": 270} {"train_loss": -7.909188747406006, "global_step": 45455, "epoch": 270} {"train_loss": -8.122737884521484, "global_step": 45456, "epoch": 270} {"train_loss": -7.805963516235352, "global_step": 45457, "epoch": 270} {"train_loss": -8.027034759521484, "global_step": 45458, "epoch": 270} {"train_loss": -7.9905314445495605, "global_step": 45459, "epoch": 270} {"train_loss": -8.070388793945312, "global_step": 45460, "epoch": 270} {"train_loss": -8.091266632080078, "global_step": 45461, "epoch": 270} {"train_loss": -8.146852493286133, "global_step": 45462, "epoch": 270} {"train_loss": -8.253984451293945, "global_step": 45463, "epoch": 270} {"train_loss": -8.395853996276855, "global_step": 45464, "epoch": 270} {"train_loss": -8.252337455749512, "global_step": 45465, "epoch": 270} {"train_loss": -8.156880378723145, "global_step": 45466, "epoch": 270} {"train_loss": -8.390484809875488, "global_step": 45467, "epoch": 270} {"train_loss": -8.007179260253906, "global_step": 45468, "epoch": 270} {"train_loss": -8.356758117675781, "global_step": 45469, "epoch": 270} {"train_loss": -8.211442947387695, "global_step": 45470, "epoch": 270} {"train_loss": -8.232467651367188, "global_step": 45471, "epoch": 270} {"train_loss": -7.976404190063477, "global_step": 45472, "epoch": 270} {"train_loss": -8.309974670410156, "global_step": 45473, "epoch": 270} {"train_loss": -7.8176164627075195, "global_step": 45474, "epoch": 270} {"train_loss": -8.212570190429688, "global_step": 45475, "epoch": 270} {"train_loss": -8.13754653930664, "global_step": 45476, "epoch": 270} {"train_loss": -8.249951362609863, "global_step": 45477, "epoch": 270} {"train_loss": -8.1307373046875, "global_step": 45478, "epoch": 270} {"train_loss": -8.208955764770508, "global_step": 45479, "epoch": 270} {"train_loss": -8.146272659301758, "global_step": 45480, "epoch": 270} {"train_loss": -8.268540382385254, "global_step": 45481, "epoch": 270} {"train_loss": -8.127171516418457, "global_step": 45482, "epoch": 270} {"train_loss": -8.268353462219238, "global_step": 45483, "epoch": 270} {"train_loss": -8.20921802520752, "global_step": 45484, "epoch": 270} {"train_loss": -8.219562530517578, "global_step": 45485, "epoch": 270} {"train_loss": -7.944640159606934, "global_step": 45486, "epoch": 270} {"train_loss": -8.179365158081055, "global_step": 45487, "epoch": 270} {"train_loss": -8.214174270629883, "global_step": 45488, "epoch": 270} {"train_loss": -8.059873580932617, "global_step": 45489, "epoch": 270} {"train_loss": -8.393852233886719, "global_step": 45490, "epoch": 270} {"train_loss": -8.196260452270508, "global_step": 45491, "epoch": 270} {"train_loss": -8.045575141906738, "global_step": 45492, "epoch": 270} {"train_loss": -8.023672103881836, "global_step": 45493, "epoch": 270} {"train_loss": -7.960721492767334, "global_step": 45494, "epoch": 270} {"train_loss": -8.370811462402344, "global_step": 45495, "epoch": 270} {"train_loss": -8.195388793945312, "global_step": 45496, "epoch": 270} {"train_loss": -8.356691360473633, "global_step": 45497, "epoch": 270} {"train_loss": -8.145309448242188, "global_step": 45498, "epoch": 270} {"train_loss": -8.118257522583008, "global_step": 45499, "epoch": 270} {"train_loss": -8.197183609008789, "global_step": 45500, "epoch": 270} {"train_loss": -7.941515922546387, "global_step": 45501, "epoch": 270} {"train_loss": -7.82696533203125, "global_step": 45502, "epoch": 270} {"train_loss": -8.201780319213867, "global_step": 45503, "epoch": 270} {"train_loss": -8.057046890258789, "global_step": 45504, "epoch": 270} {"train_loss": -8.094393730163574, "global_step": 45505, "epoch": 270} {"train_loss": -8.19035530090332, "global_step": 45506, "epoch": 270} {"train_loss": -8.063145637512207, "global_step": 45507, "epoch": 270} {"train_loss": -7.8903326988220215, "global_step": 45508, "epoch": 270} {"train_loss": -8.176429748535156, "global_step": 45509, "epoch": 270} {"train_loss": -8.204505920410156, "global_step": 45510, "epoch": 270} {"train_loss": -8.30010986328125, "global_step": 45511, "epoch": 270} {"train_loss": -8.15049934387207, "global_step": 45512, "epoch": 270} {"train_loss": -8.126178741455078, "global_step": 45513, "epoch": 270} {"train_loss": -8.156927108764648, "global_step": 45514, "epoch": 270} {"train_loss": -7.916436672210693, "global_step": 45515, "epoch": 270} {"train_loss": -8.243946075439453, "global_step": 45516, "epoch": 270} {"train_loss": -8.019771575927734, "global_step": 45517, "epoch": 270} {"train_loss": -8.046956062316895, "global_step": 45518, "epoch": 270} {"train_loss": -8.087246894836426, "global_step": 45519, "epoch": 270} {"train_loss": -7.94516658782959, "global_step": 45520, "epoch": 270} {"train_loss": -7.850302696228027, "global_step": 45521, "epoch": 270} {"train_loss": -7.717911243438721, "global_step": 45522, "epoch": 270} {"train_loss": -8.100956916809082, "global_step": 45523, "epoch": 270} {"train_loss": -7.802224159240723, "global_step": 45524, "epoch": 270} {"train_loss": -8.029370307922363, "global_step": 45525, "epoch": 270} {"train_loss": -7.852025508880615, "global_step": 45526, "epoch": 270} {"train_loss": -8.134692382244836, "global_step": 45527, "epoch": 270, "val_loss": 188010.578125, "train_action_mse_error": 13.783391952514648} {"train_loss": -7.670371055603027, "global_step": 45528, "epoch": 271} {"train_loss": -7.659387111663818, "global_step": 45529, "epoch": 271} {"train_loss": -8.019671440124512, "global_step": 45530, "epoch": 271} {"train_loss": -7.8882975578308105, "global_step": 45531, "epoch": 271} {"train_loss": -7.9364776611328125, "global_step": 45532, "epoch": 271} {"train_loss": -7.9103498458862305, "global_step": 45533, "epoch": 271} {"train_loss": -8.010501861572266, "global_step": 45534, "epoch": 271} {"train_loss": -8.05030345916748, "global_step": 45535, "epoch": 271} {"train_loss": -7.989773750305176, "global_step": 45536, "epoch": 271} {"train_loss": -8.127546310424805, "global_step": 45537, "epoch": 271} {"train_loss": -8.135920524597168, "global_step": 45538, "epoch": 271} {"train_loss": -8.057114601135254, "global_step": 45539, "epoch": 271} {"train_loss": -8.067097663879395, "global_step": 45540, "epoch": 271} {"train_loss": -7.966508865356445, "global_step": 45541, "epoch": 271} {"train_loss": -7.879890441894531, "global_step": 45542, "epoch": 271} {"train_loss": -8.117753028869629, "global_step": 45543, "epoch": 271} {"train_loss": -7.952851295471191, "global_step": 45544, "epoch": 271} {"train_loss": -8.081880569458008, "global_step": 45545, "epoch": 271} {"train_loss": -8.061816215515137, "global_step": 45546, "epoch": 271} {"train_loss": -8.194143295288086, "global_step": 45547, "epoch": 271} {"train_loss": -8.156064987182617, "global_step": 45548, "epoch": 271} {"train_loss": -8.141317367553711, "global_step": 45549, "epoch": 271} {"train_loss": -8.080424308776855, "global_step": 45550, "epoch": 271} {"train_loss": -8.0546875, "global_step": 45551, "epoch": 271} {"train_loss": -8.146432876586914, "global_step": 45552, "epoch": 271} {"train_loss": -8.332697868347168, "global_step": 45553, "epoch": 271} {"train_loss": -8.081497192382812, "global_step": 45554, "epoch": 271} {"train_loss": -8.39556884765625, "global_step": 45555, "epoch": 271} {"train_loss": -8.203716278076172, "global_step": 45556, "epoch": 271} {"train_loss": -8.274627685546875, "global_step": 45557, "epoch": 271} {"train_loss": -8.111652374267578, "global_step": 45558, "epoch": 271} {"train_loss": -8.275276184082031, "global_step": 45559, "epoch": 271} {"train_loss": -8.19931697845459, "global_step": 45560, "epoch": 271} {"train_loss": -8.155143737792969, "global_step": 45561, "epoch": 271} {"train_loss": -8.209651947021484, "global_step": 45562, "epoch": 271} {"train_loss": -8.112114906311035, "global_step": 45563, "epoch": 271} {"train_loss": -8.313308715820312, "global_step": 45564, "epoch": 271} {"train_loss": -8.153802871704102, "global_step": 45565, "epoch": 271} {"train_loss": -8.332984924316406, "global_step": 45566, "epoch": 271} {"train_loss": -8.189790725708008, "global_step": 45567, "epoch": 271} {"train_loss": -8.171213150024414, "global_step": 45568, "epoch": 271} {"train_loss": -8.05655574798584, "global_step": 45569, "epoch": 271} {"train_loss": -8.185371398925781, "global_step": 45570, "epoch": 271} {"train_loss": -7.996241092681885, "global_step": 45571, "epoch": 271} {"train_loss": -8.143318176269531, "global_step": 45572, "epoch": 271} {"train_loss": -8.110456466674805, "global_step": 45573, "epoch": 271} {"train_loss": -8.077547073364258, "global_step": 45574, "epoch": 271} {"train_loss": -7.909191608428955, "global_step": 45575, "epoch": 271} {"train_loss": -8.013833999633789, "global_step": 45576, "epoch": 271} {"train_loss": -8.001290321350098, "global_step": 45577, "epoch": 271} {"train_loss": -8.228321075439453, "global_step": 45578, "epoch": 271} {"train_loss": -7.972609996795654, "global_step": 45579, "epoch": 271} {"train_loss": -8.102510452270508, "global_step": 45580, "epoch": 271} {"train_loss": -8.085912704467773, "global_step": 45581, "epoch": 271} {"train_loss": -8.12425422668457, "global_step": 45582, "epoch": 271} {"train_loss": -7.839601516723633, "global_step": 45583, "epoch": 271} {"train_loss": -8.055154800415039, "global_step": 45584, "epoch": 271} {"train_loss": -7.9977593421936035, "global_step": 45585, "epoch": 271} {"train_loss": -8.287322998046875, "global_step": 45586, "epoch": 271} {"train_loss": -8.129362106323242, "global_step": 45587, "epoch": 271} {"train_loss": -8.038982391357422, "global_step": 45588, "epoch": 271} {"train_loss": -8.324237823486328, "global_step": 45589, "epoch": 271} {"train_loss": -8.199764251708984, "global_step": 45590, "epoch": 271} {"train_loss": -8.166803359985352, "global_step": 45591, "epoch": 271} {"train_loss": -8.255399703979492, "global_step": 45592, "epoch": 271} {"train_loss": -8.238842010498047, "global_step": 45593, "epoch": 271} {"train_loss": -8.102224349975586, "global_step": 45594, "epoch": 271} {"train_loss": -8.181668281555176, "global_step": 45595, "epoch": 271} {"train_loss": -8.255661010742188, "global_step": 45596, "epoch": 271} {"train_loss": -8.173739433288574, "global_step": 45597, "epoch": 271} {"train_loss": -8.097799301147461, "global_step": 45598, "epoch": 271} {"train_loss": -8.100345611572266, "global_step": 45599, "epoch": 271} {"train_loss": -8.169620513916016, "global_step": 45600, "epoch": 271} {"train_loss": -8.193061828613281, "global_step": 45601, "epoch": 271} {"train_loss": -8.2351713180542, "global_step": 45602, "epoch": 271} {"train_loss": -8.24616813659668, "global_step": 45603, "epoch": 271} {"train_loss": -8.382427215576172, "global_step": 45604, "epoch": 271} {"train_loss": -8.295143127441406, "global_step": 45605, "epoch": 271} {"train_loss": -8.170513153076172, "global_step": 45606, "epoch": 271} {"train_loss": -8.205633163452148, "global_step": 45607, "epoch": 271} {"train_loss": -8.123791694641113, "global_step": 45608, "epoch": 271} {"train_loss": -8.283111572265625, "global_step": 45609, "epoch": 271} {"train_loss": -8.407087326049805, "global_step": 45610, "epoch": 271} {"train_loss": -8.20766544342041, "global_step": 45611, "epoch": 271} {"train_loss": -8.35579776763916, "global_step": 45612, "epoch": 271} {"train_loss": -8.105293273925781, "global_step": 45613, "epoch": 271} {"train_loss": -8.1170015335083, "global_step": 45614, "epoch": 271} {"train_loss": -7.874606132507324, "global_step": 45615, "epoch": 271} {"train_loss": -8.204292297363281, "global_step": 45616, "epoch": 271} {"train_loss": -7.98801851272583, "global_step": 45617, "epoch": 271} {"train_loss": -8.171045303344727, "global_step": 45618, "epoch": 271} {"train_loss": -7.857585430145264, "global_step": 45619, "epoch": 271} {"train_loss": -8.048933029174805, "global_step": 45620, "epoch": 271} {"train_loss": -7.984856128692627, "global_step": 45621, "epoch": 271} {"train_loss": -7.941309928894043, "global_step": 45622, "epoch": 271} {"train_loss": -8.157415390014648, "global_step": 45623, "epoch": 271} {"train_loss": -8.320338249206543, "global_step": 45624, "epoch": 271} {"train_loss": -8.020447731018066, "global_step": 45625, "epoch": 271} {"train_loss": -8.249358177185059, "global_step": 45626, "epoch": 271} {"train_loss": -8.204854965209961, "global_step": 45627, "epoch": 271} {"train_loss": -8.083770751953125, "global_step": 45628, "epoch": 271} {"train_loss": -8.197662353515625, "global_step": 45629, "epoch": 271} {"train_loss": -8.225950241088867, "global_step": 45630, "epoch": 271} {"train_loss": -8.223278045654297, "global_step": 45631, "epoch": 271} {"train_loss": -8.306681632995605, "global_step": 45632, "epoch": 271} {"train_loss": -8.129961967468262, "global_step": 45633, "epoch": 271} {"train_loss": -8.331018447875977, "global_step": 45634, "epoch": 271} {"train_loss": -8.139837265014648, "global_step": 45635, "epoch": 271} {"train_loss": -8.049007415771484, "global_step": 45636, "epoch": 271} {"train_loss": -8.139115333557129, "global_step": 45637, "epoch": 271} {"train_loss": -8.138972282409668, "global_step": 45638, "epoch": 271} {"train_loss": -8.32754898071289, "global_step": 45639, "epoch": 271} {"train_loss": -8.045764923095703, "global_step": 45640, "epoch": 271} {"train_loss": -8.486927032470703, "global_step": 45641, "epoch": 271} {"train_loss": -8.235135078430176, "global_step": 45642, "epoch": 271} {"train_loss": -8.145291328430176, "global_step": 45643, "epoch": 271} {"train_loss": -8.343409538269043, "global_step": 45644, "epoch": 271} {"train_loss": -8.384611129760742, "global_step": 45645, "epoch": 271} {"train_loss": -8.13200855255127, "global_step": 45646, "epoch": 271} {"train_loss": -8.278976440429688, "global_step": 45647, "epoch": 271} {"train_loss": -8.461201667785645, "global_step": 45648, "epoch": 271} {"train_loss": -8.317541122436523, "global_step": 45649, "epoch": 271} {"train_loss": -8.097487449645996, "global_step": 45650, "epoch": 271} {"train_loss": -8.225872039794922, "global_step": 45651, "epoch": 271} {"train_loss": -8.163888931274414, "global_step": 45652, "epoch": 271} {"train_loss": -8.263959884643555, "global_step": 45653, "epoch": 271} {"train_loss": -8.464887619018555, "global_step": 45654, "epoch": 271} {"train_loss": -8.357025146484375, "global_step": 45655, "epoch": 271} {"train_loss": -8.239151954650879, "global_step": 45656, "epoch": 271} {"train_loss": -8.164793968200684, "global_step": 45657, "epoch": 271} {"train_loss": -8.259608268737793, "global_step": 45658, "epoch": 271} {"train_loss": -8.323763847351074, "global_step": 45659, "epoch": 271} {"train_loss": -8.399402618408203, "global_step": 45660, "epoch": 271} {"train_loss": -8.260147094726562, "global_step": 45661, "epoch": 271} {"train_loss": -8.350122451782227, "global_step": 45662, "epoch": 271} {"train_loss": -8.17690658569336, "global_step": 45663, "epoch": 271} {"train_loss": -8.158143043518066, "global_step": 45664, "epoch": 271} {"train_loss": -7.982906818389893, "global_step": 45665, "epoch": 271} {"train_loss": -8.149425506591797, "global_step": 45666, "epoch": 271} {"train_loss": -8.10580062866211, "global_step": 45667, "epoch": 271} {"train_loss": -8.084247589111328, "global_step": 45668, "epoch": 271} {"train_loss": -8.193746566772461, "global_step": 45669, "epoch": 271} {"train_loss": -8.0017671585083, "global_step": 45670, "epoch": 271} {"train_loss": -8.090143203735352, "global_step": 45671, "epoch": 271} {"train_loss": -8.060749053955078, "global_step": 45672, "epoch": 271} {"train_loss": -8.226829528808594, "global_step": 45673, "epoch": 271} {"train_loss": -8.072877883911133, "global_step": 45674, "epoch": 271} {"train_loss": -8.293174743652344, "global_step": 45675, "epoch": 271} {"train_loss": -8.219356536865234, "global_step": 45676, "epoch": 271} {"train_loss": -8.27464485168457, "global_step": 45677, "epoch": 271} {"train_loss": -7.958401203155518, "global_step": 45678, "epoch": 271} {"train_loss": -8.418258666992188, "global_step": 45679, "epoch": 271} {"train_loss": -8.218742370605469, "global_step": 45680, "epoch": 271} {"train_loss": -8.325353622436523, "global_step": 45681, "epoch": 271} {"train_loss": -8.12086296081543, "global_step": 45682, "epoch": 271} {"train_loss": -8.180398941040039, "global_step": 45683, "epoch": 271} {"train_loss": -8.056809425354004, "global_step": 45684, "epoch": 271} {"train_loss": -8.141548156738281, "global_step": 45685, "epoch": 271} {"train_loss": -7.720534324645996, "global_step": 45686, "epoch": 271} {"train_loss": -8.220125198364258, "global_step": 45687, "epoch": 271} {"train_loss": -8.09969425201416, "global_step": 45688, "epoch": 271} {"train_loss": -7.915284156799316, "global_step": 45689, "epoch": 271} {"train_loss": -8.123641014099121, "global_step": 45690, "epoch": 271} {"train_loss": -8.174196243286133, "global_step": 45691, "epoch": 271} {"train_loss": -7.932868957519531, "global_step": 45692, "epoch": 271} {"train_loss": -8.254169464111328, "global_step": 45693, "epoch": 271} {"train_loss": -8.215771675109863, "global_step": 45694, "epoch": 271} {"train_loss": -8.149198449793316, "global_step": 45695, "epoch": 271, "val_loss": 187795.796875} {"train_loss": -8.151416778564453, "global_step": 45696, "epoch": 272} {"train_loss": -8.169158935546875, "global_step": 45697, "epoch": 272} {"train_loss": -8.333789825439453, "global_step": 45698, "epoch": 272} {"train_loss": -8.242549896240234, "global_step": 45699, "epoch": 272} {"train_loss": -8.068246841430664, "global_step": 45700, "epoch": 272} {"train_loss": -8.296062469482422, "global_step": 45701, "epoch": 272} {"train_loss": -7.9157395362854, "global_step": 45702, "epoch": 272} {"train_loss": -8.094322204589844, "global_step": 45703, "epoch": 272} {"train_loss": -8.172273635864258, "global_step": 45704, "epoch": 272} {"train_loss": -8.403786659240723, "global_step": 45705, "epoch": 272} {"train_loss": -8.401244163513184, "global_step": 45706, "epoch": 272} {"train_loss": -8.397371292114258, "global_step": 45707, "epoch": 272} {"train_loss": -8.299467086791992, "global_step": 45708, "epoch": 272} {"train_loss": -8.371816635131836, "global_step": 45709, "epoch": 272} {"train_loss": -8.436319351196289, "global_step": 45710, "epoch": 272} {"train_loss": -8.391461372375488, "global_step": 45711, "epoch": 272} {"train_loss": -8.277880668640137, "global_step": 45712, "epoch": 272} {"train_loss": -8.401735305786133, "global_step": 45713, "epoch": 272} {"train_loss": -8.251443862915039, "global_step": 45714, "epoch": 272} {"train_loss": -8.24478816986084, "global_step": 45715, "epoch": 272} {"train_loss": -8.347481727600098, "global_step": 45716, "epoch": 272} {"train_loss": -8.202742576599121, "global_step": 45717, "epoch": 272} {"train_loss": -8.276330947875977, "global_step": 45718, "epoch": 272} {"train_loss": -8.470071792602539, "global_step": 45719, "epoch": 272} {"train_loss": -8.139683723449707, "global_step": 45720, "epoch": 272} {"train_loss": -8.175886154174805, "global_step": 45721, "epoch": 272} {"train_loss": -8.403593063354492, "global_step": 45722, "epoch": 272} {"train_loss": -7.984668731689453, "global_step": 45723, "epoch": 272} {"train_loss": -8.010110855102539, "global_step": 45724, "epoch": 272} {"train_loss": -8.402987480163574, "global_step": 45725, "epoch": 272} {"train_loss": -8.029951095581055, "global_step": 45726, "epoch": 272} {"train_loss": -8.024177551269531, "global_step": 45727, "epoch": 272} {"train_loss": -8.07208251953125, "global_step": 45728, "epoch": 272} {"train_loss": -7.982645034790039, "global_step": 45729, "epoch": 272} {"train_loss": -7.971970558166504, "global_step": 45730, "epoch": 272} {"train_loss": -8.102333068847656, "global_step": 45731, "epoch": 272} {"train_loss": -8.109857559204102, "global_step": 45732, "epoch": 272} {"train_loss": -7.844010353088379, "global_step": 45733, "epoch": 272} {"train_loss": -8.10853385925293, "global_step": 45734, "epoch": 272} {"train_loss": -8.103068351745605, "global_step": 45735, "epoch": 272} {"train_loss": -8.037198066711426, "global_step": 45736, "epoch": 272} {"train_loss": -8.152326583862305, "global_step": 45737, "epoch": 272} {"train_loss": -8.090221405029297, "global_step": 45738, "epoch": 272} {"train_loss": -8.296077728271484, "global_step": 45739, "epoch": 272} {"train_loss": -8.162811279296875, "global_step": 45740, "epoch": 272} {"train_loss": -7.962630271911621, "global_step": 45741, "epoch": 272} {"train_loss": -8.32909870147705, "global_step": 45742, "epoch": 272} {"train_loss": -8.361519813537598, "global_step": 45743, "epoch": 272} {"train_loss": -8.378623008728027, "global_step": 45744, "epoch": 272} {"train_loss": -8.233423233032227, "global_step": 45745, "epoch": 272} {"train_loss": -8.054717063903809, "global_step": 45746, "epoch": 272} {"train_loss": -8.194829940795898, "global_step": 45747, "epoch": 272} {"train_loss": -8.30795669555664, "global_step": 45748, "epoch": 272} {"train_loss": -8.293514251708984, "global_step": 45749, "epoch": 272} {"train_loss": -8.249979972839355, "global_step": 45750, "epoch": 272} {"train_loss": -8.306669235229492, "global_step": 45751, "epoch": 272} {"train_loss": -8.203786849975586, "global_step": 45752, "epoch": 272} {"train_loss": -8.099955558776855, "global_step": 45753, "epoch": 272} {"train_loss": -8.27444076538086, "global_step": 45754, "epoch": 272} {"train_loss": -8.316145896911621, "global_step": 45755, "epoch": 272} {"train_loss": -8.357561111450195, "global_step": 45756, "epoch": 272} {"train_loss": -8.215557098388672, "global_step": 45757, "epoch": 272} {"train_loss": -8.28622817993164, "global_step": 45758, "epoch": 272} {"train_loss": -8.233798027038574, "global_step": 45759, "epoch": 272} {"train_loss": -8.171091079711914, "global_step": 45760, "epoch": 272} {"train_loss": -8.420069694519043, "global_step": 45761, "epoch": 272} {"train_loss": -8.207047462463379, "global_step": 45762, "epoch": 272} {"train_loss": -8.239646911621094, "global_step": 45763, "epoch": 272} {"train_loss": -7.785844802856445, "global_step": 45764, "epoch": 272} {"train_loss": -8.228189468383789, "global_step": 45765, "epoch": 272} {"train_loss": -7.723677635192871, "global_step": 45766, "epoch": 272} {"train_loss": -7.794719696044922, "global_step": 45767, "epoch": 272} {"train_loss": -8.304255485534668, "global_step": 45768, "epoch": 272} {"train_loss": -7.9518537521362305, "global_step": 45769, "epoch": 272} {"train_loss": -8.053291320800781, "global_step": 45770, "epoch": 272} {"train_loss": -7.9982829093933105, "global_step": 45771, "epoch": 272} {"train_loss": -7.955921173095703, "global_step": 45772, "epoch": 272} {"train_loss": -8.15930461883545, "global_step": 45773, "epoch": 272} {"train_loss": -8.261608123779297, "global_step": 45774, "epoch": 272} {"train_loss": -8.077537536621094, "global_step": 45775, "epoch": 272} {"train_loss": -8.165043830871582, "global_step": 45776, "epoch": 272} {"train_loss": -8.007553100585938, "global_step": 45777, "epoch": 272} {"train_loss": -8.15884780883789, "global_step": 45778, "epoch": 272} {"train_loss": -8.080906867980957, "global_step": 45779, "epoch": 272} {"train_loss": -8.050925254821777, "global_step": 45780, "epoch": 272} {"train_loss": -8.368051528930664, "global_step": 45781, "epoch": 272} {"train_loss": -7.990363121032715, "global_step": 45782, "epoch": 272} {"train_loss": -8.095220565795898, "global_step": 45783, "epoch": 272} {"train_loss": -8.427050590515137, "global_step": 45784, "epoch": 272} {"train_loss": -8.239059448242188, "global_step": 45785, "epoch": 272} {"train_loss": -8.283288955688477, "global_step": 45786, "epoch": 272} {"train_loss": -8.141357421875, "global_step": 45787, "epoch": 272} {"train_loss": -8.244945526123047, "global_step": 45788, "epoch": 272} {"train_loss": -8.37238883972168, "global_step": 45789, "epoch": 272} {"train_loss": -8.257709503173828, "global_step": 45790, "epoch": 272} {"train_loss": -8.305994033813477, "global_step": 45791, "epoch": 272} {"train_loss": -8.261951446533203, "global_step": 45792, "epoch": 272} {"train_loss": -8.441680908203125, "global_step": 45793, "epoch": 272} {"train_loss": -8.221749305725098, "global_step": 45794, "epoch": 272} {"train_loss": -8.029300689697266, "global_step": 45795, "epoch": 272} {"train_loss": -8.210151672363281, "global_step": 45796, "epoch": 272} {"train_loss": -8.24950885772705, "global_step": 45797, "epoch": 272} {"train_loss": -8.235308647155762, "global_step": 45798, "epoch": 272} {"train_loss": -8.235696792602539, "global_step": 45799, "epoch": 272} {"train_loss": -7.961647033691406, "global_step": 45800, "epoch": 272} {"train_loss": -8.1465425491333, "global_step": 45801, "epoch": 272} {"train_loss": -8.076327323913574, "global_step": 45802, "epoch": 272} {"train_loss": -8.217798233032227, "global_step": 45803, "epoch": 272} {"train_loss": -8.19415283203125, "global_step": 45804, "epoch": 272} {"train_loss": -8.378965377807617, "global_step": 45805, "epoch": 272} {"train_loss": -8.097314834594727, "global_step": 45806, "epoch": 272} {"train_loss": -8.04185676574707, "global_step": 45807, "epoch": 272} {"train_loss": -8.07379150390625, "global_step": 45808, "epoch": 272} {"train_loss": -8.130879402160645, "global_step": 45809, "epoch": 272} {"train_loss": -8.050029754638672, "global_step": 45810, "epoch": 272} {"train_loss": -8.237594604492188, "global_step": 45811, "epoch": 272} {"train_loss": -8.201457023620605, "global_step": 45812, "epoch": 272} {"train_loss": -8.11751651763916, "global_step": 45813, "epoch": 272} {"train_loss": -8.208093643188477, "global_step": 45814, "epoch": 272} {"train_loss": -8.187155723571777, "global_step": 45815, "epoch": 272} {"train_loss": -7.9985671043396, "global_step": 45816, "epoch": 272} {"train_loss": -8.351271629333496, "global_step": 45817, "epoch": 272} {"train_loss": -8.182621955871582, "global_step": 45818, "epoch": 272} {"train_loss": -8.163822174072266, "global_step": 45819, "epoch": 272} {"train_loss": -8.104574203491211, "global_step": 45820, "epoch": 272} {"train_loss": -8.174324989318848, "global_step": 45821, "epoch": 272} {"train_loss": -8.185226440429688, "global_step": 45822, "epoch": 272} {"train_loss": -8.227180480957031, "global_step": 45823, "epoch": 272} {"train_loss": -8.265789031982422, "global_step": 45824, "epoch": 272} {"train_loss": -7.866057395935059, "global_step": 45825, "epoch": 272} {"train_loss": -8.277508735656738, "global_step": 45826, "epoch": 272} {"train_loss": -8.123382568359375, "global_step": 45827, "epoch": 272} {"train_loss": -8.009111404418945, "global_step": 45828, "epoch": 272} {"train_loss": -8.33501148223877, "global_step": 45829, "epoch": 272} {"train_loss": -8.385028839111328, "global_step": 45830, "epoch": 272} {"train_loss": -7.931996822357178, "global_step": 45831, "epoch": 272} {"train_loss": -8.160697937011719, "global_step": 45832, "epoch": 272} {"train_loss": -8.157028198242188, "global_step": 45833, "epoch": 272} {"train_loss": -8.144376754760742, "global_step": 45834, "epoch": 272} {"train_loss": -8.153654098510742, "global_step": 45835, "epoch": 272} {"train_loss": -8.190229415893555, "global_step": 45836, "epoch": 272} {"train_loss": -8.381913185119629, "global_step": 45837, "epoch": 272} {"train_loss": -8.1650972366333, "global_step": 45838, "epoch": 272} {"train_loss": -8.323858261108398, "global_step": 45839, "epoch": 272} {"train_loss": -8.020912170410156, "global_step": 45840, "epoch": 272} {"train_loss": -8.0188627243042, "global_step": 45841, "epoch": 272} {"train_loss": -8.169315338134766, "global_step": 45842, "epoch": 272} {"train_loss": -8.085248947143555, "global_step": 45843, "epoch": 272} {"train_loss": -8.041848182678223, "global_step": 45844, "epoch": 272} {"train_loss": -8.379344940185547, "global_step": 45845, "epoch": 272} {"train_loss": -8.070730209350586, "global_step": 45846, "epoch": 272} {"train_loss": -8.193824768066406, "global_step": 45847, "epoch": 272} {"train_loss": -8.222123146057129, "global_step": 45848, "epoch": 272} {"train_loss": -8.339134216308594, "global_step": 45849, "epoch": 272} {"train_loss": -8.274734497070312, "global_step": 45850, "epoch": 272} {"train_loss": -8.202131271362305, "global_step": 45851, "epoch": 272} {"train_loss": -8.32784652709961, "global_step": 45852, "epoch": 272} {"train_loss": -8.152406692504883, "global_step": 45853, "epoch": 272} {"train_loss": -8.061028480529785, "global_step": 45854, "epoch": 272} {"train_loss": -8.482348442077637, "global_step": 45855, "epoch": 272} {"train_loss": -8.101473808288574, "global_step": 45856, "epoch": 272} {"train_loss": -8.363115310668945, "global_step": 45857, "epoch": 272} {"train_loss": -8.42348861694336, "global_step": 45858, "epoch": 272} {"train_loss": -8.22677993774414, "global_step": 45859, "epoch": 272} {"train_loss": -8.225549697875977, "global_step": 45860, "epoch": 272} {"train_loss": -8.403253555297852, "global_step": 45861, "epoch": 272} {"train_loss": -8.141039848327637, "global_step": 45862, "epoch": 272} {"train_loss": -8.189243231500898, "global_step": 45863, "epoch": 272, "val_loss": 185171.71875} {"train_loss": -8.182340621948242, "global_step": 45864, "epoch": 273} {"train_loss": -8.412422180175781, "global_step": 45865, "epoch": 273} {"train_loss": -8.102388381958008, "global_step": 45866, "epoch": 273} {"train_loss": -8.338090896606445, "global_step": 45867, "epoch": 273} {"train_loss": -8.231917381286621, "global_step": 45868, "epoch": 273} {"train_loss": -8.343181610107422, "global_step": 45869, "epoch": 273} {"train_loss": -8.304496765136719, "global_step": 45870, "epoch": 273} {"train_loss": -8.346529960632324, "global_step": 45871, "epoch": 273} {"train_loss": -8.304439544677734, "global_step": 45872, "epoch": 273} {"train_loss": -8.303085327148438, "global_step": 45873, "epoch": 273} {"train_loss": -8.197784423828125, "global_step": 45874, "epoch": 273} {"train_loss": -8.093221664428711, "global_step": 45875, "epoch": 273} {"train_loss": -8.15360164642334, "global_step": 45876, "epoch": 273} {"train_loss": -8.335859298706055, "global_step": 45877, "epoch": 273} {"train_loss": -8.182831764221191, "global_step": 45878, "epoch": 273} {"train_loss": -8.245201110839844, "global_step": 45879, "epoch": 273} {"train_loss": -8.103501319885254, "global_step": 45880, "epoch": 273} {"train_loss": -8.166261672973633, "global_step": 45881, "epoch": 273} {"train_loss": -8.076925277709961, "global_step": 45882, "epoch": 273} {"train_loss": -7.987007141113281, "global_step": 45883, "epoch": 273} {"train_loss": -7.868266582489014, "global_step": 45884, "epoch": 273} {"train_loss": -8.13541030883789, "global_step": 45885, "epoch": 273} {"train_loss": -7.9055681228637695, "global_step": 45886, "epoch": 273} {"train_loss": -8.0255708694458, "global_step": 45887, "epoch": 273} {"train_loss": -7.90878963470459, "global_step": 45888, "epoch": 273} {"train_loss": -8.075386047363281, "global_step": 45889, "epoch": 273} {"train_loss": -8.051138877868652, "global_step": 45890, "epoch": 273} {"train_loss": -8.210055351257324, "global_step": 45891, "epoch": 273} {"train_loss": -7.868127822875977, "global_step": 45892, "epoch": 273} {"train_loss": -8.262962341308594, "global_step": 45893, "epoch": 273} {"train_loss": -7.916957855224609, "global_step": 45894, "epoch": 273} {"train_loss": -7.798552513122559, "global_step": 45895, "epoch": 273} {"train_loss": -7.6882805824279785, "global_step": 45896, "epoch": 273} {"train_loss": -8.291492462158203, "global_step": 45897, "epoch": 273} {"train_loss": -8.209684371948242, "global_step": 45898, "epoch": 273} {"train_loss": -8.148516654968262, "global_step": 45899, "epoch": 273} {"train_loss": -8.126224517822266, "global_step": 45900, "epoch": 273} {"train_loss": -8.112390518188477, "global_step": 45901, "epoch": 273} {"train_loss": -8.340728759765625, "global_step": 45902, "epoch": 273} {"train_loss": -8.16417121887207, "global_step": 45903, "epoch": 273} {"train_loss": -8.049484252929688, "global_step": 45904, "epoch": 273} {"train_loss": -8.071433067321777, "global_step": 45905, "epoch": 273} {"train_loss": -8.333252906799316, "global_step": 45906, "epoch": 273} {"train_loss": -8.233190536499023, "global_step": 45907, "epoch": 273} {"train_loss": -8.360447883605957, "global_step": 45908, "epoch": 273} {"train_loss": -7.990113258361816, "global_step": 45909, "epoch": 273} {"train_loss": -8.211929321289062, "global_step": 45910, "epoch": 273} {"train_loss": -8.066152572631836, "global_step": 45911, "epoch": 273} {"train_loss": -8.416083335876465, "global_step": 45912, "epoch": 273} {"train_loss": -8.173416137695312, "global_step": 45913, "epoch": 273} {"train_loss": -8.064189910888672, "global_step": 45914, "epoch": 273} {"train_loss": -8.3124418258667, "global_step": 45915, "epoch": 273} {"train_loss": -8.31707763671875, "global_step": 45916, "epoch": 273} {"train_loss": -7.876091003417969, "global_step": 45917, "epoch": 273} {"train_loss": -8.183794021606445, "global_step": 45918, "epoch": 273} {"train_loss": -7.983625411987305, "global_step": 45919, "epoch": 273} {"train_loss": -8.111493110656738, "global_step": 45920, "epoch": 273} {"train_loss": -7.900735855102539, "global_step": 45921, "epoch": 273} {"train_loss": -8.160784721374512, "global_step": 45922, "epoch": 273} {"train_loss": -8.150118827819824, "global_step": 45923, "epoch": 273} {"train_loss": -7.777044296264648, "global_step": 45924, "epoch": 273} {"train_loss": -8.262664794921875, "global_step": 45925, "epoch": 273} {"train_loss": -7.997735023498535, "global_step": 45926, "epoch": 273} {"train_loss": -8.256568908691406, "global_step": 45927, "epoch": 273} {"train_loss": -7.790612697601318, "global_step": 45928, "epoch": 273} {"train_loss": -8.043569564819336, "global_step": 45929, "epoch": 273} {"train_loss": -7.754498481750488, "global_step": 45930, "epoch": 273} {"train_loss": -8.009133338928223, "global_step": 45931, "epoch": 273} {"train_loss": -8.063294410705566, "global_step": 45932, "epoch": 273} {"train_loss": -7.849948883056641, "global_step": 45933, "epoch": 273} {"train_loss": -7.905962944030762, "global_step": 45934, "epoch": 273} {"train_loss": -7.790948867797852, "global_step": 45935, "epoch": 273} {"train_loss": -8.150491714477539, "global_step": 45936, "epoch": 273} {"train_loss": -7.680130958557129, "global_step": 45937, "epoch": 273} {"train_loss": -7.963647842407227, "global_step": 45938, "epoch": 273} {"train_loss": -7.699806213378906, "global_step": 45939, "epoch": 273} {"train_loss": -7.860018730163574, "global_step": 45940, "epoch": 273} {"train_loss": -7.9087748527526855, "global_step": 45941, "epoch": 273} {"train_loss": -7.817148208618164, "global_step": 45942, "epoch": 273} {"train_loss": -8.117114067077637, "global_step": 45943, "epoch": 273} {"train_loss": -7.712669849395752, "global_step": 45944, "epoch": 273} {"train_loss": -7.895211219787598, "global_step": 45945, "epoch": 273} {"train_loss": -8.167681694030762, "global_step": 45946, "epoch": 273} {"train_loss": -7.932719707489014, "global_step": 45947, "epoch": 273} {"train_loss": -8.156811714172363, "global_step": 45948, "epoch": 273} {"train_loss": -7.978124618530273, "global_step": 45949, "epoch": 273} {"train_loss": -7.7172393798828125, "global_step": 45950, "epoch": 273} {"train_loss": -8.083724975585938, "global_step": 45951, "epoch": 273} {"train_loss": -7.688602447509766, "global_step": 45952, "epoch": 273} {"train_loss": -8.148247718811035, "global_step": 45953, "epoch": 273} {"train_loss": -8.197341918945312, "global_step": 45954, "epoch": 273} {"train_loss": -7.927976608276367, "global_step": 45955, "epoch": 273} {"train_loss": -8.242026329040527, "global_step": 45956, "epoch": 273} {"train_loss": -8.242912292480469, "global_step": 45957, "epoch": 273} {"train_loss": -8.286556243896484, "global_step": 45958, "epoch": 273} {"train_loss": -7.809667587280273, "global_step": 45959, "epoch": 273} {"train_loss": -8.093587875366211, "global_step": 45960, "epoch": 273} {"train_loss": -8.343809127807617, "global_step": 45961, "epoch": 273} {"train_loss": -8.307344436645508, "global_step": 45962, "epoch": 273} {"train_loss": -8.272276878356934, "global_step": 45963, "epoch": 273} {"train_loss": -8.087285995483398, "global_step": 45964, "epoch": 273} {"train_loss": -8.24097728729248, "global_step": 45965, "epoch": 273} {"train_loss": -8.080636024475098, "global_step": 45966, "epoch": 273} {"train_loss": -8.337181091308594, "global_step": 45967, "epoch": 273} {"train_loss": -8.105165481567383, "global_step": 45968, "epoch": 273} {"train_loss": -8.25865364074707, "global_step": 45969, "epoch": 273} {"train_loss": -8.337520599365234, "global_step": 45970, "epoch": 273} {"train_loss": -8.117388725280762, "global_step": 45971, "epoch": 273} {"train_loss": -8.201791763305664, "global_step": 45972, "epoch": 273} {"train_loss": -8.225077629089355, "global_step": 45973, "epoch": 273} {"train_loss": -8.179567337036133, "global_step": 45974, "epoch": 273} {"train_loss": -7.960236549377441, "global_step": 45975, "epoch": 273} {"train_loss": -8.067892074584961, "global_step": 45976, "epoch": 273} {"train_loss": -8.034941673278809, "global_step": 45977, "epoch": 273} {"train_loss": -8.263071060180664, "global_step": 45978, "epoch": 273} {"train_loss": -8.000665664672852, "global_step": 45979, "epoch": 273} {"train_loss": -8.088689804077148, "global_step": 45980, "epoch": 273} {"train_loss": -7.702986240386963, "global_step": 45981, "epoch": 273} {"train_loss": -8.14079761505127, "global_step": 45982, "epoch": 273} {"train_loss": -8.059784889221191, "global_step": 45983, "epoch": 273} {"train_loss": -7.839818000793457, "global_step": 45984, "epoch": 273} {"train_loss": -8.129695892333984, "global_step": 45985, "epoch": 273} {"train_loss": -8.19942855834961, "global_step": 45986, "epoch": 273} {"train_loss": -8.116695404052734, "global_step": 45987, "epoch": 273} {"train_loss": -7.922374248504639, "global_step": 45988, "epoch": 273} {"train_loss": -8.238471984863281, "global_step": 45989, "epoch": 273} {"train_loss": -7.697381019592285, "global_step": 45990, "epoch": 273} {"train_loss": -8.107988357543945, "global_step": 45991, "epoch": 273} {"train_loss": -7.932460784912109, "global_step": 45992, "epoch": 273} {"train_loss": -7.862122058868408, "global_step": 45993, "epoch": 273} {"train_loss": -8.132608413696289, "global_step": 45994, "epoch": 273} {"train_loss": -7.955631732940674, "global_step": 45995, "epoch": 273} {"train_loss": -8.237306594848633, "global_step": 45996, "epoch": 273} {"train_loss": -7.951351165771484, "global_step": 45997, "epoch": 273} {"train_loss": -7.951611518859863, "global_step": 45998, "epoch": 273} {"train_loss": -8.160369873046875, "global_step": 45999, "epoch": 273} {"train_loss": -8.13842487335205, "global_step": 46000, "epoch": 273} {"train_loss": -8.048724174499512, "global_step": 46001, "epoch": 273} {"train_loss": -8.034563064575195, "global_step": 46002, "epoch": 273} {"train_loss": -8.369253158569336, "global_step": 46003, "epoch": 273} {"train_loss": -8.1282958984375, "global_step": 46004, "epoch": 273} {"train_loss": -8.196502685546875, "global_step": 46005, "epoch": 273} {"train_loss": -8.392704010009766, "global_step": 46006, "epoch": 273} {"train_loss": -7.9890875816345215, "global_step": 46007, "epoch": 273} {"train_loss": -8.237081527709961, "global_step": 46008, "epoch": 273} {"train_loss": -8.216958999633789, "global_step": 46009, "epoch": 273} {"train_loss": -8.249090194702148, "global_step": 46010, "epoch": 273} {"train_loss": -8.122495651245117, "global_step": 46011, "epoch": 273} {"train_loss": -8.35200023651123, "global_step": 46012, "epoch": 273} {"train_loss": -8.13612174987793, "global_step": 46013, "epoch": 273} {"train_loss": -8.530423164367676, "global_step": 46014, "epoch": 273} {"train_loss": -8.337343215942383, "global_step": 46015, "epoch": 273} {"train_loss": -8.17238712310791, "global_step": 46016, "epoch": 273} {"train_loss": -8.319965362548828, "global_step": 46017, "epoch": 273} {"train_loss": -8.329412460327148, "global_step": 46018, "epoch": 273} {"train_loss": -7.999941825866699, "global_step": 46019, "epoch": 273} {"train_loss": -8.302727699279785, "global_step": 46020, "epoch": 273} {"train_loss": -8.300463676452637, "global_step": 46021, "epoch": 273} {"train_loss": -8.246601104736328, "global_step": 46022, "epoch": 273} {"train_loss": -8.329184532165527, "global_step": 46023, "epoch": 273} {"train_loss": -8.407234191894531, "global_step": 46024, "epoch": 273} {"train_loss": -8.341691970825195, "global_step": 46025, "epoch": 273} {"train_loss": -8.172552108764648, "global_step": 46026, "epoch": 273} {"train_loss": -8.368143081665039, "global_step": 46027, "epoch": 273} {"train_loss": -8.254292488098145, "global_step": 46028, "epoch": 273} {"train_loss": -7.917759895324707, "global_step": 46029, "epoch": 273} {"train_loss": -8.187735557556152, "global_step": 46030, "epoch": 273} {"train_loss": -8.111269993441445, "global_step": 46031, "epoch": 273, "val_loss": 186432.78125} {"train_loss": -7.973545551300049, "global_step": 46032, "epoch": 274} {"train_loss": -8.219385147094727, "global_step": 46033, "epoch": 274} {"train_loss": -8.13836669921875, "global_step": 46034, "epoch": 274} {"train_loss": -8.195060729980469, "global_step": 46035, "epoch": 274} {"train_loss": -7.7682366371154785, "global_step": 46036, "epoch": 274} {"train_loss": -8.101384162902832, "global_step": 46037, "epoch": 274} {"train_loss": -8.128324508666992, "global_step": 46038, "epoch": 274} {"train_loss": -8.239485740661621, "global_step": 46039, "epoch": 274} {"train_loss": -8.019428253173828, "global_step": 46040, "epoch": 274} {"train_loss": -8.190860748291016, "global_step": 46041, "epoch": 274} {"train_loss": -8.223896026611328, "global_step": 46042, "epoch": 274} {"train_loss": -8.149259567260742, "global_step": 46043, "epoch": 274} {"train_loss": -8.088184356689453, "global_step": 46044, "epoch": 274} {"train_loss": -8.150935173034668, "global_step": 46045, "epoch": 274} {"train_loss": -8.2340087890625, "global_step": 46046, "epoch": 274} {"train_loss": -7.985026836395264, "global_step": 46047, "epoch": 274} {"train_loss": -8.094953536987305, "global_step": 46048, "epoch": 274} {"train_loss": -8.103652954101562, "global_step": 46049, "epoch": 274} {"train_loss": -8.132448196411133, "global_step": 46050, "epoch": 274} {"train_loss": -8.06930160522461, "global_step": 46051, "epoch": 274} {"train_loss": -8.004150390625, "global_step": 46052, "epoch": 274} {"train_loss": -8.28740406036377, "global_step": 46053, "epoch": 274} {"train_loss": -8.232967376708984, "global_step": 46054, "epoch": 274} {"train_loss": -8.211884498596191, "global_step": 46055, "epoch": 274} {"train_loss": -8.158501625061035, "global_step": 46056, "epoch": 274} {"train_loss": -8.490697860717773, "global_step": 46057, "epoch": 274} {"train_loss": -8.03292179107666, "global_step": 46058, "epoch": 274} {"train_loss": -7.913724899291992, "global_step": 46059, "epoch": 274} {"train_loss": -8.35843563079834, "global_step": 46060, "epoch": 274} {"train_loss": -8.283173561096191, "global_step": 46061, "epoch": 274} {"train_loss": -8.161806106567383, "global_step": 46062, "epoch": 274} {"train_loss": -8.176776885986328, "global_step": 46063, "epoch": 274} {"train_loss": -8.238971710205078, "global_step": 46064, "epoch": 274} {"train_loss": -7.636693954467773, "global_step": 46065, "epoch": 274} {"train_loss": -8.564557075500488, "global_step": 46066, "epoch": 274} {"train_loss": -8.016206741333008, "global_step": 46067, "epoch": 274} {"train_loss": -8.251419067382812, "global_step": 46068, "epoch": 274} {"train_loss": -7.806083679199219, "global_step": 46069, "epoch": 274} {"train_loss": -8.284440040588379, "global_step": 46070, "epoch": 274} {"train_loss": -7.733427047729492, "global_step": 46071, "epoch": 274} {"train_loss": -8.11156940460205, "global_step": 46072, "epoch": 274} {"train_loss": -7.999459266662598, "global_step": 46073, "epoch": 274} {"train_loss": -8.112348556518555, "global_step": 46074, "epoch": 274} {"train_loss": -8.184494972229004, "global_step": 46075, "epoch": 274} {"train_loss": -8.03426456451416, "global_step": 46076, "epoch": 274} {"train_loss": -8.080491065979004, "global_step": 46077, "epoch": 274} {"train_loss": -7.971324920654297, "global_step": 46078, "epoch": 274} {"train_loss": -8.168787956237793, "global_step": 46079, "epoch": 274} {"train_loss": -7.932941436767578, "global_step": 46080, "epoch": 274} {"train_loss": -7.894052028656006, "global_step": 46081, "epoch": 274} {"train_loss": -7.887735366821289, "global_step": 46082, "epoch": 274} {"train_loss": -7.8444037437438965, "global_step": 46083, "epoch": 274} {"train_loss": -7.941854000091553, "global_step": 46084, "epoch": 274} {"train_loss": -8.039548873901367, "global_step": 46085, "epoch": 274} {"train_loss": -8.17805290222168, "global_step": 46086, "epoch": 274} {"train_loss": -8.019756317138672, "global_step": 46087, "epoch": 274} {"train_loss": -8.047496795654297, "global_step": 46088, "epoch": 274} {"train_loss": -8.030920028686523, "global_step": 46089, "epoch": 274} {"train_loss": -8.232338905334473, "global_step": 46090, "epoch": 274} {"train_loss": -8.271120071411133, "global_step": 46091, "epoch": 274} {"train_loss": -7.898544788360596, "global_step": 46092, "epoch": 274} {"train_loss": -8.032829284667969, "global_step": 46093, "epoch": 274} {"train_loss": -8.179193496704102, "global_step": 46094, "epoch": 274} {"train_loss": -8.274504661560059, "global_step": 46095, "epoch": 274} {"train_loss": -7.968667030334473, "global_step": 46096, "epoch": 274} {"train_loss": -8.07387924194336, "global_step": 46097, "epoch": 274} {"train_loss": -8.36082935333252, "global_step": 46098, "epoch": 274} {"train_loss": -8.280770301818848, "global_step": 46099, "epoch": 274} {"train_loss": -8.286453247070312, "global_step": 46100, "epoch": 274} {"train_loss": -8.111059188842773, "global_step": 46101, "epoch": 274} {"train_loss": -7.962831497192383, "global_step": 46102, "epoch": 274} {"train_loss": -8.279178619384766, "global_step": 46103, "epoch": 274} {"train_loss": -8.119953155517578, "global_step": 46104, "epoch": 274} {"train_loss": -8.125740051269531, "global_step": 46105, "epoch": 274} {"train_loss": -8.062372207641602, "global_step": 46106, "epoch": 274} {"train_loss": -8.241058349609375, "global_step": 46107, "epoch": 274} {"train_loss": -8.319385528564453, "global_step": 46108, "epoch": 274} {"train_loss": -8.19186782836914, "global_step": 46109, "epoch": 274} {"train_loss": -7.838311672210693, "global_step": 46110, "epoch": 274} {"train_loss": -8.280858993530273, "global_step": 46111, "epoch": 274} {"train_loss": -8.244603157043457, "global_step": 46112, "epoch": 274} {"train_loss": -8.278482437133789, "global_step": 46113, "epoch": 274} {"train_loss": -8.096695899963379, "global_step": 46114, "epoch": 274} {"train_loss": -8.288481712341309, "global_step": 46115, "epoch": 274} {"train_loss": -7.963732719421387, "global_step": 46116, "epoch": 274} {"train_loss": -8.21268367767334, "global_step": 46117, "epoch": 274} {"train_loss": -7.968873977661133, "global_step": 46118, "epoch": 274} {"train_loss": -8.229635238647461, "global_step": 46119, "epoch": 274} {"train_loss": -8.208951950073242, "global_step": 46120, "epoch": 274} {"train_loss": -7.872760772705078, "global_step": 46121, "epoch": 274} {"train_loss": -8.344145774841309, "global_step": 46122, "epoch": 274} {"train_loss": -8.080702781677246, "global_step": 46123, "epoch": 274} {"train_loss": -8.257994651794434, "global_step": 46124, "epoch": 274} {"train_loss": -8.346834182739258, "global_step": 46125, "epoch": 274} {"train_loss": -8.23383903503418, "global_step": 46126, "epoch": 274} {"train_loss": -8.171220779418945, "global_step": 46127, "epoch": 274} {"train_loss": -8.168210983276367, "global_step": 46128, "epoch": 274} {"train_loss": -8.214803695678711, "global_step": 46129, "epoch": 274} {"train_loss": -8.284631729125977, "global_step": 46130, "epoch": 274} {"train_loss": -8.331249237060547, "global_step": 46131, "epoch": 274} {"train_loss": -8.265745162963867, "global_step": 46132, "epoch": 274} {"train_loss": -8.22216510772705, "global_step": 46133, "epoch": 274} {"train_loss": -8.054194450378418, "global_step": 46134, "epoch": 274} {"train_loss": -8.279595375061035, "global_step": 46135, "epoch": 274} {"train_loss": -8.259485244750977, "global_step": 46136, "epoch": 274} {"train_loss": -8.200447082519531, "global_step": 46137, "epoch": 274} {"train_loss": -8.127725601196289, "global_step": 46138, "epoch": 274} {"train_loss": -8.441580772399902, "global_step": 46139, "epoch": 274} {"train_loss": -8.285353660583496, "global_step": 46140, "epoch": 274} {"train_loss": -8.228075981140137, "global_step": 46141, "epoch": 274} {"train_loss": -8.26237678527832, "global_step": 46142, "epoch": 274} {"train_loss": -8.262613296508789, "global_step": 46143, "epoch": 274} {"train_loss": -8.218463897705078, "global_step": 46144, "epoch": 274} {"train_loss": -8.250463485717773, "global_step": 46145, "epoch": 274} {"train_loss": -8.253896713256836, "global_step": 46146, "epoch": 274} {"train_loss": -8.405515670776367, "global_step": 46147, "epoch": 274} {"train_loss": -8.336505889892578, "global_step": 46148, "epoch": 274} {"train_loss": -8.320487976074219, "global_step": 46149, "epoch": 274} {"train_loss": -8.245193481445312, "global_step": 46150, "epoch": 274} {"train_loss": -8.230457305908203, "global_step": 46151, "epoch": 274} {"train_loss": -8.146282196044922, "global_step": 46152, "epoch": 274} {"train_loss": -8.329231262207031, "global_step": 46153, "epoch": 274} {"train_loss": -8.427776336669922, "global_step": 46154, "epoch": 274} {"train_loss": -8.297370910644531, "global_step": 46155, "epoch": 274} {"train_loss": -8.243156433105469, "global_step": 46156, "epoch": 274} {"train_loss": -8.350825309753418, "global_step": 46157, "epoch": 274} {"train_loss": -8.299857139587402, "global_step": 46158, "epoch": 274} {"train_loss": -8.085367202758789, "global_step": 46159, "epoch": 274} {"train_loss": -8.022965431213379, "global_step": 46160, "epoch": 274} {"train_loss": -8.269742965698242, "global_step": 46161, "epoch": 274} {"train_loss": -7.942074298858643, "global_step": 46162, "epoch": 274} {"train_loss": -8.233200073242188, "global_step": 46163, "epoch": 274} {"train_loss": -7.835015296936035, "global_step": 46164, "epoch": 274} {"train_loss": -8.025195121765137, "global_step": 46165, "epoch": 274} {"train_loss": -7.860904693603516, "global_step": 46166, "epoch": 274} {"train_loss": -8.309307098388672, "global_step": 46167, "epoch": 274} {"train_loss": -7.971188068389893, "global_step": 46168, "epoch": 274} {"train_loss": -7.977772235870361, "global_step": 46169, "epoch": 274} {"train_loss": -8.073795318603516, "global_step": 46170, "epoch": 274} {"train_loss": -8.231901168823242, "global_step": 46171, "epoch": 274} {"train_loss": -8.09960651397705, "global_step": 46172, "epoch": 274} {"train_loss": -7.910542011260986, "global_step": 46173, "epoch": 274} {"train_loss": -8.264612197875977, "global_step": 46174, "epoch": 274} {"train_loss": -8.205398559570312, "global_step": 46175, "epoch": 274} {"train_loss": -8.211299896240234, "global_step": 46176, "epoch": 274} {"train_loss": -8.095148086547852, "global_step": 46177, "epoch": 274} {"train_loss": -8.176803588867188, "global_step": 46178, "epoch": 274} {"train_loss": -8.203519821166992, "global_step": 46179, "epoch": 274} {"train_loss": -8.333976745605469, "global_step": 46180, "epoch": 274} {"train_loss": -8.216911315917969, "global_step": 46181, "epoch": 274} {"train_loss": -8.24347972869873, "global_step": 46182, "epoch": 274} {"train_loss": -8.013073921203613, "global_step": 46183, "epoch": 274} {"train_loss": -8.031597137451172, "global_step": 46184, "epoch": 274} {"train_loss": -8.125812530517578, "global_step": 46185, "epoch": 274} {"train_loss": -8.396631240844727, "global_step": 46186, "epoch": 274} {"train_loss": -8.113802909851074, "global_step": 46187, "epoch": 274} {"train_loss": -8.017784118652344, "global_step": 46188, "epoch": 274} {"train_loss": -8.289297103881836, "global_step": 46189, "epoch": 274} {"train_loss": -8.13335132598877, "global_step": 46190, "epoch": 274} {"train_loss": -7.986893653869629, "global_step": 46191, "epoch": 274} {"train_loss": -8.153104782104492, "global_step": 46192, "epoch": 274} {"train_loss": -8.123276710510254, "global_step": 46193, "epoch": 274} {"train_loss": -8.113737106323242, "global_step": 46194, "epoch": 274} {"train_loss": -8.242155075073242, "global_step": 46195, "epoch": 274} {"train_loss": -8.25901985168457, "global_step": 46196, "epoch": 274} {"train_loss": -8.308805465698242, "global_step": 46197, "epoch": 274} {"train_loss": -7.886148452758789, "global_step": 46198, "epoch": 274} {"train_loss": -8.147683560848236, "global_step": 46199, "epoch": 274, "val_loss": 184264.5} {"train_loss": -8.216283798217773, "global_step": 46200, "epoch": 275} {"train_loss": -8.2157621383667, "global_step": 46201, "epoch": 275} {"train_loss": -8.173334121704102, "global_step": 46202, "epoch": 275} {"train_loss": -8.163619041442871, "global_step": 46203, "epoch": 275} {"train_loss": -8.29460620880127, "global_step": 46204, "epoch": 275} {"train_loss": -8.170487403869629, "global_step": 46205, "epoch": 275} {"train_loss": -8.107503890991211, "global_step": 46206, "epoch": 275} {"train_loss": -8.214969635009766, "global_step": 46207, "epoch": 275} {"train_loss": -8.231081008911133, "global_step": 46208, "epoch": 275} {"train_loss": -8.246025085449219, "global_step": 46209, "epoch": 275} {"train_loss": -8.185774803161621, "global_step": 46210, "epoch": 275} {"train_loss": -8.235331535339355, "global_step": 46211, "epoch": 275} {"train_loss": -8.030804634094238, "global_step": 46212, "epoch": 275} {"train_loss": -8.31689739227295, "global_step": 46213, "epoch": 275} {"train_loss": -8.010580062866211, "global_step": 46214, "epoch": 275} {"train_loss": -8.149637222290039, "global_step": 46215, "epoch": 275} {"train_loss": -8.14531135559082, "global_step": 46216, "epoch": 275} {"train_loss": -8.215888023376465, "global_step": 46217, "epoch": 275} {"train_loss": -8.187589645385742, "global_step": 46218, "epoch": 275} {"train_loss": -8.29427433013916, "global_step": 46219, "epoch": 275} {"train_loss": -8.121416091918945, "global_step": 46220, "epoch": 275} {"train_loss": -8.315491676330566, "global_step": 46221, "epoch": 275} {"train_loss": -7.896854400634766, "global_step": 46222, "epoch": 275} {"train_loss": -7.995739459991455, "global_step": 46223, "epoch": 275} {"train_loss": -8.16517162322998, "global_step": 46224, "epoch": 275} {"train_loss": -8.064291000366211, "global_step": 46225, "epoch": 275} {"train_loss": -8.125516891479492, "global_step": 46226, "epoch": 275} {"train_loss": -8.176897048950195, "global_step": 46227, "epoch": 275} {"train_loss": -8.19720458984375, "global_step": 46228, "epoch": 275} {"train_loss": -8.005939483642578, "global_step": 46229, "epoch": 275} {"train_loss": -8.098031997680664, "global_step": 46230, "epoch": 275} {"train_loss": -8.198806762695312, "global_step": 46231, "epoch": 275} {"train_loss": -8.128622055053711, "global_step": 46232, "epoch": 275} {"train_loss": -8.086431503295898, "global_step": 46233, "epoch": 275} {"train_loss": -7.973254203796387, "global_step": 46234, "epoch": 275} {"train_loss": -8.195484161376953, "global_step": 46235, "epoch": 275} {"train_loss": -7.9631547927856445, "global_step": 46236, "epoch": 275} {"train_loss": -8.06981086730957, "global_step": 46237, "epoch": 275} {"train_loss": -8.025812149047852, "global_step": 46238, "epoch": 275} {"train_loss": -8.173519134521484, "global_step": 46239, "epoch": 275} {"train_loss": -8.12198257446289, "global_step": 46240, "epoch": 275} {"train_loss": -8.018501281738281, "global_step": 46241, "epoch": 275} {"train_loss": -8.116985321044922, "global_step": 46242, "epoch": 275} {"train_loss": -8.159390449523926, "global_step": 46243, "epoch": 275} {"train_loss": -8.258304595947266, "global_step": 46244, "epoch": 275} {"train_loss": -8.069326400756836, "global_step": 46245, "epoch": 275} {"train_loss": -8.170482635498047, "global_step": 46246, "epoch": 275} {"train_loss": -8.113566398620605, "global_step": 46247, "epoch": 275} {"train_loss": -8.256000518798828, "global_step": 46248, "epoch": 275} {"train_loss": -8.300537109375, "global_step": 46249, "epoch": 275} {"train_loss": -8.266191482543945, "global_step": 46250, "epoch": 275} {"train_loss": -8.17135238647461, "global_step": 46251, "epoch": 275} {"train_loss": -8.158735275268555, "global_step": 46252, "epoch": 275} {"train_loss": -8.354639053344727, "global_step": 46253, "epoch": 275} {"train_loss": -8.093413352966309, "global_step": 46254, "epoch": 275} {"train_loss": -8.247913360595703, "global_step": 46255, "epoch": 275} {"train_loss": -8.513347625732422, "global_step": 46256, "epoch": 275} {"train_loss": -8.123391151428223, "global_step": 46257, "epoch": 275} {"train_loss": -8.266393661499023, "global_step": 46258, "epoch": 275} {"train_loss": -8.322689056396484, "global_step": 46259, "epoch": 275} {"train_loss": -8.411901473999023, "global_step": 46260, "epoch": 275} {"train_loss": -8.304424285888672, "global_step": 46261, "epoch": 275} {"train_loss": -8.27291488647461, "global_step": 46262, "epoch": 275} {"train_loss": -8.376626968383789, "global_step": 46263, "epoch": 275} {"train_loss": -8.13303279876709, "global_step": 46264, "epoch": 275} {"train_loss": -8.288366317749023, "global_step": 46265, "epoch": 275} {"train_loss": -7.504038333892822, "global_step": 46266, "epoch": 275} {"train_loss": -8.163475036621094, "global_step": 46267, "epoch": 275} {"train_loss": -7.973773002624512, "global_step": 46268, "epoch": 275} {"train_loss": -7.6710405349731445, "global_step": 46269, "epoch": 275} {"train_loss": -7.676748275756836, "global_step": 46270, "epoch": 275} {"train_loss": -7.841638088226318, "global_step": 46271, "epoch": 275} {"train_loss": -7.688387870788574, "global_step": 46272, "epoch": 275} {"train_loss": -7.77853536605835, "global_step": 46273, "epoch": 275} {"train_loss": -7.719002723693848, "global_step": 46274, "epoch": 275} {"train_loss": -7.823712348937988, "global_step": 46275, "epoch": 275} {"train_loss": -7.65571928024292, "global_step": 46276, "epoch": 275} {"train_loss": -7.859304428100586, "global_step": 46277, "epoch": 275} {"train_loss": -7.887422561645508, "global_step": 46278, "epoch": 275} {"train_loss": -7.872589111328125, "global_step": 46279, "epoch": 275} {"train_loss": -7.817360877990723, "global_step": 46280, "epoch": 275} {"train_loss": -8.045555114746094, "global_step": 46281, "epoch": 275} {"train_loss": -7.953418254852295, "global_step": 46282, "epoch": 275} {"train_loss": -7.96785306930542, "global_step": 46283, "epoch": 275} {"train_loss": -7.839897155761719, "global_step": 46284, "epoch": 275} {"train_loss": -8.113313674926758, "global_step": 46285, "epoch": 275} {"train_loss": -7.94549560546875, "global_step": 46286, "epoch": 275} {"train_loss": -8.178838729858398, "global_step": 46287, "epoch": 275} {"train_loss": -8.004606246948242, "global_step": 46288, "epoch": 275} {"train_loss": -8.054215431213379, "global_step": 46289, "epoch": 275} {"train_loss": -8.138189315795898, "global_step": 46290, "epoch": 275} {"train_loss": -8.334909439086914, "global_step": 46291, "epoch": 275} {"train_loss": -8.003684043884277, "global_step": 46292, "epoch": 275} {"train_loss": -8.24767017364502, "global_step": 46293, "epoch": 275} {"train_loss": -8.147758483886719, "global_step": 46294, "epoch": 275} {"train_loss": -8.061921119689941, "global_step": 46295, "epoch": 275} {"train_loss": -8.144122123718262, "global_step": 46296, "epoch": 275} {"train_loss": -8.395313262939453, "global_step": 46297, "epoch": 275} {"train_loss": -8.211467742919922, "global_step": 46298, "epoch": 275} {"train_loss": -8.125066757202148, "global_step": 46299, "epoch": 275} {"train_loss": -8.221600532531738, "global_step": 46300, "epoch": 275} {"train_loss": -7.942570686340332, "global_step": 46301, "epoch": 275} {"train_loss": -8.222179412841797, "global_step": 46302, "epoch": 275} {"train_loss": -8.168937683105469, "global_step": 46303, "epoch": 275} {"train_loss": -8.24155044555664, "global_step": 46304, "epoch": 275} {"train_loss": -8.33454704284668, "global_step": 46305, "epoch": 275} {"train_loss": -8.247817993164062, "global_step": 46306, "epoch": 275} {"train_loss": -8.006580352783203, "global_step": 46307, "epoch": 275} {"train_loss": -8.398139953613281, "global_step": 46308, "epoch": 275} {"train_loss": -7.844928741455078, "global_step": 46309, "epoch": 275} {"train_loss": -8.383264541625977, "global_step": 46310, "epoch": 275} {"train_loss": -8.00675106048584, "global_step": 46311, "epoch": 275} {"train_loss": -8.450665473937988, "global_step": 46312, "epoch": 275} {"train_loss": -8.294940948486328, "global_step": 46313, "epoch": 275} {"train_loss": -8.084007263183594, "global_step": 46314, "epoch": 275} {"train_loss": -8.08720874786377, "global_step": 46315, "epoch": 275} {"train_loss": -8.174454689025879, "global_step": 46316, "epoch": 275} {"train_loss": -8.195660591125488, "global_step": 46317, "epoch": 275} {"train_loss": -8.085582733154297, "global_step": 46318, "epoch": 275} {"train_loss": -8.197357177734375, "global_step": 46319, "epoch": 275} {"train_loss": -8.239498138427734, "global_step": 46320, "epoch": 275} {"train_loss": -8.13079833984375, "global_step": 46321, "epoch": 275} {"train_loss": -8.161702156066895, "global_step": 46322, "epoch": 275} {"train_loss": -8.326411247253418, "global_step": 46323, "epoch": 275} {"train_loss": -7.938040256500244, "global_step": 46324, "epoch": 275} {"train_loss": -8.2474365234375, "global_step": 46325, "epoch": 275} {"train_loss": -7.990829944610596, "global_step": 46326, "epoch": 275} {"train_loss": -8.201155662536621, "global_step": 46327, "epoch": 275} {"train_loss": -8.216934204101562, "global_step": 46328, "epoch": 275} {"train_loss": -8.108217239379883, "global_step": 46329, "epoch": 275} {"train_loss": -8.000775337219238, "global_step": 46330, "epoch": 275} {"train_loss": -8.440254211425781, "global_step": 46331, "epoch": 275} {"train_loss": -8.046466827392578, "global_step": 46332, "epoch": 275} {"train_loss": -8.292930603027344, "global_step": 46333, "epoch": 275} {"train_loss": -8.024712562561035, "global_step": 46334, "epoch": 275} {"train_loss": -8.100324630737305, "global_step": 46335, "epoch": 275} {"train_loss": -8.10791015625, "global_step": 46336, "epoch": 275} {"train_loss": -8.161843299865723, "global_step": 46337, "epoch": 275} {"train_loss": -8.256619453430176, "global_step": 46338, "epoch": 275} {"train_loss": -8.17551040649414, "global_step": 46339, "epoch": 275} {"train_loss": -8.295635223388672, "global_step": 46340, "epoch": 275} {"train_loss": -8.131322860717773, "global_step": 46341, "epoch": 275} {"train_loss": -8.048418998718262, "global_step": 46342, "epoch": 275} {"train_loss": -8.146830558776855, "global_step": 46343, "epoch": 275} {"train_loss": -8.103145599365234, "global_step": 46344, "epoch": 275} {"train_loss": -8.19680404663086, "global_step": 46345, "epoch": 275} {"train_loss": -8.17707347869873, "global_step": 46346, "epoch": 275} {"train_loss": -8.36241340637207, "global_step": 46347, "epoch": 275} {"train_loss": -8.247085571289062, "global_step": 46348, "epoch": 275} {"train_loss": -8.11079216003418, "global_step": 46349, "epoch": 275} {"train_loss": -8.274026870727539, "global_step": 46350, "epoch": 275} {"train_loss": -8.404172897338867, "global_step": 46351, "epoch": 275} {"train_loss": -8.237009048461914, "global_step": 46352, "epoch": 275} {"train_loss": -8.239782333374023, "global_step": 46353, "epoch": 275} {"train_loss": -8.133771896362305, "global_step": 46354, "epoch": 275} {"train_loss": -8.358003616333008, "global_step": 46355, "epoch": 275} {"train_loss": -8.32097053527832, "global_step": 46356, "epoch": 275} {"train_loss": -8.203181266784668, "global_step": 46357, "epoch": 275} {"train_loss": -8.204835891723633, "global_step": 46358, "epoch": 275} {"train_loss": -8.351091384887695, "global_step": 46359, "epoch": 275} {"train_loss": -8.233163833618164, "global_step": 46360, "epoch": 275} {"train_loss": -8.26518726348877, "global_step": 46361, "epoch": 275} {"train_loss": -8.202038764953613, "global_step": 46362, "epoch": 275} {"train_loss": -8.398519515991211, "global_step": 46363, "epoch": 275} {"train_loss": -8.043254852294922, "global_step": 46364, "epoch": 275} {"train_loss": -8.079378128051758, "global_step": 46365, "epoch": 275} {"train_loss": -8.131210327148438, "global_step": 46366, "epoch": 275} {"train_loss": -8.138933650084905, "global_step": 46367, "epoch": 275, "val_loss": 187558.28125, "train_action_mse_error": 5.886517524719238} {"train_loss": -8.209569931030273, "global_step": 46368, "epoch": 276} {"train_loss": -7.783848762512207, "global_step": 46369, "epoch": 276} {"train_loss": -8.007552146911621, "global_step": 46370, "epoch": 276} {"train_loss": -8.14283275604248, "global_step": 46371, "epoch": 276} {"train_loss": -7.98894739151001, "global_step": 46372, "epoch": 276} {"train_loss": -8.118350982666016, "global_step": 46373, "epoch": 276} {"train_loss": -7.969951152801514, "global_step": 46374, "epoch": 276} {"train_loss": -7.855806827545166, "global_step": 46375, "epoch": 276} {"train_loss": -8.157670021057129, "global_step": 46376, "epoch": 276} {"train_loss": -8.000014305114746, "global_step": 46377, "epoch": 276} {"train_loss": -7.9297308921813965, "global_step": 46378, "epoch": 276} {"train_loss": -8.154088973999023, "global_step": 46379, "epoch": 276} {"train_loss": -8.107969284057617, "global_step": 46380, "epoch": 276} {"train_loss": -7.965876579284668, "global_step": 46381, "epoch": 276} {"train_loss": -7.960913181304932, "global_step": 46382, "epoch": 276} {"train_loss": -8.336248397827148, "global_step": 46383, "epoch": 276} {"train_loss": -8.208637237548828, "global_step": 46384, "epoch": 276} {"train_loss": -8.01959228515625, "global_step": 46385, "epoch": 276} {"train_loss": -8.100255966186523, "global_step": 46386, "epoch": 276} {"train_loss": -8.00016975402832, "global_step": 46387, "epoch": 276} {"train_loss": -7.818193435668945, "global_step": 46388, "epoch": 276} {"train_loss": -8.137153625488281, "global_step": 46389, "epoch": 276} {"train_loss": -7.992596626281738, "global_step": 46390, "epoch": 276} {"train_loss": -8.044575691223145, "global_step": 46391, "epoch": 276} {"train_loss": -7.413745403289795, "global_step": 46392, "epoch": 276} {"train_loss": -8.148528099060059, "global_step": 46393, "epoch": 276} {"train_loss": -7.696221351623535, "global_step": 46394, "epoch": 276} {"train_loss": -7.834558963775635, "global_step": 46395, "epoch": 276} {"train_loss": -8.08506965637207, "global_step": 46396, "epoch": 276} {"train_loss": -7.9520769119262695, "global_step": 46397, "epoch": 276} {"train_loss": -7.6876325607299805, "global_step": 46398, "epoch": 276} {"train_loss": -8.131013870239258, "global_step": 46399, "epoch": 276} {"train_loss": -7.94171142578125, "global_step": 46400, "epoch": 276} {"train_loss": -8.165140151977539, "global_step": 46401, "epoch": 276} {"train_loss": -7.851805686950684, "global_step": 46402, "epoch": 276} {"train_loss": -8.016485214233398, "global_step": 46403, "epoch": 276} {"train_loss": -8.068812370300293, "global_step": 46404, "epoch": 276} {"train_loss": -7.925841808319092, "global_step": 46405, "epoch": 276} {"train_loss": -8.195905685424805, "global_step": 46406, "epoch": 276} {"train_loss": -8.108635902404785, "global_step": 46407, "epoch": 276} {"train_loss": -8.140087127685547, "global_step": 46408, "epoch": 276} {"train_loss": -8.13290023803711, "global_step": 46409, "epoch": 276} {"train_loss": -7.967523574829102, "global_step": 46410, "epoch": 276} {"train_loss": -8.072774887084961, "global_step": 46411, "epoch": 276} {"train_loss": -7.7736663818359375, "global_step": 46412, "epoch": 276} {"train_loss": -8.124753952026367, "global_step": 46413, "epoch": 276} {"train_loss": -7.909886360168457, "global_step": 46414, "epoch": 276} {"train_loss": -8.092994689941406, "global_step": 46415, "epoch": 276} {"train_loss": -8.16804027557373, "global_step": 46416, "epoch": 276} {"train_loss": -8.013132095336914, "global_step": 46417, "epoch": 276} {"train_loss": -8.041597366333008, "global_step": 46418, "epoch": 276} {"train_loss": -8.136602401733398, "global_step": 46419, "epoch": 276} {"train_loss": -8.282552719116211, "global_step": 46420, "epoch": 276} {"train_loss": -8.19465446472168, "global_step": 46421, "epoch": 276} {"train_loss": -8.195472717285156, "global_step": 46422, "epoch": 276} {"train_loss": -8.233078002929688, "global_step": 46423, "epoch": 276} {"train_loss": -8.2925386428833, "global_step": 46424, "epoch": 276} {"train_loss": -8.356317520141602, "global_step": 46425, "epoch": 276} {"train_loss": -8.43755054473877, "global_step": 46426, "epoch": 276} {"train_loss": -8.299079895019531, "global_step": 46427, "epoch": 276} {"train_loss": -8.275965690612793, "global_step": 46428, "epoch": 276} {"train_loss": -8.136062622070312, "global_step": 46429, "epoch": 276} {"train_loss": -8.086174011230469, "global_step": 46430, "epoch": 276} {"train_loss": -8.315160751342773, "global_step": 46431, "epoch": 276} {"train_loss": -8.362530708312988, "global_step": 46432, "epoch": 276} {"train_loss": -8.15546989440918, "global_step": 46433, "epoch": 276} {"train_loss": -8.172496795654297, "global_step": 46434, "epoch": 276} {"train_loss": -8.090339660644531, "global_step": 46435, "epoch": 276} {"train_loss": -8.031091690063477, "global_step": 46436, "epoch": 276} {"train_loss": -8.17222785949707, "global_step": 46437, "epoch": 276} {"train_loss": -8.00278377532959, "global_step": 46438, "epoch": 276} {"train_loss": -7.88185977935791, "global_step": 46439, "epoch": 276} {"train_loss": -7.904301643371582, "global_step": 46440, "epoch": 276} {"train_loss": -8.269257545471191, "global_step": 46441, "epoch": 276} {"train_loss": -7.843019485473633, "global_step": 46442, "epoch": 276} {"train_loss": -7.994473934173584, "global_step": 46443, "epoch": 276} {"train_loss": -8.051593780517578, "global_step": 46444, "epoch": 276} {"train_loss": -7.977019309997559, "global_step": 46445, "epoch": 276} {"train_loss": -8.073838233947754, "global_step": 46446, "epoch": 276} {"train_loss": -8.00747299194336, "global_step": 46447, "epoch": 276} {"train_loss": -8.03311538696289, "global_step": 46448, "epoch": 276} {"train_loss": -7.996939182281494, "global_step": 46449, "epoch": 276} {"train_loss": -8.013944625854492, "global_step": 46450, "epoch": 276} {"train_loss": -7.837785720825195, "global_step": 46451, "epoch": 276} {"train_loss": -8.049476623535156, "global_step": 46452, "epoch": 276} {"train_loss": -8.188108444213867, "global_step": 46453, "epoch": 276} {"train_loss": -8.102129936218262, "global_step": 46454, "epoch": 276} {"train_loss": -8.032649993896484, "global_step": 46455, "epoch": 276} {"train_loss": -7.968939781188965, "global_step": 46456, "epoch": 276} {"train_loss": -8.051946640014648, "global_step": 46457, "epoch": 276} {"train_loss": -8.172798156738281, "global_step": 46458, "epoch": 276} {"train_loss": -8.172069549560547, "global_step": 46459, "epoch": 276} {"train_loss": -8.195777893066406, "global_step": 46460, "epoch": 276} {"train_loss": -8.237247467041016, "global_step": 46461, "epoch": 276} {"train_loss": -8.06116771697998, "global_step": 46462, "epoch": 276} {"train_loss": -8.255990982055664, "global_step": 46463, "epoch": 276} {"train_loss": -8.131369590759277, "global_step": 46464, "epoch": 276} {"train_loss": -8.308603286743164, "global_step": 46465, "epoch": 276} {"train_loss": -8.052001953125, "global_step": 46466, "epoch": 276} {"train_loss": -8.378114700317383, "global_step": 46467, "epoch": 276} {"train_loss": -8.237207412719727, "global_step": 46468, "epoch": 276} {"train_loss": -8.291207313537598, "global_step": 46469, "epoch": 276} {"train_loss": -8.364448547363281, "global_step": 46470, "epoch": 276} {"train_loss": -8.205914497375488, "global_step": 46471, "epoch": 276} {"train_loss": -8.40311336517334, "global_step": 46472, "epoch": 276} {"train_loss": -8.470954895019531, "global_step": 46473, "epoch": 276} {"train_loss": -8.244686126708984, "global_step": 46474, "epoch": 276} {"train_loss": -8.209551811218262, "global_step": 46475, "epoch": 276} {"train_loss": -8.02166748046875, "global_step": 46476, "epoch": 276} {"train_loss": -7.6294846534729, "global_step": 46477, "epoch": 276} {"train_loss": -8.286495208740234, "global_step": 46478, "epoch": 276} {"train_loss": -7.984961032867432, "global_step": 46479, "epoch": 276} {"train_loss": -8.099489212036133, "global_step": 46480, "epoch": 276} {"train_loss": -8.056143760681152, "global_step": 46481, "epoch": 276} {"train_loss": -8.41721248626709, "global_step": 46482, "epoch": 276} {"train_loss": -8.065542221069336, "global_step": 46483, "epoch": 276} {"train_loss": -8.355352401733398, "global_step": 46484, "epoch": 276} {"train_loss": -8.023148536682129, "global_step": 46485, "epoch": 276} {"train_loss": -8.186978340148926, "global_step": 46486, "epoch": 276} {"train_loss": -8.032320022583008, "global_step": 46487, "epoch": 276} {"train_loss": -8.09242057800293, "global_step": 46488, "epoch": 276} {"train_loss": -8.111991882324219, "global_step": 46489, "epoch": 276} {"train_loss": -7.963517189025879, "global_step": 46490, "epoch": 276} {"train_loss": -8.236495971679688, "global_step": 46491, "epoch": 276} {"train_loss": -8.203577995300293, "global_step": 46492, "epoch": 276} {"train_loss": -8.211512565612793, "global_step": 46493, "epoch": 276} {"train_loss": -7.950631618499756, "global_step": 46494, "epoch": 276} {"train_loss": -7.773906707763672, "global_step": 46495, "epoch": 276} {"train_loss": -8.07444953918457, "global_step": 46496, "epoch": 276} {"train_loss": -8.047910690307617, "global_step": 46497, "epoch": 276} {"train_loss": -8.10836124420166, "global_step": 46498, "epoch": 276} {"train_loss": -7.907164573669434, "global_step": 46499, "epoch": 276} {"train_loss": -7.98360538482666, "global_step": 46500, "epoch": 276} {"train_loss": -7.846733570098877, "global_step": 46501, "epoch": 276} {"train_loss": -7.770642280578613, "global_step": 46502, "epoch": 276} {"train_loss": -8.09640121459961, "global_step": 46503, "epoch": 276} {"train_loss": -7.853048324584961, "global_step": 46504, "epoch": 276} {"train_loss": -8.111970901489258, "global_step": 46505, "epoch": 276} {"train_loss": -8.06131649017334, "global_step": 46506, "epoch": 276} {"train_loss": -7.947442054748535, "global_step": 46507, "epoch": 276} {"train_loss": -8.055240631103516, "global_step": 46508, "epoch": 276} {"train_loss": -7.9905571937561035, "global_step": 46509, "epoch": 276} {"train_loss": -7.720308780670166, "global_step": 46510, "epoch": 276} {"train_loss": -7.9704999923706055, "global_step": 46511, "epoch": 276} {"train_loss": -7.8949127197265625, "global_step": 46512, "epoch": 276} {"train_loss": -8.017210006713867, "global_step": 46513, "epoch": 276} {"train_loss": -8.275742530822754, "global_step": 46514, "epoch": 276} {"train_loss": -8.269222259521484, "global_step": 46515, "epoch": 276} {"train_loss": -8.242416381835938, "global_step": 46516, "epoch": 276} {"train_loss": -8.092022895812988, "global_step": 46517, "epoch": 276} {"train_loss": -8.042755126953125, "global_step": 46518, "epoch": 276} {"train_loss": -8.179683685302734, "global_step": 46519, "epoch": 276} {"train_loss": -7.932906150817871, "global_step": 46520, "epoch": 276} {"train_loss": -8.343772888183594, "global_step": 46521, "epoch": 276} {"train_loss": -8.019896507263184, "global_step": 46522, "epoch": 276} {"train_loss": -8.224512100219727, "global_step": 46523, "epoch": 276} {"train_loss": -8.102783203125, "global_step": 46524, "epoch": 276} {"train_loss": -8.135172843933105, "global_step": 46525, "epoch": 276} {"train_loss": -7.996743202209473, "global_step": 46526, "epoch": 276} {"train_loss": -7.96455717086792, "global_step": 46527, "epoch": 276} {"train_loss": -8.37663745880127, "global_step": 46528, "epoch": 276} {"train_loss": -8.04804801940918, "global_step": 46529, "epoch": 276} {"train_loss": -8.168161392211914, "global_step": 46530, "epoch": 276} {"train_loss": -8.18150520324707, "global_step": 46531, "epoch": 276} {"train_loss": -8.059503555297852, "global_step": 46532, "epoch": 276} {"train_loss": -8.160094261169434, "global_step": 46533, "epoch": 276} {"train_loss": -8.373252868652344, "global_step": 46534, "epoch": 276} {"train_loss": -8.08453688451222, "global_step": 46535, "epoch": 276, "val_loss": 184832.734375} {"train_loss": -8.04747200012207, "global_step": 46536, "epoch": 277} {"train_loss": -8.078624725341797, "global_step": 46537, "epoch": 277} {"train_loss": -8.001067161560059, "global_step": 46538, "epoch": 277} {"train_loss": -8.118696212768555, "global_step": 46539, "epoch": 277} {"train_loss": -8.415499687194824, "global_step": 46540, "epoch": 277} {"train_loss": -8.096848487854004, "global_step": 46541, "epoch": 277} {"train_loss": -8.115365028381348, "global_step": 46542, "epoch": 277} {"train_loss": -8.170063972473145, "global_step": 46543, "epoch": 277} {"train_loss": -8.209046363830566, "global_step": 46544, "epoch": 277} {"train_loss": -8.31264877319336, "global_step": 46545, "epoch": 277} {"train_loss": -8.418388366699219, "global_step": 46546, "epoch": 277} {"train_loss": -8.208455085754395, "global_step": 46547, "epoch": 277} {"train_loss": -8.133644104003906, "global_step": 46548, "epoch": 277} {"train_loss": -8.23581314086914, "global_step": 46549, "epoch": 277} {"train_loss": -8.372947692871094, "global_step": 46550, "epoch": 277} {"train_loss": -8.467462539672852, "global_step": 46551, "epoch": 277} {"train_loss": -8.088554382324219, "global_step": 46552, "epoch": 277} {"train_loss": -8.271101951599121, "global_step": 46553, "epoch": 277} {"train_loss": -8.3989839553833, "global_step": 46554, "epoch": 277} {"train_loss": -8.375682830810547, "global_step": 46555, "epoch": 277} {"train_loss": -8.412460327148438, "global_step": 46556, "epoch": 277} {"train_loss": -8.264829635620117, "global_step": 46557, "epoch": 277} {"train_loss": -8.170438766479492, "global_step": 46558, "epoch": 277} {"train_loss": -8.245058059692383, "global_step": 46559, "epoch": 277} {"train_loss": -8.30982780456543, "global_step": 46560, "epoch": 277} {"train_loss": -8.251080513000488, "global_step": 46561, "epoch": 277} {"train_loss": -8.294071197509766, "global_step": 46562, "epoch": 277} {"train_loss": -8.213052749633789, "global_step": 46563, "epoch": 277} {"train_loss": -8.125375747680664, "global_step": 46564, "epoch": 277} {"train_loss": -8.513137817382812, "global_step": 46565, "epoch": 277} {"train_loss": -8.10706901550293, "global_step": 46566, "epoch": 277} {"train_loss": -8.393889427185059, "global_step": 46567, "epoch": 277} {"train_loss": -8.253125190734863, "global_step": 46568, "epoch": 277} {"train_loss": -8.214962005615234, "global_step": 46569, "epoch": 277} {"train_loss": -8.390218734741211, "global_step": 46570, "epoch": 277} {"train_loss": -7.966785430908203, "global_step": 46571, "epoch": 277} {"train_loss": -8.184873580932617, "global_step": 46572, "epoch": 277} {"train_loss": -8.394262313842773, "global_step": 46573, "epoch": 277} {"train_loss": -8.258808135986328, "global_step": 46574, "epoch": 277} {"train_loss": -8.008784294128418, "global_step": 46575, "epoch": 277} {"train_loss": -8.19432258605957, "global_step": 46576, "epoch": 277} {"train_loss": -8.404930114746094, "global_step": 46577, "epoch": 277} {"train_loss": -8.18997573852539, "global_step": 46578, "epoch": 277} {"train_loss": -8.137371063232422, "global_step": 46579, "epoch": 277} {"train_loss": -8.14833927154541, "global_step": 46580, "epoch": 277} {"train_loss": -8.099199295043945, "global_step": 46581, "epoch": 277} {"train_loss": -7.7802324295043945, "global_step": 46582, "epoch": 277} {"train_loss": -8.210756301879883, "global_step": 46583, "epoch": 277} {"train_loss": -8.214134216308594, "global_step": 46584, "epoch": 277} {"train_loss": -8.121240615844727, "global_step": 46585, "epoch": 277} {"train_loss": -8.349954605102539, "global_step": 46586, "epoch": 277} {"train_loss": -8.276939392089844, "global_step": 46587, "epoch": 277} {"train_loss": -8.002584457397461, "global_step": 46588, "epoch": 277} {"train_loss": -8.17591667175293, "global_step": 46589, "epoch": 277} {"train_loss": -8.344259262084961, "global_step": 46590, "epoch": 277} {"train_loss": -8.38700008392334, "global_step": 46591, "epoch": 277} {"train_loss": -8.117769241333008, "global_step": 46592, "epoch": 277} {"train_loss": -8.361831665039062, "global_step": 46593, "epoch": 277} {"train_loss": -8.206914901733398, "global_step": 46594, "epoch": 277} {"train_loss": -8.32781982421875, "global_step": 46595, "epoch": 277} {"train_loss": -8.274349212646484, "global_step": 46596, "epoch": 277} {"train_loss": -8.377460479736328, "global_step": 46597, "epoch": 277} {"train_loss": -8.253246307373047, "global_step": 46598, "epoch": 277} {"train_loss": -8.367916107177734, "global_step": 46599, "epoch": 277} {"train_loss": -8.310980796813965, "global_step": 46600, "epoch": 277} {"train_loss": -8.165534973144531, "global_step": 46601, "epoch": 277} {"train_loss": -8.188240051269531, "global_step": 46602, "epoch": 277} {"train_loss": -8.344386100769043, "global_step": 46603, "epoch": 277} {"train_loss": -8.240449905395508, "global_step": 46604, "epoch": 277} {"train_loss": -8.518884658813477, "global_step": 46605, "epoch": 277} {"train_loss": -8.015195846557617, "global_step": 46606, "epoch": 277} {"train_loss": -8.306692123413086, "global_step": 46607, "epoch": 277} {"train_loss": -8.234325408935547, "global_step": 46608, "epoch": 277} {"train_loss": -8.336629867553711, "global_step": 46609, "epoch": 277} {"train_loss": -8.008742332458496, "global_step": 46610, "epoch": 277} {"train_loss": -8.45480728149414, "global_step": 46611, "epoch": 277} {"train_loss": -8.341083526611328, "global_step": 46612, "epoch": 277} {"train_loss": -8.310020446777344, "global_step": 46613, "epoch": 277} {"train_loss": -7.990389823913574, "global_step": 46614, "epoch": 277} {"train_loss": -7.980275630950928, "global_step": 46615, "epoch": 277} {"train_loss": -8.251386642456055, "global_step": 46616, "epoch": 277} {"train_loss": -8.371292114257812, "global_step": 46617, "epoch": 277} {"train_loss": -8.230634689331055, "global_step": 46618, "epoch": 277} {"train_loss": -8.023557662963867, "global_step": 46619, "epoch": 277} {"train_loss": -8.16038703918457, "global_step": 46620, "epoch": 277} {"train_loss": -8.016630172729492, "global_step": 46621, "epoch": 277} {"train_loss": -8.242082595825195, "global_step": 46622, "epoch": 277} {"train_loss": -7.828296661376953, "global_step": 46623, "epoch": 277} {"train_loss": -8.189788818359375, "global_step": 46624, "epoch": 277} {"train_loss": -8.19383430480957, "global_step": 46625, "epoch": 277} {"train_loss": -8.364160537719727, "global_step": 46626, "epoch": 277} {"train_loss": -8.159171104431152, "global_step": 46627, "epoch": 277} {"train_loss": -8.458069801330566, "global_step": 46628, "epoch": 277} {"train_loss": -8.13854694366455, "global_step": 46629, "epoch": 277} {"train_loss": -8.144200325012207, "global_step": 46630, "epoch": 277} {"train_loss": -7.991593360900879, "global_step": 46631, "epoch": 277} {"train_loss": -8.170792579650879, "global_step": 46632, "epoch": 277} {"train_loss": -8.151456832885742, "global_step": 46633, "epoch": 277} {"train_loss": -7.964075088500977, "global_step": 46634, "epoch": 277} {"train_loss": -8.410419464111328, "global_step": 46635, "epoch": 277} {"train_loss": -7.752295017242432, "global_step": 46636, "epoch": 277} {"train_loss": -8.260016441345215, "global_step": 46637, "epoch": 277} {"train_loss": -8.046417236328125, "global_step": 46638, "epoch": 277} {"train_loss": -8.289369583129883, "global_step": 46639, "epoch": 277} {"train_loss": -8.229425430297852, "global_step": 46640, "epoch": 277} {"train_loss": -8.239845275878906, "global_step": 46641, "epoch": 277} {"train_loss": -8.178853988647461, "global_step": 46642, "epoch": 277} {"train_loss": -8.01930046081543, "global_step": 46643, "epoch": 277} {"train_loss": -8.073081970214844, "global_step": 46644, "epoch": 277} {"train_loss": -8.223896026611328, "global_step": 46645, "epoch": 277} {"train_loss": -8.292510986328125, "global_step": 46646, "epoch": 277} {"train_loss": -8.361978530883789, "global_step": 46647, "epoch": 277} {"train_loss": -8.187694549560547, "global_step": 46648, "epoch": 277} {"train_loss": -8.073283195495605, "global_step": 46649, "epoch": 277} {"train_loss": -8.190369606018066, "global_step": 46650, "epoch": 277} {"train_loss": -8.284629821777344, "global_step": 46651, "epoch": 277} {"train_loss": -7.930438995361328, "global_step": 46652, "epoch": 277} {"train_loss": -8.138213157653809, "global_step": 46653, "epoch": 277} {"train_loss": -8.245423316955566, "global_step": 46654, "epoch": 277} {"train_loss": -8.085317611694336, "global_step": 46655, "epoch": 277} {"train_loss": -8.12555980682373, "global_step": 46656, "epoch": 277} {"train_loss": -7.9147186279296875, "global_step": 46657, "epoch": 277} {"train_loss": -8.110139846801758, "global_step": 46658, "epoch": 277} {"train_loss": -8.011263847351074, "global_step": 46659, "epoch": 277} {"train_loss": -8.22834587097168, "global_step": 46660, "epoch": 277} {"train_loss": -8.16609001159668, "global_step": 46661, "epoch": 277} {"train_loss": -8.291675567626953, "global_step": 46662, "epoch": 277} {"train_loss": -8.065611839294434, "global_step": 46663, "epoch": 277} {"train_loss": -8.196371078491211, "global_step": 46664, "epoch": 277} {"train_loss": -8.055864334106445, "global_step": 46665, "epoch": 277} {"train_loss": -8.05384635925293, "global_step": 46666, "epoch": 277} {"train_loss": -8.155783653259277, "global_step": 46667, "epoch": 277} {"train_loss": -8.168548583984375, "global_step": 46668, "epoch": 277} {"train_loss": -8.084497451782227, "global_step": 46669, "epoch": 277} {"train_loss": -8.028839111328125, "global_step": 46670, "epoch": 277} {"train_loss": -8.20095443725586, "global_step": 46671, "epoch": 277} {"train_loss": -8.2041597366333, "global_step": 46672, "epoch": 277} {"train_loss": -8.223709106445312, "global_step": 46673, "epoch": 277} {"train_loss": -8.110289573669434, "global_step": 46674, "epoch": 277} {"train_loss": -8.244935989379883, "global_step": 46675, "epoch": 277} {"train_loss": -8.065642356872559, "global_step": 46676, "epoch": 277} {"train_loss": -8.145078659057617, "global_step": 46677, "epoch": 277} {"train_loss": -8.27939510345459, "global_step": 46678, "epoch": 277} {"train_loss": -8.169267654418945, "global_step": 46679, "epoch": 277} {"train_loss": -8.008691787719727, "global_step": 46680, "epoch": 277} {"train_loss": -8.27746295928955, "global_step": 46681, "epoch": 277} {"train_loss": -8.11369800567627, "global_step": 46682, "epoch": 277} {"train_loss": -8.105245590209961, "global_step": 46683, "epoch": 277} {"train_loss": -8.166295051574707, "global_step": 46684, "epoch": 277} {"train_loss": -8.248332977294922, "global_step": 46685, "epoch": 277} {"train_loss": -8.165102005004883, "global_step": 46686, "epoch": 277} {"train_loss": -8.065363883972168, "global_step": 46687, "epoch": 277} {"train_loss": -8.205997467041016, "global_step": 46688, "epoch": 277} {"train_loss": -8.167325019836426, "global_step": 46689, "epoch": 277} {"train_loss": -8.159296989440918, "global_step": 46690, "epoch": 277} {"train_loss": -8.099130630493164, "global_step": 46691, "epoch": 277} {"train_loss": -7.992968559265137, "global_step": 46692, "epoch": 277} {"train_loss": -8.261509895324707, "global_step": 46693, "epoch": 277} {"train_loss": -8.198213577270508, "global_step": 46694, "epoch": 277} {"train_loss": -8.265310287475586, "global_step": 46695, "epoch": 277} {"train_loss": -8.138557434082031, "global_step": 46696, "epoch": 277} {"train_loss": -8.28087043762207, "global_step": 46697, "epoch": 277} {"train_loss": -8.402955055236816, "global_step": 46698, "epoch": 277} {"train_loss": -8.226799011230469, "global_step": 46699, "epoch": 277} {"train_loss": -8.432498931884766, "global_step": 46700, "epoch": 277} {"train_loss": -8.15007209777832, "global_step": 46701, "epoch": 277} {"train_loss": -8.292879104614258, "global_step": 46702, "epoch": 277} {"train_loss": -8.195818401518322, "global_step": 46703, "epoch": 277, "val_loss": 188030.78125} {"train_loss": -7.956603527069092, "global_step": 46704, "epoch": 278} {"train_loss": -7.996353626251221, "global_step": 46705, "epoch": 278} {"train_loss": -8.176411628723145, "global_step": 46706, "epoch": 278} {"train_loss": -8.004996299743652, "global_step": 46707, "epoch": 278} {"train_loss": -8.213991165161133, "global_step": 46708, "epoch": 278} {"train_loss": -8.575684547424316, "global_step": 46709, "epoch": 278} {"train_loss": -8.28586483001709, "global_step": 46710, "epoch": 278} {"train_loss": -8.052132606506348, "global_step": 46711, "epoch": 278} {"train_loss": -8.157167434692383, "global_step": 46712, "epoch": 278} {"train_loss": -8.083605766296387, "global_step": 46713, "epoch": 278} {"train_loss": -8.236967086791992, "global_step": 46714, "epoch": 278} {"train_loss": -8.247159004211426, "global_step": 46715, "epoch": 278} {"train_loss": -8.327293395996094, "global_step": 46716, "epoch": 278} {"train_loss": -8.187904357910156, "global_step": 46717, "epoch": 278} {"train_loss": -8.249874114990234, "global_step": 46718, "epoch": 278} {"train_loss": -8.147077560424805, "global_step": 46719, "epoch": 278} {"train_loss": -8.058542251586914, "global_step": 46720, "epoch": 278} {"train_loss": -7.870364665985107, "global_step": 46721, "epoch": 278} {"train_loss": -8.180083274841309, "global_step": 46722, "epoch": 278} {"train_loss": -8.214876174926758, "global_step": 46723, "epoch": 278} {"train_loss": -7.866459369659424, "global_step": 46724, "epoch": 278} {"train_loss": -8.09316635131836, "global_step": 46725, "epoch": 278} {"train_loss": -8.239482879638672, "global_step": 46726, "epoch": 278} {"train_loss": -8.06387710571289, "global_step": 46727, "epoch": 278} {"train_loss": -8.13038444519043, "global_step": 46728, "epoch": 278} {"train_loss": -8.364116668701172, "global_step": 46729, "epoch": 278} {"train_loss": -8.193826675415039, "global_step": 46730, "epoch": 278} {"train_loss": -7.898487567901611, "global_step": 46731, "epoch": 278} {"train_loss": -8.157455444335938, "global_step": 46732, "epoch": 278} {"train_loss": -8.065998077392578, "global_step": 46733, "epoch": 278} {"train_loss": -8.238118171691895, "global_step": 46734, "epoch": 278} {"train_loss": -7.942413330078125, "global_step": 46735, "epoch": 278} {"train_loss": -8.355790138244629, "global_step": 46736, "epoch": 278} {"train_loss": -7.717121124267578, "global_step": 46737, "epoch": 278} {"train_loss": -7.924489974975586, "global_step": 46738, "epoch": 278} {"train_loss": -7.957101345062256, "global_step": 46739, "epoch": 278} {"train_loss": -8.124974250793457, "global_step": 46740, "epoch": 278} {"train_loss": -7.577841758728027, "global_step": 46741, "epoch": 278} {"train_loss": -7.771209716796875, "global_step": 46742, "epoch": 278} {"train_loss": -7.726071834564209, "global_step": 46743, "epoch": 278} {"train_loss": -8.14610481262207, "global_step": 46744, "epoch": 278} {"train_loss": -7.974895477294922, "global_step": 46745, "epoch": 278} {"train_loss": -7.825359344482422, "global_step": 46746, "epoch": 278} {"train_loss": -7.946783542633057, "global_step": 46747, "epoch": 278} {"train_loss": -7.978305816650391, "global_step": 46748, "epoch": 278} {"train_loss": -7.748231887817383, "global_step": 46749, "epoch": 278} {"train_loss": -8.093622207641602, "global_step": 46750, "epoch": 278} {"train_loss": -8.137128829956055, "global_step": 46751, "epoch": 278} {"train_loss": -8.141189575195312, "global_step": 46752, "epoch": 278} {"train_loss": -7.832062721252441, "global_step": 46753, "epoch": 278} {"train_loss": -8.249284744262695, "global_step": 46754, "epoch": 278} {"train_loss": -7.967365741729736, "global_step": 46755, "epoch": 278} {"train_loss": -8.155645370483398, "global_step": 46756, "epoch": 278} {"train_loss": -8.112340927124023, "global_step": 46757, "epoch": 278} {"train_loss": -8.184770584106445, "global_step": 46758, "epoch": 278} {"train_loss": -7.845947742462158, "global_step": 46759, "epoch": 278} {"train_loss": -8.190176010131836, "global_step": 46760, "epoch": 278} {"train_loss": -8.348037719726562, "global_step": 46761, "epoch": 278} {"train_loss": -8.146005630493164, "global_step": 46762, "epoch": 278} {"train_loss": -8.25102424621582, "global_step": 46763, "epoch": 278} {"train_loss": -8.160045623779297, "global_step": 46764, "epoch": 278} {"train_loss": -8.171468734741211, "global_step": 46765, "epoch": 278} {"train_loss": -8.137615203857422, "global_step": 46766, "epoch": 278} {"train_loss": -8.23198413848877, "global_step": 46767, "epoch": 278} {"train_loss": -8.363702774047852, "global_step": 46768, "epoch": 278} {"train_loss": -8.324724197387695, "global_step": 46769, "epoch": 278} {"train_loss": -8.520586967468262, "global_step": 46770, "epoch": 278} {"train_loss": -8.167741775512695, "global_step": 46771, "epoch": 278} {"train_loss": -8.247802734375, "global_step": 46772, "epoch": 278} {"train_loss": -8.198537826538086, "global_step": 46773, "epoch": 278} {"train_loss": -8.216409683227539, "global_step": 46774, "epoch": 278} {"train_loss": -8.090227127075195, "global_step": 46775, "epoch": 278} {"train_loss": -8.282936096191406, "global_step": 46776, "epoch": 278} {"train_loss": -7.9872965812683105, "global_step": 46777, "epoch": 278} {"train_loss": -8.161396026611328, "global_step": 46778, "epoch": 278} {"train_loss": -8.139163970947266, "global_step": 46779, "epoch": 278} {"train_loss": -8.376255989074707, "global_step": 46780, "epoch": 278} {"train_loss": -8.04845905303955, "global_step": 46781, "epoch": 278} {"train_loss": -8.032212257385254, "global_step": 46782, "epoch": 278} {"train_loss": -8.376068115234375, "global_step": 46783, "epoch": 278} {"train_loss": -7.774229526519775, "global_step": 46784, "epoch": 278} {"train_loss": -7.9264960289001465, "global_step": 46785, "epoch": 278} {"train_loss": -7.703897476196289, "global_step": 46786, "epoch": 278} {"train_loss": -7.901611328125, "global_step": 46787, "epoch": 278} {"train_loss": -8.018878936767578, "global_step": 46788, "epoch": 278} {"train_loss": -8.225738525390625, "global_step": 46789, "epoch": 278} {"train_loss": -7.816802024841309, "global_step": 46790, "epoch": 278} {"train_loss": -8.126495361328125, "global_step": 46791, "epoch": 278} {"train_loss": -7.8820929527282715, "global_step": 46792, "epoch": 278} {"train_loss": -7.930583953857422, "global_step": 46793, "epoch": 278} {"train_loss": -8.194351196289062, "global_step": 46794, "epoch": 278} {"train_loss": -8.085027694702148, "global_step": 46795, "epoch": 278} {"train_loss": -8.005661010742188, "global_step": 46796, "epoch": 278} {"train_loss": -8.106039047241211, "global_step": 46797, "epoch": 278} {"train_loss": -8.314638137817383, "global_step": 46798, "epoch": 278} {"train_loss": -8.029555320739746, "global_step": 46799, "epoch": 278} {"train_loss": -8.027253150939941, "global_step": 46800, "epoch": 278} {"train_loss": -8.268226623535156, "global_step": 46801, "epoch": 278} {"train_loss": -8.101927757263184, "global_step": 46802, "epoch": 278} {"train_loss": -8.082244873046875, "global_step": 46803, "epoch": 278} {"train_loss": -8.139177322387695, "global_step": 46804, "epoch": 278} {"train_loss": -8.236387252807617, "global_step": 46805, "epoch": 278} {"train_loss": -8.182024002075195, "global_step": 46806, "epoch": 278} {"train_loss": -8.141027450561523, "global_step": 46807, "epoch": 278} {"train_loss": -8.267385482788086, "global_step": 46808, "epoch": 278} {"train_loss": -8.112577438354492, "global_step": 46809, "epoch": 278} {"train_loss": -8.200494766235352, "global_step": 46810, "epoch": 278} {"train_loss": -8.4475679397583, "global_step": 46811, "epoch": 278} {"train_loss": -8.478498458862305, "global_step": 46812, "epoch": 278} {"train_loss": -8.309591293334961, "global_step": 46813, "epoch": 278} {"train_loss": -8.31365966796875, "global_step": 46814, "epoch": 278} {"train_loss": -8.213838577270508, "global_step": 46815, "epoch": 278} {"train_loss": -8.449335098266602, "global_step": 46816, "epoch": 278} {"train_loss": -8.040136337280273, "global_step": 46817, "epoch": 278} {"train_loss": -8.070837020874023, "global_step": 46818, "epoch": 278} {"train_loss": -7.8796868324279785, "global_step": 46819, "epoch": 278} {"train_loss": -8.057292938232422, "global_step": 46820, "epoch": 278} {"train_loss": -8.154626846313477, "global_step": 46821, "epoch": 278} {"train_loss": -8.216495513916016, "global_step": 46822, "epoch": 278} {"train_loss": -7.995278835296631, "global_step": 46823, "epoch": 278} {"train_loss": -8.248825073242188, "global_step": 46824, "epoch": 278} {"train_loss": -7.847067832946777, "global_step": 46825, "epoch": 278} {"train_loss": -7.846456527709961, "global_step": 46826, "epoch": 278} {"train_loss": -8.044039726257324, "global_step": 46827, "epoch": 278} {"train_loss": -7.789768218994141, "global_step": 46828, "epoch": 278} {"train_loss": -8.16519832611084, "global_step": 46829, "epoch": 278} {"train_loss": -7.895875930786133, "global_step": 46830, "epoch": 278} {"train_loss": -8.055314064025879, "global_step": 46831, "epoch": 278} {"train_loss": -7.831594467163086, "global_step": 46832, "epoch": 278} {"train_loss": -8.058185577392578, "global_step": 46833, "epoch": 278} {"train_loss": -8.001272201538086, "global_step": 46834, "epoch": 278} {"train_loss": -8.142417907714844, "global_step": 46835, "epoch": 278} {"train_loss": -7.955041885375977, "global_step": 46836, "epoch": 278} {"train_loss": -7.928513526916504, "global_step": 46837, "epoch": 278} {"train_loss": -8.183454513549805, "global_step": 46838, "epoch": 278} {"train_loss": -8.03371810913086, "global_step": 46839, "epoch": 278} {"train_loss": -8.30640983581543, "global_step": 46840, "epoch": 278} {"train_loss": -8.274940490722656, "global_step": 46841, "epoch": 278} {"train_loss": -8.059394836425781, "global_step": 46842, "epoch": 278} {"train_loss": -7.9502081871032715, "global_step": 46843, "epoch": 278} {"train_loss": -8.044066429138184, "global_step": 46844, "epoch": 278} {"train_loss": -8.001670837402344, "global_step": 46845, "epoch": 278} {"train_loss": -7.9485697746276855, "global_step": 46846, "epoch": 278} {"train_loss": -8.099855422973633, "global_step": 46847, "epoch": 278} {"train_loss": -7.893484115600586, "global_step": 46848, "epoch": 278} {"train_loss": -8.20120620727539, "global_step": 46849, "epoch": 278} {"train_loss": -8.01049518585205, "global_step": 46850, "epoch": 278} {"train_loss": -8.260438919067383, "global_step": 46851, "epoch": 278} {"train_loss": -8.216320037841797, "global_step": 46852, "epoch": 278} {"train_loss": -8.14986801147461, "global_step": 46853, "epoch": 278} {"train_loss": -8.281728744506836, "global_step": 46854, "epoch": 278} {"train_loss": -8.304313659667969, "global_step": 46855, "epoch": 278} {"train_loss": -8.450565338134766, "global_step": 46856, "epoch": 278} {"train_loss": -8.14571762084961, "global_step": 46857, "epoch": 278} {"train_loss": -8.229132652282715, "global_step": 46858, "epoch": 278} {"train_loss": -8.342880249023438, "global_step": 46859, "epoch": 278} {"train_loss": -8.300287246704102, "global_step": 46860, "epoch": 278} {"train_loss": -8.442209243774414, "global_step": 46861, "epoch": 278} {"train_loss": -8.38067626953125, "global_step": 46862, "epoch": 278} {"train_loss": -8.375791549682617, "global_step": 46863, "epoch": 278} {"train_loss": -8.229642868041992, "global_step": 46864, "epoch": 278} {"train_loss": -8.435237884521484, "global_step": 46865, "epoch": 278} {"train_loss": -8.298683166503906, "global_step": 46866, "epoch": 278} {"train_loss": -8.308126449584961, "global_step": 46867, "epoch": 278} {"train_loss": -8.010201454162598, "global_step": 46868, "epoch": 278} {"train_loss": -8.443056106567383, "global_step": 46869, "epoch": 278} {"train_loss": -8.470399856567383, "global_step": 46870, "epoch": 278} {"train_loss": -8.123001541410174, "global_step": 46871, "epoch": 278, "val_loss": 189078.515625} {"train_loss": -8.069665908813477, "global_step": 46872, "epoch": 279} {"train_loss": -7.857917785644531, "global_step": 46873, "epoch": 279} {"train_loss": -8.075811386108398, "global_step": 46874, "epoch": 279} {"train_loss": -8.011665344238281, "global_step": 46875, "epoch": 279} {"train_loss": -8.022144317626953, "global_step": 46876, "epoch": 279} {"train_loss": -8.177421569824219, "global_step": 46877, "epoch": 279} {"train_loss": -7.948109149932861, "global_step": 46878, "epoch": 279} {"train_loss": -8.014883995056152, "global_step": 46879, "epoch": 279} {"train_loss": -8.367338180541992, "global_step": 46880, "epoch": 279} {"train_loss": -7.929974555969238, "global_step": 46881, "epoch": 279} {"train_loss": -8.413209915161133, "global_step": 46882, "epoch": 279} {"train_loss": -7.919926643371582, "global_step": 46883, "epoch": 279} {"train_loss": -8.140341758728027, "global_step": 46884, "epoch": 279} {"train_loss": -7.991067886352539, "global_step": 46885, "epoch": 279} {"train_loss": -8.299381256103516, "global_step": 46886, "epoch": 279} {"train_loss": -7.879348278045654, "global_step": 46887, "epoch": 279} {"train_loss": -8.22946548461914, "global_step": 46888, "epoch": 279} {"train_loss": -8.35181999206543, "global_step": 46889, "epoch": 279} {"train_loss": -7.984289169311523, "global_step": 46890, "epoch": 279} {"train_loss": -8.368188858032227, "global_step": 46891, "epoch": 279} {"train_loss": -8.029077529907227, "global_step": 46892, "epoch": 279} {"train_loss": -8.19638729095459, "global_step": 46893, "epoch": 279} {"train_loss": -8.238005638122559, "global_step": 46894, "epoch": 279} {"train_loss": -8.28194808959961, "global_step": 46895, "epoch": 279} {"train_loss": -8.398633003234863, "global_step": 46896, "epoch": 279} {"train_loss": -8.187684059143066, "global_step": 46897, "epoch": 279} {"train_loss": -8.1134033203125, "global_step": 46898, "epoch": 279} {"train_loss": -7.872817039489746, "global_step": 46899, "epoch": 279} {"train_loss": -8.221920013427734, "global_step": 46900, "epoch": 279} {"train_loss": -8.124914169311523, "global_step": 46901, "epoch": 279} {"train_loss": -8.107946395874023, "global_step": 46902, "epoch": 279} {"train_loss": -8.162030220031738, "global_step": 46903, "epoch": 279} {"train_loss": -8.154656410217285, "global_step": 46904, "epoch": 279} {"train_loss": -8.023008346557617, "global_step": 46905, "epoch": 279} {"train_loss": -8.38974666595459, "global_step": 46906, "epoch": 279} {"train_loss": -8.18268871307373, "global_step": 46907, "epoch": 279} {"train_loss": -8.122817993164062, "global_step": 46908, "epoch": 279} {"train_loss": -8.300434112548828, "global_step": 46909, "epoch": 279} {"train_loss": -8.138492584228516, "global_step": 46910, "epoch": 279} {"train_loss": -8.107236862182617, "global_step": 46911, "epoch": 279} {"train_loss": -8.198249816894531, "global_step": 46912, "epoch": 279} {"train_loss": -7.999260425567627, "global_step": 46913, "epoch": 279} {"train_loss": -7.8690009117126465, "global_step": 46914, "epoch": 279} {"train_loss": -8.09060001373291, "global_step": 46915, "epoch": 279} {"train_loss": -7.848600387573242, "global_step": 46916, "epoch": 279} {"train_loss": -8.017446517944336, "global_step": 46917, "epoch": 279} {"train_loss": -7.614462852478027, "global_step": 46918, "epoch": 279} {"train_loss": -8.19094181060791, "global_step": 46919, "epoch": 279} {"train_loss": -7.722124099731445, "global_step": 46920, "epoch": 279} {"train_loss": -8.030561447143555, "global_step": 46921, "epoch": 279} {"train_loss": -7.879558563232422, "global_step": 46922, "epoch": 279} {"train_loss": -8.050962448120117, "global_step": 46923, "epoch": 279} {"train_loss": -8.162885665893555, "global_step": 46924, "epoch": 279} {"train_loss": -7.90425968170166, "global_step": 46925, "epoch": 279} {"train_loss": -8.140229225158691, "global_step": 46926, "epoch": 279} {"train_loss": -7.990694046020508, "global_step": 46927, "epoch": 279} {"train_loss": -8.08765697479248, "global_step": 46928, "epoch": 279} {"train_loss": -7.943199157714844, "global_step": 46929, "epoch": 279} {"train_loss": -7.858287811279297, "global_step": 46930, "epoch": 279} {"train_loss": -8.049760818481445, "global_step": 46931, "epoch": 279} {"train_loss": -8.118192672729492, "global_step": 46932, "epoch": 279} {"train_loss": -8.258260726928711, "global_step": 46933, "epoch": 279} {"train_loss": -8.179769515991211, "global_step": 46934, "epoch": 279} {"train_loss": -8.203765869140625, "global_step": 46935, "epoch": 279} {"train_loss": -7.900519847869873, "global_step": 46936, "epoch": 279} {"train_loss": -7.959229946136475, "global_step": 46937, "epoch": 279} {"train_loss": -8.224578857421875, "global_step": 46938, "epoch": 279} {"train_loss": -8.020191192626953, "global_step": 46939, "epoch": 279} {"train_loss": -8.209527015686035, "global_step": 46940, "epoch": 279} {"train_loss": -8.179984092712402, "global_step": 46941, "epoch": 279} {"train_loss": -8.405722618103027, "global_step": 46942, "epoch": 279} {"train_loss": -8.228890419006348, "global_step": 46943, "epoch": 279} {"train_loss": -8.132105827331543, "global_step": 46944, "epoch": 279} {"train_loss": -8.010656356811523, "global_step": 46945, "epoch": 279} {"train_loss": -8.152156829833984, "global_step": 46946, "epoch": 279} {"train_loss": -8.131625175476074, "global_step": 46947, "epoch": 279} {"train_loss": -8.177059173583984, "global_step": 46948, "epoch": 279} {"train_loss": -8.299708366394043, "global_step": 46949, "epoch": 279} {"train_loss": -8.328393936157227, "global_step": 46950, "epoch": 279} {"train_loss": -8.070310592651367, "global_step": 46951, "epoch": 279} {"train_loss": -8.182779312133789, "global_step": 46952, "epoch": 279} {"train_loss": -8.091861724853516, "global_step": 46953, "epoch": 279} {"train_loss": -8.221949577331543, "global_step": 46954, "epoch": 279} {"train_loss": -8.377245903015137, "global_step": 46955, "epoch": 279} {"train_loss": -8.347160339355469, "global_step": 46956, "epoch": 279} {"train_loss": -8.154539108276367, "global_step": 46957, "epoch": 279} {"train_loss": -8.214615821838379, "global_step": 46958, "epoch": 279} {"train_loss": -8.144890785217285, "global_step": 46959, "epoch": 279} {"train_loss": -8.253089904785156, "global_step": 46960, "epoch": 279} {"train_loss": -8.19481086730957, "global_step": 46961, "epoch": 279} {"train_loss": -8.161666870117188, "global_step": 46962, "epoch": 279} {"train_loss": -8.396056175231934, "global_step": 46963, "epoch": 279} {"train_loss": -8.39157485961914, "global_step": 46964, "epoch": 279} {"train_loss": -8.252313613891602, "global_step": 46965, "epoch": 279} {"train_loss": -8.087202072143555, "global_step": 46966, "epoch": 279} {"train_loss": -8.302967071533203, "global_step": 46967, "epoch": 279} {"train_loss": -8.240140914916992, "global_step": 46968, "epoch": 279} {"train_loss": -8.25719165802002, "global_step": 46969, "epoch": 279} {"train_loss": -8.379125595092773, "global_step": 46970, "epoch": 279} {"train_loss": -8.112675666809082, "global_step": 46971, "epoch": 279} {"train_loss": -8.150976181030273, "global_step": 46972, "epoch": 279} {"train_loss": -8.404321670532227, "global_step": 46973, "epoch": 279} {"train_loss": -8.01138687133789, "global_step": 46974, "epoch": 279} {"train_loss": -8.069082260131836, "global_step": 46975, "epoch": 279} {"train_loss": -8.33363151550293, "global_step": 46976, "epoch": 279} {"train_loss": -8.14543628692627, "global_step": 46977, "epoch": 279} {"train_loss": -8.186117172241211, "global_step": 46978, "epoch": 279} {"train_loss": -8.180773735046387, "global_step": 46979, "epoch": 279} {"train_loss": -8.23369026184082, "global_step": 46980, "epoch": 279} {"train_loss": -8.336282730102539, "global_step": 46981, "epoch": 279} {"train_loss": -8.28331470489502, "global_step": 46982, "epoch": 279} {"train_loss": -8.352392196655273, "global_step": 46983, "epoch": 279} {"train_loss": -8.16820240020752, "global_step": 46984, "epoch": 279} {"train_loss": -8.269909858703613, "global_step": 46985, "epoch": 279} {"train_loss": -8.418079376220703, "global_step": 46986, "epoch": 279} {"train_loss": -8.220584869384766, "global_step": 46987, "epoch": 279} {"train_loss": -8.383968353271484, "global_step": 46988, "epoch": 279} {"train_loss": -8.365949630737305, "global_step": 46989, "epoch": 279} {"train_loss": -8.10257625579834, "global_step": 46990, "epoch": 279} {"train_loss": -8.283634185791016, "global_step": 46991, "epoch": 279} {"train_loss": -8.326000213623047, "global_step": 46992, "epoch": 279} {"train_loss": -8.430351257324219, "global_step": 46993, "epoch": 279} {"train_loss": -8.323850631713867, "global_step": 46994, "epoch": 279} {"train_loss": -8.447101593017578, "global_step": 46995, "epoch": 279} {"train_loss": -8.476461410522461, "global_step": 46996, "epoch": 279} {"train_loss": -8.423973083496094, "global_step": 46997, "epoch": 279} {"train_loss": -8.193448066711426, "global_step": 46998, "epoch": 279} {"train_loss": -8.290458679199219, "global_step": 46999, "epoch": 279} {"train_loss": -8.460480690002441, "global_step": 47000, "epoch": 279} {"train_loss": -8.335445404052734, "global_step": 47001, "epoch": 279} {"train_loss": -8.32352066040039, "global_step": 47002, "epoch": 279} {"train_loss": -8.127557754516602, "global_step": 47003, "epoch": 279} {"train_loss": -8.41877269744873, "global_step": 47004, "epoch": 279} {"train_loss": -8.336408615112305, "global_step": 47005, "epoch": 279} {"train_loss": -8.226164817810059, "global_step": 47006, "epoch": 279} {"train_loss": -8.551922798156738, "global_step": 47007, "epoch": 279} {"train_loss": -8.30131721496582, "global_step": 47008, "epoch": 279} {"train_loss": -8.37562370300293, "global_step": 47009, "epoch": 279} {"train_loss": -8.312701225280762, "global_step": 47010, "epoch": 279} {"train_loss": -8.134654998779297, "global_step": 47011, "epoch": 279} {"train_loss": -8.277303695678711, "global_step": 47012, "epoch": 279} {"train_loss": -8.413616180419922, "global_step": 47013, "epoch": 279} {"train_loss": -7.763782024383545, "global_step": 47014, "epoch": 279} {"train_loss": -8.470928192138672, "global_step": 47015, "epoch": 279} {"train_loss": -7.912676811218262, "global_step": 47016, "epoch": 279} {"train_loss": -8.339859008789062, "global_step": 47017, "epoch": 279} {"train_loss": -8.114679336547852, "global_step": 47018, "epoch": 279} {"train_loss": -7.914068698883057, "global_step": 47019, "epoch": 279} {"train_loss": -8.230602264404297, "global_step": 47020, "epoch": 279} {"train_loss": -7.789865970611572, "global_step": 47021, "epoch": 279} {"train_loss": -8.179615020751953, "global_step": 47022, "epoch": 279} {"train_loss": -8.094637870788574, "global_step": 47023, "epoch": 279} {"train_loss": -7.831721305847168, "global_step": 47024, "epoch": 279} {"train_loss": -8.154499053955078, "global_step": 47025, "epoch": 279} {"train_loss": -8.16720962524414, "global_step": 47026, "epoch": 279} {"train_loss": -8.146482467651367, "global_step": 47027, "epoch": 279} {"train_loss": -8.19793701171875, "global_step": 47028, "epoch": 279} {"train_loss": -8.373102188110352, "global_step": 47029, "epoch": 279} {"train_loss": -8.006006240844727, "global_step": 47030, "epoch": 279} {"train_loss": -8.136201858520508, "global_step": 47031, "epoch": 279} {"train_loss": -7.976171493530273, "global_step": 47032, "epoch": 279} {"train_loss": -8.118513107299805, "global_step": 47033, "epoch": 279} {"train_loss": -8.27768325805664, "global_step": 47034, "epoch": 279} {"train_loss": -8.384933471679688, "global_step": 47035, "epoch": 279} {"train_loss": -8.124465942382812, "global_step": 47036, "epoch": 279} {"train_loss": -8.168595314025879, "global_step": 47037, "epoch": 279} {"train_loss": -8.231931686401367, "global_step": 47038, "epoch": 279} {"train_loss": -8.170202087788354, "global_step": 47039, "epoch": 279, "val_loss": 186458.203125} {"train_loss": -8.362619400024414, "global_step": 47040, "epoch": 280} {"train_loss": -8.171003341674805, "global_step": 47041, "epoch": 280} {"train_loss": -8.178508758544922, "global_step": 47042, "epoch": 280} {"train_loss": -7.905241966247559, "global_step": 47043, "epoch": 280} {"train_loss": -8.141636848449707, "global_step": 47044, "epoch": 280} {"train_loss": -8.11365032196045, "global_step": 47045, "epoch": 280} {"train_loss": -7.927164554595947, "global_step": 47046, "epoch": 280} {"train_loss": -8.151765823364258, "global_step": 47047, "epoch": 280} {"train_loss": -8.17959976196289, "global_step": 47048, "epoch": 280} {"train_loss": -8.372308731079102, "global_step": 47049, "epoch": 280} {"train_loss": -8.212217330932617, "global_step": 47050, "epoch": 280} {"train_loss": -8.232154846191406, "global_step": 47051, "epoch": 280} {"train_loss": -8.312051773071289, "global_step": 47052, "epoch": 280} {"train_loss": -8.329279899597168, "global_step": 47053, "epoch": 280} {"train_loss": -8.160962104797363, "global_step": 47054, "epoch": 280} {"train_loss": -8.340493202209473, "global_step": 47055, "epoch": 280} {"train_loss": -8.309574127197266, "global_step": 47056, "epoch": 280} {"train_loss": -8.294981956481934, "global_step": 47057, "epoch": 280} {"train_loss": -8.245827674865723, "global_step": 47058, "epoch": 280} {"train_loss": -8.245027542114258, "global_step": 47059, "epoch": 280} {"train_loss": -8.164278030395508, "global_step": 47060, "epoch": 280} {"train_loss": -8.301889419555664, "global_step": 47061, "epoch": 280} {"train_loss": -8.227088928222656, "global_step": 47062, "epoch": 280} {"train_loss": -8.371659278869629, "global_step": 47063, "epoch": 280} {"train_loss": -8.21766471862793, "global_step": 47064, "epoch": 280} {"train_loss": -8.061711311340332, "global_step": 47065, "epoch": 280} {"train_loss": -8.221399307250977, "global_step": 47066, "epoch": 280} {"train_loss": -8.075019836425781, "global_step": 47067, "epoch": 280} {"train_loss": -7.908885955810547, "global_step": 47068, "epoch": 280} {"train_loss": -8.368581771850586, "global_step": 47069, "epoch": 280} {"train_loss": -8.015090942382812, "global_step": 47070, "epoch": 280} {"train_loss": -8.276375770568848, "global_step": 47071, "epoch": 280} {"train_loss": -8.022980690002441, "global_step": 47072, "epoch": 280} {"train_loss": -8.253543853759766, "global_step": 47073, "epoch": 280} {"train_loss": -8.215202331542969, "global_step": 47074, "epoch": 280} {"train_loss": -8.09521484375, "global_step": 47075, "epoch": 280} {"train_loss": -8.113676071166992, "global_step": 47076, "epoch": 280} {"train_loss": -8.421323776245117, "global_step": 47077, "epoch": 280} {"train_loss": -8.150917053222656, "global_step": 47078, "epoch": 280} {"train_loss": -7.894883632659912, "global_step": 47079, "epoch": 280} {"train_loss": -8.146383285522461, "global_step": 47080, "epoch": 280} {"train_loss": -8.158086776733398, "global_step": 47081, "epoch": 280} {"train_loss": -8.004658699035645, "global_step": 47082, "epoch": 280} {"train_loss": -8.115684509277344, "global_step": 47083, "epoch": 280} {"train_loss": -8.426855087280273, "global_step": 47084, "epoch": 280} {"train_loss": -8.081210136413574, "global_step": 47085, "epoch": 280} {"train_loss": -8.21843147277832, "global_step": 47086, "epoch": 280} {"train_loss": -8.22045612335205, "global_step": 47087, "epoch": 280} {"train_loss": -8.315016746520996, "global_step": 47088, "epoch": 280} {"train_loss": -8.3075590133667, "global_step": 47089, "epoch": 280} {"train_loss": -8.002437591552734, "global_step": 47090, "epoch": 280} {"train_loss": -8.196234703063965, "global_step": 47091, "epoch": 280} {"train_loss": -8.164579391479492, "global_step": 47092, "epoch": 280} {"train_loss": -8.106821060180664, "global_step": 47093, "epoch": 280} {"train_loss": -8.437078475952148, "global_step": 47094, "epoch": 280} {"train_loss": -8.137080192565918, "global_step": 47095, "epoch": 280} {"train_loss": -8.380125045776367, "global_step": 47096, "epoch": 280} {"train_loss": -8.088119506835938, "global_step": 47097, "epoch": 280} {"train_loss": -8.177218437194824, "global_step": 47098, "epoch": 280} {"train_loss": -8.051819801330566, "global_step": 47099, "epoch": 280} {"train_loss": -8.190431594848633, "global_step": 47100, "epoch": 280} {"train_loss": -8.206952095031738, "global_step": 47101, "epoch": 280} {"train_loss": -8.131178855895996, "global_step": 47102, "epoch": 280} {"train_loss": -8.024919509887695, "global_step": 47103, "epoch": 280} {"train_loss": -7.769657135009766, "global_step": 47104, "epoch": 280} {"train_loss": -8.160842895507812, "global_step": 47105, "epoch": 280} {"train_loss": -8.120655059814453, "global_step": 47106, "epoch": 280} {"train_loss": -8.446557998657227, "global_step": 47107, "epoch": 280} {"train_loss": -8.000324249267578, "global_step": 47108, "epoch": 280} {"train_loss": -8.134557723999023, "global_step": 47109, "epoch": 280} {"train_loss": -8.363780975341797, "global_step": 47110, "epoch": 280} {"train_loss": -8.141717910766602, "global_step": 47111, "epoch": 280} {"train_loss": -8.175804138183594, "global_step": 47112, "epoch": 280} {"train_loss": -8.1536865234375, "global_step": 47113, "epoch": 280} {"train_loss": -8.34353256225586, "global_step": 47114, "epoch": 280} {"train_loss": -8.214799880981445, "global_step": 47115, "epoch": 280} {"train_loss": -8.168279647827148, "global_step": 47116, "epoch": 280} {"train_loss": -8.285486221313477, "global_step": 47117, "epoch": 280} {"train_loss": -8.047928810119629, "global_step": 47118, "epoch": 280} {"train_loss": -8.095636367797852, "global_step": 47119, "epoch": 280} {"train_loss": -8.010523796081543, "global_step": 47120, "epoch": 280} {"train_loss": -8.370028495788574, "global_step": 47121, "epoch": 280} {"train_loss": -8.308507919311523, "global_step": 47122, "epoch": 280} {"train_loss": -8.229131698608398, "global_step": 47123, "epoch": 280} {"train_loss": -8.302918434143066, "global_step": 47124, "epoch": 280} {"train_loss": -8.22542953491211, "global_step": 47125, "epoch": 280} {"train_loss": -8.217033386230469, "global_step": 47126, "epoch": 280} {"train_loss": -8.431268692016602, "global_step": 47127, "epoch": 280} {"train_loss": -8.241862297058105, "global_step": 47128, "epoch": 280} {"train_loss": -8.218347549438477, "global_step": 47129, "epoch": 280} {"train_loss": -8.126497268676758, "global_step": 47130, "epoch": 280} {"train_loss": -8.370312690734863, "global_step": 47131, "epoch": 280} {"train_loss": -7.954610347747803, "global_step": 47132, "epoch": 280} {"train_loss": -8.102102279663086, "global_step": 47133, "epoch": 280} {"train_loss": -8.247957229614258, "global_step": 47134, "epoch": 280} {"train_loss": -8.24004077911377, "global_step": 47135, "epoch": 280} {"train_loss": -8.099203109741211, "global_step": 47136, "epoch": 280} {"train_loss": -8.402785301208496, "global_step": 47137, "epoch": 280} {"train_loss": -8.235119819641113, "global_step": 47138, "epoch": 280} {"train_loss": -8.376869201660156, "global_step": 47139, "epoch": 280} {"train_loss": -8.42411994934082, "global_step": 47140, "epoch": 280} {"train_loss": -8.412679672241211, "global_step": 47141, "epoch": 280} {"train_loss": -8.264799118041992, "global_step": 47142, "epoch": 280} {"train_loss": -8.353407859802246, "global_step": 47143, "epoch": 280} {"train_loss": -8.455044746398926, "global_step": 47144, "epoch": 280} {"train_loss": -8.260751724243164, "global_step": 47145, "epoch": 280} {"train_loss": -8.221903800964355, "global_step": 47146, "epoch": 280} {"train_loss": -8.335918426513672, "global_step": 47147, "epoch": 280} {"train_loss": -8.279459953308105, "global_step": 47148, "epoch": 280} {"train_loss": -8.299459457397461, "global_step": 47149, "epoch": 280} {"train_loss": -8.335382461547852, "global_step": 47150, "epoch": 280} {"train_loss": -8.230679512023926, "global_step": 47151, "epoch": 280} {"train_loss": -8.397671699523926, "global_step": 47152, "epoch": 280} {"train_loss": -8.230361938476562, "global_step": 47153, "epoch": 280} {"train_loss": -8.320805549621582, "global_step": 47154, "epoch": 280} {"train_loss": -8.38322639465332, "global_step": 47155, "epoch": 280} {"train_loss": -8.219849586486816, "global_step": 47156, "epoch": 280} {"train_loss": -8.217611312866211, "global_step": 47157, "epoch": 280} {"train_loss": -8.235371589660645, "global_step": 47158, "epoch": 280} {"train_loss": -8.18836784362793, "global_step": 47159, "epoch": 280} {"train_loss": -8.268169403076172, "global_step": 47160, "epoch": 280} {"train_loss": -8.328656196594238, "global_step": 47161, "epoch": 280} {"train_loss": -8.21124267578125, "global_step": 47162, "epoch": 280} {"train_loss": -8.235666275024414, "global_step": 47163, "epoch": 280} {"train_loss": -8.424306869506836, "global_step": 47164, "epoch": 280} {"train_loss": -8.192048072814941, "global_step": 47165, "epoch": 280} {"train_loss": -8.366158485412598, "global_step": 47166, "epoch": 280} {"train_loss": -8.133272171020508, "global_step": 47167, "epoch": 280} {"train_loss": -8.3589448928833, "global_step": 47168, "epoch": 280} {"train_loss": -8.239004135131836, "global_step": 47169, "epoch": 280} {"train_loss": -8.350198745727539, "global_step": 47170, "epoch": 280} {"train_loss": -7.855180740356445, "global_step": 47171, "epoch": 280} {"train_loss": -8.307306289672852, "global_step": 47172, "epoch": 280} {"train_loss": -8.147929191589355, "global_step": 47173, "epoch": 280} {"train_loss": -8.159036636352539, "global_step": 47174, "epoch": 280} {"train_loss": -8.24322509765625, "global_step": 47175, "epoch": 280} {"train_loss": -8.299910545349121, "global_step": 47176, "epoch": 280} {"train_loss": -8.056989669799805, "global_step": 47177, "epoch": 280} {"train_loss": -8.206064224243164, "global_step": 47178, "epoch": 280} {"train_loss": -7.918783187866211, "global_step": 47179, "epoch": 280} {"train_loss": -8.143251419067383, "global_step": 47180, "epoch": 280} {"train_loss": -8.117889404296875, "global_step": 47181, "epoch": 280} {"train_loss": -8.052507400512695, "global_step": 47182, "epoch": 280} {"train_loss": -8.160710334777832, "global_step": 47183, "epoch": 280} {"train_loss": -8.11518383026123, "global_step": 47184, "epoch": 280} {"train_loss": -8.025890350341797, "global_step": 47185, "epoch": 280} {"train_loss": -8.209512710571289, "global_step": 47186, "epoch": 280} {"train_loss": -8.100997924804688, "global_step": 47187, "epoch": 280} {"train_loss": -7.891072750091553, "global_step": 47188, "epoch": 280} {"train_loss": -8.181480407714844, "global_step": 47189, "epoch": 280} {"train_loss": -8.289094924926758, "global_step": 47190, "epoch": 280} {"train_loss": -8.326963424682617, "global_step": 47191, "epoch": 280} {"train_loss": -8.05510139465332, "global_step": 47192, "epoch": 280} {"train_loss": -8.381787300109863, "global_step": 47193, "epoch": 280} {"train_loss": -8.241933822631836, "global_step": 47194, "epoch": 280} {"train_loss": -8.316631317138672, "global_step": 47195, "epoch": 280} {"train_loss": -8.237119674682617, "global_step": 47196, "epoch": 280} {"train_loss": -8.26728630065918, "global_step": 47197, "epoch": 280} {"train_loss": -8.441486358642578, "global_step": 47198, "epoch": 280} {"train_loss": -8.310808181762695, "global_step": 47199, "epoch": 280} {"train_loss": -8.303018569946289, "global_step": 47200, "epoch": 280} {"train_loss": -8.353738784790039, "global_step": 47201, "epoch": 280} {"train_loss": -8.303375244140625, "global_step": 47202, "epoch": 280} {"train_loss": -7.86894416809082, "global_step": 47203, "epoch": 280} {"train_loss": -8.262374877929688, "global_step": 47204, "epoch": 280} {"train_loss": -8.08365535736084, "global_step": 47205, "epoch": 280} {"train_loss": -8.039385795593262, "global_step": 47206, "epoch": 280} {"train_loss": -8.20680754525321, "global_step": 47207, "epoch": 280, "val_loss": 186219.5, "train_action_mse_error": 13.127471923828125} {"train_loss": -8.210259437561035, "global_step": 47208, "epoch": 281} {"train_loss": -8.221856117248535, "global_step": 47209, "epoch": 281} {"train_loss": -7.860095500946045, "global_step": 47210, "epoch": 281} {"train_loss": -7.879430294036865, "global_step": 47211, "epoch": 281} {"train_loss": -8.028060913085938, "global_step": 47212, "epoch": 281} {"train_loss": -7.957088470458984, "global_step": 47213, "epoch": 281} {"train_loss": -8.28000259399414, "global_step": 47214, "epoch": 281} {"train_loss": -7.764167785644531, "global_step": 47215, "epoch": 281} {"train_loss": -8.060783386230469, "global_step": 47216, "epoch": 281} {"train_loss": -8.056853294372559, "global_step": 47217, "epoch": 281} {"train_loss": -8.035143852233887, "global_step": 47218, "epoch": 281} {"train_loss": -8.073843002319336, "global_step": 47219, "epoch": 281} {"train_loss": -8.024066925048828, "global_step": 47220, "epoch": 281} {"train_loss": -8.097902297973633, "global_step": 47221, "epoch": 281} {"train_loss": -7.942106246948242, "global_step": 47222, "epoch": 281} {"train_loss": -7.887714862823486, "global_step": 47223, "epoch": 281} {"train_loss": -8.117460250854492, "global_step": 47224, "epoch": 281} {"train_loss": -8.169641494750977, "global_step": 47225, "epoch": 281} {"train_loss": -7.972219467163086, "global_step": 47226, "epoch": 281} {"train_loss": -8.116107940673828, "global_step": 47227, "epoch": 281} {"train_loss": -8.165003776550293, "global_step": 47228, "epoch": 281} {"train_loss": -8.28305435180664, "global_step": 47229, "epoch": 281} {"train_loss": -8.162038803100586, "global_step": 47230, "epoch": 281} {"train_loss": -8.339910507202148, "global_step": 47231, "epoch": 281} {"train_loss": -8.087761878967285, "global_step": 47232, "epoch": 281} {"train_loss": -8.25369930267334, "global_step": 47233, "epoch": 281} {"train_loss": -8.165732383728027, "global_step": 47234, "epoch": 281} {"train_loss": -8.338468551635742, "global_step": 47235, "epoch": 281} {"train_loss": -8.41700553894043, "global_step": 47236, "epoch": 281} {"train_loss": -8.337008476257324, "global_step": 47237, "epoch": 281} {"train_loss": -8.26487922668457, "global_step": 47238, "epoch": 281} {"train_loss": -8.224498748779297, "global_step": 47239, "epoch": 281} {"train_loss": -8.258888244628906, "global_step": 47240, "epoch": 281} {"train_loss": -8.10022258758545, "global_step": 47241, "epoch": 281} {"train_loss": -8.444316864013672, "global_step": 47242, "epoch": 281} {"train_loss": -8.289037704467773, "global_step": 47243, "epoch": 281} {"train_loss": -8.40121078491211, "global_step": 47244, "epoch": 281} {"train_loss": -8.51831340789795, "global_step": 47245, "epoch": 281} {"train_loss": -8.248274803161621, "global_step": 47246, "epoch": 281} {"train_loss": -8.484333038330078, "global_step": 47247, "epoch": 281} {"train_loss": -8.432868957519531, "global_step": 47248, "epoch": 281} {"train_loss": -8.327500343322754, "global_step": 47249, "epoch": 281} {"train_loss": -8.351156234741211, "global_step": 47250, "epoch": 281} {"train_loss": -8.336295127868652, "global_step": 47251, "epoch": 281} {"train_loss": -8.326375961303711, "global_step": 47252, "epoch": 281} {"train_loss": -8.398372650146484, "global_step": 47253, "epoch": 281} {"train_loss": -8.094768524169922, "global_step": 47254, "epoch": 281} {"train_loss": -8.271862030029297, "global_step": 47255, "epoch": 281} {"train_loss": -8.379491806030273, "global_step": 47256, "epoch": 281} {"train_loss": -8.240579605102539, "global_step": 47257, "epoch": 281} {"train_loss": -8.114246368408203, "global_step": 47258, "epoch": 281} {"train_loss": -8.483734130859375, "global_step": 47259, "epoch": 281} {"train_loss": -8.17038631439209, "global_step": 47260, "epoch": 281} {"train_loss": -8.333963394165039, "global_step": 47261, "epoch": 281} {"train_loss": -8.172430992126465, "global_step": 47262, "epoch": 281} {"train_loss": -8.35190200805664, "global_step": 47263, "epoch": 281} {"train_loss": -8.168395042419434, "global_step": 47264, "epoch": 281} {"train_loss": -8.257266998291016, "global_step": 47265, "epoch": 281} {"train_loss": -7.968965530395508, "global_step": 47266, "epoch": 281} {"train_loss": -8.026142120361328, "global_step": 47267, "epoch": 281} {"train_loss": -7.994832515716553, "global_step": 47268, "epoch": 281} {"train_loss": -8.083270072937012, "global_step": 47269, "epoch": 281} {"train_loss": -8.018253326416016, "global_step": 47270, "epoch": 281} {"train_loss": -8.304353713989258, "global_step": 47271, "epoch": 281} {"train_loss": -8.075037002563477, "global_step": 47272, "epoch": 281} {"train_loss": -8.035466194152832, "global_step": 47273, "epoch": 281} {"train_loss": -8.21548080444336, "global_step": 47274, "epoch": 281} {"train_loss": -8.328531265258789, "global_step": 47275, "epoch": 281} {"train_loss": -8.025415420532227, "global_step": 47276, "epoch": 281} {"train_loss": -8.17223072052002, "global_step": 47277, "epoch": 281} {"train_loss": -7.87685489654541, "global_step": 47278, "epoch": 281} {"train_loss": -7.925691604614258, "global_step": 47279, "epoch": 281} {"train_loss": -7.969663619995117, "global_step": 47280, "epoch": 281} {"train_loss": -8.324296951293945, "global_step": 47281, "epoch": 281} {"train_loss": -7.951091766357422, "global_step": 47282, "epoch": 281} {"train_loss": -8.253308296203613, "global_step": 47283, "epoch": 281} {"train_loss": -7.920286178588867, "global_step": 47284, "epoch": 281} {"train_loss": -8.120644569396973, "global_step": 47285, "epoch": 281} {"train_loss": -7.887402534484863, "global_step": 47286, "epoch": 281} {"train_loss": -8.267181396484375, "global_step": 47287, "epoch": 281} {"train_loss": -8.079668045043945, "global_step": 47288, "epoch": 281} {"train_loss": -7.976164817810059, "global_step": 47289, "epoch": 281} {"train_loss": -8.154147148132324, "global_step": 47290, "epoch": 281} {"train_loss": -7.910305976867676, "global_step": 47291, "epoch": 281} {"train_loss": -8.155447006225586, "global_step": 47292, "epoch": 281} {"train_loss": -8.05596923828125, "global_step": 47293, "epoch": 281} {"train_loss": -8.100798606872559, "global_step": 47294, "epoch": 281} {"train_loss": -7.8152594566345215, "global_step": 47295, "epoch": 281} {"train_loss": -8.055562973022461, "global_step": 47296, "epoch": 281} {"train_loss": -8.128244400024414, "global_step": 47297, "epoch": 281} {"train_loss": -7.850374698638916, "global_step": 47298, "epoch": 281} {"train_loss": -8.189397811889648, "global_step": 47299, "epoch": 281} {"train_loss": -8.081535339355469, "global_step": 47300, "epoch": 281} {"train_loss": -8.224584579467773, "global_step": 47301, "epoch": 281} {"train_loss": -7.967611789703369, "global_step": 47302, "epoch": 281} {"train_loss": -7.914833068847656, "global_step": 47303, "epoch": 281} {"train_loss": -8.322334289550781, "global_step": 47304, "epoch": 281} {"train_loss": -8.264887809753418, "global_step": 47305, "epoch": 281} {"train_loss": -7.998655319213867, "global_step": 47306, "epoch": 281} {"train_loss": -8.069257736206055, "global_step": 47307, "epoch": 281} {"train_loss": -8.110239028930664, "global_step": 47308, "epoch": 281} {"train_loss": -8.075494766235352, "global_step": 47309, "epoch": 281} {"train_loss": -8.213732719421387, "global_step": 47310, "epoch": 281} {"train_loss": -8.100860595703125, "global_step": 47311, "epoch": 281} {"train_loss": -8.095985412597656, "global_step": 47312, "epoch": 281} {"train_loss": -8.248995780944824, "global_step": 47313, "epoch": 281} {"train_loss": -8.29218864440918, "global_step": 47314, "epoch": 281} {"train_loss": -8.104798316955566, "global_step": 47315, "epoch": 281} {"train_loss": -8.427671432495117, "global_step": 47316, "epoch": 281} {"train_loss": -8.368928909301758, "global_step": 47317, "epoch": 281} {"train_loss": -8.35913372039795, "global_step": 47318, "epoch": 281} {"train_loss": -8.141693115234375, "global_step": 47319, "epoch": 281} {"train_loss": -8.212982177734375, "global_step": 47320, "epoch": 281} {"train_loss": -8.245040893554688, "global_step": 47321, "epoch": 281} {"train_loss": -8.130823135375977, "global_step": 47322, "epoch": 281} {"train_loss": -7.826972007751465, "global_step": 47323, "epoch": 281} {"train_loss": -8.488439559936523, "global_step": 47324, "epoch": 281} {"train_loss": -8.214029312133789, "global_step": 47325, "epoch": 281} {"train_loss": -8.09564208984375, "global_step": 47326, "epoch": 281} {"train_loss": -8.168033599853516, "global_step": 47327, "epoch": 281} {"train_loss": -7.789857864379883, "global_step": 47328, "epoch": 281} {"train_loss": -8.140545845031738, "global_step": 47329, "epoch": 281} {"train_loss": -8.123404502868652, "global_step": 47330, "epoch": 281} {"train_loss": -8.247915267944336, "global_step": 47331, "epoch": 281} {"train_loss": -7.825002193450928, "global_step": 47332, "epoch": 281} {"train_loss": -8.014898300170898, "global_step": 47333, "epoch": 281} {"train_loss": -7.998042583465576, "global_step": 47334, "epoch": 281} {"train_loss": -7.944702625274658, "global_step": 47335, "epoch": 281} {"train_loss": -8.1832275390625, "global_step": 47336, "epoch": 281} {"train_loss": -7.888030052185059, "global_step": 47337, "epoch": 281} {"train_loss": -7.8149285316467285, "global_step": 47338, "epoch": 281} {"train_loss": -7.887140274047852, "global_step": 47339, "epoch": 281} {"train_loss": -8.094402313232422, "global_step": 47340, "epoch": 281} {"train_loss": -8.136667251586914, "global_step": 47341, "epoch": 281} {"train_loss": -8.195561408996582, "global_step": 47342, "epoch": 281} {"train_loss": -8.0294771194458, "global_step": 47343, "epoch": 281} {"train_loss": -7.863123416900635, "global_step": 47344, "epoch": 281} {"train_loss": -8.159208297729492, "global_step": 47345, "epoch": 281} {"train_loss": -8.068460464477539, "global_step": 47346, "epoch": 281} {"train_loss": -8.245564460754395, "global_step": 47347, "epoch": 281} {"train_loss": -8.198104858398438, "global_step": 47348, "epoch": 281} {"train_loss": -8.445396423339844, "global_step": 47349, "epoch": 281} {"train_loss": -8.147533416748047, "global_step": 47350, "epoch": 281} {"train_loss": -7.97474479675293, "global_step": 47351, "epoch": 281} {"train_loss": -8.149859428405762, "global_step": 47352, "epoch": 281} {"train_loss": -8.384239196777344, "global_step": 47353, "epoch": 281} {"train_loss": -8.086566925048828, "global_step": 47354, "epoch": 281} {"train_loss": -8.048770904541016, "global_step": 47355, "epoch": 281} {"train_loss": -8.346294403076172, "global_step": 47356, "epoch": 281} {"train_loss": -7.995014190673828, "global_step": 47357, "epoch": 281} {"train_loss": -8.204113960266113, "global_step": 47358, "epoch": 281} {"train_loss": -8.221662521362305, "global_step": 47359, "epoch": 281} {"train_loss": -8.346766471862793, "global_step": 47360, "epoch": 281} {"train_loss": -8.17575454711914, "global_step": 47361, "epoch": 281} {"train_loss": -8.342374801635742, "global_step": 47362, "epoch": 281} {"train_loss": -8.348579406738281, "global_step": 47363, "epoch": 281} {"train_loss": -8.149456977844238, "global_step": 47364, "epoch": 281} {"train_loss": -8.421242713928223, "global_step": 47365, "epoch": 281} {"train_loss": -8.326225280761719, "global_step": 47366, "epoch": 281} {"train_loss": -8.126431465148926, "global_step": 47367, "epoch": 281} {"train_loss": -8.46904468536377, "global_step": 47368, "epoch": 281} {"train_loss": -8.374226570129395, "global_step": 47369, "epoch": 281} {"train_loss": -8.306476593017578, "global_step": 47370, "epoch": 281} {"train_loss": -8.247892379760742, "global_step": 47371, "epoch": 281} {"train_loss": -8.149181365966797, "global_step": 47372, "epoch": 281} {"train_loss": -8.262462615966797, "global_step": 47373, "epoch": 281} {"train_loss": -8.318683624267578, "global_step": 47374, "epoch": 281} {"train_loss": -8.157900168782188, "global_step": 47375, "epoch": 281, "val_loss": 186952.78125} {"train_loss": -8.268922805786133, "global_step": 47376, "epoch": 282} {"train_loss": -8.354534149169922, "global_step": 47377, "epoch": 282} {"train_loss": -8.475534439086914, "global_step": 47378, "epoch": 282} {"train_loss": -8.53771686553955, "global_step": 47379, "epoch": 282} {"train_loss": -8.346628189086914, "global_step": 47380, "epoch": 282} {"train_loss": -8.198602676391602, "global_step": 47381, "epoch": 282} {"train_loss": -8.228706359863281, "global_step": 47382, "epoch": 282} {"train_loss": -8.381665229797363, "global_step": 47383, "epoch": 282} {"train_loss": -8.43947982788086, "global_step": 47384, "epoch": 282} {"train_loss": -8.321637153625488, "global_step": 47385, "epoch": 282} {"train_loss": -8.391707420349121, "global_step": 47386, "epoch": 282} {"train_loss": -8.313870429992676, "global_step": 47387, "epoch": 282} {"train_loss": -8.416712760925293, "global_step": 47388, "epoch": 282} {"train_loss": -8.441959381103516, "global_step": 47389, "epoch": 282} {"train_loss": -8.128705024719238, "global_step": 47390, "epoch": 282} {"train_loss": -7.795686721801758, "global_step": 47391, "epoch": 282} {"train_loss": -8.410015106201172, "global_step": 47392, "epoch": 282} {"train_loss": -8.334943771362305, "global_step": 47393, "epoch": 282} {"train_loss": -8.116477012634277, "global_step": 47394, "epoch": 282} {"train_loss": -8.290811538696289, "global_step": 47395, "epoch": 282} {"train_loss": -8.283163070678711, "global_step": 47396, "epoch": 282} {"train_loss": -8.158053398132324, "global_step": 47397, "epoch": 282} {"train_loss": -8.242863655090332, "global_step": 47398, "epoch": 282} {"train_loss": -8.338164329528809, "global_step": 47399, "epoch": 282} {"train_loss": -8.092144012451172, "global_step": 47400, "epoch": 282} {"train_loss": -8.320465087890625, "global_step": 47401, "epoch": 282} {"train_loss": -8.235708236694336, "global_step": 47402, "epoch": 282} {"train_loss": -8.184515953063965, "global_step": 47403, "epoch": 282} {"train_loss": -8.136675834655762, "global_step": 47404, "epoch": 282} {"train_loss": -8.172085762023926, "global_step": 47405, "epoch": 282} {"train_loss": -8.339839935302734, "global_step": 47406, "epoch": 282} {"train_loss": -8.328310012817383, "global_step": 47407, "epoch": 282} {"train_loss": -8.240850448608398, "global_step": 47408, "epoch": 282} {"train_loss": -8.003643035888672, "global_step": 47409, "epoch": 282} {"train_loss": -8.146896362304688, "global_step": 47410, "epoch": 282} {"train_loss": -8.208817481994629, "global_step": 47411, "epoch": 282} {"train_loss": -8.193814277648926, "global_step": 47412, "epoch": 282} {"train_loss": -8.227166175842285, "global_step": 47413, "epoch": 282} {"train_loss": -8.10777473449707, "global_step": 47414, "epoch": 282} {"train_loss": -8.00763988494873, "global_step": 47415, "epoch": 282} {"train_loss": -8.29171371459961, "global_step": 47416, "epoch": 282} {"train_loss": -8.233146667480469, "global_step": 47417, "epoch": 282} {"train_loss": -8.189382553100586, "global_step": 47418, "epoch": 282} {"train_loss": -7.980036735534668, "global_step": 47419, "epoch": 282} {"train_loss": -8.287595748901367, "global_step": 47420, "epoch": 282} {"train_loss": -8.375102996826172, "global_step": 47421, "epoch": 282} {"train_loss": -8.327923774719238, "global_step": 47422, "epoch": 282} {"train_loss": -8.27195930480957, "global_step": 47423, "epoch": 282} {"train_loss": -8.438889503479004, "global_step": 47424, "epoch": 282} {"train_loss": -8.13228988647461, "global_step": 47425, "epoch": 282} {"train_loss": -8.207653045654297, "global_step": 47426, "epoch": 282} {"train_loss": -8.40206527709961, "global_step": 47427, "epoch": 282} {"train_loss": -8.102932929992676, "global_step": 47428, "epoch": 282} {"train_loss": -8.016622543334961, "global_step": 47429, "epoch": 282} {"train_loss": -8.044862747192383, "global_step": 47430, "epoch": 282} {"train_loss": -8.095319747924805, "global_step": 47431, "epoch": 282} {"train_loss": -8.217451095581055, "global_step": 47432, "epoch": 282} {"train_loss": -8.532175064086914, "global_step": 47433, "epoch": 282} {"train_loss": -7.780302047729492, "global_step": 47434, "epoch": 282} {"train_loss": -8.291509628295898, "global_step": 47435, "epoch": 282} {"train_loss": -8.001386642456055, "global_step": 47436, "epoch": 282} {"train_loss": -8.036935806274414, "global_step": 47437, "epoch": 282} {"train_loss": -8.223541259765625, "global_step": 47438, "epoch": 282} {"train_loss": -8.07002067565918, "global_step": 47439, "epoch": 282} {"train_loss": -8.241609573364258, "global_step": 47440, "epoch": 282} {"train_loss": -7.972754001617432, "global_step": 47441, "epoch": 282} {"train_loss": -8.124727249145508, "global_step": 47442, "epoch": 282} {"train_loss": -8.206684112548828, "global_step": 47443, "epoch": 282} {"train_loss": -8.227334022521973, "global_step": 47444, "epoch": 282} {"train_loss": -8.158018112182617, "global_step": 47445, "epoch": 282} {"train_loss": -8.121862411499023, "global_step": 47446, "epoch": 282} {"train_loss": -8.314729690551758, "global_step": 47447, "epoch": 282} {"train_loss": -8.095355987548828, "global_step": 47448, "epoch": 282} {"train_loss": -7.984315872192383, "global_step": 47449, "epoch": 282} {"train_loss": -8.383790969848633, "global_step": 47450, "epoch": 282} {"train_loss": -8.259176254272461, "global_step": 47451, "epoch": 282} {"train_loss": -8.391059875488281, "global_step": 47452, "epoch": 282} {"train_loss": -8.377342224121094, "global_step": 47453, "epoch": 282} {"train_loss": -8.40642261505127, "global_step": 47454, "epoch": 282} {"train_loss": -8.248098373413086, "global_step": 47455, "epoch": 282} {"train_loss": -8.448773384094238, "global_step": 47456, "epoch": 282} {"train_loss": -8.386383056640625, "global_step": 47457, "epoch": 282} {"train_loss": -8.346004486083984, "global_step": 47458, "epoch": 282} {"train_loss": -8.148195266723633, "global_step": 47459, "epoch": 282} {"train_loss": -8.20294189453125, "global_step": 47460, "epoch": 282} {"train_loss": -8.167688369750977, "global_step": 47461, "epoch": 282} {"train_loss": -8.164040565490723, "global_step": 47462, "epoch": 282} {"train_loss": -8.286152839660645, "global_step": 47463, "epoch": 282} {"train_loss": -8.402390480041504, "global_step": 47464, "epoch": 282} {"train_loss": -8.296061515808105, "global_step": 47465, "epoch": 282} {"train_loss": -8.347615242004395, "global_step": 47466, "epoch": 282} {"train_loss": -8.229731559753418, "global_step": 47467, "epoch": 282} {"train_loss": -8.144608497619629, "global_step": 47468, "epoch": 282} {"train_loss": -8.294576644897461, "global_step": 47469, "epoch": 282} {"train_loss": -8.194172859191895, "global_step": 47470, "epoch": 282} {"train_loss": -8.496170997619629, "global_step": 47471, "epoch": 282} {"train_loss": -7.835443019866943, "global_step": 47472, "epoch": 282} {"train_loss": -8.342266082763672, "global_step": 47473, "epoch": 282} {"train_loss": -8.111570358276367, "global_step": 47474, "epoch": 282} {"train_loss": -8.339076042175293, "global_step": 47475, "epoch": 282} {"train_loss": -8.191030502319336, "global_step": 47476, "epoch": 282} {"train_loss": -8.264091491699219, "global_step": 47477, "epoch": 282} {"train_loss": -7.854866981506348, "global_step": 47478, "epoch": 282} {"train_loss": -8.444541931152344, "global_step": 47479, "epoch": 282} {"train_loss": -8.025418281555176, "global_step": 47480, "epoch": 282} {"train_loss": -8.238104820251465, "global_step": 47481, "epoch": 282} {"train_loss": -8.065086364746094, "global_step": 47482, "epoch": 282} {"train_loss": -8.21273422241211, "global_step": 47483, "epoch": 282} {"train_loss": -8.123884201049805, "global_step": 47484, "epoch": 282} {"train_loss": -8.373969078063965, "global_step": 47485, "epoch": 282} {"train_loss": -7.964720726013184, "global_step": 47486, "epoch": 282} {"train_loss": -8.09622573852539, "global_step": 47487, "epoch": 282} {"train_loss": -8.250279426574707, "global_step": 47488, "epoch": 282} {"train_loss": -8.163179397583008, "global_step": 47489, "epoch": 282} {"train_loss": -8.047235488891602, "global_step": 47490, "epoch": 282} {"train_loss": -8.2135009765625, "global_step": 47491, "epoch": 282} {"train_loss": -8.023268699645996, "global_step": 47492, "epoch": 282} {"train_loss": -8.126058578491211, "global_step": 47493, "epoch": 282} {"train_loss": -8.408946990966797, "global_step": 47494, "epoch": 282} {"train_loss": -8.061573028564453, "global_step": 47495, "epoch": 282} {"train_loss": -8.031017303466797, "global_step": 47496, "epoch": 282} {"train_loss": -8.26624584197998, "global_step": 47497, "epoch": 282} {"train_loss": -8.219259262084961, "global_step": 47498, "epoch": 282} {"train_loss": -8.249212265014648, "global_step": 47499, "epoch": 282} {"train_loss": -8.01272201538086, "global_step": 47500, "epoch": 282} {"train_loss": -8.127163887023926, "global_step": 47501, "epoch": 282} {"train_loss": -8.01552963256836, "global_step": 47502, "epoch": 282} {"train_loss": -8.176968574523926, "global_step": 47503, "epoch": 282} {"train_loss": -8.242650985717773, "global_step": 47504, "epoch": 282} {"train_loss": -8.373846054077148, "global_step": 47505, "epoch": 282} {"train_loss": -7.954216957092285, "global_step": 47506, "epoch": 282} {"train_loss": -8.106658935546875, "global_step": 47507, "epoch": 282} {"train_loss": -7.9509782791137695, "global_step": 47508, "epoch": 282} {"train_loss": -7.929349422454834, "global_step": 47509, "epoch": 282} {"train_loss": -8.037701606750488, "global_step": 47510, "epoch": 282} {"train_loss": -7.804908752441406, "global_step": 47511, "epoch": 282} {"train_loss": -7.810312271118164, "global_step": 47512, "epoch": 282} {"train_loss": -7.893109321594238, "global_step": 47513, "epoch": 282} {"train_loss": -7.74383020401001, "global_step": 47514, "epoch": 282} {"train_loss": -8.034038543701172, "global_step": 47515, "epoch": 282} {"train_loss": -8.151845932006836, "global_step": 47516, "epoch": 282} {"train_loss": -7.96272087097168, "global_step": 47517, "epoch": 282} {"train_loss": -8.110502243041992, "global_step": 47518, "epoch": 282} {"train_loss": -8.165377616882324, "global_step": 47519, "epoch": 282} {"train_loss": -8.012650489807129, "global_step": 47520, "epoch": 282} {"train_loss": -8.111119270324707, "global_step": 47521, "epoch": 282} {"train_loss": -8.101729393005371, "global_step": 47522, "epoch": 282} {"train_loss": -8.126592636108398, "global_step": 47523, "epoch": 282} {"train_loss": -8.215667724609375, "global_step": 47524, "epoch": 282} {"train_loss": -8.134039878845215, "global_step": 47525, "epoch": 282} {"train_loss": -8.100497245788574, "global_step": 47526, "epoch": 282} {"train_loss": -8.197659492492676, "global_step": 47527, "epoch": 282} {"train_loss": -8.379408836364746, "global_step": 47528, "epoch": 282} {"train_loss": -8.183835983276367, "global_step": 47529, "epoch": 282} {"train_loss": -8.180770874023438, "global_step": 47530, "epoch": 282} {"train_loss": -8.19514274597168, "global_step": 47531, "epoch": 282} {"train_loss": -8.350019454956055, "global_step": 47532, "epoch": 282} {"train_loss": -8.153619766235352, "global_step": 47533, "epoch": 282} {"train_loss": -8.244706153869629, "global_step": 47534, "epoch": 282} {"train_loss": -8.351107597351074, "global_step": 47535, "epoch": 282} {"train_loss": -8.104665756225586, "global_step": 47536, "epoch": 282} {"train_loss": -8.36152458190918, "global_step": 47537, "epoch": 282} {"train_loss": -8.354142189025879, "global_step": 47538, "epoch": 282} {"train_loss": -8.277273178100586, "global_step": 47539, "epoch": 282} {"train_loss": -8.236915588378906, "global_step": 47540, "epoch": 282} {"train_loss": -8.324464797973633, "global_step": 47541, "epoch": 282} {"train_loss": -7.979012489318848, "global_step": 47542, "epoch": 282} {"train_loss": -8.196389760289874, "global_step": 47543, "epoch": 282, "val_loss": 189557.703125} {"train_loss": -8.050012588500977, "global_step": 47544, "epoch": 283} {"train_loss": -7.923040390014648, "global_step": 47545, "epoch": 283} {"train_loss": -8.287358283996582, "global_step": 47546, "epoch": 283} {"train_loss": -7.898815155029297, "global_step": 47547, "epoch": 283} {"train_loss": -8.051741600036621, "global_step": 47548, "epoch": 283} {"train_loss": -7.9998955726623535, "global_step": 47549, "epoch": 283} {"train_loss": -8.18083667755127, "global_step": 47550, "epoch": 283} {"train_loss": -7.788822174072266, "global_step": 47551, "epoch": 283} {"train_loss": -8.02652645111084, "global_step": 47552, "epoch": 283} {"train_loss": -7.997519016265869, "global_step": 47553, "epoch": 283} {"train_loss": -8.124824523925781, "global_step": 47554, "epoch": 283} {"train_loss": -7.8306708335876465, "global_step": 47555, "epoch": 283} {"train_loss": -8.084399223327637, "global_step": 47556, "epoch": 283} {"train_loss": -8.243146896362305, "global_step": 47557, "epoch": 283} {"train_loss": -8.005728721618652, "global_step": 47558, "epoch": 283} {"train_loss": -8.332380294799805, "global_step": 47559, "epoch": 283} {"train_loss": -8.293310165405273, "global_step": 47560, "epoch": 283} {"train_loss": -8.193944931030273, "global_step": 47561, "epoch": 283} {"train_loss": -8.047183990478516, "global_step": 47562, "epoch": 283} {"train_loss": -8.242801666259766, "global_step": 47563, "epoch": 283} {"train_loss": -8.001042366027832, "global_step": 47564, "epoch": 283} {"train_loss": -7.950332164764404, "global_step": 47565, "epoch": 283} {"train_loss": -8.190199851989746, "global_step": 47566, "epoch": 283} {"train_loss": -7.961633682250977, "global_step": 47567, "epoch": 283} {"train_loss": -8.284491539001465, "global_step": 47568, "epoch": 283} {"train_loss": -8.160621643066406, "global_step": 47569, "epoch": 283} {"train_loss": -8.119539260864258, "global_step": 47570, "epoch": 283} {"train_loss": -8.20969009399414, "global_step": 47571, "epoch": 283} {"train_loss": -8.308090209960938, "global_step": 47572, "epoch": 283} {"train_loss": -8.20167064666748, "global_step": 47573, "epoch": 283} {"train_loss": -8.170513153076172, "global_step": 47574, "epoch": 283} {"train_loss": -8.199945449829102, "global_step": 47575, "epoch": 283} {"train_loss": -8.25289535522461, "global_step": 47576, "epoch": 283} {"train_loss": -8.31063461303711, "global_step": 47577, "epoch": 283} {"train_loss": -8.404607772827148, "global_step": 47578, "epoch": 283} {"train_loss": -8.187512397766113, "global_step": 47579, "epoch": 283} {"train_loss": -8.355857849121094, "global_step": 47580, "epoch": 283} {"train_loss": -8.133028030395508, "global_step": 47581, "epoch": 283} {"train_loss": -8.599365234375, "global_step": 47582, "epoch": 283} {"train_loss": -8.277289390563965, "global_step": 47583, "epoch": 283} {"train_loss": -8.145342826843262, "global_step": 47584, "epoch": 283} {"train_loss": -8.422673225402832, "global_step": 47585, "epoch": 283} {"train_loss": -8.080215454101562, "global_step": 47586, "epoch": 283} {"train_loss": -8.246190071105957, "global_step": 47587, "epoch": 283} {"train_loss": -8.36107063293457, "global_step": 47588, "epoch": 283} {"train_loss": -8.33328628540039, "global_step": 47589, "epoch": 283} {"train_loss": -8.106773376464844, "global_step": 47590, "epoch": 283} {"train_loss": -7.990202903747559, "global_step": 47591, "epoch": 283} {"train_loss": -8.369858741760254, "global_step": 47592, "epoch": 283} {"train_loss": -8.1961088180542, "global_step": 47593, "epoch": 283} {"train_loss": -8.342308044433594, "global_step": 47594, "epoch": 283} {"train_loss": -8.276185989379883, "global_step": 47595, "epoch": 283} {"train_loss": -8.295007705688477, "global_step": 47596, "epoch": 283} {"train_loss": -7.853196620941162, "global_step": 47597, "epoch": 283} {"train_loss": -8.177236557006836, "global_step": 47598, "epoch": 283} {"train_loss": -7.7713847160339355, "global_step": 47599, "epoch": 283} {"train_loss": -8.088926315307617, "global_step": 47600, "epoch": 283} {"train_loss": -7.410887718200684, "global_step": 47601, "epoch": 283} {"train_loss": -7.928625106811523, "global_step": 47602, "epoch": 283} {"train_loss": -7.762721061706543, "global_step": 47603, "epoch": 283} {"train_loss": -8.062355995178223, "global_step": 47604, "epoch": 283} {"train_loss": -7.8045125007629395, "global_step": 47605, "epoch": 283} {"train_loss": -8.061121940612793, "global_step": 47606, "epoch": 283} {"train_loss": -8.036700248718262, "global_step": 47607, "epoch": 283} {"train_loss": -7.692586898803711, "global_step": 47608, "epoch": 283} {"train_loss": -8.297151565551758, "global_step": 47609, "epoch": 283} {"train_loss": -7.724992275238037, "global_step": 47610, "epoch": 283} {"train_loss": -8.164380073547363, "global_step": 47611, "epoch": 283} {"train_loss": -8.02052116394043, "global_step": 47612, "epoch": 283} {"train_loss": -8.168547630310059, "global_step": 47613, "epoch": 283} {"train_loss": -7.951765537261963, "global_step": 47614, "epoch": 283} {"train_loss": -7.853846549987793, "global_step": 47615, "epoch": 283} {"train_loss": -8.15080451965332, "global_step": 47616, "epoch": 283} {"train_loss": -8.056661605834961, "global_step": 47617, "epoch": 283} {"train_loss": -7.911802768707275, "global_step": 47618, "epoch": 283} {"train_loss": -8.26613998413086, "global_step": 47619, "epoch": 283} {"train_loss": -8.063364028930664, "global_step": 47620, "epoch": 283} {"train_loss": -8.127542495727539, "global_step": 47621, "epoch": 283} {"train_loss": -8.335314750671387, "global_step": 47622, "epoch": 283} {"train_loss": -8.097265243530273, "global_step": 47623, "epoch": 283} {"train_loss": -8.245967864990234, "global_step": 47624, "epoch": 283} {"train_loss": -8.224894523620605, "global_step": 47625, "epoch": 283} {"train_loss": -8.414268493652344, "global_step": 47626, "epoch": 283} {"train_loss": -8.337347030639648, "global_step": 47627, "epoch": 283} {"train_loss": -8.100342750549316, "global_step": 47628, "epoch": 283} {"train_loss": -7.957586288452148, "global_step": 47629, "epoch": 283} {"train_loss": -8.297672271728516, "global_step": 47630, "epoch": 283} {"train_loss": -8.242838859558105, "global_step": 47631, "epoch": 283} {"train_loss": -8.381009101867676, "global_step": 47632, "epoch": 283} {"train_loss": -8.178162574768066, "global_step": 47633, "epoch": 283} {"train_loss": -8.373619079589844, "global_step": 47634, "epoch": 283} {"train_loss": -7.897502899169922, "global_step": 47635, "epoch": 283} {"train_loss": -8.352420806884766, "global_step": 47636, "epoch": 283} {"train_loss": -8.240726470947266, "global_step": 47637, "epoch": 283} {"train_loss": -8.350513458251953, "global_step": 47638, "epoch": 283} {"train_loss": -8.210439682006836, "global_step": 47639, "epoch": 283} {"train_loss": -8.127361297607422, "global_step": 47640, "epoch": 283} {"train_loss": -8.076423645019531, "global_step": 47641, "epoch": 283} {"train_loss": -8.24810791015625, "global_step": 47642, "epoch": 283} {"train_loss": -8.1583833694458, "global_step": 47643, "epoch": 283} {"train_loss": -8.247676849365234, "global_step": 47644, "epoch": 283} {"train_loss": -8.289865493774414, "global_step": 47645, "epoch": 283} {"train_loss": -8.075154304504395, "global_step": 47646, "epoch": 283} {"train_loss": -8.356040000915527, "global_step": 47647, "epoch": 283} {"train_loss": -8.258872032165527, "global_step": 47648, "epoch": 283} {"train_loss": -8.255582809448242, "global_step": 47649, "epoch": 283} {"train_loss": -8.20991325378418, "global_step": 47650, "epoch": 283} {"train_loss": -8.545316696166992, "global_step": 47651, "epoch": 283} {"train_loss": -8.45327091217041, "global_step": 47652, "epoch": 283} {"train_loss": -8.55897045135498, "global_step": 47653, "epoch": 283} {"train_loss": -8.508978843688965, "global_step": 47654, "epoch": 283} {"train_loss": -8.228402137756348, "global_step": 47655, "epoch": 283} {"train_loss": -8.141351699829102, "global_step": 47656, "epoch": 283} {"train_loss": -8.30902099609375, "global_step": 47657, "epoch": 283} {"train_loss": -8.284412384033203, "global_step": 47658, "epoch": 283} {"train_loss": -8.368813514709473, "global_step": 47659, "epoch": 283} {"train_loss": -8.335034370422363, "global_step": 47660, "epoch": 283} {"train_loss": -8.207804679870605, "global_step": 47661, "epoch": 283} {"train_loss": -8.294757843017578, "global_step": 47662, "epoch": 283} {"train_loss": -8.378708839416504, "global_step": 47663, "epoch": 283} {"train_loss": -8.18167781829834, "global_step": 47664, "epoch": 283} {"train_loss": -8.143887519836426, "global_step": 47665, "epoch": 283} {"train_loss": -7.905333518981934, "global_step": 47666, "epoch": 283} {"train_loss": -8.403217315673828, "global_step": 47667, "epoch": 283} {"train_loss": -8.02880859375, "global_step": 47668, "epoch": 283} {"train_loss": -8.162416458129883, "global_step": 47669, "epoch": 283} {"train_loss": -8.295976638793945, "global_step": 47670, "epoch": 283} {"train_loss": -8.151588439941406, "global_step": 47671, "epoch": 283} {"train_loss": -8.243454933166504, "global_step": 47672, "epoch": 283} {"train_loss": -8.369413375854492, "global_step": 47673, "epoch": 283} {"train_loss": -8.167745590209961, "global_step": 47674, "epoch": 283} {"train_loss": -8.393166542053223, "global_step": 47675, "epoch": 283} {"train_loss": -8.312431335449219, "global_step": 47676, "epoch": 283} {"train_loss": -8.097434997558594, "global_step": 47677, "epoch": 283} {"train_loss": -7.969759464263916, "global_step": 47678, "epoch": 283} {"train_loss": -8.346893310546875, "global_step": 47679, "epoch": 283} {"train_loss": -7.998981475830078, "global_step": 47680, "epoch": 283} {"train_loss": -8.231207847595215, "global_step": 47681, "epoch": 283} {"train_loss": -8.220758438110352, "global_step": 47682, "epoch": 283} {"train_loss": -8.04820728302002, "global_step": 47683, "epoch": 283} {"train_loss": -8.243539810180664, "global_step": 47684, "epoch": 283} {"train_loss": -8.209230422973633, "global_step": 47685, "epoch": 283} {"train_loss": -8.165650367736816, "global_step": 47686, "epoch": 283} {"train_loss": -8.291990280151367, "global_step": 47687, "epoch": 283} {"train_loss": -8.245330810546875, "global_step": 47688, "epoch": 283} {"train_loss": -8.053844451904297, "global_step": 47689, "epoch": 283} {"train_loss": -8.18655014038086, "global_step": 47690, "epoch": 283} {"train_loss": -8.053733825683594, "global_step": 47691, "epoch": 283} {"train_loss": -8.190397262573242, "global_step": 47692, "epoch": 283} {"train_loss": -8.276780128479004, "global_step": 47693, "epoch": 283} {"train_loss": -8.21583080291748, "global_step": 47694, "epoch": 283} {"train_loss": -8.275554656982422, "global_step": 47695, "epoch": 283} {"train_loss": -8.36439323425293, "global_step": 47696, "epoch": 283} {"train_loss": -8.446778297424316, "global_step": 47697, "epoch": 283} {"train_loss": -8.432312965393066, "global_step": 47698, "epoch": 283} {"train_loss": -8.436903953552246, "global_step": 47699, "epoch": 283} {"train_loss": -8.535909652709961, "global_step": 47700, "epoch": 283} {"train_loss": -8.422194480895996, "global_step": 47701, "epoch": 283} {"train_loss": -8.349416732788086, "global_step": 47702, "epoch": 283} {"train_loss": -8.198055267333984, "global_step": 47703, "epoch": 283} {"train_loss": -8.364511489868164, "global_step": 47704, "epoch": 283} {"train_loss": -8.29726791381836, "global_step": 47705, "epoch": 283} {"train_loss": -8.104677200317383, "global_step": 47706, "epoch": 283} {"train_loss": -8.340657234191895, "global_step": 47707, "epoch": 283} {"train_loss": -8.039383888244629, "global_step": 47708, "epoch": 283} {"train_loss": -8.190458297729492, "global_step": 47709, "epoch": 283} {"train_loss": -8.18026351928711, "global_step": 47710, "epoch": 283} {"train_loss": -8.182541083721887, "global_step": 47711, "epoch": 283, "val_loss": 187846.046875} {"train_loss": -8.298219680786133, "global_step": 47712, "epoch": 284} {"train_loss": -8.239952087402344, "global_step": 47713, "epoch": 284} {"train_loss": -8.191985130310059, "global_step": 47714, "epoch": 284} {"train_loss": -8.535177230834961, "global_step": 47715, "epoch": 284} {"train_loss": -8.067453384399414, "global_step": 47716, "epoch": 284} {"train_loss": -8.467927932739258, "global_step": 47717, "epoch": 284} {"train_loss": -8.296602249145508, "global_step": 47718, "epoch": 284} {"train_loss": -8.144763946533203, "global_step": 47719, "epoch": 284} {"train_loss": -8.334272384643555, "global_step": 47720, "epoch": 284} {"train_loss": -8.103805541992188, "global_step": 47721, "epoch": 284} {"train_loss": -8.291828155517578, "global_step": 47722, "epoch": 284} {"train_loss": -8.244502067565918, "global_step": 47723, "epoch": 284} {"train_loss": -8.433647155761719, "global_step": 47724, "epoch": 284} {"train_loss": -8.187665939331055, "global_step": 47725, "epoch": 284} {"train_loss": -8.316030502319336, "global_step": 47726, "epoch": 284} {"train_loss": -8.012530326843262, "global_step": 47727, "epoch": 284} {"train_loss": -8.39814281463623, "global_step": 47728, "epoch": 284} {"train_loss": -8.101444244384766, "global_step": 47729, "epoch": 284} {"train_loss": -8.069571495056152, "global_step": 47730, "epoch": 284} {"train_loss": -8.078880310058594, "global_step": 47731, "epoch": 284} {"train_loss": -8.00400161743164, "global_step": 47732, "epoch": 284} {"train_loss": -7.8446550369262695, "global_step": 47733, "epoch": 284} {"train_loss": -8.025789260864258, "global_step": 47734, "epoch": 284} {"train_loss": -8.275402069091797, "global_step": 47735, "epoch": 284} {"train_loss": -8.08397388458252, "global_step": 47736, "epoch": 284} {"train_loss": -8.3540620803833, "global_step": 47737, "epoch": 284} {"train_loss": -8.1299467086792, "global_step": 47738, "epoch": 284} {"train_loss": -8.170825958251953, "global_step": 47739, "epoch": 284} {"train_loss": -8.168173789978027, "global_step": 47740, "epoch": 284} {"train_loss": -8.325074195861816, "global_step": 47741, "epoch": 284} {"train_loss": -7.925217151641846, "global_step": 47742, "epoch": 284} {"train_loss": -8.300355911254883, "global_step": 47743, "epoch": 284} {"train_loss": -8.136125564575195, "global_step": 47744, "epoch": 284} {"train_loss": -8.19676399230957, "global_step": 47745, "epoch": 284} {"train_loss": -8.073381423950195, "global_step": 47746, "epoch": 284} {"train_loss": -8.311115264892578, "global_step": 47747, "epoch": 284} {"train_loss": -7.9657979011535645, "global_step": 47748, "epoch": 284} {"train_loss": -8.282612800598145, "global_step": 47749, "epoch": 284} {"train_loss": -8.091615676879883, "global_step": 47750, "epoch": 284} {"train_loss": -8.139720916748047, "global_step": 47751, "epoch": 284} {"train_loss": -7.85888147354126, "global_step": 47752, "epoch": 284} {"train_loss": -8.313488006591797, "global_step": 47753, "epoch": 284} {"train_loss": -7.796526908874512, "global_step": 47754, "epoch": 284} {"train_loss": -8.130033493041992, "global_step": 47755, "epoch": 284} {"train_loss": -8.287927627563477, "global_step": 47756, "epoch": 284} {"train_loss": -8.414283752441406, "global_step": 47757, "epoch": 284} {"train_loss": -8.273439407348633, "global_step": 47758, "epoch": 284} {"train_loss": -8.33304500579834, "global_step": 47759, "epoch": 284} {"train_loss": -8.176431655883789, "global_step": 47760, "epoch": 284} {"train_loss": -8.22066879272461, "global_step": 47761, "epoch": 284} {"train_loss": -8.228349685668945, "global_step": 47762, "epoch": 284} {"train_loss": -8.365345001220703, "global_step": 47763, "epoch": 284} {"train_loss": -8.317383766174316, "global_step": 47764, "epoch": 284} {"train_loss": -8.349599838256836, "global_step": 47765, "epoch": 284} {"train_loss": -8.344043731689453, "global_step": 47766, "epoch": 284} {"train_loss": -8.241069793701172, "global_step": 47767, "epoch": 284} {"train_loss": -8.301979064941406, "global_step": 47768, "epoch": 284} {"train_loss": -8.275802612304688, "global_step": 47769, "epoch": 284} {"train_loss": -8.314403533935547, "global_step": 47770, "epoch": 284} {"train_loss": -8.287047386169434, "global_step": 47771, "epoch": 284} {"train_loss": -8.213927268981934, "global_step": 47772, "epoch": 284} {"train_loss": -8.44237995147705, "global_step": 47773, "epoch": 284} {"train_loss": -8.377130508422852, "global_step": 47774, "epoch": 284} {"train_loss": -8.3148193359375, "global_step": 47775, "epoch": 284} {"train_loss": -8.357754707336426, "global_step": 47776, "epoch": 284} {"train_loss": -8.135831832885742, "global_step": 47777, "epoch": 284} {"train_loss": -8.531431198120117, "global_step": 47778, "epoch": 284} {"train_loss": -8.134294509887695, "global_step": 47779, "epoch": 284} {"train_loss": -8.426179885864258, "global_step": 47780, "epoch": 284} {"train_loss": -7.939919471740723, "global_step": 47781, "epoch": 284} {"train_loss": -8.372184753417969, "global_step": 47782, "epoch": 284} {"train_loss": -8.081120491027832, "global_step": 47783, "epoch": 284} {"train_loss": -8.071447372436523, "global_step": 47784, "epoch": 284} {"train_loss": -8.178842544555664, "global_step": 47785, "epoch": 284} {"train_loss": -8.512899398803711, "global_step": 47786, "epoch": 284} {"train_loss": -8.48849868774414, "global_step": 47787, "epoch": 284} {"train_loss": -8.032682418823242, "global_step": 47788, "epoch": 284} {"train_loss": -8.150514602661133, "global_step": 47789, "epoch": 284} {"train_loss": -8.080150604248047, "global_step": 47790, "epoch": 284} {"train_loss": -8.235445022583008, "global_step": 47791, "epoch": 284} {"train_loss": -8.130131721496582, "global_step": 47792, "epoch": 284} {"train_loss": -8.239768981933594, "global_step": 47793, "epoch": 284} {"train_loss": -8.306114196777344, "global_step": 47794, "epoch": 284} {"train_loss": -8.049140930175781, "global_step": 47795, "epoch": 284} {"train_loss": -8.272144317626953, "global_step": 47796, "epoch": 284} {"train_loss": -8.330364227294922, "global_step": 47797, "epoch": 284} {"train_loss": -8.04301643371582, "global_step": 47798, "epoch": 284} {"train_loss": -8.243919372558594, "global_step": 47799, "epoch": 284} {"train_loss": -8.149378776550293, "global_step": 47800, "epoch": 284} {"train_loss": -8.384529113769531, "global_step": 47801, "epoch": 284} {"train_loss": -8.099161148071289, "global_step": 47802, "epoch": 284} {"train_loss": -8.188127517700195, "global_step": 47803, "epoch": 284} {"train_loss": -8.304006576538086, "global_step": 47804, "epoch": 284} {"train_loss": -8.34011459350586, "global_step": 47805, "epoch": 284} {"train_loss": -8.337162017822266, "global_step": 47806, "epoch": 284} {"train_loss": -8.006917953491211, "global_step": 47807, "epoch": 284} {"train_loss": -8.117145538330078, "global_step": 47808, "epoch": 284} {"train_loss": -8.255159378051758, "global_step": 47809, "epoch": 284} {"train_loss": -8.1829252243042, "global_step": 47810, "epoch": 284} {"train_loss": -8.393585205078125, "global_step": 47811, "epoch": 284} {"train_loss": -8.370473861694336, "global_step": 47812, "epoch": 284} {"train_loss": -8.054859161376953, "global_step": 47813, "epoch": 284} {"train_loss": -8.45744800567627, "global_step": 47814, "epoch": 284} {"train_loss": -8.196100234985352, "global_step": 47815, "epoch": 284} {"train_loss": -8.203483581542969, "global_step": 47816, "epoch": 284} {"train_loss": -8.133374214172363, "global_step": 47817, "epoch": 284} {"train_loss": -8.106842041015625, "global_step": 47818, "epoch": 284} {"train_loss": -8.216150283813477, "global_step": 47819, "epoch": 284} {"train_loss": -8.150246620178223, "global_step": 47820, "epoch": 284} {"train_loss": -8.09058952331543, "global_step": 47821, "epoch": 284} {"train_loss": -8.125097274780273, "global_step": 47822, "epoch": 284} {"train_loss": -8.160757064819336, "global_step": 47823, "epoch": 284} {"train_loss": -8.143562316894531, "global_step": 47824, "epoch": 284} {"train_loss": -7.886995792388916, "global_step": 47825, "epoch": 284} {"train_loss": -8.370086669921875, "global_step": 47826, "epoch": 284} {"train_loss": -8.304830551147461, "global_step": 47827, "epoch": 284} {"train_loss": -8.26329517364502, "global_step": 47828, "epoch": 284} {"train_loss": -8.244559288024902, "global_step": 47829, "epoch": 284} {"train_loss": -8.1899995803833, "global_step": 47830, "epoch": 284} {"train_loss": -7.904303550720215, "global_step": 47831, "epoch": 284} {"train_loss": -8.202978134155273, "global_step": 47832, "epoch": 284} {"train_loss": -8.003125190734863, "global_step": 47833, "epoch": 284} {"train_loss": -8.113597869873047, "global_step": 47834, "epoch": 284} {"train_loss": -7.9794721603393555, "global_step": 47835, "epoch": 284} {"train_loss": -7.842625617980957, "global_step": 47836, "epoch": 284} {"train_loss": -8.073403358459473, "global_step": 47837, "epoch": 284} {"train_loss": -8.26065444946289, "global_step": 47838, "epoch": 284} {"train_loss": -7.709568977355957, "global_step": 47839, "epoch": 284} {"train_loss": -8.166925430297852, "global_step": 47840, "epoch": 284} {"train_loss": -8.070491790771484, "global_step": 47841, "epoch": 284} {"train_loss": -8.178567886352539, "global_step": 47842, "epoch": 284} {"train_loss": -8.19696044921875, "global_step": 47843, "epoch": 284} {"train_loss": -8.314224243164062, "global_step": 47844, "epoch": 284} {"train_loss": -7.994943618774414, "global_step": 47845, "epoch": 284} {"train_loss": -8.373226165771484, "global_step": 47846, "epoch": 284} {"train_loss": -8.319441795349121, "global_step": 47847, "epoch": 284} {"train_loss": -8.304011344909668, "global_step": 47848, "epoch": 284} {"train_loss": -8.353364944458008, "global_step": 47849, "epoch": 284} {"train_loss": -8.327260971069336, "global_step": 47850, "epoch": 284} {"train_loss": -8.51143741607666, "global_step": 47851, "epoch": 284} {"train_loss": -8.224452018737793, "global_step": 47852, "epoch": 284} {"train_loss": -8.42746353149414, "global_step": 47853, "epoch": 284} {"train_loss": -8.383837699890137, "global_step": 47854, "epoch": 284} {"train_loss": -8.492362976074219, "global_step": 47855, "epoch": 284} {"train_loss": -8.390217781066895, "global_step": 47856, "epoch": 284} {"train_loss": -8.340717315673828, "global_step": 47857, "epoch": 284} {"train_loss": -8.335094451904297, "global_step": 47858, "epoch": 284} {"train_loss": -8.339693069458008, "global_step": 47859, "epoch": 284} {"train_loss": -8.08349323272705, "global_step": 47860, "epoch": 284} {"train_loss": -8.37322998046875, "global_step": 47861, "epoch": 284} {"train_loss": -8.249732971191406, "global_step": 47862, "epoch": 284} {"train_loss": -8.034737586975098, "global_step": 47863, "epoch": 284} {"train_loss": -8.31096076965332, "global_step": 47864, "epoch": 284} {"train_loss": -8.114226341247559, "global_step": 47865, "epoch": 284} {"train_loss": -7.963161945343018, "global_step": 47866, "epoch": 284} {"train_loss": -7.945549488067627, "global_step": 47867, "epoch": 284} {"train_loss": -7.975098609924316, "global_step": 47868, "epoch": 284} {"train_loss": -8.103382110595703, "global_step": 47869, "epoch": 284} {"train_loss": -8.060078620910645, "global_step": 47870, "epoch": 284} {"train_loss": -8.453285217285156, "global_step": 47871, "epoch": 284} {"train_loss": -7.836614608764648, "global_step": 47872, "epoch": 284} {"train_loss": -8.086261749267578, "global_step": 47873, "epoch": 284} {"train_loss": -8.148224830627441, "global_step": 47874, "epoch": 284} {"train_loss": -8.1343355178833, "global_step": 47875, "epoch": 284} {"train_loss": -8.291805267333984, "global_step": 47876, "epoch": 284} {"train_loss": -8.174848556518555, "global_step": 47877, "epoch": 284} {"train_loss": -8.31899642944336, "global_step": 47878, "epoch": 284} {"train_loss": -8.20599465143113, "global_step": 47879, "epoch": 284, "val_loss": 187980.125} {"train_loss": -8.240467071533203, "global_step": 47880, "epoch": 285} {"train_loss": -8.223100662231445, "global_step": 47881, "epoch": 285} {"train_loss": -8.304547309875488, "global_step": 47882, "epoch": 285} {"train_loss": -8.003928184509277, "global_step": 47883, "epoch": 285} {"train_loss": -8.487754821777344, "global_step": 47884, "epoch": 285} {"train_loss": -7.941706657409668, "global_step": 47885, "epoch": 285} {"train_loss": -8.422865867614746, "global_step": 47886, "epoch": 285} {"train_loss": -8.206277847290039, "global_step": 47887, "epoch": 285} {"train_loss": -8.338774681091309, "global_step": 47888, "epoch": 285} {"train_loss": -8.240995407104492, "global_step": 47889, "epoch": 285} {"train_loss": -8.243575096130371, "global_step": 47890, "epoch": 285} {"train_loss": -8.200151443481445, "global_step": 47891, "epoch": 285} {"train_loss": -8.451790809631348, "global_step": 47892, "epoch": 285} {"train_loss": -8.285417556762695, "global_step": 47893, "epoch": 285} {"train_loss": -8.48192024230957, "global_step": 47894, "epoch": 285} {"train_loss": -8.336042404174805, "global_step": 47895, "epoch": 285} {"train_loss": -8.393104553222656, "global_step": 47896, "epoch": 285} {"train_loss": -8.505302429199219, "global_step": 47897, "epoch": 285} {"train_loss": -8.23538589477539, "global_step": 47898, "epoch": 285} {"train_loss": -8.327573776245117, "global_step": 47899, "epoch": 285} {"train_loss": -8.487844467163086, "global_step": 47900, "epoch": 285} {"train_loss": -8.40934944152832, "global_step": 47901, "epoch": 285} {"train_loss": -8.338888168334961, "global_step": 47902, "epoch": 285} {"train_loss": -8.361917495727539, "global_step": 47903, "epoch": 285} {"train_loss": -8.44349193572998, "global_step": 47904, "epoch": 285} {"train_loss": -8.354209899902344, "global_step": 47905, "epoch": 285} {"train_loss": -8.43388557434082, "global_step": 47906, "epoch": 285} {"train_loss": -8.589622497558594, "global_step": 47907, "epoch": 285} {"train_loss": -8.114594459533691, "global_step": 47908, "epoch": 285} {"train_loss": -8.424046516418457, "global_step": 47909, "epoch": 285} {"train_loss": -8.441682815551758, "global_step": 47910, "epoch": 285} {"train_loss": -8.382472038269043, "global_step": 47911, "epoch": 285} {"train_loss": -8.471323013305664, "global_step": 47912, "epoch": 285} {"train_loss": -8.372540473937988, "global_step": 47913, "epoch": 285} {"train_loss": -8.449006080627441, "global_step": 47914, "epoch": 285} {"train_loss": -8.33767318725586, "global_step": 47915, "epoch": 285} {"train_loss": -8.271533966064453, "global_step": 47916, "epoch": 285} {"train_loss": -8.445099830627441, "global_step": 47917, "epoch": 285} {"train_loss": -8.1573486328125, "global_step": 47918, "epoch": 285} {"train_loss": -8.19406509399414, "global_step": 47919, "epoch": 285} {"train_loss": -8.547769546508789, "global_step": 47920, "epoch": 285} {"train_loss": -8.211145401000977, "global_step": 47921, "epoch": 285} {"train_loss": -8.32590103149414, "global_step": 47922, "epoch": 285} {"train_loss": -8.40462875366211, "global_step": 47923, "epoch": 285} {"train_loss": -8.208162307739258, "global_step": 47924, "epoch": 285} {"train_loss": -8.13022518157959, "global_step": 47925, "epoch": 285} {"train_loss": -8.301063537597656, "global_step": 47926, "epoch": 285} {"train_loss": -8.334678649902344, "global_step": 47927, "epoch": 285} {"train_loss": -8.246288299560547, "global_step": 47928, "epoch": 285} {"train_loss": -8.224555969238281, "global_step": 47929, "epoch": 285} {"train_loss": -8.170428276062012, "global_step": 47930, "epoch": 285} {"train_loss": -8.273422241210938, "global_step": 47931, "epoch": 285} {"train_loss": -8.249685287475586, "global_step": 47932, "epoch": 285} {"train_loss": -7.890320777893066, "global_step": 47933, "epoch": 285} {"train_loss": -8.495529174804688, "global_step": 47934, "epoch": 285} {"train_loss": -8.065783500671387, "global_step": 47935, "epoch": 285} {"train_loss": -8.16901969909668, "global_step": 47936, "epoch": 285} {"train_loss": -8.029878616333008, "global_step": 47937, "epoch": 285} {"train_loss": -8.170868873596191, "global_step": 47938, "epoch": 285} {"train_loss": -7.9846906661987305, "global_step": 47939, "epoch": 285} {"train_loss": -8.217415809631348, "global_step": 47940, "epoch": 285} {"train_loss": -8.079442977905273, "global_step": 47941, "epoch": 285} {"train_loss": -8.366175651550293, "global_step": 47942, "epoch": 285} {"train_loss": -8.216405868530273, "global_step": 47943, "epoch": 285} {"train_loss": -7.915375709533691, "global_step": 47944, "epoch": 285} {"train_loss": -7.951087951660156, "global_step": 47945, "epoch": 285} {"train_loss": -8.030599594116211, "global_step": 47946, "epoch": 285} {"train_loss": -8.336714744567871, "global_step": 47947, "epoch": 285} {"train_loss": -8.14975357055664, "global_step": 47948, "epoch": 285} {"train_loss": -8.183863639831543, "global_step": 47949, "epoch": 285} {"train_loss": -8.29056167602539, "global_step": 47950, "epoch": 285} {"train_loss": -7.897152900695801, "global_step": 47951, "epoch": 285} {"train_loss": -8.254804611206055, "global_step": 47952, "epoch": 285} {"train_loss": -8.061952590942383, "global_step": 47953, "epoch": 285} {"train_loss": -8.262826919555664, "global_step": 47954, "epoch": 285} {"train_loss": -8.277463912963867, "global_step": 47955, "epoch": 285} {"train_loss": -8.33928394317627, "global_step": 47956, "epoch": 285} {"train_loss": -8.272035598754883, "global_step": 47957, "epoch": 285} {"train_loss": -8.280171394348145, "global_step": 47958, "epoch": 285} {"train_loss": -8.262992858886719, "global_step": 47959, "epoch": 285} {"train_loss": -8.317582130432129, "global_step": 47960, "epoch": 285} {"train_loss": -8.30282974243164, "global_step": 47961, "epoch": 285} {"train_loss": -8.340900421142578, "global_step": 47962, "epoch": 285} {"train_loss": -8.318775177001953, "global_step": 47963, "epoch": 285} {"train_loss": -8.526006698608398, "global_step": 47964, "epoch": 285} {"train_loss": -8.199951171875, "global_step": 47965, "epoch": 285} {"train_loss": -8.260099411010742, "global_step": 47966, "epoch": 285} {"train_loss": -8.304571151733398, "global_step": 47967, "epoch": 285} {"train_loss": -8.110774040222168, "global_step": 47968, "epoch": 285} {"train_loss": -8.509895324707031, "global_step": 47969, "epoch": 285} {"train_loss": -8.357857704162598, "global_step": 47970, "epoch": 285} {"train_loss": -8.325216293334961, "global_step": 47971, "epoch": 285} {"train_loss": -8.300443649291992, "global_step": 47972, "epoch": 285} {"train_loss": -8.268943786621094, "global_step": 47973, "epoch": 285} {"train_loss": -8.278743743896484, "global_step": 47974, "epoch": 285} {"train_loss": -8.36882209777832, "global_step": 47975, "epoch": 285} {"train_loss": -8.078361511230469, "global_step": 47976, "epoch": 285} {"train_loss": -8.047126770019531, "global_step": 47977, "epoch": 285} {"train_loss": -8.418944358825684, "global_step": 47978, "epoch": 285} {"train_loss": -8.201189041137695, "global_step": 47979, "epoch": 285} {"train_loss": -8.318466186523438, "global_step": 47980, "epoch": 285} {"train_loss": -8.323880195617676, "global_step": 47981, "epoch": 285} {"train_loss": -8.190804481506348, "global_step": 47982, "epoch": 285} {"train_loss": -8.158502578735352, "global_step": 47983, "epoch": 285} {"train_loss": -8.261598587036133, "global_step": 47984, "epoch": 285} {"train_loss": -7.772050857543945, "global_step": 47985, "epoch": 285} {"train_loss": -8.345573425292969, "global_step": 47986, "epoch": 285} {"train_loss": -8.09614372253418, "global_step": 47987, "epoch": 285} {"train_loss": -8.20868968963623, "global_step": 47988, "epoch": 285} {"train_loss": -8.419002532958984, "global_step": 47989, "epoch": 285} {"train_loss": -8.103763580322266, "global_step": 47990, "epoch": 285} {"train_loss": -8.178024291992188, "global_step": 47991, "epoch": 285} {"train_loss": -8.335107803344727, "global_step": 47992, "epoch": 285} {"train_loss": -8.162602424621582, "global_step": 47993, "epoch": 285} {"train_loss": -8.177999496459961, "global_step": 47994, "epoch": 285} {"train_loss": -8.177366256713867, "global_step": 47995, "epoch": 285} {"train_loss": -8.02220344543457, "global_step": 47996, "epoch": 285} {"train_loss": -8.332498550415039, "global_step": 47997, "epoch": 285} {"train_loss": -8.260290145874023, "global_step": 47998, "epoch": 285} {"train_loss": -8.348989486694336, "global_step": 47999, "epoch": 285} {"train_loss": -7.919631004333496, "global_step": 48000, "epoch": 285} {"train_loss": -8.129899978637695, "global_step": 48001, "epoch": 285} {"train_loss": -8.126165390014648, "global_step": 48002, "epoch": 285} {"train_loss": -8.43841552734375, "global_step": 48003, "epoch": 285} {"train_loss": -7.994476318359375, "global_step": 48004, "epoch": 285} {"train_loss": -8.424108505249023, "global_step": 48005, "epoch": 285} {"train_loss": -8.111157417297363, "global_step": 48006, "epoch": 285} {"train_loss": -8.296125411987305, "global_step": 48007, "epoch": 285} {"train_loss": -8.206762313842773, "global_step": 48008, "epoch": 285} {"train_loss": -8.262544631958008, "global_step": 48009, "epoch": 285} {"train_loss": -8.174203872680664, "global_step": 48010, "epoch": 285} {"train_loss": -8.213988304138184, "global_step": 48011, "epoch": 285} {"train_loss": -8.18177604675293, "global_step": 48012, "epoch": 285} {"train_loss": -8.083562850952148, "global_step": 48013, "epoch": 285} {"train_loss": -8.149211883544922, "global_step": 48014, "epoch": 285} {"train_loss": -8.120826721191406, "global_step": 48015, "epoch": 285} {"train_loss": -7.978353023529053, "global_step": 48016, "epoch": 285} {"train_loss": -8.155664443969727, "global_step": 48017, "epoch": 285} {"train_loss": -8.120448112487793, "global_step": 48018, "epoch": 285} {"train_loss": -8.12278938293457, "global_step": 48019, "epoch": 285} {"train_loss": -8.377279281616211, "global_step": 48020, "epoch": 285} {"train_loss": -8.157927513122559, "global_step": 48021, "epoch": 285} {"train_loss": -8.288797378540039, "global_step": 48022, "epoch": 285} {"train_loss": -8.082808494567871, "global_step": 48023, "epoch": 285} {"train_loss": -8.091047286987305, "global_step": 48024, "epoch": 285} {"train_loss": -8.25360107421875, "global_step": 48025, "epoch": 285} {"train_loss": -8.104273796081543, "global_step": 48026, "epoch": 285} {"train_loss": -8.268169403076172, "global_step": 48027, "epoch": 285} {"train_loss": -7.93117094039917, "global_step": 48028, "epoch": 285} {"train_loss": -8.142548561096191, "global_step": 48029, "epoch": 285} {"train_loss": -8.256357192993164, "global_step": 48030, "epoch": 285} {"train_loss": -8.15231990814209, "global_step": 48031, "epoch": 285} {"train_loss": -8.15135669708252, "global_step": 48032, "epoch": 285} {"train_loss": -8.1148099899292, "global_step": 48033, "epoch": 285} {"train_loss": -8.013710021972656, "global_step": 48034, "epoch": 285} {"train_loss": -8.27806568145752, "global_step": 48035, "epoch": 285} {"train_loss": -8.275893211364746, "global_step": 48036, "epoch": 285} {"train_loss": -8.004554748535156, "global_step": 48037, "epoch": 285} {"train_loss": -8.295818328857422, "global_step": 48038, "epoch": 285} {"train_loss": -8.210195541381836, "global_step": 48039, "epoch": 285} {"train_loss": -8.251245498657227, "global_step": 48040, "epoch": 285} {"train_loss": -8.246487617492676, "global_step": 48041, "epoch": 285} {"train_loss": -8.336578369140625, "global_step": 48042, "epoch": 285} {"train_loss": -7.96553897857666, "global_step": 48043, "epoch": 285} {"train_loss": -8.287078857421875, "global_step": 48044, "epoch": 285} {"train_loss": -8.11172103881836, "global_step": 48045, "epoch": 285} {"train_loss": -8.180917739868164, "global_step": 48046, "epoch": 285} {"train_loss": -8.236619154612223, "global_step": 48047, "epoch": 285, "val_loss": 188668.46875, "train_action_mse_error": 7.20053243637085} {"train_loss": -8.207723617553711, "global_step": 48048, "epoch": 286} {"train_loss": -8.402313232421875, "global_step": 48049, "epoch": 286} {"train_loss": -8.101375579833984, "global_step": 48050, "epoch": 286} {"train_loss": -8.255376815795898, "global_step": 48051, "epoch": 286} {"train_loss": -7.8735527992248535, "global_step": 48052, "epoch": 286} {"train_loss": -8.275115013122559, "global_step": 48053, "epoch": 286} {"train_loss": -8.066547393798828, "global_step": 48054, "epoch": 286} {"train_loss": -7.861922264099121, "global_step": 48055, "epoch": 286} {"train_loss": -7.9545769691467285, "global_step": 48056, "epoch": 286} {"train_loss": -8.12074089050293, "global_step": 48057, "epoch": 286} {"train_loss": -8.013668060302734, "global_step": 48058, "epoch": 286} {"train_loss": -7.7025227546691895, "global_step": 48059, "epoch": 286} {"train_loss": -8.160645484924316, "global_step": 48060, "epoch": 286} {"train_loss": -7.971148490905762, "global_step": 48061, "epoch": 286} {"train_loss": -8.264579772949219, "global_step": 48062, "epoch": 286} {"train_loss": -8.19183349609375, "global_step": 48063, "epoch": 286} {"train_loss": -7.743836402893066, "global_step": 48064, "epoch": 286} {"train_loss": -8.217212677001953, "global_step": 48065, "epoch": 286} {"train_loss": -7.880652904510498, "global_step": 48066, "epoch": 286} {"train_loss": -8.107254028320312, "global_step": 48067, "epoch": 286} {"train_loss": -8.062494277954102, "global_step": 48068, "epoch": 286} {"train_loss": -8.198083877563477, "global_step": 48069, "epoch": 286} {"train_loss": -8.144500732421875, "global_step": 48070, "epoch": 286} {"train_loss": -8.104597091674805, "global_step": 48071, "epoch": 286} {"train_loss": -8.219217300415039, "global_step": 48072, "epoch": 286} {"train_loss": -8.397388458251953, "global_step": 48073, "epoch": 286} {"train_loss": -8.196577072143555, "global_step": 48074, "epoch": 286} {"train_loss": -8.380099296569824, "global_step": 48075, "epoch": 286} {"train_loss": -8.31623363494873, "global_step": 48076, "epoch": 286} {"train_loss": -8.185891151428223, "global_step": 48077, "epoch": 286} {"train_loss": -8.348146438598633, "global_step": 48078, "epoch": 286} {"train_loss": -8.582889556884766, "global_step": 48079, "epoch": 286} {"train_loss": -8.22656536102295, "global_step": 48080, "epoch": 286} {"train_loss": -8.32878303527832, "global_step": 48081, "epoch": 286} {"train_loss": -8.231639862060547, "global_step": 48082, "epoch": 286} {"train_loss": -8.496350288391113, "global_step": 48083, "epoch": 286} {"train_loss": -8.288469314575195, "global_step": 48084, "epoch": 286} {"train_loss": -8.337669372558594, "global_step": 48085, "epoch": 286} {"train_loss": -8.276086807250977, "global_step": 48086, "epoch": 286} {"train_loss": -8.367429733276367, "global_step": 48087, "epoch": 286} {"train_loss": -8.48410415649414, "global_step": 48088, "epoch": 286} {"train_loss": -8.534765243530273, "global_step": 48089, "epoch": 286} {"train_loss": -8.5682373046875, "global_step": 48090, "epoch": 286} {"train_loss": -8.206830978393555, "global_step": 48091, "epoch": 286} {"train_loss": -8.522977828979492, "global_step": 48092, "epoch": 286} {"train_loss": -8.421929359436035, "global_step": 48093, "epoch": 286} {"train_loss": -8.417118072509766, "global_step": 48094, "epoch": 286} {"train_loss": -8.22038459777832, "global_step": 48095, "epoch": 286} {"train_loss": -8.556795120239258, "global_step": 48096, "epoch": 286} {"train_loss": -8.469392776489258, "global_step": 48097, "epoch": 286} {"train_loss": -8.514229774475098, "global_step": 48098, "epoch": 286} {"train_loss": -8.47824764251709, "global_step": 48099, "epoch": 286} {"train_loss": -8.506662368774414, "global_step": 48100, "epoch": 286} {"train_loss": -8.58615493774414, "global_step": 48101, "epoch": 286} {"train_loss": -8.329916000366211, "global_step": 48102, "epoch": 286} {"train_loss": -8.32365608215332, "global_step": 48103, "epoch": 286} {"train_loss": -8.534734725952148, "global_step": 48104, "epoch": 286} {"train_loss": -8.009074211120605, "global_step": 48105, "epoch": 286} {"train_loss": -8.451041221618652, "global_step": 48106, "epoch": 286} {"train_loss": -8.25651741027832, "global_step": 48107, "epoch": 286} {"train_loss": -8.279107093811035, "global_step": 48108, "epoch": 286} {"train_loss": -8.054489135742188, "global_step": 48109, "epoch": 286} {"train_loss": -8.234864234924316, "global_step": 48110, "epoch": 286} {"train_loss": -7.726844310760498, "global_step": 48111, "epoch": 286} {"train_loss": -8.35066032409668, "global_step": 48112, "epoch": 286} {"train_loss": -8.257963180541992, "global_step": 48113, "epoch": 286} {"train_loss": -8.27880859375, "global_step": 48114, "epoch": 286} {"train_loss": -8.1262845993042, "global_step": 48115, "epoch": 286} {"train_loss": -8.228134155273438, "global_step": 48116, "epoch": 286} {"train_loss": -7.8819732666015625, "global_step": 48117, "epoch": 286} {"train_loss": -8.243053436279297, "global_step": 48118, "epoch": 286} {"train_loss": -7.999007225036621, "global_step": 48119, "epoch": 286} {"train_loss": -8.138757705688477, "global_step": 48120, "epoch": 286} {"train_loss": -8.032000541687012, "global_step": 48121, "epoch": 286} {"train_loss": -7.809450149536133, "global_step": 48122, "epoch": 286} {"train_loss": -8.298337936401367, "global_step": 48123, "epoch": 286} {"train_loss": -7.961431503295898, "global_step": 48124, "epoch": 286} {"train_loss": -8.009231567382812, "global_step": 48125, "epoch": 286} {"train_loss": -8.116352081298828, "global_step": 48126, "epoch": 286} {"train_loss": -8.303545951843262, "global_step": 48127, "epoch": 286} {"train_loss": -8.288619995117188, "global_step": 48128, "epoch": 286} {"train_loss": -8.165359497070312, "global_step": 48129, "epoch": 286} {"train_loss": -8.424070358276367, "global_step": 48130, "epoch": 286} {"train_loss": -8.33961009979248, "global_step": 48131, "epoch": 286} {"train_loss": -8.158227920532227, "global_step": 48132, "epoch": 286} {"train_loss": -8.331476211547852, "global_step": 48133, "epoch": 286} {"train_loss": -8.424235343933105, "global_step": 48134, "epoch": 286} {"train_loss": -8.34101676940918, "global_step": 48135, "epoch": 286} {"train_loss": -8.245335578918457, "global_step": 48136, "epoch": 286} {"train_loss": -8.350435256958008, "global_step": 48137, "epoch": 286} {"train_loss": -8.238544464111328, "global_step": 48138, "epoch": 286} {"train_loss": -8.216713905334473, "global_step": 48139, "epoch": 286} {"train_loss": -8.293818473815918, "global_step": 48140, "epoch": 286} {"train_loss": -8.300249099731445, "global_step": 48141, "epoch": 286} {"train_loss": -8.28098201751709, "global_step": 48142, "epoch": 286} {"train_loss": -8.248620986938477, "global_step": 48143, "epoch": 286} {"train_loss": -8.101744651794434, "global_step": 48144, "epoch": 286} {"train_loss": -7.920084476470947, "global_step": 48145, "epoch": 286} {"train_loss": -7.933647632598877, "global_step": 48146, "epoch": 286} {"train_loss": -8.25424575805664, "global_step": 48147, "epoch": 286} {"train_loss": -8.254908561706543, "global_step": 48148, "epoch": 286} {"train_loss": -8.322704315185547, "global_step": 48149, "epoch": 286} {"train_loss": -8.220327377319336, "global_step": 48150, "epoch": 286} {"train_loss": -8.155238151550293, "global_step": 48151, "epoch": 286} {"train_loss": -8.408982276916504, "global_step": 48152, "epoch": 286} {"train_loss": -8.197342872619629, "global_step": 48153, "epoch": 286} {"train_loss": -8.28331184387207, "global_step": 48154, "epoch": 286} {"train_loss": -8.245990753173828, "global_step": 48155, "epoch": 286} {"train_loss": -8.300410270690918, "global_step": 48156, "epoch": 286} {"train_loss": -8.26633071899414, "global_step": 48157, "epoch": 286} {"train_loss": -8.29351806640625, "global_step": 48158, "epoch": 286} {"train_loss": -8.017867088317871, "global_step": 48159, "epoch": 286} {"train_loss": -8.185796737670898, "global_step": 48160, "epoch": 286} {"train_loss": -8.235610961914062, "global_step": 48161, "epoch": 286} {"train_loss": -7.818230628967285, "global_step": 48162, "epoch": 286} {"train_loss": -8.408010482788086, "global_step": 48163, "epoch": 286} {"train_loss": -8.212159156799316, "global_step": 48164, "epoch": 286} {"train_loss": -8.169332504272461, "global_step": 48165, "epoch": 286} {"train_loss": -8.270200729370117, "global_step": 48166, "epoch": 286} {"train_loss": -8.197711944580078, "global_step": 48167, "epoch": 286} {"train_loss": -8.262897491455078, "global_step": 48168, "epoch": 286} {"train_loss": -8.081647872924805, "global_step": 48169, "epoch": 286} {"train_loss": -8.09262752532959, "global_step": 48170, "epoch": 286} {"train_loss": -8.281496047973633, "global_step": 48171, "epoch": 286} {"train_loss": -7.787172794342041, "global_step": 48172, "epoch": 286} {"train_loss": -8.143210411071777, "global_step": 48173, "epoch": 286} {"train_loss": -8.016651153564453, "global_step": 48174, "epoch": 286} {"train_loss": -8.329385757446289, "global_step": 48175, "epoch": 286} {"train_loss": -7.879833221435547, "global_step": 48176, "epoch": 286} {"train_loss": -8.282893180847168, "global_step": 48177, "epoch": 286} {"train_loss": -7.904632091522217, "global_step": 48178, "epoch": 286} {"train_loss": -8.26896858215332, "global_step": 48179, "epoch": 286} {"train_loss": -7.935483932495117, "global_step": 48180, "epoch": 286} {"train_loss": -8.083250999450684, "global_step": 48181, "epoch": 286} {"train_loss": -7.915586471557617, "global_step": 48182, "epoch": 286} {"train_loss": -8.039274215698242, "global_step": 48183, "epoch": 286} {"train_loss": -8.170797348022461, "global_step": 48184, "epoch": 286} {"train_loss": -7.91050386428833, "global_step": 48185, "epoch": 286} {"train_loss": -8.091456413269043, "global_step": 48186, "epoch": 286} {"train_loss": -7.9149885177612305, "global_step": 48187, "epoch": 286} {"train_loss": -8.154762268066406, "global_step": 48188, "epoch": 286} {"train_loss": -7.831460952758789, "global_step": 48189, "epoch": 286} {"train_loss": -7.925910949707031, "global_step": 48190, "epoch": 286} {"train_loss": -8.1614990234375, "global_step": 48191, "epoch": 286} {"train_loss": -8.120124816894531, "global_step": 48192, "epoch": 286} {"train_loss": -8.300329208374023, "global_step": 48193, "epoch": 286} {"train_loss": -8.206524848937988, "global_step": 48194, "epoch": 286} {"train_loss": -8.187784194946289, "global_step": 48195, "epoch": 286} {"train_loss": -8.142248153686523, "global_step": 48196, "epoch": 286} {"train_loss": -7.941573143005371, "global_step": 48197, "epoch": 286} {"train_loss": -8.177928924560547, "global_step": 48198, "epoch": 286} {"train_loss": -8.022014617919922, "global_step": 48199, "epoch": 286} {"train_loss": -8.323925971984863, "global_step": 48200, "epoch": 286} {"train_loss": -8.157585144042969, "global_step": 48201, "epoch": 286} {"train_loss": -8.35159969329834, "global_step": 48202, "epoch": 286} {"train_loss": -8.377254486083984, "global_step": 48203, "epoch": 286} {"train_loss": -8.06788444519043, "global_step": 48204, "epoch": 286} {"train_loss": -8.511528968811035, "global_step": 48205, "epoch": 286} {"train_loss": -8.172088623046875, "global_step": 48206, "epoch": 286} {"train_loss": -8.283187866210938, "global_step": 48207, "epoch": 286} {"train_loss": -8.49405288696289, "global_step": 48208, "epoch": 286} {"train_loss": -8.336071014404297, "global_step": 48209, "epoch": 286} {"train_loss": -8.385814666748047, "global_step": 48210, "epoch": 286} {"train_loss": -8.250908851623535, "global_step": 48211, "epoch": 286} {"train_loss": -8.368856430053711, "global_step": 48212, "epoch": 286} {"train_loss": -8.286516189575195, "global_step": 48213, "epoch": 286} {"train_loss": -8.149407386779785, "global_step": 48214, "epoch": 286} {"train_loss": -8.205145177387056, "global_step": 48215, "epoch": 286, "val_loss": 186820.6875} {"train_loss": -8.132967948913574, "global_step": 48216, "epoch": 287} {"train_loss": -8.12760066986084, "global_step": 48217, "epoch": 287} {"train_loss": -8.233996391296387, "global_step": 48218, "epoch": 287} {"train_loss": -7.976398468017578, "global_step": 48219, "epoch": 287} {"train_loss": -8.413599967956543, "global_step": 48220, "epoch": 287} {"train_loss": -8.22450065612793, "global_step": 48221, "epoch": 287} {"train_loss": -8.309375762939453, "global_step": 48222, "epoch": 287} {"train_loss": -8.415994644165039, "global_step": 48223, "epoch": 287} {"train_loss": -8.172503471374512, "global_step": 48224, "epoch": 287} {"train_loss": -8.463791847229004, "global_step": 48225, "epoch": 287} {"train_loss": -8.207643508911133, "global_step": 48226, "epoch": 287} {"train_loss": -8.335777282714844, "global_step": 48227, "epoch": 287} {"train_loss": -8.216596603393555, "global_step": 48228, "epoch": 287} {"train_loss": -8.165771484375, "global_step": 48229, "epoch": 287} {"train_loss": -8.343795776367188, "global_step": 48230, "epoch": 287} {"train_loss": -8.283769607543945, "global_step": 48231, "epoch": 287} {"train_loss": -8.122245788574219, "global_step": 48232, "epoch": 287} {"train_loss": -8.27414608001709, "global_step": 48233, "epoch": 287} {"train_loss": -8.40588665008545, "global_step": 48234, "epoch": 287} {"train_loss": -8.239828109741211, "global_step": 48235, "epoch": 287} {"train_loss": -8.269819259643555, "global_step": 48236, "epoch": 287} {"train_loss": -8.106593132019043, "global_step": 48237, "epoch": 287} {"train_loss": -8.179813385009766, "global_step": 48238, "epoch": 287} {"train_loss": -7.9967803955078125, "global_step": 48239, "epoch": 287} {"train_loss": -8.306815147399902, "global_step": 48240, "epoch": 287} {"train_loss": -7.718994617462158, "global_step": 48241, "epoch": 287} {"train_loss": -8.210247039794922, "global_step": 48242, "epoch": 287} {"train_loss": -8.052003860473633, "global_step": 48243, "epoch": 287} {"train_loss": -8.221888542175293, "global_step": 48244, "epoch": 287} {"train_loss": -8.146942138671875, "global_step": 48245, "epoch": 287} {"train_loss": -8.319375991821289, "global_step": 48246, "epoch": 287} {"train_loss": -8.186728477478027, "global_step": 48247, "epoch": 287} {"train_loss": -8.071682929992676, "global_step": 48248, "epoch": 287} {"train_loss": -8.300990104675293, "global_step": 48249, "epoch": 287} {"train_loss": -8.11345386505127, "global_step": 48250, "epoch": 287} {"train_loss": -8.303140640258789, "global_step": 48251, "epoch": 287} {"train_loss": -8.226090431213379, "global_step": 48252, "epoch": 287} {"train_loss": -8.419195175170898, "global_step": 48253, "epoch": 287} {"train_loss": -8.091348648071289, "global_step": 48254, "epoch": 287} {"train_loss": -8.274656295776367, "global_step": 48255, "epoch": 287} {"train_loss": -8.357758522033691, "global_step": 48256, "epoch": 287} {"train_loss": -8.31471061706543, "global_step": 48257, "epoch": 287} {"train_loss": -8.141260147094727, "global_step": 48258, "epoch": 287} {"train_loss": -8.129324913024902, "global_step": 48259, "epoch": 287} {"train_loss": -8.307575225830078, "global_step": 48260, "epoch": 287} {"train_loss": -8.22205924987793, "global_step": 48261, "epoch": 287} {"train_loss": -8.405282974243164, "global_step": 48262, "epoch": 287} {"train_loss": -8.226459503173828, "global_step": 48263, "epoch": 287} {"train_loss": -8.375479698181152, "global_step": 48264, "epoch": 287} {"train_loss": -8.343328475952148, "global_step": 48265, "epoch": 287} {"train_loss": -8.347981452941895, "global_step": 48266, "epoch": 287} {"train_loss": -8.258318901062012, "global_step": 48267, "epoch": 287} {"train_loss": -8.028692245483398, "global_step": 48268, "epoch": 287} {"train_loss": -8.221437454223633, "global_step": 48269, "epoch": 287} {"train_loss": -8.404841423034668, "global_step": 48270, "epoch": 287} {"train_loss": -8.105183601379395, "global_step": 48271, "epoch": 287} {"train_loss": -8.363792419433594, "global_step": 48272, "epoch": 287} {"train_loss": -8.346687316894531, "global_step": 48273, "epoch": 287} {"train_loss": -8.410707473754883, "global_step": 48274, "epoch": 287} {"train_loss": -8.446466445922852, "global_step": 48275, "epoch": 287} {"train_loss": -8.313913345336914, "global_step": 48276, "epoch": 287} {"train_loss": -8.292461395263672, "global_step": 48277, "epoch": 287} {"train_loss": -8.464286804199219, "global_step": 48278, "epoch": 287} {"train_loss": -8.042204856872559, "global_step": 48279, "epoch": 287} {"train_loss": -8.131025314331055, "global_step": 48280, "epoch": 287} {"train_loss": -8.084573745727539, "global_step": 48281, "epoch": 287} {"train_loss": -8.201278686523438, "global_step": 48282, "epoch": 287} {"train_loss": -7.999411582946777, "global_step": 48283, "epoch": 287} {"train_loss": -8.182557106018066, "global_step": 48284, "epoch": 287} {"train_loss": -8.003482818603516, "global_step": 48285, "epoch": 287} {"train_loss": -8.37370491027832, "global_step": 48286, "epoch": 287} {"train_loss": -8.125377655029297, "global_step": 48287, "epoch": 287} {"train_loss": -8.091585159301758, "global_step": 48288, "epoch": 287} {"train_loss": -8.090140342712402, "global_step": 48289, "epoch": 287} {"train_loss": -8.119680404663086, "global_step": 48290, "epoch": 287} {"train_loss": -8.309162139892578, "global_step": 48291, "epoch": 287} {"train_loss": -8.063782691955566, "global_step": 48292, "epoch": 287} {"train_loss": -8.205101013183594, "global_step": 48293, "epoch": 287} {"train_loss": -8.316961288452148, "global_step": 48294, "epoch": 287} {"train_loss": -8.163692474365234, "global_step": 48295, "epoch": 287} {"train_loss": -8.24952220916748, "global_step": 48296, "epoch": 287} {"train_loss": -8.403511047363281, "global_step": 48297, "epoch": 287} {"train_loss": -8.339153289794922, "global_step": 48298, "epoch": 287} {"train_loss": -8.226601600646973, "global_step": 48299, "epoch": 287} {"train_loss": -8.064433097839355, "global_step": 48300, "epoch": 287} {"train_loss": -8.093658447265625, "global_step": 48301, "epoch": 287} {"train_loss": -8.170204162597656, "global_step": 48302, "epoch": 287} {"train_loss": -8.14856243133545, "global_step": 48303, "epoch": 287} {"train_loss": -8.397638320922852, "global_step": 48304, "epoch": 287} {"train_loss": -8.1219482421875, "global_step": 48305, "epoch": 287} {"train_loss": -8.293285369873047, "global_step": 48306, "epoch": 287} {"train_loss": -8.07867431640625, "global_step": 48307, "epoch": 287} {"train_loss": -8.189473152160645, "global_step": 48308, "epoch": 287} {"train_loss": -8.25075912475586, "global_step": 48309, "epoch": 287} {"train_loss": -8.428979873657227, "global_step": 48310, "epoch": 287} {"train_loss": -8.171396255493164, "global_step": 48311, "epoch": 287} {"train_loss": -8.371953964233398, "global_step": 48312, "epoch": 287} {"train_loss": -8.282880783081055, "global_step": 48313, "epoch": 287} {"train_loss": -8.209858894348145, "global_step": 48314, "epoch": 287} {"train_loss": -8.36417007446289, "global_step": 48315, "epoch": 287} {"train_loss": -8.37340259552002, "global_step": 48316, "epoch": 287} {"train_loss": -8.34678840637207, "global_step": 48317, "epoch": 287} {"train_loss": -8.017526626586914, "global_step": 48318, "epoch": 287} {"train_loss": -8.124576568603516, "global_step": 48319, "epoch": 287} {"train_loss": -8.368465423583984, "global_step": 48320, "epoch": 287} {"train_loss": -8.162928581237793, "global_step": 48321, "epoch": 287} {"train_loss": -8.313610076904297, "global_step": 48322, "epoch": 287} {"train_loss": -8.261354446411133, "global_step": 48323, "epoch": 287} {"train_loss": -8.385894775390625, "global_step": 48324, "epoch": 287} {"train_loss": -8.134347915649414, "global_step": 48325, "epoch": 287} {"train_loss": -8.308530807495117, "global_step": 48326, "epoch": 287} {"train_loss": -8.369564056396484, "global_step": 48327, "epoch": 287} {"train_loss": -7.939330101013184, "global_step": 48328, "epoch": 287} {"train_loss": -8.276047706604004, "global_step": 48329, "epoch": 287} {"train_loss": -8.21414566040039, "global_step": 48330, "epoch": 287} {"train_loss": -8.101480484008789, "global_step": 48331, "epoch": 287} {"train_loss": -8.237224578857422, "global_step": 48332, "epoch": 287} {"train_loss": -8.245502471923828, "global_step": 48333, "epoch": 287} {"train_loss": -8.355852127075195, "global_step": 48334, "epoch": 287} {"train_loss": -8.346609115600586, "global_step": 48335, "epoch": 287} {"train_loss": -8.081995964050293, "global_step": 48336, "epoch": 287} {"train_loss": -8.173385620117188, "global_step": 48337, "epoch": 287} {"train_loss": -8.304060935974121, "global_step": 48338, "epoch": 287} {"train_loss": -8.29901123046875, "global_step": 48339, "epoch": 287} {"train_loss": -8.51125717163086, "global_step": 48340, "epoch": 287} {"train_loss": -8.324260711669922, "global_step": 48341, "epoch": 287} {"train_loss": -8.189699172973633, "global_step": 48342, "epoch": 287} {"train_loss": -8.173421859741211, "global_step": 48343, "epoch": 287} {"train_loss": -8.34621810913086, "global_step": 48344, "epoch": 287} {"train_loss": -8.327844619750977, "global_step": 48345, "epoch": 287} {"train_loss": -8.050239562988281, "global_step": 48346, "epoch": 287} {"train_loss": -8.229669570922852, "global_step": 48347, "epoch": 287} {"train_loss": -8.113101959228516, "global_step": 48348, "epoch": 287} {"train_loss": -8.195121765136719, "global_step": 48349, "epoch": 287} {"train_loss": -7.949172019958496, "global_step": 48350, "epoch": 287} {"train_loss": -8.355243682861328, "global_step": 48351, "epoch": 287} {"train_loss": -8.316246032714844, "global_step": 48352, "epoch": 287} {"train_loss": -8.226343154907227, "global_step": 48353, "epoch": 287} {"train_loss": -8.244834899902344, "global_step": 48354, "epoch": 287} {"train_loss": -8.088415145874023, "global_step": 48355, "epoch": 287} {"train_loss": -8.411178588867188, "global_step": 48356, "epoch": 287} {"train_loss": -8.30545425415039, "global_step": 48357, "epoch": 287} {"train_loss": -8.295316696166992, "global_step": 48358, "epoch": 287} {"train_loss": -8.2201566696167, "global_step": 48359, "epoch": 287} {"train_loss": -8.355411529541016, "global_step": 48360, "epoch": 287} {"train_loss": -8.176681518554688, "global_step": 48361, "epoch": 287} {"train_loss": -8.360334396362305, "global_step": 48362, "epoch": 287} {"train_loss": -8.452804565429688, "global_step": 48363, "epoch": 287} {"train_loss": -8.153688430786133, "global_step": 48364, "epoch": 287} {"train_loss": -8.367527961730957, "global_step": 48365, "epoch": 287} {"train_loss": -8.302257537841797, "global_step": 48366, "epoch": 287} {"train_loss": -8.366558074951172, "global_step": 48367, "epoch": 287} {"train_loss": -8.321700096130371, "global_step": 48368, "epoch": 287} {"train_loss": -8.508353233337402, "global_step": 48369, "epoch": 287} {"train_loss": -8.057099342346191, "global_step": 48370, "epoch": 287} {"train_loss": -8.49848747253418, "global_step": 48371, "epoch": 287} {"train_loss": -8.182875633239746, "global_step": 48372, "epoch": 287} {"train_loss": -8.42292308807373, "global_step": 48373, "epoch": 287} {"train_loss": -8.18562126159668, "global_step": 48374, "epoch": 287} {"train_loss": -8.267838478088379, "global_step": 48375, "epoch": 287} {"train_loss": -8.250160217285156, "global_step": 48376, "epoch": 287} {"train_loss": -8.089181900024414, "global_step": 48377, "epoch": 287} {"train_loss": -8.35322380065918, "global_step": 48378, "epoch": 287} {"train_loss": -8.45085334777832, "global_step": 48379, "epoch": 287} {"train_loss": -7.927909851074219, "global_step": 48380, "epoch": 287} {"train_loss": -8.281570434570312, "global_step": 48381, "epoch": 287} {"train_loss": -8.136110305786133, "global_step": 48382, "epoch": 287} {"train_loss": -8.23849044811158, "global_step": 48383, "epoch": 287, "val_loss": 187521.78125} {"train_loss": -8.425762176513672, "global_step": 48384, "epoch": 288} {"train_loss": -8.183626174926758, "global_step": 48385, "epoch": 288} {"train_loss": -8.562515258789062, "global_step": 48386, "epoch": 288} {"train_loss": -8.231642723083496, "global_step": 48387, "epoch": 288} {"train_loss": -8.249490737915039, "global_step": 48388, "epoch": 288} {"train_loss": -8.134130477905273, "global_step": 48389, "epoch": 288} {"train_loss": -8.381786346435547, "global_step": 48390, "epoch": 288} {"train_loss": -8.499351501464844, "global_step": 48391, "epoch": 288} {"train_loss": -7.903861045837402, "global_step": 48392, "epoch": 288} {"train_loss": -8.127540588378906, "global_step": 48393, "epoch": 288} {"train_loss": -8.265541076660156, "global_step": 48394, "epoch": 288} {"train_loss": -7.840235710144043, "global_step": 48395, "epoch": 288} {"train_loss": -8.004790306091309, "global_step": 48396, "epoch": 288} {"train_loss": -8.135540008544922, "global_step": 48397, "epoch": 288} {"train_loss": -7.996918678283691, "global_step": 48398, "epoch": 288} {"train_loss": -8.099127769470215, "global_step": 48399, "epoch": 288} {"train_loss": -7.850368499755859, "global_step": 48400, "epoch": 288} {"train_loss": -8.104570388793945, "global_step": 48401, "epoch": 288} {"train_loss": -7.756309509277344, "global_step": 48402, "epoch": 288} {"train_loss": -8.19847297668457, "global_step": 48403, "epoch": 288} {"train_loss": -8.181246757507324, "global_step": 48404, "epoch": 288} {"train_loss": -7.994659900665283, "global_step": 48405, "epoch": 288} {"train_loss": -7.9331865310668945, "global_step": 48406, "epoch": 288} {"train_loss": -7.87351131439209, "global_step": 48407, "epoch": 288} {"train_loss": -8.131646156311035, "global_step": 48408, "epoch": 288} {"train_loss": -8.109859466552734, "global_step": 48409, "epoch": 288} {"train_loss": -8.019638061523438, "global_step": 48410, "epoch": 288} {"train_loss": -8.017220497131348, "global_step": 48411, "epoch": 288} {"train_loss": -8.076618194580078, "global_step": 48412, "epoch": 288} {"train_loss": -8.039643287658691, "global_step": 48413, "epoch": 288} {"train_loss": -8.097297668457031, "global_step": 48414, "epoch": 288} {"train_loss": -8.187919616699219, "global_step": 48415, "epoch": 288} {"train_loss": -8.066350936889648, "global_step": 48416, "epoch": 288} {"train_loss": -8.056971549987793, "global_step": 48417, "epoch": 288} {"train_loss": -8.135330200195312, "global_step": 48418, "epoch": 288} {"train_loss": -8.375776290893555, "global_step": 48419, "epoch": 288} {"train_loss": -8.328544616699219, "global_step": 48420, "epoch": 288} {"train_loss": -8.264503479003906, "global_step": 48421, "epoch": 288} {"train_loss": -8.291139602661133, "global_step": 48422, "epoch": 288} {"train_loss": -8.20009708404541, "global_step": 48423, "epoch": 288} {"train_loss": -8.277725219726562, "global_step": 48424, "epoch": 288} {"train_loss": -8.222705841064453, "global_step": 48425, "epoch": 288} {"train_loss": -8.401298522949219, "global_step": 48426, "epoch": 288} {"train_loss": -8.380474090576172, "global_step": 48427, "epoch": 288} {"train_loss": -8.386423110961914, "global_step": 48428, "epoch": 288} {"train_loss": -8.298625946044922, "global_step": 48429, "epoch": 288} {"train_loss": -8.415584564208984, "global_step": 48430, "epoch": 288} {"train_loss": -8.390746116638184, "global_step": 48431, "epoch": 288} {"train_loss": -8.408738136291504, "global_step": 48432, "epoch": 288} {"train_loss": -8.343528747558594, "global_step": 48433, "epoch": 288} {"train_loss": -8.291221618652344, "global_step": 48434, "epoch": 288} {"train_loss": -8.483198165893555, "global_step": 48435, "epoch": 288} {"train_loss": -8.411514282226562, "global_step": 48436, "epoch": 288} {"train_loss": -8.450340270996094, "global_step": 48437, "epoch": 288} {"train_loss": -8.628541946411133, "global_step": 48438, "epoch": 288} {"train_loss": -8.24490737915039, "global_step": 48439, "epoch": 288} {"train_loss": -8.320818901062012, "global_step": 48440, "epoch": 288} {"train_loss": -8.46094799041748, "global_step": 48441, "epoch": 288} {"train_loss": -7.959268569946289, "global_step": 48442, "epoch": 288} {"train_loss": -8.287012100219727, "global_step": 48443, "epoch": 288} {"train_loss": -8.096867561340332, "global_step": 48444, "epoch": 288} {"train_loss": -7.6085405349731445, "global_step": 48445, "epoch": 288} {"train_loss": -7.904300689697266, "global_step": 48446, "epoch": 288} {"train_loss": -8.284988403320312, "global_step": 48447, "epoch": 288} {"train_loss": -7.810176849365234, "global_step": 48448, "epoch": 288} {"train_loss": -7.834539413452148, "global_step": 48449, "epoch": 288} {"train_loss": -8.09619426727295, "global_step": 48450, "epoch": 288} {"train_loss": -7.959607124328613, "global_step": 48451, "epoch": 288} {"train_loss": -8.107842445373535, "global_step": 48452, "epoch": 288} {"train_loss": -7.818337917327881, "global_step": 48453, "epoch": 288} {"train_loss": -8.13812255859375, "global_step": 48454, "epoch": 288} {"train_loss": -8.197786331176758, "global_step": 48455, "epoch": 288} {"train_loss": -7.830458641052246, "global_step": 48456, "epoch": 288} {"train_loss": -8.28316879272461, "global_step": 48457, "epoch": 288} {"train_loss": -8.324880599975586, "global_step": 48458, "epoch": 288} {"train_loss": -8.235184669494629, "global_step": 48459, "epoch": 288} {"train_loss": -8.32413387298584, "global_step": 48460, "epoch": 288} {"train_loss": -8.195233345031738, "global_step": 48461, "epoch": 288} {"train_loss": -8.263010025024414, "global_step": 48462, "epoch": 288} {"train_loss": -8.419973373413086, "global_step": 48463, "epoch": 288} {"train_loss": -8.10008430480957, "global_step": 48464, "epoch": 288} {"train_loss": -8.075571060180664, "global_step": 48465, "epoch": 288} {"train_loss": -8.076866149902344, "global_step": 48466, "epoch": 288} {"train_loss": -8.263802528381348, "global_step": 48467, "epoch": 288} {"train_loss": -8.034209251403809, "global_step": 48468, "epoch": 288} {"train_loss": -8.284445762634277, "global_step": 48469, "epoch": 288} {"train_loss": -8.16270637512207, "global_step": 48470, "epoch": 288} {"train_loss": -8.38664722442627, "global_step": 48471, "epoch": 288} {"train_loss": -8.005809783935547, "global_step": 48472, "epoch": 288} {"train_loss": -8.042549133300781, "global_step": 48473, "epoch": 288} {"train_loss": -8.085882186889648, "global_step": 48474, "epoch": 288} {"train_loss": -8.251922607421875, "global_step": 48475, "epoch": 288} {"train_loss": -8.266451835632324, "global_step": 48476, "epoch": 288} {"train_loss": -8.272224426269531, "global_step": 48477, "epoch": 288} {"train_loss": -8.113935470581055, "global_step": 48478, "epoch": 288} {"train_loss": -8.209464073181152, "global_step": 48479, "epoch": 288} {"train_loss": -8.27029037475586, "global_step": 48480, "epoch": 288} {"train_loss": -8.088379859924316, "global_step": 48481, "epoch": 288} {"train_loss": -8.429903030395508, "global_step": 48482, "epoch": 288} {"train_loss": -8.182510375976562, "global_step": 48483, "epoch": 288} {"train_loss": -8.084129333496094, "global_step": 48484, "epoch": 288} {"train_loss": -8.242514610290527, "global_step": 48485, "epoch": 288} {"train_loss": -8.557212829589844, "global_step": 48486, "epoch": 288} {"train_loss": -8.227678298950195, "global_step": 48487, "epoch": 288} {"train_loss": -8.306745529174805, "global_step": 48488, "epoch": 288} {"train_loss": -8.207783699035645, "global_step": 48489, "epoch": 288} {"train_loss": -8.379948616027832, "global_step": 48490, "epoch": 288} {"train_loss": -8.290857315063477, "global_step": 48491, "epoch": 288} {"train_loss": -8.553714752197266, "global_step": 48492, "epoch": 288} {"train_loss": -8.309061050415039, "global_step": 48493, "epoch": 288} {"train_loss": -8.425786972045898, "global_step": 48494, "epoch": 288} {"train_loss": -7.914121627807617, "global_step": 48495, "epoch": 288} {"train_loss": -8.383373260498047, "global_step": 48496, "epoch": 288} {"train_loss": -8.102560043334961, "global_step": 48497, "epoch": 288} {"train_loss": -8.045530319213867, "global_step": 48498, "epoch": 288} {"train_loss": -8.339656829833984, "global_step": 48499, "epoch": 288} {"train_loss": -8.06297492980957, "global_step": 48500, "epoch": 288} {"train_loss": -8.454742431640625, "global_step": 48501, "epoch": 288} {"train_loss": -8.05984878540039, "global_step": 48502, "epoch": 288} {"train_loss": -8.288430213928223, "global_step": 48503, "epoch": 288} {"train_loss": -8.239005088806152, "global_step": 48504, "epoch": 288} {"train_loss": -8.320785522460938, "global_step": 48505, "epoch": 288} {"train_loss": -8.049898147583008, "global_step": 48506, "epoch": 288} {"train_loss": -8.402170181274414, "global_step": 48507, "epoch": 288} {"train_loss": -8.084142684936523, "global_step": 48508, "epoch": 288} {"train_loss": -8.199186325073242, "global_step": 48509, "epoch": 288} {"train_loss": -8.369739532470703, "global_step": 48510, "epoch": 288} {"train_loss": -8.379070281982422, "global_step": 48511, "epoch": 288} {"train_loss": -8.137935638427734, "global_step": 48512, "epoch": 288} {"train_loss": -8.486642837524414, "global_step": 48513, "epoch": 288} {"train_loss": -8.290539741516113, "global_step": 48514, "epoch": 288} {"train_loss": -8.246444702148438, "global_step": 48515, "epoch": 288} {"train_loss": -8.29995346069336, "global_step": 48516, "epoch": 288} {"train_loss": -8.26912784576416, "global_step": 48517, "epoch": 288} {"train_loss": -8.433307647705078, "global_step": 48518, "epoch": 288} {"train_loss": -8.317928314208984, "global_step": 48519, "epoch": 288} {"train_loss": -8.315460205078125, "global_step": 48520, "epoch": 288} {"train_loss": -8.203712463378906, "global_step": 48521, "epoch": 288} {"train_loss": -8.299334526062012, "global_step": 48522, "epoch": 288} {"train_loss": -8.415380477905273, "global_step": 48523, "epoch": 288} {"train_loss": -8.395278930664062, "global_step": 48524, "epoch": 288} {"train_loss": -8.054595947265625, "global_step": 48525, "epoch": 288} {"train_loss": -8.350159645080566, "global_step": 48526, "epoch": 288} {"train_loss": -8.351637840270996, "global_step": 48527, "epoch": 288} {"train_loss": -8.419321060180664, "global_step": 48528, "epoch": 288} {"train_loss": -8.427706718444824, "global_step": 48529, "epoch": 288} {"train_loss": -8.162322998046875, "global_step": 48530, "epoch": 288} {"train_loss": -8.384029388427734, "global_step": 48531, "epoch": 288} {"train_loss": -8.294179916381836, "global_step": 48532, "epoch": 288} {"train_loss": -8.448638916015625, "global_step": 48533, "epoch": 288} {"train_loss": -8.29885196685791, "global_step": 48534, "epoch": 288} {"train_loss": -8.402700424194336, "global_step": 48535, "epoch": 288} {"train_loss": -8.352842330932617, "global_step": 48536, "epoch": 288} {"train_loss": -8.300470352172852, "global_step": 48537, "epoch": 288} {"train_loss": -8.20709228515625, "global_step": 48538, "epoch": 288} {"train_loss": -8.417150497436523, "global_step": 48539, "epoch": 288} {"train_loss": -8.25143051147461, "global_step": 48540, "epoch": 288} {"train_loss": -8.209318161010742, "global_step": 48541, "epoch": 288} {"train_loss": -8.328975677490234, "global_step": 48542, "epoch": 288} {"train_loss": -8.172853469848633, "global_step": 48543, "epoch": 288} {"train_loss": -8.134759902954102, "global_step": 48544, "epoch": 288} {"train_loss": -8.251011848449707, "global_step": 48545, "epoch": 288} {"train_loss": -8.050689697265625, "global_step": 48546, "epoch": 288} {"train_loss": -8.468559265136719, "global_step": 48547, "epoch": 288} {"train_loss": -8.058210372924805, "global_step": 48548, "epoch": 288} {"train_loss": -8.464215278625488, "global_step": 48549, "epoch": 288} {"train_loss": -8.313911437988281, "global_step": 48550, "epoch": 288} {"train_loss": -8.220631043116251, "global_step": 48551, "epoch": 288, "val_loss": 186058.875} {"train_loss": -8.063583374023438, "global_step": 48552, "epoch": 289} {"train_loss": -8.366752624511719, "global_step": 48553, "epoch": 289} {"train_loss": -7.970484256744385, "global_step": 48554, "epoch": 289} {"train_loss": -8.35519790649414, "global_step": 48555, "epoch": 289} {"train_loss": -7.9392828941345215, "global_step": 48556, "epoch": 289} {"train_loss": -8.33770751953125, "global_step": 48557, "epoch": 289} {"train_loss": -8.102095603942871, "global_step": 48558, "epoch": 289} {"train_loss": -8.079118728637695, "global_step": 48559, "epoch": 289} {"train_loss": -8.037663459777832, "global_step": 48560, "epoch": 289} {"train_loss": -8.36106014251709, "global_step": 48561, "epoch": 289} {"train_loss": -7.970944404602051, "global_step": 48562, "epoch": 289} {"train_loss": -8.162385940551758, "global_step": 48563, "epoch": 289} {"train_loss": -8.339884757995605, "global_step": 48564, "epoch": 289} {"train_loss": -8.162068367004395, "global_step": 48565, "epoch": 289} {"train_loss": -8.021583557128906, "global_step": 48566, "epoch": 289} {"train_loss": -8.398055076599121, "global_step": 48567, "epoch": 289} {"train_loss": -8.086984634399414, "global_step": 48568, "epoch": 289} {"train_loss": -7.851086139678955, "global_step": 48569, "epoch": 289} {"train_loss": -8.30394172668457, "global_step": 48570, "epoch": 289} {"train_loss": -8.218794822692871, "global_step": 48571, "epoch": 289} {"train_loss": -8.159034729003906, "global_step": 48572, "epoch": 289} {"train_loss": -8.181060791015625, "global_step": 48573, "epoch": 289} {"train_loss": -8.364424705505371, "global_step": 48574, "epoch": 289} {"train_loss": -8.138044357299805, "global_step": 48575, "epoch": 289} {"train_loss": -7.773444175720215, "global_step": 48576, "epoch": 289} {"train_loss": -8.210489273071289, "global_step": 48577, "epoch": 289} {"train_loss": -8.134737014770508, "global_step": 48578, "epoch": 289} {"train_loss": -8.173371315002441, "global_step": 48579, "epoch": 289} {"train_loss": -8.173772811889648, "global_step": 48580, "epoch": 289} {"train_loss": -8.162022590637207, "global_step": 48581, "epoch": 289} {"train_loss": -8.218233108520508, "global_step": 48582, "epoch": 289} {"train_loss": -8.01188850402832, "global_step": 48583, "epoch": 289} {"train_loss": -8.375377655029297, "global_step": 48584, "epoch": 289} {"train_loss": -8.404935836791992, "global_step": 48585, "epoch": 289} {"train_loss": -8.355598449707031, "global_step": 48586, "epoch": 289} {"train_loss": -8.35244369506836, "global_step": 48587, "epoch": 289} {"train_loss": -8.1428804397583, "global_step": 48588, "epoch": 289} {"train_loss": -8.25463581085205, "global_step": 48589, "epoch": 289} {"train_loss": -8.263970375061035, "global_step": 48590, "epoch": 289} {"train_loss": -8.367879867553711, "global_step": 48591, "epoch": 289} {"train_loss": -8.516580581665039, "global_step": 48592, "epoch": 289} {"train_loss": -8.372154235839844, "global_step": 48593, "epoch": 289} {"train_loss": -8.306028366088867, "global_step": 48594, "epoch": 289} {"train_loss": -8.341623306274414, "global_step": 48595, "epoch": 289} {"train_loss": -8.18226432800293, "global_step": 48596, "epoch": 289} {"train_loss": -8.292282104492188, "global_step": 48597, "epoch": 289} {"train_loss": -8.33307933807373, "global_step": 48598, "epoch": 289} {"train_loss": -8.478443145751953, "global_step": 48599, "epoch": 289} {"train_loss": -8.361339569091797, "global_step": 48600, "epoch": 289} {"train_loss": -8.24667739868164, "global_step": 48601, "epoch": 289} {"train_loss": -8.316377639770508, "global_step": 48602, "epoch": 289} {"train_loss": -8.123231887817383, "global_step": 48603, "epoch": 289} {"train_loss": -8.380960464477539, "global_step": 48604, "epoch": 289} {"train_loss": -8.321208953857422, "global_step": 48605, "epoch": 289} {"train_loss": -7.696088790893555, "global_step": 48606, "epoch": 289} {"train_loss": -8.22499942779541, "global_step": 48607, "epoch": 289} {"train_loss": -8.538981437683105, "global_step": 48608, "epoch": 289} {"train_loss": -8.410319328308105, "global_step": 48609, "epoch": 289} {"train_loss": -8.050065040588379, "global_step": 48610, "epoch": 289} {"train_loss": -8.212051391601562, "global_step": 48611, "epoch": 289} {"train_loss": -8.194421768188477, "global_step": 48612, "epoch": 289} {"train_loss": -8.123212814331055, "global_step": 48613, "epoch": 289} {"train_loss": -8.51728630065918, "global_step": 48614, "epoch": 289} {"train_loss": -7.808260440826416, "global_step": 48615, "epoch": 289} {"train_loss": -8.434319496154785, "global_step": 48616, "epoch": 289} {"train_loss": -8.161465644836426, "global_step": 48617, "epoch": 289} {"train_loss": -8.040945053100586, "global_step": 48618, "epoch": 289} {"train_loss": -8.209844589233398, "global_step": 48619, "epoch": 289} {"train_loss": -7.976826190948486, "global_step": 48620, "epoch": 289} {"train_loss": -8.11986255645752, "global_step": 48621, "epoch": 289} {"train_loss": -8.171113967895508, "global_step": 48622, "epoch": 289} {"train_loss": -8.185237884521484, "global_step": 48623, "epoch": 289} {"train_loss": -8.281960487365723, "global_step": 48624, "epoch": 289} {"train_loss": -8.238523483276367, "global_step": 48625, "epoch": 289} {"train_loss": -8.381206512451172, "global_step": 48626, "epoch": 289} {"train_loss": -8.099793434143066, "global_step": 48627, "epoch": 289} {"train_loss": -7.885064125061035, "global_step": 48628, "epoch": 289} {"train_loss": -8.112237930297852, "global_step": 48629, "epoch": 289} {"train_loss": -8.212787628173828, "global_step": 48630, "epoch": 289} {"train_loss": -8.09218692779541, "global_step": 48631, "epoch": 289} {"train_loss": -8.21776008605957, "global_step": 48632, "epoch": 289} {"train_loss": -8.155295372009277, "global_step": 48633, "epoch": 289} {"train_loss": -7.8949408531188965, "global_step": 48634, "epoch": 289} {"train_loss": -8.220829010009766, "global_step": 48635, "epoch": 289} {"train_loss": -7.9510321617126465, "global_step": 48636, "epoch": 289} {"train_loss": -8.19529914855957, "global_step": 48637, "epoch": 289} {"train_loss": -8.370211601257324, "global_step": 48638, "epoch": 289} {"train_loss": -8.082490921020508, "global_step": 48639, "epoch": 289} {"train_loss": -8.161040306091309, "global_step": 48640, "epoch": 289} {"train_loss": -8.03516674041748, "global_step": 48641, "epoch": 289} {"train_loss": -8.307172775268555, "global_step": 48642, "epoch": 289} {"train_loss": -8.04137897491455, "global_step": 48643, "epoch": 289} {"train_loss": -8.034093856811523, "global_step": 48644, "epoch": 289} {"train_loss": -8.156034469604492, "global_step": 48645, "epoch": 289} {"train_loss": -8.209798812866211, "global_step": 48646, "epoch": 289} {"train_loss": -8.160568237304688, "global_step": 48647, "epoch": 289} {"train_loss": -8.300785064697266, "global_step": 48648, "epoch": 289} {"train_loss": -8.14685344696045, "global_step": 48649, "epoch": 289} {"train_loss": -8.14275074005127, "global_step": 48650, "epoch": 289} {"train_loss": -8.181629180908203, "global_step": 48651, "epoch": 289} {"train_loss": -8.36838436126709, "global_step": 48652, "epoch": 289} {"train_loss": -8.461238861083984, "global_step": 48653, "epoch": 289} {"train_loss": -8.376500129699707, "global_step": 48654, "epoch": 289} {"train_loss": -8.347760200500488, "global_step": 48655, "epoch": 289} {"train_loss": -8.396417617797852, "global_step": 48656, "epoch": 289} {"train_loss": -8.506345748901367, "global_step": 48657, "epoch": 289} {"train_loss": -8.092586517333984, "global_step": 48658, "epoch": 289} {"train_loss": -8.292585372924805, "global_step": 48659, "epoch": 289} {"train_loss": -8.296573638916016, "global_step": 48660, "epoch": 289} {"train_loss": -8.505212783813477, "global_step": 48661, "epoch": 289} {"train_loss": -8.38379192352295, "global_step": 48662, "epoch": 289} {"train_loss": -8.28834056854248, "global_step": 48663, "epoch": 289} {"train_loss": -8.486101150512695, "global_step": 48664, "epoch": 289} {"train_loss": -8.271421432495117, "global_step": 48665, "epoch": 289} {"train_loss": -8.416901588439941, "global_step": 48666, "epoch": 289} {"train_loss": -8.433266639709473, "global_step": 48667, "epoch": 289} {"train_loss": -8.268911361694336, "global_step": 48668, "epoch": 289} {"train_loss": -8.409493446350098, "global_step": 48669, "epoch": 289} {"train_loss": -8.674501419067383, "global_step": 48670, "epoch": 289} {"train_loss": -8.343596458435059, "global_step": 48671, "epoch": 289} {"train_loss": -8.24785327911377, "global_step": 48672, "epoch": 289} {"train_loss": -8.597200393676758, "global_step": 48673, "epoch": 289} {"train_loss": -8.49651050567627, "global_step": 48674, "epoch": 289} {"train_loss": -8.636825561523438, "global_step": 48675, "epoch": 289} {"train_loss": -8.399099349975586, "global_step": 48676, "epoch": 289} {"train_loss": -8.27296257019043, "global_step": 48677, "epoch": 289} {"train_loss": -8.246997833251953, "global_step": 48678, "epoch": 289} {"train_loss": -8.347386360168457, "global_step": 48679, "epoch": 289} {"train_loss": -8.309907913208008, "global_step": 48680, "epoch": 289} {"train_loss": -7.763047218322754, "global_step": 48681, "epoch": 289} {"train_loss": -8.293343544006348, "global_step": 48682, "epoch": 289} {"train_loss": -8.081960678100586, "global_step": 48683, "epoch": 289} {"train_loss": -8.434432029724121, "global_step": 48684, "epoch": 289} {"train_loss": -8.330768585205078, "global_step": 48685, "epoch": 289} {"train_loss": -8.25886344909668, "global_step": 48686, "epoch": 289} {"train_loss": -8.425407409667969, "global_step": 48687, "epoch": 289} {"train_loss": -8.159997940063477, "global_step": 48688, "epoch": 289} {"train_loss": -8.256712913513184, "global_step": 48689, "epoch": 289} {"train_loss": -8.052068710327148, "global_step": 48690, "epoch": 289} {"train_loss": -8.487764358520508, "global_step": 48691, "epoch": 289} {"train_loss": -8.242513656616211, "global_step": 48692, "epoch": 289} {"train_loss": -8.321161270141602, "global_step": 48693, "epoch": 289} {"train_loss": -7.998400688171387, "global_step": 48694, "epoch": 289} {"train_loss": -8.30531120300293, "global_step": 48695, "epoch": 289} {"train_loss": -8.092058181762695, "global_step": 48696, "epoch": 289} {"train_loss": -8.27077865600586, "global_step": 48697, "epoch": 289} {"train_loss": -8.260772705078125, "global_step": 48698, "epoch": 289} {"train_loss": -8.30280876159668, "global_step": 48699, "epoch": 289} {"train_loss": -8.417539596557617, "global_step": 48700, "epoch": 289} {"train_loss": -8.259045600891113, "global_step": 48701, "epoch": 289} {"train_loss": -8.265115737915039, "global_step": 48702, "epoch": 289} {"train_loss": -8.450182914733887, "global_step": 48703, "epoch": 289} {"train_loss": -8.383312225341797, "global_step": 48704, "epoch": 289} {"train_loss": -8.373242378234863, "global_step": 48705, "epoch": 289} {"train_loss": -8.097823143005371, "global_step": 48706, "epoch": 289} {"train_loss": -8.41282844543457, "global_step": 48707, "epoch": 289} {"train_loss": -8.359673500061035, "global_step": 48708, "epoch": 289} {"train_loss": -8.47610092163086, "global_step": 48709, "epoch": 289} {"train_loss": -8.039651870727539, "global_step": 48710, "epoch": 289} {"train_loss": -8.256762504577637, "global_step": 48711, "epoch": 289} {"train_loss": -8.245291709899902, "global_step": 48712, "epoch": 289} {"train_loss": -8.425870895385742, "global_step": 48713, "epoch": 289} {"train_loss": -8.177225112915039, "global_step": 48714, "epoch": 289} {"train_loss": -8.498343467712402, "global_step": 48715, "epoch": 289} {"train_loss": -8.211455345153809, "global_step": 48716, "epoch": 289} {"train_loss": -8.402164459228516, "global_step": 48717, "epoch": 289} {"train_loss": -8.140478134155273, "global_step": 48718, "epoch": 289} {"train_loss": -8.243829196407681, "global_step": 48719, "epoch": 289, "val_loss": 189055.40625} {"train_loss": -8.191351890563965, "global_step": 48720, "epoch": 290} {"train_loss": -8.353161811828613, "global_step": 48721, "epoch": 290} {"train_loss": -8.34903335571289, "global_step": 48722, "epoch": 290} {"train_loss": -8.278772354125977, "global_step": 48723, "epoch": 290} {"train_loss": -8.474990844726562, "global_step": 48724, "epoch": 290} {"train_loss": -8.30421257019043, "global_step": 48725, "epoch": 290} {"train_loss": -8.111026763916016, "global_step": 48726, "epoch": 290} {"train_loss": -8.170919418334961, "global_step": 48727, "epoch": 290} {"train_loss": -8.414937973022461, "global_step": 48728, "epoch": 290} {"train_loss": -8.353864669799805, "global_step": 48729, "epoch": 290} {"train_loss": -8.344146728515625, "global_step": 48730, "epoch": 290} {"train_loss": -8.05606746673584, "global_step": 48731, "epoch": 290} {"train_loss": -8.373290061950684, "global_step": 48732, "epoch": 290} {"train_loss": -8.10301685333252, "global_step": 48733, "epoch": 290} {"train_loss": -8.321089744567871, "global_step": 48734, "epoch": 290} {"train_loss": -8.307710647583008, "global_step": 48735, "epoch": 290} {"train_loss": -8.283656120300293, "global_step": 48736, "epoch": 290} {"train_loss": -8.49160385131836, "global_step": 48737, "epoch": 290} {"train_loss": -8.355494499206543, "global_step": 48738, "epoch": 290} {"train_loss": -8.122784614562988, "global_step": 48739, "epoch": 290} {"train_loss": -8.082868576049805, "global_step": 48740, "epoch": 290} {"train_loss": -8.235502243041992, "global_step": 48741, "epoch": 290} {"train_loss": -8.227668762207031, "global_step": 48742, "epoch": 290} {"train_loss": -8.25866985321045, "global_step": 48743, "epoch": 290} {"train_loss": -8.024818420410156, "global_step": 48744, "epoch": 290} {"train_loss": -8.252155303955078, "global_step": 48745, "epoch": 290} {"train_loss": -8.192802429199219, "global_step": 48746, "epoch": 290} {"train_loss": -8.298053741455078, "global_step": 48747, "epoch": 290} {"train_loss": -8.300508499145508, "global_step": 48748, "epoch": 290} {"train_loss": -8.35750675201416, "global_step": 48749, "epoch": 290} {"train_loss": -8.122734069824219, "global_step": 48750, "epoch": 290} {"train_loss": -8.165450096130371, "global_step": 48751, "epoch": 290} {"train_loss": -8.349255561828613, "global_step": 48752, "epoch": 290} {"train_loss": -8.198860168457031, "global_step": 48753, "epoch": 290} {"train_loss": -8.426786422729492, "global_step": 48754, "epoch": 290} {"train_loss": -8.3012056350708, "global_step": 48755, "epoch": 290} {"train_loss": -8.425353050231934, "global_step": 48756, "epoch": 290} {"train_loss": -8.071460723876953, "global_step": 48757, "epoch": 290} {"train_loss": -8.290567398071289, "global_step": 48758, "epoch": 290} {"train_loss": -8.233095169067383, "global_step": 48759, "epoch": 290} {"train_loss": -8.318349838256836, "global_step": 48760, "epoch": 290} {"train_loss": -8.228937149047852, "global_step": 48761, "epoch": 290} {"train_loss": -8.28341293334961, "global_step": 48762, "epoch": 290} {"train_loss": -8.431497573852539, "global_step": 48763, "epoch": 290} {"train_loss": -8.339373588562012, "global_step": 48764, "epoch": 290} {"train_loss": -8.24445629119873, "global_step": 48765, "epoch": 290} {"train_loss": -8.378010749816895, "global_step": 48766, "epoch": 290} {"train_loss": -8.497465133666992, "global_step": 48767, "epoch": 290} {"train_loss": -8.461712837219238, "global_step": 48768, "epoch": 290} {"train_loss": -8.285292625427246, "global_step": 48769, "epoch": 290} {"train_loss": -8.379129409790039, "global_step": 48770, "epoch": 290} {"train_loss": -8.31869888305664, "global_step": 48771, "epoch": 290} {"train_loss": -8.241958618164062, "global_step": 48772, "epoch": 290} {"train_loss": -8.59591293334961, "global_step": 48773, "epoch": 290} {"train_loss": -8.34786605834961, "global_step": 48774, "epoch": 290} {"train_loss": -8.377067565917969, "global_step": 48775, "epoch": 290} {"train_loss": -8.0287446975708, "global_step": 48776, "epoch": 290} {"train_loss": -8.360115051269531, "global_step": 48777, "epoch": 290} {"train_loss": -8.102919578552246, "global_step": 48778, "epoch": 290} {"train_loss": -8.465763092041016, "global_step": 48779, "epoch": 290} {"train_loss": -8.191280364990234, "global_step": 48780, "epoch": 290} {"train_loss": -8.184873580932617, "global_step": 48781, "epoch": 290} {"train_loss": -8.112897872924805, "global_step": 48782, "epoch": 290} {"train_loss": -8.016189575195312, "global_step": 48783, "epoch": 290} {"train_loss": -8.518043518066406, "global_step": 48784, "epoch": 290} {"train_loss": -8.221792221069336, "global_step": 48785, "epoch": 290} {"train_loss": -8.344144821166992, "global_step": 48786, "epoch": 290} {"train_loss": -8.149866104125977, "global_step": 48787, "epoch": 290} {"train_loss": -8.275944709777832, "global_step": 48788, "epoch": 290} {"train_loss": -8.218944549560547, "global_step": 48789, "epoch": 290} {"train_loss": -8.300270080566406, "global_step": 48790, "epoch": 290} {"train_loss": -7.5871100425720215, "global_step": 48791, "epoch": 290} {"train_loss": -8.404637336730957, "global_step": 48792, "epoch": 290} {"train_loss": -8.111028671264648, "global_step": 48793, "epoch": 290} {"train_loss": -8.372836112976074, "global_step": 48794, "epoch": 290} {"train_loss": -8.145750045776367, "global_step": 48795, "epoch": 290} {"train_loss": -8.215855598449707, "global_step": 48796, "epoch": 290} {"train_loss": -8.174711227416992, "global_step": 48797, "epoch": 290} {"train_loss": -8.157148361206055, "global_step": 48798, "epoch": 290} {"train_loss": -8.24935245513916, "global_step": 48799, "epoch": 290} {"train_loss": -8.176346778869629, "global_step": 48800, "epoch": 290} {"train_loss": -8.408012390136719, "global_step": 48801, "epoch": 290} {"train_loss": -8.220529556274414, "global_step": 48802, "epoch": 290} {"train_loss": -8.491365432739258, "global_step": 48803, "epoch": 290} {"train_loss": -8.211606979370117, "global_step": 48804, "epoch": 290} {"train_loss": -8.290310859680176, "global_step": 48805, "epoch": 290} {"train_loss": -8.395682334899902, "global_step": 48806, "epoch": 290} {"train_loss": -8.313947677612305, "global_step": 48807, "epoch": 290} {"train_loss": -8.119194030761719, "global_step": 48808, "epoch": 290} {"train_loss": -8.300302505493164, "global_step": 48809, "epoch": 290} {"train_loss": -8.567235946655273, "global_step": 48810, "epoch": 290} {"train_loss": -8.349197387695312, "global_step": 48811, "epoch": 290} {"train_loss": -8.342328071594238, "global_step": 48812, "epoch": 290} {"train_loss": -8.458024978637695, "global_step": 48813, "epoch": 290} {"train_loss": -8.566312789916992, "global_step": 48814, "epoch": 290} {"train_loss": -8.613622665405273, "global_step": 48815, "epoch": 290} {"train_loss": -8.704277038574219, "global_step": 48816, "epoch": 290} {"train_loss": -8.344261169433594, "global_step": 48817, "epoch": 290} {"train_loss": -8.280746459960938, "global_step": 48818, "epoch": 290} {"train_loss": -8.373022079467773, "global_step": 48819, "epoch": 290} {"train_loss": -8.162403106689453, "global_step": 48820, "epoch": 290} {"train_loss": -8.389516830444336, "global_step": 48821, "epoch": 290} {"train_loss": -8.127626419067383, "global_step": 48822, "epoch": 290} {"train_loss": -8.314300537109375, "global_step": 48823, "epoch": 290} {"train_loss": -8.45865249633789, "global_step": 48824, "epoch": 290} {"train_loss": -8.174629211425781, "global_step": 48825, "epoch": 290} {"train_loss": -8.355527877807617, "global_step": 48826, "epoch": 290} {"train_loss": -8.314364433288574, "global_step": 48827, "epoch": 290} {"train_loss": -8.174023628234863, "global_step": 48828, "epoch": 290} {"train_loss": -8.288692474365234, "global_step": 48829, "epoch": 290} {"train_loss": -8.146413803100586, "global_step": 48830, "epoch": 290} {"train_loss": -8.072482109069824, "global_step": 48831, "epoch": 290} {"train_loss": -8.081438064575195, "global_step": 48832, "epoch": 290} {"train_loss": -8.368148803710938, "global_step": 48833, "epoch": 290} {"train_loss": -8.23135757446289, "global_step": 48834, "epoch": 290} {"train_loss": -8.05323600769043, "global_step": 48835, "epoch": 290} {"train_loss": -7.974116802215576, "global_step": 48836, "epoch": 290} {"train_loss": -7.711475849151611, "global_step": 48837, "epoch": 290} {"train_loss": -8.192129135131836, "global_step": 48838, "epoch": 290} {"train_loss": -7.788496017456055, "global_step": 48839, "epoch": 290} {"train_loss": -8.077001571655273, "global_step": 48840, "epoch": 290} {"train_loss": -8.005435943603516, "global_step": 48841, "epoch": 290} {"train_loss": -8.241619110107422, "global_step": 48842, "epoch": 290} {"train_loss": -8.11032485961914, "global_step": 48843, "epoch": 290} {"train_loss": -8.056723594665527, "global_step": 48844, "epoch": 290} {"train_loss": -8.300013542175293, "global_step": 48845, "epoch": 290} {"train_loss": -8.1233549118042, "global_step": 48846, "epoch": 290} {"train_loss": -8.273025512695312, "global_step": 48847, "epoch": 290} {"train_loss": -8.356393814086914, "global_step": 48848, "epoch": 290} {"train_loss": -8.194816589355469, "global_step": 48849, "epoch": 290} {"train_loss": -8.156944274902344, "global_step": 48850, "epoch": 290} {"train_loss": -8.135041236877441, "global_step": 48851, "epoch": 290} {"train_loss": -7.897561550140381, "global_step": 48852, "epoch": 290} {"train_loss": -8.163843154907227, "global_step": 48853, "epoch": 290} {"train_loss": -8.216846466064453, "global_step": 48854, "epoch": 290} {"train_loss": -8.087953567504883, "global_step": 48855, "epoch": 290} {"train_loss": -8.354080200195312, "global_step": 48856, "epoch": 290} {"train_loss": -8.144977569580078, "global_step": 48857, "epoch": 290} {"train_loss": -8.373748779296875, "global_step": 48858, "epoch": 290} {"train_loss": -8.426202774047852, "global_step": 48859, "epoch": 290} {"train_loss": -8.3238525390625, "global_step": 48860, "epoch": 290} {"train_loss": -8.360211372375488, "global_step": 48861, "epoch": 290} {"train_loss": -8.505754470825195, "global_step": 48862, "epoch": 290} {"train_loss": -8.292558670043945, "global_step": 48863, "epoch": 290} {"train_loss": -8.3783597946167, "global_step": 48864, "epoch": 290} {"train_loss": -8.215909957885742, "global_step": 48865, "epoch": 290} {"train_loss": -8.511768341064453, "global_step": 48866, "epoch": 290} {"train_loss": -8.449041366577148, "global_step": 48867, "epoch": 290} {"train_loss": -8.690396308898926, "global_step": 48868, "epoch": 290} {"train_loss": -8.317168235778809, "global_step": 48869, "epoch": 290} {"train_loss": -8.419076919555664, "global_step": 48870, "epoch": 290} {"train_loss": -8.251081466674805, "global_step": 48871, "epoch": 290} {"train_loss": -8.188283920288086, "global_step": 48872, "epoch": 290} {"train_loss": -8.459905624389648, "global_step": 48873, "epoch": 290} {"train_loss": -8.512002944946289, "global_step": 48874, "epoch": 290} {"train_loss": -8.199152946472168, "global_step": 48875, "epoch": 290} {"train_loss": -8.038166999816895, "global_step": 48876, "epoch": 290} {"train_loss": -8.395917892456055, "global_step": 48877, "epoch": 290} {"train_loss": -8.108039855957031, "global_step": 48878, "epoch": 290} {"train_loss": -8.2100830078125, "global_step": 48879, "epoch": 290} {"train_loss": -8.177738189697266, "global_step": 48880, "epoch": 290} {"train_loss": -8.285764694213867, "global_step": 48881, "epoch": 290} {"train_loss": -8.051164627075195, "global_step": 48882, "epoch": 290} {"train_loss": -7.700940132141113, "global_step": 48883, "epoch": 290} {"train_loss": -7.932174205780029, "global_step": 48884, "epoch": 290} {"train_loss": -7.55000638961792, "global_step": 48885, "epoch": 290} {"train_loss": -8.35920524597168, "global_step": 48886, "epoch": 290} {"train_loss": -8.252252766064235, "global_step": 48887, "epoch": 290, "val_loss": 187628.15625, "train_action_mse_error": 14.039340019226074} {"train_loss": -8.046682357788086, "global_step": 48888, "epoch": 291} {"train_loss": -7.944164276123047, "global_step": 48889, "epoch": 291} {"train_loss": -8.13851547241211, "global_step": 48890, "epoch": 291} {"train_loss": -8.056320190429688, "global_step": 48891, "epoch": 291} {"train_loss": -8.131447792053223, "global_step": 48892, "epoch": 291} {"train_loss": -8.099861145019531, "global_step": 48893, "epoch": 291} {"train_loss": -7.848278522491455, "global_step": 48894, "epoch": 291} {"train_loss": -8.161775588989258, "global_step": 48895, "epoch": 291} {"train_loss": -8.27652359008789, "global_step": 48896, "epoch": 291} {"train_loss": -8.048356056213379, "global_step": 48897, "epoch": 291} {"train_loss": -8.169508934020996, "global_step": 48898, "epoch": 291} {"train_loss": -8.025093078613281, "global_step": 48899, "epoch": 291} {"train_loss": -8.128310203552246, "global_step": 48900, "epoch": 291} {"train_loss": -8.361404418945312, "global_step": 48901, "epoch": 291} {"train_loss": -8.245397567749023, "global_step": 48902, "epoch": 291} {"train_loss": -8.471626281738281, "global_step": 48903, "epoch": 291} {"train_loss": -8.23614501953125, "global_step": 48904, "epoch": 291} {"train_loss": -8.269075393676758, "global_step": 48905, "epoch": 291} {"train_loss": -8.180953979492188, "global_step": 48906, "epoch": 291} {"train_loss": -8.059009552001953, "global_step": 48907, "epoch": 291} {"train_loss": -8.472746849060059, "global_step": 48908, "epoch": 291} {"train_loss": -8.324176788330078, "global_step": 48909, "epoch": 291} {"train_loss": -8.346189498901367, "global_step": 48910, "epoch": 291} {"train_loss": -8.09616470336914, "global_step": 48911, "epoch": 291} {"train_loss": -8.602731704711914, "global_step": 48912, "epoch": 291} {"train_loss": -8.316923141479492, "global_step": 48913, "epoch": 291} {"train_loss": -8.157737731933594, "global_step": 48914, "epoch": 291} {"train_loss": -8.404321670532227, "global_step": 48915, "epoch": 291} {"train_loss": -8.462991714477539, "global_step": 48916, "epoch": 291} {"train_loss": -8.18374252319336, "global_step": 48917, "epoch": 291} {"train_loss": -8.264812469482422, "global_step": 48918, "epoch": 291} {"train_loss": -8.244890213012695, "global_step": 48919, "epoch": 291} {"train_loss": -8.272825241088867, "global_step": 48920, "epoch": 291} {"train_loss": -8.346504211425781, "global_step": 48921, "epoch": 291} {"train_loss": -8.1956787109375, "global_step": 48922, "epoch": 291} {"train_loss": -8.195432662963867, "global_step": 48923, "epoch": 291} {"train_loss": -8.218822479248047, "global_step": 48924, "epoch": 291} {"train_loss": -8.274069786071777, "global_step": 48925, "epoch": 291} {"train_loss": -7.806825160980225, "global_step": 48926, "epoch": 291} {"train_loss": -8.214625358581543, "global_step": 48927, "epoch": 291} {"train_loss": -8.439468383789062, "global_step": 48928, "epoch": 291} {"train_loss": -8.016817092895508, "global_step": 48929, "epoch": 291} {"train_loss": -8.062423706054688, "global_step": 48930, "epoch": 291} {"train_loss": -8.313379287719727, "global_step": 48931, "epoch": 291} {"train_loss": -8.218801498413086, "global_step": 48932, "epoch": 291} {"train_loss": -8.251871109008789, "global_step": 48933, "epoch": 291} {"train_loss": -8.10746955871582, "global_step": 48934, "epoch": 291} {"train_loss": -8.086713790893555, "global_step": 48935, "epoch": 291} {"train_loss": -8.157705307006836, "global_step": 48936, "epoch": 291} {"train_loss": -8.055742263793945, "global_step": 48937, "epoch": 291} {"train_loss": -8.306953430175781, "global_step": 48938, "epoch": 291} {"train_loss": -8.29869270324707, "global_step": 48939, "epoch": 291} {"train_loss": -8.142578125, "global_step": 48940, "epoch": 291} {"train_loss": -8.088205337524414, "global_step": 48941, "epoch": 291} {"train_loss": -8.37564468383789, "global_step": 48942, "epoch": 291} {"train_loss": -8.399984359741211, "global_step": 48943, "epoch": 291} {"train_loss": -8.429688453674316, "global_step": 48944, "epoch": 291} {"train_loss": -8.133536338806152, "global_step": 48945, "epoch": 291} {"train_loss": -8.479351043701172, "global_step": 48946, "epoch": 291} {"train_loss": -8.0711669921875, "global_step": 48947, "epoch": 291} {"train_loss": -8.469818115234375, "global_step": 48948, "epoch": 291} {"train_loss": -8.449563980102539, "global_step": 48949, "epoch": 291} {"train_loss": -8.173120498657227, "global_step": 48950, "epoch": 291} {"train_loss": -8.468058586120605, "global_step": 48951, "epoch": 291} {"train_loss": -8.309804916381836, "global_step": 48952, "epoch": 291} {"train_loss": -8.255953788757324, "global_step": 48953, "epoch": 291} {"train_loss": -8.347354888916016, "global_step": 48954, "epoch": 291} {"train_loss": -8.353340148925781, "global_step": 48955, "epoch": 291} {"train_loss": -8.355375289916992, "global_step": 48956, "epoch": 291} {"train_loss": -8.443340301513672, "global_step": 48957, "epoch": 291} {"train_loss": -8.017455101013184, "global_step": 48958, "epoch": 291} {"train_loss": -8.307195663452148, "global_step": 48959, "epoch": 291} {"train_loss": -8.132563591003418, "global_step": 48960, "epoch": 291} {"train_loss": -8.445817947387695, "global_step": 48961, "epoch": 291} {"train_loss": -8.06117057800293, "global_step": 48962, "epoch": 291} {"train_loss": -8.256641387939453, "global_step": 48963, "epoch": 291} {"train_loss": -8.209992408752441, "global_step": 48964, "epoch": 291} {"train_loss": -8.281391143798828, "global_step": 48965, "epoch": 291} {"train_loss": -8.10142707824707, "global_step": 48966, "epoch": 291} {"train_loss": -8.256317138671875, "global_step": 48967, "epoch": 291} {"train_loss": -8.36666488647461, "global_step": 48968, "epoch": 291} {"train_loss": -8.208475112915039, "global_step": 48969, "epoch": 291} {"train_loss": -8.019685745239258, "global_step": 48970, "epoch": 291} {"train_loss": -8.434501647949219, "global_step": 48971, "epoch": 291} {"train_loss": -8.254358291625977, "global_step": 48972, "epoch": 291} {"train_loss": -8.304265022277832, "global_step": 48973, "epoch": 291} {"train_loss": -8.27957820892334, "global_step": 48974, "epoch": 291} {"train_loss": -8.027649879455566, "global_step": 48975, "epoch": 291} {"train_loss": -8.14299201965332, "global_step": 48976, "epoch": 291} {"train_loss": -7.941196918487549, "global_step": 48977, "epoch": 291} {"train_loss": -8.145151138305664, "global_step": 48978, "epoch": 291} {"train_loss": -8.238325119018555, "global_step": 48979, "epoch": 291} {"train_loss": -8.034369468688965, "global_step": 48980, "epoch": 291} {"train_loss": -8.034253120422363, "global_step": 48981, "epoch": 291} {"train_loss": -8.190690040588379, "global_step": 48982, "epoch": 291} {"train_loss": -8.175775527954102, "global_step": 48983, "epoch": 291} {"train_loss": -8.047940254211426, "global_step": 48984, "epoch": 291} {"train_loss": -8.095264434814453, "global_step": 48985, "epoch": 291} {"train_loss": -8.225606918334961, "global_step": 48986, "epoch": 291} {"train_loss": -8.120943069458008, "global_step": 48987, "epoch": 291} {"train_loss": -8.276802062988281, "global_step": 48988, "epoch": 291} {"train_loss": -8.088645935058594, "global_step": 48989, "epoch": 291} {"train_loss": -8.327988624572754, "global_step": 48990, "epoch": 291} {"train_loss": -8.183669090270996, "global_step": 48991, "epoch": 291} {"train_loss": -8.06840991973877, "global_step": 48992, "epoch": 291} {"train_loss": -8.173450469970703, "global_step": 48993, "epoch": 291} {"train_loss": -7.998453140258789, "global_step": 48994, "epoch": 291} {"train_loss": -8.14717960357666, "global_step": 48995, "epoch": 291} {"train_loss": -7.971269607543945, "global_step": 48996, "epoch": 291} {"train_loss": -8.397123336791992, "global_step": 48997, "epoch": 291} {"train_loss": -8.177332878112793, "global_step": 48998, "epoch": 291} {"train_loss": -8.410270690917969, "global_step": 48999, "epoch": 291} {"train_loss": -8.226197242736816, "global_step": 49000, "epoch": 291} {"train_loss": -8.36796760559082, "global_step": 49001, "epoch": 291} {"train_loss": -8.446493148803711, "global_step": 49002, "epoch": 291} {"train_loss": -8.099552154541016, "global_step": 49003, "epoch": 291} {"train_loss": -8.378486633300781, "global_step": 49004, "epoch": 291} {"train_loss": -8.394303321838379, "global_step": 49005, "epoch": 291} {"train_loss": -8.481035232543945, "global_step": 49006, "epoch": 291} {"train_loss": -8.44771957397461, "global_step": 49007, "epoch": 291} {"train_loss": -8.50361442565918, "global_step": 49008, "epoch": 291} {"train_loss": -8.43280029296875, "global_step": 49009, "epoch": 291} {"train_loss": -8.52943229675293, "global_step": 49010, "epoch": 291} {"train_loss": -8.567255020141602, "global_step": 49011, "epoch": 291} {"train_loss": -8.327787399291992, "global_step": 49012, "epoch": 291} {"train_loss": -8.038610458374023, "global_step": 49013, "epoch": 291} {"train_loss": -8.263704299926758, "global_step": 49014, "epoch": 291} {"train_loss": -8.155261039733887, "global_step": 49015, "epoch": 291} {"train_loss": -8.231775283813477, "global_step": 49016, "epoch": 291} {"train_loss": -7.84403133392334, "global_step": 49017, "epoch": 291} {"train_loss": -8.167617797851562, "global_step": 49018, "epoch": 291} {"train_loss": -8.21615219116211, "global_step": 49019, "epoch": 291} {"train_loss": -8.240856170654297, "global_step": 49020, "epoch": 291} {"train_loss": -8.076494216918945, "global_step": 49021, "epoch": 291} {"train_loss": -8.137884140014648, "global_step": 49022, "epoch": 291} {"train_loss": -8.240808486938477, "global_step": 49023, "epoch": 291} {"train_loss": -8.265050888061523, "global_step": 49024, "epoch": 291} {"train_loss": -8.13946533203125, "global_step": 49025, "epoch": 291} {"train_loss": -8.46093463897705, "global_step": 49026, "epoch": 291} {"train_loss": -8.426725387573242, "global_step": 49027, "epoch": 291} {"train_loss": -8.179580688476562, "global_step": 49028, "epoch": 291} {"train_loss": -8.221892356872559, "global_step": 49029, "epoch": 291} {"train_loss": -8.150186538696289, "global_step": 49030, "epoch": 291} {"train_loss": -8.295796394348145, "global_step": 49031, "epoch": 291} {"train_loss": -8.241495132446289, "global_step": 49032, "epoch": 291} {"train_loss": -8.408247947692871, "global_step": 49033, "epoch": 291} {"train_loss": -8.283329010009766, "global_step": 49034, "epoch": 291} {"train_loss": -8.308268547058105, "global_step": 49035, "epoch": 291} {"train_loss": -8.491467475891113, "global_step": 49036, "epoch": 291} {"train_loss": -8.39011287689209, "global_step": 49037, "epoch": 291} {"train_loss": -8.42261791229248, "global_step": 49038, "epoch": 291} {"train_loss": -8.053937911987305, "global_step": 49039, "epoch": 291} {"train_loss": -8.383045196533203, "global_step": 49040, "epoch": 291} {"train_loss": -8.226139068603516, "global_step": 49041, "epoch": 291} {"train_loss": -8.406002044677734, "global_step": 49042, "epoch": 291} {"train_loss": -8.312431335449219, "global_step": 49043, "epoch": 291} {"train_loss": -8.316816329956055, "global_step": 49044, "epoch": 291} {"train_loss": -8.405776023864746, "global_step": 49045, "epoch": 291} {"train_loss": -8.256977081298828, "global_step": 49046, "epoch": 291} {"train_loss": -8.341531753540039, "global_step": 49047, "epoch": 291} {"train_loss": -8.178256034851074, "global_step": 49048, "epoch": 291} {"train_loss": -8.237574577331543, "global_step": 49049, "epoch": 291} {"train_loss": -8.42210578918457, "global_step": 49050, "epoch": 291} {"train_loss": -8.317895889282227, "global_step": 49051, "epoch": 291} {"train_loss": -8.089645385742188, "global_step": 49052, "epoch": 291} {"train_loss": -8.417194366455078, "global_step": 49053, "epoch": 291} {"train_loss": -8.499860763549805, "global_step": 49054, "epoch": 291} {"train_loss": -8.241006195545197, "global_step": 49055, "epoch": 291, "val_loss": 186153.890625} {"train_loss": -8.503663063049316, "global_step": 49056, "epoch": 292} {"train_loss": -8.404696464538574, "global_step": 49057, "epoch": 292} {"train_loss": -8.263431549072266, "global_step": 49058, "epoch": 292} {"train_loss": -8.143270492553711, "global_step": 49059, "epoch": 292} {"train_loss": -8.366549491882324, "global_step": 49060, "epoch": 292} {"train_loss": -8.307302474975586, "global_step": 49061, "epoch": 292} {"train_loss": -8.383657455444336, "global_step": 49062, "epoch": 292} {"train_loss": -8.322212219238281, "global_step": 49063, "epoch": 292} {"train_loss": -8.38272476196289, "global_step": 49064, "epoch": 292} {"train_loss": -8.342155456542969, "global_step": 49065, "epoch": 292} {"train_loss": -8.406134605407715, "global_step": 49066, "epoch": 292} {"train_loss": -8.296814918518066, "global_step": 49067, "epoch": 292} {"train_loss": -8.446279525756836, "global_step": 49068, "epoch": 292} {"train_loss": -8.155426025390625, "global_step": 49069, "epoch": 292} {"train_loss": -8.349803924560547, "global_step": 49070, "epoch": 292} {"train_loss": -8.164993286132812, "global_step": 49071, "epoch": 292} {"train_loss": -8.192838668823242, "global_step": 49072, "epoch": 292} {"train_loss": -7.937592029571533, "global_step": 49073, "epoch": 292} {"train_loss": -8.263483047485352, "global_step": 49074, "epoch": 292} {"train_loss": -8.116445541381836, "global_step": 49075, "epoch": 292} {"train_loss": -8.03656005859375, "global_step": 49076, "epoch": 292} {"train_loss": -8.286550521850586, "global_step": 49077, "epoch": 292} {"train_loss": -8.32115364074707, "global_step": 49078, "epoch": 292} {"train_loss": -8.30534839630127, "global_step": 49079, "epoch": 292} {"train_loss": -8.361412048339844, "global_step": 49080, "epoch": 292} {"train_loss": -8.244845390319824, "global_step": 49081, "epoch": 292} {"train_loss": -8.39468765258789, "global_step": 49082, "epoch": 292} {"train_loss": -8.316658020019531, "global_step": 49083, "epoch": 292} {"train_loss": -8.32979965209961, "global_step": 49084, "epoch": 292} {"train_loss": -8.356380462646484, "global_step": 49085, "epoch": 292} {"train_loss": -8.190542221069336, "global_step": 49086, "epoch": 292} {"train_loss": -8.315138816833496, "global_step": 49087, "epoch": 292} {"train_loss": -8.414619445800781, "global_step": 49088, "epoch": 292} {"train_loss": -8.297858238220215, "global_step": 49089, "epoch": 292} {"train_loss": -8.295425415039062, "global_step": 49090, "epoch": 292} {"train_loss": -8.18834400177002, "global_step": 49091, "epoch": 292} {"train_loss": -8.335784912109375, "global_step": 49092, "epoch": 292} {"train_loss": -8.486827850341797, "global_step": 49093, "epoch": 292} {"train_loss": -8.323331832885742, "global_step": 49094, "epoch": 292} {"train_loss": -8.387014389038086, "global_step": 49095, "epoch": 292} {"train_loss": -8.386119842529297, "global_step": 49096, "epoch": 292} {"train_loss": -8.335844039916992, "global_step": 49097, "epoch": 292} {"train_loss": -8.254453659057617, "global_step": 49098, "epoch": 292} {"train_loss": -8.533660888671875, "global_step": 49099, "epoch": 292} {"train_loss": -8.174192428588867, "global_step": 49100, "epoch": 292} {"train_loss": -8.182616233825684, "global_step": 49101, "epoch": 292} {"train_loss": -8.32143783569336, "global_step": 49102, "epoch": 292} {"train_loss": -8.258987426757812, "global_step": 49103, "epoch": 292} {"train_loss": -8.180198669433594, "global_step": 49104, "epoch": 292} {"train_loss": -8.368551254272461, "global_step": 49105, "epoch": 292} {"train_loss": -8.45573616027832, "global_step": 49106, "epoch": 292} {"train_loss": -7.99645471572876, "global_step": 49107, "epoch": 292} {"train_loss": -8.241421699523926, "global_step": 49108, "epoch": 292} {"train_loss": -8.094680786132812, "global_step": 49109, "epoch": 292} {"train_loss": -8.048736572265625, "global_step": 49110, "epoch": 292} {"train_loss": -8.21197509765625, "global_step": 49111, "epoch": 292} {"train_loss": -8.239191055297852, "global_step": 49112, "epoch": 292} {"train_loss": -7.794770240783691, "global_step": 49113, "epoch": 292} {"train_loss": -8.239178657531738, "global_step": 49114, "epoch": 292} {"train_loss": -8.182571411132812, "global_step": 49115, "epoch": 292} {"train_loss": -8.309913635253906, "global_step": 49116, "epoch": 292} {"train_loss": -7.959256172180176, "global_step": 49117, "epoch": 292} {"train_loss": -8.210783004760742, "global_step": 49118, "epoch": 292} {"train_loss": -8.246379852294922, "global_step": 49119, "epoch": 292} {"train_loss": -7.9436540603637695, "global_step": 49120, "epoch": 292} {"train_loss": -8.093303680419922, "global_step": 49121, "epoch": 292} {"train_loss": -8.161964416503906, "global_step": 49122, "epoch": 292} {"train_loss": -8.195398330688477, "global_step": 49123, "epoch": 292} {"train_loss": -8.262825012207031, "global_step": 49124, "epoch": 292} {"train_loss": -8.249605178833008, "global_step": 49125, "epoch": 292} {"train_loss": -8.216608047485352, "global_step": 49126, "epoch": 292} {"train_loss": -8.403547286987305, "global_step": 49127, "epoch": 292} {"train_loss": -8.337247848510742, "global_step": 49128, "epoch": 292} {"train_loss": -8.357664108276367, "global_step": 49129, "epoch": 292} {"train_loss": -8.197587013244629, "global_step": 49130, "epoch": 292} {"train_loss": -8.253969192504883, "global_step": 49131, "epoch": 292} {"train_loss": -8.291568756103516, "global_step": 49132, "epoch": 292} {"train_loss": -8.334783554077148, "global_step": 49133, "epoch": 292} {"train_loss": -8.231246948242188, "global_step": 49134, "epoch": 292} {"train_loss": -8.41927719116211, "global_step": 49135, "epoch": 292} {"train_loss": -8.132492065429688, "global_step": 49136, "epoch": 292} {"train_loss": -8.338998794555664, "global_step": 49137, "epoch": 292} {"train_loss": -8.517510414123535, "global_step": 49138, "epoch": 292} {"train_loss": -8.395586013793945, "global_step": 49139, "epoch": 292} {"train_loss": -8.343974113464355, "global_step": 49140, "epoch": 292} {"train_loss": -8.373039245605469, "global_step": 49141, "epoch": 292} {"train_loss": -8.165621757507324, "global_step": 49142, "epoch": 292} {"train_loss": -7.985262870788574, "global_step": 49143, "epoch": 292} {"train_loss": -8.409494400024414, "global_step": 49144, "epoch": 292} {"train_loss": -8.148004531860352, "global_step": 49145, "epoch": 292} {"train_loss": -8.157978057861328, "global_step": 49146, "epoch": 292} {"train_loss": -8.251812934875488, "global_step": 49147, "epoch": 292} {"train_loss": -8.348734855651855, "global_step": 49148, "epoch": 292} {"train_loss": -7.9091339111328125, "global_step": 49149, "epoch": 292} {"train_loss": -8.479389190673828, "global_step": 49150, "epoch": 292} {"train_loss": -8.06161880493164, "global_step": 49151, "epoch": 292} {"train_loss": -8.122720718383789, "global_step": 49152, "epoch": 292} {"train_loss": -8.384432792663574, "global_step": 49153, "epoch": 292} {"train_loss": -8.4766845703125, "global_step": 49154, "epoch": 292} {"train_loss": -8.291414260864258, "global_step": 49155, "epoch": 292} {"train_loss": -8.484189987182617, "global_step": 49156, "epoch": 292} {"train_loss": -8.530372619628906, "global_step": 49157, "epoch": 292} {"train_loss": -8.339322090148926, "global_step": 49158, "epoch": 292} {"train_loss": -8.176556587219238, "global_step": 49159, "epoch": 292} {"train_loss": -8.496664047241211, "global_step": 49160, "epoch": 292} {"train_loss": -8.49081802368164, "global_step": 49161, "epoch": 292} {"train_loss": -8.370075225830078, "global_step": 49162, "epoch": 292} {"train_loss": -8.61413860321045, "global_step": 49163, "epoch": 292} {"train_loss": -8.208648681640625, "global_step": 49164, "epoch": 292} {"train_loss": -8.351156234741211, "global_step": 49165, "epoch": 292} {"train_loss": -8.359580039978027, "global_step": 49166, "epoch": 292} {"train_loss": -8.411867141723633, "global_step": 49167, "epoch": 292} {"train_loss": -8.600131034851074, "global_step": 49168, "epoch": 292} {"train_loss": -8.462736129760742, "global_step": 49169, "epoch": 292} {"train_loss": -8.278892517089844, "global_step": 49170, "epoch": 292} {"train_loss": -8.420633316040039, "global_step": 49171, "epoch": 292} {"train_loss": -8.377635955810547, "global_step": 49172, "epoch": 292} {"train_loss": -8.296842575073242, "global_step": 49173, "epoch": 292} {"train_loss": -8.309185028076172, "global_step": 49174, "epoch": 292} {"train_loss": -8.416715621948242, "global_step": 49175, "epoch": 292} {"train_loss": -8.44188117980957, "global_step": 49176, "epoch": 292} {"train_loss": -8.356206893920898, "global_step": 49177, "epoch": 292} {"train_loss": -8.418876647949219, "global_step": 49178, "epoch": 292} {"train_loss": -8.450966835021973, "global_step": 49179, "epoch": 292} {"train_loss": -8.457256317138672, "global_step": 49180, "epoch": 292} {"train_loss": -8.362348556518555, "global_step": 49181, "epoch": 292} {"train_loss": -8.32872486114502, "global_step": 49182, "epoch": 292} {"train_loss": -8.201138496398926, "global_step": 49183, "epoch": 292} {"train_loss": -8.32532787322998, "global_step": 49184, "epoch": 292} {"train_loss": -8.096308708190918, "global_step": 49185, "epoch": 292} {"train_loss": -8.381671905517578, "global_step": 49186, "epoch": 292} {"train_loss": -7.972587585449219, "global_step": 49187, "epoch": 292} {"train_loss": -8.131885528564453, "global_step": 49188, "epoch": 292} {"train_loss": -8.106094360351562, "global_step": 49189, "epoch": 292} {"train_loss": -8.127193450927734, "global_step": 49190, "epoch": 292} {"train_loss": -8.309713363647461, "global_step": 49191, "epoch": 292} {"train_loss": -8.370275497436523, "global_step": 49192, "epoch": 292} {"train_loss": -8.041454315185547, "global_step": 49193, "epoch": 292} {"train_loss": -8.069793701171875, "global_step": 49194, "epoch": 292} {"train_loss": -8.246774673461914, "global_step": 49195, "epoch": 292} {"train_loss": -8.211493492126465, "global_step": 49196, "epoch": 292} {"train_loss": -8.250005722045898, "global_step": 49197, "epoch": 292} {"train_loss": -8.196557998657227, "global_step": 49198, "epoch": 292} {"train_loss": -8.21681022644043, "global_step": 49199, "epoch": 292} {"train_loss": -7.8868727684021, "global_step": 49200, "epoch": 292} {"train_loss": -8.173881530761719, "global_step": 49201, "epoch": 292} {"train_loss": -8.342534065246582, "global_step": 49202, "epoch": 292} {"train_loss": -8.203149795532227, "global_step": 49203, "epoch": 292} {"train_loss": -8.062196731567383, "global_step": 49204, "epoch": 292} {"train_loss": -8.265034675598145, "global_step": 49205, "epoch": 292} {"train_loss": -8.213577270507812, "global_step": 49206, "epoch": 292} {"train_loss": -8.024752616882324, "global_step": 49207, "epoch": 292} {"train_loss": -8.431365013122559, "global_step": 49208, "epoch": 292} {"train_loss": -7.957881927490234, "global_step": 49209, "epoch": 292} {"train_loss": -8.364810943603516, "global_step": 49210, "epoch": 292} {"train_loss": -8.177221298217773, "global_step": 49211, "epoch": 292} {"train_loss": -8.454623222351074, "global_step": 49212, "epoch": 292} {"train_loss": -8.087603569030762, "global_step": 49213, "epoch": 292} {"train_loss": -8.307685852050781, "global_step": 49214, "epoch": 292} {"train_loss": -8.229085922241211, "global_step": 49215, "epoch": 292} {"train_loss": -8.284645080566406, "global_step": 49216, "epoch": 292} {"train_loss": -7.966391563415527, "global_step": 49217, "epoch": 292} {"train_loss": -8.2435302734375, "global_step": 49218, "epoch": 292} {"train_loss": -8.309738159179688, "global_step": 49219, "epoch": 292} {"train_loss": -8.085375785827637, "global_step": 49220, "epoch": 292} {"train_loss": -8.583002090454102, "global_step": 49221, "epoch": 292} {"train_loss": -8.12771224975586, "global_step": 49222, "epoch": 292} {"train_loss": -8.272816961719876, "global_step": 49223, "epoch": 292, "val_loss": 188105.78125} {"train_loss": -8.071244239807129, "global_step": 49224, "epoch": 293} {"train_loss": -8.277551651000977, "global_step": 49225, "epoch": 293} {"train_loss": -7.947336673736572, "global_step": 49226, "epoch": 293} {"train_loss": -8.252696990966797, "global_step": 49227, "epoch": 293} {"train_loss": -8.400703430175781, "global_step": 49228, "epoch": 293} {"train_loss": -8.305729866027832, "global_step": 49229, "epoch": 293} {"train_loss": -8.20192813873291, "global_step": 49230, "epoch": 293} {"train_loss": -8.099759101867676, "global_step": 49231, "epoch": 293} {"train_loss": -8.228082656860352, "global_step": 49232, "epoch": 293} {"train_loss": -8.030241012573242, "global_step": 49233, "epoch": 293} {"train_loss": -8.269679069519043, "global_step": 49234, "epoch": 293} {"train_loss": -8.168126106262207, "global_step": 49235, "epoch": 293} {"train_loss": -8.385188102722168, "global_step": 49236, "epoch": 293} {"train_loss": -8.158814430236816, "global_step": 49237, "epoch": 293} {"train_loss": -8.168962478637695, "global_step": 49238, "epoch": 293} {"train_loss": -8.246782302856445, "global_step": 49239, "epoch": 293} {"train_loss": -8.332862854003906, "global_step": 49240, "epoch": 293} {"train_loss": -7.901562690734863, "global_step": 49241, "epoch": 293} {"train_loss": -8.110132217407227, "global_step": 49242, "epoch": 293} {"train_loss": -8.326629638671875, "global_step": 49243, "epoch": 293} {"train_loss": -7.908205986022949, "global_step": 49244, "epoch": 293} {"train_loss": -7.92136287689209, "global_step": 49245, "epoch": 293} {"train_loss": -8.090412139892578, "global_step": 49246, "epoch": 293} {"train_loss": -8.40003490447998, "global_step": 49247, "epoch": 293} {"train_loss": -8.244720458984375, "global_step": 49248, "epoch": 293} {"train_loss": -8.353547096252441, "global_step": 49249, "epoch": 293} {"train_loss": -8.097942352294922, "global_step": 49250, "epoch": 293} {"train_loss": -8.419357299804688, "global_step": 49251, "epoch": 293} {"train_loss": -8.443300247192383, "global_step": 49252, "epoch": 293} {"train_loss": -8.197299003601074, "global_step": 49253, "epoch": 293} {"train_loss": -8.34018325805664, "global_step": 49254, "epoch": 293} {"train_loss": -8.344354629516602, "global_step": 49255, "epoch": 293} {"train_loss": -8.383369445800781, "global_step": 49256, "epoch": 293} {"train_loss": -8.260369300842285, "global_step": 49257, "epoch": 293} {"train_loss": -8.2994966506958, "global_step": 49258, "epoch": 293} {"train_loss": -8.481063842773438, "global_step": 49259, "epoch": 293} {"train_loss": -8.232114791870117, "global_step": 49260, "epoch": 293} {"train_loss": -8.396058082580566, "global_step": 49261, "epoch": 293} {"train_loss": -8.067052841186523, "global_step": 49262, "epoch": 293} {"train_loss": -8.379024505615234, "global_step": 49263, "epoch": 293} {"train_loss": -8.217568397521973, "global_step": 49264, "epoch": 293} {"train_loss": -8.209945678710938, "global_step": 49265, "epoch": 293} {"train_loss": -8.062530517578125, "global_step": 49266, "epoch": 293} {"train_loss": -8.265729904174805, "global_step": 49267, "epoch": 293} {"train_loss": -7.947288513183594, "global_step": 49268, "epoch": 293} {"train_loss": -8.268671035766602, "global_step": 49269, "epoch": 293} {"train_loss": -8.24412727355957, "global_step": 49270, "epoch": 293} {"train_loss": -8.333372116088867, "global_step": 49271, "epoch": 293} {"train_loss": -8.169539451599121, "global_step": 49272, "epoch": 293} {"train_loss": -8.209273338317871, "global_step": 49273, "epoch": 293} {"train_loss": -8.092599868774414, "global_step": 49274, "epoch": 293} {"train_loss": -8.369397163391113, "global_step": 49275, "epoch": 293} {"train_loss": -8.280667304992676, "global_step": 49276, "epoch": 293} {"train_loss": -8.502264976501465, "global_step": 49277, "epoch": 293} {"train_loss": -8.28554916381836, "global_step": 49278, "epoch": 293} {"train_loss": -8.415050506591797, "global_step": 49279, "epoch": 293} {"train_loss": -8.329916954040527, "global_step": 49280, "epoch": 293} {"train_loss": -8.402274131774902, "global_step": 49281, "epoch": 293} {"train_loss": -8.366485595703125, "global_step": 49282, "epoch": 293} {"train_loss": -8.47204875946045, "global_step": 49283, "epoch": 293} {"train_loss": -8.3817720413208, "global_step": 49284, "epoch": 293} {"train_loss": -8.479650497436523, "global_step": 49285, "epoch": 293} {"train_loss": -8.213141441345215, "global_step": 49286, "epoch": 293} {"train_loss": -8.459664344787598, "global_step": 49287, "epoch": 293} {"train_loss": -8.375770568847656, "global_step": 49288, "epoch": 293} {"train_loss": -8.554508209228516, "global_step": 49289, "epoch": 293} {"train_loss": -8.420548439025879, "global_step": 49290, "epoch": 293} {"train_loss": -8.463000297546387, "global_step": 49291, "epoch": 293} {"train_loss": -8.406646728515625, "global_step": 49292, "epoch": 293} {"train_loss": -8.441020965576172, "global_step": 49293, "epoch": 293} {"train_loss": -8.40376091003418, "global_step": 49294, "epoch": 293} {"train_loss": -8.339414596557617, "global_step": 49295, "epoch": 293} {"train_loss": -8.723014831542969, "global_step": 49296, "epoch": 293} {"train_loss": -8.427947998046875, "global_step": 49297, "epoch": 293} {"train_loss": -8.427776336669922, "global_step": 49298, "epoch": 293} {"train_loss": -8.248973846435547, "global_step": 49299, "epoch": 293} {"train_loss": -8.546119689941406, "global_step": 49300, "epoch": 293} {"train_loss": -8.330741882324219, "global_step": 49301, "epoch": 293} {"train_loss": -8.534499168395996, "global_step": 49302, "epoch": 293} {"train_loss": -8.566070556640625, "global_step": 49303, "epoch": 293} {"train_loss": -8.5770902633667, "global_step": 49304, "epoch": 293} {"train_loss": -8.5979585647583, "global_step": 49305, "epoch": 293} {"train_loss": -8.628759384155273, "global_step": 49306, "epoch": 293} {"train_loss": -8.480949401855469, "global_step": 49307, "epoch": 293} {"train_loss": -8.328689575195312, "global_step": 49308, "epoch": 293} {"train_loss": -8.404165267944336, "global_step": 49309, "epoch": 293} {"train_loss": -8.3865385055542, "global_step": 49310, "epoch": 293} {"train_loss": -8.322126388549805, "global_step": 49311, "epoch": 293} {"train_loss": -8.284225463867188, "global_step": 49312, "epoch": 293} {"train_loss": -8.52536392211914, "global_step": 49313, "epoch": 293} {"train_loss": -8.538583755493164, "global_step": 49314, "epoch": 293} {"train_loss": -8.236004829406738, "global_step": 49315, "epoch": 293} {"train_loss": -8.62044906616211, "global_step": 49316, "epoch": 293} {"train_loss": -8.180110931396484, "global_step": 49317, "epoch": 293} {"train_loss": -8.518364906311035, "global_step": 49318, "epoch": 293} {"train_loss": -8.377880096435547, "global_step": 49319, "epoch": 293} {"train_loss": -8.298604011535645, "global_step": 49320, "epoch": 293} {"train_loss": -8.298078536987305, "global_step": 49321, "epoch": 293} {"train_loss": -8.260377883911133, "global_step": 49322, "epoch": 293} {"train_loss": -8.136649131774902, "global_step": 49323, "epoch": 293} {"train_loss": -8.259934425354004, "global_step": 49324, "epoch": 293} {"train_loss": -8.25777816772461, "global_step": 49325, "epoch": 293} {"train_loss": -8.009781837463379, "global_step": 49326, "epoch": 293} {"train_loss": -8.247227668762207, "global_step": 49327, "epoch": 293} {"train_loss": -8.038509368896484, "global_step": 49328, "epoch": 293} {"train_loss": -8.405414581298828, "global_step": 49329, "epoch": 293} {"train_loss": -8.144020080566406, "global_step": 49330, "epoch": 293} {"train_loss": -8.375511169433594, "global_step": 49331, "epoch": 293} {"train_loss": -8.19321060180664, "global_step": 49332, "epoch": 293} {"train_loss": -8.2449312210083, "global_step": 49333, "epoch": 293} {"train_loss": -7.823727130889893, "global_step": 49334, "epoch": 293} {"train_loss": -8.200430870056152, "global_step": 49335, "epoch": 293} {"train_loss": -8.232324600219727, "global_step": 49336, "epoch": 293} {"train_loss": -8.350342750549316, "global_step": 49337, "epoch": 293} {"train_loss": -8.30664348602295, "global_step": 49338, "epoch": 293} {"train_loss": -8.269662857055664, "global_step": 49339, "epoch": 293} {"train_loss": -7.928347110748291, "global_step": 49340, "epoch": 293} {"train_loss": -8.036840438842773, "global_step": 49341, "epoch": 293} {"train_loss": -8.216987609863281, "global_step": 49342, "epoch": 293} {"train_loss": -8.316442489624023, "global_step": 49343, "epoch": 293} {"train_loss": -8.238977432250977, "global_step": 49344, "epoch": 293} {"train_loss": -8.31096076965332, "global_step": 49345, "epoch": 293} {"train_loss": -8.309700012207031, "global_step": 49346, "epoch": 293} {"train_loss": -8.414194107055664, "global_step": 49347, "epoch": 293} {"train_loss": -8.021041870117188, "global_step": 49348, "epoch": 293} {"train_loss": -8.244665145874023, "global_step": 49349, "epoch": 293} {"train_loss": -8.158720970153809, "global_step": 49350, "epoch": 293} {"train_loss": -8.235638618469238, "global_step": 49351, "epoch": 293} {"train_loss": -8.369649887084961, "global_step": 49352, "epoch": 293} {"train_loss": -8.359743118286133, "global_step": 49353, "epoch": 293} {"train_loss": -8.400375366210938, "global_step": 49354, "epoch": 293} {"train_loss": -8.33656120300293, "global_step": 49355, "epoch": 293} {"train_loss": -8.09971809387207, "global_step": 49356, "epoch": 293} {"train_loss": -8.251310348510742, "global_step": 49357, "epoch": 293} {"train_loss": -8.216794967651367, "global_step": 49358, "epoch": 293} {"train_loss": -8.611390113830566, "global_step": 49359, "epoch": 293} {"train_loss": -8.260737419128418, "global_step": 49360, "epoch": 293} {"train_loss": -8.399176597595215, "global_step": 49361, "epoch": 293} {"train_loss": -8.316832542419434, "global_step": 49362, "epoch": 293} {"train_loss": -8.356142044067383, "global_step": 49363, "epoch": 293} {"train_loss": -8.233835220336914, "global_step": 49364, "epoch": 293} {"train_loss": -8.201526641845703, "global_step": 49365, "epoch": 293} {"train_loss": -8.204353332519531, "global_step": 49366, "epoch": 293} {"train_loss": -8.145204544067383, "global_step": 49367, "epoch": 293} {"train_loss": -8.05960750579834, "global_step": 49368, "epoch": 293} {"train_loss": -8.087367057800293, "global_step": 49369, "epoch": 293} {"train_loss": -8.203017234802246, "global_step": 49370, "epoch": 293} {"train_loss": -8.095769882202148, "global_step": 49371, "epoch": 293} {"train_loss": -7.918522357940674, "global_step": 49372, "epoch": 293} {"train_loss": -7.965122699737549, "global_step": 49373, "epoch": 293} {"train_loss": -8.264884948730469, "global_step": 49374, "epoch": 293} {"train_loss": -7.94395637512207, "global_step": 49375, "epoch": 293} {"train_loss": -8.139286994934082, "global_step": 49376, "epoch": 293} {"train_loss": -8.14481258392334, "global_step": 49377, "epoch": 293} {"train_loss": -8.20646858215332, "global_step": 49378, "epoch": 293} {"train_loss": -8.152402877807617, "global_step": 49379, "epoch": 293} {"train_loss": -8.177144050598145, "global_step": 49380, "epoch": 293} {"train_loss": -8.233039855957031, "global_step": 49381, "epoch": 293} {"train_loss": -8.349607467651367, "global_step": 49382, "epoch": 293} {"train_loss": -8.388782501220703, "global_step": 49383, "epoch": 293} {"train_loss": -8.363115310668945, "global_step": 49384, "epoch": 293} {"train_loss": -8.137259483337402, "global_step": 49385, "epoch": 293} {"train_loss": -8.30014705657959, "global_step": 49386, "epoch": 293} {"train_loss": -8.249899864196777, "global_step": 49387, "epoch": 293} {"train_loss": -8.285928726196289, "global_step": 49388, "epoch": 293} {"train_loss": -8.283509254455566, "global_step": 49389, "epoch": 293} {"train_loss": -8.408010482788086, "global_step": 49390, "epoch": 293} {"train_loss": -8.277258047035762, "global_step": 49391, "epoch": 293, "val_loss": 186984.796875} {"train_loss": -8.243654251098633, "global_step": 49392, "epoch": 294} {"train_loss": -8.551209449768066, "global_step": 49393, "epoch": 294} {"train_loss": -8.353328704833984, "global_step": 49394, "epoch": 294} {"train_loss": -8.298053741455078, "global_step": 49395, "epoch": 294} {"train_loss": -8.323858261108398, "global_step": 49396, "epoch": 294} {"train_loss": -8.114089012145996, "global_step": 49397, "epoch": 294} {"train_loss": -8.358909606933594, "global_step": 49398, "epoch": 294} {"train_loss": -8.367981910705566, "global_step": 49399, "epoch": 294} {"train_loss": -8.403329849243164, "global_step": 49400, "epoch": 294} {"train_loss": -8.515568733215332, "global_step": 49401, "epoch": 294} {"train_loss": -8.441097259521484, "global_step": 49402, "epoch": 294} {"train_loss": -8.582124710083008, "global_step": 49403, "epoch": 294} {"train_loss": -8.550577163696289, "global_step": 49404, "epoch": 294} {"train_loss": -8.453113555908203, "global_step": 49405, "epoch": 294} {"train_loss": -8.525043487548828, "global_step": 49406, "epoch": 294} {"train_loss": -8.578577041625977, "global_step": 49407, "epoch": 294} {"train_loss": -8.429529190063477, "global_step": 49408, "epoch": 294} {"train_loss": -8.465287208557129, "global_step": 49409, "epoch": 294} {"train_loss": -8.608503341674805, "global_step": 49410, "epoch": 294} {"train_loss": -8.289615631103516, "global_step": 49411, "epoch": 294} {"train_loss": -8.508516311645508, "global_step": 49412, "epoch": 294} {"train_loss": -8.553627967834473, "global_step": 49413, "epoch": 294} {"train_loss": -8.33399772644043, "global_step": 49414, "epoch": 294} {"train_loss": -8.532360076904297, "global_step": 49415, "epoch": 294} {"train_loss": -8.274118423461914, "global_step": 49416, "epoch": 294} {"train_loss": -8.427722930908203, "global_step": 49417, "epoch": 294} {"train_loss": -8.420360565185547, "global_step": 49418, "epoch": 294} {"train_loss": -8.482803344726562, "global_step": 49419, "epoch": 294} {"train_loss": -8.481937408447266, "global_step": 49420, "epoch": 294} {"train_loss": -8.176109313964844, "global_step": 49421, "epoch": 294} {"train_loss": -8.325286865234375, "global_step": 49422, "epoch": 294} {"train_loss": -8.355379104614258, "global_step": 49423, "epoch": 294} {"train_loss": -8.288345336914062, "global_step": 49424, "epoch": 294} {"train_loss": -8.237814903259277, "global_step": 49425, "epoch": 294} {"train_loss": -8.33188533782959, "global_step": 49426, "epoch": 294} {"train_loss": -8.086530685424805, "global_step": 49427, "epoch": 294} {"train_loss": -8.264119148254395, "global_step": 49428, "epoch": 294} {"train_loss": -8.353073120117188, "global_step": 49429, "epoch": 294} {"train_loss": -7.974368572235107, "global_step": 49430, "epoch": 294} {"train_loss": -8.3336181640625, "global_step": 49431, "epoch": 294} {"train_loss": -8.040434837341309, "global_step": 49432, "epoch": 294} {"train_loss": -7.938360214233398, "global_step": 49433, "epoch": 294} {"train_loss": -8.24225902557373, "global_step": 49434, "epoch": 294} {"train_loss": -8.199198722839355, "global_step": 49435, "epoch": 294} {"train_loss": -8.317413330078125, "global_step": 49436, "epoch": 294} {"train_loss": -8.09961223602295, "global_step": 49437, "epoch": 294} {"train_loss": -8.15671157836914, "global_step": 49438, "epoch": 294} {"train_loss": -8.221295356750488, "global_step": 49439, "epoch": 294} {"train_loss": -8.532559394836426, "global_step": 49440, "epoch": 294} {"train_loss": -8.248468399047852, "global_step": 49441, "epoch": 294} {"train_loss": -8.145316123962402, "global_step": 49442, "epoch": 294} {"train_loss": -8.27922248840332, "global_step": 49443, "epoch": 294} {"train_loss": -8.241060256958008, "global_step": 49444, "epoch": 294} {"train_loss": -8.278697967529297, "global_step": 49445, "epoch": 294} {"train_loss": -8.341035842895508, "global_step": 49446, "epoch": 294} {"train_loss": -8.295211791992188, "global_step": 49447, "epoch": 294} {"train_loss": -8.08403205871582, "global_step": 49448, "epoch": 294} {"train_loss": -8.286346435546875, "global_step": 49449, "epoch": 294} {"train_loss": -8.015157699584961, "global_step": 49450, "epoch": 294} {"train_loss": -8.108762741088867, "global_step": 49451, "epoch": 294} {"train_loss": -8.30720329284668, "global_step": 49452, "epoch": 294} {"train_loss": -8.155660629272461, "global_step": 49453, "epoch": 294} {"train_loss": -8.160234451293945, "global_step": 49454, "epoch": 294} {"train_loss": -8.427997589111328, "global_step": 49455, "epoch": 294} {"train_loss": -7.858661651611328, "global_step": 49456, "epoch": 294} {"train_loss": -8.16827392578125, "global_step": 49457, "epoch": 294} {"train_loss": -7.831672668457031, "global_step": 49458, "epoch": 294} {"train_loss": -8.187345504760742, "global_step": 49459, "epoch": 294} {"train_loss": -8.185997009277344, "global_step": 49460, "epoch": 294} {"train_loss": -8.334236145019531, "global_step": 49461, "epoch": 294} {"train_loss": -8.252602577209473, "global_step": 49462, "epoch": 294} {"train_loss": -8.322477340698242, "global_step": 49463, "epoch": 294} {"train_loss": -8.042499542236328, "global_step": 49464, "epoch": 294} {"train_loss": -8.292369842529297, "global_step": 49465, "epoch": 294} {"train_loss": -8.408843994140625, "global_step": 49466, "epoch": 294} {"train_loss": -8.365306854248047, "global_step": 49467, "epoch": 294} {"train_loss": -8.232385635375977, "global_step": 49468, "epoch": 294} {"train_loss": -8.40222454071045, "global_step": 49469, "epoch": 294} {"train_loss": -8.421934127807617, "global_step": 49470, "epoch": 294} {"train_loss": -8.587575912475586, "global_step": 49471, "epoch": 294} {"train_loss": -8.318289756774902, "global_step": 49472, "epoch": 294} {"train_loss": -8.422891616821289, "global_step": 49473, "epoch": 294} {"train_loss": -7.8932013511657715, "global_step": 49474, "epoch": 294} {"train_loss": -8.264256477355957, "global_step": 49475, "epoch": 294} {"train_loss": -8.197033882141113, "global_step": 49476, "epoch": 294} {"train_loss": -7.7786149978637695, "global_step": 49477, "epoch": 294} {"train_loss": -8.086828231811523, "global_step": 49478, "epoch": 294} {"train_loss": -7.85070276260376, "global_step": 49479, "epoch": 294} {"train_loss": -8.057394027709961, "global_step": 49480, "epoch": 294} {"train_loss": -8.05704116821289, "global_step": 49481, "epoch": 294} {"train_loss": -7.912306785583496, "global_step": 49482, "epoch": 294} {"train_loss": -7.8276567459106445, "global_step": 49483, "epoch": 294} {"train_loss": -8.134359359741211, "global_step": 49484, "epoch": 294} {"train_loss": -7.908886909484863, "global_step": 49485, "epoch": 294} {"train_loss": -7.855959892272949, "global_step": 49486, "epoch": 294} {"train_loss": -8.211798667907715, "global_step": 49487, "epoch": 294} {"train_loss": -8.241094589233398, "global_step": 49488, "epoch": 294} {"train_loss": -8.135473251342773, "global_step": 49489, "epoch": 294} {"train_loss": -8.293478012084961, "global_step": 49490, "epoch": 294} {"train_loss": -8.237127304077148, "global_step": 49491, "epoch": 294} {"train_loss": -8.268915176391602, "global_step": 49492, "epoch": 294} {"train_loss": -8.351479530334473, "global_step": 49493, "epoch": 294} {"train_loss": -7.914185047149658, "global_step": 49494, "epoch": 294} {"train_loss": -8.197525024414062, "global_step": 49495, "epoch": 294} {"train_loss": -8.36752700805664, "global_step": 49496, "epoch": 294} {"train_loss": -7.874202728271484, "global_step": 49497, "epoch": 294} {"train_loss": -8.15469741821289, "global_step": 49498, "epoch": 294} {"train_loss": -8.44331169128418, "global_step": 49499, "epoch": 294} {"train_loss": -8.180704116821289, "global_step": 49500, "epoch": 294} {"train_loss": -8.05514907836914, "global_step": 49501, "epoch": 294} {"train_loss": -8.33050537109375, "global_step": 49502, "epoch": 294} {"train_loss": -8.065849304199219, "global_step": 49503, "epoch": 294} {"train_loss": -8.159690856933594, "global_step": 49504, "epoch": 294} {"train_loss": -8.26702880859375, "global_step": 49505, "epoch": 294} {"train_loss": -8.334981918334961, "global_step": 49506, "epoch": 294} {"train_loss": -8.248607635498047, "global_step": 49507, "epoch": 294} {"train_loss": -8.279489517211914, "global_step": 49508, "epoch": 294} {"train_loss": -8.362127304077148, "global_step": 49509, "epoch": 294} {"train_loss": -8.340190887451172, "global_step": 49510, "epoch": 294} {"train_loss": -8.289907455444336, "global_step": 49511, "epoch": 294} {"train_loss": -8.49677848815918, "global_step": 49512, "epoch": 294} {"train_loss": -8.305079460144043, "global_step": 49513, "epoch": 294} {"train_loss": -8.247762680053711, "global_step": 49514, "epoch": 294} {"train_loss": -8.449674606323242, "global_step": 49515, "epoch": 294} {"train_loss": -8.344764709472656, "global_step": 49516, "epoch": 294} {"train_loss": -8.484223365783691, "global_step": 49517, "epoch": 294} {"train_loss": -8.304618835449219, "global_step": 49518, "epoch": 294} {"train_loss": -8.711711883544922, "global_step": 49519, "epoch": 294} {"train_loss": -8.520964622497559, "global_step": 49520, "epoch": 294} {"train_loss": -8.510904312133789, "global_step": 49521, "epoch": 294} {"train_loss": -8.504316329956055, "global_step": 49522, "epoch": 294} {"train_loss": -8.374375343322754, "global_step": 49523, "epoch": 294} {"train_loss": -8.699911117553711, "global_step": 49524, "epoch": 294} {"train_loss": -8.518976211547852, "global_step": 49525, "epoch": 294} {"train_loss": -8.367155075073242, "global_step": 49526, "epoch": 294} {"train_loss": -8.430242538452148, "global_step": 49527, "epoch": 294} {"train_loss": -8.443225860595703, "global_step": 49528, "epoch": 294} {"train_loss": -8.466405868530273, "global_step": 49529, "epoch": 294} {"train_loss": -8.521965026855469, "global_step": 49530, "epoch": 294} {"train_loss": -8.384833335876465, "global_step": 49531, "epoch": 294} {"train_loss": -8.531760215759277, "global_step": 49532, "epoch": 294} {"train_loss": -8.417661666870117, "global_step": 49533, "epoch": 294} {"train_loss": -7.88372802734375, "global_step": 49534, "epoch": 294} {"train_loss": -8.4793701171875, "global_step": 49535, "epoch": 294} {"train_loss": -8.327000617980957, "global_step": 49536, "epoch": 294} {"train_loss": -7.976154804229736, "global_step": 49537, "epoch": 294} {"train_loss": -8.328924179077148, "global_step": 49538, "epoch": 294} {"train_loss": -8.27546501159668, "global_step": 49539, "epoch": 294} {"train_loss": -8.162696838378906, "global_step": 49540, "epoch": 294} {"train_loss": -8.372315406799316, "global_step": 49541, "epoch": 294} {"train_loss": -8.124359130859375, "global_step": 49542, "epoch": 294} {"train_loss": -7.968888759613037, "global_step": 49543, "epoch": 294} {"train_loss": -8.114628791809082, "global_step": 49544, "epoch": 294} {"train_loss": -8.219618797302246, "global_step": 49545, "epoch": 294} {"train_loss": -8.161293029785156, "global_step": 49546, "epoch": 294} {"train_loss": -8.176387786865234, "global_step": 49547, "epoch": 294} {"train_loss": -8.168317794799805, "global_step": 49548, "epoch": 294} {"train_loss": -8.327030181884766, "global_step": 49549, "epoch": 294} {"train_loss": -8.09921932220459, "global_step": 49550, "epoch": 294} {"train_loss": -8.24705696105957, "global_step": 49551, "epoch": 294} {"train_loss": -8.397900581359863, "global_step": 49552, "epoch": 294} {"train_loss": -8.22608470916748, "global_step": 49553, "epoch": 294} {"train_loss": -8.313304901123047, "global_step": 49554, "epoch": 294} {"train_loss": -8.24492359161377, "global_step": 49555, "epoch": 294} {"train_loss": -7.88243293762207, "global_step": 49556, "epoch": 294} {"train_loss": -8.17496109008789, "global_step": 49557, "epoch": 294} {"train_loss": -8.237792015075684, "global_step": 49558, "epoch": 294} {"train_loss": -8.268508823145003, "global_step": 49559, "epoch": 294, "val_loss": 189528.765625} {"train_loss": -7.9910688400268555, "global_step": 49560, "epoch": 295} {"train_loss": -8.329837799072266, "global_step": 49561, "epoch": 295} {"train_loss": -8.421502113342285, "global_step": 49562, "epoch": 295} {"train_loss": -8.174352645874023, "global_step": 49563, "epoch": 295} {"train_loss": -8.349151611328125, "global_step": 49564, "epoch": 295} {"train_loss": -8.318321228027344, "global_step": 49565, "epoch": 295} {"train_loss": -8.192408561706543, "global_step": 49566, "epoch": 295} {"train_loss": -8.04796028137207, "global_step": 49567, "epoch": 295} {"train_loss": -8.606327056884766, "global_step": 49568, "epoch": 295} {"train_loss": -8.428398132324219, "global_step": 49569, "epoch": 295} {"train_loss": -8.565913200378418, "global_step": 49570, "epoch": 295} {"train_loss": -8.251824378967285, "global_step": 49571, "epoch": 295} {"train_loss": -8.247036933898926, "global_step": 49572, "epoch": 295} {"train_loss": -8.524320602416992, "global_step": 49573, "epoch": 295} {"train_loss": -8.311811447143555, "global_step": 49574, "epoch": 295} {"train_loss": -8.508103370666504, "global_step": 49575, "epoch": 295} {"train_loss": -8.329099655151367, "global_step": 49576, "epoch": 295} {"train_loss": -8.010774612426758, "global_step": 49577, "epoch": 295} {"train_loss": -8.303918838500977, "global_step": 49578, "epoch": 295} {"train_loss": -8.205214500427246, "global_step": 49579, "epoch": 295} {"train_loss": -8.14307975769043, "global_step": 49580, "epoch": 295} {"train_loss": -8.513872146606445, "global_step": 49581, "epoch": 295} {"train_loss": -8.209379196166992, "global_step": 49582, "epoch": 295} {"train_loss": -8.076821327209473, "global_step": 49583, "epoch": 295} {"train_loss": -8.504576683044434, "global_step": 49584, "epoch": 295} {"train_loss": -8.336502075195312, "global_step": 49585, "epoch": 295} {"train_loss": -8.109130859375, "global_step": 49586, "epoch": 295} {"train_loss": -8.341558456420898, "global_step": 49587, "epoch": 295} {"train_loss": -8.089884757995605, "global_step": 49588, "epoch": 295} {"train_loss": -8.098821640014648, "global_step": 49589, "epoch": 295} {"train_loss": -8.301668167114258, "global_step": 49590, "epoch": 295} {"train_loss": -8.075765609741211, "global_step": 49591, "epoch": 295} {"train_loss": -8.229120254516602, "global_step": 49592, "epoch": 295} {"train_loss": -8.360786437988281, "global_step": 49593, "epoch": 295} {"train_loss": -8.05109977722168, "global_step": 49594, "epoch": 295} {"train_loss": -7.932956695556641, "global_step": 49595, "epoch": 295} {"train_loss": -8.031702995300293, "global_step": 49596, "epoch": 295} {"train_loss": -8.21308708190918, "global_step": 49597, "epoch": 295} {"train_loss": -8.126059532165527, "global_step": 49598, "epoch": 295} {"train_loss": -7.681983470916748, "global_step": 49599, "epoch": 295} {"train_loss": -8.323751449584961, "global_step": 49600, "epoch": 295} {"train_loss": -8.337027549743652, "global_step": 49601, "epoch": 295} {"train_loss": -7.962557792663574, "global_step": 49602, "epoch": 295} {"train_loss": -8.087137222290039, "global_step": 49603, "epoch": 295} {"train_loss": -8.432741165161133, "global_step": 49604, "epoch": 295} {"train_loss": -8.146267890930176, "global_step": 49605, "epoch": 295} {"train_loss": -7.817618370056152, "global_step": 49606, "epoch": 295} {"train_loss": -8.392330169677734, "global_step": 49607, "epoch": 295} {"train_loss": -8.24772834777832, "global_step": 49608, "epoch": 295} {"train_loss": -8.238982200622559, "global_step": 49609, "epoch": 295} {"train_loss": -8.489595413208008, "global_step": 49610, "epoch": 295} {"train_loss": -8.376323699951172, "global_step": 49611, "epoch": 295} {"train_loss": -8.20650577545166, "global_step": 49612, "epoch": 295} {"train_loss": -8.194729804992676, "global_step": 49613, "epoch": 295} {"train_loss": -8.259294509887695, "global_step": 49614, "epoch": 295} {"train_loss": -8.173833847045898, "global_step": 49615, "epoch": 295} {"train_loss": -8.338748931884766, "global_step": 49616, "epoch": 295} {"train_loss": -8.408842086791992, "global_step": 49617, "epoch": 295} {"train_loss": -8.418018341064453, "global_step": 49618, "epoch": 295} {"train_loss": -8.346229553222656, "global_step": 49619, "epoch": 295} {"train_loss": -8.463918685913086, "global_step": 49620, "epoch": 295} {"train_loss": -8.494531631469727, "global_step": 49621, "epoch": 295} {"train_loss": -8.443904876708984, "global_step": 49622, "epoch": 295} {"train_loss": -8.528183937072754, "global_step": 49623, "epoch": 295} {"train_loss": -8.414510726928711, "global_step": 49624, "epoch": 295} {"train_loss": -8.496194839477539, "global_step": 49625, "epoch": 295} {"train_loss": -8.331402778625488, "global_step": 49626, "epoch": 295} {"train_loss": -8.180183410644531, "global_step": 49627, "epoch": 295} {"train_loss": -8.300323486328125, "global_step": 49628, "epoch": 295} {"train_loss": -8.265764236450195, "global_step": 49629, "epoch": 295} {"train_loss": -8.518598556518555, "global_step": 49630, "epoch": 295} {"train_loss": -8.081828117370605, "global_step": 49631, "epoch": 295} {"train_loss": -8.563787460327148, "global_step": 49632, "epoch": 295} {"train_loss": -8.146833419799805, "global_step": 49633, "epoch": 295} {"train_loss": -8.036857604980469, "global_step": 49634, "epoch": 295} {"train_loss": -8.001995086669922, "global_step": 49635, "epoch": 295} {"train_loss": -7.788918495178223, "global_step": 49636, "epoch": 295} {"train_loss": -7.987113952636719, "global_step": 49637, "epoch": 295} {"train_loss": -7.8890180587768555, "global_step": 49638, "epoch": 295} {"train_loss": -7.945760726928711, "global_step": 49639, "epoch": 295} {"train_loss": -7.725212097167969, "global_step": 49640, "epoch": 295} {"train_loss": -7.8336567878723145, "global_step": 49641, "epoch": 295} {"train_loss": -7.913747787475586, "global_step": 49642, "epoch": 295} {"train_loss": -7.730349063873291, "global_step": 49643, "epoch": 295} {"train_loss": -8.092826843261719, "global_step": 49644, "epoch": 295} {"train_loss": -7.8796234130859375, "global_step": 49645, "epoch": 295} {"train_loss": -8.210108757019043, "global_step": 49646, "epoch": 295} {"train_loss": -7.8859782218933105, "global_step": 49647, "epoch": 295} {"train_loss": -7.9610114097595215, "global_step": 49648, "epoch": 295} {"train_loss": -8.058881759643555, "global_step": 49649, "epoch": 295} {"train_loss": -7.987248420715332, "global_step": 49650, "epoch": 295} {"train_loss": -8.104089736938477, "global_step": 49651, "epoch": 295} {"train_loss": -8.191903114318848, "global_step": 49652, "epoch": 295} {"train_loss": -8.06594467163086, "global_step": 49653, "epoch": 295} {"train_loss": -8.371065139770508, "global_step": 49654, "epoch": 295} {"train_loss": -8.228461265563965, "global_step": 49655, "epoch": 295} {"train_loss": -8.248531341552734, "global_step": 49656, "epoch": 295} {"train_loss": -8.243393898010254, "global_step": 49657, "epoch": 295} {"train_loss": -8.190620422363281, "global_step": 49658, "epoch": 295} {"train_loss": -8.25072956085205, "global_step": 49659, "epoch": 295} {"train_loss": -8.31103229522705, "global_step": 49660, "epoch": 295} {"train_loss": -8.21351432800293, "global_step": 49661, "epoch": 295} {"train_loss": -8.3487548828125, "global_step": 49662, "epoch": 295} {"train_loss": -8.297828674316406, "global_step": 49663, "epoch": 295} {"train_loss": -8.372469902038574, "global_step": 49664, "epoch": 295} {"train_loss": -8.255053520202637, "global_step": 49665, "epoch": 295} {"train_loss": -8.53078842163086, "global_step": 49666, "epoch": 295} {"train_loss": -8.534624099731445, "global_step": 49667, "epoch": 295} {"train_loss": -8.30637264251709, "global_step": 49668, "epoch": 295} {"train_loss": -8.581526756286621, "global_step": 49669, "epoch": 295} {"train_loss": -8.143658638000488, "global_step": 49670, "epoch": 295} {"train_loss": -8.43813705444336, "global_step": 49671, "epoch": 295} {"train_loss": -8.055595397949219, "global_step": 49672, "epoch": 295} {"train_loss": -8.409780502319336, "global_step": 49673, "epoch": 295} {"train_loss": -7.897736072540283, "global_step": 49674, "epoch": 295} {"train_loss": -8.27185344696045, "global_step": 49675, "epoch": 295} {"train_loss": -7.973919868469238, "global_step": 49676, "epoch": 295} {"train_loss": -8.0364990234375, "global_step": 49677, "epoch": 295} {"train_loss": -8.026790618896484, "global_step": 49678, "epoch": 295} {"train_loss": -8.019004821777344, "global_step": 49679, "epoch": 295} {"train_loss": -7.939089775085449, "global_step": 49680, "epoch": 295} {"train_loss": -8.216314315795898, "global_step": 49681, "epoch": 295} {"train_loss": -8.131851196289062, "global_step": 49682, "epoch": 295} {"train_loss": -8.015478134155273, "global_step": 49683, "epoch": 295} {"train_loss": -8.1785888671875, "global_step": 49684, "epoch": 295} {"train_loss": -8.186748504638672, "global_step": 49685, "epoch": 295} {"train_loss": -8.193485260009766, "global_step": 49686, "epoch": 295} {"train_loss": -8.083660125732422, "global_step": 49687, "epoch": 295} {"train_loss": -8.258255004882812, "global_step": 49688, "epoch": 295} {"train_loss": -8.254308700561523, "global_step": 49689, "epoch": 295} {"train_loss": -8.171966552734375, "global_step": 49690, "epoch": 295} {"train_loss": -8.194249153137207, "global_step": 49691, "epoch": 295} {"train_loss": -8.057634353637695, "global_step": 49692, "epoch": 295} {"train_loss": -8.115428924560547, "global_step": 49693, "epoch": 295} {"train_loss": -8.370248794555664, "global_step": 49694, "epoch": 295} {"train_loss": -8.331891059875488, "global_step": 49695, "epoch": 295} {"train_loss": -8.301459312438965, "global_step": 49696, "epoch": 295} {"train_loss": -8.355913162231445, "global_step": 49697, "epoch": 295} {"train_loss": -8.224895477294922, "global_step": 49698, "epoch": 295} {"train_loss": -8.1639986038208, "global_step": 49699, "epoch": 295} {"train_loss": -8.485648155212402, "global_step": 49700, "epoch": 295} {"train_loss": -8.301702499389648, "global_step": 49701, "epoch": 295} {"train_loss": -8.567588806152344, "global_step": 49702, "epoch": 295} {"train_loss": -8.169205665588379, "global_step": 49703, "epoch": 295} {"train_loss": -8.611812591552734, "global_step": 49704, "epoch": 295} {"train_loss": -8.425764083862305, "global_step": 49705, "epoch": 295} {"train_loss": -8.417367935180664, "global_step": 49706, "epoch": 295} {"train_loss": -8.39715576171875, "global_step": 49707, "epoch": 295} {"train_loss": -8.53614616394043, "global_step": 49708, "epoch": 295} {"train_loss": -8.454996109008789, "global_step": 49709, "epoch": 295} {"train_loss": -8.447561264038086, "global_step": 49710, "epoch": 295} {"train_loss": -8.609549522399902, "global_step": 49711, "epoch": 295} {"train_loss": -8.214178085327148, "global_step": 49712, "epoch": 295} {"train_loss": -8.495379447937012, "global_step": 49713, "epoch": 295} {"train_loss": -8.447153091430664, "global_step": 49714, "epoch": 295} {"train_loss": -8.656303405761719, "global_step": 49715, "epoch": 295} {"train_loss": -8.35065746307373, "global_step": 49716, "epoch": 295} {"train_loss": -8.380097389221191, "global_step": 49717, "epoch": 295} {"train_loss": -7.8686699867248535, "global_step": 49718, "epoch": 295} {"train_loss": -8.072304725646973, "global_step": 49719, "epoch": 295} {"train_loss": -8.228740692138672, "global_step": 49720, "epoch": 295} {"train_loss": -8.246406555175781, "global_step": 49721, "epoch": 295} {"train_loss": -8.027203559875488, "global_step": 49722, "epoch": 295} {"train_loss": -8.289261817932129, "global_step": 49723, "epoch": 295} {"train_loss": -8.432246208190918, "global_step": 49724, "epoch": 295} {"train_loss": -8.224363327026367, "global_step": 49725, "epoch": 295} {"train_loss": -8.25242805480957, "global_step": 49726, "epoch": 295} {"train_loss": -8.235396121229444, "global_step": 49727, "epoch": 295, "val_loss": 187669.609375, "train_action_mse_error": 8.06771469116211} {"train_loss": -8.17763614654541, "global_step": 49728, "epoch": 296} {"train_loss": -8.33759593963623, "global_step": 49729, "epoch": 296} {"train_loss": -8.409339904785156, "global_step": 49730, "epoch": 296} {"train_loss": -8.449777603149414, "global_step": 49731, "epoch": 296} {"train_loss": -8.327055931091309, "global_step": 49732, "epoch": 296} {"train_loss": -8.21629524230957, "global_step": 49733, "epoch": 296} {"train_loss": -8.368824005126953, "global_step": 49734, "epoch": 296} {"train_loss": -8.5385103225708, "global_step": 49735, "epoch": 296} {"train_loss": -8.691431045532227, "global_step": 49736, "epoch": 296} {"train_loss": -8.494357109069824, "global_step": 49737, "epoch": 296} {"train_loss": -8.233601570129395, "global_step": 49738, "epoch": 296} {"train_loss": -8.2625732421875, "global_step": 49739, "epoch": 296} {"train_loss": -8.155771255493164, "global_step": 49740, "epoch": 296} {"train_loss": -8.317913055419922, "global_step": 49741, "epoch": 296} {"train_loss": -8.431121826171875, "global_step": 49742, "epoch": 296} {"train_loss": -8.329233169555664, "global_step": 49743, "epoch": 296} {"train_loss": -8.405996322631836, "global_step": 49744, "epoch": 296} {"train_loss": -8.318658828735352, "global_step": 49745, "epoch": 296} {"train_loss": -8.520463943481445, "global_step": 49746, "epoch": 296} {"train_loss": -8.4367036819458, "global_step": 49747, "epoch": 296} {"train_loss": -8.09461784362793, "global_step": 49748, "epoch": 296} {"train_loss": -8.315682411193848, "global_step": 49749, "epoch": 296} {"train_loss": -8.337000846862793, "global_step": 49750, "epoch": 296} {"train_loss": -8.4267578125, "global_step": 49751, "epoch": 296} {"train_loss": -8.299032211303711, "global_step": 49752, "epoch": 296} {"train_loss": -8.35468578338623, "global_step": 49753, "epoch": 296} {"train_loss": -8.48385238647461, "global_step": 49754, "epoch": 296} {"train_loss": -8.412483215332031, "global_step": 49755, "epoch": 296} {"train_loss": -8.107094764709473, "global_step": 49756, "epoch": 296} {"train_loss": -8.249678611755371, "global_step": 49757, "epoch": 296} {"train_loss": -8.291528701782227, "global_step": 49758, "epoch": 296} {"train_loss": -8.127188682556152, "global_step": 49759, "epoch": 296} {"train_loss": -8.060847282409668, "global_step": 49760, "epoch": 296} {"train_loss": -8.214682579040527, "global_step": 49761, "epoch": 296} {"train_loss": -7.9811320304870605, "global_step": 49762, "epoch": 296} {"train_loss": -7.824868202209473, "global_step": 49763, "epoch": 296} {"train_loss": -8.339914321899414, "global_step": 49764, "epoch": 296} {"train_loss": -8.067115783691406, "global_step": 49765, "epoch": 296} {"train_loss": -8.143768310546875, "global_step": 49766, "epoch": 296} {"train_loss": -8.286195755004883, "global_step": 49767, "epoch": 296} {"train_loss": -8.171869277954102, "global_step": 49768, "epoch": 296} {"train_loss": -7.982836723327637, "global_step": 49769, "epoch": 296} {"train_loss": -8.118124008178711, "global_step": 49770, "epoch": 296} {"train_loss": -8.201400756835938, "global_step": 49771, "epoch": 296} {"train_loss": -8.360041618347168, "global_step": 49772, "epoch": 296} {"train_loss": -8.191783905029297, "global_step": 49773, "epoch": 296} {"train_loss": -8.363999366760254, "global_step": 49774, "epoch": 296} {"train_loss": -8.263225555419922, "global_step": 49775, "epoch": 296} {"train_loss": -8.229182243347168, "global_step": 49776, "epoch": 296} {"train_loss": -8.320899963378906, "global_step": 49777, "epoch": 296} {"train_loss": -8.373514175415039, "global_step": 49778, "epoch": 296} {"train_loss": -8.37191390991211, "global_step": 49779, "epoch": 296} {"train_loss": -8.167332649230957, "global_step": 49780, "epoch": 296} {"train_loss": -8.463403701782227, "global_step": 49781, "epoch": 296} {"train_loss": -8.480506896972656, "global_step": 49782, "epoch": 296} {"train_loss": -8.393390655517578, "global_step": 49783, "epoch": 296} {"train_loss": -8.329586029052734, "global_step": 49784, "epoch": 296} {"train_loss": -8.331511497497559, "global_step": 49785, "epoch": 296} {"train_loss": -8.497761726379395, "global_step": 49786, "epoch": 296} {"train_loss": -8.369877815246582, "global_step": 49787, "epoch": 296} {"train_loss": -8.560991287231445, "global_step": 49788, "epoch": 296} {"train_loss": -8.413594245910645, "global_step": 49789, "epoch": 296} {"train_loss": -8.516468048095703, "global_step": 49790, "epoch": 296} {"train_loss": -8.359496116638184, "global_step": 49791, "epoch": 296} {"train_loss": -8.46146011352539, "global_step": 49792, "epoch": 296} {"train_loss": -8.338869094848633, "global_step": 49793, "epoch": 296} {"train_loss": -8.519367218017578, "global_step": 49794, "epoch": 296} {"train_loss": -8.30570125579834, "global_step": 49795, "epoch": 296} {"train_loss": -8.560054779052734, "global_step": 49796, "epoch": 296} {"train_loss": -8.399322509765625, "global_step": 49797, "epoch": 296} {"train_loss": -8.450180053710938, "global_step": 49798, "epoch": 296} {"train_loss": -8.561275482177734, "global_step": 49799, "epoch": 296} {"train_loss": -8.468990325927734, "global_step": 49800, "epoch": 296} {"train_loss": -8.526522636413574, "global_step": 49801, "epoch": 296} {"train_loss": -8.380267143249512, "global_step": 49802, "epoch": 296} {"train_loss": -8.25943374633789, "global_step": 49803, "epoch": 296} {"train_loss": -8.41379165649414, "global_step": 49804, "epoch": 296} {"train_loss": -8.342470169067383, "global_step": 49805, "epoch": 296} {"train_loss": -7.894674301147461, "global_step": 49806, "epoch": 296} {"train_loss": -8.271366119384766, "global_step": 49807, "epoch": 296} {"train_loss": -7.987178802490234, "global_step": 49808, "epoch": 296} {"train_loss": -8.246947288513184, "global_step": 49809, "epoch": 296} {"train_loss": -8.266489028930664, "global_step": 49810, "epoch": 296} {"train_loss": -8.270004272460938, "global_step": 49811, "epoch": 296} {"train_loss": -8.133838653564453, "global_step": 49812, "epoch": 296} {"train_loss": -8.070718765258789, "global_step": 49813, "epoch": 296} {"train_loss": -8.21898078918457, "global_step": 49814, "epoch": 296} {"train_loss": -8.31917667388916, "global_step": 49815, "epoch": 296} {"train_loss": -8.467597961425781, "global_step": 49816, "epoch": 296} {"train_loss": -8.278952598571777, "global_step": 49817, "epoch": 296} {"train_loss": -8.1216402053833, "global_step": 49818, "epoch": 296} {"train_loss": -8.269487380981445, "global_step": 49819, "epoch": 296} {"train_loss": -8.570690155029297, "global_step": 49820, "epoch": 296} {"train_loss": -8.188748359680176, "global_step": 49821, "epoch": 296} {"train_loss": -8.432718276977539, "global_step": 49822, "epoch": 296} {"train_loss": -8.257255554199219, "global_step": 49823, "epoch": 296} {"train_loss": -8.357547760009766, "global_step": 49824, "epoch": 296} {"train_loss": -8.106348037719727, "global_step": 49825, "epoch": 296} {"train_loss": -7.95904541015625, "global_step": 49826, "epoch": 296} {"train_loss": -7.857187271118164, "global_step": 49827, "epoch": 296} {"train_loss": -8.182037353515625, "global_step": 49828, "epoch": 296} {"train_loss": -7.678947448730469, "global_step": 49829, "epoch": 296} {"train_loss": -7.876382350921631, "global_step": 49830, "epoch": 296} {"train_loss": -8.034687042236328, "global_step": 49831, "epoch": 296} {"train_loss": -7.981597900390625, "global_step": 49832, "epoch": 296} {"train_loss": -7.883086204528809, "global_step": 49833, "epoch": 296} {"train_loss": -7.9279632568359375, "global_step": 49834, "epoch": 296} {"train_loss": -8.125922203063965, "global_step": 49835, "epoch": 296} {"train_loss": -8.048999786376953, "global_step": 49836, "epoch": 296} {"train_loss": -8.260675430297852, "global_step": 49837, "epoch": 296} {"train_loss": -8.21902084350586, "global_step": 49838, "epoch": 296} {"train_loss": -8.148693084716797, "global_step": 49839, "epoch": 296} {"train_loss": -8.206350326538086, "global_step": 49840, "epoch": 296} {"train_loss": -8.310920715332031, "global_step": 49841, "epoch": 296} {"train_loss": -8.185566902160645, "global_step": 49842, "epoch": 296} {"train_loss": -8.386608123779297, "global_step": 49843, "epoch": 296} {"train_loss": -8.338600158691406, "global_step": 49844, "epoch": 296} {"train_loss": -8.160998344421387, "global_step": 49845, "epoch": 296} {"train_loss": -8.316471099853516, "global_step": 49846, "epoch": 296} {"train_loss": -8.269744873046875, "global_step": 49847, "epoch": 296} {"train_loss": -8.40019702911377, "global_step": 49848, "epoch": 296} {"train_loss": -8.125377655029297, "global_step": 49849, "epoch": 296} {"train_loss": -8.19926929473877, "global_step": 49850, "epoch": 296} {"train_loss": -8.381736755371094, "global_step": 49851, "epoch": 296} {"train_loss": -8.196839332580566, "global_step": 49852, "epoch": 296} {"train_loss": -8.245248794555664, "global_step": 49853, "epoch": 296} {"train_loss": -8.377035140991211, "global_step": 49854, "epoch": 296} {"train_loss": -8.256844520568848, "global_step": 49855, "epoch": 296} {"train_loss": -8.308650970458984, "global_step": 49856, "epoch": 296} {"train_loss": -8.346467018127441, "global_step": 49857, "epoch": 296} {"train_loss": -8.273824691772461, "global_step": 49858, "epoch": 296} {"train_loss": -8.405807495117188, "global_step": 49859, "epoch": 296} {"train_loss": -8.60604190826416, "global_step": 49860, "epoch": 296} {"train_loss": -8.340325355529785, "global_step": 49861, "epoch": 296} {"train_loss": -8.265987396240234, "global_step": 49862, "epoch": 296} {"train_loss": -8.10009479522705, "global_step": 49863, "epoch": 296} {"train_loss": -8.449944496154785, "global_step": 49864, "epoch": 296} {"train_loss": -8.121277809143066, "global_step": 49865, "epoch": 296} {"train_loss": -8.095428466796875, "global_step": 49866, "epoch": 296} {"train_loss": -8.188898086547852, "global_step": 49867, "epoch": 296} {"train_loss": -8.028207778930664, "global_step": 49868, "epoch": 296} {"train_loss": -8.104215621948242, "global_step": 49869, "epoch": 296} {"train_loss": -8.163063049316406, "global_step": 49870, "epoch": 296} {"train_loss": -7.917480945587158, "global_step": 49871, "epoch": 296} {"train_loss": -8.228948593139648, "global_step": 49872, "epoch": 296} {"train_loss": -7.892972469329834, "global_step": 49873, "epoch": 296} {"train_loss": -7.911066055297852, "global_step": 49874, "epoch": 296} {"train_loss": -7.750337600708008, "global_step": 49875, "epoch": 296} {"train_loss": -7.969769477844238, "global_step": 49876, "epoch": 296} {"train_loss": -7.973438739776611, "global_step": 49877, "epoch": 296} {"train_loss": -8.00639820098877, "global_step": 49878, "epoch": 296} {"train_loss": -7.85505485534668, "global_step": 49879, "epoch": 296} {"train_loss": -8.092522621154785, "global_step": 49880, "epoch": 296} {"train_loss": -8.080610275268555, "global_step": 49881, "epoch": 296} {"train_loss": -7.839635848999023, "global_step": 49882, "epoch": 296} {"train_loss": -8.168001174926758, "global_step": 49883, "epoch": 296} {"train_loss": -8.046085357666016, "global_step": 49884, "epoch": 296} {"train_loss": -7.963972568511963, "global_step": 49885, "epoch": 296} {"train_loss": -8.07876968383789, "global_step": 49886, "epoch": 296} {"train_loss": -8.118528366088867, "global_step": 49887, "epoch": 296} {"train_loss": -8.192373275756836, "global_step": 49888, "epoch": 296} {"train_loss": -8.323934555053711, "global_step": 49889, "epoch": 296} {"train_loss": -8.272157669067383, "global_step": 49890, "epoch": 296} {"train_loss": -8.327339172363281, "global_step": 49891, "epoch": 296} {"train_loss": -8.301380157470703, "global_step": 49892, "epoch": 296} {"train_loss": -8.271824836730957, "global_step": 49893, "epoch": 296} {"train_loss": -7.940920352935791, "global_step": 49894, "epoch": 296} {"train_loss": -8.24210489647729, "global_step": 49895, "epoch": 296, "val_loss": 188716.015625} {"train_loss": -8.412874221801758, "global_step": 49896, "epoch": 297} {"train_loss": -8.37510871887207, "global_step": 49897, "epoch": 297} {"train_loss": -8.350215911865234, "global_step": 49898, "epoch": 297} {"train_loss": -8.454158782958984, "global_step": 49899, "epoch": 297} {"train_loss": -8.115488052368164, "global_step": 49900, "epoch": 297} {"train_loss": -8.448628425598145, "global_step": 49901, "epoch": 297} {"train_loss": -8.03671932220459, "global_step": 49902, "epoch": 297} {"train_loss": -8.365259170532227, "global_step": 49903, "epoch": 297} {"train_loss": -8.319806098937988, "global_step": 49904, "epoch": 297} {"train_loss": -8.50611400604248, "global_step": 49905, "epoch": 297} {"train_loss": -8.446125030517578, "global_step": 49906, "epoch": 297} {"train_loss": -8.315441131591797, "global_step": 49907, "epoch": 297} {"train_loss": -8.477872848510742, "global_step": 49908, "epoch": 297} {"train_loss": -8.290326118469238, "global_step": 49909, "epoch": 297} {"train_loss": -8.500336647033691, "global_step": 49910, "epoch": 297} {"train_loss": -8.732041358947754, "global_step": 49911, "epoch": 297} {"train_loss": -8.349191665649414, "global_step": 49912, "epoch": 297} {"train_loss": -8.288053512573242, "global_step": 49913, "epoch": 297} {"train_loss": -8.222192764282227, "global_step": 49914, "epoch": 297} {"train_loss": -8.462603569030762, "global_step": 49915, "epoch": 297} {"train_loss": -8.462899208068848, "global_step": 49916, "epoch": 297} {"train_loss": -8.468412399291992, "global_step": 49917, "epoch": 297} {"train_loss": -8.422638893127441, "global_step": 49918, "epoch": 297} {"train_loss": -8.161274909973145, "global_step": 49919, "epoch": 297} {"train_loss": -8.332805633544922, "global_step": 49920, "epoch": 297} {"train_loss": -8.490477561950684, "global_step": 49921, "epoch": 297} {"train_loss": -8.440624237060547, "global_step": 49922, "epoch": 297} {"train_loss": -8.16232681274414, "global_step": 49923, "epoch": 297} {"train_loss": -8.311124801635742, "global_step": 49924, "epoch": 297} {"train_loss": -8.421039581298828, "global_step": 49925, "epoch": 297} {"train_loss": -8.334857940673828, "global_step": 49926, "epoch": 297} {"train_loss": -8.44371223449707, "global_step": 49927, "epoch": 297} {"train_loss": -8.50106430053711, "global_step": 49928, "epoch": 297} {"train_loss": -8.368365287780762, "global_step": 49929, "epoch": 297} {"train_loss": -8.333303451538086, "global_step": 49930, "epoch": 297} {"train_loss": -8.25168228149414, "global_step": 49931, "epoch": 297} {"train_loss": -8.38198184967041, "global_step": 49932, "epoch": 297} {"train_loss": -8.447344779968262, "global_step": 49933, "epoch": 297} {"train_loss": -8.487405776977539, "global_step": 49934, "epoch": 297} {"train_loss": -8.270669937133789, "global_step": 49935, "epoch": 297} {"train_loss": -8.329461097717285, "global_step": 49936, "epoch": 297} {"train_loss": -8.3983154296875, "global_step": 49937, "epoch": 297} {"train_loss": -8.14305305480957, "global_step": 49938, "epoch": 297} {"train_loss": -8.396240234375, "global_step": 49939, "epoch": 297} {"train_loss": -8.359853744506836, "global_step": 49940, "epoch": 297} {"train_loss": -8.368388175964355, "global_step": 49941, "epoch": 297} {"train_loss": -8.559365272521973, "global_step": 49942, "epoch": 297} {"train_loss": -8.279764175415039, "global_step": 49943, "epoch": 297} {"train_loss": -8.46908187866211, "global_step": 49944, "epoch": 297} {"train_loss": -8.300642013549805, "global_step": 49945, "epoch": 297} {"train_loss": -8.325117111206055, "global_step": 49946, "epoch": 297} {"train_loss": -8.33474349975586, "global_step": 49947, "epoch": 297} {"train_loss": -8.270832061767578, "global_step": 49948, "epoch": 297} {"train_loss": -8.160362243652344, "global_step": 49949, "epoch": 297} {"train_loss": -8.46094799041748, "global_step": 49950, "epoch": 297} {"train_loss": -8.334203720092773, "global_step": 49951, "epoch": 297} {"train_loss": -8.468376159667969, "global_step": 49952, "epoch": 297} {"train_loss": -8.28896713256836, "global_step": 49953, "epoch": 297} {"train_loss": -8.295902252197266, "global_step": 49954, "epoch": 297} {"train_loss": -8.384149551391602, "global_step": 49955, "epoch": 297} {"train_loss": -8.439410209655762, "global_step": 49956, "epoch": 297} {"train_loss": -8.329986572265625, "global_step": 49957, "epoch": 297} {"train_loss": -8.203140258789062, "global_step": 49958, "epoch": 297} {"train_loss": -8.385969161987305, "global_step": 49959, "epoch": 297} {"train_loss": -8.261225700378418, "global_step": 49960, "epoch": 297} {"train_loss": -8.423479080200195, "global_step": 49961, "epoch": 297} {"train_loss": -8.457082748413086, "global_step": 49962, "epoch": 297} {"train_loss": -8.266904830932617, "global_step": 49963, "epoch": 297} {"train_loss": -8.555805206298828, "global_step": 49964, "epoch": 297} {"train_loss": -8.213882446289062, "global_step": 49965, "epoch": 297} {"train_loss": -8.263978004455566, "global_step": 49966, "epoch": 297} {"train_loss": -8.60167121887207, "global_step": 49967, "epoch": 297} {"train_loss": -8.211085319519043, "global_step": 49968, "epoch": 297} {"train_loss": -8.44386100769043, "global_step": 49969, "epoch": 297} {"train_loss": -8.417240142822266, "global_step": 49970, "epoch": 297} {"train_loss": -8.10015869140625, "global_step": 49971, "epoch": 297} {"train_loss": -8.470670700073242, "global_step": 49972, "epoch": 297} {"train_loss": -7.718141555786133, "global_step": 49973, "epoch": 297} {"train_loss": -8.47443962097168, "global_step": 49974, "epoch": 297} {"train_loss": -8.024807929992676, "global_step": 49975, "epoch": 297} {"train_loss": -8.566558837890625, "global_step": 49976, "epoch": 297} {"train_loss": -8.389041900634766, "global_step": 49977, "epoch": 297} {"train_loss": -8.40183162689209, "global_step": 49978, "epoch": 297} {"train_loss": -8.375797271728516, "global_step": 49979, "epoch": 297} {"train_loss": -8.268499374389648, "global_step": 49980, "epoch": 297} {"train_loss": -8.273902893066406, "global_step": 49981, "epoch": 297} {"train_loss": -8.3964262008667, "global_step": 49982, "epoch": 297} {"train_loss": -8.08802604675293, "global_step": 49983, "epoch": 297} {"train_loss": -8.40771484375, "global_step": 49984, "epoch": 297} {"train_loss": -8.19617748260498, "global_step": 49985, "epoch": 297} {"train_loss": -8.389984130859375, "global_step": 49986, "epoch": 297} {"train_loss": -8.316680908203125, "global_step": 49987, "epoch": 297} {"train_loss": -8.247583389282227, "global_step": 49988, "epoch": 297} {"train_loss": -8.447650909423828, "global_step": 49989, "epoch": 297} {"train_loss": -8.114214897155762, "global_step": 49990, "epoch": 297} {"train_loss": -8.349308013916016, "global_step": 49991, "epoch": 297} {"train_loss": -8.31010913848877, "global_step": 49992, "epoch": 297} {"train_loss": -8.16512393951416, "global_step": 49993, "epoch": 297} {"train_loss": -8.133472442626953, "global_step": 49994, "epoch": 297} {"train_loss": -8.145662307739258, "global_step": 49995, "epoch": 297} {"train_loss": -8.084324836730957, "global_step": 49996, "epoch": 297} {"train_loss": -8.056892395019531, "global_step": 49997, "epoch": 297} {"train_loss": -8.144248962402344, "global_step": 49998, "epoch": 297} {"train_loss": -8.017251968383789, "global_step": 49999, "epoch": 297} {"train_loss": -7.926435470581055, "global_step": 50000, "epoch": 297} {"train_loss": -8.062373161315918, "global_step": 50001, "epoch": 297} {"train_loss": -8.030961990356445, "global_step": 50002, "epoch": 297} {"train_loss": -8.114409446716309, "global_step": 50003, "epoch": 297} {"train_loss": -8.14880657196045, "global_step": 50004, "epoch": 297} {"train_loss": -8.281455993652344, "global_step": 50005, "epoch": 297} {"train_loss": -8.153185844421387, "global_step": 50006, "epoch": 297} {"train_loss": -7.893227577209473, "global_step": 50007, "epoch": 297} {"train_loss": -8.258307456970215, "global_step": 50008, "epoch": 297} {"train_loss": -8.2166166305542, "global_step": 50009, "epoch": 297} {"train_loss": -8.329985618591309, "global_step": 50010, "epoch": 297} {"train_loss": -8.233770370483398, "global_step": 50011, "epoch": 297} {"train_loss": -8.282754898071289, "global_step": 50012, "epoch": 297} {"train_loss": -8.136959075927734, "global_step": 50013, "epoch": 297} {"train_loss": -8.211161613464355, "global_step": 50014, "epoch": 297} {"train_loss": -7.948705673217773, "global_step": 50015, "epoch": 297} {"train_loss": -7.848258018493652, "global_step": 50016, "epoch": 297} {"train_loss": -8.362984657287598, "global_step": 50017, "epoch": 297} {"train_loss": -8.370471954345703, "global_step": 50018, "epoch": 297} {"train_loss": -8.169698715209961, "global_step": 50019, "epoch": 297} {"train_loss": -8.30501651763916, "global_step": 50020, "epoch": 297} {"train_loss": -8.24926471710205, "global_step": 50021, "epoch": 297} {"train_loss": -8.42336654663086, "global_step": 50022, "epoch": 297} {"train_loss": -8.508282661437988, "global_step": 50023, "epoch": 297} {"train_loss": -8.379555702209473, "global_step": 50024, "epoch": 297} {"train_loss": -8.36334228515625, "global_step": 50025, "epoch": 297} {"train_loss": -8.335916519165039, "global_step": 50026, "epoch": 297} {"train_loss": -8.331189155578613, "global_step": 50027, "epoch": 297} {"train_loss": -8.456742286682129, "global_step": 50028, "epoch": 297} {"train_loss": -8.309625625610352, "global_step": 50029, "epoch": 297} {"train_loss": -8.290241241455078, "global_step": 50030, "epoch": 297} {"train_loss": -8.167642593383789, "global_step": 50031, "epoch": 297} {"train_loss": -8.359478950500488, "global_step": 50032, "epoch": 297} {"train_loss": -8.350691795349121, "global_step": 50033, "epoch": 297} {"train_loss": -8.055872917175293, "global_step": 50034, "epoch": 297} {"train_loss": -8.518915176391602, "global_step": 50035, "epoch": 297} {"train_loss": -8.060338020324707, "global_step": 50036, "epoch": 297} {"train_loss": -8.494064331054688, "global_step": 50037, "epoch": 297} {"train_loss": -8.058979034423828, "global_step": 50038, "epoch": 297} {"train_loss": -8.437092781066895, "global_step": 50039, "epoch": 297} {"train_loss": -8.019387245178223, "global_step": 50040, "epoch": 297} {"train_loss": -8.360984802246094, "global_step": 50041, "epoch": 297} {"train_loss": -8.147472381591797, "global_step": 50042, "epoch": 297} {"train_loss": -8.3840970993042, "global_step": 50043, "epoch": 297} {"train_loss": -8.2788724899292, "global_step": 50044, "epoch": 297} {"train_loss": -8.328593254089355, "global_step": 50045, "epoch": 297} {"train_loss": -8.351282119750977, "global_step": 50046, "epoch": 297} {"train_loss": -7.983669281005859, "global_step": 50047, "epoch": 297} {"train_loss": -7.98539924621582, "global_step": 50048, "epoch": 297} {"train_loss": -8.180777549743652, "global_step": 50049, "epoch": 297} {"train_loss": -8.21544075012207, "global_step": 50050, "epoch": 297} {"train_loss": -8.176477432250977, "global_step": 50051, "epoch": 297} {"train_loss": -7.998093605041504, "global_step": 50052, "epoch": 297} {"train_loss": -7.723006725311279, "global_step": 50053, "epoch": 297} {"train_loss": -8.458338737487793, "global_step": 50054, "epoch": 297} {"train_loss": -8.169471740722656, "global_step": 50055, "epoch": 297} {"train_loss": -8.434709548950195, "global_step": 50056, "epoch": 297} {"train_loss": -8.141910552978516, "global_step": 50057, "epoch": 297} {"train_loss": -8.20488166809082, "global_step": 50058, "epoch": 297} {"train_loss": -8.040826797485352, "global_step": 50059, "epoch": 297} {"train_loss": -8.18115234375, "global_step": 50060, "epoch": 297} {"train_loss": -8.266276359558105, "global_step": 50061, "epoch": 297} {"train_loss": -7.981210231781006, "global_step": 50062, "epoch": 297} {"train_loss": -8.286225642476763, "global_step": 50063, "epoch": 297, "val_loss": 186664.4375} {"train_loss": -8.272706031799316, "global_step": 50064, "epoch": 298} {"train_loss": -8.528549194335938, "global_step": 50065, "epoch": 298} {"train_loss": -8.376057624816895, "global_step": 50066, "epoch": 298} {"train_loss": -8.049368858337402, "global_step": 50067, "epoch": 298} {"train_loss": -8.494207382202148, "global_step": 50068, "epoch": 298} {"train_loss": -8.332178115844727, "global_step": 50069, "epoch": 298} {"train_loss": -8.38979721069336, "global_step": 50070, "epoch": 298} {"train_loss": -8.252538681030273, "global_step": 50071, "epoch": 298} {"train_loss": -8.348691940307617, "global_step": 50072, "epoch": 298} {"train_loss": -8.367491722106934, "global_step": 50073, "epoch": 298} {"train_loss": -8.20980167388916, "global_step": 50074, "epoch": 298} {"train_loss": -8.288522720336914, "global_step": 50075, "epoch": 298} {"train_loss": -8.159139633178711, "global_step": 50076, "epoch": 298} {"train_loss": -8.536951065063477, "global_step": 50077, "epoch": 298} {"train_loss": -8.521149635314941, "global_step": 50078, "epoch": 298} {"train_loss": -8.245080947875977, "global_step": 50079, "epoch": 298} {"train_loss": -8.436687469482422, "global_step": 50080, "epoch": 298} {"train_loss": -8.336549758911133, "global_step": 50081, "epoch": 298} {"train_loss": -8.254390716552734, "global_step": 50082, "epoch": 298} {"train_loss": -8.50517463684082, "global_step": 50083, "epoch": 298} {"train_loss": -8.255062103271484, "global_step": 50084, "epoch": 298} {"train_loss": -8.588140487670898, "global_step": 50085, "epoch": 298} {"train_loss": -8.226056098937988, "global_step": 50086, "epoch": 298} {"train_loss": -8.451764106750488, "global_step": 50087, "epoch": 298} {"train_loss": -8.002971649169922, "global_step": 50088, "epoch": 298} {"train_loss": -8.134645462036133, "global_step": 50089, "epoch": 298} {"train_loss": -8.239249229431152, "global_step": 50090, "epoch": 298} {"train_loss": -8.263010025024414, "global_step": 50091, "epoch": 298} {"train_loss": -8.184690475463867, "global_step": 50092, "epoch": 298} {"train_loss": -8.443299293518066, "global_step": 50093, "epoch": 298} {"train_loss": -8.244917869567871, "global_step": 50094, "epoch": 298} {"train_loss": -8.407941818237305, "global_step": 50095, "epoch": 298} {"train_loss": -8.339046478271484, "global_step": 50096, "epoch": 298} {"train_loss": -7.846166610717773, "global_step": 50097, "epoch": 298} {"train_loss": -8.132997512817383, "global_step": 50098, "epoch": 298} {"train_loss": -8.299020767211914, "global_step": 50099, "epoch": 298} {"train_loss": -8.290420532226562, "global_step": 50100, "epoch": 298} {"train_loss": -8.413727760314941, "global_step": 50101, "epoch": 298} {"train_loss": -8.496712684631348, "global_step": 50102, "epoch": 298} {"train_loss": -8.247054100036621, "global_step": 50103, "epoch": 298} {"train_loss": -8.271943092346191, "global_step": 50104, "epoch": 298} {"train_loss": -8.42037296295166, "global_step": 50105, "epoch": 298} {"train_loss": -8.293334007263184, "global_step": 50106, "epoch": 298} {"train_loss": -8.35542106628418, "global_step": 50107, "epoch": 298} {"train_loss": -8.258330345153809, "global_step": 50108, "epoch": 298} {"train_loss": -8.225433349609375, "global_step": 50109, "epoch": 298} {"train_loss": -7.976696014404297, "global_step": 50110, "epoch": 298} {"train_loss": -8.419261932373047, "global_step": 50111, "epoch": 298} {"train_loss": -7.910284996032715, "global_step": 50112, "epoch": 298} {"train_loss": -7.99946928024292, "global_step": 50113, "epoch": 298} {"train_loss": -7.996525287628174, "global_step": 50114, "epoch": 298} {"train_loss": -8.216507911682129, "global_step": 50115, "epoch": 298} {"train_loss": -8.165946960449219, "global_step": 50116, "epoch": 298} {"train_loss": -7.976949214935303, "global_step": 50117, "epoch": 298} {"train_loss": -8.03609561920166, "global_step": 50118, "epoch": 298} {"train_loss": -8.258686065673828, "global_step": 50119, "epoch": 298} {"train_loss": -8.012203216552734, "global_step": 50120, "epoch": 298} {"train_loss": -8.244775772094727, "global_step": 50121, "epoch": 298} {"train_loss": -8.292622566223145, "global_step": 50122, "epoch": 298} {"train_loss": -8.220606803894043, "global_step": 50123, "epoch": 298} {"train_loss": -8.106452941894531, "global_step": 50124, "epoch": 298} {"train_loss": -8.243012428283691, "global_step": 50125, "epoch": 298} {"train_loss": -8.436630249023438, "global_step": 50126, "epoch": 298} {"train_loss": -8.244751930236816, "global_step": 50127, "epoch": 298} {"train_loss": -8.169021606445312, "global_step": 50128, "epoch": 298} {"train_loss": -8.49868392944336, "global_step": 50129, "epoch": 298} {"train_loss": -8.312505722045898, "global_step": 50130, "epoch": 298} {"train_loss": -8.313335418701172, "global_step": 50131, "epoch": 298} {"train_loss": -8.362028121948242, "global_step": 50132, "epoch": 298} {"train_loss": -8.137003898620605, "global_step": 50133, "epoch": 298} {"train_loss": -8.381771087646484, "global_step": 50134, "epoch": 298} {"train_loss": -8.13796615600586, "global_step": 50135, "epoch": 298} {"train_loss": -8.429615020751953, "global_step": 50136, "epoch": 298} {"train_loss": -8.389436721801758, "global_step": 50137, "epoch": 298} {"train_loss": -8.458953857421875, "global_step": 50138, "epoch": 298} {"train_loss": -8.450241088867188, "global_step": 50139, "epoch": 298} {"train_loss": -8.330848693847656, "global_step": 50140, "epoch": 298} {"train_loss": -8.404101371765137, "global_step": 50141, "epoch": 298} {"train_loss": -8.469779968261719, "global_step": 50142, "epoch": 298} {"train_loss": -8.379250526428223, "global_step": 50143, "epoch": 298} {"train_loss": -8.382949829101562, "global_step": 50144, "epoch": 298} {"train_loss": -8.40573501586914, "global_step": 50145, "epoch": 298} {"train_loss": -8.473273277282715, "global_step": 50146, "epoch": 298} {"train_loss": -8.452705383300781, "global_step": 50147, "epoch": 298} {"train_loss": -8.374452590942383, "global_step": 50148, "epoch": 298} {"train_loss": -8.519216537475586, "global_step": 50149, "epoch": 298} {"train_loss": -8.440573692321777, "global_step": 50150, "epoch": 298} {"train_loss": -8.378483772277832, "global_step": 50151, "epoch": 298} {"train_loss": -8.32915210723877, "global_step": 50152, "epoch": 298} {"train_loss": -8.470458030700684, "global_step": 50153, "epoch": 298} {"train_loss": -8.468413352966309, "global_step": 50154, "epoch": 298} {"train_loss": -8.34282112121582, "global_step": 50155, "epoch": 298} {"train_loss": -8.304826736450195, "global_step": 50156, "epoch": 298} {"train_loss": -8.188301086425781, "global_step": 50157, "epoch": 298} {"train_loss": -8.351079940795898, "global_step": 50158, "epoch": 298} {"train_loss": -7.971782207489014, "global_step": 50159, "epoch": 298} {"train_loss": -8.073137283325195, "global_step": 50160, "epoch": 298} {"train_loss": -8.069101333618164, "global_step": 50161, "epoch": 298} {"train_loss": -7.640217304229736, "global_step": 50162, "epoch": 298} {"train_loss": -8.108617782592773, "global_step": 50163, "epoch": 298} {"train_loss": -7.998409271240234, "global_step": 50164, "epoch": 298} {"train_loss": -8.078065872192383, "global_step": 50165, "epoch": 298} {"train_loss": -7.914237022399902, "global_step": 50166, "epoch": 298} {"train_loss": -8.005860328674316, "global_step": 50167, "epoch": 298} {"train_loss": -8.062833786010742, "global_step": 50168, "epoch": 298} {"train_loss": -8.08321762084961, "global_step": 50169, "epoch": 298} {"train_loss": -8.1871976852417, "global_step": 50170, "epoch": 298} {"train_loss": -8.181376457214355, "global_step": 50171, "epoch": 298} {"train_loss": -7.9974775314331055, "global_step": 50172, "epoch": 298} {"train_loss": -8.086627960205078, "global_step": 50173, "epoch": 298} {"train_loss": -8.095626831054688, "global_step": 50174, "epoch": 298} {"train_loss": -8.166254043579102, "global_step": 50175, "epoch": 298} {"train_loss": -8.162507057189941, "global_step": 50176, "epoch": 298} {"train_loss": -8.236202239990234, "global_step": 50177, "epoch": 298} {"train_loss": -8.194729804992676, "global_step": 50178, "epoch": 298} {"train_loss": -8.135576248168945, "global_step": 50179, "epoch": 298} {"train_loss": -8.255084991455078, "global_step": 50180, "epoch": 298} {"train_loss": -8.128291130065918, "global_step": 50181, "epoch": 298} {"train_loss": -8.345846176147461, "global_step": 50182, "epoch": 298} {"train_loss": -8.222318649291992, "global_step": 50183, "epoch": 298} {"train_loss": -8.460572242736816, "global_step": 50184, "epoch": 298} {"train_loss": -8.21004867553711, "global_step": 50185, "epoch": 298} {"train_loss": -8.080021858215332, "global_step": 50186, "epoch": 298} {"train_loss": -8.450432777404785, "global_step": 50187, "epoch": 298} {"train_loss": -8.164185523986816, "global_step": 50188, "epoch": 298} {"train_loss": -8.479015350341797, "global_step": 50189, "epoch": 298} {"train_loss": -8.494304656982422, "global_step": 50190, "epoch": 298} {"train_loss": -8.395888328552246, "global_step": 50191, "epoch": 298} {"train_loss": -8.35434627532959, "global_step": 50192, "epoch": 298} {"train_loss": -8.39425277709961, "global_step": 50193, "epoch": 298} {"train_loss": -7.988951683044434, "global_step": 50194, "epoch": 298} {"train_loss": -8.252315521240234, "global_step": 50195, "epoch": 298} {"train_loss": -8.438241004943848, "global_step": 50196, "epoch": 298} {"train_loss": -8.290895462036133, "global_step": 50197, "epoch": 298} {"train_loss": -8.158050537109375, "global_step": 50198, "epoch": 298} {"train_loss": -8.265828132629395, "global_step": 50199, "epoch": 298} {"train_loss": -8.33305549621582, "global_step": 50200, "epoch": 298} {"train_loss": -8.283132553100586, "global_step": 50201, "epoch": 298} {"train_loss": -8.10236644744873, "global_step": 50202, "epoch": 298} {"train_loss": -8.403858184814453, "global_step": 50203, "epoch": 298} {"train_loss": -8.391712188720703, "global_step": 50204, "epoch": 298} {"train_loss": -8.267011642456055, "global_step": 50205, "epoch": 298} {"train_loss": -8.202154159545898, "global_step": 50206, "epoch": 298} {"train_loss": -8.26259708404541, "global_step": 50207, "epoch": 298} {"train_loss": -8.360838890075684, "global_step": 50208, "epoch": 298} {"train_loss": -8.2572021484375, "global_step": 50209, "epoch": 298} {"train_loss": -8.089668273925781, "global_step": 50210, "epoch": 298} {"train_loss": -8.375194549560547, "global_step": 50211, "epoch": 298} {"train_loss": -8.484203338623047, "global_step": 50212, "epoch": 298} {"train_loss": -8.422719955444336, "global_step": 50213, "epoch": 298} {"train_loss": -8.507655143737793, "global_step": 50214, "epoch": 298} {"train_loss": -8.446621894836426, "global_step": 50215, "epoch": 298} {"train_loss": -8.319490432739258, "global_step": 50216, "epoch": 298} {"train_loss": -8.528681755065918, "global_step": 50217, "epoch": 298} {"train_loss": -8.213062286376953, "global_step": 50218, "epoch": 298} {"train_loss": -8.448932647705078, "global_step": 50219, "epoch": 298} {"train_loss": -8.353921890258789, "global_step": 50220, "epoch": 298} {"train_loss": -8.299261093139648, "global_step": 50221, "epoch": 298} {"train_loss": -8.271458625793457, "global_step": 50222, "epoch": 298} {"train_loss": -8.264001846313477, "global_step": 50223, "epoch": 298} {"train_loss": -8.287741661071777, "global_step": 50224, "epoch": 298} {"train_loss": -8.156314849853516, "global_step": 50225, "epoch": 298} {"train_loss": -8.612319946289062, "global_step": 50226, "epoch": 298} {"train_loss": -8.313758850097656, "global_step": 50227, "epoch": 298} {"train_loss": -8.235617637634277, "global_step": 50228, "epoch": 298} {"train_loss": -8.287294387817383, "global_step": 50229, "epoch": 298} {"train_loss": -8.14336109161377, "global_step": 50230, "epoch": 298} {"train_loss": -8.272877009142013, "global_step": 50231, "epoch": 298, "val_loss": 188117.796875} {"train_loss": -8.270133018493652, "global_step": 50232, "epoch": 299} {"train_loss": -8.1826810836792, "global_step": 50233, "epoch": 299} {"train_loss": -8.099252700805664, "global_step": 50234, "epoch": 299} {"train_loss": -8.365306854248047, "global_step": 50235, "epoch": 299} {"train_loss": -8.020764350891113, "global_step": 50236, "epoch": 299} {"train_loss": -8.348569869995117, "global_step": 50237, "epoch": 299} {"train_loss": -8.26091480255127, "global_step": 50238, "epoch": 299} {"train_loss": -8.1666841506958, "global_step": 50239, "epoch": 299} {"train_loss": -8.22085189819336, "global_step": 50240, "epoch": 299} {"train_loss": -8.295525550842285, "global_step": 50241, "epoch": 299} {"train_loss": -8.112720489501953, "global_step": 50242, "epoch": 299} {"train_loss": -8.3701810836792, "global_step": 50243, "epoch": 299} {"train_loss": -8.253860473632812, "global_step": 50244, "epoch": 299} {"train_loss": -8.106962203979492, "global_step": 50245, "epoch": 299} {"train_loss": -8.102180480957031, "global_step": 50246, "epoch": 299} {"train_loss": -8.35263729095459, "global_step": 50247, "epoch": 299} {"train_loss": -8.35457992553711, "global_step": 50248, "epoch": 299} {"train_loss": -8.607458114624023, "global_step": 50249, "epoch": 299} {"train_loss": -8.402854919433594, "global_step": 50250, "epoch": 299} {"train_loss": -8.457420349121094, "global_step": 50251, "epoch": 299} {"train_loss": -8.183353424072266, "global_step": 50252, "epoch": 299} {"train_loss": -8.490126609802246, "global_step": 50253, "epoch": 299} {"train_loss": -8.531843185424805, "global_step": 50254, "epoch": 299} {"train_loss": -8.498786926269531, "global_step": 50255, "epoch": 299} {"train_loss": -8.454811096191406, "global_step": 50256, "epoch": 299} {"train_loss": -8.501175880432129, "global_step": 50257, "epoch": 299} {"train_loss": -8.32651424407959, "global_step": 50258, "epoch": 299} {"train_loss": -8.32973861694336, "global_step": 50259, "epoch": 299} {"train_loss": -8.675163269042969, "global_step": 50260, "epoch": 299} {"train_loss": -8.441970825195312, "global_step": 50261, "epoch": 299} {"train_loss": -8.337032318115234, "global_step": 50262, "epoch": 299} {"train_loss": -8.19196891784668, "global_step": 50263, "epoch": 299} {"train_loss": -8.650973320007324, "global_step": 50264, "epoch": 299} {"train_loss": -8.30058479309082, "global_step": 50265, "epoch": 299} {"train_loss": -8.475648880004883, "global_step": 50266, "epoch": 299} {"train_loss": -8.380453109741211, "global_step": 50267, "epoch": 299} {"train_loss": -8.56614875793457, "global_step": 50268, "epoch": 299} {"train_loss": -8.172245025634766, "global_step": 50269, "epoch": 299} {"train_loss": -8.577629089355469, "global_step": 50270, "epoch": 299} {"train_loss": -8.469110488891602, "global_step": 50271, "epoch": 299} {"train_loss": -8.589704513549805, "global_step": 50272, "epoch": 299} {"train_loss": -8.154315948486328, "global_step": 50273, "epoch": 299} {"train_loss": -8.535074234008789, "global_step": 50274, "epoch": 299} {"train_loss": -8.188005447387695, "global_step": 50275, "epoch": 299} {"train_loss": -8.602057456970215, "global_step": 50276, "epoch": 299} {"train_loss": -8.179638862609863, "global_step": 50277, "epoch": 299} {"train_loss": -8.181057929992676, "global_step": 50278, "epoch": 299} {"train_loss": -8.631937026977539, "global_step": 50279, "epoch": 299} {"train_loss": -8.319034576416016, "global_step": 50280, "epoch": 299} {"train_loss": -8.467264175415039, "global_step": 50281, "epoch": 299} {"train_loss": -8.24361801147461, "global_step": 50282, "epoch": 299} {"train_loss": -8.594029426574707, "global_step": 50283, "epoch": 299} {"train_loss": -8.334238052368164, "global_step": 50284, "epoch": 299} {"train_loss": -8.414445877075195, "global_step": 50285, "epoch": 299} {"train_loss": -8.438024520874023, "global_step": 50286, "epoch": 299} {"train_loss": -8.331745147705078, "global_step": 50287, "epoch": 299} {"train_loss": -8.167363166809082, "global_step": 50288, "epoch": 299} {"train_loss": -8.137182235717773, "global_step": 50289, "epoch": 299} {"train_loss": -8.208484649658203, "global_step": 50290, "epoch": 299} {"train_loss": -8.478910446166992, "global_step": 50291, "epoch": 299} {"train_loss": -8.499282836914062, "global_step": 50292, "epoch": 299} {"train_loss": -8.359987258911133, "global_step": 50293, "epoch": 299} {"train_loss": -8.49771499633789, "global_step": 50294, "epoch": 299} {"train_loss": -8.5602445602417, "global_step": 50295, "epoch": 299} {"train_loss": -8.492839813232422, "global_step": 50296, "epoch": 299} {"train_loss": -8.44996452331543, "global_step": 50297, "epoch": 299} {"train_loss": -8.387699127197266, "global_step": 50298, "epoch": 299} {"train_loss": -8.402748107910156, "global_step": 50299, "epoch": 299} {"train_loss": -8.463178634643555, "global_step": 50300, "epoch": 299} {"train_loss": -8.351593017578125, "global_step": 50301, "epoch": 299} {"train_loss": -8.394384384155273, "global_step": 50302, "epoch": 299} {"train_loss": -8.397407531738281, "global_step": 50303, "epoch": 299} {"train_loss": -8.41044807434082, "global_step": 50304, "epoch": 299} {"train_loss": -8.414274215698242, "global_step": 50305, "epoch": 299} {"train_loss": -8.387022972106934, "global_step": 50306, "epoch": 299} {"train_loss": -8.650634765625, "global_step": 50307, "epoch": 299} {"train_loss": -8.385847091674805, "global_step": 50308, "epoch": 299} {"train_loss": -8.41244125366211, "global_step": 50309, "epoch": 299} {"train_loss": -8.153219223022461, "global_step": 50310, "epoch": 299} {"train_loss": -8.52150821685791, "global_step": 50311, "epoch": 299} {"train_loss": -8.393486022949219, "global_step": 50312, "epoch": 299} {"train_loss": -8.224206924438477, "global_step": 50313, "epoch": 299} {"train_loss": -8.378360748291016, "global_step": 50314, "epoch": 299} {"train_loss": -8.342443466186523, "global_step": 50315, "epoch": 299} {"train_loss": -8.411144256591797, "global_step": 50316, "epoch": 299} {"train_loss": -8.330143928527832, "global_step": 50317, "epoch": 299} {"train_loss": -8.118270874023438, "global_step": 50318, "epoch": 299} {"train_loss": -8.137152671813965, "global_step": 50319, "epoch": 299} {"train_loss": -8.18156623840332, "global_step": 50320, "epoch": 299} {"train_loss": -8.513652801513672, "global_step": 50321, "epoch": 299} {"train_loss": -8.320354461669922, "global_step": 50322, "epoch": 299} {"train_loss": -8.518864631652832, "global_step": 50323, "epoch": 299} {"train_loss": -8.475221633911133, "global_step": 50324, "epoch": 299} {"train_loss": -8.116634368896484, "global_step": 50325, "epoch": 299} {"train_loss": -8.355928421020508, "global_step": 50326, "epoch": 299} {"train_loss": -8.300737380981445, "global_step": 50327, "epoch": 299} {"train_loss": -8.309539794921875, "global_step": 50328, "epoch": 299} {"train_loss": -8.544658660888672, "global_step": 50329, "epoch": 299} {"train_loss": -8.408308029174805, "global_step": 50330, "epoch": 299} {"train_loss": -8.368631362915039, "global_step": 50331, "epoch": 299} {"train_loss": -8.406000137329102, "global_step": 50332, "epoch": 299} {"train_loss": -8.641244888305664, "global_step": 50333, "epoch": 299} {"train_loss": -8.306285858154297, "global_step": 50334, "epoch": 299} {"train_loss": -8.48281478881836, "global_step": 50335, "epoch": 299} {"train_loss": -8.079031944274902, "global_step": 50336, "epoch": 299} {"train_loss": -8.492555618286133, "global_step": 50337, "epoch": 299} {"train_loss": -8.209243774414062, "global_step": 50338, "epoch": 299} {"train_loss": -8.349064826965332, "global_step": 50339, "epoch": 299} {"train_loss": -8.296676635742188, "global_step": 50340, "epoch": 299} {"train_loss": -8.493706703186035, "global_step": 50341, "epoch": 299} {"train_loss": -8.144262313842773, "global_step": 50342, "epoch": 299} {"train_loss": -8.187243461608887, "global_step": 50343, "epoch": 299} {"train_loss": -8.032081604003906, "global_step": 50344, "epoch": 299} {"train_loss": -8.218399047851562, "global_step": 50345, "epoch": 299} {"train_loss": -8.157150268554688, "global_step": 50346, "epoch": 299} {"train_loss": -7.720291614532471, "global_step": 50347, "epoch": 299} {"train_loss": -8.338741302490234, "global_step": 50348, "epoch": 299} {"train_loss": -8.266067504882812, "global_step": 50349, "epoch": 299} {"train_loss": -8.319717407226562, "global_step": 50350, "epoch": 299} {"train_loss": -8.077463150024414, "global_step": 50351, "epoch": 299} {"train_loss": -8.40478515625, "global_step": 50352, "epoch": 299} {"train_loss": -8.117658615112305, "global_step": 50353, "epoch": 299} {"train_loss": -8.161172866821289, "global_step": 50354, "epoch": 299} {"train_loss": -8.29800796508789, "global_step": 50355, "epoch": 299} {"train_loss": -8.381499290466309, "global_step": 50356, "epoch": 299} {"train_loss": -8.116415023803711, "global_step": 50357, "epoch": 299} {"train_loss": -8.133722305297852, "global_step": 50358, "epoch": 299} {"train_loss": -8.1187744140625, "global_step": 50359, "epoch": 299} {"train_loss": -8.203259468078613, "global_step": 50360, "epoch": 299} {"train_loss": -8.023528099060059, "global_step": 50361, "epoch": 299} {"train_loss": -8.245532989501953, "global_step": 50362, "epoch": 299} {"train_loss": -8.343810081481934, "global_step": 50363, "epoch": 299} {"train_loss": -8.225240707397461, "global_step": 50364, "epoch": 299} {"train_loss": -8.082493782043457, "global_step": 50365, "epoch": 299} {"train_loss": -8.189717292785645, "global_step": 50366, "epoch": 299} {"train_loss": -8.227344512939453, "global_step": 50367, "epoch": 299} {"train_loss": -8.065048217773438, "global_step": 50368, "epoch": 299} {"train_loss": -8.219240188598633, "global_step": 50369, "epoch": 299} {"train_loss": -8.164196014404297, "global_step": 50370, "epoch": 299} {"train_loss": -8.19866943359375, "global_step": 50371, "epoch": 299} {"train_loss": -8.146913528442383, "global_step": 50372, "epoch": 299} {"train_loss": -8.368989944458008, "global_step": 50373, "epoch": 299} {"train_loss": -7.985081195831299, "global_step": 50374, "epoch": 299} {"train_loss": -8.340448379516602, "global_step": 50375, "epoch": 299} {"train_loss": -8.372936248779297, "global_step": 50376, "epoch": 299} {"train_loss": -8.234952926635742, "global_step": 50377, "epoch": 299} {"train_loss": -8.179925918579102, "global_step": 50378, "epoch": 299} {"train_loss": -8.504650115966797, "global_step": 50379, "epoch": 299} {"train_loss": -8.288690567016602, "global_step": 50380, "epoch": 299} {"train_loss": -8.140668869018555, "global_step": 50381, "epoch": 299} {"train_loss": -8.286771774291992, "global_step": 50382, "epoch": 299} {"train_loss": -8.066174507141113, "global_step": 50383, "epoch": 299} {"train_loss": -8.365915298461914, "global_step": 50384, "epoch": 299} {"train_loss": -8.109121322631836, "global_step": 50385, "epoch": 299} {"train_loss": -8.379902839660645, "global_step": 50386, "epoch": 299} {"train_loss": -8.168907165527344, "global_step": 50387, "epoch": 299} {"train_loss": -8.335870742797852, "global_step": 50388, "epoch": 299} {"train_loss": -8.410768508911133, "global_step": 50389, "epoch": 299} {"train_loss": -8.252424240112305, "global_step": 50390, "epoch": 299} {"train_loss": -8.27222728729248, "global_step": 50391, "epoch": 299} {"train_loss": -8.059429168701172, "global_step": 50392, "epoch": 299} {"train_loss": -7.97659969329834, "global_step": 50393, "epoch": 299} {"train_loss": -8.24222183227539, "global_step": 50394, "epoch": 299} {"train_loss": -8.187578201293945, "global_step": 50395, "epoch": 299} {"train_loss": -8.256563186645508, "global_step": 50396, "epoch": 299} {"train_loss": -8.065863609313965, "global_step": 50397, "epoch": 299} {"train_loss": -7.907811641693115, "global_step": 50398, "epoch": 299} {"train_loss": -8.30657061224892, "global_step": 50399, "epoch": 299, "val_loss": 188864.890625} {"train_loss": -7.919926166534424, "global_step": 50400, "epoch": 300} {"train_loss": -8.221475601196289, "global_step": 50401, "epoch": 300} {"train_loss": -8.05849838256836, "global_step": 50402, "epoch": 300} {"train_loss": -8.092731475830078, "global_step": 50403, "epoch": 300} {"train_loss": -8.3262939453125, "global_step": 50404, "epoch": 300} {"train_loss": -8.14706802368164, "global_step": 50405, "epoch": 300} {"train_loss": -8.307903289794922, "global_step": 50406, "epoch": 300} {"train_loss": -8.341426849365234, "global_step": 50407, "epoch": 300} {"train_loss": -8.183028221130371, "global_step": 50408, "epoch": 300} {"train_loss": -8.482136726379395, "global_step": 50409, "epoch": 300} {"train_loss": -8.353862762451172, "global_step": 50410, "epoch": 300} {"train_loss": -8.356645584106445, "global_step": 50411, "epoch": 300} {"train_loss": -8.195748329162598, "global_step": 50412, "epoch": 300} {"train_loss": -8.423826217651367, "global_step": 50413, "epoch": 300} {"train_loss": -8.324188232421875, "global_step": 50414, "epoch": 300} {"train_loss": -8.282124519348145, "global_step": 50415, "epoch": 300} {"train_loss": -8.390242576599121, "global_step": 50416, "epoch": 300} {"train_loss": -8.579261779785156, "global_step": 50417, "epoch": 300} {"train_loss": -8.24435043334961, "global_step": 50418, "epoch": 300} {"train_loss": -8.505704879760742, "global_step": 50419, "epoch": 300} {"train_loss": -8.338061332702637, "global_step": 50420, "epoch": 300} {"train_loss": -8.475215911865234, "global_step": 50421, "epoch": 300} {"train_loss": -8.388607025146484, "global_step": 50422, "epoch": 300} {"train_loss": -8.495315551757812, "global_step": 50423, "epoch": 300} {"train_loss": -8.41992473602295, "global_step": 50424, "epoch": 300} {"train_loss": -8.471076965332031, "global_step": 50425, "epoch": 300} {"train_loss": -8.538093566894531, "global_step": 50426, "epoch": 300} {"train_loss": -8.329809188842773, "global_step": 50427, "epoch": 300} {"train_loss": -8.349370956420898, "global_step": 50428, "epoch": 300} {"train_loss": -8.255013465881348, "global_step": 50429, "epoch": 300} {"train_loss": -8.598116874694824, "global_step": 50430, "epoch": 300} {"train_loss": -8.286186218261719, "global_step": 50431, "epoch": 300} {"train_loss": -8.526020050048828, "global_step": 50432, "epoch": 300} {"train_loss": -8.431385040283203, "global_step": 50433, "epoch": 300} {"train_loss": -8.161972045898438, "global_step": 50434, "epoch": 300} {"train_loss": -8.448444366455078, "global_step": 50435, "epoch": 300} {"train_loss": -7.929699897766113, "global_step": 50436, "epoch": 300} {"train_loss": -8.55793571472168, "global_step": 50437, "epoch": 300} {"train_loss": -8.209218978881836, "global_step": 50438, "epoch": 300} {"train_loss": -8.35352897644043, "global_step": 50439, "epoch": 300} {"train_loss": -8.220197677612305, "global_step": 50440, "epoch": 300} {"train_loss": -8.244745254516602, "global_step": 50441, "epoch": 300} {"train_loss": -8.176578521728516, "global_step": 50442, "epoch": 300} {"train_loss": -8.404886245727539, "global_step": 50443, "epoch": 300} {"train_loss": -8.42437744140625, "global_step": 50444, "epoch": 300} {"train_loss": -8.286179542541504, "global_step": 50445, "epoch": 300} {"train_loss": -8.207717895507812, "global_step": 50446, "epoch": 300} {"train_loss": -8.526592254638672, "global_step": 50447, "epoch": 300} {"train_loss": -8.448358535766602, "global_step": 50448, "epoch": 300} {"train_loss": -8.24756145477295, "global_step": 50449, "epoch": 300} {"train_loss": -8.483818054199219, "global_step": 50450, "epoch": 300} {"train_loss": -8.484567642211914, "global_step": 50451, "epoch": 300} {"train_loss": -8.378671646118164, "global_step": 50452, "epoch": 300} {"train_loss": -8.253616333007812, "global_step": 50453, "epoch": 300} {"train_loss": -8.213061332702637, "global_step": 50454, "epoch": 300} {"train_loss": -8.346336364746094, "global_step": 50455, "epoch": 300} {"train_loss": -8.400650978088379, "global_step": 50456, "epoch": 300} {"train_loss": -8.339702606201172, "global_step": 50457, "epoch": 300} {"train_loss": -8.53855037689209, "global_step": 50458, "epoch": 300} {"train_loss": -8.340469360351562, "global_step": 50459, "epoch": 300} {"train_loss": -8.406488418579102, "global_step": 50460, "epoch": 300} {"train_loss": -8.363492965698242, "global_step": 50461, "epoch": 300} {"train_loss": -8.214713096618652, "global_step": 50462, "epoch": 300} {"train_loss": -8.225513458251953, "global_step": 50463, "epoch": 300} {"train_loss": -7.956510066986084, "global_step": 50464, "epoch": 300} {"train_loss": -8.26081657409668, "global_step": 50465, "epoch": 300} {"train_loss": -8.249284744262695, "global_step": 50466, "epoch": 300} {"train_loss": -8.326594352722168, "global_step": 50467, "epoch": 300} {"train_loss": -8.174663543701172, "global_step": 50468, "epoch": 300} {"train_loss": -8.278667449951172, "global_step": 50469, "epoch": 300} {"train_loss": -8.294904708862305, "global_step": 50470, "epoch": 300} {"train_loss": -8.118719100952148, "global_step": 50471, "epoch": 300} {"train_loss": -8.258509635925293, "global_step": 50472, "epoch": 300} {"train_loss": -8.31727409362793, "global_step": 50473, "epoch": 300} {"train_loss": -8.331321716308594, "global_step": 50474, "epoch": 300} {"train_loss": -8.381661415100098, "global_step": 50475, "epoch": 300} {"train_loss": -8.383047103881836, "global_step": 50476, "epoch": 300} {"train_loss": -8.248499870300293, "global_step": 50477, "epoch": 300} {"train_loss": -8.367268562316895, "global_step": 50478, "epoch": 300} {"train_loss": -8.542702674865723, "global_step": 50479, "epoch": 300} {"train_loss": -8.308295249938965, "global_step": 50480, "epoch": 300} {"train_loss": -8.299732208251953, "global_step": 50481, "epoch": 300} {"train_loss": -8.403480529785156, "global_step": 50482, "epoch": 300} {"train_loss": -8.280502319335938, "global_step": 50483, "epoch": 300} {"train_loss": -8.42762279510498, "global_step": 50484, "epoch": 300} {"train_loss": -8.476129531860352, "global_step": 50485, "epoch": 300} {"train_loss": -8.200542449951172, "global_step": 50486, "epoch": 300} {"train_loss": -8.652078628540039, "global_step": 50487, "epoch": 300} {"train_loss": -8.399351119995117, "global_step": 50488, "epoch": 300} {"train_loss": -8.224777221679688, "global_step": 50489, "epoch": 300} {"train_loss": -8.209943771362305, "global_step": 50490, "epoch": 300} {"train_loss": -8.37636947631836, "global_step": 50491, "epoch": 300} {"train_loss": -8.252431869506836, "global_step": 50492, "epoch": 300} {"train_loss": -8.133834838867188, "global_step": 50493, "epoch": 300} {"train_loss": -8.514408111572266, "global_step": 50494, "epoch": 300} {"train_loss": -8.45571231842041, "global_step": 50495, "epoch": 300} {"train_loss": -8.106998443603516, "global_step": 50496, "epoch": 300} {"train_loss": -8.443634033203125, "global_step": 50497, "epoch": 300} {"train_loss": -7.970695495605469, "global_step": 50498, "epoch": 300} {"train_loss": -8.241230010986328, "global_step": 50499, "epoch": 300} {"train_loss": -8.419835090637207, "global_step": 50500, "epoch": 300} {"train_loss": -8.433479309082031, "global_step": 50501, "epoch": 300} {"train_loss": -8.190035820007324, "global_step": 50502, "epoch": 300} {"train_loss": -8.412532806396484, "global_step": 50503, "epoch": 300} {"train_loss": -8.399150848388672, "global_step": 50504, "epoch": 300} {"train_loss": -8.304555892944336, "global_step": 50505, "epoch": 300} {"train_loss": -8.226275444030762, "global_step": 50506, "epoch": 300} {"train_loss": -8.309292793273926, "global_step": 50507, "epoch": 300} {"train_loss": -8.164986610412598, "global_step": 50508, "epoch": 300} {"train_loss": -8.382570266723633, "global_step": 50509, "epoch": 300} {"train_loss": -8.476160049438477, "global_step": 50510, "epoch": 300} {"train_loss": -8.222290992736816, "global_step": 50511, "epoch": 300} {"train_loss": -8.573492050170898, "global_step": 50512, "epoch": 300} {"train_loss": -8.203178405761719, "global_step": 50513, "epoch": 300} {"train_loss": -8.455341339111328, "global_step": 50514, "epoch": 300} {"train_loss": -8.40504264831543, "global_step": 50515, "epoch": 300} {"train_loss": -8.35373592376709, "global_step": 50516, "epoch": 300} {"train_loss": -8.37353515625, "global_step": 50517, "epoch": 300} {"train_loss": -8.237441062927246, "global_step": 50518, "epoch": 300} {"train_loss": -8.296151161193848, "global_step": 50519, "epoch": 300} {"train_loss": -8.352849960327148, "global_step": 50520, "epoch": 300} {"train_loss": -8.325169563293457, "global_step": 50521, "epoch": 300} {"train_loss": -8.327736854553223, "global_step": 50522, "epoch": 300} {"train_loss": -8.198711395263672, "global_step": 50523, "epoch": 300} {"train_loss": -8.379382133483887, "global_step": 50524, "epoch": 300} {"train_loss": -8.3721284866333, "global_step": 50525, "epoch": 300} {"train_loss": -8.48417854309082, "global_step": 50526, "epoch": 300} {"train_loss": -8.350286483764648, "global_step": 50527, "epoch": 300} {"train_loss": -8.39571762084961, "global_step": 50528, "epoch": 300} {"train_loss": -8.147293090820312, "global_step": 50529, "epoch": 300} {"train_loss": -8.446979522705078, "global_step": 50530, "epoch": 300} {"train_loss": -8.543427467346191, "global_step": 50531, "epoch": 300} {"train_loss": -8.589130401611328, "global_step": 50532, "epoch": 300} {"train_loss": -8.370061874389648, "global_step": 50533, "epoch": 300} {"train_loss": -8.394003868103027, "global_step": 50534, "epoch": 300} {"train_loss": -8.309955596923828, "global_step": 50535, "epoch": 300} {"train_loss": -8.470650672912598, "global_step": 50536, "epoch": 300} {"train_loss": -8.43792724609375, "global_step": 50537, "epoch": 300} {"train_loss": -8.102941513061523, "global_step": 50538, "epoch": 300} {"train_loss": -8.284844398498535, "global_step": 50539, "epoch": 300} {"train_loss": -8.26432991027832, "global_step": 50540, "epoch": 300} {"train_loss": -8.373311996459961, "global_step": 50541, "epoch": 300} {"train_loss": -8.283924102783203, "global_step": 50542, "epoch": 300} {"train_loss": -8.125532150268555, "global_step": 50543, "epoch": 300} {"train_loss": -8.261222839355469, "global_step": 50544, "epoch": 300} {"train_loss": -8.322185516357422, "global_step": 50545, "epoch": 300} {"train_loss": -8.332035064697266, "global_step": 50546, "epoch": 300} {"train_loss": -8.33669662475586, "global_step": 50547, "epoch": 300} {"train_loss": -8.154537200927734, "global_step": 50548, "epoch": 300} {"train_loss": -8.294463157653809, "global_step": 50549, "epoch": 300} {"train_loss": -8.203777313232422, "global_step": 50550, "epoch": 300} {"train_loss": -8.404112815856934, "global_step": 50551, "epoch": 300} {"train_loss": -8.26069450378418, "global_step": 50552, "epoch": 300} {"train_loss": -8.176807403564453, "global_step": 50553, "epoch": 300} {"train_loss": -8.393096923828125, "global_step": 50554, "epoch": 300} {"train_loss": -8.409065246582031, "global_step": 50555, "epoch": 300} {"train_loss": -8.280742645263672, "global_step": 50556, "epoch": 300} {"train_loss": -8.387884140014648, "global_step": 50557, "epoch": 300} {"train_loss": -8.335953712463379, "global_step": 50558, "epoch": 300} {"train_loss": -8.14062213897705, "global_step": 50559, "epoch": 300} {"train_loss": -8.647933959960938, "global_step": 50560, "epoch": 300} {"train_loss": -8.326409339904785, "global_step": 50561, "epoch": 300} {"train_loss": -8.32168197631836, "global_step": 50562, "epoch": 300} {"train_loss": -8.490742683410645, "global_step": 50563, "epoch": 300} {"train_loss": -8.429723739624023, "global_step": 50564, "epoch": 300} {"train_loss": -8.485784530639648, "global_step": 50565, "epoch": 300} {"train_loss": -8.501607894897461, "global_step": 50566, "epoch": 300} {"train_loss": -8.332184303374518, "global_step": 50567, "epoch": 300, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 0.9083381953404996, "train/sim_max_reward_2": 0.5030998453448113, "train/sim_max_reward_3": 0.6926404736906054, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.6622188974307697, "test/sim_max_reward_4400000": 0.9191227726868919, "test/sim_max_reward_4400001": 0.3584578422947146, "test/sim_max_reward_4400002": 0.07720407950735143, "test/sim_max_reward_4400003": 0.7220868425759306, "test/sim_max_reward_4400004": 0.40777496591432905, "test/sim_max_reward_4400005": 0.5489361748607887, "test/sim_max_reward_4400006": 0.9955043660303527, "test/sim_max_reward_4400007": 0.5059677732872351, "test/sim_max_reward_4400008": 0.7057774001271211, "test/sim_max_reward_4400009": 0.35316338767459515, "test/sim_max_reward_4400010": 0.9625796194744214, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 0.9916449275442181, "test/sim_max_reward_4400013": 0.9944696369800489, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 0.9902007582452375, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.963964452304762, "test/sim_max_reward_4400018": 0.9938910823824467, "test/sim_max_reward_4400019": 0.15695762730181234, "test/sim_max_reward_4400020": 0.0013588921609646758, "test/sim_max_reward_4400021": 0.6605321223255287, "test/sim_max_reward_4400022": 0.9986036810445782, "test/sim_max_reward_4400023": 0.1090614935255342, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.590920462211606, "test/sim_max_reward_4400026": 0.05256966205939263, "test/sim_max_reward_4400027": 0.9346666949310938, "test/sim_max_reward_4400028": 0.711412165791864, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.99671657353263, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.10893894438221152, "test/sim_max_reward_4400033": 0.399167346148518, "test/sim_max_reward_4400034": 0.685678374566143, "test/sim_max_reward_4400035": 0.9980323290019607, "test/sim_max_reward_4400036": 0.365043557182004, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.371974874707531, "test/sim_max_reward_4400039": 0.4117831704153246, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.40657939582060354, "test/sim_max_reward_4400042": 0.9419665258251237, "test/sim_max_reward_4400043": 0.9798383381560455, "test/sim_max_reward_4400044": 0.974326551521629, "test/sim_max_reward_4400045": 0.7170164021511526, "test/sim_max_reward_4400046": 0.9964326489361253, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.794382901967781, "test/mean_score": 0.6212064783117964, "val_loss": 188041.15625, "train_action_mse_error": 6.412772178649902} {"train_loss": -8.174304962158203, "global_step": 50568, "epoch": 301} {"train_loss": -8.01317024230957, "global_step": 50569, "epoch": 301} {"train_loss": -8.311278343200684, "global_step": 50570, "epoch": 301} {"train_loss": -8.229206085205078, "global_step": 50571, "epoch": 301} {"train_loss": -8.488887786865234, "global_step": 50572, "epoch": 301} {"train_loss": -8.09958267211914, "global_step": 50573, "epoch": 301} {"train_loss": -8.19589614868164, "global_step": 50574, "epoch": 301} {"train_loss": -8.351162910461426, "global_step": 50575, "epoch": 301} {"train_loss": -8.290528297424316, "global_step": 50576, "epoch": 301} {"train_loss": -8.274364471435547, "global_step": 50577, "epoch": 301} {"train_loss": -8.158333778381348, "global_step": 50578, "epoch": 301} {"train_loss": -8.164426803588867, "global_step": 50579, "epoch": 301} {"train_loss": -8.267452239990234, "global_step": 50580, "epoch": 301} {"train_loss": -7.978338241577148, "global_step": 50581, "epoch": 301} {"train_loss": -8.117616653442383, "global_step": 50582, "epoch": 301} {"train_loss": -8.338994979858398, "global_step": 50583, "epoch": 301} {"train_loss": -8.485662460327148, "global_step": 50584, "epoch": 301} {"train_loss": -7.9829816818237305, "global_step": 50585, "epoch": 301} {"train_loss": -8.228177070617676, "global_step": 50586, "epoch": 301} {"train_loss": -8.068424224853516, "global_step": 50587, "epoch": 301} {"train_loss": -8.198053359985352, "global_step": 50588, "epoch": 301} {"train_loss": -7.987076282501221, "global_step": 50589, "epoch": 301} {"train_loss": -8.196857452392578, "global_step": 50590, "epoch": 301} {"train_loss": -8.326980590820312, "global_step": 50591, "epoch": 301} {"train_loss": -8.383682250976562, "global_step": 50592, "epoch": 301} {"train_loss": -8.405734062194824, "global_step": 50593, "epoch": 301} {"train_loss": -8.424769401550293, "global_step": 50594, "epoch": 301} {"train_loss": -8.449684143066406, "global_step": 50595, "epoch": 301} {"train_loss": -8.059072494506836, "global_step": 50596, "epoch": 301} {"train_loss": -8.361096382141113, "global_step": 50597, "epoch": 301} {"train_loss": -8.226871490478516, "global_step": 50598, "epoch": 301} {"train_loss": -8.355968475341797, "global_step": 50599, "epoch": 301} {"train_loss": -8.412981986999512, "global_step": 50600, "epoch": 301} {"train_loss": -8.042201042175293, "global_step": 50601, "epoch": 301} {"train_loss": -8.128480911254883, "global_step": 50602, "epoch": 301} {"train_loss": -8.585006713867188, "global_step": 50603, "epoch": 301} {"train_loss": -8.11622142791748, "global_step": 50604, "epoch": 301} {"train_loss": -8.572235107421875, "global_step": 50605, "epoch": 301} {"train_loss": -8.219918251037598, "global_step": 50606, "epoch": 301} {"train_loss": -8.223296165466309, "global_step": 50607, "epoch": 301} {"train_loss": -8.359710693359375, "global_step": 50608, "epoch": 301} {"train_loss": -8.122380256652832, "global_step": 50609, "epoch": 301} {"train_loss": -8.060894012451172, "global_step": 50610, "epoch": 301} {"train_loss": -8.073324203491211, "global_step": 50611, "epoch": 301} {"train_loss": -8.194880485534668, "global_step": 50612, "epoch": 301} {"train_loss": -8.046088218688965, "global_step": 50613, "epoch": 301} {"train_loss": -8.368898391723633, "global_step": 50614, "epoch": 301} {"train_loss": -8.07423210144043, "global_step": 50615, "epoch": 301} {"train_loss": -8.096379280090332, "global_step": 50616, "epoch": 301} {"train_loss": -8.216636657714844, "global_step": 50617, "epoch": 301} {"train_loss": -8.311197280883789, "global_step": 50618, "epoch": 301} {"train_loss": -8.310481071472168, "global_step": 50619, "epoch": 301} {"train_loss": -8.377281188964844, "global_step": 50620, "epoch": 301} {"train_loss": -8.214365005493164, "global_step": 50621, "epoch": 301} {"train_loss": -8.389657974243164, "global_step": 50622, "epoch": 301} {"train_loss": -8.354540824890137, "global_step": 50623, "epoch": 301} {"train_loss": -8.31712818145752, "global_step": 50624, "epoch": 301} {"train_loss": -8.262528419494629, "global_step": 50625, "epoch": 301} {"train_loss": -8.298849105834961, "global_step": 50626, "epoch": 301} {"train_loss": -8.486970901489258, "global_step": 50627, "epoch": 301} {"train_loss": -8.365646362304688, "global_step": 50628, "epoch": 301} {"train_loss": -8.441208839416504, "global_step": 50629, "epoch": 301} {"train_loss": -8.312305450439453, "global_step": 50630, "epoch": 301} {"train_loss": -8.441232681274414, "global_step": 50631, "epoch": 301} {"train_loss": -8.16628646850586, "global_step": 50632, "epoch": 301} {"train_loss": -8.589197158813477, "global_step": 50633, "epoch": 301} {"train_loss": -8.182948112487793, "global_step": 50634, "epoch": 301} {"train_loss": -8.152036666870117, "global_step": 50635, "epoch": 301} {"train_loss": -8.40175724029541, "global_step": 50636, "epoch": 301} {"train_loss": -8.39277458190918, "global_step": 50637, "epoch": 301} {"train_loss": -8.241010665893555, "global_step": 50638, "epoch": 301} {"train_loss": -8.638240814208984, "global_step": 50639, "epoch": 301} {"train_loss": -8.530784606933594, "global_step": 50640, "epoch": 301} {"train_loss": -8.524436950683594, "global_step": 50641, "epoch": 301} {"train_loss": -8.299389839172363, "global_step": 50642, "epoch": 301} {"train_loss": -8.781110763549805, "global_step": 50643, "epoch": 301} {"train_loss": -8.286222457885742, "global_step": 50644, "epoch": 301} {"train_loss": -8.504838943481445, "global_step": 50645, "epoch": 301} {"train_loss": -8.299723625183105, "global_step": 50646, "epoch": 301} {"train_loss": -8.52536392211914, "global_step": 50647, "epoch": 301} {"train_loss": -8.470548629760742, "global_step": 50648, "epoch": 301} {"train_loss": -8.267627716064453, "global_step": 50649, "epoch": 301} {"train_loss": -8.566595077514648, "global_step": 50650, "epoch": 301} {"train_loss": -8.304101943969727, "global_step": 50651, "epoch": 301} {"train_loss": -8.537328720092773, "global_step": 50652, "epoch": 301} {"train_loss": -8.453573226928711, "global_step": 50653, "epoch": 301} {"train_loss": -8.371091842651367, "global_step": 50654, "epoch": 301} {"train_loss": -8.409151077270508, "global_step": 50655, "epoch": 301} {"train_loss": -8.658855438232422, "global_step": 50656, "epoch": 301} {"train_loss": -8.423759460449219, "global_step": 50657, "epoch": 301} {"train_loss": -8.049368858337402, "global_step": 50658, "epoch": 301} {"train_loss": -8.500633239746094, "global_step": 50659, "epoch": 301} {"train_loss": -7.996983528137207, "global_step": 50660, "epoch": 301} {"train_loss": -8.24958324432373, "global_step": 50661, "epoch": 301} {"train_loss": -8.143598556518555, "global_step": 50662, "epoch": 301} {"train_loss": -8.153922080993652, "global_step": 50663, "epoch": 301} {"train_loss": -8.272789001464844, "global_step": 50664, "epoch": 301} {"train_loss": -8.290904998779297, "global_step": 50665, "epoch": 301} {"train_loss": -8.208600997924805, "global_step": 50666, "epoch": 301} {"train_loss": -8.421687126159668, "global_step": 50667, "epoch": 301} {"train_loss": -8.501190185546875, "global_step": 50668, "epoch": 301} {"train_loss": -8.504955291748047, "global_step": 50669, "epoch": 301} {"train_loss": -8.285484313964844, "global_step": 50670, "epoch": 301} {"train_loss": -8.40617561340332, "global_step": 50671, "epoch": 301} {"train_loss": -8.470427513122559, "global_step": 50672, "epoch": 301} {"train_loss": -8.493026733398438, "global_step": 50673, "epoch": 301} {"train_loss": -8.249245643615723, "global_step": 50674, "epoch": 301} {"train_loss": -8.370415687561035, "global_step": 50675, "epoch": 301} {"train_loss": -8.424141883850098, "global_step": 50676, "epoch": 301} {"train_loss": -8.390287399291992, "global_step": 50677, "epoch": 301} {"train_loss": -8.428962707519531, "global_step": 50678, "epoch": 301} {"train_loss": -7.970299243927002, "global_step": 50679, "epoch": 301} {"train_loss": -8.10694694519043, "global_step": 50680, "epoch": 301} {"train_loss": -8.26257610321045, "global_step": 50681, "epoch": 301} {"train_loss": -8.302562713623047, "global_step": 50682, "epoch": 301} {"train_loss": -8.380170822143555, "global_step": 50683, "epoch": 301} {"train_loss": -8.1262788772583, "global_step": 50684, "epoch": 301} {"train_loss": -8.394430160522461, "global_step": 50685, "epoch": 301} {"train_loss": -8.306264877319336, "global_step": 50686, "epoch": 301} {"train_loss": -8.170723915100098, "global_step": 50687, "epoch": 301} {"train_loss": -8.376252174377441, "global_step": 50688, "epoch": 301} {"train_loss": -8.389004707336426, "global_step": 50689, "epoch": 301} {"train_loss": -8.30385684967041, "global_step": 50690, "epoch": 301} {"train_loss": -8.204080581665039, "global_step": 50691, "epoch": 301} {"train_loss": -8.386747360229492, "global_step": 50692, "epoch": 301} {"train_loss": -8.339839935302734, "global_step": 50693, "epoch": 301} {"train_loss": -7.936812877655029, "global_step": 50694, "epoch": 301} {"train_loss": -8.262764930725098, "global_step": 50695, "epoch": 301} {"train_loss": -7.98543119430542, "global_step": 50696, "epoch": 301} {"train_loss": -8.214469909667969, "global_step": 50697, "epoch": 301} {"train_loss": -8.038567543029785, "global_step": 50698, "epoch": 301} {"train_loss": -8.26435661315918, "global_step": 50699, "epoch": 301} {"train_loss": -8.066603660583496, "global_step": 50700, "epoch": 301} {"train_loss": -8.169837951660156, "global_step": 50701, "epoch": 301} {"train_loss": -8.280385971069336, "global_step": 50702, "epoch": 301} {"train_loss": -8.325187683105469, "global_step": 50703, "epoch": 301} {"train_loss": -8.197626113891602, "global_step": 50704, "epoch": 301} {"train_loss": -8.229384422302246, "global_step": 50705, "epoch": 301} {"train_loss": -8.147993087768555, "global_step": 50706, "epoch": 301} {"train_loss": -8.387529373168945, "global_step": 50707, "epoch": 301} {"train_loss": -8.402351379394531, "global_step": 50708, "epoch": 301} {"train_loss": -8.215675354003906, "global_step": 50709, "epoch": 301} {"train_loss": -8.270502090454102, "global_step": 50710, "epoch": 301} {"train_loss": -8.413543701171875, "global_step": 50711, "epoch": 301} {"train_loss": -8.31429386138916, "global_step": 50712, "epoch": 301} {"train_loss": -8.334718704223633, "global_step": 50713, "epoch": 301} {"train_loss": -8.177167892456055, "global_step": 50714, "epoch": 301} {"train_loss": -8.263679504394531, "global_step": 50715, "epoch": 301} {"train_loss": -8.106623649597168, "global_step": 50716, "epoch": 301} {"train_loss": -8.379388809204102, "global_step": 50717, "epoch": 301} {"train_loss": -8.287952423095703, "global_step": 50718, "epoch": 301} {"train_loss": -8.625768661499023, "global_step": 50719, "epoch": 301} {"train_loss": -8.326863288879395, "global_step": 50720, "epoch": 301} {"train_loss": -8.586189270019531, "global_step": 50721, "epoch": 301} {"train_loss": -8.608924865722656, "global_step": 50722, "epoch": 301} {"train_loss": -8.46786880493164, "global_step": 50723, "epoch": 301} {"train_loss": -8.542228698730469, "global_step": 50724, "epoch": 301} {"train_loss": -8.163808822631836, "global_step": 50725, "epoch": 301} {"train_loss": -8.430185317993164, "global_step": 50726, "epoch": 301} {"train_loss": -8.437028884887695, "global_step": 50727, "epoch": 301} {"train_loss": -8.610970497131348, "global_step": 50728, "epoch": 301} {"train_loss": -8.460664749145508, "global_step": 50729, "epoch": 301} {"train_loss": -8.525201797485352, "global_step": 50730, "epoch": 301} {"train_loss": -8.340829849243164, "global_step": 50731, "epoch": 301} {"train_loss": -8.470574378967285, "global_step": 50732, "epoch": 301} {"train_loss": -8.23286247253418, "global_step": 50733, "epoch": 301} {"train_loss": -8.571059226989746, "global_step": 50734, "epoch": 301} {"train_loss": -8.308007399241129, "global_step": 50735, "epoch": 301, "val_loss": 188704.0625} {"train_loss": -8.369522094726562, "global_step": 50736, "epoch": 302} {"train_loss": -8.641912460327148, "global_step": 50737, "epoch": 302} {"train_loss": -8.180914878845215, "global_step": 50738, "epoch": 302} {"train_loss": -8.272071838378906, "global_step": 50739, "epoch": 302} {"train_loss": -8.306341171264648, "global_step": 50740, "epoch": 302} {"train_loss": -8.155882835388184, "global_step": 50741, "epoch": 302} {"train_loss": -8.422724723815918, "global_step": 50742, "epoch": 302} {"train_loss": -8.153083801269531, "global_step": 50743, "epoch": 302} {"train_loss": -8.384438514709473, "global_step": 50744, "epoch": 302} {"train_loss": -8.400696754455566, "global_step": 50745, "epoch": 302} {"train_loss": -8.101998329162598, "global_step": 50746, "epoch": 302} {"train_loss": -8.295251846313477, "global_step": 50747, "epoch": 302} {"train_loss": -8.318866729736328, "global_step": 50748, "epoch": 302} {"train_loss": -8.475461959838867, "global_step": 50749, "epoch": 302} {"train_loss": -8.276846885681152, "global_step": 50750, "epoch": 302} {"train_loss": -8.443918228149414, "global_step": 50751, "epoch": 302} {"train_loss": -8.290874481201172, "global_step": 50752, "epoch": 302} {"train_loss": -8.351937294006348, "global_step": 50753, "epoch": 302} {"train_loss": -8.245233535766602, "global_step": 50754, "epoch": 302} {"train_loss": -8.386225700378418, "global_step": 50755, "epoch": 302} {"train_loss": -8.253862380981445, "global_step": 50756, "epoch": 302} {"train_loss": -8.275463104248047, "global_step": 50757, "epoch": 302} {"train_loss": -8.182632446289062, "global_step": 50758, "epoch": 302} {"train_loss": -8.173537254333496, "global_step": 50759, "epoch": 302} {"train_loss": -8.249191284179688, "global_step": 50760, "epoch": 302} {"train_loss": -8.468374252319336, "global_step": 50761, "epoch": 302} {"train_loss": -8.2503023147583, "global_step": 50762, "epoch": 302} {"train_loss": -8.171019554138184, "global_step": 50763, "epoch": 302} {"train_loss": -8.202709197998047, "global_step": 50764, "epoch": 302} {"train_loss": -8.49941635131836, "global_step": 50765, "epoch": 302} {"train_loss": -8.285987854003906, "global_step": 50766, "epoch": 302} {"train_loss": -7.9324188232421875, "global_step": 50767, "epoch": 302} {"train_loss": -8.236098289489746, "global_step": 50768, "epoch": 302} {"train_loss": -8.271371841430664, "global_step": 50769, "epoch": 302} {"train_loss": -8.083660125732422, "global_step": 50770, "epoch": 302} {"train_loss": -8.464629173278809, "global_step": 50771, "epoch": 302} {"train_loss": -8.555807113647461, "global_step": 50772, "epoch": 302} {"train_loss": -8.41180419921875, "global_step": 50773, "epoch": 302} {"train_loss": -8.26085090637207, "global_step": 50774, "epoch": 302} {"train_loss": -8.419900894165039, "global_step": 50775, "epoch": 302} {"train_loss": -8.35494613647461, "global_step": 50776, "epoch": 302} {"train_loss": -8.479296684265137, "global_step": 50777, "epoch": 302} {"train_loss": -8.512980461120605, "global_step": 50778, "epoch": 302} {"train_loss": -8.410340309143066, "global_step": 50779, "epoch": 302} {"train_loss": -8.419496536254883, "global_step": 50780, "epoch": 302} {"train_loss": -8.412202835083008, "global_step": 50781, "epoch": 302} {"train_loss": -8.582155227661133, "global_step": 50782, "epoch": 302} {"train_loss": -8.670639991760254, "global_step": 50783, "epoch": 302} {"train_loss": -8.285704612731934, "global_step": 50784, "epoch": 302} {"train_loss": -8.537721633911133, "global_step": 50785, "epoch": 302} {"train_loss": -8.35486125946045, "global_step": 50786, "epoch": 302} {"train_loss": -8.358999252319336, "global_step": 50787, "epoch": 302} {"train_loss": -8.569189071655273, "global_step": 50788, "epoch": 302} {"train_loss": -8.215887069702148, "global_step": 50789, "epoch": 302} {"train_loss": -8.026684761047363, "global_step": 50790, "epoch": 302} {"train_loss": -8.45920467376709, "global_step": 50791, "epoch": 302} {"train_loss": -8.196039199829102, "global_step": 50792, "epoch": 302} {"train_loss": -8.2791748046875, "global_step": 50793, "epoch": 302} {"train_loss": -8.467494010925293, "global_step": 50794, "epoch": 302} {"train_loss": -8.096461296081543, "global_step": 50795, "epoch": 302} {"train_loss": -8.044273376464844, "global_step": 50796, "epoch": 302} {"train_loss": -8.201865196228027, "global_step": 50797, "epoch": 302} {"train_loss": -8.49618911743164, "global_step": 50798, "epoch": 302} {"train_loss": -8.230901718139648, "global_step": 50799, "epoch": 302} {"train_loss": -8.369544982910156, "global_step": 50800, "epoch": 302} {"train_loss": -8.340462684631348, "global_step": 50801, "epoch": 302} {"train_loss": -8.262419700622559, "global_step": 50802, "epoch": 302} {"train_loss": -8.217638969421387, "global_step": 50803, "epoch": 302} {"train_loss": -8.229853630065918, "global_step": 50804, "epoch": 302} {"train_loss": -8.328102111816406, "global_step": 50805, "epoch": 302} {"train_loss": -8.521818161010742, "global_step": 50806, "epoch": 302} {"train_loss": -8.361446380615234, "global_step": 50807, "epoch": 302} {"train_loss": -8.428449630737305, "global_step": 50808, "epoch": 302} {"train_loss": -8.135091781616211, "global_step": 50809, "epoch": 302} {"train_loss": -8.467708587646484, "global_step": 50810, "epoch": 302} {"train_loss": -8.227228164672852, "global_step": 50811, "epoch": 302} {"train_loss": -8.34303092956543, "global_step": 50812, "epoch": 302} {"train_loss": -8.385725021362305, "global_step": 50813, "epoch": 302} {"train_loss": -8.364734649658203, "global_step": 50814, "epoch": 302} {"train_loss": -8.227684020996094, "global_step": 50815, "epoch": 302} {"train_loss": -8.042296409606934, "global_step": 50816, "epoch": 302} {"train_loss": -8.38861083984375, "global_step": 50817, "epoch": 302} {"train_loss": -7.758527755737305, "global_step": 50818, "epoch": 302} {"train_loss": -8.125055313110352, "global_step": 50819, "epoch": 302} {"train_loss": -7.680848598480225, "global_step": 50820, "epoch": 302} {"train_loss": -8.090778350830078, "global_step": 50821, "epoch": 302} {"train_loss": -8.108190536499023, "global_step": 50822, "epoch": 302} {"train_loss": -8.087898254394531, "global_step": 50823, "epoch": 302} {"train_loss": -8.148284912109375, "global_step": 50824, "epoch": 302} {"train_loss": -8.13386058807373, "global_step": 50825, "epoch": 302} {"train_loss": -8.056066513061523, "global_step": 50826, "epoch": 302} {"train_loss": -8.051227569580078, "global_step": 50827, "epoch": 302} {"train_loss": -8.405508041381836, "global_step": 50828, "epoch": 302} {"train_loss": -8.322125434875488, "global_step": 50829, "epoch": 302} {"train_loss": -8.229555130004883, "global_step": 50830, "epoch": 302} {"train_loss": -8.21866512298584, "global_step": 50831, "epoch": 302} {"train_loss": -8.32808780670166, "global_step": 50832, "epoch": 302} {"train_loss": -8.335348129272461, "global_step": 50833, "epoch": 302} {"train_loss": -8.42231559753418, "global_step": 50834, "epoch": 302} {"train_loss": -8.437823295593262, "global_step": 50835, "epoch": 302} {"train_loss": -8.410354614257812, "global_step": 50836, "epoch": 302} {"train_loss": -8.451581954956055, "global_step": 50837, "epoch": 302} {"train_loss": -8.352768898010254, "global_step": 50838, "epoch": 302} {"train_loss": -8.24195671081543, "global_step": 50839, "epoch": 302} {"train_loss": -8.362640380859375, "global_step": 50840, "epoch": 302} {"train_loss": -8.555042266845703, "global_step": 50841, "epoch": 302} {"train_loss": -8.412251472473145, "global_step": 50842, "epoch": 302} {"train_loss": -8.595945358276367, "global_step": 50843, "epoch": 302} {"train_loss": -8.416868209838867, "global_step": 50844, "epoch": 302} {"train_loss": -8.647529602050781, "global_step": 50845, "epoch": 302} {"train_loss": -8.405783653259277, "global_step": 50846, "epoch": 302} {"train_loss": -8.614641189575195, "global_step": 50847, "epoch": 302} {"train_loss": -8.407670974731445, "global_step": 50848, "epoch": 302} {"train_loss": -8.479926109313965, "global_step": 50849, "epoch": 302} {"train_loss": -8.61445140838623, "global_step": 50850, "epoch": 302} {"train_loss": -8.416959762573242, "global_step": 50851, "epoch": 302} {"train_loss": -8.35843276977539, "global_step": 50852, "epoch": 302} {"train_loss": -8.435213088989258, "global_step": 50853, "epoch": 302} {"train_loss": -8.371152877807617, "global_step": 50854, "epoch": 302} {"train_loss": -8.580451011657715, "global_step": 50855, "epoch": 302} {"train_loss": -8.3885498046875, "global_step": 50856, "epoch": 302} {"train_loss": -8.374933242797852, "global_step": 50857, "epoch": 302} {"train_loss": -8.363592147827148, "global_step": 50858, "epoch": 302} {"train_loss": -8.484678268432617, "global_step": 50859, "epoch": 302} {"train_loss": -8.638063430786133, "global_step": 50860, "epoch": 302} {"train_loss": -8.560474395751953, "global_step": 50861, "epoch": 302} {"train_loss": -8.335227012634277, "global_step": 50862, "epoch": 302} {"train_loss": -8.546939849853516, "global_step": 50863, "epoch": 302} {"train_loss": -8.20733642578125, "global_step": 50864, "epoch": 302} {"train_loss": -8.391929626464844, "global_step": 50865, "epoch": 302} {"train_loss": -8.19782829284668, "global_step": 50866, "epoch": 302} {"train_loss": -8.358399391174316, "global_step": 50867, "epoch": 302} {"train_loss": -8.207927703857422, "global_step": 50868, "epoch": 302} {"train_loss": -8.109809875488281, "global_step": 50869, "epoch": 302} {"train_loss": -8.39769458770752, "global_step": 50870, "epoch": 302} {"train_loss": -8.055574417114258, "global_step": 50871, "epoch": 302} {"train_loss": -8.292025566101074, "global_step": 50872, "epoch": 302} {"train_loss": -8.041509628295898, "global_step": 50873, "epoch": 302} {"train_loss": -8.46240520477295, "global_step": 50874, "epoch": 302} {"train_loss": -8.246478080749512, "global_step": 50875, "epoch": 302} {"train_loss": -8.377450942993164, "global_step": 50876, "epoch": 302} {"train_loss": -8.480953216552734, "global_step": 50877, "epoch": 302} {"train_loss": -8.053401947021484, "global_step": 50878, "epoch": 302} {"train_loss": -8.318889617919922, "global_step": 50879, "epoch": 302} {"train_loss": -8.370030403137207, "global_step": 50880, "epoch": 302} {"train_loss": -8.33008098602295, "global_step": 50881, "epoch": 302} {"train_loss": -8.209725379943848, "global_step": 50882, "epoch": 302} {"train_loss": -8.390643119812012, "global_step": 50883, "epoch": 302} {"train_loss": -8.289546966552734, "global_step": 50884, "epoch": 302} {"train_loss": -8.201517105102539, "global_step": 50885, "epoch": 302} {"train_loss": -8.386945724487305, "global_step": 50886, "epoch": 302} {"train_loss": -8.405641555786133, "global_step": 50887, "epoch": 302} {"train_loss": -8.038485527038574, "global_step": 50888, "epoch": 302} {"train_loss": -8.440156936645508, "global_step": 50889, "epoch": 302} {"train_loss": -8.039603233337402, "global_step": 50890, "epoch": 302} {"train_loss": -8.394655227661133, "global_step": 50891, "epoch": 302} {"train_loss": -8.446674346923828, "global_step": 50892, "epoch": 302} {"train_loss": -8.501758575439453, "global_step": 50893, "epoch": 302} {"train_loss": -8.388216018676758, "global_step": 50894, "epoch": 302} {"train_loss": -8.428470611572266, "global_step": 50895, "epoch": 302} {"train_loss": -8.471109390258789, "global_step": 50896, "epoch": 302} {"train_loss": -8.414505004882812, "global_step": 50897, "epoch": 302} {"train_loss": -8.100621223449707, "global_step": 50898, "epoch": 302} {"train_loss": -8.445635795593262, "global_step": 50899, "epoch": 302} {"train_loss": -8.268150329589844, "global_step": 50900, "epoch": 302} {"train_loss": -8.424600601196289, "global_step": 50901, "epoch": 302} {"train_loss": -8.557027816772461, "global_step": 50902, "epoch": 302} {"train_loss": -8.323941999957675, "global_step": 50903, "epoch": 302, "val_loss": 186968.8125} {"train_loss": -8.492589950561523, "global_step": 50904, "epoch": 303} {"train_loss": -8.35124683380127, "global_step": 50905, "epoch": 303} {"train_loss": -8.341978073120117, "global_step": 50906, "epoch": 303} {"train_loss": -8.325983047485352, "global_step": 50907, "epoch": 303} {"train_loss": -8.214200019836426, "global_step": 50908, "epoch": 303} {"train_loss": -8.251462936401367, "global_step": 50909, "epoch": 303} {"train_loss": -8.096647262573242, "global_step": 50910, "epoch": 303} {"train_loss": -8.499368667602539, "global_step": 50911, "epoch": 303} {"train_loss": -8.112628936767578, "global_step": 50912, "epoch": 303} {"train_loss": -8.419347763061523, "global_step": 50913, "epoch": 303} {"train_loss": -8.428080558776855, "global_step": 50914, "epoch": 303} {"train_loss": -8.253982543945312, "global_step": 50915, "epoch": 303} {"train_loss": -8.393842697143555, "global_step": 50916, "epoch": 303} {"train_loss": -8.335953712463379, "global_step": 50917, "epoch": 303} {"train_loss": -8.597904205322266, "global_step": 50918, "epoch": 303} {"train_loss": -8.425605773925781, "global_step": 50919, "epoch": 303} {"train_loss": -8.046907424926758, "global_step": 50920, "epoch": 303} {"train_loss": -8.289796829223633, "global_step": 50921, "epoch": 303} {"train_loss": -8.247941970825195, "global_step": 50922, "epoch": 303} {"train_loss": -8.08704948425293, "global_step": 50923, "epoch": 303} {"train_loss": -8.256853103637695, "global_step": 50924, "epoch": 303} {"train_loss": -8.281023025512695, "global_step": 50925, "epoch": 303} {"train_loss": -8.218792915344238, "global_step": 50926, "epoch": 303} {"train_loss": -8.487167358398438, "global_step": 50927, "epoch": 303} {"train_loss": -8.3318452835083, "global_step": 50928, "epoch": 303} {"train_loss": -8.093692779541016, "global_step": 50929, "epoch": 303} {"train_loss": -8.346687316894531, "global_step": 50930, "epoch": 303} {"train_loss": -8.289325714111328, "global_step": 50931, "epoch": 303} {"train_loss": -8.331710815429688, "global_step": 50932, "epoch": 303} {"train_loss": -8.38642406463623, "global_step": 50933, "epoch": 303} {"train_loss": -8.304004669189453, "global_step": 50934, "epoch": 303} {"train_loss": -8.282623291015625, "global_step": 50935, "epoch": 303} {"train_loss": -8.306608200073242, "global_step": 50936, "epoch": 303} {"train_loss": -8.313340187072754, "global_step": 50937, "epoch": 303} {"train_loss": -8.35141372680664, "global_step": 50938, "epoch": 303} {"train_loss": -8.421287536621094, "global_step": 50939, "epoch": 303} {"train_loss": -8.380352020263672, "global_step": 50940, "epoch": 303} {"train_loss": -8.53356647491455, "global_step": 50941, "epoch": 303} {"train_loss": -8.411800384521484, "global_step": 50942, "epoch": 303} {"train_loss": -8.339326858520508, "global_step": 50943, "epoch": 303} {"train_loss": -8.267297744750977, "global_step": 50944, "epoch": 303} {"train_loss": -8.292019844055176, "global_step": 50945, "epoch": 303} {"train_loss": -8.499664306640625, "global_step": 50946, "epoch": 303} {"train_loss": -8.111007690429688, "global_step": 50947, "epoch": 303} {"train_loss": -8.50191593170166, "global_step": 50948, "epoch": 303} {"train_loss": -8.268149375915527, "global_step": 50949, "epoch": 303} {"train_loss": -8.167197227478027, "global_step": 50950, "epoch": 303} {"train_loss": -8.433647155761719, "global_step": 50951, "epoch": 303} {"train_loss": -8.197912216186523, "global_step": 50952, "epoch": 303} {"train_loss": -8.582867622375488, "global_step": 50953, "epoch": 303} {"train_loss": -8.331903457641602, "global_step": 50954, "epoch": 303} {"train_loss": -8.497537612915039, "global_step": 50955, "epoch": 303} {"train_loss": -8.484912872314453, "global_step": 50956, "epoch": 303} {"train_loss": -8.219250679016113, "global_step": 50957, "epoch": 303} {"train_loss": -8.413044929504395, "global_step": 50958, "epoch": 303} {"train_loss": -8.371663093566895, "global_step": 50959, "epoch": 303} {"train_loss": -8.298444747924805, "global_step": 50960, "epoch": 303} {"train_loss": -8.53036880493164, "global_step": 50961, "epoch": 303} {"train_loss": -8.44920539855957, "global_step": 50962, "epoch": 303} {"train_loss": -8.371264457702637, "global_step": 50963, "epoch": 303} {"train_loss": -8.668517112731934, "global_step": 50964, "epoch": 303} {"train_loss": -8.514366149902344, "global_step": 50965, "epoch": 303} {"train_loss": -8.33338737487793, "global_step": 50966, "epoch": 303} {"train_loss": -8.572680473327637, "global_step": 50967, "epoch": 303} {"train_loss": -8.443620681762695, "global_step": 50968, "epoch": 303} {"train_loss": -8.194024085998535, "global_step": 50969, "epoch": 303} {"train_loss": -8.429390907287598, "global_step": 50970, "epoch": 303} {"train_loss": -8.412773132324219, "global_step": 50971, "epoch": 303} {"train_loss": -8.32730484008789, "global_step": 50972, "epoch": 303} {"train_loss": -8.605737686157227, "global_step": 50973, "epoch": 303} {"train_loss": -8.459000587463379, "global_step": 50974, "epoch": 303} {"train_loss": -8.457622528076172, "global_step": 50975, "epoch": 303} {"train_loss": -8.280618667602539, "global_step": 50976, "epoch": 303} {"train_loss": -8.426432609558105, "global_step": 50977, "epoch": 303} {"train_loss": -8.201757431030273, "global_step": 50978, "epoch": 303} {"train_loss": -8.163345336914062, "global_step": 50979, "epoch": 303} {"train_loss": -8.395591735839844, "global_step": 50980, "epoch": 303} {"train_loss": -8.214591979980469, "global_step": 50981, "epoch": 303} {"train_loss": -8.578920364379883, "global_step": 50982, "epoch": 303} {"train_loss": -8.081716537475586, "global_step": 50983, "epoch": 303} {"train_loss": -8.431282043457031, "global_step": 50984, "epoch": 303} {"train_loss": -8.502689361572266, "global_step": 50985, "epoch": 303} {"train_loss": -8.484658241271973, "global_step": 50986, "epoch": 303} {"train_loss": -8.62253189086914, "global_step": 50987, "epoch": 303} {"train_loss": -8.610641479492188, "global_step": 50988, "epoch": 303} {"train_loss": -8.459207534790039, "global_step": 50989, "epoch": 303} {"train_loss": -8.526968955993652, "global_step": 50990, "epoch": 303} {"train_loss": -8.548583030700684, "global_step": 50991, "epoch": 303} {"train_loss": -8.296855926513672, "global_step": 50992, "epoch": 303} {"train_loss": -8.468720436096191, "global_step": 50993, "epoch": 303} {"train_loss": -8.50757122039795, "global_step": 50994, "epoch": 303} {"train_loss": -8.482016563415527, "global_step": 50995, "epoch": 303} {"train_loss": -8.558271408081055, "global_step": 50996, "epoch": 303} {"train_loss": -8.221328735351562, "global_step": 50997, "epoch": 303} {"train_loss": -8.265427589416504, "global_step": 50998, "epoch": 303} {"train_loss": -8.43424129486084, "global_step": 50999, "epoch": 303} {"train_loss": -8.593567848205566, "global_step": 51000, "epoch": 303} {"train_loss": -8.34406566619873, "global_step": 51001, "epoch": 303} {"train_loss": -8.570013046264648, "global_step": 51002, "epoch": 303} {"train_loss": -8.526853561401367, "global_step": 51003, "epoch": 303} {"train_loss": -8.300768852233887, "global_step": 51004, "epoch": 303} {"train_loss": -8.5792236328125, "global_step": 51005, "epoch": 303} {"train_loss": -8.366874694824219, "global_step": 51006, "epoch": 303} {"train_loss": -8.436966896057129, "global_step": 51007, "epoch": 303} {"train_loss": -8.205324172973633, "global_step": 51008, "epoch": 303} {"train_loss": -8.12219524383545, "global_step": 51009, "epoch": 303} {"train_loss": -8.568536758422852, "global_step": 51010, "epoch": 303} {"train_loss": -8.100601196289062, "global_step": 51011, "epoch": 303} {"train_loss": -8.356280326843262, "global_step": 51012, "epoch": 303} {"train_loss": -8.128820419311523, "global_step": 51013, "epoch": 303} {"train_loss": -8.437590599060059, "global_step": 51014, "epoch": 303} {"train_loss": -8.128551483154297, "global_step": 51015, "epoch": 303} {"train_loss": -8.246789932250977, "global_step": 51016, "epoch": 303} {"train_loss": -8.308941841125488, "global_step": 51017, "epoch": 303} {"train_loss": -8.330493927001953, "global_step": 51018, "epoch": 303} {"train_loss": -8.068135261535645, "global_step": 51019, "epoch": 303} {"train_loss": -8.218488693237305, "global_step": 51020, "epoch": 303} {"train_loss": -8.200711250305176, "global_step": 51021, "epoch": 303} {"train_loss": -8.33230972290039, "global_step": 51022, "epoch": 303} {"train_loss": -8.38829231262207, "global_step": 51023, "epoch": 303} {"train_loss": -8.122346878051758, "global_step": 51024, "epoch": 303} {"train_loss": -8.563762664794922, "global_step": 51025, "epoch": 303} {"train_loss": -8.381948471069336, "global_step": 51026, "epoch": 303} {"train_loss": -8.404705047607422, "global_step": 51027, "epoch": 303} {"train_loss": -8.666841506958008, "global_step": 51028, "epoch": 303} {"train_loss": -8.491008758544922, "global_step": 51029, "epoch": 303} {"train_loss": -8.116118431091309, "global_step": 51030, "epoch": 303} {"train_loss": -8.640096664428711, "global_step": 51031, "epoch": 303} {"train_loss": -8.206153869628906, "global_step": 51032, "epoch": 303} {"train_loss": -8.257524490356445, "global_step": 51033, "epoch": 303} {"train_loss": -8.449785232543945, "global_step": 51034, "epoch": 303} {"train_loss": -8.375578880310059, "global_step": 51035, "epoch": 303} {"train_loss": -8.2424898147583, "global_step": 51036, "epoch": 303} {"train_loss": -8.462434768676758, "global_step": 51037, "epoch": 303} {"train_loss": -8.42796516418457, "global_step": 51038, "epoch": 303} {"train_loss": -8.547727584838867, "global_step": 51039, "epoch": 303} {"train_loss": -8.533766746520996, "global_step": 51040, "epoch": 303} {"train_loss": -8.57807731628418, "global_step": 51041, "epoch": 303} {"train_loss": -8.39614486694336, "global_step": 51042, "epoch": 303} {"train_loss": -8.46323013305664, "global_step": 51043, "epoch": 303} {"train_loss": -8.349843978881836, "global_step": 51044, "epoch": 303} {"train_loss": -8.390798568725586, "global_step": 51045, "epoch": 303} {"train_loss": -8.305129051208496, "global_step": 51046, "epoch": 303} {"train_loss": -8.468116760253906, "global_step": 51047, "epoch": 303} {"train_loss": -8.130146026611328, "global_step": 51048, "epoch": 303} {"train_loss": -8.532981872558594, "global_step": 51049, "epoch": 303} {"train_loss": -8.211727142333984, "global_step": 51050, "epoch": 303} {"train_loss": -8.199097633361816, "global_step": 51051, "epoch": 303} {"train_loss": -8.232240676879883, "global_step": 51052, "epoch": 303} {"train_loss": -8.262969970703125, "global_step": 51053, "epoch": 303} {"train_loss": -8.082477569580078, "global_step": 51054, "epoch": 303} {"train_loss": -8.344687461853027, "global_step": 51055, "epoch": 303} {"train_loss": -7.842331886291504, "global_step": 51056, "epoch": 303} {"train_loss": -8.378633499145508, "global_step": 51057, "epoch": 303} {"train_loss": -8.122552871704102, "global_step": 51058, "epoch": 303} {"train_loss": -8.220389366149902, "global_step": 51059, "epoch": 303} {"train_loss": -8.3099365234375, "global_step": 51060, "epoch": 303} {"train_loss": -8.37542724609375, "global_step": 51061, "epoch": 303} {"train_loss": -8.244705200195312, "global_step": 51062, "epoch": 303} {"train_loss": -8.242475509643555, "global_step": 51063, "epoch": 303} {"train_loss": -8.610750198364258, "global_step": 51064, "epoch": 303} {"train_loss": -8.457759857177734, "global_step": 51065, "epoch": 303} {"train_loss": -8.396190643310547, "global_step": 51066, "epoch": 303} {"train_loss": -8.587507247924805, "global_step": 51067, "epoch": 303} {"train_loss": -8.394323348999023, "global_step": 51068, "epoch": 303} {"train_loss": -8.504213333129883, "global_step": 51069, "epoch": 303} {"train_loss": -8.589309692382812, "global_step": 51070, "epoch": 303} {"train_loss": -8.361517718860082, "global_step": 51071, "epoch": 303, "val_loss": 188459.734375} {"train_loss": -8.18313980102539, "global_step": 51072, "epoch": 304} {"train_loss": -8.316619873046875, "global_step": 51073, "epoch": 304} {"train_loss": -8.584967613220215, "global_step": 51074, "epoch": 304} {"train_loss": -8.315893173217773, "global_step": 51075, "epoch": 304} {"train_loss": -8.345159530639648, "global_step": 51076, "epoch": 304} {"train_loss": -8.578950881958008, "global_step": 51077, "epoch": 304} {"train_loss": -8.682806968688965, "global_step": 51078, "epoch": 304} {"train_loss": -8.224699020385742, "global_step": 51079, "epoch": 304} {"train_loss": -8.201240539550781, "global_step": 51080, "epoch": 304} {"train_loss": -8.147913932800293, "global_step": 51081, "epoch": 304} {"train_loss": -8.381627082824707, "global_step": 51082, "epoch": 304} {"train_loss": -8.40500545501709, "global_step": 51083, "epoch": 304} {"train_loss": -8.471244812011719, "global_step": 51084, "epoch": 304} {"train_loss": -8.059589385986328, "global_step": 51085, "epoch": 304} {"train_loss": -8.567405700683594, "global_step": 51086, "epoch": 304} {"train_loss": -8.597471237182617, "global_step": 51087, "epoch": 304} {"train_loss": -8.234922409057617, "global_step": 51088, "epoch": 304} {"train_loss": -8.370203018188477, "global_step": 51089, "epoch": 304} {"train_loss": -8.378121376037598, "global_step": 51090, "epoch": 304} {"train_loss": -8.280864715576172, "global_step": 51091, "epoch": 304} {"train_loss": -8.317885398864746, "global_step": 51092, "epoch": 304} {"train_loss": -8.207208633422852, "global_step": 51093, "epoch": 304} {"train_loss": -8.419548988342285, "global_step": 51094, "epoch": 304} {"train_loss": -8.196954727172852, "global_step": 51095, "epoch": 304} {"train_loss": -8.138420104980469, "global_step": 51096, "epoch": 304} {"train_loss": -7.9839277267456055, "global_step": 51097, "epoch": 304} {"train_loss": -8.438741683959961, "global_step": 51098, "epoch": 304} {"train_loss": -8.260725975036621, "global_step": 51099, "epoch": 304} {"train_loss": -8.293214797973633, "global_step": 51100, "epoch": 304} {"train_loss": -8.325785636901855, "global_step": 51101, "epoch": 304} {"train_loss": -8.179132461547852, "global_step": 51102, "epoch": 304} {"train_loss": -8.280832290649414, "global_step": 51103, "epoch": 304} {"train_loss": -8.104042053222656, "global_step": 51104, "epoch": 304} {"train_loss": -8.381908416748047, "global_step": 51105, "epoch": 304} {"train_loss": -8.172365188598633, "global_step": 51106, "epoch": 304} {"train_loss": -8.115836143493652, "global_step": 51107, "epoch": 304} {"train_loss": -8.040185928344727, "global_step": 51108, "epoch": 304} {"train_loss": -8.566717147827148, "global_step": 51109, "epoch": 304} {"train_loss": -8.00759506225586, "global_step": 51110, "epoch": 304} {"train_loss": -8.051011085510254, "global_step": 51111, "epoch": 304} {"train_loss": -8.460256576538086, "global_step": 51112, "epoch": 304} {"train_loss": -8.47028636932373, "global_step": 51113, "epoch": 304} {"train_loss": -8.232572555541992, "global_step": 51114, "epoch": 304} {"train_loss": -8.383995056152344, "global_step": 51115, "epoch": 304} {"train_loss": -8.443089485168457, "global_step": 51116, "epoch": 304} {"train_loss": -8.332265853881836, "global_step": 51117, "epoch": 304} {"train_loss": -8.333663940429688, "global_step": 51118, "epoch": 304} {"train_loss": -8.407241821289062, "global_step": 51119, "epoch": 304} {"train_loss": -8.543780326843262, "global_step": 51120, "epoch": 304} {"train_loss": -8.13856315612793, "global_step": 51121, "epoch": 304} {"train_loss": -8.264270782470703, "global_step": 51122, "epoch": 304} {"train_loss": -8.429929733276367, "global_step": 51123, "epoch": 304} {"train_loss": -8.159071922302246, "global_step": 51124, "epoch": 304} {"train_loss": -8.434749603271484, "global_step": 51125, "epoch": 304} {"train_loss": -8.22864818572998, "global_step": 51126, "epoch": 304} {"train_loss": -8.354848861694336, "global_step": 51127, "epoch": 304} {"train_loss": -8.557296752929688, "global_step": 51128, "epoch": 304} {"train_loss": -8.63311767578125, "global_step": 51129, "epoch": 304} {"train_loss": -8.42026138305664, "global_step": 51130, "epoch": 304} {"train_loss": -8.259336471557617, "global_step": 51131, "epoch": 304} {"train_loss": -8.660737991333008, "global_step": 51132, "epoch": 304} {"train_loss": -8.143369674682617, "global_step": 51133, "epoch": 304} {"train_loss": -8.526665687561035, "global_step": 51134, "epoch": 304} {"train_loss": -8.261931419372559, "global_step": 51135, "epoch": 304} {"train_loss": -8.200979232788086, "global_step": 51136, "epoch": 304} {"train_loss": -8.26060676574707, "global_step": 51137, "epoch": 304} {"train_loss": -8.296524047851562, "global_step": 51138, "epoch": 304} {"train_loss": -8.031283378601074, "global_step": 51139, "epoch": 304} {"train_loss": -8.406084060668945, "global_step": 51140, "epoch": 304} {"train_loss": -8.153106689453125, "global_step": 51141, "epoch": 304} {"train_loss": -8.162723541259766, "global_step": 51142, "epoch": 304} {"train_loss": -8.214616775512695, "global_step": 51143, "epoch": 304} {"train_loss": -8.165107727050781, "global_step": 51144, "epoch": 304} {"train_loss": -8.402934074401855, "global_step": 51145, "epoch": 304} {"train_loss": -8.282018661499023, "global_step": 51146, "epoch": 304} {"train_loss": -8.351248741149902, "global_step": 51147, "epoch": 304} {"train_loss": -8.404325485229492, "global_step": 51148, "epoch": 304} {"train_loss": -8.25278091430664, "global_step": 51149, "epoch": 304} {"train_loss": -8.142866134643555, "global_step": 51150, "epoch": 304} {"train_loss": -8.384621620178223, "global_step": 51151, "epoch": 304} {"train_loss": -8.220722198486328, "global_step": 51152, "epoch": 304} {"train_loss": -8.303533554077148, "global_step": 51153, "epoch": 304} {"train_loss": -8.280954360961914, "global_step": 51154, "epoch": 304} {"train_loss": -8.249350547790527, "global_step": 51155, "epoch": 304} {"train_loss": -8.53914737701416, "global_step": 51156, "epoch": 304} {"train_loss": -8.316061019897461, "global_step": 51157, "epoch": 304} {"train_loss": -8.415180206298828, "global_step": 51158, "epoch": 304} {"train_loss": -8.136266708374023, "global_step": 51159, "epoch": 304} {"train_loss": -8.444378852844238, "global_step": 51160, "epoch": 304} {"train_loss": -8.479625701904297, "global_step": 51161, "epoch": 304} {"train_loss": -8.054546356201172, "global_step": 51162, "epoch": 304} {"train_loss": -8.396807670593262, "global_step": 51163, "epoch": 304} {"train_loss": -8.32339859008789, "global_step": 51164, "epoch": 304} {"train_loss": -8.369296073913574, "global_step": 51165, "epoch": 304} {"train_loss": -8.250441551208496, "global_step": 51166, "epoch": 304} {"train_loss": -8.498159408569336, "global_step": 51167, "epoch": 304} {"train_loss": -8.086706161499023, "global_step": 51168, "epoch": 304} {"train_loss": -8.44243049621582, "global_step": 51169, "epoch": 304} {"train_loss": -8.314032554626465, "global_step": 51170, "epoch": 304} {"train_loss": -8.423856735229492, "global_step": 51171, "epoch": 304} {"train_loss": -8.621289253234863, "global_step": 51172, "epoch": 304} {"train_loss": -8.539679527282715, "global_step": 51173, "epoch": 304} {"train_loss": -8.267322540283203, "global_step": 51174, "epoch": 304} {"train_loss": -8.501176834106445, "global_step": 51175, "epoch": 304} {"train_loss": -8.443685531616211, "global_step": 51176, "epoch": 304} {"train_loss": -8.150686264038086, "global_step": 51177, "epoch": 304} {"train_loss": -8.342375755310059, "global_step": 51178, "epoch": 304} {"train_loss": -8.344179153442383, "global_step": 51179, "epoch": 304} {"train_loss": -8.376808166503906, "global_step": 51180, "epoch": 304} {"train_loss": -8.108329772949219, "global_step": 51181, "epoch": 304} {"train_loss": -8.450199127197266, "global_step": 51182, "epoch": 304} {"train_loss": -8.476729393005371, "global_step": 51183, "epoch": 304} {"train_loss": -8.297931671142578, "global_step": 51184, "epoch": 304} {"train_loss": -8.09766674041748, "global_step": 51185, "epoch": 304} {"train_loss": -8.264619827270508, "global_step": 51186, "epoch": 304} {"train_loss": -8.237759590148926, "global_step": 51187, "epoch": 304} {"train_loss": -8.148151397705078, "global_step": 51188, "epoch": 304} {"train_loss": -8.48103141784668, "global_step": 51189, "epoch": 304} {"train_loss": -8.612977981567383, "global_step": 51190, "epoch": 304} {"train_loss": -8.287507057189941, "global_step": 51191, "epoch": 304} {"train_loss": -8.287973403930664, "global_step": 51192, "epoch": 304} {"train_loss": -8.434301376342773, "global_step": 51193, "epoch": 304} {"train_loss": -8.492246627807617, "global_step": 51194, "epoch": 304} {"train_loss": -8.46090030670166, "global_step": 51195, "epoch": 304} {"train_loss": -8.580066680908203, "global_step": 51196, "epoch": 304} {"train_loss": -8.491119384765625, "global_step": 51197, "epoch": 304} {"train_loss": -8.549060821533203, "global_step": 51198, "epoch": 304} {"train_loss": -8.482221603393555, "global_step": 51199, "epoch": 304} {"train_loss": -8.3968505859375, "global_step": 51200, "epoch": 304} {"train_loss": -8.310553550720215, "global_step": 51201, "epoch": 304} {"train_loss": -8.44292163848877, "global_step": 51202, "epoch": 304} {"train_loss": -8.347485542297363, "global_step": 51203, "epoch": 304} {"train_loss": -8.617362976074219, "global_step": 51204, "epoch": 304} {"train_loss": -8.504207611083984, "global_step": 51205, "epoch": 304} {"train_loss": -8.555023193359375, "global_step": 51206, "epoch": 304} {"train_loss": -8.55309772491455, "global_step": 51207, "epoch": 304} {"train_loss": -8.461649894714355, "global_step": 51208, "epoch": 304} {"train_loss": -8.528624534606934, "global_step": 51209, "epoch": 304} {"train_loss": -8.33271598815918, "global_step": 51210, "epoch": 304} {"train_loss": -8.524998664855957, "global_step": 51211, "epoch": 304} {"train_loss": -8.323406219482422, "global_step": 51212, "epoch": 304} {"train_loss": -8.571470260620117, "global_step": 51213, "epoch": 304} {"train_loss": -8.414796829223633, "global_step": 51214, "epoch": 304} {"train_loss": -8.3809814453125, "global_step": 51215, "epoch": 304} {"train_loss": -8.431588172912598, "global_step": 51216, "epoch": 304} {"train_loss": -8.64054012298584, "global_step": 51217, "epoch": 304} {"train_loss": -8.432595252990723, "global_step": 51218, "epoch": 304} {"train_loss": -8.366122245788574, "global_step": 51219, "epoch": 304} {"train_loss": -8.437260627746582, "global_step": 51220, "epoch": 304} {"train_loss": -8.334356307983398, "global_step": 51221, "epoch": 304} {"train_loss": -8.647692680358887, "global_step": 51222, "epoch": 304} {"train_loss": -8.633073806762695, "global_step": 51223, "epoch": 304} {"train_loss": -8.525638580322266, "global_step": 51224, "epoch": 304} {"train_loss": -8.399616241455078, "global_step": 51225, "epoch": 304} {"train_loss": -8.248916625976562, "global_step": 51226, "epoch": 304} {"train_loss": -8.350763320922852, "global_step": 51227, "epoch": 304} {"train_loss": -8.355140686035156, "global_step": 51228, "epoch": 304} {"train_loss": -8.248635292053223, "global_step": 51229, "epoch": 304} {"train_loss": -8.503252029418945, "global_step": 51230, "epoch": 304} {"train_loss": -8.364754676818848, "global_step": 51231, "epoch": 304} {"train_loss": -8.097967147827148, "global_step": 51232, "epoch": 304} {"train_loss": -8.25531005859375, "global_step": 51233, "epoch": 304} {"train_loss": -8.483890533447266, "global_step": 51234, "epoch": 304} {"train_loss": -8.488323211669922, "global_step": 51235, "epoch": 304} {"train_loss": -8.2706298828125, "global_step": 51236, "epoch": 304} {"train_loss": -8.558279037475586, "global_step": 51237, "epoch": 304} {"train_loss": -8.464017868041992, "global_step": 51238, "epoch": 304} {"train_loss": -8.35592289765676, "global_step": 51239, "epoch": 304, "val_loss": 188822.5} {"train_loss": -8.344070434570312, "global_step": 51240, "epoch": 305} {"train_loss": -8.408620834350586, "global_step": 51241, "epoch": 305} {"train_loss": -8.441438674926758, "global_step": 51242, "epoch": 305} {"train_loss": -8.397441864013672, "global_step": 51243, "epoch": 305} {"train_loss": -8.386722564697266, "global_step": 51244, "epoch": 305} {"train_loss": -7.9359941482543945, "global_step": 51245, "epoch": 305} {"train_loss": -8.30912971496582, "global_step": 51246, "epoch": 305} {"train_loss": -8.15088939666748, "global_step": 51247, "epoch": 305} {"train_loss": -8.438159942626953, "global_step": 51248, "epoch": 305} {"train_loss": -8.241998672485352, "global_step": 51249, "epoch": 305} {"train_loss": -8.206459045410156, "global_step": 51250, "epoch": 305} {"train_loss": -8.246135711669922, "global_step": 51251, "epoch": 305} {"train_loss": -8.280800819396973, "global_step": 51252, "epoch": 305} {"train_loss": -8.037147521972656, "global_step": 51253, "epoch": 305} {"train_loss": -8.05632209777832, "global_step": 51254, "epoch": 305} {"train_loss": -8.145625114440918, "global_step": 51255, "epoch": 305} {"train_loss": -8.199331283569336, "global_step": 51256, "epoch": 305} {"train_loss": -8.059118270874023, "global_step": 51257, "epoch": 305} {"train_loss": -8.22132682800293, "global_step": 51258, "epoch": 305} {"train_loss": -7.825538158416748, "global_step": 51259, "epoch": 305} {"train_loss": -8.229948043823242, "global_step": 51260, "epoch": 305} {"train_loss": -7.809597015380859, "global_step": 51261, "epoch": 305} {"train_loss": -8.247766494750977, "global_step": 51262, "epoch": 305} {"train_loss": -8.311206817626953, "global_step": 51263, "epoch": 305} {"train_loss": -8.234193801879883, "global_step": 51264, "epoch": 305} {"train_loss": -8.27260684967041, "global_step": 51265, "epoch": 305} {"train_loss": -8.005928039550781, "global_step": 51266, "epoch": 305} {"train_loss": -8.259740829467773, "global_step": 51267, "epoch": 305} {"train_loss": -8.263992309570312, "global_step": 51268, "epoch": 305} {"train_loss": -7.971266269683838, "global_step": 51269, "epoch": 305} {"train_loss": -8.223810195922852, "global_step": 51270, "epoch": 305} {"train_loss": -8.306449890136719, "global_step": 51271, "epoch": 305} {"train_loss": -8.253998756408691, "global_step": 51272, "epoch": 305} {"train_loss": -8.330020904541016, "global_step": 51273, "epoch": 305} {"train_loss": -8.26392936706543, "global_step": 51274, "epoch": 305} {"train_loss": -8.28764533996582, "global_step": 51275, "epoch": 305} {"train_loss": -8.272448539733887, "global_step": 51276, "epoch": 305} {"train_loss": -8.063417434692383, "global_step": 51277, "epoch": 305} {"train_loss": -8.373800277709961, "global_step": 51278, "epoch": 305} {"train_loss": -8.385498046875, "global_step": 51279, "epoch": 305} {"train_loss": -8.355761528015137, "global_step": 51280, "epoch": 305} {"train_loss": -8.154655456542969, "global_step": 51281, "epoch": 305} {"train_loss": -8.182966232299805, "global_step": 51282, "epoch": 305} {"train_loss": -8.141219139099121, "global_step": 51283, "epoch": 305} {"train_loss": -8.349275588989258, "global_step": 51284, "epoch": 305} {"train_loss": -8.423540115356445, "global_step": 51285, "epoch": 305} {"train_loss": -8.218124389648438, "global_step": 51286, "epoch": 305} {"train_loss": -8.419950485229492, "global_step": 51287, "epoch": 305} {"train_loss": -8.668135643005371, "global_step": 51288, "epoch": 305} {"train_loss": -8.506937026977539, "global_step": 51289, "epoch": 305} {"train_loss": -8.37824821472168, "global_step": 51290, "epoch": 305} {"train_loss": -8.352590560913086, "global_step": 51291, "epoch": 305} {"train_loss": -8.455081939697266, "global_step": 51292, "epoch": 305} {"train_loss": -8.333488464355469, "global_step": 51293, "epoch": 305} {"train_loss": -8.441941261291504, "global_step": 51294, "epoch": 305} {"train_loss": -8.429009437561035, "global_step": 51295, "epoch": 305} {"train_loss": -8.275507926940918, "global_step": 51296, "epoch": 305} {"train_loss": -8.561861038208008, "global_step": 51297, "epoch": 305} {"train_loss": -8.479582786560059, "global_step": 51298, "epoch": 305} {"train_loss": -8.406417846679688, "global_step": 51299, "epoch": 305} {"train_loss": -8.577054023742676, "global_step": 51300, "epoch": 305} {"train_loss": -8.580533981323242, "global_step": 51301, "epoch": 305} {"train_loss": -8.538829803466797, "global_step": 51302, "epoch": 305} {"train_loss": -8.32005500793457, "global_step": 51303, "epoch": 305} {"train_loss": -8.616477966308594, "global_step": 51304, "epoch": 305} {"train_loss": -8.567667007446289, "global_step": 51305, "epoch": 305} {"train_loss": -8.42973804473877, "global_step": 51306, "epoch": 305} {"train_loss": -8.5382080078125, "global_step": 51307, "epoch": 305} {"train_loss": -8.543785095214844, "global_step": 51308, "epoch": 305} {"train_loss": -8.696039199829102, "global_step": 51309, "epoch": 305} {"train_loss": -8.608413696289062, "global_step": 51310, "epoch": 305} {"train_loss": -8.281415939331055, "global_step": 51311, "epoch": 305} {"train_loss": -8.610912322998047, "global_step": 51312, "epoch": 305} {"train_loss": -8.547798156738281, "global_step": 51313, "epoch": 305} {"train_loss": -8.374029159545898, "global_step": 51314, "epoch": 305} {"train_loss": -8.465582847595215, "global_step": 51315, "epoch": 305} {"train_loss": -8.549297332763672, "global_step": 51316, "epoch": 305} {"train_loss": -8.428220748901367, "global_step": 51317, "epoch": 305} {"train_loss": -8.539986610412598, "global_step": 51318, "epoch": 305} {"train_loss": -8.668984413146973, "global_step": 51319, "epoch": 305} {"train_loss": -8.284245491027832, "global_step": 51320, "epoch": 305} {"train_loss": -8.239309310913086, "global_step": 51321, "epoch": 305} {"train_loss": -8.33319091796875, "global_step": 51322, "epoch": 305} {"train_loss": -8.150005340576172, "global_step": 51323, "epoch": 305} {"train_loss": -7.993517875671387, "global_step": 51324, "epoch": 305} {"train_loss": -7.9335479736328125, "global_step": 51325, "epoch": 305} {"train_loss": -7.64892578125, "global_step": 51326, "epoch": 305} {"train_loss": -8.075216293334961, "global_step": 51327, "epoch": 305} {"train_loss": -8.19908332824707, "global_step": 51328, "epoch": 305} {"train_loss": -8.313194274902344, "global_step": 51329, "epoch": 305} {"train_loss": -8.081398963928223, "global_step": 51330, "epoch": 305} {"train_loss": -8.114721298217773, "global_step": 51331, "epoch": 305} {"train_loss": -7.958130359649658, "global_step": 51332, "epoch": 305} {"train_loss": -8.092957496643066, "global_step": 51333, "epoch": 305} {"train_loss": -8.119519233703613, "global_step": 51334, "epoch": 305} {"train_loss": -8.129558563232422, "global_step": 51335, "epoch": 305} {"train_loss": -8.005504608154297, "global_step": 51336, "epoch": 305} {"train_loss": -8.197948455810547, "global_step": 51337, "epoch": 305} {"train_loss": -8.047460556030273, "global_step": 51338, "epoch": 305} {"train_loss": -8.212505340576172, "global_step": 51339, "epoch": 305} {"train_loss": -8.194791793823242, "global_step": 51340, "epoch": 305} {"train_loss": -8.230001449584961, "global_step": 51341, "epoch": 305} {"train_loss": -8.257721900939941, "global_step": 51342, "epoch": 305} {"train_loss": -8.072929382324219, "global_step": 51343, "epoch": 305} {"train_loss": -8.201141357421875, "global_step": 51344, "epoch": 305} {"train_loss": -8.297279357910156, "global_step": 51345, "epoch": 305} {"train_loss": -8.498048782348633, "global_step": 51346, "epoch": 305} {"train_loss": -8.249626159667969, "global_step": 51347, "epoch": 305} {"train_loss": -8.15570068359375, "global_step": 51348, "epoch": 305} {"train_loss": -8.484894752502441, "global_step": 51349, "epoch": 305} {"train_loss": -8.24606990814209, "global_step": 51350, "epoch": 305} {"train_loss": -8.642436981201172, "global_step": 51351, "epoch": 305} {"train_loss": -8.437494277954102, "global_step": 51352, "epoch": 305} {"train_loss": -8.41726016998291, "global_step": 51353, "epoch": 305} {"train_loss": -8.381233215332031, "global_step": 51354, "epoch": 305} {"train_loss": -8.131368637084961, "global_step": 51355, "epoch": 305} {"train_loss": -8.247793197631836, "global_step": 51356, "epoch": 305} {"train_loss": -8.377415657043457, "global_step": 51357, "epoch": 305} {"train_loss": -8.300149917602539, "global_step": 51358, "epoch": 305} {"train_loss": -8.568805694580078, "global_step": 51359, "epoch": 305} {"train_loss": -8.621925354003906, "global_step": 51360, "epoch": 305} {"train_loss": -8.464348793029785, "global_step": 51361, "epoch": 305} {"train_loss": -8.659639358520508, "global_step": 51362, "epoch": 305} {"train_loss": -8.611942291259766, "global_step": 51363, "epoch": 305} {"train_loss": -8.429676055908203, "global_step": 51364, "epoch": 305} {"train_loss": -8.64071273803711, "global_step": 51365, "epoch": 305} {"train_loss": -8.463465690612793, "global_step": 51366, "epoch": 305} {"train_loss": -8.465879440307617, "global_step": 51367, "epoch": 305} {"train_loss": -8.34199047088623, "global_step": 51368, "epoch": 305} {"train_loss": -8.555022239685059, "global_step": 51369, "epoch": 305} {"train_loss": -8.488283157348633, "global_step": 51370, "epoch": 305} {"train_loss": -8.42898178100586, "global_step": 51371, "epoch": 305} {"train_loss": -8.41838550567627, "global_step": 51372, "epoch": 305} {"train_loss": -8.31655502319336, "global_step": 51373, "epoch": 305} {"train_loss": -8.24984359741211, "global_step": 51374, "epoch": 305} {"train_loss": -8.064651489257812, "global_step": 51375, "epoch": 305} {"train_loss": -8.538368225097656, "global_step": 51376, "epoch": 305} {"train_loss": -8.245119094848633, "global_step": 51377, "epoch": 305} {"train_loss": -8.14055347442627, "global_step": 51378, "epoch": 305} {"train_loss": -8.190874099731445, "global_step": 51379, "epoch": 305} {"train_loss": -8.119230270385742, "global_step": 51380, "epoch": 305} {"train_loss": -8.062055587768555, "global_step": 51381, "epoch": 305} {"train_loss": -8.163002967834473, "global_step": 51382, "epoch": 305} {"train_loss": -8.231380462646484, "global_step": 51383, "epoch": 305} {"train_loss": -8.100584030151367, "global_step": 51384, "epoch": 305} {"train_loss": -7.826549530029297, "global_step": 51385, "epoch": 305} {"train_loss": -8.230749130249023, "global_step": 51386, "epoch": 305} {"train_loss": -8.016717910766602, "global_step": 51387, "epoch": 305} {"train_loss": -8.198689460754395, "global_step": 51388, "epoch": 305} {"train_loss": -8.319178581237793, "global_step": 51389, "epoch": 305} {"train_loss": -7.9627299308776855, "global_step": 51390, "epoch": 305} {"train_loss": -8.215713500976562, "global_step": 51391, "epoch": 305} {"train_loss": -8.314906120300293, "global_step": 51392, "epoch": 305} {"train_loss": -8.22795295715332, "global_step": 51393, "epoch": 305} {"train_loss": -8.301166534423828, "global_step": 51394, "epoch": 305} {"train_loss": -8.190374374389648, "global_step": 51395, "epoch": 305} {"train_loss": -8.444869995117188, "global_step": 51396, "epoch": 305} {"train_loss": -8.533885955810547, "global_step": 51397, "epoch": 305} {"train_loss": -8.146373748779297, "global_step": 51398, "epoch": 305} {"train_loss": -7.986722946166992, "global_step": 51399, "epoch": 305} {"train_loss": -8.317642211914062, "global_step": 51400, "epoch": 305} {"train_loss": -8.390602111816406, "global_step": 51401, "epoch": 305} {"train_loss": -8.268320083618164, "global_step": 51402, "epoch": 305} {"train_loss": -8.28689956665039, "global_step": 51403, "epoch": 305} {"train_loss": -8.099174499511719, "global_step": 51404, "epoch": 305} {"train_loss": -8.589336395263672, "global_step": 51405, "epoch": 305} {"train_loss": -8.246503829956055, "global_step": 51406, "epoch": 305} {"train_loss": -8.294665115220207, "global_step": 51407, "epoch": 305, "val_loss": 188441.765625, "train_action_mse_error": 10.31606674194336} {"train_loss": -8.320113182067871, "global_step": 51408, "epoch": 306} {"train_loss": -8.126195907592773, "global_step": 51409, "epoch": 306} {"train_loss": -8.448606491088867, "global_step": 51410, "epoch": 306} {"train_loss": -8.444960594177246, "global_step": 51411, "epoch": 306} {"train_loss": -8.568886756896973, "global_step": 51412, "epoch": 306} {"train_loss": -8.458128929138184, "global_step": 51413, "epoch": 306} {"train_loss": -8.41289234161377, "global_step": 51414, "epoch": 306} {"train_loss": -8.444299697875977, "global_step": 51415, "epoch": 306} {"train_loss": -8.255276679992676, "global_step": 51416, "epoch": 306} {"train_loss": -8.244462013244629, "global_step": 51417, "epoch": 306} {"train_loss": -8.483842849731445, "global_step": 51418, "epoch": 306} {"train_loss": -8.408242225646973, "global_step": 51419, "epoch": 306} {"train_loss": -8.308521270751953, "global_step": 51420, "epoch": 306} {"train_loss": -8.458490371704102, "global_step": 51421, "epoch": 306} {"train_loss": -8.331087112426758, "global_step": 51422, "epoch": 306} {"train_loss": -8.071547508239746, "global_step": 51423, "epoch": 306} {"train_loss": -8.603358268737793, "global_step": 51424, "epoch": 306} {"train_loss": -8.240394592285156, "global_step": 51425, "epoch": 306} {"train_loss": -8.235754013061523, "global_step": 51426, "epoch": 306} {"train_loss": -8.345466613769531, "global_step": 51427, "epoch": 306} {"train_loss": -8.468603134155273, "global_step": 51428, "epoch": 306} {"train_loss": -8.125423431396484, "global_step": 51429, "epoch": 306} {"train_loss": -8.381139755249023, "global_step": 51430, "epoch": 306} {"train_loss": -8.327886581420898, "global_step": 51431, "epoch": 306} {"train_loss": -8.396319389343262, "global_step": 51432, "epoch": 306} {"train_loss": -8.361138343811035, "global_step": 51433, "epoch": 306} {"train_loss": -8.581522941589355, "global_step": 51434, "epoch": 306} {"train_loss": -8.220056533813477, "global_step": 51435, "epoch": 306} {"train_loss": -8.337518692016602, "global_step": 51436, "epoch": 306} {"train_loss": -8.215365409851074, "global_step": 51437, "epoch": 306} {"train_loss": -8.482185363769531, "global_step": 51438, "epoch": 306} {"train_loss": -8.237839698791504, "global_step": 51439, "epoch": 306} {"train_loss": -8.448812484741211, "global_step": 51440, "epoch": 306} {"train_loss": -8.423130989074707, "global_step": 51441, "epoch": 306} {"train_loss": -8.149160385131836, "global_step": 51442, "epoch": 306} {"train_loss": -8.264795303344727, "global_step": 51443, "epoch": 306} {"train_loss": -8.256120681762695, "global_step": 51444, "epoch": 306} {"train_loss": -8.448362350463867, "global_step": 51445, "epoch": 306} {"train_loss": -8.491242408752441, "global_step": 51446, "epoch": 306} {"train_loss": -8.5010986328125, "global_step": 51447, "epoch": 306} {"train_loss": -8.52081298828125, "global_step": 51448, "epoch": 306} {"train_loss": -8.400285720825195, "global_step": 51449, "epoch": 306} {"train_loss": -8.367005348205566, "global_step": 51450, "epoch": 306} {"train_loss": -8.496435165405273, "global_step": 51451, "epoch": 306} {"train_loss": -8.511858940124512, "global_step": 51452, "epoch": 306} {"train_loss": -8.537246704101562, "global_step": 51453, "epoch": 306} {"train_loss": -8.362069129943848, "global_step": 51454, "epoch": 306} {"train_loss": -8.436073303222656, "global_step": 51455, "epoch": 306} {"train_loss": -8.642078399658203, "global_step": 51456, "epoch": 306} {"train_loss": -8.618062973022461, "global_step": 51457, "epoch": 306} {"train_loss": -8.442748069763184, "global_step": 51458, "epoch": 306} {"train_loss": -8.460693359375, "global_step": 51459, "epoch": 306} {"train_loss": -8.426057815551758, "global_step": 51460, "epoch": 306} {"train_loss": -8.562430381774902, "global_step": 51461, "epoch": 306} {"train_loss": -8.501269340515137, "global_step": 51462, "epoch": 306} {"train_loss": -8.434045791625977, "global_step": 51463, "epoch": 306} {"train_loss": -8.369865417480469, "global_step": 51464, "epoch": 306} {"train_loss": -8.586370468139648, "global_step": 51465, "epoch": 306} {"train_loss": -8.428077697753906, "global_step": 51466, "epoch": 306} {"train_loss": -8.416671752929688, "global_step": 51467, "epoch": 306} {"train_loss": -8.304557800292969, "global_step": 51468, "epoch": 306} {"train_loss": -8.515083312988281, "global_step": 51469, "epoch": 306} {"train_loss": -8.231337547302246, "global_step": 51470, "epoch": 306} {"train_loss": -8.176071166992188, "global_step": 51471, "epoch": 306} {"train_loss": -8.481182098388672, "global_step": 51472, "epoch": 306} {"train_loss": -8.218039512634277, "global_step": 51473, "epoch": 306} {"train_loss": -8.34245491027832, "global_step": 51474, "epoch": 306} {"train_loss": -8.377143859863281, "global_step": 51475, "epoch": 306} {"train_loss": -8.59992790222168, "global_step": 51476, "epoch": 306} {"train_loss": -8.578163146972656, "global_step": 51477, "epoch": 306} {"train_loss": -8.431184768676758, "global_step": 51478, "epoch": 306} {"train_loss": -8.456602096557617, "global_step": 51479, "epoch": 306} {"train_loss": -8.392702102661133, "global_step": 51480, "epoch": 306} {"train_loss": -8.491602897644043, "global_step": 51481, "epoch": 306} {"train_loss": -8.475231170654297, "global_step": 51482, "epoch": 306} {"train_loss": -8.48926067352295, "global_step": 51483, "epoch": 306} {"train_loss": -8.379146575927734, "global_step": 51484, "epoch": 306} {"train_loss": -8.474710464477539, "global_step": 51485, "epoch": 306} {"train_loss": -8.238231658935547, "global_step": 51486, "epoch": 306} {"train_loss": -8.291618347167969, "global_step": 51487, "epoch": 306} {"train_loss": -8.277966499328613, "global_step": 51488, "epoch": 306} {"train_loss": -8.445819854736328, "global_step": 51489, "epoch": 306} {"train_loss": -8.34965705871582, "global_step": 51490, "epoch": 306} {"train_loss": -8.22390365600586, "global_step": 51491, "epoch": 306} {"train_loss": -8.30653190612793, "global_step": 51492, "epoch": 306} {"train_loss": -8.505128860473633, "global_step": 51493, "epoch": 306} {"train_loss": -8.175243377685547, "global_step": 51494, "epoch": 306} {"train_loss": -8.311117172241211, "global_step": 51495, "epoch": 306} {"train_loss": -8.448680877685547, "global_step": 51496, "epoch": 306} {"train_loss": -8.447181701660156, "global_step": 51497, "epoch": 306} {"train_loss": -8.40754222869873, "global_step": 51498, "epoch": 306} {"train_loss": -8.232343673706055, "global_step": 51499, "epoch": 306} {"train_loss": -8.325105667114258, "global_step": 51500, "epoch": 306} {"train_loss": -8.181108474731445, "global_step": 51501, "epoch": 306} {"train_loss": -8.223318099975586, "global_step": 51502, "epoch": 306} {"train_loss": -8.436792373657227, "global_step": 51503, "epoch": 306} {"train_loss": -8.389355659484863, "global_step": 51504, "epoch": 306} {"train_loss": -8.363626480102539, "global_step": 51505, "epoch": 306} {"train_loss": -8.37299919128418, "global_step": 51506, "epoch": 306} {"train_loss": -8.457765579223633, "global_step": 51507, "epoch": 306} {"train_loss": -8.574151992797852, "global_step": 51508, "epoch": 306} {"train_loss": -8.480976104736328, "global_step": 51509, "epoch": 306} {"train_loss": -8.696802139282227, "global_step": 51510, "epoch": 306} {"train_loss": -8.451557159423828, "global_step": 51511, "epoch": 306} {"train_loss": -8.377911567687988, "global_step": 51512, "epoch": 306} {"train_loss": -8.484600067138672, "global_step": 51513, "epoch": 306} {"train_loss": -8.577634811401367, "global_step": 51514, "epoch": 306} {"train_loss": -8.54560375213623, "global_step": 51515, "epoch": 306} {"train_loss": -8.343005180358887, "global_step": 51516, "epoch": 306} {"train_loss": -8.62667179107666, "global_step": 51517, "epoch": 306} {"train_loss": -8.729379653930664, "global_step": 51518, "epoch": 306} {"train_loss": -8.361207962036133, "global_step": 51519, "epoch": 306} {"train_loss": -8.396897315979004, "global_step": 51520, "epoch": 306} {"train_loss": -8.156455993652344, "global_step": 51521, "epoch": 306} {"train_loss": -8.527179718017578, "global_step": 51522, "epoch": 306} {"train_loss": -8.347578048706055, "global_step": 51523, "epoch": 306} {"train_loss": -8.478147506713867, "global_step": 51524, "epoch": 306} {"train_loss": -8.438014030456543, "global_step": 51525, "epoch": 306} {"train_loss": -8.525856971740723, "global_step": 51526, "epoch": 306} {"train_loss": -8.300580978393555, "global_step": 51527, "epoch": 306} {"train_loss": -8.124117851257324, "global_step": 51528, "epoch": 306} {"train_loss": -8.101652145385742, "global_step": 51529, "epoch": 306} {"train_loss": -8.566006660461426, "global_step": 51530, "epoch": 306} {"train_loss": -8.15131950378418, "global_step": 51531, "epoch": 306} {"train_loss": -8.561253547668457, "global_step": 51532, "epoch": 306} {"train_loss": -8.44052791595459, "global_step": 51533, "epoch": 306} {"train_loss": -8.183062553405762, "global_step": 51534, "epoch": 306} {"train_loss": -8.478567123413086, "global_step": 51535, "epoch": 306} {"train_loss": -8.041694641113281, "global_step": 51536, "epoch": 306} {"train_loss": -8.290546417236328, "global_step": 51537, "epoch": 306} {"train_loss": -8.539023399353027, "global_step": 51538, "epoch": 306} {"train_loss": -8.270540237426758, "global_step": 51539, "epoch": 306} {"train_loss": -8.230524063110352, "global_step": 51540, "epoch": 306} {"train_loss": -8.147090911865234, "global_step": 51541, "epoch": 306} {"train_loss": -8.258668899536133, "global_step": 51542, "epoch": 306} {"train_loss": -8.358598709106445, "global_step": 51543, "epoch": 306} {"train_loss": -8.437704086303711, "global_step": 51544, "epoch": 306} {"train_loss": -8.276180267333984, "global_step": 51545, "epoch": 306} {"train_loss": -8.176515579223633, "global_step": 51546, "epoch": 306} {"train_loss": -8.361930847167969, "global_step": 51547, "epoch": 306} {"train_loss": -8.260098457336426, "global_step": 51548, "epoch": 306} {"train_loss": -8.221872329711914, "global_step": 51549, "epoch": 306} {"train_loss": -8.172114372253418, "global_step": 51550, "epoch": 306} {"train_loss": -8.330512046813965, "global_step": 51551, "epoch": 306} {"train_loss": -8.381678581237793, "global_step": 51552, "epoch": 306} {"train_loss": -8.32811164855957, "global_step": 51553, "epoch": 306} {"train_loss": -8.279226303100586, "global_step": 51554, "epoch": 306} {"train_loss": -8.528840065002441, "global_step": 51555, "epoch": 306} {"train_loss": -8.410103797912598, "global_step": 51556, "epoch": 306} {"train_loss": -8.409429550170898, "global_step": 51557, "epoch": 306} {"train_loss": -8.41173267364502, "global_step": 51558, "epoch": 306} {"train_loss": -8.549489974975586, "global_step": 51559, "epoch": 306} {"train_loss": -8.410774230957031, "global_step": 51560, "epoch": 306} {"train_loss": -8.497591018676758, "global_step": 51561, "epoch": 306} {"train_loss": -8.677490234375, "global_step": 51562, "epoch": 306} {"train_loss": -8.276969909667969, "global_step": 51563, "epoch": 306} {"train_loss": -8.488524436950684, "global_step": 51564, "epoch": 306} {"train_loss": -8.398411750793457, "global_step": 51565, "epoch": 306} {"train_loss": -8.587652206420898, "global_step": 51566, "epoch": 306} {"train_loss": -8.415822982788086, "global_step": 51567, "epoch": 306} {"train_loss": -8.268836975097656, "global_step": 51568, "epoch": 306} {"train_loss": -8.63833236694336, "global_step": 51569, "epoch": 306} {"train_loss": -8.122093200683594, "global_step": 51570, "epoch": 306} {"train_loss": -8.357551574707031, "global_step": 51571, "epoch": 306} {"train_loss": -8.509571075439453, "global_step": 51572, "epoch": 306} {"train_loss": -8.33306884765625, "global_step": 51573, "epoch": 306} {"train_loss": -8.522730827331543, "global_step": 51574, "epoch": 306} {"train_loss": -8.389240940411886, "global_step": 51575, "epoch": 306, "val_loss": 185700.625} {"train_loss": -8.212404251098633, "global_step": 51576, "epoch": 307} {"train_loss": -8.077142715454102, "global_step": 51577, "epoch": 307} {"train_loss": -8.028853416442871, "global_step": 51578, "epoch": 307} {"train_loss": -8.245157241821289, "global_step": 51579, "epoch": 307} {"train_loss": -8.043304443359375, "global_step": 51580, "epoch": 307} {"train_loss": -8.414295196533203, "global_step": 51581, "epoch": 307} {"train_loss": -8.203313827514648, "global_step": 51582, "epoch": 307} {"train_loss": -8.094810485839844, "global_step": 51583, "epoch": 307} {"train_loss": -8.269590377807617, "global_step": 51584, "epoch": 307} {"train_loss": -8.200765609741211, "global_step": 51585, "epoch": 307} {"train_loss": -8.15483283996582, "global_step": 51586, "epoch": 307} {"train_loss": -8.357873916625977, "global_step": 51587, "epoch": 307} {"train_loss": -8.252928733825684, "global_step": 51588, "epoch": 307} {"train_loss": -8.15467643737793, "global_step": 51589, "epoch": 307} {"train_loss": -8.261791229248047, "global_step": 51590, "epoch": 307} {"train_loss": -8.054561614990234, "global_step": 51591, "epoch": 307} {"train_loss": -7.9776201248168945, "global_step": 51592, "epoch": 307} {"train_loss": -8.16928482055664, "global_step": 51593, "epoch": 307} {"train_loss": -8.282014846801758, "global_step": 51594, "epoch": 307} {"train_loss": -7.992456912994385, "global_step": 51595, "epoch": 307} {"train_loss": -8.112178802490234, "global_step": 51596, "epoch": 307} {"train_loss": -8.473819732666016, "global_step": 51597, "epoch": 307} {"train_loss": -8.377935409545898, "global_step": 51598, "epoch": 307} {"train_loss": -8.414535522460938, "global_step": 51599, "epoch": 307} {"train_loss": -8.245574951171875, "global_step": 51600, "epoch": 307} {"train_loss": -8.355912208557129, "global_step": 51601, "epoch": 307} {"train_loss": -8.149368286132812, "global_step": 51602, "epoch": 307} {"train_loss": -8.44677734375, "global_step": 51603, "epoch": 307} {"train_loss": -8.306597709655762, "global_step": 51604, "epoch": 307} {"train_loss": -8.275358200073242, "global_step": 51605, "epoch": 307} {"train_loss": -8.179712295532227, "global_step": 51606, "epoch": 307} {"train_loss": -8.539214134216309, "global_step": 51607, "epoch": 307} {"train_loss": -8.360764503479004, "global_step": 51608, "epoch": 307} {"train_loss": -8.32432746887207, "global_step": 51609, "epoch": 307} {"train_loss": -8.367222785949707, "global_step": 51610, "epoch": 307} {"train_loss": -8.2105712890625, "global_step": 51611, "epoch": 307} {"train_loss": -8.371668815612793, "global_step": 51612, "epoch": 307} {"train_loss": -8.121809005737305, "global_step": 51613, "epoch": 307} {"train_loss": -8.60308837890625, "global_step": 51614, "epoch": 307} {"train_loss": -8.370965957641602, "global_step": 51615, "epoch": 307} {"train_loss": -8.34653091430664, "global_step": 51616, "epoch": 307} {"train_loss": -8.551944732666016, "global_step": 51617, "epoch": 307} {"train_loss": -8.702998161315918, "global_step": 51618, "epoch": 307} {"train_loss": -8.4921875, "global_step": 51619, "epoch": 307} {"train_loss": -8.571492195129395, "global_step": 51620, "epoch": 307} {"train_loss": -8.684713363647461, "global_step": 51621, "epoch": 307} {"train_loss": -8.497724533081055, "global_step": 51622, "epoch": 307} {"train_loss": -8.590408325195312, "global_step": 51623, "epoch": 307} {"train_loss": -8.38987922668457, "global_step": 51624, "epoch": 307} {"train_loss": -8.263543128967285, "global_step": 51625, "epoch": 307} {"train_loss": -8.127338409423828, "global_step": 51626, "epoch": 307} {"train_loss": -8.512547492980957, "global_step": 51627, "epoch": 307} {"train_loss": -7.9317402839660645, "global_step": 51628, "epoch": 307} {"train_loss": -8.098583221435547, "global_step": 51629, "epoch": 307} {"train_loss": -7.995165824890137, "global_step": 51630, "epoch": 307} {"train_loss": -8.026530265808105, "global_step": 51631, "epoch": 307} {"train_loss": -8.209131240844727, "global_step": 51632, "epoch": 307} {"train_loss": -8.313141822814941, "global_step": 51633, "epoch": 307} {"train_loss": -7.994792461395264, "global_step": 51634, "epoch": 307} {"train_loss": -8.091192245483398, "global_step": 51635, "epoch": 307} {"train_loss": -8.096793174743652, "global_step": 51636, "epoch": 307} {"train_loss": -7.87388277053833, "global_step": 51637, "epoch": 307} {"train_loss": -8.040142059326172, "global_step": 51638, "epoch": 307} {"train_loss": -8.065465927124023, "global_step": 51639, "epoch": 307} {"train_loss": -8.15550708770752, "global_step": 51640, "epoch": 307} {"train_loss": -8.21501636505127, "global_step": 51641, "epoch": 307} {"train_loss": -8.10532283782959, "global_step": 51642, "epoch": 307} {"train_loss": -8.327266693115234, "global_step": 51643, "epoch": 307} {"train_loss": -8.226354598999023, "global_step": 51644, "epoch": 307} {"train_loss": -8.241506576538086, "global_step": 51645, "epoch": 307} {"train_loss": -8.348775863647461, "global_step": 51646, "epoch": 307} {"train_loss": -8.475919723510742, "global_step": 51647, "epoch": 307} {"train_loss": -8.158590316772461, "global_step": 51648, "epoch": 307} {"train_loss": -8.292770385742188, "global_step": 51649, "epoch": 307} {"train_loss": -8.158208847045898, "global_step": 51650, "epoch": 307} {"train_loss": -8.464868545532227, "global_step": 51651, "epoch": 307} {"train_loss": -8.399297714233398, "global_step": 51652, "epoch": 307} {"train_loss": -7.916526794433594, "global_step": 51653, "epoch": 307} {"train_loss": -8.350137710571289, "global_step": 51654, "epoch": 307} {"train_loss": -8.32899284362793, "global_step": 51655, "epoch": 307} {"train_loss": -8.390480041503906, "global_step": 51656, "epoch": 307} {"train_loss": -8.298551559448242, "global_step": 51657, "epoch": 307} {"train_loss": -8.186372756958008, "global_step": 51658, "epoch": 307} {"train_loss": -8.436575889587402, "global_step": 51659, "epoch": 307} {"train_loss": -8.4158935546875, "global_step": 51660, "epoch": 307} {"train_loss": -8.369251251220703, "global_step": 51661, "epoch": 307} {"train_loss": -8.46947956085205, "global_step": 51662, "epoch": 307} {"train_loss": -8.466133117675781, "global_step": 51663, "epoch": 307} {"train_loss": -8.457352638244629, "global_step": 51664, "epoch": 307} {"train_loss": -8.406482696533203, "global_step": 51665, "epoch": 307} {"train_loss": -8.56259536743164, "global_step": 51666, "epoch": 307} {"train_loss": -8.584577560424805, "global_step": 51667, "epoch": 307} {"train_loss": -8.619146347045898, "global_step": 51668, "epoch": 307} {"train_loss": -8.516925811767578, "global_step": 51669, "epoch": 307} {"train_loss": -8.566505432128906, "global_step": 51670, "epoch": 307} {"train_loss": -8.518117904663086, "global_step": 51671, "epoch": 307} {"train_loss": -8.445980072021484, "global_step": 51672, "epoch": 307} {"train_loss": -8.456624984741211, "global_step": 51673, "epoch": 307} {"train_loss": -8.38528823852539, "global_step": 51674, "epoch": 307} {"train_loss": -8.530778884887695, "global_step": 51675, "epoch": 307} {"train_loss": -8.497809410095215, "global_step": 51676, "epoch": 307} {"train_loss": -8.221996307373047, "global_step": 51677, "epoch": 307} {"train_loss": -8.602952003479004, "global_step": 51678, "epoch": 307} {"train_loss": -8.38735580444336, "global_step": 51679, "epoch": 307} {"train_loss": -8.125953674316406, "global_step": 51680, "epoch": 307} {"train_loss": -8.29507827758789, "global_step": 51681, "epoch": 307} {"train_loss": -8.22789192199707, "global_step": 51682, "epoch": 307} {"train_loss": -8.350229263305664, "global_step": 51683, "epoch": 307} {"train_loss": -8.463878631591797, "global_step": 51684, "epoch": 307} {"train_loss": -8.087347984313965, "global_step": 51685, "epoch": 307} {"train_loss": -8.246277809143066, "global_step": 51686, "epoch": 307} {"train_loss": -7.481044769287109, "global_step": 51687, "epoch": 307} {"train_loss": -8.235121726989746, "global_step": 51688, "epoch": 307} {"train_loss": -7.759228706359863, "global_step": 51689, "epoch": 307} {"train_loss": -7.8897576332092285, "global_step": 51690, "epoch": 307} {"train_loss": -7.576757431030273, "global_step": 51691, "epoch": 307} {"train_loss": -7.661159992218018, "global_step": 51692, "epoch": 307} {"train_loss": -7.7502851486206055, "global_step": 51693, "epoch": 307} {"train_loss": -7.585573673248291, "global_step": 51694, "epoch": 307} {"train_loss": -7.7034125328063965, "global_step": 51695, "epoch": 307} {"train_loss": -7.7679243087768555, "global_step": 51696, "epoch": 307} {"train_loss": -7.712854385375977, "global_step": 51697, "epoch": 307} {"train_loss": -7.960357189178467, "global_step": 51698, "epoch": 307} {"train_loss": -7.91254997253418, "global_step": 51699, "epoch": 307} {"train_loss": -7.769295692443848, "global_step": 51700, "epoch": 307} {"train_loss": -7.993930339813232, "global_step": 51701, "epoch": 307} {"train_loss": -8.101398468017578, "global_step": 51702, "epoch": 307} {"train_loss": -7.910176753997803, "global_step": 51703, "epoch": 307} {"train_loss": -8.065069198608398, "global_step": 51704, "epoch": 307} {"train_loss": -8.010035514831543, "global_step": 51705, "epoch": 307} {"train_loss": -8.384846687316895, "global_step": 51706, "epoch": 307} {"train_loss": -8.243901252746582, "global_step": 51707, "epoch": 307} {"train_loss": -8.072151184082031, "global_step": 51708, "epoch": 307} {"train_loss": -8.136812210083008, "global_step": 51709, "epoch": 307} {"train_loss": -8.095781326293945, "global_step": 51710, "epoch": 307} {"train_loss": -8.16275691986084, "global_step": 51711, "epoch": 307} {"train_loss": -8.249307632446289, "global_step": 51712, "epoch": 307} {"train_loss": -8.008560180664062, "global_step": 51713, "epoch": 307} {"train_loss": -8.300858497619629, "global_step": 51714, "epoch": 307} {"train_loss": -8.391956329345703, "global_step": 51715, "epoch": 307} {"train_loss": -8.624914169311523, "global_step": 51716, "epoch": 307} {"train_loss": -8.513761520385742, "global_step": 51717, "epoch": 307} {"train_loss": -8.431984901428223, "global_step": 51718, "epoch": 307} {"train_loss": -8.526681900024414, "global_step": 51719, "epoch": 307} {"train_loss": -8.502690315246582, "global_step": 51720, "epoch": 307} {"train_loss": -8.58569622039795, "global_step": 51721, "epoch": 307} {"train_loss": -8.610137939453125, "global_step": 51722, "epoch": 307} {"train_loss": -8.560016632080078, "global_step": 51723, "epoch": 307} {"train_loss": -8.4916410446167, "global_step": 51724, "epoch": 307} {"train_loss": -8.398604393005371, "global_step": 51725, "epoch": 307} {"train_loss": -8.336690902709961, "global_step": 51726, "epoch": 307} {"train_loss": -8.287701606750488, "global_step": 51727, "epoch": 307} {"train_loss": -8.281684875488281, "global_step": 51728, "epoch": 307} {"train_loss": -8.139945983886719, "global_step": 51729, "epoch": 307} {"train_loss": -8.64141845703125, "global_step": 51730, "epoch": 307} {"train_loss": -8.31852912902832, "global_step": 51731, "epoch": 307} {"train_loss": -8.223115921020508, "global_step": 51732, "epoch": 307} {"train_loss": -8.707207679748535, "global_step": 51733, "epoch": 307} {"train_loss": -8.492155075073242, "global_step": 51734, "epoch": 307} {"train_loss": -8.148990631103516, "global_step": 51735, "epoch": 307} {"train_loss": -8.535164833068848, "global_step": 51736, "epoch": 307} {"train_loss": -8.331392288208008, "global_step": 51737, "epoch": 307} {"train_loss": -8.379304885864258, "global_step": 51738, "epoch": 307} {"train_loss": -8.530950546264648, "global_step": 51739, "epoch": 307} {"train_loss": -8.292035102844238, "global_step": 51740, "epoch": 307} {"train_loss": -8.054765701293945, "global_step": 51741, "epoch": 307} {"train_loss": -8.421548843383789, "global_step": 51742, "epoch": 307} {"train_loss": -8.260264251913343, "global_step": 51743, "epoch": 307, "val_loss": 185086.1875} {"train_loss": -8.222421646118164, "global_step": 51744, "epoch": 308} {"train_loss": -8.132365226745605, "global_step": 51745, "epoch": 308} {"train_loss": -8.090499877929688, "global_step": 51746, "epoch": 308} {"train_loss": -7.999063491821289, "global_step": 51747, "epoch": 308} {"train_loss": -8.40682315826416, "global_step": 51748, "epoch": 308} {"train_loss": -8.121395111083984, "global_step": 51749, "epoch": 308} {"train_loss": -8.537333488464355, "global_step": 51750, "epoch": 308} {"train_loss": -8.449686050415039, "global_step": 51751, "epoch": 308} {"train_loss": -8.277995109558105, "global_step": 51752, "epoch": 308} {"train_loss": -8.511077880859375, "global_step": 51753, "epoch": 308} {"train_loss": -8.316522598266602, "global_step": 51754, "epoch": 308} {"train_loss": -8.280271530151367, "global_step": 51755, "epoch": 308} {"train_loss": -8.42945671081543, "global_step": 51756, "epoch": 308} {"train_loss": -8.232206344604492, "global_step": 51757, "epoch": 308} {"train_loss": -8.297191619873047, "global_step": 51758, "epoch": 308} {"train_loss": -8.418190956115723, "global_step": 51759, "epoch": 308} {"train_loss": -8.313819885253906, "global_step": 51760, "epoch": 308} {"train_loss": -8.128082275390625, "global_step": 51761, "epoch": 308} {"train_loss": -8.150157928466797, "global_step": 51762, "epoch": 308} {"train_loss": -8.499176025390625, "global_step": 51763, "epoch": 308} {"train_loss": -8.389471054077148, "global_step": 51764, "epoch": 308} {"train_loss": -8.352746963500977, "global_step": 51765, "epoch": 308} {"train_loss": -8.256891250610352, "global_step": 51766, "epoch": 308} {"train_loss": -8.34429931640625, "global_step": 51767, "epoch": 308} {"train_loss": -8.427837371826172, "global_step": 51768, "epoch": 308} {"train_loss": -8.334936141967773, "global_step": 51769, "epoch": 308} {"train_loss": -8.39590835571289, "global_step": 51770, "epoch": 308} {"train_loss": -8.452169418334961, "global_step": 51771, "epoch": 308} {"train_loss": -8.553257942199707, "global_step": 51772, "epoch": 308} {"train_loss": -8.188920974731445, "global_step": 51773, "epoch": 308} {"train_loss": -8.53050422668457, "global_step": 51774, "epoch": 308} {"train_loss": -8.440869331359863, "global_step": 51775, "epoch": 308} {"train_loss": -8.539922714233398, "global_step": 51776, "epoch": 308} {"train_loss": -8.544737815856934, "global_step": 51777, "epoch": 308} {"train_loss": -8.286419868469238, "global_step": 51778, "epoch": 308} {"train_loss": -8.594259262084961, "global_step": 51779, "epoch": 308} {"train_loss": -8.529759407043457, "global_step": 51780, "epoch": 308} {"train_loss": -8.540017127990723, "global_step": 51781, "epoch": 308} {"train_loss": -8.216994285583496, "global_step": 51782, "epoch": 308} {"train_loss": -8.40325927734375, "global_step": 51783, "epoch": 308} {"train_loss": -8.37142562866211, "global_step": 51784, "epoch": 308} {"train_loss": -8.442022323608398, "global_step": 51785, "epoch": 308} {"train_loss": -8.182918548583984, "global_step": 51786, "epoch": 308} {"train_loss": -8.06821060180664, "global_step": 51787, "epoch": 308} {"train_loss": -8.342193603515625, "global_step": 51788, "epoch": 308} {"train_loss": -8.203882217407227, "global_step": 51789, "epoch": 308} {"train_loss": -8.299602508544922, "global_step": 51790, "epoch": 308} {"train_loss": -8.247245788574219, "global_step": 51791, "epoch": 308} {"train_loss": -8.222177505493164, "global_step": 51792, "epoch": 308} {"train_loss": -8.294647216796875, "global_step": 51793, "epoch": 308} {"train_loss": -8.07175350189209, "global_step": 51794, "epoch": 308} {"train_loss": -8.36570930480957, "global_step": 51795, "epoch": 308} {"train_loss": -8.48880386352539, "global_step": 51796, "epoch": 308} {"train_loss": -8.172325134277344, "global_step": 51797, "epoch": 308} {"train_loss": -8.483970642089844, "global_step": 51798, "epoch": 308} {"train_loss": -8.34228515625, "global_step": 51799, "epoch": 308} {"train_loss": -8.377185821533203, "global_step": 51800, "epoch": 308} {"train_loss": -8.47990608215332, "global_step": 51801, "epoch": 308} {"train_loss": -8.357412338256836, "global_step": 51802, "epoch": 308} {"train_loss": -8.518070220947266, "global_step": 51803, "epoch": 308} {"train_loss": -8.625638961791992, "global_step": 51804, "epoch": 308} {"train_loss": -8.315214157104492, "global_step": 51805, "epoch": 308} {"train_loss": -8.448738098144531, "global_step": 51806, "epoch": 308} {"train_loss": -8.530754089355469, "global_step": 51807, "epoch": 308} {"train_loss": -8.482112884521484, "global_step": 51808, "epoch": 308} {"train_loss": -8.574783325195312, "global_step": 51809, "epoch": 308} {"train_loss": -8.486371994018555, "global_step": 51810, "epoch": 308} {"train_loss": -8.429126739501953, "global_step": 51811, "epoch": 308} {"train_loss": -8.404953956604004, "global_step": 51812, "epoch": 308} {"train_loss": -8.351839065551758, "global_step": 51813, "epoch": 308} {"train_loss": -8.718016624450684, "global_step": 51814, "epoch": 308} {"train_loss": -8.556905746459961, "global_step": 51815, "epoch": 308} {"train_loss": -8.697328567504883, "global_step": 51816, "epoch": 308} {"train_loss": -8.227656364440918, "global_step": 51817, "epoch": 308} {"train_loss": -8.37908935546875, "global_step": 51818, "epoch": 308} {"train_loss": -8.42484188079834, "global_step": 51819, "epoch": 308} {"train_loss": -8.425625801086426, "global_step": 51820, "epoch": 308} {"train_loss": -8.562519073486328, "global_step": 51821, "epoch": 308} {"train_loss": -8.556482315063477, "global_step": 51822, "epoch": 308} {"train_loss": -8.404814720153809, "global_step": 51823, "epoch": 308} {"train_loss": -8.317842483520508, "global_step": 51824, "epoch": 308} {"train_loss": -8.507935523986816, "global_step": 51825, "epoch": 308} {"train_loss": -8.396982192993164, "global_step": 51826, "epoch": 308} {"train_loss": -8.660890579223633, "global_step": 51827, "epoch": 308} {"train_loss": -8.466514587402344, "global_step": 51828, "epoch": 308} {"train_loss": -8.264724731445312, "global_step": 51829, "epoch": 308} {"train_loss": -8.361837387084961, "global_step": 51830, "epoch": 308} {"train_loss": -8.17542839050293, "global_step": 51831, "epoch": 308} {"train_loss": -8.191606521606445, "global_step": 51832, "epoch": 308} {"train_loss": -8.573904037475586, "global_step": 51833, "epoch": 308} {"train_loss": -8.077296257019043, "global_step": 51834, "epoch": 308} {"train_loss": -8.64244270324707, "global_step": 51835, "epoch": 308} {"train_loss": -7.990699291229248, "global_step": 51836, "epoch": 308} {"train_loss": -8.306007385253906, "global_step": 51837, "epoch": 308} {"train_loss": -8.52352523803711, "global_step": 51838, "epoch": 308} {"train_loss": -8.26358413696289, "global_step": 51839, "epoch": 308} {"train_loss": -8.347270965576172, "global_step": 51840, "epoch": 308} {"train_loss": -8.298775672912598, "global_step": 51841, "epoch": 308} {"train_loss": -8.363187789916992, "global_step": 51842, "epoch": 308} {"train_loss": -8.22673225402832, "global_step": 51843, "epoch": 308} {"train_loss": -8.438599586486816, "global_step": 51844, "epoch": 308} {"train_loss": -8.43106460571289, "global_step": 51845, "epoch": 308} {"train_loss": -8.110441207885742, "global_step": 51846, "epoch": 308} {"train_loss": -8.16236400604248, "global_step": 51847, "epoch": 308} {"train_loss": -8.187990188598633, "global_step": 51848, "epoch": 308} {"train_loss": -8.177469253540039, "global_step": 51849, "epoch": 308} {"train_loss": -8.067788124084473, "global_step": 51850, "epoch": 308} {"train_loss": -8.381067276000977, "global_step": 51851, "epoch": 308} {"train_loss": -8.182516098022461, "global_step": 51852, "epoch": 308} {"train_loss": -8.414592742919922, "global_step": 51853, "epoch": 308} {"train_loss": -7.996588230133057, "global_step": 51854, "epoch": 308} {"train_loss": -8.273320198059082, "global_step": 51855, "epoch": 308} {"train_loss": -8.027421951293945, "global_step": 51856, "epoch": 308} {"train_loss": -8.265512466430664, "global_step": 51857, "epoch": 308} {"train_loss": -8.242534637451172, "global_step": 51858, "epoch": 308} {"train_loss": -8.125988006591797, "global_step": 51859, "epoch": 308} {"train_loss": -8.06466293334961, "global_step": 51860, "epoch": 308} {"train_loss": -8.099160194396973, "global_step": 51861, "epoch": 308} {"train_loss": -8.394441604614258, "global_step": 51862, "epoch": 308} {"train_loss": -8.346728324890137, "global_step": 51863, "epoch": 308} {"train_loss": -8.32959270477295, "global_step": 51864, "epoch": 308} {"train_loss": -8.306221008300781, "global_step": 51865, "epoch": 308} {"train_loss": -8.018721580505371, "global_step": 51866, "epoch": 308} {"train_loss": -8.453814506530762, "global_step": 51867, "epoch": 308} {"train_loss": -8.36783218383789, "global_step": 51868, "epoch": 308} {"train_loss": -8.389711380004883, "global_step": 51869, "epoch": 308} {"train_loss": -8.397954940795898, "global_step": 51870, "epoch": 308} {"train_loss": -8.28598690032959, "global_step": 51871, "epoch": 308} {"train_loss": -8.217698097229004, "global_step": 51872, "epoch": 308} {"train_loss": -8.465195655822754, "global_step": 51873, "epoch": 308} {"train_loss": -8.408820152282715, "global_step": 51874, "epoch": 308} {"train_loss": -8.25309944152832, "global_step": 51875, "epoch": 308} {"train_loss": -8.410801887512207, "global_step": 51876, "epoch": 308} {"train_loss": -8.444467544555664, "global_step": 51877, "epoch": 308} {"train_loss": -8.425281524658203, "global_step": 51878, "epoch": 308} {"train_loss": -8.431160926818848, "global_step": 51879, "epoch": 308} {"train_loss": -8.447380065917969, "global_step": 51880, "epoch": 308} {"train_loss": -8.312154769897461, "global_step": 51881, "epoch": 308} {"train_loss": -8.304560661315918, "global_step": 51882, "epoch": 308} {"train_loss": -8.421158790588379, "global_step": 51883, "epoch": 308} {"train_loss": -8.498069763183594, "global_step": 51884, "epoch": 308} {"train_loss": -8.292167663574219, "global_step": 51885, "epoch": 308} {"train_loss": -8.414259910583496, "global_step": 51886, "epoch": 308} {"train_loss": -8.223603248596191, "global_step": 51887, "epoch": 308} {"train_loss": -8.28680419921875, "global_step": 51888, "epoch": 308} {"train_loss": -8.433847427368164, "global_step": 51889, "epoch": 308} {"train_loss": -8.271849632263184, "global_step": 51890, "epoch": 308} {"train_loss": -8.453716278076172, "global_step": 51891, "epoch": 308} {"train_loss": -8.343055725097656, "global_step": 51892, "epoch": 308} {"train_loss": -8.374443054199219, "global_step": 51893, "epoch": 308} {"train_loss": -8.449665069580078, "global_step": 51894, "epoch": 308} {"train_loss": -8.479246139526367, "global_step": 51895, "epoch": 308} {"train_loss": -8.524629592895508, "global_step": 51896, "epoch": 308} {"train_loss": -8.15816879272461, "global_step": 51897, "epoch": 308} {"train_loss": -8.320003509521484, "global_step": 51898, "epoch": 308} {"train_loss": -8.47419548034668, "global_step": 51899, "epoch": 308} {"train_loss": -8.190549850463867, "global_step": 51900, "epoch": 308} {"train_loss": -8.414595603942871, "global_step": 51901, "epoch": 308} {"train_loss": -8.460741996765137, "global_step": 51902, "epoch": 308} {"train_loss": -8.633326530456543, "global_step": 51903, "epoch": 308} {"train_loss": -8.388885498046875, "global_step": 51904, "epoch": 308} {"train_loss": -8.606444358825684, "global_step": 51905, "epoch": 308} {"train_loss": -8.446840286254883, "global_step": 51906, "epoch": 308} {"train_loss": -8.34304141998291, "global_step": 51907, "epoch": 308} {"train_loss": -8.128564834594727, "global_step": 51908, "epoch": 308} {"train_loss": -8.488982200622559, "global_step": 51909, "epoch": 308} {"train_loss": -8.37187385559082, "global_step": 51910, "epoch": 308} {"train_loss": -8.353203029859634, "global_step": 51911, "epoch": 308, "val_loss": 186586.96875} {"train_loss": -8.038111686706543, "global_step": 51912, "epoch": 309} {"train_loss": -8.51284122467041, "global_step": 51913, "epoch": 309} {"train_loss": -7.6122355461120605, "global_step": 51914, "epoch": 309} {"train_loss": -8.471508026123047, "global_step": 51915, "epoch": 309} {"train_loss": -7.995342254638672, "global_step": 51916, "epoch": 309} {"train_loss": -8.150369644165039, "global_step": 51917, "epoch": 309} {"train_loss": -8.425557136535645, "global_step": 51918, "epoch": 309} {"train_loss": -8.438716888427734, "global_step": 51919, "epoch": 309} {"train_loss": -8.326974868774414, "global_step": 51920, "epoch": 309} {"train_loss": -8.399625778198242, "global_step": 51921, "epoch": 309} {"train_loss": -8.367936134338379, "global_step": 51922, "epoch": 309} {"train_loss": -8.239068984985352, "global_step": 51923, "epoch": 309} {"train_loss": -8.514030456542969, "global_step": 51924, "epoch": 309} {"train_loss": -8.203770637512207, "global_step": 51925, "epoch": 309} {"train_loss": -8.375669479370117, "global_step": 51926, "epoch": 309} {"train_loss": -8.38399887084961, "global_step": 51927, "epoch": 309} {"train_loss": -8.186293601989746, "global_step": 51928, "epoch": 309} {"train_loss": -8.65111255645752, "global_step": 51929, "epoch": 309} {"train_loss": -8.276300430297852, "global_step": 51930, "epoch": 309} {"train_loss": -8.461905479431152, "global_step": 51931, "epoch": 309} {"train_loss": -8.41415786743164, "global_step": 51932, "epoch": 309} {"train_loss": -8.466191291809082, "global_step": 51933, "epoch": 309} {"train_loss": -8.304878234863281, "global_step": 51934, "epoch": 309} {"train_loss": -8.393491744995117, "global_step": 51935, "epoch": 309} {"train_loss": -8.282061576843262, "global_step": 51936, "epoch": 309} {"train_loss": -8.607553482055664, "global_step": 51937, "epoch": 309} {"train_loss": -8.513548851013184, "global_step": 51938, "epoch": 309} {"train_loss": -8.514312744140625, "global_step": 51939, "epoch": 309} {"train_loss": -8.315645217895508, "global_step": 51940, "epoch": 309} {"train_loss": -8.484386444091797, "global_step": 51941, "epoch": 309} {"train_loss": -8.4747314453125, "global_step": 51942, "epoch": 309} {"train_loss": -8.249603271484375, "global_step": 51943, "epoch": 309} {"train_loss": -8.572347640991211, "global_step": 51944, "epoch": 309} {"train_loss": -8.327093124389648, "global_step": 51945, "epoch": 309} {"train_loss": -8.649881362915039, "global_step": 51946, "epoch": 309} {"train_loss": -8.193183898925781, "global_step": 51947, "epoch": 309} {"train_loss": -8.520946502685547, "global_step": 51948, "epoch": 309} {"train_loss": -8.20724105834961, "global_step": 51949, "epoch": 309} {"train_loss": -8.32078742980957, "global_step": 51950, "epoch": 309} {"train_loss": -8.240447044372559, "global_step": 51951, "epoch": 309} {"train_loss": -8.626641273498535, "global_step": 51952, "epoch": 309} {"train_loss": -8.220706939697266, "global_step": 51953, "epoch": 309} {"train_loss": -8.399001121520996, "global_step": 51954, "epoch": 309} {"train_loss": -8.294612884521484, "global_step": 51955, "epoch": 309} {"train_loss": -8.527948379516602, "global_step": 51956, "epoch": 309} {"train_loss": -8.138232231140137, "global_step": 51957, "epoch": 309} {"train_loss": -8.45314884185791, "global_step": 51958, "epoch": 309} {"train_loss": -8.369094848632812, "global_step": 51959, "epoch": 309} {"train_loss": -8.509272575378418, "global_step": 51960, "epoch": 309} {"train_loss": -8.281335830688477, "global_step": 51961, "epoch": 309} {"train_loss": -8.403095245361328, "global_step": 51962, "epoch": 309} {"train_loss": -8.270785331726074, "global_step": 51963, "epoch": 309} {"train_loss": -8.414854049682617, "global_step": 51964, "epoch": 309} {"train_loss": -8.15211296081543, "global_step": 51965, "epoch": 309} {"train_loss": -8.384134292602539, "global_step": 51966, "epoch": 309} {"train_loss": -8.330044746398926, "global_step": 51967, "epoch": 309} {"train_loss": -8.224027633666992, "global_step": 51968, "epoch": 309} {"train_loss": -8.41833209991455, "global_step": 51969, "epoch": 309} {"train_loss": -8.276849746704102, "global_step": 51970, "epoch": 309} {"train_loss": -8.308164596557617, "global_step": 51971, "epoch": 309} {"train_loss": -8.33951187133789, "global_step": 51972, "epoch": 309} {"train_loss": -8.312433242797852, "global_step": 51973, "epoch": 309} {"train_loss": -8.411369323730469, "global_step": 51974, "epoch": 309} {"train_loss": -8.492355346679688, "global_step": 51975, "epoch": 309} {"train_loss": -8.33333683013916, "global_step": 51976, "epoch": 309} {"train_loss": -8.498104095458984, "global_step": 51977, "epoch": 309} {"train_loss": -8.521035194396973, "global_step": 51978, "epoch": 309} {"train_loss": -8.549684524536133, "global_step": 51979, "epoch": 309} {"train_loss": -8.659880638122559, "global_step": 51980, "epoch": 309} {"train_loss": -8.405949592590332, "global_step": 51981, "epoch": 309} {"train_loss": -8.629707336425781, "global_step": 51982, "epoch": 309} {"train_loss": -8.531783103942871, "global_step": 51983, "epoch": 309} {"train_loss": -8.5628023147583, "global_step": 51984, "epoch": 309} {"train_loss": -8.37767505645752, "global_step": 51985, "epoch": 309} {"train_loss": -8.510476112365723, "global_step": 51986, "epoch": 309} {"train_loss": -8.290023803710938, "global_step": 51987, "epoch": 309} {"train_loss": -8.419696807861328, "global_step": 51988, "epoch": 309} {"train_loss": -8.502015113830566, "global_step": 51989, "epoch": 309} {"train_loss": -8.317327499389648, "global_step": 51990, "epoch": 309} {"train_loss": -8.500317573547363, "global_step": 51991, "epoch": 309} {"train_loss": -8.448488235473633, "global_step": 51992, "epoch": 309} {"train_loss": -8.452878952026367, "global_step": 51993, "epoch": 309} {"train_loss": -8.496686935424805, "global_step": 51994, "epoch": 309} {"train_loss": -8.636244773864746, "global_step": 51995, "epoch": 309} {"train_loss": -8.532065391540527, "global_step": 51996, "epoch": 309} {"train_loss": -8.605264663696289, "global_step": 51997, "epoch": 309} {"train_loss": -8.514373779296875, "global_step": 51998, "epoch": 309} {"train_loss": -8.490509033203125, "global_step": 51999, "epoch": 309} {"train_loss": -8.42054271697998, "global_step": 52000, "epoch": 309} {"train_loss": -8.334227561950684, "global_step": 52001, "epoch": 309} {"train_loss": -8.649776458740234, "global_step": 52002, "epoch": 309} {"train_loss": -8.602425575256348, "global_step": 52003, "epoch": 309} {"train_loss": -8.505428314208984, "global_step": 52004, "epoch": 309} {"train_loss": -8.470845222473145, "global_step": 52005, "epoch": 309} {"train_loss": -8.4573335647583, "global_step": 52006, "epoch": 309} {"train_loss": -8.35835075378418, "global_step": 52007, "epoch": 309} {"train_loss": -8.420906066894531, "global_step": 52008, "epoch": 309} {"train_loss": -8.484472274780273, "global_step": 52009, "epoch": 309} {"train_loss": -8.353727340698242, "global_step": 52010, "epoch": 309} {"train_loss": -8.370443344116211, "global_step": 52011, "epoch": 309} {"train_loss": -8.39518928527832, "global_step": 52012, "epoch": 309} {"train_loss": -8.394721984863281, "global_step": 52013, "epoch": 309} {"train_loss": -7.944447994232178, "global_step": 52014, "epoch": 309} {"train_loss": -8.538613319396973, "global_step": 52015, "epoch": 309} {"train_loss": -8.1768217086792, "global_step": 52016, "epoch": 309} {"train_loss": -8.55483627319336, "global_step": 52017, "epoch": 309} {"train_loss": -8.29556655883789, "global_step": 52018, "epoch": 309} {"train_loss": -8.20414924621582, "global_step": 52019, "epoch": 309} {"train_loss": -8.358325004577637, "global_step": 52020, "epoch": 309} {"train_loss": -8.224188804626465, "global_step": 52021, "epoch": 309} {"train_loss": -8.341751098632812, "global_step": 52022, "epoch": 309} {"train_loss": -8.48529052734375, "global_step": 52023, "epoch": 309} {"train_loss": -8.304475784301758, "global_step": 52024, "epoch": 309} {"train_loss": -8.530620574951172, "global_step": 52025, "epoch": 309} {"train_loss": -8.644266128540039, "global_step": 52026, "epoch": 309} {"train_loss": -8.46186637878418, "global_step": 52027, "epoch": 309} {"train_loss": -8.551431655883789, "global_step": 52028, "epoch": 309} {"train_loss": -8.444305419921875, "global_step": 52029, "epoch": 309} {"train_loss": -8.638113021850586, "global_step": 52030, "epoch": 309} {"train_loss": -8.358766555786133, "global_step": 52031, "epoch": 309} {"train_loss": -8.471195220947266, "global_step": 52032, "epoch": 309} {"train_loss": -8.48816204071045, "global_step": 52033, "epoch": 309} {"train_loss": -8.274967193603516, "global_step": 52034, "epoch": 309} {"train_loss": -8.597457885742188, "global_step": 52035, "epoch": 309} {"train_loss": -8.528868675231934, "global_step": 52036, "epoch": 309} {"train_loss": -8.420385360717773, "global_step": 52037, "epoch": 309} {"train_loss": -8.557425498962402, "global_step": 52038, "epoch": 309} {"train_loss": -8.645549774169922, "global_step": 52039, "epoch": 309} {"train_loss": -8.357540130615234, "global_step": 52040, "epoch": 309} {"train_loss": -8.492652893066406, "global_step": 52041, "epoch": 309} {"train_loss": -8.314535140991211, "global_step": 52042, "epoch": 309} {"train_loss": -8.436609268188477, "global_step": 52043, "epoch": 309} {"train_loss": -8.413909912109375, "global_step": 52044, "epoch": 309} {"train_loss": -8.310710906982422, "global_step": 52045, "epoch": 309} {"train_loss": -8.427684783935547, "global_step": 52046, "epoch": 309} {"train_loss": -7.821274757385254, "global_step": 52047, "epoch": 309} {"train_loss": -8.21899700164795, "global_step": 52048, "epoch": 309} {"train_loss": -8.080251693725586, "global_step": 52049, "epoch": 309} {"train_loss": -8.31035327911377, "global_step": 52050, "epoch": 309} {"train_loss": -7.843635559082031, "global_step": 52051, "epoch": 309} {"train_loss": -8.23396110534668, "global_step": 52052, "epoch": 309} {"train_loss": -8.005935668945312, "global_step": 52053, "epoch": 309} {"train_loss": -8.521297454833984, "global_step": 52054, "epoch": 309} {"train_loss": -8.072325706481934, "global_step": 52055, "epoch": 309} {"train_loss": -8.318524360656738, "global_step": 52056, "epoch": 309} {"train_loss": -8.43010139465332, "global_step": 52057, "epoch": 309} {"train_loss": -8.191670417785645, "global_step": 52058, "epoch": 309} {"train_loss": -8.313347816467285, "global_step": 52059, "epoch": 309} {"train_loss": -8.169963836669922, "global_step": 52060, "epoch": 309} {"train_loss": -8.440945625305176, "global_step": 52061, "epoch": 309} {"train_loss": -8.204154968261719, "global_step": 52062, "epoch": 309} {"train_loss": -8.166159629821777, "global_step": 52063, "epoch": 309} {"train_loss": -8.516292572021484, "global_step": 52064, "epoch": 309} {"train_loss": -8.10899543762207, "global_step": 52065, "epoch": 309} {"train_loss": -8.380867004394531, "global_step": 52066, "epoch": 309} {"train_loss": -8.143402099609375, "global_step": 52067, "epoch": 309} {"train_loss": -8.304525375366211, "global_step": 52068, "epoch": 309} {"train_loss": -8.30063247680664, "global_step": 52069, "epoch": 309} {"train_loss": -8.368927001953125, "global_step": 52070, "epoch": 309} {"train_loss": -8.373952865600586, "global_step": 52071, "epoch": 309} {"train_loss": -8.375431060791016, "global_step": 52072, "epoch": 309} {"train_loss": -8.312555313110352, "global_step": 52073, "epoch": 309} {"train_loss": -8.364688873291016, "global_step": 52074, "epoch": 309} {"train_loss": -8.257271766662598, "global_step": 52075, "epoch": 309} {"train_loss": -8.3448486328125, "global_step": 52076, "epoch": 309} {"train_loss": -8.451192855834961, "global_step": 52077, "epoch": 309} {"train_loss": -8.517053604125977, "global_step": 52078, "epoch": 309} {"train_loss": -8.376073036875043, "global_step": 52079, "epoch": 309, "val_loss": 188881.859375} {"train_loss": -8.242830276489258, "global_step": 52080, "epoch": 310} {"train_loss": -8.412217140197754, "global_step": 52081, "epoch": 310} {"train_loss": -8.20382308959961, "global_step": 52082, "epoch": 310} {"train_loss": -8.528800010681152, "global_step": 52083, "epoch": 310} {"train_loss": -8.127193450927734, "global_step": 52084, "epoch": 310} {"train_loss": -8.433067321777344, "global_step": 52085, "epoch": 310} {"train_loss": -8.21705150604248, "global_step": 52086, "epoch": 310} {"train_loss": -8.318096160888672, "global_step": 52087, "epoch": 310} {"train_loss": -7.93383264541626, "global_step": 52088, "epoch": 310} {"train_loss": -8.094978332519531, "global_step": 52089, "epoch": 310} {"train_loss": -8.152518272399902, "global_step": 52090, "epoch": 310} {"train_loss": -7.919750213623047, "global_step": 52091, "epoch": 310} {"train_loss": -7.790792465209961, "global_step": 52092, "epoch": 310} {"train_loss": -8.306190490722656, "global_step": 52093, "epoch": 310} {"train_loss": -7.833615303039551, "global_step": 52094, "epoch": 310} {"train_loss": -7.988153457641602, "global_step": 52095, "epoch": 310} {"train_loss": -7.96401834487915, "global_step": 52096, "epoch": 310} {"train_loss": -8.481074333190918, "global_step": 52097, "epoch": 310} {"train_loss": -8.227330207824707, "global_step": 52098, "epoch": 310} {"train_loss": -8.258146286010742, "global_step": 52099, "epoch": 310} {"train_loss": -8.11623477935791, "global_step": 52100, "epoch": 310} {"train_loss": -8.294119834899902, "global_step": 52101, "epoch": 310} {"train_loss": -8.20296859741211, "global_step": 52102, "epoch": 310} {"train_loss": -8.259557723999023, "global_step": 52103, "epoch": 310} {"train_loss": -8.400612831115723, "global_step": 52104, "epoch": 310} {"train_loss": -8.384941101074219, "global_step": 52105, "epoch": 310} {"train_loss": -8.376442909240723, "global_step": 52106, "epoch": 310} {"train_loss": -8.185840606689453, "global_step": 52107, "epoch": 310} {"train_loss": -8.616132736206055, "global_step": 52108, "epoch": 310} {"train_loss": -8.418529510498047, "global_step": 52109, "epoch": 310} {"train_loss": -8.364002227783203, "global_step": 52110, "epoch": 310} {"train_loss": -8.423730850219727, "global_step": 52111, "epoch": 310} {"train_loss": -8.660455703735352, "global_step": 52112, "epoch": 310} {"train_loss": -8.613629341125488, "global_step": 52113, "epoch": 310} {"train_loss": -8.716729164123535, "global_step": 52114, "epoch": 310} {"train_loss": -8.556463241577148, "global_step": 52115, "epoch": 310} {"train_loss": -8.359050750732422, "global_step": 52116, "epoch": 310} {"train_loss": -8.419347763061523, "global_step": 52117, "epoch": 310} {"train_loss": -8.722050666809082, "global_step": 52118, "epoch": 310} {"train_loss": -8.532014846801758, "global_step": 52119, "epoch": 310} {"train_loss": -8.248605728149414, "global_step": 52120, "epoch": 310} {"train_loss": -8.397038459777832, "global_step": 52121, "epoch": 310} {"train_loss": -8.657230377197266, "global_step": 52122, "epoch": 310} {"train_loss": -8.59024429321289, "global_step": 52123, "epoch": 310} {"train_loss": -8.559003829956055, "global_step": 52124, "epoch": 310} {"train_loss": -8.666872024536133, "global_step": 52125, "epoch": 310} {"train_loss": -8.693418502807617, "global_step": 52126, "epoch": 310} {"train_loss": -8.735072135925293, "global_step": 52127, "epoch": 310} {"train_loss": -8.731647491455078, "global_step": 52128, "epoch": 310} {"train_loss": -8.797283172607422, "global_step": 52129, "epoch": 310} {"train_loss": -8.452972412109375, "global_step": 52130, "epoch": 310} {"train_loss": -8.455591201782227, "global_step": 52131, "epoch": 310} {"train_loss": -8.512638092041016, "global_step": 52132, "epoch": 310} {"train_loss": -8.68631362915039, "global_step": 52133, "epoch": 310} {"train_loss": -8.532071113586426, "global_step": 52134, "epoch": 310} {"train_loss": -8.587162017822266, "global_step": 52135, "epoch": 310} {"train_loss": -8.503055572509766, "global_step": 52136, "epoch": 310} {"train_loss": -8.582101821899414, "global_step": 52137, "epoch": 310} {"train_loss": -8.679472923278809, "global_step": 52138, "epoch": 310} {"train_loss": -8.470051765441895, "global_step": 52139, "epoch": 310} {"train_loss": -8.52955150604248, "global_step": 52140, "epoch": 310} {"train_loss": -8.138198852539062, "global_step": 52141, "epoch": 310} {"train_loss": -8.247635841369629, "global_step": 52142, "epoch": 310} {"train_loss": -8.63961124420166, "global_step": 52143, "epoch": 310} {"train_loss": -8.301804542541504, "global_step": 52144, "epoch": 310} {"train_loss": -7.966322422027588, "global_step": 52145, "epoch": 310} {"train_loss": -8.440828323364258, "global_step": 52146, "epoch": 310} {"train_loss": -8.343117713928223, "global_step": 52147, "epoch": 310} {"train_loss": -8.264562606811523, "global_step": 52148, "epoch": 310} {"train_loss": -8.327926635742188, "global_step": 52149, "epoch": 310} {"train_loss": -8.599302291870117, "global_step": 52150, "epoch": 310} {"train_loss": -8.131474494934082, "global_step": 52151, "epoch": 310} {"train_loss": -8.120402336120605, "global_step": 52152, "epoch": 310} {"train_loss": -8.311765670776367, "global_step": 52153, "epoch": 310} {"train_loss": -8.345359802246094, "global_step": 52154, "epoch": 310} {"train_loss": -8.396622657775879, "global_step": 52155, "epoch": 310} {"train_loss": -8.546731948852539, "global_step": 52156, "epoch": 310} {"train_loss": -8.351262092590332, "global_step": 52157, "epoch": 310} {"train_loss": -8.512356758117676, "global_step": 52158, "epoch": 310} {"train_loss": -8.410754203796387, "global_step": 52159, "epoch": 310} {"train_loss": -8.45479679107666, "global_step": 52160, "epoch": 310} {"train_loss": -8.583209991455078, "global_step": 52161, "epoch": 310} {"train_loss": -8.420755386352539, "global_step": 52162, "epoch": 310} {"train_loss": -8.243467330932617, "global_step": 52163, "epoch": 310} {"train_loss": -8.576528549194336, "global_step": 52164, "epoch": 310} {"train_loss": -8.288925170898438, "global_step": 52165, "epoch": 310} {"train_loss": -8.646832466125488, "global_step": 52166, "epoch": 310} {"train_loss": -8.44342041015625, "global_step": 52167, "epoch": 310} {"train_loss": -8.49455451965332, "global_step": 52168, "epoch": 310} {"train_loss": -8.249513626098633, "global_step": 52169, "epoch": 310} {"train_loss": -8.595121383666992, "global_step": 52170, "epoch": 310} {"train_loss": -8.520830154418945, "global_step": 52171, "epoch": 310} {"train_loss": -8.612720489501953, "global_step": 52172, "epoch": 310} {"train_loss": -8.587915420532227, "global_step": 52173, "epoch": 310} {"train_loss": -8.484397888183594, "global_step": 52174, "epoch": 310} {"train_loss": -8.322457313537598, "global_step": 52175, "epoch": 310} {"train_loss": -8.480581283569336, "global_step": 52176, "epoch": 310} {"train_loss": -8.368739128112793, "global_step": 52177, "epoch": 310} {"train_loss": -8.228200912475586, "global_step": 52178, "epoch": 310} {"train_loss": -8.193117141723633, "global_step": 52179, "epoch": 310} {"train_loss": -8.391181945800781, "global_step": 52180, "epoch": 310} {"train_loss": -7.895937442779541, "global_step": 52181, "epoch": 310} {"train_loss": -8.332826614379883, "global_step": 52182, "epoch": 310} {"train_loss": -7.961477279663086, "global_step": 52183, "epoch": 310} {"train_loss": -7.935384750366211, "global_step": 52184, "epoch": 310} {"train_loss": -8.302268981933594, "global_step": 52185, "epoch": 310} {"train_loss": -7.941622734069824, "global_step": 52186, "epoch": 310} {"train_loss": -7.955112457275391, "global_step": 52187, "epoch": 310} {"train_loss": -8.226490020751953, "global_step": 52188, "epoch": 310} {"train_loss": -8.067419052124023, "global_step": 52189, "epoch": 310} {"train_loss": -8.449894905090332, "global_step": 52190, "epoch": 310} {"train_loss": -8.110407829284668, "global_step": 52191, "epoch": 310} {"train_loss": -8.144341468811035, "global_step": 52192, "epoch": 310} {"train_loss": -8.260533332824707, "global_step": 52193, "epoch": 310} {"train_loss": -8.209746360778809, "global_step": 52194, "epoch": 310} {"train_loss": -8.223928451538086, "global_step": 52195, "epoch": 310} {"train_loss": -8.074994087219238, "global_step": 52196, "epoch": 310} {"train_loss": -8.093835830688477, "global_step": 52197, "epoch": 310} {"train_loss": -8.229156494140625, "global_step": 52198, "epoch": 310} {"train_loss": -8.413601875305176, "global_step": 52199, "epoch": 310} {"train_loss": -8.337200164794922, "global_step": 52200, "epoch": 310} {"train_loss": -8.241632461547852, "global_step": 52201, "epoch": 310} {"train_loss": -8.280561447143555, "global_step": 52202, "epoch": 310} {"train_loss": -8.383440017700195, "global_step": 52203, "epoch": 310} {"train_loss": -8.233673095703125, "global_step": 52204, "epoch": 310} {"train_loss": -8.510164260864258, "global_step": 52205, "epoch": 310} {"train_loss": -8.301521301269531, "global_step": 52206, "epoch": 310} {"train_loss": -8.528812408447266, "global_step": 52207, "epoch": 310} {"train_loss": -8.535568237304688, "global_step": 52208, "epoch": 310} {"train_loss": -8.378059387207031, "global_step": 52209, "epoch": 310} {"train_loss": -8.332918167114258, "global_step": 52210, "epoch": 310} {"train_loss": -8.393621444702148, "global_step": 52211, "epoch": 310} {"train_loss": -8.523104667663574, "global_step": 52212, "epoch": 310} {"train_loss": -8.401662826538086, "global_step": 52213, "epoch": 310} {"train_loss": -8.49687385559082, "global_step": 52214, "epoch": 310} {"train_loss": -8.624349594116211, "global_step": 52215, "epoch": 310} {"train_loss": -8.647396087646484, "global_step": 52216, "epoch": 310} {"train_loss": -8.329004287719727, "global_step": 52217, "epoch": 310} {"train_loss": -8.577255249023438, "global_step": 52218, "epoch": 310} {"train_loss": -8.321879386901855, "global_step": 52219, "epoch": 310} {"train_loss": -8.718165397644043, "global_step": 52220, "epoch": 310} {"train_loss": -8.464859008789062, "global_step": 52221, "epoch": 310} {"train_loss": -8.210975646972656, "global_step": 52222, "epoch": 310} {"train_loss": -8.474185943603516, "global_step": 52223, "epoch": 310} {"train_loss": -8.038229942321777, "global_step": 52224, "epoch": 310} {"train_loss": -8.351058006286621, "global_step": 52225, "epoch": 310} {"train_loss": -8.167962074279785, "global_step": 52226, "epoch": 310} {"train_loss": -8.225212097167969, "global_step": 52227, "epoch": 310} {"train_loss": -8.051125526428223, "global_step": 52228, "epoch": 310} {"train_loss": -8.346193313598633, "global_step": 52229, "epoch": 310} {"train_loss": -8.181467056274414, "global_step": 52230, "epoch": 310} {"train_loss": -8.009393692016602, "global_step": 52231, "epoch": 310} {"train_loss": -8.319164276123047, "global_step": 52232, "epoch": 310} {"train_loss": -8.035581588745117, "global_step": 52233, "epoch": 310} {"train_loss": -8.168710708618164, "global_step": 52234, "epoch": 310} {"train_loss": -8.15247917175293, "global_step": 52235, "epoch": 310} {"train_loss": -8.038290023803711, "global_step": 52236, "epoch": 310} {"train_loss": -8.274099349975586, "global_step": 52237, "epoch": 310} {"train_loss": -8.22462272644043, "global_step": 52238, "epoch": 310} {"train_loss": -8.238012313842773, "global_step": 52239, "epoch": 310} {"train_loss": -8.333984375, "global_step": 52240, "epoch": 310} {"train_loss": -8.343345642089844, "global_step": 52241, "epoch": 310} {"train_loss": -8.275585174560547, "global_step": 52242, "epoch": 310} {"train_loss": -8.220634460449219, "global_step": 52243, "epoch": 310} {"train_loss": -8.54135799407959, "global_step": 52244, "epoch": 310} {"train_loss": -8.097275733947754, "global_step": 52245, "epoch": 310} {"train_loss": -8.44262409210205, "global_step": 52246, "epoch": 310} {"train_loss": -8.347232018198286, "global_step": 52247, "epoch": 310, "val_loss": 187864.8125, "train_action_mse_error": 8.54537296295166} {"train_loss": -8.4314603805542, "global_step": 52248, "epoch": 311} {"train_loss": -8.472328186035156, "global_step": 52249, "epoch": 311} {"train_loss": -8.373570442199707, "global_step": 52250, "epoch": 311} {"train_loss": -8.3491792678833, "global_step": 52251, "epoch": 311} {"train_loss": -8.552465438842773, "global_step": 52252, "epoch": 311} {"train_loss": -8.470512390136719, "global_step": 52253, "epoch": 311} {"train_loss": -8.599831581115723, "global_step": 52254, "epoch": 311} {"train_loss": -8.514749526977539, "global_step": 52255, "epoch": 311} {"train_loss": -8.577600479125977, "global_step": 52256, "epoch": 311} {"train_loss": -8.624191284179688, "global_step": 52257, "epoch": 311} {"train_loss": -8.674062728881836, "global_step": 52258, "epoch": 311} {"train_loss": -8.713092803955078, "global_step": 52259, "epoch": 311} {"train_loss": -8.682238578796387, "global_step": 52260, "epoch": 311} {"train_loss": -8.64095687866211, "global_step": 52261, "epoch": 311} {"train_loss": -8.581894874572754, "global_step": 52262, "epoch": 311} {"train_loss": -8.667778015136719, "global_step": 52263, "epoch": 311} {"train_loss": -8.461519241333008, "global_step": 52264, "epoch": 311} {"train_loss": -8.635173797607422, "global_step": 52265, "epoch": 311} {"train_loss": -8.554241180419922, "global_step": 52266, "epoch": 311} {"train_loss": -8.608747482299805, "global_step": 52267, "epoch": 311} {"train_loss": -8.547840118408203, "global_step": 52268, "epoch": 311} {"train_loss": -8.347663879394531, "global_step": 52269, "epoch": 311} {"train_loss": -8.724870681762695, "global_step": 52270, "epoch": 311} {"train_loss": -8.267881393432617, "global_step": 52271, "epoch": 311} {"train_loss": -8.175220489501953, "global_step": 52272, "epoch": 311} {"train_loss": -8.306140899658203, "global_step": 52273, "epoch": 311} {"train_loss": -8.477136611938477, "global_step": 52274, "epoch": 311} {"train_loss": -8.317047119140625, "global_step": 52275, "epoch": 311} {"train_loss": -8.044244766235352, "global_step": 52276, "epoch": 311} {"train_loss": -8.384185791015625, "global_step": 52277, "epoch": 311} {"train_loss": -8.15066909790039, "global_step": 52278, "epoch": 311} {"train_loss": -8.368609428405762, "global_step": 52279, "epoch": 311} {"train_loss": -8.531167984008789, "global_step": 52280, "epoch": 311} {"train_loss": -8.368095397949219, "global_step": 52281, "epoch": 311} {"train_loss": -8.4190673828125, "global_step": 52282, "epoch": 311} {"train_loss": -8.27924919128418, "global_step": 52283, "epoch": 311} {"train_loss": -8.262910842895508, "global_step": 52284, "epoch": 311} {"train_loss": -8.477436065673828, "global_step": 52285, "epoch": 311} {"train_loss": -8.22727108001709, "global_step": 52286, "epoch": 311} {"train_loss": -8.606457710266113, "global_step": 52287, "epoch": 311} {"train_loss": -8.199300765991211, "global_step": 52288, "epoch": 311} {"train_loss": -8.585816383361816, "global_step": 52289, "epoch": 311} {"train_loss": -8.46863079071045, "global_step": 52290, "epoch": 311} {"train_loss": -8.210079193115234, "global_step": 52291, "epoch": 311} {"train_loss": -8.18207836151123, "global_step": 52292, "epoch": 311} {"train_loss": -8.513547897338867, "global_step": 52293, "epoch": 311} {"train_loss": -8.504976272583008, "global_step": 52294, "epoch": 311} {"train_loss": -8.247641563415527, "global_step": 52295, "epoch": 311} {"train_loss": -8.216276168823242, "global_step": 52296, "epoch": 311} {"train_loss": -8.352832794189453, "global_step": 52297, "epoch": 311} {"train_loss": -8.289872169494629, "global_step": 52298, "epoch": 311} {"train_loss": -7.947410583496094, "global_step": 52299, "epoch": 311} {"train_loss": -8.407423973083496, "global_step": 52300, "epoch": 311} {"train_loss": -8.437573432922363, "global_step": 52301, "epoch": 311} {"train_loss": -8.490716934204102, "global_step": 52302, "epoch": 311} {"train_loss": -8.52126693725586, "global_step": 52303, "epoch": 311} {"train_loss": -8.568284034729004, "global_step": 52304, "epoch": 311} {"train_loss": -8.395527839660645, "global_step": 52305, "epoch": 311} {"train_loss": -8.095548629760742, "global_step": 52306, "epoch": 311} {"train_loss": -8.387060165405273, "global_step": 52307, "epoch": 311} {"train_loss": -8.438058853149414, "global_step": 52308, "epoch": 311} {"train_loss": -8.540729522705078, "global_step": 52309, "epoch": 311} {"train_loss": -8.522483825683594, "global_step": 52310, "epoch": 311} {"train_loss": -8.453991889953613, "global_step": 52311, "epoch": 311} {"train_loss": -8.454269409179688, "global_step": 52312, "epoch": 311} {"train_loss": -8.230257034301758, "global_step": 52313, "epoch": 311} {"train_loss": -8.008526802062988, "global_step": 52314, "epoch": 311} {"train_loss": -8.411242485046387, "global_step": 52315, "epoch": 311} {"train_loss": -8.199271202087402, "global_step": 52316, "epoch": 311} {"train_loss": -8.250441551208496, "global_step": 52317, "epoch": 311} {"train_loss": -8.00872802734375, "global_step": 52318, "epoch": 311} {"train_loss": -8.449094772338867, "global_step": 52319, "epoch": 311} {"train_loss": -8.242688179016113, "global_step": 52320, "epoch": 311} {"train_loss": -8.329580307006836, "global_step": 52321, "epoch": 311} {"train_loss": -8.459470748901367, "global_step": 52322, "epoch": 311} {"train_loss": -8.506125450134277, "global_step": 52323, "epoch": 311} {"train_loss": -8.2466402053833, "global_step": 52324, "epoch": 311} {"train_loss": -8.70423412322998, "global_step": 52325, "epoch": 311} {"train_loss": -8.318670272827148, "global_step": 52326, "epoch": 311} {"train_loss": -8.303986549377441, "global_step": 52327, "epoch": 311} {"train_loss": -8.248729705810547, "global_step": 52328, "epoch": 311} {"train_loss": -8.561300277709961, "global_step": 52329, "epoch": 311} {"train_loss": -8.168235778808594, "global_step": 52330, "epoch": 311} {"train_loss": -8.562864303588867, "global_step": 52331, "epoch": 311} {"train_loss": -8.481317520141602, "global_step": 52332, "epoch": 311} {"train_loss": -8.514052391052246, "global_step": 52333, "epoch": 311} {"train_loss": -8.584972381591797, "global_step": 52334, "epoch": 311} {"train_loss": -8.439630508422852, "global_step": 52335, "epoch": 311} {"train_loss": -8.343509674072266, "global_step": 52336, "epoch": 311} {"train_loss": -7.965265274047852, "global_step": 52337, "epoch": 311} {"train_loss": -8.456165313720703, "global_step": 52338, "epoch": 311} {"train_loss": -7.965121269226074, "global_step": 52339, "epoch": 311} {"train_loss": -8.227627754211426, "global_step": 52340, "epoch": 311} {"train_loss": -8.148191452026367, "global_step": 52341, "epoch": 311} {"train_loss": -8.268024444580078, "global_step": 52342, "epoch": 311} {"train_loss": -8.0282564163208, "global_step": 52343, "epoch": 311} {"train_loss": -8.398558616638184, "global_step": 52344, "epoch": 311} {"train_loss": -8.430509567260742, "global_step": 52345, "epoch": 311} {"train_loss": -8.106998443603516, "global_step": 52346, "epoch": 311} {"train_loss": -8.332357406616211, "global_step": 52347, "epoch": 311} {"train_loss": -8.203031539916992, "global_step": 52348, "epoch": 311} {"train_loss": -8.188852310180664, "global_step": 52349, "epoch": 311} {"train_loss": -8.347661972045898, "global_step": 52350, "epoch": 311} {"train_loss": -8.240227699279785, "global_step": 52351, "epoch": 311} {"train_loss": -8.13209342956543, "global_step": 52352, "epoch": 311} {"train_loss": -8.427919387817383, "global_step": 52353, "epoch": 311} {"train_loss": -8.392602920532227, "global_step": 52354, "epoch": 311} {"train_loss": -8.295906066894531, "global_step": 52355, "epoch": 311} {"train_loss": -8.362773895263672, "global_step": 52356, "epoch": 311} {"train_loss": -8.297035217285156, "global_step": 52357, "epoch": 311} {"train_loss": -8.364981651306152, "global_step": 52358, "epoch": 311} {"train_loss": -8.379232406616211, "global_step": 52359, "epoch": 311} {"train_loss": -8.41423225402832, "global_step": 52360, "epoch": 311} {"train_loss": -8.522378921508789, "global_step": 52361, "epoch": 311} {"train_loss": -8.528390884399414, "global_step": 52362, "epoch": 311} {"train_loss": -8.759820938110352, "global_step": 52363, "epoch": 311} {"train_loss": -8.344188690185547, "global_step": 52364, "epoch": 311} {"train_loss": -8.441227912902832, "global_step": 52365, "epoch": 311} {"train_loss": -8.411169052124023, "global_step": 52366, "epoch": 311} {"train_loss": -8.52824592590332, "global_step": 52367, "epoch": 311} {"train_loss": -8.338415145874023, "global_step": 52368, "epoch": 311} {"train_loss": -8.528862953186035, "global_step": 52369, "epoch": 311} {"train_loss": -8.275897026062012, "global_step": 52370, "epoch": 311} {"train_loss": -8.638689041137695, "global_step": 52371, "epoch": 311} {"train_loss": -8.181266784667969, "global_step": 52372, "epoch": 311} {"train_loss": -8.29050064086914, "global_step": 52373, "epoch": 311} {"train_loss": -8.430194854736328, "global_step": 52374, "epoch": 311} {"train_loss": -8.467777252197266, "global_step": 52375, "epoch": 311} {"train_loss": -8.589613914489746, "global_step": 52376, "epoch": 311} {"train_loss": -8.431966781616211, "global_step": 52377, "epoch": 311} {"train_loss": -8.631711959838867, "global_step": 52378, "epoch": 311} {"train_loss": -8.42593765258789, "global_step": 52379, "epoch": 311} {"train_loss": -8.598722457885742, "global_step": 52380, "epoch": 311} {"train_loss": -8.591229438781738, "global_step": 52381, "epoch": 311} {"train_loss": -8.451823234558105, "global_step": 52382, "epoch": 311} {"train_loss": -8.371508598327637, "global_step": 52383, "epoch": 311} {"train_loss": -8.421624183654785, "global_step": 52384, "epoch": 311} {"train_loss": -8.406940460205078, "global_step": 52385, "epoch": 311} {"train_loss": -8.340936660766602, "global_step": 52386, "epoch": 311} {"train_loss": -8.358859062194824, "global_step": 52387, "epoch": 311} {"train_loss": -8.426165580749512, "global_step": 52388, "epoch": 311} {"train_loss": -8.523833274841309, "global_step": 52389, "epoch": 311} {"train_loss": -8.400838851928711, "global_step": 52390, "epoch": 311} {"train_loss": -8.32148551940918, "global_step": 52391, "epoch": 311} {"train_loss": -8.323420524597168, "global_step": 52392, "epoch": 311} {"train_loss": -8.162858963012695, "global_step": 52393, "epoch": 311} {"train_loss": -8.16980266571045, "global_step": 52394, "epoch": 311} {"train_loss": -8.44943618774414, "global_step": 52395, "epoch": 311} {"train_loss": -8.295306205749512, "global_step": 52396, "epoch": 311} {"train_loss": -8.201403617858887, "global_step": 52397, "epoch": 311} {"train_loss": -8.153605461120605, "global_step": 52398, "epoch": 311} {"train_loss": -8.04479694366455, "global_step": 52399, "epoch": 311} {"train_loss": -8.381083488464355, "global_step": 52400, "epoch": 311} {"train_loss": -7.973689079284668, "global_step": 52401, "epoch": 311} {"train_loss": -8.198688507080078, "global_step": 52402, "epoch": 311} {"train_loss": -8.160245895385742, "global_step": 52403, "epoch": 311} {"train_loss": -7.90753173828125, "global_step": 52404, "epoch": 311} {"train_loss": -8.255961418151855, "global_step": 52405, "epoch": 311} {"train_loss": -8.296853065490723, "global_step": 52406, "epoch": 311} {"train_loss": -7.926736354827881, "global_step": 52407, "epoch": 311} {"train_loss": -8.229057312011719, "global_step": 52408, "epoch": 311} {"train_loss": -8.30449104309082, "global_step": 52409, "epoch": 311} {"train_loss": -8.065195083618164, "global_step": 52410, "epoch": 311} {"train_loss": -8.187175750732422, "global_step": 52411, "epoch": 311} {"train_loss": -8.238723754882812, "global_step": 52412, "epoch": 311} {"train_loss": -8.1476469039917, "global_step": 52413, "epoch": 311} {"train_loss": -8.485669136047363, "global_step": 52414, "epoch": 311} {"train_loss": -8.36772477342969, "global_step": 52415, "epoch": 311, "val_loss": 187058.78125} {"train_loss": -8.313407897949219, "global_step": 52416, "epoch": 312} {"train_loss": -8.237693786621094, "global_step": 52417, "epoch": 312} {"train_loss": -8.362217903137207, "global_step": 52418, "epoch": 312} {"train_loss": -8.416462898254395, "global_step": 52419, "epoch": 312} {"train_loss": -8.442441940307617, "global_step": 52420, "epoch": 312} {"train_loss": -8.33627986907959, "global_step": 52421, "epoch": 312} {"train_loss": -8.439190864562988, "global_step": 52422, "epoch": 312} {"train_loss": -8.464056015014648, "global_step": 52423, "epoch": 312} {"train_loss": -8.420940399169922, "global_step": 52424, "epoch": 312} {"train_loss": -8.361370086669922, "global_step": 52425, "epoch": 312} {"train_loss": -8.561210632324219, "global_step": 52426, "epoch": 312} {"train_loss": -8.499305725097656, "global_step": 52427, "epoch": 312} {"train_loss": -8.312994003295898, "global_step": 52428, "epoch": 312} {"train_loss": -8.416608810424805, "global_step": 52429, "epoch": 312} {"train_loss": -8.253740310668945, "global_step": 52430, "epoch": 312} {"train_loss": -8.4656982421875, "global_step": 52431, "epoch": 312} {"train_loss": -8.601880073547363, "global_step": 52432, "epoch": 312} {"train_loss": -8.645593643188477, "global_step": 52433, "epoch": 312} {"train_loss": -8.482135772705078, "global_step": 52434, "epoch": 312} {"train_loss": -8.668791770935059, "global_step": 52435, "epoch": 312} {"train_loss": -8.638553619384766, "global_step": 52436, "epoch": 312} {"train_loss": -8.689619064331055, "global_step": 52437, "epoch": 312} {"train_loss": -8.52400016784668, "global_step": 52438, "epoch": 312} {"train_loss": -8.633132934570312, "global_step": 52439, "epoch": 312} {"train_loss": -8.430997848510742, "global_step": 52440, "epoch": 312} {"train_loss": -8.316913604736328, "global_step": 52441, "epoch": 312} {"train_loss": -8.428750038146973, "global_step": 52442, "epoch": 312} {"train_loss": -8.182241439819336, "global_step": 52443, "epoch": 312} {"train_loss": -8.459498405456543, "global_step": 52444, "epoch": 312} {"train_loss": -8.378026962280273, "global_step": 52445, "epoch": 312} {"train_loss": -8.472412109375, "global_step": 52446, "epoch": 312} {"train_loss": -8.374959945678711, "global_step": 52447, "epoch": 312} {"train_loss": -8.697230339050293, "global_step": 52448, "epoch": 312} {"train_loss": -8.560209274291992, "global_step": 52449, "epoch": 312} {"train_loss": -8.348051071166992, "global_step": 52450, "epoch": 312} {"train_loss": -8.65597915649414, "global_step": 52451, "epoch": 312} {"train_loss": -8.391560554504395, "global_step": 52452, "epoch": 312} {"train_loss": -8.458236694335938, "global_step": 52453, "epoch": 312} {"train_loss": -8.574460983276367, "global_step": 52454, "epoch": 312} {"train_loss": -8.285015106201172, "global_step": 52455, "epoch": 312} {"train_loss": -8.203323364257812, "global_step": 52456, "epoch": 312} {"train_loss": -8.262292861938477, "global_step": 52457, "epoch": 312} {"train_loss": -8.388681411743164, "global_step": 52458, "epoch": 312} {"train_loss": -8.545265197753906, "global_step": 52459, "epoch": 312} {"train_loss": -8.466939926147461, "global_step": 52460, "epoch": 312} {"train_loss": -8.534239768981934, "global_step": 52461, "epoch": 312} {"train_loss": -8.391408920288086, "global_step": 52462, "epoch": 312} {"train_loss": -8.561307907104492, "global_step": 52463, "epoch": 312} {"train_loss": -8.681211471557617, "global_step": 52464, "epoch": 312} {"train_loss": -8.46975326538086, "global_step": 52465, "epoch": 312} {"train_loss": -8.207823753356934, "global_step": 52466, "epoch": 312} {"train_loss": -8.426931381225586, "global_step": 52467, "epoch": 312} {"train_loss": -8.578056335449219, "global_step": 52468, "epoch": 312} {"train_loss": -8.556099891662598, "global_step": 52469, "epoch": 312} {"train_loss": -8.670585632324219, "global_step": 52470, "epoch": 312} {"train_loss": -8.1643705368042, "global_step": 52471, "epoch": 312} {"train_loss": -8.322446823120117, "global_step": 52472, "epoch": 312} {"train_loss": -8.316730499267578, "global_step": 52473, "epoch": 312} {"train_loss": -8.298497200012207, "global_step": 52474, "epoch": 312} {"train_loss": -8.373805046081543, "global_step": 52475, "epoch": 312} {"train_loss": -8.485580444335938, "global_step": 52476, "epoch": 312} {"train_loss": -8.28679084777832, "global_step": 52477, "epoch": 312} {"train_loss": -8.421950340270996, "global_step": 52478, "epoch": 312} {"train_loss": -8.697161674499512, "global_step": 52479, "epoch": 312} {"train_loss": -8.272919654846191, "global_step": 52480, "epoch": 312} {"train_loss": -8.63907241821289, "global_step": 52481, "epoch": 312} {"train_loss": -8.452115058898926, "global_step": 52482, "epoch": 312} {"train_loss": -8.200538635253906, "global_step": 52483, "epoch": 312} {"train_loss": -8.405850410461426, "global_step": 52484, "epoch": 312} {"train_loss": -8.543487548828125, "global_step": 52485, "epoch": 312} {"train_loss": -8.489891052246094, "global_step": 52486, "epoch": 312} {"train_loss": -8.590785026550293, "global_step": 52487, "epoch": 312} {"train_loss": -8.376182556152344, "global_step": 52488, "epoch": 312} {"train_loss": -8.387995719909668, "global_step": 52489, "epoch": 312} {"train_loss": -8.528844833374023, "global_step": 52490, "epoch": 312} {"train_loss": -8.46356201171875, "global_step": 52491, "epoch": 312} {"train_loss": -8.476312637329102, "global_step": 52492, "epoch": 312} {"train_loss": -8.640417098999023, "global_step": 52493, "epoch": 312} {"train_loss": -8.608198165893555, "global_step": 52494, "epoch": 312} {"train_loss": -8.397096633911133, "global_step": 52495, "epoch": 312} {"train_loss": -8.444416046142578, "global_step": 52496, "epoch": 312} {"train_loss": -8.717292785644531, "global_step": 52497, "epoch": 312} {"train_loss": -8.551162719726562, "global_step": 52498, "epoch": 312} {"train_loss": -8.51323127746582, "global_step": 52499, "epoch": 312} {"train_loss": -8.557404518127441, "global_step": 52500, "epoch": 312} {"train_loss": -8.544376373291016, "global_step": 52501, "epoch": 312} {"train_loss": -8.247784614562988, "global_step": 52502, "epoch": 312} {"train_loss": -8.290632247924805, "global_step": 52503, "epoch": 312} {"train_loss": -8.507131576538086, "global_step": 52504, "epoch": 312} {"train_loss": -8.477267265319824, "global_step": 52505, "epoch": 312} {"train_loss": -8.345832824707031, "global_step": 52506, "epoch": 312} {"train_loss": -8.480284690856934, "global_step": 52507, "epoch": 312} {"train_loss": -8.215474128723145, "global_step": 52508, "epoch": 312} {"train_loss": -8.270405769348145, "global_step": 52509, "epoch": 312} {"train_loss": -8.736373901367188, "global_step": 52510, "epoch": 312} {"train_loss": -8.471445083618164, "global_step": 52511, "epoch": 312} {"train_loss": -8.409072875976562, "global_step": 52512, "epoch": 312} {"train_loss": -8.434551239013672, "global_step": 52513, "epoch": 312} {"train_loss": -8.33578109741211, "global_step": 52514, "epoch": 312} {"train_loss": -8.457836151123047, "global_step": 52515, "epoch": 312} {"train_loss": -8.355884552001953, "global_step": 52516, "epoch": 312} {"train_loss": -8.663726806640625, "global_step": 52517, "epoch": 312} {"train_loss": -8.394713401794434, "global_step": 52518, "epoch": 312} {"train_loss": -8.275965690612793, "global_step": 52519, "epoch": 312} {"train_loss": -8.30176830291748, "global_step": 52520, "epoch": 312} {"train_loss": -8.54853630065918, "global_step": 52521, "epoch": 312} {"train_loss": -8.727763175964355, "global_step": 52522, "epoch": 312} {"train_loss": -8.216840744018555, "global_step": 52523, "epoch": 312} {"train_loss": -8.565046310424805, "global_step": 52524, "epoch": 312} {"train_loss": -8.543978691101074, "global_step": 52525, "epoch": 312} {"train_loss": -8.483222961425781, "global_step": 52526, "epoch": 312} {"train_loss": -8.415844917297363, "global_step": 52527, "epoch": 312} {"train_loss": -8.313875198364258, "global_step": 52528, "epoch": 312} {"train_loss": -8.349372863769531, "global_step": 52529, "epoch": 312} {"train_loss": -8.081811904907227, "global_step": 52530, "epoch": 312} {"train_loss": -8.556640625, "global_step": 52531, "epoch": 312} {"train_loss": -7.41276741027832, "global_step": 52532, "epoch": 312} {"train_loss": -8.252591133117676, "global_step": 52533, "epoch": 312} {"train_loss": -8.181052207946777, "global_step": 52534, "epoch": 312} {"train_loss": -8.274490356445312, "global_step": 52535, "epoch": 312} {"train_loss": -8.053441047668457, "global_step": 52536, "epoch": 312} {"train_loss": -7.993879318237305, "global_step": 52537, "epoch": 312} {"train_loss": -8.147196769714355, "global_step": 52538, "epoch": 312} {"train_loss": -8.081198692321777, "global_step": 52539, "epoch": 312} {"train_loss": -8.213972091674805, "global_step": 52540, "epoch": 312} {"train_loss": -8.004307746887207, "global_step": 52541, "epoch": 312} {"train_loss": -8.282605171203613, "global_step": 52542, "epoch": 312} {"train_loss": -7.927254676818848, "global_step": 52543, "epoch": 312} {"train_loss": -8.188544273376465, "global_step": 52544, "epoch": 312} {"train_loss": -8.254871368408203, "global_step": 52545, "epoch": 312} {"train_loss": -8.295108795166016, "global_step": 52546, "epoch": 312} {"train_loss": -8.434066772460938, "global_step": 52547, "epoch": 312} {"train_loss": -8.236536026000977, "global_step": 52548, "epoch": 312} {"train_loss": -8.420114517211914, "global_step": 52549, "epoch": 312} {"train_loss": -8.355010986328125, "global_step": 52550, "epoch": 312} {"train_loss": -8.417287826538086, "global_step": 52551, "epoch": 312} {"train_loss": -8.345168113708496, "global_step": 52552, "epoch": 312} {"train_loss": -8.505971908569336, "global_step": 52553, "epoch": 312} {"train_loss": -8.295696258544922, "global_step": 52554, "epoch": 312} {"train_loss": -8.46310043334961, "global_step": 52555, "epoch": 312} {"train_loss": -8.519241333007812, "global_step": 52556, "epoch": 312} {"train_loss": -8.655776023864746, "global_step": 52557, "epoch": 312} {"train_loss": -8.567885398864746, "global_step": 52558, "epoch": 312} {"train_loss": -8.448204040527344, "global_step": 52559, "epoch": 312} {"train_loss": -8.545599937438965, "global_step": 52560, "epoch": 312} {"train_loss": -8.503217697143555, "global_step": 52561, "epoch": 312} {"train_loss": -8.275644302368164, "global_step": 52562, "epoch": 312} {"train_loss": -8.440023422241211, "global_step": 52563, "epoch": 312} {"train_loss": -8.363924026489258, "global_step": 52564, "epoch": 312} {"train_loss": -7.967452526092529, "global_step": 52565, "epoch": 312} {"train_loss": -8.419000625610352, "global_step": 52566, "epoch": 312} {"train_loss": -8.38180160522461, "global_step": 52567, "epoch": 312} {"train_loss": -8.138866424560547, "global_step": 52568, "epoch": 312} {"train_loss": -7.978075981140137, "global_step": 52569, "epoch": 312} {"train_loss": -8.54843521118164, "global_step": 52570, "epoch": 312} {"train_loss": -7.652266502380371, "global_step": 52571, "epoch": 312} {"train_loss": -8.161245346069336, "global_step": 52572, "epoch": 312} {"train_loss": -7.7855939865112305, "global_step": 52573, "epoch": 312} {"train_loss": -8.07592487335205, "global_step": 52574, "epoch": 312} {"train_loss": -7.8384294509887695, "global_step": 52575, "epoch": 312} {"train_loss": -8.009725570678711, "global_step": 52576, "epoch": 312} {"train_loss": -8.211366653442383, "global_step": 52577, "epoch": 312} {"train_loss": -8.179376602172852, "global_step": 52578, "epoch": 312} {"train_loss": -8.23916244506836, "global_step": 52579, "epoch": 312} {"train_loss": -7.9979352951049805, "global_step": 52580, "epoch": 312} {"train_loss": -8.13037109375, "global_step": 52581, "epoch": 312} {"train_loss": -8.301104545593262, "global_step": 52582, "epoch": 312} {"train_loss": -8.37671824012484, "global_step": 52583, "epoch": 312, "val_loss": 190782.421875} {"train_loss": -8.241643905639648, "global_step": 52584, "epoch": 313} {"train_loss": -8.344345092773438, "global_step": 52585, "epoch": 313} {"train_loss": -8.295124053955078, "global_step": 52586, "epoch": 313} {"train_loss": -8.24872875213623, "global_step": 52587, "epoch": 313} {"train_loss": -8.237499237060547, "global_step": 52588, "epoch": 313} {"train_loss": -8.330941200256348, "global_step": 52589, "epoch": 313} {"train_loss": -8.358028411865234, "global_step": 52590, "epoch": 313} {"train_loss": -8.342903137207031, "global_step": 52591, "epoch": 313} {"train_loss": -8.466233253479004, "global_step": 52592, "epoch": 313} {"train_loss": -8.39284610748291, "global_step": 52593, "epoch": 313} {"train_loss": -8.362457275390625, "global_step": 52594, "epoch": 313} {"train_loss": -8.16134262084961, "global_step": 52595, "epoch": 313} {"train_loss": -8.421466827392578, "global_step": 52596, "epoch": 313} {"train_loss": -8.368707656860352, "global_step": 52597, "epoch": 313} {"train_loss": -8.525745391845703, "global_step": 52598, "epoch": 313} {"train_loss": -8.352239608764648, "global_step": 52599, "epoch": 313} {"train_loss": -8.575302124023438, "global_step": 52600, "epoch": 313} {"train_loss": -8.291688919067383, "global_step": 52601, "epoch": 313} {"train_loss": -8.36282730102539, "global_step": 52602, "epoch": 313} {"train_loss": -8.210224151611328, "global_step": 52603, "epoch": 313} {"train_loss": -8.374034881591797, "global_step": 52604, "epoch": 313} {"train_loss": -8.065317153930664, "global_step": 52605, "epoch": 313} {"train_loss": -8.197219848632812, "global_step": 52606, "epoch": 313} {"train_loss": -7.7669148445129395, "global_step": 52607, "epoch": 313} {"train_loss": -8.314070701599121, "global_step": 52608, "epoch": 313} {"train_loss": -8.271931648254395, "global_step": 52609, "epoch": 313} {"train_loss": -8.334463119506836, "global_step": 52610, "epoch": 313} {"train_loss": -8.063837051391602, "global_step": 52611, "epoch": 313} {"train_loss": -8.33883285522461, "global_step": 52612, "epoch": 313} {"train_loss": -8.326007843017578, "global_step": 52613, "epoch": 313} {"train_loss": -8.430458068847656, "global_step": 52614, "epoch": 313} {"train_loss": -8.421217918395996, "global_step": 52615, "epoch": 313} {"train_loss": -8.329452514648438, "global_step": 52616, "epoch": 313} {"train_loss": -8.34338092803955, "global_step": 52617, "epoch": 313} {"train_loss": -8.182526588439941, "global_step": 52618, "epoch": 313} {"train_loss": -8.244274139404297, "global_step": 52619, "epoch": 313} {"train_loss": -8.253752708435059, "global_step": 52620, "epoch": 313} {"train_loss": -8.474872589111328, "global_step": 52621, "epoch": 313} {"train_loss": -8.30982494354248, "global_step": 52622, "epoch": 313} {"train_loss": -8.375709533691406, "global_step": 52623, "epoch": 313} {"train_loss": -8.48371696472168, "global_step": 52624, "epoch": 313} {"train_loss": -8.473771095275879, "global_step": 52625, "epoch": 313} {"train_loss": -8.470661163330078, "global_step": 52626, "epoch": 313} {"train_loss": -8.379365921020508, "global_step": 52627, "epoch": 313} {"train_loss": -8.441364288330078, "global_step": 52628, "epoch": 313} {"train_loss": -8.414798736572266, "global_step": 52629, "epoch": 313} {"train_loss": -8.118462562561035, "global_step": 52630, "epoch": 313} {"train_loss": -8.34377670288086, "global_step": 52631, "epoch": 313} {"train_loss": -8.39599609375, "global_step": 52632, "epoch": 313} {"train_loss": -8.477235794067383, "global_step": 52633, "epoch": 313} {"train_loss": -8.347043991088867, "global_step": 52634, "epoch": 313} {"train_loss": -8.508682250976562, "global_step": 52635, "epoch": 313} {"train_loss": -8.476287841796875, "global_step": 52636, "epoch": 313} {"train_loss": -8.067286491394043, "global_step": 52637, "epoch": 313} {"train_loss": -8.39858341217041, "global_step": 52638, "epoch": 313} {"train_loss": -8.514341354370117, "global_step": 52639, "epoch": 313} {"train_loss": -8.340829849243164, "global_step": 52640, "epoch": 313} {"train_loss": -8.267691612243652, "global_step": 52641, "epoch": 313} {"train_loss": -8.446969985961914, "global_step": 52642, "epoch": 313} {"train_loss": -8.308061599731445, "global_step": 52643, "epoch": 313} {"train_loss": -8.437737464904785, "global_step": 52644, "epoch": 313} {"train_loss": -8.482430458068848, "global_step": 52645, "epoch": 313} {"train_loss": -8.317748069763184, "global_step": 52646, "epoch": 313} {"train_loss": -8.374974250793457, "global_step": 52647, "epoch": 313} {"train_loss": -8.529123306274414, "global_step": 52648, "epoch": 313} {"train_loss": -8.63452434539795, "global_step": 52649, "epoch": 313} {"train_loss": -8.40998649597168, "global_step": 52650, "epoch": 313} {"train_loss": -8.412627220153809, "global_step": 52651, "epoch": 313} {"train_loss": -8.814350128173828, "global_step": 52652, "epoch": 313} {"train_loss": -8.03283977508545, "global_step": 52653, "epoch": 313} {"train_loss": -8.132110595703125, "global_step": 52654, "epoch": 313} {"train_loss": -8.362266540527344, "global_step": 52655, "epoch": 313} {"train_loss": -8.416777610778809, "global_step": 52656, "epoch": 313} {"train_loss": -8.223278045654297, "global_step": 52657, "epoch": 313} {"train_loss": -8.222695350646973, "global_step": 52658, "epoch": 313} {"train_loss": -8.354506492614746, "global_step": 52659, "epoch": 313} {"train_loss": -8.015481948852539, "global_step": 52660, "epoch": 313} {"train_loss": -8.057732582092285, "global_step": 52661, "epoch": 313} {"train_loss": -8.16800594329834, "global_step": 52662, "epoch": 313} {"train_loss": -8.133965492248535, "global_step": 52663, "epoch": 313} {"train_loss": -7.9717888832092285, "global_step": 52664, "epoch": 313} {"train_loss": -7.919232368469238, "global_step": 52665, "epoch": 313} {"train_loss": -8.127410888671875, "global_step": 52666, "epoch": 313} {"train_loss": -8.371339797973633, "global_step": 52667, "epoch": 313} {"train_loss": -8.078933715820312, "global_step": 52668, "epoch": 313} {"train_loss": -8.05418586730957, "global_step": 52669, "epoch": 313} {"train_loss": -7.980404376983643, "global_step": 52670, "epoch": 313} {"train_loss": -8.05972671508789, "global_step": 52671, "epoch": 313} {"train_loss": -8.034607887268066, "global_step": 52672, "epoch": 313} {"train_loss": -8.236391067504883, "global_step": 52673, "epoch": 313} {"train_loss": -8.430355072021484, "global_step": 52674, "epoch": 313} {"train_loss": -8.247346878051758, "global_step": 52675, "epoch": 313} {"train_loss": -8.208003997802734, "global_step": 52676, "epoch": 313} {"train_loss": -8.401761054992676, "global_step": 52677, "epoch": 313} {"train_loss": -8.355728149414062, "global_step": 52678, "epoch": 313} {"train_loss": -8.288378715515137, "global_step": 52679, "epoch": 313} {"train_loss": -8.380189895629883, "global_step": 52680, "epoch": 313} {"train_loss": -8.317161560058594, "global_step": 52681, "epoch": 313} {"train_loss": -8.366150856018066, "global_step": 52682, "epoch": 313} {"train_loss": -8.449522972106934, "global_step": 52683, "epoch": 313} {"train_loss": -8.474895477294922, "global_step": 52684, "epoch": 313} {"train_loss": -8.415109634399414, "global_step": 52685, "epoch": 313} {"train_loss": -8.42040729522705, "global_step": 52686, "epoch": 313} {"train_loss": -8.470006942749023, "global_step": 52687, "epoch": 313} {"train_loss": -8.356136322021484, "global_step": 52688, "epoch": 313} {"train_loss": -8.332870483398438, "global_step": 52689, "epoch": 313} {"train_loss": -8.224505424499512, "global_step": 52690, "epoch": 313} {"train_loss": -8.123459815979004, "global_step": 52691, "epoch": 313} {"train_loss": -8.358116149902344, "global_step": 52692, "epoch": 313} {"train_loss": -8.186868667602539, "global_step": 52693, "epoch": 313} {"train_loss": -8.221040725708008, "global_step": 52694, "epoch": 313} {"train_loss": -8.400415420532227, "global_step": 52695, "epoch": 313} {"train_loss": -8.314382553100586, "global_step": 52696, "epoch": 313} {"train_loss": -8.277917861938477, "global_step": 52697, "epoch": 313} {"train_loss": -8.420785903930664, "global_step": 52698, "epoch": 313} {"train_loss": -8.626140594482422, "global_step": 52699, "epoch": 313} {"train_loss": -8.420886039733887, "global_step": 52700, "epoch": 313} {"train_loss": -8.325128555297852, "global_step": 52701, "epoch": 313} {"train_loss": -8.455655097961426, "global_step": 52702, "epoch": 313} {"train_loss": -8.293900489807129, "global_step": 52703, "epoch": 313} {"train_loss": -8.638690948486328, "global_step": 52704, "epoch": 313} {"train_loss": -8.452978134155273, "global_step": 52705, "epoch": 313} {"train_loss": -8.615558624267578, "global_step": 52706, "epoch": 313} {"train_loss": -8.269853591918945, "global_step": 52707, "epoch": 313} {"train_loss": -8.240702629089355, "global_step": 52708, "epoch": 313} {"train_loss": -8.489228248596191, "global_step": 52709, "epoch": 313} {"train_loss": -8.313535690307617, "global_step": 52710, "epoch": 313} {"train_loss": -8.447187423706055, "global_step": 52711, "epoch": 313} {"train_loss": -8.33735179901123, "global_step": 52712, "epoch": 313} {"train_loss": -8.511109352111816, "global_step": 52713, "epoch": 313} {"train_loss": -8.625104904174805, "global_step": 52714, "epoch": 313} {"train_loss": -8.46422004699707, "global_step": 52715, "epoch": 313} {"train_loss": -8.366880416870117, "global_step": 52716, "epoch": 313} {"train_loss": -8.525390625, "global_step": 52717, "epoch": 313} {"train_loss": -8.442387580871582, "global_step": 52718, "epoch": 313} {"train_loss": -8.535796165466309, "global_step": 52719, "epoch": 313} {"train_loss": -8.638971328735352, "global_step": 52720, "epoch": 313} {"train_loss": -8.289304733276367, "global_step": 52721, "epoch": 313} {"train_loss": -8.611833572387695, "global_step": 52722, "epoch": 313} {"train_loss": -8.541559219360352, "global_step": 52723, "epoch": 313} {"train_loss": -8.356473922729492, "global_step": 52724, "epoch": 313} {"train_loss": -8.409156799316406, "global_step": 52725, "epoch": 313} {"train_loss": -8.646313667297363, "global_step": 52726, "epoch": 313} {"train_loss": -8.604976654052734, "global_step": 52727, "epoch": 313} {"train_loss": -8.609817504882812, "global_step": 52728, "epoch": 313} {"train_loss": -8.473608016967773, "global_step": 52729, "epoch": 313} {"train_loss": -8.411859512329102, "global_step": 52730, "epoch": 313} {"train_loss": -8.484602928161621, "global_step": 52731, "epoch": 313} {"train_loss": -8.506372451782227, "global_step": 52732, "epoch": 313} {"train_loss": -8.515140533447266, "global_step": 52733, "epoch": 313} {"train_loss": -8.669673919677734, "global_step": 52734, "epoch": 313} {"train_loss": -8.533679962158203, "global_step": 52735, "epoch": 313} {"train_loss": -8.755555152893066, "global_step": 52736, "epoch": 313} {"train_loss": -8.630937576293945, "global_step": 52737, "epoch": 313} {"train_loss": -8.206421852111816, "global_step": 52738, "epoch": 313} {"train_loss": -8.597204208374023, "global_step": 52739, "epoch": 313} {"train_loss": -8.51746940612793, "global_step": 52740, "epoch": 313} {"train_loss": -8.441405296325684, "global_step": 52741, "epoch": 313} {"train_loss": -8.263174057006836, "global_step": 52742, "epoch": 313} {"train_loss": -8.358097076416016, "global_step": 52743, "epoch": 313} {"train_loss": -8.497629165649414, "global_step": 52744, "epoch": 313} {"train_loss": -8.350786209106445, "global_step": 52745, "epoch": 313} {"train_loss": -8.418405532836914, "global_step": 52746, "epoch": 313} {"train_loss": -8.509231567382812, "global_step": 52747, "epoch": 313} {"train_loss": -8.342913627624512, "global_step": 52748, "epoch": 313} {"train_loss": -8.629104614257812, "global_step": 52749, "epoch": 313} {"train_loss": -8.5234956741333, "global_step": 52750, "epoch": 313} {"train_loss": -8.363257183915092, "global_step": 52751, "epoch": 313, "val_loss": 188429.6875} {"train_loss": -8.386686325073242, "global_step": 52752, "epoch": 314} {"train_loss": -8.216461181640625, "global_step": 52753, "epoch": 314} {"train_loss": -8.296697616577148, "global_step": 52754, "epoch": 314} {"train_loss": -8.54083251953125, "global_step": 52755, "epoch": 314} {"train_loss": -8.348673820495605, "global_step": 52756, "epoch": 314} {"train_loss": -8.483247756958008, "global_step": 52757, "epoch": 314} {"train_loss": -8.31657600402832, "global_step": 52758, "epoch": 314} {"train_loss": -8.367767333984375, "global_step": 52759, "epoch": 314} {"train_loss": -8.416313171386719, "global_step": 52760, "epoch": 314} {"train_loss": -8.222663879394531, "global_step": 52761, "epoch": 314} {"train_loss": -8.100135803222656, "global_step": 52762, "epoch": 314} {"train_loss": -8.087787628173828, "global_step": 52763, "epoch": 314} {"train_loss": -8.360336303710938, "global_step": 52764, "epoch": 314} {"train_loss": -8.289429664611816, "global_step": 52765, "epoch": 314} {"train_loss": -8.367732048034668, "global_step": 52766, "epoch": 314} {"train_loss": -8.3118896484375, "global_step": 52767, "epoch": 314} {"train_loss": -8.122991561889648, "global_step": 52768, "epoch": 314} {"train_loss": -8.254497528076172, "global_step": 52769, "epoch": 314} {"train_loss": -8.2314453125, "global_step": 52770, "epoch": 314} {"train_loss": -8.411556243896484, "global_step": 52771, "epoch": 314} {"train_loss": -8.39491081237793, "global_step": 52772, "epoch": 314} {"train_loss": -8.079313278198242, "global_step": 52773, "epoch": 314} {"train_loss": -8.426910400390625, "global_step": 52774, "epoch": 314} {"train_loss": -8.359082221984863, "global_step": 52775, "epoch": 314} {"train_loss": -8.147320747375488, "global_step": 52776, "epoch": 314} {"train_loss": -8.363981246948242, "global_step": 52777, "epoch": 314} {"train_loss": -8.299285888671875, "global_step": 52778, "epoch": 314} {"train_loss": -8.54306697845459, "global_step": 52779, "epoch": 314} {"train_loss": -8.27253532409668, "global_step": 52780, "epoch": 314} {"train_loss": -8.515337944030762, "global_step": 52781, "epoch": 314} {"train_loss": -8.292316436767578, "global_step": 52782, "epoch": 314} {"train_loss": -8.46172046661377, "global_step": 52783, "epoch": 314} {"train_loss": -8.271318435668945, "global_step": 52784, "epoch": 314} {"train_loss": -8.616840362548828, "global_step": 52785, "epoch": 314} {"train_loss": -8.341797828674316, "global_step": 52786, "epoch": 314} {"train_loss": -8.411239624023438, "global_step": 52787, "epoch": 314} {"train_loss": -8.509629249572754, "global_step": 52788, "epoch": 314} {"train_loss": -8.211423873901367, "global_step": 52789, "epoch": 314} {"train_loss": -8.447038650512695, "global_step": 52790, "epoch": 314} {"train_loss": -8.728527069091797, "global_step": 52791, "epoch": 314} {"train_loss": -8.411161422729492, "global_step": 52792, "epoch": 314} {"train_loss": -8.501091003417969, "global_step": 52793, "epoch": 314} {"train_loss": -8.564799308776855, "global_step": 52794, "epoch": 314} {"train_loss": -8.442293167114258, "global_step": 52795, "epoch": 314} {"train_loss": -8.501655578613281, "global_step": 52796, "epoch": 314} {"train_loss": -8.374519348144531, "global_step": 52797, "epoch": 314} {"train_loss": -8.418128967285156, "global_step": 52798, "epoch": 314} {"train_loss": -8.572975158691406, "global_step": 52799, "epoch": 314} {"train_loss": -8.718667984008789, "global_step": 52800, "epoch": 314} {"train_loss": -8.4720458984375, "global_step": 52801, "epoch": 314} {"train_loss": -8.38672924041748, "global_step": 52802, "epoch": 314} {"train_loss": -8.510770797729492, "global_step": 52803, "epoch": 314} {"train_loss": -8.477628707885742, "global_step": 52804, "epoch": 314} {"train_loss": -8.570271492004395, "global_step": 52805, "epoch": 314} {"train_loss": -8.459774017333984, "global_step": 52806, "epoch": 314} {"train_loss": -8.489105224609375, "global_step": 52807, "epoch": 314} {"train_loss": -8.358787536621094, "global_step": 52808, "epoch": 314} {"train_loss": -8.377802848815918, "global_step": 52809, "epoch": 314} {"train_loss": -8.177640914916992, "global_step": 52810, "epoch": 314} {"train_loss": -8.433448791503906, "global_step": 52811, "epoch": 314} {"train_loss": -8.217612266540527, "global_step": 52812, "epoch": 314} {"train_loss": -8.424774169921875, "global_step": 52813, "epoch": 314} {"train_loss": -8.237127304077148, "global_step": 52814, "epoch": 314} {"train_loss": -8.314261436462402, "global_step": 52815, "epoch": 314} {"train_loss": -8.28498649597168, "global_step": 52816, "epoch": 314} {"train_loss": -8.201656341552734, "global_step": 52817, "epoch": 314} {"train_loss": -8.43690013885498, "global_step": 52818, "epoch": 314} {"train_loss": -8.422661781311035, "global_step": 52819, "epoch": 314} {"train_loss": -8.299272537231445, "global_step": 52820, "epoch": 314} {"train_loss": -8.175695419311523, "global_step": 52821, "epoch": 314} {"train_loss": -8.361151695251465, "global_step": 52822, "epoch": 314} {"train_loss": -8.310827255249023, "global_step": 52823, "epoch": 314} {"train_loss": -8.513339042663574, "global_step": 52824, "epoch": 314} {"train_loss": -8.517528533935547, "global_step": 52825, "epoch": 314} {"train_loss": -8.452320098876953, "global_step": 52826, "epoch": 314} {"train_loss": -8.432768821716309, "global_step": 52827, "epoch": 314} {"train_loss": -8.423421859741211, "global_step": 52828, "epoch": 314} {"train_loss": -8.42306137084961, "global_step": 52829, "epoch": 314} {"train_loss": -8.407608032226562, "global_step": 52830, "epoch": 314} {"train_loss": -8.40457534790039, "global_step": 52831, "epoch": 314} {"train_loss": -8.45185661315918, "global_step": 52832, "epoch": 314} {"train_loss": -8.429366111755371, "global_step": 52833, "epoch": 314} {"train_loss": -8.628406524658203, "global_step": 52834, "epoch": 314} {"train_loss": -8.414875030517578, "global_step": 52835, "epoch": 314} {"train_loss": -8.526641845703125, "global_step": 52836, "epoch": 314} {"train_loss": -8.660453796386719, "global_step": 52837, "epoch": 314} {"train_loss": -8.264139175415039, "global_step": 52838, "epoch": 314} {"train_loss": -8.620710372924805, "global_step": 52839, "epoch": 314} {"train_loss": -8.394893646240234, "global_step": 52840, "epoch": 314} {"train_loss": -8.73000717163086, "global_step": 52841, "epoch": 314} {"train_loss": -8.617703437805176, "global_step": 52842, "epoch": 314} {"train_loss": -8.59992790222168, "global_step": 52843, "epoch": 314} {"train_loss": -8.484554290771484, "global_step": 52844, "epoch": 314} {"train_loss": -8.393362045288086, "global_step": 52845, "epoch": 314} {"train_loss": -8.726119995117188, "global_step": 52846, "epoch": 314} {"train_loss": -8.529006004333496, "global_step": 52847, "epoch": 314} {"train_loss": -8.321638107299805, "global_step": 52848, "epoch": 314} {"train_loss": -8.604616165161133, "global_step": 52849, "epoch": 314} {"train_loss": -8.417856216430664, "global_step": 52850, "epoch": 314} {"train_loss": -8.59898853302002, "global_step": 52851, "epoch": 314} {"train_loss": -8.50811767578125, "global_step": 52852, "epoch": 314} {"train_loss": -8.50938606262207, "global_step": 52853, "epoch": 314} {"train_loss": -8.49044132232666, "global_step": 52854, "epoch": 314} {"train_loss": -8.220846176147461, "global_step": 52855, "epoch": 314} {"train_loss": -8.192761421203613, "global_step": 52856, "epoch": 314} {"train_loss": -8.59099006652832, "global_step": 52857, "epoch": 314} {"train_loss": -8.600879669189453, "global_step": 52858, "epoch": 314} {"train_loss": -8.418024063110352, "global_step": 52859, "epoch": 314} {"train_loss": -8.484746932983398, "global_step": 52860, "epoch": 314} {"train_loss": -8.563629150390625, "global_step": 52861, "epoch": 314} {"train_loss": -8.459434509277344, "global_step": 52862, "epoch": 314} {"train_loss": -8.372304916381836, "global_step": 52863, "epoch": 314} {"train_loss": -8.298439979553223, "global_step": 52864, "epoch": 314} {"train_loss": -8.805749893188477, "global_step": 52865, "epoch": 314} {"train_loss": -8.394441604614258, "global_step": 52866, "epoch": 314} {"train_loss": -8.289300918579102, "global_step": 52867, "epoch": 314} {"train_loss": -8.521161079406738, "global_step": 52868, "epoch": 314} {"train_loss": -8.661025047302246, "global_step": 52869, "epoch": 314} {"train_loss": -8.423789978027344, "global_step": 52870, "epoch": 314} {"train_loss": -8.470149040222168, "global_step": 52871, "epoch": 314} {"train_loss": -8.512762069702148, "global_step": 52872, "epoch": 314} {"train_loss": -8.406597137451172, "global_step": 52873, "epoch": 314} {"train_loss": -8.33635425567627, "global_step": 52874, "epoch": 314} {"train_loss": -8.429403305053711, "global_step": 52875, "epoch": 314} {"train_loss": -8.503029823303223, "global_step": 52876, "epoch": 314} {"train_loss": -8.368767738342285, "global_step": 52877, "epoch": 314} {"train_loss": -8.660005569458008, "global_step": 52878, "epoch": 314} {"train_loss": -8.414595603942871, "global_step": 52879, "epoch": 314} {"train_loss": -8.50265884399414, "global_step": 52880, "epoch": 314} {"train_loss": -8.27537727355957, "global_step": 52881, "epoch": 314} {"train_loss": -8.368242263793945, "global_step": 52882, "epoch": 314} {"train_loss": -8.417583465576172, "global_step": 52883, "epoch": 314} {"train_loss": -8.531705856323242, "global_step": 52884, "epoch": 314} {"train_loss": -8.404726028442383, "global_step": 52885, "epoch": 314} {"train_loss": -8.2846040725708, "global_step": 52886, "epoch": 314} {"train_loss": -8.741377830505371, "global_step": 52887, "epoch": 314} {"train_loss": -8.4307861328125, "global_step": 52888, "epoch": 314} {"train_loss": -8.658883094787598, "global_step": 52889, "epoch": 314} {"train_loss": -8.51199722290039, "global_step": 52890, "epoch": 314} {"train_loss": -8.390246391296387, "global_step": 52891, "epoch": 314} {"train_loss": -8.68994426727295, "global_step": 52892, "epoch": 314} {"train_loss": -8.244207382202148, "global_step": 52893, "epoch": 314} {"train_loss": -8.442800521850586, "global_step": 52894, "epoch": 314} {"train_loss": -8.366445541381836, "global_step": 52895, "epoch": 314} {"train_loss": -8.440411567687988, "global_step": 52896, "epoch": 314} {"train_loss": -8.528315544128418, "global_step": 52897, "epoch": 314} {"train_loss": -8.576414108276367, "global_step": 52898, "epoch": 314} {"train_loss": -8.514657020568848, "global_step": 52899, "epoch": 314} {"train_loss": -8.678900718688965, "global_step": 52900, "epoch": 314} {"train_loss": -8.264307022094727, "global_step": 52901, "epoch": 314} {"train_loss": -8.378963470458984, "global_step": 52902, "epoch": 314} {"train_loss": -8.473175048828125, "global_step": 52903, "epoch": 314} {"train_loss": -8.424838066101074, "global_step": 52904, "epoch": 314} {"train_loss": -8.416748046875, "global_step": 52905, "epoch": 314} {"train_loss": -8.363290786743164, "global_step": 52906, "epoch": 314} {"train_loss": -8.244769096374512, "global_step": 52907, "epoch": 314} {"train_loss": -8.390332221984863, "global_step": 52908, "epoch": 314} {"train_loss": -8.539762496948242, "global_step": 52909, "epoch": 314} {"train_loss": -8.60177993774414, "global_step": 52910, "epoch": 314} {"train_loss": -8.537603378295898, "global_step": 52911, "epoch": 314} {"train_loss": -8.409309387207031, "global_step": 52912, "epoch": 314} {"train_loss": -8.584417343139648, "global_step": 52913, "epoch": 314} {"train_loss": -8.401333808898926, "global_step": 52914, "epoch": 314} {"train_loss": -8.415526390075684, "global_step": 52915, "epoch": 314} {"train_loss": -8.165054321289062, "global_step": 52916, "epoch": 314} {"train_loss": -8.396280288696289, "global_step": 52917, "epoch": 314} {"train_loss": -8.436050415039062, "global_step": 52918, "epoch": 314} {"train_loss": -8.426130680810838, "global_step": 52919, "epoch": 314, "val_loss": 190965.1875} {"train_loss": -8.229677200317383, "global_step": 52920, "epoch": 315} {"train_loss": -8.307088851928711, "global_step": 52921, "epoch": 315} {"train_loss": -8.256685256958008, "global_step": 52922, "epoch": 315} {"train_loss": -8.411507606506348, "global_step": 52923, "epoch": 315} {"train_loss": -8.41886043548584, "global_step": 52924, "epoch": 315} {"train_loss": -8.237895965576172, "global_step": 52925, "epoch": 315} {"train_loss": -8.278094291687012, "global_step": 52926, "epoch": 315} {"train_loss": -8.319173812866211, "global_step": 52927, "epoch": 315} {"train_loss": -8.374826431274414, "global_step": 52928, "epoch": 315} {"train_loss": -8.472203254699707, "global_step": 52929, "epoch": 315} {"train_loss": -8.19072151184082, "global_step": 52930, "epoch": 315} {"train_loss": -8.444129943847656, "global_step": 52931, "epoch": 315} {"train_loss": -8.177705764770508, "global_step": 52932, "epoch": 315} {"train_loss": -8.186429977416992, "global_step": 52933, "epoch": 315} {"train_loss": -7.952892303466797, "global_step": 52934, "epoch": 315} {"train_loss": -8.216747283935547, "global_step": 52935, "epoch": 315} {"train_loss": -8.291084289550781, "global_step": 52936, "epoch": 315} {"train_loss": -8.163854598999023, "global_step": 52937, "epoch": 315} {"train_loss": -8.171844482421875, "global_step": 52938, "epoch": 315} {"train_loss": -8.27076530456543, "global_step": 52939, "epoch": 315} {"train_loss": -8.139659881591797, "global_step": 52940, "epoch": 315} {"train_loss": -8.529199600219727, "global_step": 52941, "epoch": 315} {"train_loss": -8.203435897827148, "global_step": 52942, "epoch": 315} {"train_loss": -8.588081359863281, "global_step": 52943, "epoch": 315} {"train_loss": -8.23874568939209, "global_step": 52944, "epoch": 315} {"train_loss": -8.288263320922852, "global_step": 52945, "epoch": 315} {"train_loss": -8.231914520263672, "global_step": 52946, "epoch": 315} {"train_loss": -8.332816123962402, "global_step": 52947, "epoch": 315} {"train_loss": -8.248875617980957, "global_step": 52948, "epoch": 315} {"train_loss": -8.477288246154785, "global_step": 52949, "epoch": 315} {"train_loss": -8.31576919555664, "global_step": 52950, "epoch": 315} {"train_loss": -8.34782600402832, "global_step": 52951, "epoch": 315} {"train_loss": -8.307598114013672, "global_step": 52952, "epoch": 315} {"train_loss": -8.110733985900879, "global_step": 52953, "epoch": 315} {"train_loss": -8.431143760681152, "global_step": 52954, "epoch": 315} {"train_loss": -8.229949951171875, "global_step": 52955, "epoch": 315} {"train_loss": -8.325763702392578, "global_step": 52956, "epoch": 315} {"train_loss": -8.367008209228516, "global_step": 52957, "epoch": 315} {"train_loss": -8.336702346801758, "global_step": 52958, "epoch": 315} {"train_loss": -8.433366775512695, "global_step": 52959, "epoch": 315} {"train_loss": -8.316854476928711, "global_step": 52960, "epoch": 315} {"train_loss": -8.417279243469238, "global_step": 52961, "epoch": 315} {"train_loss": -8.62546443939209, "global_step": 52962, "epoch": 315} {"train_loss": -8.44733715057373, "global_step": 52963, "epoch": 315} {"train_loss": -8.515074729919434, "global_step": 52964, "epoch": 315} {"train_loss": -8.407163619995117, "global_step": 52965, "epoch": 315} {"train_loss": -8.48708724975586, "global_step": 52966, "epoch": 315} {"train_loss": -8.527120590209961, "global_step": 52967, "epoch": 315} {"train_loss": -8.264394760131836, "global_step": 52968, "epoch": 315} {"train_loss": -8.484189987182617, "global_step": 52969, "epoch": 315} {"train_loss": -8.31118392944336, "global_step": 52970, "epoch": 315} {"train_loss": -8.533742904663086, "global_step": 52971, "epoch": 315} {"train_loss": -8.36082935333252, "global_step": 52972, "epoch": 315} {"train_loss": -8.269850730895996, "global_step": 52973, "epoch": 315} {"train_loss": -8.477239608764648, "global_step": 52974, "epoch": 315} {"train_loss": -8.511075019836426, "global_step": 52975, "epoch": 315} {"train_loss": -8.306021690368652, "global_step": 52976, "epoch": 315} {"train_loss": -8.370887756347656, "global_step": 52977, "epoch": 315} {"train_loss": -8.369987487792969, "global_step": 52978, "epoch": 315} {"train_loss": -8.43832015991211, "global_step": 52979, "epoch": 315} {"train_loss": -8.527463912963867, "global_step": 52980, "epoch": 315} {"train_loss": -8.305441856384277, "global_step": 52981, "epoch": 315} {"train_loss": -8.543685913085938, "global_step": 52982, "epoch": 315} {"train_loss": -8.470315933227539, "global_step": 52983, "epoch": 315} {"train_loss": -8.511754989624023, "global_step": 52984, "epoch": 315} {"train_loss": -8.532894134521484, "global_step": 52985, "epoch": 315} {"train_loss": -8.497823715209961, "global_step": 52986, "epoch": 315} {"train_loss": -8.427251815795898, "global_step": 52987, "epoch": 315} {"train_loss": -8.538063049316406, "global_step": 52988, "epoch": 315} {"train_loss": -8.066276550292969, "global_step": 52989, "epoch": 315} {"train_loss": -8.415412902832031, "global_step": 52990, "epoch": 315} {"train_loss": -8.22852611541748, "global_step": 52991, "epoch": 315} {"train_loss": -8.117454528808594, "global_step": 52992, "epoch": 315} {"train_loss": -8.222644805908203, "global_step": 52993, "epoch": 315} {"train_loss": -8.22361946105957, "global_step": 52994, "epoch": 315} {"train_loss": -8.538810729980469, "global_step": 52995, "epoch": 315} {"train_loss": -8.299453735351562, "global_step": 52996, "epoch": 315} {"train_loss": -8.605897903442383, "global_step": 52997, "epoch": 315} {"train_loss": -8.381546020507812, "global_step": 52998, "epoch": 315} {"train_loss": -8.365730285644531, "global_step": 52999, "epoch": 315} {"train_loss": -8.382343292236328, "global_step": 53000, "epoch": 315} {"train_loss": -8.19768238067627, "global_step": 53001, "epoch": 315} {"train_loss": -8.20384407043457, "global_step": 53002, "epoch": 315} {"train_loss": -8.551355361938477, "global_step": 53003, "epoch": 315} {"train_loss": -8.413834571838379, "global_step": 53004, "epoch": 315} {"train_loss": -8.250019073486328, "global_step": 53005, "epoch": 315} {"train_loss": -8.49508285522461, "global_step": 53006, "epoch": 315} {"train_loss": -8.547208786010742, "global_step": 53007, "epoch": 315} {"train_loss": -8.551803588867188, "global_step": 53008, "epoch": 315} {"train_loss": -8.466667175292969, "global_step": 53009, "epoch": 315} {"train_loss": -8.595428466796875, "global_step": 53010, "epoch": 315} {"train_loss": -8.587228775024414, "global_step": 53011, "epoch": 315} {"train_loss": -8.367212295532227, "global_step": 53012, "epoch": 315} {"train_loss": -8.570985794067383, "global_step": 53013, "epoch": 315} {"train_loss": -8.51431941986084, "global_step": 53014, "epoch": 315} {"train_loss": -8.655946731567383, "global_step": 53015, "epoch": 315} {"train_loss": -8.560016632080078, "global_step": 53016, "epoch": 315} {"train_loss": -8.497540473937988, "global_step": 53017, "epoch": 315} {"train_loss": -8.647064208984375, "global_step": 53018, "epoch": 315} {"train_loss": -8.611246109008789, "global_step": 53019, "epoch": 315} {"train_loss": -8.70974349975586, "global_step": 53020, "epoch": 315} {"train_loss": -8.604388236999512, "global_step": 53021, "epoch": 315} {"train_loss": -8.61036491394043, "global_step": 53022, "epoch": 315} {"train_loss": -8.539153099060059, "global_step": 53023, "epoch": 315} {"train_loss": -8.194819450378418, "global_step": 53024, "epoch": 315} {"train_loss": -8.779339790344238, "global_step": 53025, "epoch": 315} {"train_loss": -8.225127220153809, "global_step": 53026, "epoch": 315} {"train_loss": -8.53659439086914, "global_step": 53027, "epoch": 315} {"train_loss": -8.349380493164062, "global_step": 53028, "epoch": 315} {"train_loss": -8.522266387939453, "global_step": 53029, "epoch": 315} {"train_loss": -8.432445526123047, "global_step": 53030, "epoch": 315} {"train_loss": -8.287572860717773, "global_step": 53031, "epoch": 315} {"train_loss": -8.511127471923828, "global_step": 53032, "epoch": 315} {"train_loss": -8.289632797241211, "global_step": 53033, "epoch": 315} {"train_loss": -8.310859680175781, "global_step": 53034, "epoch": 315} {"train_loss": -8.216329574584961, "global_step": 53035, "epoch": 315} {"train_loss": -8.349937438964844, "global_step": 53036, "epoch": 315} {"train_loss": -8.209455490112305, "global_step": 53037, "epoch": 315} {"train_loss": -8.386222839355469, "global_step": 53038, "epoch": 315} {"train_loss": -8.290494918823242, "global_step": 53039, "epoch": 315} {"train_loss": -8.587516784667969, "global_step": 53040, "epoch": 315} {"train_loss": -8.646871566772461, "global_step": 53041, "epoch": 315} {"train_loss": -8.674256324768066, "global_step": 53042, "epoch": 315} {"train_loss": -8.448075294494629, "global_step": 53043, "epoch": 315} {"train_loss": -8.581275939941406, "global_step": 53044, "epoch": 315} {"train_loss": -8.601008415222168, "global_step": 53045, "epoch": 315} {"train_loss": -8.575006484985352, "global_step": 53046, "epoch": 315} {"train_loss": -8.445917129516602, "global_step": 53047, "epoch": 315} {"train_loss": -8.607176780700684, "global_step": 53048, "epoch": 315} {"train_loss": -8.031106948852539, "global_step": 53049, "epoch": 315} {"train_loss": -8.45753288269043, "global_step": 53050, "epoch": 315} {"train_loss": -8.004817962646484, "global_step": 53051, "epoch": 315} {"train_loss": -8.374093055725098, "global_step": 53052, "epoch": 315} {"train_loss": -8.06393051147461, "global_step": 53053, "epoch": 315} {"train_loss": -8.377676010131836, "global_step": 53054, "epoch": 315} {"train_loss": -8.394088745117188, "global_step": 53055, "epoch": 315} {"train_loss": -8.090972900390625, "global_step": 53056, "epoch": 315} {"train_loss": -8.295022010803223, "global_step": 53057, "epoch": 315} {"train_loss": -8.317325592041016, "global_step": 53058, "epoch": 315} {"train_loss": -8.309684753417969, "global_step": 53059, "epoch": 315} {"train_loss": -8.380783081054688, "global_step": 53060, "epoch": 315} {"train_loss": -8.283738136291504, "global_step": 53061, "epoch": 315} {"train_loss": -8.384187698364258, "global_step": 53062, "epoch": 315} {"train_loss": -8.220224380493164, "global_step": 53063, "epoch": 315} {"train_loss": -8.31859302520752, "global_step": 53064, "epoch": 315} {"train_loss": -8.222734451293945, "global_step": 53065, "epoch": 315} {"train_loss": -8.378567695617676, "global_step": 53066, "epoch": 315} {"train_loss": -8.381362915039062, "global_step": 53067, "epoch": 315} {"train_loss": -8.079704284667969, "global_step": 53068, "epoch": 315} {"train_loss": -8.413830757141113, "global_step": 53069, "epoch": 315} {"train_loss": -8.157135009765625, "global_step": 53070, "epoch": 315} {"train_loss": -8.281277656555176, "global_step": 53071, "epoch": 315} {"train_loss": -8.402803421020508, "global_step": 53072, "epoch": 315} {"train_loss": -8.230045318603516, "global_step": 53073, "epoch": 315} {"train_loss": -8.366105079650879, "global_step": 53074, "epoch": 315} {"train_loss": -8.205245971679688, "global_step": 53075, "epoch": 315} {"train_loss": -8.363055229187012, "global_step": 53076, "epoch": 315} {"train_loss": -8.471446990966797, "global_step": 53077, "epoch": 315} {"train_loss": -8.509836196899414, "global_step": 53078, "epoch": 315} {"train_loss": -8.468881607055664, "global_step": 53079, "epoch": 315} {"train_loss": -8.470987319946289, "global_step": 53080, "epoch": 315} {"train_loss": -8.448158264160156, "global_step": 53081, "epoch": 315} {"train_loss": -8.425484657287598, "global_step": 53082, "epoch": 315} {"train_loss": -8.508028030395508, "global_step": 53083, "epoch": 315} {"train_loss": -8.387628555297852, "global_step": 53084, "epoch": 315} {"train_loss": -8.367148399353027, "global_step": 53085, "epoch": 315} {"train_loss": -8.48723030090332, "global_step": 53086, "epoch": 315} {"train_loss": -8.380472342173258, "global_step": 53087, "epoch": 315, "val_loss": 191095.890625, "train_action_mse_error": 16.296085357666016} {"train_loss": -8.265545845031738, "global_step": 53088, "epoch": 316} {"train_loss": -8.501255989074707, "global_step": 53089, "epoch": 316} {"train_loss": -8.374433517456055, "global_step": 53090, "epoch": 316} {"train_loss": -8.608003616333008, "global_step": 53091, "epoch": 316} {"train_loss": -8.294654846191406, "global_step": 53092, "epoch": 316} {"train_loss": -8.120147705078125, "global_step": 53093, "epoch": 316} {"train_loss": -8.48069953918457, "global_step": 53094, "epoch": 316} {"train_loss": -8.749198913574219, "global_step": 53095, "epoch": 316} {"train_loss": -8.311727523803711, "global_step": 53096, "epoch": 316} {"train_loss": -8.382018089294434, "global_step": 53097, "epoch": 316} {"train_loss": -8.244590759277344, "global_step": 53098, "epoch": 316} {"train_loss": -8.381063461303711, "global_step": 53099, "epoch": 316} {"train_loss": -8.459341049194336, "global_step": 53100, "epoch": 316} {"train_loss": -8.58596134185791, "global_step": 53101, "epoch": 316} {"train_loss": -8.355223655700684, "global_step": 53102, "epoch": 316} {"train_loss": -8.290098190307617, "global_step": 53103, "epoch": 316} {"train_loss": -8.624529838562012, "global_step": 53104, "epoch": 316} {"train_loss": -8.457879066467285, "global_step": 53105, "epoch": 316} {"train_loss": -8.276812553405762, "global_step": 53106, "epoch": 316} {"train_loss": -8.375033378601074, "global_step": 53107, "epoch": 316} {"train_loss": -8.599517822265625, "global_step": 53108, "epoch": 316} {"train_loss": -8.59533977508545, "global_step": 53109, "epoch": 316} {"train_loss": -8.567245483398438, "global_step": 53110, "epoch": 316} {"train_loss": -8.52459716796875, "global_step": 53111, "epoch": 316} {"train_loss": -8.58706283569336, "global_step": 53112, "epoch": 316} {"train_loss": -8.493332862854004, "global_step": 53113, "epoch": 316} {"train_loss": -8.550558090209961, "global_step": 53114, "epoch": 316} {"train_loss": -8.569822311401367, "global_step": 53115, "epoch": 316} {"train_loss": -8.567085266113281, "global_step": 53116, "epoch": 316} {"train_loss": -8.651348114013672, "global_step": 53117, "epoch": 316} {"train_loss": -8.545368194580078, "global_step": 53118, "epoch": 316} {"train_loss": -8.671306610107422, "global_step": 53119, "epoch": 316} {"train_loss": -8.585111618041992, "global_step": 53120, "epoch": 316} {"train_loss": -8.699491500854492, "global_step": 53121, "epoch": 316} {"train_loss": -8.525123596191406, "global_step": 53122, "epoch": 316} {"train_loss": -8.409957885742188, "global_step": 53123, "epoch": 316} {"train_loss": -8.533708572387695, "global_step": 53124, "epoch": 316} {"train_loss": -8.524392127990723, "global_step": 53125, "epoch": 316} {"train_loss": -8.2816162109375, "global_step": 53126, "epoch": 316} {"train_loss": -8.644123077392578, "global_step": 53127, "epoch": 316} {"train_loss": -8.683382987976074, "global_step": 53128, "epoch": 316} {"train_loss": -8.528582572937012, "global_step": 53129, "epoch": 316} {"train_loss": -8.730447769165039, "global_step": 53130, "epoch": 316} {"train_loss": -8.697286605834961, "global_step": 53131, "epoch": 316} {"train_loss": -8.518998146057129, "global_step": 53132, "epoch": 316} {"train_loss": -8.56760025024414, "global_step": 53133, "epoch": 316} {"train_loss": -8.601627349853516, "global_step": 53134, "epoch": 316} {"train_loss": -8.734535217285156, "global_step": 53135, "epoch": 316} {"train_loss": -8.606978416442871, "global_step": 53136, "epoch": 316} {"train_loss": -8.604955673217773, "global_step": 53137, "epoch": 316} {"train_loss": -8.580394744873047, "global_step": 53138, "epoch": 316} {"train_loss": -8.363873481750488, "global_step": 53139, "epoch": 316} {"train_loss": -8.782914161682129, "global_step": 53140, "epoch": 316} {"train_loss": -8.541553497314453, "global_step": 53141, "epoch": 316} {"train_loss": -8.61471176147461, "global_step": 53142, "epoch": 316} {"train_loss": -8.33285140991211, "global_step": 53143, "epoch": 316} {"train_loss": -8.469490051269531, "global_step": 53144, "epoch": 316} {"train_loss": -8.721670150756836, "global_step": 53145, "epoch": 316} {"train_loss": -8.6450777053833, "global_step": 53146, "epoch": 316} {"train_loss": -8.662137985229492, "global_step": 53147, "epoch": 316} {"train_loss": -8.422971725463867, "global_step": 53148, "epoch": 316} {"train_loss": -8.527704238891602, "global_step": 53149, "epoch": 316} {"train_loss": -8.567237854003906, "global_step": 53150, "epoch": 316} {"train_loss": -8.340484619140625, "global_step": 53151, "epoch": 316} {"train_loss": -8.391530990600586, "global_step": 53152, "epoch": 316} {"train_loss": -8.268535614013672, "global_step": 53153, "epoch": 316} {"train_loss": -8.35202407836914, "global_step": 53154, "epoch": 316} {"train_loss": -8.325124740600586, "global_step": 53155, "epoch": 316} {"train_loss": -8.57644271850586, "global_step": 53156, "epoch": 316} {"train_loss": -8.551847457885742, "global_step": 53157, "epoch": 316} {"train_loss": -8.573318481445312, "global_step": 53158, "epoch": 316} {"train_loss": -8.473479270935059, "global_step": 53159, "epoch": 316} {"train_loss": -8.63541316986084, "global_step": 53160, "epoch": 316} {"train_loss": -8.406719207763672, "global_step": 53161, "epoch": 316} {"train_loss": -8.511533737182617, "global_step": 53162, "epoch": 316} {"train_loss": -8.380926132202148, "global_step": 53163, "epoch": 316} {"train_loss": -8.483659744262695, "global_step": 53164, "epoch": 316} {"train_loss": -8.464554786682129, "global_step": 53165, "epoch": 316} {"train_loss": -8.565524101257324, "global_step": 53166, "epoch": 316} {"train_loss": -8.629802703857422, "global_step": 53167, "epoch": 316} {"train_loss": -8.454906463623047, "global_step": 53168, "epoch": 316} {"train_loss": -8.385126113891602, "global_step": 53169, "epoch": 316} {"train_loss": -8.614364624023438, "global_step": 53170, "epoch": 316} {"train_loss": -8.63370132446289, "global_step": 53171, "epoch": 316} {"train_loss": -8.527730941772461, "global_step": 53172, "epoch": 316} {"train_loss": -8.258195877075195, "global_step": 53173, "epoch": 316} {"train_loss": -8.310784339904785, "global_step": 53174, "epoch": 316} {"train_loss": -8.645898818969727, "global_step": 53175, "epoch": 316} {"train_loss": -8.60330581665039, "global_step": 53176, "epoch": 316} {"train_loss": -8.574135780334473, "global_step": 53177, "epoch": 316} {"train_loss": -8.693136215209961, "global_step": 53178, "epoch": 316} {"train_loss": -8.711661338806152, "global_step": 53179, "epoch": 316} {"train_loss": -8.503992080688477, "global_step": 53180, "epoch": 316} {"train_loss": -8.378929138183594, "global_step": 53181, "epoch": 316} {"train_loss": -8.38280963897705, "global_step": 53182, "epoch": 316} {"train_loss": -8.307512283325195, "global_step": 53183, "epoch": 316} {"train_loss": -8.498931884765625, "global_step": 53184, "epoch": 316} {"train_loss": -8.424195289611816, "global_step": 53185, "epoch": 316} {"train_loss": -8.403968811035156, "global_step": 53186, "epoch": 316} {"train_loss": -8.413154602050781, "global_step": 53187, "epoch": 316} {"train_loss": -8.60933780670166, "global_step": 53188, "epoch": 316} {"train_loss": -8.447400093078613, "global_step": 53189, "epoch": 316} {"train_loss": -8.324292182922363, "global_step": 53190, "epoch": 316} {"train_loss": -7.875774383544922, "global_step": 53191, "epoch": 316} {"train_loss": -8.691743850708008, "global_step": 53192, "epoch": 316} {"train_loss": -8.290582656860352, "global_step": 53193, "epoch": 316} {"train_loss": -8.491413116455078, "global_step": 53194, "epoch": 316} {"train_loss": -8.15506362915039, "global_step": 53195, "epoch": 316} {"train_loss": -8.189058303833008, "global_step": 53196, "epoch": 316} {"train_loss": -8.145861625671387, "global_step": 53197, "epoch": 316} {"train_loss": -7.882874488830566, "global_step": 53198, "epoch": 316} {"train_loss": -8.272428512573242, "global_step": 53199, "epoch": 316} {"train_loss": -8.046653747558594, "global_step": 53200, "epoch": 316} {"train_loss": -8.35201644897461, "global_step": 53201, "epoch": 316} {"train_loss": -8.14363956451416, "global_step": 53202, "epoch": 316} {"train_loss": -8.189000129699707, "global_step": 53203, "epoch": 316} {"train_loss": -8.451385498046875, "global_step": 53204, "epoch": 316} {"train_loss": -8.278085708618164, "global_step": 53205, "epoch": 316} {"train_loss": -8.547613143920898, "global_step": 53206, "epoch": 316} {"train_loss": -8.36659049987793, "global_step": 53207, "epoch": 316} {"train_loss": -8.10920238494873, "global_step": 53208, "epoch": 316} {"train_loss": -8.499643325805664, "global_step": 53209, "epoch": 316} {"train_loss": -7.8161211013793945, "global_step": 53210, "epoch": 316} {"train_loss": -8.47419548034668, "global_step": 53211, "epoch": 316} {"train_loss": -8.198027610778809, "global_step": 53212, "epoch": 316} {"train_loss": -8.36746883392334, "global_step": 53213, "epoch": 316} {"train_loss": -8.264988899230957, "global_step": 53214, "epoch": 316} {"train_loss": -8.362147331237793, "global_step": 53215, "epoch": 316} {"train_loss": -8.448114395141602, "global_step": 53216, "epoch": 316} {"train_loss": -8.404833793640137, "global_step": 53217, "epoch": 316} {"train_loss": -8.386764526367188, "global_step": 53218, "epoch": 316} {"train_loss": -8.472804069519043, "global_step": 53219, "epoch": 316} {"train_loss": -8.148341178894043, "global_step": 53220, "epoch": 316} {"train_loss": -8.593964576721191, "global_step": 53221, "epoch": 316} {"train_loss": -8.466054916381836, "global_step": 53222, "epoch": 316} {"train_loss": -8.29548454284668, "global_step": 53223, "epoch": 316} {"train_loss": -8.345575332641602, "global_step": 53224, "epoch": 316} {"train_loss": -8.61159610748291, "global_step": 53225, "epoch": 316} {"train_loss": -8.288021087646484, "global_step": 53226, "epoch": 316} {"train_loss": -8.536874771118164, "global_step": 53227, "epoch": 316} {"train_loss": -8.433615684509277, "global_step": 53228, "epoch": 316} {"train_loss": -8.318368911743164, "global_step": 53229, "epoch": 316} {"train_loss": -8.548376083374023, "global_step": 53230, "epoch": 316} {"train_loss": -8.394365310668945, "global_step": 53231, "epoch": 316} {"train_loss": -8.53884220123291, "global_step": 53232, "epoch": 316} {"train_loss": -8.667762756347656, "global_step": 53233, "epoch": 316} {"train_loss": -8.393758773803711, "global_step": 53234, "epoch": 316} {"train_loss": -8.369270324707031, "global_step": 53235, "epoch": 316} {"train_loss": -8.60822868347168, "global_step": 53236, "epoch": 316} {"train_loss": -8.194459915161133, "global_step": 53237, "epoch": 316} {"train_loss": -8.50831413269043, "global_step": 53238, "epoch": 316} {"train_loss": -8.686660766601562, "global_step": 53239, "epoch": 316} {"train_loss": -8.432758331298828, "global_step": 53240, "epoch": 316} {"train_loss": -8.575284004211426, "global_step": 53241, "epoch": 316} {"train_loss": -8.326658248901367, "global_step": 53242, "epoch": 316} {"train_loss": -8.533531188964844, "global_step": 53243, "epoch": 316} {"train_loss": -8.094444274902344, "global_step": 53244, "epoch": 316} {"train_loss": -8.6617431640625, "global_step": 53245, "epoch": 316} {"train_loss": -8.539515495300293, "global_step": 53246, "epoch": 316} {"train_loss": -8.03724193572998, "global_step": 53247, "epoch": 316} {"train_loss": -8.131072044372559, "global_step": 53248, "epoch": 316} {"train_loss": -8.283832550048828, "global_step": 53249, "epoch": 316} {"train_loss": -8.2555570602417, "global_step": 53250, "epoch": 316} {"train_loss": -8.284415245056152, "global_step": 53251, "epoch": 316} {"train_loss": -8.232404708862305, "global_step": 53252, "epoch": 316} {"train_loss": -8.580974578857422, "global_step": 53253, "epoch": 316} {"train_loss": -8.294075012207031, "global_step": 53254, "epoch": 316} {"train_loss": -8.445788014502753, "global_step": 53255, "epoch": 316, "val_loss": 187804.796875} {"train_loss": -8.569412231445312, "global_step": 53256, "epoch": 317} {"train_loss": -8.542572021484375, "global_step": 53257, "epoch": 317} {"train_loss": -8.437416076660156, "global_step": 53258, "epoch": 317} {"train_loss": -8.46672534942627, "global_step": 53259, "epoch": 317} {"train_loss": -8.544618606567383, "global_step": 53260, "epoch": 317} {"train_loss": -8.496316909790039, "global_step": 53261, "epoch": 317} {"train_loss": -8.557278633117676, "global_step": 53262, "epoch": 317} {"train_loss": -8.554088592529297, "global_step": 53263, "epoch": 317} {"train_loss": -8.591222763061523, "global_step": 53264, "epoch": 317} {"train_loss": -8.43440055847168, "global_step": 53265, "epoch": 317} {"train_loss": -8.536441802978516, "global_step": 53266, "epoch": 317} {"train_loss": -8.462210655212402, "global_step": 53267, "epoch": 317} {"train_loss": -8.524866104125977, "global_step": 53268, "epoch": 317} {"train_loss": -8.454111099243164, "global_step": 53269, "epoch": 317} {"train_loss": -8.472970008850098, "global_step": 53270, "epoch": 317} {"train_loss": -8.702366828918457, "global_step": 53271, "epoch": 317} {"train_loss": -8.498558044433594, "global_step": 53272, "epoch": 317} {"train_loss": -8.208011627197266, "global_step": 53273, "epoch": 317} {"train_loss": -8.348926544189453, "global_step": 53274, "epoch": 317} {"train_loss": -8.282405853271484, "global_step": 53275, "epoch": 317} {"train_loss": -8.323514938354492, "global_step": 53276, "epoch": 317} {"train_loss": -8.377446174621582, "global_step": 53277, "epoch": 317} {"train_loss": -8.137654304504395, "global_step": 53278, "epoch": 317} {"train_loss": -8.232134819030762, "global_step": 53279, "epoch": 317} {"train_loss": -8.099750518798828, "global_step": 53280, "epoch": 317} {"train_loss": -8.317076683044434, "global_step": 53281, "epoch": 317} {"train_loss": -8.459761619567871, "global_step": 53282, "epoch": 317} {"train_loss": -8.501359939575195, "global_step": 53283, "epoch": 317} {"train_loss": -8.370882034301758, "global_step": 53284, "epoch": 317} {"train_loss": -8.279694557189941, "global_step": 53285, "epoch": 317} {"train_loss": -8.434090614318848, "global_step": 53286, "epoch": 317} {"train_loss": -8.290765762329102, "global_step": 53287, "epoch": 317} {"train_loss": -8.507560729980469, "global_step": 53288, "epoch": 317} {"train_loss": -8.536026000976562, "global_step": 53289, "epoch": 317} {"train_loss": -8.150949478149414, "global_step": 53290, "epoch": 317} {"train_loss": -8.451667785644531, "global_step": 53291, "epoch": 317} {"train_loss": -8.370723724365234, "global_step": 53292, "epoch": 317} {"train_loss": -8.483526229858398, "global_step": 53293, "epoch": 317} {"train_loss": -8.393138885498047, "global_step": 53294, "epoch": 317} {"train_loss": -8.387727737426758, "global_step": 53295, "epoch": 317} {"train_loss": -8.340611457824707, "global_step": 53296, "epoch": 317} {"train_loss": -8.737192153930664, "global_step": 53297, "epoch": 317} {"train_loss": -8.505533218383789, "global_step": 53298, "epoch": 317} {"train_loss": -8.385780334472656, "global_step": 53299, "epoch": 317} {"train_loss": -8.52663803100586, "global_step": 53300, "epoch": 317} {"train_loss": -8.644986152648926, "global_step": 53301, "epoch": 317} {"train_loss": -8.543647766113281, "global_step": 53302, "epoch": 317} {"train_loss": -8.658058166503906, "global_step": 53303, "epoch": 317} {"train_loss": -8.725903511047363, "global_step": 53304, "epoch": 317} {"train_loss": -8.289841651916504, "global_step": 53305, "epoch": 317} {"train_loss": -8.466522216796875, "global_step": 53306, "epoch": 317} {"train_loss": -8.68648910522461, "global_step": 53307, "epoch": 317} {"train_loss": -8.674989700317383, "global_step": 53308, "epoch": 317} {"train_loss": -8.727214813232422, "global_step": 53309, "epoch": 317} {"train_loss": -8.511343002319336, "global_step": 53310, "epoch": 317} {"train_loss": -8.569026947021484, "global_step": 53311, "epoch": 317} {"train_loss": -8.521873474121094, "global_step": 53312, "epoch": 317} {"train_loss": -8.254406929016113, "global_step": 53313, "epoch": 317} {"train_loss": -8.386869430541992, "global_step": 53314, "epoch": 317} {"train_loss": -8.694855690002441, "global_step": 53315, "epoch": 317} {"train_loss": -8.295409202575684, "global_step": 53316, "epoch": 317} {"train_loss": -8.63912582397461, "global_step": 53317, "epoch": 317} {"train_loss": -8.670185089111328, "global_step": 53318, "epoch": 317} {"train_loss": -8.375604629516602, "global_step": 53319, "epoch": 317} {"train_loss": -8.626477241516113, "global_step": 53320, "epoch": 317} {"train_loss": -8.423065185546875, "global_step": 53321, "epoch": 317} {"train_loss": -8.656144142150879, "global_step": 53322, "epoch": 317} {"train_loss": -8.15872859954834, "global_step": 53323, "epoch": 317} {"train_loss": -8.672769546508789, "global_step": 53324, "epoch": 317} {"train_loss": -8.33323860168457, "global_step": 53325, "epoch": 317} {"train_loss": -8.657833099365234, "global_step": 53326, "epoch": 317} {"train_loss": -8.471363067626953, "global_step": 53327, "epoch": 317} {"train_loss": -8.494562149047852, "global_step": 53328, "epoch": 317} {"train_loss": -8.504202842712402, "global_step": 53329, "epoch": 317} {"train_loss": -8.343743324279785, "global_step": 53330, "epoch": 317} {"train_loss": -8.691658020019531, "global_step": 53331, "epoch": 317} {"train_loss": -8.343443870544434, "global_step": 53332, "epoch": 317} {"train_loss": -8.434470176696777, "global_step": 53333, "epoch": 317} {"train_loss": -8.131927490234375, "global_step": 53334, "epoch": 317} {"train_loss": -8.482699394226074, "global_step": 53335, "epoch": 317} {"train_loss": -8.465709686279297, "global_step": 53336, "epoch": 317} {"train_loss": -8.310375213623047, "global_step": 53337, "epoch": 317} {"train_loss": -8.421308517456055, "global_step": 53338, "epoch": 317} {"train_loss": -8.662027359008789, "global_step": 53339, "epoch": 317} {"train_loss": -8.32951831817627, "global_step": 53340, "epoch": 317} {"train_loss": -8.610294342041016, "global_step": 53341, "epoch": 317} {"train_loss": -8.344849586486816, "global_step": 53342, "epoch": 317} {"train_loss": -8.465513229370117, "global_step": 53343, "epoch": 317} {"train_loss": -8.330711364746094, "global_step": 53344, "epoch": 317} {"train_loss": -8.639419555664062, "global_step": 53345, "epoch": 317} {"train_loss": -8.448582649230957, "global_step": 53346, "epoch": 317} {"train_loss": -8.467327117919922, "global_step": 53347, "epoch": 317} {"train_loss": -8.582385063171387, "global_step": 53348, "epoch": 317} {"train_loss": -8.42857837677002, "global_step": 53349, "epoch": 317} {"train_loss": -8.669245719909668, "global_step": 53350, "epoch": 317} {"train_loss": -8.234367370605469, "global_step": 53351, "epoch": 317} {"train_loss": -8.499761581420898, "global_step": 53352, "epoch": 317} {"train_loss": -8.405864715576172, "global_step": 53353, "epoch": 317} {"train_loss": -8.401252746582031, "global_step": 53354, "epoch": 317} {"train_loss": -8.465751647949219, "global_step": 53355, "epoch": 317} {"train_loss": -8.444817543029785, "global_step": 53356, "epoch": 317} {"train_loss": -8.497743606567383, "global_step": 53357, "epoch": 317} {"train_loss": -8.681987762451172, "global_step": 53358, "epoch": 317} {"train_loss": -8.50447940826416, "global_step": 53359, "epoch": 317} {"train_loss": -8.628963470458984, "global_step": 53360, "epoch": 317} {"train_loss": -8.534394264221191, "global_step": 53361, "epoch": 317} {"train_loss": -8.56413459777832, "global_step": 53362, "epoch": 317} {"train_loss": -8.551692962646484, "global_step": 53363, "epoch": 317} {"train_loss": -8.445597648620605, "global_step": 53364, "epoch": 317} {"train_loss": -8.582860946655273, "global_step": 53365, "epoch": 317} {"train_loss": -8.5606050491333, "global_step": 53366, "epoch": 317} {"train_loss": -8.63160514831543, "global_step": 53367, "epoch": 317} {"train_loss": -8.393667221069336, "global_step": 53368, "epoch": 317} {"train_loss": -8.319961547851562, "global_step": 53369, "epoch": 317} {"train_loss": -8.415597915649414, "global_step": 53370, "epoch": 317} {"train_loss": -8.231141090393066, "global_step": 53371, "epoch": 317} {"train_loss": -8.41909408569336, "global_step": 53372, "epoch": 317} {"train_loss": -8.309414863586426, "global_step": 53373, "epoch": 317} {"train_loss": -8.479223251342773, "global_step": 53374, "epoch": 317} {"train_loss": -8.185302734375, "global_step": 53375, "epoch": 317} {"train_loss": -8.156449317932129, "global_step": 53376, "epoch": 317} {"train_loss": -8.540639877319336, "global_step": 53377, "epoch": 317} {"train_loss": -8.31373405456543, "global_step": 53378, "epoch": 317} {"train_loss": -8.407478332519531, "global_step": 53379, "epoch": 317} {"train_loss": -8.251483917236328, "global_step": 53380, "epoch": 317} {"train_loss": -8.402793884277344, "global_step": 53381, "epoch": 317} {"train_loss": -8.367584228515625, "global_step": 53382, "epoch": 317} {"train_loss": -8.361566543579102, "global_step": 53383, "epoch": 317} {"train_loss": -8.434350967407227, "global_step": 53384, "epoch": 317} {"train_loss": -8.562231063842773, "global_step": 53385, "epoch": 317} {"train_loss": -8.38733196258545, "global_step": 53386, "epoch": 317} {"train_loss": -8.261791229248047, "global_step": 53387, "epoch": 317} {"train_loss": -8.78348445892334, "global_step": 53388, "epoch": 317} {"train_loss": -8.570161819458008, "global_step": 53389, "epoch": 317} {"train_loss": -8.79243278503418, "global_step": 53390, "epoch": 317} {"train_loss": -8.423259735107422, "global_step": 53391, "epoch": 317} {"train_loss": -8.516836166381836, "global_step": 53392, "epoch": 317} {"train_loss": -8.579959869384766, "global_step": 53393, "epoch": 317} {"train_loss": -8.352714538574219, "global_step": 53394, "epoch": 317} {"train_loss": -8.542327880859375, "global_step": 53395, "epoch": 317} {"train_loss": -8.563610076904297, "global_step": 53396, "epoch": 317} {"train_loss": -8.600973129272461, "global_step": 53397, "epoch": 317} {"train_loss": -8.484699249267578, "global_step": 53398, "epoch": 317} {"train_loss": -8.75535774230957, "global_step": 53399, "epoch": 317} {"train_loss": -8.423731803894043, "global_step": 53400, "epoch": 317} {"train_loss": -8.418025970458984, "global_step": 53401, "epoch": 317} {"train_loss": -8.622962951660156, "global_step": 53402, "epoch": 317} {"train_loss": -8.506542205810547, "global_step": 53403, "epoch": 317} {"train_loss": -8.405885696411133, "global_step": 53404, "epoch": 317} {"train_loss": -8.58092212677002, "global_step": 53405, "epoch": 317} {"train_loss": -8.395030975341797, "global_step": 53406, "epoch": 317} {"train_loss": -8.461421966552734, "global_step": 53407, "epoch": 317} {"train_loss": -8.661836624145508, "global_step": 53408, "epoch": 317} {"train_loss": -8.594999313354492, "global_step": 53409, "epoch": 317} {"train_loss": -8.727975845336914, "global_step": 53410, "epoch": 317} {"train_loss": -8.520959854125977, "global_step": 53411, "epoch": 317} {"train_loss": -8.533380508422852, "global_step": 53412, "epoch": 317} {"train_loss": -8.56652545928955, "global_step": 53413, "epoch": 317} {"train_loss": -8.714338302612305, "global_step": 53414, "epoch": 317} {"train_loss": -8.683235168457031, "global_step": 53415, "epoch": 317} {"train_loss": -8.694246292114258, "global_step": 53416, "epoch": 317} {"train_loss": -8.720664024353027, "global_step": 53417, "epoch": 317} {"train_loss": -8.812498092651367, "global_step": 53418, "epoch": 317} {"train_loss": -8.757306098937988, "global_step": 53419, "epoch": 317} {"train_loss": -8.475934982299805, "global_step": 53420, "epoch": 317} {"train_loss": -8.618167877197266, "global_step": 53421, "epoch": 317} {"train_loss": -8.560674667358398, "global_step": 53422, "epoch": 317} {"train_loss": -8.48107009274619, "global_step": 53423, "epoch": 317, "val_loss": 186389.6875} {"train_loss": -8.280252456665039, "global_step": 53424, "epoch": 318} {"train_loss": -8.315292358398438, "global_step": 53425, "epoch": 318} {"train_loss": -8.298946380615234, "global_step": 53426, "epoch": 318} {"train_loss": -8.379396438598633, "global_step": 53427, "epoch": 318} {"train_loss": -8.37242317199707, "global_step": 53428, "epoch": 318} {"train_loss": -8.471345901489258, "global_step": 53429, "epoch": 318} {"train_loss": -8.535858154296875, "global_step": 53430, "epoch": 318} {"train_loss": -8.63221549987793, "global_step": 53431, "epoch": 318} {"train_loss": -8.413389205932617, "global_step": 53432, "epoch": 318} {"train_loss": -8.553274154663086, "global_step": 53433, "epoch": 318} {"train_loss": -8.377212524414062, "global_step": 53434, "epoch": 318} {"train_loss": -8.22695255279541, "global_step": 53435, "epoch": 318} {"train_loss": -8.213423728942871, "global_step": 53436, "epoch": 318} {"train_loss": -8.462425231933594, "global_step": 53437, "epoch": 318} {"train_loss": -8.348474502563477, "global_step": 53438, "epoch": 318} {"train_loss": -8.349355697631836, "global_step": 53439, "epoch": 318} {"train_loss": -7.929689884185791, "global_step": 53440, "epoch": 318} {"train_loss": -8.161316871643066, "global_step": 53441, "epoch": 318} {"train_loss": -8.285994529724121, "global_step": 53442, "epoch": 318} {"train_loss": -8.373076438903809, "global_step": 53443, "epoch": 318} {"train_loss": -8.273688316345215, "global_step": 53444, "epoch": 318} {"train_loss": -8.454026222229004, "global_step": 53445, "epoch": 318} {"train_loss": -8.449191093444824, "global_step": 53446, "epoch": 318} {"train_loss": -8.266319274902344, "global_step": 53447, "epoch": 318} {"train_loss": -8.53719711303711, "global_step": 53448, "epoch": 318} {"train_loss": -8.594616889953613, "global_step": 53449, "epoch": 318} {"train_loss": -8.605047225952148, "global_step": 53450, "epoch": 318} {"train_loss": -8.327096939086914, "global_step": 53451, "epoch": 318} {"train_loss": -8.357131004333496, "global_step": 53452, "epoch": 318} {"train_loss": -8.419437408447266, "global_step": 53453, "epoch": 318} {"train_loss": -8.667487144470215, "global_step": 53454, "epoch": 318} {"train_loss": -8.452913284301758, "global_step": 53455, "epoch": 318} {"train_loss": -8.503067970275879, "global_step": 53456, "epoch": 318} {"train_loss": -8.508674621582031, "global_step": 53457, "epoch": 318} {"train_loss": -8.482229232788086, "global_step": 53458, "epoch": 318} {"train_loss": -8.420199394226074, "global_step": 53459, "epoch": 318} {"train_loss": -8.349929809570312, "global_step": 53460, "epoch": 318} {"train_loss": -8.35063362121582, "global_step": 53461, "epoch": 318} {"train_loss": -8.398026466369629, "global_step": 53462, "epoch": 318} {"train_loss": -8.450376510620117, "global_step": 53463, "epoch": 318} {"train_loss": -8.545669555664062, "global_step": 53464, "epoch": 318} {"train_loss": -8.425558090209961, "global_step": 53465, "epoch": 318} {"train_loss": -8.331929206848145, "global_step": 53466, "epoch": 318} {"train_loss": -8.36384105682373, "global_step": 53467, "epoch": 318} {"train_loss": -8.608558654785156, "global_step": 53468, "epoch": 318} {"train_loss": -8.481351852416992, "global_step": 53469, "epoch": 318} {"train_loss": -8.30378532409668, "global_step": 53470, "epoch": 318} {"train_loss": -8.799459457397461, "global_step": 53471, "epoch": 318} {"train_loss": -8.474763870239258, "global_step": 53472, "epoch": 318} {"train_loss": -8.345455169677734, "global_step": 53473, "epoch": 318} {"train_loss": -8.636932373046875, "global_step": 53474, "epoch": 318} {"train_loss": -8.557826042175293, "global_step": 53475, "epoch": 318} {"train_loss": -8.469705581665039, "global_step": 53476, "epoch": 318} {"train_loss": -8.856135368347168, "global_step": 53477, "epoch": 318} {"train_loss": -8.266677856445312, "global_step": 53478, "epoch": 318} {"train_loss": -8.42668628692627, "global_step": 53479, "epoch": 318} {"train_loss": -8.522850036621094, "global_step": 53480, "epoch": 318} {"train_loss": -8.502320289611816, "global_step": 53481, "epoch": 318} {"train_loss": -8.716841697692871, "global_step": 53482, "epoch": 318} {"train_loss": -8.434228897094727, "global_step": 53483, "epoch": 318} {"train_loss": -8.476297378540039, "global_step": 53484, "epoch": 318} {"train_loss": -8.651535987854004, "global_step": 53485, "epoch": 318} {"train_loss": -8.657684326171875, "global_step": 53486, "epoch": 318} {"train_loss": -8.49660587310791, "global_step": 53487, "epoch": 318} {"train_loss": -8.634796142578125, "global_step": 53488, "epoch": 318} {"train_loss": -8.575373649597168, "global_step": 53489, "epoch": 318} {"train_loss": -8.596601486206055, "global_step": 53490, "epoch": 318} {"train_loss": -8.4957857131958, "global_step": 53491, "epoch": 318} {"train_loss": -8.405336380004883, "global_step": 53492, "epoch": 318} {"train_loss": -8.707106590270996, "global_step": 53493, "epoch": 318} {"train_loss": -8.433211326599121, "global_step": 53494, "epoch": 318} {"train_loss": -8.72358512878418, "global_step": 53495, "epoch": 318} {"train_loss": -8.519933700561523, "global_step": 53496, "epoch": 318} {"train_loss": -8.363422393798828, "global_step": 53497, "epoch": 318} {"train_loss": -8.704197883605957, "global_step": 53498, "epoch": 318} {"train_loss": -8.692157745361328, "global_step": 53499, "epoch": 318} {"train_loss": -8.400463104248047, "global_step": 53500, "epoch": 318} {"train_loss": -8.192415237426758, "global_step": 53501, "epoch": 318} {"train_loss": -8.500146865844727, "global_step": 53502, "epoch": 318} {"train_loss": -8.2308349609375, "global_step": 53503, "epoch": 318} {"train_loss": -8.590522766113281, "global_step": 53504, "epoch": 318} {"train_loss": -8.370574951171875, "global_step": 53505, "epoch": 318} {"train_loss": -8.608277320861816, "global_step": 53506, "epoch": 318} {"train_loss": -8.489919662475586, "global_step": 53507, "epoch": 318} {"train_loss": -8.589248657226562, "global_step": 53508, "epoch": 318} {"train_loss": -8.565895080566406, "global_step": 53509, "epoch": 318} {"train_loss": -8.448640823364258, "global_step": 53510, "epoch": 318} {"train_loss": -8.506942749023438, "global_step": 53511, "epoch": 318} {"train_loss": -8.361638069152832, "global_step": 53512, "epoch": 318} {"train_loss": -8.686574935913086, "global_step": 53513, "epoch": 318} {"train_loss": -8.50558853149414, "global_step": 53514, "epoch": 318} {"train_loss": -8.450225830078125, "global_step": 53515, "epoch": 318} {"train_loss": -8.43415355682373, "global_step": 53516, "epoch": 318} {"train_loss": -8.764764785766602, "global_step": 53517, "epoch": 318} {"train_loss": -8.515816688537598, "global_step": 53518, "epoch": 318} {"train_loss": -8.605749130249023, "global_step": 53519, "epoch": 318} {"train_loss": -8.727892875671387, "global_step": 53520, "epoch": 318} {"train_loss": -8.510393142700195, "global_step": 53521, "epoch": 318} {"train_loss": -8.441110610961914, "global_step": 53522, "epoch": 318} {"train_loss": -8.521535873413086, "global_step": 53523, "epoch": 318} {"train_loss": -8.436399459838867, "global_step": 53524, "epoch": 318} {"train_loss": -8.632161140441895, "global_step": 53525, "epoch": 318} {"train_loss": -8.644355773925781, "global_step": 53526, "epoch": 318} {"train_loss": -8.581361770629883, "global_step": 53527, "epoch": 318} {"train_loss": -8.378019332885742, "global_step": 53528, "epoch": 318} {"train_loss": -8.669820785522461, "global_step": 53529, "epoch": 318} {"train_loss": -8.688613891601562, "global_step": 53530, "epoch": 318} {"train_loss": -8.530838966369629, "global_step": 53531, "epoch": 318} {"train_loss": -8.535196304321289, "global_step": 53532, "epoch": 318} {"train_loss": -8.52914047241211, "global_step": 53533, "epoch": 318} {"train_loss": -8.206610679626465, "global_step": 53534, "epoch": 318} {"train_loss": -8.351402282714844, "global_step": 53535, "epoch": 318} {"train_loss": -8.223027229309082, "global_step": 53536, "epoch": 318} {"train_loss": -8.430110931396484, "global_step": 53537, "epoch": 318} {"train_loss": -8.439001083374023, "global_step": 53538, "epoch": 318} {"train_loss": -8.340205192565918, "global_step": 53539, "epoch": 318} {"train_loss": -8.349559783935547, "global_step": 53540, "epoch": 318} {"train_loss": -8.256658554077148, "global_step": 53541, "epoch": 318} {"train_loss": -8.316417694091797, "global_step": 53542, "epoch": 318} {"train_loss": -8.209186553955078, "global_step": 53543, "epoch": 318} {"train_loss": -8.248271942138672, "global_step": 53544, "epoch": 318} {"train_loss": -8.535057067871094, "global_step": 53545, "epoch": 318} {"train_loss": -8.255975723266602, "global_step": 53546, "epoch": 318} {"train_loss": -8.101547241210938, "global_step": 53547, "epoch": 318} {"train_loss": -8.31259536743164, "global_step": 53548, "epoch": 318} {"train_loss": -8.44295883178711, "global_step": 53549, "epoch": 318} {"train_loss": -8.117743492126465, "global_step": 53550, "epoch": 318} {"train_loss": -8.23163890838623, "global_step": 53551, "epoch": 318} {"train_loss": -8.360881805419922, "global_step": 53552, "epoch": 318} {"train_loss": -7.801616668701172, "global_step": 53553, "epoch": 318} {"train_loss": -8.313878059387207, "global_step": 53554, "epoch": 318} {"train_loss": -8.333343505859375, "global_step": 53555, "epoch": 318} {"train_loss": -8.429841995239258, "global_step": 53556, "epoch": 318} {"train_loss": -8.031839370727539, "global_step": 53557, "epoch": 318} {"train_loss": -8.353744506835938, "global_step": 53558, "epoch": 318} {"train_loss": -8.36659049987793, "global_step": 53559, "epoch": 318} {"train_loss": -8.328662872314453, "global_step": 53560, "epoch": 318} {"train_loss": -8.22730827331543, "global_step": 53561, "epoch": 318} {"train_loss": -8.228257179260254, "global_step": 53562, "epoch": 318} {"train_loss": -8.110654830932617, "global_step": 53563, "epoch": 318} {"train_loss": -8.380292892456055, "global_step": 53564, "epoch": 318} {"train_loss": -8.470780372619629, "global_step": 53565, "epoch": 318} {"train_loss": -8.308923721313477, "global_step": 53566, "epoch": 318} {"train_loss": -8.577080726623535, "global_step": 53567, "epoch": 318} {"train_loss": -8.477896690368652, "global_step": 53568, "epoch": 318} {"train_loss": -8.371488571166992, "global_step": 53569, "epoch": 318} {"train_loss": -8.635782241821289, "global_step": 53570, "epoch": 318} {"train_loss": -8.589799880981445, "global_step": 53571, "epoch": 318} {"train_loss": -8.440221786499023, "global_step": 53572, "epoch": 318} {"train_loss": -8.558243751525879, "global_step": 53573, "epoch": 318} {"train_loss": -8.46160888671875, "global_step": 53574, "epoch": 318} {"train_loss": -8.342066764831543, "global_step": 53575, "epoch": 318} {"train_loss": -8.553372383117676, "global_step": 53576, "epoch": 318} {"train_loss": -8.676300048828125, "global_step": 53577, "epoch": 318} {"train_loss": -8.354394912719727, "global_step": 53578, "epoch": 318} {"train_loss": -8.351261138916016, "global_step": 53579, "epoch": 318} {"train_loss": -8.661253929138184, "global_step": 53580, "epoch": 318} {"train_loss": -8.607830047607422, "global_step": 53581, "epoch": 318} {"train_loss": -8.526623725891113, "global_step": 53582, "epoch": 318} {"train_loss": -8.172307014465332, "global_step": 53583, "epoch": 318} {"train_loss": -8.505298614501953, "global_step": 53584, "epoch": 318} {"train_loss": -8.411725997924805, "global_step": 53585, "epoch": 318} {"train_loss": -8.441900253295898, "global_step": 53586, "epoch": 318} {"train_loss": -8.379598617553711, "global_step": 53587, "epoch": 318} {"train_loss": -8.525922775268555, "global_step": 53588, "epoch": 318} {"train_loss": -8.231273651123047, "global_step": 53589, "epoch": 318} {"train_loss": -8.498100280761719, "global_step": 53590, "epoch": 318} {"train_loss": -8.437418208235787, "global_step": 53591, "epoch": 318, "val_loss": 188428.703125} {"train_loss": -8.619243621826172, "global_step": 53592, "epoch": 319} {"train_loss": -8.67867660522461, "global_step": 53593, "epoch": 319} {"train_loss": -8.291675567626953, "global_step": 53594, "epoch": 319} {"train_loss": -8.274471282958984, "global_step": 53595, "epoch": 319} {"train_loss": -8.329671859741211, "global_step": 53596, "epoch": 319} {"train_loss": -8.436219215393066, "global_step": 53597, "epoch": 319} {"train_loss": -8.271453857421875, "global_step": 53598, "epoch": 319} {"train_loss": -8.26917552947998, "global_step": 53599, "epoch": 319} {"train_loss": -8.08703327178955, "global_step": 53600, "epoch": 319} {"train_loss": -8.06416130065918, "global_step": 53601, "epoch": 319} {"train_loss": -8.59902572631836, "global_step": 53602, "epoch": 319} {"train_loss": -8.241731643676758, "global_step": 53603, "epoch": 319} {"train_loss": -8.089936256408691, "global_step": 53604, "epoch": 319} {"train_loss": -8.105049133300781, "global_step": 53605, "epoch": 319} {"train_loss": -8.255258560180664, "global_step": 53606, "epoch": 319} {"train_loss": -8.32455062866211, "global_step": 53607, "epoch": 319} {"train_loss": -8.333858489990234, "global_step": 53608, "epoch": 319} {"train_loss": -8.325457572937012, "global_step": 53609, "epoch": 319} {"train_loss": -8.253204345703125, "global_step": 53610, "epoch": 319} {"train_loss": -8.331991195678711, "global_step": 53611, "epoch": 319} {"train_loss": -8.555795669555664, "global_step": 53612, "epoch": 319} {"train_loss": -8.564410209655762, "global_step": 53613, "epoch": 319} {"train_loss": -8.597673416137695, "global_step": 53614, "epoch": 319} {"train_loss": -8.281776428222656, "global_step": 53615, "epoch": 319} {"train_loss": -8.290634155273438, "global_step": 53616, "epoch": 319} {"train_loss": -8.506149291992188, "global_step": 53617, "epoch": 319} {"train_loss": -8.388075828552246, "global_step": 53618, "epoch": 319} {"train_loss": -8.141817092895508, "global_step": 53619, "epoch": 319} {"train_loss": -8.476747512817383, "global_step": 53620, "epoch": 319} {"train_loss": -8.4277925491333, "global_step": 53621, "epoch": 319} {"train_loss": -8.257148742675781, "global_step": 53622, "epoch": 319} {"train_loss": -8.510782241821289, "global_step": 53623, "epoch": 319} {"train_loss": -8.576380729675293, "global_step": 53624, "epoch": 319} {"train_loss": -8.330034255981445, "global_step": 53625, "epoch": 319} {"train_loss": -8.62153434753418, "global_step": 53626, "epoch": 319} {"train_loss": -8.674606323242188, "global_step": 53627, "epoch": 319} {"train_loss": -8.151411056518555, "global_step": 53628, "epoch": 319} {"train_loss": -8.479822158813477, "global_step": 53629, "epoch": 319} {"train_loss": -8.60635757446289, "global_step": 53630, "epoch": 319} {"train_loss": -8.424150466918945, "global_step": 53631, "epoch": 319} {"train_loss": -8.450265884399414, "global_step": 53632, "epoch": 319} {"train_loss": -8.323566436767578, "global_step": 53633, "epoch": 319} {"train_loss": -8.361895561218262, "global_step": 53634, "epoch": 319} {"train_loss": -8.298505783081055, "global_step": 53635, "epoch": 319} {"train_loss": -8.188005447387695, "global_step": 53636, "epoch": 319} {"train_loss": -8.591028213500977, "global_step": 53637, "epoch": 319} {"train_loss": -8.198887825012207, "global_step": 53638, "epoch": 319} {"train_loss": -8.269997596740723, "global_step": 53639, "epoch": 319} {"train_loss": -8.43946647644043, "global_step": 53640, "epoch": 319} {"train_loss": -8.103775024414062, "global_step": 53641, "epoch": 319} {"train_loss": -8.099992752075195, "global_step": 53642, "epoch": 319} {"train_loss": -8.257049560546875, "global_step": 53643, "epoch": 319} {"train_loss": -8.213751792907715, "global_step": 53644, "epoch": 319} {"train_loss": -8.584786415100098, "global_step": 53645, "epoch": 319} {"train_loss": -8.332418441772461, "global_step": 53646, "epoch": 319} {"train_loss": -8.38585090637207, "global_step": 53647, "epoch": 319} {"train_loss": -8.36509895324707, "global_step": 53648, "epoch": 319} {"train_loss": -8.334176063537598, "global_step": 53649, "epoch": 319} {"train_loss": -8.255550384521484, "global_step": 53650, "epoch": 319} {"train_loss": -8.420906066894531, "global_step": 53651, "epoch": 319} {"train_loss": -8.59330940246582, "global_step": 53652, "epoch": 319} {"train_loss": -8.444501876831055, "global_step": 53653, "epoch": 319} {"train_loss": -8.56729507446289, "global_step": 53654, "epoch": 319} {"train_loss": -8.532317161560059, "global_step": 53655, "epoch": 319} {"train_loss": -8.34350299835205, "global_step": 53656, "epoch": 319} {"train_loss": -8.539618492126465, "global_step": 53657, "epoch": 319} {"train_loss": -8.703500747680664, "global_step": 53658, "epoch": 319} {"train_loss": -8.48200798034668, "global_step": 53659, "epoch": 319} {"train_loss": -8.54723072052002, "global_step": 53660, "epoch": 319} {"train_loss": -8.651525497436523, "global_step": 53661, "epoch": 319} {"train_loss": -8.633386611938477, "global_step": 53662, "epoch": 319} {"train_loss": -8.622917175292969, "global_step": 53663, "epoch": 319} {"train_loss": -8.482171058654785, "global_step": 53664, "epoch": 319} {"train_loss": -8.518433570861816, "global_step": 53665, "epoch": 319} {"train_loss": -8.538825035095215, "global_step": 53666, "epoch": 319} {"train_loss": -8.647315979003906, "global_step": 53667, "epoch": 319} {"train_loss": -8.801040649414062, "global_step": 53668, "epoch": 319} {"train_loss": -8.575408935546875, "global_step": 53669, "epoch": 319} {"train_loss": -8.68635368347168, "global_step": 53670, "epoch": 319} {"train_loss": -8.632522583007812, "global_step": 53671, "epoch": 319} {"train_loss": -8.588120460510254, "global_step": 53672, "epoch": 319} {"train_loss": -8.511576652526855, "global_step": 53673, "epoch": 319} {"train_loss": -8.41010856628418, "global_step": 53674, "epoch": 319} {"train_loss": -8.726970672607422, "global_step": 53675, "epoch": 319} {"train_loss": -8.540227890014648, "global_step": 53676, "epoch": 319} {"train_loss": -8.60264778137207, "global_step": 53677, "epoch": 319} {"train_loss": -8.607462882995605, "global_step": 53678, "epoch": 319} {"train_loss": -8.604938507080078, "global_step": 53679, "epoch": 319} {"train_loss": -8.729214668273926, "global_step": 53680, "epoch": 319} {"train_loss": -8.520156860351562, "global_step": 53681, "epoch": 319} {"train_loss": -8.388395309448242, "global_step": 53682, "epoch": 319} {"train_loss": -8.510637283325195, "global_step": 53683, "epoch": 319} {"train_loss": -8.410691261291504, "global_step": 53684, "epoch": 319} {"train_loss": -8.414840698242188, "global_step": 53685, "epoch": 319} {"train_loss": -8.434701919555664, "global_step": 53686, "epoch": 319} {"train_loss": -8.438222885131836, "global_step": 53687, "epoch": 319} {"train_loss": -8.18805980682373, "global_step": 53688, "epoch": 319} {"train_loss": -8.408647537231445, "global_step": 53689, "epoch": 319} {"train_loss": -8.151583671569824, "global_step": 53690, "epoch": 319} {"train_loss": -8.639986038208008, "global_step": 53691, "epoch": 319} {"train_loss": -8.190048217773438, "global_step": 53692, "epoch": 319} {"train_loss": -8.5062255859375, "global_step": 53693, "epoch": 319} {"train_loss": -8.396785736083984, "global_step": 53694, "epoch": 319} {"train_loss": -8.193232536315918, "global_step": 53695, "epoch": 319} {"train_loss": -8.182903289794922, "global_step": 53696, "epoch": 319} {"train_loss": -8.21853256225586, "global_step": 53697, "epoch": 319} {"train_loss": -8.457674980163574, "global_step": 53698, "epoch": 319} {"train_loss": -8.215930938720703, "global_step": 53699, "epoch": 319} {"train_loss": -8.313325881958008, "global_step": 53700, "epoch": 319} {"train_loss": -8.16727066040039, "global_step": 53701, "epoch": 319} {"train_loss": -8.37784194946289, "global_step": 53702, "epoch": 319} {"train_loss": -8.149831771850586, "global_step": 53703, "epoch": 319} {"train_loss": -8.208248138427734, "global_step": 53704, "epoch": 319} {"train_loss": -8.473033905029297, "global_step": 53705, "epoch": 319} {"train_loss": -8.349987983703613, "global_step": 53706, "epoch": 319} {"train_loss": -8.391813278198242, "global_step": 53707, "epoch": 319} {"train_loss": -8.344362258911133, "global_step": 53708, "epoch": 319} {"train_loss": -8.318328857421875, "global_step": 53709, "epoch": 319} {"train_loss": -8.14909839630127, "global_step": 53710, "epoch": 319} {"train_loss": -8.47922134399414, "global_step": 53711, "epoch": 319} {"train_loss": -8.483835220336914, "global_step": 53712, "epoch": 319} {"train_loss": -8.324981689453125, "global_step": 53713, "epoch": 319} {"train_loss": -8.337554931640625, "global_step": 53714, "epoch": 319} {"train_loss": -8.416277885437012, "global_step": 53715, "epoch": 319} {"train_loss": -8.32278060913086, "global_step": 53716, "epoch": 319} {"train_loss": -8.407086372375488, "global_step": 53717, "epoch": 319} {"train_loss": -8.323653221130371, "global_step": 53718, "epoch": 319} {"train_loss": -8.398784637451172, "global_step": 53719, "epoch": 319} {"train_loss": -8.26423454284668, "global_step": 53720, "epoch": 319} {"train_loss": -8.650537490844727, "global_step": 53721, "epoch": 319} {"train_loss": -8.488468170166016, "global_step": 53722, "epoch": 319} {"train_loss": -8.411948204040527, "global_step": 53723, "epoch": 319} {"train_loss": -8.414491653442383, "global_step": 53724, "epoch": 319} {"train_loss": -8.531601905822754, "global_step": 53725, "epoch": 319} {"train_loss": -8.508052825927734, "global_step": 53726, "epoch": 319} {"train_loss": -8.501152038574219, "global_step": 53727, "epoch": 319} {"train_loss": -8.320474624633789, "global_step": 53728, "epoch": 319} {"train_loss": -8.41010856628418, "global_step": 53729, "epoch": 319} {"train_loss": -8.748781204223633, "global_step": 53730, "epoch": 319} {"train_loss": -8.420482635498047, "global_step": 53731, "epoch": 319} {"train_loss": -8.741743087768555, "global_step": 53732, "epoch": 319} {"train_loss": -8.460214614868164, "global_step": 53733, "epoch": 319} {"train_loss": -8.354843139648438, "global_step": 53734, "epoch": 319} {"train_loss": -8.663824081420898, "global_step": 53735, "epoch": 319} {"train_loss": -8.47786808013916, "global_step": 53736, "epoch": 319} {"train_loss": -8.453853607177734, "global_step": 53737, "epoch": 319} {"train_loss": -8.574024200439453, "global_step": 53738, "epoch": 319} {"train_loss": -8.621139526367188, "global_step": 53739, "epoch": 319} {"train_loss": -8.413995742797852, "global_step": 53740, "epoch": 319} {"train_loss": -8.693277359008789, "global_step": 53741, "epoch": 319} {"train_loss": -8.635116577148438, "global_step": 53742, "epoch": 319} {"train_loss": -8.47474479675293, "global_step": 53743, "epoch": 319} {"train_loss": -8.226390838623047, "global_step": 53744, "epoch": 319} {"train_loss": -8.610769271850586, "global_step": 53745, "epoch": 319} {"train_loss": -8.299139022827148, "global_step": 53746, "epoch": 319} {"train_loss": -8.38909912109375, "global_step": 53747, "epoch": 319} {"train_loss": -8.316431045532227, "global_step": 53748, "epoch": 319} {"train_loss": -8.310218811035156, "global_step": 53749, "epoch": 319} {"train_loss": -8.47645378112793, "global_step": 53750, "epoch": 319} {"train_loss": -8.702408790588379, "global_step": 53751, "epoch": 319} {"train_loss": -8.383194923400879, "global_step": 53752, "epoch": 319} {"train_loss": -8.376991271972656, "global_step": 53753, "epoch": 319} {"train_loss": -8.52091121673584, "global_step": 53754, "epoch": 319} {"train_loss": -8.233890533447266, "global_step": 53755, "epoch": 319} {"train_loss": -8.223957061767578, "global_step": 53756, "epoch": 319} {"train_loss": -8.165205955505371, "global_step": 53757, "epoch": 319} {"train_loss": -8.267671585083008, "global_step": 53758, "epoch": 319} {"train_loss": -8.415851990381876, "global_step": 53759, "epoch": 319, "val_loss": 185254.78125} {"train_loss": -8.29964828491211, "global_step": 53760, "epoch": 320} {"train_loss": -8.380660057067871, "global_step": 53761, "epoch": 320} {"train_loss": -8.15011215209961, "global_step": 53762, "epoch": 320} {"train_loss": -8.330338478088379, "global_step": 53763, "epoch": 320} {"train_loss": -8.326925277709961, "global_step": 53764, "epoch": 320} {"train_loss": -8.274471282958984, "global_step": 53765, "epoch": 320} {"train_loss": -8.353331565856934, "global_step": 53766, "epoch": 320} {"train_loss": -8.33112907409668, "global_step": 53767, "epoch": 320} {"train_loss": -8.402885437011719, "global_step": 53768, "epoch": 320} {"train_loss": -8.245172500610352, "global_step": 53769, "epoch": 320} {"train_loss": -8.337621688842773, "global_step": 53770, "epoch": 320} {"train_loss": -8.621124267578125, "global_step": 53771, "epoch": 320} {"train_loss": -8.480870246887207, "global_step": 53772, "epoch": 320} {"train_loss": -8.788469314575195, "global_step": 53773, "epoch": 320} {"train_loss": -8.513869285583496, "global_step": 53774, "epoch": 320} {"train_loss": -8.322074890136719, "global_step": 53775, "epoch": 320} {"train_loss": -8.395376205444336, "global_step": 53776, "epoch": 320} {"train_loss": -8.265804290771484, "global_step": 53777, "epoch": 320} {"train_loss": -8.397453308105469, "global_step": 53778, "epoch": 320} {"train_loss": -8.292237281799316, "global_step": 53779, "epoch": 320} {"train_loss": -8.515632629394531, "global_step": 53780, "epoch": 320} {"train_loss": -8.121633529663086, "global_step": 53781, "epoch": 320} {"train_loss": -8.564674377441406, "global_step": 53782, "epoch": 320} {"train_loss": -8.294034957885742, "global_step": 53783, "epoch": 320} {"train_loss": -8.637741088867188, "global_step": 53784, "epoch": 320} {"train_loss": -8.053096771240234, "global_step": 53785, "epoch": 320} {"train_loss": -8.373428344726562, "global_step": 53786, "epoch": 320} {"train_loss": -8.24599552154541, "global_step": 53787, "epoch": 320} {"train_loss": -8.442758560180664, "global_step": 53788, "epoch": 320} {"train_loss": -8.384132385253906, "global_step": 53789, "epoch": 320} {"train_loss": -8.49968147277832, "global_step": 53790, "epoch": 320} {"train_loss": -8.66423225402832, "global_step": 53791, "epoch": 320} {"train_loss": -8.53965950012207, "global_step": 53792, "epoch": 320} {"train_loss": -8.243636131286621, "global_step": 53793, "epoch": 320} {"train_loss": -8.413979530334473, "global_step": 53794, "epoch": 320} {"train_loss": -8.482666969299316, "global_step": 53795, "epoch": 320} {"train_loss": -8.419855117797852, "global_step": 53796, "epoch": 320} {"train_loss": -8.284263610839844, "global_step": 53797, "epoch": 320} {"train_loss": -8.613122940063477, "global_step": 53798, "epoch": 320} {"train_loss": -8.123651504516602, "global_step": 53799, "epoch": 320} {"train_loss": -8.51222038269043, "global_step": 53800, "epoch": 320} {"train_loss": -8.398340225219727, "global_step": 53801, "epoch": 320} {"train_loss": -8.44601058959961, "global_step": 53802, "epoch": 320} {"train_loss": -8.29154109954834, "global_step": 53803, "epoch": 320} {"train_loss": -8.500442504882812, "global_step": 53804, "epoch": 320} {"train_loss": -8.314922332763672, "global_step": 53805, "epoch": 320} {"train_loss": -8.149604797363281, "global_step": 53806, "epoch": 320} {"train_loss": -8.388269424438477, "global_step": 53807, "epoch": 320} {"train_loss": -8.189413070678711, "global_step": 53808, "epoch": 320} {"train_loss": -8.319952964782715, "global_step": 53809, "epoch": 320} {"train_loss": -8.585952758789062, "global_step": 53810, "epoch": 320} {"train_loss": -8.548090934753418, "global_step": 53811, "epoch": 320} {"train_loss": -8.4475736618042, "global_step": 53812, "epoch": 320} {"train_loss": -8.46327018737793, "global_step": 53813, "epoch": 320} {"train_loss": -8.20523738861084, "global_step": 53814, "epoch": 320} {"train_loss": -8.562731742858887, "global_step": 53815, "epoch": 320} {"train_loss": -8.270454406738281, "global_step": 53816, "epoch": 320} {"train_loss": -8.590625762939453, "global_step": 53817, "epoch": 320} {"train_loss": -8.294134140014648, "global_step": 53818, "epoch": 320} {"train_loss": -8.643468856811523, "global_step": 53819, "epoch": 320} {"train_loss": -8.209555625915527, "global_step": 53820, "epoch": 320} {"train_loss": -8.479373931884766, "global_step": 53821, "epoch": 320} {"train_loss": -8.137117385864258, "global_step": 53822, "epoch": 320} {"train_loss": -8.443107604980469, "global_step": 53823, "epoch": 320} {"train_loss": -8.358522415161133, "global_step": 53824, "epoch": 320} {"train_loss": -8.452759742736816, "global_step": 53825, "epoch": 320} {"train_loss": -8.304201126098633, "global_step": 53826, "epoch": 320} {"train_loss": -8.537528991699219, "global_step": 53827, "epoch": 320} {"train_loss": -8.50053882598877, "global_step": 53828, "epoch": 320} {"train_loss": -8.397872924804688, "global_step": 53829, "epoch": 320} {"train_loss": -8.606293678283691, "global_step": 53830, "epoch": 320} {"train_loss": -8.469861030578613, "global_step": 53831, "epoch": 320} {"train_loss": -8.339656829833984, "global_step": 53832, "epoch": 320} {"train_loss": -8.564790725708008, "global_step": 53833, "epoch": 320} {"train_loss": -8.285655975341797, "global_step": 53834, "epoch": 320} {"train_loss": -8.51539134979248, "global_step": 53835, "epoch": 320} {"train_loss": -8.666857719421387, "global_step": 53836, "epoch": 320} {"train_loss": -8.428646087646484, "global_step": 53837, "epoch": 320} {"train_loss": -8.402215957641602, "global_step": 53838, "epoch": 320} {"train_loss": -8.496304512023926, "global_step": 53839, "epoch": 320} {"train_loss": -8.547660827636719, "global_step": 53840, "epoch": 320} {"train_loss": -8.499134063720703, "global_step": 53841, "epoch": 320} {"train_loss": -8.329971313476562, "global_step": 53842, "epoch": 320} {"train_loss": -8.52595329284668, "global_step": 53843, "epoch": 320} {"train_loss": -8.413162231445312, "global_step": 53844, "epoch": 320} {"train_loss": -8.53674030303955, "global_step": 53845, "epoch": 320} {"train_loss": -8.457269668579102, "global_step": 53846, "epoch": 320} {"train_loss": -8.505623817443848, "global_step": 53847, "epoch": 320} {"train_loss": -8.48995590209961, "global_step": 53848, "epoch": 320} {"train_loss": -8.465428352355957, "global_step": 53849, "epoch": 320} {"train_loss": -8.499629974365234, "global_step": 53850, "epoch": 320} {"train_loss": -8.411067962646484, "global_step": 53851, "epoch": 320} {"train_loss": -8.403599739074707, "global_step": 53852, "epoch": 320} {"train_loss": -8.675220489501953, "global_step": 53853, "epoch": 320} {"train_loss": -8.258848190307617, "global_step": 53854, "epoch": 320} {"train_loss": -8.542778968811035, "global_step": 53855, "epoch": 320} {"train_loss": -8.354974746704102, "global_step": 53856, "epoch": 320} {"train_loss": -8.289093017578125, "global_step": 53857, "epoch": 320} {"train_loss": -8.209892272949219, "global_step": 53858, "epoch": 320} {"train_loss": -8.463034629821777, "global_step": 53859, "epoch": 320} {"train_loss": -8.441156387329102, "global_step": 53860, "epoch": 320} {"train_loss": -8.377408981323242, "global_step": 53861, "epoch": 320} {"train_loss": -8.422253608703613, "global_step": 53862, "epoch": 320} {"train_loss": -8.395402908325195, "global_step": 53863, "epoch": 320} {"train_loss": -8.476194381713867, "global_step": 53864, "epoch": 320} {"train_loss": -8.6058988571167, "global_step": 53865, "epoch": 320} {"train_loss": -8.421756744384766, "global_step": 53866, "epoch": 320} {"train_loss": -8.382080078125, "global_step": 53867, "epoch": 320} {"train_loss": -8.433883666992188, "global_step": 53868, "epoch": 320} {"train_loss": -8.750097274780273, "global_step": 53869, "epoch": 320} {"train_loss": -8.38521671295166, "global_step": 53870, "epoch": 320} {"train_loss": -8.438339233398438, "global_step": 53871, "epoch": 320} {"train_loss": -8.255448341369629, "global_step": 53872, "epoch": 320} {"train_loss": -8.615911483764648, "global_step": 53873, "epoch": 320} {"train_loss": -8.277891159057617, "global_step": 53874, "epoch": 320} {"train_loss": -8.456833839416504, "global_step": 53875, "epoch": 320} {"train_loss": -8.667158126831055, "global_step": 53876, "epoch": 320} {"train_loss": -8.55026912689209, "global_step": 53877, "epoch": 320} {"train_loss": -8.609121322631836, "global_step": 53878, "epoch": 320} {"train_loss": -8.244476318359375, "global_step": 53879, "epoch": 320} {"train_loss": -8.582536697387695, "global_step": 53880, "epoch": 320} {"train_loss": -8.699399948120117, "global_step": 53881, "epoch": 320} {"train_loss": -8.52877426147461, "global_step": 53882, "epoch": 320} {"train_loss": -8.391942977905273, "global_step": 53883, "epoch": 320} {"train_loss": -8.841296195983887, "global_step": 53884, "epoch": 320} {"train_loss": -8.553964614868164, "global_step": 53885, "epoch": 320} {"train_loss": -8.598808288574219, "global_step": 53886, "epoch": 320} {"train_loss": -8.629791259765625, "global_step": 53887, "epoch": 320} {"train_loss": -8.616545677185059, "global_step": 53888, "epoch": 320} {"train_loss": -8.42182445526123, "global_step": 53889, "epoch": 320} {"train_loss": -8.589143753051758, "global_step": 53890, "epoch": 320} {"train_loss": -8.253353118896484, "global_step": 53891, "epoch": 320} {"train_loss": -8.51332950592041, "global_step": 53892, "epoch": 320} {"train_loss": -8.560674667358398, "global_step": 53893, "epoch": 320} {"train_loss": -8.173225402832031, "global_step": 53894, "epoch": 320} {"train_loss": -8.51369571685791, "global_step": 53895, "epoch": 320} {"train_loss": -8.281196594238281, "global_step": 53896, "epoch": 320} {"train_loss": -8.291658401489258, "global_step": 53897, "epoch": 320} {"train_loss": -8.117456436157227, "global_step": 53898, "epoch": 320} {"train_loss": -8.435479164123535, "global_step": 53899, "epoch": 320} {"train_loss": -8.065135955810547, "global_step": 53900, "epoch": 320} {"train_loss": -8.366925239562988, "global_step": 53901, "epoch": 320} {"train_loss": -8.195667266845703, "global_step": 53902, "epoch": 320} {"train_loss": -8.319998741149902, "global_step": 53903, "epoch": 320} {"train_loss": -7.881050109863281, "global_step": 53904, "epoch": 320} {"train_loss": -8.284259796142578, "global_step": 53905, "epoch": 320} {"train_loss": -8.22706127166748, "global_step": 53906, "epoch": 320} {"train_loss": -8.172382354736328, "global_step": 53907, "epoch": 320} {"train_loss": -8.043837547302246, "global_step": 53908, "epoch": 320} {"train_loss": -8.315878868103027, "global_step": 53909, "epoch": 320} {"train_loss": -8.084732055664062, "global_step": 53910, "epoch": 320} {"train_loss": -8.144012451171875, "global_step": 53911, "epoch": 320} {"train_loss": -8.172229766845703, "global_step": 53912, "epoch": 320} {"train_loss": -8.046529769897461, "global_step": 53913, "epoch": 320} {"train_loss": -8.185430526733398, "global_step": 53914, "epoch": 320} {"train_loss": -7.89968204498291, "global_step": 53915, "epoch": 320} {"train_loss": -8.244314193725586, "global_step": 53916, "epoch": 320} {"train_loss": -8.13833999633789, "global_step": 53917, "epoch": 320} {"train_loss": -8.218345642089844, "global_step": 53918, "epoch": 320} {"train_loss": -8.31463623046875, "global_step": 53919, "epoch": 320} {"train_loss": -8.226411819458008, "global_step": 53920, "epoch": 320} {"train_loss": -8.395898818969727, "global_step": 53921, "epoch": 320} {"train_loss": -8.266697883605957, "global_step": 53922, "epoch": 320} {"train_loss": -8.178228378295898, "global_step": 53923, "epoch": 320} {"train_loss": -8.30531120300293, "global_step": 53924, "epoch": 320} {"train_loss": -8.3153076171875, "global_step": 53925, "epoch": 320} {"train_loss": -8.31690502166748, "global_step": 53926, "epoch": 320} {"train_loss": -8.390324240639096, "global_step": 53927, "epoch": 320, "val_loss": 189934.609375, "train_action_mse_error": 7.802302360534668} {"train_loss": -8.460702896118164, "global_step": 53928, "epoch": 321} {"train_loss": -8.419075012207031, "global_step": 53929, "epoch": 321} {"train_loss": -8.323265075683594, "global_step": 53930, "epoch": 321} {"train_loss": -8.442541122436523, "global_step": 53931, "epoch": 321} {"train_loss": -8.510602951049805, "global_step": 53932, "epoch": 321} {"train_loss": -8.505255699157715, "global_step": 53933, "epoch": 321} {"train_loss": -8.504806518554688, "global_step": 53934, "epoch": 321} {"train_loss": -8.322802543640137, "global_step": 53935, "epoch": 321} {"train_loss": -8.453137397766113, "global_step": 53936, "epoch": 321} {"train_loss": -8.42026138305664, "global_step": 53937, "epoch": 321} {"train_loss": -8.233360290527344, "global_step": 53938, "epoch": 321} {"train_loss": -8.424625396728516, "global_step": 53939, "epoch": 321} {"train_loss": -8.491498947143555, "global_step": 53940, "epoch": 321} {"train_loss": -8.218616485595703, "global_step": 53941, "epoch": 321} {"train_loss": -8.271244049072266, "global_step": 53942, "epoch": 321} {"train_loss": -8.177331924438477, "global_step": 53943, "epoch": 321} {"train_loss": -8.268298149108887, "global_step": 53944, "epoch": 321} {"train_loss": -8.341147422790527, "global_step": 53945, "epoch": 321} {"train_loss": -8.475545883178711, "global_step": 53946, "epoch": 321} {"train_loss": -8.650246620178223, "global_step": 53947, "epoch": 321} {"train_loss": -8.586860656738281, "global_step": 53948, "epoch": 321} {"train_loss": -8.553071022033691, "global_step": 53949, "epoch": 321} {"train_loss": -8.644723892211914, "global_step": 53950, "epoch": 321} {"train_loss": -8.420097351074219, "global_step": 53951, "epoch": 321} {"train_loss": -8.524306297302246, "global_step": 53952, "epoch": 321} {"train_loss": -8.609041213989258, "global_step": 53953, "epoch": 321} {"train_loss": -8.552506446838379, "global_step": 53954, "epoch": 321} {"train_loss": -8.325984954833984, "global_step": 53955, "epoch": 321} {"train_loss": -8.409614562988281, "global_step": 53956, "epoch": 321} {"train_loss": -8.031646728515625, "global_step": 53957, "epoch": 321} {"train_loss": -8.403812408447266, "global_step": 53958, "epoch": 321} {"train_loss": -8.268299102783203, "global_step": 53959, "epoch": 321} {"train_loss": -8.353948593139648, "global_step": 53960, "epoch": 321} {"train_loss": -8.391647338867188, "global_step": 53961, "epoch": 321} {"train_loss": -8.626753807067871, "global_step": 53962, "epoch": 321} {"train_loss": -8.348173141479492, "global_step": 53963, "epoch": 321} {"train_loss": -8.541099548339844, "global_step": 53964, "epoch": 321} {"train_loss": -8.56231689453125, "global_step": 53965, "epoch": 321} {"train_loss": -8.558815956115723, "global_step": 53966, "epoch": 321} {"train_loss": -8.486452102661133, "global_step": 53967, "epoch": 321} {"train_loss": -8.716523170471191, "global_step": 53968, "epoch": 321} {"train_loss": -8.708118438720703, "global_step": 53969, "epoch": 321} {"train_loss": -8.58150863647461, "global_step": 53970, "epoch": 321} {"train_loss": -8.760164260864258, "global_step": 53971, "epoch": 321} {"train_loss": -8.636348724365234, "global_step": 53972, "epoch": 321} {"train_loss": -8.58826732635498, "global_step": 53973, "epoch": 321} {"train_loss": -8.576908111572266, "global_step": 53974, "epoch": 321} {"train_loss": -8.581659317016602, "global_step": 53975, "epoch": 321} {"train_loss": -8.530250549316406, "global_step": 53976, "epoch": 321} {"train_loss": -8.666987419128418, "global_step": 53977, "epoch": 321} {"train_loss": -8.635488510131836, "global_step": 53978, "epoch": 321} {"train_loss": -8.859410285949707, "global_step": 53979, "epoch": 321} {"train_loss": -8.720502853393555, "global_step": 53980, "epoch": 321} {"train_loss": -8.315075874328613, "global_step": 53981, "epoch": 321} {"train_loss": -8.770679473876953, "global_step": 53982, "epoch": 321} {"train_loss": -8.416596412658691, "global_step": 53983, "epoch": 321} {"train_loss": -8.384007453918457, "global_step": 53984, "epoch": 321} {"train_loss": -8.594871520996094, "global_step": 53985, "epoch": 321} {"train_loss": -8.69070816040039, "global_step": 53986, "epoch": 321} {"train_loss": -8.163566589355469, "global_step": 53987, "epoch": 321} {"train_loss": -8.620855331420898, "global_step": 53988, "epoch": 321} {"train_loss": -7.957798957824707, "global_step": 53989, "epoch": 321} {"train_loss": -8.557354927062988, "global_step": 53990, "epoch": 321} {"train_loss": -8.152889251708984, "global_step": 53991, "epoch": 321} {"train_loss": -8.304481506347656, "global_step": 53992, "epoch": 321} {"train_loss": -8.420101165771484, "global_step": 53993, "epoch": 321} {"train_loss": -8.392663955688477, "global_step": 53994, "epoch": 321} {"train_loss": -8.3699369430542, "global_step": 53995, "epoch": 321} {"train_loss": -8.605368614196777, "global_step": 53996, "epoch": 321} {"train_loss": -8.677070617675781, "global_step": 53997, "epoch": 321} {"train_loss": -7.974052429199219, "global_step": 53998, "epoch": 321} {"train_loss": -8.263656616210938, "global_step": 53999, "epoch": 321} {"train_loss": -8.331462860107422, "global_step": 54000, "epoch": 321} {"train_loss": -8.298267364501953, "global_step": 54001, "epoch": 321} {"train_loss": -8.337255477905273, "global_step": 54002, "epoch": 321} {"train_loss": -8.491962432861328, "global_step": 54003, "epoch": 321} {"train_loss": -8.423480033874512, "global_step": 54004, "epoch": 321} {"train_loss": -8.401298522949219, "global_step": 54005, "epoch": 321} {"train_loss": -8.18233871459961, "global_step": 54006, "epoch": 321} {"train_loss": -8.39498233795166, "global_step": 54007, "epoch": 321} {"train_loss": -8.286840438842773, "global_step": 54008, "epoch": 321} {"train_loss": -8.292196273803711, "global_step": 54009, "epoch": 321} {"train_loss": -8.35189151763916, "global_step": 54010, "epoch": 321} {"train_loss": -8.415130615234375, "global_step": 54011, "epoch": 321} {"train_loss": -8.447964668273926, "global_step": 54012, "epoch": 321} {"train_loss": -8.527931213378906, "global_step": 54013, "epoch": 321} {"train_loss": -8.586793899536133, "global_step": 54014, "epoch": 321} {"train_loss": -8.291170120239258, "global_step": 54015, "epoch": 321} {"train_loss": -8.57046127319336, "global_step": 54016, "epoch": 321} {"train_loss": -8.534747123718262, "global_step": 54017, "epoch": 321} {"train_loss": -8.201762199401855, "global_step": 54018, "epoch": 321} {"train_loss": -8.564433097839355, "global_step": 54019, "epoch": 321} {"train_loss": -8.58806324005127, "global_step": 54020, "epoch": 321} {"train_loss": -8.510631561279297, "global_step": 54021, "epoch": 321} {"train_loss": -8.524423599243164, "global_step": 54022, "epoch": 321} {"train_loss": -8.486396789550781, "global_step": 54023, "epoch": 321} {"train_loss": -8.342557907104492, "global_step": 54024, "epoch": 321} {"train_loss": -8.633933067321777, "global_step": 54025, "epoch": 321} {"train_loss": -8.489211082458496, "global_step": 54026, "epoch": 321} {"train_loss": -8.564018249511719, "global_step": 54027, "epoch": 321} {"train_loss": -8.63533878326416, "global_step": 54028, "epoch": 321} {"train_loss": -8.252706527709961, "global_step": 54029, "epoch": 321} {"train_loss": -8.294139862060547, "global_step": 54030, "epoch": 321} {"train_loss": -8.648591041564941, "global_step": 54031, "epoch": 321} {"train_loss": -8.37444019317627, "global_step": 54032, "epoch": 321} {"train_loss": -8.634668350219727, "global_step": 54033, "epoch": 321} {"train_loss": -8.583815574645996, "global_step": 54034, "epoch": 321} {"train_loss": -8.626190185546875, "global_step": 54035, "epoch": 321} {"train_loss": -8.692927360534668, "global_step": 54036, "epoch": 321} {"train_loss": -8.550411224365234, "global_step": 54037, "epoch": 321} {"train_loss": -8.193655014038086, "global_step": 54038, "epoch": 321} {"train_loss": -8.52787971496582, "global_step": 54039, "epoch": 321} {"train_loss": -8.596464157104492, "global_step": 54040, "epoch": 321} {"train_loss": -8.598670959472656, "global_step": 54041, "epoch": 321} {"train_loss": -8.517169952392578, "global_step": 54042, "epoch": 321} {"train_loss": -8.767364501953125, "global_step": 54043, "epoch": 321} {"train_loss": -8.54448127746582, "global_step": 54044, "epoch": 321} {"train_loss": -8.472508430480957, "global_step": 54045, "epoch": 321} {"train_loss": -8.675033569335938, "global_step": 54046, "epoch": 321} {"train_loss": -8.535109519958496, "global_step": 54047, "epoch": 321} {"train_loss": -8.215553283691406, "global_step": 54048, "epoch": 321} {"train_loss": -8.554033279418945, "global_step": 54049, "epoch": 321} {"train_loss": -8.545942306518555, "global_step": 54050, "epoch": 321} {"train_loss": -8.46402359008789, "global_step": 54051, "epoch": 321} {"train_loss": -8.236135482788086, "global_step": 54052, "epoch": 321} {"train_loss": -8.54281234741211, "global_step": 54053, "epoch": 321} {"train_loss": -8.323463439941406, "global_step": 54054, "epoch": 321} {"train_loss": -8.371026992797852, "global_step": 54055, "epoch": 321} {"train_loss": -8.364676475524902, "global_step": 54056, "epoch": 321} {"train_loss": -8.62039566040039, "global_step": 54057, "epoch": 321} {"train_loss": -8.273796081542969, "global_step": 54058, "epoch": 321} {"train_loss": -8.347800254821777, "global_step": 54059, "epoch": 321} {"train_loss": -8.32988166809082, "global_step": 54060, "epoch": 321} {"train_loss": -8.102607727050781, "global_step": 54061, "epoch": 321} {"train_loss": -8.144660949707031, "global_step": 54062, "epoch": 321} {"train_loss": -8.332473754882812, "global_step": 54063, "epoch": 321} {"train_loss": -8.164926528930664, "global_step": 54064, "epoch": 321} {"train_loss": -8.061161041259766, "global_step": 54065, "epoch": 321} {"train_loss": -8.187990188598633, "global_step": 54066, "epoch": 321} {"train_loss": -8.214489936828613, "global_step": 54067, "epoch": 321} {"train_loss": -8.132303237915039, "global_step": 54068, "epoch": 321} {"train_loss": -8.127379417419434, "global_step": 54069, "epoch": 321} {"train_loss": -8.53443717956543, "global_step": 54070, "epoch": 321} {"train_loss": -8.220010757446289, "global_step": 54071, "epoch": 321} {"train_loss": -8.253173828125, "global_step": 54072, "epoch": 321} {"train_loss": -8.346393585205078, "global_step": 54073, "epoch": 321} {"train_loss": -8.213881492614746, "global_step": 54074, "epoch": 321} {"train_loss": -8.37044620513916, "global_step": 54075, "epoch": 321} {"train_loss": -8.361915588378906, "global_step": 54076, "epoch": 321} {"train_loss": -8.443685531616211, "global_step": 54077, "epoch": 321} {"train_loss": -8.369823455810547, "global_step": 54078, "epoch": 321} {"train_loss": -8.317647933959961, "global_step": 54079, "epoch": 321} {"train_loss": -8.18334674835205, "global_step": 54080, "epoch": 321} {"train_loss": -8.495538711547852, "global_step": 54081, "epoch": 321} {"train_loss": -8.349072456359863, "global_step": 54082, "epoch": 321} {"train_loss": -8.356027603149414, "global_step": 54083, "epoch": 321} {"train_loss": -8.611329078674316, "global_step": 54084, "epoch": 321} {"train_loss": -8.657218933105469, "global_step": 54085, "epoch": 321} {"train_loss": -8.579565048217773, "global_step": 54086, "epoch": 321} {"train_loss": -8.380928039550781, "global_step": 54087, "epoch": 321} {"train_loss": -8.513324737548828, "global_step": 54088, "epoch": 321} {"train_loss": -8.764955520629883, "global_step": 54089, "epoch": 321} {"train_loss": -8.316612243652344, "global_step": 54090, "epoch": 321} {"train_loss": -8.710718154907227, "global_step": 54091, "epoch": 321} {"train_loss": -8.693988800048828, "global_step": 54092, "epoch": 321} {"train_loss": -8.593855857849121, "global_step": 54093, "epoch": 321} {"train_loss": -8.67416763305664, "global_step": 54094, "epoch": 321} {"train_loss": -8.444611799149286, "global_step": 54095, "epoch": 321, "val_loss": 188320.421875} {"train_loss": -8.607686042785645, "global_step": 54096, "epoch": 322} {"train_loss": -8.714881896972656, "global_step": 54097, "epoch": 322} {"train_loss": -8.5333890914917, "global_step": 54098, "epoch": 322} {"train_loss": -8.550790786743164, "global_step": 54099, "epoch": 322} {"train_loss": -8.451972961425781, "global_step": 54100, "epoch": 322} {"train_loss": -8.642919540405273, "global_step": 54101, "epoch": 322} {"train_loss": -8.656982421875, "global_step": 54102, "epoch": 322} {"train_loss": -8.422332763671875, "global_step": 54103, "epoch": 322} {"train_loss": -8.208684921264648, "global_step": 54104, "epoch": 322} {"train_loss": -8.614228248596191, "global_step": 54105, "epoch": 322} {"train_loss": -8.316553115844727, "global_step": 54106, "epoch": 322} {"train_loss": -8.498069763183594, "global_step": 54107, "epoch": 322} {"train_loss": -8.437986373901367, "global_step": 54108, "epoch": 322} {"train_loss": -8.413032531738281, "global_step": 54109, "epoch": 322} {"train_loss": -8.361554145812988, "global_step": 54110, "epoch": 322} {"train_loss": -8.566421508789062, "global_step": 54111, "epoch": 322} {"train_loss": -8.574201583862305, "global_step": 54112, "epoch": 322} {"train_loss": -8.547402381896973, "global_step": 54113, "epoch": 322} {"train_loss": -8.52700424194336, "global_step": 54114, "epoch": 322} {"train_loss": -8.150936126708984, "global_step": 54115, "epoch": 322} {"train_loss": -8.199125289916992, "global_step": 54116, "epoch": 322} {"train_loss": -8.395971298217773, "global_step": 54117, "epoch": 322} {"train_loss": -8.23901081085205, "global_step": 54118, "epoch": 322} {"train_loss": -8.41514778137207, "global_step": 54119, "epoch": 322} {"train_loss": -8.085657119750977, "global_step": 54120, "epoch": 322} {"train_loss": -8.507560729980469, "global_step": 54121, "epoch": 322} {"train_loss": -8.465620994567871, "global_step": 54122, "epoch": 322} {"train_loss": -8.103706359863281, "global_step": 54123, "epoch": 322} {"train_loss": -8.58841323852539, "global_step": 54124, "epoch": 322} {"train_loss": -8.577699661254883, "global_step": 54125, "epoch": 322} {"train_loss": -8.660040855407715, "global_step": 54126, "epoch": 322} {"train_loss": -8.526514053344727, "global_step": 54127, "epoch": 322} {"train_loss": -8.658873558044434, "global_step": 54128, "epoch": 322} {"train_loss": -8.581171035766602, "global_step": 54129, "epoch": 322} {"train_loss": -8.538169860839844, "global_step": 54130, "epoch": 322} {"train_loss": -8.670989990234375, "global_step": 54131, "epoch": 322} {"train_loss": -8.290614128112793, "global_step": 54132, "epoch": 322} {"train_loss": -8.571155548095703, "global_step": 54133, "epoch": 322} {"train_loss": -8.586585998535156, "global_step": 54134, "epoch": 322} {"train_loss": -8.627233505249023, "global_step": 54135, "epoch": 322} {"train_loss": -8.736495971679688, "global_step": 54136, "epoch": 322} {"train_loss": -8.647701263427734, "global_step": 54137, "epoch": 322} {"train_loss": -8.529376983642578, "global_step": 54138, "epoch": 322} {"train_loss": -8.458614349365234, "global_step": 54139, "epoch": 322} {"train_loss": -8.254262924194336, "global_step": 54140, "epoch": 322} {"train_loss": -8.614564895629883, "global_step": 54141, "epoch": 322} {"train_loss": -8.662055969238281, "global_step": 54142, "epoch": 322} {"train_loss": -8.713860511779785, "global_step": 54143, "epoch": 322} {"train_loss": -8.458356857299805, "global_step": 54144, "epoch": 322} {"train_loss": -8.15591049194336, "global_step": 54145, "epoch": 322} {"train_loss": -8.31916618347168, "global_step": 54146, "epoch": 322} {"train_loss": -8.388824462890625, "global_step": 54147, "epoch": 322} {"train_loss": -8.362462997436523, "global_step": 54148, "epoch": 322} {"train_loss": -8.27299690246582, "global_step": 54149, "epoch": 322} {"train_loss": -8.326509475708008, "global_step": 54150, "epoch": 322} {"train_loss": -8.402660369873047, "global_step": 54151, "epoch": 322} {"train_loss": -8.170708656311035, "global_step": 54152, "epoch": 322} {"train_loss": -8.287176132202148, "global_step": 54153, "epoch": 322} {"train_loss": -8.34808349609375, "global_step": 54154, "epoch": 322} {"train_loss": -8.191722869873047, "global_step": 54155, "epoch": 322} {"train_loss": -8.412235260009766, "global_step": 54156, "epoch": 322} {"train_loss": -8.381759643554688, "global_step": 54157, "epoch": 322} {"train_loss": -8.52906608581543, "global_step": 54158, "epoch": 322} {"train_loss": -8.48793888092041, "global_step": 54159, "epoch": 322} {"train_loss": -8.201133728027344, "global_step": 54160, "epoch": 322} {"train_loss": -8.614546775817871, "global_step": 54161, "epoch": 322} {"train_loss": -8.5442476272583, "global_step": 54162, "epoch": 322} {"train_loss": -8.55543327331543, "global_step": 54163, "epoch": 322} {"train_loss": -8.607806205749512, "global_step": 54164, "epoch": 322} {"train_loss": -8.682799339294434, "global_step": 54165, "epoch": 322} {"train_loss": -8.410930633544922, "global_step": 54166, "epoch": 322} {"train_loss": -8.469748497009277, "global_step": 54167, "epoch": 322} {"train_loss": -8.287872314453125, "global_step": 54168, "epoch": 322} {"train_loss": -8.559328079223633, "global_step": 54169, "epoch": 322} {"train_loss": -8.276308059692383, "global_step": 54170, "epoch": 322} {"train_loss": -8.456457138061523, "global_step": 54171, "epoch": 322} {"train_loss": -8.626020431518555, "global_step": 54172, "epoch": 322} {"train_loss": -8.550081253051758, "global_step": 54173, "epoch": 322} {"train_loss": -8.249104499816895, "global_step": 54174, "epoch": 322} {"train_loss": -8.475664138793945, "global_step": 54175, "epoch": 322} {"train_loss": -8.43522834777832, "global_step": 54176, "epoch": 322} {"train_loss": -8.017923355102539, "global_step": 54177, "epoch": 322} {"train_loss": -8.232847213745117, "global_step": 54178, "epoch": 322} {"train_loss": -8.36403751373291, "global_step": 54179, "epoch": 322} {"train_loss": -8.358466148376465, "global_step": 54180, "epoch": 322} {"train_loss": -8.587837219238281, "global_step": 54181, "epoch": 322} {"train_loss": -8.195127487182617, "global_step": 54182, "epoch": 322} {"train_loss": -8.340648651123047, "global_step": 54183, "epoch": 322} {"train_loss": -8.12700366973877, "global_step": 54184, "epoch": 322} {"train_loss": -8.533341407775879, "global_step": 54185, "epoch": 322} {"train_loss": -8.4547758102417, "global_step": 54186, "epoch": 322} {"train_loss": -8.404409408569336, "global_step": 54187, "epoch": 322} {"train_loss": -8.347521781921387, "global_step": 54188, "epoch": 322} {"train_loss": -8.563044548034668, "global_step": 54189, "epoch": 322} {"train_loss": -8.458950996398926, "global_step": 54190, "epoch": 322} {"train_loss": -8.327845573425293, "global_step": 54191, "epoch": 322} {"train_loss": -8.388825416564941, "global_step": 54192, "epoch": 322} {"train_loss": -8.435449600219727, "global_step": 54193, "epoch": 322} {"train_loss": -8.320962905883789, "global_step": 54194, "epoch": 322} {"train_loss": -8.310247421264648, "global_step": 54195, "epoch": 322} {"train_loss": -8.619010925292969, "global_step": 54196, "epoch": 322} {"train_loss": -8.194415092468262, "global_step": 54197, "epoch": 322} {"train_loss": -8.55030345916748, "global_step": 54198, "epoch": 322} {"train_loss": -8.019540786743164, "global_step": 54199, "epoch": 322} {"train_loss": -8.501388549804688, "global_step": 54200, "epoch": 322} {"train_loss": -8.299997329711914, "global_step": 54201, "epoch": 322} {"train_loss": -8.670814514160156, "global_step": 54202, "epoch": 322} {"train_loss": -8.377726554870605, "global_step": 54203, "epoch": 322} {"train_loss": -8.609214782714844, "global_step": 54204, "epoch": 322} {"train_loss": -8.267906188964844, "global_step": 54205, "epoch": 322} {"train_loss": -8.356523513793945, "global_step": 54206, "epoch": 322} {"train_loss": -8.385862350463867, "global_step": 54207, "epoch": 322} {"train_loss": -8.153162002563477, "global_step": 54208, "epoch": 322} {"train_loss": -8.195796966552734, "global_step": 54209, "epoch": 322} {"train_loss": -7.939687728881836, "global_step": 54210, "epoch": 322} {"train_loss": -7.802498817443848, "global_step": 54211, "epoch": 322} {"train_loss": -7.939150810241699, "global_step": 54212, "epoch": 322} {"train_loss": -8.061505317687988, "global_step": 54213, "epoch": 322} {"train_loss": -8.246026992797852, "global_step": 54214, "epoch": 322} {"train_loss": -8.230205535888672, "global_step": 54215, "epoch": 322} {"train_loss": -8.228486061096191, "global_step": 54216, "epoch": 322} {"train_loss": -8.271547317504883, "global_step": 54217, "epoch": 322} {"train_loss": -8.468099594116211, "global_step": 54218, "epoch": 322} {"train_loss": -8.309527397155762, "global_step": 54219, "epoch": 322} {"train_loss": -8.437129974365234, "global_step": 54220, "epoch": 322} {"train_loss": -8.33651351928711, "global_step": 54221, "epoch": 322} {"train_loss": -8.309513092041016, "global_step": 54222, "epoch": 322} {"train_loss": -8.509925842285156, "global_step": 54223, "epoch": 322} {"train_loss": -8.129554748535156, "global_step": 54224, "epoch": 322} {"train_loss": -8.560295104980469, "global_step": 54225, "epoch": 322} {"train_loss": -8.614113807678223, "global_step": 54226, "epoch": 322} {"train_loss": -8.480810165405273, "global_step": 54227, "epoch": 322} {"train_loss": -8.687243461608887, "global_step": 54228, "epoch": 322} {"train_loss": -8.503156661987305, "global_step": 54229, "epoch": 322} {"train_loss": -8.481308937072754, "global_step": 54230, "epoch": 322} {"train_loss": -8.557855606079102, "global_step": 54231, "epoch": 322} {"train_loss": -8.52535629272461, "global_step": 54232, "epoch": 322} {"train_loss": -8.432267189025879, "global_step": 54233, "epoch": 322} {"train_loss": -8.464678764343262, "global_step": 54234, "epoch": 322} {"train_loss": -8.687335968017578, "global_step": 54235, "epoch": 322} {"train_loss": -8.588111877441406, "global_step": 54236, "epoch": 322} {"train_loss": -8.574018478393555, "global_step": 54237, "epoch": 322} {"train_loss": -8.686386108398438, "global_step": 54238, "epoch": 322} {"train_loss": -8.67230224609375, "global_step": 54239, "epoch": 322} {"train_loss": -8.68179702758789, "global_step": 54240, "epoch": 322} {"train_loss": -8.375420570373535, "global_step": 54241, "epoch": 322} {"train_loss": -8.403676986694336, "global_step": 54242, "epoch": 322} {"train_loss": -8.623377799987793, "global_step": 54243, "epoch": 322} {"train_loss": -8.445802688598633, "global_step": 54244, "epoch": 322} {"train_loss": -8.463592529296875, "global_step": 54245, "epoch": 322} {"train_loss": -8.521533966064453, "global_step": 54246, "epoch": 322} {"train_loss": -8.245543479919434, "global_step": 54247, "epoch": 322} {"train_loss": -8.276214599609375, "global_step": 54248, "epoch": 322} {"train_loss": -8.36798095703125, "global_step": 54249, "epoch": 322} {"train_loss": -8.213088989257812, "global_step": 54250, "epoch": 322} {"train_loss": -8.46340560913086, "global_step": 54251, "epoch": 322} {"train_loss": -8.366275787353516, "global_step": 54252, "epoch": 322} {"train_loss": -8.561522483825684, "global_step": 54253, "epoch": 322} {"train_loss": -8.298466682434082, "global_step": 54254, "epoch": 322} {"train_loss": -8.573530197143555, "global_step": 54255, "epoch": 322} {"train_loss": -8.060384750366211, "global_step": 54256, "epoch": 322} {"train_loss": -8.321749687194824, "global_step": 54257, "epoch": 322} {"train_loss": -8.114110946655273, "global_step": 54258, "epoch": 322} {"train_loss": -8.279840469360352, "global_step": 54259, "epoch": 322} {"train_loss": -7.963254928588867, "global_step": 54260, "epoch": 322} {"train_loss": -8.36380386352539, "global_step": 54261, "epoch": 322} {"train_loss": -8.421652793884277, "global_step": 54262, "epoch": 322} {"train_loss": -8.41382228192829, "global_step": 54263, "epoch": 322, "val_loss": 190435.453125} {"train_loss": -8.614995956420898, "global_step": 54264, "epoch": 323} {"train_loss": -8.314912796020508, "global_step": 54265, "epoch": 323} {"train_loss": -8.10806655883789, "global_step": 54266, "epoch": 323} {"train_loss": -8.375450134277344, "global_step": 54267, "epoch": 323} {"train_loss": -8.297832489013672, "global_step": 54268, "epoch": 323} {"train_loss": -8.072282791137695, "global_step": 54269, "epoch": 323} {"train_loss": -8.456645965576172, "global_step": 54270, "epoch": 323} {"train_loss": -8.551834106445312, "global_step": 54271, "epoch": 323} {"train_loss": -8.368671417236328, "global_step": 54272, "epoch": 323} {"train_loss": -8.327985763549805, "global_step": 54273, "epoch": 323} {"train_loss": -8.469080924987793, "global_step": 54274, "epoch": 323} {"train_loss": -8.3402738571167, "global_step": 54275, "epoch": 323} {"train_loss": -8.349922180175781, "global_step": 54276, "epoch": 323} {"train_loss": -8.467166900634766, "global_step": 54277, "epoch": 323} {"train_loss": -8.567865371704102, "global_step": 54278, "epoch": 323} {"train_loss": -8.20306396484375, "global_step": 54279, "epoch": 323} {"train_loss": -8.541605949401855, "global_step": 54280, "epoch": 323} {"train_loss": -8.480016708374023, "global_step": 54281, "epoch": 323} {"train_loss": -8.360783576965332, "global_step": 54282, "epoch": 323} {"train_loss": -8.438302993774414, "global_step": 54283, "epoch": 323} {"train_loss": -8.424676895141602, "global_step": 54284, "epoch": 323} {"train_loss": -8.34376335144043, "global_step": 54285, "epoch": 323} {"train_loss": -8.432453155517578, "global_step": 54286, "epoch": 323} {"train_loss": -8.641862869262695, "global_step": 54287, "epoch": 323} {"train_loss": -8.676117897033691, "global_step": 54288, "epoch": 323} {"train_loss": -8.47265625, "global_step": 54289, "epoch": 323} {"train_loss": -8.335371971130371, "global_step": 54290, "epoch": 323} {"train_loss": -8.638874053955078, "global_step": 54291, "epoch": 323} {"train_loss": -8.394640922546387, "global_step": 54292, "epoch": 323} {"train_loss": -8.449918746948242, "global_step": 54293, "epoch": 323} {"train_loss": -8.443845748901367, "global_step": 54294, "epoch": 323} {"train_loss": -8.620797157287598, "global_step": 54295, "epoch": 323} {"train_loss": -8.504419326782227, "global_step": 54296, "epoch": 323} {"train_loss": -8.493743896484375, "global_step": 54297, "epoch": 323} {"train_loss": -8.493671417236328, "global_step": 54298, "epoch": 323} {"train_loss": -8.493257522583008, "global_step": 54299, "epoch": 323} {"train_loss": -8.597713470458984, "global_step": 54300, "epoch": 323} {"train_loss": -8.392822265625, "global_step": 54301, "epoch": 323} {"train_loss": -8.36050796508789, "global_step": 54302, "epoch": 323} {"train_loss": -8.405144691467285, "global_step": 54303, "epoch": 323} {"train_loss": -8.387228965759277, "global_step": 54304, "epoch": 323} {"train_loss": -8.606959342956543, "global_step": 54305, "epoch": 323} {"train_loss": -8.475117683410645, "global_step": 54306, "epoch": 323} {"train_loss": -8.360581398010254, "global_step": 54307, "epoch": 323} {"train_loss": -8.422906875610352, "global_step": 54308, "epoch": 323} {"train_loss": -8.40810775756836, "global_step": 54309, "epoch": 323} {"train_loss": -8.482975959777832, "global_step": 54310, "epoch": 323} {"train_loss": -8.670616149902344, "global_step": 54311, "epoch": 323} {"train_loss": -8.316275596618652, "global_step": 54312, "epoch": 323} {"train_loss": -8.29842758178711, "global_step": 54313, "epoch": 323} {"train_loss": -8.804588317871094, "global_step": 54314, "epoch": 323} {"train_loss": -8.438691139221191, "global_step": 54315, "epoch": 323} {"train_loss": -8.550460815429688, "global_step": 54316, "epoch": 323} {"train_loss": -8.423856735229492, "global_step": 54317, "epoch": 323} {"train_loss": -8.531428337097168, "global_step": 54318, "epoch": 323} {"train_loss": -8.471296310424805, "global_step": 54319, "epoch": 323} {"train_loss": -8.591975212097168, "global_step": 54320, "epoch": 323} {"train_loss": -8.5233793258667, "global_step": 54321, "epoch": 323} {"train_loss": -8.588123321533203, "global_step": 54322, "epoch": 323} {"train_loss": -8.396371841430664, "global_step": 54323, "epoch": 323} {"train_loss": -8.443370819091797, "global_step": 54324, "epoch": 323} {"train_loss": -8.595696449279785, "global_step": 54325, "epoch": 323} {"train_loss": -8.411922454833984, "global_step": 54326, "epoch": 323} {"train_loss": -8.799772262573242, "global_step": 54327, "epoch": 323} {"train_loss": -8.567363739013672, "global_step": 54328, "epoch": 323} {"train_loss": -8.514055252075195, "global_step": 54329, "epoch": 323} {"train_loss": -8.748878479003906, "global_step": 54330, "epoch": 323} {"train_loss": -8.612214088439941, "global_step": 54331, "epoch": 323} {"train_loss": -8.68557357788086, "global_step": 54332, "epoch": 323} {"train_loss": -8.64758586883545, "global_step": 54333, "epoch": 323} {"train_loss": -8.66530704498291, "global_step": 54334, "epoch": 323} {"train_loss": -8.648189544677734, "global_step": 54335, "epoch": 323} {"train_loss": -8.582236289978027, "global_step": 54336, "epoch": 323} {"train_loss": -8.576656341552734, "global_step": 54337, "epoch": 323} {"train_loss": -8.405031204223633, "global_step": 54338, "epoch": 323} {"train_loss": -8.450857162475586, "global_step": 54339, "epoch": 323} {"train_loss": -8.349542617797852, "global_step": 54340, "epoch": 323} {"train_loss": -8.584991455078125, "global_step": 54341, "epoch": 323} {"train_loss": -8.461454391479492, "global_step": 54342, "epoch": 323} {"train_loss": -8.413049697875977, "global_step": 54343, "epoch": 323} {"train_loss": -8.16861343383789, "global_step": 54344, "epoch": 323} {"train_loss": -8.355575561523438, "global_step": 54345, "epoch": 323} {"train_loss": -8.279134750366211, "global_step": 54346, "epoch": 323} {"train_loss": -7.936999797821045, "global_step": 54347, "epoch": 323} {"train_loss": -8.500268936157227, "global_step": 54348, "epoch": 323} {"train_loss": -7.841022968292236, "global_step": 54349, "epoch": 323} {"train_loss": -8.30860424041748, "global_step": 54350, "epoch": 323} {"train_loss": -8.082135200500488, "global_step": 54351, "epoch": 323} {"train_loss": -8.245500564575195, "global_step": 54352, "epoch": 323} {"train_loss": -8.151286125183105, "global_step": 54353, "epoch": 323} {"train_loss": -8.291295051574707, "global_step": 54354, "epoch": 323} {"train_loss": -8.33814811706543, "global_step": 54355, "epoch": 323} {"train_loss": -8.402454376220703, "global_step": 54356, "epoch": 323} {"train_loss": -8.267794609069824, "global_step": 54357, "epoch": 323} {"train_loss": -8.33914852142334, "global_step": 54358, "epoch": 323} {"train_loss": -8.294981002807617, "global_step": 54359, "epoch": 323} {"train_loss": -8.363434791564941, "global_step": 54360, "epoch": 323} {"train_loss": -8.414939880371094, "global_step": 54361, "epoch": 323} {"train_loss": -8.224803924560547, "global_step": 54362, "epoch": 323} {"train_loss": -8.160865783691406, "global_step": 54363, "epoch": 323} {"train_loss": -8.204587936401367, "global_step": 54364, "epoch": 323} {"train_loss": -8.48877239227295, "global_step": 54365, "epoch": 323} {"train_loss": -8.209953308105469, "global_step": 54366, "epoch": 323} {"train_loss": -8.42004680633545, "global_step": 54367, "epoch": 323} {"train_loss": -8.08363151550293, "global_step": 54368, "epoch": 323} {"train_loss": -8.489542007446289, "global_step": 54369, "epoch": 323} {"train_loss": -8.547822952270508, "global_step": 54370, "epoch": 323} {"train_loss": -8.181598663330078, "global_step": 54371, "epoch": 323} {"train_loss": -8.45962142944336, "global_step": 54372, "epoch": 323} {"train_loss": -8.349020004272461, "global_step": 54373, "epoch": 323} {"train_loss": -8.642951965332031, "global_step": 54374, "epoch": 323} {"train_loss": -8.16171932220459, "global_step": 54375, "epoch": 323} {"train_loss": -8.722583770751953, "global_step": 54376, "epoch": 323} {"train_loss": -8.487984657287598, "global_step": 54377, "epoch": 323} {"train_loss": -8.582015037536621, "global_step": 54378, "epoch": 323} {"train_loss": -8.23416519165039, "global_step": 54379, "epoch": 323} {"train_loss": -8.306585311889648, "global_step": 54380, "epoch": 323} {"train_loss": -8.531632423400879, "global_step": 54381, "epoch": 323} {"train_loss": -8.423257827758789, "global_step": 54382, "epoch": 323} {"train_loss": -8.529885292053223, "global_step": 54383, "epoch": 323} {"train_loss": -8.422844886779785, "global_step": 54384, "epoch": 323} {"train_loss": -8.422323226928711, "global_step": 54385, "epoch": 323} {"train_loss": -8.471593856811523, "global_step": 54386, "epoch": 323} {"train_loss": -8.583520889282227, "global_step": 54387, "epoch": 323} {"train_loss": -8.674028396606445, "global_step": 54388, "epoch": 323} {"train_loss": -8.38066291809082, "global_step": 54389, "epoch": 323} {"train_loss": -8.537849426269531, "global_step": 54390, "epoch": 323} {"train_loss": -8.468482971191406, "global_step": 54391, "epoch": 323} {"train_loss": -8.230279922485352, "global_step": 54392, "epoch": 323} {"train_loss": -8.524483680725098, "global_step": 54393, "epoch": 323} {"train_loss": -8.370644569396973, "global_step": 54394, "epoch": 323} {"train_loss": -8.271493911743164, "global_step": 54395, "epoch": 323} {"train_loss": -8.237707138061523, "global_step": 54396, "epoch": 323} {"train_loss": -8.373485565185547, "global_step": 54397, "epoch": 323} {"train_loss": -7.9900803565979, "global_step": 54398, "epoch": 323} {"train_loss": -8.495269775390625, "global_step": 54399, "epoch": 323} {"train_loss": -8.308483123779297, "global_step": 54400, "epoch": 323} {"train_loss": -8.282148361206055, "global_step": 54401, "epoch": 323} {"train_loss": -8.255266189575195, "global_step": 54402, "epoch": 323} {"train_loss": -8.3948974609375, "global_step": 54403, "epoch": 323} {"train_loss": -8.37032699584961, "global_step": 54404, "epoch": 323} {"train_loss": -8.449368476867676, "global_step": 54405, "epoch": 323} {"train_loss": -8.276162147521973, "global_step": 54406, "epoch": 323} {"train_loss": -8.040756225585938, "global_step": 54407, "epoch": 323} {"train_loss": -8.551898002624512, "global_step": 54408, "epoch": 323} {"train_loss": -8.403342247009277, "global_step": 54409, "epoch": 323} {"train_loss": -8.338112831115723, "global_step": 54410, "epoch": 323} {"train_loss": -8.52723503112793, "global_step": 54411, "epoch": 323} {"train_loss": -8.266805648803711, "global_step": 54412, "epoch": 323} {"train_loss": -8.398374557495117, "global_step": 54413, "epoch": 323} {"train_loss": -8.515588760375977, "global_step": 54414, "epoch": 323} {"train_loss": -8.46784782409668, "global_step": 54415, "epoch": 323} {"train_loss": -8.629070281982422, "global_step": 54416, "epoch": 323} {"train_loss": -8.4749116897583, "global_step": 54417, "epoch": 323} {"train_loss": -8.394858360290527, "global_step": 54418, "epoch": 323} {"train_loss": -8.343449592590332, "global_step": 54419, "epoch": 323} {"train_loss": -8.50944709777832, "global_step": 54420, "epoch": 323} {"train_loss": -8.412697792053223, "global_step": 54421, "epoch": 323} {"train_loss": -8.694442749023438, "global_step": 54422, "epoch": 323} {"train_loss": -8.546443939208984, "global_step": 54423, "epoch": 323} {"train_loss": -8.618220329284668, "global_step": 54424, "epoch": 323} {"train_loss": -8.483804702758789, "global_step": 54425, "epoch": 323} {"train_loss": -8.5123929977417, "global_step": 54426, "epoch": 323} {"train_loss": -8.202362060546875, "global_step": 54427, "epoch": 323} {"train_loss": -8.283658981323242, "global_step": 54428, "epoch": 323} {"train_loss": -8.234106063842773, "global_step": 54429, "epoch": 323} {"train_loss": -8.308792114257812, "global_step": 54430, "epoch": 323} {"train_loss": -8.417893812769936, "global_step": 54431, "epoch": 323, "val_loss": 188401.671875} {"train_loss": -8.17840576171875, "global_step": 54432, "epoch": 324} {"train_loss": -8.024115562438965, "global_step": 54433, "epoch": 324} {"train_loss": -8.23677921295166, "global_step": 54434, "epoch": 324} {"train_loss": -7.871265411376953, "global_step": 54435, "epoch": 324} {"train_loss": -8.132704734802246, "global_step": 54436, "epoch": 324} {"train_loss": -8.10258960723877, "global_step": 54437, "epoch": 324} {"train_loss": -8.292634963989258, "global_step": 54438, "epoch": 324} {"train_loss": -8.07792854309082, "global_step": 54439, "epoch": 324} {"train_loss": -8.057830810546875, "global_step": 54440, "epoch": 324} {"train_loss": -8.228546142578125, "global_step": 54441, "epoch": 324} {"train_loss": -8.290817260742188, "global_step": 54442, "epoch": 324} {"train_loss": -8.44043254852295, "global_step": 54443, "epoch": 324} {"train_loss": -8.393381118774414, "global_step": 54444, "epoch": 324} {"train_loss": -8.279565811157227, "global_step": 54445, "epoch": 324} {"train_loss": -8.439664840698242, "global_step": 54446, "epoch": 324} {"train_loss": -8.430700302124023, "global_step": 54447, "epoch": 324} {"train_loss": -8.466039657592773, "global_step": 54448, "epoch": 324} {"train_loss": -8.357355117797852, "global_step": 54449, "epoch": 324} {"train_loss": -8.283967018127441, "global_step": 54450, "epoch": 324} {"train_loss": -8.470358848571777, "global_step": 54451, "epoch": 324} {"train_loss": -8.506692886352539, "global_step": 54452, "epoch": 324} {"train_loss": -8.291964530944824, "global_step": 54453, "epoch": 324} {"train_loss": -8.528213500976562, "global_step": 54454, "epoch": 324} {"train_loss": -8.39472770690918, "global_step": 54455, "epoch": 324} {"train_loss": -8.31443977355957, "global_step": 54456, "epoch": 324} {"train_loss": -8.435945510864258, "global_step": 54457, "epoch": 324} {"train_loss": -8.213776588439941, "global_step": 54458, "epoch": 324} {"train_loss": -8.125894546508789, "global_step": 54459, "epoch": 324} {"train_loss": -8.14533805847168, "global_step": 54460, "epoch": 324} {"train_loss": -8.372008323669434, "global_step": 54461, "epoch": 324} {"train_loss": -8.324918746948242, "global_step": 54462, "epoch": 324} {"train_loss": -8.298683166503906, "global_step": 54463, "epoch": 324} {"train_loss": -8.206944465637207, "global_step": 54464, "epoch": 324} {"train_loss": -8.494853973388672, "global_step": 54465, "epoch": 324} {"train_loss": -8.279925346374512, "global_step": 54466, "epoch": 324} {"train_loss": -8.486135482788086, "global_step": 54467, "epoch": 324} {"train_loss": -8.4617919921875, "global_step": 54468, "epoch": 324} {"train_loss": -8.030370712280273, "global_step": 54469, "epoch": 324} {"train_loss": -8.532848358154297, "global_step": 54470, "epoch": 324} {"train_loss": -8.505041122436523, "global_step": 54471, "epoch": 324} {"train_loss": -8.507444381713867, "global_step": 54472, "epoch": 324} {"train_loss": -8.395830154418945, "global_step": 54473, "epoch": 324} {"train_loss": -8.531150817871094, "global_step": 54474, "epoch": 324} {"train_loss": -8.965726852416992, "global_step": 54475, "epoch": 324} {"train_loss": -8.475109100341797, "global_step": 54476, "epoch": 324} {"train_loss": -8.694120407104492, "global_step": 54477, "epoch": 324} {"train_loss": -8.498251914978027, "global_step": 54478, "epoch": 324} {"train_loss": -8.855772972106934, "global_step": 54479, "epoch": 324} {"train_loss": -8.494319915771484, "global_step": 54480, "epoch": 324} {"train_loss": -8.473567008972168, "global_step": 54481, "epoch": 324} {"train_loss": -8.78088092803955, "global_step": 54482, "epoch": 324} {"train_loss": -8.36586856842041, "global_step": 54483, "epoch": 324} {"train_loss": -8.672492980957031, "global_step": 54484, "epoch": 324} {"train_loss": -8.552501678466797, "global_step": 54485, "epoch": 324} {"train_loss": -8.627727508544922, "global_step": 54486, "epoch": 324} {"train_loss": -8.48027229309082, "global_step": 54487, "epoch": 324} {"train_loss": -8.437542915344238, "global_step": 54488, "epoch": 324} {"train_loss": -8.486997604370117, "global_step": 54489, "epoch": 324} {"train_loss": -8.259637832641602, "global_step": 54490, "epoch": 324} {"train_loss": -8.657134056091309, "global_step": 54491, "epoch": 324} {"train_loss": -8.287369728088379, "global_step": 54492, "epoch": 324} {"train_loss": -8.128676414489746, "global_step": 54493, "epoch": 324} {"train_loss": -8.552202224731445, "global_step": 54494, "epoch": 324} {"train_loss": -8.274641036987305, "global_step": 54495, "epoch": 324} {"train_loss": -8.372356414794922, "global_step": 54496, "epoch": 324} {"train_loss": -8.357847213745117, "global_step": 54497, "epoch": 324} {"train_loss": -8.491600036621094, "global_step": 54498, "epoch": 324} {"train_loss": -8.148735046386719, "global_step": 54499, "epoch": 324} {"train_loss": -8.666170120239258, "global_step": 54500, "epoch": 324} {"train_loss": -8.493423461914062, "global_step": 54501, "epoch": 324} {"train_loss": -8.628360748291016, "global_step": 54502, "epoch": 324} {"train_loss": -8.476284980773926, "global_step": 54503, "epoch": 324} {"train_loss": -8.554540634155273, "global_step": 54504, "epoch": 324} {"train_loss": -8.317401885986328, "global_step": 54505, "epoch": 324} {"train_loss": -8.623860359191895, "global_step": 54506, "epoch": 324} {"train_loss": -8.668102264404297, "global_step": 54507, "epoch": 324} {"train_loss": -8.474384307861328, "global_step": 54508, "epoch": 324} {"train_loss": -8.466619491577148, "global_step": 54509, "epoch": 324} {"train_loss": -8.621017456054688, "global_step": 54510, "epoch": 324} {"train_loss": -8.46695327758789, "global_step": 54511, "epoch": 324} {"train_loss": -8.631989479064941, "global_step": 54512, "epoch": 324} {"train_loss": -8.455458641052246, "global_step": 54513, "epoch": 324} {"train_loss": -8.340410232543945, "global_step": 54514, "epoch": 324} {"train_loss": -8.61319351196289, "global_step": 54515, "epoch": 324} {"train_loss": -8.318766593933105, "global_step": 54516, "epoch": 324} {"train_loss": -8.609333038330078, "global_step": 54517, "epoch": 324} {"train_loss": -8.306051254272461, "global_step": 54518, "epoch": 324} {"train_loss": -8.452232360839844, "global_step": 54519, "epoch": 324} {"train_loss": -8.658801078796387, "global_step": 54520, "epoch": 324} {"train_loss": -8.613489151000977, "global_step": 54521, "epoch": 324} {"train_loss": -8.532773971557617, "global_step": 54522, "epoch": 324} {"train_loss": -8.638835906982422, "global_step": 54523, "epoch": 324} {"train_loss": -8.537616729736328, "global_step": 54524, "epoch": 324} {"train_loss": -7.800606727600098, "global_step": 54525, "epoch": 324} {"train_loss": -8.5641450881958, "global_step": 54526, "epoch": 324} {"train_loss": -7.781827926635742, "global_step": 54527, "epoch": 324} {"train_loss": -8.43883991241455, "global_step": 54528, "epoch": 324} {"train_loss": -8.086576461791992, "global_step": 54529, "epoch": 324} {"train_loss": -8.547263145446777, "global_step": 54530, "epoch": 324} {"train_loss": -7.852685928344727, "global_step": 54531, "epoch": 324} {"train_loss": -8.501242637634277, "global_step": 54532, "epoch": 324} {"train_loss": -7.904864311218262, "global_step": 54533, "epoch": 324} {"train_loss": -8.395095825195312, "global_step": 54534, "epoch": 324} {"train_loss": -8.425477981567383, "global_step": 54535, "epoch": 324} {"train_loss": -8.253762245178223, "global_step": 54536, "epoch": 324} {"train_loss": -8.139263153076172, "global_step": 54537, "epoch": 324} {"train_loss": -8.397212028503418, "global_step": 54538, "epoch": 324} {"train_loss": -8.276209831237793, "global_step": 54539, "epoch": 324} {"train_loss": -8.422452926635742, "global_step": 54540, "epoch": 324} {"train_loss": -8.235204696655273, "global_step": 54541, "epoch": 324} {"train_loss": -8.318017959594727, "global_step": 54542, "epoch": 324} {"train_loss": -8.374336242675781, "global_step": 54543, "epoch": 324} {"train_loss": -8.432889938354492, "global_step": 54544, "epoch": 324} {"train_loss": -8.278385162353516, "global_step": 54545, "epoch": 324} {"train_loss": -8.263924598693848, "global_step": 54546, "epoch": 324} {"train_loss": -8.414656639099121, "global_step": 54547, "epoch": 324} {"train_loss": -8.282090187072754, "global_step": 54548, "epoch": 324} {"train_loss": -8.282146453857422, "global_step": 54549, "epoch": 324} {"train_loss": -8.400006294250488, "global_step": 54550, "epoch": 324} {"train_loss": -8.119815826416016, "global_step": 54551, "epoch": 324} {"train_loss": -8.206852912902832, "global_step": 54552, "epoch": 324} {"train_loss": -8.405433654785156, "global_step": 54553, "epoch": 324} {"train_loss": -8.382391929626465, "global_step": 54554, "epoch": 324} {"train_loss": -8.410140991210938, "global_step": 54555, "epoch": 324} {"train_loss": -8.170963287353516, "global_step": 54556, "epoch": 324} {"train_loss": -8.304370880126953, "global_step": 54557, "epoch": 324} {"train_loss": -8.54865550994873, "global_step": 54558, "epoch": 324} {"train_loss": -8.354736328125, "global_step": 54559, "epoch": 324} {"train_loss": -8.548032760620117, "global_step": 54560, "epoch": 324} {"train_loss": -8.545266151428223, "global_step": 54561, "epoch": 324} {"train_loss": -8.485334396362305, "global_step": 54562, "epoch": 324} {"train_loss": -8.388238906860352, "global_step": 54563, "epoch": 324} {"train_loss": -8.526240348815918, "global_step": 54564, "epoch": 324} {"train_loss": -8.73084831237793, "global_step": 54565, "epoch": 324} {"train_loss": -8.627246856689453, "global_step": 54566, "epoch": 324} {"train_loss": -8.385093688964844, "global_step": 54567, "epoch": 324} {"train_loss": -8.870896339416504, "global_step": 54568, "epoch": 324} {"train_loss": -8.445671081542969, "global_step": 54569, "epoch": 324} {"train_loss": -8.624903678894043, "global_step": 54570, "epoch": 324} {"train_loss": -8.569415092468262, "global_step": 54571, "epoch": 324} {"train_loss": -8.494525909423828, "global_step": 54572, "epoch": 324} {"train_loss": -8.29821491241455, "global_step": 54573, "epoch": 324} {"train_loss": -8.75612735748291, "global_step": 54574, "epoch": 324} {"train_loss": -8.586591720581055, "global_step": 54575, "epoch": 324} {"train_loss": -8.442426681518555, "global_step": 54576, "epoch": 324} {"train_loss": -8.63669204711914, "global_step": 54577, "epoch": 324} {"train_loss": -8.389249801635742, "global_step": 54578, "epoch": 324} {"train_loss": -8.680327415466309, "global_step": 54579, "epoch": 324} {"train_loss": -8.521056175231934, "global_step": 54580, "epoch": 324} {"train_loss": -8.557373046875, "global_step": 54581, "epoch": 324} {"train_loss": -8.723466873168945, "global_step": 54582, "epoch": 324} {"train_loss": -8.510682106018066, "global_step": 54583, "epoch": 324} {"train_loss": -8.580299377441406, "global_step": 54584, "epoch": 324} {"train_loss": -8.188180923461914, "global_step": 54585, "epoch": 324} {"train_loss": -8.489463806152344, "global_step": 54586, "epoch": 324} {"train_loss": -8.582274436950684, "global_step": 54587, "epoch": 324} {"train_loss": -8.515161514282227, "global_step": 54588, "epoch": 324} {"train_loss": -8.506464958190918, "global_step": 54589, "epoch": 324} {"train_loss": -8.513788223266602, "global_step": 54590, "epoch": 324} {"train_loss": -8.789365768432617, "global_step": 54591, "epoch": 324} {"train_loss": -8.528234481811523, "global_step": 54592, "epoch": 324} {"train_loss": -8.42902946472168, "global_step": 54593, "epoch": 324} {"train_loss": -8.74144458770752, "global_step": 54594, "epoch": 324} {"train_loss": -8.461819648742676, "global_step": 54595, "epoch": 324} {"train_loss": -8.849571228027344, "global_step": 54596, "epoch": 324} {"train_loss": -8.55162525177002, "global_step": 54597, "epoch": 324} {"train_loss": -8.351709365844727, "global_step": 54598, "epoch": 324} {"train_loss": -8.421204629398527, "global_step": 54599, "epoch": 324, "val_loss": 186354.859375} {"train_loss": -8.515104293823242, "global_step": 54600, "epoch": 325} {"train_loss": -8.281333923339844, "global_step": 54601, "epoch": 325} {"train_loss": -8.283586502075195, "global_step": 54602, "epoch": 325} {"train_loss": -8.390090942382812, "global_step": 54603, "epoch": 325} {"train_loss": -8.542235374450684, "global_step": 54604, "epoch": 325} {"train_loss": -8.716333389282227, "global_step": 54605, "epoch": 325} {"train_loss": -8.612471580505371, "global_step": 54606, "epoch": 325} {"train_loss": -8.442296981811523, "global_step": 54607, "epoch": 325} {"train_loss": -8.466236114501953, "global_step": 54608, "epoch": 325} {"train_loss": -8.353963851928711, "global_step": 54609, "epoch": 325} {"train_loss": -8.5787353515625, "global_step": 54610, "epoch": 325} {"train_loss": -8.447988510131836, "global_step": 54611, "epoch": 325} {"train_loss": -8.497220993041992, "global_step": 54612, "epoch": 325} {"train_loss": -8.447120666503906, "global_step": 54613, "epoch": 325} {"train_loss": -8.294835090637207, "global_step": 54614, "epoch": 325} {"train_loss": -8.4644775390625, "global_step": 54615, "epoch": 325} {"train_loss": -8.410741806030273, "global_step": 54616, "epoch": 325} {"train_loss": -8.422052383422852, "global_step": 54617, "epoch": 325} {"train_loss": -8.308349609375, "global_step": 54618, "epoch": 325} {"train_loss": -8.410743713378906, "global_step": 54619, "epoch": 325} {"train_loss": -8.252702713012695, "global_step": 54620, "epoch": 325} {"train_loss": -8.740832328796387, "global_step": 54621, "epoch": 325} {"train_loss": -8.617330551147461, "global_step": 54622, "epoch": 325} {"train_loss": -8.539788246154785, "global_step": 54623, "epoch": 325} {"train_loss": -8.382352828979492, "global_step": 54624, "epoch": 325} {"train_loss": -8.645103454589844, "global_step": 54625, "epoch": 325} {"train_loss": -8.566183090209961, "global_step": 54626, "epoch": 325} {"train_loss": -8.9075927734375, "global_step": 54627, "epoch": 325} {"train_loss": -8.576417922973633, "global_step": 54628, "epoch": 325} {"train_loss": -8.610718727111816, "global_step": 54629, "epoch": 325} {"train_loss": -8.473564147949219, "global_step": 54630, "epoch": 325} {"train_loss": -8.236720085144043, "global_step": 54631, "epoch": 325} {"train_loss": -8.32270622253418, "global_step": 54632, "epoch": 325} {"train_loss": -8.323554992675781, "global_step": 54633, "epoch": 325} {"train_loss": -8.459442138671875, "global_step": 54634, "epoch": 325} {"train_loss": -8.28317928314209, "global_step": 54635, "epoch": 325} {"train_loss": -8.265762329101562, "global_step": 54636, "epoch": 325} {"train_loss": -8.556587219238281, "global_step": 54637, "epoch": 325} {"train_loss": -8.224615097045898, "global_step": 54638, "epoch": 325} {"train_loss": -8.448758125305176, "global_step": 54639, "epoch": 325} {"train_loss": -8.321517944335938, "global_step": 54640, "epoch": 325} {"train_loss": -8.522713661193848, "global_step": 54641, "epoch": 325} {"train_loss": -8.213560104370117, "global_step": 54642, "epoch": 325} {"train_loss": -8.425671577453613, "global_step": 54643, "epoch": 325} {"train_loss": -8.55615234375, "global_step": 54644, "epoch": 325} {"train_loss": -8.389482498168945, "global_step": 54645, "epoch": 325} {"train_loss": -8.498451232910156, "global_step": 54646, "epoch": 325} {"train_loss": -8.47117805480957, "global_step": 54647, "epoch": 325} {"train_loss": -8.655862808227539, "global_step": 54648, "epoch": 325} {"train_loss": -8.45840072631836, "global_step": 54649, "epoch": 325} {"train_loss": -8.565080642700195, "global_step": 54650, "epoch": 325} {"train_loss": -8.576241493225098, "global_step": 54651, "epoch": 325} {"train_loss": -8.392374038696289, "global_step": 54652, "epoch": 325} {"train_loss": -8.60403060913086, "global_step": 54653, "epoch": 325} {"train_loss": -8.471360206604004, "global_step": 54654, "epoch": 325} {"train_loss": -8.588239669799805, "global_step": 54655, "epoch": 325} {"train_loss": -8.47520637512207, "global_step": 54656, "epoch": 325} {"train_loss": -8.5341796875, "global_step": 54657, "epoch": 325} {"train_loss": -8.374371528625488, "global_step": 54658, "epoch": 325} {"train_loss": -8.616243362426758, "global_step": 54659, "epoch": 325} {"train_loss": -8.708304405212402, "global_step": 54660, "epoch": 325} {"train_loss": -8.616081237792969, "global_step": 54661, "epoch": 325} {"train_loss": -8.218884468078613, "global_step": 54662, "epoch": 325} {"train_loss": -8.58737564086914, "global_step": 54663, "epoch": 325} {"train_loss": -8.478349685668945, "global_step": 54664, "epoch": 325} {"train_loss": -8.662630081176758, "global_step": 54665, "epoch": 325} {"train_loss": -8.503795623779297, "global_step": 54666, "epoch": 325} {"train_loss": -8.772700309753418, "global_step": 54667, "epoch": 325} {"train_loss": -8.244976043701172, "global_step": 54668, "epoch": 325} {"train_loss": -8.609578132629395, "global_step": 54669, "epoch": 325} {"train_loss": -8.39567756652832, "global_step": 54670, "epoch": 325} {"train_loss": -8.398172378540039, "global_step": 54671, "epoch": 325} {"train_loss": -8.6128568649292, "global_step": 54672, "epoch": 325} {"train_loss": -8.137674331665039, "global_step": 54673, "epoch": 325} {"train_loss": -8.365252494812012, "global_step": 54674, "epoch": 325} {"train_loss": -8.410840034484863, "global_step": 54675, "epoch": 325} {"train_loss": -8.526750564575195, "global_step": 54676, "epoch": 325} {"train_loss": -8.32091999053955, "global_step": 54677, "epoch": 325} {"train_loss": -8.610947608947754, "global_step": 54678, "epoch": 325} {"train_loss": -8.291570663452148, "global_step": 54679, "epoch": 325} {"train_loss": -8.253881454467773, "global_step": 54680, "epoch": 325} {"train_loss": -8.582296371459961, "global_step": 54681, "epoch": 325} {"train_loss": -8.415111541748047, "global_step": 54682, "epoch": 325} {"train_loss": -8.40589714050293, "global_step": 54683, "epoch": 325} {"train_loss": -8.49838638305664, "global_step": 54684, "epoch": 325} {"train_loss": -8.393735885620117, "global_step": 54685, "epoch": 325} {"train_loss": -8.313304901123047, "global_step": 54686, "epoch": 325} {"train_loss": -8.448487281799316, "global_step": 54687, "epoch": 325} {"train_loss": -8.216367721557617, "global_step": 54688, "epoch": 325} {"train_loss": -8.617197036743164, "global_step": 54689, "epoch": 325} {"train_loss": -8.436311721801758, "global_step": 54690, "epoch": 325} {"train_loss": -8.250866889953613, "global_step": 54691, "epoch": 325} {"train_loss": -8.337593078613281, "global_step": 54692, "epoch": 325} {"train_loss": -8.440217018127441, "global_step": 54693, "epoch": 325} {"train_loss": -8.162590026855469, "global_step": 54694, "epoch": 325} {"train_loss": -8.494630813598633, "global_step": 54695, "epoch": 325} {"train_loss": -8.55941104888916, "global_step": 54696, "epoch": 325} {"train_loss": -8.558343887329102, "global_step": 54697, "epoch": 325} {"train_loss": -8.358169555664062, "global_step": 54698, "epoch": 325} {"train_loss": -8.469910621643066, "global_step": 54699, "epoch": 325} {"train_loss": -8.38942813873291, "global_step": 54700, "epoch": 325} {"train_loss": -8.592705726623535, "global_step": 54701, "epoch": 325} {"train_loss": -8.48714828491211, "global_step": 54702, "epoch": 325} {"train_loss": -8.36979866027832, "global_step": 54703, "epoch": 325} {"train_loss": -8.39857292175293, "global_step": 54704, "epoch": 325} {"train_loss": -8.471939086914062, "global_step": 54705, "epoch": 325} {"train_loss": -8.591094970703125, "global_step": 54706, "epoch": 325} {"train_loss": -8.591178894042969, "global_step": 54707, "epoch": 325} {"train_loss": -8.817544937133789, "global_step": 54708, "epoch": 325} {"train_loss": -8.442716598510742, "global_step": 54709, "epoch": 325} {"train_loss": -8.562117576599121, "global_step": 54710, "epoch": 325} {"train_loss": -8.561300277709961, "global_step": 54711, "epoch": 325} {"train_loss": -8.774806022644043, "global_step": 54712, "epoch": 325} {"train_loss": -8.559606552124023, "global_step": 54713, "epoch": 325} {"train_loss": -8.527083396911621, "global_step": 54714, "epoch": 325} {"train_loss": -8.76685905456543, "global_step": 54715, "epoch": 325} {"train_loss": -8.47596549987793, "global_step": 54716, "epoch": 325} {"train_loss": -8.619861602783203, "global_step": 54717, "epoch": 325} {"train_loss": -8.614013671875, "global_step": 54718, "epoch": 325} {"train_loss": -8.40149974822998, "global_step": 54719, "epoch": 325} {"train_loss": -8.499458312988281, "global_step": 54720, "epoch": 325} {"train_loss": -8.736153602600098, "global_step": 54721, "epoch": 325} {"train_loss": -8.7498140335083, "global_step": 54722, "epoch": 325} {"train_loss": -8.574357986450195, "global_step": 54723, "epoch": 325} {"train_loss": -8.40070915222168, "global_step": 54724, "epoch": 325} {"train_loss": -8.412418365478516, "global_step": 54725, "epoch": 325} {"train_loss": -8.517955780029297, "global_step": 54726, "epoch": 325} {"train_loss": -8.325121879577637, "global_step": 54727, "epoch": 325} {"train_loss": -8.434003829956055, "global_step": 54728, "epoch": 325} {"train_loss": -8.424165725708008, "global_step": 54729, "epoch": 325} {"train_loss": -8.474430084228516, "global_step": 54730, "epoch": 325} {"train_loss": -8.49605941772461, "global_step": 54731, "epoch": 325} {"train_loss": -8.17696762084961, "global_step": 54732, "epoch": 325} {"train_loss": -8.451337814331055, "global_step": 54733, "epoch": 325} {"train_loss": -8.601147651672363, "global_step": 54734, "epoch": 325} {"train_loss": -8.590544700622559, "global_step": 54735, "epoch": 325} {"train_loss": -8.423296928405762, "global_step": 54736, "epoch": 325} {"train_loss": -8.641735076904297, "global_step": 54737, "epoch": 325} {"train_loss": -8.157125473022461, "global_step": 54738, "epoch": 325} {"train_loss": -8.42793083190918, "global_step": 54739, "epoch": 325} {"train_loss": -8.094231605529785, "global_step": 54740, "epoch": 325} {"train_loss": -8.410832405090332, "global_step": 54741, "epoch": 325} {"train_loss": -7.832773208618164, "global_step": 54742, "epoch": 325} {"train_loss": -8.381021499633789, "global_step": 54743, "epoch": 325} {"train_loss": -8.391050338745117, "global_step": 54744, "epoch": 325} {"train_loss": -8.43557357788086, "global_step": 54745, "epoch": 325} {"train_loss": -8.339778900146484, "global_step": 54746, "epoch": 325} {"train_loss": -8.142082214355469, "global_step": 54747, "epoch": 325} {"train_loss": -8.459957122802734, "global_step": 54748, "epoch": 325} {"train_loss": -8.294907569885254, "global_step": 54749, "epoch": 325} {"train_loss": -8.346739768981934, "global_step": 54750, "epoch": 325} {"train_loss": -8.36077880859375, "global_step": 54751, "epoch": 325} {"train_loss": -8.630338668823242, "global_step": 54752, "epoch": 325} {"train_loss": -8.224363327026367, "global_step": 54753, "epoch": 325} {"train_loss": -8.293105125427246, "global_step": 54754, "epoch": 325} {"train_loss": -8.766088485717773, "global_step": 54755, "epoch": 325} {"train_loss": -8.401118278503418, "global_step": 54756, "epoch": 325} {"train_loss": -8.526188850402832, "global_step": 54757, "epoch": 325} {"train_loss": -8.56147575378418, "global_step": 54758, "epoch": 325} {"train_loss": -8.334738731384277, "global_step": 54759, "epoch": 325} {"train_loss": -8.307388305664062, "global_step": 54760, "epoch": 325} {"train_loss": -8.478148460388184, "global_step": 54761, "epoch": 325} {"train_loss": -8.239347457885742, "global_step": 54762, "epoch": 325} {"train_loss": -8.377676010131836, "global_step": 54763, "epoch": 325} {"train_loss": -8.709295272827148, "global_step": 54764, "epoch": 325} {"train_loss": -8.371190071105957, "global_step": 54765, "epoch": 325} {"train_loss": -8.538288116455078, "global_step": 54766, "epoch": 325} {"train_loss": -8.459400239444914, "global_step": 54767, "epoch": 325, "val_loss": 188713.921875, "train_action_mse_error": 5.700697422027588} {"train_loss": -8.448441505432129, "global_step": 54768, "epoch": 326} {"train_loss": -8.435969352722168, "global_step": 54769, "epoch": 326} {"train_loss": -8.641895294189453, "global_step": 54770, "epoch": 326} {"train_loss": -8.602228164672852, "global_step": 54771, "epoch": 326} {"train_loss": -8.628776550292969, "global_step": 54772, "epoch": 326} {"train_loss": -8.39583969116211, "global_step": 54773, "epoch": 326} {"train_loss": -8.459077835083008, "global_step": 54774, "epoch": 326} {"train_loss": -8.549966812133789, "global_step": 54775, "epoch": 326} {"train_loss": -8.610318183898926, "global_step": 54776, "epoch": 326} {"train_loss": -8.507396697998047, "global_step": 54777, "epoch": 326} {"train_loss": -8.633224487304688, "global_step": 54778, "epoch": 326} {"train_loss": -8.464824676513672, "global_step": 54779, "epoch": 326} {"train_loss": -8.622299194335938, "global_step": 54780, "epoch": 326} {"train_loss": -8.545014381408691, "global_step": 54781, "epoch": 326} {"train_loss": -8.50946044921875, "global_step": 54782, "epoch": 326} {"train_loss": -8.74324893951416, "global_step": 54783, "epoch": 326} {"train_loss": -8.657449722290039, "global_step": 54784, "epoch": 326} {"train_loss": -8.746274948120117, "global_step": 54785, "epoch": 326} {"train_loss": -8.797430038452148, "global_step": 54786, "epoch": 326} {"train_loss": -8.579330444335938, "global_step": 54787, "epoch": 326} {"train_loss": -8.638705253601074, "global_step": 54788, "epoch": 326} {"train_loss": -8.742801666259766, "global_step": 54789, "epoch": 326} {"train_loss": -8.840431213378906, "global_step": 54790, "epoch": 326} {"train_loss": -8.686729431152344, "global_step": 54791, "epoch": 326} {"train_loss": -8.429167747497559, "global_step": 54792, "epoch": 326} {"train_loss": -8.516484260559082, "global_step": 54793, "epoch": 326} {"train_loss": -8.331932067871094, "global_step": 54794, "epoch": 326} {"train_loss": -8.1168212890625, "global_step": 54795, "epoch": 326} {"train_loss": -8.668157577514648, "global_step": 54796, "epoch": 326} {"train_loss": -8.163823127746582, "global_step": 54797, "epoch": 326} {"train_loss": -8.19795036315918, "global_step": 54798, "epoch": 326} {"train_loss": -8.422974586486816, "global_step": 54799, "epoch": 326} {"train_loss": -8.445556640625, "global_step": 54800, "epoch": 326} {"train_loss": -8.616198539733887, "global_step": 54801, "epoch": 326} {"train_loss": -8.450822830200195, "global_step": 54802, "epoch": 326} {"train_loss": -8.436553955078125, "global_step": 54803, "epoch": 326} {"train_loss": -8.106925964355469, "global_step": 54804, "epoch": 326} {"train_loss": -8.605953216552734, "global_step": 54805, "epoch": 326} {"train_loss": -8.575474739074707, "global_step": 54806, "epoch": 326} {"train_loss": -8.43256664276123, "global_step": 54807, "epoch": 326} {"train_loss": -8.453922271728516, "global_step": 54808, "epoch": 326} {"train_loss": -8.555217742919922, "global_step": 54809, "epoch": 326} {"train_loss": -8.308677673339844, "global_step": 54810, "epoch": 326} {"train_loss": -8.37155818939209, "global_step": 54811, "epoch": 326} {"train_loss": -8.277486801147461, "global_step": 54812, "epoch": 326} {"train_loss": -8.492040634155273, "global_step": 54813, "epoch": 326} {"train_loss": -8.228130340576172, "global_step": 54814, "epoch": 326} {"train_loss": -8.25153923034668, "global_step": 54815, "epoch": 326} {"train_loss": -8.229181289672852, "global_step": 54816, "epoch": 326} {"train_loss": -8.478046417236328, "global_step": 54817, "epoch": 326} {"train_loss": -8.258768081665039, "global_step": 54818, "epoch": 326} {"train_loss": -8.320892333984375, "global_step": 54819, "epoch": 326} {"train_loss": -8.560300827026367, "global_step": 54820, "epoch": 326} {"train_loss": -8.189643859863281, "global_step": 54821, "epoch": 326} {"train_loss": -8.614585876464844, "global_step": 54822, "epoch": 326} {"train_loss": -8.390439987182617, "global_step": 54823, "epoch": 326} {"train_loss": -8.5471773147583, "global_step": 54824, "epoch": 326} {"train_loss": -8.479580879211426, "global_step": 54825, "epoch": 326} {"train_loss": -8.720571517944336, "global_step": 54826, "epoch": 326} {"train_loss": -8.320919036865234, "global_step": 54827, "epoch": 326} {"train_loss": -8.63729190826416, "global_step": 54828, "epoch": 326} {"train_loss": -8.450632095336914, "global_step": 54829, "epoch": 326} {"train_loss": -8.373636245727539, "global_step": 54830, "epoch": 326} {"train_loss": -8.2673921585083, "global_step": 54831, "epoch": 326} {"train_loss": -8.764888763427734, "global_step": 54832, "epoch": 326} {"train_loss": -8.413273811340332, "global_step": 54833, "epoch": 326} {"train_loss": -8.303849220275879, "global_step": 54834, "epoch": 326} {"train_loss": -8.281458854675293, "global_step": 54835, "epoch": 326} {"train_loss": -8.354913711547852, "global_step": 54836, "epoch": 326} {"train_loss": -8.234394073486328, "global_step": 54837, "epoch": 326} {"train_loss": -8.452241897583008, "global_step": 54838, "epoch": 326} {"train_loss": -8.270428657531738, "global_step": 54839, "epoch": 326} {"train_loss": -8.42996883392334, "global_step": 54840, "epoch": 326} {"train_loss": -8.284370422363281, "global_step": 54841, "epoch": 326} {"train_loss": -8.446321487426758, "global_step": 54842, "epoch": 326} {"train_loss": -8.288595199584961, "global_step": 54843, "epoch": 326} {"train_loss": -8.405709266662598, "global_step": 54844, "epoch": 326} {"train_loss": -8.420459747314453, "global_step": 54845, "epoch": 326} {"train_loss": -8.397102355957031, "global_step": 54846, "epoch": 326} {"train_loss": -8.574605941772461, "global_step": 54847, "epoch": 326} {"train_loss": -8.303230285644531, "global_step": 54848, "epoch": 326} {"train_loss": -8.517966270446777, "global_step": 54849, "epoch": 326} {"train_loss": -8.431442260742188, "global_step": 54850, "epoch": 326} {"train_loss": -8.37939739227295, "global_step": 54851, "epoch": 326} {"train_loss": -8.247757911682129, "global_step": 54852, "epoch": 326} {"train_loss": -8.311134338378906, "global_step": 54853, "epoch": 326} {"train_loss": -8.327749252319336, "global_step": 54854, "epoch": 326} {"train_loss": -8.220637321472168, "global_step": 54855, "epoch": 326} {"train_loss": -8.247775077819824, "global_step": 54856, "epoch": 326} {"train_loss": -8.278289794921875, "global_step": 54857, "epoch": 326} {"train_loss": -8.371273040771484, "global_step": 54858, "epoch": 326} {"train_loss": -8.296955108642578, "global_step": 54859, "epoch": 326} {"train_loss": -8.510856628417969, "global_step": 54860, "epoch": 326} {"train_loss": -8.306793212890625, "global_step": 54861, "epoch": 326} {"train_loss": -8.288538932800293, "global_step": 54862, "epoch": 326} {"train_loss": -8.226020812988281, "global_step": 54863, "epoch": 326} {"train_loss": -8.138181686401367, "global_step": 54864, "epoch": 326} {"train_loss": -8.589780807495117, "global_step": 54865, "epoch": 326} {"train_loss": -8.378608703613281, "global_step": 54866, "epoch": 326} {"train_loss": -8.441290855407715, "global_step": 54867, "epoch": 326} {"train_loss": -8.418587684631348, "global_step": 54868, "epoch": 326} {"train_loss": -8.135292053222656, "global_step": 54869, "epoch": 326} {"train_loss": -8.66353702545166, "global_step": 54870, "epoch": 326} {"train_loss": -8.18490219116211, "global_step": 54871, "epoch": 326} {"train_loss": -8.716796875, "global_step": 54872, "epoch": 326} {"train_loss": -8.333555221557617, "global_step": 54873, "epoch": 326} {"train_loss": -8.695455551147461, "global_step": 54874, "epoch": 326} {"train_loss": -8.395164489746094, "global_step": 54875, "epoch": 326} {"train_loss": -8.843994140625, "global_step": 54876, "epoch": 326} {"train_loss": -8.1662015914917, "global_step": 54877, "epoch": 326} {"train_loss": -8.715815544128418, "global_step": 54878, "epoch": 326} {"train_loss": -8.411064147949219, "global_step": 54879, "epoch": 326} {"train_loss": -8.807251930236816, "global_step": 54880, "epoch": 326} {"train_loss": -8.51391887664795, "global_step": 54881, "epoch": 326} {"train_loss": -8.709632873535156, "global_step": 54882, "epoch": 326} {"train_loss": -8.517171859741211, "global_step": 54883, "epoch": 326} {"train_loss": -8.421223640441895, "global_step": 54884, "epoch": 326} {"train_loss": -8.47895336151123, "global_step": 54885, "epoch": 326} {"train_loss": -8.596420288085938, "global_step": 54886, "epoch": 326} {"train_loss": -8.594314575195312, "global_step": 54887, "epoch": 326} {"train_loss": -8.427206039428711, "global_step": 54888, "epoch": 326} {"train_loss": -8.519515991210938, "global_step": 54889, "epoch": 326} {"train_loss": -8.749185562133789, "global_step": 54890, "epoch": 326} {"train_loss": -8.5384521484375, "global_step": 54891, "epoch": 326} {"train_loss": -8.820599555969238, "global_step": 54892, "epoch": 326} {"train_loss": -8.377662658691406, "global_step": 54893, "epoch": 326} {"train_loss": -8.404333114624023, "global_step": 54894, "epoch": 326} {"train_loss": -8.508106231689453, "global_step": 54895, "epoch": 326} {"train_loss": -8.438314437866211, "global_step": 54896, "epoch": 326} {"train_loss": -8.543863296508789, "global_step": 54897, "epoch": 326} {"train_loss": -8.4712495803833, "global_step": 54898, "epoch": 326} {"train_loss": -8.394171714782715, "global_step": 54899, "epoch": 326} {"train_loss": -8.60258674621582, "global_step": 54900, "epoch": 326} {"train_loss": -8.37588882446289, "global_step": 54901, "epoch": 326} {"train_loss": -8.567809104919434, "global_step": 54902, "epoch": 326} {"train_loss": -8.331719398498535, "global_step": 54903, "epoch": 326} {"train_loss": -8.338239669799805, "global_step": 54904, "epoch": 326} {"train_loss": -8.556376457214355, "global_step": 54905, "epoch": 326} {"train_loss": -8.522058486938477, "global_step": 54906, "epoch": 326} {"train_loss": -8.436826705932617, "global_step": 54907, "epoch": 326} {"train_loss": -8.509170532226562, "global_step": 54908, "epoch": 326} {"train_loss": -8.6537446975708, "global_step": 54909, "epoch": 326} {"train_loss": -8.585042953491211, "global_step": 54910, "epoch": 326} {"train_loss": -8.408040046691895, "global_step": 54911, "epoch": 326} {"train_loss": -8.376152038574219, "global_step": 54912, "epoch": 326} {"train_loss": -8.419358253479004, "global_step": 54913, "epoch": 326} {"train_loss": -8.60986042022705, "global_step": 54914, "epoch": 326} {"train_loss": -8.558481216430664, "global_step": 54915, "epoch": 326} {"train_loss": -8.603775024414062, "global_step": 54916, "epoch": 326} {"train_loss": -8.591382026672363, "global_step": 54917, "epoch": 326} {"train_loss": -8.567864418029785, "global_step": 54918, "epoch": 326} {"train_loss": -8.330696105957031, "global_step": 54919, "epoch": 326} {"train_loss": -8.344084739685059, "global_step": 54920, "epoch": 326} {"train_loss": -8.266798973083496, "global_step": 54921, "epoch": 326} {"train_loss": -8.549214363098145, "global_step": 54922, "epoch": 326} {"train_loss": -8.650747299194336, "global_step": 54923, "epoch": 326} {"train_loss": -8.458288192749023, "global_step": 54924, "epoch": 326} {"train_loss": -8.430221557617188, "global_step": 54925, "epoch": 326} {"train_loss": -8.512680053710938, "global_step": 54926, "epoch": 326} {"train_loss": -8.217660903930664, "global_step": 54927, "epoch": 326} {"train_loss": -8.495548248291016, "global_step": 54928, "epoch": 326} {"train_loss": -8.17477798461914, "global_step": 54929, "epoch": 326} {"train_loss": -8.55007266998291, "global_step": 54930, "epoch": 326} {"train_loss": -8.445085525512695, "global_step": 54931, "epoch": 326} {"train_loss": -8.497459411621094, "global_step": 54932, "epoch": 326} {"train_loss": -8.240442276000977, "global_step": 54933, "epoch": 326} {"train_loss": -8.63298225402832, "global_step": 54934, "epoch": 326} {"train_loss": -8.458660131409054, "global_step": 54935, "epoch": 326, "val_loss": 190862.5625} {"train_loss": -8.42808723449707, "global_step": 54936, "epoch": 327} {"train_loss": -8.382741928100586, "global_step": 54937, "epoch": 327} {"train_loss": -8.652587890625, "global_step": 54938, "epoch": 327} {"train_loss": -8.185271263122559, "global_step": 54939, "epoch": 327} {"train_loss": -8.564432144165039, "global_step": 54940, "epoch": 327} {"train_loss": -8.583337783813477, "global_step": 54941, "epoch": 327} {"train_loss": -8.421894073486328, "global_step": 54942, "epoch": 327} {"train_loss": -8.650102615356445, "global_step": 54943, "epoch": 327} {"train_loss": -8.543379783630371, "global_step": 54944, "epoch": 327} {"train_loss": -8.37663745880127, "global_step": 54945, "epoch": 327} {"train_loss": -8.654565811157227, "global_step": 54946, "epoch": 327} {"train_loss": -8.5333251953125, "global_step": 54947, "epoch": 327} {"train_loss": -8.23663330078125, "global_step": 54948, "epoch": 327} {"train_loss": -8.568435668945312, "global_step": 54949, "epoch": 327} {"train_loss": -8.535650253295898, "global_step": 54950, "epoch": 327} {"train_loss": -8.528465270996094, "global_step": 54951, "epoch": 327} {"train_loss": -8.480113983154297, "global_step": 54952, "epoch": 327} {"train_loss": -8.537637710571289, "global_step": 54953, "epoch": 327} {"train_loss": -8.717277526855469, "global_step": 54954, "epoch": 327} {"train_loss": -8.414152145385742, "global_step": 54955, "epoch": 327} {"train_loss": -8.61007022857666, "global_step": 54956, "epoch": 327} {"train_loss": -8.574140548706055, "global_step": 54957, "epoch": 327} {"train_loss": -8.356117248535156, "global_step": 54958, "epoch": 327} {"train_loss": -8.655776977539062, "global_step": 54959, "epoch": 327} {"train_loss": -8.587912559509277, "global_step": 54960, "epoch": 327} {"train_loss": -8.59684944152832, "global_step": 54961, "epoch": 327} {"train_loss": -8.63347339630127, "global_step": 54962, "epoch": 327} {"train_loss": -8.50413703918457, "global_step": 54963, "epoch": 327} {"train_loss": -8.663393020629883, "global_step": 54964, "epoch": 327} {"train_loss": -8.695837020874023, "global_step": 54965, "epoch": 327} {"train_loss": -8.517677307128906, "global_step": 54966, "epoch": 327} {"train_loss": -8.541093826293945, "global_step": 54967, "epoch": 327} {"train_loss": -8.735313415527344, "global_step": 54968, "epoch": 327} {"train_loss": -8.410856246948242, "global_step": 54969, "epoch": 327} {"train_loss": -8.421285629272461, "global_step": 54970, "epoch": 327} {"train_loss": -8.703840255737305, "global_step": 54971, "epoch": 327} {"train_loss": -8.49318790435791, "global_step": 54972, "epoch": 327} {"train_loss": -8.559759140014648, "global_step": 54973, "epoch": 327} {"train_loss": -8.27011775970459, "global_step": 54974, "epoch": 327} {"train_loss": -8.511041641235352, "global_step": 54975, "epoch": 327} {"train_loss": -8.399078369140625, "global_step": 54976, "epoch": 327} {"train_loss": -8.599239349365234, "global_step": 54977, "epoch": 327} {"train_loss": -8.633081436157227, "global_step": 54978, "epoch": 327} {"train_loss": -8.246009826660156, "global_step": 54979, "epoch": 327} {"train_loss": -8.739036560058594, "global_step": 54980, "epoch": 327} {"train_loss": -8.46894645690918, "global_step": 54981, "epoch": 327} {"train_loss": -8.332878112792969, "global_step": 54982, "epoch": 327} {"train_loss": -8.556924819946289, "global_step": 54983, "epoch": 327} {"train_loss": -8.558159828186035, "global_step": 54984, "epoch": 327} {"train_loss": -8.141304016113281, "global_step": 54985, "epoch": 327} {"train_loss": -8.602046012878418, "global_step": 54986, "epoch": 327} {"train_loss": -8.654437065124512, "global_step": 54987, "epoch": 327} {"train_loss": -8.410332679748535, "global_step": 54988, "epoch": 327} {"train_loss": -8.474867820739746, "global_step": 54989, "epoch": 327} {"train_loss": -8.394830703735352, "global_step": 54990, "epoch": 327} {"train_loss": -8.629457473754883, "global_step": 54991, "epoch": 327} {"train_loss": -8.512104034423828, "global_step": 54992, "epoch": 327} {"train_loss": -8.290201187133789, "global_step": 54993, "epoch": 327} {"train_loss": -8.537087440490723, "global_step": 54994, "epoch": 327} {"train_loss": -8.460907936096191, "global_step": 54995, "epoch": 327} {"train_loss": -8.563301086425781, "global_step": 54996, "epoch": 327} {"train_loss": -8.299297332763672, "global_step": 54997, "epoch": 327} {"train_loss": -8.433062553405762, "global_step": 54998, "epoch": 327} {"train_loss": -8.46236801147461, "global_step": 54999, "epoch": 327} {"train_loss": -8.632954597473145, "global_step": 55000, "epoch": 327} {"train_loss": -8.405488967895508, "global_step": 55001, "epoch": 327} {"train_loss": -8.530702590942383, "global_step": 55002, "epoch": 327} {"train_loss": -8.53962516784668, "global_step": 55003, "epoch": 327} {"train_loss": -8.417080879211426, "global_step": 55004, "epoch": 327} {"train_loss": -8.521199226379395, "global_step": 55005, "epoch": 327} {"train_loss": -8.654616355895996, "global_step": 55006, "epoch": 327} {"train_loss": -8.598794937133789, "global_step": 55007, "epoch": 327} {"train_loss": -8.611021041870117, "global_step": 55008, "epoch": 327} {"train_loss": -8.358362197875977, "global_step": 55009, "epoch": 327} {"train_loss": -8.612756729125977, "global_step": 55010, "epoch": 327} {"train_loss": -8.762616157531738, "global_step": 55011, "epoch": 327} {"train_loss": -8.380306243896484, "global_step": 55012, "epoch": 327} {"train_loss": -8.623910903930664, "global_step": 55013, "epoch": 327} {"train_loss": -8.682928085327148, "global_step": 55014, "epoch": 327} {"train_loss": -8.420578002929688, "global_step": 55015, "epoch": 327} {"train_loss": -8.656621932983398, "global_step": 55016, "epoch": 327} {"train_loss": -8.584056854248047, "global_step": 55017, "epoch": 327} {"train_loss": -8.655447959899902, "global_step": 55018, "epoch": 327} {"train_loss": -8.682130813598633, "global_step": 55019, "epoch": 327} {"train_loss": -8.682209968566895, "global_step": 55020, "epoch": 327} {"train_loss": -8.48137092590332, "global_step": 55021, "epoch": 327} {"train_loss": -8.793157577514648, "global_step": 55022, "epoch": 327} {"train_loss": -8.33187484741211, "global_step": 55023, "epoch": 327} {"train_loss": -8.846981048583984, "global_step": 55024, "epoch": 327} {"train_loss": -8.701833724975586, "global_step": 55025, "epoch": 327} {"train_loss": -8.559733390808105, "global_step": 55026, "epoch": 327} {"train_loss": -8.704556465148926, "global_step": 55027, "epoch": 327} {"train_loss": -8.625252723693848, "global_step": 55028, "epoch": 327} {"train_loss": -8.611473083496094, "global_step": 55029, "epoch": 327} {"train_loss": -8.718936920166016, "global_step": 55030, "epoch": 327} {"train_loss": -8.629032135009766, "global_step": 55031, "epoch": 327} {"train_loss": -8.37901496887207, "global_step": 55032, "epoch": 327} {"train_loss": -8.58206844329834, "global_step": 55033, "epoch": 327} {"train_loss": -8.460603713989258, "global_step": 55034, "epoch": 327} {"train_loss": -8.406070709228516, "global_step": 55035, "epoch": 327} {"train_loss": -8.447315216064453, "global_step": 55036, "epoch": 327} {"train_loss": -8.280982971191406, "global_step": 55037, "epoch": 327} {"train_loss": -8.388591766357422, "global_step": 55038, "epoch": 327} {"train_loss": -8.362781524658203, "global_step": 55039, "epoch": 327} {"train_loss": -8.667530059814453, "global_step": 55040, "epoch": 327} {"train_loss": -8.40268325805664, "global_step": 55041, "epoch": 327} {"train_loss": -8.34958553314209, "global_step": 55042, "epoch": 327} {"train_loss": -8.61408519744873, "global_step": 55043, "epoch": 327} {"train_loss": -8.282571792602539, "global_step": 55044, "epoch": 327} {"train_loss": -8.292302131652832, "global_step": 55045, "epoch": 327} {"train_loss": -8.446066856384277, "global_step": 55046, "epoch": 327} {"train_loss": -8.506195068359375, "global_step": 55047, "epoch": 327} {"train_loss": -8.331648826599121, "global_step": 55048, "epoch": 327} {"train_loss": -8.610490798950195, "global_step": 55049, "epoch": 327} {"train_loss": -8.59541130065918, "global_step": 55050, "epoch": 327} {"train_loss": -8.318998336791992, "global_step": 55051, "epoch": 327} {"train_loss": -8.435101509094238, "global_step": 55052, "epoch": 327} {"train_loss": -8.631917953491211, "global_step": 55053, "epoch": 327} {"train_loss": -8.514406204223633, "global_step": 55054, "epoch": 327} {"train_loss": -8.59004020690918, "global_step": 55055, "epoch": 327} {"train_loss": -8.431302070617676, "global_step": 55056, "epoch": 327} {"train_loss": -8.388797760009766, "global_step": 55057, "epoch": 327} {"train_loss": -8.550355911254883, "global_step": 55058, "epoch": 327} {"train_loss": -8.5211181640625, "global_step": 55059, "epoch": 327} {"train_loss": -8.606298446655273, "global_step": 55060, "epoch": 327} {"train_loss": -8.502211570739746, "global_step": 55061, "epoch": 327} {"train_loss": -8.60078239440918, "global_step": 55062, "epoch": 327} {"train_loss": -8.774896621704102, "global_step": 55063, "epoch": 327} {"train_loss": -8.547643661499023, "global_step": 55064, "epoch": 327} {"train_loss": -8.526653289794922, "global_step": 55065, "epoch": 327} {"train_loss": -8.600292205810547, "global_step": 55066, "epoch": 327} {"train_loss": -8.176612854003906, "global_step": 55067, "epoch": 327} {"train_loss": -8.297819137573242, "global_step": 55068, "epoch": 327} {"train_loss": -8.543205261230469, "global_step": 55069, "epoch": 327} {"train_loss": -7.881514549255371, "global_step": 55070, "epoch": 327} {"train_loss": -8.482105255126953, "global_step": 55071, "epoch": 327} {"train_loss": -8.191060066223145, "global_step": 55072, "epoch": 327} {"train_loss": -8.099334716796875, "global_step": 55073, "epoch": 327} {"train_loss": -8.59855842590332, "global_step": 55074, "epoch": 327} {"train_loss": -8.43333625793457, "global_step": 55075, "epoch": 327} {"train_loss": -8.44447135925293, "global_step": 55076, "epoch": 327} {"train_loss": -8.267717361450195, "global_step": 55077, "epoch": 327} {"train_loss": -8.496285438537598, "global_step": 55078, "epoch": 327} {"train_loss": -8.313586235046387, "global_step": 55079, "epoch": 327} {"train_loss": -8.515645027160645, "global_step": 55080, "epoch": 327} {"train_loss": -8.271777153015137, "global_step": 55081, "epoch": 327} {"train_loss": -8.583277702331543, "global_step": 55082, "epoch": 327} {"train_loss": -8.342547416687012, "global_step": 55083, "epoch": 327} {"train_loss": -8.359537124633789, "global_step": 55084, "epoch": 327} {"train_loss": -8.425264358520508, "global_step": 55085, "epoch": 327} {"train_loss": -8.30210018157959, "global_step": 55086, "epoch": 327} {"train_loss": -8.354497909545898, "global_step": 55087, "epoch": 327} {"train_loss": -8.565852165222168, "global_step": 55088, "epoch": 327} {"train_loss": -8.37646484375, "global_step": 55089, "epoch": 327} {"train_loss": -8.52435302734375, "global_step": 55090, "epoch": 327} {"train_loss": -8.562827110290527, "global_step": 55091, "epoch": 327} {"train_loss": -8.681537628173828, "global_step": 55092, "epoch": 327} {"train_loss": -8.474567413330078, "global_step": 55093, "epoch": 327} {"train_loss": -8.796867370605469, "global_step": 55094, "epoch": 327} {"train_loss": -8.75541877746582, "global_step": 55095, "epoch": 327} {"train_loss": -8.58047866821289, "global_step": 55096, "epoch": 327} {"train_loss": -8.601288795471191, "global_step": 55097, "epoch": 327} {"train_loss": -8.400527954101562, "global_step": 55098, "epoch": 327} {"train_loss": -8.839296340942383, "global_step": 55099, "epoch": 327} {"train_loss": -8.362974166870117, "global_step": 55100, "epoch": 327} {"train_loss": -8.376935958862305, "global_step": 55101, "epoch": 327} {"train_loss": -8.31331729888916, "global_step": 55102, "epoch": 327} {"train_loss": -8.500802823475428, "global_step": 55103, "epoch": 327, "val_loss": 189214.0625} {"train_loss": -8.371200561523438, "global_step": 55104, "epoch": 328} {"train_loss": -8.156204223632812, "global_step": 55105, "epoch": 328} {"train_loss": -8.081236839294434, "global_step": 55106, "epoch": 328} {"train_loss": -8.27621841430664, "global_step": 55107, "epoch": 328} {"train_loss": -8.5119047164917, "global_step": 55108, "epoch": 328} {"train_loss": -8.22596549987793, "global_step": 55109, "epoch": 328} {"train_loss": -8.331335067749023, "global_step": 55110, "epoch": 328} {"train_loss": -8.313992500305176, "global_step": 55111, "epoch": 328} {"train_loss": -8.285787582397461, "global_step": 55112, "epoch": 328} {"train_loss": -8.334798812866211, "global_step": 55113, "epoch": 328} {"train_loss": -8.632953643798828, "global_step": 55114, "epoch": 328} {"train_loss": -8.391974449157715, "global_step": 55115, "epoch": 328} {"train_loss": -8.503582000732422, "global_step": 55116, "epoch": 328} {"train_loss": -8.439457893371582, "global_step": 55117, "epoch": 328} {"train_loss": -8.222785949707031, "global_step": 55118, "epoch": 328} {"train_loss": -8.471511840820312, "global_step": 55119, "epoch": 328} {"train_loss": -8.459261894226074, "global_step": 55120, "epoch": 328} {"train_loss": -8.537612915039062, "global_step": 55121, "epoch": 328} {"train_loss": -8.133130073547363, "global_step": 55122, "epoch": 328} {"train_loss": -8.483397483825684, "global_step": 55123, "epoch": 328} {"train_loss": -8.301143646240234, "global_step": 55124, "epoch": 328} {"train_loss": -8.322872161865234, "global_step": 55125, "epoch": 328} {"train_loss": -8.548332214355469, "global_step": 55126, "epoch": 328} {"train_loss": -8.643871307373047, "global_step": 55127, "epoch": 328} {"train_loss": -8.66893196105957, "global_step": 55128, "epoch": 328} {"train_loss": -8.574580192565918, "global_step": 55129, "epoch": 328} {"train_loss": -8.570575714111328, "global_step": 55130, "epoch": 328} {"train_loss": -8.561819076538086, "global_step": 55131, "epoch": 328} {"train_loss": -8.559131622314453, "global_step": 55132, "epoch": 328} {"train_loss": -8.632511138916016, "global_step": 55133, "epoch": 328} {"train_loss": -8.562514305114746, "global_step": 55134, "epoch": 328} {"train_loss": -8.631813049316406, "global_step": 55135, "epoch": 328} {"train_loss": -8.514678001403809, "global_step": 55136, "epoch": 328} {"train_loss": -8.540145874023438, "global_step": 55137, "epoch": 328} {"train_loss": -8.36742877960205, "global_step": 55138, "epoch": 328} {"train_loss": -8.349061965942383, "global_step": 55139, "epoch": 328} {"train_loss": -8.47264575958252, "global_step": 55140, "epoch": 328} {"train_loss": -7.987976551055908, "global_step": 55141, "epoch": 328} {"train_loss": -8.627264022827148, "global_step": 55142, "epoch": 328} {"train_loss": -8.451189041137695, "global_step": 55143, "epoch": 328} {"train_loss": -8.157439231872559, "global_step": 55144, "epoch": 328} {"train_loss": -8.381681442260742, "global_step": 55145, "epoch": 328} {"train_loss": -8.36972427368164, "global_step": 55146, "epoch": 328} {"train_loss": -8.03880500793457, "global_step": 55147, "epoch": 328} {"train_loss": -8.165562629699707, "global_step": 55148, "epoch": 328} {"train_loss": -8.556442260742188, "global_step": 55149, "epoch": 328} {"train_loss": -8.390876770019531, "global_step": 55150, "epoch": 328} {"train_loss": -8.054342269897461, "global_step": 55151, "epoch": 328} {"train_loss": -8.38779354095459, "global_step": 55152, "epoch": 328} {"train_loss": -8.609058380126953, "global_step": 55153, "epoch": 328} {"train_loss": -8.267653465270996, "global_step": 55154, "epoch": 328} {"train_loss": -8.234355926513672, "global_step": 55155, "epoch": 328} {"train_loss": -8.393326759338379, "global_step": 55156, "epoch": 328} {"train_loss": -8.477134704589844, "global_step": 55157, "epoch": 328} {"train_loss": -8.202522277832031, "global_step": 55158, "epoch": 328} {"train_loss": -8.44069766998291, "global_step": 55159, "epoch": 328} {"train_loss": -8.680621147155762, "global_step": 55160, "epoch": 328} {"train_loss": -8.283356666564941, "global_step": 55161, "epoch": 328} {"train_loss": -8.133867263793945, "global_step": 55162, "epoch": 328} {"train_loss": -8.567558288574219, "global_step": 55163, "epoch": 328} {"train_loss": -8.543935775756836, "global_step": 55164, "epoch": 328} {"train_loss": -8.434728622436523, "global_step": 55165, "epoch": 328} {"train_loss": -8.069236755371094, "global_step": 55166, "epoch": 328} {"train_loss": -8.363587379455566, "global_step": 55167, "epoch": 328} {"train_loss": -8.267820358276367, "global_step": 55168, "epoch": 328} {"train_loss": -8.323148727416992, "global_step": 55169, "epoch": 328} {"train_loss": -8.310568809509277, "global_step": 55170, "epoch": 328} {"train_loss": -8.279459953308105, "global_step": 55171, "epoch": 328} {"train_loss": -8.420002937316895, "global_step": 55172, "epoch": 328} {"train_loss": -8.52839469909668, "global_step": 55173, "epoch": 328} {"train_loss": -8.574222564697266, "global_step": 55174, "epoch": 328} {"train_loss": -8.35002326965332, "global_step": 55175, "epoch": 328} {"train_loss": -8.116254806518555, "global_step": 55176, "epoch": 328} {"train_loss": -8.444051742553711, "global_step": 55177, "epoch": 328} {"train_loss": -8.30221176147461, "global_step": 55178, "epoch": 328} {"train_loss": -8.598230361938477, "global_step": 55179, "epoch": 328} {"train_loss": -8.061013221740723, "global_step": 55180, "epoch": 328} {"train_loss": -8.444955825805664, "global_step": 55181, "epoch": 328} {"train_loss": -8.508857727050781, "global_step": 55182, "epoch": 328} {"train_loss": -8.181450843811035, "global_step": 55183, "epoch": 328} {"train_loss": -8.59344482421875, "global_step": 55184, "epoch": 328} {"train_loss": -8.568574905395508, "global_step": 55185, "epoch": 328} {"train_loss": -8.479171752929688, "global_step": 55186, "epoch": 328} {"train_loss": -8.420660018920898, "global_step": 55187, "epoch": 328} {"train_loss": -8.380728721618652, "global_step": 55188, "epoch": 328} {"train_loss": -8.251734733581543, "global_step": 55189, "epoch": 328} {"train_loss": -8.174999237060547, "global_step": 55190, "epoch": 328} {"train_loss": -8.682496070861816, "global_step": 55191, "epoch": 328} {"train_loss": -8.135346412658691, "global_step": 55192, "epoch": 328} {"train_loss": -8.298835754394531, "global_step": 55193, "epoch": 328} {"train_loss": -8.425932884216309, "global_step": 55194, "epoch": 328} {"train_loss": -8.536330223083496, "global_step": 55195, "epoch": 328} {"train_loss": -8.459890365600586, "global_step": 55196, "epoch": 328} {"train_loss": -8.254006385803223, "global_step": 55197, "epoch": 328} {"train_loss": -8.479170799255371, "global_step": 55198, "epoch": 328} {"train_loss": -8.262002944946289, "global_step": 55199, "epoch": 328} {"train_loss": -8.467304229736328, "global_step": 55200, "epoch": 328} {"train_loss": -8.63942813873291, "global_step": 55201, "epoch": 328} {"train_loss": -8.415557861328125, "global_step": 55202, "epoch": 328} {"train_loss": -8.732403755187988, "global_step": 55203, "epoch": 328} {"train_loss": -8.858060836791992, "global_step": 55204, "epoch": 328} {"train_loss": -8.46103572845459, "global_step": 55205, "epoch": 328} {"train_loss": -8.693269729614258, "global_step": 55206, "epoch": 328} {"train_loss": -8.625980377197266, "global_step": 55207, "epoch": 328} {"train_loss": -8.606846809387207, "global_step": 55208, "epoch": 328} {"train_loss": -8.571653366088867, "global_step": 55209, "epoch": 328} {"train_loss": -8.618535041809082, "global_step": 55210, "epoch": 328} {"train_loss": -8.589813232421875, "global_step": 55211, "epoch": 328} {"train_loss": -8.37526798248291, "global_step": 55212, "epoch": 328} {"train_loss": -8.663322448730469, "global_step": 55213, "epoch": 328} {"train_loss": -8.633073806762695, "global_step": 55214, "epoch": 328} {"train_loss": -8.695140838623047, "global_step": 55215, "epoch": 328} {"train_loss": -8.652057647705078, "global_step": 55216, "epoch": 328} {"train_loss": -8.52277946472168, "global_step": 55217, "epoch": 328} {"train_loss": -8.707412719726562, "global_step": 55218, "epoch": 328} {"train_loss": -8.861879348754883, "global_step": 55219, "epoch": 328} {"train_loss": -8.610282897949219, "global_step": 55220, "epoch": 328} {"train_loss": -8.398890495300293, "global_step": 55221, "epoch": 328} {"train_loss": -8.596200942993164, "global_step": 55222, "epoch": 328} {"train_loss": -8.72789478302002, "global_step": 55223, "epoch": 328} {"train_loss": -8.589653015136719, "global_step": 55224, "epoch": 328} {"train_loss": -8.679217338562012, "global_step": 55225, "epoch": 328} {"train_loss": -8.682950973510742, "global_step": 55226, "epoch": 328} {"train_loss": -8.616930961608887, "global_step": 55227, "epoch": 328} {"train_loss": -8.562901496887207, "global_step": 55228, "epoch": 328} {"train_loss": -8.842655181884766, "global_step": 55229, "epoch": 328} {"train_loss": -8.502992630004883, "global_step": 55230, "epoch": 328} {"train_loss": -8.644428253173828, "global_step": 55231, "epoch": 328} {"train_loss": -8.676545143127441, "global_step": 55232, "epoch": 328} {"train_loss": -8.76569652557373, "global_step": 55233, "epoch": 328} {"train_loss": -8.695976257324219, "global_step": 55234, "epoch": 328} {"train_loss": -8.689555168151855, "global_step": 55235, "epoch": 328} {"train_loss": -8.676810264587402, "global_step": 55236, "epoch": 328} {"train_loss": -8.532559394836426, "global_step": 55237, "epoch": 328} {"train_loss": -8.833053588867188, "global_step": 55238, "epoch": 328} {"train_loss": -8.749853134155273, "global_step": 55239, "epoch": 328} {"train_loss": -8.734781265258789, "global_step": 55240, "epoch": 328} {"train_loss": -8.866308212280273, "global_step": 55241, "epoch": 328} {"train_loss": -8.596056938171387, "global_step": 55242, "epoch": 328} {"train_loss": -8.617656707763672, "global_step": 55243, "epoch": 328} {"train_loss": -8.419137001037598, "global_step": 55244, "epoch": 328} {"train_loss": -8.675925254821777, "global_step": 55245, "epoch": 328} {"train_loss": -8.637331008911133, "global_step": 55246, "epoch": 328} {"train_loss": -8.563398361206055, "global_step": 55247, "epoch": 328} {"train_loss": -8.613859176635742, "global_step": 55248, "epoch": 328} {"train_loss": -8.289667129516602, "global_step": 55249, "epoch": 328} {"train_loss": -8.61633014678955, "global_step": 55250, "epoch": 328} {"train_loss": -8.153045654296875, "global_step": 55251, "epoch": 328} {"train_loss": -8.543954849243164, "global_step": 55252, "epoch": 328} {"train_loss": -8.26064682006836, "global_step": 55253, "epoch": 328} {"train_loss": -8.114605903625488, "global_step": 55254, "epoch": 328} {"train_loss": -8.372432708740234, "global_step": 55255, "epoch": 328} {"train_loss": -8.165863037109375, "global_step": 55256, "epoch": 328} {"train_loss": -8.202644348144531, "global_step": 55257, "epoch": 328} {"train_loss": -8.213530540466309, "global_step": 55258, "epoch": 328} {"train_loss": -8.032793045043945, "global_step": 55259, "epoch": 328} {"train_loss": -8.242101669311523, "global_step": 55260, "epoch": 328} {"train_loss": -7.952038764953613, "global_step": 55261, "epoch": 328} {"train_loss": -8.208074569702148, "global_step": 55262, "epoch": 328} {"train_loss": -7.94156551361084, "global_step": 55263, "epoch": 328} {"train_loss": -8.362564086914062, "global_step": 55264, "epoch": 328} {"train_loss": -8.231040954589844, "global_step": 55265, "epoch": 328} {"train_loss": -8.03189754486084, "global_step": 55266, "epoch": 328} {"train_loss": -8.457237243652344, "global_step": 55267, "epoch": 328} {"train_loss": -8.116643905639648, "global_step": 55268, "epoch": 328} {"train_loss": -8.433324813842773, "global_step": 55269, "epoch": 328} {"train_loss": -8.347190856933594, "global_step": 55270, "epoch": 328} {"train_loss": -8.441310629958199, "global_step": 55271, "epoch": 328, "val_loss": 190679.703125} {"train_loss": -8.315699577331543, "global_step": 55272, "epoch": 329} {"train_loss": -8.381683349609375, "global_step": 55273, "epoch": 329} {"train_loss": -8.483711242675781, "global_step": 55274, "epoch": 329} {"train_loss": -8.439905166625977, "global_step": 55275, "epoch": 329} {"train_loss": -8.39720344543457, "global_step": 55276, "epoch": 329} {"train_loss": -8.462944030761719, "global_step": 55277, "epoch": 329} {"train_loss": -8.280458450317383, "global_step": 55278, "epoch": 329} {"train_loss": -8.301423072814941, "global_step": 55279, "epoch": 329} {"train_loss": -8.417000770568848, "global_step": 55280, "epoch": 329} {"train_loss": -8.601776123046875, "global_step": 55281, "epoch": 329} {"train_loss": -8.370811462402344, "global_step": 55282, "epoch": 329} {"train_loss": -8.340198516845703, "global_step": 55283, "epoch": 329} {"train_loss": -8.322721481323242, "global_step": 55284, "epoch": 329} {"train_loss": -8.570962905883789, "global_step": 55285, "epoch": 329} {"train_loss": -8.334613800048828, "global_step": 55286, "epoch": 329} {"train_loss": -8.661704063415527, "global_step": 55287, "epoch": 329} {"train_loss": -8.623085021972656, "global_step": 55288, "epoch": 329} {"train_loss": -8.731974601745605, "global_step": 55289, "epoch": 329} {"train_loss": -8.571956634521484, "global_step": 55290, "epoch": 329} {"train_loss": -8.633909225463867, "global_step": 55291, "epoch": 329} {"train_loss": -8.728425979614258, "global_step": 55292, "epoch": 329} {"train_loss": -8.637317657470703, "global_step": 55293, "epoch": 329} {"train_loss": -8.659032821655273, "global_step": 55294, "epoch": 329} {"train_loss": -8.523428916931152, "global_step": 55295, "epoch": 329} {"train_loss": -8.357590675354004, "global_step": 55296, "epoch": 329} {"train_loss": -8.579668998718262, "global_step": 55297, "epoch": 329} {"train_loss": -8.041093826293945, "global_step": 55298, "epoch": 329} {"train_loss": -8.566997528076172, "global_step": 55299, "epoch": 329} {"train_loss": -8.510555267333984, "global_step": 55300, "epoch": 329} {"train_loss": -8.363733291625977, "global_step": 55301, "epoch": 329} {"train_loss": -8.214113235473633, "global_step": 55302, "epoch": 329} {"train_loss": -8.394552230834961, "global_step": 55303, "epoch": 329} {"train_loss": -8.61221694946289, "global_step": 55304, "epoch": 329} {"train_loss": -8.409714698791504, "global_step": 55305, "epoch": 329} {"train_loss": -8.604108810424805, "global_step": 55306, "epoch": 329} {"train_loss": -8.406779289245605, "global_step": 55307, "epoch": 329} {"train_loss": -8.500880241394043, "global_step": 55308, "epoch": 329} {"train_loss": -8.278736114501953, "global_step": 55309, "epoch": 329} {"train_loss": -8.567399978637695, "global_step": 55310, "epoch": 329} {"train_loss": -8.560714721679688, "global_step": 55311, "epoch": 329} {"train_loss": -8.601783752441406, "global_step": 55312, "epoch": 329} {"train_loss": -8.505616188049316, "global_step": 55313, "epoch": 329} {"train_loss": -8.348132133483887, "global_step": 55314, "epoch": 329} {"train_loss": -8.521211624145508, "global_step": 55315, "epoch": 329} {"train_loss": -8.47091007232666, "global_step": 55316, "epoch": 329} {"train_loss": -8.504425048828125, "global_step": 55317, "epoch": 329} {"train_loss": -8.594350814819336, "global_step": 55318, "epoch": 329} {"train_loss": -8.414297103881836, "global_step": 55319, "epoch": 329} {"train_loss": -8.642721176147461, "global_step": 55320, "epoch": 329} {"train_loss": -8.599559783935547, "global_step": 55321, "epoch": 329} {"train_loss": -8.678337097167969, "global_step": 55322, "epoch": 329} {"train_loss": -8.249909400939941, "global_step": 55323, "epoch": 329} {"train_loss": -8.599300384521484, "global_step": 55324, "epoch": 329} {"train_loss": -8.462350845336914, "global_step": 55325, "epoch": 329} {"train_loss": -8.544506072998047, "global_step": 55326, "epoch": 329} {"train_loss": -8.274484634399414, "global_step": 55327, "epoch": 329} {"train_loss": -8.444002151489258, "global_step": 55328, "epoch": 329} {"train_loss": -8.278190612792969, "global_step": 55329, "epoch": 329} {"train_loss": -8.596266746520996, "global_step": 55330, "epoch": 329} {"train_loss": -8.234748840332031, "global_step": 55331, "epoch": 329} {"train_loss": -8.373188018798828, "global_step": 55332, "epoch": 329} {"train_loss": -8.553192138671875, "global_step": 55333, "epoch": 329} {"train_loss": -7.940954208374023, "global_step": 55334, "epoch": 329} {"train_loss": -8.79307746887207, "global_step": 55335, "epoch": 329} {"train_loss": -8.29495906829834, "global_step": 55336, "epoch": 329} {"train_loss": -8.616931915283203, "global_step": 55337, "epoch": 329} {"train_loss": -8.250543594360352, "global_step": 55338, "epoch": 329} {"train_loss": -8.513856887817383, "global_step": 55339, "epoch": 329} {"train_loss": -8.266806602478027, "global_step": 55340, "epoch": 329} {"train_loss": -8.55789566040039, "global_step": 55341, "epoch": 329} {"train_loss": -8.42745590209961, "global_step": 55342, "epoch": 329} {"train_loss": -8.293578147888184, "global_step": 55343, "epoch": 329} {"train_loss": -8.196290969848633, "global_step": 55344, "epoch": 329} {"train_loss": -8.412712097167969, "global_step": 55345, "epoch": 329} {"train_loss": -8.393255233764648, "global_step": 55346, "epoch": 329} {"train_loss": -8.542684555053711, "global_step": 55347, "epoch": 329} {"train_loss": -8.521710395812988, "global_step": 55348, "epoch": 329} {"train_loss": -8.38763427734375, "global_step": 55349, "epoch": 329} {"train_loss": -8.426950454711914, "global_step": 55350, "epoch": 329} {"train_loss": -8.279199600219727, "global_step": 55351, "epoch": 329} {"train_loss": -8.577977180480957, "global_step": 55352, "epoch": 329} {"train_loss": -8.379215240478516, "global_step": 55353, "epoch": 329} {"train_loss": -8.428133010864258, "global_step": 55354, "epoch": 329} {"train_loss": -8.415603637695312, "global_step": 55355, "epoch": 329} {"train_loss": -8.398475646972656, "global_step": 55356, "epoch": 329} {"train_loss": -8.68160629272461, "global_step": 55357, "epoch": 329} {"train_loss": -8.531764030456543, "global_step": 55358, "epoch": 329} {"train_loss": -8.545929908752441, "global_step": 55359, "epoch": 329} {"train_loss": -8.694573402404785, "global_step": 55360, "epoch": 329} {"train_loss": -8.614542961120605, "global_step": 55361, "epoch": 329} {"train_loss": -8.287989616394043, "global_step": 55362, "epoch": 329} {"train_loss": -8.50048828125, "global_step": 55363, "epoch": 329} {"train_loss": -8.177124977111816, "global_step": 55364, "epoch": 329} {"train_loss": -8.493471145629883, "global_step": 55365, "epoch": 329} {"train_loss": -8.43739128112793, "global_step": 55366, "epoch": 329} {"train_loss": -8.4019775390625, "global_step": 55367, "epoch": 329} {"train_loss": -8.442709922790527, "global_step": 55368, "epoch": 329} {"train_loss": -8.567502975463867, "global_step": 55369, "epoch": 329} {"train_loss": -8.509593963623047, "global_step": 55370, "epoch": 329} {"train_loss": -8.66242790222168, "global_step": 55371, "epoch": 329} {"train_loss": -8.484648704528809, "global_step": 55372, "epoch": 329} {"train_loss": -8.62432861328125, "global_step": 55373, "epoch": 329} {"train_loss": -8.16569709777832, "global_step": 55374, "epoch": 329} {"train_loss": -8.474706649780273, "global_step": 55375, "epoch": 329} {"train_loss": -8.199893951416016, "global_step": 55376, "epoch": 329} {"train_loss": -8.482414245605469, "global_step": 55377, "epoch": 329} {"train_loss": -8.21432113647461, "global_step": 55378, "epoch": 329} {"train_loss": -8.458486557006836, "global_step": 55379, "epoch": 329} {"train_loss": -8.343069076538086, "global_step": 55380, "epoch": 329} {"train_loss": -8.374699592590332, "global_step": 55381, "epoch": 329} {"train_loss": -8.236076354980469, "global_step": 55382, "epoch": 329} {"train_loss": -8.402706146240234, "global_step": 55383, "epoch": 329} {"train_loss": -8.580828666687012, "global_step": 55384, "epoch": 329} {"train_loss": -7.97610330581665, "global_step": 55385, "epoch": 329} {"train_loss": -8.48335075378418, "global_step": 55386, "epoch": 329} {"train_loss": -8.0072660446167, "global_step": 55387, "epoch": 329} {"train_loss": -8.155935287475586, "global_step": 55388, "epoch": 329} {"train_loss": -8.136735916137695, "global_step": 55389, "epoch": 329} {"train_loss": -8.216347694396973, "global_step": 55390, "epoch": 329} {"train_loss": -8.406913757324219, "global_step": 55391, "epoch": 329} {"train_loss": -8.202478408813477, "global_step": 55392, "epoch": 329} {"train_loss": -8.501160621643066, "global_step": 55393, "epoch": 329} {"train_loss": -8.381782531738281, "global_step": 55394, "epoch": 329} {"train_loss": -8.148895263671875, "global_step": 55395, "epoch": 329} {"train_loss": -8.614370346069336, "global_step": 55396, "epoch": 329} {"train_loss": -8.308140754699707, "global_step": 55397, "epoch": 329} {"train_loss": -8.377456665039062, "global_step": 55398, "epoch": 329} {"train_loss": -8.461505889892578, "global_step": 55399, "epoch": 329} {"train_loss": -8.425186157226562, "global_step": 55400, "epoch": 329} {"train_loss": -8.519453048706055, "global_step": 55401, "epoch": 329} {"train_loss": -8.39893627166748, "global_step": 55402, "epoch": 329} {"train_loss": -8.540122985839844, "global_step": 55403, "epoch": 329} {"train_loss": -8.31701946258545, "global_step": 55404, "epoch": 329} {"train_loss": -8.605487823486328, "global_step": 55405, "epoch": 329} {"train_loss": -8.459245681762695, "global_step": 55406, "epoch": 329} {"train_loss": -8.400538444519043, "global_step": 55407, "epoch": 329} {"train_loss": -8.413043975830078, "global_step": 55408, "epoch": 329} {"train_loss": -8.293703079223633, "global_step": 55409, "epoch": 329} {"train_loss": -8.485170364379883, "global_step": 55410, "epoch": 329} {"train_loss": -8.700190544128418, "global_step": 55411, "epoch": 329} {"train_loss": -8.404430389404297, "global_step": 55412, "epoch": 329} {"train_loss": -8.458824157714844, "global_step": 55413, "epoch": 329} {"train_loss": -8.48587417602539, "global_step": 55414, "epoch": 329} {"train_loss": -8.638763427734375, "global_step": 55415, "epoch": 329} {"train_loss": -8.461065292358398, "global_step": 55416, "epoch": 329} {"train_loss": -8.689533233642578, "global_step": 55417, "epoch": 329} {"train_loss": -8.553130149841309, "global_step": 55418, "epoch": 329} {"train_loss": -8.449604988098145, "global_step": 55419, "epoch": 329} {"train_loss": -8.641678810119629, "global_step": 55420, "epoch": 329} {"train_loss": -8.529614448547363, "global_step": 55421, "epoch": 329} {"train_loss": -8.62618350982666, "global_step": 55422, "epoch": 329} {"train_loss": -8.690805435180664, "global_step": 55423, "epoch": 329} {"train_loss": -8.59751033782959, "global_step": 55424, "epoch": 329} {"train_loss": -8.663471221923828, "global_step": 55425, "epoch": 329} {"train_loss": -8.317047119140625, "global_step": 55426, "epoch": 329} {"train_loss": -8.703554153442383, "global_step": 55427, "epoch": 329} {"train_loss": -8.697128295898438, "global_step": 55428, "epoch": 329} {"train_loss": -8.478893280029297, "global_step": 55429, "epoch": 329} {"train_loss": -8.745820999145508, "global_step": 55430, "epoch": 329} {"train_loss": -8.61333179473877, "global_step": 55431, "epoch": 329} {"train_loss": -8.639655113220215, "global_step": 55432, "epoch": 329} {"train_loss": -8.48879623413086, "global_step": 55433, "epoch": 329} {"train_loss": -8.851773262023926, "global_step": 55434, "epoch": 329} {"train_loss": -8.491198539733887, "global_step": 55435, "epoch": 329} {"train_loss": -8.397305488586426, "global_step": 55436, "epoch": 329} {"train_loss": -8.368632316589355, "global_step": 55437, "epoch": 329} {"train_loss": -8.658604621887207, "global_step": 55438, "epoch": 329} {"train_loss": -8.458311577637991, "global_step": 55439, "epoch": 329, "val_loss": 187964.09375} {"train_loss": -8.870540618896484, "global_step": 55440, "epoch": 330} {"train_loss": -8.543126106262207, "global_step": 55441, "epoch": 330} {"train_loss": -8.505622863769531, "global_step": 55442, "epoch": 330} {"train_loss": -8.30345344543457, "global_step": 55443, "epoch": 330} {"train_loss": -8.474037170410156, "global_step": 55444, "epoch": 330} {"train_loss": -8.69001579284668, "global_step": 55445, "epoch": 330} {"train_loss": -8.571414947509766, "global_step": 55446, "epoch": 330} {"train_loss": -8.42829704284668, "global_step": 55447, "epoch": 330} {"train_loss": -8.587438583374023, "global_step": 55448, "epoch": 330} {"train_loss": -8.259498596191406, "global_step": 55449, "epoch": 330} {"train_loss": -8.687070846557617, "global_step": 55450, "epoch": 330} {"train_loss": -8.663134574890137, "global_step": 55451, "epoch": 330} {"train_loss": -8.669686317443848, "global_step": 55452, "epoch": 330} {"train_loss": -8.762256622314453, "global_step": 55453, "epoch": 330} {"train_loss": -8.551156997680664, "global_step": 55454, "epoch": 330} {"train_loss": -8.23069953918457, "global_step": 55455, "epoch": 330} {"train_loss": -8.249374389648438, "global_step": 55456, "epoch": 330} {"train_loss": -8.330392837524414, "global_step": 55457, "epoch": 330} {"train_loss": -8.258541107177734, "global_step": 55458, "epoch": 330} {"train_loss": -8.604277610778809, "global_step": 55459, "epoch": 330} {"train_loss": -8.16008472442627, "global_step": 55460, "epoch": 330} {"train_loss": -8.597478866577148, "global_step": 55461, "epoch": 330} {"train_loss": -8.552682876586914, "global_step": 55462, "epoch": 330} {"train_loss": -8.433326721191406, "global_step": 55463, "epoch": 330} {"train_loss": -8.581487655639648, "global_step": 55464, "epoch": 330} {"train_loss": -8.480502128601074, "global_step": 55465, "epoch": 330} {"train_loss": -8.552302360534668, "global_step": 55466, "epoch": 330} {"train_loss": -8.449576377868652, "global_step": 55467, "epoch": 330} {"train_loss": -8.719770431518555, "global_step": 55468, "epoch": 330} {"train_loss": -8.47335147857666, "global_step": 55469, "epoch": 330} {"train_loss": -8.500968933105469, "global_step": 55470, "epoch": 330} {"train_loss": -8.482715606689453, "global_step": 55471, "epoch": 330} {"train_loss": -8.600555419921875, "global_step": 55472, "epoch": 330} {"train_loss": -8.265777587890625, "global_step": 55473, "epoch": 330} {"train_loss": -8.388901710510254, "global_step": 55474, "epoch": 330} {"train_loss": -8.534736633300781, "global_step": 55475, "epoch": 330} {"train_loss": -8.291463851928711, "global_step": 55476, "epoch": 330} {"train_loss": -8.289885520935059, "global_step": 55477, "epoch": 330} {"train_loss": -8.355428695678711, "global_step": 55478, "epoch": 330} {"train_loss": -8.256319999694824, "global_step": 55479, "epoch": 330} {"train_loss": -8.046589851379395, "global_step": 55480, "epoch": 330} {"train_loss": -8.394952774047852, "global_step": 55481, "epoch": 330} {"train_loss": -8.604437828063965, "global_step": 55482, "epoch": 330} {"train_loss": -8.490317344665527, "global_step": 55483, "epoch": 330} {"train_loss": -8.597127914428711, "global_step": 55484, "epoch": 330} {"train_loss": -8.515399932861328, "global_step": 55485, "epoch": 330} {"train_loss": -8.4921293258667, "global_step": 55486, "epoch": 330} {"train_loss": -8.492263793945312, "global_step": 55487, "epoch": 330} {"train_loss": -8.450973510742188, "global_step": 55488, "epoch": 330} {"train_loss": -8.641532897949219, "global_step": 55489, "epoch": 330} {"train_loss": -8.401576042175293, "global_step": 55490, "epoch": 330} {"train_loss": -8.467242240905762, "global_step": 55491, "epoch": 330} {"train_loss": -8.539308547973633, "global_step": 55492, "epoch": 330} {"train_loss": -8.668513298034668, "global_step": 55493, "epoch": 330} {"train_loss": -8.370481491088867, "global_step": 55494, "epoch": 330} {"train_loss": -8.464600563049316, "global_step": 55495, "epoch": 330} {"train_loss": -8.435453414916992, "global_step": 55496, "epoch": 330} {"train_loss": -8.542093276977539, "global_step": 55497, "epoch": 330} {"train_loss": -8.402448654174805, "global_step": 55498, "epoch": 330} {"train_loss": -8.602296829223633, "global_step": 55499, "epoch": 330} {"train_loss": -8.727853775024414, "global_step": 55500, "epoch": 330} {"train_loss": -8.69046401977539, "global_step": 55501, "epoch": 330} {"train_loss": -8.481216430664062, "global_step": 55502, "epoch": 330} {"train_loss": -8.523319244384766, "global_step": 55503, "epoch": 330} {"train_loss": -8.695211410522461, "global_step": 55504, "epoch": 330} {"train_loss": -8.494394302368164, "global_step": 55505, "epoch": 330} {"train_loss": -8.533019065856934, "global_step": 55506, "epoch": 330} {"train_loss": -8.731666564941406, "global_step": 55507, "epoch": 330} {"train_loss": -8.888965606689453, "global_step": 55508, "epoch": 330} {"train_loss": -8.48267936706543, "global_step": 55509, "epoch": 330} {"train_loss": -8.562836647033691, "global_step": 55510, "epoch": 330} {"train_loss": -8.511805534362793, "global_step": 55511, "epoch": 330} {"train_loss": -8.757685661315918, "global_step": 55512, "epoch": 330} {"train_loss": -8.524468421936035, "global_step": 55513, "epoch": 330} {"train_loss": -8.566920280456543, "global_step": 55514, "epoch": 330} {"train_loss": -8.492713928222656, "global_step": 55515, "epoch": 330} {"train_loss": -8.669832229614258, "global_step": 55516, "epoch": 330} {"train_loss": -8.557086944580078, "global_step": 55517, "epoch": 330} {"train_loss": -8.504020690917969, "global_step": 55518, "epoch": 330} {"train_loss": -8.624900817871094, "global_step": 55519, "epoch": 330} {"train_loss": -8.501949310302734, "global_step": 55520, "epoch": 330} {"train_loss": -8.469605445861816, "global_step": 55521, "epoch": 330} {"train_loss": -8.38494873046875, "global_step": 55522, "epoch": 330} {"train_loss": -8.459622383117676, "global_step": 55523, "epoch": 330} {"train_loss": -8.748271942138672, "global_step": 55524, "epoch": 330} {"train_loss": -8.645520210266113, "global_step": 55525, "epoch": 330} {"train_loss": -8.444185256958008, "global_step": 55526, "epoch": 330} {"train_loss": -8.421454429626465, "global_step": 55527, "epoch": 330} {"train_loss": -8.139226913452148, "global_step": 55528, "epoch": 330} {"train_loss": -8.532751083374023, "global_step": 55529, "epoch": 330} {"train_loss": -8.147893905639648, "global_step": 55530, "epoch": 330} {"train_loss": -8.533763885498047, "global_step": 55531, "epoch": 330} {"train_loss": -8.635412216186523, "global_step": 55532, "epoch": 330} {"train_loss": -8.197715759277344, "global_step": 55533, "epoch": 330} {"train_loss": -8.508034706115723, "global_step": 55534, "epoch": 330} {"train_loss": -8.558090209960938, "global_step": 55535, "epoch": 330} {"train_loss": -8.406044960021973, "global_step": 55536, "epoch": 330} {"train_loss": -8.27431869506836, "global_step": 55537, "epoch": 330} {"train_loss": -8.298710823059082, "global_step": 55538, "epoch": 330} {"train_loss": -8.594574928283691, "global_step": 55539, "epoch": 330} {"train_loss": -7.952134132385254, "global_step": 55540, "epoch": 330} {"train_loss": -8.564823150634766, "global_step": 55541, "epoch": 330} {"train_loss": -8.485748291015625, "global_step": 55542, "epoch": 330} {"train_loss": -8.364564895629883, "global_step": 55543, "epoch": 330} {"train_loss": -8.456144332885742, "global_step": 55544, "epoch": 330} {"train_loss": -8.677250862121582, "global_step": 55545, "epoch": 330} {"train_loss": -8.708074569702148, "global_step": 55546, "epoch": 330} {"train_loss": -8.468910217285156, "global_step": 55547, "epoch": 330} {"train_loss": -8.58375072479248, "global_step": 55548, "epoch": 330} {"train_loss": -8.642596244812012, "global_step": 55549, "epoch": 330} {"train_loss": -8.546674728393555, "global_step": 55550, "epoch": 330} {"train_loss": -8.747735977172852, "global_step": 55551, "epoch": 330} {"train_loss": -8.658473014831543, "global_step": 55552, "epoch": 330} {"train_loss": -8.703603744506836, "global_step": 55553, "epoch": 330} {"train_loss": -8.675604820251465, "global_step": 55554, "epoch": 330} {"train_loss": -8.584878921508789, "global_step": 55555, "epoch": 330} {"train_loss": -8.74078369140625, "global_step": 55556, "epoch": 330} {"train_loss": -8.699695587158203, "global_step": 55557, "epoch": 330} {"train_loss": -8.62853717803955, "global_step": 55558, "epoch": 330} {"train_loss": -8.801271438598633, "global_step": 55559, "epoch": 330} {"train_loss": -8.65735149383545, "global_step": 55560, "epoch": 330} {"train_loss": -8.662712097167969, "global_step": 55561, "epoch": 330} {"train_loss": -8.676959991455078, "global_step": 55562, "epoch": 330} {"train_loss": -8.453259468078613, "global_step": 55563, "epoch": 330} {"train_loss": -8.42878532409668, "global_step": 55564, "epoch": 330} {"train_loss": -8.147228240966797, "global_step": 55565, "epoch": 330} {"train_loss": -8.488222122192383, "global_step": 55566, "epoch": 330} {"train_loss": -8.386897087097168, "global_step": 55567, "epoch": 330} {"train_loss": -8.33462142944336, "global_step": 55568, "epoch": 330} {"train_loss": -8.403206825256348, "global_step": 55569, "epoch": 330} {"train_loss": -8.218815803527832, "global_step": 55570, "epoch": 330} {"train_loss": -8.213010787963867, "global_step": 55571, "epoch": 330} {"train_loss": -8.243642807006836, "global_step": 55572, "epoch": 330} {"train_loss": -8.350371360778809, "global_step": 55573, "epoch": 330} {"train_loss": -8.21214771270752, "global_step": 55574, "epoch": 330} {"train_loss": -8.156599044799805, "global_step": 55575, "epoch": 330} {"train_loss": -8.074551582336426, "global_step": 55576, "epoch": 330} {"train_loss": -8.195484161376953, "global_step": 55577, "epoch": 330} {"train_loss": -8.103134155273438, "global_step": 55578, "epoch": 330} {"train_loss": -8.298652648925781, "global_step": 55579, "epoch": 330} {"train_loss": -8.336141586303711, "global_step": 55580, "epoch": 330} {"train_loss": -8.363554000854492, "global_step": 55581, "epoch": 330} {"train_loss": -8.252113342285156, "global_step": 55582, "epoch": 330} {"train_loss": -8.287635803222656, "global_step": 55583, "epoch": 330} {"train_loss": -8.355096817016602, "global_step": 55584, "epoch": 330} {"train_loss": -8.295564651489258, "global_step": 55585, "epoch": 330} {"train_loss": -8.058477401733398, "global_step": 55586, "epoch": 330} {"train_loss": -8.407999038696289, "global_step": 55587, "epoch": 330} {"train_loss": -8.44947624206543, "global_step": 55588, "epoch": 330} {"train_loss": -8.27961540222168, "global_step": 55589, "epoch": 330} {"train_loss": -8.207844734191895, "global_step": 55590, "epoch": 330} {"train_loss": -8.462934494018555, "global_step": 55591, "epoch": 330} {"train_loss": -8.437556266784668, "global_step": 55592, "epoch": 330} {"train_loss": -8.2271089553833, "global_step": 55593, "epoch": 330} {"train_loss": -8.338618278503418, "global_step": 55594, "epoch": 330} {"train_loss": -8.392452239990234, "global_step": 55595, "epoch": 330} {"train_loss": -8.262121200561523, "global_step": 55596, "epoch": 330} {"train_loss": -8.491340637207031, "global_step": 55597, "epoch": 330} {"train_loss": -8.659574508666992, "global_step": 55598, "epoch": 330} {"train_loss": -8.433326721191406, "global_step": 55599, "epoch": 330} {"train_loss": -8.621161460876465, "global_step": 55600, "epoch": 330} {"train_loss": -8.586848258972168, "global_step": 55601, "epoch": 330} {"train_loss": -8.503828048706055, "global_step": 55602, "epoch": 330} {"train_loss": -8.57174015045166, "global_step": 55603, "epoch": 330} {"train_loss": -8.5440673828125, "global_step": 55604, "epoch": 330} {"train_loss": -8.727048873901367, "global_step": 55605, "epoch": 330} {"train_loss": -8.463489532470703, "global_step": 55606, "epoch": 330} {"train_loss": -8.474453999882652, "global_step": 55607, "epoch": 330, "val_loss": 191820.890625, "train_action_mse_error": 7.495290756225586} {"train_loss": -8.605793952941895, "global_step": 55608, "epoch": 331} {"train_loss": -8.60991096496582, "global_step": 55609, "epoch": 331} {"train_loss": -8.603513717651367, "global_step": 55610, "epoch": 331} {"train_loss": -8.638345718383789, "global_step": 55611, "epoch": 331} {"train_loss": -8.680326461791992, "global_step": 55612, "epoch": 331} {"train_loss": -8.584566116333008, "global_step": 55613, "epoch": 331} {"train_loss": -8.456025123596191, "global_step": 55614, "epoch": 331} {"train_loss": -8.690650939941406, "global_step": 55615, "epoch": 331} {"train_loss": -8.617534637451172, "global_step": 55616, "epoch": 331} {"train_loss": -8.508865356445312, "global_step": 55617, "epoch": 331} {"train_loss": -8.71155071258545, "global_step": 55618, "epoch": 331} {"train_loss": -8.484477043151855, "global_step": 55619, "epoch": 331} {"train_loss": -8.590901374816895, "global_step": 55620, "epoch": 331} {"train_loss": -8.51462173461914, "global_step": 55621, "epoch": 331} {"train_loss": -8.620054244995117, "global_step": 55622, "epoch": 331} {"train_loss": -8.294044494628906, "global_step": 55623, "epoch": 331} {"train_loss": -8.564029693603516, "global_step": 55624, "epoch": 331} {"train_loss": -8.637641906738281, "global_step": 55625, "epoch": 331} {"train_loss": -8.551055908203125, "global_step": 55626, "epoch": 331} {"train_loss": -8.592199325561523, "global_step": 55627, "epoch": 331} {"train_loss": -8.476125717163086, "global_step": 55628, "epoch": 331} {"train_loss": -8.619461059570312, "global_step": 55629, "epoch": 331} {"train_loss": -8.676473617553711, "global_step": 55630, "epoch": 331} {"train_loss": -8.492956161499023, "global_step": 55631, "epoch": 331} {"train_loss": -8.675872802734375, "global_step": 55632, "epoch": 331} {"train_loss": -8.4403657913208, "global_step": 55633, "epoch": 331} {"train_loss": -8.532564163208008, "global_step": 55634, "epoch": 331} {"train_loss": -8.400644302368164, "global_step": 55635, "epoch": 331} {"train_loss": -8.49105453491211, "global_step": 55636, "epoch": 331} {"train_loss": -8.659322738647461, "global_step": 55637, "epoch": 331} {"train_loss": -8.49592399597168, "global_step": 55638, "epoch": 331} {"train_loss": -8.77011489868164, "global_step": 55639, "epoch": 331} {"train_loss": -8.67808723449707, "global_step": 55640, "epoch": 331} {"train_loss": -8.421844482421875, "global_step": 55641, "epoch": 331} {"train_loss": -8.557647705078125, "global_step": 55642, "epoch": 331} {"train_loss": -8.114949226379395, "global_step": 55643, "epoch": 331} {"train_loss": -8.582839965820312, "global_step": 55644, "epoch": 331} {"train_loss": -7.999866008758545, "global_step": 55645, "epoch": 331} {"train_loss": -8.515820503234863, "global_step": 55646, "epoch": 331} {"train_loss": -8.361620903015137, "global_step": 55647, "epoch": 331} {"train_loss": -8.474050521850586, "global_step": 55648, "epoch": 331} {"train_loss": -8.350770950317383, "global_step": 55649, "epoch": 331} {"train_loss": -8.468997955322266, "global_step": 55650, "epoch": 331} {"train_loss": -8.331903457641602, "global_step": 55651, "epoch": 331} {"train_loss": -8.595974922180176, "global_step": 55652, "epoch": 331} {"train_loss": -8.390361785888672, "global_step": 55653, "epoch": 331} {"train_loss": -8.641246795654297, "global_step": 55654, "epoch": 331} {"train_loss": -8.362035751342773, "global_step": 55655, "epoch": 331} {"train_loss": -8.631874084472656, "global_step": 55656, "epoch": 331} {"train_loss": -8.173940658569336, "global_step": 55657, "epoch": 331} {"train_loss": -8.447583198547363, "global_step": 55658, "epoch": 331} {"train_loss": -8.623727798461914, "global_step": 55659, "epoch": 331} {"train_loss": -8.460525512695312, "global_step": 55660, "epoch": 331} {"train_loss": -8.615439414978027, "global_step": 55661, "epoch": 331} {"train_loss": -8.656927108764648, "global_step": 55662, "epoch": 331} {"train_loss": -8.49180793762207, "global_step": 55663, "epoch": 331} {"train_loss": -8.553254127502441, "global_step": 55664, "epoch": 331} {"train_loss": -8.800236701965332, "global_step": 55665, "epoch": 331} {"train_loss": -8.728967666625977, "global_step": 55666, "epoch": 331} {"train_loss": -8.56680679321289, "global_step": 55667, "epoch": 331} {"train_loss": -8.386015892028809, "global_step": 55668, "epoch": 331} {"train_loss": -8.601544380187988, "global_step": 55669, "epoch": 331} {"train_loss": -8.576272010803223, "global_step": 55670, "epoch": 331} {"train_loss": -8.571722984313965, "global_step": 55671, "epoch": 331} {"train_loss": -8.488298416137695, "global_step": 55672, "epoch": 331} {"train_loss": -8.611432075500488, "global_step": 55673, "epoch": 331} {"train_loss": -8.310277938842773, "global_step": 55674, "epoch": 331} {"train_loss": -8.538272857666016, "global_step": 55675, "epoch": 331} {"train_loss": -8.400442123413086, "global_step": 55676, "epoch": 331} {"train_loss": -8.779747009277344, "global_step": 55677, "epoch": 331} {"train_loss": -8.579964637756348, "global_step": 55678, "epoch": 331} {"train_loss": -8.382488250732422, "global_step": 55679, "epoch": 331} {"train_loss": -8.542947769165039, "global_step": 55680, "epoch": 331} {"train_loss": -8.58221435546875, "global_step": 55681, "epoch": 331} {"train_loss": -8.761198043823242, "global_step": 55682, "epoch": 331} {"train_loss": -8.663860321044922, "global_step": 55683, "epoch": 331} {"train_loss": -8.693187713623047, "global_step": 55684, "epoch": 331} {"train_loss": -8.709737777709961, "global_step": 55685, "epoch": 331} {"train_loss": -8.75105094909668, "global_step": 55686, "epoch": 331} {"train_loss": -8.673123359680176, "global_step": 55687, "epoch": 331} {"train_loss": -8.705829620361328, "global_step": 55688, "epoch": 331} {"train_loss": -8.57418441772461, "global_step": 55689, "epoch": 331} {"train_loss": -8.64558219909668, "global_step": 55690, "epoch": 331} {"train_loss": -8.609241485595703, "global_step": 55691, "epoch": 331} {"train_loss": -8.657779693603516, "global_step": 55692, "epoch": 331} {"train_loss": -8.695409774780273, "global_step": 55693, "epoch": 331} {"train_loss": -8.47503662109375, "global_step": 55694, "epoch": 331} {"train_loss": -8.296468734741211, "global_step": 55695, "epoch": 331} {"train_loss": -8.456802368164062, "global_step": 55696, "epoch": 331} {"train_loss": -8.611855506896973, "global_step": 55697, "epoch": 331} {"train_loss": -8.68097972869873, "global_step": 55698, "epoch": 331} {"train_loss": -8.375470161437988, "global_step": 55699, "epoch": 331} {"train_loss": -8.366687774658203, "global_step": 55700, "epoch": 331} {"train_loss": -8.54234504699707, "global_step": 55701, "epoch": 331} {"train_loss": -8.290053367614746, "global_step": 55702, "epoch": 331} {"train_loss": -8.101593017578125, "global_step": 55703, "epoch": 331} {"train_loss": -8.547562599182129, "global_step": 55704, "epoch": 331} {"train_loss": -8.157268524169922, "global_step": 55705, "epoch": 331} {"train_loss": -8.390063285827637, "global_step": 55706, "epoch": 331} {"train_loss": -8.283729553222656, "global_step": 55707, "epoch": 331} {"train_loss": -8.222793579101562, "global_step": 55708, "epoch": 331} {"train_loss": -8.150239944458008, "global_step": 55709, "epoch": 331} {"train_loss": -8.452780723571777, "global_step": 55710, "epoch": 331} {"train_loss": -8.339787483215332, "global_step": 55711, "epoch": 331} {"train_loss": -8.100586891174316, "global_step": 55712, "epoch": 331} {"train_loss": -8.15112590789795, "global_step": 55713, "epoch": 331} {"train_loss": -8.393739700317383, "global_step": 55714, "epoch": 331} {"train_loss": -8.31492805480957, "global_step": 55715, "epoch": 331} {"train_loss": -8.421972274780273, "global_step": 55716, "epoch": 331} {"train_loss": -8.552389144897461, "global_step": 55717, "epoch": 331} {"train_loss": -8.256790161132812, "global_step": 55718, "epoch": 331} {"train_loss": -8.300298690795898, "global_step": 55719, "epoch": 331} {"train_loss": -8.46373462677002, "global_step": 55720, "epoch": 331} {"train_loss": -8.318208694458008, "global_step": 55721, "epoch": 331} {"train_loss": -8.318321228027344, "global_step": 55722, "epoch": 331} {"train_loss": -8.40983772277832, "global_step": 55723, "epoch": 331} {"train_loss": -8.323578834533691, "global_step": 55724, "epoch": 331} {"train_loss": -8.480082511901855, "global_step": 55725, "epoch": 331} {"train_loss": -8.616767883300781, "global_step": 55726, "epoch": 331} {"train_loss": -8.670328140258789, "global_step": 55727, "epoch": 331} {"train_loss": -8.537450790405273, "global_step": 55728, "epoch": 331} {"train_loss": -8.563724517822266, "global_step": 55729, "epoch": 331} {"train_loss": -8.691080093383789, "global_step": 55730, "epoch": 331} {"train_loss": -8.343852043151855, "global_step": 55731, "epoch": 331} {"train_loss": -8.560345649719238, "global_step": 55732, "epoch": 331} {"train_loss": -8.550338745117188, "global_step": 55733, "epoch": 331} {"train_loss": -8.624197006225586, "global_step": 55734, "epoch": 331} {"train_loss": -8.563064575195312, "global_step": 55735, "epoch": 331} {"train_loss": -8.703643798828125, "global_step": 55736, "epoch": 331} {"train_loss": -8.374082565307617, "global_step": 55737, "epoch": 331} {"train_loss": -8.693785667419434, "global_step": 55738, "epoch": 331} {"train_loss": -8.61036491394043, "global_step": 55739, "epoch": 331} {"train_loss": -8.648574829101562, "global_step": 55740, "epoch": 331} {"train_loss": -8.665483474731445, "global_step": 55741, "epoch": 331} {"train_loss": -8.737987518310547, "global_step": 55742, "epoch": 331} {"train_loss": -8.549623489379883, "global_step": 55743, "epoch": 331} {"train_loss": -8.786476135253906, "global_step": 55744, "epoch": 331} {"train_loss": -8.575952529907227, "global_step": 55745, "epoch": 331} {"train_loss": -8.630130767822266, "global_step": 55746, "epoch": 331} {"train_loss": -8.340433120727539, "global_step": 55747, "epoch": 331} {"train_loss": -8.885071754455566, "global_step": 55748, "epoch": 331} {"train_loss": -8.499872207641602, "global_step": 55749, "epoch": 331} {"train_loss": -8.698553085327148, "global_step": 55750, "epoch": 331} {"train_loss": -8.310243606567383, "global_step": 55751, "epoch": 331} {"train_loss": -8.716804504394531, "global_step": 55752, "epoch": 331} {"train_loss": -8.847648620605469, "global_step": 55753, "epoch": 331} {"train_loss": -8.771650314331055, "global_step": 55754, "epoch": 331} {"train_loss": -8.604143142700195, "global_step": 55755, "epoch": 331} {"train_loss": -8.43142318725586, "global_step": 55756, "epoch": 331} {"train_loss": -8.372554779052734, "global_step": 55757, "epoch": 331} {"train_loss": -8.690208435058594, "global_step": 55758, "epoch": 331} {"train_loss": -8.733223915100098, "global_step": 55759, "epoch": 331} {"train_loss": -8.343008995056152, "global_step": 55760, "epoch": 331} {"train_loss": -8.737638473510742, "global_step": 55761, "epoch": 331} {"train_loss": -8.51189136505127, "global_step": 55762, "epoch": 331} {"train_loss": -8.556734085083008, "global_step": 55763, "epoch": 331} {"train_loss": -8.770983695983887, "global_step": 55764, "epoch": 331} {"train_loss": -8.585405349731445, "global_step": 55765, "epoch": 331} {"train_loss": -8.766630172729492, "global_step": 55766, "epoch": 331} {"train_loss": -8.623266220092773, "global_step": 55767, "epoch": 331} {"train_loss": -8.531509399414062, "global_step": 55768, "epoch": 331} {"train_loss": -8.630630493164062, "global_step": 55769, "epoch": 331} {"train_loss": -8.63803482055664, "global_step": 55770, "epoch": 331} {"train_loss": -8.406285285949707, "global_step": 55771, "epoch": 331} {"train_loss": -8.495674133300781, "global_step": 55772, "epoch": 331} {"train_loss": -8.540130615234375, "global_step": 55773, "epoch": 331} {"train_loss": -8.57583236694336, "global_step": 55774, "epoch": 331} {"train_loss": -8.52906315383457, "global_step": 55775, "epoch": 331, "val_loss": 189207.390625} {"train_loss": -8.38835334777832, "global_step": 55776, "epoch": 332} {"train_loss": -8.439144134521484, "global_step": 55777, "epoch": 332} {"train_loss": -8.425504684448242, "global_step": 55778, "epoch": 332} {"train_loss": -8.582366943359375, "global_step": 55779, "epoch": 332} {"train_loss": -8.43248176574707, "global_step": 55780, "epoch": 332} {"train_loss": -8.56568431854248, "global_step": 55781, "epoch": 332} {"train_loss": -8.255849838256836, "global_step": 55782, "epoch": 332} {"train_loss": -8.479161262512207, "global_step": 55783, "epoch": 332} {"train_loss": -8.652965545654297, "global_step": 55784, "epoch": 332} {"train_loss": -8.60720443725586, "global_step": 55785, "epoch": 332} {"train_loss": -8.655841827392578, "global_step": 55786, "epoch": 332} {"train_loss": -8.48272705078125, "global_step": 55787, "epoch": 332} {"train_loss": -8.538349151611328, "global_step": 55788, "epoch": 332} {"train_loss": -8.606842994689941, "global_step": 55789, "epoch": 332} {"train_loss": -8.411169052124023, "global_step": 55790, "epoch": 332} {"train_loss": -8.094561576843262, "global_step": 55791, "epoch": 332} {"train_loss": -8.591297149658203, "global_step": 55792, "epoch": 332} {"train_loss": -8.524904251098633, "global_step": 55793, "epoch": 332} {"train_loss": -8.490071296691895, "global_step": 55794, "epoch": 332} {"train_loss": -8.324533462524414, "global_step": 55795, "epoch": 332} {"train_loss": -8.177234649658203, "global_step": 55796, "epoch": 332} {"train_loss": -8.549723625183105, "global_step": 55797, "epoch": 332} {"train_loss": -8.408818244934082, "global_step": 55798, "epoch": 332} {"train_loss": -8.679661750793457, "global_step": 55799, "epoch": 332} {"train_loss": -8.441283226013184, "global_step": 55800, "epoch": 332} {"train_loss": -8.657447814941406, "global_step": 55801, "epoch": 332} {"train_loss": -8.545263290405273, "global_step": 55802, "epoch": 332} {"train_loss": -8.464513778686523, "global_step": 55803, "epoch": 332} {"train_loss": -8.572305679321289, "global_step": 55804, "epoch": 332} {"train_loss": -8.810418128967285, "global_step": 55805, "epoch": 332} {"train_loss": -8.52702522277832, "global_step": 55806, "epoch": 332} {"train_loss": -8.462666511535645, "global_step": 55807, "epoch": 332} {"train_loss": -8.48947525024414, "global_step": 55808, "epoch": 332} {"train_loss": -8.359312057495117, "global_step": 55809, "epoch": 332} {"train_loss": -8.623048782348633, "global_step": 55810, "epoch": 332} {"train_loss": -8.270185470581055, "global_step": 55811, "epoch": 332} {"train_loss": -8.195178985595703, "global_step": 55812, "epoch": 332} {"train_loss": -8.445099830627441, "global_step": 55813, "epoch": 332} {"train_loss": -8.435598373413086, "global_step": 55814, "epoch": 332} {"train_loss": -8.600175857543945, "global_step": 55815, "epoch": 332} {"train_loss": -8.446447372436523, "global_step": 55816, "epoch": 332} {"train_loss": -8.547220230102539, "global_step": 55817, "epoch": 332} {"train_loss": -8.361801147460938, "global_step": 55818, "epoch": 332} {"train_loss": -8.455320358276367, "global_step": 55819, "epoch": 332} {"train_loss": -8.452264785766602, "global_step": 55820, "epoch": 332} {"train_loss": -8.717531204223633, "global_step": 55821, "epoch": 332} {"train_loss": -8.474227905273438, "global_step": 55822, "epoch": 332} {"train_loss": -8.401823997497559, "global_step": 55823, "epoch": 332} {"train_loss": -8.550752639770508, "global_step": 55824, "epoch": 332} {"train_loss": -8.543144226074219, "global_step": 55825, "epoch": 332} {"train_loss": -8.639298439025879, "global_step": 55826, "epoch": 332} {"train_loss": -8.654056549072266, "global_step": 55827, "epoch": 332} {"train_loss": -8.691399574279785, "global_step": 55828, "epoch": 332} {"train_loss": -8.71851921081543, "global_step": 55829, "epoch": 332} {"train_loss": -8.71511459350586, "global_step": 55830, "epoch": 332} {"train_loss": -8.611797332763672, "global_step": 55831, "epoch": 332} {"train_loss": -8.645374298095703, "global_step": 55832, "epoch": 332} {"train_loss": -8.63909912109375, "global_step": 55833, "epoch": 332} {"train_loss": -8.721630096435547, "global_step": 55834, "epoch": 332} {"train_loss": -8.680767059326172, "global_step": 55835, "epoch": 332} {"train_loss": -8.672164916992188, "global_step": 55836, "epoch": 332} {"train_loss": -8.511089324951172, "global_step": 55837, "epoch": 332} {"train_loss": -8.73515510559082, "global_step": 55838, "epoch": 332} {"train_loss": -8.7681303024292, "global_step": 55839, "epoch": 332} {"train_loss": -8.689756393432617, "global_step": 55840, "epoch": 332} {"train_loss": -8.55829906463623, "global_step": 55841, "epoch": 332} {"train_loss": -8.772024154663086, "global_step": 55842, "epoch": 332} {"train_loss": -8.801071166992188, "global_step": 55843, "epoch": 332} {"train_loss": -8.53929328918457, "global_step": 55844, "epoch": 332} {"train_loss": -8.59871768951416, "global_step": 55845, "epoch": 332} {"train_loss": -8.756492614746094, "global_step": 55846, "epoch": 332} {"train_loss": -8.72743034362793, "global_step": 55847, "epoch": 332} {"train_loss": -8.768022537231445, "global_step": 55848, "epoch": 332} {"train_loss": -8.82805347442627, "global_step": 55849, "epoch": 332} {"train_loss": -8.632288932800293, "global_step": 55850, "epoch": 332} {"train_loss": -8.776090621948242, "global_step": 55851, "epoch": 332} {"train_loss": -8.684137344360352, "global_step": 55852, "epoch": 332} {"train_loss": -8.341224670410156, "global_step": 55853, "epoch": 332} {"train_loss": -8.627680778503418, "global_step": 55854, "epoch": 332} {"train_loss": -8.473047256469727, "global_step": 55855, "epoch": 332} {"train_loss": -8.655984878540039, "global_step": 55856, "epoch": 332} {"train_loss": -8.534591674804688, "global_step": 55857, "epoch": 332} {"train_loss": -8.494853973388672, "global_step": 55858, "epoch": 332} {"train_loss": -8.717339515686035, "global_step": 55859, "epoch": 332} {"train_loss": -8.500297546386719, "global_step": 55860, "epoch": 332} {"train_loss": -8.346380233764648, "global_step": 55861, "epoch": 332} {"train_loss": -8.36430835723877, "global_step": 55862, "epoch": 332} {"train_loss": -8.636805534362793, "global_step": 55863, "epoch": 332} {"train_loss": -8.405553817749023, "global_step": 55864, "epoch": 332} {"train_loss": -8.519200325012207, "global_step": 55865, "epoch": 332} {"train_loss": -8.562294006347656, "global_step": 55866, "epoch": 332} {"train_loss": -8.676794052124023, "global_step": 55867, "epoch": 332} {"train_loss": -8.396221160888672, "global_step": 55868, "epoch": 332} {"train_loss": -8.401641845703125, "global_step": 55869, "epoch": 332} {"train_loss": -8.547616958618164, "global_step": 55870, "epoch": 332} {"train_loss": -8.425182342529297, "global_step": 55871, "epoch": 332} {"train_loss": -8.345182418823242, "global_step": 55872, "epoch": 332} {"train_loss": -8.629044532775879, "global_step": 55873, "epoch": 332} {"train_loss": -8.208600044250488, "global_step": 55874, "epoch": 332} {"train_loss": -8.362286567687988, "global_step": 55875, "epoch": 332} {"train_loss": -8.462461471557617, "global_step": 55876, "epoch": 332} {"train_loss": -8.490033149719238, "global_step": 55877, "epoch": 332} {"train_loss": -8.28714370727539, "global_step": 55878, "epoch": 332} {"train_loss": -8.504950523376465, "global_step": 55879, "epoch": 332} {"train_loss": -8.644824028015137, "global_step": 55880, "epoch": 332} {"train_loss": -8.17072868347168, "global_step": 55881, "epoch": 332} {"train_loss": -8.486717224121094, "global_step": 55882, "epoch": 332} {"train_loss": -8.379899978637695, "global_step": 55883, "epoch": 332} {"train_loss": -8.326370239257812, "global_step": 55884, "epoch": 332} {"train_loss": -8.20051383972168, "global_step": 55885, "epoch": 332} {"train_loss": -8.13998031616211, "global_step": 55886, "epoch": 332} {"train_loss": -8.452590942382812, "global_step": 55887, "epoch": 332} {"train_loss": -8.189960479736328, "global_step": 55888, "epoch": 332} {"train_loss": -8.195542335510254, "global_step": 55889, "epoch": 332} {"train_loss": -8.337099075317383, "global_step": 55890, "epoch": 332} {"train_loss": -8.461891174316406, "global_step": 55891, "epoch": 332} {"train_loss": -8.41693115234375, "global_step": 55892, "epoch": 332} {"train_loss": -8.508256912231445, "global_step": 55893, "epoch": 332} {"train_loss": -8.302026748657227, "global_step": 55894, "epoch": 332} {"train_loss": -8.510276794433594, "global_step": 55895, "epoch": 332} {"train_loss": -8.311305046081543, "global_step": 55896, "epoch": 332} {"train_loss": -8.629793167114258, "global_step": 55897, "epoch": 332} {"train_loss": -8.602039337158203, "global_step": 55898, "epoch": 332} {"train_loss": -8.667882919311523, "global_step": 55899, "epoch": 332} {"train_loss": -8.531486511230469, "global_step": 55900, "epoch": 332} {"train_loss": -8.320662498474121, "global_step": 55901, "epoch": 332} {"train_loss": -8.638627052307129, "global_step": 55902, "epoch": 332} {"train_loss": -8.654865264892578, "global_step": 55903, "epoch": 332} {"train_loss": -8.686762809753418, "global_step": 55904, "epoch": 332} {"train_loss": -8.565725326538086, "global_step": 55905, "epoch": 332} {"train_loss": -8.529606819152832, "global_step": 55906, "epoch": 332} {"train_loss": -8.634902954101562, "global_step": 55907, "epoch": 332} {"train_loss": -8.601884841918945, "global_step": 55908, "epoch": 332} {"train_loss": -8.514446258544922, "global_step": 55909, "epoch": 332} {"train_loss": -8.69528579711914, "global_step": 55910, "epoch": 332} {"train_loss": -8.69508171081543, "global_step": 55911, "epoch": 332} {"train_loss": -8.544620513916016, "global_step": 55912, "epoch": 332} {"train_loss": -8.658575057983398, "global_step": 55913, "epoch": 332} {"train_loss": -8.426023483276367, "global_step": 55914, "epoch": 332} {"train_loss": -8.699335098266602, "global_step": 55915, "epoch": 332} {"train_loss": -8.615758895874023, "global_step": 55916, "epoch": 332} {"train_loss": -8.232582092285156, "global_step": 55917, "epoch": 332} {"train_loss": -8.675774574279785, "global_step": 55918, "epoch": 332} {"train_loss": -8.444236755371094, "global_step": 55919, "epoch": 332} {"train_loss": -8.47511100769043, "global_step": 55920, "epoch": 332} {"train_loss": -8.295364379882812, "global_step": 55921, "epoch": 332} {"train_loss": -8.687080383300781, "global_step": 55922, "epoch": 332} {"train_loss": -8.58360481262207, "global_step": 55923, "epoch": 332} {"train_loss": -8.771626472473145, "global_step": 55924, "epoch": 332} {"train_loss": -8.624326705932617, "global_step": 55925, "epoch": 332} {"train_loss": -8.59115219116211, "global_step": 55926, "epoch": 332} {"train_loss": -8.739832878112793, "global_step": 55927, "epoch": 332} {"train_loss": -8.514047622680664, "global_step": 55928, "epoch": 332} {"train_loss": -8.827325820922852, "global_step": 55929, "epoch": 332} {"train_loss": -8.61132526397705, "global_step": 55930, "epoch": 332} {"train_loss": -8.730838775634766, "global_step": 55931, "epoch": 332} {"train_loss": -8.671831130981445, "global_step": 55932, "epoch": 332} {"train_loss": -8.454498291015625, "global_step": 55933, "epoch": 332} {"train_loss": -8.731379508972168, "global_step": 55934, "epoch": 332} {"train_loss": -8.509525299072266, "global_step": 55935, "epoch": 332} {"train_loss": -8.689743041992188, "global_step": 55936, "epoch": 332} {"train_loss": -8.763017654418945, "global_step": 55937, "epoch": 332} {"train_loss": -8.523672103881836, "global_step": 55938, "epoch": 332} {"train_loss": -8.40610122680664, "global_step": 55939, "epoch": 332} {"train_loss": -8.484004974365234, "global_step": 55940, "epoch": 332} {"train_loss": -8.25042724609375, "global_step": 55941, "epoch": 332} {"train_loss": -7.954488754272461, "global_step": 55942, "epoch": 332} {"train_loss": -8.52612700916472, "global_step": 55943, "epoch": 332, "val_loss": 188868.265625} {"train_loss": -8.073533058166504, "global_step": 55944, "epoch": 333} {"train_loss": -7.805972576141357, "global_step": 55945, "epoch": 333} {"train_loss": -7.879593372344971, "global_step": 55946, "epoch": 333} {"train_loss": -7.913091659545898, "global_step": 55947, "epoch": 333} {"train_loss": -7.877476692199707, "global_step": 55948, "epoch": 333} {"train_loss": -8.301365852355957, "global_step": 55949, "epoch": 333} {"train_loss": -8.256092071533203, "global_step": 55950, "epoch": 333} {"train_loss": -7.990103721618652, "global_step": 55951, "epoch": 333} {"train_loss": -7.9554219245910645, "global_step": 55952, "epoch": 333} {"train_loss": -8.230801582336426, "global_step": 55953, "epoch": 333} {"train_loss": -8.201738357543945, "global_step": 55954, "epoch": 333} {"train_loss": -7.943368434906006, "global_step": 55955, "epoch": 333} {"train_loss": -7.948369026184082, "global_step": 55956, "epoch": 333} {"train_loss": -8.297882080078125, "global_step": 55957, "epoch": 333} {"train_loss": -8.128424644470215, "global_step": 55958, "epoch": 333} {"train_loss": -7.897801876068115, "global_step": 55959, "epoch": 333} {"train_loss": -7.952398300170898, "global_step": 55960, "epoch": 333} {"train_loss": -8.208723068237305, "global_step": 55961, "epoch": 333} {"train_loss": -8.150078773498535, "global_step": 55962, "epoch": 333} {"train_loss": -8.1559419631958, "global_step": 55963, "epoch": 333} {"train_loss": -8.274249076843262, "global_step": 55964, "epoch": 333} {"train_loss": -8.243066787719727, "global_step": 55965, "epoch": 333} {"train_loss": -8.354944229125977, "global_step": 55966, "epoch": 333} {"train_loss": -8.280381202697754, "global_step": 55967, "epoch": 333} {"train_loss": -8.30130386352539, "global_step": 55968, "epoch": 333} {"train_loss": -8.416526794433594, "global_step": 55969, "epoch": 333} {"train_loss": -8.481507301330566, "global_step": 55970, "epoch": 333} {"train_loss": -8.414506912231445, "global_step": 55971, "epoch": 333} {"train_loss": -8.642213821411133, "global_step": 55972, "epoch": 333} {"train_loss": -8.574275970458984, "global_step": 55973, "epoch": 333} {"train_loss": -8.306745529174805, "global_step": 55974, "epoch": 333} {"train_loss": -8.420063018798828, "global_step": 55975, "epoch": 333} {"train_loss": -8.552940368652344, "global_step": 55976, "epoch": 333} {"train_loss": -8.610427856445312, "global_step": 55977, "epoch": 333} {"train_loss": -8.481634140014648, "global_step": 55978, "epoch": 333} {"train_loss": -8.544695854187012, "global_step": 55979, "epoch": 333} {"train_loss": -8.37641716003418, "global_step": 55980, "epoch": 333} {"train_loss": -8.709624290466309, "global_step": 55981, "epoch": 333} {"train_loss": -8.244607925415039, "global_step": 55982, "epoch": 333} {"train_loss": -8.580239295959473, "global_step": 55983, "epoch": 333} {"train_loss": -8.533453941345215, "global_step": 55984, "epoch": 333} {"train_loss": -8.573869705200195, "global_step": 55985, "epoch": 333} {"train_loss": -8.539070129394531, "global_step": 55986, "epoch": 333} {"train_loss": -8.757497787475586, "global_step": 55987, "epoch": 333} {"train_loss": -8.3353910446167, "global_step": 55988, "epoch": 333} {"train_loss": -8.673535346984863, "global_step": 55989, "epoch": 333} {"train_loss": -8.389341354370117, "global_step": 55990, "epoch": 333} {"train_loss": -8.453782081604004, "global_step": 55991, "epoch": 333} {"train_loss": -8.384149551391602, "global_step": 55992, "epoch": 333} {"train_loss": -8.185745239257812, "global_step": 55993, "epoch": 333} {"train_loss": -8.384140014648438, "global_step": 55994, "epoch": 333} {"train_loss": -8.633769989013672, "global_step": 55995, "epoch": 333} {"train_loss": -8.151042938232422, "global_step": 55996, "epoch": 333} {"train_loss": -8.60393238067627, "global_step": 55997, "epoch": 333} {"train_loss": -8.074176788330078, "global_step": 55998, "epoch": 333} {"train_loss": -8.187675476074219, "global_step": 55999, "epoch": 333} {"train_loss": -8.265955924987793, "global_step": 56000, "epoch": 333} {"train_loss": -8.178764343261719, "global_step": 56001, "epoch": 333} {"train_loss": -8.432920455932617, "global_step": 56002, "epoch": 333} {"train_loss": -8.195194244384766, "global_step": 56003, "epoch": 333} {"train_loss": -8.482772827148438, "global_step": 56004, "epoch": 333} {"train_loss": -8.299354553222656, "global_step": 56005, "epoch": 333} {"train_loss": -8.29873275756836, "global_step": 56006, "epoch": 333} {"train_loss": -8.505489349365234, "global_step": 56007, "epoch": 333} {"train_loss": -8.260337829589844, "global_step": 56008, "epoch": 333} {"train_loss": -8.521415710449219, "global_step": 56009, "epoch": 333} {"train_loss": -8.429019927978516, "global_step": 56010, "epoch": 333} {"train_loss": -8.403152465820312, "global_step": 56011, "epoch": 333} {"train_loss": -8.419509887695312, "global_step": 56012, "epoch": 333} {"train_loss": -8.383943557739258, "global_step": 56013, "epoch": 333} {"train_loss": -8.494443893432617, "global_step": 56014, "epoch": 333} {"train_loss": -8.36033821105957, "global_step": 56015, "epoch": 333} {"train_loss": -8.8706693649292, "global_step": 56016, "epoch": 333} {"train_loss": -8.664493560791016, "global_step": 56017, "epoch": 333} {"train_loss": -8.554986953735352, "global_step": 56018, "epoch": 333} {"train_loss": -8.536109924316406, "global_step": 56019, "epoch": 333} {"train_loss": -8.522612571716309, "global_step": 56020, "epoch": 333} {"train_loss": -8.55765438079834, "global_step": 56021, "epoch": 333} {"train_loss": -8.865511894226074, "global_step": 56022, "epoch": 333} {"train_loss": -8.690923690795898, "global_step": 56023, "epoch": 333} {"train_loss": -8.669593811035156, "global_step": 56024, "epoch": 333} {"train_loss": -8.721475601196289, "global_step": 56025, "epoch": 333} {"train_loss": -8.80720329284668, "global_step": 56026, "epoch": 333} {"train_loss": -8.766240119934082, "global_step": 56027, "epoch": 333} {"train_loss": -8.722206115722656, "global_step": 56028, "epoch": 333} {"train_loss": -8.736028671264648, "global_step": 56029, "epoch": 333} {"train_loss": -8.84818172454834, "global_step": 56030, "epoch": 333} {"train_loss": -8.715764999389648, "global_step": 56031, "epoch": 333} {"train_loss": -8.599861145019531, "global_step": 56032, "epoch": 333} {"train_loss": -8.689982414245605, "global_step": 56033, "epoch": 333} {"train_loss": -8.480741500854492, "global_step": 56034, "epoch": 333} {"train_loss": -8.736854553222656, "global_step": 56035, "epoch": 333} {"train_loss": -8.815146446228027, "global_step": 56036, "epoch": 333} {"train_loss": -8.204652786254883, "global_step": 56037, "epoch": 333} {"train_loss": -8.623651504516602, "global_step": 56038, "epoch": 333} {"train_loss": -8.387674331665039, "global_step": 56039, "epoch": 333} {"train_loss": -8.372034072875977, "global_step": 56040, "epoch": 333} {"train_loss": -8.589117050170898, "global_step": 56041, "epoch": 333} {"train_loss": -8.353792190551758, "global_step": 56042, "epoch": 333} {"train_loss": -8.537628173828125, "global_step": 56043, "epoch": 333} {"train_loss": -8.329497337341309, "global_step": 56044, "epoch": 333} {"train_loss": -8.39597225189209, "global_step": 56045, "epoch": 333} {"train_loss": -8.669631958007812, "global_step": 56046, "epoch": 333} {"train_loss": -8.301790237426758, "global_step": 56047, "epoch": 333} {"train_loss": -8.350387573242188, "global_step": 56048, "epoch": 333} {"train_loss": -8.80523681640625, "global_step": 56049, "epoch": 333} {"train_loss": -8.396855354309082, "global_step": 56050, "epoch": 333} {"train_loss": -8.480508804321289, "global_step": 56051, "epoch": 333} {"train_loss": -8.625991821289062, "global_step": 56052, "epoch": 333} {"train_loss": -8.46938705444336, "global_step": 56053, "epoch": 333} {"train_loss": -8.469598770141602, "global_step": 56054, "epoch": 333} {"train_loss": -8.420503616333008, "global_step": 56055, "epoch": 333} {"train_loss": -8.519262313842773, "global_step": 56056, "epoch": 333} {"train_loss": -8.407413482666016, "global_step": 56057, "epoch": 333} {"train_loss": -8.305875778198242, "global_step": 56058, "epoch": 333} {"train_loss": -8.552253723144531, "global_step": 56059, "epoch": 333} {"train_loss": -8.424461364746094, "global_step": 56060, "epoch": 333} {"train_loss": -8.31904411315918, "global_step": 56061, "epoch": 333} {"train_loss": -8.70805549621582, "global_step": 56062, "epoch": 333} {"train_loss": -8.414463996887207, "global_step": 56063, "epoch": 333} {"train_loss": -8.492687225341797, "global_step": 56064, "epoch": 333} {"train_loss": -8.380546569824219, "global_step": 56065, "epoch": 333} {"train_loss": -8.447216987609863, "global_step": 56066, "epoch": 333} {"train_loss": -8.557788848876953, "global_step": 56067, "epoch": 333} {"train_loss": -8.620101928710938, "global_step": 56068, "epoch": 333} {"train_loss": -8.645249366760254, "global_step": 56069, "epoch": 333} {"train_loss": -8.294504165649414, "global_step": 56070, "epoch": 333} {"train_loss": -8.576156616210938, "global_step": 56071, "epoch": 333} {"train_loss": -8.71249771118164, "global_step": 56072, "epoch": 333} {"train_loss": -8.601879119873047, "global_step": 56073, "epoch": 333} {"train_loss": -8.763051986694336, "global_step": 56074, "epoch": 333} {"train_loss": -8.692911148071289, "global_step": 56075, "epoch": 333} {"train_loss": -8.802739143371582, "global_step": 56076, "epoch": 333} {"train_loss": -8.646234512329102, "global_step": 56077, "epoch": 333} {"train_loss": -8.791176795959473, "global_step": 56078, "epoch": 333} {"train_loss": -8.71606731414795, "global_step": 56079, "epoch": 333} {"train_loss": -8.589273452758789, "global_step": 56080, "epoch": 333} {"train_loss": -8.835620880126953, "global_step": 56081, "epoch": 333} {"train_loss": -8.63787841796875, "global_step": 56082, "epoch": 333} {"train_loss": -8.44019889831543, "global_step": 56083, "epoch": 333} {"train_loss": -8.584424018859863, "global_step": 56084, "epoch": 333} {"train_loss": -8.488605499267578, "global_step": 56085, "epoch": 333} {"train_loss": -8.74577522277832, "global_step": 56086, "epoch": 333} {"train_loss": -8.433956146240234, "global_step": 56087, "epoch": 333} {"train_loss": -8.629416465759277, "global_step": 56088, "epoch": 333} {"train_loss": -8.429940223693848, "global_step": 56089, "epoch": 333} {"train_loss": -8.532411575317383, "global_step": 56090, "epoch": 333} {"train_loss": -8.437725067138672, "global_step": 56091, "epoch": 333} {"train_loss": -8.526209831237793, "global_step": 56092, "epoch": 333} {"train_loss": -8.773714065551758, "global_step": 56093, "epoch": 333} {"train_loss": -8.485477447509766, "global_step": 56094, "epoch": 333} {"train_loss": -8.703714370727539, "global_step": 56095, "epoch": 333} {"train_loss": -8.725688934326172, "global_step": 56096, "epoch": 333} {"train_loss": -8.7935791015625, "global_step": 56097, "epoch": 333} {"train_loss": -8.66257381439209, "global_step": 56098, "epoch": 333} {"train_loss": -8.465499877929688, "global_step": 56099, "epoch": 333} {"train_loss": -8.380373001098633, "global_step": 56100, "epoch": 333} {"train_loss": -8.199726104736328, "global_step": 56101, "epoch": 333} {"train_loss": -8.611631393432617, "global_step": 56102, "epoch": 333} {"train_loss": -8.210882186889648, "global_step": 56103, "epoch": 333} {"train_loss": -8.450226783752441, "global_step": 56104, "epoch": 333} {"train_loss": -8.41879940032959, "global_step": 56105, "epoch": 333} {"train_loss": -8.368305206298828, "global_step": 56106, "epoch": 333} {"train_loss": -8.692584037780762, "global_step": 56107, "epoch": 333} {"train_loss": -8.565812110900879, "global_step": 56108, "epoch": 333} {"train_loss": -8.270190238952637, "global_step": 56109, "epoch": 333} {"train_loss": -8.46509075164795, "global_step": 56110, "epoch": 333} {"train_loss": -8.454017698764801, "global_step": 56111, "epoch": 333, "val_loss": 190663.9375} {"train_loss": -8.407571792602539, "global_step": 56112, "epoch": 334} {"train_loss": -8.707170486450195, "global_step": 56113, "epoch": 334} {"train_loss": -8.41281509399414, "global_step": 56114, "epoch": 334} {"train_loss": -8.35275650024414, "global_step": 56115, "epoch": 334} {"train_loss": -8.487064361572266, "global_step": 56116, "epoch": 334} {"train_loss": -8.237749099731445, "global_step": 56117, "epoch": 334} {"train_loss": -8.34280776977539, "global_step": 56118, "epoch": 334} {"train_loss": -8.528982162475586, "global_step": 56119, "epoch": 334} {"train_loss": -8.066354751586914, "global_step": 56120, "epoch": 334} {"train_loss": -8.494979858398438, "global_step": 56121, "epoch": 334} {"train_loss": -8.573478698730469, "global_step": 56122, "epoch": 334} {"train_loss": -8.36593246459961, "global_step": 56123, "epoch": 334} {"train_loss": -8.3922700881958, "global_step": 56124, "epoch": 334} {"train_loss": -8.319758415222168, "global_step": 56125, "epoch": 334} {"train_loss": -8.506258964538574, "global_step": 56126, "epoch": 334} {"train_loss": -8.41276741027832, "global_step": 56127, "epoch": 334} {"train_loss": -8.661839485168457, "global_step": 56128, "epoch": 334} {"train_loss": -8.348876953125, "global_step": 56129, "epoch": 334} {"train_loss": -8.268686294555664, "global_step": 56130, "epoch": 334} {"train_loss": -8.390636444091797, "global_step": 56131, "epoch": 334} {"train_loss": -8.500101089477539, "global_step": 56132, "epoch": 334} {"train_loss": -8.211872100830078, "global_step": 56133, "epoch": 334} {"train_loss": -8.346263885498047, "global_step": 56134, "epoch": 334} {"train_loss": -8.45687198638916, "global_step": 56135, "epoch": 334} {"train_loss": -8.498300552368164, "global_step": 56136, "epoch": 334} {"train_loss": -8.398904800415039, "global_step": 56137, "epoch": 334} {"train_loss": -8.169791221618652, "global_step": 56138, "epoch": 334} {"train_loss": -8.520370483398438, "global_step": 56139, "epoch": 334} {"train_loss": -8.339616775512695, "global_step": 56140, "epoch": 334} {"train_loss": -8.92326545715332, "global_step": 56141, "epoch": 334} {"train_loss": -8.372566223144531, "global_step": 56142, "epoch": 334} {"train_loss": -8.816278457641602, "global_step": 56143, "epoch": 334} {"train_loss": -8.62875747680664, "global_step": 56144, "epoch": 334} {"train_loss": -8.64056396484375, "global_step": 56145, "epoch": 334} {"train_loss": -8.513021469116211, "global_step": 56146, "epoch": 334} {"train_loss": -8.771517753601074, "global_step": 56147, "epoch": 334} {"train_loss": -8.38436508178711, "global_step": 56148, "epoch": 334} {"train_loss": -8.615789413452148, "global_step": 56149, "epoch": 334} {"train_loss": -8.65666389465332, "global_step": 56150, "epoch": 334} {"train_loss": -8.79495906829834, "global_step": 56151, "epoch": 334} {"train_loss": -8.588393211364746, "global_step": 56152, "epoch": 334} {"train_loss": -8.890312194824219, "global_step": 56153, "epoch": 334} {"train_loss": -8.79588508605957, "global_step": 56154, "epoch": 334} {"train_loss": -8.949531555175781, "global_step": 56155, "epoch": 334} {"train_loss": -8.616080284118652, "global_step": 56156, "epoch": 334} {"train_loss": -8.762386322021484, "global_step": 56157, "epoch": 334} {"train_loss": -8.785209655761719, "global_step": 56158, "epoch": 334} {"train_loss": -8.660633087158203, "global_step": 56159, "epoch": 334} {"train_loss": -8.700122833251953, "global_step": 56160, "epoch": 334} {"train_loss": -8.474187850952148, "global_step": 56161, "epoch": 334} {"train_loss": -8.630487442016602, "global_step": 56162, "epoch": 334} {"train_loss": -8.321846008300781, "global_step": 56163, "epoch": 334} {"train_loss": -8.392797470092773, "global_step": 56164, "epoch": 334} {"train_loss": -7.810434341430664, "global_step": 56165, "epoch": 334} {"train_loss": -8.195930480957031, "global_step": 56166, "epoch": 334} {"train_loss": -7.54075813293457, "global_step": 56167, "epoch": 334} {"train_loss": -7.951532363891602, "global_step": 56168, "epoch": 334} {"train_loss": -7.830148696899414, "global_step": 56169, "epoch": 334} {"train_loss": -8.17626667022705, "global_step": 56170, "epoch": 334} {"train_loss": -7.95872688293457, "global_step": 56171, "epoch": 334} {"train_loss": -8.22510814666748, "global_step": 56172, "epoch": 334} {"train_loss": -7.811053276062012, "global_step": 56173, "epoch": 334} {"train_loss": -8.34937858581543, "global_step": 56174, "epoch": 334} {"train_loss": -8.069594383239746, "global_step": 56175, "epoch": 334} {"train_loss": -8.028829574584961, "global_step": 56176, "epoch": 334} {"train_loss": -8.045221328735352, "global_step": 56177, "epoch": 334} {"train_loss": -8.27452564239502, "global_step": 56178, "epoch": 334} {"train_loss": -8.249640464782715, "global_step": 56179, "epoch": 334} {"train_loss": -8.369377136230469, "global_step": 56180, "epoch": 334} {"train_loss": -8.093220710754395, "global_step": 56181, "epoch": 334} {"train_loss": -8.203638076782227, "global_step": 56182, "epoch": 334} {"train_loss": -8.274343490600586, "global_step": 56183, "epoch": 334} {"train_loss": -8.240711212158203, "global_step": 56184, "epoch": 334} {"train_loss": -8.229169845581055, "global_step": 56185, "epoch": 334} {"train_loss": -8.312372207641602, "global_step": 56186, "epoch": 334} {"train_loss": -8.370047569274902, "global_step": 56187, "epoch": 334} {"train_loss": -8.329854965209961, "global_step": 56188, "epoch": 334} {"train_loss": -8.320088386535645, "global_step": 56189, "epoch": 334} {"train_loss": -8.192809104919434, "global_step": 56190, "epoch": 334} {"train_loss": -8.404233932495117, "global_step": 56191, "epoch": 334} {"train_loss": -8.333882331848145, "global_step": 56192, "epoch": 334} {"train_loss": -8.444923400878906, "global_step": 56193, "epoch": 334} {"train_loss": -8.483987808227539, "global_step": 56194, "epoch": 334} {"train_loss": -8.420511245727539, "global_step": 56195, "epoch": 334} {"train_loss": -8.37811279296875, "global_step": 56196, "epoch": 334} {"train_loss": -8.36677360534668, "global_step": 56197, "epoch": 334} {"train_loss": -8.570589065551758, "global_step": 56198, "epoch": 334} {"train_loss": -8.548733711242676, "global_step": 56199, "epoch": 334} {"train_loss": -8.228784561157227, "global_step": 56200, "epoch": 334} {"train_loss": -8.814008712768555, "global_step": 56201, "epoch": 334} {"train_loss": -8.600037574768066, "global_step": 56202, "epoch": 334} {"train_loss": -8.809715270996094, "global_step": 56203, "epoch": 334} {"train_loss": -8.640487670898438, "global_step": 56204, "epoch": 334} {"train_loss": -8.652822494506836, "global_step": 56205, "epoch": 334} {"train_loss": -8.535268783569336, "global_step": 56206, "epoch": 334} {"train_loss": -8.450262069702148, "global_step": 56207, "epoch": 334} {"train_loss": -8.542753219604492, "global_step": 56208, "epoch": 334} {"train_loss": -8.328596115112305, "global_step": 56209, "epoch": 334} {"train_loss": -8.34749984741211, "global_step": 56210, "epoch": 334} {"train_loss": -8.301878929138184, "global_step": 56211, "epoch": 334} {"train_loss": -8.56004524230957, "global_step": 56212, "epoch": 334} {"train_loss": -8.27866268157959, "global_step": 56213, "epoch": 334} {"train_loss": -8.171832084655762, "global_step": 56214, "epoch": 334} {"train_loss": -8.721699714660645, "global_step": 56215, "epoch": 334} {"train_loss": -8.261127471923828, "global_step": 56216, "epoch": 334} {"train_loss": -8.208612442016602, "global_step": 56217, "epoch": 334} {"train_loss": -8.653212547302246, "global_step": 56218, "epoch": 334} {"train_loss": -8.413875579833984, "global_step": 56219, "epoch": 334} {"train_loss": -8.633721351623535, "global_step": 56220, "epoch": 334} {"train_loss": -8.281116485595703, "global_step": 56221, "epoch": 334} {"train_loss": -8.414310455322266, "global_step": 56222, "epoch": 334} {"train_loss": -8.271461486816406, "global_step": 56223, "epoch": 334} {"train_loss": -8.454985618591309, "global_step": 56224, "epoch": 334} {"train_loss": -8.408096313476562, "global_step": 56225, "epoch": 334} {"train_loss": -8.602690696716309, "global_step": 56226, "epoch": 334} {"train_loss": -8.440454483032227, "global_step": 56227, "epoch": 334} {"train_loss": -8.426301956176758, "global_step": 56228, "epoch": 334} {"train_loss": -8.509807586669922, "global_step": 56229, "epoch": 334} {"train_loss": -8.312182426452637, "global_step": 56230, "epoch": 334} {"train_loss": -8.216771125793457, "global_step": 56231, "epoch": 334} {"train_loss": -8.699223518371582, "global_step": 56232, "epoch": 334} {"train_loss": -8.352787017822266, "global_step": 56233, "epoch": 334} {"train_loss": -8.513544082641602, "global_step": 56234, "epoch": 334} {"train_loss": -8.68113899230957, "global_step": 56235, "epoch": 334} {"train_loss": -8.444219589233398, "global_step": 56236, "epoch": 334} {"train_loss": -8.627999305725098, "global_step": 56237, "epoch": 334} {"train_loss": -8.437637329101562, "global_step": 56238, "epoch": 334} {"train_loss": -8.471976280212402, "global_step": 56239, "epoch": 334} {"train_loss": -8.545390129089355, "global_step": 56240, "epoch": 334} {"train_loss": -8.564632415771484, "global_step": 56241, "epoch": 334} {"train_loss": -8.372344970703125, "global_step": 56242, "epoch": 334} {"train_loss": -8.611207962036133, "global_step": 56243, "epoch": 334} {"train_loss": -8.664684295654297, "global_step": 56244, "epoch": 334} {"train_loss": -8.653181076049805, "global_step": 56245, "epoch": 334} {"train_loss": -8.652059555053711, "global_step": 56246, "epoch": 334} {"train_loss": -8.738717079162598, "global_step": 56247, "epoch": 334} {"train_loss": -8.571727752685547, "global_step": 56248, "epoch": 334} {"train_loss": -8.739081382751465, "global_step": 56249, "epoch": 334} {"train_loss": -8.498424530029297, "global_step": 56250, "epoch": 334} {"train_loss": -8.64137077331543, "global_step": 56251, "epoch": 334} {"train_loss": -8.55188274383545, "global_step": 56252, "epoch": 334} {"train_loss": -8.778787612915039, "global_step": 56253, "epoch": 334} {"train_loss": -8.484813690185547, "global_step": 56254, "epoch": 334} {"train_loss": -8.827866554260254, "global_step": 56255, "epoch": 334} {"train_loss": -8.671854019165039, "global_step": 56256, "epoch": 334} {"train_loss": -8.449592590332031, "global_step": 56257, "epoch": 334} {"train_loss": -8.827960968017578, "global_step": 56258, "epoch": 334} {"train_loss": -8.434516906738281, "global_step": 56259, "epoch": 334} {"train_loss": -8.734291076660156, "global_step": 56260, "epoch": 334} {"train_loss": -8.550899505615234, "global_step": 56261, "epoch": 334} {"train_loss": -8.586431503295898, "global_step": 56262, "epoch": 334} {"train_loss": -8.833626747131348, "global_step": 56263, "epoch": 334} {"train_loss": -8.676132202148438, "global_step": 56264, "epoch": 334} {"train_loss": -8.493610382080078, "global_step": 56265, "epoch": 334} {"train_loss": -8.50882339477539, "global_step": 56266, "epoch": 334} {"train_loss": -8.437832832336426, "global_step": 56267, "epoch": 334} {"train_loss": -8.352739334106445, "global_step": 56268, "epoch": 334} {"train_loss": -8.427385330200195, "global_step": 56269, "epoch": 334} {"train_loss": -8.3954496383667, "global_step": 56270, "epoch": 334} {"train_loss": -8.492798805236816, "global_step": 56271, "epoch": 334} {"train_loss": -8.163558959960938, "global_step": 56272, "epoch": 334} {"train_loss": -8.317167282104492, "global_step": 56273, "epoch": 334} {"train_loss": -8.167041778564453, "global_step": 56274, "epoch": 334} {"train_loss": -8.383988380432129, "global_step": 56275, "epoch": 334} {"train_loss": -8.342292785644531, "global_step": 56276, "epoch": 334} {"train_loss": -8.3606538772583, "global_step": 56277, "epoch": 334} {"train_loss": -8.58829402923584, "global_step": 56278, "epoch": 334} {"train_loss": -8.446096181869507, "global_step": 56279, "epoch": 334, "val_loss": 189382.671875} {"train_loss": -8.295143127441406, "global_step": 56280, "epoch": 335} {"train_loss": -8.393062591552734, "global_step": 56281, "epoch": 335} {"train_loss": -8.29325008392334, "global_step": 56282, "epoch": 335} {"train_loss": -8.287177085876465, "global_step": 56283, "epoch": 335} {"train_loss": -8.5278902053833, "global_step": 56284, "epoch": 335} {"train_loss": -8.351207733154297, "global_step": 56285, "epoch": 335} {"train_loss": -8.383136749267578, "global_step": 56286, "epoch": 335} {"train_loss": -8.247406959533691, "global_step": 56287, "epoch": 335} {"train_loss": -8.318374633789062, "global_step": 56288, "epoch": 335} {"train_loss": -8.398002624511719, "global_step": 56289, "epoch": 335} {"train_loss": -8.295820236206055, "global_step": 56290, "epoch": 335} {"train_loss": -8.522581100463867, "global_step": 56291, "epoch": 335} {"train_loss": -8.192668914794922, "global_step": 56292, "epoch": 335} {"train_loss": -8.519674301147461, "global_step": 56293, "epoch": 335} {"train_loss": -8.437694549560547, "global_step": 56294, "epoch": 335} {"train_loss": -8.550884246826172, "global_step": 56295, "epoch": 335} {"train_loss": -8.477119445800781, "global_step": 56296, "epoch": 335} {"train_loss": -8.76947021484375, "global_step": 56297, "epoch": 335} {"train_loss": -8.674459457397461, "global_step": 56298, "epoch": 335} {"train_loss": -8.545019149780273, "global_step": 56299, "epoch": 335} {"train_loss": -8.306204795837402, "global_step": 56300, "epoch": 335} {"train_loss": -8.676563262939453, "global_step": 56301, "epoch": 335} {"train_loss": -8.385163307189941, "global_step": 56302, "epoch": 335} {"train_loss": -8.52787971496582, "global_step": 56303, "epoch": 335} {"train_loss": -8.80825424194336, "global_step": 56304, "epoch": 335} {"train_loss": -8.725502967834473, "global_step": 56305, "epoch": 335} {"train_loss": -8.591534614562988, "global_step": 56306, "epoch": 335} {"train_loss": -8.797622680664062, "global_step": 56307, "epoch": 335} {"train_loss": -8.540060997009277, "global_step": 56308, "epoch": 335} {"train_loss": -8.570907592773438, "global_step": 56309, "epoch": 335} {"train_loss": -8.663515090942383, "global_step": 56310, "epoch": 335} {"train_loss": -8.926935195922852, "global_step": 56311, "epoch": 335} {"train_loss": -8.788299560546875, "global_step": 56312, "epoch": 335} {"train_loss": -8.670976638793945, "global_step": 56313, "epoch": 335} {"train_loss": -8.615325927734375, "global_step": 56314, "epoch": 335} {"train_loss": -8.868196487426758, "global_step": 56315, "epoch": 335} {"train_loss": -8.713390350341797, "global_step": 56316, "epoch": 335} {"train_loss": -8.56203842163086, "global_step": 56317, "epoch": 335} {"train_loss": -8.583940505981445, "global_step": 56318, "epoch": 335} {"train_loss": -8.507455825805664, "global_step": 56319, "epoch": 335} {"train_loss": -8.629718780517578, "global_step": 56320, "epoch": 335} {"train_loss": -8.581991195678711, "global_step": 56321, "epoch": 335} {"train_loss": -8.562814712524414, "global_step": 56322, "epoch": 335} {"train_loss": -8.507766723632812, "global_step": 56323, "epoch": 335} {"train_loss": -8.575477600097656, "global_step": 56324, "epoch": 335} {"train_loss": -8.561629295349121, "global_step": 56325, "epoch": 335} {"train_loss": -8.693124771118164, "global_step": 56326, "epoch": 335} {"train_loss": -8.592548370361328, "global_step": 56327, "epoch": 335} {"train_loss": -8.587508201599121, "global_step": 56328, "epoch": 335} {"train_loss": -8.547828674316406, "global_step": 56329, "epoch": 335} {"train_loss": -8.46669864654541, "global_step": 56330, "epoch": 335} {"train_loss": -8.37734317779541, "global_step": 56331, "epoch": 335} {"train_loss": -8.262094497680664, "global_step": 56332, "epoch": 335} {"train_loss": -8.553342819213867, "global_step": 56333, "epoch": 335} {"train_loss": -8.381640434265137, "global_step": 56334, "epoch": 335} {"train_loss": -8.630722045898438, "global_step": 56335, "epoch": 335} {"train_loss": -8.543071746826172, "global_step": 56336, "epoch": 335} {"train_loss": -8.749817848205566, "global_step": 56337, "epoch": 335} {"train_loss": -8.589102745056152, "global_step": 56338, "epoch": 335} {"train_loss": -8.640962600708008, "global_step": 56339, "epoch": 335} {"train_loss": -8.473186492919922, "global_step": 56340, "epoch": 335} {"train_loss": -8.36020278930664, "global_step": 56341, "epoch": 335} {"train_loss": -8.485608100891113, "global_step": 56342, "epoch": 335} {"train_loss": -8.56228256225586, "global_step": 56343, "epoch": 335} {"train_loss": -8.549583435058594, "global_step": 56344, "epoch": 335} {"train_loss": -8.595046997070312, "global_step": 56345, "epoch": 335} {"train_loss": -8.438802719116211, "global_step": 56346, "epoch": 335} {"train_loss": -8.416906356811523, "global_step": 56347, "epoch": 335} {"train_loss": -8.261922836303711, "global_step": 56348, "epoch": 335} {"train_loss": -8.152328491210938, "global_step": 56349, "epoch": 335} {"train_loss": -8.455060958862305, "global_step": 56350, "epoch": 335} {"train_loss": -8.36572551727295, "global_step": 56351, "epoch": 335} {"train_loss": -8.143956184387207, "global_step": 56352, "epoch": 335} {"train_loss": -8.568597793579102, "global_step": 56353, "epoch": 335} {"train_loss": -8.260093688964844, "global_step": 56354, "epoch": 335} {"train_loss": -8.53607177734375, "global_step": 56355, "epoch": 335} {"train_loss": -8.517499923706055, "global_step": 56356, "epoch": 335} {"train_loss": -8.504035949707031, "global_step": 56357, "epoch": 335} {"train_loss": -8.342373847961426, "global_step": 56358, "epoch": 335} {"train_loss": -8.292211532592773, "global_step": 56359, "epoch": 335} {"train_loss": -8.49926471710205, "global_step": 56360, "epoch": 335} {"train_loss": -8.693279266357422, "global_step": 56361, "epoch": 335} {"train_loss": -8.668252944946289, "global_step": 56362, "epoch": 335} {"train_loss": -8.414709091186523, "global_step": 56363, "epoch": 335} {"train_loss": -8.418922424316406, "global_step": 56364, "epoch": 335} {"train_loss": -8.597026824951172, "global_step": 56365, "epoch": 335} {"train_loss": -8.43310260772705, "global_step": 56366, "epoch": 335} {"train_loss": -8.439133644104004, "global_step": 56367, "epoch": 335} {"train_loss": -8.476155281066895, "global_step": 56368, "epoch": 335} {"train_loss": -8.856790542602539, "global_step": 56369, "epoch": 335} {"train_loss": -8.574769973754883, "global_step": 56370, "epoch": 335} {"train_loss": -8.621429443359375, "global_step": 56371, "epoch": 335} {"train_loss": -8.836430549621582, "global_step": 56372, "epoch": 335} {"train_loss": -8.482767105102539, "global_step": 56373, "epoch": 335} {"train_loss": -8.615148544311523, "global_step": 56374, "epoch": 335} {"train_loss": -8.489574432373047, "global_step": 56375, "epoch": 335} {"train_loss": -8.646893501281738, "global_step": 56376, "epoch": 335} {"train_loss": -8.479425430297852, "global_step": 56377, "epoch": 335} {"train_loss": -8.383304595947266, "global_step": 56378, "epoch": 335} {"train_loss": -8.58476734161377, "global_step": 56379, "epoch": 335} {"train_loss": -8.662940979003906, "global_step": 56380, "epoch": 335} {"train_loss": -8.534139633178711, "global_step": 56381, "epoch": 335} {"train_loss": -8.402052879333496, "global_step": 56382, "epoch": 335} {"train_loss": -8.348182678222656, "global_step": 56383, "epoch": 335} {"train_loss": -8.534232139587402, "global_step": 56384, "epoch": 335} {"train_loss": -8.47304916381836, "global_step": 56385, "epoch": 335} {"train_loss": -8.358494758605957, "global_step": 56386, "epoch": 335} {"train_loss": -8.433531761169434, "global_step": 56387, "epoch": 335} {"train_loss": -8.631158828735352, "global_step": 56388, "epoch": 335} {"train_loss": -8.426170349121094, "global_step": 56389, "epoch": 335} {"train_loss": -8.217653274536133, "global_step": 56390, "epoch": 335} {"train_loss": -8.661069869995117, "global_step": 56391, "epoch": 335} {"train_loss": -8.38370132446289, "global_step": 56392, "epoch": 335} {"train_loss": -8.669759750366211, "global_step": 56393, "epoch": 335} {"train_loss": -8.24886703491211, "global_step": 56394, "epoch": 335} {"train_loss": -8.479138374328613, "global_step": 56395, "epoch": 335} {"train_loss": -8.471858978271484, "global_step": 56396, "epoch": 335} {"train_loss": -8.509427070617676, "global_step": 56397, "epoch": 335} {"train_loss": -8.622920036315918, "global_step": 56398, "epoch": 335} {"train_loss": -8.639657974243164, "global_step": 56399, "epoch": 335} {"train_loss": -8.758871078491211, "global_step": 56400, "epoch": 335} {"train_loss": -8.460738182067871, "global_step": 56401, "epoch": 335} {"train_loss": -8.774101257324219, "global_step": 56402, "epoch": 335} {"train_loss": -8.48278522491455, "global_step": 56403, "epoch": 335} {"train_loss": -8.527239799499512, "global_step": 56404, "epoch": 335} {"train_loss": -8.380654335021973, "global_step": 56405, "epoch": 335} {"train_loss": -8.528172492980957, "global_step": 56406, "epoch": 335} {"train_loss": -8.518024444580078, "global_step": 56407, "epoch": 335} {"train_loss": -8.637138366699219, "global_step": 56408, "epoch": 335} {"train_loss": -8.586830139160156, "global_step": 56409, "epoch": 335} {"train_loss": -8.752252578735352, "global_step": 56410, "epoch": 335} {"train_loss": -8.749088287353516, "global_step": 56411, "epoch": 335} {"train_loss": -8.610553741455078, "global_step": 56412, "epoch": 335} {"train_loss": -8.668730735778809, "global_step": 56413, "epoch": 335} {"train_loss": -8.754398345947266, "global_step": 56414, "epoch": 335} {"train_loss": -8.421682357788086, "global_step": 56415, "epoch": 335} {"train_loss": -8.591232299804688, "global_step": 56416, "epoch": 335} {"train_loss": -8.672531127929688, "global_step": 56417, "epoch": 335} {"train_loss": -8.653961181640625, "global_step": 56418, "epoch": 335} {"train_loss": -8.545690536499023, "global_step": 56419, "epoch": 335} {"train_loss": -8.515905380249023, "global_step": 56420, "epoch": 335} {"train_loss": -8.535961151123047, "global_step": 56421, "epoch": 335} {"train_loss": -8.528382301330566, "global_step": 56422, "epoch": 335} {"train_loss": -8.48955249786377, "global_step": 56423, "epoch": 335} {"train_loss": -8.734050750732422, "global_step": 56424, "epoch": 335} {"train_loss": -8.572318077087402, "global_step": 56425, "epoch": 335} {"train_loss": -8.507533073425293, "global_step": 56426, "epoch": 335} {"train_loss": -8.557397842407227, "global_step": 56427, "epoch": 335} {"train_loss": -8.527326583862305, "global_step": 56428, "epoch": 335} {"train_loss": -8.662817001342773, "global_step": 56429, "epoch": 335} {"train_loss": -8.590767860412598, "global_step": 56430, "epoch": 335} {"train_loss": -8.596195220947266, "global_step": 56431, "epoch": 335} {"train_loss": -8.411983489990234, "global_step": 56432, "epoch": 335} {"train_loss": -8.741588592529297, "global_step": 56433, "epoch": 335} {"train_loss": -8.452961921691895, "global_step": 56434, "epoch": 335} {"train_loss": -8.480081558227539, "global_step": 56435, "epoch": 335} {"train_loss": -8.693960189819336, "global_step": 56436, "epoch": 335} {"train_loss": -8.494324684143066, "global_step": 56437, "epoch": 335} {"train_loss": -8.652036666870117, "global_step": 56438, "epoch": 335} {"train_loss": -8.349124908447266, "global_step": 56439, "epoch": 335} {"train_loss": -8.320734977722168, "global_step": 56440, "epoch": 335} {"train_loss": -8.457380294799805, "global_step": 56441, "epoch": 335} {"train_loss": -8.66899585723877, "global_step": 56442, "epoch": 335} {"train_loss": -8.544818878173828, "global_step": 56443, "epoch": 335} {"train_loss": -8.644721984863281, "global_step": 56444, "epoch": 335} {"train_loss": -8.570098876953125, "global_step": 56445, "epoch": 335} {"train_loss": -8.452285766601562, "global_step": 56446, "epoch": 335} {"train_loss": -8.530874774569558, "global_step": 56447, "epoch": 335, "val_loss": 190637.359375, "train_action_mse_error": 5.426090240478516} {"train_loss": -8.570213317871094, "global_step": 56448, "epoch": 336} {"train_loss": -8.736002922058105, "global_step": 56449, "epoch": 336} {"train_loss": -8.606456756591797, "global_step": 56450, "epoch": 336} {"train_loss": -8.673280715942383, "global_step": 56451, "epoch": 336} {"train_loss": -8.489086151123047, "global_step": 56452, "epoch": 336} {"train_loss": -8.77784538269043, "global_step": 56453, "epoch": 336} {"train_loss": -8.600244522094727, "global_step": 56454, "epoch": 336} {"train_loss": -8.569548606872559, "global_step": 56455, "epoch": 336} {"train_loss": -8.82919692993164, "global_step": 56456, "epoch": 336} {"train_loss": -8.695465087890625, "global_step": 56457, "epoch": 336} {"train_loss": -8.717199325561523, "global_step": 56458, "epoch": 336} {"train_loss": -8.693321228027344, "global_step": 56459, "epoch": 336} {"train_loss": -8.736488342285156, "global_step": 56460, "epoch": 336} {"train_loss": -8.838733673095703, "global_step": 56461, "epoch": 336} {"train_loss": -8.660009384155273, "global_step": 56462, "epoch": 336} {"train_loss": -8.649284362792969, "global_step": 56463, "epoch": 336} {"train_loss": -8.596529006958008, "global_step": 56464, "epoch": 336} {"train_loss": -8.4751615524292, "global_step": 56465, "epoch": 336} {"train_loss": -8.540277481079102, "global_step": 56466, "epoch": 336} {"train_loss": -8.526641845703125, "global_step": 56467, "epoch": 336} {"train_loss": -8.568346977233887, "global_step": 56468, "epoch": 336} {"train_loss": -8.486355781555176, "global_step": 56469, "epoch": 336} {"train_loss": -8.268855094909668, "global_step": 56470, "epoch": 336} {"train_loss": -8.53911018371582, "global_step": 56471, "epoch": 336} {"train_loss": -8.360811233520508, "global_step": 56472, "epoch": 336} {"train_loss": -8.457557678222656, "global_step": 56473, "epoch": 336} {"train_loss": -8.285907745361328, "global_step": 56474, "epoch": 336} {"train_loss": -8.589871406555176, "global_step": 56475, "epoch": 336} {"train_loss": -8.216053009033203, "global_step": 56476, "epoch": 336} {"train_loss": -8.871844291687012, "global_step": 56477, "epoch": 336} {"train_loss": -8.444013595581055, "global_step": 56478, "epoch": 336} {"train_loss": -8.494385719299316, "global_step": 56479, "epoch": 336} {"train_loss": -8.252678871154785, "global_step": 56480, "epoch": 336} {"train_loss": -8.294820785522461, "global_step": 56481, "epoch": 336} {"train_loss": -8.279422760009766, "global_step": 56482, "epoch": 336} {"train_loss": -8.480524063110352, "global_step": 56483, "epoch": 336} {"train_loss": -8.080192565917969, "global_step": 56484, "epoch": 336} {"train_loss": -8.451135635375977, "global_step": 56485, "epoch": 336} {"train_loss": -8.193103790283203, "global_step": 56486, "epoch": 336} {"train_loss": -8.296995162963867, "global_step": 56487, "epoch": 336} {"train_loss": -8.271705627441406, "global_step": 56488, "epoch": 336} {"train_loss": -8.371875762939453, "global_step": 56489, "epoch": 336} {"train_loss": -8.494283676147461, "global_step": 56490, "epoch": 336} {"train_loss": -8.335075378417969, "global_step": 56491, "epoch": 336} {"train_loss": -8.3718843460083, "global_step": 56492, "epoch": 336} {"train_loss": -8.355016708374023, "global_step": 56493, "epoch": 336} {"train_loss": -8.518239974975586, "global_step": 56494, "epoch": 336} {"train_loss": -8.274480819702148, "global_step": 56495, "epoch": 336} {"train_loss": -8.19040584564209, "global_step": 56496, "epoch": 336} {"train_loss": -8.400146484375, "global_step": 56497, "epoch": 336} {"train_loss": -8.302643775939941, "global_step": 56498, "epoch": 336} {"train_loss": -8.190607070922852, "global_step": 56499, "epoch": 336} {"train_loss": -8.277015686035156, "global_step": 56500, "epoch": 336} {"train_loss": -8.36744213104248, "global_step": 56501, "epoch": 336} {"train_loss": -8.316657066345215, "global_step": 56502, "epoch": 336} {"train_loss": -8.239812850952148, "global_step": 56503, "epoch": 336} {"train_loss": -8.507874488830566, "global_step": 56504, "epoch": 336} {"train_loss": -8.443071365356445, "global_step": 56505, "epoch": 336} {"train_loss": -8.321605682373047, "global_step": 56506, "epoch": 336} {"train_loss": -8.347494125366211, "global_step": 56507, "epoch": 336} {"train_loss": -8.591743469238281, "global_step": 56508, "epoch": 336} {"train_loss": -8.179141998291016, "global_step": 56509, "epoch": 336} {"train_loss": -8.428315162658691, "global_step": 56510, "epoch": 336} {"train_loss": -8.560820579528809, "global_step": 56511, "epoch": 336} {"train_loss": -8.455155372619629, "global_step": 56512, "epoch": 336} {"train_loss": -8.25965404510498, "global_step": 56513, "epoch": 336} {"train_loss": -8.338590621948242, "global_step": 56514, "epoch": 336} {"train_loss": -8.567985534667969, "global_step": 56515, "epoch": 336} {"train_loss": -8.461355209350586, "global_step": 56516, "epoch": 336} {"train_loss": -8.287425994873047, "global_step": 56517, "epoch": 336} {"train_loss": -8.790560722351074, "global_step": 56518, "epoch": 336} {"train_loss": -8.529617309570312, "global_step": 56519, "epoch": 336} {"train_loss": -8.590678215026855, "global_step": 56520, "epoch": 336} {"train_loss": -8.68746280670166, "global_step": 56521, "epoch": 336} {"train_loss": -8.470943450927734, "global_step": 56522, "epoch": 336} {"train_loss": -8.311899185180664, "global_step": 56523, "epoch": 336} {"train_loss": -8.499715805053711, "global_step": 56524, "epoch": 336} {"train_loss": -8.67445182800293, "global_step": 56525, "epoch": 336} {"train_loss": -8.276300430297852, "global_step": 56526, "epoch": 336} {"train_loss": -8.47315788269043, "global_step": 56527, "epoch": 336} {"train_loss": -8.386737823486328, "global_step": 56528, "epoch": 336} {"train_loss": -8.710521697998047, "global_step": 56529, "epoch": 336} {"train_loss": -8.302574157714844, "global_step": 56530, "epoch": 336} {"train_loss": -8.572941780090332, "global_step": 56531, "epoch": 336} {"train_loss": -8.42944049835205, "global_step": 56532, "epoch": 336} {"train_loss": -8.348411560058594, "global_step": 56533, "epoch": 336} {"train_loss": -8.803356170654297, "global_step": 56534, "epoch": 336} {"train_loss": -8.249603271484375, "global_step": 56535, "epoch": 336} {"train_loss": -8.697280883789062, "global_step": 56536, "epoch": 336} {"train_loss": -8.362855911254883, "global_step": 56537, "epoch": 336} {"train_loss": -8.446516036987305, "global_step": 56538, "epoch": 336} {"train_loss": -8.018475532531738, "global_step": 56539, "epoch": 336} {"train_loss": -8.711174011230469, "global_step": 56540, "epoch": 336} {"train_loss": -8.265088081359863, "global_step": 56541, "epoch": 336} {"train_loss": -8.430728912353516, "global_step": 56542, "epoch": 336} {"train_loss": -8.515357971191406, "global_step": 56543, "epoch": 336} {"train_loss": -8.34022331237793, "global_step": 56544, "epoch": 336} {"train_loss": -8.593814849853516, "global_step": 56545, "epoch": 336} {"train_loss": -8.67473030090332, "global_step": 56546, "epoch": 336} {"train_loss": -8.527068138122559, "global_step": 56547, "epoch": 336} {"train_loss": -8.37232494354248, "global_step": 56548, "epoch": 336} {"train_loss": -8.400035858154297, "global_step": 56549, "epoch": 336} {"train_loss": -8.21854019165039, "global_step": 56550, "epoch": 336} {"train_loss": -8.435781478881836, "global_step": 56551, "epoch": 336} {"train_loss": -8.461441040039062, "global_step": 56552, "epoch": 336} {"train_loss": -8.221321105957031, "global_step": 56553, "epoch": 336} {"train_loss": -8.412444114685059, "global_step": 56554, "epoch": 336} {"train_loss": -8.480302810668945, "global_step": 56555, "epoch": 336} {"train_loss": -8.446123123168945, "global_step": 56556, "epoch": 336} {"train_loss": -8.76181697845459, "global_step": 56557, "epoch": 336} {"train_loss": -8.623834609985352, "global_step": 56558, "epoch": 336} {"train_loss": -8.61886215209961, "global_step": 56559, "epoch": 336} {"train_loss": -8.353087425231934, "global_step": 56560, "epoch": 336} {"train_loss": -8.856501579284668, "global_step": 56561, "epoch": 336} {"train_loss": -8.459803581237793, "global_step": 56562, "epoch": 336} {"train_loss": -8.527923583984375, "global_step": 56563, "epoch": 336} {"train_loss": -8.567327499389648, "global_step": 56564, "epoch": 336} {"train_loss": -8.535110473632812, "global_step": 56565, "epoch": 336} {"train_loss": -8.461910247802734, "global_step": 56566, "epoch": 336} {"train_loss": -8.44730281829834, "global_step": 56567, "epoch": 336} {"train_loss": -8.673139572143555, "global_step": 56568, "epoch": 336} {"train_loss": -8.405616760253906, "global_step": 56569, "epoch": 336} {"train_loss": -8.618468284606934, "global_step": 56570, "epoch": 336} {"train_loss": -8.330987930297852, "global_step": 56571, "epoch": 336} {"train_loss": -8.656028747558594, "global_step": 56572, "epoch": 336} {"train_loss": -8.404815673828125, "global_step": 56573, "epoch": 336} {"train_loss": -8.578927993774414, "global_step": 56574, "epoch": 336} {"train_loss": -8.398475646972656, "global_step": 56575, "epoch": 336} {"train_loss": -8.419075965881348, "global_step": 56576, "epoch": 336} {"train_loss": -8.457967758178711, "global_step": 56577, "epoch": 336} {"train_loss": -8.586027145385742, "global_step": 56578, "epoch": 336} {"train_loss": -8.43121337890625, "global_step": 56579, "epoch": 336} {"train_loss": -8.425591468811035, "global_step": 56580, "epoch": 336} {"train_loss": -8.602324485778809, "global_step": 56581, "epoch": 336} {"train_loss": -8.585440635681152, "global_step": 56582, "epoch": 336} {"train_loss": -8.64300537109375, "global_step": 56583, "epoch": 336} {"train_loss": -8.633808135986328, "global_step": 56584, "epoch": 336} {"train_loss": -8.681622505187988, "global_step": 56585, "epoch": 336} {"train_loss": -8.32626724243164, "global_step": 56586, "epoch": 336} {"train_loss": -8.635357856750488, "global_step": 56587, "epoch": 336} {"train_loss": -8.567852020263672, "global_step": 56588, "epoch": 336} {"train_loss": -8.32080078125, "global_step": 56589, "epoch": 336} {"train_loss": -8.317960739135742, "global_step": 56590, "epoch": 336} {"train_loss": -8.648446083068848, "global_step": 56591, "epoch": 336} {"train_loss": -8.605876922607422, "global_step": 56592, "epoch": 336} {"train_loss": -8.365010261535645, "global_step": 56593, "epoch": 336} {"train_loss": -8.601566314697266, "global_step": 56594, "epoch": 336} {"train_loss": -8.689766883850098, "global_step": 56595, "epoch": 336} {"train_loss": -8.648195266723633, "global_step": 56596, "epoch": 336} {"train_loss": -8.660552978515625, "global_step": 56597, "epoch": 336} {"train_loss": -8.534323692321777, "global_step": 56598, "epoch": 336} {"train_loss": -8.58230972290039, "global_step": 56599, "epoch": 336} {"train_loss": -8.593400955200195, "global_step": 56600, "epoch": 336} {"train_loss": -8.472278594970703, "global_step": 56601, "epoch": 336} {"train_loss": -8.529096603393555, "global_step": 56602, "epoch": 336} {"train_loss": -8.160806655883789, "global_step": 56603, "epoch": 336} {"train_loss": -8.615793228149414, "global_step": 56604, "epoch": 336} {"train_loss": -8.620604515075684, "global_step": 56605, "epoch": 336} {"train_loss": -8.541523933410645, "global_step": 56606, "epoch": 336} {"train_loss": -8.482148170471191, "global_step": 56607, "epoch": 336} {"train_loss": -8.60495662689209, "global_step": 56608, "epoch": 336} {"train_loss": -8.327730178833008, "global_step": 56609, "epoch": 336} {"train_loss": -8.6636381149292, "global_step": 56610, "epoch": 336} {"train_loss": -8.504329681396484, "global_step": 56611, "epoch": 336} {"train_loss": -8.62788200378418, "global_step": 56612, "epoch": 336} {"train_loss": -8.588129043579102, "global_step": 56613, "epoch": 336} {"train_loss": -8.265419006347656, "global_step": 56614, "epoch": 336} {"train_loss": -8.484019949322654, "global_step": 56615, "epoch": 336, "val_loss": 187651.046875} {"train_loss": -8.548858642578125, "global_step": 56616, "epoch": 337} {"train_loss": -8.53110122680664, "global_step": 56617, "epoch": 337} {"train_loss": -8.51583480834961, "global_step": 56618, "epoch": 337} {"train_loss": -8.455994606018066, "global_step": 56619, "epoch": 337} {"train_loss": -8.741962432861328, "global_step": 56620, "epoch": 337} {"train_loss": -8.567081451416016, "global_step": 56621, "epoch": 337} {"train_loss": -8.67300796508789, "global_step": 56622, "epoch": 337} {"train_loss": -8.437896728515625, "global_step": 56623, "epoch": 337} {"train_loss": -8.821139335632324, "global_step": 56624, "epoch": 337} {"train_loss": -8.415729522705078, "global_step": 56625, "epoch": 337} {"train_loss": -8.83819580078125, "global_step": 56626, "epoch": 337} {"train_loss": -8.491386413574219, "global_step": 56627, "epoch": 337} {"train_loss": -8.718928337097168, "global_step": 56628, "epoch": 337} {"train_loss": -8.487046241760254, "global_step": 56629, "epoch": 337} {"train_loss": -8.41639518737793, "global_step": 56630, "epoch": 337} {"train_loss": -8.825597763061523, "global_step": 56631, "epoch": 337} {"train_loss": -8.684893608093262, "global_step": 56632, "epoch": 337} {"train_loss": -8.594060897827148, "global_step": 56633, "epoch": 337} {"train_loss": -8.592263221740723, "global_step": 56634, "epoch": 337} {"train_loss": -8.795682907104492, "global_step": 56635, "epoch": 337} {"train_loss": -8.583606719970703, "global_step": 56636, "epoch": 337} {"train_loss": -8.494709014892578, "global_step": 56637, "epoch": 337} {"train_loss": -8.652140617370605, "global_step": 56638, "epoch": 337} {"train_loss": -8.50278091430664, "global_step": 56639, "epoch": 337} {"train_loss": -8.449872970581055, "global_step": 56640, "epoch": 337} {"train_loss": -8.335927963256836, "global_step": 56641, "epoch": 337} {"train_loss": -8.63868236541748, "global_step": 56642, "epoch": 337} {"train_loss": -8.553089141845703, "global_step": 56643, "epoch": 337} {"train_loss": -8.552974700927734, "global_step": 56644, "epoch": 337} {"train_loss": -8.649271011352539, "global_step": 56645, "epoch": 337} {"train_loss": -8.5357666015625, "global_step": 56646, "epoch": 337} {"train_loss": -8.354183197021484, "global_step": 56647, "epoch": 337} {"train_loss": -8.438338279724121, "global_step": 56648, "epoch": 337} {"train_loss": -8.369590759277344, "global_step": 56649, "epoch": 337} {"train_loss": -8.53680419921875, "global_step": 56650, "epoch": 337} {"train_loss": -8.461554527282715, "global_step": 56651, "epoch": 337} {"train_loss": -8.471517562866211, "global_step": 56652, "epoch": 337} {"train_loss": -8.393760681152344, "global_step": 56653, "epoch": 337} {"train_loss": -8.65487003326416, "global_step": 56654, "epoch": 337} {"train_loss": -8.32050609588623, "global_step": 56655, "epoch": 337} {"train_loss": -8.368019104003906, "global_step": 56656, "epoch": 337} {"train_loss": -8.617985725402832, "global_step": 56657, "epoch": 337} {"train_loss": -8.423391342163086, "global_step": 56658, "epoch": 337} {"train_loss": -8.39775562286377, "global_step": 56659, "epoch": 337} {"train_loss": -8.396299362182617, "global_step": 56660, "epoch": 337} {"train_loss": -8.556264877319336, "global_step": 56661, "epoch": 337} {"train_loss": -8.431660652160645, "global_step": 56662, "epoch": 337} {"train_loss": -8.690631866455078, "global_step": 56663, "epoch": 337} {"train_loss": -8.38948917388916, "global_step": 56664, "epoch": 337} {"train_loss": -8.625173568725586, "global_step": 56665, "epoch": 337} {"train_loss": -8.500810623168945, "global_step": 56666, "epoch": 337} {"train_loss": -8.354286193847656, "global_step": 56667, "epoch": 337} {"train_loss": -8.646400451660156, "global_step": 56668, "epoch": 337} {"train_loss": -8.413039207458496, "global_step": 56669, "epoch": 337} {"train_loss": -8.601937294006348, "global_step": 56670, "epoch": 337} {"train_loss": -8.630056381225586, "global_step": 56671, "epoch": 337} {"train_loss": -8.637147903442383, "global_step": 56672, "epoch": 337} {"train_loss": -8.801990509033203, "global_step": 56673, "epoch": 337} {"train_loss": -8.607538223266602, "global_step": 56674, "epoch": 337} {"train_loss": -8.537002563476562, "global_step": 56675, "epoch": 337} {"train_loss": -8.763755798339844, "global_step": 56676, "epoch": 337} {"train_loss": -8.505414009094238, "global_step": 56677, "epoch": 337} {"train_loss": -8.834650039672852, "global_step": 56678, "epoch": 337} {"train_loss": -8.69127082824707, "global_step": 56679, "epoch": 337} {"train_loss": -8.616426467895508, "global_step": 56680, "epoch": 337} {"train_loss": -8.42486572265625, "global_step": 56681, "epoch": 337} {"train_loss": -8.527538299560547, "global_step": 56682, "epoch": 337} {"train_loss": -8.553445816040039, "global_step": 56683, "epoch": 337} {"train_loss": -8.76236343383789, "global_step": 56684, "epoch": 337} {"train_loss": -8.112544059753418, "global_step": 56685, "epoch": 337} {"train_loss": -8.954766273498535, "global_step": 56686, "epoch": 337} {"train_loss": -8.0226411819458, "global_step": 56687, "epoch": 337} {"train_loss": -8.615089416503906, "global_step": 56688, "epoch": 337} {"train_loss": -8.33807373046875, "global_step": 56689, "epoch": 337} {"train_loss": -8.55960464477539, "global_step": 56690, "epoch": 337} {"train_loss": -8.238479614257812, "global_step": 56691, "epoch": 337} {"train_loss": -8.397092819213867, "global_step": 56692, "epoch": 337} {"train_loss": -8.392101287841797, "global_step": 56693, "epoch": 337} {"train_loss": -8.560977935791016, "global_step": 56694, "epoch": 337} {"train_loss": -8.541674613952637, "global_step": 56695, "epoch": 337} {"train_loss": -8.634502410888672, "global_step": 56696, "epoch": 337} {"train_loss": -8.664384841918945, "global_step": 56697, "epoch": 337} {"train_loss": -8.247283935546875, "global_step": 56698, "epoch": 337} {"train_loss": -8.578563690185547, "global_step": 56699, "epoch": 337} {"train_loss": -8.55389404296875, "global_step": 56700, "epoch": 337} {"train_loss": -8.35440444946289, "global_step": 56701, "epoch": 337} {"train_loss": -8.581954956054688, "global_step": 56702, "epoch": 337} {"train_loss": -8.629982948303223, "global_step": 56703, "epoch": 337} {"train_loss": -8.460861206054688, "global_step": 56704, "epoch": 337} {"train_loss": -8.380691528320312, "global_step": 56705, "epoch": 337} {"train_loss": -8.554652214050293, "global_step": 56706, "epoch": 337} {"train_loss": -8.46377182006836, "global_step": 56707, "epoch": 337} {"train_loss": -8.388538360595703, "global_step": 56708, "epoch": 337} {"train_loss": -8.480878829956055, "global_step": 56709, "epoch": 337} {"train_loss": -8.539460182189941, "global_step": 56710, "epoch": 337} {"train_loss": -8.249385833740234, "global_step": 56711, "epoch": 337} {"train_loss": -8.408609390258789, "global_step": 56712, "epoch": 337} {"train_loss": -8.318020820617676, "global_step": 56713, "epoch": 337} {"train_loss": -8.50644302368164, "global_step": 56714, "epoch": 337} {"train_loss": -8.485255241394043, "global_step": 56715, "epoch": 337} {"train_loss": -8.511664390563965, "global_step": 56716, "epoch": 337} {"train_loss": -8.357477188110352, "global_step": 56717, "epoch": 337} {"train_loss": -8.659461975097656, "global_step": 56718, "epoch": 337} {"train_loss": -8.689712524414062, "global_step": 56719, "epoch": 337} {"train_loss": -8.667010307312012, "global_step": 56720, "epoch": 337} {"train_loss": -8.502885818481445, "global_step": 56721, "epoch": 337} {"train_loss": -8.504322052001953, "global_step": 56722, "epoch": 337} {"train_loss": -8.497100830078125, "global_step": 56723, "epoch": 337} {"train_loss": -8.49239444732666, "global_step": 56724, "epoch": 337} {"train_loss": -8.272748947143555, "global_step": 56725, "epoch": 337} {"train_loss": -8.452898025512695, "global_step": 56726, "epoch": 337} {"train_loss": -8.371901512145996, "global_step": 56727, "epoch": 337} {"train_loss": -8.450480461120605, "global_step": 56728, "epoch": 337} {"train_loss": -8.389554023742676, "global_step": 56729, "epoch": 337} {"train_loss": -8.44357967376709, "global_step": 56730, "epoch": 337} {"train_loss": -8.265926361083984, "global_step": 56731, "epoch": 337} {"train_loss": -8.660111427307129, "global_step": 56732, "epoch": 337} {"train_loss": -8.509634017944336, "global_step": 56733, "epoch": 337} {"train_loss": -8.280326843261719, "global_step": 56734, "epoch": 337} {"train_loss": -8.440692901611328, "global_step": 56735, "epoch": 337} {"train_loss": -8.41865062713623, "global_step": 56736, "epoch": 337} {"train_loss": -8.361594200134277, "global_step": 56737, "epoch": 337} {"train_loss": -8.338473320007324, "global_step": 56738, "epoch": 337} {"train_loss": -8.445961952209473, "global_step": 56739, "epoch": 337} {"train_loss": -8.221479415893555, "global_step": 56740, "epoch": 337} {"train_loss": -8.673070907592773, "global_step": 56741, "epoch": 337} {"train_loss": -8.596866607666016, "global_step": 56742, "epoch": 337} {"train_loss": -8.440143585205078, "global_step": 56743, "epoch": 337} {"train_loss": -8.450308799743652, "global_step": 56744, "epoch": 337} {"train_loss": -8.556697845458984, "global_step": 56745, "epoch": 337} {"train_loss": -8.403554916381836, "global_step": 56746, "epoch": 337} {"train_loss": -8.505760192871094, "global_step": 56747, "epoch": 337} {"train_loss": -8.630661964416504, "global_step": 56748, "epoch": 337} {"train_loss": -8.606433868408203, "global_step": 56749, "epoch": 337} {"train_loss": -8.534549713134766, "global_step": 56750, "epoch": 337} {"train_loss": -8.441034317016602, "global_step": 56751, "epoch": 337} {"train_loss": -8.504182815551758, "global_step": 56752, "epoch": 337} {"train_loss": -8.542182922363281, "global_step": 56753, "epoch": 337} {"train_loss": -8.420214653015137, "global_step": 56754, "epoch": 337} {"train_loss": -8.368691444396973, "global_step": 56755, "epoch": 337} {"train_loss": -8.455291748046875, "global_step": 56756, "epoch": 337} {"train_loss": -8.09109115600586, "global_step": 56757, "epoch": 337} {"train_loss": -8.261975288391113, "global_step": 56758, "epoch": 337} {"train_loss": -8.214362144470215, "global_step": 56759, "epoch": 337} {"train_loss": -7.759403228759766, "global_step": 56760, "epoch": 337} {"train_loss": -8.512075424194336, "global_step": 56761, "epoch": 337} {"train_loss": -8.157907485961914, "global_step": 56762, "epoch": 337} {"train_loss": -8.248432159423828, "global_step": 56763, "epoch": 337} {"train_loss": -8.259466171264648, "global_step": 56764, "epoch": 337} {"train_loss": -8.36080265045166, "global_step": 56765, "epoch": 337} {"train_loss": -8.490848541259766, "global_step": 56766, "epoch": 337} {"train_loss": -8.40673542022705, "global_step": 56767, "epoch": 337} {"train_loss": -8.266777992248535, "global_step": 56768, "epoch": 337} {"train_loss": -8.373186111450195, "global_step": 56769, "epoch": 337} {"train_loss": -8.545419692993164, "global_step": 56770, "epoch": 337} {"train_loss": -8.471609115600586, "global_step": 56771, "epoch": 337} {"train_loss": -8.64008903503418, "global_step": 56772, "epoch": 337} {"train_loss": -8.442853927612305, "global_step": 56773, "epoch": 337} {"train_loss": -8.332662582397461, "global_step": 56774, "epoch": 337} {"train_loss": -8.54560661315918, "global_step": 56775, "epoch": 337} {"train_loss": -8.569159507751465, "global_step": 56776, "epoch": 337} {"train_loss": -8.481847763061523, "global_step": 56777, "epoch": 337} {"train_loss": -8.429917335510254, "global_step": 56778, "epoch": 337} {"train_loss": -8.504430770874023, "global_step": 56779, "epoch": 337} {"train_loss": -8.524456024169922, "global_step": 56780, "epoch": 337} {"train_loss": -8.521133422851562, "global_step": 56781, "epoch": 337} {"train_loss": -8.4977388381958, "global_step": 56782, "epoch": 337} {"train_loss": -8.490259210268656, "global_step": 56783, "epoch": 337, "val_loss": 186938.1875} {"train_loss": -8.474346160888672, "global_step": 56784, "epoch": 338} {"train_loss": -8.78093433380127, "global_step": 56785, "epoch": 338} {"train_loss": -8.568428993225098, "global_step": 56786, "epoch": 338} {"train_loss": -8.589981079101562, "global_step": 56787, "epoch": 338} {"train_loss": -8.502392768859863, "global_step": 56788, "epoch": 338} {"train_loss": -8.640624046325684, "global_step": 56789, "epoch": 338} {"train_loss": -8.421663284301758, "global_step": 56790, "epoch": 338} {"train_loss": -8.480867385864258, "global_step": 56791, "epoch": 338} {"train_loss": -8.622005462646484, "global_step": 56792, "epoch": 338} {"train_loss": -8.75347900390625, "global_step": 56793, "epoch": 338} {"train_loss": -8.574624061584473, "global_step": 56794, "epoch": 338} {"train_loss": -8.414135932922363, "global_step": 56795, "epoch": 338} {"train_loss": -8.735701560974121, "global_step": 56796, "epoch": 338} {"train_loss": -8.349617004394531, "global_step": 56797, "epoch": 338} {"train_loss": -8.651166915893555, "global_step": 56798, "epoch": 338} {"train_loss": -8.202616691589355, "global_step": 56799, "epoch": 338} {"train_loss": -8.536118507385254, "global_step": 56800, "epoch": 338} {"train_loss": -8.52656078338623, "global_step": 56801, "epoch": 338} {"train_loss": -8.226617813110352, "global_step": 56802, "epoch": 338} {"train_loss": -8.563798904418945, "global_step": 56803, "epoch": 338} {"train_loss": -8.419576644897461, "global_step": 56804, "epoch": 338} {"train_loss": -8.597187042236328, "global_step": 56805, "epoch": 338} {"train_loss": -8.696442604064941, "global_step": 56806, "epoch": 338} {"train_loss": -8.523918151855469, "global_step": 56807, "epoch": 338} {"train_loss": -8.626495361328125, "global_step": 56808, "epoch": 338} {"train_loss": -8.55029582977295, "global_step": 56809, "epoch": 338} {"train_loss": -8.75282096862793, "global_step": 56810, "epoch": 338} {"train_loss": -8.733894348144531, "global_step": 56811, "epoch": 338} {"train_loss": -8.687944412231445, "global_step": 56812, "epoch": 338} {"train_loss": -8.449560165405273, "global_step": 56813, "epoch": 338} {"train_loss": -8.432262420654297, "global_step": 56814, "epoch": 338} {"train_loss": -8.60633373260498, "global_step": 56815, "epoch": 338} {"train_loss": -8.655889511108398, "global_step": 56816, "epoch": 338} {"train_loss": -8.601953506469727, "global_step": 56817, "epoch": 338} {"train_loss": -8.71269416809082, "global_step": 56818, "epoch": 338} {"train_loss": -8.594831466674805, "global_step": 56819, "epoch": 338} {"train_loss": -8.500154495239258, "global_step": 56820, "epoch": 338} {"train_loss": -8.394116401672363, "global_step": 56821, "epoch": 338} {"train_loss": -8.355873107910156, "global_step": 56822, "epoch": 338} {"train_loss": -8.410499572753906, "global_step": 56823, "epoch": 338} {"train_loss": -8.456289291381836, "global_step": 56824, "epoch": 338} {"train_loss": -8.44288158416748, "global_step": 56825, "epoch": 338} {"train_loss": -8.560567855834961, "global_step": 56826, "epoch": 338} {"train_loss": -8.265630722045898, "global_step": 56827, "epoch": 338} {"train_loss": -8.603788375854492, "global_step": 56828, "epoch": 338} {"train_loss": -8.356425285339355, "global_step": 56829, "epoch": 338} {"train_loss": -8.565953254699707, "global_step": 56830, "epoch": 338} {"train_loss": -8.615391731262207, "global_step": 56831, "epoch": 338} {"train_loss": -8.930608749389648, "global_step": 56832, "epoch": 338} {"train_loss": -8.447051048278809, "global_step": 56833, "epoch": 338} {"train_loss": -8.587686538696289, "global_step": 56834, "epoch": 338} {"train_loss": -8.459253311157227, "global_step": 56835, "epoch": 338} {"train_loss": -8.604330062866211, "global_step": 56836, "epoch": 338} {"train_loss": -8.617450714111328, "global_step": 56837, "epoch": 338} {"train_loss": -8.481291770935059, "global_step": 56838, "epoch": 338} {"train_loss": -8.783710479736328, "global_step": 56839, "epoch": 338} {"train_loss": -8.753532409667969, "global_step": 56840, "epoch": 338} {"train_loss": -8.624605178833008, "global_step": 56841, "epoch": 338} {"train_loss": -8.610150337219238, "global_step": 56842, "epoch": 338} {"train_loss": -8.544733047485352, "global_step": 56843, "epoch": 338} {"train_loss": -8.783825874328613, "global_step": 56844, "epoch": 338} {"train_loss": -8.642066955566406, "global_step": 56845, "epoch": 338} {"train_loss": -8.844871520996094, "global_step": 56846, "epoch": 338} {"train_loss": -8.734724044799805, "global_step": 56847, "epoch": 338} {"train_loss": -8.847513198852539, "global_step": 56848, "epoch": 338} {"train_loss": -8.545210838317871, "global_step": 56849, "epoch": 338} {"train_loss": -8.744182586669922, "global_step": 56850, "epoch": 338} {"train_loss": -8.820459365844727, "global_step": 56851, "epoch": 338} {"train_loss": -8.595521926879883, "global_step": 56852, "epoch": 338} {"train_loss": -8.470226287841797, "global_step": 56853, "epoch": 338} {"train_loss": -8.53412914276123, "global_step": 56854, "epoch": 338} {"train_loss": -8.541693687438965, "global_step": 56855, "epoch": 338} {"train_loss": -8.37578010559082, "global_step": 56856, "epoch": 338} {"train_loss": -8.62722110748291, "global_step": 56857, "epoch": 338} {"train_loss": -8.291800498962402, "global_step": 56858, "epoch": 338} {"train_loss": -8.744440078735352, "global_step": 56859, "epoch": 338} {"train_loss": -8.481998443603516, "global_step": 56860, "epoch": 338} {"train_loss": -8.602518081665039, "global_step": 56861, "epoch": 338} {"train_loss": -8.31338119506836, "global_step": 56862, "epoch": 338} {"train_loss": -8.326530456542969, "global_step": 56863, "epoch": 338} {"train_loss": -8.198593139648438, "global_step": 56864, "epoch": 338} {"train_loss": -8.826805114746094, "global_step": 56865, "epoch": 338} {"train_loss": -8.084137916564941, "global_step": 56866, "epoch": 338} {"train_loss": -8.294881820678711, "global_step": 56867, "epoch": 338} {"train_loss": -8.060980796813965, "global_step": 56868, "epoch": 338} {"train_loss": -8.171868324279785, "global_step": 56869, "epoch": 338} {"train_loss": -7.96500825881958, "global_step": 56870, "epoch": 338} {"train_loss": -8.319319725036621, "global_step": 56871, "epoch": 338} {"train_loss": -8.244376182556152, "global_step": 56872, "epoch": 338} {"train_loss": -8.1591215133667, "global_step": 56873, "epoch": 338} {"train_loss": -8.12501335144043, "global_step": 56874, "epoch": 338} {"train_loss": -8.397899627685547, "global_step": 56875, "epoch": 338} {"train_loss": -8.490684509277344, "global_step": 56876, "epoch": 338} {"train_loss": -8.329025268554688, "global_step": 56877, "epoch": 338} {"train_loss": -8.409090042114258, "global_step": 56878, "epoch": 338} {"train_loss": -8.552730560302734, "global_step": 56879, "epoch": 338} {"train_loss": -8.316926956176758, "global_step": 56880, "epoch": 338} {"train_loss": -8.393722534179688, "global_step": 56881, "epoch": 338} {"train_loss": -8.343295097351074, "global_step": 56882, "epoch": 338} {"train_loss": -8.431914329528809, "global_step": 56883, "epoch": 338} {"train_loss": -8.696037292480469, "global_step": 56884, "epoch": 338} {"train_loss": -8.37757396697998, "global_step": 56885, "epoch": 338} {"train_loss": -8.629928588867188, "global_step": 56886, "epoch": 338} {"train_loss": -8.67833137512207, "global_step": 56887, "epoch": 338} {"train_loss": -8.626537322998047, "global_step": 56888, "epoch": 338} {"train_loss": -8.648712158203125, "global_step": 56889, "epoch": 338} {"train_loss": -8.679841995239258, "global_step": 56890, "epoch": 338} {"train_loss": -8.58934211730957, "global_step": 56891, "epoch": 338} {"train_loss": -8.649866104125977, "global_step": 56892, "epoch": 338} {"train_loss": -8.456466674804688, "global_step": 56893, "epoch": 338} {"train_loss": -8.84994888305664, "global_step": 56894, "epoch": 338} {"train_loss": -8.625520706176758, "global_step": 56895, "epoch": 338} {"train_loss": -8.661931991577148, "global_step": 56896, "epoch": 338} {"train_loss": -8.645524978637695, "global_step": 56897, "epoch": 338} {"train_loss": -8.754345893859863, "global_step": 56898, "epoch": 338} {"train_loss": -8.485359191894531, "global_step": 56899, "epoch": 338} {"train_loss": -8.458807945251465, "global_step": 56900, "epoch": 338} {"train_loss": -8.342883110046387, "global_step": 56901, "epoch": 338} {"train_loss": -8.572174072265625, "global_step": 56902, "epoch": 338} {"train_loss": -8.515958786010742, "global_step": 56903, "epoch": 338} {"train_loss": -8.665771484375, "global_step": 56904, "epoch": 338} {"train_loss": -8.49763011932373, "global_step": 56905, "epoch": 338} {"train_loss": -8.762664794921875, "global_step": 56906, "epoch": 338} {"train_loss": -8.292654037475586, "global_step": 56907, "epoch": 338} {"train_loss": -8.65290355682373, "global_step": 56908, "epoch": 338} {"train_loss": -8.509827613830566, "global_step": 56909, "epoch": 338} {"train_loss": -8.791120529174805, "global_step": 56910, "epoch": 338} {"train_loss": -8.55555534362793, "global_step": 56911, "epoch": 338} {"train_loss": -8.518755912780762, "global_step": 56912, "epoch": 338} {"train_loss": -8.478710174560547, "global_step": 56913, "epoch": 338} {"train_loss": -8.806832313537598, "global_step": 56914, "epoch": 338} {"train_loss": -8.561603546142578, "global_step": 56915, "epoch": 338} {"train_loss": -8.645605087280273, "global_step": 56916, "epoch": 338} {"train_loss": -8.610157012939453, "global_step": 56917, "epoch": 338} {"train_loss": -8.48697566986084, "global_step": 56918, "epoch": 338} {"train_loss": -8.708285331726074, "global_step": 56919, "epoch": 338} {"train_loss": -8.441832542419434, "global_step": 56920, "epoch": 338} {"train_loss": -8.460291862487793, "global_step": 56921, "epoch": 338} {"train_loss": -8.332036972045898, "global_step": 56922, "epoch": 338} {"train_loss": -8.554588317871094, "global_step": 56923, "epoch": 338} {"train_loss": -8.11817741394043, "global_step": 56924, "epoch": 338} {"train_loss": -8.616044044494629, "global_step": 56925, "epoch": 338} {"train_loss": -8.655332565307617, "global_step": 56926, "epoch": 338} {"train_loss": -8.523804664611816, "global_step": 56927, "epoch": 338} {"train_loss": -8.545833587646484, "global_step": 56928, "epoch": 338} {"train_loss": -8.709216117858887, "global_step": 56929, "epoch": 338} {"train_loss": -8.49213981628418, "global_step": 56930, "epoch": 338} {"train_loss": -8.715173721313477, "global_step": 56931, "epoch": 338} {"train_loss": -8.429854393005371, "global_step": 56932, "epoch": 338} {"train_loss": -8.504056930541992, "global_step": 56933, "epoch": 338} {"train_loss": -8.528346061706543, "global_step": 56934, "epoch": 338} {"train_loss": -8.45173454284668, "global_step": 56935, "epoch": 338} {"train_loss": -8.178943634033203, "global_step": 56936, "epoch": 338} {"train_loss": -8.363033294677734, "global_step": 56937, "epoch": 338} {"train_loss": -8.289774894714355, "global_step": 56938, "epoch": 338} {"train_loss": -8.516308784484863, "global_step": 56939, "epoch": 338} {"train_loss": -8.376434326171875, "global_step": 56940, "epoch": 338} {"train_loss": -8.559274673461914, "global_step": 56941, "epoch": 338} {"train_loss": -8.684276580810547, "global_step": 56942, "epoch": 338} {"train_loss": -8.421091079711914, "global_step": 56943, "epoch": 338} {"train_loss": -8.672855377197266, "global_step": 56944, "epoch": 338} {"train_loss": -8.556818008422852, "global_step": 56945, "epoch": 338} {"train_loss": -8.50695514678955, "global_step": 56946, "epoch": 338} {"train_loss": -8.753641128540039, "global_step": 56947, "epoch": 338} {"train_loss": -8.748051643371582, "global_step": 56948, "epoch": 338} {"train_loss": -8.590557098388672, "global_step": 56949, "epoch": 338} {"train_loss": -8.603221893310547, "global_step": 56950, "epoch": 338} {"train_loss": -8.53105485155469, "global_step": 56951, "epoch": 338, "val_loss": 186327.671875} {"train_loss": -8.527800559997559, "global_step": 56952, "epoch": 339} {"train_loss": -8.525312423706055, "global_step": 56953, "epoch": 339} {"train_loss": -8.581972122192383, "global_step": 56954, "epoch": 339} {"train_loss": -8.809572219848633, "global_step": 56955, "epoch": 339} {"train_loss": -8.549613952636719, "global_step": 56956, "epoch": 339} {"train_loss": -8.720081329345703, "global_step": 56957, "epoch": 339} {"train_loss": -8.602394104003906, "global_step": 56958, "epoch": 339} {"train_loss": -8.473777770996094, "global_step": 56959, "epoch": 339} {"train_loss": -8.511401176452637, "global_step": 56960, "epoch": 339} {"train_loss": -8.600700378417969, "global_step": 56961, "epoch": 339} {"train_loss": -8.62450122833252, "global_step": 56962, "epoch": 339} {"train_loss": -8.675371170043945, "global_step": 56963, "epoch": 339} {"train_loss": -8.405498504638672, "global_step": 56964, "epoch": 339} {"train_loss": -8.610715866088867, "global_step": 56965, "epoch": 339} {"train_loss": -8.179192543029785, "global_step": 56966, "epoch": 339} {"train_loss": -8.32634162902832, "global_step": 56967, "epoch": 339} {"train_loss": -8.390801429748535, "global_step": 56968, "epoch": 339} {"train_loss": -8.732131958007812, "global_step": 56969, "epoch": 339} {"train_loss": -8.642083168029785, "global_step": 56970, "epoch": 339} {"train_loss": -8.464219093322754, "global_step": 56971, "epoch": 339} {"train_loss": -8.594018936157227, "global_step": 56972, "epoch": 339} {"train_loss": -8.58330249786377, "global_step": 56973, "epoch": 339} {"train_loss": -8.60285758972168, "global_step": 56974, "epoch": 339} {"train_loss": -8.469064712524414, "global_step": 56975, "epoch": 339} {"train_loss": -8.300004005432129, "global_step": 56976, "epoch": 339} {"train_loss": -8.808189392089844, "global_step": 56977, "epoch": 339} {"train_loss": -8.060800552368164, "global_step": 56978, "epoch": 339} {"train_loss": -8.584328651428223, "global_step": 56979, "epoch": 339} {"train_loss": -8.648025512695312, "global_step": 56980, "epoch": 339} {"train_loss": -8.428189277648926, "global_step": 56981, "epoch": 339} {"train_loss": -8.461906433105469, "global_step": 56982, "epoch": 339} {"train_loss": -8.673663139343262, "global_step": 56983, "epoch": 339} {"train_loss": -8.641792297363281, "global_step": 56984, "epoch": 339} {"train_loss": -8.694768905639648, "global_step": 56985, "epoch": 339} {"train_loss": -8.561380386352539, "global_step": 56986, "epoch": 339} {"train_loss": -8.563169479370117, "global_step": 56987, "epoch": 339} {"train_loss": -8.838440895080566, "global_step": 56988, "epoch": 339} {"train_loss": -8.76517391204834, "global_step": 56989, "epoch": 339} {"train_loss": -8.65786361694336, "global_step": 56990, "epoch": 339} {"train_loss": -8.508031845092773, "global_step": 56991, "epoch": 339} {"train_loss": -8.72227954864502, "global_step": 56992, "epoch": 339} {"train_loss": -8.552492141723633, "global_step": 56993, "epoch": 339} {"train_loss": -8.600347518920898, "global_step": 56994, "epoch": 339} {"train_loss": -8.697532653808594, "global_step": 56995, "epoch": 339} {"train_loss": -8.617986679077148, "global_step": 56996, "epoch": 339} {"train_loss": -8.754263877868652, "global_step": 56997, "epoch": 339} {"train_loss": -8.813684463500977, "global_step": 56998, "epoch": 339} {"train_loss": -8.326372146606445, "global_step": 56999, "epoch": 339} {"train_loss": -8.575878143310547, "global_step": 57000, "epoch": 339} {"train_loss": -8.70025634765625, "global_step": 57001, "epoch": 339} {"train_loss": -8.706374168395996, "global_step": 57002, "epoch": 339} {"train_loss": -8.363997459411621, "global_step": 57003, "epoch": 339} {"train_loss": -8.624076843261719, "global_step": 57004, "epoch": 339} {"train_loss": -8.570304870605469, "global_step": 57005, "epoch": 339} {"train_loss": -8.653104782104492, "global_step": 57006, "epoch": 339} {"train_loss": -8.471901893615723, "global_step": 57007, "epoch": 339} {"train_loss": -8.659990310668945, "global_step": 57008, "epoch": 339} {"train_loss": -8.669910430908203, "global_step": 57009, "epoch": 339} {"train_loss": -8.545736312866211, "global_step": 57010, "epoch": 339} {"train_loss": -8.589363098144531, "global_step": 57011, "epoch": 339} {"train_loss": -8.492981910705566, "global_step": 57012, "epoch": 339} {"train_loss": -8.739731788635254, "global_step": 57013, "epoch": 339} {"train_loss": -8.687568664550781, "global_step": 57014, "epoch": 339} {"train_loss": -8.425457000732422, "global_step": 57015, "epoch": 339} {"train_loss": -8.672173500061035, "global_step": 57016, "epoch": 339} {"train_loss": -8.38308334350586, "global_step": 57017, "epoch": 339} {"train_loss": -8.735055923461914, "global_step": 57018, "epoch": 339} {"train_loss": -8.32790756225586, "global_step": 57019, "epoch": 339} {"train_loss": -8.550992965698242, "global_step": 57020, "epoch": 339} {"train_loss": -8.514091491699219, "global_step": 57021, "epoch": 339} {"train_loss": -8.695755004882812, "global_step": 57022, "epoch": 339} {"train_loss": -8.476655960083008, "global_step": 57023, "epoch": 339} {"train_loss": -8.464128494262695, "global_step": 57024, "epoch": 339} {"train_loss": -8.510339736938477, "global_step": 57025, "epoch": 339} {"train_loss": -8.573683738708496, "global_step": 57026, "epoch": 339} {"train_loss": -8.650429725646973, "global_step": 57027, "epoch": 339} {"train_loss": -8.661140441894531, "global_step": 57028, "epoch": 339} {"train_loss": -8.635929107666016, "global_step": 57029, "epoch": 339} {"train_loss": -8.646417617797852, "global_step": 57030, "epoch": 339} {"train_loss": -8.462944984436035, "global_step": 57031, "epoch": 339} {"train_loss": -8.740682601928711, "global_step": 57032, "epoch": 339} {"train_loss": -8.464649200439453, "global_step": 57033, "epoch": 339} {"train_loss": -8.639562606811523, "global_step": 57034, "epoch": 339} {"train_loss": -8.375741958618164, "global_step": 57035, "epoch": 339} {"train_loss": -8.568345069885254, "global_step": 57036, "epoch": 339} {"train_loss": -8.604535102844238, "global_step": 57037, "epoch": 339} {"train_loss": -8.865021705627441, "global_step": 57038, "epoch": 339} {"train_loss": -8.630433082580566, "global_step": 57039, "epoch": 339} {"train_loss": -8.591755867004395, "global_step": 57040, "epoch": 339} {"train_loss": -8.782730102539062, "global_step": 57041, "epoch": 339} {"train_loss": -8.724531173706055, "global_step": 57042, "epoch": 339} {"train_loss": -8.524637222290039, "global_step": 57043, "epoch": 339} {"train_loss": -8.824178695678711, "global_step": 57044, "epoch": 339} {"train_loss": -8.715720176696777, "global_step": 57045, "epoch": 339} {"train_loss": -8.789855003356934, "global_step": 57046, "epoch": 339} {"train_loss": -8.782682418823242, "global_step": 57047, "epoch": 339} {"train_loss": -8.742925643920898, "global_step": 57048, "epoch": 339} {"train_loss": -8.70543384552002, "global_step": 57049, "epoch": 339} {"train_loss": -9.014023780822754, "global_step": 57050, "epoch": 339} {"train_loss": -8.756216049194336, "global_step": 57051, "epoch": 339} {"train_loss": -8.535971641540527, "global_step": 57052, "epoch": 339} {"train_loss": -8.68773078918457, "global_step": 57053, "epoch": 339} {"train_loss": -8.714126586914062, "global_step": 57054, "epoch": 339} {"train_loss": -8.821090698242188, "global_step": 57055, "epoch": 339} {"train_loss": -8.739093780517578, "global_step": 57056, "epoch": 339} {"train_loss": -8.82984733581543, "global_step": 57057, "epoch": 339} {"train_loss": -8.538152694702148, "global_step": 57058, "epoch": 339} {"train_loss": -8.80859375, "global_step": 57059, "epoch": 339} {"train_loss": -8.462583541870117, "global_step": 57060, "epoch": 339} {"train_loss": -7.855681419372559, "global_step": 57061, "epoch": 339} {"train_loss": -8.335782051086426, "global_step": 57062, "epoch": 339} {"train_loss": -8.385339736938477, "global_step": 57063, "epoch": 339} {"train_loss": -7.958854675292969, "global_step": 57064, "epoch": 339} {"train_loss": -8.041204452514648, "global_step": 57065, "epoch": 339} {"train_loss": -7.758360862731934, "global_step": 57066, "epoch": 339} {"train_loss": -8.288822174072266, "global_step": 57067, "epoch": 339} {"train_loss": -8.243896484375, "global_step": 57068, "epoch": 339} {"train_loss": -8.395336151123047, "global_step": 57069, "epoch": 339} {"train_loss": -8.271743774414062, "global_step": 57070, "epoch": 339} {"train_loss": -8.20144271850586, "global_step": 57071, "epoch": 339} {"train_loss": -8.444642066955566, "global_step": 57072, "epoch": 339} {"train_loss": -8.200176239013672, "global_step": 57073, "epoch": 339} {"train_loss": -8.321720123291016, "global_step": 57074, "epoch": 339} {"train_loss": -8.44741439819336, "global_step": 57075, "epoch": 339} {"train_loss": -8.346935272216797, "global_step": 57076, "epoch": 339} {"train_loss": -8.24144172668457, "global_step": 57077, "epoch": 339} {"train_loss": -8.277924537658691, "global_step": 57078, "epoch": 339} {"train_loss": -8.445573806762695, "global_step": 57079, "epoch": 339} {"train_loss": -8.12036418914795, "global_step": 57080, "epoch": 339} {"train_loss": -8.409008026123047, "global_step": 57081, "epoch": 339} {"train_loss": -8.491291046142578, "global_step": 57082, "epoch": 339} {"train_loss": -8.471338272094727, "global_step": 57083, "epoch": 339} {"train_loss": -8.529333114624023, "global_step": 57084, "epoch": 339} {"train_loss": -8.33071517944336, "global_step": 57085, "epoch": 339} {"train_loss": -8.430288314819336, "global_step": 57086, "epoch": 339} {"train_loss": -8.474116325378418, "global_step": 57087, "epoch": 339} {"train_loss": -8.336307525634766, "global_step": 57088, "epoch": 339} {"train_loss": -8.572824478149414, "global_step": 57089, "epoch": 339} {"train_loss": -8.205086708068848, "global_step": 57090, "epoch": 339} {"train_loss": -8.461343765258789, "global_step": 57091, "epoch": 339} {"train_loss": -8.597602844238281, "global_step": 57092, "epoch": 339} {"train_loss": -8.71818733215332, "global_step": 57093, "epoch": 339} {"train_loss": -8.37448787689209, "global_step": 57094, "epoch": 339} {"train_loss": -8.530006408691406, "global_step": 57095, "epoch": 339} {"train_loss": -8.647693634033203, "global_step": 57096, "epoch": 339} {"train_loss": -8.478001594543457, "global_step": 57097, "epoch": 339} {"train_loss": -8.547757148742676, "global_step": 57098, "epoch": 339} {"train_loss": -8.583282470703125, "global_step": 57099, "epoch": 339} {"train_loss": -8.572468757629395, "global_step": 57100, "epoch": 339} {"train_loss": -8.814687728881836, "global_step": 57101, "epoch": 339} {"train_loss": -8.668267250061035, "global_step": 57102, "epoch": 339} {"train_loss": -8.707003593444824, "global_step": 57103, "epoch": 339} {"train_loss": -8.708019256591797, "global_step": 57104, "epoch": 339} {"train_loss": -8.695779800415039, "global_step": 57105, "epoch": 339} {"train_loss": -8.522427558898926, "global_step": 57106, "epoch": 339} {"train_loss": -8.28374195098877, "global_step": 57107, "epoch": 339} {"train_loss": -8.704019546508789, "global_step": 57108, "epoch": 339} {"train_loss": -8.548371315002441, "global_step": 57109, "epoch": 339} {"train_loss": -8.466144561767578, "global_step": 57110, "epoch": 339} {"train_loss": -8.143829345703125, "global_step": 57111, "epoch": 339} {"train_loss": -8.568663597106934, "global_step": 57112, "epoch": 339} {"train_loss": -8.46838092803955, "global_step": 57113, "epoch": 339} {"train_loss": -8.45718765258789, "global_step": 57114, "epoch": 339} {"train_loss": -8.590473175048828, "global_step": 57115, "epoch": 339} {"train_loss": -8.034427642822266, "global_step": 57116, "epoch": 339} {"train_loss": -8.699199676513672, "global_step": 57117, "epoch": 339} {"train_loss": -8.324647903442383, "global_step": 57118, "epoch": 339} {"train_loss": -8.534972247623262, "global_step": 57119, "epoch": 339, "val_loss": 188004.953125} {"train_loss": -8.513895034790039, "global_step": 57120, "epoch": 340} {"train_loss": -8.548656463623047, "global_step": 57121, "epoch": 340} {"train_loss": -8.4549560546875, "global_step": 57122, "epoch": 340} {"train_loss": -8.463173866271973, "global_step": 57123, "epoch": 340} {"train_loss": -8.483402252197266, "global_step": 57124, "epoch": 340} {"train_loss": -8.568428039550781, "global_step": 57125, "epoch": 340} {"train_loss": -8.701833724975586, "global_step": 57126, "epoch": 340} {"train_loss": -8.76156234741211, "global_step": 57127, "epoch": 340} {"train_loss": -8.37690258026123, "global_step": 57128, "epoch": 340} {"train_loss": -8.425586700439453, "global_step": 57129, "epoch": 340} {"train_loss": -8.783157348632812, "global_step": 57130, "epoch": 340} {"train_loss": -8.58648681640625, "global_step": 57131, "epoch": 340} {"train_loss": -8.604487419128418, "global_step": 57132, "epoch": 340} {"train_loss": -8.409162521362305, "global_step": 57133, "epoch": 340} {"train_loss": -8.503702163696289, "global_step": 57134, "epoch": 340} {"train_loss": -8.68150520324707, "global_step": 57135, "epoch": 340} {"train_loss": -8.453182220458984, "global_step": 57136, "epoch": 340} {"train_loss": -8.722713470458984, "global_step": 57137, "epoch": 340} {"train_loss": -8.423470497131348, "global_step": 57138, "epoch": 340} {"train_loss": -8.729496002197266, "global_step": 57139, "epoch": 340} {"train_loss": -8.838764190673828, "global_step": 57140, "epoch": 340} {"train_loss": -8.43339729309082, "global_step": 57141, "epoch": 340} {"train_loss": -8.571260452270508, "global_step": 57142, "epoch": 340} {"train_loss": -8.651144027709961, "global_step": 57143, "epoch": 340} {"train_loss": -8.738842010498047, "global_step": 57144, "epoch": 340} {"train_loss": -8.650629043579102, "global_step": 57145, "epoch": 340} {"train_loss": -8.595769882202148, "global_step": 57146, "epoch": 340} {"train_loss": -8.4081449508667, "global_step": 57147, "epoch": 340} {"train_loss": -8.89033317565918, "global_step": 57148, "epoch": 340} {"train_loss": -8.762592315673828, "global_step": 57149, "epoch": 340} {"train_loss": -8.567869186401367, "global_step": 57150, "epoch": 340} {"train_loss": -8.62426471710205, "global_step": 57151, "epoch": 340} {"train_loss": -8.606598854064941, "global_step": 57152, "epoch": 340} {"train_loss": -8.5665283203125, "global_step": 57153, "epoch": 340} {"train_loss": -8.543333053588867, "global_step": 57154, "epoch": 340} {"train_loss": -8.686025619506836, "global_step": 57155, "epoch": 340} {"train_loss": -8.450727462768555, "global_step": 57156, "epoch": 340} {"train_loss": -8.530099868774414, "global_step": 57157, "epoch": 340} {"train_loss": -8.692767143249512, "global_step": 57158, "epoch": 340} {"train_loss": -8.441967010498047, "global_step": 57159, "epoch": 340} {"train_loss": -8.696846961975098, "global_step": 57160, "epoch": 340} {"train_loss": -8.535185813903809, "global_step": 57161, "epoch": 340} {"train_loss": -8.841482162475586, "global_step": 57162, "epoch": 340} {"train_loss": -8.255266189575195, "global_step": 57163, "epoch": 340} {"train_loss": -8.624340057373047, "global_step": 57164, "epoch": 340} {"train_loss": -8.56873893737793, "global_step": 57165, "epoch": 340} {"train_loss": -8.686193466186523, "global_step": 57166, "epoch": 340} {"train_loss": -8.163214683532715, "global_step": 57167, "epoch": 340} {"train_loss": -8.900720596313477, "global_step": 57168, "epoch": 340} {"train_loss": -8.218978881835938, "global_step": 57169, "epoch": 340} {"train_loss": -8.513668060302734, "global_step": 57170, "epoch": 340} {"train_loss": -7.920846939086914, "global_step": 57171, "epoch": 340} {"train_loss": -8.271249771118164, "global_step": 57172, "epoch": 340} {"train_loss": -8.537483215332031, "global_step": 57173, "epoch": 340} {"train_loss": -8.449640274047852, "global_step": 57174, "epoch": 340} {"train_loss": -8.421113967895508, "global_step": 57175, "epoch": 340} {"train_loss": -8.316255569458008, "global_step": 57176, "epoch": 340} {"train_loss": -8.019831657409668, "global_step": 57177, "epoch": 340} {"train_loss": -8.193756103515625, "global_step": 57178, "epoch": 340} {"train_loss": -8.52602767944336, "global_step": 57179, "epoch": 340} {"train_loss": -8.715813636779785, "global_step": 57180, "epoch": 340} {"train_loss": -8.237316131591797, "global_step": 57181, "epoch": 340} {"train_loss": -8.288299560546875, "global_step": 57182, "epoch": 340} {"train_loss": -8.474936485290527, "global_step": 57183, "epoch": 340} {"train_loss": -8.522858619689941, "global_step": 57184, "epoch": 340} {"train_loss": -8.34523868560791, "global_step": 57185, "epoch": 340} {"train_loss": -8.394655227661133, "global_step": 57186, "epoch": 340} {"train_loss": -8.657106399536133, "global_step": 57187, "epoch": 340} {"train_loss": -8.361169815063477, "global_step": 57188, "epoch": 340} {"train_loss": -8.620044708251953, "global_step": 57189, "epoch": 340} {"train_loss": -8.436705589294434, "global_step": 57190, "epoch": 340} {"train_loss": -8.759262084960938, "global_step": 57191, "epoch": 340} {"train_loss": -8.375205993652344, "global_step": 57192, "epoch": 340} {"train_loss": -8.547113418579102, "global_step": 57193, "epoch": 340} {"train_loss": -8.488507270812988, "global_step": 57194, "epoch": 340} {"train_loss": -8.573555946350098, "global_step": 57195, "epoch": 340} {"train_loss": -8.493913650512695, "global_step": 57196, "epoch": 340} {"train_loss": -8.732311248779297, "global_step": 57197, "epoch": 340} {"train_loss": -8.772099494934082, "global_step": 57198, "epoch": 340} {"train_loss": -8.637167930603027, "global_step": 57199, "epoch": 340} {"train_loss": -8.584013938903809, "global_step": 57200, "epoch": 340} {"train_loss": -8.527046203613281, "global_step": 57201, "epoch": 340} {"train_loss": -8.764933586120605, "global_step": 57202, "epoch": 340} {"train_loss": -8.699728012084961, "global_step": 57203, "epoch": 340} {"train_loss": -8.610271453857422, "global_step": 57204, "epoch": 340} {"train_loss": -8.64153003692627, "global_step": 57205, "epoch": 340} {"train_loss": -8.618921279907227, "global_step": 57206, "epoch": 340} {"train_loss": -8.496825218200684, "global_step": 57207, "epoch": 340} {"train_loss": -8.70872974395752, "global_step": 57208, "epoch": 340} {"train_loss": -8.386813163757324, "global_step": 57209, "epoch": 340} {"train_loss": -8.354602813720703, "global_step": 57210, "epoch": 340} {"train_loss": -8.398982048034668, "global_step": 57211, "epoch": 340} {"train_loss": -7.981578826904297, "global_step": 57212, "epoch": 340} {"train_loss": -8.564716339111328, "global_step": 57213, "epoch": 340} {"train_loss": -8.079339027404785, "global_step": 57214, "epoch": 340} {"train_loss": -8.14901351928711, "global_step": 57215, "epoch": 340} {"train_loss": -8.412542343139648, "global_step": 57216, "epoch": 340} {"train_loss": -8.32548999786377, "global_step": 57217, "epoch": 340} {"train_loss": -8.375393867492676, "global_step": 57218, "epoch": 340} {"train_loss": -8.381011962890625, "global_step": 57219, "epoch": 340} {"train_loss": -8.561038970947266, "global_step": 57220, "epoch": 340} {"train_loss": -8.354849815368652, "global_step": 57221, "epoch": 340} {"train_loss": -8.299083709716797, "global_step": 57222, "epoch": 340} {"train_loss": -8.440717697143555, "global_step": 57223, "epoch": 340} {"train_loss": -8.489147186279297, "global_step": 57224, "epoch": 340} {"train_loss": -8.396739959716797, "global_step": 57225, "epoch": 340} {"train_loss": -8.494852066040039, "global_step": 57226, "epoch": 340} {"train_loss": -8.462098121643066, "global_step": 57227, "epoch": 340} {"train_loss": -8.429637908935547, "global_step": 57228, "epoch": 340} {"train_loss": -8.616409301757812, "global_step": 57229, "epoch": 340} {"train_loss": -8.683286666870117, "global_step": 57230, "epoch": 340} {"train_loss": -8.819267272949219, "global_step": 57231, "epoch": 340} {"train_loss": -8.45964527130127, "global_step": 57232, "epoch": 340} {"train_loss": -8.614599227905273, "global_step": 57233, "epoch": 340} {"train_loss": -8.463579177856445, "global_step": 57234, "epoch": 340} {"train_loss": -8.648172378540039, "global_step": 57235, "epoch": 340} {"train_loss": -8.555644035339355, "global_step": 57236, "epoch": 340} {"train_loss": -8.55735969543457, "global_step": 57237, "epoch": 340} {"train_loss": -8.53786563873291, "global_step": 57238, "epoch": 340} {"train_loss": -8.600240707397461, "global_step": 57239, "epoch": 340} {"train_loss": -8.865289688110352, "global_step": 57240, "epoch": 340} {"train_loss": -8.596351623535156, "global_step": 57241, "epoch": 340} {"train_loss": -8.749082565307617, "global_step": 57242, "epoch": 340} {"train_loss": -8.768280029296875, "global_step": 57243, "epoch": 340} {"train_loss": -8.668105125427246, "global_step": 57244, "epoch": 340} {"train_loss": -8.683881759643555, "global_step": 57245, "epoch": 340} {"train_loss": -8.775941848754883, "global_step": 57246, "epoch": 340} {"train_loss": -8.488554000854492, "global_step": 57247, "epoch": 340} {"train_loss": -8.663084983825684, "global_step": 57248, "epoch": 340} {"train_loss": -8.588874816894531, "global_step": 57249, "epoch": 340} {"train_loss": -8.561909675598145, "global_step": 57250, "epoch": 340} {"train_loss": -8.785621643066406, "global_step": 57251, "epoch": 340} {"train_loss": -8.435469627380371, "global_step": 57252, "epoch": 340} {"train_loss": -8.50633430480957, "global_step": 57253, "epoch": 340} {"train_loss": -8.758050918579102, "global_step": 57254, "epoch": 340} {"train_loss": -8.605064392089844, "global_step": 57255, "epoch": 340} {"train_loss": -8.816383361816406, "global_step": 57256, "epoch": 340} {"train_loss": -8.368650436401367, "global_step": 57257, "epoch": 340} {"train_loss": -8.864363670349121, "global_step": 57258, "epoch": 340} {"train_loss": -8.348175048828125, "global_step": 57259, "epoch": 340} {"train_loss": -8.609792709350586, "global_step": 57260, "epoch": 340} {"train_loss": -8.616198539733887, "global_step": 57261, "epoch": 340} {"train_loss": -8.706411361694336, "global_step": 57262, "epoch": 340} {"train_loss": -8.759441375732422, "global_step": 57263, "epoch": 340} {"train_loss": -8.827960968017578, "global_step": 57264, "epoch": 340} {"train_loss": -8.500394821166992, "global_step": 57265, "epoch": 340} {"train_loss": -8.7643404006958, "global_step": 57266, "epoch": 340} {"train_loss": -8.571958541870117, "global_step": 57267, "epoch": 340} {"train_loss": -8.602092742919922, "global_step": 57268, "epoch": 340} {"train_loss": -8.651662826538086, "global_step": 57269, "epoch": 340} {"train_loss": -7.896284580230713, "global_step": 57270, "epoch": 340} {"train_loss": -8.54629898071289, "global_step": 57271, "epoch": 340} {"train_loss": -8.38248062133789, "global_step": 57272, "epoch": 340} {"train_loss": -8.623723983764648, "global_step": 57273, "epoch": 340} {"train_loss": -8.10115909576416, "global_step": 57274, "epoch": 340} {"train_loss": -8.520732879638672, "global_step": 57275, "epoch": 340} {"train_loss": -8.479284286499023, "global_step": 57276, "epoch": 340} {"train_loss": -8.394566535949707, "global_step": 57277, "epoch": 340} {"train_loss": -8.455038070678711, "global_step": 57278, "epoch": 340} {"train_loss": -8.328628540039062, "global_step": 57279, "epoch": 340} {"train_loss": -8.668941497802734, "global_step": 57280, "epoch": 340} {"train_loss": -8.625160217285156, "global_step": 57281, "epoch": 340} {"train_loss": -8.191661834716797, "global_step": 57282, "epoch": 340} {"train_loss": -8.515070915222168, "global_step": 57283, "epoch": 340} {"train_loss": -8.54965591430664, "global_step": 57284, "epoch": 340} {"train_loss": -8.604662895202637, "global_step": 57285, "epoch": 340} {"train_loss": -8.617269515991211, "global_step": 57286, "epoch": 340} {"train_loss": -8.533468067646027, "global_step": 57287, "epoch": 340, "val_loss": 189178.828125, "train_action_mse_error": 4.677340984344482} {"train_loss": -8.563108444213867, "global_step": 57288, "epoch": 341} {"train_loss": -8.438015937805176, "global_step": 57289, "epoch": 341} {"train_loss": -8.566463470458984, "global_step": 57290, "epoch": 341} {"train_loss": -8.520622253417969, "global_step": 57291, "epoch": 341} {"train_loss": -8.382915496826172, "global_step": 57292, "epoch": 341} {"train_loss": -8.366792678833008, "global_step": 57293, "epoch": 341} {"train_loss": -8.692255973815918, "global_step": 57294, "epoch": 341} {"train_loss": -8.424968719482422, "global_step": 57295, "epoch": 341} {"train_loss": -8.630334854125977, "global_step": 57296, "epoch": 341} {"train_loss": -8.557079315185547, "global_step": 57297, "epoch": 341} {"train_loss": -8.463743209838867, "global_step": 57298, "epoch": 341} {"train_loss": -8.472076416015625, "global_step": 57299, "epoch": 341} {"train_loss": -8.535093307495117, "global_step": 57300, "epoch": 341} {"train_loss": -8.532885551452637, "global_step": 57301, "epoch": 341} {"train_loss": -8.556039810180664, "global_step": 57302, "epoch": 341} {"train_loss": -8.602651596069336, "global_step": 57303, "epoch": 341} {"train_loss": -8.472442626953125, "global_step": 57304, "epoch": 341} {"train_loss": -8.467992782592773, "global_step": 57305, "epoch": 341} {"train_loss": -8.583438873291016, "global_step": 57306, "epoch": 341} {"train_loss": -8.52482795715332, "global_step": 57307, "epoch": 341} {"train_loss": -8.709207534790039, "global_step": 57308, "epoch": 341} {"train_loss": -8.449790954589844, "global_step": 57309, "epoch": 341} {"train_loss": -8.344968795776367, "global_step": 57310, "epoch": 341} {"train_loss": -8.76078987121582, "global_step": 57311, "epoch": 341} {"train_loss": -8.434279441833496, "global_step": 57312, "epoch": 341} {"train_loss": -8.810285568237305, "global_step": 57313, "epoch": 341} {"train_loss": -8.5228271484375, "global_step": 57314, "epoch": 341} {"train_loss": -8.63544750213623, "global_step": 57315, "epoch": 341} {"train_loss": -8.796192169189453, "global_step": 57316, "epoch": 341} {"train_loss": -8.50367546081543, "global_step": 57317, "epoch": 341} {"train_loss": -8.653268814086914, "global_step": 57318, "epoch": 341} {"train_loss": -8.730627059936523, "global_step": 57319, "epoch": 341} {"train_loss": -8.727472305297852, "global_step": 57320, "epoch": 341} {"train_loss": -8.60280990600586, "global_step": 57321, "epoch": 341} {"train_loss": -8.553610801696777, "global_step": 57322, "epoch": 341} {"train_loss": -8.401565551757812, "global_step": 57323, "epoch": 341} {"train_loss": -8.50935173034668, "global_step": 57324, "epoch": 341} {"train_loss": -8.901373863220215, "global_step": 57325, "epoch": 341} {"train_loss": -8.842740058898926, "global_step": 57326, "epoch": 341} {"train_loss": -8.542187690734863, "global_step": 57327, "epoch": 341} {"train_loss": -8.722230911254883, "global_step": 57328, "epoch": 341} {"train_loss": -8.633066177368164, "global_step": 57329, "epoch": 341} {"train_loss": -8.51594352722168, "global_step": 57330, "epoch": 341} {"train_loss": -8.604447364807129, "global_step": 57331, "epoch": 341} {"train_loss": -8.656484603881836, "global_step": 57332, "epoch": 341} {"train_loss": -8.505502700805664, "global_step": 57333, "epoch": 341} {"train_loss": -8.56049919128418, "global_step": 57334, "epoch": 341} {"train_loss": -8.788872718811035, "global_step": 57335, "epoch": 341} {"train_loss": -8.654520034790039, "global_step": 57336, "epoch": 341} {"train_loss": -8.583303451538086, "global_step": 57337, "epoch": 341} {"train_loss": -8.503046035766602, "global_step": 57338, "epoch": 341} {"train_loss": -8.392084121704102, "global_step": 57339, "epoch": 341} {"train_loss": -8.524675369262695, "global_step": 57340, "epoch": 341} {"train_loss": -8.319709777832031, "global_step": 57341, "epoch": 341} {"train_loss": -8.538488388061523, "global_step": 57342, "epoch": 341} {"train_loss": -8.471076965332031, "global_step": 57343, "epoch": 341} {"train_loss": -8.817503929138184, "global_step": 57344, "epoch": 341} {"train_loss": -8.296165466308594, "global_step": 57345, "epoch": 341} {"train_loss": -8.620548248291016, "global_step": 57346, "epoch": 341} {"train_loss": -8.301980972290039, "global_step": 57347, "epoch": 341} {"train_loss": -8.552350044250488, "global_step": 57348, "epoch": 341} {"train_loss": -8.456206321716309, "global_step": 57349, "epoch": 341} {"train_loss": -8.196569442749023, "global_step": 57350, "epoch": 341} {"train_loss": -8.645541191101074, "global_step": 57351, "epoch": 341} {"train_loss": -8.578195571899414, "global_step": 57352, "epoch": 341} {"train_loss": -8.476373672485352, "global_step": 57353, "epoch": 341} {"train_loss": -8.508292198181152, "global_step": 57354, "epoch": 341} {"train_loss": -8.545143127441406, "global_step": 57355, "epoch": 341} {"train_loss": -8.398721694946289, "global_step": 57356, "epoch": 341} {"train_loss": -8.524029731750488, "global_step": 57357, "epoch": 341} {"train_loss": -8.246377944946289, "global_step": 57358, "epoch": 341} {"train_loss": -8.644017219543457, "global_step": 57359, "epoch": 341} {"train_loss": -8.66511058807373, "global_step": 57360, "epoch": 341} {"train_loss": -8.489967346191406, "global_step": 57361, "epoch": 341} {"train_loss": -8.568446159362793, "global_step": 57362, "epoch": 341} {"train_loss": -8.61318588256836, "global_step": 57363, "epoch": 341} {"train_loss": -8.49571418762207, "global_step": 57364, "epoch": 341} {"train_loss": -8.310554504394531, "global_step": 57365, "epoch": 341} {"train_loss": -8.418011665344238, "global_step": 57366, "epoch": 341} {"train_loss": -8.4935884475708, "global_step": 57367, "epoch": 341} {"train_loss": -8.684345245361328, "global_step": 57368, "epoch": 341} {"train_loss": -8.541110038757324, "global_step": 57369, "epoch": 341} {"train_loss": -8.374456405639648, "global_step": 57370, "epoch": 341} {"train_loss": -8.316264152526855, "global_step": 57371, "epoch": 341} {"train_loss": -8.698436737060547, "global_step": 57372, "epoch": 341} {"train_loss": -8.485591888427734, "global_step": 57373, "epoch": 341} {"train_loss": -8.608360290527344, "global_step": 57374, "epoch": 341} {"train_loss": -8.5899019241333, "global_step": 57375, "epoch": 341} {"train_loss": -8.610126495361328, "global_step": 57376, "epoch": 341} {"train_loss": -8.554210662841797, "global_step": 57377, "epoch": 341} {"train_loss": -8.652872085571289, "global_step": 57378, "epoch": 341} {"train_loss": -8.477724075317383, "global_step": 57379, "epoch": 341} {"train_loss": -8.888237953186035, "global_step": 57380, "epoch": 341} {"train_loss": -8.834848403930664, "global_step": 57381, "epoch": 341} {"train_loss": -9.012596130371094, "global_step": 57382, "epoch": 341} {"train_loss": -8.890748023986816, "global_step": 57383, "epoch": 341} {"train_loss": -8.842031478881836, "global_step": 57384, "epoch": 341} {"train_loss": -8.654635429382324, "global_step": 57385, "epoch": 341} {"train_loss": -8.600194931030273, "global_step": 57386, "epoch": 341} {"train_loss": -8.609552383422852, "global_step": 57387, "epoch": 341} {"train_loss": -8.805646896362305, "global_step": 57388, "epoch": 341} {"train_loss": -8.586050033569336, "global_step": 57389, "epoch": 341} {"train_loss": -8.71500015258789, "global_step": 57390, "epoch": 341} {"train_loss": -8.60232162475586, "global_step": 57391, "epoch": 341} {"train_loss": -8.245500564575195, "global_step": 57392, "epoch": 341} {"train_loss": -8.637680053710938, "global_step": 57393, "epoch": 341} {"train_loss": -8.272125244140625, "global_step": 57394, "epoch": 341} {"train_loss": -8.65614128112793, "global_step": 57395, "epoch": 341} {"train_loss": -8.518482208251953, "global_step": 57396, "epoch": 341} {"train_loss": -8.676854133605957, "global_step": 57397, "epoch": 341} {"train_loss": -8.412622451782227, "global_step": 57398, "epoch": 341} {"train_loss": -8.680326461791992, "global_step": 57399, "epoch": 341} {"train_loss": -8.63017463684082, "global_step": 57400, "epoch": 341} {"train_loss": -8.562244415283203, "global_step": 57401, "epoch": 341} {"train_loss": -8.598821640014648, "global_step": 57402, "epoch": 341} {"train_loss": -8.517618179321289, "global_step": 57403, "epoch": 341} {"train_loss": -8.709694862365723, "global_step": 57404, "epoch": 341} {"train_loss": -8.663983345031738, "global_step": 57405, "epoch": 341} {"train_loss": -8.532922744750977, "global_step": 57406, "epoch": 341} {"train_loss": -8.493114471435547, "global_step": 57407, "epoch": 341} {"train_loss": -8.519124984741211, "global_step": 57408, "epoch": 341} {"train_loss": -8.26871109008789, "global_step": 57409, "epoch": 341} {"train_loss": -8.538759231567383, "global_step": 57410, "epoch": 341} {"train_loss": -8.438739776611328, "global_step": 57411, "epoch": 341} {"train_loss": -8.56122875213623, "global_step": 57412, "epoch": 341} {"train_loss": -8.195610046386719, "global_step": 57413, "epoch": 341} {"train_loss": -8.537714958190918, "global_step": 57414, "epoch": 341} {"train_loss": -8.492431640625, "global_step": 57415, "epoch": 341} {"train_loss": -8.220256805419922, "global_step": 57416, "epoch": 341} {"train_loss": -8.64735221862793, "global_step": 57417, "epoch": 341} {"train_loss": -8.47026538848877, "global_step": 57418, "epoch": 341} {"train_loss": -8.254559516906738, "global_step": 57419, "epoch": 341} {"train_loss": -8.790449142456055, "global_step": 57420, "epoch": 341} {"train_loss": -8.548452377319336, "global_step": 57421, "epoch": 341} {"train_loss": -8.540384292602539, "global_step": 57422, "epoch": 341} {"train_loss": -8.67548656463623, "global_step": 57423, "epoch": 341} {"train_loss": -8.398405075073242, "global_step": 57424, "epoch": 341} {"train_loss": -8.283382415771484, "global_step": 57425, "epoch": 341} {"train_loss": -8.486358642578125, "global_step": 57426, "epoch": 341} {"train_loss": -8.522674560546875, "global_step": 57427, "epoch": 341} {"train_loss": -8.587148666381836, "global_step": 57428, "epoch": 341} {"train_loss": -8.376300811767578, "global_step": 57429, "epoch": 341} {"train_loss": -8.438529968261719, "global_step": 57430, "epoch": 341} {"train_loss": -8.418882369995117, "global_step": 57431, "epoch": 341} {"train_loss": -8.550872802734375, "global_step": 57432, "epoch": 341} {"train_loss": -8.566856384277344, "global_step": 57433, "epoch": 341} {"train_loss": -8.3438081741333, "global_step": 57434, "epoch": 341} {"train_loss": -8.329448699951172, "global_step": 57435, "epoch": 341} {"train_loss": -8.38936996459961, "global_step": 57436, "epoch": 341} {"train_loss": -8.552648544311523, "global_step": 57437, "epoch": 341} {"train_loss": -8.453263282775879, "global_step": 57438, "epoch": 341} {"train_loss": -8.338171005249023, "global_step": 57439, "epoch": 341} {"train_loss": -8.295780181884766, "global_step": 57440, "epoch": 341} {"train_loss": -8.4359769821167, "global_step": 57441, "epoch": 341} {"train_loss": -8.608062744140625, "global_step": 57442, "epoch": 341} {"train_loss": -8.675323486328125, "global_step": 57443, "epoch": 341} {"train_loss": -8.415628433227539, "global_step": 57444, "epoch": 341} {"train_loss": -8.499308586120605, "global_step": 57445, "epoch": 341} {"train_loss": -8.459722518920898, "global_step": 57446, "epoch": 341} {"train_loss": -8.401784896850586, "global_step": 57447, "epoch": 341} {"train_loss": -8.337860107421875, "global_step": 57448, "epoch": 341} {"train_loss": -8.482039451599121, "global_step": 57449, "epoch": 341} {"train_loss": -8.649141311645508, "global_step": 57450, "epoch": 341} {"train_loss": -8.772244453430176, "global_step": 57451, "epoch": 341} {"train_loss": -8.515788078308105, "global_step": 57452, "epoch": 341} {"train_loss": -8.46626091003418, "global_step": 57453, "epoch": 341} {"train_loss": -8.686487197875977, "global_step": 57454, "epoch": 341} {"train_loss": -8.543053581601097, "global_step": 57455, "epoch": 341, "val_loss": 187038.546875} {"train_loss": -8.297149658203125, "global_step": 57456, "epoch": 342} {"train_loss": -8.715564727783203, "global_step": 57457, "epoch": 342} {"train_loss": -8.702997207641602, "global_step": 57458, "epoch": 342} {"train_loss": -8.676837921142578, "global_step": 57459, "epoch": 342} {"train_loss": -8.648820877075195, "global_step": 57460, "epoch": 342} {"train_loss": -8.633783340454102, "global_step": 57461, "epoch": 342} {"train_loss": -8.749062538146973, "global_step": 57462, "epoch": 342} {"train_loss": -8.571277618408203, "global_step": 57463, "epoch": 342} {"train_loss": -8.598502159118652, "global_step": 57464, "epoch": 342} {"train_loss": -8.712034225463867, "global_step": 57465, "epoch": 342} {"train_loss": -8.648107528686523, "global_step": 57466, "epoch": 342} {"train_loss": -8.546741485595703, "global_step": 57467, "epoch": 342} {"train_loss": -8.322881698608398, "global_step": 57468, "epoch": 342} {"train_loss": -8.463163375854492, "global_step": 57469, "epoch": 342} {"train_loss": -8.514863014221191, "global_step": 57470, "epoch": 342} {"train_loss": -8.571378707885742, "global_step": 57471, "epoch": 342} {"train_loss": -8.330184936523438, "global_step": 57472, "epoch": 342} {"train_loss": -8.410974502563477, "global_step": 57473, "epoch": 342} {"train_loss": -8.526025772094727, "global_step": 57474, "epoch": 342} {"train_loss": -8.616266250610352, "global_step": 57475, "epoch": 342} {"train_loss": -8.49277114868164, "global_step": 57476, "epoch": 342} {"train_loss": -8.83553409576416, "global_step": 57477, "epoch": 342} {"train_loss": -8.309144973754883, "global_step": 57478, "epoch": 342} {"train_loss": -8.56064224243164, "global_step": 57479, "epoch": 342} {"train_loss": -8.524589538574219, "global_step": 57480, "epoch": 342} {"train_loss": -8.506241798400879, "global_step": 57481, "epoch": 342} {"train_loss": -8.548992156982422, "global_step": 57482, "epoch": 342} {"train_loss": -8.471059799194336, "global_step": 57483, "epoch": 342} {"train_loss": -8.597137451171875, "global_step": 57484, "epoch": 342} {"train_loss": -8.630133628845215, "global_step": 57485, "epoch": 342} {"train_loss": -8.731880187988281, "global_step": 57486, "epoch": 342} {"train_loss": -8.477313995361328, "global_step": 57487, "epoch": 342} {"train_loss": -8.742627143859863, "global_step": 57488, "epoch": 342} {"train_loss": -8.728578567504883, "global_step": 57489, "epoch": 342} {"train_loss": -8.607522964477539, "global_step": 57490, "epoch": 342} {"train_loss": -8.70773696899414, "global_step": 57491, "epoch": 342} {"train_loss": -8.584524154663086, "global_step": 57492, "epoch": 342} {"train_loss": -8.673727035522461, "global_step": 57493, "epoch": 342} {"train_loss": -8.743841171264648, "global_step": 57494, "epoch": 342} {"train_loss": -8.532320022583008, "global_step": 57495, "epoch": 342} {"train_loss": -8.519268035888672, "global_step": 57496, "epoch": 342} {"train_loss": -8.863099098205566, "global_step": 57497, "epoch": 342} {"train_loss": -8.596860885620117, "global_step": 57498, "epoch": 342} {"train_loss": -8.418506622314453, "global_step": 57499, "epoch": 342} {"train_loss": -8.63463306427002, "global_step": 57500, "epoch": 342} {"train_loss": -8.505146026611328, "global_step": 57501, "epoch": 342} {"train_loss": -8.53803539276123, "global_step": 57502, "epoch": 342} {"train_loss": -8.727210998535156, "global_step": 57503, "epoch": 342} {"train_loss": -8.43083381652832, "global_step": 57504, "epoch": 342} {"train_loss": -8.590431213378906, "global_step": 57505, "epoch": 342} {"train_loss": -8.52695083618164, "global_step": 57506, "epoch": 342} {"train_loss": -8.470427513122559, "global_step": 57507, "epoch": 342} {"train_loss": -8.614591598510742, "global_step": 57508, "epoch": 342} {"train_loss": -8.619647026062012, "global_step": 57509, "epoch": 342} {"train_loss": -8.363911628723145, "global_step": 57510, "epoch": 342} {"train_loss": -8.440132141113281, "global_step": 57511, "epoch": 342} {"train_loss": -8.478377342224121, "global_step": 57512, "epoch": 342} {"train_loss": -8.540605545043945, "global_step": 57513, "epoch": 342} {"train_loss": -8.531803131103516, "global_step": 57514, "epoch": 342} {"train_loss": -8.385818481445312, "global_step": 57515, "epoch": 342} {"train_loss": -8.685701370239258, "global_step": 57516, "epoch": 342} {"train_loss": -8.637276649475098, "global_step": 57517, "epoch": 342} {"train_loss": -8.422819137573242, "global_step": 57518, "epoch": 342} {"train_loss": -8.490745544433594, "global_step": 57519, "epoch": 342} {"train_loss": -8.496397018432617, "global_step": 57520, "epoch": 342} {"train_loss": -8.378506660461426, "global_step": 57521, "epoch": 342} {"train_loss": -8.498104095458984, "global_step": 57522, "epoch": 342} {"train_loss": -8.814765930175781, "global_step": 57523, "epoch": 342} {"train_loss": -8.307844161987305, "global_step": 57524, "epoch": 342} {"train_loss": -8.522603988647461, "global_step": 57525, "epoch": 342} {"train_loss": -8.53231430053711, "global_step": 57526, "epoch": 342} {"train_loss": -8.395220756530762, "global_step": 57527, "epoch": 342} {"train_loss": -8.479423522949219, "global_step": 57528, "epoch": 342} {"train_loss": -8.60440731048584, "global_step": 57529, "epoch": 342} {"train_loss": -8.693941116333008, "global_step": 57530, "epoch": 342} {"train_loss": -8.629749298095703, "global_step": 57531, "epoch": 342} {"train_loss": -8.703104972839355, "global_step": 57532, "epoch": 342} {"train_loss": -8.58536148071289, "global_step": 57533, "epoch": 342} {"train_loss": -8.683945655822754, "global_step": 57534, "epoch": 342} {"train_loss": -8.777830123901367, "global_step": 57535, "epoch": 342} {"train_loss": -8.691267013549805, "global_step": 57536, "epoch": 342} {"train_loss": -8.756641387939453, "global_step": 57537, "epoch": 342} {"train_loss": -8.71291446685791, "global_step": 57538, "epoch": 342} {"train_loss": -8.598489761352539, "global_step": 57539, "epoch": 342} {"train_loss": -8.541654586791992, "global_step": 57540, "epoch": 342} {"train_loss": -8.824639320373535, "global_step": 57541, "epoch": 342} {"train_loss": -8.738000869750977, "global_step": 57542, "epoch": 342} {"train_loss": -8.713796615600586, "global_step": 57543, "epoch": 342} {"train_loss": -8.670555114746094, "global_step": 57544, "epoch": 342} {"train_loss": -8.722976684570312, "global_step": 57545, "epoch": 342} {"train_loss": -8.646340370178223, "global_step": 57546, "epoch": 342} {"train_loss": -8.831939697265625, "global_step": 57547, "epoch": 342} {"train_loss": -8.812746047973633, "global_step": 57548, "epoch": 342} {"train_loss": -8.564688682556152, "global_step": 57549, "epoch": 342} {"train_loss": -8.73585319519043, "global_step": 57550, "epoch": 342} {"train_loss": -8.467915534973145, "global_step": 57551, "epoch": 342} {"train_loss": -8.667799949645996, "global_step": 57552, "epoch": 342} {"train_loss": -8.541732788085938, "global_step": 57553, "epoch": 342} {"train_loss": -8.698790550231934, "global_step": 57554, "epoch": 342} {"train_loss": -8.699540138244629, "global_step": 57555, "epoch": 342} {"train_loss": -8.581100463867188, "global_step": 57556, "epoch": 342} {"train_loss": -8.497846603393555, "global_step": 57557, "epoch": 342} {"train_loss": -8.79732894897461, "global_step": 57558, "epoch": 342} {"train_loss": -8.382902145385742, "global_step": 57559, "epoch": 342} {"train_loss": -8.4888916015625, "global_step": 57560, "epoch": 342} {"train_loss": -8.360507011413574, "global_step": 57561, "epoch": 342} {"train_loss": -8.38121223449707, "global_step": 57562, "epoch": 342} {"train_loss": -8.45048999786377, "global_step": 57563, "epoch": 342} {"train_loss": -8.287662506103516, "global_step": 57564, "epoch": 342} {"train_loss": -8.676071166992188, "global_step": 57565, "epoch": 342} {"train_loss": -8.537927627563477, "global_step": 57566, "epoch": 342} {"train_loss": -8.331303596496582, "global_step": 57567, "epoch": 342} {"train_loss": -8.560765266418457, "global_step": 57568, "epoch": 342} {"train_loss": -8.390560150146484, "global_step": 57569, "epoch": 342} {"train_loss": -8.504934310913086, "global_step": 57570, "epoch": 342} {"train_loss": -8.450296401977539, "global_step": 57571, "epoch": 342} {"train_loss": -8.605202674865723, "global_step": 57572, "epoch": 342} {"train_loss": -8.452192306518555, "global_step": 57573, "epoch": 342} {"train_loss": -8.471855163574219, "global_step": 57574, "epoch": 342} {"train_loss": -8.386978149414062, "global_step": 57575, "epoch": 342} {"train_loss": -8.737466812133789, "global_step": 57576, "epoch": 342} {"train_loss": -8.58163833618164, "global_step": 57577, "epoch": 342} {"train_loss": -8.824087142944336, "global_step": 57578, "epoch": 342} {"train_loss": -8.769294738769531, "global_step": 57579, "epoch": 342} {"train_loss": -8.75606918334961, "global_step": 57580, "epoch": 342} {"train_loss": -8.774229049682617, "global_step": 57581, "epoch": 342} {"train_loss": -8.532773971557617, "global_step": 57582, "epoch": 342} {"train_loss": -8.747783660888672, "global_step": 57583, "epoch": 342} {"train_loss": -8.75341510772705, "global_step": 57584, "epoch": 342} {"train_loss": -8.615385055541992, "global_step": 57585, "epoch": 342} {"train_loss": -8.59309196472168, "global_step": 57586, "epoch": 342} {"train_loss": -8.727807998657227, "global_step": 57587, "epoch": 342} {"train_loss": -8.67226791381836, "global_step": 57588, "epoch": 342} {"train_loss": -8.333772659301758, "global_step": 57589, "epoch": 342} {"train_loss": -8.076990127563477, "global_step": 57590, "epoch": 342} {"train_loss": -8.797348976135254, "global_step": 57591, "epoch": 342} {"train_loss": -8.613458633422852, "global_step": 57592, "epoch": 342} {"train_loss": -8.681921005249023, "global_step": 57593, "epoch": 342} {"train_loss": -8.643045425415039, "global_step": 57594, "epoch": 342} {"train_loss": -8.552552223205566, "global_step": 57595, "epoch": 342} {"train_loss": -8.713071823120117, "global_step": 57596, "epoch": 342} {"train_loss": -8.613975524902344, "global_step": 57597, "epoch": 342} {"train_loss": -8.36004638671875, "global_step": 57598, "epoch": 342} {"train_loss": -8.682825088500977, "global_step": 57599, "epoch": 342} {"train_loss": -8.489480972290039, "global_step": 57600, "epoch": 342} {"train_loss": -8.51314640045166, "global_step": 57601, "epoch": 342} {"train_loss": -8.171091079711914, "global_step": 57602, "epoch": 342} {"train_loss": -8.316400527954102, "global_step": 57603, "epoch": 342} {"train_loss": -7.948540210723877, "global_step": 57604, "epoch": 342} {"train_loss": -8.546609878540039, "global_step": 57605, "epoch": 342} {"train_loss": -7.95984411239624, "global_step": 57606, "epoch": 342} {"train_loss": -8.526571273803711, "global_step": 57607, "epoch": 342} {"train_loss": -8.023075103759766, "global_step": 57608, "epoch": 342} {"train_loss": -8.405879974365234, "global_step": 57609, "epoch": 342} {"train_loss": -8.08134937286377, "global_step": 57610, "epoch": 342} {"train_loss": -8.494189262390137, "global_step": 57611, "epoch": 342} {"train_loss": -8.323919296264648, "global_step": 57612, "epoch": 342} {"train_loss": -8.071245193481445, "global_step": 57613, "epoch": 342} {"train_loss": -8.27186393737793, "global_step": 57614, "epoch": 342} {"train_loss": -8.389643669128418, "global_step": 57615, "epoch": 342} {"train_loss": -8.17662239074707, "global_step": 57616, "epoch": 342} {"train_loss": -8.363374710083008, "global_step": 57617, "epoch": 342} {"train_loss": -8.255083084106445, "global_step": 57618, "epoch": 342} {"train_loss": -8.43410873413086, "global_step": 57619, "epoch": 342} {"train_loss": -8.237060546875, "global_step": 57620, "epoch": 342} {"train_loss": -8.408345222473145, "global_step": 57621, "epoch": 342} {"train_loss": -8.478059768676758, "global_step": 57622, "epoch": 342} {"train_loss": -8.542287724358696, "global_step": 57623, "epoch": 342, "val_loss": 188485.484375} {"train_loss": -8.294502258300781, "global_step": 57624, "epoch": 343} {"train_loss": -8.545095443725586, "global_step": 57625, "epoch": 343} {"train_loss": -8.682197570800781, "global_step": 57626, "epoch": 343} {"train_loss": -8.665573120117188, "global_step": 57627, "epoch": 343} {"train_loss": -8.59221076965332, "global_step": 57628, "epoch": 343} {"train_loss": -8.486526489257812, "global_step": 57629, "epoch": 343} {"train_loss": -8.522713661193848, "global_step": 57630, "epoch": 343} {"train_loss": -8.572071075439453, "global_step": 57631, "epoch": 343} {"train_loss": -8.64381217956543, "global_step": 57632, "epoch": 343} {"train_loss": -8.445812225341797, "global_step": 57633, "epoch": 343} {"train_loss": -8.648967742919922, "global_step": 57634, "epoch": 343} {"train_loss": -8.406455993652344, "global_step": 57635, "epoch": 343} {"train_loss": -8.574024200439453, "global_step": 57636, "epoch": 343} {"train_loss": -8.650653839111328, "global_step": 57637, "epoch": 343} {"train_loss": -8.522079467773438, "global_step": 57638, "epoch": 343} {"train_loss": -8.239459991455078, "global_step": 57639, "epoch": 343} {"train_loss": -8.542034149169922, "global_step": 57640, "epoch": 343} {"train_loss": -8.430280685424805, "global_step": 57641, "epoch": 343} {"train_loss": -8.276957511901855, "global_step": 57642, "epoch": 343} {"train_loss": -8.301243782043457, "global_step": 57643, "epoch": 343} {"train_loss": -8.517977714538574, "global_step": 57644, "epoch": 343} {"train_loss": -8.530559539794922, "global_step": 57645, "epoch": 343} {"train_loss": -8.510703086853027, "global_step": 57646, "epoch": 343} {"train_loss": -8.502224922180176, "global_step": 57647, "epoch": 343} {"train_loss": -8.533706665039062, "global_step": 57648, "epoch": 343} {"train_loss": -8.64305591583252, "global_step": 57649, "epoch": 343} {"train_loss": -8.879796981811523, "global_step": 57650, "epoch": 343} {"train_loss": -8.752240180969238, "global_step": 57651, "epoch": 343} {"train_loss": -8.546546936035156, "global_step": 57652, "epoch": 343} {"train_loss": -8.52792739868164, "global_step": 57653, "epoch": 343} {"train_loss": -8.581932067871094, "global_step": 57654, "epoch": 343} {"train_loss": -8.694221496582031, "global_step": 57655, "epoch": 343} {"train_loss": -8.609397888183594, "global_step": 57656, "epoch": 343} {"train_loss": -8.651817321777344, "global_step": 57657, "epoch": 343} {"train_loss": -8.729546546936035, "global_step": 57658, "epoch": 343} {"train_loss": -8.590570449829102, "global_step": 57659, "epoch": 343} {"train_loss": -8.635991096496582, "global_step": 57660, "epoch": 343} {"train_loss": -8.465505599975586, "global_step": 57661, "epoch": 343} {"train_loss": -8.669944763183594, "global_step": 57662, "epoch": 343} {"train_loss": -8.628324508666992, "global_step": 57663, "epoch": 343} {"train_loss": -8.627666473388672, "global_step": 57664, "epoch": 343} {"train_loss": -8.771068572998047, "global_step": 57665, "epoch": 343} {"train_loss": -8.538926124572754, "global_step": 57666, "epoch": 343} {"train_loss": -8.696127891540527, "global_step": 57667, "epoch": 343} {"train_loss": -8.518058776855469, "global_step": 57668, "epoch": 343} {"train_loss": -8.503633499145508, "global_step": 57669, "epoch": 343} {"train_loss": -8.626860618591309, "global_step": 57670, "epoch": 343} {"train_loss": -8.52208423614502, "global_step": 57671, "epoch": 343} {"train_loss": -8.577289581298828, "global_step": 57672, "epoch": 343} {"train_loss": -8.695280075073242, "global_step": 57673, "epoch": 343} {"train_loss": -8.757095336914062, "global_step": 57674, "epoch": 343} {"train_loss": -8.723611831665039, "global_step": 57675, "epoch": 343} {"train_loss": -8.596307754516602, "global_step": 57676, "epoch": 343} {"train_loss": -8.306313514709473, "global_step": 57677, "epoch": 343} {"train_loss": -8.551523208618164, "global_step": 57678, "epoch": 343} {"train_loss": -8.748525619506836, "global_step": 57679, "epoch": 343} {"train_loss": -8.298791885375977, "global_step": 57680, "epoch": 343} {"train_loss": -8.620943069458008, "global_step": 57681, "epoch": 343} {"train_loss": -8.42419719696045, "global_step": 57682, "epoch": 343} {"train_loss": -8.748391151428223, "global_step": 57683, "epoch": 343} {"train_loss": -8.42154312133789, "global_step": 57684, "epoch": 343} {"train_loss": -8.866259574890137, "global_step": 57685, "epoch": 343} {"train_loss": -8.599635124206543, "global_step": 57686, "epoch": 343} {"train_loss": -8.420536994934082, "global_step": 57687, "epoch": 343} {"train_loss": -8.508441925048828, "global_step": 57688, "epoch": 343} {"train_loss": -8.786147117614746, "global_step": 57689, "epoch": 343} {"train_loss": -8.639429092407227, "global_step": 57690, "epoch": 343} {"train_loss": -8.64175033569336, "global_step": 57691, "epoch": 343} {"train_loss": -8.503093719482422, "global_step": 57692, "epoch": 343} {"train_loss": -8.595756530761719, "global_step": 57693, "epoch": 343} {"train_loss": -8.584327697753906, "global_step": 57694, "epoch": 343} {"train_loss": -8.377934455871582, "global_step": 57695, "epoch": 343} {"train_loss": -8.528779983520508, "global_step": 57696, "epoch": 343} {"train_loss": -8.799131393432617, "global_step": 57697, "epoch": 343} {"train_loss": -8.104896545410156, "global_step": 57698, "epoch": 343} {"train_loss": -8.664979934692383, "global_step": 57699, "epoch": 343} {"train_loss": -8.369056701660156, "global_step": 57700, "epoch": 343} {"train_loss": -8.483880043029785, "global_step": 57701, "epoch": 343} {"train_loss": -8.484434127807617, "global_step": 57702, "epoch": 343} {"train_loss": -8.567716598510742, "global_step": 57703, "epoch": 343} {"train_loss": -8.48642349243164, "global_step": 57704, "epoch": 343} {"train_loss": -8.533413887023926, "global_step": 57705, "epoch": 343} {"train_loss": -8.261900901794434, "global_step": 57706, "epoch": 343} {"train_loss": -8.542387962341309, "global_step": 57707, "epoch": 343} {"train_loss": -8.220128059387207, "global_step": 57708, "epoch": 343} {"train_loss": -8.564231872558594, "global_step": 57709, "epoch": 343} {"train_loss": -8.374195098876953, "global_step": 57710, "epoch": 343} {"train_loss": -8.503789901733398, "global_step": 57711, "epoch": 343} {"train_loss": -8.192212104797363, "global_step": 57712, "epoch": 343} {"train_loss": -8.472030639648438, "global_step": 57713, "epoch": 343} {"train_loss": -8.329960823059082, "global_step": 57714, "epoch": 343} {"train_loss": -8.736165046691895, "global_step": 57715, "epoch": 343} {"train_loss": -8.385047912597656, "global_step": 57716, "epoch": 343} {"train_loss": -8.498464584350586, "global_step": 57717, "epoch": 343} {"train_loss": -8.480266571044922, "global_step": 57718, "epoch": 343} {"train_loss": -8.740886688232422, "global_step": 57719, "epoch": 343} {"train_loss": -8.546056747436523, "global_step": 57720, "epoch": 343} {"train_loss": -8.767887115478516, "global_step": 57721, "epoch": 343} {"train_loss": -8.450211524963379, "global_step": 57722, "epoch": 343} {"train_loss": -8.640432357788086, "global_step": 57723, "epoch": 343} {"train_loss": -8.659740447998047, "global_step": 57724, "epoch": 343} {"train_loss": -8.815326690673828, "global_step": 57725, "epoch": 343} {"train_loss": -8.654808044433594, "global_step": 57726, "epoch": 343} {"train_loss": -8.516902923583984, "global_step": 57727, "epoch": 343} {"train_loss": -8.738792419433594, "global_step": 57728, "epoch": 343} {"train_loss": -8.853431701660156, "global_step": 57729, "epoch": 343} {"train_loss": -8.786786079406738, "global_step": 57730, "epoch": 343} {"train_loss": -8.929120063781738, "global_step": 57731, "epoch": 343} {"train_loss": -8.714363098144531, "global_step": 57732, "epoch": 343} {"train_loss": -8.615377426147461, "global_step": 57733, "epoch": 343} {"train_loss": -8.775262832641602, "global_step": 57734, "epoch": 343} {"train_loss": -8.775839805603027, "global_step": 57735, "epoch": 343} {"train_loss": -8.77951431274414, "global_step": 57736, "epoch": 343} {"train_loss": -8.841814041137695, "global_step": 57737, "epoch": 343} {"train_loss": -8.563896179199219, "global_step": 57738, "epoch": 343} {"train_loss": -8.557821273803711, "global_step": 57739, "epoch": 343} {"train_loss": -8.783466339111328, "global_step": 57740, "epoch": 343} {"train_loss": -8.701642990112305, "global_step": 57741, "epoch": 343} {"train_loss": -8.613472938537598, "global_step": 57742, "epoch": 343} {"train_loss": -8.638631820678711, "global_step": 57743, "epoch": 343} {"train_loss": -8.545494079589844, "global_step": 57744, "epoch": 343} {"train_loss": -8.564855575561523, "global_step": 57745, "epoch": 343} {"train_loss": -8.604700088500977, "global_step": 57746, "epoch": 343} {"train_loss": -8.7564058303833, "global_step": 57747, "epoch": 343} {"train_loss": -8.36895751953125, "global_step": 57748, "epoch": 343} {"train_loss": -8.736263275146484, "global_step": 57749, "epoch": 343} {"train_loss": -8.513368606567383, "global_step": 57750, "epoch": 343} {"train_loss": -8.655943870544434, "global_step": 57751, "epoch": 343} {"train_loss": -8.669939994812012, "global_step": 57752, "epoch": 343} {"train_loss": -8.455674171447754, "global_step": 57753, "epoch": 343} {"train_loss": -8.69586181640625, "global_step": 57754, "epoch": 343} {"train_loss": -8.631522178649902, "global_step": 57755, "epoch": 343} {"train_loss": -8.582816123962402, "global_step": 57756, "epoch": 343} {"train_loss": -8.512380599975586, "global_step": 57757, "epoch": 343} {"train_loss": -8.675642013549805, "global_step": 57758, "epoch": 343} {"train_loss": -8.609098434448242, "global_step": 57759, "epoch": 343} {"train_loss": -8.74874496459961, "global_step": 57760, "epoch": 343} {"train_loss": -8.794553756713867, "global_step": 57761, "epoch": 343} {"train_loss": -8.652303695678711, "global_step": 57762, "epoch": 343} {"train_loss": -8.511982917785645, "global_step": 57763, "epoch": 343} {"train_loss": -8.663604736328125, "global_step": 57764, "epoch": 343} {"train_loss": -8.686155319213867, "global_step": 57765, "epoch": 343} {"train_loss": -8.508190155029297, "global_step": 57766, "epoch": 343} {"train_loss": -8.549705505371094, "global_step": 57767, "epoch": 343} {"train_loss": -8.59416389465332, "global_step": 57768, "epoch": 343} {"train_loss": -8.695472717285156, "global_step": 57769, "epoch": 343} {"train_loss": -8.24859619140625, "global_step": 57770, "epoch": 343} {"train_loss": -8.614725112915039, "global_step": 57771, "epoch": 343} {"train_loss": -8.239691734313965, "global_step": 57772, "epoch": 343} {"train_loss": -8.58218765258789, "global_step": 57773, "epoch": 343} {"train_loss": -8.309141159057617, "global_step": 57774, "epoch": 343} {"train_loss": -8.70596694946289, "global_step": 57775, "epoch": 343} {"train_loss": -8.627928733825684, "global_step": 57776, "epoch": 343} {"train_loss": -8.510986328125, "global_step": 57777, "epoch": 343} {"train_loss": -8.562978744506836, "global_step": 57778, "epoch": 343} {"train_loss": -8.480969429016113, "global_step": 57779, "epoch": 343} {"train_loss": -8.685562133789062, "global_step": 57780, "epoch": 343} {"train_loss": -8.579344749450684, "global_step": 57781, "epoch": 343} {"train_loss": -8.759196281433105, "global_step": 57782, "epoch": 343} {"train_loss": -8.764114379882812, "global_step": 57783, "epoch": 343} {"train_loss": -8.489648818969727, "global_step": 57784, "epoch": 343} {"train_loss": -8.863008499145508, "global_step": 57785, "epoch": 343} {"train_loss": -8.48414421081543, "global_step": 57786, "epoch": 343} {"train_loss": -8.626858711242676, "global_step": 57787, "epoch": 343} {"train_loss": -8.517679214477539, "global_step": 57788, "epoch": 343} {"train_loss": -8.562650680541992, "global_step": 57789, "epoch": 343} {"train_loss": -8.768647193908691, "global_step": 57790, "epoch": 343} {"train_loss": -8.58165533202035, "global_step": 57791, "epoch": 343, "val_loss": 191982.21875} {"train_loss": -8.59153938293457, "global_step": 57792, "epoch": 344} {"train_loss": -8.446571350097656, "global_step": 57793, "epoch": 344} {"train_loss": -8.535515785217285, "global_step": 57794, "epoch": 344} {"train_loss": -8.751459121704102, "global_step": 57795, "epoch": 344} {"train_loss": -8.554117202758789, "global_step": 57796, "epoch": 344} {"train_loss": -8.672483444213867, "global_step": 57797, "epoch": 344} {"train_loss": -8.43597412109375, "global_step": 57798, "epoch": 344} {"train_loss": -8.614921569824219, "global_step": 57799, "epoch": 344} {"train_loss": -8.207378387451172, "global_step": 57800, "epoch": 344} {"train_loss": -8.28435230255127, "global_step": 57801, "epoch": 344} {"train_loss": -8.276161193847656, "global_step": 57802, "epoch": 344} {"train_loss": -8.546339988708496, "global_step": 57803, "epoch": 344} {"train_loss": -8.37346076965332, "global_step": 57804, "epoch": 344} {"train_loss": -8.015993118286133, "global_step": 57805, "epoch": 344} {"train_loss": -8.570524215698242, "global_step": 57806, "epoch": 344} {"train_loss": -8.397918701171875, "global_step": 57807, "epoch": 344} {"train_loss": -8.06906509399414, "global_step": 57808, "epoch": 344} {"train_loss": -8.63796329498291, "global_step": 57809, "epoch": 344} {"train_loss": -8.167537689208984, "global_step": 57810, "epoch": 344} {"train_loss": -8.331619262695312, "global_step": 57811, "epoch": 344} {"train_loss": -8.272722244262695, "global_step": 57812, "epoch": 344} {"train_loss": -8.348991394042969, "global_step": 57813, "epoch": 344} {"train_loss": -8.50737190246582, "global_step": 57814, "epoch": 344} {"train_loss": -8.501988410949707, "global_step": 57815, "epoch": 344} {"train_loss": -8.518047332763672, "global_step": 57816, "epoch": 344} {"train_loss": -8.266363143920898, "global_step": 57817, "epoch": 344} {"train_loss": -8.486137390136719, "global_step": 57818, "epoch": 344} {"train_loss": -8.366735458374023, "global_step": 57819, "epoch": 344} {"train_loss": -8.587627410888672, "global_step": 57820, "epoch": 344} {"train_loss": -8.781254768371582, "global_step": 57821, "epoch": 344} {"train_loss": -8.5504150390625, "global_step": 57822, "epoch": 344} {"train_loss": -8.421808242797852, "global_step": 57823, "epoch": 344} {"train_loss": -8.701951026916504, "global_step": 57824, "epoch": 344} {"train_loss": -8.706729888916016, "global_step": 57825, "epoch": 344} {"train_loss": -8.610980033874512, "global_step": 57826, "epoch": 344} {"train_loss": -8.393810272216797, "global_step": 57827, "epoch": 344} {"train_loss": -8.574928283691406, "global_step": 57828, "epoch": 344} {"train_loss": -8.710855484008789, "global_step": 57829, "epoch": 344} {"train_loss": -8.637887954711914, "global_step": 57830, "epoch": 344} {"train_loss": -8.676862716674805, "global_step": 57831, "epoch": 344} {"train_loss": -8.49066162109375, "global_step": 57832, "epoch": 344} {"train_loss": -8.470945358276367, "global_step": 57833, "epoch": 344} {"train_loss": -8.66469955444336, "global_step": 57834, "epoch": 344} {"train_loss": -8.678141593933105, "global_step": 57835, "epoch": 344} {"train_loss": -8.69149398803711, "global_step": 57836, "epoch": 344} {"train_loss": -8.627915382385254, "global_step": 57837, "epoch": 344} {"train_loss": -8.81391716003418, "global_step": 57838, "epoch": 344} {"train_loss": -8.645515441894531, "global_step": 57839, "epoch": 344} {"train_loss": -8.826250076293945, "global_step": 57840, "epoch": 344} {"train_loss": -8.676589965820312, "global_step": 57841, "epoch": 344} {"train_loss": -8.554086685180664, "global_step": 57842, "epoch": 344} {"train_loss": -8.318717002868652, "global_step": 57843, "epoch": 344} {"train_loss": -8.575719833374023, "global_step": 57844, "epoch": 344} {"train_loss": -8.07229232788086, "global_step": 57845, "epoch": 344} {"train_loss": -8.576712608337402, "global_step": 57846, "epoch": 344} {"train_loss": -8.372246742248535, "global_step": 57847, "epoch": 344} {"train_loss": -8.380516052246094, "global_step": 57848, "epoch": 344} {"train_loss": -8.60947322845459, "global_step": 57849, "epoch": 344} {"train_loss": -8.384002685546875, "global_step": 57850, "epoch": 344} {"train_loss": -8.311502456665039, "global_step": 57851, "epoch": 344} {"train_loss": -8.517858505249023, "global_step": 57852, "epoch": 344} {"train_loss": -8.426436424255371, "global_step": 57853, "epoch": 344} {"train_loss": -8.392339706420898, "global_step": 57854, "epoch": 344} {"train_loss": -8.386037826538086, "global_step": 57855, "epoch": 344} {"train_loss": -8.348867416381836, "global_step": 57856, "epoch": 344} {"train_loss": -8.342019081115723, "global_step": 57857, "epoch": 344} {"train_loss": -8.352256774902344, "global_step": 57858, "epoch": 344} {"train_loss": -8.51042366027832, "global_step": 57859, "epoch": 344} {"train_loss": -8.456544876098633, "global_step": 57860, "epoch": 344} {"train_loss": -8.180193901062012, "global_step": 57861, "epoch": 344} {"train_loss": -8.389013290405273, "global_step": 57862, "epoch": 344} {"train_loss": -8.639385223388672, "global_step": 57863, "epoch": 344} {"train_loss": -8.59646987915039, "global_step": 57864, "epoch": 344} {"train_loss": -8.463939666748047, "global_step": 57865, "epoch": 344} {"train_loss": -8.505680084228516, "global_step": 57866, "epoch": 344} {"train_loss": -8.326852798461914, "global_step": 57867, "epoch": 344} {"train_loss": -8.445555686950684, "global_step": 57868, "epoch": 344} {"train_loss": -8.221407890319824, "global_step": 57869, "epoch": 344} {"train_loss": -8.549720764160156, "global_step": 57870, "epoch": 344} {"train_loss": -8.404172897338867, "global_step": 57871, "epoch": 344} {"train_loss": -8.362603187561035, "global_step": 57872, "epoch": 344} {"train_loss": -8.531579971313477, "global_step": 57873, "epoch": 344} {"train_loss": -8.698564529418945, "global_step": 57874, "epoch": 344} {"train_loss": -8.498811721801758, "global_step": 57875, "epoch": 344} {"train_loss": -8.563133239746094, "global_step": 57876, "epoch": 344} {"train_loss": -8.716752052307129, "global_step": 57877, "epoch": 344} {"train_loss": -8.52596664428711, "global_step": 57878, "epoch": 344} {"train_loss": -8.573455810546875, "global_step": 57879, "epoch": 344} {"train_loss": -8.564233779907227, "global_step": 57880, "epoch": 344} {"train_loss": -8.977758407592773, "global_step": 57881, "epoch": 344} {"train_loss": -8.712035179138184, "global_step": 57882, "epoch": 344} {"train_loss": -8.667981147766113, "global_step": 57883, "epoch": 344} {"train_loss": -8.626501083374023, "global_step": 57884, "epoch": 344} {"train_loss": -8.611172676086426, "global_step": 57885, "epoch": 344} {"train_loss": -8.764877319335938, "global_step": 57886, "epoch": 344} {"train_loss": -8.429567337036133, "global_step": 57887, "epoch": 344} {"train_loss": -8.731571197509766, "global_step": 57888, "epoch": 344} {"train_loss": -8.629064559936523, "global_step": 57889, "epoch": 344} {"train_loss": -8.608936309814453, "global_step": 57890, "epoch": 344} {"train_loss": -8.591043472290039, "global_step": 57891, "epoch": 344} {"train_loss": -8.748262405395508, "global_step": 57892, "epoch": 344} {"train_loss": -8.788516998291016, "global_step": 57893, "epoch": 344} {"train_loss": -8.593664169311523, "global_step": 57894, "epoch": 344} {"train_loss": -8.851446151733398, "global_step": 57895, "epoch": 344} {"train_loss": -8.733766555786133, "global_step": 57896, "epoch": 344} {"train_loss": -8.715103149414062, "global_step": 57897, "epoch": 344} {"train_loss": -8.33207893371582, "global_step": 57898, "epoch": 344} {"train_loss": -8.573843002319336, "global_step": 57899, "epoch": 344} {"train_loss": -8.291566848754883, "global_step": 57900, "epoch": 344} {"train_loss": -8.504652976989746, "global_step": 57901, "epoch": 344} {"train_loss": -8.701821327209473, "global_step": 57902, "epoch": 344} {"train_loss": -8.61672306060791, "global_step": 57903, "epoch": 344} {"train_loss": -8.506170272827148, "global_step": 57904, "epoch": 344} {"train_loss": -8.574861526489258, "global_step": 57905, "epoch": 344} {"train_loss": -8.504551887512207, "global_step": 57906, "epoch": 344} {"train_loss": -8.608131408691406, "global_step": 57907, "epoch": 344} {"train_loss": -8.603507041931152, "global_step": 57908, "epoch": 344} {"train_loss": -8.813304901123047, "global_step": 57909, "epoch": 344} {"train_loss": -8.212230682373047, "global_step": 57910, "epoch": 344} {"train_loss": -8.751739501953125, "global_step": 57911, "epoch": 344} {"train_loss": -8.322235107421875, "global_step": 57912, "epoch": 344} {"train_loss": -8.215814590454102, "global_step": 57913, "epoch": 344} {"train_loss": -8.518827438354492, "global_step": 57914, "epoch": 344} {"train_loss": -8.446858406066895, "global_step": 57915, "epoch": 344} {"train_loss": -8.385475158691406, "global_step": 57916, "epoch": 344} {"train_loss": -8.467556953430176, "global_step": 57917, "epoch": 344} {"train_loss": -8.5467529296875, "global_step": 57918, "epoch": 344} {"train_loss": -8.738113403320312, "global_step": 57919, "epoch": 344} {"train_loss": -8.433326721191406, "global_step": 57920, "epoch": 344} {"train_loss": -8.537557601928711, "global_step": 57921, "epoch": 344} {"train_loss": -8.382064819335938, "global_step": 57922, "epoch": 344} {"train_loss": -8.59636116027832, "global_step": 57923, "epoch": 344} {"train_loss": -8.74197769165039, "global_step": 57924, "epoch": 344} {"train_loss": -8.598382949829102, "global_step": 57925, "epoch": 344} {"train_loss": -8.509805679321289, "global_step": 57926, "epoch": 344} {"train_loss": -8.384943008422852, "global_step": 57927, "epoch": 344} {"train_loss": -8.465370178222656, "global_step": 57928, "epoch": 344} {"train_loss": -8.487428665161133, "global_step": 57929, "epoch": 344} {"train_loss": -8.67442512512207, "global_step": 57930, "epoch": 344} {"train_loss": -8.480094909667969, "global_step": 57931, "epoch": 344} {"train_loss": -8.678893089294434, "global_step": 57932, "epoch": 344} {"train_loss": -8.65900993347168, "global_step": 57933, "epoch": 344} {"train_loss": -8.599065780639648, "global_step": 57934, "epoch": 344} {"train_loss": -8.550228118896484, "global_step": 57935, "epoch": 344} {"train_loss": -8.645914077758789, "global_step": 57936, "epoch": 344} {"train_loss": -8.592705726623535, "global_step": 57937, "epoch": 344} {"train_loss": -8.707967758178711, "global_step": 57938, "epoch": 344} {"train_loss": -8.743206977844238, "global_step": 57939, "epoch": 344} {"train_loss": -8.652448654174805, "global_step": 57940, "epoch": 344} {"train_loss": -9.079841613769531, "global_step": 57941, "epoch": 344} {"train_loss": -8.602468490600586, "global_step": 57942, "epoch": 344} {"train_loss": -8.384637832641602, "global_step": 57943, "epoch": 344} {"train_loss": -8.764243125915527, "global_step": 57944, "epoch": 344} {"train_loss": -8.55575942993164, "global_step": 57945, "epoch": 344} {"train_loss": -8.621805191040039, "global_step": 57946, "epoch": 344} {"train_loss": -8.268762588500977, "global_step": 57947, "epoch": 344} {"train_loss": -8.529888153076172, "global_step": 57948, "epoch": 344} {"train_loss": -8.34269905090332, "global_step": 57949, "epoch": 344} {"train_loss": -8.270291328430176, "global_step": 57950, "epoch": 344} {"train_loss": -8.372344970703125, "global_step": 57951, "epoch": 344} {"train_loss": -8.67642593383789, "global_step": 57952, "epoch": 344} {"train_loss": -8.45359992980957, "global_step": 57953, "epoch": 344} {"train_loss": -8.60036563873291, "global_step": 57954, "epoch": 344} {"train_loss": -8.335628509521484, "global_step": 57955, "epoch": 344} {"train_loss": -8.265575408935547, "global_step": 57956, "epoch": 344} {"train_loss": -8.538555145263672, "global_step": 57957, "epoch": 344} {"train_loss": -8.458441734313965, "global_step": 57958, "epoch": 344} {"train_loss": -8.522960645811898, "global_step": 57959, "epoch": 344, "val_loss": 187897.234375} {"train_loss": -8.513191223144531, "global_step": 57960, "epoch": 345} {"train_loss": -8.479825973510742, "global_step": 57961, "epoch": 345} {"train_loss": -8.129083633422852, "global_step": 57962, "epoch": 345} {"train_loss": -8.595233917236328, "global_step": 57963, "epoch": 345} {"train_loss": -8.497081756591797, "global_step": 57964, "epoch": 345} {"train_loss": -8.185907363891602, "global_step": 57965, "epoch": 345} {"train_loss": -8.441084861755371, "global_step": 57966, "epoch": 345} {"train_loss": -8.36213493347168, "global_step": 57967, "epoch": 345} {"train_loss": -8.359420776367188, "global_step": 57968, "epoch": 345} {"train_loss": -8.389208793640137, "global_step": 57969, "epoch": 345} {"train_loss": -8.27618408203125, "global_step": 57970, "epoch": 345} {"train_loss": -8.549674034118652, "global_step": 57971, "epoch": 345} {"train_loss": -8.360219955444336, "global_step": 57972, "epoch": 345} {"train_loss": -8.464127540588379, "global_step": 57973, "epoch": 345} {"train_loss": -8.379579544067383, "global_step": 57974, "epoch": 345} {"train_loss": -8.731916427612305, "global_step": 57975, "epoch": 345} {"train_loss": -8.49580192565918, "global_step": 57976, "epoch": 345} {"train_loss": -8.435323715209961, "global_step": 57977, "epoch": 345} {"train_loss": -8.55061149597168, "global_step": 57978, "epoch": 345} {"train_loss": -8.392794609069824, "global_step": 57979, "epoch": 345} {"train_loss": -8.711923599243164, "global_step": 57980, "epoch": 345} {"train_loss": -8.421638488769531, "global_step": 57981, "epoch": 345} {"train_loss": -8.527620315551758, "global_step": 57982, "epoch": 345} {"train_loss": -8.49140739440918, "global_step": 57983, "epoch": 345} {"train_loss": -8.723054885864258, "global_step": 57984, "epoch": 345} {"train_loss": -8.64120864868164, "global_step": 57985, "epoch": 345} {"train_loss": -8.596880912780762, "global_step": 57986, "epoch": 345} {"train_loss": -8.664176940917969, "global_step": 57987, "epoch": 345} {"train_loss": -8.794389724731445, "global_step": 57988, "epoch": 345} {"train_loss": -8.511292457580566, "global_step": 57989, "epoch": 345} {"train_loss": -8.767087936401367, "global_step": 57990, "epoch": 345} {"train_loss": -8.670605659484863, "global_step": 57991, "epoch": 345} {"train_loss": -8.602614402770996, "global_step": 57992, "epoch": 345} {"train_loss": -8.670905113220215, "global_step": 57993, "epoch": 345} {"train_loss": -8.594532012939453, "global_step": 57994, "epoch": 345} {"train_loss": -8.596273422241211, "global_step": 57995, "epoch": 345} {"train_loss": -8.24749755859375, "global_step": 57996, "epoch": 345} {"train_loss": -8.442039489746094, "global_step": 57997, "epoch": 345} {"train_loss": -8.497140884399414, "global_step": 57998, "epoch": 345} {"train_loss": -8.654714584350586, "global_step": 57999, "epoch": 345} {"train_loss": -8.416406631469727, "global_step": 58000, "epoch": 345} {"train_loss": -8.420395851135254, "global_step": 58001, "epoch": 345} {"train_loss": -8.887419700622559, "global_step": 58002, "epoch": 345} {"train_loss": -8.620260238647461, "global_step": 58003, "epoch": 345} {"train_loss": -8.553236961364746, "global_step": 58004, "epoch": 345} {"train_loss": -8.366209030151367, "global_step": 58005, "epoch": 345} {"train_loss": -8.547076225280762, "global_step": 58006, "epoch": 345} {"train_loss": -8.182822227478027, "global_step": 58007, "epoch": 345} {"train_loss": -8.392350196838379, "global_step": 58008, "epoch": 345} {"train_loss": -8.195083618164062, "global_step": 58009, "epoch": 345} {"train_loss": -8.617952346801758, "global_step": 58010, "epoch": 345} {"train_loss": -8.380630493164062, "global_step": 58011, "epoch": 345} {"train_loss": -8.609443664550781, "global_step": 58012, "epoch": 345} {"train_loss": -8.383096694946289, "global_step": 58013, "epoch": 345} {"train_loss": -8.678194046020508, "global_step": 58014, "epoch": 345} {"train_loss": -8.459491729736328, "global_step": 58015, "epoch": 345} {"train_loss": -8.445499420166016, "global_step": 58016, "epoch": 345} {"train_loss": -8.451336860656738, "global_step": 58017, "epoch": 345} {"train_loss": -8.459741592407227, "global_step": 58018, "epoch": 345} {"train_loss": -8.632976531982422, "global_step": 58019, "epoch": 345} {"train_loss": -8.642979621887207, "global_step": 58020, "epoch": 345} {"train_loss": -8.465025901794434, "global_step": 58021, "epoch": 345} {"train_loss": -8.51629638671875, "global_step": 58022, "epoch": 345} {"train_loss": -8.516277313232422, "global_step": 58023, "epoch": 345} {"train_loss": -8.691327095031738, "global_step": 58024, "epoch": 345} {"train_loss": -8.3659029006958, "global_step": 58025, "epoch": 345} {"train_loss": -8.251435279846191, "global_step": 58026, "epoch": 345} {"train_loss": -8.730328559875488, "global_step": 58027, "epoch": 345} {"train_loss": -8.60545825958252, "global_step": 58028, "epoch": 345} {"train_loss": -8.859062194824219, "global_step": 58029, "epoch": 345} {"train_loss": -8.606593132019043, "global_step": 58030, "epoch": 345} {"train_loss": -8.60222053527832, "global_step": 58031, "epoch": 345} {"train_loss": -8.598548889160156, "global_step": 58032, "epoch": 345} {"train_loss": -8.658584594726562, "global_step": 58033, "epoch": 345} {"train_loss": -8.6320219039917, "global_step": 58034, "epoch": 345} {"train_loss": -8.590191841125488, "global_step": 58035, "epoch": 345} {"train_loss": -8.553816795349121, "global_step": 58036, "epoch": 345} {"train_loss": -8.843011856079102, "global_step": 58037, "epoch": 345} {"train_loss": -8.766578674316406, "global_step": 58038, "epoch": 345} {"train_loss": -8.592787742614746, "global_step": 58039, "epoch": 345} {"train_loss": -8.53761100769043, "global_step": 58040, "epoch": 345} {"train_loss": -8.951892852783203, "global_step": 58041, "epoch": 345} {"train_loss": -8.563432693481445, "global_step": 58042, "epoch": 345} {"train_loss": -8.916898727416992, "global_step": 58043, "epoch": 345} {"train_loss": -8.281635284423828, "global_step": 58044, "epoch": 345} {"train_loss": -8.386795043945312, "global_step": 58045, "epoch": 345} {"train_loss": -8.484439849853516, "global_step": 58046, "epoch": 345} {"train_loss": -8.663946151733398, "global_step": 58047, "epoch": 345} {"train_loss": -8.393266677856445, "global_step": 58048, "epoch": 345} {"train_loss": -8.462390899658203, "global_step": 58049, "epoch": 345} {"train_loss": -8.201738357543945, "global_step": 58050, "epoch": 345} {"train_loss": -8.45154094696045, "global_step": 58051, "epoch": 345} {"train_loss": -8.21749496459961, "global_step": 58052, "epoch": 345} {"train_loss": -8.117971420288086, "global_step": 58053, "epoch": 345} {"train_loss": -8.340700149536133, "global_step": 58054, "epoch": 345} {"train_loss": -8.193613052368164, "global_step": 58055, "epoch": 345} {"train_loss": -8.384714126586914, "global_step": 58056, "epoch": 345} {"train_loss": -8.428712844848633, "global_step": 58057, "epoch": 345} {"train_loss": -8.28575325012207, "global_step": 58058, "epoch": 345} {"train_loss": -8.561149597167969, "global_step": 58059, "epoch": 345} {"train_loss": -8.469698905944824, "global_step": 58060, "epoch": 345} {"train_loss": -8.466049194335938, "global_step": 58061, "epoch": 345} {"train_loss": -8.28600788116455, "global_step": 58062, "epoch": 345} {"train_loss": -8.4652681350708, "global_step": 58063, "epoch": 345} {"train_loss": -8.516561508178711, "global_step": 58064, "epoch": 345} {"train_loss": -8.286750793457031, "global_step": 58065, "epoch": 345} {"train_loss": -8.474557876586914, "global_step": 58066, "epoch": 345} {"train_loss": -8.513561248779297, "global_step": 58067, "epoch": 345} {"train_loss": -8.171834945678711, "global_step": 58068, "epoch": 345} {"train_loss": -8.495596885681152, "global_step": 58069, "epoch": 345} {"train_loss": -8.321237564086914, "global_step": 58070, "epoch": 345} {"train_loss": -8.61322021484375, "global_step": 58071, "epoch": 345} {"train_loss": -8.329681396484375, "global_step": 58072, "epoch": 345} {"train_loss": -8.404613494873047, "global_step": 58073, "epoch": 345} {"train_loss": -8.487641334533691, "global_step": 58074, "epoch": 345} {"train_loss": -8.122848510742188, "global_step": 58075, "epoch": 345} {"train_loss": -8.469598770141602, "global_step": 58076, "epoch": 345} {"train_loss": -8.481696128845215, "global_step": 58077, "epoch": 345} {"train_loss": -8.517457008361816, "global_step": 58078, "epoch": 345} {"train_loss": -8.389554977416992, "global_step": 58079, "epoch": 345} {"train_loss": -8.23189926147461, "global_step": 58080, "epoch": 345} {"train_loss": -8.42007827758789, "global_step": 58081, "epoch": 345} {"train_loss": -8.537525177001953, "global_step": 58082, "epoch": 345} {"train_loss": -8.387007713317871, "global_step": 58083, "epoch": 345} {"train_loss": -8.416350364685059, "global_step": 58084, "epoch": 345} {"train_loss": -8.753849029541016, "global_step": 58085, "epoch": 345} {"train_loss": -8.498720169067383, "global_step": 58086, "epoch": 345} {"train_loss": -8.68522834777832, "global_step": 58087, "epoch": 345} {"train_loss": -8.604301452636719, "global_step": 58088, "epoch": 345} {"train_loss": -8.923742294311523, "global_step": 58089, "epoch": 345} {"train_loss": -8.521135330200195, "global_step": 58090, "epoch": 345} {"train_loss": -8.825055122375488, "global_step": 58091, "epoch": 345} {"train_loss": -8.852195739746094, "global_step": 58092, "epoch": 345} {"train_loss": -8.764904022216797, "global_step": 58093, "epoch": 345} {"train_loss": -8.733552932739258, "global_step": 58094, "epoch": 345} {"train_loss": -8.719551086425781, "global_step": 58095, "epoch": 345} {"train_loss": -8.681726455688477, "global_step": 58096, "epoch": 345} {"train_loss": -8.552810668945312, "global_step": 58097, "epoch": 345} {"train_loss": -8.713127136230469, "global_step": 58098, "epoch": 345} {"train_loss": -8.67719841003418, "global_step": 58099, "epoch": 345} {"train_loss": -8.383092880249023, "global_step": 58100, "epoch": 345} {"train_loss": -8.605705261230469, "global_step": 58101, "epoch": 345} {"train_loss": -8.802658081054688, "global_step": 58102, "epoch": 345} {"train_loss": -8.357483863830566, "global_step": 58103, "epoch": 345} {"train_loss": -8.7689847946167, "global_step": 58104, "epoch": 345} {"train_loss": -8.388689994812012, "global_step": 58105, "epoch": 345} {"train_loss": -8.44731330871582, "global_step": 58106, "epoch": 345} {"train_loss": -8.56257438659668, "global_step": 58107, "epoch": 345} {"train_loss": -8.48189926147461, "global_step": 58108, "epoch": 345} {"train_loss": -8.590391159057617, "global_step": 58109, "epoch": 345} {"train_loss": -8.30068302154541, "global_step": 58110, "epoch": 345} {"train_loss": -8.582059860229492, "global_step": 58111, "epoch": 345} {"train_loss": -8.179872512817383, "global_step": 58112, "epoch": 345} {"train_loss": -8.56480598449707, "global_step": 58113, "epoch": 345} {"train_loss": -8.246185302734375, "global_step": 58114, "epoch": 345} {"train_loss": -8.585640907287598, "global_step": 58115, "epoch": 345} {"train_loss": -8.432884216308594, "global_step": 58116, "epoch": 345} {"train_loss": -8.631326675415039, "global_step": 58117, "epoch": 345} {"train_loss": -8.453575134277344, "global_step": 58118, "epoch": 345} {"train_loss": -8.74474048614502, "global_step": 58119, "epoch": 345} {"train_loss": -8.365192413330078, "global_step": 58120, "epoch": 345} {"train_loss": -8.575105667114258, "global_step": 58121, "epoch": 345} {"train_loss": -8.52247142791748, "global_step": 58122, "epoch": 345} {"train_loss": -8.664859771728516, "global_step": 58123, "epoch": 345} {"train_loss": -8.455961227416992, "global_step": 58124, "epoch": 345} {"train_loss": -8.604280471801758, "global_step": 58125, "epoch": 345} {"train_loss": -8.598745346069336, "global_step": 58126, "epoch": 345} {"train_loss": -8.513344089190165, "global_step": 58127, "epoch": 345, "val_loss": 189356.34375, "train_action_mse_error": 7.012522220611572} {"train_loss": -8.602216720581055, "global_step": 58128, "epoch": 346} {"train_loss": -8.340473175048828, "global_step": 58129, "epoch": 346} {"train_loss": -8.693561553955078, "global_step": 58130, "epoch": 346} {"train_loss": -7.935810089111328, "global_step": 58131, "epoch": 346} {"train_loss": -8.482462882995605, "global_step": 58132, "epoch": 346} {"train_loss": -8.351336479187012, "global_step": 58133, "epoch": 346} {"train_loss": -8.567651748657227, "global_step": 58134, "epoch": 346} {"train_loss": -8.558236122131348, "global_step": 58135, "epoch": 346} {"train_loss": -8.376679420471191, "global_step": 58136, "epoch": 346} {"train_loss": -8.569173812866211, "global_step": 58137, "epoch": 346} {"train_loss": -8.555404663085938, "global_step": 58138, "epoch": 346} {"train_loss": -8.486928939819336, "global_step": 58139, "epoch": 346} {"train_loss": -8.794474601745605, "global_step": 58140, "epoch": 346} {"train_loss": -8.785505294799805, "global_step": 58141, "epoch": 346} {"train_loss": -8.5699462890625, "global_step": 58142, "epoch": 346} {"train_loss": -8.639405250549316, "global_step": 58143, "epoch": 346} {"train_loss": -8.504243850708008, "global_step": 58144, "epoch": 346} {"train_loss": -8.339550018310547, "global_step": 58145, "epoch": 346} {"train_loss": -8.468265533447266, "global_step": 58146, "epoch": 346} {"train_loss": -8.673473358154297, "global_step": 58147, "epoch": 346} {"train_loss": -8.518011093139648, "global_step": 58148, "epoch": 346} {"train_loss": -8.548585891723633, "global_step": 58149, "epoch": 346} {"train_loss": -8.432226181030273, "global_step": 58150, "epoch": 346} {"train_loss": -8.4562406539917, "global_step": 58151, "epoch": 346} {"train_loss": -8.363319396972656, "global_step": 58152, "epoch": 346} {"train_loss": -8.696695327758789, "global_step": 58153, "epoch": 346} {"train_loss": -8.318546295166016, "global_step": 58154, "epoch": 346} {"train_loss": -8.361682891845703, "global_step": 58155, "epoch": 346} {"train_loss": -8.564924240112305, "global_step": 58156, "epoch": 346} {"train_loss": -8.009552955627441, "global_step": 58157, "epoch": 346} {"train_loss": -8.530780792236328, "global_step": 58158, "epoch": 346} {"train_loss": -8.418722152709961, "global_step": 58159, "epoch": 346} {"train_loss": -8.474626541137695, "global_step": 58160, "epoch": 346} {"train_loss": -8.069936752319336, "global_step": 58161, "epoch": 346} {"train_loss": -8.44967269897461, "global_step": 58162, "epoch": 346} {"train_loss": -8.215778350830078, "global_step": 58163, "epoch": 346} {"train_loss": -8.26258659362793, "global_step": 58164, "epoch": 346} {"train_loss": -7.898947238922119, "global_step": 58165, "epoch": 346} {"train_loss": -8.129449844360352, "global_step": 58166, "epoch": 346} {"train_loss": -8.212932586669922, "global_step": 58167, "epoch": 346} {"train_loss": -8.23080062866211, "global_step": 58168, "epoch": 346} {"train_loss": -8.320404052734375, "global_step": 58169, "epoch": 346} {"train_loss": -8.32419204711914, "global_step": 58170, "epoch": 346} {"train_loss": -8.425985336303711, "global_step": 58171, "epoch": 346} {"train_loss": -8.373495101928711, "global_step": 58172, "epoch": 346} {"train_loss": -8.369997024536133, "global_step": 58173, "epoch": 346} {"train_loss": -8.377862930297852, "global_step": 58174, "epoch": 346} {"train_loss": -8.563653945922852, "global_step": 58175, "epoch": 346} {"train_loss": -8.537513732910156, "global_step": 58176, "epoch": 346} {"train_loss": -8.482934951782227, "global_step": 58177, "epoch": 346} {"train_loss": -8.420507431030273, "global_step": 58178, "epoch": 346} {"train_loss": -8.643034934997559, "global_step": 58179, "epoch": 346} {"train_loss": -8.531946182250977, "global_step": 58180, "epoch": 346} {"train_loss": -8.429643630981445, "global_step": 58181, "epoch": 346} {"train_loss": -8.440414428710938, "global_step": 58182, "epoch": 346} {"train_loss": -8.61270523071289, "global_step": 58183, "epoch": 346} {"train_loss": -8.50526237487793, "global_step": 58184, "epoch": 346} {"train_loss": -8.552485466003418, "global_step": 58185, "epoch": 346} {"train_loss": -8.539314270019531, "global_step": 58186, "epoch": 346} {"train_loss": -8.280533790588379, "global_step": 58187, "epoch": 346} {"train_loss": -8.548763275146484, "global_step": 58188, "epoch": 346} {"train_loss": -8.579105377197266, "global_step": 58189, "epoch": 346} {"train_loss": -8.382556915283203, "global_step": 58190, "epoch": 346} {"train_loss": -8.54568862915039, "global_step": 58191, "epoch": 346} {"train_loss": -8.724342346191406, "global_step": 58192, "epoch": 346} {"train_loss": -8.788277626037598, "global_step": 58193, "epoch": 346} {"train_loss": -8.503570556640625, "global_step": 58194, "epoch": 346} {"train_loss": -8.528645515441895, "global_step": 58195, "epoch": 346} {"train_loss": -8.671226501464844, "global_step": 58196, "epoch": 346} {"train_loss": -8.855217933654785, "global_step": 58197, "epoch": 346} {"train_loss": -8.763623237609863, "global_step": 58198, "epoch": 346} {"train_loss": -8.493844032287598, "global_step": 58199, "epoch": 346} {"train_loss": -8.864126205444336, "global_step": 58200, "epoch": 346} {"train_loss": -8.684816360473633, "global_step": 58201, "epoch": 346} {"train_loss": -8.727755546569824, "global_step": 58202, "epoch": 346} {"train_loss": -8.840353965759277, "global_step": 58203, "epoch": 346} {"train_loss": -8.713383674621582, "global_step": 58204, "epoch": 346} {"train_loss": -8.961402893066406, "global_step": 58205, "epoch": 346} {"train_loss": -8.62945556640625, "global_step": 58206, "epoch": 346} {"train_loss": -8.909968376159668, "global_step": 58207, "epoch": 346} {"train_loss": -8.780317306518555, "global_step": 58208, "epoch": 346} {"train_loss": -8.528578758239746, "global_step": 58209, "epoch": 346} {"train_loss": -8.764681816101074, "global_step": 58210, "epoch": 346} {"train_loss": -8.580301284790039, "global_step": 58211, "epoch": 346} {"train_loss": -8.556028366088867, "global_step": 58212, "epoch": 346} {"train_loss": -8.59597396850586, "global_step": 58213, "epoch": 346} {"train_loss": -8.86568832397461, "global_step": 58214, "epoch": 346} {"train_loss": -8.594175338745117, "global_step": 58215, "epoch": 346} {"train_loss": -8.349197387695312, "global_step": 58216, "epoch": 346} {"train_loss": -8.74606704711914, "global_step": 58217, "epoch": 346} {"train_loss": -8.285844802856445, "global_step": 58218, "epoch": 346} {"train_loss": -8.609525680541992, "global_step": 58219, "epoch": 346} {"train_loss": -8.278228759765625, "global_step": 58220, "epoch": 346} {"train_loss": -8.687429428100586, "global_step": 58221, "epoch": 346} {"train_loss": -8.48092269897461, "global_step": 58222, "epoch": 346} {"train_loss": -8.549925804138184, "global_step": 58223, "epoch": 346} {"train_loss": -8.699310302734375, "global_step": 58224, "epoch": 346} {"train_loss": -8.675355911254883, "global_step": 58225, "epoch": 346} {"train_loss": -8.690641403198242, "global_step": 58226, "epoch": 346} {"train_loss": -8.567835807800293, "global_step": 58227, "epoch": 346} {"train_loss": -8.17473030090332, "global_step": 58228, "epoch": 346} {"train_loss": -8.56009578704834, "global_step": 58229, "epoch": 346} {"train_loss": -8.41534423828125, "global_step": 58230, "epoch": 346} {"train_loss": -8.715045928955078, "global_step": 58231, "epoch": 346} {"train_loss": -8.571249008178711, "global_step": 58232, "epoch": 346} {"train_loss": -8.196229934692383, "global_step": 58233, "epoch": 346} {"train_loss": -8.595985412597656, "global_step": 58234, "epoch": 346} {"train_loss": -8.445228576660156, "global_step": 58235, "epoch": 346} {"train_loss": -8.360017776489258, "global_step": 58236, "epoch": 346} {"train_loss": -8.471683502197266, "global_step": 58237, "epoch": 346} {"train_loss": -8.318124771118164, "global_step": 58238, "epoch": 346} {"train_loss": -8.32503604888916, "global_step": 58239, "epoch": 346} {"train_loss": -8.341068267822266, "global_step": 58240, "epoch": 346} {"train_loss": -8.161820411682129, "global_step": 58241, "epoch": 346} {"train_loss": -8.2852783203125, "global_step": 58242, "epoch": 346} {"train_loss": -8.337272644042969, "global_step": 58243, "epoch": 346} {"train_loss": -8.306915283203125, "global_step": 58244, "epoch": 346} {"train_loss": -8.269645690917969, "global_step": 58245, "epoch": 346} {"train_loss": -8.283210754394531, "global_step": 58246, "epoch": 346} {"train_loss": -8.368829727172852, "global_step": 58247, "epoch": 346} {"train_loss": -8.258816719055176, "global_step": 58248, "epoch": 346} {"train_loss": -8.407953262329102, "global_step": 58249, "epoch": 346} {"train_loss": -8.370366096496582, "global_step": 58250, "epoch": 346} {"train_loss": -8.378658294677734, "global_step": 58251, "epoch": 346} {"train_loss": -8.475041389465332, "global_step": 58252, "epoch": 346} {"train_loss": -8.541691780090332, "global_step": 58253, "epoch": 346} {"train_loss": -8.445894241333008, "global_step": 58254, "epoch": 346} {"train_loss": -8.685985565185547, "global_step": 58255, "epoch": 346} {"train_loss": -8.598140716552734, "global_step": 58256, "epoch": 346} {"train_loss": -8.590721130371094, "global_step": 58257, "epoch": 346} {"train_loss": -8.548404693603516, "global_step": 58258, "epoch": 346} {"train_loss": -8.560171127319336, "global_step": 58259, "epoch": 346} {"train_loss": -8.74409294128418, "global_step": 58260, "epoch": 346} {"train_loss": -8.331384658813477, "global_step": 58261, "epoch": 346} {"train_loss": -8.791594505310059, "global_step": 58262, "epoch": 346} {"train_loss": -8.604660987854004, "global_step": 58263, "epoch": 346} {"train_loss": -8.697540283203125, "global_step": 58264, "epoch": 346} {"train_loss": -8.590679168701172, "global_step": 58265, "epoch": 346} {"train_loss": -8.717772483825684, "global_step": 58266, "epoch": 346} {"train_loss": -8.545124053955078, "global_step": 58267, "epoch": 346} {"train_loss": -8.475175857543945, "global_step": 58268, "epoch": 346} {"train_loss": -8.254011154174805, "global_step": 58269, "epoch": 346} {"train_loss": -8.977957725524902, "global_step": 58270, "epoch": 346} {"train_loss": -8.587479591369629, "global_step": 58271, "epoch": 346} {"train_loss": -8.72390079498291, "global_step": 58272, "epoch": 346} {"train_loss": -8.821072578430176, "global_step": 58273, "epoch": 346} {"train_loss": -8.743440628051758, "global_step": 58274, "epoch": 346} {"train_loss": -8.752857208251953, "global_step": 58275, "epoch": 346} {"train_loss": -8.638391494750977, "global_step": 58276, "epoch": 346} {"train_loss": -8.662433624267578, "global_step": 58277, "epoch": 346} {"train_loss": -8.556339263916016, "global_step": 58278, "epoch": 346} {"train_loss": -8.705402374267578, "global_step": 58279, "epoch": 346} {"train_loss": -8.83230972290039, "global_step": 58280, "epoch": 346} {"train_loss": -8.77448844909668, "global_step": 58281, "epoch": 346} {"train_loss": -8.527231216430664, "global_step": 58282, "epoch": 346} {"train_loss": -8.888763427734375, "global_step": 58283, "epoch": 346} {"train_loss": -8.730972290039062, "global_step": 58284, "epoch": 346} {"train_loss": -8.8164644241333, "global_step": 58285, "epoch": 346} {"train_loss": -8.628097534179688, "global_step": 58286, "epoch": 346} {"train_loss": -8.50059700012207, "global_step": 58287, "epoch": 346} {"train_loss": -8.663384437561035, "global_step": 58288, "epoch": 346} {"train_loss": -8.834646224975586, "global_step": 58289, "epoch": 346} {"train_loss": -8.618213653564453, "global_step": 58290, "epoch": 346} {"train_loss": -8.743289947509766, "global_step": 58291, "epoch": 346} {"train_loss": -8.586456298828125, "global_step": 58292, "epoch": 346} {"train_loss": -8.676130294799805, "global_step": 58293, "epoch": 346} {"train_loss": -8.6563138961792, "global_step": 58294, "epoch": 346} {"train_loss": -8.531429838566552, "global_step": 58295, "epoch": 346, "val_loss": 189223.1875} {"train_loss": -8.712461471557617, "global_step": 58296, "epoch": 347} {"train_loss": -8.603108406066895, "global_step": 58297, "epoch": 347} {"train_loss": -8.729989051818848, "global_step": 58298, "epoch": 347} {"train_loss": -8.730701446533203, "global_step": 58299, "epoch": 347} {"train_loss": -8.328869819641113, "global_step": 58300, "epoch": 347} {"train_loss": -8.711400032043457, "global_step": 58301, "epoch": 347} {"train_loss": -8.665501594543457, "global_step": 58302, "epoch": 347} {"train_loss": -8.270313262939453, "global_step": 58303, "epoch": 347} {"train_loss": -8.57435131072998, "global_step": 58304, "epoch": 347} {"train_loss": -8.649553298950195, "global_step": 58305, "epoch": 347} {"train_loss": -8.74310302734375, "global_step": 58306, "epoch": 347} {"train_loss": -8.501014709472656, "global_step": 58307, "epoch": 347} {"train_loss": -8.570255279541016, "global_step": 58308, "epoch": 347} {"train_loss": -8.516292572021484, "global_step": 58309, "epoch": 347} {"train_loss": -8.635659217834473, "global_step": 58310, "epoch": 347} {"train_loss": -8.52115535736084, "global_step": 58311, "epoch": 347} {"train_loss": -8.49146556854248, "global_step": 58312, "epoch": 347} {"train_loss": -8.178857803344727, "global_step": 58313, "epoch": 347} {"train_loss": -8.587949752807617, "global_step": 58314, "epoch": 347} {"train_loss": -8.355104446411133, "global_step": 58315, "epoch": 347} {"train_loss": -8.380308151245117, "global_step": 58316, "epoch": 347} {"train_loss": -8.728462219238281, "global_step": 58317, "epoch": 347} {"train_loss": -8.635246276855469, "global_step": 58318, "epoch": 347} {"train_loss": -8.647245407104492, "global_step": 58319, "epoch": 347} {"train_loss": -8.688993453979492, "global_step": 58320, "epoch": 347} {"train_loss": -8.499134063720703, "global_step": 58321, "epoch": 347} {"train_loss": -8.325292587280273, "global_step": 58322, "epoch": 347} {"train_loss": -8.595906257629395, "global_step": 58323, "epoch": 347} {"train_loss": -8.554323196411133, "global_step": 58324, "epoch": 347} {"train_loss": -8.385501861572266, "global_step": 58325, "epoch": 347} {"train_loss": -8.617898941040039, "global_step": 58326, "epoch": 347} {"train_loss": -8.521576881408691, "global_step": 58327, "epoch": 347} {"train_loss": -8.600141525268555, "global_step": 58328, "epoch": 347} {"train_loss": -8.481675148010254, "global_step": 58329, "epoch": 347} {"train_loss": -8.603492736816406, "global_step": 58330, "epoch": 347} {"train_loss": -8.732339859008789, "global_step": 58331, "epoch": 347} {"train_loss": -8.509967803955078, "global_step": 58332, "epoch": 347} {"train_loss": -8.59965991973877, "global_step": 58333, "epoch": 347} {"train_loss": -8.346918106079102, "global_step": 58334, "epoch": 347} {"train_loss": -8.87417221069336, "global_step": 58335, "epoch": 347} {"train_loss": -8.46045207977295, "global_step": 58336, "epoch": 347} {"train_loss": -8.537759780883789, "global_step": 58337, "epoch": 347} {"train_loss": -8.419431686401367, "global_step": 58338, "epoch": 347} {"train_loss": -8.471467018127441, "global_step": 58339, "epoch": 347} {"train_loss": -8.092117309570312, "global_step": 58340, "epoch": 347} {"train_loss": -8.613380432128906, "global_step": 58341, "epoch": 347} {"train_loss": -8.386733055114746, "global_step": 58342, "epoch": 347} {"train_loss": -8.622600555419922, "global_step": 58343, "epoch": 347} {"train_loss": -8.39742660522461, "global_step": 58344, "epoch": 347} {"train_loss": -8.6009521484375, "global_step": 58345, "epoch": 347} {"train_loss": -8.513729095458984, "global_step": 58346, "epoch": 347} {"train_loss": -8.215288162231445, "global_step": 58347, "epoch": 347} {"train_loss": -8.589692115783691, "global_step": 58348, "epoch": 347} {"train_loss": -8.346158981323242, "global_step": 58349, "epoch": 347} {"train_loss": -8.337355613708496, "global_step": 58350, "epoch": 347} {"train_loss": -8.614879608154297, "global_step": 58351, "epoch": 347} {"train_loss": -8.517007827758789, "global_step": 58352, "epoch": 347} {"train_loss": -8.323127746582031, "global_step": 58353, "epoch": 347} {"train_loss": -8.50874137878418, "global_step": 58354, "epoch": 347} {"train_loss": -8.6270751953125, "global_step": 58355, "epoch": 347} {"train_loss": -8.307947158813477, "global_step": 58356, "epoch": 347} {"train_loss": -8.572059631347656, "global_step": 58357, "epoch": 347} {"train_loss": -8.323386192321777, "global_step": 58358, "epoch": 347} {"train_loss": -8.510181427001953, "global_step": 58359, "epoch": 347} {"train_loss": -8.581523895263672, "global_step": 58360, "epoch": 347} {"train_loss": -8.557978630065918, "global_step": 58361, "epoch": 347} {"train_loss": -8.584577560424805, "global_step": 58362, "epoch": 347} {"train_loss": -8.517484664916992, "global_step": 58363, "epoch": 347} {"train_loss": -8.673070907592773, "global_step": 58364, "epoch": 347} {"train_loss": -8.706084251403809, "global_step": 58365, "epoch": 347} {"train_loss": -8.701790809631348, "global_step": 58366, "epoch": 347} {"train_loss": -8.346911430358887, "global_step": 58367, "epoch": 347} {"train_loss": -8.633825302124023, "global_step": 58368, "epoch": 347} {"train_loss": -8.464813232421875, "global_step": 58369, "epoch": 347} {"train_loss": -8.856343269348145, "global_step": 58370, "epoch": 347} {"train_loss": -8.77452278137207, "global_step": 58371, "epoch": 347} {"train_loss": -8.74168586730957, "global_step": 58372, "epoch": 347} {"train_loss": -8.498703002929688, "global_step": 58373, "epoch": 347} {"train_loss": -8.217178344726562, "global_step": 58374, "epoch": 347} {"train_loss": -8.44140911102295, "global_step": 58375, "epoch": 347} {"train_loss": -8.288311004638672, "global_step": 58376, "epoch": 347} {"train_loss": -8.509430885314941, "global_step": 58377, "epoch": 347} {"train_loss": -8.318450927734375, "global_step": 58378, "epoch": 347} {"train_loss": -8.399923324584961, "global_step": 58379, "epoch": 347} {"train_loss": -8.351417541503906, "global_step": 58380, "epoch": 347} {"train_loss": -8.461014747619629, "global_step": 58381, "epoch": 347} {"train_loss": -8.619561195373535, "global_step": 58382, "epoch": 347} {"train_loss": -8.818222999572754, "global_step": 58383, "epoch": 347} {"train_loss": -8.530391693115234, "global_step": 58384, "epoch": 347} {"train_loss": -8.418509483337402, "global_step": 58385, "epoch": 347} {"train_loss": -8.507736206054688, "global_step": 58386, "epoch": 347} {"train_loss": -8.210738182067871, "global_step": 58387, "epoch": 347} {"train_loss": -8.574514389038086, "global_step": 58388, "epoch": 347} {"train_loss": -8.40286922454834, "global_step": 58389, "epoch": 347} {"train_loss": -8.434276580810547, "global_step": 58390, "epoch": 347} {"train_loss": -8.663654327392578, "global_step": 58391, "epoch": 347} {"train_loss": -8.510526657104492, "global_step": 58392, "epoch": 347} {"train_loss": -8.744565963745117, "global_step": 58393, "epoch": 347} {"train_loss": -8.730500221252441, "global_step": 58394, "epoch": 347} {"train_loss": -8.71502685546875, "global_step": 58395, "epoch": 347} {"train_loss": -8.586770057678223, "global_step": 58396, "epoch": 347} {"train_loss": -8.61928939819336, "global_step": 58397, "epoch": 347} {"train_loss": -8.577875137329102, "global_step": 58398, "epoch": 347} {"train_loss": -8.66107177734375, "global_step": 58399, "epoch": 347} {"train_loss": -8.804269790649414, "global_step": 58400, "epoch": 347} {"train_loss": -8.659514427185059, "global_step": 58401, "epoch": 347} {"train_loss": -8.82565975189209, "global_step": 58402, "epoch": 347} {"train_loss": -8.766960144042969, "global_step": 58403, "epoch": 347} {"train_loss": -8.61227798461914, "global_step": 58404, "epoch": 347} {"train_loss": -8.844600677490234, "global_step": 58405, "epoch": 347} {"train_loss": -8.587034225463867, "global_step": 58406, "epoch": 347} {"train_loss": -8.777713775634766, "global_step": 58407, "epoch": 347} {"train_loss": -8.54509162902832, "global_step": 58408, "epoch": 347} {"train_loss": -8.541304588317871, "global_step": 58409, "epoch": 347} {"train_loss": -8.76803970336914, "global_step": 58410, "epoch": 347} {"train_loss": -8.811164855957031, "global_step": 58411, "epoch": 347} {"train_loss": -8.776057243347168, "global_step": 58412, "epoch": 347} {"train_loss": -8.800752639770508, "global_step": 58413, "epoch": 347} {"train_loss": -8.724308967590332, "global_step": 58414, "epoch": 347} {"train_loss": -8.602869033813477, "global_step": 58415, "epoch": 347} {"train_loss": -8.692269325256348, "global_step": 58416, "epoch": 347} {"train_loss": -8.542089462280273, "global_step": 58417, "epoch": 347} {"train_loss": -8.563663482666016, "global_step": 58418, "epoch": 347} {"train_loss": -8.852168083190918, "global_step": 58419, "epoch": 347} {"train_loss": -8.168127059936523, "global_step": 58420, "epoch": 347} {"train_loss": -8.576894760131836, "global_step": 58421, "epoch": 347} {"train_loss": -8.40683650970459, "global_step": 58422, "epoch": 347} {"train_loss": -8.730512619018555, "global_step": 58423, "epoch": 347} {"train_loss": -8.724846839904785, "global_step": 58424, "epoch": 347} {"train_loss": -8.331680297851562, "global_step": 58425, "epoch": 347} {"train_loss": -8.702613830566406, "global_step": 58426, "epoch": 347} {"train_loss": -8.567477226257324, "global_step": 58427, "epoch": 347} {"train_loss": -8.67935562133789, "global_step": 58428, "epoch": 347} {"train_loss": -8.635560035705566, "global_step": 58429, "epoch": 347} {"train_loss": -8.630640029907227, "global_step": 58430, "epoch": 347} {"train_loss": -8.432220458984375, "global_step": 58431, "epoch": 347} {"train_loss": -8.436895370483398, "global_step": 58432, "epoch": 347} {"train_loss": -8.60246467590332, "global_step": 58433, "epoch": 347} {"train_loss": -8.712395668029785, "global_step": 58434, "epoch": 347} {"train_loss": -8.560851097106934, "global_step": 58435, "epoch": 347} {"train_loss": -8.392656326293945, "global_step": 58436, "epoch": 347} {"train_loss": -8.74448013305664, "global_step": 58437, "epoch": 347} {"train_loss": -8.706171035766602, "global_step": 58438, "epoch": 347} {"train_loss": -8.595420837402344, "global_step": 58439, "epoch": 347} {"train_loss": -8.651566505432129, "global_step": 58440, "epoch": 347} {"train_loss": -8.629158020019531, "global_step": 58441, "epoch": 347} {"train_loss": -8.717620849609375, "global_step": 58442, "epoch": 347} {"train_loss": -8.656953811645508, "global_step": 58443, "epoch": 347} {"train_loss": -8.187585830688477, "global_step": 58444, "epoch": 347} {"train_loss": -8.568665504455566, "global_step": 58445, "epoch": 347} {"train_loss": -8.376640319824219, "global_step": 58446, "epoch": 347} {"train_loss": -8.111745834350586, "global_step": 58447, "epoch": 347} {"train_loss": -8.218679428100586, "global_step": 58448, "epoch": 347} {"train_loss": -8.354723930358887, "global_step": 58449, "epoch": 347} {"train_loss": -8.518803596496582, "global_step": 58450, "epoch": 347} {"train_loss": -8.218631744384766, "global_step": 58451, "epoch": 347} {"train_loss": -8.524348258972168, "global_step": 58452, "epoch": 347} {"train_loss": -8.062043190002441, "global_step": 58453, "epoch": 347} {"train_loss": -8.132099151611328, "global_step": 58454, "epoch": 347} {"train_loss": -8.181159019470215, "global_step": 58455, "epoch": 347} {"train_loss": -8.265974998474121, "global_step": 58456, "epoch": 347} {"train_loss": -8.62671947479248, "global_step": 58457, "epoch": 347} {"train_loss": -8.34160041809082, "global_step": 58458, "epoch": 347} {"train_loss": -8.238662719726562, "global_step": 58459, "epoch": 347} {"train_loss": -8.415884971618652, "global_step": 58460, "epoch": 347} {"train_loss": -8.384590148925781, "global_step": 58461, "epoch": 347} {"train_loss": -8.369365692138672, "global_step": 58462, "epoch": 347} {"train_loss": -8.535071208363487, "global_step": 58463, "epoch": 347, "val_loss": 190688.5625} {"train_loss": -8.47476863861084, "global_step": 58464, "epoch": 348} {"train_loss": -8.197855949401855, "global_step": 58465, "epoch": 348} {"train_loss": -8.727935791015625, "global_step": 58466, "epoch": 348} {"train_loss": -8.593338012695312, "global_step": 58467, "epoch": 348} {"train_loss": -8.589166641235352, "global_step": 58468, "epoch": 348} {"train_loss": -8.499372482299805, "global_step": 58469, "epoch": 348} {"train_loss": -8.408259391784668, "global_step": 58470, "epoch": 348} {"train_loss": -8.523852348327637, "global_step": 58471, "epoch": 348} {"train_loss": -8.505294799804688, "global_step": 58472, "epoch": 348} {"train_loss": -8.66420841217041, "global_step": 58473, "epoch": 348} {"train_loss": -8.624496459960938, "global_step": 58474, "epoch": 348} {"train_loss": -8.48178482055664, "global_step": 58475, "epoch": 348} {"train_loss": -8.314361572265625, "global_step": 58476, "epoch": 348} {"train_loss": -8.896053314208984, "global_step": 58477, "epoch": 348} {"train_loss": -8.76563549041748, "global_step": 58478, "epoch": 348} {"train_loss": -8.688970565795898, "global_step": 58479, "epoch": 348} {"train_loss": -8.50193977355957, "global_step": 58480, "epoch": 348} {"train_loss": -8.647876739501953, "global_step": 58481, "epoch": 348} {"train_loss": -8.50253677368164, "global_step": 58482, "epoch": 348} {"train_loss": -8.365082740783691, "global_step": 58483, "epoch": 348} {"train_loss": -8.347489356994629, "global_step": 58484, "epoch": 348} {"train_loss": -8.549342155456543, "global_step": 58485, "epoch": 348} {"train_loss": -8.637767791748047, "global_step": 58486, "epoch": 348} {"train_loss": -8.179795265197754, "global_step": 58487, "epoch": 348} {"train_loss": -8.484140396118164, "global_step": 58488, "epoch": 348} {"train_loss": -8.687013626098633, "global_step": 58489, "epoch": 348} {"train_loss": -8.318273544311523, "global_step": 58490, "epoch": 348} {"train_loss": -8.503750801086426, "global_step": 58491, "epoch": 348} {"train_loss": -8.59964370727539, "global_step": 58492, "epoch": 348} {"train_loss": -8.463916778564453, "global_step": 58493, "epoch": 348} {"train_loss": -8.493422508239746, "global_step": 58494, "epoch": 348} {"train_loss": -8.557998657226562, "global_step": 58495, "epoch": 348} {"train_loss": -8.839147567749023, "global_step": 58496, "epoch": 348} {"train_loss": -8.567779541015625, "global_step": 58497, "epoch": 348} {"train_loss": -8.597485542297363, "global_step": 58498, "epoch": 348} {"train_loss": -8.566987991333008, "global_step": 58499, "epoch": 348} {"train_loss": -8.310373306274414, "global_step": 58500, "epoch": 348} {"train_loss": -8.704181671142578, "global_step": 58501, "epoch": 348} {"train_loss": -8.38129997253418, "global_step": 58502, "epoch": 348} {"train_loss": -8.41773796081543, "global_step": 58503, "epoch": 348} {"train_loss": -8.491698265075684, "global_step": 58504, "epoch": 348} {"train_loss": -8.785740852355957, "global_step": 58505, "epoch": 348} {"train_loss": -8.377180099487305, "global_step": 58506, "epoch": 348} {"train_loss": -8.612649917602539, "global_step": 58507, "epoch": 348} {"train_loss": -8.548234939575195, "global_step": 58508, "epoch": 348} {"train_loss": -8.480310440063477, "global_step": 58509, "epoch": 348} {"train_loss": -8.56735610961914, "global_step": 58510, "epoch": 348} {"train_loss": -8.710517883300781, "global_step": 58511, "epoch": 348} {"train_loss": -8.552509307861328, "global_step": 58512, "epoch": 348} {"train_loss": -8.605932235717773, "global_step": 58513, "epoch": 348} {"train_loss": -8.772662162780762, "global_step": 58514, "epoch": 348} {"train_loss": -8.403566360473633, "global_step": 58515, "epoch": 348} {"train_loss": -8.522361755371094, "global_step": 58516, "epoch": 348} {"train_loss": -8.632262229919434, "global_step": 58517, "epoch": 348} {"train_loss": -8.364542007446289, "global_step": 58518, "epoch": 348} {"train_loss": -8.298624038696289, "global_step": 58519, "epoch": 348} {"train_loss": -8.677567481994629, "global_step": 58520, "epoch": 348} {"train_loss": -8.625173568725586, "global_step": 58521, "epoch": 348} {"train_loss": -8.470514297485352, "global_step": 58522, "epoch": 348} {"train_loss": -8.895545959472656, "global_step": 58523, "epoch": 348} {"train_loss": -8.606611251831055, "global_step": 58524, "epoch": 348} {"train_loss": -8.568414688110352, "global_step": 58525, "epoch": 348} {"train_loss": -8.424623489379883, "global_step": 58526, "epoch": 348} {"train_loss": -8.471056938171387, "global_step": 58527, "epoch": 348} {"train_loss": -8.394536018371582, "global_step": 58528, "epoch": 348} {"train_loss": -8.599198341369629, "global_step": 58529, "epoch": 348} {"train_loss": -8.539722442626953, "global_step": 58530, "epoch": 348} {"train_loss": -8.619479179382324, "global_step": 58531, "epoch": 348} {"train_loss": -8.625642776489258, "global_step": 58532, "epoch": 348} {"train_loss": -8.68826675415039, "global_step": 58533, "epoch": 348} {"train_loss": -8.442858695983887, "global_step": 58534, "epoch": 348} {"train_loss": -8.501718521118164, "global_step": 58535, "epoch": 348} {"train_loss": -8.454254150390625, "global_step": 58536, "epoch": 348} {"train_loss": -8.424732208251953, "global_step": 58537, "epoch": 348} {"train_loss": -8.739068031311035, "global_step": 58538, "epoch": 348} {"train_loss": -8.65658187866211, "global_step": 58539, "epoch": 348} {"train_loss": -8.637361526489258, "global_step": 58540, "epoch": 348} {"train_loss": -8.662431716918945, "global_step": 58541, "epoch": 348} {"train_loss": -8.760002136230469, "global_step": 58542, "epoch": 348} {"train_loss": -8.819602966308594, "global_step": 58543, "epoch": 348} {"train_loss": -8.946237564086914, "global_step": 58544, "epoch": 348} {"train_loss": -8.484243392944336, "global_step": 58545, "epoch": 348} {"train_loss": -8.980960845947266, "global_step": 58546, "epoch": 348} {"train_loss": -8.699180603027344, "global_step": 58547, "epoch": 348} {"train_loss": -8.597002029418945, "global_step": 58548, "epoch": 348} {"train_loss": -8.727069854736328, "global_step": 58549, "epoch": 348} {"train_loss": -8.57404899597168, "global_step": 58550, "epoch": 348} {"train_loss": -8.780197143554688, "global_step": 58551, "epoch": 348} {"train_loss": -8.803400993347168, "global_step": 58552, "epoch": 348} {"train_loss": -8.714542388916016, "global_step": 58553, "epoch": 348} {"train_loss": -8.667291641235352, "global_step": 58554, "epoch": 348} {"train_loss": -8.636886596679688, "global_step": 58555, "epoch": 348} {"train_loss": -8.449651718139648, "global_step": 58556, "epoch": 348} {"train_loss": -8.863290786743164, "global_step": 58557, "epoch": 348} {"train_loss": -8.471745491027832, "global_step": 58558, "epoch": 348} {"train_loss": -8.815742492675781, "global_step": 58559, "epoch": 348} {"train_loss": -8.719643592834473, "global_step": 58560, "epoch": 348} {"train_loss": -8.746095657348633, "global_step": 58561, "epoch": 348} {"train_loss": -8.66064167022705, "global_step": 58562, "epoch": 348} {"train_loss": -8.746330261230469, "global_step": 58563, "epoch": 348} {"train_loss": -8.581884384155273, "global_step": 58564, "epoch": 348} {"train_loss": -8.4395751953125, "global_step": 58565, "epoch": 348} {"train_loss": -8.748336791992188, "global_step": 58566, "epoch": 348} {"train_loss": -8.656560897827148, "global_step": 58567, "epoch": 348} {"train_loss": -8.743915557861328, "global_step": 58568, "epoch": 348} {"train_loss": -8.553520202636719, "global_step": 58569, "epoch": 348} {"train_loss": -8.694559097290039, "global_step": 58570, "epoch": 348} {"train_loss": -8.400362014770508, "global_step": 58571, "epoch": 348} {"train_loss": -8.790824890136719, "global_step": 58572, "epoch": 348} {"train_loss": -8.596442222595215, "global_step": 58573, "epoch": 348} {"train_loss": -8.613618850708008, "global_step": 58574, "epoch": 348} {"train_loss": -8.568868637084961, "global_step": 58575, "epoch": 348} {"train_loss": -8.627639770507812, "global_step": 58576, "epoch": 348} {"train_loss": -8.606650352478027, "global_step": 58577, "epoch": 348} {"train_loss": -8.593435287475586, "global_step": 58578, "epoch": 348} {"train_loss": -8.916711807250977, "global_step": 58579, "epoch": 348} {"train_loss": -8.7776460647583, "global_step": 58580, "epoch": 348} {"train_loss": -8.69675064086914, "global_step": 58581, "epoch": 348} {"train_loss": -8.52811336517334, "global_step": 58582, "epoch": 348} {"train_loss": -8.49282455444336, "global_step": 58583, "epoch": 348} {"train_loss": -8.471989631652832, "global_step": 58584, "epoch": 348} {"train_loss": -8.68157958984375, "global_step": 58585, "epoch": 348} {"train_loss": -8.670076370239258, "global_step": 58586, "epoch": 348} {"train_loss": -8.569461822509766, "global_step": 58587, "epoch": 348} {"train_loss": -8.681349754333496, "global_step": 58588, "epoch": 348} {"train_loss": -8.722896575927734, "global_step": 58589, "epoch": 348} {"train_loss": -8.493896484375, "global_step": 58590, "epoch": 348} {"train_loss": -8.88652229309082, "global_step": 58591, "epoch": 348} {"train_loss": -8.564050674438477, "global_step": 58592, "epoch": 348} {"train_loss": -8.636293411254883, "global_step": 58593, "epoch": 348} {"train_loss": -8.449352264404297, "global_step": 58594, "epoch": 348} {"train_loss": -8.714667320251465, "global_step": 58595, "epoch": 348} {"train_loss": -8.455875396728516, "global_step": 58596, "epoch": 348} {"train_loss": -8.58573055267334, "global_step": 58597, "epoch": 348} {"train_loss": -8.551824569702148, "global_step": 58598, "epoch": 348} {"train_loss": -8.674213409423828, "global_step": 58599, "epoch": 348} {"train_loss": -8.470972061157227, "global_step": 58600, "epoch": 348} {"train_loss": -8.67078971862793, "global_step": 58601, "epoch": 348} {"train_loss": -8.459213256835938, "global_step": 58602, "epoch": 348} {"train_loss": -8.67919635772705, "global_step": 58603, "epoch": 348} {"train_loss": -8.396197319030762, "global_step": 58604, "epoch": 348} {"train_loss": -8.666459083557129, "global_step": 58605, "epoch": 348} {"train_loss": -8.771986961364746, "global_step": 58606, "epoch": 348} {"train_loss": -8.816377639770508, "global_step": 58607, "epoch": 348} {"train_loss": -8.605371475219727, "global_step": 58608, "epoch": 348} {"train_loss": -8.633666038513184, "global_step": 58609, "epoch": 348} {"train_loss": -8.705493927001953, "global_step": 58610, "epoch": 348} {"train_loss": -8.381607055664062, "global_step": 58611, "epoch": 348} {"train_loss": -8.621434211730957, "global_step": 58612, "epoch": 348} {"train_loss": -8.58969497680664, "global_step": 58613, "epoch": 348} {"train_loss": -8.80012321472168, "global_step": 58614, "epoch": 348} {"train_loss": -8.771699905395508, "global_step": 58615, "epoch": 348} {"train_loss": -8.711610794067383, "global_step": 58616, "epoch": 348} {"train_loss": -8.623291969299316, "global_step": 58617, "epoch": 348} {"train_loss": -8.700572967529297, "global_step": 58618, "epoch": 348} {"train_loss": -8.530128479003906, "global_step": 58619, "epoch": 348} {"train_loss": -8.73227596282959, "global_step": 58620, "epoch": 348} {"train_loss": -8.472557067871094, "global_step": 58621, "epoch": 348} {"train_loss": -8.93826675415039, "global_step": 58622, "epoch": 348} {"train_loss": -8.553997993469238, "global_step": 58623, "epoch": 348} {"train_loss": -8.565357208251953, "global_step": 58624, "epoch": 348} {"train_loss": -8.490028381347656, "global_step": 58625, "epoch": 348} {"train_loss": -8.951249122619629, "global_step": 58626, "epoch": 348} {"train_loss": -8.47734260559082, "global_step": 58627, "epoch": 348} {"train_loss": -8.874244689941406, "global_step": 58628, "epoch": 348} {"train_loss": -8.601509094238281, "global_step": 58629, "epoch": 348} {"train_loss": -8.69736385345459, "global_step": 58630, "epoch": 348} {"train_loss": -8.601474086443583, "global_step": 58631, "epoch": 348, "val_loss": 190706.90625} {"train_loss": -8.58633041381836, "global_step": 58632, "epoch": 349} {"train_loss": -8.654122352600098, "global_step": 58633, "epoch": 349} {"train_loss": -8.6676607131958, "global_step": 58634, "epoch": 349} {"train_loss": -8.550304412841797, "global_step": 58635, "epoch": 349} {"train_loss": -8.586315155029297, "global_step": 58636, "epoch": 349} {"train_loss": -8.602054595947266, "global_step": 58637, "epoch": 349} {"train_loss": -8.434783935546875, "global_step": 58638, "epoch": 349} {"train_loss": -8.680173873901367, "global_step": 58639, "epoch": 349} {"train_loss": -8.703093528747559, "global_step": 58640, "epoch": 349} {"train_loss": -8.421785354614258, "global_step": 58641, "epoch": 349} {"train_loss": -8.579259872436523, "global_step": 58642, "epoch": 349} {"train_loss": -8.439830780029297, "global_step": 58643, "epoch": 349} {"train_loss": -8.284997940063477, "global_step": 58644, "epoch": 349} {"train_loss": -8.363024711608887, "global_step": 58645, "epoch": 349} {"train_loss": -8.481864929199219, "global_step": 58646, "epoch": 349} {"train_loss": -8.55469799041748, "global_step": 58647, "epoch": 349} {"train_loss": -8.334388732910156, "global_step": 58648, "epoch": 349} {"train_loss": -8.748384475708008, "global_step": 58649, "epoch": 349} {"train_loss": -8.60235595703125, "global_step": 58650, "epoch": 349} {"train_loss": -8.346125602722168, "global_step": 58651, "epoch": 349} {"train_loss": -8.430633544921875, "global_step": 58652, "epoch": 349} {"train_loss": -8.520216941833496, "global_step": 58653, "epoch": 349} {"train_loss": -8.445653915405273, "global_step": 58654, "epoch": 349} {"train_loss": -8.7620849609375, "global_step": 58655, "epoch": 349} {"train_loss": -8.586970329284668, "global_step": 58656, "epoch": 349} {"train_loss": -8.586249351501465, "global_step": 58657, "epoch": 349} {"train_loss": -8.466043472290039, "global_step": 58658, "epoch": 349} {"train_loss": -8.371292114257812, "global_step": 58659, "epoch": 349} {"train_loss": -8.548606872558594, "global_step": 58660, "epoch": 349} {"train_loss": -8.641487121582031, "global_step": 58661, "epoch": 349} {"train_loss": -8.604716300964355, "global_step": 58662, "epoch": 349} {"train_loss": -8.382558822631836, "global_step": 58663, "epoch": 349} {"train_loss": -8.611528396606445, "global_step": 58664, "epoch": 349} {"train_loss": -8.67533016204834, "global_step": 58665, "epoch": 349} {"train_loss": -8.311749458312988, "global_step": 58666, "epoch": 349} {"train_loss": -8.51665210723877, "global_step": 58667, "epoch": 349} {"train_loss": -8.482280731201172, "global_step": 58668, "epoch": 349} {"train_loss": -8.611505508422852, "global_step": 58669, "epoch": 349} {"train_loss": -8.249998092651367, "global_step": 58670, "epoch": 349} {"train_loss": -8.48536491394043, "global_step": 58671, "epoch": 349} {"train_loss": -8.526623725891113, "global_step": 58672, "epoch": 349} {"train_loss": -8.575523376464844, "global_step": 58673, "epoch": 349} {"train_loss": -8.653030395507812, "global_step": 58674, "epoch": 349} {"train_loss": -8.613520622253418, "global_step": 58675, "epoch": 349} {"train_loss": -8.681364059448242, "global_step": 58676, "epoch": 349} {"train_loss": -8.53170394897461, "global_step": 58677, "epoch": 349} {"train_loss": -8.592662811279297, "global_step": 58678, "epoch": 349} {"train_loss": -8.571146011352539, "global_step": 58679, "epoch": 349} {"train_loss": -8.584293365478516, "global_step": 58680, "epoch": 349} {"train_loss": -8.528398513793945, "global_step": 58681, "epoch": 349} {"train_loss": -8.58369255065918, "global_step": 58682, "epoch": 349} {"train_loss": -8.652585983276367, "global_step": 58683, "epoch": 349} {"train_loss": -8.54819107055664, "global_step": 58684, "epoch": 349} {"train_loss": -8.510246276855469, "global_step": 58685, "epoch": 349} {"train_loss": -8.791893005371094, "global_step": 58686, "epoch": 349} {"train_loss": -8.65692138671875, "global_step": 58687, "epoch": 349} {"train_loss": -8.837181091308594, "global_step": 58688, "epoch": 349} {"train_loss": -8.790210723876953, "global_step": 58689, "epoch": 349} {"train_loss": -8.51948070526123, "global_step": 58690, "epoch": 349} {"train_loss": -8.703968048095703, "global_step": 58691, "epoch": 349} {"train_loss": -8.694456100463867, "global_step": 58692, "epoch": 349} {"train_loss": -8.710075378417969, "global_step": 58693, "epoch": 349} {"train_loss": -8.454584121704102, "global_step": 58694, "epoch": 349} {"train_loss": -8.225516319274902, "global_step": 58695, "epoch": 349} {"train_loss": -8.51225471496582, "global_step": 58696, "epoch": 349} {"train_loss": -8.794907569885254, "global_step": 58697, "epoch": 349} {"train_loss": -8.683380126953125, "global_step": 58698, "epoch": 349} {"train_loss": -8.757928848266602, "global_step": 58699, "epoch": 349} {"train_loss": -8.507089614868164, "global_step": 58700, "epoch": 349} {"train_loss": -8.604991912841797, "global_step": 58701, "epoch": 349} {"train_loss": -8.404365539550781, "global_step": 58702, "epoch": 349} {"train_loss": -8.662956237792969, "global_step": 58703, "epoch": 349} {"train_loss": -8.453959465026855, "global_step": 58704, "epoch": 349} {"train_loss": -8.654010772705078, "global_step": 58705, "epoch": 349} {"train_loss": -8.7795991897583, "global_step": 58706, "epoch": 349} {"train_loss": -8.573013305664062, "global_step": 58707, "epoch": 349} {"train_loss": -8.752447128295898, "global_step": 58708, "epoch": 349} {"train_loss": -8.488288879394531, "global_step": 58709, "epoch": 349} {"train_loss": -8.55513858795166, "global_step": 58710, "epoch": 349} {"train_loss": -8.281761169433594, "global_step": 58711, "epoch": 349} {"train_loss": -8.569324493408203, "global_step": 58712, "epoch": 349} {"train_loss": -8.29784870147705, "global_step": 58713, "epoch": 349} {"train_loss": -8.363269805908203, "global_step": 58714, "epoch": 349} {"train_loss": -8.61298942565918, "global_step": 58715, "epoch": 349} {"train_loss": -8.080405235290527, "global_step": 58716, "epoch": 349} {"train_loss": -8.426621437072754, "global_step": 58717, "epoch": 349} {"train_loss": -8.26076602935791, "global_step": 58718, "epoch": 349} {"train_loss": -8.291053771972656, "global_step": 58719, "epoch": 349} {"train_loss": -8.475865364074707, "global_step": 58720, "epoch": 349} {"train_loss": -8.41887092590332, "global_step": 58721, "epoch": 349} {"train_loss": -8.65692138671875, "global_step": 58722, "epoch": 349} {"train_loss": -8.496551513671875, "global_step": 58723, "epoch": 349} {"train_loss": -8.342900276184082, "global_step": 58724, "epoch": 349} {"train_loss": -8.519859313964844, "global_step": 58725, "epoch": 349} {"train_loss": -8.548494338989258, "global_step": 58726, "epoch": 349} {"train_loss": -8.501419067382812, "global_step": 58727, "epoch": 349} {"train_loss": -8.553646087646484, "global_step": 58728, "epoch": 349} {"train_loss": -8.422225952148438, "global_step": 58729, "epoch": 349} {"train_loss": -8.650254249572754, "global_step": 58730, "epoch": 349} {"train_loss": -8.592538833618164, "global_step": 58731, "epoch": 349} {"train_loss": -8.551464080810547, "global_step": 58732, "epoch": 349} {"train_loss": -8.836387634277344, "global_step": 58733, "epoch": 349} {"train_loss": -8.28971004486084, "global_step": 58734, "epoch": 349} {"train_loss": -8.630321502685547, "global_step": 58735, "epoch": 349} {"train_loss": -8.684900283813477, "global_step": 58736, "epoch": 349} {"train_loss": -8.773975372314453, "global_step": 58737, "epoch": 349} {"train_loss": -8.649933815002441, "global_step": 58738, "epoch": 349} {"train_loss": -8.536547660827637, "global_step": 58739, "epoch": 349} {"train_loss": -8.951618194580078, "global_step": 58740, "epoch": 349} {"train_loss": -8.852728843688965, "global_step": 58741, "epoch": 349} {"train_loss": -8.671758651733398, "global_step": 58742, "epoch": 349} {"train_loss": -8.855313301086426, "global_step": 58743, "epoch": 349} {"train_loss": -8.745464324951172, "global_step": 58744, "epoch": 349} {"train_loss": -8.538617134094238, "global_step": 58745, "epoch": 349} {"train_loss": -8.825902938842773, "global_step": 58746, "epoch": 349} {"train_loss": -8.785516738891602, "global_step": 58747, "epoch": 349} {"train_loss": -8.629450798034668, "global_step": 58748, "epoch": 349} {"train_loss": -8.832871437072754, "global_step": 58749, "epoch": 349} {"train_loss": -8.816688537597656, "global_step": 58750, "epoch": 349} {"train_loss": -8.735716819763184, "global_step": 58751, "epoch": 349} {"train_loss": -8.799997329711914, "global_step": 58752, "epoch": 349} {"train_loss": -8.817965507507324, "global_step": 58753, "epoch": 349} {"train_loss": -8.874861717224121, "global_step": 58754, "epoch": 349} {"train_loss": -8.510956764221191, "global_step": 58755, "epoch": 349} {"train_loss": -8.86373519897461, "global_step": 58756, "epoch": 349} {"train_loss": -8.624103546142578, "global_step": 58757, "epoch": 349} {"train_loss": -8.33593463897705, "global_step": 58758, "epoch": 349} {"train_loss": -8.6914644241333, "global_step": 58759, "epoch": 349} {"train_loss": -8.410308837890625, "global_step": 58760, "epoch": 349} {"train_loss": -8.269756317138672, "global_step": 58761, "epoch": 349} {"train_loss": -8.630609512329102, "global_step": 58762, "epoch": 349} {"train_loss": -8.537763595581055, "global_step": 58763, "epoch": 349} {"train_loss": -8.565411567687988, "global_step": 58764, "epoch": 349} {"train_loss": -8.529906272888184, "global_step": 58765, "epoch": 349} {"train_loss": -8.63296890258789, "global_step": 58766, "epoch": 349} {"train_loss": -8.449849128723145, "global_step": 58767, "epoch": 349} {"train_loss": -8.693168640136719, "global_step": 58768, "epoch": 349} {"train_loss": -8.649563789367676, "global_step": 58769, "epoch": 349} {"train_loss": -8.63353157043457, "global_step": 58770, "epoch": 349} {"train_loss": -8.198651313781738, "global_step": 58771, "epoch": 349} {"train_loss": -8.470947265625, "global_step": 58772, "epoch": 349} {"train_loss": -8.261200904846191, "global_step": 58773, "epoch": 349} {"train_loss": -8.102381706237793, "global_step": 58774, "epoch": 349} {"train_loss": -8.364126205444336, "global_step": 58775, "epoch": 349} {"train_loss": -8.361310005187988, "global_step": 58776, "epoch": 349} {"train_loss": -8.423933029174805, "global_step": 58777, "epoch": 349} {"train_loss": -8.38591194152832, "global_step": 58778, "epoch": 349} {"train_loss": -8.648405075073242, "global_step": 58779, "epoch": 349} {"train_loss": -8.394673347473145, "global_step": 58780, "epoch": 349} {"train_loss": -8.528359413146973, "global_step": 58781, "epoch": 349} {"train_loss": -8.348169326782227, "global_step": 58782, "epoch": 349} {"train_loss": -8.506444931030273, "global_step": 58783, "epoch": 349} {"train_loss": -8.714376449584961, "global_step": 58784, "epoch": 349} {"train_loss": -8.360878944396973, "global_step": 58785, "epoch": 349} {"train_loss": -8.385053634643555, "global_step": 58786, "epoch": 349} {"train_loss": -8.563011169433594, "global_step": 58787, "epoch": 349} {"train_loss": -8.671796798706055, "global_step": 58788, "epoch": 349} {"train_loss": -8.415776252746582, "global_step": 58789, "epoch": 349} {"train_loss": -8.302846908569336, "global_step": 58790, "epoch": 349} {"train_loss": -8.318132400512695, "global_step": 58791, "epoch": 349} {"train_loss": -8.299251556396484, "global_step": 58792, "epoch": 349} {"train_loss": -8.405147552490234, "global_step": 58793, "epoch": 349} {"train_loss": -8.391593933105469, "global_step": 58794, "epoch": 349} {"train_loss": -8.605772018432617, "global_step": 58795, "epoch": 349} {"train_loss": -8.3815279006958, "global_step": 58796, "epoch": 349} {"train_loss": -8.322608947753906, "global_step": 58797, "epoch": 349} {"train_loss": -8.44283676147461, "global_step": 58798, "epoch": 349} {"train_loss": -8.545790167081924, "global_step": 58799, "epoch": 349, "val_loss": 191328.90625} {"train_loss": -8.605565071105957, "global_step": 58800, "epoch": 350} {"train_loss": -8.473727226257324, "global_step": 58801, "epoch": 350} {"train_loss": -8.37557601928711, "global_step": 58802, "epoch": 350} {"train_loss": -8.428627014160156, "global_step": 58803, "epoch": 350} {"train_loss": -8.490285873413086, "global_step": 58804, "epoch": 350} {"train_loss": -8.521482467651367, "global_step": 58805, "epoch": 350} {"train_loss": -8.514581680297852, "global_step": 58806, "epoch": 350} {"train_loss": -8.508520126342773, "global_step": 58807, "epoch": 350} {"train_loss": -8.609962463378906, "global_step": 58808, "epoch": 350} {"train_loss": -8.486391067504883, "global_step": 58809, "epoch": 350} {"train_loss": -8.723834991455078, "global_step": 58810, "epoch": 350} {"train_loss": -8.607315063476562, "global_step": 58811, "epoch": 350} {"train_loss": -8.505550384521484, "global_step": 58812, "epoch": 350} {"train_loss": -8.57217788696289, "global_step": 58813, "epoch": 350} {"train_loss": -8.693440437316895, "global_step": 58814, "epoch": 350} {"train_loss": -8.399839401245117, "global_step": 58815, "epoch": 350} {"train_loss": -8.773859977722168, "global_step": 58816, "epoch": 350} {"train_loss": -8.731485366821289, "global_step": 58817, "epoch": 350} {"train_loss": -8.625356674194336, "global_step": 58818, "epoch": 350} {"train_loss": -8.756900787353516, "global_step": 58819, "epoch": 350} {"train_loss": -8.875965118408203, "global_step": 58820, "epoch": 350} {"train_loss": -8.716659545898438, "global_step": 58821, "epoch": 350} {"train_loss": -8.81309700012207, "global_step": 58822, "epoch": 350} {"train_loss": -8.80740737915039, "global_step": 58823, "epoch": 350} {"train_loss": -8.882966041564941, "global_step": 58824, "epoch": 350} {"train_loss": -8.645685195922852, "global_step": 58825, "epoch": 350} {"train_loss": -8.844399452209473, "global_step": 58826, "epoch": 350} {"train_loss": -8.59962272644043, "global_step": 58827, "epoch": 350} {"train_loss": -8.65216064453125, "global_step": 58828, "epoch": 350} {"train_loss": -8.70174789428711, "global_step": 58829, "epoch": 350} {"train_loss": -8.59207820892334, "global_step": 58830, "epoch": 350} {"train_loss": -8.65419864654541, "global_step": 58831, "epoch": 350} {"train_loss": -8.660032272338867, "global_step": 58832, "epoch": 350} {"train_loss": -8.732250213623047, "global_step": 58833, "epoch": 350} {"train_loss": -8.703314781188965, "global_step": 58834, "epoch": 350} {"train_loss": -8.85702133178711, "global_step": 58835, "epoch": 350} {"train_loss": -8.699017524719238, "global_step": 58836, "epoch": 350} {"train_loss": -8.722166061401367, "global_step": 58837, "epoch": 350} {"train_loss": -8.368782997131348, "global_step": 58838, "epoch": 350} {"train_loss": -8.391731262207031, "global_step": 58839, "epoch": 350} {"train_loss": -8.419384002685547, "global_step": 58840, "epoch": 350} {"train_loss": -8.409650802612305, "global_step": 58841, "epoch": 350} {"train_loss": -8.559001922607422, "global_step": 58842, "epoch": 350} {"train_loss": -8.367341995239258, "global_step": 58843, "epoch": 350} {"train_loss": -8.376256942749023, "global_step": 58844, "epoch": 350} {"train_loss": -8.62789535522461, "global_step": 58845, "epoch": 350} {"train_loss": -8.397438049316406, "global_step": 58846, "epoch": 350} {"train_loss": -8.384641647338867, "global_step": 58847, "epoch": 350} {"train_loss": -8.451996803283691, "global_step": 58848, "epoch": 350} {"train_loss": -8.493307113647461, "global_step": 58849, "epoch": 350} {"train_loss": -8.4564208984375, "global_step": 58850, "epoch": 350} {"train_loss": -8.204970359802246, "global_step": 58851, "epoch": 350} {"train_loss": -8.361814498901367, "global_step": 58852, "epoch": 350} {"train_loss": -8.418661117553711, "global_step": 58853, "epoch": 350} {"train_loss": -8.48472785949707, "global_step": 58854, "epoch": 350} {"train_loss": -8.616071701049805, "global_step": 58855, "epoch": 350} {"train_loss": -8.58426284790039, "global_step": 58856, "epoch": 350} {"train_loss": -8.587587356567383, "global_step": 58857, "epoch": 350} {"train_loss": -8.695249557495117, "global_step": 58858, "epoch": 350} {"train_loss": -8.442056655883789, "global_step": 58859, "epoch": 350} {"train_loss": -8.575563430786133, "global_step": 58860, "epoch": 350} {"train_loss": -8.48845386505127, "global_step": 58861, "epoch": 350} {"train_loss": -8.577066421508789, "global_step": 58862, "epoch": 350} {"train_loss": -8.622428894042969, "global_step": 58863, "epoch": 350} {"train_loss": -8.56778335571289, "global_step": 58864, "epoch": 350} {"train_loss": -8.605040550231934, "global_step": 58865, "epoch": 350} {"train_loss": -8.541372299194336, "global_step": 58866, "epoch": 350} {"train_loss": -8.494208335876465, "global_step": 58867, "epoch": 350} {"train_loss": -8.755724906921387, "global_step": 58868, "epoch": 350} {"train_loss": -8.60951042175293, "global_step": 58869, "epoch": 350} {"train_loss": -8.435517311096191, "global_step": 58870, "epoch": 350} {"train_loss": -8.642925262451172, "global_step": 58871, "epoch": 350} {"train_loss": -8.647930145263672, "global_step": 58872, "epoch": 350} {"train_loss": -8.606241226196289, "global_step": 58873, "epoch": 350} {"train_loss": -8.622417449951172, "global_step": 58874, "epoch": 350} {"train_loss": -8.540124893188477, "global_step": 58875, "epoch": 350} {"train_loss": -8.750021934509277, "global_step": 58876, "epoch": 350} {"train_loss": -8.680998802185059, "global_step": 58877, "epoch": 350} {"train_loss": -8.55228328704834, "global_step": 58878, "epoch": 350} {"train_loss": -8.602022171020508, "global_step": 58879, "epoch": 350} {"train_loss": -8.521889686584473, "global_step": 58880, "epoch": 350} {"train_loss": -8.65153694152832, "global_step": 58881, "epoch": 350} {"train_loss": -8.524920463562012, "global_step": 58882, "epoch": 350} {"train_loss": -8.379812240600586, "global_step": 58883, "epoch": 350} {"train_loss": -8.591756820678711, "global_step": 58884, "epoch": 350} {"train_loss": -8.660398483276367, "global_step": 58885, "epoch": 350} {"train_loss": -8.453936576843262, "global_step": 58886, "epoch": 350} {"train_loss": -8.660871505737305, "global_step": 58887, "epoch": 350} {"train_loss": -8.415884971618652, "global_step": 58888, "epoch": 350} {"train_loss": -8.486757278442383, "global_step": 58889, "epoch": 350} {"train_loss": -8.491371154785156, "global_step": 58890, "epoch": 350} {"train_loss": -8.494281768798828, "global_step": 58891, "epoch": 350} {"train_loss": -8.134806632995605, "global_step": 58892, "epoch": 350} {"train_loss": -8.460676193237305, "global_step": 58893, "epoch": 350} {"train_loss": -8.4301118850708, "global_step": 58894, "epoch": 350} {"train_loss": -8.495027542114258, "global_step": 58895, "epoch": 350} {"train_loss": -8.471174240112305, "global_step": 58896, "epoch": 350} {"train_loss": -8.484498023986816, "global_step": 58897, "epoch": 350} {"train_loss": -8.365857124328613, "global_step": 58898, "epoch": 350} {"train_loss": -8.502035140991211, "global_step": 58899, "epoch": 350} {"train_loss": -8.578828811645508, "global_step": 58900, "epoch": 350} {"train_loss": -8.433073997497559, "global_step": 58901, "epoch": 350} {"train_loss": -8.536577224731445, "global_step": 58902, "epoch": 350} {"train_loss": -8.582626342773438, "global_step": 58903, "epoch": 350} {"train_loss": -8.550519943237305, "global_step": 58904, "epoch": 350} {"train_loss": -8.429569244384766, "global_step": 58905, "epoch": 350} {"train_loss": -8.566160202026367, "global_step": 58906, "epoch": 350} {"train_loss": -8.36500072479248, "global_step": 58907, "epoch": 350} {"train_loss": -8.392126083374023, "global_step": 58908, "epoch": 350} {"train_loss": -8.712068557739258, "global_step": 58909, "epoch": 350} {"train_loss": -8.726564407348633, "global_step": 58910, "epoch": 350} {"train_loss": -8.722797393798828, "global_step": 58911, "epoch": 350} {"train_loss": -8.762142181396484, "global_step": 58912, "epoch": 350} {"train_loss": -8.653802871704102, "global_step": 58913, "epoch": 350} {"train_loss": -8.575590133666992, "global_step": 58914, "epoch": 350} {"train_loss": -8.649578094482422, "global_step": 58915, "epoch": 350} {"train_loss": -8.574094772338867, "global_step": 58916, "epoch": 350} {"train_loss": -8.487194061279297, "global_step": 58917, "epoch": 350} {"train_loss": -8.657403945922852, "global_step": 58918, "epoch": 350} {"train_loss": -9.019344329833984, "global_step": 58919, "epoch": 350} {"train_loss": -8.650129318237305, "global_step": 58920, "epoch": 350} {"train_loss": -8.757960319519043, "global_step": 58921, "epoch": 350} {"train_loss": -9.02209758758545, "global_step": 58922, "epoch": 350} {"train_loss": -8.560758590698242, "global_step": 58923, "epoch": 350} {"train_loss": -8.675092697143555, "global_step": 58924, "epoch": 350} {"train_loss": -8.7886962890625, "global_step": 58925, "epoch": 350} {"train_loss": -8.878313064575195, "global_step": 58926, "epoch": 350} {"train_loss": -9.002044677734375, "global_step": 58927, "epoch": 350} {"train_loss": -8.778427124023438, "global_step": 58928, "epoch": 350} {"train_loss": -8.63812255859375, "global_step": 58929, "epoch": 350} {"train_loss": -8.73154067993164, "global_step": 58930, "epoch": 350} {"train_loss": -8.682668685913086, "global_step": 58931, "epoch": 350} {"train_loss": -8.690771102905273, "global_step": 58932, "epoch": 350} {"train_loss": -8.751762390136719, "global_step": 58933, "epoch": 350} {"train_loss": -8.745306968688965, "global_step": 58934, "epoch": 350} {"train_loss": -8.66074275970459, "global_step": 58935, "epoch": 350} {"train_loss": -8.72612476348877, "global_step": 58936, "epoch": 350} {"train_loss": -8.813737869262695, "global_step": 58937, "epoch": 350} {"train_loss": -8.604974746704102, "global_step": 58938, "epoch": 350} {"train_loss": -8.610663414001465, "global_step": 58939, "epoch": 350} {"train_loss": -8.667302131652832, "global_step": 58940, "epoch": 350} {"train_loss": -8.675914764404297, "global_step": 58941, "epoch": 350} {"train_loss": -8.702435493469238, "global_step": 58942, "epoch": 350} {"train_loss": -8.743703842163086, "global_step": 58943, "epoch": 350} {"train_loss": -8.693894386291504, "global_step": 58944, "epoch": 350} {"train_loss": -8.710783004760742, "global_step": 58945, "epoch": 350} {"train_loss": -8.751262664794922, "global_step": 58946, "epoch": 350} {"train_loss": -8.651131629943848, "global_step": 58947, "epoch": 350} {"train_loss": -8.872591018676758, "global_step": 58948, "epoch": 350} {"train_loss": -8.421181678771973, "global_step": 58949, "epoch": 350} {"train_loss": -8.73242473602295, "global_step": 58950, "epoch": 350} {"train_loss": -8.551258087158203, "global_step": 58951, "epoch": 350} {"train_loss": -8.473295211791992, "global_step": 58952, "epoch": 350} {"train_loss": -8.829723358154297, "global_step": 58953, "epoch": 350} {"train_loss": -8.165283203125, "global_step": 58954, "epoch": 350} {"train_loss": -8.438732147216797, "global_step": 58955, "epoch": 350} {"train_loss": -8.646788597106934, "global_step": 58956, "epoch": 350} {"train_loss": -8.707201957702637, "global_step": 58957, "epoch": 350} {"train_loss": -8.644245147705078, "global_step": 58958, "epoch": 350} {"train_loss": -8.27287483215332, "global_step": 58959, "epoch": 350} {"train_loss": -8.679559707641602, "global_step": 58960, "epoch": 350} {"train_loss": -8.170891761779785, "global_step": 58961, "epoch": 350} {"train_loss": -8.470115661621094, "global_step": 58962, "epoch": 350} {"train_loss": -8.403234481811523, "global_step": 58963, "epoch": 350} {"train_loss": -8.315751075744629, "global_step": 58964, "epoch": 350} {"train_loss": -7.850337028503418, "global_step": 58965, "epoch": 350} {"train_loss": -8.370983123779297, "global_step": 58966, "epoch": 350} {"train_loss": -8.584519800685701, "global_step": 58967, "epoch": 350, "train/sim_max_reward_0": 0.9438280421601819, "train/sim_max_reward_1": 0.8699321765226183, "train/sim_max_reward_2": 0.5561517327502701, "train/sim_max_reward_3": 0.6333258755069329, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 0.20000455719151858, "test/sim_max_reward_4400001": 0.23044121570271286, "test/sim_max_reward_4400002": 0.06172183434848112, "test/sim_max_reward_4400003": 0.507592868706988, "test/sim_max_reward_4400004": 0.8383169346553127, "test/sim_max_reward_4400005": 0.9517519482476624, "test/sim_max_reward_4400006": 0.953488885364592, "test/sim_max_reward_4400007": 0.9377622447015416, "test/sim_max_reward_4400008": 0.6901406536407686, "test/sim_max_reward_4400009": 0.03261988251167421, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.9518026226502329, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.9971204744915514, "test/sim_max_reward_4400014": 0.9220531652072581, "test/sim_max_reward_4400015": 0.9574012061138794, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9309416596852068, "test/sim_max_reward_4400019": 0.7224881075261053, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.7020273196156795, "test/sim_max_reward_4400022": 0.9558477403118457, "test/sim_max_reward_4400023": 0.9605821534284843, "test/sim_max_reward_4400024": 0.9787929678688001, "test/sim_max_reward_4400025": 0.6618563712711991, "test/sim_max_reward_4400026": 0.3991489017360274, "test/sim_max_reward_4400027": 1.0, "test/sim_max_reward_4400028": 1.0, "test/sim_max_reward_4400029": 0.715947392103061, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.999767958826291, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.28584836854362516, "test/sim_max_reward_4400034": 0.9892482113814435, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.9952567453768266, "test/sim_max_reward_4400037": 0.9867681395869542, "test/sim_max_reward_4400038": 0.0, "test/sim_max_reward_4400039": 0.4117568179222171, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.7209945788694614, "test/sim_max_reward_4400042": 1.0, "test/sim_max_reward_4400043": 0.9651417139840617, "test/sim_max_reward_4400044": 0.5123558488549298, "test/sim_max_reward_4400045": 0.41615345040140184, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6993704310503651, "test/mean_score": 0.6187420652445317, "val_loss": 188643.71875, "train_action_mse_error": 10.569019317626953} {"train_loss": -8.425172805786133, "global_step": 58968, "epoch": 351} {"train_loss": -8.439791679382324, "global_step": 58969, "epoch": 351} {"train_loss": -8.652762413024902, "global_step": 58970, "epoch": 351} {"train_loss": -8.406882286071777, "global_step": 58971, "epoch": 351} {"train_loss": -8.426908493041992, "global_step": 58972, "epoch": 351} {"train_loss": -8.474555969238281, "global_step": 58973, "epoch": 351} {"train_loss": -8.7830810546875, "global_step": 58974, "epoch": 351} {"train_loss": -8.508039474487305, "global_step": 58975, "epoch": 351} {"train_loss": -8.639127731323242, "global_step": 58976, "epoch": 351} {"train_loss": -8.457651138305664, "global_step": 58977, "epoch": 351} {"train_loss": -8.713767051696777, "global_step": 58978, "epoch": 351} {"train_loss": -8.526925086975098, "global_step": 58979, "epoch": 351} {"train_loss": -8.750147819519043, "global_step": 58980, "epoch": 351} {"train_loss": -8.561582565307617, "global_step": 58981, "epoch": 351} {"train_loss": -8.546998977661133, "global_step": 58982, "epoch": 351} {"train_loss": -8.627693176269531, "global_step": 58983, "epoch": 351} {"train_loss": -8.718616485595703, "global_step": 58984, "epoch": 351} {"train_loss": -8.55926513671875, "global_step": 58985, "epoch": 351} {"train_loss": -8.309792518615723, "global_step": 58986, "epoch": 351} {"train_loss": -8.659574508666992, "global_step": 58987, "epoch": 351} {"train_loss": -8.537158966064453, "global_step": 58988, "epoch": 351} {"train_loss": -8.598917007446289, "global_step": 58989, "epoch": 351} {"train_loss": -8.593582153320312, "global_step": 58990, "epoch": 351} {"train_loss": -8.459808349609375, "global_step": 58991, "epoch": 351} {"train_loss": -8.276021957397461, "global_step": 58992, "epoch": 351} {"train_loss": -8.487458229064941, "global_step": 58993, "epoch": 351} {"train_loss": -8.37433910369873, "global_step": 58994, "epoch": 351} {"train_loss": -8.47854232788086, "global_step": 58995, "epoch": 351} {"train_loss": -8.261287689208984, "global_step": 58996, "epoch": 351} {"train_loss": -8.150390625, "global_step": 58997, "epoch": 351} {"train_loss": -8.309210777282715, "global_step": 58998, "epoch": 351} {"train_loss": -8.364290237426758, "global_step": 58999, "epoch": 351} {"train_loss": -8.317941665649414, "global_step": 59000, "epoch": 351} {"train_loss": -7.864714622497559, "global_step": 59001, "epoch": 351} {"train_loss": -8.201017379760742, "global_step": 59002, "epoch": 351} {"train_loss": -7.888220310211182, "global_step": 59003, "epoch": 351} {"train_loss": -7.917398452758789, "global_step": 59004, "epoch": 351} {"train_loss": -7.889431953430176, "global_step": 59005, "epoch": 351} {"train_loss": -7.996134281158447, "global_step": 59006, "epoch": 351} {"train_loss": -7.919044494628906, "global_step": 59007, "epoch": 351} {"train_loss": -7.962080955505371, "global_step": 59008, "epoch": 351} {"train_loss": -8.158266067504883, "global_step": 59009, "epoch": 351} {"train_loss": -8.132577896118164, "global_step": 59010, "epoch": 351} {"train_loss": -8.105222702026367, "global_step": 59011, "epoch": 351} {"train_loss": -8.392683982849121, "global_step": 59012, "epoch": 351} {"train_loss": -8.18014144897461, "global_step": 59013, "epoch": 351} {"train_loss": -8.279620170593262, "global_step": 59014, "epoch": 351} {"train_loss": -8.430452346801758, "global_step": 59015, "epoch": 351} {"train_loss": -8.36672306060791, "global_step": 59016, "epoch": 351} {"train_loss": -8.416579246520996, "global_step": 59017, "epoch": 351} {"train_loss": -8.455860137939453, "global_step": 59018, "epoch": 351} {"train_loss": -8.690834045410156, "global_step": 59019, "epoch": 351} {"train_loss": -8.358076095581055, "global_step": 59020, "epoch": 351} {"train_loss": -8.237564086914062, "global_step": 59021, "epoch": 351} {"train_loss": -8.36187744140625, "global_step": 59022, "epoch": 351} {"train_loss": -8.341347694396973, "global_step": 59023, "epoch": 351} {"train_loss": -8.56533432006836, "global_step": 59024, "epoch": 351} {"train_loss": -8.65007209777832, "global_step": 59025, "epoch": 351} {"train_loss": -8.645515441894531, "global_step": 59026, "epoch": 351} {"train_loss": -8.6505708694458, "global_step": 59027, "epoch": 351} {"train_loss": -8.780097007751465, "global_step": 59028, "epoch": 351} {"train_loss": -8.613471984863281, "global_step": 59029, "epoch": 351} {"train_loss": -8.636930465698242, "global_step": 59030, "epoch": 351} {"train_loss": -8.864323616027832, "global_step": 59031, "epoch": 351} {"train_loss": -8.752521514892578, "global_step": 59032, "epoch": 351} {"train_loss": -8.737255096435547, "global_step": 59033, "epoch": 351} {"train_loss": -8.861302375793457, "global_step": 59034, "epoch": 351} {"train_loss": -8.80606460571289, "global_step": 59035, "epoch": 351} {"train_loss": -8.836431503295898, "global_step": 59036, "epoch": 351} {"train_loss": -8.65977668762207, "global_step": 59037, "epoch": 351} {"train_loss": -8.936802864074707, "global_step": 59038, "epoch": 351} {"train_loss": -8.632882118225098, "global_step": 59039, "epoch": 351} {"train_loss": -8.96869945526123, "global_step": 59040, "epoch": 351} {"train_loss": -8.8860502243042, "global_step": 59041, "epoch": 351} {"train_loss": -8.812230110168457, "global_step": 59042, "epoch": 351} {"train_loss": -8.753255844116211, "global_step": 59043, "epoch": 351} {"train_loss": -8.58146858215332, "global_step": 59044, "epoch": 351} {"train_loss": -8.787256240844727, "global_step": 59045, "epoch": 351} {"train_loss": -8.359269142150879, "global_step": 59046, "epoch": 351} {"train_loss": -8.599388122558594, "global_step": 59047, "epoch": 351} {"train_loss": -8.11876106262207, "global_step": 59048, "epoch": 351} {"train_loss": -8.473533630371094, "global_step": 59049, "epoch": 351} {"train_loss": -8.586328506469727, "global_step": 59050, "epoch": 351} {"train_loss": -8.45634651184082, "global_step": 59051, "epoch": 351} {"train_loss": -8.314440727233887, "global_step": 59052, "epoch": 351} {"train_loss": -8.687103271484375, "global_step": 59053, "epoch": 351} {"train_loss": -8.524494171142578, "global_step": 59054, "epoch": 351} {"train_loss": -8.675126075744629, "global_step": 59055, "epoch": 351} {"train_loss": -8.556285858154297, "global_step": 59056, "epoch": 351} {"train_loss": -8.59807014465332, "global_step": 59057, "epoch": 351} {"train_loss": -8.64197826385498, "global_step": 59058, "epoch": 351} {"train_loss": -8.488664627075195, "global_step": 59059, "epoch": 351} {"train_loss": -8.610119819641113, "global_step": 59060, "epoch": 351} {"train_loss": -8.613198280334473, "global_step": 59061, "epoch": 351} {"train_loss": -8.53053092956543, "global_step": 59062, "epoch": 351} {"train_loss": -8.263372421264648, "global_step": 59063, "epoch": 351} {"train_loss": -8.735946655273438, "global_step": 59064, "epoch": 351} {"train_loss": -8.146636962890625, "global_step": 59065, "epoch": 351} {"train_loss": -8.683005332946777, "global_step": 59066, "epoch": 351} {"train_loss": -8.75228500366211, "global_step": 59067, "epoch": 351} {"train_loss": -8.31529426574707, "global_step": 59068, "epoch": 351} {"train_loss": -8.54594612121582, "global_step": 59069, "epoch": 351} {"train_loss": -8.618424415588379, "global_step": 59070, "epoch": 351} {"train_loss": -8.716267585754395, "global_step": 59071, "epoch": 351} {"train_loss": -8.634404182434082, "global_step": 59072, "epoch": 351} {"train_loss": -8.612478256225586, "global_step": 59073, "epoch": 351} {"train_loss": -8.74358081817627, "global_step": 59074, "epoch": 351} {"train_loss": -8.624879837036133, "global_step": 59075, "epoch": 351} {"train_loss": -8.833025932312012, "global_step": 59076, "epoch": 351} {"train_loss": -8.661341667175293, "global_step": 59077, "epoch": 351} {"train_loss": -8.513830184936523, "global_step": 59078, "epoch": 351} {"train_loss": -8.614316940307617, "global_step": 59079, "epoch": 351} {"train_loss": -8.775583267211914, "global_step": 59080, "epoch": 351} {"train_loss": -8.576286315917969, "global_step": 59081, "epoch": 351} {"train_loss": -8.53744888305664, "global_step": 59082, "epoch": 351} {"train_loss": -8.584912300109863, "global_step": 59083, "epoch": 351} {"train_loss": -8.584806442260742, "global_step": 59084, "epoch": 351} {"train_loss": -8.727519989013672, "global_step": 59085, "epoch": 351} {"train_loss": -8.407733917236328, "global_step": 59086, "epoch": 351} {"train_loss": -8.632270812988281, "global_step": 59087, "epoch": 351} {"train_loss": -8.555571556091309, "global_step": 59088, "epoch": 351} {"train_loss": -8.751394271850586, "global_step": 59089, "epoch": 351} {"train_loss": -8.407636642456055, "global_step": 59090, "epoch": 351} {"train_loss": -8.683830261230469, "global_step": 59091, "epoch": 351} {"train_loss": -8.601312637329102, "global_step": 59092, "epoch": 351} {"train_loss": -8.585090637207031, "global_step": 59093, "epoch": 351} {"train_loss": -8.705131530761719, "global_step": 59094, "epoch": 351} {"train_loss": -8.502281188964844, "global_step": 59095, "epoch": 351} {"train_loss": -8.48906135559082, "global_step": 59096, "epoch": 351} {"train_loss": -8.39079761505127, "global_step": 59097, "epoch": 351} {"train_loss": -8.569355010986328, "global_step": 59098, "epoch": 351} {"train_loss": -8.573087692260742, "global_step": 59099, "epoch": 351} {"train_loss": -8.619579315185547, "global_step": 59100, "epoch": 351} {"train_loss": -8.57947063446045, "global_step": 59101, "epoch": 351} {"train_loss": -8.863524436950684, "global_step": 59102, "epoch": 351} {"train_loss": -8.834674835205078, "global_step": 59103, "epoch": 351} {"train_loss": -8.569214820861816, "global_step": 59104, "epoch": 351} {"train_loss": -8.792137145996094, "global_step": 59105, "epoch": 351} {"train_loss": -8.673741340637207, "global_step": 59106, "epoch": 351} {"train_loss": -8.655268669128418, "global_step": 59107, "epoch": 351} {"train_loss": -8.813907623291016, "global_step": 59108, "epoch": 351} {"train_loss": -8.607633590698242, "global_step": 59109, "epoch": 351} {"train_loss": -8.751781463623047, "global_step": 59110, "epoch": 351} {"train_loss": -8.813594818115234, "global_step": 59111, "epoch": 351} {"train_loss": -8.42294692993164, "global_step": 59112, "epoch": 351} {"train_loss": -8.678794860839844, "global_step": 59113, "epoch": 351} {"train_loss": -8.3638916015625, "global_step": 59114, "epoch": 351} {"train_loss": -8.465060234069824, "global_step": 59115, "epoch": 351} {"train_loss": -8.679939270019531, "global_step": 59116, "epoch": 351} {"train_loss": -8.667627334594727, "global_step": 59117, "epoch": 351} {"train_loss": -8.750286102294922, "global_step": 59118, "epoch": 351} {"train_loss": -8.57194709777832, "global_step": 59119, "epoch": 351} {"train_loss": -8.761706352233887, "global_step": 59120, "epoch": 351} {"train_loss": -8.687397003173828, "global_step": 59121, "epoch": 351} {"train_loss": -8.99792766571045, "global_step": 59122, "epoch": 351} {"train_loss": -8.84101676940918, "global_step": 59123, "epoch": 351} {"train_loss": -8.537315368652344, "global_step": 59124, "epoch": 351} {"train_loss": -8.582530975341797, "global_step": 59125, "epoch": 351} {"train_loss": -8.491615295410156, "global_step": 59126, "epoch": 351} {"train_loss": -8.50307559967041, "global_step": 59127, "epoch": 351} {"train_loss": -8.490677833557129, "global_step": 59128, "epoch": 351} {"train_loss": -8.697946548461914, "global_step": 59129, "epoch": 351} {"train_loss": -8.512568473815918, "global_step": 59130, "epoch": 351} {"train_loss": -8.79345417022705, "global_step": 59131, "epoch": 351} {"train_loss": -8.625764846801758, "global_step": 59132, "epoch": 351} {"train_loss": -8.799406051635742, "global_step": 59133, "epoch": 351} {"train_loss": -8.678056716918945, "global_step": 59134, "epoch": 351} {"train_loss": -8.544511891546703, "global_step": 59135, "epoch": 351, "val_loss": 190884.125} {"train_loss": -8.75171947479248, "global_step": 59136, "epoch": 352} {"train_loss": -8.685037612915039, "global_step": 59137, "epoch": 352} {"train_loss": -8.811847686767578, "global_step": 59138, "epoch": 352} {"train_loss": -8.597464561462402, "global_step": 59139, "epoch": 352} {"train_loss": -8.680437088012695, "global_step": 59140, "epoch": 352} {"train_loss": -8.586326599121094, "global_step": 59141, "epoch": 352} {"train_loss": -8.858242988586426, "global_step": 59142, "epoch": 352} {"train_loss": -8.557832717895508, "global_step": 59143, "epoch": 352} {"train_loss": -8.778692245483398, "global_step": 59144, "epoch": 352} {"train_loss": -8.747062683105469, "global_step": 59145, "epoch": 352} {"train_loss": -8.56273365020752, "global_step": 59146, "epoch": 352} {"train_loss": -8.657362937927246, "global_step": 59147, "epoch": 352} {"train_loss": -8.685440063476562, "global_step": 59148, "epoch": 352} {"train_loss": -8.86361312866211, "global_step": 59149, "epoch": 352} {"train_loss": -8.586132049560547, "global_step": 59150, "epoch": 352} {"train_loss": -8.688352584838867, "global_step": 59151, "epoch": 352} {"train_loss": -8.610260963439941, "global_step": 59152, "epoch": 352} {"train_loss": -8.377586364746094, "global_step": 59153, "epoch": 352} {"train_loss": -8.67265796661377, "global_step": 59154, "epoch": 352} {"train_loss": -8.771190643310547, "global_step": 59155, "epoch": 352} {"train_loss": -8.754575729370117, "global_step": 59156, "epoch": 352} {"train_loss": -8.60894775390625, "global_step": 59157, "epoch": 352} {"train_loss": -8.61013412475586, "global_step": 59158, "epoch": 352} {"train_loss": -8.582433700561523, "global_step": 59159, "epoch": 352} {"train_loss": -9.049433708190918, "global_step": 59160, "epoch": 352} {"train_loss": -8.624128341674805, "global_step": 59161, "epoch": 352} {"train_loss": -8.293701171875, "global_step": 59162, "epoch": 352} {"train_loss": -8.755067825317383, "global_step": 59163, "epoch": 352} {"train_loss": -8.24277114868164, "global_step": 59164, "epoch": 352} {"train_loss": -8.165563583374023, "global_step": 59165, "epoch": 352} {"train_loss": -8.362531661987305, "global_step": 59166, "epoch": 352} {"train_loss": -8.475717544555664, "global_step": 59167, "epoch": 352} {"train_loss": -8.385605812072754, "global_step": 59168, "epoch": 352} {"train_loss": -8.523621559143066, "global_step": 59169, "epoch": 352} {"train_loss": -8.2050142288208, "global_step": 59170, "epoch": 352} {"train_loss": -8.477357864379883, "global_step": 59171, "epoch": 352} {"train_loss": -8.149850845336914, "global_step": 59172, "epoch": 352} {"train_loss": -8.558854103088379, "global_step": 59173, "epoch": 352} {"train_loss": -8.43308162689209, "global_step": 59174, "epoch": 352} {"train_loss": -8.384002685546875, "global_step": 59175, "epoch": 352} {"train_loss": -8.66092300415039, "global_step": 59176, "epoch": 352} {"train_loss": -8.09292984008789, "global_step": 59177, "epoch": 352} {"train_loss": -8.62696361541748, "global_step": 59178, "epoch": 352} {"train_loss": -8.591672897338867, "global_step": 59179, "epoch": 352} {"train_loss": -8.457071304321289, "global_step": 59180, "epoch": 352} {"train_loss": -8.619014739990234, "global_step": 59181, "epoch": 352} {"train_loss": -8.644254684448242, "global_step": 59182, "epoch": 352} {"train_loss": -8.486482620239258, "global_step": 59183, "epoch": 352} {"train_loss": -8.423635482788086, "global_step": 59184, "epoch": 352} {"train_loss": -8.77480697631836, "global_step": 59185, "epoch": 352} {"train_loss": -8.655233383178711, "global_step": 59186, "epoch": 352} {"train_loss": -8.304801940917969, "global_step": 59187, "epoch": 352} {"train_loss": -8.763874053955078, "global_step": 59188, "epoch": 352} {"train_loss": -8.758073806762695, "global_step": 59189, "epoch": 352} {"train_loss": -8.27263069152832, "global_step": 59190, "epoch": 352} {"train_loss": -8.721035957336426, "global_step": 59191, "epoch": 352} {"train_loss": -8.392454147338867, "global_step": 59192, "epoch": 352} {"train_loss": -8.654052734375, "global_step": 59193, "epoch": 352} {"train_loss": -8.743768692016602, "global_step": 59194, "epoch": 352} {"train_loss": -8.854214668273926, "global_step": 59195, "epoch": 352} {"train_loss": -8.322381973266602, "global_step": 59196, "epoch": 352} {"train_loss": -8.736059188842773, "global_step": 59197, "epoch": 352} {"train_loss": -8.442529678344727, "global_step": 59198, "epoch": 352} {"train_loss": -8.51165771484375, "global_step": 59199, "epoch": 352} {"train_loss": -8.706986427307129, "global_step": 59200, "epoch": 352} {"train_loss": -8.243608474731445, "global_step": 59201, "epoch": 352} {"train_loss": -8.732173919677734, "global_step": 59202, "epoch": 352} {"train_loss": -8.394011497497559, "global_step": 59203, "epoch": 352} {"train_loss": -8.438199996948242, "global_step": 59204, "epoch": 352} {"train_loss": -8.432844161987305, "global_step": 59205, "epoch": 352} {"train_loss": -8.710477828979492, "global_step": 59206, "epoch": 352} {"train_loss": -8.706039428710938, "global_step": 59207, "epoch": 352} {"train_loss": -8.645648956298828, "global_step": 59208, "epoch": 352} {"train_loss": -8.57036304473877, "global_step": 59209, "epoch": 352} {"train_loss": -8.5366849899292, "global_step": 59210, "epoch": 352} {"train_loss": -8.54574203491211, "global_step": 59211, "epoch": 352} {"train_loss": -8.697677612304688, "global_step": 59212, "epoch": 352} {"train_loss": -8.531661987304688, "global_step": 59213, "epoch": 352} {"train_loss": -8.875482559204102, "global_step": 59214, "epoch": 352} {"train_loss": -8.499598503112793, "global_step": 59215, "epoch": 352} {"train_loss": -8.81193733215332, "global_step": 59216, "epoch": 352} {"train_loss": -8.462356567382812, "global_step": 59217, "epoch": 352} {"train_loss": -8.659564018249512, "global_step": 59218, "epoch": 352} {"train_loss": -8.55285358428955, "global_step": 59219, "epoch": 352} {"train_loss": -8.778871536254883, "global_step": 59220, "epoch": 352} {"train_loss": -8.553537368774414, "global_step": 59221, "epoch": 352} {"train_loss": -8.645318031311035, "global_step": 59222, "epoch": 352} {"train_loss": -8.764009475708008, "global_step": 59223, "epoch": 352} {"train_loss": -8.668434143066406, "global_step": 59224, "epoch": 352} {"train_loss": -8.61247444152832, "global_step": 59225, "epoch": 352} {"train_loss": -8.871902465820312, "global_step": 59226, "epoch": 352} {"train_loss": -8.832856178283691, "global_step": 59227, "epoch": 352} {"train_loss": -8.547332763671875, "global_step": 59228, "epoch": 352} {"train_loss": -8.68000316619873, "global_step": 59229, "epoch": 352} {"train_loss": -8.798095703125, "global_step": 59230, "epoch": 352} {"train_loss": -9.004150390625, "global_step": 59231, "epoch": 352} {"train_loss": -8.720829010009766, "global_step": 59232, "epoch": 352} {"train_loss": -8.702512741088867, "global_step": 59233, "epoch": 352} {"train_loss": -8.833220481872559, "global_step": 59234, "epoch": 352} {"train_loss": -8.721046447753906, "global_step": 59235, "epoch": 352} {"train_loss": -8.888481140136719, "global_step": 59236, "epoch": 352} {"train_loss": -8.69614028930664, "global_step": 59237, "epoch": 352} {"train_loss": -8.85171127319336, "global_step": 59238, "epoch": 352} {"train_loss": -8.310551643371582, "global_step": 59239, "epoch": 352} {"train_loss": -8.41185188293457, "global_step": 59240, "epoch": 352} {"train_loss": -8.454198837280273, "global_step": 59241, "epoch": 352} {"train_loss": -8.610858917236328, "global_step": 59242, "epoch": 352} {"train_loss": -8.664649963378906, "global_step": 59243, "epoch": 352} {"train_loss": -8.607964515686035, "global_step": 59244, "epoch": 352} {"train_loss": -8.635113716125488, "global_step": 59245, "epoch": 352} {"train_loss": -8.440593719482422, "global_step": 59246, "epoch": 352} {"train_loss": -8.686508178710938, "global_step": 59247, "epoch": 352} {"train_loss": -8.574925422668457, "global_step": 59248, "epoch": 352} {"train_loss": -8.667511940002441, "global_step": 59249, "epoch": 352} {"train_loss": -8.750850677490234, "global_step": 59250, "epoch": 352} {"train_loss": -8.755412101745605, "global_step": 59251, "epoch": 352} {"train_loss": -8.671111106872559, "global_step": 59252, "epoch": 352} {"train_loss": -8.750871658325195, "global_step": 59253, "epoch": 352} {"train_loss": -8.717750549316406, "global_step": 59254, "epoch": 352} {"train_loss": -8.620561599731445, "global_step": 59255, "epoch": 352} {"train_loss": -8.627298355102539, "global_step": 59256, "epoch": 352} {"train_loss": -8.739679336547852, "global_step": 59257, "epoch": 352} {"train_loss": -8.735176086425781, "global_step": 59258, "epoch": 352} {"train_loss": -8.430301666259766, "global_step": 59259, "epoch": 352} {"train_loss": -8.60605239868164, "global_step": 59260, "epoch": 352} {"train_loss": -8.341814041137695, "global_step": 59261, "epoch": 352} {"train_loss": -8.58942985534668, "global_step": 59262, "epoch": 352} {"train_loss": -8.58740234375, "global_step": 59263, "epoch": 352} {"train_loss": -8.248600959777832, "global_step": 59264, "epoch": 352} {"train_loss": -8.70753288269043, "global_step": 59265, "epoch": 352} {"train_loss": -8.578827857971191, "global_step": 59266, "epoch": 352} {"train_loss": -8.582870483398438, "global_step": 59267, "epoch": 352} {"train_loss": -8.746976852416992, "global_step": 59268, "epoch": 352} {"train_loss": -8.654365539550781, "global_step": 59269, "epoch": 352} {"train_loss": -8.703079223632812, "global_step": 59270, "epoch": 352} {"train_loss": -8.68338394165039, "global_step": 59271, "epoch": 352} {"train_loss": -8.822810173034668, "global_step": 59272, "epoch": 352} {"train_loss": -8.570634841918945, "global_step": 59273, "epoch": 352} {"train_loss": -8.880183219909668, "global_step": 59274, "epoch": 352} {"train_loss": -8.65420913696289, "global_step": 59275, "epoch": 352} {"train_loss": -8.702957153320312, "global_step": 59276, "epoch": 352} {"train_loss": -8.406023025512695, "global_step": 59277, "epoch": 352} {"train_loss": -8.632155418395996, "global_step": 59278, "epoch": 352} {"train_loss": -8.59896469116211, "global_step": 59279, "epoch": 352} {"train_loss": -8.343082427978516, "global_step": 59280, "epoch": 352} {"train_loss": -8.579489707946777, "global_step": 59281, "epoch": 352} {"train_loss": -8.809377670288086, "global_step": 59282, "epoch": 352} {"train_loss": -8.522214889526367, "global_step": 59283, "epoch": 352} {"train_loss": -8.70663833618164, "global_step": 59284, "epoch": 352} {"train_loss": -8.37582015991211, "global_step": 59285, "epoch": 352} {"train_loss": -8.796441078186035, "global_step": 59286, "epoch": 352} {"train_loss": -8.398874282836914, "global_step": 59287, "epoch": 352} {"train_loss": -8.394136428833008, "global_step": 59288, "epoch": 352} {"train_loss": -8.783266067504883, "global_step": 59289, "epoch": 352} {"train_loss": -8.186195373535156, "global_step": 59290, "epoch": 352} {"train_loss": -8.598196983337402, "global_step": 59291, "epoch": 352} {"train_loss": -8.458748817443848, "global_step": 59292, "epoch": 352} {"train_loss": -8.584280014038086, "global_step": 59293, "epoch": 352} {"train_loss": -8.281511306762695, "global_step": 59294, "epoch": 352} {"train_loss": -8.721814155578613, "global_step": 59295, "epoch": 352} {"train_loss": -8.613627433776855, "global_step": 59296, "epoch": 352} {"train_loss": -8.617908477783203, "global_step": 59297, "epoch": 352} {"train_loss": -8.353681564331055, "global_step": 59298, "epoch": 352} {"train_loss": -8.668096542358398, "global_step": 59299, "epoch": 352} {"train_loss": -8.436806678771973, "global_step": 59300, "epoch": 352} {"train_loss": -8.709300994873047, "global_step": 59301, "epoch": 352} {"train_loss": -8.509324073791504, "global_step": 59302, "epoch": 352} {"train_loss": -8.598883946736654, "global_step": 59303, "epoch": 352, "val_loss": 193937.984375} {"train_loss": -8.64587688446045, "global_step": 59304, "epoch": 353} {"train_loss": -8.51668643951416, "global_step": 59305, "epoch": 353} {"train_loss": -8.460468292236328, "global_step": 59306, "epoch": 353} {"train_loss": -8.498844146728516, "global_step": 59307, "epoch": 353} {"train_loss": -8.488417625427246, "global_step": 59308, "epoch": 353} {"train_loss": -8.534036636352539, "global_step": 59309, "epoch": 353} {"train_loss": -8.54300308227539, "global_step": 59310, "epoch": 353} {"train_loss": -8.436487197875977, "global_step": 59311, "epoch": 353} {"train_loss": -8.44554615020752, "global_step": 59312, "epoch": 353} {"train_loss": -8.360494613647461, "global_step": 59313, "epoch": 353} {"train_loss": -8.529923439025879, "global_step": 59314, "epoch": 353} {"train_loss": -8.614047050476074, "global_step": 59315, "epoch": 353} {"train_loss": -8.547595977783203, "global_step": 59316, "epoch": 353} {"train_loss": -8.408194541931152, "global_step": 59317, "epoch": 353} {"train_loss": -8.578258514404297, "global_step": 59318, "epoch": 353} {"train_loss": -8.485147476196289, "global_step": 59319, "epoch": 353} {"train_loss": -8.114706993103027, "global_step": 59320, "epoch": 353} {"train_loss": -8.507822036743164, "global_step": 59321, "epoch": 353} {"train_loss": -8.342643737792969, "global_step": 59322, "epoch": 353} {"train_loss": -8.368431091308594, "global_step": 59323, "epoch": 353} {"train_loss": -8.683560371398926, "global_step": 59324, "epoch": 353} {"train_loss": -8.61850357055664, "global_step": 59325, "epoch": 353} {"train_loss": -8.783130645751953, "global_step": 59326, "epoch": 353} {"train_loss": -8.667972564697266, "global_step": 59327, "epoch": 353} {"train_loss": -8.709285736083984, "global_step": 59328, "epoch": 353} {"train_loss": -8.762791633605957, "global_step": 59329, "epoch": 353} {"train_loss": -8.629983901977539, "global_step": 59330, "epoch": 353} {"train_loss": -8.637109756469727, "global_step": 59331, "epoch": 353} {"train_loss": -8.577387809753418, "global_step": 59332, "epoch": 353} {"train_loss": -8.574117660522461, "global_step": 59333, "epoch": 353} {"train_loss": -8.587411880493164, "global_step": 59334, "epoch": 353} {"train_loss": -8.70156192779541, "global_step": 59335, "epoch": 353} {"train_loss": -8.737934112548828, "global_step": 59336, "epoch": 353} {"train_loss": -8.640586853027344, "global_step": 59337, "epoch": 353} {"train_loss": -8.717912673950195, "global_step": 59338, "epoch": 353} {"train_loss": -8.715449333190918, "global_step": 59339, "epoch": 353} {"train_loss": -8.732754707336426, "global_step": 59340, "epoch": 353} {"train_loss": -8.771732330322266, "global_step": 59341, "epoch": 353} {"train_loss": -8.58012866973877, "global_step": 59342, "epoch": 353} {"train_loss": -8.729619026184082, "global_step": 59343, "epoch": 353} {"train_loss": -8.588526725769043, "global_step": 59344, "epoch": 353} {"train_loss": -8.419658660888672, "global_step": 59345, "epoch": 353} {"train_loss": -8.644841194152832, "global_step": 59346, "epoch": 353} {"train_loss": -8.287885665893555, "global_step": 59347, "epoch": 353} {"train_loss": -8.484820365905762, "global_step": 59348, "epoch": 353} {"train_loss": -8.506786346435547, "global_step": 59349, "epoch": 353} {"train_loss": -8.78171443939209, "global_step": 59350, "epoch": 353} {"train_loss": -8.337411880493164, "global_step": 59351, "epoch": 353} {"train_loss": -8.438447952270508, "global_step": 59352, "epoch": 353} {"train_loss": -8.528717994689941, "global_step": 59353, "epoch": 353} {"train_loss": -7.983805179595947, "global_step": 59354, "epoch": 353} {"train_loss": -8.516618728637695, "global_step": 59355, "epoch": 353} {"train_loss": -8.135835647583008, "global_step": 59356, "epoch": 353} {"train_loss": -8.415693283081055, "global_step": 59357, "epoch": 353} {"train_loss": -8.195186614990234, "global_step": 59358, "epoch": 353} {"train_loss": -8.376670837402344, "global_step": 59359, "epoch": 353} {"train_loss": -8.304555892944336, "global_step": 59360, "epoch": 353} {"train_loss": -8.315363883972168, "global_step": 59361, "epoch": 353} {"train_loss": -8.368667602539062, "global_step": 59362, "epoch": 353} {"train_loss": -8.2535400390625, "global_step": 59363, "epoch": 353} {"train_loss": -8.298851013183594, "global_step": 59364, "epoch": 353} {"train_loss": -8.406349182128906, "global_step": 59365, "epoch": 353} {"train_loss": -8.45943546295166, "global_step": 59366, "epoch": 353} {"train_loss": -8.205412864685059, "global_step": 59367, "epoch": 353} {"train_loss": -8.645496368408203, "global_step": 59368, "epoch": 353} {"train_loss": -8.646090507507324, "global_step": 59369, "epoch": 353} {"train_loss": -8.407464981079102, "global_step": 59370, "epoch": 353} {"train_loss": -8.646707534790039, "global_step": 59371, "epoch": 353} {"train_loss": -8.537153244018555, "global_step": 59372, "epoch": 353} {"train_loss": -8.47572135925293, "global_step": 59373, "epoch": 353} {"train_loss": -8.501309394836426, "global_step": 59374, "epoch": 353} {"train_loss": -8.493278503417969, "global_step": 59375, "epoch": 353} {"train_loss": -8.758919715881348, "global_step": 59376, "epoch": 353} {"train_loss": -8.705963134765625, "global_step": 59377, "epoch": 353} {"train_loss": -8.583821296691895, "global_step": 59378, "epoch": 353} {"train_loss": -8.527297973632812, "global_step": 59379, "epoch": 353} {"train_loss": -8.611345291137695, "global_step": 59380, "epoch": 353} {"train_loss": -8.494697570800781, "global_step": 59381, "epoch": 353} {"train_loss": -8.619159698486328, "global_step": 59382, "epoch": 353} {"train_loss": -8.613146781921387, "global_step": 59383, "epoch": 353} {"train_loss": -8.604303359985352, "global_step": 59384, "epoch": 353} {"train_loss": -8.483365058898926, "global_step": 59385, "epoch": 353} {"train_loss": -8.85462474822998, "global_step": 59386, "epoch": 353} {"train_loss": -8.675140380859375, "global_step": 59387, "epoch": 353} {"train_loss": -8.54330825805664, "global_step": 59388, "epoch": 353} {"train_loss": -8.794776916503906, "global_step": 59389, "epoch": 353} {"train_loss": -8.657018661499023, "global_step": 59390, "epoch": 353} {"train_loss": -8.797760009765625, "global_step": 59391, "epoch": 353} {"train_loss": -8.477680206298828, "global_step": 59392, "epoch": 353} {"train_loss": -8.964277267456055, "global_step": 59393, "epoch": 353} {"train_loss": -8.416009902954102, "global_step": 59394, "epoch": 353} {"train_loss": -8.515864372253418, "global_step": 59395, "epoch": 353} {"train_loss": -8.540114402770996, "global_step": 59396, "epoch": 353} {"train_loss": -8.316908836364746, "global_step": 59397, "epoch": 353} {"train_loss": -8.328178405761719, "global_step": 59398, "epoch": 353} {"train_loss": -8.29503059387207, "global_step": 59399, "epoch": 353} {"train_loss": -8.487966537475586, "global_step": 59400, "epoch": 353} {"train_loss": -8.431852340698242, "global_step": 59401, "epoch": 353} {"train_loss": -8.530710220336914, "global_step": 59402, "epoch": 353} {"train_loss": -8.200387001037598, "global_step": 59403, "epoch": 353} {"train_loss": -8.451396942138672, "global_step": 59404, "epoch": 353} {"train_loss": -8.298151016235352, "global_step": 59405, "epoch": 353} {"train_loss": -8.318682670593262, "global_step": 59406, "epoch": 353} {"train_loss": -8.090536117553711, "global_step": 59407, "epoch": 353} {"train_loss": -8.332449913024902, "global_step": 59408, "epoch": 353} {"train_loss": -8.392838478088379, "global_step": 59409, "epoch": 353} {"train_loss": -8.601007461547852, "global_step": 59410, "epoch": 353} {"train_loss": -8.565852165222168, "global_step": 59411, "epoch": 353} {"train_loss": -8.406254768371582, "global_step": 59412, "epoch": 353} {"train_loss": -8.283580780029297, "global_step": 59413, "epoch": 353} {"train_loss": -8.420978546142578, "global_step": 59414, "epoch": 353} {"train_loss": -8.539710998535156, "global_step": 59415, "epoch": 353} {"train_loss": -8.32432746887207, "global_step": 59416, "epoch": 353} {"train_loss": -8.39310359954834, "global_step": 59417, "epoch": 353} {"train_loss": -8.497785568237305, "global_step": 59418, "epoch": 353} {"train_loss": -8.733709335327148, "global_step": 59419, "epoch": 353} {"train_loss": -8.362218856811523, "global_step": 59420, "epoch": 353} {"train_loss": -8.50813102722168, "global_step": 59421, "epoch": 353} {"train_loss": -8.757759094238281, "global_step": 59422, "epoch": 353} {"train_loss": -8.496672630310059, "global_step": 59423, "epoch": 353} {"train_loss": -8.579548835754395, "global_step": 59424, "epoch": 353} {"train_loss": -8.627954483032227, "global_step": 59425, "epoch": 353} {"train_loss": -8.669197082519531, "global_step": 59426, "epoch": 353} {"train_loss": -8.444822311401367, "global_step": 59427, "epoch": 353} {"train_loss": -8.601081848144531, "global_step": 59428, "epoch": 353} {"train_loss": -8.484867095947266, "global_step": 59429, "epoch": 353} {"train_loss": -8.698260307312012, "global_step": 59430, "epoch": 353} {"train_loss": -8.459041595458984, "global_step": 59431, "epoch": 353} {"train_loss": -8.857890129089355, "global_step": 59432, "epoch": 353} {"train_loss": -8.499494552612305, "global_step": 59433, "epoch": 353} {"train_loss": -8.782476425170898, "global_step": 59434, "epoch": 353} {"train_loss": -8.717657089233398, "global_step": 59435, "epoch": 353} {"train_loss": -8.792317390441895, "global_step": 59436, "epoch": 353} {"train_loss": -8.739034652709961, "global_step": 59437, "epoch": 353} {"train_loss": -8.878789901733398, "global_step": 59438, "epoch": 353} {"train_loss": -8.507227897644043, "global_step": 59439, "epoch": 353} {"train_loss": -8.702179908752441, "global_step": 59440, "epoch": 353} {"train_loss": -8.750993728637695, "global_step": 59441, "epoch": 353} {"train_loss": -8.836045265197754, "global_step": 59442, "epoch": 353} {"train_loss": -8.699118614196777, "global_step": 59443, "epoch": 353} {"train_loss": -8.590429306030273, "global_step": 59444, "epoch": 353} {"train_loss": -8.794384002685547, "global_step": 59445, "epoch": 353} {"train_loss": -8.560859680175781, "global_step": 59446, "epoch": 353} {"train_loss": -8.516870498657227, "global_step": 59447, "epoch": 353} {"train_loss": -8.469282150268555, "global_step": 59448, "epoch": 353} {"train_loss": -8.721273422241211, "global_step": 59449, "epoch": 353} {"train_loss": -8.74038314819336, "global_step": 59450, "epoch": 353} {"train_loss": -8.532472610473633, "global_step": 59451, "epoch": 353} {"train_loss": -8.370597839355469, "global_step": 59452, "epoch": 353} {"train_loss": -8.74606704711914, "global_step": 59453, "epoch": 353} {"train_loss": -8.442026138305664, "global_step": 59454, "epoch": 353} {"train_loss": -8.529452323913574, "global_step": 59455, "epoch": 353} {"train_loss": -8.374839782714844, "global_step": 59456, "epoch": 353} {"train_loss": -8.539902687072754, "global_step": 59457, "epoch": 353} {"train_loss": -8.375579833984375, "global_step": 59458, "epoch": 353} {"train_loss": -8.48493480682373, "global_step": 59459, "epoch": 353} {"train_loss": -8.386127471923828, "global_step": 59460, "epoch": 353} {"train_loss": -8.475576400756836, "global_step": 59461, "epoch": 353} {"train_loss": -8.581228256225586, "global_step": 59462, "epoch": 353} {"train_loss": -8.440402030944824, "global_step": 59463, "epoch": 353} {"train_loss": -8.725690841674805, "global_step": 59464, "epoch": 353} {"train_loss": -8.430490493774414, "global_step": 59465, "epoch": 353} {"train_loss": -8.462909698486328, "global_step": 59466, "epoch": 353} {"train_loss": -8.462152481079102, "global_step": 59467, "epoch": 353} {"train_loss": -8.444795608520508, "global_step": 59468, "epoch": 353} {"train_loss": -8.615720748901367, "global_step": 59469, "epoch": 353} {"train_loss": -8.378352165222168, "global_step": 59470, "epoch": 353} {"train_loss": -8.533176294394902, "global_step": 59471, "epoch": 353, "val_loss": 190872.90625} {"train_loss": -8.533611297607422, "global_step": 59472, "epoch": 354} {"train_loss": -8.500104904174805, "global_step": 59473, "epoch": 354} {"train_loss": -8.430116653442383, "global_step": 59474, "epoch": 354} {"train_loss": -8.685593605041504, "global_step": 59475, "epoch": 354} {"train_loss": -8.324481964111328, "global_step": 59476, "epoch": 354} {"train_loss": -8.64283561706543, "global_step": 59477, "epoch": 354} {"train_loss": -8.46987533569336, "global_step": 59478, "epoch": 354} {"train_loss": -8.57675552368164, "global_step": 59479, "epoch": 354} {"train_loss": -8.438992500305176, "global_step": 59480, "epoch": 354} {"train_loss": -8.65682315826416, "global_step": 59481, "epoch": 354} {"train_loss": -8.614648818969727, "global_step": 59482, "epoch": 354} {"train_loss": -8.38522720336914, "global_step": 59483, "epoch": 354} {"train_loss": -8.507979393005371, "global_step": 59484, "epoch": 354} {"train_loss": -8.326831817626953, "global_step": 59485, "epoch": 354} {"train_loss": -8.25627613067627, "global_step": 59486, "epoch": 354} {"train_loss": -8.40783977508545, "global_step": 59487, "epoch": 354} {"train_loss": -8.341314315795898, "global_step": 59488, "epoch": 354} {"train_loss": -8.622922897338867, "global_step": 59489, "epoch": 354} {"train_loss": -8.667099952697754, "global_step": 59490, "epoch": 354} {"train_loss": -8.311357498168945, "global_step": 59491, "epoch": 354} {"train_loss": -8.581315994262695, "global_step": 59492, "epoch": 354} {"train_loss": -8.579216957092285, "global_step": 59493, "epoch": 354} {"train_loss": -8.813172340393066, "global_step": 59494, "epoch": 354} {"train_loss": -8.6272554397583, "global_step": 59495, "epoch": 354} {"train_loss": -8.528868675231934, "global_step": 59496, "epoch": 354} {"train_loss": -8.641644477844238, "global_step": 59497, "epoch": 354} {"train_loss": -8.942422866821289, "global_step": 59498, "epoch": 354} {"train_loss": -8.611495018005371, "global_step": 59499, "epoch": 354} {"train_loss": -8.562356948852539, "global_step": 59500, "epoch": 354} {"train_loss": -8.560711860656738, "global_step": 59501, "epoch": 354} {"train_loss": -8.73917293548584, "global_step": 59502, "epoch": 354} {"train_loss": -8.665952682495117, "global_step": 59503, "epoch": 354} {"train_loss": -8.808578491210938, "global_step": 59504, "epoch": 354} {"train_loss": -8.630517959594727, "global_step": 59505, "epoch": 354} {"train_loss": -8.485122680664062, "global_step": 59506, "epoch": 354} {"train_loss": -8.698423385620117, "global_step": 59507, "epoch": 354} {"train_loss": -8.818147659301758, "global_step": 59508, "epoch": 354} {"train_loss": -8.585391998291016, "global_step": 59509, "epoch": 354} {"train_loss": -8.090452194213867, "global_step": 59510, "epoch": 354} {"train_loss": -8.711236953735352, "global_step": 59511, "epoch": 354} {"train_loss": -8.425701141357422, "global_step": 59512, "epoch": 354} {"train_loss": -8.225239753723145, "global_step": 59513, "epoch": 354} {"train_loss": -8.249025344848633, "global_step": 59514, "epoch": 354} {"train_loss": -8.533966064453125, "global_step": 59515, "epoch": 354} {"train_loss": -8.59450912475586, "global_step": 59516, "epoch": 354} {"train_loss": -8.443294525146484, "global_step": 59517, "epoch": 354} {"train_loss": -8.773147583007812, "global_step": 59518, "epoch": 354} {"train_loss": -8.779739379882812, "global_step": 59519, "epoch": 354} {"train_loss": -8.357037544250488, "global_step": 59520, "epoch": 354} {"train_loss": -8.720272064208984, "global_step": 59521, "epoch": 354} {"train_loss": -8.622298240661621, "global_step": 59522, "epoch": 354} {"train_loss": -8.516793251037598, "global_step": 59523, "epoch": 354} {"train_loss": -8.912158012390137, "global_step": 59524, "epoch": 354} {"train_loss": -8.746516227722168, "global_step": 59525, "epoch": 354} {"train_loss": -8.666831016540527, "global_step": 59526, "epoch": 354} {"train_loss": -8.413179397583008, "global_step": 59527, "epoch": 354} {"train_loss": -8.827227592468262, "global_step": 59528, "epoch": 354} {"train_loss": -8.493389129638672, "global_step": 59529, "epoch": 354} {"train_loss": -8.684612274169922, "global_step": 59530, "epoch": 354} {"train_loss": -8.67738151550293, "global_step": 59531, "epoch": 354} {"train_loss": -8.713854789733887, "global_step": 59532, "epoch": 354} {"train_loss": -8.68891429901123, "global_step": 59533, "epoch": 354} {"train_loss": -8.676737785339355, "global_step": 59534, "epoch": 354} {"train_loss": -8.61905288696289, "global_step": 59535, "epoch": 354} {"train_loss": -8.60191822052002, "global_step": 59536, "epoch": 354} {"train_loss": -8.495105743408203, "global_step": 59537, "epoch": 354} {"train_loss": -8.52412223815918, "global_step": 59538, "epoch": 354} {"train_loss": -8.538492202758789, "global_step": 59539, "epoch": 354} {"train_loss": -8.819074630737305, "global_step": 59540, "epoch": 354} {"train_loss": -8.447708129882812, "global_step": 59541, "epoch": 354} {"train_loss": -8.885444641113281, "global_step": 59542, "epoch": 354} {"train_loss": -8.53676986694336, "global_step": 59543, "epoch": 354} {"train_loss": -8.771346092224121, "global_step": 59544, "epoch": 354} {"train_loss": -8.96888542175293, "global_step": 59545, "epoch": 354} {"train_loss": -8.745182037353516, "global_step": 59546, "epoch": 354} {"train_loss": -8.751056671142578, "global_step": 59547, "epoch": 354} {"train_loss": -8.619967460632324, "global_step": 59548, "epoch": 354} {"train_loss": -8.75528335571289, "global_step": 59549, "epoch": 354} {"train_loss": -8.829085350036621, "global_step": 59550, "epoch": 354} {"train_loss": -8.742050170898438, "global_step": 59551, "epoch": 354} {"train_loss": -8.92116928100586, "global_step": 59552, "epoch": 354} {"train_loss": -8.40328598022461, "global_step": 59553, "epoch": 354} {"train_loss": -8.657951354980469, "global_step": 59554, "epoch": 354} {"train_loss": -8.821645736694336, "global_step": 59555, "epoch": 354} {"train_loss": -8.563141822814941, "global_step": 59556, "epoch": 354} {"train_loss": -8.735674858093262, "global_step": 59557, "epoch": 354} {"train_loss": -8.61203384399414, "global_step": 59558, "epoch": 354} {"train_loss": -8.564315795898438, "global_step": 59559, "epoch": 354} {"train_loss": -8.655374526977539, "global_step": 59560, "epoch": 354} {"train_loss": -8.61506462097168, "global_step": 59561, "epoch": 354} {"train_loss": -8.800243377685547, "global_step": 59562, "epoch": 354} {"train_loss": -8.787412643432617, "global_step": 59563, "epoch": 354} {"train_loss": -8.90115737915039, "global_step": 59564, "epoch": 354} {"train_loss": -8.543886184692383, "global_step": 59565, "epoch": 354} {"train_loss": -8.9457426071167, "global_step": 59566, "epoch": 354} {"train_loss": -8.56938648223877, "global_step": 59567, "epoch": 354} {"train_loss": -8.660200119018555, "global_step": 59568, "epoch": 354} {"train_loss": -8.781696319580078, "global_step": 59569, "epoch": 354} {"train_loss": -8.683889389038086, "global_step": 59570, "epoch": 354} {"train_loss": -8.522237777709961, "global_step": 59571, "epoch": 354} {"train_loss": -8.310811042785645, "global_step": 59572, "epoch": 354} {"train_loss": -8.450562477111816, "global_step": 59573, "epoch": 354} {"train_loss": -8.553674697875977, "global_step": 59574, "epoch": 354} {"train_loss": -8.405184745788574, "global_step": 59575, "epoch": 354} {"train_loss": -8.603809356689453, "global_step": 59576, "epoch": 354} {"train_loss": -8.454046249389648, "global_step": 59577, "epoch": 354} {"train_loss": -8.510274887084961, "global_step": 59578, "epoch": 354} {"train_loss": -8.453657150268555, "global_step": 59579, "epoch": 354} {"train_loss": -8.637743949890137, "global_step": 59580, "epoch": 354} {"train_loss": -8.624919891357422, "global_step": 59581, "epoch": 354} {"train_loss": -8.676921844482422, "global_step": 59582, "epoch": 354} {"train_loss": -8.624345779418945, "global_step": 59583, "epoch": 354} {"train_loss": -8.602347373962402, "global_step": 59584, "epoch": 354} {"train_loss": -8.61235237121582, "global_step": 59585, "epoch": 354} {"train_loss": -8.947476387023926, "global_step": 59586, "epoch": 354} {"train_loss": -8.651162147521973, "global_step": 59587, "epoch": 354} {"train_loss": -8.700749397277832, "global_step": 59588, "epoch": 354} {"train_loss": -8.543134689331055, "global_step": 59589, "epoch": 354} {"train_loss": -8.637609481811523, "global_step": 59590, "epoch": 354} {"train_loss": -8.831489562988281, "global_step": 59591, "epoch": 354} {"train_loss": -8.627561569213867, "global_step": 59592, "epoch": 354} {"train_loss": -8.6448392868042, "global_step": 59593, "epoch": 354} {"train_loss": -8.753902435302734, "global_step": 59594, "epoch": 354} {"train_loss": -8.50175666809082, "global_step": 59595, "epoch": 354} {"train_loss": -8.632381439208984, "global_step": 59596, "epoch": 354} {"train_loss": -8.434560775756836, "global_step": 59597, "epoch": 354} {"train_loss": -8.727165222167969, "global_step": 59598, "epoch": 354} {"train_loss": -8.623886108398438, "global_step": 59599, "epoch": 354} {"train_loss": -8.79343032836914, "global_step": 59600, "epoch": 354} {"train_loss": -8.584894180297852, "global_step": 59601, "epoch": 354} {"train_loss": -8.735269546508789, "global_step": 59602, "epoch": 354} {"train_loss": -8.646885871887207, "global_step": 59603, "epoch": 354} {"train_loss": -8.899314880371094, "global_step": 59604, "epoch": 354} {"train_loss": -8.70343017578125, "global_step": 59605, "epoch": 354} {"train_loss": -8.556133270263672, "global_step": 59606, "epoch": 354} {"train_loss": -8.785639762878418, "global_step": 59607, "epoch": 354} {"train_loss": -8.88001823425293, "global_step": 59608, "epoch": 354} {"train_loss": -8.651620864868164, "global_step": 59609, "epoch": 354} {"train_loss": -8.893747329711914, "global_step": 59610, "epoch": 354} {"train_loss": -8.799430847167969, "global_step": 59611, "epoch": 354} {"train_loss": -8.5216646194458, "global_step": 59612, "epoch": 354} {"train_loss": -8.83012866973877, "global_step": 59613, "epoch": 354} {"train_loss": -8.744630813598633, "global_step": 59614, "epoch": 354} {"train_loss": -8.107674598693848, "global_step": 59615, "epoch": 354} {"train_loss": -8.719968795776367, "global_step": 59616, "epoch": 354} {"train_loss": -8.223209381103516, "global_step": 59617, "epoch": 354} {"train_loss": -8.503495216369629, "global_step": 59618, "epoch": 354} {"train_loss": -8.59857177734375, "global_step": 59619, "epoch": 354} {"train_loss": -8.151436805725098, "global_step": 59620, "epoch": 354} {"train_loss": -8.395634651184082, "global_step": 59621, "epoch": 354} {"train_loss": -8.570658683776855, "global_step": 59622, "epoch": 354} {"train_loss": -8.348581314086914, "global_step": 59623, "epoch": 354} {"train_loss": -8.292510986328125, "global_step": 59624, "epoch": 354} {"train_loss": -8.423897743225098, "global_step": 59625, "epoch": 354} {"train_loss": -8.541070938110352, "global_step": 59626, "epoch": 354} {"train_loss": -8.569774627685547, "global_step": 59627, "epoch": 354} {"train_loss": -8.269390106201172, "global_step": 59628, "epoch": 354} {"train_loss": -8.563974380493164, "global_step": 59629, "epoch": 354} {"train_loss": -8.499540328979492, "global_step": 59630, "epoch": 354} {"train_loss": -8.457974433898926, "global_step": 59631, "epoch": 354} {"train_loss": -8.431987762451172, "global_step": 59632, "epoch": 354} {"train_loss": -8.449379920959473, "global_step": 59633, "epoch": 354} {"train_loss": -8.163714408874512, "global_step": 59634, "epoch": 354} {"train_loss": -8.525954246520996, "global_step": 59635, "epoch": 354} {"train_loss": -8.506874084472656, "global_step": 59636, "epoch": 354} {"train_loss": -8.46269702911377, "global_step": 59637, "epoch": 354} {"train_loss": -8.548901557922363, "global_step": 59638, "epoch": 354} {"train_loss": -8.595979469163078, "global_step": 59639, "epoch": 354, "val_loss": 189090.734375} {"train_loss": -8.56029987335205, "global_step": 59640, "epoch": 355} {"train_loss": -8.77306842803955, "global_step": 59641, "epoch": 355} {"train_loss": -8.691177368164062, "global_step": 59642, "epoch": 355} {"train_loss": -8.66613483428955, "global_step": 59643, "epoch": 355} {"train_loss": -8.664880752563477, "global_step": 59644, "epoch": 355} {"train_loss": -8.76710033416748, "global_step": 59645, "epoch": 355} {"train_loss": -8.716306686401367, "global_step": 59646, "epoch": 355} {"train_loss": -8.839569091796875, "global_step": 59647, "epoch": 355} {"train_loss": -8.733111381530762, "global_step": 59648, "epoch": 355} {"train_loss": -8.700851440429688, "global_step": 59649, "epoch": 355} {"train_loss": -8.968978881835938, "global_step": 59650, "epoch": 355} {"train_loss": -8.799352645874023, "global_step": 59651, "epoch": 355} {"train_loss": -8.867918014526367, "global_step": 59652, "epoch": 355} {"train_loss": -8.73808765411377, "global_step": 59653, "epoch": 355} {"train_loss": -8.67479133605957, "global_step": 59654, "epoch": 355} {"train_loss": -8.857551574707031, "global_step": 59655, "epoch": 355} {"train_loss": -8.46825122833252, "global_step": 59656, "epoch": 355} {"train_loss": -8.596799850463867, "global_step": 59657, "epoch": 355} {"train_loss": -8.627927780151367, "global_step": 59658, "epoch": 355} {"train_loss": -8.430255889892578, "global_step": 59659, "epoch": 355} {"train_loss": -8.431148529052734, "global_step": 59660, "epoch": 355} {"train_loss": -8.495352745056152, "global_step": 59661, "epoch": 355} {"train_loss": -8.733053207397461, "global_step": 59662, "epoch": 355} {"train_loss": -8.58900260925293, "global_step": 59663, "epoch": 355} {"train_loss": -8.412277221679688, "global_step": 59664, "epoch": 355} {"train_loss": -8.365921020507812, "global_step": 59665, "epoch": 355} {"train_loss": -8.475671768188477, "global_step": 59666, "epoch": 355} {"train_loss": -8.552356719970703, "global_step": 59667, "epoch": 355} {"train_loss": -8.711082458496094, "global_step": 59668, "epoch": 355} {"train_loss": -8.490087509155273, "global_step": 59669, "epoch": 355} {"train_loss": -8.70296859741211, "global_step": 59670, "epoch": 355} {"train_loss": -8.504343032836914, "global_step": 59671, "epoch": 355} {"train_loss": -8.750255584716797, "global_step": 59672, "epoch": 355} {"train_loss": -8.562522888183594, "global_step": 59673, "epoch": 355} {"train_loss": -8.69611930847168, "global_step": 59674, "epoch": 355} {"train_loss": -8.658823013305664, "global_step": 59675, "epoch": 355} {"train_loss": -8.805727005004883, "global_step": 59676, "epoch": 355} {"train_loss": -8.854731559753418, "global_step": 59677, "epoch": 355} {"train_loss": -8.533770561218262, "global_step": 59678, "epoch": 355} {"train_loss": -8.706441879272461, "global_step": 59679, "epoch": 355} {"train_loss": -8.661877632141113, "global_step": 59680, "epoch": 355} {"train_loss": -8.665796279907227, "global_step": 59681, "epoch": 355} {"train_loss": -8.80672836303711, "global_step": 59682, "epoch": 355} {"train_loss": -8.758637428283691, "global_step": 59683, "epoch": 355} {"train_loss": -8.838397979736328, "global_step": 59684, "epoch": 355} {"train_loss": -8.600767135620117, "global_step": 59685, "epoch": 355} {"train_loss": -8.813102722167969, "global_step": 59686, "epoch": 355} {"train_loss": -8.813425064086914, "global_step": 59687, "epoch": 355} {"train_loss": -8.499810218811035, "global_step": 59688, "epoch": 355} {"train_loss": -8.774182319641113, "global_step": 59689, "epoch": 355} {"train_loss": -8.477848052978516, "global_step": 59690, "epoch": 355} {"train_loss": -8.599512100219727, "global_step": 59691, "epoch": 355} {"train_loss": -8.584305763244629, "global_step": 59692, "epoch": 355} {"train_loss": -8.777902603149414, "global_step": 59693, "epoch": 355} {"train_loss": -8.574023246765137, "global_step": 59694, "epoch": 355} {"train_loss": -8.718400001525879, "global_step": 59695, "epoch": 355} {"train_loss": -8.51029109954834, "global_step": 59696, "epoch": 355} {"train_loss": -8.620320320129395, "global_step": 59697, "epoch": 355} {"train_loss": -8.728001594543457, "global_step": 59698, "epoch": 355} {"train_loss": -8.513747215270996, "global_step": 59699, "epoch": 355} {"train_loss": -8.512239456176758, "global_step": 59700, "epoch": 355} {"train_loss": -8.463446617126465, "global_step": 59701, "epoch": 355} {"train_loss": -8.490777969360352, "global_step": 59702, "epoch": 355} {"train_loss": -8.571060180664062, "global_step": 59703, "epoch": 355} {"train_loss": -8.764835357666016, "global_step": 59704, "epoch": 355} {"train_loss": -8.515987396240234, "global_step": 59705, "epoch": 355} {"train_loss": -8.752716064453125, "global_step": 59706, "epoch": 355} {"train_loss": -8.658198356628418, "global_step": 59707, "epoch": 355} {"train_loss": -8.751258850097656, "global_step": 59708, "epoch": 355} {"train_loss": -8.74477767944336, "global_step": 59709, "epoch": 355} {"train_loss": -8.684148788452148, "global_step": 59710, "epoch": 355} {"train_loss": -8.693931579589844, "global_step": 59711, "epoch": 355} {"train_loss": -8.6022367477417, "global_step": 59712, "epoch": 355} {"train_loss": -8.685277938842773, "global_step": 59713, "epoch": 355} {"train_loss": -8.662788391113281, "global_step": 59714, "epoch": 355} {"train_loss": -8.696277618408203, "global_step": 59715, "epoch": 355} {"train_loss": -8.599405288696289, "global_step": 59716, "epoch": 355} {"train_loss": -8.503456115722656, "global_step": 59717, "epoch": 355} {"train_loss": -8.683673858642578, "global_step": 59718, "epoch": 355} {"train_loss": -8.667448997497559, "global_step": 59719, "epoch": 355} {"train_loss": -8.607343673706055, "global_step": 59720, "epoch": 355} {"train_loss": -8.857887268066406, "global_step": 59721, "epoch": 355} {"train_loss": -8.630475997924805, "global_step": 59722, "epoch": 355} {"train_loss": -8.680952072143555, "global_step": 59723, "epoch": 355} {"train_loss": -8.749860763549805, "global_step": 59724, "epoch": 355} {"train_loss": -8.733182907104492, "global_step": 59725, "epoch": 355} {"train_loss": -8.631589889526367, "global_step": 59726, "epoch": 355} {"train_loss": -8.488054275512695, "global_step": 59727, "epoch": 355} {"train_loss": -8.671184539794922, "global_step": 59728, "epoch": 355} {"train_loss": -8.699908256530762, "global_step": 59729, "epoch": 355} {"train_loss": -8.688447952270508, "global_step": 59730, "epoch": 355} {"train_loss": -8.827251434326172, "global_step": 59731, "epoch": 355} {"train_loss": -8.780738830566406, "global_step": 59732, "epoch": 355} {"train_loss": -8.52812385559082, "global_step": 59733, "epoch": 355} {"train_loss": -8.798381805419922, "global_step": 59734, "epoch": 355} {"train_loss": -8.557967185974121, "global_step": 59735, "epoch": 355} {"train_loss": -8.6123046875, "global_step": 59736, "epoch": 355} {"train_loss": -8.790586471557617, "global_step": 59737, "epoch": 355} {"train_loss": -8.686439514160156, "global_step": 59738, "epoch": 355} {"train_loss": -8.476661682128906, "global_step": 59739, "epoch": 355} {"train_loss": -8.546279907226562, "global_step": 59740, "epoch": 355} {"train_loss": -8.54561996459961, "global_step": 59741, "epoch": 355} {"train_loss": -8.768416404724121, "global_step": 59742, "epoch": 355} {"train_loss": -8.626789093017578, "global_step": 59743, "epoch": 355} {"train_loss": -8.814831733703613, "global_step": 59744, "epoch": 355} {"train_loss": -8.609088897705078, "global_step": 59745, "epoch": 355} {"train_loss": -8.786981582641602, "global_step": 59746, "epoch": 355} {"train_loss": -8.586084365844727, "global_step": 59747, "epoch": 355} {"train_loss": -8.770435333251953, "global_step": 59748, "epoch": 355} {"train_loss": -8.640214920043945, "global_step": 59749, "epoch": 355} {"train_loss": -8.86515998840332, "global_step": 59750, "epoch": 355} {"train_loss": -8.729122161865234, "global_step": 59751, "epoch": 355} {"train_loss": -8.723711967468262, "global_step": 59752, "epoch": 355} {"train_loss": -8.729978561401367, "global_step": 59753, "epoch": 355} {"train_loss": -8.76941204071045, "global_step": 59754, "epoch": 355} {"train_loss": -8.745685577392578, "global_step": 59755, "epoch": 355} {"train_loss": -8.964887619018555, "global_step": 59756, "epoch": 355} {"train_loss": -8.483686447143555, "global_step": 59757, "epoch": 355} {"train_loss": -8.871407508850098, "global_step": 59758, "epoch": 355} {"train_loss": -8.84797477722168, "global_step": 59759, "epoch": 355} {"train_loss": -8.784952163696289, "global_step": 59760, "epoch": 355} {"train_loss": -8.710543632507324, "global_step": 59761, "epoch": 355} {"train_loss": -8.827232360839844, "global_step": 59762, "epoch": 355} {"train_loss": -8.621831893920898, "global_step": 59763, "epoch": 355} {"train_loss": -8.875081062316895, "global_step": 59764, "epoch": 355} {"train_loss": -8.707401275634766, "global_step": 59765, "epoch": 355} {"train_loss": -8.776968955993652, "global_step": 59766, "epoch": 355} {"train_loss": -8.82526969909668, "global_step": 59767, "epoch": 355} {"train_loss": -8.507625579833984, "global_step": 59768, "epoch": 355} {"train_loss": -8.631799697875977, "global_step": 59769, "epoch": 355} {"train_loss": -8.844381332397461, "global_step": 59770, "epoch": 355} {"train_loss": -8.633668899536133, "global_step": 59771, "epoch": 355} {"train_loss": -8.543597221374512, "global_step": 59772, "epoch": 355} {"train_loss": -8.742085456848145, "global_step": 59773, "epoch": 355} {"train_loss": -8.71528148651123, "global_step": 59774, "epoch": 355} {"train_loss": -8.551390647888184, "global_step": 59775, "epoch": 355} {"train_loss": -8.811519622802734, "global_step": 59776, "epoch": 355} {"train_loss": -8.481362342834473, "global_step": 59777, "epoch": 355} {"train_loss": -8.571274757385254, "global_step": 59778, "epoch": 355} {"train_loss": -8.700773239135742, "global_step": 59779, "epoch": 355} {"train_loss": -8.583062171936035, "global_step": 59780, "epoch": 355} {"train_loss": -8.48847484588623, "global_step": 59781, "epoch": 355} {"train_loss": -8.55864429473877, "global_step": 59782, "epoch": 355} {"train_loss": -8.41970443725586, "global_step": 59783, "epoch": 355} {"train_loss": -8.344049453735352, "global_step": 59784, "epoch": 355} {"train_loss": -8.729799270629883, "global_step": 59785, "epoch": 355} {"train_loss": -8.719907760620117, "global_step": 59786, "epoch": 355} {"train_loss": -8.66031265258789, "global_step": 59787, "epoch": 355} {"train_loss": -8.674433708190918, "global_step": 59788, "epoch": 355} {"train_loss": -8.82246208190918, "global_step": 59789, "epoch": 355} {"train_loss": -8.49409294128418, "global_step": 59790, "epoch": 355} {"train_loss": -8.796630859375, "global_step": 59791, "epoch": 355} {"train_loss": -8.454398155212402, "global_step": 59792, "epoch": 355} {"train_loss": -8.787481307983398, "global_step": 59793, "epoch": 355} {"train_loss": -8.76384162902832, "global_step": 59794, "epoch": 355} {"train_loss": -8.652681350708008, "global_step": 59795, "epoch": 355} {"train_loss": -8.651491165161133, "global_step": 59796, "epoch": 355} {"train_loss": -8.894845008850098, "global_step": 59797, "epoch": 355} {"train_loss": -8.589700698852539, "global_step": 59798, "epoch": 355} {"train_loss": -8.803445816040039, "global_step": 59799, "epoch": 355} {"train_loss": -8.665329933166504, "global_step": 59800, "epoch": 355} {"train_loss": -8.683612823486328, "global_step": 59801, "epoch": 355} {"train_loss": -8.444099426269531, "global_step": 59802, "epoch": 355} {"train_loss": -8.828764915466309, "global_step": 59803, "epoch": 355} {"train_loss": -8.47309684753418, "global_step": 59804, "epoch": 355} {"train_loss": -8.606075286865234, "global_step": 59805, "epoch": 355} {"train_loss": -8.433027267456055, "global_step": 59806, "epoch": 355} {"train_loss": -8.663179970922924, "global_step": 59807, "epoch": 355, "val_loss": 192161.21875, "train_action_mse_error": 11.188383102416992} {"train_loss": -8.35632610321045, "global_step": 59808, "epoch": 356} {"train_loss": -8.716198921203613, "global_step": 59809, "epoch": 356} {"train_loss": -8.597171783447266, "global_step": 59810, "epoch": 356} {"train_loss": -8.569375991821289, "global_step": 59811, "epoch": 356} {"train_loss": -8.475543975830078, "global_step": 59812, "epoch": 356} {"train_loss": -8.616598129272461, "global_step": 59813, "epoch": 356} {"train_loss": -8.669551849365234, "global_step": 59814, "epoch": 356} {"train_loss": -8.397903442382812, "global_step": 59815, "epoch": 356} {"train_loss": -8.796586990356445, "global_step": 59816, "epoch": 356} {"train_loss": -8.432039260864258, "global_step": 59817, "epoch": 356} {"train_loss": -8.46040153503418, "global_step": 59818, "epoch": 356} {"train_loss": -8.618236541748047, "global_step": 59819, "epoch": 356} {"train_loss": -8.834634780883789, "global_step": 59820, "epoch": 356} {"train_loss": -8.521892547607422, "global_step": 59821, "epoch": 356} {"train_loss": -8.674245834350586, "global_step": 59822, "epoch": 356} {"train_loss": -8.781245231628418, "global_step": 59823, "epoch": 356} {"train_loss": -8.557235717773438, "global_step": 59824, "epoch": 356} {"train_loss": -8.613105773925781, "global_step": 59825, "epoch": 356} {"train_loss": -8.830375671386719, "global_step": 59826, "epoch": 356} {"train_loss": -8.5330810546875, "global_step": 59827, "epoch": 356} {"train_loss": -8.716580390930176, "global_step": 59828, "epoch": 356} {"train_loss": -8.744449615478516, "global_step": 59829, "epoch": 356} {"train_loss": -8.559732437133789, "global_step": 59830, "epoch": 356} {"train_loss": -8.654476165771484, "global_step": 59831, "epoch": 356} {"train_loss": -8.919198989868164, "global_step": 59832, "epoch": 356} {"train_loss": -8.523834228515625, "global_step": 59833, "epoch": 356} {"train_loss": -8.667470932006836, "global_step": 59834, "epoch": 356} {"train_loss": -8.849859237670898, "global_step": 59835, "epoch": 356} {"train_loss": -8.79269790649414, "global_step": 59836, "epoch": 356} {"train_loss": -8.710762977600098, "global_step": 59837, "epoch": 356} {"train_loss": -8.684510231018066, "global_step": 59838, "epoch": 356} {"train_loss": -8.676648139953613, "global_step": 59839, "epoch": 356} {"train_loss": -8.591470718383789, "global_step": 59840, "epoch": 356} {"train_loss": -8.444689750671387, "global_step": 59841, "epoch": 356} {"train_loss": -8.693090438842773, "global_step": 59842, "epoch": 356} {"train_loss": -8.92635440826416, "global_step": 59843, "epoch": 356} {"train_loss": -8.307397842407227, "global_step": 59844, "epoch": 356} {"train_loss": -8.712057113647461, "global_step": 59845, "epoch": 356} {"train_loss": -8.676692008972168, "global_step": 59846, "epoch": 356} {"train_loss": -8.611061096191406, "global_step": 59847, "epoch": 356} {"train_loss": -8.498382568359375, "global_step": 59848, "epoch": 356} {"train_loss": -8.839075088500977, "global_step": 59849, "epoch": 356} {"train_loss": -8.446843147277832, "global_step": 59850, "epoch": 356} {"train_loss": -8.929777145385742, "global_step": 59851, "epoch": 356} {"train_loss": -8.66780948638916, "global_step": 59852, "epoch": 356} {"train_loss": -8.237249374389648, "global_step": 59853, "epoch": 356} {"train_loss": -8.505878448486328, "global_step": 59854, "epoch": 356} {"train_loss": -8.433353424072266, "global_step": 59855, "epoch": 356} {"train_loss": -8.579401016235352, "global_step": 59856, "epoch": 356} {"train_loss": -8.4966459274292, "global_step": 59857, "epoch": 356} {"train_loss": -8.549873352050781, "global_step": 59858, "epoch": 356} {"train_loss": -8.31088638305664, "global_step": 59859, "epoch": 356} {"train_loss": -8.552837371826172, "global_step": 59860, "epoch": 356} {"train_loss": -8.720104217529297, "global_step": 59861, "epoch": 356} {"train_loss": -8.463664054870605, "global_step": 59862, "epoch": 356} {"train_loss": -8.6458740234375, "global_step": 59863, "epoch": 356} {"train_loss": -8.739893913269043, "global_step": 59864, "epoch": 356} {"train_loss": -8.600014686584473, "global_step": 59865, "epoch": 356} {"train_loss": -8.741009712219238, "global_step": 59866, "epoch": 356} {"train_loss": -8.50982666015625, "global_step": 59867, "epoch": 356} {"train_loss": -8.632431030273438, "global_step": 59868, "epoch": 356} {"train_loss": -8.471455574035645, "global_step": 59869, "epoch": 356} {"train_loss": -8.719881057739258, "global_step": 59870, "epoch": 356} {"train_loss": -8.724813461303711, "global_step": 59871, "epoch": 356} {"train_loss": -8.705991744995117, "global_step": 59872, "epoch": 356} {"train_loss": -8.864912033081055, "global_step": 59873, "epoch": 356} {"train_loss": -8.570003509521484, "global_step": 59874, "epoch": 356} {"train_loss": -8.288310050964355, "global_step": 59875, "epoch": 356} {"train_loss": -8.7854642868042, "global_step": 59876, "epoch": 356} {"train_loss": -8.498339653015137, "global_step": 59877, "epoch": 356} {"train_loss": -8.600152969360352, "global_step": 59878, "epoch": 356} {"train_loss": -8.5370512008667, "global_step": 59879, "epoch": 356} {"train_loss": -8.76690673828125, "global_step": 59880, "epoch": 356} {"train_loss": -8.570425987243652, "global_step": 59881, "epoch": 356} {"train_loss": -8.692360877990723, "global_step": 59882, "epoch": 356} {"train_loss": -8.62812328338623, "global_step": 59883, "epoch": 356} {"train_loss": -8.865521430969238, "global_step": 59884, "epoch": 356} {"train_loss": -8.848128318786621, "global_step": 59885, "epoch": 356} {"train_loss": -8.779622077941895, "global_step": 59886, "epoch": 356} {"train_loss": -8.735785484313965, "global_step": 59887, "epoch": 356} {"train_loss": -8.778142929077148, "global_step": 59888, "epoch": 356} {"train_loss": -8.36996078491211, "global_step": 59889, "epoch": 356} {"train_loss": -8.711164474487305, "global_step": 59890, "epoch": 356} {"train_loss": -8.804247856140137, "global_step": 59891, "epoch": 356} {"train_loss": -8.621519088745117, "global_step": 59892, "epoch": 356} {"train_loss": -8.699081420898438, "global_step": 59893, "epoch": 356} {"train_loss": -8.746431350708008, "global_step": 59894, "epoch": 356} {"train_loss": -8.619455337524414, "global_step": 59895, "epoch": 356} {"train_loss": -8.720077514648438, "global_step": 59896, "epoch": 356} {"train_loss": -8.85505199432373, "global_step": 59897, "epoch": 356} {"train_loss": -8.815885543823242, "global_step": 59898, "epoch": 356} {"train_loss": -8.759418487548828, "global_step": 59899, "epoch": 356} {"train_loss": -8.66792106628418, "global_step": 59900, "epoch": 356} {"train_loss": -9.088014602661133, "global_step": 59901, "epoch": 356} {"train_loss": -8.623448371887207, "global_step": 59902, "epoch": 356} {"train_loss": -8.93374252319336, "global_step": 59903, "epoch": 356} {"train_loss": -8.751998901367188, "global_step": 59904, "epoch": 356} {"train_loss": -8.395740509033203, "global_step": 59905, "epoch": 356} {"train_loss": -8.677190780639648, "global_step": 59906, "epoch": 356} {"train_loss": -8.776432037353516, "global_step": 59907, "epoch": 356} {"train_loss": -8.666980743408203, "global_step": 59908, "epoch": 356} {"train_loss": -8.667896270751953, "global_step": 59909, "epoch": 356} {"train_loss": -8.527591705322266, "global_step": 59910, "epoch": 356} {"train_loss": -8.525971412658691, "global_step": 59911, "epoch": 356} {"train_loss": -8.429712295532227, "global_step": 59912, "epoch": 356} {"train_loss": -8.72254467010498, "global_step": 59913, "epoch": 356} {"train_loss": -8.685657501220703, "global_step": 59914, "epoch": 356} {"train_loss": -8.594921112060547, "global_step": 59915, "epoch": 356} {"train_loss": -8.552669525146484, "global_step": 59916, "epoch": 356} {"train_loss": -8.581589698791504, "global_step": 59917, "epoch": 356} {"train_loss": -8.63742733001709, "global_step": 59918, "epoch": 356} {"train_loss": -8.854904174804688, "global_step": 59919, "epoch": 356} {"train_loss": -8.711508750915527, "global_step": 59920, "epoch": 356} {"train_loss": -8.818997383117676, "global_step": 59921, "epoch": 356} {"train_loss": -8.767980575561523, "global_step": 59922, "epoch": 356} {"train_loss": -8.712663650512695, "global_step": 59923, "epoch": 356} {"train_loss": -8.661260604858398, "global_step": 59924, "epoch": 356} {"train_loss": -8.601520538330078, "global_step": 59925, "epoch": 356} {"train_loss": -8.85749626159668, "global_step": 59926, "epoch": 356} {"train_loss": -8.674878120422363, "global_step": 59927, "epoch": 356} {"train_loss": -8.581416130065918, "global_step": 59928, "epoch": 356} {"train_loss": -8.64639663696289, "global_step": 59929, "epoch": 356} {"train_loss": -8.483038902282715, "global_step": 59930, "epoch": 356} {"train_loss": -8.561796188354492, "global_step": 59931, "epoch": 356} {"train_loss": -8.627140998840332, "global_step": 59932, "epoch": 356} {"train_loss": -8.789363861083984, "global_step": 59933, "epoch": 356} {"train_loss": -8.756158828735352, "global_step": 59934, "epoch": 356} {"train_loss": -8.658504486083984, "global_step": 59935, "epoch": 356} {"train_loss": -8.687807083129883, "global_step": 59936, "epoch": 356} {"train_loss": -8.524084091186523, "global_step": 59937, "epoch": 356} {"train_loss": -8.576257705688477, "global_step": 59938, "epoch": 356} {"train_loss": -8.746501922607422, "global_step": 59939, "epoch": 356} {"train_loss": -8.715743064880371, "global_step": 59940, "epoch": 356} {"train_loss": -8.177633285522461, "global_step": 59941, "epoch": 356} {"train_loss": -8.193795204162598, "global_step": 59942, "epoch": 356} {"train_loss": -8.29184341430664, "global_step": 59943, "epoch": 356} {"train_loss": -8.280588150024414, "global_step": 59944, "epoch": 356} {"train_loss": -8.361069679260254, "global_step": 59945, "epoch": 356} {"train_loss": -8.324434280395508, "global_step": 59946, "epoch": 356} {"train_loss": -8.463573455810547, "global_step": 59947, "epoch": 356} {"train_loss": -8.505319595336914, "global_step": 59948, "epoch": 356} {"train_loss": -8.53030014038086, "global_step": 59949, "epoch": 356} {"train_loss": -8.351848602294922, "global_step": 59950, "epoch": 356} {"train_loss": -8.380640983581543, "global_step": 59951, "epoch": 356} {"train_loss": -8.512224197387695, "global_step": 59952, "epoch": 356} {"train_loss": -8.722000122070312, "global_step": 59953, "epoch": 356} {"train_loss": -8.824825286865234, "global_step": 59954, "epoch": 356} {"train_loss": -8.642461776733398, "global_step": 59955, "epoch": 356} {"train_loss": -8.567075729370117, "global_step": 59956, "epoch": 356} {"train_loss": -8.657625198364258, "global_step": 59957, "epoch": 356} {"train_loss": -8.525758743286133, "global_step": 59958, "epoch": 356} {"train_loss": -8.722471237182617, "global_step": 59959, "epoch": 356} {"train_loss": -8.590232849121094, "global_step": 59960, "epoch": 356} {"train_loss": -8.724053382873535, "global_step": 59961, "epoch": 356} {"train_loss": -8.487550735473633, "global_step": 59962, "epoch": 356} {"train_loss": -8.751823425292969, "global_step": 59963, "epoch": 356} {"train_loss": -8.737167358398438, "global_step": 59964, "epoch": 356} {"train_loss": -8.532923698425293, "global_step": 59965, "epoch": 356} {"train_loss": -8.626530647277832, "global_step": 59966, "epoch": 356} {"train_loss": -8.685286521911621, "global_step": 59967, "epoch": 356} {"train_loss": -8.697744369506836, "global_step": 59968, "epoch": 356} {"train_loss": -8.710454940795898, "global_step": 59969, "epoch": 356} {"train_loss": -8.534006118774414, "global_step": 59970, "epoch": 356} {"train_loss": -8.701508522033691, "global_step": 59971, "epoch": 356} {"train_loss": -8.65029525756836, "global_step": 59972, "epoch": 356} {"train_loss": -8.617704391479492, "global_step": 59973, "epoch": 356} {"train_loss": -8.780728340148926, "global_step": 59974, "epoch": 356} {"train_loss": -8.629757063729423, "global_step": 59975, "epoch": 356, "val_loss": 190197.140625} {"train_loss": -8.838234901428223, "global_step": 59976, "epoch": 357} {"train_loss": -8.770832061767578, "global_step": 59977, "epoch": 357} {"train_loss": -8.552425384521484, "global_step": 59978, "epoch": 357} {"train_loss": -8.391698837280273, "global_step": 59979, "epoch": 357} {"train_loss": -8.457854270935059, "global_step": 59980, "epoch": 357} {"train_loss": -8.564380645751953, "global_step": 59981, "epoch": 357} {"train_loss": -8.372188568115234, "global_step": 59982, "epoch": 357} {"train_loss": -8.89326286315918, "global_step": 59983, "epoch": 357} {"train_loss": -8.619307518005371, "global_step": 59984, "epoch": 357} {"train_loss": -8.899417877197266, "global_step": 59985, "epoch": 357} {"train_loss": -8.61514663696289, "global_step": 59986, "epoch": 357} {"train_loss": -8.743705749511719, "global_step": 59987, "epoch": 357} {"train_loss": -8.443938255310059, "global_step": 59988, "epoch": 357} {"train_loss": -8.622204780578613, "global_step": 59989, "epoch": 357} {"train_loss": -8.604117393493652, "global_step": 59990, "epoch": 357} {"train_loss": -8.813838005065918, "global_step": 59991, "epoch": 357} {"train_loss": -8.629777908325195, "global_step": 59992, "epoch": 357} {"train_loss": -8.848274230957031, "global_step": 59993, "epoch": 357} {"train_loss": -8.66037368774414, "global_step": 59994, "epoch": 357} {"train_loss": -8.730253219604492, "global_step": 59995, "epoch": 357} {"train_loss": -8.486178398132324, "global_step": 59996, "epoch": 357} {"train_loss": -8.798731803894043, "global_step": 59997, "epoch": 357} {"train_loss": -8.749527931213379, "global_step": 59998, "epoch": 357} {"train_loss": -8.797080993652344, "global_step": 59999, "epoch": 357} {"train_loss": -8.789812088012695, "global_step": 60000, "epoch": 357} {"train_loss": -8.619843482971191, "global_step": 60001, "epoch": 357} {"train_loss": -8.765789985656738, "global_step": 60002, "epoch": 357} {"train_loss": -8.707789421081543, "global_step": 60003, "epoch": 357} {"train_loss": -8.784451484680176, "global_step": 60004, "epoch": 357} {"train_loss": -8.554536819458008, "global_step": 60005, "epoch": 357} {"train_loss": -8.742593765258789, "global_step": 60006, "epoch": 357} {"train_loss": -8.627685546875, "global_step": 60007, "epoch": 357} {"train_loss": -8.381988525390625, "global_step": 60008, "epoch": 357} {"train_loss": -8.424745559692383, "global_step": 60009, "epoch": 357} {"train_loss": -8.568300247192383, "global_step": 60010, "epoch": 357} {"train_loss": -8.589834213256836, "global_step": 60011, "epoch": 357} {"train_loss": -8.658761978149414, "global_step": 60012, "epoch": 357} {"train_loss": -8.750555038452148, "global_step": 60013, "epoch": 357} {"train_loss": -8.485400199890137, "global_step": 60014, "epoch": 357} {"train_loss": -8.626218795776367, "global_step": 60015, "epoch": 357} {"train_loss": -8.828176498413086, "global_step": 60016, "epoch": 357} {"train_loss": -8.334589004516602, "global_step": 60017, "epoch": 357} {"train_loss": -8.344122886657715, "global_step": 60018, "epoch": 357} {"train_loss": -8.709172248840332, "global_step": 60019, "epoch": 357} {"train_loss": -8.330900192260742, "global_step": 60020, "epoch": 357} {"train_loss": -8.627666473388672, "global_step": 60021, "epoch": 357} {"train_loss": -8.426284790039062, "global_step": 60022, "epoch": 357} {"train_loss": -8.793722152709961, "global_step": 60023, "epoch": 357} {"train_loss": -8.556065559387207, "global_step": 60024, "epoch": 357} {"train_loss": -8.682080268859863, "global_step": 60025, "epoch": 357} {"train_loss": -8.660792350769043, "global_step": 60026, "epoch": 357} {"train_loss": -8.570186614990234, "global_step": 60027, "epoch": 357} {"train_loss": -8.928436279296875, "global_step": 60028, "epoch": 357} {"train_loss": -8.578805923461914, "global_step": 60029, "epoch": 357} {"train_loss": -8.73651123046875, "global_step": 60030, "epoch": 357} {"train_loss": -8.810772895812988, "global_step": 60031, "epoch": 357} {"train_loss": -8.654111862182617, "global_step": 60032, "epoch": 357} {"train_loss": -8.76806354522705, "global_step": 60033, "epoch": 357} {"train_loss": -8.635557174682617, "global_step": 60034, "epoch": 357} {"train_loss": -8.58267593383789, "global_step": 60035, "epoch": 357} {"train_loss": -8.830299377441406, "global_step": 60036, "epoch": 357} {"train_loss": -8.474618911743164, "global_step": 60037, "epoch": 357} {"train_loss": -8.735177993774414, "global_step": 60038, "epoch": 357} {"train_loss": -8.703275680541992, "global_step": 60039, "epoch": 357} {"train_loss": -8.760497093200684, "global_step": 60040, "epoch": 357} {"train_loss": -8.861770629882812, "global_step": 60041, "epoch": 357} {"train_loss": -8.405449867248535, "global_step": 60042, "epoch": 357} {"train_loss": -8.637776374816895, "global_step": 60043, "epoch": 357} {"train_loss": -8.515473365783691, "global_step": 60044, "epoch": 357} {"train_loss": -8.72872257232666, "global_step": 60045, "epoch": 357} {"train_loss": -8.571945190429688, "global_step": 60046, "epoch": 357} {"train_loss": -8.526222229003906, "global_step": 60047, "epoch": 357} {"train_loss": -8.681941032409668, "global_step": 60048, "epoch": 357} {"train_loss": -8.408147811889648, "global_step": 60049, "epoch": 357} {"train_loss": -8.482471466064453, "global_step": 60050, "epoch": 357} {"train_loss": -8.675722122192383, "global_step": 60051, "epoch": 357} {"train_loss": -8.300413131713867, "global_step": 60052, "epoch": 357} {"train_loss": -8.702225685119629, "global_step": 60053, "epoch": 357} {"train_loss": -8.47778606414795, "global_step": 60054, "epoch": 357} {"train_loss": -8.744626998901367, "global_step": 60055, "epoch": 357} {"train_loss": -8.448674201965332, "global_step": 60056, "epoch": 357} {"train_loss": -8.818853378295898, "global_step": 60057, "epoch": 357} {"train_loss": -8.445879936218262, "global_step": 60058, "epoch": 357} {"train_loss": -8.531251907348633, "global_step": 60059, "epoch": 357} {"train_loss": -8.606733322143555, "global_step": 60060, "epoch": 357} {"train_loss": -8.43359375, "global_step": 60061, "epoch": 357} {"train_loss": -8.545211791992188, "global_step": 60062, "epoch": 357} {"train_loss": -8.726295471191406, "global_step": 60063, "epoch": 357} {"train_loss": -8.661600112915039, "global_step": 60064, "epoch": 357} {"train_loss": -8.44637680053711, "global_step": 60065, "epoch": 357} {"train_loss": -8.71780014038086, "global_step": 60066, "epoch": 357} {"train_loss": -8.559858322143555, "global_step": 60067, "epoch": 357} {"train_loss": -8.611810684204102, "global_step": 60068, "epoch": 357} {"train_loss": -8.830667495727539, "global_step": 60069, "epoch": 357} {"train_loss": -8.550690650939941, "global_step": 60070, "epoch": 357} {"train_loss": -8.634174346923828, "global_step": 60071, "epoch": 357} {"train_loss": -8.821060180664062, "global_step": 60072, "epoch": 357} {"train_loss": -9.016351699829102, "global_step": 60073, "epoch": 357} {"train_loss": -8.768022537231445, "global_step": 60074, "epoch": 357} {"train_loss": -8.888193130493164, "global_step": 60075, "epoch": 357} {"train_loss": -8.885892868041992, "global_step": 60076, "epoch": 357} {"train_loss": -8.765316009521484, "global_step": 60077, "epoch": 357} {"train_loss": -8.909830093383789, "global_step": 60078, "epoch": 357} {"train_loss": -8.865575790405273, "global_step": 60079, "epoch": 357} {"train_loss": -8.851140975952148, "global_step": 60080, "epoch": 357} {"train_loss": -8.991411209106445, "global_step": 60081, "epoch": 357} {"train_loss": -8.433029174804688, "global_step": 60082, "epoch": 357} {"train_loss": -8.837393760681152, "global_step": 60083, "epoch": 357} {"train_loss": -8.754793167114258, "global_step": 60084, "epoch": 357} {"train_loss": -8.598873138427734, "global_step": 60085, "epoch": 357} {"train_loss": -8.786416053771973, "global_step": 60086, "epoch": 357} {"train_loss": -8.698709487915039, "global_step": 60087, "epoch": 357} {"train_loss": -8.350122451782227, "global_step": 60088, "epoch": 357} {"train_loss": -8.68528938293457, "global_step": 60089, "epoch": 357} {"train_loss": -8.423971176147461, "global_step": 60090, "epoch": 357} {"train_loss": -8.377744674682617, "global_step": 60091, "epoch": 357} {"train_loss": -8.635063171386719, "global_step": 60092, "epoch": 357} {"train_loss": -8.605069160461426, "global_step": 60093, "epoch": 357} {"train_loss": -8.581480026245117, "global_step": 60094, "epoch": 357} {"train_loss": -8.481840133666992, "global_step": 60095, "epoch": 357} {"train_loss": -8.42782974243164, "global_step": 60096, "epoch": 357} {"train_loss": -8.410808563232422, "global_step": 60097, "epoch": 357} {"train_loss": -8.410770416259766, "global_step": 60098, "epoch": 357} {"train_loss": -8.437323570251465, "global_step": 60099, "epoch": 357} {"train_loss": -8.2908935546875, "global_step": 60100, "epoch": 357} {"train_loss": -8.692237854003906, "global_step": 60101, "epoch": 357} {"train_loss": -8.485902786254883, "global_step": 60102, "epoch": 357} {"train_loss": -8.60643482208252, "global_step": 60103, "epoch": 357} {"train_loss": -8.66592025756836, "global_step": 60104, "epoch": 357} {"train_loss": -8.629541397094727, "global_step": 60105, "epoch": 357} {"train_loss": -8.609628677368164, "global_step": 60106, "epoch": 357} {"train_loss": -8.530036926269531, "global_step": 60107, "epoch": 357} {"train_loss": -8.676023483276367, "global_step": 60108, "epoch": 357} {"train_loss": -8.642400741577148, "global_step": 60109, "epoch": 357} {"train_loss": -8.476741790771484, "global_step": 60110, "epoch": 357} {"train_loss": -8.675567626953125, "global_step": 60111, "epoch": 357} {"train_loss": -8.512717247009277, "global_step": 60112, "epoch": 357} {"train_loss": -8.700515747070312, "global_step": 60113, "epoch": 357} {"train_loss": -8.479867935180664, "global_step": 60114, "epoch": 357} {"train_loss": -8.781187057495117, "global_step": 60115, "epoch": 357} {"train_loss": -8.634954452514648, "global_step": 60116, "epoch": 357} {"train_loss": -8.661893844604492, "global_step": 60117, "epoch": 357} {"train_loss": -8.64995002746582, "global_step": 60118, "epoch": 357} {"train_loss": -8.675517082214355, "global_step": 60119, "epoch": 357} {"train_loss": -8.72622299194336, "global_step": 60120, "epoch": 357} {"train_loss": -8.467597961425781, "global_step": 60121, "epoch": 357} {"train_loss": -8.815756797790527, "global_step": 60122, "epoch": 357} {"train_loss": -8.624935150146484, "global_step": 60123, "epoch": 357} {"train_loss": -8.614065170288086, "global_step": 60124, "epoch": 357} {"train_loss": -8.828006744384766, "global_step": 60125, "epoch": 357} {"train_loss": -8.740779876708984, "global_step": 60126, "epoch": 357} {"train_loss": -8.605501174926758, "global_step": 60127, "epoch": 357} {"train_loss": -8.655033111572266, "global_step": 60128, "epoch": 357} {"train_loss": -8.454797744750977, "global_step": 60129, "epoch": 357} {"train_loss": -8.65113353729248, "global_step": 60130, "epoch": 357} {"train_loss": -8.802714347839355, "global_step": 60131, "epoch": 357} {"train_loss": -8.608545303344727, "global_step": 60132, "epoch": 357} {"train_loss": -8.518675804138184, "global_step": 60133, "epoch": 357} {"train_loss": -8.662948608398438, "global_step": 60134, "epoch": 357} {"train_loss": -8.536283493041992, "global_step": 60135, "epoch": 357} {"train_loss": -8.817326545715332, "global_step": 60136, "epoch": 357} {"train_loss": -8.707232475280762, "global_step": 60137, "epoch": 357} {"train_loss": -8.446826934814453, "global_step": 60138, "epoch": 357} {"train_loss": -8.79696273803711, "global_step": 60139, "epoch": 357} {"train_loss": -8.65294075012207, "global_step": 60140, "epoch": 357} {"train_loss": -8.641796112060547, "global_step": 60141, "epoch": 357} {"train_loss": -8.822306632995605, "global_step": 60142, "epoch": 357} {"train_loss": -8.63624844664619, "global_step": 60143, "epoch": 357, "val_loss": 190762.484375} {"train_loss": -8.5230712890625, "global_step": 60144, "epoch": 358} {"train_loss": -8.692621231079102, "global_step": 60145, "epoch": 358} {"train_loss": -8.847485542297363, "global_step": 60146, "epoch": 358} {"train_loss": -8.838353157043457, "global_step": 60147, "epoch": 358} {"train_loss": -8.77796459197998, "global_step": 60148, "epoch": 358} {"train_loss": -8.878841400146484, "global_step": 60149, "epoch": 358} {"train_loss": -8.701047897338867, "global_step": 60150, "epoch": 358} {"train_loss": -8.685741424560547, "global_step": 60151, "epoch": 358} {"train_loss": -8.383586883544922, "global_step": 60152, "epoch": 358} {"train_loss": -8.680971145629883, "global_step": 60153, "epoch": 358} {"train_loss": -8.590499877929688, "global_step": 60154, "epoch": 358} {"train_loss": -8.775472640991211, "global_step": 60155, "epoch": 358} {"train_loss": -8.576608657836914, "global_step": 60156, "epoch": 358} {"train_loss": -8.686307907104492, "global_step": 60157, "epoch": 358} {"train_loss": -8.5272216796875, "global_step": 60158, "epoch": 358} {"train_loss": -8.834819793701172, "global_step": 60159, "epoch": 358} {"train_loss": -8.6495361328125, "global_step": 60160, "epoch": 358} {"train_loss": -8.613840103149414, "global_step": 60161, "epoch": 358} {"train_loss": -8.585351943969727, "global_step": 60162, "epoch": 358} {"train_loss": -8.686622619628906, "global_step": 60163, "epoch": 358} {"train_loss": -8.51078987121582, "global_step": 60164, "epoch": 358} {"train_loss": -8.634551048278809, "global_step": 60165, "epoch": 358} {"train_loss": -8.771013259887695, "global_step": 60166, "epoch": 358} {"train_loss": -8.630846977233887, "global_step": 60167, "epoch": 358} {"train_loss": -8.510345458984375, "global_step": 60168, "epoch": 358} {"train_loss": -8.510406494140625, "global_step": 60169, "epoch": 358} {"train_loss": -8.490606307983398, "global_step": 60170, "epoch": 358} {"train_loss": -8.546894073486328, "global_step": 60171, "epoch": 358} {"train_loss": -8.64011001586914, "global_step": 60172, "epoch": 358} {"train_loss": -8.706501007080078, "global_step": 60173, "epoch": 358} {"train_loss": -8.5473051071167, "global_step": 60174, "epoch": 358} {"train_loss": -8.45667839050293, "global_step": 60175, "epoch": 358} {"train_loss": -8.577075958251953, "global_step": 60176, "epoch": 358} {"train_loss": -8.406709671020508, "global_step": 60177, "epoch": 358} {"train_loss": -8.462884902954102, "global_step": 60178, "epoch": 358} {"train_loss": -8.51972484588623, "global_step": 60179, "epoch": 358} {"train_loss": -8.496030807495117, "global_step": 60180, "epoch": 358} {"train_loss": -8.790752410888672, "global_step": 60181, "epoch": 358} {"train_loss": -8.678141593933105, "global_step": 60182, "epoch": 358} {"train_loss": -8.714619636535645, "global_step": 60183, "epoch": 358} {"train_loss": -8.75101375579834, "global_step": 60184, "epoch": 358} {"train_loss": -8.862834930419922, "global_step": 60185, "epoch": 358} {"train_loss": -8.321990966796875, "global_step": 60186, "epoch": 358} {"train_loss": -8.77219009399414, "global_step": 60187, "epoch": 358} {"train_loss": -8.606032371520996, "global_step": 60188, "epoch": 358} {"train_loss": -8.701666831970215, "global_step": 60189, "epoch": 358} {"train_loss": -8.9134521484375, "global_step": 60190, "epoch": 358} {"train_loss": -8.767473220825195, "global_step": 60191, "epoch": 358} {"train_loss": -8.673765182495117, "global_step": 60192, "epoch": 358} {"train_loss": -8.737738609313965, "global_step": 60193, "epoch": 358} {"train_loss": -8.671008110046387, "global_step": 60194, "epoch": 358} {"train_loss": -8.933727264404297, "global_step": 60195, "epoch": 358} {"train_loss": -8.688468933105469, "global_step": 60196, "epoch": 358} {"train_loss": -8.712398529052734, "global_step": 60197, "epoch": 358} {"train_loss": -8.579521179199219, "global_step": 60198, "epoch": 358} {"train_loss": -8.907607078552246, "global_step": 60199, "epoch": 358} {"train_loss": -8.749107360839844, "global_step": 60200, "epoch": 358} {"train_loss": -8.633983612060547, "global_step": 60201, "epoch": 358} {"train_loss": -8.72272777557373, "global_step": 60202, "epoch": 358} {"train_loss": -8.60581111907959, "global_step": 60203, "epoch": 358} {"train_loss": -8.485736846923828, "global_step": 60204, "epoch": 358} {"train_loss": -8.826475143432617, "global_step": 60205, "epoch": 358} {"train_loss": -8.692434310913086, "global_step": 60206, "epoch": 358} {"train_loss": -8.65185260772705, "global_step": 60207, "epoch": 358} {"train_loss": -8.743502616882324, "global_step": 60208, "epoch": 358} {"train_loss": -8.642892837524414, "global_step": 60209, "epoch": 358} {"train_loss": -8.684820175170898, "global_step": 60210, "epoch": 358} {"train_loss": -8.651252746582031, "global_step": 60211, "epoch": 358} {"train_loss": -8.61550521850586, "global_step": 60212, "epoch": 358} {"train_loss": -8.71845531463623, "global_step": 60213, "epoch": 358} {"train_loss": -8.77815055847168, "global_step": 60214, "epoch": 358} {"train_loss": -8.866373062133789, "global_step": 60215, "epoch": 358} {"train_loss": -8.471617698669434, "global_step": 60216, "epoch": 358} {"train_loss": -8.627228736877441, "global_step": 60217, "epoch": 358} {"train_loss": -8.875808715820312, "global_step": 60218, "epoch": 358} {"train_loss": -8.856868743896484, "global_step": 60219, "epoch": 358} {"train_loss": -8.948760032653809, "global_step": 60220, "epoch": 358} {"train_loss": -8.757192611694336, "global_step": 60221, "epoch": 358} {"train_loss": -8.744701385498047, "global_step": 60222, "epoch": 358} {"train_loss": -8.86552619934082, "global_step": 60223, "epoch": 358} {"train_loss": -8.732030868530273, "global_step": 60224, "epoch": 358} {"train_loss": -8.933517456054688, "global_step": 60225, "epoch": 358} {"train_loss": -8.868865966796875, "global_step": 60226, "epoch": 358} {"train_loss": -8.815667152404785, "global_step": 60227, "epoch": 358} {"train_loss": -8.80849552154541, "global_step": 60228, "epoch": 358} {"train_loss": -8.741247177124023, "global_step": 60229, "epoch": 358} {"train_loss": -8.738213539123535, "global_step": 60230, "epoch": 358} {"train_loss": -9.087241172790527, "global_step": 60231, "epoch": 358} {"train_loss": -8.725581169128418, "global_step": 60232, "epoch": 358} {"train_loss": -8.722101211547852, "global_step": 60233, "epoch": 358} {"train_loss": -8.74162769317627, "global_step": 60234, "epoch": 358} {"train_loss": -8.861457824707031, "global_step": 60235, "epoch": 358} {"train_loss": -8.96590805053711, "global_step": 60236, "epoch": 358} {"train_loss": -8.780282020568848, "global_step": 60237, "epoch": 358} {"train_loss": -8.640825271606445, "global_step": 60238, "epoch": 358} {"train_loss": -8.903861999511719, "global_step": 60239, "epoch": 358} {"train_loss": -8.633665084838867, "global_step": 60240, "epoch": 358} {"train_loss": -8.77427864074707, "global_step": 60241, "epoch": 358} {"train_loss": -8.214844703674316, "global_step": 60242, "epoch": 358} {"train_loss": -8.868518829345703, "global_step": 60243, "epoch": 358} {"train_loss": -8.467889785766602, "global_step": 60244, "epoch": 358} {"train_loss": -8.587238311767578, "global_step": 60245, "epoch": 358} {"train_loss": -8.838838577270508, "global_step": 60246, "epoch": 358} {"train_loss": -8.701894760131836, "global_step": 60247, "epoch": 358} {"train_loss": -8.481330871582031, "global_step": 60248, "epoch": 358} {"train_loss": -8.561527252197266, "global_step": 60249, "epoch": 358} {"train_loss": -8.297540664672852, "global_step": 60250, "epoch": 358} {"train_loss": -8.273550033569336, "global_step": 60251, "epoch": 358} {"train_loss": -8.783281326293945, "global_step": 60252, "epoch": 358} {"train_loss": -8.38415813446045, "global_step": 60253, "epoch": 358} {"train_loss": -8.522971153259277, "global_step": 60254, "epoch": 358} {"train_loss": -8.411349296569824, "global_step": 60255, "epoch": 358} {"train_loss": -8.461442947387695, "global_step": 60256, "epoch": 358} {"train_loss": -7.985533714294434, "global_step": 60257, "epoch": 358} {"train_loss": -8.542463302612305, "global_step": 60258, "epoch": 358} {"train_loss": -8.282979965209961, "global_step": 60259, "epoch": 358} {"train_loss": -8.19583797454834, "global_step": 60260, "epoch": 358} {"train_loss": -8.251144409179688, "global_step": 60261, "epoch": 358} {"train_loss": -8.139730453491211, "global_step": 60262, "epoch": 358} {"train_loss": -8.254347801208496, "global_step": 60263, "epoch": 358} {"train_loss": -8.324312210083008, "global_step": 60264, "epoch": 358} {"train_loss": -8.459293365478516, "global_step": 60265, "epoch": 358} {"train_loss": -8.449499130249023, "global_step": 60266, "epoch": 358} {"train_loss": -8.222466468811035, "global_step": 60267, "epoch": 358} {"train_loss": -8.410682678222656, "global_step": 60268, "epoch": 358} {"train_loss": -8.309249877929688, "global_step": 60269, "epoch": 358} {"train_loss": -8.425565719604492, "global_step": 60270, "epoch": 358} {"train_loss": -8.220640182495117, "global_step": 60271, "epoch": 358} {"train_loss": -8.345754623413086, "global_step": 60272, "epoch": 358} {"train_loss": -8.465703964233398, "global_step": 60273, "epoch": 358} {"train_loss": -8.433815002441406, "global_step": 60274, "epoch": 358} {"train_loss": -8.462081909179688, "global_step": 60275, "epoch": 358} {"train_loss": -8.634520530700684, "global_step": 60276, "epoch": 358} {"train_loss": -8.485430717468262, "global_step": 60277, "epoch": 358} {"train_loss": -8.801838874816895, "global_step": 60278, "epoch": 358} {"train_loss": -8.552797317504883, "global_step": 60279, "epoch": 358} {"train_loss": -8.729975700378418, "global_step": 60280, "epoch": 358} {"train_loss": -8.392135620117188, "global_step": 60281, "epoch": 358} {"train_loss": -8.682863235473633, "global_step": 60282, "epoch": 358} {"train_loss": -8.829158782958984, "global_step": 60283, "epoch": 358} {"train_loss": -8.781176567077637, "global_step": 60284, "epoch": 358} {"train_loss": -8.70045280456543, "global_step": 60285, "epoch": 358} {"train_loss": -8.555403709411621, "global_step": 60286, "epoch": 358} {"train_loss": -8.550167083740234, "global_step": 60287, "epoch": 358} {"train_loss": -8.653879165649414, "global_step": 60288, "epoch": 358} {"train_loss": -8.63199234008789, "global_step": 60289, "epoch": 358} {"train_loss": -8.518332481384277, "global_step": 60290, "epoch": 358} {"train_loss": -8.528877258300781, "global_step": 60291, "epoch": 358} {"train_loss": -8.667691230773926, "global_step": 60292, "epoch": 358} {"train_loss": -8.809752464294434, "global_step": 60293, "epoch": 358} {"train_loss": -8.509944915771484, "global_step": 60294, "epoch": 358} {"train_loss": -8.629937171936035, "global_step": 60295, "epoch": 358} {"train_loss": -8.855880737304688, "global_step": 60296, "epoch": 358} {"train_loss": -8.77884578704834, "global_step": 60297, "epoch": 358} {"train_loss": -8.739501953125, "global_step": 60298, "epoch": 358} {"train_loss": -8.912835121154785, "global_step": 60299, "epoch": 358} {"train_loss": -8.592500686645508, "global_step": 60300, "epoch": 358} {"train_loss": -8.752845764160156, "global_step": 60301, "epoch": 358} {"train_loss": -8.850441932678223, "global_step": 60302, "epoch": 358} {"train_loss": -8.569392204284668, "global_step": 60303, "epoch": 358} {"train_loss": -8.57486343383789, "global_step": 60304, "epoch": 358} {"train_loss": -8.79371166229248, "global_step": 60305, "epoch": 358} {"train_loss": -8.671252250671387, "global_step": 60306, "epoch": 358} {"train_loss": -8.883487701416016, "global_step": 60307, "epoch": 358} {"train_loss": -8.752471923828125, "global_step": 60308, "epoch": 358} {"train_loss": -8.78535270690918, "global_step": 60309, "epoch": 358} {"train_loss": -8.776313781738281, "global_step": 60310, "epoch": 358} {"train_loss": -8.635244386536735, "global_step": 60311, "epoch": 358, "val_loss": 191033.15625} {"train_loss": -8.979541778564453, "global_step": 60312, "epoch": 359} {"train_loss": -8.532488822937012, "global_step": 60313, "epoch": 359} {"train_loss": -8.715898513793945, "global_step": 60314, "epoch": 359} {"train_loss": -8.69604206085205, "global_step": 60315, "epoch": 359} {"train_loss": -8.668703079223633, "global_step": 60316, "epoch": 359} {"train_loss": -8.95997428894043, "global_step": 60317, "epoch": 359} {"train_loss": -8.528980255126953, "global_step": 60318, "epoch": 359} {"train_loss": -8.687067031860352, "global_step": 60319, "epoch": 359} {"train_loss": -8.537126541137695, "global_step": 60320, "epoch": 359} {"train_loss": -8.380196571350098, "global_step": 60321, "epoch": 359} {"train_loss": -8.37462043762207, "global_step": 60322, "epoch": 359} {"train_loss": -8.268045425415039, "global_step": 60323, "epoch": 359} {"train_loss": -8.238228797912598, "global_step": 60324, "epoch": 359} {"train_loss": -8.630293846130371, "global_step": 60325, "epoch": 359} {"train_loss": -8.284791946411133, "global_step": 60326, "epoch": 359} {"train_loss": -8.139078140258789, "global_step": 60327, "epoch": 359} {"train_loss": -8.344353675842285, "global_step": 60328, "epoch": 359} {"train_loss": -8.41817855834961, "global_step": 60329, "epoch": 359} {"train_loss": -8.125606536865234, "global_step": 60330, "epoch": 359} {"train_loss": -8.560859680175781, "global_step": 60331, "epoch": 359} {"train_loss": -8.66624641418457, "global_step": 60332, "epoch": 359} {"train_loss": -8.543657302856445, "global_step": 60333, "epoch": 359} {"train_loss": -8.671634674072266, "global_step": 60334, "epoch": 359} {"train_loss": -8.522212982177734, "global_step": 60335, "epoch": 359} {"train_loss": -8.468908309936523, "global_step": 60336, "epoch": 359} {"train_loss": -8.611477851867676, "global_step": 60337, "epoch": 359} {"train_loss": -8.554227828979492, "global_step": 60338, "epoch": 359} {"train_loss": -8.420431137084961, "global_step": 60339, "epoch": 359} {"train_loss": -8.59037971496582, "global_step": 60340, "epoch": 359} {"train_loss": -8.465760231018066, "global_step": 60341, "epoch": 359} {"train_loss": -8.803337097167969, "global_step": 60342, "epoch": 359} {"train_loss": -8.758903503417969, "global_step": 60343, "epoch": 359} {"train_loss": -8.750747680664062, "global_step": 60344, "epoch": 359} {"train_loss": -8.797815322875977, "global_step": 60345, "epoch": 359} {"train_loss": -8.714883804321289, "global_step": 60346, "epoch": 359} {"train_loss": -8.804729461669922, "global_step": 60347, "epoch": 359} {"train_loss": -8.958794593811035, "global_step": 60348, "epoch": 359} {"train_loss": -8.849824905395508, "global_step": 60349, "epoch": 359} {"train_loss": -8.541929244995117, "global_step": 60350, "epoch": 359} {"train_loss": -8.771227836608887, "global_step": 60351, "epoch": 359} {"train_loss": -8.770017623901367, "global_step": 60352, "epoch": 359} {"train_loss": -8.579309463500977, "global_step": 60353, "epoch": 359} {"train_loss": -8.693634033203125, "global_step": 60354, "epoch": 359} {"train_loss": -8.716377258300781, "global_step": 60355, "epoch": 359} {"train_loss": -8.828811645507812, "global_step": 60356, "epoch": 359} {"train_loss": -8.74128532409668, "global_step": 60357, "epoch": 359} {"train_loss": -8.654414176940918, "global_step": 60358, "epoch": 359} {"train_loss": -8.911741256713867, "global_step": 60359, "epoch": 359} {"train_loss": -8.645431518554688, "global_step": 60360, "epoch": 359} {"train_loss": -8.637479782104492, "global_step": 60361, "epoch": 359} {"train_loss": -8.73738956451416, "global_step": 60362, "epoch": 359} {"train_loss": -8.592453002929688, "global_step": 60363, "epoch": 359} {"train_loss": -8.881928443908691, "global_step": 60364, "epoch": 359} {"train_loss": -8.466744422912598, "global_step": 60365, "epoch": 359} {"train_loss": -8.24135971069336, "global_step": 60366, "epoch": 359} {"train_loss": -8.578977584838867, "global_step": 60367, "epoch": 359} {"train_loss": -8.70872688293457, "global_step": 60368, "epoch": 359} {"train_loss": -8.810675621032715, "global_step": 60369, "epoch": 359} {"train_loss": -8.674684524536133, "global_step": 60370, "epoch": 359} {"train_loss": -8.510332107543945, "global_step": 60371, "epoch": 359} {"train_loss": -8.518632888793945, "global_step": 60372, "epoch": 359} {"train_loss": -8.867147445678711, "global_step": 60373, "epoch": 359} {"train_loss": -8.744747161865234, "global_step": 60374, "epoch": 359} {"train_loss": -8.539048194885254, "global_step": 60375, "epoch": 359} {"train_loss": -8.570043563842773, "global_step": 60376, "epoch": 359} {"train_loss": -8.755249977111816, "global_step": 60377, "epoch": 359} {"train_loss": -8.75780963897705, "global_step": 60378, "epoch": 359} {"train_loss": -8.656044960021973, "global_step": 60379, "epoch": 359} {"train_loss": -8.68685531616211, "global_step": 60380, "epoch": 359} {"train_loss": -8.771269798278809, "global_step": 60381, "epoch": 359} {"train_loss": -8.591729164123535, "global_step": 60382, "epoch": 359} {"train_loss": -8.577442169189453, "global_step": 60383, "epoch": 359} {"train_loss": -8.656875610351562, "global_step": 60384, "epoch": 359} {"train_loss": -8.828228950500488, "global_step": 60385, "epoch": 359} {"train_loss": -8.61484146118164, "global_step": 60386, "epoch": 359} {"train_loss": -8.584867477416992, "global_step": 60387, "epoch": 359} {"train_loss": -8.536060333251953, "global_step": 60388, "epoch": 359} {"train_loss": -8.709967613220215, "global_step": 60389, "epoch": 359} {"train_loss": -8.917545318603516, "global_step": 60390, "epoch": 359} {"train_loss": -8.721882820129395, "global_step": 60391, "epoch": 359} {"train_loss": -8.94468879699707, "global_step": 60392, "epoch": 359} {"train_loss": -8.838668823242188, "global_step": 60393, "epoch": 359} {"train_loss": -8.830117225646973, "global_step": 60394, "epoch": 359} {"train_loss": -8.318180084228516, "global_step": 60395, "epoch": 359} {"train_loss": -8.889885902404785, "global_step": 60396, "epoch": 359} {"train_loss": -8.941651344299316, "global_step": 60397, "epoch": 359} {"train_loss": -8.511919021606445, "global_step": 60398, "epoch": 359} {"train_loss": -8.990825653076172, "global_step": 60399, "epoch": 359} {"train_loss": -8.612926483154297, "global_step": 60400, "epoch": 359} {"train_loss": -8.594205856323242, "global_step": 60401, "epoch": 359} {"train_loss": -8.69932746887207, "global_step": 60402, "epoch": 359} {"train_loss": -8.594954490661621, "global_step": 60403, "epoch": 359} {"train_loss": -8.78927993774414, "global_step": 60404, "epoch": 359} {"train_loss": -8.514949798583984, "global_step": 60405, "epoch": 359} {"train_loss": -8.733854293823242, "global_step": 60406, "epoch": 359} {"train_loss": -8.820850372314453, "global_step": 60407, "epoch": 359} {"train_loss": -8.857620239257812, "global_step": 60408, "epoch": 359} {"train_loss": -8.931744575500488, "global_step": 60409, "epoch": 359} {"train_loss": -8.90250015258789, "global_step": 60410, "epoch": 359} {"train_loss": -8.450728416442871, "global_step": 60411, "epoch": 359} {"train_loss": -8.782376289367676, "global_step": 60412, "epoch": 359} {"train_loss": -8.833406448364258, "global_step": 60413, "epoch": 359} {"train_loss": -8.713225364685059, "global_step": 60414, "epoch": 359} {"train_loss": -8.81033992767334, "global_step": 60415, "epoch": 359} {"train_loss": -8.496343612670898, "global_step": 60416, "epoch": 359} {"train_loss": -8.879429817199707, "global_step": 60417, "epoch": 359} {"train_loss": -8.580310821533203, "global_step": 60418, "epoch": 359} {"train_loss": -8.619704246520996, "global_step": 60419, "epoch": 359} {"train_loss": -8.447492599487305, "global_step": 60420, "epoch": 359} {"train_loss": -8.74557113647461, "global_step": 60421, "epoch": 359} {"train_loss": -8.671148300170898, "global_step": 60422, "epoch": 359} {"train_loss": -9.039933204650879, "global_step": 60423, "epoch": 359} {"train_loss": -8.65201187133789, "global_step": 60424, "epoch": 359} {"train_loss": -8.948802947998047, "global_step": 60425, "epoch": 359} {"train_loss": -8.514065742492676, "global_step": 60426, "epoch": 359} {"train_loss": -8.950151443481445, "global_step": 60427, "epoch": 359} {"train_loss": -8.683677673339844, "global_step": 60428, "epoch": 359} {"train_loss": -8.666074752807617, "global_step": 60429, "epoch": 359} {"train_loss": -8.640636444091797, "global_step": 60430, "epoch": 359} {"train_loss": -8.533950805664062, "global_step": 60431, "epoch": 359} {"train_loss": -8.910839080810547, "global_step": 60432, "epoch": 359} {"train_loss": -8.638131141662598, "global_step": 60433, "epoch": 359} {"train_loss": -8.666094779968262, "global_step": 60434, "epoch": 359} {"train_loss": -8.354658126831055, "global_step": 60435, "epoch": 359} {"train_loss": -8.360522270202637, "global_step": 60436, "epoch": 359} {"train_loss": -8.430456161499023, "global_step": 60437, "epoch": 359} {"train_loss": -8.65410327911377, "global_step": 60438, "epoch": 359} {"train_loss": -8.211589813232422, "global_step": 60439, "epoch": 359} {"train_loss": -8.570162773132324, "global_step": 60440, "epoch": 359} {"train_loss": -8.569622039794922, "global_step": 60441, "epoch": 359} {"train_loss": -8.443439483642578, "global_step": 60442, "epoch": 359} {"train_loss": -8.2847900390625, "global_step": 60443, "epoch": 359} {"train_loss": -8.580068588256836, "global_step": 60444, "epoch": 359} {"train_loss": -8.353470802307129, "global_step": 60445, "epoch": 359} {"train_loss": -8.117424011230469, "global_step": 60446, "epoch": 359} {"train_loss": -8.228537559509277, "global_step": 60447, "epoch": 359} {"train_loss": -8.291015625, "global_step": 60448, "epoch": 359} {"train_loss": -8.324607849121094, "global_step": 60449, "epoch": 359} {"train_loss": -8.330436706542969, "global_step": 60450, "epoch": 359} {"train_loss": -8.350676536560059, "global_step": 60451, "epoch": 359} {"train_loss": -8.395998001098633, "global_step": 60452, "epoch": 359} {"train_loss": -8.623295783996582, "global_step": 60453, "epoch": 359} {"train_loss": -8.712713241577148, "global_step": 60454, "epoch": 359} {"train_loss": -8.396787643432617, "global_step": 60455, "epoch": 359} {"train_loss": -8.56921672821045, "global_step": 60456, "epoch": 359} {"train_loss": -8.423855781555176, "global_step": 60457, "epoch": 359} {"train_loss": -8.575460433959961, "global_step": 60458, "epoch": 359} {"train_loss": -8.513668060302734, "global_step": 60459, "epoch": 359} {"train_loss": -8.731972694396973, "global_step": 60460, "epoch": 359} {"train_loss": -8.487783432006836, "global_step": 60461, "epoch": 359} {"train_loss": -8.585575103759766, "global_step": 60462, "epoch": 359} {"train_loss": -8.645726203918457, "global_step": 60463, "epoch": 359} {"train_loss": -8.815885543823242, "global_step": 60464, "epoch": 359} {"train_loss": -8.621861457824707, "global_step": 60465, "epoch": 359} {"train_loss": -8.489465713500977, "global_step": 60466, "epoch": 359} {"train_loss": -8.741816520690918, "global_step": 60467, "epoch": 359} {"train_loss": -8.548513412475586, "global_step": 60468, "epoch": 359} {"train_loss": -8.66963005065918, "global_step": 60469, "epoch": 359} {"train_loss": -8.634754180908203, "global_step": 60470, "epoch": 359} {"train_loss": -8.430279731750488, "global_step": 60471, "epoch": 359} {"train_loss": -8.672005653381348, "global_step": 60472, "epoch": 359} {"train_loss": -8.75464916229248, "global_step": 60473, "epoch": 359} {"train_loss": -8.654304504394531, "global_step": 60474, "epoch": 359} {"train_loss": -8.766233444213867, "global_step": 60475, "epoch": 359} {"train_loss": -8.623321533203125, "global_step": 60476, "epoch": 359} {"train_loss": -8.740755081176758, "global_step": 60477, "epoch": 359} {"train_loss": -8.857205390930176, "global_step": 60478, "epoch": 359} {"train_loss": -8.628524155843825, "global_step": 60479, "epoch": 359, "val_loss": 188197.453125} {"train_loss": -8.64854907989502, "global_step": 60480, "epoch": 360} {"train_loss": -8.779745101928711, "global_step": 60481, "epoch": 360} {"train_loss": -8.772720336914062, "global_step": 60482, "epoch": 360} {"train_loss": -8.711652755737305, "global_step": 60483, "epoch": 360} {"train_loss": -8.789466857910156, "global_step": 60484, "epoch": 360} {"train_loss": -8.698601722717285, "global_step": 60485, "epoch": 360} {"train_loss": -8.59623908996582, "global_step": 60486, "epoch": 360} {"train_loss": -8.713645935058594, "global_step": 60487, "epoch": 360} {"train_loss": -8.691892623901367, "global_step": 60488, "epoch": 360} {"train_loss": -8.734996795654297, "global_step": 60489, "epoch": 360} {"train_loss": -8.747882843017578, "global_step": 60490, "epoch": 360} {"train_loss": -8.689680099487305, "global_step": 60491, "epoch": 360} {"train_loss": -8.824583053588867, "global_step": 60492, "epoch": 360} {"train_loss": -8.504056930541992, "global_step": 60493, "epoch": 360} {"train_loss": -8.519514083862305, "global_step": 60494, "epoch": 360} {"train_loss": -8.78420639038086, "global_step": 60495, "epoch": 360} {"train_loss": -8.837970733642578, "global_step": 60496, "epoch": 360} {"train_loss": -8.82433795928955, "global_step": 60497, "epoch": 360} {"train_loss": -8.578264236450195, "global_step": 60498, "epoch": 360} {"train_loss": -8.737384796142578, "global_step": 60499, "epoch": 360} {"train_loss": -8.943262100219727, "global_step": 60500, "epoch": 360} {"train_loss": -8.553963661193848, "global_step": 60501, "epoch": 360} {"train_loss": -8.664443969726562, "global_step": 60502, "epoch": 360} {"train_loss": -8.678478240966797, "global_step": 60503, "epoch": 360} {"train_loss": -8.67599105834961, "global_step": 60504, "epoch": 360} {"train_loss": -8.694112777709961, "global_step": 60505, "epoch": 360} {"train_loss": -8.718405723571777, "global_step": 60506, "epoch": 360} {"train_loss": -8.615047454833984, "global_step": 60507, "epoch": 360} {"train_loss": -8.438039779663086, "global_step": 60508, "epoch": 360} {"train_loss": -8.538084030151367, "global_step": 60509, "epoch": 360} {"train_loss": -8.586344718933105, "global_step": 60510, "epoch": 360} {"train_loss": -8.670060157775879, "global_step": 60511, "epoch": 360} {"train_loss": -8.596014976501465, "global_step": 60512, "epoch": 360} {"train_loss": -8.58110237121582, "global_step": 60513, "epoch": 360} {"train_loss": -8.585333824157715, "global_step": 60514, "epoch": 360} {"train_loss": -8.527469635009766, "global_step": 60515, "epoch": 360} {"train_loss": -8.499944686889648, "global_step": 60516, "epoch": 360} {"train_loss": -8.53624153137207, "global_step": 60517, "epoch": 360} {"train_loss": -8.318901062011719, "global_step": 60518, "epoch": 360} {"train_loss": -8.741067886352539, "global_step": 60519, "epoch": 360} {"train_loss": -8.589527130126953, "global_step": 60520, "epoch": 360} {"train_loss": -8.704267501831055, "global_step": 60521, "epoch": 360} {"train_loss": -8.637508392333984, "global_step": 60522, "epoch": 360} {"train_loss": -8.603490829467773, "global_step": 60523, "epoch": 360} {"train_loss": -8.47004508972168, "global_step": 60524, "epoch": 360} {"train_loss": -8.713821411132812, "global_step": 60525, "epoch": 360} {"train_loss": -8.51968765258789, "global_step": 60526, "epoch": 360} {"train_loss": -8.534183502197266, "global_step": 60527, "epoch": 360} {"train_loss": -8.883773803710938, "global_step": 60528, "epoch": 360} {"train_loss": -8.673227310180664, "global_step": 60529, "epoch": 360} {"train_loss": -8.793769836425781, "global_step": 60530, "epoch": 360} {"train_loss": -8.827010154724121, "global_step": 60531, "epoch": 360} {"train_loss": -8.862287521362305, "global_step": 60532, "epoch": 360} {"train_loss": -8.681417465209961, "global_step": 60533, "epoch": 360} {"train_loss": -8.584227561950684, "global_step": 60534, "epoch": 360} {"train_loss": -8.6677885055542, "global_step": 60535, "epoch": 360} {"train_loss": -8.858184814453125, "global_step": 60536, "epoch": 360} {"train_loss": -8.626312255859375, "global_step": 60537, "epoch": 360} {"train_loss": -8.68190860748291, "global_step": 60538, "epoch": 360} {"train_loss": -8.891026496887207, "global_step": 60539, "epoch": 360} {"train_loss": -8.701075553894043, "global_step": 60540, "epoch": 360} {"train_loss": -8.612700462341309, "global_step": 60541, "epoch": 360} {"train_loss": -8.756017684936523, "global_step": 60542, "epoch": 360} {"train_loss": -8.874056816101074, "global_step": 60543, "epoch": 360} {"train_loss": -8.851520538330078, "global_step": 60544, "epoch": 360} {"train_loss": -9.006586074829102, "global_step": 60545, "epoch": 360} {"train_loss": -8.967913627624512, "global_step": 60546, "epoch": 360} {"train_loss": -8.770659446716309, "global_step": 60547, "epoch": 360} {"train_loss": -8.84772777557373, "global_step": 60548, "epoch": 360} {"train_loss": -8.481241226196289, "global_step": 60549, "epoch": 360} {"train_loss": -8.205436706542969, "global_step": 60550, "epoch": 360} {"train_loss": -8.317503929138184, "global_step": 60551, "epoch": 360} {"train_loss": -7.790346145629883, "global_step": 60552, "epoch": 360} {"train_loss": -8.509864807128906, "global_step": 60553, "epoch": 360} {"train_loss": -8.07972526550293, "global_step": 60554, "epoch": 360} {"train_loss": -8.294208526611328, "global_step": 60555, "epoch": 360} {"train_loss": -8.414011001586914, "global_step": 60556, "epoch": 360} {"train_loss": -8.113252639770508, "global_step": 60557, "epoch": 360} {"train_loss": -8.107076644897461, "global_step": 60558, "epoch": 360} {"train_loss": -8.237092971801758, "global_step": 60559, "epoch": 360} {"train_loss": -8.347505569458008, "global_step": 60560, "epoch": 360} {"train_loss": -8.239432334899902, "global_step": 60561, "epoch": 360} {"train_loss": -8.185949325561523, "global_step": 60562, "epoch": 360} {"train_loss": -8.340221405029297, "global_step": 60563, "epoch": 360} {"train_loss": -8.341545104980469, "global_step": 60564, "epoch": 360} {"train_loss": -8.444311141967773, "global_step": 60565, "epoch": 360} {"train_loss": -8.36406135559082, "global_step": 60566, "epoch": 360} {"train_loss": -8.300562858581543, "global_step": 60567, "epoch": 360} {"train_loss": -8.368973731994629, "global_step": 60568, "epoch": 360} {"train_loss": -8.336565971374512, "global_step": 60569, "epoch": 360} {"train_loss": -8.315692901611328, "global_step": 60570, "epoch": 360} {"train_loss": -8.299203872680664, "global_step": 60571, "epoch": 360} {"train_loss": -8.375799179077148, "global_step": 60572, "epoch": 360} {"train_loss": -8.508968353271484, "global_step": 60573, "epoch": 360} {"train_loss": -8.336629867553711, "global_step": 60574, "epoch": 360} {"train_loss": -8.499242782592773, "global_step": 60575, "epoch": 360} {"train_loss": -8.53410816192627, "global_step": 60576, "epoch": 360} {"train_loss": -8.651506423950195, "global_step": 60577, "epoch": 360} {"train_loss": -8.750653266906738, "global_step": 60578, "epoch": 360} {"train_loss": -8.625940322875977, "global_step": 60579, "epoch": 360} {"train_loss": -8.545862197875977, "global_step": 60580, "epoch": 360} {"train_loss": -8.735712051391602, "global_step": 60581, "epoch": 360} {"train_loss": -8.597623825073242, "global_step": 60582, "epoch": 360} {"train_loss": -8.625633239746094, "global_step": 60583, "epoch": 360} {"train_loss": -8.714760780334473, "global_step": 60584, "epoch": 360} {"train_loss": -8.739896774291992, "global_step": 60585, "epoch": 360} {"train_loss": -8.769198417663574, "global_step": 60586, "epoch": 360} {"train_loss": -8.665255546569824, "global_step": 60587, "epoch": 360} {"train_loss": -8.538238525390625, "global_step": 60588, "epoch": 360} {"train_loss": -8.557869911193848, "global_step": 60589, "epoch": 360} {"train_loss": -8.80984878540039, "global_step": 60590, "epoch": 360} {"train_loss": -8.682199478149414, "global_step": 60591, "epoch": 360} {"train_loss": -8.753396034240723, "global_step": 60592, "epoch": 360} {"train_loss": -8.789483070373535, "global_step": 60593, "epoch": 360} {"train_loss": -8.829408645629883, "global_step": 60594, "epoch": 360} {"train_loss": -8.816718101501465, "global_step": 60595, "epoch": 360} {"train_loss": -8.752957344055176, "global_step": 60596, "epoch": 360} {"train_loss": -8.450559616088867, "global_step": 60597, "epoch": 360} {"train_loss": -8.605228424072266, "global_step": 60598, "epoch": 360} {"train_loss": -8.448345184326172, "global_step": 60599, "epoch": 360} {"train_loss": -8.74945068359375, "global_step": 60600, "epoch": 360} {"train_loss": -8.50236701965332, "global_step": 60601, "epoch": 360} {"train_loss": -8.726408958435059, "global_step": 60602, "epoch": 360} {"train_loss": -8.55488395690918, "global_step": 60603, "epoch": 360} {"train_loss": -8.483107566833496, "global_step": 60604, "epoch": 360} {"train_loss": -8.55981159210205, "global_step": 60605, "epoch": 360} {"train_loss": -8.599288940429688, "global_step": 60606, "epoch": 360} {"train_loss": -8.505072593688965, "global_step": 60607, "epoch": 360} {"train_loss": -8.684993743896484, "global_step": 60608, "epoch": 360} {"train_loss": -8.398148536682129, "global_step": 60609, "epoch": 360} {"train_loss": -8.549816131591797, "global_step": 60610, "epoch": 360} {"train_loss": -8.44268798828125, "global_step": 60611, "epoch": 360} {"train_loss": -8.550722122192383, "global_step": 60612, "epoch": 360} {"train_loss": -8.47268009185791, "global_step": 60613, "epoch": 360} {"train_loss": -8.66606616973877, "global_step": 60614, "epoch": 360} {"train_loss": -8.645467758178711, "global_step": 60615, "epoch": 360} {"train_loss": -8.514245986938477, "global_step": 60616, "epoch": 360} {"train_loss": -8.577571868896484, "global_step": 60617, "epoch": 360} {"train_loss": -8.503682136535645, "global_step": 60618, "epoch": 360} {"train_loss": -8.620306015014648, "global_step": 60619, "epoch": 360} {"train_loss": -8.937450408935547, "global_step": 60620, "epoch": 360} {"train_loss": -8.684541702270508, "global_step": 60621, "epoch": 360} {"train_loss": -8.823604583740234, "global_step": 60622, "epoch": 360} {"train_loss": -8.648223876953125, "global_step": 60623, "epoch": 360} {"train_loss": -8.796488761901855, "global_step": 60624, "epoch": 360} {"train_loss": -8.5554780960083, "global_step": 60625, "epoch": 360} {"train_loss": -8.465774536132812, "global_step": 60626, "epoch": 360} {"train_loss": -8.559558868408203, "global_step": 60627, "epoch": 360} {"train_loss": -8.69067096710205, "global_step": 60628, "epoch": 360} {"train_loss": -8.6477632522583, "global_step": 60629, "epoch": 360} {"train_loss": -8.577144622802734, "global_step": 60630, "epoch": 360} {"train_loss": -8.686469078063965, "global_step": 60631, "epoch": 360} {"train_loss": -8.575902938842773, "global_step": 60632, "epoch": 360} {"train_loss": -8.581562995910645, "global_step": 60633, "epoch": 360} {"train_loss": -8.636364936828613, "global_step": 60634, "epoch": 360} {"train_loss": -8.735435485839844, "global_step": 60635, "epoch": 360} {"train_loss": -8.379554748535156, "global_step": 60636, "epoch": 360} {"train_loss": -8.820650100708008, "global_step": 60637, "epoch": 360} {"train_loss": -8.57821273803711, "global_step": 60638, "epoch": 360} {"train_loss": -8.869884490966797, "global_step": 60639, "epoch": 360} {"train_loss": -8.699600219726562, "global_step": 60640, "epoch": 360} {"train_loss": -8.743671417236328, "global_step": 60641, "epoch": 360} {"train_loss": -8.6429443359375, "global_step": 60642, "epoch": 360} {"train_loss": -8.84933090209961, "global_step": 60643, "epoch": 360} {"train_loss": -8.85942554473877, "global_step": 60644, "epoch": 360} {"train_loss": -8.744359970092773, "global_step": 60645, "epoch": 360} {"train_loss": -8.725135803222656, "global_step": 60646, "epoch": 360} {"train_loss": -8.609499664533706, "global_step": 60647, "epoch": 360, "val_loss": 190794.828125, "train_action_mse_error": 13.290761947631836} {"train_loss": -8.699783325195312, "global_step": 60648, "epoch": 361} {"train_loss": -8.896734237670898, "global_step": 60649, "epoch": 361} {"train_loss": -8.787042617797852, "global_step": 60650, "epoch": 361} {"train_loss": -8.34156608581543, "global_step": 60651, "epoch": 361} {"train_loss": -8.846546173095703, "global_step": 60652, "epoch": 361} {"train_loss": -8.748698234558105, "global_step": 60653, "epoch": 361} {"train_loss": -8.66754150390625, "global_step": 60654, "epoch": 361} {"train_loss": -8.713714599609375, "global_step": 60655, "epoch": 361} {"train_loss": -8.930379867553711, "global_step": 60656, "epoch": 361} {"train_loss": -8.548627853393555, "global_step": 60657, "epoch": 361} {"train_loss": -8.814342498779297, "global_step": 60658, "epoch": 361} {"train_loss": -8.094510078430176, "global_step": 60659, "epoch": 361} {"train_loss": -8.557089805603027, "global_step": 60660, "epoch": 361} {"train_loss": -8.169761657714844, "global_step": 60661, "epoch": 361} {"train_loss": -8.313413619995117, "global_step": 60662, "epoch": 361} {"train_loss": -8.141679763793945, "global_step": 60663, "epoch": 361} {"train_loss": -8.522804260253906, "global_step": 60664, "epoch": 361} {"train_loss": -8.30766773223877, "global_step": 60665, "epoch": 361} {"train_loss": -8.442177772521973, "global_step": 60666, "epoch": 361} {"train_loss": -8.41125774383545, "global_step": 60667, "epoch": 361} {"train_loss": -8.449610710144043, "global_step": 60668, "epoch": 361} {"train_loss": -8.62851333618164, "global_step": 60669, "epoch": 361} {"train_loss": -8.516300201416016, "global_step": 60670, "epoch": 361} {"train_loss": -8.533564567565918, "global_step": 60671, "epoch": 361} {"train_loss": -8.472049713134766, "global_step": 60672, "epoch": 361} {"train_loss": -8.699535369873047, "global_step": 60673, "epoch": 361} {"train_loss": -8.493963241577148, "global_step": 60674, "epoch": 361} {"train_loss": -8.734106063842773, "global_step": 60675, "epoch": 361} {"train_loss": -8.884500503540039, "global_step": 60676, "epoch": 361} {"train_loss": -8.803552627563477, "global_step": 60677, "epoch": 361} {"train_loss": -8.785894393920898, "global_step": 60678, "epoch": 361} {"train_loss": -8.599599838256836, "global_step": 60679, "epoch": 361} {"train_loss": -8.548288345336914, "global_step": 60680, "epoch": 361} {"train_loss": -8.654382705688477, "global_step": 60681, "epoch": 361} {"train_loss": -8.72114372253418, "global_step": 60682, "epoch": 361} {"train_loss": -8.61823558807373, "global_step": 60683, "epoch": 361} {"train_loss": -8.653690338134766, "global_step": 60684, "epoch": 361} {"train_loss": -8.693537712097168, "global_step": 60685, "epoch": 361} {"train_loss": -8.53184700012207, "global_step": 60686, "epoch": 361} {"train_loss": -8.766758918762207, "global_step": 60687, "epoch": 361} {"train_loss": -8.550292015075684, "global_step": 60688, "epoch": 361} {"train_loss": -8.617949485778809, "global_step": 60689, "epoch": 361} {"train_loss": -8.649803161621094, "global_step": 60690, "epoch": 361} {"train_loss": -8.615341186523438, "global_step": 60691, "epoch": 361} {"train_loss": -8.692123413085938, "global_step": 60692, "epoch": 361} {"train_loss": -8.738911628723145, "global_step": 60693, "epoch": 361} {"train_loss": -8.575460433959961, "global_step": 60694, "epoch": 361} {"train_loss": -8.746469497680664, "global_step": 60695, "epoch": 361} {"train_loss": -8.821596145629883, "global_step": 60696, "epoch": 361} {"train_loss": -8.854658126831055, "global_step": 60697, "epoch": 361} {"train_loss": -8.85152530670166, "global_step": 60698, "epoch": 361} {"train_loss": -8.78419017791748, "global_step": 60699, "epoch": 361} {"train_loss": -8.609159469604492, "global_step": 60700, "epoch": 361} {"train_loss": -8.741734504699707, "global_step": 60701, "epoch": 361} {"train_loss": -8.92767333984375, "global_step": 60702, "epoch": 361} {"train_loss": -8.825183868408203, "global_step": 60703, "epoch": 361} {"train_loss": -8.767644882202148, "global_step": 60704, "epoch": 361} {"train_loss": -8.722843170166016, "global_step": 60705, "epoch": 361} {"train_loss": -8.68049144744873, "global_step": 60706, "epoch": 361} {"train_loss": -8.78615951538086, "global_step": 60707, "epoch": 361} {"train_loss": -8.503082275390625, "global_step": 60708, "epoch": 361} {"train_loss": -8.559883117675781, "global_step": 60709, "epoch": 361} {"train_loss": -8.82689094543457, "global_step": 60710, "epoch": 361} {"train_loss": -8.746788024902344, "global_step": 60711, "epoch": 361} {"train_loss": -8.936655044555664, "global_step": 60712, "epoch": 361} {"train_loss": -8.718133926391602, "global_step": 60713, "epoch": 361} {"train_loss": -8.270059585571289, "global_step": 60714, "epoch": 361} {"train_loss": -8.525362014770508, "global_step": 60715, "epoch": 361} {"train_loss": -8.528778076171875, "global_step": 60716, "epoch": 361} {"train_loss": -8.753644943237305, "global_step": 60717, "epoch": 361} {"train_loss": -8.827362060546875, "global_step": 60718, "epoch": 361} {"train_loss": -8.78057861328125, "global_step": 60719, "epoch": 361} {"train_loss": -8.640745162963867, "global_step": 60720, "epoch": 361} {"train_loss": -8.861989974975586, "global_step": 60721, "epoch": 361} {"train_loss": -8.67448902130127, "global_step": 60722, "epoch": 361} {"train_loss": -8.27316665649414, "global_step": 60723, "epoch": 361} {"train_loss": -8.46088695526123, "global_step": 60724, "epoch": 361} {"train_loss": -8.375454902648926, "global_step": 60725, "epoch": 361} {"train_loss": -8.680335998535156, "global_step": 60726, "epoch": 361} {"train_loss": -8.558395385742188, "global_step": 60727, "epoch": 361} {"train_loss": -8.603483200073242, "global_step": 60728, "epoch": 361} {"train_loss": -8.494138717651367, "global_step": 60729, "epoch": 361} {"train_loss": -8.244782447814941, "global_step": 60730, "epoch": 361} {"train_loss": -8.556408882141113, "global_step": 60731, "epoch": 361} {"train_loss": -8.445625305175781, "global_step": 60732, "epoch": 361} {"train_loss": -8.421823501586914, "global_step": 60733, "epoch": 361} {"train_loss": -8.609708786010742, "global_step": 60734, "epoch": 361} {"train_loss": -8.332208633422852, "global_step": 60735, "epoch": 361} {"train_loss": -8.342668533325195, "global_step": 60736, "epoch": 361} {"train_loss": -8.667908668518066, "global_step": 60737, "epoch": 361} {"train_loss": -8.743824005126953, "global_step": 60738, "epoch": 361} {"train_loss": -8.587454795837402, "global_step": 60739, "epoch": 361} {"train_loss": -8.558246612548828, "global_step": 60740, "epoch": 361} {"train_loss": -8.642353057861328, "global_step": 60741, "epoch": 361} {"train_loss": -8.440408706665039, "global_step": 60742, "epoch": 361} {"train_loss": -8.43571662902832, "global_step": 60743, "epoch": 361} {"train_loss": -8.463701248168945, "global_step": 60744, "epoch": 361} {"train_loss": -8.475811004638672, "global_step": 60745, "epoch": 361} {"train_loss": -8.349587440490723, "global_step": 60746, "epoch": 361} {"train_loss": -8.553630828857422, "global_step": 60747, "epoch": 361} {"train_loss": -8.53773307800293, "global_step": 60748, "epoch": 361} {"train_loss": -8.260429382324219, "global_step": 60749, "epoch": 361} {"train_loss": -8.61894416809082, "global_step": 60750, "epoch": 361} {"train_loss": -8.592105865478516, "global_step": 60751, "epoch": 361} {"train_loss": -8.847007751464844, "global_step": 60752, "epoch": 361} {"train_loss": -8.517467498779297, "global_step": 60753, "epoch": 361} {"train_loss": -8.773401260375977, "global_step": 60754, "epoch": 361} {"train_loss": -8.46864128112793, "global_step": 60755, "epoch": 361} {"train_loss": -8.744976997375488, "global_step": 60756, "epoch": 361} {"train_loss": -8.409549713134766, "global_step": 60757, "epoch": 361} {"train_loss": -8.94554328918457, "global_step": 60758, "epoch": 361} {"train_loss": -8.639787673950195, "global_step": 60759, "epoch": 361} {"train_loss": -8.514498710632324, "global_step": 60760, "epoch": 361} {"train_loss": -8.360305786132812, "global_step": 60761, "epoch": 361} {"train_loss": -8.436735153198242, "global_step": 60762, "epoch": 361} {"train_loss": -8.41468334197998, "global_step": 60763, "epoch": 361} {"train_loss": -8.608731269836426, "global_step": 60764, "epoch": 361} {"train_loss": -8.767487525939941, "global_step": 60765, "epoch": 361} {"train_loss": -8.466924667358398, "global_step": 60766, "epoch": 361} {"train_loss": -8.56988525390625, "global_step": 60767, "epoch": 361} {"train_loss": -8.417610168457031, "global_step": 60768, "epoch": 361} {"train_loss": -8.685131072998047, "global_step": 60769, "epoch": 361} {"train_loss": -8.569890975952148, "global_step": 60770, "epoch": 361} {"train_loss": -8.699596405029297, "global_step": 60771, "epoch": 361} {"train_loss": -8.56562614440918, "global_step": 60772, "epoch": 361} {"train_loss": -8.679765701293945, "global_step": 60773, "epoch": 361} {"train_loss": -8.583005905151367, "global_step": 60774, "epoch": 361} {"train_loss": -8.467950820922852, "global_step": 60775, "epoch": 361} {"train_loss": -8.799234390258789, "global_step": 60776, "epoch": 361} {"train_loss": -8.54165267944336, "global_step": 60777, "epoch": 361} {"train_loss": -8.822379112243652, "global_step": 60778, "epoch": 361} {"train_loss": -8.726227760314941, "global_step": 60779, "epoch": 361} {"train_loss": -8.68898868560791, "global_step": 60780, "epoch": 361} {"train_loss": -8.570441246032715, "global_step": 60781, "epoch": 361} {"train_loss": -8.506275177001953, "global_step": 60782, "epoch": 361} {"train_loss": -8.505931854248047, "global_step": 60783, "epoch": 361} {"train_loss": -8.499076843261719, "global_step": 60784, "epoch": 361} {"train_loss": -8.32113265991211, "global_step": 60785, "epoch": 361} {"train_loss": -8.721734046936035, "global_step": 60786, "epoch": 361} {"train_loss": -8.562219619750977, "global_step": 60787, "epoch": 361} {"train_loss": -8.649229049682617, "global_step": 60788, "epoch": 361} {"train_loss": -8.462987899780273, "global_step": 60789, "epoch": 361} {"train_loss": -8.341803550720215, "global_step": 60790, "epoch": 361} {"train_loss": -8.527566909790039, "global_step": 60791, "epoch": 361} {"train_loss": -8.453754425048828, "global_step": 60792, "epoch": 361} {"train_loss": -8.659130096435547, "global_step": 60793, "epoch": 361} {"train_loss": -8.875375747680664, "global_step": 60794, "epoch": 361} {"train_loss": -8.67425537109375, "global_step": 60795, "epoch": 361} {"train_loss": -8.767097473144531, "global_step": 60796, "epoch": 361} {"train_loss": -8.604379653930664, "global_step": 60797, "epoch": 361} {"train_loss": -8.713127136230469, "global_step": 60798, "epoch": 361} {"train_loss": -8.650732040405273, "global_step": 60799, "epoch": 361} {"train_loss": -8.60842227935791, "global_step": 60800, "epoch": 361} {"train_loss": -8.697839736938477, "global_step": 60801, "epoch": 361} {"train_loss": -8.803910255432129, "global_step": 60802, "epoch": 361} {"train_loss": -8.417264938354492, "global_step": 60803, "epoch": 361} {"train_loss": -8.628467559814453, "global_step": 60804, "epoch": 361} {"train_loss": -8.586905479431152, "global_step": 60805, "epoch": 361} {"train_loss": -8.650030136108398, "global_step": 60806, "epoch": 361} {"train_loss": -8.766420364379883, "global_step": 60807, "epoch": 361} {"train_loss": -8.776213645935059, "global_step": 60808, "epoch": 361} {"train_loss": -8.557066917419434, "global_step": 60809, "epoch": 361} {"train_loss": -8.881818771362305, "global_step": 60810, "epoch": 361} {"train_loss": -8.850875854492188, "global_step": 60811, "epoch": 361} {"train_loss": -8.840784072875977, "global_step": 60812, "epoch": 361} {"train_loss": -8.93880558013916, "global_step": 60813, "epoch": 361} {"train_loss": -8.63430404663086, "global_step": 60814, "epoch": 361} {"train_loss": -8.61342465877533, "global_step": 60815, "epoch": 361, "val_loss": 189459.578125} {"train_loss": -8.34875202178955, "global_step": 60816, "epoch": 362} {"train_loss": -8.704317092895508, "global_step": 60817, "epoch": 362} {"train_loss": -8.430402755737305, "global_step": 60818, "epoch": 362} {"train_loss": -8.527395248413086, "global_step": 60819, "epoch": 362} {"train_loss": -8.592251777648926, "global_step": 60820, "epoch": 362} {"train_loss": -8.510688781738281, "global_step": 60821, "epoch": 362} {"train_loss": -8.491645812988281, "global_step": 60822, "epoch": 362} {"train_loss": -8.674581527709961, "global_step": 60823, "epoch": 362} {"train_loss": -8.695379257202148, "global_step": 60824, "epoch": 362} {"train_loss": -8.798877716064453, "global_step": 60825, "epoch": 362} {"train_loss": -8.779409408569336, "global_step": 60826, "epoch": 362} {"train_loss": -8.86064338684082, "global_step": 60827, "epoch": 362} {"train_loss": -8.634054183959961, "global_step": 60828, "epoch": 362} {"train_loss": -8.772198677062988, "global_step": 60829, "epoch": 362} {"train_loss": -8.697782516479492, "global_step": 60830, "epoch": 362} {"train_loss": -8.617019653320312, "global_step": 60831, "epoch": 362} {"train_loss": -8.78702449798584, "global_step": 60832, "epoch": 362} {"train_loss": -8.947403907775879, "global_step": 60833, "epoch": 362} {"train_loss": -8.84592056274414, "global_step": 60834, "epoch": 362} {"train_loss": -8.745436668395996, "global_step": 60835, "epoch": 362} {"train_loss": -8.749231338500977, "global_step": 60836, "epoch": 362} {"train_loss": -8.672159194946289, "global_step": 60837, "epoch": 362} {"train_loss": -8.67353630065918, "global_step": 60838, "epoch": 362} {"train_loss": -8.471610069274902, "global_step": 60839, "epoch": 362} {"train_loss": -8.63688850402832, "global_step": 60840, "epoch": 362} {"train_loss": -8.779485702514648, "global_step": 60841, "epoch": 362} {"train_loss": -8.592918395996094, "global_step": 60842, "epoch": 362} {"train_loss": -9.013113021850586, "global_step": 60843, "epoch": 362} {"train_loss": -8.862319946289062, "global_step": 60844, "epoch": 362} {"train_loss": -8.96780014038086, "global_step": 60845, "epoch": 362} {"train_loss": -8.714653968811035, "global_step": 60846, "epoch": 362} {"train_loss": -8.616374969482422, "global_step": 60847, "epoch": 362} {"train_loss": -8.774428367614746, "global_step": 60848, "epoch": 362} {"train_loss": -8.542494773864746, "global_step": 60849, "epoch": 362} {"train_loss": -8.777875900268555, "global_step": 60850, "epoch": 362} {"train_loss": -8.72237777709961, "global_step": 60851, "epoch": 362} {"train_loss": -8.747193336486816, "global_step": 60852, "epoch": 362} {"train_loss": -8.550349235534668, "global_step": 60853, "epoch": 362} {"train_loss": -8.723027229309082, "global_step": 60854, "epoch": 362} {"train_loss": -8.552762985229492, "global_step": 60855, "epoch": 362} {"train_loss": -8.29770278930664, "global_step": 60856, "epoch": 362} {"train_loss": -8.613956451416016, "global_step": 60857, "epoch": 362} {"train_loss": -8.738142013549805, "global_step": 60858, "epoch": 362} {"train_loss": -8.702458381652832, "global_step": 60859, "epoch": 362} {"train_loss": -8.433391571044922, "global_step": 60860, "epoch": 362} {"train_loss": -8.610125541687012, "global_step": 60861, "epoch": 362} {"train_loss": -8.57100772857666, "global_step": 60862, "epoch": 362} {"train_loss": -8.546621322631836, "global_step": 60863, "epoch": 362} {"train_loss": -8.67332649230957, "global_step": 60864, "epoch": 362} {"train_loss": -8.625405311584473, "global_step": 60865, "epoch": 362} {"train_loss": -8.794066429138184, "global_step": 60866, "epoch": 362} {"train_loss": -8.615582466125488, "global_step": 60867, "epoch": 362} {"train_loss": -8.868863105773926, "global_step": 60868, "epoch": 362} {"train_loss": -8.824283599853516, "global_step": 60869, "epoch": 362} {"train_loss": -8.426742553710938, "global_step": 60870, "epoch": 362} {"train_loss": -8.721919059753418, "global_step": 60871, "epoch": 362} {"train_loss": -8.854142189025879, "global_step": 60872, "epoch": 362} {"train_loss": -8.812684059143066, "global_step": 60873, "epoch": 362} {"train_loss": -8.544010162353516, "global_step": 60874, "epoch": 362} {"train_loss": -8.762873649597168, "global_step": 60875, "epoch": 362} {"train_loss": -8.418342590332031, "global_step": 60876, "epoch": 362} {"train_loss": -8.905508995056152, "global_step": 60877, "epoch": 362} {"train_loss": -8.791955947875977, "global_step": 60878, "epoch": 362} {"train_loss": -8.819223403930664, "global_step": 60879, "epoch": 362} {"train_loss": -8.678757667541504, "global_step": 60880, "epoch": 362} {"train_loss": -8.78174114227295, "global_step": 60881, "epoch": 362} {"train_loss": -8.571401596069336, "global_step": 60882, "epoch": 362} {"train_loss": -8.725686073303223, "global_step": 60883, "epoch": 362} {"train_loss": -8.687262535095215, "global_step": 60884, "epoch": 362} {"train_loss": -8.54753589630127, "global_step": 60885, "epoch": 362} {"train_loss": -8.94033145904541, "global_step": 60886, "epoch": 362} {"train_loss": -8.624605178833008, "global_step": 60887, "epoch": 362} {"train_loss": -8.909595489501953, "global_step": 60888, "epoch": 362} {"train_loss": -8.763824462890625, "global_step": 60889, "epoch": 362} {"train_loss": -8.778390884399414, "global_step": 60890, "epoch": 362} {"train_loss": -8.643698692321777, "global_step": 60891, "epoch": 362} {"train_loss": -8.857048988342285, "global_step": 60892, "epoch": 362} {"train_loss": -8.42906379699707, "global_step": 60893, "epoch": 362} {"train_loss": -8.674969673156738, "global_step": 60894, "epoch": 362} {"train_loss": -8.556171417236328, "global_step": 60895, "epoch": 362} {"train_loss": -8.556953430175781, "global_step": 60896, "epoch": 362} {"train_loss": -8.705402374267578, "global_step": 60897, "epoch": 362} {"train_loss": -8.718830108642578, "global_step": 60898, "epoch": 362} {"train_loss": -8.684737205505371, "global_step": 60899, "epoch": 362} {"train_loss": -8.904090881347656, "global_step": 60900, "epoch": 362} {"train_loss": -8.599081039428711, "global_step": 60901, "epoch": 362} {"train_loss": -8.762701034545898, "global_step": 60902, "epoch": 362} {"train_loss": -8.923776626586914, "global_step": 60903, "epoch": 362} {"train_loss": -8.726020812988281, "global_step": 60904, "epoch": 362} {"train_loss": -8.718753814697266, "global_step": 60905, "epoch": 362} {"train_loss": -8.559576034545898, "global_step": 60906, "epoch": 362} {"train_loss": -8.28339958190918, "global_step": 60907, "epoch": 362} {"train_loss": -8.880874633789062, "global_step": 60908, "epoch": 362} {"train_loss": -8.513514518737793, "global_step": 60909, "epoch": 362} {"train_loss": -8.575370788574219, "global_step": 60910, "epoch": 362} {"train_loss": -8.567206382751465, "global_step": 60911, "epoch": 362} {"train_loss": -8.697430610656738, "global_step": 60912, "epoch": 362} {"train_loss": -8.661515235900879, "global_step": 60913, "epoch": 362} {"train_loss": -8.403640747070312, "global_step": 60914, "epoch": 362} {"train_loss": -8.676994323730469, "global_step": 60915, "epoch": 362} {"train_loss": -8.72125244140625, "global_step": 60916, "epoch": 362} {"train_loss": -8.584573745727539, "global_step": 60917, "epoch": 362} {"train_loss": -8.601530075073242, "global_step": 60918, "epoch": 362} {"train_loss": -8.65914535522461, "global_step": 60919, "epoch": 362} {"train_loss": -8.603227615356445, "global_step": 60920, "epoch": 362} {"train_loss": -8.483318328857422, "global_step": 60921, "epoch": 362} {"train_loss": -8.708739280700684, "global_step": 60922, "epoch": 362} {"train_loss": -8.604442596435547, "global_step": 60923, "epoch": 362} {"train_loss": -8.793172836303711, "global_step": 60924, "epoch": 362} {"train_loss": -8.504463195800781, "global_step": 60925, "epoch": 362} {"train_loss": -8.699518203735352, "global_step": 60926, "epoch": 362} {"train_loss": -8.54537582397461, "global_step": 60927, "epoch": 362} {"train_loss": -8.606260299682617, "global_step": 60928, "epoch": 362} {"train_loss": -8.605597496032715, "global_step": 60929, "epoch": 362} {"train_loss": -8.894186973571777, "global_step": 60930, "epoch": 362} {"train_loss": -8.736083984375, "global_step": 60931, "epoch": 362} {"train_loss": -8.610028266906738, "global_step": 60932, "epoch": 362} {"train_loss": -8.613823890686035, "global_step": 60933, "epoch": 362} {"train_loss": -8.816824913024902, "global_step": 60934, "epoch": 362} {"train_loss": -8.797453880310059, "global_step": 60935, "epoch": 362} {"train_loss": -8.816262245178223, "global_step": 60936, "epoch": 362} {"train_loss": -8.454780578613281, "global_step": 60937, "epoch": 362} {"train_loss": -8.67232894897461, "global_step": 60938, "epoch": 362} {"train_loss": -8.742815017700195, "global_step": 60939, "epoch": 362} {"train_loss": -8.907096862792969, "global_step": 60940, "epoch": 362} {"train_loss": -8.738430976867676, "global_step": 60941, "epoch": 362} {"train_loss": -8.58576774597168, "global_step": 60942, "epoch": 362} {"train_loss": -8.620317459106445, "global_step": 60943, "epoch": 362} {"train_loss": -8.615339279174805, "global_step": 60944, "epoch": 362} {"train_loss": -8.596731185913086, "global_step": 60945, "epoch": 362} {"train_loss": -8.562685012817383, "global_step": 60946, "epoch": 362} {"train_loss": -8.66392707824707, "global_step": 60947, "epoch": 362} {"train_loss": -8.630407333374023, "global_step": 60948, "epoch": 362} {"train_loss": -8.528827667236328, "global_step": 60949, "epoch": 362} {"train_loss": -8.340513229370117, "global_step": 60950, "epoch": 362} {"train_loss": -8.42481803894043, "global_step": 60951, "epoch": 362} {"train_loss": -8.435302734375, "global_step": 60952, "epoch": 362} {"train_loss": -8.313026428222656, "global_step": 60953, "epoch": 362} {"train_loss": -8.693889617919922, "global_step": 60954, "epoch": 362} {"train_loss": -8.540568351745605, "global_step": 60955, "epoch": 362} {"train_loss": -8.495500564575195, "global_step": 60956, "epoch": 362} {"train_loss": -8.72652816772461, "global_step": 60957, "epoch": 362} {"train_loss": -8.439970016479492, "global_step": 60958, "epoch": 362} {"train_loss": -8.380033493041992, "global_step": 60959, "epoch": 362} {"train_loss": -8.192346572875977, "global_step": 60960, "epoch": 362} {"train_loss": -8.501153945922852, "global_step": 60961, "epoch": 362} {"train_loss": -8.419992446899414, "global_step": 60962, "epoch": 362} {"train_loss": -8.471671104431152, "global_step": 60963, "epoch": 362} {"train_loss": -8.112298011779785, "global_step": 60964, "epoch": 362} {"train_loss": -8.355741500854492, "global_step": 60965, "epoch": 362} {"train_loss": -8.640390396118164, "global_step": 60966, "epoch": 362} {"train_loss": -8.519491195678711, "global_step": 60967, "epoch": 362} {"train_loss": -8.386558532714844, "global_step": 60968, "epoch": 362} {"train_loss": -8.47720718383789, "global_step": 60969, "epoch": 362} {"train_loss": -8.404635429382324, "global_step": 60970, "epoch": 362} {"train_loss": -8.735097885131836, "global_step": 60971, "epoch": 362} {"train_loss": -8.484232902526855, "global_step": 60972, "epoch": 362} {"train_loss": -8.638132095336914, "global_step": 60973, "epoch": 362} {"train_loss": -8.729509353637695, "global_step": 60974, "epoch": 362} {"train_loss": -8.511126518249512, "global_step": 60975, "epoch": 362} {"train_loss": -8.48042106628418, "global_step": 60976, "epoch": 362} {"train_loss": -8.65351390838623, "global_step": 60977, "epoch": 362} {"train_loss": -8.669300079345703, "global_step": 60978, "epoch": 362} {"train_loss": -8.562907218933105, "global_step": 60979, "epoch": 362} {"train_loss": -8.653215408325195, "global_step": 60980, "epoch": 362} {"train_loss": -8.738079071044922, "global_step": 60981, "epoch": 362} {"train_loss": -8.921541213989258, "global_step": 60982, "epoch": 362} {"train_loss": -8.643569974672227, "global_step": 60983, "epoch": 362, "val_loss": 190841.390625} {"train_loss": -8.728445053100586, "global_step": 60984, "epoch": 363} {"train_loss": -8.794528007507324, "global_step": 60985, "epoch": 363} {"train_loss": -8.855222702026367, "global_step": 60986, "epoch": 363} {"train_loss": -8.816522598266602, "global_step": 60987, "epoch": 363} {"train_loss": -8.900593757629395, "global_step": 60988, "epoch": 363} {"train_loss": -8.835521697998047, "global_step": 60989, "epoch": 363} {"train_loss": -8.708826065063477, "global_step": 60990, "epoch": 363} {"train_loss": -8.725835800170898, "global_step": 60991, "epoch": 363} {"train_loss": -8.795682907104492, "global_step": 60992, "epoch": 363} {"train_loss": -8.684940338134766, "global_step": 60993, "epoch": 363} {"train_loss": -8.869205474853516, "global_step": 60994, "epoch": 363} {"train_loss": -8.718072891235352, "global_step": 60995, "epoch": 363} {"train_loss": -8.774389266967773, "global_step": 60996, "epoch": 363} {"train_loss": -8.786407470703125, "global_step": 60997, "epoch": 363} {"train_loss": -8.78965950012207, "global_step": 60998, "epoch": 363} {"train_loss": -8.628936767578125, "global_step": 60999, "epoch": 363} {"train_loss": -8.786710739135742, "global_step": 61000, "epoch": 363} {"train_loss": -8.716751098632812, "global_step": 61001, "epoch": 363} {"train_loss": -8.690290451049805, "global_step": 61002, "epoch": 363} {"train_loss": -8.611262321472168, "global_step": 61003, "epoch": 363} {"train_loss": -8.608182907104492, "global_step": 61004, "epoch": 363} {"train_loss": -8.8646240234375, "global_step": 61005, "epoch": 363} {"train_loss": -8.662854194641113, "global_step": 61006, "epoch": 363} {"train_loss": -8.730766296386719, "global_step": 61007, "epoch": 363} {"train_loss": -8.52659797668457, "global_step": 61008, "epoch": 363} {"train_loss": -8.638833045959473, "global_step": 61009, "epoch": 363} {"train_loss": -8.650520324707031, "global_step": 61010, "epoch": 363} {"train_loss": -8.806310653686523, "global_step": 61011, "epoch": 363} {"train_loss": -8.862056732177734, "global_step": 61012, "epoch": 363} {"train_loss": -8.599380493164062, "global_step": 61013, "epoch": 363} {"train_loss": -8.605262756347656, "global_step": 61014, "epoch": 363} {"train_loss": -8.289785385131836, "global_step": 61015, "epoch": 363} {"train_loss": -8.698408126831055, "global_step": 61016, "epoch": 363} {"train_loss": -8.35857105255127, "global_step": 61017, "epoch": 363} {"train_loss": -8.436111450195312, "global_step": 61018, "epoch": 363} {"train_loss": -8.681930541992188, "global_step": 61019, "epoch": 363} {"train_loss": -8.831769943237305, "global_step": 61020, "epoch": 363} {"train_loss": -8.685619354248047, "global_step": 61021, "epoch": 363} {"train_loss": -8.709951400756836, "global_step": 61022, "epoch": 363} {"train_loss": -8.956244468688965, "global_step": 61023, "epoch": 363} {"train_loss": -8.659807205200195, "global_step": 61024, "epoch": 363} {"train_loss": -8.89883804321289, "global_step": 61025, "epoch": 363} {"train_loss": -8.577390670776367, "global_step": 61026, "epoch": 363} {"train_loss": -8.692375183105469, "global_step": 61027, "epoch": 363} {"train_loss": -9.030094146728516, "global_step": 61028, "epoch": 363} {"train_loss": -8.655675888061523, "global_step": 61029, "epoch": 363} {"train_loss": -8.864286422729492, "global_step": 61030, "epoch": 363} {"train_loss": -8.766471862792969, "global_step": 61031, "epoch": 363} {"train_loss": -8.684823989868164, "global_step": 61032, "epoch": 363} {"train_loss": -8.56597900390625, "global_step": 61033, "epoch": 363} {"train_loss": -9.016193389892578, "global_step": 61034, "epoch": 363} {"train_loss": -8.556170463562012, "global_step": 61035, "epoch": 363} {"train_loss": -8.887057304382324, "global_step": 61036, "epoch": 363} {"train_loss": -9.01878833770752, "global_step": 61037, "epoch": 363} {"train_loss": -8.815278053283691, "global_step": 61038, "epoch": 363} {"train_loss": -8.776449203491211, "global_step": 61039, "epoch": 363} {"train_loss": -8.846139907836914, "global_step": 61040, "epoch": 363} {"train_loss": -8.811288833618164, "global_step": 61041, "epoch": 363} {"train_loss": -8.861427307128906, "global_step": 61042, "epoch": 363} {"train_loss": -8.509279251098633, "global_step": 61043, "epoch": 363} {"train_loss": -8.827333450317383, "global_step": 61044, "epoch": 363} {"train_loss": -8.813776016235352, "global_step": 61045, "epoch": 363} {"train_loss": -8.430957794189453, "global_step": 61046, "epoch": 363} {"train_loss": -8.80506420135498, "global_step": 61047, "epoch": 363} {"train_loss": -8.433124542236328, "global_step": 61048, "epoch": 363} {"train_loss": -8.535406112670898, "global_step": 61049, "epoch": 363} {"train_loss": -8.947787284851074, "global_step": 61050, "epoch": 363} {"train_loss": -8.511571884155273, "global_step": 61051, "epoch": 363} {"train_loss": -8.412049293518066, "global_step": 61052, "epoch": 363} {"train_loss": -8.571146011352539, "global_step": 61053, "epoch": 363} {"train_loss": -8.631875038146973, "global_step": 61054, "epoch": 363} {"train_loss": -8.447463989257812, "global_step": 61055, "epoch": 363} {"train_loss": -8.437433242797852, "global_step": 61056, "epoch": 363} {"train_loss": -8.502973556518555, "global_step": 61057, "epoch": 363} {"train_loss": -8.686959266662598, "global_step": 61058, "epoch": 363} {"train_loss": -8.69436264038086, "global_step": 61059, "epoch": 363} {"train_loss": -8.633183479309082, "global_step": 61060, "epoch": 363} {"train_loss": -8.744209289550781, "global_step": 61061, "epoch": 363} {"train_loss": -8.480194091796875, "global_step": 61062, "epoch": 363} {"train_loss": -8.395317077636719, "global_step": 61063, "epoch": 363} {"train_loss": -8.504377365112305, "global_step": 61064, "epoch": 363} {"train_loss": -8.628959655761719, "global_step": 61065, "epoch": 363} {"train_loss": -8.653347969055176, "global_step": 61066, "epoch": 363} {"train_loss": -8.416970252990723, "global_step": 61067, "epoch": 363} {"train_loss": -8.662551879882812, "global_step": 61068, "epoch": 363} {"train_loss": -8.726798057556152, "global_step": 61069, "epoch": 363} {"train_loss": -8.660511016845703, "global_step": 61070, "epoch": 363} {"train_loss": -8.527189254760742, "global_step": 61071, "epoch": 363} {"train_loss": -8.646881103515625, "global_step": 61072, "epoch": 363} {"train_loss": -8.578298568725586, "global_step": 61073, "epoch": 363} {"train_loss": -8.836841583251953, "global_step": 61074, "epoch": 363} {"train_loss": -8.755409240722656, "global_step": 61075, "epoch": 363} {"train_loss": -8.563241004943848, "global_step": 61076, "epoch": 363} {"train_loss": -8.897106170654297, "global_step": 61077, "epoch": 363} {"train_loss": -8.770811080932617, "global_step": 61078, "epoch": 363} {"train_loss": -8.708660125732422, "global_step": 61079, "epoch": 363} {"train_loss": -8.541824340820312, "global_step": 61080, "epoch": 363} {"train_loss": -8.48179817199707, "global_step": 61081, "epoch": 363} {"train_loss": -8.713513374328613, "global_step": 61082, "epoch": 363} {"train_loss": -8.94005012512207, "global_step": 61083, "epoch": 363} {"train_loss": -8.411212921142578, "global_step": 61084, "epoch": 363} {"train_loss": -8.49293327331543, "global_step": 61085, "epoch": 363} {"train_loss": -8.633596420288086, "global_step": 61086, "epoch": 363} {"train_loss": -8.592141151428223, "global_step": 61087, "epoch": 363} {"train_loss": -8.696615219116211, "global_step": 61088, "epoch": 363} {"train_loss": -8.63007926940918, "global_step": 61089, "epoch": 363} {"train_loss": -8.503952026367188, "global_step": 61090, "epoch": 363} {"train_loss": -8.797972679138184, "global_step": 61091, "epoch": 363} {"train_loss": -8.947708129882812, "global_step": 61092, "epoch": 363} {"train_loss": -8.873279571533203, "global_step": 61093, "epoch": 363} {"train_loss": -8.837089538574219, "global_step": 61094, "epoch": 363} {"train_loss": -8.99593734741211, "global_step": 61095, "epoch": 363} {"train_loss": -8.912510871887207, "global_step": 61096, "epoch": 363} {"train_loss": -8.71839714050293, "global_step": 61097, "epoch": 363} {"train_loss": -8.716230392456055, "global_step": 61098, "epoch": 363} {"train_loss": -8.853452682495117, "global_step": 61099, "epoch": 363} {"train_loss": -8.653341293334961, "global_step": 61100, "epoch": 363} {"train_loss": -8.689226150512695, "global_step": 61101, "epoch": 363} {"train_loss": -8.478414535522461, "global_step": 61102, "epoch": 363} {"train_loss": -8.766860008239746, "global_step": 61103, "epoch": 363} {"train_loss": -8.566431045532227, "global_step": 61104, "epoch": 363} {"train_loss": -8.879077911376953, "global_step": 61105, "epoch": 363} {"train_loss": -8.722290992736816, "global_step": 61106, "epoch": 363} {"train_loss": -8.79674243927002, "global_step": 61107, "epoch": 363} {"train_loss": -8.574148178100586, "global_step": 61108, "epoch": 363} {"train_loss": -8.800586700439453, "global_step": 61109, "epoch": 363} {"train_loss": -8.757972717285156, "global_step": 61110, "epoch": 363} {"train_loss": -8.756912231445312, "global_step": 61111, "epoch": 363} {"train_loss": -8.832436561584473, "global_step": 61112, "epoch": 363} {"train_loss": -8.722050666809082, "global_step": 61113, "epoch": 363} {"train_loss": -8.628384590148926, "global_step": 61114, "epoch": 363} {"train_loss": -8.734249114990234, "global_step": 61115, "epoch": 363} {"train_loss": -8.560105323791504, "global_step": 61116, "epoch": 363} {"train_loss": -8.453498840332031, "global_step": 61117, "epoch": 363} {"train_loss": -8.70728874206543, "global_step": 61118, "epoch": 363} {"train_loss": -8.510893821716309, "global_step": 61119, "epoch": 363} {"train_loss": -8.776931762695312, "global_step": 61120, "epoch": 363} {"train_loss": -8.656486511230469, "global_step": 61121, "epoch": 363} {"train_loss": -8.4893798828125, "global_step": 61122, "epoch": 363} {"train_loss": -8.564083099365234, "global_step": 61123, "epoch": 363} {"train_loss": -8.666162490844727, "global_step": 61124, "epoch": 363} {"train_loss": -8.538386344909668, "global_step": 61125, "epoch": 363} {"train_loss": -8.373379707336426, "global_step": 61126, "epoch": 363} {"train_loss": -8.465518951416016, "global_step": 61127, "epoch": 363} {"train_loss": -8.58952522277832, "global_step": 61128, "epoch": 363} {"train_loss": -8.595006942749023, "global_step": 61129, "epoch": 363} {"train_loss": -8.75788402557373, "global_step": 61130, "epoch": 363} {"train_loss": -8.857719421386719, "global_step": 61131, "epoch": 363} {"train_loss": -8.658504486083984, "global_step": 61132, "epoch": 363} {"train_loss": -8.789875030517578, "global_step": 61133, "epoch": 363} {"train_loss": -8.710237503051758, "global_step": 61134, "epoch": 363} {"train_loss": -8.735916137695312, "global_step": 61135, "epoch": 363} {"train_loss": -8.612039566040039, "global_step": 61136, "epoch": 363} {"train_loss": -8.637434005737305, "global_step": 61137, "epoch": 363} {"train_loss": -8.812933921813965, "global_step": 61138, "epoch": 363} {"train_loss": -8.871577262878418, "global_step": 61139, "epoch": 363} {"train_loss": -8.542543411254883, "global_step": 61140, "epoch": 363} {"train_loss": -8.535234451293945, "global_step": 61141, "epoch": 363} {"train_loss": -8.662836074829102, "global_step": 61142, "epoch": 363} {"train_loss": -8.42216968536377, "global_step": 61143, "epoch": 363} {"train_loss": -8.632955551147461, "global_step": 61144, "epoch": 363} {"train_loss": -8.34197998046875, "global_step": 61145, "epoch": 363} {"train_loss": -8.433085441589355, "global_step": 61146, "epoch": 363} {"train_loss": -8.576173782348633, "global_step": 61147, "epoch": 363} {"train_loss": -8.510733604431152, "global_step": 61148, "epoch": 363} {"train_loss": -8.444391250610352, "global_step": 61149, "epoch": 363} {"train_loss": -8.6519775390625, "global_step": 61150, "epoch": 363} {"train_loss": -8.677369242622738, "global_step": 61151, "epoch": 363, "val_loss": 190951.796875} {"train_loss": -8.403475761413574, "global_step": 61152, "epoch": 364} {"train_loss": -8.37098217010498, "global_step": 61153, "epoch": 364} {"train_loss": -8.892607688903809, "global_step": 61154, "epoch": 364} {"train_loss": -8.04275894165039, "global_step": 61155, "epoch": 364} {"train_loss": -8.514533996582031, "global_step": 61156, "epoch": 364} {"train_loss": -7.995517730712891, "global_step": 61157, "epoch": 364} {"train_loss": -8.715868949890137, "global_step": 61158, "epoch": 364} {"train_loss": -8.323299407958984, "global_step": 61159, "epoch": 364} {"train_loss": -8.33231258392334, "global_step": 61160, "epoch": 364} {"train_loss": -8.391611099243164, "global_step": 61161, "epoch": 364} {"train_loss": -8.38517951965332, "global_step": 61162, "epoch": 364} {"train_loss": -8.096227645874023, "global_step": 61163, "epoch": 364} {"train_loss": -8.362711906433105, "global_step": 61164, "epoch": 364} {"train_loss": -8.471044540405273, "global_step": 61165, "epoch": 364} {"train_loss": -8.631841659545898, "global_step": 61166, "epoch": 364} {"train_loss": -8.522991180419922, "global_step": 61167, "epoch": 364} {"train_loss": -8.474152565002441, "global_step": 61168, "epoch": 364} {"train_loss": -8.47484302520752, "global_step": 61169, "epoch": 364} {"train_loss": -8.617876052856445, "global_step": 61170, "epoch": 364} {"train_loss": -8.268425941467285, "global_step": 61171, "epoch": 364} {"train_loss": -8.557247161865234, "global_step": 61172, "epoch": 364} {"train_loss": -8.510868072509766, "global_step": 61173, "epoch": 364} {"train_loss": -8.534294128417969, "global_step": 61174, "epoch": 364} {"train_loss": -8.378149032592773, "global_step": 61175, "epoch": 364} {"train_loss": -8.369902610778809, "global_step": 61176, "epoch": 364} {"train_loss": -8.532114028930664, "global_step": 61177, "epoch": 364} {"train_loss": -8.616405487060547, "global_step": 61178, "epoch": 364} {"train_loss": -8.559456825256348, "global_step": 61179, "epoch": 364} {"train_loss": -8.549345970153809, "global_step": 61180, "epoch": 364} {"train_loss": -8.666532516479492, "global_step": 61181, "epoch": 364} {"train_loss": -8.534360885620117, "global_step": 61182, "epoch": 364} {"train_loss": -8.757050514221191, "global_step": 61183, "epoch": 364} {"train_loss": -8.631645202636719, "global_step": 61184, "epoch": 364} {"train_loss": -8.578104019165039, "global_step": 61185, "epoch": 364} {"train_loss": -8.588801383972168, "global_step": 61186, "epoch": 364} {"train_loss": -8.829387664794922, "global_step": 61187, "epoch": 364} {"train_loss": -8.592514038085938, "global_step": 61188, "epoch": 364} {"train_loss": -8.63557243347168, "global_step": 61189, "epoch": 364} {"train_loss": -8.617799758911133, "global_step": 61190, "epoch": 364} {"train_loss": -8.559024810791016, "global_step": 61191, "epoch": 364} {"train_loss": -8.586124420166016, "global_step": 61192, "epoch": 364} {"train_loss": -8.81389045715332, "global_step": 61193, "epoch": 364} {"train_loss": -8.91925048828125, "global_step": 61194, "epoch": 364} {"train_loss": -8.699777603149414, "global_step": 61195, "epoch": 364} {"train_loss": -8.790273666381836, "global_step": 61196, "epoch": 364} {"train_loss": -8.686578750610352, "global_step": 61197, "epoch": 364} {"train_loss": -8.697542190551758, "global_step": 61198, "epoch": 364} {"train_loss": -8.882421493530273, "global_step": 61199, "epoch": 364} {"train_loss": -8.912068367004395, "global_step": 61200, "epoch": 364} {"train_loss": -9.027216911315918, "global_step": 61201, "epoch": 364} {"train_loss": -8.744287490844727, "global_step": 61202, "epoch": 364} {"train_loss": -8.746025085449219, "global_step": 61203, "epoch": 364} {"train_loss": -8.834210395812988, "global_step": 61204, "epoch": 364} {"train_loss": -8.753885269165039, "global_step": 61205, "epoch": 364} {"train_loss": -8.729825019836426, "global_step": 61206, "epoch": 364} {"train_loss": -8.82998275756836, "global_step": 61207, "epoch": 364} {"train_loss": -8.976491928100586, "global_step": 61208, "epoch": 364} {"train_loss": -8.563004493713379, "global_step": 61209, "epoch": 364} {"train_loss": -8.754582405090332, "global_step": 61210, "epoch": 364} {"train_loss": -8.724414825439453, "global_step": 61211, "epoch": 364} {"train_loss": -8.698690414428711, "global_step": 61212, "epoch": 364} {"train_loss": -8.72025203704834, "global_step": 61213, "epoch": 364} {"train_loss": -8.703231811523438, "global_step": 61214, "epoch": 364} {"train_loss": -8.765953063964844, "global_step": 61215, "epoch": 364} {"train_loss": -8.927023887634277, "global_step": 61216, "epoch": 364} {"train_loss": -8.739049911499023, "global_step": 61217, "epoch": 364} {"train_loss": -9.126343727111816, "global_step": 61218, "epoch": 364} {"train_loss": -8.670294761657715, "global_step": 61219, "epoch": 364} {"train_loss": -8.982259750366211, "global_step": 61220, "epoch": 364} {"train_loss": -8.606498718261719, "global_step": 61221, "epoch": 364} {"train_loss": -8.525876998901367, "global_step": 61222, "epoch": 364} {"train_loss": -8.752458572387695, "global_step": 61223, "epoch": 364} {"train_loss": -8.508068084716797, "global_step": 61224, "epoch": 364} {"train_loss": -8.955662727355957, "global_step": 61225, "epoch": 364} {"train_loss": -8.772241592407227, "global_step": 61226, "epoch": 364} {"train_loss": -8.9312744140625, "global_step": 61227, "epoch": 364} {"train_loss": -8.73254108428955, "global_step": 61228, "epoch": 364} {"train_loss": -8.7542142868042, "global_step": 61229, "epoch": 364} {"train_loss": -8.655996322631836, "global_step": 61230, "epoch": 364} {"train_loss": -8.641011238098145, "global_step": 61231, "epoch": 364} {"train_loss": -8.668025970458984, "global_step": 61232, "epoch": 364} {"train_loss": -8.817354202270508, "global_step": 61233, "epoch": 364} {"train_loss": -8.259613037109375, "global_step": 61234, "epoch": 364} {"train_loss": -8.716606140136719, "global_step": 61235, "epoch": 364} {"train_loss": -8.37998104095459, "global_step": 61236, "epoch": 364} {"train_loss": -8.449003219604492, "global_step": 61237, "epoch": 364} {"train_loss": -8.392425537109375, "global_step": 61238, "epoch": 364} {"train_loss": -8.555188179016113, "global_step": 61239, "epoch": 364} {"train_loss": -8.584942817687988, "global_step": 61240, "epoch": 364} {"train_loss": -8.465926170349121, "global_step": 61241, "epoch": 364} {"train_loss": -8.72404956817627, "global_step": 61242, "epoch": 364} {"train_loss": -8.698512077331543, "global_step": 61243, "epoch": 364} {"train_loss": -8.71804428100586, "global_step": 61244, "epoch": 364} {"train_loss": -8.554336547851562, "global_step": 61245, "epoch": 364} {"train_loss": -8.660130500793457, "global_step": 61246, "epoch": 364} {"train_loss": -8.46876335144043, "global_step": 61247, "epoch": 364} {"train_loss": -8.545236587524414, "global_step": 61248, "epoch": 364} {"train_loss": -8.557939529418945, "global_step": 61249, "epoch": 364} {"train_loss": -8.574131965637207, "global_step": 61250, "epoch": 364} {"train_loss": -8.408199310302734, "global_step": 61251, "epoch": 364} {"train_loss": -8.75594711303711, "global_step": 61252, "epoch": 364} {"train_loss": -8.69167423248291, "global_step": 61253, "epoch": 364} {"train_loss": -8.633968353271484, "global_step": 61254, "epoch": 364} {"train_loss": -8.739524841308594, "global_step": 61255, "epoch": 364} {"train_loss": -8.83293628692627, "global_step": 61256, "epoch": 364} {"train_loss": -8.924605369567871, "global_step": 61257, "epoch": 364} {"train_loss": -8.628822326660156, "global_step": 61258, "epoch": 364} {"train_loss": -8.654964447021484, "global_step": 61259, "epoch": 364} {"train_loss": -8.321415901184082, "global_step": 61260, "epoch": 364} {"train_loss": -8.600014686584473, "global_step": 61261, "epoch": 364} {"train_loss": -8.639772415161133, "global_step": 61262, "epoch": 364} {"train_loss": -8.827104568481445, "global_step": 61263, "epoch": 364} {"train_loss": -8.972926139831543, "global_step": 61264, "epoch": 364} {"train_loss": -8.731781005859375, "global_step": 61265, "epoch": 364} {"train_loss": -8.538372039794922, "global_step": 61266, "epoch": 364} {"train_loss": -8.80858039855957, "global_step": 61267, "epoch": 364} {"train_loss": -8.898015022277832, "global_step": 61268, "epoch": 364} {"train_loss": -8.641351699829102, "global_step": 61269, "epoch": 364} {"train_loss": -8.910356521606445, "global_step": 61270, "epoch": 364} {"train_loss": -8.775590896606445, "global_step": 61271, "epoch": 364} {"train_loss": -8.555737495422363, "global_step": 61272, "epoch": 364} {"train_loss": -8.651311874389648, "global_step": 61273, "epoch": 364} {"train_loss": -8.470973014831543, "global_step": 61274, "epoch": 364} {"train_loss": -9.023897171020508, "global_step": 61275, "epoch": 364} {"train_loss": -8.521653175354004, "global_step": 61276, "epoch": 364} {"train_loss": -8.64914608001709, "global_step": 61277, "epoch": 364} {"train_loss": -8.712911605834961, "global_step": 61278, "epoch": 364} {"train_loss": -8.620530128479004, "global_step": 61279, "epoch": 364} {"train_loss": -8.97693157196045, "global_step": 61280, "epoch": 364} {"train_loss": -8.792661666870117, "global_step": 61281, "epoch": 364} {"train_loss": -8.931528091430664, "global_step": 61282, "epoch": 364} {"train_loss": -8.565327644348145, "global_step": 61283, "epoch": 364} {"train_loss": -8.898852348327637, "global_step": 61284, "epoch": 364} {"train_loss": -8.684267044067383, "global_step": 61285, "epoch": 364} {"train_loss": -8.891446113586426, "global_step": 61286, "epoch": 364} {"train_loss": -8.5592041015625, "global_step": 61287, "epoch": 364} {"train_loss": -8.689826965332031, "global_step": 61288, "epoch": 364} {"train_loss": -8.648690223693848, "global_step": 61289, "epoch": 364} {"train_loss": -8.847564697265625, "global_step": 61290, "epoch": 364} {"train_loss": -8.599869728088379, "global_step": 61291, "epoch": 364} {"train_loss": -8.562182426452637, "global_step": 61292, "epoch": 364} {"train_loss": -8.630677223205566, "global_step": 61293, "epoch": 364} {"train_loss": -8.768753051757812, "global_step": 61294, "epoch": 364} {"train_loss": -8.697463989257812, "global_step": 61295, "epoch": 364} {"train_loss": -8.761741638183594, "global_step": 61296, "epoch": 364} {"train_loss": -8.750455856323242, "global_step": 61297, "epoch": 364} {"train_loss": -8.818925857543945, "global_step": 61298, "epoch": 364} {"train_loss": -8.40776252746582, "global_step": 61299, "epoch": 364} {"train_loss": -8.834651947021484, "global_step": 61300, "epoch": 364} {"train_loss": -8.476384162902832, "global_step": 61301, "epoch": 364} {"train_loss": -8.846412658691406, "global_step": 61302, "epoch": 364} {"train_loss": -8.487417221069336, "global_step": 61303, "epoch": 364} {"train_loss": -8.694564819335938, "global_step": 61304, "epoch": 364} {"train_loss": -8.651789665222168, "global_step": 61305, "epoch": 364} {"train_loss": -8.726247787475586, "global_step": 61306, "epoch": 364} {"train_loss": -8.488350868225098, "global_step": 61307, "epoch": 364} {"train_loss": -8.778863906860352, "global_step": 61308, "epoch": 364} {"train_loss": -8.599508285522461, "global_step": 61309, "epoch": 364} {"train_loss": -8.467068672180176, "global_step": 61310, "epoch": 364} {"train_loss": -8.426417350769043, "global_step": 61311, "epoch": 364} {"train_loss": -8.413544654846191, "global_step": 61312, "epoch": 364} {"train_loss": -8.344858169555664, "global_step": 61313, "epoch": 364} {"train_loss": -8.460554122924805, "global_step": 61314, "epoch": 364} {"train_loss": -8.623903274536133, "global_step": 61315, "epoch": 364} {"train_loss": -8.623579025268555, "global_step": 61316, "epoch": 364} {"train_loss": -8.411808967590332, "global_step": 61317, "epoch": 364} {"train_loss": -8.63831615447998, "global_step": 61318, "epoch": 364} {"train_loss": -8.641200406210762, "global_step": 61319, "epoch": 364, "val_loss": 191423.90625} {"train_loss": -8.480527877807617, "global_step": 61320, "epoch": 365} {"train_loss": -8.706880569458008, "global_step": 61321, "epoch": 365} {"train_loss": -8.478013038635254, "global_step": 61322, "epoch": 365} {"train_loss": -8.489517211914062, "global_step": 61323, "epoch": 365} {"train_loss": -8.608768463134766, "global_step": 61324, "epoch": 365} {"train_loss": -8.61520767211914, "global_step": 61325, "epoch": 365} {"train_loss": -8.68667984008789, "global_step": 61326, "epoch": 365} {"train_loss": -8.642148971557617, "global_step": 61327, "epoch": 365} {"train_loss": -8.703831672668457, "global_step": 61328, "epoch": 365} {"train_loss": -8.566251754760742, "global_step": 61329, "epoch": 365} {"train_loss": -8.820219039916992, "global_step": 61330, "epoch": 365} {"train_loss": -8.717872619628906, "global_step": 61331, "epoch": 365} {"train_loss": -8.69450569152832, "global_step": 61332, "epoch": 365} {"train_loss": -8.766902923583984, "global_step": 61333, "epoch": 365} {"train_loss": -8.767282485961914, "global_step": 61334, "epoch": 365} {"train_loss": -8.862630844116211, "global_step": 61335, "epoch": 365} {"train_loss": -8.85529899597168, "global_step": 61336, "epoch": 365} {"train_loss": -8.727563858032227, "global_step": 61337, "epoch": 365} {"train_loss": -8.798755645751953, "global_step": 61338, "epoch": 365} {"train_loss": -8.331901550292969, "global_step": 61339, "epoch": 365} {"train_loss": -8.552911758422852, "global_step": 61340, "epoch": 365} {"train_loss": -8.743631362915039, "global_step": 61341, "epoch": 365} {"train_loss": -8.374134063720703, "global_step": 61342, "epoch": 365} {"train_loss": -8.608205795288086, "global_step": 61343, "epoch": 365} {"train_loss": -8.52316665649414, "global_step": 61344, "epoch": 365} {"train_loss": -8.451695442199707, "global_step": 61345, "epoch": 365} {"train_loss": -8.680082321166992, "global_step": 61346, "epoch": 365} {"train_loss": -8.753572463989258, "global_step": 61347, "epoch": 365} {"train_loss": -8.81606388092041, "global_step": 61348, "epoch": 365} {"train_loss": -8.682122230529785, "global_step": 61349, "epoch": 365} {"train_loss": -8.646262168884277, "global_step": 61350, "epoch": 365} {"train_loss": -8.69066047668457, "global_step": 61351, "epoch": 365} {"train_loss": -8.728946685791016, "global_step": 61352, "epoch": 365} {"train_loss": -8.609062194824219, "global_step": 61353, "epoch": 365} {"train_loss": -8.642945289611816, "global_step": 61354, "epoch": 365} {"train_loss": -8.943849563598633, "global_step": 61355, "epoch": 365} {"train_loss": -8.511624336242676, "global_step": 61356, "epoch": 365} {"train_loss": -8.742706298828125, "global_step": 61357, "epoch": 365} {"train_loss": -9.169839859008789, "global_step": 61358, "epoch": 365} {"train_loss": -8.545757293701172, "global_step": 61359, "epoch": 365} {"train_loss": -8.727446556091309, "global_step": 61360, "epoch": 365} {"train_loss": -8.682482719421387, "global_step": 61361, "epoch": 365} {"train_loss": -8.805929183959961, "global_step": 61362, "epoch": 365} {"train_loss": -8.736251831054688, "global_step": 61363, "epoch": 365} {"train_loss": -8.926321029663086, "global_step": 61364, "epoch": 365} {"train_loss": -8.44261360168457, "global_step": 61365, "epoch": 365} {"train_loss": -8.543022155761719, "global_step": 61366, "epoch": 365} {"train_loss": -8.540074348449707, "global_step": 61367, "epoch": 365} {"train_loss": -8.124866485595703, "global_step": 61368, "epoch": 365} {"train_loss": -8.308135032653809, "global_step": 61369, "epoch": 365} {"train_loss": -8.053940773010254, "global_step": 61370, "epoch": 365} {"train_loss": -7.778604507446289, "global_step": 61371, "epoch": 365} {"train_loss": -8.285158157348633, "global_step": 61372, "epoch": 365} {"train_loss": -8.228079795837402, "global_step": 61373, "epoch": 365} {"train_loss": -7.946035385131836, "global_step": 61374, "epoch": 365} {"train_loss": -8.233930587768555, "global_step": 61375, "epoch": 365} {"train_loss": -8.592018127441406, "global_step": 61376, "epoch": 365} {"train_loss": -8.142641067504883, "global_step": 61377, "epoch": 365} {"train_loss": -8.004169464111328, "global_step": 61378, "epoch": 365} {"train_loss": -8.394054412841797, "global_step": 61379, "epoch": 365} {"train_loss": -8.466358184814453, "global_step": 61380, "epoch": 365} {"train_loss": -8.436588287353516, "global_step": 61381, "epoch": 365} {"train_loss": -8.403636932373047, "global_step": 61382, "epoch": 365} {"train_loss": -8.405997276306152, "global_step": 61383, "epoch": 365} {"train_loss": -8.46109390258789, "global_step": 61384, "epoch": 365} {"train_loss": -8.446120262145996, "global_step": 61385, "epoch": 365} {"train_loss": -8.397933959960938, "global_step": 61386, "epoch": 365} {"train_loss": -8.395772933959961, "global_step": 61387, "epoch": 365} {"train_loss": -8.364919662475586, "global_step": 61388, "epoch": 365} {"train_loss": -8.61430549621582, "global_step": 61389, "epoch": 365} {"train_loss": -8.324929237365723, "global_step": 61390, "epoch": 365} {"train_loss": -8.44980525970459, "global_step": 61391, "epoch": 365} {"train_loss": -8.586099624633789, "global_step": 61392, "epoch": 365} {"train_loss": -8.557875633239746, "global_step": 61393, "epoch": 365} {"train_loss": -8.529350280761719, "global_step": 61394, "epoch": 365} {"train_loss": -8.558530807495117, "global_step": 61395, "epoch": 365} {"train_loss": -8.665903091430664, "global_step": 61396, "epoch": 365} {"train_loss": -8.84476089477539, "global_step": 61397, "epoch": 365} {"train_loss": -8.599638938903809, "global_step": 61398, "epoch": 365} {"train_loss": -8.616976737976074, "global_step": 61399, "epoch": 365} {"train_loss": -8.632464408874512, "global_step": 61400, "epoch": 365} {"train_loss": -8.642752647399902, "global_step": 61401, "epoch": 365} {"train_loss": -8.579976081848145, "global_step": 61402, "epoch": 365} {"train_loss": -8.669303894042969, "global_step": 61403, "epoch": 365} {"train_loss": -8.732012748718262, "global_step": 61404, "epoch": 365} {"train_loss": -8.762395858764648, "global_step": 61405, "epoch": 365} {"train_loss": -8.60930061340332, "global_step": 61406, "epoch": 365} {"train_loss": -8.62907600402832, "global_step": 61407, "epoch": 365} {"train_loss": -8.26593017578125, "global_step": 61408, "epoch": 365} {"train_loss": -8.37108325958252, "global_step": 61409, "epoch": 365} {"train_loss": -8.6381196975708, "global_step": 61410, "epoch": 365} {"train_loss": -8.389217376708984, "global_step": 61411, "epoch": 365} {"train_loss": -8.533702850341797, "global_step": 61412, "epoch": 365} {"train_loss": -8.3148193359375, "global_step": 61413, "epoch": 365} {"train_loss": -8.542028427124023, "global_step": 61414, "epoch": 365} {"train_loss": -8.510882377624512, "global_step": 61415, "epoch": 365} {"train_loss": -8.542865753173828, "global_step": 61416, "epoch": 365} {"train_loss": -8.457239151000977, "global_step": 61417, "epoch": 365} {"train_loss": -8.604621887207031, "global_step": 61418, "epoch": 365} {"train_loss": -8.735240936279297, "global_step": 61419, "epoch": 365} {"train_loss": -8.50723648071289, "global_step": 61420, "epoch": 365} {"train_loss": -8.505937576293945, "global_step": 61421, "epoch": 365} {"train_loss": -8.531290054321289, "global_step": 61422, "epoch": 365} {"train_loss": -8.73342514038086, "global_step": 61423, "epoch": 365} {"train_loss": -8.595514297485352, "global_step": 61424, "epoch": 365} {"train_loss": -8.704137802124023, "global_step": 61425, "epoch": 365} {"train_loss": -8.516514778137207, "global_step": 61426, "epoch": 365} {"train_loss": -8.6740140914917, "global_step": 61427, "epoch": 365} {"train_loss": -8.774930953979492, "global_step": 61428, "epoch": 365} {"train_loss": -8.579200744628906, "global_step": 61429, "epoch": 365} {"train_loss": -8.641986846923828, "global_step": 61430, "epoch": 365} {"train_loss": -8.400968551635742, "global_step": 61431, "epoch": 365} {"train_loss": -8.858590126037598, "global_step": 61432, "epoch": 365} {"train_loss": -8.078266143798828, "global_step": 61433, "epoch": 365} {"train_loss": -8.77635383605957, "global_step": 61434, "epoch": 365} {"train_loss": -8.683874130249023, "global_step": 61435, "epoch": 365} {"train_loss": -8.642242431640625, "global_step": 61436, "epoch": 365} {"train_loss": -8.77599048614502, "global_step": 61437, "epoch": 365} {"train_loss": -8.654343605041504, "global_step": 61438, "epoch": 365} {"train_loss": -8.67172622680664, "global_step": 61439, "epoch": 365} {"train_loss": -8.703348159790039, "global_step": 61440, "epoch": 365} {"train_loss": -8.790410995483398, "global_step": 61441, "epoch": 365} {"train_loss": -8.669918060302734, "global_step": 61442, "epoch": 365} {"train_loss": -8.735156059265137, "global_step": 61443, "epoch": 365} {"train_loss": -8.691522598266602, "global_step": 61444, "epoch": 365} {"train_loss": -8.934965133666992, "global_step": 61445, "epoch": 365} {"train_loss": -8.512676239013672, "global_step": 61446, "epoch": 365} {"train_loss": -8.93321418762207, "global_step": 61447, "epoch": 365} {"train_loss": -8.771224975585938, "global_step": 61448, "epoch": 365} {"train_loss": -8.498701095581055, "global_step": 61449, "epoch": 365} {"train_loss": -8.863142967224121, "global_step": 61450, "epoch": 365} {"train_loss": -8.840812683105469, "global_step": 61451, "epoch": 365} {"train_loss": -8.610635757446289, "global_step": 61452, "epoch": 365} {"train_loss": -8.88354778289795, "global_step": 61453, "epoch": 365} {"train_loss": -8.782182693481445, "global_step": 61454, "epoch": 365} {"train_loss": -8.356389045715332, "global_step": 61455, "epoch": 365} {"train_loss": -8.682348251342773, "global_step": 61456, "epoch": 365} {"train_loss": -8.559776306152344, "global_step": 61457, "epoch": 365} {"train_loss": -8.718751907348633, "global_step": 61458, "epoch": 365} {"train_loss": -8.583373069763184, "global_step": 61459, "epoch": 365} {"train_loss": -8.786561965942383, "global_step": 61460, "epoch": 365} {"train_loss": -8.776799201965332, "global_step": 61461, "epoch": 365} {"train_loss": -8.801767349243164, "global_step": 61462, "epoch": 365} {"train_loss": -8.782816886901855, "global_step": 61463, "epoch": 365} {"train_loss": -8.643401145935059, "global_step": 61464, "epoch": 365} {"train_loss": -8.426029205322266, "global_step": 61465, "epoch": 365} {"train_loss": -8.713781356811523, "global_step": 61466, "epoch": 365} {"train_loss": -8.571859359741211, "global_step": 61467, "epoch": 365} {"train_loss": -8.374151229858398, "global_step": 61468, "epoch": 365} {"train_loss": -8.688745498657227, "global_step": 61469, "epoch": 365} {"train_loss": -8.786334991455078, "global_step": 61470, "epoch": 365} {"train_loss": -8.770018577575684, "global_step": 61471, "epoch": 365} {"train_loss": -8.260625839233398, "global_step": 61472, "epoch": 365} {"train_loss": -8.789146423339844, "global_step": 61473, "epoch": 365} {"train_loss": -8.575197219848633, "global_step": 61474, "epoch": 365} {"train_loss": -8.757704734802246, "global_step": 61475, "epoch": 365} {"train_loss": -8.519014358520508, "global_step": 61476, "epoch": 365} {"train_loss": -8.824167251586914, "global_step": 61477, "epoch": 365} {"train_loss": -8.691030502319336, "global_step": 61478, "epoch": 365} {"train_loss": -8.773197174072266, "global_step": 61479, "epoch": 365} {"train_loss": -8.775574684143066, "global_step": 61480, "epoch": 365} {"train_loss": -8.898701667785645, "global_step": 61481, "epoch": 365} {"train_loss": -8.651659965515137, "global_step": 61482, "epoch": 365} {"train_loss": -8.620645523071289, "global_step": 61483, "epoch": 365} {"train_loss": -8.524137496948242, "global_step": 61484, "epoch": 365} {"train_loss": -8.658853530883789, "global_step": 61485, "epoch": 365} {"train_loss": -8.620706558227539, "global_step": 61486, "epoch": 365} {"train_loss": -8.599566050938197, "global_step": 61487, "epoch": 365, "val_loss": 189562.96875, "train_action_mse_error": 10.050806045532227} {"train_loss": -8.684659957885742, "global_step": 61488, "epoch": 366} {"train_loss": -8.711845397949219, "global_step": 61489, "epoch": 366} {"train_loss": -8.761053085327148, "global_step": 61490, "epoch": 366} {"train_loss": -8.358591079711914, "global_step": 61491, "epoch": 366} {"train_loss": -8.61867618560791, "global_step": 61492, "epoch": 366} {"train_loss": -8.430058479309082, "global_step": 61493, "epoch": 366} {"train_loss": -8.70036506652832, "global_step": 61494, "epoch": 366} {"train_loss": -8.707746505737305, "global_step": 61495, "epoch": 366} {"train_loss": -8.60406494140625, "global_step": 61496, "epoch": 366} {"train_loss": -8.724998474121094, "global_step": 61497, "epoch": 366} {"train_loss": -8.48875617980957, "global_step": 61498, "epoch": 366} {"train_loss": -8.753286361694336, "global_step": 61499, "epoch": 366} {"train_loss": -8.684560775756836, "global_step": 61500, "epoch": 366} {"train_loss": -8.649288177490234, "global_step": 61501, "epoch": 366} {"train_loss": -8.417936325073242, "global_step": 61502, "epoch": 366} {"train_loss": -8.712117195129395, "global_step": 61503, "epoch": 366} {"train_loss": -8.670564651489258, "global_step": 61504, "epoch": 366} {"train_loss": -8.657249450683594, "global_step": 61505, "epoch": 366} {"train_loss": -8.820430755615234, "global_step": 61506, "epoch": 366} {"train_loss": -8.576326370239258, "global_step": 61507, "epoch": 366} {"train_loss": -8.81645393371582, "global_step": 61508, "epoch": 366} {"train_loss": -8.574732780456543, "global_step": 61509, "epoch": 366} {"train_loss": -8.637791633605957, "global_step": 61510, "epoch": 366} {"train_loss": -8.82359504699707, "global_step": 61511, "epoch": 366} {"train_loss": -8.885851860046387, "global_step": 61512, "epoch": 366} {"train_loss": -8.792540550231934, "global_step": 61513, "epoch": 366} {"train_loss": -8.75503921508789, "global_step": 61514, "epoch": 366} {"train_loss": -8.735239028930664, "global_step": 61515, "epoch": 366} {"train_loss": -8.39787483215332, "global_step": 61516, "epoch": 366} {"train_loss": -8.591649055480957, "global_step": 61517, "epoch": 366} {"train_loss": -8.860441207885742, "global_step": 61518, "epoch": 366} {"train_loss": -8.866584777832031, "global_step": 61519, "epoch": 366} {"train_loss": -8.672161102294922, "global_step": 61520, "epoch": 366} {"train_loss": -8.840599060058594, "global_step": 61521, "epoch": 366} {"train_loss": -9.044290542602539, "global_step": 61522, "epoch": 366} {"train_loss": -8.896768569946289, "global_step": 61523, "epoch": 366} {"train_loss": -8.781265258789062, "global_step": 61524, "epoch": 366} {"train_loss": -8.802152633666992, "global_step": 61525, "epoch": 366} {"train_loss": -8.79518985748291, "global_step": 61526, "epoch": 366} {"train_loss": -8.983123779296875, "global_step": 61527, "epoch": 366} {"train_loss": -8.564722061157227, "global_step": 61528, "epoch": 366} {"train_loss": -8.412631034851074, "global_step": 61529, "epoch": 366} {"train_loss": -8.741677284240723, "global_step": 61530, "epoch": 366} {"train_loss": -8.330928802490234, "global_step": 61531, "epoch": 366} {"train_loss": -8.345213890075684, "global_step": 61532, "epoch": 366} {"train_loss": -8.703378677368164, "global_step": 61533, "epoch": 366} {"train_loss": -8.359691619873047, "global_step": 61534, "epoch": 366} {"train_loss": -8.58635139465332, "global_step": 61535, "epoch": 366} {"train_loss": -8.754334449768066, "global_step": 61536, "epoch": 366} {"train_loss": -8.699039459228516, "global_step": 61537, "epoch": 366} {"train_loss": -8.396665573120117, "global_step": 61538, "epoch": 366} {"train_loss": -8.828547477722168, "global_step": 61539, "epoch": 366} {"train_loss": -8.507694244384766, "global_step": 61540, "epoch": 366} {"train_loss": -8.641355514526367, "global_step": 61541, "epoch": 366} {"train_loss": -8.585298538208008, "global_step": 61542, "epoch": 366} {"train_loss": -8.597972869873047, "global_step": 61543, "epoch": 366} {"train_loss": -8.519306182861328, "global_step": 61544, "epoch": 366} {"train_loss": -8.372323036193848, "global_step": 61545, "epoch": 366} {"train_loss": -8.548759460449219, "global_step": 61546, "epoch": 366} {"train_loss": -8.425983428955078, "global_step": 61547, "epoch": 366} {"train_loss": -8.666461944580078, "global_step": 61548, "epoch": 366} {"train_loss": -8.541999816894531, "global_step": 61549, "epoch": 366} {"train_loss": -8.773218154907227, "global_step": 61550, "epoch": 366} {"train_loss": -8.709938049316406, "global_step": 61551, "epoch": 366} {"train_loss": -8.682311058044434, "global_step": 61552, "epoch": 366} {"train_loss": -8.820724487304688, "global_step": 61553, "epoch": 366} {"train_loss": -8.695775032043457, "global_step": 61554, "epoch": 366} {"train_loss": -8.483482360839844, "global_step": 61555, "epoch": 366} {"train_loss": -8.922205924987793, "global_step": 61556, "epoch": 366} {"train_loss": -8.51541519165039, "global_step": 61557, "epoch": 366} {"train_loss": -8.81113052368164, "global_step": 61558, "epoch": 366} {"train_loss": -8.637277603149414, "global_step": 61559, "epoch": 366} {"train_loss": -8.967477798461914, "global_step": 61560, "epoch": 366} {"train_loss": -8.364492416381836, "global_step": 61561, "epoch": 366} {"train_loss": -8.821578979492188, "global_step": 61562, "epoch": 366} {"train_loss": -8.894608497619629, "global_step": 61563, "epoch": 366} {"train_loss": -8.807785034179688, "global_step": 61564, "epoch": 366} {"train_loss": -8.836050033569336, "global_step": 61565, "epoch": 366} {"train_loss": -8.838079452514648, "global_step": 61566, "epoch": 366} {"train_loss": -8.784732818603516, "global_step": 61567, "epoch": 366} {"train_loss": -8.901320457458496, "global_step": 61568, "epoch": 366} {"train_loss": -8.828681945800781, "global_step": 61569, "epoch": 366} {"train_loss": -8.514866828918457, "global_step": 61570, "epoch": 366} {"train_loss": -8.804407119750977, "global_step": 61571, "epoch": 366} {"train_loss": -8.678655624389648, "global_step": 61572, "epoch": 366} {"train_loss": -8.615434646606445, "global_step": 61573, "epoch": 366} {"train_loss": -8.818153381347656, "global_step": 61574, "epoch": 366} {"train_loss": -8.614265441894531, "global_step": 61575, "epoch": 366} {"train_loss": -8.873506546020508, "global_step": 61576, "epoch": 366} {"train_loss": -8.49882984161377, "global_step": 61577, "epoch": 366} {"train_loss": -8.57304573059082, "global_step": 61578, "epoch": 366} {"train_loss": -8.774219512939453, "global_step": 61579, "epoch": 366} {"train_loss": -8.804681777954102, "global_step": 61580, "epoch": 366} {"train_loss": -8.859960556030273, "global_step": 61581, "epoch": 366} {"train_loss": -9.004175186157227, "global_step": 61582, "epoch": 366} {"train_loss": -8.66811752319336, "global_step": 61583, "epoch": 366} {"train_loss": -8.713335037231445, "global_step": 61584, "epoch": 366} {"train_loss": -8.883055686950684, "global_step": 61585, "epoch": 366} {"train_loss": -8.695014953613281, "global_step": 61586, "epoch": 366} {"train_loss": -9.184229850769043, "global_step": 61587, "epoch": 366} {"train_loss": -8.765443801879883, "global_step": 61588, "epoch": 366} {"train_loss": -8.773439407348633, "global_step": 61589, "epoch": 366} {"train_loss": -8.939379692077637, "global_step": 61590, "epoch": 366} {"train_loss": -8.675336837768555, "global_step": 61591, "epoch": 366} {"train_loss": -8.835567474365234, "global_step": 61592, "epoch": 366} {"train_loss": -8.886638641357422, "global_step": 61593, "epoch": 366} {"train_loss": -8.809209823608398, "global_step": 61594, "epoch": 366} {"train_loss": -8.377878189086914, "global_step": 61595, "epoch": 366} {"train_loss": -8.810232162475586, "global_step": 61596, "epoch": 366} {"train_loss": -8.956512451171875, "global_step": 61597, "epoch": 366} {"train_loss": -8.514509201049805, "global_step": 61598, "epoch": 366} {"train_loss": -8.566947937011719, "global_step": 61599, "epoch": 366} {"train_loss": -8.334999084472656, "global_step": 61600, "epoch": 366} {"train_loss": -8.677300453186035, "global_step": 61601, "epoch": 366} {"train_loss": -8.876937866210938, "global_step": 61602, "epoch": 366} {"train_loss": -8.68356704711914, "global_step": 61603, "epoch": 366} {"train_loss": -8.721700668334961, "global_step": 61604, "epoch": 366} {"train_loss": -8.763496398925781, "global_step": 61605, "epoch": 366} {"train_loss": -8.525931358337402, "global_step": 61606, "epoch": 366} {"train_loss": -8.561060905456543, "global_step": 61607, "epoch": 366} {"train_loss": -8.851276397705078, "global_step": 61608, "epoch": 366} {"train_loss": -8.462545394897461, "global_step": 61609, "epoch": 366} {"train_loss": -8.536287307739258, "global_step": 61610, "epoch": 366} {"train_loss": -8.823741912841797, "global_step": 61611, "epoch": 366} {"train_loss": -8.708953857421875, "global_step": 61612, "epoch": 366} {"train_loss": -8.777883529663086, "global_step": 61613, "epoch": 366} {"train_loss": -8.67931842803955, "global_step": 61614, "epoch": 366} {"train_loss": -8.585376739501953, "global_step": 61615, "epoch": 366} {"train_loss": -8.829476356506348, "global_step": 61616, "epoch": 366} {"train_loss": -8.447019577026367, "global_step": 61617, "epoch": 366} {"train_loss": -8.68954086303711, "global_step": 61618, "epoch": 366} {"train_loss": -8.507118225097656, "global_step": 61619, "epoch": 366} {"train_loss": -8.707664489746094, "global_step": 61620, "epoch": 366} {"train_loss": -8.703582763671875, "global_step": 61621, "epoch": 366} {"train_loss": -8.692126274108887, "global_step": 61622, "epoch": 366} {"train_loss": -8.333327293395996, "global_step": 61623, "epoch": 366} {"train_loss": -8.700551986694336, "global_step": 61624, "epoch": 366} {"train_loss": -8.46053695678711, "global_step": 61625, "epoch": 366} {"train_loss": -8.688331604003906, "global_step": 61626, "epoch": 366} {"train_loss": -8.458452224731445, "global_step": 61627, "epoch": 366} {"train_loss": -8.879596710205078, "global_step": 61628, "epoch": 366} {"train_loss": -8.700275421142578, "global_step": 61629, "epoch": 366} {"train_loss": -8.801551818847656, "global_step": 61630, "epoch": 366} {"train_loss": -8.94393253326416, "global_step": 61631, "epoch": 366} {"train_loss": -8.748634338378906, "global_step": 61632, "epoch": 366} {"train_loss": -8.819648742675781, "global_step": 61633, "epoch": 366} {"train_loss": -8.798011779785156, "global_step": 61634, "epoch": 366} {"train_loss": -8.824506759643555, "global_step": 61635, "epoch": 366} {"train_loss": -8.768301963806152, "global_step": 61636, "epoch": 366} {"train_loss": -9.003503799438477, "global_step": 61637, "epoch": 366} {"train_loss": -8.723912239074707, "global_step": 61638, "epoch": 366} {"train_loss": -8.943560600280762, "global_step": 61639, "epoch": 366} {"train_loss": -8.855575561523438, "global_step": 61640, "epoch": 366} {"train_loss": -8.706616401672363, "global_step": 61641, "epoch": 366} {"train_loss": -9.056049346923828, "global_step": 61642, "epoch": 366} {"train_loss": -8.613685607910156, "global_step": 61643, "epoch": 366} {"train_loss": -8.897863388061523, "global_step": 61644, "epoch": 366} {"train_loss": -8.722465515136719, "global_step": 61645, "epoch": 366} {"train_loss": -8.976095199584961, "global_step": 61646, "epoch": 366} {"train_loss": -9.01702880859375, "global_step": 61647, "epoch": 366} {"train_loss": -8.874093055725098, "global_step": 61648, "epoch": 366} {"train_loss": -8.909997940063477, "global_step": 61649, "epoch": 366} {"train_loss": -8.730934143066406, "global_step": 61650, "epoch": 366} {"train_loss": -8.682838439941406, "global_step": 61651, "epoch": 366} {"train_loss": -8.703129768371582, "global_step": 61652, "epoch": 366} {"train_loss": -8.680976867675781, "global_step": 61653, "epoch": 366} {"train_loss": -8.662630081176758, "global_step": 61654, "epoch": 366} {"train_loss": -8.701317395482745, "global_step": 61655, "epoch": 366, "val_loss": 189763.875} {"train_loss": -8.568838119506836, "global_step": 61656, "epoch": 367} {"train_loss": -8.613618850708008, "global_step": 61657, "epoch": 367} {"train_loss": -8.524927139282227, "global_step": 61658, "epoch": 367} {"train_loss": -8.358260154724121, "global_step": 61659, "epoch": 367} {"train_loss": -8.564715385437012, "global_step": 61660, "epoch": 367} {"train_loss": -8.450636863708496, "global_step": 61661, "epoch": 367} {"train_loss": -8.467361450195312, "global_step": 61662, "epoch": 367} {"train_loss": -8.3677339553833, "global_step": 61663, "epoch": 367} {"train_loss": -8.447651863098145, "global_step": 61664, "epoch": 367} {"train_loss": -8.401532173156738, "global_step": 61665, "epoch": 367} {"train_loss": -8.354584693908691, "global_step": 61666, "epoch": 367} {"train_loss": -8.365510940551758, "global_step": 61667, "epoch": 367} {"train_loss": -8.49782657623291, "global_step": 61668, "epoch": 367} {"train_loss": -8.535270690917969, "global_step": 61669, "epoch": 367} {"train_loss": -8.304449081420898, "global_step": 61670, "epoch": 367} {"train_loss": -8.61214542388916, "global_step": 61671, "epoch": 367} {"train_loss": -8.367521286010742, "global_step": 61672, "epoch": 367} {"train_loss": -8.58128547668457, "global_step": 61673, "epoch": 367} {"train_loss": -8.437470436096191, "global_step": 61674, "epoch": 367} {"train_loss": -8.58009147644043, "global_step": 61675, "epoch": 367} {"train_loss": -8.351305961608887, "global_step": 61676, "epoch": 367} {"train_loss": -8.736111640930176, "global_step": 61677, "epoch": 367} {"train_loss": -8.591062545776367, "global_step": 61678, "epoch": 367} {"train_loss": -8.642199516296387, "global_step": 61679, "epoch": 367} {"train_loss": -8.578262329101562, "global_step": 61680, "epoch": 367} {"train_loss": -8.508947372436523, "global_step": 61681, "epoch": 367} {"train_loss": -8.60118293762207, "global_step": 61682, "epoch": 367} {"train_loss": -8.455401420593262, "global_step": 61683, "epoch": 367} {"train_loss": -8.701624870300293, "global_step": 61684, "epoch": 367} {"train_loss": -8.483359336853027, "global_step": 61685, "epoch": 367} {"train_loss": -8.61935043334961, "global_step": 61686, "epoch": 367} {"train_loss": -8.723867416381836, "global_step": 61687, "epoch": 367} {"train_loss": -8.694828033447266, "global_step": 61688, "epoch": 367} {"train_loss": -8.515273094177246, "global_step": 61689, "epoch": 367} {"train_loss": -8.873111724853516, "global_step": 61690, "epoch": 367} {"train_loss": -8.35517406463623, "global_step": 61691, "epoch": 367} {"train_loss": -8.713861465454102, "global_step": 61692, "epoch": 367} {"train_loss": -8.674701690673828, "global_step": 61693, "epoch": 367} {"train_loss": -8.742025375366211, "global_step": 61694, "epoch": 367} {"train_loss": -8.563825607299805, "global_step": 61695, "epoch": 367} {"train_loss": -8.925987243652344, "global_step": 61696, "epoch": 367} {"train_loss": -8.387619018554688, "global_step": 61697, "epoch": 367} {"train_loss": -8.686885833740234, "global_step": 61698, "epoch": 367} {"train_loss": -8.365778923034668, "global_step": 61699, "epoch": 367} {"train_loss": -8.6641845703125, "global_step": 61700, "epoch": 367} {"train_loss": -8.399730682373047, "global_step": 61701, "epoch": 367} {"train_loss": -8.788579940795898, "global_step": 61702, "epoch": 367} {"train_loss": -8.567644119262695, "global_step": 61703, "epoch": 367} {"train_loss": -8.87158203125, "global_step": 61704, "epoch": 367} {"train_loss": -8.91503620147705, "global_step": 61705, "epoch": 367} {"train_loss": -8.837723731994629, "global_step": 61706, "epoch": 367} {"train_loss": -8.604997634887695, "global_step": 61707, "epoch": 367} {"train_loss": -8.684026718139648, "global_step": 61708, "epoch": 367} {"train_loss": -8.666057586669922, "global_step": 61709, "epoch": 367} {"train_loss": -8.761631965637207, "global_step": 61710, "epoch": 367} {"train_loss": -8.746386528015137, "global_step": 61711, "epoch": 367} {"train_loss": -8.477946281433105, "global_step": 61712, "epoch": 367} {"train_loss": -8.606754302978516, "global_step": 61713, "epoch": 367} {"train_loss": -8.813671112060547, "global_step": 61714, "epoch": 367} {"train_loss": -8.65048599243164, "global_step": 61715, "epoch": 367} {"train_loss": -8.718111038208008, "global_step": 61716, "epoch": 367} {"train_loss": -8.560819625854492, "global_step": 61717, "epoch": 367} {"train_loss": -8.824747085571289, "global_step": 61718, "epoch": 367} {"train_loss": -8.816352844238281, "global_step": 61719, "epoch": 367} {"train_loss": -8.629154205322266, "global_step": 61720, "epoch": 367} {"train_loss": -8.57783031463623, "global_step": 61721, "epoch": 367} {"train_loss": -8.898160934448242, "global_step": 61722, "epoch": 367} {"train_loss": -8.534748077392578, "global_step": 61723, "epoch": 367} {"train_loss": -8.690069198608398, "global_step": 61724, "epoch": 367} {"train_loss": -8.52365493774414, "global_step": 61725, "epoch": 367} {"train_loss": -8.687199592590332, "global_step": 61726, "epoch": 367} {"train_loss": -8.366155624389648, "global_step": 61727, "epoch": 367} {"train_loss": -9.018983840942383, "global_step": 61728, "epoch": 367} {"train_loss": -8.819836616516113, "global_step": 61729, "epoch": 367} {"train_loss": -8.844688415527344, "global_step": 61730, "epoch": 367} {"train_loss": -8.522740364074707, "global_step": 61731, "epoch": 367} {"train_loss": -8.707658767700195, "global_step": 61732, "epoch": 367} {"train_loss": -8.596870422363281, "global_step": 61733, "epoch": 367} {"train_loss": -8.690478324890137, "global_step": 61734, "epoch": 367} {"train_loss": -8.688335418701172, "global_step": 61735, "epoch": 367} {"train_loss": -8.67642593383789, "global_step": 61736, "epoch": 367} {"train_loss": -8.842251777648926, "global_step": 61737, "epoch": 367} {"train_loss": -9.087516784667969, "global_step": 61738, "epoch": 367} {"train_loss": -8.90497875213623, "global_step": 61739, "epoch": 367} {"train_loss": -8.878782272338867, "global_step": 61740, "epoch": 367} {"train_loss": -9.007684707641602, "global_step": 61741, "epoch": 367} {"train_loss": -8.7593994140625, "global_step": 61742, "epoch": 367} {"train_loss": -8.991629600524902, "global_step": 61743, "epoch": 367} {"train_loss": -8.762588500976562, "global_step": 61744, "epoch": 367} {"train_loss": -8.92007827758789, "global_step": 61745, "epoch": 367} {"train_loss": -8.760847091674805, "global_step": 61746, "epoch": 367} {"train_loss": -8.603531837463379, "global_step": 61747, "epoch": 367} {"train_loss": -9.008718490600586, "global_step": 61748, "epoch": 367} {"train_loss": -8.757132530212402, "global_step": 61749, "epoch": 367} {"train_loss": -8.807766914367676, "global_step": 61750, "epoch": 367} {"train_loss": -8.401235580444336, "global_step": 61751, "epoch": 367} {"train_loss": -8.982152938842773, "global_step": 61752, "epoch": 367} {"train_loss": -8.652494430541992, "global_step": 61753, "epoch": 367} {"train_loss": -8.540749549865723, "global_step": 61754, "epoch": 367} {"train_loss": -8.906240463256836, "global_step": 61755, "epoch": 367} {"train_loss": -8.293562889099121, "global_step": 61756, "epoch": 367} {"train_loss": -8.729822158813477, "global_step": 61757, "epoch": 367} {"train_loss": -8.176267623901367, "global_step": 61758, "epoch": 367} {"train_loss": -8.777142524719238, "global_step": 61759, "epoch": 367} {"train_loss": -8.478424072265625, "global_step": 61760, "epoch": 367} {"train_loss": -8.85770320892334, "global_step": 61761, "epoch": 367} {"train_loss": -8.470365524291992, "global_step": 61762, "epoch": 367} {"train_loss": -8.732759475708008, "global_step": 61763, "epoch": 367} {"train_loss": -8.71798324584961, "global_step": 61764, "epoch": 367} {"train_loss": -8.652521133422852, "global_step": 61765, "epoch": 367} {"train_loss": -8.684499740600586, "global_step": 61766, "epoch": 367} {"train_loss": -8.76974105834961, "global_step": 61767, "epoch": 367} {"train_loss": -8.440343856811523, "global_step": 61768, "epoch": 367} {"train_loss": -8.468133926391602, "global_step": 61769, "epoch": 367} {"train_loss": -8.6979398727417, "global_step": 61770, "epoch": 367} {"train_loss": -8.230402946472168, "global_step": 61771, "epoch": 367} {"train_loss": -8.697610855102539, "global_step": 61772, "epoch": 367} {"train_loss": -8.726198196411133, "global_step": 61773, "epoch": 367} {"train_loss": -8.775917053222656, "global_step": 61774, "epoch": 367} {"train_loss": -8.584508895874023, "global_step": 61775, "epoch": 367} {"train_loss": -8.52399730682373, "global_step": 61776, "epoch": 367} {"train_loss": -8.592105865478516, "global_step": 61777, "epoch": 367} {"train_loss": -8.53891372680664, "global_step": 61778, "epoch": 367} {"train_loss": -8.674905776977539, "global_step": 61779, "epoch": 367} {"train_loss": -8.386846542358398, "global_step": 61780, "epoch": 367} {"train_loss": -8.377601623535156, "global_step": 61781, "epoch": 367} {"train_loss": -8.698220252990723, "global_step": 61782, "epoch": 367} {"train_loss": -8.590666770935059, "global_step": 61783, "epoch": 367} {"train_loss": -8.788003921508789, "global_step": 61784, "epoch": 367} {"train_loss": -8.775609016418457, "global_step": 61785, "epoch": 367} {"train_loss": -8.659570693969727, "global_step": 61786, "epoch": 367} {"train_loss": -8.710488319396973, "global_step": 61787, "epoch": 367} {"train_loss": -8.63756275177002, "global_step": 61788, "epoch": 367} {"train_loss": -8.691598892211914, "global_step": 61789, "epoch": 367} {"train_loss": -8.829404830932617, "global_step": 61790, "epoch": 367} {"train_loss": -8.68454360961914, "global_step": 61791, "epoch": 367} {"train_loss": -8.706399917602539, "global_step": 61792, "epoch": 367} {"train_loss": -8.787185668945312, "global_step": 61793, "epoch": 367} {"train_loss": -8.807767868041992, "global_step": 61794, "epoch": 367} {"train_loss": -8.838823318481445, "global_step": 61795, "epoch": 367} {"train_loss": -9.117971420288086, "global_step": 61796, "epoch": 367} {"train_loss": -8.940227508544922, "global_step": 61797, "epoch": 367} {"train_loss": -8.786060333251953, "global_step": 61798, "epoch": 367} {"train_loss": -8.992656707763672, "global_step": 61799, "epoch": 367} {"train_loss": -8.9639892578125, "global_step": 61800, "epoch": 367} {"train_loss": -8.642799377441406, "global_step": 61801, "epoch": 367} {"train_loss": -8.672282218933105, "global_step": 61802, "epoch": 367} {"train_loss": -8.954059600830078, "global_step": 61803, "epoch": 367} {"train_loss": -8.842527389526367, "global_step": 61804, "epoch": 367} {"train_loss": -8.919218063354492, "global_step": 61805, "epoch": 367} {"train_loss": -8.639592170715332, "global_step": 61806, "epoch": 367} {"train_loss": -8.683333396911621, "global_step": 61807, "epoch": 367} {"train_loss": -8.846214294433594, "global_step": 61808, "epoch": 367} {"train_loss": -8.813102722167969, "global_step": 61809, "epoch": 367} {"train_loss": -8.897977828979492, "global_step": 61810, "epoch": 367} {"train_loss": -8.553820610046387, "global_step": 61811, "epoch": 367} {"train_loss": -8.751764297485352, "global_step": 61812, "epoch": 367} {"train_loss": -8.858455657958984, "global_step": 61813, "epoch": 367} {"train_loss": -8.582595825195312, "global_step": 61814, "epoch": 367} {"train_loss": -8.739283561706543, "global_step": 61815, "epoch": 367} {"train_loss": -8.89242935180664, "global_step": 61816, "epoch": 367} {"train_loss": -8.561279296875, "global_step": 61817, "epoch": 367} {"train_loss": -8.664194107055664, "global_step": 61818, "epoch": 367} {"train_loss": -8.829050064086914, "global_step": 61819, "epoch": 367} {"train_loss": -8.48237419128418, "global_step": 61820, "epoch": 367} {"train_loss": -8.550399780273438, "global_step": 61821, "epoch": 367} {"train_loss": -8.541404724121094, "global_step": 61822, "epoch": 367} {"train_loss": -8.662300836472284, "global_step": 61823, "epoch": 367, "val_loss": 190318.484375} {"train_loss": -8.317182540893555, "global_step": 61824, "epoch": 368} {"train_loss": -8.190423965454102, "global_step": 61825, "epoch": 368} {"train_loss": -8.688422203063965, "global_step": 61826, "epoch": 368} {"train_loss": -8.15895938873291, "global_step": 61827, "epoch": 368} {"train_loss": -8.3986177444458, "global_step": 61828, "epoch": 368} {"train_loss": -8.59040641784668, "global_step": 61829, "epoch": 368} {"train_loss": -8.223949432373047, "global_step": 61830, "epoch": 368} {"train_loss": -8.36864948272705, "global_step": 61831, "epoch": 368} {"train_loss": -8.544960975646973, "global_step": 61832, "epoch": 368} {"train_loss": -8.668303489685059, "global_step": 61833, "epoch": 368} {"train_loss": -8.394861221313477, "global_step": 61834, "epoch": 368} {"train_loss": -8.311139106750488, "global_step": 61835, "epoch": 368} {"train_loss": -8.528762817382812, "global_step": 61836, "epoch": 368} {"train_loss": -8.365704536437988, "global_step": 61837, "epoch": 368} {"train_loss": -8.528154373168945, "global_step": 61838, "epoch": 368} {"train_loss": -8.589827537536621, "global_step": 61839, "epoch": 368} {"train_loss": -8.725995063781738, "global_step": 61840, "epoch": 368} {"train_loss": -8.583495140075684, "global_step": 61841, "epoch": 368} {"train_loss": -8.6146879196167, "global_step": 61842, "epoch": 368} {"train_loss": -8.478178977966309, "global_step": 61843, "epoch": 368} {"train_loss": -8.536205291748047, "global_step": 61844, "epoch": 368} {"train_loss": -8.501945495605469, "global_step": 61845, "epoch": 368} {"train_loss": -8.296302795410156, "global_step": 61846, "epoch": 368} {"train_loss": -8.490772247314453, "global_step": 61847, "epoch": 368} {"train_loss": -8.575708389282227, "global_step": 61848, "epoch": 368} {"train_loss": -8.671274185180664, "global_step": 61849, "epoch": 368} {"train_loss": -8.947310447692871, "global_step": 61850, "epoch": 368} {"train_loss": -8.682013511657715, "global_step": 61851, "epoch": 368} {"train_loss": -8.46982192993164, "global_step": 61852, "epoch": 368} {"train_loss": -8.58217716217041, "global_step": 61853, "epoch": 368} {"train_loss": -8.59538459777832, "global_step": 61854, "epoch": 368} {"train_loss": -8.820959091186523, "global_step": 61855, "epoch": 368} {"train_loss": -8.860267639160156, "global_step": 61856, "epoch": 368} {"train_loss": -8.583978652954102, "global_step": 61857, "epoch": 368} {"train_loss": -8.685102462768555, "global_step": 61858, "epoch": 368} {"train_loss": -8.900689125061035, "global_step": 61859, "epoch": 368} {"train_loss": -8.845256805419922, "global_step": 61860, "epoch": 368} {"train_loss": -8.759090423583984, "global_step": 61861, "epoch": 368} {"train_loss": -8.713508605957031, "global_step": 61862, "epoch": 368} {"train_loss": -8.710453033447266, "global_step": 61863, "epoch": 368} {"train_loss": -8.404870986938477, "global_step": 61864, "epoch": 368} {"train_loss": -8.251891136169434, "global_step": 61865, "epoch": 368} {"train_loss": -8.344289779663086, "global_step": 61866, "epoch": 368} {"train_loss": -8.261652946472168, "global_step": 61867, "epoch": 368} {"train_loss": -8.299358367919922, "global_step": 61868, "epoch": 368} {"train_loss": -8.64455509185791, "global_step": 61869, "epoch": 368} {"train_loss": -8.326889038085938, "global_step": 61870, "epoch": 368} {"train_loss": -8.525586128234863, "global_step": 61871, "epoch": 368} {"train_loss": -8.567206382751465, "global_step": 61872, "epoch": 368} {"train_loss": -8.659623146057129, "global_step": 61873, "epoch": 368} {"train_loss": -8.352684020996094, "global_step": 61874, "epoch": 368} {"train_loss": -8.654216766357422, "global_step": 61875, "epoch": 368} {"train_loss": -8.401937484741211, "global_step": 61876, "epoch": 368} {"train_loss": -8.363008499145508, "global_step": 61877, "epoch": 368} {"train_loss": -8.495177268981934, "global_step": 61878, "epoch": 368} {"train_loss": -8.647823333740234, "global_step": 61879, "epoch": 368} {"train_loss": -8.407058715820312, "global_step": 61880, "epoch": 368} {"train_loss": -8.501643180847168, "global_step": 61881, "epoch": 368} {"train_loss": -8.731074333190918, "global_step": 61882, "epoch": 368} {"train_loss": -8.49200439453125, "global_step": 61883, "epoch": 368} {"train_loss": -8.734037399291992, "global_step": 61884, "epoch": 368} {"train_loss": -8.62114429473877, "global_step": 61885, "epoch": 368} {"train_loss": -8.558385848999023, "global_step": 61886, "epoch": 368} {"train_loss": -8.639314651489258, "global_step": 61887, "epoch": 368} {"train_loss": -8.72082805633545, "global_step": 61888, "epoch": 368} {"train_loss": -8.314164161682129, "global_step": 61889, "epoch": 368} {"train_loss": -8.502477645874023, "global_step": 61890, "epoch": 368} {"train_loss": -8.894694328308105, "global_step": 61891, "epoch": 368} {"train_loss": -8.70093059539795, "global_step": 61892, "epoch": 368} {"train_loss": -8.927499771118164, "global_step": 61893, "epoch": 368} {"train_loss": -8.767963409423828, "global_step": 61894, "epoch": 368} {"train_loss": -8.441027641296387, "global_step": 61895, "epoch": 368} {"train_loss": -8.882829666137695, "global_step": 61896, "epoch": 368} {"train_loss": -8.593043327331543, "global_step": 61897, "epoch": 368} {"train_loss": -8.725038528442383, "global_step": 61898, "epoch": 368} {"train_loss": -8.790583610534668, "global_step": 61899, "epoch": 368} {"train_loss": -8.685422897338867, "global_step": 61900, "epoch": 368} {"train_loss": -8.824053764343262, "global_step": 61901, "epoch": 368} {"train_loss": -8.689994812011719, "global_step": 61902, "epoch": 368} {"train_loss": -8.57386302947998, "global_step": 61903, "epoch": 368} {"train_loss": -8.6231050491333, "global_step": 61904, "epoch": 368} {"train_loss": -8.362846374511719, "global_step": 61905, "epoch": 368} {"train_loss": -8.62946891784668, "global_step": 61906, "epoch": 368} {"train_loss": -8.4229154586792, "global_step": 61907, "epoch": 368} {"train_loss": -8.52098274230957, "global_step": 61908, "epoch": 368} {"train_loss": -8.341209411621094, "global_step": 61909, "epoch": 368} {"train_loss": -8.532028198242188, "global_step": 61910, "epoch": 368} {"train_loss": -8.389427185058594, "global_step": 61911, "epoch": 368} {"train_loss": -8.620509147644043, "global_step": 61912, "epoch": 368} {"train_loss": -8.68838119506836, "global_step": 61913, "epoch": 368} {"train_loss": -8.619077682495117, "global_step": 61914, "epoch": 368} {"train_loss": -8.805326461791992, "global_step": 61915, "epoch": 368} {"train_loss": -8.347955703735352, "global_step": 61916, "epoch": 368} {"train_loss": -8.464116096496582, "global_step": 61917, "epoch": 368} {"train_loss": -8.367133140563965, "global_step": 61918, "epoch": 368} {"train_loss": -8.577705383300781, "global_step": 61919, "epoch": 368} {"train_loss": -8.773490905761719, "global_step": 61920, "epoch": 368} {"train_loss": -8.75210189819336, "global_step": 61921, "epoch": 368} {"train_loss": -8.692474365234375, "global_step": 61922, "epoch": 368} {"train_loss": -8.504634857177734, "global_step": 61923, "epoch": 368} {"train_loss": -8.587188720703125, "global_step": 61924, "epoch": 368} {"train_loss": -8.726415634155273, "global_step": 61925, "epoch": 368} {"train_loss": -8.584508895874023, "global_step": 61926, "epoch": 368} {"train_loss": -8.635540008544922, "global_step": 61927, "epoch": 368} {"train_loss": -8.56926155090332, "global_step": 61928, "epoch": 368} {"train_loss": -8.709619522094727, "global_step": 61929, "epoch": 368} {"train_loss": -8.69467544555664, "global_step": 61930, "epoch": 368} {"train_loss": -8.767522811889648, "global_step": 61931, "epoch": 368} {"train_loss": -8.622795104980469, "global_step": 61932, "epoch": 368} {"train_loss": -8.834699630737305, "global_step": 61933, "epoch": 368} {"train_loss": -8.54405403137207, "global_step": 61934, "epoch": 368} {"train_loss": -8.792344093322754, "global_step": 61935, "epoch": 368} {"train_loss": -8.838132858276367, "global_step": 61936, "epoch": 368} {"train_loss": -8.734075546264648, "global_step": 61937, "epoch": 368} {"train_loss": -8.675514221191406, "global_step": 61938, "epoch": 368} {"train_loss": -9.010957717895508, "global_step": 61939, "epoch": 368} {"train_loss": -8.55801773071289, "global_step": 61940, "epoch": 368} {"train_loss": -8.599817276000977, "global_step": 61941, "epoch": 368} {"train_loss": -8.854954719543457, "global_step": 61942, "epoch": 368} {"train_loss": -8.604934692382812, "global_step": 61943, "epoch": 368} {"train_loss": -8.912209510803223, "global_step": 61944, "epoch": 368} {"train_loss": -8.890579223632812, "global_step": 61945, "epoch": 368} {"train_loss": -8.821490287780762, "global_step": 61946, "epoch": 368} {"train_loss": -8.469097137451172, "global_step": 61947, "epoch": 368} {"train_loss": -8.737180709838867, "global_step": 61948, "epoch": 368} {"train_loss": -8.53993034362793, "global_step": 61949, "epoch": 368} {"train_loss": -8.632637023925781, "global_step": 61950, "epoch": 368} {"train_loss": -8.73127555847168, "global_step": 61951, "epoch": 368} {"train_loss": -8.60306453704834, "global_step": 61952, "epoch": 368} {"train_loss": -8.724443435668945, "global_step": 61953, "epoch": 368} {"train_loss": -8.667317390441895, "global_step": 61954, "epoch": 368} {"train_loss": -8.352243423461914, "global_step": 61955, "epoch": 368} {"train_loss": -8.69749641418457, "global_step": 61956, "epoch": 368} {"train_loss": -8.603141784667969, "global_step": 61957, "epoch": 368} {"train_loss": -8.775468826293945, "global_step": 61958, "epoch": 368} {"train_loss": -8.706209182739258, "global_step": 61959, "epoch": 368} {"train_loss": -8.662591934204102, "global_step": 61960, "epoch": 368} {"train_loss": -8.780313491821289, "global_step": 61961, "epoch": 368} {"train_loss": -8.74278450012207, "global_step": 61962, "epoch": 368} {"train_loss": -8.502474784851074, "global_step": 61963, "epoch": 368} {"train_loss": -8.661165237426758, "global_step": 61964, "epoch": 368} {"train_loss": -8.801977157592773, "global_step": 61965, "epoch": 368} {"train_loss": -8.728937149047852, "global_step": 61966, "epoch": 368} {"train_loss": -8.69047737121582, "global_step": 61967, "epoch": 368} {"train_loss": -8.697962760925293, "global_step": 61968, "epoch": 368} {"train_loss": -8.647686958312988, "global_step": 61969, "epoch": 368} {"train_loss": -8.671419143676758, "global_step": 61970, "epoch": 368} {"train_loss": -8.857397079467773, "global_step": 61971, "epoch": 368} {"train_loss": -8.704768180847168, "global_step": 61972, "epoch": 368} {"train_loss": -8.68856430053711, "global_step": 61973, "epoch": 368} {"train_loss": -8.372335433959961, "global_step": 61974, "epoch": 368} {"train_loss": -8.68143081665039, "global_step": 61975, "epoch": 368} {"train_loss": -8.498332977294922, "global_step": 61976, "epoch": 368} {"train_loss": -8.685771942138672, "global_step": 61977, "epoch": 368} {"train_loss": -8.683794021606445, "global_step": 61978, "epoch": 368} {"train_loss": -8.719010353088379, "global_step": 61979, "epoch": 368} {"train_loss": -8.637713432312012, "global_step": 61980, "epoch": 368} {"train_loss": -8.763343811035156, "global_step": 61981, "epoch": 368} {"train_loss": -8.942689895629883, "global_step": 61982, "epoch": 368} {"train_loss": -8.675694465637207, "global_step": 61983, "epoch": 368} {"train_loss": -8.687365531921387, "global_step": 61984, "epoch": 368} {"train_loss": -8.649255752563477, "global_step": 61985, "epoch": 368} {"train_loss": -8.961702346801758, "global_step": 61986, "epoch": 368} {"train_loss": -9.025741577148438, "global_step": 61987, "epoch": 368} {"train_loss": -8.66267204284668, "global_step": 61988, "epoch": 368} {"train_loss": -8.721909523010254, "global_step": 61989, "epoch": 368} {"train_loss": -8.806875228881836, "global_step": 61990, "epoch": 368} {"train_loss": -8.619741331963311, "global_step": 61991, "epoch": 368, "val_loss": 195763.109375} {"train_loss": -8.742050170898438, "global_step": 61992, "epoch": 369} {"train_loss": -8.929855346679688, "global_step": 61993, "epoch": 369} {"train_loss": -8.781368255615234, "global_step": 61994, "epoch": 369} {"train_loss": -8.73501205444336, "global_step": 61995, "epoch": 369} {"train_loss": -8.885477066040039, "global_step": 61996, "epoch": 369} {"train_loss": -8.79764175415039, "global_step": 61997, "epoch": 369} {"train_loss": -8.881135940551758, "global_step": 61998, "epoch": 369} {"train_loss": -8.604652404785156, "global_step": 61999, "epoch": 369} {"train_loss": -8.92613697052002, "global_step": 62000, "epoch": 369} {"train_loss": -8.78378677368164, "global_step": 62001, "epoch": 369} {"train_loss": -8.833784103393555, "global_step": 62002, "epoch": 369} {"train_loss": -8.818347930908203, "global_step": 62003, "epoch": 369} {"train_loss": -8.730005264282227, "global_step": 62004, "epoch": 369} {"train_loss": -8.713947296142578, "global_step": 62005, "epoch": 369} {"train_loss": -8.614340782165527, "global_step": 62006, "epoch": 369} {"train_loss": -8.332246780395508, "global_step": 62007, "epoch": 369} {"train_loss": -9.086214065551758, "global_step": 62008, "epoch": 369} {"train_loss": -8.635741233825684, "global_step": 62009, "epoch": 369} {"train_loss": -8.929323196411133, "global_step": 62010, "epoch": 369} {"train_loss": -8.792572021484375, "global_step": 62011, "epoch": 369} {"train_loss": -8.852396011352539, "global_step": 62012, "epoch": 369} {"train_loss": -8.625993728637695, "global_step": 62013, "epoch": 369} {"train_loss": -8.767208099365234, "global_step": 62014, "epoch": 369} {"train_loss": -8.466687202453613, "global_step": 62015, "epoch": 369} {"train_loss": -8.732344627380371, "global_step": 62016, "epoch": 369} {"train_loss": -8.836997032165527, "global_step": 62017, "epoch": 369} {"train_loss": -8.704851150512695, "global_step": 62018, "epoch": 369} {"train_loss": -8.766536712646484, "global_step": 62019, "epoch": 369} {"train_loss": -8.729880332946777, "global_step": 62020, "epoch": 369} {"train_loss": -8.82787036895752, "global_step": 62021, "epoch": 369} {"train_loss": -8.738155364990234, "global_step": 62022, "epoch": 369} {"train_loss": -8.988354682922363, "global_step": 62023, "epoch": 369} {"train_loss": -8.826251983642578, "global_step": 62024, "epoch": 369} {"train_loss": -8.589921951293945, "global_step": 62025, "epoch": 369} {"train_loss": -8.719551086425781, "global_step": 62026, "epoch": 369} {"train_loss": -8.759456634521484, "global_step": 62027, "epoch": 369} {"train_loss": -8.648704528808594, "global_step": 62028, "epoch": 369} {"train_loss": -8.899646759033203, "global_step": 62029, "epoch": 369} {"train_loss": -8.876485824584961, "global_step": 62030, "epoch": 369} {"train_loss": -8.682129859924316, "global_step": 62031, "epoch": 369} {"train_loss": -8.986438751220703, "global_step": 62032, "epoch": 369} {"train_loss": -8.897636413574219, "global_step": 62033, "epoch": 369} {"train_loss": -9.079221725463867, "global_step": 62034, "epoch": 369} {"train_loss": -8.724647521972656, "global_step": 62035, "epoch": 369} {"train_loss": -8.850512504577637, "global_step": 62036, "epoch": 369} {"train_loss": -9.03509521484375, "global_step": 62037, "epoch": 369} {"train_loss": -8.787793159484863, "global_step": 62038, "epoch": 369} {"train_loss": -8.756410598754883, "global_step": 62039, "epoch": 369} {"train_loss": -8.884803771972656, "global_step": 62040, "epoch": 369} {"train_loss": -8.745307922363281, "global_step": 62041, "epoch": 369} {"train_loss": -8.78067398071289, "global_step": 62042, "epoch": 369} {"train_loss": -8.893369674682617, "global_step": 62043, "epoch": 369} {"train_loss": -8.843791961669922, "global_step": 62044, "epoch": 369} {"train_loss": -8.644495964050293, "global_step": 62045, "epoch": 369} {"train_loss": -8.811853408813477, "global_step": 62046, "epoch": 369} {"train_loss": -8.819784164428711, "global_step": 62047, "epoch": 369} {"train_loss": -8.678789138793945, "global_step": 62048, "epoch": 369} {"train_loss": -8.710601806640625, "global_step": 62049, "epoch": 369} {"train_loss": -8.524799346923828, "global_step": 62050, "epoch": 369} {"train_loss": -8.72120475769043, "global_step": 62051, "epoch": 369} {"train_loss": -8.678007125854492, "global_step": 62052, "epoch": 369} {"train_loss": -8.533851623535156, "global_step": 62053, "epoch": 369} {"train_loss": -8.643595695495605, "global_step": 62054, "epoch": 369} {"train_loss": -8.280475616455078, "global_step": 62055, "epoch": 369} {"train_loss": -8.271016120910645, "global_step": 62056, "epoch": 369} {"train_loss": -8.746679306030273, "global_step": 62057, "epoch": 369} {"train_loss": -8.645162582397461, "global_step": 62058, "epoch": 369} {"train_loss": -8.715996742248535, "global_step": 62059, "epoch": 369} {"train_loss": -8.603034973144531, "global_step": 62060, "epoch": 369} {"train_loss": -8.66836166381836, "global_step": 62061, "epoch": 369} {"train_loss": -8.639531135559082, "global_step": 62062, "epoch": 369} {"train_loss": -8.767343521118164, "global_step": 62063, "epoch": 369} {"train_loss": -8.7403564453125, "global_step": 62064, "epoch": 369} {"train_loss": -8.736353874206543, "global_step": 62065, "epoch": 369} {"train_loss": -8.615382194519043, "global_step": 62066, "epoch": 369} {"train_loss": -8.66162395477295, "global_step": 62067, "epoch": 369} {"train_loss": -8.504411697387695, "global_step": 62068, "epoch": 369} {"train_loss": -8.540365219116211, "global_step": 62069, "epoch": 369} {"train_loss": -8.575404167175293, "global_step": 62070, "epoch": 369} {"train_loss": -8.544759750366211, "global_step": 62071, "epoch": 369} {"train_loss": -8.756444931030273, "global_step": 62072, "epoch": 369} {"train_loss": -8.653076171875, "global_step": 62073, "epoch": 369} {"train_loss": -8.61263656616211, "global_step": 62074, "epoch": 369} {"train_loss": -8.830117225646973, "global_step": 62075, "epoch": 369} {"train_loss": -8.663067817687988, "global_step": 62076, "epoch": 369} {"train_loss": -8.812400817871094, "global_step": 62077, "epoch": 369} {"train_loss": -8.69853401184082, "global_step": 62078, "epoch": 369} {"train_loss": -8.859565734863281, "global_step": 62079, "epoch": 369} {"train_loss": -8.636636734008789, "global_step": 62080, "epoch": 369} {"train_loss": -8.65660285949707, "global_step": 62081, "epoch": 369} {"train_loss": -8.766603469848633, "global_step": 62082, "epoch": 369} {"train_loss": -8.710869789123535, "global_step": 62083, "epoch": 369} {"train_loss": -8.917810440063477, "global_step": 62084, "epoch": 369} {"train_loss": -8.72198486328125, "global_step": 62085, "epoch": 369} {"train_loss": -8.8955078125, "global_step": 62086, "epoch": 369} {"train_loss": -8.875945091247559, "global_step": 62087, "epoch": 369} {"train_loss": -8.966028213500977, "global_step": 62088, "epoch": 369} {"train_loss": -8.724800109863281, "global_step": 62089, "epoch": 369} {"train_loss": -8.928750991821289, "global_step": 62090, "epoch": 369} {"train_loss": -8.816812515258789, "global_step": 62091, "epoch": 369} {"train_loss": -8.968685150146484, "global_step": 62092, "epoch": 369} {"train_loss": -8.764060974121094, "global_step": 62093, "epoch": 369} {"train_loss": -8.719867706298828, "global_step": 62094, "epoch": 369} {"train_loss": -8.64597225189209, "global_step": 62095, "epoch": 369} {"train_loss": -8.675946235656738, "global_step": 62096, "epoch": 369} {"train_loss": -8.92855453491211, "global_step": 62097, "epoch": 369} {"train_loss": -8.898519515991211, "global_step": 62098, "epoch": 369} {"train_loss": -8.764411926269531, "global_step": 62099, "epoch": 369} {"train_loss": -8.711064338684082, "global_step": 62100, "epoch": 369} {"train_loss": -8.828977584838867, "global_step": 62101, "epoch": 369} {"train_loss": -8.58112907409668, "global_step": 62102, "epoch": 369} {"train_loss": -8.745716094970703, "global_step": 62103, "epoch": 369} {"train_loss": -8.757484436035156, "global_step": 62104, "epoch": 369} {"train_loss": -8.815716743469238, "global_step": 62105, "epoch": 369} {"train_loss": -8.721388816833496, "global_step": 62106, "epoch": 369} {"train_loss": -8.79723834991455, "global_step": 62107, "epoch": 369} {"train_loss": -8.467803001403809, "global_step": 62108, "epoch": 369} {"train_loss": -8.696876525878906, "global_step": 62109, "epoch": 369} {"train_loss": -8.877279281616211, "global_step": 62110, "epoch": 369} {"train_loss": -8.610624313354492, "global_step": 62111, "epoch": 369} {"train_loss": -8.871931076049805, "global_step": 62112, "epoch": 369} {"train_loss": -8.548422813415527, "global_step": 62113, "epoch": 369} {"train_loss": -8.503301620483398, "global_step": 62114, "epoch": 369} {"train_loss": -8.402146339416504, "global_step": 62115, "epoch": 369} {"train_loss": -8.638948440551758, "global_step": 62116, "epoch": 369} {"train_loss": -8.338920593261719, "global_step": 62117, "epoch": 369} {"train_loss": -8.321700096130371, "global_step": 62118, "epoch": 369} {"train_loss": -8.528230667114258, "global_step": 62119, "epoch": 369} {"train_loss": -7.985595703125, "global_step": 62120, "epoch": 369} {"train_loss": -8.64830207824707, "global_step": 62121, "epoch": 369} {"train_loss": -8.236641883850098, "global_step": 62122, "epoch": 369} {"train_loss": -8.570539474487305, "global_step": 62123, "epoch": 369} {"train_loss": -8.469161987304688, "global_step": 62124, "epoch": 369} {"train_loss": -8.295450210571289, "global_step": 62125, "epoch": 369} {"train_loss": -8.482548713684082, "global_step": 62126, "epoch": 369} {"train_loss": -8.379539489746094, "global_step": 62127, "epoch": 369} {"train_loss": -8.436139106750488, "global_step": 62128, "epoch": 369} {"train_loss": -8.47671127319336, "global_step": 62129, "epoch": 369} {"train_loss": -8.463672637939453, "global_step": 62130, "epoch": 369} {"train_loss": -8.513973236083984, "global_step": 62131, "epoch": 369} {"train_loss": -8.74365234375, "global_step": 62132, "epoch": 369} {"train_loss": -8.61535358428955, "global_step": 62133, "epoch": 369} {"train_loss": -8.694238662719727, "global_step": 62134, "epoch": 369} {"train_loss": -8.24505615234375, "global_step": 62135, "epoch": 369} {"train_loss": -8.746410369873047, "global_step": 62136, "epoch": 369} {"train_loss": -8.391172409057617, "global_step": 62137, "epoch": 369} {"train_loss": -8.642965316772461, "global_step": 62138, "epoch": 369} {"train_loss": -8.569866180419922, "global_step": 62139, "epoch": 369} {"train_loss": -8.741758346557617, "global_step": 62140, "epoch": 369} {"train_loss": -8.576211929321289, "global_step": 62141, "epoch": 369} {"train_loss": -8.671463012695312, "global_step": 62142, "epoch": 369} {"train_loss": -8.634242057800293, "global_step": 62143, "epoch": 369} {"train_loss": -8.76839828491211, "global_step": 62144, "epoch": 369} {"train_loss": -8.39684009552002, "global_step": 62145, "epoch": 369} {"train_loss": -8.700563430786133, "global_step": 62146, "epoch": 369} {"train_loss": -8.667078018188477, "global_step": 62147, "epoch": 369} {"train_loss": -8.764713287353516, "global_step": 62148, "epoch": 369} {"train_loss": -8.625944137573242, "global_step": 62149, "epoch": 369} {"train_loss": -8.735859870910645, "global_step": 62150, "epoch": 369} {"train_loss": -8.553206443786621, "global_step": 62151, "epoch": 369} {"train_loss": -8.970820426940918, "global_step": 62152, "epoch": 369} {"train_loss": -8.819095611572266, "global_step": 62153, "epoch": 369} {"train_loss": -8.887060165405273, "global_step": 62154, "epoch": 369} {"train_loss": -8.922212600708008, "global_step": 62155, "epoch": 369} {"train_loss": -8.81229019165039, "global_step": 62156, "epoch": 369} {"train_loss": -8.910577774047852, "global_step": 62157, "epoch": 369} {"train_loss": -8.695398330688477, "global_step": 62158, "epoch": 369} {"train_loss": -8.700654359090896, "global_step": 62159, "epoch": 369, "val_loss": 194181.921875} {"train_loss": -8.753154754638672, "global_step": 62160, "epoch": 370} {"train_loss": -8.635369300842285, "global_step": 62161, "epoch": 370} {"train_loss": -8.575730323791504, "global_step": 62162, "epoch": 370} {"train_loss": -9.007336616516113, "global_step": 62163, "epoch": 370} {"train_loss": -8.723367691040039, "global_step": 62164, "epoch": 370} {"train_loss": -8.950695991516113, "global_step": 62165, "epoch": 370} {"train_loss": -8.758735656738281, "global_step": 62166, "epoch": 370} {"train_loss": -8.93459415435791, "global_step": 62167, "epoch": 370} {"train_loss": -8.631860733032227, "global_step": 62168, "epoch": 370} {"train_loss": -8.875480651855469, "global_step": 62169, "epoch": 370} {"train_loss": -8.679037094116211, "global_step": 62170, "epoch": 370} {"train_loss": -8.893821716308594, "global_step": 62171, "epoch": 370} {"train_loss": -8.89990520477295, "global_step": 62172, "epoch": 370} {"train_loss": -8.79671859741211, "global_step": 62173, "epoch": 370} {"train_loss": -8.702340126037598, "global_step": 62174, "epoch": 370} {"train_loss": -8.619416236877441, "global_step": 62175, "epoch": 370} {"train_loss": -8.71335220336914, "global_step": 62176, "epoch": 370} {"train_loss": -8.845258712768555, "global_step": 62177, "epoch": 370} {"train_loss": -8.556325912475586, "global_step": 62178, "epoch": 370} {"train_loss": -8.742877960205078, "global_step": 62179, "epoch": 370} {"train_loss": -8.830163955688477, "global_step": 62180, "epoch": 370} {"train_loss": -8.793590545654297, "global_step": 62181, "epoch": 370} {"train_loss": -8.671112060546875, "global_step": 62182, "epoch": 370} {"train_loss": -8.63068675994873, "global_step": 62183, "epoch": 370} {"train_loss": -8.722991943359375, "global_step": 62184, "epoch": 370} {"train_loss": -8.597328186035156, "global_step": 62185, "epoch": 370} {"train_loss": -8.615019798278809, "global_step": 62186, "epoch": 370} {"train_loss": -8.746199607849121, "global_step": 62187, "epoch": 370} {"train_loss": -8.489368438720703, "global_step": 62188, "epoch": 370} {"train_loss": -8.838245391845703, "global_step": 62189, "epoch": 370} {"train_loss": -8.849329948425293, "global_step": 62190, "epoch": 370} {"train_loss": -8.664700508117676, "global_step": 62191, "epoch": 370} {"train_loss": -8.855842590332031, "global_step": 62192, "epoch": 370} {"train_loss": -9.130212783813477, "global_step": 62193, "epoch": 370} {"train_loss": -8.645977973937988, "global_step": 62194, "epoch": 370} {"train_loss": -8.946441650390625, "global_step": 62195, "epoch": 370} {"train_loss": -8.768385887145996, "global_step": 62196, "epoch": 370} {"train_loss": -9.030722618103027, "global_step": 62197, "epoch": 370} {"train_loss": -8.480079650878906, "global_step": 62198, "epoch": 370} {"train_loss": -8.68537712097168, "global_step": 62199, "epoch": 370} {"train_loss": -8.663837432861328, "global_step": 62200, "epoch": 370} {"train_loss": -8.441317558288574, "global_step": 62201, "epoch": 370} {"train_loss": -9.106515884399414, "global_step": 62202, "epoch": 370} {"train_loss": -8.591001510620117, "global_step": 62203, "epoch": 370} {"train_loss": -8.612700462341309, "global_step": 62204, "epoch": 370} {"train_loss": -8.949874877929688, "global_step": 62205, "epoch": 370} {"train_loss": -8.690332412719727, "global_step": 62206, "epoch": 370} {"train_loss": -8.508821487426758, "global_step": 62207, "epoch": 370} {"train_loss": -8.647534370422363, "global_step": 62208, "epoch": 370} {"train_loss": -8.71072769165039, "global_step": 62209, "epoch": 370} {"train_loss": -8.664119720458984, "global_step": 62210, "epoch": 370} {"train_loss": -8.649253845214844, "global_step": 62211, "epoch": 370} {"train_loss": -8.715791702270508, "global_step": 62212, "epoch": 370} {"train_loss": -8.708826065063477, "global_step": 62213, "epoch": 370} {"train_loss": -8.763408660888672, "global_step": 62214, "epoch": 370} {"train_loss": -8.730917930603027, "global_step": 62215, "epoch": 370} {"train_loss": -8.7947416305542, "global_step": 62216, "epoch": 370} {"train_loss": -8.532552719116211, "global_step": 62217, "epoch": 370} {"train_loss": -8.709207534790039, "global_step": 62218, "epoch": 370} {"train_loss": -8.7267484664917, "global_step": 62219, "epoch": 370} {"train_loss": -8.903003692626953, "global_step": 62220, "epoch": 370} {"train_loss": -8.741820335388184, "global_step": 62221, "epoch": 370} {"train_loss": -8.719792366027832, "global_step": 62222, "epoch": 370} {"train_loss": -8.633502960205078, "global_step": 62223, "epoch": 370} {"train_loss": -8.772026062011719, "global_step": 62224, "epoch": 370} {"train_loss": -8.848203659057617, "global_step": 62225, "epoch": 370} {"train_loss": -8.848724365234375, "global_step": 62226, "epoch": 370} {"train_loss": -8.909713745117188, "global_step": 62227, "epoch": 370} {"train_loss": -8.70829963684082, "global_step": 62228, "epoch": 370} {"train_loss": -8.944862365722656, "global_step": 62229, "epoch": 370} {"train_loss": -8.888477325439453, "global_step": 62230, "epoch": 370} {"train_loss": -8.799274444580078, "global_step": 62231, "epoch": 370} {"train_loss": -8.969080924987793, "global_step": 62232, "epoch": 370} {"train_loss": -8.787015914916992, "global_step": 62233, "epoch": 370} {"train_loss": -8.874335289001465, "global_step": 62234, "epoch": 370} {"train_loss": -8.891483306884766, "global_step": 62235, "epoch": 370} {"train_loss": -8.664506912231445, "global_step": 62236, "epoch": 370} {"train_loss": -8.584210395812988, "global_step": 62237, "epoch": 370} {"train_loss": -8.966293334960938, "global_step": 62238, "epoch": 370} {"train_loss": -8.824991226196289, "global_step": 62239, "epoch": 370} {"train_loss": -8.982511520385742, "global_step": 62240, "epoch": 370} {"train_loss": -8.829275131225586, "global_step": 62241, "epoch": 370} {"train_loss": -8.833487510681152, "global_step": 62242, "epoch": 370} {"train_loss": -8.910575866699219, "global_step": 62243, "epoch": 370} {"train_loss": -8.760732650756836, "global_step": 62244, "epoch": 370} {"train_loss": -8.583301544189453, "global_step": 62245, "epoch": 370} {"train_loss": -8.599377632141113, "global_step": 62246, "epoch": 370} {"train_loss": -8.737866401672363, "global_step": 62247, "epoch": 370} {"train_loss": -8.755212783813477, "global_step": 62248, "epoch": 370} {"train_loss": -8.965689659118652, "global_step": 62249, "epoch": 370} {"train_loss": -8.8375825881958, "global_step": 62250, "epoch": 370} {"train_loss": -8.576799392700195, "global_step": 62251, "epoch": 370} {"train_loss": -8.599435806274414, "global_step": 62252, "epoch": 370} {"train_loss": -8.309446334838867, "global_step": 62253, "epoch": 370} {"train_loss": -8.826184272766113, "global_step": 62254, "epoch": 370} {"train_loss": -8.364116668701172, "global_step": 62255, "epoch": 370} {"train_loss": -8.655099868774414, "global_step": 62256, "epoch": 370} {"train_loss": -8.478015899658203, "global_step": 62257, "epoch": 370} {"train_loss": -8.59495735168457, "global_step": 62258, "epoch": 370} {"train_loss": -8.760902404785156, "global_step": 62259, "epoch": 370} {"train_loss": -8.729762077331543, "global_step": 62260, "epoch": 370} {"train_loss": -8.830201148986816, "global_step": 62261, "epoch": 370} {"train_loss": -8.795493125915527, "global_step": 62262, "epoch": 370} {"train_loss": -8.745736122131348, "global_step": 62263, "epoch": 370} {"train_loss": -8.748440742492676, "global_step": 62264, "epoch": 370} {"train_loss": -8.925785064697266, "global_step": 62265, "epoch": 370} {"train_loss": -8.800185203552246, "global_step": 62266, "epoch": 370} {"train_loss": -8.868661880493164, "global_step": 62267, "epoch": 370} {"train_loss": -8.749160766601562, "global_step": 62268, "epoch": 370} {"train_loss": -8.401148796081543, "global_step": 62269, "epoch": 370} {"train_loss": -8.576236724853516, "global_step": 62270, "epoch": 370} {"train_loss": -8.679780960083008, "global_step": 62271, "epoch": 370} {"train_loss": -8.729452133178711, "global_step": 62272, "epoch": 370} {"train_loss": -8.822909355163574, "global_step": 62273, "epoch": 370} {"train_loss": -8.540773391723633, "global_step": 62274, "epoch": 370} {"train_loss": -8.880003929138184, "global_step": 62275, "epoch": 370} {"train_loss": -8.771230697631836, "global_step": 62276, "epoch": 370} {"train_loss": -8.72288703918457, "global_step": 62277, "epoch": 370} {"train_loss": -8.715520858764648, "global_step": 62278, "epoch": 370} {"train_loss": -8.707039833068848, "global_step": 62279, "epoch": 370} {"train_loss": -8.516494750976562, "global_step": 62280, "epoch": 370} {"train_loss": -8.386805534362793, "global_step": 62281, "epoch": 370} {"train_loss": -8.305627822875977, "global_step": 62282, "epoch": 370} {"train_loss": -8.370268821716309, "global_step": 62283, "epoch": 370} {"train_loss": -8.671684265136719, "global_step": 62284, "epoch": 370} {"train_loss": -8.584819793701172, "global_step": 62285, "epoch": 370} {"train_loss": -8.660562515258789, "global_step": 62286, "epoch": 370} {"train_loss": -8.530235290527344, "global_step": 62287, "epoch": 370} {"train_loss": -8.677465438842773, "global_step": 62288, "epoch": 370} {"train_loss": -8.412670135498047, "global_step": 62289, "epoch": 370} {"train_loss": -8.517448425292969, "global_step": 62290, "epoch": 370} {"train_loss": -8.99873161315918, "global_step": 62291, "epoch": 370} {"train_loss": -8.478078842163086, "global_step": 62292, "epoch": 370} {"train_loss": -8.564994812011719, "global_step": 62293, "epoch": 370} {"train_loss": -8.866021156311035, "global_step": 62294, "epoch": 370} {"train_loss": -8.704777717590332, "global_step": 62295, "epoch": 370} {"train_loss": -8.535258293151855, "global_step": 62296, "epoch": 370} {"train_loss": -8.582966804504395, "global_step": 62297, "epoch": 370} {"train_loss": -8.761409759521484, "global_step": 62298, "epoch": 370} {"train_loss": -8.73189926147461, "global_step": 62299, "epoch": 370} {"train_loss": -8.60728645324707, "global_step": 62300, "epoch": 370} {"train_loss": -8.90512466430664, "global_step": 62301, "epoch": 370} {"train_loss": -8.71247673034668, "global_step": 62302, "epoch": 370} {"train_loss": -8.688819885253906, "global_step": 62303, "epoch": 370} {"train_loss": -8.916604995727539, "global_step": 62304, "epoch": 370} {"train_loss": -8.635486602783203, "global_step": 62305, "epoch": 370} {"train_loss": -8.738835334777832, "global_step": 62306, "epoch": 370} {"train_loss": -8.464408874511719, "global_step": 62307, "epoch": 370} {"train_loss": -8.926977157592773, "global_step": 62308, "epoch": 370} {"train_loss": -8.602180480957031, "global_step": 62309, "epoch": 370} {"train_loss": -8.92525863647461, "global_step": 62310, "epoch": 370} {"train_loss": -8.949810028076172, "global_step": 62311, "epoch": 370} {"train_loss": -8.807062149047852, "global_step": 62312, "epoch": 370} {"train_loss": -8.99595832824707, "global_step": 62313, "epoch": 370} {"train_loss": -9.06461238861084, "global_step": 62314, "epoch": 370} {"train_loss": -8.962821960449219, "global_step": 62315, "epoch": 370} {"train_loss": -8.807419776916504, "global_step": 62316, "epoch": 370} {"train_loss": -8.888453483581543, "global_step": 62317, "epoch": 370} {"train_loss": -8.979411125183105, "global_step": 62318, "epoch": 370} {"train_loss": -8.427736282348633, "global_step": 62319, "epoch": 370} {"train_loss": -8.71047306060791, "global_step": 62320, "epoch": 370} {"train_loss": -8.375442504882812, "global_step": 62321, "epoch": 370} {"train_loss": -8.766461372375488, "global_step": 62322, "epoch": 370} {"train_loss": -8.855911254882812, "global_step": 62323, "epoch": 370} {"train_loss": -8.891443252563477, "global_step": 62324, "epoch": 370} {"train_loss": -8.603280067443848, "global_step": 62325, "epoch": 370} {"train_loss": -8.606489181518555, "global_step": 62326, "epoch": 370} {"train_loss": -8.729117234547934, "global_step": 62327, "epoch": 370, "val_loss": 190269.625, "train_action_mse_error": 8.438081741333008} {"train_loss": -8.66226577758789, "global_step": 62328, "epoch": 371} {"train_loss": -8.889205932617188, "global_step": 62329, "epoch": 371} {"train_loss": -8.811847686767578, "global_step": 62330, "epoch": 371} {"train_loss": -8.326225280761719, "global_step": 62331, "epoch": 371} {"train_loss": -8.620269775390625, "global_step": 62332, "epoch": 371} {"train_loss": -8.39809799194336, "global_step": 62333, "epoch": 371} {"train_loss": -8.536201477050781, "global_step": 62334, "epoch": 371} {"train_loss": -8.35282039642334, "global_step": 62335, "epoch": 371} {"train_loss": -8.78587532043457, "global_step": 62336, "epoch": 371} {"train_loss": -8.498342514038086, "global_step": 62337, "epoch": 371} {"train_loss": -8.625858306884766, "global_step": 62338, "epoch": 371} {"train_loss": -8.621660232543945, "global_step": 62339, "epoch": 371} {"train_loss": -8.550130844116211, "global_step": 62340, "epoch": 371} {"train_loss": -8.518606185913086, "global_step": 62341, "epoch": 371} {"train_loss": -8.572549819946289, "global_step": 62342, "epoch": 371} {"train_loss": -8.712909698486328, "global_step": 62343, "epoch": 371} {"train_loss": -8.910089492797852, "global_step": 62344, "epoch": 371} {"train_loss": -8.760425567626953, "global_step": 62345, "epoch": 371} {"train_loss": -8.90140151977539, "global_step": 62346, "epoch": 371} {"train_loss": -8.774911880493164, "global_step": 62347, "epoch": 371} {"train_loss": -8.811031341552734, "global_step": 62348, "epoch": 371} {"train_loss": -8.72625732421875, "global_step": 62349, "epoch": 371} {"train_loss": -9.022865295410156, "global_step": 62350, "epoch": 371} {"train_loss": -8.650191307067871, "global_step": 62351, "epoch": 371} {"train_loss": -8.744256973266602, "global_step": 62352, "epoch": 371} {"train_loss": -8.673696517944336, "global_step": 62353, "epoch": 371} {"train_loss": -8.871875762939453, "global_step": 62354, "epoch": 371} {"train_loss": -8.797094345092773, "global_step": 62355, "epoch": 371} {"train_loss": -8.93925666809082, "global_step": 62356, "epoch": 371} {"train_loss": -8.798534393310547, "global_step": 62357, "epoch": 371} {"train_loss": -8.860320091247559, "global_step": 62358, "epoch": 371} {"train_loss": -8.65491771697998, "global_step": 62359, "epoch": 371} {"train_loss": -8.810972213745117, "global_step": 62360, "epoch": 371} {"train_loss": -8.810550689697266, "global_step": 62361, "epoch": 371} {"train_loss": -8.635029792785645, "global_step": 62362, "epoch": 371} {"train_loss": -9.014183044433594, "global_step": 62363, "epoch": 371} {"train_loss": -8.50349235534668, "global_step": 62364, "epoch": 371} {"train_loss": -8.917844772338867, "global_step": 62365, "epoch": 371} {"train_loss": -8.950286865234375, "global_step": 62366, "epoch": 371} {"train_loss": -8.795650482177734, "global_step": 62367, "epoch": 371} {"train_loss": -8.98598861694336, "global_step": 62368, "epoch": 371} {"train_loss": -8.828662872314453, "global_step": 62369, "epoch": 371} {"train_loss": -8.918004989624023, "global_step": 62370, "epoch": 371} {"train_loss": -8.637451171875, "global_step": 62371, "epoch": 371} {"train_loss": -8.719362258911133, "global_step": 62372, "epoch": 371} {"train_loss": -8.377192497253418, "global_step": 62373, "epoch": 371} {"train_loss": -8.847164154052734, "global_step": 62374, "epoch": 371} {"train_loss": -8.27377700805664, "global_step": 62375, "epoch": 371} {"train_loss": -8.638237953186035, "global_step": 62376, "epoch": 371} {"train_loss": -8.452128410339355, "global_step": 62377, "epoch": 371} {"train_loss": -8.35226821899414, "global_step": 62378, "epoch": 371} {"train_loss": -8.748932838439941, "global_step": 62379, "epoch": 371} {"train_loss": -8.793174743652344, "global_step": 62380, "epoch": 371} {"train_loss": -8.665284156799316, "global_step": 62381, "epoch": 371} {"train_loss": -8.75328254699707, "global_step": 62382, "epoch": 371} {"train_loss": -8.75969123840332, "global_step": 62383, "epoch": 371} {"train_loss": -8.260207176208496, "global_step": 62384, "epoch": 371} {"train_loss": -8.845986366271973, "global_step": 62385, "epoch": 371} {"train_loss": -8.663457870483398, "global_step": 62386, "epoch": 371} {"train_loss": -8.921393394470215, "global_step": 62387, "epoch": 371} {"train_loss": -8.860128402709961, "global_step": 62388, "epoch": 371} {"train_loss": -8.812541007995605, "global_step": 62389, "epoch": 371} {"train_loss": -8.817169189453125, "global_step": 62390, "epoch": 371} {"train_loss": -8.841215133666992, "global_step": 62391, "epoch": 371} {"train_loss": -8.75566291809082, "global_step": 62392, "epoch": 371} {"train_loss": -8.609639167785645, "global_step": 62393, "epoch": 371} {"train_loss": -8.797628402709961, "global_step": 62394, "epoch": 371} {"train_loss": -8.782770156860352, "global_step": 62395, "epoch": 371} {"train_loss": -8.76365852355957, "global_step": 62396, "epoch": 371} {"train_loss": -9.114612579345703, "global_step": 62397, "epoch": 371} {"train_loss": -8.667983055114746, "global_step": 62398, "epoch": 371} {"train_loss": -8.673837661743164, "global_step": 62399, "epoch": 371} {"train_loss": -8.690568923950195, "global_step": 62400, "epoch": 371} {"train_loss": -8.534305572509766, "global_step": 62401, "epoch": 371} {"train_loss": -8.734307289123535, "global_step": 62402, "epoch": 371} {"train_loss": -8.624242782592773, "global_step": 62403, "epoch": 371} {"train_loss": -8.588930130004883, "global_step": 62404, "epoch": 371} {"train_loss": -8.824502944946289, "global_step": 62405, "epoch": 371} {"train_loss": -8.833423614501953, "global_step": 62406, "epoch": 371} {"train_loss": -8.702825546264648, "global_step": 62407, "epoch": 371} {"train_loss": -9.02430534362793, "global_step": 62408, "epoch": 371} {"train_loss": -8.67430305480957, "global_step": 62409, "epoch": 371} {"train_loss": -8.74440860748291, "global_step": 62410, "epoch": 371} {"train_loss": -9.018257141113281, "global_step": 62411, "epoch": 371} {"train_loss": -8.803169250488281, "global_step": 62412, "epoch": 371} {"train_loss": -8.920021057128906, "global_step": 62413, "epoch": 371} {"train_loss": -8.831581115722656, "global_step": 62414, "epoch": 371} {"train_loss": -8.774070739746094, "global_step": 62415, "epoch": 371} {"train_loss": -8.595684051513672, "global_step": 62416, "epoch": 371} {"train_loss": -8.694469451904297, "global_step": 62417, "epoch": 371} {"train_loss": -8.890764236450195, "global_step": 62418, "epoch": 371} {"train_loss": -8.655807495117188, "global_step": 62419, "epoch": 371} {"train_loss": -8.804520606994629, "global_step": 62420, "epoch": 371} {"train_loss": -8.873510360717773, "global_step": 62421, "epoch": 371} {"train_loss": -8.669593811035156, "global_step": 62422, "epoch": 371} {"train_loss": -8.165472030639648, "global_step": 62423, "epoch": 371} {"train_loss": -8.932960510253906, "global_step": 62424, "epoch": 371} {"train_loss": -8.538281440734863, "global_step": 62425, "epoch": 371} {"train_loss": -8.625312805175781, "global_step": 62426, "epoch": 371} {"train_loss": -8.883940696716309, "global_step": 62427, "epoch": 371} {"train_loss": -8.581539154052734, "global_step": 62428, "epoch": 371} {"train_loss": -8.783740997314453, "global_step": 62429, "epoch": 371} {"train_loss": -8.801947593688965, "global_step": 62430, "epoch": 371} {"train_loss": -8.867889404296875, "global_step": 62431, "epoch": 371} {"train_loss": -8.675535202026367, "global_step": 62432, "epoch": 371} {"train_loss": -8.557380676269531, "global_step": 62433, "epoch": 371} {"train_loss": -8.700407028198242, "global_step": 62434, "epoch": 371} {"train_loss": -8.646966934204102, "global_step": 62435, "epoch": 371} {"train_loss": -8.62608528137207, "global_step": 62436, "epoch": 371} {"train_loss": -8.603164672851562, "global_step": 62437, "epoch": 371} {"train_loss": -8.563240051269531, "global_step": 62438, "epoch": 371} {"train_loss": -8.726027488708496, "global_step": 62439, "epoch": 371} {"train_loss": -8.504563331604004, "global_step": 62440, "epoch": 371} {"train_loss": -8.820367813110352, "global_step": 62441, "epoch": 371} {"train_loss": -8.639806747436523, "global_step": 62442, "epoch": 371} {"train_loss": -8.798041343688965, "global_step": 62443, "epoch": 371} {"train_loss": -8.774364471435547, "global_step": 62444, "epoch": 371} {"train_loss": -8.816051483154297, "global_step": 62445, "epoch": 371} {"train_loss": -8.78672981262207, "global_step": 62446, "epoch": 371} {"train_loss": -8.8767728805542, "global_step": 62447, "epoch": 371} {"train_loss": -8.713140487670898, "global_step": 62448, "epoch": 371} {"train_loss": -8.798820495605469, "global_step": 62449, "epoch": 371} {"train_loss": -8.543668746948242, "global_step": 62450, "epoch": 371} {"train_loss": -8.671012878417969, "global_step": 62451, "epoch": 371} {"train_loss": -8.668468475341797, "global_step": 62452, "epoch": 371} {"train_loss": -9.03097152709961, "global_step": 62453, "epoch": 371} {"train_loss": -8.834332466125488, "global_step": 62454, "epoch": 371} {"train_loss": -8.796871185302734, "global_step": 62455, "epoch": 371} {"train_loss": -8.908711433410645, "global_step": 62456, "epoch": 371} {"train_loss": -8.953655242919922, "global_step": 62457, "epoch": 371} {"train_loss": -9.001877784729004, "global_step": 62458, "epoch": 371} {"train_loss": -8.697409629821777, "global_step": 62459, "epoch": 371} {"train_loss": -8.913105964660645, "global_step": 62460, "epoch": 371} {"train_loss": -9.05123519897461, "global_step": 62461, "epoch": 371} {"train_loss": -8.769298553466797, "global_step": 62462, "epoch": 371} {"train_loss": -8.673246383666992, "global_step": 62463, "epoch": 371} {"train_loss": -8.60854721069336, "global_step": 62464, "epoch": 371} {"train_loss": -8.594902038574219, "global_step": 62465, "epoch": 371} {"train_loss": -8.482057571411133, "global_step": 62466, "epoch": 371} {"train_loss": -8.742814064025879, "global_step": 62467, "epoch": 371} {"train_loss": -8.601937294006348, "global_step": 62468, "epoch": 371} {"train_loss": -8.846302032470703, "global_step": 62469, "epoch": 371} {"train_loss": -8.946754455566406, "global_step": 62470, "epoch": 371} {"train_loss": -8.737845420837402, "global_step": 62471, "epoch": 371} {"train_loss": -8.788976669311523, "global_step": 62472, "epoch": 371} {"train_loss": -8.767766952514648, "global_step": 62473, "epoch": 371} {"train_loss": -8.990643501281738, "global_step": 62474, "epoch": 371} {"train_loss": -8.71597671508789, "global_step": 62475, "epoch": 371} {"train_loss": -9.04713249206543, "global_step": 62476, "epoch": 371} {"train_loss": -8.54074478149414, "global_step": 62477, "epoch": 371} {"train_loss": -8.918540000915527, "global_step": 62478, "epoch": 371} {"train_loss": -8.803913116455078, "global_step": 62479, "epoch": 371} {"train_loss": -8.511857032775879, "global_step": 62480, "epoch": 371} {"train_loss": -8.879026412963867, "global_step": 62481, "epoch": 371} {"train_loss": -8.567281723022461, "global_step": 62482, "epoch": 371} {"train_loss": -8.713415145874023, "global_step": 62483, "epoch": 371} {"train_loss": -8.429431915283203, "global_step": 62484, "epoch": 371} {"train_loss": -8.884966850280762, "global_step": 62485, "epoch": 371} {"train_loss": -8.616418838500977, "global_step": 62486, "epoch": 371} {"train_loss": -8.552299499511719, "global_step": 62487, "epoch": 371} {"train_loss": -8.74463176727295, "global_step": 62488, "epoch": 371} {"train_loss": -8.74574089050293, "global_step": 62489, "epoch": 371} {"train_loss": -8.813262939453125, "global_step": 62490, "epoch": 371} {"train_loss": -8.589214324951172, "global_step": 62491, "epoch": 371} {"train_loss": -8.728668212890625, "global_step": 62492, "epoch": 371} {"train_loss": -8.742549896240234, "global_step": 62493, "epoch": 371} {"train_loss": -8.65038776397705, "global_step": 62494, "epoch": 371} {"train_loss": -8.728864334878468, "global_step": 62495, "epoch": 371, "val_loss": 189962.96875} {"train_loss": -8.529208183288574, "global_step": 62496, "epoch": 372} {"train_loss": -8.29796028137207, "global_step": 62497, "epoch": 372} {"train_loss": -8.552305221557617, "global_step": 62498, "epoch": 372} {"train_loss": -8.224024772644043, "global_step": 62499, "epoch": 372} {"train_loss": -8.666952133178711, "global_step": 62500, "epoch": 372} {"train_loss": -8.642224311828613, "global_step": 62501, "epoch": 372} {"train_loss": -8.566609382629395, "global_step": 62502, "epoch": 372} {"train_loss": -8.747396469116211, "global_step": 62503, "epoch": 372} {"train_loss": -8.592399597167969, "global_step": 62504, "epoch": 372} {"train_loss": -8.62521743774414, "global_step": 62505, "epoch": 372} {"train_loss": -8.643177032470703, "global_step": 62506, "epoch": 372} {"train_loss": -8.617056846618652, "global_step": 62507, "epoch": 372} {"train_loss": -8.968713760375977, "global_step": 62508, "epoch": 372} {"train_loss": -8.619564056396484, "global_step": 62509, "epoch": 372} {"train_loss": -8.739055633544922, "global_step": 62510, "epoch": 372} {"train_loss": -8.357820510864258, "global_step": 62511, "epoch": 372} {"train_loss": -8.875531196594238, "global_step": 62512, "epoch": 372} {"train_loss": -8.886489868164062, "global_step": 62513, "epoch": 372} {"train_loss": -8.923656463623047, "global_step": 62514, "epoch": 372} {"train_loss": -8.78654956817627, "global_step": 62515, "epoch": 372} {"train_loss": -8.67425537109375, "global_step": 62516, "epoch": 372} {"train_loss": -8.780683517456055, "global_step": 62517, "epoch": 372} {"train_loss": -8.861988067626953, "global_step": 62518, "epoch": 372} {"train_loss": -8.88232707977295, "global_step": 62519, "epoch": 372} {"train_loss": -8.696361541748047, "global_step": 62520, "epoch": 372} {"train_loss": -8.629132270812988, "global_step": 62521, "epoch": 372} {"train_loss": -8.746078491210938, "global_step": 62522, "epoch": 372} {"train_loss": -8.365865707397461, "global_step": 62523, "epoch": 372} {"train_loss": -8.826530456542969, "global_step": 62524, "epoch": 372} {"train_loss": -8.440738677978516, "global_step": 62525, "epoch": 372} {"train_loss": -8.743183135986328, "global_step": 62526, "epoch": 372} {"train_loss": -8.643909454345703, "global_step": 62527, "epoch": 372} {"train_loss": -8.56326675415039, "global_step": 62528, "epoch": 372} {"train_loss": -8.223761558532715, "global_step": 62529, "epoch": 372} {"train_loss": -8.439117431640625, "global_step": 62530, "epoch": 372} {"train_loss": -8.437332153320312, "global_step": 62531, "epoch": 372} {"train_loss": -8.474204063415527, "global_step": 62532, "epoch": 372} {"train_loss": -8.505792617797852, "global_step": 62533, "epoch": 372} {"train_loss": -8.4583740234375, "global_step": 62534, "epoch": 372} {"train_loss": -8.376567840576172, "global_step": 62535, "epoch": 372} {"train_loss": -8.325437545776367, "global_step": 62536, "epoch": 372} {"train_loss": -8.512741088867188, "global_step": 62537, "epoch": 372} {"train_loss": -8.642866134643555, "global_step": 62538, "epoch": 372} {"train_loss": -8.730128288269043, "global_step": 62539, "epoch": 372} {"train_loss": -8.62868881225586, "global_step": 62540, "epoch": 372} {"train_loss": -8.670452117919922, "global_step": 62541, "epoch": 372} {"train_loss": -8.654165267944336, "global_step": 62542, "epoch": 372} {"train_loss": -8.732497215270996, "global_step": 62543, "epoch": 372} {"train_loss": -8.852384567260742, "global_step": 62544, "epoch": 372} {"train_loss": -8.751537322998047, "global_step": 62545, "epoch": 372} {"train_loss": -8.634529113769531, "global_step": 62546, "epoch": 372} {"train_loss": -8.750862121582031, "global_step": 62547, "epoch": 372} {"train_loss": -8.622186660766602, "global_step": 62548, "epoch": 372} {"train_loss": -8.690434455871582, "global_step": 62549, "epoch": 372} {"train_loss": -8.614886283874512, "global_step": 62550, "epoch": 372} {"train_loss": -8.734955787658691, "global_step": 62551, "epoch": 372} {"train_loss": -8.880853652954102, "global_step": 62552, "epoch": 372} {"train_loss": -8.737451553344727, "global_step": 62553, "epoch": 372} {"train_loss": -8.849625587463379, "global_step": 62554, "epoch": 372} {"train_loss": -8.784364700317383, "global_step": 62555, "epoch": 372} {"train_loss": -8.903070449829102, "global_step": 62556, "epoch": 372} {"train_loss": -8.721382141113281, "global_step": 62557, "epoch": 372} {"train_loss": -8.729398727416992, "global_step": 62558, "epoch": 372} {"train_loss": -8.879331588745117, "global_step": 62559, "epoch": 372} {"train_loss": -8.798140525817871, "global_step": 62560, "epoch": 372} {"train_loss": -8.52682113647461, "global_step": 62561, "epoch": 372} {"train_loss": -8.84256649017334, "global_step": 62562, "epoch": 372} {"train_loss": -8.86137580871582, "global_step": 62563, "epoch": 372} {"train_loss": -8.863564491271973, "global_step": 62564, "epoch": 372} {"train_loss": -8.663484573364258, "global_step": 62565, "epoch": 372} {"train_loss": -8.744129180908203, "global_step": 62566, "epoch": 372} {"train_loss": -8.357881546020508, "global_step": 62567, "epoch": 372} {"train_loss": -8.615381240844727, "global_step": 62568, "epoch": 372} {"train_loss": -8.633054733276367, "global_step": 62569, "epoch": 372} {"train_loss": -8.69453239440918, "global_step": 62570, "epoch": 372} {"train_loss": -8.688333511352539, "global_step": 62571, "epoch": 372} {"train_loss": -8.600101470947266, "global_step": 62572, "epoch": 372} {"train_loss": -8.591773986816406, "global_step": 62573, "epoch": 372} {"train_loss": -8.702701568603516, "global_step": 62574, "epoch": 372} {"train_loss": -8.60444164276123, "global_step": 62575, "epoch": 372} {"train_loss": -8.790696144104004, "global_step": 62576, "epoch": 372} {"train_loss": -8.814257621765137, "global_step": 62577, "epoch": 372} {"train_loss": -8.54721736907959, "global_step": 62578, "epoch": 372} {"train_loss": -8.383808135986328, "global_step": 62579, "epoch": 372} {"train_loss": -8.716468811035156, "global_step": 62580, "epoch": 372} {"train_loss": -8.646590232849121, "global_step": 62581, "epoch": 372} {"train_loss": -8.599258422851562, "global_step": 62582, "epoch": 372} {"train_loss": -8.722399711608887, "global_step": 62583, "epoch": 372} {"train_loss": -8.535745620727539, "global_step": 62584, "epoch": 372} {"train_loss": -8.713472366333008, "global_step": 62585, "epoch": 372} {"train_loss": -8.80103588104248, "global_step": 62586, "epoch": 372} {"train_loss": -8.779844284057617, "global_step": 62587, "epoch": 372} {"train_loss": -8.829717636108398, "global_step": 62588, "epoch": 372} {"train_loss": -8.92315673828125, "global_step": 62589, "epoch": 372} {"train_loss": -8.76781940460205, "global_step": 62590, "epoch": 372} {"train_loss": -8.644362449645996, "global_step": 62591, "epoch": 372} {"train_loss": -8.902995109558105, "global_step": 62592, "epoch": 372} {"train_loss": -8.609480857849121, "global_step": 62593, "epoch": 372} {"train_loss": -8.742033004760742, "global_step": 62594, "epoch": 372} {"train_loss": -8.88077449798584, "global_step": 62595, "epoch": 372} {"train_loss": -8.679224014282227, "global_step": 62596, "epoch": 372} {"train_loss": -8.991633415222168, "global_step": 62597, "epoch": 372} {"train_loss": -8.90489673614502, "global_step": 62598, "epoch": 372} {"train_loss": -8.524239540100098, "global_step": 62599, "epoch": 372} {"train_loss": -8.652606010437012, "global_step": 62600, "epoch": 372} {"train_loss": -8.88958740234375, "global_step": 62601, "epoch": 372} {"train_loss": -8.836421012878418, "global_step": 62602, "epoch": 372} {"train_loss": -8.83177375793457, "global_step": 62603, "epoch": 372} {"train_loss": -8.453396797180176, "global_step": 62604, "epoch": 372} {"train_loss": -8.640270233154297, "global_step": 62605, "epoch": 372} {"train_loss": -8.219154357910156, "global_step": 62606, "epoch": 372} {"train_loss": -8.509557723999023, "global_step": 62607, "epoch": 372} {"train_loss": -8.682563781738281, "global_step": 62608, "epoch": 372} {"train_loss": -8.593902587890625, "global_step": 62609, "epoch": 372} {"train_loss": -8.48509693145752, "global_step": 62610, "epoch": 372} {"train_loss": -8.4577054977417, "global_step": 62611, "epoch": 372} {"train_loss": -8.606511116027832, "global_step": 62612, "epoch": 372} {"train_loss": -8.564908981323242, "global_step": 62613, "epoch": 372} {"train_loss": -8.683731079101562, "global_step": 62614, "epoch": 372} {"train_loss": -8.481285095214844, "global_step": 62615, "epoch": 372} {"train_loss": -8.627288818359375, "global_step": 62616, "epoch": 372} {"train_loss": -8.661893844604492, "global_step": 62617, "epoch": 372} {"train_loss": -8.818729400634766, "global_step": 62618, "epoch": 372} {"train_loss": -8.489840507507324, "global_step": 62619, "epoch": 372} {"train_loss": -8.612695693969727, "global_step": 62620, "epoch": 372} {"train_loss": -8.447349548339844, "global_step": 62621, "epoch": 372} {"train_loss": -8.880982398986816, "global_step": 62622, "epoch": 372} {"train_loss": -8.587418556213379, "global_step": 62623, "epoch": 372} {"train_loss": -8.819454193115234, "global_step": 62624, "epoch": 372} {"train_loss": -8.57306957244873, "global_step": 62625, "epoch": 372} {"train_loss": -8.838140487670898, "global_step": 62626, "epoch": 372} {"train_loss": -8.902639389038086, "global_step": 62627, "epoch": 372} {"train_loss": -8.807275772094727, "global_step": 62628, "epoch": 372} {"train_loss": -8.59585952758789, "global_step": 62629, "epoch": 372} {"train_loss": -8.85411262512207, "global_step": 62630, "epoch": 372} {"train_loss": -8.795633316040039, "global_step": 62631, "epoch": 372} {"train_loss": -8.864144325256348, "global_step": 62632, "epoch": 372} {"train_loss": -8.704833984375, "global_step": 62633, "epoch": 372} {"train_loss": -8.724743843078613, "global_step": 62634, "epoch": 372} {"train_loss": -8.766305923461914, "global_step": 62635, "epoch": 372} {"train_loss": -8.662282943725586, "global_step": 62636, "epoch": 372} {"train_loss": -8.817915916442871, "global_step": 62637, "epoch": 372} {"train_loss": -8.686326026916504, "global_step": 62638, "epoch": 372} {"train_loss": -8.82497501373291, "global_step": 62639, "epoch": 372} {"train_loss": -8.779056549072266, "global_step": 62640, "epoch": 372} {"train_loss": -8.826223373413086, "global_step": 62641, "epoch": 372} {"train_loss": -8.809236526489258, "global_step": 62642, "epoch": 372} {"train_loss": -8.783285140991211, "global_step": 62643, "epoch": 372} {"train_loss": -8.87679672241211, "global_step": 62644, "epoch": 372} {"train_loss": -8.82692813873291, "global_step": 62645, "epoch": 372} {"train_loss": -8.777763366699219, "global_step": 62646, "epoch": 372} {"train_loss": -8.813562393188477, "global_step": 62647, "epoch": 372} {"train_loss": -8.927973747253418, "global_step": 62648, "epoch": 372} {"train_loss": -8.626784324645996, "global_step": 62649, "epoch": 372} {"train_loss": -8.862215042114258, "global_step": 62650, "epoch": 372} {"train_loss": -8.652379035949707, "global_step": 62651, "epoch": 372} {"train_loss": -8.767111778259277, "global_step": 62652, "epoch": 372} {"train_loss": -8.910362243652344, "global_step": 62653, "epoch": 372} {"train_loss": -8.647031784057617, "global_step": 62654, "epoch": 372} {"train_loss": -8.972064018249512, "global_step": 62655, "epoch": 372} {"train_loss": -8.78995418548584, "global_step": 62656, "epoch": 372} {"train_loss": -8.715934753417969, "global_step": 62657, "epoch": 372} {"train_loss": -8.794107437133789, "global_step": 62658, "epoch": 372} {"train_loss": -8.665599822998047, "global_step": 62659, "epoch": 372} {"train_loss": -8.715734481811523, "global_step": 62660, "epoch": 372} {"train_loss": -8.724109649658203, "global_step": 62661, "epoch": 372} {"train_loss": -8.772010803222656, "global_step": 62662, "epoch": 372} {"train_loss": -8.68810860883622, "global_step": 62663, "epoch": 372, "val_loss": 190719.578125} {"train_loss": -8.571561813354492, "global_step": 62664, "epoch": 373} {"train_loss": -8.679767608642578, "global_step": 62665, "epoch": 373} {"train_loss": -8.865890502929688, "global_step": 62666, "epoch": 373} {"train_loss": -8.433908462524414, "global_step": 62667, "epoch": 373} {"train_loss": -8.936609268188477, "global_step": 62668, "epoch": 373} {"train_loss": -8.667407989501953, "global_step": 62669, "epoch": 373} {"train_loss": -8.77965259552002, "global_step": 62670, "epoch": 373} {"train_loss": -8.82132339477539, "global_step": 62671, "epoch": 373} {"train_loss": -8.829851150512695, "global_step": 62672, "epoch": 373} {"train_loss": -8.55327033996582, "global_step": 62673, "epoch": 373} {"train_loss": -8.722335815429688, "global_step": 62674, "epoch": 373} {"train_loss": -8.595003128051758, "global_step": 62675, "epoch": 373} {"train_loss": -8.687891006469727, "global_step": 62676, "epoch": 373} {"train_loss": -8.588207244873047, "global_step": 62677, "epoch": 373} {"train_loss": -8.82803726196289, "global_step": 62678, "epoch": 373} {"train_loss": -8.54874038696289, "global_step": 62679, "epoch": 373} {"train_loss": -8.640891075134277, "global_step": 62680, "epoch": 373} {"train_loss": -8.69595718383789, "global_step": 62681, "epoch": 373} {"train_loss": -8.380481719970703, "global_step": 62682, "epoch": 373} {"train_loss": -8.492776870727539, "global_step": 62683, "epoch": 373} {"train_loss": -8.731536865234375, "global_step": 62684, "epoch": 373} {"train_loss": -8.55320930480957, "global_step": 62685, "epoch": 373} {"train_loss": -8.605755805969238, "global_step": 62686, "epoch": 373} {"train_loss": -8.526676177978516, "global_step": 62687, "epoch": 373} {"train_loss": -8.72882080078125, "global_step": 62688, "epoch": 373} {"train_loss": -8.288335800170898, "global_step": 62689, "epoch": 373} {"train_loss": -8.89056396484375, "global_step": 62690, "epoch": 373} {"train_loss": -8.638952255249023, "global_step": 62691, "epoch": 373} {"train_loss": -8.565019607543945, "global_step": 62692, "epoch": 373} {"train_loss": -8.823533058166504, "global_step": 62693, "epoch": 373} {"train_loss": -8.830625534057617, "global_step": 62694, "epoch": 373} {"train_loss": -8.771434783935547, "global_step": 62695, "epoch": 373} {"train_loss": -8.624348640441895, "global_step": 62696, "epoch": 373} {"train_loss": -8.751678466796875, "global_step": 62697, "epoch": 373} {"train_loss": -8.839117050170898, "global_step": 62698, "epoch": 373} {"train_loss": -8.625304222106934, "global_step": 62699, "epoch": 373} {"train_loss": -8.547751426696777, "global_step": 62700, "epoch": 373} {"train_loss": -8.855464935302734, "global_step": 62701, "epoch": 373} {"train_loss": -8.77189826965332, "global_step": 62702, "epoch": 373} {"train_loss": -8.854442596435547, "global_step": 62703, "epoch": 373} {"train_loss": -8.761995315551758, "global_step": 62704, "epoch": 373} {"train_loss": -8.88058090209961, "global_step": 62705, "epoch": 373} {"train_loss": -8.717207908630371, "global_step": 62706, "epoch": 373} {"train_loss": -8.466424942016602, "global_step": 62707, "epoch": 373} {"train_loss": -8.692411422729492, "global_step": 62708, "epoch": 373} {"train_loss": -8.78533935546875, "global_step": 62709, "epoch": 373} {"train_loss": -8.791379928588867, "global_step": 62710, "epoch": 373} {"train_loss": -8.835225105285645, "global_step": 62711, "epoch": 373} {"train_loss": -8.723806381225586, "global_step": 62712, "epoch": 373} {"train_loss": -8.425275802612305, "global_step": 62713, "epoch": 373} {"train_loss": -8.625629425048828, "global_step": 62714, "epoch": 373} {"train_loss": -8.646158218383789, "global_step": 62715, "epoch": 373} {"train_loss": -8.631220817565918, "global_step": 62716, "epoch": 373} {"train_loss": -8.405525207519531, "global_step": 62717, "epoch": 373} {"train_loss": -8.751087188720703, "global_step": 62718, "epoch": 373} {"train_loss": -8.520467758178711, "global_step": 62719, "epoch": 373} {"train_loss": -8.860910415649414, "global_step": 62720, "epoch": 373} {"train_loss": -8.383050918579102, "global_step": 62721, "epoch": 373} {"train_loss": -8.536788940429688, "global_step": 62722, "epoch": 373} {"train_loss": -8.678916931152344, "global_step": 62723, "epoch": 373} {"train_loss": -8.574568748474121, "global_step": 62724, "epoch": 373} {"train_loss": -8.530430793762207, "global_step": 62725, "epoch": 373} {"train_loss": -8.322347640991211, "global_step": 62726, "epoch": 373} {"train_loss": -8.338994979858398, "global_step": 62727, "epoch": 373} {"train_loss": -8.374289512634277, "global_step": 62728, "epoch": 373} {"train_loss": -8.603076934814453, "global_step": 62729, "epoch": 373} {"train_loss": -8.67214298248291, "global_step": 62730, "epoch": 373} {"train_loss": -8.460984230041504, "global_step": 62731, "epoch": 373} {"train_loss": -8.655256271362305, "global_step": 62732, "epoch": 373} {"train_loss": -8.520700454711914, "global_step": 62733, "epoch": 373} {"train_loss": -8.748071670532227, "global_step": 62734, "epoch": 373} {"train_loss": -8.901248931884766, "global_step": 62735, "epoch": 373} {"train_loss": -8.628074645996094, "global_step": 62736, "epoch": 373} {"train_loss": -8.714509963989258, "global_step": 62737, "epoch": 373} {"train_loss": -8.688835144042969, "global_step": 62738, "epoch": 373} {"train_loss": -8.575246810913086, "global_step": 62739, "epoch": 373} {"train_loss": -8.96110725402832, "global_step": 62740, "epoch": 373} {"train_loss": -8.80223560333252, "global_step": 62741, "epoch": 373} {"train_loss": -8.828668594360352, "global_step": 62742, "epoch": 373} {"train_loss": -8.741483688354492, "global_step": 62743, "epoch": 373} {"train_loss": -8.861946105957031, "global_step": 62744, "epoch": 373} {"train_loss": -8.756258010864258, "global_step": 62745, "epoch": 373} {"train_loss": -8.6708984375, "global_step": 62746, "epoch": 373} {"train_loss": -8.790605545043945, "global_step": 62747, "epoch": 373} {"train_loss": -8.585713386535645, "global_step": 62748, "epoch": 373} {"train_loss": -8.867643356323242, "global_step": 62749, "epoch": 373} {"train_loss": -8.621901512145996, "global_step": 62750, "epoch": 373} {"train_loss": -8.922186851501465, "global_step": 62751, "epoch": 373} {"train_loss": -8.622817993164062, "global_step": 62752, "epoch": 373} {"train_loss": -8.77962875366211, "global_step": 62753, "epoch": 373} {"train_loss": -8.692879676818848, "global_step": 62754, "epoch": 373} {"train_loss": -8.875608444213867, "global_step": 62755, "epoch": 373} {"train_loss": -8.726800918579102, "global_step": 62756, "epoch": 373} {"train_loss": -8.806770324707031, "global_step": 62757, "epoch": 373} {"train_loss": -8.693618774414062, "global_step": 62758, "epoch": 373} {"train_loss": -8.87074089050293, "global_step": 62759, "epoch": 373} {"train_loss": -8.900857925415039, "global_step": 62760, "epoch": 373} {"train_loss": -8.86272144317627, "global_step": 62761, "epoch": 373} {"train_loss": -8.883685111999512, "global_step": 62762, "epoch": 373} {"train_loss": -8.964451789855957, "global_step": 62763, "epoch": 373} {"train_loss": -8.946020126342773, "global_step": 62764, "epoch": 373} {"train_loss": -8.889110565185547, "global_step": 62765, "epoch": 373} {"train_loss": -8.87445068359375, "global_step": 62766, "epoch": 373} {"train_loss": -8.914468765258789, "global_step": 62767, "epoch": 373} {"train_loss": -8.985142707824707, "global_step": 62768, "epoch": 373} {"train_loss": -8.883813858032227, "global_step": 62769, "epoch": 373} {"train_loss": -8.656641006469727, "global_step": 62770, "epoch": 373} {"train_loss": -8.723175048828125, "global_step": 62771, "epoch": 373} {"train_loss": -8.864869117736816, "global_step": 62772, "epoch": 373} {"train_loss": -8.901571273803711, "global_step": 62773, "epoch": 373} {"train_loss": -8.651773452758789, "global_step": 62774, "epoch": 373} {"train_loss": -8.627496719360352, "global_step": 62775, "epoch": 373} {"train_loss": -8.827937126159668, "global_step": 62776, "epoch": 373} {"train_loss": -8.707511901855469, "global_step": 62777, "epoch": 373} {"train_loss": -8.65728759765625, "global_step": 62778, "epoch": 373} {"train_loss": -8.87668228149414, "global_step": 62779, "epoch": 373} {"train_loss": -8.576377868652344, "global_step": 62780, "epoch": 373} {"train_loss": -8.65510368347168, "global_step": 62781, "epoch": 373} {"train_loss": -8.644362449645996, "global_step": 62782, "epoch": 373} {"train_loss": -8.897699356079102, "global_step": 62783, "epoch": 373} {"train_loss": -8.725351333618164, "global_step": 62784, "epoch": 373} {"train_loss": -8.635316848754883, "global_step": 62785, "epoch": 373} {"train_loss": -8.720497131347656, "global_step": 62786, "epoch": 373} {"train_loss": -8.823892593383789, "global_step": 62787, "epoch": 373} {"train_loss": -8.962352752685547, "global_step": 62788, "epoch": 373} {"train_loss": -8.487335205078125, "global_step": 62789, "epoch": 373} {"train_loss": -8.694618225097656, "global_step": 62790, "epoch": 373} {"train_loss": -8.7075777053833, "global_step": 62791, "epoch": 373} {"train_loss": -8.501002311706543, "global_step": 62792, "epoch": 373} {"train_loss": -8.658526420593262, "global_step": 62793, "epoch": 373} {"train_loss": -8.534689903259277, "global_step": 62794, "epoch": 373} {"train_loss": -8.544710159301758, "global_step": 62795, "epoch": 373} {"train_loss": -8.558088302612305, "global_step": 62796, "epoch": 373} {"train_loss": -8.62382698059082, "global_step": 62797, "epoch": 373} {"train_loss": -8.382688522338867, "global_step": 62798, "epoch": 373} {"train_loss": -8.434093475341797, "global_step": 62799, "epoch": 373} {"train_loss": -8.605936050415039, "global_step": 62800, "epoch": 373} {"train_loss": -8.730915069580078, "global_step": 62801, "epoch": 373} {"train_loss": -8.595951080322266, "global_step": 62802, "epoch": 373} {"train_loss": -8.876084327697754, "global_step": 62803, "epoch": 373} {"train_loss": -8.526718139648438, "global_step": 62804, "epoch": 373} {"train_loss": -8.862356185913086, "global_step": 62805, "epoch": 373} {"train_loss": -8.607892990112305, "global_step": 62806, "epoch": 373} {"train_loss": -8.843893051147461, "global_step": 62807, "epoch": 373} {"train_loss": -8.276954650878906, "global_step": 62808, "epoch": 373} {"train_loss": -8.831528663635254, "global_step": 62809, "epoch": 373} {"train_loss": -8.366617202758789, "global_step": 62810, "epoch": 373} {"train_loss": -8.695945739746094, "global_step": 62811, "epoch": 373} {"train_loss": -8.599613189697266, "global_step": 62812, "epoch": 373} {"train_loss": -8.505680084228516, "global_step": 62813, "epoch": 373} {"train_loss": -8.783319473266602, "global_step": 62814, "epoch": 373} {"train_loss": -8.71745491027832, "global_step": 62815, "epoch": 373} {"train_loss": -8.836490631103516, "global_step": 62816, "epoch": 373} {"train_loss": -8.421815872192383, "global_step": 62817, "epoch": 373} {"train_loss": -8.826484680175781, "global_step": 62818, "epoch": 373} {"train_loss": -8.597031593322754, "global_step": 62819, "epoch": 373} {"train_loss": -8.770638465881348, "global_step": 62820, "epoch": 373} {"train_loss": -8.655831336975098, "global_step": 62821, "epoch": 373} {"train_loss": -8.750120162963867, "global_step": 62822, "epoch": 373} {"train_loss": -8.658655166625977, "global_step": 62823, "epoch": 373} {"train_loss": -8.831886291503906, "global_step": 62824, "epoch": 373} {"train_loss": -8.784598350524902, "global_step": 62825, "epoch": 373} {"train_loss": -8.682862281799316, "global_step": 62826, "epoch": 373} {"train_loss": -8.838132858276367, "global_step": 62827, "epoch": 373} {"train_loss": -8.639107704162598, "global_step": 62828, "epoch": 373} {"train_loss": -8.691388130187988, "global_step": 62829, "epoch": 373} {"train_loss": -8.64134407043457, "global_step": 62830, "epoch": 373} {"train_loss": -8.69081897962661, "global_step": 62831, "epoch": 373, "val_loss": 190118.5625} {"train_loss": -8.596253395080566, "global_step": 62832, "epoch": 374} {"train_loss": -8.829519271850586, "global_step": 62833, "epoch": 374} {"train_loss": -8.755504608154297, "global_step": 62834, "epoch": 374} {"train_loss": -8.683911323547363, "global_step": 62835, "epoch": 374} {"train_loss": -8.585256576538086, "global_step": 62836, "epoch": 374} {"train_loss": -8.94299602508545, "global_step": 62837, "epoch": 374} {"train_loss": -8.659348487854004, "global_step": 62838, "epoch": 374} {"train_loss": -8.589673042297363, "global_step": 62839, "epoch": 374} {"train_loss": -8.38667106628418, "global_step": 62840, "epoch": 374} {"train_loss": -8.605777740478516, "global_step": 62841, "epoch": 374} {"train_loss": -8.555980682373047, "global_step": 62842, "epoch": 374} {"train_loss": -8.782559394836426, "global_step": 62843, "epoch": 374} {"train_loss": -8.555527687072754, "global_step": 62844, "epoch": 374} {"train_loss": -8.659546852111816, "global_step": 62845, "epoch": 374} {"train_loss": -8.702352523803711, "global_step": 62846, "epoch": 374} {"train_loss": -8.681465148925781, "global_step": 62847, "epoch": 374} {"train_loss": -8.895713806152344, "global_step": 62848, "epoch": 374} {"train_loss": -8.836455345153809, "global_step": 62849, "epoch": 374} {"train_loss": -8.888307571411133, "global_step": 62850, "epoch": 374} {"train_loss": -8.637889862060547, "global_step": 62851, "epoch": 374} {"train_loss": -8.944886207580566, "global_step": 62852, "epoch": 374} {"train_loss": -9.00285816192627, "global_step": 62853, "epoch": 374} {"train_loss": -8.71473503112793, "global_step": 62854, "epoch": 374} {"train_loss": -8.731246948242188, "global_step": 62855, "epoch": 374} {"train_loss": -8.978395462036133, "global_step": 62856, "epoch": 374} {"train_loss": -8.385848045349121, "global_step": 62857, "epoch": 374} {"train_loss": -8.905136108398438, "global_step": 62858, "epoch": 374} {"train_loss": -8.53451919555664, "global_step": 62859, "epoch": 374} {"train_loss": -8.624345779418945, "global_step": 62860, "epoch": 374} {"train_loss": -8.725671768188477, "global_step": 62861, "epoch": 374} {"train_loss": -8.739070892333984, "global_step": 62862, "epoch": 374} {"train_loss": -8.715180397033691, "global_step": 62863, "epoch": 374} {"train_loss": -8.632396697998047, "global_step": 62864, "epoch": 374} {"train_loss": -9.00964641571045, "global_step": 62865, "epoch": 374} {"train_loss": -8.83983325958252, "global_step": 62866, "epoch": 374} {"train_loss": -8.545658111572266, "global_step": 62867, "epoch": 374} {"train_loss": -8.88003921508789, "global_step": 62868, "epoch": 374} {"train_loss": -8.590036392211914, "global_step": 62869, "epoch": 374} {"train_loss": -8.90595817565918, "global_step": 62870, "epoch": 374} {"train_loss": -8.385679244995117, "global_step": 62871, "epoch": 374} {"train_loss": -8.841592788696289, "global_step": 62872, "epoch": 374} {"train_loss": -8.789252281188965, "global_step": 62873, "epoch": 374} {"train_loss": -8.924261093139648, "global_step": 62874, "epoch": 374} {"train_loss": -8.714454650878906, "global_step": 62875, "epoch": 374} {"train_loss": -8.797250747680664, "global_step": 62876, "epoch": 374} {"train_loss": -8.807816505432129, "global_step": 62877, "epoch": 374} {"train_loss": -8.698662757873535, "global_step": 62878, "epoch": 374} {"train_loss": -8.876031875610352, "global_step": 62879, "epoch": 374} {"train_loss": -8.960338592529297, "global_step": 62880, "epoch": 374} {"train_loss": -8.99091911315918, "global_step": 62881, "epoch": 374} {"train_loss": -8.603423118591309, "global_step": 62882, "epoch": 374} {"train_loss": -8.846424102783203, "global_step": 62883, "epoch": 374} {"train_loss": -8.827470779418945, "global_step": 62884, "epoch": 374} {"train_loss": -8.564958572387695, "global_step": 62885, "epoch": 374} {"train_loss": -8.812835693359375, "global_step": 62886, "epoch": 374} {"train_loss": -8.622396469116211, "global_step": 62887, "epoch": 374} {"train_loss": -8.559000968933105, "global_step": 62888, "epoch": 374} {"train_loss": -8.644989013671875, "global_step": 62889, "epoch": 374} {"train_loss": -8.65449047088623, "global_step": 62890, "epoch": 374} {"train_loss": -8.658975601196289, "global_step": 62891, "epoch": 374} {"train_loss": -8.407820701599121, "global_step": 62892, "epoch": 374} {"train_loss": -8.824958801269531, "global_step": 62893, "epoch": 374} {"train_loss": -8.426000595092773, "global_step": 62894, "epoch": 374} {"train_loss": -8.60779094696045, "global_step": 62895, "epoch": 374} {"train_loss": -8.475709915161133, "global_step": 62896, "epoch": 374} {"train_loss": -8.656970977783203, "global_step": 62897, "epoch": 374} {"train_loss": -8.406460762023926, "global_step": 62898, "epoch": 374} {"train_loss": -8.615432739257812, "global_step": 62899, "epoch": 374} {"train_loss": -8.56403923034668, "global_step": 62900, "epoch": 374} {"train_loss": -8.496105194091797, "global_step": 62901, "epoch": 374} {"train_loss": -8.875526428222656, "global_step": 62902, "epoch": 374} {"train_loss": -8.6317720413208, "global_step": 62903, "epoch": 374} {"train_loss": -8.508708953857422, "global_step": 62904, "epoch": 374} {"train_loss": -8.61012077331543, "global_step": 62905, "epoch": 374} {"train_loss": -8.550649642944336, "global_step": 62906, "epoch": 374} {"train_loss": -8.709704399108887, "global_step": 62907, "epoch": 374} {"train_loss": -8.561805725097656, "global_step": 62908, "epoch": 374} {"train_loss": -8.707483291625977, "global_step": 62909, "epoch": 374} {"train_loss": -8.561795234680176, "global_step": 62910, "epoch": 374} {"train_loss": -8.754383087158203, "global_step": 62911, "epoch": 374} {"train_loss": -8.768383026123047, "global_step": 62912, "epoch": 374} {"train_loss": -8.91804313659668, "global_step": 62913, "epoch": 374} {"train_loss": -8.608586311340332, "global_step": 62914, "epoch": 374} {"train_loss": -8.691916465759277, "global_step": 62915, "epoch": 374} {"train_loss": -8.675920486450195, "global_step": 62916, "epoch": 374} {"train_loss": -8.683467864990234, "global_step": 62917, "epoch": 374} {"train_loss": -8.867433547973633, "global_step": 62918, "epoch": 374} {"train_loss": -8.691627502441406, "global_step": 62919, "epoch": 374} {"train_loss": -8.759220123291016, "global_step": 62920, "epoch": 374} {"train_loss": -8.60055160522461, "global_step": 62921, "epoch": 374} {"train_loss": -8.655579566955566, "global_step": 62922, "epoch": 374} {"train_loss": -8.849638938903809, "global_step": 62923, "epoch": 374} {"train_loss": -8.808788299560547, "global_step": 62924, "epoch": 374} {"train_loss": -8.799226760864258, "global_step": 62925, "epoch": 374} {"train_loss": -8.72360610961914, "global_step": 62926, "epoch": 374} {"train_loss": -8.561279296875, "global_step": 62927, "epoch": 374} {"train_loss": -8.877725601196289, "global_step": 62928, "epoch": 374} {"train_loss": -8.791933059692383, "global_step": 62929, "epoch": 374} {"train_loss": -8.741084098815918, "global_step": 62930, "epoch": 374} {"train_loss": -8.885213851928711, "global_step": 62931, "epoch": 374} {"train_loss": -8.7149658203125, "global_step": 62932, "epoch": 374} {"train_loss": -8.736078262329102, "global_step": 62933, "epoch": 374} {"train_loss": -8.469642639160156, "global_step": 62934, "epoch": 374} {"train_loss": -8.848066329956055, "global_step": 62935, "epoch": 374} {"train_loss": -8.505284309387207, "global_step": 62936, "epoch": 374} {"train_loss": -8.785815238952637, "global_step": 62937, "epoch": 374} {"train_loss": -8.985603332519531, "global_step": 62938, "epoch": 374} {"train_loss": -8.742841720581055, "global_step": 62939, "epoch": 374} {"train_loss": -8.732306480407715, "global_step": 62940, "epoch": 374} {"train_loss": -8.863021850585938, "global_step": 62941, "epoch": 374} {"train_loss": -8.835603713989258, "global_step": 62942, "epoch": 374} {"train_loss": -8.799270629882812, "global_step": 62943, "epoch": 374} {"train_loss": -8.563596725463867, "global_step": 62944, "epoch": 374} {"train_loss": -8.85139274597168, "global_step": 62945, "epoch": 374} {"train_loss": -8.614433288574219, "global_step": 62946, "epoch": 374} {"train_loss": -8.928630828857422, "global_step": 62947, "epoch": 374} {"train_loss": -8.860550880432129, "global_step": 62948, "epoch": 374} {"train_loss": -8.728285789489746, "global_step": 62949, "epoch": 374} {"train_loss": -8.411813735961914, "global_step": 62950, "epoch": 374} {"train_loss": -8.797290802001953, "global_step": 62951, "epoch": 374} {"train_loss": -8.710287094116211, "global_step": 62952, "epoch": 374} {"train_loss": -8.790629386901855, "global_step": 62953, "epoch": 374} {"train_loss": -8.639063835144043, "global_step": 62954, "epoch": 374} {"train_loss": -8.592769622802734, "global_step": 62955, "epoch": 374} {"train_loss": -8.726066589355469, "global_step": 62956, "epoch": 374} {"train_loss": -8.847347259521484, "global_step": 62957, "epoch": 374} {"train_loss": -8.44253921508789, "global_step": 62958, "epoch": 374} {"train_loss": -8.945191383361816, "global_step": 62959, "epoch": 374} {"train_loss": -8.803668975830078, "global_step": 62960, "epoch": 374} {"train_loss": -8.564099311828613, "global_step": 62961, "epoch": 374} {"train_loss": -8.480027198791504, "global_step": 62962, "epoch": 374} {"train_loss": -8.484349250793457, "global_step": 62963, "epoch": 374} {"train_loss": -8.523383140563965, "global_step": 62964, "epoch": 374} {"train_loss": -8.58559513092041, "global_step": 62965, "epoch": 374} {"train_loss": -8.80954360961914, "global_step": 62966, "epoch": 374} {"train_loss": -8.417911529541016, "global_step": 62967, "epoch": 374} {"train_loss": -8.502141952514648, "global_step": 62968, "epoch": 374} {"train_loss": -8.618598937988281, "global_step": 62969, "epoch": 374} {"train_loss": -8.600192070007324, "global_step": 62970, "epoch": 374} {"train_loss": -8.89399528503418, "global_step": 62971, "epoch": 374} {"train_loss": -8.41772747039795, "global_step": 62972, "epoch": 374} {"train_loss": -8.78126335144043, "global_step": 62973, "epoch": 374} {"train_loss": -8.657196044921875, "global_step": 62974, "epoch": 374} {"train_loss": -8.50261116027832, "global_step": 62975, "epoch": 374} {"train_loss": -8.621009826660156, "global_step": 62976, "epoch": 374} {"train_loss": -8.648551940917969, "global_step": 62977, "epoch": 374} {"train_loss": -8.566617012023926, "global_step": 62978, "epoch": 374} {"train_loss": -8.712119102478027, "global_step": 62979, "epoch": 374} {"train_loss": -8.689020156860352, "global_step": 62980, "epoch": 374} {"train_loss": -8.74831485748291, "global_step": 62981, "epoch": 374} {"train_loss": -8.756719589233398, "global_step": 62982, "epoch": 374} {"train_loss": -8.948283195495605, "global_step": 62983, "epoch": 374} {"train_loss": -8.772698402404785, "global_step": 62984, "epoch": 374} {"train_loss": -8.613243103027344, "global_step": 62985, "epoch": 374} {"train_loss": -8.74070930480957, "global_step": 62986, "epoch": 374} {"train_loss": -8.746214866638184, "global_step": 62987, "epoch": 374} {"train_loss": -8.554752349853516, "global_step": 62988, "epoch": 374} {"train_loss": -8.714990615844727, "global_step": 62989, "epoch": 374} {"train_loss": -8.775947570800781, "global_step": 62990, "epoch": 374} {"train_loss": -8.678390502929688, "global_step": 62991, "epoch": 374} {"train_loss": -8.50987720489502, "global_step": 62992, "epoch": 374} {"train_loss": -8.800921440124512, "global_step": 62993, "epoch": 374} {"train_loss": -8.862215995788574, "global_step": 62994, "epoch": 374} {"train_loss": -8.777442932128906, "global_step": 62995, "epoch": 374} {"train_loss": -8.77912712097168, "global_step": 62996, "epoch": 374} {"train_loss": -8.80068302154541, "global_step": 62997, "epoch": 374} {"train_loss": -8.99670124053955, "global_step": 62998, "epoch": 374} {"train_loss": -8.70363730476016, "global_step": 62999, "epoch": 374, "val_loss": 192773.78125} {"train_loss": -8.877906799316406, "global_step": 63000, "epoch": 375} {"train_loss": -8.790220260620117, "global_step": 63001, "epoch": 375} {"train_loss": -8.758892059326172, "global_step": 63002, "epoch": 375} {"train_loss": -8.828429222106934, "global_step": 63003, "epoch": 375} {"train_loss": -8.468952178955078, "global_step": 63004, "epoch": 375} {"train_loss": -8.852412223815918, "global_step": 63005, "epoch": 375} {"train_loss": -8.61251163482666, "global_step": 63006, "epoch": 375} {"train_loss": -8.827377319335938, "global_step": 63007, "epoch": 375} {"train_loss": -8.682013511657715, "global_step": 63008, "epoch": 375} {"train_loss": -8.826101303100586, "global_step": 63009, "epoch": 375} {"train_loss": -8.680624961853027, "global_step": 63010, "epoch": 375} {"train_loss": -8.690662384033203, "global_step": 63011, "epoch": 375} {"train_loss": -8.9237642288208, "global_step": 63012, "epoch": 375} {"train_loss": -8.585628509521484, "global_step": 63013, "epoch": 375} {"train_loss": -8.764775276184082, "global_step": 63014, "epoch": 375} {"train_loss": -8.889213562011719, "global_step": 63015, "epoch": 375} {"train_loss": -8.595369338989258, "global_step": 63016, "epoch": 375} {"train_loss": -8.722951889038086, "global_step": 63017, "epoch": 375} {"train_loss": -8.997257232666016, "global_step": 63018, "epoch": 375} {"train_loss": -8.484443664550781, "global_step": 63019, "epoch": 375} {"train_loss": -8.96649169921875, "global_step": 63020, "epoch": 375} {"train_loss": -8.727581024169922, "global_step": 63021, "epoch": 375} {"train_loss": -8.582526206970215, "global_step": 63022, "epoch": 375} {"train_loss": -8.570780754089355, "global_step": 63023, "epoch": 375} {"train_loss": -9.017126083374023, "global_step": 63024, "epoch": 375} {"train_loss": -8.571475982666016, "global_step": 63025, "epoch": 375} {"train_loss": -8.696308135986328, "global_step": 63026, "epoch": 375} {"train_loss": -8.695625305175781, "global_step": 63027, "epoch": 375} {"train_loss": -8.548336029052734, "global_step": 63028, "epoch": 375} {"train_loss": -8.802040100097656, "global_step": 63029, "epoch": 375} {"train_loss": -8.779579162597656, "global_step": 63030, "epoch": 375} {"train_loss": -8.38810920715332, "global_step": 63031, "epoch": 375} {"train_loss": -8.538934707641602, "global_step": 63032, "epoch": 375} {"train_loss": -8.681612968444824, "global_step": 63033, "epoch": 375} {"train_loss": -8.333866119384766, "global_step": 63034, "epoch": 375} {"train_loss": -8.115812301635742, "global_step": 63035, "epoch": 375} {"train_loss": -8.889398574829102, "global_step": 63036, "epoch": 375} {"train_loss": -8.28387451171875, "global_step": 63037, "epoch": 375} {"train_loss": -8.402048110961914, "global_step": 63038, "epoch": 375} {"train_loss": -8.591957092285156, "global_step": 63039, "epoch": 375} {"train_loss": -8.291126251220703, "global_step": 63040, "epoch": 375} {"train_loss": -8.469671249389648, "global_step": 63041, "epoch": 375} {"train_loss": -8.572775840759277, "global_step": 63042, "epoch": 375} {"train_loss": -8.529114723205566, "global_step": 63043, "epoch": 375} {"train_loss": -8.510502815246582, "global_step": 63044, "epoch": 375} {"train_loss": -8.57873821258545, "global_step": 63045, "epoch": 375} {"train_loss": -8.401877403259277, "global_step": 63046, "epoch": 375} {"train_loss": -8.62714958190918, "global_step": 63047, "epoch": 375} {"train_loss": -8.480795860290527, "global_step": 63048, "epoch": 375} {"train_loss": -8.65404224395752, "global_step": 63049, "epoch": 375} {"train_loss": -8.633543968200684, "global_step": 63050, "epoch": 375} {"train_loss": -8.52293586730957, "global_step": 63051, "epoch": 375} {"train_loss": -8.61130142211914, "global_step": 63052, "epoch": 375} {"train_loss": -8.522612571716309, "global_step": 63053, "epoch": 375} {"train_loss": -8.566792488098145, "global_step": 63054, "epoch": 375} {"train_loss": -8.59539794921875, "global_step": 63055, "epoch": 375} {"train_loss": -8.769977569580078, "global_step": 63056, "epoch": 375} {"train_loss": -8.779034614562988, "global_step": 63057, "epoch": 375} {"train_loss": -8.830024719238281, "global_step": 63058, "epoch": 375} {"train_loss": -8.61159610748291, "global_step": 63059, "epoch": 375} {"train_loss": -8.68442153930664, "global_step": 63060, "epoch": 375} {"train_loss": -8.882431030273438, "global_step": 63061, "epoch": 375} {"train_loss": -8.96154499053955, "global_step": 63062, "epoch": 375} {"train_loss": -8.749964714050293, "global_step": 63063, "epoch": 375} {"train_loss": -8.691943168640137, "global_step": 63064, "epoch": 375} {"train_loss": -8.910144805908203, "global_step": 63065, "epoch": 375} {"train_loss": -8.812653541564941, "global_step": 63066, "epoch": 375} {"train_loss": -8.773616790771484, "global_step": 63067, "epoch": 375} {"train_loss": -8.885683059692383, "global_step": 63068, "epoch": 375} {"train_loss": -8.973889350891113, "global_step": 63069, "epoch": 375} {"train_loss": -8.763452529907227, "global_step": 63070, "epoch": 375} {"train_loss": -9.003643035888672, "global_step": 63071, "epoch": 375} {"train_loss": -8.740403175354004, "global_step": 63072, "epoch": 375} {"train_loss": -8.647974967956543, "global_step": 63073, "epoch": 375} {"train_loss": -8.837196350097656, "global_step": 63074, "epoch": 375} {"train_loss": -8.685709953308105, "global_step": 63075, "epoch": 375} {"train_loss": -8.718208312988281, "global_step": 63076, "epoch": 375} {"train_loss": -8.644240379333496, "global_step": 63077, "epoch": 375} {"train_loss": -8.544317245483398, "global_step": 63078, "epoch": 375} {"train_loss": -8.626749992370605, "global_step": 63079, "epoch": 375} {"train_loss": -9.024621963500977, "global_step": 63080, "epoch": 375} {"train_loss": -9.02868366241455, "global_step": 63081, "epoch": 375} {"train_loss": -8.941080093383789, "global_step": 63082, "epoch": 375} {"train_loss": -8.763023376464844, "global_step": 63083, "epoch": 375} {"train_loss": -8.849040985107422, "global_step": 63084, "epoch": 375} {"train_loss": -8.714014053344727, "global_step": 63085, "epoch": 375} {"train_loss": -8.70796012878418, "global_step": 63086, "epoch": 375} {"train_loss": -8.661378860473633, "global_step": 63087, "epoch": 375} {"train_loss": -8.468908309936523, "global_step": 63088, "epoch": 375} {"train_loss": -8.771909713745117, "global_step": 63089, "epoch": 375} {"train_loss": -8.326543807983398, "global_step": 63090, "epoch": 375} {"train_loss": -8.838150978088379, "global_step": 63091, "epoch": 375} {"train_loss": -8.27759838104248, "global_step": 63092, "epoch": 375} {"train_loss": -8.225852966308594, "global_step": 63093, "epoch": 375} {"train_loss": -7.991663932800293, "global_step": 63094, "epoch": 375} {"train_loss": -8.281272888183594, "global_step": 63095, "epoch": 375} {"train_loss": -8.260009765625, "global_step": 63096, "epoch": 375} {"train_loss": -8.511396408081055, "global_step": 63097, "epoch": 375} {"train_loss": -8.522911071777344, "global_step": 63098, "epoch": 375} {"train_loss": -8.43861198425293, "global_step": 63099, "epoch": 375} {"train_loss": -8.344038009643555, "global_step": 63100, "epoch": 375} {"train_loss": -8.493102073669434, "global_step": 63101, "epoch": 375} {"train_loss": -8.477632522583008, "global_step": 63102, "epoch": 375} {"train_loss": -8.527566909790039, "global_step": 63103, "epoch": 375} {"train_loss": -8.276460647583008, "global_step": 63104, "epoch": 375} {"train_loss": -8.603889465332031, "global_step": 63105, "epoch": 375} {"train_loss": -8.577648162841797, "global_step": 63106, "epoch": 375} {"train_loss": -8.526586532592773, "global_step": 63107, "epoch": 375} {"train_loss": -8.685983657836914, "global_step": 63108, "epoch": 375} {"train_loss": -8.39267635345459, "global_step": 63109, "epoch": 375} {"train_loss": -8.705404281616211, "global_step": 63110, "epoch": 375} {"train_loss": -8.47708511352539, "global_step": 63111, "epoch": 375} {"train_loss": -8.58983325958252, "global_step": 63112, "epoch": 375} {"train_loss": -8.606325149536133, "global_step": 63113, "epoch": 375} {"train_loss": -8.495820999145508, "global_step": 63114, "epoch": 375} {"train_loss": -8.843942642211914, "global_step": 63115, "epoch": 375} {"train_loss": -8.704305648803711, "global_step": 63116, "epoch": 375} {"train_loss": -8.781197547912598, "global_step": 63117, "epoch": 375} {"train_loss": -8.737127304077148, "global_step": 63118, "epoch": 375} {"train_loss": -8.613293647766113, "global_step": 63119, "epoch": 375} {"train_loss": -8.650161743164062, "global_step": 63120, "epoch": 375} {"train_loss": -8.776975631713867, "global_step": 63121, "epoch": 375} {"train_loss": -8.918426513671875, "global_step": 63122, "epoch": 375} {"train_loss": -8.722017288208008, "global_step": 63123, "epoch": 375} {"train_loss": -8.836894035339355, "global_step": 63124, "epoch": 375} {"train_loss": -8.925073623657227, "global_step": 63125, "epoch": 375} {"train_loss": -8.822732925415039, "global_step": 63126, "epoch": 375} {"train_loss": -8.712137222290039, "global_step": 63127, "epoch": 375} {"train_loss": -8.928595542907715, "global_step": 63128, "epoch": 375} {"train_loss": -8.760868072509766, "global_step": 63129, "epoch": 375} {"train_loss": -8.85645866394043, "global_step": 63130, "epoch": 375} {"train_loss": -8.701265335083008, "global_step": 63131, "epoch": 375} {"train_loss": -9.164852142333984, "global_step": 63132, "epoch": 375} {"train_loss": -8.601301193237305, "global_step": 63133, "epoch": 375} {"train_loss": -8.840080261230469, "global_step": 63134, "epoch": 375} {"train_loss": -8.74499225616455, "global_step": 63135, "epoch": 375} {"train_loss": -8.905158996582031, "global_step": 63136, "epoch": 375} {"train_loss": -8.621528625488281, "global_step": 63137, "epoch": 375} {"train_loss": -8.924530982971191, "global_step": 63138, "epoch": 375} {"train_loss": -8.763195037841797, "global_step": 63139, "epoch": 375} {"train_loss": -8.466836929321289, "global_step": 63140, "epoch": 375} {"train_loss": -8.782866477966309, "global_step": 63141, "epoch": 375} {"train_loss": -8.713323593139648, "global_step": 63142, "epoch": 375} {"train_loss": -8.89858627319336, "global_step": 63143, "epoch": 375} {"train_loss": -8.521259307861328, "global_step": 63144, "epoch": 375} {"train_loss": -8.85491943359375, "global_step": 63145, "epoch": 375} {"train_loss": -8.759712219238281, "global_step": 63146, "epoch": 375} {"train_loss": -8.484382629394531, "global_step": 63147, "epoch": 375} {"train_loss": -8.821324348449707, "global_step": 63148, "epoch": 375} {"train_loss": -8.517711639404297, "global_step": 63149, "epoch": 375} {"train_loss": -8.601713180541992, "global_step": 63150, "epoch": 375} {"train_loss": -8.545308113098145, "global_step": 63151, "epoch": 375} {"train_loss": -8.528477668762207, "global_step": 63152, "epoch": 375} {"train_loss": -8.50408935546875, "global_step": 63153, "epoch": 375} {"train_loss": -8.379524230957031, "global_step": 63154, "epoch": 375} {"train_loss": -8.644824981689453, "global_step": 63155, "epoch": 375} {"train_loss": -8.767990112304688, "global_step": 63156, "epoch": 375} {"train_loss": -8.636425018310547, "global_step": 63157, "epoch": 375} {"train_loss": -8.55846118927002, "global_step": 63158, "epoch": 375} {"train_loss": -8.554387092590332, "global_step": 63159, "epoch": 375} {"train_loss": -8.639230728149414, "global_step": 63160, "epoch": 375} {"train_loss": -8.458301544189453, "global_step": 63161, "epoch": 375} {"train_loss": -8.529388427734375, "global_step": 63162, "epoch": 375} {"train_loss": -8.519916534423828, "global_step": 63163, "epoch": 375} {"train_loss": -8.4801025390625, "global_step": 63164, "epoch": 375} {"train_loss": -8.524162292480469, "global_step": 63165, "epoch": 375} {"train_loss": -8.398944854736328, "global_step": 63166, "epoch": 375} {"train_loss": -8.656244266600837, "global_step": 63167, "epoch": 375, "val_loss": 191319.03125, "train_action_mse_error": 5.36232852935791} {"train_loss": -8.381439208984375, "global_step": 63168, "epoch": 376} {"train_loss": -8.731560707092285, "global_step": 63169, "epoch": 376} {"train_loss": -8.717138290405273, "global_step": 63170, "epoch": 376} {"train_loss": -8.753652572631836, "global_step": 63171, "epoch": 376} {"train_loss": -8.605691909790039, "global_step": 63172, "epoch": 376} {"train_loss": -8.566069602966309, "global_step": 63173, "epoch": 376} {"train_loss": -8.603242874145508, "global_step": 63174, "epoch": 376} {"train_loss": -8.667654037475586, "global_step": 63175, "epoch": 376} {"train_loss": -8.508430480957031, "global_step": 63176, "epoch": 376} {"train_loss": -8.668235778808594, "global_step": 63177, "epoch": 376} {"train_loss": -8.72201156616211, "global_step": 63178, "epoch": 376} {"train_loss": -8.724193572998047, "global_step": 63179, "epoch": 376} {"train_loss": -8.854257583618164, "global_step": 63180, "epoch": 376} {"train_loss": -8.928868293762207, "global_step": 63181, "epoch": 376} {"train_loss": -8.818046569824219, "global_step": 63182, "epoch": 376} {"train_loss": -8.855049133300781, "global_step": 63183, "epoch": 376} {"train_loss": -8.738910675048828, "global_step": 63184, "epoch": 376} {"train_loss": -8.701116561889648, "global_step": 63185, "epoch": 376} {"train_loss": -8.697555541992188, "global_step": 63186, "epoch": 376} {"train_loss": -8.708654403686523, "global_step": 63187, "epoch": 376} {"train_loss": -8.737367630004883, "global_step": 63188, "epoch": 376} {"train_loss": -8.969156265258789, "global_step": 63189, "epoch": 376} {"train_loss": -8.744553565979004, "global_step": 63190, "epoch": 376} {"train_loss": -8.809560775756836, "global_step": 63191, "epoch": 376} {"train_loss": -8.81098461151123, "global_step": 63192, "epoch": 376} {"train_loss": -8.706550598144531, "global_step": 63193, "epoch": 376} {"train_loss": -9.004109382629395, "global_step": 63194, "epoch": 376} {"train_loss": -8.462736129760742, "global_step": 63195, "epoch": 376} {"train_loss": -8.812227249145508, "global_step": 63196, "epoch": 376} {"train_loss": -8.446660995483398, "global_step": 63197, "epoch": 376} {"train_loss": -8.501893997192383, "global_step": 63198, "epoch": 376} {"train_loss": -8.839275360107422, "global_step": 63199, "epoch": 376} {"train_loss": -8.411428451538086, "global_step": 63200, "epoch": 376} {"train_loss": -8.504199981689453, "global_step": 63201, "epoch": 376} {"train_loss": -8.92428207397461, "global_step": 63202, "epoch": 376} {"train_loss": -8.705953598022461, "global_step": 63203, "epoch": 376} {"train_loss": -8.422040939331055, "global_step": 63204, "epoch": 376} {"train_loss": -8.873712539672852, "global_step": 63205, "epoch": 376} {"train_loss": -8.689901351928711, "global_step": 63206, "epoch": 376} {"train_loss": -8.573837280273438, "global_step": 63207, "epoch": 376} {"train_loss": -8.642677307128906, "global_step": 63208, "epoch": 376} {"train_loss": -8.885364532470703, "global_step": 63209, "epoch": 376} {"train_loss": -8.771018028259277, "global_step": 63210, "epoch": 376} {"train_loss": -8.777631759643555, "global_step": 63211, "epoch": 376} {"train_loss": -8.76237678527832, "global_step": 63212, "epoch": 376} {"train_loss": -8.761761665344238, "global_step": 63213, "epoch": 376} {"train_loss": -8.833333015441895, "global_step": 63214, "epoch": 376} {"train_loss": -8.754494667053223, "global_step": 63215, "epoch": 376} {"train_loss": -8.868512153625488, "global_step": 63216, "epoch": 376} {"train_loss": -8.813783645629883, "global_step": 63217, "epoch": 376} {"train_loss": -8.877973556518555, "global_step": 63218, "epoch": 376} {"train_loss": -8.86595344543457, "global_step": 63219, "epoch": 376} {"train_loss": -8.703208923339844, "global_step": 63220, "epoch": 376} {"train_loss": -8.793319702148438, "global_step": 63221, "epoch": 376} {"train_loss": -8.685834884643555, "global_step": 63222, "epoch": 376} {"train_loss": -8.766023635864258, "global_step": 63223, "epoch": 376} {"train_loss": -8.688215255737305, "global_step": 63224, "epoch": 376} {"train_loss": -8.63218879699707, "global_step": 63225, "epoch": 376} {"train_loss": -8.674737930297852, "global_step": 63226, "epoch": 376} {"train_loss": -8.439521789550781, "global_step": 63227, "epoch": 376} {"train_loss": -8.8212251663208, "global_step": 63228, "epoch": 376} {"train_loss": -8.49673843383789, "global_step": 63229, "epoch": 376} {"train_loss": -8.806938171386719, "global_step": 63230, "epoch": 376} {"train_loss": -8.715192794799805, "global_step": 63231, "epoch": 376} {"train_loss": -8.972793579101562, "global_step": 63232, "epoch": 376} {"train_loss": -8.290695190429688, "global_step": 63233, "epoch": 376} {"train_loss": -8.85234260559082, "global_step": 63234, "epoch": 376} {"train_loss": -8.71984577178955, "global_step": 63235, "epoch": 376} {"train_loss": -8.964306831359863, "global_step": 63236, "epoch": 376} {"train_loss": -8.54454231262207, "global_step": 63237, "epoch": 376} {"train_loss": -8.67872142791748, "global_step": 63238, "epoch": 376} {"train_loss": -8.942102432250977, "global_step": 63239, "epoch": 376} {"train_loss": -8.717134475708008, "global_step": 63240, "epoch": 376} {"train_loss": -8.964110374450684, "global_step": 63241, "epoch": 376} {"train_loss": -9.095788955688477, "global_step": 63242, "epoch": 376} {"train_loss": -8.781906127929688, "global_step": 63243, "epoch": 376} {"train_loss": -8.84412956237793, "global_step": 63244, "epoch": 376} {"train_loss": -8.900542259216309, "global_step": 63245, "epoch": 376} {"train_loss": -8.832284927368164, "global_step": 63246, "epoch": 376} {"train_loss": -8.9678955078125, "global_step": 63247, "epoch": 376} {"train_loss": -8.60563850402832, "global_step": 63248, "epoch": 376} {"train_loss": -8.941082000732422, "global_step": 63249, "epoch": 376} {"train_loss": -8.706123352050781, "global_step": 63250, "epoch": 376} {"train_loss": -8.638958930969238, "global_step": 63251, "epoch": 376} {"train_loss": -8.988180160522461, "global_step": 63252, "epoch": 376} {"train_loss": -8.803909301757812, "global_step": 63253, "epoch": 376} {"train_loss": -9.02131462097168, "global_step": 63254, "epoch": 376} {"train_loss": -8.987663269042969, "global_step": 63255, "epoch": 376} {"train_loss": -8.765586853027344, "global_step": 63256, "epoch": 376} {"train_loss": -8.685882568359375, "global_step": 63257, "epoch": 376} {"train_loss": -8.897934913635254, "global_step": 63258, "epoch": 376} {"train_loss": -8.668173789978027, "global_step": 63259, "epoch": 376} {"train_loss": -8.764090538024902, "global_step": 63260, "epoch": 376} {"train_loss": -8.829541206359863, "global_step": 63261, "epoch": 376} {"train_loss": -8.687154769897461, "global_step": 63262, "epoch": 376} {"train_loss": -8.870185852050781, "global_step": 63263, "epoch": 376} {"train_loss": -8.737895965576172, "global_step": 63264, "epoch": 376} {"train_loss": -8.768289566040039, "global_step": 63265, "epoch": 376} {"train_loss": -8.838173866271973, "global_step": 63266, "epoch": 376} {"train_loss": -8.724241256713867, "global_step": 63267, "epoch": 376} {"train_loss": -8.559375762939453, "global_step": 63268, "epoch": 376} {"train_loss": -8.504022598266602, "global_step": 63269, "epoch": 376} {"train_loss": -8.295594215393066, "global_step": 63270, "epoch": 376} {"train_loss": -8.436655044555664, "global_step": 63271, "epoch": 376} {"train_loss": -8.71146297454834, "global_step": 63272, "epoch": 376} {"train_loss": -8.599069595336914, "global_step": 63273, "epoch": 376} {"train_loss": -8.676276206970215, "global_step": 63274, "epoch": 376} {"train_loss": -8.623708724975586, "global_step": 63275, "epoch": 376} {"train_loss": -8.675437927246094, "global_step": 63276, "epoch": 376} {"train_loss": -8.841146469116211, "global_step": 63277, "epoch": 376} {"train_loss": -8.445371627807617, "global_step": 63278, "epoch": 376} {"train_loss": -8.716432571411133, "global_step": 63279, "epoch": 376} {"train_loss": -8.570735931396484, "global_step": 63280, "epoch": 376} {"train_loss": -8.620511054992676, "global_step": 63281, "epoch": 376} {"train_loss": -8.682129859924316, "global_step": 63282, "epoch": 376} {"train_loss": -8.912099838256836, "global_step": 63283, "epoch": 376} {"train_loss": -8.642086029052734, "global_step": 63284, "epoch": 376} {"train_loss": -8.83871841430664, "global_step": 63285, "epoch": 376} {"train_loss": -8.904434204101562, "global_step": 63286, "epoch": 376} {"train_loss": -9.013496398925781, "global_step": 63287, "epoch": 376} {"train_loss": -8.690816879272461, "global_step": 63288, "epoch": 376} {"train_loss": -8.716672897338867, "global_step": 63289, "epoch": 376} {"train_loss": -8.73246955871582, "global_step": 63290, "epoch": 376} {"train_loss": -8.790437698364258, "global_step": 63291, "epoch": 376} {"train_loss": -8.977115631103516, "global_step": 63292, "epoch": 376} {"train_loss": -9.082625389099121, "global_step": 63293, "epoch": 376} {"train_loss": -9.035764694213867, "global_step": 63294, "epoch": 376} {"train_loss": -9.028984069824219, "global_step": 63295, "epoch": 376} {"train_loss": -8.805893898010254, "global_step": 63296, "epoch": 376} {"train_loss": -8.847455978393555, "global_step": 63297, "epoch": 376} {"train_loss": -9.151497840881348, "global_step": 63298, "epoch": 376} {"train_loss": -8.720949172973633, "global_step": 63299, "epoch": 376} {"train_loss": -9.003612518310547, "global_step": 63300, "epoch": 376} {"train_loss": -8.75090217590332, "global_step": 63301, "epoch": 376} {"train_loss": -8.819072723388672, "global_step": 63302, "epoch": 376} {"train_loss": -8.876188278198242, "global_step": 63303, "epoch": 376} {"train_loss": -8.469711303710938, "global_step": 63304, "epoch": 376} {"train_loss": -8.451393127441406, "global_step": 63305, "epoch": 376} {"train_loss": -8.691787719726562, "global_step": 63306, "epoch": 376} {"train_loss": -8.664142608642578, "global_step": 63307, "epoch": 376} {"train_loss": -8.420345306396484, "global_step": 63308, "epoch": 376} {"train_loss": -8.256431579589844, "global_step": 63309, "epoch": 376} {"train_loss": -8.238341331481934, "global_step": 63310, "epoch": 376} {"train_loss": -8.374911308288574, "global_step": 63311, "epoch": 376} {"train_loss": -8.037518501281738, "global_step": 63312, "epoch": 376} {"train_loss": -8.470233917236328, "global_step": 63313, "epoch": 376} {"train_loss": -7.927359104156494, "global_step": 63314, "epoch": 376} {"train_loss": -8.327046394348145, "global_step": 63315, "epoch": 376} {"train_loss": -8.16361141204834, "global_step": 63316, "epoch": 376} {"train_loss": -8.1234130859375, "global_step": 63317, "epoch": 376} {"train_loss": -8.153263092041016, "global_step": 63318, "epoch": 376} {"train_loss": -8.34720516204834, "global_step": 63319, "epoch": 376} {"train_loss": -8.503934860229492, "global_step": 63320, "epoch": 376} {"train_loss": -8.664714813232422, "global_step": 63321, "epoch": 376} {"train_loss": -8.365495681762695, "global_step": 63322, "epoch": 376} {"train_loss": -8.668336868286133, "global_step": 63323, "epoch": 376} {"train_loss": -8.373126029968262, "global_step": 63324, "epoch": 376} {"train_loss": -8.547407150268555, "global_step": 63325, "epoch": 376} {"train_loss": -8.611127853393555, "global_step": 63326, "epoch": 376} {"train_loss": -8.46122932434082, "global_step": 63327, "epoch": 376} {"train_loss": -8.580665588378906, "global_step": 63328, "epoch": 376} {"train_loss": -8.554291725158691, "global_step": 63329, "epoch": 376} {"train_loss": -8.510278701782227, "global_step": 63330, "epoch": 376} {"train_loss": -8.743881225585938, "global_step": 63331, "epoch": 376} {"train_loss": -8.708873748779297, "global_step": 63332, "epoch": 376} {"train_loss": -8.678947448730469, "global_step": 63333, "epoch": 376} {"train_loss": -8.45391845703125, "global_step": 63334, "epoch": 376} {"train_loss": -8.693014329388028, "global_step": 63335, "epoch": 376, "val_loss": 192740.453125} {"train_loss": -8.621919631958008, "global_step": 63336, "epoch": 377} {"train_loss": -8.443063735961914, "global_step": 63337, "epoch": 377} {"train_loss": -8.901958465576172, "global_step": 63338, "epoch": 377} {"train_loss": -8.724992752075195, "global_step": 63339, "epoch": 377} {"train_loss": -8.640917778015137, "global_step": 63340, "epoch": 377} {"train_loss": -8.699127197265625, "global_step": 63341, "epoch": 377} {"train_loss": -8.706249237060547, "global_step": 63342, "epoch": 377} {"train_loss": -8.715048789978027, "global_step": 63343, "epoch": 377} {"train_loss": -8.564360618591309, "global_step": 63344, "epoch": 377} {"train_loss": -8.751527786254883, "global_step": 63345, "epoch": 377} {"train_loss": -8.618423461914062, "global_step": 63346, "epoch": 377} {"train_loss": -9.014921188354492, "global_step": 63347, "epoch": 377} {"train_loss": -8.75076961517334, "global_step": 63348, "epoch": 377} {"train_loss": -9.037561416625977, "global_step": 63349, "epoch": 377} {"train_loss": -8.720537185668945, "global_step": 63350, "epoch": 377} {"train_loss": -8.791898727416992, "global_step": 63351, "epoch": 377} {"train_loss": -8.668804168701172, "global_step": 63352, "epoch": 377} {"train_loss": -8.707744598388672, "global_step": 63353, "epoch": 377} {"train_loss": -8.699341773986816, "global_step": 63354, "epoch": 377} {"train_loss": -8.854947090148926, "global_step": 63355, "epoch": 377} {"train_loss": -8.717000007629395, "global_step": 63356, "epoch": 377} {"train_loss": -8.660356521606445, "global_step": 63357, "epoch": 377} {"train_loss": -8.525779724121094, "global_step": 63358, "epoch": 377} {"train_loss": -8.71163558959961, "global_step": 63359, "epoch": 377} {"train_loss": -8.68470573425293, "global_step": 63360, "epoch": 377} {"train_loss": -8.961099624633789, "global_step": 63361, "epoch": 377} {"train_loss": -8.725431442260742, "global_step": 63362, "epoch": 377} {"train_loss": -8.547712326049805, "global_step": 63363, "epoch": 377} {"train_loss": -8.7567777633667, "global_step": 63364, "epoch": 377} {"train_loss": -8.806170463562012, "global_step": 63365, "epoch": 377} {"train_loss": -8.659977912902832, "global_step": 63366, "epoch": 377} {"train_loss": -8.571887969970703, "global_step": 63367, "epoch": 377} {"train_loss": -8.47912883758545, "global_step": 63368, "epoch": 377} {"train_loss": -8.562047958374023, "global_step": 63369, "epoch": 377} {"train_loss": -8.007284164428711, "global_step": 63370, "epoch": 377} {"train_loss": -8.558242797851562, "global_step": 63371, "epoch": 377} {"train_loss": -8.128301620483398, "global_step": 63372, "epoch": 377} {"train_loss": -8.665514945983887, "global_step": 63373, "epoch": 377} {"train_loss": -8.691787719726562, "global_step": 63374, "epoch": 377} {"train_loss": -8.654367446899414, "global_step": 63375, "epoch": 377} {"train_loss": -8.566625595092773, "global_step": 63376, "epoch": 377} {"train_loss": -8.779635429382324, "global_step": 63377, "epoch": 377} {"train_loss": -8.670608520507812, "global_step": 63378, "epoch": 377} {"train_loss": -8.688600540161133, "global_step": 63379, "epoch": 377} {"train_loss": -8.765111923217773, "global_step": 63380, "epoch": 377} {"train_loss": -8.626197814941406, "global_step": 63381, "epoch": 377} {"train_loss": -8.903311729431152, "global_step": 63382, "epoch": 377} {"train_loss": -8.869359970092773, "global_step": 63383, "epoch": 377} {"train_loss": -8.910317420959473, "global_step": 63384, "epoch": 377} {"train_loss": -8.665666580200195, "global_step": 63385, "epoch": 377} {"train_loss": -8.570404052734375, "global_step": 63386, "epoch": 377} {"train_loss": -8.744649887084961, "global_step": 63387, "epoch": 377} {"train_loss": -8.721990585327148, "global_step": 63388, "epoch": 377} {"train_loss": -8.78573989868164, "global_step": 63389, "epoch": 377} {"train_loss": -8.635629653930664, "global_step": 63390, "epoch": 377} {"train_loss": -8.703424453735352, "global_step": 63391, "epoch": 377} {"train_loss": -8.79468822479248, "global_step": 63392, "epoch": 377} {"train_loss": -8.772318840026855, "global_step": 63393, "epoch": 377} {"train_loss": -8.433797836303711, "global_step": 63394, "epoch": 377} {"train_loss": -8.996334075927734, "global_step": 63395, "epoch": 377} {"train_loss": -8.54044246673584, "global_step": 63396, "epoch": 377} {"train_loss": -8.555305480957031, "global_step": 63397, "epoch": 377} {"train_loss": -8.778177261352539, "global_step": 63398, "epoch": 377} {"train_loss": -8.860841751098633, "global_step": 63399, "epoch": 377} {"train_loss": -8.89985466003418, "global_step": 63400, "epoch": 377} {"train_loss": -8.727041244506836, "global_step": 63401, "epoch": 377} {"train_loss": -8.826823234558105, "global_step": 63402, "epoch": 377} {"train_loss": -8.999089241027832, "global_step": 63403, "epoch": 377} {"train_loss": -8.735899925231934, "global_step": 63404, "epoch": 377} {"train_loss": -8.86023998260498, "global_step": 63405, "epoch": 377} {"train_loss": -8.531319618225098, "global_step": 63406, "epoch": 377} {"train_loss": -8.747848510742188, "global_step": 63407, "epoch": 377} {"train_loss": -8.790228843688965, "global_step": 63408, "epoch": 377} {"train_loss": -8.911075592041016, "global_step": 63409, "epoch": 377} {"train_loss": -9.041980743408203, "global_step": 63410, "epoch": 377} {"train_loss": -9.02015209197998, "global_step": 63411, "epoch": 377} {"train_loss": -8.760965347290039, "global_step": 63412, "epoch": 377} {"train_loss": -8.73841381072998, "global_step": 63413, "epoch": 377} {"train_loss": -8.816286087036133, "global_step": 63414, "epoch": 377} {"train_loss": -8.919198036193848, "global_step": 63415, "epoch": 377} {"train_loss": -8.7203369140625, "global_step": 63416, "epoch": 377} {"train_loss": -8.901778221130371, "global_step": 63417, "epoch": 377} {"train_loss": -8.785125732421875, "global_step": 63418, "epoch": 377} {"train_loss": -8.833476066589355, "global_step": 63419, "epoch": 377} {"train_loss": -8.981241226196289, "global_step": 63420, "epoch": 377} {"train_loss": -8.740764617919922, "global_step": 63421, "epoch": 377} {"train_loss": -8.726760864257812, "global_step": 63422, "epoch": 377} {"train_loss": -8.679197311401367, "global_step": 63423, "epoch": 377} {"train_loss": -9.009689331054688, "global_step": 63424, "epoch": 377} {"train_loss": -8.966354370117188, "global_step": 63425, "epoch": 377} {"train_loss": -8.805047988891602, "global_step": 63426, "epoch": 377} {"train_loss": -8.699747085571289, "global_step": 63427, "epoch": 377} {"train_loss": -8.791427612304688, "global_step": 63428, "epoch": 377} {"train_loss": -8.539762496948242, "global_step": 63429, "epoch": 377} {"train_loss": -8.493167877197266, "global_step": 63430, "epoch": 377} {"train_loss": -8.734504699707031, "global_step": 63431, "epoch": 377} {"train_loss": -8.722257614135742, "global_step": 63432, "epoch": 377} {"train_loss": -8.828487396240234, "global_step": 63433, "epoch": 377} {"train_loss": -8.636743545532227, "global_step": 63434, "epoch": 377} {"train_loss": -8.595634460449219, "global_step": 63435, "epoch": 377} {"train_loss": -8.67622184753418, "global_step": 63436, "epoch": 377} {"train_loss": -8.789592742919922, "global_step": 63437, "epoch": 377} {"train_loss": -8.755964279174805, "global_step": 63438, "epoch": 377} {"train_loss": -8.795724868774414, "global_step": 63439, "epoch": 377} {"train_loss": -8.76101303100586, "global_step": 63440, "epoch": 377} {"train_loss": -8.577873229980469, "global_step": 63441, "epoch": 377} {"train_loss": -8.881107330322266, "global_step": 63442, "epoch": 377} {"train_loss": -8.799398422241211, "global_step": 63443, "epoch": 377} {"train_loss": -8.700657844543457, "global_step": 63444, "epoch": 377} {"train_loss": -8.877140045166016, "global_step": 63445, "epoch": 377} {"train_loss": -8.834644317626953, "global_step": 63446, "epoch": 377} {"train_loss": -8.909158706665039, "global_step": 63447, "epoch": 377} {"train_loss": -8.735370635986328, "global_step": 63448, "epoch": 377} {"train_loss": -8.718866348266602, "global_step": 63449, "epoch": 377} {"train_loss": -8.82054615020752, "global_step": 63450, "epoch": 377} {"train_loss": -8.755562782287598, "global_step": 63451, "epoch": 377} {"train_loss": -9.10213851928711, "global_step": 63452, "epoch": 377} {"train_loss": -8.510700225830078, "global_step": 63453, "epoch": 377} {"train_loss": -8.678299903869629, "global_step": 63454, "epoch": 377} {"train_loss": -8.721488952636719, "global_step": 63455, "epoch": 377} {"train_loss": -8.9132080078125, "global_step": 63456, "epoch": 377} {"train_loss": -8.764131546020508, "global_step": 63457, "epoch": 377} {"train_loss": -8.651253700256348, "global_step": 63458, "epoch": 377} {"train_loss": -8.851776123046875, "global_step": 63459, "epoch": 377} {"train_loss": -8.830415725708008, "global_step": 63460, "epoch": 377} {"train_loss": -9.059881210327148, "global_step": 63461, "epoch": 377} {"train_loss": -8.753684043884277, "global_step": 63462, "epoch": 377} {"train_loss": -8.89107894897461, "global_step": 63463, "epoch": 377} {"train_loss": -8.78700065612793, "global_step": 63464, "epoch": 377} {"train_loss": -9.107150077819824, "global_step": 63465, "epoch": 377} {"train_loss": -8.631712913513184, "global_step": 63466, "epoch": 377} {"train_loss": -8.87313461303711, "global_step": 63467, "epoch": 377} {"train_loss": -8.430952072143555, "global_step": 63468, "epoch": 377} {"train_loss": -8.781652450561523, "global_step": 63469, "epoch": 377} {"train_loss": -8.449599266052246, "global_step": 63470, "epoch": 377} {"train_loss": -8.903300285339355, "global_step": 63471, "epoch": 377} {"train_loss": -8.581925392150879, "global_step": 63472, "epoch": 377} {"train_loss": -8.566915512084961, "global_step": 63473, "epoch": 377} {"train_loss": -8.727542877197266, "global_step": 63474, "epoch": 377} {"train_loss": -8.680840492248535, "global_step": 63475, "epoch": 377} {"train_loss": -8.539039611816406, "global_step": 63476, "epoch": 377} {"train_loss": -8.693318367004395, "global_step": 63477, "epoch": 377} {"train_loss": -8.64360523223877, "global_step": 63478, "epoch": 377} {"train_loss": -8.69050121307373, "global_step": 63479, "epoch": 377} {"train_loss": -8.663063049316406, "global_step": 63480, "epoch": 377} {"train_loss": -8.841484069824219, "global_step": 63481, "epoch": 377} {"train_loss": -8.677399635314941, "global_step": 63482, "epoch": 377} {"train_loss": -8.77979564666748, "global_step": 63483, "epoch": 377} {"train_loss": -8.824056625366211, "global_step": 63484, "epoch": 377} {"train_loss": -8.651374816894531, "global_step": 63485, "epoch": 377} {"train_loss": -8.813539505004883, "global_step": 63486, "epoch": 377} {"train_loss": -8.667025566101074, "global_step": 63487, "epoch": 377} {"train_loss": -8.86739730834961, "global_step": 63488, "epoch": 377} {"train_loss": -8.478772163391113, "global_step": 63489, "epoch": 377} {"train_loss": -8.877311706542969, "global_step": 63490, "epoch": 377} {"train_loss": -8.66314697265625, "global_step": 63491, "epoch": 377} {"train_loss": -8.923013687133789, "global_step": 63492, "epoch": 377} {"train_loss": -8.405664443969727, "global_step": 63493, "epoch": 377} {"train_loss": -8.952096939086914, "global_step": 63494, "epoch": 377} {"train_loss": -8.741735458374023, "global_step": 63495, "epoch": 377} {"train_loss": -8.773667335510254, "global_step": 63496, "epoch": 377} {"train_loss": -8.891298294067383, "global_step": 63497, "epoch": 377} {"train_loss": -8.8460054397583, "global_step": 63498, "epoch": 377} {"train_loss": -8.522185325622559, "global_step": 63499, "epoch": 377} {"train_loss": -8.842710494995117, "global_step": 63500, "epoch": 377} {"train_loss": -8.73129653930664, "global_step": 63501, "epoch": 377} {"train_loss": -8.807076454162598, "global_step": 63502, "epoch": 377} {"train_loss": -8.73562661239079, "global_step": 63503, "epoch": 377, "val_loss": 190218.234375} {"train_loss": -8.892663955688477, "global_step": 63504, "epoch": 378} {"train_loss": -8.713905334472656, "global_step": 63505, "epoch": 378} {"train_loss": -8.892853736877441, "global_step": 63506, "epoch": 378} {"train_loss": -8.733648300170898, "global_step": 63507, "epoch": 378} {"train_loss": -9.040689468383789, "global_step": 63508, "epoch": 378} {"train_loss": -8.867508888244629, "global_step": 63509, "epoch": 378} {"train_loss": -8.801248550415039, "global_step": 63510, "epoch": 378} {"train_loss": -8.789682388305664, "global_step": 63511, "epoch": 378} {"train_loss": -8.906460762023926, "global_step": 63512, "epoch": 378} {"train_loss": -8.862136840820312, "global_step": 63513, "epoch": 378} {"train_loss": -8.74416732788086, "global_step": 63514, "epoch": 378} {"train_loss": -8.944356918334961, "global_step": 63515, "epoch": 378} {"train_loss": -8.747577667236328, "global_step": 63516, "epoch": 378} {"train_loss": -8.892660140991211, "global_step": 63517, "epoch": 378} {"train_loss": -8.660179138183594, "global_step": 63518, "epoch": 378} {"train_loss": -8.821524620056152, "global_step": 63519, "epoch": 378} {"train_loss": -8.629650115966797, "global_step": 63520, "epoch": 378} {"train_loss": -8.870390892028809, "global_step": 63521, "epoch": 378} {"train_loss": -8.68819808959961, "global_step": 63522, "epoch": 378} {"train_loss": -8.863788604736328, "global_step": 63523, "epoch": 378} {"train_loss": -8.592105865478516, "global_step": 63524, "epoch": 378} {"train_loss": -8.63856315612793, "global_step": 63525, "epoch": 378} {"train_loss": -8.544638633728027, "global_step": 63526, "epoch": 378} {"train_loss": -8.740041732788086, "global_step": 63527, "epoch": 378} {"train_loss": -8.46788215637207, "global_step": 63528, "epoch": 378} {"train_loss": -8.838756561279297, "global_step": 63529, "epoch": 378} {"train_loss": -8.763824462890625, "global_step": 63530, "epoch": 378} {"train_loss": -8.570356369018555, "global_step": 63531, "epoch": 378} {"train_loss": -8.61040210723877, "global_step": 63532, "epoch": 378} {"train_loss": -8.527013778686523, "global_step": 63533, "epoch": 378} {"train_loss": -8.969676971435547, "global_step": 63534, "epoch": 378} {"train_loss": -8.860700607299805, "global_step": 63535, "epoch": 378} {"train_loss": -8.624198913574219, "global_step": 63536, "epoch": 378} {"train_loss": -8.61693000793457, "global_step": 63537, "epoch": 378} {"train_loss": -8.891314506530762, "global_step": 63538, "epoch": 378} {"train_loss": -8.700613021850586, "global_step": 63539, "epoch": 378} {"train_loss": -8.86347770690918, "global_step": 63540, "epoch": 378} {"train_loss": -8.95550537109375, "global_step": 63541, "epoch": 378} {"train_loss": -8.653888702392578, "global_step": 63542, "epoch": 378} {"train_loss": -8.872325897216797, "global_step": 63543, "epoch": 378} {"train_loss": -8.71623420715332, "global_step": 63544, "epoch": 378} {"train_loss": -8.711005210876465, "global_step": 63545, "epoch": 378} {"train_loss": -8.743043899536133, "global_step": 63546, "epoch": 378} {"train_loss": -8.986190795898438, "global_step": 63547, "epoch": 378} {"train_loss": -8.751897811889648, "global_step": 63548, "epoch": 378} {"train_loss": -8.902983665466309, "global_step": 63549, "epoch": 378} {"train_loss": -8.978453636169434, "global_step": 63550, "epoch": 378} {"train_loss": -8.830973625183105, "global_step": 63551, "epoch": 378} {"train_loss": -8.770635604858398, "global_step": 63552, "epoch": 378} {"train_loss": -8.95363712310791, "global_step": 63553, "epoch": 378} {"train_loss": -8.824380874633789, "global_step": 63554, "epoch": 378} {"train_loss": -8.742879867553711, "global_step": 63555, "epoch": 378} {"train_loss": -8.926862716674805, "global_step": 63556, "epoch": 378} {"train_loss": -8.961153030395508, "global_step": 63557, "epoch": 378} {"train_loss": -8.771219253540039, "global_step": 63558, "epoch": 378} {"train_loss": -8.762054443359375, "global_step": 63559, "epoch": 378} {"train_loss": -8.977286338806152, "global_step": 63560, "epoch": 378} {"train_loss": -8.826519012451172, "global_step": 63561, "epoch": 378} {"train_loss": -8.899984359741211, "global_step": 63562, "epoch": 378} {"train_loss": -9.13056468963623, "global_step": 63563, "epoch": 378} {"train_loss": -8.951080322265625, "global_step": 63564, "epoch": 378} {"train_loss": -9.051653861999512, "global_step": 63565, "epoch": 378} {"train_loss": -8.908134460449219, "global_step": 63566, "epoch": 378} {"train_loss": -8.9989013671875, "global_step": 63567, "epoch": 378} {"train_loss": -8.809537887573242, "global_step": 63568, "epoch": 378} {"train_loss": -9.006410598754883, "global_step": 63569, "epoch": 378} {"train_loss": -8.907659530639648, "global_step": 63570, "epoch": 378} {"train_loss": -8.827037811279297, "global_step": 63571, "epoch": 378} {"train_loss": -8.871230125427246, "global_step": 63572, "epoch": 378} {"train_loss": -8.767361640930176, "global_step": 63573, "epoch": 378} {"train_loss": -8.880670547485352, "global_step": 63574, "epoch": 378} {"train_loss": -8.72946548461914, "global_step": 63575, "epoch": 378} {"train_loss": -8.586681365966797, "global_step": 63576, "epoch": 378} {"train_loss": -8.92414665222168, "global_step": 63577, "epoch": 378} {"train_loss": -8.59492301940918, "global_step": 63578, "epoch": 378} {"train_loss": -8.453568458557129, "global_step": 63579, "epoch": 378} {"train_loss": -8.370964050292969, "global_step": 63580, "epoch": 378} {"train_loss": -8.074750900268555, "global_step": 63581, "epoch": 378} {"train_loss": -7.886818885803223, "global_step": 63582, "epoch": 378} {"train_loss": -7.19724178314209, "global_step": 63583, "epoch": 378} {"train_loss": -8.12729549407959, "global_step": 63584, "epoch": 378} {"train_loss": -8.356414794921875, "global_step": 63585, "epoch": 378} {"train_loss": -8.162639617919922, "global_step": 63586, "epoch": 378} {"train_loss": -8.255203247070312, "global_step": 63587, "epoch": 378} {"train_loss": -8.224763870239258, "global_step": 63588, "epoch": 378} {"train_loss": -8.20689582824707, "global_step": 63589, "epoch": 378} {"train_loss": -8.408159255981445, "global_step": 63590, "epoch": 378} {"train_loss": -8.37542724609375, "global_step": 63591, "epoch": 378} {"train_loss": -8.431676864624023, "global_step": 63592, "epoch": 378} {"train_loss": -8.302003860473633, "global_step": 63593, "epoch": 378} {"train_loss": -8.580707550048828, "global_step": 63594, "epoch": 378} {"train_loss": -8.528416633605957, "global_step": 63595, "epoch": 378} {"train_loss": -8.576372146606445, "global_step": 63596, "epoch": 378} {"train_loss": -8.45930290222168, "global_step": 63597, "epoch": 378} {"train_loss": -8.544046401977539, "global_step": 63598, "epoch": 378} {"train_loss": -8.604084968566895, "global_step": 63599, "epoch": 378} {"train_loss": -8.417750358581543, "global_step": 63600, "epoch": 378} {"train_loss": -8.55184555053711, "global_step": 63601, "epoch": 378} {"train_loss": -8.599769592285156, "global_step": 63602, "epoch": 378} {"train_loss": -8.696670532226562, "global_step": 63603, "epoch": 378} {"train_loss": -8.658019065856934, "global_step": 63604, "epoch": 378} {"train_loss": -8.64475154876709, "global_step": 63605, "epoch": 378} {"train_loss": -8.707058906555176, "global_step": 63606, "epoch": 378} {"train_loss": -8.557255744934082, "global_step": 63607, "epoch": 378} {"train_loss": -8.836034774780273, "global_step": 63608, "epoch": 378} {"train_loss": -8.597471237182617, "global_step": 63609, "epoch": 378} {"train_loss": -8.748023986816406, "global_step": 63610, "epoch": 378} {"train_loss": -8.811116218566895, "global_step": 63611, "epoch": 378} {"train_loss": -8.875999450683594, "global_step": 63612, "epoch": 378} {"train_loss": -9.068000793457031, "global_step": 63613, "epoch": 378} {"train_loss": -9.018649101257324, "global_step": 63614, "epoch": 378} {"train_loss": -8.885722160339355, "global_step": 63615, "epoch": 378} {"train_loss": -9.055303573608398, "global_step": 63616, "epoch": 378} {"train_loss": -8.891447067260742, "global_step": 63617, "epoch": 378} {"train_loss": -8.645574569702148, "global_step": 63618, "epoch": 378} {"train_loss": -8.756689071655273, "global_step": 63619, "epoch": 378} {"train_loss": -8.798164367675781, "global_step": 63620, "epoch": 378} {"train_loss": -8.83437728881836, "global_step": 63621, "epoch": 378} {"train_loss": -9.058029174804688, "global_step": 63622, "epoch": 378} {"train_loss": -8.47616958618164, "global_step": 63623, "epoch": 378} {"train_loss": -8.667366981506348, "global_step": 63624, "epoch": 378} {"train_loss": -8.529304504394531, "global_step": 63625, "epoch": 378} {"train_loss": -8.725305557250977, "global_step": 63626, "epoch": 378} {"train_loss": -8.233901023864746, "global_step": 63627, "epoch": 378} {"train_loss": -8.715519905090332, "global_step": 63628, "epoch": 378} {"train_loss": -8.35993766784668, "global_step": 63629, "epoch": 378} {"train_loss": -8.419647216796875, "global_step": 63630, "epoch": 378} {"train_loss": -8.797067642211914, "global_step": 63631, "epoch": 378} {"train_loss": -8.739096641540527, "global_step": 63632, "epoch": 378} {"train_loss": -8.960731506347656, "global_step": 63633, "epoch": 378} {"train_loss": -8.686736106872559, "global_step": 63634, "epoch": 378} {"train_loss": -8.644350051879883, "global_step": 63635, "epoch": 378} {"train_loss": -8.708948135375977, "global_step": 63636, "epoch": 378} {"train_loss": -8.762889862060547, "global_step": 63637, "epoch": 378} {"train_loss": -8.779096603393555, "global_step": 63638, "epoch": 378} {"train_loss": -8.749052047729492, "global_step": 63639, "epoch": 378} {"train_loss": -8.664896011352539, "global_step": 63640, "epoch": 378} {"train_loss": -8.655421257019043, "global_step": 63641, "epoch": 378} {"train_loss": -8.696401596069336, "global_step": 63642, "epoch": 378} {"train_loss": -8.730513572692871, "global_step": 63643, "epoch": 378} {"train_loss": -8.836018562316895, "global_step": 63644, "epoch": 378} {"train_loss": -8.914008140563965, "global_step": 63645, "epoch": 378} {"train_loss": -8.932794570922852, "global_step": 63646, "epoch": 378} {"train_loss": -8.835105895996094, "global_step": 63647, "epoch": 378} {"train_loss": -8.670083999633789, "global_step": 63648, "epoch": 378} {"train_loss": -9.002706527709961, "global_step": 63649, "epoch": 378} {"train_loss": -8.942855834960938, "global_step": 63650, "epoch": 378} {"train_loss": -8.822381973266602, "global_step": 63651, "epoch": 378} {"train_loss": -8.901002883911133, "global_step": 63652, "epoch": 378} {"train_loss": -9.007333755493164, "global_step": 63653, "epoch": 378} {"train_loss": -8.83299732208252, "global_step": 63654, "epoch": 378} {"train_loss": -8.612452507019043, "global_step": 63655, "epoch": 378} {"train_loss": -8.851978302001953, "global_step": 63656, "epoch": 378} {"train_loss": -8.904340744018555, "global_step": 63657, "epoch": 378} {"train_loss": -8.766288757324219, "global_step": 63658, "epoch": 378} {"train_loss": -8.770130157470703, "global_step": 63659, "epoch": 378} {"train_loss": -8.958992958068848, "global_step": 63660, "epoch": 378} {"train_loss": -8.806520462036133, "global_step": 63661, "epoch": 378} {"train_loss": -8.93400764465332, "global_step": 63662, "epoch": 378} {"train_loss": -8.688356399536133, "global_step": 63663, "epoch": 378} {"train_loss": -8.739927291870117, "global_step": 63664, "epoch": 378} {"train_loss": -8.864588737487793, "global_step": 63665, "epoch": 378} {"train_loss": -8.695613861083984, "global_step": 63666, "epoch": 378} {"train_loss": -8.736188888549805, "global_step": 63667, "epoch": 378} {"train_loss": -8.45916748046875, "global_step": 63668, "epoch": 378} {"train_loss": -8.651121139526367, "global_step": 63669, "epoch": 378} {"train_loss": -8.647621154785156, "global_step": 63670, "epoch": 378} {"train_loss": -8.716746557326545, "global_step": 63671, "epoch": 378, "val_loss": 192617.296875} {"train_loss": -8.864072799682617, "global_step": 63672, "epoch": 379} {"train_loss": -8.602166175842285, "global_step": 63673, "epoch": 379} {"train_loss": -8.540998458862305, "global_step": 63674, "epoch": 379} {"train_loss": -8.511009216308594, "global_step": 63675, "epoch": 379} {"train_loss": -8.634366035461426, "global_step": 63676, "epoch": 379} {"train_loss": -8.303102493286133, "global_step": 63677, "epoch": 379} {"train_loss": -8.544366836547852, "global_step": 63678, "epoch": 379} {"train_loss": -8.161552429199219, "global_step": 63679, "epoch": 379} {"train_loss": -8.741891860961914, "global_step": 63680, "epoch": 379} {"train_loss": -8.375734329223633, "global_step": 63681, "epoch": 379} {"train_loss": -8.613136291503906, "global_step": 63682, "epoch": 379} {"train_loss": -8.651908874511719, "global_step": 63683, "epoch": 379} {"train_loss": -8.67987060546875, "global_step": 63684, "epoch": 379} {"train_loss": -8.367177963256836, "global_step": 63685, "epoch": 379} {"train_loss": -8.755434036254883, "global_step": 63686, "epoch": 379} {"train_loss": -8.848089218139648, "global_step": 63687, "epoch": 379} {"train_loss": -8.598283767700195, "global_step": 63688, "epoch": 379} {"train_loss": -8.683399200439453, "global_step": 63689, "epoch": 379} {"train_loss": -8.651618003845215, "global_step": 63690, "epoch": 379} {"train_loss": -8.4517240524292, "global_step": 63691, "epoch": 379} {"train_loss": -8.728324890136719, "global_step": 63692, "epoch": 379} {"train_loss": -8.74450969696045, "global_step": 63693, "epoch": 379} {"train_loss": -8.584334373474121, "global_step": 63694, "epoch": 379} {"train_loss": -8.663578033447266, "global_step": 63695, "epoch": 379} {"train_loss": -8.68580150604248, "global_step": 63696, "epoch": 379} {"train_loss": -8.84521198272705, "global_step": 63697, "epoch": 379} {"train_loss": -8.692644119262695, "global_step": 63698, "epoch": 379} {"train_loss": -8.937514305114746, "global_step": 63699, "epoch": 379} {"train_loss": -8.81552505493164, "global_step": 63700, "epoch": 379} {"train_loss": -8.820860862731934, "global_step": 63701, "epoch": 379} {"train_loss": -8.735511779785156, "global_step": 63702, "epoch": 379} {"train_loss": -8.929518699645996, "global_step": 63703, "epoch": 379} {"train_loss": -9.076042175292969, "global_step": 63704, "epoch": 379} {"train_loss": -9.036311149597168, "global_step": 63705, "epoch": 379} {"train_loss": -8.958690643310547, "global_step": 63706, "epoch": 379} {"train_loss": -8.78095817565918, "global_step": 63707, "epoch": 379} {"train_loss": -8.948975563049316, "global_step": 63708, "epoch": 379} {"train_loss": -8.542634963989258, "global_step": 63709, "epoch": 379} {"train_loss": -8.750619888305664, "global_step": 63710, "epoch": 379} {"train_loss": -8.66054916381836, "global_step": 63711, "epoch": 379} {"train_loss": -8.777725219726562, "global_step": 63712, "epoch": 379} {"train_loss": -8.776946067810059, "global_step": 63713, "epoch": 379} {"train_loss": -8.684581756591797, "global_step": 63714, "epoch": 379} {"train_loss": -8.803858757019043, "global_step": 63715, "epoch": 379} {"train_loss": -8.896234512329102, "global_step": 63716, "epoch": 379} {"train_loss": -8.950021743774414, "global_step": 63717, "epoch": 379} {"train_loss": -8.680187225341797, "global_step": 63718, "epoch": 379} {"train_loss": -8.791704177856445, "global_step": 63719, "epoch": 379} {"train_loss": -8.815670013427734, "global_step": 63720, "epoch": 379} {"train_loss": -8.6790189743042, "global_step": 63721, "epoch": 379} {"train_loss": -8.569769859313965, "global_step": 63722, "epoch": 379} {"train_loss": -8.838797569274902, "global_step": 63723, "epoch": 379} {"train_loss": -8.939599990844727, "global_step": 63724, "epoch": 379} {"train_loss": -8.695026397705078, "global_step": 63725, "epoch": 379} {"train_loss": -8.826042175292969, "global_step": 63726, "epoch": 379} {"train_loss": -8.75427532196045, "global_step": 63727, "epoch": 379} {"train_loss": -8.797454833984375, "global_step": 63728, "epoch": 379} {"train_loss": -8.801475524902344, "global_step": 63729, "epoch": 379} {"train_loss": -8.870316505432129, "global_step": 63730, "epoch": 379} {"train_loss": -8.69426155090332, "global_step": 63731, "epoch": 379} {"train_loss": -9.015710830688477, "global_step": 63732, "epoch": 379} {"train_loss": -8.801019668579102, "global_step": 63733, "epoch": 379} {"train_loss": -8.805160522460938, "global_step": 63734, "epoch": 379} {"train_loss": -8.777137756347656, "global_step": 63735, "epoch": 379} {"train_loss": -8.631299018859863, "global_step": 63736, "epoch": 379} {"train_loss": -8.902206420898438, "global_step": 63737, "epoch": 379} {"train_loss": -8.612117767333984, "global_step": 63738, "epoch": 379} {"train_loss": -8.668864250183105, "global_step": 63739, "epoch": 379} {"train_loss": -8.852066040039062, "global_step": 63740, "epoch": 379} {"train_loss": -8.773968696594238, "global_step": 63741, "epoch": 379} {"train_loss": -8.907435417175293, "global_step": 63742, "epoch": 379} {"train_loss": -8.615739822387695, "global_step": 63743, "epoch": 379} {"train_loss": -8.85086441040039, "global_step": 63744, "epoch": 379} {"train_loss": -8.523717880249023, "global_step": 63745, "epoch": 379} {"train_loss": -8.95461368560791, "global_step": 63746, "epoch": 379} {"train_loss": -8.522144317626953, "global_step": 63747, "epoch": 379} {"train_loss": -8.875083923339844, "global_step": 63748, "epoch": 379} {"train_loss": -8.543632507324219, "global_step": 63749, "epoch": 379} {"train_loss": -8.879861831665039, "global_step": 63750, "epoch": 379} {"train_loss": -8.573591232299805, "global_step": 63751, "epoch": 379} {"train_loss": -8.631166458129883, "global_step": 63752, "epoch": 379} {"train_loss": -8.522143363952637, "global_step": 63753, "epoch": 379} {"train_loss": -8.609512329101562, "global_step": 63754, "epoch": 379} {"train_loss": -8.632108688354492, "global_step": 63755, "epoch": 379} {"train_loss": -8.514223098754883, "global_step": 63756, "epoch": 379} {"train_loss": -8.583511352539062, "global_step": 63757, "epoch": 379} {"train_loss": -8.71255874633789, "global_step": 63758, "epoch": 379} {"train_loss": -8.564268112182617, "global_step": 63759, "epoch": 379} {"train_loss": -8.901426315307617, "global_step": 63760, "epoch": 379} {"train_loss": -8.853292465209961, "global_step": 63761, "epoch": 379} {"train_loss": -8.511919021606445, "global_step": 63762, "epoch": 379} {"train_loss": -8.665901184082031, "global_step": 63763, "epoch": 379} {"train_loss": -8.761550903320312, "global_step": 63764, "epoch": 379} {"train_loss": -8.806039810180664, "global_step": 63765, "epoch": 379} {"train_loss": -8.44372272491455, "global_step": 63766, "epoch": 379} {"train_loss": -8.849063873291016, "global_step": 63767, "epoch": 379} {"train_loss": -8.888436317443848, "global_step": 63768, "epoch": 379} {"train_loss": -8.800012588500977, "global_step": 63769, "epoch": 379} {"train_loss": -8.699901580810547, "global_step": 63770, "epoch": 379} {"train_loss": -8.918015480041504, "global_step": 63771, "epoch": 379} {"train_loss": -8.869905471801758, "global_step": 63772, "epoch": 379} {"train_loss": -8.874067306518555, "global_step": 63773, "epoch": 379} {"train_loss": -8.877828598022461, "global_step": 63774, "epoch": 379} {"train_loss": -8.66612720489502, "global_step": 63775, "epoch": 379} {"train_loss": -8.657552719116211, "global_step": 63776, "epoch": 379} {"train_loss": -8.743907928466797, "global_step": 63777, "epoch": 379} {"train_loss": -8.735617637634277, "global_step": 63778, "epoch": 379} {"train_loss": -8.706403732299805, "global_step": 63779, "epoch": 379} {"train_loss": -8.876724243164062, "global_step": 63780, "epoch": 379} {"train_loss": -8.814502716064453, "global_step": 63781, "epoch": 379} {"train_loss": -8.814144134521484, "global_step": 63782, "epoch": 379} {"train_loss": -8.870092391967773, "global_step": 63783, "epoch": 379} {"train_loss": -8.668901443481445, "global_step": 63784, "epoch": 379} {"train_loss": -8.915456771850586, "global_step": 63785, "epoch": 379} {"train_loss": -8.709677696228027, "global_step": 63786, "epoch": 379} {"train_loss": -8.6657075881958, "global_step": 63787, "epoch": 379} {"train_loss": -8.869287490844727, "global_step": 63788, "epoch": 379} {"train_loss": -8.843156814575195, "global_step": 63789, "epoch": 379} {"train_loss": -8.67380142211914, "global_step": 63790, "epoch": 379} {"train_loss": -8.7630033493042, "global_step": 63791, "epoch": 379} {"train_loss": -8.868841171264648, "global_step": 63792, "epoch": 379} {"train_loss": -8.815644264221191, "global_step": 63793, "epoch": 379} {"train_loss": -8.87101936340332, "global_step": 63794, "epoch": 379} {"train_loss": -8.839695930480957, "global_step": 63795, "epoch": 379} {"train_loss": -8.845200538635254, "global_step": 63796, "epoch": 379} {"train_loss": -8.771865844726562, "global_step": 63797, "epoch": 379} {"train_loss": -8.946615219116211, "global_step": 63798, "epoch": 379} {"train_loss": -8.72977352142334, "global_step": 63799, "epoch": 379} {"train_loss": -8.785127639770508, "global_step": 63800, "epoch": 379} {"train_loss": -8.952581405639648, "global_step": 63801, "epoch": 379} {"train_loss": -8.816642761230469, "global_step": 63802, "epoch": 379} {"train_loss": -8.864593505859375, "global_step": 63803, "epoch": 379} {"train_loss": -8.870046615600586, "global_step": 63804, "epoch": 379} {"train_loss": -8.67764663696289, "global_step": 63805, "epoch": 379} {"train_loss": -8.802270889282227, "global_step": 63806, "epoch": 379} {"train_loss": -8.732851028442383, "global_step": 63807, "epoch": 379} {"train_loss": -8.913178443908691, "global_step": 63808, "epoch": 379} {"train_loss": -8.746472358703613, "global_step": 63809, "epoch": 379} {"train_loss": -8.797399520874023, "global_step": 63810, "epoch": 379} {"train_loss": -8.61783504486084, "global_step": 63811, "epoch": 379} {"train_loss": -8.752657890319824, "global_step": 63812, "epoch": 379} {"train_loss": -8.855064392089844, "global_step": 63813, "epoch": 379} {"train_loss": -8.957625389099121, "global_step": 63814, "epoch": 379} {"train_loss": -8.805351257324219, "global_step": 63815, "epoch": 379} {"train_loss": -8.95736312866211, "global_step": 63816, "epoch": 379} {"train_loss": -8.786836624145508, "global_step": 63817, "epoch": 379} {"train_loss": -8.94958209991455, "global_step": 63818, "epoch": 379} {"train_loss": -8.931197166442871, "global_step": 63819, "epoch": 379} {"train_loss": -9.013969421386719, "global_step": 63820, "epoch": 379} {"train_loss": -9.103260040283203, "global_step": 63821, "epoch": 379} {"train_loss": -8.897601127624512, "global_step": 63822, "epoch": 379} {"train_loss": -8.93149185180664, "global_step": 63823, "epoch": 379} {"train_loss": -9.01791000366211, "global_step": 63824, "epoch": 379} {"train_loss": -8.9127197265625, "global_step": 63825, "epoch": 379} {"train_loss": -9.011590957641602, "global_step": 63826, "epoch": 379} {"train_loss": -8.700641632080078, "global_step": 63827, "epoch": 379} {"train_loss": -8.767303466796875, "global_step": 63828, "epoch": 379} {"train_loss": -8.639957427978516, "global_step": 63829, "epoch": 379} {"train_loss": -8.627821922302246, "global_step": 63830, "epoch": 379} {"train_loss": -8.485416412353516, "global_step": 63831, "epoch": 379} {"train_loss": -8.82187271118164, "global_step": 63832, "epoch": 379} {"train_loss": -8.673477172851562, "global_step": 63833, "epoch": 379} {"train_loss": -8.81474781036377, "global_step": 63834, "epoch": 379} {"train_loss": -8.619699478149414, "global_step": 63835, "epoch": 379} {"train_loss": -8.511992454528809, "global_step": 63836, "epoch": 379} {"train_loss": -8.964081764221191, "global_step": 63837, "epoch": 379} {"train_loss": -8.782659530639648, "global_step": 63838, "epoch": 379} {"train_loss": -8.755642828487215, "global_step": 63839, "epoch": 379, "val_loss": 191506.5625} {"train_loss": -8.77487850189209, "global_step": 63840, "epoch": 380} {"train_loss": -8.827631950378418, "global_step": 63841, "epoch": 380} {"train_loss": -9.050699234008789, "global_step": 63842, "epoch": 380} {"train_loss": -8.74351692199707, "global_step": 63843, "epoch": 380} {"train_loss": -8.74072265625, "global_step": 63844, "epoch": 380} {"train_loss": -8.779231071472168, "global_step": 63845, "epoch": 380} {"train_loss": -8.556164741516113, "global_step": 63846, "epoch": 380} {"train_loss": -8.47216796875, "global_step": 63847, "epoch": 380} {"train_loss": -8.70551872253418, "global_step": 63848, "epoch": 380} {"train_loss": -8.502429962158203, "global_step": 63849, "epoch": 380} {"train_loss": -8.733975410461426, "global_step": 63850, "epoch": 380} {"train_loss": -8.589662551879883, "global_step": 63851, "epoch": 380} {"train_loss": -8.508098602294922, "global_step": 63852, "epoch": 380} {"train_loss": -8.5665283203125, "global_step": 63853, "epoch": 380} {"train_loss": -8.368683815002441, "global_step": 63854, "epoch": 380} {"train_loss": -8.404376983642578, "global_step": 63855, "epoch": 380} {"train_loss": -8.656347274780273, "global_step": 63856, "epoch": 380} {"train_loss": -8.692109107971191, "global_step": 63857, "epoch": 380} {"train_loss": -8.792269706726074, "global_step": 63858, "epoch": 380} {"train_loss": -8.436677932739258, "global_step": 63859, "epoch": 380} {"train_loss": -8.864680290222168, "global_step": 63860, "epoch": 380} {"train_loss": -8.562225341796875, "global_step": 63861, "epoch": 380} {"train_loss": -8.551750183105469, "global_step": 63862, "epoch": 380} {"train_loss": -8.730648040771484, "global_step": 63863, "epoch": 380} {"train_loss": -8.628232955932617, "global_step": 63864, "epoch": 380} {"train_loss": -8.90865707397461, "global_step": 63865, "epoch": 380} {"train_loss": -8.719985961914062, "global_step": 63866, "epoch": 380} {"train_loss": -8.797365188598633, "global_step": 63867, "epoch": 380} {"train_loss": -8.74244499206543, "global_step": 63868, "epoch": 380} {"train_loss": -8.629796981811523, "global_step": 63869, "epoch": 380} {"train_loss": -8.517438888549805, "global_step": 63870, "epoch": 380} {"train_loss": -8.878000259399414, "global_step": 63871, "epoch": 380} {"train_loss": -8.807453155517578, "global_step": 63872, "epoch": 380} {"train_loss": -8.765344619750977, "global_step": 63873, "epoch": 380} {"train_loss": -8.75660514831543, "global_step": 63874, "epoch": 380} {"train_loss": -8.667562484741211, "global_step": 63875, "epoch": 380} {"train_loss": -8.634849548339844, "global_step": 63876, "epoch": 380} {"train_loss": -8.829154968261719, "global_step": 63877, "epoch": 380} {"train_loss": -8.713052749633789, "global_step": 63878, "epoch": 380} {"train_loss": -8.74577522277832, "global_step": 63879, "epoch": 380} {"train_loss": -8.9015531539917, "global_step": 63880, "epoch": 380} {"train_loss": -8.76805305480957, "global_step": 63881, "epoch": 380} {"train_loss": -8.942485809326172, "global_step": 63882, "epoch": 380} {"train_loss": -8.852304458618164, "global_step": 63883, "epoch": 380} {"train_loss": -8.728960037231445, "global_step": 63884, "epoch": 380} {"train_loss": -8.85268497467041, "global_step": 63885, "epoch": 380} {"train_loss": -8.85153579711914, "global_step": 63886, "epoch": 380} {"train_loss": -9.008345603942871, "global_step": 63887, "epoch": 380} {"train_loss": -8.953847885131836, "global_step": 63888, "epoch": 380} {"train_loss": -8.958379745483398, "global_step": 63889, "epoch": 380} {"train_loss": -8.301008224487305, "global_step": 63890, "epoch": 380} {"train_loss": -8.797426223754883, "global_step": 63891, "epoch": 380} {"train_loss": -8.761945724487305, "global_step": 63892, "epoch": 380} {"train_loss": -8.778228759765625, "global_step": 63893, "epoch": 380} {"train_loss": -8.918542861938477, "global_step": 63894, "epoch": 380} {"train_loss": -8.950785636901855, "global_step": 63895, "epoch": 380} {"train_loss": -8.717223167419434, "global_step": 63896, "epoch": 380} {"train_loss": -8.75490951538086, "global_step": 63897, "epoch": 380} {"train_loss": -8.516305923461914, "global_step": 63898, "epoch": 380} {"train_loss": -8.713903427124023, "global_step": 63899, "epoch": 380} {"train_loss": -8.786675453186035, "global_step": 63900, "epoch": 380} {"train_loss": -8.797904968261719, "global_step": 63901, "epoch": 380} {"train_loss": -8.660062789916992, "global_step": 63902, "epoch": 380} {"train_loss": -8.847525596618652, "global_step": 63903, "epoch": 380} {"train_loss": -8.68059253692627, "global_step": 63904, "epoch": 380} {"train_loss": -8.892555236816406, "global_step": 63905, "epoch": 380} {"train_loss": -8.723390579223633, "global_step": 63906, "epoch": 380} {"train_loss": -8.660751342773438, "global_step": 63907, "epoch": 380} {"train_loss": -8.704289436340332, "global_step": 63908, "epoch": 380} {"train_loss": -8.627748489379883, "global_step": 63909, "epoch": 380} {"train_loss": -8.688282012939453, "global_step": 63910, "epoch": 380} {"train_loss": -8.944812774658203, "global_step": 63911, "epoch": 380} {"train_loss": -8.585623741149902, "global_step": 63912, "epoch": 380} {"train_loss": -8.739998817443848, "global_step": 63913, "epoch": 380} {"train_loss": -8.493179321289062, "global_step": 63914, "epoch": 380} {"train_loss": -8.974176406860352, "global_step": 63915, "epoch": 380} {"train_loss": -8.600364685058594, "global_step": 63916, "epoch": 380} {"train_loss": -8.667644500732422, "global_step": 63917, "epoch": 380} {"train_loss": -8.58204174041748, "global_step": 63918, "epoch": 380} {"train_loss": -8.599099159240723, "global_step": 63919, "epoch": 380} {"train_loss": -8.625770568847656, "global_step": 63920, "epoch": 380} {"train_loss": -8.787199020385742, "global_step": 63921, "epoch": 380} {"train_loss": -8.884188652038574, "global_step": 63922, "epoch": 380} {"train_loss": -8.945525169372559, "global_step": 63923, "epoch": 380} {"train_loss": -9.099716186523438, "global_step": 63924, "epoch": 380} {"train_loss": -8.800662994384766, "global_step": 63925, "epoch": 380} {"train_loss": -8.631731033325195, "global_step": 63926, "epoch": 380} {"train_loss": -8.733160018920898, "global_step": 63927, "epoch": 380} {"train_loss": -8.59023666381836, "global_step": 63928, "epoch": 380} {"train_loss": -8.845297813415527, "global_step": 63929, "epoch": 380} {"train_loss": -8.725337982177734, "global_step": 63930, "epoch": 380} {"train_loss": -8.662825584411621, "global_step": 63931, "epoch": 380} {"train_loss": -8.800138473510742, "global_step": 63932, "epoch": 380} {"train_loss": -9.02291488647461, "global_step": 63933, "epoch": 380} {"train_loss": -8.896951675415039, "global_step": 63934, "epoch": 380} {"train_loss": -8.885814666748047, "global_step": 63935, "epoch": 380} {"train_loss": -8.561712265014648, "global_step": 63936, "epoch": 380} {"train_loss": -8.909342765808105, "global_step": 63937, "epoch": 380} {"train_loss": -8.464714050292969, "global_step": 63938, "epoch": 380} {"train_loss": -8.997207641601562, "global_step": 63939, "epoch": 380} {"train_loss": -8.77454662322998, "global_step": 63940, "epoch": 380} {"train_loss": -8.833883285522461, "global_step": 63941, "epoch": 380} {"train_loss": -8.862773895263672, "global_step": 63942, "epoch": 380} {"train_loss": -8.64207935333252, "global_step": 63943, "epoch": 380} {"train_loss": -8.987171173095703, "global_step": 63944, "epoch": 380} {"train_loss": -8.579601287841797, "global_step": 63945, "epoch": 380} {"train_loss": -8.716524124145508, "global_step": 63946, "epoch": 380} {"train_loss": -8.775030136108398, "global_step": 63947, "epoch": 380} {"train_loss": -8.640569686889648, "global_step": 63948, "epoch": 380} {"train_loss": -8.580038070678711, "global_step": 63949, "epoch": 380} {"train_loss": -8.903024673461914, "global_step": 63950, "epoch": 380} {"train_loss": -8.52005672454834, "global_step": 63951, "epoch": 380} {"train_loss": -8.59315299987793, "global_step": 63952, "epoch": 380} {"train_loss": -8.757299423217773, "global_step": 63953, "epoch": 380} {"train_loss": -8.649133682250977, "global_step": 63954, "epoch": 380} {"train_loss": -8.276620864868164, "global_step": 63955, "epoch": 380} {"train_loss": -8.747390747070312, "global_step": 63956, "epoch": 380} {"train_loss": -8.244811058044434, "global_step": 63957, "epoch": 380} {"train_loss": -8.459053039550781, "global_step": 63958, "epoch": 380} {"train_loss": -8.46423625946045, "global_step": 63959, "epoch": 380} {"train_loss": -8.685670852661133, "global_step": 63960, "epoch": 380} {"train_loss": -8.67057991027832, "global_step": 63961, "epoch": 380} {"train_loss": -8.752742767333984, "global_step": 63962, "epoch": 380} {"train_loss": -8.617227554321289, "global_step": 63963, "epoch": 380} {"train_loss": -8.71668529510498, "global_step": 63964, "epoch": 380} {"train_loss": -8.760232925415039, "global_step": 63965, "epoch": 380} {"train_loss": -8.65292739868164, "global_step": 63966, "epoch": 380} {"train_loss": -8.63206672668457, "global_step": 63967, "epoch": 380} {"train_loss": -8.721542358398438, "global_step": 63968, "epoch": 380} {"train_loss": -8.692320823669434, "global_step": 63969, "epoch": 380} {"train_loss": -8.852737426757812, "global_step": 63970, "epoch": 380} {"train_loss": -8.652536392211914, "global_step": 63971, "epoch": 380} {"train_loss": -8.372798919677734, "global_step": 63972, "epoch": 380} {"train_loss": -8.918905258178711, "global_step": 63973, "epoch": 380} {"train_loss": -9.001903533935547, "global_step": 63974, "epoch": 380} {"train_loss": -8.938640594482422, "global_step": 63975, "epoch": 380} {"train_loss": -8.843908309936523, "global_step": 63976, "epoch": 380} {"train_loss": -8.76577377319336, "global_step": 63977, "epoch": 380} {"train_loss": -8.607536315917969, "global_step": 63978, "epoch": 380} {"train_loss": -8.964983940124512, "global_step": 63979, "epoch": 380} {"train_loss": -8.658117294311523, "global_step": 63980, "epoch": 380} {"train_loss": -8.922830581665039, "global_step": 63981, "epoch": 380} {"train_loss": -8.74715805053711, "global_step": 63982, "epoch": 380} {"train_loss": -8.714696884155273, "global_step": 63983, "epoch": 380} {"train_loss": -8.632476806640625, "global_step": 63984, "epoch": 380} {"train_loss": -8.992581367492676, "global_step": 63985, "epoch": 380} {"train_loss": -8.86153793334961, "global_step": 63986, "epoch": 380} {"train_loss": -8.953168869018555, "global_step": 63987, "epoch": 380} {"train_loss": -8.993239402770996, "global_step": 63988, "epoch": 380} {"train_loss": -9.000247955322266, "global_step": 63989, "epoch": 380} {"train_loss": -9.095876693725586, "global_step": 63990, "epoch": 380} {"train_loss": -8.581465721130371, "global_step": 63991, "epoch": 380} {"train_loss": -8.714990615844727, "global_step": 63992, "epoch": 380} {"train_loss": -8.82946491241455, "global_step": 63993, "epoch": 380} {"train_loss": -8.531839370727539, "global_step": 63994, "epoch": 380} {"train_loss": -8.964637756347656, "global_step": 63995, "epoch": 380} {"train_loss": -8.575230598449707, "global_step": 63996, "epoch": 380} {"train_loss": -8.448619842529297, "global_step": 63997, "epoch": 380} {"train_loss": -8.680673599243164, "global_step": 63998, "epoch": 380} {"train_loss": -8.212459564208984, "global_step": 63999, "epoch": 380} {"train_loss": -8.259665489196777, "global_step": 64000, "epoch": 380} {"train_loss": -8.121367454528809, "global_step": 64001, "epoch": 380} {"train_loss": -8.646209716796875, "global_step": 64002, "epoch": 380} {"train_loss": -8.096064567565918, "global_step": 64003, "epoch": 380} {"train_loss": -8.663389205932617, "global_step": 64004, "epoch": 380} {"train_loss": -7.800778388977051, "global_step": 64005, "epoch": 380} {"train_loss": -8.329959869384766, "global_step": 64006, "epoch": 380} {"train_loss": -8.704640098980494, "global_step": 64007, "epoch": 380, "val_loss": 191371.96875, "train_action_mse_error": 8.801795959472656} {"train_loss": -8.172407150268555, "global_step": 64008, "epoch": 381} {"train_loss": -8.174127578735352, "global_step": 64009, "epoch": 381} {"train_loss": -8.219871520996094, "global_step": 64010, "epoch": 381} {"train_loss": -8.167818069458008, "global_step": 64011, "epoch": 381} {"train_loss": -8.31364631652832, "global_step": 64012, "epoch": 381} {"train_loss": -8.081254959106445, "global_step": 64013, "epoch": 381} {"train_loss": -8.34062385559082, "global_step": 64014, "epoch": 381} {"train_loss": -8.108827590942383, "global_step": 64015, "epoch": 381} {"train_loss": -8.227336883544922, "global_step": 64016, "epoch": 381} {"train_loss": -8.41678524017334, "global_step": 64017, "epoch": 381} {"train_loss": -8.338445663452148, "global_step": 64018, "epoch": 381} {"train_loss": -8.41264533996582, "global_step": 64019, "epoch": 381} {"train_loss": -8.240252494812012, "global_step": 64020, "epoch": 381} {"train_loss": -8.40501594543457, "global_step": 64021, "epoch": 381} {"train_loss": -8.35110855102539, "global_step": 64022, "epoch": 381} {"train_loss": -8.434391975402832, "global_step": 64023, "epoch": 381} {"train_loss": -8.747845649719238, "global_step": 64024, "epoch": 381} {"train_loss": -8.371004104614258, "global_step": 64025, "epoch": 381} {"train_loss": -8.583908081054688, "global_step": 64026, "epoch": 381} {"train_loss": -8.610952377319336, "global_step": 64027, "epoch": 381} {"train_loss": -8.397114753723145, "global_step": 64028, "epoch": 381} {"train_loss": -8.40017032623291, "global_step": 64029, "epoch": 381} {"train_loss": -8.75000286102295, "global_step": 64030, "epoch": 381} {"train_loss": -8.659252166748047, "global_step": 64031, "epoch": 381} {"train_loss": -8.819507598876953, "global_step": 64032, "epoch": 381} {"train_loss": -8.826862335205078, "global_step": 64033, "epoch": 381} {"train_loss": -8.912969589233398, "global_step": 64034, "epoch": 381} {"train_loss": -8.742462158203125, "global_step": 64035, "epoch": 381} {"train_loss": -8.955154418945312, "global_step": 64036, "epoch": 381} {"train_loss": -9.002153396606445, "global_step": 64037, "epoch": 381} {"train_loss": -9.021289825439453, "global_step": 64038, "epoch": 381} {"train_loss": -9.185052871704102, "global_step": 64039, "epoch": 381} {"train_loss": -9.058176040649414, "global_step": 64040, "epoch": 381} {"train_loss": -8.900873184204102, "global_step": 64041, "epoch": 381} {"train_loss": -8.752511978149414, "global_step": 64042, "epoch": 381} {"train_loss": -9.117140769958496, "global_step": 64043, "epoch": 381} {"train_loss": -8.844825744628906, "global_step": 64044, "epoch": 381} {"train_loss": -8.994840621948242, "global_step": 64045, "epoch": 381} {"train_loss": -8.753409385681152, "global_step": 64046, "epoch": 381} {"train_loss": -8.982891082763672, "global_step": 64047, "epoch": 381} {"train_loss": -8.55250072479248, "global_step": 64048, "epoch": 381} {"train_loss": -9.162750244140625, "global_step": 64049, "epoch": 381} {"train_loss": -8.853964805603027, "global_step": 64050, "epoch": 381} {"train_loss": -8.935260772705078, "global_step": 64051, "epoch": 381} {"train_loss": -9.177088737487793, "global_step": 64052, "epoch": 381} {"train_loss": -8.66457748413086, "global_step": 64053, "epoch": 381} {"train_loss": -8.61398696899414, "global_step": 64054, "epoch": 381} {"train_loss": -8.76900863647461, "global_step": 64055, "epoch": 381} {"train_loss": -8.947811126708984, "global_step": 64056, "epoch": 381} {"train_loss": -8.701024055480957, "global_step": 64057, "epoch": 381} {"train_loss": -9.05666732788086, "global_step": 64058, "epoch": 381} {"train_loss": -9.068538665771484, "global_step": 64059, "epoch": 381} {"train_loss": -8.845681190490723, "global_step": 64060, "epoch": 381} {"train_loss": -8.700424194335938, "global_step": 64061, "epoch": 381} {"train_loss": -8.92064094543457, "global_step": 64062, "epoch": 381} {"train_loss": -8.742820739746094, "global_step": 64063, "epoch": 381} {"train_loss": -9.011597633361816, "global_step": 64064, "epoch": 381} {"train_loss": -8.463661193847656, "global_step": 64065, "epoch": 381} {"train_loss": -8.433181762695312, "global_step": 64066, "epoch": 381} {"train_loss": -8.673687934875488, "global_step": 64067, "epoch": 381} {"train_loss": -8.677446365356445, "global_step": 64068, "epoch": 381} {"train_loss": -8.678442001342773, "global_step": 64069, "epoch": 381} {"train_loss": -8.970308303833008, "global_step": 64070, "epoch": 381} {"train_loss": -8.48044204711914, "global_step": 64071, "epoch": 381} {"train_loss": -8.706602096557617, "global_step": 64072, "epoch": 381} {"train_loss": -8.695432662963867, "global_step": 64073, "epoch": 381} {"train_loss": -8.260091781616211, "global_step": 64074, "epoch": 381} {"train_loss": -8.790738105773926, "global_step": 64075, "epoch": 381} {"train_loss": -8.32125473022461, "global_step": 64076, "epoch": 381} {"train_loss": -8.83945083618164, "global_step": 64077, "epoch": 381} {"train_loss": -8.618480682373047, "global_step": 64078, "epoch": 381} {"train_loss": -8.710437774658203, "global_step": 64079, "epoch": 381} {"train_loss": -8.680642127990723, "global_step": 64080, "epoch": 381} {"train_loss": -8.65886402130127, "global_step": 64081, "epoch": 381} {"train_loss": -8.760332107543945, "global_step": 64082, "epoch": 381} {"train_loss": -8.699470520019531, "global_step": 64083, "epoch": 381} {"train_loss": -8.66533374786377, "global_step": 64084, "epoch": 381} {"train_loss": -8.851381301879883, "global_step": 64085, "epoch": 381} {"train_loss": -8.748613357543945, "global_step": 64086, "epoch": 381} {"train_loss": -8.996445655822754, "global_step": 64087, "epoch": 381} {"train_loss": -8.821611404418945, "global_step": 64088, "epoch": 381} {"train_loss": -8.752765655517578, "global_step": 64089, "epoch": 381} {"train_loss": -8.504940032958984, "global_step": 64090, "epoch": 381} {"train_loss": -8.672152519226074, "global_step": 64091, "epoch": 381} {"train_loss": -8.505941390991211, "global_step": 64092, "epoch": 381} {"train_loss": -8.646136283874512, "global_step": 64093, "epoch": 381} {"train_loss": -8.979314804077148, "global_step": 64094, "epoch": 381} {"train_loss": -8.85122299194336, "global_step": 64095, "epoch": 381} {"train_loss": -8.805730819702148, "global_step": 64096, "epoch": 381} {"train_loss": -8.862106323242188, "global_step": 64097, "epoch": 381} {"train_loss": -8.655771255493164, "global_step": 64098, "epoch": 381} {"train_loss": -8.879140853881836, "global_step": 64099, "epoch": 381} {"train_loss": -8.910099029541016, "global_step": 64100, "epoch": 381} {"train_loss": -8.652429580688477, "global_step": 64101, "epoch": 381} {"train_loss": -8.790369033813477, "global_step": 64102, "epoch": 381} {"train_loss": -8.792445182800293, "global_step": 64103, "epoch": 381} {"train_loss": -8.877864837646484, "global_step": 64104, "epoch": 381} {"train_loss": -8.945034980773926, "global_step": 64105, "epoch": 381} {"train_loss": -9.061521530151367, "global_step": 64106, "epoch": 381} {"train_loss": -8.839441299438477, "global_step": 64107, "epoch": 381} {"train_loss": -9.041950225830078, "global_step": 64108, "epoch": 381} {"train_loss": -8.740241050720215, "global_step": 64109, "epoch": 381} {"train_loss": -8.670316696166992, "global_step": 64110, "epoch": 381} {"train_loss": -8.83825397491455, "global_step": 64111, "epoch": 381} {"train_loss": -8.681472778320312, "global_step": 64112, "epoch": 381} {"train_loss": -8.626827239990234, "global_step": 64113, "epoch": 381} {"train_loss": -9.077302932739258, "global_step": 64114, "epoch": 381} {"train_loss": -8.916404724121094, "global_step": 64115, "epoch": 381} {"train_loss": -8.968802452087402, "global_step": 64116, "epoch": 381} {"train_loss": -9.041061401367188, "global_step": 64117, "epoch": 381} {"train_loss": -8.763729095458984, "global_step": 64118, "epoch": 381} {"train_loss": -9.004358291625977, "global_step": 64119, "epoch": 381} {"train_loss": -8.862689018249512, "global_step": 64120, "epoch": 381} {"train_loss": -8.80937385559082, "global_step": 64121, "epoch": 381} {"train_loss": -9.050400733947754, "global_step": 64122, "epoch": 381} {"train_loss": -8.712827682495117, "global_step": 64123, "epoch": 381} {"train_loss": -8.687435150146484, "global_step": 64124, "epoch": 381} {"train_loss": -8.763575553894043, "global_step": 64125, "epoch": 381} {"train_loss": -8.896812438964844, "global_step": 64126, "epoch": 381} {"train_loss": -8.826817512512207, "global_step": 64127, "epoch": 381} {"train_loss": -8.914552688598633, "global_step": 64128, "epoch": 381} {"train_loss": -8.968576431274414, "global_step": 64129, "epoch": 381} {"train_loss": -8.789386749267578, "global_step": 64130, "epoch": 381} {"train_loss": -8.890460968017578, "global_step": 64131, "epoch": 381} {"train_loss": -8.881044387817383, "global_step": 64132, "epoch": 381} {"train_loss": -8.63232707977295, "global_step": 64133, "epoch": 381} {"train_loss": -9.000412940979004, "global_step": 64134, "epoch": 381} {"train_loss": -8.806499481201172, "global_step": 64135, "epoch": 381} {"train_loss": -8.87208080291748, "global_step": 64136, "epoch": 381} {"train_loss": -8.724796295166016, "global_step": 64137, "epoch": 381} {"train_loss": -8.805809020996094, "global_step": 64138, "epoch": 381} {"train_loss": -8.836820602416992, "global_step": 64139, "epoch": 381} {"train_loss": -8.794365882873535, "global_step": 64140, "epoch": 381} {"train_loss": -8.72848892211914, "global_step": 64141, "epoch": 381} {"train_loss": -8.882962226867676, "global_step": 64142, "epoch": 381} {"train_loss": -8.861896514892578, "global_step": 64143, "epoch": 381} {"train_loss": -8.825045585632324, "global_step": 64144, "epoch": 381} {"train_loss": -8.828630447387695, "global_step": 64145, "epoch": 381} {"train_loss": -8.66348648071289, "global_step": 64146, "epoch": 381} {"train_loss": -8.725183486938477, "global_step": 64147, "epoch": 381} {"train_loss": -8.59326171875, "global_step": 64148, "epoch": 381} {"train_loss": -8.893482208251953, "global_step": 64149, "epoch": 381} {"train_loss": -8.860801696777344, "global_step": 64150, "epoch": 381} {"train_loss": -8.858667373657227, "global_step": 64151, "epoch": 381} {"train_loss": -8.720069885253906, "global_step": 64152, "epoch": 381} {"train_loss": -8.54697036743164, "global_step": 64153, "epoch": 381} {"train_loss": -8.792255401611328, "global_step": 64154, "epoch": 381} {"train_loss": -8.917701721191406, "global_step": 64155, "epoch": 381} {"train_loss": -8.744528770446777, "global_step": 64156, "epoch": 381} {"train_loss": -8.665820121765137, "global_step": 64157, "epoch": 381} {"train_loss": -8.731706619262695, "global_step": 64158, "epoch": 381} {"train_loss": -8.824541091918945, "global_step": 64159, "epoch": 381} {"train_loss": -8.453731536865234, "global_step": 64160, "epoch": 381} {"train_loss": -8.516249656677246, "global_step": 64161, "epoch": 381} {"train_loss": -8.631932258605957, "global_step": 64162, "epoch": 381} {"train_loss": -8.649944305419922, "global_step": 64163, "epoch": 381} {"train_loss": -8.469595909118652, "global_step": 64164, "epoch": 381} {"train_loss": -8.862820625305176, "global_step": 64165, "epoch": 381} {"train_loss": -8.605133056640625, "global_step": 64166, "epoch": 381} {"train_loss": -8.74324893951416, "global_step": 64167, "epoch": 381} {"train_loss": -8.660452842712402, "global_step": 64168, "epoch": 381} {"train_loss": -8.874898910522461, "global_step": 64169, "epoch": 381} {"train_loss": -8.82125473022461, "global_step": 64170, "epoch": 381} {"train_loss": -8.78212833404541, "global_step": 64171, "epoch": 381} {"train_loss": -8.916281700134277, "global_step": 64172, "epoch": 381} {"train_loss": -8.741125106811523, "global_step": 64173, "epoch": 381} {"train_loss": -8.7605619430542, "global_step": 64174, "epoch": 381} {"train_loss": -8.734423029990424, "global_step": 64175, "epoch": 381, "val_loss": 190194.234375} {"train_loss": -8.836837768554688, "global_step": 64176, "epoch": 382} {"train_loss": -8.688592910766602, "global_step": 64177, "epoch": 382} {"train_loss": -8.666154861450195, "global_step": 64178, "epoch": 382} {"train_loss": -8.689300537109375, "global_step": 64179, "epoch": 382} {"train_loss": -8.766911506652832, "global_step": 64180, "epoch": 382} {"train_loss": -8.709637641906738, "global_step": 64181, "epoch": 382} {"train_loss": -8.72829818725586, "global_step": 64182, "epoch": 382} {"train_loss": -8.724090576171875, "global_step": 64183, "epoch": 382} {"train_loss": -8.831319808959961, "global_step": 64184, "epoch": 382} {"train_loss": -8.691850662231445, "global_step": 64185, "epoch": 382} {"train_loss": -8.754568099975586, "global_step": 64186, "epoch": 382} {"train_loss": -8.570876121520996, "global_step": 64187, "epoch": 382} {"train_loss": -8.830964088439941, "global_step": 64188, "epoch": 382} {"train_loss": -8.776737213134766, "global_step": 64189, "epoch": 382} {"train_loss": -8.438050270080566, "global_step": 64190, "epoch": 382} {"train_loss": -8.768037796020508, "global_step": 64191, "epoch": 382} {"train_loss": -8.505992889404297, "global_step": 64192, "epoch": 382} {"train_loss": -8.680740356445312, "global_step": 64193, "epoch": 382} {"train_loss": -8.629731178283691, "global_step": 64194, "epoch": 382} {"train_loss": -8.745315551757812, "global_step": 64195, "epoch": 382} {"train_loss": -8.66023063659668, "global_step": 64196, "epoch": 382} {"train_loss": -8.754152297973633, "global_step": 64197, "epoch": 382} {"train_loss": -8.461355209350586, "global_step": 64198, "epoch": 382} {"train_loss": -8.72222900390625, "global_step": 64199, "epoch": 382} {"train_loss": -8.676082611083984, "global_step": 64200, "epoch": 382} {"train_loss": -8.934043884277344, "global_step": 64201, "epoch": 382} {"train_loss": -8.672629356384277, "global_step": 64202, "epoch": 382} {"train_loss": -8.63168716430664, "global_step": 64203, "epoch": 382} {"train_loss": -8.733125686645508, "global_step": 64204, "epoch": 382} {"train_loss": -8.915098190307617, "global_step": 64205, "epoch": 382} {"train_loss": -8.980714797973633, "global_step": 64206, "epoch": 382} {"train_loss": -8.766334533691406, "global_step": 64207, "epoch": 382} {"train_loss": -8.974420547485352, "global_step": 64208, "epoch": 382} {"train_loss": -9.087562561035156, "global_step": 64209, "epoch": 382} {"train_loss": -8.897836685180664, "global_step": 64210, "epoch": 382} {"train_loss": -8.923885345458984, "global_step": 64211, "epoch": 382} {"train_loss": -8.977128982543945, "global_step": 64212, "epoch": 382} {"train_loss": -9.0797119140625, "global_step": 64213, "epoch": 382} {"train_loss": -9.017248153686523, "global_step": 64214, "epoch": 382} {"train_loss": -8.975107192993164, "global_step": 64215, "epoch": 382} {"train_loss": -8.696451187133789, "global_step": 64216, "epoch": 382} {"train_loss": -8.991954803466797, "global_step": 64217, "epoch": 382} {"train_loss": -8.455312728881836, "global_step": 64218, "epoch": 382} {"train_loss": -8.914289474487305, "global_step": 64219, "epoch": 382} {"train_loss": -8.649160385131836, "global_step": 64220, "epoch": 382} {"train_loss": -8.990965843200684, "global_step": 64221, "epoch": 382} {"train_loss": -8.88336181640625, "global_step": 64222, "epoch": 382} {"train_loss": -8.808768272399902, "global_step": 64223, "epoch": 382} {"train_loss": -8.708608627319336, "global_step": 64224, "epoch": 382} {"train_loss": -8.885848999023438, "global_step": 64225, "epoch": 382} {"train_loss": -8.720190048217773, "global_step": 64226, "epoch": 382} {"train_loss": -8.84419059753418, "global_step": 64227, "epoch": 382} {"train_loss": -8.614242553710938, "global_step": 64228, "epoch": 382} {"train_loss": -9.099822044372559, "global_step": 64229, "epoch": 382} {"train_loss": -8.831731796264648, "global_step": 64230, "epoch": 382} {"train_loss": -9.13888931274414, "global_step": 64231, "epoch": 382} {"train_loss": -8.928820610046387, "global_step": 64232, "epoch": 382} {"train_loss": -8.853592872619629, "global_step": 64233, "epoch": 382} {"train_loss": -8.750816345214844, "global_step": 64234, "epoch": 382} {"train_loss": -8.966116905212402, "global_step": 64235, "epoch": 382} {"train_loss": -8.72492790222168, "global_step": 64236, "epoch": 382} {"train_loss": -8.878829956054688, "global_step": 64237, "epoch": 382} {"train_loss": -8.80008602142334, "global_step": 64238, "epoch": 382} {"train_loss": -8.75318431854248, "global_step": 64239, "epoch": 382} {"train_loss": -8.902702331542969, "global_step": 64240, "epoch": 382} {"train_loss": -8.927285194396973, "global_step": 64241, "epoch": 382} {"train_loss": -8.904064178466797, "global_step": 64242, "epoch": 382} {"train_loss": -8.814602851867676, "global_step": 64243, "epoch": 382} {"train_loss": -8.621288299560547, "global_step": 64244, "epoch": 382} {"train_loss": -8.792694091796875, "global_step": 64245, "epoch": 382} {"train_loss": -8.769161224365234, "global_step": 64246, "epoch": 382} {"train_loss": -9.02598762512207, "global_step": 64247, "epoch": 382} {"train_loss": -8.790040969848633, "global_step": 64248, "epoch": 382} {"train_loss": -8.61104679107666, "global_step": 64249, "epoch": 382} {"train_loss": -8.895814895629883, "global_step": 64250, "epoch": 382} {"train_loss": -8.956984519958496, "global_step": 64251, "epoch": 382} {"train_loss": -8.719524383544922, "global_step": 64252, "epoch": 382} {"train_loss": -9.054923057556152, "global_step": 64253, "epoch": 382} {"train_loss": -8.888152122497559, "global_step": 64254, "epoch": 382} {"train_loss": -8.867254257202148, "global_step": 64255, "epoch": 382} {"train_loss": -8.914773941040039, "global_step": 64256, "epoch": 382} {"train_loss": -8.913593292236328, "global_step": 64257, "epoch": 382} {"train_loss": -8.888450622558594, "global_step": 64258, "epoch": 382} {"train_loss": -9.155794143676758, "global_step": 64259, "epoch": 382} {"train_loss": -8.804603576660156, "global_step": 64260, "epoch": 382} {"train_loss": -8.770126342773438, "global_step": 64261, "epoch": 382} {"train_loss": -8.954056739807129, "global_step": 64262, "epoch": 382} {"train_loss": -8.662739753723145, "global_step": 64263, "epoch": 382} {"train_loss": -8.653955459594727, "global_step": 64264, "epoch": 382} {"train_loss": -9.115694046020508, "global_step": 64265, "epoch": 382} {"train_loss": -8.87735366821289, "global_step": 64266, "epoch": 382} {"train_loss": -8.890727043151855, "global_step": 64267, "epoch": 382} {"train_loss": -9.005722045898438, "global_step": 64268, "epoch": 382} {"train_loss": -8.793600082397461, "global_step": 64269, "epoch": 382} {"train_loss": -8.824355125427246, "global_step": 64270, "epoch": 382} {"train_loss": -8.903390884399414, "global_step": 64271, "epoch": 382} {"train_loss": -8.714054107666016, "global_step": 64272, "epoch": 382} {"train_loss": -8.678797721862793, "global_step": 64273, "epoch": 382} {"train_loss": -8.989975929260254, "global_step": 64274, "epoch": 382} {"train_loss": -8.736404418945312, "global_step": 64275, "epoch": 382} {"train_loss": -8.852449417114258, "global_step": 64276, "epoch": 382} {"train_loss": -8.580069541931152, "global_step": 64277, "epoch": 382} {"train_loss": -8.538806915283203, "global_step": 64278, "epoch": 382} {"train_loss": -8.606555938720703, "global_step": 64279, "epoch": 382} {"train_loss": -8.748893737792969, "global_step": 64280, "epoch": 382} {"train_loss": -8.539695739746094, "global_step": 64281, "epoch": 382} {"train_loss": -8.824722290039062, "global_step": 64282, "epoch": 382} {"train_loss": -8.583992958068848, "global_step": 64283, "epoch": 382} {"train_loss": -8.81419563293457, "global_step": 64284, "epoch": 382} {"train_loss": -8.518928527832031, "global_step": 64285, "epoch": 382} {"train_loss": -8.7088623046875, "global_step": 64286, "epoch": 382} {"train_loss": -8.4940185546875, "global_step": 64287, "epoch": 382} {"train_loss": -8.65798568725586, "global_step": 64288, "epoch": 382} {"train_loss": -8.694652557373047, "global_step": 64289, "epoch": 382} {"train_loss": -8.663250923156738, "global_step": 64290, "epoch": 382} {"train_loss": -8.813346862792969, "global_step": 64291, "epoch": 382} {"train_loss": -8.739076614379883, "global_step": 64292, "epoch": 382} {"train_loss": -8.80817985534668, "global_step": 64293, "epoch": 382} {"train_loss": -8.783016204833984, "global_step": 64294, "epoch": 382} {"train_loss": -8.549060821533203, "global_step": 64295, "epoch": 382} {"train_loss": -8.680662155151367, "global_step": 64296, "epoch": 382} {"train_loss": -8.817610740661621, "global_step": 64297, "epoch": 382} {"train_loss": -8.780550003051758, "global_step": 64298, "epoch": 382} {"train_loss": -8.905254364013672, "global_step": 64299, "epoch": 382} {"train_loss": -8.744421005249023, "global_step": 64300, "epoch": 382} {"train_loss": -8.908313751220703, "global_step": 64301, "epoch": 382} {"train_loss": -8.895211219787598, "global_step": 64302, "epoch": 382} {"train_loss": -8.930076599121094, "global_step": 64303, "epoch": 382} {"train_loss": -8.650586128234863, "global_step": 64304, "epoch": 382} {"train_loss": -8.871801376342773, "global_step": 64305, "epoch": 382} {"train_loss": -9.030591011047363, "global_step": 64306, "epoch": 382} {"train_loss": -8.830254554748535, "global_step": 64307, "epoch": 382} {"train_loss": -8.887048721313477, "global_step": 64308, "epoch": 382} {"train_loss": -8.675372123718262, "global_step": 64309, "epoch": 382} {"train_loss": -8.553913116455078, "global_step": 64310, "epoch": 382} {"train_loss": -8.799209594726562, "global_step": 64311, "epoch": 382} {"train_loss": -8.979148864746094, "global_step": 64312, "epoch": 382} {"train_loss": -8.849601745605469, "global_step": 64313, "epoch": 382} {"train_loss": -8.748458862304688, "global_step": 64314, "epoch": 382} {"train_loss": -8.819934844970703, "global_step": 64315, "epoch": 382} {"train_loss": -8.835728645324707, "global_step": 64316, "epoch": 382} {"train_loss": -9.075141906738281, "global_step": 64317, "epoch": 382} {"train_loss": -8.745830535888672, "global_step": 64318, "epoch": 382} {"train_loss": -9.033496856689453, "global_step": 64319, "epoch": 382} {"train_loss": -8.907587051391602, "global_step": 64320, "epoch": 382} {"train_loss": -9.046327590942383, "global_step": 64321, "epoch": 382} {"train_loss": -8.61477279663086, "global_step": 64322, "epoch": 382} {"train_loss": -9.029574394226074, "global_step": 64323, "epoch": 382} {"train_loss": -8.875078201293945, "global_step": 64324, "epoch": 382} {"train_loss": -8.926190376281738, "global_step": 64325, "epoch": 382} {"train_loss": -8.804717063903809, "global_step": 64326, "epoch": 382} {"train_loss": -8.561975479125977, "global_step": 64327, "epoch": 382} {"train_loss": -8.823841094970703, "global_step": 64328, "epoch": 382} {"train_loss": -8.72762680053711, "global_step": 64329, "epoch": 382} {"train_loss": -8.867891311645508, "global_step": 64330, "epoch": 382} {"train_loss": -8.850214004516602, "global_step": 64331, "epoch": 382} {"train_loss": -8.78593635559082, "global_step": 64332, "epoch": 382} {"train_loss": -8.795621871948242, "global_step": 64333, "epoch": 382} {"train_loss": -8.68398666381836, "global_step": 64334, "epoch": 382} {"train_loss": -8.69108772277832, "global_step": 64335, "epoch": 382} {"train_loss": -8.720060348510742, "global_step": 64336, "epoch": 382} {"train_loss": -8.246687889099121, "global_step": 64337, "epoch": 382} {"train_loss": -8.677194595336914, "global_step": 64338, "epoch": 382} {"train_loss": -8.46156120300293, "global_step": 64339, "epoch": 382} {"train_loss": -8.712098121643066, "global_step": 64340, "epoch": 382} {"train_loss": -8.427672386169434, "global_step": 64341, "epoch": 382} {"train_loss": -8.688156127929688, "global_step": 64342, "epoch": 382} {"train_loss": -8.786984091713315, "global_step": 64343, "epoch": 382, "val_loss": 191664.234375} {"train_loss": -8.383308410644531, "global_step": 64344, "epoch": 383} {"train_loss": -8.619421005249023, "global_step": 64345, "epoch": 383} {"train_loss": -8.54631519317627, "global_step": 64346, "epoch": 383} {"train_loss": -8.459064483642578, "global_step": 64347, "epoch": 383} {"train_loss": -8.382878303527832, "global_step": 64348, "epoch": 383} {"train_loss": -8.420766830444336, "global_step": 64349, "epoch": 383} {"train_loss": -8.840764045715332, "global_step": 64350, "epoch": 383} {"train_loss": -8.680814743041992, "global_step": 64351, "epoch": 383} {"train_loss": -8.586942672729492, "global_step": 64352, "epoch": 383} {"train_loss": -8.494318008422852, "global_step": 64353, "epoch": 383} {"train_loss": -8.639261245727539, "global_step": 64354, "epoch": 383} {"train_loss": -8.462677001953125, "global_step": 64355, "epoch": 383} {"train_loss": -8.454971313476562, "global_step": 64356, "epoch": 383} {"train_loss": -8.529510498046875, "global_step": 64357, "epoch": 383} {"train_loss": -8.303627967834473, "global_step": 64358, "epoch": 383} {"train_loss": -8.620153427124023, "global_step": 64359, "epoch": 383} {"train_loss": -8.721235275268555, "global_step": 64360, "epoch": 383} {"train_loss": -8.788046836853027, "global_step": 64361, "epoch": 383} {"train_loss": -8.72020149230957, "global_step": 64362, "epoch": 383} {"train_loss": -8.766711235046387, "global_step": 64363, "epoch": 383} {"train_loss": -8.691812515258789, "global_step": 64364, "epoch": 383} {"train_loss": -8.580537796020508, "global_step": 64365, "epoch": 383} {"train_loss": -8.793525695800781, "global_step": 64366, "epoch": 383} {"train_loss": -8.885266304016113, "global_step": 64367, "epoch": 383} {"train_loss": -8.651817321777344, "global_step": 64368, "epoch": 383} {"train_loss": -9.108636856079102, "global_step": 64369, "epoch": 383} {"train_loss": -8.944746017456055, "global_step": 64370, "epoch": 383} {"train_loss": -9.132026672363281, "global_step": 64371, "epoch": 383} {"train_loss": -8.697124481201172, "global_step": 64372, "epoch": 383} {"train_loss": -8.777568817138672, "global_step": 64373, "epoch": 383} {"train_loss": -8.862313270568848, "global_step": 64374, "epoch": 383} {"train_loss": -9.044984817504883, "global_step": 64375, "epoch": 383} {"train_loss": -8.785582542419434, "global_step": 64376, "epoch": 383} {"train_loss": -8.818211555480957, "global_step": 64377, "epoch": 383} {"train_loss": -8.945295333862305, "global_step": 64378, "epoch": 383} {"train_loss": -8.842891693115234, "global_step": 64379, "epoch": 383} {"train_loss": -9.131760597229004, "global_step": 64380, "epoch": 383} {"train_loss": -8.764272689819336, "global_step": 64381, "epoch": 383} {"train_loss": -8.868940353393555, "global_step": 64382, "epoch": 383} {"train_loss": -8.874099731445312, "global_step": 64383, "epoch": 383} {"train_loss": -8.689279556274414, "global_step": 64384, "epoch": 383} {"train_loss": -8.730920791625977, "global_step": 64385, "epoch": 383} {"train_loss": -8.671812057495117, "global_step": 64386, "epoch": 383} {"train_loss": -8.771623611450195, "global_step": 64387, "epoch": 383} {"train_loss": -8.83633804321289, "global_step": 64388, "epoch": 383} {"train_loss": -8.564187049865723, "global_step": 64389, "epoch": 383} {"train_loss": -8.814556121826172, "global_step": 64390, "epoch": 383} {"train_loss": -8.651107788085938, "global_step": 64391, "epoch": 383} {"train_loss": -8.769200325012207, "global_step": 64392, "epoch": 383} {"train_loss": -8.902755737304688, "global_step": 64393, "epoch": 383} {"train_loss": -8.946794509887695, "global_step": 64394, "epoch": 383} {"train_loss": -8.813791275024414, "global_step": 64395, "epoch": 383} {"train_loss": -8.907447814941406, "global_step": 64396, "epoch": 383} {"train_loss": -8.840009689331055, "global_step": 64397, "epoch": 383} {"train_loss": -8.776820182800293, "global_step": 64398, "epoch": 383} {"train_loss": -8.780811309814453, "global_step": 64399, "epoch": 383} {"train_loss": -8.876026153564453, "global_step": 64400, "epoch": 383} {"train_loss": -8.426582336425781, "global_step": 64401, "epoch": 383} {"train_loss": -8.68552017211914, "global_step": 64402, "epoch": 383} {"train_loss": -8.606720924377441, "global_step": 64403, "epoch": 383} {"train_loss": -8.76011848449707, "global_step": 64404, "epoch": 383} {"train_loss": -8.781923294067383, "global_step": 64405, "epoch": 383} {"train_loss": -8.870253562927246, "global_step": 64406, "epoch": 383} {"train_loss": -8.695503234863281, "global_step": 64407, "epoch": 383} {"train_loss": -8.77756118774414, "global_step": 64408, "epoch": 383} {"train_loss": -8.76869010925293, "global_step": 64409, "epoch": 383} {"train_loss": -8.723648071289062, "global_step": 64410, "epoch": 383} {"train_loss": -8.781039237976074, "global_step": 64411, "epoch": 383} {"train_loss": -8.929057121276855, "global_step": 64412, "epoch": 383} {"train_loss": -8.616260528564453, "global_step": 64413, "epoch": 383} {"train_loss": -8.92955207824707, "global_step": 64414, "epoch": 383} {"train_loss": -8.80583667755127, "global_step": 64415, "epoch": 383} {"train_loss": -8.59062385559082, "global_step": 64416, "epoch": 383} {"train_loss": -8.838245391845703, "global_step": 64417, "epoch": 383} {"train_loss": -8.74815845489502, "global_step": 64418, "epoch": 383} {"train_loss": -8.718236923217773, "global_step": 64419, "epoch": 383} {"train_loss": -8.885153770446777, "global_step": 64420, "epoch": 383} {"train_loss": -8.524784088134766, "global_step": 64421, "epoch": 383} {"train_loss": -9.022533416748047, "global_step": 64422, "epoch": 383} {"train_loss": -8.788078308105469, "global_step": 64423, "epoch": 383} {"train_loss": -8.708650588989258, "global_step": 64424, "epoch": 383} {"train_loss": -9.073440551757812, "global_step": 64425, "epoch": 383} {"train_loss": -8.905410766601562, "global_step": 64426, "epoch": 383} {"train_loss": -8.848889350891113, "global_step": 64427, "epoch": 383} {"train_loss": -8.846035957336426, "global_step": 64428, "epoch": 383} {"train_loss": -9.039886474609375, "global_step": 64429, "epoch": 383} {"train_loss": -8.653327941894531, "global_step": 64430, "epoch": 383} {"train_loss": -8.653148651123047, "global_step": 64431, "epoch": 383} {"train_loss": -8.652185440063477, "global_step": 64432, "epoch": 383} {"train_loss": -8.786325454711914, "global_step": 64433, "epoch": 383} {"train_loss": -8.805904388427734, "global_step": 64434, "epoch": 383} {"train_loss": -8.584033966064453, "global_step": 64435, "epoch": 383} {"train_loss": -8.563310623168945, "global_step": 64436, "epoch": 383} {"train_loss": -8.827630996704102, "global_step": 64437, "epoch": 383} {"train_loss": -8.627847671508789, "global_step": 64438, "epoch": 383} {"train_loss": -8.714380264282227, "global_step": 64439, "epoch": 383} {"train_loss": -8.51259708404541, "global_step": 64440, "epoch": 383} {"train_loss": -8.556140899658203, "global_step": 64441, "epoch": 383} {"train_loss": -8.566659927368164, "global_step": 64442, "epoch": 383} {"train_loss": -8.560810089111328, "global_step": 64443, "epoch": 383} {"train_loss": -8.526540756225586, "global_step": 64444, "epoch": 383} {"train_loss": -8.663515090942383, "global_step": 64445, "epoch": 383} {"train_loss": -8.704252243041992, "global_step": 64446, "epoch": 383} {"train_loss": -8.484904289245605, "global_step": 64447, "epoch": 383} {"train_loss": -8.486732482910156, "global_step": 64448, "epoch": 383} {"train_loss": -8.899455070495605, "global_step": 64449, "epoch": 383} {"train_loss": -8.317878723144531, "global_step": 64450, "epoch": 383} {"train_loss": -8.568687438964844, "global_step": 64451, "epoch": 383} {"train_loss": -8.292243957519531, "global_step": 64452, "epoch": 383} {"train_loss": -8.663302421569824, "global_step": 64453, "epoch": 383} {"train_loss": -8.751970291137695, "global_step": 64454, "epoch": 383} {"train_loss": -8.577219009399414, "global_step": 64455, "epoch": 383} {"train_loss": -8.757308959960938, "global_step": 64456, "epoch": 383} {"train_loss": -8.476852416992188, "global_step": 64457, "epoch": 383} {"train_loss": -8.581342697143555, "global_step": 64458, "epoch": 383} {"train_loss": -8.616323471069336, "global_step": 64459, "epoch": 383} {"train_loss": -8.670954704284668, "global_step": 64460, "epoch": 383} {"train_loss": -8.532378196716309, "global_step": 64461, "epoch": 383} {"train_loss": -8.662567138671875, "global_step": 64462, "epoch": 383} {"train_loss": -8.685837745666504, "global_step": 64463, "epoch": 383} {"train_loss": -8.64864730834961, "global_step": 64464, "epoch": 383} {"train_loss": -8.704809188842773, "global_step": 64465, "epoch": 383} {"train_loss": -8.9197359085083, "global_step": 64466, "epoch": 383} {"train_loss": -8.932231903076172, "global_step": 64467, "epoch": 383} {"train_loss": -8.857040405273438, "global_step": 64468, "epoch": 383} {"train_loss": -8.872191429138184, "global_step": 64469, "epoch": 383} {"train_loss": -8.7550687789917, "global_step": 64470, "epoch": 383} {"train_loss": -8.87887954711914, "global_step": 64471, "epoch": 383} {"train_loss": -8.856487274169922, "global_step": 64472, "epoch": 383} {"train_loss": -8.820319175720215, "global_step": 64473, "epoch": 383} {"train_loss": -8.721453666687012, "global_step": 64474, "epoch": 383} {"train_loss": -8.925344467163086, "global_step": 64475, "epoch": 383} {"train_loss": -8.866483688354492, "global_step": 64476, "epoch": 383} {"train_loss": -8.801881790161133, "global_step": 64477, "epoch": 383} {"train_loss": -8.457197189331055, "global_step": 64478, "epoch": 383} {"train_loss": -8.74500846862793, "global_step": 64479, "epoch": 383} {"train_loss": -8.862405776977539, "global_step": 64480, "epoch": 383} {"train_loss": -8.760900497436523, "global_step": 64481, "epoch": 383} {"train_loss": -8.965739250183105, "global_step": 64482, "epoch": 383} {"train_loss": -8.869851112365723, "global_step": 64483, "epoch": 383} {"train_loss": -8.76215648651123, "global_step": 64484, "epoch": 383} {"train_loss": -8.710220336914062, "global_step": 64485, "epoch": 383} {"train_loss": -8.803339004516602, "global_step": 64486, "epoch": 383} {"train_loss": -8.844127655029297, "global_step": 64487, "epoch": 383} {"train_loss": -8.992654800415039, "global_step": 64488, "epoch": 383} {"train_loss": -8.942903518676758, "global_step": 64489, "epoch": 383} {"train_loss": -8.536032676696777, "global_step": 64490, "epoch": 383} {"train_loss": -8.803916931152344, "global_step": 64491, "epoch": 383} {"train_loss": -8.507994651794434, "global_step": 64492, "epoch": 383} {"train_loss": -8.571500778198242, "global_step": 64493, "epoch": 383} {"train_loss": -8.86396598815918, "global_step": 64494, "epoch": 383} {"train_loss": -8.765329360961914, "global_step": 64495, "epoch": 383} {"train_loss": -8.792534828186035, "global_step": 64496, "epoch": 383} {"train_loss": -8.701974868774414, "global_step": 64497, "epoch": 383} {"train_loss": -8.843889236450195, "global_step": 64498, "epoch": 383} {"train_loss": -8.332975387573242, "global_step": 64499, "epoch": 383} {"train_loss": -8.94041633605957, "global_step": 64500, "epoch": 383} {"train_loss": -8.666696548461914, "global_step": 64501, "epoch": 383} {"train_loss": -8.519049644470215, "global_step": 64502, "epoch": 383} {"train_loss": -8.628044128417969, "global_step": 64503, "epoch": 383} {"train_loss": -8.691021919250488, "global_step": 64504, "epoch": 383} {"train_loss": -8.675901412963867, "global_step": 64505, "epoch": 383} {"train_loss": -8.685076713562012, "global_step": 64506, "epoch": 383} {"train_loss": -8.700677871704102, "global_step": 64507, "epoch": 383} {"train_loss": -8.426983833312988, "global_step": 64508, "epoch": 383} {"train_loss": -8.895180702209473, "global_step": 64509, "epoch": 383} {"train_loss": -8.679183959960938, "global_step": 64510, "epoch": 383} {"train_loss": -8.724628221421014, "global_step": 64511, "epoch": 383, "val_loss": 193687.09375} {"train_loss": -8.59280014038086, "global_step": 64512, "epoch": 384} {"train_loss": -9.100021362304688, "global_step": 64513, "epoch": 384} {"train_loss": -8.763006210327148, "global_step": 64514, "epoch": 384} {"train_loss": -8.754020690917969, "global_step": 64515, "epoch": 384} {"train_loss": -8.806602478027344, "global_step": 64516, "epoch": 384} {"train_loss": -8.748636245727539, "global_step": 64517, "epoch": 384} {"train_loss": -8.56541633605957, "global_step": 64518, "epoch": 384} {"train_loss": -8.840517044067383, "global_step": 64519, "epoch": 384} {"train_loss": -8.799331665039062, "global_step": 64520, "epoch": 384} {"train_loss": -8.62492847442627, "global_step": 64521, "epoch": 384} {"train_loss": -8.77617073059082, "global_step": 64522, "epoch": 384} {"train_loss": -8.597076416015625, "global_step": 64523, "epoch": 384} {"train_loss": -8.299888610839844, "global_step": 64524, "epoch": 384} {"train_loss": -8.422128677368164, "global_step": 64525, "epoch": 384} {"train_loss": -8.101858139038086, "global_step": 64526, "epoch": 384} {"train_loss": -8.469600677490234, "global_step": 64527, "epoch": 384} {"train_loss": -8.437152862548828, "global_step": 64528, "epoch": 384} {"train_loss": -8.470966339111328, "global_step": 64529, "epoch": 384} {"train_loss": -8.18419075012207, "global_step": 64530, "epoch": 384} {"train_loss": -8.239173889160156, "global_step": 64531, "epoch": 384} {"train_loss": -8.510391235351562, "global_step": 64532, "epoch": 384} {"train_loss": -8.340335845947266, "global_step": 64533, "epoch": 384} {"train_loss": -8.463729858398438, "global_step": 64534, "epoch": 384} {"train_loss": -8.576910018920898, "global_step": 64535, "epoch": 384} {"train_loss": -8.243431091308594, "global_step": 64536, "epoch": 384} {"train_loss": -8.427532196044922, "global_step": 64537, "epoch": 384} {"train_loss": -8.654108047485352, "global_step": 64538, "epoch": 384} {"train_loss": -8.720451354980469, "global_step": 64539, "epoch": 384} {"train_loss": -8.747443199157715, "global_step": 64540, "epoch": 384} {"train_loss": -8.689884185791016, "global_step": 64541, "epoch": 384} {"train_loss": -8.691452026367188, "global_step": 64542, "epoch": 384} {"train_loss": -8.979328155517578, "global_step": 64543, "epoch": 384} {"train_loss": -8.814979553222656, "global_step": 64544, "epoch": 384} {"train_loss": -8.67569351196289, "global_step": 64545, "epoch": 384} {"train_loss": -8.7805757522583, "global_step": 64546, "epoch": 384} {"train_loss": -8.751293182373047, "global_step": 64547, "epoch": 384} {"train_loss": -8.589208602905273, "global_step": 64548, "epoch": 384} {"train_loss": -8.995914459228516, "global_step": 64549, "epoch": 384} {"train_loss": -8.621118545532227, "global_step": 64550, "epoch": 384} {"train_loss": -8.808439254760742, "global_step": 64551, "epoch": 384} {"train_loss": -8.683399200439453, "global_step": 64552, "epoch": 384} {"train_loss": -8.650896072387695, "global_step": 64553, "epoch": 384} {"train_loss": -8.609952926635742, "global_step": 64554, "epoch": 384} {"train_loss": -8.680543899536133, "global_step": 64555, "epoch": 384} {"train_loss": -8.749364852905273, "global_step": 64556, "epoch": 384} {"train_loss": -8.846000671386719, "global_step": 64557, "epoch": 384} {"train_loss": -8.654911041259766, "global_step": 64558, "epoch": 384} {"train_loss": -8.8494873046875, "global_step": 64559, "epoch": 384} {"train_loss": -8.815535545349121, "global_step": 64560, "epoch": 384} {"train_loss": -8.922852516174316, "global_step": 64561, "epoch": 384} {"train_loss": -8.737076759338379, "global_step": 64562, "epoch": 384} {"train_loss": -9.005672454833984, "global_step": 64563, "epoch": 384} {"train_loss": -8.61536979675293, "global_step": 64564, "epoch": 384} {"train_loss": -8.91779613494873, "global_step": 64565, "epoch": 384} {"train_loss": -8.501986503601074, "global_step": 64566, "epoch": 384} {"train_loss": -8.784842491149902, "global_step": 64567, "epoch": 384} {"train_loss": -8.644697189331055, "global_step": 64568, "epoch": 384} {"train_loss": -9.07597541809082, "global_step": 64569, "epoch": 384} {"train_loss": -8.516483306884766, "global_step": 64570, "epoch": 384} {"train_loss": -8.748275756835938, "global_step": 64571, "epoch": 384} {"train_loss": -8.83837890625, "global_step": 64572, "epoch": 384} {"train_loss": -8.733359336853027, "global_step": 64573, "epoch": 384} {"train_loss": -9.084403991699219, "global_step": 64574, "epoch": 384} {"train_loss": -8.826171875, "global_step": 64575, "epoch": 384} {"train_loss": -8.626848220825195, "global_step": 64576, "epoch": 384} {"train_loss": -8.90277099609375, "global_step": 64577, "epoch": 384} {"train_loss": -8.853921890258789, "global_step": 64578, "epoch": 384} {"train_loss": -8.711753845214844, "global_step": 64579, "epoch": 384} {"train_loss": -8.711389541625977, "global_step": 64580, "epoch": 384} {"train_loss": -8.72156047821045, "global_step": 64581, "epoch": 384} {"train_loss": -8.709413528442383, "global_step": 64582, "epoch": 384} {"train_loss": -8.665430068969727, "global_step": 64583, "epoch": 384} {"train_loss": -8.854196548461914, "global_step": 64584, "epoch": 384} {"train_loss": -8.633543014526367, "global_step": 64585, "epoch": 384} {"train_loss": -8.662830352783203, "global_step": 64586, "epoch": 384} {"train_loss": -8.717613220214844, "global_step": 64587, "epoch": 384} {"train_loss": -8.682210922241211, "global_step": 64588, "epoch": 384} {"train_loss": -8.80898666381836, "global_step": 64589, "epoch": 384} {"train_loss": -8.809694290161133, "global_step": 64590, "epoch": 384} {"train_loss": -8.749958038330078, "global_step": 64591, "epoch": 384} {"train_loss": -8.587929725646973, "global_step": 64592, "epoch": 384} {"train_loss": -8.628779411315918, "global_step": 64593, "epoch": 384} {"train_loss": -8.532524108886719, "global_step": 64594, "epoch": 384} {"train_loss": -8.636768341064453, "global_step": 64595, "epoch": 384} {"train_loss": -8.888120651245117, "global_step": 64596, "epoch": 384} {"train_loss": -8.608831405639648, "global_step": 64597, "epoch": 384} {"train_loss": -8.466462135314941, "global_step": 64598, "epoch": 384} {"train_loss": -8.638347625732422, "global_step": 64599, "epoch": 384} {"train_loss": -8.636829376220703, "global_step": 64600, "epoch": 384} {"train_loss": -8.745180130004883, "global_step": 64601, "epoch": 384} {"train_loss": -8.653081893920898, "global_step": 64602, "epoch": 384} {"train_loss": -8.708620071411133, "global_step": 64603, "epoch": 384} {"train_loss": -8.604312896728516, "global_step": 64604, "epoch": 384} {"train_loss": -8.646990776062012, "global_step": 64605, "epoch": 384} {"train_loss": -8.477642059326172, "global_step": 64606, "epoch": 384} {"train_loss": -8.527633666992188, "global_step": 64607, "epoch": 384} {"train_loss": -8.859152793884277, "global_step": 64608, "epoch": 384} {"train_loss": -8.667343139648438, "global_step": 64609, "epoch": 384} {"train_loss": -8.578839302062988, "global_step": 64610, "epoch": 384} {"train_loss": -8.460683822631836, "global_step": 64611, "epoch": 384} {"train_loss": -8.509745597839355, "global_step": 64612, "epoch": 384} {"train_loss": -8.434040069580078, "global_step": 64613, "epoch": 384} {"train_loss": -8.727651596069336, "global_step": 64614, "epoch": 384} {"train_loss": -8.619190216064453, "global_step": 64615, "epoch": 384} {"train_loss": -8.620094299316406, "global_step": 64616, "epoch": 384} {"train_loss": -8.697663307189941, "global_step": 64617, "epoch": 384} {"train_loss": -8.691617012023926, "global_step": 64618, "epoch": 384} {"train_loss": -8.608427047729492, "global_step": 64619, "epoch": 384} {"train_loss": -8.668378829956055, "global_step": 64620, "epoch": 384} {"train_loss": -8.845977783203125, "global_step": 64621, "epoch": 384} {"train_loss": -8.825493812561035, "global_step": 64622, "epoch": 384} {"train_loss": -8.631794929504395, "global_step": 64623, "epoch": 384} {"train_loss": -8.668851852416992, "global_step": 64624, "epoch": 384} {"train_loss": -8.657855987548828, "global_step": 64625, "epoch": 384} {"train_loss": -8.552026748657227, "global_step": 64626, "epoch": 384} {"train_loss": -8.619865417480469, "global_step": 64627, "epoch": 384} {"train_loss": -8.730216026306152, "global_step": 64628, "epoch": 384} {"train_loss": -8.792972564697266, "global_step": 64629, "epoch": 384} {"train_loss": -8.55107593536377, "global_step": 64630, "epoch": 384} {"train_loss": -8.957101821899414, "global_step": 64631, "epoch": 384} {"train_loss": -8.765233993530273, "global_step": 64632, "epoch": 384} {"train_loss": -8.639142990112305, "global_step": 64633, "epoch": 384} {"train_loss": -8.647994995117188, "global_step": 64634, "epoch": 384} {"train_loss": -8.819883346557617, "global_step": 64635, "epoch": 384} {"train_loss": -8.417388916015625, "global_step": 64636, "epoch": 384} {"train_loss": -8.705280303955078, "global_step": 64637, "epoch": 384} {"train_loss": -8.691540718078613, "global_step": 64638, "epoch": 384} {"train_loss": -8.722471237182617, "global_step": 64639, "epoch": 384} {"train_loss": -8.710700988769531, "global_step": 64640, "epoch": 384} {"train_loss": -8.58934211730957, "global_step": 64641, "epoch": 384} {"train_loss": -8.80340576171875, "global_step": 64642, "epoch": 384} {"train_loss": -8.614160537719727, "global_step": 64643, "epoch": 384} {"train_loss": -8.475922584533691, "global_step": 64644, "epoch": 384} {"train_loss": -9.002790451049805, "global_step": 64645, "epoch": 384} {"train_loss": -8.720516204833984, "global_step": 64646, "epoch": 384} {"train_loss": -8.866294860839844, "global_step": 64647, "epoch": 384} {"train_loss": -8.783893585205078, "global_step": 64648, "epoch": 384} {"train_loss": -8.818578720092773, "global_step": 64649, "epoch": 384} {"train_loss": -8.888879776000977, "global_step": 64650, "epoch": 384} {"train_loss": -8.521455764770508, "global_step": 64651, "epoch": 384} {"train_loss": -8.707281112670898, "global_step": 64652, "epoch": 384} {"train_loss": -8.866724014282227, "global_step": 64653, "epoch": 384} {"train_loss": -8.574668884277344, "global_step": 64654, "epoch": 384} {"train_loss": -8.842611312866211, "global_step": 64655, "epoch": 384} {"train_loss": -8.512923240661621, "global_step": 64656, "epoch": 384} {"train_loss": -8.806511878967285, "global_step": 64657, "epoch": 384} {"train_loss": -8.735343933105469, "global_step": 64658, "epoch": 384} {"train_loss": -8.571454048156738, "global_step": 64659, "epoch": 384} {"train_loss": -8.716841697692871, "global_step": 64660, "epoch": 384} {"train_loss": -9.014819145202637, "global_step": 64661, "epoch": 384} {"train_loss": -8.519675254821777, "global_step": 64662, "epoch": 384} {"train_loss": -8.812313079833984, "global_step": 64663, "epoch": 384} {"train_loss": -8.506815910339355, "global_step": 64664, "epoch": 384} {"train_loss": -8.353815078735352, "global_step": 64665, "epoch": 384} {"train_loss": -8.522794723510742, "global_step": 64666, "epoch": 384} {"train_loss": -8.895012855529785, "global_step": 64667, "epoch": 384} {"train_loss": -8.577485084533691, "global_step": 64668, "epoch": 384} {"train_loss": -8.92684555053711, "global_step": 64669, "epoch": 384} {"train_loss": -8.874549865722656, "global_step": 64670, "epoch": 384} {"train_loss": -8.541973114013672, "global_step": 64671, "epoch": 384} {"train_loss": -8.59466552734375, "global_step": 64672, "epoch": 384} {"train_loss": -8.898218154907227, "global_step": 64673, "epoch": 384} {"train_loss": -8.221834182739258, "global_step": 64674, "epoch": 384} {"train_loss": -9.009720802307129, "global_step": 64675, "epoch": 384} {"train_loss": -8.735429763793945, "global_step": 64676, "epoch": 384} {"train_loss": -8.743236541748047, "global_step": 64677, "epoch": 384} {"train_loss": -8.495656967163086, "global_step": 64678, "epoch": 384} {"train_loss": -8.680487065088181, "global_step": 64679, "epoch": 384, "val_loss": 189594.15625} {"train_loss": -8.477014541625977, "global_step": 64680, "epoch": 385} {"train_loss": -8.623422622680664, "global_step": 64681, "epoch": 385} {"train_loss": -8.793931007385254, "global_step": 64682, "epoch": 385} {"train_loss": -8.440621376037598, "global_step": 64683, "epoch": 385} {"train_loss": -9.034294128417969, "global_step": 64684, "epoch": 385} {"train_loss": -8.825648307800293, "global_step": 64685, "epoch": 385} {"train_loss": -8.400741577148438, "global_step": 64686, "epoch": 385} {"train_loss": -8.600414276123047, "global_step": 64687, "epoch": 385} {"train_loss": -8.697935104370117, "global_step": 64688, "epoch": 385} {"train_loss": -9.004302978515625, "global_step": 64689, "epoch": 385} {"train_loss": -8.771124839782715, "global_step": 64690, "epoch": 385} {"train_loss": -8.773645401000977, "global_step": 64691, "epoch": 385} {"train_loss": -8.750993728637695, "global_step": 64692, "epoch": 385} {"train_loss": -8.55778694152832, "global_step": 64693, "epoch": 385} {"train_loss": -8.547647476196289, "global_step": 64694, "epoch": 385} {"train_loss": -8.789983749389648, "global_step": 64695, "epoch": 385} {"train_loss": -9.101713180541992, "global_step": 64696, "epoch": 385} {"train_loss": -8.70936393737793, "global_step": 64697, "epoch": 385} {"train_loss": -9.058366775512695, "global_step": 64698, "epoch": 385} {"train_loss": -8.897789001464844, "global_step": 64699, "epoch": 385} {"train_loss": -8.72671127319336, "global_step": 64700, "epoch": 385} {"train_loss": -9.027290344238281, "global_step": 64701, "epoch": 385} {"train_loss": -9.04083251953125, "global_step": 64702, "epoch": 385} {"train_loss": -8.889421463012695, "global_step": 64703, "epoch": 385} {"train_loss": -9.000277519226074, "global_step": 64704, "epoch": 385} {"train_loss": -8.823007583618164, "global_step": 64705, "epoch": 385} {"train_loss": -9.034217834472656, "global_step": 64706, "epoch": 385} {"train_loss": -9.125751495361328, "global_step": 64707, "epoch": 385} {"train_loss": -8.95775318145752, "global_step": 64708, "epoch": 385} {"train_loss": -9.063045501708984, "global_step": 64709, "epoch": 385} {"train_loss": -9.048664093017578, "global_step": 64710, "epoch": 385} {"train_loss": -9.09158706665039, "global_step": 64711, "epoch": 385} {"train_loss": -8.873552322387695, "global_step": 64712, "epoch": 385} {"train_loss": -9.28713607788086, "global_step": 64713, "epoch": 385} {"train_loss": -8.930888175964355, "global_step": 64714, "epoch": 385} {"train_loss": -8.909717559814453, "global_step": 64715, "epoch": 385} {"train_loss": -9.095033645629883, "global_step": 64716, "epoch": 385} {"train_loss": -8.817134857177734, "global_step": 64717, "epoch": 385} {"train_loss": -8.965137481689453, "global_step": 64718, "epoch": 385} {"train_loss": -9.120321273803711, "global_step": 64719, "epoch": 385} {"train_loss": -9.234176635742188, "global_step": 64720, "epoch": 385} {"train_loss": -8.93691635131836, "global_step": 64721, "epoch": 385} {"train_loss": -8.738075256347656, "global_step": 64722, "epoch": 385} {"train_loss": -8.990049362182617, "global_step": 64723, "epoch": 385} {"train_loss": -8.816629409790039, "global_step": 64724, "epoch": 385} {"train_loss": -9.322747230529785, "global_step": 64725, "epoch": 385} {"train_loss": -8.71441650390625, "global_step": 64726, "epoch": 385} {"train_loss": -8.979292869567871, "global_step": 64727, "epoch": 385} {"train_loss": -8.873212814331055, "global_step": 64728, "epoch": 385} {"train_loss": -8.791524887084961, "global_step": 64729, "epoch": 385} {"train_loss": -8.700639724731445, "global_step": 64730, "epoch": 385} {"train_loss": -9.00114631652832, "global_step": 64731, "epoch": 385} {"train_loss": -8.359926223754883, "global_step": 64732, "epoch": 385} {"train_loss": -9.08027458190918, "global_step": 64733, "epoch": 385} {"train_loss": -8.655830383300781, "global_step": 64734, "epoch": 385} {"train_loss": -8.855772972106934, "global_step": 64735, "epoch": 385} {"train_loss": -8.298585891723633, "global_step": 64736, "epoch": 385} {"train_loss": -9.001943588256836, "global_step": 64737, "epoch": 385} {"train_loss": -8.773842811584473, "global_step": 64738, "epoch": 385} {"train_loss": -8.631061553955078, "global_step": 64739, "epoch": 385} {"train_loss": -8.813613891601562, "global_step": 64740, "epoch": 385} {"train_loss": -8.653640747070312, "global_step": 64741, "epoch": 385} {"train_loss": -8.828454971313477, "global_step": 64742, "epoch": 385} {"train_loss": -8.519906997680664, "global_step": 64743, "epoch": 385} {"train_loss": -8.584041595458984, "global_step": 64744, "epoch": 385} {"train_loss": -8.581158638000488, "global_step": 64745, "epoch": 385} {"train_loss": -8.529582023620605, "global_step": 64746, "epoch": 385} {"train_loss": -8.75285816192627, "global_step": 64747, "epoch": 385} {"train_loss": -8.471717834472656, "global_step": 64748, "epoch": 385} {"train_loss": -8.688497543334961, "global_step": 64749, "epoch": 385} {"train_loss": -8.7201509475708, "global_step": 64750, "epoch": 385} {"train_loss": -8.569232940673828, "global_step": 64751, "epoch": 385} {"train_loss": -8.358643531799316, "global_step": 64752, "epoch": 385} {"train_loss": -8.646111488342285, "global_step": 64753, "epoch": 385} {"train_loss": -8.700080871582031, "global_step": 64754, "epoch": 385} {"train_loss": -8.400705337524414, "global_step": 64755, "epoch": 385} {"train_loss": -8.76925277709961, "global_step": 64756, "epoch": 385} {"train_loss": -8.939798355102539, "global_step": 64757, "epoch": 385} {"train_loss": -8.751575469970703, "global_step": 64758, "epoch": 385} {"train_loss": -8.631021499633789, "global_step": 64759, "epoch": 385} {"train_loss": -8.743658065795898, "global_step": 64760, "epoch": 385} {"train_loss": -8.57706069946289, "global_step": 64761, "epoch": 385} {"train_loss": -8.61666488647461, "global_step": 64762, "epoch": 385} {"train_loss": -8.648086547851562, "global_step": 64763, "epoch": 385} {"train_loss": -8.75482177734375, "global_step": 64764, "epoch": 385} {"train_loss": -8.819375991821289, "global_step": 64765, "epoch": 385} {"train_loss": -8.747815132141113, "global_step": 64766, "epoch": 385} {"train_loss": -8.724567413330078, "global_step": 64767, "epoch": 385} {"train_loss": -8.404364585876465, "global_step": 64768, "epoch": 385} {"train_loss": -8.82756519317627, "global_step": 64769, "epoch": 385} {"train_loss": -8.667304039001465, "global_step": 64770, "epoch": 385} {"train_loss": -8.762971878051758, "global_step": 64771, "epoch": 385} {"train_loss": -8.733338356018066, "global_step": 64772, "epoch": 385} {"train_loss": -9.078551292419434, "global_step": 64773, "epoch": 385} {"train_loss": -8.537788391113281, "global_step": 64774, "epoch": 385} {"train_loss": -8.354164123535156, "global_step": 64775, "epoch": 385} {"train_loss": -8.486324310302734, "global_step": 64776, "epoch": 385} {"train_loss": -8.750959396362305, "global_step": 64777, "epoch": 385} {"train_loss": -8.4151611328125, "global_step": 64778, "epoch": 385} {"train_loss": -8.858747482299805, "global_step": 64779, "epoch": 385} {"train_loss": -8.631643295288086, "global_step": 64780, "epoch": 385} {"train_loss": -8.569969177246094, "global_step": 64781, "epoch": 385} {"train_loss": -8.612164497375488, "global_step": 64782, "epoch": 385} {"train_loss": -8.681358337402344, "global_step": 64783, "epoch": 385} {"train_loss": -8.670183181762695, "global_step": 64784, "epoch": 385} {"train_loss": -8.547370910644531, "global_step": 64785, "epoch": 385} {"train_loss": -8.494022369384766, "global_step": 64786, "epoch": 385} {"train_loss": -8.92414665222168, "global_step": 64787, "epoch": 385} {"train_loss": -8.7733154296875, "global_step": 64788, "epoch": 385} {"train_loss": -8.746784210205078, "global_step": 64789, "epoch": 385} {"train_loss": -8.755147933959961, "global_step": 64790, "epoch": 385} {"train_loss": -8.559157371520996, "global_step": 64791, "epoch": 385} {"train_loss": -8.542306900024414, "global_step": 64792, "epoch": 385} {"train_loss": -8.783097267150879, "global_step": 64793, "epoch": 385} {"train_loss": -8.764166831970215, "global_step": 64794, "epoch": 385} {"train_loss": -8.375314712524414, "global_step": 64795, "epoch": 385} {"train_loss": -8.551668167114258, "global_step": 64796, "epoch": 385} {"train_loss": -8.58301067352295, "global_step": 64797, "epoch": 385} {"train_loss": -8.668495178222656, "global_step": 64798, "epoch": 385} {"train_loss": -8.286660194396973, "global_step": 64799, "epoch": 385} {"train_loss": -8.435062408447266, "global_step": 64800, "epoch": 385} {"train_loss": -8.516814231872559, "global_step": 64801, "epoch": 385} {"train_loss": -8.690642356872559, "global_step": 64802, "epoch": 385} {"train_loss": -8.577373504638672, "global_step": 64803, "epoch": 385} {"train_loss": -8.627147674560547, "global_step": 64804, "epoch": 385} {"train_loss": -8.43110179901123, "global_step": 64805, "epoch": 385} {"train_loss": -8.614531517028809, "global_step": 64806, "epoch": 385} {"train_loss": -8.360330581665039, "global_step": 64807, "epoch": 385} {"train_loss": -8.572783470153809, "global_step": 64808, "epoch": 385} {"train_loss": -8.627012252807617, "global_step": 64809, "epoch": 385} {"train_loss": -8.649600982666016, "global_step": 64810, "epoch": 385} {"train_loss": -8.708247184753418, "global_step": 64811, "epoch": 385} {"train_loss": -8.709206581115723, "global_step": 64812, "epoch": 385} {"train_loss": -8.940662384033203, "global_step": 64813, "epoch": 385} {"train_loss": -8.840988159179688, "global_step": 64814, "epoch": 385} {"train_loss": -8.79873275756836, "global_step": 64815, "epoch": 385} {"train_loss": -8.676408767700195, "global_step": 64816, "epoch": 385} {"train_loss": -8.772315979003906, "global_step": 64817, "epoch": 385} {"train_loss": -8.94488525390625, "global_step": 64818, "epoch": 385} {"train_loss": -9.01910400390625, "global_step": 64819, "epoch": 385} {"train_loss": -8.91842269897461, "global_step": 64820, "epoch": 385} {"train_loss": -9.084980010986328, "global_step": 64821, "epoch": 385} {"train_loss": -8.799469947814941, "global_step": 64822, "epoch": 385} {"train_loss": -8.786840438842773, "global_step": 64823, "epoch": 385} {"train_loss": -8.792097091674805, "global_step": 64824, "epoch": 385} {"train_loss": -9.023683547973633, "global_step": 64825, "epoch": 385} {"train_loss": -8.585803985595703, "global_step": 64826, "epoch": 385} {"train_loss": -8.687539100646973, "global_step": 64827, "epoch": 385} {"train_loss": -8.823013305664062, "global_step": 64828, "epoch": 385} {"train_loss": -8.73859977722168, "global_step": 64829, "epoch": 385} {"train_loss": -8.912158966064453, "global_step": 64830, "epoch": 385} {"train_loss": -8.608835220336914, "global_step": 64831, "epoch": 385} {"train_loss": -8.883919715881348, "global_step": 64832, "epoch": 385} {"train_loss": -8.849323272705078, "global_step": 64833, "epoch": 385} {"train_loss": -8.75385856628418, "global_step": 64834, "epoch": 385} {"train_loss": -9.105627059936523, "global_step": 64835, "epoch": 385} {"train_loss": -8.798624038696289, "global_step": 64836, "epoch": 385} {"train_loss": -8.959269523620605, "global_step": 64837, "epoch": 385} {"train_loss": -9.000059127807617, "global_step": 64838, "epoch": 385} {"train_loss": -8.908219337463379, "global_step": 64839, "epoch": 385} {"train_loss": -8.951591491699219, "global_step": 64840, "epoch": 385} {"train_loss": -8.94285774230957, "global_step": 64841, "epoch": 385} {"train_loss": -8.721198081970215, "global_step": 64842, "epoch": 385} {"train_loss": -8.871040344238281, "global_step": 64843, "epoch": 385} {"train_loss": -8.700639724731445, "global_step": 64844, "epoch": 385} {"train_loss": -8.746795654296875, "global_step": 64845, "epoch": 385} {"train_loss": -8.53425407409668, "global_step": 64846, "epoch": 385} {"train_loss": -8.755700826644897, "global_step": 64847, "epoch": 385, "val_loss": 193393.9375, "train_action_mse_error": 5.556522369384766} {"train_loss": -8.628376960754395, "global_step": 64848, "epoch": 386} {"train_loss": -8.563764572143555, "global_step": 64849, "epoch": 386} {"train_loss": -8.649761199951172, "global_step": 64850, "epoch": 386} {"train_loss": -8.626497268676758, "global_step": 64851, "epoch": 386} {"train_loss": -8.759382247924805, "global_step": 64852, "epoch": 386} {"train_loss": -8.710227966308594, "global_step": 64853, "epoch": 386} {"train_loss": -8.635221481323242, "global_step": 64854, "epoch": 386} {"train_loss": -8.689411163330078, "global_step": 64855, "epoch": 386} {"train_loss": -8.678996086120605, "global_step": 64856, "epoch": 386} {"train_loss": -8.947813987731934, "global_step": 64857, "epoch": 386} {"train_loss": -8.804883003234863, "global_step": 64858, "epoch": 386} {"train_loss": -8.806314468383789, "global_step": 64859, "epoch": 386} {"train_loss": -8.85650634765625, "global_step": 64860, "epoch": 386} {"train_loss": -8.399271011352539, "global_step": 64861, "epoch": 386} {"train_loss": -8.93067741394043, "global_step": 64862, "epoch": 386} {"train_loss": -8.718238830566406, "global_step": 64863, "epoch": 386} {"train_loss": -8.734366416931152, "global_step": 64864, "epoch": 386} {"train_loss": -8.878803253173828, "global_step": 64865, "epoch": 386} {"train_loss": -8.729869842529297, "global_step": 64866, "epoch": 386} {"train_loss": -8.774322509765625, "global_step": 64867, "epoch": 386} {"train_loss": -8.871060371398926, "global_step": 64868, "epoch": 386} {"train_loss": -8.877732276916504, "global_step": 64869, "epoch": 386} {"train_loss": -9.001794815063477, "global_step": 64870, "epoch": 386} {"train_loss": -8.833564758300781, "global_step": 64871, "epoch": 386} {"train_loss": -8.833012580871582, "global_step": 64872, "epoch": 386} {"train_loss": -8.905241012573242, "global_step": 64873, "epoch": 386} {"train_loss": -9.044673919677734, "global_step": 64874, "epoch": 386} {"train_loss": -8.935675621032715, "global_step": 64875, "epoch": 386} {"train_loss": -9.164518356323242, "global_step": 64876, "epoch": 386} {"train_loss": -8.78644847869873, "global_step": 64877, "epoch": 386} {"train_loss": -8.988188743591309, "global_step": 64878, "epoch": 386} {"train_loss": -9.071304321289062, "global_step": 64879, "epoch": 386} {"train_loss": -9.018264770507812, "global_step": 64880, "epoch": 386} {"train_loss": -8.965359687805176, "global_step": 64881, "epoch": 386} {"train_loss": -8.774603843688965, "global_step": 64882, "epoch": 386} {"train_loss": -8.936600685119629, "global_step": 64883, "epoch": 386} {"train_loss": -8.771722793579102, "global_step": 64884, "epoch": 386} {"train_loss": -8.944586753845215, "global_step": 64885, "epoch": 386} {"train_loss": -9.158065795898438, "global_step": 64886, "epoch": 386} {"train_loss": -8.75265121459961, "global_step": 64887, "epoch": 386} {"train_loss": -9.098444938659668, "global_step": 64888, "epoch": 386} {"train_loss": -8.842315673828125, "global_step": 64889, "epoch": 386} {"train_loss": -8.827150344848633, "global_step": 64890, "epoch": 386} {"train_loss": -8.873300552368164, "global_step": 64891, "epoch": 386} {"train_loss": -8.804420471191406, "global_step": 64892, "epoch": 386} {"train_loss": -8.869739532470703, "global_step": 64893, "epoch": 386} {"train_loss": -8.66711139678955, "global_step": 64894, "epoch": 386} {"train_loss": -8.928821563720703, "global_step": 64895, "epoch": 386} {"train_loss": -8.449756622314453, "global_step": 64896, "epoch": 386} {"train_loss": -8.742229461669922, "global_step": 64897, "epoch": 386} {"train_loss": -8.877453804016113, "global_step": 64898, "epoch": 386} {"train_loss": -8.767793655395508, "global_step": 64899, "epoch": 386} {"train_loss": -8.787847518920898, "global_step": 64900, "epoch": 386} {"train_loss": -8.687386512756348, "global_step": 64901, "epoch": 386} {"train_loss": -8.665813446044922, "global_step": 64902, "epoch": 386} {"train_loss": -8.720296859741211, "global_step": 64903, "epoch": 386} {"train_loss": -8.704681396484375, "global_step": 64904, "epoch": 386} {"train_loss": -8.739304542541504, "global_step": 64905, "epoch": 386} {"train_loss": -8.687472343444824, "global_step": 64906, "epoch": 386} {"train_loss": -8.895669937133789, "global_step": 64907, "epoch": 386} {"train_loss": -8.183128356933594, "global_step": 64908, "epoch": 386} {"train_loss": -8.533235549926758, "global_step": 64909, "epoch": 386} {"train_loss": -8.348773956298828, "global_step": 64910, "epoch": 386} {"train_loss": -8.441181182861328, "global_step": 64911, "epoch": 386} {"train_loss": -8.512422561645508, "global_step": 64912, "epoch": 386} {"train_loss": -8.713096618652344, "global_step": 64913, "epoch": 386} {"train_loss": -8.460747718811035, "global_step": 64914, "epoch": 386} {"train_loss": -8.78389835357666, "global_step": 64915, "epoch": 386} {"train_loss": -8.357046127319336, "global_step": 64916, "epoch": 386} {"train_loss": -8.817102432250977, "global_step": 64917, "epoch": 386} {"train_loss": -8.742353439331055, "global_step": 64918, "epoch": 386} {"train_loss": -8.555002212524414, "global_step": 64919, "epoch": 386} {"train_loss": -8.88044548034668, "global_step": 64920, "epoch": 386} {"train_loss": -8.80892562866211, "global_step": 64921, "epoch": 386} {"train_loss": -8.643455505371094, "global_step": 64922, "epoch": 386} {"train_loss": -8.724157333374023, "global_step": 64923, "epoch": 386} {"train_loss": -8.805792808532715, "global_step": 64924, "epoch": 386} {"train_loss": -8.707662582397461, "global_step": 64925, "epoch": 386} {"train_loss": -8.65780258178711, "global_step": 64926, "epoch": 386} {"train_loss": -8.689044952392578, "global_step": 64927, "epoch": 386} {"train_loss": -8.681699752807617, "global_step": 64928, "epoch": 386} {"train_loss": -8.811727523803711, "global_step": 64929, "epoch": 386} {"train_loss": -8.88632583618164, "global_step": 64930, "epoch": 386} {"train_loss": -8.785541534423828, "global_step": 64931, "epoch": 386} {"train_loss": -8.69052505493164, "global_step": 64932, "epoch": 386} {"train_loss": -8.878023147583008, "global_step": 64933, "epoch": 386} {"train_loss": -8.940078735351562, "global_step": 64934, "epoch": 386} {"train_loss": -8.86762523651123, "global_step": 64935, "epoch": 386} {"train_loss": -8.950724601745605, "global_step": 64936, "epoch": 386} {"train_loss": -9.028334617614746, "global_step": 64937, "epoch": 386} {"train_loss": -8.874893188476562, "global_step": 64938, "epoch": 386} {"train_loss": -8.827999114990234, "global_step": 64939, "epoch": 386} {"train_loss": -8.695929527282715, "global_step": 64940, "epoch": 386} {"train_loss": -8.939191818237305, "global_step": 64941, "epoch": 386} {"train_loss": -8.649177551269531, "global_step": 64942, "epoch": 386} {"train_loss": -8.743431091308594, "global_step": 64943, "epoch": 386} {"train_loss": -8.927824020385742, "global_step": 64944, "epoch": 386} {"train_loss": -8.83224105834961, "global_step": 64945, "epoch": 386} {"train_loss": -8.763223648071289, "global_step": 64946, "epoch": 386} {"train_loss": -8.963167190551758, "global_step": 64947, "epoch": 386} {"train_loss": -8.826778411865234, "global_step": 64948, "epoch": 386} {"train_loss": -8.88057804107666, "global_step": 64949, "epoch": 386} {"train_loss": -8.948843002319336, "global_step": 64950, "epoch": 386} {"train_loss": -8.330272674560547, "global_step": 64951, "epoch": 386} {"train_loss": -9.022562026977539, "global_step": 64952, "epoch": 386} {"train_loss": -8.560579299926758, "global_step": 64953, "epoch": 386} {"train_loss": -8.804608345031738, "global_step": 64954, "epoch": 386} {"train_loss": -8.443750381469727, "global_step": 64955, "epoch": 386} {"train_loss": -8.516946792602539, "global_step": 64956, "epoch": 386} {"train_loss": -8.608034133911133, "global_step": 64957, "epoch": 386} {"train_loss": -8.78414249420166, "global_step": 64958, "epoch": 386} {"train_loss": -8.688789367675781, "global_step": 64959, "epoch": 386} {"train_loss": -8.726461410522461, "global_step": 64960, "epoch": 386} {"train_loss": -8.651517868041992, "global_step": 64961, "epoch": 386} {"train_loss": -8.880792617797852, "global_step": 64962, "epoch": 386} {"train_loss": -8.533402442932129, "global_step": 64963, "epoch": 386} {"train_loss": -8.799884796142578, "global_step": 64964, "epoch": 386} {"train_loss": -8.723953247070312, "global_step": 64965, "epoch": 386} {"train_loss": -8.555952072143555, "global_step": 64966, "epoch": 386} {"train_loss": -8.664407730102539, "global_step": 64967, "epoch": 386} {"train_loss": -8.48630428314209, "global_step": 64968, "epoch": 386} {"train_loss": -8.698213577270508, "global_step": 64969, "epoch": 386} {"train_loss": -8.71238899230957, "global_step": 64970, "epoch": 386} {"train_loss": -8.787243843078613, "global_step": 64971, "epoch": 386} {"train_loss": -8.790830612182617, "global_step": 64972, "epoch": 386} {"train_loss": -8.739599227905273, "global_step": 64973, "epoch": 386} {"train_loss": -8.634437561035156, "global_step": 64974, "epoch": 386} {"train_loss": -8.631601333618164, "global_step": 64975, "epoch": 386} {"train_loss": -8.77523136138916, "global_step": 64976, "epoch": 386} {"train_loss": -8.668620109558105, "global_step": 64977, "epoch": 386} {"train_loss": -8.813470840454102, "global_step": 64978, "epoch": 386} {"train_loss": -8.28005599975586, "global_step": 64979, "epoch": 386} {"train_loss": -9.04742431640625, "global_step": 64980, "epoch": 386} {"train_loss": -8.349213600158691, "global_step": 64981, "epoch": 386} {"train_loss": -8.939785957336426, "global_step": 64982, "epoch": 386} {"train_loss": -8.740129470825195, "global_step": 64983, "epoch": 386} {"train_loss": -8.575767517089844, "global_step": 64984, "epoch": 386} {"train_loss": -8.515420913696289, "global_step": 64985, "epoch": 386} {"train_loss": -8.694132804870605, "global_step": 64986, "epoch": 386} {"train_loss": -8.834314346313477, "global_step": 64987, "epoch": 386} {"train_loss": -8.671791076660156, "global_step": 64988, "epoch": 386} {"train_loss": -8.80877685546875, "global_step": 64989, "epoch": 386} {"train_loss": -8.806291580200195, "global_step": 64990, "epoch": 386} {"train_loss": -8.742843627929688, "global_step": 64991, "epoch": 386} {"train_loss": -8.720407485961914, "global_step": 64992, "epoch": 386} {"train_loss": -8.781699180603027, "global_step": 64993, "epoch": 386} {"train_loss": -8.826844215393066, "global_step": 64994, "epoch": 386} {"train_loss": -8.651212692260742, "global_step": 64995, "epoch": 386} {"train_loss": -8.952754020690918, "global_step": 64996, "epoch": 386} {"train_loss": -8.453621864318848, "global_step": 64997, "epoch": 386} {"train_loss": -8.62353515625, "global_step": 64998, "epoch": 386} {"train_loss": -8.626405715942383, "global_step": 64999, "epoch": 386} {"train_loss": -8.723660469055176, "global_step": 65000, "epoch": 386} {"train_loss": -8.703531265258789, "global_step": 65001, "epoch": 386} {"train_loss": -8.49606704711914, "global_step": 65002, "epoch": 386} {"train_loss": -8.683302879333496, "global_step": 65003, "epoch": 386} {"train_loss": -8.499079704284668, "global_step": 65004, "epoch": 386} {"train_loss": -8.594364166259766, "global_step": 65005, "epoch": 386} {"train_loss": -8.870138168334961, "global_step": 65006, "epoch": 386} {"train_loss": -8.652303695678711, "global_step": 65007, "epoch": 386} {"train_loss": -8.687299728393555, "global_step": 65008, "epoch": 386} {"train_loss": -8.747779846191406, "global_step": 65009, "epoch": 386} {"train_loss": -8.814422607421875, "global_step": 65010, "epoch": 386} {"train_loss": -8.830804824829102, "global_step": 65011, "epoch": 386} {"train_loss": -8.63642692565918, "global_step": 65012, "epoch": 386} {"train_loss": -8.789238929748535, "global_step": 65013, "epoch": 386} {"train_loss": -8.674369812011719, "global_step": 65014, "epoch": 386} {"train_loss": -8.747119091805958, "global_step": 65015, "epoch": 386, "val_loss": 192454.328125} {"train_loss": -9.120248794555664, "global_step": 65016, "epoch": 387} {"train_loss": -8.971746444702148, "global_step": 65017, "epoch": 387} {"train_loss": -8.778156280517578, "global_step": 65018, "epoch": 387} {"train_loss": -9.000720024108887, "global_step": 65019, "epoch": 387} {"train_loss": -8.879575729370117, "global_step": 65020, "epoch": 387} {"train_loss": -8.768611907958984, "global_step": 65021, "epoch": 387} {"train_loss": -8.915497779846191, "global_step": 65022, "epoch": 387} {"train_loss": -8.950368881225586, "global_step": 65023, "epoch": 387} {"train_loss": -8.69898796081543, "global_step": 65024, "epoch": 387} {"train_loss": -8.762571334838867, "global_step": 65025, "epoch": 387} {"train_loss": -8.83398151397705, "global_step": 65026, "epoch": 387} {"train_loss": -8.704137802124023, "global_step": 65027, "epoch": 387} {"train_loss": -8.945552825927734, "global_step": 65028, "epoch": 387} {"train_loss": -8.703269004821777, "global_step": 65029, "epoch": 387} {"train_loss": -8.849367141723633, "global_step": 65030, "epoch": 387} {"train_loss": -8.804996490478516, "global_step": 65031, "epoch": 387} {"train_loss": -8.958379745483398, "global_step": 65032, "epoch": 387} {"train_loss": -8.902168273925781, "global_step": 65033, "epoch": 387} {"train_loss": -8.973535537719727, "global_step": 65034, "epoch": 387} {"train_loss": -8.851888656616211, "global_step": 65035, "epoch": 387} {"train_loss": -8.890304565429688, "global_step": 65036, "epoch": 387} {"train_loss": -8.898574829101562, "global_step": 65037, "epoch": 387} {"train_loss": -8.81425666809082, "global_step": 65038, "epoch": 387} {"train_loss": -8.726337432861328, "global_step": 65039, "epoch": 387} {"train_loss": -8.848832130432129, "global_step": 65040, "epoch": 387} {"train_loss": -8.661818504333496, "global_step": 65041, "epoch": 387} {"train_loss": -8.608850479125977, "global_step": 65042, "epoch": 387} {"train_loss": -8.690377235412598, "global_step": 65043, "epoch": 387} {"train_loss": -8.862015724182129, "global_step": 65044, "epoch": 387} {"train_loss": -8.522648811340332, "global_step": 65045, "epoch": 387} {"train_loss": -8.701364517211914, "global_step": 65046, "epoch": 387} {"train_loss": -8.648307800292969, "global_step": 65047, "epoch": 387} {"train_loss": -8.690271377563477, "global_step": 65048, "epoch": 387} {"train_loss": -8.74643325805664, "global_step": 65049, "epoch": 387} {"train_loss": -8.604963302612305, "global_step": 65050, "epoch": 387} {"train_loss": -8.585016250610352, "global_step": 65051, "epoch": 387} {"train_loss": -8.772905349731445, "global_step": 65052, "epoch": 387} {"train_loss": -8.796600341796875, "global_step": 65053, "epoch": 387} {"train_loss": -8.437124252319336, "global_step": 65054, "epoch": 387} {"train_loss": -8.854957580566406, "global_step": 65055, "epoch": 387} {"train_loss": -8.618782043457031, "global_step": 65056, "epoch": 387} {"train_loss": -8.860331535339355, "global_step": 65057, "epoch": 387} {"train_loss": -8.436275482177734, "global_step": 65058, "epoch": 387} {"train_loss": -8.79178524017334, "global_step": 65059, "epoch": 387} {"train_loss": -8.689579010009766, "global_step": 65060, "epoch": 387} {"train_loss": -8.831306457519531, "global_step": 65061, "epoch": 387} {"train_loss": -8.880138397216797, "global_step": 65062, "epoch": 387} {"train_loss": -8.78860092163086, "global_step": 65063, "epoch": 387} {"train_loss": -8.899252891540527, "global_step": 65064, "epoch": 387} {"train_loss": -8.852514266967773, "global_step": 65065, "epoch": 387} {"train_loss": -9.024842262268066, "global_step": 65066, "epoch": 387} {"train_loss": -9.009963989257812, "global_step": 65067, "epoch": 387} {"train_loss": -8.82022476196289, "global_step": 65068, "epoch": 387} {"train_loss": -8.862520217895508, "global_step": 65069, "epoch": 387} {"train_loss": -8.715200424194336, "global_step": 65070, "epoch": 387} {"train_loss": -8.798177719116211, "global_step": 65071, "epoch": 387} {"train_loss": -8.88430118560791, "global_step": 65072, "epoch": 387} {"train_loss": -8.707296371459961, "global_step": 65073, "epoch": 387} {"train_loss": -8.679646492004395, "global_step": 65074, "epoch": 387} {"train_loss": -8.688780784606934, "global_step": 65075, "epoch": 387} {"train_loss": -8.894500732421875, "global_step": 65076, "epoch": 387} {"train_loss": -8.799089431762695, "global_step": 65077, "epoch": 387} {"train_loss": -8.828680992126465, "global_step": 65078, "epoch": 387} {"train_loss": -8.609757423400879, "global_step": 65079, "epoch": 387} {"train_loss": -8.842966079711914, "global_step": 65080, "epoch": 387} {"train_loss": -8.666889190673828, "global_step": 65081, "epoch": 387} {"train_loss": -8.908227920532227, "global_step": 65082, "epoch": 387} {"train_loss": -8.861599922180176, "global_step": 65083, "epoch": 387} {"train_loss": -8.927867889404297, "global_step": 65084, "epoch": 387} {"train_loss": -8.664018630981445, "global_step": 65085, "epoch": 387} {"train_loss": -8.808916091918945, "global_step": 65086, "epoch": 387} {"train_loss": -8.879615783691406, "global_step": 65087, "epoch": 387} {"train_loss": -9.03200912475586, "global_step": 65088, "epoch": 387} {"train_loss": -8.952754020690918, "global_step": 65089, "epoch": 387} {"train_loss": -8.76153564453125, "global_step": 65090, "epoch": 387} {"train_loss": -8.802270889282227, "global_step": 65091, "epoch": 387} {"train_loss": -8.777387619018555, "global_step": 65092, "epoch": 387} {"train_loss": -8.852633476257324, "global_step": 65093, "epoch": 387} {"train_loss": -8.873722076416016, "global_step": 65094, "epoch": 387} {"train_loss": -8.608570098876953, "global_step": 65095, "epoch": 387} {"train_loss": -8.897806167602539, "global_step": 65096, "epoch": 387} {"train_loss": -8.996219635009766, "global_step": 65097, "epoch": 387} {"train_loss": -8.702119827270508, "global_step": 65098, "epoch": 387} {"train_loss": -8.71674919128418, "global_step": 65099, "epoch": 387} {"train_loss": -8.578527450561523, "global_step": 65100, "epoch": 387} {"train_loss": -8.813350677490234, "global_step": 65101, "epoch": 387} {"train_loss": -8.552278518676758, "global_step": 65102, "epoch": 387} {"train_loss": -8.731956481933594, "global_step": 65103, "epoch": 387} {"train_loss": -8.708824157714844, "global_step": 65104, "epoch": 387} {"train_loss": -8.668512344360352, "global_step": 65105, "epoch": 387} {"train_loss": -8.771926879882812, "global_step": 65106, "epoch": 387} {"train_loss": -8.871834754943848, "global_step": 65107, "epoch": 387} {"train_loss": -8.833866119384766, "global_step": 65108, "epoch": 387} {"train_loss": -8.818567276000977, "global_step": 65109, "epoch": 387} {"train_loss": -8.715778350830078, "global_step": 65110, "epoch": 387} {"train_loss": -8.718158721923828, "global_step": 65111, "epoch": 387} {"train_loss": -8.823978424072266, "global_step": 65112, "epoch": 387} {"train_loss": -8.664775848388672, "global_step": 65113, "epoch": 387} {"train_loss": -8.974712371826172, "global_step": 65114, "epoch": 387} {"train_loss": -8.840498924255371, "global_step": 65115, "epoch": 387} {"train_loss": -8.620113372802734, "global_step": 65116, "epoch": 387} {"train_loss": -9.082578659057617, "global_step": 65117, "epoch": 387} {"train_loss": -8.96345329284668, "global_step": 65118, "epoch": 387} {"train_loss": -8.85988998413086, "global_step": 65119, "epoch": 387} {"train_loss": -8.725885391235352, "global_step": 65120, "epoch": 387} {"train_loss": -8.92544937133789, "global_step": 65121, "epoch": 387} {"train_loss": -8.69668197631836, "global_step": 65122, "epoch": 387} {"train_loss": -8.657191276550293, "global_step": 65123, "epoch": 387} {"train_loss": -8.769062042236328, "global_step": 65124, "epoch": 387} {"train_loss": -8.726128578186035, "global_step": 65125, "epoch": 387} {"train_loss": -8.69117546081543, "global_step": 65126, "epoch": 387} {"train_loss": -9.000057220458984, "global_step": 65127, "epoch": 387} {"train_loss": -8.852519989013672, "global_step": 65128, "epoch": 387} {"train_loss": -8.643614768981934, "global_step": 65129, "epoch": 387} {"train_loss": -8.793378829956055, "global_step": 65130, "epoch": 387} {"train_loss": -8.659052848815918, "global_step": 65131, "epoch": 387} {"train_loss": -8.753032684326172, "global_step": 65132, "epoch": 387} {"train_loss": -8.891231536865234, "global_step": 65133, "epoch": 387} {"train_loss": -8.723087310791016, "global_step": 65134, "epoch": 387} {"train_loss": -8.874975204467773, "global_step": 65135, "epoch": 387} {"train_loss": -8.644878387451172, "global_step": 65136, "epoch": 387} {"train_loss": -8.653375625610352, "global_step": 65137, "epoch": 387} {"train_loss": -8.799397468566895, "global_step": 65138, "epoch": 387} {"train_loss": -8.915742874145508, "global_step": 65139, "epoch": 387} {"train_loss": -8.88180160522461, "global_step": 65140, "epoch": 387} {"train_loss": -8.646361351013184, "global_step": 65141, "epoch": 387} {"train_loss": -8.729591369628906, "global_step": 65142, "epoch": 387} {"train_loss": -8.593286514282227, "global_step": 65143, "epoch": 387} {"train_loss": -8.830697059631348, "global_step": 65144, "epoch": 387} {"train_loss": -8.921807289123535, "global_step": 65145, "epoch": 387} {"train_loss": -8.698909759521484, "global_step": 65146, "epoch": 387} {"train_loss": -8.665904998779297, "global_step": 65147, "epoch": 387} {"train_loss": -8.742795944213867, "global_step": 65148, "epoch": 387} {"train_loss": -8.789766311645508, "global_step": 65149, "epoch": 387} {"train_loss": -8.615537643432617, "global_step": 65150, "epoch": 387} {"train_loss": -9.075357437133789, "global_step": 65151, "epoch": 387} {"train_loss": -8.781913757324219, "global_step": 65152, "epoch": 387} {"train_loss": -8.562939643859863, "global_step": 65153, "epoch": 387} {"train_loss": -8.420809745788574, "global_step": 65154, "epoch": 387} {"train_loss": -8.907502174377441, "global_step": 65155, "epoch": 387} {"train_loss": -8.86373519897461, "global_step": 65156, "epoch": 387} {"train_loss": -8.776793479919434, "global_step": 65157, "epoch": 387} {"train_loss": -8.736326217651367, "global_step": 65158, "epoch": 387} {"train_loss": -8.673011779785156, "global_step": 65159, "epoch": 387} {"train_loss": -8.799589157104492, "global_step": 65160, "epoch": 387} {"train_loss": -8.7269287109375, "global_step": 65161, "epoch": 387} {"train_loss": -8.766885757446289, "global_step": 65162, "epoch": 387} {"train_loss": -8.750505447387695, "global_step": 65163, "epoch": 387} {"train_loss": -8.93155288696289, "global_step": 65164, "epoch": 387} {"train_loss": -8.605762481689453, "global_step": 65165, "epoch": 387} {"train_loss": -8.66270637512207, "global_step": 65166, "epoch": 387} {"train_loss": -8.562074661254883, "global_step": 65167, "epoch": 387} {"train_loss": -8.905357360839844, "global_step": 65168, "epoch": 387} {"train_loss": -8.688602447509766, "global_step": 65169, "epoch": 387} {"train_loss": -8.806760787963867, "global_step": 65170, "epoch": 387} {"train_loss": -8.816893577575684, "global_step": 65171, "epoch": 387} {"train_loss": -8.631467819213867, "global_step": 65172, "epoch": 387} {"train_loss": -8.912759780883789, "global_step": 65173, "epoch": 387} {"train_loss": -9.109130859375, "global_step": 65174, "epoch": 387} {"train_loss": -8.735649108886719, "global_step": 65175, "epoch": 387} {"train_loss": -8.9700288772583, "global_step": 65176, "epoch": 387} {"train_loss": -8.657886505126953, "global_step": 65177, "epoch": 387} {"train_loss": -8.650928497314453, "global_step": 65178, "epoch": 387} {"train_loss": -8.889005661010742, "global_step": 65179, "epoch": 387} {"train_loss": -8.888006210327148, "global_step": 65180, "epoch": 387} {"train_loss": -8.718429565429688, "global_step": 65181, "epoch": 387} {"train_loss": -8.699628829956055, "global_step": 65182, "epoch": 387} {"train_loss": -8.783447958174206, "global_step": 65183, "epoch": 387, "val_loss": 192826.390625} {"train_loss": -8.855169296264648, "global_step": 65184, "epoch": 388} {"train_loss": -8.599641799926758, "global_step": 65185, "epoch": 388} {"train_loss": -8.819276809692383, "global_step": 65186, "epoch": 388} {"train_loss": -8.786271095275879, "global_step": 65187, "epoch": 388} {"train_loss": -9.07004165649414, "global_step": 65188, "epoch": 388} {"train_loss": -8.87607192993164, "global_step": 65189, "epoch": 388} {"train_loss": -8.883136749267578, "global_step": 65190, "epoch": 388} {"train_loss": -8.699466705322266, "global_step": 65191, "epoch": 388} {"train_loss": -7.7945356369018555, "global_step": 65192, "epoch": 388} {"train_loss": -8.792708396911621, "global_step": 65193, "epoch": 388} {"train_loss": -8.678810119628906, "global_step": 65194, "epoch": 388} {"train_loss": -8.701130867004395, "global_step": 65195, "epoch": 388} {"train_loss": -8.86829948425293, "global_step": 65196, "epoch": 388} {"train_loss": -8.53476619720459, "global_step": 65197, "epoch": 388} {"train_loss": -8.757000923156738, "global_step": 65198, "epoch": 388} {"train_loss": -8.811198234558105, "global_step": 65199, "epoch": 388} {"train_loss": -8.60527515411377, "global_step": 65200, "epoch": 388} {"train_loss": -8.75872802734375, "global_step": 65201, "epoch": 388} {"train_loss": -8.687663078308105, "global_step": 65202, "epoch": 388} {"train_loss": -8.679725646972656, "global_step": 65203, "epoch": 388} {"train_loss": -8.703554153442383, "global_step": 65204, "epoch": 388} {"train_loss": -8.394181251525879, "global_step": 65205, "epoch": 388} {"train_loss": -8.536806106567383, "global_step": 65206, "epoch": 388} {"train_loss": -8.575706481933594, "global_step": 65207, "epoch": 388} {"train_loss": -8.861757278442383, "global_step": 65208, "epoch": 388} {"train_loss": -8.858015060424805, "global_step": 65209, "epoch": 388} {"train_loss": -8.741157531738281, "global_step": 65210, "epoch": 388} {"train_loss": -8.731719970703125, "global_step": 65211, "epoch": 388} {"train_loss": -8.730871200561523, "global_step": 65212, "epoch": 388} {"train_loss": -8.723546028137207, "global_step": 65213, "epoch": 388} {"train_loss": -8.644004821777344, "global_step": 65214, "epoch": 388} {"train_loss": -8.795269012451172, "global_step": 65215, "epoch": 388} {"train_loss": -8.64317512512207, "global_step": 65216, "epoch": 388} {"train_loss": -8.911910057067871, "global_step": 65217, "epoch": 388} {"train_loss": -8.531824111938477, "global_step": 65218, "epoch": 388} {"train_loss": -8.859450340270996, "global_step": 65219, "epoch": 388} {"train_loss": -8.600072860717773, "global_step": 65220, "epoch": 388} {"train_loss": -8.88498306274414, "global_step": 65221, "epoch": 388} {"train_loss": -8.908138275146484, "global_step": 65222, "epoch": 388} {"train_loss": -8.922167778015137, "global_step": 65223, "epoch": 388} {"train_loss": -8.807903289794922, "global_step": 65224, "epoch": 388} {"train_loss": -8.903448104858398, "global_step": 65225, "epoch": 388} {"train_loss": -8.68631649017334, "global_step": 65226, "epoch": 388} {"train_loss": -8.833715438842773, "global_step": 65227, "epoch": 388} {"train_loss": -8.6690673828125, "global_step": 65228, "epoch": 388} {"train_loss": -8.660255432128906, "global_step": 65229, "epoch": 388} {"train_loss": -8.618520736694336, "global_step": 65230, "epoch": 388} {"train_loss": -8.458208084106445, "global_step": 65231, "epoch": 388} {"train_loss": -8.741247177124023, "global_step": 65232, "epoch": 388} {"train_loss": -8.649781227111816, "global_step": 65233, "epoch": 388} {"train_loss": -8.533761978149414, "global_step": 65234, "epoch": 388} {"train_loss": -8.469383239746094, "global_step": 65235, "epoch": 388} {"train_loss": -8.665609359741211, "global_step": 65236, "epoch": 388} {"train_loss": -8.641765594482422, "global_step": 65237, "epoch": 388} {"train_loss": -8.34864616394043, "global_step": 65238, "epoch": 388} {"train_loss": -8.90249252319336, "global_step": 65239, "epoch": 388} {"train_loss": -8.697065353393555, "global_step": 65240, "epoch": 388} {"train_loss": -8.681295394897461, "global_step": 65241, "epoch": 388} {"train_loss": -8.914017677307129, "global_step": 65242, "epoch": 388} {"train_loss": -8.852540969848633, "global_step": 65243, "epoch": 388} {"train_loss": -8.683351516723633, "global_step": 65244, "epoch": 388} {"train_loss": -8.660594940185547, "global_step": 65245, "epoch": 388} {"train_loss": -8.713685989379883, "global_step": 65246, "epoch": 388} {"train_loss": -8.820711135864258, "global_step": 65247, "epoch": 388} {"train_loss": -8.732027053833008, "global_step": 65248, "epoch": 388} {"train_loss": -8.781997680664062, "global_step": 65249, "epoch": 388} {"train_loss": -8.82158374786377, "global_step": 65250, "epoch": 388} {"train_loss": -8.598052978515625, "global_step": 65251, "epoch": 388} {"train_loss": -8.663293838500977, "global_step": 65252, "epoch": 388} {"train_loss": -8.707071304321289, "global_step": 65253, "epoch": 388} {"train_loss": -8.735041618347168, "global_step": 65254, "epoch": 388} {"train_loss": -8.993051528930664, "global_step": 65255, "epoch": 388} {"train_loss": -8.817277908325195, "global_step": 65256, "epoch": 388} {"train_loss": -8.818078994750977, "global_step": 65257, "epoch": 388} {"train_loss": -8.94817066192627, "global_step": 65258, "epoch": 388} {"train_loss": -9.112555503845215, "global_step": 65259, "epoch": 388} {"train_loss": -8.957603454589844, "global_step": 65260, "epoch": 388} {"train_loss": -8.913947105407715, "global_step": 65261, "epoch": 388} {"train_loss": -8.927099227905273, "global_step": 65262, "epoch": 388} {"train_loss": -8.986869812011719, "global_step": 65263, "epoch": 388} {"train_loss": -8.993537902832031, "global_step": 65264, "epoch": 388} {"train_loss": -9.010231018066406, "global_step": 65265, "epoch": 388} {"train_loss": -8.8783597946167, "global_step": 65266, "epoch": 388} {"train_loss": -8.3790922164917, "global_step": 65267, "epoch": 388} {"train_loss": -8.617729187011719, "global_step": 65268, "epoch": 388} {"train_loss": -8.561619758605957, "global_step": 65269, "epoch": 388} {"train_loss": -8.617332458496094, "global_step": 65270, "epoch": 388} {"train_loss": -8.454872131347656, "global_step": 65271, "epoch": 388} {"train_loss": -8.698661804199219, "global_step": 65272, "epoch": 388} {"train_loss": -8.89315128326416, "global_step": 65273, "epoch": 388} {"train_loss": -8.782371520996094, "global_step": 65274, "epoch": 388} {"train_loss": -8.62159538269043, "global_step": 65275, "epoch": 388} {"train_loss": -8.857610702514648, "global_step": 65276, "epoch": 388} {"train_loss": -8.818809509277344, "global_step": 65277, "epoch": 388} {"train_loss": -8.82429313659668, "global_step": 65278, "epoch": 388} {"train_loss": -8.921934127807617, "global_step": 65279, "epoch": 388} {"train_loss": -8.544717788696289, "global_step": 65280, "epoch": 388} {"train_loss": -8.708450317382812, "global_step": 65281, "epoch": 388} {"train_loss": -8.728378295898438, "global_step": 65282, "epoch": 388} {"train_loss": -9.040498733520508, "global_step": 65283, "epoch": 388} {"train_loss": -8.620203018188477, "global_step": 65284, "epoch": 388} {"train_loss": -8.640909194946289, "global_step": 65285, "epoch": 388} {"train_loss": -8.662922859191895, "global_step": 65286, "epoch": 388} {"train_loss": -8.935367584228516, "global_step": 65287, "epoch": 388} {"train_loss": -8.627731323242188, "global_step": 65288, "epoch": 388} {"train_loss": -8.646865844726562, "global_step": 65289, "epoch": 388} {"train_loss": -8.618110656738281, "global_step": 65290, "epoch": 388} {"train_loss": -8.805169105529785, "global_step": 65291, "epoch": 388} {"train_loss": -8.635854721069336, "global_step": 65292, "epoch": 388} {"train_loss": -8.60340404510498, "global_step": 65293, "epoch": 388} {"train_loss": -8.627994537353516, "global_step": 65294, "epoch": 388} {"train_loss": -8.72979736328125, "global_step": 65295, "epoch": 388} {"train_loss": -8.85682487487793, "global_step": 65296, "epoch": 388} {"train_loss": -8.719451904296875, "global_step": 65297, "epoch": 388} {"train_loss": -8.847768783569336, "global_step": 65298, "epoch": 388} {"train_loss": -8.85580062866211, "global_step": 65299, "epoch": 388} {"train_loss": -8.70848560333252, "global_step": 65300, "epoch": 388} {"train_loss": -8.858407020568848, "global_step": 65301, "epoch": 388} {"train_loss": -8.843338012695312, "global_step": 65302, "epoch": 388} {"train_loss": -8.60331916809082, "global_step": 65303, "epoch": 388} {"train_loss": -8.672707557678223, "global_step": 65304, "epoch": 388} {"train_loss": -8.938013076782227, "global_step": 65305, "epoch": 388} {"train_loss": -9.050307273864746, "global_step": 65306, "epoch": 388} {"train_loss": -8.816489219665527, "global_step": 65307, "epoch": 388} {"train_loss": -8.953760147094727, "global_step": 65308, "epoch": 388} {"train_loss": -8.884331703186035, "global_step": 65309, "epoch": 388} {"train_loss": -9.01630973815918, "global_step": 65310, "epoch": 388} {"train_loss": -8.941737174987793, "global_step": 65311, "epoch": 388} {"train_loss": -9.040407180786133, "global_step": 65312, "epoch": 388} {"train_loss": -8.907442092895508, "global_step": 65313, "epoch": 388} {"train_loss": -9.120399475097656, "global_step": 65314, "epoch": 388} {"train_loss": -8.855239868164062, "global_step": 65315, "epoch": 388} {"train_loss": -9.062976837158203, "global_step": 65316, "epoch": 388} {"train_loss": -9.070205688476562, "global_step": 65317, "epoch": 388} {"train_loss": -9.03842544555664, "global_step": 65318, "epoch": 388} {"train_loss": -8.880677223205566, "global_step": 65319, "epoch": 388} {"train_loss": -8.952421188354492, "global_step": 65320, "epoch": 388} {"train_loss": -8.917893409729004, "global_step": 65321, "epoch": 388} {"train_loss": -8.789579391479492, "global_step": 65322, "epoch": 388} {"train_loss": -8.815937042236328, "global_step": 65323, "epoch": 388} {"train_loss": -8.94426441192627, "global_step": 65324, "epoch": 388} {"train_loss": -8.760564804077148, "global_step": 65325, "epoch": 388} {"train_loss": -8.734758377075195, "global_step": 65326, "epoch": 388} {"train_loss": -8.759526252746582, "global_step": 65327, "epoch": 388} {"train_loss": -8.731014251708984, "global_step": 65328, "epoch": 388} {"train_loss": -8.915422439575195, "global_step": 65329, "epoch": 388} {"train_loss": -9.068281173706055, "global_step": 65330, "epoch": 388} {"train_loss": -8.969121932983398, "global_step": 65331, "epoch": 388} {"train_loss": -8.847732543945312, "global_step": 65332, "epoch": 388} {"train_loss": -8.943140029907227, "global_step": 65333, "epoch": 388} {"train_loss": -9.162124633789062, "global_step": 65334, "epoch": 388} {"train_loss": -8.879066467285156, "global_step": 65335, "epoch": 388} {"train_loss": -8.816296577453613, "global_step": 65336, "epoch": 388} {"train_loss": -8.854798316955566, "global_step": 65337, "epoch": 388} {"train_loss": -9.026100158691406, "global_step": 65338, "epoch": 388} {"train_loss": -8.451393127441406, "global_step": 65339, "epoch": 388} {"train_loss": -8.901840209960938, "global_step": 65340, "epoch": 388} {"train_loss": -8.64084529876709, "global_step": 65341, "epoch": 388} {"train_loss": -8.782504081726074, "global_step": 65342, "epoch": 388} {"train_loss": -8.822076797485352, "global_step": 65343, "epoch": 388} {"train_loss": -8.542346954345703, "global_step": 65344, "epoch": 388} {"train_loss": -8.801092147827148, "global_step": 65345, "epoch": 388} {"train_loss": -8.864984512329102, "global_step": 65346, "epoch": 388} {"train_loss": -8.629231452941895, "global_step": 65347, "epoch": 388} {"train_loss": -8.625099182128906, "global_step": 65348, "epoch": 388} {"train_loss": -8.520867347717285, "global_step": 65349, "epoch": 388} {"train_loss": -8.510040283203125, "global_step": 65350, "epoch": 388} {"train_loss": -8.768283912113734, "global_step": 65351, "epoch": 388, "val_loss": 190420.515625} {"train_loss": -8.757648468017578, "global_step": 65352, "epoch": 389} {"train_loss": -8.553445816040039, "global_step": 65353, "epoch": 389} {"train_loss": -8.725319862365723, "global_step": 65354, "epoch": 389} {"train_loss": -8.482002258300781, "global_step": 65355, "epoch": 389} {"train_loss": -8.825587272644043, "global_step": 65356, "epoch": 389} {"train_loss": -8.21409797668457, "global_step": 65357, "epoch": 389} {"train_loss": -8.7319974899292, "global_step": 65358, "epoch": 389} {"train_loss": -8.729803085327148, "global_step": 65359, "epoch": 389} {"train_loss": -8.465316772460938, "global_step": 65360, "epoch": 389} {"train_loss": -8.469358444213867, "global_step": 65361, "epoch": 389} {"train_loss": -8.404106140136719, "global_step": 65362, "epoch": 389} {"train_loss": -8.830410957336426, "global_step": 65363, "epoch": 389} {"train_loss": -8.519322395324707, "global_step": 65364, "epoch": 389} {"train_loss": -8.570324897766113, "global_step": 65365, "epoch": 389} {"train_loss": -8.850532531738281, "global_step": 65366, "epoch": 389} {"train_loss": -8.922826766967773, "global_step": 65367, "epoch": 389} {"train_loss": -8.585363388061523, "global_step": 65368, "epoch": 389} {"train_loss": -8.643085479736328, "global_step": 65369, "epoch": 389} {"train_loss": -8.816644668579102, "global_step": 65370, "epoch": 389} {"train_loss": -8.649742126464844, "global_step": 65371, "epoch": 389} {"train_loss": -8.642740249633789, "global_step": 65372, "epoch": 389} {"train_loss": -8.769161224365234, "global_step": 65373, "epoch": 389} {"train_loss": -9.054774284362793, "global_step": 65374, "epoch": 389} {"train_loss": -8.878334045410156, "global_step": 65375, "epoch": 389} {"train_loss": -8.696464538574219, "global_step": 65376, "epoch": 389} {"train_loss": -8.819830894470215, "global_step": 65377, "epoch": 389} {"train_loss": -8.976605415344238, "global_step": 65378, "epoch": 389} {"train_loss": -8.551025390625, "global_step": 65379, "epoch": 389} {"train_loss": -9.034322738647461, "global_step": 65380, "epoch": 389} {"train_loss": -8.752290725708008, "global_step": 65381, "epoch": 389} {"train_loss": -8.995455741882324, "global_step": 65382, "epoch": 389} {"train_loss": -8.771095275878906, "global_step": 65383, "epoch": 389} {"train_loss": -8.740196228027344, "global_step": 65384, "epoch": 389} {"train_loss": -8.833532333374023, "global_step": 65385, "epoch": 389} {"train_loss": -8.553196907043457, "global_step": 65386, "epoch": 389} {"train_loss": -9.011028289794922, "global_step": 65387, "epoch": 389} {"train_loss": -8.928044319152832, "global_step": 65388, "epoch": 389} {"train_loss": -8.746990203857422, "global_step": 65389, "epoch": 389} {"train_loss": -8.913496017456055, "global_step": 65390, "epoch": 389} {"train_loss": -9.04793930053711, "global_step": 65391, "epoch": 389} {"train_loss": -8.914323806762695, "global_step": 65392, "epoch": 389} {"train_loss": -8.817344665527344, "global_step": 65393, "epoch": 389} {"train_loss": -9.008712768554688, "global_step": 65394, "epoch": 389} {"train_loss": -8.612791061401367, "global_step": 65395, "epoch": 389} {"train_loss": -9.158614158630371, "global_step": 65396, "epoch": 389} {"train_loss": -8.492523193359375, "global_step": 65397, "epoch": 389} {"train_loss": -9.054085731506348, "global_step": 65398, "epoch": 389} {"train_loss": -8.633020401000977, "global_step": 65399, "epoch": 389} {"train_loss": -8.876487731933594, "global_step": 65400, "epoch": 389} {"train_loss": -8.853559494018555, "global_step": 65401, "epoch": 389} {"train_loss": -8.820114135742188, "global_step": 65402, "epoch": 389} {"train_loss": -8.735101699829102, "global_step": 65403, "epoch": 389} {"train_loss": -8.861993789672852, "global_step": 65404, "epoch": 389} {"train_loss": -8.560202598571777, "global_step": 65405, "epoch": 389} {"train_loss": -8.914505958557129, "global_step": 65406, "epoch": 389} {"train_loss": -8.76441764831543, "global_step": 65407, "epoch": 389} {"train_loss": -8.812702178955078, "global_step": 65408, "epoch": 389} {"train_loss": -8.837325096130371, "global_step": 65409, "epoch": 389} {"train_loss": -8.855854988098145, "global_step": 65410, "epoch": 389} {"train_loss": -8.824377059936523, "global_step": 65411, "epoch": 389} {"train_loss": -8.759873390197754, "global_step": 65412, "epoch": 389} {"train_loss": -8.67090892791748, "global_step": 65413, "epoch": 389} {"train_loss": -8.687309265136719, "global_step": 65414, "epoch": 389} {"train_loss": -9.096216201782227, "global_step": 65415, "epoch": 389} {"train_loss": -8.870656967163086, "global_step": 65416, "epoch": 389} {"train_loss": -8.83581256866455, "global_step": 65417, "epoch": 389} {"train_loss": -8.991555213928223, "global_step": 65418, "epoch": 389} {"train_loss": -8.59183120727539, "global_step": 65419, "epoch": 389} {"train_loss": -8.916421890258789, "global_step": 65420, "epoch": 389} {"train_loss": -8.99689769744873, "global_step": 65421, "epoch": 389} {"train_loss": -8.997308731079102, "global_step": 65422, "epoch": 389} {"train_loss": -8.869205474853516, "global_step": 65423, "epoch": 389} {"train_loss": -8.665396690368652, "global_step": 65424, "epoch": 389} {"train_loss": -8.490209579467773, "global_step": 65425, "epoch": 389} {"train_loss": -8.900055885314941, "global_step": 65426, "epoch": 389} {"train_loss": -8.793807983398438, "global_step": 65427, "epoch": 389} {"train_loss": -8.544843673706055, "global_step": 65428, "epoch": 389} {"train_loss": -8.765490531921387, "global_step": 65429, "epoch": 389} {"train_loss": -8.777851104736328, "global_step": 65430, "epoch": 389} {"train_loss": -8.66926383972168, "global_step": 65431, "epoch": 389} {"train_loss": -8.68641471862793, "global_step": 65432, "epoch": 389} {"train_loss": -8.584674835205078, "global_step": 65433, "epoch": 389} {"train_loss": -8.788895606994629, "global_step": 65434, "epoch": 389} {"train_loss": -8.51986312866211, "global_step": 65435, "epoch": 389} {"train_loss": -8.9693603515625, "global_step": 65436, "epoch": 389} {"train_loss": -8.86520004272461, "global_step": 65437, "epoch": 389} {"train_loss": -8.974259376525879, "global_step": 65438, "epoch": 389} {"train_loss": -8.894306182861328, "global_step": 65439, "epoch": 389} {"train_loss": -8.936965942382812, "global_step": 65440, "epoch": 389} {"train_loss": -8.835058212280273, "global_step": 65441, "epoch": 389} {"train_loss": -8.905831336975098, "global_step": 65442, "epoch": 389} {"train_loss": -8.97000503540039, "global_step": 65443, "epoch": 389} {"train_loss": -8.868460655212402, "global_step": 65444, "epoch": 389} {"train_loss": -9.01101303100586, "global_step": 65445, "epoch": 389} {"train_loss": -9.1284818649292, "global_step": 65446, "epoch": 389} {"train_loss": -9.210476875305176, "global_step": 65447, "epoch": 389} {"train_loss": -8.926555633544922, "global_step": 65448, "epoch": 389} {"train_loss": -8.742901802062988, "global_step": 65449, "epoch": 389} {"train_loss": -8.939787864685059, "global_step": 65450, "epoch": 389} {"train_loss": -8.77202033996582, "global_step": 65451, "epoch": 389} {"train_loss": -9.000133514404297, "global_step": 65452, "epoch": 389} {"train_loss": -8.928054809570312, "global_step": 65453, "epoch": 389} {"train_loss": -8.954300880432129, "global_step": 65454, "epoch": 389} {"train_loss": -8.86076545715332, "global_step": 65455, "epoch": 389} {"train_loss": -8.765680313110352, "global_step": 65456, "epoch": 389} {"train_loss": -9.148232460021973, "global_step": 65457, "epoch": 389} {"train_loss": -9.142560005187988, "global_step": 65458, "epoch": 389} {"train_loss": -8.683876991271973, "global_step": 65459, "epoch": 389} {"train_loss": -8.806477546691895, "global_step": 65460, "epoch": 389} {"train_loss": -8.827052116394043, "global_step": 65461, "epoch": 389} {"train_loss": -8.801308631896973, "global_step": 65462, "epoch": 389} {"train_loss": -8.85220718383789, "global_step": 65463, "epoch": 389} {"train_loss": -8.822280883789062, "global_step": 65464, "epoch": 389} {"train_loss": -8.7747802734375, "global_step": 65465, "epoch": 389} {"train_loss": -8.892862319946289, "global_step": 65466, "epoch": 389} {"train_loss": -8.584936141967773, "global_step": 65467, "epoch": 389} {"train_loss": -9.051458358764648, "global_step": 65468, "epoch": 389} {"train_loss": -8.638864517211914, "global_step": 65469, "epoch": 389} {"train_loss": -8.804485321044922, "global_step": 65470, "epoch": 389} {"train_loss": -8.809462547302246, "global_step": 65471, "epoch": 389} {"train_loss": -8.861817359924316, "global_step": 65472, "epoch": 389} {"train_loss": -8.796375274658203, "global_step": 65473, "epoch": 389} {"train_loss": -8.561344146728516, "global_step": 65474, "epoch": 389} {"train_loss": -9.014148712158203, "global_step": 65475, "epoch": 389} {"train_loss": -8.8802490234375, "global_step": 65476, "epoch": 389} {"train_loss": -8.831710815429688, "global_step": 65477, "epoch": 389} {"train_loss": -8.888910293579102, "global_step": 65478, "epoch": 389} {"train_loss": -8.929489135742188, "global_step": 65479, "epoch": 389} {"train_loss": -8.795374870300293, "global_step": 65480, "epoch": 389} {"train_loss": -8.985103607177734, "global_step": 65481, "epoch": 389} {"train_loss": -8.651508331298828, "global_step": 65482, "epoch": 389} {"train_loss": -8.597970008850098, "global_step": 65483, "epoch": 389} {"train_loss": -8.68964672088623, "global_step": 65484, "epoch": 389} {"train_loss": -8.688101768493652, "global_step": 65485, "epoch": 389} {"train_loss": -8.356513977050781, "global_step": 65486, "epoch": 389} {"train_loss": -8.647148132324219, "global_step": 65487, "epoch": 389} {"train_loss": -8.1229887008667, "global_step": 65488, "epoch": 389} {"train_loss": -8.85858154296875, "global_step": 65489, "epoch": 389} {"train_loss": -8.5501127243042, "global_step": 65490, "epoch": 389} {"train_loss": -8.688779830932617, "global_step": 65491, "epoch": 389} {"train_loss": -8.340149879455566, "global_step": 65492, "epoch": 389} {"train_loss": -8.715269088745117, "global_step": 65493, "epoch": 389} {"train_loss": -8.697322845458984, "global_step": 65494, "epoch": 389} {"train_loss": -8.504598617553711, "global_step": 65495, "epoch": 389} {"train_loss": -8.559741973876953, "global_step": 65496, "epoch": 389} {"train_loss": -8.795430183410645, "global_step": 65497, "epoch": 389} {"train_loss": -8.588506698608398, "global_step": 65498, "epoch": 389} {"train_loss": -8.77193546295166, "global_step": 65499, "epoch": 389} {"train_loss": -8.485536575317383, "global_step": 65500, "epoch": 389} {"train_loss": -8.743213653564453, "global_step": 65501, "epoch": 389} {"train_loss": -8.833236694335938, "global_step": 65502, "epoch": 389} {"train_loss": -8.63056755065918, "global_step": 65503, "epoch": 389} {"train_loss": -8.75306510925293, "global_step": 65504, "epoch": 389} {"train_loss": -8.706146240234375, "global_step": 65505, "epoch": 389} {"train_loss": -8.649392127990723, "global_step": 65506, "epoch": 389} {"train_loss": -8.611435890197754, "global_step": 65507, "epoch": 389} {"train_loss": -8.657144546508789, "global_step": 65508, "epoch": 389} {"train_loss": -8.576656341552734, "global_step": 65509, "epoch": 389} {"train_loss": -8.824922561645508, "global_step": 65510, "epoch": 389} {"train_loss": -8.698002815246582, "global_step": 65511, "epoch": 389} {"train_loss": -8.816252708435059, "global_step": 65512, "epoch": 389} {"train_loss": -8.682777404785156, "global_step": 65513, "epoch": 389} {"train_loss": -8.838567733764648, "global_step": 65514, "epoch": 389} {"train_loss": -8.866588592529297, "global_step": 65515, "epoch": 389} {"train_loss": -8.823820114135742, "global_step": 65516, "epoch": 389} {"train_loss": -8.921283721923828, "global_step": 65517, "epoch": 389} {"train_loss": -8.701166152954102, "global_step": 65518, "epoch": 389} {"train_loss": -8.775344649950663, "global_step": 65519, "epoch": 389, "val_loss": 192481.71875} {"train_loss": -8.542862892150879, "global_step": 65520, "epoch": 390} {"train_loss": -8.969337463378906, "global_step": 65521, "epoch": 390} {"train_loss": -8.831032752990723, "global_step": 65522, "epoch": 390} {"train_loss": -8.763988494873047, "global_step": 65523, "epoch": 390} {"train_loss": -8.861658096313477, "global_step": 65524, "epoch": 390} {"train_loss": -8.845468521118164, "global_step": 65525, "epoch": 390} {"train_loss": -8.946768760681152, "global_step": 65526, "epoch": 390} {"train_loss": -8.899791717529297, "global_step": 65527, "epoch": 390} {"train_loss": -8.753437042236328, "global_step": 65528, "epoch": 390} {"train_loss": -8.854904174804688, "global_step": 65529, "epoch": 390} {"train_loss": -8.864561080932617, "global_step": 65530, "epoch": 390} {"train_loss": -8.852203369140625, "global_step": 65531, "epoch": 390} {"train_loss": -8.808831214904785, "global_step": 65532, "epoch": 390} {"train_loss": -8.94977855682373, "global_step": 65533, "epoch": 390} {"train_loss": -8.848321914672852, "global_step": 65534, "epoch": 390} {"train_loss": -9.036116600036621, "global_step": 65535, "epoch": 390} {"train_loss": -9.027717590332031, "global_step": 65536, "epoch": 390} {"train_loss": -8.809114456176758, "global_step": 65537, "epoch": 390} {"train_loss": -8.965965270996094, "global_step": 65538, "epoch": 390} {"train_loss": -8.868875503540039, "global_step": 65539, "epoch": 390} {"train_loss": -8.91901969909668, "global_step": 65540, "epoch": 390} {"train_loss": -9.005986213684082, "global_step": 65541, "epoch": 390} {"train_loss": -8.917572021484375, "global_step": 65542, "epoch": 390} {"train_loss": -8.77044677734375, "global_step": 65543, "epoch": 390} {"train_loss": -9.00223159790039, "global_step": 65544, "epoch": 390} {"train_loss": -8.710983276367188, "global_step": 65545, "epoch": 390} {"train_loss": -8.61798095703125, "global_step": 65546, "epoch": 390} {"train_loss": -9.011041641235352, "global_step": 65547, "epoch": 390} {"train_loss": -8.990184783935547, "global_step": 65548, "epoch": 390} {"train_loss": -8.841105461120605, "global_step": 65549, "epoch": 390} {"train_loss": -8.310623168945312, "global_step": 65550, "epoch": 390} {"train_loss": -9.1641263961792, "global_step": 65551, "epoch": 390} {"train_loss": -8.785361289978027, "global_step": 65552, "epoch": 390} {"train_loss": -8.91518783569336, "global_step": 65553, "epoch": 390} {"train_loss": -8.726035118103027, "global_step": 65554, "epoch": 390} {"train_loss": -8.807555198669434, "global_step": 65555, "epoch": 390} {"train_loss": -8.879608154296875, "global_step": 65556, "epoch": 390} {"train_loss": -9.017509460449219, "global_step": 65557, "epoch": 390} {"train_loss": -9.018564224243164, "global_step": 65558, "epoch": 390} {"train_loss": -8.876913070678711, "global_step": 65559, "epoch": 390} {"train_loss": -8.965561866760254, "global_step": 65560, "epoch": 390} {"train_loss": -8.791180610656738, "global_step": 65561, "epoch": 390} {"train_loss": -9.135026931762695, "global_step": 65562, "epoch": 390} {"train_loss": -8.715521812438965, "global_step": 65563, "epoch": 390} {"train_loss": -8.830450057983398, "global_step": 65564, "epoch": 390} {"train_loss": -8.64865493774414, "global_step": 65565, "epoch": 390} {"train_loss": -8.301496505737305, "global_step": 65566, "epoch": 390} {"train_loss": -9.018342018127441, "global_step": 65567, "epoch": 390} {"train_loss": -8.563154220581055, "global_step": 65568, "epoch": 390} {"train_loss": -8.4613676071167, "global_step": 65569, "epoch": 390} {"train_loss": -8.71368408203125, "global_step": 65570, "epoch": 390} {"train_loss": -8.675346374511719, "global_step": 65571, "epoch": 390} {"train_loss": -8.738654136657715, "global_step": 65572, "epoch": 390} {"train_loss": -8.98924732208252, "global_step": 65573, "epoch": 390} {"train_loss": -8.988882064819336, "global_step": 65574, "epoch": 390} {"train_loss": -8.537571907043457, "global_step": 65575, "epoch": 390} {"train_loss": -8.807132720947266, "global_step": 65576, "epoch": 390} {"train_loss": -9.00897216796875, "global_step": 65577, "epoch": 390} {"train_loss": -8.524341583251953, "global_step": 65578, "epoch": 390} {"train_loss": -8.668218612670898, "global_step": 65579, "epoch": 390} {"train_loss": -8.877634048461914, "global_step": 65580, "epoch": 390} {"train_loss": -8.67007064819336, "global_step": 65581, "epoch": 390} {"train_loss": -8.686712265014648, "global_step": 65582, "epoch": 390} {"train_loss": -8.819499969482422, "global_step": 65583, "epoch": 390} {"train_loss": -8.812969207763672, "global_step": 65584, "epoch": 390} {"train_loss": -8.954885482788086, "global_step": 65585, "epoch": 390} {"train_loss": -8.861566543579102, "global_step": 65586, "epoch": 390} {"train_loss": -8.842525482177734, "global_step": 65587, "epoch": 390} {"train_loss": -8.797811508178711, "global_step": 65588, "epoch": 390} {"train_loss": -8.726408958435059, "global_step": 65589, "epoch": 390} {"train_loss": -8.79788589477539, "global_step": 65590, "epoch": 390} {"train_loss": -8.838680267333984, "global_step": 65591, "epoch": 390} {"train_loss": -9.00285816192627, "global_step": 65592, "epoch": 390} {"train_loss": -8.710742950439453, "global_step": 65593, "epoch": 390} {"train_loss": -8.87929916381836, "global_step": 65594, "epoch": 390} {"train_loss": -8.918645858764648, "global_step": 65595, "epoch": 390} {"train_loss": -8.84110164642334, "global_step": 65596, "epoch": 390} {"train_loss": -8.759401321411133, "global_step": 65597, "epoch": 390} {"train_loss": -8.678796768188477, "global_step": 65598, "epoch": 390} {"train_loss": -8.879548072814941, "global_step": 65599, "epoch": 390} {"train_loss": -8.985162734985352, "global_step": 65600, "epoch": 390} {"train_loss": -8.933390617370605, "global_step": 65601, "epoch": 390} {"train_loss": -9.216527938842773, "global_step": 65602, "epoch": 390} {"train_loss": -8.96378231048584, "global_step": 65603, "epoch": 390} {"train_loss": -8.977023124694824, "global_step": 65604, "epoch": 390} {"train_loss": -8.981077194213867, "global_step": 65605, "epoch": 390} {"train_loss": -9.020570755004883, "global_step": 65606, "epoch": 390} {"train_loss": -8.95026969909668, "global_step": 65607, "epoch": 390} {"train_loss": -8.799460411071777, "global_step": 65608, "epoch": 390} {"train_loss": -8.917444229125977, "global_step": 65609, "epoch": 390} {"train_loss": -8.719482421875, "global_step": 65610, "epoch": 390} {"train_loss": -9.04593276977539, "global_step": 65611, "epoch": 390} {"train_loss": -8.984472274780273, "global_step": 65612, "epoch": 390} {"train_loss": -8.608026504516602, "global_step": 65613, "epoch": 390} {"train_loss": -8.837730407714844, "global_step": 65614, "epoch": 390} {"train_loss": -8.793462753295898, "global_step": 65615, "epoch": 390} {"train_loss": -8.8882417678833, "global_step": 65616, "epoch": 390} {"train_loss": -8.909366607666016, "global_step": 65617, "epoch": 390} {"train_loss": -8.907814979553223, "global_step": 65618, "epoch": 390} {"train_loss": -8.745984077453613, "global_step": 65619, "epoch": 390} {"train_loss": -8.721489906311035, "global_step": 65620, "epoch": 390} {"train_loss": -8.745816230773926, "global_step": 65621, "epoch": 390} {"train_loss": -8.708089828491211, "global_step": 65622, "epoch": 390} {"train_loss": -8.374397277832031, "global_step": 65623, "epoch": 390} {"train_loss": -8.932685852050781, "global_step": 65624, "epoch": 390} {"train_loss": -8.770527839660645, "global_step": 65625, "epoch": 390} {"train_loss": -8.831859588623047, "global_step": 65626, "epoch": 390} {"train_loss": -8.687652587890625, "global_step": 65627, "epoch": 390} {"train_loss": -8.80583381652832, "global_step": 65628, "epoch": 390} {"train_loss": -8.955892562866211, "global_step": 65629, "epoch": 390} {"train_loss": -8.917935371398926, "global_step": 65630, "epoch": 390} {"train_loss": -8.92264461517334, "global_step": 65631, "epoch": 390} {"train_loss": -8.948539733886719, "global_step": 65632, "epoch": 390} {"train_loss": -8.496428489685059, "global_step": 65633, "epoch": 390} {"train_loss": -9.08447265625, "global_step": 65634, "epoch": 390} {"train_loss": -8.771499633789062, "global_step": 65635, "epoch": 390} {"train_loss": -9.100165367126465, "global_step": 65636, "epoch": 390} {"train_loss": -8.835943222045898, "global_step": 65637, "epoch": 390} {"train_loss": -8.934683799743652, "global_step": 65638, "epoch": 390} {"train_loss": -9.046318054199219, "global_step": 65639, "epoch": 390} {"train_loss": -8.610333442687988, "global_step": 65640, "epoch": 390} {"train_loss": -8.890256881713867, "global_step": 65641, "epoch": 390} {"train_loss": -8.99888801574707, "global_step": 65642, "epoch": 390} {"train_loss": -8.70724105834961, "global_step": 65643, "epoch": 390} {"train_loss": -8.92694091796875, "global_step": 65644, "epoch": 390} {"train_loss": -8.794881820678711, "global_step": 65645, "epoch": 390} {"train_loss": -8.843820571899414, "global_step": 65646, "epoch": 390} {"train_loss": -9.011676788330078, "global_step": 65647, "epoch": 390} {"train_loss": -8.847051620483398, "global_step": 65648, "epoch": 390} {"train_loss": -9.163376808166504, "global_step": 65649, "epoch": 390} {"train_loss": -8.80821704864502, "global_step": 65650, "epoch": 390} {"train_loss": -8.823254585266113, "global_step": 65651, "epoch": 390} {"train_loss": -9.138729095458984, "global_step": 65652, "epoch": 390} {"train_loss": -8.84140396118164, "global_step": 65653, "epoch": 390} {"train_loss": -8.525430679321289, "global_step": 65654, "epoch": 390} {"train_loss": -8.730317115783691, "global_step": 65655, "epoch": 390} {"train_loss": -8.785113334655762, "global_step": 65656, "epoch": 390} {"train_loss": -8.946901321411133, "global_step": 65657, "epoch": 390} {"train_loss": -8.62332534790039, "global_step": 65658, "epoch": 390} {"train_loss": -8.677896499633789, "global_step": 65659, "epoch": 390} {"train_loss": -8.802403450012207, "global_step": 65660, "epoch": 390} {"train_loss": -8.790380477905273, "global_step": 65661, "epoch": 390} {"train_loss": -8.776330947875977, "global_step": 65662, "epoch": 390} {"train_loss": -8.79806900024414, "global_step": 65663, "epoch": 390} {"train_loss": -8.715094566345215, "global_step": 65664, "epoch": 390} {"train_loss": -8.598974227905273, "global_step": 65665, "epoch": 390} {"train_loss": -8.763259887695312, "global_step": 65666, "epoch": 390} {"train_loss": -8.697896957397461, "global_step": 65667, "epoch": 390} {"train_loss": -8.59722900390625, "global_step": 65668, "epoch": 390} {"train_loss": -8.608492851257324, "global_step": 65669, "epoch": 390} {"train_loss": -8.80040168762207, "global_step": 65670, "epoch": 390} {"train_loss": -8.521724700927734, "global_step": 65671, "epoch": 390} {"train_loss": -8.669333457946777, "global_step": 65672, "epoch": 390} {"train_loss": -8.776269912719727, "global_step": 65673, "epoch": 390} {"train_loss": -8.754980087280273, "global_step": 65674, "epoch": 390} {"train_loss": -8.50551986694336, "global_step": 65675, "epoch": 390} {"train_loss": -8.70071029663086, "global_step": 65676, "epoch": 390} {"train_loss": -8.698680877685547, "global_step": 65677, "epoch": 390} {"train_loss": -8.594053268432617, "global_step": 65678, "epoch": 390} {"train_loss": -8.380788803100586, "global_step": 65679, "epoch": 390} {"train_loss": -8.689208030700684, "global_step": 65680, "epoch": 390} {"train_loss": -8.454425811767578, "global_step": 65681, "epoch": 390} {"train_loss": -8.850777626037598, "global_step": 65682, "epoch": 390} {"train_loss": -8.684284210205078, "global_step": 65683, "epoch": 390} {"train_loss": -8.790285110473633, "global_step": 65684, "epoch": 390} {"train_loss": -9.05843734741211, "global_step": 65685, "epoch": 390} {"train_loss": -8.785009384155273, "global_step": 65686, "epoch": 390} {"train_loss": -8.816117059616815, "global_step": 65687, "epoch": 390, "val_loss": 192939.984375, "train_action_mse_error": 6.284187316894531} {"train_loss": -8.959207534790039, "global_step": 65688, "epoch": 391} {"train_loss": -8.747976303100586, "global_step": 65689, "epoch": 391} {"train_loss": -8.807538032531738, "global_step": 65690, "epoch": 391} {"train_loss": -8.936426162719727, "global_step": 65691, "epoch": 391} {"train_loss": -8.80732536315918, "global_step": 65692, "epoch": 391} {"train_loss": -8.68838119506836, "global_step": 65693, "epoch": 391} {"train_loss": -8.724705696105957, "global_step": 65694, "epoch": 391} {"train_loss": -9.038691520690918, "global_step": 65695, "epoch": 391} {"train_loss": -8.544029235839844, "global_step": 65696, "epoch": 391} {"train_loss": -8.960580825805664, "global_step": 65697, "epoch": 391} {"train_loss": -8.924824714660645, "global_step": 65698, "epoch": 391} {"train_loss": -8.526655197143555, "global_step": 65699, "epoch": 391} {"train_loss": -8.541860580444336, "global_step": 65700, "epoch": 391} {"train_loss": -8.913073539733887, "global_step": 65701, "epoch": 391} {"train_loss": -8.860064506530762, "global_step": 65702, "epoch": 391} {"train_loss": -8.625748634338379, "global_step": 65703, "epoch": 391} {"train_loss": -8.944690704345703, "global_step": 65704, "epoch": 391} {"train_loss": -8.806459426879883, "global_step": 65705, "epoch": 391} {"train_loss": -8.514880180358887, "global_step": 65706, "epoch": 391} {"train_loss": -8.843090057373047, "global_step": 65707, "epoch": 391} {"train_loss": -8.589987754821777, "global_step": 65708, "epoch": 391} {"train_loss": -8.705543518066406, "global_step": 65709, "epoch": 391} {"train_loss": -8.914737701416016, "global_step": 65710, "epoch": 391} {"train_loss": -8.897507667541504, "global_step": 65711, "epoch": 391} {"train_loss": -9.034257888793945, "global_step": 65712, "epoch": 391} {"train_loss": -8.630325317382812, "global_step": 65713, "epoch": 391} {"train_loss": -8.77424430847168, "global_step": 65714, "epoch": 391} {"train_loss": -8.967248916625977, "global_step": 65715, "epoch": 391} {"train_loss": -8.862493515014648, "global_step": 65716, "epoch": 391} {"train_loss": -8.812835693359375, "global_step": 65717, "epoch": 391} {"train_loss": -8.756298065185547, "global_step": 65718, "epoch": 391} {"train_loss": -8.51883602142334, "global_step": 65719, "epoch": 391} {"train_loss": -8.75407886505127, "global_step": 65720, "epoch": 391} {"train_loss": -8.627472877502441, "global_step": 65721, "epoch": 391} {"train_loss": -8.87446403503418, "global_step": 65722, "epoch": 391} {"train_loss": -8.804330825805664, "global_step": 65723, "epoch": 391} {"train_loss": -8.863276481628418, "global_step": 65724, "epoch": 391} {"train_loss": -8.7804536819458, "global_step": 65725, "epoch": 391} {"train_loss": -8.761427879333496, "global_step": 65726, "epoch": 391} {"train_loss": -8.647293090820312, "global_step": 65727, "epoch": 391} {"train_loss": -8.819075584411621, "global_step": 65728, "epoch": 391} {"train_loss": -8.828546524047852, "global_step": 65729, "epoch": 391} {"train_loss": -8.624284744262695, "global_step": 65730, "epoch": 391} {"train_loss": -8.548036575317383, "global_step": 65731, "epoch": 391} {"train_loss": -8.699373245239258, "global_step": 65732, "epoch": 391} {"train_loss": -8.846261024475098, "global_step": 65733, "epoch": 391} {"train_loss": -9.02530288696289, "global_step": 65734, "epoch": 391} {"train_loss": -8.662324905395508, "global_step": 65735, "epoch": 391} {"train_loss": -8.713645935058594, "global_step": 65736, "epoch": 391} {"train_loss": -8.793811798095703, "global_step": 65737, "epoch": 391} {"train_loss": -8.806768417358398, "global_step": 65738, "epoch": 391} {"train_loss": -8.968005180358887, "global_step": 65739, "epoch": 391} {"train_loss": -8.906103134155273, "global_step": 65740, "epoch": 391} {"train_loss": -8.833093643188477, "global_step": 65741, "epoch": 391} {"train_loss": -9.020380020141602, "global_step": 65742, "epoch": 391} {"train_loss": -8.817956924438477, "global_step": 65743, "epoch": 391} {"train_loss": -8.795564651489258, "global_step": 65744, "epoch": 391} {"train_loss": -8.984981536865234, "global_step": 65745, "epoch": 391} {"train_loss": -9.080544471740723, "global_step": 65746, "epoch": 391} {"train_loss": -8.847043991088867, "global_step": 65747, "epoch": 391} {"train_loss": -8.779596328735352, "global_step": 65748, "epoch": 391} {"train_loss": -8.970321655273438, "global_step": 65749, "epoch": 391} {"train_loss": -9.02529525756836, "global_step": 65750, "epoch": 391} {"train_loss": -8.788963317871094, "global_step": 65751, "epoch": 391} {"train_loss": -8.763313293457031, "global_step": 65752, "epoch": 391} {"train_loss": -8.638201713562012, "global_step": 65753, "epoch": 391} {"train_loss": -8.699902534484863, "global_step": 65754, "epoch": 391} {"train_loss": -9.048731803894043, "global_step": 65755, "epoch": 391} {"train_loss": -8.514375686645508, "global_step": 65756, "epoch": 391} {"train_loss": -8.599966049194336, "global_step": 65757, "epoch": 391} {"train_loss": -8.607425689697266, "global_step": 65758, "epoch": 391} {"train_loss": -8.884239196777344, "global_step": 65759, "epoch": 391} {"train_loss": -8.799982070922852, "global_step": 65760, "epoch": 391} {"train_loss": -8.722817420959473, "global_step": 65761, "epoch": 391} {"train_loss": -8.63979721069336, "global_step": 65762, "epoch": 391} {"train_loss": -8.691429138183594, "global_step": 65763, "epoch": 391} {"train_loss": -8.53335952758789, "global_step": 65764, "epoch": 391} {"train_loss": -8.655858993530273, "global_step": 65765, "epoch": 391} {"train_loss": -8.890289306640625, "global_step": 65766, "epoch": 391} {"train_loss": -8.415168762207031, "global_step": 65767, "epoch": 391} {"train_loss": -8.708383560180664, "global_step": 65768, "epoch": 391} {"train_loss": -8.407838821411133, "global_step": 65769, "epoch": 391} {"train_loss": -8.766411781311035, "global_step": 65770, "epoch": 391} {"train_loss": -8.471099853515625, "global_step": 65771, "epoch": 391} {"train_loss": -8.559440612792969, "global_step": 65772, "epoch": 391} {"train_loss": -8.390998840332031, "global_step": 65773, "epoch": 391} {"train_loss": -8.227224349975586, "global_step": 65774, "epoch": 391} {"train_loss": -8.388452529907227, "global_step": 65775, "epoch": 391} {"train_loss": -8.709461212158203, "global_step": 65776, "epoch": 391} {"train_loss": -8.270849227905273, "global_step": 65777, "epoch": 391} {"train_loss": -8.811590194702148, "global_step": 65778, "epoch": 391} {"train_loss": -8.232667922973633, "global_step": 65779, "epoch": 391} {"train_loss": -8.652128219604492, "global_step": 65780, "epoch": 391} {"train_loss": -8.583385467529297, "global_step": 65781, "epoch": 391} {"train_loss": -8.654632568359375, "global_step": 65782, "epoch": 391} {"train_loss": -8.764043807983398, "global_step": 65783, "epoch": 391} {"train_loss": -8.571807861328125, "global_step": 65784, "epoch": 391} {"train_loss": -8.744495391845703, "global_step": 65785, "epoch": 391} {"train_loss": -8.581241607666016, "global_step": 65786, "epoch": 391} {"train_loss": -8.849870681762695, "global_step": 65787, "epoch": 391} {"train_loss": -8.548856735229492, "global_step": 65788, "epoch": 391} {"train_loss": -8.563179969787598, "global_step": 65789, "epoch": 391} {"train_loss": -8.913366317749023, "global_step": 65790, "epoch": 391} {"train_loss": -8.642431259155273, "global_step": 65791, "epoch": 391} {"train_loss": -8.660028457641602, "global_step": 65792, "epoch": 391} {"train_loss": -8.555411338806152, "global_step": 65793, "epoch": 391} {"train_loss": -8.750123977661133, "global_step": 65794, "epoch": 391} {"train_loss": -8.508260726928711, "global_step": 65795, "epoch": 391} {"train_loss": -8.782451629638672, "global_step": 65796, "epoch": 391} {"train_loss": -8.783116340637207, "global_step": 65797, "epoch": 391} {"train_loss": -8.734612464904785, "global_step": 65798, "epoch": 391} {"train_loss": -8.823105812072754, "global_step": 65799, "epoch": 391} {"train_loss": -8.630595207214355, "global_step": 65800, "epoch": 391} {"train_loss": -8.86631965637207, "global_step": 65801, "epoch": 391} {"train_loss": -8.530210494995117, "global_step": 65802, "epoch": 391} {"train_loss": -8.957748413085938, "global_step": 65803, "epoch": 391} {"train_loss": -8.60390853881836, "global_step": 65804, "epoch": 391} {"train_loss": -8.816404342651367, "global_step": 65805, "epoch": 391} {"train_loss": -8.598187446594238, "global_step": 65806, "epoch": 391} {"train_loss": -8.84982967376709, "global_step": 65807, "epoch": 391} {"train_loss": -8.560615539550781, "global_step": 65808, "epoch": 391} {"train_loss": -8.727274894714355, "global_step": 65809, "epoch": 391} {"train_loss": -8.408956527709961, "global_step": 65810, "epoch": 391} {"train_loss": -8.632344245910645, "global_step": 65811, "epoch": 391} {"train_loss": -8.876394271850586, "global_step": 65812, "epoch": 391} {"train_loss": -8.559867858886719, "global_step": 65813, "epoch": 391} {"train_loss": -8.737552642822266, "global_step": 65814, "epoch": 391} {"train_loss": -8.701750755310059, "global_step": 65815, "epoch": 391} {"train_loss": -8.812518119812012, "global_step": 65816, "epoch": 391} {"train_loss": -8.240927696228027, "global_step": 65817, "epoch": 391} {"train_loss": -8.909862518310547, "global_step": 65818, "epoch": 391} {"train_loss": -8.647679328918457, "global_step": 65819, "epoch": 391} {"train_loss": -8.585936546325684, "global_step": 65820, "epoch": 391} {"train_loss": -8.437095642089844, "global_step": 65821, "epoch": 391} {"train_loss": -8.460105895996094, "global_step": 65822, "epoch": 391} {"train_loss": -8.540563583374023, "global_step": 65823, "epoch": 391} {"train_loss": -8.628828048706055, "global_step": 65824, "epoch": 391} {"train_loss": -8.757650375366211, "global_step": 65825, "epoch": 391} {"train_loss": -8.532068252563477, "global_step": 65826, "epoch": 391} {"train_loss": -8.771129608154297, "global_step": 65827, "epoch": 391} {"train_loss": -8.627311706542969, "global_step": 65828, "epoch": 391} {"train_loss": -8.861298561096191, "global_step": 65829, "epoch": 391} {"train_loss": -8.536314010620117, "global_step": 65830, "epoch": 391} {"train_loss": -8.762876510620117, "global_step": 65831, "epoch": 391} {"train_loss": -8.733625411987305, "global_step": 65832, "epoch": 391} {"train_loss": -8.888607025146484, "global_step": 65833, "epoch": 391} {"train_loss": -8.637746810913086, "global_step": 65834, "epoch": 391} {"train_loss": -8.67633056640625, "global_step": 65835, "epoch": 391} {"train_loss": -8.809328079223633, "global_step": 65836, "epoch": 391} {"train_loss": -8.660581588745117, "global_step": 65837, "epoch": 391} {"train_loss": -8.70663070678711, "global_step": 65838, "epoch": 391} {"train_loss": -9.071073532104492, "global_step": 65839, "epoch": 391} {"train_loss": -8.970646858215332, "global_step": 65840, "epoch": 391} {"train_loss": -8.868871688842773, "global_step": 65841, "epoch": 391} {"train_loss": -8.85218620300293, "global_step": 65842, "epoch": 391} {"train_loss": -8.761420249938965, "global_step": 65843, "epoch": 391} {"train_loss": -8.46872615814209, "global_step": 65844, "epoch": 391} {"train_loss": -8.53420639038086, "global_step": 65845, "epoch": 391} {"train_loss": -8.624267578125, "global_step": 65846, "epoch": 391} {"train_loss": -8.712837219238281, "global_step": 65847, "epoch": 391} {"train_loss": -8.97782039642334, "global_step": 65848, "epoch": 391} {"train_loss": -8.77564811706543, "global_step": 65849, "epoch": 391} {"train_loss": -8.87639045715332, "global_step": 65850, "epoch": 391} {"train_loss": -8.935084342956543, "global_step": 65851, "epoch": 391} {"train_loss": -8.97816276550293, "global_step": 65852, "epoch": 391} {"train_loss": -9.01345443725586, "global_step": 65853, "epoch": 391} {"train_loss": -8.866589546203613, "global_step": 65854, "epoch": 391} {"train_loss": -8.728349583489555, "global_step": 65855, "epoch": 391, "val_loss": 191143.359375} {"train_loss": -8.380674362182617, "global_step": 65856, "epoch": 392} {"train_loss": -8.940102577209473, "global_step": 65857, "epoch": 392} {"train_loss": -8.395949363708496, "global_step": 65858, "epoch": 392} {"train_loss": -8.557792663574219, "global_step": 65859, "epoch": 392} {"train_loss": -8.638565063476562, "global_step": 65860, "epoch": 392} {"train_loss": -8.787359237670898, "global_step": 65861, "epoch": 392} {"train_loss": -8.739181518554688, "global_step": 65862, "epoch": 392} {"train_loss": -8.648489952087402, "global_step": 65863, "epoch": 392} {"train_loss": -8.752321243286133, "global_step": 65864, "epoch": 392} {"train_loss": -8.598447799682617, "global_step": 65865, "epoch": 392} {"train_loss": -8.792888641357422, "global_step": 65866, "epoch": 392} {"train_loss": -8.776948928833008, "global_step": 65867, "epoch": 392} {"train_loss": -8.699624061584473, "global_step": 65868, "epoch": 392} {"train_loss": -8.880660057067871, "global_step": 65869, "epoch": 392} {"train_loss": -8.737770080566406, "global_step": 65870, "epoch": 392} {"train_loss": -8.872833251953125, "global_step": 65871, "epoch": 392} {"train_loss": -8.840657234191895, "global_step": 65872, "epoch": 392} {"train_loss": -8.999833106994629, "global_step": 65873, "epoch": 392} {"train_loss": -8.826700210571289, "global_step": 65874, "epoch": 392} {"train_loss": -8.848003387451172, "global_step": 65875, "epoch": 392} {"train_loss": -8.765323638916016, "global_step": 65876, "epoch": 392} {"train_loss": -8.931796073913574, "global_step": 65877, "epoch": 392} {"train_loss": -8.926319122314453, "global_step": 65878, "epoch": 392} {"train_loss": -8.740676879882812, "global_step": 65879, "epoch": 392} {"train_loss": -8.848642349243164, "global_step": 65880, "epoch": 392} {"train_loss": -8.89256763458252, "global_step": 65881, "epoch": 392} {"train_loss": -8.625555038452148, "global_step": 65882, "epoch": 392} {"train_loss": -8.634928703308105, "global_step": 65883, "epoch": 392} {"train_loss": -8.737653732299805, "global_step": 65884, "epoch": 392} {"train_loss": -8.860503196716309, "global_step": 65885, "epoch": 392} {"train_loss": -8.379138946533203, "global_step": 65886, "epoch": 392} {"train_loss": -8.78211784362793, "global_step": 65887, "epoch": 392} {"train_loss": -8.558679580688477, "global_step": 65888, "epoch": 392} {"train_loss": -8.888152122497559, "global_step": 65889, "epoch": 392} {"train_loss": -8.672386169433594, "global_step": 65890, "epoch": 392} {"train_loss": -8.642192840576172, "global_step": 65891, "epoch": 392} {"train_loss": -8.787216186523438, "global_step": 65892, "epoch": 392} {"train_loss": -8.398553848266602, "global_step": 65893, "epoch": 392} {"train_loss": -8.434393882751465, "global_step": 65894, "epoch": 392} {"train_loss": -8.762840270996094, "global_step": 65895, "epoch": 392} {"train_loss": -8.221643447875977, "global_step": 65896, "epoch": 392} {"train_loss": -8.41490650177002, "global_step": 65897, "epoch": 392} {"train_loss": -8.786056518554688, "global_step": 65898, "epoch": 392} {"train_loss": -8.505739212036133, "global_step": 65899, "epoch": 392} {"train_loss": -8.658360481262207, "global_step": 65900, "epoch": 392} {"train_loss": -8.386371612548828, "global_step": 65901, "epoch": 392} {"train_loss": -8.696769714355469, "global_step": 65902, "epoch": 392} {"train_loss": -8.532636642456055, "global_step": 65903, "epoch": 392} {"train_loss": -8.71776008605957, "global_step": 65904, "epoch": 392} {"train_loss": -8.454778671264648, "global_step": 65905, "epoch": 392} {"train_loss": -8.65310001373291, "global_step": 65906, "epoch": 392} {"train_loss": -8.716676712036133, "global_step": 65907, "epoch": 392} {"train_loss": -8.75261116027832, "global_step": 65908, "epoch": 392} {"train_loss": -8.330322265625, "global_step": 65909, "epoch": 392} {"train_loss": -8.752845764160156, "global_step": 65910, "epoch": 392} {"train_loss": -8.62742805480957, "global_step": 65911, "epoch": 392} {"train_loss": -8.394500732421875, "global_step": 65912, "epoch": 392} {"train_loss": -8.675867080688477, "global_step": 65913, "epoch": 392} {"train_loss": -8.792540550231934, "global_step": 65914, "epoch": 392} {"train_loss": -8.599796295166016, "global_step": 65915, "epoch": 392} {"train_loss": -8.747541427612305, "global_step": 65916, "epoch": 392} {"train_loss": -8.78713321685791, "global_step": 65917, "epoch": 392} {"train_loss": -8.798951148986816, "global_step": 65918, "epoch": 392} {"train_loss": -8.765788078308105, "global_step": 65919, "epoch": 392} {"train_loss": -8.686580657958984, "global_step": 65920, "epoch": 392} {"train_loss": -8.688444137573242, "global_step": 65921, "epoch": 392} {"train_loss": -9.002790451049805, "global_step": 65922, "epoch": 392} {"train_loss": -8.67928695678711, "global_step": 65923, "epoch": 392} {"train_loss": -8.667003631591797, "global_step": 65924, "epoch": 392} {"train_loss": -8.761474609375, "global_step": 65925, "epoch": 392} {"train_loss": -8.800326347351074, "global_step": 65926, "epoch": 392} {"train_loss": -8.783612251281738, "global_step": 65927, "epoch": 392} {"train_loss": -8.696678161621094, "global_step": 65928, "epoch": 392} {"train_loss": -8.842058181762695, "global_step": 65929, "epoch": 392} {"train_loss": -8.963987350463867, "global_step": 65930, "epoch": 392} {"train_loss": -8.752223014831543, "global_step": 65931, "epoch": 392} {"train_loss": -8.729907035827637, "global_step": 65932, "epoch": 392} {"train_loss": -8.739707946777344, "global_step": 65933, "epoch": 392} {"train_loss": -8.824627876281738, "global_step": 65934, "epoch": 392} {"train_loss": -8.830381393432617, "global_step": 65935, "epoch": 392} {"train_loss": -8.80034065246582, "global_step": 65936, "epoch": 392} {"train_loss": -8.729527473449707, "global_step": 65937, "epoch": 392} {"train_loss": -8.78016471862793, "global_step": 65938, "epoch": 392} {"train_loss": -8.704779624938965, "global_step": 65939, "epoch": 392} {"train_loss": -8.517786026000977, "global_step": 65940, "epoch": 392} {"train_loss": -8.9056396484375, "global_step": 65941, "epoch": 392} {"train_loss": -8.720757484436035, "global_step": 65942, "epoch": 392} {"train_loss": -8.874998092651367, "global_step": 65943, "epoch": 392} {"train_loss": -8.833932876586914, "global_step": 65944, "epoch": 392} {"train_loss": -8.959454536437988, "global_step": 65945, "epoch": 392} {"train_loss": -8.833983421325684, "global_step": 65946, "epoch": 392} {"train_loss": -8.99403190612793, "global_step": 65947, "epoch": 392} {"train_loss": -8.788398742675781, "global_step": 65948, "epoch": 392} {"train_loss": -8.919960021972656, "global_step": 65949, "epoch": 392} {"train_loss": -8.806144714355469, "global_step": 65950, "epoch": 392} {"train_loss": -8.82883071899414, "global_step": 65951, "epoch": 392} {"train_loss": -8.622041702270508, "global_step": 65952, "epoch": 392} {"train_loss": -8.88776969909668, "global_step": 65953, "epoch": 392} {"train_loss": -8.337396621704102, "global_step": 65954, "epoch": 392} {"train_loss": -9.06236457824707, "global_step": 65955, "epoch": 392} {"train_loss": -8.613420486450195, "global_step": 65956, "epoch": 392} {"train_loss": -8.731578826904297, "global_step": 65957, "epoch": 392} {"train_loss": -8.960359573364258, "global_step": 65958, "epoch": 392} {"train_loss": -8.84257698059082, "global_step": 65959, "epoch": 392} {"train_loss": -8.793050765991211, "global_step": 65960, "epoch": 392} {"train_loss": -8.711424827575684, "global_step": 65961, "epoch": 392} {"train_loss": -8.90195369720459, "global_step": 65962, "epoch": 392} {"train_loss": -9.126838684082031, "global_step": 65963, "epoch": 392} {"train_loss": -9.098098754882812, "global_step": 65964, "epoch": 392} {"train_loss": -8.88824462890625, "global_step": 65965, "epoch": 392} {"train_loss": -8.92599868774414, "global_step": 65966, "epoch": 392} {"train_loss": -8.730624198913574, "global_step": 65967, "epoch": 392} {"train_loss": -8.769735336303711, "global_step": 65968, "epoch": 392} {"train_loss": -9.020913124084473, "global_step": 65969, "epoch": 392} {"train_loss": -8.84411334991455, "global_step": 65970, "epoch": 392} {"train_loss": -9.140892028808594, "global_step": 65971, "epoch": 392} {"train_loss": -9.02766227722168, "global_step": 65972, "epoch": 392} {"train_loss": -8.66272258758545, "global_step": 65973, "epoch": 392} {"train_loss": -8.998310089111328, "global_step": 65974, "epoch": 392} {"train_loss": -8.801868438720703, "global_step": 65975, "epoch": 392} {"train_loss": -8.994318962097168, "global_step": 65976, "epoch": 392} {"train_loss": -9.089502334594727, "global_step": 65977, "epoch": 392} {"train_loss": -8.62850284576416, "global_step": 65978, "epoch": 392} {"train_loss": -8.62244987487793, "global_step": 65979, "epoch": 392} {"train_loss": -8.894641876220703, "global_step": 65980, "epoch": 392} {"train_loss": -8.625465393066406, "global_step": 65981, "epoch": 392} {"train_loss": -8.86217212677002, "global_step": 65982, "epoch": 392} {"train_loss": -8.759491920471191, "global_step": 65983, "epoch": 392} {"train_loss": -8.908316612243652, "global_step": 65984, "epoch": 392} {"train_loss": -8.924863815307617, "global_step": 65985, "epoch": 392} {"train_loss": -8.86234188079834, "global_step": 65986, "epoch": 392} {"train_loss": -9.033822059631348, "global_step": 65987, "epoch": 392} {"train_loss": -8.685508728027344, "global_step": 65988, "epoch": 392} {"train_loss": -9.054864883422852, "global_step": 65989, "epoch": 392} {"train_loss": -8.762432098388672, "global_step": 65990, "epoch": 392} {"train_loss": -8.896004676818848, "global_step": 65991, "epoch": 392} {"train_loss": -8.661803245544434, "global_step": 65992, "epoch": 392} {"train_loss": -8.83414077758789, "global_step": 65993, "epoch": 392} {"train_loss": -8.812870025634766, "global_step": 65994, "epoch": 392} {"train_loss": -8.777460098266602, "global_step": 65995, "epoch": 392} {"train_loss": -8.661779403686523, "global_step": 65996, "epoch": 392} {"train_loss": -8.798858642578125, "global_step": 65997, "epoch": 392} {"train_loss": -8.307363510131836, "global_step": 65998, "epoch": 392} {"train_loss": -8.766131401062012, "global_step": 65999, "epoch": 392} {"train_loss": -8.528976440429688, "global_step": 66000, "epoch": 392} {"train_loss": -8.603754997253418, "global_step": 66001, "epoch": 392} {"train_loss": -8.59688663482666, "global_step": 66002, "epoch": 392} {"train_loss": -8.881343841552734, "global_step": 66003, "epoch": 392} {"train_loss": -8.536786079406738, "global_step": 66004, "epoch": 392} {"train_loss": -8.462692260742188, "global_step": 66005, "epoch": 392} {"train_loss": -8.617568969726562, "global_step": 66006, "epoch": 392} {"train_loss": -8.583314895629883, "global_step": 66007, "epoch": 392} {"train_loss": -8.785696983337402, "global_step": 66008, "epoch": 392} {"train_loss": -8.752157211303711, "global_step": 66009, "epoch": 392} {"train_loss": -8.71236801147461, "global_step": 66010, "epoch": 392} {"train_loss": -8.717314720153809, "global_step": 66011, "epoch": 392} {"train_loss": -8.788232803344727, "global_step": 66012, "epoch": 392} {"train_loss": -8.718924522399902, "global_step": 66013, "epoch": 392} {"train_loss": -8.751531600952148, "global_step": 66014, "epoch": 392} {"train_loss": -8.884981155395508, "global_step": 66015, "epoch": 392} {"train_loss": -9.01723575592041, "global_step": 66016, "epoch": 392} {"train_loss": -8.586700439453125, "global_step": 66017, "epoch": 392} {"train_loss": -8.79922103881836, "global_step": 66018, "epoch": 392} {"train_loss": -9.112802505493164, "global_step": 66019, "epoch": 392} {"train_loss": -8.874069213867188, "global_step": 66020, "epoch": 392} {"train_loss": -8.819051742553711, "global_step": 66021, "epoch": 392} {"train_loss": -8.818839073181152, "global_step": 66022, "epoch": 392} {"train_loss": -8.754687922341484, "global_step": 66023, "epoch": 392, "val_loss": 193907.71875} {"train_loss": -8.87758731842041, "global_step": 66024, "epoch": 393} {"train_loss": -8.859341621398926, "global_step": 66025, "epoch": 393} {"train_loss": -9.025583267211914, "global_step": 66026, "epoch": 393} {"train_loss": -9.022380828857422, "global_step": 66027, "epoch": 393} {"train_loss": -8.89611530303955, "global_step": 66028, "epoch": 393} {"train_loss": -8.519659042358398, "global_step": 66029, "epoch": 393} {"train_loss": -8.815008163452148, "global_step": 66030, "epoch": 393} {"train_loss": -8.59749984741211, "global_step": 66031, "epoch": 393} {"train_loss": -8.813079833984375, "global_step": 66032, "epoch": 393} {"train_loss": -8.510448455810547, "global_step": 66033, "epoch": 393} {"train_loss": -8.814718246459961, "global_step": 66034, "epoch": 393} {"train_loss": -8.73647689819336, "global_step": 66035, "epoch": 393} {"train_loss": -8.814014434814453, "global_step": 66036, "epoch": 393} {"train_loss": -8.772603988647461, "global_step": 66037, "epoch": 393} {"train_loss": -8.371355056762695, "global_step": 66038, "epoch": 393} {"train_loss": -8.7803316116333, "global_step": 66039, "epoch": 393} {"train_loss": -8.595602035522461, "global_step": 66040, "epoch": 393} {"train_loss": -8.662405014038086, "global_step": 66041, "epoch": 393} {"train_loss": -8.737236022949219, "global_step": 66042, "epoch": 393} {"train_loss": -8.832355499267578, "global_step": 66043, "epoch": 393} {"train_loss": -8.90971565246582, "global_step": 66044, "epoch": 393} {"train_loss": -8.853555679321289, "global_step": 66045, "epoch": 393} {"train_loss": -8.900477409362793, "global_step": 66046, "epoch": 393} {"train_loss": -8.893106460571289, "global_step": 66047, "epoch": 393} {"train_loss": -8.668270111083984, "global_step": 66048, "epoch": 393} {"train_loss": -8.789170265197754, "global_step": 66049, "epoch": 393} {"train_loss": -8.752492904663086, "global_step": 66050, "epoch": 393} {"train_loss": -8.944412231445312, "global_step": 66051, "epoch": 393} {"train_loss": -8.923517227172852, "global_step": 66052, "epoch": 393} {"train_loss": -8.949713706970215, "global_step": 66053, "epoch": 393} {"train_loss": -8.63880729675293, "global_step": 66054, "epoch": 393} {"train_loss": -8.732160568237305, "global_step": 66055, "epoch": 393} {"train_loss": -8.498671531677246, "global_step": 66056, "epoch": 393} {"train_loss": -8.76485824584961, "global_step": 66057, "epoch": 393} {"train_loss": -8.574043273925781, "global_step": 66058, "epoch": 393} {"train_loss": -8.643040657043457, "global_step": 66059, "epoch": 393} {"train_loss": -8.481363296508789, "global_step": 66060, "epoch": 393} {"train_loss": -8.794536590576172, "global_step": 66061, "epoch": 393} {"train_loss": -8.64492416381836, "global_step": 66062, "epoch": 393} {"train_loss": -8.762880325317383, "global_step": 66063, "epoch": 393} {"train_loss": -8.771038055419922, "global_step": 66064, "epoch": 393} {"train_loss": -8.99188232421875, "global_step": 66065, "epoch": 393} {"train_loss": -8.628107070922852, "global_step": 66066, "epoch": 393} {"train_loss": -8.7888765335083, "global_step": 66067, "epoch": 393} {"train_loss": -8.590845108032227, "global_step": 66068, "epoch": 393} {"train_loss": -8.964268684387207, "global_step": 66069, "epoch": 393} {"train_loss": -8.72629165649414, "global_step": 66070, "epoch": 393} {"train_loss": -8.651174545288086, "global_step": 66071, "epoch": 393} {"train_loss": -8.719949722290039, "global_step": 66072, "epoch": 393} {"train_loss": -8.429141998291016, "global_step": 66073, "epoch": 393} {"train_loss": -8.802082061767578, "global_step": 66074, "epoch": 393} {"train_loss": -8.285892486572266, "global_step": 66075, "epoch": 393} {"train_loss": -8.59216594696045, "global_step": 66076, "epoch": 393} {"train_loss": -8.497875213623047, "global_step": 66077, "epoch": 393} {"train_loss": -8.787437438964844, "global_step": 66078, "epoch": 393} {"train_loss": -8.409692764282227, "global_step": 66079, "epoch": 393} {"train_loss": -8.49346923828125, "global_step": 66080, "epoch": 393} {"train_loss": -8.77549934387207, "global_step": 66081, "epoch": 393} {"train_loss": -8.588101387023926, "global_step": 66082, "epoch": 393} {"train_loss": -8.58717155456543, "global_step": 66083, "epoch": 393} {"train_loss": -8.737374305725098, "global_step": 66084, "epoch": 393} {"train_loss": -8.683624267578125, "global_step": 66085, "epoch": 393} {"train_loss": -8.698134422302246, "global_step": 66086, "epoch": 393} {"train_loss": -8.666234970092773, "global_step": 66087, "epoch": 393} {"train_loss": -8.748761177062988, "global_step": 66088, "epoch": 393} {"train_loss": -8.797422409057617, "global_step": 66089, "epoch": 393} {"train_loss": -8.720940589904785, "global_step": 66090, "epoch": 393} {"train_loss": -8.720985412597656, "global_step": 66091, "epoch": 393} {"train_loss": -8.69677734375, "global_step": 66092, "epoch": 393} {"train_loss": -8.873035430908203, "global_step": 66093, "epoch": 393} {"train_loss": -8.73086929321289, "global_step": 66094, "epoch": 393} {"train_loss": -8.907072067260742, "global_step": 66095, "epoch": 393} {"train_loss": -9.03903579711914, "global_step": 66096, "epoch": 393} {"train_loss": -9.10659408569336, "global_step": 66097, "epoch": 393} {"train_loss": -8.763879776000977, "global_step": 66098, "epoch": 393} {"train_loss": -8.982666015625, "global_step": 66099, "epoch": 393} {"train_loss": -8.857145309448242, "global_step": 66100, "epoch": 393} {"train_loss": -8.846488952636719, "global_step": 66101, "epoch": 393} {"train_loss": -8.781834602355957, "global_step": 66102, "epoch": 393} {"train_loss": -8.867595672607422, "global_step": 66103, "epoch": 393} {"train_loss": -8.982837677001953, "global_step": 66104, "epoch": 393} {"train_loss": -8.69513988494873, "global_step": 66105, "epoch": 393} {"train_loss": -8.679184913635254, "global_step": 66106, "epoch": 393} {"train_loss": -8.888742446899414, "global_step": 66107, "epoch": 393} {"train_loss": -8.851266860961914, "global_step": 66108, "epoch": 393} {"train_loss": -8.59650707244873, "global_step": 66109, "epoch": 393} {"train_loss": -8.960336685180664, "global_step": 66110, "epoch": 393} {"train_loss": -8.405743598937988, "global_step": 66111, "epoch": 393} {"train_loss": -8.689543724060059, "global_step": 66112, "epoch": 393} {"train_loss": -8.11724853515625, "global_step": 66113, "epoch": 393} {"train_loss": -8.722368240356445, "global_step": 66114, "epoch": 393} {"train_loss": -8.423044204711914, "global_step": 66115, "epoch": 393} {"train_loss": -8.723186492919922, "global_step": 66116, "epoch": 393} {"train_loss": -8.260883331298828, "global_step": 66117, "epoch": 393} {"train_loss": -8.551711082458496, "global_step": 66118, "epoch": 393} {"train_loss": -8.57577133178711, "global_step": 66119, "epoch": 393} {"train_loss": -8.421831130981445, "global_step": 66120, "epoch": 393} {"train_loss": -8.343925476074219, "global_step": 66121, "epoch": 393} {"train_loss": -8.72712516784668, "global_step": 66122, "epoch": 393} {"train_loss": -8.699851989746094, "global_step": 66123, "epoch": 393} {"train_loss": -8.538633346557617, "global_step": 66124, "epoch": 393} {"train_loss": -8.54892349243164, "global_step": 66125, "epoch": 393} {"train_loss": -8.555069923400879, "global_step": 66126, "epoch": 393} {"train_loss": -8.548842430114746, "global_step": 66127, "epoch": 393} {"train_loss": -8.496711730957031, "global_step": 66128, "epoch": 393} {"train_loss": -8.573206901550293, "global_step": 66129, "epoch": 393} {"train_loss": -8.868975639343262, "global_step": 66130, "epoch": 393} {"train_loss": -8.600146293640137, "global_step": 66131, "epoch": 393} {"train_loss": -8.810067176818848, "global_step": 66132, "epoch": 393} {"train_loss": -8.517581939697266, "global_step": 66133, "epoch": 393} {"train_loss": -8.669206619262695, "global_step": 66134, "epoch": 393} {"train_loss": -8.94859504699707, "global_step": 66135, "epoch": 393} {"train_loss": -8.897964477539062, "global_step": 66136, "epoch": 393} {"train_loss": -8.793539047241211, "global_step": 66137, "epoch": 393} {"train_loss": -8.866479873657227, "global_step": 66138, "epoch": 393} {"train_loss": -9.026962280273438, "global_step": 66139, "epoch": 393} {"train_loss": -9.051508903503418, "global_step": 66140, "epoch": 393} {"train_loss": -9.108116149902344, "global_step": 66141, "epoch": 393} {"train_loss": -8.90633773803711, "global_step": 66142, "epoch": 393} {"train_loss": -8.895875930786133, "global_step": 66143, "epoch": 393} {"train_loss": -8.865686416625977, "global_step": 66144, "epoch": 393} {"train_loss": -8.713872909545898, "global_step": 66145, "epoch": 393} {"train_loss": -8.996774673461914, "global_step": 66146, "epoch": 393} {"train_loss": -9.154255867004395, "global_step": 66147, "epoch": 393} {"train_loss": -9.047735214233398, "global_step": 66148, "epoch": 393} {"train_loss": -9.144144058227539, "global_step": 66149, "epoch": 393} {"train_loss": -8.897005081176758, "global_step": 66150, "epoch": 393} {"train_loss": -8.688592910766602, "global_step": 66151, "epoch": 393} {"train_loss": -9.015600204467773, "global_step": 66152, "epoch": 393} {"train_loss": -8.675058364868164, "global_step": 66153, "epoch": 393} {"train_loss": -8.830451965332031, "global_step": 66154, "epoch": 393} {"train_loss": -8.947410583496094, "global_step": 66155, "epoch": 393} {"train_loss": -8.666613578796387, "global_step": 66156, "epoch": 393} {"train_loss": -8.8773832321167, "global_step": 66157, "epoch": 393} {"train_loss": -8.983816146850586, "global_step": 66158, "epoch": 393} {"train_loss": -8.759065628051758, "global_step": 66159, "epoch": 393} {"train_loss": -8.765946388244629, "global_step": 66160, "epoch": 393} {"train_loss": -8.834118843078613, "global_step": 66161, "epoch": 393} {"train_loss": -8.930586814880371, "global_step": 66162, "epoch": 393} {"train_loss": -8.459657669067383, "global_step": 66163, "epoch": 393} {"train_loss": -8.901029586791992, "global_step": 66164, "epoch": 393} {"train_loss": -8.695037841796875, "global_step": 66165, "epoch": 393} {"train_loss": -8.642791748046875, "global_step": 66166, "epoch": 393} {"train_loss": -8.959724426269531, "global_step": 66167, "epoch": 393} {"train_loss": -8.681344985961914, "global_step": 66168, "epoch": 393} {"train_loss": -8.867576599121094, "global_step": 66169, "epoch": 393} {"train_loss": -8.93777847290039, "global_step": 66170, "epoch": 393} {"train_loss": -8.779890060424805, "global_step": 66171, "epoch": 393} {"train_loss": -8.854928970336914, "global_step": 66172, "epoch": 393} {"train_loss": -8.943750381469727, "global_step": 66173, "epoch": 393} {"train_loss": -8.899190902709961, "global_step": 66174, "epoch": 393} {"train_loss": -8.758371353149414, "global_step": 66175, "epoch": 393} {"train_loss": -9.096899032592773, "global_step": 66176, "epoch": 393} {"train_loss": -8.69304084777832, "global_step": 66177, "epoch": 393} {"train_loss": -8.802111625671387, "global_step": 66178, "epoch": 393} {"train_loss": -8.820178985595703, "global_step": 66179, "epoch": 393} {"train_loss": -8.446205139160156, "global_step": 66180, "epoch": 393} {"train_loss": -8.913825988769531, "global_step": 66181, "epoch": 393} {"train_loss": -8.94490909576416, "global_step": 66182, "epoch": 393} {"train_loss": -9.015178680419922, "global_step": 66183, "epoch": 393} {"train_loss": -8.716225624084473, "global_step": 66184, "epoch": 393} {"train_loss": -9.004825592041016, "global_step": 66185, "epoch": 393} {"train_loss": -9.098379135131836, "global_step": 66186, "epoch": 393} {"train_loss": -9.139945030212402, "global_step": 66187, "epoch": 393} {"train_loss": -8.666203498840332, "global_step": 66188, "epoch": 393} {"train_loss": -8.807699203491211, "global_step": 66189, "epoch": 393} {"train_loss": -8.789478302001953, "global_step": 66190, "epoch": 393} {"train_loss": -8.757651658285232, "global_step": 66191, "epoch": 393, "val_loss": 192152.453125} {"train_loss": -8.920452117919922, "global_step": 66192, "epoch": 394} {"train_loss": -8.337146759033203, "global_step": 66193, "epoch": 394} {"train_loss": -8.593505859375, "global_step": 66194, "epoch": 394} {"train_loss": -8.54055404663086, "global_step": 66195, "epoch": 394} {"train_loss": -8.61366081237793, "global_step": 66196, "epoch": 394} {"train_loss": -8.37098217010498, "global_step": 66197, "epoch": 394} {"train_loss": -8.804818153381348, "global_step": 66198, "epoch": 394} {"train_loss": -8.59234619140625, "global_step": 66199, "epoch": 394} {"train_loss": -8.61099910736084, "global_step": 66200, "epoch": 394} {"train_loss": -8.996814727783203, "global_step": 66201, "epoch": 394} {"train_loss": -8.784704208374023, "global_step": 66202, "epoch": 394} {"train_loss": -8.414346694946289, "global_step": 66203, "epoch": 394} {"train_loss": -8.816544532775879, "global_step": 66204, "epoch": 394} {"train_loss": -8.773157119750977, "global_step": 66205, "epoch": 394} {"train_loss": -8.653739929199219, "global_step": 66206, "epoch": 394} {"train_loss": -8.632243156433105, "global_step": 66207, "epoch": 394} {"train_loss": -8.452142715454102, "global_step": 66208, "epoch": 394} {"train_loss": -8.485227584838867, "global_step": 66209, "epoch": 394} {"train_loss": -8.660968780517578, "global_step": 66210, "epoch": 394} {"train_loss": -8.70123291015625, "global_step": 66211, "epoch": 394} {"train_loss": -8.774787902832031, "global_step": 66212, "epoch": 394} {"train_loss": -8.563920974731445, "global_step": 66213, "epoch": 394} {"train_loss": -8.739259719848633, "global_step": 66214, "epoch": 394} {"train_loss": -8.813213348388672, "global_step": 66215, "epoch": 394} {"train_loss": -8.515579223632812, "global_step": 66216, "epoch": 394} {"train_loss": -8.779306411743164, "global_step": 66217, "epoch": 394} {"train_loss": -8.602363586425781, "global_step": 66218, "epoch": 394} {"train_loss": -8.64335823059082, "global_step": 66219, "epoch": 394} {"train_loss": -8.559907913208008, "global_step": 66220, "epoch": 394} {"train_loss": -8.721307754516602, "global_step": 66221, "epoch": 394} {"train_loss": -8.775308609008789, "global_step": 66222, "epoch": 394} {"train_loss": -8.820606231689453, "global_step": 66223, "epoch": 394} {"train_loss": -8.623880386352539, "global_step": 66224, "epoch": 394} {"train_loss": -8.505915641784668, "global_step": 66225, "epoch": 394} {"train_loss": -8.779040336608887, "global_step": 66226, "epoch": 394} {"train_loss": -8.586989402770996, "global_step": 66227, "epoch": 394} {"train_loss": -8.822636604309082, "global_step": 66228, "epoch": 394} {"train_loss": -8.638333320617676, "global_step": 66229, "epoch": 394} {"train_loss": -8.74367618560791, "global_step": 66230, "epoch": 394} {"train_loss": -8.893518447875977, "global_step": 66231, "epoch": 394} {"train_loss": -8.761396408081055, "global_step": 66232, "epoch": 394} {"train_loss": -8.762290000915527, "global_step": 66233, "epoch": 394} {"train_loss": -8.442319869995117, "global_step": 66234, "epoch": 394} {"train_loss": -8.915019989013672, "global_step": 66235, "epoch": 394} {"train_loss": -8.846755981445312, "global_step": 66236, "epoch": 394} {"train_loss": -8.703466415405273, "global_step": 66237, "epoch": 394} {"train_loss": -8.648941040039062, "global_step": 66238, "epoch": 394} {"train_loss": -9.013986587524414, "global_step": 66239, "epoch": 394} {"train_loss": -8.779024124145508, "global_step": 66240, "epoch": 394} {"train_loss": -8.861688613891602, "global_step": 66241, "epoch": 394} {"train_loss": -8.798198699951172, "global_step": 66242, "epoch": 394} {"train_loss": -8.842634201049805, "global_step": 66243, "epoch": 394} {"train_loss": -8.720090866088867, "global_step": 66244, "epoch": 394} {"train_loss": -8.804817199707031, "global_step": 66245, "epoch": 394} {"train_loss": -8.926682472229004, "global_step": 66246, "epoch": 394} {"train_loss": -8.915454864501953, "global_step": 66247, "epoch": 394} {"train_loss": -9.147960662841797, "global_step": 66248, "epoch": 394} {"train_loss": -8.736214637756348, "global_step": 66249, "epoch": 394} {"train_loss": -9.067526817321777, "global_step": 66250, "epoch": 394} {"train_loss": -8.931999206542969, "global_step": 66251, "epoch": 394} {"train_loss": -8.989830017089844, "global_step": 66252, "epoch": 394} {"train_loss": -8.884909629821777, "global_step": 66253, "epoch": 394} {"train_loss": -9.1221342086792, "global_step": 66254, "epoch": 394} {"train_loss": -9.019811630249023, "global_step": 66255, "epoch": 394} {"train_loss": -8.493195533752441, "global_step": 66256, "epoch": 394} {"train_loss": -9.014432907104492, "global_step": 66257, "epoch": 394} {"train_loss": -8.805442810058594, "global_step": 66258, "epoch": 394} {"train_loss": -8.98886775970459, "global_step": 66259, "epoch": 394} {"train_loss": -8.749286651611328, "global_step": 66260, "epoch": 394} {"train_loss": -8.678409576416016, "global_step": 66261, "epoch": 394} {"train_loss": -8.858448028564453, "global_step": 66262, "epoch": 394} {"train_loss": -8.212966918945312, "global_step": 66263, "epoch": 394} {"train_loss": -8.899833679199219, "global_step": 66264, "epoch": 394} {"train_loss": -8.402395248413086, "global_step": 66265, "epoch": 394} {"train_loss": -9.054899215698242, "global_step": 66266, "epoch": 394} {"train_loss": -8.318950653076172, "global_step": 66267, "epoch": 394} {"train_loss": -8.860786437988281, "global_step": 66268, "epoch": 394} {"train_loss": -8.541313171386719, "global_step": 66269, "epoch": 394} {"train_loss": -8.55754280090332, "global_step": 66270, "epoch": 394} {"train_loss": -8.517358779907227, "global_step": 66271, "epoch": 394} {"train_loss": -8.814599990844727, "global_step": 66272, "epoch": 394} {"train_loss": -8.799028396606445, "global_step": 66273, "epoch": 394} {"train_loss": -8.492279052734375, "global_step": 66274, "epoch": 394} {"train_loss": -8.932220458984375, "global_step": 66275, "epoch": 394} {"train_loss": -8.776126861572266, "global_step": 66276, "epoch": 394} {"train_loss": -8.926079750061035, "global_step": 66277, "epoch": 394} {"train_loss": -8.659095764160156, "global_step": 66278, "epoch": 394} {"train_loss": -9.008427619934082, "global_step": 66279, "epoch": 394} {"train_loss": -8.910802841186523, "global_step": 66280, "epoch": 394} {"train_loss": -8.863630294799805, "global_step": 66281, "epoch": 394} {"train_loss": -8.779516220092773, "global_step": 66282, "epoch": 394} {"train_loss": -8.924615859985352, "global_step": 66283, "epoch": 394} {"train_loss": -8.666622161865234, "global_step": 66284, "epoch": 394} {"train_loss": -8.823005676269531, "global_step": 66285, "epoch": 394} {"train_loss": -9.048843383789062, "global_step": 66286, "epoch": 394} {"train_loss": -8.883864402770996, "global_step": 66287, "epoch": 394} {"train_loss": -8.812226295471191, "global_step": 66288, "epoch": 394} {"train_loss": -8.805068969726562, "global_step": 66289, "epoch": 394} {"train_loss": -8.866960525512695, "global_step": 66290, "epoch": 394} {"train_loss": -8.947391510009766, "global_step": 66291, "epoch": 394} {"train_loss": -8.718921661376953, "global_step": 66292, "epoch": 394} {"train_loss": -8.913711547851562, "global_step": 66293, "epoch": 394} {"train_loss": -8.876164436340332, "global_step": 66294, "epoch": 394} {"train_loss": -8.93570327758789, "global_step": 66295, "epoch": 394} {"train_loss": -8.587194442749023, "global_step": 66296, "epoch": 394} {"train_loss": -9.007434844970703, "global_step": 66297, "epoch": 394} {"train_loss": -8.760108947753906, "global_step": 66298, "epoch": 394} {"train_loss": -8.903040885925293, "global_step": 66299, "epoch": 394} {"train_loss": -8.720602035522461, "global_step": 66300, "epoch": 394} {"train_loss": -8.884594917297363, "global_step": 66301, "epoch": 394} {"train_loss": -8.769736289978027, "global_step": 66302, "epoch": 394} {"train_loss": -8.917600631713867, "global_step": 66303, "epoch": 394} {"train_loss": -9.165964126586914, "global_step": 66304, "epoch": 394} {"train_loss": -8.762260437011719, "global_step": 66305, "epoch": 394} {"train_loss": -8.927770614624023, "global_step": 66306, "epoch": 394} {"train_loss": -8.654935836791992, "global_step": 66307, "epoch": 394} {"train_loss": -8.736034393310547, "global_step": 66308, "epoch": 394} {"train_loss": -8.882551193237305, "global_step": 66309, "epoch": 394} {"train_loss": -8.805309295654297, "global_step": 66310, "epoch": 394} {"train_loss": -8.66482925415039, "global_step": 66311, "epoch": 394} {"train_loss": -8.686538696289062, "global_step": 66312, "epoch": 394} {"train_loss": -8.886627197265625, "global_step": 66313, "epoch": 394} {"train_loss": -8.669973373413086, "global_step": 66314, "epoch": 394} {"train_loss": -8.953146934509277, "global_step": 66315, "epoch": 394} {"train_loss": -8.525701522827148, "global_step": 66316, "epoch": 394} {"train_loss": -8.84949016571045, "global_step": 66317, "epoch": 394} {"train_loss": -8.793082237243652, "global_step": 66318, "epoch": 394} {"train_loss": -8.740228652954102, "global_step": 66319, "epoch": 394} {"train_loss": -8.861625671386719, "global_step": 66320, "epoch": 394} {"train_loss": -8.775653839111328, "global_step": 66321, "epoch": 394} {"train_loss": -8.884305953979492, "global_step": 66322, "epoch": 394} {"train_loss": -8.980779647827148, "global_step": 66323, "epoch": 394} {"train_loss": -8.855752944946289, "global_step": 66324, "epoch": 394} {"train_loss": -8.905033111572266, "global_step": 66325, "epoch": 394} {"train_loss": -8.99630355834961, "global_step": 66326, "epoch": 394} {"train_loss": -8.989901542663574, "global_step": 66327, "epoch": 394} {"train_loss": -9.02858829498291, "global_step": 66328, "epoch": 394} {"train_loss": -9.026742935180664, "global_step": 66329, "epoch": 394} {"train_loss": -8.926797866821289, "global_step": 66330, "epoch": 394} {"train_loss": -8.865500450134277, "global_step": 66331, "epoch": 394} {"train_loss": -8.95128059387207, "global_step": 66332, "epoch": 394} {"train_loss": -8.71851634979248, "global_step": 66333, "epoch": 394} {"train_loss": -8.832868576049805, "global_step": 66334, "epoch": 394} {"train_loss": -8.968993186950684, "global_step": 66335, "epoch": 394} {"train_loss": -8.586526870727539, "global_step": 66336, "epoch": 394} {"train_loss": -8.900259017944336, "global_step": 66337, "epoch": 394} {"train_loss": -8.818374633789062, "global_step": 66338, "epoch": 394} {"train_loss": -8.802619934082031, "global_step": 66339, "epoch": 394} {"train_loss": -8.904314041137695, "global_step": 66340, "epoch": 394} {"train_loss": -8.919102668762207, "global_step": 66341, "epoch": 394} {"train_loss": -8.42569351196289, "global_step": 66342, "epoch": 394} {"train_loss": -8.819384574890137, "global_step": 66343, "epoch": 394} {"train_loss": -8.890161514282227, "global_step": 66344, "epoch": 394} {"train_loss": -8.679664611816406, "global_step": 66345, "epoch": 394} {"train_loss": -9.047160148620605, "global_step": 66346, "epoch": 394} {"train_loss": -8.94664192199707, "global_step": 66347, "epoch": 394} {"train_loss": -8.801836967468262, "global_step": 66348, "epoch": 394} {"train_loss": -9.121963500976562, "global_step": 66349, "epoch": 394} {"train_loss": -9.072513580322266, "global_step": 66350, "epoch": 394} {"train_loss": -8.867448806762695, "global_step": 66351, "epoch": 394} {"train_loss": -8.985841751098633, "global_step": 66352, "epoch": 394} {"train_loss": -8.70576286315918, "global_step": 66353, "epoch": 394} {"train_loss": -8.899089813232422, "global_step": 66354, "epoch": 394} {"train_loss": -8.910922050476074, "global_step": 66355, "epoch": 394} {"train_loss": -8.91555404663086, "global_step": 66356, "epoch": 394} {"train_loss": -9.144414901733398, "global_step": 66357, "epoch": 394} {"train_loss": -8.593635559082031, "global_step": 66358, "epoch": 394} {"train_loss": -8.793100726036798, "global_step": 66359, "epoch": 394, "val_loss": 193305.234375} {"train_loss": -8.815589904785156, "global_step": 66360, "epoch": 395} {"train_loss": -8.760917663574219, "global_step": 66361, "epoch": 395} {"train_loss": -9.002278327941895, "global_step": 66362, "epoch": 395} {"train_loss": -8.709403991699219, "global_step": 66363, "epoch": 395} {"train_loss": -9.194990158081055, "global_step": 66364, "epoch": 395} {"train_loss": -8.972478866577148, "global_step": 66365, "epoch": 395} {"train_loss": -9.224136352539062, "global_step": 66366, "epoch": 395} {"train_loss": -9.103507041931152, "global_step": 66367, "epoch": 395} {"train_loss": -9.095662117004395, "global_step": 66368, "epoch": 395} {"train_loss": -8.745004653930664, "global_step": 66369, "epoch": 395} {"train_loss": -8.995342254638672, "global_step": 66370, "epoch": 395} {"train_loss": -8.995635986328125, "global_step": 66371, "epoch": 395} {"train_loss": -8.789641380310059, "global_step": 66372, "epoch": 395} {"train_loss": -8.874744415283203, "global_step": 66373, "epoch": 395} {"train_loss": -8.850637435913086, "global_step": 66374, "epoch": 395} {"train_loss": -8.997993469238281, "global_step": 66375, "epoch": 395} {"train_loss": -8.656225204467773, "global_step": 66376, "epoch": 395} {"train_loss": -8.944454193115234, "global_step": 66377, "epoch": 395} {"train_loss": -9.019607543945312, "global_step": 66378, "epoch": 395} {"train_loss": -8.913606643676758, "global_step": 66379, "epoch": 395} {"train_loss": -8.49323844909668, "global_step": 66380, "epoch": 395} {"train_loss": -8.452003479003906, "global_step": 66381, "epoch": 395} {"train_loss": -8.459193229675293, "global_step": 66382, "epoch": 395} {"train_loss": -8.730470657348633, "global_step": 66383, "epoch": 395} {"train_loss": -8.796006202697754, "global_step": 66384, "epoch": 395} {"train_loss": -8.556558609008789, "global_step": 66385, "epoch": 395} {"train_loss": -8.60763931274414, "global_step": 66386, "epoch": 395} {"train_loss": -8.746326446533203, "global_step": 66387, "epoch": 395} {"train_loss": -8.541655540466309, "global_step": 66388, "epoch": 395} {"train_loss": -8.688824653625488, "global_step": 66389, "epoch": 395} {"train_loss": -8.645384788513184, "global_step": 66390, "epoch": 395} {"train_loss": -8.458518981933594, "global_step": 66391, "epoch": 395} {"train_loss": -8.785943984985352, "global_step": 66392, "epoch": 395} {"train_loss": -8.634954452514648, "global_step": 66393, "epoch": 395} {"train_loss": -8.737258911132812, "global_step": 66394, "epoch": 395} {"train_loss": -8.86893367767334, "global_step": 66395, "epoch": 395} {"train_loss": -8.852745056152344, "global_step": 66396, "epoch": 395} {"train_loss": -8.831792831420898, "global_step": 66397, "epoch": 395} {"train_loss": -8.74888801574707, "global_step": 66398, "epoch": 395} {"train_loss": -8.950989723205566, "global_step": 66399, "epoch": 395} {"train_loss": -8.878548622131348, "global_step": 66400, "epoch": 395} {"train_loss": -8.788094520568848, "global_step": 66401, "epoch": 395} {"train_loss": -8.901318550109863, "global_step": 66402, "epoch": 395} {"train_loss": -8.910261154174805, "global_step": 66403, "epoch": 395} {"train_loss": -8.692072868347168, "global_step": 66404, "epoch": 395} {"train_loss": -8.893171310424805, "global_step": 66405, "epoch": 395} {"train_loss": -8.727367401123047, "global_step": 66406, "epoch": 395} {"train_loss": -8.72463607788086, "global_step": 66407, "epoch": 395} {"train_loss": -8.789264678955078, "global_step": 66408, "epoch": 395} {"train_loss": -8.518274307250977, "global_step": 66409, "epoch": 395} {"train_loss": -8.87275218963623, "global_step": 66410, "epoch": 395} {"train_loss": -8.88821792602539, "global_step": 66411, "epoch": 395} {"train_loss": -8.664715766906738, "global_step": 66412, "epoch": 395} {"train_loss": -8.876554489135742, "global_step": 66413, "epoch": 395} {"train_loss": -8.812227249145508, "global_step": 66414, "epoch": 395} {"train_loss": -8.63817024230957, "global_step": 66415, "epoch": 395} {"train_loss": -8.740283012390137, "global_step": 66416, "epoch": 395} {"train_loss": -9.073930740356445, "global_step": 66417, "epoch": 395} {"train_loss": -8.809203147888184, "global_step": 66418, "epoch": 395} {"train_loss": -8.864856719970703, "global_step": 66419, "epoch": 395} {"train_loss": -8.961487770080566, "global_step": 66420, "epoch": 395} {"train_loss": -8.664144515991211, "global_step": 66421, "epoch": 395} {"train_loss": -9.047298431396484, "global_step": 66422, "epoch": 395} {"train_loss": -8.604572296142578, "global_step": 66423, "epoch": 395} {"train_loss": -8.735962867736816, "global_step": 66424, "epoch": 395} {"train_loss": -8.93975830078125, "global_step": 66425, "epoch": 395} {"train_loss": -8.525440216064453, "global_step": 66426, "epoch": 395} {"train_loss": -8.89327335357666, "global_step": 66427, "epoch": 395} {"train_loss": -8.88549518585205, "global_step": 66428, "epoch": 395} {"train_loss": -8.931201934814453, "global_step": 66429, "epoch": 395} {"train_loss": -8.600994110107422, "global_step": 66430, "epoch": 395} {"train_loss": -8.713204383850098, "global_step": 66431, "epoch": 395} {"train_loss": -8.649049758911133, "global_step": 66432, "epoch": 395} {"train_loss": -8.429849624633789, "global_step": 66433, "epoch": 395} {"train_loss": -8.79356861114502, "global_step": 66434, "epoch": 395} {"train_loss": -8.385587692260742, "global_step": 66435, "epoch": 395} {"train_loss": -8.539434432983398, "global_step": 66436, "epoch": 395} {"train_loss": -8.849433898925781, "global_step": 66437, "epoch": 395} {"train_loss": -8.821883201599121, "global_step": 66438, "epoch": 395} {"train_loss": -8.73136043548584, "global_step": 66439, "epoch": 395} {"train_loss": -8.54647445678711, "global_step": 66440, "epoch": 395} {"train_loss": -8.738152503967285, "global_step": 66441, "epoch": 395} {"train_loss": -8.866355895996094, "global_step": 66442, "epoch": 395} {"train_loss": -8.539438247680664, "global_step": 66443, "epoch": 395} {"train_loss": -8.488978385925293, "global_step": 66444, "epoch": 395} {"train_loss": -8.783370971679688, "global_step": 66445, "epoch": 395} {"train_loss": -8.769495010375977, "global_step": 66446, "epoch": 395} {"train_loss": -9.006677627563477, "global_step": 66447, "epoch": 395} {"train_loss": -8.761495590209961, "global_step": 66448, "epoch": 395} {"train_loss": -8.694169998168945, "global_step": 66449, "epoch": 395} {"train_loss": -8.848999977111816, "global_step": 66450, "epoch": 395} {"train_loss": -8.856301307678223, "global_step": 66451, "epoch": 395} {"train_loss": -8.746424674987793, "global_step": 66452, "epoch": 395} {"train_loss": -9.034168243408203, "global_step": 66453, "epoch": 395} {"train_loss": -9.071928977966309, "global_step": 66454, "epoch": 395} {"train_loss": -8.96347427368164, "global_step": 66455, "epoch": 395} {"train_loss": -9.049100875854492, "global_step": 66456, "epoch": 395} {"train_loss": -8.96395206451416, "global_step": 66457, "epoch": 395} {"train_loss": -9.16643238067627, "global_step": 66458, "epoch": 395} {"train_loss": -8.881301879882812, "global_step": 66459, "epoch": 395} {"train_loss": -8.89205551147461, "global_step": 66460, "epoch": 395} {"train_loss": -8.928129196166992, "global_step": 66461, "epoch": 395} {"train_loss": -8.968679428100586, "global_step": 66462, "epoch": 395} {"train_loss": -8.878548622131348, "global_step": 66463, "epoch": 395} {"train_loss": -9.03661060333252, "global_step": 66464, "epoch": 395} {"train_loss": -8.785309791564941, "global_step": 66465, "epoch": 395} {"train_loss": -8.526375770568848, "global_step": 66466, "epoch": 395} {"train_loss": -9.061368942260742, "global_step": 66467, "epoch": 395} {"train_loss": -8.399137496948242, "global_step": 66468, "epoch": 395} {"train_loss": -9.007179260253906, "global_step": 66469, "epoch": 395} {"train_loss": -8.566987037658691, "global_step": 66470, "epoch": 395} {"train_loss": -8.972073554992676, "global_step": 66471, "epoch": 395} {"train_loss": -8.404736518859863, "global_step": 66472, "epoch": 395} {"train_loss": -8.722524642944336, "global_step": 66473, "epoch": 395} {"train_loss": -8.359911918640137, "global_step": 66474, "epoch": 395} {"train_loss": -8.661825180053711, "global_step": 66475, "epoch": 395} {"train_loss": -8.611371994018555, "global_step": 66476, "epoch": 395} {"train_loss": -8.674185752868652, "global_step": 66477, "epoch": 395} {"train_loss": -8.731826782226562, "global_step": 66478, "epoch": 395} {"train_loss": -8.864789962768555, "global_step": 66479, "epoch": 395} {"train_loss": -8.652482986450195, "global_step": 66480, "epoch": 395} {"train_loss": -8.789827346801758, "global_step": 66481, "epoch": 395} {"train_loss": -8.883370399475098, "global_step": 66482, "epoch": 395} {"train_loss": -8.967974662780762, "global_step": 66483, "epoch": 395} {"train_loss": -8.726495742797852, "global_step": 66484, "epoch": 395} {"train_loss": -9.117684364318848, "global_step": 66485, "epoch": 395} {"train_loss": -8.810684204101562, "global_step": 66486, "epoch": 395} {"train_loss": -8.860360145568848, "global_step": 66487, "epoch": 395} {"train_loss": -8.77707290649414, "global_step": 66488, "epoch": 395} {"train_loss": -8.62942123413086, "global_step": 66489, "epoch": 395} {"train_loss": -8.77143669128418, "global_step": 66490, "epoch": 395} {"train_loss": -8.754169464111328, "global_step": 66491, "epoch": 395} {"train_loss": -8.864995956420898, "global_step": 66492, "epoch": 395} {"train_loss": -8.822837829589844, "global_step": 66493, "epoch": 395} {"train_loss": -8.667268753051758, "global_step": 66494, "epoch": 395} {"train_loss": -8.971795082092285, "global_step": 66495, "epoch": 395} {"train_loss": -8.87809944152832, "global_step": 66496, "epoch": 395} {"train_loss": -8.339609146118164, "global_step": 66497, "epoch": 395} {"train_loss": -8.892740249633789, "global_step": 66498, "epoch": 395} {"train_loss": -8.94300365447998, "global_step": 66499, "epoch": 395} {"train_loss": -8.28573226928711, "global_step": 66500, "epoch": 395} {"train_loss": -8.774608612060547, "global_step": 66501, "epoch": 395} {"train_loss": -8.949235916137695, "global_step": 66502, "epoch": 395} {"train_loss": -8.789137840270996, "global_step": 66503, "epoch": 395} {"train_loss": -8.755516052246094, "global_step": 66504, "epoch": 395} {"train_loss": -8.929327964782715, "global_step": 66505, "epoch": 395} {"train_loss": -8.959586143493652, "global_step": 66506, "epoch": 395} {"train_loss": -8.925235748291016, "global_step": 66507, "epoch": 395} {"train_loss": -8.692527770996094, "global_step": 66508, "epoch": 395} {"train_loss": -9.00080394744873, "global_step": 66509, "epoch": 395} {"train_loss": -8.86107349395752, "global_step": 66510, "epoch": 395} {"train_loss": -8.9214448928833, "global_step": 66511, "epoch": 395} {"train_loss": -8.802177429199219, "global_step": 66512, "epoch": 395} {"train_loss": -8.807573318481445, "global_step": 66513, "epoch": 395} {"train_loss": -8.756404876708984, "global_step": 66514, "epoch": 395} {"train_loss": -8.816438674926758, "global_step": 66515, "epoch": 395} {"train_loss": -8.853981018066406, "global_step": 66516, "epoch": 395} {"train_loss": -8.675283432006836, "global_step": 66517, "epoch": 395} {"train_loss": -8.77945327758789, "global_step": 66518, "epoch": 395} {"train_loss": -8.679361343383789, "global_step": 66519, "epoch": 395} {"train_loss": -8.72940444946289, "global_step": 66520, "epoch": 395} {"train_loss": -8.868078231811523, "global_step": 66521, "epoch": 395} {"train_loss": -8.855810165405273, "global_step": 66522, "epoch": 395} {"train_loss": -8.955821990966797, "global_step": 66523, "epoch": 395} {"train_loss": -8.723066329956055, "global_step": 66524, "epoch": 395} {"train_loss": -8.698862075805664, "global_step": 66525, "epoch": 395} {"train_loss": -8.83022403717041, "global_step": 66526, "epoch": 395} {"train_loss": -8.793667407262893, "global_step": 66527, "epoch": 395, "val_loss": 191553.390625, "train_action_mse_error": 8.436689376831055} {"train_loss": -8.762393951416016, "global_step": 66528, "epoch": 396} {"train_loss": -8.832648277282715, "global_step": 66529, "epoch": 396} {"train_loss": -8.722639083862305, "global_step": 66530, "epoch": 396} {"train_loss": -8.485145568847656, "global_step": 66531, "epoch": 396} {"train_loss": -8.704618453979492, "global_step": 66532, "epoch": 396} {"train_loss": -8.702699661254883, "global_step": 66533, "epoch": 396} {"train_loss": -8.751741409301758, "global_step": 66534, "epoch": 396} {"train_loss": -8.92460823059082, "global_step": 66535, "epoch": 396} {"train_loss": -8.810579299926758, "global_step": 66536, "epoch": 396} {"train_loss": -8.889620780944824, "global_step": 66537, "epoch": 396} {"train_loss": -9.103557586669922, "global_step": 66538, "epoch": 396} {"train_loss": -9.025184631347656, "global_step": 66539, "epoch": 396} {"train_loss": -8.93514347076416, "global_step": 66540, "epoch": 396} {"train_loss": -8.950248718261719, "global_step": 66541, "epoch": 396} {"train_loss": -9.166299819946289, "global_step": 66542, "epoch": 396} {"train_loss": -8.985998153686523, "global_step": 66543, "epoch": 396} {"train_loss": -8.94547176361084, "global_step": 66544, "epoch": 396} {"train_loss": -8.991976737976074, "global_step": 66545, "epoch": 396} {"train_loss": -8.966388702392578, "global_step": 66546, "epoch": 396} {"train_loss": -8.866193771362305, "global_step": 66547, "epoch": 396} {"train_loss": -9.09419059753418, "global_step": 66548, "epoch": 396} {"train_loss": -8.787858009338379, "global_step": 66549, "epoch": 396} {"train_loss": -8.873273849487305, "global_step": 66550, "epoch": 396} {"train_loss": -9.024988174438477, "global_step": 66551, "epoch": 396} {"train_loss": -9.158073425292969, "global_step": 66552, "epoch": 396} {"train_loss": -8.978967666625977, "global_step": 66553, "epoch": 396} {"train_loss": -8.911953926086426, "global_step": 66554, "epoch": 396} {"train_loss": -8.913490295410156, "global_step": 66555, "epoch": 396} {"train_loss": -9.006969451904297, "global_step": 66556, "epoch": 396} {"train_loss": -8.787454605102539, "global_step": 66557, "epoch": 396} {"train_loss": -9.156339645385742, "global_step": 66558, "epoch": 396} {"train_loss": -8.751382827758789, "global_step": 66559, "epoch": 396} {"train_loss": -8.78618049621582, "global_step": 66560, "epoch": 396} {"train_loss": -8.942832946777344, "global_step": 66561, "epoch": 396} {"train_loss": -8.702702522277832, "global_step": 66562, "epoch": 396} {"train_loss": -8.832550048828125, "global_step": 66563, "epoch": 396} {"train_loss": -8.726801872253418, "global_step": 66564, "epoch": 396} {"train_loss": -8.926484107971191, "global_step": 66565, "epoch": 396} {"train_loss": -8.853632926940918, "global_step": 66566, "epoch": 396} {"train_loss": -8.676084518432617, "global_step": 66567, "epoch": 396} {"train_loss": -8.878615379333496, "global_step": 66568, "epoch": 396} {"train_loss": -8.947961807250977, "global_step": 66569, "epoch": 396} {"train_loss": -8.835469245910645, "global_step": 66570, "epoch": 396} {"train_loss": -8.81895637512207, "global_step": 66571, "epoch": 396} {"train_loss": -8.873054504394531, "global_step": 66572, "epoch": 396} {"train_loss": -8.728082656860352, "global_step": 66573, "epoch": 396} {"train_loss": -8.800924301147461, "global_step": 66574, "epoch": 396} {"train_loss": -9.08678913116455, "global_step": 66575, "epoch": 396} {"train_loss": -8.789131164550781, "global_step": 66576, "epoch": 396} {"train_loss": -8.699637413024902, "global_step": 66577, "epoch": 396} {"train_loss": -9.06165885925293, "global_step": 66578, "epoch": 396} {"train_loss": -8.805218696594238, "global_step": 66579, "epoch": 396} {"train_loss": -8.955625534057617, "global_step": 66580, "epoch": 396} {"train_loss": -8.990428924560547, "global_step": 66581, "epoch": 396} {"train_loss": -8.879960060119629, "global_step": 66582, "epoch": 396} {"train_loss": -9.118959426879883, "global_step": 66583, "epoch": 396} {"train_loss": -9.004956245422363, "global_step": 66584, "epoch": 396} {"train_loss": -8.964098930358887, "global_step": 66585, "epoch": 396} {"train_loss": -9.068960189819336, "global_step": 66586, "epoch": 396} {"train_loss": -8.974103927612305, "global_step": 66587, "epoch": 396} {"train_loss": -8.81620979309082, "global_step": 66588, "epoch": 396} {"train_loss": -8.776060104370117, "global_step": 66589, "epoch": 396} {"train_loss": -9.133296966552734, "global_step": 66590, "epoch": 396} {"train_loss": -8.835813522338867, "global_step": 66591, "epoch": 396} {"train_loss": -8.601967811584473, "global_step": 66592, "epoch": 396} {"train_loss": -9.041324615478516, "global_step": 66593, "epoch": 396} {"train_loss": -9.016599655151367, "global_step": 66594, "epoch": 396} {"train_loss": -8.999330520629883, "global_step": 66595, "epoch": 396} {"train_loss": -8.695589065551758, "global_step": 66596, "epoch": 396} {"train_loss": -8.610647201538086, "global_step": 66597, "epoch": 396} {"train_loss": -8.75405502319336, "global_step": 66598, "epoch": 396} {"train_loss": -8.676814079284668, "global_step": 66599, "epoch": 396} {"train_loss": -8.953741073608398, "global_step": 66600, "epoch": 396} {"train_loss": -8.744586944580078, "global_step": 66601, "epoch": 396} {"train_loss": -8.646800994873047, "global_step": 66602, "epoch": 396} {"train_loss": -8.917901039123535, "global_step": 66603, "epoch": 396} {"train_loss": -8.593631744384766, "global_step": 66604, "epoch": 396} {"train_loss": -8.683965682983398, "global_step": 66605, "epoch": 396} {"train_loss": -8.842782020568848, "global_step": 66606, "epoch": 396} {"train_loss": -8.704374313354492, "global_step": 66607, "epoch": 396} {"train_loss": -8.601247787475586, "global_step": 66608, "epoch": 396} {"train_loss": -8.620494842529297, "global_step": 66609, "epoch": 396} {"train_loss": -8.71889877319336, "global_step": 66610, "epoch": 396} {"train_loss": -8.757823944091797, "global_step": 66611, "epoch": 396} {"train_loss": -8.793315887451172, "global_step": 66612, "epoch": 396} {"train_loss": -8.615646362304688, "global_step": 66613, "epoch": 396} {"train_loss": -8.633441925048828, "global_step": 66614, "epoch": 396} {"train_loss": -8.6259183883667, "global_step": 66615, "epoch": 396} {"train_loss": -8.675865173339844, "global_step": 66616, "epoch": 396} {"train_loss": -8.867119789123535, "global_step": 66617, "epoch": 396} {"train_loss": -8.794008255004883, "global_step": 66618, "epoch": 396} {"train_loss": -8.715234756469727, "global_step": 66619, "epoch": 396} {"train_loss": -8.817680358886719, "global_step": 66620, "epoch": 396} {"train_loss": -8.762319564819336, "global_step": 66621, "epoch": 396} {"train_loss": -8.837355613708496, "global_step": 66622, "epoch": 396} {"train_loss": -8.91172981262207, "global_step": 66623, "epoch": 396} {"train_loss": -8.83352279663086, "global_step": 66624, "epoch": 396} {"train_loss": -8.760436058044434, "global_step": 66625, "epoch": 396} {"train_loss": -8.957012176513672, "global_step": 66626, "epoch": 396} {"train_loss": -8.69176959991455, "global_step": 66627, "epoch": 396} {"train_loss": -8.995240211486816, "global_step": 66628, "epoch": 396} {"train_loss": -9.03647232055664, "global_step": 66629, "epoch": 396} {"train_loss": -8.919536590576172, "global_step": 66630, "epoch": 396} {"train_loss": -8.749725341796875, "global_step": 66631, "epoch": 396} {"train_loss": -8.8088960647583, "global_step": 66632, "epoch": 396} {"train_loss": -9.03714370727539, "global_step": 66633, "epoch": 396} {"train_loss": -9.13107967376709, "global_step": 66634, "epoch": 396} {"train_loss": -8.815383911132812, "global_step": 66635, "epoch": 396} {"train_loss": -9.020654678344727, "global_step": 66636, "epoch": 396} {"train_loss": -8.75789737701416, "global_step": 66637, "epoch": 396} {"train_loss": -9.009366989135742, "global_step": 66638, "epoch": 396} {"train_loss": -9.116058349609375, "global_step": 66639, "epoch": 396} {"train_loss": -8.660898208618164, "global_step": 66640, "epoch": 396} {"train_loss": -8.664752960205078, "global_step": 66641, "epoch": 396} {"train_loss": -8.828973770141602, "global_step": 66642, "epoch": 396} {"train_loss": -8.951583862304688, "global_step": 66643, "epoch": 396} {"train_loss": -9.04243278503418, "global_step": 66644, "epoch": 396} {"train_loss": -8.98847484588623, "global_step": 66645, "epoch": 396} {"train_loss": -8.690189361572266, "global_step": 66646, "epoch": 396} {"train_loss": -8.545150756835938, "global_step": 66647, "epoch": 396} {"train_loss": -8.920915603637695, "global_step": 66648, "epoch": 396} {"train_loss": -8.83525562286377, "global_step": 66649, "epoch": 396} {"train_loss": -8.848472595214844, "global_step": 66650, "epoch": 396} {"train_loss": -8.845901489257812, "global_step": 66651, "epoch": 396} {"train_loss": -8.824431419372559, "global_step": 66652, "epoch": 396} {"train_loss": -8.78300666809082, "global_step": 66653, "epoch": 396} {"train_loss": -9.157608032226562, "global_step": 66654, "epoch": 396} {"train_loss": -8.655630111694336, "global_step": 66655, "epoch": 396} {"train_loss": -8.75196647644043, "global_step": 66656, "epoch": 396} {"train_loss": -8.775419235229492, "global_step": 66657, "epoch": 396} {"train_loss": -8.591320037841797, "global_step": 66658, "epoch": 396} {"train_loss": -8.7660551071167, "global_step": 66659, "epoch": 396} {"train_loss": -8.823529243469238, "global_step": 66660, "epoch": 396} {"train_loss": -8.466363906860352, "global_step": 66661, "epoch": 396} {"train_loss": -8.662428855895996, "global_step": 66662, "epoch": 396} {"train_loss": -9.094806671142578, "global_step": 66663, "epoch": 396} {"train_loss": -8.66779899597168, "global_step": 66664, "epoch": 396} {"train_loss": -8.926337242126465, "global_step": 66665, "epoch": 396} {"train_loss": -8.777789115905762, "global_step": 66666, "epoch": 396} {"train_loss": -8.75610065460205, "global_step": 66667, "epoch": 396} {"train_loss": -9.044116020202637, "global_step": 66668, "epoch": 396} {"train_loss": -8.80154037475586, "global_step": 66669, "epoch": 396} {"train_loss": -8.773561477661133, "global_step": 66670, "epoch": 396} {"train_loss": -8.790667533874512, "global_step": 66671, "epoch": 396} {"train_loss": -8.980451583862305, "global_step": 66672, "epoch": 396} {"train_loss": -8.779117584228516, "global_step": 66673, "epoch": 396} {"train_loss": -8.693953514099121, "global_step": 66674, "epoch": 396} {"train_loss": -8.81060791015625, "global_step": 66675, "epoch": 396} {"train_loss": -9.08351993560791, "global_step": 66676, "epoch": 396} {"train_loss": -8.740124702453613, "global_step": 66677, "epoch": 396} {"train_loss": -8.926897048950195, "global_step": 66678, "epoch": 396} {"train_loss": -8.959789276123047, "global_step": 66679, "epoch": 396} {"train_loss": -8.999652862548828, "global_step": 66680, "epoch": 396} {"train_loss": -9.036346435546875, "global_step": 66681, "epoch": 396} {"train_loss": -8.966035842895508, "global_step": 66682, "epoch": 396} {"train_loss": -9.162508010864258, "global_step": 66683, "epoch": 396} {"train_loss": -8.857963562011719, "global_step": 66684, "epoch": 396} {"train_loss": -9.159955978393555, "global_step": 66685, "epoch": 396} {"train_loss": -9.069263458251953, "global_step": 66686, "epoch": 396} {"train_loss": -9.078926086425781, "global_step": 66687, "epoch": 396} {"train_loss": -8.925068855285645, "global_step": 66688, "epoch": 396} {"train_loss": -9.006840705871582, "global_step": 66689, "epoch": 396} {"train_loss": -9.075860977172852, "global_step": 66690, "epoch": 396} {"train_loss": -8.92397689819336, "global_step": 66691, "epoch": 396} {"train_loss": -8.802732467651367, "global_step": 66692, "epoch": 396} {"train_loss": -8.780312538146973, "global_step": 66693, "epoch": 396} {"train_loss": -9.129721641540527, "global_step": 66694, "epoch": 396} {"train_loss": -8.859430682091485, "global_step": 66695, "epoch": 396, "val_loss": 191953.671875} {"train_loss": -8.959270477294922, "global_step": 66696, "epoch": 397} {"train_loss": -8.441516876220703, "global_step": 66697, "epoch": 397} {"train_loss": -8.772555351257324, "global_step": 66698, "epoch": 397} {"train_loss": -8.42640209197998, "global_step": 66699, "epoch": 397} {"train_loss": -8.174260139465332, "global_step": 66700, "epoch": 397} {"train_loss": -8.241896629333496, "global_step": 66701, "epoch": 397} {"train_loss": -8.87186050415039, "global_step": 66702, "epoch": 397} {"train_loss": -8.740629196166992, "global_step": 66703, "epoch": 397} {"train_loss": -8.391120910644531, "global_step": 66704, "epoch": 397} {"train_loss": -8.564836502075195, "global_step": 66705, "epoch": 397} {"train_loss": -8.391782760620117, "global_step": 66706, "epoch": 397} {"train_loss": -8.448014259338379, "global_step": 66707, "epoch": 397} {"train_loss": -8.27737045288086, "global_step": 66708, "epoch": 397} {"train_loss": -8.659916877746582, "global_step": 66709, "epoch": 397} {"train_loss": -8.517454147338867, "global_step": 66710, "epoch": 397} {"train_loss": -8.873546600341797, "global_step": 66711, "epoch": 397} {"train_loss": -8.59195327758789, "global_step": 66712, "epoch": 397} {"train_loss": -8.501642227172852, "global_step": 66713, "epoch": 397} {"train_loss": -8.384941101074219, "global_step": 66714, "epoch": 397} {"train_loss": -8.44941520690918, "global_step": 66715, "epoch": 397} {"train_loss": -8.029967308044434, "global_step": 66716, "epoch": 397} {"train_loss": -8.169656753540039, "global_step": 66717, "epoch": 397} {"train_loss": -8.267049789428711, "global_step": 66718, "epoch": 397} {"train_loss": -8.578657150268555, "global_step": 66719, "epoch": 397} {"train_loss": -8.571292877197266, "global_step": 66720, "epoch": 397} {"train_loss": -8.370957374572754, "global_step": 66721, "epoch": 397} {"train_loss": -8.555337905883789, "global_step": 66722, "epoch": 397} {"train_loss": -8.57299518585205, "global_step": 66723, "epoch": 397} {"train_loss": -8.622173309326172, "global_step": 66724, "epoch": 397} {"train_loss": -8.599485397338867, "global_step": 66725, "epoch": 397} {"train_loss": -8.541903495788574, "global_step": 66726, "epoch": 397} {"train_loss": -8.583230018615723, "global_step": 66727, "epoch": 397} {"train_loss": -8.726280212402344, "global_step": 66728, "epoch": 397} {"train_loss": -8.730463981628418, "global_step": 66729, "epoch": 397} {"train_loss": -8.699064254760742, "global_step": 66730, "epoch": 397} {"train_loss": -8.803932189941406, "global_step": 66731, "epoch": 397} {"train_loss": -8.641624450683594, "global_step": 66732, "epoch": 397} {"train_loss": -8.881097793579102, "global_step": 66733, "epoch": 397} {"train_loss": -8.684553146362305, "global_step": 66734, "epoch": 397} {"train_loss": -8.763493537902832, "global_step": 66735, "epoch": 397} {"train_loss": -8.67195987701416, "global_step": 66736, "epoch": 397} {"train_loss": -8.840015411376953, "global_step": 66737, "epoch": 397} {"train_loss": -8.892626762390137, "global_step": 66738, "epoch": 397} {"train_loss": -8.911006927490234, "global_step": 66739, "epoch": 397} {"train_loss": -9.085351943969727, "global_step": 66740, "epoch": 397} {"train_loss": -8.945356369018555, "global_step": 66741, "epoch": 397} {"train_loss": -8.945417404174805, "global_step": 66742, "epoch": 397} {"train_loss": -8.848159790039062, "global_step": 66743, "epoch": 397} {"train_loss": -9.074871063232422, "global_step": 66744, "epoch": 397} {"train_loss": -9.214519500732422, "global_step": 66745, "epoch": 397} {"train_loss": -8.932390213012695, "global_step": 66746, "epoch": 397} {"train_loss": -9.002706527709961, "global_step": 66747, "epoch": 397} {"train_loss": -8.941997528076172, "global_step": 66748, "epoch": 397} {"train_loss": -9.092711448669434, "global_step": 66749, "epoch": 397} {"train_loss": -9.109347343444824, "global_step": 66750, "epoch": 397} {"train_loss": -8.414277076721191, "global_step": 66751, "epoch": 397} {"train_loss": -8.937355041503906, "global_step": 66752, "epoch": 397} {"train_loss": -8.906953811645508, "global_step": 66753, "epoch": 397} {"train_loss": -8.937674522399902, "global_step": 66754, "epoch": 397} {"train_loss": -8.62753677368164, "global_step": 66755, "epoch": 397} {"train_loss": -8.847146987915039, "global_step": 66756, "epoch": 397} {"train_loss": -8.933675765991211, "global_step": 66757, "epoch": 397} {"train_loss": -9.110448837280273, "global_step": 66758, "epoch": 397} {"train_loss": -8.317567825317383, "global_step": 66759, "epoch": 397} {"train_loss": -8.427007675170898, "global_step": 66760, "epoch": 397} {"train_loss": -8.24913215637207, "global_step": 66761, "epoch": 397} {"train_loss": -8.743410110473633, "global_step": 66762, "epoch": 397} {"train_loss": -8.149030685424805, "global_step": 66763, "epoch": 397} {"train_loss": -8.590105056762695, "global_step": 66764, "epoch": 397} {"train_loss": -8.346060752868652, "global_step": 66765, "epoch": 397} {"train_loss": -8.412590980529785, "global_step": 66766, "epoch": 397} {"train_loss": -8.632927894592285, "global_step": 66767, "epoch": 397} {"train_loss": -8.528858184814453, "global_step": 66768, "epoch": 397} {"train_loss": -8.483793258666992, "global_step": 66769, "epoch": 397} {"train_loss": -8.45272445678711, "global_step": 66770, "epoch": 397} {"train_loss": -8.458375930786133, "global_step": 66771, "epoch": 397} {"train_loss": -8.675270080566406, "global_step": 66772, "epoch": 397} {"train_loss": -8.394279479980469, "global_step": 66773, "epoch": 397} {"train_loss": -8.665183067321777, "global_step": 66774, "epoch": 397} {"train_loss": -8.705317497253418, "global_step": 66775, "epoch": 397} {"train_loss": -8.573387145996094, "global_step": 66776, "epoch": 397} {"train_loss": -8.60185432434082, "global_step": 66777, "epoch": 397} {"train_loss": -8.551115989685059, "global_step": 66778, "epoch": 397} {"train_loss": -8.593825340270996, "global_step": 66779, "epoch": 397} {"train_loss": -8.659688949584961, "global_step": 66780, "epoch": 397} {"train_loss": -8.893474578857422, "global_step": 66781, "epoch": 397} {"train_loss": -8.882772445678711, "global_step": 66782, "epoch": 397} {"train_loss": -8.844133377075195, "global_step": 66783, "epoch": 397} {"train_loss": -8.87967300415039, "global_step": 66784, "epoch": 397} {"train_loss": -8.796236991882324, "global_step": 66785, "epoch": 397} {"train_loss": -8.719795227050781, "global_step": 66786, "epoch": 397} {"train_loss": -8.877944946289062, "global_step": 66787, "epoch": 397} {"train_loss": -8.899425506591797, "global_step": 66788, "epoch": 397} {"train_loss": -8.851072311401367, "global_step": 66789, "epoch": 397} {"train_loss": -9.040799140930176, "global_step": 66790, "epoch": 397} {"train_loss": -8.790346145629883, "global_step": 66791, "epoch": 397} {"train_loss": -8.728500366210938, "global_step": 66792, "epoch": 397} {"train_loss": -9.062544822692871, "global_step": 66793, "epoch": 397} {"train_loss": -9.042415618896484, "global_step": 66794, "epoch": 397} {"train_loss": -8.932674407958984, "global_step": 66795, "epoch": 397} {"train_loss": -9.099194526672363, "global_step": 66796, "epoch": 397} {"train_loss": -8.900260925292969, "global_step": 66797, "epoch": 397} {"train_loss": -9.135049819946289, "global_step": 66798, "epoch": 397} {"train_loss": -9.123613357543945, "global_step": 66799, "epoch": 397} {"train_loss": -8.954729080200195, "global_step": 66800, "epoch": 397} {"train_loss": -9.129467010498047, "global_step": 66801, "epoch": 397} {"train_loss": -9.191469192504883, "global_step": 66802, "epoch": 397} {"train_loss": -9.00368881225586, "global_step": 66803, "epoch": 397} {"train_loss": -9.211140632629395, "global_step": 66804, "epoch": 397} {"train_loss": -8.775970458984375, "global_step": 66805, "epoch": 397} {"train_loss": -9.037832260131836, "global_step": 66806, "epoch": 397} {"train_loss": -8.958639144897461, "global_step": 66807, "epoch": 397} {"train_loss": -8.949880599975586, "global_step": 66808, "epoch": 397} {"train_loss": -8.92039680480957, "global_step": 66809, "epoch": 397} {"train_loss": -8.874561309814453, "global_step": 66810, "epoch": 397} {"train_loss": -8.835893630981445, "global_step": 66811, "epoch": 397} {"train_loss": -8.942084312438965, "global_step": 66812, "epoch": 397} {"train_loss": -9.082837104797363, "global_step": 66813, "epoch": 397} {"train_loss": -8.970499038696289, "global_step": 66814, "epoch": 397} {"train_loss": -8.767036437988281, "global_step": 66815, "epoch": 397} {"train_loss": -9.09869384765625, "global_step": 66816, "epoch": 397} {"train_loss": -8.608744621276855, "global_step": 66817, "epoch": 397} {"train_loss": -9.098764419555664, "global_step": 66818, "epoch": 397} {"train_loss": -8.582908630371094, "global_step": 66819, "epoch": 397} {"train_loss": -9.027488708496094, "global_step": 66820, "epoch": 397} {"train_loss": -8.903003692626953, "global_step": 66821, "epoch": 397} {"train_loss": -8.757715225219727, "global_step": 66822, "epoch": 397} {"train_loss": -8.685358047485352, "global_step": 66823, "epoch": 397} {"train_loss": -8.605180740356445, "global_step": 66824, "epoch": 397} {"train_loss": -8.814475059509277, "global_step": 66825, "epoch": 397} {"train_loss": -8.734526634216309, "global_step": 66826, "epoch": 397} {"train_loss": -8.813478469848633, "global_step": 66827, "epoch": 397} {"train_loss": -8.69813346862793, "global_step": 66828, "epoch": 397} {"train_loss": -8.559314727783203, "global_step": 66829, "epoch": 397} {"train_loss": -8.571430206298828, "global_step": 66830, "epoch": 397} {"train_loss": -8.848703384399414, "global_step": 66831, "epoch": 397} {"train_loss": -8.4609375, "global_step": 66832, "epoch": 397} {"train_loss": -8.650416374206543, "global_step": 66833, "epoch": 397} {"train_loss": -8.704758644104004, "global_step": 66834, "epoch": 397} {"train_loss": -8.652969360351562, "global_step": 66835, "epoch": 397} {"train_loss": -8.805795669555664, "global_step": 66836, "epoch": 397} {"train_loss": -8.586861610412598, "global_step": 66837, "epoch": 397} {"train_loss": -8.805974960327148, "global_step": 66838, "epoch": 397} {"train_loss": -8.712423324584961, "global_step": 66839, "epoch": 397} {"train_loss": -8.755048751831055, "global_step": 66840, "epoch": 397} {"train_loss": -8.754192352294922, "global_step": 66841, "epoch": 397} {"train_loss": -8.730738639831543, "global_step": 66842, "epoch": 397} {"train_loss": -8.627910614013672, "global_step": 66843, "epoch": 397} {"train_loss": -8.703224182128906, "global_step": 66844, "epoch": 397} {"train_loss": -8.916328430175781, "global_step": 66845, "epoch": 397} {"train_loss": -8.659961700439453, "global_step": 66846, "epoch": 397} {"train_loss": -8.84298324584961, "global_step": 66847, "epoch": 397} {"train_loss": -8.771265983581543, "global_step": 66848, "epoch": 397} {"train_loss": -8.562623977661133, "global_step": 66849, "epoch": 397} {"train_loss": -8.816427230834961, "global_step": 66850, "epoch": 397} {"train_loss": -8.842825889587402, "global_step": 66851, "epoch": 397} {"train_loss": -8.900389671325684, "global_step": 66852, "epoch": 397} {"train_loss": -8.884753227233887, "global_step": 66853, "epoch": 397} {"train_loss": -8.874734878540039, "global_step": 66854, "epoch": 397} {"train_loss": -8.9622802734375, "global_step": 66855, "epoch": 397} {"train_loss": -8.943623542785645, "global_step": 66856, "epoch": 397} {"train_loss": -8.694567680358887, "global_step": 66857, "epoch": 397} {"train_loss": -8.806951522827148, "global_step": 66858, "epoch": 397} {"train_loss": -8.862165451049805, "global_step": 66859, "epoch": 397} {"train_loss": -8.734634399414062, "global_step": 66860, "epoch": 397} {"train_loss": -9.005807876586914, "global_step": 66861, "epoch": 397} {"train_loss": -8.813430786132812, "global_step": 66862, "epoch": 397} {"train_loss": -8.743112938744682, "global_step": 66863, "epoch": 397, "val_loss": 192930.96875} {"train_loss": -8.715998649597168, "global_step": 66864, "epoch": 398} {"train_loss": -8.872742652893066, "global_step": 66865, "epoch": 398} {"train_loss": -8.777796745300293, "global_step": 66866, "epoch": 398} {"train_loss": -8.979686737060547, "global_step": 66867, "epoch": 398} {"train_loss": -8.97459888458252, "global_step": 66868, "epoch": 398} {"train_loss": -8.87887954711914, "global_step": 66869, "epoch": 398} {"train_loss": -8.696091651916504, "global_step": 66870, "epoch": 398} {"train_loss": -8.94896125793457, "global_step": 66871, "epoch": 398} {"train_loss": -8.680885314941406, "global_step": 66872, "epoch": 398} {"train_loss": -8.815505027770996, "global_step": 66873, "epoch": 398} {"train_loss": -8.840190887451172, "global_step": 66874, "epoch": 398} {"train_loss": -8.825763702392578, "global_step": 66875, "epoch": 398} {"train_loss": -8.578594207763672, "global_step": 66876, "epoch": 398} {"train_loss": -8.564399719238281, "global_step": 66877, "epoch": 398} {"train_loss": -8.90837574005127, "global_step": 66878, "epoch": 398} {"train_loss": -8.817313194274902, "global_step": 66879, "epoch": 398} {"train_loss": -8.739604949951172, "global_step": 66880, "epoch": 398} {"train_loss": -8.730634689331055, "global_step": 66881, "epoch": 398} {"train_loss": -8.636832237243652, "global_step": 66882, "epoch": 398} {"train_loss": -8.739501953125, "global_step": 66883, "epoch": 398} {"train_loss": -8.784149169921875, "global_step": 66884, "epoch": 398} {"train_loss": -8.931093215942383, "global_step": 66885, "epoch": 398} {"train_loss": -8.679513931274414, "global_step": 66886, "epoch": 398} {"train_loss": -8.858699798583984, "global_step": 66887, "epoch": 398} {"train_loss": -8.913029670715332, "global_step": 66888, "epoch": 398} {"train_loss": -8.895345687866211, "global_step": 66889, "epoch": 398} {"train_loss": -8.766470909118652, "global_step": 66890, "epoch": 398} {"train_loss": -8.97829818725586, "global_step": 66891, "epoch": 398} {"train_loss": -8.98251724243164, "global_step": 66892, "epoch": 398} {"train_loss": -8.963979721069336, "global_step": 66893, "epoch": 398} {"train_loss": -9.02967643737793, "global_step": 66894, "epoch": 398} {"train_loss": -8.952017784118652, "global_step": 66895, "epoch": 398} {"train_loss": -8.862693786621094, "global_step": 66896, "epoch": 398} {"train_loss": -8.685667037963867, "global_step": 66897, "epoch": 398} {"train_loss": -9.030851364135742, "global_step": 66898, "epoch": 398} {"train_loss": -8.741421699523926, "global_step": 66899, "epoch": 398} {"train_loss": -9.032987594604492, "global_step": 66900, "epoch": 398} {"train_loss": -8.769987106323242, "global_step": 66901, "epoch": 398} {"train_loss": -8.541089057922363, "global_step": 66902, "epoch": 398} {"train_loss": -8.94987964630127, "global_step": 66903, "epoch": 398} {"train_loss": -8.926139831542969, "global_step": 66904, "epoch": 398} {"train_loss": -8.873147964477539, "global_step": 66905, "epoch": 398} {"train_loss": -8.761857986450195, "global_step": 66906, "epoch": 398} {"train_loss": -8.940898895263672, "global_step": 66907, "epoch": 398} {"train_loss": -8.871538162231445, "global_step": 66908, "epoch": 398} {"train_loss": -8.811561584472656, "global_step": 66909, "epoch": 398} {"train_loss": -8.71795654296875, "global_step": 66910, "epoch": 398} {"train_loss": -8.835498809814453, "global_step": 66911, "epoch": 398} {"train_loss": -8.79539966583252, "global_step": 66912, "epoch": 398} {"train_loss": -8.889049530029297, "global_step": 66913, "epoch": 398} {"train_loss": -8.87138557434082, "global_step": 66914, "epoch": 398} {"train_loss": -8.86805534362793, "global_step": 66915, "epoch": 398} {"train_loss": -9.004495620727539, "global_step": 66916, "epoch": 398} {"train_loss": -8.924302101135254, "global_step": 66917, "epoch": 398} {"train_loss": -8.99099063873291, "global_step": 66918, "epoch": 398} {"train_loss": -8.960851669311523, "global_step": 66919, "epoch": 398} {"train_loss": -8.913887977600098, "global_step": 66920, "epoch": 398} {"train_loss": -8.8883056640625, "global_step": 66921, "epoch": 398} {"train_loss": -8.94371223449707, "global_step": 66922, "epoch": 398} {"train_loss": -8.989559173583984, "global_step": 66923, "epoch": 398} {"train_loss": -8.753135681152344, "global_step": 66924, "epoch": 398} {"train_loss": -8.812374114990234, "global_step": 66925, "epoch": 398} {"train_loss": -9.005636215209961, "global_step": 66926, "epoch": 398} {"train_loss": -8.795516014099121, "global_step": 66927, "epoch": 398} {"train_loss": -9.005605697631836, "global_step": 66928, "epoch": 398} {"train_loss": -8.716514587402344, "global_step": 66929, "epoch": 398} {"train_loss": -8.612224578857422, "global_step": 66930, "epoch": 398} {"train_loss": -8.627069473266602, "global_step": 66931, "epoch": 398} {"train_loss": -8.991649627685547, "global_step": 66932, "epoch": 398} {"train_loss": -8.909536361694336, "global_step": 66933, "epoch": 398} {"train_loss": -8.803689956665039, "global_step": 66934, "epoch": 398} {"train_loss": -9.05041217803955, "global_step": 66935, "epoch": 398} {"train_loss": -8.840227127075195, "global_step": 66936, "epoch": 398} {"train_loss": -8.867071151733398, "global_step": 66937, "epoch": 398} {"train_loss": -8.816040992736816, "global_step": 66938, "epoch": 398} {"train_loss": -8.971209526062012, "global_step": 66939, "epoch": 398} {"train_loss": -8.836081504821777, "global_step": 66940, "epoch": 398} {"train_loss": -8.764471054077148, "global_step": 66941, "epoch": 398} {"train_loss": -8.847674369812012, "global_step": 66942, "epoch": 398} {"train_loss": -8.573371887207031, "global_step": 66943, "epoch": 398} {"train_loss": -8.545709609985352, "global_step": 66944, "epoch": 398} {"train_loss": -8.645430564880371, "global_step": 66945, "epoch": 398} {"train_loss": -8.320379257202148, "global_step": 66946, "epoch": 398} {"train_loss": -8.25381088256836, "global_step": 66947, "epoch": 398} {"train_loss": -8.486737251281738, "global_step": 66948, "epoch": 398} {"train_loss": -8.421854972839355, "global_step": 66949, "epoch": 398} {"train_loss": -8.410236358642578, "global_step": 66950, "epoch": 398} {"train_loss": -8.472818374633789, "global_step": 66951, "epoch": 398} {"train_loss": -8.499907493591309, "global_step": 66952, "epoch": 398} {"train_loss": -8.61507797241211, "global_step": 66953, "epoch": 398} {"train_loss": -8.62263298034668, "global_step": 66954, "epoch": 398} {"train_loss": -8.831075668334961, "global_step": 66955, "epoch": 398} {"train_loss": -8.594095230102539, "global_step": 66956, "epoch": 398} {"train_loss": -8.681293487548828, "global_step": 66957, "epoch": 398} {"train_loss": -8.813783645629883, "global_step": 66958, "epoch": 398} {"train_loss": -8.708284378051758, "global_step": 66959, "epoch": 398} {"train_loss": -8.618453025817871, "global_step": 66960, "epoch": 398} {"train_loss": -8.803642272949219, "global_step": 66961, "epoch": 398} {"train_loss": -8.453458786010742, "global_step": 66962, "epoch": 398} {"train_loss": -8.816644668579102, "global_step": 66963, "epoch": 398} {"train_loss": -8.603707313537598, "global_step": 66964, "epoch": 398} {"train_loss": -8.59348201751709, "global_step": 66965, "epoch": 398} {"train_loss": -8.64993667602539, "global_step": 66966, "epoch": 398} {"train_loss": -8.646308898925781, "global_step": 66967, "epoch": 398} {"train_loss": -8.631263732910156, "global_step": 66968, "epoch": 398} {"train_loss": -8.707230567932129, "global_step": 66969, "epoch": 398} {"train_loss": -8.853265762329102, "global_step": 66970, "epoch": 398} {"train_loss": -9.01881217956543, "global_step": 66971, "epoch": 398} {"train_loss": -8.649219512939453, "global_step": 66972, "epoch": 398} {"train_loss": -8.698492050170898, "global_step": 66973, "epoch": 398} {"train_loss": -8.827110290527344, "global_step": 66974, "epoch": 398} {"train_loss": -8.371292114257812, "global_step": 66975, "epoch": 398} {"train_loss": -8.932378768920898, "global_step": 66976, "epoch": 398} {"train_loss": -8.753141403198242, "global_step": 66977, "epoch": 398} {"train_loss": -8.904243469238281, "global_step": 66978, "epoch": 398} {"train_loss": -8.500657081604004, "global_step": 66979, "epoch": 398} {"train_loss": -8.84188461303711, "global_step": 66980, "epoch": 398} {"train_loss": -9.08790397644043, "global_step": 66981, "epoch": 398} {"train_loss": -8.773566246032715, "global_step": 66982, "epoch": 398} {"train_loss": -9.102996826171875, "global_step": 66983, "epoch": 398} {"train_loss": -8.753068923950195, "global_step": 66984, "epoch": 398} {"train_loss": -8.948253631591797, "global_step": 66985, "epoch": 398} {"train_loss": -8.872437477111816, "global_step": 66986, "epoch": 398} {"train_loss": -8.962629318237305, "global_step": 66987, "epoch": 398} {"train_loss": -8.748218536376953, "global_step": 66988, "epoch": 398} {"train_loss": -9.078514099121094, "global_step": 66989, "epoch": 398} {"train_loss": -8.615975379943848, "global_step": 66990, "epoch": 398} {"train_loss": -8.771110534667969, "global_step": 66991, "epoch": 398} {"train_loss": -8.466022491455078, "global_step": 66992, "epoch": 398} {"train_loss": -8.891138076782227, "global_step": 66993, "epoch": 398} {"train_loss": -8.715862274169922, "global_step": 66994, "epoch": 398} {"train_loss": -8.670234680175781, "global_step": 66995, "epoch": 398} {"train_loss": -8.72497844696045, "global_step": 66996, "epoch": 398} {"train_loss": -8.831298828125, "global_step": 66997, "epoch": 398} {"train_loss": -8.711944580078125, "global_step": 66998, "epoch": 398} {"train_loss": -8.66451644897461, "global_step": 66999, "epoch": 398} {"train_loss": -8.847134590148926, "global_step": 67000, "epoch": 398} {"train_loss": -8.821521759033203, "global_step": 67001, "epoch": 398} {"train_loss": -8.856346130371094, "global_step": 67002, "epoch": 398} {"train_loss": -9.029877662658691, "global_step": 67003, "epoch": 398} {"train_loss": -8.755550384521484, "global_step": 67004, "epoch": 398} {"train_loss": -8.70435905456543, "global_step": 67005, "epoch": 398} {"train_loss": -9.019266128540039, "global_step": 67006, "epoch": 398} {"train_loss": -8.791778564453125, "global_step": 67007, "epoch": 398} {"train_loss": -8.918663024902344, "global_step": 67008, "epoch": 398} {"train_loss": -8.67789077758789, "global_step": 67009, "epoch": 398} {"train_loss": -9.022064208984375, "global_step": 67010, "epoch": 398} {"train_loss": -8.788147926330566, "global_step": 67011, "epoch": 398} {"train_loss": -8.698017120361328, "global_step": 67012, "epoch": 398} {"train_loss": -8.944271087646484, "global_step": 67013, "epoch": 398} {"train_loss": -8.82819938659668, "global_step": 67014, "epoch": 398} {"train_loss": -8.892495155334473, "global_step": 67015, "epoch": 398} {"train_loss": -8.999046325683594, "global_step": 67016, "epoch": 398} {"train_loss": -8.926094055175781, "global_step": 67017, "epoch": 398} {"train_loss": -9.046886444091797, "global_step": 67018, "epoch": 398} {"train_loss": -8.93643569946289, "global_step": 67019, "epoch": 398} {"train_loss": -9.09687328338623, "global_step": 67020, "epoch": 398} {"train_loss": -8.759857177734375, "global_step": 67021, "epoch": 398} {"train_loss": -8.858370780944824, "global_step": 67022, "epoch": 398} {"train_loss": -8.883363723754883, "global_step": 67023, "epoch": 398} {"train_loss": -8.926913261413574, "global_step": 67024, "epoch": 398} {"train_loss": -8.817167282104492, "global_step": 67025, "epoch": 398} {"train_loss": -8.817083358764648, "global_step": 67026, "epoch": 398} {"train_loss": -8.921757698059082, "global_step": 67027, "epoch": 398} {"train_loss": -8.899484634399414, "global_step": 67028, "epoch": 398} {"train_loss": -8.844364166259766, "global_step": 67029, "epoch": 398} {"train_loss": -8.806829452514648, "global_step": 67030, "epoch": 398} {"train_loss": -8.800706613631476, "global_step": 67031, "epoch": 398, "val_loss": 190577.78125} {"train_loss": -8.917491912841797, "global_step": 67032, "epoch": 399} {"train_loss": -8.978933334350586, "global_step": 67033, "epoch": 399} {"train_loss": -8.615886688232422, "global_step": 67034, "epoch": 399} {"train_loss": -8.615717887878418, "global_step": 67035, "epoch": 399} {"train_loss": -8.941930770874023, "global_step": 67036, "epoch": 399} {"train_loss": -8.739477157592773, "global_step": 67037, "epoch": 399} {"train_loss": -8.646059036254883, "global_step": 67038, "epoch": 399} {"train_loss": -8.926852226257324, "global_step": 67039, "epoch": 399} {"train_loss": -8.754613876342773, "global_step": 67040, "epoch": 399} {"train_loss": -8.781010627746582, "global_step": 67041, "epoch": 399} {"train_loss": -8.674102783203125, "global_step": 67042, "epoch": 399} {"train_loss": -8.702676773071289, "global_step": 67043, "epoch": 399} {"train_loss": -8.551060676574707, "global_step": 67044, "epoch": 399} {"train_loss": -8.838574409484863, "global_step": 67045, "epoch": 399} {"train_loss": -8.381851196289062, "global_step": 67046, "epoch": 399} {"train_loss": -8.755110740661621, "global_step": 67047, "epoch": 399} {"train_loss": -8.567047119140625, "global_step": 67048, "epoch": 399} {"train_loss": -8.569307327270508, "global_step": 67049, "epoch": 399} {"train_loss": -8.658356666564941, "global_step": 67050, "epoch": 399} {"train_loss": -8.475336074829102, "global_step": 67051, "epoch": 399} {"train_loss": -9.000267028808594, "global_step": 67052, "epoch": 399} {"train_loss": -8.775177955627441, "global_step": 67053, "epoch": 399} {"train_loss": -8.802074432373047, "global_step": 67054, "epoch": 399} {"train_loss": -8.719744682312012, "global_step": 67055, "epoch": 399} {"train_loss": -8.943766593933105, "global_step": 67056, "epoch": 399} {"train_loss": -8.762717247009277, "global_step": 67057, "epoch": 399} {"train_loss": -8.785704612731934, "global_step": 67058, "epoch": 399} {"train_loss": -8.89146614074707, "global_step": 67059, "epoch": 399} {"train_loss": -8.989023208618164, "global_step": 67060, "epoch": 399} {"train_loss": -8.904592514038086, "global_step": 67061, "epoch": 399} {"train_loss": -8.81956672668457, "global_step": 67062, "epoch": 399} {"train_loss": -8.89860725402832, "global_step": 67063, "epoch": 399} {"train_loss": -9.195363998413086, "global_step": 67064, "epoch": 399} {"train_loss": -8.719036102294922, "global_step": 67065, "epoch": 399} {"train_loss": -8.928203582763672, "global_step": 67066, "epoch": 399} {"train_loss": -8.822181701660156, "global_step": 67067, "epoch": 399} {"train_loss": -9.094608306884766, "global_step": 67068, "epoch": 399} {"train_loss": -8.73828411102295, "global_step": 67069, "epoch": 399} {"train_loss": -9.03342056274414, "global_step": 67070, "epoch": 399} {"train_loss": -9.212008476257324, "global_step": 67071, "epoch": 399} {"train_loss": -9.014485359191895, "global_step": 67072, "epoch": 399} {"train_loss": -9.023548126220703, "global_step": 67073, "epoch": 399} {"train_loss": -9.273202896118164, "global_step": 67074, "epoch": 399} {"train_loss": -8.733448028564453, "global_step": 67075, "epoch": 399} {"train_loss": -9.133909225463867, "global_step": 67076, "epoch": 399} {"train_loss": -8.89225959777832, "global_step": 67077, "epoch": 399} {"train_loss": -8.831284523010254, "global_step": 67078, "epoch": 399} {"train_loss": -8.689300537109375, "global_step": 67079, "epoch": 399} {"train_loss": -9.042329788208008, "global_step": 67080, "epoch": 399} {"train_loss": -8.902898788452148, "global_step": 67081, "epoch": 399} {"train_loss": -9.188050270080566, "global_step": 67082, "epoch": 399} {"train_loss": -8.978325843811035, "global_step": 67083, "epoch": 399} {"train_loss": -8.969758987426758, "global_step": 67084, "epoch": 399} {"train_loss": -8.958379745483398, "global_step": 67085, "epoch": 399} {"train_loss": -8.933805465698242, "global_step": 67086, "epoch": 399} {"train_loss": -8.957731246948242, "global_step": 67087, "epoch": 399} {"train_loss": -9.261802673339844, "global_step": 67088, "epoch": 399} {"train_loss": -8.698042869567871, "global_step": 67089, "epoch": 399} {"train_loss": -8.852310180664062, "global_step": 67090, "epoch": 399} {"train_loss": -9.139507293701172, "global_step": 67091, "epoch": 399} {"train_loss": -8.790491104125977, "global_step": 67092, "epoch": 399} {"train_loss": -9.116609573364258, "global_step": 67093, "epoch": 399} {"train_loss": -8.815608024597168, "global_step": 67094, "epoch": 399} {"train_loss": -8.94973087310791, "global_step": 67095, "epoch": 399} {"train_loss": -8.913189888000488, "global_step": 67096, "epoch": 399} {"train_loss": -9.157618522644043, "global_step": 67097, "epoch": 399} {"train_loss": -8.827476501464844, "global_step": 67098, "epoch": 399} {"train_loss": -8.891448974609375, "global_step": 67099, "epoch": 399} {"train_loss": -8.836204528808594, "global_step": 67100, "epoch": 399} {"train_loss": -9.051932334899902, "global_step": 67101, "epoch": 399} {"train_loss": -9.059677124023438, "global_step": 67102, "epoch": 399} {"train_loss": -8.899036407470703, "global_step": 67103, "epoch": 399} {"train_loss": -8.952786445617676, "global_step": 67104, "epoch": 399} {"train_loss": -8.86154556274414, "global_step": 67105, "epoch": 399} {"train_loss": -8.831502914428711, "global_step": 67106, "epoch": 399} {"train_loss": -8.990289688110352, "global_step": 67107, "epoch": 399} {"train_loss": -9.103784561157227, "global_step": 67108, "epoch": 399} {"train_loss": -9.120712280273438, "global_step": 67109, "epoch": 399} {"train_loss": -8.928069114685059, "global_step": 67110, "epoch": 399} {"train_loss": -8.862638473510742, "global_step": 67111, "epoch": 399} {"train_loss": -8.8707914352417, "global_step": 67112, "epoch": 399} {"train_loss": -8.889371871948242, "global_step": 67113, "epoch": 399} {"train_loss": -9.138763427734375, "global_step": 67114, "epoch": 399} {"train_loss": -9.085808753967285, "global_step": 67115, "epoch": 399} {"train_loss": -8.990676879882812, "global_step": 67116, "epoch": 399} {"train_loss": -8.843891143798828, "global_step": 67117, "epoch": 399} {"train_loss": -8.956085205078125, "global_step": 67118, "epoch": 399} {"train_loss": -8.897043228149414, "global_step": 67119, "epoch": 399} {"train_loss": -8.972947120666504, "global_step": 67120, "epoch": 399} {"train_loss": -9.010979652404785, "global_step": 67121, "epoch": 399} {"train_loss": -9.004096031188965, "global_step": 67122, "epoch": 399} {"train_loss": -9.214027404785156, "global_step": 67123, "epoch": 399} {"train_loss": -9.12746810913086, "global_step": 67124, "epoch": 399} {"train_loss": -8.91067123413086, "global_step": 67125, "epoch": 399} {"train_loss": -8.870607376098633, "global_step": 67126, "epoch": 399} {"train_loss": -8.737548828125, "global_step": 67127, "epoch": 399} {"train_loss": -8.95987319946289, "global_step": 67128, "epoch": 399} {"train_loss": -9.093352317810059, "global_step": 67129, "epoch": 399} {"train_loss": -8.95195484161377, "global_step": 67130, "epoch": 399} {"train_loss": -9.113555908203125, "global_step": 67131, "epoch": 399} {"train_loss": -8.602225303649902, "global_step": 67132, "epoch": 399} {"train_loss": -9.048752784729004, "global_step": 67133, "epoch": 399} {"train_loss": -8.363056182861328, "global_step": 67134, "epoch": 399} {"train_loss": -9.048720359802246, "global_step": 67135, "epoch": 399} {"train_loss": -8.80700397491455, "global_step": 67136, "epoch": 399} {"train_loss": -8.943851470947266, "global_step": 67137, "epoch": 399} {"train_loss": -8.5525541305542, "global_step": 67138, "epoch": 399} {"train_loss": -8.998075485229492, "global_step": 67139, "epoch": 399} {"train_loss": -8.701021194458008, "global_step": 67140, "epoch": 399} {"train_loss": -8.518226623535156, "global_step": 67141, "epoch": 399} {"train_loss": -8.857730865478516, "global_step": 67142, "epoch": 399} {"train_loss": -8.73735237121582, "global_step": 67143, "epoch": 399} {"train_loss": -8.890121459960938, "global_step": 67144, "epoch": 399} {"train_loss": -8.690934181213379, "global_step": 67145, "epoch": 399} {"train_loss": -8.734950065612793, "global_step": 67146, "epoch": 399} {"train_loss": -8.643235206604004, "global_step": 67147, "epoch": 399} {"train_loss": -8.817207336425781, "global_step": 67148, "epoch": 399} {"train_loss": -8.69015884399414, "global_step": 67149, "epoch": 399} {"train_loss": -8.773597717285156, "global_step": 67150, "epoch": 399} {"train_loss": -8.448554039001465, "global_step": 67151, "epoch": 399} {"train_loss": -8.968944549560547, "global_step": 67152, "epoch": 399} {"train_loss": -8.892500877380371, "global_step": 67153, "epoch": 399} {"train_loss": -8.669469833374023, "global_step": 67154, "epoch": 399} {"train_loss": -8.772969245910645, "global_step": 67155, "epoch": 399} {"train_loss": -8.762941360473633, "global_step": 67156, "epoch": 399} {"train_loss": -8.675869941711426, "global_step": 67157, "epoch": 399} {"train_loss": -8.537124633789062, "global_step": 67158, "epoch": 399} {"train_loss": -8.77982234954834, "global_step": 67159, "epoch": 399} {"train_loss": -8.746732711791992, "global_step": 67160, "epoch": 399} {"train_loss": -8.345524787902832, "global_step": 67161, "epoch": 399} {"train_loss": -8.434852600097656, "global_step": 67162, "epoch": 399} {"train_loss": -8.528921127319336, "global_step": 67163, "epoch": 399} {"train_loss": -8.405877113342285, "global_step": 67164, "epoch": 399} {"train_loss": -8.888521194458008, "global_step": 67165, "epoch": 399} {"train_loss": -8.771146774291992, "global_step": 67166, "epoch": 399} {"train_loss": -8.884149551391602, "global_step": 67167, "epoch": 399} {"train_loss": -8.94985580444336, "global_step": 67168, "epoch": 399} {"train_loss": -8.61463737487793, "global_step": 67169, "epoch": 399} {"train_loss": -8.97067928314209, "global_step": 67170, "epoch": 399} {"train_loss": -8.837713241577148, "global_step": 67171, "epoch": 399} {"train_loss": -8.809688568115234, "global_step": 67172, "epoch": 399} {"train_loss": -8.988008499145508, "global_step": 67173, "epoch": 399} {"train_loss": -9.059572219848633, "global_step": 67174, "epoch": 399} {"train_loss": -9.118691444396973, "global_step": 67175, "epoch": 399} {"train_loss": -8.713996887207031, "global_step": 67176, "epoch": 399} {"train_loss": -8.940364837646484, "global_step": 67177, "epoch": 399} {"train_loss": -8.994952201843262, "global_step": 67178, "epoch": 399} {"train_loss": -8.891063690185547, "global_step": 67179, "epoch": 399} {"train_loss": -8.786645889282227, "global_step": 67180, "epoch": 399} {"train_loss": -8.860508918762207, "global_step": 67181, "epoch": 399} {"train_loss": -8.679450988769531, "global_step": 67182, "epoch": 399} {"train_loss": -8.538822174072266, "global_step": 67183, "epoch": 399} {"train_loss": -8.852334976196289, "global_step": 67184, "epoch": 399} {"train_loss": -9.09223461151123, "global_step": 67185, "epoch": 399} {"train_loss": -8.525415420532227, "global_step": 67186, "epoch": 399} {"train_loss": -8.752020835876465, "global_step": 67187, "epoch": 399} {"train_loss": -8.796738624572754, "global_step": 67188, "epoch": 399} {"train_loss": -8.707229614257812, "global_step": 67189, "epoch": 399} {"train_loss": -8.902118682861328, "global_step": 67190, "epoch": 399} {"train_loss": -8.937384605407715, "global_step": 67191, "epoch": 399} {"train_loss": -8.725399017333984, "global_step": 67192, "epoch": 399} {"train_loss": -8.587014198303223, "global_step": 67193, "epoch": 399} {"train_loss": -8.729159355163574, "global_step": 67194, "epoch": 399} {"train_loss": -9.030155181884766, "global_step": 67195, "epoch": 399} {"train_loss": -8.879230499267578, "global_step": 67196, "epoch": 399} {"train_loss": -8.370295524597168, "global_step": 67197, "epoch": 399} {"train_loss": -8.69367790222168, "global_step": 67198, "epoch": 399} {"train_loss": -8.84653790224166, "global_step": 67199, "epoch": 399, "val_loss": 194242.3125} {"train_loss": -8.694908142089844, "global_step": 67200, "epoch": 400} {"train_loss": -8.73034954071045, "global_step": 67201, "epoch": 400} {"train_loss": -8.779311180114746, "global_step": 67202, "epoch": 400} {"train_loss": -8.696969032287598, "global_step": 67203, "epoch": 400} {"train_loss": -8.740785598754883, "global_step": 67204, "epoch": 400} {"train_loss": -8.997749328613281, "global_step": 67205, "epoch": 400} {"train_loss": -8.735555648803711, "global_step": 67206, "epoch": 400} {"train_loss": -8.778358459472656, "global_step": 67207, "epoch": 400} {"train_loss": -8.899486541748047, "global_step": 67208, "epoch": 400} {"train_loss": -8.812369346618652, "global_step": 67209, "epoch": 400} {"train_loss": -8.671709060668945, "global_step": 67210, "epoch": 400} {"train_loss": -8.861542701721191, "global_step": 67211, "epoch": 400} {"train_loss": -8.859195709228516, "global_step": 67212, "epoch": 400} {"train_loss": -9.03353500366211, "global_step": 67213, "epoch": 400} {"train_loss": -8.8684663772583, "global_step": 67214, "epoch": 400} {"train_loss": -8.777153015136719, "global_step": 67215, "epoch": 400} {"train_loss": -9.014892578125, "global_step": 67216, "epoch": 400} {"train_loss": -9.012659072875977, "global_step": 67217, "epoch": 400} {"train_loss": -8.92323112487793, "global_step": 67218, "epoch": 400} {"train_loss": -8.965259552001953, "global_step": 67219, "epoch": 400} {"train_loss": -9.082338333129883, "global_step": 67220, "epoch": 400} {"train_loss": -8.924575805664062, "global_step": 67221, "epoch": 400} {"train_loss": -8.819433212280273, "global_step": 67222, "epoch": 400} {"train_loss": -8.683462142944336, "global_step": 67223, "epoch": 400} {"train_loss": -9.181690216064453, "global_step": 67224, "epoch": 400} {"train_loss": -9.087181091308594, "global_step": 67225, "epoch": 400} {"train_loss": -8.797477722167969, "global_step": 67226, "epoch": 400} {"train_loss": -8.978660583496094, "global_step": 67227, "epoch": 400} {"train_loss": -8.60548210144043, "global_step": 67228, "epoch": 400} {"train_loss": -8.850800514221191, "global_step": 67229, "epoch": 400} {"train_loss": -8.959196090698242, "global_step": 67230, "epoch": 400} {"train_loss": -8.883139610290527, "global_step": 67231, "epoch": 400} {"train_loss": -9.117433547973633, "global_step": 67232, "epoch": 400} {"train_loss": -8.985725402832031, "global_step": 67233, "epoch": 400} {"train_loss": -8.749841690063477, "global_step": 67234, "epoch": 400} {"train_loss": -8.961823463439941, "global_step": 67235, "epoch": 400} {"train_loss": -8.986186981201172, "global_step": 67236, "epoch": 400} {"train_loss": -8.858940124511719, "global_step": 67237, "epoch": 400} {"train_loss": -9.194442749023438, "global_step": 67238, "epoch": 400} {"train_loss": -9.18714714050293, "global_step": 67239, "epoch": 400} {"train_loss": -9.138081550598145, "global_step": 67240, "epoch": 400} {"train_loss": -9.07866382598877, "global_step": 67241, "epoch": 400} {"train_loss": -9.107576370239258, "global_step": 67242, "epoch": 400} {"train_loss": -9.026546478271484, "global_step": 67243, "epoch": 400} {"train_loss": -8.753608703613281, "global_step": 67244, "epoch": 400} {"train_loss": -8.986713409423828, "global_step": 67245, "epoch": 400} {"train_loss": -8.893411636352539, "global_step": 67246, "epoch": 400} {"train_loss": -8.828773498535156, "global_step": 67247, "epoch": 400} {"train_loss": -8.973057746887207, "global_step": 67248, "epoch": 400} {"train_loss": -8.78403377532959, "global_step": 67249, "epoch": 400} {"train_loss": -8.779531478881836, "global_step": 67250, "epoch": 400} {"train_loss": -8.914770126342773, "global_step": 67251, "epoch": 400} {"train_loss": -8.730791091918945, "global_step": 67252, "epoch": 400} {"train_loss": -8.90197467803955, "global_step": 67253, "epoch": 400} {"train_loss": -8.844698905944824, "global_step": 67254, "epoch": 400} {"train_loss": -9.140765190124512, "global_step": 67255, "epoch": 400} {"train_loss": -8.883524894714355, "global_step": 67256, "epoch": 400} {"train_loss": -8.846435546875, "global_step": 67257, "epoch": 400} {"train_loss": -8.712836265563965, "global_step": 67258, "epoch": 400} {"train_loss": -9.022037506103516, "global_step": 67259, "epoch": 400} {"train_loss": -8.747690200805664, "global_step": 67260, "epoch": 400} {"train_loss": -9.057496070861816, "global_step": 67261, "epoch": 400} {"train_loss": -8.78317642211914, "global_step": 67262, "epoch": 400} {"train_loss": -9.003328323364258, "global_step": 67263, "epoch": 400} {"train_loss": -8.962228775024414, "global_step": 67264, "epoch": 400} {"train_loss": -8.833060264587402, "global_step": 67265, "epoch": 400} {"train_loss": -8.792760848999023, "global_step": 67266, "epoch": 400} {"train_loss": -8.970904350280762, "global_step": 67267, "epoch": 400} {"train_loss": -8.548728942871094, "global_step": 67268, "epoch": 400} {"train_loss": -8.871606826782227, "global_step": 67269, "epoch": 400} {"train_loss": -8.814596176147461, "global_step": 67270, "epoch": 400} {"train_loss": -9.09233283996582, "global_step": 67271, "epoch": 400} {"train_loss": -8.99675178527832, "global_step": 67272, "epoch": 400} {"train_loss": -8.864677429199219, "global_step": 67273, "epoch": 400} {"train_loss": -9.106453895568848, "global_step": 67274, "epoch": 400} {"train_loss": -8.963132858276367, "global_step": 67275, "epoch": 400} {"train_loss": -9.083183288574219, "global_step": 67276, "epoch": 400} {"train_loss": -8.814620971679688, "global_step": 67277, "epoch": 400} {"train_loss": -8.95211410522461, "global_step": 67278, "epoch": 400} {"train_loss": -8.873202323913574, "global_step": 67279, "epoch": 400} {"train_loss": -8.754117012023926, "global_step": 67280, "epoch": 400} {"train_loss": -8.977239608764648, "global_step": 67281, "epoch": 400} {"train_loss": -9.076129913330078, "global_step": 67282, "epoch": 400} {"train_loss": -8.744059562683105, "global_step": 67283, "epoch": 400} {"train_loss": -8.82864761352539, "global_step": 67284, "epoch": 400} {"train_loss": -8.933073997497559, "global_step": 67285, "epoch": 400} {"train_loss": -8.740218162536621, "global_step": 67286, "epoch": 400} {"train_loss": -8.998998641967773, "global_step": 67287, "epoch": 400} {"train_loss": -9.000739097595215, "global_step": 67288, "epoch": 400} {"train_loss": -8.68223762512207, "global_step": 67289, "epoch": 400} {"train_loss": -9.048314094543457, "global_step": 67290, "epoch": 400} {"train_loss": -8.832868576049805, "global_step": 67291, "epoch": 400} {"train_loss": -8.848365783691406, "global_step": 67292, "epoch": 400} {"train_loss": -8.844423294067383, "global_step": 67293, "epoch": 400} {"train_loss": -8.756271362304688, "global_step": 67294, "epoch": 400} {"train_loss": -9.057628631591797, "global_step": 67295, "epoch": 400} {"train_loss": -9.012895584106445, "global_step": 67296, "epoch": 400} {"train_loss": -8.88652229309082, "global_step": 67297, "epoch": 400} {"train_loss": -8.75, "global_step": 67298, "epoch": 400} {"train_loss": -8.984066009521484, "global_step": 67299, "epoch": 400} {"train_loss": -8.896366119384766, "global_step": 67300, "epoch": 400} {"train_loss": -9.030630111694336, "global_step": 67301, "epoch": 400} {"train_loss": -8.713783264160156, "global_step": 67302, "epoch": 400} {"train_loss": -8.959589958190918, "global_step": 67303, "epoch": 400} {"train_loss": -9.059480667114258, "global_step": 67304, "epoch": 400} {"train_loss": -8.918155670166016, "global_step": 67305, "epoch": 400} {"train_loss": -9.172403335571289, "global_step": 67306, "epoch": 400} {"train_loss": -9.157207489013672, "global_step": 67307, "epoch": 400} {"train_loss": -8.787769317626953, "global_step": 67308, "epoch": 400} {"train_loss": -8.989801406860352, "global_step": 67309, "epoch": 400} {"train_loss": -9.222262382507324, "global_step": 67310, "epoch": 400} {"train_loss": -9.201257705688477, "global_step": 67311, "epoch": 400} {"train_loss": -8.804830551147461, "global_step": 67312, "epoch": 400} {"train_loss": -8.975034713745117, "global_step": 67313, "epoch": 400} {"train_loss": -9.00576114654541, "global_step": 67314, "epoch": 400} {"train_loss": -8.998302459716797, "global_step": 67315, "epoch": 400} {"train_loss": -8.850972175598145, "global_step": 67316, "epoch": 400} {"train_loss": -9.073478698730469, "global_step": 67317, "epoch": 400} {"train_loss": -8.940912246704102, "global_step": 67318, "epoch": 400} {"train_loss": -8.805370330810547, "global_step": 67319, "epoch": 400} {"train_loss": -8.831249237060547, "global_step": 67320, "epoch": 400} {"train_loss": -8.700325012207031, "global_step": 67321, "epoch": 400} {"train_loss": -8.79861068725586, "global_step": 67322, "epoch": 400} {"train_loss": -8.549811363220215, "global_step": 67323, "epoch": 400} {"train_loss": -8.503716468811035, "global_step": 67324, "epoch": 400} {"train_loss": -8.78714370727539, "global_step": 67325, "epoch": 400} {"train_loss": -8.568058013916016, "global_step": 67326, "epoch": 400} {"train_loss": -8.798295974731445, "global_step": 67327, "epoch": 400} {"train_loss": -8.904714584350586, "global_step": 67328, "epoch": 400} {"train_loss": -8.968015670776367, "global_step": 67329, "epoch": 400} {"train_loss": -8.824464797973633, "global_step": 67330, "epoch": 400} {"train_loss": -9.100597381591797, "global_step": 67331, "epoch": 400} {"train_loss": -8.94014835357666, "global_step": 67332, "epoch": 400} {"train_loss": -8.9036865234375, "global_step": 67333, "epoch": 400} {"train_loss": -8.921570777893066, "global_step": 67334, "epoch": 400} {"train_loss": -8.983261108398438, "global_step": 67335, "epoch": 400} {"train_loss": -8.89684009552002, "global_step": 67336, "epoch": 400} {"train_loss": -9.039234161376953, "global_step": 67337, "epoch": 400} {"train_loss": -8.90513801574707, "global_step": 67338, "epoch": 400} {"train_loss": -8.82257080078125, "global_step": 67339, "epoch": 400} {"train_loss": -8.921470642089844, "global_step": 67340, "epoch": 400} {"train_loss": -9.025814056396484, "global_step": 67341, "epoch": 400} {"train_loss": -8.811888694763184, "global_step": 67342, "epoch": 400} {"train_loss": -8.693401336669922, "global_step": 67343, "epoch": 400} {"train_loss": -8.695235252380371, "global_step": 67344, "epoch": 400} {"train_loss": -8.777192115783691, "global_step": 67345, "epoch": 400} {"train_loss": -8.626928329467773, "global_step": 67346, "epoch": 400} {"train_loss": -8.576662063598633, "global_step": 67347, "epoch": 400} {"train_loss": -8.775532722473145, "global_step": 67348, "epoch": 400} {"train_loss": -8.672927856445312, "global_step": 67349, "epoch": 400} {"train_loss": -8.755853652954102, "global_step": 67350, "epoch": 400} {"train_loss": -8.972981452941895, "global_step": 67351, "epoch": 400} {"train_loss": -8.642733573913574, "global_step": 67352, "epoch": 400} {"train_loss": -8.90622329711914, "global_step": 67353, "epoch": 400} {"train_loss": -8.826160430908203, "global_step": 67354, "epoch": 400} {"train_loss": -8.876935958862305, "global_step": 67355, "epoch": 400} {"train_loss": -8.815397262573242, "global_step": 67356, "epoch": 400} {"train_loss": -8.708717346191406, "global_step": 67357, "epoch": 400} {"train_loss": -8.732492446899414, "global_step": 67358, "epoch": 400} {"train_loss": -8.747379302978516, "global_step": 67359, "epoch": 400} {"train_loss": -8.795002937316895, "global_step": 67360, "epoch": 400} {"train_loss": -8.638134002685547, "global_step": 67361, "epoch": 400} {"train_loss": -8.820932388305664, "global_step": 67362, "epoch": 400} {"train_loss": -8.813772201538086, "global_step": 67363, "epoch": 400} {"train_loss": -8.85186767578125, "global_step": 67364, "epoch": 400} {"train_loss": -9.073909759521484, "global_step": 67365, "epoch": 400} {"train_loss": -8.931468963623047, "global_step": 67366, "epoch": 400} {"train_loss": -8.885007898012796, "global_step": 67367, "epoch": 400, "train/sim_max_reward_0": 0.549043187847988, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.026012284790977662, "train/sim_max_reward_3": 0.6881352510253899, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.5516081429451095, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.3528240822052638, "test/sim_max_reward_4400002": 0.08977809982794174, "test/sim_max_reward_4400003": 0.5200881602925447, "test/sim_max_reward_4400004": 0.4062603461017144, "test/sim_max_reward_4400005": 0.548009300353651, "test/sim_max_reward_4400006": 0.8280703931517643, "test/sim_max_reward_4400007": 0.9658395005384554, "test/sim_max_reward_4400008": 0.7229473989299738, "test/sim_max_reward_4400009": 0.3822575014477728, "test/sim_max_reward_4400010": 0.2207113095227116, "test/sim_max_reward_4400011": 0.6604976948411783, "test/sim_max_reward_4400012": 0.9863583097815395, "test/sim_max_reward_4400013": 0.9751061363349628, "test/sim_max_reward_4400014": 0.7057733895322712, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.925212635204185, "test/sim_max_reward_4400019": 0.49362320629763035, "test/sim_max_reward_4400020": 0.0005987464230124357, "test/sim_max_reward_4400021": 0.9343610931054537, "test/sim_max_reward_4400022": 0.9570376094750292, "test/sim_max_reward_4400023": 0.9943180781336746, "test/sim_max_reward_4400024": 0.2914484975534042, "test/sim_max_reward_4400025": 0.6634986495103987, "test/sim_max_reward_4400026": 1.0, "test/sim_max_reward_4400027": 1.0, "test/sim_max_reward_4400028": 0.7084326939910154, "test/sim_max_reward_4400029": 0.506424584878618, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.4455159008348304, "test/sim_max_reward_4400033": 0.16284511024006476, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.5260543057931523, "test/sim_max_reward_4400036": 0.36726506465425995, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.9474985824132979, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.2610864072764229, "test/sim_max_reward_4400041": 0.19471550777975535, "test/sim_max_reward_4400042": 0.022269911980947153, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.4196240795304258, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6357998111015775, "test/mean_score": 0.591957930523701, "val_loss": 189445.609375, "train_action_mse_error": 4.323156356811523} {"train_loss": -9.122438430786133, "global_step": 67368, "epoch": 401} {"train_loss": -8.978815078735352, "global_step": 67369, "epoch": 401} {"train_loss": -9.027469635009766, "global_step": 67370, "epoch": 401} {"train_loss": -9.099261283874512, "global_step": 67371, "epoch": 401} {"train_loss": -8.882915496826172, "global_step": 67372, "epoch": 401} {"train_loss": -8.69301986694336, "global_step": 67373, "epoch": 401} {"train_loss": -9.105987548828125, "global_step": 67374, "epoch": 401} {"train_loss": -8.677312850952148, "global_step": 67375, "epoch": 401} {"train_loss": -8.744725227355957, "global_step": 67376, "epoch": 401} {"train_loss": -9.100534439086914, "global_step": 67377, "epoch": 401} {"train_loss": -8.63176155090332, "global_step": 67378, "epoch": 401} {"train_loss": -8.892117500305176, "global_step": 67379, "epoch": 401} {"train_loss": -8.896515846252441, "global_step": 67380, "epoch": 401} {"train_loss": -8.67719841003418, "global_step": 67381, "epoch": 401} {"train_loss": -8.914813041687012, "global_step": 67382, "epoch": 401} {"train_loss": -8.755759239196777, "global_step": 67383, "epoch": 401} {"train_loss": -8.508171081542969, "global_step": 67384, "epoch": 401} {"train_loss": -8.788032531738281, "global_step": 67385, "epoch": 401} {"train_loss": -8.826133728027344, "global_step": 67386, "epoch": 401} {"train_loss": -8.785776138305664, "global_step": 67387, "epoch": 401} {"train_loss": -8.68093204498291, "global_step": 67388, "epoch": 401} {"train_loss": -8.824172973632812, "global_step": 67389, "epoch": 401} {"train_loss": -8.365741729736328, "global_step": 67390, "epoch": 401} {"train_loss": -8.804563522338867, "global_step": 67391, "epoch": 401} {"train_loss": -8.689220428466797, "global_step": 67392, "epoch": 401} {"train_loss": -8.725536346435547, "global_step": 67393, "epoch": 401} {"train_loss": -8.669819831848145, "global_step": 67394, "epoch": 401} {"train_loss": -8.741106033325195, "global_step": 67395, "epoch": 401} {"train_loss": -8.535616874694824, "global_step": 67396, "epoch": 401} {"train_loss": -8.410917282104492, "global_step": 67397, "epoch": 401} {"train_loss": -8.547486305236816, "global_step": 67398, "epoch": 401} {"train_loss": -8.53567123413086, "global_step": 67399, "epoch": 401} {"train_loss": -8.606409072875977, "global_step": 67400, "epoch": 401} {"train_loss": -8.822986602783203, "global_step": 67401, "epoch": 401} {"train_loss": -8.816072463989258, "global_step": 67402, "epoch": 401} {"train_loss": -8.702375411987305, "global_step": 67403, "epoch": 401} {"train_loss": -8.791861534118652, "global_step": 67404, "epoch": 401} {"train_loss": -8.92072868347168, "global_step": 67405, "epoch": 401} {"train_loss": -8.651134490966797, "global_step": 67406, "epoch": 401} {"train_loss": -8.956123352050781, "global_step": 67407, "epoch": 401} {"train_loss": -8.788900375366211, "global_step": 67408, "epoch": 401} {"train_loss": -8.694809913635254, "global_step": 67409, "epoch": 401} {"train_loss": -9.057920455932617, "global_step": 67410, "epoch": 401} {"train_loss": -8.619173049926758, "global_step": 67411, "epoch": 401} {"train_loss": -8.806961059570312, "global_step": 67412, "epoch": 401} {"train_loss": -8.76289176940918, "global_step": 67413, "epoch": 401} {"train_loss": -8.906595230102539, "global_step": 67414, "epoch": 401} {"train_loss": -8.808855056762695, "global_step": 67415, "epoch": 401} {"train_loss": -8.8226957321167, "global_step": 67416, "epoch": 401} {"train_loss": -8.791128158569336, "global_step": 67417, "epoch": 401} {"train_loss": -8.94284439086914, "global_step": 67418, "epoch": 401} {"train_loss": -9.131631851196289, "global_step": 67419, "epoch": 401} {"train_loss": -8.974126815795898, "global_step": 67420, "epoch": 401} {"train_loss": -9.10580062866211, "global_step": 67421, "epoch": 401} {"train_loss": -8.524883270263672, "global_step": 67422, "epoch": 401} {"train_loss": -8.810497283935547, "global_step": 67423, "epoch": 401} {"train_loss": -8.653267860412598, "global_step": 67424, "epoch": 401} {"train_loss": -8.581491470336914, "global_step": 67425, "epoch": 401} {"train_loss": -8.99397087097168, "global_step": 67426, "epoch": 401} {"train_loss": -8.626277923583984, "global_step": 67427, "epoch": 401} {"train_loss": -9.197805404663086, "global_step": 67428, "epoch": 401} {"train_loss": -8.7911376953125, "global_step": 67429, "epoch": 401} {"train_loss": -8.796284675598145, "global_step": 67430, "epoch": 401} {"train_loss": -8.929431915283203, "global_step": 67431, "epoch": 401} {"train_loss": -8.765830039978027, "global_step": 67432, "epoch": 401} {"train_loss": -8.819299697875977, "global_step": 67433, "epoch": 401} {"train_loss": -8.964256286621094, "global_step": 67434, "epoch": 401} {"train_loss": -8.940706253051758, "global_step": 67435, "epoch": 401} {"train_loss": -8.886445999145508, "global_step": 67436, "epoch": 401} {"train_loss": -8.936761856079102, "global_step": 67437, "epoch": 401} {"train_loss": -8.397266387939453, "global_step": 67438, "epoch": 401} {"train_loss": -8.559253692626953, "global_step": 67439, "epoch": 401} {"train_loss": -8.725362777709961, "global_step": 67440, "epoch": 401} {"train_loss": -8.292545318603516, "global_step": 67441, "epoch": 401} {"train_loss": -8.48676872253418, "global_step": 67442, "epoch": 401} {"train_loss": -8.572135925292969, "global_step": 67443, "epoch": 401} {"train_loss": -8.453454971313477, "global_step": 67444, "epoch": 401} {"train_loss": -8.338475227355957, "global_step": 67445, "epoch": 401} {"train_loss": -8.931679725646973, "global_step": 67446, "epoch": 401} {"train_loss": -8.613456726074219, "global_step": 67447, "epoch": 401} {"train_loss": -8.15728759765625, "global_step": 67448, "epoch": 401} {"train_loss": -8.563669204711914, "global_step": 67449, "epoch": 401} {"train_loss": -8.716754913330078, "global_step": 67450, "epoch": 401} {"train_loss": -8.32516098022461, "global_step": 67451, "epoch": 401} {"train_loss": -8.433422088623047, "global_step": 67452, "epoch": 401} {"train_loss": -8.658567428588867, "global_step": 67453, "epoch": 401} {"train_loss": -8.390142440795898, "global_step": 67454, "epoch": 401} {"train_loss": -8.399173736572266, "global_step": 67455, "epoch": 401} {"train_loss": -8.685136795043945, "global_step": 67456, "epoch": 401} {"train_loss": -8.755884170532227, "global_step": 67457, "epoch": 401} {"train_loss": -8.626548767089844, "global_step": 67458, "epoch": 401} {"train_loss": -8.350242614746094, "global_step": 67459, "epoch": 401} {"train_loss": -8.59933853149414, "global_step": 67460, "epoch": 401} {"train_loss": -8.832141876220703, "global_step": 67461, "epoch": 401} {"train_loss": -8.438611030578613, "global_step": 67462, "epoch": 401} {"train_loss": -8.747116088867188, "global_step": 67463, "epoch": 401} {"train_loss": -8.590967178344727, "global_step": 67464, "epoch": 401} {"train_loss": -8.932483673095703, "global_step": 67465, "epoch": 401} {"train_loss": -8.931642532348633, "global_step": 67466, "epoch": 401} {"train_loss": -8.62858772277832, "global_step": 67467, "epoch": 401} {"train_loss": -8.727031707763672, "global_step": 67468, "epoch": 401} {"train_loss": -8.809856414794922, "global_step": 67469, "epoch": 401} {"train_loss": -8.74413013458252, "global_step": 67470, "epoch": 401} {"train_loss": -8.742027282714844, "global_step": 67471, "epoch": 401} {"train_loss": -8.823478698730469, "global_step": 67472, "epoch": 401} {"train_loss": -9.177350997924805, "global_step": 67473, "epoch": 401} {"train_loss": -8.628925323486328, "global_step": 67474, "epoch": 401} {"train_loss": -8.740950584411621, "global_step": 67475, "epoch": 401} {"train_loss": -8.636821746826172, "global_step": 67476, "epoch": 401} {"train_loss": -8.868483543395996, "global_step": 67477, "epoch": 401} {"train_loss": -8.61888599395752, "global_step": 67478, "epoch": 401} {"train_loss": -8.885644912719727, "global_step": 67479, "epoch": 401} {"train_loss": -8.854068756103516, "global_step": 67480, "epoch": 401} {"train_loss": -9.03342056274414, "global_step": 67481, "epoch": 401} {"train_loss": -8.880682945251465, "global_step": 67482, "epoch": 401} {"train_loss": -9.051273345947266, "global_step": 67483, "epoch": 401} {"train_loss": -9.167884826660156, "global_step": 67484, "epoch": 401} {"train_loss": -8.972599029541016, "global_step": 67485, "epoch": 401} {"train_loss": -9.082426071166992, "global_step": 67486, "epoch": 401} {"train_loss": -9.02735710144043, "global_step": 67487, "epoch": 401} {"train_loss": -8.918741226196289, "global_step": 67488, "epoch": 401} {"train_loss": -9.040050506591797, "global_step": 67489, "epoch": 401} {"train_loss": -8.85814094543457, "global_step": 67490, "epoch": 401} {"train_loss": -9.28521728515625, "global_step": 67491, "epoch": 401} {"train_loss": -8.94807243347168, "global_step": 67492, "epoch": 401} {"train_loss": -9.108805656433105, "global_step": 67493, "epoch": 401} {"train_loss": -8.940999031066895, "global_step": 67494, "epoch": 401} {"train_loss": -8.585567474365234, "global_step": 67495, "epoch": 401} {"train_loss": -8.743995666503906, "global_step": 67496, "epoch": 401} {"train_loss": -8.849483489990234, "global_step": 67497, "epoch": 401} {"train_loss": -8.655097961425781, "global_step": 67498, "epoch": 401} {"train_loss": -8.875024795532227, "global_step": 67499, "epoch": 401} {"train_loss": -8.505770683288574, "global_step": 67500, "epoch": 401} {"train_loss": -8.509054183959961, "global_step": 67501, "epoch": 401} {"train_loss": -8.36550235748291, "global_step": 67502, "epoch": 401} {"train_loss": -8.508859634399414, "global_step": 67503, "epoch": 401} {"train_loss": -8.57729721069336, "global_step": 67504, "epoch": 401} {"train_loss": -8.587556838989258, "global_step": 67505, "epoch": 401} {"train_loss": -8.86893081665039, "global_step": 67506, "epoch": 401} {"train_loss": -8.655633926391602, "global_step": 67507, "epoch": 401} {"train_loss": -8.851762771606445, "global_step": 67508, "epoch": 401} {"train_loss": -8.586403846740723, "global_step": 67509, "epoch": 401} {"train_loss": -8.684504508972168, "global_step": 67510, "epoch": 401} {"train_loss": -8.613306045532227, "global_step": 67511, "epoch": 401} {"train_loss": -8.493182182312012, "global_step": 67512, "epoch": 401} {"train_loss": -8.859712600708008, "global_step": 67513, "epoch": 401} {"train_loss": -8.456945419311523, "global_step": 67514, "epoch": 401} {"train_loss": -8.806083679199219, "global_step": 67515, "epoch": 401} {"train_loss": -8.52589225769043, "global_step": 67516, "epoch": 401} {"train_loss": -8.61622428894043, "global_step": 67517, "epoch": 401} {"train_loss": -8.734861373901367, "global_step": 67518, "epoch": 401} {"train_loss": -8.618232727050781, "global_step": 67519, "epoch": 401} {"train_loss": -8.748255729675293, "global_step": 67520, "epoch": 401} {"train_loss": -8.703194618225098, "global_step": 67521, "epoch": 401} {"train_loss": -8.80410385131836, "global_step": 67522, "epoch": 401} {"train_loss": -8.975951194763184, "global_step": 67523, "epoch": 401} {"train_loss": -8.722994804382324, "global_step": 67524, "epoch": 401} {"train_loss": -8.782852172851562, "global_step": 67525, "epoch": 401} {"train_loss": -8.81555461883545, "global_step": 67526, "epoch": 401} {"train_loss": -8.84793472290039, "global_step": 67527, "epoch": 401} {"train_loss": -8.635346412658691, "global_step": 67528, "epoch": 401} {"train_loss": -9.118692398071289, "global_step": 67529, "epoch": 401} {"train_loss": -8.561677932739258, "global_step": 67530, "epoch": 401} {"train_loss": -8.848692893981934, "global_step": 67531, "epoch": 401} {"train_loss": -8.774555206298828, "global_step": 67532, "epoch": 401} {"train_loss": -8.672891616821289, "global_step": 67533, "epoch": 401} {"train_loss": -8.9530029296875, "global_step": 67534, "epoch": 401} {"train_loss": -8.755125108219328, "global_step": 67535, "epoch": 401, "val_loss": 192429.09375} {"train_loss": -8.949382781982422, "global_step": 67536, "epoch": 402} {"train_loss": -8.531824111938477, "global_step": 67537, "epoch": 402} {"train_loss": -8.768528938293457, "global_step": 67538, "epoch": 402} {"train_loss": -8.50753402709961, "global_step": 67539, "epoch": 402} {"train_loss": -8.54301643371582, "global_step": 67540, "epoch": 402} {"train_loss": -8.576339721679688, "global_step": 67541, "epoch": 402} {"train_loss": -8.726637840270996, "global_step": 67542, "epoch": 402} {"train_loss": -8.640119552612305, "global_step": 67543, "epoch": 402} {"train_loss": -8.763781547546387, "global_step": 67544, "epoch": 402} {"train_loss": -8.655710220336914, "global_step": 67545, "epoch": 402} {"train_loss": -8.55909538269043, "global_step": 67546, "epoch": 402} {"train_loss": -8.426580429077148, "global_step": 67547, "epoch": 402} {"train_loss": -8.707478523254395, "global_step": 67548, "epoch": 402} {"train_loss": -8.77531909942627, "global_step": 67549, "epoch": 402} {"train_loss": -8.706171989440918, "global_step": 67550, "epoch": 402} {"train_loss": -8.568041801452637, "global_step": 67551, "epoch": 402} {"train_loss": -8.88502025604248, "global_step": 67552, "epoch": 402} {"train_loss": -8.867773056030273, "global_step": 67553, "epoch": 402} {"train_loss": -8.784778594970703, "global_step": 67554, "epoch": 402} {"train_loss": -8.995916366577148, "global_step": 67555, "epoch": 402} {"train_loss": -9.035780906677246, "global_step": 67556, "epoch": 402} {"train_loss": -8.808505058288574, "global_step": 67557, "epoch": 402} {"train_loss": -8.831438064575195, "global_step": 67558, "epoch": 402} {"train_loss": -8.926332473754883, "global_step": 67559, "epoch": 402} {"train_loss": -9.021331787109375, "global_step": 67560, "epoch": 402} {"train_loss": -8.766271591186523, "global_step": 67561, "epoch": 402} {"train_loss": -8.962640762329102, "global_step": 67562, "epoch": 402} {"train_loss": -9.053262710571289, "global_step": 67563, "epoch": 402} {"train_loss": -8.868552207946777, "global_step": 67564, "epoch": 402} {"train_loss": -8.979757308959961, "global_step": 67565, "epoch": 402} {"train_loss": -8.99952220916748, "global_step": 67566, "epoch": 402} {"train_loss": -8.866447448730469, "global_step": 67567, "epoch": 402} {"train_loss": -8.814403533935547, "global_step": 67568, "epoch": 402} {"train_loss": -8.979644775390625, "global_step": 67569, "epoch": 402} {"train_loss": -9.026115417480469, "global_step": 67570, "epoch": 402} {"train_loss": -8.852546691894531, "global_step": 67571, "epoch": 402} {"train_loss": -9.112451553344727, "global_step": 67572, "epoch": 402} {"train_loss": -9.09122085571289, "global_step": 67573, "epoch": 402} {"train_loss": -8.782451629638672, "global_step": 67574, "epoch": 402} {"train_loss": -8.819816589355469, "global_step": 67575, "epoch": 402} {"train_loss": -9.015130996704102, "global_step": 67576, "epoch": 402} {"train_loss": -8.848649978637695, "global_step": 67577, "epoch": 402} {"train_loss": -9.10377311706543, "global_step": 67578, "epoch": 402} {"train_loss": -8.785326957702637, "global_step": 67579, "epoch": 402} {"train_loss": -9.088248252868652, "global_step": 67580, "epoch": 402} {"train_loss": -8.66551399230957, "global_step": 67581, "epoch": 402} {"train_loss": -8.944839477539062, "global_step": 67582, "epoch": 402} {"train_loss": -8.455825805664062, "global_step": 67583, "epoch": 402} {"train_loss": -8.95461654663086, "global_step": 67584, "epoch": 402} {"train_loss": -8.658191680908203, "global_step": 67585, "epoch": 402} {"train_loss": -8.721607208251953, "global_step": 67586, "epoch": 402} {"train_loss": -8.596614837646484, "global_step": 67587, "epoch": 402} {"train_loss": -8.536903381347656, "global_step": 67588, "epoch": 402} {"train_loss": -8.487092971801758, "global_step": 67589, "epoch": 402} {"train_loss": -8.448382377624512, "global_step": 67590, "epoch": 402} {"train_loss": -8.561885833740234, "global_step": 67591, "epoch": 402} {"train_loss": -7.96041202545166, "global_step": 67592, "epoch": 402} {"train_loss": -8.582876205444336, "global_step": 67593, "epoch": 402} {"train_loss": -8.253032684326172, "global_step": 67594, "epoch": 402} {"train_loss": -8.236161231994629, "global_step": 67595, "epoch": 402} {"train_loss": -8.527898788452148, "global_step": 67596, "epoch": 402} {"train_loss": -8.709444999694824, "global_step": 67597, "epoch": 402} {"train_loss": -8.32807731628418, "global_step": 67598, "epoch": 402} {"train_loss": -8.647225379943848, "global_step": 67599, "epoch": 402} {"train_loss": -8.647993087768555, "global_step": 67600, "epoch": 402} {"train_loss": -8.827661514282227, "global_step": 67601, "epoch": 402} {"train_loss": -8.822395324707031, "global_step": 67602, "epoch": 402} {"train_loss": -8.611135482788086, "global_step": 67603, "epoch": 402} {"train_loss": -8.799566268920898, "global_step": 67604, "epoch": 402} {"train_loss": -8.817683219909668, "global_step": 67605, "epoch": 402} {"train_loss": -8.855768203735352, "global_step": 67606, "epoch": 402} {"train_loss": -8.644057273864746, "global_step": 67607, "epoch": 402} {"train_loss": -8.940591812133789, "global_step": 67608, "epoch": 402} {"train_loss": -8.826824188232422, "global_step": 67609, "epoch": 402} {"train_loss": -8.658015251159668, "global_step": 67610, "epoch": 402} {"train_loss": -8.828604698181152, "global_step": 67611, "epoch": 402} {"train_loss": -8.957939147949219, "global_step": 67612, "epoch": 402} {"train_loss": -8.828624725341797, "global_step": 67613, "epoch": 402} {"train_loss": -8.811187744140625, "global_step": 67614, "epoch": 402} {"train_loss": -9.065462112426758, "global_step": 67615, "epoch": 402} {"train_loss": -8.956241607666016, "global_step": 67616, "epoch": 402} {"train_loss": -9.071897506713867, "global_step": 67617, "epoch": 402} {"train_loss": -9.036113739013672, "global_step": 67618, "epoch": 402} {"train_loss": -9.170392990112305, "global_step": 67619, "epoch": 402} {"train_loss": -8.96153450012207, "global_step": 67620, "epoch": 402} {"train_loss": -8.954639434814453, "global_step": 67621, "epoch": 402} {"train_loss": -9.124970436096191, "global_step": 67622, "epoch": 402} {"train_loss": -9.034109115600586, "global_step": 67623, "epoch": 402} {"train_loss": -8.973356246948242, "global_step": 67624, "epoch": 402} {"train_loss": -9.296843528747559, "global_step": 67625, "epoch": 402} {"train_loss": -9.115047454833984, "global_step": 67626, "epoch": 402} {"train_loss": -8.983400344848633, "global_step": 67627, "epoch": 402} {"train_loss": -8.98867416381836, "global_step": 67628, "epoch": 402} {"train_loss": -8.913800239562988, "global_step": 67629, "epoch": 402} {"train_loss": -8.735044479370117, "global_step": 67630, "epoch": 402} {"train_loss": -8.962703704833984, "global_step": 67631, "epoch": 402} {"train_loss": -8.657554626464844, "global_step": 67632, "epoch": 402} {"train_loss": -9.009712219238281, "global_step": 67633, "epoch": 402} {"train_loss": -8.648298263549805, "global_step": 67634, "epoch": 402} {"train_loss": -8.65986442565918, "global_step": 67635, "epoch": 402} {"train_loss": -8.48448371887207, "global_step": 67636, "epoch": 402} {"train_loss": -8.72467041015625, "global_step": 67637, "epoch": 402} {"train_loss": -8.550213813781738, "global_step": 67638, "epoch": 402} {"train_loss": -8.941137313842773, "global_step": 67639, "epoch": 402} {"train_loss": -8.903678894042969, "global_step": 67640, "epoch": 402} {"train_loss": -8.597139358520508, "global_step": 67641, "epoch": 402} {"train_loss": -8.882009506225586, "global_step": 67642, "epoch": 402} {"train_loss": -8.743843078613281, "global_step": 67643, "epoch": 402} {"train_loss": -8.818441390991211, "global_step": 67644, "epoch": 402} {"train_loss": -8.783080101013184, "global_step": 67645, "epoch": 402} {"train_loss": -8.614384651184082, "global_step": 67646, "epoch": 402} {"train_loss": -8.650463104248047, "global_step": 67647, "epoch": 402} {"train_loss": -8.993087768554688, "global_step": 67648, "epoch": 402} {"train_loss": -8.918654441833496, "global_step": 67649, "epoch": 402} {"train_loss": -8.969758987426758, "global_step": 67650, "epoch": 402} {"train_loss": -8.597139358520508, "global_step": 67651, "epoch": 402} {"train_loss": -8.472747802734375, "global_step": 67652, "epoch": 402} {"train_loss": -8.541077613830566, "global_step": 67653, "epoch": 402} {"train_loss": -8.82954216003418, "global_step": 67654, "epoch": 402} {"train_loss": -8.769139289855957, "global_step": 67655, "epoch": 402} {"train_loss": -8.797621726989746, "global_step": 67656, "epoch": 402} {"train_loss": -8.639886856079102, "global_step": 67657, "epoch": 402} {"train_loss": -8.830489158630371, "global_step": 67658, "epoch": 402} {"train_loss": -8.925166130065918, "global_step": 67659, "epoch": 402} {"train_loss": -8.749227523803711, "global_step": 67660, "epoch": 402} {"train_loss": -8.807269096374512, "global_step": 67661, "epoch": 402} {"train_loss": -8.941543579101562, "global_step": 67662, "epoch": 402} {"train_loss": -8.632989883422852, "global_step": 67663, "epoch": 402} {"train_loss": -8.799932479858398, "global_step": 67664, "epoch": 402} {"train_loss": -8.881912231445312, "global_step": 67665, "epoch": 402} {"train_loss": -8.963888168334961, "global_step": 67666, "epoch": 402} {"train_loss": -8.966407775878906, "global_step": 67667, "epoch": 402} {"train_loss": -8.773941993713379, "global_step": 67668, "epoch": 402} {"train_loss": -8.943227767944336, "global_step": 67669, "epoch": 402} {"train_loss": -8.831415176391602, "global_step": 67670, "epoch": 402} {"train_loss": -8.98791217803955, "global_step": 67671, "epoch": 402} {"train_loss": -8.923471450805664, "global_step": 67672, "epoch": 402} {"train_loss": -9.069185256958008, "global_step": 67673, "epoch": 402} {"train_loss": -8.983509063720703, "global_step": 67674, "epoch": 402} {"train_loss": -8.93452262878418, "global_step": 67675, "epoch": 402} {"train_loss": -8.732162475585938, "global_step": 67676, "epoch": 402} {"train_loss": -9.197704315185547, "global_step": 67677, "epoch": 402} {"train_loss": -8.769161224365234, "global_step": 67678, "epoch": 402} {"train_loss": -8.758607864379883, "global_step": 67679, "epoch": 402} {"train_loss": -8.672647476196289, "global_step": 67680, "epoch": 402} {"train_loss": -8.942928314208984, "global_step": 67681, "epoch": 402} {"train_loss": -8.978779792785645, "global_step": 67682, "epoch": 402} {"train_loss": -9.004133224487305, "global_step": 67683, "epoch": 402} {"train_loss": -8.829109191894531, "global_step": 67684, "epoch": 402} {"train_loss": -8.954530715942383, "global_step": 67685, "epoch": 402} {"train_loss": -8.904901504516602, "global_step": 67686, "epoch": 402} {"train_loss": -9.078542709350586, "global_step": 67687, "epoch": 402} {"train_loss": -8.959985733032227, "global_step": 67688, "epoch": 402} {"train_loss": -8.683340072631836, "global_step": 67689, "epoch": 402} {"train_loss": -8.837340354919434, "global_step": 67690, "epoch": 402} {"train_loss": -8.706937789916992, "global_step": 67691, "epoch": 402} {"train_loss": -8.520788192749023, "global_step": 67692, "epoch": 402} {"train_loss": -8.84672737121582, "global_step": 67693, "epoch": 402} {"train_loss": -8.44741153717041, "global_step": 67694, "epoch": 402} {"train_loss": -8.314584732055664, "global_step": 67695, "epoch": 402} {"train_loss": -8.558801651000977, "global_step": 67696, "epoch": 402} {"train_loss": -8.256668090820312, "global_step": 67697, "epoch": 402} {"train_loss": -8.952096939086914, "global_step": 67698, "epoch": 402} {"train_loss": -8.341818809509277, "global_step": 67699, "epoch": 402} {"train_loss": -8.628711700439453, "global_step": 67700, "epoch": 402} {"train_loss": -8.342778205871582, "global_step": 67701, "epoch": 402} {"train_loss": -8.26175594329834, "global_step": 67702, "epoch": 402} {"train_loss": -8.786640859785534, "global_step": 67703, "epoch": 402, "val_loss": 190714.828125} {"train_loss": -8.125921249389648, "global_step": 67704, "epoch": 403} {"train_loss": -8.070159912109375, "global_step": 67705, "epoch": 403} {"train_loss": -7.880363464355469, "global_step": 67706, "epoch": 403} {"train_loss": -8.544196128845215, "global_step": 67707, "epoch": 403} {"train_loss": -8.206270217895508, "global_step": 67708, "epoch": 403} {"train_loss": -8.282508850097656, "global_step": 67709, "epoch": 403} {"train_loss": -8.570952415466309, "global_step": 67710, "epoch": 403} {"train_loss": -8.378604888916016, "global_step": 67711, "epoch": 403} {"train_loss": -8.495360374450684, "global_step": 67712, "epoch": 403} {"train_loss": -8.426539421081543, "global_step": 67713, "epoch": 403} {"train_loss": -8.35911750793457, "global_step": 67714, "epoch": 403} {"train_loss": -8.52587890625, "global_step": 67715, "epoch": 403} {"train_loss": -8.466830253601074, "global_step": 67716, "epoch": 403} {"train_loss": -8.629398345947266, "global_step": 67717, "epoch": 403} {"train_loss": -8.494328498840332, "global_step": 67718, "epoch": 403} {"train_loss": -8.620824813842773, "global_step": 67719, "epoch": 403} {"train_loss": -8.512779235839844, "global_step": 67720, "epoch": 403} {"train_loss": -8.471755027770996, "global_step": 67721, "epoch": 403} {"train_loss": -8.577705383300781, "global_step": 67722, "epoch": 403} {"train_loss": -8.535938262939453, "global_step": 67723, "epoch": 403} {"train_loss": -8.671341896057129, "global_step": 67724, "epoch": 403} {"train_loss": -8.846059799194336, "global_step": 67725, "epoch": 403} {"train_loss": -8.814239501953125, "global_step": 67726, "epoch": 403} {"train_loss": -8.729875564575195, "global_step": 67727, "epoch": 403} {"train_loss": -8.804730415344238, "global_step": 67728, "epoch": 403} {"train_loss": -8.760576248168945, "global_step": 67729, "epoch": 403} {"train_loss": -8.82995891571045, "global_step": 67730, "epoch": 403} {"train_loss": -8.884788513183594, "global_step": 67731, "epoch": 403} {"train_loss": -8.982155799865723, "global_step": 67732, "epoch": 403} {"train_loss": -8.833135604858398, "global_step": 67733, "epoch": 403} {"train_loss": -8.908928871154785, "global_step": 67734, "epoch": 403} {"train_loss": -8.845282554626465, "global_step": 67735, "epoch": 403} {"train_loss": -8.823304176330566, "global_step": 67736, "epoch": 403} {"train_loss": -8.910544395446777, "global_step": 67737, "epoch": 403} {"train_loss": -8.815152168273926, "global_step": 67738, "epoch": 403} {"train_loss": -9.006057739257812, "global_step": 67739, "epoch": 403} {"train_loss": -9.023621559143066, "global_step": 67740, "epoch": 403} {"train_loss": -8.907434463500977, "global_step": 67741, "epoch": 403} {"train_loss": -8.8930025100708, "global_step": 67742, "epoch": 403} {"train_loss": -9.070219993591309, "global_step": 67743, "epoch": 403} {"train_loss": -9.020824432373047, "global_step": 67744, "epoch": 403} {"train_loss": -9.008622169494629, "global_step": 67745, "epoch": 403} {"train_loss": -9.18221664428711, "global_step": 67746, "epoch": 403} {"train_loss": -9.115209579467773, "global_step": 67747, "epoch": 403} {"train_loss": -9.034523010253906, "global_step": 67748, "epoch": 403} {"train_loss": -8.751376152038574, "global_step": 67749, "epoch": 403} {"train_loss": -8.981306076049805, "global_step": 67750, "epoch": 403} {"train_loss": -8.92283821105957, "global_step": 67751, "epoch": 403} {"train_loss": -8.654027938842773, "global_step": 67752, "epoch": 403} {"train_loss": -8.870628356933594, "global_step": 67753, "epoch": 403} {"train_loss": -8.398776054382324, "global_step": 67754, "epoch": 403} {"train_loss": -8.728443145751953, "global_step": 67755, "epoch": 403} {"train_loss": -8.747261047363281, "global_step": 67756, "epoch": 403} {"train_loss": -8.538716316223145, "global_step": 67757, "epoch": 403} {"train_loss": -9.068766593933105, "global_step": 67758, "epoch": 403} {"train_loss": -8.524293899536133, "global_step": 67759, "epoch": 403} {"train_loss": -8.764469146728516, "global_step": 67760, "epoch": 403} {"train_loss": -8.423328399658203, "global_step": 67761, "epoch": 403} {"train_loss": -8.624261856079102, "global_step": 67762, "epoch": 403} {"train_loss": -8.906612396240234, "global_step": 67763, "epoch": 403} {"train_loss": -8.91590404510498, "global_step": 67764, "epoch": 403} {"train_loss": -8.569602012634277, "global_step": 67765, "epoch": 403} {"train_loss": -8.5575590133667, "global_step": 67766, "epoch": 403} {"train_loss": -8.952865600585938, "global_step": 67767, "epoch": 403} {"train_loss": -8.461237907409668, "global_step": 67768, "epoch": 403} {"train_loss": -8.658512115478516, "global_step": 67769, "epoch": 403} {"train_loss": -8.84237289428711, "global_step": 67770, "epoch": 403} {"train_loss": -8.774548530578613, "global_step": 67771, "epoch": 403} {"train_loss": -8.734354972839355, "global_step": 67772, "epoch": 403} {"train_loss": -8.676752090454102, "global_step": 67773, "epoch": 403} {"train_loss": -8.789989471435547, "global_step": 67774, "epoch": 403} {"train_loss": -8.56049633026123, "global_step": 67775, "epoch": 403} {"train_loss": -8.897832870483398, "global_step": 67776, "epoch": 403} {"train_loss": -8.38983154296875, "global_step": 67777, "epoch": 403} {"train_loss": -8.695783615112305, "global_step": 67778, "epoch": 403} {"train_loss": -9.075246810913086, "global_step": 67779, "epoch": 403} {"train_loss": -8.611661911010742, "global_step": 67780, "epoch": 403} {"train_loss": -8.731983184814453, "global_step": 67781, "epoch": 403} {"train_loss": -8.648798942565918, "global_step": 67782, "epoch": 403} {"train_loss": -8.792070388793945, "global_step": 67783, "epoch": 403} {"train_loss": -8.533279418945312, "global_step": 67784, "epoch": 403} {"train_loss": -8.817014694213867, "global_step": 67785, "epoch": 403} {"train_loss": -8.750497817993164, "global_step": 67786, "epoch": 403} {"train_loss": -8.575475692749023, "global_step": 67787, "epoch": 403} {"train_loss": -8.717822074890137, "global_step": 67788, "epoch": 403} {"train_loss": -8.73909854888916, "global_step": 67789, "epoch": 403} {"train_loss": -8.827888488769531, "global_step": 67790, "epoch": 403} {"train_loss": -8.985042572021484, "global_step": 67791, "epoch": 403} {"train_loss": -8.640406608581543, "global_step": 67792, "epoch": 403} {"train_loss": -8.967503547668457, "global_step": 67793, "epoch": 403} {"train_loss": -8.853683471679688, "global_step": 67794, "epoch": 403} {"train_loss": -8.850659370422363, "global_step": 67795, "epoch": 403} {"train_loss": -8.965149879455566, "global_step": 67796, "epoch": 403} {"train_loss": -8.796491622924805, "global_step": 67797, "epoch": 403} {"train_loss": -8.825592041015625, "global_step": 67798, "epoch": 403} {"train_loss": -8.972027778625488, "global_step": 67799, "epoch": 403} {"train_loss": -8.711076736450195, "global_step": 67800, "epoch": 403} {"train_loss": -8.891160011291504, "global_step": 67801, "epoch": 403} {"train_loss": -8.980182647705078, "global_step": 67802, "epoch": 403} {"train_loss": -8.989286422729492, "global_step": 67803, "epoch": 403} {"train_loss": -9.072031021118164, "global_step": 67804, "epoch": 403} {"train_loss": -9.161903381347656, "global_step": 67805, "epoch": 403} {"train_loss": -9.15573501586914, "global_step": 67806, "epoch": 403} {"train_loss": -8.797126770019531, "global_step": 67807, "epoch": 403} {"train_loss": -9.009753227233887, "global_step": 67808, "epoch": 403} {"train_loss": -9.11832046508789, "global_step": 67809, "epoch": 403} {"train_loss": -9.152585983276367, "global_step": 67810, "epoch": 403} {"train_loss": -9.097099304199219, "global_step": 67811, "epoch": 403} {"train_loss": -8.894285202026367, "global_step": 67812, "epoch": 403} {"train_loss": -8.893657684326172, "global_step": 67813, "epoch": 403} {"train_loss": -8.696416854858398, "global_step": 67814, "epoch": 403} {"train_loss": -9.0174560546875, "global_step": 67815, "epoch": 403} {"train_loss": -8.948993682861328, "global_step": 67816, "epoch": 403} {"train_loss": -9.031346321105957, "global_step": 67817, "epoch": 403} {"train_loss": -8.79287052154541, "global_step": 67818, "epoch": 403} {"train_loss": -8.991975784301758, "global_step": 67819, "epoch": 403} {"train_loss": -8.85008430480957, "global_step": 67820, "epoch": 403} {"train_loss": -8.8653564453125, "global_step": 67821, "epoch": 403} {"train_loss": -9.150579452514648, "global_step": 67822, "epoch": 403} {"train_loss": -8.786252975463867, "global_step": 67823, "epoch": 403} {"train_loss": -8.846006393432617, "global_step": 67824, "epoch": 403} {"train_loss": -8.939332008361816, "global_step": 67825, "epoch": 403} {"train_loss": -8.638851165771484, "global_step": 67826, "epoch": 403} {"train_loss": -8.884538650512695, "global_step": 67827, "epoch": 403} {"train_loss": -9.2252197265625, "global_step": 67828, "epoch": 403} {"train_loss": -8.746028900146484, "global_step": 67829, "epoch": 403} {"train_loss": -8.676637649536133, "global_step": 67830, "epoch": 403} {"train_loss": -8.947525024414062, "global_step": 67831, "epoch": 403} {"train_loss": -8.906713485717773, "global_step": 67832, "epoch": 403} {"train_loss": -8.866785049438477, "global_step": 67833, "epoch": 403} {"train_loss": -8.791011810302734, "global_step": 67834, "epoch": 403} {"train_loss": -9.013589859008789, "global_step": 67835, "epoch": 403} {"train_loss": -8.717767715454102, "global_step": 67836, "epoch": 403} {"train_loss": -8.944643020629883, "global_step": 67837, "epoch": 403} {"train_loss": -8.914346694946289, "global_step": 67838, "epoch": 403} {"train_loss": -8.728656768798828, "global_step": 67839, "epoch": 403} {"train_loss": -9.04650592803955, "global_step": 67840, "epoch": 403} {"train_loss": -8.99679946899414, "global_step": 67841, "epoch": 403} {"train_loss": -8.716763496398926, "global_step": 67842, "epoch": 403} {"train_loss": -8.932090759277344, "global_step": 67843, "epoch": 403} {"train_loss": -9.0548095703125, "global_step": 67844, "epoch": 403} {"train_loss": -8.525453567504883, "global_step": 67845, "epoch": 403} {"train_loss": -8.899435043334961, "global_step": 67846, "epoch": 403} {"train_loss": -8.502570152282715, "global_step": 67847, "epoch": 403} {"train_loss": -8.92985725402832, "global_step": 67848, "epoch": 403} {"train_loss": -8.857670783996582, "global_step": 67849, "epoch": 403} {"train_loss": -8.97297191619873, "global_step": 67850, "epoch": 403} {"train_loss": -8.788300514221191, "global_step": 67851, "epoch": 403} {"train_loss": -8.702695846557617, "global_step": 67852, "epoch": 403} {"train_loss": -8.83285140991211, "global_step": 67853, "epoch": 403} {"train_loss": -8.489953994750977, "global_step": 67854, "epoch": 403} {"train_loss": -8.975226402282715, "global_step": 67855, "epoch": 403} {"train_loss": -8.844724655151367, "global_step": 67856, "epoch": 403} {"train_loss": -8.90657901763916, "global_step": 67857, "epoch": 403} {"train_loss": -8.726500511169434, "global_step": 67858, "epoch": 403} {"train_loss": -8.825909614562988, "global_step": 67859, "epoch": 403} {"train_loss": -8.922483444213867, "global_step": 67860, "epoch": 403} {"train_loss": -8.921150207519531, "global_step": 67861, "epoch": 403} {"train_loss": -8.953640937805176, "global_step": 67862, "epoch": 403} {"train_loss": -8.663993835449219, "global_step": 67863, "epoch": 403} {"train_loss": -8.9098539352417, "global_step": 67864, "epoch": 403} {"train_loss": -8.859613418579102, "global_step": 67865, "epoch": 403} {"train_loss": -8.85551643371582, "global_step": 67866, "epoch": 403} {"train_loss": -8.956310272216797, "global_step": 67867, "epoch": 403} {"train_loss": -8.765016555786133, "global_step": 67868, "epoch": 403} {"train_loss": -8.804169654846191, "global_step": 67869, "epoch": 403} {"train_loss": -9.066417694091797, "global_step": 67870, "epoch": 403} {"train_loss": -8.789589365323385, "global_step": 67871, "epoch": 403, "val_loss": 193215.578125} {"train_loss": -8.865509033203125, "global_step": 67872, "epoch": 404} {"train_loss": -8.84326457977295, "global_step": 67873, "epoch": 404} {"train_loss": -8.791805267333984, "global_step": 67874, "epoch": 404} {"train_loss": -8.863489151000977, "global_step": 67875, "epoch": 404} {"train_loss": -8.816276550292969, "global_step": 67876, "epoch": 404} {"train_loss": -9.03862190246582, "global_step": 67877, "epoch": 404} {"train_loss": -9.012784957885742, "global_step": 67878, "epoch": 404} {"train_loss": -9.028299331665039, "global_step": 67879, "epoch": 404} {"train_loss": -8.926811218261719, "global_step": 67880, "epoch": 404} {"train_loss": -9.207913398742676, "global_step": 67881, "epoch": 404} {"train_loss": -8.912322998046875, "global_step": 67882, "epoch": 404} {"train_loss": -8.98543643951416, "global_step": 67883, "epoch": 404} {"train_loss": -8.964363098144531, "global_step": 67884, "epoch": 404} {"train_loss": -8.915425300598145, "global_step": 67885, "epoch": 404} {"train_loss": -9.032576560974121, "global_step": 67886, "epoch": 404} {"train_loss": -8.85644245147705, "global_step": 67887, "epoch": 404} {"train_loss": -9.070603370666504, "global_step": 67888, "epoch": 404} {"train_loss": -8.92788314819336, "global_step": 67889, "epoch": 404} {"train_loss": -9.251553535461426, "global_step": 67890, "epoch": 404} {"train_loss": -9.020883560180664, "global_step": 67891, "epoch": 404} {"train_loss": -8.831277847290039, "global_step": 67892, "epoch": 404} {"train_loss": -8.883646011352539, "global_step": 67893, "epoch": 404} {"train_loss": -9.218645095825195, "global_step": 67894, "epoch": 404} {"train_loss": -9.034143447875977, "global_step": 67895, "epoch": 404} {"train_loss": -9.016386032104492, "global_step": 67896, "epoch": 404} {"train_loss": -9.073880195617676, "global_step": 67897, "epoch": 404} {"train_loss": -8.757818222045898, "global_step": 67898, "epoch": 404} {"train_loss": -8.748918533325195, "global_step": 67899, "epoch": 404} {"train_loss": -8.887636184692383, "global_step": 67900, "epoch": 404} {"train_loss": -8.815330505371094, "global_step": 67901, "epoch": 404} {"train_loss": -8.742542266845703, "global_step": 67902, "epoch": 404} {"train_loss": -8.522945404052734, "global_step": 67903, "epoch": 404} {"train_loss": -8.227871894836426, "global_step": 67904, "epoch": 404} {"train_loss": -8.99332332611084, "global_step": 67905, "epoch": 404} {"train_loss": -8.533252716064453, "global_step": 67906, "epoch": 404} {"train_loss": -8.665298461914062, "global_step": 67907, "epoch": 404} {"train_loss": -8.321812629699707, "global_step": 67908, "epoch": 404} {"train_loss": -8.776103973388672, "global_step": 67909, "epoch": 404} {"train_loss": -8.506803512573242, "global_step": 67910, "epoch": 404} {"train_loss": -8.529463768005371, "global_step": 67911, "epoch": 404} {"train_loss": -8.644525527954102, "global_step": 67912, "epoch": 404} {"train_loss": -8.660659790039062, "global_step": 67913, "epoch": 404} {"train_loss": -8.642916679382324, "global_step": 67914, "epoch": 404} {"train_loss": -8.98141098022461, "global_step": 67915, "epoch": 404} {"train_loss": -8.64058780670166, "global_step": 67916, "epoch": 404} {"train_loss": -8.345446586608887, "global_step": 67917, "epoch": 404} {"train_loss": -8.649392127990723, "global_step": 67918, "epoch": 404} {"train_loss": -8.696676254272461, "global_step": 67919, "epoch": 404} {"train_loss": -8.695110321044922, "global_step": 67920, "epoch": 404} {"train_loss": -8.693632125854492, "global_step": 67921, "epoch": 404} {"train_loss": -8.842141151428223, "global_step": 67922, "epoch": 404} {"train_loss": -8.890649795532227, "global_step": 67923, "epoch": 404} {"train_loss": -8.801095962524414, "global_step": 67924, "epoch": 404} {"train_loss": -8.784095764160156, "global_step": 67925, "epoch": 404} {"train_loss": -8.817217826843262, "global_step": 67926, "epoch": 404} {"train_loss": -8.7351655960083, "global_step": 67927, "epoch": 404} {"train_loss": -8.686511039733887, "global_step": 67928, "epoch": 404} {"train_loss": -8.912065505981445, "global_step": 67929, "epoch": 404} {"train_loss": -8.721905708312988, "global_step": 67930, "epoch": 404} {"train_loss": -8.833456039428711, "global_step": 67931, "epoch": 404} {"train_loss": -8.824667930603027, "global_step": 67932, "epoch": 404} {"train_loss": -8.927987098693848, "global_step": 67933, "epoch": 404} {"train_loss": -8.965421676635742, "global_step": 67934, "epoch": 404} {"train_loss": -8.781290054321289, "global_step": 67935, "epoch": 404} {"train_loss": -8.908114433288574, "global_step": 67936, "epoch": 404} {"train_loss": -8.972253799438477, "global_step": 67937, "epoch": 404} {"train_loss": -8.698348999023438, "global_step": 67938, "epoch": 404} {"train_loss": -8.570500373840332, "global_step": 67939, "epoch": 404} {"train_loss": -8.993959426879883, "global_step": 67940, "epoch": 404} {"train_loss": -8.610111236572266, "global_step": 67941, "epoch": 404} {"train_loss": -8.803510665893555, "global_step": 67942, "epoch": 404} {"train_loss": -8.670647621154785, "global_step": 67943, "epoch": 404} {"train_loss": -8.858123779296875, "global_step": 67944, "epoch": 404} {"train_loss": -8.867586135864258, "global_step": 67945, "epoch": 404} {"train_loss": -8.77401351928711, "global_step": 67946, "epoch": 404} {"train_loss": -8.688873291015625, "global_step": 67947, "epoch": 404} {"train_loss": -8.758105278015137, "global_step": 67948, "epoch": 404} {"train_loss": -8.524436950683594, "global_step": 67949, "epoch": 404} {"train_loss": -8.726715087890625, "global_step": 67950, "epoch": 404} {"train_loss": -8.74492359161377, "global_step": 67951, "epoch": 404} {"train_loss": -8.63390827178955, "global_step": 67952, "epoch": 404} {"train_loss": -8.828519821166992, "global_step": 67953, "epoch": 404} {"train_loss": -8.848461151123047, "global_step": 67954, "epoch": 404} {"train_loss": -8.807031631469727, "global_step": 67955, "epoch": 404} {"train_loss": -9.026612281799316, "global_step": 67956, "epoch": 404} {"train_loss": -8.889917373657227, "global_step": 67957, "epoch": 404} {"train_loss": -8.695289611816406, "global_step": 67958, "epoch": 404} {"train_loss": -9.071146011352539, "global_step": 67959, "epoch": 404} {"train_loss": -9.061217308044434, "global_step": 67960, "epoch": 404} {"train_loss": -9.056739807128906, "global_step": 67961, "epoch": 404} {"train_loss": -8.873373031616211, "global_step": 67962, "epoch": 404} {"train_loss": -8.805917739868164, "global_step": 67963, "epoch": 404} {"train_loss": -8.819019317626953, "global_step": 67964, "epoch": 404} {"train_loss": -8.891044616699219, "global_step": 67965, "epoch": 404} {"train_loss": -8.760849952697754, "global_step": 67966, "epoch": 404} {"train_loss": -8.783138275146484, "global_step": 67967, "epoch": 404} {"train_loss": -8.734613418579102, "global_step": 67968, "epoch": 404} {"train_loss": -8.831171989440918, "global_step": 67969, "epoch": 404} {"train_loss": -8.80687141418457, "global_step": 67970, "epoch": 404} {"train_loss": -8.89999771118164, "global_step": 67971, "epoch": 404} {"train_loss": -8.902326583862305, "global_step": 67972, "epoch": 404} {"train_loss": -8.98222541809082, "global_step": 67973, "epoch": 404} {"train_loss": -8.897502899169922, "global_step": 67974, "epoch": 404} {"train_loss": -8.851606369018555, "global_step": 67975, "epoch": 404} {"train_loss": -8.99709701538086, "global_step": 67976, "epoch": 404} {"train_loss": -8.996959686279297, "global_step": 67977, "epoch": 404} {"train_loss": -9.158356666564941, "global_step": 67978, "epoch": 404} {"train_loss": -8.925239562988281, "global_step": 67979, "epoch": 404} {"train_loss": -9.216066360473633, "global_step": 67980, "epoch": 404} {"train_loss": -8.803993225097656, "global_step": 67981, "epoch": 404} {"train_loss": -9.196704864501953, "global_step": 67982, "epoch": 404} {"train_loss": -8.895889282226562, "global_step": 67983, "epoch": 404} {"train_loss": -9.223753929138184, "global_step": 67984, "epoch": 404} {"train_loss": -9.119937896728516, "global_step": 67985, "epoch": 404} {"train_loss": -8.974613189697266, "global_step": 67986, "epoch": 404} {"train_loss": -8.740549087524414, "global_step": 67987, "epoch": 404} {"train_loss": -9.035501480102539, "global_step": 67988, "epoch": 404} {"train_loss": -8.765790939331055, "global_step": 67989, "epoch": 404} {"train_loss": -8.873855590820312, "global_step": 67990, "epoch": 404} {"train_loss": -8.840067863464355, "global_step": 67991, "epoch": 404} {"train_loss": -8.390188217163086, "global_step": 67992, "epoch": 404} {"train_loss": -8.648179054260254, "global_step": 67993, "epoch": 404} {"train_loss": -7.891531944274902, "global_step": 67994, "epoch": 404} {"train_loss": -8.487186431884766, "global_step": 67995, "epoch": 404} {"train_loss": -8.478188514709473, "global_step": 67996, "epoch": 404} {"train_loss": -8.312148094177246, "global_step": 67997, "epoch": 404} {"train_loss": -8.658849716186523, "global_step": 67998, "epoch": 404} {"train_loss": -9.008625030517578, "global_step": 67999, "epoch": 404} {"train_loss": -8.617292404174805, "global_step": 68000, "epoch": 404} {"train_loss": -8.51858901977539, "global_step": 68001, "epoch": 404} {"train_loss": -8.758099555969238, "global_step": 68002, "epoch": 404} {"train_loss": -8.578338623046875, "global_step": 68003, "epoch": 404} {"train_loss": -8.5839204788208, "global_step": 68004, "epoch": 404} {"train_loss": -8.52673053741455, "global_step": 68005, "epoch": 404} {"train_loss": -8.556686401367188, "global_step": 68006, "epoch": 404} {"train_loss": -8.790297508239746, "global_step": 68007, "epoch": 404} {"train_loss": -8.577709197998047, "global_step": 68008, "epoch": 404} {"train_loss": -8.90652847290039, "global_step": 68009, "epoch": 404} {"train_loss": -8.787017822265625, "global_step": 68010, "epoch": 404} {"train_loss": -8.755558967590332, "global_step": 68011, "epoch": 404} {"train_loss": -8.705782890319824, "global_step": 68012, "epoch": 404} {"train_loss": -8.641742706298828, "global_step": 68013, "epoch": 404} {"train_loss": -8.774656295776367, "global_step": 68014, "epoch": 404} {"train_loss": -8.750920295715332, "global_step": 68015, "epoch": 404} {"train_loss": -8.935554504394531, "global_step": 68016, "epoch": 404} {"train_loss": -8.75141429901123, "global_step": 68017, "epoch": 404} {"train_loss": -8.739151000976562, "global_step": 68018, "epoch": 404} {"train_loss": -8.823698043823242, "global_step": 68019, "epoch": 404} {"train_loss": -8.951542854309082, "global_step": 68020, "epoch": 404} {"train_loss": -9.06475830078125, "global_step": 68021, "epoch": 404} {"train_loss": -9.038663864135742, "global_step": 68022, "epoch": 404} {"train_loss": -8.926008224487305, "global_step": 68023, "epoch": 404} {"train_loss": -8.902608871459961, "global_step": 68024, "epoch": 404} {"train_loss": -9.071130752563477, "global_step": 68025, "epoch": 404} {"train_loss": -9.019673347473145, "global_step": 68026, "epoch": 404} {"train_loss": -9.145174026489258, "global_step": 68027, "epoch": 404} {"train_loss": -9.084209442138672, "global_step": 68028, "epoch": 404} {"train_loss": -9.13609504699707, "global_step": 68029, "epoch": 404} {"train_loss": -9.097163200378418, "global_step": 68030, "epoch": 404} {"train_loss": -9.034603118896484, "global_step": 68031, "epoch": 404} {"train_loss": -8.939234733581543, "global_step": 68032, "epoch": 404} {"train_loss": -9.105979919433594, "global_step": 68033, "epoch": 404} {"train_loss": -8.795404434204102, "global_step": 68034, "epoch": 404} {"train_loss": -9.001161575317383, "global_step": 68035, "epoch": 404} {"train_loss": -8.877960205078125, "global_step": 68036, "epoch": 404} {"train_loss": -8.920980453491211, "global_step": 68037, "epoch": 404} {"train_loss": -8.757561683654785, "global_step": 68038, "epoch": 404} {"train_loss": -8.829354819797334, "global_step": 68039, "epoch": 404, "val_loss": 192504.546875} {"train_loss": -9.023096084594727, "global_step": 68040, "epoch": 405} {"train_loss": -9.034513473510742, "global_step": 68041, "epoch": 405} {"train_loss": -9.038788795471191, "global_step": 68042, "epoch": 405} {"train_loss": -9.0238676071167, "global_step": 68043, "epoch": 405} {"train_loss": -9.14863395690918, "global_step": 68044, "epoch": 405} {"train_loss": -9.10734748840332, "global_step": 68045, "epoch": 405} {"train_loss": -9.160362243652344, "global_step": 68046, "epoch": 405} {"train_loss": -8.973962783813477, "global_step": 68047, "epoch": 405} {"train_loss": -9.14114761352539, "global_step": 68048, "epoch": 405} {"train_loss": -9.035937309265137, "global_step": 68049, "epoch": 405} {"train_loss": -9.081278800964355, "global_step": 68050, "epoch": 405} {"train_loss": -8.90980339050293, "global_step": 68051, "epoch": 405} {"train_loss": -9.058337211608887, "global_step": 68052, "epoch": 405} {"train_loss": -8.846839904785156, "global_step": 68053, "epoch": 405} {"train_loss": -8.989378929138184, "global_step": 68054, "epoch": 405} {"train_loss": -8.734919548034668, "global_step": 68055, "epoch": 405} {"train_loss": -8.762907981872559, "global_step": 68056, "epoch": 405} {"train_loss": -8.704272270202637, "global_step": 68057, "epoch": 405} {"train_loss": -8.683494567871094, "global_step": 68058, "epoch": 405} {"train_loss": -8.85552978515625, "global_step": 68059, "epoch": 405} {"train_loss": -9.001874923706055, "global_step": 68060, "epoch": 405} {"train_loss": -8.759469985961914, "global_step": 68061, "epoch": 405} {"train_loss": -8.630359649658203, "global_step": 68062, "epoch": 405} {"train_loss": -8.96257209777832, "global_step": 68063, "epoch": 405} {"train_loss": -8.799925804138184, "global_step": 68064, "epoch": 405} {"train_loss": -8.787554740905762, "global_step": 68065, "epoch": 405} {"train_loss": -8.899628639221191, "global_step": 68066, "epoch": 405} {"train_loss": -8.944852828979492, "global_step": 68067, "epoch": 405} {"train_loss": -9.039670944213867, "global_step": 68068, "epoch": 405} {"train_loss": -8.964862823486328, "global_step": 68069, "epoch": 405} {"train_loss": -8.90243911743164, "global_step": 68070, "epoch": 405} {"train_loss": -8.96729850769043, "global_step": 68071, "epoch": 405} {"train_loss": -9.08150577545166, "global_step": 68072, "epoch": 405} {"train_loss": -8.914033889770508, "global_step": 68073, "epoch": 405} {"train_loss": -9.014786720275879, "global_step": 68074, "epoch": 405} {"train_loss": -8.883852005004883, "global_step": 68075, "epoch": 405} {"train_loss": -9.038228988647461, "global_step": 68076, "epoch": 405} {"train_loss": -9.11221694946289, "global_step": 68077, "epoch": 405} {"train_loss": -9.14222526550293, "global_step": 68078, "epoch": 405} {"train_loss": -8.46047306060791, "global_step": 68079, "epoch": 405} {"train_loss": -9.178617477416992, "global_step": 68080, "epoch": 405} {"train_loss": -8.33950138092041, "global_step": 68081, "epoch": 405} {"train_loss": -8.739227294921875, "global_step": 68082, "epoch": 405} {"train_loss": -8.741008758544922, "global_step": 68083, "epoch": 405} {"train_loss": -8.950284957885742, "global_step": 68084, "epoch": 405} {"train_loss": -8.789395332336426, "global_step": 68085, "epoch": 405} {"train_loss": -8.913593292236328, "global_step": 68086, "epoch": 405} {"train_loss": -8.645683288574219, "global_step": 68087, "epoch": 405} {"train_loss": -8.736306190490723, "global_step": 68088, "epoch": 405} {"train_loss": -8.735654830932617, "global_step": 68089, "epoch": 405} {"train_loss": -8.76943588256836, "global_step": 68090, "epoch": 405} {"train_loss": -9.047685623168945, "global_step": 68091, "epoch": 405} {"train_loss": -8.799524307250977, "global_step": 68092, "epoch": 405} {"train_loss": -9.031233787536621, "global_step": 68093, "epoch": 405} {"train_loss": -8.974106788635254, "global_step": 68094, "epoch": 405} {"train_loss": -9.011137962341309, "global_step": 68095, "epoch": 405} {"train_loss": -8.86878776550293, "global_step": 68096, "epoch": 405} {"train_loss": -9.087233543395996, "global_step": 68097, "epoch": 405} {"train_loss": -9.088854789733887, "global_step": 68098, "epoch": 405} {"train_loss": -8.751981735229492, "global_step": 68099, "epoch": 405} {"train_loss": -9.085091590881348, "global_step": 68100, "epoch": 405} {"train_loss": -8.649003982543945, "global_step": 68101, "epoch": 405} {"train_loss": -8.699024200439453, "global_step": 68102, "epoch": 405} {"train_loss": -8.703536987304688, "global_step": 68103, "epoch": 405} {"train_loss": -8.738306045532227, "global_step": 68104, "epoch": 405} {"train_loss": -8.964487075805664, "global_step": 68105, "epoch": 405} {"train_loss": -9.034225463867188, "global_step": 68106, "epoch": 405} {"train_loss": -9.011455535888672, "global_step": 68107, "epoch": 405} {"train_loss": -8.954455375671387, "global_step": 68108, "epoch": 405} {"train_loss": -8.901611328125, "global_step": 68109, "epoch": 405} {"train_loss": -9.106030464172363, "global_step": 68110, "epoch": 405} {"train_loss": -9.176712989807129, "global_step": 68111, "epoch": 405} {"train_loss": -8.628175735473633, "global_step": 68112, "epoch": 405} {"train_loss": -9.217981338500977, "global_step": 68113, "epoch": 405} {"train_loss": -8.779010772705078, "global_step": 68114, "epoch": 405} {"train_loss": -8.942036628723145, "global_step": 68115, "epoch": 405} {"train_loss": -9.057938575744629, "global_step": 68116, "epoch": 405} {"train_loss": -8.160196304321289, "global_step": 68117, "epoch": 405} {"train_loss": -8.864648818969727, "global_step": 68118, "epoch": 405} {"train_loss": -7.812211990356445, "global_step": 68119, "epoch": 405} {"train_loss": -8.733131408691406, "global_step": 68120, "epoch": 405} {"train_loss": -8.094613075256348, "global_step": 68121, "epoch": 405} {"train_loss": -8.56651496887207, "global_step": 68122, "epoch": 405} {"train_loss": -8.362468719482422, "global_step": 68123, "epoch": 405} {"train_loss": -8.49554443359375, "global_step": 68124, "epoch": 405} {"train_loss": -8.505880355834961, "global_step": 68125, "epoch": 405} {"train_loss": -8.782052993774414, "global_step": 68126, "epoch": 405} {"train_loss": -8.608541488647461, "global_step": 68127, "epoch": 405} {"train_loss": -8.56296157836914, "global_step": 68128, "epoch": 405} {"train_loss": -8.417095184326172, "global_step": 68129, "epoch": 405} {"train_loss": -8.789295196533203, "global_step": 68130, "epoch": 405} {"train_loss": -8.526931762695312, "global_step": 68131, "epoch": 405} {"train_loss": -8.458723068237305, "global_step": 68132, "epoch": 405} {"train_loss": -8.582475662231445, "global_step": 68133, "epoch": 405} {"train_loss": -8.53757095336914, "global_step": 68134, "epoch": 405} {"train_loss": -8.90731430053711, "global_step": 68135, "epoch": 405} {"train_loss": -8.751640319824219, "global_step": 68136, "epoch": 405} {"train_loss": -8.583759307861328, "global_step": 68137, "epoch": 405} {"train_loss": -8.821819305419922, "global_step": 68138, "epoch": 405} {"train_loss": -8.718755722045898, "global_step": 68139, "epoch": 405} {"train_loss": -8.924473762512207, "global_step": 68140, "epoch": 405} {"train_loss": -8.704501152038574, "global_step": 68141, "epoch": 405} {"train_loss": -8.806842803955078, "global_step": 68142, "epoch": 405} {"train_loss": -8.532452583312988, "global_step": 68143, "epoch": 405} {"train_loss": -8.828062057495117, "global_step": 68144, "epoch": 405} {"train_loss": -8.842493057250977, "global_step": 68145, "epoch": 405} {"train_loss": -8.910619735717773, "global_step": 68146, "epoch": 405} {"train_loss": -8.846789360046387, "global_step": 68147, "epoch": 405} {"train_loss": -8.633766174316406, "global_step": 68148, "epoch": 405} {"train_loss": -8.834646224975586, "global_step": 68149, "epoch": 405} {"train_loss": -8.787168502807617, "global_step": 68150, "epoch": 405} {"train_loss": -8.900138854980469, "global_step": 68151, "epoch": 405} {"train_loss": -8.859309196472168, "global_step": 68152, "epoch": 405} {"train_loss": -8.94504165649414, "global_step": 68153, "epoch": 405} {"train_loss": -8.879671096801758, "global_step": 68154, "epoch": 405} {"train_loss": -9.080093383789062, "global_step": 68155, "epoch": 405} {"train_loss": -9.054903030395508, "global_step": 68156, "epoch": 405} {"train_loss": -8.766204833984375, "global_step": 68157, "epoch": 405} {"train_loss": -8.916577339172363, "global_step": 68158, "epoch": 405} {"train_loss": -9.048887252807617, "global_step": 68159, "epoch": 405} {"train_loss": -8.78438949584961, "global_step": 68160, "epoch": 405} {"train_loss": -9.06020736694336, "global_step": 68161, "epoch": 405} {"train_loss": -8.860509872436523, "global_step": 68162, "epoch": 405} {"train_loss": -8.763086318969727, "global_step": 68163, "epoch": 405} {"train_loss": -9.127641677856445, "global_step": 68164, "epoch": 405} {"train_loss": -8.826555252075195, "global_step": 68165, "epoch": 405} {"train_loss": -8.857345581054688, "global_step": 68166, "epoch": 405} {"train_loss": -9.2001371383667, "global_step": 68167, "epoch": 405} {"train_loss": -9.106058120727539, "global_step": 68168, "epoch": 405} {"train_loss": -8.955820083618164, "global_step": 68169, "epoch": 405} {"train_loss": -8.73781967163086, "global_step": 68170, "epoch": 405} {"train_loss": -8.788631439208984, "global_step": 68171, "epoch": 405} {"train_loss": -8.916547775268555, "global_step": 68172, "epoch": 405} {"train_loss": -8.665275573730469, "global_step": 68173, "epoch": 405} {"train_loss": -8.55689811706543, "global_step": 68174, "epoch": 405} {"train_loss": -8.928410530090332, "global_step": 68175, "epoch": 405} {"train_loss": -8.209794044494629, "global_step": 68176, "epoch": 405} {"train_loss": -8.747821807861328, "global_step": 68177, "epoch": 405} {"train_loss": -8.780739784240723, "global_step": 68178, "epoch": 405} {"train_loss": -8.719794273376465, "global_step": 68179, "epoch": 405} {"train_loss": -8.660224914550781, "global_step": 68180, "epoch": 405} {"train_loss": -8.847248077392578, "global_step": 68181, "epoch": 405} {"train_loss": -8.935636520385742, "global_step": 68182, "epoch": 405} {"train_loss": -8.520794868469238, "global_step": 68183, "epoch": 405} {"train_loss": -8.721521377563477, "global_step": 68184, "epoch": 405} {"train_loss": -8.861106872558594, "global_step": 68185, "epoch": 405} {"train_loss": -8.975915908813477, "global_step": 68186, "epoch": 405} {"train_loss": -8.777957916259766, "global_step": 68187, "epoch": 405} {"train_loss": -8.99660873413086, "global_step": 68188, "epoch": 405} {"train_loss": -8.842872619628906, "global_step": 68189, "epoch": 405} {"train_loss": -8.80088996887207, "global_step": 68190, "epoch": 405} {"train_loss": -9.00787353515625, "global_step": 68191, "epoch": 405} {"train_loss": -8.71558666229248, "global_step": 68192, "epoch": 405} {"train_loss": -8.848159790039062, "global_step": 68193, "epoch": 405} {"train_loss": -8.799001693725586, "global_step": 68194, "epoch": 405} {"train_loss": -8.798457145690918, "global_step": 68195, "epoch": 405} {"train_loss": -8.969488143920898, "global_step": 68196, "epoch": 405} {"train_loss": -9.067441940307617, "global_step": 68197, "epoch": 405} {"train_loss": -8.849137306213379, "global_step": 68198, "epoch": 405} {"train_loss": -9.022777557373047, "global_step": 68199, "epoch": 405} {"train_loss": -8.848188400268555, "global_step": 68200, "epoch": 405} {"train_loss": -8.627500534057617, "global_step": 68201, "epoch": 405} {"train_loss": -9.004613876342773, "global_step": 68202, "epoch": 405} {"train_loss": -8.75462532043457, "global_step": 68203, "epoch": 405} {"train_loss": -8.860322952270508, "global_step": 68204, "epoch": 405} {"train_loss": -9.019569396972656, "global_step": 68205, "epoch": 405} {"train_loss": -8.971662521362305, "global_step": 68206, "epoch": 405} {"train_loss": -8.839362064997355, "global_step": 68207, "epoch": 405, "val_loss": 194399.90625, "train_action_mse_error": 8.72553825378418} {"train_loss": -8.903555870056152, "global_step": 68208, "epoch": 406} {"train_loss": -8.89361572265625, "global_step": 68209, "epoch": 406} {"train_loss": -8.715421676635742, "global_step": 68210, "epoch": 406} {"train_loss": -9.032673835754395, "global_step": 68211, "epoch": 406} {"train_loss": -8.89281177520752, "global_step": 68212, "epoch": 406} {"train_loss": -9.148975372314453, "global_step": 68213, "epoch": 406} {"train_loss": -8.897600173950195, "global_step": 68214, "epoch": 406} {"train_loss": -8.784774780273438, "global_step": 68215, "epoch": 406} {"train_loss": -8.775901794433594, "global_step": 68216, "epoch": 406} {"train_loss": -8.988460540771484, "global_step": 68217, "epoch": 406} {"train_loss": -9.014120101928711, "global_step": 68218, "epoch": 406} {"train_loss": -8.824605941772461, "global_step": 68219, "epoch": 406} {"train_loss": -8.782909393310547, "global_step": 68220, "epoch": 406} {"train_loss": -8.8076810836792, "global_step": 68221, "epoch": 406} {"train_loss": -8.738313674926758, "global_step": 68222, "epoch": 406} {"train_loss": -9.091931343078613, "global_step": 68223, "epoch": 406} {"train_loss": -8.807720184326172, "global_step": 68224, "epoch": 406} {"train_loss": -8.791682243347168, "global_step": 68225, "epoch": 406} {"train_loss": -8.95378303527832, "global_step": 68226, "epoch": 406} {"train_loss": -8.679792404174805, "global_step": 68227, "epoch": 406} {"train_loss": -8.773801803588867, "global_step": 68228, "epoch": 406} {"train_loss": -8.966816902160645, "global_step": 68229, "epoch": 406} {"train_loss": -8.93185806274414, "global_step": 68230, "epoch": 406} {"train_loss": -8.99266242980957, "global_step": 68231, "epoch": 406} {"train_loss": -8.572072982788086, "global_step": 68232, "epoch": 406} {"train_loss": -8.729619979858398, "global_step": 68233, "epoch": 406} {"train_loss": -8.77077865600586, "global_step": 68234, "epoch": 406} {"train_loss": -8.663239479064941, "global_step": 68235, "epoch": 406} {"train_loss": -8.613801002502441, "global_step": 68236, "epoch": 406} {"train_loss": -8.99677848815918, "global_step": 68237, "epoch": 406} {"train_loss": -8.950058937072754, "global_step": 68238, "epoch": 406} {"train_loss": -8.83337116241455, "global_step": 68239, "epoch": 406} {"train_loss": -8.845961570739746, "global_step": 68240, "epoch": 406} {"train_loss": -8.997014045715332, "global_step": 68241, "epoch": 406} {"train_loss": -8.933574676513672, "global_step": 68242, "epoch": 406} {"train_loss": -8.919000625610352, "global_step": 68243, "epoch": 406} {"train_loss": -9.069635391235352, "global_step": 68244, "epoch": 406} {"train_loss": -8.546097755432129, "global_step": 68245, "epoch": 406} {"train_loss": -8.978132247924805, "global_step": 68246, "epoch": 406} {"train_loss": -8.934926986694336, "global_step": 68247, "epoch": 406} {"train_loss": -8.914457321166992, "global_step": 68248, "epoch": 406} {"train_loss": -8.92204761505127, "global_step": 68249, "epoch": 406} {"train_loss": -8.654891967773438, "global_step": 68250, "epoch": 406} {"train_loss": -8.848394393920898, "global_step": 68251, "epoch": 406} {"train_loss": -8.852994918823242, "global_step": 68252, "epoch": 406} {"train_loss": -8.67929458618164, "global_step": 68253, "epoch": 406} {"train_loss": -8.7567138671875, "global_step": 68254, "epoch": 406} {"train_loss": -8.772693634033203, "global_step": 68255, "epoch": 406} {"train_loss": -8.789934158325195, "global_step": 68256, "epoch": 406} {"train_loss": -8.89730453491211, "global_step": 68257, "epoch": 406} {"train_loss": -8.883211135864258, "global_step": 68258, "epoch": 406} {"train_loss": -8.783358573913574, "global_step": 68259, "epoch": 406} {"train_loss": -8.809659957885742, "global_step": 68260, "epoch": 406} {"train_loss": -8.76319408416748, "global_step": 68261, "epoch": 406} {"train_loss": -8.37081241607666, "global_step": 68262, "epoch": 406} {"train_loss": -8.903675079345703, "global_step": 68263, "epoch": 406} {"train_loss": -8.743355751037598, "global_step": 68264, "epoch": 406} {"train_loss": -8.829750061035156, "global_step": 68265, "epoch": 406} {"train_loss": -8.824548721313477, "global_step": 68266, "epoch": 406} {"train_loss": -8.776900291442871, "global_step": 68267, "epoch": 406} {"train_loss": -8.826858520507812, "global_step": 68268, "epoch": 406} {"train_loss": -8.867790222167969, "global_step": 68269, "epoch": 406} {"train_loss": -8.959056854248047, "global_step": 68270, "epoch": 406} {"train_loss": -9.097513198852539, "global_step": 68271, "epoch": 406} {"train_loss": -8.8463773727417, "global_step": 68272, "epoch": 406} {"train_loss": -8.818572998046875, "global_step": 68273, "epoch": 406} {"train_loss": -8.814099311828613, "global_step": 68274, "epoch": 406} {"train_loss": -8.63508129119873, "global_step": 68275, "epoch": 406} {"train_loss": -9.033614158630371, "global_step": 68276, "epoch": 406} {"train_loss": -8.531277656555176, "global_step": 68277, "epoch": 406} {"train_loss": -8.970741271972656, "global_step": 68278, "epoch": 406} {"train_loss": -8.84878158569336, "global_step": 68279, "epoch": 406} {"train_loss": -9.024592399597168, "global_step": 68280, "epoch": 406} {"train_loss": -9.014251708984375, "global_step": 68281, "epoch": 406} {"train_loss": -9.060240745544434, "global_step": 68282, "epoch": 406} {"train_loss": -8.845072746276855, "global_step": 68283, "epoch": 406} {"train_loss": -8.913637161254883, "global_step": 68284, "epoch": 406} {"train_loss": -9.11228084564209, "global_step": 68285, "epoch": 406} {"train_loss": -8.755979537963867, "global_step": 68286, "epoch": 406} {"train_loss": -9.0066556930542, "global_step": 68287, "epoch": 406} {"train_loss": -8.81556510925293, "global_step": 68288, "epoch": 406} {"train_loss": -8.7550630569458, "global_step": 68289, "epoch": 406} {"train_loss": -8.886889457702637, "global_step": 68290, "epoch": 406} {"train_loss": -9.244172096252441, "global_step": 68291, "epoch": 406} {"train_loss": -8.689803123474121, "global_step": 68292, "epoch": 406} {"train_loss": -9.037315368652344, "global_step": 68293, "epoch": 406} {"train_loss": -8.865447998046875, "global_step": 68294, "epoch": 406} {"train_loss": -8.822427749633789, "global_step": 68295, "epoch": 406} {"train_loss": -8.497279167175293, "global_step": 68296, "epoch": 406} {"train_loss": -8.755683898925781, "global_step": 68297, "epoch": 406} {"train_loss": -8.649768829345703, "global_step": 68298, "epoch": 406} {"train_loss": -8.855673789978027, "global_step": 68299, "epoch": 406} {"train_loss": -8.6362886428833, "global_step": 68300, "epoch": 406} {"train_loss": -8.851394653320312, "global_step": 68301, "epoch": 406} {"train_loss": -8.872387886047363, "global_step": 68302, "epoch": 406} {"train_loss": -8.761231422424316, "global_step": 68303, "epoch": 406} {"train_loss": -8.71760368347168, "global_step": 68304, "epoch": 406} {"train_loss": -8.954771995544434, "global_step": 68305, "epoch": 406} {"train_loss": -8.74610424041748, "global_step": 68306, "epoch": 406} {"train_loss": -8.860061645507812, "global_step": 68307, "epoch": 406} {"train_loss": -8.871166229248047, "global_step": 68308, "epoch": 406} {"train_loss": -8.842026710510254, "global_step": 68309, "epoch": 406} {"train_loss": -8.631007194519043, "global_step": 68310, "epoch": 406} {"train_loss": -8.90783405303955, "global_step": 68311, "epoch": 406} {"train_loss": -8.770380020141602, "global_step": 68312, "epoch": 406} {"train_loss": -8.920064926147461, "global_step": 68313, "epoch": 406} {"train_loss": -8.914262771606445, "global_step": 68314, "epoch": 406} {"train_loss": -8.863253593444824, "global_step": 68315, "epoch": 406} {"train_loss": -8.947969436645508, "global_step": 68316, "epoch": 406} {"train_loss": -8.732439041137695, "global_step": 68317, "epoch": 406} {"train_loss": -8.65875244140625, "global_step": 68318, "epoch": 406} {"train_loss": -8.766706466674805, "global_step": 68319, "epoch": 406} {"train_loss": -8.705354690551758, "global_step": 68320, "epoch": 406} {"train_loss": -8.976301193237305, "global_step": 68321, "epoch": 406} {"train_loss": -8.874773025512695, "global_step": 68322, "epoch": 406} {"train_loss": -8.892921447753906, "global_step": 68323, "epoch": 406} {"train_loss": -9.039103507995605, "global_step": 68324, "epoch": 406} {"train_loss": -8.935968399047852, "global_step": 68325, "epoch": 406} {"train_loss": -9.011263847351074, "global_step": 68326, "epoch": 406} {"train_loss": -9.09197998046875, "global_step": 68327, "epoch": 406} {"train_loss": -9.043460845947266, "global_step": 68328, "epoch": 406} {"train_loss": -8.88464641571045, "global_step": 68329, "epoch": 406} {"train_loss": -8.804064750671387, "global_step": 68330, "epoch": 406} {"train_loss": -8.680813789367676, "global_step": 68331, "epoch": 406} {"train_loss": -8.876577377319336, "global_step": 68332, "epoch": 406} {"train_loss": -9.14201545715332, "global_step": 68333, "epoch": 406} {"train_loss": -8.728858947753906, "global_step": 68334, "epoch": 406} {"train_loss": -8.897638320922852, "global_step": 68335, "epoch": 406} {"train_loss": -8.690208435058594, "global_step": 68336, "epoch": 406} {"train_loss": -8.834468841552734, "global_step": 68337, "epoch": 406} {"train_loss": -8.622568130493164, "global_step": 68338, "epoch": 406} {"train_loss": -8.693547248840332, "global_step": 68339, "epoch": 406} {"train_loss": -8.874449729919434, "global_step": 68340, "epoch": 406} {"train_loss": -8.644119262695312, "global_step": 68341, "epoch": 406} {"train_loss": -9.093287467956543, "global_step": 68342, "epoch": 406} {"train_loss": -8.87633991241455, "global_step": 68343, "epoch": 406} {"train_loss": -8.874425888061523, "global_step": 68344, "epoch": 406} {"train_loss": -8.986725807189941, "global_step": 68345, "epoch": 406} {"train_loss": -8.93524169921875, "global_step": 68346, "epoch": 406} {"train_loss": -8.975217819213867, "global_step": 68347, "epoch": 406} {"train_loss": -8.79622745513916, "global_step": 68348, "epoch": 406} {"train_loss": -9.057541847229004, "global_step": 68349, "epoch": 406} {"train_loss": -8.470211029052734, "global_step": 68350, "epoch": 406} {"train_loss": -8.97854232788086, "global_step": 68351, "epoch": 406} {"train_loss": -8.442120552062988, "global_step": 68352, "epoch": 406} {"train_loss": -8.966773986816406, "global_step": 68353, "epoch": 406} {"train_loss": -8.58831787109375, "global_step": 68354, "epoch": 406} {"train_loss": -8.998315811157227, "global_step": 68355, "epoch": 406} {"train_loss": -8.67530345916748, "global_step": 68356, "epoch": 406} {"train_loss": -8.751529693603516, "global_step": 68357, "epoch": 406} {"train_loss": -8.878494262695312, "global_step": 68358, "epoch": 406} {"train_loss": -9.102867126464844, "global_step": 68359, "epoch": 406} {"train_loss": -8.71358871459961, "global_step": 68360, "epoch": 406} {"train_loss": -8.832098007202148, "global_step": 68361, "epoch": 406} {"train_loss": -8.481048583984375, "global_step": 68362, "epoch": 406} {"train_loss": -8.994732856750488, "global_step": 68363, "epoch": 406} {"train_loss": -8.834632873535156, "global_step": 68364, "epoch": 406} {"train_loss": -8.647974014282227, "global_step": 68365, "epoch": 406} {"train_loss": -8.8240966796875, "global_step": 68366, "epoch": 406} {"train_loss": -8.797744750976562, "global_step": 68367, "epoch": 406} {"train_loss": -8.70936393737793, "global_step": 68368, "epoch": 406} {"train_loss": -8.919012069702148, "global_step": 68369, "epoch": 406} {"train_loss": -8.75744342803955, "global_step": 68370, "epoch": 406} {"train_loss": -8.722464561462402, "global_step": 68371, "epoch": 406} {"train_loss": -9.07682991027832, "global_step": 68372, "epoch": 406} {"train_loss": -8.833958625793457, "global_step": 68373, "epoch": 406} {"train_loss": -8.962854385375977, "global_step": 68374, "epoch": 406} {"train_loss": -8.843065539995829, "global_step": 68375, "epoch": 406, "val_loss": 193499.65625} {"train_loss": -8.817280769348145, "global_step": 68376, "epoch": 407} {"train_loss": -9.081857681274414, "global_step": 68377, "epoch": 407} {"train_loss": -9.044652938842773, "global_step": 68378, "epoch": 407} {"train_loss": -8.984883308410645, "global_step": 68379, "epoch": 407} {"train_loss": -8.818033218383789, "global_step": 68380, "epoch": 407} {"train_loss": -9.000994682312012, "global_step": 68381, "epoch": 407} {"train_loss": -8.940045356750488, "global_step": 68382, "epoch": 407} {"train_loss": -8.884733200073242, "global_step": 68383, "epoch": 407} {"train_loss": -8.710004806518555, "global_step": 68384, "epoch": 407} {"train_loss": -9.061924934387207, "global_step": 68385, "epoch": 407} {"train_loss": -8.907414436340332, "global_step": 68386, "epoch": 407} {"train_loss": -9.10037612915039, "global_step": 68387, "epoch": 407} {"train_loss": -8.825807571411133, "global_step": 68388, "epoch": 407} {"train_loss": -8.836926460266113, "global_step": 68389, "epoch": 407} {"train_loss": -8.99034595489502, "global_step": 68390, "epoch": 407} {"train_loss": -9.068719863891602, "global_step": 68391, "epoch": 407} {"train_loss": -9.133056640625, "global_step": 68392, "epoch": 407} {"train_loss": -8.95865249633789, "global_step": 68393, "epoch": 407} {"train_loss": -8.948853492736816, "global_step": 68394, "epoch": 407} {"train_loss": -9.114474296569824, "global_step": 68395, "epoch": 407} {"train_loss": -8.911701202392578, "global_step": 68396, "epoch": 407} {"train_loss": -8.864192962646484, "global_step": 68397, "epoch": 407} {"train_loss": -8.89622688293457, "global_step": 68398, "epoch": 407} {"train_loss": -9.086482048034668, "global_step": 68399, "epoch": 407} {"train_loss": -8.714447975158691, "global_step": 68400, "epoch": 407} {"train_loss": -8.527545928955078, "global_step": 68401, "epoch": 407} {"train_loss": -8.932615280151367, "global_step": 68402, "epoch": 407} {"train_loss": -8.538894653320312, "global_step": 68403, "epoch": 407} {"train_loss": -8.860753059387207, "global_step": 68404, "epoch": 407} {"train_loss": -8.786609649658203, "global_step": 68405, "epoch": 407} {"train_loss": -8.87881851196289, "global_step": 68406, "epoch": 407} {"train_loss": -8.543933868408203, "global_step": 68407, "epoch": 407} {"train_loss": -8.728462219238281, "global_step": 68408, "epoch": 407} {"train_loss": -8.487569808959961, "global_step": 68409, "epoch": 407} {"train_loss": -8.774961471557617, "global_step": 68410, "epoch": 407} {"train_loss": -8.723100662231445, "global_step": 68411, "epoch": 407} {"train_loss": -8.609621047973633, "global_step": 68412, "epoch": 407} {"train_loss": -8.689159393310547, "global_step": 68413, "epoch": 407} {"train_loss": -8.824438095092773, "global_step": 68414, "epoch": 407} {"train_loss": -8.736942291259766, "global_step": 68415, "epoch": 407} {"train_loss": -8.863138198852539, "global_step": 68416, "epoch": 407} {"train_loss": -8.892810821533203, "global_step": 68417, "epoch": 407} {"train_loss": -8.700368881225586, "global_step": 68418, "epoch": 407} {"train_loss": -8.9217529296875, "global_step": 68419, "epoch": 407} {"train_loss": -8.891058921813965, "global_step": 68420, "epoch": 407} {"train_loss": -8.998311996459961, "global_step": 68421, "epoch": 407} {"train_loss": -8.707143783569336, "global_step": 68422, "epoch": 407} {"train_loss": -8.973180770874023, "global_step": 68423, "epoch": 407} {"train_loss": -8.708026885986328, "global_step": 68424, "epoch": 407} {"train_loss": -9.040468215942383, "global_step": 68425, "epoch": 407} {"train_loss": -8.81619644165039, "global_step": 68426, "epoch": 407} {"train_loss": -8.77271842956543, "global_step": 68427, "epoch": 407} {"train_loss": -8.78410530090332, "global_step": 68428, "epoch": 407} {"train_loss": -8.862868309020996, "global_step": 68429, "epoch": 407} {"train_loss": -8.723007202148438, "global_step": 68430, "epoch": 407} {"train_loss": -8.75465202331543, "global_step": 68431, "epoch": 407} {"train_loss": -9.038895606994629, "global_step": 68432, "epoch": 407} {"train_loss": -8.892230987548828, "global_step": 68433, "epoch": 407} {"train_loss": -8.884737014770508, "global_step": 68434, "epoch": 407} {"train_loss": -8.602272033691406, "global_step": 68435, "epoch": 407} {"train_loss": -9.01701545715332, "global_step": 68436, "epoch": 407} {"train_loss": -8.764776229858398, "global_step": 68437, "epoch": 407} {"train_loss": -8.8626708984375, "global_step": 68438, "epoch": 407} {"train_loss": -8.800134658813477, "global_step": 68439, "epoch": 407} {"train_loss": -8.84881591796875, "global_step": 68440, "epoch": 407} {"train_loss": -8.655200004577637, "global_step": 68441, "epoch": 407} {"train_loss": -8.926952362060547, "global_step": 68442, "epoch": 407} {"train_loss": -9.020345687866211, "global_step": 68443, "epoch": 407} {"train_loss": -8.667135238647461, "global_step": 68444, "epoch": 407} {"train_loss": -9.138214111328125, "global_step": 68445, "epoch": 407} {"train_loss": -8.887527465820312, "global_step": 68446, "epoch": 407} {"train_loss": -8.448582649230957, "global_step": 68447, "epoch": 407} {"train_loss": -9.01053237915039, "global_step": 68448, "epoch": 407} {"train_loss": -9.16385555267334, "global_step": 68449, "epoch": 407} {"train_loss": -8.747026443481445, "global_step": 68450, "epoch": 407} {"train_loss": -8.822563171386719, "global_step": 68451, "epoch": 407} {"train_loss": -8.796991348266602, "global_step": 68452, "epoch": 407} {"train_loss": -8.596960067749023, "global_step": 68453, "epoch": 407} {"train_loss": -8.901172637939453, "global_step": 68454, "epoch": 407} {"train_loss": -8.945231437683105, "global_step": 68455, "epoch": 407} {"train_loss": -8.722814559936523, "global_step": 68456, "epoch": 407} {"train_loss": -8.867439270019531, "global_step": 68457, "epoch": 407} {"train_loss": -8.605768203735352, "global_step": 68458, "epoch": 407} {"train_loss": -8.899145126342773, "global_step": 68459, "epoch": 407} {"train_loss": -8.610008239746094, "global_step": 68460, "epoch": 407} {"train_loss": -8.826643943786621, "global_step": 68461, "epoch": 407} {"train_loss": -8.82260513305664, "global_step": 68462, "epoch": 407} {"train_loss": -8.921417236328125, "global_step": 68463, "epoch": 407} {"train_loss": -8.641532897949219, "global_step": 68464, "epoch": 407} {"train_loss": -9.091480255126953, "global_step": 68465, "epoch": 407} {"train_loss": -9.006417274475098, "global_step": 68466, "epoch": 407} {"train_loss": -8.953750610351562, "global_step": 68467, "epoch": 407} {"train_loss": -9.112466812133789, "global_step": 68468, "epoch": 407} {"train_loss": -9.119783401489258, "global_step": 68469, "epoch": 407} {"train_loss": -8.806952476501465, "global_step": 68470, "epoch": 407} {"train_loss": -8.81659984588623, "global_step": 68471, "epoch": 407} {"train_loss": -8.832402229309082, "global_step": 68472, "epoch": 407} {"train_loss": -8.49952507019043, "global_step": 68473, "epoch": 407} {"train_loss": -8.748064994812012, "global_step": 68474, "epoch": 407} {"train_loss": -8.342203140258789, "global_step": 68475, "epoch": 407} {"train_loss": -8.846757888793945, "global_step": 68476, "epoch": 407} {"train_loss": -8.490310668945312, "global_step": 68477, "epoch": 407} {"train_loss": -8.768563270568848, "global_step": 68478, "epoch": 407} {"train_loss": -8.392906188964844, "global_step": 68479, "epoch": 407} {"train_loss": -8.519133567810059, "global_step": 68480, "epoch": 407} {"train_loss": -8.815516471862793, "global_step": 68481, "epoch": 407} {"train_loss": -8.652408599853516, "global_step": 68482, "epoch": 407} {"train_loss": -8.740240097045898, "global_step": 68483, "epoch": 407} {"train_loss": -8.929779052734375, "global_step": 68484, "epoch": 407} {"train_loss": -8.967782020568848, "global_step": 68485, "epoch": 407} {"train_loss": -8.754554748535156, "global_step": 68486, "epoch": 407} {"train_loss": -9.020488739013672, "global_step": 68487, "epoch": 407} {"train_loss": -8.874383926391602, "global_step": 68488, "epoch": 407} {"train_loss": -9.025434494018555, "global_step": 68489, "epoch": 407} {"train_loss": -8.706646919250488, "global_step": 68490, "epoch": 407} {"train_loss": -8.913270950317383, "global_step": 68491, "epoch": 407} {"train_loss": -8.987199783325195, "global_step": 68492, "epoch": 407} {"train_loss": -8.950115203857422, "global_step": 68493, "epoch": 407} {"train_loss": -9.073890686035156, "global_step": 68494, "epoch": 407} {"train_loss": -8.966226577758789, "global_step": 68495, "epoch": 407} {"train_loss": -8.925716400146484, "global_step": 68496, "epoch": 407} {"train_loss": -8.789544105529785, "global_step": 68497, "epoch": 407} {"train_loss": -9.165151596069336, "global_step": 68498, "epoch": 407} {"train_loss": -9.15553092956543, "global_step": 68499, "epoch": 407} {"train_loss": -9.130377769470215, "global_step": 68500, "epoch": 407} {"train_loss": -8.81921672821045, "global_step": 68501, "epoch": 407} {"train_loss": -9.10847282409668, "global_step": 68502, "epoch": 407} {"train_loss": -9.098054885864258, "global_step": 68503, "epoch": 407} {"train_loss": -9.108494758605957, "global_step": 68504, "epoch": 407} {"train_loss": -8.978654861450195, "global_step": 68505, "epoch": 407} {"train_loss": -8.586926460266113, "global_step": 68506, "epoch": 407} {"train_loss": -9.059349060058594, "global_step": 68507, "epoch": 407} {"train_loss": -8.98057746887207, "global_step": 68508, "epoch": 407} {"train_loss": -8.740151405334473, "global_step": 68509, "epoch": 407} {"train_loss": -8.9871826171875, "global_step": 68510, "epoch": 407} {"train_loss": -8.858051300048828, "global_step": 68511, "epoch": 407} {"train_loss": -8.83082389831543, "global_step": 68512, "epoch": 407} {"train_loss": -8.855944633483887, "global_step": 68513, "epoch": 407} {"train_loss": -8.90876579284668, "global_step": 68514, "epoch": 407} {"train_loss": -8.950748443603516, "global_step": 68515, "epoch": 407} {"train_loss": -9.21660327911377, "global_step": 68516, "epoch": 407} {"train_loss": -8.739730834960938, "global_step": 68517, "epoch": 407} {"train_loss": -8.97983169555664, "global_step": 68518, "epoch": 407} {"train_loss": -8.832273483276367, "global_step": 68519, "epoch": 407} {"train_loss": -8.902273178100586, "global_step": 68520, "epoch": 407} {"train_loss": -8.911197662353516, "global_step": 68521, "epoch": 407} {"train_loss": -8.801979064941406, "global_step": 68522, "epoch": 407} {"train_loss": -8.767757415771484, "global_step": 68523, "epoch": 407} {"train_loss": -8.928382873535156, "global_step": 68524, "epoch": 407} {"train_loss": -8.965262413024902, "global_step": 68525, "epoch": 407} {"train_loss": -8.859149932861328, "global_step": 68526, "epoch": 407} {"train_loss": -8.87996768951416, "global_step": 68527, "epoch": 407} {"train_loss": -8.772801399230957, "global_step": 68528, "epoch": 407} {"train_loss": -9.05876350402832, "global_step": 68529, "epoch": 407} {"train_loss": -8.639572143554688, "global_step": 68530, "epoch": 407} {"train_loss": -8.84781551361084, "global_step": 68531, "epoch": 407} {"train_loss": -8.769506454467773, "global_step": 68532, "epoch": 407} {"train_loss": -8.682958602905273, "global_step": 68533, "epoch": 407} {"train_loss": -8.73996639251709, "global_step": 68534, "epoch": 407} {"train_loss": -8.853446960449219, "global_step": 68535, "epoch": 407} {"train_loss": -8.780223846435547, "global_step": 68536, "epoch": 407} {"train_loss": -8.597251892089844, "global_step": 68537, "epoch": 407} {"train_loss": -8.917073249816895, "global_step": 68538, "epoch": 407} {"train_loss": -8.735137939453125, "global_step": 68539, "epoch": 407} {"train_loss": -8.395605087280273, "global_step": 68540, "epoch": 407} {"train_loss": -8.637840270996094, "global_step": 68541, "epoch": 407} {"train_loss": -8.897733688354492, "global_step": 68542, "epoch": 407} {"train_loss": -8.849415506635394, "global_step": 68543, "epoch": 407, "val_loss": 190747.453125} {"train_loss": -8.558698654174805, "global_step": 68544, "epoch": 408} {"train_loss": -8.958061218261719, "global_step": 68545, "epoch": 408} {"train_loss": -8.646648406982422, "global_step": 68546, "epoch": 408} {"train_loss": -8.808099746704102, "global_step": 68547, "epoch": 408} {"train_loss": -8.905531883239746, "global_step": 68548, "epoch": 408} {"train_loss": -8.904012680053711, "global_step": 68549, "epoch": 408} {"train_loss": -8.90281867980957, "global_step": 68550, "epoch": 408} {"train_loss": -8.707474708557129, "global_step": 68551, "epoch": 408} {"train_loss": -8.942116737365723, "global_step": 68552, "epoch": 408} {"train_loss": -8.961980819702148, "global_step": 68553, "epoch": 408} {"train_loss": -8.888992309570312, "global_step": 68554, "epoch": 408} {"train_loss": -8.897689819335938, "global_step": 68555, "epoch": 408} {"train_loss": -9.096158027648926, "global_step": 68556, "epoch": 408} {"train_loss": -8.961261749267578, "global_step": 68557, "epoch": 408} {"train_loss": -8.923967361450195, "global_step": 68558, "epoch": 408} {"train_loss": -9.080172538757324, "global_step": 68559, "epoch": 408} {"train_loss": -8.866850852966309, "global_step": 68560, "epoch": 408} {"train_loss": -9.173205375671387, "global_step": 68561, "epoch": 408} {"train_loss": -9.064599990844727, "global_step": 68562, "epoch": 408} {"train_loss": -9.117719650268555, "global_step": 68563, "epoch": 408} {"train_loss": -9.096574783325195, "global_step": 68564, "epoch": 408} {"train_loss": -9.152709007263184, "global_step": 68565, "epoch": 408} {"train_loss": -9.113019943237305, "global_step": 68566, "epoch": 408} {"train_loss": -9.153725624084473, "global_step": 68567, "epoch": 408} {"train_loss": -9.038919448852539, "global_step": 68568, "epoch": 408} {"train_loss": -9.155121803283691, "global_step": 68569, "epoch": 408} {"train_loss": -9.178728103637695, "global_step": 68570, "epoch": 408} {"train_loss": -8.963152885437012, "global_step": 68571, "epoch": 408} {"train_loss": -8.790059089660645, "global_step": 68572, "epoch": 408} {"train_loss": -9.201422691345215, "global_step": 68573, "epoch": 408} {"train_loss": -8.895431518554688, "global_step": 68574, "epoch": 408} {"train_loss": -9.035064697265625, "global_step": 68575, "epoch": 408} {"train_loss": -8.888614654541016, "global_step": 68576, "epoch": 408} {"train_loss": -8.921260833740234, "global_step": 68577, "epoch": 408} {"train_loss": -8.930450439453125, "global_step": 68578, "epoch": 408} {"train_loss": -8.799092292785645, "global_step": 68579, "epoch": 408} {"train_loss": -9.035171508789062, "global_step": 68580, "epoch": 408} {"train_loss": -8.980905532836914, "global_step": 68581, "epoch": 408} {"train_loss": -8.959000587463379, "global_step": 68582, "epoch": 408} {"train_loss": -9.038839340209961, "global_step": 68583, "epoch": 408} {"train_loss": -8.692336082458496, "global_step": 68584, "epoch": 408} {"train_loss": -8.96103286743164, "global_step": 68585, "epoch": 408} {"train_loss": -8.91615104675293, "global_step": 68586, "epoch": 408} {"train_loss": -8.901552200317383, "global_step": 68587, "epoch": 408} {"train_loss": -8.6425199508667, "global_step": 68588, "epoch": 408} {"train_loss": -8.961179733276367, "global_step": 68589, "epoch": 408} {"train_loss": -8.813026428222656, "global_step": 68590, "epoch": 408} {"train_loss": -8.89689826965332, "global_step": 68591, "epoch": 408} {"train_loss": -8.954456329345703, "global_step": 68592, "epoch": 408} {"train_loss": -8.962471008300781, "global_step": 68593, "epoch": 408} {"train_loss": -8.495498657226562, "global_step": 68594, "epoch": 408} {"train_loss": -9.051128387451172, "global_step": 68595, "epoch": 408} {"train_loss": -9.103593826293945, "global_step": 68596, "epoch": 408} {"train_loss": -8.785454750061035, "global_step": 68597, "epoch": 408} {"train_loss": -8.77463150024414, "global_step": 68598, "epoch": 408} {"train_loss": -9.048315048217773, "global_step": 68599, "epoch": 408} {"train_loss": -8.926703453063965, "global_step": 68600, "epoch": 408} {"train_loss": -8.603584289550781, "global_step": 68601, "epoch": 408} {"train_loss": -9.107823371887207, "global_step": 68602, "epoch": 408} {"train_loss": -8.751062393188477, "global_step": 68603, "epoch": 408} {"train_loss": -8.971485137939453, "global_step": 68604, "epoch": 408} {"train_loss": -8.977062225341797, "global_step": 68605, "epoch": 408} {"train_loss": -8.884666442871094, "global_step": 68606, "epoch": 408} {"train_loss": -8.860535621643066, "global_step": 68607, "epoch": 408} {"train_loss": -8.890942573547363, "global_step": 68608, "epoch": 408} {"train_loss": -8.918007850646973, "global_step": 68609, "epoch": 408} {"train_loss": -8.747011184692383, "global_step": 68610, "epoch": 408} {"train_loss": -9.06888484954834, "global_step": 68611, "epoch": 408} {"train_loss": -8.90577220916748, "global_step": 68612, "epoch": 408} {"train_loss": -9.039772033691406, "global_step": 68613, "epoch": 408} {"train_loss": -8.922890663146973, "global_step": 68614, "epoch": 408} {"train_loss": -8.941011428833008, "global_step": 68615, "epoch": 408} {"train_loss": -8.930658340454102, "global_step": 68616, "epoch": 408} {"train_loss": -9.032057762145996, "global_step": 68617, "epoch": 408} {"train_loss": -9.133371353149414, "global_step": 68618, "epoch": 408} {"train_loss": -9.08896541595459, "global_step": 68619, "epoch": 408} {"train_loss": -9.050529479980469, "global_step": 68620, "epoch": 408} {"train_loss": -9.0714111328125, "global_step": 68621, "epoch": 408} {"train_loss": -8.941198348999023, "global_step": 68622, "epoch": 408} {"train_loss": -8.749273300170898, "global_step": 68623, "epoch": 408} {"train_loss": -8.916457176208496, "global_step": 68624, "epoch": 408} {"train_loss": -9.006271362304688, "global_step": 68625, "epoch": 408} {"train_loss": -9.087560653686523, "global_step": 68626, "epoch": 408} {"train_loss": -8.467514991760254, "global_step": 68627, "epoch": 408} {"train_loss": -8.587648391723633, "global_step": 68628, "epoch": 408} {"train_loss": -8.876312255859375, "global_step": 68629, "epoch": 408} {"train_loss": -8.403240203857422, "global_step": 68630, "epoch": 408} {"train_loss": -9.113862037658691, "global_step": 68631, "epoch": 408} {"train_loss": -8.67631721496582, "global_step": 68632, "epoch": 408} {"train_loss": -9.19788646697998, "global_step": 68633, "epoch": 408} {"train_loss": -8.78245735168457, "global_step": 68634, "epoch": 408} {"train_loss": -8.892706871032715, "global_step": 68635, "epoch": 408} {"train_loss": -8.764226913452148, "global_step": 68636, "epoch": 408} {"train_loss": -8.752922058105469, "global_step": 68637, "epoch": 408} {"train_loss": -8.844892501831055, "global_step": 68638, "epoch": 408} {"train_loss": -8.706284523010254, "global_step": 68639, "epoch": 408} {"train_loss": -8.794275283813477, "global_step": 68640, "epoch": 408} {"train_loss": -8.549896240234375, "global_step": 68641, "epoch": 408} {"train_loss": -8.793232917785645, "global_step": 68642, "epoch": 408} {"train_loss": -8.70231819152832, "global_step": 68643, "epoch": 408} {"train_loss": -8.690467834472656, "global_step": 68644, "epoch": 408} {"train_loss": -8.754192352294922, "global_step": 68645, "epoch": 408} {"train_loss": -8.179118156433105, "global_step": 68646, "epoch": 408} {"train_loss": -8.935373306274414, "global_step": 68647, "epoch": 408} {"train_loss": -8.546808242797852, "global_step": 68648, "epoch": 408} {"train_loss": -8.652103424072266, "global_step": 68649, "epoch": 408} {"train_loss": -8.866174697875977, "global_step": 68650, "epoch": 408} {"train_loss": -8.755878448486328, "global_step": 68651, "epoch": 408} {"train_loss": -8.738344192504883, "global_step": 68652, "epoch": 408} {"train_loss": -9.028112411499023, "global_step": 68653, "epoch": 408} {"train_loss": -8.770942687988281, "global_step": 68654, "epoch": 408} {"train_loss": -8.95761775970459, "global_step": 68655, "epoch": 408} {"train_loss": -8.725075721740723, "global_step": 68656, "epoch": 408} {"train_loss": -9.189417839050293, "global_step": 68657, "epoch": 408} {"train_loss": -8.665782928466797, "global_step": 68658, "epoch": 408} {"train_loss": -8.798617362976074, "global_step": 68659, "epoch": 408} {"train_loss": -8.652847290039062, "global_step": 68660, "epoch": 408} {"train_loss": -8.719181060791016, "global_step": 68661, "epoch": 408} {"train_loss": -9.157605171203613, "global_step": 68662, "epoch": 408} {"train_loss": -9.083574295043945, "global_step": 68663, "epoch": 408} {"train_loss": -8.786949157714844, "global_step": 68664, "epoch": 408} {"train_loss": -8.5328950881958, "global_step": 68665, "epoch": 408} {"train_loss": -9.212164878845215, "global_step": 68666, "epoch": 408} {"train_loss": -8.746831893920898, "global_step": 68667, "epoch": 408} {"train_loss": -8.870597839355469, "global_step": 68668, "epoch": 408} {"train_loss": -8.744173049926758, "global_step": 68669, "epoch": 408} {"train_loss": -8.927433967590332, "global_step": 68670, "epoch": 408} {"train_loss": -8.680013656616211, "global_step": 68671, "epoch": 408} {"train_loss": -9.061356544494629, "global_step": 68672, "epoch": 408} {"train_loss": -8.734304428100586, "global_step": 68673, "epoch": 408} {"train_loss": -8.878421783447266, "global_step": 68674, "epoch": 408} {"train_loss": -8.501805305480957, "global_step": 68675, "epoch": 408} {"train_loss": -8.848289489746094, "global_step": 68676, "epoch": 408} {"train_loss": -8.773185729980469, "global_step": 68677, "epoch": 408} {"train_loss": -8.811647415161133, "global_step": 68678, "epoch": 408} {"train_loss": -8.756214141845703, "global_step": 68679, "epoch": 408} {"train_loss": -8.625532150268555, "global_step": 68680, "epoch": 408} {"train_loss": -8.937259674072266, "global_step": 68681, "epoch": 408} {"train_loss": -8.650917053222656, "global_step": 68682, "epoch": 408} {"train_loss": -8.598358154296875, "global_step": 68683, "epoch": 408} {"train_loss": -8.765094757080078, "global_step": 68684, "epoch": 408} {"train_loss": -8.625419616699219, "global_step": 68685, "epoch": 408} {"train_loss": -8.578166961669922, "global_step": 68686, "epoch": 408} {"train_loss": -8.366305351257324, "global_step": 68687, "epoch": 408} {"train_loss": -8.847530364990234, "global_step": 68688, "epoch": 408} {"train_loss": -8.324747085571289, "global_step": 68689, "epoch": 408} {"train_loss": -8.564237594604492, "global_step": 68690, "epoch": 408} {"train_loss": -8.743703842163086, "global_step": 68691, "epoch": 408} {"train_loss": -8.657100677490234, "global_step": 68692, "epoch": 408} {"train_loss": -8.993537902832031, "global_step": 68693, "epoch": 408} {"train_loss": -8.862335205078125, "global_step": 68694, "epoch": 408} {"train_loss": -8.761529922485352, "global_step": 68695, "epoch": 408} {"train_loss": -8.724191665649414, "global_step": 68696, "epoch": 408} {"train_loss": -8.798677444458008, "global_step": 68697, "epoch": 408} {"train_loss": -8.908224105834961, "global_step": 68698, "epoch": 408} {"train_loss": -8.804141998291016, "global_step": 68699, "epoch": 408} {"train_loss": -9.010709762573242, "global_step": 68700, "epoch": 408} {"train_loss": -8.968097686767578, "global_step": 68701, "epoch": 408} {"train_loss": -9.013715744018555, "global_step": 68702, "epoch": 408} {"train_loss": -8.925516128540039, "global_step": 68703, "epoch": 408} {"train_loss": -8.927347183227539, "global_step": 68704, "epoch": 408} {"train_loss": -8.761762619018555, "global_step": 68705, "epoch": 408} {"train_loss": -9.090255737304688, "global_step": 68706, "epoch": 408} {"train_loss": -8.7935209274292, "global_step": 68707, "epoch": 408} {"train_loss": -9.032153129577637, "global_step": 68708, "epoch": 408} {"train_loss": -8.875945091247559, "global_step": 68709, "epoch": 408} {"train_loss": -8.940054893493652, "global_step": 68710, "epoch": 408} {"train_loss": -8.86173963546753, "global_step": 68711, "epoch": 408, "val_loss": 191734.3125} {"train_loss": -8.500686645507812, "global_step": 68712, "epoch": 409} {"train_loss": -8.831733703613281, "global_step": 68713, "epoch": 409} {"train_loss": -8.652935028076172, "global_step": 68714, "epoch": 409} {"train_loss": -8.707636833190918, "global_step": 68715, "epoch": 409} {"train_loss": -8.440345764160156, "global_step": 68716, "epoch": 409} {"train_loss": -8.462468147277832, "global_step": 68717, "epoch": 409} {"train_loss": -8.566709518432617, "global_step": 68718, "epoch": 409} {"train_loss": -8.594866752624512, "global_step": 68719, "epoch": 409} {"train_loss": -8.716450691223145, "global_step": 68720, "epoch": 409} {"train_loss": -8.709478378295898, "global_step": 68721, "epoch": 409} {"train_loss": -8.83993148803711, "global_step": 68722, "epoch": 409} {"train_loss": -8.714655876159668, "global_step": 68723, "epoch": 409} {"train_loss": -8.913233757019043, "global_step": 68724, "epoch": 409} {"train_loss": -8.460240364074707, "global_step": 68725, "epoch": 409} {"train_loss": -8.984842300415039, "global_step": 68726, "epoch": 409} {"train_loss": -8.630193710327148, "global_step": 68727, "epoch": 409} {"train_loss": -8.724891662597656, "global_step": 68728, "epoch": 409} {"train_loss": -8.755932807922363, "global_step": 68729, "epoch": 409} {"train_loss": -8.65568733215332, "global_step": 68730, "epoch": 409} {"train_loss": -8.810044288635254, "global_step": 68731, "epoch": 409} {"train_loss": -8.820792198181152, "global_step": 68732, "epoch": 409} {"train_loss": -8.749299049377441, "global_step": 68733, "epoch": 409} {"train_loss": -9.024727821350098, "global_step": 68734, "epoch": 409} {"train_loss": -8.878634452819824, "global_step": 68735, "epoch": 409} {"train_loss": -9.015661239624023, "global_step": 68736, "epoch": 409} {"train_loss": -8.953420639038086, "global_step": 68737, "epoch": 409} {"train_loss": -8.833824157714844, "global_step": 68738, "epoch": 409} {"train_loss": -9.075754165649414, "global_step": 68739, "epoch": 409} {"train_loss": -8.80289077758789, "global_step": 68740, "epoch": 409} {"train_loss": -8.741304397583008, "global_step": 68741, "epoch": 409} {"train_loss": -9.018854141235352, "global_step": 68742, "epoch": 409} {"train_loss": -8.418498039245605, "global_step": 68743, "epoch": 409} {"train_loss": -8.96034049987793, "global_step": 68744, "epoch": 409} {"train_loss": -8.65176010131836, "global_step": 68745, "epoch": 409} {"train_loss": -8.951587677001953, "global_step": 68746, "epoch": 409} {"train_loss": -8.995960235595703, "global_step": 68747, "epoch": 409} {"train_loss": -8.82741928100586, "global_step": 68748, "epoch": 409} {"train_loss": -8.823396682739258, "global_step": 68749, "epoch": 409} {"train_loss": -8.600316047668457, "global_step": 68750, "epoch": 409} {"train_loss": -8.874736785888672, "global_step": 68751, "epoch": 409} {"train_loss": -9.038476943969727, "global_step": 68752, "epoch": 409} {"train_loss": -8.791097640991211, "global_step": 68753, "epoch": 409} {"train_loss": -8.67887020111084, "global_step": 68754, "epoch": 409} {"train_loss": -9.068740844726562, "global_step": 68755, "epoch": 409} {"train_loss": -8.633264541625977, "global_step": 68756, "epoch": 409} {"train_loss": -8.735427856445312, "global_step": 68757, "epoch": 409} {"train_loss": -9.153861045837402, "global_step": 68758, "epoch": 409} {"train_loss": -8.650110244750977, "global_step": 68759, "epoch": 409} {"train_loss": -9.116084098815918, "global_step": 68760, "epoch": 409} {"train_loss": -9.015026092529297, "global_step": 68761, "epoch": 409} {"train_loss": -8.965958595275879, "global_step": 68762, "epoch": 409} {"train_loss": -8.876532554626465, "global_step": 68763, "epoch": 409} {"train_loss": -8.942176818847656, "global_step": 68764, "epoch": 409} {"train_loss": -9.005149841308594, "global_step": 68765, "epoch": 409} {"train_loss": -9.051751136779785, "global_step": 68766, "epoch": 409} {"train_loss": -9.091043472290039, "global_step": 68767, "epoch": 409} {"train_loss": -9.029817581176758, "global_step": 68768, "epoch": 409} {"train_loss": -9.01445484161377, "global_step": 68769, "epoch": 409} {"train_loss": -9.107840538024902, "global_step": 68770, "epoch": 409} {"train_loss": -9.21129035949707, "global_step": 68771, "epoch": 409} {"train_loss": -8.854676246643066, "global_step": 68772, "epoch": 409} {"train_loss": -9.122915267944336, "global_step": 68773, "epoch": 409} {"train_loss": -8.999478340148926, "global_step": 68774, "epoch": 409} {"train_loss": -9.083243370056152, "global_step": 68775, "epoch": 409} {"train_loss": -9.026359558105469, "global_step": 68776, "epoch": 409} {"train_loss": -9.035980224609375, "global_step": 68777, "epoch": 409} {"train_loss": -9.040250778198242, "global_step": 68778, "epoch": 409} {"train_loss": -9.110227584838867, "global_step": 68779, "epoch": 409} {"train_loss": -9.061700820922852, "global_step": 68780, "epoch": 409} {"train_loss": -8.955392837524414, "global_step": 68781, "epoch": 409} {"train_loss": -9.207460403442383, "global_step": 68782, "epoch": 409} {"train_loss": -8.894733428955078, "global_step": 68783, "epoch": 409} {"train_loss": -9.22307300567627, "global_step": 68784, "epoch": 409} {"train_loss": -8.85891342163086, "global_step": 68785, "epoch": 409} {"train_loss": -8.949296951293945, "global_step": 68786, "epoch": 409} {"train_loss": -9.055587768554688, "global_step": 68787, "epoch": 409} {"train_loss": -8.80659294128418, "global_step": 68788, "epoch": 409} {"train_loss": -8.94578742980957, "global_step": 68789, "epoch": 409} {"train_loss": -8.7172269821167, "global_step": 68790, "epoch": 409} {"train_loss": -8.849029541015625, "global_step": 68791, "epoch": 409} {"train_loss": -8.751127243041992, "global_step": 68792, "epoch": 409} {"train_loss": -8.88831901550293, "global_step": 68793, "epoch": 409} {"train_loss": -8.883426666259766, "global_step": 68794, "epoch": 409} {"train_loss": -8.815832138061523, "global_step": 68795, "epoch": 409} {"train_loss": -8.76877498626709, "global_step": 68796, "epoch": 409} {"train_loss": -8.964853286743164, "global_step": 68797, "epoch": 409} {"train_loss": -8.788797378540039, "global_step": 68798, "epoch": 409} {"train_loss": -8.740188598632812, "global_step": 68799, "epoch": 409} {"train_loss": -8.66545581817627, "global_step": 68800, "epoch": 409} {"train_loss": -8.744734764099121, "global_step": 68801, "epoch": 409} {"train_loss": -8.465456008911133, "global_step": 68802, "epoch": 409} {"train_loss": -8.718982696533203, "global_step": 68803, "epoch": 409} {"train_loss": -8.737340927124023, "global_step": 68804, "epoch": 409} {"train_loss": -8.793789863586426, "global_step": 68805, "epoch": 409} {"train_loss": -8.938953399658203, "global_step": 68806, "epoch": 409} {"train_loss": -8.780656814575195, "global_step": 68807, "epoch": 409} {"train_loss": -9.078790664672852, "global_step": 68808, "epoch": 409} {"train_loss": -8.752057075500488, "global_step": 68809, "epoch": 409} {"train_loss": -8.970653533935547, "global_step": 68810, "epoch": 409} {"train_loss": -8.784936904907227, "global_step": 68811, "epoch": 409} {"train_loss": -8.715473175048828, "global_step": 68812, "epoch": 409} {"train_loss": -8.96689510345459, "global_step": 68813, "epoch": 409} {"train_loss": -8.601628303527832, "global_step": 68814, "epoch": 409} {"train_loss": -8.849945068359375, "global_step": 68815, "epoch": 409} {"train_loss": -8.969417572021484, "global_step": 68816, "epoch": 409} {"train_loss": -9.008056640625, "global_step": 68817, "epoch": 409} {"train_loss": -8.819586753845215, "global_step": 68818, "epoch": 409} {"train_loss": -9.041946411132812, "global_step": 68819, "epoch": 409} {"train_loss": -8.891182899475098, "global_step": 68820, "epoch": 409} {"train_loss": -9.037251472473145, "global_step": 68821, "epoch": 409} {"train_loss": -8.867122650146484, "global_step": 68822, "epoch": 409} {"train_loss": -9.090324401855469, "global_step": 68823, "epoch": 409} {"train_loss": -8.918710708618164, "global_step": 68824, "epoch": 409} {"train_loss": -9.192337036132812, "global_step": 68825, "epoch": 409} {"train_loss": -9.058462142944336, "global_step": 68826, "epoch": 409} {"train_loss": -9.160751342773438, "global_step": 68827, "epoch": 409} {"train_loss": -8.849071502685547, "global_step": 68828, "epoch": 409} {"train_loss": -8.856224060058594, "global_step": 68829, "epoch": 409} {"train_loss": -9.155139923095703, "global_step": 68830, "epoch": 409} {"train_loss": -9.000871658325195, "global_step": 68831, "epoch": 409} {"train_loss": -9.152227401733398, "global_step": 68832, "epoch": 409} {"train_loss": -8.767906188964844, "global_step": 68833, "epoch": 409} {"train_loss": -9.264766693115234, "global_step": 68834, "epoch": 409} {"train_loss": -9.104972839355469, "global_step": 68835, "epoch": 409} {"train_loss": -8.599760055541992, "global_step": 68836, "epoch": 409} {"train_loss": -9.125923156738281, "global_step": 68837, "epoch": 409} {"train_loss": -8.865923881530762, "global_step": 68838, "epoch": 409} {"train_loss": -8.98585319519043, "global_step": 68839, "epoch": 409} {"train_loss": -9.055959701538086, "global_step": 68840, "epoch": 409} {"train_loss": -9.01239013671875, "global_step": 68841, "epoch": 409} {"train_loss": -8.502549171447754, "global_step": 68842, "epoch": 409} {"train_loss": -8.907476425170898, "global_step": 68843, "epoch": 409} {"train_loss": -8.548564910888672, "global_step": 68844, "epoch": 409} {"train_loss": -8.782027244567871, "global_step": 68845, "epoch": 409} {"train_loss": -9.014139175415039, "global_step": 68846, "epoch": 409} {"train_loss": -8.966972351074219, "global_step": 68847, "epoch": 409} {"train_loss": -8.936366081237793, "global_step": 68848, "epoch": 409} {"train_loss": -8.870543479919434, "global_step": 68849, "epoch": 409} {"train_loss": -8.827014923095703, "global_step": 68850, "epoch": 409} {"train_loss": -8.71432876586914, "global_step": 68851, "epoch": 409} {"train_loss": -9.004026412963867, "global_step": 68852, "epoch": 409} {"train_loss": -8.979355812072754, "global_step": 68853, "epoch": 409} {"train_loss": -8.877395629882812, "global_step": 68854, "epoch": 409} {"train_loss": -9.051868438720703, "global_step": 68855, "epoch": 409} {"train_loss": -9.020721435546875, "global_step": 68856, "epoch": 409} {"train_loss": -8.953084945678711, "global_step": 68857, "epoch": 409} {"train_loss": -8.915987014770508, "global_step": 68858, "epoch": 409} {"train_loss": -8.791862487792969, "global_step": 68859, "epoch": 409} {"train_loss": -8.763925552368164, "global_step": 68860, "epoch": 409} {"train_loss": -8.7960786819458, "global_step": 68861, "epoch": 409} {"train_loss": -8.686593055725098, "global_step": 68862, "epoch": 409} {"train_loss": -8.805936813354492, "global_step": 68863, "epoch": 409} {"train_loss": -8.943410873413086, "global_step": 68864, "epoch": 409} {"train_loss": -8.764134407043457, "global_step": 68865, "epoch": 409} {"train_loss": -9.165472030639648, "global_step": 68866, "epoch": 409} {"train_loss": -8.915653228759766, "global_step": 68867, "epoch": 409} {"train_loss": -8.701187133789062, "global_step": 68868, "epoch": 409} {"train_loss": -8.927499771118164, "global_step": 68869, "epoch": 409} {"train_loss": -9.041467666625977, "global_step": 68870, "epoch": 409} {"train_loss": -9.060165405273438, "global_step": 68871, "epoch": 409} {"train_loss": -8.925848007202148, "global_step": 68872, "epoch": 409} {"train_loss": -9.066767692565918, "global_step": 68873, "epoch": 409} {"train_loss": -8.731054306030273, "global_step": 68874, "epoch": 409} {"train_loss": -8.948168754577637, "global_step": 68875, "epoch": 409} {"train_loss": -9.151443481445312, "global_step": 68876, "epoch": 409} {"train_loss": -9.058931350708008, "global_step": 68877, "epoch": 409} {"train_loss": -8.898582458496094, "global_step": 68878, "epoch": 409} {"train_loss": -8.884248296419779, "global_step": 68879, "epoch": 409, "val_loss": 192479.296875} {"train_loss": -8.994403839111328, "global_step": 68880, "epoch": 410} {"train_loss": -8.969525337219238, "global_step": 68881, "epoch": 410} {"train_loss": -8.868982315063477, "global_step": 68882, "epoch": 410} {"train_loss": -9.206256866455078, "global_step": 68883, "epoch": 410} {"train_loss": -8.981836318969727, "global_step": 68884, "epoch": 410} {"train_loss": -8.89234733581543, "global_step": 68885, "epoch": 410} {"train_loss": -8.93680191040039, "global_step": 68886, "epoch": 410} {"train_loss": -8.845121383666992, "global_step": 68887, "epoch": 410} {"train_loss": -9.117874145507812, "global_step": 68888, "epoch": 410} {"train_loss": -9.02304744720459, "global_step": 68889, "epoch": 410} {"train_loss": -8.811683654785156, "global_step": 68890, "epoch": 410} {"train_loss": -8.815499305725098, "global_step": 68891, "epoch": 410} {"train_loss": -8.898853302001953, "global_step": 68892, "epoch": 410} {"train_loss": -8.63730525970459, "global_step": 68893, "epoch": 410} {"train_loss": -8.95161247253418, "global_step": 68894, "epoch": 410} {"train_loss": -8.408244132995605, "global_step": 68895, "epoch": 410} {"train_loss": -8.769274711608887, "global_step": 68896, "epoch": 410} {"train_loss": -8.620575904846191, "global_step": 68897, "epoch": 410} {"train_loss": -8.899992942810059, "global_step": 68898, "epoch": 410} {"train_loss": -8.68233871459961, "global_step": 68899, "epoch": 410} {"train_loss": -8.781230926513672, "global_step": 68900, "epoch": 410} {"train_loss": -8.69621467590332, "global_step": 68901, "epoch": 410} {"train_loss": -8.81309700012207, "global_step": 68902, "epoch": 410} {"train_loss": -8.665060997009277, "global_step": 68903, "epoch": 410} {"train_loss": -8.565495491027832, "global_step": 68904, "epoch": 410} {"train_loss": -8.579828262329102, "global_step": 68905, "epoch": 410} {"train_loss": -8.504003524780273, "global_step": 68906, "epoch": 410} {"train_loss": -8.702596664428711, "global_step": 68907, "epoch": 410} {"train_loss": -8.642032623291016, "global_step": 68908, "epoch": 410} {"train_loss": -8.676921844482422, "global_step": 68909, "epoch": 410} {"train_loss": -8.572063446044922, "global_step": 68910, "epoch": 410} {"train_loss": -8.594442367553711, "global_step": 68911, "epoch": 410} {"train_loss": -8.729349136352539, "global_step": 68912, "epoch": 410} {"train_loss": -8.853577613830566, "global_step": 68913, "epoch": 410} {"train_loss": -8.697367668151855, "global_step": 68914, "epoch": 410} {"train_loss": -8.742096900939941, "global_step": 68915, "epoch": 410} {"train_loss": -8.569112777709961, "global_step": 68916, "epoch": 410} {"train_loss": -8.841268539428711, "global_step": 68917, "epoch": 410} {"train_loss": -8.633960723876953, "global_step": 68918, "epoch": 410} {"train_loss": -8.762894630432129, "global_step": 68919, "epoch": 410} {"train_loss": -8.641578674316406, "global_step": 68920, "epoch": 410} {"train_loss": -8.571080207824707, "global_step": 68921, "epoch": 410} {"train_loss": -8.82638168334961, "global_step": 68922, "epoch": 410} {"train_loss": -8.845321655273438, "global_step": 68923, "epoch": 410} {"train_loss": -8.710831642150879, "global_step": 68924, "epoch": 410} {"train_loss": -8.678359985351562, "global_step": 68925, "epoch": 410} {"train_loss": -9.058060646057129, "global_step": 68926, "epoch": 410} {"train_loss": -8.949836730957031, "global_step": 68927, "epoch": 410} {"train_loss": -8.735895156860352, "global_step": 68928, "epoch": 410} {"train_loss": -9.038610458374023, "global_step": 68929, "epoch": 410} {"train_loss": -8.78911018371582, "global_step": 68930, "epoch": 410} {"train_loss": -8.697549819946289, "global_step": 68931, "epoch": 410} {"train_loss": -8.823780059814453, "global_step": 68932, "epoch": 410} {"train_loss": -8.873651504516602, "global_step": 68933, "epoch": 410} {"train_loss": -8.789070129394531, "global_step": 68934, "epoch": 410} {"train_loss": -9.004852294921875, "global_step": 68935, "epoch": 410} {"train_loss": -9.200860023498535, "global_step": 68936, "epoch": 410} {"train_loss": -8.763206481933594, "global_step": 68937, "epoch": 410} {"train_loss": -8.85682487487793, "global_step": 68938, "epoch": 410} {"train_loss": -8.54043197631836, "global_step": 68939, "epoch": 410} {"train_loss": -9.064087867736816, "global_step": 68940, "epoch": 410} {"train_loss": -8.78021240234375, "global_step": 68941, "epoch": 410} {"train_loss": -8.619997024536133, "global_step": 68942, "epoch": 410} {"train_loss": -9.220149993896484, "global_step": 68943, "epoch": 410} {"train_loss": -8.72644329071045, "global_step": 68944, "epoch": 410} {"train_loss": -8.942023277282715, "global_step": 68945, "epoch": 410} {"train_loss": -8.894983291625977, "global_step": 68946, "epoch": 410} {"train_loss": -8.763467788696289, "global_step": 68947, "epoch": 410} {"train_loss": -8.760528564453125, "global_step": 68948, "epoch": 410} {"train_loss": -8.970799446105957, "global_step": 68949, "epoch": 410} {"train_loss": -8.754968643188477, "global_step": 68950, "epoch": 410} {"train_loss": -8.662206649780273, "global_step": 68951, "epoch": 410} {"train_loss": -8.838936805725098, "global_step": 68952, "epoch": 410} {"train_loss": -8.663190841674805, "global_step": 68953, "epoch": 410} {"train_loss": -8.523819923400879, "global_step": 68954, "epoch": 410} {"train_loss": -8.733692169189453, "global_step": 68955, "epoch": 410} {"train_loss": -8.698236465454102, "global_step": 68956, "epoch": 410} {"train_loss": -8.836204528808594, "global_step": 68957, "epoch": 410} {"train_loss": -8.80184555053711, "global_step": 68958, "epoch": 410} {"train_loss": -8.728978157043457, "global_step": 68959, "epoch": 410} {"train_loss": -8.909754753112793, "global_step": 68960, "epoch": 410} {"train_loss": -8.777377128601074, "global_step": 68961, "epoch": 410} {"train_loss": -8.946014404296875, "global_step": 68962, "epoch": 410} {"train_loss": -8.818473815917969, "global_step": 68963, "epoch": 410} {"train_loss": -8.828004837036133, "global_step": 68964, "epoch": 410} {"train_loss": -8.94911003112793, "global_step": 68965, "epoch": 410} {"train_loss": -8.843027114868164, "global_step": 68966, "epoch": 410} {"train_loss": -9.052395820617676, "global_step": 68967, "epoch": 410} {"train_loss": -8.933514595031738, "global_step": 68968, "epoch": 410} {"train_loss": -8.88748550415039, "global_step": 68969, "epoch": 410} {"train_loss": -8.789376258850098, "global_step": 68970, "epoch": 410} {"train_loss": -8.880844116210938, "global_step": 68971, "epoch": 410} {"train_loss": -8.813490867614746, "global_step": 68972, "epoch": 410} {"train_loss": -9.119819641113281, "global_step": 68973, "epoch": 410} {"train_loss": -8.717547416687012, "global_step": 68974, "epoch": 410} {"train_loss": -8.99412727355957, "global_step": 68975, "epoch": 410} {"train_loss": -8.9325532913208, "global_step": 68976, "epoch": 410} {"train_loss": -8.83372688293457, "global_step": 68977, "epoch": 410} {"train_loss": -8.985441207885742, "global_step": 68978, "epoch": 410} {"train_loss": -9.063562393188477, "global_step": 68979, "epoch": 410} {"train_loss": -8.954660415649414, "global_step": 68980, "epoch": 410} {"train_loss": -8.69942569732666, "global_step": 68981, "epoch": 410} {"train_loss": -8.806679725646973, "global_step": 68982, "epoch": 410} {"train_loss": -8.777579307556152, "global_step": 68983, "epoch": 410} {"train_loss": -8.692544937133789, "global_step": 68984, "epoch": 410} {"train_loss": -8.694791793823242, "global_step": 68985, "epoch": 410} {"train_loss": -8.502811431884766, "global_step": 68986, "epoch": 410} {"train_loss": -8.501307487487793, "global_step": 68987, "epoch": 410} {"train_loss": -8.447502136230469, "global_step": 68988, "epoch": 410} {"train_loss": -8.706483840942383, "global_step": 68989, "epoch": 410} {"train_loss": -8.930471420288086, "global_step": 68990, "epoch": 410} {"train_loss": -8.835683822631836, "global_step": 68991, "epoch": 410} {"train_loss": -8.958722114562988, "global_step": 68992, "epoch": 410} {"train_loss": -8.74520206451416, "global_step": 68993, "epoch": 410} {"train_loss": -8.847143173217773, "global_step": 68994, "epoch": 410} {"train_loss": -8.782291412353516, "global_step": 68995, "epoch": 410} {"train_loss": -8.79944133758545, "global_step": 68996, "epoch": 410} {"train_loss": -8.72718620300293, "global_step": 68997, "epoch": 410} {"train_loss": -8.714254379272461, "global_step": 68998, "epoch": 410} {"train_loss": -8.437532424926758, "global_step": 68999, "epoch": 410} {"train_loss": -8.929121017456055, "global_step": 69000, "epoch": 410} {"train_loss": -8.628819465637207, "global_step": 69001, "epoch": 410} {"train_loss": -8.784687042236328, "global_step": 69002, "epoch": 410} {"train_loss": -8.729148864746094, "global_step": 69003, "epoch": 410} {"train_loss": -9.019695281982422, "global_step": 69004, "epoch": 410} {"train_loss": -8.72152328491211, "global_step": 69005, "epoch": 410} {"train_loss": -8.906278610229492, "global_step": 69006, "epoch": 410} {"train_loss": -8.939752578735352, "global_step": 69007, "epoch": 410} {"train_loss": -8.90494441986084, "global_step": 69008, "epoch": 410} {"train_loss": -8.759552001953125, "global_step": 69009, "epoch": 410} {"train_loss": -9.108142852783203, "global_step": 69010, "epoch": 410} {"train_loss": -8.923443794250488, "global_step": 69011, "epoch": 410} {"train_loss": -8.887796401977539, "global_step": 69012, "epoch": 410} {"train_loss": -9.1361722946167, "global_step": 69013, "epoch": 410} {"train_loss": -8.813032150268555, "global_step": 69014, "epoch": 410} {"train_loss": -8.976601600646973, "global_step": 69015, "epoch": 410} {"train_loss": -8.989166259765625, "global_step": 69016, "epoch": 410} {"train_loss": -9.162400245666504, "global_step": 69017, "epoch": 410} {"train_loss": -8.926427841186523, "global_step": 69018, "epoch": 410} {"train_loss": -8.923340797424316, "global_step": 69019, "epoch": 410} {"train_loss": -8.985506057739258, "global_step": 69020, "epoch": 410} {"train_loss": -8.712996482849121, "global_step": 69021, "epoch": 410} {"train_loss": -8.820823669433594, "global_step": 69022, "epoch": 410} {"train_loss": -8.975677490234375, "global_step": 69023, "epoch": 410} {"train_loss": -8.957233428955078, "global_step": 69024, "epoch": 410} {"train_loss": -8.696295738220215, "global_step": 69025, "epoch": 410} {"train_loss": -8.829025268554688, "global_step": 69026, "epoch": 410} {"train_loss": -8.495397567749023, "global_step": 69027, "epoch": 410} {"train_loss": -8.91956901550293, "global_step": 69028, "epoch": 410} {"train_loss": -8.393891334533691, "global_step": 69029, "epoch": 410} {"train_loss": -8.804828643798828, "global_step": 69030, "epoch": 410} {"train_loss": -8.394880294799805, "global_step": 69031, "epoch": 410} {"train_loss": -8.837690353393555, "global_step": 69032, "epoch": 410} {"train_loss": -8.552896499633789, "global_step": 69033, "epoch": 410} {"train_loss": -8.8916654586792, "global_step": 69034, "epoch": 410} {"train_loss": -8.417688369750977, "global_step": 69035, "epoch": 410} {"train_loss": -8.83864974975586, "global_step": 69036, "epoch": 410} {"train_loss": -8.483705520629883, "global_step": 69037, "epoch": 410} {"train_loss": -8.753061294555664, "global_step": 69038, "epoch": 410} {"train_loss": -8.847734451293945, "global_step": 69039, "epoch": 410} {"train_loss": -8.9554443359375, "global_step": 69040, "epoch": 410} {"train_loss": -8.913042068481445, "global_step": 69041, "epoch": 410} {"train_loss": -8.856087684631348, "global_step": 69042, "epoch": 410} {"train_loss": -8.773419380187988, "global_step": 69043, "epoch": 410} {"train_loss": -8.992185592651367, "global_step": 69044, "epoch": 410} {"train_loss": -8.868541717529297, "global_step": 69045, "epoch": 410} {"train_loss": -9.097232818603516, "global_step": 69046, "epoch": 410} {"train_loss": -8.810133286884852, "global_step": 69047, "epoch": 410, "val_loss": 192281.84375, "train_action_mse_error": 8.25291919708252} {"train_loss": -9.083006858825684, "global_step": 69048, "epoch": 411} {"train_loss": -8.794677734375, "global_step": 69049, "epoch": 411} {"train_loss": -9.032514572143555, "global_step": 69050, "epoch": 411} {"train_loss": -9.124232292175293, "global_step": 69051, "epoch": 411} {"train_loss": -8.674878120422363, "global_step": 69052, "epoch": 411} {"train_loss": -9.116138458251953, "global_step": 69053, "epoch": 411} {"train_loss": -8.818963050842285, "global_step": 69054, "epoch": 411} {"train_loss": -8.91224479675293, "global_step": 69055, "epoch": 411} {"train_loss": -8.944929122924805, "global_step": 69056, "epoch": 411} {"train_loss": -8.770927429199219, "global_step": 69057, "epoch": 411} {"train_loss": -8.908349990844727, "global_step": 69058, "epoch": 411} {"train_loss": -8.539383888244629, "global_step": 69059, "epoch": 411} {"train_loss": -8.843114852905273, "global_step": 69060, "epoch": 411} {"train_loss": -8.836219787597656, "global_step": 69061, "epoch": 411} {"train_loss": -8.945243835449219, "global_step": 69062, "epoch": 411} {"train_loss": -8.892810821533203, "global_step": 69063, "epoch": 411} {"train_loss": -8.973492622375488, "global_step": 69064, "epoch": 411} {"train_loss": -8.420552253723145, "global_step": 69065, "epoch": 411} {"train_loss": -8.531494140625, "global_step": 69066, "epoch": 411} {"train_loss": -8.893594741821289, "global_step": 69067, "epoch": 411} {"train_loss": -8.960807800292969, "global_step": 69068, "epoch": 411} {"train_loss": -8.940547943115234, "global_step": 69069, "epoch": 411} {"train_loss": -8.980809211730957, "global_step": 69070, "epoch": 411} {"train_loss": -8.685816764831543, "global_step": 69071, "epoch": 411} {"train_loss": -8.8689603805542, "global_step": 69072, "epoch": 411} {"train_loss": -8.83326530456543, "global_step": 69073, "epoch": 411} {"train_loss": -8.797975540161133, "global_step": 69074, "epoch": 411} {"train_loss": -8.654400825500488, "global_step": 69075, "epoch": 411} {"train_loss": -8.981449127197266, "global_step": 69076, "epoch": 411} {"train_loss": -8.79326343536377, "global_step": 69077, "epoch": 411} {"train_loss": -8.780084609985352, "global_step": 69078, "epoch": 411} {"train_loss": -8.85507583618164, "global_step": 69079, "epoch": 411} {"train_loss": -8.62374496459961, "global_step": 69080, "epoch": 411} {"train_loss": -8.576904296875, "global_step": 69081, "epoch": 411} {"train_loss": -8.737485885620117, "global_step": 69082, "epoch": 411} {"train_loss": -8.921501159667969, "global_step": 69083, "epoch": 411} {"train_loss": -8.759297370910645, "global_step": 69084, "epoch": 411} {"train_loss": -8.83276081085205, "global_step": 69085, "epoch": 411} {"train_loss": -8.420866012573242, "global_step": 69086, "epoch": 411} {"train_loss": -8.88968563079834, "global_step": 69087, "epoch": 411} {"train_loss": -8.59255599975586, "global_step": 69088, "epoch": 411} {"train_loss": -8.945631980895996, "global_step": 69089, "epoch": 411} {"train_loss": -8.775285720825195, "global_step": 69090, "epoch": 411} {"train_loss": -8.700212478637695, "global_step": 69091, "epoch": 411} {"train_loss": -8.505346298217773, "global_step": 69092, "epoch": 411} {"train_loss": -8.723913192749023, "global_step": 69093, "epoch": 411} {"train_loss": -8.47308349609375, "global_step": 69094, "epoch": 411} {"train_loss": -8.793060302734375, "global_step": 69095, "epoch": 411} {"train_loss": -8.626060485839844, "global_step": 69096, "epoch": 411} {"train_loss": -8.768556594848633, "global_step": 69097, "epoch": 411} {"train_loss": -8.335208892822266, "global_step": 69098, "epoch": 411} {"train_loss": -8.830266952514648, "global_step": 69099, "epoch": 411} {"train_loss": -8.443915367126465, "global_step": 69100, "epoch": 411} {"train_loss": -8.741677284240723, "global_step": 69101, "epoch": 411} {"train_loss": -8.3402681350708, "global_step": 69102, "epoch": 411} {"train_loss": -8.647770881652832, "global_step": 69103, "epoch": 411} {"train_loss": -8.513574600219727, "global_step": 69104, "epoch": 411} {"train_loss": -8.876199722290039, "global_step": 69105, "epoch": 411} {"train_loss": -8.63241958618164, "global_step": 69106, "epoch": 411} {"train_loss": -8.332115173339844, "global_step": 69107, "epoch": 411} {"train_loss": -8.962697982788086, "global_step": 69108, "epoch": 411} {"train_loss": -8.690519332885742, "global_step": 69109, "epoch": 411} {"train_loss": -8.584178924560547, "global_step": 69110, "epoch": 411} {"train_loss": -8.842933654785156, "global_step": 69111, "epoch": 411} {"train_loss": -8.677120208740234, "global_step": 69112, "epoch": 411} {"train_loss": -8.990888595581055, "global_step": 69113, "epoch": 411} {"train_loss": -8.648078918457031, "global_step": 69114, "epoch": 411} {"train_loss": -8.90908432006836, "global_step": 69115, "epoch": 411} {"train_loss": -8.880017280578613, "global_step": 69116, "epoch": 411} {"train_loss": -8.731855392456055, "global_step": 69117, "epoch": 411} {"train_loss": -8.826736450195312, "global_step": 69118, "epoch": 411} {"train_loss": -9.127250671386719, "global_step": 69119, "epoch": 411} {"train_loss": -8.913579940795898, "global_step": 69120, "epoch": 411} {"train_loss": -8.825700759887695, "global_step": 69121, "epoch": 411} {"train_loss": -9.190813064575195, "global_step": 69122, "epoch": 411} {"train_loss": -8.872308731079102, "global_step": 69123, "epoch": 411} {"train_loss": -8.900187492370605, "global_step": 69124, "epoch": 411} {"train_loss": -8.806970596313477, "global_step": 69125, "epoch": 411} {"train_loss": -9.038736343383789, "global_step": 69126, "epoch": 411} {"train_loss": -9.081517219543457, "global_step": 69127, "epoch": 411} {"train_loss": -9.16838264465332, "global_step": 69128, "epoch": 411} {"train_loss": -9.213764190673828, "global_step": 69129, "epoch": 411} {"train_loss": -9.131710052490234, "global_step": 69130, "epoch": 411} {"train_loss": -9.15614128112793, "global_step": 69131, "epoch": 411} {"train_loss": -9.099771499633789, "global_step": 69132, "epoch": 411} {"train_loss": -9.24774169921875, "global_step": 69133, "epoch": 411} {"train_loss": -9.288742065429688, "global_step": 69134, "epoch": 411} {"train_loss": -9.085180282592773, "global_step": 69135, "epoch": 411} {"train_loss": -9.014625549316406, "global_step": 69136, "epoch": 411} {"train_loss": -9.010799407958984, "global_step": 69137, "epoch": 411} {"train_loss": -8.810413360595703, "global_step": 69138, "epoch": 411} {"train_loss": -9.061822891235352, "global_step": 69139, "epoch": 411} {"train_loss": -9.296073913574219, "global_step": 69140, "epoch": 411} {"train_loss": -9.082569122314453, "global_step": 69141, "epoch": 411} {"train_loss": -9.112861633300781, "global_step": 69142, "epoch": 411} {"train_loss": -8.667236328125, "global_step": 69143, "epoch": 411} {"train_loss": -8.746101379394531, "global_step": 69144, "epoch": 411} {"train_loss": -8.871234893798828, "global_step": 69145, "epoch": 411} {"train_loss": -8.465712547302246, "global_step": 69146, "epoch": 411} {"train_loss": -8.661710739135742, "global_step": 69147, "epoch": 411} {"train_loss": -8.733973503112793, "global_step": 69148, "epoch": 411} {"train_loss": -8.480401992797852, "global_step": 69149, "epoch": 411} {"train_loss": -8.521533012390137, "global_step": 69150, "epoch": 411} {"train_loss": -8.41153335571289, "global_step": 69151, "epoch": 411} {"train_loss": -8.699520111083984, "global_step": 69152, "epoch": 411} {"train_loss": -8.412773132324219, "global_step": 69153, "epoch": 411} {"train_loss": -8.916868209838867, "global_step": 69154, "epoch": 411} {"train_loss": -8.477094650268555, "global_step": 69155, "epoch": 411} {"train_loss": -8.905590057373047, "global_step": 69156, "epoch": 411} {"train_loss": -8.847755432128906, "global_step": 69157, "epoch": 411} {"train_loss": -8.508434295654297, "global_step": 69158, "epoch": 411} {"train_loss": -8.82686996459961, "global_step": 69159, "epoch": 411} {"train_loss": -8.878937721252441, "global_step": 69160, "epoch": 411} {"train_loss": -8.644838333129883, "global_step": 69161, "epoch": 411} {"train_loss": -8.707635879516602, "global_step": 69162, "epoch": 411} {"train_loss": -8.483480453491211, "global_step": 69163, "epoch": 411} {"train_loss": -8.64124870300293, "global_step": 69164, "epoch": 411} {"train_loss": -9.012924194335938, "global_step": 69165, "epoch": 411} {"train_loss": -8.71291732788086, "global_step": 69166, "epoch": 411} {"train_loss": -8.788515090942383, "global_step": 69167, "epoch": 411} {"train_loss": -9.01555061340332, "global_step": 69168, "epoch": 411} {"train_loss": -8.890413284301758, "global_step": 69169, "epoch": 411} {"train_loss": -8.886581420898438, "global_step": 69170, "epoch": 411} {"train_loss": -8.759064674377441, "global_step": 69171, "epoch": 411} {"train_loss": -8.886255264282227, "global_step": 69172, "epoch": 411} {"train_loss": -9.06085205078125, "global_step": 69173, "epoch": 411} {"train_loss": -9.023277282714844, "global_step": 69174, "epoch": 411} {"train_loss": -8.762199401855469, "global_step": 69175, "epoch": 411} {"train_loss": -8.965816497802734, "global_step": 69176, "epoch": 411} {"train_loss": -8.955307960510254, "global_step": 69177, "epoch": 411} {"train_loss": -8.93452262878418, "global_step": 69178, "epoch": 411} {"train_loss": -9.00107192993164, "global_step": 69179, "epoch": 411} {"train_loss": -9.103761672973633, "global_step": 69180, "epoch": 411} {"train_loss": -8.848103523254395, "global_step": 69181, "epoch": 411} {"train_loss": -9.014948844909668, "global_step": 69182, "epoch": 411} {"train_loss": -9.056377410888672, "global_step": 69183, "epoch": 411} {"train_loss": -8.939913749694824, "global_step": 69184, "epoch": 411} {"train_loss": -8.958213806152344, "global_step": 69185, "epoch": 411} {"train_loss": -9.103123664855957, "global_step": 69186, "epoch": 411} {"train_loss": -8.68220329284668, "global_step": 69187, "epoch": 411} {"train_loss": -9.044878005981445, "global_step": 69188, "epoch": 411} {"train_loss": -8.817953109741211, "global_step": 69189, "epoch": 411} {"train_loss": -9.232450485229492, "global_step": 69190, "epoch": 411} {"train_loss": -8.991188049316406, "global_step": 69191, "epoch": 411} {"train_loss": -8.952566146850586, "global_step": 69192, "epoch": 411} {"train_loss": -8.942392349243164, "global_step": 69193, "epoch": 411} {"train_loss": -9.074596405029297, "global_step": 69194, "epoch": 411} {"train_loss": -9.074624061584473, "global_step": 69195, "epoch": 411} {"train_loss": -9.151355743408203, "global_step": 69196, "epoch": 411} {"train_loss": -8.974276542663574, "global_step": 69197, "epoch": 411} {"train_loss": -8.874731063842773, "global_step": 69198, "epoch": 411} {"train_loss": -8.724170684814453, "global_step": 69199, "epoch": 411} {"train_loss": -8.747465133666992, "global_step": 69200, "epoch": 411} {"train_loss": -8.756298065185547, "global_step": 69201, "epoch": 411} {"train_loss": -8.997081756591797, "global_step": 69202, "epoch": 411} {"train_loss": -9.124580383300781, "global_step": 69203, "epoch": 411} {"train_loss": -8.667593955993652, "global_step": 69204, "epoch": 411} {"train_loss": -8.793949127197266, "global_step": 69205, "epoch": 411} {"train_loss": -8.853534698486328, "global_step": 69206, "epoch": 411} {"train_loss": -8.763938903808594, "global_step": 69207, "epoch": 411} {"train_loss": -8.556172370910645, "global_step": 69208, "epoch": 411} {"train_loss": -8.749910354614258, "global_step": 69209, "epoch": 411} {"train_loss": -8.561786651611328, "global_step": 69210, "epoch": 411} {"train_loss": -8.56663703918457, "global_step": 69211, "epoch": 411} {"train_loss": -8.653789520263672, "global_step": 69212, "epoch": 411} {"train_loss": -8.695768356323242, "global_step": 69213, "epoch": 411} {"train_loss": -8.687213897705078, "global_step": 69214, "epoch": 411} {"train_loss": -8.830054635093326, "global_step": 69215, "epoch": 411, "val_loss": 191180.6875} {"train_loss": -8.826988220214844, "global_step": 69216, "epoch": 412} {"train_loss": -8.785568237304688, "global_step": 69217, "epoch": 412} {"train_loss": -8.728628158569336, "global_step": 69218, "epoch": 412} {"train_loss": -8.68616771697998, "global_step": 69219, "epoch": 412} {"train_loss": -8.883270263671875, "global_step": 69220, "epoch": 412} {"train_loss": -8.871650695800781, "global_step": 69221, "epoch": 412} {"train_loss": -8.971646308898926, "global_step": 69222, "epoch": 412} {"train_loss": -8.910627365112305, "global_step": 69223, "epoch": 412} {"train_loss": -8.972314834594727, "global_step": 69224, "epoch": 412} {"train_loss": -8.845780372619629, "global_step": 69225, "epoch": 412} {"train_loss": -9.043864250183105, "global_step": 69226, "epoch": 412} {"train_loss": -8.713372230529785, "global_step": 69227, "epoch": 412} {"train_loss": -9.023601531982422, "global_step": 69228, "epoch": 412} {"train_loss": -8.91537857055664, "global_step": 69229, "epoch": 412} {"train_loss": -8.979817390441895, "global_step": 69230, "epoch": 412} {"train_loss": -9.002195358276367, "global_step": 69231, "epoch": 412} {"train_loss": -9.041332244873047, "global_step": 69232, "epoch": 412} {"train_loss": -8.908758163452148, "global_step": 69233, "epoch": 412} {"train_loss": -9.154536247253418, "global_step": 69234, "epoch": 412} {"train_loss": -9.042738914489746, "global_step": 69235, "epoch": 412} {"train_loss": -9.144143104553223, "global_step": 69236, "epoch": 412} {"train_loss": -9.028083801269531, "global_step": 69237, "epoch": 412} {"train_loss": -9.100302696228027, "global_step": 69238, "epoch": 412} {"train_loss": -8.675158500671387, "global_step": 69239, "epoch": 412} {"train_loss": -9.074625015258789, "global_step": 69240, "epoch": 412} {"train_loss": -8.933722496032715, "global_step": 69241, "epoch": 412} {"train_loss": -9.056241989135742, "global_step": 69242, "epoch": 412} {"train_loss": -8.986970901489258, "global_step": 69243, "epoch": 412} {"train_loss": -8.726417541503906, "global_step": 69244, "epoch": 412} {"train_loss": -9.101993560791016, "global_step": 69245, "epoch": 412} {"train_loss": -8.646984100341797, "global_step": 69246, "epoch": 412} {"train_loss": -8.992169380187988, "global_step": 69247, "epoch": 412} {"train_loss": -9.03141975402832, "global_step": 69248, "epoch": 412} {"train_loss": -9.187965393066406, "global_step": 69249, "epoch": 412} {"train_loss": -9.122034072875977, "global_step": 69250, "epoch": 412} {"train_loss": -8.987785339355469, "global_step": 69251, "epoch": 412} {"train_loss": -8.995054244995117, "global_step": 69252, "epoch": 412} {"train_loss": -8.987863540649414, "global_step": 69253, "epoch": 412} {"train_loss": -9.065512657165527, "global_step": 69254, "epoch": 412} {"train_loss": -8.948533058166504, "global_step": 69255, "epoch": 412} {"train_loss": -9.03036117553711, "global_step": 69256, "epoch": 412} {"train_loss": -8.563398361206055, "global_step": 69257, "epoch": 412} {"train_loss": -9.04926872253418, "global_step": 69258, "epoch": 412} {"train_loss": -8.946292877197266, "global_step": 69259, "epoch": 412} {"train_loss": -9.15260124206543, "global_step": 69260, "epoch": 412} {"train_loss": -8.955583572387695, "global_step": 69261, "epoch": 412} {"train_loss": -8.883195877075195, "global_step": 69262, "epoch": 412} {"train_loss": -9.019145965576172, "global_step": 69263, "epoch": 412} {"train_loss": -8.840521812438965, "global_step": 69264, "epoch": 412} {"train_loss": -8.750131607055664, "global_step": 69265, "epoch": 412} {"train_loss": -8.450569152832031, "global_step": 69266, "epoch": 412} {"train_loss": -9.097467422485352, "global_step": 69267, "epoch": 412} {"train_loss": -8.505817413330078, "global_step": 69268, "epoch": 412} {"train_loss": -8.987433433532715, "global_step": 69269, "epoch": 412} {"train_loss": -8.316222190856934, "global_step": 69270, "epoch": 412} {"train_loss": -8.868146896362305, "global_step": 69271, "epoch": 412} {"train_loss": -8.757984161376953, "global_step": 69272, "epoch": 412} {"train_loss": -8.513813018798828, "global_step": 69273, "epoch": 412} {"train_loss": -8.730714797973633, "global_step": 69274, "epoch": 412} {"train_loss": -8.40958023071289, "global_step": 69275, "epoch": 412} {"train_loss": -8.525012969970703, "global_step": 69276, "epoch": 412} {"train_loss": -8.695941925048828, "global_step": 69277, "epoch": 412} {"train_loss": -8.352452278137207, "global_step": 69278, "epoch": 412} {"train_loss": -8.572476387023926, "global_step": 69279, "epoch": 412} {"train_loss": -8.531458854675293, "global_step": 69280, "epoch": 412} {"train_loss": -8.605100631713867, "global_step": 69281, "epoch": 412} {"train_loss": -8.656452178955078, "global_step": 69282, "epoch": 412} {"train_loss": -8.65676498413086, "global_step": 69283, "epoch": 412} {"train_loss": -8.778243064880371, "global_step": 69284, "epoch": 412} {"train_loss": -9.086307525634766, "global_step": 69285, "epoch": 412} {"train_loss": -8.905738830566406, "global_step": 69286, "epoch": 412} {"train_loss": -8.669915199279785, "global_step": 69287, "epoch": 412} {"train_loss": -8.911109924316406, "global_step": 69288, "epoch": 412} {"train_loss": -8.963922500610352, "global_step": 69289, "epoch": 412} {"train_loss": -8.804994583129883, "global_step": 69290, "epoch": 412} {"train_loss": -8.930292129516602, "global_step": 69291, "epoch": 412} {"train_loss": -8.768359184265137, "global_step": 69292, "epoch": 412} {"train_loss": -9.026302337646484, "global_step": 69293, "epoch": 412} {"train_loss": -9.093976974487305, "global_step": 69294, "epoch": 412} {"train_loss": -8.87071418762207, "global_step": 69295, "epoch": 412} {"train_loss": -9.126501083374023, "global_step": 69296, "epoch": 412} {"train_loss": -9.185686111450195, "global_step": 69297, "epoch": 412} {"train_loss": -9.017351150512695, "global_step": 69298, "epoch": 412} {"train_loss": -8.79395866394043, "global_step": 69299, "epoch": 412} {"train_loss": -8.920794486999512, "global_step": 69300, "epoch": 412} {"train_loss": -8.974420547485352, "global_step": 69301, "epoch": 412} {"train_loss": -8.889286041259766, "global_step": 69302, "epoch": 412} {"train_loss": -9.118277549743652, "global_step": 69303, "epoch": 412} {"train_loss": -9.186067581176758, "global_step": 69304, "epoch": 412} {"train_loss": -9.091984748840332, "global_step": 69305, "epoch": 412} {"train_loss": -8.951131820678711, "global_step": 69306, "epoch": 412} {"train_loss": -9.09997844696045, "global_step": 69307, "epoch": 412} {"train_loss": -9.183520317077637, "global_step": 69308, "epoch": 412} {"train_loss": -8.849382400512695, "global_step": 69309, "epoch": 412} {"train_loss": -8.757232666015625, "global_step": 69310, "epoch": 412} {"train_loss": -8.630563735961914, "global_step": 69311, "epoch": 412} {"train_loss": -8.766975402832031, "global_step": 69312, "epoch": 412} {"train_loss": -8.681158065795898, "global_step": 69313, "epoch": 412} {"train_loss": -8.629866600036621, "global_step": 69314, "epoch": 412} {"train_loss": -8.619718551635742, "global_step": 69315, "epoch": 412} {"train_loss": -8.687742233276367, "global_step": 69316, "epoch": 412} {"train_loss": -8.777268409729004, "global_step": 69317, "epoch": 412} {"train_loss": -8.653322219848633, "global_step": 69318, "epoch": 412} {"train_loss": -8.60571002960205, "global_step": 69319, "epoch": 412} {"train_loss": -8.432388305664062, "global_step": 69320, "epoch": 412} {"train_loss": -8.867019653320312, "global_step": 69321, "epoch": 412} {"train_loss": -8.594971656799316, "global_step": 69322, "epoch": 412} {"train_loss": -8.657123565673828, "global_step": 69323, "epoch": 412} {"train_loss": -8.75424575805664, "global_step": 69324, "epoch": 412} {"train_loss": -8.761141777038574, "global_step": 69325, "epoch": 412} {"train_loss": -8.53158950805664, "global_step": 69326, "epoch": 412} {"train_loss": -8.52841567993164, "global_step": 69327, "epoch": 412} {"train_loss": -8.653287887573242, "global_step": 69328, "epoch": 412} {"train_loss": -8.734667778015137, "global_step": 69329, "epoch": 412} {"train_loss": -8.701925277709961, "global_step": 69330, "epoch": 412} {"train_loss": -8.80965518951416, "global_step": 69331, "epoch": 412} {"train_loss": -8.788330078125, "global_step": 69332, "epoch": 412} {"train_loss": -8.585756301879883, "global_step": 69333, "epoch": 412} {"train_loss": -8.725900650024414, "global_step": 69334, "epoch": 412} {"train_loss": -8.905900955200195, "global_step": 69335, "epoch": 412} {"train_loss": -8.531696319580078, "global_step": 69336, "epoch": 412} {"train_loss": -8.696632385253906, "global_step": 69337, "epoch": 412} {"train_loss": -9.150264739990234, "global_step": 69338, "epoch": 412} {"train_loss": -8.642477035522461, "global_step": 69339, "epoch": 412} {"train_loss": -8.78206729888916, "global_step": 69340, "epoch": 412} {"train_loss": -8.837461471557617, "global_step": 69341, "epoch": 412} {"train_loss": -8.74082088470459, "global_step": 69342, "epoch": 412} {"train_loss": -8.730161666870117, "global_step": 69343, "epoch": 412} {"train_loss": -8.657828330993652, "global_step": 69344, "epoch": 412} {"train_loss": -9.02895736694336, "global_step": 69345, "epoch": 412} {"train_loss": -8.822711944580078, "global_step": 69346, "epoch": 412} {"train_loss": -8.74371337890625, "global_step": 69347, "epoch": 412} {"train_loss": -8.89948844909668, "global_step": 69348, "epoch": 412} {"train_loss": -8.700887680053711, "global_step": 69349, "epoch": 412} {"train_loss": -8.679096221923828, "global_step": 69350, "epoch": 412} {"train_loss": -8.566526412963867, "global_step": 69351, "epoch": 412} {"train_loss": -8.847294807434082, "global_step": 69352, "epoch": 412} {"train_loss": -8.669525146484375, "global_step": 69353, "epoch": 412} {"train_loss": -8.825551986694336, "global_step": 69354, "epoch": 412} {"train_loss": -8.932697296142578, "global_step": 69355, "epoch": 412} {"train_loss": -8.761140823364258, "global_step": 69356, "epoch": 412} {"train_loss": -9.120223045349121, "global_step": 69357, "epoch": 412} {"train_loss": -9.075674057006836, "global_step": 69358, "epoch": 412} {"train_loss": -9.041518211364746, "global_step": 69359, "epoch": 412} {"train_loss": -8.999832153320312, "global_step": 69360, "epoch": 412} {"train_loss": -8.973282814025879, "global_step": 69361, "epoch": 412} {"train_loss": -9.112348556518555, "global_step": 69362, "epoch": 412} {"train_loss": -9.010454177856445, "global_step": 69363, "epoch": 412} {"train_loss": -8.783699035644531, "global_step": 69364, "epoch": 412} {"train_loss": -9.087915420532227, "global_step": 69365, "epoch": 412} {"train_loss": -8.64391040802002, "global_step": 69366, "epoch": 412} {"train_loss": -8.921870231628418, "global_step": 69367, "epoch": 412} {"train_loss": -9.016222953796387, "global_step": 69368, "epoch": 412} {"train_loss": -9.075937271118164, "global_step": 69369, "epoch": 412} {"train_loss": -9.071516990661621, "global_step": 69370, "epoch": 412} {"train_loss": -9.141109466552734, "global_step": 69371, "epoch": 412} {"train_loss": -9.052614212036133, "global_step": 69372, "epoch": 412} {"train_loss": -8.860904693603516, "global_step": 69373, "epoch": 412} {"train_loss": -8.928987503051758, "global_step": 69374, "epoch": 412} {"train_loss": -9.137592315673828, "global_step": 69375, "epoch": 412} {"train_loss": -8.613295555114746, "global_step": 69376, "epoch": 412} {"train_loss": -8.9452486038208, "global_step": 69377, "epoch": 412} {"train_loss": -8.67319107055664, "global_step": 69378, "epoch": 412} {"train_loss": -8.710185050964355, "global_step": 69379, "epoch": 412} {"train_loss": -8.508618354797363, "global_step": 69380, "epoch": 412} {"train_loss": -8.959676742553711, "global_step": 69381, "epoch": 412} {"train_loss": -8.852149963378906, "global_step": 69382, "epoch": 412} {"train_loss": -8.849852669806708, "global_step": 69383, "epoch": 412, "val_loss": 190466.328125} {"train_loss": -9.2522611618042, "global_step": 69384, "epoch": 413} {"train_loss": -8.971641540527344, "global_step": 69385, "epoch": 413} {"train_loss": -8.838249206542969, "global_step": 69386, "epoch": 413} {"train_loss": -8.782745361328125, "global_step": 69387, "epoch": 413} {"train_loss": -8.751260757446289, "global_step": 69388, "epoch": 413} {"train_loss": -8.895418167114258, "global_step": 69389, "epoch": 413} {"train_loss": -8.813108444213867, "global_step": 69390, "epoch": 413} {"train_loss": -8.754138946533203, "global_step": 69391, "epoch": 413} {"train_loss": -8.844318389892578, "global_step": 69392, "epoch": 413} {"train_loss": -8.714561462402344, "global_step": 69393, "epoch": 413} {"train_loss": -8.627665519714355, "global_step": 69394, "epoch": 413} {"train_loss": -8.716320037841797, "global_step": 69395, "epoch": 413} {"train_loss": -8.646745681762695, "global_step": 69396, "epoch": 413} {"train_loss": -8.854251861572266, "global_step": 69397, "epoch": 413} {"train_loss": -8.851938247680664, "global_step": 69398, "epoch": 413} {"train_loss": -8.805038452148438, "global_step": 69399, "epoch": 413} {"train_loss": -8.944168090820312, "global_step": 69400, "epoch": 413} {"train_loss": -8.717899322509766, "global_step": 69401, "epoch": 413} {"train_loss": -8.899633407592773, "global_step": 69402, "epoch": 413} {"train_loss": -8.795207023620605, "global_step": 69403, "epoch": 413} {"train_loss": -9.038549423217773, "global_step": 69404, "epoch": 413} {"train_loss": -9.022546768188477, "global_step": 69405, "epoch": 413} {"train_loss": -8.993935585021973, "global_step": 69406, "epoch": 413} {"train_loss": -9.124503135681152, "global_step": 69407, "epoch": 413} {"train_loss": -9.123222351074219, "global_step": 69408, "epoch": 413} {"train_loss": -8.97658634185791, "global_step": 69409, "epoch": 413} {"train_loss": -9.011825561523438, "global_step": 69410, "epoch": 413} {"train_loss": -8.959287643432617, "global_step": 69411, "epoch": 413} {"train_loss": -9.149858474731445, "global_step": 69412, "epoch": 413} {"train_loss": -8.919300079345703, "global_step": 69413, "epoch": 413} {"train_loss": -8.937238693237305, "global_step": 69414, "epoch": 413} {"train_loss": -8.697696685791016, "global_step": 69415, "epoch": 413} {"train_loss": -8.294724464416504, "global_step": 69416, "epoch": 413} {"train_loss": -8.77907943725586, "global_step": 69417, "epoch": 413} {"train_loss": -8.874990463256836, "global_step": 69418, "epoch": 413} {"train_loss": -9.001253128051758, "global_step": 69419, "epoch": 413} {"train_loss": -8.721366882324219, "global_step": 69420, "epoch": 413} {"train_loss": -8.99736213684082, "global_step": 69421, "epoch": 413} {"train_loss": -8.821525573730469, "global_step": 69422, "epoch": 413} {"train_loss": -9.051775932312012, "global_step": 69423, "epoch": 413} {"train_loss": -8.860316276550293, "global_step": 69424, "epoch": 413} {"train_loss": -9.051898956298828, "global_step": 69425, "epoch": 413} {"train_loss": -8.987412452697754, "global_step": 69426, "epoch": 413} {"train_loss": -8.92656421661377, "global_step": 69427, "epoch": 413} {"train_loss": -8.72573184967041, "global_step": 69428, "epoch": 413} {"train_loss": -9.19489574432373, "global_step": 69429, "epoch": 413} {"train_loss": -9.108712196350098, "global_step": 69430, "epoch": 413} {"train_loss": -8.923589706420898, "global_step": 69431, "epoch": 413} {"train_loss": -9.068031311035156, "global_step": 69432, "epoch": 413} {"train_loss": -8.902763366699219, "global_step": 69433, "epoch": 413} {"train_loss": -9.044129371643066, "global_step": 69434, "epoch": 413} {"train_loss": -9.027105331420898, "global_step": 69435, "epoch": 413} {"train_loss": -9.027399063110352, "global_step": 69436, "epoch": 413} {"train_loss": -9.029824256896973, "global_step": 69437, "epoch": 413} {"train_loss": -8.753035545349121, "global_step": 69438, "epoch": 413} {"train_loss": -8.632352828979492, "global_step": 69439, "epoch": 413} {"train_loss": -9.060995101928711, "global_step": 69440, "epoch": 413} {"train_loss": -8.81159782409668, "global_step": 69441, "epoch": 413} {"train_loss": -8.64669418334961, "global_step": 69442, "epoch": 413} {"train_loss": -8.754890441894531, "global_step": 69443, "epoch": 413} {"train_loss": -8.797710418701172, "global_step": 69444, "epoch": 413} {"train_loss": -8.890945434570312, "global_step": 69445, "epoch": 413} {"train_loss": -8.715896606445312, "global_step": 69446, "epoch": 413} {"train_loss": -8.940248489379883, "global_step": 69447, "epoch": 413} {"train_loss": -8.790079116821289, "global_step": 69448, "epoch": 413} {"train_loss": -8.744537353515625, "global_step": 69449, "epoch": 413} {"train_loss": -8.664103507995605, "global_step": 69450, "epoch": 413} {"train_loss": -8.99641227722168, "global_step": 69451, "epoch": 413} {"train_loss": -8.741434097290039, "global_step": 69452, "epoch": 413} {"train_loss": -8.752362251281738, "global_step": 69453, "epoch": 413} {"train_loss": -8.835212707519531, "global_step": 69454, "epoch": 413} {"train_loss": -9.02081298828125, "global_step": 69455, "epoch": 413} {"train_loss": -8.777256965637207, "global_step": 69456, "epoch": 413} {"train_loss": -8.917032241821289, "global_step": 69457, "epoch": 413} {"train_loss": -8.92039966583252, "global_step": 69458, "epoch": 413} {"train_loss": -9.049819946289062, "global_step": 69459, "epoch": 413} {"train_loss": -8.8576021194458, "global_step": 69460, "epoch": 413} {"train_loss": -9.065994262695312, "global_step": 69461, "epoch": 413} {"train_loss": -8.890678405761719, "global_step": 69462, "epoch": 413} {"train_loss": -8.5446138381958, "global_step": 69463, "epoch": 413} {"train_loss": -9.022299766540527, "global_step": 69464, "epoch": 413} {"train_loss": -8.827784538269043, "global_step": 69465, "epoch": 413} {"train_loss": -8.903351783752441, "global_step": 69466, "epoch": 413} {"train_loss": -8.654934883117676, "global_step": 69467, "epoch": 413} {"train_loss": -8.946243286132812, "global_step": 69468, "epoch": 413} {"train_loss": -8.899969100952148, "global_step": 69469, "epoch": 413} {"train_loss": -8.924419403076172, "global_step": 69470, "epoch": 413} {"train_loss": -8.734103202819824, "global_step": 69471, "epoch": 413} {"train_loss": -8.546428680419922, "global_step": 69472, "epoch": 413} {"train_loss": -8.987293243408203, "global_step": 69473, "epoch": 413} {"train_loss": -8.700262069702148, "global_step": 69474, "epoch": 413} {"train_loss": -9.041412353515625, "global_step": 69475, "epoch": 413} {"train_loss": -8.946685791015625, "global_step": 69476, "epoch": 413} {"train_loss": -8.871463775634766, "global_step": 69477, "epoch": 413} {"train_loss": -8.828596115112305, "global_step": 69478, "epoch": 413} {"train_loss": -8.776935577392578, "global_step": 69479, "epoch": 413} {"train_loss": -8.89690113067627, "global_step": 69480, "epoch": 413} {"train_loss": -8.879867553710938, "global_step": 69481, "epoch": 413} {"train_loss": -8.984676361083984, "global_step": 69482, "epoch": 413} {"train_loss": -8.95319938659668, "global_step": 69483, "epoch": 413} {"train_loss": -9.056203842163086, "global_step": 69484, "epoch": 413} {"train_loss": -8.894843101501465, "global_step": 69485, "epoch": 413} {"train_loss": -8.660255432128906, "global_step": 69486, "epoch": 413} {"train_loss": -8.814476013183594, "global_step": 69487, "epoch": 413} {"train_loss": -8.665667533874512, "global_step": 69488, "epoch": 413} {"train_loss": -8.884468078613281, "global_step": 69489, "epoch": 413} {"train_loss": -8.912246704101562, "global_step": 69490, "epoch": 413} {"train_loss": -9.159278869628906, "global_step": 69491, "epoch": 413} {"train_loss": -8.90688419342041, "global_step": 69492, "epoch": 413} {"train_loss": -8.89836311340332, "global_step": 69493, "epoch": 413} {"train_loss": -9.035614967346191, "global_step": 69494, "epoch": 413} {"train_loss": -8.624665260314941, "global_step": 69495, "epoch": 413} {"train_loss": -8.828191757202148, "global_step": 69496, "epoch": 413} {"train_loss": -8.781664848327637, "global_step": 69497, "epoch": 413} {"train_loss": -9.132322311401367, "global_step": 69498, "epoch": 413} {"train_loss": -8.74366569519043, "global_step": 69499, "epoch": 413} {"train_loss": -9.086124420166016, "global_step": 69500, "epoch": 413} {"train_loss": -8.754837036132812, "global_step": 69501, "epoch": 413} {"train_loss": -8.913324356079102, "global_step": 69502, "epoch": 413} {"train_loss": -8.924015998840332, "global_step": 69503, "epoch": 413} {"train_loss": -8.325085639953613, "global_step": 69504, "epoch": 413} {"train_loss": -9.024967193603516, "global_step": 69505, "epoch": 413} {"train_loss": -8.86575698852539, "global_step": 69506, "epoch": 413} {"train_loss": -8.865224838256836, "global_step": 69507, "epoch": 413} {"train_loss": -8.690834045410156, "global_step": 69508, "epoch": 413} {"train_loss": -8.713247299194336, "global_step": 69509, "epoch": 413} {"train_loss": -8.649703979492188, "global_step": 69510, "epoch": 413} {"train_loss": -8.778465270996094, "global_step": 69511, "epoch": 413} {"train_loss": -8.946157455444336, "global_step": 69512, "epoch": 413} {"train_loss": -8.726076126098633, "global_step": 69513, "epoch": 413} {"train_loss": -8.87085247039795, "global_step": 69514, "epoch": 413} {"train_loss": -8.849424362182617, "global_step": 69515, "epoch": 413} {"train_loss": -8.95574951171875, "global_step": 69516, "epoch": 413} {"train_loss": -8.773195266723633, "global_step": 69517, "epoch": 413} {"train_loss": -8.871787071228027, "global_step": 69518, "epoch": 413} {"train_loss": -8.760446548461914, "global_step": 69519, "epoch": 413} {"train_loss": -8.691947937011719, "global_step": 69520, "epoch": 413} {"train_loss": -8.603873252868652, "global_step": 69521, "epoch": 413} {"train_loss": -8.969133377075195, "global_step": 69522, "epoch": 413} {"train_loss": -8.862634658813477, "global_step": 69523, "epoch": 413} {"train_loss": -9.167437553405762, "global_step": 69524, "epoch": 413} {"train_loss": -8.888810157775879, "global_step": 69525, "epoch": 413} {"train_loss": -8.94646167755127, "global_step": 69526, "epoch": 413} {"train_loss": -8.831926345825195, "global_step": 69527, "epoch": 413} {"train_loss": -8.939397811889648, "global_step": 69528, "epoch": 413} {"train_loss": -8.744682312011719, "global_step": 69529, "epoch": 413} {"train_loss": -8.701342582702637, "global_step": 69530, "epoch": 413} {"train_loss": -8.571632385253906, "global_step": 69531, "epoch": 413} {"train_loss": -8.9728364944458, "global_step": 69532, "epoch": 413} {"train_loss": -8.861475944519043, "global_step": 69533, "epoch": 413} {"train_loss": -8.895585060119629, "global_step": 69534, "epoch": 413} {"train_loss": -8.888982772827148, "global_step": 69535, "epoch": 413} {"train_loss": -9.086000442504883, "global_step": 69536, "epoch": 413} {"train_loss": -8.683330535888672, "global_step": 69537, "epoch": 413} {"train_loss": -8.876734733581543, "global_step": 69538, "epoch": 413} {"train_loss": -8.654531478881836, "global_step": 69539, "epoch": 413} {"train_loss": -9.010597229003906, "global_step": 69540, "epoch": 413} {"train_loss": -8.524190902709961, "global_step": 69541, "epoch": 413} {"train_loss": -9.065984725952148, "global_step": 69542, "epoch": 413} {"train_loss": -8.942465782165527, "global_step": 69543, "epoch": 413} {"train_loss": -8.670528411865234, "global_step": 69544, "epoch": 413} {"train_loss": -8.923300743103027, "global_step": 69545, "epoch": 413} {"train_loss": -8.556913375854492, "global_step": 69546, "epoch": 413} {"train_loss": -8.766622543334961, "global_step": 69547, "epoch": 413} {"train_loss": -8.978374481201172, "global_step": 69548, "epoch": 413} {"train_loss": -8.816451072692871, "global_step": 69549, "epoch": 413} {"train_loss": -8.898436546325684, "global_step": 69550, "epoch": 413} {"train_loss": -8.863790188516889, "global_step": 69551, "epoch": 413, "val_loss": 194189.03125} {"train_loss": -8.557170867919922, "global_step": 69552, "epoch": 414} {"train_loss": -8.918581008911133, "global_step": 69553, "epoch": 414} {"train_loss": -8.890374183654785, "global_step": 69554, "epoch": 414} {"train_loss": -8.754068374633789, "global_step": 69555, "epoch": 414} {"train_loss": -8.887748718261719, "global_step": 69556, "epoch": 414} {"train_loss": -8.912250518798828, "global_step": 69557, "epoch": 414} {"train_loss": -8.540901184082031, "global_step": 69558, "epoch": 414} {"train_loss": -8.96908187866211, "global_step": 69559, "epoch": 414} {"train_loss": -8.801993370056152, "global_step": 69560, "epoch": 414} {"train_loss": -8.884081840515137, "global_step": 69561, "epoch": 414} {"train_loss": -9.123564720153809, "global_step": 69562, "epoch": 414} {"train_loss": -8.957170486450195, "global_step": 69563, "epoch": 414} {"train_loss": -8.973401069641113, "global_step": 69564, "epoch": 414} {"train_loss": -8.770881652832031, "global_step": 69565, "epoch": 414} {"train_loss": -9.014289855957031, "global_step": 69566, "epoch": 414} {"train_loss": -8.840058326721191, "global_step": 69567, "epoch": 414} {"train_loss": -8.977221488952637, "global_step": 69568, "epoch": 414} {"train_loss": -8.867737770080566, "global_step": 69569, "epoch": 414} {"train_loss": -8.857025146484375, "global_step": 69570, "epoch": 414} {"train_loss": -9.065128326416016, "global_step": 69571, "epoch": 414} {"train_loss": -9.320289611816406, "global_step": 69572, "epoch": 414} {"train_loss": -8.901023864746094, "global_step": 69573, "epoch": 414} {"train_loss": -8.891168594360352, "global_step": 69574, "epoch": 414} {"train_loss": -9.028816223144531, "global_step": 69575, "epoch": 414} {"train_loss": -8.779922485351562, "global_step": 69576, "epoch": 414} {"train_loss": -8.57823371887207, "global_step": 69577, "epoch": 414} {"train_loss": -8.829870223999023, "global_step": 69578, "epoch": 414} {"train_loss": -8.70928955078125, "global_step": 69579, "epoch": 414} {"train_loss": -8.421290397644043, "global_step": 69580, "epoch": 414} {"train_loss": -8.377004623413086, "global_step": 69581, "epoch": 414} {"train_loss": -8.506930351257324, "global_step": 69582, "epoch": 414} {"train_loss": -8.67239761352539, "global_step": 69583, "epoch": 414} {"train_loss": -8.710136413574219, "global_step": 69584, "epoch": 414} {"train_loss": -8.55508041381836, "global_step": 69585, "epoch": 414} {"train_loss": -8.67296028137207, "global_step": 69586, "epoch": 414} {"train_loss": -8.664411544799805, "global_step": 69587, "epoch": 414} {"train_loss": -8.878480911254883, "global_step": 69588, "epoch": 414} {"train_loss": -8.644607543945312, "global_step": 69589, "epoch": 414} {"train_loss": -8.782215118408203, "global_step": 69590, "epoch": 414} {"train_loss": -8.877062797546387, "global_step": 69591, "epoch": 414} {"train_loss": -8.762280464172363, "global_step": 69592, "epoch": 414} {"train_loss": -8.879837036132812, "global_step": 69593, "epoch": 414} {"train_loss": -8.763131141662598, "global_step": 69594, "epoch": 414} {"train_loss": -8.96766185760498, "global_step": 69595, "epoch": 414} {"train_loss": -8.770805358886719, "global_step": 69596, "epoch": 414} {"train_loss": -9.002782821655273, "global_step": 69597, "epoch": 414} {"train_loss": -8.839778900146484, "global_step": 69598, "epoch": 414} {"train_loss": -8.969054222106934, "global_step": 69599, "epoch": 414} {"train_loss": -8.861700057983398, "global_step": 69600, "epoch": 414} {"train_loss": -8.906529426574707, "global_step": 69601, "epoch": 414} {"train_loss": -8.910343170166016, "global_step": 69602, "epoch": 414} {"train_loss": -9.083199501037598, "global_step": 69603, "epoch": 414} {"train_loss": -8.815837860107422, "global_step": 69604, "epoch": 414} {"train_loss": -8.876484870910645, "global_step": 69605, "epoch": 414} {"train_loss": -9.077430725097656, "global_step": 69606, "epoch": 414} {"train_loss": -8.977514266967773, "global_step": 69607, "epoch": 414} {"train_loss": -9.228018760681152, "global_step": 69608, "epoch": 414} {"train_loss": -9.121994972229004, "global_step": 69609, "epoch": 414} {"train_loss": -9.089034080505371, "global_step": 69610, "epoch": 414} {"train_loss": -9.19487190246582, "global_step": 69611, "epoch": 414} {"train_loss": -9.010409355163574, "global_step": 69612, "epoch": 414} {"train_loss": -9.106439590454102, "global_step": 69613, "epoch": 414} {"train_loss": -8.909309387207031, "global_step": 69614, "epoch": 414} {"train_loss": -9.235573768615723, "global_step": 69615, "epoch": 414} {"train_loss": -9.18942642211914, "global_step": 69616, "epoch": 414} {"train_loss": -9.270011901855469, "global_step": 69617, "epoch": 414} {"train_loss": -9.133769989013672, "global_step": 69618, "epoch": 414} {"train_loss": -9.25171184539795, "global_step": 69619, "epoch": 414} {"train_loss": -9.168707847595215, "global_step": 69620, "epoch": 414} {"train_loss": -9.162025451660156, "global_step": 69621, "epoch": 414} {"train_loss": -8.991621971130371, "global_step": 69622, "epoch": 414} {"train_loss": -9.2227783203125, "global_step": 69623, "epoch": 414} {"train_loss": -9.002885818481445, "global_step": 69624, "epoch": 414} {"train_loss": -9.115702629089355, "global_step": 69625, "epoch": 414} {"train_loss": -8.959211349487305, "global_step": 69626, "epoch": 414} {"train_loss": -8.82815933227539, "global_step": 69627, "epoch": 414} {"train_loss": -8.756921768188477, "global_step": 69628, "epoch": 414} {"train_loss": -8.602962493896484, "global_step": 69629, "epoch": 414} {"train_loss": -8.683895111083984, "global_step": 69630, "epoch": 414} {"train_loss": -8.925680160522461, "global_step": 69631, "epoch": 414} {"train_loss": -8.76961612701416, "global_step": 69632, "epoch": 414} {"train_loss": -9.059438705444336, "global_step": 69633, "epoch": 414} {"train_loss": -9.245706558227539, "global_step": 69634, "epoch": 414} {"train_loss": -8.97765064239502, "global_step": 69635, "epoch": 414} {"train_loss": -8.67104434967041, "global_step": 69636, "epoch": 414} {"train_loss": -8.752689361572266, "global_step": 69637, "epoch": 414} {"train_loss": -8.210358619689941, "global_step": 69638, "epoch": 414} {"train_loss": -8.730167388916016, "global_step": 69639, "epoch": 414} {"train_loss": -7.714885711669922, "global_step": 69640, "epoch": 414} {"train_loss": -8.818109512329102, "global_step": 69641, "epoch": 414} {"train_loss": -8.07638168334961, "global_step": 69642, "epoch": 414} {"train_loss": -8.797063827514648, "global_step": 69643, "epoch": 414} {"train_loss": -8.614892959594727, "global_step": 69644, "epoch": 414} {"train_loss": -8.661211013793945, "global_step": 69645, "epoch": 414} {"train_loss": -8.819429397583008, "global_step": 69646, "epoch": 414} {"train_loss": -8.82303237915039, "global_step": 69647, "epoch": 414} {"train_loss": -8.644693374633789, "global_step": 69648, "epoch": 414} {"train_loss": -8.711538314819336, "global_step": 69649, "epoch": 414} {"train_loss": -8.574468612670898, "global_step": 69650, "epoch": 414} {"train_loss": -8.74116039276123, "global_step": 69651, "epoch": 414} {"train_loss": -8.788280487060547, "global_step": 69652, "epoch": 414} {"train_loss": -8.63183879852295, "global_step": 69653, "epoch": 414} {"train_loss": -8.724237442016602, "global_step": 69654, "epoch": 414} {"train_loss": -8.51558780670166, "global_step": 69655, "epoch": 414} {"train_loss": -8.770095825195312, "global_step": 69656, "epoch": 414} {"train_loss": -8.96302604675293, "global_step": 69657, "epoch": 414} {"train_loss": -8.712512016296387, "global_step": 69658, "epoch": 414} {"train_loss": -8.983743667602539, "global_step": 69659, "epoch": 414} {"train_loss": -8.657751083374023, "global_step": 69660, "epoch": 414} {"train_loss": -8.980193138122559, "global_step": 69661, "epoch": 414} {"train_loss": -8.775182723999023, "global_step": 69662, "epoch": 414} {"train_loss": -8.86250114440918, "global_step": 69663, "epoch": 414} {"train_loss": -9.09311294555664, "global_step": 69664, "epoch": 414} {"train_loss": -9.079010963439941, "global_step": 69665, "epoch": 414} {"train_loss": -8.861812591552734, "global_step": 69666, "epoch": 414} {"train_loss": -9.05807876586914, "global_step": 69667, "epoch": 414} {"train_loss": -8.825128555297852, "global_step": 69668, "epoch": 414} {"train_loss": -8.854394912719727, "global_step": 69669, "epoch": 414} {"train_loss": -8.608848571777344, "global_step": 69670, "epoch": 414} {"train_loss": -8.940237045288086, "global_step": 69671, "epoch": 414} {"train_loss": -8.89041805267334, "global_step": 69672, "epoch": 414} {"train_loss": -8.865230560302734, "global_step": 69673, "epoch": 414} {"train_loss": -8.95354175567627, "global_step": 69674, "epoch": 414} {"train_loss": -8.831947326660156, "global_step": 69675, "epoch": 414} {"train_loss": -8.845686912536621, "global_step": 69676, "epoch": 414} {"train_loss": -9.074104309082031, "global_step": 69677, "epoch": 414} {"train_loss": -8.966636657714844, "global_step": 69678, "epoch": 414} {"train_loss": -8.790088653564453, "global_step": 69679, "epoch": 414} {"train_loss": -8.939340591430664, "global_step": 69680, "epoch": 414} {"train_loss": -8.667993545532227, "global_step": 69681, "epoch": 414} {"train_loss": -8.995061874389648, "global_step": 69682, "epoch": 414} {"train_loss": -8.616777420043945, "global_step": 69683, "epoch": 414} {"train_loss": -8.977568626403809, "global_step": 69684, "epoch": 414} {"train_loss": -8.479683876037598, "global_step": 69685, "epoch": 414} {"train_loss": -8.988992691040039, "global_step": 69686, "epoch": 414} {"train_loss": -8.725914001464844, "global_step": 69687, "epoch": 414} {"train_loss": -8.61471176147461, "global_step": 69688, "epoch": 414} {"train_loss": -8.839508056640625, "global_step": 69689, "epoch": 414} {"train_loss": -8.74111557006836, "global_step": 69690, "epoch": 414} {"train_loss": -8.562654495239258, "global_step": 69691, "epoch": 414} {"train_loss": -8.836666107177734, "global_step": 69692, "epoch": 414} {"train_loss": -8.675085067749023, "global_step": 69693, "epoch": 414} {"train_loss": -9.120656967163086, "global_step": 69694, "epoch": 414} {"train_loss": -8.833578109741211, "global_step": 69695, "epoch": 414} {"train_loss": -8.732816696166992, "global_step": 69696, "epoch": 414} {"train_loss": -8.974557876586914, "global_step": 69697, "epoch": 414} {"train_loss": -9.058008193969727, "global_step": 69698, "epoch": 414} {"train_loss": -9.01182746887207, "global_step": 69699, "epoch": 414} {"train_loss": -8.890582084655762, "global_step": 69700, "epoch": 414} {"train_loss": -9.070798873901367, "global_step": 69701, "epoch": 414} {"train_loss": -9.189516067504883, "global_step": 69702, "epoch": 414} {"train_loss": -8.877933502197266, "global_step": 69703, "epoch": 414} {"train_loss": -9.02840805053711, "global_step": 69704, "epoch": 414} {"train_loss": -9.05423641204834, "global_step": 69705, "epoch": 414} {"train_loss": -9.081033706665039, "global_step": 69706, "epoch": 414} {"train_loss": -9.067573547363281, "global_step": 69707, "epoch": 414} {"train_loss": -9.186409950256348, "global_step": 69708, "epoch": 414} {"train_loss": -9.049894332885742, "global_step": 69709, "epoch": 414} {"train_loss": -9.32982063293457, "global_step": 69710, "epoch": 414} {"train_loss": -9.030104637145996, "global_step": 69711, "epoch": 414} {"train_loss": -9.170031547546387, "global_step": 69712, "epoch": 414} {"train_loss": -9.083425521850586, "global_step": 69713, "epoch": 414} {"train_loss": -9.100664138793945, "global_step": 69714, "epoch": 414} {"train_loss": -9.052736282348633, "global_step": 69715, "epoch": 414} {"train_loss": -8.876765251159668, "global_step": 69716, "epoch": 414} {"train_loss": -8.865949630737305, "global_step": 69717, "epoch": 414} {"train_loss": -9.04916763305664, "global_step": 69718, "epoch": 414} {"train_loss": -8.871986973853339, "global_step": 69719, "epoch": 414, "val_loss": 192916.0} {"train_loss": -9.064679145812988, "global_step": 69720, "epoch": 415} {"train_loss": -8.87082290649414, "global_step": 69721, "epoch": 415} {"train_loss": -8.442131042480469, "global_step": 69722, "epoch": 415} {"train_loss": -8.45477294921875, "global_step": 69723, "epoch": 415} {"train_loss": -8.7562255859375, "global_step": 69724, "epoch": 415} {"train_loss": -8.620227813720703, "global_step": 69725, "epoch": 415} {"train_loss": -8.858743667602539, "global_step": 69726, "epoch": 415} {"train_loss": -8.435144424438477, "global_step": 69727, "epoch": 415} {"train_loss": -8.676898956298828, "global_step": 69728, "epoch": 415} {"train_loss": -8.73878288269043, "global_step": 69729, "epoch": 415} {"train_loss": -8.800626754760742, "global_step": 69730, "epoch": 415} {"train_loss": -8.489498138427734, "global_step": 69731, "epoch": 415} {"train_loss": -8.811655044555664, "global_step": 69732, "epoch": 415} {"train_loss": -8.861473083496094, "global_step": 69733, "epoch": 415} {"train_loss": -9.041751861572266, "global_step": 69734, "epoch": 415} {"train_loss": -9.021931648254395, "global_step": 69735, "epoch": 415} {"train_loss": -8.850156784057617, "global_step": 69736, "epoch": 415} {"train_loss": -8.919322967529297, "global_step": 69737, "epoch": 415} {"train_loss": -8.843475341796875, "global_step": 69738, "epoch": 415} {"train_loss": -8.880132675170898, "global_step": 69739, "epoch": 415} {"train_loss": -8.784561157226562, "global_step": 69740, "epoch": 415} {"train_loss": -9.00758171081543, "global_step": 69741, "epoch": 415} {"train_loss": -9.034337997436523, "global_step": 69742, "epoch": 415} {"train_loss": -8.96194076538086, "global_step": 69743, "epoch": 415} {"train_loss": -8.843279838562012, "global_step": 69744, "epoch": 415} {"train_loss": -8.883781433105469, "global_step": 69745, "epoch": 415} {"train_loss": -8.893535614013672, "global_step": 69746, "epoch": 415} {"train_loss": -9.055123329162598, "global_step": 69747, "epoch": 415} {"train_loss": -9.069934844970703, "global_step": 69748, "epoch": 415} {"train_loss": -8.901901245117188, "global_step": 69749, "epoch": 415} {"train_loss": -8.991037368774414, "global_step": 69750, "epoch": 415} {"train_loss": -9.138346672058105, "global_step": 69751, "epoch": 415} {"train_loss": -9.032258033752441, "global_step": 69752, "epoch": 415} {"train_loss": -9.125574111938477, "global_step": 69753, "epoch": 415} {"train_loss": -8.855997085571289, "global_step": 69754, "epoch": 415} {"train_loss": -9.178461074829102, "global_step": 69755, "epoch": 415} {"train_loss": -9.021293640136719, "global_step": 69756, "epoch": 415} {"train_loss": -8.825468063354492, "global_step": 69757, "epoch": 415} {"train_loss": -8.973043441772461, "global_step": 69758, "epoch": 415} {"train_loss": -9.026506423950195, "global_step": 69759, "epoch": 415} {"train_loss": -9.131416320800781, "global_step": 69760, "epoch": 415} {"train_loss": -9.051643371582031, "global_step": 69761, "epoch": 415} {"train_loss": -9.089118957519531, "global_step": 69762, "epoch": 415} {"train_loss": -9.118576049804688, "global_step": 69763, "epoch": 415} {"train_loss": -9.310575485229492, "global_step": 69764, "epoch": 415} {"train_loss": -8.981644630432129, "global_step": 69765, "epoch": 415} {"train_loss": -9.012961387634277, "global_step": 69766, "epoch": 415} {"train_loss": -9.074674606323242, "global_step": 69767, "epoch": 415} {"train_loss": -8.90930461883545, "global_step": 69768, "epoch": 415} {"train_loss": -8.909448623657227, "global_step": 69769, "epoch": 415} {"train_loss": -9.101483345031738, "global_step": 69770, "epoch": 415} {"train_loss": -9.027823448181152, "global_step": 69771, "epoch": 415} {"train_loss": -8.89781379699707, "global_step": 69772, "epoch": 415} {"train_loss": -8.968805313110352, "global_step": 69773, "epoch": 415} {"train_loss": -9.233528137207031, "global_step": 69774, "epoch": 415} {"train_loss": -8.910231590270996, "global_step": 69775, "epoch": 415} {"train_loss": -9.107926368713379, "global_step": 69776, "epoch": 415} {"train_loss": -9.05123519897461, "global_step": 69777, "epoch": 415} {"train_loss": -8.886360168457031, "global_step": 69778, "epoch": 415} {"train_loss": -8.920310020446777, "global_step": 69779, "epoch": 415} {"train_loss": -9.103940963745117, "global_step": 69780, "epoch": 415} {"train_loss": -8.93045425415039, "global_step": 69781, "epoch": 415} {"train_loss": -9.20681095123291, "global_step": 69782, "epoch": 415} {"train_loss": -8.847646713256836, "global_step": 69783, "epoch": 415} {"train_loss": -9.2028226852417, "global_step": 69784, "epoch": 415} {"train_loss": -9.255952835083008, "global_step": 69785, "epoch": 415} {"train_loss": -9.174571990966797, "global_step": 69786, "epoch": 415} {"train_loss": -9.093637466430664, "global_step": 69787, "epoch": 415} {"train_loss": -8.94683837890625, "global_step": 69788, "epoch": 415} {"train_loss": -8.750421524047852, "global_step": 69789, "epoch": 415} {"train_loss": -9.03503131866455, "global_step": 69790, "epoch": 415} {"train_loss": -8.736966133117676, "global_step": 69791, "epoch": 415} {"train_loss": -8.82388687133789, "global_step": 69792, "epoch": 415} {"train_loss": -8.48682975769043, "global_step": 69793, "epoch": 415} {"train_loss": -8.784765243530273, "global_step": 69794, "epoch": 415} {"train_loss": -8.602907180786133, "global_step": 69795, "epoch": 415} {"train_loss": -8.90007209777832, "global_step": 69796, "epoch": 415} {"train_loss": -8.716552734375, "global_step": 69797, "epoch": 415} {"train_loss": -8.895544052124023, "global_step": 69798, "epoch": 415} {"train_loss": -8.70301628112793, "global_step": 69799, "epoch": 415} {"train_loss": -8.771327018737793, "global_step": 69800, "epoch": 415} {"train_loss": -8.5135498046875, "global_step": 69801, "epoch": 415} {"train_loss": -8.485625267028809, "global_step": 69802, "epoch": 415} {"train_loss": -8.80660629272461, "global_step": 69803, "epoch": 415} {"train_loss": -8.676761627197266, "global_step": 69804, "epoch": 415} {"train_loss": -8.890432357788086, "global_step": 69805, "epoch": 415} {"train_loss": -8.438228607177734, "global_step": 69806, "epoch": 415} {"train_loss": -8.824281692504883, "global_step": 69807, "epoch": 415} {"train_loss": -8.89331340789795, "global_step": 69808, "epoch": 415} {"train_loss": -8.549430847167969, "global_step": 69809, "epoch": 415} {"train_loss": -8.838629722595215, "global_step": 69810, "epoch": 415} {"train_loss": -8.561372756958008, "global_step": 69811, "epoch": 415} {"train_loss": -8.693299293518066, "global_step": 69812, "epoch": 415} {"train_loss": -8.969802856445312, "global_step": 69813, "epoch": 415} {"train_loss": -8.670882225036621, "global_step": 69814, "epoch": 415} {"train_loss": -8.758395195007324, "global_step": 69815, "epoch": 415} {"train_loss": -8.816272735595703, "global_step": 69816, "epoch": 415} {"train_loss": -8.825386047363281, "global_step": 69817, "epoch": 415} {"train_loss": -8.754432678222656, "global_step": 69818, "epoch": 415} {"train_loss": -8.880819320678711, "global_step": 69819, "epoch": 415} {"train_loss": -9.038854598999023, "global_step": 69820, "epoch": 415} {"train_loss": -8.910065650939941, "global_step": 69821, "epoch": 415} {"train_loss": -8.737873077392578, "global_step": 69822, "epoch": 415} {"train_loss": -8.951885223388672, "global_step": 69823, "epoch": 415} {"train_loss": -8.670755386352539, "global_step": 69824, "epoch": 415} {"train_loss": -8.91470718383789, "global_step": 69825, "epoch": 415} {"train_loss": -9.056303977966309, "global_step": 69826, "epoch": 415} {"train_loss": -8.941642761230469, "global_step": 69827, "epoch": 415} {"train_loss": -9.08028793334961, "global_step": 69828, "epoch": 415} {"train_loss": -8.869621276855469, "global_step": 69829, "epoch": 415} {"train_loss": -9.044559478759766, "global_step": 69830, "epoch": 415} {"train_loss": -8.960250854492188, "global_step": 69831, "epoch": 415} {"train_loss": -9.049055099487305, "global_step": 69832, "epoch": 415} {"train_loss": -8.733299255371094, "global_step": 69833, "epoch": 415} {"train_loss": -9.030393600463867, "global_step": 69834, "epoch": 415} {"train_loss": -8.307351112365723, "global_step": 69835, "epoch": 415} {"train_loss": -8.810046195983887, "global_step": 69836, "epoch": 415} {"train_loss": -8.617077827453613, "global_step": 69837, "epoch": 415} {"train_loss": -8.564239501953125, "global_step": 69838, "epoch": 415} {"train_loss": -8.357545852661133, "global_step": 69839, "epoch": 415} {"train_loss": -8.910687446594238, "global_step": 69840, "epoch": 415} {"train_loss": -8.451302528381348, "global_step": 69841, "epoch": 415} {"train_loss": -8.714384078979492, "global_step": 69842, "epoch": 415} {"train_loss": -8.469359397888184, "global_step": 69843, "epoch": 415} {"train_loss": -8.528793334960938, "global_step": 69844, "epoch": 415} {"train_loss": -8.906401634216309, "global_step": 69845, "epoch": 415} {"train_loss": -8.626029968261719, "global_step": 69846, "epoch": 415} {"train_loss": -8.498146057128906, "global_step": 69847, "epoch": 415} {"train_loss": -8.63807487487793, "global_step": 69848, "epoch": 415} {"train_loss": -8.8797607421875, "global_step": 69849, "epoch": 415} {"train_loss": -8.52213191986084, "global_step": 69850, "epoch": 415} {"train_loss": -8.994132995605469, "global_step": 69851, "epoch": 415} {"train_loss": -8.852209091186523, "global_step": 69852, "epoch": 415} {"train_loss": -8.8703031539917, "global_step": 69853, "epoch": 415} {"train_loss": -8.751338005065918, "global_step": 69854, "epoch": 415} {"train_loss": -8.726713180541992, "global_step": 69855, "epoch": 415} {"train_loss": -8.848417282104492, "global_step": 69856, "epoch": 415} {"train_loss": -8.703164100646973, "global_step": 69857, "epoch": 415} {"train_loss": -8.774024963378906, "global_step": 69858, "epoch": 415} {"train_loss": -8.815446853637695, "global_step": 69859, "epoch": 415} {"train_loss": -8.69919204711914, "global_step": 69860, "epoch": 415} {"train_loss": -8.702264785766602, "global_step": 69861, "epoch": 415} {"train_loss": -8.859557151794434, "global_step": 69862, "epoch": 415} {"train_loss": -8.815441131591797, "global_step": 69863, "epoch": 415} {"train_loss": -8.841014862060547, "global_step": 69864, "epoch": 415} {"train_loss": -8.895589828491211, "global_step": 69865, "epoch": 415} {"train_loss": -8.655410766601562, "global_step": 69866, "epoch": 415} {"train_loss": -8.987465858459473, "global_step": 69867, "epoch": 415} {"train_loss": -8.864221572875977, "global_step": 69868, "epoch": 415} {"train_loss": -8.706327438354492, "global_step": 69869, "epoch": 415} {"train_loss": -8.818477630615234, "global_step": 69870, "epoch": 415} {"train_loss": -8.72089672088623, "global_step": 69871, "epoch": 415} {"train_loss": -8.914097785949707, "global_step": 69872, "epoch": 415} {"train_loss": -8.742374420166016, "global_step": 69873, "epoch": 415} {"train_loss": -8.726115226745605, "global_step": 69874, "epoch": 415} {"train_loss": -8.931415557861328, "global_step": 69875, "epoch": 415} {"train_loss": -8.633880615234375, "global_step": 69876, "epoch": 415} {"train_loss": -8.778700828552246, "global_step": 69877, "epoch": 415} {"train_loss": -8.836774826049805, "global_step": 69878, "epoch": 415} {"train_loss": -8.851301193237305, "global_step": 69879, "epoch": 415} {"train_loss": -8.866294860839844, "global_step": 69880, "epoch": 415} {"train_loss": -9.126859664916992, "global_step": 69881, "epoch": 415} {"train_loss": -8.716099739074707, "global_step": 69882, "epoch": 415} {"train_loss": -8.764873504638672, "global_step": 69883, "epoch": 415} {"train_loss": -8.89091682434082, "global_step": 69884, "epoch": 415} {"train_loss": -8.844717025756836, "global_step": 69885, "epoch": 415} {"train_loss": -8.883932113647461, "global_step": 69886, "epoch": 415} {"train_loss": -8.849852204322815, "global_step": 69887, "epoch": 415, "val_loss": 191418.8125, "train_action_mse_error": 4.8558573722839355} {"train_loss": -8.832736015319824, "global_step": 69888, "epoch": 416} {"train_loss": -9.068909645080566, "global_step": 69889, "epoch": 416} {"train_loss": -8.963972091674805, "global_step": 69890, "epoch": 416} {"train_loss": -8.7084379196167, "global_step": 69891, "epoch": 416} {"train_loss": -8.874136924743652, "global_step": 69892, "epoch": 416} {"train_loss": -9.160303115844727, "global_step": 69893, "epoch": 416} {"train_loss": -8.88645076751709, "global_step": 69894, "epoch": 416} {"train_loss": -8.871072769165039, "global_step": 69895, "epoch": 416} {"train_loss": -9.015066146850586, "global_step": 69896, "epoch": 416} {"train_loss": -8.83184814453125, "global_step": 69897, "epoch": 416} {"train_loss": -8.853302001953125, "global_step": 69898, "epoch": 416} {"train_loss": -9.061688423156738, "global_step": 69899, "epoch": 416} {"train_loss": -8.602975845336914, "global_step": 69900, "epoch": 416} {"train_loss": -9.0747652053833, "global_step": 69901, "epoch": 416} {"train_loss": -8.928730010986328, "global_step": 69902, "epoch": 416} {"train_loss": -8.857526779174805, "global_step": 69903, "epoch": 416} {"train_loss": -9.016658782958984, "global_step": 69904, "epoch": 416} {"train_loss": -9.061473846435547, "global_step": 69905, "epoch": 416} {"train_loss": -8.894364356994629, "global_step": 69906, "epoch": 416} {"train_loss": -8.82369613647461, "global_step": 69907, "epoch": 416} {"train_loss": -8.880889892578125, "global_step": 69908, "epoch": 416} {"train_loss": -8.600200653076172, "global_step": 69909, "epoch": 416} {"train_loss": -8.9815034866333, "global_step": 69910, "epoch": 416} {"train_loss": -8.800674438476562, "global_step": 69911, "epoch": 416} {"train_loss": -8.947141647338867, "global_step": 69912, "epoch": 416} {"train_loss": -8.86117172241211, "global_step": 69913, "epoch": 416} {"train_loss": -8.942829132080078, "global_step": 69914, "epoch": 416} {"train_loss": -8.713211059570312, "global_step": 69915, "epoch": 416} {"train_loss": -8.672283172607422, "global_step": 69916, "epoch": 416} {"train_loss": -9.039128303527832, "global_step": 69917, "epoch": 416} {"train_loss": -8.57939338684082, "global_step": 69918, "epoch": 416} {"train_loss": -8.556327819824219, "global_step": 69919, "epoch": 416} {"train_loss": -8.79730224609375, "global_step": 69920, "epoch": 416} {"train_loss": -8.975072860717773, "global_step": 69921, "epoch": 416} {"train_loss": -8.617048263549805, "global_step": 69922, "epoch": 416} {"train_loss": -8.932143211364746, "global_step": 69923, "epoch": 416} {"train_loss": -8.744407653808594, "global_step": 69924, "epoch": 416} {"train_loss": -8.934906005859375, "global_step": 69925, "epoch": 416} {"train_loss": -8.655614852905273, "global_step": 69926, "epoch": 416} {"train_loss": -9.218432426452637, "global_step": 69927, "epoch": 416} {"train_loss": -8.837146759033203, "global_step": 69928, "epoch": 416} {"train_loss": -8.702164649963379, "global_step": 69929, "epoch": 416} {"train_loss": -8.895940780639648, "global_step": 69930, "epoch": 416} {"train_loss": -8.991578102111816, "global_step": 69931, "epoch": 416} {"train_loss": -8.743696212768555, "global_step": 69932, "epoch": 416} {"train_loss": -8.790929794311523, "global_step": 69933, "epoch": 416} {"train_loss": -9.010564804077148, "global_step": 69934, "epoch": 416} {"train_loss": -9.04401969909668, "global_step": 69935, "epoch": 416} {"train_loss": -9.047859191894531, "global_step": 69936, "epoch": 416} {"train_loss": -9.154192924499512, "global_step": 69937, "epoch": 416} {"train_loss": -8.928839683532715, "global_step": 69938, "epoch": 416} {"train_loss": -9.022340774536133, "global_step": 69939, "epoch": 416} {"train_loss": -8.929973602294922, "global_step": 69940, "epoch": 416} {"train_loss": -8.93063735961914, "global_step": 69941, "epoch": 416} {"train_loss": -8.876479148864746, "global_step": 69942, "epoch": 416} {"train_loss": -8.931591987609863, "global_step": 69943, "epoch": 416} {"train_loss": -8.795465469360352, "global_step": 69944, "epoch": 416} {"train_loss": -9.097355842590332, "global_step": 69945, "epoch": 416} {"train_loss": -9.032135009765625, "global_step": 69946, "epoch": 416} {"train_loss": -8.860686302185059, "global_step": 69947, "epoch": 416} {"train_loss": -8.94392204284668, "global_step": 69948, "epoch": 416} {"train_loss": -9.027708053588867, "global_step": 69949, "epoch": 416} {"train_loss": -9.014488220214844, "global_step": 69950, "epoch": 416} {"train_loss": -9.08154296875, "global_step": 69951, "epoch": 416} {"train_loss": -8.92261028289795, "global_step": 69952, "epoch": 416} {"train_loss": -8.886871337890625, "global_step": 69953, "epoch": 416} {"train_loss": -8.613183975219727, "global_step": 69954, "epoch": 416} {"train_loss": -9.053171157836914, "global_step": 69955, "epoch": 416} {"train_loss": -8.917025566101074, "global_step": 69956, "epoch": 416} {"train_loss": -8.92999267578125, "global_step": 69957, "epoch": 416} {"train_loss": -8.791481971740723, "global_step": 69958, "epoch": 416} {"train_loss": -9.106147766113281, "global_step": 69959, "epoch": 416} {"train_loss": -9.012251853942871, "global_step": 69960, "epoch": 416} {"train_loss": -8.985898971557617, "global_step": 69961, "epoch": 416} {"train_loss": -9.01339340209961, "global_step": 69962, "epoch": 416} {"train_loss": -9.199922561645508, "global_step": 69963, "epoch": 416} {"train_loss": -8.945623397827148, "global_step": 69964, "epoch": 416} {"train_loss": -8.937231063842773, "global_step": 69965, "epoch": 416} {"train_loss": -9.061826705932617, "global_step": 69966, "epoch": 416} {"train_loss": -8.883453369140625, "global_step": 69967, "epoch": 416} {"train_loss": -9.019546508789062, "global_step": 69968, "epoch": 416} {"train_loss": -8.91823673248291, "global_step": 69969, "epoch": 416} {"train_loss": -8.940690994262695, "global_step": 69970, "epoch": 416} {"train_loss": -9.055265426635742, "global_step": 69971, "epoch": 416} {"train_loss": -8.976313591003418, "global_step": 69972, "epoch": 416} {"train_loss": -9.172574996948242, "global_step": 69973, "epoch": 416} {"train_loss": -8.64970588684082, "global_step": 69974, "epoch": 416} {"train_loss": -8.532133102416992, "global_step": 69975, "epoch": 416} {"train_loss": -8.982511520385742, "global_step": 69976, "epoch": 416} {"train_loss": -8.71693229675293, "global_step": 69977, "epoch": 416} {"train_loss": -8.518260955810547, "global_step": 69978, "epoch": 416} {"train_loss": -8.768560409545898, "global_step": 69979, "epoch": 416} {"train_loss": -8.730798721313477, "global_step": 69980, "epoch": 416} {"train_loss": -8.859878540039062, "global_step": 69981, "epoch": 416} {"train_loss": -8.836661338806152, "global_step": 69982, "epoch": 416} {"train_loss": -8.919134140014648, "global_step": 69983, "epoch": 416} {"train_loss": -8.85474681854248, "global_step": 69984, "epoch": 416} {"train_loss": -8.733004570007324, "global_step": 69985, "epoch": 416} {"train_loss": -8.858783721923828, "global_step": 69986, "epoch": 416} {"train_loss": -8.969830513000488, "global_step": 69987, "epoch": 416} {"train_loss": -8.835184097290039, "global_step": 69988, "epoch": 416} {"train_loss": -8.754603385925293, "global_step": 69989, "epoch": 416} {"train_loss": -8.893040657043457, "global_step": 69990, "epoch": 416} {"train_loss": -8.894574165344238, "global_step": 69991, "epoch": 416} {"train_loss": -8.75566291809082, "global_step": 69992, "epoch": 416} {"train_loss": -8.902507781982422, "global_step": 69993, "epoch": 416} {"train_loss": -8.905458450317383, "global_step": 69994, "epoch": 416} {"train_loss": -9.133243560791016, "global_step": 69995, "epoch": 416} {"train_loss": -8.949745178222656, "global_step": 69996, "epoch": 416} {"train_loss": -8.898946762084961, "global_step": 69997, "epoch": 416} {"train_loss": -8.760615348815918, "global_step": 69998, "epoch": 416} {"train_loss": -9.11794662475586, "global_step": 69999, "epoch": 416} {"train_loss": -8.859590530395508, "global_step": 70000, "epoch": 416} {"train_loss": -9.107939720153809, "global_step": 70001, "epoch": 416} {"train_loss": -9.045406341552734, "global_step": 70002, "epoch": 416} {"train_loss": -8.848657608032227, "global_step": 70003, "epoch": 416} {"train_loss": -8.719430923461914, "global_step": 70004, "epoch": 416} {"train_loss": -8.794546127319336, "global_step": 70005, "epoch": 416} {"train_loss": -8.880245208740234, "global_step": 70006, "epoch": 416} {"train_loss": -8.885270118713379, "global_step": 70007, "epoch": 416} {"train_loss": -8.762805938720703, "global_step": 70008, "epoch": 416} {"train_loss": -8.842613220214844, "global_step": 70009, "epoch": 416} {"train_loss": -8.4708251953125, "global_step": 70010, "epoch": 416} {"train_loss": -8.96136474609375, "global_step": 70011, "epoch": 416} {"train_loss": -8.647884368896484, "global_step": 70012, "epoch": 416} {"train_loss": -8.876087188720703, "global_step": 70013, "epoch": 416} {"train_loss": -8.68773078918457, "global_step": 70014, "epoch": 416} {"train_loss": -8.732402801513672, "global_step": 70015, "epoch": 416} {"train_loss": -8.92953872680664, "global_step": 70016, "epoch": 416} {"train_loss": -8.844738006591797, "global_step": 70017, "epoch": 416} {"train_loss": -8.952011108398438, "global_step": 70018, "epoch": 416} {"train_loss": -8.97456169128418, "global_step": 70019, "epoch": 416} {"train_loss": -8.867141723632812, "global_step": 70020, "epoch": 416} {"train_loss": -8.759766578674316, "global_step": 70021, "epoch": 416} {"train_loss": -8.910781860351562, "global_step": 70022, "epoch": 416} {"train_loss": -8.883283615112305, "global_step": 70023, "epoch": 416} {"train_loss": -8.886396408081055, "global_step": 70024, "epoch": 416} {"train_loss": -9.034592628479004, "global_step": 70025, "epoch": 416} {"train_loss": -8.695475578308105, "global_step": 70026, "epoch": 416} {"train_loss": -8.915678024291992, "global_step": 70027, "epoch": 416} {"train_loss": -9.240667343139648, "global_step": 70028, "epoch": 416} {"train_loss": -8.795275688171387, "global_step": 70029, "epoch": 416} {"train_loss": -8.958870887756348, "global_step": 70030, "epoch": 416} {"train_loss": -8.984838485717773, "global_step": 70031, "epoch": 416} {"train_loss": -8.805764198303223, "global_step": 70032, "epoch": 416} {"train_loss": -8.997306823730469, "global_step": 70033, "epoch": 416} {"train_loss": -8.899225234985352, "global_step": 70034, "epoch": 416} {"train_loss": -9.033821105957031, "global_step": 70035, "epoch": 416} {"train_loss": -9.06509017944336, "global_step": 70036, "epoch": 416} {"train_loss": -8.904533386230469, "global_step": 70037, "epoch": 416} {"train_loss": -8.821212768554688, "global_step": 70038, "epoch": 416} {"train_loss": -8.839849472045898, "global_step": 70039, "epoch": 416} {"train_loss": -9.050863265991211, "global_step": 70040, "epoch": 416} {"train_loss": -8.991617202758789, "global_step": 70041, "epoch": 416} {"train_loss": -8.959526062011719, "global_step": 70042, "epoch": 416} {"train_loss": -9.11347770690918, "global_step": 70043, "epoch": 416} {"train_loss": -9.074167251586914, "global_step": 70044, "epoch": 416} {"train_loss": -8.931718826293945, "global_step": 70045, "epoch": 416} {"train_loss": -9.095076560974121, "global_step": 70046, "epoch": 416} {"train_loss": -8.915446281433105, "global_step": 70047, "epoch": 416} {"train_loss": -8.85154914855957, "global_step": 70048, "epoch": 416} {"train_loss": -8.728708267211914, "global_step": 70049, "epoch": 416} {"train_loss": -8.701854705810547, "global_step": 70050, "epoch": 416} {"train_loss": -8.822843551635742, "global_step": 70051, "epoch": 416} {"train_loss": -8.78373908996582, "global_step": 70052, "epoch": 416} {"train_loss": -8.9727201461792, "global_step": 70053, "epoch": 416} {"train_loss": -8.800383567810059, "global_step": 70054, "epoch": 416} {"train_loss": -8.896066830271767, "global_step": 70055, "epoch": 416, "val_loss": 195694.578125} {"train_loss": -9.02627182006836, "global_step": 70056, "epoch": 417} {"train_loss": -8.945300102233887, "global_step": 70057, "epoch": 417} {"train_loss": -9.036262512207031, "global_step": 70058, "epoch": 417} {"train_loss": -8.939192771911621, "global_step": 70059, "epoch": 417} {"train_loss": -8.97708797454834, "global_step": 70060, "epoch": 417} {"train_loss": -8.97437858581543, "global_step": 70061, "epoch": 417} {"train_loss": -9.149253845214844, "global_step": 70062, "epoch": 417} {"train_loss": -8.944116592407227, "global_step": 70063, "epoch": 417} {"train_loss": -9.081838607788086, "global_step": 70064, "epoch": 417} {"train_loss": -8.860648155212402, "global_step": 70065, "epoch": 417} {"train_loss": -8.837797164916992, "global_step": 70066, "epoch": 417} {"train_loss": -8.533524513244629, "global_step": 70067, "epoch": 417} {"train_loss": -8.834141731262207, "global_step": 70068, "epoch": 417} {"train_loss": -8.911389350891113, "global_step": 70069, "epoch": 417} {"train_loss": -8.782768249511719, "global_step": 70070, "epoch": 417} {"train_loss": -8.930978775024414, "global_step": 70071, "epoch": 417} {"train_loss": -8.781673431396484, "global_step": 70072, "epoch": 417} {"train_loss": -8.96861457824707, "global_step": 70073, "epoch": 417} {"train_loss": -8.695716857910156, "global_step": 70074, "epoch": 417} {"train_loss": -9.108489036560059, "global_step": 70075, "epoch": 417} {"train_loss": -8.920068740844727, "global_step": 70076, "epoch": 417} {"train_loss": -8.724587440490723, "global_step": 70077, "epoch": 417} {"train_loss": -8.908315658569336, "global_step": 70078, "epoch": 417} {"train_loss": -8.836160659790039, "global_step": 70079, "epoch": 417} {"train_loss": -9.154319763183594, "global_step": 70080, "epoch": 417} {"train_loss": -8.652828216552734, "global_step": 70081, "epoch": 417} {"train_loss": -9.00826644897461, "global_step": 70082, "epoch": 417} {"train_loss": -8.729305267333984, "global_step": 70083, "epoch": 417} {"train_loss": -8.945704460144043, "global_step": 70084, "epoch": 417} {"train_loss": -8.995773315429688, "global_step": 70085, "epoch": 417} {"train_loss": -8.941889762878418, "global_step": 70086, "epoch": 417} {"train_loss": -8.862335205078125, "global_step": 70087, "epoch": 417} {"train_loss": -8.989931106567383, "global_step": 70088, "epoch": 417} {"train_loss": -8.849626541137695, "global_step": 70089, "epoch": 417} {"train_loss": -8.969602584838867, "global_step": 70090, "epoch": 417} {"train_loss": -9.048141479492188, "global_step": 70091, "epoch": 417} {"train_loss": -8.83642578125, "global_step": 70092, "epoch": 417} {"train_loss": -9.1395263671875, "global_step": 70093, "epoch": 417} {"train_loss": -8.916162490844727, "global_step": 70094, "epoch": 417} {"train_loss": -8.93844985961914, "global_step": 70095, "epoch": 417} {"train_loss": -8.82602596282959, "global_step": 70096, "epoch": 417} {"train_loss": -8.881546020507812, "global_step": 70097, "epoch": 417} {"train_loss": -9.129218101501465, "global_step": 70098, "epoch": 417} {"train_loss": -9.075257301330566, "global_step": 70099, "epoch": 417} {"train_loss": -8.987783432006836, "global_step": 70100, "epoch": 417} {"train_loss": -9.072565078735352, "global_step": 70101, "epoch": 417} {"train_loss": -9.045205116271973, "global_step": 70102, "epoch": 417} {"train_loss": -8.975250244140625, "global_step": 70103, "epoch": 417} {"train_loss": -9.201444625854492, "global_step": 70104, "epoch": 417} {"train_loss": -8.893332481384277, "global_step": 70105, "epoch": 417} {"train_loss": -9.089677810668945, "global_step": 70106, "epoch": 417} {"train_loss": -8.976423263549805, "global_step": 70107, "epoch": 417} {"train_loss": -9.09912109375, "global_step": 70108, "epoch": 417} {"train_loss": -8.910688400268555, "global_step": 70109, "epoch": 417} {"train_loss": -8.605079650878906, "global_step": 70110, "epoch": 417} {"train_loss": -8.96122932434082, "global_step": 70111, "epoch": 417} {"train_loss": -8.436944961547852, "global_step": 70112, "epoch": 417} {"train_loss": -8.899011611938477, "global_step": 70113, "epoch": 417} {"train_loss": -8.335062026977539, "global_step": 70114, "epoch": 417} {"train_loss": -9.007320404052734, "global_step": 70115, "epoch": 417} {"train_loss": -8.56257152557373, "global_step": 70116, "epoch": 417} {"train_loss": -8.69801139831543, "global_step": 70117, "epoch": 417} {"train_loss": -8.487792015075684, "global_step": 70118, "epoch": 417} {"train_loss": -8.982135772705078, "global_step": 70119, "epoch": 417} {"train_loss": -8.62277603149414, "global_step": 70120, "epoch": 417} {"train_loss": -8.863377571105957, "global_step": 70121, "epoch": 417} {"train_loss": -8.604032516479492, "global_step": 70122, "epoch": 417} {"train_loss": -8.549525260925293, "global_step": 70123, "epoch": 417} {"train_loss": -8.943399429321289, "global_step": 70124, "epoch": 417} {"train_loss": -8.971414566040039, "global_step": 70125, "epoch": 417} {"train_loss": -8.787363052368164, "global_step": 70126, "epoch": 417} {"train_loss": -9.080533027648926, "global_step": 70127, "epoch": 417} {"train_loss": -8.891095161437988, "global_step": 70128, "epoch": 417} {"train_loss": -9.065703392028809, "global_step": 70129, "epoch": 417} {"train_loss": -8.774243354797363, "global_step": 70130, "epoch": 417} {"train_loss": -8.807969093322754, "global_step": 70131, "epoch": 417} {"train_loss": -8.921516418457031, "global_step": 70132, "epoch": 417} {"train_loss": -8.758323669433594, "global_step": 70133, "epoch": 417} {"train_loss": -8.853031158447266, "global_step": 70134, "epoch": 417} {"train_loss": -9.106884002685547, "global_step": 70135, "epoch": 417} {"train_loss": -9.026312828063965, "global_step": 70136, "epoch": 417} {"train_loss": -9.070028305053711, "global_step": 70137, "epoch": 417} {"train_loss": -9.182096481323242, "global_step": 70138, "epoch": 417} {"train_loss": -9.083538055419922, "global_step": 70139, "epoch": 417} {"train_loss": -9.048307418823242, "global_step": 70140, "epoch": 417} {"train_loss": -8.973695755004883, "global_step": 70141, "epoch": 417} {"train_loss": -9.050371170043945, "global_step": 70142, "epoch": 417} {"train_loss": -9.093867301940918, "global_step": 70143, "epoch": 417} {"train_loss": -8.976012229919434, "global_step": 70144, "epoch": 417} {"train_loss": -8.820209503173828, "global_step": 70145, "epoch": 417} {"train_loss": -9.11938762664795, "global_step": 70146, "epoch": 417} {"train_loss": -9.146297454833984, "global_step": 70147, "epoch": 417} {"train_loss": -9.158964157104492, "global_step": 70148, "epoch": 417} {"train_loss": -9.261466979980469, "global_step": 70149, "epoch": 417} {"train_loss": -9.073822021484375, "global_step": 70150, "epoch": 417} {"train_loss": -9.003725051879883, "global_step": 70151, "epoch": 417} {"train_loss": -8.953989028930664, "global_step": 70152, "epoch": 417} {"train_loss": -8.930094718933105, "global_step": 70153, "epoch": 417} {"train_loss": -9.034873962402344, "global_step": 70154, "epoch": 417} {"train_loss": -9.175739288330078, "global_step": 70155, "epoch": 417} {"train_loss": -8.990689277648926, "global_step": 70156, "epoch": 417} {"train_loss": -9.075479507446289, "global_step": 70157, "epoch": 417} {"train_loss": -9.2542085647583, "global_step": 70158, "epoch": 417} {"train_loss": -9.004478454589844, "global_step": 70159, "epoch": 417} {"train_loss": -9.206154823303223, "global_step": 70160, "epoch": 417} {"train_loss": -8.808404922485352, "global_step": 70161, "epoch": 417} {"train_loss": -9.055389404296875, "global_step": 70162, "epoch": 417} {"train_loss": -9.052704811096191, "global_step": 70163, "epoch": 417} {"train_loss": -8.993271827697754, "global_step": 70164, "epoch": 417} {"train_loss": -8.833538055419922, "global_step": 70165, "epoch": 417} {"train_loss": -8.903221130371094, "global_step": 70166, "epoch": 417} {"train_loss": -9.080987930297852, "global_step": 70167, "epoch": 417} {"train_loss": -9.007264137268066, "global_step": 70168, "epoch": 417} {"train_loss": -9.117030143737793, "global_step": 70169, "epoch": 417} {"train_loss": -8.884254455566406, "global_step": 70170, "epoch": 417} {"train_loss": -8.936427116394043, "global_step": 70171, "epoch": 417} {"train_loss": -9.068488121032715, "global_step": 70172, "epoch": 417} {"train_loss": -8.952778816223145, "global_step": 70173, "epoch": 417} {"train_loss": -8.863726615905762, "global_step": 70174, "epoch": 417} {"train_loss": -9.072996139526367, "global_step": 70175, "epoch": 417} {"train_loss": -8.854175567626953, "global_step": 70176, "epoch": 417} {"train_loss": -8.982542991638184, "global_step": 70177, "epoch": 417} {"train_loss": -8.753412246704102, "global_step": 70178, "epoch": 417} {"train_loss": -8.782320022583008, "global_step": 70179, "epoch": 417} {"train_loss": -8.766752243041992, "global_step": 70180, "epoch": 417} {"train_loss": -8.695965766906738, "global_step": 70181, "epoch": 417} {"train_loss": -8.81631088256836, "global_step": 70182, "epoch": 417} {"train_loss": -8.641510009765625, "global_step": 70183, "epoch": 417} {"train_loss": -8.70954704284668, "global_step": 70184, "epoch": 417} {"train_loss": -8.825300216674805, "global_step": 70185, "epoch": 417} {"train_loss": -8.584356307983398, "global_step": 70186, "epoch": 417} {"train_loss": -8.912662506103516, "global_step": 70187, "epoch": 417} {"train_loss": -8.811935424804688, "global_step": 70188, "epoch": 417} {"train_loss": -8.814638137817383, "global_step": 70189, "epoch": 417} {"train_loss": -8.57989501953125, "global_step": 70190, "epoch": 417} {"train_loss": -9.007604598999023, "global_step": 70191, "epoch": 417} {"train_loss": -8.782777786254883, "global_step": 70192, "epoch": 417} {"train_loss": -9.032671928405762, "global_step": 70193, "epoch": 417} {"train_loss": -8.902714729309082, "global_step": 70194, "epoch": 417} {"train_loss": -8.910531997680664, "global_step": 70195, "epoch": 417} {"train_loss": -8.900569915771484, "global_step": 70196, "epoch": 417} {"train_loss": -9.161481857299805, "global_step": 70197, "epoch": 417} {"train_loss": -9.088451385498047, "global_step": 70198, "epoch": 417} {"train_loss": -8.840046882629395, "global_step": 70199, "epoch": 417} {"train_loss": -8.918449401855469, "global_step": 70200, "epoch": 417} {"train_loss": -9.125160217285156, "global_step": 70201, "epoch": 417} {"train_loss": -9.135612487792969, "global_step": 70202, "epoch": 417} {"train_loss": -8.943222045898438, "global_step": 70203, "epoch": 417} {"train_loss": -9.058343887329102, "global_step": 70204, "epoch": 417} {"train_loss": -9.109331130981445, "global_step": 70205, "epoch": 417} {"train_loss": -9.08040714263916, "global_step": 70206, "epoch": 417} {"train_loss": -9.203046798706055, "global_step": 70207, "epoch": 417} {"train_loss": -9.05022144317627, "global_step": 70208, "epoch": 417} {"train_loss": -9.08216667175293, "global_step": 70209, "epoch": 417} {"train_loss": -9.016159057617188, "global_step": 70210, "epoch": 417} {"train_loss": -9.058538436889648, "global_step": 70211, "epoch": 417} {"train_loss": -9.147699356079102, "global_step": 70212, "epoch": 417} {"train_loss": -9.19998550415039, "global_step": 70213, "epoch": 417} {"train_loss": -9.120584487915039, "global_step": 70214, "epoch": 417} {"train_loss": -9.154378890991211, "global_step": 70215, "epoch": 417} {"train_loss": -9.143814086914062, "global_step": 70216, "epoch": 417} {"train_loss": -9.0283203125, "global_step": 70217, "epoch": 417} {"train_loss": -9.194957733154297, "global_step": 70218, "epoch": 417} {"train_loss": -9.11713695526123, "global_step": 70219, "epoch": 417} {"train_loss": -9.106921195983887, "global_step": 70220, "epoch": 417} {"train_loss": -8.972404479980469, "global_step": 70221, "epoch": 417} {"train_loss": -8.915221214294434, "global_step": 70222, "epoch": 417} {"train_loss": -8.944683313369751, "global_step": 70223, "epoch": 417, "val_loss": 192821.8125} {"train_loss": -9.202765464782715, "global_step": 70224, "epoch": 418} {"train_loss": -9.0239896774292, "global_step": 70225, "epoch": 418} {"train_loss": -9.147550582885742, "global_step": 70226, "epoch": 418} {"train_loss": -9.13768196105957, "global_step": 70227, "epoch": 418} {"train_loss": -8.879602432250977, "global_step": 70228, "epoch": 418} {"train_loss": -9.156261444091797, "global_step": 70229, "epoch": 418} {"train_loss": -9.180628776550293, "global_step": 70230, "epoch": 418} {"train_loss": -8.952934265136719, "global_step": 70231, "epoch": 418} {"train_loss": -8.968027114868164, "global_step": 70232, "epoch": 418} {"train_loss": -8.797977447509766, "global_step": 70233, "epoch": 418} {"train_loss": -9.038949966430664, "global_step": 70234, "epoch": 418} {"train_loss": -8.951175689697266, "global_step": 70235, "epoch": 418} {"train_loss": -8.858360290527344, "global_step": 70236, "epoch": 418} {"train_loss": -8.967634201049805, "global_step": 70237, "epoch": 418} {"train_loss": -9.170463562011719, "global_step": 70238, "epoch": 418} {"train_loss": -8.822513580322266, "global_step": 70239, "epoch": 418} {"train_loss": -9.00904655456543, "global_step": 70240, "epoch": 418} {"train_loss": -8.821695327758789, "global_step": 70241, "epoch": 418} {"train_loss": -9.204620361328125, "global_step": 70242, "epoch": 418} {"train_loss": -9.148746490478516, "global_step": 70243, "epoch": 418} {"train_loss": -9.026956558227539, "global_step": 70244, "epoch": 418} {"train_loss": -8.981318473815918, "global_step": 70245, "epoch": 418} {"train_loss": -8.853828430175781, "global_step": 70246, "epoch": 418} {"train_loss": -8.848033905029297, "global_step": 70247, "epoch": 418} {"train_loss": -9.05109977722168, "global_step": 70248, "epoch": 418} {"train_loss": -8.693458557128906, "global_step": 70249, "epoch": 418} {"train_loss": -8.771759986877441, "global_step": 70250, "epoch": 418} {"train_loss": -8.73972225189209, "global_step": 70251, "epoch": 418} {"train_loss": -9.015131950378418, "global_step": 70252, "epoch": 418} {"train_loss": -8.88042163848877, "global_step": 70253, "epoch": 418} {"train_loss": -8.710343360900879, "global_step": 70254, "epoch": 418} {"train_loss": -8.876996040344238, "global_step": 70255, "epoch": 418} {"train_loss": -9.06833267211914, "global_step": 70256, "epoch": 418} {"train_loss": -8.962684631347656, "global_step": 70257, "epoch": 418} {"train_loss": -8.991907119750977, "global_step": 70258, "epoch": 418} {"train_loss": -8.663640975952148, "global_step": 70259, "epoch": 418} {"train_loss": -8.955387115478516, "global_step": 70260, "epoch": 418} {"train_loss": -8.76733112335205, "global_step": 70261, "epoch": 418} {"train_loss": -8.816022872924805, "global_step": 70262, "epoch": 418} {"train_loss": -8.741009712219238, "global_step": 70263, "epoch": 418} {"train_loss": -8.892807006835938, "global_step": 70264, "epoch": 418} {"train_loss": -8.81723403930664, "global_step": 70265, "epoch": 418} {"train_loss": -8.892383575439453, "global_step": 70266, "epoch": 418} {"train_loss": -8.949182510375977, "global_step": 70267, "epoch": 418} {"train_loss": -8.66076374053955, "global_step": 70268, "epoch": 418} {"train_loss": -8.717795372009277, "global_step": 70269, "epoch": 418} {"train_loss": -8.926298141479492, "global_step": 70270, "epoch": 418} {"train_loss": -9.391403198242188, "global_step": 70271, "epoch": 418} {"train_loss": -9.007862091064453, "global_step": 70272, "epoch": 418} {"train_loss": -8.983686447143555, "global_step": 70273, "epoch": 418} {"train_loss": -8.567747116088867, "global_step": 70274, "epoch": 418} {"train_loss": -8.898731231689453, "global_step": 70275, "epoch": 418} {"train_loss": -8.98287296295166, "global_step": 70276, "epoch": 418} {"train_loss": -9.037511825561523, "global_step": 70277, "epoch": 418} {"train_loss": -8.97770881652832, "global_step": 70278, "epoch": 418} {"train_loss": -8.92392349243164, "global_step": 70279, "epoch": 418} {"train_loss": -8.84797191619873, "global_step": 70280, "epoch": 418} {"train_loss": -9.10153579711914, "global_step": 70281, "epoch": 418} {"train_loss": -8.665376663208008, "global_step": 70282, "epoch": 418} {"train_loss": -9.011213302612305, "global_step": 70283, "epoch": 418} {"train_loss": -9.076704978942871, "global_step": 70284, "epoch": 418} {"train_loss": -8.997838973999023, "global_step": 70285, "epoch": 418} {"train_loss": -8.885053634643555, "global_step": 70286, "epoch": 418} {"train_loss": -8.92057991027832, "global_step": 70287, "epoch": 418} {"train_loss": -9.094038009643555, "global_step": 70288, "epoch": 418} {"train_loss": -8.802329063415527, "global_step": 70289, "epoch": 418} {"train_loss": -9.06987190246582, "global_step": 70290, "epoch": 418} {"train_loss": -8.944327354431152, "global_step": 70291, "epoch": 418} {"train_loss": -8.813774108886719, "global_step": 70292, "epoch": 418} {"train_loss": -8.983216285705566, "global_step": 70293, "epoch": 418} {"train_loss": -8.873172760009766, "global_step": 70294, "epoch": 418} {"train_loss": -9.193737983703613, "global_step": 70295, "epoch": 418} {"train_loss": -8.923495292663574, "global_step": 70296, "epoch": 418} {"train_loss": -8.81688404083252, "global_step": 70297, "epoch": 418} {"train_loss": -8.653340339660645, "global_step": 70298, "epoch": 418} {"train_loss": -8.953004837036133, "global_step": 70299, "epoch": 418} {"train_loss": -8.856250762939453, "global_step": 70300, "epoch": 418} {"train_loss": -8.947057723999023, "global_step": 70301, "epoch": 418} {"train_loss": -8.997797966003418, "global_step": 70302, "epoch": 418} {"train_loss": -8.747276306152344, "global_step": 70303, "epoch": 418} {"train_loss": -9.109681129455566, "global_step": 70304, "epoch": 418} {"train_loss": -9.134048461914062, "global_step": 70305, "epoch": 418} {"train_loss": -8.869142532348633, "global_step": 70306, "epoch": 418} {"train_loss": -8.958257675170898, "global_step": 70307, "epoch": 418} {"train_loss": -9.097387313842773, "global_step": 70308, "epoch": 418} {"train_loss": -8.994637489318848, "global_step": 70309, "epoch": 418} {"train_loss": -9.183202743530273, "global_step": 70310, "epoch": 418} {"train_loss": -9.006650924682617, "global_step": 70311, "epoch": 418} {"train_loss": -8.826264381408691, "global_step": 70312, "epoch": 418} {"train_loss": -9.234725952148438, "global_step": 70313, "epoch": 418} {"train_loss": -8.744647979736328, "global_step": 70314, "epoch": 418} {"train_loss": -8.745609283447266, "global_step": 70315, "epoch": 418} {"train_loss": -8.91543197631836, "global_step": 70316, "epoch": 418} {"train_loss": -8.937066078186035, "global_step": 70317, "epoch": 418} {"train_loss": -8.833000183105469, "global_step": 70318, "epoch": 418} {"train_loss": -8.769392967224121, "global_step": 70319, "epoch": 418} {"train_loss": -8.741024017333984, "global_step": 70320, "epoch": 418} {"train_loss": -9.162256240844727, "global_step": 70321, "epoch": 418} {"train_loss": -8.958840370178223, "global_step": 70322, "epoch": 418} {"train_loss": -8.965471267700195, "global_step": 70323, "epoch": 418} {"train_loss": -9.046499252319336, "global_step": 70324, "epoch": 418} {"train_loss": -9.005343437194824, "global_step": 70325, "epoch": 418} {"train_loss": -9.111791610717773, "global_step": 70326, "epoch": 418} {"train_loss": -9.07213306427002, "global_step": 70327, "epoch": 418} {"train_loss": -9.083083152770996, "global_step": 70328, "epoch": 418} {"train_loss": -9.164705276489258, "global_step": 70329, "epoch": 418} {"train_loss": -8.87504768371582, "global_step": 70330, "epoch": 418} {"train_loss": -8.991476058959961, "global_step": 70331, "epoch": 418} {"train_loss": -9.049843788146973, "global_step": 70332, "epoch": 418} {"train_loss": -8.858530044555664, "global_step": 70333, "epoch": 418} {"train_loss": -8.325281143188477, "global_step": 70334, "epoch": 418} {"train_loss": -9.223085403442383, "global_step": 70335, "epoch": 418} {"train_loss": -8.636796951293945, "global_step": 70336, "epoch": 418} {"train_loss": -8.958263397216797, "global_step": 70337, "epoch": 418} {"train_loss": -8.370281219482422, "global_step": 70338, "epoch": 418} {"train_loss": -8.980426788330078, "global_step": 70339, "epoch": 418} {"train_loss": -8.300406455993652, "global_step": 70340, "epoch": 418} {"train_loss": -8.927528381347656, "global_step": 70341, "epoch": 418} {"train_loss": -8.767931938171387, "global_step": 70342, "epoch": 418} {"train_loss": -8.508377075195312, "global_step": 70343, "epoch": 418} {"train_loss": -8.733709335327148, "global_step": 70344, "epoch": 418} {"train_loss": -8.895862579345703, "global_step": 70345, "epoch": 418} {"train_loss": -8.642908096313477, "global_step": 70346, "epoch": 418} {"train_loss": -8.868438720703125, "global_step": 70347, "epoch": 418} {"train_loss": -8.95655632019043, "global_step": 70348, "epoch": 418} {"train_loss": -8.893393516540527, "global_step": 70349, "epoch": 418} {"train_loss": -8.863363265991211, "global_step": 70350, "epoch": 418} {"train_loss": -8.764481544494629, "global_step": 70351, "epoch": 418} {"train_loss": -8.883865356445312, "global_step": 70352, "epoch": 418} {"train_loss": -9.131796836853027, "global_step": 70353, "epoch": 418} {"train_loss": -8.903148651123047, "global_step": 70354, "epoch": 418} {"train_loss": -8.814600944519043, "global_step": 70355, "epoch": 418} {"train_loss": -8.726181030273438, "global_step": 70356, "epoch": 418} {"train_loss": -8.974386215209961, "global_step": 70357, "epoch": 418} {"train_loss": -8.631599426269531, "global_step": 70358, "epoch": 418} {"train_loss": -9.052461624145508, "global_step": 70359, "epoch": 418} {"train_loss": -8.770676612854004, "global_step": 70360, "epoch": 418} {"train_loss": -8.9916353225708, "global_step": 70361, "epoch": 418} {"train_loss": -8.581415176391602, "global_step": 70362, "epoch": 418} {"train_loss": -8.684869766235352, "global_step": 70363, "epoch": 418} {"train_loss": -8.73143196105957, "global_step": 70364, "epoch": 418} {"train_loss": -8.95063304901123, "global_step": 70365, "epoch": 418} {"train_loss": -8.78294849395752, "global_step": 70366, "epoch": 418} {"train_loss": -8.959854125976562, "global_step": 70367, "epoch": 418} {"train_loss": -8.988188743591309, "global_step": 70368, "epoch": 418} {"train_loss": -8.74520492553711, "global_step": 70369, "epoch": 418} {"train_loss": -9.134419441223145, "global_step": 70370, "epoch": 418} {"train_loss": -8.781574249267578, "global_step": 70371, "epoch": 418} {"train_loss": -8.817885398864746, "global_step": 70372, "epoch": 418} {"train_loss": -8.976495742797852, "global_step": 70373, "epoch": 418} {"train_loss": -8.77560043334961, "global_step": 70374, "epoch": 418} {"train_loss": -8.935277938842773, "global_step": 70375, "epoch": 418} {"train_loss": -8.82923698425293, "global_step": 70376, "epoch": 418} {"train_loss": -9.12417221069336, "global_step": 70377, "epoch": 418} {"train_loss": -9.031564712524414, "global_step": 70378, "epoch": 418} {"train_loss": -9.102058410644531, "global_step": 70379, "epoch": 418} {"train_loss": -9.026121139526367, "global_step": 70380, "epoch": 418} {"train_loss": -9.031396865844727, "global_step": 70381, "epoch": 418} {"train_loss": -8.966166496276855, "global_step": 70382, "epoch": 418} {"train_loss": -8.891875267028809, "global_step": 70383, "epoch": 418} {"train_loss": -9.059941291809082, "global_step": 70384, "epoch": 418} {"train_loss": -8.938812255859375, "global_step": 70385, "epoch": 418} {"train_loss": -8.804292678833008, "global_step": 70386, "epoch": 418} {"train_loss": -9.027567863464355, "global_step": 70387, "epoch": 418} {"train_loss": -8.933045387268066, "global_step": 70388, "epoch": 418} {"train_loss": -8.968907356262207, "global_step": 70389, "epoch": 418} {"train_loss": -9.112131118774414, "global_step": 70390, "epoch": 418} {"train_loss": -8.919145498956953, "global_step": 70391, "epoch": 418, "val_loss": 193478.640625} {"train_loss": -8.998611450195312, "global_step": 70392, "epoch": 419} {"train_loss": -9.195637702941895, "global_step": 70393, "epoch": 419} {"train_loss": -9.026203155517578, "global_step": 70394, "epoch": 419} {"train_loss": -8.940838813781738, "global_step": 70395, "epoch": 419} {"train_loss": -8.893350601196289, "global_step": 70396, "epoch": 419} {"train_loss": -8.694986343383789, "global_step": 70397, "epoch": 419} {"train_loss": -8.986629486083984, "global_step": 70398, "epoch": 419} {"train_loss": -8.92936897277832, "global_step": 70399, "epoch": 419} {"train_loss": -8.9683837890625, "global_step": 70400, "epoch": 419} {"train_loss": -8.483482360839844, "global_step": 70401, "epoch": 419} {"train_loss": -9.048609733581543, "global_step": 70402, "epoch": 419} {"train_loss": -8.887107849121094, "global_step": 70403, "epoch": 419} {"train_loss": -8.858348846435547, "global_step": 70404, "epoch": 419} {"train_loss": -8.835592269897461, "global_step": 70405, "epoch": 419} {"train_loss": -8.45968246459961, "global_step": 70406, "epoch": 419} {"train_loss": -8.709978103637695, "global_step": 70407, "epoch": 419} {"train_loss": -9.046331405639648, "global_step": 70408, "epoch": 419} {"train_loss": -8.593605041503906, "global_step": 70409, "epoch": 419} {"train_loss": -8.760711669921875, "global_step": 70410, "epoch": 419} {"train_loss": -8.858482360839844, "global_step": 70411, "epoch": 419} {"train_loss": -8.97228717803955, "global_step": 70412, "epoch": 419} {"train_loss": -9.070219039916992, "global_step": 70413, "epoch": 419} {"train_loss": -8.669641494750977, "global_step": 70414, "epoch": 419} {"train_loss": -8.789170265197754, "global_step": 70415, "epoch": 419} {"train_loss": -8.815732955932617, "global_step": 70416, "epoch": 419} {"train_loss": -8.837751388549805, "global_step": 70417, "epoch": 419} {"train_loss": -8.847034454345703, "global_step": 70418, "epoch": 419} {"train_loss": -8.976675987243652, "global_step": 70419, "epoch": 419} {"train_loss": -8.899757385253906, "global_step": 70420, "epoch": 419} {"train_loss": -8.841983795166016, "global_step": 70421, "epoch": 419} {"train_loss": -9.06306266784668, "global_step": 70422, "epoch": 419} {"train_loss": -8.987759590148926, "global_step": 70423, "epoch": 419} {"train_loss": -8.930593490600586, "global_step": 70424, "epoch": 419} {"train_loss": -9.06173324584961, "global_step": 70425, "epoch": 419} {"train_loss": -8.963094711303711, "global_step": 70426, "epoch": 419} {"train_loss": -8.952374458312988, "global_step": 70427, "epoch": 419} {"train_loss": -8.921125411987305, "global_step": 70428, "epoch": 419} {"train_loss": -8.902029037475586, "global_step": 70429, "epoch": 419} {"train_loss": -8.47787857055664, "global_step": 70430, "epoch": 419} {"train_loss": -8.813404083251953, "global_step": 70431, "epoch": 419} {"train_loss": -8.849164962768555, "global_step": 70432, "epoch": 419} {"train_loss": -9.060728073120117, "global_step": 70433, "epoch": 419} {"train_loss": -8.88167953491211, "global_step": 70434, "epoch": 419} {"train_loss": -8.916985511779785, "global_step": 70435, "epoch": 419} {"train_loss": -8.92495059967041, "global_step": 70436, "epoch": 419} {"train_loss": -8.938461303710938, "global_step": 70437, "epoch": 419} {"train_loss": -8.730681419372559, "global_step": 70438, "epoch": 419} {"train_loss": -8.652734756469727, "global_step": 70439, "epoch": 419} {"train_loss": -9.07913589477539, "global_step": 70440, "epoch": 419} {"train_loss": -8.971752166748047, "global_step": 70441, "epoch": 419} {"train_loss": -8.675578117370605, "global_step": 70442, "epoch": 419} {"train_loss": -8.81082534790039, "global_step": 70443, "epoch": 419} {"train_loss": -8.936575889587402, "global_step": 70444, "epoch": 419} {"train_loss": -8.842679977416992, "global_step": 70445, "epoch": 419} {"train_loss": -8.581063270568848, "global_step": 70446, "epoch": 419} {"train_loss": -8.99174690246582, "global_step": 70447, "epoch": 419} {"train_loss": -8.368165969848633, "global_step": 70448, "epoch": 419} {"train_loss": -8.859027862548828, "global_step": 70449, "epoch": 419} {"train_loss": -8.871831893920898, "global_step": 70450, "epoch": 419} {"train_loss": -8.629149436950684, "global_step": 70451, "epoch": 419} {"train_loss": -8.505426406860352, "global_step": 70452, "epoch": 419} {"train_loss": -8.881832122802734, "global_step": 70453, "epoch": 419} {"train_loss": -8.590190887451172, "global_step": 70454, "epoch": 419} {"train_loss": -9.02529525756836, "global_step": 70455, "epoch": 419} {"train_loss": -8.91744613647461, "global_step": 70456, "epoch": 419} {"train_loss": -8.858735084533691, "global_step": 70457, "epoch": 419} {"train_loss": -8.646913528442383, "global_step": 70458, "epoch": 419} {"train_loss": -8.813606262207031, "global_step": 70459, "epoch": 419} {"train_loss": -8.792901039123535, "global_step": 70460, "epoch": 419} {"train_loss": -8.725984573364258, "global_step": 70461, "epoch": 419} {"train_loss": -8.861125946044922, "global_step": 70462, "epoch": 419} {"train_loss": -8.822038650512695, "global_step": 70463, "epoch": 419} {"train_loss": -8.889957427978516, "global_step": 70464, "epoch": 419} {"train_loss": -8.973535537719727, "global_step": 70465, "epoch": 419} {"train_loss": -8.777364730834961, "global_step": 70466, "epoch": 419} {"train_loss": -8.61963939666748, "global_step": 70467, "epoch": 419} {"train_loss": -8.89639949798584, "global_step": 70468, "epoch": 419} {"train_loss": -8.526288986206055, "global_step": 70469, "epoch": 419} {"train_loss": -8.228242874145508, "global_step": 70470, "epoch": 419} {"train_loss": -8.627059936523438, "global_step": 70471, "epoch": 419} {"train_loss": -8.560922622680664, "global_step": 70472, "epoch": 419} {"train_loss": -8.561873435974121, "global_step": 70473, "epoch": 419} {"train_loss": -8.67129135131836, "global_step": 70474, "epoch": 419} {"train_loss": -8.754669189453125, "global_step": 70475, "epoch": 419} {"train_loss": -8.70315933227539, "global_step": 70476, "epoch": 419} {"train_loss": -8.767942428588867, "global_step": 70477, "epoch": 419} {"train_loss": -8.977546691894531, "global_step": 70478, "epoch": 419} {"train_loss": -8.633613586425781, "global_step": 70479, "epoch": 419} {"train_loss": -8.728384017944336, "global_step": 70480, "epoch": 419} {"train_loss": -8.569622039794922, "global_step": 70481, "epoch": 419} {"train_loss": -8.908581733703613, "global_step": 70482, "epoch": 419} {"train_loss": -8.765605926513672, "global_step": 70483, "epoch": 419} {"train_loss": -8.996318817138672, "global_step": 70484, "epoch": 419} {"train_loss": -9.001320838928223, "global_step": 70485, "epoch": 419} {"train_loss": -9.11440658569336, "global_step": 70486, "epoch": 419} {"train_loss": -9.029151916503906, "global_step": 70487, "epoch": 419} {"train_loss": -8.756759643554688, "global_step": 70488, "epoch": 419} {"train_loss": -8.771360397338867, "global_step": 70489, "epoch": 419} {"train_loss": -8.991636276245117, "global_step": 70490, "epoch": 419} {"train_loss": -8.99305248260498, "global_step": 70491, "epoch": 419} {"train_loss": -8.860475540161133, "global_step": 70492, "epoch": 419} {"train_loss": -9.046147346496582, "global_step": 70493, "epoch": 419} {"train_loss": -8.875921249389648, "global_step": 70494, "epoch": 419} {"train_loss": -8.658170700073242, "global_step": 70495, "epoch": 419} {"train_loss": -8.803694725036621, "global_step": 70496, "epoch": 419} {"train_loss": -8.725330352783203, "global_step": 70497, "epoch": 419} {"train_loss": -9.049592971801758, "global_step": 70498, "epoch": 419} {"train_loss": -8.776911735534668, "global_step": 70499, "epoch": 419} {"train_loss": -8.731182098388672, "global_step": 70500, "epoch": 419} {"train_loss": -8.747697830200195, "global_step": 70501, "epoch": 419} {"train_loss": -9.114387512207031, "global_step": 70502, "epoch": 419} {"train_loss": -8.541250228881836, "global_step": 70503, "epoch": 419} {"train_loss": -9.0953369140625, "global_step": 70504, "epoch": 419} {"train_loss": -8.657510757446289, "global_step": 70505, "epoch": 419} {"train_loss": -8.962942123413086, "global_step": 70506, "epoch": 419} {"train_loss": -8.850916862487793, "global_step": 70507, "epoch": 419} {"train_loss": -9.03065299987793, "global_step": 70508, "epoch": 419} {"train_loss": -9.057205200195312, "global_step": 70509, "epoch": 419} {"train_loss": -8.947347640991211, "global_step": 70510, "epoch": 419} {"train_loss": -8.981338500976562, "global_step": 70511, "epoch": 419} {"train_loss": -9.086624145507812, "global_step": 70512, "epoch": 419} {"train_loss": -9.049691200256348, "global_step": 70513, "epoch": 419} {"train_loss": -9.02396011352539, "global_step": 70514, "epoch": 419} {"train_loss": -9.067496299743652, "global_step": 70515, "epoch": 419} {"train_loss": -9.123751640319824, "global_step": 70516, "epoch": 419} {"train_loss": -8.637275695800781, "global_step": 70517, "epoch": 419} {"train_loss": -8.81360912322998, "global_step": 70518, "epoch": 419} {"train_loss": -9.039823532104492, "global_step": 70519, "epoch": 419} {"train_loss": -8.826286315917969, "global_step": 70520, "epoch": 419} {"train_loss": -8.950030326843262, "global_step": 70521, "epoch": 419} {"train_loss": -8.975750923156738, "global_step": 70522, "epoch": 419} {"train_loss": -9.176151275634766, "global_step": 70523, "epoch": 419} {"train_loss": -8.934926986694336, "global_step": 70524, "epoch": 419} {"train_loss": -8.860395431518555, "global_step": 70525, "epoch": 419} {"train_loss": -9.042943000793457, "global_step": 70526, "epoch": 419} {"train_loss": -8.987110137939453, "global_step": 70527, "epoch": 419} {"train_loss": -8.811958312988281, "global_step": 70528, "epoch": 419} {"train_loss": -8.874393463134766, "global_step": 70529, "epoch": 419} {"train_loss": -9.198970794677734, "global_step": 70530, "epoch": 419} {"train_loss": -8.792268753051758, "global_step": 70531, "epoch": 419} {"train_loss": -8.98411750793457, "global_step": 70532, "epoch": 419} {"train_loss": -8.880111694335938, "global_step": 70533, "epoch": 419} {"train_loss": -9.042283058166504, "global_step": 70534, "epoch": 419} {"train_loss": -8.825531959533691, "global_step": 70535, "epoch": 419} {"train_loss": -8.89941120147705, "global_step": 70536, "epoch": 419} {"train_loss": -8.839359283447266, "global_step": 70537, "epoch": 419} {"train_loss": -8.825667381286621, "global_step": 70538, "epoch": 419} {"train_loss": -8.929104804992676, "global_step": 70539, "epoch": 419} {"train_loss": -9.048362731933594, "global_step": 70540, "epoch": 419} {"train_loss": -9.045893669128418, "global_step": 70541, "epoch": 419} {"train_loss": -8.979897499084473, "global_step": 70542, "epoch": 419} {"train_loss": -8.824909210205078, "global_step": 70543, "epoch": 419} {"train_loss": -8.944082260131836, "global_step": 70544, "epoch": 419} {"train_loss": -8.935518264770508, "global_step": 70545, "epoch": 419} {"train_loss": -8.99592399597168, "global_step": 70546, "epoch": 419} {"train_loss": -8.810914993286133, "global_step": 70547, "epoch": 419} {"train_loss": -9.0079345703125, "global_step": 70548, "epoch": 419} {"train_loss": -8.567750930786133, "global_step": 70549, "epoch": 419} {"train_loss": -9.227407455444336, "global_step": 70550, "epoch": 419} {"train_loss": -8.74821662902832, "global_step": 70551, "epoch": 419} {"train_loss": -8.89443588256836, "global_step": 70552, "epoch": 419} {"train_loss": -8.552702903747559, "global_step": 70553, "epoch": 419} {"train_loss": -9.090039253234863, "global_step": 70554, "epoch": 419} {"train_loss": -8.907636642456055, "global_step": 70555, "epoch": 419} {"train_loss": -8.878928184509277, "global_step": 70556, "epoch": 419} {"train_loss": -9.073565483093262, "global_step": 70557, "epoch": 419} {"train_loss": -8.898816108703613, "global_step": 70558, "epoch": 419} {"train_loss": -8.864856861886524, "global_step": 70559, "epoch": 419, "val_loss": 194469.21875} {"train_loss": -9.033063888549805, "global_step": 70560, "epoch": 420} {"train_loss": -9.08009147644043, "global_step": 70561, "epoch": 420} {"train_loss": -8.930166244506836, "global_step": 70562, "epoch": 420} {"train_loss": -9.072609901428223, "global_step": 70563, "epoch": 420} {"train_loss": -8.865032196044922, "global_step": 70564, "epoch": 420} {"train_loss": -8.83538818359375, "global_step": 70565, "epoch": 420} {"train_loss": -8.745420455932617, "global_step": 70566, "epoch": 420} {"train_loss": -9.011539459228516, "global_step": 70567, "epoch": 420} {"train_loss": -8.92394733428955, "global_step": 70568, "epoch": 420} {"train_loss": -8.718950271606445, "global_step": 70569, "epoch": 420} {"train_loss": -8.761466026306152, "global_step": 70570, "epoch": 420} {"train_loss": -8.986733436584473, "global_step": 70571, "epoch": 420} {"train_loss": -8.974210739135742, "global_step": 70572, "epoch": 420} {"train_loss": -8.922590255737305, "global_step": 70573, "epoch": 420} {"train_loss": -8.988471984863281, "global_step": 70574, "epoch": 420} {"train_loss": -9.290451049804688, "global_step": 70575, "epoch": 420} {"train_loss": -9.043864250183105, "global_step": 70576, "epoch": 420} {"train_loss": -9.196954727172852, "global_step": 70577, "epoch": 420} {"train_loss": -9.281309127807617, "global_step": 70578, "epoch": 420} {"train_loss": -9.208980560302734, "global_step": 70579, "epoch": 420} {"train_loss": -9.241206169128418, "global_step": 70580, "epoch": 420} {"train_loss": -9.210683822631836, "global_step": 70581, "epoch": 420} {"train_loss": -9.169419288635254, "global_step": 70582, "epoch": 420} {"train_loss": -9.078923225402832, "global_step": 70583, "epoch": 420} {"train_loss": -9.039928436279297, "global_step": 70584, "epoch": 420} {"train_loss": -9.004072189331055, "global_step": 70585, "epoch": 420} {"train_loss": -9.055041313171387, "global_step": 70586, "epoch": 420} {"train_loss": -9.063045501708984, "global_step": 70587, "epoch": 420} {"train_loss": -9.031661033630371, "global_step": 70588, "epoch": 420} {"train_loss": -9.06245231628418, "global_step": 70589, "epoch": 420} {"train_loss": -8.886646270751953, "global_step": 70590, "epoch": 420} {"train_loss": -8.73310375213623, "global_step": 70591, "epoch": 420} {"train_loss": -9.194173812866211, "global_step": 70592, "epoch": 420} {"train_loss": -9.045129776000977, "global_step": 70593, "epoch": 420} {"train_loss": -9.222465515136719, "global_step": 70594, "epoch": 420} {"train_loss": -8.886918067932129, "global_step": 70595, "epoch": 420} {"train_loss": -9.094291687011719, "global_step": 70596, "epoch": 420} {"train_loss": -9.052665710449219, "global_step": 70597, "epoch": 420} {"train_loss": -8.9232816696167, "global_step": 70598, "epoch": 420} {"train_loss": -9.142036437988281, "global_step": 70599, "epoch": 420} {"train_loss": -9.063446044921875, "global_step": 70600, "epoch": 420} {"train_loss": -9.166969299316406, "global_step": 70601, "epoch": 420} {"train_loss": -8.909229278564453, "global_step": 70602, "epoch": 420} {"train_loss": -9.022043228149414, "global_step": 70603, "epoch": 420} {"train_loss": -9.038599014282227, "global_step": 70604, "epoch": 420} {"train_loss": -8.985346794128418, "global_step": 70605, "epoch": 420} {"train_loss": -8.932600021362305, "global_step": 70606, "epoch": 420} {"train_loss": -9.109415054321289, "global_step": 70607, "epoch": 420} {"train_loss": -9.090856552124023, "global_step": 70608, "epoch": 420} {"train_loss": -8.855300903320312, "global_step": 70609, "epoch": 420} {"train_loss": -8.913999557495117, "global_step": 70610, "epoch": 420} {"train_loss": -8.894994735717773, "global_step": 70611, "epoch": 420} {"train_loss": -8.907220840454102, "global_step": 70612, "epoch": 420} {"train_loss": -8.874139785766602, "global_step": 70613, "epoch": 420} {"train_loss": -8.820119857788086, "global_step": 70614, "epoch": 420} {"train_loss": -8.788299560546875, "global_step": 70615, "epoch": 420} {"train_loss": -8.834554672241211, "global_step": 70616, "epoch": 420} {"train_loss": -8.762399673461914, "global_step": 70617, "epoch": 420} {"train_loss": -8.509326934814453, "global_step": 70618, "epoch": 420} {"train_loss": -8.808313369750977, "global_step": 70619, "epoch": 420} {"train_loss": -8.64228630065918, "global_step": 70620, "epoch": 420} {"train_loss": -8.540082931518555, "global_step": 70621, "epoch": 420} {"train_loss": -8.75071907043457, "global_step": 70622, "epoch": 420} {"train_loss": -8.632343292236328, "global_step": 70623, "epoch": 420} {"train_loss": -8.79522705078125, "global_step": 70624, "epoch": 420} {"train_loss": -8.258540153503418, "global_step": 70625, "epoch": 420} {"train_loss": -9.004353523254395, "global_step": 70626, "epoch": 420} {"train_loss": -8.473186492919922, "global_step": 70627, "epoch": 420} {"train_loss": -8.590597152709961, "global_step": 70628, "epoch": 420} {"train_loss": -8.730582237243652, "global_step": 70629, "epoch": 420} {"train_loss": -8.85987377166748, "global_step": 70630, "epoch": 420} {"train_loss": -8.524923324584961, "global_step": 70631, "epoch": 420} {"train_loss": -8.916114807128906, "global_step": 70632, "epoch": 420} {"train_loss": -8.808805465698242, "global_step": 70633, "epoch": 420} {"train_loss": -8.833717346191406, "global_step": 70634, "epoch": 420} {"train_loss": -8.947683334350586, "global_step": 70635, "epoch": 420} {"train_loss": -9.156231880187988, "global_step": 70636, "epoch": 420} {"train_loss": -8.808652877807617, "global_step": 70637, "epoch": 420} {"train_loss": -8.732431411743164, "global_step": 70638, "epoch": 420} {"train_loss": -8.787667274475098, "global_step": 70639, "epoch": 420} {"train_loss": -8.838403701782227, "global_step": 70640, "epoch": 420} {"train_loss": -8.65452766418457, "global_step": 70641, "epoch": 420} {"train_loss": -9.060047149658203, "global_step": 70642, "epoch": 420} {"train_loss": -8.8516845703125, "global_step": 70643, "epoch": 420} {"train_loss": -8.62509536743164, "global_step": 70644, "epoch": 420} {"train_loss": -8.800230979919434, "global_step": 70645, "epoch": 420} {"train_loss": -8.923410415649414, "global_step": 70646, "epoch": 420} {"train_loss": -8.916205406188965, "global_step": 70647, "epoch": 420} {"train_loss": -8.887883186340332, "global_step": 70648, "epoch": 420} {"train_loss": -9.079745292663574, "global_step": 70649, "epoch": 420} {"train_loss": -8.83743953704834, "global_step": 70650, "epoch": 420} {"train_loss": -8.892208099365234, "global_step": 70651, "epoch": 420} {"train_loss": -8.924552917480469, "global_step": 70652, "epoch": 420} {"train_loss": -9.182123184204102, "global_step": 70653, "epoch": 420} {"train_loss": -8.996984481811523, "global_step": 70654, "epoch": 420} {"train_loss": -9.125612258911133, "global_step": 70655, "epoch": 420} {"train_loss": -8.953446388244629, "global_step": 70656, "epoch": 420} {"train_loss": -8.97459602355957, "global_step": 70657, "epoch": 420} {"train_loss": -8.895940780639648, "global_step": 70658, "epoch": 420} {"train_loss": -8.615242004394531, "global_step": 70659, "epoch": 420} {"train_loss": -9.239480972290039, "global_step": 70660, "epoch": 420} {"train_loss": -8.890514373779297, "global_step": 70661, "epoch": 420} {"train_loss": -8.813643455505371, "global_step": 70662, "epoch": 420} {"train_loss": -8.851105690002441, "global_step": 70663, "epoch": 420} {"train_loss": -8.943181037902832, "global_step": 70664, "epoch": 420} {"train_loss": -8.324175834655762, "global_step": 70665, "epoch": 420} {"train_loss": -8.964122772216797, "global_step": 70666, "epoch": 420} {"train_loss": -8.632331848144531, "global_step": 70667, "epoch": 420} {"train_loss": -8.682889938354492, "global_step": 70668, "epoch": 420} {"train_loss": -8.769107818603516, "global_step": 70669, "epoch": 420} {"train_loss": -8.821151733398438, "global_step": 70670, "epoch": 420} {"train_loss": -8.781820297241211, "global_step": 70671, "epoch": 420} {"train_loss": -8.740215301513672, "global_step": 70672, "epoch": 420} {"train_loss": -8.774602890014648, "global_step": 70673, "epoch": 420} {"train_loss": -8.810508728027344, "global_step": 70674, "epoch": 420} {"train_loss": -8.537531852722168, "global_step": 70675, "epoch": 420} {"train_loss": -8.887292861938477, "global_step": 70676, "epoch": 420} {"train_loss": -8.698904037475586, "global_step": 70677, "epoch": 420} {"train_loss": -8.735107421875, "global_step": 70678, "epoch": 420} {"train_loss": -8.591221809387207, "global_step": 70679, "epoch": 420} {"train_loss": -8.851634979248047, "global_step": 70680, "epoch": 420} {"train_loss": -8.946904182434082, "global_step": 70681, "epoch": 420} {"train_loss": -8.990884780883789, "global_step": 70682, "epoch": 420} {"train_loss": -8.950910568237305, "global_step": 70683, "epoch": 420} {"train_loss": -8.959710121154785, "global_step": 70684, "epoch": 420} {"train_loss": -8.858617782592773, "global_step": 70685, "epoch": 420} {"train_loss": -8.968270301818848, "global_step": 70686, "epoch": 420} {"train_loss": -9.0250244140625, "global_step": 70687, "epoch": 420} {"train_loss": -8.833431243896484, "global_step": 70688, "epoch": 420} {"train_loss": -9.207948684692383, "global_step": 70689, "epoch": 420} {"train_loss": -8.651620864868164, "global_step": 70690, "epoch": 420} {"train_loss": -9.045137405395508, "global_step": 70691, "epoch": 420} {"train_loss": -9.032630920410156, "global_step": 70692, "epoch": 420} {"train_loss": -9.016529083251953, "global_step": 70693, "epoch": 420} {"train_loss": -8.775468826293945, "global_step": 70694, "epoch": 420} {"train_loss": -9.020302772521973, "global_step": 70695, "epoch": 420} {"train_loss": -8.977633476257324, "global_step": 70696, "epoch": 420} {"train_loss": -9.068527221679688, "global_step": 70697, "epoch": 420} {"train_loss": -9.037351608276367, "global_step": 70698, "epoch": 420} {"train_loss": -9.182035446166992, "global_step": 70699, "epoch": 420} {"train_loss": -9.078688621520996, "global_step": 70700, "epoch": 420} {"train_loss": -9.102521896362305, "global_step": 70701, "epoch": 420} {"train_loss": -9.175359725952148, "global_step": 70702, "epoch": 420} {"train_loss": -8.8543062210083, "global_step": 70703, "epoch": 420} {"train_loss": -8.763914108276367, "global_step": 70704, "epoch": 420} {"train_loss": -8.939194679260254, "global_step": 70705, "epoch": 420} {"train_loss": -8.9803466796875, "global_step": 70706, "epoch": 420} {"train_loss": -8.899328231811523, "global_step": 70707, "epoch": 420} {"train_loss": -8.71838092803955, "global_step": 70708, "epoch": 420} {"train_loss": -9.19133186340332, "global_step": 70709, "epoch": 420} {"train_loss": -8.197681427001953, "global_step": 70710, "epoch": 420} {"train_loss": -8.946144104003906, "global_step": 70711, "epoch": 420} {"train_loss": -8.63382339477539, "global_step": 70712, "epoch": 420} {"train_loss": -8.864800453186035, "global_step": 70713, "epoch": 420} {"train_loss": -8.768985748291016, "global_step": 70714, "epoch": 420} {"train_loss": -8.905815124511719, "global_step": 70715, "epoch": 420} {"train_loss": -8.75295639038086, "global_step": 70716, "epoch": 420} {"train_loss": -9.028697967529297, "global_step": 70717, "epoch": 420} {"train_loss": -8.741082191467285, "global_step": 70718, "epoch": 420} {"train_loss": -8.992169380187988, "global_step": 70719, "epoch": 420} {"train_loss": -8.926187515258789, "global_step": 70720, "epoch": 420} {"train_loss": -8.867871284484863, "global_step": 70721, "epoch": 420} {"train_loss": -9.016376495361328, "global_step": 70722, "epoch": 420} {"train_loss": -8.714922904968262, "global_step": 70723, "epoch": 420} {"train_loss": -8.66054916381836, "global_step": 70724, "epoch": 420} {"train_loss": -8.977694511413574, "global_step": 70725, "epoch": 420} {"train_loss": -8.635674476623535, "global_step": 70726, "epoch": 420} {"train_loss": -8.901366364388238, "global_step": 70727, "epoch": 420, "val_loss": 194953.984375, "train_action_mse_error": 4.827620506286621} {"train_loss": -8.815591812133789, "global_step": 70728, "epoch": 421} {"train_loss": -9.092405319213867, "global_step": 70729, "epoch": 421} {"train_loss": -8.889261245727539, "global_step": 70730, "epoch": 421} {"train_loss": -9.015093803405762, "global_step": 70731, "epoch": 421} {"train_loss": -8.685928344726562, "global_step": 70732, "epoch": 421} {"train_loss": -8.67519760131836, "global_step": 70733, "epoch": 421} {"train_loss": -8.914610862731934, "global_step": 70734, "epoch": 421} {"train_loss": -8.491684913635254, "global_step": 70735, "epoch": 421} {"train_loss": -8.791191101074219, "global_step": 70736, "epoch": 421} {"train_loss": -8.6627197265625, "global_step": 70737, "epoch": 421} {"train_loss": -8.936457633972168, "global_step": 70738, "epoch": 421} {"train_loss": -8.724983215332031, "global_step": 70739, "epoch": 421} {"train_loss": -8.504804611206055, "global_step": 70740, "epoch": 421} {"train_loss": -8.746499061584473, "global_step": 70741, "epoch": 421} {"train_loss": -8.868886947631836, "global_step": 70742, "epoch": 421} {"train_loss": -8.596960067749023, "global_step": 70743, "epoch": 421} {"train_loss": -8.78403091430664, "global_step": 70744, "epoch": 421} {"train_loss": -8.648717880249023, "global_step": 70745, "epoch": 421} {"train_loss": -8.632501602172852, "global_step": 70746, "epoch": 421} {"train_loss": -8.71910285949707, "global_step": 70747, "epoch": 421} {"train_loss": -8.413172721862793, "global_step": 70748, "epoch": 421} {"train_loss": -8.764148712158203, "global_step": 70749, "epoch": 421} {"train_loss": -8.334602355957031, "global_step": 70750, "epoch": 421} {"train_loss": -8.444336891174316, "global_step": 70751, "epoch": 421} {"train_loss": -8.701356887817383, "global_step": 70752, "epoch": 421} {"train_loss": -8.728541374206543, "global_step": 70753, "epoch": 421} {"train_loss": -8.517776489257812, "global_step": 70754, "epoch": 421} {"train_loss": -8.5928316116333, "global_step": 70755, "epoch": 421} {"train_loss": -8.755609512329102, "global_step": 70756, "epoch": 421} {"train_loss": -8.915939331054688, "global_step": 70757, "epoch": 421} {"train_loss": -8.683000564575195, "global_step": 70758, "epoch": 421} {"train_loss": -8.772308349609375, "global_step": 70759, "epoch": 421} {"train_loss": -8.72287654876709, "global_step": 70760, "epoch": 421} {"train_loss": -8.8607759475708, "global_step": 70761, "epoch": 421} {"train_loss": -8.721176147460938, "global_step": 70762, "epoch": 421} {"train_loss": -8.735036849975586, "global_step": 70763, "epoch": 421} {"train_loss": -8.997201919555664, "global_step": 70764, "epoch": 421} {"train_loss": -9.167387962341309, "global_step": 70765, "epoch": 421} {"train_loss": -9.063480377197266, "global_step": 70766, "epoch": 421} {"train_loss": -8.896678924560547, "global_step": 70767, "epoch": 421} {"train_loss": -9.072071075439453, "global_step": 70768, "epoch": 421} {"train_loss": -8.948921203613281, "global_step": 70769, "epoch": 421} {"train_loss": -9.143159866333008, "global_step": 70770, "epoch": 421} {"train_loss": -9.070451736450195, "global_step": 70771, "epoch": 421} {"train_loss": -9.275189399719238, "global_step": 70772, "epoch": 421} {"train_loss": -9.093496322631836, "global_step": 70773, "epoch": 421} {"train_loss": -9.068565368652344, "global_step": 70774, "epoch": 421} {"train_loss": -9.082840919494629, "global_step": 70775, "epoch": 421} {"train_loss": -9.14212703704834, "global_step": 70776, "epoch": 421} {"train_loss": -9.104532241821289, "global_step": 70777, "epoch": 421} {"train_loss": -9.149637222290039, "global_step": 70778, "epoch": 421} {"train_loss": -8.947725296020508, "global_step": 70779, "epoch": 421} {"train_loss": -9.078876495361328, "global_step": 70780, "epoch": 421} {"train_loss": -9.236285209655762, "global_step": 70781, "epoch": 421} {"train_loss": -8.720281600952148, "global_step": 70782, "epoch": 421} {"train_loss": -8.883864402770996, "global_step": 70783, "epoch": 421} {"train_loss": -9.036333084106445, "global_step": 70784, "epoch": 421} {"train_loss": -8.50328254699707, "global_step": 70785, "epoch": 421} {"train_loss": -8.911434173583984, "global_step": 70786, "epoch": 421} {"train_loss": -8.739145278930664, "global_step": 70787, "epoch": 421} {"train_loss": -8.863119125366211, "global_step": 70788, "epoch": 421} {"train_loss": -8.725700378417969, "global_step": 70789, "epoch": 421} {"train_loss": -9.111536026000977, "global_step": 70790, "epoch": 421} {"train_loss": -9.02302360534668, "global_step": 70791, "epoch": 421} {"train_loss": -8.873498916625977, "global_step": 70792, "epoch": 421} {"train_loss": -8.868269920349121, "global_step": 70793, "epoch": 421} {"train_loss": -8.755001068115234, "global_step": 70794, "epoch": 421} {"train_loss": -8.776114463806152, "global_step": 70795, "epoch": 421} {"train_loss": -8.93008041381836, "global_step": 70796, "epoch": 421} {"train_loss": -8.503559112548828, "global_step": 70797, "epoch": 421} {"train_loss": -8.842267990112305, "global_step": 70798, "epoch": 421} {"train_loss": -8.949071884155273, "global_step": 70799, "epoch": 421} {"train_loss": -9.034613609313965, "global_step": 70800, "epoch": 421} {"train_loss": -8.675836563110352, "global_step": 70801, "epoch": 421} {"train_loss": -8.877321243286133, "global_step": 70802, "epoch": 421} {"train_loss": -8.732288360595703, "global_step": 70803, "epoch": 421} {"train_loss": -8.811742782592773, "global_step": 70804, "epoch": 421} {"train_loss": -8.862021446228027, "global_step": 70805, "epoch": 421} {"train_loss": -8.71622085571289, "global_step": 70806, "epoch": 421} {"train_loss": -8.651395797729492, "global_step": 70807, "epoch": 421} {"train_loss": -8.76292610168457, "global_step": 70808, "epoch": 421} {"train_loss": -8.701478004455566, "global_step": 70809, "epoch": 421} {"train_loss": -8.924406051635742, "global_step": 70810, "epoch": 421} {"train_loss": -8.877874374389648, "global_step": 70811, "epoch": 421} {"train_loss": -8.901327133178711, "global_step": 70812, "epoch": 421} {"train_loss": -8.632200241088867, "global_step": 70813, "epoch": 421} {"train_loss": -8.966176986694336, "global_step": 70814, "epoch": 421} {"train_loss": -8.790958404541016, "global_step": 70815, "epoch": 421} {"train_loss": -8.804825782775879, "global_step": 70816, "epoch": 421} {"train_loss": -8.923480033874512, "global_step": 70817, "epoch": 421} {"train_loss": -8.745595932006836, "global_step": 70818, "epoch": 421} {"train_loss": -8.846107482910156, "global_step": 70819, "epoch": 421} {"train_loss": -8.819604873657227, "global_step": 70820, "epoch": 421} {"train_loss": -8.482339859008789, "global_step": 70821, "epoch": 421} {"train_loss": -9.061763763427734, "global_step": 70822, "epoch": 421} {"train_loss": -8.989862442016602, "global_step": 70823, "epoch": 421} {"train_loss": -8.606731414794922, "global_step": 70824, "epoch": 421} {"train_loss": -8.894407272338867, "global_step": 70825, "epoch": 421} {"train_loss": -8.954524040222168, "global_step": 70826, "epoch": 421} {"train_loss": -8.80642032623291, "global_step": 70827, "epoch": 421} {"train_loss": -9.00342082977295, "global_step": 70828, "epoch": 421} {"train_loss": -8.897089004516602, "global_step": 70829, "epoch": 421} {"train_loss": -8.977739334106445, "global_step": 70830, "epoch": 421} {"train_loss": -9.006267547607422, "global_step": 70831, "epoch": 421} {"train_loss": -8.862885475158691, "global_step": 70832, "epoch": 421} {"train_loss": -8.92880630493164, "global_step": 70833, "epoch": 421} {"train_loss": -8.943912506103516, "global_step": 70834, "epoch": 421} {"train_loss": -8.650938034057617, "global_step": 70835, "epoch": 421} {"train_loss": -8.832886695861816, "global_step": 70836, "epoch": 421} {"train_loss": -8.730886459350586, "global_step": 70837, "epoch": 421} {"train_loss": -8.86641788482666, "global_step": 70838, "epoch": 421} {"train_loss": -9.002838134765625, "global_step": 70839, "epoch": 421} {"train_loss": -8.930885314941406, "global_step": 70840, "epoch": 421} {"train_loss": -8.848625183105469, "global_step": 70841, "epoch": 421} {"train_loss": -8.89529800415039, "global_step": 70842, "epoch": 421} {"train_loss": -9.04577922821045, "global_step": 70843, "epoch": 421} {"train_loss": -8.730916023254395, "global_step": 70844, "epoch": 421} {"train_loss": -9.107332229614258, "global_step": 70845, "epoch": 421} {"train_loss": -8.864709854125977, "global_step": 70846, "epoch": 421} {"train_loss": -8.878223419189453, "global_step": 70847, "epoch": 421} {"train_loss": -9.000146865844727, "global_step": 70848, "epoch": 421} {"train_loss": -9.01003360748291, "global_step": 70849, "epoch": 421} {"train_loss": -9.061193466186523, "global_step": 70850, "epoch": 421} {"train_loss": -8.997217178344727, "global_step": 70851, "epoch": 421} {"train_loss": -8.944429397583008, "global_step": 70852, "epoch": 421} {"train_loss": -9.075154304504395, "global_step": 70853, "epoch": 421} {"train_loss": -9.07246208190918, "global_step": 70854, "epoch": 421} {"train_loss": -8.925899505615234, "global_step": 70855, "epoch": 421} {"train_loss": -8.950653076171875, "global_step": 70856, "epoch": 421} {"train_loss": -8.859106063842773, "global_step": 70857, "epoch": 421} {"train_loss": -8.90966796875, "global_step": 70858, "epoch": 421} {"train_loss": -8.663949966430664, "global_step": 70859, "epoch": 421} {"train_loss": -9.06875228881836, "global_step": 70860, "epoch": 421} {"train_loss": -8.899930953979492, "global_step": 70861, "epoch": 421} {"train_loss": -9.019553184509277, "global_step": 70862, "epoch": 421} {"train_loss": -8.646528244018555, "global_step": 70863, "epoch": 421} {"train_loss": -8.94528579711914, "global_step": 70864, "epoch": 421} {"train_loss": -9.058340072631836, "global_step": 70865, "epoch": 421} {"train_loss": -9.009893417358398, "global_step": 70866, "epoch": 421} {"train_loss": -8.611847877502441, "global_step": 70867, "epoch": 421} {"train_loss": -9.003896713256836, "global_step": 70868, "epoch": 421} {"train_loss": -9.093829154968262, "global_step": 70869, "epoch": 421} {"train_loss": -9.165426254272461, "global_step": 70870, "epoch": 421} {"train_loss": -8.840052604675293, "global_step": 70871, "epoch": 421} {"train_loss": -9.220388412475586, "global_step": 70872, "epoch": 421} {"train_loss": -8.814803123474121, "global_step": 70873, "epoch": 421} {"train_loss": -9.031928062438965, "global_step": 70874, "epoch": 421} {"train_loss": -8.826311111450195, "global_step": 70875, "epoch": 421} {"train_loss": -9.056961059570312, "global_step": 70876, "epoch": 421} {"train_loss": -9.018659591674805, "global_step": 70877, "epoch": 421} {"train_loss": -9.130805015563965, "global_step": 70878, "epoch": 421} {"train_loss": -8.96019172668457, "global_step": 70879, "epoch": 421} {"train_loss": -8.676552772521973, "global_step": 70880, "epoch": 421} {"train_loss": -8.909442901611328, "global_step": 70881, "epoch": 421} {"train_loss": -8.810043334960938, "global_step": 70882, "epoch": 421} {"train_loss": -9.05921745300293, "global_step": 70883, "epoch": 421} {"train_loss": -8.864803314208984, "global_step": 70884, "epoch": 421} {"train_loss": -8.743334770202637, "global_step": 70885, "epoch": 421} {"train_loss": -8.922496795654297, "global_step": 70886, "epoch": 421} {"train_loss": -8.981598854064941, "global_step": 70887, "epoch": 421} {"train_loss": -9.137468338012695, "global_step": 70888, "epoch": 421} {"train_loss": -8.959550857543945, "global_step": 70889, "epoch": 421} {"train_loss": -8.715873718261719, "global_step": 70890, "epoch": 421} {"train_loss": -9.162689208984375, "global_step": 70891, "epoch": 421} {"train_loss": -8.845224380493164, "global_step": 70892, "epoch": 421} {"train_loss": -9.076969146728516, "global_step": 70893, "epoch": 421} {"train_loss": -8.920557975769043, "global_step": 70894, "epoch": 421} {"train_loss": -8.87486367566245, "global_step": 70895, "epoch": 421, "val_loss": 194245.765625} {"train_loss": -9.001220703125, "global_step": 70896, "epoch": 422} {"train_loss": -8.691291809082031, "global_step": 70897, "epoch": 422} {"train_loss": -9.245448112487793, "global_step": 70898, "epoch": 422} {"train_loss": -8.770133018493652, "global_step": 70899, "epoch": 422} {"train_loss": -9.136219024658203, "global_step": 70900, "epoch": 422} {"train_loss": -8.846553802490234, "global_step": 70901, "epoch": 422} {"train_loss": -8.972905158996582, "global_step": 70902, "epoch": 422} {"train_loss": -8.752264022827148, "global_step": 70903, "epoch": 422} {"train_loss": -9.1206693649292, "global_step": 70904, "epoch": 422} {"train_loss": -8.835689544677734, "global_step": 70905, "epoch": 422} {"train_loss": -9.072306632995605, "global_step": 70906, "epoch": 422} {"train_loss": -8.740145683288574, "global_step": 70907, "epoch": 422} {"train_loss": -9.120344161987305, "global_step": 70908, "epoch": 422} {"train_loss": -8.718229293823242, "global_step": 70909, "epoch": 422} {"train_loss": -8.905403137207031, "global_step": 70910, "epoch": 422} {"train_loss": -8.934642791748047, "global_step": 70911, "epoch": 422} {"train_loss": -8.629897117614746, "global_step": 70912, "epoch": 422} {"train_loss": -8.989916801452637, "global_step": 70913, "epoch": 422} {"train_loss": -8.960878372192383, "global_step": 70914, "epoch": 422} {"train_loss": -8.898810386657715, "global_step": 70915, "epoch": 422} {"train_loss": -9.047746658325195, "global_step": 70916, "epoch": 422} {"train_loss": -8.617033004760742, "global_step": 70917, "epoch": 422} {"train_loss": -8.901998519897461, "global_step": 70918, "epoch": 422} {"train_loss": -9.037759780883789, "global_step": 70919, "epoch": 422} {"train_loss": -9.120128631591797, "global_step": 70920, "epoch": 422} {"train_loss": -8.941133499145508, "global_step": 70921, "epoch": 422} {"train_loss": -9.2055082321167, "global_step": 70922, "epoch": 422} {"train_loss": -8.987271308898926, "global_step": 70923, "epoch": 422} {"train_loss": -9.00014877319336, "global_step": 70924, "epoch": 422} {"train_loss": -8.834253311157227, "global_step": 70925, "epoch": 422} {"train_loss": -8.871580123901367, "global_step": 70926, "epoch": 422} {"train_loss": -9.067708015441895, "global_step": 70927, "epoch": 422} {"train_loss": -8.979324340820312, "global_step": 70928, "epoch": 422} {"train_loss": -9.237924575805664, "global_step": 70929, "epoch": 422} {"train_loss": -9.07504653930664, "global_step": 70930, "epoch": 422} {"train_loss": -8.8997802734375, "global_step": 70931, "epoch": 422} {"train_loss": -8.848520278930664, "global_step": 70932, "epoch": 422} {"train_loss": -8.99847412109375, "global_step": 70933, "epoch": 422} {"train_loss": -9.136682510375977, "global_step": 70934, "epoch": 422} {"train_loss": -8.897582054138184, "global_step": 70935, "epoch": 422} {"train_loss": -8.810541152954102, "global_step": 70936, "epoch": 422} {"train_loss": -9.09776782989502, "global_step": 70937, "epoch": 422} {"train_loss": -9.035065650939941, "global_step": 70938, "epoch": 422} {"train_loss": -8.953425407409668, "global_step": 70939, "epoch": 422} {"train_loss": -8.806802749633789, "global_step": 70940, "epoch": 422} {"train_loss": -8.985218048095703, "global_step": 70941, "epoch": 422} {"train_loss": -8.963438987731934, "global_step": 70942, "epoch": 422} {"train_loss": -8.95041561126709, "global_step": 70943, "epoch": 422} {"train_loss": -9.05230712890625, "global_step": 70944, "epoch": 422} {"train_loss": -9.128872871398926, "global_step": 70945, "epoch": 422} {"train_loss": -8.930110931396484, "global_step": 70946, "epoch": 422} {"train_loss": -8.987014770507812, "global_step": 70947, "epoch": 422} {"train_loss": -9.084341049194336, "global_step": 70948, "epoch": 422} {"train_loss": -8.89451789855957, "global_step": 70949, "epoch": 422} {"train_loss": -8.886096000671387, "global_step": 70950, "epoch": 422} {"train_loss": -9.04398250579834, "global_step": 70951, "epoch": 422} {"train_loss": -8.849661827087402, "global_step": 70952, "epoch": 422} {"train_loss": -8.628003120422363, "global_step": 70953, "epoch": 422} {"train_loss": -8.811338424682617, "global_step": 70954, "epoch": 422} {"train_loss": -8.673812866210938, "global_step": 70955, "epoch": 422} {"train_loss": -9.100939750671387, "global_step": 70956, "epoch": 422} {"train_loss": -8.935586929321289, "global_step": 70957, "epoch": 422} {"train_loss": -8.87240219116211, "global_step": 70958, "epoch": 422} {"train_loss": -9.042550086975098, "global_step": 70959, "epoch": 422} {"train_loss": -8.937713623046875, "global_step": 70960, "epoch": 422} {"train_loss": -8.978436470031738, "global_step": 70961, "epoch": 422} {"train_loss": -9.014666557312012, "global_step": 70962, "epoch": 422} {"train_loss": -8.912084579467773, "global_step": 70963, "epoch": 422} {"train_loss": -8.980595588684082, "global_step": 70964, "epoch": 422} {"train_loss": -9.04873275756836, "global_step": 70965, "epoch": 422} {"train_loss": -9.005904197692871, "global_step": 70966, "epoch": 422} {"train_loss": -8.730683326721191, "global_step": 70967, "epoch": 422} {"train_loss": -8.951327323913574, "global_step": 70968, "epoch": 422} {"train_loss": -8.740415573120117, "global_step": 70969, "epoch": 422} {"train_loss": -8.7908296585083, "global_step": 70970, "epoch": 422} {"train_loss": -8.866544723510742, "global_step": 70971, "epoch": 422} {"train_loss": -8.864436149597168, "global_step": 70972, "epoch": 422} {"train_loss": -8.906423568725586, "global_step": 70973, "epoch": 422} {"train_loss": -8.892988204956055, "global_step": 70974, "epoch": 422} {"train_loss": -9.184992790222168, "global_step": 70975, "epoch": 422} {"train_loss": -8.960332870483398, "global_step": 70976, "epoch": 422} {"train_loss": -9.184446334838867, "global_step": 70977, "epoch": 422} {"train_loss": -9.02592658996582, "global_step": 70978, "epoch": 422} {"train_loss": -9.013114929199219, "global_step": 70979, "epoch": 422} {"train_loss": -8.932672500610352, "global_step": 70980, "epoch": 422} {"train_loss": -8.863330841064453, "global_step": 70981, "epoch": 422} {"train_loss": -9.289389610290527, "global_step": 70982, "epoch": 422} {"train_loss": -8.967633247375488, "global_step": 70983, "epoch": 422} {"train_loss": -8.997900009155273, "global_step": 70984, "epoch": 422} {"train_loss": -9.074389457702637, "global_step": 70985, "epoch": 422} {"train_loss": -8.931487083435059, "global_step": 70986, "epoch": 422} {"train_loss": -8.855897903442383, "global_step": 70987, "epoch": 422} {"train_loss": -9.145416259765625, "global_step": 70988, "epoch": 422} {"train_loss": -9.030719757080078, "global_step": 70989, "epoch": 422} {"train_loss": -9.112625122070312, "global_step": 70990, "epoch": 422} {"train_loss": -8.992681503295898, "global_step": 70991, "epoch": 422} {"train_loss": -9.178173065185547, "global_step": 70992, "epoch": 422} {"train_loss": -9.015329360961914, "global_step": 70993, "epoch": 422} {"train_loss": -8.863930702209473, "global_step": 70994, "epoch": 422} {"train_loss": -9.02802848815918, "global_step": 70995, "epoch": 422} {"train_loss": -8.599370002746582, "global_step": 70996, "epoch": 422} {"train_loss": -8.88697338104248, "global_step": 70997, "epoch": 422} {"train_loss": -8.764019012451172, "global_step": 70998, "epoch": 422} {"train_loss": -8.854403495788574, "global_step": 70999, "epoch": 422} {"train_loss": -8.559206008911133, "global_step": 71000, "epoch": 422} {"train_loss": -9.04842758178711, "global_step": 71001, "epoch": 422} {"train_loss": -8.460031509399414, "global_step": 71002, "epoch": 422} {"train_loss": -9.223440170288086, "global_step": 71003, "epoch": 422} {"train_loss": -8.667985916137695, "global_step": 71004, "epoch": 422} {"train_loss": -8.923710823059082, "global_step": 71005, "epoch": 422} {"train_loss": -8.90245246887207, "global_step": 71006, "epoch": 422} {"train_loss": -9.017541885375977, "global_step": 71007, "epoch": 422} {"train_loss": -8.788811683654785, "global_step": 71008, "epoch": 422} {"train_loss": -9.039612770080566, "global_step": 71009, "epoch": 422} {"train_loss": -8.758010864257812, "global_step": 71010, "epoch": 422} {"train_loss": -9.004241943359375, "global_step": 71011, "epoch": 422} {"train_loss": -8.89029312133789, "global_step": 71012, "epoch": 422} {"train_loss": -8.792055130004883, "global_step": 71013, "epoch": 422} {"train_loss": -9.086861610412598, "global_step": 71014, "epoch": 422} {"train_loss": -8.986311912536621, "global_step": 71015, "epoch": 422} {"train_loss": -9.06097412109375, "global_step": 71016, "epoch": 422} {"train_loss": -8.998459815979004, "global_step": 71017, "epoch": 422} {"train_loss": -9.029406547546387, "global_step": 71018, "epoch": 422} {"train_loss": -8.8049955368042, "global_step": 71019, "epoch": 422} {"train_loss": -8.870805740356445, "global_step": 71020, "epoch": 422} {"train_loss": -9.189491271972656, "global_step": 71021, "epoch": 422} {"train_loss": -9.00023078918457, "global_step": 71022, "epoch": 422} {"train_loss": -9.063557624816895, "global_step": 71023, "epoch": 422} {"train_loss": -9.262046813964844, "global_step": 71024, "epoch": 422} {"train_loss": -8.507476806640625, "global_step": 71025, "epoch": 422} {"train_loss": -8.989250183105469, "global_step": 71026, "epoch": 422} {"train_loss": -8.672809600830078, "global_step": 71027, "epoch": 422} {"train_loss": -8.572174072265625, "global_step": 71028, "epoch": 422} {"train_loss": -8.788208961486816, "global_step": 71029, "epoch": 422} {"train_loss": -8.548286437988281, "global_step": 71030, "epoch": 422} {"train_loss": -8.973612785339355, "global_step": 71031, "epoch": 422} {"train_loss": -8.78768253326416, "global_step": 71032, "epoch": 422} {"train_loss": -8.906429290771484, "global_step": 71033, "epoch": 422} {"train_loss": -8.983013153076172, "global_step": 71034, "epoch": 422} {"train_loss": -8.744840621948242, "global_step": 71035, "epoch": 422} {"train_loss": -8.7915678024292, "global_step": 71036, "epoch": 422} {"train_loss": -8.951119422912598, "global_step": 71037, "epoch": 422} {"train_loss": -8.771815299987793, "global_step": 71038, "epoch": 422} {"train_loss": -8.756522178649902, "global_step": 71039, "epoch": 422} {"train_loss": -8.974950790405273, "global_step": 71040, "epoch": 422} {"train_loss": -8.764419555664062, "global_step": 71041, "epoch": 422} {"train_loss": -8.706404685974121, "global_step": 71042, "epoch": 422} {"train_loss": -8.727620124816895, "global_step": 71043, "epoch": 422} {"train_loss": -9.174148559570312, "global_step": 71044, "epoch": 422} {"train_loss": -8.828094482421875, "global_step": 71045, "epoch": 422} {"train_loss": -8.660568237304688, "global_step": 71046, "epoch": 422} {"train_loss": -8.783093452453613, "global_step": 71047, "epoch": 422} {"train_loss": -8.865697860717773, "global_step": 71048, "epoch": 422} {"train_loss": -9.06173324584961, "global_step": 71049, "epoch": 422} {"train_loss": -8.819314002990723, "global_step": 71050, "epoch": 422} {"train_loss": -9.024662971496582, "global_step": 71051, "epoch": 422} {"train_loss": -8.878339767456055, "global_step": 71052, "epoch": 422} {"train_loss": -9.151140213012695, "global_step": 71053, "epoch": 422} {"train_loss": -9.080894470214844, "global_step": 71054, "epoch": 422} {"train_loss": -8.800524711608887, "global_step": 71055, "epoch": 422} {"train_loss": -8.967538833618164, "global_step": 71056, "epoch": 422} {"train_loss": -8.939172744750977, "global_step": 71057, "epoch": 422} {"train_loss": -8.910928726196289, "global_step": 71058, "epoch": 422} {"train_loss": -8.934602737426758, "global_step": 71059, "epoch": 422} {"train_loss": -8.68334674835205, "global_step": 71060, "epoch": 422} {"train_loss": -9.081664085388184, "global_step": 71061, "epoch": 422} {"train_loss": -8.918462753295898, "global_step": 71062, "epoch": 422} {"train_loss": -8.926313133466811, "global_step": 71063, "epoch": 422, "val_loss": 194331.03125} {"train_loss": -8.890275955200195, "global_step": 71064, "epoch": 423} {"train_loss": -8.90065860748291, "global_step": 71065, "epoch": 423} {"train_loss": -8.834171295166016, "global_step": 71066, "epoch": 423} {"train_loss": -8.738351821899414, "global_step": 71067, "epoch": 423} {"train_loss": -9.060081481933594, "global_step": 71068, "epoch": 423} {"train_loss": -8.985776901245117, "global_step": 71069, "epoch": 423} {"train_loss": -8.992473602294922, "global_step": 71070, "epoch": 423} {"train_loss": -8.936505317687988, "global_step": 71071, "epoch": 423} {"train_loss": -8.966009140014648, "global_step": 71072, "epoch": 423} {"train_loss": -9.078734397888184, "global_step": 71073, "epoch": 423} {"train_loss": -9.051278114318848, "global_step": 71074, "epoch": 423} {"train_loss": -8.911895751953125, "global_step": 71075, "epoch": 423} {"train_loss": -8.970078468322754, "global_step": 71076, "epoch": 423} {"train_loss": -8.734159469604492, "global_step": 71077, "epoch": 423} {"train_loss": -8.909536361694336, "global_step": 71078, "epoch": 423} {"train_loss": -8.979957580566406, "global_step": 71079, "epoch": 423} {"train_loss": -8.97117805480957, "global_step": 71080, "epoch": 423} {"train_loss": -9.151165962219238, "global_step": 71081, "epoch": 423} {"train_loss": -9.030994415283203, "global_step": 71082, "epoch": 423} {"train_loss": -9.03289794921875, "global_step": 71083, "epoch": 423} {"train_loss": -9.025482177734375, "global_step": 71084, "epoch": 423} {"train_loss": -8.739303588867188, "global_step": 71085, "epoch": 423} {"train_loss": -8.95017147064209, "global_step": 71086, "epoch": 423} {"train_loss": -9.186981201171875, "global_step": 71087, "epoch": 423} {"train_loss": -9.071355819702148, "global_step": 71088, "epoch": 423} {"train_loss": -9.216615676879883, "global_step": 71089, "epoch": 423} {"train_loss": -9.142478942871094, "global_step": 71090, "epoch": 423} {"train_loss": -8.80583381652832, "global_step": 71091, "epoch": 423} {"train_loss": -8.866765975952148, "global_step": 71092, "epoch": 423} {"train_loss": -9.020256042480469, "global_step": 71093, "epoch": 423} {"train_loss": -9.153932571411133, "global_step": 71094, "epoch": 423} {"train_loss": -9.10284423828125, "global_step": 71095, "epoch": 423} {"train_loss": -8.790306091308594, "global_step": 71096, "epoch": 423} {"train_loss": -9.176904678344727, "global_step": 71097, "epoch": 423} {"train_loss": -9.001983642578125, "global_step": 71098, "epoch": 423} {"train_loss": -9.074755668640137, "global_step": 71099, "epoch": 423} {"train_loss": -8.938011169433594, "global_step": 71100, "epoch": 423} {"train_loss": -8.929872512817383, "global_step": 71101, "epoch": 423} {"train_loss": -9.098811149597168, "global_step": 71102, "epoch": 423} {"train_loss": -8.902366638183594, "global_step": 71103, "epoch": 423} {"train_loss": -8.978981018066406, "global_step": 71104, "epoch": 423} {"train_loss": -9.239032745361328, "global_step": 71105, "epoch": 423} {"train_loss": -8.402339935302734, "global_step": 71106, "epoch": 423} {"train_loss": -9.080301284790039, "global_step": 71107, "epoch": 423} {"train_loss": -8.86199951171875, "global_step": 71108, "epoch": 423} {"train_loss": -8.742178916931152, "global_step": 71109, "epoch": 423} {"train_loss": -8.828848838806152, "global_step": 71110, "epoch": 423} {"train_loss": -8.778617858886719, "global_step": 71111, "epoch": 423} {"train_loss": -8.967388153076172, "global_step": 71112, "epoch": 423} {"train_loss": -8.962353706359863, "global_step": 71113, "epoch": 423} {"train_loss": -9.211593627929688, "global_step": 71114, "epoch": 423} {"train_loss": -8.966048240661621, "global_step": 71115, "epoch": 423} {"train_loss": -9.134002685546875, "global_step": 71116, "epoch": 423} {"train_loss": -9.088424682617188, "global_step": 71117, "epoch": 423} {"train_loss": -8.823816299438477, "global_step": 71118, "epoch": 423} {"train_loss": -8.998000144958496, "global_step": 71119, "epoch": 423} {"train_loss": -9.215539932250977, "global_step": 71120, "epoch": 423} {"train_loss": -9.1565580368042, "global_step": 71121, "epoch": 423} {"train_loss": -9.02299976348877, "global_step": 71122, "epoch": 423} {"train_loss": -9.181872367858887, "global_step": 71123, "epoch": 423} {"train_loss": -8.913344383239746, "global_step": 71124, "epoch": 423} {"train_loss": -9.038734436035156, "global_step": 71125, "epoch": 423} {"train_loss": -9.257814407348633, "global_step": 71126, "epoch": 423} {"train_loss": -9.093881607055664, "global_step": 71127, "epoch": 423} {"train_loss": -9.251775741577148, "global_step": 71128, "epoch": 423} {"train_loss": -9.223227500915527, "global_step": 71129, "epoch": 423} {"train_loss": -8.912073135375977, "global_step": 71130, "epoch": 423} {"train_loss": -8.974505424499512, "global_step": 71131, "epoch": 423} {"train_loss": -9.033269882202148, "global_step": 71132, "epoch": 423} {"train_loss": -9.168352127075195, "global_step": 71133, "epoch": 423} {"train_loss": -8.876429557800293, "global_step": 71134, "epoch": 423} {"train_loss": -9.178610801696777, "global_step": 71135, "epoch": 423} {"train_loss": -9.202146530151367, "global_step": 71136, "epoch": 423} {"train_loss": -9.079258918762207, "global_step": 71137, "epoch": 423} {"train_loss": -8.926584243774414, "global_step": 71138, "epoch": 423} {"train_loss": -8.772490501403809, "global_step": 71139, "epoch": 423} {"train_loss": -9.092493057250977, "global_step": 71140, "epoch": 423} {"train_loss": -9.036871910095215, "global_step": 71141, "epoch": 423} {"train_loss": -9.18262767791748, "global_step": 71142, "epoch": 423} {"train_loss": -9.044055938720703, "global_step": 71143, "epoch": 423} {"train_loss": -8.903564453125, "global_step": 71144, "epoch": 423} {"train_loss": -8.949773788452148, "global_step": 71145, "epoch": 423} {"train_loss": -8.826282501220703, "global_step": 71146, "epoch": 423} {"train_loss": -8.88229751586914, "global_step": 71147, "epoch": 423} {"train_loss": -8.503673553466797, "global_step": 71148, "epoch": 423} {"train_loss": -8.89786148071289, "global_step": 71149, "epoch": 423} {"train_loss": -8.801222801208496, "global_step": 71150, "epoch": 423} {"train_loss": -8.943359375, "global_step": 71151, "epoch": 423} {"train_loss": -8.765714645385742, "global_step": 71152, "epoch": 423} {"train_loss": -8.980339050292969, "global_step": 71153, "epoch": 423} {"train_loss": -8.686680793762207, "global_step": 71154, "epoch": 423} {"train_loss": -9.012663841247559, "global_step": 71155, "epoch": 423} {"train_loss": -8.898847579956055, "global_step": 71156, "epoch": 423} {"train_loss": -8.907933235168457, "global_step": 71157, "epoch": 423} {"train_loss": -8.340020179748535, "global_step": 71158, "epoch": 423} {"train_loss": -8.860830307006836, "global_step": 71159, "epoch": 423} {"train_loss": -8.568897247314453, "global_step": 71160, "epoch": 423} {"train_loss": -8.69717788696289, "global_step": 71161, "epoch": 423} {"train_loss": -8.856486320495605, "global_step": 71162, "epoch": 423} {"train_loss": -8.798561096191406, "global_step": 71163, "epoch": 423} {"train_loss": -8.756072998046875, "global_step": 71164, "epoch": 423} {"train_loss": -8.863529205322266, "global_step": 71165, "epoch": 423} {"train_loss": -8.722047805786133, "global_step": 71166, "epoch": 423} {"train_loss": -8.852781295776367, "global_step": 71167, "epoch": 423} {"train_loss": -8.84228515625, "global_step": 71168, "epoch": 423} {"train_loss": -8.791906356811523, "global_step": 71169, "epoch": 423} {"train_loss": -8.911783218383789, "global_step": 71170, "epoch": 423} {"train_loss": -8.85598087310791, "global_step": 71171, "epoch": 423} {"train_loss": -8.910971641540527, "global_step": 71172, "epoch": 423} {"train_loss": -9.005428314208984, "global_step": 71173, "epoch": 423} {"train_loss": -8.920512199401855, "global_step": 71174, "epoch": 423} {"train_loss": -8.756538391113281, "global_step": 71175, "epoch": 423} {"train_loss": -9.194432258605957, "global_step": 71176, "epoch": 423} {"train_loss": -8.797185897827148, "global_step": 71177, "epoch": 423} {"train_loss": -8.9917631149292, "global_step": 71178, "epoch": 423} {"train_loss": -8.976602554321289, "global_step": 71179, "epoch": 423} {"train_loss": -9.027059555053711, "global_step": 71180, "epoch": 423} {"train_loss": -8.792065620422363, "global_step": 71181, "epoch": 423} {"train_loss": -8.950477600097656, "global_step": 71182, "epoch": 423} {"train_loss": -8.920458793640137, "global_step": 71183, "epoch": 423} {"train_loss": -8.848731994628906, "global_step": 71184, "epoch": 423} {"train_loss": -9.092193603515625, "global_step": 71185, "epoch": 423} {"train_loss": -9.016962051391602, "global_step": 71186, "epoch": 423} {"train_loss": -9.174653053283691, "global_step": 71187, "epoch": 423} {"train_loss": -9.117809295654297, "global_step": 71188, "epoch": 423} {"train_loss": -9.024642944335938, "global_step": 71189, "epoch": 423} {"train_loss": -8.95838451385498, "global_step": 71190, "epoch": 423} {"train_loss": -9.107746124267578, "global_step": 71191, "epoch": 423} {"train_loss": -9.173518180847168, "global_step": 71192, "epoch": 423} {"train_loss": -8.923527717590332, "global_step": 71193, "epoch": 423} {"train_loss": -8.974180221557617, "global_step": 71194, "epoch": 423} {"train_loss": -9.248154640197754, "global_step": 71195, "epoch": 423} {"train_loss": -9.230365753173828, "global_step": 71196, "epoch": 423} {"train_loss": -9.016271591186523, "global_step": 71197, "epoch": 423} {"train_loss": -9.241914749145508, "global_step": 71198, "epoch": 423} {"train_loss": -9.151264190673828, "global_step": 71199, "epoch": 423} {"train_loss": -8.781108856201172, "global_step": 71200, "epoch": 423} {"train_loss": -8.8202543258667, "global_step": 71201, "epoch": 423} {"train_loss": -9.081180572509766, "global_step": 71202, "epoch": 423} {"train_loss": -8.990650177001953, "global_step": 71203, "epoch": 423} {"train_loss": -8.608144760131836, "global_step": 71204, "epoch": 423} {"train_loss": -8.741286277770996, "global_step": 71205, "epoch": 423} {"train_loss": -8.828470230102539, "global_step": 71206, "epoch": 423} {"train_loss": -8.521324157714844, "global_step": 71207, "epoch": 423} {"train_loss": -8.509105682373047, "global_step": 71208, "epoch": 423} {"train_loss": -8.719036102294922, "global_step": 71209, "epoch": 423} {"train_loss": -8.588661193847656, "global_step": 71210, "epoch": 423} {"train_loss": -8.772844314575195, "global_step": 71211, "epoch": 423} {"train_loss": -8.834278106689453, "global_step": 71212, "epoch": 423} {"train_loss": -8.748878479003906, "global_step": 71213, "epoch": 423} {"train_loss": -8.886235237121582, "global_step": 71214, "epoch": 423} {"train_loss": -8.55489730834961, "global_step": 71215, "epoch": 423} {"train_loss": -8.605379104614258, "global_step": 71216, "epoch": 423} {"train_loss": -8.785562515258789, "global_step": 71217, "epoch": 423} {"train_loss": -8.927236557006836, "global_step": 71218, "epoch": 423} {"train_loss": -8.624375343322754, "global_step": 71219, "epoch": 423} {"train_loss": -8.688610076904297, "global_step": 71220, "epoch": 423} {"train_loss": -9.009129524230957, "global_step": 71221, "epoch": 423} {"train_loss": -8.726785659790039, "global_step": 71222, "epoch": 423} {"train_loss": -8.767736434936523, "global_step": 71223, "epoch": 423} {"train_loss": -9.042010307312012, "global_step": 71224, "epoch": 423} {"train_loss": -8.872894287109375, "global_step": 71225, "epoch": 423} {"train_loss": -8.927033424377441, "global_step": 71226, "epoch": 423} {"train_loss": -8.9368896484375, "global_step": 71227, "epoch": 423} {"train_loss": -8.96046257019043, "global_step": 71228, "epoch": 423} {"train_loss": -8.734298706054688, "global_step": 71229, "epoch": 423} {"train_loss": -8.828205108642578, "global_step": 71230, "epoch": 423} {"train_loss": -8.934598059881301, "global_step": 71231, "epoch": 423, "val_loss": 193446.859375} {"train_loss": -8.921403884887695, "global_step": 71232, "epoch": 424} {"train_loss": -8.815113067626953, "global_step": 71233, "epoch": 424} {"train_loss": -8.999956130981445, "global_step": 71234, "epoch": 424} {"train_loss": -8.947114944458008, "global_step": 71235, "epoch": 424} {"train_loss": -8.784740447998047, "global_step": 71236, "epoch": 424} {"train_loss": -8.962043762207031, "global_step": 71237, "epoch": 424} {"train_loss": -9.034618377685547, "global_step": 71238, "epoch": 424} {"train_loss": -8.923300743103027, "global_step": 71239, "epoch": 424} {"train_loss": -8.965775489807129, "global_step": 71240, "epoch": 424} {"train_loss": -9.071304321289062, "global_step": 71241, "epoch": 424} {"train_loss": -8.976969718933105, "global_step": 71242, "epoch": 424} {"train_loss": -8.847625732421875, "global_step": 71243, "epoch": 424} {"train_loss": -9.038976669311523, "global_step": 71244, "epoch": 424} {"train_loss": -8.9878568649292, "global_step": 71245, "epoch": 424} {"train_loss": -9.015372276306152, "global_step": 71246, "epoch": 424} {"train_loss": -8.979532241821289, "global_step": 71247, "epoch": 424} {"train_loss": -9.246492385864258, "global_step": 71248, "epoch": 424} {"train_loss": -8.894859313964844, "global_step": 71249, "epoch": 424} {"train_loss": -9.103199005126953, "global_step": 71250, "epoch": 424} {"train_loss": -9.140937805175781, "global_step": 71251, "epoch": 424} {"train_loss": -8.906492233276367, "global_step": 71252, "epoch": 424} {"train_loss": -9.144514083862305, "global_step": 71253, "epoch": 424} {"train_loss": -8.96035385131836, "global_step": 71254, "epoch": 424} {"train_loss": -9.176569938659668, "global_step": 71255, "epoch": 424} {"train_loss": -8.882230758666992, "global_step": 71256, "epoch": 424} {"train_loss": -9.028705596923828, "global_step": 71257, "epoch": 424} {"train_loss": -8.932610511779785, "global_step": 71258, "epoch": 424} {"train_loss": -8.928874969482422, "global_step": 71259, "epoch": 424} {"train_loss": -8.955985069274902, "global_step": 71260, "epoch": 424} {"train_loss": -9.218925476074219, "global_step": 71261, "epoch": 424} {"train_loss": -9.03687572479248, "global_step": 71262, "epoch": 424} {"train_loss": -9.182914733886719, "global_step": 71263, "epoch": 424} {"train_loss": -8.836654663085938, "global_step": 71264, "epoch": 424} {"train_loss": -9.149602890014648, "global_step": 71265, "epoch": 424} {"train_loss": -8.850048065185547, "global_step": 71266, "epoch": 424} {"train_loss": -8.920631408691406, "global_step": 71267, "epoch": 424} {"train_loss": -9.254072189331055, "global_step": 71268, "epoch": 424} {"train_loss": -8.768798828125, "global_step": 71269, "epoch": 424} {"train_loss": -8.876152038574219, "global_step": 71270, "epoch": 424} {"train_loss": -8.923565864562988, "global_step": 71271, "epoch": 424} {"train_loss": -8.889114379882812, "global_step": 71272, "epoch": 424} {"train_loss": -8.65369987487793, "global_step": 71273, "epoch": 424} {"train_loss": -8.814138412475586, "global_step": 71274, "epoch": 424} {"train_loss": -9.132040023803711, "global_step": 71275, "epoch": 424} {"train_loss": -8.878646850585938, "global_step": 71276, "epoch": 424} {"train_loss": -8.772947311401367, "global_step": 71277, "epoch": 424} {"train_loss": -9.111614227294922, "global_step": 71278, "epoch": 424} {"train_loss": -9.15571117401123, "global_step": 71279, "epoch": 424} {"train_loss": -8.92902946472168, "global_step": 71280, "epoch": 424} {"train_loss": -9.171619415283203, "global_step": 71281, "epoch": 424} {"train_loss": -9.201455116271973, "global_step": 71282, "epoch": 424} {"train_loss": -9.219488143920898, "global_step": 71283, "epoch": 424} {"train_loss": -9.098260879516602, "global_step": 71284, "epoch": 424} {"train_loss": -8.830525398254395, "global_step": 71285, "epoch": 424} {"train_loss": -8.969340324401855, "global_step": 71286, "epoch": 424} {"train_loss": -9.174418449401855, "global_step": 71287, "epoch": 424} {"train_loss": -9.104616165161133, "global_step": 71288, "epoch": 424} {"train_loss": -9.034618377685547, "global_step": 71289, "epoch": 424} {"train_loss": -8.991390228271484, "global_step": 71290, "epoch": 424} {"train_loss": -8.959646224975586, "global_step": 71291, "epoch": 424} {"train_loss": -9.028359413146973, "global_step": 71292, "epoch": 424} {"train_loss": -9.051528930664062, "global_step": 71293, "epoch": 424} {"train_loss": -9.062920570373535, "global_step": 71294, "epoch": 424} {"train_loss": -9.01207160949707, "global_step": 71295, "epoch": 424} {"train_loss": -9.264892578125, "global_step": 71296, "epoch": 424} {"train_loss": -9.14895248413086, "global_step": 71297, "epoch": 424} {"train_loss": -8.983388900756836, "global_step": 71298, "epoch": 424} {"train_loss": -8.896160125732422, "global_step": 71299, "epoch": 424} {"train_loss": -8.998701095581055, "global_step": 71300, "epoch": 424} {"train_loss": -9.193994522094727, "global_step": 71301, "epoch": 424} {"train_loss": -8.944450378417969, "global_step": 71302, "epoch": 424} {"train_loss": -8.913064956665039, "global_step": 71303, "epoch": 424} {"train_loss": -8.947248458862305, "global_step": 71304, "epoch": 424} {"train_loss": -9.050209045410156, "global_step": 71305, "epoch": 424} {"train_loss": -8.98038101196289, "global_step": 71306, "epoch": 424} {"train_loss": -8.963312149047852, "global_step": 71307, "epoch": 424} {"train_loss": -8.8883056640625, "global_step": 71308, "epoch": 424} {"train_loss": -8.961246490478516, "global_step": 71309, "epoch": 424} {"train_loss": -8.807985305786133, "global_step": 71310, "epoch": 424} {"train_loss": -8.848738670349121, "global_step": 71311, "epoch": 424} {"train_loss": -8.849783897399902, "global_step": 71312, "epoch": 424} {"train_loss": -9.099899291992188, "global_step": 71313, "epoch": 424} {"train_loss": -8.931676864624023, "global_step": 71314, "epoch": 424} {"train_loss": -8.999401092529297, "global_step": 71315, "epoch": 424} {"train_loss": -8.603800773620605, "global_step": 71316, "epoch": 424} {"train_loss": -8.959200859069824, "global_step": 71317, "epoch": 424} {"train_loss": -8.68018913269043, "global_step": 71318, "epoch": 424} {"train_loss": -8.87299919128418, "global_step": 71319, "epoch": 424} {"train_loss": -8.702641487121582, "global_step": 71320, "epoch": 424} {"train_loss": -9.112979888916016, "global_step": 71321, "epoch": 424} {"train_loss": -8.406490325927734, "global_step": 71322, "epoch": 424} {"train_loss": -8.830171585083008, "global_step": 71323, "epoch": 424} {"train_loss": -8.886711120605469, "global_step": 71324, "epoch": 424} {"train_loss": -8.889606475830078, "global_step": 71325, "epoch": 424} {"train_loss": -9.18250846862793, "global_step": 71326, "epoch": 424} {"train_loss": -9.02204418182373, "global_step": 71327, "epoch": 424} {"train_loss": -8.796285629272461, "global_step": 71328, "epoch": 424} {"train_loss": -9.08700180053711, "global_step": 71329, "epoch": 424} {"train_loss": -8.937206268310547, "global_step": 71330, "epoch": 424} {"train_loss": -9.049009323120117, "global_step": 71331, "epoch": 424} {"train_loss": -8.884307861328125, "global_step": 71332, "epoch": 424} {"train_loss": -9.139713287353516, "global_step": 71333, "epoch": 424} {"train_loss": -8.899280548095703, "global_step": 71334, "epoch": 424} {"train_loss": -9.024251937866211, "global_step": 71335, "epoch": 424} {"train_loss": -9.123769760131836, "global_step": 71336, "epoch": 424} {"train_loss": -9.05225944519043, "global_step": 71337, "epoch": 424} {"train_loss": -9.098410606384277, "global_step": 71338, "epoch": 424} {"train_loss": -9.170668601989746, "global_step": 71339, "epoch": 424} {"train_loss": -9.044014930725098, "global_step": 71340, "epoch": 424} {"train_loss": -9.07044792175293, "global_step": 71341, "epoch": 424} {"train_loss": -9.262856483459473, "global_step": 71342, "epoch": 424} {"train_loss": -8.918251037597656, "global_step": 71343, "epoch": 424} {"train_loss": -8.919979095458984, "global_step": 71344, "epoch": 424} {"train_loss": -8.947324752807617, "global_step": 71345, "epoch": 424} {"train_loss": -8.965383529663086, "global_step": 71346, "epoch": 424} {"train_loss": -8.720109939575195, "global_step": 71347, "epoch": 424} {"train_loss": -9.005975723266602, "global_step": 71348, "epoch": 424} {"train_loss": -8.183675765991211, "global_step": 71349, "epoch": 424} {"train_loss": -8.708992004394531, "global_step": 71350, "epoch": 424} {"train_loss": -8.644805908203125, "global_step": 71351, "epoch": 424} {"train_loss": -8.932294845581055, "global_step": 71352, "epoch": 424} {"train_loss": -8.362005233764648, "global_step": 71353, "epoch": 424} {"train_loss": -8.779914855957031, "global_step": 71354, "epoch": 424} {"train_loss": -8.726423263549805, "global_step": 71355, "epoch": 424} {"train_loss": -8.728412628173828, "global_step": 71356, "epoch": 424} {"train_loss": -8.398248672485352, "global_step": 71357, "epoch": 424} {"train_loss": -8.741440773010254, "global_step": 71358, "epoch": 424} {"train_loss": -8.695934295654297, "global_step": 71359, "epoch": 424} {"train_loss": -8.560498237609863, "global_step": 71360, "epoch": 424} {"train_loss": -8.844220161437988, "global_step": 71361, "epoch": 424} {"train_loss": -8.768315315246582, "global_step": 71362, "epoch": 424} {"train_loss": -8.6402006149292, "global_step": 71363, "epoch": 424} {"train_loss": -8.601221084594727, "global_step": 71364, "epoch": 424} {"train_loss": -8.453425407409668, "global_step": 71365, "epoch": 424} {"train_loss": -8.840354919433594, "global_step": 71366, "epoch": 424} {"train_loss": -8.639883041381836, "global_step": 71367, "epoch": 424} {"train_loss": -8.516839981079102, "global_step": 71368, "epoch": 424} {"train_loss": -8.845735549926758, "global_step": 71369, "epoch": 424} {"train_loss": -8.880854606628418, "global_step": 71370, "epoch": 424} {"train_loss": -8.974466323852539, "global_step": 71371, "epoch": 424} {"train_loss": -8.62325382232666, "global_step": 71372, "epoch": 424} {"train_loss": -8.982081413269043, "global_step": 71373, "epoch": 424} {"train_loss": -8.959136962890625, "global_step": 71374, "epoch": 424} {"train_loss": -8.885229110717773, "global_step": 71375, "epoch": 424} {"train_loss": -9.042753219604492, "global_step": 71376, "epoch": 424} {"train_loss": -8.90553092956543, "global_step": 71377, "epoch": 424} {"train_loss": -8.899903297424316, "global_step": 71378, "epoch": 424} {"train_loss": -9.018770217895508, "global_step": 71379, "epoch": 424} {"train_loss": -8.84310531616211, "global_step": 71380, "epoch": 424} {"train_loss": -9.177392959594727, "global_step": 71381, "epoch": 424} {"train_loss": -9.135406494140625, "global_step": 71382, "epoch": 424} {"train_loss": -8.99477767944336, "global_step": 71383, "epoch": 424} {"train_loss": -9.31754207611084, "global_step": 71384, "epoch": 424} {"train_loss": -8.814465522766113, "global_step": 71385, "epoch": 424} {"train_loss": -9.08993148803711, "global_step": 71386, "epoch": 424} {"train_loss": -8.811269760131836, "global_step": 71387, "epoch": 424} {"train_loss": -8.963630676269531, "global_step": 71388, "epoch": 424} {"train_loss": -9.147562980651855, "global_step": 71389, "epoch": 424} {"train_loss": -9.058855056762695, "global_step": 71390, "epoch": 424} {"train_loss": -8.89865779876709, "global_step": 71391, "epoch": 424} {"train_loss": -9.060103416442871, "global_step": 71392, "epoch": 424} {"train_loss": -9.12890911102295, "global_step": 71393, "epoch": 424} {"train_loss": -9.033964157104492, "global_step": 71394, "epoch": 424} {"train_loss": -8.884580612182617, "global_step": 71395, "epoch": 424} {"train_loss": -9.243870735168457, "global_step": 71396, "epoch": 424} {"train_loss": -9.072702407836914, "global_step": 71397, "epoch": 424} {"train_loss": -9.1754789352417, "global_step": 71398, "epoch": 424} {"train_loss": -8.943768654550825, "global_step": 71399, "epoch": 424, "val_loss": 193723.53125} {"train_loss": -8.876182556152344, "global_step": 71400, "epoch": 425} {"train_loss": -9.163223266601562, "global_step": 71401, "epoch": 425} {"train_loss": -9.053970336914062, "global_step": 71402, "epoch": 425} {"train_loss": -9.048076629638672, "global_step": 71403, "epoch": 425} {"train_loss": -9.046799659729004, "global_step": 71404, "epoch": 425} {"train_loss": -9.08262825012207, "global_step": 71405, "epoch": 425} {"train_loss": -8.96430778503418, "global_step": 71406, "epoch": 425} {"train_loss": -9.206955909729004, "global_step": 71407, "epoch": 425} {"train_loss": -8.984867095947266, "global_step": 71408, "epoch": 425} {"train_loss": -9.048047065734863, "global_step": 71409, "epoch": 425} {"train_loss": -9.094558715820312, "global_step": 71410, "epoch": 425} {"train_loss": -8.91305923461914, "global_step": 71411, "epoch": 425} {"train_loss": -9.072738647460938, "global_step": 71412, "epoch": 425} {"train_loss": -9.097877502441406, "global_step": 71413, "epoch": 425} {"train_loss": -9.386354446411133, "global_step": 71414, "epoch": 425} {"train_loss": -9.044036865234375, "global_step": 71415, "epoch": 425} {"train_loss": -8.597665786743164, "global_step": 71416, "epoch": 425} {"train_loss": -9.068380355834961, "global_step": 71417, "epoch": 425} {"train_loss": -9.205143928527832, "global_step": 71418, "epoch": 425} {"train_loss": -8.962318420410156, "global_step": 71419, "epoch": 425} {"train_loss": -8.70413875579834, "global_step": 71420, "epoch": 425} {"train_loss": -9.186620712280273, "global_step": 71421, "epoch": 425} {"train_loss": -8.777725219726562, "global_step": 71422, "epoch": 425} {"train_loss": -8.561073303222656, "global_step": 71423, "epoch": 425} {"train_loss": -8.888429641723633, "global_step": 71424, "epoch": 425} {"train_loss": -8.587783813476562, "global_step": 71425, "epoch": 425} {"train_loss": -8.97671127319336, "global_step": 71426, "epoch": 425} {"train_loss": -8.782041549682617, "global_step": 71427, "epoch": 425} {"train_loss": -8.927847862243652, "global_step": 71428, "epoch": 425} {"train_loss": -8.798212051391602, "global_step": 71429, "epoch": 425} {"train_loss": -8.787520408630371, "global_step": 71430, "epoch": 425} {"train_loss": -8.879744529724121, "global_step": 71431, "epoch": 425} {"train_loss": -8.896076202392578, "global_step": 71432, "epoch": 425} {"train_loss": -8.786312103271484, "global_step": 71433, "epoch": 425} {"train_loss": -8.80429458618164, "global_step": 71434, "epoch": 425} {"train_loss": -8.641080856323242, "global_step": 71435, "epoch": 425} {"train_loss": -8.797667503356934, "global_step": 71436, "epoch": 425} {"train_loss": -9.019742965698242, "global_step": 71437, "epoch": 425} {"train_loss": -8.915077209472656, "global_step": 71438, "epoch": 425} {"train_loss": -9.022383689880371, "global_step": 71439, "epoch": 425} {"train_loss": -8.98696517944336, "global_step": 71440, "epoch": 425} {"train_loss": -8.938024520874023, "global_step": 71441, "epoch": 425} {"train_loss": -9.088123321533203, "global_step": 71442, "epoch": 425} {"train_loss": -8.841062545776367, "global_step": 71443, "epoch": 425} {"train_loss": -9.001693725585938, "global_step": 71444, "epoch": 425} {"train_loss": -8.995621681213379, "global_step": 71445, "epoch": 425} {"train_loss": -9.069791793823242, "global_step": 71446, "epoch": 425} {"train_loss": -8.99180793762207, "global_step": 71447, "epoch": 425} {"train_loss": -8.980770111083984, "global_step": 71448, "epoch": 425} {"train_loss": -9.140987396240234, "global_step": 71449, "epoch": 425} {"train_loss": -8.924722671508789, "global_step": 71450, "epoch": 425} {"train_loss": -9.202856063842773, "global_step": 71451, "epoch": 425} {"train_loss": -8.985994338989258, "global_step": 71452, "epoch": 425} {"train_loss": -9.203605651855469, "global_step": 71453, "epoch": 425} {"train_loss": -9.411436080932617, "global_step": 71454, "epoch": 425} {"train_loss": -9.08265495300293, "global_step": 71455, "epoch": 425} {"train_loss": -9.492630958557129, "global_step": 71456, "epoch": 425} {"train_loss": -9.037266731262207, "global_step": 71457, "epoch": 425} {"train_loss": -9.219658851623535, "global_step": 71458, "epoch": 425} {"train_loss": -9.026537895202637, "global_step": 71459, "epoch": 425} {"train_loss": -9.14743423461914, "global_step": 71460, "epoch": 425} {"train_loss": -9.171916961669922, "global_step": 71461, "epoch": 425} {"train_loss": -9.300317764282227, "global_step": 71462, "epoch": 425} {"train_loss": -9.052797317504883, "global_step": 71463, "epoch": 425} {"train_loss": -9.269370079040527, "global_step": 71464, "epoch": 425} {"train_loss": -9.121733665466309, "global_step": 71465, "epoch": 425} {"train_loss": -9.144546508789062, "global_step": 71466, "epoch": 425} {"train_loss": -9.361207962036133, "global_step": 71467, "epoch": 425} {"train_loss": -9.15493106842041, "global_step": 71468, "epoch": 425} {"train_loss": -9.082902908325195, "global_step": 71469, "epoch": 425} {"train_loss": -9.200977325439453, "global_step": 71470, "epoch": 425} {"train_loss": -9.259407043457031, "global_step": 71471, "epoch": 425} {"train_loss": -8.995174407958984, "global_step": 71472, "epoch": 425} {"train_loss": -8.471567153930664, "global_step": 71473, "epoch": 425} {"train_loss": -9.062942504882812, "global_step": 71474, "epoch": 425} {"train_loss": -7.877198219299316, "global_step": 71475, "epoch": 425} {"train_loss": -8.429858207702637, "global_step": 71476, "epoch": 425} {"train_loss": -8.764812469482422, "global_step": 71477, "epoch": 425} {"train_loss": -8.716879844665527, "global_step": 71478, "epoch": 425} {"train_loss": -8.611675262451172, "global_step": 71479, "epoch": 425} {"train_loss": -8.804949760437012, "global_step": 71480, "epoch": 425} {"train_loss": -8.550477981567383, "global_step": 71481, "epoch": 425} {"train_loss": -8.831357955932617, "global_step": 71482, "epoch": 425} {"train_loss": -8.444506645202637, "global_step": 71483, "epoch": 425} {"train_loss": -8.690840721130371, "global_step": 71484, "epoch": 425} {"train_loss": -8.757028579711914, "global_step": 71485, "epoch": 425} {"train_loss": -8.589242935180664, "global_step": 71486, "epoch": 425} {"train_loss": -8.817096710205078, "global_step": 71487, "epoch": 425} {"train_loss": -8.800518035888672, "global_step": 71488, "epoch": 425} {"train_loss": -8.631158828735352, "global_step": 71489, "epoch": 425} {"train_loss": -8.72743034362793, "global_step": 71490, "epoch": 425} {"train_loss": -8.888174057006836, "global_step": 71491, "epoch": 425} {"train_loss": -8.827938079833984, "global_step": 71492, "epoch": 425} {"train_loss": -8.754560470581055, "global_step": 71493, "epoch": 425} {"train_loss": -8.820892333984375, "global_step": 71494, "epoch": 425} {"train_loss": -8.855648040771484, "global_step": 71495, "epoch": 425} {"train_loss": -8.878175735473633, "global_step": 71496, "epoch": 425} {"train_loss": -8.962181091308594, "global_step": 71497, "epoch": 425} {"train_loss": -8.906844139099121, "global_step": 71498, "epoch": 425} {"train_loss": -8.766745567321777, "global_step": 71499, "epoch": 425} {"train_loss": -8.75711441040039, "global_step": 71500, "epoch": 425} {"train_loss": -8.83446979522705, "global_step": 71501, "epoch": 425} {"train_loss": -8.84425163269043, "global_step": 71502, "epoch": 425} {"train_loss": -8.939486503601074, "global_step": 71503, "epoch": 425} {"train_loss": -9.027496337890625, "global_step": 71504, "epoch": 425} {"train_loss": -8.697660446166992, "global_step": 71505, "epoch": 425} {"train_loss": -8.996784210205078, "global_step": 71506, "epoch": 425} {"train_loss": -8.836128234863281, "global_step": 71507, "epoch": 425} {"train_loss": -8.960440635681152, "global_step": 71508, "epoch": 425} {"train_loss": -8.866729736328125, "global_step": 71509, "epoch": 425} {"train_loss": -8.94900894165039, "global_step": 71510, "epoch": 425} {"train_loss": -9.095860481262207, "global_step": 71511, "epoch": 425} {"train_loss": -8.951827049255371, "global_step": 71512, "epoch": 425} {"train_loss": -8.957681655883789, "global_step": 71513, "epoch": 425} {"train_loss": -9.316471099853516, "global_step": 71514, "epoch": 425} {"train_loss": -8.87099838256836, "global_step": 71515, "epoch": 425} {"train_loss": -8.958944320678711, "global_step": 71516, "epoch": 425} {"train_loss": -8.901272773742676, "global_step": 71517, "epoch": 425} {"train_loss": -8.857112884521484, "global_step": 71518, "epoch": 425} {"train_loss": -8.937125205993652, "global_step": 71519, "epoch": 425} {"train_loss": -8.918689727783203, "global_step": 71520, "epoch": 425} {"train_loss": -8.640498161315918, "global_step": 71521, "epoch": 425} {"train_loss": -8.984853744506836, "global_step": 71522, "epoch": 425} {"train_loss": -8.915013313293457, "global_step": 71523, "epoch": 425} {"train_loss": -8.93134593963623, "global_step": 71524, "epoch": 425} {"train_loss": -8.893098831176758, "global_step": 71525, "epoch": 425} {"train_loss": -9.136878967285156, "global_step": 71526, "epoch": 425} {"train_loss": -8.746594429016113, "global_step": 71527, "epoch": 425} {"train_loss": -9.058223724365234, "global_step": 71528, "epoch": 425} {"train_loss": -9.039752960205078, "global_step": 71529, "epoch": 425} {"train_loss": -8.895742416381836, "global_step": 71530, "epoch": 425} {"train_loss": -8.944745063781738, "global_step": 71531, "epoch": 425} {"train_loss": -8.716175079345703, "global_step": 71532, "epoch": 425} {"train_loss": -9.160480499267578, "global_step": 71533, "epoch": 425} {"train_loss": -8.969379425048828, "global_step": 71534, "epoch": 425} {"train_loss": -9.18900203704834, "global_step": 71535, "epoch": 425} {"train_loss": -8.866374969482422, "global_step": 71536, "epoch": 425} {"train_loss": -9.20083999633789, "global_step": 71537, "epoch": 425} {"train_loss": -9.07546329498291, "global_step": 71538, "epoch": 425} {"train_loss": -8.920393943786621, "global_step": 71539, "epoch": 425} {"train_loss": -9.149852752685547, "global_step": 71540, "epoch": 425} {"train_loss": -9.081682205200195, "global_step": 71541, "epoch": 425} {"train_loss": -9.184370994567871, "global_step": 71542, "epoch": 425} {"train_loss": -8.782035827636719, "global_step": 71543, "epoch": 425} {"train_loss": -9.209966659545898, "global_step": 71544, "epoch": 425} {"train_loss": -8.755192756652832, "global_step": 71545, "epoch": 425} {"train_loss": -9.08095932006836, "global_step": 71546, "epoch": 425} {"train_loss": -9.19302749633789, "global_step": 71547, "epoch": 425} {"train_loss": -9.056846618652344, "global_step": 71548, "epoch": 425} {"train_loss": -9.066534042358398, "global_step": 71549, "epoch": 425} {"train_loss": -8.827579498291016, "global_step": 71550, "epoch": 425} {"train_loss": -8.782844543457031, "global_step": 71551, "epoch": 425} {"train_loss": -8.84490966796875, "global_step": 71552, "epoch": 425} {"train_loss": -8.998331069946289, "global_step": 71553, "epoch": 425} {"train_loss": -8.948229789733887, "global_step": 71554, "epoch": 425} {"train_loss": -9.024251937866211, "global_step": 71555, "epoch": 425} {"train_loss": -8.899096488952637, "global_step": 71556, "epoch": 425} {"train_loss": -9.056876182556152, "global_step": 71557, "epoch": 425} {"train_loss": -9.003562927246094, "global_step": 71558, "epoch": 425} {"train_loss": -8.683609008789062, "global_step": 71559, "epoch": 425} {"train_loss": -9.079171180725098, "global_step": 71560, "epoch": 425} {"train_loss": -8.66768741607666, "global_step": 71561, "epoch": 425} {"train_loss": -8.909652709960938, "global_step": 71562, "epoch": 425} {"train_loss": -8.766481399536133, "global_step": 71563, "epoch": 425} {"train_loss": -8.841745376586914, "global_step": 71564, "epoch": 425} {"train_loss": -8.53702163696289, "global_step": 71565, "epoch": 425} {"train_loss": -8.751094818115234, "global_step": 71566, "epoch": 425} {"train_loss": -8.939600734483628, "global_step": 71567, "epoch": 425, "val_loss": 192479.984375, "train_action_mse_error": 8.127154350280762} {"train_loss": -8.822649002075195, "global_step": 71568, "epoch": 426} {"train_loss": -8.679350852966309, "global_step": 71569, "epoch": 426} {"train_loss": -8.880330085754395, "global_step": 71570, "epoch": 426} {"train_loss": -8.711384773254395, "global_step": 71571, "epoch": 426} {"train_loss": -8.882698059082031, "global_step": 71572, "epoch": 426} {"train_loss": -8.780290603637695, "global_step": 71573, "epoch": 426} {"train_loss": -8.916682243347168, "global_step": 71574, "epoch": 426} {"train_loss": -8.712922096252441, "global_step": 71575, "epoch": 426} {"train_loss": -8.753067970275879, "global_step": 71576, "epoch": 426} {"train_loss": -8.822562217712402, "global_step": 71577, "epoch": 426} {"train_loss": -8.561761856079102, "global_step": 71578, "epoch": 426} {"train_loss": -9.07825756072998, "global_step": 71579, "epoch": 426} {"train_loss": -8.851344108581543, "global_step": 71580, "epoch": 426} {"train_loss": -8.685699462890625, "global_step": 71581, "epoch": 426} {"train_loss": -9.00384521484375, "global_step": 71582, "epoch": 426} {"train_loss": -8.768798828125, "global_step": 71583, "epoch": 426} {"train_loss": -8.981074333190918, "global_step": 71584, "epoch": 426} {"train_loss": -8.90018081665039, "global_step": 71585, "epoch": 426} {"train_loss": -8.91036605834961, "global_step": 71586, "epoch": 426} {"train_loss": -9.029488563537598, "global_step": 71587, "epoch": 426} {"train_loss": -8.819385528564453, "global_step": 71588, "epoch": 426} {"train_loss": -8.7938232421875, "global_step": 71589, "epoch": 426} {"train_loss": -8.91568374633789, "global_step": 71590, "epoch": 426} {"train_loss": -8.879495620727539, "global_step": 71591, "epoch": 426} {"train_loss": -8.86299991607666, "global_step": 71592, "epoch": 426} {"train_loss": -9.177359580993652, "global_step": 71593, "epoch": 426} {"train_loss": -8.712616920471191, "global_step": 71594, "epoch": 426} {"train_loss": -9.04096794128418, "global_step": 71595, "epoch": 426} {"train_loss": -8.994437217712402, "global_step": 71596, "epoch": 426} {"train_loss": -9.017190933227539, "global_step": 71597, "epoch": 426} {"train_loss": -8.879255294799805, "global_step": 71598, "epoch": 426} {"train_loss": -8.542801856994629, "global_step": 71599, "epoch": 426} {"train_loss": -8.999504089355469, "global_step": 71600, "epoch": 426} {"train_loss": -8.722408294677734, "global_step": 71601, "epoch": 426} {"train_loss": -9.06755256652832, "global_step": 71602, "epoch": 426} {"train_loss": -9.035483360290527, "global_step": 71603, "epoch": 426} {"train_loss": -8.827542304992676, "global_step": 71604, "epoch": 426} {"train_loss": -8.687599182128906, "global_step": 71605, "epoch": 426} {"train_loss": -8.882696151733398, "global_step": 71606, "epoch": 426} {"train_loss": -8.918312072753906, "global_step": 71607, "epoch": 426} {"train_loss": -8.919225692749023, "global_step": 71608, "epoch": 426} {"train_loss": -8.990028381347656, "global_step": 71609, "epoch": 426} {"train_loss": -8.910530090332031, "global_step": 71610, "epoch": 426} {"train_loss": -9.01485538482666, "global_step": 71611, "epoch": 426} {"train_loss": -8.751277923583984, "global_step": 71612, "epoch": 426} {"train_loss": -9.092557907104492, "global_step": 71613, "epoch": 426} {"train_loss": -8.756875991821289, "global_step": 71614, "epoch": 426} {"train_loss": -9.07225227355957, "global_step": 71615, "epoch": 426} {"train_loss": -8.93280029296875, "global_step": 71616, "epoch": 426} {"train_loss": -9.021064758300781, "global_step": 71617, "epoch": 426} {"train_loss": -9.013477325439453, "global_step": 71618, "epoch": 426} {"train_loss": -8.962126731872559, "global_step": 71619, "epoch": 426} {"train_loss": -8.98914909362793, "global_step": 71620, "epoch": 426} {"train_loss": -9.04676628112793, "global_step": 71621, "epoch": 426} {"train_loss": -9.189071655273438, "global_step": 71622, "epoch": 426} {"train_loss": -8.914403915405273, "global_step": 71623, "epoch": 426} {"train_loss": -9.021848678588867, "global_step": 71624, "epoch": 426} {"train_loss": -9.097511291503906, "global_step": 71625, "epoch": 426} {"train_loss": -8.97635269165039, "global_step": 71626, "epoch": 426} {"train_loss": -9.072182655334473, "global_step": 71627, "epoch": 426} {"train_loss": -9.028528213500977, "global_step": 71628, "epoch": 426} {"train_loss": -9.302409172058105, "global_step": 71629, "epoch": 426} {"train_loss": -9.093777656555176, "global_step": 71630, "epoch": 426} {"train_loss": -9.134252548217773, "global_step": 71631, "epoch": 426} {"train_loss": -8.888005256652832, "global_step": 71632, "epoch": 426} {"train_loss": -9.143321990966797, "global_step": 71633, "epoch": 426} {"train_loss": -9.023681640625, "global_step": 71634, "epoch": 426} {"train_loss": -8.890993118286133, "global_step": 71635, "epoch": 426} {"train_loss": -8.982062339782715, "global_step": 71636, "epoch": 426} {"train_loss": -9.127654075622559, "global_step": 71637, "epoch": 426} {"train_loss": -9.267101287841797, "global_step": 71638, "epoch": 426} {"train_loss": -9.3433837890625, "global_step": 71639, "epoch": 426} {"train_loss": -9.06578254699707, "global_step": 71640, "epoch": 426} {"train_loss": -9.257678985595703, "global_step": 71641, "epoch": 426} {"train_loss": -9.0380220413208, "global_step": 71642, "epoch": 426} {"train_loss": -8.903538703918457, "global_step": 71643, "epoch": 426} {"train_loss": -8.824678421020508, "global_step": 71644, "epoch": 426} {"train_loss": -8.903697967529297, "global_step": 71645, "epoch": 426} {"train_loss": -9.146005630493164, "global_step": 71646, "epoch": 426} {"train_loss": -9.055559158325195, "global_step": 71647, "epoch": 426} {"train_loss": -8.912580490112305, "global_step": 71648, "epoch": 426} {"train_loss": -8.869718551635742, "global_step": 71649, "epoch": 426} {"train_loss": -8.886541366577148, "global_step": 71650, "epoch": 426} {"train_loss": -8.591720581054688, "global_step": 71651, "epoch": 426} {"train_loss": -8.802322387695312, "global_step": 71652, "epoch": 426} {"train_loss": -8.817132949829102, "global_step": 71653, "epoch": 426} {"train_loss": -8.900230407714844, "global_step": 71654, "epoch": 426} {"train_loss": -8.94880485534668, "global_step": 71655, "epoch": 426} {"train_loss": -9.012908935546875, "global_step": 71656, "epoch": 426} {"train_loss": -8.845236778259277, "global_step": 71657, "epoch": 426} {"train_loss": -9.060592651367188, "global_step": 71658, "epoch": 426} {"train_loss": -8.734546661376953, "global_step": 71659, "epoch": 426} {"train_loss": -8.910892486572266, "global_step": 71660, "epoch": 426} {"train_loss": -9.037353515625, "global_step": 71661, "epoch": 426} {"train_loss": -8.868712425231934, "global_step": 71662, "epoch": 426} {"train_loss": -8.937348365783691, "global_step": 71663, "epoch": 426} {"train_loss": -9.080132484436035, "global_step": 71664, "epoch": 426} {"train_loss": -8.919074058532715, "global_step": 71665, "epoch": 426} {"train_loss": -8.978914260864258, "global_step": 71666, "epoch": 426} {"train_loss": -8.831525802612305, "global_step": 71667, "epoch": 426} {"train_loss": -8.847419738769531, "global_step": 71668, "epoch": 426} {"train_loss": -8.976991653442383, "global_step": 71669, "epoch": 426} {"train_loss": -8.78961181640625, "global_step": 71670, "epoch": 426} {"train_loss": -9.109662055969238, "global_step": 71671, "epoch": 426} {"train_loss": -8.916763305664062, "global_step": 71672, "epoch": 426} {"train_loss": -9.005380630493164, "global_step": 71673, "epoch": 426} {"train_loss": -8.860776901245117, "global_step": 71674, "epoch": 426} {"train_loss": -9.169317245483398, "global_step": 71675, "epoch": 426} {"train_loss": -8.631210327148438, "global_step": 71676, "epoch": 426} {"train_loss": -8.98716926574707, "global_step": 71677, "epoch": 426} {"train_loss": -8.80524730682373, "global_step": 71678, "epoch": 426} {"train_loss": -9.061197280883789, "global_step": 71679, "epoch": 426} {"train_loss": -8.930194854736328, "global_step": 71680, "epoch": 426} {"train_loss": -8.915578842163086, "global_step": 71681, "epoch": 426} {"train_loss": -9.04919719696045, "global_step": 71682, "epoch": 426} {"train_loss": -8.618035316467285, "global_step": 71683, "epoch": 426} {"train_loss": -8.850042343139648, "global_step": 71684, "epoch": 426} {"train_loss": -8.82645320892334, "global_step": 71685, "epoch": 426} {"train_loss": -8.610405921936035, "global_step": 71686, "epoch": 426} {"train_loss": -8.86796760559082, "global_step": 71687, "epoch": 426} {"train_loss": -8.971595764160156, "global_step": 71688, "epoch": 426} {"train_loss": -8.957364082336426, "global_step": 71689, "epoch": 426} {"train_loss": -8.6343994140625, "global_step": 71690, "epoch": 426} {"train_loss": -8.948613166809082, "global_step": 71691, "epoch": 426} {"train_loss": -9.074710845947266, "global_step": 71692, "epoch": 426} {"train_loss": -8.740427017211914, "global_step": 71693, "epoch": 426} {"train_loss": -8.814298629760742, "global_step": 71694, "epoch": 426} {"train_loss": -9.120319366455078, "global_step": 71695, "epoch": 426} {"train_loss": -8.774726867675781, "global_step": 71696, "epoch": 426} {"train_loss": -8.87412166595459, "global_step": 71697, "epoch": 426} {"train_loss": -8.994598388671875, "global_step": 71698, "epoch": 426} {"train_loss": -8.997400283813477, "global_step": 71699, "epoch": 426} {"train_loss": -9.03140640258789, "global_step": 71700, "epoch": 426} {"train_loss": -8.805991172790527, "global_step": 71701, "epoch": 426} {"train_loss": -9.040613174438477, "global_step": 71702, "epoch": 426} {"train_loss": -8.816364288330078, "global_step": 71703, "epoch": 426} {"train_loss": -8.87540054321289, "global_step": 71704, "epoch": 426} {"train_loss": -8.800046920776367, "global_step": 71705, "epoch": 426} {"train_loss": -8.835086822509766, "global_step": 71706, "epoch": 426} {"train_loss": -8.888197898864746, "global_step": 71707, "epoch": 426} {"train_loss": -8.813090324401855, "global_step": 71708, "epoch": 426} {"train_loss": -8.968307495117188, "global_step": 71709, "epoch": 426} {"train_loss": -8.784745216369629, "global_step": 71710, "epoch": 426} {"train_loss": -8.868279457092285, "global_step": 71711, "epoch": 426} {"train_loss": -9.043947219848633, "global_step": 71712, "epoch": 426} {"train_loss": -8.835173606872559, "global_step": 71713, "epoch": 426} {"train_loss": -8.880071640014648, "global_step": 71714, "epoch": 426} {"train_loss": -9.029733657836914, "global_step": 71715, "epoch": 426} {"train_loss": -9.05163288116455, "global_step": 71716, "epoch": 426} {"train_loss": -9.1510009765625, "global_step": 71717, "epoch": 426} {"train_loss": -8.763771057128906, "global_step": 71718, "epoch": 426} {"train_loss": -8.922616004943848, "global_step": 71719, "epoch": 426} {"train_loss": -9.155227661132812, "global_step": 71720, "epoch": 426} {"train_loss": -9.230636596679688, "global_step": 71721, "epoch": 426} {"train_loss": -9.222185134887695, "global_step": 71722, "epoch": 426} {"train_loss": -9.18170166015625, "global_step": 71723, "epoch": 426} {"train_loss": -9.031959533691406, "global_step": 71724, "epoch": 426} {"train_loss": -8.985389709472656, "global_step": 71725, "epoch": 426} {"train_loss": -9.177251815795898, "global_step": 71726, "epoch": 426} {"train_loss": -9.14291000366211, "global_step": 71727, "epoch": 426} {"train_loss": -9.101329803466797, "global_step": 71728, "epoch": 426} {"train_loss": -9.101802825927734, "global_step": 71729, "epoch": 426} {"train_loss": -9.039992332458496, "global_step": 71730, "epoch": 426} {"train_loss": -9.240434646606445, "global_step": 71731, "epoch": 426} {"train_loss": -9.200695037841797, "global_step": 71732, "epoch": 426} {"train_loss": -9.004148483276367, "global_step": 71733, "epoch": 426} {"train_loss": -9.32458782196045, "global_step": 71734, "epoch": 426} {"train_loss": -8.945988825389318, "global_step": 71735, "epoch": 426, "val_loss": 194853.875} {"train_loss": -9.041485786437988, "global_step": 71736, "epoch": 427} {"train_loss": -9.260671615600586, "global_step": 71737, "epoch": 427} {"train_loss": -9.11018180847168, "global_step": 71738, "epoch": 427} {"train_loss": -9.222982406616211, "global_step": 71739, "epoch": 427} {"train_loss": -9.234673500061035, "global_step": 71740, "epoch": 427} {"train_loss": -9.104155540466309, "global_step": 71741, "epoch": 427} {"train_loss": -9.235217094421387, "global_step": 71742, "epoch": 427} {"train_loss": -9.303306579589844, "global_step": 71743, "epoch": 427} {"train_loss": -9.058502197265625, "global_step": 71744, "epoch": 427} {"train_loss": -9.348917007446289, "global_step": 71745, "epoch": 427} {"train_loss": -9.49312973022461, "global_step": 71746, "epoch": 427} {"train_loss": -9.267646789550781, "global_step": 71747, "epoch": 427} {"train_loss": -8.93152141571045, "global_step": 71748, "epoch": 427} {"train_loss": -8.865321159362793, "global_step": 71749, "epoch": 427} {"train_loss": -8.9934663772583, "global_step": 71750, "epoch": 427} {"train_loss": -8.91877555847168, "global_step": 71751, "epoch": 427} {"train_loss": -8.893733978271484, "global_step": 71752, "epoch": 427} {"train_loss": -9.118738174438477, "global_step": 71753, "epoch": 427} {"train_loss": -8.968500137329102, "global_step": 71754, "epoch": 427} {"train_loss": -9.09539794921875, "global_step": 71755, "epoch": 427} {"train_loss": -9.036886215209961, "global_step": 71756, "epoch": 427} {"train_loss": -9.010116577148438, "global_step": 71757, "epoch": 427} {"train_loss": -8.752628326416016, "global_step": 71758, "epoch": 427} {"train_loss": -8.89067268371582, "global_step": 71759, "epoch": 427} {"train_loss": -8.50983715057373, "global_step": 71760, "epoch": 427} {"train_loss": -8.620109558105469, "global_step": 71761, "epoch": 427} {"train_loss": -8.755203247070312, "global_step": 71762, "epoch": 427} {"train_loss": -8.856929779052734, "global_step": 71763, "epoch": 427} {"train_loss": -8.953187942504883, "global_step": 71764, "epoch": 427} {"train_loss": -8.805061340332031, "global_step": 71765, "epoch": 427} {"train_loss": -8.83901309967041, "global_step": 71766, "epoch": 427} {"train_loss": -8.967554092407227, "global_step": 71767, "epoch": 427} {"train_loss": -8.852968215942383, "global_step": 71768, "epoch": 427} {"train_loss": -8.734867095947266, "global_step": 71769, "epoch": 427} {"train_loss": -8.745847702026367, "global_step": 71770, "epoch": 427} {"train_loss": -8.682080268859863, "global_step": 71771, "epoch": 427} {"train_loss": -9.176983833312988, "global_step": 71772, "epoch": 427} {"train_loss": -8.521926879882812, "global_step": 71773, "epoch": 427} {"train_loss": -9.064205169677734, "global_step": 71774, "epoch": 427} {"train_loss": -8.84675407409668, "global_step": 71775, "epoch": 427} {"train_loss": -8.727530479431152, "global_step": 71776, "epoch": 427} {"train_loss": -8.678627967834473, "global_step": 71777, "epoch": 427} {"train_loss": -9.046649932861328, "global_step": 71778, "epoch": 427} {"train_loss": -8.662702560424805, "global_step": 71779, "epoch": 427} {"train_loss": -8.876551628112793, "global_step": 71780, "epoch": 427} {"train_loss": -9.104568481445312, "global_step": 71781, "epoch": 427} {"train_loss": -8.799821853637695, "global_step": 71782, "epoch": 427} {"train_loss": -8.833598136901855, "global_step": 71783, "epoch": 427} {"train_loss": -8.794132232666016, "global_step": 71784, "epoch": 427} {"train_loss": -9.065632820129395, "global_step": 71785, "epoch": 427} {"train_loss": -8.887428283691406, "global_step": 71786, "epoch": 427} {"train_loss": -9.029834747314453, "global_step": 71787, "epoch": 427} {"train_loss": -9.273710250854492, "global_step": 71788, "epoch": 427} {"train_loss": -8.964214324951172, "global_step": 71789, "epoch": 427} {"train_loss": -9.084066390991211, "global_step": 71790, "epoch": 427} {"train_loss": -9.317358016967773, "global_step": 71791, "epoch": 427} {"train_loss": -9.185638427734375, "global_step": 71792, "epoch": 427} {"train_loss": -9.174915313720703, "global_step": 71793, "epoch": 427} {"train_loss": -9.104914665222168, "global_step": 71794, "epoch": 427} {"train_loss": -8.978900909423828, "global_step": 71795, "epoch": 427} {"train_loss": -9.20582389831543, "global_step": 71796, "epoch": 427} {"train_loss": -9.146682739257812, "global_step": 71797, "epoch": 427} {"train_loss": -9.176259994506836, "global_step": 71798, "epoch": 427} {"train_loss": -9.136810302734375, "global_step": 71799, "epoch": 427} {"train_loss": -9.103259086608887, "global_step": 71800, "epoch": 427} {"train_loss": -8.923070907592773, "global_step": 71801, "epoch": 427} {"train_loss": -9.16962718963623, "global_step": 71802, "epoch": 427} {"train_loss": -9.212850570678711, "global_step": 71803, "epoch": 427} {"train_loss": -9.137507438659668, "global_step": 71804, "epoch": 427} {"train_loss": -8.92216968536377, "global_step": 71805, "epoch": 427} {"train_loss": -9.219350814819336, "global_step": 71806, "epoch": 427} {"train_loss": -9.134679794311523, "global_step": 71807, "epoch": 427} {"train_loss": -9.063556671142578, "global_step": 71808, "epoch": 427} {"train_loss": -9.316692352294922, "global_step": 71809, "epoch": 427} {"train_loss": -9.033903121948242, "global_step": 71810, "epoch": 427} {"train_loss": -8.840409278869629, "global_step": 71811, "epoch": 427} {"train_loss": -9.049187660217285, "global_step": 71812, "epoch": 427} {"train_loss": -8.789180755615234, "global_step": 71813, "epoch": 427} {"train_loss": -9.235780715942383, "global_step": 71814, "epoch": 427} {"train_loss": -8.900869369506836, "global_step": 71815, "epoch": 427} {"train_loss": -8.672748565673828, "global_step": 71816, "epoch": 427} {"train_loss": -9.151822090148926, "global_step": 71817, "epoch": 427} {"train_loss": -8.84953498840332, "global_step": 71818, "epoch": 427} {"train_loss": -9.015477180480957, "global_step": 71819, "epoch": 427} {"train_loss": -8.91517448425293, "global_step": 71820, "epoch": 427} {"train_loss": -8.986183166503906, "global_step": 71821, "epoch": 427} {"train_loss": -9.01935863494873, "global_step": 71822, "epoch": 427} {"train_loss": -8.819295883178711, "global_step": 71823, "epoch": 427} {"train_loss": -9.21876049041748, "global_step": 71824, "epoch": 427} {"train_loss": -8.833352088928223, "global_step": 71825, "epoch": 427} {"train_loss": -8.843189239501953, "global_step": 71826, "epoch": 427} {"train_loss": -9.21487808227539, "global_step": 71827, "epoch": 427} {"train_loss": -8.822513580322266, "global_step": 71828, "epoch": 427} {"train_loss": -9.09821891784668, "global_step": 71829, "epoch": 427} {"train_loss": -8.887590408325195, "global_step": 71830, "epoch": 427} {"train_loss": -9.062936782836914, "global_step": 71831, "epoch": 427} {"train_loss": -8.875426292419434, "global_step": 71832, "epoch": 427} {"train_loss": -9.20169448852539, "global_step": 71833, "epoch": 427} {"train_loss": -8.663049697875977, "global_step": 71834, "epoch": 427} {"train_loss": -9.109249114990234, "global_step": 71835, "epoch": 427} {"train_loss": -8.713855743408203, "global_step": 71836, "epoch": 427} {"train_loss": -8.971807479858398, "global_step": 71837, "epoch": 427} {"train_loss": -8.842575073242188, "global_step": 71838, "epoch": 427} {"train_loss": -9.050619125366211, "global_step": 71839, "epoch": 427} {"train_loss": -9.110851287841797, "global_step": 71840, "epoch": 427} {"train_loss": -8.739033699035645, "global_step": 71841, "epoch": 427} {"train_loss": -8.99734115600586, "global_step": 71842, "epoch": 427} {"train_loss": -8.8231201171875, "global_step": 71843, "epoch": 427} {"train_loss": -9.107475280761719, "global_step": 71844, "epoch": 427} {"train_loss": -8.823699951171875, "global_step": 71845, "epoch": 427} {"train_loss": -8.858940124511719, "global_step": 71846, "epoch": 427} {"train_loss": -8.95723819732666, "global_step": 71847, "epoch": 427} {"train_loss": -8.616299629211426, "global_step": 71848, "epoch": 427} {"train_loss": -8.910211563110352, "global_step": 71849, "epoch": 427} {"train_loss": -8.781586647033691, "global_step": 71850, "epoch": 427} {"train_loss": -9.134571075439453, "global_step": 71851, "epoch": 427} {"train_loss": -8.792935371398926, "global_step": 71852, "epoch": 427} {"train_loss": -8.72757339477539, "global_step": 71853, "epoch": 427} {"train_loss": -8.786497116088867, "global_step": 71854, "epoch": 427} {"train_loss": -8.91677474975586, "global_step": 71855, "epoch": 427} {"train_loss": -8.603221893310547, "global_step": 71856, "epoch": 427} {"train_loss": -9.01841926574707, "global_step": 71857, "epoch": 427} {"train_loss": -8.634029388427734, "global_step": 71858, "epoch": 427} {"train_loss": -8.859663009643555, "global_step": 71859, "epoch": 427} {"train_loss": -8.66268539428711, "global_step": 71860, "epoch": 427} {"train_loss": -8.659639358520508, "global_step": 71861, "epoch": 427} {"train_loss": -8.853803634643555, "global_step": 71862, "epoch": 427} {"train_loss": -8.645368576049805, "global_step": 71863, "epoch": 427} {"train_loss": -8.881019592285156, "global_step": 71864, "epoch": 427} {"train_loss": -8.884994506835938, "global_step": 71865, "epoch": 427} {"train_loss": -9.052178382873535, "global_step": 71866, "epoch": 427} {"train_loss": -8.738600730895996, "global_step": 71867, "epoch": 427} {"train_loss": -8.935593605041504, "global_step": 71868, "epoch": 427} {"train_loss": -8.921480178833008, "global_step": 71869, "epoch": 427} {"train_loss": -9.022123336791992, "global_step": 71870, "epoch": 427} {"train_loss": -8.872882843017578, "global_step": 71871, "epoch": 427} {"train_loss": -9.039029121398926, "global_step": 71872, "epoch": 427} {"train_loss": -9.17547607421875, "global_step": 71873, "epoch": 427} {"train_loss": -9.01198959350586, "global_step": 71874, "epoch": 427} {"train_loss": -8.869625091552734, "global_step": 71875, "epoch": 427} {"train_loss": -8.72170639038086, "global_step": 71876, "epoch": 427} {"train_loss": -8.755178451538086, "global_step": 71877, "epoch": 427} {"train_loss": -8.730603218078613, "global_step": 71878, "epoch": 427} {"train_loss": -8.87448501586914, "global_step": 71879, "epoch": 427} {"train_loss": -8.74359130859375, "global_step": 71880, "epoch": 427} {"train_loss": -8.478838920593262, "global_step": 71881, "epoch": 427} {"train_loss": -8.941990852355957, "global_step": 71882, "epoch": 427} {"train_loss": -8.801971435546875, "global_step": 71883, "epoch": 427} {"train_loss": -8.841512680053711, "global_step": 71884, "epoch": 427} {"train_loss": -8.536974906921387, "global_step": 71885, "epoch": 427} {"train_loss": -8.852685928344727, "global_step": 71886, "epoch": 427} {"train_loss": -8.70334243774414, "global_step": 71887, "epoch": 427} {"train_loss": -8.718595504760742, "global_step": 71888, "epoch": 427} {"train_loss": -8.990777969360352, "global_step": 71889, "epoch": 427} {"train_loss": -9.154687881469727, "global_step": 71890, "epoch": 427} {"train_loss": -8.708237648010254, "global_step": 71891, "epoch": 427} {"train_loss": -9.01915168762207, "global_step": 71892, "epoch": 427} {"train_loss": -9.005373001098633, "global_step": 71893, "epoch": 427} {"train_loss": -8.765584945678711, "global_step": 71894, "epoch": 427} {"train_loss": -8.992195129394531, "global_step": 71895, "epoch": 427} {"train_loss": -9.042722702026367, "global_step": 71896, "epoch": 427} {"train_loss": -9.335628509521484, "global_step": 71897, "epoch": 427} {"train_loss": -8.905954360961914, "global_step": 71898, "epoch": 427} {"train_loss": -9.060564994812012, "global_step": 71899, "epoch": 427} {"train_loss": -9.169106483459473, "global_step": 71900, "epoch": 427} {"train_loss": -9.2555513381958, "global_step": 71901, "epoch": 427} {"train_loss": -9.072311401367188, "global_step": 71902, "epoch": 427} {"train_loss": -8.953297637757801, "global_step": 71903, "epoch": 427, "val_loss": 193303.8125} {"train_loss": -9.18779182434082, "global_step": 71904, "epoch": 428} {"train_loss": -8.964117050170898, "global_step": 71905, "epoch": 428} {"train_loss": -9.139631271362305, "global_step": 71906, "epoch": 428} {"train_loss": -9.012186050415039, "global_step": 71907, "epoch": 428} {"train_loss": -8.777830123901367, "global_step": 71908, "epoch": 428} {"train_loss": -9.093137741088867, "global_step": 71909, "epoch": 428} {"train_loss": -8.954301834106445, "global_step": 71910, "epoch": 428} {"train_loss": -9.196460723876953, "global_step": 71911, "epoch": 428} {"train_loss": -8.961739540100098, "global_step": 71912, "epoch": 428} {"train_loss": -9.140838623046875, "global_step": 71913, "epoch": 428} {"train_loss": -8.833525657653809, "global_step": 71914, "epoch": 428} {"train_loss": -9.028778076171875, "global_step": 71915, "epoch": 428} {"train_loss": -8.968033790588379, "global_step": 71916, "epoch": 428} {"train_loss": -8.68017578125, "global_step": 71917, "epoch": 428} {"train_loss": -8.80164909362793, "global_step": 71918, "epoch": 428} {"train_loss": -8.69521713256836, "global_step": 71919, "epoch": 428} {"train_loss": -8.84100341796875, "global_step": 71920, "epoch": 428} {"train_loss": -8.967910766601562, "global_step": 71921, "epoch": 428} {"train_loss": -8.778898239135742, "global_step": 71922, "epoch": 428} {"train_loss": -8.759618759155273, "global_step": 71923, "epoch": 428} {"train_loss": -8.567018508911133, "global_step": 71924, "epoch": 428} {"train_loss": -9.09034252166748, "global_step": 71925, "epoch": 428} {"train_loss": -8.791902542114258, "global_step": 71926, "epoch": 428} {"train_loss": -9.01905345916748, "global_step": 71927, "epoch": 428} {"train_loss": -8.805583953857422, "global_step": 71928, "epoch": 428} {"train_loss": -8.8775053024292, "global_step": 71929, "epoch": 428} {"train_loss": -8.727148056030273, "global_step": 71930, "epoch": 428} {"train_loss": -8.912111282348633, "global_step": 71931, "epoch": 428} {"train_loss": -8.989376068115234, "global_step": 71932, "epoch": 428} {"train_loss": -9.128376007080078, "global_step": 71933, "epoch": 428} {"train_loss": -8.757608413696289, "global_step": 71934, "epoch": 428} {"train_loss": -8.992134094238281, "global_step": 71935, "epoch": 428} {"train_loss": -8.952302932739258, "global_step": 71936, "epoch": 428} {"train_loss": -9.089744567871094, "global_step": 71937, "epoch": 428} {"train_loss": -8.837556838989258, "global_step": 71938, "epoch": 428} {"train_loss": -9.019445419311523, "global_step": 71939, "epoch": 428} {"train_loss": -8.836368560791016, "global_step": 71940, "epoch": 428} {"train_loss": -9.232987403869629, "global_step": 71941, "epoch": 428} {"train_loss": -8.857885360717773, "global_step": 71942, "epoch": 428} {"train_loss": -8.80803394317627, "global_step": 71943, "epoch": 428} {"train_loss": -9.017560958862305, "global_step": 71944, "epoch": 428} {"train_loss": -9.049637794494629, "global_step": 71945, "epoch": 428} {"train_loss": -9.118927001953125, "global_step": 71946, "epoch": 428} {"train_loss": -9.141806602478027, "global_step": 71947, "epoch": 428} {"train_loss": -9.021754264831543, "global_step": 71948, "epoch": 428} {"train_loss": -8.934239387512207, "global_step": 71949, "epoch": 428} {"train_loss": -9.106123924255371, "global_step": 71950, "epoch": 428} {"train_loss": -9.029694557189941, "global_step": 71951, "epoch": 428} {"train_loss": -9.090482711791992, "global_step": 71952, "epoch": 428} {"train_loss": -9.061295509338379, "global_step": 71953, "epoch": 428} {"train_loss": -8.97032642364502, "global_step": 71954, "epoch": 428} {"train_loss": -9.261151313781738, "global_step": 71955, "epoch": 428} {"train_loss": -8.93310260772705, "global_step": 71956, "epoch": 428} {"train_loss": -9.17746639251709, "global_step": 71957, "epoch": 428} {"train_loss": -9.040046691894531, "global_step": 71958, "epoch": 428} {"train_loss": -9.087797164916992, "global_step": 71959, "epoch": 428} {"train_loss": -9.074947357177734, "global_step": 71960, "epoch": 428} {"train_loss": -9.020890235900879, "global_step": 71961, "epoch": 428} {"train_loss": -8.883197784423828, "global_step": 71962, "epoch": 428} {"train_loss": -8.922210693359375, "global_step": 71963, "epoch": 428} {"train_loss": -9.087873458862305, "global_step": 71964, "epoch": 428} {"train_loss": -8.826469421386719, "global_step": 71965, "epoch": 428} {"train_loss": -9.098287582397461, "global_step": 71966, "epoch": 428} {"train_loss": -9.12468147277832, "global_step": 71967, "epoch": 428} {"train_loss": -8.970438957214355, "global_step": 71968, "epoch": 428} {"train_loss": -8.990615844726562, "global_step": 71969, "epoch": 428} {"train_loss": -8.951837539672852, "global_step": 71970, "epoch": 428} {"train_loss": -9.073396682739258, "global_step": 71971, "epoch": 428} {"train_loss": -8.905937194824219, "global_step": 71972, "epoch": 428} {"train_loss": -8.978736877441406, "global_step": 71973, "epoch": 428} {"train_loss": -9.005790710449219, "global_step": 71974, "epoch": 428} {"train_loss": -8.606224060058594, "global_step": 71975, "epoch": 428} {"train_loss": -8.918859481811523, "global_step": 71976, "epoch": 428} {"train_loss": -9.008492469787598, "global_step": 71977, "epoch": 428} {"train_loss": -8.721536636352539, "global_step": 71978, "epoch": 428} {"train_loss": -8.999929428100586, "global_step": 71979, "epoch": 428} {"train_loss": -8.751842498779297, "global_step": 71980, "epoch": 428} {"train_loss": -8.702118873596191, "global_step": 71981, "epoch": 428} {"train_loss": -8.61215877532959, "global_step": 71982, "epoch": 428} {"train_loss": -9.038818359375, "global_step": 71983, "epoch": 428} {"train_loss": -8.685335159301758, "global_step": 71984, "epoch": 428} {"train_loss": -9.1494140625, "global_step": 71985, "epoch": 428} {"train_loss": -9.002363204956055, "global_step": 71986, "epoch": 428} {"train_loss": -8.759012222290039, "global_step": 71987, "epoch": 428} {"train_loss": -8.96119213104248, "global_step": 71988, "epoch": 428} {"train_loss": -9.139256477355957, "global_step": 71989, "epoch": 428} {"train_loss": -9.00541877746582, "global_step": 71990, "epoch": 428} {"train_loss": -9.04096794128418, "global_step": 71991, "epoch": 428} {"train_loss": -8.882558822631836, "global_step": 71992, "epoch": 428} {"train_loss": -9.055044174194336, "global_step": 71993, "epoch": 428} {"train_loss": -8.935050964355469, "global_step": 71994, "epoch": 428} {"train_loss": -8.51094913482666, "global_step": 71995, "epoch": 428} {"train_loss": -8.896231651306152, "global_step": 71996, "epoch": 428} {"train_loss": -8.936320304870605, "global_step": 71997, "epoch": 428} {"train_loss": -8.860897064208984, "global_step": 71998, "epoch": 428} {"train_loss": -8.86871337890625, "global_step": 71999, "epoch": 428} {"train_loss": -9.083182334899902, "global_step": 72000, "epoch": 428} {"train_loss": -8.900129318237305, "global_step": 72001, "epoch": 428} {"train_loss": -8.597124099731445, "global_step": 72002, "epoch": 428} {"train_loss": -9.127849578857422, "global_step": 72003, "epoch": 428} {"train_loss": -8.979257583618164, "global_step": 72004, "epoch": 428} {"train_loss": -9.029507637023926, "global_step": 72005, "epoch": 428} {"train_loss": -8.97513198852539, "global_step": 72006, "epoch": 428} {"train_loss": -9.144017219543457, "global_step": 72007, "epoch": 428} {"train_loss": -9.307579040527344, "global_step": 72008, "epoch": 428} {"train_loss": -9.064292907714844, "global_step": 72009, "epoch": 428} {"train_loss": -9.050518035888672, "global_step": 72010, "epoch": 428} {"train_loss": -9.034774780273438, "global_step": 72011, "epoch": 428} {"train_loss": -9.17679214477539, "global_step": 72012, "epoch": 428} {"train_loss": -9.05323600769043, "global_step": 72013, "epoch": 428} {"train_loss": -9.012609481811523, "global_step": 72014, "epoch": 428} {"train_loss": -9.271547317504883, "global_step": 72015, "epoch": 428} {"train_loss": -9.196800231933594, "global_step": 72016, "epoch": 428} {"train_loss": -9.23379898071289, "global_step": 72017, "epoch": 428} {"train_loss": -9.226088523864746, "global_step": 72018, "epoch": 428} {"train_loss": -9.019791603088379, "global_step": 72019, "epoch": 428} {"train_loss": -8.948812484741211, "global_step": 72020, "epoch": 428} {"train_loss": -8.924476623535156, "global_step": 72021, "epoch": 428} {"train_loss": -8.330159187316895, "global_step": 72022, "epoch": 428} {"train_loss": -8.989675521850586, "global_step": 72023, "epoch": 428} {"train_loss": -8.738219261169434, "global_step": 72024, "epoch": 428} {"train_loss": -8.889179229736328, "global_step": 72025, "epoch": 428} {"train_loss": -8.630624771118164, "global_step": 72026, "epoch": 428} {"train_loss": -8.510237693786621, "global_step": 72027, "epoch": 428} {"train_loss": -8.93569564819336, "global_step": 72028, "epoch": 428} {"train_loss": -8.915040969848633, "global_step": 72029, "epoch": 428} {"train_loss": -8.908177375793457, "global_step": 72030, "epoch": 428} {"train_loss": -8.977462768554688, "global_step": 72031, "epoch": 428} {"train_loss": -8.89574909210205, "global_step": 72032, "epoch": 428} {"train_loss": -8.965087890625, "global_step": 72033, "epoch": 428} {"train_loss": -8.909408569335938, "global_step": 72034, "epoch": 428} {"train_loss": -9.0890474319458, "global_step": 72035, "epoch": 428} {"train_loss": -8.990240097045898, "global_step": 72036, "epoch": 428} {"train_loss": -8.69798469543457, "global_step": 72037, "epoch": 428} {"train_loss": -8.779152870178223, "global_step": 72038, "epoch": 428} {"train_loss": -8.852821350097656, "global_step": 72039, "epoch": 428} {"train_loss": -9.021693229675293, "global_step": 72040, "epoch": 428} {"train_loss": -9.070289611816406, "global_step": 72041, "epoch": 428} {"train_loss": -9.152599334716797, "global_step": 72042, "epoch": 428} {"train_loss": -8.940902709960938, "global_step": 72043, "epoch": 428} {"train_loss": -8.833066940307617, "global_step": 72044, "epoch": 428} {"train_loss": -9.039644241333008, "global_step": 72045, "epoch": 428} {"train_loss": -9.011829376220703, "global_step": 72046, "epoch": 428} {"train_loss": -9.13787841796875, "global_step": 72047, "epoch": 428} {"train_loss": -9.224433898925781, "global_step": 72048, "epoch": 428} {"train_loss": -9.027541160583496, "global_step": 72049, "epoch": 428} {"train_loss": -8.780939102172852, "global_step": 72050, "epoch": 428} {"train_loss": -8.854711532592773, "global_step": 72051, "epoch": 428} {"train_loss": -8.551374435424805, "global_step": 72052, "epoch": 428} {"train_loss": -8.889579772949219, "global_step": 72053, "epoch": 428} {"train_loss": -8.726198196411133, "global_step": 72054, "epoch": 428} {"train_loss": -8.917583465576172, "global_step": 72055, "epoch": 428} {"train_loss": -8.654802322387695, "global_step": 72056, "epoch": 428} {"train_loss": -8.943864822387695, "global_step": 72057, "epoch": 428} {"train_loss": -8.786191940307617, "global_step": 72058, "epoch": 428} {"train_loss": -8.839012145996094, "global_step": 72059, "epoch": 428} {"train_loss": -8.758519172668457, "global_step": 72060, "epoch": 428} {"train_loss": -8.792142868041992, "global_step": 72061, "epoch": 428} {"train_loss": -9.053464889526367, "global_step": 72062, "epoch": 428} {"train_loss": -8.654129028320312, "global_step": 72063, "epoch": 428} {"train_loss": -8.777973175048828, "global_step": 72064, "epoch": 428} {"train_loss": -8.678993225097656, "global_step": 72065, "epoch": 428} {"train_loss": -8.791881561279297, "global_step": 72066, "epoch": 428} {"train_loss": -8.997385025024414, "global_step": 72067, "epoch": 428} {"train_loss": -8.896318435668945, "global_step": 72068, "epoch": 428} {"train_loss": -9.002965927124023, "global_step": 72069, "epoch": 428} {"train_loss": -8.790440559387207, "global_step": 72070, "epoch": 428} {"train_loss": -8.941707809766134, "global_step": 72071, "epoch": 428, "val_loss": 195503.640625} {"train_loss": -9.135845184326172, "global_step": 72072, "epoch": 429} {"train_loss": -9.138463973999023, "global_step": 72073, "epoch": 429} {"train_loss": -8.964044570922852, "global_step": 72074, "epoch": 429} {"train_loss": -9.059808731079102, "global_step": 72075, "epoch": 429} {"train_loss": -8.977724075317383, "global_step": 72076, "epoch": 429} {"train_loss": -8.832357406616211, "global_step": 72077, "epoch": 429} {"train_loss": -9.113248825073242, "global_step": 72078, "epoch": 429} {"train_loss": -9.000635147094727, "global_step": 72079, "epoch": 429} {"train_loss": -9.034418106079102, "global_step": 72080, "epoch": 429} {"train_loss": -9.254195213317871, "global_step": 72081, "epoch": 429} {"train_loss": -8.765175819396973, "global_step": 72082, "epoch": 429} {"train_loss": -9.116059303283691, "global_step": 72083, "epoch": 429} {"train_loss": -8.888118743896484, "global_step": 72084, "epoch": 429} {"train_loss": -9.081249237060547, "global_step": 72085, "epoch": 429} {"train_loss": -8.780374526977539, "global_step": 72086, "epoch": 429} {"train_loss": -8.807657241821289, "global_step": 72087, "epoch": 429} {"train_loss": -8.881114959716797, "global_step": 72088, "epoch": 429} {"train_loss": -8.87492561340332, "global_step": 72089, "epoch": 429} {"train_loss": -9.216362953186035, "global_step": 72090, "epoch": 429} {"train_loss": -9.002575874328613, "global_step": 72091, "epoch": 429} {"train_loss": -9.134990692138672, "global_step": 72092, "epoch": 429} {"train_loss": -9.194826126098633, "global_step": 72093, "epoch": 429} {"train_loss": -9.350118637084961, "global_step": 72094, "epoch": 429} {"train_loss": -8.953886032104492, "global_step": 72095, "epoch": 429} {"train_loss": -8.882112503051758, "global_step": 72096, "epoch": 429} {"train_loss": -9.072566986083984, "global_step": 72097, "epoch": 429} {"train_loss": -9.16673469543457, "global_step": 72098, "epoch": 429} {"train_loss": -9.325628280639648, "global_step": 72099, "epoch": 429} {"train_loss": -8.752574920654297, "global_step": 72100, "epoch": 429} {"train_loss": -9.084283828735352, "global_step": 72101, "epoch": 429} {"train_loss": -8.861091613769531, "global_step": 72102, "epoch": 429} {"train_loss": -9.030149459838867, "global_step": 72103, "epoch": 429} {"train_loss": -8.999467849731445, "global_step": 72104, "epoch": 429} {"train_loss": -8.775620460510254, "global_step": 72105, "epoch": 429} {"train_loss": -8.794845581054688, "global_step": 72106, "epoch": 429} {"train_loss": -9.049704551696777, "global_step": 72107, "epoch": 429} {"train_loss": -9.130781173706055, "global_step": 72108, "epoch": 429} {"train_loss": -9.107701301574707, "global_step": 72109, "epoch": 429} {"train_loss": -9.098930358886719, "global_step": 72110, "epoch": 429} {"train_loss": -8.753471374511719, "global_step": 72111, "epoch": 429} {"train_loss": -9.191320419311523, "global_step": 72112, "epoch": 429} {"train_loss": -9.142633438110352, "global_step": 72113, "epoch": 429} {"train_loss": -8.934674263000488, "global_step": 72114, "epoch": 429} {"train_loss": -9.15574836730957, "global_step": 72115, "epoch": 429} {"train_loss": -8.99014663696289, "global_step": 72116, "epoch": 429} {"train_loss": -9.066167831420898, "global_step": 72117, "epoch": 429} {"train_loss": -9.07253360748291, "global_step": 72118, "epoch": 429} {"train_loss": -9.191198348999023, "global_step": 72119, "epoch": 429} {"train_loss": -9.27672004699707, "global_step": 72120, "epoch": 429} {"train_loss": -8.85583209991455, "global_step": 72121, "epoch": 429} {"train_loss": -9.25047779083252, "global_step": 72122, "epoch": 429} {"train_loss": -9.08852767944336, "global_step": 72123, "epoch": 429} {"train_loss": -8.93642807006836, "global_step": 72124, "epoch": 429} {"train_loss": -9.074941635131836, "global_step": 72125, "epoch": 429} {"train_loss": -9.09105110168457, "global_step": 72126, "epoch": 429} {"train_loss": -9.06223201751709, "global_step": 72127, "epoch": 429} {"train_loss": -8.910533905029297, "global_step": 72128, "epoch": 429} {"train_loss": -8.754234313964844, "global_step": 72129, "epoch": 429} {"train_loss": -9.005084037780762, "global_step": 72130, "epoch": 429} {"train_loss": -9.170053482055664, "global_step": 72131, "epoch": 429} {"train_loss": -9.005067825317383, "global_step": 72132, "epoch": 429} {"train_loss": -9.053034782409668, "global_step": 72133, "epoch": 429} {"train_loss": -9.217813491821289, "global_step": 72134, "epoch": 429} {"train_loss": -9.312013626098633, "global_step": 72135, "epoch": 429} {"train_loss": -9.229825973510742, "global_step": 72136, "epoch": 429} {"train_loss": -9.162302017211914, "global_step": 72137, "epoch": 429} {"train_loss": -9.05940055847168, "global_step": 72138, "epoch": 429} {"train_loss": -8.981224060058594, "global_step": 72139, "epoch": 429} {"train_loss": -8.862157821655273, "global_step": 72140, "epoch": 429} {"train_loss": -9.236330032348633, "global_step": 72141, "epoch": 429} {"train_loss": -8.970317840576172, "global_step": 72142, "epoch": 429} {"train_loss": -9.489875793457031, "global_step": 72143, "epoch": 429} {"train_loss": -9.028730392456055, "global_step": 72144, "epoch": 429} {"train_loss": -8.908052444458008, "global_step": 72145, "epoch": 429} {"train_loss": -9.099872589111328, "global_step": 72146, "epoch": 429} {"train_loss": -9.105703353881836, "global_step": 72147, "epoch": 429} {"train_loss": -9.07191276550293, "global_step": 72148, "epoch": 429} {"train_loss": -9.184320449829102, "global_step": 72149, "epoch": 429} {"train_loss": -9.140532493591309, "global_step": 72150, "epoch": 429} {"train_loss": -9.181581497192383, "global_step": 72151, "epoch": 429} {"train_loss": -9.023507118225098, "global_step": 72152, "epoch": 429} {"train_loss": -9.07377815246582, "global_step": 72153, "epoch": 429} {"train_loss": -9.018302917480469, "global_step": 72154, "epoch": 429} {"train_loss": -9.20380687713623, "global_step": 72155, "epoch": 429} {"train_loss": -8.942340850830078, "global_step": 72156, "epoch": 429} {"train_loss": -9.360840797424316, "global_step": 72157, "epoch": 429} {"train_loss": -8.91911506652832, "global_step": 72158, "epoch": 429} {"train_loss": -9.309220314025879, "global_step": 72159, "epoch": 429} {"train_loss": -9.084162712097168, "global_step": 72160, "epoch": 429} {"train_loss": -8.83452033996582, "global_step": 72161, "epoch": 429} {"train_loss": -8.947160720825195, "global_step": 72162, "epoch": 429} {"train_loss": -9.086556434631348, "global_step": 72163, "epoch": 429} {"train_loss": -9.044533729553223, "global_step": 72164, "epoch": 429} {"train_loss": -8.96371078491211, "global_step": 72165, "epoch": 429} {"train_loss": -9.263325691223145, "global_step": 72166, "epoch": 429} {"train_loss": -8.757326126098633, "global_step": 72167, "epoch": 429} {"train_loss": -9.265952110290527, "global_step": 72168, "epoch": 429} {"train_loss": -9.013946533203125, "global_step": 72169, "epoch": 429} {"train_loss": -8.679422378540039, "global_step": 72170, "epoch": 429} {"train_loss": -8.743531227111816, "global_step": 72171, "epoch": 429} {"train_loss": -8.959612846374512, "global_step": 72172, "epoch": 429} {"train_loss": -8.768902778625488, "global_step": 72173, "epoch": 429} {"train_loss": -9.075273513793945, "global_step": 72174, "epoch": 429} {"train_loss": -8.976629257202148, "global_step": 72175, "epoch": 429} {"train_loss": -8.75776195526123, "global_step": 72176, "epoch": 429} {"train_loss": -9.034791946411133, "global_step": 72177, "epoch": 429} {"train_loss": -8.944452285766602, "global_step": 72178, "epoch": 429} {"train_loss": -8.839963912963867, "global_step": 72179, "epoch": 429} {"train_loss": -8.861701965332031, "global_step": 72180, "epoch": 429} {"train_loss": -8.912633895874023, "global_step": 72181, "epoch": 429} {"train_loss": -8.925346374511719, "global_step": 72182, "epoch": 429} {"train_loss": -8.730182647705078, "global_step": 72183, "epoch": 429} {"train_loss": -8.891899108886719, "global_step": 72184, "epoch": 429} {"train_loss": -8.931185722351074, "global_step": 72185, "epoch": 429} {"train_loss": -8.993200302124023, "global_step": 72186, "epoch": 429} {"train_loss": -8.871037483215332, "global_step": 72187, "epoch": 429} {"train_loss": -9.060586929321289, "global_step": 72188, "epoch": 429} {"train_loss": -9.063684463500977, "global_step": 72189, "epoch": 429} {"train_loss": -9.02656364440918, "global_step": 72190, "epoch": 429} {"train_loss": -9.018359184265137, "global_step": 72191, "epoch": 429} {"train_loss": -8.89435863494873, "global_step": 72192, "epoch": 429} {"train_loss": -8.997217178344727, "global_step": 72193, "epoch": 429} {"train_loss": -8.998333930969238, "global_step": 72194, "epoch": 429} {"train_loss": -9.105026245117188, "global_step": 72195, "epoch": 429} {"train_loss": -9.05008316040039, "global_step": 72196, "epoch": 429} {"train_loss": -9.034198760986328, "global_step": 72197, "epoch": 429} {"train_loss": -9.090888977050781, "global_step": 72198, "epoch": 429} {"train_loss": -9.02115535736084, "global_step": 72199, "epoch": 429} {"train_loss": -9.268174171447754, "global_step": 72200, "epoch": 429} {"train_loss": -9.094253540039062, "global_step": 72201, "epoch": 429} {"train_loss": -9.043859481811523, "global_step": 72202, "epoch": 429} {"train_loss": -9.050840377807617, "global_step": 72203, "epoch": 429} {"train_loss": -9.066413879394531, "global_step": 72204, "epoch": 429} {"train_loss": -9.210572242736816, "global_step": 72205, "epoch": 429} {"train_loss": -9.060043334960938, "global_step": 72206, "epoch": 429} {"train_loss": -8.835488319396973, "global_step": 72207, "epoch": 429} {"train_loss": -8.627650260925293, "global_step": 72208, "epoch": 429} {"train_loss": -8.822708129882812, "global_step": 72209, "epoch": 429} {"train_loss": -8.936569213867188, "global_step": 72210, "epoch": 429} {"train_loss": -8.868231773376465, "global_step": 72211, "epoch": 429} {"train_loss": -8.753562927246094, "global_step": 72212, "epoch": 429} {"train_loss": -8.872369766235352, "global_step": 72213, "epoch": 429} {"train_loss": -8.851423263549805, "global_step": 72214, "epoch": 429} {"train_loss": -8.844985961914062, "global_step": 72215, "epoch": 429} {"train_loss": -8.64202880859375, "global_step": 72216, "epoch": 429} {"train_loss": -8.995062828063965, "global_step": 72217, "epoch": 429} {"train_loss": -8.66685676574707, "global_step": 72218, "epoch": 429} {"train_loss": -8.746155738830566, "global_step": 72219, "epoch": 429} {"train_loss": -8.73944091796875, "global_step": 72220, "epoch": 429} {"train_loss": -8.785463333129883, "global_step": 72221, "epoch": 429} {"train_loss": -8.529696464538574, "global_step": 72222, "epoch": 429} {"train_loss": -8.674266815185547, "global_step": 72223, "epoch": 429} {"train_loss": -8.93722152709961, "global_step": 72224, "epoch": 429} {"train_loss": -8.603442192077637, "global_step": 72225, "epoch": 429} {"train_loss": -8.724977493286133, "global_step": 72226, "epoch": 429} {"train_loss": -8.796682357788086, "global_step": 72227, "epoch": 429} {"train_loss": -8.967489242553711, "global_step": 72228, "epoch": 429} {"train_loss": -8.612058639526367, "global_step": 72229, "epoch": 429} {"train_loss": -8.818058967590332, "global_step": 72230, "epoch": 429} {"train_loss": -8.875228881835938, "global_step": 72231, "epoch": 429} {"train_loss": -8.93493938446045, "global_step": 72232, "epoch": 429} {"train_loss": -8.751618385314941, "global_step": 72233, "epoch": 429} {"train_loss": -8.770074844360352, "global_step": 72234, "epoch": 429} {"train_loss": -8.891036987304688, "global_step": 72235, "epoch": 429} {"train_loss": -8.707399368286133, "global_step": 72236, "epoch": 429} {"train_loss": -8.925888061523438, "global_step": 72237, "epoch": 429} {"train_loss": -8.98971939086914, "global_step": 72238, "epoch": 429} {"train_loss": -8.984605459939866, "global_step": 72239, "epoch": 429, "val_loss": 193281.5} {"train_loss": -8.955357551574707, "global_step": 72240, "epoch": 430} {"train_loss": -9.08803939819336, "global_step": 72241, "epoch": 430} {"train_loss": -9.230701446533203, "global_step": 72242, "epoch": 430} {"train_loss": -8.96789264678955, "global_step": 72243, "epoch": 430} {"train_loss": -9.051462173461914, "global_step": 72244, "epoch": 430} {"train_loss": -8.893342018127441, "global_step": 72245, "epoch": 430} {"train_loss": -9.1193265914917, "global_step": 72246, "epoch": 430} {"train_loss": -9.047027587890625, "global_step": 72247, "epoch": 430} {"train_loss": -9.253535270690918, "global_step": 72248, "epoch": 430} {"train_loss": -9.204670906066895, "global_step": 72249, "epoch": 430} {"train_loss": -9.294846534729004, "global_step": 72250, "epoch": 430} {"train_loss": -9.214826583862305, "global_step": 72251, "epoch": 430} {"train_loss": -9.074068069458008, "global_step": 72252, "epoch": 430} {"train_loss": -9.08233642578125, "global_step": 72253, "epoch": 430} {"train_loss": -9.201519966125488, "global_step": 72254, "epoch": 430} {"train_loss": -9.064300537109375, "global_step": 72255, "epoch": 430} {"train_loss": -9.30864429473877, "global_step": 72256, "epoch": 430} {"train_loss": -9.231184005737305, "global_step": 72257, "epoch": 430} {"train_loss": -9.357172012329102, "global_step": 72258, "epoch": 430} {"train_loss": -9.278987884521484, "global_step": 72259, "epoch": 430} {"train_loss": -9.270149230957031, "global_step": 72260, "epoch": 430} {"train_loss": -9.164541244506836, "global_step": 72261, "epoch": 430} {"train_loss": -8.858881950378418, "global_step": 72262, "epoch": 430} {"train_loss": -8.87439250946045, "global_step": 72263, "epoch": 430} {"train_loss": -9.256603240966797, "global_step": 72264, "epoch": 430} {"train_loss": -9.093452453613281, "global_step": 72265, "epoch": 430} {"train_loss": -9.264203071594238, "global_step": 72266, "epoch": 430} {"train_loss": -8.982998847961426, "global_step": 72267, "epoch": 430} {"train_loss": -9.086944580078125, "global_step": 72268, "epoch": 430} {"train_loss": -9.18431282043457, "global_step": 72269, "epoch": 430} {"train_loss": -8.770130157470703, "global_step": 72270, "epoch": 430} {"train_loss": -9.20683765411377, "global_step": 72271, "epoch": 430} {"train_loss": -8.884186744689941, "global_step": 72272, "epoch": 430} {"train_loss": -8.98312759399414, "global_step": 72273, "epoch": 430} {"train_loss": -9.225988388061523, "global_step": 72274, "epoch": 430} {"train_loss": -9.01702880859375, "global_step": 72275, "epoch": 430} {"train_loss": -9.014999389648438, "global_step": 72276, "epoch": 430} {"train_loss": -9.065603256225586, "global_step": 72277, "epoch": 430} {"train_loss": -8.886707305908203, "global_step": 72278, "epoch": 430} {"train_loss": -9.013055801391602, "global_step": 72279, "epoch": 430} {"train_loss": -9.05975341796875, "global_step": 72280, "epoch": 430} {"train_loss": -9.012313842773438, "global_step": 72281, "epoch": 430} {"train_loss": -9.095951080322266, "global_step": 72282, "epoch": 430} {"train_loss": -8.995574951171875, "global_step": 72283, "epoch": 430} {"train_loss": -8.921878814697266, "global_step": 72284, "epoch": 430} {"train_loss": -8.82092571258545, "global_step": 72285, "epoch": 430} {"train_loss": -9.156576156616211, "global_step": 72286, "epoch": 430} {"train_loss": -8.997867584228516, "global_step": 72287, "epoch": 430} {"train_loss": -8.79891586303711, "global_step": 72288, "epoch": 430} {"train_loss": -9.011951446533203, "global_step": 72289, "epoch": 430} {"train_loss": -8.634952545166016, "global_step": 72290, "epoch": 430} {"train_loss": -8.74241828918457, "global_step": 72291, "epoch": 430} {"train_loss": -9.157289505004883, "global_step": 72292, "epoch": 430} {"train_loss": -8.73605728149414, "global_step": 72293, "epoch": 430} {"train_loss": -8.880340576171875, "global_step": 72294, "epoch": 430} {"train_loss": -9.113423347473145, "global_step": 72295, "epoch": 430} {"train_loss": -8.96940803527832, "global_step": 72296, "epoch": 430} {"train_loss": -9.062201499938965, "global_step": 72297, "epoch": 430} {"train_loss": -9.055350303649902, "global_step": 72298, "epoch": 430} {"train_loss": -9.014823913574219, "global_step": 72299, "epoch": 430} {"train_loss": -8.846711158752441, "global_step": 72300, "epoch": 430} {"train_loss": -9.065011978149414, "global_step": 72301, "epoch": 430} {"train_loss": -8.836222648620605, "global_step": 72302, "epoch": 430} {"train_loss": -8.87781047821045, "global_step": 72303, "epoch": 430} {"train_loss": -8.576212882995605, "global_step": 72304, "epoch": 430} {"train_loss": -8.532886505126953, "global_step": 72305, "epoch": 430} {"train_loss": -8.965085983276367, "global_step": 72306, "epoch": 430} {"train_loss": -8.934709548950195, "global_step": 72307, "epoch": 430} {"train_loss": -8.544971466064453, "global_step": 72308, "epoch": 430} {"train_loss": -8.992181777954102, "global_step": 72309, "epoch": 430} {"train_loss": -8.709339141845703, "global_step": 72310, "epoch": 430} {"train_loss": -8.793766021728516, "global_step": 72311, "epoch": 430} {"train_loss": -8.936954498291016, "global_step": 72312, "epoch": 430} {"train_loss": -8.824102401733398, "global_step": 72313, "epoch": 430} {"train_loss": -8.863262176513672, "global_step": 72314, "epoch": 430} {"train_loss": -8.800861358642578, "global_step": 72315, "epoch": 430} {"train_loss": -8.876225471496582, "global_step": 72316, "epoch": 430} {"train_loss": -8.705059051513672, "global_step": 72317, "epoch": 430} {"train_loss": -8.948159217834473, "global_step": 72318, "epoch": 430} {"train_loss": -8.707443237304688, "global_step": 72319, "epoch": 430} {"train_loss": -8.887288093566895, "global_step": 72320, "epoch": 430} {"train_loss": -8.726639747619629, "global_step": 72321, "epoch": 430} {"train_loss": -8.947389602661133, "global_step": 72322, "epoch": 430} {"train_loss": -9.008890151977539, "global_step": 72323, "epoch": 430} {"train_loss": -8.897090911865234, "global_step": 72324, "epoch": 430} {"train_loss": -8.839615821838379, "global_step": 72325, "epoch": 430} {"train_loss": -8.792970657348633, "global_step": 72326, "epoch": 430} {"train_loss": -9.161418914794922, "global_step": 72327, "epoch": 430} {"train_loss": -8.91580867767334, "global_step": 72328, "epoch": 430} {"train_loss": -8.960638046264648, "global_step": 72329, "epoch": 430} {"train_loss": -8.777042388916016, "global_step": 72330, "epoch": 430} {"train_loss": -8.914112091064453, "global_step": 72331, "epoch": 430} {"train_loss": -9.122827529907227, "global_step": 72332, "epoch": 430} {"train_loss": -8.896520614624023, "global_step": 72333, "epoch": 430} {"train_loss": -9.200499534606934, "global_step": 72334, "epoch": 430} {"train_loss": -9.117902755737305, "global_step": 72335, "epoch": 430} {"train_loss": -9.180349349975586, "global_step": 72336, "epoch": 430} {"train_loss": -8.843595504760742, "global_step": 72337, "epoch": 430} {"train_loss": -9.154402732849121, "global_step": 72338, "epoch": 430} {"train_loss": -8.989494323730469, "global_step": 72339, "epoch": 430} {"train_loss": -8.861560821533203, "global_step": 72340, "epoch": 430} {"train_loss": -8.991443634033203, "global_step": 72341, "epoch": 430} {"train_loss": -9.288095474243164, "global_step": 72342, "epoch": 430} {"train_loss": -8.920330047607422, "global_step": 72343, "epoch": 430} {"train_loss": -9.102713584899902, "global_step": 72344, "epoch": 430} {"train_loss": -9.178442001342773, "global_step": 72345, "epoch": 430} {"train_loss": -8.995004653930664, "global_step": 72346, "epoch": 430} {"train_loss": -9.21347713470459, "global_step": 72347, "epoch": 430} {"train_loss": -8.900674819946289, "global_step": 72348, "epoch": 430} {"train_loss": -8.947484970092773, "global_step": 72349, "epoch": 430} {"train_loss": -9.049622535705566, "global_step": 72350, "epoch": 430} {"train_loss": -8.941364288330078, "global_step": 72351, "epoch": 430} {"train_loss": -8.981559753417969, "global_step": 72352, "epoch": 430} {"train_loss": -9.068530082702637, "global_step": 72353, "epoch": 430} {"train_loss": -8.958002090454102, "global_step": 72354, "epoch": 430} {"train_loss": -8.95291805267334, "global_step": 72355, "epoch": 430} {"train_loss": -8.928287506103516, "global_step": 72356, "epoch": 430} {"train_loss": -8.86756706237793, "global_step": 72357, "epoch": 430} {"train_loss": -9.013751029968262, "global_step": 72358, "epoch": 430} {"train_loss": -9.009847640991211, "global_step": 72359, "epoch": 430} {"train_loss": -8.96577262878418, "global_step": 72360, "epoch": 430} {"train_loss": -8.986072540283203, "global_step": 72361, "epoch": 430} {"train_loss": -9.087928771972656, "global_step": 72362, "epoch": 430} {"train_loss": -8.882919311523438, "global_step": 72363, "epoch": 430} {"train_loss": -8.6467924118042, "global_step": 72364, "epoch": 430} {"train_loss": -9.00844955444336, "global_step": 72365, "epoch": 430} {"train_loss": -8.853033065795898, "global_step": 72366, "epoch": 430} {"train_loss": -8.315689086914062, "global_step": 72367, "epoch": 430} {"train_loss": -8.560956954956055, "global_step": 72368, "epoch": 430} {"train_loss": -8.937891006469727, "global_step": 72369, "epoch": 430} {"train_loss": -8.609067916870117, "global_step": 72370, "epoch": 430} {"train_loss": -8.415227890014648, "global_step": 72371, "epoch": 430} {"train_loss": -8.545526504516602, "global_step": 72372, "epoch": 430} {"train_loss": -8.567991256713867, "global_step": 72373, "epoch": 430} {"train_loss": -8.880972862243652, "global_step": 72374, "epoch": 430} {"train_loss": -8.625932693481445, "global_step": 72375, "epoch": 430} {"train_loss": -8.669219017028809, "global_step": 72376, "epoch": 430} {"train_loss": -8.738273620605469, "global_step": 72377, "epoch": 430} {"train_loss": -8.84115219116211, "global_step": 72378, "epoch": 430} {"train_loss": -8.783580780029297, "global_step": 72379, "epoch": 430} {"train_loss": -9.02754020690918, "global_step": 72380, "epoch": 430} {"train_loss": -8.991573333740234, "global_step": 72381, "epoch": 430} {"train_loss": -8.99232006072998, "global_step": 72382, "epoch": 430} {"train_loss": -8.844504356384277, "global_step": 72383, "epoch": 430} {"train_loss": -8.981738090515137, "global_step": 72384, "epoch": 430} {"train_loss": -9.054709434509277, "global_step": 72385, "epoch": 430} {"train_loss": -8.987668991088867, "global_step": 72386, "epoch": 430} {"train_loss": -9.111247062683105, "global_step": 72387, "epoch": 430} {"train_loss": -9.016059875488281, "global_step": 72388, "epoch": 430} {"train_loss": -9.237821578979492, "global_step": 72389, "epoch": 430} {"train_loss": -9.014371871948242, "global_step": 72390, "epoch": 430} {"train_loss": -8.994746208190918, "global_step": 72391, "epoch": 430} {"train_loss": -9.289488792419434, "global_step": 72392, "epoch": 430} {"train_loss": -9.125618934631348, "global_step": 72393, "epoch": 430} {"train_loss": -9.144627571105957, "global_step": 72394, "epoch": 430} {"train_loss": -9.024213790893555, "global_step": 72395, "epoch": 430} {"train_loss": -9.199490547180176, "global_step": 72396, "epoch": 430} {"train_loss": -8.926973342895508, "global_step": 72397, "epoch": 430} {"train_loss": -8.878456115722656, "global_step": 72398, "epoch": 430} {"train_loss": -8.954513549804688, "global_step": 72399, "epoch": 430} {"train_loss": -8.91421890258789, "global_step": 72400, "epoch": 430} {"train_loss": -9.115394592285156, "global_step": 72401, "epoch": 430} {"train_loss": -9.053535461425781, "global_step": 72402, "epoch": 430} {"train_loss": -8.919663429260254, "global_step": 72403, "epoch": 430} {"train_loss": -8.900100708007812, "global_step": 72404, "epoch": 430} {"train_loss": -8.875856399536133, "global_step": 72405, "epoch": 430} {"train_loss": -8.844416618347168, "global_step": 72406, "epoch": 430} {"train_loss": -8.965942905062722, "global_step": 72407, "epoch": 430, "val_loss": 194388.46875, "train_action_mse_error": 9.001470565795898} {"train_loss": -8.814735412597656, "global_step": 72408, "epoch": 431} {"train_loss": -8.773872375488281, "global_step": 72409, "epoch": 431} {"train_loss": -8.834474563598633, "global_step": 72410, "epoch": 431} {"train_loss": -8.629870414733887, "global_step": 72411, "epoch": 431} {"train_loss": -8.672201156616211, "global_step": 72412, "epoch": 431} {"train_loss": -8.73495101928711, "global_step": 72413, "epoch": 431} {"train_loss": -8.557210922241211, "global_step": 72414, "epoch": 431} {"train_loss": -8.863258361816406, "global_step": 72415, "epoch": 431} {"train_loss": -8.914621353149414, "global_step": 72416, "epoch": 431} {"train_loss": -8.704610824584961, "global_step": 72417, "epoch": 431} {"train_loss": -8.6458740234375, "global_step": 72418, "epoch": 431} {"train_loss": -8.990323066711426, "global_step": 72419, "epoch": 431} {"train_loss": -8.871761322021484, "global_step": 72420, "epoch": 431} {"train_loss": -8.869214057922363, "global_step": 72421, "epoch": 431} {"train_loss": -8.902053833007812, "global_step": 72422, "epoch": 431} {"train_loss": -8.882549285888672, "global_step": 72423, "epoch": 431} {"train_loss": -9.117767333984375, "global_step": 72424, "epoch": 431} {"train_loss": -8.999277114868164, "global_step": 72425, "epoch": 431} {"train_loss": -8.748190879821777, "global_step": 72426, "epoch": 431} {"train_loss": -9.335756301879883, "global_step": 72427, "epoch": 431} {"train_loss": -9.020471572875977, "global_step": 72428, "epoch": 431} {"train_loss": -8.79885482788086, "global_step": 72429, "epoch": 431} {"train_loss": -9.268511772155762, "global_step": 72430, "epoch": 431} {"train_loss": -8.7645263671875, "global_step": 72431, "epoch": 431} {"train_loss": -9.034123420715332, "global_step": 72432, "epoch": 431} {"train_loss": -8.838419914245605, "global_step": 72433, "epoch": 431} {"train_loss": -9.063512802124023, "global_step": 72434, "epoch": 431} {"train_loss": -8.826898574829102, "global_step": 72435, "epoch": 431} {"train_loss": -8.892241477966309, "global_step": 72436, "epoch": 431} {"train_loss": -8.912473678588867, "global_step": 72437, "epoch": 431} {"train_loss": -8.754332542419434, "global_step": 72438, "epoch": 431} {"train_loss": -9.302237510681152, "global_step": 72439, "epoch": 431} {"train_loss": -9.136966705322266, "global_step": 72440, "epoch": 431} {"train_loss": -9.302373886108398, "global_step": 72441, "epoch": 431} {"train_loss": -9.301194190979004, "global_step": 72442, "epoch": 431} {"train_loss": -8.952857971191406, "global_step": 72443, "epoch": 431} {"train_loss": -9.04046630859375, "global_step": 72444, "epoch": 431} {"train_loss": -9.252328872680664, "global_step": 72445, "epoch": 431} {"train_loss": -8.9296875, "global_step": 72446, "epoch": 431} {"train_loss": -8.912187576293945, "global_step": 72447, "epoch": 431} {"train_loss": -9.279373168945312, "global_step": 72448, "epoch": 431} {"train_loss": -9.051122665405273, "global_step": 72449, "epoch": 431} {"train_loss": -9.240293502807617, "global_step": 72450, "epoch": 431} {"train_loss": -9.064445495605469, "global_step": 72451, "epoch": 431} {"train_loss": -9.127050399780273, "global_step": 72452, "epoch": 431} {"train_loss": -9.249855041503906, "global_step": 72453, "epoch": 431} {"train_loss": -9.110620498657227, "global_step": 72454, "epoch": 431} {"train_loss": -9.10461139678955, "global_step": 72455, "epoch": 431} {"train_loss": -9.02310562133789, "global_step": 72456, "epoch": 431} {"train_loss": -8.98213005065918, "global_step": 72457, "epoch": 431} {"train_loss": -9.011130332946777, "global_step": 72458, "epoch": 431} {"train_loss": -9.232105255126953, "global_step": 72459, "epoch": 431} {"train_loss": -8.829360961914062, "global_step": 72460, "epoch": 431} {"train_loss": -8.866875648498535, "global_step": 72461, "epoch": 431} {"train_loss": -9.127120971679688, "global_step": 72462, "epoch": 431} {"train_loss": -8.754118919372559, "global_step": 72463, "epoch": 431} {"train_loss": -8.949177742004395, "global_step": 72464, "epoch": 431} {"train_loss": -8.811885833740234, "global_step": 72465, "epoch": 431} {"train_loss": -8.938108444213867, "global_step": 72466, "epoch": 431} {"train_loss": -8.874590873718262, "global_step": 72467, "epoch": 431} {"train_loss": -8.912209510803223, "global_step": 72468, "epoch": 431} {"train_loss": -8.793272972106934, "global_step": 72469, "epoch": 431} {"train_loss": -9.045380592346191, "global_step": 72470, "epoch": 431} {"train_loss": -8.957389831542969, "global_step": 72471, "epoch": 431} {"train_loss": -8.827362060546875, "global_step": 72472, "epoch": 431} {"train_loss": -8.791563034057617, "global_step": 72473, "epoch": 431} {"train_loss": -8.78330135345459, "global_step": 72474, "epoch": 431} {"train_loss": -8.618962287902832, "global_step": 72475, "epoch": 431} {"train_loss": -8.77939510345459, "global_step": 72476, "epoch": 431} {"train_loss": -9.12549114227295, "global_step": 72477, "epoch": 431} {"train_loss": -8.890438079833984, "global_step": 72478, "epoch": 431} {"train_loss": -8.949002265930176, "global_step": 72479, "epoch": 431} {"train_loss": -8.565751075744629, "global_step": 72480, "epoch": 431} {"train_loss": -9.10015869140625, "global_step": 72481, "epoch": 431} {"train_loss": -9.01852798461914, "global_step": 72482, "epoch": 431} {"train_loss": -9.048578262329102, "global_step": 72483, "epoch": 431} {"train_loss": -8.963993072509766, "global_step": 72484, "epoch": 431} {"train_loss": -9.025440216064453, "global_step": 72485, "epoch": 431} {"train_loss": -8.749380111694336, "global_step": 72486, "epoch": 431} {"train_loss": -9.086048126220703, "global_step": 72487, "epoch": 431} {"train_loss": -8.898345947265625, "global_step": 72488, "epoch": 431} {"train_loss": -8.956676483154297, "global_step": 72489, "epoch": 431} {"train_loss": -9.120771408081055, "global_step": 72490, "epoch": 431} {"train_loss": -9.1735258102417, "global_step": 72491, "epoch": 431} {"train_loss": -9.27672004699707, "global_step": 72492, "epoch": 431} {"train_loss": -9.202529907226562, "global_step": 72493, "epoch": 431} {"train_loss": -9.096458435058594, "global_step": 72494, "epoch": 431} {"train_loss": -9.186604499816895, "global_step": 72495, "epoch": 431} {"train_loss": -8.988666534423828, "global_step": 72496, "epoch": 431} {"train_loss": -8.97728157043457, "global_step": 72497, "epoch": 431} {"train_loss": -8.747159004211426, "global_step": 72498, "epoch": 431} {"train_loss": -9.129281997680664, "global_step": 72499, "epoch": 431} {"train_loss": -8.753044128417969, "global_step": 72500, "epoch": 431} {"train_loss": -9.004903793334961, "global_step": 72501, "epoch": 431} {"train_loss": -9.189644813537598, "global_step": 72502, "epoch": 431} {"train_loss": -9.072200775146484, "global_step": 72503, "epoch": 431} {"train_loss": -9.064406394958496, "global_step": 72504, "epoch": 431} {"train_loss": -9.247224807739258, "global_step": 72505, "epoch": 431} {"train_loss": -9.005393981933594, "global_step": 72506, "epoch": 431} {"train_loss": -9.157098770141602, "global_step": 72507, "epoch": 431} {"train_loss": -9.442544937133789, "global_step": 72508, "epoch": 431} {"train_loss": -9.137357711791992, "global_step": 72509, "epoch": 431} {"train_loss": -9.152483940124512, "global_step": 72510, "epoch": 431} {"train_loss": -9.075429916381836, "global_step": 72511, "epoch": 431} {"train_loss": -9.184734344482422, "global_step": 72512, "epoch": 431} {"train_loss": -8.779305458068848, "global_step": 72513, "epoch": 431} {"train_loss": -9.024116516113281, "global_step": 72514, "epoch": 431} {"train_loss": -8.935847282409668, "global_step": 72515, "epoch": 431} {"train_loss": -8.982027053833008, "global_step": 72516, "epoch": 431} {"train_loss": -9.000252723693848, "global_step": 72517, "epoch": 431} {"train_loss": -8.644861221313477, "global_step": 72518, "epoch": 431} {"train_loss": -9.126411437988281, "global_step": 72519, "epoch": 431} {"train_loss": -9.071348190307617, "global_step": 72520, "epoch": 431} {"train_loss": -8.974451065063477, "global_step": 72521, "epoch": 431} {"train_loss": -9.032219886779785, "global_step": 72522, "epoch": 431} {"train_loss": -8.940452575683594, "global_step": 72523, "epoch": 431} {"train_loss": -9.035221099853516, "global_step": 72524, "epoch": 431} {"train_loss": -8.599132537841797, "global_step": 72525, "epoch": 431} {"train_loss": -9.056686401367188, "global_step": 72526, "epoch": 431} {"train_loss": -8.669754028320312, "global_step": 72527, "epoch": 431} {"train_loss": -8.777155876159668, "global_step": 72528, "epoch": 431} {"train_loss": -8.58383560180664, "global_step": 72529, "epoch": 431} {"train_loss": -8.751341819763184, "global_step": 72530, "epoch": 431} {"train_loss": -8.848657608032227, "global_step": 72531, "epoch": 431} {"train_loss": -8.724276542663574, "global_step": 72532, "epoch": 431} {"train_loss": -8.923162460327148, "global_step": 72533, "epoch": 431} {"train_loss": -8.770477294921875, "global_step": 72534, "epoch": 431} {"train_loss": -8.858376502990723, "global_step": 72535, "epoch": 431} {"train_loss": -8.813395500183105, "global_step": 72536, "epoch": 431} {"train_loss": -8.980463027954102, "global_step": 72537, "epoch": 431} {"train_loss": -8.660757064819336, "global_step": 72538, "epoch": 431} {"train_loss": -8.88813304901123, "global_step": 72539, "epoch": 431} {"train_loss": -8.946929931640625, "global_step": 72540, "epoch": 431} {"train_loss": -9.070486068725586, "global_step": 72541, "epoch": 431} {"train_loss": -8.820554733276367, "global_step": 72542, "epoch": 431} {"train_loss": -8.936036109924316, "global_step": 72543, "epoch": 431} {"train_loss": -9.120319366455078, "global_step": 72544, "epoch": 431} {"train_loss": -8.784322738647461, "global_step": 72545, "epoch": 431} {"train_loss": -8.88864517211914, "global_step": 72546, "epoch": 431} {"train_loss": -8.955245971679688, "global_step": 72547, "epoch": 431} {"train_loss": -8.860679626464844, "global_step": 72548, "epoch": 431} {"train_loss": -8.71120548248291, "global_step": 72549, "epoch": 431} {"train_loss": -8.74775505065918, "global_step": 72550, "epoch": 431} {"train_loss": -8.944099426269531, "global_step": 72551, "epoch": 431} {"train_loss": -8.991681098937988, "global_step": 72552, "epoch": 431} {"train_loss": -8.822104454040527, "global_step": 72553, "epoch": 431} {"train_loss": -8.903696060180664, "global_step": 72554, "epoch": 431} {"train_loss": -8.826891899108887, "global_step": 72555, "epoch": 431} {"train_loss": -8.764028549194336, "global_step": 72556, "epoch": 431} {"train_loss": -8.892404556274414, "global_step": 72557, "epoch": 431} {"train_loss": -9.031367301940918, "global_step": 72558, "epoch": 431} {"train_loss": -8.848904609680176, "global_step": 72559, "epoch": 431} {"train_loss": -8.939484596252441, "global_step": 72560, "epoch": 431} {"train_loss": -9.03878116607666, "global_step": 72561, "epoch": 431} {"train_loss": -9.085866928100586, "global_step": 72562, "epoch": 431} {"train_loss": -9.304197311401367, "global_step": 72563, "epoch": 431} {"train_loss": -9.190101623535156, "global_step": 72564, "epoch": 431} {"train_loss": -9.166893005371094, "global_step": 72565, "epoch": 431} {"train_loss": -9.023004531860352, "global_step": 72566, "epoch": 431} {"train_loss": -9.260788917541504, "global_step": 72567, "epoch": 431} {"train_loss": -9.186468124389648, "global_step": 72568, "epoch": 431} {"train_loss": -9.030824661254883, "global_step": 72569, "epoch": 431} {"train_loss": -9.024888038635254, "global_step": 72570, "epoch": 431} {"train_loss": -9.140303611755371, "global_step": 72571, "epoch": 431} {"train_loss": -8.939807891845703, "global_step": 72572, "epoch": 431} {"train_loss": -9.202226638793945, "global_step": 72573, "epoch": 431} {"train_loss": -9.312773704528809, "global_step": 72574, "epoch": 431} {"train_loss": -8.966930116925921, "global_step": 72575, "epoch": 431, "val_loss": 195448.796875} {"train_loss": -8.943811416625977, "global_step": 72576, "epoch": 432} {"train_loss": -8.971439361572266, "global_step": 72577, "epoch": 432} {"train_loss": -9.26104736328125, "global_step": 72578, "epoch": 432} {"train_loss": -8.931062698364258, "global_step": 72579, "epoch": 432} {"train_loss": -8.962423324584961, "global_step": 72580, "epoch": 432} {"train_loss": -9.16726016998291, "global_step": 72581, "epoch": 432} {"train_loss": -9.064876556396484, "global_step": 72582, "epoch": 432} {"train_loss": -8.753687858581543, "global_step": 72583, "epoch": 432} {"train_loss": -9.149064064025879, "global_step": 72584, "epoch": 432} {"train_loss": -8.851873397827148, "global_step": 72585, "epoch": 432} {"train_loss": -8.952655792236328, "global_step": 72586, "epoch": 432} {"train_loss": -9.066827774047852, "global_step": 72587, "epoch": 432} {"train_loss": -9.174079895019531, "global_step": 72588, "epoch": 432} {"train_loss": -8.94790267944336, "global_step": 72589, "epoch": 432} {"train_loss": -9.07343864440918, "global_step": 72590, "epoch": 432} {"train_loss": -9.129730224609375, "global_step": 72591, "epoch": 432} {"train_loss": -9.1696195602417, "global_step": 72592, "epoch": 432} {"train_loss": -9.116902351379395, "global_step": 72593, "epoch": 432} {"train_loss": -9.147878646850586, "global_step": 72594, "epoch": 432} {"train_loss": -9.143379211425781, "global_step": 72595, "epoch": 432} {"train_loss": -8.910877227783203, "global_step": 72596, "epoch": 432} {"train_loss": -9.202211380004883, "global_step": 72597, "epoch": 432} {"train_loss": -9.270624160766602, "global_step": 72598, "epoch": 432} {"train_loss": -8.989736557006836, "global_step": 72599, "epoch": 432} {"train_loss": -9.22791862487793, "global_step": 72600, "epoch": 432} {"train_loss": -8.942628860473633, "global_step": 72601, "epoch": 432} {"train_loss": -9.256780624389648, "global_step": 72602, "epoch": 432} {"train_loss": -9.168806076049805, "global_step": 72603, "epoch": 432} {"train_loss": -9.032313346862793, "global_step": 72604, "epoch": 432} {"train_loss": -9.056553840637207, "global_step": 72605, "epoch": 432} {"train_loss": -8.961767196655273, "global_step": 72606, "epoch": 432} {"train_loss": -9.137174606323242, "global_step": 72607, "epoch": 432} {"train_loss": -8.8173828125, "global_step": 72608, "epoch": 432} {"train_loss": -9.198431015014648, "global_step": 72609, "epoch": 432} {"train_loss": -9.143808364868164, "global_step": 72610, "epoch": 432} {"train_loss": -8.915721893310547, "global_step": 72611, "epoch": 432} {"train_loss": -8.986248016357422, "global_step": 72612, "epoch": 432} {"train_loss": -9.219819068908691, "global_step": 72613, "epoch": 432} {"train_loss": -9.047554016113281, "global_step": 72614, "epoch": 432} {"train_loss": -8.928163528442383, "global_step": 72615, "epoch": 432} {"train_loss": -8.79779052734375, "global_step": 72616, "epoch": 432} {"train_loss": -9.166792869567871, "global_step": 72617, "epoch": 432} {"train_loss": -8.99056339263916, "global_step": 72618, "epoch": 432} {"train_loss": -8.898906707763672, "global_step": 72619, "epoch": 432} {"train_loss": -9.004083633422852, "global_step": 72620, "epoch": 432} {"train_loss": -8.96739387512207, "global_step": 72621, "epoch": 432} {"train_loss": -8.977231979370117, "global_step": 72622, "epoch": 432} {"train_loss": -8.92538070678711, "global_step": 72623, "epoch": 432} {"train_loss": -9.098593711853027, "global_step": 72624, "epoch": 432} {"train_loss": -9.003828048706055, "global_step": 72625, "epoch": 432} {"train_loss": -8.83606243133545, "global_step": 72626, "epoch": 432} {"train_loss": -8.774157524108887, "global_step": 72627, "epoch": 432} {"train_loss": -8.734329223632812, "global_step": 72628, "epoch": 432} {"train_loss": -8.864818572998047, "global_step": 72629, "epoch": 432} {"train_loss": -8.776106834411621, "global_step": 72630, "epoch": 432} {"train_loss": -8.572649955749512, "global_step": 72631, "epoch": 432} {"train_loss": -9.064414978027344, "global_step": 72632, "epoch": 432} {"train_loss": -8.66819953918457, "global_step": 72633, "epoch": 432} {"train_loss": -8.811113357543945, "global_step": 72634, "epoch": 432} {"train_loss": -8.845209121704102, "global_step": 72635, "epoch": 432} {"train_loss": -8.762258529663086, "global_step": 72636, "epoch": 432} {"train_loss": -8.686542510986328, "global_step": 72637, "epoch": 432} {"train_loss": -8.614227294921875, "global_step": 72638, "epoch": 432} {"train_loss": -8.554656028747559, "global_step": 72639, "epoch": 432} {"train_loss": -8.727145195007324, "global_step": 72640, "epoch": 432} {"train_loss": -8.746829986572266, "global_step": 72641, "epoch": 432} {"train_loss": -8.68497085571289, "global_step": 72642, "epoch": 432} {"train_loss": -8.544294357299805, "global_step": 72643, "epoch": 432} {"train_loss": -8.739176750183105, "global_step": 72644, "epoch": 432} {"train_loss": -8.846491813659668, "global_step": 72645, "epoch": 432} {"train_loss": -8.837467193603516, "global_step": 72646, "epoch": 432} {"train_loss": -8.770170211791992, "global_step": 72647, "epoch": 432} {"train_loss": -8.918930053710938, "global_step": 72648, "epoch": 432} {"train_loss": -8.876901626586914, "global_step": 72649, "epoch": 432} {"train_loss": -8.724002838134766, "global_step": 72650, "epoch": 432} {"train_loss": -8.8438720703125, "global_step": 72651, "epoch": 432} {"train_loss": -8.862404823303223, "global_step": 72652, "epoch": 432} {"train_loss": -8.930756568908691, "global_step": 72653, "epoch": 432} {"train_loss": -8.83837604522705, "global_step": 72654, "epoch": 432} {"train_loss": -9.139944076538086, "global_step": 72655, "epoch": 432} {"train_loss": -9.081137657165527, "global_step": 72656, "epoch": 432} {"train_loss": -8.79810905456543, "global_step": 72657, "epoch": 432} {"train_loss": -9.130578994750977, "global_step": 72658, "epoch": 432} {"train_loss": -8.6331787109375, "global_step": 72659, "epoch": 432} {"train_loss": -9.082111358642578, "global_step": 72660, "epoch": 432} {"train_loss": -9.193408966064453, "global_step": 72661, "epoch": 432} {"train_loss": -9.180547714233398, "global_step": 72662, "epoch": 432} {"train_loss": -9.122496604919434, "global_step": 72663, "epoch": 432} {"train_loss": -8.941812515258789, "global_step": 72664, "epoch": 432} {"train_loss": -9.115671157836914, "global_step": 72665, "epoch": 432} {"train_loss": -9.344137191772461, "global_step": 72666, "epoch": 432} {"train_loss": -8.979459762573242, "global_step": 72667, "epoch": 432} {"train_loss": -9.16334342956543, "global_step": 72668, "epoch": 432} {"train_loss": -9.169607162475586, "global_step": 72669, "epoch": 432} {"train_loss": -9.221809387207031, "global_step": 72670, "epoch": 432} {"train_loss": -9.207520484924316, "global_step": 72671, "epoch": 432} {"train_loss": -8.74873161315918, "global_step": 72672, "epoch": 432} {"train_loss": -9.156901359558105, "global_step": 72673, "epoch": 432} {"train_loss": -9.02318000793457, "global_step": 72674, "epoch": 432} {"train_loss": -9.057540893554688, "global_step": 72675, "epoch": 432} {"train_loss": -8.890377044677734, "global_step": 72676, "epoch": 432} {"train_loss": -9.023920059204102, "global_step": 72677, "epoch": 432} {"train_loss": -8.528852462768555, "global_step": 72678, "epoch": 432} {"train_loss": -9.013327598571777, "global_step": 72679, "epoch": 432} {"train_loss": -8.88899040222168, "global_step": 72680, "epoch": 432} {"train_loss": -9.01823616027832, "global_step": 72681, "epoch": 432} {"train_loss": -8.930044174194336, "global_step": 72682, "epoch": 432} {"train_loss": -8.810192108154297, "global_step": 72683, "epoch": 432} {"train_loss": -8.836400985717773, "global_step": 72684, "epoch": 432} {"train_loss": -9.090603828430176, "global_step": 72685, "epoch": 432} {"train_loss": -8.461573600769043, "global_step": 72686, "epoch": 432} {"train_loss": -9.127058029174805, "global_step": 72687, "epoch": 432} {"train_loss": -9.11115837097168, "global_step": 72688, "epoch": 432} {"train_loss": -8.964987754821777, "global_step": 72689, "epoch": 432} {"train_loss": -8.948678970336914, "global_step": 72690, "epoch": 432} {"train_loss": -9.057304382324219, "global_step": 72691, "epoch": 432} {"train_loss": -8.917579650878906, "global_step": 72692, "epoch": 432} {"train_loss": -8.916460990905762, "global_step": 72693, "epoch": 432} {"train_loss": -8.787504196166992, "global_step": 72694, "epoch": 432} {"train_loss": -8.766645431518555, "global_step": 72695, "epoch": 432} {"train_loss": -9.014938354492188, "global_step": 72696, "epoch": 432} {"train_loss": -8.641157150268555, "global_step": 72697, "epoch": 432} {"train_loss": -8.84051513671875, "global_step": 72698, "epoch": 432} {"train_loss": -8.707144737243652, "global_step": 72699, "epoch": 432} {"train_loss": -8.858844757080078, "global_step": 72700, "epoch": 432} {"train_loss": -8.919425964355469, "global_step": 72701, "epoch": 432} {"train_loss": -8.771952629089355, "global_step": 72702, "epoch": 432} {"train_loss": -8.827607154846191, "global_step": 72703, "epoch": 432} {"train_loss": -9.033931732177734, "global_step": 72704, "epoch": 432} {"train_loss": -8.901849746704102, "global_step": 72705, "epoch": 432} {"train_loss": -9.117599487304688, "global_step": 72706, "epoch": 432} {"train_loss": -9.158594131469727, "global_step": 72707, "epoch": 432} {"train_loss": -9.170122146606445, "global_step": 72708, "epoch": 432} {"train_loss": -8.990571975708008, "global_step": 72709, "epoch": 432} {"train_loss": -9.155519485473633, "global_step": 72710, "epoch": 432} {"train_loss": -9.214762687683105, "global_step": 72711, "epoch": 432} {"train_loss": -9.23881721496582, "global_step": 72712, "epoch": 432} {"train_loss": -9.219472885131836, "global_step": 72713, "epoch": 432} {"train_loss": -9.227405548095703, "global_step": 72714, "epoch": 432} {"train_loss": -9.027223587036133, "global_step": 72715, "epoch": 432} {"train_loss": -9.051593780517578, "global_step": 72716, "epoch": 432} {"train_loss": -9.086660385131836, "global_step": 72717, "epoch": 432} {"train_loss": -8.92729663848877, "global_step": 72718, "epoch": 432} {"train_loss": -9.181994438171387, "global_step": 72719, "epoch": 432} {"train_loss": -9.077682495117188, "global_step": 72720, "epoch": 432} {"train_loss": -8.897621154785156, "global_step": 72721, "epoch": 432} {"train_loss": -9.063846588134766, "global_step": 72722, "epoch": 432} {"train_loss": -9.102239608764648, "global_step": 72723, "epoch": 432} {"train_loss": -8.798637390136719, "global_step": 72724, "epoch": 432} {"train_loss": -9.086297988891602, "global_step": 72725, "epoch": 432} {"train_loss": -8.962410926818848, "global_step": 72726, "epoch": 432} {"train_loss": -9.205570220947266, "global_step": 72727, "epoch": 432} {"train_loss": -8.916925430297852, "global_step": 72728, "epoch": 432} {"train_loss": -9.216075897216797, "global_step": 72729, "epoch": 432} {"train_loss": -8.930399894714355, "global_step": 72730, "epoch": 432} {"train_loss": -9.349457740783691, "global_step": 72731, "epoch": 432} {"train_loss": -8.966556549072266, "global_step": 72732, "epoch": 432} {"train_loss": -9.038313865661621, "global_step": 72733, "epoch": 432} {"train_loss": -8.882779121398926, "global_step": 72734, "epoch": 432} {"train_loss": -9.313728332519531, "global_step": 72735, "epoch": 432} {"train_loss": -9.330699920654297, "global_step": 72736, "epoch": 432} {"train_loss": -9.075016021728516, "global_step": 72737, "epoch": 432} {"train_loss": -9.072164535522461, "global_step": 72738, "epoch": 432} {"train_loss": -8.828911781311035, "global_step": 72739, "epoch": 432} {"train_loss": -9.119083404541016, "global_step": 72740, "epoch": 432} {"train_loss": -9.243141174316406, "global_step": 72741, "epoch": 432} {"train_loss": -9.168617248535156, "global_step": 72742, "epoch": 432} {"train_loss": -8.983815045583816, "global_step": 72743, "epoch": 432, "val_loss": 196635.1875} {"train_loss": -9.002724647521973, "global_step": 72744, "epoch": 433} {"train_loss": -8.987042427062988, "global_step": 72745, "epoch": 433} {"train_loss": -9.299163818359375, "global_step": 72746, "epoch": 433} {"train_loss": -8.703378677368164, "global_step": 72747, "epoch": 433} {"train_loss": -8.893829345703125, "global_step": 72748, "epoch": 433} {"train_loss": -8.931140899658203, "global_step": 72749, "epoch": 433} {"train_loss": -9.122557640075684, "global_step": 72750, "epoch": 433} {"train_loss": -9.01231575012207, "global_step": 72751, "epoch": 433} {"train_loss": -8.987403869628906, "global_step": 72752, "epoch": 433} {"train_loss": -9.136322021484375, "global_step": 72753, "epoch": 433} {"train_loss": -9.132347106933594, "global_step": 72754, "epoch": 433} {"train_loss": -9.057132720947266, "global_step": 72755, "epoch": 433} {"train_loss": -9.128355979919434, "global_step": 72756, "epoch": 433} {"train_loss": -9.246559143066406, "global_step": 72757, "epoch": 433} {"train_loss": -8.834237098693848, "global_step": 72758, "epoch": 433} {"train_loss": -8.852763175964355, "global_step": 72759, "epoch": 433} {"train_loss": -8.832698822021484, "global_step": 72760, "epoch": 433} {"train_loss": -8.666858673095703, "global_step": 72761, "epoch": 433} {"train_loss": -8.735162734985352, "global_step": 72762, "epoch": 433} {"train_loss": -8.883659362792969, "global_step": 72763, "epoch": 433} {"train_loss": -8.574463844299316, "global_step": 72764, "epoch": 433} {"train_loss": -8.661108016967773, "global_step": 72765, "epoch": 433} {"train_loss": -8.632423400878906, "global_step": 72766, "epoch": 433} {"train_loss": -8.797874450683594, "global_step": 72767, "epoch": 433} {"train_loss": -8.718729019165039, "global_step": 72768, "epoch": 433} {"train_loss": -8.818522453308105, "global_step": 72769, "epoch": 433} {"train_loss": -8.944951057434082, "global_step": 72770, "epoch": 433} {"train_loss": -8.635716438293457, "global_step": 72771, "epoch": 433} {"train_loss": -8.65174674987793, "global_step": 72772, "epoch": 433} {"train_loss": -8.861555099487305, "global_step": 72773, "epoch": 433} {"train_loss": -8.622352600097656, "global_step": 72774, "epoch": 433} {"train_loss": -8.909053802490234, "global_step": 72775, "epoch": 433} {"train_loss": -9.032088279724121, "global_step": 72776, "epoch": 433} {"train_loss": -9.020907402038574, "global_step": 72777, "epoch": 433} {"train_loss": -8.752010345458984, "global_step": 72778, "epoch": 433} {"train_loss": -9.075492858886719, "global_step": 72779, "epoch": 433} {"train_loss": -8.911114692687988, "global_step": 72780, "epoch": 433} {"train_loss": -8.904134750366211, "global_step": 72781, "epoch": 433} {"train_loss": -9.029428482055664, "global_step": 72782, "epoch": 433} {"train_loss": -8.936954498291016, "global_step": 72783, "epoch": 433} {"train_loss": -9.070619583129883, "global_step": 72784, "epoch": 433} {"train_loss": -9.052030563354492, "global_step": 72785, "epoch": 433} {"train_loss": -8.948086738586426, "global_step": 72786, "epoch": 433} {"train_loss": -9.022944450378418, "global_step": 72787, "epoch": 433} {"train_loss": -9.121551513671875, "global_step": 72788, "epoch": 433} {"train_loss": -9.052421569824219, "global_step": 72789, "epoch": 433} {"train_loss": -9.248254776000977, "global_step": 72790, "epoch": 433} {"train_loss": -9.217884063720703, "global_step": 72791, "epoch": 433} {"train_loss": -9.133848190307617, "global_step": 72792, "epoch": 433} {"train_loss": -8.999473571777344, "global_step": 72793, "epoch": 433} {"train_loss": -9.226831436157227, "global_step": 72794, "epoch": 433} {"train_loss": -9.094724655151367, "global_step": 72795, "epoch": 433} {"train_loss": -9.145721435546875, "global_step": 72796, "epoch": 433} {"train_loss": -9.04039192199707, "global_step": 72797, "epoch": 433} {"train_loss": -9.183015823364258, "global_step": 72798, "epoch": 433} {"train_loss": -8.94259262084961, "global_step": 72799, "epoch": 433} {"train_loss": -8.963384628295898, "global_step": 72800, "epoch": 433} {"train_loss": -9.01743221282959, "global_step": 72801, "epoch": 433} {"train_loss": -8.822629928588867, "global_step": 72802, "epoch": 433} {"train_loss": -8.99760913848877, "global_step": 72803, "epoch": 433} {"train_loss": -9.024345397949219, "global_step": 72804, "epoch": 433} {"train_loss": -8.78438663482666, "global_step": 72805, "epoch": 433} {"train_loss": -8.921296119689941, "global_step": 72806, "epoch": 433} {"train_loss": -8.990053176879883, "global_step": 72807, "epoch": 433} {"train_loss": -9.065540313720703, "global_step": 72808, "epoch": 433} {"train_loss": -9.252605438232422, "global_step": 72809, "epoch": 433} {"train_loss": -8.884961128234863, "global_step": 72810, "epoch": 433} {"train_loss": -9.015228271484375, "global_step": 72811, "epoch": 433} {"train_loss": -9.098020553588867, "global_step": 72812, "epoch": 433} {"train_loss": -8.676490783691406, "global_step": 72813, "epoch": 433} {"train_loss": -8.862852096557617, "global_step": 72814, "epoch": 433} {"train_loss": -9.027694702148438, "global_step": 72815, "epoch": 433} {"train_loss": -8.669118881225586, "global_step": 72816, "epoch": 433} {"train_loss": -8.945247650146484, "global_step": 72817, "epoch": 433} {"train_loss": -8.916158676147461, "global_step": 72818, "epoch": 433} {"train_loss": -9.197641372680664, "global_step": 72819, "epoch": 433} {"train_loss": -8.847782135009766, "global_step": 72820, "epoch": 433} {"train_loss": -9.039649963378906, "global_step": 72821, "epoch": 433} {"train_loss": -9.135936737060547, "global_step": 72822, "epoch": 433} {"train_loss": -8.79755973815918, "global_step": 72823, "epoch": 433} {"train_loss": -9.097414016723633, "global_step": 72824, "epoch": 433} {"train_loss": -9.045912742614746, "global_step": 72825, "epoch": 433} {"train_loss": -9.138538360595703, "global_step": 72826, "epoch": 433} {"train_loss": -9.035584449768066, "global_step": 72827, "epoch": 433} {"train_loss": -9.177236557006836, "global_step": 72828, "epoch": 433} {"train_loss": -9.343148231506348, "global_step": 72829, "epoch": 433} {"train_loss": -9.094380378723145, "global_step": 72830, "epoch": 433} {"train_loss": -9.125734329223633, "global_step": 72831, "epoch": 433} {"train_loss": -9.140846252441406, "global_step": 72832, "epoch": 433} {"train_loss": -9.27701187133789, "global_step": 72833, "epoch": 433} {"train_loss": -9.238195419311523, "global_step": 72834, "epoch": 433} {"train_loss": -9.1719970703125, "global_step": 72835, "epoch": 433} {"train_loss": -9.136788368225098, "global_step": 72836, "epoch": 433} {"train_loss": -9.232431411743164, "global_step": 72837, "epoch": 433} {"train_loss": -9.245141983032227, "global_step": 72838, "epoch": 433} {"train_loss": -9.212162017822266, "global_step": 72839, "epoch": 433} {"train_loss": -9.106873512268066, "global_step": 72840, "epoch": 433} {"train_loss": -9.078060150146484, "global_step": 72841, "epoch": 433} {"train_loss": -9.170037269592285, "global_step": 72842, "epoch": 433} {"train_loss": -9.120515823364258, "global_step": 72843, "epoch": 433} {"train_loss": -9.10161018371582, "global_step": 72844, "epoch": 433} {"train_loss": -9.030560493469238, "global_step": 72845, "epoch": 433} {"train_loss": -9.162056922912598, "global_step": 72846, "epoch": 433} {"train_loss": -8.985629081726074, "global_step": 72847, "epoch": 433} {"train_loss": -9.267854690551758, "global_step": 72848, "epoch": 433} {"train_loss": -8.977200508117676, "global_step": 72849, "epoch": 433} {"train_loss": -8.89449691772461, "global_step": 72850, "epoch": 433} {"train_loss": -8.787452697753906, "global_step": 72851, "epoch": 433} {"train_loss": -9.09001350402832, "global_step": 72852, "epoch": 433} {"train_loss": -8.999652862548828, "global_step": 72853, "epoch": 433} {"train_loss": -8.847593307495117, "global_step": 72854, "epoch": 433} {"train_loss": -9.04979133605957, "global_step": 72855, "epoch": 433} {"train_loss": -8.705141067504883, "global_step": 72856, "epoch": 433} {"train_loss": -8.861860275268555, "global_step": 72857, "epoch": 433} {"train_loss": -8.961186408996582, "global_step": 72858, "epoch": 433} {"train_loss": -8.900569915771484, "global_step": 72859, "epoch": 433} {"train_loss": -8.686426162719727, "global_step": 72860, "epoch": 433} {"train_loss": -8.855001449584961, "global_step": 72861, "epoch": 433} {"train_loss": -8.907293319702148, "global_step": 72862, "epoch": 433} {"train_loss": -8.969742774963379, "global_step": 72863, "epoch": 433} {"train_loss": -9.035270690917969, "global_step": 72864, "epoch": 433} {"train_loss": -8.906339645385742, "global_step": 72865, "epoch": 433} {"train_loss": -8.934835433959961, "global_step": 72866, "epoch": 433} {"train_loss": -8.786689758300781, "global_step": 72867, "epoch": 433} {"train_loss": -8.99738883972168, "global_step": 72868, "epoch": 433} {"train_loss": -8.852689743041992, "global_step": 72869, "epoch": 433} {"train_loss": -8.969026565551758, "global_step": 72870, "epoch": 433} {"train_loss": -8.798526763916016, "global_step": 72871, "epoch": 433} {"train_loss": -8.933614730834961, "global_step": 72872, "epoch": 433} {"train_loss": -8.898399353027344, "global_step": 72873, "epoch": 433} {"train_loss": -9.15418815612793, "global_step": 72874, "epoch": 433} {"train_loss": -9.191703796386719, "global_step": 72875, "epoch": 433} {"train_loss": -9.186956405639648, "global_step": 72876, "epoch": 433} {"train_loss": -9.258833885192871, "global_step": 72877, "epoch": 433} {"train_loss": -9.208196640014648, "global_step": 72878, "epoch": 433} {"train_loss": -8.924899101257324, "global_step": 72879, "epoch": 433} {"train_loss": -9.184226989746094, "global_step": 72880, "epoch": 433} {"train_loss": -9.054950714111328, "global_step": 72881, "epoch": 433} {"train_loss": -9.150657653808594, "global_step": 72882, "epoch": 433} {"train_loss": -9.038679122924805, "global_step": 72883, "epoch": 433} {"train_loss": -8.979257583618164, "global_step": 72884, "epoch": 433} {"train_loss": -9.136028289794922, "global_step": 72885, "epoch": 433} {"train_loss": -9.098876953125, "global_step": 72886, "epoch": 433} {"train_loss": -9.251911163330078, "global_step": 72887, "epoch": 433} {"train_loss": -9.178902626037598, "global_step": 72888, "epoch": 433} {"train_loss": -9.212299346923828, "global_step": 72889, "epoch": 433} {"train_loss": -9.118853569030762, "global_step": 72890, "epoch": 433} {"train_loss": -9.334090232849121, "global_step": 72891, "epoch": 433} {"train_loss": -9.161234855651855, "global_step": 72892, "epoch": 433} {"train_loss": -9.0811767578125, "global_step": 72893, "epoch": 433} {"train_loss": -9.293628692626953, "global_step": 72894, "epoch": 433} {"train_loss": -9.089536666870117, "global_step": 72895, "epoch": 433} {"train_loss": -9.399423599243164, "global_step": 72896, "epoch": 433} {"train_loss": -8.93612289428711, "global_step": 72897, "epoch": 433} {"train_loss": -9.064820289611816, "global_step": 72898, "epoch": 433} {"train_loss": -9.205972671508789, "global_step": 72899, "epoch": 433} {"train_loss": -9.105180740356445, "global_step": 72900, "epoch": 433} {"train_loss": -8.734090805053711, "global_step": 72901, "epoch": 433} {"train_loss": -8.8157958984375, "global_step": 72902, "epoch": 433} {"train_loss": -8.746587753295898, "global_step": 72903, "epoch": 433} {"train_loss": -8.377837181091309, "global_step": 72904, "epoch": 433} {"train_loss": -8.95034408569336, "global_step": 72905, "epoch": 433} {"train_loss": -8.258920669555664, "global_step": 72906, "epoch": 433} {"train_loss": -8.629983901977539, "global_step": 72907, "epoch": 433} {"train_loss": -8.826021194458008, "global_step": 72908, "epoch": 433} {"train_loss": -8.465278625488281, "global_step": 72909, "epoch": 433} {"train_loss": -8.678811073303223, "global_step": 72910, "epoch": 433} {"train_loss": -8.986931380771455, "global_step": 72911, "epoch": 433, "val_loss": 192444.125} {"train_loss": -8.61967658996582, "global_step": 72912, "epoch": 434} {"train_loss": -8.531356811523438, "global_step": 72913, "epoch": 434} {"train_loss": -8.719637870788574, "global_step": 72914, "epoch": 434} {"train_loss": -8.609724044799805, "global_step": 72915, "epoch": 434} {"train_loss": -8.724353790283203, "global_step": 72916, "epoch": 434} {"train_loss": -8.727594375610352, "global_step": 72917, "epoch": 434} {"train_loss": -8.93301010131836, "global_step": 72918, "epoch": 434} {"train_loss": -8.880302429199219, "global_step": 72919, "epoch": 434} {"train_loss": -8.994929313659668, "global_step": 72920, "epoch": 434} {"train_loss": -8.793196678161621, "global_step": 72921, "epoch": 434} {"train_loss": -8.798848152160645, "global_step": 72922, "epoch": 434} {"train_loss": -8.721210479736328, "global_step": 72923, "epoch": 434} {"train_loss": -8.737272262573242, "global_step": 72924, "epoch": 434} {"train_loss": -8.737640380859375, "global_step": 72925, "epoch": 434} {"train_loss": -8.871376037597656, "global_step": 72926, "epoch": 434} {"train_loss": -8.936912536621094, "global_step": 72927, "epoch": 434} {"train_loss": -9.036602973937988, "global_step": 72928, "epoch": 434} {"train_loss": -8.80683708190918, "global_step": 72929, "epoch": 434} {"train_loss": -8.89320182800293, "global_step": 72930, "epoch": 434} {"train_loss": -9.04887580871582, "global_step": 72931, "epoch": 434} {"train_loss": -8.975707054138184, "global_step": 72932, "epoch": 434} {"train_loss": -8.987564086914062, "global_step": 72933, "epoch": 434} {"train_loss": -9.00085163116455, "global_step": 72934, "epoch": 434} {"train_loss": -8.894550323486328, "global_step": 72935, "epoch": 434} {"train_loss": -8.949165344238281, "global_step": 72936, "epoch": 434} {"train_loss": -8.81995964050293, "global_step": 72937, "epoch": 434} {"train_loss": -9.08053970336914, "global_step": 72938, "epoch": 434} {"train_loss": -9.16609001159668, "global_step": 72939, "epoch": 434} {"train_loss": -9.083978652954102, "global_step": 72940, "epoch": 434} {"train_loss": -9.146967887878418, "global_step": 72941, "epoch": 434} {"train_loss": -8.982488632202148, "global_step": 72942, "epoch": 434} {"train_loss": -9.09174633026123, "global_step": 72943, "epoch": 434} {"train_loss": -9.159767150878906, "global_step": 72944, "epoch": 434} {"train_loss": -9.128133773803711, "global_step": 72945, "epoch": 434} {"train_loss": -9.169204711914062, "global_step": 72946, "epoch": 434} {"train_loss": -9.132431030273438, "global_step": 72947, "epoch": 434} {"train_loss": -9.124471664428711, "global_step": 72948, "epoch": 434} {"train_loss": -9.047796249389648, "global_step": 72949, "epoch": 434} {"train_loss": -9.269662857055664, "global_step": 72950, "epoch": 434} {"train_loss": -9.035520553588867, "global_step": 72951, "epoch": 434} {"train_loss": -9.241666793823242, "global_step": 72952, "epoch": 434} {"train_loss": -8.919655799865723, "global_step": 72953, "epoch": 434} {"train_loss": -9.000319480895996, "global_step": 72954, "epoch": 434} {"train_loss": -9.14068603515625, "global_step": 72955, "epoch": 434} {"train_loss": -9.233070373535156, "global_step": 72956, "epoch": 434} {"train_loss": -8.964700698852539, "global_step": 72957, "epoch": 434} {"train_loss": -9.166572570800781, "global_step": 72958, "epoch": 434} {"train_loss": -9.126766204833984, "global_step": 72959, "epoch": 434} {"train_loss": -8.88447380065918, "global_step": 72960, "epoch": 434} {"train_loss": -9.121139526367188, "global_step": 72961, "epoch": 434} {"train_loss": -8.845663070678711, "global_step": 72962, "epoch": 434} {"train_loss": -9.161310195922852, "global_step": 72963, "epoch": 434} {"train_loss": -9.116239547729492, "global_step": 72964, "epoch": 434} {"train_loss": -9.15963077545166, "global_step": 72965, "epoch": 434} {"train_loss": -8.951803207397461, "global_step": 72966, "epoch": 434} {"train_loss": -8.75157356262207, "global_step": 72967, "epoch": 434} {"train_loss": -9.028047561645508, "global_step": 72968, "epoch": 434} {"train_loss": -8.985084533691406, "global_step": 72969, "epoch": 434} {"train_loss": -8.617891311645508, "global_step": 72970, "epoch": 434} {"train_loss": -8.971478462219238, "global_step": 72971, "epoch": 434} {"train_loss": -8.85917854309082, "global_step": 72972, "epoch": 434} {"train_loss": -9.056559562683105, "global_step": 72973, "epoch": 434} {"train_loss": -9.145536422729492, "global_step": 72974, "epoch": 434} {"train_loss": -8.97182846069336, "global_step": 72975, "epoch": 434} {"train_loss": -9.002921104431152, "global_step": 72976, "epoch": 434} {"train_loss": -9.071968078613281, "global_step": 72977, "epoch": 434} {"train_loss": -9.119746208190918, "global_step": 72978, "epoch": 434} {"train_loss": -8.704532623291016, "global_step": 72979, "epoch": 434} {"train_loss": -8.840225219726562, "global_step": 72980, "epoch": 434} {"train_loss": -9.167058944702148, "global_step": 72981, "epoch": 434} {"train_loss": -9.259647369384766, "global_step": 72982, "epoch": 434} {"train_loss": -9.061656951904297, "global_step": 72983, "epoch": 434} {"train_loss": -8.927742958068848, "global_step": 72984, "epoch": 434} {"train_loss": -9.050296783447266, "global_step": 72985, "epoch": 434} {"train_loss": -9.062262535095215, "global_step": 72986, "epoch": 434} {"train_loss": -8.974061965942383, "global_step": 72987, "epoch": 434} {"train_loss": -8.82673454284668, "global_step": 72988, "epoch": 434} {"train_loss": -9.076114654541016, "global_step": 72989, "epoch": 434} {"train_loss": -9.006875991821289, "global_step": 72990, "epoch": 434} {"train_loss": -8.871252059936523, "global_step": 72991, "epoch": 434} {"train_loss": -8.840307235717773, "global_step": 72992, "epoch": 434} {"train_loss": -9.151899337768555, "global_step": 72993, "epoch": 434} {"train_loss": -8.972675323486328, "global_step": 72994, "epoch": 434} {"train_loss": -8.756858825683594, "global_step": 72995, "epoch": 434} {"train_loss": -8.73017692565918, "global_step": 72996, "epoch": 434} {"train_loss": -8.806804656982422, "global_step": 72997, "epoch": 434} {"train_loss": -8.953466415405273, "global_step": 72998, "epoch": 434} {"train_loss": -8.680191993713379, "global_step": 72999, "epoch": 434} {"train_loss": -8.390541076660156, "global_step": 73000, "epoch": 434} {"train_loss": -9.050341606140137, "global_step": 73001, "epoch": 434} {"train_loss": -8.954627990722656, "global_step": 73002, "epoch": 434} {"train_loss": -8.860676765441895, "global_step": 73003, "epoch": 434} {"train_loss": -8.539257049560547, "global_step": 73004, "epoch": 434} {"train_loss": -9.02829647064209, "global_step": 73005, "epoch": 434} {"train_loss": -9.060487747192383, "global_step": 73006, "epoch": 434} {"train_loss": -8.688448905944824, "global_step": 73007, "epoch": 434} {"train_loss": -8.902318954467773, "global_step": 73008, "epoch": 434} {"train_loss": -8.931020736694336, "global_step": 73009, "epoch": 434} {"train_loss": -9.093942642211914, "global_step": 73010, "epoch": 434} {"train_loss": -8.76881217956543, "global_step": 73011, "epoch": 434} {"train_loss": -8.775309562683105, "global_step": 73012, "epoch": 434} {"train_loss": -8.841143608093262, "global_step": 73013, "epoch": 434} {"train_loss": -8.779993057250977, "global_step": 73014, "epoch": 434} {"train_loss": -8.82720947265625, "global_step": 73015, "epoch": 434} {"train_loss": -8.792501449584961, "global_step": 73016, "epoch": 434} {"train_loss": -9.162858963012695, "global_step": 73017, "epoch": 434} {"train_loss": -8.676469802856445, "global_step": 73018, "epoch": 434} {"train_loss": -8.960630416870117, "global_step": 73019, "epoch": 434} {"train_loss": -9.057069778442383, "global_step": 73020, "epoch": 434} {"train_loss": -8.602642059326172, "global_step": 73021, "epoch": 434} {"train_loss": -8.935220718383789, "global_step": 73022, "epoch": 434} {"train_loss": -8.789467811584473, "global_step": 73023, "epoch": 434} {"train_loss": -9.121145248413086, "global_step": 73024, "epoch": 434} {"train_loss": -9.026485443115234, "global_step": 73025, "epoch": 434} {"train_loss": -9.107812881469727, "global_step": 73026, "epoch": 434} {"train_loss": -9.023599624633789, "global_step": 73027, "epoch": 434} {"train_loss": -9.142937660217285, "global_step": 73028, "epoch": 434} {"train_loss": -8.975444793701172, "global_step": 73029, "epoch": 434} {"train_loss": -9.03046703338623, "global_step": 73030, "epoch": 434} {"train_loss": -9.211265563964844, "global_step": 73031, "epoch": 434} {"train_loss": -9.081622123718262, "global_step": 73032, "epoch": 434} {"train_loss": -9.252487182617188, "global_step": 73033, "epoch": 434} {"train_loss": -9.155943870544434, "global_step": 73034, "epoch": 434} {"train_loss": -9.078956604003906, "global_step": 73035, "epoch": 434} {"train_loss": -8.970970153808594, "global_step": 73036, "epoch": 434} {"train_loss": -9.051698684692383, "global_step": 73037, "epoch": 434} {"train_loss": -9.109066009521484, "global_step": 73038, "epoch": 434} {"train_loss": -8.995173454284668, "global_step": 73039, "epoch": 434} {"train_loss": -9.162544250488281, "global_step": 73040, "epoch": 434} {"train_loss": -9.194530487060547, "global_step": 73041, "epoch": 434} {"train_loss": -9.163406372070312, "global_step": 73042, "epoch": 434} {"train_loss": -9.094879150390625, "global_step": 73043, "epoch": 434} {"train_loss": -9.199316024780273, "global_step": 73044, "epoch": 434} {"train_loss": -8.98383903503418, "global_step": 73045, "epoch": 434} {"train_loss": -9.087404251098633, "global_step": 73046, "epoch": 434} {"train_loss": -9.080509185791016, "global_step": 73047, "epoch": 434} {"train_loss": -9.266790390014648, "global_step": 73048, "epoch": 434} {"train_loss": -9.334060668945312, "global_step": 73049, "epoch": 434} {"train_loss": -9.065905570983887, "global_step": 73050, "epoch": 434} {"train_loss": -9.236946105957031, "global_step": 73051, "epoch": 434} {"train_loss": -9.423482894897461, "global_step": 73052, "epoch": 434} {"train_loss": -9.269064903259277, "global_step": 73053, "epoch": 434} {"train_loss": -9.164423942565918, "global_step": 73054, "epoch": 434} {"train_loss": -9.063760757446289, "global_step": 73055, "epoch": 434} {"train_loss": -9.199930191040039, "global_step": 73056, "epoch": 434} {"train_loss": -9.161348342895508, "global_step": 73057, "epoch": 434} {"train_loss": -9.044088363647461, "global_step": 73058, "epoch": 434} {"train_loss": -9.341462135314941, "global_step": 73059, "epoch": 434} {"train_loss": -8.835622787475586, "global_step": 73060, "epoch": 434} {"train_loss": -8.577460289001465, "global_step": 73061, "epoch": 434} {"train_loss": -8.907600402832031, "global_step": 73062, "epoch": 434} {"train_loss": -8.721220016479492, "global_step": 73063, "epoch": 434} {"train_loss": -8.966227531433105, "global_step": 73064, "epoch": 434} {"train_loss": -9.002254486083984, "global_step": 73065, "epoch": 434} {"train_loss": -8.920255661010742, "global_step": 73066, "epoch": 434} {"train_loss": -9.185186386108398, "global_step": 73067, "epoch": 434} {"train_loss": -9.055083274841309, "global_step": 73068, "epoch": 434} {"train_loss": -9.000585556030273, "global_step": 73069, "epoch": 434} {"train_loss": -9.155073165893555, "global_step": 73070, "epoch": 434} {"train_loss": -8.820228576660156, "global_step": 73071, "epoch": 434} {"train_loss": -9.169307708740234, "global_step": 73072, "epoch": 434} {"train_loss": -9.172730445861816, "global_step": 73073, "epoch": 434} {"train_loss": -8.980742454528809, "global_step": 73074, "epoch": 434} {"train_loss": -8.88630485534668, "global_step": 73075, "epoch": 434} {"train_loss": -9.178714752197266, "global_step": 73076, "epoch": 434} {"train_loss": -9.24222183227539, "global_step": 73077, "epoch": 434} {"train_loss": -9.028072357177734, "global_step": 73078, "epoch": 434} {"train_loss": -8.98631621542431, "global_step": 73079, "epoch": 434, "val_loss": 195806.1875} {"train_loss": -8.942988395690918, "global_step": 73080, "epoch": 435} {"train_loss": -8.812040328979492, "global_step": 73081, "epoch": 435} {"train_loss": -8.94561767578125, "global_step": 73082, "epoch": 435} {"train_loss": -8.896137237548828, "global_step": 73083, "epoch": 435} {"train_loss": -9.062799453735352, "global_step": 73084, "epoch": 435} {"train_loss": -8.953453063964844, "global_step": 73085, "epoch": 435} {"train_loss": -9.14167594909668, "global_step": 73086, "epoch": 435} {"train_loss": -8.724763870239258, "global_step": 73087, "epoch": 435} {"train_loss": -9.083145141601562, "global_step": 73088, "epoch": 435} {"train_loss": -8.682608604431152, "global_step": 73089, "epoch": 435} {"train_loss": -9.013956069946289, "global_step": 73090, "epoch": 435} {"train_loss": -9.019878387451172, "global_step": 73091, "epoch": 435} {"train_loss": -8.599873542785645, "global_step": 73092, "epoch": 435} {"train_loss": -8.845085144042969, "global_step": 73093, "epoch": 435} {"train_loss": -8.844613075256348, "global_step": 73094, "epoch": 435} {"train_loss": -8.817571640014648, "global_step": 73095, "epoch": 435} {"train_loss": -8.66553783416748, "global_step": 73096, "epoch": 435} {"train_loss": -8.726945877075195, "global_step": 73097, "epoch": 435} {"train_loss": -8.519329071044922, "global_step": 73098, "epoch": 435} {"train_loss": -8.962061882019043, "global_step": 73099, "epoch": 435} {"train_loss": -8.808202743530273, "global_step": 73100, "epoch": 435} {"train_loss": -8.741231918334961, "global_step": 73101, "epoch": 435} {"train_loss": -8.983171463012695, "global_step": 73102, "epoch": 435} {"train_loss": -9.030123710632324, "global_step": 73103, "epoch": 435} {"train_loss": -8.923864364624023, "global_step": 73104, "epoch": 435} {"train_loss": -9.044320106506348, "global_step": 73105, "epoch": 435} {"train_loss": -9.17160415649414, "global_step": 73106, "epoch": 435} {"train_loss": -9.064120292663574, "global_step": 73107, "epoch": 435} {"train_loss": -8.93110466003418, "global_step": 73108, "epoch": 435} {"train_loss": -9.060932159423828, "global_step": 73109, "epoch": 435} {"train_loss": -9.089999198913574, "global_step": 73110, "epoch": 435} {"train_loss": -9.356401443481445, "global_step": 73111, "epoch": 435} {"train_loss": -9.38438892364502, "global_step": 73112, "epoch": 435} {"train_loss": -9.15037727355957, "global_step": 73113, "epoch": 435} {"train_loss": -9.091331481933594, "global_step": 73114, "epoch": 435} {"train_loss": -9.209756851196289, "global_step": 73115, "epoch": 435} {"train_loss": -9.163322448730469, "global_step": 73116, "epoch": 435} {"train_loss": -9.031611442565918, "global_step": 73117, "epoch": 435} {"train_loss": -9.119580268859863, "global_step": 73118, "epoch": 435} {"train_loss": -9.32046890258789, "global_step": 73119, "epoch": 435} {"train_loss": -9.162771224975586, "global_step": 73120, "epoch": 435} {"train_loss": -9.228023529052734, "global_step": 73121, "epoch": 435} {"train_loss": -9.108448028564453, "global_step": 73122, "epoch": 435} {"train_loss": -9.020074844360352, "global_step": 73123, "epoch": 435} {"train_loss": -9.253228187561035, "global_step": 73124, "epoch": 435} {"train_loss": -9.163304328918457, "global_step": 73125, "epoch": 435} {"train_loss": -9.31399154663086, "global_step": 73126, "epoch": 435} {"train_loss": -9.411397933959961, "global_step": 73127, "epoch": 435} {"train_loss": -9.115452766418457, "global_step": 73128, "epoch": 435} {"train_loss": -9.255130767822266, "global_step": 73129, "epoch": 435} {"train_loss": -9.30270004272461, "global_step": 73130, "epoch": 435} {"train_loss": -9.104840278625488, "global_step": 73131, "epoch": 435} {"train_loss": -9.033873558044434, "global_step": 73132, "epoch": 435} {"train_loss": -9.185667991638184, "global_step": 73133, "epoch": 435} {"train_loss": -9.427700996398926, "global_step": 73134, "epoch": 435} {"train_loss": -9.181570053100586, "global_step": 73135, "epoch": 435} {"train_loss": -8.940566062927246, "global_step": 73136, "epoch": 435} {"train_loss": -9.30086898803711, "global_step": 73137, "epoch": 435} {"train_loss": -9.01060676574707, "global_step": 73138, "epoch": 435} {"train_loss": -8.83527946472168, "global_step": 73139, "epoch": 435} {"train_loss": -9.062262535095215, "global_step": 73140, "epoch": 435} {"train_loss": -9.180676460266113, "global_step": 73141, "epoch": 435} {"train_loss": -9.035350799560547, "global_step": 73142, "epoch": 435} {"train_loss": -8.883382797241211, "global_step": 73143, "epoch": 435} {"train_loss": -8.654647827148438, "global_step": 73144, "epoch": 435} {"train_loss": -9.189018249511719, "global_step": 73145, "epoch": 435} {"train_loss": -8.808749198913574, "global_step": 73146, "epoch": 435} {"train_loss": -9.046623229980469, "global_step": 73147, "epoch": 435} {"train_loss": -8.709661483764648, "global_step": 73148, "epoch": 435} {"train_loss": -8.80386734008789, "global_step": 73149, "epoch": 435} {"train_loss": -9.082122802734375, "global_step": 73150, "epoch": 435} {"train_loss": -9.107189178466797, "global_step": 73151, "epoch": 435} {"train_loss": -8.82491683959961, "global_step": 73152, "epoch": 435} {"train_loss": -8.768356323242188, "global_step": 73153, "epoch": 435} {"train_loss": -8.804084777832031, "global_step": 73154, "epoch": 435} {"train_loss": -9.097572326660156, "global_step": 73155, "epoch": 435} {"train_loss": -8.737176895141602, "global_step": 73156, "epoch": 435} {"train_loss": -8.644886016845703, "global_step": 73157, "epoch": 435} {"train_loss": -8.786604881286621, "global_step": 73158, "epoch": 435} {"train_loss": -8.601455688476562, "global_step": 73159, "epoch": 435} {"train_loss": -8.704187393188477, "global_step": 73160, "epoch": 435} {"train_loss": -8.854923248291016, "global_step": 73161, "epoch": 435} {"train_loss": -9.049186706542969, "global_step": 73162, "epoch": 435} {"train_loss": -8.793550491333008, "global_step": 73163, "epoch": 435} {"train_loss": -8.602729797363281, "global_step": 73164, "epoch": 435} {"train_loss": -9.013708114624023, "global_step": 73165, "epoch": 435} {"train_loss": -8.650531768798828, "global_step": 73166, "epoch": 435} {"train_loss": -8.892192840576172, "global_step": 73167, "epoch": 435} {"train_loss": -8.79501724243164, "global_step": 73168, "epoch": 435} {"train_loss": -9.176264762878418, "global_step": 73169, "epoch": 435} {"train_loss": -8.686996459960938, "global_step": 73170, "epoch": 435} {"train_loss": -8.722617149353027, "global_step": 73171, "epoch": 435} {"train_loss": -8.914443016052246, "global_step": 73172, "epoch": 435} {"train_loss": -8.881486892700195, "global_step": 73173, "epoch": 435} {"train_loss": -9.028345108032227, "global_step": 73174, "epoch": 435} {"train_loss": -8.914092063903809, "global_step": 73175, "epoch": 435} {"train_loss": -9.115875244140625, "global_step": 73176, "epoch": 435} {"train_loss": -8.968134880065918, "global_step": 73177, "epoch": 435} {"train_loss": -9.031867980957031, "global_step": 73178, "epoch": 435} {"train_loss": -8.940479278564453, "global_step": 73179, "epoch": 435} {"train_loss": -8.87583065032959, "global_step": 73180, "epoch": 435} {"train_loss": -8.868593215942383, "global_step": 73181, "epoch": 435} {"train_loss": -9.060724258422852, "global_step": 73182, "epoch": 435} {"train_loss": -9.151468276977539, "global_step": 73183, "epoch": 435} {"train_loss": -8.894899368286133, "global_step": 73184, "epoch": 435} {"train_loss": -9.18735408782959, "global_step": 73185, "epoch": 435} {"train_loss": -8.865808486938477, "global_step": 73186, "epoch": 435} {"train_loss": -8.968472480773926, "global_step": 73187, "epoch": 435} {"train_loss": -9.026748657226562, "global_step": 73188, "epoch": 435} {"train_loss": -8.98375129699707, "global_step": 73189, "epoch": 435} {"train_loss": -8.89826774597168, "global_step": 73190, "epoch": 435} {"train_loss": -9.15422248840332, "global_step": 73191, "epoch": 435} {"train_loss": -8.980875015258789, "global_step": 73192, "epoch": 435} {"train_loss": -8.896699905395508, "global_step": 73193, "epoch": 435} {"train_loss": -9.11669921875, "global_step": 73194, "epoch": 435} {"train_loss": -9.138909339904785, "global_step": 73195, "epoch": 435} {"train_loss": -9.066341400146484, "global_step": 73196, "epoch": 435} {"train_loss": -9.013561248779297, "global_step": 73197, "epoch": 435} {"train_loss": -9.003741264343262, "global_step": 73198, "epoch": 435} {"train_loss": -8.836995124816895, "global_step": 73199, "epoch": 435} {"train_loss": -8.920888900756836, "global_step": 73200, "epoch": 435} {"train_loss": -9.206863403320312, "global_step": 73201, "epoch": 435} {"train_loss": -9.202478408813477, "global_step": 73202, "epoch": 435} {"train_loss": -9.220914840698242, "global_step": 73203, "epoch": 435} {"train_loss": -9.103840827941895, "global_step": 73204, "epoch": 435} {"train_loss": -9.044851303100586, "global_step": 73205, "epoch": 435} {"train_loss": -9.090614318847656, "global_step": 73206, "epoch": 435} {"train_loss": -9.19057846069336, "global_step": 73207, "epoch": 435} {"train_loss": -9.09787368774414, "global_step": 73208, "epoch": 435} {"train_loss": -9.163187026977539, "global_step": 73209, "epoch": 435} {"train_loss": -9.20764446258545, "global_step": 73210, "epoch": 435} {"train_loss": -9.11151123046875, "global_step": 73211, "epoch": 435} {"train_loss": -9.047492980957031, "global_step": 73212, "epoch": 435} {"train_loss": -9.382037162780762, "global_step": 73213, "epoch": 435} {"train_loss": -8.909494400024414, "global_step": 73214, "epoch": 435} {"train_loss": -9.229928970336914, "global_step": 73215, "epoch": 435} {"train_loss": -8.844425201416016, "global_step": 73216, "epoch": 435} {"train_loss": -9.018057823181152, "global_step": 73217, "epoch": 435} {"train_loss": -8.558061599731445, "global_step": 73218, "epoch": 435} {"train_loss": -9.002046585083008, "global_step": 73219, "epoch": 435} {"train_loss": -8.619954109191895, "global_step": 73220, "epoch": 435} {"train_loss": -8.65831184387207, "global_step": 73221, "epoch": 435} {"train_loss": -8.93939208984375, "global_step": 73222, "epoch": 435} {"train_loss": -8.863201141357422, "global_step": 73223, "epoch": 435} {"train_loss": -9.061376571655273, "global_step": 73224, "epoch": 435} {"train_loss": -8.946792602539062, "global_step": 73225, "epoch": 435} {"train_loss": -9.163257598876953, "global_step": 73226, "epoch": 435} {"train_loss": -8.567721366882324, "global_step": 73227, "epoch": 435} {"train_loss": -8.842440605163574, "global_step": 73228, "epoch": 435} {"train_loss": -8.953679084777832, "global_step": 73229, "epoch": 435} {"train_loss": -8.993617057800293, "global_step": 73230, "epoch": 435} {"train_loss": -8.872278213500977, "global_step": 73231, "epoch": 435} {"train_loss": -8.981801986694336, "global_step": 73232, "epoch": 435} {"train_loss": -8.948817253112793, "global_step": 73233, "epoch": 435} {"train_loss": -8.865303993225098, "global_step": 73234, "epoch": 435} {"train_loss": -9.04987907409668, "global_step": 73235, "epoch": 435} {"train_loss": -9.074823379516602, "global_step": 73236, "epoch": 435} {"train_loss": -8.932780265808105, "global_step": 73237, "epoch": 435} {"train_loss": -9.059280395507812, "global_step": 73238, "epoch": 435} {"train_loss": -9.061256408691406, "global_step": 73239, "epoch": 435} {"train_loss": -8.933263778686523, "global_step": 73240, "epoch": 435} {"train_loss": -8.965120315551758, "global_step": 73241, "epoch": 435} {"train_loss": -9.007863998413086, "global_step": 73242, "epoch": 435} {"train_loss": -8.967966079711914, "global_step": 73243, "epoch": 435} {"train_loss": -8.949435234069824, "global_step": 73244, "epoch": 435} {"train_loss": -8.982464790344238, "global_step": 73245, "epoch": 435} {"train_loss": -9.295230865478516, "global_step": 73246, "epoch": 435} {"train_loss": -8.990099146252586, "global_step": 73247, "epoch": 435, "val_loss": 193535.109375, "train_action_mse_error": 4.300495147705078} {"train_loss": -8.947684288024902, "global_step": 73248, "epoch": 436} {"train_loss": -9.279951095581055, "global_step": 73249, "epoch": 436} {"train_loss": -8.983856201171875, "global_step": 73250, "epoch": 436} {"train_loss": -9.046966552734375, "global_step": 73251, "epoch": 436} {"train_loss": -9.257133483886719, "global_step": 73252, "epoch": 436} {"train_loss": -9.3326416015625, "global_step": 73253, "epoch": 436} {"train_loss": -9.170806884765625, "global_step": 73254, "epoch": 436} {"train_loss": -9.19236946105957, "global_step": 73255, "epoch": 436} {"train_loss": -9.244054794311523, "global_step": 73256, "epoch": 436} {"train_loss": -9.027911186218262, "global_step": 73257, "epoch": 436} {"train_loss": -9.1496000289917, "global_step": 73258, "epoch": 436} {"train_loss": -9.226960182189941, "global_step": 73259, "epoch": 436} {"train_loss": -9.188383102416992, "global_step": 73260, "epoch": 436} {"train_loss": -9.181303024291992, "global_step": 73261, "epoch": 436} {"train_loss": -9.129169464111328, "global_step": 73262, "epoch": 436} {"train_loss": -9.089479446411133, "global_step": 73263, "epoch": 436} {"train_loss": -9.060522079467773, "global_step": 73264, "epoch": 436} {"train_loss": -9.115673065185547, "global_step": 73265, "epoch": 436} {"train_loss": -9.063032150268555, "global_step": 73266, "epoch": 436} {"train_loss": -9.105422019958496, "global_step": 73267, "epoch": 436} {"train_loss": -9.02971076965332, "global_step": 73268, "epoch": 436} {"train_loss": -8.928078651428223, "global_step": 73269, "epoch": 436} {"train_loss": -9.03937816619873, "global_step": 73270, "epoch": 436} {"train_loss": -8.928069114685059, "global_step": 73271, "epoch": 436} {"train_loss": -9.148079872131348, "global_step": 73272, "epoch": 436} {"train_loss": -8.956432342529297, "global_step": 73273, "epoch": 436} {"train_loss": -9.267131805419922, "global_step": 73274, "epoch": 436} {"train_loss": -8.825043678283691, "global_step": 73275, "epoch": 436} {"train_loss": -9.255545616149902, "global_step": 73276, "epoch": 436} {"train_loss": -8.687963485717773, "global_step": 73277, "epoch": 436} {"train_loss": -8.992311477661133, "global_step": 73278, "epoch": 436} {"train_loss": -8.51469612121582, "global_step": 73279, "epoch": 436} {"train_loss": -8.969083786010742, "global_step": 73280, "epoch": 436} {"train_loss": -8.941666603088379, "global_step": 73281, "epoch": 436} {"train_loss": -8.971168518066406, "global_step": 73282, "epoch": 436} {"train_loss": -8.770553588867188, "global_step": 73283, "epoch": 436} {"train_loss": -8.821678161621094, "global_step": 73284, "epoch": 436} {"train_loss": -8.792494773864746, "global_step": 73285, "epoch": 436} {"train_loss": -8.948034286499023, "global_step": 73286, "epoch": 436} {"train_loss": -8.73310375213623, "global_step": 73287, "epoch": 436} {"train_loss": -8.66592025756836, "global_step": 73288, "epoch": 436} {"train_loss": -8.867206573486328, "global_step": 73289, "epoch": 436} {"train_loss": -8.663373947143555, "global_step": 73290, "epoch": 436} {"train_loss": -8.52712631225586, "global_step": 73291, "epoch": 436} {"train_loss": -8.651966094970703, "global_step": 73292, "epoch": 436} {"train_loss": -8.916694641113281, "global_step": 73293, "epoch": 436} {"train_loss": -8.58133316040039, "global_step": 73294, "epoch": 436} {"train_loss": -8.799567222595215, "global_step": 73295, "epoch": 436} {"train_loss": -9.01906967163086, "global_step": 73296, "epoch": 436} {"train_loss": -8.941391944885254, "global_step": 73297, "epoch": 436} {"train_loss": -8.826087951660156, "global_step": 73298, "epoch": 436} {"train_loss": -8.892793655395508, "global_step": 73299, "epoch": 436} {"train_loss": -9.09652328491211, "global_step": 73300, "epoch": 436} {"train_loss": -8.930337905883789, "global_step": 73301, "epoch": 436} {"train_loss": -9.062150955200195, "global_step": 73302, "epoch": 436} {"train_loss": -9.10464096069336, "global_step": 73303, "epoch": 436} {"train_loss": -9.163590431213379, "global_step": 73304, "epoch": 436} {"train_loss": -9.19333553314209, "global_step": 73305, "epoch": 436} {"train_loss": -9.045891761779785, "global_step": 73306, "epoch": 436} {"train_loss": -8.951565742492676, "global_step": 73307, "epoch": 436} {"train_loss": -9.206562995910645, "global_step": 73308, "epoch": 436} {"train_loss": -8.902106285095215, "global_step": 73309, "epoch": 436} {"train_loss": -9.023246765136719, "global_step": 73310, "epoch": 436} {"train_loss": -9.093451499938965, "global_step": 73311, "epoch": 436} {"train_loss": -9.082524299621582, "global_step": 73312, "epoch": 436} {"train_loss": -8.806892395019531, "global_step": 73313, "epoch": 436} {"train_loss": -9.165019989013672, "global_step": 73314, "epoch": 436} {"train_loss": -9.031421661376953, "global_step": 73315, "epoch": 436} {"train_loss": -9.130910873413086, "global_step": 73316, "epoch": 436} {"train_loss": -9.441679000854492, "global_step": 73317, "epoch": 436} {"train_loss": -9.018625259399414, "global_step": 73318, "epoch": 436} {"train_loss": -9.348899841308594, "global_step": 73319, "epoch": 436} {"train_loss": -9.102072715759277, "global_step": 73320, "epoch": 436} {"train_loss": -9.223091125488281, "global_step": 73321, "epoch": 436} {"train_loss": -9.265852928161621, "global_step": 73322, "epoch": 436} {"train_loss": -8.971895217895508, "global_step": 73323, "epoch": 436} {"train_loss": -9.05283260345459, "global_step": 73324, "epoch": 436} {"train_loss": -9.072225570678711, "global_step": 73325, "epoch": 436} {"train_loss": -9.143622398376465, "global_step": 73326, "epoch": 436} {"train_loss": -9.065381050109863, "global_step": 73327, "epoch": 436} {"train_loss": -9.201502799987793, "global_step": 73328, "epoch": 436} {"train_loss": -9.0264253616333, "global_step": 73329, "epoch": 436} {"train_loss": -9.113122940063477, "global_step": 73330, "epoch": 436} {"train_loss": -9.096542358398438, "global_step": 73331, "epoch": 436} {"train_loss": -9.204081535339355, "global_step": 73332, "epoch": 436} {"train_loss": -9.142997741699219, "global_step": 73333, "epoch": 436} {"train_loss": -9.283332824707031, "global_step": 73334, "epoch": 436} {"train_loss": -8.969956398010254, "global_step": 73335, "epoch": 436} {"train_loss": -9.129993438720703, "global_step": 73336, "epoch": 436} {"train_loss": -9.018975257873535, "global_step": 73337, "epoch": 436} {"train_loss": -8.98170280456543, "global_step": 73338, "epoch": 436} {"train_loss": -9.087784767150879, "global_step": 73339, "epoch": 436} {"train_loss": -9.05596923828125, "global_step": 73340, "epoch": 436} {"train_loss": -9.147676467895508, "global_step": 73341, "epoch": 436} {"train_loss": -8.868827819824219, "global_step": 73342, "epoch": 436} {"train_loss": -9.162418365478516, "global_step": 73343, "epoch": 436} {"train_loss": -9.044662475585938, "global_step": 73344, "epoch": 436} {"train_loss": -9.084470748901367, "global_step": 73345, "epoch": 436} {"train_loss": -8.972949981689453, "global_step": 73346, "epoch": 436} {"train_loss": -9.1799898147583, "global_step": 73347, "epoch": 436} {"train_loss": -8.873102188110352, "global_step": 73348, "epoch": 436} {"train_loss": -8.939668655395508, "global_step": 73349, "epoch": 436} {"train_loss": -9.119863510131836, "global_step": 73350, "epoch": 436} {"train_loss": -9.118789672851562, "global_step": 73351, "epoch": 436} {"train_loss": -8.907535552978516, "global_step": 73352, "epoch": 436} {"train_loss": -8.797008514404297, "global_step": 73353, "epoch": 436} {"train_loss": -9.043573379516602, "global_step": 73354, "epoch": 436} {"train_loss": -8.866252899169922, "global_step": 73355, "epoch": 436} {"train_loss": -9.155187606811523, "global_step": 73356, "epoch": 436} {"train_loss": -8.67348861694336, "global_step": 73357, "epoch": 436} {"train_loss": -8.812044143676758, "global_step": 73358, "epoch": 436} {"train_loss": -8.867021560668945, "global_step": 73359, "epoch": 436} {"train_loss": -8.836563110351562, "global_step": 73360, "epoch": 436} {"train_loss": -8.880762100219727, "global_step": 73361, "epoch": 436} {"train_loss": -9.09124755859375, "global_step": 73362, "epoch": 436} {"train_loss": -8.806877136230469, "global_step": 73363, "epoch": 436} {"train_loss": -8.883801460266113, "global_step": 73364, "epoch": 436} {"train_loss": -9.100807189941406, "global_step": 73365, "epoch": 436} {"train_loss": -9.142098426818848, "global_step": 73366, "epoch": 436} {"train_loss": -9.137100219726562, "global_step": 73367, "epoch": 436} {"train_loss": -8.96115493774414, "global_step": 73368, "epoch": 436} {"train_loss": -9.063055038452148, "global_step": 73369, "epoch": 436} {"train_loss": -9.127519607543945, "global_step": 73370, "epoch": 436} {"train_loss": -9.160209655761719, "global_step": 73371, "epoch": 436} {"train_loss": -9.062118530273438, "global_step": 73372, "epoch": 436} {"train_loss": -9.047409057617188, "global_step": 73373, "epoch": 436} {"train_loss": -9.010812759399414, "global_step": 73374, "epoch": 436} {"train_loss": -9.165282249450684, "global_step": 73375, "epoch": 436} {"train_loss": -8.851495742797852, "global_step": 73376, "epoch": 436} {"train_loss": -8.978019714355469, "global_step": 73377, "epoch": 436} {"train_loss": -8.931758880615234, "global_step": 73378, "epoch": 436} {"train_loss": -8.878300666809082, "global_step": 73379, "epoch": 436} {"train_loss": -9.061251640319824, "global_step": 73380, "epoch": 436} {"train_loss": -9.17611312866211, "global_step": 73381, "epoch": 436} {"train_loss": -9.057245254516602, "global_step": 73382, "epoch": 436} {"train_loss": -8.998573303222656, "global_step": 73383, "epoch": 436} {"train_loss": -9.071048736572266, "global_step": 73384, "epoch": 436} {"train_loss": -9.022613525390625, "global_step": 73385, "epoch": 436} {"train_loss": -8.878486633300781, "global_step": 73386, "epoch": 436} {"train_loss": -9.185891151428223, "global_step": 73387, "epoch": 436} {"train_loss": -9.040000915527344, "global_step": 73388, "epoch": 436} {"train_loss": -9.040075302124023, "global_step": 73389, "epoch": 436} {"train_loss": -9.119258880615234, "global_step": 73390, "epoch": 436} {"train_loss": -8.959392547607422, "global_step": 73391, "epoch": 436} {"train_loss": -9.200277328491211, "global_step": 73392, "epoch": 436} {"train_loss": -9.19741439819336, "global_step": 73393, "epoch": 436} {"train_loss": -9.27175235748291, "global_step": 73394, "epoch": 436} {"train_loss": -9.031890869140625, "global_step": 73395, "epoch": 436} {"train_loss": -9.273303985595703, "global_step": 73396, "epoch": 436} {"train_loss": -8.928537368774414, "global_step": 73397, "epoch": 436} {"train_loss": -9.093936920166016, "global_step": 73398, "epoch": 436} {"train_loss": -9.18394660949707, "global_step": 73399, "epoch": 436} {"train_loss": -8.445470809936523, "global_step": 73400, "epoch": 436} {"train_loss": -9.165231704711914, "global_step": 73401, "epoch": 436} {"train_loss": -9.007844924926758, "global_step": 73402, "epoch": 436} {"train_loss": -8.745878219604492, "global_step": 73403, "epoch": 436} {"train_loss": -8.94073486328125, "global_step": 73404, "epoch": 436} {"train_loss": -8.897455215454102, "global_step": 73405, "epoch": 436} {"train_loss": -8.938512802124023, "global_step": 73406, "epoch": 436} {"train_loss": -8.956180572509766, "global_step": 73407, "epoch": 436} {"train_loss": -8.769123077392578, "global_step": 73408, "epoch": 436} {"train_loss": -8.88974666595459, "global_step": 73409, "epoch": 436} {"train_loss": -8.937446594238281, "global_step": 73410, "epoch": 436} {"train_loss": -9.057568550109863, "global_step": 73411, "epoch": 436} {"train_loss": -8.856725692749023, "global_step": 73412, "epoch": 436} {"train_loss": -8.713409423828125, "global_step": 73413, "epoch": 436} {"train_loss": -8.983573913574219, "global_step": 73414, "epoch": 436} {"train_loss": -9.013503068969364, "global_step": 73415, "epoch": 436, "val_loss": 193260.015625} {"train_loss": -9.01851749420166, "global_step": 73416, "epoch": 437} {"train_loss": -8.950634002685547, "global_step": 73417, "epoch": 437} {"train_loss": -8.868217468261719, "global_step": 73418, "epoch": 437} {"train_loss": -8.734365463256836, "global_step": 73419, "epoch": 437} {"train_loss": -8.93307876586914, "global_step": 73420, "epoch": 437} {"train_loss": -9.023293495178223, "global_step": 73421, "epoch": 437} {"train_loss": -8.680034637451172, "global_step": 73422, "epoch": 437} {"train_loss": -8.849862098693848, "global_step": 73423, "epoch": 437} {"train_loss": -8.842687606811523, "global_step": 73424, "epoch": 437} {"train_loss": -8.863973617553711, "global_step": 73425, "epoch": 437} {"train_loss": -8.628715515136719, "global_step": 73426, "epoch": 437} {"train_loss": -8.951471328735352, "global_step": 73427, "epoch": 437} {"train_loss": -8.635759353637695, "global_step": 73428, "epoch": 437} {"train_loss": -8.637046813964844, "global_step": 73429, "epoch": 437} {"train_loss": -8.90573787689209, "global_step": 73430, "epoch": 437} {"train_loss": -8.995729446411133, "global_step": 73431, "epoch": 437} {"train_loss": -8.799345016479492, "global_step": 73432, "epoch": 437} {"train_loss": -9.029943466186523, "global_step": 73433, "epoch": 437} {"train_loss": -9.103090286254883, "global_step": 73434, "epoch": 437} {"train_loss": -8.837969779968262, "global_step": 73435, "epoch": 437} {"train_loss": -9.15349006652832, "global_step": 73436, "epoch": 437} {"train_loss": -9.113353729248047, "global_step": 73437, "epoch": 437} {"train_loss": -9.024600982666016, "global_step": 73438, "epoch": 437} {"train_loss": -8.940317153930664, "global_step": 73439, "epoch": 437} {"train_loss": -8.95765495300293, "global_step": 73440, "epoch": 437} {"train_loss": -9.003246307373047, "global_step": 73441, "epoch": 437} {"train_loss": -9.077252388000488, "global_step": 73442, "epoch": 437} {"train_loss": -9.186554908752441, "global_step": 73443, "epoch": 437} {"train_loss": -9.099893569946289, "global_step": 73444, "epoch": 437} {"train_loss": -9.110991477966309, "global_step": 73445, "epoch": 437} {"train_loss": -9.267755508422852, "global_step": 73446, "epoch": 437} {"train_loss": -8.975744247436523, "global_step": 73447, "epoch": 437} {"train_loss": -9.245344161987305, "global_step": 73448, "epoch": 437} {"train_loss": -8.989933013916016, "global_step": 73449, "epoch": 437} {"train_loss": -8.999940872192383, "global_step": 73450, "epoch": 437} {"train_loss": -9.364814758300781, "global_step": 73451, "epoch": 437} {"train_loss": -9.243307113647461, "global_step": 73452, "epoch": 437} {"train_loss": -9.11762809753418, "global_step": 73453, "epoch": 437} {"train_loss": -9.092885971069336, "global_step": 73454, "epoch": 437} {"train_loss": -9.085915565490723, "global_step": 73455, "epoch": 437} {"train_loss": -9.215620994567871, "global_step": 73456, "epoch": 437} {"train_loss": -9.259242057800293, "global_step": 73457, "epoch": 437} {"train_loss": -9.073083877563477, "global_step": 73458, "epoch": 437} {"train_loss": -9.151056289672852, "global_step": 73459, "epoch": 437} {"train_loss": -9.090710639953613, "global_step": 73460, "epoch": 437} {"train_loss": -9.332357406616211, "global_step": 73461, "epoch": 437} {"train_loss": -9.172544479370117, "global_step": 73462, "epoch": 437} {"train_loss": -9.040336608886719, "global_step": 73463, "epoch": 437} {"train_loss": -9.181229591369629, "global_step": 73464, "epoch": 437} {"train_loss": -9.180389404296875, "global_step": 73465, "epoch": 437} {"train_loss": -9.029886245727539, "global_step": 73466, "epoch": 437} {"train_loss": -9.070819854736328, "global_step": 73467, "epoch": 437} {"train_loss": -8.845404624938965, "global_step": 73468, "epoch": 437} {"train_loss": -8.818649291992188, "global_step": 73469, "epoch": 437} {"train_loss": -8.804071426391602, "global_step": 73470, "epoch": 437} {"train_loss": -8.775691986083984, "global_step": 73471, "epoch": 437} {"train_loss": -8.705878257751465, "global_step": 73472, "epoch": 437} {"train_loss": -9.067766189575195, "global_step": 73473, "epoch": 437} {"train_loss": -8.779074668884277, "global_step": 73474, "epoch": 437} {"train_loss": -8.973922729492188, "global_step": 73475, "epoch": 437} {"train_loss": -8.795886993408203, "global_step": 73476, "epoch": 437} {"train_loss": -8.974342346191406, "global_step": 73477, "epoch": 437} {"train_loss": -8.764239311218262, "global_step": 73478, "epoch": 437} {"train_loss": -8.934064865112305, "global_step": 73479, "epoch": 437} {"train_loss": -8.850458145141602, "global_step": 73480, "epoch": 437} {"train_loss": -9.012051582336426, "global_step": 73481, "epoch": 437} {"train_loss": -8.842645645141602, "global_step": 73482, "epoch": 437} {"train_loss": -9.129368782043457, "global_step": 73483, "epoch": 437} {"train_loss": -9.032392501831055, "global_step": 73484, "epoch": 437} {"train_loss": -9.137775421142578, "global_step": 73485, "epoch": 437} {"train_loss": -8.95094108581543, "global_step": 73486, "epoch": 437} {"train_loss": -8.97824478149414, "global_step": 73487, "epoch": 437} {"train_loss": -9.162068367004395, "global_step": 73488, "epoch": 437} {"train_loss": -9.083885192871094, "global_step": 73489, "epoch": 437} {"train_loss": -8.826218605041504, "global_step": 73490, "epoch": 437} {"train_loss": -9.044527053833008, "global_step": 73491, "epoch": 437} {"train_loss": -8.958470344543457, "global_step": 73492, "epoch": 437} {"train_loss": -9.112937927246094, "global_step": 73493, "epoch": 437} {"train_loss": -9.228946685791016, "global_step": 73494, "epoch": 437} {"train_loss": -8.930944442749023, "global_step": 73495, "epoch": 437} {"train_loss": -9.225812911987305, "global_step": 73496, "epoch": 437} {"train_loss": -9.228182792663574, "global_step": 73497, "epoch": 437} {"train_loss": -9.179274559020996, "global_step": 73498, "epoch": 437} {"train_loss": -9.0384521484375, "global_step": 73499, "epoch": 437} {"train_loss": -9.072593688964844, "global_step": 73500, "epoch": 437} {"train_loss": -9.199261665344238, "global_step": 73501, "epoch": 437} {"train_loss": -9.115367889404297, "global_step": 73502, "epoch": 437} {"train_loss": -9.24040412902832, "global_step": 73503, "epoch": 437} {"train_loss": -8.854194641113281, "global_step": 73504, "epoch": 437} {"train_loss": -9.151073455810547, "global_step": 73505, "epoch": 437} {"train_loss": -9.088769912719727, "global_step": 73506, "epoch": 437} {"train_loss": -8.923969268798828, "global_step": 73507, "epoch": 437} {"train_loss": -9.129373550415039, "global_step": 73508, "epoch": 437} {"train_loss": -8.85622787475586, "global_step": 73509, "epoch": 437} {"train_loss": -9.1285982131958, "global_step": 73510, "epoch": 437} {"train_loss": -8.951726913452148, "global_step": 73511, "epoch": 437} {"train_loss": -9.20263957977295, "global_step": 73512, "epoch": 437} {"train_loss": -9.162697792053223, "global_step": 73513, "epoch": 437} {"train_loss": -9.187238693237305, "global_step": 73514, "epoch": 437} {"train_loss": -9.485286712646484, "global_step": 73515, "epoch": 437} {"train_loss": -9.144306182861328, "global_step": 73516, "epoch": 437} {"train_loss": -9.255270004272461, "global_step": 73517, "epoch": 437} {"train_loss": -9.05459213256836, "global_step": 73518, "epoch": 437} {"train_loss": -8.71788215637207, "global_step": 73519, "epoch": 437} {"train_loss": -8.913803100585938, "global_step": 73520, "epoch": 437} {"train_loss": -9.039800643920898, "global_step": 73521, "epoch": 437} {"train_loss": -8.685708999633789, "global_step": 73522, "epoch": 437} {"train_loss": -9.286426544189453, "global_step": 73523, "epoch": 437} {"train_loss": -8.816286087036133, "global_step": 73524, "epoch": 437} {"train_loss": -9.232908248901367, "global_step": 73525, "epoch": 437} {"train_loss": -8.845792770385742, "global_step": 73526, "epoch": 437} {"train_loss": -9.00384521484375, "global_step": 73527, "epoch": 437} {"train_loss": -8.515192031860352, "global_step": 73528, "epoch": 437} {"train_loss": -8.880577087402344, "global_step": 73529, "epoch": 437} {"train_loss": -8.56215763092041, "global_step": 73530, "epoch": 437} {"train_loss": -8.69662857055664, "global_step": 73531, "epoch": 437} {"train_loss": -8.531295776367188, "global_step": 73532, "epoch": 437} {"train_loss": -8.75149917602539, "global_step": 73533, "epoch": 437} {"train_loss": -8.79367733001709, "global_step": 73534, "epoch": 437} {"train_loss": -8.785837173461914, "global_step": 73535, "epoch": 437} {"train_loss": -8.855473518371582, "global_step": 73536, "epoch": 437} {"train_loss": -8.821145057678223, "global_step": 73537, "epoch": 437} {"train_loss": -8.8935546875, "global_step": 73538, "epoch": 437} {"train_loss": -8.899007797241211, "global_step": 73539, "epoch": 437} {"train_loss": -9.184539794921875, "global_step": 73540, "epoch": 437} {"train_loss": -8.995711326599121, "global_step": 73541, "epoch": 437} {"train_loss": -8.956687927246094, "global_step": 73542, "epoch": 437} {"train_loss": -9.062335014343262, "global_step": 73543, "epoch": 437} {"train_loss": -9.086763381958008, "global_step": 73544, "epoch": 437} {"train_loss": -9.075885772705078, "global_step": 73545, "epoch": 437} {"train_loss": -9.201305389404297, "global_step": 73546, "epoch": 437} {"train_loss": -9.18284797668457, "global_step": 73547, "epoch": 437} {"train_loss": -9.15580940246582, "global_step": 73548, "epoch": 437} {"train_loss": -9.101533889770508, "global_step": 73549, "epoch": 437} {"train_loss": -9.023353576660156, "global_step": 73550, "epoch": 437} {"train_loss": -9.006736755371094, "global_step": 73551, "epoch": 437} {"train_loss": -9.079672813415527, "global_step": 73552, "epoch": 437} {"train_loss": -8.869071960449219, "global_step": 73553, "epoch": 437} {"train_loss": -9.148516654968262, "global_step": 73554, "epoch": 437} {"train_loss": -9.088386535644531, "global_step": 73555, "epoch": 437} {"train_loss": -9.135770797729492, "global_step": 73556, "epoch": 437} {"train_loss": -8.872964859008789, "global_step": 73557, "epoch": 437} {"train_loss": -8.714683532714844, "global_step": 73558, "epoch": 437} {"train_loss": -9.012552261352539, "global_step": 73559, "epoch": 437} {"train_loss": -9.32972526550293, "global_step": 73560, "epoch": 437} {"train_loss": -8.358369827270508, "global_step": 73561, "epoch": 437} {"train_loss": -9.286362648010254, "global_step": 73562, "epoch": 437} {"train_loss": -8.8555908203125, "global_step": 73563, "epoch": 437} {"train_loss": -9.058813095092773, "global_step": 73564, "epoch": 437} {"train_loss": -8.951942443847656, "global_step": 73565, "epoch": 437} {"train_loss": -8.944782257080078, "global_step": 73566, "epoch": 437} {"train_loss": -8.884967803955078, "global_step": 73567, "epoch": 437} {"train_loss": -8.619766235351562, "global_step": 73568, "epoch": 437} {"train_loss": -8.576745986938477, "global_step": 73569, "epoch": 437} {"train_loss": -8.857010841369629, "global_step": 73570, "epoch": 437} {"train_loss": -8.554227828979492, "global_step": 73571, "epoch": 437} {"train_loss": -9.070399284362793, "global_step": 73572, "epoch": 437} {"train_loss": -8.713391304016113, "global_step": 73573, "epoch": 437} {"train_loss": -8.996622085571289, "global_step": 73574, "epoch": 437} {"train_loss": -8.58621597290039, "global_step": 73575, "epoch": 437} {"train_loss": -9.075504302978516, "global_step": 73576, "epoch": 437} {"train_loss": -8.76161003112793, "global_step": 73577, "epoch": 437} {"train_loss": -9.06848430633545, "global_step": 73578, "epoch": 437} {"train_loss": -9.1121826171875, "global_step": 73579, "epoch": 437} {"train_loss": -9.008872032165527, "global_step": 73580, "epoch": 437} {"train_loss": -9.274179458618164, "global_step": 73581, "epoch": 437} {"train_loss": -8.918085098266602, "global_step": 73582, "epoch": 437} {"train_loss": -8.986593359992618, "global_step": 73583, "epoch": 437, "val_loss": 193757.9375} {"train_loss": -8.975622177124023, "global_step": 73584, "epoch": 438} {"train_loss": -9.168255805969238, "global_step": 73585, "epoch": 438} {"train_loss": -9.034656524658203, "global_step": 73586, "epoch": 438} {"train_loss": -9.164077758789062, "global_step": 73587, "epoch": 438} {"train_loss": -9.135751724243164, "global_step": 73588, "epoch": 438} {"train_loss": -9.12313175201416, "global_step": 73589, "epoch": 438} {"train_loss": -9.363700866699219, "global_step": 73590, "epoch": 438} {"train_loss": -9.315836906433105, "global_step": 73591, "epoch": 438} {"train_loss": -8.916540145874023, "global_step": 73592, "epoch": 438} {"train_loss": -9.241626739501953, "global_step": 73593, "epoch": 438} {"train_loss": -9.158013343811035, "global_step": 73594, "epoch": 438} {"train_loss": -9.20468521118164, "global_step": 73595, "epoch": 438} {"train_loss": -9.18336009979248, "global_step": 73596, "epoch": 438} {"train_loss": -9.390172004699707, "global_step": 73597, "epoch": 438} {"train_loss": -9.150857925415039, "global_step": 73598, "epoch": 438} {"train_loss": -9.189384460449219, "global_step": 73599, "epoch": 438} {"train_loss": -9.349197387695312, "global_step": 73600, "epoch": 438} {"train_loss": -9.101160049438477, "global_step": 73601, "epoch": 438} {"train_loss": -9.022686004638672, "global_step": 73602, "epoch": 438} {"train_loss": -9.00752067565918, "global_step": 73603, "epoch": 438} {"train_loss": -9.199089050292969, "global_step": 73604, "epoch": 438} {"train_loss": -8.832179069519043, "global_step": 73605, "epoch": 438} {"train_loss": -9.23134994506836, "global_step": 73606, "epoch": 438} {"train_loss": -9.081598281860352, "global_step": 73607, "epoch": 438} {"train_loss": -9.413520812988281, "global_step": 73608, "epoch": 438} {"train_loss": -8.831583976745605, "global_step": 73609, "epoch": 438} {"train_loss": -8.882916450500488, "global_step": 73610, "epoch": 438} {"train_loss": -9.090604782104492, "global_step": 73611, "epoch": 438} {"train_loss": -9.163904190063477, "global_step": 73612, "epoch": 438} {"train_loss": -9.328391075134277, "global_step": 73613, "epoch": 438} {"train_loss": -9.109684944152832, "global_step": 73614, "epoch": 438} {"train_loss": -9.080608367919922, "global_step": 73615, "epoch": 438} {"train_loss": -9.116186141967773, "global_step": 73616, "epoch": 438} {"train_loss": -9.378303527832031, "global_step": 73617, "epoch": 438} {"train_loss": -9.180248260498047, "global_step": 73618, "epoch": 438} {"train_loss": -9.231758117675781, "global_step": 73619, "epoch": 438} {"train_loss": -9.125263214111328, "global_step": 73620, "epoch": 438} {"train_loss": -9.207489013671875, "global_step": 73621, "epoch": 438} {"train_loss": -9.070870399475098, "global_step": 73622, "epoch": 438} {"train_loss": -9.015291213989258, "global_step": 73623, "epoch": 438} {"train_loss": -9.084799766540527, "global_step": 73624, "epoch": 438} {"train_loss": -9.01053524017334, "global_step": 73625, "epoch": 438} {"train_loss": -9.046114921569824, "global_step": 73626, "epoch": 438} {"train_loss": -8.729718208312988, "global_step": 73627, "epoch": 438} {"train_loss": -9.071651458740234, "global_step": 73628, "epoch": 438} {"train_loss": -8.923208236694336, "global_step": 73629, "epoch": 438} {"train_loss": -8.382131576538086, "global_step": 73630, "epoch": 438} {"train_loss": -8.624889373779297, "global_step": 73631, "epoch": 438} {"train_loss": -8.552573204040527, "global_step": 73632, "epoch": 438} {"train_loss": -8.63815975189209, "global_step": 73633, "epoch": 438} {"train_loss": -8.933140754699707, "global_step": 73634, "epoch": 438} {"train_loss": -8.848983764648438, "global_step": 73635, "epoch": 438} {"train_loss": -8.770379066467285, "global_step": 73636, "epoch": 438} {"train_loss": -8.7272367477417, "global_step": 73637, "epoch": 438} {"train_loss": -8.698675155639648, "global_step": 73638, "epoch": 438} {"train_loss": -8.669905662536621, "global_step": 73639, "epoch": 438} {"train_loss": -8.95181655883789, "global_step": 73640, "epoch": 438} {"train_loss": -8.687246322631836, "global_step": 73641, "epoch": 438} {"train_loss": -8.930915832519531, "global_step": 73642, "epoch": 438} {"train_loss": -8.782305717468262, "global_step": 73643, "epoch": 438} {"train_loss": -8.870494842529297, "global_step": 73644, "epoch": 438} {"train_loss": -8.969306945800781, "global_step": 73645, "epoch": 438} {"train_loss": -8.612425804138184, "global_step": 73646, "epoch": 438} {"train_loss": -8.732076644897461, "global_step": 73647, "epoch": 438} {"train_loss": -9.100956916809082, "global_step": 73648, "epoch": 438} {"train_loss": -8.662425994873047, "global_step": 73649, "epoch": 438} {"train_loss": -8.883447647094727, "global_step": 73650, "epoch": 438} {"train_loss": -9.001777648925781, "global_step": 73651, "epoch": 438} {"train_loss": -8.919249534606934, "global_step": 73652, "epoch": 438} {"train_loss": -9.011076927185059, "global_step": 73653, "epoch": 438} {"train_loss": -9.020745277404785, "global_step": 73654, "epoch": 438} {"train_loss": -9.02821159362793, "global_step": 73655, "epoch": 438} {"train_loss": -9.100034713745117, "global_step": 73656, "epoch": 438} {"train_loss": -9.169364929199219, "global_step": 73657, "epoch": 438} {"train_loss": -9.014280319213867, "global_step": 73658, "epoch": 438} {"train_loss": -9.09504508972168, "global_step": 73659, "epoch": 438} {"train_loss": -9.033140182495117, "global_step": 73660, "epoch": 438} {"train_loss": -8.994815826416016, "global_step": 73661, "epoch": 438} {"train_loss": -9.178715705871582, "global_step": 73662, "epoch": 438} {"train_loss": -8.70345687866211, "global_step": 73663, "epoch": 438} {"train_loss": -9.180269241333008, "global_step": 73664, "epoch": 438} {"train_loss": -8.812230110168457, "global_step": 73665, "epoch": 438} {"train_loss": -8.862476348876953, "global_step": 73666, "epoch": 438} {"train_loss": -9.045201301574707, "global_step": 73667, "epoch": 438} {"train_loss": -9.208334922790527, "global_step": 73668, "epoch": 438} {"train_loss": -9.220212936401367, "global_step": 73669, "epoch": 438} {"train_loss": -9.15944766998291, "global_step": 73670, "epoch": 438} {"train_loss": -9.1444730758667, "global_step": 73671, "epoch": 438} {"train_loss": -9.208101272583008, "global_step": 73672, "epoch": 438} {"train_loss": -9.076194763183594, "global_step": 73673, "epoch": 438} {"train_loss": -9.29899787902832, "global_step": 73674, "epoch": 438} {"train_loss": -9.029047012329102, "global_step": 73675, "epoch": 438} {"train_loss": -9.31751823425293, "global_step": 73676, "epoch": 438} {"train_loss": -8.942155838012695, "global_step": 73677, "epoch": 438} {"train_loss": -9.031227111816406, "global_step": 73678, "epoch": 438} {"train_loss": -9.218362808227539, "global_step": 73679, "epoch": 438} {"train_loss": -9.130645751953125, "global_step": 73680, "epoch": 438} {"train_loss": -8.682149887084961, "global_step": 73681, "epoch": 438} {"train_loss": -8.9738130569458, "global_step": 73682, "epoch": 438} {"train_loss": -8.902870178222656, "global_step": 73683, "epoch": 438} {"train_loss": -8.920634269714355, "global_step": 73684, "epoch": 438} {"train_loss": -9.13155746459961, "global_step": 73685, "epoch": 438} {"train_loss": -8.530248641967773, "global_step": 73686, "epoch": 438} {"train_loss": -8.915464401245117, "global_step": 73687, "epoch": 438} {"train_loss": -8.61361026763916, "global_step": 73688, "epoch": 438} {"train_loss": -8.967506408691406, "global_step": 73689, "epoch": 438} {"train_loss": -8.813995361328125, "global_step": 73690, "epoch": 438} {"train_loss": -8.776734352111816, "global_step": 73691, "epoch": 438} {"train_loss": -8.837085723876953, "global_step": 73692, "epoch": 438} {"train_loss": -8.815508842468262, "global_step": 73693, "epoch": 438} {"train_loss": -8.83975887298584, "global_step": 73694, "epoch": 438} {"train_loss": -8.823371887207031, "global_step": 73695, "epoch": 438} {"train_loss": -8.805837631225586, "global_step": 73696, "epoch": 438} {"train_loss": -8.96523666381836, "global_step": 73697, "epoch": 438} {"train_loss": -8.86497688293457, "global_step": 73698, "epoch": 438} {"train_loss": -8.974349975585938, "global_step": 73699, "epoch": 438} {"train_loss": -9.062708854675293, "global_step": 73700, "epoch": 438} {"train_loss": -8.906978607177734, "global_step": 73701, "epoch": 438} {"train_loss": -8.936180114746094, "global_step": 73702, "epoch": 438} {"train_loss": -9.005531311035156, "global_step": 73703, "epoch": 438} {"train_loss": -9.199819564819336, "global_step": 73704, "epoch": 438} {"train_loss": -9.17686653137207, "global_step": 73705, "epoch": 438} {"train_loss": -9.032127380371094, "global_step": 73706, "epoch": 438} {"train_loss": -8.992729187011719, "global_step": 73707, "epoch": 438} {"train_loss": -9.325284957885742, "global_step": 73708, "epoch": 438} {"train_loss": -9.17396354675293, "global_step": 73709, "epoch": 438} {"train_loss": -8.952096939086914, "global_step": 73710, "epoch": 438} {"train_loss": -9.37792682647705, "global_step": 73711, "epoch": 438} {"train_loss": -9.025863647460938, "global_step": 73712, "epoch": 438} {"train_loss": -9.197383880615234, "global_step": 73713, "epoch": 438} {"train_loss": -9.039872169494629, "global_step": 73714, "epoch": 438} {"train_loss": -9.260311126708984, "global_step": 73715, "epoch": 438} {"train_loss": -9.228160858154297, "global_step": 73716, "epoch": 438} {"train_loss": -8.983922958374023, "global_step": 73717, "epoch": 438} {"train_loss": -9.195351600646973, "global_step": 73718, "epoch": 438} {"train_loss": -9.109329223632812, "global_step": 73719, "epoch": 438} {"train_loss": -9.134471893310547, "global_step": 73720, "epoch": 438} {"train_loss": -9.077239990234375, "global_step": 73721, "epoch": 438} {"train_loss": -9.08028793334961, "global_step": 73722, "epoch": 438} {"train_loss": -9.075697898864746, "global_step": 73723, "epoch": 438} {"train_loss": -9.11953067779541, "global_step": 73724, "epoch": 438} {"train_loss": -8.969663619995117, "global_step": 73725, "epoch": 438} {"train_loss": -8.855091094970703, "global_step": 73726, "epoch": 438} {"train_loss": -8.805824279785156, "global_step": 73727, "epoch": 438} {"train_loss": -9.18960952758789, "global_step": 73728, "epoch": 438} {"train_loss": -9.17142391204834, "global_step": 73729, "epoch": 438} {"train_loss": -9.049038887023926, "global_step": 73730, "epoch": 438} {"train_loss": -9.041342735290527, "global_step": 73731, "epoch": 438} {"train_loss": -9.163809776306152, "global_step": 73732, "epoch": 438} {"train_loss": -8.924055099487305, "global_step": 73733, "epoch": 438} {"train_loss": -8.708932876586914, "global_step": 73734, "epoch": 438} {"train_loss": -9.020224571228027, "global_step": 73735, "epoch": 438} {"train_loss": -8.381067276000977, "global_step": 73736, "epoch": 438} {"train_loss": -9.056862831115723, "global_step": 73737, "epoch": 438} {"train_loss": -8.785063743591309, "global_step": 73738, "epoch": 438} {"train_loss": -8.881020545959473, "global_step": 73739, "epoch": 438} {"train_loss": -8.756452560424805, "global_step": 73740, "epoch": 438} {"train_loss": -9.040033340454102, "global_step": 73741, "epoch": 438} {"train_loss": -9.059013366699219, "global_step": 73742, "epoch": 438} {"train_loss": -8.890149116516113, "global_step": 73743, "epoch": 438} {"train_loss": -9.039773941040039, "global_step": 73744, "epoch": 438} {"train_loss": -9.040498733520508, "global_step": 73745, "epoch": 438} {"train_loss": -9.003960609436035, "global_step": 73746, "epoch": 438} {"train_loss": -9.164058685302734, "global_step": 73747, "epoch": 438} {"train_loss": -9.248296737670898, "global_step": 73748, "epoch": 438} {"train_loss": -8.909070014953613, "global_step": 73749, "epoch": 438} {"train_loss": -8.842704772949219, "global_step": 73750, "epoch": 438} {"train_loss": -9.009920216742016, "global_step": 73751, "epoch": 438, "val_loss": 194636.265625} {"train_loss": -8.83775806427002, "global_step": 73752, "epoch": 439} {"train_loss": -8.871978759765625, "global_step": 73753, "epoch": 439} {"train_loss": -8.88161849975586, "global_step": 73754, "epoch": 439} {"train_loss": -8.953969955444336, "global_step": 73755, "epoch": 439} {"train_loss": -8.871559143066406, "global_step": 73756, "epoch": 439} {"train_loss": -8.829345703125, "global_step": 73757, "epoch": 439} {"train_loss": -8.960541725158691, "global_step": 73758, "epoch": 439} {"train_loss": -8.988983154296875, "global_step": 73759, "epoch": 439} {"train_loss": -8.568140983581543, "global_step": 73760, "epoch": 439} {"train_loss": -8.800076484680176, "global_step": 73761, "epoch": 439} {"train_loss": -8.915812492370605, "global_step": 73762, "epoch": 439} {"train_loss": -8.80136489868164, "global_step": 73763, "epoch": 439} {"train_loss": -9.01374626159668, "global_step": 73764, "epoch": 439} {"train_loss": -8.502886772155762, "global_step": 73765, "epoch": 439} {"train_loss": -9.07841682434082, "global_step": 73766, "epoch": 439} {"train_loss": -8.811860084533691, "global_step": 73767, "epoch": 439} {"train_loss": -8.866939544677734, "global_step": 73768, "epoch": 439} {"train_loss": -9.082599639892578, "global_step": 73769, "epoch": 439} {"train_loss": -9.034394264221191, "global_step": 73770, "epoch": 439} {"train_loss": -8.932312965393066, "global_step": 73771, "epoch": 439} {"train_loss": -9.119799613952637, "global_step": 73772, "epoch": 439} {"train_loss": -8.919240951538086, "global_step": 73773, "epoch": 439} {"train_loss": -9.08712100982666, "global_step": 73774, "epoch": 439} {"train_loss": -9.188672065734863, "global_step": 73775, "epoch": 439} {"train_loss": -9.140332221984863, "global_step": 73776, "epoch": 439} {"train_loss": -8.98826789855957, "global_step": 73777, "epoch": 439} {"train_loss": -9.095808029174805, "global_step": 73778, "epoch": 439} {"train_loss": -8.913339614868164, "global_step": 73779, "epoch": 439} {"train_loss": -9.041853904724121, "global_step": 73780, "epoch": 439} {"train_loss": -9.23790454864502, "global_step": 73781, "epoch": 439} {"train_loss": -9.048873901367188, "global_step": 73782, "epoch": 439} {"train_loss": -8.859171867370605, "global_step": 73783, "epoch": 439} {"train_loss": -9.184599876403809, "global_step": 73784, "epoch": 439} {"train_loss": -9.064332962036133, "global_step": 73785, "epoch": 439} {"train_loss": -9.014425277709961, "global_step": 73786, "epoch": 439} {"train_loss": -8.836923599243164, "global_step": 73787, "epoch": 439} {"train_loss": -8.64634895324707, "global_step": 73788, "epoch": 439} {"train_loss": -8.981062889099121, "global_step": 73789, "epoch": 439} {"train_loss": -8.86098861694336, "global_step": 73790, "epoch": 439} {"train_loss": -8.99954605102539, "global_step": 73791, "epoch": 439} {"train_loss": -9.123661994934082, "global_step": 73792, "epoch": 439} {"train_loss": -8.988354682922363, "global_step": 73793, "epoch": 439} {"train_loss": -8.885176658630371, "global_step": 73794, "epoch": 439} {"train_loss": -8.993818283081055, "global_step": 73795, "epoch": 439} {"train_loss": -9.11836051940918, "global_step": 73796, "epoch": 439} {"train_loss": -8.94512939453125, "global_step": 73797, "epoch": 439} {"train_loss": -9.16827392578125, "global_step": 73798, "epoch": 439} {"train_loss": -8.891661643981934, "global_step": 73799, "epoch": 439} {"train_loss": -9.19306468963623, "global_step": 73800, "epoch": 439} {"train_loss": -9.196752548217773, "global_step": 73801, "epoch": 439} {"train_loss": -8.876655578613281, "global_step": 73802, "epoch": 439} {"train_loss": -9.16157054901123, "global_step": 73803, "epoch": 439} {"train_loss": -9.014436721801758, "global_step": 73804, "epoch": 439} {"train_loss": -8.993448257446289, "global_step": 73805, "epoch": 439} {"train_loss": -8.796395301818848, "global_step": 73806, "epoch": 439} {"train_loss": -9.145698547363281, "global_step": 73807, "epoch": 439} {"train_loss": -8.692813873291016, "global_step": 73808, "epoch": 439} {"train_loss": -8.918184280395508, "global_step": 73809, "epoch": 439} {"train_loss": -8.537073135375977, "global_step": 73810, "epoch": 439} {"train_loss": -9.105037689208984, "global_step": 73811, "epoch": 439} {"train_loss": -8.67626953125, "global_step": 73812, "epoch": 439} {"train_loss": -8.619619369506836, "global_step": 73813, "epoch": 439} {"train_loss": -8.721210479736328, "global_step": 73814, "epoch": 439} {"train_loss": -8.808194160461426, "global_step": 73815, "epoch": 439} {"train_loss": -8.397140502929688, "global_step": 73816, "epoch": 439} {"train_loss": -8.766860961914062, "global_step": 73817, "epoch": 439} {"train_loss": -8.67660903930664, "global_step": 73818, "epoch": 439} {"train_loss": -8.789227485656738, "global_step": 73819, "epoch": 439} {"train_loss": -8.748099327087402, "global_step": 73820, "epoch": 439} {"train_loss": -8.92339038848877, "global_step": 73821, "epoch": 439} {"train_loss": -8.693065643310547, "global_step": 73822, "epoch": 439} {"train_loss": -8.731945991516113, "global_step": 73823, "epoch": 439} {"train_loss": -8.890361785888672, "global_step": 73824, "epoch": 439} {"train_loss": -8.900153160095215, "global_step": 73825, "epoch": 439} {"train_loss": -8.963760375976562, "global_step": 73826, "epoch": 439} {"train_loss": -9.01489543914795, "global_step": 73827, "epoch": 439} {"train_loss": -9.105875015258789, "global_step": 73828, "epoch": 439} {"train_loss": -8.943004608154297, "global_step": 73829, "epoch": 439} {"train_loss": -9.114433288574219, "global_step": 73830, "epoch": 439} {"train_loss": -9.074661254882812, "global_step": 73831, "epoch": 439} {"train_loss": -8.695561408996582, "global_step": 73832, "epoch": 439} {"train_loss": -8.95186710357666, "global_step": 73833, "epoch": 439} {"train_loss": -9.111496925354004, "global_step": 73834, "epoch": 439} {"train_loss": -8.953388214111328, "global_step": 73835, "epoch": 439} {"train_loss": -9.010242462158203, "global_step": 73836, "epoch": 439} {"train_loss": -9.128994941711426, "global_step": 73837, "epoch": 439} {"train_loss": -8.991060256958008, "global_step": 73838, "epoch": 439} {"train_loss": -9.016919136047363, "global_step": 73839, "epoch": 439} {"train_loss": -9.116047859191895, "global_step": 73840, "epoch": 439} {"train_loss": -8.961418151855469, "global_step": 73841, "epoch": 439} {"train_loss": -9.073461532592773, "global_step": 73842, "epoch": 439} {"train_loss": -9.079545021057129, "global_step": 73843, "epoch": 439} {"train_loss": -9.221590042114258, "global_step": 73844, "epoch": 439} {"train_loss": -9.2783784866333, "global_step": 73845, "epoch": 439} {"train_loss": -9.067437171936035, "global_step": 73846, "epoch": 439} {"train_loss": -9.00728988647461, "global_step": 73847, "epoch": 439} {"train_loss": -9.126171112060547, "global_step": 73848, "epoch": 439} {"train_loss": -9.088829040527344, "global_step": 73849, "epoch": 439} {"train_loss": -9.027851104736328, "global_step": 73850, "epoch": 439} {"train_loss": -8.715330123901367, "global_step": 73851, "epoch": 439} {"train_loss": -9.331388473510742, "global_step": 73852, "epoch": 439} {"train_loss": -9.01240348815918, "global_step": 73853, "epoch": 439} {"train_loss": -9.091729164123535, "global_step": 73854, "epoch": 439} {"train_loss": -9.068113327026367, "global_step": 73855, "epoch": 439} {"train_loss": -9.043519973754883, "global_step": 73856, "epoch": 439} {"train_loss": -8.883749008178711, "global_step": 73857, "epoch": 439} {"train_loss": -9.073263168334961, "global_step": 73858, "epoch": 439} {"train_loss": -9.143159866333008, "global_step": 73859, "epoch": 439} {"train_loss": -9.227405548095703, "global_step": 73860, "epoch": 439} {"train_loss": -8.86532974243164, "global_step": 73861, "epoch": 439} {"train_loss": -9.2891206741333, "global_step": 73862, "epoch": 439} {"train_loss": -9.20396614074707, "global_step": 73863, "epoch": 439} {"train_loss": -9.130500793457031, "global_step": 73864, "epoch": 439} {"train_loss": -9.153522491455078, "global_step": 73865, "epoch": 439} {"train_loss": -9.03622817993164, "global_step": 73866, "epoch": 439} {"train_loss": -9.268762588500977, "global_step": 73867, "epoch": 439} {"train_loss": -8.891891479492188, "global_step": 73868, "epoch": 439} {"train_loss": -9.08241081237793, "global_step": 73869, "epoch": 439} {"train_loss": -9.013212203979492, "global_step": 73870, "epoch": 439} {"train_loss": -9.081855773925781, "global_step": 73871, "epoch": 439} {"train_loss": -9.030728340148926, "global_step": 73872, "epoch": 439} {"train_loss": -8.994505882263184, "global_step": 73873, "epoch": 439} {"train_loss": -9.037131309509277, "global_step": 73874, "epoch": 439} {"train_loss": -9.04246711730957, "global_step": 73875, "epoch": 439} {"train_loss": -8.933289527893066, "global_step": 73876, "epoch": 439} {"train_loss": -8.979329109191895, "global_step": 73877, "epoch": 439} {"train_loss": -8.97162914276123, "global_step": 73878, "epoch": 439} {"train_loss": -9.223260879516602, "global_step": 73879, "epoch": 439} {"train_loss": -8.849287033081055, "global_step": 73880, "epoch": 439} {"train_loss": -9.171894073486328, "global_step": 73881, "epoch": 439} {"train_loss": -9.25051212310791, "global_step": 73882, "epoch": 439} {"train_loss": -8.531925201416016, "global_step": 73883, "epoch": 439} {"train_loss": -9.166633605957031, "global_step": 73884, "epoch": 439} {"train_loss": -8.724242210388184, "global_step": 73885, "epoch": 439} {"train_loss": -9.169726371765137, "global_step": 73886, "epoch": 439} {"train_loss": -8.940811157226562, "global_step": 73887, "epoch": 439} {"train_loss": -9.017779350280762, "global_step": 73888, "epoch": 439} {"train_loss": -8.887591361999512, "global_step": 73889, "epoch": 439} {"train_loss": -8.906991958618164, "global_step": 73890, "epoch": 439} {"train_loss": -9.1953125, "global_step": 73891, "epoch": 439} {"train_loss": -8.913408279418945, "global_step": 73892, "epoch": 439} {"train_loss": -9.03219985961914, "global_step": 73893, "epoch": 439} {"train_loss": -9.238039016723633, "global_step": 73894, "epoch": 439} {"train_loss": -9.042396545410156, "global_step": 73895, "epoch": 439} {"train_loss": -9.047647476196289, "global_step": 73896, "epoch": 439} {"train_loss": -8.86076545715332, "global_step": 73897, "epoch": 439} {"train_loss": -8.839683532714844, "global_step": 73898, "epoch": 439} {"train_loss": -8.888216018676758, "global_step": 73899, "epoch": 439} {"train_loss": -8.939779281616211, "global_step": 73900, "epoch": 439} {"train_loss": -8.894601821899414, "global_step": 73901, "epoch": 439} {"train_loss": -9.116641998291016, "global_step": 73902, "epoch": 439} {"train_loss": -9.097748756408691, "global_step": 73903, "epoch": 439} {"train_loss": -8.988090515136719, "global_step": 73904, "epoch": 439} {"train_loss": -8.757696151733398, "global_step": 73905, "epoch": 439} {"train_loss": -9.164344787597656, "global_step": 73906, "epoch": 439} {"train_loss": -8.75535774230957, "global_step": 73907, "epoch": 439} {"train_loss": -8.89885139465332, "global_step": 73908, "epoch": 439} {"train_loss": -8.66024398803711, "global_step": 73909, "epoch": 439} {"train_loss": -9.074867248535156, "global_step": 73910, "epoch": 439} {"train_loss": -8.873309135437012, "global_step": 73911, "epoch": 439} {"train_loss": -9.024696350097656, "global_step": 73912, "epoch": 439} {"train_loss": -9.01187515258789, "global_step": 73913, "epoch": 439} {"train_loss": -8.926457405090332, "global_step": 73914, "epoch": 439} {"train_loss": -8.915125846862793, "global_step": 73915, "epoch": 439} {"train_loss": -8.880643844604492, "global_step": 73916, "epoch": 439} {"train_loss": -8.841769218444824, "global_step": 73917, "epoch": 439} {"train_loss": -8.992883682250977, "global_step": 73918, "epoch": 439} {"train_loss": -8.97256388550713, "global_step": 73919, "epoch": 439, "val_loss": 194933.0625} {"train_loss": -8.822795867919922, "global_step": 73920, "epoch": 440} {"train_loss": -8.847461700439453, "global_step": 73921, "epoch": 440} {"train_loss": -9.228836059570312, "global_step": 73922, "epoch": 440} {"train_loss": -8.886670112609863, "global_step": 73923, "epoch": 440} {"train_loss": -8.993807792663574, "global_step": 73924, "epoch": 440} {"train_loss": -9.065932273864746, "global_step": 73925, "epoch": 440} {"train_loss": -9.139873504638672, "global_step": 73926, "epoch": 440} {"train_loss": -8.94847583770752, "global_step": 73927, "epoch": 440} {"train_loss": -9.042847633361816, "global_step": 73928, "epoch": 440} {"train_loss": -8.747127532958984, "global_step": 73929, "epoch": 440} {"train_loss": -9.13098430633545, "global_step": 73930, "epoch": 440} {"train_loss": -8.904746055603027, "global_step": 73931, "epoch": 440} {"train_loss": -9.062762260437012, "global_step": 73932, "epoch": 440} {"train_loss": -8.976310729980469, "global_step": 73933, "epoch": 440} {"train_loss": -8.96224594116211, "global_step": 73934, "epoch": 440} {"train_loss": -8.987775802612305, "global_step": 73935, "epoch": 440} {"train_loss": -9.21638298034668, "global_step": 73936, "epoch": 440} {"train_loss": -8.927478790283203, "global_step": 73937, "epoch": 440} {"train_loss": -8.748502731323242, "global_step": 73938, "epoch": 440} {"train_loss": -8.972166061401367, "global_step": 73939, "epoch": 440} {"train_loss": -8.958555221557617, "global_step": 73940, "epoch": 440} {"train_loss": -9.045026779174805, "global_step": 73941, "epoch": 440} {"train_loss": -8.929709434509277, "global_step": 73942, "epoch": 440} {"train_loss": -9.14675521850586, "global_step": 73943, "epoch": 440} {"train_loss": -8.843552589416504, "global_step": 73944, "epoch": 440} {"train_loss": -8.823614120483398, "global_step": 73945, "epoch": 440} {"train_loss": -8.986875534057617, "global_step": 73946, "epoch": 440} {"train_loss": -9.127656936645508, "global_step": 73947, "epoch": 440} {"train_loss": -8.395467758178711, "global_step": 73948, "epoch": 440} {"train_loss": -9.079605102539062, "global_step": 73949, "epoch": 440} {"train_loss": -8.797983169555664, "global_step": 73950, "epoch": 440} {"train_loss": -8.946637153625488, "global_step": 73951, "epoch": 440} {"train_loss": -9.062694549560547, "global_step": 73952, "epoch": 440} {"train_loss": -8.978132247924805, "global_step": 73953, "epoch": 440} {"train_loss": -8.890974044799805, "global_step": 73954, "epoch": 440} {"train_loss": -9.033426284790039, "global_step": 73955, "epoch": 440} {"train_loss": -9.202577590942383, "global_step": 73956, "epoch": 440} {"train_loss": -9.062376976013184, "global_step": 73957, "epoch": 440} {"train_loss": -8.860208511352539, "global_step": 73958, "epoch": 440} {"train_loss": -8.989185333251953, "global_step": 73959, "epoch": 440} {"train_loss": -9.091416358947754, "global_step": 73960, "epoch": 440} {"train_loss": -8.834590911865234, "global_step": 73961, "epoch": 440} {"train_loss": -8.962188720703125, "global_step": 73962, "epoch": 440} {"train_loss": -9.192939758300781, "global_step": 73963, "epoch": 440} {"train_loss": -9.059026718139648, "global_step": 73964, "epoch": 440} {"train_loss": -8.873720169067383, "global_step": 73965, "epoch": 440} {"train_loss": -9.105603218078613, "global_step": 73966, "epoch": 440} {"train_loss": -9.1298189163208, "global_step": 73967, "epoch": 440} {"train_loss": -9.177205085754395, "global_step": 73968, "epoch": 440} {"train_loss": -9.211616516113281, "global_step": 73969, "epoch": 440} {"train_loss": -9.021079063415527, "global_step": 73970, "epoch": 440} {"train_loss": -9.297172546386719, "global_step": 73971, "epoch": 440} {"train_loss": -9.320005416870117, "global_step": 73972, "epoch": 440} {"train_loss": -8.99976921081543, "global_step": 73973, "epoch": 440} {"train_loss": -9.24034309387207, "global_step": 73974, "epoch": 440} {"train_loss": -9.068694114685059, "global_step": 73975, "epoch": 440} {"train_loss": -8.813528060913086, "global_step": 73976, "epoch": 440} {"train_loss": -8.924322128295898, "global_step": 73977, "epoch": 440} {"train_loss": -9.156755447387695, "global_step": 73978, "epoch": 440} {"train_loss": -8.716928482055664, "global_step": 73979, "epoch": 440} {"train_loss": -8.735761642456055, "global_step": 73980, "epoch": 440} {"train_loss": -8.821197509765625, "global_step": 73981, "epoch": 440} {"train_loss": -8.861143112182617, "global_step": 73982, "epoch": 440} {"train_loss": -8.66541862487793, "global_step": 73983, "epoch": 440} {"train_loss": -8.713188171386719, "global_step": 73984, "epoch": 440} {"train_loss": -8.706283569335938, "global_step": 73985, "epoch": 440} {"train_loss": -8.78697395324707, "global_step": 73986, "epoch": 440} {"train_loss": -8.998891830444336, "global_step": 73987, "epoch": 440} {"train_loss": -8.9786376953125, "global_step": 73988, "epoch": 440} {"train_loss": -8.968929290771484, "global_step": 73989, "epoch": 440} {"train_loss": -8.941913604736328, "global_step": 73990, "epoch": 440} {"train_loss": -8.499359130859375, "global_step": 73991, "epoch": 440} {"train_loss": -8.715919494628906, "global_step": 73992, "epoch": 440} {"train_loss": -8.858043670654297, "global_step": 73993, "epoch": 440} {"train_loss": -8.835891723632812, "global_step": 73994, "epoch": 440} {"train_loss": -9.09465217590332, "global_step": 73995, "epoch": 440} {"train_loss": -9.012964248657227, "global_step": 73996, "epoch": 440} {"train_loss": -9.010665893554688, "global_step": 73997, "epoch": 440} {"train_loss": -9.04682731628418, "global_step": 73998, "epoch": 440} {"train_loss": -8.847579956054688, "global_step": 73999, "epoch": 440} {"train_loss": -8.941987991333008, "global_step": 74000, "epoch": 440} {"train_loss": -8.824198722839355, "global_step": 74001, "epoch": 440} {"train_loss": -8.94743537902832, "global_step": 74002, "epoch": 440} {"train_loss": -8.947491645812988, "global_step": 74003, "epoch": 440} {"train_loss": -9.086406707763672, "global_step": 74004, "epoch": 440} {"train_loss": -8.721610069274902, "global_step": 74005, "epoch": 440} {"train_loss": -8.946395874023438, "global_step": 74006, "epoch": 440} {"train_loss": -9.119003295898438, "global_step": 74007, "epoch": 440} {"train_loss": -8.924683570861816, "global_step": 74008, "epoch": 440} {"train_loss": -8.982614517211914, "global_step": 74009, "epoch": 440} {"train_loss": -8.987815856933594, "global_step": 74010, "epoch": 440} {"train_loss": -9.123170852661133, "global_step": 74011, "epoch": 440} {"train_loss": -9.037382125854492, "global_step": 74012, "epoch": 440} {"train_loss": -9.052064895629883, "global_step": 74013, "epoch": 440} {"train_loss": -9.280250549316406, "global_step": 74014, "epoch": 440} {"train_loss": -8.906950950622559, "global_step": 74015, "epoch": 440} {"train_loss": -9.084406852722168, "global_step": 74016, "epoch": 440} {"train_loss": -9.166744232177734, "global_step": 74017, "epoch": 440} {"train_loss": -9.017223358154297, "global_step": 74018, "epoch": 440} {"train_loss": -9.328081130981445, "global_step": 74019, "epoch": 440} {"train_loss": -8.968097686767578, "global_step": 74020, "epoch": 440} {"train_loss": -8.957844734191895, "global_step": 74021, "epoch": 440} {"train_loss": -9.165626525878906, "global_step": 74022, "epoch": 440} {"train_loss": -9.033963203430176, "global_step": 74023, "epoch": 440} {"train_loss": -9.35023021697998, "global_step": 74024, "epoch": 440} {"train_loss": -9.179129600524902, "global_step": 74025, "epoch": 440} {"train_loss": -9.230962753295898, "global_step": 74026, "epoch": 440} {"train_loss": -9.241665840148926, "global_step": 74027, "epoch": 440} {"train_loss": -9.241166114807129, "global_step": 74028, "epoch": 440} {"train_loss": -9.145716667175293, "global_step": 74029, "epoch": 440} {"train_loss": -9.197973251342773, "global_step": 74030, "epoch": 440} {"train_loss": -8.984105110168457, "global_step": 74031, "epoch": 440} {"train_loss": -9.203571319580078, "global_step": 74032, "epoch": 440} {"train_loss": -9.144542694091797, "global_step": 74033, "epoch": 440} {"train_loss": -9.095792770385742, "global_step": 74034, "epoch": 440} {"train_loss": -9.17756462097168, "global_step": 74035, "epoch": 440} {"train_loss": -9.00054931640625, "global_step": 74036, "epoch": 440} {"train_loss": -9.014150619506836, "global_step": 74037, "epoch": 440} {"train_loss": -9.189369201660156, "global_step": 74038, "epoch": 440} {"train_loss": -9.033531188964844, "global_step": 74039, "epoch": 440} {"train_loss": -9.085212707519531, "global_step": 74040, "epoch": 440} {"train_loss": -8.839025497436523, "global_step": 74041, "epoch": 440} {"train_loss": -8.908004760742188, "global_step": 74042, "epoch": 440} {"train_loss": -9.37939453125, "global_step": 74043, "epoch": 440} {"train_loss": -8.651631355285645, "global_step": 74044, "epoch": 440} {"train_loss": -9.189895629882812, "global_step": 74045, "epoch": 440} {"train_loss": -8.803959846496582, "global_step": 74046, "epoch": 440} {"train_loss": -8.876060485839844, "global_step": 74047, "epoch": 440} {"train_loss": -8.922796249389648, "global_step": 74048, "epoch": 440} {"train_loss": -8.805473327636719, "global_step": 74049, "epoch": 440} {"train_loss": -8.786460876464844, "global_step": 74050, "epoch": 440} {"train_loss": -8.929408073425293, "global_step": 74051, "epoch": 440} {"train_loss": -8.621562957763672, "global_step": 74052, "epoch": 440} {"train_loss": -8.94580078125, "global_step": 74053, "epoch": 440} {"train_loss": -8.920072555541992, "global_step": 74054, "epoch": 440} {"train_loss": -8.842376708984375, "global_step": 74055, "epoch": 440} {"train_loss": -8.898695945739746, "global_step": 74056, "epoch": 440} {"train_loss": -8.959152221679688, "global_step": 74057, "epoch": 440} {"train_loss": -8.748183250427246, "global_step": 74058, "epoch": 440} {"train_loss": -9.043901443481445, "global_step": 74059, "epoch": 440} {"train_loss": -9.119062423706055, "global_step": 74060, "epoch": 440} {"train_loss": -8.889730453491211, "global_step": 74061, "epoch": 440} {"train_loss": -8.946589469909668, "global_step": 74062, "epoch": 440} {"train_loss": -9.097888946533203, "global_step": 74063, "epoch": 440} {"train_loss": -8.695514678955078, "global_step": 74064, "epoch": 440} {"train_loss": -9.210436820983887, "global_step": 74065, "epoch": 440} {"train_loss": -9.187932014465332, "global_step": 74066, "epoch": 440} {"train_loss": -8.910085678100586, "global_step": 74067, "epoch": 440} {"train_loss": -8.956953048706055, "global_step": 74068, "epoch": 440} {"train_loss": -9.169212341308594, "global_step": 74069, "epoch": 440} {"train_loss": -9.244214057922363, "global_step": 74070, "epoch": 440} {"train_loss": -9.254559516906738, "global_step": 74071, "epoch": 440} {"train_loss": -9.072107315063477, "global_step": 74072, "epoch": 440} {"train_loss": -9.102861404418945, "global_step": 74073, "epoch": 440} {"train_loss": -9.23167610168457, "global_step": 74074, "epoch": 440} {"train_loss": -9.275617599487305, "global_step": 74075, "epoch": 440} {"train_loss": -9.24049186706543, "global_step": 74076, "epoch": 440} {"train_loss": -9.166324615478516, "global_step": 74077, "epoch": 440} {"train_loss": -9.277212142944336, "global_step": 74078, "epoch": 440} {"train_loss": -9.280133247375488, "global_step": 74079, "epoch": 440} {"train_loss": -9.346624374389648, "global_step": 74080, "epoch": 440} {"train_loss": -8.906359672546387, "global_step": 74081, "epoch": 440} {"train_loss": -9.125669479370117, "global_step": 74082, "epoch": 440} {"train_loss": -9.061906814575195, "global_step": 74083, "epoch": 440} {"train_loss": -9.231497764587402, "global_step": 74084, "epoch": 440} {"train_loss": -9.180233001708984, "global_step": 74085, "epoch": 440} {"train_loss": -8.975813865661621, "global_step": 74086, "epoch": 440} {"train_loss": -9.009539195469447, "global_step": 74087, "epoch": 440, "val_loss": 195984.5, "train_action_mse_error": 8.191181182861328} {"train_loss": -9.07362174987793, "global_step": 74088, "epoch": 441} {"train_loss": -9.244392395019531, "global_step": 74089, "epoch": 441} {"train_loss": -9.013294219970703, "global_step": 74090, "epoch": 441} {"train_loss": -9.00902271270752, "global_step": 74091, "epoch": 441} {"train_loss": -9.04792594909668, "global_step": 74092, "epoch": 441} {"train_loss": -8.54382610321045, "global_step": 74093, "epoch": 441} {"train_loss": -8.599916458129883, "global_step": 74094, "epoch": 441} {"train_loss": -8.845893859863281, "global_step": 74095, "epoch": 441} {"train_loss": -8.564469337463379, "global_step": 74096, "epoch": 441} {"train_loss": -8.784322738647461, "global_step": 74097, "epoch": 441} {"train_loss": -8.630566596984863, "global_step": 74098, "epoch": 441} {"train_loss": -8.662260055541992, "global_step": 74099, "epoch": 441} {"train_loss": -8.691961288452148, "global_step": 74100, "epoch": 441} {"train_loss": -8.799654006958008, "global_step": 74101, "epoch": 441} {"train_loss": -8.73652172088623, "global_step": 74102, "epoch": 441} {"train_loss": -8.741079330444336, "global_step": 74103, "epoch": 441} {"train_loss": -8.512269973754883, "global_step": 74104, "epoch": 441} {"train_loss": -8.742362976074219, "global_step": 74105, "epoch": 441} {"train_loss": -8.855134963989258, "global_step": 74106, "epoch": 441} {"train_loss": -8.624914169311523, "global_step": 74107, "epoch": 441} {"train_loss": -8.866037368774414, "global_step": 74108, "epoch": 441} {"train_loss": -8.777522087097168, "global_step": 74109, "epoch": 441} {"train_loss": -8.864461898803711, "global_step": 74110, "epoch": 441} {"train_loss": -8.857505798339844, "global_step": 74111, "epoch": 441} {"train_loss": -9.056106567382812, "global_step": 74112, "epoch": 441} {"train_loss": -8.825113296508789, "global_step": 74113, "epoch": 441} {"train_loss": -8.835758209228516, "global_step": 74114, "epoch": 441} {"train_loss": -8.610225677490234, "global_step": 74115, "epoch": 441} {"train_loss": -8.820067405700684, "global_step": 74116, "epoch": 441} {"train_loss": -8.584512710571289, "global_step": 74117, "epoch": 441} {"train_loss": -8.840316772460938, "global_step": 74118, "epoch": 441} {"train_loss": -8.900457382202148, "global_step": 74119, "epoch": 441} {"train_loss": -8.88546085357666, "global_step": 74120, "epoch": 441} {"train_loss": -8.730629920959473, "global_step": 74121, "epoch": 441} {"train_loss": -8.795524597167969, "global_step": 74122, "epoch": 441} {"train_loss": -8.904125213623047, "global_step": 74123, "epoch": 441} {"train_loss": -8.760108947753906, "global_step": 74124, "epoch": 441} {"train_loss": -8.476715087890625, "global_step": 74125, "epoch": 441} {"train_loss": -9.006938934326172, "global_step": 74126, "epoch": 441} {"train_loss": -8.972827911376953, "global_step": 74127, "epoch": 441} {"train_loss": -8.911084175109863, "global_step": 74128, "epoch": 441} {"train_loss": -8.86093521118164, "global_step": 74129, "epoch": 441} {"train_loss": -9.05752182006836, "global_step": 74130, "epoch": 441} {"train_loss": -8.9754638671875, "global_step": 74131, "epoch": 441} {"train_loss": -9.284399032592773, "global_step": 74132, "epoch": 441} {"train_loss": -8.997410774230957, "global_step": 74133, "epoch": 441} {"train_loss": -9.226889610290527, "global_step": 74134, "epoch": 441} {"train_loss": -8.974218368530273, "global_step": 74135, "epoch": 441} {"train_loss": -9.15421199798584, "global_step": 74136, "epoch": 441} {"train_loss": -9.108192443847656, "global_step": 74137, "epoch": 441} {"train_loss": -9.080514907836914, "global_step": 74138, "epoch": 441} {"train_loss": -8.920116424560547, "global_step": 74139, "epoch": 441} {"train_loss": -9.009811401367188, "global_step": 74140, "epoch": 441} {"train_loss": -8.972816467285156, "global_step": 74141, "epoch": 441} {"train_loss": -9.175344467163086, "global_step": 74142, "epoch": 441} {"train_loss": -9.061387062072754, "global_step": 74143, "epoch": 441} {"train_loss": -9.001691818237305, "global_step": 74144, "epoch": 441} {"train_loss": -9.258188247680664, "global_step": 74145, "epoch": 441} {"train_loss": -8.946499824523926, "global_step": 74146, "epoch": 441} {"train_loss": -9.228887557983398, "global_step": 74147, "epoch": 441} {"train_loss": -9.51042652130127, "global_step": 74148, "epoch": 441} {"train_loss": -9.148892402648926, "global_step": 74149, "epoch": 441} {"train_loss": -9.28261947631836, "global_step": 74150, "epoch": 441} {"train_loss": -9.034889221191406, "global_step": 74151, "epoch": 441} {"train_loss": -9.15139389038086, "global_step": 74152, "epoch": 441} {"train_loss": -8.982847213745117, "global_step": 74153, "epoch": 441} {"train_loss": -9.242457389831543, "global_step": 74154, "epoch": 441} {"train_loss": -9.084999084472656, "global_step": 74155, "epoch": 441} {"train_loss": -8.626794815063477, "global_step": 74156, "epoch": 441} {"train_loss": -9.060914993286133, "global_step": 74157, "epoch": 441} {"train_loss": -8.939811706542969, "global_step": 74158, "epoch": 441} {"train_loss": -9.020261764526367, "global_step": 74159, "epoch": 441} {"train_loss": -9.235433578491211, "global_step": 74160, "epoch": 441} {"train_loss": -9.163745880126953, "global_step": 74161, "epoch": 441} {"train_loss": -8.977165222167969, "global_step": 74162, "epoch": 441} {"train_loss": -9.282854080200195, "global_step": 74163, "epoch": 441} {"train_loss": -8.926137924194336, "global_step": 74164, "epoch": 441} {"train_loss": -9.02868938446045, "global_step": 74165, "epoch": 441} {"train_loss": -9.162230491638184, "global_step": 74166, "epoch": 441} {"train_loss": -8.94814395904541, "global_step": 74167, "epoch": 441} {"train_loss": -9.066999435424805, "global_step": 74168, "epoch": 441} {"train_loss": -8.790548324584961, "global_step": 74169, "epoch": 441} {"train_loss": -9.25059700012207, "global_step": 74170, "epoch": 441} {"train_loss": -8.963297843933105, "global_step": 74171, "epoch": 441} {"train_loss": -9.105775833129883, "global_step": 74172, "epoch": 441} {"train_loss": -8.967606544494629, "global_step": 74173, "epoch": 441} {"train_loss": -9.149921417236328, "global_step": 74174, "epoch": 441} {"train_loss": -8.934814453125, "global_step": 74175, "epoch": 441} {"train_loss": -8.910247802734375, "global_step": 74176, "epoch": 441} {"train_loss": -8.832890510559082, "global_step": 74177, "epoch": 441} {"train_loss": -8.69255256652832, "global_step": 74178, "epoch": 441} {"train_loss": -8.652109146118164, "global_step": 74179, "epoch": 441} {"train_loss": -8.741569519042969, "global_step": 74180, "epoch": 441} {"train_loss": -8.422171592712402, "global_step": 74181, "epoch": 441} {"train_loss": -8.688161849975586, "global_step": 74182, "epoch": 441} {"train_loss": -8.423639297485352, "global_step": 74183, "epoch": 441} {"train_loss": -8.482988357543945, "global_step": 74184, "epoch": 441} {"train_loss": -8.224531173706055, "global_step": 74185, "epoch": 441} {"train_loss": -8.681598663330078, "global_step": 74186, "epoch": 441} {"train_loss": -8.776269912719727, "global_step": 74187, "epoch": 441} {"train_loss": -8.586584091186523, "global_step": 74188, "epoch": 441} {"train_loss": -8.739495277404785, "global_step": 74189, "epoch": 441} {"train_loss": -8.891061782836914, "global_step": 74190, "epoch": 441} {"train_loss": -8.697956085205078, "global_step": 74191, "epoch": 441} {"train_loss": -8.926018714904785, "global_step": 74192, "epoch": 441} {"train_loss": -8.913294792175293, "global_step": 74193, "epoch": 441} {"train_loss": -8.815156936645508, "global_step": 74194, "epoch": 441} {"train_loss": -8.915494918823242, "global_step": 74195, "epoch": 441} {"train_loss": -8.907304763793945, "global_step": 74196, "epoch": 441} {"train_loss": -8.94359302520752, "global_step": 74197, "epoch": 441} {"train_loss": -9.06801700592041, "global_step": 74198, "epoch": 441} {"train_loss": -8.93766975402832, "global_step": 74199, "epoch": 441} {"train_loss": -9.12778377532959, "global_step": 74200, "epoch": 441} {"train_loss": -9.150300979614258, "global_step": 74201, "epoch": 441} {"train_loss": -9.138982772827148, "global_step": 74202, "epoch": 441} {"train_loss": -8.763134002685547, "global_step": 74203, "epoch": 441} {"train_loss": -9.079504013061523, "global_step": 74204, "epoch": 441} {"train_loss": -9.200679779052734, "global_step": 74205, "epoch": 441} {"train_loss": -8.782035827636719, "global_step": 74206, "epoch": 441} {"train_loss": -9.114577293395996, "global_step": 74207, "epoch": 441} {"train_loss": -8.827152252197266, "global_step": 74208, "epoch": 441} {"train_loss": -9.234676361083984, "global_step": 74209, "epoch": 441} {"train_loss": -8.618157386779785, "global_step": 74210, "epoch": 441} {"train_loss": -9.158663749694824, "global_step": 74211, "epoch": 441} {"train_loss": -8.93089485168457, "global_step": 74212, "epoch": 441} {"train_loss": -9.134774208068848, "global_step": 74213, "epoch": 441} {"train_loss": -9.084407806396484, "global_step": 74214, "epoch": 441} {"train_loss": -9.08389949798584, "global_step": 74215, "epoch": 441} {"train_loss": -9.117874145507812, "global_step": 74216, "epoch": 441} {"train_loss": -8.617798805236816, "global_step": 74217, "epoch": 441} {"train_loss": -9.12196159362793, "global_step": 74218, "epoch": 441} {"train_loss": -9.106072425842285, "global_step": 74219, "epoch": 441} {"train_loss": -8.78399658203125, "global_step": 74220, "epoch": 441} {"train_loss": -9.099529266357422, "global_step": 74221, "epoch": 441} {"train_loss": -8.995792388916016, "global_step": 74222, "epoch": 441} {"train_loss": -9.272685050964355, "global_step": 74223, "epoch": 441} {"train_loss": -9.035541534423828, "global_step": 74224, "epoch": 441} {"train_loss": -9.20632553100586, "global_step": 74225, "epoch": 441} {"train_loss": -9.060632705688477, "global_step": 74226, "epoch": 441} {"train_loss": -9.301191329956055, "global_step": 74227, "epoch": 441} {"train_loss": -9.13760757446289, "global_step": 74228, "epoch": 441} {"train_loss": -9.039278030395508, "global_step": 74229, "epoch": 441} {"train_loss": -9.270904541015625, "global_step": 74230, "epoch": 441} {"train_loss": -8.831718444824219, "global_step": 74231, "epoch": 441} {"train_loss": -9.203635215759277, "global_step": 74232, "epoch": 441} {"train_loss": -9.227198600769043, "global_step": 74233, "epoch": 441} {"train_loss": -8.759764671325684, "global_step": 74234, "epoch": 441} {"train_loss": -9.138286590576172, "global_step": 74235, "epoch": 441} {"train_loss": -9.019165992736816, "global_step": 74236, "epoch": 441} {"train_loss": -8.912826538085938, "global_step": 74237, "epoch": 441} {"train_loss": -8.990259170532227, "global_step": 74238, "epoch": 441} {"train_loss": -9.101882934570312, "global_step": 74239, "epoch": 441} {"train_loss": -9.025413513183594, "global_step": 74240, "epoch": 441} {"train_loss": -9.139535903930664, "global_step": 74241, "epoch": 441} {"train_loss": -9.081119537353516, "global_step": 74242, "epoch": 441} {"train_loss": -9.147592544555664, "global_step": 74243, "epoch": 441} {"train_loss": -8.908867835998535, "global_step": 74244, "epoch": 441} {"train_loss": -9.068870544433594, "global_step": 74245, "epoch": 441} {"train_loss": -9.022786140441895, "global_step": 74246, "epoch": 441} {"train_loss": -9.019941329956055, "global_step": 74247, "epoch": 441} {"train_loss": -9.005314826965332, "global_step": 74248, "epoch": 441} {"train_loss": -9.23367977142334, "global_step": 74249, "epoch": 441} {"train_loss": -9.008790016174316, "global_step": 74250, "epoch": 441} {"train_loss": -8.992384910583496, "global_step": 74251, "epoch": 441} {"train_loss": -9.078071594238281, "global_step": 74252, "epoch": 441} {"train_loss": -8.843755722045898, "global_step": 74253, "epoch": 441} {"train_loss": -9.154375076293945, "global_step": 74254, "epoch": 441} {"train_loss": -8.951640464010692, "global_step": 74255, "epoch": 441, "val_loss": 195396.296875} {"train_loss": -8.932136535644531, "global_step": 74256, "epoch": 442} {"train_loss": -8.997776985168457, "global_step": 74257, "epoch": 442} {"train_loss": -8.799463272094727, "global_step": 74258, "epoch": 442} {"train_loss": -8.925338745117188, "global_step": 74259, "epoch": 442} {"train_loss": -8.833551406860352, "global_step": 74260, "epoch": 442} {"train_loss": -8.594582557678223, "global_step": 74261, "epoch": 442} {"train_loss": -8.993980407714844, "global_step": 74262, "epoch": 442} {"train_loss": -8.534085273742676, "global_step": 74263, "epoch": 442} {"train_loss": -8.989031791687012, "global_step": 74264, "epoch": 442} {"train_loss": -9.09350872039795, "global_step": 74265, "epoch": 442} {"train_loss": -9.121360778808594, "global_step": 74266, "epoch": 442} {"train_loss": -9.1571044921875, "global_step": 74267, "epoch": 442} {"train_loss": -8.812366485595703, "global_step": 74268, "epoch": 442} {"train_loss": -9.055633544921875, "global_step": 74269, "epoch": 442} {"train_loss": -9.04387378692627, "global_step": 74270, "epoch": 442} {"train_loss": -9.266565322875977, "global_step": 74271, "epoch": 442} {"train_loss": -9.184035301208496, "global_step": 74272, "epoch": 442} {"train_loss": -9.041253089904785, "global_step": 74273, "epoch": 442} {"train_loss": -8.962326049804688, "global_step": 74274, "epoch": 442} {"train_loss": -9.236217498779297, "global_step": 74275, "epoch": 442} {"train_loss": -9.206995010375977, "global_step": 74276, "epoch": 442} {"train_loss": -9.217794418334961, "global_step": 74277, "epoch": 442} {"train_loss": -9.198582649230957, "global_step": 74278, "epoch": 442} {"train_loss": -8.87887191772461, "global_step": 74279, "epoch": 442} {"train_loss": -9.061402320861816, "global_step": 74280, "epoch": 442} {"train_loss": -8.973581314086914, "global_step": 74281, "epoch": 442} {"train_loss": -9.253890037536621, "global_step": 74282, "epoch": 442} {"train_loss": -8.689033508300781, "global_step": 74283, "epoch": 442} {"train_loss": -9.069567680358887, "global_step": 74284, "epoch": 442} {"train_loss": -8.692730903625488, "global_step": 74285, "epoch": 442} {"train_loss": -9.093830108642578, "global_step": 74286, "epoch": 442} {"train_loss": -8.716499328613281, "global_step": 74287, "epoch": 442} {"train_loss": -8.673069953918457, "global_step": 74288, "epoch": 442} {"train_loss": -8.37736701965332, "global_step": 74289, "epoch": 442} {"train_loss": -8.955785751342773, "global_step": 74290, "epoch": 442} {"train_loss": -8.877164840698242, "global_step": 74291, "epoch": 442} {"train_loss": -9.073620796203613, "global_step": 74292, "epoch": 442} {"train_loss": -8.809786796569824, "global_step": 74293, "epoch": 442} {"train_loss": -9.136527061462402, "global_step": 74294, "epoch": 442} {"train_loss": -8.970402717590332, "global_step": 74295, "epoch": 442} {"train_loss": -8.865999221801758, "global_step": 74296, "epoch": 442} {"train_loss": -8.839325904846191, "global_step": 74297, "epoch": 442} {"train_loss": -8.964075088500977, "global_step": 74298, "epoch": 442} {"train_loss": -8.949398040771484, "global_step": 74299, "epoch": 442} {"train_loss": -8.969453811645508, "global_step": 74300, "epoch": 442} {"train_loss": -8.8880615234375, "global_step": 74301, "epoch": 442} {"train_loss": -8.661642074584961, "global_step": 74302, "epoch": 442} {"train_loss": -8.9439058303833, "global_step": 74303, "epoch": 442} {"train_loss": -9.144865036010742, "global_step": 74304, "epoch": 442} {"train_loss": -8.861021041870117, "global_step": 74305, "epoch": 442} {"train_loss": -9.065559387207031, "global_step": 74306, "epoch": 442} {"train_loss": -8.852693557739258, "global_step": 74307, "epoch": 442} {"train_loss": -9.18867301940918, "global_step": 74308, "epoch": 442} {"train_loss": -9.036619186401367, "global_step": 74309, "epoch": 442} {"train_loss": -9.254670143127441, "global_step": 74310, "epoch": 442} {"train_loss": -8.929056167602539, "global_step": 74311, "epoch": 442} {"train_loss": -8.924848556518555, "global_step": 74312, "epoch": 442} {"train_loss": -9.141714096069336, "global_step": 74313, "epoch": 442} {"train_loss": -9.06069564819336, "global_step": 74314, "epoch": 442} {"train_loss": -9.117243766784668, "global_step": 74315, "epoch": 442} {"train_loss": -9.317171096801758, "global_step": 74316, "epoch": 442} {"train_loss": -9.379624366760254, "global_step": 74317, "epoch": 442} {"train_loss": -9.293824195861816, "global_step": 74318, "epoch": 442} {"train_loss": -9.29776382446289, "global_step": 74319, "epoch": 442} {"train_loss": -9.170816421508789, "global_step": 74320, "epoch": 442} {"train_loss": -9.253519058227539, "global_step": 74321, "epoch": 442} {"train_loss": -9.456984519958496, "global_step": 74322, "epoch": 442} {"train_loss": -8.958745956420898, "global_step": 74323, "epoch": 442} {"train_loss": -9.309314727783203, "global_step": 74324, "epoch": 442} {"train_loss": -9.016168594360352, "global_step": 74325, "epoch": 442} {"train_loss": -9.325019836425781, "global_step": 74326, "epoch": 442} {"train_loss": -9.21274471282959, "global_step": 74327, "epoch": 442} {"train_loss": -9.111518859863281, "global_step": 74328, "epoch": 442} {"train_loss": -9.14864730834961, "global_step": 74329, "epoch": 442} {"train_loss": -8.945215225219727, "global_step": 74330, "epoch": 442} {"train_loss": -8.963188171386719, "global_step": 74331, "epoch": 442} {"train_loss": -9.027009010314941, "global_step": 74332, "epoch": 442} {"train_loss": -8.892373085021973, "global_step": 74333, "epoch": 442} {"train_loss": -8.91346549987793, "global_step": 74334, "epoch": 442} {"train_loss": -8.942346572875977, "global_step": 74335, "epoch": 442} {"train_loss": -8.933844566345215, "global_step": 74336, "epoch": 442} {"train_loss": -9.016799926757812, "global_step": 74337, "epoch": 442} {"train_loss": -9.073100090026855, "global_step": 74338, "epoch": 442} {"train_loss": -9.210346221923828, "global_step": 74339, "epoch": 442} {"train_loss": -8.958109855651855, "global_step": 74340, "epoch": 442} {"train_loss": -9.039769172668457, "global_step": 74341, "epoch": 442} {"train_loss": -9.189996719360352, "global_step": 74342, "epoch": 442} {"train_loss": -9.008698463439941, "global_step": 74343, "epoch": 442} {"train_loss": -9.15517807006836, "global_step": 74344, "epoch": 442} {"train_loss": -9.081947326660156, "global_step": 74345, "epoch": 442} {"train_loss": -9.14948844909668, "global_step": 74346, "epoch": 442} {"train_loss": -8.760150909423828, "global_step": 74347, "epoch": 442} {"train_loss": -9.248930931091309, "global_step": 74348, "epoch": 442} {"train_loss": -9.080914497375488, "global_step": 74349, "epoch": 442} {"train_loss": -9.130913734436035, "global_step": 74350, "epoch": 442} {"train_loss": -9.219276428222656, "global_step": 74351, "epoch": 442} {"train_loss": -9.059008598327637, "global_step": 74352, "epoch": 442} {"train_loss": -9.364312171936035, "global_step": 74353, "epoch": 442} {"train_loss": -9.446273803710938, "global_step": 74354, "epoch": 442} {"train_loss": -8.998468399047852, "global_step": 74355, "epoch": 442} {"train_loss": -9.15015983581543, "global_step": 74356, "epoch": 442} {"train_loss": -9.090049743652344, "global_step": 74357, "epoch": 442} {"train_loss": -9.228062629699707, "global_step": 74358, "epoch": 442} {"train_loss": -9.192588806152344, "global_step": 74359, "epoch": 442} {"train_loss": -9.404447555541992, "global_step": 74360, "epoch": 442} {"train_loss": -8.944190979003906, "global_step": 74361, "epoch": 442} {"train_loss": -9.359309196472168, "global_step": 74362, "epoch": 442} {"train_loss": -9.067804336547852, "global_step": 74363, "epoch": 442} {"train_loss": -8.99410629272461, "global_step": 74364, "epoch": 442} {"train_loss": -9.000417709350586, "global_step": 74365, "epoch": 442} {"train_loss": -8.896788597106934, "global_step": 74366, "epoch": 442} {"train_loss": -9.234334945678711, "global_step": 74367, "epoch": 442} {"train_loss": -8.97412395477295, "global_step": 74368, "epoch": 442} {"train_loss": -9.03284740447998, "global_step": 74369, "epoch": 442} {"train_loss": -9.228111267089844, "global_step": 74370, "epoch": 442} {"train_loss": -9.076133728027344, "global_step": 74371, "epoch": 442} {"train_loss": -9.316946983337402, "global_step": 74372, "epoch": 442} {"train_loss": -8.858266830444336, "global_step": 74373, "epoch": 442} {"train_loss": -9.078573226928711, "global_step": 74374, "epoch": 442} {"train_loss": -9.152100563049316, "global_step": 74375, "epoch": 442} {"train_loss": -9.217329978942871, "global_step": 74376, "epoch": 442} {"train_loss": -9.117626190185547, "global_step": 74377, "epoch": 442} {"train_loss": -9.093789100646973, "global_step": 74378, "epoch": 442} {"train_loss": -8.848451614379883, "global_step": 74379, "epoch": 442} {"train_loss": -8.724491119384766, "global_step": 74380, "epoch": 442} {"train_loss": -9.16640853881836, "global_step": 74381, "epoch": 442} {"train_loss": -8.767610549926758, "global_step": 74382, "epoch": 442} {"train_loss": -8.634987831115723, "global_step": 74383, "epoch": 442} {"train_loss": -8.769100189208984, "global_step": 74384, "epoch": 442} {"train_loss": -8.755236625671387, "global_step": 74385, "epoch": 442} {"train_loss": -8.80100154876709, "global_step": 74386, "epoch": 442} {"train_loss": -8.909782409667969, "global_step": 74387, "epoch": 442} {"train_loss": -8.692665100097656, "global_step": 74388, "epoch": 442} {"train_loss": -8.716020584106445, "global_step": 74389, "epoch": 442} {"train_loss": -8.893019676208496, "global_step": 74390, "epoch": 442} {"train_loss": -8.877978324890137, "global_step": 74391, "epoch": 442} {"train_loss": -9.064879417419434, "global_step": 74392, "epoch": 442} {"train_loss": -8.879111289978027, "global_step": 74393, "epoch": 442} {"train_loss": -8.919906616210938, "global_step": 74394, "epoch": 442} {"train_loss": -8.893190383911133, "global_step": 74395, "epoch": 442} {"train_loss": -9.124881744384766, "global_step": 74396, "epoch": 442} {"train_loss": -9.201171875, "global_step": 74397, "epoch": 442} {"train_loss": -9.18600845336914, "global_step": 74398, "epoch": 442} {"train_loss": -8.931203842163086, "global_step": 74399, "epoch": 442} {"train_loss": -8.952640533447266, "global_step": 74400, "epoch": 442} {"train_loss": -9.12574577331543, "global_step": 74401, "epoch": 442} {"train_loss": -9.191274642944336, "global_step": 74402, "epoch": 442} {"train_loss": -9.070467948913574, "global_step": 74403, "epoch": 442} {"train_loss": -8.955595016479492, "global_step": 74404, "epoch": 442} {"train_loss": -8.943330764770508, "global_step": 74405, "epoch": 442} {"train_loss": -9.076741218566895, "global_step": 74406, "epoch": 442} {"train_loss": -8.974563598632812, "global_step": 74407, "epoch": 442} {"train_loss": -8.852765083312988, "global_step": 74408, "epoch": 442} {"train_loss": -9.052763938903809, "global_step": 74409, "epoch": 442} {"train_loss": -8.804102897644043, "global_step": 74410, "epoch": 442} {"train_loss": -9.172183990478516, "global_step": 74411, "epoch": 442} {"train_loss": -9.111751556396484, "global_step": 74412, "epoch": 442} {"train_loss": -8.979226112365723, "global_step": 74413, "epoch": 442} {"train_loss": -9.05880355834961, "global_step": 74414, "epoch": 442} {"train_loss": -9.128889083862305, "global_step": 74415, "epoch": 442} {"train_loss": -8.83664321899414, "global_step": 74416, "epoch": 442} {"train_loss": -9.193479537963867, "global_step": 74417, "epoch": 442} {"train_loss": -9.134596824645996, "global_step": 74418, "epoch": 442} {"train_loss": -8.862077713012695, "global_step": 74419, "epoch": 442} {"train_loss": -9.377880096435547, "global_step": 74420, "epoch": 442} {"train_loss": -9.029891967773438, "global_step": 74421, "epoch": 442} {"train_loss": -9.150872230529785, "global_step": 74422, "epoch": 442} {"train_loss": -9.026352547463917, "global_step": 74423, "epoch": 442, "val_loss": 194279.125} {"train_loss": -9.263265609741211, "global_step": 74424, "epoch": 443} {"train_loss": -8.856890678405762, "global_step": 74425, "epoch": 443} {"train_loss": -8.95596694946289, "global_step": 74426, "epoch": 443} {"train_loss": -8.963640213012695, "global_step": 74427, "epoch": 443} {"train_loss": -9.015586853027344, "global_step": 74428, "epoch": 443} {"train_loss": -8.579551696777344, "global_step": 74429, "epoch": 443} {"train_loss": -9.024320602416992, "global_step": 74430, "epoch": 443} {"train_loss": -8.81488037109375, "global_step": 74431, "epoch": 443} {"train_loss": -9.000446319580078, "global_step": 74432, "epoch": 443} {"train_loss": -8.971870422363281, "global_step": 74433, "epoch": 443} {"train_loss": -9.071057319641113, "global_step": 74434, "epoch": 443} {"train_loss": -9.036526679992676, "global_step": 74435, "epoch": 443} {"train_loss": -8.920988082885742, "global_step": 74436, "epoch": 443} {"train_loss": -8.941957473754883, "global_step": 74437, "epoch": 443} {"train_loss": -9.07064437866211, "global_step": 74438, "epoch": 443} {"train_loss": -9.048941612243652, "global_step": 74439, "epoch": 443} {"train_loss": -9.162291526794434, "global_step": 74440, "epoch": 443} {"train_loss": -9.112432479858398, "global_step": 74441, "epoch": 443} {"train_loss": -9.177855491638184, "global_step": 74442, "epoch": 443} {"train_loss": -9.247507095336914, "global_step": 74443, "epoch": 443} {"train_loss": -9.067631721496582, "global_step": 74444, "epoch": 443} {"train_loss": -9.217620849609375, "global_step": 74445, "epoch": 443} {"train_loss": -9.098628997802734, "global_step": 74446, "epoch": 443} {"train_loss": -9.102298736572266, "global_step": 74447, "epoch": 443} {"train_loss": -9.087100982666016, "global_step": 74448, "epoch": 443} {"train_loss": -9.26736831665039, "global_step": 74449, "epoch": 443} {"train_loss": -9.282011985778809, "global_step": 74450, "epoch": 443} {"train_loss": -9.21108341217041, "global_step": 74451, "epoch": 443} {"train_loss": -9.341468811035156, "global_step": 74452, "epoch": 443} {"train_loss": -9.361564636230469, "global_step": 74453, "epoch": 443} {"train_loss": -9.136343002319336, "global_step": 74454, "epoch": 443} {"train_loss": -9.197803497314453, "global_step": 74455, "epoch": 443} {"train_loss": -9.24562931060791, "global_step": 74456, "epoch": 443} {"train_loss": -8.977102279663086, "global_step": 74457, "epoch": 443} {"train_loss": -8.963763236999512, "global_step": 74458, "epoch": 443} {"train_loss": -9.16650390625, "global_step": 74459, "epoch": 443} {"train_loss": -9.184579849243164, "global_step": 74460, "epoch": 443} {"train_loss": -8.942984580993652, "global_step": 74461, "epoch": 443} {"train_loss": -9.088178634643555, "global_step": 74462, "epoch": 443} {"train_loss": -9.104056358337402, "global_step": 74463, "epoch": 443} {"train_loss": -9.170282363891602, "global_step": 74464, "epoch": 443} {"train_loss": -9.264556884765625, "global_step": 74465, "epoch": 443} {"train_loss": -8.73928165435791, "global_step": 74466, "epoch": 443} {"train_loss": -9.074703216552734, "global_step": 74467, "epoch": 443} {"train_loss": -9.129292488098145, "global_step": 74468, "epoch": 443} {"train_loss": -9.120988845825195, "global_step": 74469, "epoch": 443} {"train_loss": -8.699134826660156, "global_step": 74470, "epoch": 443} {"train_loss": -8.586832046508789, "global_step": 74471, "epoch": 443} {"train_loss": -8.860034942626953, "global_step": 74472, "epoch": 443} {"train_loss": -9.112627983093262, "global_step": 74473, "epoch": 443} {"train_loss": -8.870553970336914, "global_step": 74474, "epoch": 443} {"train_loss": -8.998018264770508, "global_step": 74475, "epoch": 443} {"train_loss": -8.981689453125, "global_step": 74476, "epoch": 443} {"train_loss": -9.049269676208496, "global_step": 74477, "epoch": 443} {"train_loss": -8.885886192321777, "global_step": 74478, "epoch": 443} {"train_loss": -9.197632789611816, "global_step": 74479, "epoch": 443} {"train_loss": -8.686193466186523, "global_step": 74480, "epoch": 443} {"train_loss": -8.908048629760742, "global_step": 74481, "epoch": 443} {"train_loss": -9.055846214294434, "global_step": 74482, "epoch": 443} {"train_loss": -9.240802764892578, "global_step": 74483, "epoch": 443} {"train_loss": -9.187064170837402, "global_step": 74484, "epoch": 443} {"train_loss": -8.89727783203125, "global_step": 74485, "epoch": 443} {"train_loss": -9.154788970947266, "global_step": 74486, "epoch": 443} {"train_loss": -8.948881149291992, "global_step": 74487, "epoch": 443} {"train_loss": -9.194887161254883, "global_step": 74488, "epoch": 443} {"train_loss": -9.222893714904785, "global_step": 74489, "epoch": 443} {"train_loss": -8.896071434020996, "global_step": 74490, "epoch": 443} {"train_loss": -9.066394805908203, "global_step": 74491, "epoch": 443} {"train_loss": -9.239038467407227, "global_step": 74492, "epoch": 443} {"train_loss": -9.010930061340332, "global_step": 74493, "epoch": 443} {"train_loss": -9.148275375366211, "global_step": 74494, "epoch": 443} {"train_loss": -9.371637344360352, "global_step": 74495, "epoch": 443} {"train_loss": -9.137904167175293, "global_step": 74496, "epoch": 443} {"train_loss": -9.115180969238281, "global_step": 74497, "epoch": 443} {"train_loss": -9.098834991455078, "global_step": 74498, "epoch": 443} {"train_loss": -9.036920547485352, "global_step": 74499, "epoch": 443} {"train_loss": -8.933321952819824, "global_step": 74500, "epoch": 443} {"train_loss": -9.104241371154785, "global_step": 74501, "epoch": 443} {"train_loss": -8.856849670410156, "global_step": 74502, "epoch": 443} {"train_loss": -9.064017295837402, "global_step": 74503, "epoch": 443} {"train_loss": -9.286876678466797, "global_step": 74504, "epoch": 443} {"train_loss": -8.857264518737793, "global_step": 74505, "epoch": 443} {"train_loss": -9.226401329040527, "global_step": 74506, "epoch": 443} {"train_loss": -8.880265235900879, "global_step": 74507, "epoch": 443} {"train_loss": -8.878423690795898, "global_step": 74508, "epoch": 443} {"train_loss": -8.990900039672852, "global_step": 74509, "epoch": 443} {"train_loss": -8.852106094360352, "global_step": 74510, "epoch": 443} {"train_loss": -8.800518035888672, "global_step": 74511, "epoch": 443} {"train_loss": -8.873193740844727, "global_step": 74512, "epoch": 443} {"train_loss": -8.928261756896973, "global_step": 74513, "epoch": 443} {"train_loss": -8.88677978515625, "global_step": 74514, "epoch": 443} {"train_loss": -8.925556182861328, "global_step": 74515, "epoch": 443} {"train_loss": -8.87649917602539, "global_step": 74516, "epoch": 443} {"train_loss": -8.823216438293457, "global_step": 74517, "epoch": 443} {"train_loss": -8.746591567993164, "global_step": 74518, "epoch": 443} {"train_loss": -8.9405517578125, "global_step": 74519, "epoch": 443} {"train_loss": -8.84725284576416, "global_step": 74520, "epoch": 443} {"train_loss": -8.79929256439209, "global_step": 74521, "epoch": 443} {"train_loss": -8.843002319335938, "global_step": 74522, "epoch": 443} {"train_loss": -8.948394775390625, "global_step": 74523, "epoch": 443} {"train_loss": -8.781820297241211, "global_step": 74524, "epoch": 443} {"train_loss": -8.858955383300781, "global_step": 74525, "epoch": 443} {"train_loss": -9.26110553741455, "global_step": 74526, "epoch": 443} {"train_loss": -9.064286231994629, "global_step": 74527, "epoch": 443} {"train_loss": -9.111614227294922, "global_step": 74528, "epoch": 443} {"train_loss": -9.074464797973633, "global_step": 74529, "epoch": 443} {"train_loss": -9.205618858337402, "global_step": 74530, "epoch": 443} {"train_loss": -8.86273193359375, "global_step": 74531, "epoch": 443} {"train_loss": -9.271072387695312, "global_step": 74532, "epoch": 443} {"train_loss": -9.056028366088867, "global_step": 74533, "epoch": 443} {"train_loss": -9.174875259399414, "global_step": 74534, "epoch": 443} {"train_loss": -9.0857515335083, "global_step": 74535, "epoch": 443} {"train_loss": -8.926074981689453, "global_step": 74536, "epoch": 443} {"train_loss": -9.285484313964844, "global_step": 74537, "epoch": 443} {"train_loss": -9.18918228149414, "global_step": 74538, "epoch": 443} {"train_loss": -9.2284574508667, "global_step": 74539, "epoch": 443} {"train_loss": -9.188724517822266, "global_step": 74540, "epoch": 443} {"train_loss": -9.540952682495117, "global_step": 74541, "epoch": 443} {"train_loss": -9.313043594360352, "global_step": 74542, "epoch": 443} {"train_loss": -9.00166130065918, "global_step": 74543, "epoch": 443} {"train_loss": -9.351158142089844, "global_step": 74544, "epoch": 443} {"train_loss": -8.896255493164062, "global_step": 74545, "epoch": 443} {"train_loss": -9.253469467163086, "global_step": 74546, "epoch": 443} {"train_loss": -9.239437103271484, "global_step": 74547, "epoch": 443} {"train_loss": -9.253907203674316, "global_step": 74548, "epoch": 443} {"train_loss": -9.172146797180176, "global_step": 74549, "epoch": 443} {"train_loss": -9.206780433654785, "global_step": 74550, "epoch": 443} {"train_loss": -9.400857925415039, "global_step": 74551, "epoch": 443} {"train_loss": -9.173859596252441, "global_step": 74552, "epoch": 443} {"train_loss": -9.39773178100586, "global_step": 74553, "epoch": 443} {"train_loss": -9.226866722106934, "global_step": 74554, "epoch": 443} {"train_loss": -9.460046768188477, "global_step": 74555, "epoch": 443} {"train_loss": -9.284869194030762, "global_step": 74556, "epoch": 443} {"train_loss": -8.639293670654297, "global_step": 74557, "epoch": 443} {"train_loss": -8.670077323913574, "global_step": 74558, "epoch": 443} {"train_loss": -9.088945388793945, "global_step": 74559, "epoch": 443} {"train_loss": -8.502935409545898, "global_step": 74560, "epoch": 443} {"train_loss": -8.888574600219727, "global_step": 74561, "epoch": 443} {"train_loss": -8.432826042175293, "global_step": 74562, "epoch": 443} {"train_loss": -8.919897079467773, "global_step": 74563, "epoch": 443} {"train_loss": -8.699811935424805, "global_step": 74564, "epoch": 443} {"train_loss": -9.163819313049316, "global_step": 74565, "epoch": 443} {"train_loss": -8.834861755371094, "global_step": 74566, "epoch": 443} {"train_loss": -8.750049591064453, "global_step": 74567, "epoch": 443} {"train_loss": -9.08407211303711, "global_step": 74568, "epoch": 443} {"train_loss": -8.85539436340332, "global_step": 74569, "epoch": 443} {"train_loss": -8.928266525268555, "global_step": 74570, "epoch": 443} {"train_loss": -9.036985397338867, "global_step": 74571, "epoch": 443} {"train_loss": -8.94461441040039, "global_step": 74572, "epoch": 443} {"train_loss": -8.885184288024902, "global_step": 74573, "epoch": 443} {"train_loss": -8.948725700378418, "global_step": 74574, "epoch": 443} {"train_loss": -8.949553489685059, "global_step": 74575, "epoch": 443} {"train_loss": -9.163394927978516, "global_step": 74576, "epoch": 443} {"train_loss": -8.768871307373047, "global_step": 74577, "epoch": 443} {"train_loss": -9.203211784362793, "global_step": 74578, "epoch": 443} {"train_loss": -9.00664234161377, "global_step": 74579, "epoch": 443} {"train_loss": -9.110000610351562, "global_step": 74580, "epoch": 443} {"train_loss": -9.142655372619629, "global_step": 74581, "epoch": 443} {"train_loss": -9.309438705444336, "global_step": 74582, "epoch": 443} {"train_loss": -8.944255828857422, "global_step": 74583, "epoch": 443} {"train_loss": -9.148488998413086, "global_step": 74584, "epoch": 443} {"train_loss": -8.841650009155273, "global_step": 74585, "epoch": 443} {"train_loss": -9.11337661743164, "global_step": 74586, "epoch": 443} {"train_loss": -8.621837615966797, "global_step": 74587, "epoch": 443} {"train_loss": -9.191129684448242, "global_step": 74588, "epoch": 443} {"train_loss": -8.842195510864258, "global_step": 74589, "epoch": 443} {"train_loss": -8.977567672729492, "global_step": 74590, "epoch": 443} {"train_loss": -9.036067888850258, "global_step": 74591, "epoch": 443, "val_loss": 194801.890625} {"train_loss": -8.878373146057129, "global_step": 74592, "epoch": 444} {"train_loss": -9.13231086730957, "global_step": 74593, "epoch": 444} {"train_loss": -8.39838981628418, "global_step": 74594, "epoch": 444} {"train_loss": -9.007034301757812, "global_step": 74595, "epoch": 444} {"train_loss": -8.600167274475098, "global_step": 74596, "epoch": 444} {"train_loss": -9.007955551147461, "global_step": 74597, "epoch": 444} {"train_loss": -8.868922233581543, "global_step": 74598, "epoch": 444} {"train_loss": -8.585199356079102, "global_step": 74599, "epoch": 444} {"train_loss": -8.835536003112793, "global_step": 74600, "epoch": 444} {"train_loss": -8.574840545654297, "global_step": 74601, "epoch": 444} {"train_loss": -8.858314514160156, "global_step": 74602, "epoch": 444} {"train_loss": -8.654233932495117, "global_step": 74603, "epoch": 444} {"train_loss": -9.091825485229492, "global_step": 74604, "epoch": 444} {"train_loss": -9.131433486938477, "global_step": 74605, "epoch": 444} {"train_loss": -8.760918617248535, "global_step": 74606, "epoch": 444} {"train_loss": -9.157000541687012, "global_step": 74607, "epoch": 444} {"train_loss": -8.875341415405273, "global_step": 74608, "epoch": 444} {"train_loss": -8.716289520263672, "global_step": 74609, "epoch": 444} {"train_loss": -8.970855712890625, "global_step": 74610, "epoch": 444} {"train_loss": -8.655428886413574, "global_step": 74611, "epoch": 444} {"train_loss": -8.904439926147461, "global_step": 74612, "epoch": 444} {"train_loss": -8.656584739685059, "global_step": 74613, "epoch": 444} {"train_loss": -8.901460647583008, "global_step": 74614, "epoch": 444} {"train_loss": -8.153366088867188, "global_step": 74615, "epoch": 444} {"train_loss": -8.929632186889648, "global_step": 74616, "epoch": 444} {"train_loss": -8.489389419555664, "global_step": 74617, "epoch": 444} {"train_loss": -8.546516418457031, "global_step": 74618, "epoch": 444} {"train_loss": -8.593442916870117, "global_step": 74619, "epoch": 444} {"train_loss": -8.441634178161621, "global_step": 74620, "epoch": 444} {"train_loss": -8.649511337280273, "global_step": 74621, "epoch": 444} {"train_loss": -8.53400707244873, "global_step": 74622, "epoch": 444} {"train_loss": -8.787928581237793, "global_step": 74623, "epoch": 444} {"train_loss": -8.762481689453125, "global_step": 74624, "epoch": 444} {"train_loss": -8.710638046264648, "global_step": 74625, "epoch": 444} {"train_loss": -8.850622177124023, "global_step": 74626, "epoch": 444} {"train_loss": -8.865470886230469, "global_step": 74627, "epoch": 444} {"train_loss": -8.884653091430664, "global_step": 74628, "epoch": 444} {"train_loss": -8.703414916992188, "global_step": 74629, "epoch": 444} {"train_loss": -8.848852157592773, "global_step": 74630, "epoch": 444} {"train_loss": -8.917221069335938, "global_step": 74631, "epoch": 444} {"train_loss": -8.931756973266602, "global_step": 74632, "epoch": 444} {"train_loss": -9.008106231689453, "global_step": 74633, "epoch": 444} {"train_loss": -8.83189582824707, "global_step": 74634, "epoch": 444} {"train_loss": -8.982986450195312, "global_step": 74635, "epoch": 444} {"train_loss": -9.082326889038086, "global_step": 74636, "epoch": 444} {"train_loss": -8.927303314208984, "global_step": 74637, "epoch": 444} {"train_loss": -8.94579029083252, "global_step": 74638, "epoch": 444} {"train_loss": -9.015034675598145, "global_step": 74639, "epoch": 444} {"train_loss": -9.278303146362305, "global_step": 74640, "epoch": 444} {"train_loss": -9.284867286682129, "global_step": 74641, "epoch": 444} {"train_loss": -9.110773086547852, "global_step": 74642, "epoch": 444} {"train_loss": -9.056184768676758, "global_step": 74643, "epoch": 444} {"train_loss": -9.234962463378906, "global_step": 74644, "epoch": 444} {"train_loss": -8.899615287780762, "global_step": 74645, "epoch": 444} {"train_loss": -9.044027328491211, "global_step": 74646, "epoch": 444} {"train_loss": -9.18139362335205, "global_step": 74647, "epoch": 444} {"train_loss": -8.954511642456055, "global_step": 74648, "epoch": 444} {"train_loss": -9.161792755126953, "global_step": 74649, "epoch": 444} {"train_loss": -9.201234817504883, "global_step": 74650, "epoch": 444} {"train_loss": -9.204201698303223, "global_step": 74651, "epoch": 444} {"train_loss": -9.235246658325195, "global_step": 74652, "epoch": 444} {"train_loss": -8.896890640258789, "global_step": 74653, "epoch": 444} {"train_loss": -9.209339141845703, "global_step": 74654, "epoch": 444} {"train_loss": -8.842869758605957, "global_step": 74655, "epoch": 444} {"train_loss": -9.181587219238281, "global_step": 74656, "epoch": 444} {"train_loss": -8.949677467346191, "global_step": 74657, "epoch": 444} {"train_loss": -9.168460845947266, "global_step": 74658, "epoch": 444} {"train_loss": -9.082365036010742, "global_step": 74659, "epoch": 444} {"train_loss": -9.051249504089355, "global_step": 74660, "epoch": 444} {"train_loss": -9.139871597290039, "global_step": 74661, "epoch": 444} {"train_loss": -9.134905815124512, "global_step": 74662, "epoch": 444} {"train_loss": -9.045555114746094, "global_step": 74663, "epoch": 444} {"train_loss": -9.157852172851562, "global_step": 74664, "epoch": 444} {"train_loss": -8.83135986328125, "global_step": 74665, "epoch": 444} {"train_loss": -8.85174560546875, "global_step": 74666, "epoch": 444} {"train_loss": -9.137411117553711, "global_step": 74667, "epoch": 444} {"train_loss": -9.151549339294434, "global_step": 74668, "epoch": 444} {"train_loss": -9.15350341796875, "global_step": 74669, "epoch": 444} {"train_loss": -8.980427742004395, "global_step": 74670, "epoch": 444} {"train_loss": -8.9739990234375, "global_step": 74671, "epoch": 444} {"train_loss": -9.189680099487305, "global_step": 74672, "epoch": 444} {"train_loss": -9.116718292236328, "global_step": 74673, "epoch": 444} {"train_loss": -8.768024444580078, "global_step": 74674, "epoch": 444} {"train_loss": -9.222786903381348, "global_step": 74675, "epoch": 444} {"train_loss": -9.055191040039062, "global_step": 74676, "epoch": 444} {"train_loss": -9.122718811035156, "global_step": 74677, "epoch": 444} {"train_loss": -8.87988567352295, "global_step": 74678, "epoch": 444} {"train_loss": -9.149895668029785, "global_step": 74679, "epoch": 444} {"train_loss": -9.00855827331543, "global_step": 74680, "epoch": 444} {"train_loss": -9.200572967529297, "global_step": 74681, "epoch": 444} {"train_loss": -9.245198249816895, "global_step": 74682, "epoch": 444} {"train_loss": -8.907241821289062, "global_step": 74683, "epoch": 444} {"train_loss": -9.054662704467773, "global_step": 74684, "epoch": 444} {"train_loss": -8.886343002319336, "global_step": 74685, "epoch": 444} {"train_loss": -8.867633819580078, "global_step": 74686, "epoch": 444} {"train_loss": -8.893453598022461, "global_step": 74687, "epoch": 444} {"train_loss": -8.964116096496582, "global_step": 74688, "epoch": 444} {"train_loss": -8.652303695678711, "global_step": 74689, "epoch": 444} {"train_loss": -8.732792854309082, "global_step": 74690, "epoch": 444} {"train_loss": -8.722023010253906, "global_step": 74691, "epoch": 444} {"train_loss": -8.515016555786133, "global_step": 74692, "epoch": 444} {"train_loss": -8.957521438598633, "global_step": 74693, "epoch": 444} {"train_loss": -8.915631294250488, "global_step": 74694, "epoch": 444} {"train_loss": -8.681217193603516, "global_step": 74695, "epoch": 444} {"train_loss": -8.983207702636719, "global_step": 74696, "epoch": 444} {"train_loss": -8.947874069213867, "global_step": 74697, "epoch": 444} {"train_loss": -9.012519836425781, "global_step": 74698, "epoch": 444} {"train_loss": -8.931772232055664, "global_step": 74699, "epoch": 444} {"train_loss": -8.785806655883789, "global_step": 74700, "epoch": 444} {"train_loss": -9.158622741699219, "global_step": 74701, "epoch": 444} {"train_loss": -8.972431182861328, "global_step": 74702, "epoch": 444} {"train_loss": -9.099410057067871, "global_step": 74703, "epoch": 444} {"train_loss": -9.149714469909668, "global_step": 74704, "epoch": 444} {"train_loss": -9.204874992370605, "global_step": 74705, "epoch": 444} {"train_loss": -9.156604766845703, "global_step": 74706, "epoch": 444} {"train_loss": -9.068685531616211, "global_step": 74707, "epoch": 444} {"train_loss": -9.096461296081543, "global_step": 74708, "epoch": 444} {"train_loss": -9.036182403564453, "global_step": 74709, "epoch": 444} {"train_loss": -8.98283863067627, "global_step": 74710, "epoch": 444} {"train_loss": -9.174935340881348, "global_step": 74711, "epoch": 444} {"train_loss": -8.794960975646973, "global_step": 74712, "epoch": 444} {"train_loss": -9.118284225463867, "global_step": 74713, "epoch": 444} {"train_loss": -9.204879760742188, "global_step": 74714, "epoch": 444} {"train_loss": -8.90821647644043, "global_step": 74715, "epoch": 444} {"train_loss": -9.243154525756836, "global_step": 74716, "epoch": 444} {"train_loss": -8.988591194152832, "global_step": 74717, "epoch": 444} {"train_loss": -9.061025619506836, "global_step": 74718, "epoch": 444} {"train_loss": -9.340282440185547, "global_step": 74719, "epoch": 444} {"train_loss": -8.950281143188477, "global_step": 74720, "epoch": 444} {"train_loss": -9.111627578735352, "global_step": 74721, "epoch": 444} {"train_loss": -9.212475776672363, "global_step": 74722, "epoch": 444} {"train_loss": -9.165881156921387, "global_step": 74723, "epoch": 444} {"train_loss": -9.033148765563965, "global_step": 74724, "epoch": 444} {"train_loss": -9.074281692504883, "global_step": 74725, "epoch": 444} {"train_loss": -9.136470794677734, "global_step": 74726, "epoch": 444} {"train_loss": -9.057979583740234, "global_step": 74727, "epoch": 444} {"train_loss": -9.072000503540039, "global_step": 74728, "epoch": 444} {"train_loss": -9.283753395080566, "global_step": 74729, "epoch": 444} {"train_loss": -9.201417922973633, "global_step": 74730, "epoch": 444} {"train_loss": -9.183049201965332, "global_step": 74731, "epoch": 444} {"train_loss": -8.949499130249023, "global_step": 74732, "epoch": 444} {"train_loss": -9.231553077697754, "global_step": 74733, "epoch": 444} {"train_loss": -9.145930290222168, "global_step": 74734, "epoch": 444} {"train_loss": -8.973007202148438, "global_step": 74735, "epoch": 444} {"train_loss": -9.370352745056152, "global_step": 74736, "epoch": 444} {"train_loss": -9.1492338180542, "global_step": 74737, "epoch": 444} {"train_loss": -9.093425750732422, "global_step": 74738, "epoch": 444} {"train_loss": -9.224496841430664, "global_step": 74739, "epoch": 444} {"train_loss": -8.81560230255127, "global_step": 74740, "epoch": 444} {"train_loss": -9.38485050201416, "global_step": 74741, "epoch": 444} {"train_loss": -9.01196575164795, "global_step": 74742, "epoch": 444} {"train_loss": -8.944475173950195, "global_step": 74743, "epoch": 444} {"train_loss": -9.13261604309082, "global_step": 74744, "epoch": 444} {"train_loss": -9.041419982910156, "global_step": 74745, "epoch": 444} {"train_loss": -9.179571151733398, "global_step": 74746, "epoch": 444} {"train_loss": -9.117494583129883, "global_step": 74747, "epoch": 444} {"train_loss": -8.922016143798828, "global_step": 74748, "epoch": 444} {"train_loss": -9.062372207641602, "global_step": 74749, "epoch": 444} {"train_loss": -9.005794525146484, "global_step": 74750, "epoch": 444} {"train_loss": -8.750785827636719, "global_step": 74751, "epoch": 444} {"train_loss": -8.992166519165039, "global_step": 74752, "epoch": 444} {"train_loss": -8.966011047363281, "global_step": 74753, "epoch": 444} {"train_loss": -8.723332405090332, "global_step": 74754, "epoch": 444} {"train_loss": -9.197525978088379, "global_step": 74755, "epoch": 444} {"train_loss": -8.724982261657715, "global_step": 74756, "epoch": 444} {"train_loss": -8.97689437866211, "global_step": 74757, "epoch": 444} {"train_loss": -9.039599418640137, "global_step": 74758, "epoch": 444} {"train_loss": -8.974216540654501, "global_step": 74759, "epoch": 444, "val_loss": 197055.21875} {"train_loss": -8.941186904907227, "global_step": 74760, "epoch": 445} {"train_loss": -8.478163719177246, "global_step": 74761, "epoch": 445} {"train_loss": -9.005324363708496, "global_step": 74762, "epoch": 445} {"train_loss": -8.713282585144043, "global_step": 74763, "epoch": 445} {"train_loss": -8.671262741088867, "global_step": 74764, "epoch": 445} {"train_loss": -8.695171356201172, "global_step": 74765, "epoch": 445} {"train_loss": -8.785743713378906, "global_step": 74766, "epoch": 445} {"train_loss": -8.604307174682617, "global_step": 74767, "epoch": 445} {"train_loss": -8.740039825439453, "global_step": 74768, "epoch": 445} {"train_loss": -8.988690376281738, "global_step": 74769, "epoch": 445} {"train_loss": -8.526749610900879, "global_step": 74770, "epoch": 445} {"train_loss": -9.11090087890625, "global_step": 74771, "epoch": 445} {"train_loss": -8.993109703063965, "global_step": 74772, "epoch": 445} {"train_loss": -8.90765380859375, "global_step": 74773, "epoch": 445} {"train_loss": -9.001154899597168, "global_step": 74774, "epoch": 445} {"train_loss": -8.942956924438477, "global_step": 74775, "epoch": 445} {"train_loss": -8.934429168701172, "global_step": 74776, "epoch": 445} {"train_loss": -9.099919319152832, "global_step": 74777, "epoch": 445} {"train_loss": -9.105148315429688, "global_step": 74778, "epoch": 445} {"train_loss": -9.206562042236328, "global_step": 74779, "epoch": 445} {"train_loss": -8.82322883605957, "global_step": 74780, "epoch": 445} {"train_loss": -9.193471908569336, "global_step": 74781, "epoch": 445} {"train_loss": -9.091193199157715, "global_step": 74782, "epoch": 445} {"train_loss": -9.427334785461426, "global_step": 74783, "epoch": 445} {"train_loss": -9.143075942993164, "global_step": 74784, "epoch": 445} {"train_loss": -9.1682767868042, "global_step": 74785, "epoch": 445} {"train_loss": -8.98379898071289, "global_step": 74786, "epoch": 445} {"train_loss": -9.224449157714844, "global_step": 74787, "epoch": 445} {"train_loss": -8.822797775268555, "global_step": 74788, "epoch": 445} {"train_loss": -8.999092102050781, "global_step": 74789, "epoch": 445} {"train_loss": -8.807596206665039, "global_step": 74790, "epoch": 445} {"train_loss": -9.07612133026123, "global_step": 74791, "epoch": 445} {"train_loss": -8.977059364318848, "global_step": 74792, "epoch": 445} {"train_loss": -9.236298561096191, "global_step": 74793, "epoch": 445} {"train_loss": -9.001733779907227, "global_step": 74794, "epoch": 445} {"train_loss": -8.967578887939453, "global_step": 74795, "epoch": 445} {"train_loss": -9.116928100585938, "global_step": 74796, "epoch": 445} {"train_loss": -8.730117797851562, "global_step": 74797, "epoch": 445} {"train_loss": -9.192829132080078, "global_step": 74798, "epoch": 445} {"train_loss": -9.064903259277344, "global_step": 74799, "epoch": 445} {"train_loss": -9.066490173339844, "global_step": 74800, "epoch": 445} {"train_loss": -9.025543212890625, "global_step": 74801, "epoch": 445} {"train_loss": -8.80656909942627, "global_step": 74802, "epoch": 445} {"train_loss": -9.271434783935547, "global_step": 74803, "epoch": 445} {"train_loss": -9.067076683044434, "global_step": 74804, "epoch": 445} {"train_loss": -8.928979873657227, "global_step": 74805, "epoch": 445} {"train_loss": -8.977901458740234, "global_step": 74806, "epoch": 445} {"train_loss": -8.392745971679688, "global_step": 74807, "epoch": 445} {"train_loss": -8.97098159790039, "global_step": 74808, "epoch": 445} {"train_loss": -8.524181365966797, "global_step": 74809, "epoch": 445} {"train_loss": -9.113383293151855, "global_step": 74810, "epoch": 445} {"train_loss": -8.848413467407227, "global_step": 74811, "epoch": 445} {"train_loss": -8.895052909851074, "global_step": 74812, "epoch": 445} {"train_loss": -9.172603607177734, "global_step": 74813, "epoch": 445} {"train_loss": -8.783415794372559, "global_step": 74814, "epoch": 445} {"train_loss": -8.981531143188477, "global_step": 74815, "epoch": 445} {"train_loss": -9.163256645202637, "global_step": 74816, "epoch": 445} {"train_loss": -9.077831268310547, "global_step": 74817, "epoch": 445} {"train_loss": -9.09637451171875, "global_step": 74818, "epoch": 445} {"train_loss": -8.952542304992676, "global_step": 74819, "epoch": 445} {"train_loss": -9.124536514282227, "global_step": 74820, "epoch": 445} {"train_loss": -9.006414413452148, "global_step": 74821, "epoch": 445} {"train_loss": -8.968378067016602, "global_step": 74822, "epoch": 445} {"train_loss": -9.355581283569336, "global_step": 74823, "epoch": 445} {"train_loss": -8.812711715698242, "global_step": 74824, "epoch": 445} {"train_loss": -9.26972770690918, "global_step": 74825, "epoch": 445} {"train_loss": -9.21084213256836, "global_step": 74826, "epoch": 445} {"train_loss": -8.748916625976562, "global_step": 74827, "epoch": 445} {"train_loss": -9.13118839263916, "global_step": 74828, "epoch": 445} {"train_loss": -8.702432632446289, "global_step": 74829, "epoch": 445} {"train_loss": -9.116556167602539, "global_step": 74830, "epoch": 445} {"train_loss": -8.775518417358398, "global_step": 74831, "epoch": 445} {"train_loss": -9.106292724609375, "global_step": 74832, "epoch": 445} {"train_loss": -8.922470092773438, "global_step": 74833, "epoch": 445} {"train_loss": -8.871040344238281, "global_step": 74834, "epoch": 445} {"train_loss": -8.822149276733398, "global_step": 74835, "epoch": 445} {"train_loss": -8.95913314819336, "global_step": 74836, "epoch": 445} {"train_loss": -9.184417724609375, "global_step": 74837, "epoch": 445} {"train_loss": -9.086057662963867, "global_step": 74838, "epoch": 445} {"train_loss": -8.702974319458008, "global_step": 74839, "epoch": 445} {"train_loss": -8.949395179748535, "global_step": 74840, "epoch": 445} {"train_loss": -9.02023983001709, "global_step": 74841, "epoch": 445} {"train_loss": -9.044867515563965, "global_step": 74842, "epoch": 445} {"train_loss": -8.84891128540039, "global_step": 74843, "epoch": 445} {"train_loss": -9.108838081359863, "global_step": 74844, "epoch": 445} {"train_loss": -8.934032440185547, "global_step": 74845, "epoch": 445} {"train_loss": -9.000438690185547, "global_step": 74846, "epoch": 445} {"train_loss": -8.941286087036133, "global_step": 74847, "epoch": 445} {"train_loss": -9.245004653930664, "global_step": 74848, "epoch": 445} {"train_loss": -8.93798828125, "global_step": 74849, "epoch": 445} {"train_loss": -9.327384948730469, "global_step": 74850, "epoch": 445} {"train_loss": -8.73051643371582, "global_step": 74851, "epoch": 445} {"train_loss": -9.01480484008789, "global_step": 74852, "epoch": 445} {"train_loss": -9.080612182617188, "global_step": 74853, "epoch": 445} {"train_loss": -8.834514617919922, "global_step": 74854, "epoch": 445} {"train_loss": -8.850707054138184, "global_step": 74855, "epoch": 445} {"train_loss": -8.778360366821289, "global_step": 74856, "epoch": 445} {"train_loss": -8.852090835571289, "global_step": 74857, "epoch": 445} {"train_loss": -8.70861530303955, "global_step": 74858, "epoch": 445} {"train_loss": -8.891462326049805, "global_step": 74859, "epoch": 445} {"train_loss": -8.991689682006836, "global_step": 74860, "epoch": 445} {"train_loss": -9.0213041305542, "global_step": 74861, "epoch": 445} {"train_loss": -8.921344757080078, "global_step": 74862, "epoch": 445} {"train_loss": -8.924535751342773, "global_step": 74863, "epoch": 445} {"train_loss": -8.964818000793457, "global_step": 74864, "epoch": 445} {"train_loss": -9.140168190002441, "global_step": 74865, "epoch": 445} {"train_loss": -9.12641716003418, "global_step": 74866, "epoch": 445} {"train_loss": -8.706104278564453, "global_step": 74867, "epoch": 445} {"train_loss": -9.140819549560547, "global_step": 74868, "epoch": 445} {"train_loss": -8.96906852722168, "global_step": 74869, "epoch": 445} {"train_loss": -8.969681739807129, "global_step": 74870, "epoch": 445} {"train_loss": -8.816384315490723, "global_step": 74871, "epoch": 445} {"train_loss": -9.012523651123047, "global_step": 74872, "epoch": 445} {"train_loss": -9.064077377319336, "global_step": 74873, "epoch": 445} {"train_loss": -9.03797721862793, "global_step": 74874, "epoch": 445} {"train_loss": -8.83432388305664, "global_step": 74875, "epoch": 445} {"train_loss": -8.741170883178711, "global_step": 74876, "epoch": 445} {"train_loss": -8.961346626281738, "global_step": 74877, "epoch": 445} {"train_loss": -9.266502380371094, "global_step": 74878, "epoch": 445} {"train_loss": -9.077495574951172, "global_step": 74879, "epoch": 445} {"train_loss": -9.133550643920898, "global_step": 74880, "epoch": 445} {"train_loss": -8.92097282409668, "global_step": 74881, "epoch": 445} {"train_loss": -8.88453483581543, "global_step": 74882, "epoch": 445} {"train_loss": -8.967203140258789, "global_step": 74883, "epoch": 445} {"train_loss": -8.882769584655762, "global_step": 74884, "epoch": 445} {"train_loss": -8.557332992553711, "global_step": 74885, "epoch": 445} {"train_loss": -9.171310424804688, "global_step": 74886, "epoch": 445} {"train_loss": -8.85944938659668, "global_step": 74887, "epoch": 445} {"train_loss": -8.981386184692383, "global_step": 74888, "epoch": 445} {"train_loss": -9.086939811706543, "global_step": 74889, "epoch": 445} {"train_loss": -9.110342025756836, "global_step": 74890, "epoch": 445} {"train_loss": -9.030267715454102, "global_step": 74891, "epoch": 445} {"train_loss": -9.005426406860352, "global_step": 74892, "epoch": 445} {"train_loss": -9.148601531982422, "global_step": 74893, "epoch": 445} {"train_loss": -9.04688835144043, "global_step": 74894, "epoch": 445} {"train_loss": -8.954843521118164, "global_step": 74895, "epoch": 445} {"train_loss": -9.00178337097168, "global_step": 74896, "epoch": 445} {"train_loss": -8.951343536376953, "global_step": 74897, "epoch": 445} {"train_loss": -9.275497436523438, "global_step": 74898, "epoch": 445} {"train_loss": -8.928802490234375, "global_step": 74899, "epoch": 445} {"train_loss": -9.134211540222168, "global_step": 74900, "epoch": 445} {"train_loss": -9.230026245117188, "global_step": 74901, "epoch": 445} {"train_loss": -9.009584426879883, "global_step": 74902, "epoch": 445} {"train_loss": -8.96855354309082, "global_step": 74903, "epoch": 445} {"train_loss": -9.20085334777832, "global_step": 74904, "epoch": 445} {"train_loss": -9.393232345581055, "global_step": 74905, "epoch": 445} {"train_loss": -9.021448135375977, "global_step": 74906, "epoch": 445} {"train_loss": -9.041749954223633, "global_step": 74907, "epoch": 445} {"train_loss": -9.026668548583984, "global_step": 74908, "epoch": 445} {"train_loss": -9.14005184173584, "global_step": 74909, "epoch": 445} {"train_loss": -9.086921691894531, "global_step": 74910, "epoch": 445} {"train_loss": -9.266358375549316, "global_step": 74911, "epoch": 445} {"train_loss": -8.538515090942383, "global_step": 74912, "epoch": 445} {"train_loss": -9.196722030639648, "global_step": 74913, "epoch": 445} {"train_loss": -8.865267753601074, "global_step": 74914, "epoch": 445} {"train_loss": -9.0645751953125, "global_step": 74915, "epoch": 445} {"train_loss": -8.874530792236328, "global_step": 74916, "epoch": 445} {"train_loss": -8.735175132751465, "global_step": 74917, "epoch": 445} {"train_loss": -8.61124324798584, "global_step": 74918, "epoch": 445} {"train_loss": -8.960659980773926, "global_step": 74919, "epoch": 445} {"train_loss": -8.563612937927246, "global_step": 74920, "epoch": 445} {"train_loss": -8.88548469543457, "global_step": 74921, "epoch": 445} {"train_loss": -8.71593952178955, "global_step": 74922, "epoch": 445} {"train_loss": -8.952040672302246, "global_step": 74923, "epoch": 445} {"train_loss": -8.816673278808594, "global_step": 74924, "epoch": 445} {"train_loss": -8.789236068725586, "global_step": 74925, "epoch": 445} {"train_loss": -8.798065185546875, "global_step": 74926, "epoch": 445} {"train_loss": -8.970662996882485, "global_step": 74927, "epoch": 445, "val_loss": 197253.4375, "train_action_mse_error": 8.125621795654297} {"train_loss": -9.126953125, "global_step": 74928, "epoch": 446} {"train_loss": -8.919344902038574, "global_step": 74929, "epoch": 446} {"train_loss": -9.13283920288086, "global_step": 74930, "epoch": 446} {"train_loss": -9.118403434753418, "global_step": 74931, "epoch": 446} {"train_loss": -9.254562377929688, "global_step": 74932, "epoch": 446} {"train_loss": -9.099495887756348, "global_step": 74933, "epoch": 446} {"train_loss": -8.914082527160645, "global_step": 74934, "epoch": 446} {"train_loss": -9.240813255310059, "global_step": 74935, "epoch": 446} {"train_loss": -8.962617874145508, "global_step": 74936, "epoch": 446} {"train_loss": -8.923208236694336, "global_step": 74937, "epoch": 446} {"train_loss": -8.876895904541016, "global_step": 74938, "epoch": 446} {"train_loss": -8.877771377563477, "global_step": 74939, "epoch": 446} {"train_loss": -8.910932540893555, "global_step": 74940, "epoch": 446} {"train_loss": -9.212106704711914, "global_step": 74941, "epoch": 446} {"train_loss": -9.080536842346191, "global_step": 74942, "epoch": 446} {"train_loss": -9.326408386230469, "global_step": 74943, "epoch": 446} {"train_loss": -9.08829116821289, "global_step": 74944, "epoch": 446} {"train_loss": -9.137397766113281, "global_step": 74945, "epoch": 446} {"train_loss": -9.144969940185547, "global_step": 74946, "epoch": 446} {"train_loss": -9.207277297973633, "global_step": 74947, "epoch": 446} {"train_loss": -9.032915115356445, "global_step": 74948, "epoch": 446} {"train_loss": -8.965470314025879, "global_step": 74949, "epoch": 446} {"train_loss": -9.116551399230957, "global_step": 74950, "epoch": 446} {"train_loss": -9.130443572998047, "global_step": 74951, "epoch": 446} {"train_loss": -9.018851280212402, "global_step": 74952, "epoch": 446} {"train_loss": -9.319051742553711, "global_step": 74953, "epoch": 446} {"train_loss": -9.052967071533203, "global_step": 74954, "epoch": 446} {"train_loss": -9.285863876342773, "global_step": 74955, "epoch": 446} {"train_loss": -8.995502471923828, "global_step": 74956, "epoch": 446} {"train_loss": -9.002098083496094, "global_step": 74957, "epoch": 446} {"train_loss": -9.297917366027832, "global_step": 74958, "epoch": 446} {"train_loss": -9.08594799041748, "global_step": 74959, "epoch": 446} {"train_loss": -9.11567211151123, "global_step": 74960, "epoch": 446} {"train_loss": -9.011754035949707, "global_step": 74961, "epoch": 446} {"train_loss": -8.909290313720703, "global_step": 74962, "epoch": 446} {"train_loss": -9.330389022827148, "global_step": 74963, "epoch": 446} {"train_loss": -9.282255172729492, "global_step": 74964, "epoch": 446} {"train_loss": -9.281570434570312, "global_step": 74965, "epoch": 446} {"train_loss": -9.456464767456055, "global_step": 74966, "epoch": 446} {"train_loss": -9.050661087036133, "global_step": 74967, "epoch": 446} {"train_loss": -9.55810546875, "global_step": 74968, "epoch": 446} {"train_loss": -8.889021873474121, "global_step": 74969, "epoch": 446} {"train_loss": -9.194709777832031, "global_step": 74970, "epoch": 446} {"train_loss": -9.096378326416016, "global_step": 74971, "epoch": 446} {"train_loss": -9.088578224182129, "global_step": 74972, "epoch": 446} {"train_loss": -9.023965835571289, "global_step": 74973, "epoch": 446} {"train_loss": -9.294367790222168, "global_step": 74974, "epoch": 446} {"train_loss": -9.167928695678711, "global_step": 74975, "epoch": 446} {"train_loss": -8.937760353088379, "global_step": 74976, "epoch": 446} {"train_loss": -8.825321197509766, "global_step": 74977, "epoch": 446} {"train_loss": -8.931310653686523, "global_step": 74978, "epoch": 446} {"train_loss": -8.966653823852539, "global_step": 74979, "epoch": 446} {"train_loss": -9.088726043701172, "global_step": 74980, "epoch": 446} {"train_loss": -9.027612686157227, "global_step": 74981, "epoch": 446} {"train_loss": -9.122488975524902, "global_step": 74982, "epoch": 446} {"train_loss": -9.010679244995117, "global_step": 74983, "epoch": 446} {"train_loss": -9.183907508850098, "global_step": 74984, "epoch": 446} {"train_loss": -9.24681282043457, "global_step": 74985, "epoch": 446} {"train_loss": -9.127220153808594, "global_step": 74986, "epoch": 446} {"train_loss": -8.86886215209961, "global_step": 74987, "epoch": 446} {"train_loss": -9.161102294921875, "global_step": 74988, "epoch": 446} {"train_loss": -9.048468589782715, "global_step": 74989, "epoch": 446} {"train_loss": -8.932188987731934, "global_step": 74990, "epoch": 446} {"train_loss": -8.800418853759766, "global_step": 74991, "epoch": 446} {"train_loss": -8.968113899230957, "global_step": 74992, "epoch": 446} {"train_loss": -9.090503692626953, "global_step": 74993, "epoch": 446} {"train_loss": -8.997403144836426, "global_step": 74994, "epoch": 446} {"train_loss": -9.357404708862305, "global_step": 74995, "epoch": 446} {"train_loss": -9.181100845336914, "global_step": 74996, "epoch": 446} {"train_loss": -9.049267768859863, "global_step": 74997, "epoch": 446} {"train_loss": -9.005434036254883, "global_step": 74998, "epoch": 446} {"train_loss": -8.978923797607422, "global_step": 74999, "epoch": 446} {"train_loss": -8.982538223266602, "global_step": 75000, "epoch": 446} {"train_loss": -9.265068054199219, "global_step": 75001, "epoch": 446} {"train_loss": -9.241077423095703, "global_step": 75002, "epoch": 446} {"train_loss": -9.184078216552734, "global_step": 75003, "epoch": 446} {"train_loss": -9.080133438110352, "global_step": 75004, "epoch": 446} {"train_loss": -9.234466552734375, "global_step": 75005, "epoch": 446} {"train_loss": -9.178936958312988, "global_step": 75006, "epoch": 446} {"train_loss": -9.13962459564209, "global_step": 75007, "epoch": 446} {"train_loss": -9.11428165435791, "global_step": 75008, "epoch": 446} {"train_loss": -9.19897174835205, "global_step": 75009, "epoch": 446} {"train_loss": -9.053836822509766, "global_step": 75010, "epoch": 446} {"train_loss": -9.156005859375, "global_step": 75011, "epoch": 446} {"train_loss": -9.13176155090332, "global_step": 75012, "epoch": 446} {"train_loss": -9.013425827026367, "global_step": 75013, "epoch": 446} {"train_loss": -9.339664459228516, "global_step": 75014, "epoch": 446} {"train_loss": -8.87421989440918, "global_step": 75015, "epoch": 446} {"train_loss": -8.871099472045898, "global_step": 75016, "epoch": 446} {"train_loss": -8.991695404052734, "global_step": 75017, "epoch": 446} {"train_loss": -9.036694526672363, "global_step": 75018, "epoch": 446} {"train_loss": -8.980226516723633, "global_step": 75019, "epoch": 446} {"train_loss": -9.211933135986328, "global_step": 75020, "epoch": 446} {"train_loss": -9.118199348449707, "global_step": 75021, "epoch": 446} {"train_loss": -8.988870620727539, "global_step": 75022, "epoch": 446} {"train_loss": -8.930585861206055, "global_step": 75023, "epoch": 446} {"train_loss": -8.894295692443848, "global_step": 75024, "epoch": 446} {"train_loss": -8.495696067810059, "global_step": 75025, "epoch": 446} {"train_loss": -9.142126083374023, "global_step": 75026, "epoch": 446} {"train_loss": -9.021635055541992, "global_step": 75027, "epoch": 446} {"train_loss": -8.871946334838867, "global_step": 75028, "epoch": 446} {"train_loss": -8.68076229095459, "global_step": 75029, "epoch": 446} {"train_loss": -8.713663101196289, "global_step": 75030, "epoch": 446} {"train_loss": -9.052574157714844, "global_step": 75031, "epoch": 446} {"train_loss": -8.91957950592041, "global_step": 75032, "epoch": 446} {"train_loss": -8.866140365600586, "global_step": 75033, "epoch": 446} {"train_loss": -9.058649063110352, "global_step": 75034, "epoch": 446} {"train_loss": -9.063164710998535, "global_step": 75035, "epoch": 446} {"train_loss": -9.050190925598145, "global_step": 75036, "epoch": 446} {"train_loss": -8.822542190551758, "global_step": 75037, "epoch": 446} {"train_loss": -9.183944702148438, "global_step": 75038, "epoch": 446} {"train_loss": -9.006816864013672, "global_step": 75039, "epoch": 446} {"train_loss": -9.10501480102539, "global_step": 75040, "epoch": 446} {"train_loss": -9.180253028869629, "global_step": 75041, "epoch": 446} {"train_loss": -9.11782455444336, "global_step": 75042, "epoch": 446} {"train_loss": -9.043548583984375, "global_step": 75043, "epoch": 446} {"train_loss": -9.177745819091797, "global_step": 75044, "epoch": 446} {"train_loss": -9.237085342407227, "global_step": 75045, "epoch": 446} {"train_loss": -9.208772659301758, "global_step": 75046, "epoch": 446} {"train_loss": -9.1967191696167, "global_step": 75047, "epoch": 446} {"train_loss": -9.369979858398438, "global_step": 75048, "epoch": 446} {"train_loss": -8.86229133605957, "global_step": 75049, "epoch": 446} {"train_loss": -9.030330657958984, "global_step": 75050, "epoch": 446} {"train_loss": -8.769889831542969, "global_step": 75051, "epoch": 446} {"train_loss": -9.241080284118652, "global_step": 75052, "epoch": 446} {"train_loss": -9.250748634338379, "global_step": 75053, "epoch": 446} {"train_loss": -9.0213041305542, "global_step": 75054, "epoch": 446} {"train_loss": -9.24940299987793, "global_step": 75055, "epoch": 446} {"train_loss": -8.746294975280762, "global_step": 75056, "epoch": 446} {"train_loss": -8.985015869140625, "global_step": 75057, "epoch": 446} {"train_loss": -8.68224048614502, "global_step": 75058, "epoch": 446} {"train_loss": -8.790233612060547, "global_step": 75059, "epoch": 446} {"train_loss": -8.652484893798828, "global_step": 75060, "epoch": 446} {"train_loss": -8.84227180480957, "global_step": 75061, "epoch": 446} {"train_loss": -8.962482452392578, "global_step": 75062, "epoch": 446} {"train_loss": -9.012779235839844, "global_step": 75063, "epoch": 446} {"train_loss": -8.601436614990234, "global_step": 75064, "epoch": 446} {"train_loss": -8.9717378616333, "global_step": 75065, "epoch": 446} {"train_loss": -8.900187492370605, "global_step": 75066, "epoch": 446} {"train_loss": -8.847140312194824, "global_step": 75067, "epoch": 446} {"train_loss": -8.945568084716797, "global_step": 75068, "epoch": 446} {"train_loss": -9.04767894744873, "global_step": 75069, "epoch": 446} {"train_loss": -8.809394836425781, "global_step": 75070, "epoch": 446} {"train_loss": -9.001411437988281, "global_step": 75071, "epoch": 446} {"train_loss": -9.309381484985352, "global_step": 75072, "epoch": 446} {"train_loss": -8.932352066040039, "global_step": 75073, "epoch": 446} {"train_loss": -9.042537689208984, "global_step": 75074, "epoch": 446} {"train_loss": -9.14599895477295, "global_step": 75075, "epoch": 446} {"train_loss": -9.011714935302734, "global_step": 75076, "epoch": 446} {"train_loss": -9.170663833618164, "global_step": 75077, "epoch": 446} {"train_loss": -9.102554321289062, "global_step": 75078, "epoch": 446} {"train_loss": -9.00523567199707, "global_step": 75079, "epoch": 446} {"train_loss": -8.978736877441406, "global_step": 75080, "epoch": 446} {"train_loss": -8.810470581054688, "global_step": 75081, "epoch": 446} {"train_loss": -9.067021369934082, "global_step": 75082, "epoch": 446} {"train_loss": -8.97753620147705, "global_step": 75083, "epoch": 446} {"train_loss": -8.860590934753418, "global_step": 75084, "epoch": 446} {"train_loss": -8.97225570678711, "global_step": 75085, "epoch": 446} {"train_loss": -8.805746078491211, "global_step": 75086, "epoch": 446} {"train_loss": -9.024129867553711, "global_step": 75087, "epoch": 446} {"train_loss": -8.941909790039062, "global_step": 75088, "epoch": 446} {"train_loss": -8.8817138671875, "global_step": 75089, "epoch": 446} {"train_loss": -8.800286293029785, "global_step": 75090, "epoch": 446} {"train_loss": -9.055313110351562, "global_step": 75091, "epoch": 446} {"train_loss": -9.157249450683594, "global_step": 75092, "epoch": 446} {"train_loss": -8.92892074584961, "global_step": 75093, "epoch": 446} {"train_loss": -8.921806335449219, "global_step": 75094, "epoch": 446} {"train_loss": -9.045577060608636, "global_step": 75095, "epoch": 446, "val_loss": 196090.078125} {"train_loss": -8.822331428527832, "global_step": 75096, "epoch": 447} {"train_loss": -8.843318939208984, "global_step": 75097, "epoch": 447} {"train_loss": -9.09796142578125, "global_step": 75098, "epoch": 447} {"train_loss": -8.640462875366211, "global_step": 75099, "epoch": 447} {"train_loss": -9.006027221679688, "global_step": 75100, "epoch": 447} {"train_loss": -9.056567192077637, "global_step": 75101, "epoch": 447} {"train_loss": -8.909501075744629, "global_step": 75102, "epoch": 447} {"train_loss": -8.799299240112305, "global_step": 75103, "epoch": 447} {"train_loss": -8.794578552246094, "global_step": 75104, "epoch": 447} {"train_loss": -9.1343412399292, "global_step": 75105, "epoch": 447} {"train_loss": -9.059334754943848, "global_step": 75106, "epoch": 447} {"train_loss": -8.931041717529297, "global_step": 75107, "epoch": 447} {"train_loss": -8.976434707641602, "global_step": 75108, "epoch": 447} {"train_loss": -8.87885570526123, "global_step": 75109, "epoch": 447} {"train_loss": -8.787135124206543, "global_step": 75110, "epoch": 447} {"train_loss": -9.077470779418945, "global_step": 75111, "epoch": 447} {"train_loss": -9.102340698242188, "global_step": 75112, "epoch": 447} {"train_loss": -8.857400894165039, "global_step": 75113, "epoch": 447} {"train_loss": -8.99307632446289, "global_step": 75114, "epoch": 447} {"train_loss": -9.151224136352539, "global_step": 75115, "epoch": 447} {"train_loss": -9.064221382141113, "global_step": 75116, "epoch": 447} {"train_loss": -8.837747573852539, "global_step": 75117, "epoch": 447} {"train_loss": -8.935243606567383, "global_step": 75118, "epoch": 447} {"train_loss": -9.04787540435791, "global_step": 75119, "epoch": 447} {"train_loss": -8.906220436096191, "global_step": 75120, "epoch": 447} {"train_loss": -9.030464172363281, "global_step": 75121, "epoch": 447} {"train_loss": -8.887947082519531, "global_step": 75122, "epoch": 447} {"train_loss": -9.033398628234863, "global_step": 75123, "epoch": 447} {"train_loss": -8.634270668029785, "global_step": 75124, "epoch": 447} {"train_loss": -8.996468544006348, "global_step": 75125, "epoch": 447} {"train_loss": -8.958019256591797, "global_step": 75126, "epoch": 447} {"train_loss": -8.916315078735352, "global_step": 75127, "epoch": 447} {"train_loss": -9.036760330200195, "global_step": 75128, "epoch": 447} {"train_loss": -9.126774787902832, "global_step": 75129, "epoch": 447} {"train_loss": -8.969278335571289, "global_step": 75130, "epoch": 447} {"train_loss": -9.095338821411133, "global_step": 75131, "epoch": 447} {"train_loss": -8.94770336151123, "global_step": 75132, "epoch": 447} {"train_loss": -9.05373764038086, "global_step": 75133, "epoch": 447} {"train_loss": -8.989839553833008, "global_step": 75134, "epoch": 447} {"train_loss": -9.350482940673828, "global_step": 75135, "epoch": 447} {"train_loss": -8.98448371887207, "global_step": 75136, "epoch": 447} {"train_loss": -9.271345138549805, "global_step": 75137, "epoch": 447} {"train_loss": -9.015543937683105, "global_step": 75138, "epoch": 447} {"train_loss": -9.094423294067383, "global_step": 75139, "epoch": 447} {"train_loss": -9.025766372680664, "global_step": 75140, "epoch": 447} {"train_loss": -9.307478904724121, "global_step": 75141, "epoch": 447} {"train_loss": -9.218713760375977, "global_step": 75142, "epoch": 447} {"train_loss": -9.228570938110352, "global_step": 75143, "epoch": 447} {"train_loss": -9.226086616516113, "global_step": 75144, "epoch": 447} {"train_loss": -9.219809532165527, "global_step": 75145, "epoch": 447} {"train_loss": -9.162753105163574, "global_step": 75146, "epoch": 447} {"train_loss": -9.389602661132812, "global_step": 75147, "epoch": 447} {"train_loss": -9.044754028320312, "global_step": 75148, "epoch": 447} {"train_loss": -9.279598236083984, "global_step": 75149, "epoch": 447} {"train_loss": -8.955972671508789, "global_step": 75150, "epoch": 447} {"train_loss": -8.498302459716797, "global_step": 75151, "epoch": 447} {"train_loss": -9.005894660949707, "global_step": 75152, "epoch": 447} {"train_loss": -8.892815589904785, "global_step": 75153, "epoch": 447} {"train_loss": -8.9603910446167, "global_step": 75154, "epoch": 447} {"train_loss": -8.851305961608887, "global_step": 75155, "epoch": 447} {"train_loss": -9.045740127563477, "global_step": 75156, "epoch": 447} {"train_loss": -8.962784767150879, "global_step": 75157, "epoch": 447} {"train_loss": -8.945234298706055, "global_step": 75158, "epoch": 447} {"train_loss": -8.790014266967773, "global_step": 75159, "epoch": 447} {"train_loss": -9.075425148010254, "global_step": 75160, "epoch": 447} {"train_loss": -8.873598098754883, "global_step": 75161, "epoch": 447} {"train_loss": -9.041467666625977, "global_step": 75162, "epoch": 447} {"train_loss": -9.107206344604492, "global_step": 75163, "epoch": 447} {"train_loss": -9.100427627563477, "global_step": 75164, "epoch": 447} {"train_loss": -9.106108665466309, "global_step": 75165, "epoch": 447} {"train_loss": -8.511857986450195, "global_step": 75166, "epoch": 447} {"train_loss": -9.177938461303711, "global_step": 75167, "epoch": 447} {"train_loss": -8.842798233032227, "global_step": 75168, "epoch": 447} {"train_loss": -9.210868835449219, "global_step": 75169, "epoch": 447} {"train_loss": -8.858841896057129, "global_step": 75170, "epoch": 447} {"train_loss": -8.971324920654297, "global_step": 75171, "epoch": 447} {"train_loss": -8.602657318115234, "global_step": 75172, "epoch": 447} {"train_loss": -8.762397766113281, "global_step": 75173, "epoch": 447} {"train_loss": -9.074005126953125, "global_step": 75174, "epoch": 447} {"train_loss": -8.572665214538574, "global_step": 75175, "epoch": 447} {"train_loss": -9.120397567749023, "global_step": 75176, "epoch": 447} {"train_loss": -8.75143814086914, "global_step": 75177, "epoch": 447} {"train_loss": -8.945581436157227, "global_step": 75178, "epoch": 447} {"train_loss": -9.19510269165039, "global_step": 75179, "epoch": 447} {"train_loss": -9.047014236450195, "global_step": 75180, "epoch": 447} {"train_loss": -9.101049423217773, "global_step": 75181, "epoch": 447} {"train_loss": -9.086517333984375, "global_step": 75182, "epoch": 447} {"train_loss": -8.912830352783203, "global_step": 75183, "epoch": 447} {"train_loss": -8.96310806274414, "global_step": 75184, "epoch": 447} {"train_loss": -9.041967391967773, "global_step": 75185, "epoch": 447} {"train_loss": -9.070354461669922, "global_step": 75186, "epoch": 447} {"train_loss": -9.250732421875, "global_step": 75187, "epoch": 447} {"train_loss": -8.905309677124023, "global_step": 75188, "epoch": 447} {"train_loss": -8.784314155578613, "global_step": 75189, "epoch": 447} {"train_loss": -9.121788024902344, "global_step": 75190, "epoch": 447} {"train_loss": -8.903965950012207, "global_step": 75191, "epoch": 447} {"train_loss": -9.370194435119629, "global_step": 75192, "epoch": 447} {"train_loss": -8.58503532409668, "global_step": 75193, "epoch": 447} {"train_loss": -8.98110294342041, "global_step": 75194, "epoch": 447} {"train_loss": -8.967182159423828, "global_step": 75195, "epoch": 447} {"train_loss": -8.848204612731934, "global_step": 75196, "epoch": 447} {"train_loss": -9.029630661010742, "global_step": 75197, "epoch": 447} {"train_loss": -9.320894241333008, "global_step": 75198, "epoch": 447} {"train_loss": -9.121944427490234, "global_step": 75199, "epoch": 447} {"train_loss": -9.151257514953613, "global_step": 75200, "epoch": 447} {"train_loss": -9.054647445678711, "global_step": 75201, "epoch": 447} {"train_loss": -9.192734718322754, "global_step": 75202, "epoch": 447} {"train_loss": -9.081039428710938, "global_step": 75203, "epoch": 447} {"train_loss": -9.317167282104492, "global_step": 75204, "epoch": 447} {"train_loss": -9.111940383911133, "global_step": 75205, "epoch": 447} {"train_loss": -9.239425659179688, "global_step": 75206, "epoch": 447} {"train_loss": -9.161048889160156, "global_step": 75207, "epoch": 447} {"train_loss": -9.028443336486816, "global_step": 75208, "epoch": 447} {"train_loss": -8.930400848388672, "global_step": 75209, "epoch": 447} {"train_loss": -9.033300399780273, "global_step": 75210, "epoch": 447} {"train_loss": -9.300700187683105, "global_step": 75211, "epoch": 447} {"train_loss": -9.054157257080078, "global_step": 75212, "epoch": 447} {"train_loss": -9.308534622192383, "global_step": 75213, "epoch": 447} {"train_loss": -9.268973350524902, "global_step": 75214, "epoch": 447} {"train_loss": -9.157596588134766, "global_step": 75215, "epoch": 447} {"train_loss": -9.159966468811035, "global_step": 75216, "epoch": 447} {"train_loss": -8.932616233825684, "global_step": 75217, "epoch": 447} {"train_loss": -8.95024585723877, "global_step": 75218, "epoch": 447} {"train_loss": -8.983711242675781, "global_step": 75219, "epoch": 447} {"train_loss": -8.99365520477295, "global_step": 75220, "epoch": 447} {"train_loss": -9.022573471069336, "global_step": 75221, "epoch": 447} {"train_loss": -9.001887321472168, "global_step": 75222, "epoch": 447} {"train_loss": -9.14893913269043, "global_step": 75223, "epoch": 447} {"train_loss": -9.068668365478516, "global_step": 75224, "epoch": 447} {"train_loss": -9.280317306518555, "global_step": 75225, "epoch": 447} {"train_loss": -8.932047843933105, "global_step": 75226, "epoch": 447} {"train_loss": -9.166720390319824, "global_step": 75227, "epoch": 447} {"train_loss": -9.028806686401367, "global_step": 75228, "epoch": 447} {"train_loss": -9.226269721984863, "global_step": 75229, "epoch": 447} {"train_loss": -9.00147533416748, "global_step": 75230, "epoch": 447} {"train_loss": -9.225830078125, "global_step": 75231, "epoch": 447} {"train_loss": -9.01127815246582, "global_step": 75232, "epoch": 447} {"train_loss": -9.143648147583008, "global_step": 75233, "epoch": 447} {"train_loss": -9.022852897644043, "global_step": 75234, "epoch": 447} {"train_loss": -9.14314079284668, "global_step": 75235, "epoch": 447} {"train_loss": -9.367488861083984, "global_step": 75236, "epoch": 447} {"train_loss": -9.411117553710938, "global_step": 75237, "epoch": 447} {"train_loss": -9.371635437011719, "global_step": 75238, "epoch": 447} {"train_loss": -9.197291374206543, "global_step": 75239, "epoch": 447} {"train_loss": -9.153512954711914, "global_step": 75240, "epoch": 447} {"train_loss": -9.217757225036621, "global_step": 75241, "epoch": 447} {"train_loss": -9.21525764465332, "global_step": 75242, "epoch": 447} {"train_loss": -9.304737091064453, "global_step": 75243, "epoch": 447} {"train_loss": -9.286197662353516, "global_step": 75244, "epoch": 447} {"train_loss": -9.21078872680664, "global_step": 75245, "epoch": 447} {"train_loss": -9.234724044799805, "global_step": 75246, "epoch": 447} {"train_loss": -9.432565689086914, "global_step": 75247, "epoch": 447} {"train_loss": -9.141178131103516, "global_step": 75248, "epoch": 447} {"train_loss": -9.378829956054688, "global_step": 75249, "epoch": 447} {"train_loss": -9.221250534057617, "global_step": 75250, "epoch": 447} {"train_loss": -9.024812698364258, "global_step": 75251, "epoch": 447} {"train_loss": -8.945874214172363, "global_step": 75252, "epoch": 447} {"train_loss": -8.888940811157227, "global_step": 75253, "epoch": 447} {"train_loss": -8.910482406616211, "global_step": 75254, "epoch": 447} {"train_loss": -8.640044212341309, "global_step": 75255, "epoch": 447} {"train_loss": -8.724385261535645, "global_step": 75256, "epoch": 447} {"train_loss": -8.958714485168457, "global_step": 75257, "epoch": 447} {"train_loss": -8.679868698120117, "global_step": 75258, "epoch": 447} {"train_loss": -8.593084335327148, "global_step": 75259, "epoch": 447} {"train_loss": -7.768914222717285, "global_step": 75260, "epoch": 447} {"train_loss": -8.564352035522461, "global_step": 75261, "epoch": 447} {"train_loss": -8.00271224975586, "global_step": 75262, "epoch": 447} {"train_loss": -9.013445053781782, "global_step": 75263, "epoch": 447, "val_loss": 197573.359375} {"train_loss": -8.012308120727539, "global_step": 75264, "epoch": 448} {"train_loss": -8.149068832397461, "global_step": 75265, "epoch": 448} {"train_loss": -8.355489730834961, "global_step": 75266, "epoch": 448} {"train_loss": -8.61374568939209, "global_step": 75267, "epoch": 448} {"train_loss": -8.219249725341797, "global_step": 75268, "epoch": 448} {"train_loss": -8.49368953704834, "global_step": 75269, "epoch": 448} {"train_loss": -8.577656745910645, "global_step": 75270, "epoch": 448} {"train_loss": -8.616621017456055, "global_step": 75271, "epoch": 448} {"train_loss": -8.676946640014648, "global_step": 75272, "epoch": 448} {"train_loss": -8.312217712402344, "global_step": 75273, "epoch": 448} {"train_loss": -8.601633071899414, "global_step": 75274, "epoch": 448} {"train_loss": -8.594671249389648, "global_step": 75275, "epoch": 448} {"train_loss": -8.716228485107422, "global_step": 75276, "epoch": 448} {"train_loss": -8.572397232055664, "global_step": 75277, "epoch": 448} {"train_loss": -8.871428489685059, "global_step": 75278, "epoch": 448} {"train_loss": -8.7181396484375, "global_step": 75279, "epoch": 448} {"train_loss": -8.461097717285156, "global_step": 75280, "epoch": 448} {"train_loss": -8.806418418884277, "global_step": 75281, "epoch": 448} {"train_loss": -9.042308807373047, "global_step": 75282, "epoch": 448} {"train_loss": -8.56187629699707, "global_step": 75283, "epoch": 448} {"train_loss": -8.901952743530273, "global_step": 75284, "epoch": 448} {"train_loss": -8.912517547607422, "global_step": 75285, "epoch": 448} {"train_loss": -8.98741340637207, "global_step": 75286, "epoch": 448} {"train_loss": -8.915868759155273, "global_step": 75287, "epoch": 448} {"train_loss": -8.834253311157227, "global_step": 75288, "epoch": 448} {"train_loss": -9.10590934753418, "global_step": 75289, "epoch": 448} {"train_loss": -8.958030700683594, "global_step": 75290, "epoch": 448} {"train_loss": -9.054210662841797, "global_step": 75291, "epoch": 448} {"train_loss": -8.960517883300781, "global_step": 75292, "epoch": 448} {"train_loss": -9.023347854614258, "global_step": 75293, "epoch": 448} {"train_loss": -8.954483032226562, "global_step": 75294, "epoch": 448} {"train_loss": -9.183914184570312, "global_step": 75295, "epoch": 448} {"train_loss": -9.131368637084961, "global_step": 75296, "epoch": 448} {"train_loss": -9.177224159240723, "global_step": 75297, "epoch": 448} {"train_loss": -9.0263671875, "global_step": 75298, "epoch": 448} {"train_loss": -9.14783763885498, "global_step": 75299, "epoch": 448} {"train_loss": -9.244463920593262, "global_step": 75300, "epoch": 448} {"train_loss": -9.094953536987305, "global_step": 75301, "epoch": 448} {"train_loss": -9.078033447265625, "global_step": 75302, "epoch": 448} {"train_loss": -9.037504196166992, "global_step": 75303, "epoch": 448} {"train_loss": -9.270150184631348, "global_step": 75304, "epoch": 448} {"train_loss": -9.389280319213867, "global_step": 75305, "epoch": 448} {"train_loss": -9.104588508605957, "global_step": 75306, "epoch": 448} {"train_loss": -9.140504837036133, "global_step": 75307, "epoch": 448} {"train_loss": -8.924583435058594, "global_step": 75308, "epoch": 448} {"train_loss": -9.266332626342773, "global_step": 75309, "epoch": 448} {"train_loss": -9.254003524780273, "global_step": 75310, "epoch": 448} {"train_loss": -8.934995651245117, "global_step": 75311, "epoch": 448} {"train_loss": -9.400529861450195, "global_step": 75312, "epoch": 448} {"train_loss": -9.388720512390137, "global_step": 75313, "epoch": 448} {"train_loss": -9.202522277832031, "global_step": 75314, "epoch": 448} {"train_loss": -9.143741607666016, "global_step": 75315, "epoch": 448} {"train_loss": -9.320497512817383, "global_step": 75316, "epoch": 448} {"train_loss": -9.050872802734375, "global_step": 75317, "epoch": 448} {"train_loss": -9.309707641601562, "global_step": 75318, "epoch": 448} {"train_loss": -9.209308624267578, "global_step": 75319, "epoch": 448} {"train_loss": -9.12863540649414, "global_step": 75320, "epoch": 448} {"train_loss": -8.895797729492188, "global_step": 75321, "epoch": 448} {"train_loss": -9.124956130981445, "global_step": 75322, "epoch": 448} {"train_loss": -9.328546524047852, "global_step": 75323, "epoch": 448} {"train_loss": -8.858932495117188, "global_step": 75324, "epoch": 448} {"train_loss": -9.105801582336426, "global_step": 75325, "epoch": 448} {"train_loss": -9.13827133178711, "global_step": 75326, "epoch": 448} {"train_loss": -9.3157958984375, "global_step": 75327, "epoch": 448} {"train_loss": -8.770318984985352, "global_step": 75328, "epoch": 448} {"train_loss": -8.936270713806152, "global_step": 75329, "epoch": 448} {"train_loss": -9.237703323364258, "global_step": 75330, "epoch": 448} {"train_loss": -9.217073440551758, "global_step": 75331, "epoch": 448} {"train_loss": -9.057889938354492, "global_step": 75332, "epoch": 448} {"train_loss": -9.067205429077148, "global_step": 75333, "epoch": 448} {"train_loss": -9.133655548095703, "global_step": 75334, "epoch": 448} {"train_loss": -8.845985412597656, "global_step": 75335, "epoch": 448} {"train_loss": -9.007728576660156, "global_step": 75336, "epoch": 448} {"train_loss": -9.047394752502441, "global_step": 75337, "epoch": 448} {"train_loss": -9.18783950805664, "global_step": 75338, "epoch": 448} {"train_loss": -8.728219032287598, "global_step": 75339, "epoch": 448} {"train_loss": -9.329849243164062, "global_step": 75340, "epoch": 448} {"train_loss": -9.131424903869629, "global_step": 75341, "epoch": 448} {"train_loss": -8.937700271606445, "global_step": 75342, "epoch": 448} {"train_loss": -8.956510543823242, "global_step": 75343, "epoch": 448} {"train_loss": -9.075621604919434, "global_step": 75344, "epoch": 448} {"train_loss": -9.029333114624023, "global_step": 75345, "epoch": 448} {"train_loss": -8.832204818725586, "global_step": 75346, "epoch": 448} {"train_loss": -9.013713836669922, "global_step": 75347, "epoch": 448} {"train_loss": -9.077219009399414, "global_step": 75348, "epoch": 448} {"train_loss": -8.90518569946289, "global_step": 75349, "epoch": 448} {"train_loss": -9.03952407836914, "global_step": 75350, "epoch": 448} {"train_loss": -8.952548027038574, "global_step": 75351, "epoch": 448} {"train_loss": -9.208057403564453, "global_step": 75352, "epoch": 448} {"train_loss": -8.767003059387207, "global_step": 75353, "epoch": 448} {"train_loss": -9.036060333251953, "global_step": 75354, "epoch": 448} {"train_loss": -9.088258743286133, "global_step": 75355, "epoch": 448} {"train_loss": -9.0810546875, "global_step": 75356, "epoch": 448} {"train_loss": -9.126592636108398, "global_step": 75357, "epoch": 448} {"train_loss": -8.997591018676758, "global_step": 75358, "epoch": 448} {"train_loss": -8.684715270996094, "global_step": 75359, "epoch": 448} {"train_loss": -8.886133193969727, "global_step": 75360, "epoch": 448} {"train_loss": -9.261238098144531, "global_step": 75361, "epoch": 448} {"train_loss": -8.946466445922852, "global_step": 75362, "epoch": 448} {"train_loss": -8.940847396850586, "global_step": 75363, "epoch": 448} {"train_loss": -9.253837585449219, "global_step": 75364, "epoch": 448} {"train_loss": -8.901586532592773, "global_step": 75365, "epoch": 448} {"train_loss": -9.203520774841309, "global_step": 75366, "epoch": 448} {"train_loss": -9.076455116271973, "global_step": 75367, "epoch": 448} {"train_loss": -9.055803298950195, "global_step": 75368, "epoch": 448} {"train_loss": -9.158411026000977, "global_step": 75369, "epoch": 448} {"train_loss": -9.07778263092041, "global_step": 75370, "epoch": 448} {"train_loss": -8.977462768554688, "global_step": 75371, "epoch": 448} {"train_loss": -8.96813678741455, "global_step": 75372, "epoch": 448} {"train_loss": -9.065506935119629, "global_step": 75373, "epoch": 448} {"train_loss": -9.132783889770508, "global_step": 75374, "epoch": 448} {"train_loss": -9.064399719238281, "global_step": 75375, "epoch": 448} {"train_loss": -9.085864067077637, "global_step": 75376, "epoch": 448} {"train_loss": -9.129190444946289, "global_step": 75377, "epoch": 448} {"train_loss": -9.068266868591309, "global_step": 75378, "epoch": 448} {"train_loss": -9.215768814086914, "global_step": 75379, "epoch": 448} {"train_loss": -9.119271278381348, "global_step": 75380, "epoch": 448} {"train_loss": -9.11709213256836, "global_step": 75381, "epoch": 448} {"train_loss": -9.148909568786621, "global_step": 75382, "epoch": 448} {"train_loss": -9.039203643798828, "global_step": 75383, "epoch": 448} {"train_loss": -8.919686317443848, "global_step": 75384, "epoch": 448} {"train_loss": -9.143050193786621, "global_step": 75385, "epoch": 448} {"train_loss": -9.123297691345215, "global_step": 75386, "epoch": 448} {"train_loss": -9.268392562866211, "global_step": 75387, "epoch": 448} {"train_loss": -8.823719024658203, "global_step": 75388, "epoch": 448} {"train_loss": -9.146928787231445, "global_step": 75389, "epoch": 448} {"train_loss": -8.878162384033203, "global_step": 75390, "epoch": 448} {"train_loss": -9.118501663208008, "global_step": 75391, "epoch": 448} {"train_loss": -9.161516189575195, "global_step": 75392, "epoch": 448} {"train_loss": -9.180065155029297, "global_step": 75393, "epoch": 448} {"train_loss": -9.156954765319824, "global_step": 75394, "epoch": 448} {"train_loss": -9.02517318725586, "global_step": 75395, "epoch": 448} {"train_loss": -9.115495681762695, "global_step": 75396, "epoch": 448} {"train_loss": -9.039253234863281, "global_step": 75397, "epoch": 448} {"train_loss": -9.278489112854004, "global_step": 75398, "epoch": 448} {"train_loss": -9.310707092285156, "global_step": 75399, "epoch": 448} {"train_loss": -9.334630966186523, "global_step": 75400, "epoch": 448} {"train_loss": -8.989959716796875, "global_step": 75401, "epoch": 448} {"train_loss": -9.251235961914062, "global_step": 75402, "epoch": 448} {"train_loss": -9.22106647491455, "global_step": 75403, "epoch": 448} {"train_loss": -9.004173278808594, "global_step": 75404, "epoch": 448} {"train_loss": -8.77090072631836, "global_step": 75405, "epoch": 448} {"train_loss": -9.104950904846191, "global_step": 75406, "epoch": 448} {"train_loss": -8.885643005371094, "global_step": 75407, "epoch": 448} {"train_loss": -9.155157089233398, "global_step": 75408, "epoch": 448} {"train_loss": -9.092229843139648, "global_step": 75409, "epoch": 448} {"train_loss": -8.936670303344727, "global_step": 75410, "epoch": 448} {"train_loss": -8.90587043762207, "global_step": 75411, "epoch": 448} {"train_loss": -9.013671875, "global_step": 75412, "epoch": 448} {"train_loss": -9.176412582397461, "global_step": 75413, "epoch": 448} {"train_loss": -8.882164001464844, "global_step": 75414, "epoch": 448} {"train_loss": -9.17654800415039, "global_step": 75415, "epoch": 448} {"train_loss": -9.037059783935547, "global_step": 75416, "epoch": 448} {"train_loss": -9.350297927856445, "global_step": 75417, "epoch": 448} {"train_loss": -9.230744361877441, "global_step": 75418, "epoch": 448} {"train_loss": -9.041557312011719, "global_step": 75419, "epoch": 448} {"train_loss": -9.00423812866211, "global_step": 75420, "epoch": 448} {"train_loss": -8.832016944885254, "global_step": 75421, "epoch": 448} {"train_loss": -9.119264602661133, "global_step": 75422, "epoch": 448} {"train_loss": -9.112212181091309, "global_step": 75423, "epoch": 448} {"train_loss": -8.495553970336914, "global_step": 75424, "epoch": 448} {"train_loss": -9.118328094482422, "global_step": 75425, "epoch": 448} {"train_loss": -9.126633644104004, "global_step": 75426, "epoch": 448} {"train_loss": -8.873916625976562, "global_step": 75427, "epoch": 448} {"train_loss": -8.907999992370605, "global_step": 75428, "epoch": 448} {"train_loss": -8.908717155456543, "global_step": 75429, "epoch": 448} {"train_loss": -8.87193489074707, "global_step": 75430, "epoch": 448} {"train_loss": -9.004027213369097, "global_step": 75431, "epoch": 448, "val_loss": 194514.109375} {"train_loss": -9.302144050598145, "global_step": 75432, "epoch": 449} {"train_loss": -9.002235412597656, "global_step": 75433, "epoch": 449} {"train_loss": -8.667766571044922, "global_step": 75434, "epoch": 449} {"train_loss": -8.831151008605957, "global_step": 75435, "epoch": 449} {"train_loss": -8.955312728881836, "global_step": 75436, "epoch": 449} {"train_loss": -8.907175064086914, "global_step": 75437, "epoch": 449} {"train_loss": -8.768949508666992, "global_step": 75438, "epoch": 449} {"train_loss": -8.92994213104248, "global_step": 75439, "epoch": 449} {"train_loss": -8.825029373168945, "global_step": 75440, "epoch": 449} {"train_loss": -8.809731483459473, "global_step": 75441, "epoch": 449} {"train_loss": -9.061254501342773, "global_step": 75442, "epoch": 449} {"train_loss": -9.100785255432129, "global_step": 75443, "epoch": 449} {"train_loss": -9.088141441345215, "global_step": 75444, "epoch": 449} {"train_loss": -9.149616241455078, "global_step": 75445, "epoch": 449} {"train_loss": -9.256715774536133, "global_step": 75446, "epoch": 449} {"train_loss": -9.068464279174805, "global_step": 75447, "epoch": 449} {"train_loss": -9.176387786865234, "global_step": 75448, "epoch": 449} {"train_loss": -9.167987823486328, "global_step": 75449, "epoch": 449} {"train_loss": -9.207921981811523, "global_step": 75450, "epoch": 449} {"train_loss": -9.066999435424805, "global_step": 75451, "epoch": 449} {"train_loss": -9.147732734680176, "global_step": 75452, "epoch": 449} {"train_loss": -9.23977279663086, "global_step": 75453, "epoch": 449} {"train_loss": -9.079029083251953, "global_step": 75454, "epoch": 449} {"train_loss": -9.168392181396484, "global_step": 75455, "epoch": 449} {"train_loss": -9.27048397064209, "global_step": 75456, "epoch": 449} {"train_loss": -9.279264450073242, "global_step": 75457, "epoch": 449} {"train_loss": -9.344917297363281, "global_step": 75458, "epoch": 449} {"train_loss": -9.119997024536133, "global_step": 75459, "epoch": 449} {"train_loss": -9.034993171691895, "global_step": 75460, "epoch": 449} {"train_loss": -9.332499504089355, "global_step": 75461, "epoch": 449} {"train_loss": -9.000903129577637, "global_step": 75462, "epoch": 449} {"train_loss": -8.9337797164917, "global_step": 75463, "epoch": 449} {"train_loss": -9.445901870727539, "global_step": 75464, "epoch": 449} {"train_loss": -9.105087280273438, "global_step": 75465, "epoch": 449} {"train_loss": -8.969230651855469, "global_step": 75466, "epoch": 449} {"train_loss": -8.912714004516602, "global_step": 75467, "epoch": 449} {"train_loss": -8.93748950958252, "global_step": 75468, "epoch": 449} {"train_loss": -9.214487075805664, "global_step": 75469, "epoch": 449} {"train_loss": -8.878803253173828, "global_step": 75470, "epoch": 449} {"train_loss": -8.639747619628906, "global_step": 75471, "epoch": 449} {"train_loss": -8.985570907592773, "global_step": 75472, "epoch": 449} {"train_loss": -8.39513111114502, "global_step": 75473, "epoch": 449} {"train_loss": -8.683023452758789, "global_step": 75474, "epoch": 449} {"train_loss": -7.9252214431762695, "global_step": 75475, "epoch": 449} {"train_loss": -8.699535369873047, "global_step": 75476, "epoch": 449} {"train_loss": -8.353575706481934, "global_step": 75477, "epoch": 449} {"train_loss": -8.185131072998047, "global_step": 75478, "epoch": 449} {"train_loss": -8.116649627685547, "global_step": 75479, "epoch": 449} {"train_loss": -8.49782943725586, "global_step": 75480, "epoch": 449} {"train_loss": -8.55501937866211, "global_step": 75481, "epoch": 449} {"train_loss": -8.146026611328125, "global_step": 75482, "epoch": 449} {"train_loss": -8.53531265258789, "global_step": 75483, "epoch": 449} {"train_loss": -8.60978889465332, "global_step": 75484, "epoch": 449} {"train_loss": -8.488122940063477, "global_step": 75485, "epoch": 449} {"train_loss": -8.605386734008789, "global_step": 75486, "epoch": 449} {"train_loss": -8.52186393737793, "global_step": 75487, "epoch": 449} {"train_loss": -8.68145751953125, "global_step": 75488, "epoch": 449} {"train_loss": -8.652883529663086, "global_step": 75489, "epoch": 449} {"train_loss": -8.812077522277832, "global_step": 75490, "epoch": 449} {"train_loss": -8.747659683227539, "global_step": 75491, "epoch": 449} {"train_loss": -8.880105972290039, "global_step": 75492, "epoch": 449} {"train_loss": -8.853250503540039, "global_step": 75493, "epoch": 449} {"train_loss": -8.707831382751465, "global_step": 75494, "epoch": 449} {"train_loss": -8.767501831054688, "global_step": 75495, "epoch": 449} {"train_loss": -9.018152236938477, "global_step": 75496, "epoch": 449} {"train_loss": -8.757676124572754, "global_step": 75497, "epoch": 449} {"train_loss": -8.80133056640625, "global_step": 75498, "epoch": 449} {"train_loss": -8.93905258178711, "global_step": 75499, "epoch": 449} {"train_loss": -8.683879852294922, "global_step": 75500, "epoch": 449} {"train_loss": -9.006170272827148, "global_step": 75501, "epoch": 449} {"train_loss": -9.097545623779297, "global_step": 75502, "epoch": 449} {"train_loss": -9.043432235717773, "global_step": 75503, "epoch": 449} {"train_loss": -8.856456756591797, "global_step": 75504, "epoch": 449} {"train_loss": -9.054276466369629, "global_step": 75505, "epoch": 449} {"train_loss": -9.167442321777344, "global_step": 75506, "epoch": 449} {"train_loss": -9.070271492004395, "global_step": 75507, "epoch": 449} {"train_loss": -9.207596778869629, "global_step": 75508, "epoch": 449} {"train_loss": -9.174930572509766, "global_step": 75509, "epoch": 449} {"train_loss": -9.232908248901367, "global_step": 75510, "epoch": 449} {"train_loss": -9.113551139831543, "global_step": 75511, "epoch": 449} {"train_loss": -9.008027076721191, "global_step": 75512, "epoch": 449} {"train_loss": -9.19268798828125, "global_step": 75513, "epoch": 449} {"train_loss": -9.041298866271973, "global_step": 75514, "epoch": 449} {"train_loss": -9.244363784790039, "global_step": 75515, "epoch": 449} {"train_loss": -8.990310668945312, "global_step": 75516, "epoch": 449} {"train_loss": -8.937049865722656, "global_step": 75517, "epoch": 449} {"train_loss": -8.974899291992188, "global_step": 75518, "epoch": 449} {"train_loss": -9.376388549804688, "global_step": 75519, "epoch": 449} {"train_loss": -8.097992897033691, "global_step": 75520, "epoch": 449} {"train_loss": -9.104348182678223, "global_step": 75521, "epoch": 449} {"train_loss": -8.614497184753418, "global_step": 75522, "epoch": 449} {"train_loss": -8.792205810546875, "global_step": 75523, "epoch": 449} {"train_loss": -8.218059539794922, "global_step": 75524, "epoch": 449} {"train_loss": -8.868125915527344, "global_step": 75525, "epoch": 449} {"train_loss": -8.645947456359863, "global_step": 75526, "epoch": 449} {"train_loss": -8.918169021606445, "global_step": 75527, "epoch": 449} {"train_loss": -8.578861236572266, "global_step": 75528, "epoch": 449} {"train_loss": -9.064844131469727, "global_step": 75529, "epoch": 449} {"train_loss": -9.002941131591797, "global_step": 75530, "epoch": 449} {"train_loss": -8.958003997802734, "global_step": 75531, "epoch": 449} {"train_loss": -8.841146469116211, "global_step": 75532, "epoch": 449} {"train_loss": -8.91904067993164, "global_step": 75533, "epoch": 449} {"train_loss": -8.895965576171875, "global_step": 75534, "epoch": 449} {"train_loss": -9.082754135131836, "global_step": 75535, "epoch": 449} {"train_loss": -9.270153045654297, "global_step": 75536, "epoch": 449} {"train_loss": -9.067283630371094, "global_step": 75537, "epoch": 449} {"train_loss": -8.910984992980957, "global_step": 75538, "epoch": 449} {"train_loss": -9.28390121459961, "global_step": 75539, "epoch": 449} {"train_loss": -9.255901336669922, "global_step": 75540, "epoch": 449} {"train_loss": -9.039995193481445, "global_step": 75541, "epoch": 449} {"train_loss": -9.241500854492188, "global_step": 75542, "epoch": 449} {"train_loss": -9.092157363891602, "global_step": 75543, "epoch": 449} {"train_loss": -8.998385429382324, "global_step": 75544, "epoch": 449} {"train_loss": -9.009065628051758, "global_step": 75545, "epoch": 449} {"train_loss": -9.172857284545898, "global_step": 75546, "epoch": 449} {"train_loss": -8.897714614868164, "global_step": 75547, "epoch": 449} {"train_loss": -9.195414543151855, "global_step": 75548, "epoch": 449} {"train_loss": -9.330198287963867, "global_step": 75549, "epoch": 449} {"train_loss": -9.312736511230469, "global_step": 75550, "epoch": 449} {"train_loss": -9.049371719360352, "global_step": 75551, "epoch": 449} {"train_loss": -9.281781196594238, "global_step": 75552, "epoch": 449} {"train_loss": -9.086404800415039, "global_step": 75553, "epoch": 449} {"train_loss": -9.088153839111328, "global_step": 75554, "epoch": 449} {"train_loss": -9.154279708862305, "global_step": 75555, "epoch": 449} {"train_loss": -9.112777709960938, "global_step": 75556, "epoch": 449} {"train_loss": -9.06698226928711, "global_step": 75557, "epoch": 449} {"train_loss": -8.884987831115723, "global_step": 75558, "epoch": 449} {"train_loss": -8.966083526611328, "global_step": 75559, "epoch": 449} {"train_loss": -8.762535095214844, "global_step": 75560, "epoch": 449} {"train_loss": -9.233461380004883, "global_step": 75561, "epoch": 449} {"train_loss": -9.154142379760742, "global_step": 75562, "epoch": 449} {"train_loss": -8.98300838470459, "global_step": 75563, "epoch": 449} {"train_loss": -8.987992286682129, "global_step": 75564, "epoch": 449} {"train_loss": -9.138158798217773, "global_step": 75565, "epoch": 449} {"train_loss": -9.101791381835938, "global_step": 75566, "epoch": 449} {"train_loss": -9.210970878601074, "global_step": 75567, "epoch": 449} {"train_loss": -9.432526588439941, "global_step": 75568, "epoch": 449} {"train_loss": -9.185247421264648, "global_step": 75569, "epoch": 449} {"train_loss": -9.177846908569336, "global_step": 75570, "epoch": 449} {"train_loss": -9.10513973236084, "global_step": 75571, "epoch": 449} {"train_loss": -9.224095344543457, "global_step": 75572, "epoch": 449} {"train_loss": -9.078673362731934, "global_step": 75573, "epoch": 449} {"train_loss": -9.004315376281738, "global_step": 75574, "epoch": 449} {"train_loss": -9.099032402038574, "global_step": 75575, "epoch": 449} {"train_loss": -9.069843292236328, "global_step": 75576, "epoch": 449} {"train_loss": -9.020949363708496, "global_step": 75577, "epoch": 449} {"train_loss": -9.00563907623291, "global_step": 75578, "epoch": 449} {"train_loss": -9.224784851074219, "global_step": 75579, "epoch": 449} {"train_loss": -9.092039108276367, "global_step": 75580, "epoch": 449} {"train_loss": -9.346253395080566, "global_step": 75581, "epoch": 449} {"train_loss": -8.9419527053833, "global_step": 75582, "epoch": 449} {"train_loss": -9.153999328613281, "global_step": 75583, "epoch": 449} {"train_loss": -9.120594024658203, "global_step": 75584, "epoch": 449} {"train_loss": -9.130087852478027, "global_step": 75585, "epoch": 449} {"train_loss": -9.184253692626953, "global_step": 75586, "epoch": 449} {"train_loss": -9.026390075683594, "global_step": 75587, "epoch": 449} {"train_loss": -8.972949981689453, "global_step": 75588, "epoch": 449} {"train_loss": -8.990891456604004, "global_step": 75589, "epoch": 449} {"train_loss": -9.130661964416504, "global_step": 75590, "epoch": 449} {"train_loss": -9.394933700561523, "global_step": 75591, "epoch": 449} {"train_loss": -8.947284698486328, "global_step": 75592, "epoch": 449} {"train_loss": -9.021007537841797, "global_step": 75593, "epoch": 449} {"train_loss": -9.038322448730469, "global_step": 75594, "epoch": 449} {"train_loss": -8.899673461914062, "global_step": 75595, "epoch": 449} {"train_loss": -9.203829765319824, "global_step": 75596, "epoch": 449} {"train_loss": -8.922710418701172, "global_step": 75597, "epoch": 449} {"train_loss": -9.099599838256836, "global_step": 75598, "epoch": 449} {"train_loss": -8.975097077233452, "global_step": 75599, "epoch": 449, "val_loss": 197376.109375} {"train_loss": -9.228780746459961, "global_step": 75600, "epoch": 450} {"train_loss": -8.898723602294922, "global_step": 75601, "epoch": 450} {"train_loss": -9.156343460083008, "global_step": 75602, "epoch": 450} {"train_loss": -9.248517036437988, "global_step": 75603, "epoch": 450} {"train_loss": -8.942951202392578, "global_step": 75604, "epoch": 450} {"train_loss": -8.892666816711426, "global_step": 75605, "epoch": 450} {"train_loss": -8.9695405960083, "global_step": 75606, "epoch": 450} {"train_loss": -9.24574089050293, "global_step": 75607, "epoch": 450} {"train_loss": -9.335935592651367, "global_step": 75608, "epoch": 450} {"train_loss": -9.241682052612305, "global_step": 75609, "epoch": 450} {"train_loss": -8.885135650634766, "global_step": 75610, "epoch": 450} {"train_loss": -9.355405807495117, "global_step": 75611, "epoch": 450} {"train_loss": -9.006250381469727, "global_step": 75612, "epoch": 450} {"train_loss": -8.83329963684082, "global_step": 75613, "epoch": 450} {"train_loss": -9.010335922241211, "global_step": 75614, "epoch": 450} {"train_loss": -9.014978408813477, "global_step": 75615, "epoch": 450} {"train_loss": -8.942388534545898, "global_step": 75616, "epoch": 450} {"train_loss": -8.993675231933594, "global_step": 75617, "epoch": 450} {"train_loss": -8.958806991577148, "global_step": 75618, "epoch": 450} {"train_loss": -9.225198745727539, "global_step": 75619, "epoch": 450} {"train_loss": -8.965846061706543, "global_step": 75620, "epoch": 450} {"train_loss": -9.043706893920898, "global_step": 75621, "epoch": 450} {"train_loss": -8.896052360534668, "global_step": 75622, "epoch": 450} {"train_loss": -8.543136596679688, "global_step": 75623, "epoch": 450} {"train_loss": -9.08047103881836, "global_step": 75624, "epoch": 450} {"train_loss": -8.752080917358398, "global_step": 75625, "epoch": 450} {"train_loss": -8.903711318969727, "global_step": 75626, "epoch": 450} {"train_loss": -8.978419303894043, "global_step": 75627, "epoch": 450} {"train_loss": -9.036846160888672, "global_step": 75628, "epoch": 450} {"train_loss": -8.859624862670898, "global_step": 75629, "epoch": 450} {"train_loss": -9.168716430664062, "global_step": 75630, "epoch": 450} {"train_loss": -9.25885009765625, "global_step": 75631, "epoch": 450} {"train_loss": -9.008475303649902, "global_step": 75632, "epoch": 450} {"train_loss": -9.355116844177246, "global_step": 75633, "epoch": 450} {"train_loss": -9.209938049316406, "global_step": 75634, "epoch": 450} {"train_loss": -9.016617774963379, "global_step": 75635, "epoch": 450} {"train_loss": -9.088445663452148, "global_step": 75636, "epoch": 450} {"train_loss": -9.222892761230469, "global_step": 75637, "epoch": 450} {"train_loss": -9.031841278076172, "global_step": 75638, "epoch": 450} {"train_loss": -8.99597454071045, "global_step": 75639, "epoch": 450} {"train_loss": -9.088682174682617, "global_step": 75640, "epoch": 450} {"train_loss": -8.851865768432617, "global_step": 75641, "epoch": 450} {"train_loss": -9.251334190368652, "global_step": 75642, "epoch": 450} {"train_loss": -8.808465957641602, "global_step": 75643, "epoch": 450} {"train_loss": -8.945344924926758, "global_step": 75644, "epoch": 450} {"train_loss": -9.084155082702637, "global_step": 75645, "epoch": 450} {"train_loss": -8.913663864135742, "global_step": 75646, "epoch": 450} {"train_loss": -9.242274284362793, "global_step": 75647, "epoch": 450} {"train_loss": -8.838634490966797, "global_step": 75648, "epoch": 450} {"train_loss": -8.929771423339844, "global_step": 75649, "epoch": 450} {"train_loss": -8.992535591125488, "global_step": 75650, "epoch": 450} {"train_loss": -8.729853630065918, "global_step": 75651, "epoch": 450} {"train_loss": -9.01508903503418, "global_step": 75652, "epoch": 450} {"train_loss": -8.89118766784668, "global_step": 75653, "epoch": 450} {"train_loss": -9.057948112487793, "global_step": 75654, "epoch": 450} {"train_loss": -8.873319625854492, "global_step": 75655, "epoch": 450} {"train_loss": -8.991843223571777, "global_step": 75656, "epoch": 450} {"train_loss": -8.594649314880371, "global_step": 75657, "epoch": 450} {"train_loss": -9.12131118774414, "global_step": 75658, "epoch": 450} {"train_loss": -8.927502632141113, "global_step": 75659, "epoch": 450} {"train_loss": -9.054264068603516, "global_step": 75660, "epoch": 450} {"train_loss": -8.968559265136719, "global_step": 75661, "epoch": 450} {"train_loss": -9.030455589294434, "global_step": 75662, "epoch": 450} {"train_loss": -8.975530624389648, "global_step": 75663, "epoch": 450} {"train_loss": -9.028684616088867, "global_step": 75664, "epoch": 450} {"train_loss": -8.971436500549316, "global_step": 75665, "epoch": 450} {"train_loss": -9.046224594116211, "global_step": 75666, "epoch": 450} {"train_loss": -8.803630828857422, "global_step": 75667, "epoch": 450} {"train_loss": -9.032060623168945, "global_step": 75668, "epoch": 450} {"train_loss": -8.915637016296387, "global_step": 75669, "epoch": 450} {"train_loss": -9.02741527557373, "global_step": 75670, "epoch": 450} {"train_loss": -8.800504684448242, "global_step": 75671, "epoch": 450} {"train_loss": -8.961649894714355, "global_step": 75672, "epoch": 450} {"train_loss": -8.975403785705566, "global_step": 75673, "epoch": 450} {"train_loss": -8.899106979370117, "global_step": 75674, "epoch": 450} {"train_loss": -8.831439018249512, "global_step": 75675, "epoch": 450} {"train_loss": -9.122119903564453, "global_step": 75676, "epoch": 450} {"train_loss": -8.724085807800293, "global_step": 75677, "epoch": 450} {"train_loss": -8.970911979675293, "global_step": 75678, "epoch": 450} {"train_loss": -9.01192569732666, "global_step": 75679, "epoch": 450} {"train_loss": -8.746465682983398, "global_step": 75680, "epoch": 450} {"train_loss": -8.888185501098633, "global_step": 75681, "epoch": 450} {"train_loss": -9.161706924438477, "global_step": 75682, "epoch": 450} {"train_loss": -9.123685836791992, "global_step": 75683, "epoch": 450} {"train_loss": -9.150481224060059, "global_step": 75684, "epoch": 450} {"train_loss": -9.108959197998047, "global_step": 75685, "epoch": 450} {"train_loss": -9.239388465881348, "global_step": 75686, "epoch": 450} {"train_loss": -9.02431869506836, "global_step": 75687, "epoch": 450} {"train_loss": -9.197563171386719, "global_step": 75688, "epoch": 450} {"train_loss": -9.153553009033203, "global_step": 75689, "epoch": 450} {"train_loss": -9.288854598999023, "global_step": 75690, "epoch": 450} {"train_loss": -9.065349578857422, "global_step": 75691, "epoch": 450} {"train_loss": -9.05096435546875, "global_step": 75692, "epoch": 450} {"train_loss": -9.279170989990234, "global_step": 75693, "epoch": 450} {"train_loss": -9.105426788330078, "global_step": 75694, "epoch": 450} {"train_loss": -9.173101425170898, "global_step": 75695, "epoch": 450} {"train_loss": -9.298456192016602, "global_step": 75696, "epoch": 450} {"train_loss": -9.255569458007812, "global_step": 75697, "epoch": 450} {"train_loss": -9.341961860656738, "global_step": 75698, "epoch": 450} {"train_loss": -9.318839073181152, "global_step": 75699, "epoch": 450} {"train_loss": -9.264664649963379, "global_step": 75700, "epoch": 450} {"train_loss": -9.22828483581543, "global_step": 75701, "epoch": 450} {"train_loss": -9.044509887695312, "global_step": 75702, "epoch": 450} {"train_loss": -9.314013481140137, "global_step": 75703, "epoch": 450} {"train_loss": -9.138673782348633, "global_step": 75704, "epoch": 450} {"train_loss": -9.536659240722656, "global_step": 75705, "epoch": 450} {"train_loss": -9.312786102294922, "global_step": 75706, "epoch": 450} {"train_loss": -9.129375457763672, "global_step": 75707, "epoch": 450} {"train_loss": -8.770380973815918, "global_step": 75708, "epoch": 450} {"train_loss": -9.522345542907715, "global_step": 75709, "epoch": 450} {"train_loss": -9.209858894348145, "global_step": 75710, "epoch": 450} {"train_loss": -8.878036499023438, "global_step": 75711, "epoch": 450} {"train_loss": -9.093286514282227, "global_step": 75712, "epoch": 450} {"train_loss": -8.971786499023438, "global_step": 75713, "epoch": 450} {"train_loss": -9.147531509399414, "global_step": 75714, "epoch": 450} {"train_loss": -8.71908187866211, "global_step": 75715, "epoch": 450} {"train_loss": -8.998767852783203, "global_step": 75716, "epoch": 450} {"train_loss": -8.801880836486816, "global_step": 75717, "epoch": 450} {"train_loss": -8.929231643676758, "global_step": 75718, "epoch": 450} {"train_loss": -9.102481842041016, "global_step": 75719, "epoch": 450} {"train_loss": -8.614900588989258, "global_step": 75720, "epoch": 450} {"train_loss": -8.568235397338867, "global_step": 75721, "epoch": 450} {"train_loss": -8.513684272766113, "global_step": 75722, "epoch": 450} {"train_loss": -8.701042175292969, "global_step": 75723, "epoch": 450} {"train_loss": -8.504114151000977, "global_step": 75724, "epoch": 450} {"train_loss": -8.877639770507812, "global_step": 75725, "epoch": 450} {"train_loss": -8.896308898925781, "global_step": 75726, "epoch": 450} {"train_loss": -8.998944282531738, "global_step": 75727, "epoch": 450} {"train_loss": -8.740633964538574, "global_step": 75728, "epoch": 450} {"train_loss": -8.696967124938965, "global_step": 75729, "epoch": 450} {"train_loss": -9.001699447631836, "global_step": 75730, "epoch": 450} {"train_loss": -9.070034980773926, "global_step": 75731, "epoch": 450} {"train_loss": -8.972831726074219, "global_step": 75732, "epoch": 450} {"train_loss": -8.989402770996094, "global_step": 75733, "epoch": 450} {"train_loss": -8.878910064697266, "global_step": 75734, "epoch": 450} {"train_loss": -9.168268203735352, "global_step": 75735, "epoch": 450} {"train_loss": -8.998138427734375, "global_step": 75736, "epoch": 450} {"train_loss": -8.945860862731934, "global_step": 75737, "epoch": 450} {"train_loss": -9.186153411865234, "global_step": 75738, "epoch": 450} {"train_loss": -9.012592315673828, "global_step": 75739, "epoch": 450} {"train_loss": -8.954647064208984, "global_step": 75740, "epoch": 450} {"train_loss": -9.075828552246094, "global_step": 75741, "epoch": 450} {"train_loss": -9.063695907592773, "global_step": 75742, "epoch": 450} {"train_loss": -9.01679801940918, "global_step": 75743, "epoch": 450} {"train_loss": -9.23674488067627, "global_step": 75744, "epoch": 450} {"train_loss": -9.122108459472656, "global_step": 75745, "epoch": 450} {"train_loss": -9.399267196655273, "global_step": 75746, "epoch": 450} {"train_loss": -9.162266731262207, "global_step": 75747, "epoch": 450} {"train_loss": -9.279401779174805, "global_step": 75748, "epoch": 450} {"train_loss": -9.106422424316406, "global_step": 75749, "epoch": 450} {"train_loss": -8.95482063293457, "global_step": 75750, "epoch": 450} {"train_loss": -9.262300491333008, "global_step": 75751, "epoch": 450} {"train_loss": -9.154804229736328, "global_step": 75752, "epoch": 450} {"train_loss": -9.229042053222656, "global_step": 75753, "epoch": 450} {"train_loss": -9.066227912902832, "global_step": 75754, "epoch": 450} {"train_loss": -9.221973419189453, "global_step": 75755, "epoch": 450} {"train_loss": -8.940864562988281, "global_step": 75756, "epoch": 450} {"train_loss": -9.211296081542969, "global_step": 75757, "epoch": 450} {"train_loss": -8.97953987121582, "global_step": 75758, "epoch": 450} {"train_loss": -8.61368179321289, "global_step": 75759, "epoch": 450} {"train_loss": -9.183122634887695, "global_step": 75760, "epoch": 450} {"train_loss": -8.854934692382812, "global_step": 75761, "epoch": 450} {"train_loss": -9.235984802246094, "global_step": 75762, "epoch": 450} {"train_loss": -9.047110557556152, "global_step": 75763, "epoch": 450} {"train_loss": -8.902274131774902, "global_step": 75764, "epoch": 450} {"train_loss": -9.184501647949219, "global_step": 75765, "epoch": 450} {"train_loss": -9.000219345092773, "global_step": 75766, "epoch": 450} {"train_loss": -9.029490317617144, "global_step": 75767, "epoch": 450, "train/sim_max_reward_0": 0.5488945056854049, "train/sim_max_reward_1": 0.9637439751975785, "train/sim_max_reward_2": 0.021773119890179982, "train/sim_max_reward_3": 0.6337328155892149, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.3497256690532148, "test/sim_max_reward_4400002": 0.06723914066680814, "test/sim_max_reward_4400003": 0.3291565228981545, "test/sim_max_reward_4400004": 0.40808085159416124, "test/sim_max_reward_4400005": 0.9967617336966744, "test/sim_max_reward_4400006": 0.4706565168640927, "test/sim_max_reward_4400007": 0.9444638007219748, "test/sim_max_reward_4400008": 0.6032513981757605, "test/sim_max_reward_4400009": 0.39597281377879695, "test/sim_max_reward_4400010": 0.9244331344114789, "test/sim_max_reward_4400011": 0.9298737772980479, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.680342675061926, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.5056670459765699, "test/sim_max_reward_4400018": 0.9880027742932733, "test/sim_max_reward_4400019": 0.48647535954951254, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.9983513007208973, "test/sim_max_reward_4400022": 0.9776909057750719, "test/sim_max_reward_4400023": 0.9930494267512653, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.6384317939500148, "test/sim_max_reward_4400026": 1.0, "test/sim_max_reward_4400027": 1.0, "test/sim_max_reward_4400028": 0.7120402746475888, "test/sim_max_reward_4400029": 1.0, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.08928423381974744, "test/sim_max_reward_4400033": 0.1604522004489964, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.5327560360593689, "test/sim_max_reward_4400036": 0.36791377505701783, "test/sim_max_reward_4400037": 0.9716847875576221, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6256343497275242, "test/sim_max_reward_4400042": 1.0, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.8924722109640539, "test/sim_max_reward_4400045": 0.41441403942234467, "test/sim_max_reward_4400046": 0.9113847576385149, "test/sim_max_reward_4400047": 0.982434625193477, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6946907360603963, "test/mean_score": 0.6751970519125601, "val_loss": 196803.3125, "train_action_mse_error": 5.207672595977783} {"train_loss": -9.4450044631958, "global_step": 75768, "epoch": 451} {"train_loss": -9.321077346801758, "global_step": 75769, "epoch": 451} {"train_loss": -9.030584335327148, "global_step": 75770, "epoch": 451} {"train_loss": -8.987732887268066, "global_step": 75771, "epoch": 451} {"train_loss": -9.105217933654785, "global_step": 75772, "epoch": 451} {"train_loss": -9.3192138671875, "global_step": 75773, "epoch": 451} {"train_loss": -9.121960639953613, "global_step": 75774, "epoch": 451} {"train_loss": -9.208771705627441, "global_step": 75775, "epoch": 451} {"train_loss": -9.13064193725586, "global_step": 75776, "epoch": 451} {"train_loss": -9.288591384887695, "global_step": 75777, "epoch": 451} {"train_loss": -9.242223739624023, "global_step": 75778, "epoch": 451} {"train_loss": -9.294255256652832, "global_step": 75779, "epoch": 451} {"train_loss": -9.287775039672852, "global_step": 75780, "epoch": 451} {"train_loss": -9.032363891601562, "global_step": 75781, "epoch": 451} {"train_loss": -9.276054382324219, "global_step": 75782, "epoch": 451} {"train_loss": -9.129898071289062, "global_step": 75783, "epoch": 451} {"train_loss": -9.274412155151367, "global_step": 75784, "epoch": 451} {"train_loss": -9.364158630371094, "global_step": 75785, "epoch": 451} {"train_loss": -9.240164756774902, "global_step": 75786, "epoch": 451} {"train_loss": -8.926559448242188, "global_step": 75787, "epoch": 451} {"train_loss": -9.272765159606934, "global_step": 75788, "epoch": 451} {"train_loss": -9.30335521697998, "global_step": 75789, "epoch": 451} {"train_loss": -9.232259750366211, "global_step": 75790, "epoch": 451} {"train_loss": -9.30081558227539, "global_step": 75791, "epoch": 451} {"train_loss": -9.269312858581543, "global_step": 75792, "epoch": 451} {"train_loss": -9.05015754699707, "global_step": 75793, "epoch": 451} {"train_loss": -9.326457977294922, "global_step": 75794, "epoch": 451} {"train_loss": -9.11470890045166, "global_step": 75795, "epoch": 451} {"train_loss": -9.049867630004883, "global_step": 75796, "epoch": 451} {"train_loss": -9.078063011169434, "global_step": 75797, "epoch": 451} {"train_loss": -9.329615592956543, "global_step": 75798, "epoch": 451} {"train_loss": -9.0472412109375, "global_step": 75799, "epoch": 451} {"train_loss": -9.246172904968262, "global_step": 75800, "epoch": 451} {"train_loss": -8.962980270385742, "global_step": 75801, "epoch": 451} {"train_loss": -8.956991195678711, "global_step": 75802, "epoch": 451} {"train_loss": -8.92191219329834, "global_step": 75803, "epoch": 451} {"train_loss": -9.031831741333008, "global_step": 75804, "epoch": 451} {"train_loss": -8.81473445892334, "global_step": 75805, "epoch": 451} {"train_loss": -8.9694242477417, "global_step": 75806, "epoch": 451} {"train_loss": -8.961943626403809, "global_step": 75807, "epoch": 451} {"train_loss": -9.003935813903809, "global_step": 75808, "epoch": 451} {"train_loss": -9.053033828735352, "global_step": 75809, "epoch": 451} {"train_loss": -8.941537857055664, "global_step": 75810, "epoch": 451} {"train_loss": -9.03685188293457, "global_step": 75811, "epoch": 451} {"train_loss": -8.946611404418945, "global_step": 75812, "epoch": 451} {"train_loss": -9.069540023803711, "global_step": 75813, "epoch": 451} {"train_loss": -9.09695816040039, "global_step": 75814, "epoch": 451} {"train_loss": -8.788700103759766, "global_step": 75815, "epoch": 451} {"train_loss": -8.89990234375, "global_step": 75816, "epoch": 451} {"train_loss": -9.300427436828613, "global_step": 75817, "epoch": 451} {"train_loss": -8.851840019226074, "global_step": 75818, "epoch": 451} {"train_loss": -9.011192321777344, "global_step": 75819, "epoch": 451} {"train_loss": -8.978116035461426, "global_step": 75820, "epoch": 451} {"train_loss": -8.744115829467773, "global_step": 75821, "epoch": 451} {"train_loss": -9.291335105895996, "global_step": 75822, "epoch": 451} {"train_loss": -8.878717422485352, "global_step": 75823, "epoch": 451} {"train_loss": -8.810224533081055, "global_step": 75824, "epoch": 451} {"train_loss": -9.071980476379395, "global_step": 75825, "epoch": 451} {"train_loss": -9.239606857299805, "global_step": 75826, "epoch": 451} {"train_loss": -8.693772315979004, "global_step": 75827, "epoch": 451} {"train_loss": -9.32472038269043, "global_step": 75828, "epoch": 451} {"train_loss": -8.919513702392578, "global_step": 75829, "epoch": 451} {"train_loss": -9.064992904663086, "global_step": 75830, "epoch": 451} {"train_loss": -8.825568199157715, "global_step": 75831, "epoch": 451} {"train_loss": -8.930381774902344, "global_step": 75832, "epoch": 451} {"train_loss": -9.00381851196289, "global_step": 75833, "epoch": 451} {"train_loss": -9.151620864868164, "global_step": 75834, "epoch": 451} {"train_loss": -8.84842300415039, "global_step": 75835, "epoch": 451} {"train_loss": -9.02301025390625, "global_step": 75836, "epoch": 451} {"train_loss": -9.068626403808594, "global_step": 75837, "epoch": 451} {"train_loss": -9.041271209716797, "global_step": 75838, "epoch": 451} {"train_loss": -9.288162231445312, "global_step": 75839, "epoch": 451} {"train_loss": -9.099472045898438, "global_step": 75840, "epoch": 451} {"train_loss": -9.368905067443848, "global_step": 75841, "epoch": 451} {"train_loss": -9.183198928833008, "global_step": 75842, "epoch": 451} {"train_loss": -8.998767852783203, "global_step": 75843, "epoch": 451} {"train_loss": -9.073784828186035, "global_step": 75844, "epoch": 451} {"train_loss": -9.357562065124512, "global_step": 75845, "epoch": 451} {"train_loss": -8.897411346435547, "global_step": 75846, "epoch": 451} {"train_loss": -9.242820739746094, "global_step": 75847, "epoch": 451} {"train_loss": -9.020843505859375, "global_step": 75848, "epoch": 451} {"train_loss": -9.056388854980469, "global_step": 75849, "epoch": 451} {"train_loss": -9.327722549438477, "global_step": 75850, "epoch": 451} {"train_loss": -9.063770294189453, "global_step": 75851, "epoch": 451} {"train_loss": -9.485804557800293, "global_step": 75852, "epoch": 451} {"train_loss": -9.126428604125977, "global_step": 75853, "epoch": 451} {"train_loss": -9.141670227050781, "global_step": 75854, "epoch": 451} {"train_loss": -9.249128341674805, "global_step": 75855, "epoch": 451} {"train_loss": -8.95958137512207, "global_step": 75856, "epoch": 451} {"train_loss": -9.025751113891602, "global_step": 75857, "epoch": 451} {"train_loss": -8.942331314086914, "global_step": 75858, "epoch": 451} {"train_loss": -9.251364707946777, "global_step": 75859, "epoch": 451} {"train_loss": -9.127969741821289, "global_step": 75860, "epoch": 451} {"train_loss": -9.248331069946289, "global_step": 75861, "epoch": 451} {"train_loss": -9.0316162109375, "global_step": 75862, "epoch": 451} {"train_loss": -9.369874954223633, "global_step": 75863, "epoch": 451} {"train_loss": -9.141866683959961, "global_step": 75864, "epoch": 451} {"train_loss": -9.373688697814941, "global_step": 75865, "epoch": 451} {"train_loss": -8.83769416809082, "global_step": 75866, "epoch": 451} {"train_loss": -9.25676441192627, "global_step": 75867, "epoch": 451} {"train_loss": -8.966367721557617, "global_step": 75868, "epoch": 451} {"train_loss": -8.771353721618652, "global_step": 75869, "epoch": 451} {"train_loss": -9.31173324584961, "global_step": 75870, "epoch": 451} {"train_loss": -9.219480514526367, "global_step": 75871, "epoch": 451} {"train_loss": -8.91141414642334, "global_step": 75872, "epoch": 451} {"train_loss": -8.921001434326172, "global_step": 75873, "epoch": 451} {"train_loss": -8.890891075134277, "global_step": 75874, "epoch": 451} {"train_loss": -8.725597381591797, "global_step": 75875, "epoch": 451} {"train_loss": -9.148420333862305, "global_step": 75876, "epoch": 451} {"train_loss": -9.064239501953125, "global_step": 75877, "epoch": 451} {"train_loss": -9.044745445251465, "global_step": 75878, "epoch": 451} {"train_loss": -9.174942970275879, "global_step": 75879, "epoch": 451} {"train_loss": -9.012788772583008, "global_step": 75880, "epoch": 451} {"train_loss": -9.181486129760742, "global_step": 75881, "epoch": 451} {"train_loss": -9.10344123840332, "global_step": 75882, "epoch": 451} {"train_loss": -9.041219711303711, "global_step": 75883, "epoch": 451} {"train_loss": -9.176260948181152, "global_step": 75884, "epoch": 451} {"train_loss": -9.23148250579834, "global_step": 75885, "epoch": 451} {"train_loss": -8.858156204223633, "global_step": 75886, "epoch": 451} {"train_loss": -9.23179817199707, "global_step": 75887, "epoch": 451} {"train_loss": -9.144371032714844, "global_step": 75888, "epoch": 451} {"train_loss": -9.00716781616211, "global_step": 75889, "epoch": 451} {"train_loss": -9.040818214416504, "global_step": 75890, "epoch": 451} {"train_loss": -9.116226196289062, "global_step": 75891, "epoch": 451} {"train_loss": -8.923154830932617, "global_step": 75892, "epoch": 451} {"train_loss": -8.88834285736084, "global_step": 75893, "epoch": 451} {"train_loss": -8.960244178771973, "global_step": 75894, "epoch": 451} {"train_loss": -9.017324447631836, "global_step": 75895, "epoch": 451} {"train_loss": -8.942924499511719, "global_step": 75896, "epoch": 451} {"train_loss": -8.884064674377441, "global_step": 75897, "epoch": 451} {"train_loss": -8.978675842285156, "global_step": 75898, "epoch": 451} {"train_loss": -8.9655122756958, "global_step": 75899, "epoch": 451} {"train_loss": -9.337093353271484, "global_step": 75900, "epoch": 451} {"train_loss": -9.085433959960938, "global_step": 75901, "epoch": 451} {"train_loss": -8.906229019165039, "global_step": 75902, "epoch": 451} {"train_loss": -9.185450553894043, "global_step": 75903, "epoch": 451} {"train_loss": -9.267200469970703, "global_step": 75904, "epoch": 451} {"train_loss": -9.171457290649414, "global_step": 75905, "epoch": 451} {"train_loss": -9.106987953186035, "global_step": 75906, "epoch": 451} {"train_loss": -8.965272903442383, "global_step": 75907, "epoch": 451} {"train_loss": -8.99397087097168, "global_step": 75908, "epoch": 451} {"train_loss": -9.006414413452148, "global_step": 75909, "epoch": 451} {"train_loss": -9.15218448638916, "global_step": 75910, "epoch": 451} {"train_loss": -9.19375991821289, "global_step": 75911, "epoch": 451} {"train_loss": -8.938157081604004, "global_step": 75912, "epoch": 451} {"train_loss": -9.21688175201416, "global_step": 75913, "epoch": 451} {"train_loss": -9.119887351989746, "global_step": 75914, "epoch": 451} {"train_loss": -8.996068000793457, "global_step": 75915, "epoch": 451} {"train_loss": -9.04214859008789, "global_step": 75916, "epoch": 451} {"train_loss": -8.876062393188477, "global_step": 75917, "epoch": 451} {"train_loss": -9.06679630279541, "global_step": 75918, "epoch": 451} {"train_loss": -9.084943771362305, "global_step": 75919, "epoch": 451} {"train_loss": -9.088290214538574, "global_step": 75920, "epoch": 451} {"train_loss": -9.166406631469727, "global_step": 75921, "epoch": 451} {"train_loss": -9.17038345336914, "global_step": 75922, "epoch": 451} {"train_loss": -8.955867767333984, "global_step": 75923, "epoch": 451} {"train_loss": -9.1111478805542, "global_step": 75924, "epoch": 451} {"train_loss": -8.970043182373047, "global_step": 75925, "epoch": 451} {"train_loss": -9.372175216674805, "global_step": 75926, "epoch": 451} {"train_loss": -9.00624942779541, "global_step": 75927, "epoch": 451} {"train_loss": -8.960515975952148, "global_step": 75928, "epoch": 451} {"train_loss": -9.18093204498291, "global_step": 75929, "epoch": 451} {"train_loss": -9.189519882202148, "global_step": 75930, "epoch": 451} {"train_loss": -9.233783721923828, "global_step": 75931, "epoch": 451} {"train_loss": -9.030803680419922, "global_step": 75932, "epoch": 451} {"train_loss": -8.8756103515625, "global_step": 75933, "epoch": 451} {"train_loss": -9.214770317077637, "global_step": 75934, "epoch": 451} {"train_loss": -9.088055604980106, "global_step": 75935, "epoch": 451, "val_loss": 194331.8125} {"train_loss": -9.057266235351562, "global_step": 75936, "epoch": 452} {"train_loss": -9.221630096435547, "global_step": 75937, "epoch": 452} {"train_loss": -9.2315034866333, "global_step": 75938, "epoch": 452} {"train_loss": -9.170064926147461, "global_step": 75939, "epoch": 452} {"train_loss": -9.315008163452148, "global_step": 75940, "epoch": 452} {"train_loss": -9.248727798461914, "global_step": 75941, "epoch": 452} {"train_loss": -9.022940635681152, "global_step": 75942, "epoch": 452} {"train_loss": -9.358221054077148, "global_step": 75943, "epoch": 452} {"train_loss": -9.048959732055664, "global_step": 75944, "epoch": 452} {"train_loss": -9.203960418701172, "global_step": 75945, "epoch": 452} {"train_loss": -9.2907075881958, "global_step": 75946, "epoch": 452} {"train_loss": -9.248482704162598, "global_step": 75947, "epoch": 452} {"train_loss": -9.334157943725586, "global_step": 75948, "epoch": 452} {"train_loss": -9.212539672851562, "global_step": 75949, "epoch": 452} {"train_loss": -9.375006675720215, "global_step": 75950, "epoch": 452} {"train_loss": -9.370492935180664, "global_step": 75951, "epoch": 452} {"train_loss": -9.147026062011719, "global_step": 75952, "epoch": 452} {"train_loss": -9.39989948272705, "global_step": 75953, "epoch": 452} {"train_loss": -9.268004417419434, "global_step": 75954, "epoch": 452} {"train_loss": -9.217119216918945, "global_step": 75955, "epoch": 452} {"train_loss": -9.426565170288086, "global_step": 75956, "epoch": 452} {"train_loss": -9.094430923461914, "global_step": 75957, "epoch": 452} {"train_loss": -9.370451927185059, "global_step": 75958, "epoch": 452} {"train_loss": -9.01164436340332, "global_step": 75959, "epoch": 452} {"train_loss": -9.079517364501953, "global_step": 75960, "epoch": 452} {"train_loss": -9.140110969543457, "global_step": 75961, "epoch": 452} {"train_loss": -9.339056968688965, "global_step": 75962, "epoch": 452} {"train_loss": -9.399407386779785, "global_step": 75963, "epoch": 452} {"train_loss": -9.383583068847656, "global_step": 75964, "epoch": 452} {"train_loss": -9.369094848632812, "global_step": 75965, "epoch": 452} {"train_loss": -9.253076553344727, "global_step": 75966, "epoch": 452} {"train_loss": -9.04054069519043, "global_step": 75967, "epoch": 452} {"train_loss": -9.103700637817383, "global_step": 75968, "epoch": 452} {"train_loss": -9.097763061523438, "global_step": 75969, "epoch": 452} {"train_loss": -8.929189682006836, "global_step": 75970, "epoch": 452} {"train_loss": -9.075482368469238, "global_step": 75971, "epoch": 452} {"train_loss": -8.942032814025879, "global_step": 75972, "epoch": 452} {"train_loss": -8.942211151123047, "global_step": 75973, "epoch": 452} {"train_loss": -8.62735366821289, "global_step": 75974, "epoch": 452} {"train_loss": -9.240579605102539, "global_step": 75975, "epoch": 452} {"train_loss": -8.665964126586914, "global_step": 75976, "epoch": 452} {"train_loss": -9.09316635131836, "global_step": 75977, "epoch": 452} {"train_loss": -9.069244384765625, "global_step": 75978, "epoch": 452} {"train_loss": -8.788664817810059, "global_step": 75979, "epoch": 452} {"train_loss": -8.932645797729492, "global_step": 75980, "epoch": 452} {"train_loss": -8.687339782714844, "global_step": 75981, "epoch": 452} {"train_loss": -9.229360580444336, "global_step": 75982, "epoch": 452} {"train_loss": -8.661032676696777, "global_step": 75983, "epoch": 452} {"train_loss": -8.887112617492676, "global_step": 75984, "epoch": 452} {"train_loss": -9.014055252075195, "global_step": 75985, "epoch": 452} {"train_loss": -8.881938934326172, "global_step": 75986, "epoch": 452} {"train_loss": -8.854341506958008, "global_step": 75987, "epoch": 452} {"train_loss": -9.18613052368164, "global_step": 75988, "epoch": 452} {"train_loss": -9.099624633789062, "global_step": 75989, "epoch": 452} {"train_loss": -9.110061645507812, "global_step": 75990, "epoch": 452} {"train_loss": -9.197021484375, "global_step": 75991, "epoch": 452} {"train_loss": -8.754781723022461, "global_step": 75992, "epoch": 452} {"train_loss": -9.175825119018555, "global_step": 75993, "epoch": 452} {"train_loss": -9.016510963439941, "global_step": 75994, "epoch": 452} {"train_loss": -9.25083065032959, "global_step": 75995, "epoch": 452} {"train_loss": -9.02696418762207, "global_step": 75996, "epoch": 452} {"train_loss": -9.229145050048828, "global_step": 75997, "epoch": 452} {"train_loss": -9.210582733154297, "global_step": 75998, "epoch": 452} {"train_loss": -9.29792308807373, "global_step": 75999, "epoch": 452} {"train_loss": -9.25328254699707, "global_step": 76000, "epoch": 452} {"train_loss": -9.29629898071289, "global_step": 76001, "epoch": 452} {"train_loss": -9.075567245483398, "global_step": 76002, "epoch": 452} {"train_loss": -9.374174118041992, "global_step": 76003, "epoch": 452} {"train_loss": -8.90488338470459, "global_step": 76004, "epoch": 452} {"train_loss": -9.041452407836914, "global_step": 76005, "epoch": 452} {"train_loss": -9.27232551574707, "global_step": 76006, "epoch": 452} {"train_loss": -9.120702743530273, "global_step": 76007, "epoch": 452} {"train_loss": -9.159236907958984, "global_step": 76008, "epoch": 452} {"train_loss": -9.106042861938477, "global_step": 76009, "epoch": 452} {"train_loss": -9.347698211669922, "global_step": 76010, "epoch": 452} {"train_loss": -8.867904663085938, "global_step": 76011, "epoch": 452} {"train_loss": -9.174436569213867, "global_step": 76012, "epoch": 452} {"train_loss": -9.107254028320312, "global_step": 76013, "epoch": 452} {"train_loss": -9.163540840148926, "global_step": 76014, "epoch": 452} {"train_loss": -9.24160385131836, "global_step": 76015, "epoch": 452} {"train_loss": -8.937633514404297, "global_step": 76016, "epoch": 452} {"train_loss": -9.125167846679688, "global_step": 76017, "epoch": 452} {"train_loss": -9.276311874389648, "global_step": 76018, "epoch": 452} {"train_loss": -9.310647964477539, "global_step": 76019, "epoch": 452} {"train_loss": -9.341421127319336, "global_step": 76020, "epoch": 452} {"train_loss": -8.912118911743164, "global_step": 76021, "epoch": 452} {"train_loss": -9.049833297729492, "global_step": 76022, "epoch": 452} {"train_loss": -9.124503135681152, "global_step": 76023, "epoch": 452} {"train_loss": -9.133733749389648, "global_step": 76024, "epoch": 452} {"train_loss": -9.12826919555664, "global_step": 76025, "epoch": 452} {"train_loss": -9.020739555358887, "global_step": 76026, "epoch": 452} {"train_loss": -9.197848320007324, "global_step": 76027, "epoch": 452} {"train_loss": -9.035018920898438, "global_step": 76028, "epoch": 452} {"train_loss": -9.114727020263672, "global_step": 76029, "epoch": 452} {"train_loss": -9.15381145477295, "global_step": 76030, "epoch": 452} {"train_loss": -9.005066871643066, "global_step": 76031, "epoch": 452} {"train_loss": -9.136394500732422, "global_step": 76032, "epoch": 452} {"train_loss": -9.400126457214355, "global_step": 76033, "epoch": 452} {"train_loss": -9.205493927001953, "global_step": 76034, "epoch": 452} {"train_loss": -9.174251556396484, "global_step": 76035, "epoch": 452} {"train_loss": -9.066587448120117, "global_step": 76036, "epoch": 452} {"train_loss": -9.192877769470215, "global_step": 76037, "epoch": 452} {"train_loss": -9.076925277709961, "global_step": 76038, "epoch": 452} {"train_loss": -9.241657257080078, "global_step": 76039, "epoch": 452} {"train_loss": -9.222919464111328, "global_step": 76040, "epoch": 452} {"train_loss": -9.484935760498047, "global_step": 76041, "epoch": 452} {"train_loss": -9.302075386047363, "global_step": 76042, "epoch": 452} {"train_loss": -9.275419235229492, "global_step": 76043, "epoch": 452} {"train_loss": -9.195836067199707, "global_step": 76044, "epoch": 452} {"train_loss": -9.211690902709961, "global_step": 76045, "epoch": 452} {"train_loss": -9.15591812133789, "global_step": 76046, "epoch": 452} {"train_loss": -8.747384071350098, "global_step": 76047, "epoch": 452} {"train_loss": -9.327994346618652, "global_step": 76048, "epoch": 452} {"train_loss": -8.720572471618652, "global_step": 76049, "epoch": 452} {"train_loss": -9.223091125488281, "global_step": 76050, "epoch": 452} {"train_loss": -8.770509719848633, "global_step": 76051, "epoch": 452} {"train_loss": -8.838486671447754, "global_step": 76052, "epoch": 452} {"train_loss": -8.61410140991211, "global_step": 76053, "epoch": 452} {"train_loss": -9.065332412719727, "global_step": 76054, "epoch": 452} {"train_loss": -8.749029159545898, "global_step": 76055, "epoch": 452} {"train_loss": -8.884994506835938, "global_step": 76056, "epoch": 452} {"train_loss": -8.5989990234375, "global_step": 76057, "epoch": 452} {"train_loss": -9.049118995666504, "global_step": 76058, "epoch": 452} {"train_loss": -8.970111846923828, "global_step": 76059, "epoch": 452} {"train_loss": -9.116403579711914, "global_step": 76060, "epoch": 452} {"train_loss": -8.958187103271484, "global_step": 76061, "epoch": 452} {"train_loss": -9.088205337524414, "global_step": 76062, "epoch": 452} {"train_loss": -8.872743606567383, "global_step": 76063, "epoch": 452} {"train_loss": -9.002365112304688, "global_step": 76064, "epoch": 452} {"train_loss": -9.219659805297852, "global_step": 76065, "epoch": 452} {"train_loss": -8.757851600646973, "global_step": 76066, "epoch": 452} {"train_loss": -8.875040054321289, "global_step": 76067, "epoch": 452} {"train_loss": -9.197320938110352, "global_step": 76068, "epoch": 452} {"train_loss": -9.176168441772461, "global_step": 76069, "epoch": 452} {"train_loss": -9.197790145874023, "global_step": 76070, "epoch": 452} {"train_loss": -9.057668685913086, "global_step": 76071, "epoch": 452} {"train_loss": -9.313820838928223, "global_step": 76072, "epoch": 452} {"train_loss": -9.233043670654297, "global_step": 76073, "epoch": 452} {"train_loss": -9.204558372497559, "global_step": 76074, "epoch": 452} {"train_loss": -9.03984260559082, "global_step": 76075, "epoch": 452} {"train_loss": -9.128423690795898, "global_step": 76076, "epoch": 452} {"train_loss": -8.989577293395996, "global_step": 76077, "epoch": 452} {"train_loss": -9.267498016357422, "global_step": 76078, "epoch": 452} {"train_loss": -9.03587532043457, "global_step": 76079, "epoch": 452} {"train_loss": -9.268230438232422, "global_step": 76080, "epoch": 452} {"train_loss": -8.954099655151367, "global_step": 76081, "epoch": 452} {"train_loss": -9.252910614013672, "global_step": 76082, "epoch": 452} {"train_loss": -8.847248077392578, "global_step": 76083, "epoch": 452} {"train_loss": -9.311727523803711, "global_step": 76084, "epoch": 452} {"train_loss": -8.801066398620605, "global_step": 76085, "epoch": 452} {"train_loss": -9.186351776123047, "global_step": 76086, "epoch": 452} {"train_loss": -8.726314544677734, "global_step": 76087, "epoch": 452} {"train_loss": -9.015663146972656, "global_step": 76088, "epoch": 452} {"train_loss": -9.110982894897461, "global_step": 76089, "epoch": 452} {"train_loss": -8.674922943115234, "global_step": 76090, "epoch": 452} {"train_loss": -9.253905296325684, "global_step": 76091, "epoch": 452} {"train_loss": -8.984404563903809, "global_step": 76092, "epoch": 452} {"train_loss": -9.177896499633789, "global_step": 76093, "epoch": 452} {"train_loss": -9.08127212524414, "global_step": 76094, "epoch": 452} {"train_loss": -9.199358940124512, "global_step": 76095, "epoch": 452} {"train_loss": -9.068772315979004, "global_step": 76096, "epoch": 452} {"train_loss": -9.114774703979492, "global_step": 76097, "epoch": 452} {"train_loss": -8.954428672790527, "global_step": 76098, "epoch": 452} {"train_loss": -9.059194564819336, "global_step": 76099, "epoch": 452} {"train_loss": -9.361361503601074, "global_step": 76100, "epoch": 452} {"train_loss": -9.07144546508789, "global_step": 76101, "epoch": 452} {"train_loss": -9.244321823120117, "global_step": 76102, "epoch": 452} {"train_loss": -9.10650026230585, "global_step": 76103, "epoch": 452, "val_loss": 196013.078125} {"train_loss": -8.915388107299805, "global_step": 76104, "epoch": 453} {"train_loss": -8.915730476379395, "global_step": 76105, "epoch": 453} {"train_loss": -9.297712326049805, "global_step": 76106, "epoch": 453} {"train_loss": -9.330160140991211, "global_step": 76107, "epoch": 453} {"train_loss": -9.257431983947754, "global_step": 76108, "epoch": 453} {"train_loss": -8.89926815032959, "global_step": 76109, "epoch": 453} {"train_loss": -9.192301750183105, "global_step": 76110, "epoch": 453} {"train_loss": -9.356414794921875, "global_step": 76111, "epoch": 453} {"train_loss": -9.148604393005371, "global_step": 76112, "epoch": 453} {"train_loss": -9.201473236083984, "global_step": 76113, "epoch": 453} {"train_loss": -8.945799827575684, "global_step": 76114, "epoch": 453} {"train_loss": -9.39271354675293, "global_step": 76115, "epoch": 453} {"train_loss": -8.992015838623047, "global_step": 76116, "epoch": 453} {"train_loss": -9.013811111450195, "global_step": 76117, "epoch": 453} {"train_loss": -9.082666397094727, "global_step": 76118, "epoch": 453} {"train_loss": -8.710729598999023, "global_step": 76119, "epoch": 453} {"train_loss": -9.097652435302734, "global_step": 76120, "epoch": 453} {"train_loss": -8.974971771240234, "global_step": 76121, "epoch": 453} {"train_loss": -9.150106430053711, "global_step": 76122, "epoch": 453} {"train_loss": -9.072044372558594, "global_step": 76123, "epoch": 453} {"train_loss": -9.143844604492188, "global_step": 76124, "epoch": 453} {"train_loss": -9.015317916870117, "global_step": 76125, "epoch": 453} {"train_loss": -9.228309631347656, "global_step": 76126, "epoch": 453} {"train_loss": -9.035219192504883, "global_step": 76127, "epoch": 453} {"train_loss": -9.06010913848877, "global_step": 76128, "epoch": 453} {"train_loss": -9.070392608642578, "global_step": 76129, "epoch": 453} {"train_loss": -9.162467956542969, "global_step": 76130, "epoch": 453} {"train_loss": -9.036416053771973, "global_step": 76131, "epoch": 453} {"train_loss": -9.14314079284668, "global_step": 76132, "epoch": 453} {"train_loss": -8.961687088012695, "global_step": 76133, "epoch": 453} {"train_loss": -8.948756217956543, "global_step": 76134, "epoch": 453} {"train_loss": -9.12751579284668, "global_step": 76135, "epoch": 453} {"train_loss": -8.939663887023926, "global_step": 76136, "epoch": 453} {"train_loss": -9.248247146606445, "global_step": 76137, "epoch": 453} {"train_loss": -9.260893821716309, "global_step": 76138, "epoch": 453} {"train_loss": -9.381196022033691, "global_step": 76139, "epoch": 453} {"train_loss": -9.065255165100098, "global_step": 76140, "epoch": 453} {"train_loss": -9.323195457458496, "global_step": 76141, "epoch": 453} {"train_loss": -9.042869567871094, "global_step": 76142, "epoch": 453} {"train_loss": -8.904678344726562, "global_step": 76143, "epoch": 453} {"train_loss": -9.156879425048828, "global_step": 76144, "epoch": 453} {"train_loss": -9.135032653808594, "global_step": 76145, "epoch": 453} {"train_loss": -9.067293167114258, "global_step": 76146, "epoch": 453} {"train_loss": -9.17831039428711, "global_step": 76147, "epoch": 453} {"train_loss": -9.240901947021484, "global_step": 76148, "epoch": 453} {"train_loss": -9.136449813842773, "global_step": 76149, "epoch": 453} {"train_loss": -9.267317771911621, "global_step": 76150, "epoch": 453} {"train_loss": -9.295987129211426, "global_step": 76151, "epoch": 453} {"train_loss": -9.131349563598633, "global_step": 76152, "epoch": 453} {"train_loss": -9.228546142578125, "global_step": 76153, "epoch": 453} {"train_loss": -9.103399276733398, "global_step": 76154, "epoch": 453} {"train_loss": -8.994553565979004, "global_step": 76155, "epoch": 453} {"train_loss": -9.081395149230957, "global_step": 76156, "epoch": 453} {"train_loss": -9.176433563232422, "global_step": 76157, "epoch": 453} {"train_loss": -8.885590553283691, "global_step": 76158, "epoch": 453} {"train_loss": -9.040714263916016, "global_step": 76159, "epoch": 453} {"train_loss": -9.073436737060547, "global_step": 76160, "epoch": 453} {"train_loss": -9.255263328552246, "global_step": 76161, "epoch": 453} {"train_loss": -9.039262771606445, "global_step": 76162, "epoch": 453} {"train_loss": -9.09527587890625, "global_step": 76163, "epoch": 453} {"train_loss": -8.859809875488281, "global_step": 76164, "epoch": 453} {"train_loss": -9.19827651977539, "global_step": 76165, "epoch": 453} {"train_loss": -9.185688018798828, "global_step": 76166, "epoch": 453} {"train_loss": -9.194093704223633, "global_step": 76167, "epoch": 453} {"train_loss": -9.318939208984375, "global_step": 76168, "epoch": 453} {"train_loss": -9.057779312133789, "global_step": 76169, "epoch": 453} {"train_loss": -8.80413818359375, "global_step": 76170, "epoch": 453} {"train_loss": -8.843947410583496, "global_step": 76171, "epoch": 453} {"train_loss": -9.02528190612793, "global_step": 76172, "epoch": 453} {"train_loss": -9.005481719970703, "global_step": 76173, "epoch": 453} {"train_loss": -8.990909576416016, "global_step": 76174, "epoch": 453} {"train_loss": -9.174202919006348, "global_step": 76175, "epoch": 453} {"train_loss": -9.078714370727539, "global_step": 76176, "epoch": 453} {"train_loss": -8.9266357421875, "global_step": 76177, "epoch": 453} {"train_loss": -9.066625595092773, "global_step": 76178, "epoch": 453} {"train_loss": -9.008209228515625, "global_step": 76179, "epoch": 453} {"train_loss": -8.948633193969727, "global_step": 76180, "epoch": 453} {"train_loss": -9.113725662231445, "global_step": 76181, "epoch": 453} {"train_loss": -8.922649383544922, "global_step": 76182, "epoch": 453} {"train_loss": -8.986452102661133, "global_step": 76183, "epoch": 453} {"train_loss": -9.106635093688965, "global_step": 76184, "epoch": 453} {"train_loss": -9.1192626953125, "global_step": 76185, "epoch": 453} {"train_loss": -9.161507606506348, "global_step": 76186, "epoch": 453} {"train_loss": -9.161056518554688, "global_step": 76187, "epoch": 453} {"train_loss": -9.332817077636719, "global_step": 76188, "epoch": 453} {"train_loss": -9.205379486083984, "global_step": 76189, "epoch": 453} {"train_loss": -9.205046653747559, "global_step": 76190, "epoch": 453} {"train_loss": -9.127781867980957, "global_step": 76191, "epoch": 453} {"train_loss": -8.954303741455078, "global_step": 76192, "epoch": 453} {"train_loss": -9.03689193725586, "global_step": 76193, "epoch": 453} {"train_loss": -9.148183822631836, "global_step": 76194, "epoch": 453} {"train_loss": -9.174522399902344, "global_step": 76195, "epoch": 453} {"train_loss": -9.336341857910156, "global_step": 76196, "epoch": 453} {"train_loss": -9.16583251953125, "global_step": 76197, "epoch": 453} {"train_loss": -9.319854736328125, "global_step": 76198, "epoch": 453} {"train_loss": -9.092578887939453, "global_step": 76199, "epoch": 453} {"train_loss": -9.271343231201172, "global_step": 76200, "epoch": 453} {"train_loss": -9.173999786376953, "global_step": 76201, "epoch": 453} {"train_loss": -9.036038398742676, "global_step": 76202, "epoch": 453} {"train_loss": -8.998231887817383, "global_step": 76203, "epoch": 453} {"train_loss": -9.212172508239746, "global_step": 76204, "epoch": 453} {"train_loss": -9.166149139404297, "global_step": 76205, "epoch": 453} {"train_loss": -9.447680473327637, "global_step": 76206, "epoch": 453} {"train_loss": -9.052757263183594, "global_step": 76207, "epoch": 453} {"train_loss": -9.245052337646484, "global_step": 76208, "epoch": 453} {"train_loss": -9.239267349243164, "global_step": 76209, "epoch": 453} {"train_loss": -9.088033676147461, "global_step": 76210, "epoch": 453} {"train_loss": -9.054264068603516, "global_step": 76211, "epoch": 453} {"train_loss": -8.962146759033203, "global_step": 76212, "epoch": 453} {"train_loss": -9.076509475708008, "global_step": 76213, "epoch": 453} {"train_loss": -8.97947883605957, "global_step": 76214, "epoch": 453} {"train_loss": -9.184814453125, "global_step": 76215, "epoch": 453} {"train_loss": -9.141236305236816, "global_step": 76216, "epoch": 453} {"train_loss": -8.960827827453613, "global_step": 76217, "epoch": 453} {"train_loss": -9.166963577270508, "global_step": 76218, "epoch": 453} {"train_loss": -8.894107818603516, "global_step": 76219, "epoch": 453} {"train_loss": -9.356171607971191, "global_step": 76220, "epoch": 453} {"train_loss": -9.0792236328125, "global_step": 76221, "epoch": 453} {"train_loss": -9.326034545898438, "global_step": 76222, "epoch": 453} {"train_loss": -9.378641128540039, "global_step": 76223, "epoch": 453} {"train_loss": -9.32194709777832, "global_step": 76224, "epoch": 453} {"train_loss": -9.06105899810791, "global_step": 76225, "epoch": 453} {"train_loss": -9.358978271484375, "global_step": 76226, "epoch": 453} {"train_loss": -9.324914932250977, "global_step": 76227, "epoch": 453} {"train_loss": -9.255298614501953, "global_step": 76228, "epoch": 453} {"train_loss": -9.425928115844727, "global_step": 76229, "epoch": 453} {"train_loss": -8.891548156738281, "global_step": 76230, "epoch": 453} {"train_loss": -9.162790298461914, "global_step": 76231, "epoch": 453} {"train_loss": -9.368756294250488, "global_step": 76232, "epoch": 453} {"train_loss": -9.309600830078125, "global_step": 76233, "epoch": 453} {"train_loss": -9.133160591125488, "global_step": 76234, "epoch": 453} {"train_loss": -9.219016075134277, "global_step": 76235, "epoch": 453} {"train_loss": -9.262543678283691, "global_step": 76236, "epoch": 453} {"train_loss": -9.424884796142578, "global_step": 76237, "epoch": 453} {"train_loss": -9.184213638305664, "global_step": 76238, "epoch": 453} {"train_loss": -9.075241088867188, "global_step": 76239, "epoch": 453} {"train_loss": -9.31325912475586, "global_step": 76240, "epoch": 453} {"train_loss": -9.258367538452148, "global_step": 76241, "epoch": 453} {"train_loss": -9.019937515258789, "global_step": 76242, "epoch": 453} {"train_loss": -9.06197452545166, "global_step": 76243, "epoch": 453} {"train_loss": -9.217116355895996, "global_step": 76244, "epoch": 453} {"train_loss": -9.084707260131836, "global_step": 76245, "epoch": 453} {"train_loss": -8.912443161010742, "global_step": 76246, "epoch": 453} {"train_loss": -9.008787155151367, "global_step": 76247, "epoch": 453} {"train_loss": -9.184171676635742, "global_step": 76248, "epoch": 453} {"train_loss": -8.97940444946289, "global_step": 76249, "epoch": 453} {"train_loss": -9.086614608764648, "global_step": 76250, "epoch": 453} {"train_loss": -9.189712524414062, "global_step": 76251, "epoch": 453} {"train_loss": -9.198400497436523, "global_step": 76252, "epoch": 453} {"train_loss": -9.137748718261719, "global_step": 76253, "epoch": 453} {"train_loss": -9.364720344543457, "global_step": 76254, "epoch": 453} {"train_loss": -9.08021354675293, "global_step": 76255, "epoch": 453} {"train_loss": -9.087459564208984, "global_step": 76256, "epoch": 453} {"train_loss": -9.320850372314453, "global_step": 76257, "epoch": 453} {"train_loss": -8.951616287231445, "global_step": 76258, "epoch": 453} {"train_loss": -8.88758659362793, "global_step": 76259, "epoch": 453} {"train_loss": -9.100217819213867, "global_step": 76260, "epoch": 453} {"train_loss": -9.011407852172852, "global_step": 76261, "epoch": 453} {"train_loss": -9.123615264892578, "global_step": 76262, "epoch": 453} {"train_loss": -9.062065124511719, "global_step": 76263, "epoch": 453} {"train_loss": -9.190939903259277, "global_step": 76264, "epoch": 453} {"train_loss": -8.943227767944336, "global_step": 76265, "epoch": 453} {"train_loss": -8.94955062866211, "global_step": 76266, "epoch": 453} {"train_loss": -9.072854995727539, "global_step": 76267, "epoch": 453} {"train_loss": -8.89062213897705, "global_step": 76268, "epoch": 453} {"train_loss": -8.825082778930664, "global_step": 76269, "epoch": 453} {"train_loss": -8.917315483093262, "global_step": 76270, "epoch": 453} {"train_loss": -9.117027350834437, "global_step": 76271, "epoch": 453, "val_loss": 196087.5} {"train_loss": -8.689977645874023, "global_step": 76272, "epoch": 454} {"train_loss": -9.040372848510742, "global_step": 76273, "epoch": 454} {"train_loss": -8.797527313232422, "global_step": 76274, "epoch": 454} {"train_loss": -9.222509384155273, "global_step": 76275, "epoch": 454} {"train_loss": -9.018594741821289, "global_step": 76276, "epoch": 454} {"train_loss": -9.173456192016602, "global_step": 76277, "epoch": 454} {"train_loss": -9.0873441696167, "global_step": 76278, "epoch": 454} {"train_loss": -9.208030700683594, "global_step": 76279, "epoch": 454} {"train_loss": -9.065433502197266, "global_step": 76280, "epoch": 454} {"train_loss": -9.026214599609375, "global_step": 76281, "epoch": 454} {"train_loss": -9.189891815185547, "global_step": 76282, "epoch": 454} {"train_loss": -8.998786926269531, "global_step": 76283, "epoch": 454} {"train_loss": -9.243673324584961, "global_step": 76284, "epoch": 454} {"train_loss": -9.13018798828125, "global_step": 76285, "epoch": 454} {"train_loss": -9.298076629638672, "global_step": 76286, "epoch": 454} {"train_loss": -9.338312149047852, "global_step": 76287, "epoch": 454} {"train_loss": -9.117948532104492, "global_step": 76288, "epoch": 454} {"train_loss": -9.249340057373047, "global_step": 76289, "epoch": 454} {"train_loss": -9.097210884094238, "global_step": 76290, "epoch": 454} {"train_loss": -9.221380233764648, "global_step": 76291, "epoch": 454} {"train_loss": -9.310802459716797, "global_step": 76292, "epoch": 454} {"train_loss": -8.968437194824219, "global_step": 76293, "epoch": 454} {"train_loss": -9.161934852600098, "global_step": 76294, "epoch": 454} {"train_loss": -8.7511568069458, "global_step": 76295, "epoch": 454} {"train_loss": -9.111882209777832, "global_step": 76296, "epoch": 454} {"train_loss": -9.244384765625, "global_step": 76297, "epoch": 454} {"train_loss": -8.774017333984375, "global_step": 76298, "epoch": 454} {"train_loss": -9.190771102905273, "global_step": 76299, "epoch": 454} {"train_loss": -8.847537994384766, "global_step": 76300, "epoch": 454} {"train_loss": -8.944324493408203, "global_step": 76301, "epoch": 454} {"train_loss": -9.0447416305542, "global_step": 76302, "epoch": 454} {"train_loss": -9.112048149108887, "global_step": 76303, "epoch": 454} {"train_loss": -8.981298446655273, "global_step": 76304, "epoch": 454} {"train_loss": -8.926897048950195, "global_step": 76305, "epoch": 454} {"train_loss": -9.17908000946045, "global_step": 76306, "epoch": 454} {"train_loss": -8.965210914611816, "global_step": 76307, "epoch": 454} {"train_loss": -9.17341423034668, "global_step": 76308, "epoch": 454} {"train_loss": -9.26858139038086, "global_step": 76309, "epoch": 454} {"train_loss": -8.76127815246582, "global_step": 76310, "epoch": 454} {"train_loss": -9.124166488647461, "global_step": 76311, "epoch": 454} {"train_loss": -8.937820434570312, "global_step": 76312, "epoch": 454} {"train_loss": -8.825236320495605, "global_step": 76313, "epoch": 454} {"train_loss": -8.97414493560791, "global_step": 76314, "epoch": 454} {"train_loss": -9.150724411010742, "global_step": 76315, "epoch": 454} {"train_loss": -9.210027694702148, "global_step": 76316, "epoch": 454} {"train_loss": -9.158618927001953, "global_step": 76317, "epoch": 454} {"train_loss": -9.261775970458984, "global_step": 76318, "epoch": 454} {"train_loss": -9.307907104492188, "global_step": 76319, "epoch": 454} {"train_loss": -8.722763061523438, "global_step": 76320, "epoch": 454} {"train_loss": -9.33572006225586, "global_step": 76321, "epoch": 454} {"train_loss": -8.78439998626709, "global_step": 76322, "epoch": 454} {"train_loss": -9.192618370056152, "global_step": 76323, "epoch": 454} {"train_loss": -9.112839698791504, "global_step": 76324, "epoch": 454} {"train_loss": -9.065770149230957, "global_step": 76325, "epoch": 454} {"train_loss": -9.21534538269043, "global_step": 76326, "epoch": 454} {"train_loss": -8.87049674987793, "global_step": 76327, "epoch": 454} {"train_loss": -9.268535614013672, "global_step": 76328, "epoch": 454} {"train_loss": -8.972800254821777, "global_step": 76329, "epoch": 454} {"train_loss": -8.916375160217285, "global_step": 76330, "epoch": 454} {"train_loss": -9.199752807617188, "global_step": 76331, "epoch": 454} {"train_loss": -8.73201847076416, "global_step": 76332, "epoch": 454} {"train_loss": -9.104551315307617, "global_step": 76333, "epoch": 454} {"train_loss": -8.94122314453125, "global_step": 76334, "epoch": 454} {"train_loss": -9.11794662475586, "global_step": 76335, "epoch": 454} {"train_loss": -9.156749725341797, "global_step": 76336, "epoch": 454} {"train_loss": -8.959489822387695, "global_step": 76337, "epoch": 454} {"train_loss": -8.9478759765625, "global_step": 76338, "epoch": 454} {"train_loss": -9.197379112243652, "global_step": 76339, "epoch": 454} {"train_loss": -9.327219009399414, "global_step": 76340, "epoch": 454} {"train_loss": -8.918608665466309, "global_step": 76341, "epoch": 454} {"train_loss": -9.196067810058594, "global_step": 76342, "epoch": 454} {"train_loss": -8.762735366821289, "global_step": 76343, "epoch": 454} {"train_loss": -9.036428451538086, "global_step": 76344, "epoch": 454} {"train_loss": -8.977185249328613, "global_step": 76345, "epoch": 454} {"train_loss": -8.802820205688477, "global_step": 76346, "epoch": 454} {"train_loss": -9.287981986999512, "global_step": 76347, "epoch": 454} {"train_loss": -9.113996505737305, "global_step": 76348, "epoch": 454} {"train_loss": -9.08833122253418, "global_step": 76349, "epoch": 454} {"train_loss": -9.089420318603516, "global_step": 76350, "epoch": 454} {"train_loss": -9.056941986083984, "global_step": 76351, "epoch": 454} {"train_loss": -8.579917907714844, "global_step": 76352, "epoch": 454} {"train_loss": -9.175453186035156, "global_step": 76353, "epoch": 454} {"train_loss": -8.751154899597168, "global_step": 76354, "epoch": 454} {"train_loss": -9.156133651733398, "global_step": 76355, "epoch": 454} {"train_loss": -9.108793258666992, "global_step": 76356, "epoch": 454} {"train_loss": -8.812488555908203, "global_step": 76357, "epoch": 454} {"train_loss": -9.199873924255371, "global_step": 76358, "epoch": 454} {"train_loss": -9.167468070983887, "global_step": 76359, "epoch": 454} {"train_loss": -9.052255630493164, "global_step": 76360, "epoch": 454} {"train_loss": -8.959003448486328, "global_step": 76361, "epoch": 454} {"train_loss": -9.04309368133545, "global_step": 76362, "epoch": 454} {"train_loss": -9.143204689025879, "global_step": 76363, "epoch": 454} {"train_loss": -9.197205543518066, "global_step": 76364, "epoch": 454} {"train_loss": -9.419426918029785, "global_step": 76365, "epoch": 454} {"train_loss": -9.232873916625977, "global_step": 76366, "epoch": 454} {"train_loss": -9.158318519592285, "global_step": 76367, "epoch": 454} {"train_loss": -9.260404586791992, "global_step": 76368, "epoch": 454} {"train_loss": -9.210116386413574, "global_step": 76369, "epoch": 454} {"train_loss": -9.1281099319458, "global_step": 76370, "epoch": 454} {"train_loss": -9.144649505615234, "global_step": 76371, "epoch": 454} {"train_loss": -9.041107177734375, "global_step": 76372, "epoch": 454} {"train_loss": -9.144922256469727, "global_step": 76373, "epoch": 454} {"train_loss": -9.168546676635742, "global_step": 76374, "epoch": 454} {"train_loss": -9.454549789428711, "global_step": 76375, "epoch": 454} {"train_loss": -9.122930526733398, "global_step": 76376, "epoch": 454} {"train_loss": -9.228521347045898, "global_step": 76377, "epoch": 454} {"train_loss": -9.40716552734375, "global_step": 76378, "epoch": 454} {"train_loss": -9.203843116760254, "global_step": 76379, "epoch": 454} {"train_loss": -9.204805374145508, "global_step": 76380, "epoch": 454} {"train_loss": -9.478944778442383, "global_step": 76381, "epoch": 454} {"train_loss": -9.4088134765625, "global_step": 76382, "epoch": 454} {"train_loss": -9.071544647216797, "global_step": 76383, "epoch": 454} {"train_loss": -9.231788635253906, "global_step": 76384, "epoch": 454} {"train_loss": -9.264345169067383, "global_step": 76385, "epoch": 454} {"train_loss": -8.608358383178711, "global_step": 76386, "epoch": 454} {"train_loss": -8.774177551269531, "global_step": 76387, "epoch": 454} {"train_loss": -8.886316299438477, "global_step": 76388, "epoch": 454} {"train_loss": -8.79914665222168, "global_step": 76389, "epoch": 454} {"train_loss": -9.036565780639648, "global_step": 76390, "epoch": 454} {"train_loss": -8.865649223327637, "global_step": 76391, "epoch": 454} {"train_loss": -9.279088973999023, "global_step": 76392, "epoch": 454} {"train_loss": -8.92304515838623, "global_step": 76393, "epoch": 454} {"train_loss": -8.896081924438477, "global_step": 76394, "epoch": 454} {"train_loss": -8.888693809509277, "global_step": 76395, "epoch": 454} {"train_loss": -9.007577896118164, "global_step": 76396, "epoch": 454} {"train_loss": -8.895027160644531, "global_step": 76397, "epoch": 454} {"train_loss": -9.039961814880371, "global_step": 76398, "epoch": 454} {"train_loss": -8.940740585327148, "global_step": 76399, "epoch": 454} {"train_loss": -9.024175643920898, "global_step": 76400, "epoch": 454} {"train_loss": -8.988656044006348, "global_step": 76401, "epoch": 454} {"train_loss": -8.916168212890625, "global_step": 76402, "epoch": 454} {"train_loss": -9.060906410217285, "global_step": 76403, "epoch": 454} {"train_loss": -9.119762420654297, "global_step": 76404, "epoch": 454} {"train_loss": -8.96656608581543, "global_step": 76405, "epoch": 454} {"train_loss": -9.00157642364502, "global_step": 76406, "epoch": 454} {"train_loss": -8.950765609741211, "global_step": 76407, "epoch": 454} {"train_loss": -9.148482322692871, "global_step": 76408, "epoch": 454} {"train_loss": -8.76188850402832, "global_step": 76409, "epoch": 454} {"train_loss": -9.014771461486816, "global_step": 76410, "epoch": 454} {"train_loss": -8.7491455078125, "global_step": 76411, "epoch": 454} {"train_loss": -8.984667778015137, "global_step": 76412, "epoch": 454} {"train_loss": -9.092418670654297, "global_step": 76413, "epoch": 454} {"train_loss": -8.887824058532715, "global_step": 76414, "epoch": 454} {"train_loss": -8.970672607421875, "global_step": 76415, "epoch": 454} {"train_loss": -9.181568145751953, "global_step": 76416, "epoch": 454} {"train_loss": -8.981740951538086, "global_step": 76417, "epoch": 454} {"train_loss": -9.191963195800781, "global_step": 76418, "epoch": 454} {"train_loss": -8.962440490722656, "global_step": 76419, "epoch": 454} {"train_loss": -8.989748001098633, "global_step": 76420, "epoch": 454} {"train_loss": -9.19540023803711, "global_step": 76421, "epoch": 454} {"train_loss": -9.292572975158691, "global_step": 76422, "epoch": 454} {"train_loss": -9.09554386138916, "global_step": 76423, "epoch": 454} {"train_loss": -9.084871292114258, "global_step": 76424, "epoch": 454} {"train_loss": -9.350910186767578, "global_step": 76425, "epoch": 454} {"train_loss": -9.22227668762207, "global_step": 76426, "epoch": 454} {"train_loss": -8.988008499145508, "global_step": 76427, "epoch": 454} {"train_loss": -9.519364356994629, "global_step": 76428, "epoch": 454} {"train_loss": -9.04796028137207, "global_step": 76429, "epoch": 454} {"train_loss": -8.944793701171875, "global_step": 76430, "epoch": 454} {"train_loss": -9.107426643371582, "global_step": 76431, "epoch": 454} {"train_loss": -8.776290893554688, "global_step": 76432, "epoch": 454} {"train_loss": -9.176937103271484, "global_step": 76433, "epoch": 454} {"train_loss": -9.105720520019531, "global_step": 76434, "epoch": 454} {"train_loss": -9.14288330078125, "global_step": 76435, "epoch": 454} {"train_loss": -8.70606517791748, "global_step": 76436, "epoch": 454} {"train_loss": -9.178300857543945, "global_step": 76437, "epoch": 454} {"train_loss": -9.156588554382324, "global_step": 76438, "epoch": 454} {"train_loss": -9.068583244369144, "global_step": 76439, "epoch": 454, "val_loss": 194394.515625} {"train_loss": -9.06264877319336, "global_step": 76440, "epoch": 455} {"train_loss": -9.159151077270508, "global_step": 76441, "epoch": 455} {"train_loss": -9.104021072387695, "global_step": 76442, "epoch": 455} {"train_loss": -8.98564338684082, "global_step": 76443, "epoch": 455} {"train_loss": -9.29358196258545, "global_step": 76444, "epoch": 455} {"train_loss": -9.226414680480957, "global_step": 76445, "epoch": 455} {"train_loss": -9.020235061645508, "global_step": 76446, "epoch": 455} {"train_loss": -9.261907577514648, "global_step": 76447, "epoch": 455} {"train_loss": -9.242439270019531, "global_step": 76448, "epoch": 455} {"train_loss": -9.187848091125488, "global_step": 76449, "epoch": 455} {"train_loss": -9.220634460449219, "global_step": 76450, "epoch": 455} {"train_loss": -9.26333999633789, "global_step": 76451, "epoch": 455} {"train_loss": -8.929861068725586, "global_step": 76452, "epoch": 455} {"train_loss": -8.97096061706543, "global_step": 76453, "epoch": 455} {"train_loss": -9.260564804077148, "global_step": 76454, "epoch": 455} {"train_loss": -8.785677909851074, "global_step": 76455, "epoch": 455} {"train_loss": -9.022104263305664, "global_step": 76456, "epoch": 455} {"train_loss": -9.382669448852539, "global_step": 76457, "epoch": 455} {"train_loss": -9.029029846191406, "global_step": 76458, "epoch": 455} {"train_loss": -9.166528701782227, "global_step": 76459, "epoch": 455} {"train_loss": -9.024171829223633, "global_step": 76460, "epoch": 455} {"train_loss": -8.757553100585938, "global_step": 76461, "epoch": 455} {"train_loss": -9.191157341003418, "global_step": 76462, "epoch": 455} {"train_loss": -8.798279762268066, "global_step": 76463, "epoch": 455} {"train_loss": -9.012622833251953, "global_step": 76464, "epoch": 455} {"train_loss": -9.176946640014648, "global_step": 76465, "epoch": 455} {"train_loss": -8.727673530578613, "global_step": 76466, "epoch": 455} {"train_loss": -9.15305233001709, "global_step": 76467, "epoch": 455} {"train_loss": -9.080024719238281, "global_step": 76468, "epoch": 455} {"train_loss": -8.961159706115723, "global_step": 76469, "epoch": 455} {"train_loss": -9.109916687011719, "global_step": 76470, "epoch": 455} {"train_loss": -9.190290451049805, "global_step": 76471, "epoch": 455} {"train_loss": -9.005224227905273, "global_step": 76472, "epoch": 455} {"train_loss": -9.137497901916504, "global_step": 76473, "epoch": 455} {"train_loss": -9.068117141723633, "global_step": 76474, "epoch": 455} {"train_loss": -9.252496719360352, "global_step": 76475, "epoch": 455} {"train_loss": -9.071124076843262, "global_step": 76476, "epoch": 455} {"train_loss": -9.100234031677246, "global_step": 76477, "epoch": 455} {"train_loss": -9.193893432617188, "global_step": 76478, "epoch": 455} {"train_loss": -9.04309368133545, "global_step": 76479, "epoch": 455} {"train_loss": -9.06485366821289, "global_step": 76480, "epoch": 455} {"train_loss": -8.997617721557617, "global_step": 76481, "epoch": 455} {"train_loss": -8.996337890625, "global_step": 76482, "epoch": 455} {"train_loss": -9.04122543334961, "global_step": 76483, "epoch": 455} {"train_loss": -8.788333892822266, "global_step": 76484, "epoch": 455} {"train_loss": -9.00735855102539, "global_step": 76485, "epoch": 455} {"train_loss": -9.104181289672852, "global_step": 76486, "epoch": 455} {"train_loss": -9.135175704956055, "global_step": 76487, "epoch": 455} {"train_loss": -9.252666473388672, "global_step": 76488, "epoch": 455} {"train_loss": -9.202983856201172, "global_step": 76489, "epoch": 455} {"train_loss": -9.09653091430664, "global_step": 76490, "epoch": 455} {"train_loss": -9.314001083374023, "global_step": 76491, "epoch": 455} {"train_loss": -9.0193452835083, "global_step": 76492, "epoch": 455} {"train_loss": -9.196097373962402, "global_step": 76493, "epoch": 455} {"train_loss": -8.804784774780273, "global_step": 76494, "epoch": 455} {"train_loss": -8.957351684570312, "global_step": 76495, "epoch": 455} {"train_loss": -9.163361549377441, "global_step": 76496, "epoch": 455} {"train_loss": -9.001070976257324, "global_step": 76497, "epoch": 455} {"train_loss": -9.257960319519043, "global_step": 76498, "epoch": 455} {"train_loss": -9.129800796508789, "global_step": 76499, "epoch": 455} {"train_loss": -9.060372352600098, "global_step": 76500, "epoch": 455} {"train_loss": -9.14891242980957, "global_step": 76501, "epoch": 455} {"train_loss": -9.109017372131348, "global_step": 76502, "epoch": 455} {"train_loss": -9.246011734008789, "global_step": 76503, "epoch": 455} {"train_loss": -8.917110443115234, "global_step": 76504, "epoch": 455} {"train_loss": -9.075889587402344, "global_step": 76505, "epoch": 455} {"train_loss": -8.908121109008789, "global_step": 76506, "epoch": 455} {"train_loss": -9.317676544189453, "global_step": 76507, "epoch": 455} {"train_loss": -9.026407241821289, "global_step": 76508, "epoch": 455} {"train_loss": -9.270303726196289, "global_step": 76509, "epoch": 455} {"train_loss": -9.125039100646973, "global_step": 76510, "epoch": 455} {"train_loss": -8.92231559753418, "global_step": 76511, "epoch": 455} {"train_loss": -8.940534591674805, "global_step": 76512, "epoch": 455} {"train_loss": -9.178579330444336, "global_step": 76513, "epoch": 455} {"train_loss": -8.831939697265625, "global_step": 76514, "epoch": 455} {"train_loss": -9.091622352600098, "global_step": 76515, "epoch": 455} {"train_loss": -9.307147026062012, "global_step": 76516, "epoch": 455} {"train_loss": -9.15670108795166, "global_step": 76517, "epoch": 455} {"train_loss": -9.224042892456055, "global_step": 76518, "epoch": 455} {"train_loss": -9.080026626586914, "global_step": 76519, "epoch": 455} {"train_loss": -9.124974250793457, "global_step": 76520, "epoch": 455} {"train_loss": -9.092382431030273, "global_step": 76521, "epoch": 455} {"train_loss": -9.133916854858398, "global_step": 76522, "epoch": 455} {"train_loss": -9.248241424560547, "global_step": 76523, "epoch": 455} {"train_loss": -8.911447525024414, "global_step": 76524, "epoch": 455} {"train_loss": -9.019060134887695, "global_step": 76525, "epoch": 455} {"train_loss": -9.126849174499512, "global_step": 76526, "epoch": 455} {"train_loss": -9.221534729003906, "global_step": 76527, "epoch": 455} {"train_loss": -9.265398979187012, "global_step": 76528, "epoch": 455} {"train_loss": -9.176156044006348, "global_step": 76529, "epoch": 455} {"train_loss": -9.258464813232422, "global_step": 76530, "epoch": 455} {"train_loss": -9.188739776611328, "global_step": 76531, "epoch": 455} {"train_loss": -9.17249870300293, "global_step": 76532, "epoch": 455} {"train_loss": -8.80327033996582, "global_step": 76533, "epoch": 455} {"train_loss": -9.137657165527344, "global_step": 76534, "epoch": 455} {"train_loss": -8.869071960449219, "global_step": 76535, "epoch": 455} {"train_loss": -9.24854850769043, "global_step": 76536, "epoch": 455} {"train_loss": -8.958126068115234, "global_step": 76537, "epoch": 455} {"train_loss": -9.027837753295898, "global_step": 76538, "epoch": 455} {"train_loss": -8.97176742553711, "global_step": 76539, "epoch": 455} {"train_loss": -9.044820785522461, "global_step": 76540, "epoch": 455} {"train_loss": -8.89529037475586, "global_step": 76541, "epoch": 455} {"train_loss": -9.123161315917969, "global_step": 76542, "epoch": 455} {"train_loss": -8.849421501159668, "global_step": 76543, "epoch": 455} {"train_loss": -9.014634132385254, "global_step": 76544, "epoch": 455} {"train_loss": -8.896767616271973, "global_step": 76545, "epoch": 455} {"train_loss": -8.91699504852295, "global_step": 76546, "epoch": 455} {"train_loss": -8.85059642791748, "global_step": 76547, "epoch": 455} {"train_loss": -9.184873580932617, "global_step": 76548, "epoch": 455} {"train_loss": -8.89396858215332, "global_step": 76549, "epoch": 455} {"train_loss": -8.91402816772461, "global_step": 76550, "epoch": 455} {"train_loss": -8.936578750610352, "global_step": 76551, "epoch": 455} {"train_loss": -9.166568756103516, "global_step": 76552, "epoch": 455} {"train_loss": -9.032821655273438, "global_step": 76553, "epoch": 455} {"train_loss": -9.006656646728516, "global_step": 76554, "epoch": 455} {"train_loss": -9.138954162597656, "global_step": 76555, "epoch": 455} {"train_loss": -8.981061935424805, "global_step": 76556, "epoch": 455} {"train_loss": -8.789017677307129, "global_step": 76557, "epoch": 455} {"train_loss": -9.306714057922363, "global_step": 76558, "epoch": 455} {"train_loss": -8.924654006958008, "global_step": 76559, "epoch": 455} {"train_loss": -9.122377395629883, "global_step": 76560, "epoch": 455} {"train_loss": -9.182393074035645, "global_step": 76561, "epoch": 455} {"train_loss": -9.180000305175781, "global_step": 76562, "epoch": 455} {"train_loss": -9.176921844482422, "global_step": 76563, "epoch": 455} {"train_loss": -9.12601089477539, "global_step": 76564, "epoch": 455} {"train_loss": -9.155838012695312, "global_step": 76565, "epoch": 455} {"train_loss": -9.240157127380371, "global_step": 76566, "epoch": 455} {"train_loss": -9.477051734924316, "global_step": 76567, "epoch": 455} {"train_loss": -9.01487922668457, "global_step": 76568, "epoch": 455} {"train_loss": -9.075204849243164, "global_step": 76569, "epoch": 455} {"train_loss": -9.143702507019043, "global_step": 76570, "epoch": 455} {"train_loss": -8.790146827697754, "global_step": 76571, "epoch": 455} {"train_loss": -9.223278045654297, "global_step": 76572, "epoch": 455} {"train_loss": -9.084181785583496, "global_step": 76573, "epoch": 455} {"train_loss": -8.954647064208984, "global_step": 76574, "epoch": 455} {"train_loss": -9.156033515930176, "global_step": 76575, "epoch": 455} {"train_loss": -8.716655731201172, "global_step": 76576, "epoch": 455} {"train_loss": -9.205467224121094, "global_step": 76577, "epoch": 455} {"train_loss": -9.079399108886719, "global_step": 76578, "epoch": 455} {"train_loss": -8.997967720031738, "global_step": 76579, "epoch": 455} {"train_loss": -9.090624809265137, "global_step": 76580, "epoch": 455} {"train_loss": -9.126949310302734, "global_step": 76581, "epoch": 455} {"train_loss": -8.70611572265625, "global_step": 76582, "epoch": 455} {"train_loss": -9.234514236450195, "global_step": 76583, "epoch": 455} {"train_loss": -9.031721115112305, "global_step": 76584, "epoch": 455} {"train_loss": -9.13137149810791, "global_step": 76585, "epoch": 455} {"train_loss": -9.285799026489258, "global_step": 76586, "epoch": 455} {"train_loss": -9.061685562133789, "global_step": 76587, "epoch": 455} {"train_loss": -9.057364463806152, "global_step": 76588, "epoch": 455} {"train_loss": -9.140389442443848, "global_step": 76589, "epoch": 455} {"train_loss": -9.15693187713623, "global_step": 76590, "epoch": 455} {"train_loss": -8.823586463928223, "global_step": 76591, "epoch": 455} {"train_loss": -8.83156967163086, "global_step": 76592, "epoch": 455} {"train_loss": -9.215947151184082, "global_step": 76593, "epoch": 455} {"train_loss": -8.881669998168945, "global_step": 76594, "epoch": 455} {"train_loss": -8.845697402954102, "global_step": 76595, "epoch": 455} {"train_loss": -8.942024230957031, "global_step": 76596, "epoch": 455} {"train_loss": -9.102588653564453, "global_step": 76597, "epoch": 455} {"train_loss": -9.359856605529785, "global_step": 76598, "epoch": 455} {"train_loss": -9.24917221069336, "global_step": 76599, "epoch": 455} {"train_loss": -9.228779792785645, "global_step": 76600, "epoch": 455} {"train_loss": -9.10194206237793, "global_step": 76601, "epoch": 455} {"train_loss": -9.007320404052734, "global_step": 76602, "epoch": 455} {"train_loss": -9.123950004577637, "global_step": 76603, "epoch": 455} {"train_loss": -9.206944465637207, "global_step": 76604, "epoch": 455} {"train_loss": -9.049055099487305, "global_step": 76605, "epoch": 455} {"train_loss": -9.235085487365723, "global_step": 76606, "epoch": 455} {"train_loss": -9.079304837045216, "global_step": 76607, "epoch": 455, "val_loss": 196066.734375, "train_action_mse_error": 2.8138203620910645} {"train_loss": -8.733604431152344, "global_step": 76608, "epoch": 456} {"train_loss": -9.36445426940918, "global_step": 76609, "epoch": 456} {"train_loss": -9.119412422180176, "global_step": 76610, "epoch": 456} {"train_loss": -9.034370422363281, "global_step": 76611, "epoch": 456} {"train_loss": -9.110638618469238, "global_step": 76612, "epoch": 456} {"train_loss": -9.170906066894531, "global_step": 76613, "epoch": 456} {"train_loss": -9.047323226928711, "global_step": 76614, "epoch": 456} {"train_loss": -9.277809143066406, "global_step": 76615, "epoch": 456} {"train_loss": -9.122357368469238, "global_step": 76616, "epoch": 456} {"train_loss": -9.033051490783691, "global_step": 76617, "epoch": 456} {"train_loss": -8.94025993347168, "global_step": 76618, "epoch": 456} {"train_loss": -8.79996395111084, "global_step": 76619, "epoch": 456} {"train_loss": -9.169313430786133, "global_step": 76620, "epoch": 456} {"train_loss": -9.288864135742188, "global_step": 76621, "epoch": 456} {"train_loss": -9.270371437072754, "global_step": 76622, "epoch": 456} {"train_loss": -9.183246612548828, "global_step": 76623, "epoch": 456} {"train_loss": -8.926854133605957, "global_step": 76624, "epoch": 456} {"train_loss": -9.186655044555664, "global_step": 76625, "epoch": 456} {"train_loss": -9.079292297363281, "global_step": 76626, "epoch": 456} {"train_loss": -9.256528854370117, "global_step": 76627, "epoch": 456} {"train_loss": -9.022472381591797, "global_step": 76628, "epoch": 456} {"train_loss": -9.358365058898926, "global_step": 76629, "epoch": 456} {"train_loss": -9.22562026977539, "global_step": 76630, "epoch": 456} {"train_loss": -8.7991943359375, "global_step": 76631, "epoch": 456} {"train_loss": -9.156740188598633, "global_step": 76632, "epoch": 456} {"train_loss": -9.389703750610352, "global_step": 76633, "epoch": 456} {"train_loss": -9.5452880859375, "global_step": 76634, "epoch": 456} {"train_loss": -9.20172119140625, "global_step": 76635, "epoch": 456} {"train_loss": -9.160057067871094, "global_step": 76636, "epoch": 456} {"train_loss": -9.17065715789795, "global_step": 76637, "epoch": 456} {"train_loss": -9.251195907592773, "global_step": 76638, "epoch": 456} {"train_loss": -9.385967254638672, "global_step": 76639, "epoch": 456} {"train_loss": -9.233574867248535, "global_step": 76640, "epoch": 456} {"train_loss": -9.156980514526367, "global_step": 76641, "epoch": 456} {"train_loss": -9.169548034667969, "global_step": 76642, "epoch": 456} {"train_loss": -9.220476150512695, "global_step": 76643, "epoch": 456} {"train_loss": -8.896215438842773, "global_step": 76644, "epoch": 456} {"train_loss": -9.173357009887695, "global_step": 76645, "epoch": 456} {"train_loss": -9.255191802978516, "global_step": 76646, "epoch": 456} {"train_loss": -9.078161239624023, "global_step": 76647, "epoch": 456} {"train_loss": -9.265665054321289, "global_step": 76648, "epoch": 456} {"train_loss": -9.255642890930176, "global_step": 76649, "epoch": 456} {"train_loss": -9.3355131149292, "global_step": 76650, "epoch": 456} {"train_loss": -8.783039093017578, "global_step": 76651, "epoch": 456} {"train_loss": -9.294811248779297, "global_step": 76652, "epoch": 456} {"train_loss": -9.05200481414795, "global_step": 76653, "epoch": 456} {"train_loss": -9.118260383605957, "global_step": 76654, "epoch": 456} {"train_loss": -8.873244285583496, "global_step": 76655, "epoch": 456} {"train_loss": -9.266016006469727, "global_step": 76656, "epoch": 456} {"train_loss": -9.022699356079102, "global_step": 76657, "epoch": 456} {"train_loss": -8.922613143920898, "global_step": 76658, "epoch": 456} {"train_loss": -9.156063079833984, "global_step": 76659, "epoch": 456} {"train_loss": -8.563936233520508, "global_step": 76660, "epoch": 456} {"train_loss": -9.118871688842773, "global_step": 76661, "epoch": 456} {"train_loss": -8.900925636291504, "global_step": 76662, "epoch": 456} {"train_loss": -9.119885444641113, "global_step": 76663, "epoch": 456} {"train_loss": -9.081083297729492, "global_step": 76664, "epoch": 456} {"train_loss": -8.672412872314453, "global_step": 76665, "epoch": 456} {"train_loss": -9.046245574951172, "global_step": 76666, "epoch": 456} {"train_loss": -9.033431053161621, "global_step": 76667, "epoch": 456} {"train_loss": -8.955240249633789, "global_step": 76668, "epoch": 456} {"train_loss": -9.122597694396973, "global_step": 76669, "epoch": 456} {"train_loss": -9.231199264526367, "global_step": 76670, "epoch": 456} {"train_loss": -8.997368812561035, "global_step": 76671, "epoch": 456} {"train_loss": -9.174283027648926, "global_step": 76672, "epoch": 456} {"train_loss": -8.916563987731934, "global_step": 76673, "epoch": 456} {"train_loss": -9.088066101074219, "global_step": 76674, "epoch": 456} {"train_loss": -8.754185676574707, "global_step": 76675, "epoch": 456} {"train_loss": -9.349211692810059, "global_step": 76676, "epoch": 456} {"train_loss": -9.041458129882812, "global_step": 76677, "epoch": 456} {"train_loss": -8.912114143371582, "global_step": 76678, "epoch": 456} {"train_loss": -8.780868530273438, "global_step": 76679, "epoch": 456} {"train_loss": -9.08272933959961, "global_step": 76680, "epoch": 456} {"train_loss": -8.688560485839844, "global_step": 76681, "epoch": 456} {"train_loss": -9.293550491333008, "global_step": 76682, "epoch": 456} {"train_loss": -9.132457733154297, "global_step": 76683, "epoch": 456} {"train_loss": -8.709272384643555, "global_step": 76684, "epoch": 456} {"train_loss": -8.70449447631836, "global_step": 76685, "epoch": 456} {"train_loss": -8.926290512084961, "global_step": 76686, "epoch": 456} {"train_loss": -8.993156433105469, "global_step": 76687, "epoch": 456} {"train_loss": -8.754415512084961, "global_step": 76688, "epoch": 456} {"train_loss": -8.883386611938477, "global_step": 76689, "epoch": 456} {"train_loss": -8.995390892028809, "global_step": 76690, "epoch": 456} {"train_loss": -8.826973915100098, "global_step": 76691, "epoch": 456} {"train_loss": -9.191143035888672, "global_step": 76692, "epoch": 456} {"train_loss": -8.958128929138184, "global_step": 76693, "epoch": 456} {"train_loss": -9.066741943359375, "global_step": 76694, "epoch": 456} {"train_loss": -9.065528869628906, "global_step": 76695, "epoch": 456} {"train_loss": -9.182032585144043, "global_step": 76696, "epoch": 456} {"train_loss": -8.693639755249023, "global_step": 76697, "epoch": 456} {"train_loss": -8.95667552947998, "global_step": 76698, "epoch": 456} {"train_loss": -9.113182067871094, "global_step": 76699, "epoch": 456} {"train_loss": -9.076519012451172, "global_step": 76700, "epoch": 456} {"train_loss": -9.092876434326172, "global_step": 76701, "epoch": 456} {"train_loss": -9.024561882019043, "global_step": 76702, "epoch": 456} {"train_loss": -9.01761245727539, "global_step": 76703, "epoch": 456} {"train_loss": -8.989808082580566, "global_step": 76704, "epoch": 456} {"train_loss": -9.116765975952148, "global_step": 76705, "epoch": 456} {"train_loss": -9.239494323730469, "global_step": 76706, "epoch": 456} {"train_loss": -9.166550636291504, "global_step": 76707, "epoch": 456} {"train_loss": -9.087947845458984, "global_step": 76708, "epoch": 456} {"train_loss": -9.227157592773438, "global_step": 76709, "epoch": 456} {"train_loss": -9.21878433227539, "global_step": 76710, "epoch": 456} {"train_loss": -9.291709899902344, "global_step": 76711, "epoch": 456} {"train_loss": -9.417555809020996, "global_step": 76712, "epoch": 456} {"train_loss": -9.03963565826416, "global_step": 76713, "epoch": 456} {"train_loss": -9.332578659057617, "global_step": 76714, "epoch": 456} {"train_loss": -8.993701934814453, "global_step": 76715, "epoch": 456} {"train_loss": -9.12272834777832, "global_step": 76716, "epoch": 456} {"train_loss": -9.02604866027832, "global_step": 76717, "epoch": 456} {"train_loss": -8.960357666015625, "global_step": 76718, "epoch": 456} {"train_loss": -9.362933158874512, "global_step": 76719, "epoch": 456} {"train_loss": -8.918756484985352, "global_step": 76720, "epoch": 456} {"train_loss": -9.193660736083984, "global_step": 76721, "epoch": 456} {"train_loss": -9.233299255371094, "global_step": 76722, "epoch": 456} {"train_loss": -8.66653060913086, "global_step": 76723, "epoch": 456} {"train_loss": -8.786831855773926, "global_step": 76724, "epoch": 456} {"train_loss": -8.573320388793945, "global_step": 76725, "epoch": 456} {"train_loss": -8.93227481842041, "global_step": 76726, "epoch": 456} {"train_loss": -8.73228645324707, "global_step": 76727, "epoch": 456} {"train_loss": -9.17748737335205, "global_step": 76728, "epoch": 456} {"train_loss": -8.720369338989258, "global_step": 76729, "epoch": 456} {"train_loss": -8.84689998626709, "global_step": 76730, "epoch": 456} {"train_loss": -8.992635726928711, "global_step": 76731, "epoch": 456} {"train_loss": -8.997476577758789, "global_step": 76732, "epoch": 456} {"train_loss": -9.062994956970215, "global_step": 76733, "epoch": 456} {"train_loss": -9.22639274597168, "global_step": 76734, "epoch": 456} {"train_loss": -8.928072929382324, "global_step": 76735, "epoch": 456} {"train_loss": -8.965381622314453, "global_step": 76736, "epoch": 456} {"train_loss": -9.176977157592773, "global_step": 76737, "epoch": 456} {"train_loss": -9.094949722290039, "global_step": 76738, "epoch": 456} {"train_loss": -9.241887092590332, "global_step": 76739, "epoch": 456} {"train_loss": -9.237293243408203, "global_step": 76740, "epoch": 456} {"train_loss": -9.11648178100586, "global_step": 76741, "epoch": 456} {"train_loss": -9.195070266723633, "global_step": 76742, "epoch": 456} {"train_loss": -9.20210075378418, "global_step": 76743, "epoch": 456} {"train_loss": -9.159889221191406, "global_step": 76744, "epoch": 456} {"train_loss": -8.946399688720703, "global_step": 76745, "epoch": 456} {"train_loss": -9.217294692993164, "global_step": 76746, "epoch": 456} {"train_loss": -9.15401840209961, "global_step": 76747, "epoch": 456} {"train_loss": -9.247478485107422, "global_step": 76748, "epoch": 456} {"train_loss": -9.358363151550293, "global_step": 76749, "epoch": 456} {"train_loss": -9.530939102172852, "global_step": 76750, "epoch": 456} {"train_loss": -9.444666862487793, "global_step": 76751, "epoch": 456} {"train_loss": -9.287080764770508, "global_step": 76752, "epoch": 456} {"train_loss": -9.14002513885498, "global_step": 76753, "epoch": 456} {"train_loss": -9.184398651123047, "global_step": 76754, "epoch": 456} {"train_loss": -8.918815612792969, "global_step": 76755, "epoch": 456} {"train_loss": -9.378040313720703, "global_step": 76756, "epoch": 456} {"train_loss": -9.114355087280273, "global_step": 76757, "epoch": 456} {"train_loss": -9.108582496643066, "global_step": 76758, "epoch": 456} {"train_loss": -9.345467567443848, "global_step": 76759, "epoch": 456} {"train_loss": -9.365833282470703, "global_step": 76760, "epoch": 456} {"train_loss": -9.254645347595215, "global_step": 76761, "epoch": 456} {"train_loss": -8.983781814575195, "global_step": 76762, "epoch": 456} {"train_loss": -9.170472145080566, "global_step": 76763, "epoch": 456} {"train_loss": -9.291858673095703, "global_step": 76764, "epoch": 456} {"train_loss": -9.205721855163574, "global_step": 76765, "epoch": 456} {"train_loss": -8.729368209838867, "global_step": 76766, "epoch": 456} {"train_loss": -9.348912239074707, "global_step": 76767, "epoch": 456} {"train_loss": -8.954500198364258, "global_step": 76768, "epoch": 456} {"train_loss": -9.094877243041992, "global_step": 76769, "epoch": 456} {"train_loss": -8.84532356262207, "global_step": 76770, "epoch": 456} {"train_loss": -9.120109558105469, "global_step": 76771, "epoch": 456} {"train_loss": -8.778547286987305, "global_step": 76772, "epoch": 456} {"train_loss": -8.899545669555664, "global_step": 76773, "epoch": 456} {"train_loss": -9.009764671325684, "global_step": 76774, "epoch": 456} {"train_loss": -9.08349791594914, "global_step": 76775, "epoch": 456, "val_loss": 196238.15625} {"train_loss": -8.932500839233398, "global_step": 76776, "epoch": 457} {"train_loss": -8.689685821533203, "global_step": 76777, "epoch": 457} {"train_loss": -9.090092658996582, "global_step": 76778, "epoch": 457} {"train_loss": -8.78253173828125, "global_step": 76779, "epoch": 457} {"train_loss": -9.28759479522705, "global_step": 76780, "epoch": 457} {"train_loss": -8.494751930236816, "global_step": 76781, "epoch": 457} {"train_loss": -8.891197204589844, "global_step": 76782, "epoch": 457} {"train_loss": -8.73811149597168, "global_step": 76783, "epoch": 457} {"train_loss": -8.764793395996094, "global_step": 76784, "epoch": 457} {"train_loss": -8.867610931396484, "global_step": 76785, "epoch": 457} {"train_loss": -8.711310386657715, "global_step": 76786, "epoch": 457} {"train_loss": -9.011661529541016, "global_step": 76787, "epoch": 457} {"train_loss": -8.907710075378418, "global_step": 76788, "epoch": 457} {"train_loss": -9.062936782836914, "global_step": 76789, "epoch": 457} {"train_loss": -8.76845932006836, "global_step": 76790, "epoch": 457} {"train_loss": -8.962072372436523, "global_step": 76791, "epoch": 457} {"train_loss": -9.15340805053711, "global_step": 76792, "epoch": 457} {"train_loss": -8.995857238769531, "global_step": 76793, "epoch": 457} {"train_loss": -9.329385757446289, "global_step": 76794, "epoch": 457} {"train_loss": -9.124835968017578, "global_step": 76795, "epoch": 457} {"train_loss": -8.882096290588379, "global_step": 76796, "epoch": 457} {"train_loss": -9.052699089050293, "global_step": 76797, "epoch": 457} {"train_loss": -9.22736930847168, "global_step": 76798, "epoch": 457} {"train_loss": -9.209230422973633, "global_step": 76799, "epoch": 457} {"train_loss": -9.074593544006348, "global_step": 76800, "epoch": 457} {"train_loss": -9.277925491333008, "global_step": 76801, "epoch": 457} {"train_loss": -9.310527801513672, "global_step": 76802, "epoch": 457} {"train_loss": -9.179594993591309, "global_step": 76803, "epoch": 457} {"train_loss": -9.064399719238281, "global_step": 76804, "epoch": 457} {"train_loss": -9.403383255004883, "global_step": 76805, "epoch": 457} {"train_loss": -9.353525161743164, "global_step": 76806, "epoch": 457} {"train_loss": -9.279632568359375, "global_step": 76807, "epoch": 457} {"train_loss": -9.355020523071289, "global_step": 76808, "epoch": 457} {"train_loss": -9.281176567077637, "global_step": 76809, "epoch": 457} {"train_loss": -9.136080741882324, "global_step": 76810, "epoch": 457} {"train_loss": -9.154363632202148, "global_step": 76811, "epoch": 457} {"train_loss": -9.257614135742188, "global_step": 76812, "epoch": 457} {"train_loss": -9.269214630126953, "global_step": 76813, "epoch": 457} {"train_loss": -9.260697364807129, "global_step": 76814, "epoch": 457} {"train_loss": -9.495977401733398, "global_step": 76815, "epoch": 457} {"train_loss": -9.398767471313477, "global_step": 76816, "epoch": 457} {"train_loss": -9.378022193908691, "global_step": 76817, "epoch": 457} {"train_loss": -9.385488510131836, "global_step": 76818, "epoch": 457} {"train_loss": -9.155277252197266, "global_step": 76819, "epoch": 457} {"train_loss": -9.335554122924805, "global_step": 76820, "epoch": 457} {"train_loss": -9.330907821655273, "global_step": 76821, "epoch": 457} {"train_loss": -9.257797241210938, "global_step": 76822, "epoch": 457} {"train_loss": -9.27799129486084, "global_step": 76823, "epoch": 457} {"train_loss": -9.282920837402344, "global_step": 76824, "epoch": 457} {"train_loss": -9.446477890014648, "global_step": 76825, "epoch": 457} {"train_loss": -9.040517807006836, "global_step": 76826, "epoch": 457} {"train_loss": -9.419435501098633, "global_step": 76827, "epoch": 457} {"train_loss": -9.194276809692383, "global_step": 76828, "epoch": 457} {"train_loss": -9.24721908569336, "global_step": 76829, "epoch": 457} {"train_loss": -9.403818130493164, "global_step": 76830, "epoch": 457} {"train_loss": -9.162139892578125, "global_step": 76831, "epoch": 457} {"train_loss": -9.051942825317383, "global_step": 76832, "epoch": 457} {"train_loss": -9.07343864440918, "global_step": 76833, "epoch": 457} {"train_loss": -9.281728744506836, "global_step": 76834, "epoch": 457} {"train_loss": -9.178930282592773, "global_step": 76835, "epoch": 457} {"train_loss": -8.626649856567383, "global_step": 76836, "epoch": 457} {"train_loss": -9.462746620178223, "global_step": 76837, "epoch": 457} {"train_loss": -8.720637321472168, "global_step": 76838, "epoch": 457} {"train_loss": -9.049327850341797, "global_step": 76839, "epoch": 457} {"train_loss": -8.916748046875, "global_step": 76840, "epoch": 457} {"train_loss": -8.85841178894043, "global_step": 76841, "epoch": 457} {"train_loss": -8.966779708862305, "global_step": 76842, "epoch": 457} {"train_loss": -9.005208015441895, "global_step": 76843, "epoch": 457} {"train_loss": -9.00239372253418, "global_step": 76844, "epoch": 457} {"train_loss": -9.119643211364746, "global_step": 76845, "epoch": 457} {"train_loss": -8.941150665283203, "global_step": 76846, "epoch": 457} {"train_loss": -9.036078453063965, "global_step": 76847, "epoch": 457} {"train_loss": -9.1848783493042, "global_step": 76848, "epoch": 457} {"train_loss": -9.14278507232666, "global_step": 76849, "epoch": 457} {"train_loss": -9.085617065429688, "global_step": 76850, "epoch": 457} {"train_loss": -9.092394828796387, "global_step": 76851, "epoch": 457} {"train_loss": -9.134931564331055, "global_step": 76852, "epoch": 457} {"train_loss": -9.353519439697266, "global_step": 76853, "epoch": 457} {"train_loss": -9.000825881958008, "global_step": 76854, "epoch": 457} {"train_loss": -9.14850902557373, "global_step": 76855, "epoch": 457} {"train_loss": -9.196006774902344, "global_step": 76856, "epoch": 457} {"train_loss": -9.188116073608398, "global_step": 76857, "epoch": 457} {"train_loss": -9.167379379272461, "global_step": 76858, "epoch": 457} {"train_loss": -9.469355583190918, "global_step": 76859, "epoch": 457} {"train_loss": -9.13031005859375, "global_step": 76860, "epoch": 457} {"train_loss": -8.952556610107422, "global_step": 76861, "epoch": 457} {"train_loss": -9.2701416015625, "global_step": 76862, "epoch": 457} {"train_loss": -9.182117462158203, "global_step": 76863, "epoch": 457} {"train_loss": -9.105364799499512, "global_step": 76864, "epoch": 457} {"train_loss": -9.16517448425293, "global_step": 76865, "epoch": 457} {"train_loss": -9.344810485839844, "global_step": 76866, "epoch": 457} {"train_loss": -8.822324752807617, "global_step": 76867, "epoch": 457} {"train_loss": -9.014371871948242, "global_step": 76868, "epoch": 457} {"train_loss": -9.081567764282227, "global_step": 76869, "epoch": 457} {"train_loss": -9.23448371887207, "global_step": 76870, "epoch": 457} {"train_loss": -9.39321231842041, "global_step": 76871, "epoch": 457} {"train_loss": -9.389017105102539, "global_step": 76872, "epoch": 457} {"train_loss": -9.13387680053711, "global_step": 76873, "epoch": 457} {"train_loss": -9.2115478515625, "global_step": 76874, "epoch": 457} {"train_loss": -9.17330551147461, "global_step": 76875, "epoch": 457} {"train_loss": -8.891519546508789, "global_step": 76876, "epoch": 457} {"train_loss": -8.97055435180664, "global_step": 76877, "epoch": 457} {"train_loss": -9.05341911315918, "global_step": 76878, "epoch": 457} {"train_loss": -8.924697875976562, "global_step": 76879, "epoch": 457} {"train_loss": -9.16377067565918, "global_step": 76880, "epoch": 457} {"train_loss": -8.623971939086914, "global_step": 76881, "epoch": 457} {"train_loss": -8.981395721435547, "global_step": 76882, "epoch": 457} {"train_loss": -8.974035263061523, "global_step": 76883, "epoch": 457} {"train_loss": -8.563455581665039, "global_step": 76884, "epoch": 457} {"train_loss": -8.731963157653809, "global_step": 76885, "epoch": 457} {"train_loss": -9.028499603271484, "global_step": 76886, "epoch": 457} {"train_loss": -9.02219295501709, "global_step": 76887, "epoch": 457} {"train_loss": -8.416436195373535, "global_step": 76888, "epoch": 457} {"train_loss": -8.927984237670898, "global_step": 76889, "epoch": 457} {"train_loss": -8.52792739868164, "global_step": 76890, "epoch": 457} {"train_loss": -8.642692565917969, "global_step": 76891, "epoch": 457} {"train_loss": -8.645301818847656, "global_step": 76892, "epoch": 457} {"train_loss": -9.043790817260742, "global_step": 76893, "epoch": 457} {"train_loss": -8.744464874267578, "global_step": 76894, "epoch": 457} {"train_loss": -8.821882247924805, "global_step": 76895, "epoch": 457} {"train_loss": -8.979087829589844, "global_step": 76896, "epoch": 457} {"train_loss": -8.8358154296875, "global_step": 76897, "epoch": 457} {"train_loss": -9.177931785583496, "global_step": 76898, "epoch": 457} {"train_loss": -8.666095733642578, "global_step": 76899, "epoch": 457} {"train_loss": -8.86090087890625, "global_step": 76900, "epoch": 457} {"train_loss": -8.967889785766602, "global_step": 76901, "epoch": 457} {"train_loss": -8.928139686584473, "global_step": 76902, "epoch": 457} {"train_loss": -9.177465438842773, "global_step": 76903, "epoch": 457} {"train_loss": -8.868167877197266, "global_step": 76904, "epoch": 457} {"train_loss": -9.260622024536133, "global_step": 76905, "epoch": 457} {"train_loss": -9.13652229309082, "global_step": 76906, "epoch": 457} {"train_loss": -9.123538970947266, "global_step": 76907, "epoch": 457} {"train_loss": -9.078054428100586, "global_step": 76908, "epoch": 457} {"train_loss": -9.204873085021973, "global_step": 76909, "epoch": 457} {"train_loss": -9.269930839538574, "global_step": 76910, "epoch": 457} {"train_loss": -9.08838176727295, "global_step": 76911, "epoch": 457} {"train_loss": -9.319284439086914, "global_step": 76912, "epoch": 457} {"train_loss": -9.231405258178711, "global_step": 76913, "epoch": 457} {"train_loss": -9.127118110656738, "global_step": 76914, "epoch": 457} {"train_loss": -9.113958358764648, "global_step": 76915, "epoch": 457} {"train_loss": -9.112649917602539, "global_step": 76916, "epoch": 457} {"train_loss": -9.186532974243164, "global_step": 76917, "epoch": 457} {"train_loss": -9.335735321044922, "global_step": 76918, "epoch": 457} {"train_loss": -9.417694091796875, "global_step": 76919, "epoch": 457} {"train_loss": -9.153609275817871, "global_step": 76920, "epoch": 457} {"train_loss": -9.07158088684082, "global_step": 76921, "epoch": 457} {"train_loss": -9.152249336242676, "global_step": 76922, "epoch": 457} {"train_loss": -9.084654808044434, "global_step": 76923, "epoch": 457} {"train_loss": -9.256831169128418, "global_step": 76924, "epoch": 457} {"train_loss": -9.099651336669922, "global_step": 76925, "epoch": 457} {"train_loss": -9.215370178222656, "global_step": 76926, "epoch": 457} {"train_loss": -9.3499174118042, "global_step": 76927, "epoch": 457} {"train_loss": -9.124509811401367, "global_step": 76928, "epoch": 457} {"train_loss": -9.345529556274414, "global_step": 76929, "epoch": 457} {"train_loss": -8.894594192504883, "global_step": 76930, "epoch": 457} {"train_loss": -9.212127685546875, "global_step": 76931, "epoch": 457} {"train_loss": -9.282711029052734, "global_step": 76932, "epoch": 457} {"train_loss": -9.099868774414062, "global_step": 76933, "epoch": 457} {"train_loss": -9.331363677978516, "global_step": 76934, "epoch": 457} {"train_loss": -9.01201057434082, "global_step": 76935, "epoch": 457} {"train_loss": -9.133390426635742, "global_step": 76936, "epoch": 457} {"train_loss": -9.085923194885254, "global_step": 76937, "epoch": 457} {"train_loss": -8.789944648742676, "global_step": 76938, "epoch": 457} {"train_loss": -9.152182579040527, "global_step": 76939, "epoch": 457} {"train_loss": -8.632003784179688, "global_step": 76940, "epoch": 457} {"train_loss": -8.652843475341797, "global_step": 76941, "epoch": 457} {"train_loss": -8.576422691345215, "global_step": 76942, "epoch": 457} {"train_loss": -9.081809191476731, "global_step": 76943, "epoch": 457, "val_loss": 199103.3125} {"train_loss": -8.515820503234863, "global_step": 76944, "epoch": 458} {"train_loss": -8.576897621154785, "global_step": 76945, "epoch": 458} {"train_loss": -8.290119171142578, "global_step": 76946, "epoch": 458} {"train_loss": -8.77571964263916, "global_step": 76947, "epoch": 458} {"train_loss": -8.3982572555542, "global_step": 76948, "epoch": 458} {"train_loss": -8.660909652709961, "global_step": 76949, "epoch": 458} {"train_loss": -9.029518127441406, "global_step": 76950, "epoch": 458} {"train_loss": -8.567742347717285, "global_step": 76951, "epoch": 458} {"train_loss": -8.941543579101562, "global_step": 76952, "epoch": 458} {"train_loss": -9.02366828918457, "global_step": 76953, "epoch": 458} {"train_loss": -8.775842666625977, "global_step": 76954, "epoch": 458} {"train_loss": -8.937895774841309, "global_step": 76955, "epoch": 458} {"train_loss": -8.964385986328125, "global_step": 76956, "epoch": 458} {"train_loss": -8.793659210205078, "global_step": 76957, "epoch": 458} {"train_loss": -8.947772979736328, "global_step": 76958, "epoch": 458} {"train_loss": -8.949372291564941, "global_step": 76959, "epoch": 458} {"train_loss": -9.04869556427002, "global_step": 76960, "epoch": 458} {"train_loss": -8.965789794921875, "global_step": 76961, "epoch": 458} {"train_loss": -8.948833465576172, "global_step": 76962, "epoch": 458} {"train_loss": -8.992855072021484, "global_step": 76963, "epoch": 458} {"train_loss": -8.751163482666016, "global_step": 76964, "epoch": 458} {"train_loss": -9.062067031860352, "global_step": 76965, "epoch": 458} {"train_loss": -9.177749633789062, "global_step": 76966, "epoch": 458} {"train_loss": -8.825435638427734, "global_step": 76967, "epoch": 458} {"train_loss": -9.004472732543945, "global_step": 76968, "epoch": 458} {"train_loss": -9.20084285736084, "global_step": 76969, "epoch": 458} {"train_loss": -9.062888145446777, "global_step": 76970, "epoch": 458} {"train_loss": -9.151304244995117, "global_step": 76971, "epoch": 458} {"train_loss": -9.18600845336914, "global_step": 76972, "epoch": 458} {"train_loss": -9.034939765930176, "global_step": 76973, "epoch": 458} {"train_loss": -9.05902099609375, "global_step": 76974, "epoch": 458} {"train_loss": -9.338850021362305, "global_step": 76975, "epoch": 458} {"train_loss": -9.09385871887207, "global_step": 76976, "epoch": 458} {"train_loss": -9.235280990600586, "global_step": 76977, "epoch": 458} {"train_loss": -9.216435432434082, "global_step": 76978, "epoch": 458} {"train_loss": -9.123305320739746, "global_step": 76979, "epoch": 458} {"train_loss": -9.10555648803711, "global_step": 76980, "epoch": 458} {"train_loss": -9.452888488769531, "global_step": 76981, "epoch": 458} {"train_loss": -9.162616729736328, "global_step": 76982, "epoch": 458} {"train_loss": -9.14987564086914, "global_step": 76983, "epoch": 458} {"train_loss": -9.046340942382812, "global_step": 76984, "epoch": 458} {"train_loss": -8.96592903137207, "global_step": 76985, "epoch": 458} {"train_loss": -9.135955810546875, "global_step": 76986, "epoch": 458} {"train_loss": -9.190498352050781, "global_step": 76987, "epoch": 458} {"train_loss": -8.978642463684082, "global_step": 76988, "epoch": 458} {"train_loss": -9.281227111816406, "global_step": 76989, "epoch": 458} {"train_loss": -9.08796501159668, "global_step": 76990, "epoch": 458} {"train_loss": -9.437240600585938, "global_step": 76991, "epoch": 458} {"train_loss": -9.140636444091797, "global_step": 76992, "epoch": 458} {"train_loss": -9.122383117675781, "global_step": 76993, "epoch": 458} {"train_loss": -9.382518768310547, "global_step": 76994, "epoch": 458} {"train_loss": -9.12001895904541, "global_step": 76995, "epoch": 458} {"train_loss": -9.307806015014648, "global_step": 76996, "epoch": 458} {"train_loss": -9.013396263122559, "global_step": 76997, "epoch": 458} {"train_loss": -8.923755645751953, "global_step": 76998, "epoch": 458} {"train_loss": -9.027373313903809, "global_step": 76999, "epoch": 458} {"train_loss": -9.029423713684082, "global_step": 77000, "epoch": 458} {"train_loss": -8.621549606323242, "global_step": 77001, "epoch": 458} {"train_loss": -8.922971725463867, "global_step": 77002, "epoch": 458} {"train_loss": -8.481359481811523, "global_step": 77003, "epoch": 458} {"train_loss": -9.358037948608398, "global_step": 77004, "epoch": 458} {"train_loss": -8.794731140136719, "global_step": 77005, "epoch": 458} {"train_loss": -9.012472152709961, "global_step": 77006, "epoch": 458} {"train_loss": -8.744327545166016, "global_step": 77007, "epoch": 458} {"train_loss": -9.199319839477539, "global_step": 77008, "epoch": 458} {"train_loss": -8.964263916015625, "global_step": 77009, "epoch": 458} {"train_loss": -8.701475143432617, "global_step": 77010, "epoch": 458} {"train_loss": -8.815601348876953, "global_step": 77011, "epoch": 458} {"train_loss": -8.654611587524414, "global_step": 77012, "epoch": 458} {"train_loss": -9.12161636352539, "global_step": 77013, "epoch": 458} {"train_loss": -8.72512149810791, "global_step": 77014, "epoch": 458} {"train_loss": -9.077112197875977, "global_step": 77015, "epoch": 458} {"train_loss": -8.955586433410645, "global_step": 77016, "epoch": 458} {"train_loss": -9.073995590209961, "global_step": 77017, "epoch": 458} {"train_loss": -9.206575393676758, "global_step": 77018, "epoch": 458} {"train_loss": -9.010099411010742, "global_step": 77019, "epoch": 458} {"train_loss": -9.188751220703125, "global_step": 77020, "epoch": 458} {"train_loss": -9.251431465148926, "global_step": 77021, "epoch": 458} {"train_loss": -9.193374633789062, "global_step": 77022, "epoch": 458} {"train_loss": -9.04103946685791, "global_step": 77023, "epoch": 458} {"train_loss": -9.321832656860352, "global_step": 77024, "epoch": 458} {"train_loss": -9.291419982910156, "global_step": 77025, "epoch": 458} {"train_loss": -9.17894172668457, "global_step": 77026, "epoch": 458} {"train_loss": -9.069601058959961, "global_step": 77027, "epoch": 458} {"train_loss": -9.194290161132812, "global_step": 77028, "epoch": 458} {"train_loss": -9.095151901245117, "global_step": 77029, "epoch": 458} {"train_loss": -9.123798370361328, "global_step": 77030, "epoch": 458} {"train_loss": -8.808677673339844, "global_step": 77031, "epoch": 458} {"train_loss": -9.295318603515625, "global_step": 77032, "epoch": 458} {"train_loss": -9.05526351928711, "global_step": 77033, "epoch": 458} {"train_loss": -9.318437576293945, "global_step": 77034, "epoch": 458} {"train_loss": -8.84366226196289, "global_step": 77035, "epoch": 458} {"train_loss": -8.999086380004883, "global_step": 77036, "epoch": 458} {"train_loss": -9.194293975830078, "global_step": 77037, "epoch": 458} {"train_loss": -9.103208541870117, "global_step": 77038, "epoch": 458} {"train_loss": -8.828789710998535, "global_step": 77039, "epoch": 458} {"train_loss": -9.272359848022461, "global_step": 77040, "epoch": 458} {"train_loss": -9.035989761352539, "global_step": 77041, "epoch": 458} {"train_loss": -8.949430465698242, "global_step": 77042, "epoch": 458} {"train_loss": -9.021005630493164, "global_step": 77043, "epoch": 458} {"train_loss": -8.833932876586914, "global_step": 77044, "epoch": 458} {"train_loss": -9.071327209472656, "global_step": 77045, "epoch": 458} {"train_loss": -8.815948486328125, "global_step": 77046, "epoch": 458} {"train_loss": -9.190479278564453, "global_step": 77047, "epoch": 458} {"train_loss": -9.31692886352539, "global_step": 77048, "epoch": 458} {"train_loss": -8.728870391845703, "global_step": 77049, "epoch": 458} {"train_loss": -9.074254989624023, "global_step": 77050, "epoch": 458} {"train_loss": -9.163046836853027, "global_step": 77051, "epoch": 458} {"train_loss": -9.2205171585083, "global_step": 77052, "epoch": 458} {"train_loss": -9.191444396972656, "global_step": 77053, "epoch": 458} {"train_loss": -9.154921531677246, "global_step": 77054, "epoch": 458} {"train_loss": -9.364311218261719, "global_step": 77055, "epoch": 458} {"train_loss": -9.297822952270508, "global_step": 77056, "epoch": 458} {"train_loss": -9.248113632202148, "global_step": 77057, "epoch": 458} {"train_loss": -9.045780181884766, "global_step": 77058, "epoch": 458} {"train_loss": -9.241972923278809, "global_step": 77059, "epoch": 458} {"train_loss": -9.204073905944824, "global_step": 77060, "epoch": 458} {"train_loss": -8.966608047485352, "global_step": 77061, "epoch": 458} {"train_loss": -9.232778549194336, "global_step": 77062, "epoch": 458} {"train_loss": -9.095157623291016, "global_step": 77063, "epoch": 458} {"train_loss": -9.001474380493164, "global_step": 77064, "epoch": 458} {"train_loss": -9.408018112182617, "global_step": 77065, "epoch": 458} {"train_loss": -8.953359603881836, "global_step": 77066, "epoch": 458} {"train_loss": -8.99631118774414, "global_step": 77067, "epoch": 458} {"train_loss": -8.79002571105957, "global_step": 77068, "epoch": 458} {"train_loss": -9.009721755981445, "global_step": 77069, "epoch": 458} {"train_loss": -9.106491088867188, "global_step": 77070, "epoch": 458} {"train_loss": -8.981959342956543, "global_step": 77071, "epoch": 458} {"train_loss": -9.10466480255127, "global_step": 77072, "epoch": 458} {"train_loss": -8.894951820373535, "global_step": 77073, "epoch": 458} {"train_loss": -8.778083801269531, "global_step": 77074, "epoch": 458} {"train_loss": -9.106215476989746, "global_step": 77075, "epoch": 458} {"train_loss": -8.965383529663086, "global_step": 77076, "epoch": 458} {"train_loss": -9.073848724365234, "global_step": 77077, "epoch": 458} {"train_loss": -9.261794090270996, "global_step": 77078, "epoch": 458} {"train_loss": -9.099212646484375, "global_step": 77079, "epoch": 458} {"train_loss": -9.11735725402832, "global_step": 77080, "epoch": 458} {"train_loss": -9.256486892700195, "global_step": 77081, "epoch": 458} {"train_loss": -9.245536804199219, "global_step": 77082, "epoch": 458} {"train_loss": -9.199753761291504, "global_step": 77083, "epoch": 458} {"train_loss": -8.632562637329102, "global_step": 77084, "epoch": 458} {"train_loss": -8.943977355957031, "global_step": 77085, "epoch": 458} {"train_loss": -8.938467979431152, "global_step": 77086, "epoch": 458} {"train_loss": -8.986328125, "global_step": 77087, "epoch": 458} {"train_loss": -9.241476058959961, "global_step": 77088, "epoch": 458} {"train_loss": -9.005449295043945, "global_step": 77089, "epoch": 458} {"train_loss": -9.006948471069336, "global_step": 77090, "epoch": 458} {"train_loss": -9.21479606628418, "global_step": 77091, "epoch": 458} {"train_loss": -9.022968292236328, "global_step": 77092, "epoch": 458} {"train_loss": -8.937066078186035, "global_step": 77093, "epoch": 458} {"train_loss": -9.14340591430664, "global_step": 77094, "epoch": 458} {"train_loss": -9.184452056884766, "global_step": 77095, "epoch": 458} {"train_loss": -8.869036674499512, "global_step": 77096, "epoch": 458} {"train_loss": -9.165182113647461, "global_step": 77097, "epoch": 458} {"train_loss": -8.920222282409668, "global_step": 77098, "epoch": 458} {"train_loss": -9.02901554107666, "global_step": 77099, "epoch": 458} {"train_loss": -9.203755378723145, "global_step": 77100, "epoch": 458} {"train_loss": -8.900763511657715, "global_step": 77101, "epoch": 458} {"train_loss": -9.463987350463867, "global_step": 77102, "epoch": 458} {"train_loss": -9.111041069030762, "global_step": 77103, "epoch": 458} {"train_loss": -9.220340728759766, "global_step": 77104, "epoch": 458} {"train_loss": -8.866401672363281, "global_step": 77105, "epoch": 458} {"train_loss": -9.038751602172852, "global_step": 77106, "epoch": 458} {"train_loss": -9.276179313659668, "global_step": 77107, "epoch": 458} {"train_loss": -8.972640037536621, "global_step": 77108, "epoch": 458} {"train_loss": -9.05044174194336, "global_step": 77109, "epoch": 458} {"train_loss": -9.088628768920898, "global_step": 77110, "epoch": 458} {"train_loss": -9.042864311309089, "global_step": 77111, "epoch": 458, "val_loss": 193771.375} {"train_loss": -9.137845993041992, "global_step": 77112, "epoch": 459} {"train_loss": -9.144121170043945, "global_step": 77113, "epoch": 459} {"train_loss": -9.02759838104248, "global_step": 77114, "epoch": 459} {"train_loss": -9.130248069763184, "global_step": 77115, "epoch": 459} {"train_loss": -8.98576545715332, "global_step": 77116, "epoch": 459} {"train_loss": -8.94216251373291, "global_step": 77117, "epoch": 459} {"train_loss": -9.141491889953613, "global_step": 77118, "epoch": 459} {"train_loss": -9.123759269714355, "global_step": 77119, "epoch": 459} {"train_loss": -9.138422966003418, "global_step": 77120, "epoch": 459} {"train_loss": -9.121454238891602, "global_step": 77121, "epoch": 459} {"train_loss": -9.105025291442871, "global_step": 77122, "epoch": 459} {"train_loss": -9.327682495117188, "global_step": 77123, "epoch": 459} {"train_loss": -9.241106033325195, "global_step": 77124, "epoch": 459} {"train_loss": -8.749305725097656, "global_step": 77125, "epoch": 459} {"train_loss": -9.371246337890625, "global_step": 77126, "epoch": 459} {"train_loss": -9.432489395141602, "global_step": 77127, "epoch": 459} {"train_loss": -8.991155624389648, "global_step": 77128, "epoch": 459} {"train_loss": -9.196887969970703, "global_step": 77129, "epoch": 459} {"train_loss": -9.151853561401367, "global_step": 77130, "epoch": 459} {"train_loss": -9.300464630126953, "global_step": 77131, "epoch": 459} {"train_loss": -8.962736129760742, "global_step": 77132, "epoch": 459} {"train_loss": -9.255043029785156, "global_step": 77133, "epoch": 459} {"train_loss": -9.059338569641113, "global_step": 77134, "epoch": 459} {"train_loss": -9.036905288696289, "global_step": 77135, "epoch": 459} {"train_loss": -8.535383224487305, "global_step": 77136, "epoch": 459} {"train_loss": -9.148109436035156, "global_step": 77137, "epoch": 459} {"train_loss": -9.033451080322266, "global_step": 77138, "epoch": 459} {"train_loss": -8.611332893371582, "global_step": 77139, "epoch": 459} {"train_loss": -9.073491096496582, "global_step": 77140, "epoch": 459} {"train_loss": -8.734010696411133, "global_step": 77141, "epoch": 459} {"train_loss": -9.0169095993042, "global_step": 77142, "epoch": 459} {"train_loss": -8.532318115234375, "global_step": 77143, "epoch": 459} {"train_loss": -9.021258354187012, "global_step": 77144, "epoch": 459} {"train_loss": -8.78396224975586, "global_step": 77145, "epoch": 459} {"train_loss": -8.706737518310547, "global_step": 77146, "epoch": 459} {"train_loss": -8.872692108154297, "global_step": 77147, "epoch": 459} {"train_loss": -8.523237228393555, "global_step": 77148, "epoch": 459} {"train_loss": -8.71174430847168, "global_step": 77149, "epoch": 459} {"train_loss": -9.104682922363281, "global_step": 77150, "epoch": 459} {"train_loss": -8.747757911682129, "global_step": 77151, "epoch": 459} {"train_loss": -9.15665340423584, "global_step": 77152, "epoch": 459} {"train_loss": -8.88109302520752, "global_step": 77153, "epoch": 459} {"train_loss": -8.77723503112793, "global_step": 77154, "epoch": 459} {"train_loss": -8.709644317626953, "global_step": 77155, "epoch": 459} {"train_loss": -8.697063446044922, "global_step": 77156, "epoch": 459} {"train_loss": -8.643349647521973, "global_step": 77157, "epoch": 459} {"train_loss": -8.840685844421387, "global_step": 77158, "epoch": 459} {"train_loss": -8.831247329711914, "global_step": 77159, "epoch": 459} {"train_loss": -8.915167808532715, "global_step": 77160, "epoch": 459} {"train_loss": -8.760802268981934, "global_step": 77161, "epoch": 459} {"train_loss": -8.740215301513672, "global_step": 77162, "epoch": 459} {"train_loss": -9.011877059936523, "global_step": 77163, "epoch": 459} {"train_loss": -9.073216438293457, "global_step": 77164, "epoch": 459} {"train_loss": -9.09894847869873, "global_step": 77165, "epoch": 459} {"train_loss": -8.946167945861816, "global_step": 77166, "epoch": 459} {"train_loss": -9.188127517700195, "global_step": 77167, "epoch": 459} {"train_loss": -9.09321403503418, "global_step": 77168, "epoch": 459} {"train_loss": -9.042729377746582, "global_step": 77169, "epoch": 459} {"train_loss": -8.928146362304688, "global_step": 77170, "epoch": 459} {"train_loss": -8.994643211364746, "global_step": 77171, "epoch": 459} {"train_loss": -9.019735336303711, "global_step": 77172, "epoch": 459} {"train_loss": -9.16971206665039, "global_step": 77173, "epoch": 459} {"train_loss": -9.328173637390137, "global_step": 77174, "epoch": 459} {"train_loss": -9.269207000732422, "global_step": 77175, "epoch": 459} {"train_loss": -9.25791072845459, "global_step": 77176, "epoch": 459} {"train_loss": -9.206417083740234, "global_step": 77177, "epoch": 459} {"train_loss": -9.003164291381836, "global_step": 77178, "epoch": 459} {"train_loss": -9.244446754455566, "global_step": 77179, "epoch": 459} {"train_loss": -9.377960205078125, "global_step": 77180, "epoch": 459} {"train_loss": -9.155008316040039, "global_step": 77181, "epoch": 459} {"train_loss": -9.216081619262695, "global_step": 77182, "epoch": 459} {"train_loss": -8.944893836975098, "global_step": 77183, "epoch": 459} {"train_loss": -9.15152359008789, "global_step": 77184, "epoch": 459} {"train_loss": -9.187603950500488, "global_step": 77185, "epoch": 459} {"train_loss": -9.068767547607422, "global_step": 77186, "epoch": 459} {"train_loss": -9.316803932189941, "global_step": 77187, "epoch": 459} {"train_loss": -9.06647777557373, "global_step": 77188, "epoch": 459} {"train_loss": -9.237720489501953, "global_step": 77189, "epoch": 459} {"train_loss": -9.431711196899414, "global_step": 77190, "epoch": 459} {"train_loss": -9.050731658935547, "global_step": 77191, "epoch": 459} {"train_loss": -8.82425308227539, "global_step": 77192, "epoch": 459} {"train_loss": -8.928232192993164, "global_step": 77193, "epoch": 459} {"train_loss": -8.789543151855469, "global_step": 77194, "epoch": 459} {"train_loss": -8.172609329223633, "global_step": 77195, "epoch": 459} {"train_loss": -8.761438369750977, "global_step": 77196, "epoch": 459} {"train_loss": -8.9098539352417, "global_step": 77197, "epoch": 459} {"train_loss": -9.060681343078613, "global_step": 77198, "epoch": 459} {"train_loss": -8.944799423217773, "global_step": 77199, "epoch": 459} {"train_loss": -8.86214542388916, "global_step": 77200, "epoch": 459} {"train_loss": -8.90292739868164, "global_step": 77201, "epoch": 459} {"train_loss": -8.895160675048828, "global_step": 77202, "epoch": 459} {"train_loss": -8.838556289672852, "global_step": 77203, "epoch": 459} {"train_loss": -8.83653450012207, "global_step": 77204, "epoch": 459} {"train_loss": -8.537164688110352, "global_step": 77205, "epoch": 459} {"train_loss": -8.774287223815918, "global_step": 77206, "epoch": 459} {"train_loss": -8.673309326171875, "global_step": 77207, "epoch": 459} {"train_loss": -9.061397552490234, "global_step": 77208, "epoch": 459} {"train_loss": -9.067947387695312, "global_step": 77209, "epoch": 459} {"train_loss": -9.058767318725586, "global_step": 77210, "epoch": 459} {"train_loss": -8.920812606811523, "global_step": 77211, "epoch": 459} {"train_loss": -9.05648422241211, "global_step": 77212, "epoch": 459} {"train_loss": -9.015350341796875, "global_step": 77213, "epoch": 459} {"train_loss": -9.094165802001953, "global_step": 77214, "epoch": 459} {"train_loss": -9.213092803955078, "global_step": 77215, "epoch": 459} {"train_loss": -9.381656646728516, "global_step": 77216, "epoch": 459} {"train_loss": -9.213990211486816, "global_step": 77217, "epoch": 459} {"train_loss": -9.186147689819336, "global_step": 77218, "epoch": 459} {"train_loss": -9.295625686645508, "global_step": 77219, "epoch": 459} {"train_loss": -9.310032844543457, "global_step": 77220, "epoch": 459} {"train_loss": -9.469391822814941, "global_step": 77221, "epoch": 459} {"train_loss": -9.209269523620605, "global_step": 77222, "epoch": 459} {"train_loss": -9.146122932434082, "global_step": 77223, "epoch": 459} {"train_loss": -9.155862808227539, "global_step": 77224, "epoch": 459} {"train_loss": -9.203401565551758, "global_step": 77225, "epoch": 459} {"train_loss": -9.247832298278809, "global_step": 77226, "epoch": 459} {"train_loss": -9.261099815368652, "global_step": 77227, "epoch": 459} {"train_loss": -9.08840274810791, "global_step": 77228, "epoch": 459} {"train_loss": -9.11846923828125, "global_step": 77229, "epoch": 459} {"train_loss": -9.179244995117188, "global_step": 77230, "epoch": 459} {"train_loss": -9.386754989624023, "global_step": 77231, "epoch": 459} {"train_loss": -9.069698333740234, "global_step": 77232, "epoch": 459} {"train_loss": -9.20240306854248, "global_step": 77233, "epoch": 459} {"train_loss": -8.991083145141602, "global_step": 77234, "epoch": 459} {"train_loss": -9.375713348388672, "global_step": 77235, "epoch": 459} {"train_loss": -8.852090835571289, "global_step": 77236, "epoch": 459} {"train_loss": -9.301709175109863, "global_step": 77237, "epoch": 459} {"train_loss": -9.078995704650879, "global_step": 77238, "epoch": 459} {"train_loss": -9.221475601196289, "global_step": 77239, "epoch": 459} {"train_loss": -9.060178756713867, "global_step": 77240, "epoch": 459} {"train_loss": -9.410835266113281, "global_step": 77241, "epoch": 459} {"train_loss": -8.875080108642578, "global_step": 77242, "epoch": 459} {"train_loss": -9.068955421447754, "global_step": 77243, "epoch": 459} {"train_loss": -9.00632381439209, "global_step": 77244, "epoch": 459} {"train_loss": -8.93082332611084, "global_step": 77245, "epoch": 459} {"train_loss": -9.278348922729492, "global_step": 77246, "epoch": 459} {"train_loss": -8.969654083251953, "global_step": 77247, "epoch": 459} {"train_loss": -9.207436561584473, "global_step": 77248, "epoch": 459} {"train_loss": -9.087061882019043, "global_step": 77249, "epoch": 459} {"train_loss": -9.203363418579102, "global_step": 77250, "epoch": 459} {"train_loss": -9.190073013305664, "global_step": 77251, "epoch": 459} {"train_loss": -9.218324661254883, "global_step": 77252, "epoch": 459} {"train_loss": -9.25590705871582, "global_step": 77253, "epoch": 459} {"train_loss": -9.194817543029785, "global_step": 77254, "epoch": 459} {"train_loss": -9.295927047729492, "global_step": 77255, "epoch": 459} {"train_loss": -9.0975341796875, "global_step": 77256, "epoch": 459} {"train_loss": -9.311834335327148, "global_step": 77257, "epoch": 459} {"train_loss": -9.079351425170898, "global_step": 77258, "epoch": 459} {"train_loss": -9.12211799621582, "global_step": 77259, "epoch": 459} {"train_loss": -9.294812202453613, "global_step": 77260, "epoch": 459} {"train_loss": -9.242810249328613, "global_step": 77261, "epoch": 459} {"train_loss": -9.23934268951416, "global_step": 77262, "epoch": 459} {"train_loss": -9.458892822265625, "global_step": 77263, "epoch": 459} {"train_loss": -9.084380149841309, "global_step": 77264, "epoch": 459} {"train_loss": -9.407859802246094, "global_step": 77265, "epoch": 459} {"train_loss": -9.10885238647461, "global_step": 77266, "epoch": 459} {"train_loss": -9.35862922668457, "global_step": 77267, "epoch": 459} {"train_loss": -9.126535415649414, "global_step": 77268, "epoch": 459} {"train_loss": -9.351672172546387, "global_step": 77269, "epoch": 459} {"train_loss": -9.204279899597168, "global_step": 77270, "epoch": 459} {"train_loss": -9.111003875732422, "global_step": 77271, "epoch": 459} {"train_loss": -8.969491004943848, "global_step": 77272, "epoch": 459} {"train_loss": -8.769208908081055, "global_step": 77273, "epoch": 459} {"train_loss": -9.04041862487793, "global_step": 77274, "epoch": 459} {"train_loss": -8.644832611083984, "global_step": 77275, "epoch": 459} {"train_loss": -8.925373077392578, "global_step": 77276, "epoch": 459} {"train_loss": -9.095897674560547, "global_step": 77277, "epoch": 459} {"train_loss": -8.929079055786133, "global_step": 77278, "epoch": 459} {"train_loss": -9.056872668720427, "global_step": 77279, "epoch": 459, "val_loss": 197567.21875} {"train_loss": -9.141972541809082, "global_step": 77280, "epoch": 460} {"train_loss": -8.732330322265625, "global_step": 77281, "epoch": 460} {"train_loss": -8.92672348022461, "global_step": 77282, "epoch": 460} {"train_loss": -9.138404846191406, "global_step": 77283, "epoch": 460} {"train_loss": -9.088910102844238, "global_step": 77284, "epoch": 460} {"train_loss": -9.097368240356445, "global_step": 77285, "epoch": 460} {"train_loss": -8.968721389770508, "global_step": 77286, "epoch": 460} {"train_loss": -8.766589164733887, "global_step": 77287, "epoch": 460} {"train_loss": -9.006860733032227, "global_step": 77288, "epoch": 460} {"train_loss": -9.02968978881836, "global_step": 77289, "epoch": 460} {"train_loss": -9.245492935180664, "global_step": 77290, "epoch": 460} {"train_loss": -9.141716003417969, "global_step": 77291, "epoch": 460} {"train_loss": -8.97891616821289, "global_step": 77292, "epoch": 460} {"train_loss": -9.106270790100098, "global_step": 77293, "epoch": 460} {"train_loss": -9.018293380737305, "global_step": 77294, "epoch": 460} {"train_loss": -8.961688995361328, "global_step": 77295, "epoch": 460} {"train_loss": -8.82921028137207, "global_step": 77296, "epoch": 460} {"train_loss": -9.021915435791016, "global_step": 77297, "epoch": 460} {"train_loss": -9.039155960083008, "global_step": 77298, "epoch": 460} {"train_loss": -9.11724853515625, "global_step": 77299, "epoch": 460} {"train_loss": -9.12083911895752, "global_step": 77300, "epoch": 460} {"train_loss": -8.969584465026855, "global_step": 77301, "epoch": 460} {"train_loss": -9.157230377197266, "global_step": 77302, "epoch": 460} {"train_loss": -9.063066482543945, "global_step": 77303, "epoch": 460} {"train_loss": -8.998940467834473, "global_step": 77304, "epoch": 460} {"train_loss": -9.085729598999023, "global_step": 77305, "epoch": 460} {"train_loss": -9.024959564208984, "global_step": 77306, "epoch": 460} {"train_loss": -9.205248832702637, "global_step": 77307, "epoch": 460} {"train_loss": -8.974241256713867, "global_step": 77308, "epoch": 460} {"train_loss": -9.131278991699219, "global_step": 77309, "epoch": 460} {"train_loss": -8.893074035644531, "global_step": 77310, "epoch": 460} {"train_loss": -9.097475051879883, "global_step": 77311, "epoch": 460} {"train_loss": -8.839996337890625, "global_step": 77312, "epoch": 460} {"train_loss": -9.102388381958008, "global_step": 77313, "epoch": 460} {"train_loss": -8.915132522583008, "global_step": 77314, "epoch": 460} {"train_loss": -9.302749633789062, "global_step": 77315, "epoch": 460} {"train_loss": -9.030204772949219, "global_step": 77316, "epoch": 460} {"train_loss": -8.866994857788086, "global_step": 77317, "epoch": 460} {"train_loss": -8.901815414428711, "global_step": 77318, "epoch": 460} {"train_loss": -9.031036376953125, "global_step": 77319, "epoch": 460} {"train_loss": -8.735725402832031, "global_step": 77320, "epoch": 460} {"train_loss": -9.065703392028809, "global_step": 77321, "epoch": 460} {"train_loss": -9.080832481384277, "global_step": 77322, "epoch": 460} {"train_loss": -8.925490379333496, "global_step": 77323, "epoch": 460} {"train_loss": -9.041147232055664, "global_step": 77324, "epoch": 460} {"train_loss": -8.856012344360352, "global_step": 77325, "epoch": 460} {"train_loss": -9.020563125610352, "global_step": 77326, "epoch": 460} {"train_loss": -9.029146194458008, "global_step": 77327, "epoch": 460} {"train_loss": -9.155754089355469, "global_step": 77328, "epoch": 460} {"train_loss": -8.949342727661133, "global_step": 77329, "epoch": 460} {"train_loss": -9.138856887817383, "global_step": 77330, "epoch": 460} {"train_loss": -9.10976791381836, "global_step": 77331, "epoch": 460} {"train_loss": -9.179503440856934, "global_step": 77332, "epoch": 460} {"train_loss": -9.084482192993164, "global_step": 77333, "epoch": 460} {"train_loss": -9.157221794128418, "global_step": 77334, "epoch": 460} {"train_loss": -9.049646377563477, "global_step": 77335, "epoch": 460} {"train_loss": -9.181965827941895, "global_step": 77336, "epoch": 460} {"train_loss": -9.191240310668945, "global_step": 77337, "epoch": 460} {"train_loss": -8.94314193725586, "global_step": 77338, "epoch": 460} {"train_loss": -9.20272445678711, "global_step": 77339, "epoch": 460} {"train_loss": -9.153030395507812, "global_step": 77340, "epoch": 460} {"train_loss": -9.179239273071289, "global_step": 77341, "epoch": 460} {"train_loss": -9.337986946105957, "global_step": 77342, "epoch": 460} {"train_loss": -9.352815628051758, "global_step": 77343, "epoch": 460} {"train_loss": -8.988664627075195, "global_step": 77344, "epoch": 460} {"train_loss": -8.8798828125, "global_step": 77345, "epoch": 460} {"train_loss": -9.297898292541504, "global_step": 77346, "epoch": 460} {"train_loss": -9.152472496032715, "global_step": 77347, "epoch": 460} {"train_loss": -9.262176513671875, "global_step": 77348, "epoch": 460} {"train_loss": -9.230548858642578, "global_step": 77349, "epoch": 460} {"train_loss": -9.257646560668945, "global_step": 77350, "epoch": 460} {"train_loss": -9.323224067687988, "global_step": 77351, "epoch": 460} {"train_loss": -9.512004852294922, "global_step": 77352, "epoch": 460} {"train_loss": -9.350594520568848, "global_step": 77353, "epoch": 460} {"train_loss": -9.307401657104492, "global_step": 77354, "epoch": 460} {"train_loss": -9.001922607421875, "global_step": 77355, "epoch": 460} {"train_loss": -9.200736999511719, "global_step": 77356, "epoch": 460} {"train_loss": -8.748580932617188, "global_step": 77357, "epoch": 460} {"train_loss": -8.781754493713379, "global_step": 77358, "epoch": 460} {"train_loss": -8.920708656311035, "global_step": 77359, "epoch": 460} {"train_loss": -9.06093978881836, "global_step": 77360, "epoch": 460} {"train_loss": -8.508173942565918, "global_step": 77361, "epoch": 460} {"train_loss": -8.981399536132812, "global_step": 77362, "epoch": 460} {"train_loss": -8.509683609008789, "global_step": 77363, "epoch": 460} {"train_loss": -8.990042686462402, "global_step": 77364, "epoch": 460} {"train_loss": -8.694686889648438, "global_step": 77365, "epoch": 460} {"train_loss": -8.50523567199707, "global_step": 77366, "epoch": 460} {"train_loss": -9.09521770477295, "global_step": 77367, "epoch": 460} {"train_loss": -8.558908462524414, "global_step": 77368, "epoch": 460} {"train_loss": -8.731593132019043, "global_step": 77369, "epoch": 460} {"train_loss": -8.340490341186523, "global_step": 77370, "epoch": 460} {"train_loss": -8.569427490234375, "global_step": 77371, "epoch": 460} {"train_loss": -8.999247550964355, "global_step": 77372, "epoch": 460} {"train_loss": -8.593416213989258, "global_step": 77373, "epoch": 460} {"train_loss": -8.769271850585938, "global_step": 77374, "epoch": 460} {"train_loss": -8.64200496673584, "global_step": 77375, "epoch": 460} {"train_loss": -8.928369522094727, "global_step": 77376, "epoch": 460} {"train_loss": -8.646023750305176, "global_step": 77377, "epoch": 460} {"train_loss": -8.922626495361328, "global_step": 77378, "epoch": 460} {"train_loss": -9.017223358154297, "global_step": 77379, "epoch": 460} {"train_loss": -9.07746410369873, "global_step": 77380, "epoch": 460} {"train_loss": -8.949239730834961, "global_step": 77381, "epoch": 460} {"train_loss": -8.863924026489258, "global_step": 77382, "epoch": 460} {"train_loss": -8.951684951782227, "global_step": 77383, "epoch": 460} {"train_loss": -8.921567916870117, "global_step": 77384, "epoch": 460} {"train_loss": -8.92370891571045, "global_step": 77385, "epoch": 460} {"train_loss": -9.13839340209961, "global_step": 77386, "epoch": 460} {"train_loss": -9.055704116821289, "global_step": 77387, "epoch": 460} {"train_loss": -9.184639930725098, "global_step": 77388, "epoch": 460} {"train_loss": -9.076484680175781, "global_step": 77389, "epoch": 460} {"train_loss": -9.144322395324707, "global_step": 77390, "epoch": 460} {"train_loss": -9.094017028808594, "global_step": 77391, "epoch": 460} {"train_loss": -9.129680633544922, "global_step": 77392, "epoch": 460} {"train_loss": -9.308053016662598, "global_step": 77393, "epoch": 460} {"train_loss": -8.935165405273438, "global_step": 77394, "epoch": 460} {"train_loss": -8.86132526397705, "global_step": 77395, "epoch": 460} {"train_loss": -9.131490707397461, "global_step": 77396, "epoch": 460} {"train_loss": -9.235965728759766, "global_step": 77397, "epoch": 460} {"train_loss": -9.102252960205078, "global_step": 77398, "epoch": 460} {"train_loss": -9.16558837890625, "global_step": 77399, "epoch": 460} {"train_loss": -9.283599853515625, "global_step": 77400, "epoch": 460} {"train_loss": -8.823274612426758, "global_step": 77401, "epoch": 460} {"train_loss": -9.279426574707031, "global_step": 77402, "epoch": 460} {"train_loss": -9.212586402893066, "global_step": 77403, "epoch": 460} {"train_loss": -9.114595413208008, "global_step": 77404, "epoch": 460} {"train_loss": -8.973067283630371, "global_step": 77405, "epoch": 460} {"train_loss": -9.487237930297852, "global_step": 77406, "epoch": 460} {"train_loss": -9.101090431213379, "global_step": 77407, "epoch": 460} {"train_loss": -9.331033706665039, "global_step": 77408, "epoch": 460} {"train_loss": -8.92318058013916, "global_step": 77409, "epoch": 460} {"train_loss": -9.457586288452148, "global_step": 77410, "epoch": 460} {"train_loss": -9.195261001586914, "global_step": 77411, "epoch": 460} {"train_loss": -9.458111763000488, "global_step": 77412, "epoch": 460} {"train_loss": -9.051973342895508, "global_step": 77413, "epoch": 460} {"train_loss": -8.98334789276123, "global_step": 77414, "epoch": 460} {"train_loss": -8.740280151367188, "global_step": 77415, "epoch": 460} {"train_loss": -9.296321868896484, "global_step": 77416, "epoch": 460} {"train_loss": -8.557167053222656, "global_step": 77417, "epoch": 460} {"train_loss": -9.312292098999023, "global_step": 77418, "epoch": 460} {"train_loss": -8.777307510375977, "global_step": 77419, "epoch": 460} {"train_loss": -8.984489440917969, "global_step": 77420, "epoch": 460} {"train_loss": -9.227842330932617, "global_step": 77421, "epoch": 460} {"train_loss": -8.665366172790527, "global_step": 77422, "epoch": 460} {"train_loss": -9.105669021606445, "global_step": 77423, "epoch": 460} {"train_loss": -8.731122970581055, "global_step": 77424, "epoch": 460} {"train_loss": -9.071950912475586, "global_step": 77425, "epoch": 460} {"train_loss": -9.322736740112305, "global_step": 77426, "epoch": 460} {"train_loss": -9.187997817993164, "global_step": 77427, "epoch": 460} {"train_loss": -9.31479263305664, "global_step": 77428, "epoch": 460} {"train_loss": -9.080049514770508, "global_step": 77429, "epoch": 460} {"train_loss": -9.078348159790039, "global_step": 77430, "epoch": 460} {"train_loss": -9.216012954711914, "global_step": 77431, "epoch": 460} {"train_loss": -9.097179412841797, "global_step": 77432, "epoch": 460} {"train_loss": -9.064334869384766, "global_step": 77433, "epoch": 460} {"train_loss": -9.176933288574219, "global_step": 77434, "epoch": 460} {"train_loss": -8.922314643859863, "global_step": 77435, "epoch": 460} {"train_loss": -9.168656349182129, "global_step": 77436, "epoch": 460} {"train_loss": -9.069375038146973, "global_step": 77437, "epoch": 460} {"train_loss": -9.192289352416992, "global_step": 77438, "epoch": 460} {"train_loss": -9.199081420898438, "global_step": 77439, "epoch": 460} {"train_loss": -8.898418426513672, "global_step": 77440, "epoch": 460} {"train_loss": -9.194883346557617, "global_step": 77441, "epoch": 460} {"train_loss": -9.229896545410156, "global_step": 77442, "epoch": 460} {"train_loss": -9.267590522766113, "global_step": 77443, "epoch": 460} {"train_loss": -9.167515754699707, "global_step": 77444, "epoch": 460} {"train_loss": -9.182062149047852, "global_step": 77445, "epoch": 460} {"train_loss": -8.906335830688477, "global_step": 77446, "epoch": 460} {"train_loss": -9.041296714828128, "global_step": 77447, "epoch": 460, "val_loss": 195214.640625, "train_action_mse_error": 4.194271087646484} {"train_loss": -9.158698081970215, "global_step": 77448, "epoch": 461} {"train_loss": -9.154218673706055, "global_step": 77449, "epoch": 461} {"train_loss": -8.995471954345703, "global_step": 77450, "epoch": 461} {"train_loss": -9.277271270751953, "global_step": 77451, "epoch": 461} {"train_loss": -9.345458984375, "global_step": 77452, "epoch": 461} {"train_loss": -9.130435943603516, "global_step": 77453, "epoch": 461} {"train_loss": -9.342582702636719, "global_step": 77454, "epoch": 461} {"train_loss": -8.966054916381836, "global_step": 77455, "epoch": 461} {"train_loss": -9.065890312194824, "global_step": 77456, "epoch": 461} {"train_loss": -9.243050575256348, "global_step": 77457, "epoch": 461} {"train_loss": -9.413495063781738, "global_step": 77458, "epoch": 461} {"train_loss": -8.964607238769531, "global_step": 77459, "epoch": 461} {"train_loss": -9.344547271728516, "global_step": 77460, "epoch": 461} {"train_loss": -9.242243766784668, "global_step": 77461, "epoch": 461} {"train_loss": -9.194547653198242, "global_step": 77462, "epoch": 461} {"train_loss": -9.00290298461914, "global_step": 77463, "epoch": 461} {"train_loss": -9.156026840209961, "global_step": 77464, "epoch": 461} {"train_loss": -9.0040864944458, "global_step": 77465, "epoch": 461} {"train_loss": -9.094870567321777, "global_step": 77466, "epoch": 461} {"train_loss": -8.77238941192627, "global_step": 77467, "epoch": 461} {"train_loss": -8.892180442810059, "global_step": 77468, "epoch": 461} {"train_loss": -8.91848373413086, "global_step": 77469, "epoch": 461} {"train_loss": -8.951910018920898, "global_step": 77470, "epoch": 461} {"train_loss": -8.953925132751465, "global_step": 77471, "epoch": 461} {"train_loss": -9.146831512451172, "global_step": 77472, "epoch": 461} {"train_loss": -9.275796890258789, "global_step": 77473, "epoch": 461} {"train_loss": -9.314631462097168, "global_step": 77474, "epoch": 461} {"train_loss": -9.226287841796875, "global_step": 77475, "epoch": 461} {"train_loss": -9.104530334472656, "global_step": 77476, "epoch": 461} {"train_loss": -8.982828140258789, "global_step": 77477, "epoch": 461} {"train_loss": -8.865942001342773, "global_step": 77478, "epoch": 461} {"train_loss": -9.093889236450195, "global_step": 77479, "epoch": 461} {"train_loss": -9.126680374145508, "global_step": 77480, "epoch": 461} {"train_loss": -9.016765594482422, "global_step": 77481, "epoch": 461} {"train_loss": -9.1981782913208, "global_step": 77482, "epoch": 461} {"train_loss": -8.860702514648438, "global_step": 77483, "epoch": 461} {"train_loss": -9.2575044631958, "global_step": 77484, "epoch": 461} {"train_loss": -9.167510986328125, "global_step": 77485, "epoch": 461} {"train_loss": -9.068872451782227, "global_step": 77486, "epoch": 461} {"train_loss": -9.224359512329102, "global_step": 77487, "epoch": 461} {"train_loss": -9.068138122558594, "global_step": 77488, "epoch": 461} {"train_loss": -9.194021224975586, "global_step": 77489, "epoch": 461} {"train_loss": -8.992055892944336, "global_step": 77490, "epoch": 461} {"train_loss": -9.334298133850098, "global_step": 77491, "epoch": 461} {"train_loss": -9.275630950927734, "global_step": 77492, "epoch": 461} {"train_loss": -9.334918022155762, "global_step": 77493, "epoch": 461} {"train_loss": -9.095348358154297, "global_step": 77494, "epoch": 461} {"train_loss": -9.388535499572754, "global_step": 77495, "epoch": 461} {"train_loss": -9.287668228149414, "global_step": 77496, "epoch": 461} {"train_loss": -9.229576110839844, "global_step": 77497, "epoch": 461} {"train_loss": -9.594515800476074, "global_step": 77498, "epoch": 461} {"train_loss": -9.238718032836914, "global_step": 77499, "epoch": 461} {"train_loss": -9.197713851928711, "global_step": 77500, "epoch": 461} {"train_loss": -9.125511169433594, "global_step": 77501, "epoch": 461} {"train_loss": -9.18551254272461, "global_step": 77502, "epoch": 461} {"train_loss": -9.174813270568848, "global_step": 77503, "epoch": 461} {"train_loss": -9.38264274597168, "global_step": 77504, "epoch": 461} {"train_loss": -8.952486038208008, "global_step": 77505, "epoch": 461} {"train_loss": -8.894489288330078, "global_step": 77506, "epoch": 461} {"train_loss": -9.183784484863281, "global_step": 77507, "epoch": 461} {"train_loss": -9.322877883911133, "global_step": 77508, "epoch": 461} {"train_loss": -9.362403869628906, "global_step": 77509, "epoch": 461} {"train_loss": -8.928661346435547, "global_step": 77510, "epoch": 461} {"train_loss": -9.227737426757812, "global_step": 77511, "epoch": 461} {"train_loss": -8.883476257324219, "global_step": 77512, "epoch": 461} {"train_loss": -9.439414978027344, "global_step": 77513, "epoch": 461} {"train_loss": -9.143726348876953, "global_step": 77514, "epoch": 461} {"train_loss": -9.102782249450684, "global_step": 77515, "epoch": 461} {"train_loss": -9.283736228942871, "global_step": 77516, "epoch": 461} {"train_loss": -9.39484977722168, "global_step": 77517, "epoch": 461} {"train_loss": -9.338655471801758, "global_step": 77518, "epoch": 461} {"train_loss": -9.131105422973633, "global_step": 77519, "epoch": 461} {"train_loss": -9.110724449157715, "global_step": 77520, "epoch": 461} {"train_loss": -9.037479400634766, "global_step": 77521, "epoch": 461} {"train_loss": -9.276015281677246, "global_step": 77522, "epoch": 461} {"train_loss": -8.995383262634277, "global_step": 77523, "epoch": 461} {"train_loss": -9.283975601196289, "global_step": 77524, "epoch": 461} {"train_loss": -9.039094924926758, "global_step": 77525, "epoch": 461} {"train_loss": -8.850894927978516, "global_step": 77526, "epoch": 461} {"train_loss": -8.763994216918945, "global_step": 77527, "epoch": 461} {"train_loss": -8.515430450439453, "global_step": 77528, "epoch": 461} {"train_loss": -8.562252044677734, "global_step": 77529, "epoch": 461} {"train_loss": -8.565912246704102, "global_step": 77530, "epoch": 461} {"train_loss": -8.844950675964355, "global_step": 77531, "epoch": 461} {"train_loss": -8.608304977416992, "global_step": 77532, "epoch": 461} {"train_loss": -9.088282585144043, "global_step": 77533, "epoch": 461} {"train_loss": -8.89820671081543, "global_step": 77534, "epoch": 461} {"train_loss": -8.570083618164062, "global_step": 77535, "epoch": 461} {"train_loss": -8.713167190551758, "global_step": 77536, "epoch": 461} {"train_loss": -8.665681838989258, "global_step": 77537, "epoch": 461} {"train_loss": -8.65024185180664, "global_step": 77538, "epoch": 461} {"train_loss": -8.694487571716309, "global_step": 77539, "epoch": 461} {"train_loss": -8.957572937011719, "global_step": 77540, "epoch": 461} {"train_loss": -8.854656219482422, "global_step": 77541, "epoch": 461} {"train_loss": -8.897430419921875, "global_step": 77542, "epoch": 461} {"train_loss": -8.825213432312012, "global_step": 77543, "epoch": 461} {"train_loss": -8.934955596923828, "global_step": 77544, "epoch": 461} {"train_loss": -8.855429649353027, "global_step": 77545, "epoch": 461} {"train_loss": -9.200454711914062, "global_step": 77546, "epoch": 461} {"train_loss": -9.251519203186035, "global_step": 77547, "epoch": 461} {"train_loss": -9.169678688049316, "global_step": 77548, "epoch": 461} {"train_loss": -9.089958190917969, "global_step": 77549, "epoch": 461} {"train_loss": -9.074018478393555, "global_step": 77550, "epoch": 461} {"train_loss": -9.124872207641602, "global_step": 77551, "epoch": 461} {"train_loss": -9.13991641998291, "global_step": 77552, "epoch": 461} {"train_loss": -9.23747730255127, "global_step": 77553, "epoch": 461} {"train_loss": -9.401609420776367, "global_step": 77554, "epoch": 461} {"train_loss": -9.393316268920898, "global_step": 77555, "epoch": 461} {"train_loss": -9.347477912902832, "global_step": 77556, "epoch": 461} {"train_loss": -9.229276657104492, "global_step": 77557, "epoch": 461} {"train_loss": -9.09375, "global_step": 77558, "epoch": 461} {"train_loss": -9.153620719909668, "global_step": 77559, "epoch": 461} {"train_loss": -9.336530685424805, "global_step": 77560, "epoch": 461} {"train_loss": -9.171987533569336, "global_step": 77561, "epoch": 461} {"train_loss": -9.428929328918457, "global_step": 77562, "epoch": 461} {"train_loss": -9.316408157348633, "global_step": 77563, "epoch": 461} {"train_loss": -9.091682434082031, "global_step": 77564, "epoch": 461} {"train_loss": -9.396807670593262, "global_step": 77565, "epoch": 461} {"train_loss": -9.334660530090332, "global_step": 77566, "epoch": 461} {"train_loss": -9.235666275024414, "global_step": 77567, "epoch": 461} {"train_loss": -9.246184349060059, "global_step": 77568, "epoch": 461} {"train_loss": -9.325437545776367, "global_step": 77569, "epoch": 461} {"train_loss": -8.995851516723633, "global_step": 77570, "epoch": 461} {"train_loss": -8.979561805725098, "global_step": 77571, "epoch": 461} {"train_loss": -8.706901550292969, "global_step": 77572, "epoch": 461} {"train_loss": -9.472925186157227, "global_step": 77573, "epoch": 461} {"train_loss": -8.761543273925781, "global_step": 77574, "epoch": 461} {"train_loss": -8.742647171020508, "global_step": 77575, "epoch": 461} {"train_loss": -8.987815856933594, "global_step": 77576, "epoch": 461} {"train_loss": -8.434510231018066, "global_step": 77577, "epoch": 461} {"train_loss": -8.511102676391602, "global_step": 77578, "epoch": 461} {"train_loss": -8.891075134277344, "global_step": 77579, "epoch": 461} {"train_loss": -8.86728286743164, "global_step": 77580, "epoch": 461} {"train_loss": -8.655183792114258, "global_step": 77581, "epoch": 461} {"train_loss": -8.755294799804688, "global_step": 77582, "epoch": 461} {"train_loss": -9.058456420898438, "global_step": 77583, "epoch": 461} {"train_loss": -8.935822486877441, "global_step": 77584, "epoch": 461} {"train_loss": -8.790185928344727, "global_step": 77585, "epoch": 461} {"train_loss": -9.15632152557373, "global_step": 77586, "epoch": 461} {"train_loss": -8.98668384552002, "global_step": 77587, "epoch": 461} {"train_loss": -8.856243133544922, "global_step": 77588, "epoch": 461} {"train_loss": -8.934368133544922, "global_step": 77589, "epoch": 461} {"train_loss": -9.028850555419922, "global_step": 77590, "epoch": 461} {"train_loss": -8.936068534851074, "global_step": 77591, "epoch": 461} {"train_loss": -9.025260925292969, "global_step": 77592, "epoch": 461} {"train_loss": -9.189362525939941, "global_step": 77593, "epoch": 461} {"train_loss": -9.037208557128906, "global_step": 77594, "epoch": 461} {"train_loss": -9.016458511352539, "global_step": 77595, "epoch": 461} {"train_loss": -9.15477180480957, "global_step": 77596, "epoch": 461} {"train_loss": -9.146222114562988, "global_step": 77597, "epoch": 461} {"train_loss": -8.797199249267578, "global_step": 77598, "epoch": 461} {"train_loss": -9.116104125976562, "global_step": 77599, "epoch": 461} {"train_loss": -9.134611129760742, "global_step": 77600, "epoch": 461} {"train_loss": -9.076274871826172, "global_step": 77601, "epoch": 461} {"train_loss": -9.233007431030273, "global_step": 77602, "epoch": 461} {"train_loss": -9.533443450927734, "global_step": 77603, "epoch": 461} {"train_loss": -9.226469993591309, "global_step": 77604, "epoch": 461} {"train_loss": -9.2621488571167, "global_step": 77605, "epoch": 461} {"train_loss": -9.13672924041748, "global_step": 77606, "epoch": 461} {"train_loss": -9.195676803588867, "global_step": 77607, "epoch": 461} {"train_loss": -9.095967292785645, "global_step": 77608, "epoch": 461} {"train_loss": -9.22085952758789, "global_step": 77609, "epoch": 461} {"train_loss": -9.136680603027344, "global_step": 77610, "epoch": 461} {"train_loss": -8.745101928710938, "global_step": 77611, "epoch": 461} {"train_loss": -9.071446418762207, "global_step": 77612, "epoch": 461} {"train_loss": -9.130330085754395, "global_step": 77613, "epoch": 461} {"train_loss": -9.29389476776123, "global_step": 77614, "epoch": 461} {"train_loss": -9.081652749152411, "global_step": 77615, "epoch": 461, "val_loss": 194216.875} {"train_loss": -9.027246475219727, "global_step": 77616, "epoch": 462} {"train_loss": -9.079267501831055, "global_step": 77617, "epoch": 462} {"train_loss": -8.753427505493164, "global_step": 77618, "epoch": 462} {"train_loss": -8.859309196472168, "global_step": 77619, "epoch": 462} {"train_loss": -9.052217483520508, "global_step": 77620, "epoch": 462} {"train_loss": -9.116567611694336, "global_step": 77621, "epoch": 462} {"train_loss": -8.837213516235352, "global_step": 77622, "epoch": 462} {"train_loss": -9.114334106445312, "global_step": 77623, "epoch": 462} {"train_loss": -9.023374557495117, "global_step": 77624, "epoch": 462} {"train_loss": -8.781147003173828, "global_step": 77625, "epoch": 462} {"train_loss": -9.071773529052734, "global_step": 77626, "epoch": 462} {"train_loss": -9.027734756469727, "global_step": 77627, "epoch": 462} {"train_loss": -8.798738479614258, "global_step": 77628, "epoch": 462} {"train_loss": -8.740129470825195, "global_step": 77629, "epoch": 462} {"train_loss": -8.676301002502441, "global_step": 77630, "epoch": 462} {"train_loss": -8.979249954223633, "global_step": 77631, "epoch": 462} {"train_loss": -8.930841445922852, "global_step": 77632, "epoch": 462} {"train_loss": -9.136064529418945, "global_step": 77633, "epoch": 462} {"train_loss": -8.967026710510254, "global_step": 77634, "epoch": 462} {"train_loss": -9.038511276245117, "global_step": 77635, "epoch": 462} {"train_loss": -9.197166442871094, "global_step": 77636, "epoch": 462} {"train_loss": -9.011606216430664, "global_step": 77637, "epoch": 462} {"train_loss": -9.108563423156738, "global_step": 77638, "epoch": 462} {"train_loss": -9.188165664672852, "global_step": 77639, "epoch": 462} {"train_loss": -9.083892822265625, "global_step": 77640, "epoch": 462} {"train_loss": -9.060752868652344, "global_step": 77641, "epoch": 462} {"train_loss": -9.206737518310547, "global_step": 77642, "epoch": 462} {"train_loss": -8.828353881835938, "global_step": 77643, "epoch": 462} {"train_loss": -9.26618766784668, "global_step": 77644, "epoch": 462} {"train_loss": -9.103355407714844, "global_step": 77645, "epoch": 462} {"train_loss": -9.134499549865723, "global_step": 77646, "epoch": 462} {"train_loss": -9.10848617553711, "global_step": 77647, "epoch": 462} {"train_loss": -8.939414978027344, "global_step": 77648, "epoch": 462} {"train_loss": -9.177896499633789, "global_step": 77649, "epoch": 462} {"train_loss": -9.056934356689453, "global_step": 77650, "epoch": 462} {"train_loss": -9.244149208068848, "global_step": 77651, "epoch": 462} {"train_loss": -9.059857368469238, "global_step": 77652, "epoch": 462} {"train_loss": -9.191479682922363, "global_step": 77653, "epoch": 462} {"train_loss": -9.25896167755127, "global_step": 77654, "epoch": 462} {"train_loss": -8.886316299438477, "global_step": 77655, "epoch": 462} {"train_loss": -9.236822128295898, "global_step": 77656, "epoch": 462} {"train_loss": -8.941658020019531, "global_step": 77657, "epoch": 462} {"train_loss": -8.98330020904541, "global_step": 77658, "epoch": 462} {"train_loss": -8.776060104370117, "global_step": 77659, "epoch": 462} {"train_loss": -9.20091438293457, "global_step": 77660, "epoch": 462} {"train_loss": -9.12391471862793, "global_step": 77661, "epoch": 462} {"train_loss": -8.911674499511719, "global_step": 77662, "epoch": 462} {"train_loss": -8.962779998779297, "global_step": 77663, "epoch": 462} {"train_loss": -8.877891540527344, "global_step": 77664, "epoch": 462} {"train_loss": -8.801078796386719, "global_step": 77665, "epoch": 462} {"train_loss": -8.883840560913086, "global_step": 77666, "epoch": 462} {"train_loss": -8.927244186401367, "global_step": 77667, "epoch": 462} {"train_loss": -8.885181427001953, "global_step": 77668, "epoch": 462} {"train_loss": -9.071438789367676, "global_step": 77669, "epoch": 462} {"train_loss": -8.765350341796875, "global_step": 77670, "epoch": 462} {"train_loss": -9.007447242736816, "global_step": 77671, "epoch": 462} {"train_loss": -8.93514633178711, "global_step": 77672, "epoch": 462} {"train_loss": -8.896038055419922, "global_step": 77673, "epoch": 462} {"train_loss": -8.931851387023926, "global_step": 77674, "epoch": 462} {"train_loss": -8.950769424438477, "global_step": 77675, "epoch": 462} {"train_loss": -8.876363754272461, "global_step": 77676, "epoch": 462} {"train_loss": -9.021082878112793, "global_step": 77677, "epoch": 462} {"train_loss": -8.895694732666016, "global_step": 77678, "epoch": 462} {"train_loss": -8.995573997497559, "global_step": 77679, "epoch": 462} {"train_loss": -8.801168441772461, "global_step": 77680, "epoch": 462} {"train_loss": -9.21585464477539, "global_step": 77681, "epoch": 462} {"train_loss": -8.715117454528809, "global_step": 77682, "epoch": 462} {"train_loss": -8.7418851852417, "global_step": 77683, "epoch": 462} {"train_loss": -8.952526092529297, "global_step": 77684, "epoch": 462} {"train_loss": -9.105676651000977, "global_step": 77685, "epoch": 462} {"train_loss": -8.92064094543457, "global_step": 77686, "epoch": 462} {"train_loss": -9.016717910766602, "global_step": 77687, "epoch": 462} {"train_loss": -8.955260276794434, "global_step": 77688, "epoch": 462} {"train_loss": -9.144754409790039, "global_step": 77689, "epoch": 462} {"train_loss": -9.188573837280273, "global_step": 77690, "epoch": 462} {"train_loss": -9.135944366455078, "global_step": 77691, "epoch": 462} {"train_loss": -9.07105827331543, "global_step": 77692, "epoch": 462} {"train_loss": -9.128523826599121, "global_step": 77693, "epoch": 462} {"train_loss": -9.105183601379395, "global_step": 77694, "epoch": 462} {"train_loss": -9.296849250793457, "global_step": 77695, "epoch": 462} {"train_loss": -9.117273330688477, "global_step": 77696, "epoch": 462} {"train_loss": -9.445272445678711, "global_step": 77697, "epoch": 462} {"train_loss": -9.252042770385742, "global_step": 77698, "epoch": 462} {"train_loss": -9.125530242919922, "global_step": 77699, "epoch": 462} {"train_loss": -9.264291763305664, "global_step": 77700, "epoch": 462} {"train_loss": -9.288599967956543, "global_step": 77701, "epoch": 462} {"train_loss": -9.461979866027832, "global_step": 77702, "epoch": 462} {"train_loss": -9.453657150268555, "global_step": 77703, "epoch": 462} {"train_loss": -9.233491897583008, "global_step": 77704, "epoch": 462} {"train_loss": -9.056587219238281, "global_step": 77705, "epoch": 462} {"train_loss": -9.270011901855469, "global_step": 77706, "epoch": 462} {"train_loss": -9.232826232910156, "global_step": 77707, "epoch": 462} {"train_loss": -8.865044593811035, "global_step": 77708, "epoch": 462} {"train_loss": -9.250526428222656, "global_step": 77709, "epoch": 462} {"train_loss": -9.07088565826416, "global_step": 77710, "epoch": 462} {"train_loss": -8.947280883789062, "global_step": 77711, "epoch": 462} {"train_loss": -8.629186630249023, "global_step": 77712, "epoch": 462} {"train_loss": -9.379477500915527, "global_step": 77713, "epoch": 462} {"train_loss": -8.509611129760742, "global_step": 77714, "epoch": 462} {"train_loss": -9.245208740234375, "global_step": 77715, "epoch": 462} {"train_loss": -8.603652000427246, "global_step": 77716, "epoch": 462} {"train_loss": -8.920791625976562, "global_step": 77717, "epoch": 462} {"train_loss": -8.772836685180664, "global_step": 77718, "epoch": 462} {"train_loss": -8.792125701904297, "global_step": 77719, "epoch": 462} {"train_loss": -8.985923767089844, "global_step": 77720, "epoch": 462} {"train_loss": -8.743255615234375, "global_step": 77721, "epoch": 462} {"train_loss": -9.091875076293945, "global_step": 77722, "epoch": 462} {"train_loss": -8.78842544555664, "global_step": 77723, "epoch": 462} {"train_loss": -9.07197093963623, "global_step": 77724, "epoch": 462} {"train_loss": -8.687097549438477, "global_step": 77725, "epoch": 462} {"train_loss": -9.019766807556152, "global_step": 77726, "epoch": 462} {"train_loss": -9.046182632446289, "global_step": 77727, "epoch": 462} {"train_loss": -9.07989501953125, "global_step": 77728, "epoch": 462} {"train_loss": -9.108040809631348, "global_step": 77729, "epoch": 462} {"train_loss": -8.944412231445312, "global_step": 77730, "epoch": 462} {"train_loss": -9.013833999633789, "global_step": 77731, "epoch": 462} {"train_loss": -8.969568252563477, "global_step": 77732, "epoch": 462} {"train_loss": -8.910788536071777, "global_step": 77733, "epoch": 462} {"train_loss": -9.047711372375488, "global_step": 77734, "epoch": 462} {"train_loss": -8.727445602416992, "global_step": 77735, "epoch": 462} {"train_loss": -9.141386032104492, "global_step": 77736, "epoch": 462} {"train_loss": -9.086797714233398, "global_step": 77737, "epoch": 462} {"train_loss": -9.229162216186523, "global_step": 77738, "epoch": 462} {"train_loss": -9.209224700927734, "global_step": 77739, "epoch": 462} {"train_loss": -9.004450798034668, "global_step": 77740, "epoch": 462} {"train_loss": -9.002176284790039, "global_step": 77741, "epoch": 462} {"train_loss": -9.064592361450195, "global_step": 77742, "epoch": 462} {"train_loss": -9.17269229888916, "global_step": 77743, "epoch": 462} {"train_loss": -8.96026611328125, "global_step": 77744, "epoch": 462} {"train_loss": -9.012598037719727, "global_step": 77745, "epoch": 462} {"train_loss": -9.132843017578125, "global_step": 77746, "epoch": 462} {"train_loss": -8.655733108520508, "global_step": 77747, "epoch": 462} {"train_loss": -8.78132438659668, "global_step": 77748, "epoch": 462} {"train_loss": -9.232050895690918, "global_step": 77749, "epoch": 462} {"train_loss": -8.774866104125977, "global_step": 77750, "epoch": 462} {"train_loss": -8.748086929321289, "global_step": 77751, "epoch": 462} {"train_loss": -9.167994499206543, "global_step": 77752, "epoch": 462} {"train_loss": -9.148847579956055, "global_step": 77753, "epoch": 462} {"train_loss": -8.82586669921875, "global_step": 77754, "epoch": 462} {"train_loss": -9.30575942993164, "global_step": 77755, "epoch": 462} {"train_loss": -9.10789680480957, "global_step": 77756, "epoch": 462} {"train_loss": -8.96041488647461, "global_step": 77757, "epoch": 462} {"train_loss": -9.262765884399414, "global_step": 77758, "epoch": 462} {"train_loss": -9.29266357421875, "global_step": 77759, "epoch": 462} {"train_loss": -9.02064323425293, "global_step": 77760, "epoch": 462} {"train_loss": -9.185613632202148, "global_step": 77761, "epoch": 462} {"train_loss": -9.058177947998047, "global_step": 77762, "epoch": 462} {"train_loss": -8.978996276855469, "global_step": 77763, "epoch": 462} {"train_loss": -9.22346019744873, "global_step": 77764, "epoch": 462} {"train_loss": -9.249279022216797, "global_step": 77765, "epoch": 462} {"train_loss": -9.199445724487305, "global_step": 77766, "epoch": 462} {"train_loss": -9.39937973022461, "global_step": 77767, "epoch": 462} {"train_loss": -9.247303009033203, "global_step": 77768, "epoch": 462} {"train_loss": -9.43604850769043, "global_step": 77769, "epoch": 462} {"train_loss": -9.466693878173828, "global_step": 77770, "epoch": 462} {"train_loss": -9.387960433959961, "global_step": 77771, "epoch": 462} {"train_loss": -9.063552856445312, "global_step": 77772, "epoch": 462} {"train_loss": -9.230049133300781, "global_step": 77773, "epoch": 462} {"train_loss": -9.551627159118652, "global_step": 77774, "epoch": 462} {"train_loss": -9.235958099365234, "global_step": 77775, "epoch": 462} {"train_loss": -9.296516418457031, "global_step": 77776, "epoch": 462} {"train_loss": -9.017934799194336, "global_step": 77777, "epoch": 462} {"train_loss": -9.175033569335938, "global_step": 77778, "epoch": 462} {"train_loss": -9.29658031463623, "global_step": 77779, "epoch": 462} {"train_loss": -8.9751558303833, "global_step": 77780, "epoch": 462} {"train_loss": -9.495340347290039, "global_step": 77781, "epoch": 462} {"train_loss": -9.169951438903809, "global_step": 77782, "epoch": 462} {"train_loss": -9.052180767059326, "global_step": 77783, "epoch": 462, "val_loss": 195877.171875} {"train_loss": -9.13723087310791, "global_step": 77784, "epoch": 463} {"train_loss": -9.405340194702148, "global_step": 77785, "epoch": 463} {"train_loss": -9.274078369140625, "global_step": 77786, "epoch": 463} {"train_loss": -9.129895210266113, "global_step": 77787, "epoch": 463} {"train_loss": -8.932458877563477, "global_step": 77788, "epoch": 463} {"train_loss": -9.054811477661133, "global_step": 77789, "epoch": 463} {"train_loss": -9.102832794189453, "global_step": 77790, "epoch": 463} {"train_loss": -9.135440826416016, "global_step": 77791, "epoch": 463} {"train_loss": -8.881109237670898, "global_step": 77792, "epoch": 463} {"train_loss": -9.328847885131836, "global_step": 77793, "epoch": 463} {"train_loss": -8.774808883666992, "global_step": 77794, "epoch": 463} {"train_loss": -9.134517669677734, "global_step": 77795, "epoch": 463} {"train_loss": -9.034246444702148, "global_step": 77796, "epoch": 463} {"train_loss": -8.557387351989746, "global_step": 77797, "epoch": 463} {"train_loss": -8.864713668823242, "global_step": 77798, "epoch": 463} {"train_loss": -8.813558578491211, "global_step": 77799, "epoch": 463} {"train_loss": -8.69766616821289, "global_step": 77800, "epoch": 463} {"train_loss": -8.646323204040527, "global_step": 77801, "epoch": 463} {"train_loss": -9.094892501831055, "global_step": 77802, "epoch": 463} {"train_loss": -8.826370239257812, "global_step": 77803, "epoch": 463} {"train_loss": -9.113344192504883, "global_step": 77804, "epoch": 463} {"train_loss": -8.908023834228516, "global_step": 77805, "epoch": 463} {"train_loss": -8.978347778320312, "global_step": 77806, "epoch": 463} {"train_loss": -8.659866333007812, "global_step": 77807, "epoch": 463} {"train_loss": -9.120928764343262, "global_step": 77808, "epoch": 463} {"train_loss": -8.917362213134766, "global_step": 77809, "epoch": 463} {"train_loss": -8.943140029907227, "global_step": 77810, "epoch": 463} {"train_loss": -8.876277923583984, "global_step": 77811, "epoch": 463} {"train_loss": -9.194089889526367, "global_step": 77812, "epoch": 463} {"train_loss": -9.071979522705078, "global_step": 77813, "epoch": 463} {"train_loss": -8.943099021911621, "global_step": 77814, "epoch": 463} {"train_loss": -8.966560363769531, "global_step": 77815, "epoch": 463} {"train_loss": -9.166096687316895, "global_step": 77816, "epoch": 463} {"train_loss": -8.78925609588623, "global_step": 77817, "epoch": 463} {"train_loss": -9.14499282836914, "global_step": 77818, "epoch": 463} {"train_loss": -9.289140701293945, "global_step": 77819, "epoch": 463} {"train_loss": -9.24262523651123, "global_step": 77820, "epoch": 463} {"train_loss": -9.279016494750977, "global_step": 77821, "epoch": 463} {"train_loss": -9.252971649169922, "global_step": 77822, "epoch": 463} {"train_loss": -9.352216720581055, "global_step": 77823, "epoch": 463} {"train_loss": -9.355274200439453, "global_step": 77824, "epoch": 463} {"train_loss": -9.070486068725586, "global_step": 77825, "epoch": 463} {"train_loss": -9.180543899536133, "global_step": 77826, "epoch": 463} {"train_loss": -9.389840126037598, "global_step": 77827, "epoch": 463} {"train_loss": -9.124245643615723, "global_step": 77828, "epoch": 463} {"train_loss": -9.3323392868042, "global_step": 77829, "epoch": 463} {"train_loss": -9.363451957702637, "global_step": 77830, "epoch": 463} {"train_loss": -9.179997444152832, "global_step": 77831, "epoch": 463} {"train_loss": -9.289112091064453, "global_step": 77832, "epoch": 463} {"train_loss": -9.415258407592773, "global_step": 77833, "epoch": 463} {"train_loss": -9.196584701538086, "global_step": 77834, "epoch": 463} {"train_loss": -9.345171928405762, "global_step": 77835, "epoch": 463} {"train_loss": -9.089601516723633, "global_step": 77836, "epoch": 463} {"train_loss": -9.464395523071289, "global_step": 77837, "epoch": 463} {"train_loss": -9.20897102355957, "global_step": 77838, "epoch": 463} {"train_loss": -9.578625679016113, "global_step": 77839, "epoch": 463} {"train_loss": -9.104269027709961, "global_step": 77840, "epoch": 463} {"train_loss": -9.173954010009766, "global_step": 77841, "epoch": 463} {"train_loss": -9.11618709564209, "global_step": 77842, "epoch": 463} {"train_loss": -9.391059875488281, "global_step": 77843, "epoch": 463} {"train_loss": -9.392030715942383, "global_step": 77844, "epoch": 463} {"train_loss": -9.032970428466797, "global_step": 77845, "epoch": 463} {"train_loss": -9.307511329650879, "global_step": 77846, "epoch": 463} {"train_loss": -8.91225814819336, "global_step": 77847, "epoch": 463} {"train_loss": -9.026296615600586, "global_step": 77848, "epoch": 463} {"train_loss": -8.761345863342285, "global_step": 77849, "epoch": 463} {"train_loss": -8.97485637664795, "global_step": 77850, "epoch": 463} {"train_loss": -8.733142852783203, "global_step": 77851, "epoch": 463} {"train_loss": -8.932376861572266, "global_step": 77852, "epoch": 463} {"train_loss": -9.332990646362305, "global_step": 77853, "epoch": 463} {"train_loss": -9.206010818481445, "global_step": 77854, "epoch": 463} {"train_loss": -9.182783126831055, "global_step": 77855, "epoch": 463} {"train_loss": -9.038285255432129, "global_step": 77856, "epoch": 463} {"train_loss": -9.143921852111816, "global_step": 77857, "epoch": 463} {"train_loss": -9.004825592041016, "global_step": 77858, "epoch": 463} {"train_loss": -9.173931121826172, "global_step": 77859, "epoch": 463} {"train_loss": -9.048527717590332, "global_step": 77860, "epoch": 463} {"train_loss": -9.178016662597656, "global_step": 77861, "epoch": 463} {"train_loss": -9.018213272094727, "global_step": 77862, "epoch": 463} {"train_loss": -9.09459400177002, "global_step": 77863, "epoch": 463} {"train_loss": -8.917704582214355, "global_step": 77864, "epoch": 463} {"train_loss": -9.173589706420898, "global_step": 77865, "epoch": 463} {"train_loss": -8.899555206298828, "global_step": 77866, "epoch": 463} {"train_loss": -9.178296089172363, "global_step": 77867, "epoch": 463} {"train_loss": -9.115326881408691, "global_step": 77868, "epoch": 463} {"train_loss": -8.843448638916016, "global_step": 77869, "epoch": 463} {"train_loss": -9.01668930053711, "global_step": 77870, "epoch": 463} {"train_loss": -8.972030639648438, "global_step": 77871, "epoch": 463} {"train_loss": -8.972054481506348, "global_step": 77872, "epoch": 463} {"train_loss": -9.232889175415039, "global_step": 77873, "epoch": 463} {"train_loss": -8.729022026062012, "global_step": 77874, "epoch": 463} {"train_loss": -9.158510208129883, "global_step": 77875, "epoch": 463} {"train_loss": -8.808656692504883, "global_step": 77876, "epoch": 463} {"train_loss": -9.321250915527344, "global_step": 77877, "epoch": 463} {"train_loss": -8.621968269348145, "global_step": 77878, "epoch": 463} {"train_loss": -9.069807052612305, "global_step": 77879, "epoch": 463} {"train_loss": -8.911966323852539, "global_step": 77880, "epoch": 463} {"train_loss": -9.34194564819336, "global_step": 77881, "epoch": 463} {"train_loss": -8.957254409790039, "global_step": 77882, "epoch": 463} {"train_loss": -9.061782836914062, "global_step": 77883, "epoch": 463} {"train_loss": -9.180593490600586, "global_step": 77884, "epoch": 463} {"train_loss": -9.217009544372559, "global_step": 77885, "epoch": 463} {"train_loss": -9.103382110595703, "global_step": 77886, "epoch": 463} {"train_loss": -9.391100883483887, "global_step": 77887, "epoch": 463} {"train_loss": -8.995183944702148, "global_step": 77888, "epoch": 463} {"train_loss": -9.29892635345459, "global_step": 77889, "epoch": 463} {"train_loss": -9.140716552734375, "global_step": 77890, "epoch": 463} {"train_loss": -9.168785095214844, "global_step": 77891, "epoch": 463} {"train_loss": -9.008186340332031, "global_step": 77892, "epoch": 463} {"train_loss": -9.163976669311523, "global_step": 77893, "epoch": 463} {"train_loss": -9.073221206665039, "global_step": 77894, "epoch": 463} {"train_loss": -9.30894660949707, "global_step": 77895, "epoch": 463} {"train_loss": -9.435920715332031, "global_step": 77896, "epoch": 463} {"train_loss": -9.162378311157227, "global_step": 77897, "epoch": 463} {"train_loss": -9.211875915527344, "global_step": 77898, "epoch": 463} {"train_loss": -9.308183670043945, "global_step": 77899, "epoch": 463} {"train_loss": -9.036391258239746, "global_step": 77900, "epoch": 463} {"train_loss": -9.210596084594727, "global_step": 77901, "epoch": 463} {"train_loss": -9.268024444580078, "global_step": 77902, "epoch": 463} {"train_loss": -9.152506828308105, "global_step": 77903, "epoch": 463} {"train_loss": -9.450681686401367, "global_step": 77904, "epoch": 463} {"train_loss": -8.868476867675781, "global_step": 77905, "epoch": 463} {"train_loss": -9.25391960144043, "global_step": 77906, "epoch": 463} {"train_loss": -9.03248119354248, "global_step": 77907, "epoch": 463} {"train_loss": -8.78292465209961, "global_step": 77908, "epoch": 463} {"train_loss": -8.882871627807617, "global_step": 77909, "epoch": 463} {"train_loss": -8.897167205810547, "global_step": 77910, "epoch": 463} {"train_loss": -8.944120407104492, "global_step": 77911, "epoch": 463} {"train_loss": -8.78223991394043, "global_step": 77912, "epoch": 463} {"train_loss": -8.78592300415039, "global_step": 77913, "epoch": 463} {"train_loss": -9.056724548339844, "global_step": 77914, "epoch": 463} {"train_loss": -8.976594924926758, "global_step": 77915, "epoch": 463} {"train_loss": -8.9041748046875, "global_step": 77916, "epoch": 463} {"train_loss": -9.111330032348633, "global_step": 77917, "epoch": 463} {"train_loss": -8.938541412353516, "global_step": 77918, "epoch": 463} {"train_loss": -8.918021202087402, "global_step": 77919, "epoch": 463} {"train_loss": -8.940925598144531, "global_step": 77920, "epoch": 463} {"train_loss": -8.993764877319336, "global_step": 77921, "epoch": 463} {"train_loss": -9.094083786010742, "global_step": 77922, "epoch": 463} {"train_loss": -8.905523300170898, "global_step": 77923, "epoch": 463} {"train_loss": -9.134517669677734, "global_step": 77924, "epoch": 463} {"train_loss": -8.937713623046875, "global_step": 77925, "epoch": 463} {"train_loss": -9.207940101623535, "global_step": 77926, "epoch": 463} {"train_loss": -9.11252212524414, "global_step": 77927, "epoch": 463} {"train_loss": -9.382776260375977, "global_step": 77928, "epoch": 463} {"train_loss": -9.07501220703125, "global_step": 77929, "epoch": 463} {"train_loss": -9.328577041625977, "global_step": 77930, "epoch": 463} {"train_loss": -9.252782821655273, "global_step": 77931, "epoch": 463} {"train_loss": -9.244952201843262, "global_step": 77932, "epoch": 463} {"train_loss": -9.143075942993164, "global_step": 77933, "epoch": 463} {"train_loss": -9.239232063293457, "global_step": 77934, "epoch": 463} {"train_loss": -8.968332290649414, "global_step": 77935, "epoch": 463} {"train_loss": -9.341641426086426, "global_step": 77936, "epoch": 463} {"train_loss": -9.219884872436523, "global_step": 77937, "epoch": 463} {"train_loss": -9.102922439575195, "global_step": 77938, "epoch": 463} {"train_loss": -9.013182640075684, "global_step": 77939, "epoch": 463} {"train_loss": -9.021875381469727, "global_step": 77940, "epoch": 463} {"train_loss": -9.18563175201416, "global_step": 77941, "epoch": 463} {"train_loss": -9.431594848632812, "global_step": 77942, "epoch": 463} {"train_loss": -9.322418212890625, "global_step": 77943, "epoch": 463} {"train_loss": -9.366884231567383, "global_step": 77944, "epoch": 463} {"train_loss": -9.109882354736328, "global_step": 77945, "epoch": 463} {"train_loss": -9.393926620483398, "global_step": 77946, "epoch": 463} {"train_loss": -9.212871551513672, "global_step": 77947, "epoch": 463} {"train_loss": -9.402523040771484, "global_step": 77948, "epoch": 463} {"train_loss": -9.269421577453613, "global_step": 77949, "epoch": 463} {"train_loss": -9.297679901123047, "global_step": 77950, "epoch": 463} {"train_loss": -9.105436211540585, "global_step": 77951, "epoch": 463, "val_loss": 195128.09375} {"train_loss": -9.215209007263184, "global_step": 77952, "epoch": 464} {"train_loss": -9.367598533630371, "global_step": 77953, "epoch": 464} {"train_loss": -9.518838882446289, "global_step": 77954, "epoch": 464} {"train_loss": -9.30035400390625, "global_step": 77955, "epoch": 464} {"train_loss": -9.338703155517578, "global_step": 77956, "epoch": 464} {"train_loss": -9.39077377319336, "global_step": 77957, "epoch": 464} {"train_loss": -9.053336143493652, "global_step": 77958, "epoch": 464} {"train_loss": -9.172952651977539, "global_step": 77959, "epoch": 464} {"train_loss": -9.431434631347656, "global_step": 77960, "epoch": 464} {"train_loss": -9.267637252807617, "global_step": 77961, "epoch": 464} {"train_loss": -9.256484985351562, "global_step": 77962, "epoch": 464} {"train_loss": -9.015521049499512, "global_step": 77963, "epoch": 464} {"train_loss": -9.401374816894531, "global_step": 77964, "epoch": 464} {"train_loss": -8.872507095336914, "global_step": 77965, "epoch": 464} {"train_loss": -9.242551803588867, "global_step": 77966, "epoch": 464} {"train_loss": -8.83362102508545, "global_step": 77967, "epoch": 464} {"train_loss": -9.149297714233398, "global_step": 77968, "epoch": 464} {"train_loss": -9.065832138061523, "global_step": 77969, "epoch": 464} {"train_loss": -9.007096290588379, "global_step": 77970, "epoch": 464} {"train_loss": -9.015165328979492, "global_step": 77971, "epoch": 464} {"train_loss": -8.79076862335205, "global_step": 77972, "epoch": 464} {"train_loss": -8.905523300170898, "global_step": 77973, "epoch": 464} {"train_loss": -8.810665130615234, "global_step": 77974, "epoch": 464} {"train_loss": -9.125455856323242, "global_step": 77975, "epoch": 464} {"train_loss": -9.019847869873047, "global_step": 77976, "epoch": 464} {"train_loss": -8.963302612304688, "global_step": 77977, "epoch": 464} {"train_loss": -9.146927833557129, "global_step": 77978, "epoch": 464} {"train_loss": -8.828378677368164, "global_step": 77979, "epoch": 464} {"train_loss": -9.08956527709961, "global_step": 77980, "epoch": 464} {"train_loss": -9.131088256835938, "global_step": 77981, "epoch": 464} {"train_loss": -9.191997528076172, "global_step": 77982, "epoch": 464} {"train_loss": -8.699143409729004, "global_step": 77983, "epoch": 464} {"train_loss": -9.130682945251465, "global_step": 77984, "epoch": 464} {"train_loss": -8.828993797302246, "global_step": 77985, "epoch": 464} {"train_loss": -8.971789360046387, "global_step": 77986, "epoch": 464} {"train_loss": -9.413566589355469, "global_step": 77987, "epoch": 464} {"train_loss": -9.077876091003418, "global_step": 77988, "epoch": 464} {"train_loss": -9.236451148986816, "global_step": 77989, "epoch": 464} {"train_loss": -9.034555435180664, "global_step": 77990, "epoch": 464} {"train_loss": -9.25574016571045, "global_step": 77991, "epoch": 464} {"train_loss": -8.821138381958008, "global_step": 77992, "epoch": 464} {"train_loss": -9.285384178161621, "global_step": 77993, "epoch": 464} {"train_loss": -9.028084754943848, "global_step": 77994, "epoch": 464} {"train_loss": -8.908661842346191, "global_step": 77995, "epoch": 464} {"train_loss": -9.165497779846191, "global_step": 77996, "epoch": 464} {"train_loss": -9.074777603149414, "global_step": 77997, "epoch": 464} {"train_loss": -9.151224136352539, "global_step": 77998, "epoch": 464} {"train_loss": -9.18354320526123, "global_step": 77999, "epoch": 464} {"train_loss": -9.147500991821289, "global_step": 78000, "epoch": 464} {"train_loss": -8.939008712768555, "global_step": 78001, "epoch": 464} {"train_loss": -9.296401977539062, "global_step": 78002, "epoch": 464} {"train_loss": -8.990957260131836, "global_step": 78003, "epoch": 464} {"train_loss": -9.463045120239258, "global_step": 78004, "epoch": 464} {"train_loss": -9.114412307739258, "global_step": 78005, "epoch": 464} {"train_loss": -9.04841136932373, "global_step": 78006, "epoch": 464} {"train_loss": -9.262033462524414, "global_step": 78007, "epoch": 464} {"train_loss": -8.956299781799316, "global_step": 78008, "epoch": 464} {"train_loss": -9.209647178649902, "global_step": 78009, "epoch": 464} {"train_loss": -9.109619140625, "global_step": 78010, "epoch": 464} {"train_loss": -9.140460968017578, "global_step": 78011, "epoch": 464} {"train_loss": -9.178304672241211, "global_step": 78012, "epoch": 464} {"train_loss": -9.006882667541504, "global_step": 78013, "epoch": 464} {"train_loss": -9.177906036376953, "global_step": 78014, "epoch": 464} {"train_loss": -9.098722457885742, "global_step": 78015, "epoch": 464} {"train_loss": -9.174020767211914, "global_step": 78016, "epoch": 464} {"train_loss": -9.243569374084473, "global_step": 78017, "epoch": 464} {"train_loss": -9.172771453857422, "global_step": 78018, "epoch": 464} {"train_loss": -9.282123565673828, "global_step": 78019, "epoch": 464} {"train_loss": -9.236231803894043, "global_step": 78020, "epoch": 464} {"train_loss": -8.936849594116211, "global_step": 78021, "epoch": 464} {"train_loss": -9.204839706420898, "global_step": 78022, "epoch": 464} {"train_loss": -9.327299118041992, "global_step": 78023, "epoch": 464} {"train_loss": -9.034311294555664, "global_step": 78024, "epoch": 464} {"train_loss": -9.205465316772461, "global_step": 78025, "epoch": 464} {"train_loss": -9.108282089233398, "global_step": 78026, "epoch": 464} {"train_loss": -9.080679893493652, "global_step": 78027, "epoch": 464} {"train_loss": -9.328268051147461, "global_step": 78028, "epoch": 464} {"train_loss": -8.805495262145996, "global_step": 78029, "epoch": 464} {"train_loss": -9.361891746520996, "global_step": 78030, "epoch": 464} {"train_loss": -8.827471733093262, "global_step": 78031, "epoch": 464} {"train_loss": -9.079021453857422, "global_step": 78032, "epoch": 464} {"train_loss": -9.027791023254395, "global_step": 78033, "epoch": 464} {"train_loss": -8.82906723022461, "global_step": 78034, "epoch": 464} {"train_loss": -8.777630805969238, "global_step": 78035, "epoch": 464} {"train_loss": -8.793638229370117, "global_step": 78036, "epoch": 464} {"train_loss": -9.043243408203125, "global_step": 78037, "epoch": 464} {"train_loss": -8.749361038208008, "global_step": 78038, "epoch": 464} {"train_loss": -8.999540328979492, "global_step": 78039, "epoch": 464} {"train_loss": -9.079310417175293, "global_step": 78040, "epoch": 464} {"train_loss": -8.741876602172852, "global_step": 78041, "epoch": 464} {"train_loss": -8.960661888122559, "global_step": 78042, "epoch": 464} {"train_loss": -9.001094818115234, "global_step": 78043, "epoch": 464} {"train_loss": -9.227150917053223, "global_step": 78044, "epoch": 464} {"train_loss": -9.21999740600586, "global_step": 78045, "epoch": 464} {"train_loss": -9.245729446411133, "global_step": 78046, "epoch": 464} {"train_loss": -9.192512512207031, "global_step": 78047, "epoch": 464} {"train_loss": -9.084877014160156, "global_step": 78048, "epoch": 464} {"train_loss": -9.146533012390137, "global_step": 78049, "epoch": 464} {"train_loss": -8.94868278503418, "global_step": 78050, "epoch": 464} {"train_loss": -9.302225112915039, "global_step": 78051, "epoch": 464} {"train_loss": -8.953338623046875, "global_step": 78052, "epoch": 464} {"train_loss": -9.290547370910645, "global_step": 78053, "epoch": 464} {"train_loss": -8.931371688842773, "global_step": 78054, "epoch": 464} {"train_loss": -9.257197380065918, "global_step": 78055, "epoch": 464} {"train_loss": -9.048398971557617, "global_step": 78056, "epoch": 464} {"train_loss": -9.39223861694336, "global_step": 78057, "epoch": 464} {"train_loss": -9.1046142578125, "global_step": 78058, "epoch": 464} {"train_loss": -9.08492660522461, "global_step": 78059, "epoch": 464} {"train_loss": -9.223028182983398, "global_step": 78060, "epoch": 464} {"train_loss": -9.240129470825195, "global_step": 78061, "epoch": 464} {"train_loss": -9.449630737304688, "global_step": 78062, "epoch": 464} {"train_loss": -9.091310501098633, "global_step": 78063, "epoch": 464} {"train_loss": -9.285907745361328, "global_step": 78064, "epoch": 464} {"train_loss": -8.83441162109375, "global_step": 78065, "epoch": 464} {"train_loss": -9.356523513793945, "global_step": 78066, "epoch": 464} {"train_loss": -8.853985786437988, "global_step": 78067, "epoch": 464} {"train_loss": -9.179220199584961, "global_step": 78068, "epoch": 464} {"train_loss": -9.111141204833984, "global_step": 78069, "epoch": 464} {"train_loss": -8.972253799438477, "global_step": 78070, "epoch": 464} {"train_loss": -9.049983978271484, "global_step": 78071, "epoch": 464} {"train_loss": -9.15440559387207, "global_step": 78072, "epoch": 464} {"train_loss": -8.961870193481445, "global_step": 78073, "epoch": 464} {"train_loss": -9.063955307006836, "global_step": 78074, "epoch": 464} {"train_loss": -9.005680084228516, "global_step": 78075, "epoch": 464} {"train_loss": -9.194043159484863, "global_step": 78076, "epoch": 464} {"train_loss": -9.282118797302246, "global_step": 78077, "epoch": 464} {"train_loss": -9.19670295715332, "global_step": 78078, "epoch": 464} {"train_loss": -9.084147453308105, "global_step": 78079, "epoch": 464} {"train_loss": -9.087776184082031, "global_step": 78080, "epoch": 464} {"train_loss": -9.273283004760742, "global_step": 78081, "epoch": 464} {"train_loss": -8.78669548034668, "global_step": 78082, "epoch": 464} {"train_loss": -9.06751823425293, "global_step": 78083, "epoch": 464} {"train_loss": -8.909404754638672, "global_step": 78084, "epoch": 464} {"train_loss": -9.147588729858398, "global_step": 78085, "epoch": 464} {"train_loss": -9.053892135620117, "global_step": 78086, "epoch": 464} {"train_loss": -9.27881145477295, "global_step": 78087, "epoch": 464} {"train_loss": -9.23305606842041, "global_step": 78088, "epoch": 464} {"train_loss": -9.116491317749023, "global_step": 78089, "epoch": 464} {"train_loss": -9.171026229858398, "global_step": 78090, "epoch": 464} {"train_loss": -9.46490478515625, "global_step": 78091, "epoch": 464} {"train_loss": -9.153181076049805, "global_step": 78092, "epoch": 464} {"train_loss": -9.235389709472656, "global_step": 78093, "epoch": 464} {"train_loss": -9.137212753295898, "global_step": 78094, "epoch": 464} {"train_loss": -9.276056289672852, "global_step": 78095, "epoch": 464} {"train_loss": -8.913128852844238, "global_step": 78096, "epoch": 464} {"train_loss": -9.269431114196777, "global_step": 78097, "epoch": 464} {"train_loss": -9.240898132324219, "global_step": 78098, "epoch": 464} {"train_loss": -9.309733390808105, "global_step": 78099, "epoch": 464} {"train_loss": -9.346527099609375, "global_step": 78100, "epoch": 464} {"train_loss": -9.14630126953125, "global_step": 78101, "epoch": 464} {"train_loss": -9.351028442382812, "global_step": 78102, "epoch": 464} {"train_loss": -9.141037940979004, "global_step": 78103, "epoch": 464} {"train_loss": -8.734309196472168, "global_step": 78104, "epoch": 464} {"train_loss": -9.063516616821289, "global_step": 78105, "epoch": 464} {"train_loss": -8.860149383544922, "global_step": 78106, "epoch": 464} {"train_loss": -9.218488693237305, "global_step": 78107, "epoch": 464} {"train_loss": -8.82823371887207, "global_step": 78108, "epoch": 464} {"train_loss": -9.366716384887695, "global_step": 78109, "epoch": 464} {"train_loss": -8.634425163269043, "global_step": 78110, "epoch": 464} {"train_loss": -9.18491268157959, "global_step": 78111, "epoch": 464} {"train_loss": -8.694295883178711, "global_step": 78112, "epoch": 464} {"train_loss": -9.33439826965332, "global_step": 78113, "epoch": 464} {"train_loss": -8.879992485046387, "global_step": 78114, "epoch": 464} {"train_loss": -9.138320922851562, "global_step": 78115, "epoch": 464} {"train_loss": -8.785802841186523, "global_step": 78116, "epoch": 464} {"train_loss": -8.873537063598633, "global_step": 78117, "epoch": 464} {"train_loss": -9.121709823608398, "global_step": 78118, "epoch": 464} {"train_loss": -9.103904582205272, "global_step": 78119, "epoch": 464, "val_loss": 196628.515625} {"train_loss": -8.638640403747559, "global_step": 78120, "epoch": 465} {"train_loss": -8.973762512207031, "global_step": 78121, "epoch": 465} {"train_loss": -8.777809143066406, "global_step": 78122, "epoch": 465} {"train_loss": -8.873067855834961, "global_step": 78123, "epoch": 465} {"train_loss": -8.994335174560547, "global_step": 78124, "epoch": 465} {"train_loss": -9.124456405639648, "global_step": 78125, "epoch": 465} {"train_loss": -8.986532211303711, "global_step": 78126, "epoch": 465} {"train_loss": -9.17850399017334, "global_step": 78127, "epoch": 465} {"train_loss": -9.005889892578125, "global_step": 78128, "epoch": 465} {"train_loss": -9.158032417297363, "global_step": 78129, "epoch": 465} {"train_loss": -9.16951847076416, "global_step": 78130, "epoch": 465} {"train_loss": -9.16746711730957, "global_step": 78131, "epoch": 465} {"train_loss": -8.988321304321289, "global_step": 78132, "epoch": 465} {"train_loss": -8.988380432128906, "global_step": 78133, "epoch": 465} {"train_loss": -9.130640029907227, "global_step": 78134, "epoch": 465} {"train_loss": -9.006307601928711, "global_step": 78135, "epoch": 465} {"train_loss": -9.066801071166992, "global_step": 78136, "epoch": 465} {"train_loss": -9.099966049194336, "global_step": 78137, "epoch": 465} {"train_loss": -9.343993186950684, "global_step": 78138, "epoch": 465} {"train_loss": -9.093575477600098, "global_step": 78139, "epoch": 465} {"train_loss": -9.421276092529297, "global_step": 78140, "epoch": 465} {"train_loss": -9.21603012084961, "global_step": 78141, "epoch": 465} {"train_loss": -8.849366188049316, "global_step": 78142, "epoch": 465} {"train_loss": -9.11661148071289, "global_step": 78143, "epoch": 465} {"train_loss": -8.965389251708984, "global_step": 78144, "epoch": 465} {"train_loss": -9.006036758422852, "global_step": 78145, "epoch": 465} {"train_loss": -9.278094291687012, "global_step": 78146, "epoch": 465} {"train_loss": -9.158501625061035, "global_step": 78147, "epoch": 465} {"train_loss": -8.902283668518066, "global_step": 78148, "epoch": 465} {"train_loss": -9.129088401794434, "global_step": 78149, "epoch": 465} {"train_loss": -9.036543846130371, "global_step": 78150, "epoch": 465} {"train_loss": -8.901451110839844, "global_step": 78151, "epoch": 465} {"train_loss": -9.006328582763672, "global_step": 78152, "epoch": 465} {"train_loss": -9.294326782226562, "global_step": 78153, "epoch": 465} {"train_loss": -9.158324241638184, "global_step": 78154, "epoch": 465} {"train_loss": -9.144155502319336, "global_step": 78155, "epoch": 465} {"train_loss": -9.200636863708496, "global_step": 78156, "epoch": 465} {"train_loss": -9.084884643554688, "global_step": 78157, "epoch": 465} {"train_loss": -9.189824104309082, "global_step": 78158, "epoch": 465} {"train_loss": -8.984330177307129, "global_step": 78159, "epoch": 465} {"train_loss": -9.085877418518066, "global_step": 78160, "epoch": 465} {"train_loss": -9.106542587280273, "global_step": 78161, "epoch": 465} {"train_loss": -9.122173309326172, "global_step": 78162, "epoch": 465} {"train_loss": -9.086933135986328, "global_step": 78163, "epoch": 465} {"train_loss": -8.875732421875, "global_step": 78164, "epoch": 465} {"train_loss": -8.954488754272461, "global_step": 78165, "epoch": 465} {"train_loss": -8.831100463867188, "global_step": 78166, "epoch": 465} {"train_loss": -8.204021453857422, "global_step": 78167, "epoch": 465} {"train_loss": -8.842269897460938, "global_step": 78168, "epoch": 465} {"train_loss": -7.93919038772583, "global_step": 78169, "epoch": 465} {"train_loss": -8.72740364074707, "global_step": 78170, "epoch": 465} {"train_loss": -8.173184394836426, "global_step": 78171, "epoch": 465} {"train_loss": -8.80745792388916, "global_step": 78172, "epoch": 465} {"train_loss": -8.411764144897461, "global_step": 78173, "epoch": 465} {"train_loss": -8.48701000213623, "global_step": 78174, "epoch": 465} {"train_loss": -8.636129379272461, "global_step": 78175, "epoch": 465} {"train_loss": -8.48613166809082, "global_step": 78176, "epoch": 465} {"train_loss": -8.773608207702637, "global_step": 78177, "epoch": 465} {"train_loss": -8.60268497467041, "global_step": 78178, "epoch": 465} {"train_loss": -8.748306274414062, "global_step": 78179, "epoch": 465} {"train_loss": -8.808998107910156, "global_step": 78180, "epoch": 465} {"train_loss": -8.443367004394531, "global_step": 78181, "epoch": 465} {"train_loss": -8.779064178466797, "global_step": 78182, "epoch": 465} {"train_loss": -8.950429916381836, "global_step": 78183, "epoch": 465} {"train_loss": -8.571117401123047, "global_step": 78184, "epoch": 465} {"train_loss": -8.801387786865234, "global_step": 78185, "epoch": 465} {"train_loss": -8.812520980834961, "global_step": 78186, "epoch": 465} {"train_loss": -8.901296615600586, "global_step": 78187, "epoch": 465} {"train_loss": -9.020742416381836, "global_step": 78188, "epoch": 465} {"train_loss": -8.973664283752441, "global_step": 78189, "epoch": 465} {"train_loss": -8.967169761657715, "global_step": 78190, "epoch": 465} {"train_loss": -8.945566177368164, "global_step": 78191, "epoch": 465} {"train_loss": -9.179080963134766, "global_step": 78192, "epoch": 465} {"train_loss": -8.892339706420898, "global_step": 78193, "epoch": 465} {"train_loss": -9.004744529724121, "global_step": 78194, "epoch": 465} {"train_loss": -8.999731063842773, "global_step": 78195, "epoch": 465} {"train_loss": -9.243221282958984, "global_step": 78196, "epoch": 465} {"train_loss": -9.01861572265625, "global_step": 78197, "epoch": 465} {"train_loss": -8.961631774902344, "global_step": 78198, "epoch": 465} {"train_loss": -8.985746383666992, "global_step": 78199, "epoch": 465} {"train_loss": -9.019794464111328, "global_step": 78200, "epoch": 465} {"train_loss": -9.069725036621094, "global_step": 78201, "epoch": 465} {"train_loss": -8.955697059631348, "global_step": 78202, "epoch": 465} {"train_loss": -8.940277099609375, "global_step": 78203, "epoch": 465} {"train_loss": -9.463985443115234, "global_step": 78204, "epoch": 465} {"train_loss": -9.193191528320312, "global_step": 78205, "epoch": 465} {"train_loss": -9.275733947753906, "global_step": 78206, "epoch": 465} {"train_loss": -9.142580032348633, "global_step": 78207, "epoch": 465} {"train_loss": -9.453332901000977, "global_step": 78208, "epoch": 465} {"train_loss": -9.429943084716797, "global_step": 78209, "epoch": 465} {"train_loss": -9.455619812011719, "global_step": 78210, "epoch": 465} {"train_loss": -9.204036712646484, "global_step": 78211, "epoch": 465} {"train_loss": -9.333515167236328, "global_step": 78212, "epoch": 465} {"train_loss": -9.333179473876953, "global_step": 78213, "epoch": 465} {"train_loss": -9.176338195800781, "global_step": 78214, "epoch": 465} {"train_loss": -9.142017364501953, "global_step": 78215, "epoch": 465} {"train_loss": -9.04516887664795, "global_step": 78216, "epoch": 465} {"train_loss": -9.185392379760742, "global_step": 78217, "epoch": 465} {"train_loss": -9.182028770446777, "global_step": 78218, "epoch": 465} {"train_loss": -9.23747730255127, "global_step": 78219, "epoch": 465} {"train_loss": -9.48824405670166, "global_step": 78220, "epoch": 465} {"train_loss": -9.164204597473145, "global_step": 78221, "epoch": 465} {"train_loss": -9.418957710266113, "global_step": 78222, "epoch": 465} {"train_loss": -9.122934341430664, "global_step": 78223, "epoch": 465} {"train_loss": -9.457569122314453, "global_step": 78224, "epoch": 465} {"train_loss": -9.443251609802246, "global_step": 78225, "epoch": 465} {"train_loss": -9.452600479125977, "global_step": 78226, "epoch": 465} {"train_loss": -9.397603988647461, "global_step": 78227, "epoch": 465} {"train_loss": -9.051450729370117, "global_step": 78228, "epoch": 465} {"train_loss": -9.209529876708984, "global_step": 78229, "epoch": 465} {"train_loss": -9.087538719177246, "global_step": 78230, "epoch": 465} {"train_loss": -9.274320602416992, "global_step": 78231, "epoch": 465} {"train_loss": -9.16051197052002, "global_step": 78232, "epoch": 465} {"train_loss": -9.30756664276123, "global_step": 78233, "epoch": 465} {"train_loss": -9.243090629577637, "global_step": 78234, "epoch": 465} {"train_loss": -9.079781532287598, "global_step": 78235, "epoch": 465} {"train_loss": -8.957727432250977, "global_step": 78236, "epoch": 465} {"train_loss": -9.02204418182373, "global_step": 78237, "epoch": 465} {"train_loss": -9.154268264770508, "global_step": 78238, "epoch": 465} {"train_loss": -9.102675437927246, "global_step": 78239, "epoch": 465} {"train_loss": -8.844911575317383, "global_step": 78240, "epoch": 465} {"train_loss": -9.046072006225586, "global_step": 78241, "epoch": 465} {"train_loss": -9.126595497131348, "global_step": 78242, "epoch": 465} {"train_loss": -8.863809585571289, "global_step": 78243, "epoch": 465} {"train_loss": -8.82417106628418, "global_step": 78244, "epoch": 465} {"train_loss": -9.072610855102539, "global_step": 78245, "epoch": 465} {"train_loss": -9.077409744262695, "global_step": 78246, "epoch": 465} {"train_loss": -9.083829879760742, "global_step": 78247, "epoch": 465} {"train_loss": -8.960805892944336, "global_step": 78248, "epoch": 465} {"train_loss": -9.10171890258789, "global_step": 78249, "epoch": 465} {"train_loss": -9.109155654907227, "global_step": 78250, "epoch": 465} {"train_loss": -8.979146003723145, "global_step": 78251, "epoch": 465} {"train_loss": -8.9922456741333, "global_step": 78252, "epoch": 465} {"train_loss": -9.19102668762207, "global_step": 78253, "epoch": 465} {"train_loss": -9.188962936401367, "global_step": 78254, "epoch": 465} {"train_loss": -8.926507949829102, "global_step": 78255, "epoch": 465} {"train_loss": -9.334330558776855, "global_step": 78256, "epoch": 465} {"train_loss": -9.086485862731934, "global_step": 78257, "epoch": 465} {"train_loss": -9.176643371582031, "global_step": 78258, "epoch": 465} {"train_loss": -9.00094985961914, "global_step": 78259, "epoch": 465} {"train_loss": -9.199710845947266, "global_step": 78260, "epoch": 465} {"train_loss": -8.74188232421875, "global_step": 78261, "epoch": 465} {"train_loss": -9.103561401367188, "global_step": 78262, "epoch": 465} {"train_loss": -8.872774124145508, "global_step": 78263, "epoch": 465} {"train_loss": -8.985840797424316, "global_step": 78264, "epoch": 465} {"train_loss": -9.013322830200195, "global_step": 78265, "epoch": 465} {"train_loss": -8.947691917419434, "global_step": 78266, "epoch": 465} {"train_loss": -8.859073638916016, "global_step": 78267, "epoch": 465} {"train_loss": -8.950870513916016, "global_step": 78268, "epoch": 465} {"train_loss": -9.291285514831543, "global_step": 78269, "epoch": 465} {"train_loss": -9.038933753967285, "global_step": 78270, "epoch": 465} {"train_loss": -9.048550605773926, "global_step": 78271, "epoch": 465} {"train_loss": -9.122627258300781, "global_step": 78272, "epoch": 465} {"train_loss": -9.082468032836914, "global_step": 78273, "epoch": 465} {"train_loss": -9.322774887084961, "global_step": 78274, "epoch": 465} {"train_loss": -9.254459381103516, "global_step": 78275, "epoch": 465} {"train_loss": -9.043989181518555, "global_step": 78276, "epoch": 465} {"train_loss": -9.234855651855469, "global_step": 78277, "epoch": 465} {"train_loss": -9.3184814453125, "global_step": 78278, "epoch": 465} {"train_loss": -9.105541229248047, "global_step": 78279, "epoch": 465} {"train_loss": -9.441804885864258, "global_step": 78280, "epoch": 465} {"train_loss": -9.151792526245117, "global_step": 78281, "epoch": 465} {"train_loss": -9.356072425842285, "global_step": 78282, "epoch": 465} {"train_loss": -9.32762622833252, "global_step": 78283, "epoch": 465} {"train_loss": -9.326761245727539, "global_step": 78284, "epoch": 465} {"train_loss": -9.483417510986328, "global_step": 78285, "epoch": 465} {"train_loss": -9.012547492980957, "global_step": 78286, "epoch": 465} {"train_loss": -9.052535008816491, "global_step": 78287, "epoch": 465, "val_loss": 197252.015625, "train_action_mse_error": 6.923925399780273} {"train_loss": -9.085186958312988, "global_step": 78288, "epoch": 466} {"train_loss": -9.107789993286133, "global_step": 78289, "epoch": 466} {"train_loss": -9.415592193603516, "global_step": 78290, "epoch": 466} {"train_loss": -9.203588485717773, "global_step": 78291, "epoch": 466} {"train_loss": -9.082880020141602, "global_step": 78292, "epoch": 466} {"train_loss": -9.236778259277344, "global_step": 78293, "epoch": 466} {"train_loss": -9.270325660705566, "global_step": 78294, "epoch": 466} {"train_loss": -9.274983406066895, "global_step": 78295, "epoch": 466} {"train_loss": -9.3134765625, "global_step": 78296, "epoch": 466} {"train_loss": -9.287333488464355, "global_step": 78297, "epoch": 466} {"train_loss": -9.482317924499512, "global_step": 78298, "epoch": 466} {"train_loss": -9.446654319763184, "global_step": 78299, "epoch": 466} {"train_loss": -9.337650299072266, "global_step": 78300, "epoch": 466} {"train_loss": -9.309638977050781, "global_step": 78301, "epoch": 466} {"train_loss": -9.098718643188477, "global_step": 78302, "epoch": 466} {"train_loss": -9.087692260742188, "global_step": 78303, "epoch": 466} {"train_loss": -8.808536529541016, "global_step": 78304, "epoch": 466} {"train_loss": -8.673532485961914, "global_step": 78305, "epoch": 466} {"train_loss": -8.9960298538208, "global_step": 78306, "epoch": 466} {"train_loss": -8.902338027954102, "global_step": 78307, "epoch": 466} {"train_loss": -9.085246086120605, "global_step": 78308, "epoch": 466} {"train_loss": -9.219034194946289, "global_step": 78309, "epoch": 466} {"train_loss": -9.015807151794434, "global_step": 78310, "epoch": 466} {"train_loss": -8.925376892089844, "global_step": 78311, "epoch": 466} {"train_loss": -9.213708877563477, "global_step": 78312, "epoch": 466} {"train_loss": -8.974193572998047, "global_step": 78313, "epoch": 466} {"train_loss": -9.053895950317383, "global_step": 78314, "epoch": 466} {"train_loss": -9.157722473144531, "global_step": 78315, "epoch": 466} {"train_loss": -8.872665405273438, "global_step": 78316, "epoch": 466} {"train_loss": -9.21971321105957, "global_step": 78317, "epoch": 466} {"train_loss": -9.057903289794922, "global_step": 78318, "epoch": 466} {"train_loss": -9.060707092285156, "global_step": 78319, "epoch": 466} {"train_loss": -9.191205978393555, "global_step": 78320, "epoch": 466} {"train_loss": -9.111654281616211, "global_step": 78321, "epoch": 466} {"train_loss": -9.154847145080566, "global_step": 78322, "epoch": 466} {"train_loss": -8.89848518371582, "global_step": 78323, "epoch": 466} {"train_loss": -9.48128890991211, "global_step": 78324, "epoch": 466} {"train_loss": -9.253389358520508, "global_step": 78325, "epoch": 466} {"train_loss": -9.251762390136719, "global_step": 78326, "epoch": 466} {"train_loss": -9.37972640991211, "global_step": 78327, "epoch": 466} {"train_loss": -9.116179466247559, "global_step": 78328, "epoch": 466} {"train_loss": -9.212417602539062, "global_step": 78329, "epoch": 466} {"train_loss": -9.308952331542969, "global_step": 78330, "epoch": 466} {"train_loss": -9.138595581054688, "global_step": 78331, "epoch": 466} {"train_loss": -9.415398597717285, "global_step": 78332, "epoch": 466} {"train_loss": -8.986326217651367, "global_step": 78333, "epoch": 466} {"train_loss": -9.295479774475098, "global_step": 78334, "epoch": 466} {"train_loss": -9.161885261535645, "global_step": 78335, "epoch": 466} {"train_loss": -8.965490341186523, "global_step": 78336, "epoch": 466} {"train_loss": -9.241082191467285, "global_step": 78337, "epoch": 466} {"train_loss": -9.12907886505127, "global_step": 78338, "epoch": 466} {"train_loss": -9.273075103759766, "global_step": 78339, "epoch": 466} {"train_loss": -9.188152313232422, "global_step": 78340, "epoch": 466} {"train_loss": -9.104568481445312, "global_step": 78341, "epoch": 466} {"train_loss": -9.23541259765625, "global_step": 78342, "epoch": 466} {"train_loss": -9.18565559387207, "global_step": 78343, "epoch": 466} {"train_loss": -8.998661041259766, "global_step": 78344, "epoch": 466} {"train_loss": -9.352933883666992, "global_step": 78345, "epoch": 466} {"train_loss": -9.239893913269043, "global_step": 78346, "epoch": 466} {"train_loss": -9.258923530578613, "global_step": 78347, "epoch": 466} {"train_loss": -9.25940227508545, "global_step": 78348, "epoch": 466} {"train_loss": -9.231258392333984, "global_step": 78349, "epoch": 466} {"train_loss": -9.244264602661133, "global_step": 78350, "epoch": 466} {"train_loss": -9.141084671020508, "global_step": 78351, "epoch": 466} {"train_loss": -9.117713928222656, "global_step": 78352, "epoch": 466} {"train_loss": -9.102100372314453, "global_step": 78353, "epoch": 466} {"train_loss": -9.229823112487793, "global_step": 78354, "epoch": 466} {"train_loss": -9.201715469360352, "global_step": 78355, "epoch": 466} {"train_loss": -9.186020851135254, "global_step": 78356, "epoch": 466} {"train_loss": -9.11038875579834, "global_step": 78357, "epoch": 466} {"train_loss": -9.21351432800293, "global_step": 78358, "epoch": 466} {"train_loss": -9.318641662597656, "global_step": 78359, "epoch": 466} {"train_loss": -9.118850708007812, "global_step": 78360, "epoch": 466} {"train_loss": -9.311288833618164, "global_step": 78361, "epoch": 466} {"train_loss": -9.242116928100586, "global_step": 78362, "epoch": 466} {"train_loss": -9.231437683105469, "global_step": 78363, "epoch": 466} {"train_loss": -9.208517074584961, "global_step": 78364, "epoch": 466} {"train_loss": -9.182134628295898, "global_step": 78365, "epoch": 466} {"train_loss": -9.202262878417969, "global_step": 78366, "epoch": 466} {"train_loss": -8.892898559570312, "global_step": 78367, "epoch": 466} {"train_loss": -8.977431297302246, "global_step": 78368, "epoch": 466} {"train_loss": -8.801385879516602, "global_step": 78369, "epoch": 466} {"train_loss": -9.207608222961426, "global_step": 78370, "epoch": 466} {"train_loss": -8.58033561706543, "global_step": 78371, "epoch": 466} {"train_loss": -8.705377578735352, "global_step": 78372, "epoch": 466} {"train_loss": -8.759931564331055, "global_step": 78373, "epoch": 466} {"train_loss": -9.086000442504883, "global_step": 78374, "epoch": 466} {"train_loss": -8.922529220581055, "global_step": 78375, "epoch": 466} {"train_loss": -9.066669464111328, "global_step": 78376, "epoch": 466} {"train_loss": -8.704191207885742, "global_step": 78377, "epoch": 466} {"train_loss": -9.115569114685059, "global_step": 78378, "epoch": 466} {"train_loss": -8.955482482910156, "global_step": 78379, "epoch": 466} {"train_loss": -9.007037162780762, "global_step": 78380, "epoch": 466} {"train_loss": -9.024121284484863, "global_step": 78381, "epoch": 466} {"train_loss": -8.81335163116455, "global_step": 78382, "epoch": 466} {"train_loss": -8.939596176147461, "global_step": 78383, "epoch": 466} {"train_loss": -8.946717262268066, "global_step": 78384, "epoch": 466} {"train_loss": -9.17329216003418, "global_step": 78385, "epoch": 466} {"train_loss": -8.90450668334961, "global_step": 78386, "epoch": 466} {"train_loss": -9.283117294311523, "global_step": 78387, "epoch": 466} {"train_loss": -8.958727836608887, "global_step": 78388, "epoch": 466} {"train_loss": -8.934237480163574, "global_step": 78389, "epoch": 466} {"train_loss": -8.837567329406738, "global_step": 78390, "epoch": 466} {"train_loss": -9.164264678955078, "global_step": 78391, "epoch": 466} {"train_loss": -8.888957977294922, "global_step": 78392, "epoch": 466} {"train_loss": -8.718597412109375, "global_step": 78393, "epoch": 466} {"train_loss": -9.019103050231934, "global_step": 78394, "epoch": 466} {"train_loss": -9.177000045776367, "global_step": 78395, "epoch": 466} {"train_loss": -9.014145851135254, "global_step": 78396, "epoch": 466} {"train_loss": -8.843038558959961, "global_step": 78397, "epoch": 466} {"train_loss": -9.201082229614258, "global_step": 78398, "epoch": 466} {"train_loss": -8.982660293579102, "global_step": 78399, "epoch": 466} {"train_loss": -8.96915340423584, "global_step": 78400, "epoch": 466} {"train_loss": -9.343450546264648, "global_step": 78401, "epoch": 466} {"train_loss": -9.005392074584961, "global_step": 78402, "epoch": 466} {"train_loss": -9.09103012084961, "global_step": 78403, "epoch": 466} {"train_loss": -9.212678909301758, "global_step": 78404, "epoch": 466} {"train_loss": -9.265883445739746, "global_step": 78405, "epoch": 466} {"train_loss": -9.001151084899902, "global_step": 78406, "epoch": 466} {"train_loss": -9.419816017150879, "global_step": 78407, "epoch": 466} {"train_loss": -9.10241985321045, "global_step": 78408, "epoch": 466} {"train_loss": -9.180448532104492, "global_step": 78409, "epoch": 466} {"train_loss": -9.100593566894531, "global_step": 78410, "epoch": 466} {"train_loss": -9.051666259765625, "global_step": 78411, "epoch": 466} {"train_loss": -9.30201530456543, "global_step": 78412, "epoch": 466} {"train_loss": -9.155366897583008, "global_step": 78413, "epoch": 466} {"train_loss": -9.291189193725586, "global_step": 78414, "epoch": 466} {"train_loss": -9.354988098144531, "global_step": 78415, "epoch": 466} {"train_loss": -9.37702751159668, "global_step": 78416, "epoch": 466} {"train_loss": -9.064016342163086, "global_step": 78417, "epoch": 466} {"train_loss": -9.076366424560547, "global_step": 78418, "epoch": 466} {"train_loss": -9.075963973999023, "global_step": 78419, "epoch": 466} {"train_loss": -9.224242210388184, "global_step": 78420, "epoch": 466} {"train_loss": -9.328449249267578, "global_step": 78421, "epoch": 466} {"train_loss": -9.18893051147461, "global_step": 78422, "epoch": 466} {"train_loss": -9.238781929016113, "global_step": 78423, "epoch": 466} {"train_loss": -8.808525085449219, "global_step": 78424, "epoch": 466} {"train_loss": -9.119710922241211, "global_step": 78425, "epoch": 466} {"train_loss": -8.990941047668457, "global_step": 78426, "epoch": 466} {"train_loss": -9.076522827148438, "global_step": 78427, "epoch": 466} {"train_loss": -8.919065475463867, "global_step": 78428, "epoch": 466} {"train_loss": -9.17249870300293, "global_step": 78429, "epoch": 466} {"train_loss": -9.473679542541504, "global_step": 78430, "epoch": 466} {"train_loss": -9.166912078857422, "global_step": 78431, "epoch": 466} {"train_loss": -9.094518661499023, "global_step": 78432, "epoch": 466} {"train_loss": -9.14058780670166, "global_step": 78433, "epoch": 466} {"train_loss": -8.967857360839844, "global_step": 78434, "epoch": 466} {"train_loss": -9.219684600830078, "global_step": 78435, "epoch": 466} {"train_loss": -9.257827758789062, "global_step": 78436, "epoch": 466} {"train_loss": -9.095762252807617, "global_step": 78437, "epoch": 466} {"train_loss": -9.164371490478516, "global_step": 78438, "epoch": 466} {"train_loss": -9.21593952178955, "global_step": 78439, "epoch": 466} {"train_loss": -9.156108856201172, "global_step": 78440, "epoch": 466} {"train_loss": -9.010530471801758, "global_step": 78441, "epoch": 466} {"train_loss": -9.512365341186523, "global_step": 78442, "epoch": 466} {"train_loss": -9.043455123901367, "global_step": 78443, "epoch": 466} {"train_loss": -9.235809326171875, "global_step": 78444, "epoch": 466} {"train_loss": -9.296087265014648, "global_step": 78445, "epoch": 466} {"train_loss": -9.197118759155273, "global_step": 78446, "epoch": 466} {"train_loss": -9.251779556274414, "global_step": 78447, "epoch": 466} {"train_loss": -9.330202102661133, "global_step": 78448, "epoch": 466} {"train_loss": -9.290254592895508, "global_step": 78449, "epoch": 466} {"train_loss": -9.288932800292969, "global_step": 78450, "epoch": 466} {"train_loss": -9.308101654052734, "global_step": 78451, "epoch": 466} {"train_loss": -9.28638744354248, "global_step": 78452, "epoch": 466} {"train_loss": -9.086044311523438, "global_step": 78453, "epoch": 466} {"train_loss": -8.994678497314453, "global_step": 78454, "epoch": 466} {"train_loss": -9.131489538011097, "global_step": 78455, "epoch": 466, "val_loss": 196690.484375} {"train_loss": -9.029891967773438, "global_step": 78456, "epoch": 467} {"train_loss": -9.496906280517578, "global_step": 78457, "epoch": 467} {"train_loss": -9.282022476196289, "global_step": 78458, "epoch": 467} {"train_loss": -9.403478622436523, "global_step": 78459, "epoch": 467} {"train_loss": -9.307575225830078, "global_step": 78460, "epoch": 467} {"train_loss": -9.480616569519043, "global_step": 78461, "epoch": 467} {"train_loss": -9.323967933654785, "global_step": 78462, "epoch": 467} {"train_loss": -9.323455810546875, "global_step": 78463, "epoch": 467} {"train_loss": -9.28355884552002, "global_step": 78464, "epoch": 467} {"train_loss": -9.230260848999023, "global_step": 78465, "epoch": 467} {"train_loss": -8.872603416442871, "global_step": 78466, "epoch": 467} {"train_loss": -9.153525352478027, "global_step": 78467, "epoch": 467} {"train_loss": -9.295877456665039, "global_step": 78468, "epoch": 467} {"train_loss": -9.437422752380371, "global_step": 78469, "epoch": 467} {"train_loss": -9.022058486938477, "global_step": 78470, "epoch": 467} {"train_loss": -9.237823486328125, "global_step": 78471, "epoch": 467} {"train_loss": -9.369318008422852, "global_step": 78472, "epoch": 467} {"train_loss": -9.110050201416016, "global_step": 78473, "epoch": 467} {"train_loss": -9.199761390686035, "global_step": 78474, "epoch": 467} {"train_loss": -9.13769817352295, "global_step": 78475, "epoch": 467} {"train_loss": -9.063484191894531, "global_step": 78476, "epoch": 467} {"train_loss": -8.710947036743164, "global_step": 78477, "epoch": 467} {"train_loss": -9.045269012451172, "global_step": 78478, "epoch": 467} {"train_loss": -8.807144165039062, "global_step": 78479, "epoch": 467} {"train_loss": -8.97295093536377, "global_step": 78480, "epoch": 467} {"train_loss": -9.199821472167969, "global_step": 78481, "epoch": 467} {"train_loss": -9.093133926391602, "global_step": 78482, "epoch": 467} {"train_loss": -8.995988845825195, "global_step": 78483, "epoch": 467} {"train_loss": -8.686174392700195, "global_step": 78484, "epoch": 467} {"train_loss": -9.200605392456055, "global_step": 78485, "epoch": 467} {"train_loss": -8.717472076416016, "global_step": 78486, "epoch": 467} {"train_loss": -8.721115112304688, "global_step": 78487, "epoch": 467} {"train_loss": -8.973817825317383, "global_step": 78488, "epoch": 467} {"train_loss": -8.697357177734375, "global_step": 78489, "epoch": 467} {"train_loss": -9.106573104858398, "global_step": 78490, "epoch": 467} {"train_loss": -8.963958740234375, "global_step": 78491, "epoch": 467} {"train_loss": -9.003860473632812, "global_step": 78492, "epoch": 467} {"train_loss": -8.913640975952148, "global_step": 78493, "epoch": 467} {"train_loss": -9.153556823730469, "global_step": 78494, "epoch": 467} {"train_loss": -9.005699157714844, "global_step": 78495, "epoch": 467} {"train_loss": -9.006426811218262, "global_step": 78496, "epoch": 467} {"train_loss": -9.002065658569336, "global_step": 78497, "epoch": 467} {"train_loss": -9.233380317687988, "global_step": 78498, "epoch": 467} {"train_loss": -9.095741271972656, "global_step": 78499, "epoch": 467} {"train_loss": -9.045181274414062, "global_step": 78500, "epoch": 467} {"train_loss": -9.22185230255127, "global_step": 78501, "epoch": 467} {"train_loss": -9.10708236694336, "global_step": 78502, "epoch": 467} {"train_loss": -9.173938751220703, "global_step": 78503, "epoch": 467} {"train_loss": -9.162341117858887, "global_step": 78504, "epoch": 467} {"train_loss": -9.220608711242676, "global_step": 78505, "epoch": 467} {"train_loss": -8.961556434631348, "global_step": 78506, "epoch": 467} {"train_loss": -9.304527282714844, "global_step": 78507, "epoch": 467} {"train_loss": -9.298105239868164, "global_step": 78508, "epoch": 467} {"train_loss": -9.446805000305176, "global_step": 78509, "epoch": 467} {"train_loss": -9.316494941711426, "global_step": 78510, "epoch": 467} {"train_loss": -9.12914752960205, "global_step": 78511, "epoch": 467} {"train_loss": -9.275060653686523, "global_step": 78512, "epoch": 467} {"train_loss": -9.274463653564453, "global_step": 78513, "epoch": 467} {"train_loss": -9.18932056427002, "global_step": 78514, "epoch": 467} {"train_loss": -9.311365127563477, "global_step": 78515, "epoch": 467} {"train_loss": -9.251692771911621, "global_step": 78516, "epoch": 467} {"train_loss": -8.934133529663086, "global_step": 78517, "epoch": 467} {"train_loss": -9.449102401733398, "global_step": 78518, "epoch": 467} {"train_loss": -9.14309024810791, "global_step": 78519, "epoch": 467} {"train_loss": -9.018899917602539, "global_step": 78520, "epoch": 467} {"train_loss": -9.301677703857422, "global_step": 78521, "epoch": 467} {"train_loss": -9.29937744140625, "global_step": 78522, "epoch": 467} {"train_loss": -9.253180503845215, "global_step": 78523, "epoch": 467} {"train_loss": -9.185232162475586, "global_step": 78524, "epoch": 467} {"train_loss": -9.028955459594727, "global_step": 78525, "epoch": 467} {"train_loss": -9.012474060058594, "global_step": 78526, "epoch": 467} {"train_loss": -9.078645706176758, "global_step": 78527, "epoch": 467} {"train_loss": -9.036040306091309, "global_step": 78528, "epoch": 467} {"train_loss": -9.216835975646973, "global_step": 78529, "epoch": 467} {"train_loss": -8.789703369140625, "global_step": 78530, "epoch": 467} {"train_loss": -8.666474342346191, "global_step": 78531, "epoch": 467} {"train_loss": -9.100702285766602, "global_step": 78532, "epoch": 467} {"train_loss": -8.783061981201172, "global_step": 78533, "epoch": 467} {"train_loss": -9.102912902832031, "global_step": 78534, "epoch": 467} {"train_loss": -8.888593673706055, "global_step": 78535, "epoch": 467} {"train_loss": -8.822391510009766, "global_step": 78536, "epoch": 467} {"train_loss": -9.138982772827148, "global_step": 78537, "epoch": 467} {"train_loss": -9.237284660339355, "global_step": 78538, "epoch": 467} {"train_loss": -8.972764015197754, "global_step": 78539, "epoch": 467} {"train_loss": -9.065759658813477, "global_step": 78540, "epoch": 467} {"train_loss": -9.225606918334961, "global_step": 78541, "epoch": 467} {"train_loss": -8.867097854614258, "global_step": 78542, "epoch": 467} {"train_loss": -9.008413314819336, "global_step": 78543, "epoch": 467} {"train_loss": -9.211648941040039, "global_step": 78544, "epoch": 467} {"train_loss": -8.83879280090332, "global_step": 78545, "epoch": 467} {"train_loss": -8.966129302978516, "global_step": 78546, "epoch": 467} {"train_loss": -9.222846984863281, "global_step": 78547, "epoch": 467} {"train_loss": -8.763338088989258, "global_step": 78548, "epoch": 467} {"train_loss": -9.07070541381836, "global_step": 78549, "epoch": 467} {"train_loss": -8.811956405639648, "global_step": 78550, "epoch": 467} {"train_loss": -9.03138542175293, "global_step": 78551, "epoch": 467} {"train_loss": -8.988550186157227, "global_step": 78552, "epoch": 467} {"train_loss": -9.20203971862793, "global_step": 78553, "epoch": 467} {"train_loss": -8.964818000793457, "global_step": 78554, "epoch": 467} {"train_loss": -9.274216651916504, "global_step": 78555, "epoch": 467} {"train_loss": -8.816363334655762, "global_step": 78556, "epoch": 467} {"train_loss": -9.225313186645508, "global_step": 78557, "epoch": 467} {"train_loss": -9.185628890991211, "global_step": 78558, "epoch": 467} {"train_loss": -8.856740951538086, "global_step": 78559, "epoch": 467} {"train_loss": -9.145925521850586, "global_step": 78560, "epoch": 467} {"train_loss": -8.908828735351562, "global_step": 78561, "epoch": 467} {"train_loss": -9.101764678955078, "global_step": 78562, "epoch": 467} {"train_loss": -8.909259796142578, "global_step": 78563, "epoch": 467} {"train_loss": -9.224241256713867, "global_step": 78564, "epoch": 467} {"train_loss": -8.693597793579102, "global_step": 78565, "epoch": 467} {"train_loss": -9.042709350585938, "global_step": 78566, "epoch": 467} {"train_loss": -9.0520601272583, "global_step": 78567, "epoch": 467} {"train_loss": -8.7618989944458, "global_step": 78568, "epoch": 467} {"train_loss": -8.387189865112305, "global_step": 78569, "epoch": 467} {"train_loss": -8.935300827026367, "global_step": 78570, "epoch": 467} {"train_loss": -8.724327087402344, "global_step": 78571, "epoch": 467} {"train_loss": -8.881998062133789, "global_step": 78572, "epoch": 467} {"train_loss": -8.674766540527344, "global_step": 78573, "epoch": 467} {"train_loss": -8.816793441772461, "global_step": 78574, "epoch": 467} {"train_loss": -8.920629501342773, "global_step": 78575, "epoch": 467} {"train_loss": -8.90472412109375, "global_step": 78576, "epoch": 467} {"train_loss": -8.848627090454102, "global_step": 78577, "epoch": 467} {"train_loss": -8.892387390136719, "global_step": 78578, "epoch": 467} {"train_loss": -8.937410354614258, "global_step": 78579, "epoch": 467} {"train_loss": -8.93710994720459, "global_step": 78580, "epoch": 467} {"train_loss": -9.188374519348145, "global_step": 78581, "epoch": 467} {"train_loss": -9.032451629638672, "global_step": 78582, "epoch": 467} {"train_loss": -8.88033676147461, "global_step": 78583, "epoch": 467} {"train_loss": -8.88084602355957, "global_step": 78584, "epoch": 467} {"train_loss": -9.011341094970703, "global_step": 78585, "epoch": 467} {"train_loss": -9.05100154876709, "global_step": 78586, "epoch": 467} {"train_loss": -9.095029830932617, "global_step": 78587, "epoch": 467} {"train_loss": -8.972110748291016, "global_step": 78588, "epoch": 467} {"train_loss": -9.316909790039062, "global_step": 78589, "epoch": 467} {"train_loss": -9.160451889038086, "global_step": 78590, "epoch": 467} {"train_loss": -8.997453689575195, "global_step": 78591, "epoch": 467} {"train_loss": -9.121047973632812, "global_step": 78592, "epoch": 467} {"train_loss": -8.989728927612305, "global_step": 78593, "epoch": 467} {"train_loss": -8.942974090576172, "global_step": 78594, "epoch": 467} {"train_loss": -9.218647956848145, "global_step": 78595, "epoch": 467} {"train_loss": -9.568187713623047, "global_step": 78596, "epoch": 467} {"train_loss": -8.971881866455078, "global_step": 78597, "epoch": 467} {"train_loss": -9.316780090332031, "global_step": 78598, "epoch": 467} {"train_loss": -8.93273639678955, "global_step": 78599, "epoch": 467} {"train_loss": -9.019145965576172, "global_step": 78600, "epoch": 467} {"train_loss": -9.354820251464844, "global_step": 78601, "epoch": 467} {"train_loss": -9.21945571899414, "global_step": 78602, "epoch": 467} {"train_loss": -9.17145824432373, "global_step": 78603, "epoch": 467} {"train_loss": -9.184765815734863, "global_step": 78604, "epoch": 467} {"train_loss": -9.245246887207031, "global_step": 78605, "epoch": 467} {"train_loss": -9.350130081176758, "global_step": 78606, "epoch": 467} {"train_loss": -8.848752975463867, "global_step": 78607, "epoch": 467} {"train_loss": -9.174211502075195, "global_step": 78608, "epoch": 467} {"train_loss": -9.142196655273438, "global_step": 78609, "epoch": 467} {"train_loss": -8.984685897827148, "global_step": 78610, "epoch": 467} {"train_loss": -9.094566345214844, "global_step": 78611, "epoch": 467} {"train_loss": -9.229893684387207, "global_step": 78612, "epoch": 467} {"train_loss": -9.32514476776123, "global_step": 78613, "epoch": 467} {"train_loss": -9.292272567749023, "global_step": 78614, "epoch": 467} {"train_loss": -8.884876251220703, "global_step": 78615, "epoch": 467} {"train_loss": -9.134034156799316, "global_step": 78616, "epoch": 467} {"train_loss": -9.064508438110352, "global_step": 78617, "epoch": 467} {"train_loss": -8.911771774291992, "global_step": 78618, "epoch": 467} {"train_loss": -9.13878059387207, "global_step": 78619, "epoch": 467} {"train_loss": -9.104177474975586, "global_step": 78620, "epoch": 467} {"train_loss": -9.044841766357422, "global_step": 78621, "epoch": 467} {"train_loss": -8.785418510437012, "global_step": 78622, "epoch": 467} {"train_loss": -9.073687967799959, "global_step": 78623, "epoch": 467, "val_loss": 196084.90625} {"train_loss": -9.083959579467773, "global_step": 78624, "epoch": 468} {"train_loss": -8.505030632019043, "global_step": 78625, "epoch": 468} {"train_loss": -8.990633010864258, "global_step": 78626, "epoch": 468} {"train_loss": -8.891921043395996, "global_step": 78627, "epoch": 468} {"train_loss": -8.733179092407227, "global_step": 78628, "epoch": 468} {"train_loss": -8.70969009399414, "global_step": 78629, "epoch": 468} {"train_loss": -8.618824005126953, "global_step": 78630, "epoch": 468} {"train_loss": -8.712568283081055, "global_step": 78631, "epoch": 468} {"train_loss": -8.836587905883789, "global_step": 78632, "epoch": 468} {"train_loss": -8.847860336303711, "global_step": 78633, "epoch": 468} {"train_loss": -8.9569730758667, "global_step": 78634, "epoch": 468} {"train_loss": -8.964582443237305, "global_step": 78635, "epoch": 468} {"train_loss": -9.114029884338379, "global_step": 78636, "epoch": 468} {"train_loss": -8.946516036987305, "global_step": 78637, "epoch": 468} {"train_loss": -9.055907249450684, "global_step": 78638, "epoch": 468} {"train_loss": -8.91392993927002, "global_step": 78639, "epoch": 468} {"train_loss": -8.738481521606445, "global_step": 78640, "epoch": 468} {"train_loss": -9.258296966552734, "global_step": 78641, "epoch": 468} {"train_loss": -9.10152530670166, "global_step": 78642, "epoch": 468} {"train_loss": -9.229785919189453, "global_step": 78643, "epoch": 468} {"train_loss": -9.248910903930664, "global_step": 78644, "epoch": 468} {"train_loss": -9.367165565490723, "global_step": 78645, "epoch": 468} {"train_loss": -9.306597709655762, "global_step": 78646, "epoch": 468} {"train_loss": -9.075959205627441, "global_step": 78647, "epoch": 468} {"train_loss": -9.231023788452148, "global_step": 78648, "epoch": 468} {"train_loss": -9.20330810546875, "global_step": 78649, "epoch": 468} {"train_loss": -9.156179428100586, "global_step": 78650, "epoch": 468} {"train_loss": -9.17111873626709, "global_step": 78651, "epoch": 468} {"train_loss": -9.429346084594727, "global_step": 78652, "epoch": 468} {"train_loss": -8.974900245666504, "global_step": 78653, "epoch": 468} {"train_loss": -9.224485397338867, "global_step": 78654, "epoch": 468} {"train_loss": -9.24899673461914, "global_step": 78655, "epoch": 468} {"train_loss": -9.242303848266602, "global_step": 78656, "epoch": 468} {"train_loss": -9.12905502319336, "global_step": 78657, "epoch": 468} {"train_loss": -9.285039901733398, "global_step": 78658, "epoch": 468} {"train_loss": -9.311214447021484, "global_step": 78659, "epoch": 468} {"train_loss": -9.19056510925293, "global_step": 78660, "epoch": 468} {"train_loss": -9.181196212768555, "global_step": 78661, "epoch": 468} {"train_loss": -9.273822784423828, "global_step": 78662, "epoch": 468} {"train_loss": -9.380950927734375, "global_step": 78663, "epoch": 468} {"train_loss": -9.134706497192383, "global_step": 78664, "epoch": 468} {"train_loss": -9.295899391174316, "global_step": 78665, "epoch": 468} {"train_loss": -9.354461669921875, "global_step": 78666, "epoch": 468} {"train_loss": -9.15780258178711, "global_step": 78667, "epoch": 468} {"train_loss": -9.076131820678711, "global_step": 78668, "epoch": 468} {"train_loss": -8.671611785888672, "global_step": 78669, "epoch": 468} {"train_loss": -9.15048885345459, "global_step": 78670, "epoch": 468} {"train_loss": -8.836387634277344, "global_step": 78671, "epoch": 468} {"train_loss": -8.719133377075195, "global_step": 78672, "epoch": 468} {"train_loss": -9.057548522949219, "global_step": 78673, "epoch": 468} {"train_loss": -8.849841117858887, "global_step": 78674, "epoch": 468} {"train_loss": -9.142559051513672, "global_step": 78675, "epoch": 468} {"train_loss": -9.054508209228516, "global_step": 78676, "epoch": 468} {"train_loss": -9.161975860595703, "global_step": 78677, "epoch": 468} {"train_loss": -9.021657943725586, "global_step": 78678, "epoch": 468} {"train_loss": -9.114134788513184, "global_step": 78679, "epoch": 468} {"train_loss": -9.185020446777344, "global_step": 78680, "epoch": 468} {"train_loss": -8.748201370239258, "global_step": 78681, "epoch": 468} {"train_loss": -9.034629821777344, "global_step": 78682, "epoch": 468} {"train_loss": -9.236164093017578, "global_step": 78683, "epoch": 468} {"train_loss": -9.184732437133789, "global_step": 78684, "epoch": 468} {"train_loss": -9.043672561645508, "global_step": 78685, "epoch": 468} {"train_loss": -9.178901672363281, "global_step": 78686, "epoch": 468} {"train_loss": -8.963299751281738, "global_step": 78687, "epoch": 468} {"train_loss": -9.244656562805176, "global_step": 78688, "epoch": 468} {"train_loss": -9.334541320800781, "global_step": 78689, "epoch": 468} {"train_loss": -9.123523712158203, "global_step": 78690, "epoch": 468} {"train_loss": -9.16867733001709, "global_step": 78691, "epoch": 468} {"train_loss": -8.803741455078125, "global_step": 78692, "epoch": 468} {"train_loss": -9.228376388549805, "global_step": 78693, "epoch": 468} {"train_loss": -9.070906639099121, "global_step": 78694, "epoch": 468} {"train_loss": -9.194307327270508, "global_step": 78695, "epoch": 468} {"train_loss": -9.069534301757812, "global_step": 78696, "epoch": 468} {"train_loss": -9.377487182617188, "global_step": 78697, "epoch": 468} {"train_loss": -9.197074890136719, "global_step": 78698, "epoch": 468} {"train_loss": -9.285271644592285, "global_step": 78699, "epoch": 468} {"train_loss": -9.007869720458984, "global_step": 78700, "epoch": 468} {"train_loss": -9.253247261047363, "global_step": 78701, "epoch": 468} {"train_loss": -9.572102546691895, "global_step": 78702, "epoch": 468} {"train_loss": -9.16726303100586, "global_step": 78703, "epoch": 468} {"train_loss": -9.193964004516602, "global_step": 78704, "epoch": 468} {"train_loss": -8.955825805664062, "global_step": 78705, "epoch": 468} {"train_loss": -9.226648330688477, "global_step": 78706, "epoch": 468} {"train_loss": -9.17990493774414, "global_step": 78707, "epoch": 468} {"train_loss": -9.36782169342041, "global_step": 78708, "epoch": 468} {"train_loss": -8.972068786621094, "global_step": 78709, "epoch": 468} {"train_loss": -9.184869766235352, "global_step": 78710, "epoch": 468} {"train_loss": -8.883703231811523, "global_step": 78711, "epoch": 468} {"train_loss": -9.274517059326172, "global_step": 78712, "epoch": 468} {"train_loss": -9.250740051269531, "global_step": 78713, "epoch": 468} {"train_loss": -8.968854904174805, "global_step": 78714, "epoch": 468} {"train_loss": -8.93380069732666, "global_step": 78715, "epoch": 468} {"train_loss": -8.863018035888672, "global_step": 78716, "epoch": 468} {"train_loss": -9.229406356811523, "global_step": 78717, "epoch": 468} {"train_loss": -9.19201374053955, "global_step": 78718, "epoch": 468} {"train_loss": -9.4730224609375, "global_step": 78719, "epoch": 468} {"train_loss": -9.207406997680664, "global_step": 78720, "epoch": 468} {"train_loss": -9.22548770904541, "global_step": 78721, "epoch": 468} {"train_loss": -9.21365737915039, "global_step": 78722, "epoch": 468} {"train_loss": -9.052534103393555, "global_step": 78723, "epoch": 468} {"train_loss": -8.91009521484375, "global_step": 78724, "epoch": 468} {"train_loss": -9.230745315551758, "global_step": 78725, "epoch": 468} {"train_loss": -9.175603866577148, "global_step": 78726, "epoch": 468} {"train_loss": -8.67392635345459, "global_step": 78727, "epoch": 468} {"train_loss": -8.842206001281738, "global_step": 78728, "epoch": 468} {"train_loss": -9.065991401672363, "global_step": 78729, "epoch": 468} {"train_loss": -8.860100746154785, "global_step": 78730, "epoch": 468} {"train_loss": -9.176149368286133, "global_step": 78731, "epoch": 468} {"train_loss": -9.333459854125977, "global_step": 78732, "epoch": 468} {"train_loss": -9.139347076416016, "global_step": 78733, "epoch": 468} {"train_loss": -9.19825553894043, "global_step": 78734, "epoch": 468} {"train_loss": -8.946084022521973, "global_step": 78735, "epoch": 468} {"train_loss": -9.056528091430664, "global_step": 78736, "epoch": 468} {"train_loss": -9.053106307983398, "global_step": 78737, "epoch": 468} {"train_loss": -9.271361351013184, "global_step": 78738, "epoch": 468} {"train_loss": -8.961690902709961, "global_step": 78739, "epoch": 468} {"train_loss": -9.244318008422852, "global_step": 78740, "epoch": 468} {"train_loss": -9.359872817993164, "global_step": 78741, "epoch": 468} {"train_loss": -9.004170417785645, "global_step": 78742, "epoch": 468} {"train_loss": -9.35050106048584, "global_step": 78743, "epoch": 468} {"train_loss": -9.072271347045898, "global_step": 78744, "epoch": 468} {"train_loss": -9.329049110412598, "global_step": 78745, "epoch": 468} {"train_loss": -9.328680992126465, "global_step": 78746, "epoch": 468} {"train_loss": -9.086874008178711, "global_step": 78747, "epoch": 468} {"train_loss": -9.152856826782227, "global_step": 78748, "epoch": 468} {"train_loss": -8.867414474487305, "global_step": 78749, "epoch": 468} {"train_loss": -9.330293655395508, "global_step": 78750, "epoch": 468} {"train_loss": -9.224809646606445, "global_step": 78751, "epoch": 468} {"train_loss": -9.372762680053711, "global_step": 78752, "epoch": 468} {"train_loss": -9.272382736206055, "global_step": 78753, "epoch": 468} {"train_loss": -9.535295486450195, "global_step": 78754, "epoch": 468} {"train_loss": -9.428733825683594, "global_step": 78755, "epoch": 468} {"train_loss": -9.354171752929688, "global_step": 78756, "epoch": 468} {"train_loss": -9.04100227355957, "global_step": 78757, "epoch": 468} {"train_loss": -9.186205863952637, "global_step": 78758, "epoch": 468} {"train_loss": -8.94742488861084, "global_step": 78759, "epoch": 468} {"train_loss": -8.978710174560547, "global_step": 78760, "epoch": 468} {"train_loss": -9.271934509277344, "global_step": 78761, "epoch": 468} {"train_loss": -9.217994689941406, "global_step": 78762, "epoch": 468} {"train_loss": -9.269427299499512, "global_step": 78763, "epoch": 468} {"train_loss": -9.305490493774414, "global_step": 78764, "epoch": 468} {"train_loss": -9.134328842163086, "global_step": 78765, "epoch": 468} {"train_loss": -8.862302780151367, "global_step": 78766, "epoch": 468} {"train_loss": -9.388611793518066, "global_step": 78767, "epoch": 468} {"train_loss": -9.222107887268066, "global_step": 78768, "epoch": 468} {"train_loss": -9.0787353515625, "global_step": 78769, "epoch": 468} {"train_loss": -9.066694259643555, "global_step": 78770, "epoch": 468} {"train_loss": -8.73690128326416, "global_step": 78771, "epoch": 468} {"train_loss": -9.24378776550293, "global_step": 78772, "epoch": 468} {"train_loss": -8.785688400268555, "global_step": 78773, "epoch": 468} {"train_loss": -8.83144474029541, "global_step": 78774, "epoch": 468} {"train_loss": -8.92031192779541, "global_step": 78775, "epoch": 468} {"train_loss": -8.867094039916992, "global_step": 78776, "epoch": 468} {"train_loss": -9.074978828430176, "global_step": 78777, "epoch": 468} {"train_loss": -8.918191909790039, "global_step": 78778, "epoch": 468} {"train_loss": -9.068950653076172, "global_step": 78779, "epoch": 468} {"train_loss": -8.715890884399414, "global_step": 78780, "epoch": 468} {"train_loss": -9.102941513061523, "global_step": 78781, "epoch": 468} {"train_loss": -8.868585586547852, "global_step": 78782, "epoch": 468} {"train_loss": -9.135054588317871, "global_step": 78783, "epoch": 468} {"train_loss": -9.400115966796875, "global_step": 78784, "epoch": 468} {"train_loss": -9.076140403747559, "global_step": 78785, "epoch": 468} {"train_loss": -8.859380722045898, "global_step": 78786, "epoch": 468} {"train_loss": -9.026843070983887, "global_step": 78787, "epoch": 468} {"train_loss": -9.229610443115234, "global_step": 78788, "epoch": 468} {"train_loss": -9.167051315307617, "global_step": 78789, "epoch": 468} {"train_loss": -9.02688217163086, "global_step": 78790, "epoch": 468} {"train_loss": -9.103569916316442, "global_step": 78791, "epoch": 468, "val_loss": 195488.515625} {"train_loss": -9.053759574890137, "global_step": 78792, "epoch": 469} {"train_loss": -9.262676239013672, "global_step": 78793, "epoch": 469} {"train_loss": -9.250776290893555, "global_step": 78794, "epoch": 469} {"train_loss": -9.131311416625977, "global_step": 78795, "epoch": 469} {"train_loss": -8.954387664794922, "global_step": 78796, "epoch": 469} {"train_loss": -9.05017375946045, "global_step": 78797, "epoch": 469} {"train_loss": -9.213214874267578, "global_step": 78798, "epoch": 469} {"train_loss": -8.976781845092773, "global_step": 78799, "epoch": 469} {"train_loss": -9.436653137207031, "global_step": 78800, "epoch": 469} {"train_loss": -9.257898330688477, "global_step": 78801, "epoch": 469} {"train_loss": -9.189018249511719, "global_step": 78802, "epoch": 469} {"train_loss": -9.413726806640625, "global_step": 78803, "epoch": 469} {"train_loss": -9.29356575012207, "global_step": 78804, "epoch": 469} {"train_loss": -9.409112930297852, "global_step": 78805, "epoch": 469} {"train_loss": -9.454895973205566, "global_step": 78806, "epoch": 469} {"train_loss": -9.221439361572266, "global_step": 78807, "epoch": 469} {"train_loss": -9.420404434204102, "global_step": 78808, "epoch": 469} {"train_loss": -9.14635944366455, "global_step": 78809, "epoch": 469} {"train_loss": -9.580042839050293, "global_step": 78810, "epoch": 469} {"train_loss": -9.122381210327148, "global_step": 78811, "epoch": 469} {"train_loss": -9.521060943603516, "global_step": 78812, "epoch": 469} {"train_loss": -9.261322975158691, "global_step": 78813, "epoch": 469} {"train_loss": -9.399787902832031, "global_step": 78814, "epoch": 469} {"train_loss": -9.579180717468262, "global_step": 78815, "epoch": 469} {"train_loss": -9.352246284484863, "global_step": 78816, "epoch": 469} {"train_loss": -9.264236450195312, "global_step": 78817, "epoch": 469} {"train_loss": -9.29743766784668, "global_step": 78818, "epoch": 469} {"train_loss": -9.431108474731445, "global_step": 78819, "epoch": 469} {"train_loss": -9.353107452392578, "global_step": 78820, "epoch": 469} {"train_loss": -9.271041870117188, "global_step": 78821, "epoch": 469} {"train_loss": -9.488170623779297, "global_step": 78822, "epoch": 469} {"train_loss": -9.177886962890625, "global_step": 78823, "epoch": 469} {"train_loss": -9.329244613647461, "global_step": 78824, "epoch": 469} {"train_loss": -9.512659072875977, "global_step": 78825, "epoch": 469} {"train_loss": -9.46216106414795, "global_step": 78826, "epoch": 469} {"train_loss": -9.449432373046875, "global_step": 78827, "epoch": 469} {"train_loss": -9.371883392333984, "global_step": 78828, "epoch": 469} {"train_loss": -9.244497299194336, "global_step": 78829, "epoch": 469} {"train_loss": -9.24721622467041, "global_step": 78830, "epoch": 469} {"train_loss": -9.102025985717773, "global_step": 78831, "epoch": 469} {"train_loss": -9.519853591918945, "global_step": 78832, "epoch": 469} {"train_loss": -9.344096183776855, "global_step": 78833, "epoch": 469} {"train_loss": -9.309179306030273, "global_step": 78834, "epoch": 469} {"train_loss": -9.531745910644531, "global_step": 78835, "epoch": 469} {"train_loss": -9.149136543273926, "global_step": 78836, "epoch": 469} {"train_loss": -9.387781143188477, "global_step": 78837, "epoch": 469} {"train_loss": -8.782360076904297, "global_step": 78838, "epoch": 469} {"train_loss": -9.272523880004883, "global_step": 78839, "epoch": 469} {"train_loss": -9.233474731445312, "global_step": 78840, "epoch": 469} {"train_loss": -9.040229797363281, "global_step": 78841, "epoch": 469} {"train_loss": -9.30391788482666, "global_step": 78842, "epoch": 469} {"train_loss": -9.092988967895508, "global_step": 78843, "epoch": 469} {"train_loss": -9.151965141296387, "global_step": 78844, "epoch": 469} {"train_loss": -8.969008445739746, "global_step": 78845, "epoch": 469} {"train_loss": -9.264280319213867, "global_step": 78846, "epoch": 469} {"train_loss": -9.219707489013672, "global_step": 78847, "epoch": 469} {"train_loss": -9.257040023803711, "global_step": 78848, "epoch": 469} {"train_loss": -9.169072151184082, "global_step": 78849, "epoch": 469} {"train_loss": -9.29731559753418, "global_step": 78850, "epoch": 469} {"train_loss": -9.237202644348145, "global_step": 78851, "epoch": 469} {"train_loss": -9.275108337402344, "global_step": 78852, "epoch": 469} {"train_loss": -8.959206581115723, "global_step": 78853, "epoch": 469} {"train_loss": -9.27989673614502, "global_step": 78854, "epoch": 469} {"train_loss": -9.015338897705078, "global_step": 78855, "epoch": 469} {"train_loss": -9.141986846923828, "global_step": 78856, "epoch": 469} {"train_loss": -8.994842529296875, "global_step": 78857, "epoch": 469} {"train_loss": -9.171475410461426, "global_step": 78858, "epoch": 469} {"train_loss": -8.910505294799805, "global_step": 78859, "epoch": 469} {"train_loss": -8.934526443481445, "global_step": 78860, "epoch": 469} {"train_loss": -8.888826370239258, "global_step": 78861, "epoch": 469} {"train_loss": -9.268951416015625, "global_step": 78862, "epoch": 469} {"train_loss": -8.853538513183594, "global_step": 78863, "epoch": 469} {"train_loss": -8.885757446289062, "global_step": 78864, "epoch": 469} {"train_loss": -9.378447532653809, "global_step": 78865, "epoch": 469} {"train_loss": -9.215347290039062, "global_step": 78866, "epoch": 469} {"train_loss": -9.158339500427246, "global_step": 78867, "epoch": 469} {"train_loss": -9.325944900512695, "global_step": 78868, "epoch": 469} {"train_loss": -9.140613555908203, "global_step": 78869, "epoch": 469} {"train_loss": -9.423458099365234, "global_step": 78870, "epoch": 469} {"train_loss": -9.189414024353027, "global_step": 78871, "epoch": 469} {"train_loss": -9.106328964233398, "global_step": 78872, "epoch": 469} {"train_loss": -9.134803771972656, "global_step": 78873, "epoch": 469} {"train_loss": -9.122343063354492, "global_step": 78874, "epoch": 469} {"train_loss": -9.239227294921875, "global_step": 78875, "epoch": 469} {"train_loss": -9.353384017944336, "global_step": 78876, "epoch": 469} {"train_loss": -9.207765579223633, "global_step": 78877, "epoch": 469} {"train_loss": -9.316859245300293, "global_step": 78878, "epoch": 469} {"train_loss": -9.338811874389648, "global_step": 78879, "epoch": 469} {"train_loss": -9.128353118896484, "global_step": 78880, "epoch": 469} {"train_loss": -8.993465423583984, "global_step": 78881, "epoch": 469} {"train_loss": -9.142213821411133, "global_step": 78882, "epoch": 469} {"train_loss": -9.108336448669434, "global_step": 78883, "epoch": 469} {"train_loss": -9.20414924621582, "global_step": 78884, "epoch": 469} {"train_loss": -9.317331314086914, "global_step": 78885, "epoch": 469} {"train_loss": -9.416330337524414, "global_step": 78886, "epoch": 469} {"train_loss": -9.22829818725586, "global_step": 78887, "epoch": 469} {"train_loss": -9.152538299560547, "global_step": 78888, "epoch": 469} {"train_loss": -9.317916870117188, "global_step": 78889, "epoch": 469} {"train_loss": -9.171588897705078, "global_step": 78890, "epoch": 469} {"train_loss": -9.07258415222168, "global_step": 78891, "epoch": 469} {"train_loss": -9.423857688903809, "global_step": 78892, "epoch": 469} {"train_loss": -9.053964614868164, "global_step": 78893, "epoch": 469} {"train_loss": -9.209549903869629, "global_step": 78894, "epoch": 469} {"train_loss": -9.418045043945312, "global_step": 78895, "epoch": 469} {"train_loss": -9.226593017578125, "global_step": 78896, "epoch": 469} {"train_loss": -9.063264846801758, "global_step": 78897, "epoch": 469} {"train_loss": -9.127542495727539, "global_step": 78898, "epoch": 469} {"train_loss": -9.261873245239258, "global_step": 78899, "epoch": 469} {"train_loss": -9.011415481567383, "global_step": 78900, "epoch": 469} {"train_loss": -9.207233428955078, "global_step": 78901, "epoch": 469} {"train_loss": -9.280973434448242, "global_step": 78902, "epoch": 469} {"train_loss": -9.269538879394531, "global_step": 78903, "epoch": 469} {"train_loss": -9.058904647827148, "global_step": 78904, "epoch": 469} {"train_loss": -9.290964126586914, "global_step": 78905, "epoch": 469} {"train_loss": -9.332799911499023, "global_step": 78906, "epoch": 469} {"train_loss": -9.326300621032715, "global_step": 78907, "epoch": 469} {"train_loss": -9.18962574005127, "global_step": 78908, "epoch": 469} {"train_loss": -9.27392578125, "global_step": 78909, "epoch": 469} {"train_loss": -9.289392471313477, "global_step": 78910, "epoch": 469} {"train_loss": -9.176355361938477, "global_step": 78911, "epoch": 469} {"train_loss": -9.20334243774414, "global_step": 78912, "epoch": 469} {"train_loss": -9.158456802368164, "global_step": 78913, "epoch": 469} {"train_loss": -9.170872688293457, "global_step": 78914, "epoch": 469} {"train_loss": -9.387874603271484, "global_step": 78915, "epoch": 469} {"train_loss": -9.079349517822266, "global_step": 78916, "epoch": 469} {"train_loss": -9.324590682983398, "global_step": 78917, "epoch": 469} {"train_loss": -9.231081008911133, "global_step": 78918, "epoch": 469} {"train_loss": -9.153060913085938, "global_step": 78919, "epoch": 469} {"train_loss": -9.412150382995605, "global_step": 78920, "epoch": 469} {"train_loss": -9.014836311340332, "global_step": 78921, "epoch": 469} {"train_loss": -8.62943172454834, "global_step": 78922, "epoch": 469} {"train_loss": -9.169504165649414, "global_step": 78923, "epoch": 469} {"train_loss": -8.649805068969727, "global_step": 78924, "epoch": 469} {"train_loss": -9.16627311706543, "global_step": 78925, "epoch": 469} {"train_loss": -9.009038925170898, "global_step": 78926, "epoch": 469} {"train_loss": -8.71190071105957, "global_step": 78927, "epoch": 469} {"train_loss": -9.098520278930664, "global_step": 78928, "epoch": 469} {"train_loss": -8.924899101257324, "global_step": 78929, "epoch": 469} {"train_loss": -9.001426696777344, "global_step": 78930, "epoch": 469} {"train_loss": -9.072872161865234, "global_step": 78931, "epoch": 469} {"train_loss": -9.065164566040039, "global_step": 78932, "epoch": 469} {"train_loss": -9.26972770690918, "global_step": 78933, "epoch": 469} {"train_loss": -9.162351608276367, "global_step": 78934, "epoch": 469} {"train_loss": -9.011701583862305, "global_step": 78935, "epoch": 469} {"train_loss": -9.030451774597168, "global_step": 78936, "epoch": 469} {"train_loss": -8.995950698852539, "global_step": 78937, "epoch": 469} {"train_loss": -9.153779983520508, "global_step": 78938, "epoch": 469} {"train_loss": -9.332886695861816, "global_step": 78939, "epoch": 469} {"train_loss": -9.297279357910156, "global_step": 78940, "epoch": 469} {"train_loss": -9.100356101989746, "global_step": 78941, "epoch": 469} {"train_loss": -9.04115104675293, "global_step": 78942, "epoch": 469} {"train_loss": -9.048165321350098, "global_step": 78943, "epoch": 469} {"train_loss": -9.194640159606934, "global_step": 78944, "epoch": 469} {"train_loss": -9.059248924255371, "global_step": 78945, "epoch": 469} {"train_loss": -9.186529159545898, "global_step": 78946, "epoch": 469} {"train_loss": -8.88323974609375, "global_step": 78947, "epoch": 469} {"train_loss": -8.970548629760742, "global_step": 78948, "epoch": 469} {"train_loss": -9.381753921508789, "global_step": 78949, "epoch": 469} {"train_loss": -9.017409324645996, "global_step": 78950, "epoch": 469} {"train_loss": -9.404352188110352, "global_step": 78951, "epoch": 469} {"train_loss": -9.24831771850586, "global_step": 78952, "epoch": 469} {"train_loss": -9.27608871459961, "global_step": 78953, "epoch": 469} {"train_loss": -9.082586288452148, "global_step": 78954, "epoch": 469} {"train_loss": -9.436302185058594, "global_step": 78955, "epoch": 469} {"train_loss": -9.169175148010254, "global_step": 78956, "epoch": 469} {"train_loss": -9.091861724853516, "global_step": 78957, "epoch": 469} {"train_loss": -9.576455116271973, "global_step": 78958, "epoch": 469} {"train_loss": -9.200784569694882, "global_step": 78959, "epoch": 469, "val_loss": 197528.65625} {"train_loss": -9.20246696472168, "global_step": 78960, "epoch": 470} {"train_loss": -9.32608413696289, "global_step": 78961, "epoch": 470} {"train_loss": -9.04985523223877, "global_step": 78962, "epoch": 470} {"train_loss": -9.182615280151367, "global_step": 78963, "epoch": 470} {"train_loss": -8.741918563842773, "global_step": 78964, "epoch": 470} {"train_loss": -9.238201141357422, "global_step": 78965, "epoch": 470} {"train_loss": -9.306207656860352, "global_step": 78966, "epoch": 470} {"train_loss": -8.752195358276367, "global_step": 78967, "epoch": 470} {"train_loss": -9.004074096679688, "global_step": 78968, "epoch": 470} {"train_loss": -9.150106430053711, "global_step": 78969, "epoch": 470} {"train_loss": -8.974294662475586, "global_step": 78970, "epoch": 470} {"train_loss": -9.295671463012695, "global_step": 78971, "epoch": 470} {"train_loss": -8.882146835327148, "global_step": 78972, "epoch": 470} {"train_loss": -9.19271469116211, "global_step": 78973, "epoch": 470} {"train_loss": -9.251875877380371, "global_step": 78974, "epoch": 470} {"train_loss": -9.24129867553711, "global_step": 78975, "epoch": 470} {"train_loss": -9.016151428222656, "global_step": 78976, "epoch": 470} {"train_loss": -9.155271530151367, "global_step": 78977, "epoch": 470} {"train_loss": -9.306089401245117, "global_step": 78978, "epoch": 470} {"train_loss": -8.979660034179688, "global_step": 78979, "epoch": 470} {"train_loss": -9.242752075195312, "global_step": 78980, "epoch": 470} {"train_loss": -8.912123680114746, "global_step": 78981, "epoch": 470} {"train_loss": -8.946008682250977, "global_step": 78982, "epoch": 470} {"train_loss": -8.87381362915039, "global_step": 78983, "epoch": 470} {"train_loss": -9.12380599975586, "global_step": 78984, "epoch": 470} {"train_loss": -8.895090103149414, "global_step": 78985, "epoch": 470} {"train_loss": -9.327655792236328, "global_step": 78986, "epoch": 470} {"train_loss": -9.129986763000488, "global_step": 78987, "epoch": 470} {"train_loss": -9.213544845581055, "global_step": 78988, "epoch": 470} {"train_loss": -9.077518463134766, "global_step": 78989, "epoch": 470} {"train_loss": -9.219730377197266, "global_step": 78990, "epoch": 470} {"train_loss": -9.057352066040039, "global_step": 78991, "epoch": 470} {"train_loss": -9.181547164916992, "global_step": 78992, "epoch": 470} {"train_loss": -9.260665893554688, "global_step": 78993, "epoch": 470} {"train_loss": -9.100138664245605, "global_step": 78994, "epoch": 470} {"train_loss": -9.031590461730957, "global_step": 78995, "epoch": 470} {"train_loss": -9.046463012695312, "global_step": 78996, "epoch": 470} {"train_loss": -9.078645706176758, "global_step": 78997, "epoch": 470} {"train_loss": -9.230681419372559, "global_step": 78998, "epoch": 470} {"train_loss": -9.177833557128906, "global_step": 78999, "epoch": 470} {"train_loss": -9.170763969421387, "global_step": 79000, "epoch": 470} {"train_loss": -9.298867225646973, "global_step": 79001, "epoch": 470} {"train_loss": -9.128450393676758, "global_step": 79002, "epoch": 470} {"train_loss": -9.052129745483398, "global_step": 79003, "epoch": 470} {"train_loss": -9.118507385253906, "global_step": 79004, "epoch": 470} {"train_loss": -9.33011245727539, "global_step": 79005, "epoch": 470} {"train_loss": -9.144411087036133, "global_step": 79006, "epoch": 470} {"train_loss": -9.18630599975586, "global_step": 79007, "epoch": 470} {"train_loss": -9.37326431274414, "global_step": 79008, "epoch": 470} {"train_loss": -9.309111595153809, "global_step": 79009, "epoch": 470} {"train_loss": -9.228346824645996, "global_step": 79010, "epoch": 470} {"train_loss": -9.25001335144043, "global_step": 79011, "epoch": 470} {"train_loss": -9.326327323913574, "global_step": 79012, "epoch": 470} {"train_loss": -9.242189407348633, "global_step": 79013, "epoch": 470} {"train_loss": -9.24821662902832, "global_step": 79014, "epoch": 470} {"train_loss": -9.368791580200195, "global_step": 79015, "epoch": 470} {"train_loss": -9.291324615478516, "global_step": 79016, "epoch": 470} {"train_loss": -9.141063690185547, "global_step": 79017, "epoch": 470} {"train_loss": -9.281801223754883, "global_step": 79018, "epoch": 470} {"train_loss": -9.166390419006348, "global_step": 79019, "epoch": 470} {"train_loss": -9.398746490478516, "global_step": 79020, "epoch": 470} {"train_loss": -8.976085662841797, "global_step": 79021, "epoch": 470} {"train_loss": -9.120758056640625, "global_step": 79022, "epoch": 470} {"train_loss": -9.241019248962402, "global_step": 79023, "epoch": 470} {"train_loss": -9.219361305236816, "global_step": 79024, "epoch": 470} {"train_loss": -9.23830795288086, "global_step": 79025, "epoch": 470} {"train_loss": -9.084181785583496, "global_step": 79026, "epoch": 470} {"train_loss": -8.9160737991333, "global_step": 79027, "epoch": 470} {"train_loss": -8.933484077453613, "global_step": 79028, "epoch": 470} {"train_loss": -9.086211204528809, "global_step": 79029, "epoch": 470} {"train_loss": -8.979452133178711, "global_step": 79030, "epoch": 470} {"train_loss": -8.852837562561035, "global_step": 79031, "epoch": 470} {"train_loss": -8.88422966003418, "global_step": 79032, "epoch": 470} {"train_loss": -9.004833221435547, "global_step": 79033, "epoch": 470} {"train_loss": -8.936177253723145, "global_step": 79034, "epoch": 470} {"train_loss": -8.68471908569336, "global_step": 79035, "epoch": 470} {"train_loss": -9.029359817504883, "global_step": 79036, "epoch": 470} {"train_loss": -9.02299690246582, "global_step": 79037, "epoch": 470} {"train_loss": -9.102622985839844, "global_step": 79038, "epoch": 470} {"train_loss": -9.07184886932373, "global_step": 79039, "epoch": 470} {"train_loss": -9.090094566345215, "global_step": 79040, "epoch": 470} {"train_loss": -8.782669067382812, "global_step": 79041, "epoch": 470} {"train_loss": -9.05467414855957, "global_step": 79042, "epoch": 470} {"train_loss": -9.108046531677246, "global_step": 79043, "epoch": 470} {"train_loss": -8.822257041931152, "global_step": 79044, "epoch": 470} {"train_loss": -8.827554702758789, "global_step": 79045, "epoch": 470} {"train_loss": -9.061153411865234, "global_step": 79046, "epoch": 470} {"train_loss": -9.311443328857422, "global_step": 79047, "epoch": 470} {"train_loss": -8.872562408447266, "global_step": 79048, "epoch": 470} {"train_loss": -9.047858238220215, "global_step": 79049, "epoch": 470} {"train_loss": -9.185178756713867, "global_step": 79050, "epoch": 470} {"train_loss": -8.950189590454102, "global_step": 79051, "epoch": 470} {"train_loss": -9.136341094970703, "global_step": 79052, "epoch": 470} {"train_loss": -9.352599143981934, "global_step": 79053, "epoch": 470} {"train_loss": -9.035836219787598, "global_step": 79054, "epoch": 470} {"train_loss": -9.279487609863281, "global_step": 79055, "epoch": 470} {"train_loss": -8.906357765197754, "global_step": 79056, "epoch": 470} {"train_loss": -9.141266822814941, "global_step": 79057, "epoch": 470} {"train_loss": -9.299427032470703, "global_step": 79058, "epoch": 470} {"train_loss": -9.18736457824707, "global_step": 79059, "epoch": 470} {"train_loss": -9.022201538085938, "global_step": 79060, "epoch": 470} {"train_loss": -8.779867172241211, "global_step": 79061, "epoch": 470} {"train_loss": -9.020539283752441, "global_step": 79062, "epoch": 470} {"train_loss": -9.014603614807129, "global_step": 79063, "epoch": 470} {"train_loss": -9.207952499389648, "global_step": 79064, "epoch": 470} {"train_loss": -9.058623313903809, "global_step": 79065, "epoch": 470} {"train_loss": -9.054357528686523, "global_step": 79066, "epoch": 470} {"train_loss": -9.14117431640625, "global_step": 79067, "epoch": 470} {"train_loss": -9.17280387878418, "global_step": 79068, "epoch": 470} {"train_loss": -9.012704849243164, "global_step": 79069, "epoch": 470} {"train_loss": -9.359310150146484, "global_step": 79070, "epoch": 470} {"train_loss": -9.232912063598633, "global_step": 79071, "epoch": 470} {"train_loss": -9.191852569580078, "global_step": 79072, "epoch": 470} {"train_loss": -9.267610549926758, "global_step": 79073, "epoch": 470} {"train_loss": -9.384939193725586, "global_step": 79074, "epoch": 470} {"train_loss": -9.057437896728516, "global_step": 79075, "epoch": 470} {"train_loss": -9.280082702636719, "global_step": 79076, "epoch": 470} {"train_loss": -9.14455795288086, "global_step": 79077, "epoch": 470} {"train_loss": -9.355599403381348, "global_step": 79078, "epoch": 470} {"train_loss": -9.241268157958984, "global_step": 79079, "epoch": 470} {"train_loss": -9.138389587402344, "global_step": 79080, "epoch": 470} {"train_loss": -9.414865493774414, "global_step": 79081, "epoch": 470} {"train_loss": -9.026779174804688, "global_step": 79082, "epoch": 470} {"train_loss": -9.18722152709961, "global_step": 79083, "epoch": 470} {"train_loss": -9.0543212890625, "global_step": 79084, "epoch": 470} {"train_loss": -9.252614974975586, "global_step": 79085, "epoch": 470} {"train_loss": -9.241798400878906, "global_step": 79086, "epoch": 470} {"train_loss": -9.19119644165039, "global_step": 79087, "epoch": 470} {"train_loss": -9.244415283203125, "global_step": 79088, "epoch": 470} {"train_loss": -8.857747077941895, "global_step": 79089, "epoch": 470} {"train_loss": -9.45099925994873, "global_step": 79090, "epoch": 470} {"train_loss": -9.324806213378906, "global_step": 79091, "epoch": 470} {"train_loss": -9.002446174621582, "global_step": 79092, "epoch": 470} {"train_loss": -9.181373596191406, "global_step": 79093, "epoch": 470} {"train_loss": -8.958900451660156, "global_step": 79094, "epoch": 470} {"train_loss": -9.10312271118164, "global_step": 79095, "epoch": 470} {"train_loss": -9.015779495239258, "global_step": 79096, "epoch": 470} {"train_loss": -9.113350868225098, "global_step": 79097, "epoch": 470} {"train_loss": -9.007087707519531, "global_step": 79098, "epoch": 470} {"train_loss": -9.093574523925781, "global_step": 79099, "epoch": 470} {"train_loss": -8.863658905029297, "global_step": 79100, "epoch": 470} {"train_loss": -9.029525756835938, "global_step": 79101, "epoch": 470} {"train_loss": -9.069955825805664, "global_step": 79102, "epoch": 470} {"train_loss": -8.798799514770508, "global_step": 79103, "epoch": 470} {"train_loss": -8.671944618225098, "global_step": 79104, "epoch": 470} {"train_loss": -8.886032104492188, "global_step": 79105, "epoch": 470} {"train_loss": -9.030542373657227, "global_step": 79106, "epoch": 470} {"train_loss": -8.281731605529785, "global_step": 79107, "epoch": 470} {"train_loss": -9.056364059448242, "global_step": 79108, "epoch": 470} {"train_loss": -8.893465995788574, "global_step": 79109, "epoch": 470} {"train_loss": -8.846399307250977, "global_step": 79110, "epoch": 470} {"train_loss": -9.033855438232422, "global_step": 79111, "epoch": 470} {"train_loss": -9.265159606933594, "global_step": 79112, "epoch": 470} {"train_loss": -9.180628776550293, "global_step": 79113, "epoch": 470} {"train_loss": -8.817476272583008, "global_step": 79114, "epoch": 470} {"train_loss": -8.99576473236084, "global_step": 79115, "epoch": 470} {"train_loss": -8.962173461914062, "global_step": 79116, "epoch": 470} {"train_loss": -9.09404182434082, "global_step": 79117, "epoch": 470} {"train_loss": -9.266942024230957, "global_step": 79118, "epoch": 470} {"train_loss": -9.075654983520508, "global_step": 79119, "epoch": 470} {"train_loss": -9.151975631713867, "global_step": 79120, "epoch": 470} {"train_loss": -9.308237075805664, "global_step": 79121, "epoch": 470} {"train_loss": -9.458576202392578, "global_step": 79122, "epoch": 470} {"train_loss": -9.279451370239258, "global_step": 79123, "epoch": 470} {"train_loss": -8.977800369262695, "global_step": 79124, "epoch": 470} {"train_loss": -9.336835861206055, "global_step": 79125, "epoch": 470} {"train_loss": -9.088847160339355, "global_step": 79126, "epoch": 470} {"train_loss": -9.107593422844296, "global_step": 79127, "epoch": 470, "val_loss": 195886.40625, "train_action_mse_error": 4.920970439910889} {"train_loss": -8.942861557006836, "global_step": 79128, "epoch": 471} {"train_loss": -9.043270111083984, "global_step": 79129, "epoch": 471} {"train_loss": -9.183633804321289, "global_step": 79130, "epoch": 471} {"train_loss": -9.15029239654541, "global_step": 79131, "epoch": 471} {"train_loss": -9.351295471191406, "global_step": 79132, "epoch": 471} {"train_loss": -9.198202133178711, "global_step": 79133, "epoch": 471} {"train_loss": -8.985161781311035, "global_step": 79134, "epoch": 471} {"train_loss": -9.077958106994629, "global_step": 79135, "epoch": 471} {"train_loss": -8.977136611938477, "global_step": 79136, "epoch": 471} {"train_loss": -9.162884712219238, "global_step": 79137, "epoch": 471} {"train_loss": -9.028399467468262, "global_step": 79138, "epoch": 471} {"train_loss": -9.273103713989258, "global_step": 79139, "epoch": 471} {"train_loss": -8.891934394836426, "global_step": 79140, "epoch": 471} {"train_loss": -9.196527481079102, "global_step": 79141, "epoch": 471} {"train_loss": -9.07408618927002, "global_step": 79142, "epoch": 471} {"train_loss": -9.13672924041748, "global_step": 79143, "epoch": 471} {"train_loss": -8.955591201782227, "global_step": 79144, "epoch": 471} {"train_loss": -9.302785873413086, "global_step": 79145, "epoch": 471} {"train_loss": -9.166463851928711, "global_step": 79146, "epoch": 471} {"train_loss": -9.13201904296875, "global_step": 79147, "epoch": 471} {"train_loss": -8.959145545959473, "global_step": 79148, "epoch": 471} {"train_loss": -9.370741844177246, "global_step": 79149, "epoch": 471} {"train_loss": -8.635241508483887, "global_step": 79150, "epoch": 471} {"train_loss": -9.25136947631836, "global_step": 79151, "epoch": 471} {"train_loss": -9.2921724319458, "global_step": 79152, "epoch": 471} {"train_loss": -9.274589538574219, "global_step": 79153, "epoch": 471} {"train_loss": -9.088953018188477, "global_step": 79154, "epoch": 471} {"train_loss": -9.349523544311523, "global_step": 79155, "epoch": 471} {"train_loss": -9.041604995727539, "global_step": 79156, "epoch": 471} {"train_loss": -9.098657608032227, "global_step": 79157, "epoch": 471} {"train_loss": -9.241113662719727, "global_step": 79158, "epoch": 471} {"train_loss": -8.95884895324707, "global_step": 79159, "epoch": 471} {"train_loss": -9.403446197509766, "global_step": 79160, "epoch": 471} {"train_loss": -8.856111526489258, "global_step": 79161, "epoch": 471} {"train_loss": -9.23211669921875, "global_step": 79162, "epoch": 471} {"train_loss": -8.814038276672363, "global_step": 79163, "epoch": 471} {"train_loss": -8.669629096984863, "global_step": 79164, "epoch": 471} {"train_loss": -9.278701782226562, "global_step": 79165, "epoch": 471} {"train_loss": -8.79142951965332, "global_step": 79166, "epoch": 471} {"train_loss": -8.936063766479492, "global_step": 79167, "epoch": 471} {"train_loss": -8.86123275756836, "global_step": 79168, "epoch": 471} {"train_loss": -8.888171195983887, "global_step": 79169, "epoch": 471} {"train_loss": -8.809667587280273, "global_step": 79170, "epoch": 471} {"train_loss": -8.963944435119629, "global_step": 79171, "epoch": 471} {"train_loss": -8.94760799407959, "global_step": 79172, "epoch": 471} {"train_loss": -9.116910934448242, "global_step": 79173, "epoch": 471} {"train_loss": -8.892791748046875, "global_step": 79174, "epoch": 471} {"train_loss": -9.222084045410156, "global_step": 79175, "epoch": 471} {"train_loss": -8.929451942443848, "global_step": 79176, "epoch": 471} {"train_loss": -9.352058410644531, "global_step": 79177, "epoch": 471} {"train_loss": -9.04764461517334, "global_step": 79178, "epoch": 471} {"train_loss": -9.04977798461914, "global_step": 79179, "epoch": 471} {"train_loss": -9.081134796142578, "global_step": 79180, "epoch": 471} {"train_loss": -9.127326965332031, "global_step": 79181, "epoch": 471} {"train_loss": -8.9847412109375, "global_step": 79182, "epoch": 471} {"train_loss": -9.534692764282227, "global_step": 79183, "epoch": 471} {"train_loss": -9.002314567565918, "global_step": 79184, "epoch": 471} {"train_loss": -9.511476516723633, "global_step": 79185, "epoch": 471} {"train_loss": -9.393381118774414, "global_step": 79186, "epoch": 471} {"train_loss": -9.187061309814453, "global_step": 79187, "epoch": 471} {"train_loss": -9.194720268249512, "global_step": 79188, "epoch": 471} {"train_loss": -9.279626846313477, "global_step": 79189, "epoch": 471} {"train_loss": -9.032766342163086, "global_step": 79190, "epoch": 471} {"train_loss": -9.374945640563965, "global_step": 79191, "epoch": 471} {"train_loss": -9.356640815734863, "global_step": 79192, "epoch": 471} {"train_loss": -9.331997871398926, "global_step": 79193, "epoch": 471} {"train_loss": -9.302572250366211, "global_step": 79194, "epoch": 471} {"train_loss": -9.349605560302734, "global_step": 79195, "epoch": 471} {"train_loss": -9.299352645874023, "global_step": 79196, "epoch": 471} {"train_loss": -9.328608512878418, "global_step": 79197, "epoch": 471} {"train_loss": -9.095518112182617, "global_step": 79198, "epoch": 471} {"train_loss": -9.092419624328613, "global_step": 79199, "epoch": 471} {"train_loss": -9.14311695098877, "global_step": 79200, "epoch": 471} {"train_loss": -9.188704490661621, "global_step": 79201, "epoch": 471} {"train_loss": -9.207588195800781, "global_step": 79202, "epoch": 471} {"train_loss": -9.045629501342773, "global_step": 79203, "epoch": 471} {"train_loss": -9.31901741027832, "global_step": 79204, "epoch": 471} {"train_loss": -8.998465538024902, "global_step": 79205, "epoch": 471} {"train_loss": -9.307469367980957, "global_step": 79206, "epoch": 471} {"train_loss": -9.316052436828613, "global_step": 79207, "epoch": 471} {"train_loss": -9.050169944763184, "global_step": 79208, "epoch": 471} {"train_loss": -9.361105918884277, "global_step": 79209, "epoch": 471} {"train_loss": -9.101594924926758, "global_step": 79210, "epoch": 471} {"train_loss": -9.050954818725586, "global_step": 79211, "epoch": 471} {"train_loss": -9.011454582214355, "global_step": 79212, "epoch": 471} {"train_loss": -9.148931503295898, "global_step": 79213, "epoch": 471} {"train_loss": -8.953691482543945, "global_step": 79214, "epoch": 471} {"train_loss": -9.06631851196289, "global_step": 79215, "epoch": 471} {"train_loss": -9.381169319152832, "global_step": 79216, "epoch": 471} {"train_loss": -9.057588577270508, "global_step": 79217, "epoch": 471} {"train_loss": -9.0999755859375, "global_step": 79218, "epoch": 471} {"train_loss": -9.014176368713379, "global_step": 79219, "epoch": 471} {"train_loss": -9.445943832397461, "global_step": 79220, "epoch": 471} {"train_loss": -9.023554801940918, "global_step": 79221, "epoch": 471} {"train_loss": -8.973882675170898, "global_step": 79222, "epoch": 471} {"train_loss": -9.150476455688477, "global_step": 79223, "epoch": 471} {"train_loss": -9.551881790161133, "global_step": 79224, "epoch": 471} {"train_loss": -9.137922286987305, "global_step": 79225, "epoch": 471} {"train_loss": -9.348520278930664, "global_step": 79226, "epoch": 471} {"train_loss": -9.356273651123047, "global_step": 79227, "epoch": 471} {"train_loss": -8.862472534179688, "global_step": 79228, "epoch": 471} {"train_loss": -9.219257354736328, "global_step": 79229, "epoch": 471} {"train_loss": -8.980606079101562, "global_step": 79230, "epoch": 471} {"train_loss": -8.85612964630127, "global_step": 79231, "epoch": 471} {"train_loss": -8.916010856628418, "global_step": 79232, "epoch": 471} {"train_loss": -8.685365676879883, "global_step": 79233, "epoch": 471} {"train_loss": -8.74169921875, "global_step": 79234, "epoch": 471} {"train_loss": -8.778255462646484, "global_step": 79235, "epoch": 471} {"train_loss": -9.103515625, "global_step": 79236, "epoch": 471} {"train_loss": -8.877538681030273, "global_step": 79237, "epoch": 471} {"train_loss": -9.156241416931152, "global_step": 79238, "epoch": 471} {"train_loss": -8.93047046661377, "global_step": 79239, "epoch": 471} {"train_loss": -9.050013542175293, "global_step": 79240, "epoch": 471} {"train_loss": -8.979107856750488, "global_step": 79241, "epoch": 471} {"train_loss": -8.984437942504883, "global_step": 79242, "epoch": 471} {"train_loss": -8.822653770446777, "global_step": 79243, "epoch": 471} {"train_loss": -8.935215950012207, "global_step": 79244, "epoch": 471} {"train_loss": -8.966358184814453, "global_step": 79245, "epoch": 471} {"train_loss": -9.020490646362305, "global_step": 79246, "epoch": 471} {"train_loss": -8.925779342651367, "global_step": 79247, "epoch": 471} {"train_loss": -8.881080627441406, "global_step": 79248, "epoch": 471} {"train_loss": -9.15749740600586, "global_step": 79249, "epoch": 471} {"train_loss": -8.951973915100098, "global_step": 79250, "epoch": 471} {"train_loss": -9.107950210571289, "global_step": 79251, "epoch": 471} {"train_loss": -8.823084831237793, "global_step": 79252, "epoch": 471} {"train_loss": -9.099039077758789, "global_step": 79253, "epoch": 471} {"train_loss": -9.0812349319458, "global_step": 79254, "epoch": 471} {"train_loss": -9.306544303894043, "global_step": 79255, "epoch": 471} {"train_loss": -9.025854110717773, "global_step": 79256, "epoch": 471} {"train_loss": -9.166532516479492, "global_step": 79257, "epoch": 471} {"train_loss": -9.347719192504883, "global_step": 79258, "epoch": 471} {"train_loss": -9.018721580505371, "global_step": 79259, "epoch": 471} {"train_loss": -9.381425857543945, "global_step": 79260, "epoch": 471} {"train_loss": -9.456521034240723, "global_step": 79261, "epoch": 471} {"train_loss": -9.373785018920898, "global_step": 79262, "epoch": 471} {"train_loss": -9.076409339904785, "global_step": 79263, "epoch": 471} {"train_loss": -9.33798599243164, "global_step": 79264, "epoch": 471} {"train_loss": -9.00921630859375, "global_step": 79265, "epoch": 471} {"train_loss": -9.312658309936523, "global_step": 79266, "epoch": 471} {"train_loss": -9.080108642578125, "global_step": 79267, "epoch": 471} {"train_loss": -9.390547752380371, "global_step": 79268, "epoch": 471} {"train_loss": -9.082331657409668, "global_step": 79269, "epoch": 471} {"train_loss": -9.028318405151367, "global_step": 79270, "epoch": 471} {"train_loss": -9.093952178955078, "global_step": 79271, "epoch": 471} {"train_loss": -9.188993453979492, "global_step": 79272, "epoch": 471} {"train_loss": -9.09744644165039, "global_step": 79273, "epoch": 471} {"train_loss": -9.19219970703125, "global_step": 79274, "epoch": 471} {"train_loss": -9.376955032348633, "global_step": 79275, "epoch": 471} {"train_loss": -9.400239944458008, "global_step": 79276, "epoch": 471} {"train_loss": -9.446310997009277, "global_step": 79277, "epoch": 471} {"train_loss": -9.363813400268555, "global_step": 79278, "epoch": 471} {"train_loss": -9.572121620178223, "global_step": 79279, "epoch": 471} {"train_loss": -9.362678527832031, "global_step": 79280, "epoch": 471} {"train_loss": -9.339457511901855, "global_step": 79281, "epoch": 471} {"train_loss": -9.157227516174316, "global_step": 79282, "epoch": 471} {"train_loss": -9.305049896240234, "global_step": 79283, "epoch": 471} {"train_loss": -9.013781547546387, "global_step": 79284, "epoch": 471} {"train_loss": -9.305801391601562, "global_step": 79285, "epoch": 471} {"train_loss": -9.151430130004883, "global_step": 79286, "epoch": 471} {"train_loss": -9.142622947692871, "global_step": 79287, "epoch": 471} {"train_loss": -9.431722640991211, "global_step": 79288, "epoch": 471} {"train_loss": -9.026996612548828, "global_step": 79289, "epoch": 471} {"train_loss": -9.211771011352539, "global_step": 79290, "epoch": 471} {"train_loss": -9.213821411132812, "global_step": 79291, "epoch": 471} {"train_loss": -8.795075416564941, "global_step": 79292, "epoch": 471} {"train_loss": -9.185298919677734, "global_step": 79293, "epoch": 471} {"train_loss": -8.637388229370117, "global_step": 79294, "epoch": 471} {"train_loss": -9.118456443150839, "global_step": 79295, "epoch": 471, "val_loss": 196157.453125} {"train_loss": -8.604169845581055, "global_step": 79296, "epoch": 472} {"train_loss": -8.723828315734863, "global_step": 79297, "epoch": 472} {"train_loss": -8.627366065979004, "global_step": 79298, "epoch": 472} {"train_loss": -8.729219436645508, "global_step": 79299, "epoch": 472} {"train_loss": -8.914641380310059, "global_step": 79300, "epoch": 472} {"train_loss": -8.573792457580566, "global_step": 79301, "epoch": 472} {"train_loss": -8.508363723754883, "global_step": 79302, "epoch": 472} {"train_loss": -8.588268280029297, "global_step": 79303, "epoch": 472} {"train_loss": -8.443239212036133, "global_step": 79304, "epoch": 472} {"train_loss": -8.57961654663086, "global_step": 79305, "epoch": 472} {"train_loss": -8.7910795211792, "global_step": 79306, "epoch": 472} {"train_loss": -8.780734062194824, "global_step": 79307, "epoch": 472} {"train_loss": -8.850754737854004, "global_step": 79308, "epoch": 472} {"train_loss": -8.92911148071289, "global_step": 79309, "epoch": 472} {"train_loss": -8.853144645690918, "global_step": 79310, "epoch": 472} {"train_loss": -8.855313301086426, "global_step": 79311, "epoch": 472} {"train_loss": -8.713382720947266, "global_step": 79312, "epoch": 472} {"train_loss": -8.941946029663086, "global_step": 79313, "epoch": 472} {"train_loss": -8.97207260131836, "global_step": 79314, "epoch": 472} {"train_loss": -8.886245727539062, "global_step": 79315, "epoch": 472} {"train_loss": -8.72943115234375, "global_step": 79316, "epoch": 472} {"train_loss": -8.920246124267578, "global_step": 79317, "epoch": 472} {"train_loss": -9.072097778320312, "global_step": 79318, "epoch": 472} {"train_loss": -8.911470413208008, "global_step": 79319, "epoch": 472} {"train_loss": -9.053476333618164, "global_step": 79320, "epoch": 472} {"train_loss": -9.310333251953125, "global_step": 79321, "epoch": 472} {"train_loss": -9.138635635375977, "global_step": 79322, "epoch": 472} {"train_loss": -9.060456275939941, "global_step": 79323, "epoch": 472} {"train_loss": -9.171098709106445, "global_step": 79324, "epoch": 472} {"train_loss": -9.05129623413086, "global_step": 79325, "epoch": 472} {"train_loss": -8.901928901672363, "global_step": 79326, "epoch": 472} {"train_loss": -9.094560623168945, "global_step": 79327, "epoch": 472} {"train_loss": -9.416991233825684, "global_step": 79328, "epoch": 472} {"train_loss": -9.31134033203125, "global_step": 79329, "epoch": 472} {"train_loss": -9.065492630004883, "global_step": 79330, "epoch": 472} {"train_loss": -9.183433532714844, "global_step": 79331, "epoch": 472} {"train_loss": -9.21909236907959, "global_step": 79332, "epoch": 472} {"train_loss": -9.345209121704102, "global_step": 79333, "epoch": 472} {"train_loss": -9.250679969787598, "global_step": 79334, "epoch": 472} {"train_loss": -9.264076232910156, "global_step": 79335, "epoch": 472} {"train_loss": -9.362467765808105, "global_step": 79336, "epoch": 472} {"train_loss": -9.421327590942383, "global_step": 79337, "epoch": 472} {"train_loss": -9.511543273925781, "global_step": 79338, "epoch": 472} {"train_loss": -9.108743667602539, "global_step": 79339, "epoch": 472} {"train_loss": -9.42263126373291, "global_step": 79340, "epoch": 472} {"train_loss": -9.064988136291504, "global_step": 79341, "epoch": 472} {"train_loss": -9.343562126159668, "global_step": 79342, "epoch": 472} {"train_loss": -9.128538131713867, "global_step": 79343, "epoch": 472} {"train_loss": -8.94188404083252, "global_step": 79344, "epoch": 472} {"train_loss": -9.295324325561523, "global_step": 79345, "epoch": 472} {"train_loss": -8.98049545288086, "global_step": 79346, "epoch": 472} {"train_loss": -9.219606399536133, "global_step": 79347, "epoch": 472} {"train_loss": -9.038087844848633, "global_step": 79348, "epoch": 472} {"train_loss": -8.943421363830566, "global_step": 79349, "epoch": 472} {"train_loss": -9.170597076416016, "global_step": 79350, "epoch": 472} {"train_loss": -9.175199508666992, "global_step": 79351, "epoch": 472} {"train_loss": -9.161857604980469, "global_step": 79352, "epoch": 472} {"train_loss": -9.341727256774902, "global_step": 79353, "epoch": 472} {"train_loss": -9.213310241699219, "global_step": 79354, "epoch": 472} {"train_loss": -9.034201622009277, "global_step": 79355, "epoch": 472} {"train_loss": -9.218233108520508, "global_step": 79356, "epoch": 472} {"train_loss": -8.856640815734863, "global_step": 79357, "epoch": 472} {"train_loss": -9.197614669799805, "global_step": 79358, "epoch": 472} {"train_loss": -9.04128360748291, "global_step": 79359, "epoch": 472} {"train_loss": -8.853008270263672, "global_step": 79360, "epoch": 472} {"train_loss": -9.03752613067627, "global_step": 79361, "epoch": 472} {"train_loss": -9.02690601348877, "global_step": 79362, "epoch": 472} {"train_loss": -9.117424964904785, "global_step": 79363, "epoch": 472} {"train_loss": -9.242314338684082, "global_step": 79364, "epoch": 472} {"train_loss": -8.906192779541016, "global_step": 79365, "epoch": 472} {"train_loss": -9.12870979309082, "global_step": 79366, "epoch": 472} {"train_loss": -8.932779312133789, "global_step": 79367, "epoch": 472} {"train_loss": -8.895530700683594, "global_step": 79368, "epoch": 472} {"train_loss": -9.001141548156738, "global_step": 79369, "epoch": 472} {"train_loss": -8.982674598693848, "global_step": 79370, "epoch": 472} {"train_loss": -8.986164093017578, "global_step": 79371, "epoch": 472} {"train_loss": -9.237749099731445, "global_step": 79372, "epoch": 472} {"train_loss": -8.94444465637207, "global_step": 79373, "epoch": 472} {"train_loss": -9.10826301574707, "global_step": 79374, "epoch": 472} {"train_loss": -9.090636253356934, "global_step": 79375, "epoch": 472} {"train_loss": -8.952142715454102, "global_step": 79376, "epoch": 472} {"train_loss": -8.911393165588379, "global_step": 79377, "epoch": 472} {"train_loss": -9.17667293548584, "global_step": 79378, "epoch": 472} {"train_loss": -8.984914779663086, "global_step": 79379, "epoch": 472} {"train_loss": -9.090448379516602, "global_step": 79380, "epoch": 472} {"train_loss": -9.132225036621094, "global_step": 79381, "epoch": 472} {"train_loss": -9.056070327758789, "global_step": 79382, "epoch": 472} {"train_loss": -8.750718116760254, "global_step": 79383, "epoch": 472} {"train_loss": -9.14824104309082, "global_step": 79384, "epoch": 472} {"train_loss": -9.363895416259766, "global_step": 79385, "epoch": 472} {"train_loss": -9.18101692199707, "global_step": 79386, "epoch": 472} {"train_loss": -9.088926315307617, "global_step": 79387, "epoch": 472} {"train_loss": -9.133045196533203, "global_step": 79388, "epoch": 472} {"train_loss": -9.187768936157227, "global_step": 79389, "epoch": 472} {"train_loss": -9.18626594543457, "global_step": 79390, "epoch": 472} {"train_loss": -9.247209548950195, "global_step": 79391, "epoch": 472} {"train_loss": -9.239143371582031, "global_step": 79392, "epoch": 472} {"train_loss": -9.239392280578613, "global_step": 79393, "epoch": 472} {"train_loss": -9.306795120239258, "global_step": 79394, "epoch": 472} {"train_loss": -9.102693557739258, "global_step": 79395, "epoch": 472} {"train_loss": -9.46341323852539, "global_step": 79396, "epoch": 472} {"train_loss": -9.15713119506836, "global_step": 79397, "epoch": 472} {"train_loss": -9.22658634185791, "global_step": 79398, "epoch": 472} {"train_loss": -9.265119552612305, "global_step": 79399, "epoch": 472} {"train_loss": -9.444406509399414, "global_step": 79400, "epoch": 472} {"train_loss": -9.024269104003906, "global_step": 79401, "epoch": 472} {"train_loss": -9.2871732711792, "global_step": 79402, "epoch": 472} {"train_loss": -9.244330406188965, "global_step": 79403, "epoch": 472} {"train_loss": -9.245140075683594, "global_step": 79404, "epoch": 472} {"train_loss": -9.040689468383789, "global_step": 79405, "epoch": 472} {"train_loss": -9.354782104492188, "global_step": 79406, "epoch": 472} {"train_loss": -9.400196075439453, "global_step": 79407, "epoch": 472} {"train_loss": -9.17905330657959, "global_step": 79408, "epoch": 472} {"train_loss": -9.16336441040039, "global_step": 79409, "epoch": 472} {"train_loss": -9.464700698852539, "global_step": 79410, "epoch": 472} {"train_loss": -8.88790512084961, "global_step": 79411, "epoch": 472} {"train_loss": -9.044876098632812, "global_step": 79412, "epoch": 472} {"train_loss": -9.13977336883545, "global_step": 79413, "epoch": 472} {"train_loss": -9.166004180908203, "global_step": 79414, "epoch": 472} {"train_loss": -8.9695405960083, "global_step": 79415, "epoch": 472} {"train_loss": -9.155620574951172, "global_step": 79416, "epoch": 472} {"train_loss": -8.919103622436523, "global_step": 79417, "epoch": 472} {"train_loss": -9.285423278808594, "global_step": 79418, "epoch": 472} {"train_loss": -9.242208480834961, "global_step": 79419, "epoch": 472} {"train_loss": -9.37258529663086, "global_step": 79420, "epoch": 472} {"train_loss": -9.120052337646484, "global_step": 79421, "epoch": 472} {"train_loss": -9.033392906188965, "global_step": 79422, "epoch": 472} {"train_loss": -9.455835342407227, "global_step": 79423, "epoch": 472} {"train_loss": -9.302047729492188, "global_step": 79424, "epoch": 472} {"train_loss": -9.29139518737793, "global_step": 79425, "epoch": 472} {"train_loss": -9.244405746459961, "global_step": 79426, "epoch": 472} {"train_loss": -9.38658332824707, "global_step": 79427, "epoch": 472} {"train_loss": -9.421194076538086, "global_step": 79428, "epoch": 472} {"train_loss": -9.386383056640625, "global_step": 79429, "epoch": 472} {"train_loss": -9.197265625, "global_step": 79430, "epoch": 472} {"train_loss": -9.38537883758545, "global_step": 79431, "epoch": 472} {"train_loss": -8.69471263885498, "global_step": 79432, "epoch": 472} {"train_loss": -9.267738342285156, "global_step": 79433, "epoch": 472} {"train_loss": -8.856659889221191, "global_step": 79434, "epoch": 472} {"train_loss": -9.069260597229004, "global_step": 79435, "epoch": 472} {"train_loss": -8.651788711547852, "global_step": 79436, "epoch": 472} {"train_loss": -8.92082405090332, "global_step": 79437, "epoch": 472} {"train_loss": -9.230688095092773, "global_step": 79438, "epoch": 472} {"train_loss": -9.154878616333008, "global_step": 79439, "epoch": 472} {"train_loss": -9.25452995300293, "global_step": 79440, "epoch": 472} {"train_loss": -8.88387680053711, "global_step": 79441, "epoch": 472} {"train_loss": -9.179059982299805, "global_step": 79442, "epoch": 472} {"train_loss": -8.720848083496094, "global_step": 79443, "epoch": 472} {"train_loss": -9.194377899169922, "global_step": 79444, "epoch": 472} {"train_loss": -9.38936710357666, "global_step": 79445, "epoch": 472} {"train_loss": -9.079858779907227, "global_step": 79446, "epoch": 472} {"train_loss": -8.85505485534668, "global_step": 79447, "epoch": 472} {"train_loss": -9.138875007629395, "global_step": 79448, "epoch": 472} {"train_loss": -9.013251304626465, "global_step": 79449, "epoch": 472} {"train_loss": -8.775394439697266, "global_step": 79450, "epoch": 472} {"train_loss": -9.072678565979004, "global_step": 79451, "epoch": 472} {"train_loss": -8.9567289352417, "global_step": 79452, "epoch": 472} {"train_loss": -9.055805206298828, "global_step": 79453, "epoch": 472} {"train_loss": -9.06740951538086, "global_step": 79454, "epoch": 472} {"train_loss": -9.29430866241455, "global_step": 79455, "epoch": 472} {"train_loss": -9.274292945861816, "global_step": 79456, "epoch": 472} {"train_loss": -9.044334411621094, "global_step": 79457, "epoch": 472} {"train_loss": -9.33175277709961, "global_step": 79458, "epoch": 472} {"train_loss": -9.023077011108398, "global_step": 79459, "epoch": 472} {"train_loss": -9.334938049316406, "global_step": 79460, "epoch": 472} {"train_loss": -9.199385643005371, "global_step": 79461, "epoch": 472} {"train_loss": -9.175838470458984, "global_step": 79462, "epoch": 472} {"train_loss": -9.09115810053689, "global_step": 79463, "epoch": 472, "val_loss": 196921.78125} {"train_loss": -9.416705131530762, "global_step": 79464, "epoch": 473} {"train_loss": -9.328222274780273, "global_step": 79465, "epoch": 473} {"train_loss": -9.085855484008789, "global_step": 79466, "epoch": 473} {"train_loss": -9.3297119140625, "global_step": 79467, "epoch": 473} {"train_loss": -9.025287628173828, "global_step": 79468, "epoch": 473} {"train_loss": -8.919403076171875, "global_step": 79469, "epoch": 473} {"train_loss": -9.156957626342773, "global_step": 79470, "epoch": 473} {"train_loss": -9.260048866271973, "global_step": 79471, "epoch": 473} {"train_loss": -8.97335433959961, "global_step": 79472, "epoch": 473} {"train_loss": -9.03065299987793, "global_step": 79473, "epoch": 473} {"train_loss": -9.151618957519531, "global_step": 79474, "epoch": 473} {"train_loss": -9.268976211547852, "global_step": 79475, "epoch": 473} {"train_loss": -8.669920921325684, "global_step": 79476, "epoch": 473} {"train_loss": -9.249349594116211, "global_step": 79477, "epoch": 473} {"train_loss": -9.149934768676758, "global_step": 79478, "epoch": 473} {"train_loss": -8.910423278808594, "global_step": 79479, "epoch": 473} {"train_loss": -9.402725219726562, "global_step": 79480, "epoch": 473} {"train_loss": -9.261253356933594, "global_step": 79481, "epoch": 473} {"train_loss": -9.18632698059082, "global_step": 79482, "epoch": 473} {"train_loss": -9.258938789367676, "global_step": 79483, "epoch": 473} {"train_loss": -9.16751766204834, "global_step": 79484, "epoch": 473} {"train_loss": -9.18669319152832, "global_step": 79485, "epoch": 473} {"train_loss": -9.360652923583984, "global_step": 79486, "epoch": 473} {"train_loss": -9.175705909729004, "global_step": 79487, "epoch": 473} {"train_loss": -9.37114143371582, "global_step": 79488, "epoch": 473} {"train_loss": -9.43831729888916, "global_step": 79489, "epoch": 473} {"train_loss": -9.299409866333008, "global_step": 79490, "epoch": 473} {"train_loss": -9.165557861328125, "global_step": 79491, "epoch": 473} {"train_loss": -9.346171379089355, "global_step": 79492, "epoch": 473} {"train_loss": -9.15803337097168, "global_step": 79493, "epoch": 473} {"train_loss": -9.132148742675781, "global_step": 79494, "epoch": 473} {"train_loss": -9.249730110168457, "global_step": 79495, "epoch": 473} {"train_loss": -9.207075119018555, "global_step": 79496, "epoch": 473} {"train_loss": -9.109842300415039, "global_step": 79497, "epoch": 473} {"train_loss": -9.363872528076172, "global_step": 79498, "epoch": 473} {"train_loss": -9.13144302368164, "global_step": 79499, "epoch": 473} {"train_loss": -9.084495544433594, "global_step": 79500, "epoch": 473} {"train_loss": -9.247636795043945, "global_step": 79501, "epoch": 473} {"train_loss": -9.406547546386719, "global_step": 79502, "epoch": 473} {"train_loss": -9.325239181518555, "global_step": 79503, "epoch": 473} {"train_loss": -9.319826126098633, "global_step": 79504, "epoch": 473} {"train_loss": -9.417215347290039, "global_step": 79505, "epoch": 473} {"train_loss": -9.181293487548828, "global_step": 79506, "epoch": 473} {"train_loss": -9.319154739379883, "global_step": 79507, "epoch": 473} {"train_loss": -9.045135498046875, "global_step": 79508, "epoch": 473} {"train_loss": -9.285188674926758, "global_step": 79509, "epoch": 473} {"train_loss": -9.089081764221191, "global_step": 79510, "epoch": 473} {"train_loss": -9.416062355041504, "global_step": 79511, "epoch": 473} {"train_loss": -8.868792533874512, "global_step": 79512, "epoch": 473} {"train_loss": -9.293089866638184, "global_step": 79513, "epoch": 473} {"train_loss": -9.135385513305664, "global_step": 79514, "epoch": 473} {"train_loss": -9.190201759338379, "global_step": 79515, "epoch": 473} {"train_loss": -9.16126823425293, "global_step": 79516, "epoch": 473} {"train_loss": -9.439226150512695, "global_step": 79517, "epoch": 473} {"train_loss": -9.264920234680176, "global_step": 79518, "epoch": 473} {"train_loss": -9.203510284423828, "global_step": 79519, "epoch": 473} {"train_loss": -9.13651180267334, "global_step": 79520, "epoch": 473} {"train_loss": -9.394001960754395, "global_step": 79521, "epoch": 473} {"train_loss": -9.10055923461914, "global_step": 79522, "epoch": 473} {"train_loss": -9.339879989624023, "global_step": 79523, "epoch": 473} {"train_loss": -9.362349510192871, "global_step": 79524, "epoch": 473} {"train_loss": -9.20576000213623, "global_step": 79525, "epoch": 473} {"train_loss": -9.306449890136719, "global_step": 79526, "epoch": 473} {"train_loss": -9.069604873657227, "global_step": 79527, "epoch": 473} {"train_loss": -9.402120590209961, "global_step": 79528, "epoch": 473} {"train_loss": -9.156230926513672, "global_step": 79529, "epoch": 473} {"train_loss": -9.136012077331543, "global_step": 79530, "epoch": 473} {"train_loss": -9.447006225585938, "global_step": 79531, "epoch": 473} {"train_loss": -9.490839004516602, "global_step": 79532, "epoch": 473} {"train_loss": -9.269370079040527, "global_step": 79533, "epoch": 473} {"train_loss": -9.260053634643555, "global_step": 79534, "epoch": 473} {"train_loss": -9.31306266784668, "global_step": 79535, "epoch": 473} {"train_loss": -9.420967102050781, "global_step": 79536, "epoch": 473} {"train_loss": -9.463018417358398, "global_step": 79537, "epoch": 473} {"train_loss": -9.234643936157227, "global_step": 79538, "epoch": 473} {"train_loss": -9.075643539428711, "global_step": 79539, "epoch": 473} {"train_loss": -8.874624252319336, "global_step": 79540, "epoch": 473} {"train_loss": -9.173027038574219, "global_step": 79541, "epoch": 473} {"train_loss": -9.108129501342773, "global_step": 79542, "epoch": 473} {"train_loss": -9.166040420532227, "global_step": 79543, "epoch": 473} {"train_loss": -8.860637664794922, "global_step": 79544, "epoch": 473} {"train_loss": -9.170331001281738, "global_step": 79545, "epoch": 473} {"train_loss": -9.147979736328125, "global_step": 79546, "epoch": 473} {"train_loss": -9.111556053161621, "global_step": 79547, "epoch": 473} {"train_loss": -8.954015731811523, "global_step": 79548, "epoch": 473} {"train_loss": -9.290132522583008, "global_step": 79549, "epoch": 473} {"train_loss": -9.200254440307617, "global_step": 79550, "epoch": 473} {"train_loss": -8.82579231262207, "global_step": 79551, "epoch": 473} {"train_loss": -9.19818115234375, "global_step": 79552, "epoch": 473} {"train_loss": -8.923572540283203, "global_step": 79553, "epoch": 473} {"train_loss": -8.983814239501953, "global_step": 79554, "epoch": 473} {"train_loss": -8.988822937011719, "global_step": 79555, "epoch": 473} {"train_loss": -8.948562622070312, "global_step": 79556, "epoch": 473} {"train_loss": -8.848258018493652, "global_step": 79557, "epoch": 473} {"train_loss": -9.120372772216797, "global_step": 79558, "epoch": 473} {"train_loss": -9.332555770874023, "global_step": 79559, "epoch": 473} {"train_loss": -9.059189796447754, "global_step": 79560, "epoch": 473} {"train_loss": -9.085997581481934, "global_step": 79561, "epoch": 473} {"train_loss": -9.05606460571289, "global_step": 79562, "epoch": 473} {"train_loss": -9.090771675109863, "global_step": 79563, "epoch": 473} {"train_loss": -8.875274658203125, "global_step": 79564, "epoch": 473} {"train_loss": -9.110180854797363, "global_step": 79565, "epoch": 473} {"train_loss": -8.893659591674805, "global_step": 79566, "epoch": 473} {"train_loss": -8.985211372375488, "global_step": 79567, "epoch": 473} {"train_loss": -8.941681861877441, "global_step": 79568, "epoch": 473} {"train_loss": -8.998921394348145, "global_step": 79569, "epoch": 473} {"train_loss": -8.948299407958984, "global_step": 79570, "epoch": 473} {"train_loss": -8.878779411315918, "global_step": 79571, "epoch": 473} {"train_loss": -9.13209056854248, "global_step": 79572, "epoch": 473} {"train_loss": -8.591794967651367, "global_step": 79573, "epoch": 473} {"train_loss": -9.119932174682617, "global_step": 79574, "epoch": 473} {"train_loss": -9.04415512084961, "global_step": 79575, "epoch": 473} {"train_loss": -8.996339797973633, "global_step": 79576, "epoch": 473} {"train_loss": -8.799570083618164, "global_step": 79577, "epoch": 473} {"train_loss": -9.118927001953125, "global_step": 79578, "epoch": 473} {"train_loss": -9.155765533447266, "global_step": 79579, "epoch": 473} {"train_loss": -8.911603927612305, "global_step": 79580, "epoch": 473} {"train_loss": -9.24562931060791, "global_step": 79581, "epoch": 473} {"train_loss": -9.296728134155273, "global_step": 79582, "epoch": 473} {"train_loss": -9.431974411010742, "global_step": 79583, "epoch": 473} {"train_loss": -9.229562759399414, "global_step": 79584, "epoch": 473} {"train_loss": -9.29534912109375, "global_step": 79585, "epoch": 473} {"train_loss": -9.285135269165039, "global_step": 79586, "epoch": 473} {"train_loss": -9.09567642211914, "global_step": 79587, "epoch": 473} {"train_loss": -9.284022331237793, "global_step": 79588, "epoch": 473} {"train_loss": -9.176013946533203, "global_step": 79589, "epoch": 473} {"train_loss": -9.383840560913086, "global_step": 79590, "epoch": 473} {"train_loss": -9.386014938354492, "global_step": 79591, "epoch": 473} {"train_loss": -9.16745376586914, "global_step": 79592, "epoch": 473} {"train_loss": -9.152678489685059, "global_step": 79593, "epoch": 473} {"train_loss": -9.18350601196289, "global_step": 79594, "epoch": 473} {"train_loss": -9.059284210205078, "global_step": 79595, "epoch": 473} {"train_loss": -9.146669387817383, "global_step": 79596, "epoch": 473} {"train_loss": -9.442238807678223, "global_step": 79597, "epoch": 473} {"train_loss": -9.037213325500488, "global_step": 79598, "epoch": 473} {"train_loss": -9.179535865783691, "global_step": 79599, "epoch": 473} {"train_loss": -9.18394947052002, "global_step": 79600, "epoch": 473} {"train_loss": -8.827864646911621, "global_step": 79601, "epoch": 473} {"train_loss": -9.200607299804688, "global_step": 79602, "epoch": 473} {"train_loss": -9.184913635253906, "global_step": 79603, "epoch": 473} {"train_loss": -9.231921195983887, "global_step": 79604, "epoch": 473} {"train_loss": -9.330764770507812, "global_step": 79605, "epoch": 473} {"train_loss": -9.055780410766602, "global_step": 79606, "epoch": 473} {"train_loss": -9.13167953491211, "global_step": 79607, "epoch": 473} {"train_loss": -9.1785249710083, "global_step": 79608, "epoch": 473} {"train_loss": -9.274195671081543, "global_step": 79609, "epoch": 473} {"train_loss": -9.271194458007812, "global_step": 79610, "epoch": 473} {"train_loss": -8.92558479309082, "global_step": 79611, "epoch": 473} {"train_loss": -9.330331802368164, "global_step": 79612, "epoch": 473} {"train_loss": -9.007308959960938, "global_step": 79613, "epoch": 473} {"train_loss": -9.148056983947754, "global_step": 79614, "epoch": 473} {"train_loss": -9.059823989868164, "global_step": 79615, "epoch": 473} {"train_loss": -9.016317367553711, "global_step": 79616, "epoch": 473} {"train_loss": -8.864588737487793, "global_step": 79617, "epoch": 473} {"train_loss": -8.782232284545898, "global_step": 79618, "epoch": 473} {"train_loss": -8.852848052978516, "global_step": 79619, "epoch": 473} {"train_loss": -8.550970077514648, "global_step": 79620, "epoch": 473} {"train_loss": -9.141424179077148, "global_step": 79621, "epoch": 473} {"train_loss": -8.587991714477539, "global_step": 79622, "epoch": 473} {"train_loss": -9.197473526000977, "global_step": 79623, "epoch": 473} {"train_loss": -8.815937995910645, "global_step": 79624, "epoch": 473} {"train_loss": -8.791411399841309, "global_step": 79625, "epoch": 473} {"train_loss": -9.023500442504883, "global_step": 79626, "epoch": 473} {"train_loss": -8.868447303771973, "global_step": 79627, "epoch": 473} {"train_loss": -9.12353801727295, "global_step": 79628, "epoch": 473} {"train_loss": -9.04698371887207, "global_step": 79629, "epoch": 473} {"train_loss": -8.962905883789062, "global_step": 79630, "epoch": 473} {"train_loss": -9.141512910525003, "global_step": 79631, "epoch": 473, "val_loss": 198087.4375} {"train_loss": -9.164311408996582, "global_step": 79632, "epoch": 474} {"train_loss": -9.081274032592773, "global_step": 79633, "epoch": 474} {"train_loss": -9.361991882324219, "global_step": 79634, "epoch": 474} {"train_loss": -9.443450927734375, "global_step": 79635, "epoch": 474} {"train_loss": -9.212933540344238, "global_step": 79636, "epoch": 474} {"train_loss": -9.229829788208008, "global_step": 79637, "epoch": 474} {"train_loss": -9.056514739990234, "global_step": 79638, "epoch": 474} {"train_loss": -9.362602233886719, "global_step": 79639, "epoch": 474} {"train_loss": -9.096700668334961, "global_step": 79640, "epoch": 474} {"train_loss": -9.09576416015625, "global_step": 79641, "epoch": 474} {"train_loss": -9.45534896850586, "global_step": 79642, "epoch": 474} {"train_loss": -9.285839080810547, "global_step": 79643, "epoch": 474} {"train_loss": -9.231430053710938, "global_step": 79644, "epoch": 474} {"train_loss": -9.194503784179688, "global_step": 79645, "epoch": 474} {"train_loss": -9.231294631958008, "global_step": 79646, "epoch": 474} {"train_loss": -9.299520492553711, "global_step": 79647, "epoch": 474} {"train_loss": -9.249195098876953, "global_step": 79648, "epoch": 474} {"train_loss": -9.389444351196289, "global_step": 79649, "epoch": 474} {"train_loss": -9.485261917114258, "global_step": 79650, "epoch": 474} {"train_loss": -9.205087661743164, "global_step": 79651, "epoch": 474} {"train_loss": -9.220149993896484, "global_step": 79652, "epoch": 474} {"train_loss": -9.485200881958008, "global_step": 79653, "epoch": 474} {"train_loss": -9.07669448852539, "global_step": 79654, "epoch": 474} {"train_loss": -9.368361473083496, "global_step": 79655, "epoch": 474} {"train_loss": -9.123491287231445, "global_step": 79656, "epoch": 474} {"train_loss": -9.206498146057129, "global_step": 79657, "epoch": 474} {"train_loss": -9.37933349609375, "global_step": 79658, "epoch": 474} {"train_loss": -9.38379955291748, "global_step": 79659, "epoch": 474} {"train_loss": -9.33993911743164, "global_step": 79660, "epoch": 474} {"train_loss": -9.487062454223633, "global_step": 79661, "epoch": 474} {"train_loss": -9.220869064331055, "global_step": 79662, "epoch": 474} {"train_loss": -9.588562965393066, "global_step": 79663, "epoch": 474} {"train_loss": -9.341700553894043, "global_step": 79664, "epoch": 474} {"train_loss": -9.12663459777832, "global_step": 79665, "epoch": 474} {"train_loss": -9.27231216430664, "global_step": 79666, "epoch": 474} {"train_loss": -9.040773391723633, "global_step": 79667, "epoch": 474} {"train_loss": -9.134674072265625, "global_step": 79668, "epoch": 474} {"train_loss": -8.941886901855469, "global_step": 79669, "epoch": 474} {"train_loss": -8.9811372756958, "global_step": 79670, "epoch": 474} {"train_loss": -8.683481216430664, "global_step": 79671, "epoch": 474} {"train_loss": -8.645877838134766, "global_step": 79672, "epoch": 474} {"train_loss": -8.901692390441895, "global_step": 79673, "epoch": 474} {"train_loss": -8.348555564880371, "global_step": 79674, "epoch": 474} {"train_loss": -8.820884704589844, "global_step": 79675, "epoch": 474} {"train_loss": -8.993231773376465, "global_step": 79676, "epoch": 474} {"train_loss": -8.490289688110352, "global_step": 79677, "epoch": 474} {"train_loss": -8.902168273925781, "global_step": 79678, "epoch": 474} {"train_loss": -8.803759574890137, "global_step": 79679, "epoch": 474} {"train_loss": -8.629937171936035, "global_step": 79680, "epoch": 474} {"train_loss": -8.850889205932617, "global_step": 79681, "epoch": 474} {"train_loss": -8.795814514160156, "global_step": 79682, "epoch": 474} {"train_loss": -8.9525146484375, "global_step": 79683, "epoch": 474} {"train_loss": -8.803281784057617, "global_step": 79684, "epoch": 474} {"train_loss": -9.01640510559082, "global_step": 79685, "epoch": 474} {"train_loss": -9.00204849243164, "global_step": 79686, "epoch": 474} {"train_loss": -8.827299118041992, "global_step": 79687, "epoch": 474} {"train_loss": -9.342789649963379, "global_step": 79688, "epoch": 474} {"train_loss": -8.697242736816406, "global_step": 79689, "epoch": 474} {"train_loss": -8.875347137451172, "global_step": 79690, "epoch": 474} {"train_loss": -9.071512222290039, "global_step": 79691, "epoch": 474} {"train_loss": -8.919788360595703, "global_step": 79692, "epoch": 474} {"train_loss": -9.058887481689453, "global_step": 79693, "epoch": 474} {"train_loss": -9.23264217376709, "global_step": 79694, "epoch": 474} {"train_loss": -9.040966033935547, "global_step": 79695, "epoch": 474} {"train_loss": -9.23193359375, "global_step": 79696, "epoch": 474} {"train_loss": -9.181305885314941, "global_step": 79697, "epoch": 474} {"train_loss": -9.102285385131836, "global_step": 79698, "epoch": 474} {"train_loss": -9.342933654785156, "global_step": 79699, "epoch": 474} {"train_loss": -9.22219181060791, "global_step": 79700, "epoch": 474} {"train_loss": -9.222719192504883, "global_step": 79701, "epoch": 474} {"train_loss": -9.350541114807129, "global_step": 79702, "epoch": 474} {"train_loss": -9.312668800354004, "global_step": 79703, "epoch": 474} {"train_loss": -9.151312828063965, "global_step": 79704, "epoch": 474} {"train_loss": -9.261310577392578, "global_step": 79705, "epoch": 474} {"train_loss": -9.375788688659668, "global_step": 79706, "epoch": 474} {"train_loss": -8.947488784790039, "global_step": 79707, "epoch": 474} {"train_loss": -9.228981018066406, "global_step": 79708, "epoch": 474} {"train_loss": -9.298393249511719, "global_step": 79709, "epoch": 474} {"train_loss": -9.320552825927734, "global_step": 79710, "epoch": 474} {"train_loss": -9.35489559173584, "global_step": 79711, "epoch": 474} {"train_loss": -9.407926559448242, "global_step": 79712, "epoch": 474} {"train_loss": -9.392961502075195, "global_step": 79713, "epoch": 474} {"train_loss": -9.346353530883789, "global_step": 79714, "epoch": 474} {"train_loss": -9.105424880981445, "global_step": 79715, "epoch": 474} {"train_loss": -9.454952239990234, "global_step": 79716, "epoch": 474} {"train_loss": -9.035909652709961, "global_step": 79717, "epoch": 474} {"train_loss": -9.199819564819336, "global_step": 79718, "epoch": 474} {"train_loss": -9.214049339294434, "global_step": 79719, "epoch": 474} {"train_loss": -9.044910430908203, "global_step": 79720, "epoch": 474} {"train_loss": -8.791085243225098, "global_step": 79721, "epoch": 474} {"train_loss": -9.128559112548828, "global_step": 79722, "epoch": 474} {"train_loss": -9.053030014038086, "global_step": 79723, "epoch": 474} {"train_loss": -9.146245956420898, "global_step": 79724, "epoch": 474} {"train_loss": -8.78790283203125, "global_step": 79725, "epoch": 474} {"train_loss": -9.138269424438477, "global_step": 79726, "epoch": 474} {"train_loss": -8.875492095947266, "global_step": 79727, "epoch": 474} {"train_loss": -9.096479415893555, "global_step": 79728, "epoch": 474} {"train_loss": -9.248876571655273, "global_step": 79729, "epoch": 474} {"train_loss": -9.078615188598633, "global_step": 79730, "epoch": 474} {"train_loss": -9.153420448303223, "global_step": 79731, "epoch": 474} {"train_loss": -8.78529167175293, "global_step": 79732, "epoch": 474} {"train_loss": -9.129847526550293, "global_step": 79733, "epoch": 474} {"train_loss": -9.043083190917969, "global_step": 79734, "epoch": 474} {"train_loss": -9.03934383392334, "global_step": 79735, "epoch": 474} {"train_loss": -8.782308578491211, "global_step": 79736, "epoch": 474} {"train_loss": -9.066814422607422, "global_step": 79737, "epoch": 474} {"train_loss": -9.116409301757812, "global_step": 79738, "epoch": 474} {"train_loss": -9.222890853881836, "global_step": 79739, "epoch": 474} {"train_loss": -9.108415603637695, "global_step": 79740, "epoch": 474} {"train_loss": -9.337018966674805, "global_step": 79741, "epoch": 474} {"train_loss": -9.025405883789062, "global_step": 79742, "epoch": 474} {"train_loss": -8.64578628540039, "global_step": 79743, "epoch": 474} {"train_loss": -9.229161262512207, "global_step": 79744, "epoch": 474} {"train_loss": -9.030247688293457, "global_step": 79745, "epoch": 474} {"train_loss": -9.233722686767578, "global_step": 79746, "epoch": 474} {"train_loss": -9.17132568359375, "global_step": 79747, "epoch": 474} {"train_loss": -9.238734245300293, "global_step": 79748, "epoch": 474} {"train_loss": -9.274742126464844, "global_step": 79749, "epoch": 474} {"train_loss": -9.280023574829102, "global_step": 79750, "epoch": 474} {"train_loss": -9.419257164001465, "global_step": 79751, "epoch": 474} {"train_loss": -9.017894744873047, "global_step": 79752, "epoch": 474} {"train_loss": -8.89593505859375, "global_step": 79753, "epoch": 474} {"train_loss": -9.093965530395508, "global_step": 79754, "epoch": 474} {"train_loss": -9.410028457641602, "global_step": 79755, "epoch": 474} {"train_loss": -9.11610221862793, "global_step": 79756, "epoch": 474} {"train_loss": -9.105393409729004, "global_step": 79757, "epoch": 474} {"train_loss": -8.841315269470215, "global_step": 79758, "epoch": 474} {"train_loss": -9.362200736999512, "global_step": 79759, "epoch": 474} {"train_loss": -8.552942276000977, "global_step": 79760, "epoch": 474} {"train_loss": -9.58542251586914, "global_step": 79761, "epoch": 474} {"train_loss": -8.735251426696777, "global_step": 79762, "epoch": 474} {"train_loss": -9.182428359985352, "global_step": 79763, "epoch": 474} {"train_loss": -8.871978759765625, "global_step": 79764, "epoch": 474} {"train_loss": -9.282024383544922, "global_step": 79765, "epoch": 474} {"train_loss": -9.040348052978516, "global_step": 79766, "epoch": 474} {"train_loss": -9.108621597290039, "global_step": 79767, "epoch": 474} {"train_loss": -9.019285202026367, "global_step": 79768, "epoch": 474} {"train_loss": -9.15134048461914, "global_step": 79769, "epoch": 474} {"train_loss": -8.962259292602539, "global_step": 79770, "epoch": 474} {"train_loss": -9.164007186889648, "global_step": 79771, "epoch": 474} {"train_loss": -9.050088882446289, "global_step": 79772, "epoch": 474} {"train_loss": -9.035555839538574, "global_step": 79773, "epoch": 474} {"train_loss": -9.261996269226074, "global_step": 79774, "epoch": 474} {"train_loss": -8.772491455078125, "global_step": 79775, "epoch": 474} {"train_loss": -9.147677421569824, "global_step": 79776, "epoch": 474} {"train_loss": -9.184062957763672, "global_step": 79777, "epoch": 474} {"train_loss": -9.035789489746094, "global_step": 79778, "epoch": 474} {"train_loss": -8.930644035339355, "global_step": 79779, "epoch": 474} {"train_loss": -9.290679931640625, "global_step": 79780, "epoch": 474} {"train_loss": -9.173100471496582, "global_step": 79781, "epoch": 474} {"train_loss": -9.20648193359375, "global_step": 79782, "epoch": 474} {"train_loss": -9.020671844482422, "global_step": 79783, "epoch": 474} {"train_loss": -9.245532989501953, "global_step": 79784, "epoch": 474} {"train_loss": -9.186603546142578, "global_step": 79785, "epoch": 474} {"train_loss": -9.38365650177002, "global_step": 79786, "epoch": 474} {"train_loss": -9.368959426879883, "global_step": 79787, "epoch": 474} {"train_loss": -9.358417510986328, "global_step": 79788, "epoch": 474} {"train_loss": -9.29095458984375, "global_step": 79789, "epoch": 474} {"train_loss": -9.340850830078125, "global_step": 79790, "epoch": 474} {"train_loss": -9.060746192932129, "global_step": 79791, "epoch": 474} {"train_loss": -9.135337829589844, "global_step": 79792, "epoch": 474} {"train_loss": -9.287853240966797, "global_step": 79793, "epoch": 474} {"train_loss": -9.052035331726074, "global_step": 79794, "epoch": 474} {"train_loss": -9.283212661743164, "global_step": 79795, "epoch": 474} {"train_loss": -9.11962890625, "global_step": 79796, "epoch": 474} {"train_loss": -9.293889045715332, "global_step": 79797, "epoch": 474} {"train_loss": -9.320712089538574, "global_step": 79798, "epoch": 474} {"train_loss": -9.12732830501738, "global_step": 79799, "epoch": 474, "val_loss": 196263.203125} {"train_loss": -9.284679412841797, "global_step": 79800, "epoch": 475} {"train_loss": -9.041126251220703, "global_step": 79801, "epoch": 475} {"train_loss": -9.286438941955566, "global_step": 79802, "epoch": 475} {"train_loss": -9.27429485321045, "global_step": 79803, "epoch": 475} {"train_loss": -9.256797790527344, "global_step": 79804, "epoch": 475} {"train_loss": -8.897351264953613, "global_step": 79805, "epoch": 475} {"train_loss": -9.155925750732422, "global_step": 79806, "epoch": 475} {"train_loss": -9.124582290649414, "global_step": 79807, "epoch": 475} {"train_loss": -9.24160385131836, "global_step": 79808, "epoch": 475} {"train_loss": -9.276607513427734, "global_step": 79809, "epoch": 475} {"train_loss": -9.049519538879395, "global_step": 79810, "epoch": 475} {"train_loss": -9.286919593811035, "global_step": 79811, "epoch": 475} {"train_loss": -9.358951568603516, "global_step": 79812, "epoch": 475} {"train_loss": -9.38386344909668, "global_step": 79813, "epoch": 475} {"train_loss": -9.259878158569336, "global_step": 79814, "epoch": 475} {"train_loss": -8.998586654663086, "global_step": 79815, "epoch": 475} {"train_loss": -9.158916473388672, "global_step": 79816, "epoch": 475} {"train_loss": -9.272122383117676, "global_step": 79817, "epoch": 475} {"train_loss": -9.125544548034668, "global_step": 79818, "epoch": 475} {"train_loss": -9.278697967529297, "global_step": 79819, "epoch": 475} {"train_loss": -9.395791053771973, "global_step": 79820, "epoch": 475} {"train_loss": -9.163818359375, "global_step": 79821, "epoch": 475} {"train_loss": -9.47148609161377, "global_step": 79822, "epoch": 475} {"train_loss": -9.26024341583252, "global_step": 79823, "epoch": 475} {"train_loss": -9.227279663085938, "global_step": 79824, "epoch": 475} {"train_loss": -9.176029205322266, "global_step": 79825, "epoch": 475} {"train_loss": -8.933368682861328, "global_step": 79826, "epoch": 475} {"train_loss": -9.604780197143555, "global_step": 79827, "epoch": 475} {"train_loss": -9.067811012268066, "global_step": 79828, "epoch": 475} {"train_loss": -9.40266227722168, "global_step": 79829, "epoch": 475} {"train_loss": -9.341178894042969, "global_step": 79830, "epoch": 475} {"train_loss": -8.993066787719727, "global_step": 79831, "epoch": 475} {"train_loss": -9.157746315002441, "global_step": 79832, "epoch": 475} {"train_loss": -9.290307998657227, "global_step": 79833, "epoch": 475} {"train_loss": -8.898017883300781, "global_step": 79834, "epoch": 475} {"train_loss": -9.146319389343262, "global_step": 79835, "epoch": 475} {"train_loss": -9.116512298583984, "global_step": 79836, "epoch": 475} {"train_loss": -8.813700675964355, "global_step": 79837, "epoch": 475} {"train_loss": -9.062919616699219, "global_step": 79838, "epoch": 475} {"train_loss": -9.231698989868164, "global_step": 79839, "epoch": 475} {"train_loss": -9.220492362976074, "global_step": 79840, "epoch": 475} {"train_loss": -8.959071159362793, "global_step": 79841, "epoch": 475} {"train_loss": -9.339150428771973, "global_step": 79842, "epoch": 475} {"train_loss": -8.954397201538086, "global_step": 79843, "epoch": 475} {"train_loss": -9.01797103881836, "global_step": 79844, "epoch": 475} {"train_loss": -9.12877082824707, "global_step": 79845, "epoch": 475} {"train_loss": -8.793781280517578, "global_step": 79846, "epoch": 475} {"train_loss": -8.997997283935547, "global_step": 79847, "epoch": 475} {"train_loss": -8.6617431640625, "global_step": 79848, "epoch": 475} {"train_loss": -9.147518157958984, "global_step": 79849, "epoch": 475} {"train_loss": -8.943483352661133, "global_step": 79850, "epoch": 475} {"train_loss": -8.867996215820312, "global_step": 79851, "epoch": 475} {"train_loss": -8.9287691116333, "global_step": 79852, "epoch": 475} {"train_loss": -8.98866081237793, "global_step": 79853, "epoch": 475} {"train_loss": -9.139883995056152, "global_step": 79854, "epoch": 475} {"train_loss": -8.932901382446289, "global_step": 79855, "epoch": 475} {"train_loss": -9.087664604187012, "global_step": 79856, "epoch": 475} {"train_loss": -8.971689224243164, "global_step": 79857, "epoch": 475} {"train_loss": -8.724020004272461, "global_step": 79858, "epoch": 475} {"train_loss": -9.019639015197754, "global_step": 79859, "epoch": 475} {"train_loss": -9.096515655517578, "global_step": 79860, "epoch": 475} {"train_loss": -9.054914474487305, "global_step": 79861, "epoch": 475} {"train_loss": -8.951009750366211, "global_step": 79862, "epoch": 475} {"train_loss": -9.095458984375, "global_step": 79863, "epoch": 475} {"train_loss": -9.056741714477539, "global_step": 79864, "epoch": 475} {"train_loss": -9.051990509033203, "global_step": 79865, "epoch": 475} {"train_loss": -8.90103530883789, "global_step": 79866, "epoch": 475} {"train_loss": -8.900497436523438, "global_step": 79867, "epoch": 475} {"train_loss": -9.154820442199707, "global_step": 79868, "epoch": 475} {"train_loss": -9.260522842407227, "global_step": 79869, "epoch": 475} {"train_loss": -9.185264587402344, "global_step": 79870, "epoch": 475} {"train_loss": -9.121848106384277, "global_step": 79871, "epoch": 475} {"train_loss": -9.167230606079102, "global_step": 79872, "epoch": 475} {"train_loss": -9.368492126464844, "global_step": 79873, "epoch": 475} {"train_loss": -9.300716400146484, "global_step": 79874, "epoch": 475} {"train_loss": -9.19739818572998, "global_step": 79875, "epoch": 475} {"train_loss": -9.308215141296387, "global_step": 79876, "epoch": 475} {"train_loss": -9.215717315673828, "global_step": 79877, "epoch": 475} {"train_loss": -9.50405502319336, "global_step": 79878, "epoch": 475} {"train_loss": -9.420928001403809, "global_step": 79879, "epoch": 475} {"train_loss": -9.517393112182617, "global_step": 79880, "epoch": 475} {"train_loss": -9.156730651855469, "global_step": 79881, "epoch": 475} {"train_loss": -9.351896286010742, "global_step": 79882, "epoch": 475} {"train_loss": -9.016830444335938, "global_step": 79883, "epoch": 475} {"train_loss": -9.425037384033203, "global_step": 79884, "epoch": 475} {"train_loss": -9.54897689819336, "global_step": 79885, "epoch": 475} {"train_loss": -9.520990371704102, "global_step": 79886, "epoch": 475} {"train_loss": -9.273492813110352, "global_step": 79887, "epoch": 475} {"train_loss": -9.393135070800781, "global_step": 79888, "epoch": 475} {"train_loss": -9.518610000610352, "global_step": 79889, "epoch": 475} {"train_loss": -9.429281234741211, "global_step": 79890, "epoch": 475} {"train_loss": -9.389250755310059, "global_step": 79891, "epoch": 475} {"train_loss": -9.284912109375, "global_step": 79892, "epoch": 475} {"train_loss": -9.3053560256958, "global_step": 79893, "epoch": 475} {"train_loss": -9.063251495361328, "global_step": 79894, "epoch": 475} {"train_loss": -9.299629211425781, "global_step": 79895, "epoch": 475} {"train_loss": -9.53492259979248, "global_step": 79896, "epoch": 475} {"train_loss": -9.251607894897461, "global_step": 79897, "epoch": 475} {"train_loss": -8.93341064453125, "global_step": 79898, "epoch": 475} {"train_loss": -9.117982864379883, "global_step": 79899, "epoch": 475} {"train_loss": -9.0535306930542, "global_step": 79900, "epoch": 475} {"train_loss": -8.713410377502441, "global_step": 79901, "epoch": 475} {"train_loss": -9.277978897094727, "global_step": 79902, "epoch": 475} {"train_loss": -8.928434371948242, "global_step": 79903, "epoch": 475} {"train_loss": -9.425543785095215, "global_step": 79904, "epoch": 475} {"train_loss": -8.855133056640625, "global_step": 79905, "epoch": 475} {"train_loss": -9.170087814331055, "global_step": 79906, "epoch": 475} {"train_loss": -9.021710395812988, "global_step": 79907, "epoch": 475} {"train_loss": -9.123831748962402, "global_step": 79908, "epoch": 475} {"train_loss": -9.152153015136719, "global_step": 79909, "epoch": 475} {"train_loss": -9.071739196777344, "global_step": 79910, "epoch": 475} {"train_loss": -9.354073524475098, "global_step": 79911, "epoch": 475} {"train_loss": -9.293622970581055, "global_step": 79912, "epoch": 475} {"train_loss": -9.019855499267578, "global_step": 79913, "epoch": 475} {"train_loss": -9.287271499633789, "global_step": 79914, "epoch": 475} {"train_loss": -9.316707611083984, "global_step": 79915, "epoch": 475} {"train_loss": -9.119494438171387, "global_step": 79916, "epoch": 475} {"train_loss": -9.240671157836914, "global_step": 79917, "epoch": 475} {"train_loss": -9.438423156738281, "global_step": 79918, "epoch": 475} {"train_loss": -9.08420181274414, "global_step": 79919, "epoch": 475} {"train_loss": -9.220818519592285, "global_step": 79920, "epoch": 475} {"train_loss": -9.197028160095215, "global_step": 79921, "epoch": 475} {"train_loss": -9.426530838012695, "global_step": 79922, "epoch": 475} {"train_loss": -9.379552841186523, "global_step": 79923, "epoch": 475} {"train_loss": -9.10694694519043, "global_step": 79924, "epoch": 475} {"train_loss": -9.242698669433594, "global_step": 79925, "epoch": 475} {"train_loss": -9.324161529541016, "global_step": 79926, "epoch": 475} {"train_loss": -9.30295467376709, "global_step": 79927, "epoch": 475} {"train_loss": -9.215493202209473, "global_step": 79928, "epoch": 475} {"train_loss": -8.982772827148438, "global_step": 79929, "epoch": 475} {"train_loss": -9.222713470458984, "global_step": 79930, "epoch": 475} {"train_loss": -9.244077682495117, "global_step": 79931, "epoch": 475} {"train_loss": -9.113901138305664, "global_step": 79932, "epoch": 475} {"train_loss": -9.226705551147461, "global_step": 79933, "epoch": 475} {"train_loss": -9.187273025512695, "global_step": 79934, "epoch": 475} {"train_loss": -8.944413185119629, "global_step": 79935, "epoch": 475} {"train_loss": -9.260298728942871, "global_step": 79936, "epoch": 475} {"train_loss": -9.143439292907715, "global_step": 79937, "epoch": 475} {"train_loss": -9.293952941894531, "global_step": 79938, "epoch": 475} {"train_loss": -8.931869506835938, "global_step": 79939, "epoch": 475} {"train_loss": -9.187889099121094, "global_step": 79940, "epoch": 475} {"train_loss": -9.081005096435547, "global_step": 79941, "epoch": 475} {"train_loss": -8.86992359161377, "global_step": 79942, "epoch": 475} {"train_loss": -9.236656188964844, "global_step": 79943, "epoch": 475} {"train_loss": -9.133881568908691, "global_step": 79944, "epoch": 475} {"train_loss": -8.95972728729248, "global_step": 79945, "epoch": 475} {"train_loss": -9.240480422973633, "global_step": 79946, "epoch": 475} {"train_loss": -9.196101188659668, "global_step": 79947, "epoch": 475} {"train_loss": -9.303529739379883, "global_step": 79948, "epoch": 475} {"train_loss": -9.084575653076172, "global_step": 79949, "epoch": 475} {"train_loss": -9.22804069519043, "global_step": 79950, "epoch": 475} {"train_loss": -9.343152046203613, "global_step": 79951, "epoch": 475} {"train_loss": -9.129217147827148, "global_step": 79952, "epoch": 475} {"train_loss": -9.240579605102539, "global_step": 79953, "epoch": 475} {"train_loss": -9.102190017700195, "global_step": 79954, "epoch": 475} {"train_loss": -9.209214210510254, "global_step": 79955, "epoch": 475} {"train_loss": -9.37703800201416, "global_step": 79956, "epoch": 475} {"train_loss": -9.173924446105957, "global_step": 79957, "epoch": 475} {"train_loss": -9.254024505615234, "global_step": 79958, "epoch": 475} {"train_loss": -9.134225845336914, "global_step": 79959, "epoch": 475} {"train_loss": -9.280314445495605, "global_step": 79960, "epoch": 475} {"train_loss": -9.371084213256836, "global_step": 79961, "epoch": 475} {"train_loss": -9.270227432250977, "global_step": 79962, "epoch": 475} {"train_loss": -8.908676147460938, "global_step": 79963, "epoch": 475} {"train_loss": -9.002395629882812, "global_step": 79964, "epoch": 475} {"train_loss": -8.839174270629883, "global_step": 79965, "epoch": 475} {"train_loss": -9.335403442382812, "global_step": 79966, "epoch": 475} {"train_loss": -9.168189957028343, "global_step": 79967, "epoch": 475, "val_loss": 195712.421875, "train_action_mse_error": 2.479840040206909} {"train_loss": -8.984209060668945, "global_step": 79968, "epoch": 476} {"train_loss": -9.270600318908691, "global_step": 79969, "epoch": 476} {"train_loss": -9.262115478515625, "global_step": 79970, "epoch": 476} {"train_loss": -9.056729316711426, "global_step": 79971, "epoch": 476} {"train_loss": -9.128329277038574, "global_step": 79972, "epoch": 476} {"train_loss": -9.169179916381836, "global_step": 79973, "epoch": 476} {"train_loss": -9.276843070983887, "global_step": 79974, "epoch": 476} {"train_loss": -8.938743591308594, "global_step": 79975, "epoch": 476} {"train_loss": -9.220930099487305, "global_step": 79976, "epoch": 476} {"train_loss": -8.700616836547852, "global_step": 79977, "epoch": 476} {"train_loss": -9.076683044433594, "global_step": 79978, "epoch": 476} {"train_loss": -8.748268127441406, "global_step": 79979, "epoch": 476} {"train_loss": -9.086187362670898, "global_step": 79980, "epoch": 476} {"train_loss": -9.022930145263672, "global_step": 79981, "epoch": 476} {"train_loss": -9.288269996643066, "global_step": 79982, "epoch": 476} {"train_loss": -9.209098815917969, "global_step": 79983, "epoch": 476} {"train_loss": -8.868176460266113, "global_step": 79984, "epoch": 476} {"train_loss": -9.057638168334961, "global_step": 79985, "epoch": 476} {"train_loss": -9.214790344238281, "global_step": 79986, "epoch": 476} {"train_loss": -8.869173049926758, "global_step": 79987, "epoch": 476} {"train_loss": -8.740514755249023, "global_step": 79988, "epoch": 476} {"train_loss": -9.329774856567383, "global_step": 79989, "epoch": 476} {"train_loss": -8.947807312011719, "global_step": 79990, "epoch": 476} {"train_loss": -9.119489669799805, "global_step": 79991, "epoch": 476} {"train_loss": -9.239461898803711, "global_step": 79992, "epoch": 476} {"train_loss": -9.01477336883545, "global_step": 79993, "epoch": 476} {"train_loss": -9.05228042602539, "global_step": 79994, "epoch": 476} {"train_loss": -9.169376373291016, "global_step": 79995, "epoch": 476} {"train_loss": -9.171530723571777, "global_step": 79996, "epoch": 476} {"train_loss": -8.97578239440918, "global_step": 79997, "epoch": 476} {"train_loss": -9.371572494506836, "global_step": 79998, "epoch": 476} {"train_loss": -9.224367141723633, "global_step": 79999, "epoch": 476} {"train_loss": -9.293022155761719, "global_step": 80000, "epoch": 476} {"train_loss": -9.411994934082031, "global_step": 80001, "epoch": 476} {"train_loss": -9.168313980102539, "global_step": 80002, "epoch": 476} {"train_loss": -9.173818588256836, "global_step": 80003, "epoch": 476} {"train_loss": -9.120037078857422, "global_step": 80004, "epoch": 476} {"train_loss": -9.20245361328125, "global_step": 80005, "epoch": 476} {"train_loss": -8.92739200592041, "global_step": 80006, "epoch": 476} {"train_loss": -9.215412139892578, "global_step": 80007, "epoch": 476} {"train_loss": -8.973648071289062, "global_step": 80008, "epoch": 476} {"train_loss": -9.08222770690918, "global_step": 80009, "epoch": 476} {"train_loss": -9.148836135864258, "global_step": 80010, "epoch": 476} {"train_loss": -8.801127433776855, "global_step": 80011, "epoch": 476} {"train_loss": -9.03229808807373, "global_step": 80012, "epoch": 476} {"train_loss": -9.044790267944336, "global_step": 80013, "epoch": 476} {"train_loss": -9.228044509887695, "global_step": 80014, "epoch": 476} {"train_loss": -9.062408447265625, "global_step": 80015, "epoch": 476} {"train_loss": -9.479717254638672, "global_step": 80016, "epoch": 476} {"train_loss": -9.234697341918945, "global_step": 80017, "epoch": 476} {"train_loss": -9.337217330932617, "global_step": 80018, "epoch": 476} {"train_loss": -9.0006685256958, "global_step": 80019, "epoch": 476} {"train_loss": -9.03152084350586, "global_step": 80020, "epoch": 476} {"train_loss": -9.215758323669434, "global_step": 80021, "epoch": 476} {"train_loss": -9.29120922088623, "global_step": 80022, "epoch": 476} {"train_loss": -9.291788101196289, "global_step": 80023, "epoch": 476} {"train_loss": -9.239299774169922, "global_step": 80024, "epoch": 476} {"train_loss": -9.339132308959961, "global_step": 80025, "epoch": 476} {"train_loss": -9.286380767822266, "global_step": 80026, "epoch": 476} {"train_loss": -9.228672981262207, "global_step": 80027, "epoch": 476} {"train_loss": -9.174537658691406, "global_step": 80028, "epoch": 476} {"train_loss": -9.391914367675781, "global_step": 80029, "epoch": 476} {"train_loss": -9.242765426635742, "global_step": 80030, "epoch": 476} {"train_loss": -9.456537246704102, "global_step": 80031, "epoch": 476} {"train_loss": -9.360404968261719, "global_step": 80032, "epoch": 476} {"train_loss": -9.398723602294922, "global_step": 80033, "epoch": 476} {"train_loss": -9.380358695983887, "global_step": 80034, "epoch": 476} {"train_loss": -9.464998245239258, "global_step": 80035, "epoch": 476} {"train_loss": -9.308277130126953, "global_step": 80036, "epoch": 476} {"train_loss": -9.44780158996582, "global_step": 80037, "epoch": 476} {"train_loss": -9.23154354095459, "global_step": 80038, "epoch": 476} {"train_loss": -9.207612991333008, "global_step": 80039, "epoch": 476} {"train_loss": -9.191304206848145, "global_step": 80040, "epoch": 476} {"train_loss": -9.534599304199219, "global_step": 80041, "epoch": 476} {"train_loss": -9.117057800292969, "global_step": 80042, "epoch": 476} {"train_loss": -9.23054027557373, "global_step": 80043, "epoch": 476} {"train_loss": -9.384169578552246, "global_step": 80044, "epoch": 476} {"train_loss": -9.418952941894531, "global_step": 80045, "epoch": 476} {"train_loss": -9.364080429077148, "global_step": 80046, "epoch": 476} {"train_loss": -9.381746292114258, "global_step": 80047, "epoch": 476} {"train_loss": -9.1209716796875, "global_step": 80048, "epoch": 476} {"train_loss": -9.087175369262695, "global_step": 80049, "epoch": 476} {"train_loss": -9.168673515319824, "global_step": 80050, "epoch": 476} {"train_loss": -9.236801147460938, "global_step": 80051, "epoch": 476} {"train_loss": -9.29055404663086, "global_step": 80052, "epoch": 476} {"train_loss": -9.123751640319824, "global_step": 80053, "epoch": 476} {"train_loss": -9.264838218688965, "global_step": 80054, "epoch": 476} {"train_loss": -9.005845069885254, "global_step": 80055, "epoch": 476} {"train_loss": -9.159439086914062, "global_step": 80056, "epoch": 476} {"train_loss": -9.289649963378906, "global_step": 80057, "epoch": 476} {"train_loss": -9.102757453918457, "global_step": 80058, "epoch": 476} {"train_loss": -9.132684707641602, "global_step": 80059, "epoch": 476} {"train_loss": -9.388071060180664, "global_step": 80060, "epoch": 476} {"train_loss": -9.23096752166748, "global_step": 80061, "epoch": 476} {"train_loss": -9.279155731201172, "global_step": 80062, "epoch": 476} {"train_loss": -9.183908462524414, "global_step": 80063, "epoch": 476} {"train_loss": -9.230406761169434, "global_step": 80064, "epoch": 476} {"train_loss": -9.136115074157715, "global_step": 80065, "epoch": 476} {"train_loss": -9.20710277557373, "global_step": 80066, "epoch": 476} {"train_loss": -9.15139389038086, "global_step": 80067, "epoch": 476} {"train_loss": -9.304845809936523, "global_step": 80068, "epoch": 476} {"train_loss": -8.79734992980957, "global_step": 80069, "epoch": 476} {"train_loss": -9.173992156982422, "global_step": 80070, "epoch": 476} {"train_loss": -9.338916778564453, "global_step": 80071, "epoch": 476} {"train_loss": -9.300363540649414, "global_step": 80072, "epoch": 476} {"train_loss": -9.26789665222168, "global_step": 80073, "epoch": 476} {"train_loss": -9.190492630004883, "global_step": 80074, "epoch": 476} {"train_loss": -9.231302261352539, "global_step": 80075, "epoch": 476} {"train_loss": -9.211581230163574, "global_step": 80076, "epoch": 476} {"train_loss": -9.098699569702148, "global_step": 80077, "epoch": 476} {"train_loss": -8.931869506835938, "global_step": 80078, "epoch": 476} {"train_loss": -9.240644454956055, "global_step": 80079, "epoch": 476} {"train_loss": -9.02113151550293, "global_step": 80080, "epoch": 476} {"train_loss": -8.951717376708984, "global_step": 80081, "epoch": 476} {"train_loss": -8.978277206420898, "global_step": 80082, "epoch": 476} {"train_loss": -9.063465118408203, "global_step": 80083, "epoch": 476} {"train_loss": -8.865551948547363, "global_step": 80084, "epoch": 476} {"train_loss": -9.139883041381836, "global_step": 80085, "epoch": 476} {"train_loss": -8.813501358032227, "global_step": 80086, "epoch": 476} {"train_loss": -9.311602592468262, "global_step": 80087, "epoch": 476} {"train_loss": -8.987566947937012, "global_step": 80088, "epoch": 476} {"train_loss": -9.126140594482422, "global_step": 80089, "epoch": 476} {"train_loss": -9.105167388916016, "global_step": 80090, "epoch": 476} {"train_loss": -9.321393966674805, "global_step": 80091, "epoch": 476} {"train_loss": -8.940033912658691, "global_step": 80092, "epoch": 476} {"train_loss": -9.049116134643555, "global_step": 80093, "epoch": 476} {"train_loss": -9.009787559509277, "global_step": 80094, "epoch": 476} {"train_loss": -9.038728713989258, "global_step": 80095, "epoch": 476} {"train_loss": -9.307390213012695, "global_step": 80096, "epoch": 476} {"train_loss": -9.378982543945312, "global_step": 80097, "epoch": 476} {"train_loss": -9.133955955505371, "global_step": 80098, "epoch": 476} {"train_loss": -9.206710815429688, "global_step": 80099, "epoch": 476} {"train_loss": -9.288179397583008, "global_step": 80100, "epoch": 476} {"train_loss": -9.331443786621094, "global_step": 80101, "epoch": 476} {"train_loss": -9.086618423461914, "global_step": 80102, "epoch": 476} {"train_loss": -9.198348999023438, "global_step": 80103, "epoch": 476} {"train_loss": -9.134615898132324, "global_step": 80104, "epoch": 476} {"train_loss": -9.077804565429688, "global_step": 80105, "epoch": 476} {"train_loss": -9.0947265625, "global_step": 80106, "epoch": 476} {"train_loss": -9.151142120361328, "global_step": 80107, "epoch": 476} {"train_loss": -9.094886779785156, "global_step": 80108, "epoch": 476} {"train_loss": -8.923482894897461, "global_step": 80109, "epoch": 476} {"train_loss": -9.20338249206543, "global_step": 80110, "epoch": 476} {"train_loss": -8.880851745605469, "global_step": 80111, "epoch": 476} {"train_loss": -9.246031761169434, "global_step": 80112, "epoch": 476} {"train_loss": -9.059187889099121, "global_step": 80113, "epoch": 476} {"train_loss": -9.121612548828125, "global_step": 80114, "epoch": 476} {"train_loss": -9.064428329467773, "global_step": 80115, "epoch": 476} {"train_loss": -8.85464096069336, "global_step": 80116, "epoch": 476} {"train_loss": -9.064775466918945, "global_step": 80117, "epoch": 476} {"train_loss": -8.902921676635742, "global_step": 80118, "epoch": 476} {"train_loss": -9.105609893798828, "global_step": 80119, "epoch": 476} {"train_loss": -9.183225631713867, "global_step": 80120, "epoch": 476} {"train_loss": -9.047346115112305, "global_step": 80121, "epoch": 476} {"train_loss": -9.050561904907227, "global_step": 80122, "epoch": 476} {"train_loss": -9.107686042785645, "global_step": 80123, "epoch": 476} {"train_loss": -8.998495101928711, "global_step": 80124, "epoch": 476} {"train_loss": -9.013570785522461, "global_step": 80125, "epoch": 476} {"train_loss": -9.013132095336914, "global_step": 80126, "epoch": 476} {"train_loss": -9.145284652709961, "global_step": 80127, "epoch": 476} {"train_loss": -9.145981788635254, "global_step": 80128, "epoch": 476} {"train_loss": -8.932920455932617, "global_step": 80129, "epoch": 476} {"train_loss": -9.220203399658203, "global_step": 80130, "epoch": 476} {"train_loss": -9.28601360321045, "global_step": 80131, "epoch": 476} {"train_loss": -9.065414428710938, "global_step": 80132, "epoch": 476} {"train_loss": -9.285149574279785, "global_step": 80133, "epoch": 476} {"train_loss": -9.147573471069336, "global_step": 80134, "epoch": 476} {"train_loss": -9.151074602490379, "global_step": 80135, "epoch": 476, "val_loss": 196645.515625} {"train_loss": -9.160539627075195, "global_step": 80136, "epoch": 477} {"train_loss": -9.251445770263672, "global_step": 80137, "epoch": 477} {"train_loss": -8.952629089355469, "global_step": 80138, "epoch": 477} {"train_loss": -9.013399124145508, "global_step": 80139, "epoch": 477} {"train_loss": -8.959856986999512, "global_step": 80140, "epoch": 477} {"train_loss": -9.111342430114746, "global_step": 80141, "epoch": 477} {"train_loss": -8.948087692260742, "global_step": 80142, "epoch": 477} {"train_loss": -9.102094650268555, "global_step": 80143, "epoch": 477} {"train_loss": -9.130247116088867, "global_step": 80144, "epoch": 477} {"train_loss": -9.003626823425293, "global_step": 80145, "epoch": 477} {"train_loss": -8.872014999389648, "global_step": 80146, "epoch": 477} {"train_loss": -9.018096923828125, "global_step": 80147, "epoch": 477} {"train_loss": -9.280750274658203, "global_step": 80148, "epoch": 477} {"train_loss": -9.14583969116211, "global_step": 80149, "epoch": 477} {"train_loss": -8.785747528076172, "global_step": 80150, "epoch": 477} {"train_loss": -9.347527503967285, "global_step": 80151, "epoch": 477} {"train_loss": -9.251554489135742, "global_step": 80152, "epoch": 477} {"train_loss": -9.15482234954834, "global_step": 80153, "epoch": 477} {"train_loss": -9.288529396057129, "global_step": 80154, "epoch": 477} {"train_loss": -9.275121688842773, "global_step": 80155, "epoch": 477} {"train_loss": -9.33358383178711, "global_step": 80156, "epoch": 477} {"train_loss": -9.191061019897461, "global_step": 80157, "epoch": 477} {"train_loss": -9.305331230163574, "global_step": 80158, "epoch": 477} {"train_loss": -9.094818115234375, "global_step": 80159, "epoch": 477} {"train_loss": -9.37844181060791, "global_step": 80160, "epoch": 477} {"train_loss": -9.099918365478516, "global_step": 80161, "epoch": 477} {"train_loss": -9.36382007598877, "global_step": 80162, "epoch": 477} {"train_loss": -9.274773597717285, "global_step": 80163, "epoch": 477} {"train_loss": -9.188302040100098, "global_step": 80164, "epoch": 477} {"train_loss": -9.282583236694336, "global_step": 80165, "epoch": 477} {"train_loss": -9.271467208862305, "global_step": 80166, "epoch": 477} {"train_loss": -9.282197952270508, "global_step": 80167, "epoch": 477} {"train_loss": -9.315055847167969, "global_step": 80168, "epoch": 477} {"train_loss": -9.236848831176758, "global_step": 80169, "epoch": 477} {"train_loss": -9.437189102172852, "global_step": 80170, "epoch": 477} {"train_loss": -9.084648132324219, "global_step": 80171, "epoch": 477} {"train_loss": -8.666997909545898, "global_step": 80172, "epoch": 477} {"train_loss": -9.123481750488281, "global_step": 80173, "epoch": 477} {"train_loss": -8.215568542480469, "global_step": 80174, "epoch": 477} {"train_loss": -8.887470245361328, "global_step": 80175, "epoch": 477} {"train_loss": -8.616774559020996, "global_step": 80176, "epoch": 477} {"train_loss": -8.173104286193848, "global_step": 80177, "epoch": 477} {"train_loss": -8.617502212524414, "global_step": 80178, "epoch": 477} {"train_loss": -8.899800300598145, "global_step": 80179, "epoch": 477} {"train_loss": -8.762887954711914, "global_step": 80180, "epoch": 477} {"train_loss": -8.527632713317871, "global_step": 80181, "epoch": 477} {"train_loss": -8.936239242553711, "global_step": 80182, "epoch": 477} {"train_loss": -9.104095458984375, "global_step": 80183, "epoch": 477} {"train_loss": -8.979129791259766, "global_step": 80184, "epoch": 477} {"train_loss": -8.80431842803955, "global_step": 80185, "epoch": 477} {"train_loss": -8.853816986083984, "global_step": 80186, "epoch": 477} {"train_loss": -9.214635848999023, "global_step": 80187, "epoch": 477} {"train_loss": -9.006477355957031, "global_step": 80188, "epoch": 477} {"train_loss": -9.024360656738281, "global_step": 80189, "epoch": 477} {"train_loss": -8.985128402709961, "global_step": 80190, "epoch": 477} {"train_loss": -8.984333038330078, "global_step": 80191, "epoch": 477} {"train_loss": -9.348997116088867, "global_step": 80192, "epoch": 477} {"train_loss": -9.132528305053711, "global_step": 80193, "epoch": 477} {"train_loss": -9.15997314453125, "global_step": 80194, "epoch": 477} {"train_loss": -9.1065673828125, "global_step": 80195, "epoch": 477} {"train_loss": -9.197182655334473, "global_step": 80196, "epoch": 477} {"train_loss": -9.33891773223877, "global_step": 80197, "epoch": 477} {"train_loss": -9.189886093139648, "global_step": 80198, "epoch": 477} {"train_loss": -9.09991455078125, "global_step": 80199, "epoch": 477} {"train_loss": -9.198331832885742, "global_step": 80200, "epoch": 477} {"train_loss": -9.265390396118164, "global_step": 80201, "epoch": 477} {"train_loss": -9.308418273925781, "global_step": 80202, "epoch": 477} {"train_loss": -9.479684829711914, "global_step": 80203, "epoch": 477} {"train_loss": -9.347328186035156, "global_step": 80204, "epoch": 477} {"train_loss": -9.245075225830078, "global_step": 80205, "epoch": 477} {"train_loss": -9.3787841796875, "global_step": 80206, "epoch": 477} {"train_loss": -9.486002922058105, "global_step": 80207, "epoch": 477} {"train_loss": -9.414213180541992, "global_step": 80208, "epoch": 477} {"train_loss": -9.452455520629883, "global_step": 80209, "epoch": 477} {"train_loss": -9.491302490234375, "global_step": 80210, "epoch": 477} {"train_loss": -9.334124565124512, "global_step": 80211, "epoch": 477} {"train_loss": -9.225326538085938, "global_step": 80212, "epoch": 477} {"train_loss": -9.214563369750977, "global_step": 80213, "epoch": 477} {"train_loss": -9.423166275024414, "global_step": 80214, "epoch": 477} {"train_loss": -9.319862365722656, "global_step": 80215, "epoch": 477} {"train_loss": -9.271121978759766, "global_step": 80216, "epoch": 477} {"train_loss": -9.120264053344727, "global_step": 80217, "epoch": 477} {"train_loss": -9.271158218383789, "global_step": 80218, "epoch": 477} {"train_loss": -8.919990539550781, "global_step": 80219, "epoch": 477} {"train_loss": -9.324504852294922, "global_step": 80220, "epoch": 477} {"train_loss": -8.886337280273438, "global_step": 80221, "epoch": 477} {"train_loss": -8.359081268310547, "global_step": 80222, "epoch": 477} {"train_loss": -8.951323509216309, "global_step": 80223, "epoch": 477} {"train_loss": -8.90814208984375, "global_step": 80224, "epoch": 477} {"train_loss": -9.06369400024414, "global_step": 80225, "epoch": 477} {"train_loss": -8.811253547668457, "global_step": 80226, "epoch": 477} {"train_loss": -9.130285263061523, "global_step": 80227, "epoch": 477} {"train_loss": -9.033836364746094, "global_step": 80228, "epoch": 477} {"train_loss": -8.851102828979492, "global_step": 80229, "epoch": 477} {"train_loss": -8.855144500732422, "global_step": 80230, "epoch": 477} {"train_loss": -8.896641731262207, "global_step": 80231, "epoch": 477} {"train_loss": -8.875466346740723, "global_step": 80232, "epoch": 477} {"train_loss": -8.963639259338379, "global_step": 80233, "epoch": 477} {"train_loss": -9.003204345703125, "global_step": 80234, "epoch": 477} {"train_loss": -8.965850830078125, "global_step": 80235, "epoch": 477} {"train_loss": -9.084564208984375, "global_step": 80236, "epoch": 477} {"train_loss": -8.95228385925293, "global_step": 80237, "epoch": 477} {"train_loss": -9.160974502563477, "global_step": 80238, "epoch": 477} {"train_loss": -9.266368865966797, "global_step": 80239, "epoch": 477} {"train_loss": -9.04704475402832, "global_step": 80240, "epoch": 477} {"train_loss": -9.308076858520508, "global_step": 80241, "epoch": 477} {"train_loss": -9.24856948852539, "global_step": 80242, "epoch": 477} {"train_loss": -9.276668548583984, "global_step": 80243, "epoch": 477} {"train_loss": -9.276583671569824, "global_step": 80244, "epoch": 477} {"train_loss": -9.209243774414062, "global_step": 80245, "epoch": 477} {"train_loss": -9.274768829345703, "global_step": 80246, "epoch": 477} {"train_loss": -9.153071403503418, "global_step": 80247, "epoch": 477} {"train_loss": -9.259872436523438, "global_step": 80248, "epoch": 477} {"train_loss": -9.30765151977539, "global_step": 80249, "epoch": 477} {"train_loss": -9.242517471313477, "global_step": 80250, "epoch": 477} {"train_loss": -9.332036018371582, "global_step": 80251, "epoch": 477} {"train_loss": -9.257219314575195, "global_step": 80252, "epoch": 477} {"train_loss": -9.562240600585938, "global_step": 80253, "epoch": 477} {"train_loss": -9.239145278930664, "global_step": 80254, "epoch": 477} {"train_loss": -9.139129638671875, "global_step": 80255, "epoch": 477} {"train_loss": -9.32602596282959, "global_step": 80256, "epoch": 477} {"train_loss": -9.127113342285156, "global_step": 80257, "epoch": 477} {"train_loss": -9.363652229309082, "global_step": 80258, "epoch": 477} {"train_loss": -9.372003555297852, "global_step": 80259, "epoch": 477} {"train_loss": -9.071710586547852, "global_step": 80260, "epoch": 477} {"train_loss": -9.286576271057129, "global_step": 80261, "epoch": 477} {"train_loss": -9.313982009887695, "global_step": 80262, "epoch": 477} {"train_loss": -9.30877685546875, "global_step": 80263, "epoch": 477} {"train_loss": -9.514339447021484, "global_step": 80264, "epoch": 477} {"train_loss": -9.233209609985352, "global_step": 80265, "epoch": 477} {"train_loss": -9.426534652709961, "global_step": 80266, "epoch": 477} {"train_loss": -8.961112976074219, "global_step": 80267, "epoch": 477} {"train_loss": -9.20456314086914, "global_step": 80268, "epoch": 477} {"train_loss": -9.371774673461914, "global_step": 80269, "epoch": 477} {"train_loss": -9.071043968200684, "global_step": 80270, "epoch": 477} {"train_loss": -9.409757614135742, "global_step": 80271, "epoch": 477} {"train_loss": -9.290360450744629, "global_step": 80272, "epoch": 477} {"train_loss": -8.994344711303711, "global_step": 80273, "epoch": 477} {"train_loss": -9.265097618103027, "global_step": 80274, "epoch": 477} {"train_loss": -8.813419342041016, "global_step": 80275, "epoch": 477} {"train_loss": -9.126559257507324, "global_step": 80276, "epoch": 477} {"train_loss": -9.237059593200684, "global_step": 80277, "epoch": 477} {"train_loss": -9.030563354492188, "global_step": 80278, "epoch": 477} {"train_loss": -8.908143997192383, "global_step": 80279, "epoch": 477} {"train_loss": -8.859664916992188, "global_step": 80280, "epoch": 477} {"train_loss": -8.854899406433105, "global_step": 80281, "epoch": 477} {"train_loss": -8.800613403320312, "global_step": 80282, "epoch": 477} {"train_loss": -8.977299690246582, "global_step": 80283, "epoch": 477} {"train_loss": -8.99955940246582, "global_step": 80284, "epoch": 477} {"train_loss": -8.895380973815918, "global_step": 80285, "epoch": 477} {"train_loss": -9.01706314086914, "global_step": 80286, "epoch": 477} {"train_loss": -9.237079620361328, "global_step": 80287, "epoch": 477} {"train_loss": -9.248028755187988, "global_step": 80288, "epoch": 477} {"train_loss": -9.313368797302246, "global_step": 80289, "epoch": 477} {"train_loss": -9.193370819091797, "global_step": 80290, "epoch": 477} {"train_loss": -9.136157989501953, "global_step": 80291, "epoch": 477} {"train_loss": -9.07664966583252, "global_step": 80292, "epoch": 477} {"train_loss": -9.29155158996582, "global_step": 80293, "epoch": 477} {"train_loss": -9.223699569702148, "global_step": 80294, "epoch": 477} {"train_loss": -9.27053165435791, "global_step": 80295, "epoch": 477} {"train_loss": -9.304369926452637, "global_step": 80296, "epoch": 477} {"train_loss": -9.188565254211426, "global_step": 80297, "epoch": 477} {"train_loss": -9.204927444458008, "global_step": 80298, "epoch": 477} {"train_loss": -9.393712043762207, "global_step": 80299, "epoch": 477} {"train_loss": -9.272838592529297, "global_step": 80300, "epoch": 477} {"train_loss": -9.246707916259766, "global_step": 80301, "epoch": 477} {"train_loss": -9.069803237915039, "global_step": 80302, "epoch": 477} {"train_loss": -9.13156741573697, "global_step": 80303, "epoch": 477, "val_loss": 195950.484375} {"train_loss": -8.905641555786133, "global_step": 80304, "epoch": 478} {"train_loss": -9.414369583129883, "global_step": 80305, "epoch": 478} {"train_loss": -9.08482551574707, "global_step": 80306, "epoch": 478} {"train_loss": -9.00828742980957, "global_step": 80307, "epoch": 478} {"train_loss": -9.351706504821777, "global_step": 80308, "epoch": 478} {"train_loss": -9.171276092529297, "global_step": 80309, "epoch": 478} {"train_loss": -8.837323188781738, "global_step": 80310, "epoch": 478} {"train_loss": -9.138835906982422, "global_step": 80311, "epoch": 478} {"train_loss": -8.96195125579834, "global_step": 80312, "epoch": 478} {"train_loss": -9.312084197998047, "global_step": 80313, "epoch": 478} {"train_loss": -8.813558578491211, "global_step": 80314, "epoch": 478} {"train_loss": -8.945727348327637, "global_step": 80315, "epoch": 478} {"train_loss": -9.099706649780273, "global_step": 80316, "epoch": 478} {"train_loss": -9.349828720092773, "global_step": 80317, "epoch": 478} {"train_loss": -8.873392105102539, "global_step": 80318, "epoch": 478} {"train_loss": -9.237595558166504, "global_step": 80319, "epoch": 478} {"train_loss": -9.038167953491211, "global_step": 80320, "epoch": 478} {"train_loss": -9.287801742553711, "global_step": 80321, "epoch": 478} {"train_loss": -9.146265029907227, "global_step": 80322, "epoch": 478} {"train_loss": -9.069427490234375, "global_step": 80323, "epoch": 478} {"train_loss": -9.29707145690918, "global_step": 80324, "epoch": 478} {"train_loss": -9.070898056030273, "global_step": 80325, "epoch": 478} {"train_loss": -9.308903694152832, "global_step": 80326, "epoch": 478} {"train_loss": -9.258827209472656, "global_step": 80327, "epoch": 478} {"train_loss": -9.257120132446289, "global_step": 80328, "epoch": 478} {"train_loss": -9.31602668762207, "global_step": 80329, "epoch": 478} {"train_loss": -9.20801830291748, "global_step": 80330, "epoch": 478} {"train_loss": -9.534051895141602, "global_step": 80331, "epoch": 478} {"train_loss": -9.37393569946289, "global_step": 80332, "epoch": 478} {"train_loss": -9.094671249389648, "global_step": 80333, "epoch": 478} {"train_loss": -9.599328994750977, "global_step": 80334, "epoch": 478} {"train_loss": -9.46726131439209, "global_step": 80335, "epoch": 478} {"train_loss": -9.169528007507324, "global_step": 80336, "epoch": 478} {"train_loss": -9.3577299118042, "global_step": 80337, "epoch": 478} {"train_loss": -9.436619758605957, "global_step": 80338, "epoch": 478} {"train_loss": -9.500408172607422, "global_step": 80339, "epoch": 478} {"train_loss": -9.36398696899414, "global_step": 80340, "epoch": 478} {"train_loss": -9.29524040222168, "global_step": 80341, "epoch": 478} {"train_loss": -9.189835548400879, "global_step": 80342, "epoch": 478} {"train_loss": -9.41943359375, "global_step": 80343, "epoch": 478} {"train_loss": -9.58123779296875, "global_step": 80344, "epoch": 478} {"train_loss": -9.262834548950195, "global_step": 80345, "epoch": 478} {"train_loss": -9.504940032958984, "global_step": 80346, "epoch": 478} {"train_loss": -9.135824203491211, "global_step": 80347, "epoch": 478} {"train_loss": -9.10144329071045, "global_step": 80348, "epoch": 478} {"train_loss": -9.202295303344727, "global_step": 80349, "epoch": 478} {"train_loss": -9.380949020385742, "global_step": 80350, "epoch": 478} {"train_loss": -9.400385856628418, "global_step": 80351, "epoch": 478} {"train_loss": -9.182680130004883, "global_step": 80352, "epoch": 478} {"train_loss": -9.305154800415039, "global_step": 80353, "epoch": 478} {"train_loss": -9.20045280456543, "global_step": 80354, "epoch": 478} {"train_loss": -9.235115051269531, "global_step": 80355, "epoch": 478} {"train_loss": -9.001424789428711, "global_step": 80356, "epoch": 478} {"train_loss": -9.137994766235352, "global_step": 80357, "epoch": 478} {"train_loss": -8.827141761779785, "global_step": 80358, "epoch": 478} {"train_loss": -8.61341381072998, "global_step": 80359, "epoch": 478} {"train_loss": -8.6476469039917, "global_step": 80360, "epoch": 478} {"train_loss": -9.28042221069336, "global_step": 80361, "epoch": 478} {"train_loss": -8.757885932922363, "global_step": 80362, "epoch": 478} {"train_loss": -9.296027183532715, "global_step": 80363, "epoch": 478} {"train_loss": -8.644213676452637, "global_step": 80364, "epoch": 478} {"train_loss": -8.979948043823242, "global_step": 80365, "epoch": 478} {"train_loss": -8.855569839477539, "global_step": 80366, "epoch": 478} {"train_loss": -9.124143600463867, "global_step": 80367, "epoch": 478} {"train_loss": -8.802202224731445, "global_step": 80368, "epoch": 478} {"train_loss": -8.863452911376953, "global_step": 80369, "epoch": 478} {"train_loss": -8.759162902832031, "global_step": 80370, "epoch": 478} {"train_loss": -9.078398704528809, "global_step": 80371, "epoch": 478} {"train_loss": -8.860261917114258, "global_step": 80372, "epoch": 478} {"train_loss": -9.06832504272461, "global_step": 80373, "epoch": 478} {"train_loss": -9.040691375732422, "global_step": 80374, "epoch": 478} {"train_loss": -9.049103736877441, "global_step": 80375, "epoch": 478} {"train_loss": -8.962942123413086, "global_step": 80376, "epoch": 478} {"train_loss": -9.04781723022461, "global_step": 80377, "epoch": 478} {"train_loss": -9.013994216918945, "global_step": 80378, "epoch": 478} {"train_loss": -8.962592124938965, "global_step": 80379, "epoch": 478} {"train_loss": -8.916313171386719, "global_step": 80380, "epoch": 478} {"train_loss": -9.136085510253906, "global_step": 80381, "epoch": 478} {"train_loss": -8.984373092651367, "global_step": 80382, "epoch": 478} {"train_loss": -9.032675743103027, "global_step": 80383, "epoch": 478} {"train_loss": -9.080571174621582, "global_step": 80384, "epoch": 478} {"train_loss": -9.072885513305664, "global_step": 80385, "epoch": 478} {"train_loss": -8.869991302490234, "global_step": 80386, "epoch": 478} {"train_loss": -9.240253448486328, "global_step": 80387, "epoch": 478} {"train_loss": -9.01562213897705, "global_step": 80388, "epoch": 478} {"train_loss": -9.134994506835938, "global_step": 80389, "epoch": 478} {"train_loss": -9.323630332946777, "global_step": 80390, "epoch": 478} {"train_loss": -8.902018547058105, "global_step": 80391, "epoch": 478} {"train_loss": -9.100847244262695, "global_step": 80392, "epoch": 478} {"train_loss": -9.24746322631836, "global_step": 80393, "epoch": 478} {"train_loss": -9.367264747619629, "global_step": 80394, "epoch": 478} {"train_loss": -9.04335880279541, "global_step": 80395, "epoch": 478} {"train_loss": -9.33203125, "global_step": 80396, "epoch": 478} {"train_loss": -9.215802192687988, "global_step": 80397, "epoch": 478} {"train_loss": -9.401346206665039, "global_step": 80398, "epoch": 478} {"train_loss": -9.058439254760742, "global_step": 80399, "epoch": 478} {"train_loss": -9.376592636108398, "global_step": 80400, "epoch": 478} {"train_loss": -8.924850463867188, "global_step": 80401, "epoch": 478} {"train_loss": -9.2545804977417, "global_step": 80402, "epoch": 478} {"train_loss": -9.004681587219238, "global_step": 80403, "epoch": 478} {"train_loss": -9.220550537109375, "global_step": 80404, "epoch": 478} {"train_loss": -9.111847877502441, "global_step": 80405, "epoch": 478} {"train_loss": -9.400959014892578, "global_step": 80406, "epoch": 478} {"train_loss": -9.110881805419922, "global_step": 80407, "epoch": 478} {"train_loss": -9.388775825500488, "global_step": 80408, "epoch": 478} {"train_loss": -9.17051887512207, "global_step": 80409, "epoch": 478} {"train_loss": -8.701557159423828, "global_step": 80410, "epoch": 478} {"train_loss": -8.927149772644043, "global_step": 80411, "epoch": 478} {"train_loss": -9.117595672607422, "global_step": 80412, "epoch": 478} {"train_loss": -9.09009838104248, "global_step": 80413, "epoch": 478} {"train_loss": -8.797189712524414, "global_step": 80414, "epoch": 478} {"train_loss": -8.9019775390625, "global_step": 80415, "epoch": 478} {"train_loss": -9.080802917480469, "global_step": 80416, "epoch": 478} {"train_loss": -8.801712036132812, "global_step": 80417, "epoch": 478} {"train_loss": -8.938207626342773, "global_step": 80418, "epoch": 478} {"train_loss": -8.902495384216309, "global_step": 80419, "epoch": 478} {"train_loss": -9.064871788024902, "global_step": 80420, "epoch": 478} {"train_loss": -8.952163696289062, "global_step": 80421, "epoch": 478} {"train_loss": -8.900836944580078, "global_step": 80422, "epoch": 478} {"train_loss": -9.01457405090332, "global_step": 80423, "epoch": 478} {"train_loss": -9.096014022827148, "global_step": 80424, "epoch": 478} {"train_loss": -9.076370239257812, "global_step": 80425, "epoch": 478} {"train_loss": -8.876070022583008, "global_step": 80426, "epoch": 478} {"train_loss": -9.180191040039062, "global_step": 80427, "epoch": 478} {"train_loss": -9.019237518310547, "global_step": 80428, "epoch": 478} {"train_loss": -9.212838172912598, "global_step": 80429, "epoch": 478} {"train_loss": -9.040453910827637, "global_step": 80430, "epoch": 478} {"train_loss": -9.240625381469727, "global_step": 80431, "epoch": 478} {"train_loss": -9.025430679321289, "global_step": 80432, "epoch": 478} {"train_loss": -9.358552932739258, "global_step": 80433, "epoch": 478} {"train_loss": -8.95588493347168, "global_step": 80434, "epoch": 478} {"train_loss": -9.308740615844727, "global_step": 80435, "epoch": 478} {"train_loss": -8.965343475341797, "global_step": 80436, "epoch": 478} {"train_loss": -9.402002334594727, "global_step": 80437, "epoch": 478} {"train_loss": -9.090383529663086, "global_step": 80438, "epoch": 478} {"train_loss": -9.302335739135742, "global_step": 80439, "epoch": 478} {"train_loss": -8.91545295715332, "global_step": 80440, "epoch": 478} {"train_loss": -9.371992111206055, "global_step": 80441, "epoch": 478} {"train_loss": -8.773601531982422, "global_step": 80442, "epoch": 478} {"train_loss": -9.111282348632812, "global_step": 80443, "epoch": 478} {"train_loss": -9.17945384979248, "global_step": 80444, "epoch": 478} {"train_loss": -8.923443794250488, "global_step": 80445, "epoch": 478} {"train_loss": -9.33481216430664, "global_step": 80446, "epoch": 478} {"train_loss": -9.272642135620117, "global_step": 80447, "epoch": 478} {"train_loss": -9.18182373046875, "global_step": 80448, "epoch": 478} {"train_loss": -9.444305419921875, "global_step": 80449, "epoch": 478} {"train_loss": -9.276616096496582, "global_step": 80450, "epoch": 478} {"train_loss": -9.112211227416992, "global_step": 80451, "epoch": 478} {"train_loss": -9.161859512329102, "global_step": 80452, "epoch": 478} {"train_loss": -9.363621711730957, "global_step": 80453, "epoch": 478} {"train_loss": -9.322896003723145, "global_step": 80454, "epoch": 478} {"train_loss": -9.182387351989746, "global_step": 80455, "epoch": 478} {"train_loss": -9.236307144165039, "global_step": 80456, "epoch": 478} {"train_loss": -9.096053123474121, "global_step": 80457, "epoch": 478} {"train_loss": -9.141256332397461, "global_step": 80458, "epoch": 478} {"train_loss": -9.313880920410156, "global_step": 80459, "epoch": 478} {"train_loss": -9.334278106689453, "global_step": 80460, "epoch": 478} {"train_loss": -8.907373428344727, "global_step": 80461, "epoch": 478} {"train_loss": -9.100186347961426, "global_step": 80462, "epoch": 478} {"train_loss": -9.276422500610352, "global_step": 80463, "epoch": 478} {"train_loss": -9.118444442749023, "global_step": 80464, "epoch": 478} {"train_loss": -9.110908508300781, "global_step": 80465, "epoch": 478} {"train_loss": -9.075973510742188, "global_step": 80466, "epoch": 478} {"train_loss": -8.980833053588867, "global_step": 80467, "epoch": 478} {"train_loss": -7.933000564575195, "global_step": 80468, "epoch": 478} {"train_loss": -9.218751907348633, "global_step": 80469, "epoch": 478} {"train_loss": -8.407646179199219, "global_step": 80470, "epoch": 478} {"train_loss": -9.115911262375969, "global_step": 80471, "epoch": 478, "val_loss": 197109.09375} {"train_loss": -8.516108512878418, "global_step": 80472, "epoch": 479} {"train_loss": -8.6343994140625, "global_step": 80473, "epoch": 479} {"train_loss": -8.555204391479492, "global_step": 80474, "epoch": 479} {"train_loss": -8.559782028198242, "global_step": 80475, "epoch": 479} {"train_loss": -8.712368965148926, "global_step": 80476, "epoch": 479} {"train_loss": -8.87901496887207, "global_step": 80477, "epoch": 479} {"train_loss": -8.767982482910156, "global_step": 80478, "epoch": 479} {"train_loss": -8.820175170898438, "global_step": 80479, "epoch": 479} {"train_loss": -8.881505012512207, "global_step": 80480, "epoch": 479} {"train_loss": -8.952486038208008, "global_step": 80481, "epoch": 479} {"train_loss": -8.77901840209961, "global_step": 80482, "epoch": 479} {"train_loss": -8.888050079345703, "global_step": 80483, "epoch": 479} {"train_loss": -9.075559616088867, "global_step": 80484, "epoch": 479} {"train_loss": -9.0065336227417, "global_step": 80485, "epoch": 479} {"train_loss": -8.951974868774414, "global_step": 80486, "epoch": 479} {"train_loss": -9.235928535461426, "global_step": 80487, "epoch": 479} {"train_loss": -8.984220504760742, "global_step": 80488, "epoch": 479} {"train_loss": -9.098541259765625, "global_step": 80489, "epoch": 479} {"train_loss": -9.151762008666992, "global_step": 80490, "epoch": 479} {"train_loss": -9.109406471252441, "global_step": 80491, "epoch": 479} {"train_loss": -9.279056549072266, "global_step": 80492, "epoch": 479} {"train_loss": -9.251981735229492, "global_step": 80493, "epoch": 479} {"train_loss": -9.27599811553955, "global_step": 80494, "epoch": 479} {"train_loss": -9.143828392028809, "global_step": 80495, "epoch": 479} {"train_loss": -9.337194442749023, "global_step": 80496, "epoch": 479} {"train_loss": -9.227566719055176, "global_step": 80497, "epoch": 479} {"train_loss": -9.29354476928711, "global_step": 80498, "epoch": 479} {"train_loss": -9.332259178161621, "global_step": 80499, "epoch": 479} {"train_loss": -9.305314064025879, "global_step": 80500, "epoch": 479} {"train_loss": -9.452733039855957, "global_step": 80501, "epoch": 479} {"train_loss": -9.186259269714355, "global_step": 80502, "epoch": 479} {"train_loss": -9.435131072998047, "global_step": 80503, "epoch": 479} {"train_loss": -9.477152824401855, "global_step": 80504, "epoch": 479} {"train_loss": -9.345258712768555, "global_step": 80505, "epoch": 479} {"train_loss": -9.232062339782715, "global_step": 80506, "epoch": 479} {"train_loss": -8.9573974609375, "global_step": 80507, "epoch": 479} {"train_loss": -9.418965339660645, "global_step": 80508, "epoch": 479} {"train_loss": -8.670246124267578, "global_step": 80509, "epoch": 479} {"train_loss": -9.311897277832031, "global_step": 80510, "epoch": 479} {"train_loss": -8.917993545532227, "global_step": 80511, "epoch": 479} {"train_loss": -9.140024185180664, "global_step": 80512, "epoch": 479} {"train_loss": -9.099954605102539, "global_step": 80513, "epoch": 479} {"train_loss": -9.247101783752441, "global_step": 80514, "epoch": 479} {"train_loss": -8.959261894226074, "global_step": 80515, "epoch": 479} {"train_loss": -9.29466438293457, "global_step": 80516, "epoch": 479} {"train_loss": -9.023248672485352, "global_step": 80517, "epoch": 479} {"train_loss": -9.102021217346191, "global_step": 80518, "epoch": 479} {"train_loss": -9.44774055480957, "global_step": 80519, "epoch": 479} {"train_loss": -8.977170944213867, "global_step": 80520, "epoch": 479} {"train_loss": -9.219564437866211, "global_step": 80521, "epoch": 479} {"train_loss": -9.252153396606445, "global_step": 80522, "epoch": 479} {"train_loss": -9.347837448120117, "global_step": 80523, "epoch": 479} {"train_loss": -9.02876091003418, "global_step": 80524, "epoch": 479} {"train_loss": -9.176097869873047, "global_step": 80525, "epoch": 479} {"train_loss": -9.340654373168945, "global_step": 80526, "epoch": 479} {"train_loss": -9.118717193603516, "global_step": 80527, "epoch": 479} {"train_loss": -9.257823944091797, "global_step": 80528, "epoch": 479} {"train_loss": -9.477486610412598, "global_step": 80529, "epoch": 479} {"train_loss": -9.116873741149902, "global_step": 80530, "epoch": 479} {"train_loss": -9.485384941101074, "global_step": 80531, "epoch": 479} {"train_loss": -9.092397689819336, "global_step": 80532, "epoch": 479} {"train_loss": -9.345985412597656, "global_step": 80533, "epoch": 479} {"train_loss": -9.21576976776123, "global_step": 80534, "epoch": 479} {"train_loss": -9.3659029006958, "global_step": 80535, "epoch": 479} {"train_loss": -9.120932579040527, "global_step": 80536, "epoch": 479} {"train_loss": -8.929960250854492, "global_step": 80537, "epoch": 479} {"train_loss": -9.123401641845703, "global_step": 80538, "epoch": 479} {"train_loss": -9.410405158996582, "global_step": 80539, "epoch": 479} {"train_loss": -9.339371681213379, "global_step": 80540, "epoch": 479} {"train_loss": -9.362943649291992, "global_step": 80541, "epoch": 479} {"train_loss": -9.244352340698242, "global_step": 80542, "epoch": 479} {"train_loss": -9.23154067993164, "global_step": 80543, "epoch": 479} {"train_loss": -9.257625579833984, "global_step": 80544, "epoch": 479} {"train_loss": -9.310425758361816, "global_step": 80545, "epoch": 479} {"train_loss": -9.348108291625977, "global_step": 80546, "epoch": 479} {"train_loss": -9.121694564819336, "global_step": 80547, "epoch": 479} {"train_loss": -9.052955627441406, "global_step": 80548, "epoch": 479} {"train_loss": -9.231534004211426, "global_step": 80549, "epoch": 479} {"train_loss": -9.17258358001709, "global_step": 80550, "epoch": 479} {"train_loss": -9.100729942321777, "global_step": 80551, "epoch": 479} {"train_loss": -9.284191131591797, "global_step": 80552, "epoch": 479} {"train_loss": -9.274969100952148, "global_step": 80553, "epoch": 479} {"train_loss": -9.2412109375, "global_step": 80554, "epoch": 479} {"train_loss": -9.365837097167969, "global_step": 80555, "epoch": 479} {"train_loss": -9.340460777282715, "global_step": 80556, "epoch": 479} {"train_loss": -9.271368026733398, "global_step": 80557, "epoch": 479} {"train_loss": -9.33525276184082, "global_step": 80558, "epoch": 479} {"train_loss": -9.362634658813477, "global_step": 80559, "epoch": 479} {"train_loss": -9.142969131469727, "global_step": 80560, "epoch": 479} {"train_loss": -9.258161544799805, "global_step": 80561, "epoch": 479} {"train_loss": -9.393264770507812, "global_step": 80562, "epoch": 479} {"train_loss": -9.419618606567383, "global_step": 80563, "epoch": 479} {"train_loss": -9.162712097167969, "global_step": 80564, "epoch": 479} {"train_loss": -9.5033540725708, "global_step": 80565, "epoch": 479} {"train_loss": -8.865592956542969, "global_step": 80566, "epoch": 479} {"train_loss": -9.54289436340332, "global_step": 80567, "epoch": 479} {"train_loss": -8.904626846313477, "global_step": 80568, "epoch": 479} {"train_loss": -8.978777885437012, "global_step": 80569, "epoch": 479} {"train_loss": -9.436208724975586, "global_step": 80570, "epoch": 479} {"train_loss": -9.127825736999512, "global_step": 80571, "epoch": 479} {"train_loss": -9.355023384094238, "global_step": 80572, "epoch": 479} {"train_loss": -9.066398620605469, "global_step": 80573, "epoch": 479} {"train_loss": -9.190473556518555, "global_step": 80574, "epoch": 479} {"train_loss": -9.233168601989746, "global_step": 80575, "epoch": 479} {"train_loss": -8.913660049438477, "global_step": 80576, "epoch": 479} {"train_loss": -9.278773307800293, "global_step": 80577, "epoch": 479} {"train_loss": -9.222810745239258, "global_step": 80578, "epoch": 479} {"train_loss": -9.207435607910156, "global_step": 80579, "epoch": 479} {"train_loss": -9.241545677185059, "global_step": 80580, "epoch": 479} {"train_loss": -9.390954971313477, "global_step": 80581, "epoch": 479} {"train_loss": -9.530126571655273, "global_step": 80582, "epoch": 479} {"train_loss": -9.292509078979492, "global_step": 80583, "epoch": 479} {"train_loss": -9.248573303222656, "global_step": 80584, "epoch": 479} {"train_loss": -9.151590347290039, "global_step": 80585, "epoch": 479} {"train_loss": -9.292911529541016, "global_step": 80586, "epoch": 479} {"train_loss": -9.12849235534668, "global_step": 80587, "epoch": 479} {"train_loss": -9.293645858764648, "global_step": 80588, "epoch": 479} {"train_loss": -9.282234191894531, "global_step": 80589, "epoch": 479} {"train_loss": -9.225908279418945, "global_step": 80590, "epoch": 479} {"train_loss": -9.2655611038208, "global_step": 80591, "epoch": 479} {"train_loss": -9.296646118164062, "global_step": 80592, "epoch": 479} {"train_loss": -9.137554168701172, "global_step": 80593, "epoch": 479} {"train_loss": -9.137619972229004, "global_step": 80594, "epoch": 479} {"train_loss": -8.899246215820312, "global_step": 80595, "epoch": 479} {"train_loss": -9.220006942749023, "global_step": 80596, "epoch": 479} {"train_loss": -8.921174049377441, "global_step": 80597, "epoch": 479} {"train_loss": -9.333311080932617, "global_step": 80598, "epoch": 479} {"train_loss": -9.217849731445312, "global_step": 80599, "epoch": 479} {"train_loss": -8.922012329101562, "global_step": 80600, "epoch": 479} {"train_loss": -9.184551239013672, "global_step": 80601, "epoch": 479} {"train_loss": -9.193111419677734, "global_step": 80602, "epoch": 479} {"train_loss": -9.069738388061523, "global_step": 80603, "epoch": 479} {"train_loss": -8.910964012145996, "global_step": 80604, "epoch": 479} {"train_loss": -9.398807525634766, "global_step": 80605, "epoch": 479} {"train_loss": -8.897697448730469, "global_step": 80606, "epoch": 479} {"train_loss": -9.292015075683594, "global_step": 80607, "epoch": 479} {"train_loss": -9.231672286987305, "global_step": 80608, "epoch": 479} {"train_loss": -9.019474029541016, "global_step": 80609, "epoch": 479} {"train_loss": -9.281743049621582, "global_step": 80610, "epoch": 479} {"train_loss": -8.83351993560791, "global_step": 80611, "epoch": 479} {"train_loss": -9.458002090454102, "global_step": 80612, "epoch": 479} {"train_loss": -9.024991989135742, "global_step": 80613, "epoch": 479} {"train_loss": -9.301265716552734, "global_step": 80614, "epoch": 479} {"train_loss": -9.226847648620605, "global_step": 80615, "epoch": 479} {"train_loss": -8.98373794555664, "global_step": 80616, "epoch": 479} {"train_loss": -8.988082885742188, "global_step": 80617, "epoch": 479} {"train_loss": -9.301226615905762, "global_step": 80618, "epoch": 479} {"train_loss": -9.106646537780762, "global_step": 80619, "epoch": 479} {"train_loss": -9.176584243774414, "global_step": 80620, "epoch": 479} {"train_loss": -9.144360542297363, "global_step": 80621, "epoch": 479} {"train_loss": -9.195517539978027, "global_step": 80622, "epoch": 479} {"train_loss": -9.217074394226074, "global_step": 80623, "epoch": 479} {"train_loss": -9.202901840209961, "global_step": 80624, "epoch": 479} {"train_loss": -9.07557487487793, "global_step": 80625, "epoch": 479} {"train_loss": -9.074201583862305, "global_step": 80626, "epoch": 479} {"train_loss": -9.486651420593262, "global_step": 80627, "epoch": 479} {"train_loss": -9.378168106079102, "global_step": 80628, "epoch": 479} {"train_loss": -9.203208923339844, "global_step": 80629, "epoch": 479} {"train_loss": -9.177786827087402, "global_step": 80630, "epoch": 479} {"train_loss": -9.141545295715332, "global_step": 80631, "epoch": 479} {"train_loss": -9.083381652832031, "global_step": 80632, "epoch": 479} {"train_loss": -8.795515060424805, "global_step": 80633, "epoch": 479} {"train_loss": -8.872343063354492, "global_step": 80634, "epoch": 479} {"train_loss": -8.923742294311523, "global_step": 80635, "epoch": 479} {"train_loss": -9.041910171508789, "global_step": 80636, "epoch": 479} {"train_loss": -8.987176895141602, "global_step": 80637, "epoch": 479} {"train_loss": -8.818441390991211, "global_step": 80638, "epoch": 479} {"train_loss": -9.15839493842352, "global_step": 80639, "epoch": 479, "val_loss": 198118.296875} {"train_loss": -8.817569732666016, "global_step": 80640, "epoch": 480} {"train_loss": -8.933067321777344, "global_step": 80641, "epoch": 480} {"train_loss": -8.705448150634766, "global_step": 80642, "epoch": 480} {"train_loss": -8.808612823486328, "global_step": 80643, "epoch": 480} {"train_loss": -8.721357345581055, "global_step": 80644, "epoch": 480} {"train_loss": -8.989606857299805, "global_step": 80645, "epoch": 480} {"train_loss": -8.595135688781738, "global_step": 80646, "epoch": 480} {"train_loss": -9.045710563659668, "global_step": 80647, "epoch": 480} {"train_loss": -8.840259552001953, "global_step": 80648, "epoch": 480} {"train_loss": -8.857297897338867, "global_step": 80649, "epoch": 480} {"train_loss": -8.759051322937012, "global_step": 80650, "epoch": 480} {"train_loss": -8.794361114501953, "global_step": 80651, "epoch": 480} {"train_loss": -8.967302322387695, "global_step": 80652, "epoch": 480} {"train_loss": -9.142463684082031, "global_step": 80653, "epoch": 480} {"train_loss": -9.111735343933105, "global_step": 80654, "epoch": 480} {"train_loss": -8.987576484680176, "global_step": 80655, "epoch": 480} {"train_loss": -9.188667297363281, "global_step": 80656, "epoch": 480} {"train_loss": -8.764913558959961, "global_step": 80657, "epoch": 480} {"train_loss": -9.23022174835205, "global_step": 80658, "epoch": 480} {"train_loss": -8.982357025146484, "global_step": 80659, "epoch": 480} {"train_loss": -9.286340713500977, "global_step": 80660, "epoch": 480} {"train_loss": -9.105794906616211, "global_step": 80661, "epoch": 480} {"train_loss": -9.135231971740723, "global_step": 80662, "epoch": 480} {"train_loss": -9.274532318115234, "global_step": 80663, "epoch": 480} {"train_loss": -9.17495346069336, "global_step": 80664, "epoch": 480} {"train_loss": -9.093506813049316, "global_step": 80665, "epoch": 480} {"train_loss": -9.302278518676758, "global_step": 80666, "epoch": 480} {"train_loss": -9.17352294921875, "global_step": 80667, "epoch": 480} {"train_loss": -9.315837860107422, "global_step": 80668, "epoch": 480} {"train_loss": -9.336063385009766, "global_step": 80669, "epoch": 480} {"train_loss": -9.202997207641602, "global_step": 80670, "epoch": 480} {"train_loss": -9.25225830078125, "global_step": 80671, "epoch": 480} {"train_loss": -8.95173454284668, "global_step": 80672, "epoch": 480} {"train_loss": -9.390164375305176, "global_step": 80673, "epoch": 480} {"train_loss": -9.196971893310547, "global_step": 80674, "epoch": 480} {"train_loss": -9.249685287475586, "global_step": 80675, "epoch": 480} {"train_loss": -9.276999473571777, "global_step": 80676, "epoch": 480} {"train_loss": -9.260335922241211, "global_step": 80677, "epoch": 480} {"train_loss": -9.259288787841797, "global_step": 80678, "epoch": 480} {"train_loss": -9.07669448852539, "global_step": 80679, "epoch": 480} {"train_loss": -9.411968231201172, "global_step": 80680, "epoch": 480} {"train_loss": -9.307294845581055, "global_step": 80681, "epoch": 480} {"train_loss": -9.329755783081055, "global_step": 80682, "epoch": 480} {"train_loss": -8.993684768676758, "global_step": 80683, "epoch": 480} {"train_loss": -9.387621879577637, "global_step": 80684, "epoch": 480} {"train_loss": -9.371272087097168, "global_step": 80685, "epoch": 480} {"train_loss": -9.11726188659668, "global_step": 80686, "epoch": 480} {"train_loss": -9.271507263183594, "global_step": 80687, "epoch": 480} {"train_loss": -9.303564071655273, "global_step": 80688, "epoch": 480} {"train_loss": -9.396102905273438, "global_step": 80689, "epoch": 480} {"train_loss": -9.325905799865723, "global_step": 80690, "epoch": 480} {"train_loss": -9.28730297088623, "global_step": 80691, "epoch": 480} {"train_loss": -9.329435348510742, "global_step": 80692, "epoch": 480} {"train_loss": -9.359683990478516, "global_step": 80693, "epoch": 480} {"train_loss": -9.43609619140625, "global_step": 80694, "epoch": 480} {"train_loss": -9.415434837341309, "global_step": 80695, "epoch": 480} {"train_loss": -9.074402809143066, "global_step": 80696, "epoch": 480} {"train_loss": -9.303085327148438, "global_step": 80697, "epoch": 480} {"train_loss": -9.323222160339355, "global_step": 80698, "epoch": 480} {"train_loss": -9.232613563537598, "global_step": 80699, "epoch": 480} {"train_loss": -9.373387336730957, "global_step": 80700, "epoch": 480} {"train_loss": -8.959127426147461, "global_step": 80701, "epoch": 480} {"train_loss": -9.419157981872559, "global_step": 80702, "epoch": 480} {"train_loss": -8.909843444824219, "global_step": 80703, "epoch": 480} {"train_loss": -9.39204216003418, "global_step": 80704, "epoch": 480} {"train_loss": -8.968498229980469, "global_step": 80705, "epoch": 480} {"train_loss": -9.219568252563477, "global_step": 80706, "epoch": 480} {"train_loss": -9.117595672607422, "global_step": 80707, "epoch": 480} {"train_loss": -9.418612480163574, "global_step": 80708, "epoch": 480} {"train_loss": -9.17907428741455, "global_step": 80709, "epoch": 480} {"train_loss": -9.341591835021973, "global_step": 80710, "epoch": 480} {"train_loss": -9.335112571716309, "global_step": 80711, "epoch": 480} {"train_loss": -9.42340087890625, "global_step": 80712, "epoch": 480} {"train_loss": -9.393289566040039, "global_step": 80713, "epoch": 480} {"train_loss": -9.4713773727417, "global_step": 80714, "epoch": 480} {"train_loss": -9.37701416015625, "global_step": 80715, "epoch": 480} {"train_loss": -9.415613174438477, "global_step": 80716, "epoch": 480} {"train_loss": -9.427167892456055, "global_step": 80717, "epoch": 480} {"train_loss": -9.481073379516602, "global_step": 80718, "epoch": 480} {"train_loss": -9.36888313293457, "global_step": 80719, "epoch": 480} {"train_loss": -8.925151824951172, "global_step": 80720, "epoch": 480} {"train_loss": -9.195425987243652, "global_step": 80721, "epoch": 480} {"train_loss": -9.164480209350586, "global_step": 80722, "epoch": 480} {"train_loss": -9.002710342407227, "global_step": 80723, "epoch": 480} {"train_loss": -9.196603775024414, "global_step": 80724, "epoch": 480} {"train_loss": -9.08469295501709, "global_step": 80725, "epoch": 480} {"train_loss": -9.402118682861328, "global_step": 80726, "epoch": 480} {"train_loss": -9.467679023742676, "global_step": 80727, "epoch": 480} {"train_loss": -9.28376293182373, "global_step": 80728, "epoch": 480} {"train_loss": -9.13477897644043, "global_step": 80729, "epoch": 480} {"train_loss": -9.310212135314941, "global_step": 80730, "epoch": 480} {"train_loss": -9.022717475891113, "global_step": 80731, "epoch": 480} {"train_loss": -9.144861221313477, "global_step": 80732, "epoch": 480} {"train_loss": -9.222475051879883, "global_step": 80733, "epoch": 480} {"train_loss": -9.318349838256836, "global_step": 80734, "epoch": 480} {"train_loss": -9.225590705871582, "global_step": 80735, "epoch": 480} {"train_loss": -9.095465660095215, "global_step": 80736, "epoch": 480} {"train_loss": -9.13118839263916, "global_step": 80737, "epoch": 480} {"train_loss": -9.316193580627441, "global_step": 80738, "epoch": 480} {"train_loss": -9.348457336425781, "global_step": 80739, "epoch": 480} {"train_loss": -9.364684104919434, "global_step": 80740, "epoch": 480} {"train_loss": -9.386810302734375, "global_step": 80741, "epoch": 480} {"train_loss": -9.294471740722656, "global_step": 80742, "epoch": 480} {"train_loss": -9.50505256652832, "global_step": 80743, "epoch": 480} {"train_loss": -9.090893745422363, "global_step": 80744, "epoch": 480} {"train_loss": -9.130413055419922, "global_step": 80745, "epoch": 480} {"train_loss": -9.394527435302734, "global_step": 80746, "epoch": 480} {"train_loss": -9.326789855957031, "global_step": 80747, "epoch": 480} {"train_loss": -9.285533905029297, "global_step": 80748, "epoch": 480} {"train_loss": -9.201214790344238, "global_step": 80749, "epoch": 480} {"train_loss": -9.353418350219727, "global_step": 80750, "epoch": 480} {"train_loss": -9.013028144836426, "global_step": 80751, "epoch": 480} {"train_loss": -9.020490646362305, "global_step": 80752, "epoch": 480} {"train_loss": -9.409028053283691, "global_step": 80753, "epoch": 480} {"train_loss": -8.976311683654785, "global_step": 80754, "epoch": 480} {"train_loss": -9.42503547668457, "global_step": 80755, "epoch": 480} {"train_loss": -8.921709060668945, "global_step": 80756, "epoch": 480} {"train_loss": -9.179433822631836, "global_step": 80757, "epoch": 480} {"train_loss": -9.316397666931152, "global_step": 80758, "epoch": 480} {"train_loss": -9.186197280883789, "global_step": 80759, "epoch": 480} {"train_loss": -9.163514137268066, "global_step": 80760, "epoch": 480} {"train_loss": -9.219703674316406, "global_step": 80761, "epoch": 480} {"train_loss": -9.236007690429688, "global_step": 80762, "epoch": 480} {"train_loss": -9.101019859313965, "global_step": 80763, "epoch": 480} {"train_loss": -9.217752456665039, "global_step": 80764, "epoch": 480} {"train_loss": -9.309154510498047, "global_step": 80765, "epoch": 480} {"train_loss": -9.341123580932617, "global_step": 80766, "epoch": 480} {"train_loss": -9.441446304321289, "global_step": 80767, "epoch": 480} {"train_loss": -9.405097961425781, "global_step": 80768, "epoch": 480} {"train_loss": -9.362770080566406, "global_step": 80769, "epoch": 480} {"train_loss": -9.010652542114258, "global_step": 80770, "epoch": 480} {"train_loss": -9.34079360961914, "global_step": 80771, "epoch": 480} {"train_loss": -9.370956420898438, "global_step": 80772, "epoch": 480} {"train_loss": -8.794681549072266, "global_step": 80773, "epoch": 480} {"train_loss": -9.274785995483398, "global_step": 80774, "epoch": 480} {"train_loss": -9.209454536437988, "global_step": 80775, "epoch": 480} {"train_loss": -9.36882209777832, "global_step": 80776, "epoch": 480} {"train_loss": -9.394247055053711, "global_step": 80777, "epoch": 480} {"train_loss": -9.014691352844238, "global_step": 80778, "epoch": 480} {"train_loss": -9.230013847351074, "global_step": 80779, "epoch": 480} {"train_loss": -9.144572257995605, "global_step": 80780, "epoch": 480} {"train_loss": -9.386819839477539, "global_step": 80781, "epoch": 480} {"train_loss": -9.264249801635742, "global_step": 80782, "epoch": 480} {"train_loss": -9.1497220993042, "global_step": 80783, "epoch": 480} {"train_loss": -9.197649002075195, "global_step": 80784, "epoch": 480} {"train_loss": -9.006240844726562, "global_step": 80785, "epoch": 480} {"train_loss": -8.709641456604004, "global_step": 80786, "epoch": 480} {"train_loss": -9.187824249267578, "global_step": 80787, "epoch": 480} {"train_loss": -8.877962112426758, "global_step": 80788, "epoch": 480} {"train_loss": -9.025175094604492, "global_step": 80789, "epoch": 480} {"train_loss": -9.185824394226074, "global_step": 80790, "epoch": 480} {"train_loss": -8.7911376953125, "global_step": 80791, "epoch": 480} {"train_loss": -9.018254280090332, "global_step": 80792, "epoch": 480} {"train_loss": -8.912571907043457, "global_step": 80793, "epoch": 480} {"train_loss": -8.999046325683594, "global_step": 80794, "epoch": 480} {"train_loss": -8.814421653747559, "global_step": 80795, "epoch": 480} {"train_loss": -8.962738037109375, "global_step": 80796, "epoch": 480} {"train_loss": -8.917072296142578, "global_step": 80797, "epoch": 480} {"train_loss": -9.087808609008789, "global_step": 80798, "epoch": 480} {"train_loss": -9.067207336425781, "global_step": 80799, "epoch": 480} {"train_loss": -9.127372741699219, "global_step": 80800, "epoch": 480} {"train_loss": -9.001554489135742, "global_step": 80801, "epoch": 480} {"train_loss": -9.103202819824219, "global_step": 80802, "epoch": 480} {"train_loss": -9.16964340209961, "global_step": 80803, "epoch": 480} {"train_loss": -9.21921157836914, "global_step": 80804, "epoch": 480} {"train_loss": -9.02212905883789, "global_step": 80805, "epoch": 480} {"train_loss": -9.01052474975586, "global_step": 80806, "epoch": 480} {"train_loss": -9.175221477236066, "global_step": 80807, "epoch": 480, "val_loss": 198134.28125, "train_action_mse_error": 1.5607093572616577} {"train_loss": -9.234382629394531, "global_step": 80808, "epoch": 481} {"train_loss": -9.243413925170898, "global_step": 80809, "epoch": 481} {"train_loss": -9.311193466186523, "global_step": 80810, "epoch": 481} {"train_loss": -9.34799575805664, "global_step": 80811, "epoch": 481} {"train_loss": -9.126119613647461, "global_step": 80812, "epoch": 481} {"train_loss": -9.152754783630371, "global_step": 80813, "epoch": 481} {"train_loss": -9.223855018615723, "global_step": 80814, "epoch": 481} {"train_loss": -8.956901550292969, "global_step": 80815, "epoch": 481} {"train_loss": -9.466535568237305, "global_step": 80816, "epoch": 481} {"train_loss": -9.088059425354004, "global_step": 80817, "epoch": 481} {"train_loss": -9.181337356567383, "global_step": 80818, "epoch": 481} {"train_loss": -9.122297286987305, "global_step": 80819, "epoch": 481} {"train_loss": -9.382652282714844, "global_step": 80820, "epoch": 481} {"train_loss": -9.278468132019043, "global_step": 80821, "epoch": 481} {"train_loss": -9.268416404724121, "global_step": 80822, "epoch": 481} {"train_loss": -9.424579620361328, "global_step": 80823, "epoch": 481} {"train_loss": -9.24841594696045, "global_step": 80824, "epoch": 481} {"train_loss": -9.456220626831055, "global_step": 80825, "epoch": 481} {"train_loss": -9.235347747802734, "global_step": 80826, "epoch": 481} {"train_loss": -9.2670259475708, "global_step": 80827, "epoch": 481} {"train_loss": -9.181958198547363, "global_step": 80828, "epoch": 481} {"train_loss": -9.257160186767578, "global_step": 80829, "epoch": 481} {"train_loss": -9.27360725402832, "global_step": 80830, "epoch": 481} {"train_loss": -8.932331085205078, "global_step": 80831, "epoch": 481} {"train_loss": -8.980611801147461, "global_step": 80832, "epoch": 481} {"train_loss": -9.185611724853516, "global_step": 80833, "epoch": 481} {"train_loss": -8.913694381713867, "global_step": 80834, "epoch": 481} {"train_loss": -9.07377815246582, "global_step": 80835, "epoch": 481} {"train_loss": -8.868911743164062, "global_step": 80836, "epoch": 481} {"train_loss": -9.204333305358887, "global_step": 80837, "epoch": 481} {"train_loss": -8.905564308166504, "global_step": 80838, "epoch": 481} {"train_loss": -9.025224685668945, "global_step": 80839, "epoch": 481} {"train_loss": -8.669947624206543, "global_step": 80840, "epoch": 481} {"train_loss": -9.029184341430664, "global_step": 80841, "epoch": 481} {"train_loss": -8.815679550170898, "global_step": 80842, "epoch": 481} {"train_loss": -8.951530456542969, "global_step": 80843, "epoch": 481} {"train_loss": -8.614866256713867, "global_step": 80844, "epoch": 481} {"train_loss": -9.048343658447266, "global_step": 80845, "epoch": 481} {"train_loss": -9.118589401245117, "global_step": 80846, "epoch": 481} {"train_loss": -8.807608604431152, "global_step": 80847, "epoch": 481} {"train_loss": -8.91134262084961, "global_step": 80848, "epoch": 481} {"train_loss": -9.13789176940918, "global_step": 80849, "epoch": 481} {"train_loss": -9.105327606201172, "global_step": 80850, "epoch": 481} {"train_loss": -9.033350944519043, "global_step": 80851, "epoch": 481} {"train_loss": -9.220148086547852, "global_step": 80852, "epoch": 481} {"train_loss": -9.292000770568848, "global_step": 80853, "epoch": 481} {"train_loss": -8.969942092895508, "global_step": 80854, "epoch": 481} {"train_loss": -9.166349411010742, "global_step": 80855, "epoch": 481} {"train_loss": -9.197351455688477, "global_step": 80856, "epoch": 481} {"train_loss": -8.926618576049805, "global_step": 80857, "epoch": 481} {"train_loss": -9.206047058105469, "global_step": 80858, "epoch": 481} {"train_loss": -8.96937370300293, "global_step": 80859, "epoch": 481} {"train_loss": -9.042425155639648, "global_step": 80860, "epoch": 481} {"train_loss": -9.239648818969727, "global_step": 80861, "epoch": 481} {"train_loss": -9.310928344726562, "global_step": 80862, "epoch": 481} {"train_loss": -9.186971664428711, "global_step": 80863, "epoch": 481} {"train_loss": -9.216114044189453, "global_step": 80864, "epoch": 481} {"train_loss": -9.195085525512695, "global_step": 80865, "epoch": 481} {"train_loss": -9.427556991577148, "global_step": 80866, "epoch": 481} {"train_loss": -9.242029190063477, "global_step": 80867, "epoch": 481} {"train_loss": -9.372031211853027, "global_step": 80868, "epoch": 481} {"train_loss": -9.353845596313477, "global_step": 80869, "epoch": 481} {"train_loss": -9.117271423339844, "global_step": 80870, "epoch": 481} {"train_loss": -9.182928085327148, "global_step": 80871, "epoch": 481} {"train_loss": -9.413467407226562, "global_step": 80872, "epoch": 481} {"train_loss": -9.176834106445312, "global_step": 80873, "epoch": 481} {"train_loss": -9.513050079345703, "global_step": 80874, "epoch": 481} {"train_loss": -9.366836547851562, "global_step": 80875, "epoch": 481} {"train_loss": -9.250604629516602, "global_step": 80876, "epoch": 481} {"train_loss": -9.483794212341309, "global_step": 80877, "epoch": 481} {"train_loss": -9.413497924804688, "global_step": 80878, "epoch": 481} {"train_loss": -9.089763641357422, "global_step": 80879, "epoch": 481} {"train_loss": -9.212838172912598, "global_step": 80880, "epoch": 481} {"train_loss": -9.122676849365234, "global_step": 80881, "epoch": 481} {"train_loss": -9.3820219039917, "global_step": 80882, "epoch": 481} {"train_loss": -9.244829177856445, "global_step": 80883, "epoch": 481} {"train_loss": -9.286189079284668, "global_step": 80884, "epoch": 481} {"train_loss": -9.449268341064453, "global_step": 80885, "epoch": 481} {"train_loss": -9.377351760864258, "global_step": 80886, "epoch": 481} {"train_loss": -9.42890453338623, "global_step": 80887, "epoch": 481} {"train_loss": -9.224510192871094, "global_step": 80888, "epoch": 481} {"train_loss": -9.093321800231934, "global_step": 80889, "epoch": 481} {"train_loss": -9.003486633300781, "global_step": 80890, "epoch": 481} {"train_loss": -8.831684112548828, "global_step": 80891, "epoch": 481} {"train_loss": -9.046821594238281, "global_step": 80892, "epoch": 481} {"train_loss": -9.151668548583984, "global_step": 80893, "epoch": 481} {"train_loss": -9.188539505004883, "global_step": 80894, "epoch": 481} {"train_loss": -8.813036918640137, "global_step": 80895, "epoch": 481} {"train_loss": -8.824689865112305, "global_step": 80896, "epoch": 481} {"train_loss": -8.750248908996582, "global_step": 80897, "epoch": 481} {"train_loss": -8.811473846435547, "global_step": 80898, "epoch": 481} {"train_loss": -9.332103729248047, "global_step": 80899, "epoch": 481} {"train_loss": -9.04857063293457, "global_step": 80900, "epoch": 481} {"train_loss": -8.824654579162598, "global_step": 80901, "epoch": 481} {"train_loss": -9.177117347717285, "global_step": 80902, "epoch": 481} {"train_loss": -8.843676567077637, "global_step": 80903, "epoch": 481} {"train_loss": -8.859582901000977, "global_step": 80904, "epoch": 481} {"train_loss": -8.994505882263184, "global_step": 80905, "epoch": 481} {"train_loss": -9.19074821472168, "global_step": 80906, "epoch": 481} {"train_loss": -8.94997787475586, "global_step": 80907, "epoch": 481} {"train_loss": -9.22642707824707, "global_step": 80908, "epoch": 481} {"train_loss": -9.17587661743164, "global_step": 80909, "epoch": 481} {"train_loss": -8.866962432861328, "global_step": 80910, "epoch": 481} {"train_loss": -9.224231719970703, "global_step": 80911, "epoch": 481} {"train_loss": -9.209173202514648, "global_step": 80912, "epoch": 481} {"train_loss": -9.070103645324707, "global_step": 80913, "epoch": 481} {"train_loss": -9.096436500549316, "global_step": 80914, "epoch": 481} {"train_loss": -9.278383255004883, "global_step": 80915, "epoch": 481} {"train_loss": -9.01324462890625, "global_step": 80916, "epoch": 481} {"train_loss": -9.221992492675781, "global_step": 80917, "epoch": 481} {"train_loss": -9.04319953918457, "global_step": 80918, "epoch": 481} {"train_loss": -9.358610153198242, "global_step": 80919, "epoch": 481} {"train_loss": -8.985151290893555, "global_step": 80920, "epoch": 481} {"train_loss": -9.18110179901123, "global_step": 80921, "epoch": 481} {"train_loss": -9.256629943847656, "global_step": 80922, "epoch": 481} {"train_loss": -9.354753494262695, "global_step": 80923, "epoch": 481} {"train_loss": -9.289368629455566, "global_step": 80924, "epoch": 481} {"train_loss": -8.954215049743652, "global_step": 80925, "epoch": 481} {"train_loss": -9.328161239624023, "global_step": 80926, "epoch": 481} {"train_loss": -8.880732536315918, "global_step": 80927, "epoch": 481} {"train_loss": -9.3035306930542, "global_step": 80928, "epoch": 481} {"train_loss": -8.918502807617188, "global_step": 80929, "epoch": 481} {"train_loss": -9.274130821228027, "global_step": 80930, "epoch": 481} {"train_loss": -8.958013534545898, "global_step": 80931, "epoch": 481} {"train_loss": -9.134468078613281, "global_step": 80932, "epoch": 481} {"train_loss": -9.04611587524414, "global_step": 80933, "epoch": 481} {"train_loss": -9.331247329711914, "global_step": 80934, "epoch": 481} {"train_loss": -9.33065128326416, "global_step": 80935, "epoch": 481} {"train_loss": -9.25575065612793, "global_step": 80936, "epoch": 481} {"train_loss": -9.242111206054688, "global_step": 80937, "epoch": 481} {"train_loss": -9.253026962280273, "global_step": 80938, "epoch": 481} {"train_loss": -9.137430191040039, "global_step": 80939, "epoch": 481} {"train_loss": -9.228720664978027, "global_step": 80940, "epoch": 481} {"train_loss": -9.213296890258789, "global_step": 80941, "epoch": 481} {"train_loss": -9.373947143554688, "global_step": 80942, "epoch": 481} {"train_loss": -9.459973335266113, "global_step": 80943, "epoch": 481} {"train_loss": -9.293365478515625, "global_step": 80944, "epoch": 481} {"train_loss": -9.316648483276367, "global_step": 80945, "epoch": 481} {"train_loss": -9.347925186157227, "global_step": 80946, "epoch": 481} {"train_loss": -9.024518013000488, "global_step": 80947, "epoch": 481} {"train_loss": -9.135162353515625, "global_step": 80948, "epoch": 481} {"train_loss": -9.174720764160156, "global_step": 80949, "epoch": 481} {"train_loss": -9.421035766601562, "global_step": 80950, "epoch": 481} {"train_loss": -9.295589447021484, "global_step": 80951, "epoch": 481} {"train_loss": -9.031807899475098, "global_step": 80952, "epoch": 481} {"train_loss": -9.216304779052734, "global_step": 80953, "epoch": 481} {"train_loss": -9.204018592834473, "global_step": 80954, "epoch": 481} {"train_loss": -9.22572135925293, "global_step": 80955, "epoch": 481} {"train_loss": -9.06832504272461, "global_step": 80956, "epoch": 481} {"train_loss": -9.377067565917969, "global_step": 80957, "epoch": 481} {"train_loss": -9.290868759155273, "global_step": 80958, "epoch": 481} {"train_loss": -9.107280731201172, "global_step": 80959, "epoch": 481} {"train_loss": -9.141789436340332, "global_step": 80960, "epoch": 481} {"train_loss": -9.207860946655273, "global_step": 80961, "epoch": 481} {"train_loss": -9.376307487487793, "global_step": 80962, "epoch": 481} {"train_loss": -9.384908676147461, "global_step": 80963, "epoch": 481} {"train_loss": -9.13481330871582, "global_step": 80964, "epoch": 481} {"train_loss": -9.225603103637695, "global_step": 80965, "epoch": 481} {"train_loss": -9.140670776367188, "global_step": 80966, "epoch": 481} {"train_loss": -9.024556159973145, "global_step": 80967, "epoch": 481} {"train_loss": -9.130342483520508, "global_step": 80968, "epoch": 481} {"train_loss": -8.999853134155273, "global_step": 80969, "epoch": 481} {"train_loss": -9.028775215148926, "global_step": 80970, "epoch": 481} {"train_loss": -9.192329406738281, "global_step": 80971, "epoch": 481} {"train_loss": -9.067800521850586, "global_step": 80972, "epoch": 481} {"train_loss": -8.845048904418945, "global_step": 80973, "epoch": 481} {"train_loss": -9.083223342895508, "global_step": 80974, "epoch": 481} {"train_loss": -9.156679073969523, "global_step": 80975, "epoch": 481, "val_loss": 198259.109375} {"train_loss": -9.003454208374023, "global_step": 80976, "epoch": 482} {"train_loss": -9.158130645751953, "global_step": 80977, "epoch": 482} {"train_loss": -9.338432312011719, "global_step": 80978, "epoch": 482} {"train_loss": -9.180169105529785, "global_step": 80979, "epoch": 482} {"train_loss": -9.151975631713867, "global_step": 80980, "epoch": 482} {"train_loss": -9.023979187011719, "global_step": 80981, "epoch": 482} {"train_loss": -9.20096206665039, "global_step": 80982, "epoch": 482} {"train_loss": -9.054632186889648, "global_step": 80983, "epoch": 482} {"train_loss": -9.422937393188477, "global_step": 80984, "epoch": 482} {"train_loss": -9.160059928894043, "global_step": 80985, "epoch": 482} {"train_loss": -9.354452133178711, "global_step": 80986, "epoch": 482} {"train_loss": -9.327897071838379, "global_step": 80987, "epoch": 482} {"train_loss": -9.244178771972656, "global_step": 80988, "epoch": 482} {"train_loss": -9.272590637207031, "global_step": 80989, "epoch": 482} {"train_loss": -9.422418594360352, "global_step": 80990, "epoch": 482} {"train_loss": -9.12798023223877, "global_step": 80991, "epoch": 482} {"train_loss": -9.205556869506836, "global_step": 80992, "epoch": 482} {"train_loss": -9.324077606201172, "global_step": 80993, "epoch": 482} {"train_loss": -9.339303016662598, "global_step": 80994, "epoch": 482} {"train_loss": -9.345681190490723, "global_step": 80995, "epoch": 482} {"train_loss": -9.464225769042969, "global_step": 80996, "epoch": 482} {"train_loss": -9.345226287841797, "global_step": 80997, "epoch": 482} {"train_loss": -9.357528686523438, "global_step": 80998, "epoch": 482} {"train_loss": -9.36784553527832, "global_step": 80999, "epoch": 482} {"train_loss": -9.4695463180542, "global_step": 81000, "epoch": 482} {"train_loss": -9.013223648071289, "global_step": 81001, "epoch": 482} {"train_loss": -9.339592933654785, "global_step": 81002, "epoch": 482} {"train_loss": -8.889543533325195, "global_step": 81003, "epoch": 482} {"train_loss": -9.179765701293945, "global_step": 81004, "epoch": 482} {"train_loss": -9.163844108581543, "global_step": 81005, "epoch": 482} {"train_loss": -9.052138328552246, "global_step": 81006, "epoch": 482} {"train_loss": -9.320058822631836, "global_step": 81007, "epoch": 482} {"train_loss": -9.137454986572266, "global_step": 81008, "epoch": 482} {"train_loss": -9.049948692321777, "global_step": 81009, "epoch": 482} {"train_loss": -9.004478454589844, "global_step": 81010, "epoch": 482} {"train_loss": -9.41817569732666, "global_step": 81011, "epoch": 482} {"train_loss": -9.202850341796875, "global_step": 81012, "epoch": 482} {"train_loss": -9.463217735290527, "global_step": 81013, "epoch": 482} {"train_loss": -9.088666915893555, "global_step": 81014, "epoch": 482} {"train_loss": -9.267999649047852, "global_step": 81015, "epoch": 482} {"train_loss": -8.794939041137695, "global_step": 81016, "epoch": 482} {"train_loss": -9.210323333740234, "global_step": 81017, "epoch": 482} {"train_loss": -8.686040878295898, "global_step": 81018, "epoch": 482} {"train_loss": -9.160723686218262, "global_step": 81019, "epoch": 482} {"train_loss": -9.08974838256836, "global_step": 81020, "epoch": 482} {"train_loss": -9.218555450439453, "global_step": 81021, "epoch": 482} {"train_loss": -9.26597785949707, "global_step": 81022, "epoch": 482} {"train_loss": -9.265485763549805, "global_step": 81023, "epoch": 482} {"train_loss": -9.208881378173828, "global_step": 81024, "epoch": 482} {"train_loss": -9.20582103729248, "global_step": 81025, "epoch": 482} {"train_loss": -9.347875595092773, "global_step": 81026, "epoch": 482} {"train_loss": -9.295027732849121, "global_step": 81027, "epoch": 482} {"train_loss": -8.919952392578125, "global_step": 81028, "epoch": 482} {"train_loss": -8.936155319213867, "global_step": 81029, "epoch": 482} {"train_loss": -9.213096618652344, "global_step": 81030, "epoch": 482} {"train_loss": -9.34830093383789, "global_step": 81031, "epoch": 482} {"train_loss": -9.125190734863281, "global_step": 81032, "epoch": 482} {"train_loss": -9.295380592346191, "global_step": 81033, "epoch": 482} {"train_loss": -9.464065551757812, "global_step": 81034, "epoch": 482} {"train_loss": -9.125571250915527, "global_step": 81035, "epoch": 482} {"train_loss": -9.355013847351074, "global_step": 81036, "epoch": 482} {"train_loss": -9.28565788269043, "global_step": 81037, "epoch": 482} {"train_loss": -9.357906341552734, "global_step": 81038, "epoch": 482} {"train_loss": -9.278867721557617, "global_step": 81039, "epoch": 482} {"train_loss": -9.374923706054688, "global_step": 81040, "epoch": 482} {"train_loss": -9.159732818603516, "global_step": 81041, "epoch": 482} {"train_loss": -9.448335647583008, "global_step": 81042, "epoch": 482} {"train_loss": -9.314682006835938, "global_step": 81043, "epoch": 482} {"train_loss": -9.349020004272461, "global_step": 81044, "epoch": 482} {"train_loss": -9.654800415039062, "global_step": 81045, "epoch": 482} {"train_loss": -9.239089965820312, "global_step": 81046, "epoch": 482} {"train_loss": -9.596200942993164, "global_step": 81047, "epoch": 482} {"train_loss": -9.598488807678223, "global_step": 81048, "epoch": 482} {"train_loss": -9.500815391540527, "global_step": 81049, "epoch": 482} {"train_loss": -9.47768783569336, "global_step": 81050, "epoch": 482} {"train_loss": -9.360044479370117, "global_step": 81051, "epoch": 482} {"train_loss": -9.430171966552734, "global_step": 81052, "epoch": 482} {"train_loss": -9.407540321350098, "global_step": 81053, "epoch": 482} {"train_loss": -9.322309494018555, "global_step": 81054, "epoch": 482} {"train_loss": -9.463443756103516, "global_step": 81055, "epoch": 482} {"train_loss": -9.462040901184082, "global_step": 81056, "epoch": 482} {"train_loss": -9.298243522644043, "global_step": 81057, "epoch": 482} {"train_loss": -9.384678840637207, "global_step": 81058, "epoch": 482} {"train_loss": -9.31271743774414, "global_step": 81059, "epoch": 482} {"train_loss": -9.46187973022461, "global_step": 81060, "epoch": 482} {"train_loss": -9.312153816223145, "global_step": 81061, "epoch": 482} {"train_loss": -9.301401138305664, "global_step": 81062, "epoch": 482} {"train_loss": -9.404194831848145, "global_step": 81063, "epoch": 482} {"train_loss": -9.21435260772705, "global_step": 81064, "epoch": 482} {"train_loss": -9.365137100219727, "global_step": 81065, "epoch": 482} {"train_loss": -9.353010177612305, "global_step": 81066, "epoch": 482} {"train_loss": -9.232341766357422, "global_step": 81067, "epoch": 482} {"train_loss": -9.455291748046875, "global_step": 81068, "epoch": 482} {"train_loss": -9.162891387939453, "global_step": 81069, "epoch": 482} {"train_loss": -8.940829277038574, "global_step": 81070, "epoch": 482} {"train_loss": -9.14265251159668, "global_step": 81071, "epoch": 482} {"train_loss": -9.165185928344727, "global_step": 81072, "epoch": 482} {"train_loss": -9.076654434204102, "global_step": 81073, "epoch": 482} {"train_loss": -9.050050735473633, "global_step": 81074, "epoch": 482} {"train_loss": -9.27010726928711, "global_step": 81075, "epoch": 482} {"train_loss": -8.96655559539795, "global_step": 81076, "epoch": 482} {"train_loss": -9.357770919799805, "global_step": 81077, "epoch": 482} {"train_loss": -9.215239524841309, "global_step": 81078, "epoch": 482} {"train_loss": -9.201568603515625, "global_step": 81079, "epoch": 482} {"train_loss": -9.326062202453613, "global_step": 81080, "epoch": 482} {"train_loss": -9.064658164978027, "global_step": 81081, "epoch": 482} {"train_loss": -9.576056480407715, "global_step": 81082, "epoch": 482} {"train_loss": -8.904129028320312, "global_step": 81083, "epoch": 482} {"train_loss": -9.09865951538086, "global_step": 81084, "epoch": 482} {"train_loss": -9.373651504516602, "global_step": 81085, "epoch": 482} {"train_loss": -9.118440628051758, "global_step": 81086, "epoch": 482} {"train_loss": -9.238991737365723, "global_step": 81087, "epoch": 482} {"train_loss": -9.336017608642578, "global_step": 81088, "epoch": 482} {"train_loss": -9.269535064697266, "global_step": 81089, "epoch": 482} {"train_loss": -9.476432800292969, "global_step": 81090, "epoch": 482} {"train_loss": -9.332881927490234, "global_step": 81091, "epoch": 482} {"train_loss": -9.262309074401855, "global_step": 81092, "epoch": 482} {"train_loss": -9.361324310302734, "global_step": 81093, "epoch": 482} {"train_loss": -9.40379524230957, "global_step": 81094, "epoch": 482} {"train_loss": -9.240836143493652, "global_step": 81095, "epoch": 482} {"train_loss": -9.295890808105469, "global_step": 81096, "epoch": 482} {"train_loss": -9.176226615905762, "global_step": 81097, "epoch": 482} {"train_loss": -9.1934814453125, "global_step": 81098, "epoch": 482} {"train_loss": -9.484389305114746, "global_step": 81099, "epoch": 482} {"train_loss": -9.390646934509277, "global_step": 81100, "epoch": 482} {"train_loss": -9.190640449523926, "global_step": 81101, "epoch": 482} {"train_loss": -9.561415672302246, "global_step": 81102, "epoch": 482} {"train_loss": -9.158952713012695, "global_step": 81103, "epoch": 482} {"train_loss": -9.322072982788086, "global_step": 81104, "epoch": 482} {"train_loss": -8.903444290161133, "global_step": 81105, "epoch": 482} {"train_loss": -9.126256942749023, "global_step": 81106, "epoch": 482} {"train_loss": -9.216265678405762, "global_step": 81107, "epoch": 482} {"train_loss": -9.161054611206055, "global_step": 81108, "epoch": 482} {"train_loss": -9.266046524047852, "global_step": 81109, "epoch": 482} {"train_loss": -9.016273498535156, "global_step": 81110, "epoch": 482} {"train_loss": -9.163469314575195, "global_step": 81111, "epoch": 482} {"train_loss": -8.800699234008789, "global_step": 81112, "epoch": 482} {"train_loss": -9.170574188232422, "global_step": 81113, "epoch": 482} {"train_loss": -9.015571594238281, "global_step": 81114, "epoch": 482} {"train_loss": -9.472867012023926, "global_step": 81115, "epoch": 482} {"train_loss": -8.894648551940918, "global_step": 81116, "epoch": 482} {"train_loss": -8.880781173706055, "global_step": 81117, "epoch": 482} {"train_loss": -9.080377578735352, "global_step": 81118, "epoch": 482} {"train_loss": -9.0222749710083, "global_step": 81119, "epoch": 482} {"train_loss": -8.969789505004883, "global_step": 81120, "epoch": 482} {"train_loss": -9.01954460144043, "global_step": 81121, "epoch": 482} {"train_loss": -9.017913818359375, "global_step": 81122, "epoch": 482} {"train_loss": -9.062414169311523, "global_step": 81123, "epoch": 482} {"train_loss": -9.000351905822754, "global_step": 81124, "epoch": 482} {"train_loss": -9.117837905883789, "global_step": 81125, "epoch": 482} {"train_loss": -9.02999496459961, "global_step": 81126, "epoch": 482} {"train_loss": -9.061795234680176, "global_step": 81127, "epoch": 482} {"train_loss": -9.034409523010254, "global_step": 81128, "epoch": 482} {"train_loss": -9.41922664642334, "global_step": 81129, "epoch": 482} {"train_loss": -8.91795539855957, "global_step": 81130, "epoch": 482} {"train_loss": -8.97700309753418, "global_step": 81131, "epoch": 482} {"train_loss": -9.001790046691895, "global_step": 81132, "epoch": 482} {"train_loss": -9.091839790344238, "global_step": 81133, "epoch": 482} {"train_loss": -8.988632202148438, "global_step": 81134, "epoch": 482} {"train_loss": -9.411993026733398, "global_step": 81135, "epoch": 482} {"train_loss": -9.16429328918457, "global_step": 81136, "epoch": 482} {"train_loss": -9.276755332946777, "global_step": 81137, "epoch": 482} {"train_loss": -9.177568435668945, "global_step": 81138, "epoch": 482} {"train_loss": -9.406792640686035, "global_step": 81139, "epoch": 482} {"train_loss": -9.009665489196777, "global_step": 81140, "epoch": 482} {"train_loss": -9.540048599243164, "global_step": 81141, "epoch": 482} {"train_loss": -9.188871383666992, "global_step": 81142, "epoch": 482} {"train_loss": -9.227189262708029, "global_step": 81143, "epoch": 482, "val_loss": 196442.9375} {"train_loss": -9.022873878479004, "global_step": 81144, "epoch": 483} {"train_loss": -9.27747917175293, "global_step": 81145, "epoch": 483} {"train_loss": -9.076947212219238, "global_step": 81146, "epoch": 483} {"train_loss": -9.217588424682617, "global_step": 81147, "epoch": 483} {"train_loss": -9.187760353088379, "global_step": 81148, "epoch": 483} {"train_loss": -9.320571899414062, "global_step": 81149, "epoch": 483} {"train_loss": -9.36114501953125, "global_step": 81150, "epoch": 483} {"train_loss": -9.421223640441895, "global_step": 81151, "epoch": 483} {"train_loss": -9.21474838256836, "global_step": 81152, "epoch": 483} {"train_loss": -9.317634582519531, "global_step": 81153, "epoch": 483} {"train_loss": -9.161819458007812, "global_step": 81154, "epoch": 483} {"train_loss": -9.304388046264648, "global_step": 81155, "epoch": 483} {"train_loss": -9.397441864013672, "global_step": 81156, "epoch": 483} {"train_loss": -9.528207778930664, "global_step": 81157, "epoch": 483} {"train_loss": -9.297069549560547, "global_step": 81158, "epoch": 483} {"train_loss": -9.176740646362305, "global_step": 81159, "epoch": 483} {"train_loss": -9.20724105834961, "global_step": 81160, "epoch": 483} {"train_loss": -9.347671508789062, "global_step": 81161, "epoch": 483} {"train_loss": -9.28548812866211, "global_step": 81162, "epoch": 483} {"train_loss": -9.118062973022461, "global_step": 81163, "epoch": 483} {"train_loss": -9.146201133728027, "global_step": 81164, "epoch": 483} {"train_loss": -9.1875581741333, "global_step": 81165, "epoch": 483} {"train_loss": -9.110437393188477, "global_step": 81166, "epoch": 483} {"train_loss": -9.369831085205078, "global_step": 81167, "epoch": 483} {"train_loss": -9.225995063781738, "global_step": 81168, "epoch": 483} {"train_loss": -9.225669860839844, "global_step": 81169, "epoch": 483} {"train_loss": -9.530511856079102, "global_step": 81170, "epoch": 483} {"train_loss": -9.219636917114258, "global_step": 81171, "epoch": 483} {"train_loss": -9.220294952392578, "global_step": 81172, "epoch": 483} {"train_loss": -8.913558959960938, "global_step": 81173, "epoch": 483} {"train_loss": -9.254203796386719, "global_step": 81174, "epoch": 483} {"train_loss": -9.343475341796875, "global_step": 81175, "epoch": 483} {"train_loss": -9.297002792358398, "global_step": 81176, "epoch": 483} {"train_loss": -9.38853645324707, "global_step": 81177, "epoch": 483} {"train_loss": -9.476076126098633, "global_step": 81178, "epoch": 483} {"train_loss": -9.373176574707031, "global_step": 81179, "epoch": 483} {"train_loss": -9.258359909057617, "global_step": 81180, "epoch": 483} {"train_loss": -9.265140533447266, "global_step": 81181, "epoch": 483} {"train_loss": -9.533387184143066, "global_step": 81182, "epoch": 483} {"train_loss": -9.484359741210938, "global_step": 81183, "epoch": 483} {"train_loss": -9.317831039428711, "global_step": 81184, "epoch": 483} {"train_loss": -9.27354621887207, "global_step": 81185, "epoch": 483} {"train_loss": -9.376802444458008, "global_step": 81186, "epoch": 483} {"train_loss": -9.090275764465332, "global_step": 81187, "epoch": 483} {"train_loss": -9.22176742553711, "global_step": 81188, "epoch": 483} {"train_loss": -9.50317096710205, "global_step": 81189, "epoch": 483} {"train_loss": -9.200250625610352, "global_step": 81190, "epoch": 483} {"train_loss": -9.176969528198242, "global_step": 81191, "epoch": 483} {"train_loss": -9.503314018249512, "global_step": 81192, "epoch": 483} {"train_loss": -9.543001174926758, "global_step": 81193, "epoch": 483} {"train_loss": -9.334712982177734, "global_step": 81194, "epoch": 483} {"train_loss": -9.344568252563477, "global_step": 81195, "epoch": 483} {"train_loss": -9.114177703857422, "global_step": 81196, "epoch": 483} {"train_loss": -9.549198150634766, "global_step": 81197, "epoch": 483} {"train_loss": -9.329910278320312, "global_step": 81198, "epoch": 483} {"train_loss": -9.195072174072266, "global_step": 81199, "epoch": 483} {"train_loss": -8.995840072631836, "global_step": 81200, "epoch": 483} {"train_loss": -9.188484191894531, "global_step": 81201, "epoch": 483} {"train_loss": -9.28665542602539, "global_step": 81202, "epoch": 483} {"train_loss": -9.261738777160645, "global_step": 81203, "epoch": 483} {"train_loss": -9.0536470413208, "global_step": 81204, "epoch": 483} {"train_loss": -9.441115379333496, "global_step": 81205, "epoch": 483} {"train_loss": -9.074592590332031, "global_step": 81206, "epoch": 483} {"train_loss": -9.223917961120605, "global_step": 81207, "epoch": 483} {"train_loss": -9.322408676147461, "global_step": 81208, "epoch": 483} {"train_loss": -9.397685050964355, "global_step": 81209, "epoch": 483} {"train_loss": -9.482486724853516, "global_step": 81210, "epoch": 483} {"train_loss": -9.088802337646484, "global_step": 81211, "epoch": 483} {"train_loss": -9.288972854614258, "global_step": 81212, "epoch": 483} {"train_loss": -9.387124061584473, "global_step": 81213, "epoch": 483} {"train_loss": -8.79376220703125, "global_step": 81214, "epoch": 483} {"train_loss": -9.321833610534668, "global_step": 81215, "epoch": 483} {"train_loss": -9.261375427246094, "global_step": 81216, "epoch": 483} {"train_loss": -9.292956352233887, "global_step": 81217, "epoch": 483} {"train_loss": -9.083081245422363, "global_step": 81218, "epoch": 483} {"train_loss": -8.954564094543457, "global_step": 81219, "epoch": 483} {"train_loss": -9.193998336791992, "global_step": 81220, "epoch": 483} {"train_loss": -9.42652702331543, "global_step": 81221, "epoch": 483} {"train_loss": -9.277698516845703, "global_step": 81222, "epoch": 483} {"train_loss": -9.18996810913086, "global_step": 81223, "epoch": 483} {"train_loss": -9.341348648071289, "global_step": 81224, "epoch": 483} {"train_loss": -9.323883056640625, "global_step": 81225, "epoch": 483} {"train_loss": -9.33073616027832, "global_step": 81226, "epoch": 483} {"train_loss": -9.308952331542969, "global_step": 81227, "epoch": 483} {"train_loss": -9.032878875732422, "global_step": 81228, "epoch": 483} {"train_loss": -9.055381774902344, "global_step": 81229, "epoch": 483} {"train_loss": -9.123468399047852, "global_step": 81230, "epoch": 483} {"train_loss": -9.007474899291992, "global_step": 81231, "epoch": 483} {"train_loss": -9.066094398498535, "global_step": 81232, "epoch": 483} {"train_loss": -9.294514656066895, "global_step": 81233, "epoch": 483} {"train_loss": -9.116300582885742, "global_step": 81234, "epoch": 483} {"train_loss": -8.979133605957031, "global_step": 81235, "epoch": 483} {"train_loss": -9.190444946289062, "global_step": 81236, "epoch": 483} {"train_loss": -9.000499725341797, "global_step": 81237, "epoch": 483} {"train_loss": -9.21463680267334, "global_step": 81238, "epoch": 483} {"train_loss": -9.210611343383789, "global_step": 81239, "epoch": 483} {"train_loss": -9.044100761413574, "global_step": 81240, "epoch": 483} {"train_loss": -9.151729583740234, "global_step": 81241, "epoch": 483} {"train_loss": -9.152254104614258, "global_step": 81242, "epoch": 483} {"train_loss": -8.908122062683105, "global_step": 81243, "epoch": 483} {"train_loss": -9.189735412597656, "global_step": 81244, "epoch": 483} {"train_loss": -9.325401306152344, "global_step": 81245, "epoch": 483} {"train_loss": -9.206033706665039, "global_step": 81246, "epoch": 483} {"train_loss": -9.334787368774414, "global_step": 81247, "epoch": 483} {"train_loss": -9.308673858642578, "global_step": 81248, "epoch": 483} {"train_loss": -9.071060180664062, "global_step": 81249, "epoch": 483} {"train_loss": -9.063950538635254, "global_step": 81250, "epoch": 483} {"train_loss": -9.108869552612305, "global_step": 81251, "epoch": 483} {"train_loss": -9.048137664794922, "global_step": 81252, "epoch": 483} {"train_loss": -9.239827156066895, "global_step": 81253, "epoch": 483} {"train_loss": -9.240659713745117, "global_step": 81254, "epoch": 483} {"train_loss": -8.957077980041504, "global_step": 81255, "epoch": 483} {"train_loss": -9.304071426391602, "global_step": 81256, "epoch": 483} {"train_loss": -8.908517837524414, "global_step": 81257, "epoch": 483} {"train_loss": -9.226099967956543, "global_step": 81258, "epoch": 483} {"train_loss": -8.731794357299805, "global_step": 81259, "epoch": 483} {"train_loss": -8.999889373779297, "global_step": 81260, "epoch": 483} {"train_loss": -8.936650276184082, "global_step": 81261, "epoch": 483} {"train_loss": -9.149538040161133, "global_step": 81262, "epoch": 483} {"train_loss": -9.193380355834961, "global_step": 81263, "epoch": 483} {"train_loss": -8.860228538513184, "global_step": 81264, "epoch": 483} {"train_loss": -9.130426406860352, "global_step": 81265, "epoch": 483} {"train_loss": -9.167410850524902, "global_step": 81266, "epoch": 483} {"train_loss": -8.80723762512207, "global_step": 81267, "epoch": 483} {"train_loss": -8.942358016967773, "global_step": 81268, "epoch": 483} {"train_loss": -9.208319664001465, "global_step": 81269, "epoch": 483} {"train_loss": -9.13309097290039, "global_step": 81270, "epoch": 483} {"train_loss": -9.135244369506836, "global_step": 81271, "epoch": 483} {"train_loss": -8.788874626159668, "global_step": 81272, "epoch": 483} {"train_loss": -9.411317825317383, "global_step": 81273, "epoch": 483} {"train_loss": -8.767359733581543, "global_step": 81274, "epoch": 483} {"train_loss": -9.316198348999023, "global_step": 81275, "epoch": 483} {"train_loss": -8.99998664855957, "global_step": 81276, "epoch": 483} {"train_loss": -8.699901580810547, "global_step": 81277, "epoch": 483} {"train_loss": -9.134969711303711, "global_step": 81278, "epoch": 483} {"train_loss": -9.061542510986328, "global_step": 81279, "epoch": 483} {"train_loss": -9.004108428955078, "global_step": 81280, "epoch": 483} {"train_loss": -9.252082824707031, "global_step": 81281, "epoch": 483} {"train_loss": -9.145054817199707, "global_step": 81282, "epoch": 483} {"train_loss": -9.301950454711914, "global_step": 81283, "epoch": 483} {"train_loss": -8.906793594360352, "global_step": 81284, "epoch": 483} {"train_loss": -9.04804801940918, "global_step": 81285, "epoch": 483} {"train_loss": -8.933981895446777, "global_step": 81286, "epoch": 483} {"train_loss": -9.20756721496582, "global_step": 81287, "epoch": 483} {"train_loss": -8.89135456085205, "global_step": 81288, "epoch": 483} {"train_loss": -9.081157684326172, "global_step": 81289, "epoch": 483} {"train_loss": -9.018573760986328, "global_step": 81290, "epoch": 483} {"train_loss": -9.252604484558105, "global_step": 81291, "epoch": 483} {"train_loss": -9.04191780090332, "global_step": 81292, "epoch": 483} {"train_loss": -9.106100082397461, "global_step": 81293, "epoch": 483} {"train_loss": -9.134552955627441, "global_step": 81294, "epoch": 483} {"train_loss": -8.954544067382812, "global_step": 81295, "epoch": 483} {"train_loss": -9.300373077392578, "global_step": 81296, "epoch": 483} {"train_loss": -9.03012466430664, "global_step": 81297, "epoch": 483} {"train_loss": -9.24389362335205, "global_step": 81298, "epoch": 483} {"train_loss": -8.908809661865234, "global_step": 81299, "epoch": 483} {"train_loss": -9.25899887084961, "global_step": 81300, "epoch": 483} {"train_loss": -9.162515640258789, "global_step": 81301, "epoch": 483} {"train_loss": -9.316834449768066, "global_step": 81302, "epoch": 483} {"train_loss": -9.124871253967285, "global_step": 81303, "epoch": 483} {"train_loss": -9.313241958618164, "global_step": 81304, "epoch": 483} {"train_loss": -9.246034622192383, "global_step": 81305, "epoch": 483} {"train_loss": -9.284358978271484, "global_step": 81306, "epoch": 483} {"train_loss": -9.174264907836914, "global_step": 81307, "epoch": 483} {"train_loss": -9.281343460083008, "global_step": 81308, "epoch": 483} {"train_loss": -9.183340072631836, "global_step": 81309, "epoch": 483} {"train_loss": -9.35437297821045, "global_step": 81310, "epoch": 483} {"train_loss": -9.189655695642744, "global_step": 81311, "epoch": 483, "val_loss": 198704.171875} {"train_loss": -8.930357933044434, "global_step": 81312, "epoch": 484} {"train_loss": -9.349443435668945, "global_step": 81313, "epoch": 484} {"train_loss": -9.015462875366211, "global_step": 81314, "epoch": 484} {"train_loss": -9.2811279296875, "global_step": 81315, "epoch": 484} {"train_loss": -9.068792343139648, "global_step": 81316, "epoch": 484} {"train_loss": -9.09544563293457, "global_step": 81317, "epoch": 484} {"train_loss": -9.157669067382812, "global_step": 81318, "epoch": 484} {"train_loss": -9.196639060974121, "global_step": 81319, "epoch": 484} {"train_loss": -9.101731300354004, "global_step": 81320, "epoch": 484} {"train_loss": -9.083368301391602, "global_step": 81321, "epoch": 484} {"train_loss": -9.362303733825684, "global_step": 81322, "epoch": 484} {"train_loss": -9.122699737548828, "global_step": 81323, "epoch": 484} {"train_loss": -9.468645095825195, "global_step": 81324, "epoch": 484} {"train_loss": -9.26024055480957, "global_step": 81325, "epoch": 484} {"train_loss": -9.204398155212402, "global_step": 81326, "epoch": 484} {"train_loss": -8.943236351013184, "global_step": 81327, "epoch": 484} {"train_loss": -9.159370422363281, "global_step": 81328, "epoch": 484} {"train_loss": -9.063239097595215, "global_step": 81329, "epoch": 484} {"train_loss": -9.266581535339355, "global_step": 81330, "epoch": 484} {"train_loss": -9.170978546142578, "global_step": 81331, "epoch": 484} {"train_loss": -9.295074462890625, "global_step": 81332, "epoch": 484} {"train_loss": -9.040090560913086, "global_step": 81333, "epoch": 484} {"train_loss": -9.066805839538574, "global_step": 81334, "epoch": 484} {"train_loss": -9.51331901550293, "global_step": 81335, "epoch": 484} {"train_loss": -9.395286560058594, "global_step": 81336, "epoch": 484} {"train_loss": -9.339152336120605, "global_step": 81337, "epoch": 484} {"train_loss": -9.11402702331543, "global_step": 81338, "epoch": 484} {"train_loss": -9.281713485717773, "global_step": 81339, "epoch": 484} {"train_loss": -9.042975425720215, "global_step": 81340, "epoch": 484} {"train_loss": -9.341175079345703, "global_step": 81341, "epoch": 484} {"train_loss": -9.271785736083984, "global_step": 81342, "epoch": 484} {"train_loss": -9.041687965393066, "global_step": 81343, "epoch": 484} {"train_loss": -9.421136856079102, "global_step": 81344, "epoch": 484} {"train_loss": -9.489126205444336, "global_step": 81345, "epoch": 484} {"train_loss": -9.26801586151123, "global_step": 81346, "epoch": 484} {"train_loss": -9.294867515563965, "global_step": 81347, "epoch": 484} {"train_loss": -9.142629623413086, "global_step": 81348, "epoch": 484} {"train_loss": -9.007396697998047, "global_step": 81349, "epoch": 484} {"train_loss": -9.35112190246582, "global_step": 81350, "epoch": 484} {"train_loss": -8.844842910766602, "global_step": 81351, "epoch": 484} {"train_loss": -9.181427001953125, "global_step": 81352, "epoch": 484} {"train_loss": -9.170985221862793, "global_step": 81353, "epoch": 484} {"train_loss": -9.408337593078613, "global_step": 81354, "epoch": 484} {"train_loss": -9.41030216217041, "global_step": 81355, "epoch": 484} {"train_loss": -9.283278465270996, "global_step": 81356, "epoch": 484} {"train_loss": -9.110322952270508, "global_step": 81357, "epoch": 484} {"train_loss": -9.446884155273438, "global_step": 81358, "epoch": 484} {"train_loss": -9.216426849365234, "global_step": 81359, "epoch": 484} {"train_loss": -9.456707954406738, "global_step": 81360, "epoch": 484} {"train_loss": -9.490439414978027, "global_step": 81361, "epoch": 484} {"train_loss": -9.362357139587402, "global_step": 81362, "epoch": 484} {"train_loss": -9.432662010192871, "global_step": 81363, "epoch": 484} {"train_loss": -9.387519836425781, "global_step": 81364, "epoch": 484} {"train_loss": -9.06136703491211, "global_step": 81365, "epoch": 484} {"train_loss": -9.08033561706543, "global_step": 81366, "epoch": 484} {"train_loss": -9.280214309692383, "global_step": 81367, "epoch": 484} {"train_loss": -9.239654541015625, "global_step": 81368, "epoch": 484} {"train_loss": -9.366381645202637, "global_step": 81369, "epoch": 484} {"train_loss": -9.026971817016602, "global_step": 81370, "epoch": 484} {"train_loss": -9.434833526611328, "global_step": 81371, "epoch": 484} {"train_loss": -9.012164115905762, "global_step": 81372, "epoch": 484} {"train_loss": -9.090898513793945, "global_step": 81373, "epoch": 484} {"train_loss": -9.28740119934082, "global_step": 81374, "epoch": 484} {"train_loss": -8.998085021972656, "global_step": 81375, "epoch": 484} {"train_loss": -9.12013053894043, "global_step": 81376, "epoch": 484} {"train_loss": -9.336390495300293, "global_step": 81377, "epoch": 484} {"train_loss": -9.076667785644531, "global_step": 81378, "epoch": 484} {"train_loss": -8.91569709777832, "global_step": 81379, "epoch": 484} {"train_loss": -9.162923812866211, "global_step": 81380, "epoch": 484} {"train_loss": -9.371492385864258, "global_step": 81381, "epoch": 484} {"train_loss": -9.055804252624512, "global_step": 81382, "epoch": 484} {"train_loss": -9.259480476379395, "global_step": 81383, "epoch": 484} {"train_loss": -9.103673934936523, "global_step": 81384, "epoch": 484} {"train_loss": -9.185079574584961, "global_step": 81385, "epoch": 484} {"train_loss": -9.083966255187988, "global_step": 81386, "epoch": 484} {"train_loss": -9.238601684570312, "global_step": 81387, "epoch": 484} {"train_loss": -8.590812683105469, "global_step": 81388, "epoch": 484} {"train_loss": -9.150744438171387, "global_step": 81389, "epoch": 484} {"train_loss": -9.029825210571289, "global_step": 81390, "epoch": 484} {"train_loss": -9.212204933166504, "global_step": 81391, "epoch": 484} {"train_loss": -8.989215850830078, "global_step": 81392, "epoch": 484} {"train_loss": -9.364980697631836, "global_step": 81393, "epoch": 484} {"train_loss": -9.001193046569824, "global_step": 81394, "epoch": 484} {"train_loss": -9.057504653930664, "global_step": 81395, "epoch": 484} {"train_loss": -9.375019073486328, "global_step": 81396, "epoch": 484} {"train_loss": -9.054765701293945, "global_step": 81397, "epoch": 484} {"train_loss": -9.08928108215332, "global_step": 81398, "epoch": 484} {"train_loss": -9.194744110107422, "global_step": 81399, "epoch": 484} {"train_loss": -9.19329833984375, "global_step": 81400, "epoch": 484} {"train_loss": -9.102668762207031, "global_step": 81401, "epoch": 484} {"train_loss": -9.143387794494629, "global_step": 81402, "epoch": 484} {"train_loss": -9.229656219482422, "global_step": 81403, "epoch": 484} {"train_loss": -8.954336166381836, "global_step": 81404, "epoch": 484} {"train_loss": -9.391868591308594, "global_step": 81405, "epoch": 484} {"train_loss": -9.063922882080078, "global_step": 81406, "epoch": 484} {"train_loss": -9.132164001464844, "global_step": 81407, "epoch": 484} {"train_loss": -9.349081039428711, "global_step": 81408, "epoch": 484} {"train_loss": -9.155797004699707, "global_step": 81409, "epoch": 484} {"train_loss": -9.355364799499512, "global_step": 81410, "epoch": 484} {"train_loss": -9.017858505249023, "global_step": 81411, "epoch": 484} {"train_loss": -9.252279281616211, "global_step": 81412, "epoch": 484} {"train_loss": -9.204727172851562, "global_step": 81413, "epoch": 484} {"train_loss": -9.487173080444336, "global_step": 81414, "epoch": 484} {"train_loss": -9.347121238708496, "global_step": 81415, "epoch": 484} {"train_loss": -9.137395858764648, "global_step": 81416, "epoch": 484} {"train_loss": -9.338855743408203, "global_step": 81417, "epoch": 484} {"train_loss": -9.378458023071289, "global_step": 81418, "epoch": 484} {"train_loss": -9.308127403259277, "global_step": 81419, "epoch": 484} {"train_loss": -9.568421363830566, "global_step": 81420, "epoch": 484} {"train_loss": -9.258041381835938, "global_step": 81421, "epoch": 484} {"train_loss": -9.493095397949219, "global_step": 81422, "epoch": 484} {"train_loss": -9.29600715637207, "global_step": 81423, "epoch": 484} {"train_loss": -9.301485061645508, "global_step": 81424, "epoch": 484} {"train_loss": -9.430962562561035, "global_step": 81425, "epoch": 484} {"train_loss": -9.38623046875, "global_step": 81426, "epoch": 484} {"train_loss": -9.383517265319824, "global_step": 81427, "epoch": 484} {"train_loss": -9.477616310119629, "global_step": 81428, "epoch": 484} {"train_loss": -9.422136306762695, "global_step": 81429, "epoch": 484} {"train_loss": -9.3257417678833, "global_step": 81430, "epoch": 484} {"train_loss": -9.312068939208984, "global_step": 81431, "epoch": 484} {"train_loss": -9.365478515625, "global_step": 81432, "epoch": 484} {"train_loss": -9.430452346801758, "global_step": 81433, "epoch": 484} {"train_loss": -9.307409286499023, "global_step": 81434, "epoch": 484} {"train_loss": -9.243875503540039, "global_step": 81435, "epoch": 484} {"train_loss": -9.104930877685547, "global_step": 81436, "epoch": 484} {"train_loss": -9.401725769042969, "global_step": 81437, "epoch": 484} {"train_loss": -9.304287910461426, "global_step": 81438, "epoch": 484} {"train_loss": -9.405176162719727, "global_step": 81439, "epoch": 484} {"train_loss": -9.423090934753418, "global_step": 81440, "epoch": 484} {"train_loss": -9.206253051757812, "global_step": 81441, "epoch": 484} {"train_loss": -9.296472549438477, "global_step": 81442, "epoch": 484} {"train_loss": -8.897727966308594, "global_step": 81443, "epoch": 484} {"train_loss": -9.235071182250977, "global_step": 81444, "epoch": 484} {"train_loss": -9.134407997131348, "global_step": 81445, "epoch": 484} {"train_loss": -9.029548645019531, "global_step": 81446, "epoch": 484} {"train_loss": -8.599347114562988, "global_step": 81447, "epoch": 484} {"train_loss": -9.087141036987305, "global_step": 81448, "epoch": 484} {"train_loss": -8.876636505126953, "global_step": 81449, "epoch": 484} {"train_loss": -9.141435623168945, "global_step": 81450, "epoch": 484} {"train_loss": -8.63068675994873, "global_step": 81451, "epoch": 484} {"train_loss": -9.22460651397705, "global_step": 81452, "epoch": 484} {"train_loss": -8.742916107177734, "global_step": 81453, "epoch": 484} {"train_loss": -8.461865425109863, "global_step": 81454, "epoch": 484} {"train_loss": -8.818537712097168, "global_step": 81455, "epoch": 484} {"train_loss": -8.927858352661133, "global_step": 81456, "epoch": 484} {"train_loss": -8.792631149291992, "global_step": 81457, "epoch": 484} {"train_loss": -8.89956283569336, "global_step": 81458, "epoch": 484} {"train_loss": -9.137712478637695, "global_step": 81459, "epoch": 484} {"train_loss": -8.900489807128906, "global_step": 81460, "epoch": 484} {"train_loss": -8.646251678466797, "global_step": 81461, "epoch": 484} {"train_loss": -8.92310619354248, "global_step": 81462, "epoch": 484} {"train_loss": -9.067075729370117, "global_step": 81463, "epoch": 484} {"train_loss": -9.14250659942627, "global_step": 81464, "epoch": 484} {"train_loss": -8.932957649230957, "global_step": 81465, "epoch": 484} {"train_loss": -8.783720970153809, "global_step": 81466, "epoch": 484} {"train_loss": -9.274242401123047, "global_step": 81467, "epoch": 484} {"train_loss": -9.013408660888672, "global_step": 81468, "epoch": 484} {"train_loss": -8.918577194213867, "global_step": 81469, "epoch": 484} {"train_loss": -9.167702674865723, "global_step": 81470, "epoch": 484} {"train_loss": -9.318490028381348, "global_step": 81471, "epoch": 484} {"train_loss": -9.246150970458984, "global_step": 81472, "epoch": 484} {"train_loss": -9.132421493530273, "global_step": 81473, "epoch": 484} {"train_loss": -9.36131763458252, "global_step": 81474, "epoch": 484} {"train_loss": -9.123018264770508, "global_step": 81475, "epoch": 484} {"train_loss": -9.216900825500488, "global_step": 81476, "epoch": 484} {"train_loss": -9.099382400512695, "global_step": 81477, "epoch": 484} {"train_loss": -9.221385955810547, "global_step": 81478, "epoch": 484} {"train_loss": -9.180696249008179, "global_step": 81479, "epoch": 484, "val_loss": 197977.546875} {"train_loss": -9.454910278320312, "global_step": 81480, "epoch": 485} {"train_loss": -9.500894546508789, "global_step": 81481, "epoch": 485} {"train_loss": -9.377933502197266, "global_step": 81482, "epoch": 485} {"train_loss": -9.321803092956543, "global_step": 81483, "epoch": 485} {"train_loss": -9.14784049987793, "global_step": 81484, "epoch": 485} {"train_loss": -9.432571411132812, "global_step": 81485, "epoch": 485} {"train_loss": -9.316499710083008, "global_step": 81486, "epoch": 485} {"train_loss": -9.319770812988281, "global_step": 81487, "epoch": 485} {"train_loss": -9.28045654296875, "global_step": 81488, "epoch": 485} {"train_loss": -9.139700889587402, "global_step": 81489, "epoch": 485} {"train_loss": -9.207437515258789, "global_step": 81490, "epoch": 485} {"train_loss": -9.02377700805664, "global_step": 81491, "epoch": 485} {"train_loss": -9.569625854492188, "global_step": 81492, "epoch": 485} {"train_loss": -8.89328384399414, "global_step": 81493, "epoch": 485} {"train_loss": -9.369879722595215, "global_step": 81494, "epoch": 485} {"train_loss": -8.996152877807617, "global_step": 81495, "epoch": 485} {"train_loss": -9.177396774291992, "global_step": 81496, "epoch": 485} {"train_loss": -8.994510650634766, "global_step": 81497, "epoch": 485} {"train_loss": -8.748054504394531, "global_step": 81498, "epoch": 485} {"train_loss": -8.638506889343262, "global_step": 81499, "epoch": 485} {"train_loss": -8.71413516998291, "global_step": 81500, "epoch": 485} {"train_loss": -8.47902774810791, "global_step": 81501, "epoch": 485} {"train_loss": -8.97971248626709, "global_step": 81502, "epoch": 485} {"train_loss": -8.884307861328125, "global_step": 81503, "epoch": 485} {"train_loss": -8.933618545532227, "global_step": 81504, "epoch": 485} {"train_loss": -9.029241561889648, "global_step": 81505, "epoch": 485} {"train_loss": -8.84284782409668, "global_step": 81506, "epoch": 485} {"train_loss": -9.029618263244629, "global_step": 81507, "epoch": 485} {"train_loss": -8.998344421386719, "global_step": 81508, "epoch": 485} {"train_loss": -8.99760913848877, "global_step": 81509, "epoch": 485} {"train_loss": -8.918001174926758, "global_step": 81510, "epoch": 485} {"train_loss": -9.30724048614502, "global_step": 81511, "epoch": 485} {"train_loss": -9.166654586791992, "global_step": 81512, "epoch": 485} {"train_loss": -9.185285568237305, "global_step": 81513, "epoch": 485} {"train_loss": -9.222797393798828, "global_step": 81514, "epoch": 485} {"train_loss": -9.212621688842773, "global_step": 81515, "epoch": 485} {"train_loss": -9.305508613586426, "global_step": 81516, "epoch": 485} {"train_loss": -9.24026107788086, "global_step": 81517, "epoch": 485} {"train_loss": -9.081781387329102, "global_step": 81518, "epoch": 485} {"train_loss": -9.188177108764648, "global_step": 81519, "epoch": 485} {"train_loss": -9.182659149169922, "global_step": 81520, "epoch": 485} {"train_loss": -9.543057441711426, "global_step": 81521, "epoch": 485} {"train_loss": -9.423517227172852, "global_step": 81522, "epoch": 485} {"train_loss": -9.217733383178711, "global_step": 81523, "epoch": 485} {"train_loss": -9.266419410705566, "global_step": 81524, "epoch": 485} {"train_loss": -9.425703048706055, "global_step": 81525, "epoch": 485} {"train_loss": -9.31489086151123, "global_step": 81526, "epoch": 485} {"train_loss": -9.34927749633789, "global_step": 81527, "epoch": 485} {"train_loss": -9.308378219604492, "global_step": 81528, "epoch": 485} {"train_loss": -9.226264953613281, "global_step": 81529, "epoch": 485} {"train_loss": -9.307974815368652, "global_step": 81530, "epoch": 485} {"train_loss": -9.443998336791992, "global_step": 81531, "epoch": 485} {"train_loss": -9.355852127075195, "global_step": 81532, "epoch": 485} {"train_loss": -9.52326774597168, "global_step": 81533, "epoch": 485} {"train_loss": -9.451211929321289, "global_step": 81534, "epoch": 485} {"train_loss": -9.472811698913574, "global_step": 81535, "epoch": 485} {"train_loss": -9.365673065185547, "global_step": 81536, "epoch": 485} {"train_loss": -9.120132446289062, "global_step": 81537, "epoch": 485} {"train_loss": -8.878713607788086, "global_step": 81538, "epoch": 485} {"train_loss": -9.548707962036133, "global_step": 81539, "epoch": 485} {"train_loss": -8.948689460754395, "global_step": 81540, "epoch": 485} {"train_loss": -9.359936714172363, "global_step": 81541, "epoch": 485} {"train_loss": -9.323065757751465, "global_step": 81542, "epoch": 485} {"train_loss": -9.198186874389648, "global_step": 81543, "epoch": 485} {"train_loss": -9.413917541503906, "global_step": 81544, "epoch": 485} {"train_loss": -9.275619506835938, "global_step": 81545, "epoch": 485} {"train_loss": -9.466033935546875, "global_step": 81546, "epoch": 485} {"train_loss": -9.181593894958496, "global_step": 81547, "epoch": 485} {"train_loss": -8.84276008605957, "global_step": 81548, "epoch": 485} {"train_loss": -9.340606689453125, "global_step": 81549, "epoch": 485} {"train_loss": -9.059151649475098, "global_step": 81550, "epoch": 485} {"train_loss": -9.335395812988281, "global_step": 81551, "epoch": 485} {"train_loss": -9.355301856994629, "global_step": 81552, "epoch": 485} {"train_loss": -8.855450630187988, "global_step": 81553, "epoch": 485} {"train_loss": -9.12985897064209, "global_step": 81554, "epoch": 485} {"train_loss": -9.078470230102539, "global_step": 81555, "epoch": 485} {"train_loss": -9.15233039855957, "global_step": 81556, "epoch": 485} {"train_loss": -8.897993087768555, "global_step": 81557, "epoch": 485} {"train_loss": -9.23022174835205, "global_step": 81558, "epoch": 485} {"train_loss": -9.196292877197266, "global_step": 81559, "epoch": 485} {"train_loss": -9.309213638305664, "global_step": 81560, "epoch": 485} {"train_loss": -9.48440170288086, "global_step": 81561, "epoch": 485} {"train_loss": -9.341936111450195, "global_step": 81562, "epoch": 485} {"train_loss": -9.207969665527344, "global_step": 81563, "epoch": 485} {"train_loss": -9.365523338317871, "global_step": 81564, "epoch": 485} {"train_loss": -9.26984977722168, "global_step": 81565, "epoch": 485} {"train_loss": -9.301996231079102, "global_step": 81566, "epoch": 485} {"train_loss": -9.02236557006836, "global_step": 81567, "epoch": 485} {"train_loss": -9.48184871673584, "global_step": 81568, "epoch": 485} {"train_loss": -9.339996337890625, "global_step": 81569, "epoch": 485} {"train_loss": -9.592233657836914, "global_step": 81570, "epoch": 485} {"train_loss": -9.491666793823242, "global_step": 81571, "epoch": 485} {"train_loss": -9.181899070739746, "global_step": 81572, "epoch": 485} {"train_loss": -9.394625663757324, "global_step": 81573, "epoch": 485} {"train_loss": -9.150898933410645, "global_step": 81574, "epoch": 485} {"train_loss": -9.410500526428223, "global_step": 81575, "epoch": 485} {"train_loss": -9.324729919433594, "global_step": 81576, "epoch": 485} {"train_loss": -9.291543006896973, "global_step": 81577, "epoch": 485} {"train_loss": -9.175552368164062, "global_step": 81578, "epoch": 485} {"train_loss": -9.184338569641113, "global_step": 81579, "epoch": 485} {"train_loss": -9.331159591674805, "global_step": 81580, "epoch": 485} {"train_loss": -9.148983001708984, "global_step": 81581, "epoch": 485} {"train_loss": -9.477642059326172, "global_step": 81582, "epoch": 485} {"train_loss": -9.164913177490234, "global_step": 81583, "epoch": 485} {"train_loss": -9.424812316894531, "global_step": 81584, "epoch": 485} {"train_loss": -9.030235290527344, "global_step": 81585, "epoch": 485} {"train_loss": -9.231141090393066, "global_step": 81586, "epoch": 485} {"train_loss": -9.004128456115723, "global_step": 81587, "epoch": 485} {"train_loss": -9.040328979492188, "global_step": 81588, "epoch": 485} {"train_loss": -8.970134735107422, "global_step": 81589, "epoch": 485} {"train_loss": -8.979056358337402, "global_step": 81590, "epoch": 485} {"train_loss": -9.178886413574219, "global_step": 81591, "epoch": 485} {"train_loss": -8.991775512695312, "global_step": 81592, "epoch": 485} {"train_loss": -9.174116134643555, "global_step": 81593, "epoch": 485} {"train_loss": -8.816452026367188, "global_step": 81594, "epoch": 485} {"train_loss": -9.513042449951172, "global_step": 81595, "epoch": 485} {"train_loss": -9.081367492675781, "global_step": 81596, "epoch": 485} {"train_loss": -9.31125259399414, "global_step": 81597, "epoch": 485} {"train_loss": -9.260149955749512, "global_step": 81598, "epoch": 485} {"train_loss": -9.331777572631836, "global_step": 81599, "epoch": 485} {"train_loss": -9.01816177368164, "global_step": 81600, "epoch": 485} {"train_loss": -9.344764709472656, "global_step": 81601, "epoch": 485} {"train_loss": -9.052448272705078, "global_step": 81602, "epoch": 485} {"train_loss": -9.237905502319336, "global_step": 81603, "epoch": 485} {"train_loss": -9.230433464050293, "global_step": 81604, "epoch": 485} {"train_loss": -9.081474304199219, "global_step": 81605, "epoch": 485} {"train_loss": -9.202491760253906, "global_step": 81606, "epoch": 485} {"train_loss": -9.152018547058105, "global_step": 81607, "epoch": 485} {"train_loss": -8.994884490966797, "global_step": 81608, "epoch": 485} {"train_loss": -9.28683853149414, "global_step": 81609, "epoch": 485} {"train_loss": -9.153690338134766, "global_step": 81610, "epoch": 485} {"train_loss": -9.161128997802734, "global_step": 81611, "epoch": 485} {"train_loss": -8.992989540100098, "global_step": 81612, "epoch": 485} {"train_loss": -9.030152320861816, "global_step": 81613, "epoch": 485} {"train_loss": -9.239347457885742, "global_step": 81614, "epoch": 485} {"train_loss": -9.345008850097656, "global_step": 81615, "epoch": 485} {"train_loss": -9.140167236328125, "global_step": 81616, "epoch": 485} {"train_loss": -8.978630065917969, "global_step": 81617, "epoch": 485} {"train_loss": -9.376277923583984, "global_step": 81618, "epoch": 485} {"train_loss": -8.838698387145996, "global_step": 81619, "epoch": 485} {"train_loss": -8.96183967590332, "global_step": 81620, "epoch": 485} {"train_loss": -9.038045883178711, "global_step": 81621, "epoch": 485} {"train_loss": -9.02236557006836, "global_step": 81622, "epoch": 485} {"train_loss": -9.073583602905273, "global_step": 81623, "epoch": 485} {"train_loss": -9.1447172164917, "global_step": 81624, "epoch": 485} {"train_loss": -9.179071426391602, "global_step": 81625, "epoch": 485} {"train_loss": -8.990592002868652, "global_step": 81626, "epoch": 485} {"train_loss": -9.377726554870605, "global_step": 81627, "epoch": 485} {"train_loss": -9.329051971435547, "global_step": 81628, "epoch": 485} {"train_loss": -9.161985397338867, "global_step": 81629, "epoch": 485} {"train_loss": -9.166633605957031, "global_step": 81630, "epoch": 485} {"train_loss": -9.175716400146484, "global_step": 81631, "epoch": 485} {"train_loss": -9.199705123901367, "global_step": 81632, "epoch": 485} {"train_loss": -9.28525161743164, "global_step": 81633, "epoch": 485} {"train_loss": -9.186662673950195, "global_step": 81634, "epoch": 485} {"train_loss": -9.107616424560547, "global_step": 81635, "epoch": 485} {"train_loss": -9.068754196166992, "global_step": 81636, "epoch": 485} {"train_loss": -9.4110689163208, "global_step": 81637, "epoch": 485} {"train_loss": -9.302448272705078, "global_step": 81638, "epoch": 485} {"train_loss": -9.053396224975586, "global_step": 81639, "epoch": 485} {"train_loss": -9.339933395385742, "global_step": 81640, "epoch": 485} {"train_loss": -9.354602813720703, "global_step": 81641, "epoch": 485} {"train_loss": -9.06656265258789, "global_step": 81642, "epoch": 485} {"train_loss": -9.356609344482422, "global_step": 81643, "epoch": 485} {"train_loss": -8.922700881958008, "global_step": 81644, "epoch": 485} {"train_loss": -9.132471084594727, "global_step": 81645, "epoch": 485} {"train_loss": -9.189752578735352, "global_step": 81646, "epoch": 485} {"train_loss": -9.192942273049127, "global_step": 81647, "epoch": 485, "val_loss": 200629.0625, "train_action_mse_error": 5.3181843757629395} {"train_loss": -9.300443649291992, "global_step": 81648, "epoch": 486} {"train_loss": -9.280180931091309, "global_step": 81649, "epoch": 486} {"train_loss": -8.956528663635254, "global_step": 81650, "epoch": 486} {"train_loss": -9.402924537658691, "global_step": 81651, "epoch": 486} {"train_loss": -9.07744026184082, "global_step": 81652, "epoch": 486} {"train_loss": -8.98921012878418, "global_step": 81653, "epoch": 486} {"train_loss": -9.36036491394043, "global_step": 81654, "epoch": 486} {"train_loss": -9.53060531616211, "global_step": 81655, "epoch": 486} {"train_loss": -8.940385818481445, "global_step": 81656, "epoch": 486} {"train_loss": -9.554935455322266, "global_step": 81657, "epoch": 486} {"train_loss": -9.19039535522461, "global_step": 81658, "epoch": 486} {"train_loss": -9.12427806854248, "global_step": 81659, "epoch": 486} {"train_loss": -9.22109317779541, "global_step": 81660, "epoch": 486} {"train_loss": -9.214666366577148, "global_step": 81661, "epoch": 486} {"train_loss": -9.244361877441406, "global_step": 81662, "epoch": 486} {"train_loss": -9.34979248046875, "global_step": 81663, "epoch": 486} {"train_loss": -8.93896770477295, "global_step": 81664, "epoch": 486} {"train_loss": -9.353927612304688, "global_step": 81665, "epoch": 486} {"train_loss": -9.124238014221191, "global_step": 81666, "epoch": 486} {"train_loss": -9.2979154586792, "global_step": 81667, "epoch": 486} {"train_loss": -8.950374603271484, "global_step": 81668, "epoch": 486} {"train_loss": -9.146932601928711, "global_step": 81669, "epoch": 486} {"train_loss": -9.126633644104004, "global_step": 81670, "epoch": 486} {"train_loss": -9.265771865844727, "global_step": 81671, "epoch": 486} {"train_loss": -9.167630195617676, "global_step": 81672, "epoch": 486} {"train_loss": -9.305919647216797, "global_step": 81673, "epoch": 486} {"train_loss": -9.155130386352539, "global_step": 81674, "epoch": 486} {"train_loss": -9.344381332397461, "global_step": 81675, "epoch": 486} {"train_loss": -9.090021133422852, "global_step": 81676, "epoch": 486} {"train_loss": -9.111639022827148, "global_step": 81677, "epoch": 486} {"train_loss": -9.333081245422363, "global_step": 81678, "epoch": 486} {"train_loss": -9.165088653564453, "global_step": 81679, "epoch": 486} {"train_loss": -9.075983047485352, "global_step": 81680, "epoch": 486} {"train_loss": -9.15595531463623, "global_step": 81681, "epoch": 486} {"train_loss": -9.200536727905273, "global_step": 81682, "epoch": 486} {"train_loss": -9.198386192321777, "global_step": 81683, "epoch": 486} {"train_loss": -9.178478240966797, "global_step": 81684, "epoch": 486} {"train_loss": -9.318754196166992, "global_step": 81685, "epoch": 486} {"train_loss": -9.337324142456055, "global_step": 81686, "epoch": 486} {"train_loss": -8.991079330444336, "global_step": 81687, "epoch": 486} {"train_loss": -9.221328735351562, "global_step": 81688, "epoch": 486} {"train_loss": -9.259726524353027, "global_step": 81689, "epoch": 486} {"train_loss": -9.124276161193848, "global_step": 81690, "epoch": 486} {"train_loss": -9.01869010925293, "global_step": 81691, "epoch": 486} {"train_loss": -9.31117057800293, "global_step": 81692, "epoch": 486} {"train_loss": -9.271360397338867, "global_step": 81693, "epoch": 486} {"train_loss": -9.18636703491211, "global_step": 81694, "epoch": 486} {"train_loss": -9.275033950805664, "global_step": 81695, "epoch": 486} {"train_loss": -9.337326049804688, "global_step": 81696, "epoch": 486} {"train_loss": -9.381318092346191, "global_step": 81697, "epoch": 486} {"train_loss": -9.154852867126465, "global_step": 81698, "epoch": 486} {"train_loss": -9.57315444946289, "global_step": 81699, "epoch": 486} {"train_loss": -9.324708938598633, "global_step": 81700, "epoch": 486} {"train_loss": -9.449048042297363, "global_step": 81701, "epoch": 486} {"train_loss": -9.128257751464844, "global_step": 81702, "epoch": 486} {"train_loss": -9.361547470092773, "global_step": 81703, "epoch": 486} {"train_loss": -9.369941711425781, "global_step": 81704, "epoch": 486} {"train_loss": -9.27769947052002, "global_step": 81705, "epoch": 486} {"train_loss": -8.96170425415039, "global_step": 81706, "epoch": 486} {"train_loss": -9.080684661865234, "global_step": 81707, "epoch": 486} {"train_loss": -9.263498306274414, "global_step": 81708, "epoch": 486} {"train_loss": -9.105917930603027, "global_step": 81709, "epoch": 486} {"train_loss": -9.189332962036133, "global_step": 81710, "epoch": 486} {"train_loss": -9.0922269821167, "global_step": 81711, "epoch": 486} {"train_loss": -9.471641540527344, "global_step": 81712, "epoch": 486} {"train_loss": -9.091878890991211, "global_step": 81713, "epoch": 486} {"train_loss": -8.986021041870117, "global_step": 81714, "epoch": 486} {"train_loss": -9.254467010498047, "global_step": 81715, "epoch": 486} {"train_loss": -8.900209426879883, "global_step": 81716, "epoch": 486} {"train_loss": -9.183874130249023, "global_step": 81717, "epoch": 486} {"train_loss": -9.086217880249023, "global_step": 81718, "epoch": 486} {"train_loss": -9.329615592956543, "global_step": 81719, "epoch": 486} {"train_loss": -8.757650375366211, "global_step": 81720, "epoch": 486} {"train_loss": -9.490839004516602, "global_step": 81721, "epoch": 486} {"train_loss": -9.276700973510742, "global_step": 81722, "epoch": 486} {"train_loss": -9.001622200012207, "global_step": 81723, "epoch": 486} {"train_loss": -9.21457290649414, "global_step": 81724, "epoch": 486} {"train_loss": -9.13672161102295, "global_step": 81725, "epoch": 486} {"train_loss": -9.265969276428223, "global_step": 81726, "epoch": 486} {"train_loss": -9.307188034057617, "global_step": 81727, "epoch": 486} {"train_loss": -9.228116989135742, "global_step": 81728, "epoch": 486} {"train_loss": -9.31175708770752, "global_step": 81729, "epoch": 486} {"train_loss": -9.212183952331543, "global_step": 81730, "epoch": 486} {"train_loss": -9.306169509887695, "global_step": 81731, "epoch": 486} {"train_loss": -9.378066062927246, "global_step": 81732, "epoch": 486} {"train_loss": -9.363323211669922, "global_step": 81733, "epoch": 486} {"train_loss": -9.475421905517578, "global_step": 81734, "epoch": 486} {"train_loss": -9.2387113571167, "global_step": 81735, "epoch": 486} {"train_loss": -9.556913375854492, "global_step": 81736, "epoch": 486} {"train_loss": -9.549976348876953, "global_step": 81737, "epoch": 486} {"train_loss": -9.359661102294922, "global_step": 81738, "epoch": 486} {"train_loss": -9.401954650878906, "global_step": 81739, "epoch": 486} {"train_loss": -9.472589492797852, "global_step": 81740, "epoch": 486} {"train_loss": -9.61752700805664, "global_step": 81741, "epoch": 486} {"train_loss": -9.71192741394043, "global_step": 81742, "epoch": 486} {"train_loss": -9.465646743774414, "global_step": 81743, "epoch": 486} {"train_loss": -9.428115844726562, "global_step": 81744, "epoch": 486} {"train_loss": -9.529821395874023, "global_step": 81745, "epoch": 486} {"train_loss": -9.493317604064941, "global_step": 81746, "epoch": 486} {"train_loss": -9.1557035446167, "global_step": 81747, "epoch": 486} {"train_loss": -9.555326461791992, "global_step": 81748, "epoch": 486} {"train_loss": -9.198853492736816, "global_step": 81749, "epoch": 486} {"train_loss": -8.553167343139648, "global_step": 81750, "epoch": 486} {"train_loss": -9.525505065917969, "global_step": 81751, "epoch": 486} {"train_loss": -8.443734169006348, "global_step": 81752, "epoch": 486} {"train_loss": -8.999759674072266, "global_step": 81753, "epoch": 486} {"train_loss": -9.03707218170166, "global_step": 81754, "epoch": 486} {"train_loss": -9.281120300292969, "global_step": 81755, "epoch": 486} {"train_loss": -8.997529029846191, "global_step": 81756, "epoch": 486} {"train_loss": -9.140583038330078, "global_step": 81757, "epoch": 486} {"train_loss": -8.970083236694336, "global_step": 81758, "epoch": 486} {"train_loss": -9.023740768432617, "global_step": 81759, "epoch": 486} {"train_loss": -9.265532493591309, "global_step": 81760, "epoch": 486} {"train_loss": -9.106576919555664, "global_step": 81761, "epoch": 486} {"train_loss": -9.307064056396484, "global_step": 81762, "epoch": 486} {"train_loss": -9.299697875976562, "global_step": 81763, "epoch": 486} {"train_loss": -9.380731582641602, "global_step": 81764, "epoch": 486} {"train_loss": -9.362309455871582, "global_step": 81765, "epoch": 486} {"train_loss": -9.361063957214355, "global_step": 81766, "epoch": 486} {"train_loss": -9.211860656738281, "global_step": 81767, "epoch": 486} {"train_loss": -9.525920867919922, "global_step": 81768, "epoch": 486} {"train_loss": -9.326558113098145, "global_step": 81769, "epoch": 486} {"train_loss": -9.311328887939453, "global_step": 81770, "epoch": 486} {"train_loss": -9.302267074584961, "global_step": 81771, "epoch": 486} {"train_loss": -9.390935897827148, "global_step": 81772, "epoch": 486} {"train_loss": -9.414497375488281, "global_step": 81773, "epoch": 486} {"train_loss": -9.548179626464844, "global_step": 81774, "epoch": 486} {"train_loss": -9.491148948669434, "global_step": 81775, "epoch": 486} {"train_loss": -9.496896743774414, "global_step": 81776, "epoch": 486} {"train_loss": -9.354862213134766, "global_step": 81777, "epoch": 486} {"train_loss": -9.422456741333008, "global_step": 81778, "epoch": 486} {"train_loss": -9.470678329467773, "global_step": 81779, "epoch": 486} {"train_loss": -9.557137489318848, "global_step": 81780, "epoch": 486} {"train_loss": -9.693192481994629, "global_step": 81781, "epoch": 486} {"train_loss": -9.515798568725586, "global_step": 81782, "epoch": 486} {"train_loss": -9.4189453125, "global_step": 81783, "epoch": 486} {"train_loss": -9.119924545288086, "global_step": 81784, "epoch": 486} {"train_loss": -9.404914855957031, "global_step": 81785, "epoch": 486} {"train_loss": -9.544685363769531, "global_step": 81786, "epoch": 486} {"train_loss": -9.324280738830566, "global_step": 81787, "epoch": 486} {"train_loss": -9.52751350402832, "global_step": 81788, "epoch": 486} {"train_loss": -9.361760139465332, "global_step": 81789, "epoch": 486} {"train_loss": -9.329536437988281, "global_step": 81790, "epoch": 486} {"train_loss": -9.08702564239502, "global_step": 81791, "epoch": 486} {"train_loss": -9.214615821838379, "global_step": 81792, "epoch": 486} {"train_loss": -9.166954040527344, "global_step": 81793, "epoch": 486} {"train_loss": -9.11806583404541, "global_step": 81794, "epoch": 486} {"train_loss": -9.287971496582031, "global_step": 81795, "epoch": 486} {"train_loss": -8.972360610961914, "global_step": 81796, "epoch": 486} {"train_loss": -9.086141586303711, "global_step": 81797, "epoch": 486} {"train_loss": -9.229058265686035, "global_step": 81798, "epoch": 486} {"train_loss": -9.023426055908203, "global_step": 81799, "epoch": 486} {"train_loss": -9.111069679260254, "global_step": 81800, "epoch": 486} {"train_loss": -9.000669479370117, "global_step": 81801, "epoch": 486} {"train_loss": -9.234711647033691, "global_step": 81802, "epoch": 486} {"train_loss": -9.049412727355957, "global_step": 81803, "epoch": 486} {"train_loss": -9.088603973388672, "global_step": 81804, "epoch": 486} {"train_loss": -8.892313003540039, "global_step": 81805, "epoch": 486} {"train_loss": -9.090237617492676, "global_step": 81806, "epoch": 486} {"train_loss": -8.982919692993164, "global_step": 81807, "epoch": 486} {"train_loss": -8.943872451782227, "global_step": 81808, "epoch": 486} {"train_loss": -9.288923263549805, "global_step": 81809, "epoch": 486} {"train_loss": -9.100425720214844, "global_step": 81810, "epoch": 486} {"train_loss": -9.034957885742188, "global_step": 81811, "epoch": 486} {"train_loss": -9.090269088745117, "global_step": 81812, "epoch": 486} {"train_loss": -9.120684623718262, "global_step": 81813, "epoch": 486} {"train_loss": -9.05070686340332, "global_step": 81814, "epoch": 486} {"train_loss": -9.23825660773686, "global_step": 81815, "epoch": 486, "val_loss": 198071.703125} {"train_loss": -9.032794952392578, "global_step": 81816, "epoch": 487} {"train_loss": -9.18359088897705, "global_step": 81817, "epoch": 487} {"train_loss": -9.075756072998047, "global_step": 81818, "epoch": 487} {"train_loss": -8.983166694641113, "global_step": 81819, "epoch": 487} {"train_loss": -9.280557632446289, "global_step": 81820, "epoch": 487} {"train_loss": -9.09830093383789, "global_step": 81821, "epoch": 487} {"train_loss": -8.984260559082031, "global_step": 81822, "epoch": 487} {"train_loss": -9.29053020477295, "global_step": 81823, "epoch": 487} {"train_loss": -8.85482406616211, "global_step": 81824, "epoch": 487} {"train_loss": -9.026869773864746, "global_step": 81825, "epoch": 487} {"train_loss": -9.336651802062988, "global_step": 81826, "epoch": 487} {"train_loss": -9.149718284606934, "global_step": 81827, "epoch": 487} {"train_loss": -9.214360237121582, "global_step": 81828, "epoch": 487} {"train_loss": -9.258831024169922, "global_step": 81829, "epoch": 487} {"train_loss": -8.903402328491211, "global_step": 81830, "epoch": 487} {"train_loss": -9.275840759277344, "global_step": 81831, "epoch": 487} {"train_loss": -9.371431350708008, "global_step": 81832, "epoch": 487} {"train_loss": -9.13071060180664, "global_step": 81833, "epoch": 487} {"train_loss": -9.288843154907227, "global_step": 81834, "epoch": 487} {"train_loss": -9.131795883178711, "global_step": 81835, "epoch": 487} {"train_loss": -9.214672088623047, "global_step": 81836, "epoch": 487} {"train_loss": -8.852276802062988, "global_step": 81837, "epoch": 487} {"train_loss": -9.033914566040039, "global_step": 81838, "epoch": 487} {"train_loss": -8.570900917053223, "global_step": 81839, "epoch": 487} {"train_loss": -8.93301010131836, "global_step": 81840, "epoch": 487} {"train_loss": -8.538145065307617, "global_step": 81841, "epoch": 487} {"train_loss": -8.682551383972168, "global_step": 81842, "epoch": 487} {"train_loss": -8.361342430114746, "global_step": 81843, "epoch": 487} {"train_loss": -8.491354942321777, "global_step": 81844, "epoch": 487} {"train_loss": -8.970195770263672, "global_step": 81845, "epoch": 487} {"train_loss": -8.747447967529297, "global_step": 81846, "epoch": 487} {"train_loss": -8.083124160766602, "global_step": 81847, "epoch": 487} {"train_loss": -8.933511734008789, "global_step": 81848, "epoch": 487} {"train_loss": -8.526575088500977, "global_step": 81849, "epoch": 487} {"train_loss": -8.374040603637695, "global_step": 81850, "epoch": 487} {"train_loss": -8.718072891235352, "global_step": 81851, "epoch": 487} {"train_loss": -8.45739459991455, "global_step": 81852, "epoch": 487} {"train_loss": -8.825011253356934, "global_step": 81853, "epoch": 487} {"train_loss": -9.026571273803711, "global_step": 81854, "epoch": 487} {"train_loss": -8.764671325683594, "global_step": 81855, "epoch": 487} {"train_loss": -9.047845840454102, "global_step": 81856, "epoch": 487} {"train_loss": -8.886215209960938, "global_step": 81857, "epoch": 487} {"train_loss": -9.015726089477539, "global_step": 81858, "epoch": 487} {"train_loss": -8.971681594848633, "global_step": 81859, "epoch": 487} {"train_loss": -8.829279899597168, "global_step": 81860, "epoch": 487} {"train_loss": -8.75666618347168, "global_step": 81861, "epoch": 487} {"train_loss": -9.180662155151367, "global_step": 81862, "epoch": 487} {"train_loss": -8.876527786254883, "global_step": 81863, "epoch": 487} {"train_loss": -8.873639106750488, "global_step": 81864, "epoch": 487} {"train_loss": -9.0715913772583, "global_step": 81865, "epoch": 487} {"train_loss": -9.166104316711426, "global_step": 81866, "epoch": 487} {"train_loss": -9.218355178833008, "global_step": 81867, "epoch": 487} {"train_loss": -9.263111114501953, "global_step": 81868, "epoch": 487} {"train_loss": -9.059840202331543, "global_step": 81869, "epoch": 487} {"train_loss": -9.044196128845215, "global_step": 81870, "epoch": 487} {"train_loss": -9.225776672363281, "global_step": 81871, "epoch": 487} {"train_loss": -9.246315956115723, "global_step": 81872, "epoch": 487} {"train_loss": -9.531766891479492, "global_step": 81873, "epoch": 487} {"train_loss": -9.188965797424316, "global_step": 81874, "epoch": 487} {"train_loss": -9.388809204101562, "global_step": 81875, "epoch": 487} {"train_loss": -9.327727317810059, "global_step": 81876, "epoch": 487} {"train_loss": -9.564406394958496, "global_step": 81877, "epoch": 487} {"train_loss": -9.561073303222656, "global_step": 81878, "epoch": 487} {"train_loss": -9.632246971130371, "global_step": 81879, "epoch": 487} {"train_loss": -9.468788146972656, "global_step": 81880, "epoch": 487} {"train_loss": -9.469837188720703, "global_step": 81881, "epoch": 487} {"train_loss": -9.347411155700684, "global_step": 81882, "epoch": 487} {"train_loss": -9.357999801635742, "global_step": 81883, "epoch": 487} {"train_loss": -9.116647720336914, "global_step": 81884, "epoch": 487} {"train_loss": -8.82296371459961, "global_step": 81885, "epoch": 487} {"train_loss": -9.426170349121094, "global_step": 81886, "epoch": 487} {"train_loss": -9.179486274719238, "global_step": 81887, "epoch": 487} {"train_loss": -9.357731819152832, "global_step": 81888, "epoch": 487} {"train_loss": -8.830339431762695, "global_step": 81889, "epoch": 487} {"train_loss": -8.547197341918945, "global_step": 81890, "epoch": 487} {"train_loss": -8.188410758972168, "global_step": 81891, "epoch": 487} {"train_loss": -8.664529800415039, "global_step": 81892, "epoch": 487} {"train_loss": -9.00102424621582, "global_step": 81893, "epoch": 487} {"train_loss": -8.886628150939941, "global_step": 81894, "epoch": 487} {"train_loss": -9.011001586914062, "global_step": 81895, "epoch": 487} {"train_loss": -9.020618438720703, "global_step": 81896, "epoch": 487} {"train_loss": -9.014351844787598, "global_step": 81897, "epoch": 487} {"train_loss": -8.83792495727539, "global_step": 81898, "epoch": 487} {"train_loss": -8.851286888122559, "global_step": 81899, "epoch": 487} {"train_loss": -9.078245162963867, "global_step": 81900, "epoch": 487} {"train_loss": -9.045266151428223, "global_step": 81901, "epoch": 487} {"train_loss": -9.340258598327637, "global_step": 81902, "epoch": 487} {"train_loss": -9.095817565917969, "global_step": 81903, "epoch": 487} {"train_loss": -9.02038288116455, "global_step": 81904, "epoch": 487} {"train_loss": -9.126358985900879, "global_step": 81905, "epoch": 487} {"train_loss": -9.157334327697754, "global_step": 81906, "epoch": 487} {"train_loss": -9.458194732666016, "global_step": 81907, "epoch": 487} {"train_loss": -9.217245101928711, "global_step": 81908, "epoch": 487} {"train_loss": -9.099013328552246, "global_step": 81909, "epoch": 487} {"train_loss": -9.300317764282227, "global_step": 81910, "epoch": 487} {"train_loss": -9.197977066040039, "global_step": 81911, "epoch": 487} {"train_loss": -9.136516571044922, "global_step": 81912, "epoch": 487} {"train_loss": -9.199945449829102, "global_step": 81913, "epoch": 487} {"train_loss": -8.9364652633667, "global_step": 81914, "epoch": 487} {"train_loss": -9.277270317077637, "global_step": 81915, "epoch": 487} {"train_loss": -9.486903190612793, "global_step": 81916, "epoch": 487} {"train_loss": -9.273757934570312, "global_step": 81917, "epoch": 487} {"train_loss": -9.208785057067871, "global_step": 81918, "epoch": 487} {"train_loss": -9.30634880065918, "global_step": 81919, "epoch": 487} {"train_loss": -9.08651065826416, "global_step": 81920, "epoch": 487} {"train_loss": -9.396223068237305, "global_step": 81921, "epoch": 487} {"train_loss": -9.535411834716797, "global_step": 81922, "epoch": 487} {"train_loss": -9.309833526611328, "global_step": 81923, "epoch": 487} {"train_loss": -9.308841705322266, "global_step": 81924, "epoch": 487} {"train_loss": -9.45033073425293, "global_step": 81925, "epoch": 487} {"train_loss": -9.44352912902832, "global_step": 81926, "epoch": 487} {"train_loss": -9.42972183227539, "global_step": 81927, "epoch": 487} {"train_loss": -9.30143928527832, "global_step": 81928, "epoch": 487} {"train_loss": -9.305734634399414, "global_step": 81929, "epoch": 487} {"train_loss": -9.684784889221191, "global_step": 81930, "epoch": 487} {"train_loss": -9.436494827270508, "global_step": 81931, "epoch": 487} {"train_loss": -9.254085540771484, "global_step": 81932, "epoch": 487} {"train_loss": -9.652929306030273, "global_step": 81933, "epoch": 487} {"train_loss": -9.517081260681152, "global_step": 81934, "epoch": 487} {"train_loss": -9.20467758178711, "global_step": 81935, "epoch": 487} {"train_loss": -9.56147575378418, "global_step": 81936, "epoch": 487} {"train_loss": -9.529526710510254, "global_step": 81937, "epoch": 487} {"train_loss": -9.419599533081055, "global_step": 81938, "epoch": 487} {"train_loss": -9.150315284729004, "global_step": 81939, "epoch": 487} {"train_loss": -9.241273880004883, "global_step": 81940, "epoch": 487} {"train_loss": -9.309138298034668, "global_step": 81941, "epoch": 487} {"train_loss": -9.289567947387695, "global_step": 81942, "epoch": 487} {"train_loss": -8.823832511901855, "global_step": 81943, "epoch": 487} {"train_loss": -9.334125518798828, "global_step": 81944, "epoch": 487} {"train_loss": -9.381078720092773, "global_step": 81945, "epoch": 487} {"train_loss": -9.08537483215332, "global_step": 81946, "epoch": 487} {"train_loss": -9.057703018188477, "global_step": 81947, "epoch": 487} {"train_loss": -9.068816184997559, "global_step": 81948, "epoch": 487} {"train_loss": -9.192591667175293, "global_step": 81949, "epoch": 487} {"train_loss": -9.094009399414062, "global_step": 81950, "epoch": 487} {"train_loss": -8.943897247314453, "global_step": 81951, "epoch": 487} {"train_loss": -8.865140914916992, "global_step": 81952, "epoch": 487} {"train_loss": -9.039639472961426, "global_step": 81953, "epoch": 487} {"train_loss": -9.060771942138672, "global_step": 81954, "epoch": 487} {"train_loss": -9.145055770874023, "global_step": 81955, "epoch": 487} {"train_loss": -8.9644775390625, "global_step": 81956, "epoch": 487} {"train_loss": -9.346885681152344, "global_step": 81957, "epoch": 487} {"train_loss": -8.936779975891113, "global_step": 81958, "epoch": 487} {"train_loss": -9.193880081176758, "global_step": 81959, "epoch": 487} {"train_loss": -9.463068008422852, "global_step": 81960, "epoch": 487} {"train_loss": -9.258879661560059, "global_step": 81961, "epoch": 487} {"train_loss": -9.332525253295898, "global_step": 81962, "epoch": 487} {"train_loss": -9.028098106384277, "global_step": 81963, "epoch": 487} {"train_loss": -9.205018997192383, "global_step": 81964, "epoch": 487} {"train_loss": -9.279021263122559, "global_step": 81965, "epoch": 487} {"train_loss": -9.381542205810547, "global_step": 81966, "epoch": 487} {"train_loss": -9.118924140930176, "global_step": 81967, "epoch": 487} {"train_loss": -9.332808494567871, "global_step": 81968, "epoch": 487} {"train_loss": -9.3430757522583, "global_step": 81969, "epoch": 487} {"train_loss": -9.466133117675781, "global_step": 81970, "epoch": 487} {"train_loss": -9.124248504638672, "global_step": 81971, "epoch": 487} {"train_loss": -9.338101387023926, "global_step": 81972, "epoch": 487} {"train_loss": -9.167074203491211, "global_step": 81973, "epoch": 487} {"train_loss": -9.416559219360352, "global_step": 81974, "epoch": 487} {"train_loss": -9.342021942138672, "global_step": 81975, "epoch": 487} {"train_loss": -9.472785949707031, "global_step": 81976, "epoch": 487} {"train_loss": -9.323896408081055, "global_step": 81977, "epoch": 487} {"train_loss": -9.208757400512695, "global_step": 81978, "epoch": 487} {"train_loss": -9.378351211547852, "global_step": 81979, "epoch": 487} {"train_loss": -9.303444862365723, "global_step": 81980, "epoch": 487} {"train_loss": -9.301776885986328, "global_step": 81981, "epoch": 487} {"train_loss": -9.41372013092041, "global_step": 81982, "epoch": 487} {"train_loss": -9.134547659329005, "global_step": 81983, "epoch": 487, "val_loss": 199949.234375} {"train_loss": -9.316608428955078, "global_step": 81984, "epoch": 488} {"train_loss": -9.317840576171875, "global_step": 81985, "epoch": 488} {"train_loss": -9.439559936523438, "global_step": 81986, "epoch": 488} {"train_loss": -9.102497100830078, "global_step": 81987, "epoch": 488} {"train_loss": -9.468016624450684, "global_step": 81988, "epoch": 488} {"train_loss": -9.258320808410645, "global_step": 81989, "epoch": 488} {"train_loss": -9.403095245361328, "global_step": 81990, "epoch": 488} {"train_loss": -9.29698371887207, "global_step": 81991, "epoch": 488} {"train_loss": -9.257813453674316, "global_step": 81992, "epoch": 488} {"train_loss": -9.258323669433594, "global_step": 81993, "epoch": 488} {"train_loss": -9.214553833007812, "global_step": 81994, "epoch": 488} {"train_loss": -9.455729484558105, "global_step": 81995, "epoch": 488} {"train_loss": -9.39921760559082, "global_step": 81996, "epoch": 488} {"train_loss": -9.517572402954102, "global_step": 81997, "epoch": 488} {"train_loss": -9.184720993041992, "global_step": 81998, "epoch": 488} {"train_loss": -9.303956985473633, "global_step": 81999, "epoch": 488} {"train_loss": -9.43612289428711, "global_step": 82000, "epoch": 488} {"train_loss": -9.272544860839844, "global_step": 82001, "epoch": 488} {"train_loss": -9.47912311553955, "global_step": 82002, "epoch": 488} {"train_loss": -9.395484924316406, "global_step": 82003, "epoch": 488} {"train_loss": -9.18405818939209, "global_step": 82004, "epoch": 488} {"train_loss": -9.223752975463867, "global_step": 82005, "epoch": 488} {"train_loss": -9.017213821411133, "global_step": 82006, "epoch": 488} {"train_loss": -9.075584411621094, "global_step": 82007, "epoch": 488} {"train_loss": -9.259637832641602, "global_step": 82008, "epoch": 488} {"train_loss": -9.117238998413086, "global_step": 82009, "epoch": 488} {"train_loss": -9.488686561584473, "global_step": 82010, "epoch": 488} {"train_loss": -9.377031326293945, "global_step": 82011, "epoch": 488} {"train_loss": -9.265111923217773, "global_step": 82012, "epoch": 488} {"train_loss": -9.333667755126953, "global_step": 82013, "epoch": 488} {"train_loss": -9.155346870422363, "global_step": 82014, "epoch": 488} {"train_loss": -9.435770988464355, "global_step": 82015, "epoch": 488} {"train_loss": -9.352754592895508, "global_step": 82016, "epoch": 488} {"train_loss": -9.244318008422852, "global_step": 82017, "epoch": 488} {"train_loss": -9.062585830688477, "global_step": 82018, "epoch": 488} {"train_loss": -9.458707809448242, "global_step": 82019, "epoch": 488} {"train_loss": -9.343456268310547, "global_step": 82020, "epoch": 488} {"train_loss": -9.38759994506836, "global_step": 82021, "epoch": 488} {"train_loss": -9.332324028015137, "global_step": 82022, "epoch": 488} {"train_loss": -9.50639533996582, "global_step": 82023, "epoch": 488} {"train_loss": -9.197641372680664, "global_step": 82024, "epoch": 488} {"train_loss": -9.31551456451416, "global_step": 82025, "epoch": 488} {"train_loss": -9.305183410644531, "global_step": 82026, "epoch": 488} {"train_loss": -9.252622604370117, "global_step": 82027, "epoch": 488} {"train_loss": -9.361251831054688, "global_step": 82028, "epoch": 488} {"train_loss": -9.281950950622559, "global_step": 82029, "epoch": 488} {"train_loss": -9.516361236572266, "global_step": 82030, "epoch": 488} {"train_loss": -9.421940803527832, "global_step": 82031, "epoch": 488} {"train_loss": -9.126246452331543, "global_step": 82032, "epoch": 488} {"train_loss": -9.41028118133545, "global_step": 82033, "epoch": 488} {"train_loss": -9.199117660522461, "global_step": 82034, "epoch": 488} {"train_loss": -9.273077964782715, "global_step": 82035, "epoch": 488} {"train_loss": -9.275300979614258, "global_step": 82036, "epoch": 488} {"train_loss": -9.42125129699707, "global_step": 82037, "epoch": 488} {"train_loss": -9.636411666870117, "global_step": 82038, "epoch": 488} {"train_loss": -9.358253479003906, "global_step": 82039, "epoch": 488} {"train_loss": -9.247283935546875, "global_step": 82040, "epoch": 488} {"train_loss": -8.95500373840332, "global_step": 82041, "epoch": 488} {"train_loss": -9.279775619506836, "global_step": 82042, "epoch": 488} {"train_loss": -9.018993377685547, "global_step": 82043, "epoch": 488} {"train_loss": -9.113150596618652, "global_step": 82044, "epoch": 488} {"train_loss": -8.857524871826172, "global_step": 82045, "epoch": 488} {"train_loss": -9.232601165771484, "global_step": 82046, "epoch": 488} {"train_loss": -8.943340301513672, "global_step": 82047, "epoch": 488} {"train_loss": -8.805584907531738, "global_step": 82048, "epoch": 488} {"train_loss": -9.146648406982422, "global_step": 82049, "epoch": 488} {"train_loss": -9.09707260131836, "global_step": 82050, "epoch": 488} {"train_loss": -8.866171836853027, "global_step": 82051, "epoch": 488} {"train_loss": -9.11639404296875, "global_step": 82052, "epoch": 488} {"train_loss": -9.265857696533203, "global_step": 82053, "epoch": 488} {"train_loss": -9.34443187713623, "global_step": 82054, "epoch": 488} {"train_loss": -9.273964881896973, "global_step": 82055, "epoch": 488} {"train_loss": -9.01390552520752, "global_step": 82056, "epoch": 488} {"train_loss": -9.285126686096191, "global_step": 82057, "epoch": 488} {"train_loss": -8.924752235412598, "global_step": 82058, "epoch": 488} {"train_loss": -8.926936149597168, "global_step": 82059, "epoch": 488} {"train_loss": -9.272520065307617, "global_step": 82060, "epoch": 488} {"train_loss": -9.393014907836914, "global_step": 82061, "epoch": 488} {"train_loss": -8.969897270202637, "global_step": 82062, "epoch": 488} {"train_loss": -9.278179168701172, "global_step": 82063, "epoch": 488} {"train_loss": -9.360931396484375, "global_step": 82064, "epoch": 488} {"train_loss": -9.217095375061035, "global_step": 82065, "epoch": 488} {"train_loss": -9.440467834472656, "global_step": 82066, "epoch": 488} {"train_loss": -9.354531288146973, "global_step": 82067, "epoch": 488} {"train_loss": -9.011635780334473, "global_step": 82068, "epoch": 488} {"train_loss": -9.221298217773438, "global_step": 82069, "epoch": 488} {"train_loss": -9.364980697631836, "global_step": 82070, "epoch": 488} {"train_loss": -9.10915470123291, "global_step": 82071, "epoch": 488} {"train_loss": -9.33838939666748, "global_step": 82072, "epoch": 488} {"train_loss": -9.37773609161377, "global_step": 82073, "epoch": 488} {"train_loss": -9.132290840148926, "global_step": 82074, "epoch": 488} {"train_loss": -9.290229797363281, "global_step": 82075, "epoch": 488} {"train_loss": -9.088563919067383, "global_step": 82076, "epoch": 488} {"train_loss": -9.404706954956055, "global_step": 82077, "epoch": 488} {"train_loss": -9.203963279724121, "global_step": 82078, "epoch": 488} {"train_loss": -9.121134757995605, "global_step": 82079, "epoch": 488} {"train_loss": -9.242990493774414, "global_step": 82080, "epoch": 488} {"train_loss": -9.082154273986816, "global_step": 82081, "epoch": 488} {"train_loss": -9.058232307434082, "global_step": 82082, "epoch": 488} {"train_loss": -9.39950180053711, "global_step": 82083, "epoch": 488} {"train_loss": -9.109331130981445, "global_step": 82084, "epoch": 488} {"train_loss": -9.001898765563965, "global_step": 82085, "epoch": 488} {"train_loss": -9.180976867675781, "global_step": 82086, "epoch": 488} {"train_loss": -9.28216552734375, "global_step": 82087, "epoch": 488} {"train_loss": -9.261666297912598, "global_step": 82088, "epoch": 488} {"train_loss": -8.845571517944336, "global_step": 82089, "epoch": 488} {"train_loss": -9.276166915893555, "global_step": 82090, "epoch": 488} {"train_loss": -9.130508422851562, "global_step": 82091, "epoch": 488} {"train_loss": -9.204623222351074, "global_step": 82092, "epoch": 488} {"train_loss": -8.719884872436523, "global_step": 82093, "epoch": 488} {"train_loss": -9.28439712524414, "global_step": 82094, "epoch": 488} {"train_loss": -9.174688339233398, "global_step": 82095, "epoch": 488} {"train_loss": -9.291801452636719, "global_step": 82096, "epoch": 488} {"train_loss": -9.370078086853027, "global_step": 82097, "epoch": 488} {"train_loss": -9.210930824279785, "global_step": 82098, "epoch": 488} {"train_loss": -9.122430801391602, "global_step": 82099, "epoch": 488} {"train_loss": -9.356277465820312, "global_step": 82100, "epoch": 488} {"train_loss": -9.34821891784668, "global_step": 82101, "epoch": 488} {"train_loss": -9.109190940856934, "global_step": 82102, "epoch": 488} {"train_loss": -9.507883071899414, "global_step": 82103, "epoch": 488} {"train_loss": -9.418996810913086, "global_step": 82104, "epoch": 488} {"train_loss": -9.379074096679688, "global_step": 82105, "epoch": 488} {"train_loss": -9.392461776733398, "global_step": 82106, "epoch": 488} {"train_loss": -9.350286483764648, "global_step": 82107, "epoch": 488} {"train_loss": -9.520447731018066, "global_step": 82108, "epoch": 488} {"train_loss": -9.202219009399414, "global_step": 82109, "epoch": 488} {"train_loss": -9.366058349609375, "global_step": 82110, "epoch": 488} {"train_loss": -9.35413646697998, "global_step": 82111, "epoch": 488} {"train_loss": -9.217092514038086, "global_step": 82112, "epoch": 488} {"train_loss": -9.548235893249512, "global_step": 82113, "epoch": 488} {"train_loss": -9.335237503051758, "global_step": 82114, "epoch": 488} {"train_loss": -9.290778160095215, "global_step": 82115, "epoch": 488} {"train_loss": -9.27527904510498, "global_step": 82116, "epoch": 488} {"train_loss": -9.369741439819336, "global_step": 82117, "epoch": 488} {"train_loss": -8.849736213684082, "global_step": 82118, "epoch": 488} {"train_loss": -9.273804664611816, "global_step": 82119, "epoch": 488} {"train_loss": -9.242877960205078, "global_step": 82120, "epoch": 488} {"train_loss": -9.184226036071777, "global_step": 82121, "epoch": 488} {"train_loss": -9.417572021484375, "global_step": 82122, "epoch": 488} {"train_loss": -9.210317611694336, "global_step": 82123, "epoch": 488} {"train_loss": -9.410629272460938, "global_step": 82124, "epoch": 488} {"train_loss": -9.044490814208984, "global_step": 82125, "epoch": 488} {"train_loss": -9.131608009338379, "global_step": 82126, "epoch": 488} {"train_loss": -9.529687881469727, "global_step": 82127, "epoch": 488} {"train_loss": -9.418787002563477, "global_step": 82128, "epoch": 488} {"train_loss": -9.257030487060547, "global_step": 82129, "epoch": 488} {"train_loss": -9.340032577514648, "global_step": 82130, "epoch": 488} {"train_loss": -9.49006462097168, "global_step": 82131, "epoch": 488} {"train_loss": -9.363292694091797, "global_step": 82132, "epoch": 488} {"train_loss": -9.368269920349121, "global_step": 82133, "epoch": 488} {"train_loss": -9.321344375610352, "global_step": 82134, "epoch": 488} {"train_loss": -9.471315383911133, "global_step": 82135, "epoch": 488} {"train_loss": -9.528448104858398, "global_step": 82136, "epoch": 488} {"train_loss": -9.244122505187988, "global_step": 82137, "epoch": 488} {"train_loss": -9.361043930053711, "global_step": 82138, "epoch": 488} {"train_loss": -9.190145492553711, "global_step": 82139, "epoch": 488} {"train_loss": -9.48370361328125, "global_step": 82140, "epoch": 488} {"train_loss": -9.261082649230957, "global_step": 82141, "epoch": 488} {"train_loss": -9.495426177978516, "global_step": 82142, "epoch": 488} {"train_loss": -9.30388069152832, "global_step": 82143, "epoch": 488} {"train_loss": -9.420669555664062, "global_step": 82144, "epoch": 488} {"train_loss": -9.446016311645508, "global_step": 82145, "epoch": 488} {"train_loss": -8.867712020874023, "global_step": 82146, "epoch": 488} {"train_loss": -9.395153045654297, "global_step": 82147, "epoch": 488} {"train_loss": -9.303678512573242, "global_step": 82148, "epoch": 488} {"train_loss": -9.35934829711914, "global_step": 82149, "epoch": 488} {"train_loss": -8.897031784057617, "global_step": 82150, "epoch": 488} {"train_loss": -9.26045907111395, "global_step": 82151, "epoch": 488, "val_loss": 197902.390625} {"train_loss": -9.460432052612305, "global_step": 82152, "epoch": 489} {"train_loss": -8.860210418701172, "global_step": 82153, "epoch": 489} {"train_loss": -9.310127258300781, "global_step": 82154, "epoch": 489} {"train_loss": -8.925647735595703, "global_step": 82155, "epoch": 489} {"train_loss": -9.103517532348633, "global_step": 82156, "epoch": 489} {"train_loss": -8.882665634155273, "global_step": 82157, "epoch": 489} {"train_loss": -9.213560104370117, "global_step": 82158, "epoch": 489} {"train_loss": -8.943624496459961, "global_step": 82159, "epoch": 489} {"train_loss": -9.19216251373291, "global_step": 82160, "epoch": 489} {"train_loss": -9.291499137878418, "global_step": 82161, "epoch": 489} {"train_loss": -9.083852767944336, "global_step": 82162, "epoch": 489} {"train_loss": -9.036209106445312, "global_step": 82163, "epoch": 489} {"train_loss": -9.169156074523926, "global_step": 82164, "epoch": 489} {"train_loss": -8.903383255004883, "global_step": 82165, "epoch": 489} {"train_loss": -9.278590202331543, "global_step": 82166, "epoch": 489} {"train_loss": -9.079740524291992, "global_step": 82167, "epoch": 489} {"train_loss": -9.279459953308105, "global_step": 82168, "epoch": 489} {"train_loss": -9.329856872558594, "global_step": 82169, "epoch": 489} {"train_loss": -9.554340362548828, "global_step": 82170, "epoch": 489} {"train_loss": -9.398813247680664, "global_step": 82171, "epoch": 489} {"train_loss": -9.25774097442627, "global_step": 82172, "epoch": 489} {"train_loss": -9.297276496887207, "global_step": 82173, "epoch": 489} {"train_loss": -9.332449913024902, "global_step": 82174, "epoch": 489} {"train_loss": -9.176194190979004, "global_step": 82175, "epoch": 489} {"train_loss": -9.378122329711914, "global_step": 82176, "epoch": 489} {"train_loss": -9.062067031860352, "global_step": 82177, "epoch": 489} {"train_loss": -9.486827850341797, "global_step": 82178, "epoch": 489} {"train_loss": -9.427098274230957, "global_step": 82179, "epoch": 489} {"train_loss": -9.322042465209961, "global_step": 82180, "epoch": 489} {"train_loss": -9.624837875366211, "global_step": 82181, "epoch": 489} {"train_loss": -9.610801696777344, "global_step": 82182, "epoch": 489} {"train_loss": -9.205103874206543, "global_step": 82183, "epoch": 489} {"train_loss": -9.320472717285156, "global_step": 82184, "epoch": 489} {"train_loss": -9.355356216430664, "global_step": 82185, "epoch": 489} {"train_loss": -9.390588760375977, "global_step": 82186, "epoch": 489} {"train_loss": -9.515664100646973, "global_step": 82187, "epoch": 489} {"train_loss": -9.433076858520508, "global_step": 82188, "epoch": 489} {"train_loss": -9.385303497314453, "global_step": 82189, "epoch": 489} {"train_loss": -9.282405853271484, "global_step": 82190, "epoch": 489} {"train_loss": -9.331663131713867, "global_step": 82191, "epoch": 489} {"train_loss": -9.338308334350586, "global_step": 82192, "epoch": 489} {"train_loss": -9.432194709777832, "global_step": 82193, "epoch": 489} {"train_loss": -9.380331993103027, "global_step": 82194, "epoch": 489} {"train_loss": -9.057168960571289, "global_step": 82195, "epoch": 489} {"train_loss": -9.10995101928711, "global_step": 82196, "epoch": 489} {"train_loss": -9.353494644165039, "global_step": 82197, "epoch": 489} {"train_loss": -9.171534538269043, "global_step": 82198, "epoch": 489} {"train_loss": -8.875066757202148, "global_step": 82199, "epoch": 489} {"train_loss": -9.27299976348877, "global_step": 82200, "epoch": 489} {"train_loss": -9.180081367492676, "global_step": 82201, "epoch": 489} {"train_loss": -9.215534210205078, "global_step": 82202, "epoch": 489} {"train_loss": -9.117470741271973, "global_step": 82203, "epoch": 489} {"train_loss": -8.911418914794922, "global_step": 82204, "epoch": 489} {"train_loss": -9.059762954711914, "global_step": 82205, "epoch": 489} {"train_loss": -8.69817066192627, "global_step": 82206, "epoch": 489} {"train_loss": -9.087190628051758, "global_step": 82207, "epoch": 489} {"train_loss": -8.866694450378418, "global_step": 82208, "epoch": 489} {"train_loss": -8.647214889526367, "global_step": 82209, "epoch": 489} {"train_loss": -8.421791076660156, "global_step": 82210, "epoch": 489} {"train_loss": -8.521732330322266, "global_step": 82211, "epoch": 489} {"train_loss": -8.45718765258789, "global_step": 82212, "epoch": 489} {"train_loss": -8.926610946655273, "global_step": 82213, "epoch": 489} {"train_loss": -8.579852104187012, "global_step": 82214, "epoch": 489} {"train_loss": -9.079662322998047, "global_step": 82215, "epoch": 489} {"train_loss": -8.919843673706055, "global_step": 82216, "epoch": 489} {"train_loss": -8.880498886108398, "global_step": 82217, "epoch": 489} {"train_loss": -8.803295135498047, "global_step": 82218, "epoch": 489} {"train_loss": -8.897285461425781, "global_step": 82219, "epoch": 489} {"train_loss": -9.026479721069336, "global_step": 82220, "epoch": 489} {"train_loss": -9.137493133544922, "global_step": 82221, "epoch": 489} {"train_loss": -9.11445426940918, "global_step": 82222, "epoch": 489} {"train_loss": -9.191762924194336, "global_step": 82223, "epoch": 489} {"train_loss": -9.091296195983887, "global_step": 82224, "epoch": 489} {"train_loss": -9.079282760620117, "global_step": 82225, "epoch": 489} {"train_loss": -8.979740142822266, "global_step": 82226, "epoch": 489} {"train_loss": -9.073934555053711, "global_step": 82227, "epoch": 489} {"train_loss": -9.029393196105957, "global_step": 82228, "epoch": 489} {"train_loss": -9.13395881652832, "global_step": 82229, "epoch": 489} {"train_loss": -9.021965026855469, "global_step": 82230, "epoch": 489} {"train_loss": -9.182581901550293, "global_step": 82231, "epoch": 489} {"train_loss": -9.014272689819336, "global_step": 82232, "epoch": 489} {"train_loss": -9.174942016601562, "global_step": 82233, "epoch": 489} {"train_loss": -9.12553882598877, "global_step": 82234, "epoch": 489} {"train_loss": -9.132050514221191, "global_step": 82235, "epoch": 489} {"train_loss": -9.14558219909668, "global_step": 82236, "epoch": 489} {"train_loss": -9.219182968139648, "global_step": 82237, "epoch": 489} {"train_loss": -9.109368324279785, "global_step": 82238, "epoch": 489} {"train_loss": -9.295328140258789, "global_step": 82239, "epoch": 489} {"train_loss": -8.942646026611328, "global_step": 82240, "epoch": 489} {"train_loss": -9.408397674560547, "global_step": 82241, "epoch": 489} {"train_loss": -9.229448318481445, "global_step": 82242, "epoch": 489} {"train_loss": -9.273067474365234, "global_step": 82243, "epoch": 489} {"train_loss": -9.089940071105957, "global_step": 82244, "epoch": 489} {"train_loss": -9.089460372924805, "global_step": 82245, "epoch": 489} {"train_loss": -9.513916015625, "global_step": 82246, "epoch": 489} {"train_loss": -9.38184928894043, "global_step": 82247, "epoch": 489} {"train_loss": -9.397406578063965, "global_step": 82248, "epoch": 489} {"train_loss": -9.241073608398438, "global_step": 82249, "epoch": 489} {"train_loss": -9.471474647521973, "global_step": 82250, "epoch": 489} {"train_loss": -9.607837677001953, "global_step": 82251, "epoch": 489} {"train_loss": -9.329909324645996, "global_step": 82252, "epoch": 489} {"train_loss": -9.312668800354004, "global_step": 82253, "epoch": 489} {"train_loss": -9.480195999145508, "global_step": 82254, "epoch": 489} {"train_loss": -9.312776565551758, "global_step": 82255, "epoch": 489} {"train_loss": -9.344078063964844, "global_step": 82256, "epoch": 489} {"train_loss": -9.38929557800293, "global_step": 82257, "epoch": 489} {"train_loss": -9.273547172546387, "global_step": 82258, "epoch": 489} {"train_loss": -9.47037410736084, "global_step": 82259, "epoch": 489} {"train_loss": -9.31689167022705, "global_step": 82260, "epoch": 489} {"train_loss": -9.410064697265625, "global_step": 82261, "epoch": 489} {"train_loss": -9.34665584564209, "global_step": 82262, "epoch": 489} {"train_loss": -9.0012788772583, "global_step": 82263, "epoch": 489} {"train_loss": -9.526444435119629, "global_step": 82264, "epoch": 489} {"train_loss": -9.01452922821045, "global_step": 82265, "epoch": 489} {"train_loss": -9.267227172851562, "global_step": 82266, "epoch": 489} {"train_loss": -9.139354705810547, "global_step": 82267, "epoch": 489} {"train_loss": -9.314208030700684, "global_step": 82268, "epoch": 489} {"train_loss": -9.164277076721191, "global_step": 82269, "epoch": 489} {"train_loss": -9.373493194580078, "global_step": 82270, "epoch": 489} {"train_loss": -9.272111892700195, "global_step": 82271, "epoch": 489} {"train_loss": -8.928848266601562, "global_step": 82272, "epoch": 489} {"train_loss": -9.310815811157227, "global_step": 82273, "epoch": 489} {"train_loss": -9.162304878234863, "global_step": 82274, "epoch": 489} {"train_loss": -9.25851058959961, "global_step": 82275, "epoch": 489} {"train_loss": -9.165159225463867, "global_step": 82276, "epoch": 489} {"train_loss": -9.25832748413086, "global_step": 82277, "epoch": 489} {"train_loss": -9.047523498535156, "global_step": 82278, "epoch": 489} {"train_loss": -9.383980751037598, "global_step": 82279, "epoch": 489} {"train_loss": -9.568716049194336, "global_step": 82280, "epoch": 489} {"train_loss": -9.410789489746094, "global_step": 82281, "epoch": 489} {"train_loss": -9.38986587524414, "global_step": 82282, "epoch": 489} {"train_loss": -9.4425048828125, "global_step": 82283, "epoch": 489} {"train_loss": -9.206315040588379, "global_step": 82284, "epoch": 489} {"train_loss": -9.519390106201172, "global_step": 82285, "epoch": 489} {"train_loss": -9.320083618164062, "global_step": 82286, "epoch": 489} {"train_loss": -9.461101531982422, "global_step": 82287, "epoch": 489} {"train_loss": -9.496004104614258, "global_step": 82288, "epoch": 489} {"train_loss": -9.351606369018555, "global_step": 82289, "epoch": 489} {"train_loss": -9.653974533081055, "global_step": 82290, "epoch": 489} {"train_loss": -9.033038139343262, "global_step": 82291, "epoch": 489} {"train_loss": -9.573318481445312, "global_step": 82292, "epoch": 489} {"train_loss": -9.641059875488281, "global_step": 82293, "epoch": 489} {"train_loss": -9.399145126342773, "global_step": 82294, "epoch": 489} {"train_loss": -9.467859268188477, "global_step": 82295, "epoch": 489} {"train_loss": -9.497095108032227, "global_step": 82296, "epoch": 489} {"train_loss": -9.439062118530273, "global_step": 82297, "epoch": 489} {"train_loss": -9.51242446899414, "global_step": 82298, "epoch": 489} {"train_loss": -9.566290855407715, "global_step": 82299, "epoch": 489} {"train_loss": -9.191936492919922, "global_step": 82300, "epoch": 489} {"train_loss": -8.975571632385254, "global_step": 82301, "epoch": 489} {"train_loss": -9.21745491027832, "global_step": 82302, "epoch": 489} {"train_loss": -9.353477478027344, "global_step": 82303, "epoch": 489} {"train_loss": -9.460750579833984, "global_step": 82304, "epoch": 489} {"train_loss": -9.324172973632812, "global_step": 82305, "epoch": 489} {"train_loss": -8.98680591583252, "global_step": 82306, "epoch": 489} {"train_loss": -9.3128662109375, "global_step": 82307, "epoch": 489} {"train_loss": -8.95745849609375, "global_step": 82308, "epoch": 489} {"train_loss": -9.508566856384277, "global_step": 82309, "epoch": 489} {"train_loss": -9.003326416015625, "global_step": 82310, "epoch": 489} {"train_loss": -8.860065460205078, "global_step": 82311, "epoch": 489} {"train_loss": -8.991323471069336, "global_step": 82312, "epoch": 489} {"train_loss": -8.72874641418457, "global_step": 82313, "epoch": 489} {"train_loss": -9.009687423706055, "global_step": 82314, "epoch": 489} {"train_loss": -8.713464736938477, "global_step": 82315, "epoch": 489} {"train_loss": -8.973396301269531, "global_step": 82316, "epoch": 489} {"train_loss": -8.921728134155273, "global_step": 82317, "epoch": 489} {"train_loss": -9.375691413879395, "global_step": 82318, "epoch": 489} {"train_loss": -9.203375992320833, "global_step": 82319, "epoch": 489, "val_loss": 199559.453125} {"train_loss": -9.293069839477539, "global_step": 82320, "epoch": 490} {"train_loss": -8.760940551757812, "global_step": 82321, "epoch": 490} {"train_loss": -9.048681259155273, "global_step": 82322, "epoch": 490} {"train_loss": -9.158330917358398, "global_step": 82323, "epoch": 490} {"train_loss": -8.971071243286133, "global_step": 82324, "epoch": 490} {"train_loss": -8.942856788635254, "global_step": 82325, "epoch": 490} {"train_loss": -8.853755950927734, "global_step": 82326, "epoch": 490} {"train_loss": -9.20057201385498, "global_step": 82327, "epoch": 490} {"train_loss": -9.223800659179688, "global_step": 82328, "epoch": 490} {"train_loss": -9.223991394042969, "global_step": 82329, "epoch": 490} {"train_loss": -9.065010070800781, "global_step": 82330, "epoch": 490} {"train_loss": -9.17691707611084, "global_step": 82331, "epoch": 490} {"train_loss": -9.12699031829834, "global_step": 82332, "epoch": 490} {"train_loss": -9.150718688964844, "global_step": 82333, "epoch": 490} {"train_loss": -9.362591743469238, "global_step": 82334, "epoch": 490} {"train_loss": -9.187450408935547, "global_step": 82335, "epoch": 490} {"train_loss": -9.507268905639648, "global_step": 82336, "epoch": 490} {"train_loss": -9.118612289428711, "global_step": 82337, "epoch": 490} {"train_loss": -9.229199409484863, "global_step": 82338, "epoch": 490} {"train_loss": -9.2869873046875, "global_step": 82339, "epoch": 490} {"train_loss": -9.366168975830078, "global_step": 82340, "epoch": 490} {"train_loss": -9.130687713623047, "global_step": 82341, "epoch": 490} {"train_loss": -9.401800155639648, "global_step": 82342, "epoch": 490} {"train_loss": -9.306341171264648, "global_step": 82343, "epoch": 490} {"train_loss": -9.370572090148926, "global_step": 82344, "epoch": 490} {"train_loss": -9.497480392456055, "global_step": 82345, "epoch": 490} {"train_loss": -9.41330337524414, "global_step": 82346, "epoch": 490} {"train_loss": -9.432317733764648, "global_step": 82347, "epoch": 490} {"train_loss": -9.061058044433594, "global_step": 82348, "epoch": 490} {"train_loss": -9.554187774658203, "global_step": 82349, "epoch": 490} {"train_loss": -9.367733001708984, "global_step": 82350, "epoch": 490} {"train_loss": -9.274395942687988, "global_step": 82351, "epoch": 490} {"train_loss": -9.18781852722168, "global_step": 82352, "epoch": 490} {"train_loss": -9.559720993041992, "global_step": 82353, "epoch": 490} {"train_loss": -9.194104194641113, "global_step": 82354, "epoch": 490} {"train_loss": -9.145163536071777, "global_step": 82355, "epoch": 490} {"train_loss": -8.869430541992188, "global_step": 82356, "epoch": 490} {"train_loss": -9.264593124389648, "global_step": 82357, "epoch": 490} {"train_loss": -8.911667823791504, "global_step": 82358, "epoch": 490} {"train_loss": -9.222570419311523, "global_step": 82359, "epoch": 490} {"train_loss": -9.309213638305664, "global_step": 82360, "epoch": 490} {"train_loss": -9.252074241638184, "global_step": 82361, "epoch": 490} {"train_loss": -8.889852523803711, "global_step": 82362, "epoch": 490} {"train_loss": -8.983274459838867, "global_step": 82363, "epoch": 490} {"train_loss": -8.488759994506836, "global_step": 82364, "epoch": 490} {"train_loss": -8.788849830627441, "global_step": 82365, "epoch": 490} {"train_loss": -8.995336532592773, "global_step": 82366, "epoch": 490} {"train_loss": -9.053293228149414, "global_step": 82367, "epoch": 490} {"train_loss": -9.100353240966797, "global_step": 82368, "epoch": 490} {"train_loss": -8.910131454467773, "global_step": 82369, "epoch": 490} {"train_loss": -9.19691276550293, "global_step": 82370, "epoch": 490} {"train_loss": -8.950128555297852, "global_step": 82371, "epoch": 490} {"train_loss": -9.102910995483398, "global_step": 82372, "epoch": 490} {"train_loss": -8.739092826843262, "global_step": 82373, "epoch": 490} {"train_loss": -9.295732498168945, "global_step": 82374, "epoch": 490} {"train_loss": -8.885059356689453, "global_step": 82375, "epoch": 490} {"train_loss": -9.034139633178711, "global_step": 82376, "epoch": 490} {"train_loss": -8.897256851196289, "global_step": 82377, "epoch": 490} {"train_loss": -8.966939926147461, "global_step": 82378, "epoch": 490} {"train_loss": -8.700777053833008, "global_step": 82379, "epoch": 490} {"train_loss": -8.726980209350586, "global_step": 82380, "epoch": 490} {"train_loss": -9.202938079833984, "global_step": 82381, "epoch": 490} {"train_loss": -8.84306526184082, "global_step": 82382, "epoch": 490} {"train_loss": -8.972586631774902, "global_step": 82383, "epoch": 490} {"train_loss": -9.231424331665039, "global_step": 82384, "epoch": 490} {"train_loss": -9.189075469970703, "global_step": 82385, "epoch": 490} {"train_loss": -9.189817428588867, "global_step": 82386, "epoch": 490} {"train_loss": -9.303351402282715, "global_step": 82387, "epoch": 490} {"train_loss": -9.16992473602295, "global_step": 82388, "epoch": 490} {"train_loss": -8.785268783569336, "global_step": 82389, "epoch": 490} {"train_loss": -9.214122772216797, "global_step": 82390, "epoch": 490} {"train_loss": -9.279197692871094, "global_step": 82391, "epoch": 490} {"train_loss": -9.277873039245605, "global_step": 82392, "epoch": 490} {"train_loss": -9.215937614440918, "global_step": 82393, "epoch": 490} {"train_loss": -9.365925788879395, "global_step": 82394, "epoch": 490} {"train_loss": -9.210564613342285, "global_step": 82395, "epoch": 490} {"train_loss": -9.195703506469727, "global_step": 82396, "epoch": 490} {"train_loss": -9.403353691101074, "global_step": 82397, "epoch": 490} {"train_loss": -8.866724014282227, "global_step": 82398, "epoch": 490} {"train_loss": -9.09622573852539, "global_step": 82399, "epoch": 490} {"train_loss": -8.589160919189453, "global_step": 82400, "epoch": 490} {"train_loss": -8.79666519165039, "global_step": 82401, "epoch": 490} {"train_loss": -8.441771507263184, "global_step": 82402, "epoch": 490} {"train_loss": -8.648645401000977, "global_step": 82403, "epoch": 490} {"train_loss": -8.223470687866211, "global_step": 82404, "epoch": 490} {"train_loss": -8.615619659423828, "global_step": 82405, "epoch": 490} {"train_loss": -8.843696594238281, "global_step": 82406, "epoch": 490} {"train_loss": -8.480798721313477, "global_step": 82407, "epoch": 490} {"train_loss": -9.01958179473877, "global_step": 82408, "epoch": 490} {"train_loss": -8.731918334960938, "global_step": 82409, "epoch": 490} {"train_loss": -8.792553901672363, "global_step": 82410, "epoch": 490} {"train_loss": -8.635305404663086, "global_step": 82411, "epoch": 490} {"train_loss": -8.809225082397461, "global_step": 82412, "epoch": 490} {"train_loss": -8.641119956970215, "global_step": 82413, "epoch": 490} {"train_loss": -8.713768005371094, "global_step": 82414, "epoch": 490} {"train_loss": -9.061585426330566, "global_step": 82415, "epoch": 490} {"train_loss": -8.690412521362305, "global_step": 82416, "epoch": 490} {"train_loss": -9.113801956176758, "global_step": 82417, "epoch": 490} {"train_loss": -8.987144470214844, "global_step": 82418, "epoch": 490} {"train_loss": -9.001230239868164, "global_step": 82419, "epoch": 490} {"train_loss": -9.144563674926758, "global_step": 82420, "epoch": 490} {"train_loss": -8.990083694458008, "global_step": 82421, "epoch": 490} {"train_loss": -9.154541015625, "global_step": 82422, "epoch": 490} {"train_loss": -9.120391845703125, "global_step": 82423, "epoch": 490} {"train_loss": -9.266020774841309, "global_step": 82424, "epoch": 490} {"train_loss": -9.250173568725586, "global_step": 82425, "epoch": 490} {"train_loss": -9.131026268005371, "global_step": 82426, "epoch": 490} {"train_loss": -9.177806854248047, "global_step": 82427, "epoch": 490} {"train_loss": -9.176473617553711, "global_step": 82428, "epoch": 490} {"train_loss": -8.999286651611328, "global_step": 82429, "epoch": 490} {"train_loss": -9.43145751953125, "global_step": 82430, "epoch": 490} {"train_loss": -9.176006317138672, "global_step": 82431, "epoch": 490} {"train_loss": -9.1565523147583, "global_step": 82432, "epoch": 490} {"train_loss": -9.356815338134766, "global_step": 82433, "epoch": 490} {"train_loss": -9.244779586791992, "global_step": 82434, "epoch": 490} {"train_loss": -9.414536476135254, "global_step": 82435, "epoch": 490} {"train_loss": -9.232348442077637, "global_step": 82436, "epoch": 490} {"train_loss": -9.409934043884277, "global_step": 82437, "epoch": 490} {"train_loss": -9.514095306396484, "global_step": 82438, "epoch": 490} {"train_loss": -9.283027648925781, "global_step": 82439, "epoch": 490} {"train_loss": -9.606182098388672, "global_step": 82440, "epoch": 490} {"train_loss": -9.488576889038086, "global_step": 82441, "epoch": 490} {"train_loss": -9.440330505371094, "global_step": 82442, "epoch": 490} {"train_loss": -9.404335021972656, "global_step": 82443, "epoch": 490} {"train_loss": -9.566780090332031, "global_step": 82444, "epoch": 490} {"train_loss": -9.451932907104492, "global_step": 82445, "epoch": 490} {"train_loss": -9.588621139526367, "global_step": 82446, "epoch": 490} {"train_loss": -9.235922813415527, "global_step": 82447, "epoch": 490} {"train_loss": -9.5433988571167, "global_step": 82448, "epoch": 490} {"train_loss": -9.590770721435547, "global_step": 82449, "epoch": 490} {"train_loss": -9.2941255569458, "global_step": 82450, "epoch": 490} {"train_loss": -9.425078392028809, "global_step": 82451, "epoch": 490} {"train_loss": -8.928332328796387, "global_step": 82452, "epoch": 490} {"train_loss": -9.189981460571289, "global_step": 82453, "epoch": 490} {"train_loss": -8.895149230957031, "global_step": 82454, "epoch": 490} {"train_loss": -9.339818000793457, "global_step": 82455, "epoch": 490} {"train_loss": -8.679174423217773, "global_step": 82456, "epoch": 490} {"train_loss": -8.995586395263672, "global_step": 82457, "epoch": 490} {"train_loss": -8.788007736206055, "global_step": 82458, "epoch": 490} {"train_loss": -8.775459289550781, "global_step": 82459, "epoch": 490} {"train_loss": -8.976115226745605, "global_step": 82460, "epoch": 490} {"train_loss": -8.651421546936035, "global_step": 82461, "epoch": 490} {"train_loss": -8.977745056152344, "global_step": 82462, "epoch": 490} {"train_loss": -9.077102661132812, "global_step": 82463, "epoch": 490} {"train_loss": -8.981361389160156, "global_step": 82464, "epoch": 490} {"train_loss": -8.945091247558594, "global_step": 82465, "epoch": 490} {"train_loss": -9.332244873046875, "global_step": 82466, "epoch": 490} {"train_loss": -9.201108932495117, "global_step": 82467, "epoch": 490} {"train_loss": -9.321453094482422, "global_step": 82468, "epoch": 490} {"train_loss": -9.031877517700195, "global_step": 82469, "epoch": 490} {"train_loss": -9.064165115356445, "global_step": 82470, "epoch": 490} {"train_loss": -9.125631332397461, "global_step": 82471, "epoch": 490} {"train_loss": -9.216784477233887, "global_step": 82472, "epoch": 490} {"train_loss": -9.202099800109863, "global_step": 82473, "epoch": 490} {"train_loss": -9.278179168701172, "global_step": 82474, "epoch": 490} {"train_loss": -9.206584930419922, "global_step": 82475, "epoch": 490} {"train_loss": -9.1774263381958, "global_step": 82476, "epoch": 490} {"train_loss": -9.501371383666992, "global_step": 82477, "epoch": 490} {"train_loss": -9.141555786132812, "global_step": 82478, "epoch": 490} {"train_loss": -9.320749282836914, "global_step": 82479, "epoch": 490} {"train_loss": -9.419015884399414, "global_step": 82480, "epoch": 490} {"train_loss": -9.423774719238281, "global_step": 82481, "epoch": 490} {"train_loss": -9.388772010803223, "global_step": 82482, "epoch": 490} {"train_loss": -9.559099197387695, "global_step": 82483, "epoch": 490} {"train_loss": -9.33659553527832, "global_step": 82484, "epoch": 490} {"train_loss": -9.56222915649414, "global_step": 82485, "epoch": 490} {"train_loss": -9.599859237670898, "global_step": 82486, "epoch": 490} {"train_loss": -9.12994719119299, "global_step": 82487, "epoch": 490, "val_loss": 197923.453125, "train_action_mse_error": 3.9869847297668457} {"train_loss": -9.375659942626953, "global_step": 82488, "epoch": 491} {"train_loss": -9.436271667480469, "global_step": 82489, "epoch": 491} {"train_loss": -9.388374328613281, "global_step": 82490, "epoch": 491} {"train_loss": -9.411375045776367, "global_step": 82491, "epoch": 491} {"train_loss": -9.496354103088379, "global_step": 82492, "epoch": 491} {"train_loss": -9.550799369812012, "global_step": 82493, "epoch": 491} {"train_loss": -9.48608684539795, "global_step": 82494, "epoch": 491} {"train_loss": -9.509384155273438, "global_step": 82495, "epoch": 491} {"train_loss": -9.181889533996582, "global_step": 82496, "epoch": 491} {"train_loss": -9.329275131225586, "global_step": 82497, "epoch": 491} {"train_loss": -9.315706253051758, "global_step": 82498, "epoch": 491} {"train_loss": -9.324624061584473, "global_step": 82499, "epoch": 491} {"train_loss": -9.43254280090332, "global_step": 82500, "epoch": 491} {"train_loss": -9.205548286437988, "global_step": 82501, "epoch": 491} {"train_loss": -9.194473266601562, "global_step": 82502, "epoch": 491} {"train_loss": -8.797807693481445, "global_step": 82503, "epoch": 491} {"train_loss": -8.968456268310547, "global_step": 82504, "epoch": 491} {"train_loss": -9.30327033996582, "global_step": 82505, "epoch": 491} {"train_loss": -8.865165710449219, "global_step": 82506, "epoch": 491} {"train_loss": -9.122215270996094, "global_step": 82507, "epoch": 491} {"train_loss": -8.807823181152344, "global_step": 82508, "epoch": 491} {"train_loss": -9.149656295776367, "global_step": 82509, "epoch": 491} {"train_loss": -8.882406234741211, "global_step": 82510, "epoch": 491} {"train_loss": -8.832911491394043, "global_step": 82511, "epoch": 491} {"train_loss": -9.008829116821289, "global_step": 82512, "epoch": 491} {"train_loss": -8.72762393951416, "global_step": 82513, "epoch": 491} {"train_loss": -8.945703506469727, "global_step": 82514, "epoch": 491} {"train_loss": -8.913724899291992, "global_step": 82515, "epoch": 491} {"train_loss": -8.818531036376953, "global_step": 82516, "epoch": 491} {"train_loss": -9.126916885375977, "global_step": 82517, "epoch": 491} {"train_loss": -8.837056159973145, "global_step": 82518, "epoch": 491} {"train_loss": -9.05678939819336, "global_step": 82519, "epoch": 491} {"train_loss": -9.215429306030273, "global_step": 82520, "epoch": 491} {"train_loss": -9.124753952026367, "global_step": 82521, "epoch": 491} {"train_loss": -9.0285062789917, "global_step": 82522, "epoch": 491} {"train_loss": -9.089298248291016, "global_step": 82523, "epoch": 491} {"train_loss": -8.950660705566406, "global_step": 82524, "epoch": 491} {"train_loss": -9.115415573120117, "global_step": 82525, "epoch": 491} {"train_loss": -9.017110824584961, "global_step": 82526, "epoch": 491} {"train_loss": -9.015059471130371, "global_step": 82527, "epoch": 491} {"train_loss": -9.134840965270996, "global_step": 82528, "epoch": 491} {"train_loss": -9.011621475219727, "global_step": 82529, "epoch": 491} {"train_loss": -9.115379333496094, "global_step": 82530, "epoch": 491} {"train_loss": -9.281686782836914, "global_step": 82531, "epoch": 491} {"train_loss": -9.033285140991211, "global_step": 82532, "epoch": 491} {"train_loss": -9.495565414428711, "global_step": 82533, "epoch": 491} {"train_loss": -8.99714183807373, "global_step": 82534, "epoch": 491} {"train_loss": -9.274958610534668, "global_step": 82535, "epoch": 491} {"train_loss": -9.194580078125, "global_step": 82536, "epoch": 491} {"train_loss": -9.250934600830078, "global_step": 82537, "epoch": 491} {"train_loss": -9.255607604980469, "global_step": 82538, "epoch": 491} {"train_loss": -9.259464263916016, "global_step": 82539, "epoch": 491} {"train_loss": -9.45052719116211, "global_step": 82540, "epoch": 491} {"train_loss": -9.049274444580078, "global_step": 82541, "epoch": 491} {"train_loss": -9.26419448852539, "global_step": 82542, "epoch": 491} {"train_loss": -9.326446533203125, "global_step": 82543, "epoch": 491} {"train_loss": -9.327462196350098, "global_step": 82544, "epoch": 491} {"train_loss": -9.440926551818848, "global_step": 82545, "epoch": 491} {"train_loss": -9.40275764465332, "global_step": 82546, "epoch": 491} {"train_loss": -9.462308883666992, "global_step": 82547, "epoch": 491} {"train_loss": -9.255708694458008, "global_step": 82548, "epoch": 491} {"train_loss": -9.08633804321289, "global_step": 82549, "epoch": 491} {"train_loss": -9.374906539916992, "global_step": 82550, "epoch": 491} {"train_loss": -9.101175308227539, "global_step": 82551, "epoch": 491} {"train_loss": -9.376630783081055, "global_step": 82552, "epoch": 491} {"train_loss": -9.27587890625, "global_step": 82553, "epoch": 491} {"train_loss": -9.213160514831543, "global_step": 82554, "epoch": 491} {"train_loss": -9.260759353637695, "global_step": 82555, "epoch": 491} {"train_loss": -9.126996994018555, "global_step": 82556, "epoch": 491} {"train_loss": -9.209522247314453, "global_step": 82557, "epoch": 491} {"train_loss": -9.251176834106445, "global_step": 82558, "epoch": 491} {"train_loss": -9.290456771850586, "global_step": 82559, "epoch": 491} {"train_loss": -9.144266128540039, "global_step": 82560, "epoch": 491} {"train_loss": -9.306428909301758, "global_step": 82561, "epoch": 491} {"train_loss": -9.114879608154297, "global_step": 82562, "epoch": 491} {"train_loss": -9.165555953979492, "global_step": 82563, "epoch": 491} {"train_loss": -9.27618408203125, "global_step": 82564, "epoch": 491} {"train_loss": -9.206771850585938, "global_step": 82565, "epoch": 491} {"train_loss": -9.172876358032227, "global_step": 82566, "epoch": 491} {"train_loss": -8.760887145996094, "global_step": 82567, "epoch": 491} {"train_loss": -9.151372909545898, "global_step": 82568, "epoch": 491} {"train_loss": -8.80863094329834, "global_step": 82569, "epoch": 491} {"train_loss": -8.955904006958008, "global_step": 82570, "epoch": 491} {"train_loss": -8.983104705810547, "global_step": 82571, "epoch": 491} {"train_loss": -9.002878189086914, "global_step": 82572, "epoch": 491} {"train_loss": -8.872950553894043, "global_step": 82573, "epoch": 491} {"train_loss": -9.411334037780762, "global_step": 82574, "epoch": 491} {"train_loss": -8.798857688903809, "global_step": 82575, "epoch": 491} {"train_loss": -9.186260223388672, "global_step": 82576, "epoch": 491} {"train_loss": -9.233467102050781, "global_step": 82577, "epoch": 491} {"train_loss": -9.194271087646484, "global_step": 82578, "epoch": 491} {"train_loss": -8.743743896484375, "global_step": 82579, "epoch": 491} {"train_loss": -9.268157958984375, "global_step": 82580, "epoch": 491} {"train_loss": -9.10203742980957, "global_step": 82581, "epoch": 491} {"train_loss": -9.305686950683594, "global_step": 82582, "epoch": 491} {"train_loss": -9.3248929977417, "global_step": 82583, "epoch": 491} {"train_loss": -9.114240646362305, "global_step": 82584, "epoch": 491} {"train_loss": -9.461987495422363, "global_step": 82585, "epoch": 491} {"train_loss": -9.321800231933594, "global_step": 82586, "epoch": 491} {"train_loss": -9.523321151733398, "global_step": 82587, "epoch": 491} {"train_loss": -9.358516693115234, "global_step": 82588, "epoch": 491} {"train_loss": -9.292348861694336, "global_step": 82589, "epoch": 491} {"train_loss": -9.28567886352539, "global_step": 82590, "epoch": 491} {"train_loss": -9.214461326599121, "global_step": 82591, "epoch": 491} {"train_loss": -9.24365234375, "global_step": 82592, "epoch": 491} {"train_loss": -9.555389404296875, "global_step": 82593, "epoch": 491} {"train_loss": -9.454200744628906, "global_step": 82594, "epoch": 491} {"train_loss": -9.434175491333008, "global_step": 82595, "epoch": 491} {"train_loss": -9.227724075317383, "global_step": 82596, "epoch": 491} {"train_loss": -9.198236465454102, "global_step": 82597, "epoch": 491} {"train_loss": -9.196427345275879, "global_step": 82598, "epoch": 491} {"train_loss": -9.391122817993164, "global_step": 82599, "epoch": 491} {"train_loss": -9.308673858642578, "global_step": 82600, "epoch": 491} {"train_loss": -9.414739608764648, "global_step": 82601, "epoch": 491} {"train_loss": -9.351532936096191, "global_step": 82602, "epoch": 491} {"train_loss": -9.364255905151367, "global_step": 82603, "epoch": 491} {"train_loss": -9.337104797363281, "global_step": 82604, "epoch": 491} {"train_loss": -9.415445327758789, "global_step": 82605, "epoch": 491} {"train_loss": -9.33751392364502, "global_step": 82606, "epoch": 491} {"train_loss": -9.33470344543457, "global_step": 82607, "epoch": 491} {"train_loss": -9.388199806213379, "global_step": 82608, "epoch": 491} {"train_loss": -9.281879425048828, "global_step": 82609, "epoch": 491} {"train_loss": -9.116329193115234, "global_step": 82610, "epoch": 491} {"train_loss": -9.370664596557617, "global_step": 82611, "epoch": 491} {"train_loss": -9.345527648925781, "global_step": 82612, "epoch": 491} {"train_loss": -8.990880012512207, "global_step": 82613, "epoch": 491} {"train_loss": -8.782155990600586, "global_step": 82614, "epoch": 491} {"train_loss": -9.217950820922852, "global_step": 82615, "epoch": 491} {"train_loss": -9.000650405883789, "global_step": 82616, "epoch": 491} {"train_loss": -9.005027770996094, "global_step": 82617, "epoch": 491} {"train_loss": -8.671928405761719, "global_step": 82618, "epoch": 491} {"train_loss": -8.833907127380371, "global_step": 82619, "epoch": 491} {"train_loss": -8.702920913696289, "global_step": 82620, "epoch": 491} {"train_loss": -8.978827476501465, "global_step": 82621, "epoch": 491} {"train_loss": -9.382902145385742, "global_step": 82622, "epoch": 491} {"train_loss": -8.954004287719727, "global_step": 82623, "epoch": 491} {"train_loss": -8.717405319213867, "global_step": 82624, "epoch": 491} {"train_loss": -8.941171646118164, "global_step": 82625, "epoch": 491} {"train_loss": -9.147632598876953, "global_step": 82626, "epoch": 491} {"train_loss": -8.893343925476074, "global_step": 82627, "epoch": 491} {"train_loss": -9.078561782836914, "global_step": 82628, "epoch": 491} {"train_loss": -9.220112800598145, "global_step": 82629, "epoch": 491} {"train_loss": -9.143503189086914, "global_step": 82630, "epoch": 491} {"train_loss": -9.206175804138184, "global_step": 82631, "epoch": 491} {"train_loss": -9.329572677612305, "global_step": 82632, "epoch": 491} {"train_loss": -9.09980297088623, "global_step": 82633, "epoch": 491} {"train_loss": -9.197465896606445, "global_step": 82634, "epoch": 491} {"train_loss": -9.211447715759277, "global_step": 82635, "epoch": 491} {"train_loss": -9.301093101501465, "global_step": 82636, "epoch": 491} {"train_loss": -9.138574600219727, "global_step": 82637, "epoch": 491} {"train_loss": -9.251412391662598, "global_step": 82638, "epoch": 491} {"train_loss": -9.060544967651367, "global_step": 82639, "epoch": 491} {"train_loss": -9.530464172363281, "global_step": 82640, "epoch": 491} {"train_loss": -9.043218612670898, "global_step": 82641, "epoch": 491} {"train_loss": -9.094165802001953, "global_step": 82642, "epoch": 491} {"train_loss": -9.426435470581055, "global_step": 82643, "epoch": 491} {"train_loss": -9.37923812866211, "global_step": 82644, "epoch": 491} {"train_loss": -9.376716613769531, "global_step": 82645, "epoch": 491} {"train_loss": -9.319866180419922, "global_step": 82646, "epoch": 491} {"train_loss": -9.591451644897461, "global_step": 82647, "epoch": 491} {"train_loss": -9.363113403320312, "global_step": 82648, "epoch": 491} {"train_loss": -9.391082763671875, "global_step": 82649, "epoch": 491} {"train_loss": -9.256280899047852, "global_step": 82650, "epoch": 491} {"train_loss": -9.083303451538086, "global_step": 82651, "epoch": 491} {"train_loss": -9.499480247497559, "global_step": 82652, "epoch": 491} {"train_loss": -9.191044807434082, "global_step": 82653, "epoch": 491} {"train_loss": -9.563620567321777, "global_step": 82654, "epoch": 491} {"train_loss": -9.189695012001764, "global_step": 82655, "epoch": 491, "val_loss": 200015.140625} {"train_loss": -9.358403205871582, "global_step": 82656, "epoch": 492} {"train_loss": -9.31995964050293, "global_step": 82657, "epoch": 492} {"train_loss": -9.315914154052734, "global_step": 82658, "epoch": 492} {"train_loss": -9.226844787597656, "global_step": 82659, "epoch": 492} {"train_loss": -9.272891998291016, "global_step": 82660, "epoch": 492} {"train_loss": -9.505910873413086, "global_step": 82661, "epoch": 492} {"train_loss": -9.3355073928833, "global_step": 82662, "epoch": 492} {"train_loss": -9.153144836425781, "global_step": 82663, "epoch": 492} {"train_loss": -8.932003021240234, "global_step": 82664, "epoch": 492} {"train_loss": -9.449337005615234, "global_step": 82665, "epoch": 492} {"train_loss": -9.113518714904785, "global_step": 82666, "epoch": 492} {"train_loss": -9.442609786987305, "global_step": 82667, "epoch": 492} {"train_loss": -9.441191673278809, "global_step": 82668, "epoch": 492} {"train_loss": -9.107734680175781, "global_step": 82669, "epoch": 492} {"train_loss": -9.20419692993164, "global_step": 82670, "epoch": 492} {"train_loss": -9.4244966506958, "global_step": 82671, "epoch": 492} {"train_loss": -9.053016662597656, "global_step": 82672, "epoch": 492} {"train_loss": -9.384469032287598, "global_step": 82673, "epoch": 492} {"train_loss": -9.38653564453125, "global_step": 82674, "epoch": 492} {"train_loss": -9.26485824584961, "global_step": 82675, "epoch": 492} {"train_loss": -9.182989120483398, "global_step": 82676, "epoch": 492} {"train_loss": -9.113042831420898, "global_step": 82677, "epoch": 492} {"train_loss": -9.22514533996582, "global_step": 82678, "epoch": 492} {"train_loss": -9.228450775146484, "global_step": 82679, "epoch": 492} {"train_loss": -9.071685791015625, "global_step": 82680, "epoch": 492} {"train_loss": -9.335084915161133, "global_step": 82681, "epoch": 492} {"train_loss": -8.972028732299805, "global_step": 82682, "epoch": 492} {"train_loss": -9.011825561523438, "global_step": 82683, "epoch": 492} {"train_loss": -8.99330997467041, "global_step": 82684, "epoch": 492} {"train_loss": -8.848984718322754, "global_step": 82685, "epoch": 492} {"train_loss": -8.641300201416016, "global_step": 82686, "epoch": 492} {"train_loss": -9.226564407348633, "global_step": 82687, "epoch": 492} {"train_loss": -9.183332443237305, "global_step": 82688, "epoch": 492} {"train_loss": -9.096620559692383, "global_step": 82689, "epoch": 492} {"train_loss": -9.148674964904785, "global_step": 82690, "epoch": 492} {"train_loss": -9.193912506103516, "global_step": 82691, "epoch": 492} {"train_loss": -9.418292999267578, "global_step": 82692, "epoch": 492} {"train_loss": -9.221324920654297, "global_step": 82693, "epoch": 492} {"train_loss": -9.226686477661133, "global_step": 82694, "epoch": 492} {"train_loss": -9.09288215637207, "global_step": 82695, "epoch": 492} {"train_loss": -9.216204643249512, "global_step": 82696, "epoch": 492} {"train_loss": -9.24759292602539, "global_step": 82697, "epoch": 492} {"train_loss": -9.061578750610352, "global_step": 82698, "epoch": 492} {"train_loss": -9.090987205505371, "global_step": 82699, "epoch": 492} {"train_loss": -9.177233695983887, "global_step": 82700, "epoch": 492} {"train_loss": -9.266788482666016, "global_step": 82701, "epoch": 492} {"train_loss": -9.127479553222656, "global_step": 82702, "epoch": 492} {"train_loss": -9.222293853759766, "global_step": 82703, "epoch": 492} {"train_loss": -9.194873809814453, "global_step": 82704, "epoch": 492} {"train_loss": -9.308938980102539, "global_step": 82705, "epoch": 492} {"train_loss": -9.216514587402344, "global_step": 82706, "epoch": 492} {"train_loss": -9.079137802124023, "global_step": 82707, "epoch": 492} {"train_loss": -9.105461120605469, "global_step": 82708, "epoch": 492} {"train_loss": -9.379295349121094, "global_step": 82709, "epoch": 492} {"train_loss": -9.046297073364258, "global_step": 82710, "epoch": 492} {"train_loss": -8.914823532104492, "global_step": 82711, "epoch": 492} {"train_loss": -9.368290901184082, "global_step": 82712, "epoch": 492} {"train_loss": -9.392250061035156, "global_step": 82713, "epoch": 492} {"train_loss": -9.170673370361328, "global_step": 82714, "epoch": 492} {"train_loss": -9.260336875915527, "global_step": 82715, "epoch": 492} {"train_loss": -9.283792495727539, "global_step": 82716, "epoch": 492} {"train_loss": -9.023090362548828, "global_step": 82717, "epoch": 492} {"train_loss": -9.243578910827637, "global_step": 82718, "epoch": 492} {"train_loss": -9.336989402770996, "global_step": 82719, "epoch": 492} {"train_loss": -9.032096862792969, "global_step": 82720, "epoch": 492} {"train_loss": -8.879983901977539, "global_step": 82721, "epoch": 492} {"train_loss": -9.039974212646484, "global_step": 82722, "epoch": 492} {"train_loss": -8.89689826965332, "global_step": 82723, "epoch": 492} {"train_loss": -9.23346996307373, "global_step": 82724, "epoch": 492} {"train_loss": -8.826038360595703, "global_step": 82725, "epoch": 492} {"train_loss": -8.87393569946289, "global_step": 82726, "epoch": 492} {"train_loss": -8.661063194274902, "global_step": 82727, "epoch": 492} {"train_loss": -9.104063987731934, "global_step": 82728, "epoch": 492} {"train_loss": -9.008549690246582, "global_step": 82729, "epoch": 492} {"train_loss": -8.971384048461914, "global_step": 82730, "epoch": 492} {"train_loss": -9.09865951538086, "global_step": 82731, "epoch": 492} {"train_loss": -9.082825660705566, "global_step": 82732, "epoch": 492} {"train_loss": -9.182755470275879, "global_step": 82733, "epoch": 492} {"train_loss": -8.909082412719727, "global_step": 82734, "epoch": 492} {"train_loss": -9.080656051635742, "global_step": 82735, "epoch": 492} {"train_loss": -9.247455596923828, "global_step": 82736, "epoch": 492} {"train_loss": -8.901254653930664, "global_step": 82737, "epoch": 492} {"train_loss": -8.749507904052734, "global_step": 82738, "epoch": 492} {"train_loss": -9.176074028015137, "global_step": 82739, "epoch": 492} {"train_loss": -9.05369758605957, "global_step": 82740, "epoch": 492} {"train_loss": -9.17072868347168, "global_step": 82741, "epoch": 492} {"train_loss": -9.406425476074219, "global_step": 82742, "epoch": 492} {"train_loss": -9.496553421020508, "global_step": 82743, "epoch": 492} {"train_loss": -9.335641860961914, "global_step": 82744, "epoch": 492} {"train_loss": -9.290447235107422, "global_step": 82745, "epoch": 492} {"train_loss": -9.43516731262207, "global_step": 82746, "epoch": 492} {"train_loss": -9.028169631958008, "global_step": 82747, "epoch": 492} {"train_loss": -9.273540496826172, "global_step": 82748, "epoch": 492} {"train_loss": -9.269464492797852, "global_step": 82749, "epoch": 492} {"train_loss": -9.257834434509277, "global_step": 82750, "epoch": 492} {"train_loss": -9.270763397216797, "global_step": 82751, "epoch": 492} {"train_loss": -9.616332054138184, "global_step": 82752, "epoch": 492} {"train_loss": -9.098052024841309, "global_step": 82753, "epoch": 492} {"train_loss": -9.325525283813477, "global_step": 82754, "epoch": 492} {"train_loss": -9.060401916503906, "global_step": 82755, "epoch": 492} {"train_loss": -9.357122421264648, "global_step": 82756, "epoch": 492} {"train_loss": -9.24554443359375, "global_step": 82757, "epoch": 492} {"train_loss": -9.313438415527344, "global_step": 82758, "epoch": 492} {"train_loss": -9.337903022766113, "global_step": 82759, "epoch": 492} {"train_loss": -9.198183059692383, "global_step": 82760, "epoch": 492} {"train_loss": -9.152059555053711, "global_step": 82761, "epoch": 492} {"train_loss": -9.338665008544922, "global_step": 82762, "epoch": 492} {"train_loss": -9.005500793457031, "global_step": 82763, "epoch": 492} {"train_loss": -9.51460075378418, "global_step": 82764, "epoch": 492} {"train_loss": -9.053861618041992, "global_step": 82765, "epoch": 492} {"train_loss": -9.237037658691406, "global_step": 82766, "epoch": 492} {"train_loss": -9.285636901855469, "global_step": 82767, "epoch": 492} {"train_loss": -9.254629135131836, "global_step": 82768, "epoch": 492} {"train_loss": -9.416454315185547, "global_step": 82769, "epoch": 492} {"train_loss": -9.377388000488281, "global_step": 82770, "epoch": 492} {"train_loss": -9.267208099365234, "global_step": 82771, "epoch": 492} {"train_loss": -9.473587989807129, "global_step": 82772, "epoch": 492} {"train_loss": -9.168885231018066, "global_step": 82773, "epoch": 492} {"train_loss": -9.291239738464355, "global_step": 82774, "epoch": 492} {"train_loss": -9.460477828979492, "global_step": 82775, "epoch": 492} {"train_loss": -9.18289566040039, "global_step": 82776, "epoch": 492} {"train_loss": -9.502037048339844, "global_step": 82777, "epoch": 492} {"train_loss": -9.055121421813965, "global_step": 82778, "epoch": 492} {"train_loss": -9.2452392578125, "global_step": 82779, "epoch": 492} {"train_loss": -8.901134490966797, "global_step": 82780, "epoch": 492} {"train_loss": -9.380735397338867, "global_step": 82781, "epoch": 492} {"train_loss": -9.002731323242188, "global_step": 82782, "epoch": 492} {"train_loss": -9.016916275024414, "global_step": 82783, "epoch": 492} {"train_loss": -9.180791854858398, "global_step": 82784, "epoch": 492} {"train_loss": -9.132083892822266, "global_step": 82785, "epoch": 492} {"train_loss": -9.270050048828125, "global_step": 82786, "epoch": 492} {"train_loss": -9.234166145324707, "global_step": 82787, "epoch": 492} {"train_loss": -9.158153533935547, "global_step": 82788, "epoch": 492} {"train_loss": -9.004657745361328, "global_step": 82789, "epoch": 492} {"train_loss": -9.252344131469727, "global_step": 82790, "epoch": 492} {"train_loss": -9.238386154174805, "global_step": 82791, "epoch": 492} {"train_loss": -9.0595703125, "global_step": 82792, "epoch": 492} {"train_loss": -9.283838272094727, "global_step": 82793, "epoch": 492} {"train_loss": -9.206480026245117, "global_step": 82794, "epoch": 492} {"train_loss": -9.180585861206055, "global_step": 82795, "epoch": 492} {"train_loss": -9.211315155029297, "global_step": 82796, "epoch": 492} {"train_loss": -9.244659423828125, "global_step": 82797, "epoch": 492} {"train_loss": -9.259952545166016, "global_step": 82798, "epoch": 492} {"train_loss": -9.28466796875, "global_step": 82799, "epoch": 492} {"train_loss": -9.145337104797363, "global_step": 82800, "epoch": 492} {"train_loss": -9.197354316711426, "global_step": 82801, "epoch": 492} {"train_loss": -9.511235237121582, "global_step": 82802, "epoch": 492} {"train_loss": -9.282243728637695, "global_step": 82803, "epoch": 492} {"train_loss": -9.346107482910156, "global_step": 82804, "epoch": 492} {"train_loss": -9.464601516723633, "global_step": 82805, "epoch": 492} {"train_loss": -9.171622276306152, "global_step": 82806, "epoch": 492} {"train_loss": -9.20261001586914, "global_step": 82807, "epoch": 492} {"train_loss": -9.20132064819336, "global_step": 82808, "epoch": 492} {"train_loss": -9.368160247802734, "global_step": 82809, "epoch": 492} {"train_loss": -9.252327919006348, "global_step": 82810, "epoch": 492} {"train_loss": -9.308682441711426, "global_step": 82811, "epoch": 492} {"train_loss": -9.282569885253906, "global_step": 82812, "epoch": 492} {"train_loss": -9.38949203491211, "global_step": 82813, "epoch": 492} {"train_loss": -9.255754470825195, "global_step": 82814, "epoch": 492} {"train_loss": -9.155064582824707, "global_step": 82815, "epoch": 492} {"train_loss": -9.199053764343262, "global_step": 82816, "epoch": 492} {"train_loss": -8.912981033325195, "global_step": 82817, "epoch": 492} {"train_loss": -9.397575378417969, "global_step": 82818, "epoch": 492} {"train_loss": -9.272457122802734, "global_step": 82819, "epoch": 492} {"train_loss": -9.323657989501953, "global_step": 82820, "epoch": 492} {"train_loss": -9.250336647033691, "global_step": 82821, "epoch": 492} {"train_loss": -9.255300521850586, "global_step": 82822, "epoch": 492} {"train_loss": -9.201456654639472, "global_step": 82823, "epoch": 492, "val_loss": 199758.421875} {"train_loss": -9.387409210205078, "global_step": 82824, "epoch": 493} {"train_loss": -9.476801872253418, "global_step": 82825, "epoch": 493} {"train_loss": -9.291696548461914, "global_step": 82826, "epoch": 493} {"train_loss": -9.26871395111084, "global_step": 82827, "epoch": 493} {"train_loss": -9.443872451782227, "global_step": 82828, "epoch": 493} {"train_loss": -8.962743759155273, "global_step": 82829, "epoch": 493} {"train_loss": -9.493515014648438, "global_step": 82830, "epoch": 493} {"train_loss": -9.273313522338867, "global_step": 82831, "epoch": 493} {"train_loss": -9.318370819091797, "global_step": 82832, "epoch": 493} {"train_loss": -9.022604942321777, "global_step": 82833, "epoch": 493} {"train_loss": -9.106698989868164, "global_step": 82834, "epoch": 493} {"train_loss": -8.903202056884766, "global_step": 82835, "epoch": 493} {"train_loss": -9.182947158813477, "global_step": 82836, "epoch": 493} {"train_loss": -9.143158912658691, "global_step": 82837, "epoch": 493} {"train_loss": -9.342211723327637, "global_step": 82838, "epoch": 493} {"train_loss": -8.91734504699707, "global_step": 82839, "epoch": 493} {"train_loss": -9.262419700622559, "global_step": 82840, "epoch": 493} {"train_loss": -9.533035278320312, "global_step": 82841, "epoch": 493} {"train_loss": -9.301630020141602, "global_step": 82842, "epoch": 493} {"train_loss": -9.295917510986328, "global_step": 82843, "epoch": 493} {"train_loss": -9.158374786376953, "global_step": 82844, "epoch": 493} {"train_loss": -9.349489212036133, "global_step": 82845, "epoch": 493} {"train_loss": -9.2528076171875, "global_step": 82846, "epoch": 493} {"train_loss": -9.289962768554688, "global_step": 82847, "epoch": 493} {"train_loss": -9.245010375976562, "global_step": 82848, "epoch": 493} {"train_loss": -9.170889854431152, "global_step": 82849, "epoch": 493} {"train_loss": -9.204985618591309, "global_step": 82850, "epoch": 493} {"train_loss": -9.189908981323242, "global_step": 82851, "epoch": 493} {"train_loss": -9.262340545654297, "global_step": 82852, "epoch": 493} {"train_loss": -9.2357759475708, "global_step": 82853, "epoch": 493} {"train_loss": -9.292177200317383, "global_step": 82854, "epoch": 493} {"train_loss": -8.970746994018555, "global_step": 82855, "epoch": 493} {"train_loss": -9.509344100952148, "global_step": 82856, "epoch": 493} {"train_loss": -9.049854278564453, "global_step": 82857, "epoch": 493} {"train_loss": -9.442357063293457, "global_step": 82858, "epoch": 493} {"train_loss": -9.195840835571289, "global_step": 82859, "epoch": 493} {"train_loss": -9.205232620239258, "global_step": 82860, "epoch": 493} {"train_loss": -9.226860046386719, "global_step": 82861, "epoch": 493} {"train_loss": -9.002634048461914, "global_step": 82862, "epoch": 493} {"train_loss": -9.192926406860352, "global_step": 82863, "epoch": 493} {"train_loss": -9.141397476196289, "global_step": 82864, "epoch": 493} {"train_loss": -8.874704360961914, "global_step": 82865, "epoch": 493} {"train_loss": -9.157455444335938, "global_step": 82866, "epoch": 493} {"train_loss": -9.25285530090332, "global_step": 82867, "epoch": 493} {"train_loss": -9.251896858215332, "global_step": 82868, "epoch": 493} {"train_loss": -9.420503616333008, "global_step": 82869, "epoch": 493} {"train_loss": -9.262364387512207, "global_step": 82870, "epoch": 493} {"train_loss": -9.028059005737305, "global_step": 82871, "epoch": 493} {"train_loss": -9.30311107635498, "global_step": 82872, "epoch": 493} {"train_loss": -9.222379684448242, "global_step": 82873, "epoch": 493} {"train_loss": -8.952631950378418, "global_step": 82874, "epoch": 493} {"train_loss": -9.486106872558594, "global_step": 82875, "epoch": 493} {"train_loss": -9.0646333694458, "global_step": 82876, "epoch": 493} {"train_loss": -9.176408767700195, "global_step": 82877, "epoch": 493} {"train_loss": -9.243492126464844, "global_step": 82878, "epoch": 493} {"train_loss": -9.229434967041016, "global_step": 82879, "epoch": 493} {"train_loss": -9.073296546936035, "global_step": 82880, "epoch": 493} {"train_loss": -9.015128135681152, "global_step": 82881, "epoch": 493} {"train_loss": -8.850898742675781, "global_step": 82882, "epoch": 493} {"train_loss": -9.157210350036621, "global_step": 82883, "epoch": 493} {"train_loss": -9.098124504089355, "global_step": 82884, "epoch": 493} {"train_loss": -9.101078987121582, "global_step": 82885, "epoch": 493} {"train_loss": -9.270366668701172, "global_step": 82886, "epoch": 493} {"train_loss": -9.466861724853516, "global_step": 82887, "epoch": 493} {"train_loss": -9.115485191345215, "global_step": 82888, "epoch": 493} {"train_loss": -9.381874084472656, "global_step": 82889, "epoch": 493} {"train_loss": -8.926773071289062, "global_step": 82890, "epoch": 493} {"train_loss": -9.370431900024414, "global_step": 82891, "epoch": 493} {"train_loss": -9.371757507324219, "global_step": 82892, "epoch": 493} {"train_loss": -9.303791046142578, "global_step": 82893, "epoch": 493} {"train_loss": -9.245861053466797, "global_step": 82894, "epoch": 493} {"train_loss": -9.515087127685547, "global_step": 82895, "epoch": 493} {"train_loss": -9.160289764404297, "global_step": 82896, "epoch": 493} {"train_loss": -9.236930847167969, "global_step": 82897, "epoch": 493} {"train_loss": -9.443642616271973, "global_step": 82898, "epoch": 493} {"train_loss": -9.084829330444336, "global_step": 82899, "epoch": 493} {"train_loss": -9.57099723815918, "global_step": 82900, "epoch": 493} {"train_loss": -9.337265014648438, "global_step": 82901, "epoch": 493} {"train_loss": -9.197029113769531, "global_step": 82902, "epoch": 493} {"train_loss": -9.439652442932129, "global_step": 82903, "epoch": 493} {"train_loss": -9.146158218383789, "global_step": 82904, "epoch": 493} {"train_loss": -9.157022476196289, "global_step": 82905, "epoch": 493} {"train_loss": -9.226133346557617, "global_step": 82906, "epoch": 493} {"train_loss": -9.087444305419922, "global_step": 82907, "epoch": 493} {"train_loss": -9.354252815246582, "global_step": 82908, "epoch": 493} {"train_loss": -9.15648365020752, "global_step": 82909, "epoch": 493} {"train_loss": -9.375797271728516, "global_step": 82910, "epoch": 493} {"train_loss": -9.518434524536133, "global_step": 82911, "epoch": 493} {"train_loss": -9.129920959472656, "global_step": 82912, "epoch": 493} {"train_loss": -9.62230110168457, "global_step": 82913, "epoch": 493} {"train_loss": -9.459800720214844, "global_step": 82914, "epoch": 493} {"train_loss": -9.4571533203125, "global_step": 82915, "epoch": 493} {"train_loss": -9.312206268310547, "global_step": 82916, "epoch": 493} {"train_loss": -9.430681228637695, "global_step": 82917, "epoch": 493} {"train_loss": -9.250856399536133, "global_step": 82918, "epoch": 493} {"train_loss": -9.759068489074707, "global_step": 82919, "epoch": 493} {"train_loss": -9.15926742553711, "global_step": 82920, "epoch": 493} {"train_loss": -9.387474060058594, "global_step": 82921, "epoch": 493} {"train_loss": -8.90736198425293, "global_step": 82922, "epoch": 493} {"train_loss": -9.538228034973145, "global_step": 82923, "epoch": 493} {"train_loss": -9.199752807617188, "global_step": 82924, "epoch": 493} {"train_loss": -8.866735458374023, "global_step": 82925, "epoch": 493} {"train_loss": -9.212733268737793, "global_step": 82926, "epoch": 493} {"train_loss": -9.280414581298828, "global_step": 82927, "epoch": 493} {"train_loss": -9.19338607788086, "global_step": 82928, "epoch": 493} {"train_loss": -9.398548126220703, "global_step": 82929, "epoch": 493} {"train_loss": -9.20452880859375, "global_step": 82930, "epoch": 493} {"train_loss": -9.19299030303955, "global_step": 82931, "epoch": 493} {"train_loss": -9.258517265319824, "global_step": 82932, "epoch": 493} {"train_loss": -9.487340927124023, "global_step": 82933, "epoch": 493} {"train_loss": -9.097345352172852, "global_step": 82934, "epoch": 493} {"train_loss": -9.50615119934082, "global_step": 82935, "epoch": 493} {"train_loss": -9.254558563232422, "global_step": 82936, "epoch": 493} {"train_loss": -9.36674690246582, "global_step": 82937, "epoch": 493} {"train_loss": -9.288281440734863, "global_step": 82938, "epoch": 493} {"train_loss": -9.273263931274414, "global_step": 82939, "epoch": 493} {"train_loss": -9.282488822937012, "global_step": 82940, "epoch": 493} {"train_loss": -9.300540924072266, "global_step": 82941, "epoch": 493} {"train_loss": -9.3732271194458, "global_step": 82942, "epoch": 493} {"train_loss": -9.330679893493652, "global_step": 82943, "epoch": 493} {"train_loss": -9.422879219055176, "global_step": 82944, "epoch": 493} {"train_loss": -9.343341827392578, "global_step": 82945, "epoch": 493} {"train_loss": -9.571307182312012, "global_step": 82946, "epoch": 493} {"train_loss": -9.099912643432617, "global_step": 82947, "epoch": 493} {"train_loss": -9.310640335083008, "global_step": 82948, "epoch": 493} {"train_loss": -9.20220947265625, "global_step": 82949, "epoch": 493} {"train_loss": -9.276200294494629, "global_step": 82950, "epoch": 493} {"train_loss": -9.504343032836914, "global_step": 82951, "epoch": 493} {"train_loss": -9.17348861694336, "global_step": 82952, "epoch": 493} {"train_loss": -9.144318580627441, "global_step": 82953, "epoch": 493} {"train_loss": -8.63323974609375, "global_step": 82954, "epoch": 493} {"train_loss": -9.101490020751953, "global_step": 82955, "epoch": 493} {"train_loss": -9.143851280212402, "global_step": 82956, "epoch": 493} {"train_loss": -9.262897491455078, "global_step": 82957, "epoch": 493} {"train_loss": -9.087276458740234, "global_step": 82958, "epoch": 493} {"train_loss": -9.290787696838379, "global_step": 82959, "epoch": 493} {"train_loss": -9.254432678222656, "global_step": 82960, "epoch": 493} {"train_loss": -9.001404762268066, "global_step": 82961, "epoch": 493} {"train_loss": -9.257730484008789, "global_step": 82962, "epoch": 493} {"train_loss": -9.197778701782227, "global_step": 82963, "epoch": 493} {"train_loss": -9.001424789428711, "global_step": 82964, "epoch": 493} {"train_loss": -9.292162895202637, "global_step": 82965, "epoch": 493} {"train_loss": -9.021926879882812, "global_step": 82966, "epoch": 493} {"train_loss": -9.045307159423828, "global_step": 82967, "epoch": 493} {"train_loss": -9.072532653808594, "global_step": 82968, "epoch": 493} {"train_loss": -9.311429023742676, "global_step": 82969, "epoch": 493} {"train_loss": -9.197965621948242, "global_step": 82970, "epoch": 493} {"train_loss": -8.989240646362305, "global_step": 82971, "epoch": 493} {"train_loss": -9.211706161499023, "global_step": 82972, "epoch": 493} {"train_loss": -9.19565200805664, "global_step": 82973, "epoch": 493} {"train_loss": -9.020208358764648, "global_step": 82974, "epoch": 493} {"train_loss": -8.976003646850586, "global_step": 82975, "epoch": 493} {"train_loss": -9.044008255004883, "global_step": 82976, "epoch": 493} {"train_loss": -9.076202392578125, "global_step": 82977, "epoch": 493} {"train_loss": -9.35110855102539, "global_step": 82978, "epoch": 493} {"train_loss": -9.121959686279297, "global_step": 82979, "epoch": 493} {"train_loss": -9.246047973632812, "global_step": 82980, "epoch": 493} {"train_loss": -9.24385929107666, "global_step": 82981, "epoch": 493} {"train_loss": -9.138261795043945, "global_step": 82982, "epoch": 493} {"train_loss": -9.211418151855469, "global_step": 82983, "epoch": 493} {"train_loss": -9.072507858276367, "global_step": 82984, "epoch": 493} {"train_loss": -9.242122650146484, "global_step": 82985, "epoch": 493} {"train_loss": -9.456527709960938, "global_step": 82986, "epoch": 493} {"train_loss": -9.485788345336914, "global_step": 82987, "epoch": 493} {"train_loss": -9.114230155944824, "global_step": 82988, "epoch": 493} {"train_loss": -9.419925689697266, "global_step": 82989, "epoch": 493} {"train_loss": -9.409626960754395, "global_step": 82990, "epoch": 493} {"train_loss": -9.234718617938814, "global_step": 82991, "epoch": 493, "val_loss": 197716.296875} {"train_loss": -9.382991790771484, "global_step": 82992, "epoch": 494} {"train_loss": -9.383831024169922, "global_step": 82993, "epoch": 494} {"train_loss": -9.320856094360352, "global_step": 82994, "epoch": 494} {"train_loss": -9.372526168823242, "global_step": 82995, "epoch": 494} {"train_loss": -9.117158889770508, "global_step": 82996, "epoch": 494} {"train_loss": -9.477431297302246, "global_step": 82997, "epoch": 494} {"train_loss": -9.393904685974121, "global_step": 82998, "epoch": 494} {"train_loss": -9.336095809936523, "global_step": 82999, "epoch": 494} {"train_loss": -9.223920822143555, "global_step": 83000, "epoch": 494} {"train_loss": -9.123321533203125, "global_step": 83001, "epoch": 494} {"train_loss": -9.507194519042969, "global_step": 83002, "epoch": 494} {"train_loss": -8.991083145141602, "global_step": 83003, "epoch": 494} {"train_loss": -9.486916542053223, "global_step": 83004, "epoch": 494} {"train_loss": -8.981353759765625, "global_step": 83005, "epoch": 494} {"train_loss": -9.443233489990234, "global_step": 83006, "epoch": 494} {"train_loss": -9.414016723632812, "global_step": 83007, "epoch": 494} {"train_loss": -9.51266098022461, "global_step": 83008, "epoch": 494} {"train_loss": -9.405509948730469, "global_step": 83009, "epoch": 494} {"train_loss": -9.494841575622559, "global_step": 83010, "epoch": 494} {"train_loss": -9.080674171447754, "global_step": 83011, "epoch": 494} {"train_loss": -9.492241859436035, "global_step": 83012, "epoch": 494} {"train_loss": -9.357549667358398, "global_step": 83013, "epoch": 494} {"train_loss": -9.216482162475586, "global_step": 83014, "epoch": 494} {"train_loss": -9.474510192871094, "global_step": 83015, "epoch": 494} {"train_loss": -9.230573654174805, "global_step": 83016, "epoch": 494} {"train_loss": -9.102224349975586, "global_step": 83017, "epoch": 494} {"train_loss": -9.58842658996582, "global_step": 83018, "epoch": 494} {"train_loss": -8.987178802490234, "global_step": 83019, "epoch": 494} {"train_loss": -9.210824966430664, "global_step": 83020, "epoch": 494} {"train_loss": -9.233726501464844, "global_step": 83021, "epoch": 494} {"train_loss": -9.110801696777344, "global_step": 83022, "epoch": 494} {"train_loss": -9.343870162963867, "global_step": 83023, "epoch": 494} {"train_loss": -9.24630355834961, "global_step": 83024, "epoch": 494} {"train_loss": -9.50340461730957, "global_step": 83025, "epoch": 494} {"train_loss": -9.305459976196289, "global_step": 83026, "epoch": 494} {"train_loss": -9.218852996826172, "global_step": 83027, "epoch": 494} {"train_loss": -9.125503540039062, "global_step": 83028, "epoch": 494} {"train_loss": -9.176712989807129, "global_step": 83029, "epoch": 494} {"train_loss": -9.360292434692383, "global_step": 83030, "epoch": 494} {"train_loss": -9.165323257446289, "global_step": 83031, "epoch": 494} {"train_loss": -9.295103073120117, "global_step": 83032, "epoch": 494} {"train_loss": -9.574639320373535, "global_step": 83033, "epoch": 494} {"train_loss": -9.011411666870117, "global_step": 83034, "epoch": 494} {"train_loss": -9.397518157958984, "global_step": 83035, "epoch": 494} {"train_loss": -9.195667266845703, "global_step": 83036, "epoch": 494} {"train_loss": -9.303960800170898, "global_step": 83037, "epoch": 494} {"train_loss": -9.167043685913086, "global_step": 83038, "epoch": 494} {"train_loss": -9.58702278137207, "global_step": 83039, "epoch": 494} {"train_loss": -8.873207092285156, "global_step": 83040, "epoch": 494} {"train_loss": -9.330819129943848, "global_step": 83041, "epoch": 494} {"train_loss": -9.20521354675293, "global_step": 83042, "epoch": 494} {"train_loss": -9.224884033203125, "global_step": 83043, "epoch": 494} {"train_loss": -9.239513397216797, "global_step": 83044, "epoch": 494} {"train_loss": -9.479461669921875, "global_step": 83045, "epoch": 494} {"train_loss": -9.222840309143066, "global_step": 83046, "epoch": 494} {"train_loss": -9.482388496398926, "global_step": 83047, "epoch": 494} {"train_loss": -9.208861351013184, "global_step": 83048, "epoch": 494} {"train_loss": -9.428921699523926, "global_step": 83049, "epoch": 494} {"train_loss": -9.160537719726562, "global_step": 83050, "epoch": 494} {"train_loss": -9.394540786743164, "global_step": 83051, "epoch": 494} {"train_loss": -8.903306007385254, "global_step": 83052, "epoch": 494} {"train_loss": -9.47587776184082, "global_step": 83053, "epoch": 494} {"train_loss": -9.200897216796875, "global_step": 83054, "epoch": 494} {"train_loss": -9.285331726074219, "global_step": 83055, "epoch": 494} {"train_loss": -9.218815803527832, "global_step": 83056, "epoch": 494} {"train_loss": -9.150224685668945, "global_step": 83057, "epoch": 494} {"train_loss": -9.150933265686035, "global_step": 83058, "epoch": 494} {"train_loss": -9.048513412475586, "global_step": 83059, "epoch": 494} {"train_loss": -9.244104385375977, "global_step": 83060, "epoch": 494} {"train_loss": -9.134071350097656, "global_step": 83061, "epoch": 494} {"train_loss": -9.111420631408691, "global_step": 83062, "epoch": 494} {"train_loss": -9.450879096984863, "global_step": 83063, "epoch": 494} {"train_loss": -9.086043357849121, "global_step": 83064, "epoch": 494} {"train_loss": -9.198469161987305, "global_step": 83065, "epoch": 494} {"train_loss": -9.219644546508789, "global_step": 83066, "epoch": 494} {"train_loss": -9.083555221557617, "global_step": 83067, "epoch": 494} {"train_loss": -9.213056564331055, "global_step": 83068, "epoch": 494} {"train_loss": -9.019993782043457, "global_step": 83069, "epoch": 494} {"train_loss": -9.325242042541504, "global_step": 83070, "epoch": 494} {"train_loss": -8.785024642944336, "global_step": 83071, "epoch": 494} {"train_loss": -9.206153869628906, "global_step": 83072, "epoch": 494} {"train_loss": -9.003697395324707, "global_step": 83073, "epoch": 494} {"train_loss": -9.033987045288086, "global_step": 83074, "epoch": 494} {"train_loss": -9.24635124206543, "global_step": 83075, "epoch": 494} {"train_loss": -9.001520156860352, "global_step": 83076, "epoch": 494} {"train_loss": -9.169530868530273, "global_step": 83077, "epoch": 494} {"train_loss": -8.759906768798828, "global_step": 83078, "epoch": 494} {"train_loss": -9.434613227844238, "global_step": 83079, "epoch": 494} {"train_loss": -9.1565580368042, "global_step": 83080, "epoch": 494} {"train_loss": -9.083085060119629, "global_step": 83081, "epoch": 494} {"train_loss": -9.239696502685547, "global_step": 83082, "epoch": 494} {"train_loss": -9.064535140991211, "global_step": 83083, "epoch": 494} {"train_loss": -9.44645881652832, "global_step": 83084, "epoch": 494} {"train_loss": -9.13621711730957, "global_step": 83085, "epoch": 494} {"train_loss": -9.180912017822266, "global_step": 83086, "epoch": 494} {"train_loss": -9.33781623840332, "global_step": 83087, "epoch": 494} {"train_loss": -9.28546142578125, "global_step": 83088, "epoch": 494} {"train_loss": -9.114983558654785, "global_step": 83089, "epoch": 494} {"train_loss": -9.187904357910156, "global_step": 83090, "epoch": 494} {"train_loss": -9.345190048217773, "global_step": 83091, "epoch": 494} {"train_loss": -9.056446075439453, "global_step": 83092, "epoch": 494} {"train_loss": -9.490438461303711, "global_step": 83093, "epoch": 494} {"train_loss": -9.149374008178711, "global_step": 83094, "epoch": 494} {"train_loss": -9.471203804016113, "global_step": 83095, "epoch": 494} {"train_loss": -9.352470397949219, "global_step": 83096, "epoch": 494} {"train_loss": -9.420204162597656, "global_step": 83097, "epoch": 494} {"train_loss": -9.315032005310059, "global_step": 83098, "epoch": 494} {"train_loss": -9.405920028686523, "global_step": 83099, "epoch": 494} {"train_loss": -9.207931518554688, "global_step": 83100, "epoch": 494} {"train_loss": -9.402729034423828, "global_step": 83101, "epoch": 494} {"train_loss": -9.149288177490234, "global_step": 83102, "epoch": 494} {"train_loss": -9.526652336120605, "global_step": 83103, "epoch": 494} {"train_loss": -9.49948501586914, "global_step": 83104, "epoch": 494} {"train_loss": -9.284324645996094, "global_step": 83105, "epoch": 494} {"train_loss": -9.524106979370117, "global_step": 83106, "epoch": 494} {"train_loss": -9.409082412719727, "global_step": 83107, "epoch": 494} {"train_loss": -9.362262725830078, "global_step": 83108, "epoch": 494} {"train_loss": -9.279987335205078, "global_step": 83109, "epoch": 494} {"train_loss": -9.44211483001709, "global_step": 83110, "epoch": 494} {"train_loss": -9.212148666381836, "global_step": 83111, "epoch": 494} {"train_loss": -9.486968994140625, "global_step": 83112, "epoch": 494} {"train_loss": -8.956911087036133, "global_step": 83113, "epoch": 494} {"train_loss": -9.511433601379395, "global_step": 83114, "epoch": 494} {"train_loss": -9.213926315307617, "global_step": 83115, "epoch": 494} {"train_loss": -9.287662506103516, "global_step": 83116, "epoch": 494} {"train_loss": -9.078319549560547, "global_step": 83117, "epoch": 494} {"train_loss": -9.347114562988281, "global_step": 83118, "epoch": 494} {"train_loss": -9.00905990600586, "global_step": 83119, "epoch": 494} {"train_loss": -9.048164367675781, "global_step": 83120, "epoch": 494} {"train_loss": -9.200608253479004, "global_step": 83121, "epoch": 494} {"train_loss": -8.873411178588867, "global_step": 83122, "epoch": 494} {"train_loss": -8.897868156433105, "global_step": 83123, "epoch": 494} {"train_loss": -9.157716751098633, "global_step": 83124, "epoch": 494} {"train_loss": -8.930932998657227, "global_step": 83125, "epoch": 494} {"train_loss": -9.3114013671875, "global_step": 83126, "epoch": 494} {"train_loss": -9.028188705444336, "global_step": 83127, "epoch": 494} {"train_loss": -9.157634735107422, "global_step": 83128, "epoch": 494} {"train_loss": -9.02988052368164, "global_step": 83129, "epoch": 494} {"train_loss": -8.993894577026367, "global_step": 83130, "epoch": 494} {"train_loss": -9.272027015686035, "global_step": 83131, "epoch": 494} {"train_loss": -9.102426528930664, "global_step": 83132, "epoch": 494} {"train_loss": -9.033966064453125, "global_step": 83133, "epoch": 494} {"train_loss": -9.319845199584961, "global_step": 83134, "epoch": 494} {"train_loss": -9.14640998840332, "global_step": 83135, "epoch": 494} {"train_loss": -9.359415054321289, "global_step": 83136, "epoch": 494} {"train_loss": -9.232172012329102, "global_step": 83137, "epoch": 494} {"train_loss": -9.15349292755127, "global_step": 83138, "epoch": 494} {"train_loss": -9.2725191116333, "global_step": 83139, "epoch": 494} {"train_loss": -9.131077766418457, "global_step": 83140, "epoch": 494} {"train_loss": -9.129000663757324, "global_step": 83141, "epoch": 494} {"train_loss": -9.317214965820312, "global_step": 83142, "epoch": 494} {"train_loss": -9.438158988952637, "global_step": 83143, "epoch": 494} {"train_loss": -9.231990814208984, "global_step": 83144, "epoch": 494} {"train_loss": -9.411994934082031, "global_step": 83145, "epoch": 494} {"train_loss": -9.475399017333984, "global_step": 83146, "epoch": 494} {"train_loss": -9.556270599365234, "global_step": 83147, "epoch": 494} {"train_loss": -9.24417495727539, "global_step": 83148, "epoch": 494} {"train_loss": -9.277151107788086, "global_step": 83149, "epoch": 494} {"train_loss": -9.360504150390625, "global_step": 83150, "epoch": 494} {"train_loss": -9.498199462890625, "global_step": 83151, "epoch": 494} {"train_loss": -9.665336608886719, "global_step": 83152, "epoch": 494} {"train_loss": -9.530718803405762, "global_step": 83153, "epoch": 494} {"train_loss": -9.495241165161133, "global_step": 83154, "epoch": 494} {"train_loss": -9.552268981933594, "global_step": 83155, "epoch": 494} {"train_loss": -9.654557228088379, "global_step": 83156, "epoch": 494} {"train_loss": -9.589841842651367, "global_step": 83157, "epoch": 494} {"train_loss": -9.370471954345703, "global_step": 83158, "epoch": 494} {"train_loss": -9.260827626500811, "global_step": 83159, "epoch": 494, "val_loss": 199769.578125} {"train_loss": -9.21731185913086, "global_step": 83160, "epoch": 495} {"train_loss": -9.517573356628418, "global_step": 83161, "epoch": 495} {"train_loss": -9.649227142333984, "global_step": 83162, "epoch": 495} {"train_loss": -9.64284896850586, "global_step": 83163, "epoch": 495} {"train_loss": -9.387919425964355, "global_step": 83164, "epoch": 495} {"train_loss": -9.469160079956055, "global_step": 83165, "epoch": 495} {"train_loss": -9.237223625183105, "global_step": 83166, "epoch": 495} {"train_loss": -9.137231826782227, "global_step": 83167, "epoch": 495} {"train_loss": -9.625253677368164, "global_step": 83168, "epoch": 495} {"train_loss": -9.432085037231445, "global_step": 83169, "epoch": 495} {"train_loss": -9.211053848266602, "global_step": 83170, "epoch": 495} {"train_loss": -9.384172439575195, "global_step": 83171, "epoch": 495} {"train_loss": -8.984066009521484, "global_step": 83172, "epoch": 495} {"train_loss": -9.154165267944336, "global_step": 83173, "epoch": 495} {"train_loss": -8.97344970703125, "global_step": 83174, "epoch": 495} {"train_loss": -9.283363342285156, "global_step": 83175, "epoch": 495} {"train_loss": -9.293008804321289, "global_step": 83176, "epoch": 495} {"train_loss": -9.0159273147583, "global_step": 83177, "epoch": 495} {"train_loss": -9.129981994628906, "global_step": 83178, "epoch": 495} {"train_loss": -9.194488525390625, "global_step": 83179, "epoch": 495} {"train_loss": -9.021533012390137, "global_step": 83180, "epoch": 495} {"train_loss": -9.326704025268555, "global_step": 83181, "epoch": 495} {"train_loss": -9.423251152038574, "global_step": 83182, "epoch": 495} {"train_loss": -9.326939582824707, "global_step": 83183, "epoch": 495} {"train_loss": -9.385428428649902, "global_step": 83184, "epoch": 495} {"train_loss": -9.156936645507812, "global_step": 83185, "epoch": 495} {"train_loss": -9.319671630859375, "global_step": 83186, "epoch": 495} {"train_loss": -9.126834869384766, "global_step": 83187, "epoch": 495} {"train_loss": -8.987165451049805, "global_step": 83188, "epoch": 495} {"train_loss": -9.003068923950195, "global_step": 83189, "epoch": 495} {"train_loss": -8.423808097839355, "global_step": 83190, "epoch": 495} {"train_loss": -9.180118560791016, "global_step": 83191, "epoch": 495} {"train_loss": -8.719329833984375, "global_step": 83192, "epoch": 495} {"train_loss": -9.02998161315918, "global_step": 83193, "epoch": 495} {"train_loss": -9.083974838256836, "global_step": 83194, "epoch": 495} {"train_loss": -9.011693954467773, "global_step": 83195, "epoch": 495} {"train_loss": -9.064214706420898, "global_step": 83196, "epoch": 495} {"train_loss": -9.159951210021973, "global_step": 83197, "epoch": 495} {"train_loss": -9.24962329864502, "global_step": 83198, "epoch": 495} {"train_loss": -8.848097801208496, "global_step": 83199, "epoch": 495} {"train_loss": -9.048118591308594, "global_step": 83200, "epoch": 495} {"train_loss": -9.187337875366211, "global_step": 83201, "epoch": 495} {"train_loss": -9.292560577392578, "global_step": 83202, "epoch": 495} {"train_loss": -9.023958206176758, "global_step": 83203, "epoch": 495} {"train_loss": -9.097127914428711, "global_step": 83204, "epoch": 495} {"train_loss": -9.19521713256836, "global_step": 83205, "epoch": 495} {"train_loss": -9.041290283203125, "global_step": 83206, "epoch": 495} {"train_loss": -9.274924278259277, "global_step": 83207, "epoch": 495} {"train_loss": -9.25164794921875, "global_step": 83208, "epoch": 495} {"train_loss": -9.232935905456543, "global_step": 83209, "epoch": 495} {"train_loss": -9.299838066101074, "global_step": 83210, "epoch": 495} {"train_loss": -9.164628028869629, "global_step": 83211, "epoch": 495} {"train_loss": -9.235711097717285, "global_step": 83212, "epoch": 495} {"train_loss": -9.263716697692871, "global_step": 83213, "epoch": 495} {"train_loss": -9.206650733947754, "global_step": 83214, "epoch": 495} {"train_loss": -9.536659240722656, "global_step": 83215, "epoch": 495} {"train_loss": -9.176179885864258, "global_step": 83216, "epoch": 495} {"train_loss": -9.384727478027344, "global_step": 83217, "epoch": 495} {"train_loss": -9.44674015045166, "global_step": 83218, "epoch": 495} {"train_loss": -9.380119323730469, "global_step": 83219, "epoch": 495} {"train_loss": -9.231383323669434, "global_step": 83220, "epoch": 495} {"train_loss": -9.24709701538086, "global_step": 83221, "epoch": 495} {"train_loss": -9.783607482910156, "global_step": 83222, "epoch": 495} {"train_loss": -9.166513442993164, "global_step": 83223, "epoch": 495} {"train_loss": -9.391672134399414, "global_step": 83224, "epoch": 495} {"train_loss": -9.509408950805664, "global_step": 83225, "epoch": 495} {"train_loss": -9.360984802246094, "global_step": 83226, "epoch": 495} {"train_loss": -9.510902404785156, "global_step": 83227, "epoch": 495} {"train_loss": -9.510798454284668, "global_step": 83228, "epoch": 495} {"train_loss": -9.645320892333984, "global_step": 83229, "epoch": 495} {"train_loss": -9.559488296508789, "global_step": 83230, "epoch": 495} {"train_loss": -9.379518508911133, "global_step": 83231, "epoch": 495} {"train_loss": -8.557779312133789, "global_step": 83232, "epoch": 495} {"train_loss": -8.992513656616211, "global_step": 83233, "epoch": 495} {"train_loss": -9.442102432250977, "global_step": 83234, "epoch": 495} {"train_loss": -9.000375747680664, "global_step": 83235, "epoch": 495} {"train_loss": -9.299400329589844, "global_step": 83236, "epoch": 495} {"train_loss": -9.115617752075195, "global_step": 83237, "epoch": 495} {"train_loss": -9.166654586791992, "global_step": 83238, "epoch": 495} {"train_loss": -9.094200134277344, "global_step": 83239, "epoch": 495} {"train_loss": -9.01939582824707, "global_step": 83240, "epoch": 495} {"train_loss": -8.762188911437988, "global_step": 83241, "epoch": 495} {"train_loss": -8.996752738952637, "global_step": 83242, "epoch": 495} {"train_loss": -8.897682189941406, "global_step": 83243, "epoch": 495} {"train_loss": -8.801722526550293, "global_step": 83244, "epoch": 495} {"train_loss": -8.72935676574707, "global_step": 83245, "epoch": 495} {"train_loss": -8.595890045166016, "global_step": 83246, "epoch": 495} {"train_loss": -8.682246208190918, "global_step": 83247, "epoch": 495} {"train_loss": -8.827902793884277, "global_step": 83248, "epoch": 495} {"train_loss": -8.822572708129883, "global_step": 83249, "epoch": 495} {"train_loss": -8.335491180419922, "global_step": 83250, "epoch": 495} {"train_loss": -8.952485084533691, "global_step": 83251, "epoch": 495} {"train_loss": -9.092859268188477, "global_step": 83252, "epoch": 495} {"train_loss": -8.864767074584961, "global_step": 83253, "epoch": 495} {"train_loss": -8.814160346984863, "global_step": 83254, "epoch": 495} {"train_loss": -9.059667587280273, "global_step": 83255, "epoch": 495} {"train_loss": -9.03235912322998, "global_step": 83256, "epoch": 495} {"train_loss": -8.76664924621582, "global_step": 83257, "epoch": 495} {"train_loss": -9.061866760253906, "global_step": 83258, "epoch": 495} {"train_loss": -8.981012344360352, "global_step": 83259, "epoch": 495} {"train_loss": -9.199699401855469, "global_step": 83260, "epoch": 495} {"train_loss": -9.180183410644531, "global_step": 83261, "epoch": 495} {"train_loss": -9.083365440368652, "global_step": 83262, "epoch": 495} {"train_loss": -8.96937084197998, "global_step": 83263, "epoch": 495} {"train_loss": -9.279571533203125, "global_step": 83264, "epoch": 495} {"train_loss": -9.290096282958984, "global_step": 83265, "epoch": 495} {"train_loss": -9.102367401123047, "global_step": 83266, "epoch": 495} {"train_loss": -8.782013893127441, "global_step": 83267, "epoch": 495} {"train_loss": -9.130840301513672, "global_step": 83268, "epoch": 495} {"train_loss": -9.188446044921875, "global_step": 83269, "epoch": 495} {"train_loss": -9.004322052001953, "global_step": 83270, "epoch": 495} {"train_loss": -9.134727478027344, "global_step": 83271, "epoch": 495} {"train_loss": -9.511738777160645, "global_step": 83272, "epoch": 495} {"train_loss": -9.078380584716797, "global_step": 83273, "epoch": 495} {"train_loss": -9.312225341796875, "global_step": 83274, "epoch": 495} {"train_loss": -9.256673812866211, "global_step": 83275, "epoch": 495} {"train_loss": -9.102725982666016, "global_step": 83276, "epoch": 495} {"train_loss": -9.372136116027832, "global_step": 83277, "epoch": 495} {"train_loss": -9.57436752319336, "global_step": 83278, "epoch": 495} {"train_loss": -9.417827606201172, "global_step": 83279, "epoch": 495} {"train_loss": -9.563749313354492, "global_step": 83280, "epoch": 495} {"train_loss": -9.56320571899414, "global_step": 83281, "epoch": 495} {"train_loss": -9.440017700195312, "global_step": 83282, "epoch": 495} {"train_loss": -9.478293418884277, "global_step": 83283, "epoch": 495} {"train_loss": -9.530808448791504, "global_step": 83284, "epoch": 495} {"train_loss": -9.435583114624023, "global_step": 83285, "epoch": 495} {"train_loss": -9.496432304382324, "global_step": 83286, "epoch": 495} {"train_loss": -9.315155029296875, "global_step": 83287, "epoch": 495} {"train_loss": -9.532737731933594, "global_step": 83288, "epoch": 495} {"train_loss": -9.21387004852295, "global_step": 83289, "epoch": 495} {"train_loss": -9.378934860229492, "global_step": 83290, "epoch": 495} {"train_loss": -9.383493423461914, "global_step": 83291, "epoch": 495} {"train_loss": -9.283282279968262, "global_step": 83292, "epoch": 495} {"train_loss": -9.229947090148926, "global_step": 83293, "epoch": 495} {"train_loss": -9.072786331176758, "global_step": 83294, "epoch": 495} {"train_loss": -9.262199401855469, "global_step": 83295, "epoch": 495} {"train_loss": -9.33919906616211, "global_step": 83296, "epoch": 495} {"train_loss": -9.074259757995605, "global_step": 83297, "epoch": 495} {"train_loss": -9.229008674621582, "global_step": 83298, "epoch": 495} {"train_loss": -9.201889038085938, "global_step": 83299, "epoch": 495} {"train_loss": -9.347206115722656, "global_step": 83300, "epoch": 495} {"train_loss": -9.212711334228516, "global_step": 83301, "epoch": 495} {"train_loss": -9.401931762695312, "global_step": 83302, "epoch": 495} {"train_loss": -9.319780349731445, "global_step": 83303, "epoch": 495} {"train_loss": -8.973989486694336, "global_step": 83304, "epoch": 495} {"train_loss": -9.386098861694336, "global_step": 83305, "epoch": 495} {"train_loss": -8.953235626220703, "global_step": 83306, "epoch": 495} {"train_loss": -9.284872055053711, "global_step": 83307, "epoch": 495} {"train_loss": -9.007698059082031, "global_step": 83308, "epoch": 495} {"train_loss": -8.93425178527832, "global_step": 83309, "epoch": 495} {"train_loss": -8.965982437133789, "global_step": 83310, "epoch": 495} {"train_loss": -9.068450927734375, "global_step": 83311, "epoch": 495} {"train_loss": -8.881546974182129, "global_step": 83312, "epoch": 495} {"train_loss": -9.098959922790527, "global_step": 83313, "epoch": 495} {"train_loss": -9.346511840820312, "global_step": 83314, "epoch": 495} {"train_loss": -8.795811653137207, "global_step": 83315, "epoch": 495} {"train_loss": -8.819022178649902, "global_step": 83316, "epoch": 495} {"train_loss": -9.088308334350586, "global_step": 83317, "epoch": 495} {"train_loss": -8.970512390136719, "global_step": 83318, "epoch": 495} {"train_loss": -8.88412094116211, "global_step": 83319, "epoch": 495} {"train_loss": -9.302789688110352, "global_step": 83320, "epoch": 495} {"train_loss": -9.040483474731445, "global_step": 83321, "epoch": 495} {"train_loss": -9.116272926330566, "global_step": 83322, "epoch": 495} {"train_loss": -8.96053695678711, "global_step": 83323, "epoch": 495} {"train_loss": -9.138465881347656, "global_step": 83324, "epoch": 495} {"train_loss": -9.138650894165039, "global_step": 83325, "epoch": 495} {"train_loss": -8.911661148071289, "global_step": 83326, "epoch": 495} {"train_loss": -9.17327424458095, "global_step": 83327, "epoch": 495, "val_loss": 199280.828125, "train_action_mse_error": 4.933509826660156} {"train_loss": -8.934906005859375, "global_step": 83328, "epoch": 496} {"train_loss": -9.057092666625977, "global_step": 83329, "epoch": 496} {"train_loss": -9.195115089416504, "global_step": 83330, "epoch": 496} {"train_loss": -9.127073287963867, "global_step": 83331, "epoch": 496} {"train_loss": -9.10990047454834, "global_step": 83332, "epoch": 496} {"train_loss": -9.082356452941895, "global_step": 83333, "epoch": 496} {"train_loss": -9.268903732299805, "global_step": 83334, "epoch": 496} {"train_loss": -9.258896827697754, "global_step": 83335, "epoch": 496} {"train_loss": -9.232999801635742, "global_step": 83336, "epoch": 496} {"train_loss": -9.381599426269531, "global_step": 83337, "epoch": 496} {"train_loss": -9.439861297607422, "global_step": 83338, "epoch": 496} {"train_loss": -9.411337852478027, "global_step": 83339, "epoch": 496} {"train_loss": -9.336709022521973, "global_step": 83340, "epoch": 496} {"train_loss": -9.346200942993164, "global_step": 83341, "epoch": 496} {"train_loss": -9.501148223876953, "global_step": 83342, "epoch": 496} {"train_loss": -9.400474548339844, "global_step": 83343, "epoch": 496} {"train_loss": -9.279075622558594, "global_step": 83344, "epoch": 496} {"train_loss": -9.266753196716309, "global_step": 83345, "epoch": 496} {"train_loss": -9.344717025756836, "global_step": 83346, "epoch": 496} {"train_loss": -9.560094833374023, "global_step": 83347, "epoch": 496} {"train_loss": -9.467883110046387, "global_step": 83348, "epoch": 496} {"train_loss": -9.33893871307373, "global_step": 83349, "epoch": 496} {"train_loss": -9.449617385864258, "global_step": 83350, "epoch": 496} {"train_loss": -9.140993118286133, "global_step": 83351, "epoch": 496} {"train_loss": -9.26148796081543, "global_step": 83352, "epoch": 496} {"train_loss": -9.234659194946289, "global_step": 83353, "epoch": 496} {"train_loss": -9.007270812988281, "global_step": 83354, "epoch": 496} {"train_loss": -9.319653511047363, "global_step": 83355, "epoch": 496} {"train_loss": -9.202362060546875, "global_step": 83356, "epoch": 496} {"train_loss": -9.041229248046875, "global_step": 83357, "epoch": 496} {"train_loss": -9.223033905029297, "global_step": 83358, "epoch": 496} {"train_loss": -9.24030876159668, "global_step": 83359, "epoch": 496} {"train_loss": -9.060531616210938, "global_step": 83360, "epoch": 496} {"train_loss": -9.273277282714844, "global_step": 83361, "epoch": 496} {"train_loss": -9.040727615356445, "global_step": 83362, "epoch": 496} {"train_loss": -9.22796630859375, "global_step": 83363, "epoch": 496} {"train_loss": -8.989479064941406, "global_step": 83364, "epoch": 496} {"train_loss": -9.04344367980957, "global_step": 83365, "epoch": 496} {"train_loss": -8.935506820678711, "global_step": 83366, "epoch": 496} {"train_loss": -8.981918334960938, "global_step": 83367, "epoch": 496} {"train_loss": -9.0604829788208, "global_step": 83368, "epoch": 496} {"train_loss": -9.205732345581055, "global_step": 83369, "epoch": 496} {"train_loss": -9.0509033203125, "global_step": 83370, "epoch": 496} {"train_loss": -9.073784828186035, "global_step": 83371, "epoch": 496} {"train_loss": -9.067419052124023, "global_step": 83372, "epoch": 496} {"train_loss": -9.079106330871582, "global_step": 83373, "epoch": 496} {"train_loss": -9.251708030700684, "global_step": 83374, "epoch": 496} {"train_loss": -8.845738410949707, "global_step": 83375, "epoch": 496} {"train_loss": -9.211524963378906, "global_step": 83376, "epoch": 496} {"train_loss": -9.226780891418457, "global_step": 83377, "epoch": 496} {"train_loss": -9.124963760375977, "global_step": 83378, "epoch": 496} {"train_loss": -9.12257194519043, "global_step": 83379, "epoch": 496} {"train_loss": -9.174100875854492, "global_step": 83380, "epoch": 496} {"train_loss": -9.30154800415039, "global_step": 83381, "epoch": 496} {"train_loss": -8.968658447265625, "global_step": 83382, "epoch": 496} {"train_loss": -9.279539108276367, "global_step": 83383, "epoch": 496} {"train_loss": -9.414351463317871, "global_step": 83384, "epoch": 496} {"train_loss": -9.08935546875, "global_step": 83385, "epoch": 496} {"train_loss": -9.255304336547852, "global_step": 83386, "epoch": 496} {"train_loss": -9.3251953125, "global_step": 83387, "epoch": 496} {"train_loss": -9.349502563476562, "global_step": 83388, "epoch": 496} {"train_loss": -9.274039268493652, "global_step": 83389, "epoch": 496} {"train_loss": -9.319877624511719, "global_step": 83390, "epoch": 496} {"train_loss": -9.294190406799316, "global_step": 83391, "epoch": 496} {"train_loss": -9.259246826171875, "global_step": 83392, "epoch": 496} {"train_loss": -9.323240280151367, "global_step": 83393, "epoch": 496} {"train_loss": -9.24244499206543, "global_step": 83394, "epoch": 496} {"train_loss": -9.019121170043945, "global_step": 83395, "epoch": 496} {"train_loss": -9.354440689086914, "global_step": 83396, "epoch": 496} {"train_loss": -9.131457328796387, "global_step": 83397, "epoch": 496} {"train_loss": -9.27241325378418, "global_step": 83398, "epoch": 496} {"train_loss": -9.249265670776367, "global_step": 83399, "epoch": 496} {"train_loss": -9.19261360168457, "global_step": 83400, "epoch": 496} {"train_loss": -9.354644775390625, "global_step": 83401, "epoch": 496} {"train_loss": -9.214618682861328, "global_step": 83402, "epoch": 496} {"train_loss": -9.337260246276855, "global_step": 83403, "epoch": 496} {"train_loss": -9.057575225830078, "global_step": 83404, "epoch": 496} {"train_loss": -9.372905731201172, "global_step": 83405, "epoch": 496} {"train_loss": -9.076196670532227, "global_step": 83406, "epoch": 496} {"train_loss": -9.236078262329102, "global_step": 83407, "epoch": 496} {"train_loss": -9.123101234436035, "global_step": 83408, "epoch": 496} {"train_loss": -9.333234786987305, "global_step": 83409, "epoch": 496} {"train_loss": -9.084888458251953, "global_step": 83410, "epoch": 496} {"train_loss": -8.932060241699219, "global_step": 83411, "epoch": 496} {"train_loss": -9.347126007080078, "global_step": 83412, "epoch": 496} {"train_loss": -8.971685409545898, "global_step": 83413, "epoch": 496} {"train_loss": -9.09278678894043, "global_step": 83414, "epoch": 496} {"train_loss": -9.105308532714844, "global_step": 83415, "epoch": 496} {"train_loss": -9.267824172973633, "global_step": 83416, "epoch": 496} {"train_loss": -9.091557502746582, "global_step": 83417, "epoch": 496} {"train_loss": -9.52570915222168, "global_step": 83418, "epoch": 496} {"train_loss": -9.385819435119629, "global_step": 83419, "epoch": 496} {"train_loss": -9.403512954711914, "global_step": 83420, "epoch": 496} {"train_loss": -9.423135757446289, "global_step": 83421, "epoch": 496} {"train_loss": -9.254024505615234, "global_step": 83422, "epoch": 496} {"train_loss": -9.266122817993164, "global_step": 83423, "epoch": 496} {"train_loss": -9.184377670288086, "global_step": 83424, "epoch": 496} {"train_loss": -9.365718841552734, "global_step": 83425, "epoch": 496} {"train_loss": -9.182519912719727, "global_step": 83426, "epoch": 496} {"train_loss": -9.138025283813477, "global_step": 83427, "epoch": 496} {"train_loss": -9.520210266113281, "global_step": 83428, "epoch": 496} {"train_loss": -9.476555824279785, "global_step": 83429, "epoch": 496} {"train_loss": -9.385015487670898, "global_step": 83430, "epoch": 496} {"train_loss": -9.027634620666504, "global_step": 83431, "epoch": 496} {"train_loss": -9.246910095214844, "global_step": 83432, "epoch": 496} {"train_loss": -9.521212577819824, "global_step": 83433, "epoch": 496} {"train_loss": -9.093058586120605, "global_step": 83434, "epoch": 496} {"train_loss": -9.282133102416992, "global_step": 83435, "epoch": 496} {"train_loss": -9.243758201599121, "global_step": 83436, "epoch": 496} {"train_loss": -9.387855529785156, "global_step": 83437, "epoch": 496} {"train_loss": -9.478618621826172, "global_step": 83438, "epoch": 496} {"train_loss": -9.289003372192383, "global_step": 83439, "epoch": 496} {"train_loss": -9.372448921203613, "global_step": 83440, "epoch": 496} {"train_loss": -9.454379081726074, "global_step": 83441, "epoch": 496} {"train_loss": -9.288261413574219, "global_step": 83442, "epoch": 496} {"train_loss": -9.405012130737305, "global_step": 83443, "epoch": 496} {"train_loss": -9.240100860595703, "global_step": 83444, "epoch": 496} {"train_loss": -9.464019775390625, "global_step": 83445, "epoch": 496} {"train_loss": -9.206071853637695, "global_step": 83446, "epoch": 496} {"train_loss": -9.444429397583008, "global_step": 83447, "epoch": 496} {"train_loss": -9.2584867477417, "global_step": 83448, "epoch": 496} {"train_loss": -9.080095291137695, "global_step": 83449, "epoch": 496} {"train_loss": -9.355409622192383, "global_step": 83450, "epoch": 496} {"train_loss": -9.122303009033203, "global_step": 83451, "epoch": 496} {"train_loss": -9.555891036987305, "global_step": 83452, "epoch": 496} {"train_loss": -9.588200569152832, "global_step": 83453, "epoch": 496} {"train_loss": -9.304981231689453, "global_step": 83454, "epoch": 496} {"train_loss": -9.424079895019531, "global_step": 83455, "epoch": 496} {"train_loss": -9.304667472839355, "global_step": 83456, "epoch": 496} {"train_loss": -9.440495491027832, "global_step": 83457, "epoch": 496} {"train_loss": -9.537847518920898, "global_step": 83458, "epoch": 496} {"train_loss": -9.420223236083984, "global_step": 83459, "epoch": 496} {"train_loss": -9.464740753173828, "global_step": 83460, "epoch": 496} {"train_loss": -9.545907974243164, "global_step": 83461, "epoch": 496} {"train_loss": -9.448862075805664, "global_step": 83462, "epoch": 496} {"train_loss": -9.338842391967773, "global_step": 83463, "epoch": 496} {"train_loss": -9.619441986083984, "global_step": 83464, "epoch": 496} {"train_loss": -9.310529708862305, "global_step": 83465, "epoch": 496} {"train_loss": -9.23393726348877, "global_step": 83466, "epoch": 496} {"train_loss": -9.507902145385742, "global_step": 83467, "epoch": 496} {"train_loss": -9.24116325378418, "global_step": 83468, "epoch": 496} {"train_loss": -9.316512107849121, "global_step": 83469, "epoch": 496} {"train_loss": -9.490568161010742, "global_step": 83470, "epoch": 496} {"train_loss": -9.522408485412598, "global_step": 83471, "epoch": 496} {"train_loss": -9.650044441223145, "global_step": 83472, "epoch": 496} {"train_loss": -9.628480911254883, "global_step": 83473, "epoch": 496} {"train_loss": -9.348718643188477, "global_step": 83474, "epoch": 496} {"train_loss": -9.263595581054688, "global_step": 83475, "epoch": 496} {"train_loss": -9.206714630126953, "global_step": 83476, "epoch": 496} {"train_loss": -9.310079574584961, "global_step": 83477, "epoch": 496} {"train_loss": -9.259075164794922, "global_step": 83478, "epoch": 496} {"train_loss": -9.274565696716309, "global_step": 83479, "epoch": 496} {"train_loss": -9.49450397491455, "global_step": 83480, "epoch": 496} {"train_loss": -9.549177169799805, "global_step": 83481, "epoch": 496} {"train_loss": -8.970212936401367, "global_step": 83482, "epoch": 496} {"train_loss": -9.12489128112793, "global_step": 83483, "epoch": 496} {"train_loss": -8.828435897827148, "global_step": 83484, "epoch": 496} {"train_loss": -8.937597274780273, "global_step": 83485, "epoch": 496} {"train_loss": -8.53250503540039, "global_step": 83486, "epoch": 496} {"train_loss": -8.879308700561523, "global_step": 83487, "epoch": 496} {"train_loss": -8.471704483032227, "global_step": 83488, "epoch": 496} {"train_loss": -8.874961853027344, "global_step": 83489, "epoch": 496} {"train_loss": -8.949970245361328, "global_step": 83490, "epoch": 496} {"train_loss": -8.67187786102295, "global_step": 83491, "epoch": 496} {"train_loss": -8.78579330444336, "global_step": 83492, "epoch": 496} {"train_loss": -9.000589370727539, "global_step": 83493, "epoch": 496} {"train_loss": -8.802276611328125, "global_step": 83494, "epoch": 496} {"train_loss": -9.235734564917427, "global_step": 83495, "epoch": 496, "val_loss": 199313.25} {"train_loss": -8.787812232971191, "global_step": 83496, "epoch": 497} {"train_loss": -9.027868270874023, "global_step": 83497, "epoch": 497} {"train_loss": -8.947319030761719, "global_step": 83498, "epoch": 497} {"train_loss": -9.00997543334961, "global_step": 83499, "epoch": 497} {"train_loss": -9.07604694366455, "global_step": 83500, "epoch": 497} {"train_loss": -9.16224479675293, "global_step": 83501, "epoch": 497} {"train_loss": -9.101982116699219, "global_step": 83502, "epoch": 497} {"train_loss": -8.959705352783203, "global_step": 83503, "epoch": 497} {"train_loss": -9.31592082977295, "global_step": 83504, "epoch": 497} {"train_loss": -9.247772216796875, "global_step": 83505, "epoch": 497} {"train_loss": -9.301905632019043, "global_step": 83506, "epoch": 497} {"train_loss": -9.216438293457031, "global_step": 83507, "epoch": 497} {"train_loss": -9.030366897583008, "global_step": 83508, "epoch": 497} {"train_loss": -9.402839660644531, "global_step": 83509, "epoch": 497} {"train_loss": -9.34461784362793, "global_step": 83510, "epoch": 497} {"train_loss": -9.343531608581543, "global_step": 83511, "epoch": 497} {"train_loss": -9.127826690673828, "global_step": 83512, "epoch": 497} {"train_loss": -9.334272384643555, "global_step": 83513, "epoch": 497} {"train_loss": -9.502945899963379, "global_step": 83514, "epoch": 497} {"train_loss": -9.401135444641113, "global_step": 83515, "epoch": 497} {"train_loss": -9.238509178161621, "global_step": 83516, "epoch": 497} {"train_loss": -9.39921760559082, "global_step": 83517, "epoch": 497} {"train_loss": -9.219803810119629, "global_step": 83518, "epoch": 497} {"train_loss": -9.334867477416992, "global_step": 83519, "epoch": 497} {"train_loss": -9.120931625366211, "global_step": 83520, "epoch": 497} {"train_loss": -9.414567947387695, "global_step": 83521, "epoch": 497} {"train_loss": -9.412242889404297, "global_step": 83522, "epoch": 497} {"train_loss": -9.522451400756836, "global_step": 83523, "epoch": 497} {"train_loss": -9.219781875610352, "global_step": 83524, "epoch": 497} {"train_loss": -9.487651824951172, "global_step": 83525, "epoch": 497} {"train_loss": -9.196053504943848, "global_step": 83526, "epoch": 497} {"train_loss": -9.305032730102539, "global_step": 83527, "epoch": 497} {"train_loss": -9.281821250915527, "global_step": 83528, "epoch": 497} {"train_loss": -9.100259780883789, "global_step": 83529, "epoch": 497} {"train_loss": -9.48481273651123, "global_step": 83530, "epoch": 497} {"train_loss": -9.02871036529541, "global_step": 83531, "epoch": 497} {"train_loss": -8.962176322937012, "global_step": 83532, "epoch": 497} {"train_loss": -8.870278358459473, "global_step": 83533, "epoch": 497} {"train_loss": -9.15835189819336, "global_step": 83534, "epoch": 497} {"train_loss": -8.921281814575195, "global_step": 83535, "epoch": 497} {"train_loss": -8.765481948852539, "global_step": 83536, "epoch": 497} {"train_loss": -8.887439727783203, "global_step": 83537, "epoch": 497} {"train_loss": -8.943979263305664, "global_step": 83538, "epoch": 497} {"train_loss": -9.04709243774414, "global_step": 83539, "epoch": 497} {"train_loss": -9.179746627807617, "global_step": 83540, "epoch": 497} {"train_loss": -8.880078315734863, "global_step": 83541, "epoch": 497} {"train_loss": -9.4331693649292, "global_step": 83542, "epoch": 497} {"train_loss": -9.176464080810547, "global_step": 83543, "epoch": 497} {"train_loss": -8.955949783325195, "global_step": 83544, "epoch": 497} {"train_loss": -9.025970458984375, "global_step": 83545, "epoch": 497} {"train_loss": -9.106544494628906, "global_step": 83546, "epoch": 497} {"train_loss": -9.260429382324219, "global_step": 83547, "epoch": 497} {"train_loss": -8.893985748291016, "global_step": 83548, "epoch": 497} {"train_loss": -8.967476844787598, "global_step": 83549, "epoch": 497} {"train_loss": -9.20979118347168, "global_step": 83550, "epoch": 497} {"train_loss": -9.206912994384766, "global_step": 83551, "epoch": 497} {"train_loss": -9.17831039428711, "global_step": 83552, "epoch": 497} {"train_loss": -8.917865753173828, "global_step": 83553, "epoch": 497} {"train_loss": -9.045425415039062, "global_step": 83554, "epoch": 497} {"train_loss": -9.364496231079102, "global_step": 83555, "epoch": 497} {"train_loss": -9.158376693725586, "global_step": 83556, "epoch": 497} {"train_loss": -9.376181602478027, "global_step": 83557, "epoch": 497} {"train_loss": -9.439240455627441, "global_step": 83558, "epoch": 497} {"train_loss": -9.01965618133545, "global_step": 83559, "epoch": 497} {"train_loss": -9.317119598388672, "global_step": 83560, "epoch": 497} {"train_loss": -9.171977996826172, "global_step": 83561, "epoch": 497} {"train_loss": -9.390722274780273, "global_step": 83562, "epoch": 497} {"train_loss": -9.12486743927002, "global_step": 83563, "epoch": 497} {"train_loss": -9.196767807006836, "global_step": 83564, "epoch": 497} {"train_loss": -9.100176811218262, "global_step": 83565, "epoch": 497} {"train_loss": -9.399359703063965, "global_step": 83566, "epoch": 497} {"train_loss": -9.268033027648926, "global_step": 83567, "epoch": 497} {"train_loss": -9.319262504577637, "global_step": 83568, "epoch": 497} {"train_loss": -9.44148063659668, "global_step": 83569, "epoch": 497} {"train_loss": -9.065474510192871, "global_step": 83570, "epoch": 497} {"train_loss": -9.270868301391602, "global_step": 83571, "epoch": 497} {"train_loss": -9.015369415283203, "global_step": 83572, "epoch": 497} {"train_loss": -9.356524467468262, "global_step": 83573, "epoch": 497} {"train_loss": -9.324612617492676, "global_step": 83574, "epoch": 497} {"train_loss": -9.380719184875488, "global_step": 83575, "epoch": 497} {"train_loss": -9.402959823608398, "global_step": 83576, "epoch": 497} {"train_loss": -9.276176452636719, "global_step": 83577, "epoch": 497} {"train_loss": -9.315813064575195, "global_step": 83578, "epoch": 497} {"train_loss": -9.29281234741211, "global_step": 83579, "epoch": 497} {"train_loss": -9.284820556640625, "global_step": 83580, "epoch": 497} {"train_loss": -9.540586471557617, "global_step": 83581, "epoch": 497} {"train_loss": -9.155447006225586, "global_step": 83582, "epoch": 497} {"train_loss": -9.533651351928711, "global_step": 83583, "epoch": 497} {"train_loss": -9.137083053588867, "global_step": 83584, "epoch": 497} {"train_loss": -9.357678413391113, "global_step": 83585, "epoch": 497} {"train_loss": -9.587591171264648, "global_step": 83586, "epoch": 497} {"train_loss": -9.262550354003906, "global_step": 83587, "epoch": 497} {"train_loss": -9.442566871643066, "global_step": 83588, "epoch": 497} {"train_loss": -9.42867374420166, "global_step": 83589, "epoch": 497} {"train_loss": -9.172517776489258, "global_step": 83590, "epoch": 497} {"train_loss": -9.305709838867188, "global_step": 83591, "epoch": 497} {"train_loss": -9.501251220703125, "global_step": 83592, "epoch": 497} {"train_loss": -9.338506698608398, "global_step": 83593, "epoch": 497} {"train_loss": -9.332253456115723, "global_step": 83594, "epoch": 497} {"train_loss": -9.232869148254395, "global_step": 83595, "epoch": 497} {"train_loss": -9.219076156616211, "global_step": 83596, "epoch": 497} {"train_loss": -9.414958953857422, "global_step": 83597, "epoch": 497} {"train_loss": -9.40665054321289, "global_step": 83598, "epoch": 497} {"train_loss": -9.526956558227539, "global_step": 83599, "epoch": 497} {"train_loss": -9.298994064331055, "global_step": 83600, "epoch": 497} {"train_loss": -9.340852737426758, "global_step": 83601, "epoch": 497} {"train_loss": -9.241331100463867, "global_step": 83602, "epoch": 497} {"train_loss": -8.896154403686523, "global_step": 83603, "epoch": 497} {"train_loss": -9.130924224853516, "global_step": 83604, "epoch": 497} {"train_loss": -8.833471298217773, "global_step": 83605, "epoch": 497} {"train_loss": -8.601034164428711, "global_step": 83606, "epoch": 497} {"train_loss": -8.943645477294922, "global_step": 83607, "epoch": 497} {"train_loss": -8.528457641601562, "global_step": 83608, "epoch": 497} {"train_loss": -8.529216766357422, "global_step": 83609, "epoch": 497} {"train_loss": -8.721864700317383, "global_step": 83610, "epoch": 497} {"train_loss": -8.8463134765625, "global_step": 83611, "epoch": 497} {"train_loss": -8.727494239807129, "global_step": 83612, "epoch": 497} {"train_loss": -8.987998962402344, "global_step": 83613, "epoch": 497} {"train_loss": -8.955940246582031, "global_step": 83614, "epoch": 497} {"train_loss": -8.881319046020508, "global_step": 83615, "epoch": 497} {"train_loss": -9.02918815612793, "global_step": 83616, "epoch": 497} {"train_loss": -8.797914505004883, "global_step": 83617, "epoch": 497} {"train_loss": -8.909065246582031, "global_step": 83618, "epoch": 497} {"train_loss": -8.996004104614258, "global_step": 83619, "epoch": 497} {"train_loss": -9.012571334838867, "global_step": 83620, "epoch": 497} {"train_loss": -9.365373611450195, "global_step": 83621, "epoch": 497} {"train_loss": -9.099504470825195, "global_step": 83622, "epoch": 497} {"train_loss": -9.235260963439941, "global_step": 83623, "epoch": 497} {"train_loss": -9.337342262268066, "global_step": 83624, "epoch": 497} {"train_loss": -9.119340896606445, "global_step": 83625, "epoch": 497} {"train_loss": -9.467119216918945, "global_step": 83626, "epoch": 497} {"train_loss": -9.208293914794922, "global_step": 83627, "epoch": 497} {"train_loss": -9.416228294372559, "global_step": 83628, "epoch": 497} {"train_loss": -9.205069541931152, "global_step": 83629, "epoch": 497} {"train_loss": -9.31926155090332, "global_step": 83630, "epoch": 497} {"train_loss": -9.322391510009766, "global_step": 83631, "epoch": 497} {"train_loss": -9.352767944335938, "global_step": 83632, "epoch": 497} {"train_loss": -9.482015609741211, "global_step": 83633, "epoch": 497} {"train_loss": -9.429311752319336, "global_step": 83634, "epoch": 497} {"train_loss": -9.565093994140625, "global_step": 83635, "epoch": 497} {"train_loss": -9.408458709716797, "global_step": 83636, "epoch": 497} {"train_loss": -9.454578399658203, "global_step": 83637, "epoch": 497} {"train_loss": -9.341538429260254, "global_step": 83638, "epoch": 497} {"train_loss": -9.60411262512207, "global_step": 83639, "epoch": 497} {"train_loss": -9.532991409301758, "global_step": 83640, "epoch": 497} {"train_loss": -9.269233703613281, "global_step": 83641, "epoch": 497} {"train_loss": -9.045003890991211, "global_step": 83642, "epoch": 497} {"train_loss": -9.321802139282227, "global_step": 83643, "epoch": 497} {"train_loss": -9.288032531738281, "global_step": 83644, "epoch": 497} {"train_loss": -9.315961837768555, "global_step": 83645, "epoch": 497} {"train_loss": -9.318984985351562, "global_step": 83646, "epoch": 497} {"train_loss": -9.644285202026367, "global_step": 83647, "epoch": 497} {"train_loss": -9.30717658996582, "global_step": 83648, "epoch": 497} {"train_loss": -9.41048812866211, "global_step": 83649, "epoch": 497} {"train_loss": -9.271735191345215, "global_step": 83650, "epoch": 497} {"train_loss": -9.49179458618164, "global_step": 83651, "epoch": 497} {"train_loss": -9.3109712600708, "global_step": 83652, "epoch": 497} {"train_loss": -9.405633926391602, "global_step": 83653, "epoch": 497} {"train_loss": -9.397563934326172, "global_step": 83654, "epoch": 497} {"train_loss": -9.054868698120117, "global_step": 83655, "epoch": 497} {"train_loss": -9.37948989868164, "global_step": 83656, "epoch": 497} {"train_loss": -9.260812759399414, "global_step": 83657, "epoch": 497} {"train_loss": -9.504866600036621, "global_step": 83658, "epoch": 497} {"train_loss": -9.06291389465332, "global_step": 83659, "epoch": 497} {"train_loss": -9.136507034301758, "global_step": 83660, "epoch": 497} {"train_loss": -9.013622283935547, "global_step": 83661, "epoch": 497} {"train_loss": -8.543649673461914, "global_step": 83662, "epoch": 497} {"train_loss": -9.206061964943295, "global_step": 83663, "epoch": 497, "val_loss": 201052.78125} {"train_loss": -9.126091003417969, "global_step": 83664, "epoch": 498} {"train_loss": -8.711057662963867, "global_step": 83665, "epoch": 498} {"train_loss": -8.879684448242188, "global_step": 83666, "epoch": 498} {"train_loss": -9.272506713867188, "global_step": 83667, "epoch": 498} {"train_loss": -8.759357452392578, "global_step": 83668, "epoch": 498} {"train_loss": -8.93108081817627, "global_step": 83669, "epoch": 498} {"train_loss": -9.239189147949219, "global_step": 83670, "epoch": 498} {"train_loss": -9.02505111694336, "global_step": 83671, "epoch": 498} {"train_loss": -8.90800666809082, "global_step": 83672, "epoch": 498} {"train_loss": -8.866903305053711, "global_step": 83673, "epoch": 498} {"train_loss": -9.019654273986816, "global_step": 83674, "epoch": 498} {"train_loss": -8.867762565612793, "global_step": 83675, "epoch": 498} {"train_loss": -8.850433349609375, "global_step": 83676, "epoch": 498} {"train_loss": -8.868646621704102, "global_step": 83677, "epoch": 498} {"train_loss": -9.043243408203125, "global_step": 83678, "epoch": 498} {"train_loss": -9.092668533325195, "global_step": 83679, "epoch": 498} {"train_loss": -9.310937881469727, "global_step": 83680, "epoch": 498} {"train_loss": -9.100675582885742, "global_step": 83681, "epoch": 498} {"train_loss": -9.246395111083984, "global_step": 83682, "epoch": 498} {"train_loss": -9.34439468383789, "global_step": 83683, "epoch": 498} {"train_loss": -9.411088943481445, "global_step": 83684, "epoch": 498} {"train_loss": -9.384749412536621, "global_step": 83685, "epoch": 498} {"train_loss": -9.479673385620117, "global_step": 83686, "epoch": 498} {"train_loss": -9.344358444213867, "global_step": 83687, "epoch": 498} {"train_loss": -9.313297271728516, "global_step": 83688, "epoch": 498} {"train_loss": -9.396677017211914, "global_step": 83689, "epoch": 498} {"train_loss": -9.272113800048828, "global_step": 83690, "epoch": 498} {"train_loss": -9.334102630615234, "global_step": 83691, "epoch": 498} {"train_loss": -9.543020248413086, "global_step": 83692, "epoch": 498} {"train_loss": -9.398192405700684, "global_step": 83693, "epoch": 498} {"train_loss": -9.473648071289062, "global_step": 83694, "epoch": 498} {"train_loss": -9.25363540649414, "global_step": 83695, "epoch": 498} {"train_loss": -9.370931625366211, "global_step": 83696, "epoch": 498} {"train_loss": -9.510891914367676, "global_step": 83697, "epoch": 498} {"train_loss": -9.398946762084961, "global_step": 83698, "epoch": 498} {"train_loss": -9.567788124084473, "global_step": 83699, "epoch": 498} {"train_loss": -9.402795791625977, "global_step": 83700, "epoch": 498} {"train_loss": -9.427058219909668, "global_step": 83701, "epoch": 498} {"train_loss": -9.472867965698242, "global_step": 83702, "epoch": 498} {"train_loss": -9.353697776794434, "global_step": 83703, "epoch": 498} {"train_loss": -9.412155151367188, "global_step": 83704, "epoch": 498} {"train_loss": -9.072368621826172, "global_step": 83705, "epoch": 498} {"train_loss": -9.427474975585938, "global_step": 83706, "epoch": 498} {"train_loss": -9.379047393798828, "global_step": 83707, "epoch": 498} {"train_loss": -9.40778923034668, "global_step": 83708, "epoch": 498} {"train_loss": -9.12123966217041, "global_step": 83709, "epoch": 498} {"train_loss": -8.975313186645508, "global_step": 83710, "epoch": 498} {"train_loss": -8.875253677368164, "global_step": 83711, "epoch": 498} {"train_loss": -8.808283805847168, "global_step": 83712, "epoch": 498} {"train_loss": -9.37841796875, "global_step": 83713, "epoch": 498} {"train_loss": -8.84928035736084, "global_step": 83714, "epoch": 498} {"train_loss": -9.169248580932617, "global_step": 83715, "epoch": 498} {"train_loss": -9.092456817626953, "global_step": 83716, "epoch": 498} {"train_loss": -8.991386413574219, "global_step": 83717, "epoch": 498} {"train_loss": -9.145672798156738, "global_step": 83718, "epoch": 498} {"train_loss": -9.15034294128418, "global_step": 83719, "epoch": 498} {"train_loss": -9.035593032836914, "global_step": 83720, "epoch": 498} {"train_loss": -9.284255981445312, "global_step": 83721, "epoch": 498} {"train_loss": -9.364282608032227, "global_step": 83722, "epoch": 498} {"train_loss": -9.292778015136719, "global_step": 83723, "epoch": 498} {"train_loss": -9.384382247924805, "global_step": 83724, "epoch": 498} {"train_loss": -9.134963035583496, "global_step": 83725, "epoch": 498} {"train_loss": -9.124723434448242, "global_step": 83726, "epoch": 498} {"train_loss": -9.296813011169434, "global_step": 83727, "epoch": 498} {"train_loss": -9.40950870513916, "global_step": 83728, "epoch": 498} {"train_loss": -9.217341423034668, "global_step": 83729, "epoch": 498} {"train_loss": -9.357531547546387, "global_step": 83730, "epoch": 498} {"train_loss": -9.250828742980957, "global_step": 83731, "epoch": 498} {"train_loss": -9.462661743164062, "global_step": 83732, "epoch": 498} {"train_loss": -9.300292015075684, "global_step": 83733, "epoch": 498} {"train_loss": -9.385457038879395, "global_step": 83734, "epoch": 498} {"train_loss": -9.43437385559082, "global_step": 83735, "epoch": 498} {"train_loss": -9.450672149658203, "global_step": 83736, "epoch": 498} {"train_loss": -9.522734642028809, "global_step": 83737, "epoch": 498} {"train_loss": -9.385034561157227, "global_step": 83738, "epoch": 498} {"train_loss": -9.27749252319336, "global_step": 83739, "epoch": 498} {"train_loss": -9.509790420532227, "global_step": 83740, "epoch": 498} {"train_loss": -9.284385681152344, "global_step": 83741, "epoch": 498} {"train_loss": -9.062362670898438, "global_step": 83742, "epoch": 498} {"train_loss": -9.41943645477295, "global_step": 83743, "epoch": 498} {"train_loss": -9.240995407104492, "global_step": 83744, "epoch": 498} {"train_loss": -9.294952392578125, "global_step": 83745, "epoch": 498} {"train_loss": -9.415918350219727, "global_step": 83746, "epoch": 498} {"train_loss": -9.589811325073242, "global_step": 83747, "epoch": 498} {"train_loss": -9.164182662963867, "global_step": 83748, "epoch": 498} {"train_loss": -9.320972442626953, "global_step": 83749, "epoch": 498} {"train_loss": -9.050444602966309, "global_step": 83750, "epoch": 498} {"train_loss": -8.982184410095215, "global_step": 83751, "epoch": 498} {"train_loss": -9.388656616210938, "global_step": 83752, "epoch": 498} {"train_loss": -9.38222885131836, "global_step": 83753, "epoch": 498} {"train_loss": -9.565668106079102, "global_step": 83754, "epoch": 498} {"train_loss": -9.284402847290039, "global_step": 83755, "epoch": 498} {"train_loss": -9.556194305419922, "global_step": 83756, "epoch": 498} {"train_loss": -9.387134552001953, "global_step": 83757, "epoch": 498} {"train_loss": -9.235495567321777, "global_step": 83758, "epoch": 498} {"train_loss": -9.680704116821289, "global_step": 83759, "epoch": 498} {"train_loss": -9.25157356262207, "global_step": 83760, "epoch": 498} {"train_loss": -9.358192443847656, "global_step": 83761, "epoch": 498} {"train_loss": -9.356225967407227, "global_step": 83762, "epoch": 498} {"train_loss": -9.168644905090332, "global_step": 83763, "epoch": 498} {"train_loss": -9.393625259399414, "global_step": 83764, "epoch": 498} {"train_loss": -9.133966445922852, "global_step": 83765, "epoch": 498} {"train_loss": -9.242573738098145, "global_step": 83766, "epoch": 498} {"train_loss": -9.074422836303711, "global_step": 83767, "epoch": 498} {"train_loss": -9.240377426147461, "global_step": 83768, "epoch": 498} {"train_loss": -9.15898323059082, "global_step": 83769, "epoch": 498} {"train_loss": -9.047542572021484, "global_step": 83770, "epoch": 498} {"train_loss": -9.160507202148438, "global_step": 83771, "epoch": 498} {"train_loss": -9.22371768951416, "global_step": 83772, "epoch": 498} {"train_loss": -9.423443794250488, "global_step": 83773, "epoch": 498} {"train_loss": -9.645591735839844, "global_step": 83774, "epoch": 498} {"train_loss": -9.344118118286133, "global_step": 83775, "epoch": 498} {"train_loss": -9.553777694702148, "global_step": 83776, "epoch": 498} {"train_loss": -9.380001068115234, "global_step": 83777, "epoch": 498} {"train_loss": -9.335338592529297, "global_step": 83778, "epoch": 498} {"train_loss": -9.173025131225586, "global_step": 83779, "epoch": 498} {"train_loss": -9.52363395690918, "global_step": 83780, "epoch": 498} {"train_loss": -9.37809944152832, "global_step": 83781, "epoch": 498} {"train_loss": -9.359418869018555, "global_step": 83782, "epoch": 498} {"train_loss": -9.435384750366211, "global_step": 83783, "epoch": 498} {"train_loss": -9.531848907470703, "global_step": 83784, "epoch": 498} {"train_loss": -9.329961776733398, "global_step": 83785, "epoch": 498} {"train_loss": -9.292976379394531, "global_step": 83786, "epoch": 498} {"train_loss": -9.387478828430176, "global_step": 83787, "epoch": 498} {"train_loss": -9.53217601776123, "global_step": 83788, "epoch": 498} {"train_loss": -9.5433349609375, "global_step": 83789, "epoch": 498} {"train_loss": -9.425596237182617, "global_step": 83790, "epoch": 498} {"train_loss": -9.435993194580078, "global_step": 83791, "epoch": 498} {"train_loss": -9.273483276367188, "global_step": 83792, "epoch": 498} {"train_loss": -9.193492889404297, "global_step": 83793, "epoch": 498} {"train_loss": -9.282090187072754, "global_step": 83794, "epoch": 498} {"train_loss": -9.270023345947266, "global_step": 83795, "epoch": 498} {"train_loss": -9.155763626098633, "global_step": 83796, "epoch": 498} {"train_loss": -9.31256103515625, "global_step": 83797, "epoch": 498} {"train_loss": -9.02008056640625, "global_step": 83798, "epoch": 498} {"train_loss": -9.2732515335083, "global_step": 83799, "epoch": 498} {"train_loss": -9.440136909484863, "global_step": 83800, "epoch": 498} {"train_loss": -9.287302017211914, "global_step": 83801, "epoch": 498} {"train_loss": -9.514824867248535, "global_step": 83802, "epoch": 498} {"train_loss": -9.310968399047852, "global_step": 83803, "epoch": 498} {"train_loss": -9.07221794128418, "global_step": 83804, "epoch": 498} {"train_loss": -9.251953125, "global_step": 83805, "epoch": 498} {"train_loss": -9.231983184814453, "global_step": 83806, "epoch": 498} {"train_loss": -9.180395126342773, "global_step": 83807, "epoch": 498} {"train_loss": -9.089935302734375, "global_step": 83808, "epoch": 498} {"train_loss": -9.257234573364258, "global_step": 83809, "epoch": 498} {"train_loss": -9.157268524169922, "global_step": 83810, "epoch": 498} {"train_loss": -9.07357406616211, "global_step": 83811, "epoch": 498} {"train_loss": -9.465951919555664, "global_step": 83812, "epoch": 498} {"train_loss": -9.215211868286133, "global_step": 83813, "epoch": 498} {"train_loss": -9.291414260864258, "global_step": 83814, "epoch": 498} {"train_loss": -9.431086540222168, "global_step": 83815, "epoch": 498} {"train_loss": -9.27794075012207, "global_step": 83816, "epoch": 498} {"train_loss": -9.133645057678223, "global_step": 83817, "epoch": 498} {"train_loss": -9.274975776672363, "global_step": 83818, "epoch": 498} {"train_loss": -9.55211067199707, "global_step": 83819, "epoch": 498} {"train_loss": -9.379315376281738, "global_step": 83820, "epoch": 498} {"train_loss": -9.367936134338379, "global_step": 83821, "epoch": 498} {"train_loss": -9.444731712341309, "global_step": 83822, "epoch": 498} {"train_loss": -9.47896957397461, "global_step": 83823, "epoch": 498} {"train_loss": -9.311237335205078, "global_step": 83824, "epoch": 498} {"train_loss": -9.355182647705078, "global_step": 83825, "epoch": 498} {"train_loss": -9.350910186767578, "global_step": 83826, "epoch": 498} {"train_loss": -9.511685371398926, "global_step": 83827, "epoch": 498} {"train_loss": -8.97768497467041, "global_step": 83828, "epoch": 498} {"train_loss": -9.382981300354004, "global_step": 83829, "epoch": 498} {"train_loss": -9.227813720703125, "global_step": 83830, "epoch": 498} {"train_loss": -9.2740972950345, "global_step": 83831, "epoch": 498, "val_loss": 198240.03125} {"train_loss": -9.465317726135254, "global_step": 83832, "epoch": 499} {"train_loss": -9.135366439819336, "global_step": 83833, "epoch": 499} {"train_loss": -9.384786605834961, "global_step": 83834, "epoch": 499} {"train_loss": -9.365856170654297, "global_step": 83835, "epoch": 499} {"train_loss": -9.294960021972656, "global_step": 83836, "epoch": 499} {"train_loss": -9.080190658569336, "global_step": 83837, "epoch": 499} {"train_loss": -8.929996490478516, "global_step": 83838, "epoch": 499} {"train_loss": -9.023628234863281, "global_step": 83839, "epoch": 499} {"train_loss": -8.943229675292969, "global_step": 83840, "epoch": 499} {"train_loss": -9.242607116699219, "global_step": 83841, "epoch": 499} {"train_loss": -9.194913864135742, "global_step": 83842, "epoch": 499} {"train_loss": -9.240625381469727, "global_step": 83843, "epoch": 499} {"train_loss": -9.117212295532227, "global_step": 83844, "epoch": 499} {"train_loss": -9.354633331298828, "global_step": 83845, "epoch": 499} {"train_loss": -9.272098541259766, "global_step": 83846, "epoch": 499} {"train_loss": -9.310945510864258, "global_step": 83847, "epoch": 499} {"train_loss": -9.550483703613281, "global_step": 83848, "epoch": 499} {"train_loss": -9.460458755493164, "global_step": 83849, "epoch": 499} {"train_loss": -9.539375305175781, "global_step": 83850, "epoch": 499} {"train_loss": -9.576614379882812, "global_step": 83851, "epoch": 499} {"train_loss": -9.309200286865234, "global_step": 83852, "epoch": 499} {"train_loss": -9.115835189819336, "global_step": 83853, "epoch": 499} {"train_loss": -9.443609237670898, "global_step": 83854, "epoch": 499} {"train_loss": -9.331048965454102, "global_step": 83855, "epoch": 499} {"train_loss": -9.356094360351562, "global_step": 83856, "epoch": 499} {"train_loss": -9.250068664550781, "global_step": 83857, "epoch": 499} {"train_loss": -9.4210844039917, "global_step": 83858, "epoch": 499} {"train_loss": -9.05435848236084, "global_step": 83859, "epoch": 499} {"train_loss": -9.600713729858398, "global_step": 83860, "epoch": 499} {"train_loss": -9.073492050170898, "global_step": 83861, "epoch": 499} {"train_loss": -9.049341201782227, "global_step": 83862, "epoch": 499} {"train_loss": -9.13032341003418, "global_step": 83863, "epoch": 499} {"train_loss": -9.060100555419922, "global_step": 83864, "epoch": 499} {"train_loss": -8.96940803527832, "global_step": 83865, "epoch": 499} {"train_loss": -9.070542335510254, "global_step": 83866, "epoch": 499} {"train_loss": -9.024962425231934, "global_step": 83867, "epoch": 499} {"train_loss": -9.304695129394531, "global_step": 83868, "epoch": 499} {"train_loss": -9.06020736694336, "global_step": 83869, "epoch": 499} {"train_loss": -8.89683723449707, "global_step": 83870, "epoch": 499} {"train_loss": -9.476116180419922, "global_step": 83871, "epoch": 499} {"train_loss": -8.857580184936523, "global_step": 83872, "epoch": 499} {"train_loss": -9.24538516998291, "global_step": 83873, "epoch": 499} {"train_loss": -9.012886047363281, "global_step": 83874, "epoch": 499} {"train_loss": -9.3822660446167, "global_step": 83875, "epoch": 499} {"train_loss": -8.888650894165039, "global_step": 83876, "epoch": 499} {"train_loss": -9.242509841918945, "global_step": 83877, "epoch": 499} {"train_loss": -9.355607986450195, "global_step": 83878, "epoch": 499} {"train_loss": -9.240129470825195, "global_step": 83879, "epoch": 499} {"train_loss": -9.180076599121094, "global_step": 83880, "epoch": 499} {"train_loss": -9.267410278320312, "global_step": 83881, "epoch": 499} {"train_loss": -9.298060417175293, "global_step": 83882, "epoch": 499} {"train_loss": -9.244484901428223, "global_step": 83883, "epoch": 499} {"train_loss": -9.144783020019531, "global_step": 83884, "epoch": 499} {"train_loss": -9.403841018676758, "global_step": 83885, "epoch": 499} {"train_loss": -9.378521919250488, "global_step": 83886, "epoch": 499} {"train_loss": -9.207548141479492, "global_step": 83887, "epoch": 499} {"train_loss": -9.11406421661377, "global_step": 83888, "epoch": 499} {"train_loss": -9.347648620605469, "global_step": 83889, "epoch": 499} {"train_loss": -9.258245468139648, "global_step": 83890, "epoch": 499} {"train_loss": -9.235539436340332, "global_step": 83891, "epoch": 499} {"train_loss": -9.44821548461914, "global_step": 83892, "epoch": 499} {"train_loss": -9.309593200683594, "global_step": 83893, "epoch": 499} {"train_loss": -9.461055755615234, "global_step": 83894, "epoch": 499} {"train_loss": -9.250540733337402, "global_step": 83895, "epoch": 499} {"train_loss": -9.439722061157227, "global_step": 83896, "epoch": 499} {"train_loss": -9.186141014099121, "global_step": 83897, "epoch": 499} {"train_loss": -9.424877166748047, "global_step": 83898, "epoch": 499} {"train_loss": -9.438098907470703, "global_step": 83899, "epoch": 499} {"train_loss": -9.178363800048828, "global_step": 83900, "epoch": 499} {"train_loss": -9.279277801513672, "global_step": 83901, "epoch": 499} {"train_loss": -9.444023132324219, "global_step": 83902, "epoch": 499} {"train_loss": -9.331880569458008, "global_step": 83903, "epoch": 499} {"train_loss": -9.435592651367188, "global_step": 83904, "epoch": 499} {"train_loss": -9.42362117767334, "global_step": 83905, "epoch": 499} {"train_loss": -9.430717468261719, "global_step": 83906, "epoch": 499} {"train_loss": -9.547906875610352, "global_step": 83907, "epoch": 499} {"train_loss": -9.098060607910156, "global_step": 83908, "epoch": 499} {"train_loss": -9.27233600616455, "global_step": 83909, "epoch": 499} {"train_loss": -8.946840286254883, "global_step": 83910, "epoch": 499} {"train_loss": -8.9190673828125, "global_step": 83911, "epoch": 499} {"train_loss": -8.958727836608887, "global_step": 83912, "epoch": 499} {"train_loss": -8.968902587890625, "global_step": 83913, "epoch": 499} {"train_loss": -9.058764457702637, "global_step": 83914, "epoch": 499} {"train_loss": -9.236047744750977, "global_step": 83915, "epoch": 499} {"train_loss": -8.943777084350586, "global_step": 83916, "epoch": 499} {"train_loss": -9.077589988708496, "global_step": 83917, "epoch": 499} {"train_loss": -8.843632698059082, "global_step": 83918, "epoch": 499} {"train_loss": -9.270709991455078, "global_step": 83919, "epoch": 499} {"train_loss": -9.152456283569336, "global_step": 83920, "epoch": 499} {"train_loss": -9.185047149658203, "global_step": 83921, "epoch": 499} {"train_loss": -9.032486915588379, "global_step": 83922, "epoch": 499} {"train_loss": -9.145679473876953, "global_step": 83923, "epoch": 499} {"train_loss": -9.133501052856445, "global_step": 83924, "epoch": 499} {"train_loss": -9.220693588256836, "global_step": 83925, "epoch": 499} {"train_loss": -9.21121597290039, "global_step": 83926, "epoch": 499} {"train_loss": -9.100671768188477, "global_step": 83927, "epoch": 499} {"train_loss": -9.195945739746094, "global_step": 83928, "epoch": 499} {"train_loss": -9.062968254089355, "global_step": 83929, "epoch": 499} {"train_loss": -9.284765243530273, "global_step": 83930, "epoch": 499} {"train_loss": -9.240583419799805, "global_step": 83931, "epoch": 499} {"train_loss": -9.168622016906738, "global_step": 83932, "epoch": 499} {"train_loss": -9.333603858947754, "global_step": 83933, "epoch": 499} {"train_loss": -9.33262825012207, "global_step": 83934, "epoch": 499} {"train_loss": -9.348428726196289, "global_step": 83935, "epoch": 499} {"train_loss": -9.406560897827148, "global_step": 83936, "epoch": 499} {"train_loss": -9.492958068847656, "global_step": 83937, "epoch": 499} {"train_loss": -9.4823579788208, "global_step": 83938, "epoch": 499} {"train_loss": -9.242835998535156, "global_step": 83939, "epoch": 499} {"train_loss": -9.31953239440918, "global_step": 83940, "epoch": 499} {"train_loss": -9.383489608764648, "global_step": 83941, "epoch": 499} {"train_loss": -9.487814903259277, "global_step": 83942, "epoch": 499} {"train_loss": -9.508329391479492, "global_step": 83943, "epoch": 499} {"train_loss": -9.399529457092285, "global_step": 83944, "epoch": 499} {"train_loss": -9.434985160827637, "global_step": 83945, "epoch": 499} {"train_loss": -9.353110313415527, "global_step": 83946, "epoch": 499} {"train_loss": -9.410120010375977, "global_step": 83947, "epoch": 499} {"train_loss": -9.496337890625, "global_step": 83948, "epoch": 499} {"train_loss": -9.503166198730469, "global_step": 83949, "epoch": 499} {"train_loss": -9.31918716430664, "global_step": 83950, "epoch": 499} {"train_loss": -9.244523048400879, "global_step": 83951, "epoch": 499} {"train_loss": -9.277297973632812, "global_step": 83952, "epoch": 499} {"train_loss": -9.220438003540039, "global_step": 83953, "epoch": 499} {"train_loss": -9.53974723815918, "global_step": 83954, "epoch": 499} {"train_loss": -9.477096557617188, "global_step": 83955, "epoch": 499} {"train_loss": -9.661833763122559, "global_step": 83956, "epoch": 499} {"train_loss": -9.475506782531738, "global_step": 83957, "epoch": 499} {"train_loss": -9.561269760131836, "global_step": 83958, "epoch": 499} {"train_loss": -9.266700744628906, "global_step": 83959, "epoch": 499} {"train_loss": -9.235884666442871, "global_step": 83960, "epoch": 499} {"train_loss": -9.3756685256958, "global_step": 83961, "epoch": 499} {"train_loss": -9.187646865844727, "global_step": 83962, "epoch": 499} {"train_loss": -9.021949768066406, "global_step": 83963, "epoch": 499} {"train_loss": -9.1204833984375, "global_step": 83964, "epoch": 499} {"train_loss": -9.144651412963867, "global_step": 83965, "epoch": 499} {"train_loss": -9.137207984924316, "global_step": 83966, "epoch": 499} {"train_loss": -9.258382797241211, "global_step": 83967, "epoch": 499} {"train_loss": -9.26206111907959, "global_step": 83968, "epoch": 499} {"train_loss": -9.238971710205078, "global_step": 83969, "epoch": 499} {"train_loss": -9.415477752685547, "global_step": 83970, "epoch": 499} {"train_loss": -9.302300453186035, "global_step": 83971, "epoch": 499} {"train_loss": -9.346651077270508, "global_step": 83972, "epoch": 499} {"train_loss": -9.287858009338379, "global_step": 83973, "epoch": 499} {"train_loss": -9.016141891479492, "global_step": 83974, "epoch": 499} {"train_loss": -9.09152603149414, "global_step": 83975, "epoch": 499} {"train_loss": -9.30846118927002, "global_step": 83976, "epoch": 499} {"train_loss": -8.99176025390625, "global_step": 83977, "epoch": 499} {"train_loss": -9.258066177368164, "global_step": 83978, "epoch": 499} {"train_loss": -9.2159423828125, "global_step": 83979, "epoch": 499} {"train_loss": -9.101076126098633, "global_step": 83980, "epoch": 499} {"train_loss": -9.257490158081055, "global_step": 83981, "epoch": 499} {"train_loss": -9.193761825561523, "global_step": 83982, "epoch": 499} {"train_loss": -9.221051216125488, "global_step": 83983, "epoch": 499} {"train_loss": -9.162027359008789, "global_step": 83984, "epoch": 499} {"train_loss": -9.2282075881958, "global_step": 83985, "epoch": 499} {"train_loss": -9.187705039978027, "global_step": 83986, "epoch": 499} {"train_loss": -9.222099304199219, "global_step": 83987, "epoch": 499} {"train_loss": -9.13612174987793, "global_step": 83988, "epoch": 499} {"train_loss": -9.330055236816406, "global_step": 83989, "epoch": 499} {"train_loss": -9.021510124206543, "global_step": 83990, "epoch": 499} {"train_loss": -9.40843391418457, "global_step": 83991, "epoch": 499} {"train_loss": -9.240243911743164, "global_step": 83992, "epoch": 499} {"train_loss": -9.272298812866211, "global_step": 83993, "epoch": 499} {"train_loss": -9.442716598510742, "global_step": 83994, "epoch": 499} {"train_loss": -9.068441390991211, "global_step": 83995, "epoch": 499} {"train_loss": -9.308253288269043, "global_step": 83996, "epoch": 499} {"train_loss": -9.080109596252441, "global_step": 83997, "epoch": 499} {"train_loss": -9.29448127746582, "global_step": 83998, "epoch": 499} {"train_loss": -9.247580539612542, "global_step": 83999, "epoch": 499, "val_loss": 198962.8125} {"train_loss": -9.259119987487793, "global_step": 84000, "epoch": 500} {"train_loss": -9.157478332519531, "global_step": 84001, "epoch": 500} {"train_loss": -9.01933479309082, "global_step": 84002, "epoch": 500} {"train_loss": -9.348148345947266, "global_step": 84003, "epoch": 500} {"train_loss": -9.085897445678711, "global_step": 84004, "epoch": 500} {"train_loss": -9.04757308959961, "global_step": 84005, "epoch": 500} {"train_loss": -9.292753219604492, "global_step": 84006, "epoch": 500} {"train_loss": -9.071202278137207, "global_step": 84007, "epoch": 500} {"train_loss": -8.97375774383545, "global_step": 84008, "epoch": 500} {"train_loss": -9.194229125976562, "global_step": 84009, "epoch": 500} {"train_loss": -9.21945571899414, "global_step": 84010, "epoch": 500} {"train_loss": -9.354436874389648, "global_step": 84011, "epoch": 500} {"train_loss": -9.290008544921875, "global_step": 84012, "epoch": 500} {"train_loss": -9.35354232788086, "global_step": 84013, "epoch": 500} {"train_loss": -9.327536582946777, "global_step": 84014, "epoch": 500} {"train_loss": -9.294528007507324, "global_step": 84015, "epoch": 500} {"train_loss": -9.258825302124023, "global_step": 84016, "epoch": 500} {"train_loss": -9.289716720581055, "global_step": 84017, "epoch": 500} {"train_loss": -9.420785903930664, "global_step": 84018, "epoch": 500} {"train_loss": -9.341865539550781, "global_step": 84019, "epoch": 500} {"train_loss": -9.31020450592041, "global_step": 84020, "epoch": 500} {"train_loss": -9.192296981811523, "global_step": 84021, "epoch": 500} {"train_loss": -9.47608470916748, "global_step": 84022, "epoch": 500} {"train_loss": -9.253743171691895, "global_step": 84023, "epoch": 500} {"train_loss": -9.174488067626953, "global_step": 84024, "epoch": 500} {"train_loss": -9.329285621643066, "global_step": 84025, "epoch": 500} {"train_loss": -9.441926002502441, "global_step": 84026, "epoch": 500} {"train_loss": -9.441822052001953, "global_step": 84027, "epoch": 500} {"train_loss": -9.379900932312012, "global_step": 84028, "epoch": 500} {"train_loss": -9.439279556274414, "global_step": 84029, "epoch": 500} {"train_loss": -9.087772369384766, "global_step": 84030, "epoch": 500} {"train_loss": -9.243014335632324, "global_step": 84031, "epoch": 500} {"train_loss": -9.201000213623047, "global_step": 84032, "epoch": 500} {"train_loss": -9.294386863708496, "global_step": 84033, "epoch": 500} {"train_loss": -9.501190185546875, "global_step": 84034, "epoch": 500} {"train_loss": -9.128162384033203, "global_step": 84035, "epoch": 500} {"train_loss": -9.361800193786621, "global_step": 84036, "epoch": 500} {"train_loss": -9.203279495239258, "global_step": 84037, "epoch": 500} {"train_loss": -9.456964492797852, "global_step": 84038, "epoch": 500} {"train_loss": -9.185224533081055, "global_step": 84039, "epoch": 500} {"train_loss": -8.952909469604492, "global_step": 84040, "epoch": 500} {"train_loss": -8.97419261932373, "global_step": 84041, "epoch": 500} {"train_loss": -8.518259048461914, "global_step": 84042, "epoch": 500} {"train_loss": -9.134262084960938, "global_step": 84043, "epoch": 500} {"train_loss": -8.896806716918945, "global_step": 84044, "epoch": 500} {"train_loss": -8.729490280151367, "global_step": 84045, "epoch": 500} {"train_loss": -8.67750358581543, "global_step": 84046, "epoch": 500} {"train_loss": -8.391824722290039, "global_step": 84047, "epoch": 500} {"train_loss": -8.94472885131836, "global_step": 84048, "epoch": 500} {"train_loss": -8.950096130371094, "global_step": 84049, "epoch": 500} {"train_loss": -8.089742660522461, "global_step": 84050, "epoch": 500} {"train_loss": -9.081092834472656, "global_step": 84051, "epoch": 500} {"train_loss": -8.770380020141602, "global_step": 84052, "epoch": 500} {"train_loss": -8.686290740966797, "global_step": 84053, "epoch": 500} {"train_loss": -8.573992729187012, "global_step": 84054, "epoch": 500} {"train_loss": -9.023164749145508, "global_step": 84055, "epoch": 500} {"train_loss": -9.082240104675293, "global_step": 84056, "epoch": 500} {"train_loss": -8.928367614746094, "global_step": 84057, "epoch": 500} {"train_loss": -9.069188117980957, "global_step": 84058, "epoch": 500} {"train_loss": -9.143479347229004, "global_step": 84059, "epoch": 500} {"train_loss": -9.13249397277832, "global_step": 84060, "epoch": 500} {"train_loss": -8.985238075256348, "global_step": 84061, "epoch": 500} {"train_loss": -9.232428550720215, "global_step": 84062, "epoch": 500} {"train_loss": -9.079975128173828, "global_step": 84063, "epoch": 500} {"train_loss": -9.238056182861328, "global_step": 84064, "epoch": 500} {"train_loss": -9.122355461120605, "global_step": 84065, "epoch": 500} {"train_loss": -8.93205451965332, "global_step": 84066, "epoch": 500} {"train_loss": -9.335067749023438, "global_step": 84067, "epoch": 500} {"train_loss": -9.188997268676758, "global_step": 84068, "epoch": 500} {"train_loss": -9.30412483215332, "global_step": 84069, "epoch": 500} {"train_loss": -9.435856819152832, "global_step": 84070, "epoch": 500} {"train_loss": -9.571577072143555, "global_step": 84071, "epoch": 500} {"train_loss": -9.550122261047363, "global_step": 84072, "epoch": 500} {"train_loss": -9.316062927246094, "global_step": 84073, "epoch": 500} {"train_loss": -9.186050415039062, "global_step": 84074, "epoch": 500} {"train_loss": -9.256613731384277, "global_step": 84075, "epoch": 500} {"train_loss": -9.315729141235352, "global_step": 84076, "epoch": 500} {"train_loss": -9.430469512939453, "global_step": 84077, "epoch": 500} {"train_loss": -9.294639587402344, "global_step": 84078, "epoch": 500} {"train_loss": -9.276911735534668, "global_step": 84079, "epoch": 500} {"train_loss": -9.280631065368652, "global_step": 84080, "epoch": 500} {"train_loss": -9.306669235229492, "global_step": 84081, "epoch": 500} {"train_loss": -9.236763000488281, "global_step": 84082, "epoch": 500} {"train_loss": -9.266413688659668, "global_step": 84083, "epoch": 500} {"train_loss": -9.259214401245117, "global_step": 84084, "epoch": 500} {"train_loss": -9.185264587402344, "global_step": 84085, "epoch": 500} {"train_loss": -9.355552673339844, "global_step": 84086, "epoch": 500} {"train_loss": -9.462932586669922, "global_step": 84087, "epoch": 500} {"train_loss": -9.350966453552246, "global_step": 84088, "epoch": 500} {"train_loss": -9.282086372375488, "global_step": 84089, "epoch": 500} {"train_loss": -9.348611831665039, "global_step": 84090, "epoch": 500} {"train_loss": -8.958078384399414, "global_step": 84091, "epoch": 500} {"train_loss": -9.22673511505127, "global_step": 84092, "epoch": 500} {"train_loss": -9.187262535095215, "global_step": 84093, "epoch": 500} {"train_loss": -8.817569732666016, "global_step": 84094, "epoch": 500} {"train_loss": -8.86442756652832, "global_step": 84095, "epoch": 500} {"train_loss": -9.343989372253418, "global_step": 84096, "epoch": 500} {"train_loss": -9.207378387451172, "global_step": 84097, "epoch": 500} {"train_loss": -8.826741218566895, "global_step": 84098, "epoch": 500} {"train_loss": -9.161125183105469, "global_step": 84099, "epoch": 500} {"train_loss": -9.207077026367188, "global_step": 84100, "epoch": 500} {"train_loss": -9.035503387451172, "global_step": 84101, "epoch": 500} {"train_loss": -9.035856246948242, "global_step": 84102, "epoch": 500} {"train_loss": -9.281024932861328, "global_step": 84103, "epoch": 500} {"train_loss": -9.002426147460938, "global_step": 84104, "epoch": 500} {"train_loss": -9.064825057983398, "global_step": 84105, "epoch": 500} {"train_loss": -9.243111610412598, "global_step": 84106, "epoch": 500} {"train_loss": -9.361140251159668, "global_step": 84107, "epoch": 500} {"train_loss": -9.26759147644043, "global_step": 84108, "epoch": 500} {"train_loss": -9.235129356384277, "global_step": 84109, "epoch": 500} {"train_loss": -9.356334686279297, "global_step": 84110, "epoch": 500} {"train_loss": -9.333438873291016, "global_step": 84111, "epoch": 500} {"train_loss": -9.372359275817871, "global_step": 84112, "epoch": 500} {"train_loss": -9.397430419921875, "global_step": 84113, "epoch": 500} {"train_loss": -9.277754783630371, "global_step": 84114, "epoch": 500} {"train_loss": -9.520761489868164, "global_step": 84115, "epoch": 500} {"train_loss": -9.518906593322754, "global_step": 84116, "epoch": 500} {"train_loss": -9.413322448730469, "global_step": 84117, "epoch": 500} {"train_loss": -8.988649368286133, "global_step": 84118, "epoch": 500} {"train_loss": -9.56277084350586, "global_step": 84119, "epoch": 500} {"train_loss": -9.079561233520508, "global_step": 84120, "epoch": 500} {"train_loss": -9.171087265014648, "global_step": 84121, "epoch": 500} {"train_loss": -9.245201110839844, "global_step": 84122, "epoch": 500} {"train_loss": -9.33251953125, "global_step": 84123, "epoch": 500} {"train_loss": -9.143244743347168, "global_step": 84124, "epoch": 500} {"train_loss": -9.344618797302246, "global_step": 84125, "epoch": 500} {"train_loss": -9.197807312011719, "global_step": 84126, "epoch": 500} {"train_loss": -9.331901550292969, "global_step": 84127, "epoch": 500} {"train_loss": -9.160577774047852, "global_step": 84128, "epoch": 500} {"train_loss": -9.472332000732422, "global_step": 84129, "epoch": 500} {"train_loss": -9.256134986877441, "global_step": 84130, "epoch": 500} {"train_loss": -9.714632987976074, "global_step": 84131, "epoch": 500} {"train_loss": -9.302484512329102, "global_step": 84132, "epoch": 500} {"train_loss": -9.36130142211914, "global_step": 84133, "epoch": 500} {"train_loss": -9.512149810791016, "global_step": 84134, "epoch": 500} {"train_loss": -9.38180923461914, "global_step": 84135, "epoch": 500} {"train_loss": -9.555169105529785, "global_step": 84136, "epoch": 500} {"train_loss": -9.41958236694336, "global_step": 84137, "epoch": 500} {"train_loss": -9.496906280517578, "global_step": 84138, "epoch": 500} {"train_loss": -9.365598678588867, "global_step": 84139, "epoch": 500} {"train_loss": -9.502460479736328, "global_step": 84140, "epoch": 500} {"train_loss": -9.540386199951172, "global_step": 84141, "epoch": 500} {"train_loss": -9.316457748413086, "global_step": 84142, "epoch": 500} {"train_loss": -9.307092666625977, "global_step": 84143, "epoch": 500} {"train_loss": -9.2479248046875, "global_step": 84144, "epoch": 500} {"train_loss": -9.107522964477539, "global_step": 84145, "epoch": 500} {"train_loss": -9.564191818237305, "global_step": 84146, "epoch": 500} {"train_loss": -9.345714569091797, "global_step": 84147, "epoch": 500} {"train_loss": -9.505074501037598, "global_step": 84148, "epoch": 500} {"train_loss": -9.313587188720703, "global_step": 84149, "epoch": 500} {"train_loss": -9.259876251220703, "global_step": 84150, "epoch": 500} {"train_loss": -9.306640625, "global_step": 84151, "epoch": 500} {"train_loss": -9.295904159545898, "global_step": 84152, "epoch": 500} {"train_loss": -9.310737609863281, "global_step": 84153, "epoch": 500} {"train_loss": -9.054767608642578, "global_step": 84154, "epoch": 500} {"train_loss": -9.366443634033203, "global_step": 84155, "epoch": 500} {"train_loss": -9.079511642456055, "global_step": 84156, "epoch": 500} {"train_loss": -9.30544662475586, "global_step": 84157, "epoch": 500} {"train_loss": -8.9350004196167, "global_step": 84158, "epoch": 500} {"train_loss": -9.321613311767578, "global_step": 84159, "epoch": 500} {"train_loss": -9.160419464111328, "global_step": 84160, "epoch": 500} {"train_loss": -9.330904006958008, "global_step": 84161, "epoch": 500} {"train_loss": -9.298055648803711, "global_step": 84162, "epoch": 500} {"train_loss": -9.229095458984375, "global_step": 84163, "epoch": 500} {"train_loss": -9.33693790435791, "global_step": 84164, "epoch": 500} {"train_loss": -8.964834213256836, "global_step": 84165, "epoch": 500} {"train_loss": -9.022623062133789, "global_step": 84166, "epoch": 500} {"train_loss": -9.214876543907891, "global_step": 84167, "epoch": 500, "train/sim_max_reward_0": 0.6374095279125795, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.9685277824558546e-06, "train/sim_max_reward_3": 0.7230499996061714, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 0.2703925901329496, "test/sim_max_reward_4400001": 0.2981597376618111, "test/sim_max_reward_4400002": 0.4498372837628859, "test/sim_max_reward_4400003": 0.5268668906579884, "test/sim_max_reward_4400004": 0.402621943495682, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 0.28404429951127885, "test/sim_max_reward_4400007": 0.47846394638133954, "test/sim_max_reward_4400008": 0.5118983630963944, "test/sim_max_reward_4400009": 0.49007230815187447, "test/sim_max_reward_4400010": 0.2358484599039295, "test/sim_max_reward_4400011": 0.9020234830293884, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.9799740108783214, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9899789115021183, "test/sim_max_reward_4400019": 0.43333384360597327, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.6887591291652339, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.13999483225767823, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6652669249029022, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.9212008471263512, "test/sim_max_reward_4400028": 0.6983025268184165, "test/sim_max_reward_4400029": 0.6263175502267586, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.004674931932248272, "test/sim_max_reward_4400033": 0.9739188657603387, "test/sim_max_reward_4400034": 0.970920666392278, "test/sim_max_reward_4400035": 0.9838251569403532, "test/sim_max_reward_4400036": 0.368438027923315, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.9944587741630712, "test/sim_max_reward_4400039": 0.9609493085789568, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6612987771440069, "test/sim_max_reward_4400042": 0.08834356599320513, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.9903933322495404, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.7267435826744223, "test/mean_score": 0.5817777187233646, "val_loss": 198244.359375, "train_action_mse_error": 5.458433151245117} {"train_loss": -9.008650779724121, "global_step": 84168, "epoch": 501} {"train_loss": -9.191920280456543, "global_step": 84169, "epoch": 501} {"train_loss": -8.72842025756836, "global_step": 84170, "epoch": 501} {"train_loss": -8.763437271118164, "global_step": 84171, "epoch": 501} {"train_loss": -8.818868637084961, "global_step": 84172, "epoch": 501} {"train_loss": -9.15941047668457, "global_step": 84173, "epoch": 501} {"train_loss": -8.740267753601074, "global_step": 84174, "epoch": 501} {"train_loss": -9.102884292602539, "global_step": 84175, "epoch": 501} {"train_loss": -8.776342391967773, "global_step": 84176, "epoch": 501} {"train_loss": -8.922662734985352, "global_step": 84177, "epoch": 501} {"train_loss": -9.031087875366211, "global_step": 84178, "epoch": 501} {"train_loss": -9.014094352722168, "global_step": 84179, "epoch": 501} {"train_loss": -9.15821647644043, "global_step": 84180, "epoch": 501} {"train_loss": -9.05943489074707, "global_step": 84181, "epoch": 501} {"train_loss": -8.948029518127441, "global_step": 84182, "epoch": 501} {"train_loss": -9.289876937866211, "global_step": 84183, "epoch": 501} {"train_loss": -9.237987518310547, "global_step": 84184, "epoch": 501} {"train_loss": -9.064300537109375, "global_step": 84185, "epoch": 501} {"train_loss": -9.19034481048584, "global_step": 84186, "epoch": 501} {"train_loss": -9.096084594726562, "global_step": 84187, "epoch": 501} {"train_loss": -8.85940170288086, "global_step": 84188, "epoch": 501} {"train_loss": -9.005520820617676, "global_step": 84189, "epoch": 501} {"train_loss": -8.933961868286133, "global_step": 84190, "epoch": 501} {"train_loss": -9.125646591186523, "global_step": 84191, "epoch": 501} {"train_loss": -9.063713073730469, "global_step": 84192, "epoch": 501} {"train_loss": -9.422880172729492, "global_step": 84193, "epoch": 501} {"train_loss": -9.078941345214844, "global_step": 84194, "epoch": 501} {"train_loss": -9.179275512695312, "global_step": 84195, "epoch": 501} {"train_loss": -9.14889907836914, "global_step": 84196, "epoch": 501} {"train_loss": -9.333721160888672, "global_step": 84197, "epoch": 501} {"train_loss": -9.302943229675293, "global_step": 84198, "epoch": 501} {"train_loss": -9.338438987731934, "global_step": 84199, "epoch": 501} {"train_loss": -9.23511791229248, "global_step": 84200, "epoch": 501} {"train_loss": -9.503946304321289, "global_step": 84201, "epoch": 501} {"train_loss": -9.493520736694336, "global_step": 84202, "epoch": 501} {"train_loss": -9.48656940460205, "global_step": 84203, "epoch": 501} {"train_loss": -9.255233764648438, "global_step": 84204, "epoch": 501} {"train_loss": -9.311295509338379, "global_step": 84205, "epoch": 501} {"train_loss": -9.439037322998047, "global_step": 84206, "epoch": 501} {"train_loss": -9.335575103759766, "global_step": 84207, "epoch": 501} {"train_loss": -9.482181549072266, "global_step": 84208, "epoch": 501} {"train_loss": -9.320146560668945, "global_step": 84209, "epoch": 501} {"train_loss": -9.340139389038086, "global_step": 84210, "epoch": 501} {"train_loss": -9.347650527954102, "global_step": 84211, "epoch": 501} {"train_loss": -9.179433822631836, "global_step": 84212, "epoch": 501} {"train_loss": -9.281376838684082, "global_step": 84213, "epoch": 501} {"train_loss": -8.988167762756348, "global_step": 84214, "epoch": 501} {"train_loss": -9.548230171203613, "global_step": 84215, "epoch": 501} {"train_loss": -9.329500198364258, "global_step": 84216, "epoch": 501} {"train_loss": -9.10036849975586, "global_step": 84217, "epoch": 501} {"train_loss": -9.251752853393555, "global_step": 84218, "epoch": 501} {"train_loss": -9.099536895751953, "global_step": 84219, "epoch": 501} {"train_loss": -9.41158390045166, "global_step": 84220, "epoch": 501} {"train_loss": -8.99442195892334, "global_step": 84221, "epoch": 501} {"train_loss": -9.194515228271484, "global_step": 84222, "epoch": 501} {"train_loss": -9.022867202758789, "global_step": 84223, "epoch": 501} {"train_loss": -9.004295349121094, "global_step": 84224, "epoch": 501} {"train_loss": -9.096602439880371, "global_step": 84225, "epoch": 501} {"train_loss": -9.201972007751465, "global_step": 84226, "epoch": 501} {"train_loss": -8.804924011230469, "global_step": 84227, "epoch": 501} {"train_loss": -8.711466789245605, "global_step": 84228, "epoch": 501} {"train_loss": -8.92625617980957, "global_step": 84229, "epoch": 501} {"train_loss": -8.875948905944824, "global_step": 84230, "epoch": 501} {"train_loss": -8.865584373474121, "global_step": 84231, "epoch": 501} {"train_loss": -8.688850402832031, "global_step": 84232, "epoch": 501} {"train_loss": -9.079591751098633, "global_step": 84233, "epoch": 501} {"train_loss": -8.864702224731445, "global_step": 84234, "epoch": 501} {"train_loss": -9.089563369750977, "global_step": 84235, "epoch": 501} {"train_loss": -8.842998504638672, "global_step": 84236, "epoch": 501} {"train_loss": -9.198622703552246, "global_step": 84237, "epoch": 501} {"train_loss": -8.814041137695312, "global_step": 84238, "epoch": 501} {"train_loss": -9.041353225708008, "global_step": 84239, "epoch": 501} {"train_loss": -8.876724243164062, "global_step": 84240, "epoch": 501} {"train_loss": -9.29056167602539, "global_step": 84241, "epoch": 501} {"train_loss": -9.034971237182617, "global_step": 84242, "epoch": 501} {"train_loss": -9.099843978881836, "global_step": 84243, "epoch": 501} {"train_loss": -9.090582847595215, "global_step": 84244, "epoch": 501} {"train_loss": -9.119823455810547, "global_step": 84245, "epoch": 501} {"train_loss": -9.256792068481445, "global_step": 84246, "epoch": 501} {"train_loss": -9.135686874389648, "global_step": 84247, "epoch": 501} {"train_loss": -9.280046463012695, "global_step": 84248, "epoch": 501} {"train_loss": -8.935602188110352, "global_step": 84249, "epoch": 501} {"train_loss": -9.234785079956055, "global_step": 84250, "epoch": 501} {"train_loss": -9.375741958618164, "global_step": 84251, "epoch": 501} {"train_loss": -9.154708862304688, "global_step": 84252, "epoch": 501} {"train_loss": -9.38926887512207, "global_step": 84253, "epoch": 501} {"train_loss": -9.160348892211914, "global_step": 84254, "epoch": 501} {"train_loss": -9.411605834960938, "global_step": 84255, "epoch": 501} {"train_loss": -9.228425025939941, "global_step": 84256, "epoch": 501} {"train_loss": -9.329427719116211, "global_step": 84257, "epoch": 501} {"train_loss": -9.487787246704102, "global_step": 84258, "epoch": 501} {"train_loss": -9.452792167663574, "global_step": 84259, "epoch": 501} {"train_loss": -9.498326301574707, "global_step": 84260, "epoch": 501} {"train_loss": -9.468640327453613, "global_step": 84261, "epoch": 501} {"train_loss": -9.263047218322754, "global_step": 84262, "epoch": 501} {"train_loss": -9.321523666381836, "global_step": 84263, "epoch": 501} {"train_loss": -9.277560234069824, "global_step": 84264, "epoch": 501} {"train_loss": -9.690220832824707, "global_step": 84265, "epoch": 501} {"train_loss": -9.43516731262207, "global_step": 84266, "epoch": 501} {"train_loss": -9.364110946655273, "global_step": 84267, "epoch": 501} {"train_loss": -9.267383575439453, "global_step": 84268, "epoch": 501} {"train_loss": -9.450811386108398, "global_step": 84269, "epoch": 501} {"train_loss": -9.500709533691406, "global_step": 84270, "epoch": 501} {"train_loss": -9.352030754089355, "global_step": 84271, "epoch": 501} {"train_loss": -9.220279693603516, "global_step": 84272, "epoch": 501} {"train_loss": -9.455066680908203, "global_step": 84273, "epoch": 501} {"train_loss": -9.228021621704102, "global_step": 84274, "epoch": 501} {"train_loss": -9.287017822265625, "global_step": 84275, "epoch": 501} {"train_loss": -9.220369338989258, "global_step": 84276, "epoch": 501} {"train_loss": -9.434389114379883, "global_step": 84277, "epoch": 501} {"train_loss": -9.300577163696289, "global_step": 84278, "epoch": 501} {"train_loss": -9.420308113098145, "global_step": 84279, "epoch": 501} {"train_loss": -9.327173233032227, "global_step": 84280, "epoch": 501} {"train_loss": -9.314456939697266, "global_step": 84281, "epoch": 501} {"train_loss": -9.069537162780762, "global_step": 84282, "epoch": 501} {"train_loss": -9.048375129699707, "global_step": 84283, "epoch": 501} {"train_loss": -9.469343185424805, "global_step": 84284, "epoch": 501} {"train_loss": -9.30682373046875, "global_step": 84285, "epoch": 501} {"train_loss": -9.477545738220215, "global_step": 84286, "epoch": 501} {"train_loss": -9.307685852050781, "global_step": 84287, "epoch": 501} {"train_loss": -9.134222984313965, "global_step": 84288, "epoch": 501} {"train_loss": -9.028138160705566, "global_step": 84289, "epoch": 501} {"train_loss": -9.132593154907227, "global_step": 84290, "epoch": 501} {"train_loss": -9.290794372558594, "global_step": 84291, "epoch": 501} {"train_loss": -9.276439666748047, "global_step": 84292, "epoch": 501} {"train_loss": -9.286073684692383, "global_step": 84293, "epoch": 501} {"train_loss": -9.132554054260254, "global_step": 84294, "epoch": 501} {"train_loss": -9.20608139038086, "global_step": 84295, "epoch": 501} {"train_loss": -9.397693634033203, "global_step": 84296, "epoch": 501} {"train_loss": -9.097536087036133, "global_step": 84297, "epoch": 501} {"train_loss": -9.202244758605957, "global_step": 84298, "epoch": 501} {"train_loss": -9.012256622314453, "global_step": 84299, "epoch": 501} {"train_loss": -9.220085144042969, "global_step": 84300, "epoch": 501} {"train_loss": -9.185914993286133, "global_step": 84301, "epoch": 501} {"train_loss": -9.072212219238281, "global_step": 84302, "epoch": 501} {"train_loss": -9.193441390991211, "global_step": 84303, "epoch": 501} {"train_loss": -9.358625411987305, "global_step": 84304, "epoch": 501} {"train_loss": -9.088567733764648, "global_step": 84305, "epoch": 501} {"train_loss": -9.240726470947266, "global_step": 84306, "epoch": 501} {"train_loss": -9.353092193603516, "global_step": 84307, "epoch": 501} {"train_loss": -9.476398468017578, "global_step": 84308, "epoch": 501} {"train_loss": -9.35260009765625, "global_step": 84309, "epoch": 501} {"train_loss": -9.433977127075195, "global_step": 84310, "epoch": 501} {"train_loss": -9.36392879486084, "global_step": 84311, "epoch": 501} {"train_loss": -9.448229789733887, "global_step": 84312, "epoch": 501} {"train_loss": -9.564155578613281, "global_step": 84313, "epoch": 501} {"train_loss": -9.40194320678711, "global_step": 84314, "epoch": 501} {"train_loss": -9.436010360717773, "global_step": 84315, "epoch": 501} {"train_loss": -9.22535514831543, "global_step": 84316, "epoch": 501} {"train_loss": -9.31495475769043, "global_step": 84317, "epoch": 501} {"train_loss": -9.054132461547852, "global_step": 84318, "epoch": 501} {"train_loss": -9.541570663452148, "global_step": 84319, "epoch": 501} {"train_loss": -9.385931015014648, "global_step": 84320, "epoch": 501} {"train_loss": -9.359530448913574, "global_step": 84321, "epoch": 501} {"train_loss": -8.949003219604492, "global_step": 84322, "epoch": 501} {"train_loss": -9.473169326782227, "global_step": 84323, "epoch": 501} {"train_loss": -9.305213928222656, "global_step": 84324, "epoch": 501} {"train_loss": -9.032171249389648, "global_step": 84325, "epoch": 501} {"train_loss": -9.437705039978027, "global_step": 84326, "epoch": 501} {"train_loss": -9.048948287963867, "global_step": 84327, "epoch": 501} {"train_loss": -9.324256896972656, "global_step": 84328, "epoch": 501} {"train_loss": -9.116491317749023, "global_step": 84329, "epoch": 501} {"train_loss": -9.335168838500977, "global_step": 84330, "epoch": 501} {"train_loss": -9.377176284790039, "global_step": 84331, "epoch": 501} {"train_loss": -9.254416465759277, "global_step": 84332, "epoch": 501} {"train_loss": -9.207871437072754, "global_step": 84333, "epoch": 501} {"train_loss": -9.296821594238281, "global_step": 84334, "epoch": 501} {"train_loss": -9.206946083477565, "global_step": 84335, "epoch": 501, "val_loss": 200002.3125} {"train_loss": -9.443218231201172, "global_step": 84336, "epoch": 502} {"train_loss": -9.359594345092773, "global_step": 84337, "epoch": 502} {"train_loss": -9.172318458557129, "global_step": 84338, "epoch": 502} {"train_loss": -9.19717788696289, "global_step": 84339, "epoch": 502} {"train_loss": -9.283876419067383, "global_step": 84340, "epoch": 502} {"train_loss": -9.20464038848877, "global_step": 84341, "epoch": 502} {"train_loss": -9.306665420532227, "global_step": 84342, "epoch": 502} {"train_loss": -9.27035140991211, "global_step": 84343, "epoch": 502} {"train_loss": -8.70022201538086, "global_step": 84344, "epoch": 502} {"train_loss": -9.274580001831055, "global_step": 84345, "epoch": 502} {"train_loss": -8.863048553466797, "global_step": 84346, "epoch": 502} {"train_loss": -9.29630184173584, "global_step": 84347, "epoch": 502} {"train_loss": -8.795328140258789, "global_step": 84348, "epoch": 502} {"train_loss": -8.998340606689453, "global_step": 84349, "epoch": 502} {"train_loss": -9.022228240966797, "global_step": 84350, "epoch": 502} {"train_loss": -9.151283264160156, "global_step": 84351, "epoch": 502} {"train_loss": -8.991122245788574, "global_step": 84352, "epoch": 502} {"train_loss": -8.919539451599121, "global_step": 84353, "epoch": 502} {"train_loss": -9.302351951599121, "global_step": 84354, "epoch": 502} {"train_loss": -9.03560733795166, "global_step": 84355, "epoch": 502} {"train_loss": -8.92981243133545, "global_step": 84356, "epoch": 502} {"train_loss": -9.211174011230469, "global_step": 84357, "epoch": 502} {"train_loss": -9.161437034606934, "global_step": 84358, "epoch": 502} {"train_loss": -8.954736709594727, "global_step": 84359, "epoch": 502} {"train_loss": -8.879658699035645, "global_step": 84360, "epoch": 502} {"train_loss": -9.140514373779297, "global_step": 84361, "epoch": 502} {"train_loss": -8.950033187866211, "global_step": 84362, "epoch": 502} {"train_loss": -9.227361679077148, "global_step": 84363, "epoch": 502} {"train_loss": -9.065321922302246, "global_step": 84364, "epoch": 502} {"train_loss": -8.844599723815918, "global_step": 84365, "epoch": 502} {"train_loss": -9.339750289916992, "global_step": 84366, "epoch": 502} {"train_loss": -9.356756210327148, "global_step": 84367, "epoch": 502} {"train_loss": -9.182685852050781, "global_step": 84368, "epoch": 502} {"train_loss": -9.016032218933105, "global_step": 84369, "epoch": 502} {"train_loss": -9.412553787231445, "global_step": 84370, "epoch": 502} {"train_loss": -9.079687118530273, "global_step": 84371, "epoch": 502} {"train_loss": -9.121194839477539, "global_step": 84372, "epoch": 502} {"train_loss": -9.49599838256836, "global_step": 84373, "epoch": 502} {"train_loss": -9.085951805114746, "global_step": 84374, "epoch": 502} {"train_loss": -9.166936874389648, "global_step": 84375, "epoch": 502} {"train_loss": -9.465795516967773, "global_step": 84376, "epoch": 502} {"train_loss": -9.343730926513672, "global_step": 84377, "epoch": 502} {"train_loss": -9.377033233642578, "global_step": 84378, "epoch": 502} {"train_loss": -8.921590805053711, "global_step": 84379, "epoch": 502} {"train_loss": -9.407651901245117, "global_step": 84380, "epoch": 502} {"train_loss": -9.240509986877441, "global_step": 84381, "epoch": 502} {"train_loss": -9.377927780151367, "global_step": 84382, "epoch": 502} {"train_loss": -9.348403930664062, "global_step": 84383, "epoch": 502} {"train_loss": -9.329690933227539, "global_step": 84384, "epoch": 502} {"train_loss": -9.397029876708984, "global_step": 84385, "epoch": 502} {"train_loss": -9.277524948120117, "global_step": 84386, "epoch": 502} {"train_loss": -9.530421257019043, "global_step": 84387, "epoch": 502} {"train_loss": -9.314087867736816, "global_step": 84388, "epoch": 502} {"train_loss": -9.423334121704102, "global_step": 84389, "epoch": 502} {"train_loss": -9.278341293334961, "global_step": 84390, "epoch": 502} {"train_loss": -9.335378646850586, "global_step": 84391, "epoch": 502} {"train_loss": -9.701927185058594, "global_step": 84392, "epoch": 502} {"train_loss": -9.707878112792969, "global_step": 84393, "epoch": 502} {"train_loss": -9.643672943115234, "global_step": 84394, "epoch": 502} {"train_loss": -9.469551086425781, "global_step": 84395, "epoch": 502} {"train_loss": -9.525999069213867, "global_step": 84396, "epoch": 502} {"train_loss": -9.600322723388672, "global_step": 84397, "epoch": 502} {"train_loss": -9.443902015686035, "global_step": 84398, "epoch": 502} {"train_loss": -9.142909049987793, "global_step": 84399, "epoch": 502} {"train_loss": -9.56597900390625, "global_step": 84400, "epoch": 502} {"train_loss": -9.308303833007812, "global_step": 84401, "epoch": 502} {"train_loss": -9.442787170410156, "global_step": 84402, "epoch": 502} {"train_loss": -9.233575820922852, "global_step": 84403, "epoch": 502} {"train_loss": -9.181617736816406, "global_step": 84404, "epoch": 502} {"train_loss": -9.38755989074707, "global_step": 84405, "epoch": 502} {"train_loss": -9.355598449707031, "global_step": 84406, "epoch": 502} {"train_loss": -9.59939956665039, "global_step": 84407, "epoch": 502} {"train_loss": -9.332643508911133, "global_step": 84408, "epoch": 502} {"train_loss": -9.158941268920898, "global_step": 84409, "epoch": 502} {"train_loss": -9.382789611816406, "global_step": 84410, "epoch": 502} {"train_loss": -9.284862518310547, "global_step": 84411, "epoch": 502} {"train_loss": -9.315790176391602, "global_step": 84412, "epoch": 502} {"train_loss": -9.204728126525879, "global_step": 84413, "epoch": 502} {"train_loss": -8.970137596130371, "global_step": 84414, "epoch": 502} {"train_loss": -9.364191055297852, "global_step": 84415, "epoch": 502} {"train_loss": -9.068487167358398, "global_step": 84416, "epoch": 502} {"train_loss": -9.515605926513672, "global_step": 84417, "epoch": 502} {"train_loss": -9.12570571899414, "global_step": 84418, "epoch": 502} {"train_loss": -9.056107521057129, "global_step": 84419, "epoch": 502} {"train_loss": -9.381370544433594, "global_step": 84420, "epoch": 502} {"train_loss": -9.086041450500488, "global_step": 84421, "epoch": 502} {"train_loss": -9.520589828491211, "global_step": 84422, "epoch": 502} {"train_loss": -9.3201904296875, "global_step": 84423, "epoch": 502} {"train_loss": -9.313896179199219, "global_step": 84424, "epoch": 502} {"train_loss": -9.298376083374023, "global_step": 84425, "epoch": 502} {"train_loss": -9.440998077392578, "global_step": 84426, "epoch": 502} {"train_loss": -9.531410217285156, "global_step": 84427, "epoch": 502} {"train_loss": -9.378759384155273, "global_step": 84428, "epoch": 502} {"train_loss": -9.45203685760498, "global_step": 84429, "epoch": 502} {"train_loss": -9.115732192993164, "global_step": 84430, "epoch": 502} {"train_loss": -9.390495300292969, "global_step": 84431, "epoch": 502} {"train_loss": -9.353475570678711, "global_step": 84432, "epoch": 502} {"train_loss": -9.240875244140625, "global_step": 84433, "epoch": 502} {"train_loss": -9.451655387878418, "global_step": 84434, "epoch": 502} {"train_loss": -9.400246620178223, "global_step": 84435, "epoch": 502} {"train_loss": -9.380961418151855, "global_step": 84436, "epoch": 502} {"train_loss": -9.354154586791992, "global_step": 84437, "epoch": 502} {"train_loss": -9.423981666564941, "global_step": 84438, "epoch": 502} {"train_loss": -9.467101097106934, "global_step": 84439, "epoch": 502} {"train_loss": -9.372756958007812, "global_step": 84440, "epoch": 502} {"train_loss": -9.22757339477539, "global_step": 84441, "epoch": 502} {"train_loss": -9.449865341186523, "global_step": 84442, "epoch": 502} {"train_loss": -9.331576347351074, "global_step": 84443, "epoch": 502} {"train_loss": -9.12411880493164, "global_step": 84444, "epoch": 502} {"train_loss": -9.186317443847656, "global_step": 84445, "epoch": 502} {"train_loss": -9.193446159362793, "global_step": 84446, "epoch": 502} {"train_loss": -9.388282775878906, "global_step": 84447, "epoch": 502} {"train_loss": -9.218212127685547, "global_step": 84448, "epoch": 502} {"train_loss": -9.372292518615723, "global_step": 84449, "epoch": 502} {"train_loss": -9.110664367675781, "global_step": 84450, "epoch": 502} {"train_loss": -9.171833992004395, "global_step": 84451, "epoch": 502} {"train_loss": -9.38664436340332, "global_step": 84452, "epoch": 502} {"train_loss": -9.179402351379395, "global_step": 84453, "epoch": 502} {"train_loss": -9.162554740905762, "global_step": 84454, "epoch": 502} {"train_loss": -9.162872314453125, "global_step": 84455, "epoch": 502} {"train_loss": -9.08121395111084, "global_step": 84456, "epoch": 502} {"train_loss": -9.409646987915039, "global_step": 84457, "epoch": 502} {"train_loss": -9.288511276245117, "global_step": 84458, "epoch": 502} {"train_loss": -9.002968788146973, "global_step": 84459, "epoch": 502} {"train_loss": -9.52719497680664, "global_step": 84460, "epoch": 502} {"train_loss": -9.190662384033203, "global_step": 84461, "epoch": 502} {"train_loss": -9.233078002929688, "global_step": 84462, "epoch": 502} {"train_loss": -9.175137519836426, "global_step": 84463, "epoch": 502} {"train_loss": -9.318286895751953, "global_step": 84464, "epoch": 502} {"train_loss": -9.323186874389648, "global_step": 84465, "epoch": 502} {"train_loss": -9.167900085449219, "global_step": 84466, "epoch": 502} {"train_loss": -9.29800796508789, "global_step": 84467, "epoch": 502} {"train_loss": -9.006856918334961, "global_step": 84468, "epoch": 502} {"train_loss": -9.34416675567627, "global_step": 84469, "epoch": 502} {"train_loss": -9.314947128295898, "global_step": 84470, "epoch": 502} {"train_loss": -9.179901123046875, "global_step": 84471, "epoch": 502} {"train_loss": -9.470603942871094, "global_step": 84472, "epoch": 502} {"train_loss": -9.349784851074219, "global_step": 84473, "epoch": 502} {"train_loss": -9.461434364318848, "global_step": 84474, "epoch": 502} {"train_loss": -9.235721588134766, "global_step": 84475, "epoch": 502} {"train_loss": -9.362668991088867, "global_step": 84476, "epoch": 502} {"train_loss": -9.409652709960938, "global_step": 84477, "epoch": 502} {"train_loss": -9.199287414550781, "global_step": 84478, "epoch": 502} {"train_loss": -9.54983901977539, "global_step": 84479, "epoch": 502} {"train_loss": -9.385791778564453, "global_step": 84480, "epoch": 502} {"train_loss": -9.478165626525879, "global_step": 84481, "epoch": 502} {"train_loss": -9.116887092590332, "global_step": 84482, "epoch": 502} {"train_loss": -9.604413986206055, "global_step": 84483, "epoch": 502} {"train_loss": -9.526847839355469, "global_step": 84484, "epoch": 502} {"train_loss": -9.208660125732422, "global_step": 84485, "epoch": 502} {"train_loss": -9.56022834777832, "global_step": 84486, "epoch": 502} {"train_loss": -9.501314163208008, "global_step": 84487, "epoch": 502} {"train_loss": -9.370218276977539, "global_step": 84488, "epoch": 502} {"train_loss": -9.293210983276367, "global_step": 84489, "epoch": 502} {"train_loss": -9.254405975341797, "global_step": 84490, "epoch": 502} {"train_loss": -9.095544815063477, "global_step": 84491, "epoch": 502} {"train_loss": -9.253859519958496, "global_step": 84492, "epoch": 502} {"train_loss": -9.15463638305664, "global_step": 84493, "epoch": 502} {"train_loss": -9.048307418823242, "global_step": 84494, "epoch": 502} {"train_loss": -9.405162811279297, "global_step": 84495, "epoch": 502} {"train_loss": -8.75457763671875, "global_step": 84496, "epoch": 502} {"train_loss": -9.311112403869629, "global_step": 84497, "epoch": 502} {"train_loss": -9.175230979919434, "global_step": 84498, "epoch": 502} {"train_loss": -9.138374328613281, "global_step": 84499, "epoch": 502} {"train_loss": -9.02487564086914, "global_step": 84500, "epoch": 502} {"train_loss": -9.337512016296387, "global_step": 84501, "epoch": 502} {"train_loss": -9.201972961425781, "global_step": 84502, "epoch": 502} {"train_loss": -9.268195316905068, "global_step": 84503, "epoch": 502, "val_loss": 198998.109375} {"train_loss": -9.190293312072754, "global_step": 84504, "epoch": 503} {"train_loss": -9.344286918640137, "global_step": 84505, "epoch": 503} {"train_loss": -9.398200988769531, "global_step": 84506, "epoch": 503} {"train_loss": -9.346406936645508, "global_step": 84507, "epoch": 503} {"train_loss": -9.340831756591797, "global_step": 84508, "epoch": 503} {"train_loss": -9.391331672668457, "global_step": 84509, "epoch": 503} {"train_loss": -9.390512466430664, "global_step": 84510, "epoch": 503} {"train_loss": -9.177424430847168, "global_step": 84511, "epoch": 503} {"train_loss": -9.032058715820312, "global_step": 84512, "epoch": 503} {"train_loss": -9.255793571472168, "global_step": 84513, "epoch": 503} {"train_loss": -9.335380554199219, "global_step": 84514, "epoch": 503} {"train_loss": -9.385017395019531, "global_step": 84515, "epoch": 503} {"train_loss": -9.276535987854004, "global_step": 84516, "epoch": 503} {"train_loss": -9.574540138244629, "global_step": 84517, "epoch": 503} {"train_loss": -9.6466646194458, "global_step": 84518, "epoch": 503} {"train_loss": -9.461333274841309, "global_step": 84519, "epoch": 503} {"train_loss": -9.204996109008789, "global_step": 84520, "epoch": 503} {"train_loss": -9.589813232421875, "global_step": 84521, "epoch": 503} {"train_loss": -9.556077003479004, "global_step": 84522, "epoch": 503} {"train_loss": -9.227117538452148, "global_step": 84523, "epoch": 503} {"train_loss": -9.381980895996094, "global_step": 84524, "epoch": 503} {"train_loss": -9.349581718444824, "global_step": 84525, "epoch": 503} {"train_loss": -8.781608581542969, "global_step": 84526, "epoch": 503} {"train_loss": -9.098943710327148, "global_step": 84527, "epoch": 503} {"train_loss": -9.040443420410156, "global_step": 84528, "epoch": 503} {"train_loss": -9.150495529174805, "global_step": 84529, "epoch": 503} {"train_loss": -9.247505187988281, "global_step": 84530, "epoch": 503} {"train_loss": -9.095067024230957, "global_step": 84531, "epoch": 503} {"train_loss": -9.001933097839355, "global_step": 84532, "epoch": 503} {"train_loss": -9.084806442260742, "global_step": 84533, "epoch": 503} {"train_loss": -8.994871139526367, "global_step": 84534, "epoch": 503} {"train_loss": -8.97507095336914, "global_step": 84535, "epoch": 503} {"train_loss": -9.15721321105957, "global_step": 84536, "epoch": 503} {"train_loss": -9.180509567260742, "global_step": 84537, "epoch": 503} {"train_loss": -9.118517875671387, "global_step": 84538, "epoch": 503} {"train_loss": -9.09550666809082, "global_step": 84539, "epoch": 503} {"train_loss": -9.473978042602539, "global_step": 84540, "epoch": 503} {"train_loss": -9.047948837280273, "global_step": 84541, "epoch": 503} {"train_loss": -9.248588562011719, "global_step": 84542, "epoch": 503} {"train_loss": -8.963068962097168, "global_step": 84543, "epoch": 503} {"train_loss": -9.068655014038086, "global_step": 84544, "epoch": 503} {"train_loss": -8.764525413513184, "global_step": 84545, "epoch": 503} {"train_loss": -8.808517456054688, "global_step": 84546, "epoch": 503} {"train_loss": -9.099924087524414, "global_step": 84547, "epoch": 503} {"train_loss": -8.407122611999512, "global_step": 84548, "epoch": 503} {"train_loss": -9.342382431030273, "global_step": 84549, "epoch": 503} {"train_loss": -9.080869674682617, "global_step": 84550, "epoch": 503} {"train_loss": -9.08707046508789, "global_step": 84551, "epoch": 503} {"train_loss": -8.794711112976074, "global_step": 84552, "epoch": 503} {"train_loss": -8.884326934814453, "global_step": 84553, "epoch": 503} {"train_loss": -8.972517013549805, "global_step": 84554, "epoch": 503} {"train_loss": -9.207176208496094, "global_step": 84555, "epoch": 503} {"train_loss": -9.043041229248047, "global_step": 84556, "epoch": 503} {"train_loss": -8.962545394897461, "global_step": 84557, "epoch": 503} {"train_loss": -9.225557327270508, "global_step": 84558, "epoch": 503} {"train_loss": -9.12620735168457, "global_step": 84559, "epoch": 503} {"train_loss": -9.18842887878418, "global_step": 84560, "epoch": 503} {"train_loss": -8.895036697387695, "global_step": 84561, "epoch": 503} {"train_loss": -9.264947891235352, "global_step": 84562, "epoch": 503} {"train_loss": -9.124320030212402, "global_step": 84563, "epoch": 503} {"train_loss": -9.104814529418945, "global_step": 84564, "epoch": 503} {"train_loss": -9.43448543548584, "global_step": 84565, "epoch": 503} {"train_loss": -9.033868789672852, "global_step": 84566, "epoch": 503} {"train_loss": -9.457540512084961, "global_step": 84567, "epoch": 503} {"train_loss": -8.883587837219238, "global_step": 84568, "epoch": 503} {"train_loss": -9.15097713470459, "global_step": 84569, "epoch": 503} {"train_loss": -8.999141693115234, "global_step": 84570, "epoch": 503} {"train_loss": -9.203994750976562, "global_step": 84571, "epoch": 503} {"train_loss": -8.820219039916992, "global_step": 84572, "epoch": 503} {"train_loss": -9.321746826171875, "global_step": 84573, "epoch": 503} {"train_loss": -9.348665237426758, "global_step": 84574, "epoch": 503} {"train_loss": -9.280675888061523, "global_step": 84575, "epoch": 503} {"train_loss": -9.517101287841797, "global_step": 84576, "epoch": 503} {"train_loss": -9.207881927490234, "global_step": 84577, "epoch": 503} {"train_loss": -9.265499114990234, "global_step": 84578, "epoch": 503} {"train_loss": -9.437952995300293, "global_step": 84579, "epoch": 503} {"train_loss": -9.357599258422852, "global_step": 84580, "epoch": 503} {"train_loss": -9.246728897094727, "global_step": 84581, "epoch": 503} {"train_loss": -9.432510375976562, "global_step": 84582, "epoch": 503} {"train_loss": -9.465631484985352, "global_step": 84583, "epoch": 503} {"train_loss": -9.280414581298828, "global_step": 84584, "epoch": 503} {"train_loss": -9.611526489257812, "global_step": 84585, "epoch": 503} {"train_loss": -9.439806938171387, "global_step": 84586, "epoch": 503} {"train_loss": -9.224061965942383, "global_step": 84587, "epoch": 503} {"train_loss": -9.601008415222168, "global_step": 84588, "epoch": 503} {"train_loss": -9.432245254516602, "global_step": 84589, "epoch": 503} {"train_loss": -9.196093559265137, "global_step": 84590, "epoch": 503} {"train_loss": -9.359237670898438, "global_step": 84591, "epoch": 503} {"train_loss": -9.350796699523926, "global_step": 84592, "epoch": 503} {"train_loss": -9.346304893493652, "global_step": 84593, "epoch": 503} {"train_loss": -9.277839660644531, "global_step": 84594, "epoch": 503} {"train_loss": -9.235603332519531, "global_step": 84595, "epoch": 503} {"train_loss": -9.144756317138672, "global_step": 84596, "epoch": 503} {"train_loss": -9.47132682800293, "global_step": 84597, "epoch": 503} {"train_loss": -9.15168285369873, "global_step": 84598, "epoch": 503} {"train_loss": -9.392578125, "global_step": 84599, "epoch": 503} {"train_loss": -9.604419708251953, "global_step": 84600, "epoch": 503} {"train_loss": -9.352981567382812, "global_step": 84601, "epoch": 503} {"train_loss": -9.37253189086914, "global_step": 84602, "epoch": 503} {"train_loss": -9.527924537658691, "global_step": 84603, "epoch": 503} {"train_loss": -9.195564270019531, "global_step": 84604, "epoch": 503} {"train_loss": -9.411584854125977, "global_step": 84605, "epoch": 503} {"train_loss": -9.45279312133789, "global_step": 84606, "epoch": 503} {"train_loss": -9.372507095336914, "global_step": 84607, "epoch": 503} {"train_loss": -9.587797164916992, "global_step": 84608, "epoch": 503} {"train_loss": -9.220003128051758, "global_step": 84609, "epoch": 503} {"train_loss": -9.344593048095703, "global_step": 84610, "epoch": 503} {"train_loss": -9.345869064331055, "global_step": 84611, "epoch": 503} {"train_loss": -9.120168685913086, "global_step": 84612, "epoch": 503} {"train_loss": -9.276926040649414, "global_step": 84613, "epoch": 503} {"train_loss": -9.32384204864502, "global_step": 84614, "epoch": 503} {"train_loss": -9.27534008026123, "global_step": 84615, "epoch": 503} {"train_loss": -9.227060317993164, "global_step": 84616, "epoch": 503} {"train_loss": -9.207056045532227, "global_step": 84617, "epoch": 503} {"train_loss": -9.476356506347656, "global_step": 84618, "epoch": 503} {"train_loss": -9.192018508911133, "global_step": 84619, "epoch": 503} {"train_loss": -9.528282165527344, "global_step": 84620, "epoch": 503} {"train_loss": -9.525674819946289, "global_step": 84621, "epoch": 503} {"train_loss": -9.420661926269531, "global_step": 84622, "epoch": 503} {"train_loss": -9.375953674316406, "global_step": 84623, "epoch": 503} {"train_loss": -9.457046508789062, "global_step": 84624, "epoch": 503} {"train_loss": -9.133074760437012, "global_step": 84625, "epoch": 503} {"train_loss": -9.096000671386719, "global_step": 84626, "epoch": 503} {"train_loss": -9.634716033935547, "global_step": 84627, "epoch": 503} {"train_loss": -9.449682235717773, "global_step": 84628, "epoch": 503} {"train_loss": -9.397603034973145, "global_step": 84629, "epoch": 503} {"train_loss": -9.188600540161133, "global_step": 84630, "epoch": 503} {"train_loss": -9.407649993896484, "global_step": 84631, "epoch": 503} {"train_loss": -9.36648941040039, "global_step": 84632, "epoch": 503} {"train_loss": -9.359235763549805, "global_step": 84633, "epoch": 503} {"train_loss": -9.226693153381348, "global_step": 84634, "epoch": 503} {"train_loss": -9.342674255371094, "global_step": 84635, "epoch": 503} {"train_loss": -9.207576751708984, "global_step": 84636, "epoch": 503} {"train_loss": -9.160176277160645, "global_step": 84637, "epoch": 503} {"train_loss": -9.35469913482666, "global_step": 84638, "epoch": 503} {"train_loss": -9.225370407104492, "global_step": 84639, "epoch": 503} {"train_loss": -9.489842414855957, "global_step": 84640, "epoch": 503} {"train_loss": -9.130592346191406, "global_step": 84641, "epoch": 503} {"train_loss": -9.442825317382812, "global_step": 84642, "epoch": 503} {"train_loss": -9.433841705322266, "global_step": 84643, "epoch": 503} {"train_loss": -9.163562774658203, "global_step": 84644, "epoch": 503} {"train_loss": -9.51816177368164, "global_step": 84645, "epoch": 503} {"train_loss": -9.379501342773438, "global_step": 84646, "epoch": 503} {"train_loss": -9.374532699584961, "global_step": 84647, "epoch": 503} {"train_loss": -9.30340576171875, "global_step": 84648, "epoch": 503} {"train_loss": -9.104523658752441, "global_step": 84649, "epoch": 503} {"train_loss": -9.095507621765137, "global_step": 84650, "epoch": 503} {"train_loss": -9.38477611541748, "global_step": 84651, "epoch": 503} {"train_loss": -9.262229919433594, "global_step": 84652, "epoch": 503} {"train_loss": -9.197481155395508, "global_step": 84653, "epoch": 503} {"train_loss": -9.066410064697266, "global_step": 84654, "epoch": 503} {"train_loss": -8.940627098083496, "global_step": 84655, "epoch": 503} {"train_loss": -9.318403244018555, "global_step": 84656, "epoch": 503} {"train_loss": -8.992773056030273, "global_step": 84657, "epoch": 503} {"train_loss": -9.148881912231445, "global_step": 84658, "epoch": 503} {"train_loss": -9.11473274230957, "global_step": 84659, "epoch": 503} {"train_loss": -9.017366409301758, "global_step": 84660, "epoch": 503} {"train_loss": -9.111886978149414, "global_step": 84661, "epoch": 503} {"train_loss": -9.098588943481445, "global_step": 84662, "epoch": 503} {"train_loss": -9.055656433105469, "global_step": 84663, "epoch": 503} {"train_loss": -8.892056465148926, "global_step": 84664, "epoch": 503} {"train_loss": -9.050800323486328, "global_step": 84665, "epoch": 503} {"train_loss": -9.182611465454102, "global_step": 84666, "epoch": 503} {"train_loss": -9.19495964050293, "global_step": 84667, "epoch": 503} {"train_loss": -8.922809600830078, "global_step": 84668, "epoch": 503} {"train_loss": -8.918475151062012, "global_step": 84669, "epoch": 503} {"train_loss": -9.23996639251709, "global_step": 84670, "epoch": 503} {"train_loss": -9.237568832579113, "global_step": 84671, "epoch": 503, "val_loss": 199102.703125} {"train_loss": -9.31208324432373, "global_step": 84672, "epoch": 504} {"train_loss": -9.303335189819336, "global_step": 84673, "epoch": 504} {"train_loss": -9.153079986572266, "global_step": 84674, "epoch": 504} {"train_loss": -9.058012008666992, "global_step": 84675, "epoch": 504} {"train_loss": -9.192193984985352, "global_step": 84676, "epoch": 504} {"train_loss": -9.282947540283203, "global_step": 84677, "epoch": 504} {"train_loss": -9.35287094116211, "global_step": 84678, "epoch": 504} {"train_loss": -9.297266006469727, "global_step": 84679, "epoch": 504} {"train_loss": -9.459516525268555, "global_step": 84680, "epoch": 504} {"train_loss": -9.519299507141113, "global_step": 84681, "epoch": 504} {"train_loss": -9.415059089660645, "global_step": 84682, "epoch": 504} {"train_loss": -9.38686752319336, "global_step": 84683, "epoch": 504} {"train_loss": -9.201042175292969, "global_step": 84684, "epoch": 504} {"train_loss": -9.089960098266602, "global_step": 84685, "epoch": 504} {"train_loss": -9.424930572509766, "global_step": 84686, "epoch": 504} {"train_loss": -9.489013671875, "global_step": 84687, "epoch": 504} {"train_loss": -9.503121376037598, "global_step": 84688, "epoch": 504} {"train_loss": -9.38994026184082, "global_step": 84689, "epoch": 504} {"train_loss": -9.47572135925293, "global_step": 84690, "epoch": 504} {"train_loss": -9.397192001342773, "global_step": 84691, "epoch": 504} {"train_loss": -9.512224197387695, "global_step": 84692, "epoch": 504} {"train_loss": -9.470144271850586, "global_step": 84693, "epoch": 504} {"train_loss": -9.530165672302246, "global_step": 84694, "epoch": 504} {"train_loss": -9.274574279785156, "global_step": 84695, "epoch": 504} {"train_loss": -9.619382858276367, "global_step": 84696, "epoch": 504} {"train_loss": -9.451746940612793, "global_step": 84697, "epoch": 504} {"train_loss": -9.17673110961914, "global_step": 84698, "epoch": 504} {"train_loss": -9.33595085144043, "global_step": 84699, "epoch": 504} {"train_loss": -9.6659517288208, "global_step": 84700, "epoch": 504} {"train_loss": -9.526540756225586, "global_step": 84701, "epoch": 504} {"train_loss": -9.450510025024414, "global_step": 84702, "epoch": 504} {"train_loss": -9.725522994995117, "global_step": 84703, "epoch": 504} {"train_loss": -9.674320220947266, "global_step": 84704, "epoch": 504} {"train_loss": -9.429078102111816, "global_step": 84705, "epoch": 504} {"train_loss": -9.704280853271484, "global_step": 84706, "epoch": 504} {"train_loss": -9.618902206420898, "global_step": 84707, "epoch": 504} {"train_loss": -9.567835807800293, "global_step": 84708, "epoch": 504} {"train_loss": -9.421781539916992, "global_step": 84709, "epoch": 504} {"train_loss": -9.299230575561523, "global_step": 84710, "epoch": 504} {"train_loss": -9.301225662231445, "global_step": 84711, "epoch": 504} {"train_loss": -9.291923522949219, "global_step": 84712, "epoch": 504} {"train_loss": -9.306227684020996, "global_step": 84713, "epoch": 504} {"train_loss": -9.638137817382812, "global_step": 84714, "epoch": 504} {"train_loss": -9.567033767700195, "global_step": 84715, "epoch": 504} {"train_loss": -9.447136878967285, "global_step": 84716, "epoch": 504} {"train_loss": -9.265092849731445, "global_step": 84717, "epoch": 504} {"train_loss": -9.48427963256836, "global_step": 84718, "epoch": 504} {"train_loss": -9.220368385314941, "global_step": 84719, "epoch": 504} {"train_loss": -9.302338600158691, "global_step": 84720, "epoch": 504} {"train_loss": -9.403456687927246, "global_step": 84721, "epoch": 504} {"train_loss": -9.14785385131836, "global_step": 84722, "epoch": 504} {"train_loss": -9.301542282104492, "global_step": 84723, "epoch": 504} {"train_loss": -9.177356719970703, "global_step": 84724, "epoch": 504} {"train_loss": -9.230682373046875, "global_step": 84725, "epoch": 504} {"train_loss": -9.24605941772461, "global_step": 84726, "epoch": 504} {"train_loss": -9.201997756958008, "global_step": 84727, "epoch": 504} {"train_loss": -9.32419490814209, "global_step": 84728, "epoch": 504} {"train_loss": -9.38487434387207, "global_step": 84729, "epoch": 504} {"train_loss": -9.136835098266602, "global_step": 84730, "epoch": 504} {"train_loss": -9.49799633026123, "global_step": 84731, "epoch": 504} {"train_loss": -9.1729736328125, "global_step": 84732, "epoch": 504} {"train_loss": -9.258098602294922, "global_step": 84733, "epoch": 504} {"train_loss": -9.018089294433594, "global_step": 84734, "epoch": 504} {"train_loss": -9.412729263305664, "global_step": 84735, "epoch": 504} {"train_loss": -9.00103759765625, "global_step": 84736, "epoch": 504} {"train_loss": -8.863214492797852, "global_step": 84737, "epoch": 504} {"train_loss": -8.84599781036377, "global_step": 84738, "epoch": 504} {"train_loss": -8.843013763427734, "global_step": 84739, "epoch": 504} {"train_loss": -9.298559188842773, "global_step": 84740, "epoch": 504} {"train_loss": -8.703313827514648, "global_step": 84741, "epoch": 504} {"train_loss": -9.039917945861816, "global_step": 84742, "epoch": 504} {"train_loss": -9.060100555419922, "global_step": 84743, "epoch": 504} {"train_loss": -9.063413619995117, "global_step": 84744, "epoch": 504} {"train_loss": -8.953254699707031, "global_step": 84745, "epoch": 504} {"train_loss": -8.940732955932617, "global_step": 84746, "epoch": 504} {"train_loss": -9.099896430969238, "global_step": 84747, "epoch": 504} {"train_loss": -8.796333312988281, "global_step": 84748, "epoch": 504} {"train_loss": -8.875927925109863, "global_step": 84749, "epoch": 504} {"train_loss": -9.180289268493652, "global_step": 84750, "epoch": 504} {"train_loss": -9.137205123901367, "global_step": 84751, "epoch": 504} {"train_loss": -9.374786376953125, "global_step": 84752, "epoch": 504} {"train_loss": -9.276224136352539, "global_step": 84753, "epoch": 504} {"train_loss": -9.303997039794922, "global_step": 84754, "epoch": 504} {"train_loss": -9.45345401763916, "global_step": 84755, "epoch": 504} {"train_loss": -9.292464256286621, "global_step": 84756, "epoch": 504} {"train_loss": -9.417420387268066, "global_step": 84757, "epoch": 504} {"train_loss": -9.323236465454102, "global_step": 84758, "epoch": 504} {"train_loss": -9.41325569152832, "global_step": 84759, "epoch": 504} {"train_loss": -9.311508178710938, "global_step": 84760, "epoch": 504} {"train_loss": -9.560043334960938, "global_step": 84761, "epoch": 504} {"train_loss": -9.426681518554688, "global_step": 84762, "epoch": 504} {"train_loss": -9.23604679107666, "global_step": 84763, "epoch": 504} {"train_loss": -9.270454406738281, "global_step": 84764, "epoch": 504} {"train_loss": -9.619802474975586, "global_step": 84765, "epoch": 504} {"train_loss": -9.300504684448242, "global_step": 84766, "epoch": 504} {"train_loss": -9.239744186401367, "global_step": 84767, "epoch": 504} {"train_loss": -9.394886016845703, "global_step": 84768, "epoch": 504} {"train_loss": -9.529809951782227, "global_step": 84769, "epoch": 504} {"train_loss": -9.489994049072266, "global_step": 84770, "epoch": 504} {"train_loss": -9.20132827758789, "global_step": 84771, "epoch": 504} {"train_loss": -9.538204193115234, "global_step": 84772, "epoch": 504} {"train_loss": -9.001771926879883, "global_step": 84773, "epoch": 504} {"train_loss": -9.640952110290527, "global_step": 84774, "epoch": 504} {"train_loss": -8.959964752197266, "global_step": 84775, "epoch": 504} {"train_loss": -9.074459075927734, "global_step": 84776, "epoch": 504} {"train_loss": -9.04936695098877, "global_step": 84777, "epoch": 504} {"train_loss": -8.954046249389648, "global_step": 84778, "epoch": 504} {"train_loss": -9.049982070922852, "global_step": 84779, "epoch": 504} {"train_loss": -8.917259216308594, "global_step": 84780, "epoch": 504} {"train_loss": -9.104900360107422, "global_step": 84781, "epoch": 504} {"train_loss": -9.041532516479492, "global_step": 84782, "epoch": 504} {"train_loss": -9.170042037963867, "global_step": 84783, "epoch": 504} {"train_loss": -9.170393943786621, "global_step": 84784, "epoch": 504} {"train_loss": -9.077322006225586, "global_step": 84785, "epoch": 504} {"train_loss": -8.946924209594727, "global_step": 84786, "epoch": 504} {"train_loss": -9.254905700683594, "global_step": 84787, "epoch": 504} {"train_loss": -8.976140975952148, "global_step": 84788, "epoch": 504} {"train_loss": -9.294929504394531, "global_step": 84789, "epoch": 504} {"train_loss": -9.379388809204102, "global_step": 84790, "epoch": 504} {"train_loss": -9.12321662902832, "global_step": 84791, "epoch": 504} {"train_loss": -9.214815139770508, "global_step": 84792, "epoch": 504} {"train_loss": -9.203104019165039, "global_step": 84793, "epoch": 504} {"train_loss": -9.176286697387695, "global_step": 84794, "epoch": 504} {"train_loss": -9.16022777557373, "global_step": 84795, "epoch": 504} {"train_loss": -9.343130111694336, "global_step": 84796, "epoch": 504} {"train_loss": -8.896065711975098, "global_step": 84797, "epoch": 504} {"train_loss": -9.266290664672852, "global_step": 84798, "epoch": 504} {"train_loss": -9.228069305419922, "global_step": 84799, "epoch": 504} {"train_loss": -9.114046096801758, "global_step": 84800, "epoch": 504} {"train_loss": -9.247201919555664, "global_step": 84801, "epoch": 504} {"train_loss": -9.186726570129395, "global_step": 84802, "epoch": 504} {"train_loss": -9.415977478027344, "global_step": 84803, "epoch": 504} {"train_loss": -9.460336685180664, "global_step": 84804, "epoch": 504} {"train_loss": -9.291825294494629, "global_step": 84805, "epoch": 504} {"train_loss": -9.344776153564453, "global_step": 84806, "epoch": 504} {"train_loss": -9.130745887756348, "global_step": 84807, "epoch": 504} {"train_loss": -9.150541305541992, "global_step": 84808, "epoch": 504} {"train_loss": -9.251628875732422, "global_step": 84809, "epoch": 504} {"train_loss": -9.138887405395508, "global_step": 84810, "epoch": 504} {"train_loss": -9.5106201171875, "global_step": 84811, "epoch": 504} {"train_loss": -9.348125457763672, "global_step": 84812, "epoch": 504} {"train_loss": -9.425668716430664, "global_step": 84813, "epoch": 504} {"train_loss": -9.275701522827148, "global_step": 84814, "epoch": 504} {"train_loss": -9.148061752319336, "global_step": 84815, "epoch": 504} {"train_loss": -9.4443359375, "global_step": 84816, "epoch": 504} {"train_loss": -9.323887825012207, "global_step": 84817, "epoch": 504} {"train_loss": -9.161561965942383, "global_step": 84818, "epoch": 504} {"train_loss": -9.195183753967285, "global_step": 84819, "epoch": 504} {"train_loss": -9.272515296936035, "global_step": 84820, "epoch": 504} {"train_loss": -9.047809600830078, "global_step": 84821, "epoch": 504} {"train_loss": -9.17816162109375, "global_step": 84822, "epoch": 504} {"train_loss": -9.289597511291504, "global_step": 84823, "epoch": 504} {"train_loss": -9.42404556274414, "global_step": 84824, "epoch": 504} {"train_loss": -9.091629028320312, "global_step": 84825, "epoch": 504} {"train_loss": -9.178946495056152, "global_step": 84826, "epoch": 504} {"train_loss": -9.202630043029785, "global_step": 84827, "epoch": 504} {"train_loss": -8.818283081054688, "global_step": 84828, "epoch": 504} {"train_loss": -9.554474830627441, "global_step": 84829, "epoch": 504} {"train_loss": -8.98477840423584, "global_step": 84830, "epoch": 504} {"train_loss": -9.160467147827148, "global_step": 84831, "epoch": 504} {"train_loss": -9.042154312133789, "global_step": 84832, "epoch": 504} {"train_loss": -9.248449325561523, "global_step": 84833, "epoch": 504} {"train_loss": -8.859159469604492, "global_step": 84834, "epoch": 504} {"train_loss": -9.191910743713379, "global_step": 84835, "epoch": 504} {"train_loss": -9.152652740478516, "global_step": 84836, "epoch": 504} {"train_loss": -9.205422401428223, "global_step": 84837, "epoch": 504} {"train_loss": -9.105777740478516, "global_step": 84838, "epoch": 504} {"train_loss": -9.261417229970297, "global_step": 84839, "epoch": 504, "val_loss": 199243.84375} {"train_loss": -9.00442123413086, "global_step": 84840, "epoch": 505} {"train_loss": -9.23155689239502, "global_step": 84841, "epoch": 505} {"train_loss": -9.367305755615234, "global_step": 84842, "epoch": 505} {"train_loss": -9.354409217834473, "global_step": 84843, "epoch": 505} {"train_loss": -9.19175910949707, "global_step": 84844, "epoch": 505} {"train_loss": -9.220393180847168, "global_step": 84845, "epoch": 505} {"train_loss": -9.192832946777344, "global_step": 84846, "epoch": 505} {"train_loss": -9.231048583984375, "global_step": 84847, "epoch": 505} {"train_loss": -9.28642463684082, "global_step": 84848, "epoch": 505} {"train_loss": -9.276925086975098, "global_step": 84849, "epoch": 505} {"train_loss": -9.564038276672363, "global_step": 84850, "epoch": 505} {"train_loss": -9.47227668762207, "global_step": 84851, "epoch": 505} {"train_loss": -9.345439910888672, "global_step": 84852, "epoch": 505} {"train_loss": -9.292985916137695, "global_step": 84853, "epoch": 505} {"train_loss": -9.075273513793945, "global_step": 84854, "epoch": 505} {"train_loss": -9.491891860961914, "global_step": 84855, "epoch": 505} {"train_loss": -9.019901275634766, "global_step": 84856, "epoch": 505} {"train_loss": -9.58983039855957, "global_step": 84857, "epoch": 505} {"train_loss": -9.385011672973633, "global_step": 84858, "epoch": 505} {"train_loss": -9.50561809539795, "global_step": 84859, "epoch": 505} {"train_loss": -9.333447456359863, "global_step": 84860, "epoch": 505} {"train_loss": -9.224705696105957, "global_step": 84861, "epoch": 505} {"train_loss": -9.44997787475586, "global_step": 84862, "epoch": 505} {"train_loss": -9.45152473449707, "global_step": 84863, "epoch": 505} {"train_loss": -9.435344696044922, "global_step": 84864, "epoch": 505} {"train_loss": -9.376092910766602, "global_step": 84865, "epoch": 505} {"train_loss": -9.175933837890625, "global_step": 84866, "epoch": 505} {"train_loss": -9.393704414367676, "global_step": 84867, "epoch": 505} {"train_loss": -9.172286987304688, "global_step": 84868, "epoch": 505} {"train_loss": -9.427675247192383, "global_step": 84869, "epoch": 505} {"train_loss": -8.989542007446289, "global_step": 84870, "epoch": 505} {"train_loss": -9.045604705810547, "global_step": 84871, "epoch": 505} {"train_loss": -9.314019203186035, "global_step": 84872, "epoch": 505} {"train_loss": -9.003300666809082, "global_step": 84873, "epoch": 505} {"train_loss": -9.600159645080566, "global_step": 84874, "epoch": 505} {"train_loss": -9.206903457641602, "global_step": 84875, "epoch": 505} {"train_loss": -9.362775802612305, "global_step": 84876, "epoch": 505} {"train_loss": -9.428312301635742, "global_step": 84877, "epoch": 505} {"train_loss": -9.328288078308105, "global_step": 84878, "epoch": 505} {"train_loss": -9.405736923217773, "global_step": 84879, "epoch": 505} {"train_loss": -9.417802810668945, "global_step": 84880, "epoch": 505} {"train_loss": -9.185399055480957, "global_step": 84881, "epoch": 505} {"train_loss": -8.765161514282227, "global_step": 84882, "epoch": 505} {"train_loss": -9.418134689331055, "global_step": 84883, "epoch": 505} {"train_loss": -9.333988189697266, "global_step": 84884, "epoch": 505} {"train_loss": -9.579202651977539, "global_step": 84885, "epoch": 505} {"train_loss": -9.30470085144043, "global_step": 84886, "epoch": 505} {"train_loss": -9.090904235839844, "global_step": 84887, "epoch": 505} {"train_loss": -9.150313377380371, "global_step": 84888, "epoch": 505} {"train_loss": -9.23441219329834, "global_step": 84889, "epoch": 505} {"train_loss": -9.326108932495117, "global_step": 84890, "epoch": 505} {"train_loss": -9.025586128234863, "global_step": 84891, "epoch": 505} {"train_loss": -9.173654556274414, "global_step": 84892, "epoch": 505} {"train_loss": -9.09814453125, "global_step": 84893, "epoch": 505} {"train_loss": -9.090564727783203, "global_step": 84894, "epoch": 505} {"train_loss": -9.305730819702148, "global_step": 84895, "epoch": 505} {"train_loss": -9.421716690063477, "global_step": 84896, "epoch": 505} {"train_loss": -9.177967071533203, "global_step": 84897, "epoch": 505} {"train_loss": -9.461634635925293, "global_step": 84898, "epoch": 505} {"train_loss": -9.343308448791504, "global_step": 84899, "epoch": 505} {"train_loss": -9.446977615356445, "global_step": 84900, "epoch": 505} {"train_loss": -9.22630786895752, "global_step": 84901, "epoch": 505} {"train_loss": -9.457308769226074, "global_step": 84902, "epoch": 505} {"train_loss": -9.178248405456543, "global_step": 84903, "epoch": 505} {"train_loss": -9.501232147216797, "global_step": 84904, "epoch": 505} {"train_loss": -9.445703506469727, "global_step": 84905, "epoch": 505} {"train_loss": -9.524190902709961, "global_step": 84906, "epoch": 505} {"train_loss": -9.538712501525879, "global_step": 84907, "epoch": 505} {"train_loss": -9.602340698242188, "global_step": 84908, "epoch": 505} {"train_loss": -9.486526489257812, "global_step": 84909, "epoch": 505} {"train_loss": -9.702348709106445, "global_step": 84910, "epoch": 505} {"train_loss": -9.375932693481445, "global_step": 84911, "epoch": 505} {"train_loss": -9.486668586730957, "global_step": 84912, "epoch": 505} {"train_loss": -9.557842254638672, "global_step": 84913, "epoch": 505} {"train_loss": -9.526933670043945, "global_step": 84914, "epoch": 505} {"train_loss": -9.285791397094727, "global_step": 84915, "epoch": 505} {"train_loss": -9.281698226928711, "global_step": 84916, "epoch": 505} {"train_loss": -9.546977996826172, "global_step": 84917, "epoch": 505} {"train_loss": -9.36202621459961, "global_step": 84918, "epoch": 505} {"train_loss": -9.160392761230469, "global_step": 84919, "epoch": 505} {"train_loss": -9.3553466796875, "global_step": 84920, "epoch": 505} {"train_loss": -9.421976089477539, "global_step": 84921, "epoch": 505} {"train_loss": -9.213849067687988, "global_step": 84922, "epoch": 505} {"train_loss": -9.516561508178711, "global_step": 84923, "epoch": 505} {"train_loss": -9.231636047363281, "global_step": 84924, "epoch": 505} {"train_loss": -9.497198104858398, "global_step": 84925, "epoch": 505} {"train_loss": -9.081927299499512, "global_step": 84926, "epoch": 505} {"train_loss": -9.50157356262207, "global_step": 84927, "epoch": 505} {"train_loss": -9.555328369140625, "global_step": 84928, "epoch": 505} {"train_loss": -9.610212326049805, "global_step": 84929, "epoch": 505} {"train_loss": -9.5552978515625, "global_step": 84930, "epoch": 505} {"train_loss": -9.649815559387207, "global_step": 84931, "epoch": 505} {"train_loss": -9.296735763549805, "global_step": 84932, "epoch": 505} {"train_loss": -9.424217224121094, "global_step": 84933, "epoch": 505} {"train_loss": -9.464311599731445, "global_step": 84934, "epoch": 505} {"train_loss": -9.606584548950195, "global_step": 84935, "epoch": 505} {"train_loss": -9.080560684204102, "global_step": 84936, "epoch": 505} {"train_loss": -9.438345909118652, "global_step": 84937, "epoch": 505} {"train_loss": -9.223451614379883, "global_step": 84938, "epoch": 505} {"train_loss": -9.297586441040039, "global_step": 84939, "epoch": 505} {"train_loss": -9.159170150756836, "global_step": 84940, "epoch": 505} {"train_loss": -9.402069091796875, "global_step": 84941, "epoch": 505} {"train_loss": -9.315672874450684, "global_step": 84942, "epoch": 505} {"train_loss": -9.120920181274414, "global_step": 84943, "epoch": 505} {"train_loss": -9.028369903564453, "global_step": 84944, "epoch": 505} {"train_loss": -8.919683456420898, "global_step": 84945, "epoch": 505} {"train_loss": -8.936845779418945, "global_step": 84946, "epoch": 505} {"train_loss": -9.169038772583008, "global_step": 84947, "epoch": 505} {"train_loss": -8.920635223388672, "global_step": 84948, "epoch": 505} {"train_loss": -8.948213577270508, "global_step": 84949, "epoch": 505} {"train_loss": -9.294261932373047, "global_step": 84950, "epoch": 505} {"train_loss": -9.134529113769531, "global_step": 84951, "epoch": 505} {"train_loss": -9.398337364196777, "global_step": 84952, "epoch": 505} {"train_loss": -9.367627143859863, "global_step": 84953, "epoch": 505} {"train_loss": -9.410137176513672, "global_step": 84954, "epoch": 505} {"train_loss": -9.236665725708008, "global_step": 84955, "epoch": 505} {"train_loss": -9.275664329528809, "global_step": 84956, "epoch": 505} {"train_loss": -9.20229721069336, "global_step": 84957, "epoch": 505} {"train_loss": -9.430892944335938, "global_step": 84958, "epoch": 505} {"train_loss": -9.240540504455566, "global_step": 84959, "epoch": 505} {"train_loss": -9.31055736541748, "global_step": 84960, "epoch": 505} {"train_loss": -9.284784317016602, "global_step": 84961, "epoch": 505} {"train_loss": -9.057660102844238, "global_step": 84962, "epoch": 505} {"train_loss": -9.481797218322754, "global_step": 84963, "epoch": 505} {"train_loss": -9.313727378845215, "global_step": 84964, "epoch": 505} {"train_loss": -9.347501754760742, "global_step": 84965, "epoch": 505} {"train_loss": -9.475333213806152, "global_step": 84966, "epoch": 505} {"train_loss": -8.941163063049316, "global_step": 84967, "epoch": 505} {"train_loss": -9.303403854370117, "global_step": 84968, "epoch": 505} {"train_loss": -9.159302711486816, "global_step": 84969, "epoch": 505} {"train_loss": -9.256580352783203, "global_step": 84970, "epoch": 505} {"train_loss": -9.307104110717773, "global_step": 84971, "epoch": 505} {"train_loss": -9.034497261047363, "global_step": 84972, "epoch": 505} {"train_loss": -9.14501953125, "global_step": 84973, "epoch": 505} {"train_loss": -8.971243858337402, "global_step": 84974, "epoch": 505} {"train_loss": -9.045215606689453, "global_step": 84975, "epoch": 505} {"train_loss": -9.01167106628418, "global_step": 84976, "epoch": 505} {"train_loss": -9.203916549682617, "global_step": 84977, "epoch": 505} {"train_loss": -9.33029556274414, "global_step": 84978, "epoch": 505} {"train_loss": -9.313315391540527, "global_step": 84979, "epoch": 505} {"train_loss": -9.16796588897705, "global_step": 84980, "epoch": 505} {"train_loss": -9.1726655960083, "global_step": 84981, "epoch": 505} {"train_loss": -8.558412551879883, "global_step": 84982, "epoch": 505} {"train_loss": -9.08707046508789, "global_step": 84983, "epoch": 505} {"train_loss": -8.747673034667969, "global_step": 84984, "epoch": 505} {"train_loss": -9.112003326416016, "global_step": 84985, "epoch": 505} {"train_loss": -9.125885009765625, "global_step": 84986, "epoch": 505} {"train_loss": -9.056398391723633, "global_step": 84987, "epoch": 505} {"train_loss": -9.286262512207031, "global_step": 84988, "epoch": 505} {"train_loss": -9.275827407836914, "global_step": 84989, "epoch": 505} {"train_loss": -9.00634765625, "global_step": 84990, "epoch": 505} {"train_loss": -9.07075023651123, "global_step": 84991, "epoch": 505} {"train_loss": -9.407325744628906, "global_step": 84992, "epoch": 505} {"train_loss": -9.303232192993164, "global_step": 84993, "epoch": 505} {"train_loss": -9.28287124633789, "global_step": 84994, "epoch": 505} {"train_loss": -9.003778457641602, "global_step": 84995, "epoch": 505} {"train_loss": -9.27273178100586, "global_step": 84996, "epoch": 505} {"train_loss": -9.149998664855957, "global_step": 84997, "epoch": 505} {"train_loss": -8.96474552154541, "global_step": 84998, "epoch": 505} {"train_loss": -9.531488418579102, "global_step": 84999, "epoch": 505} {"train_loss": -9.128929138183594, "global_step": 85000, "epoch": 505} {"train_loss": -9.290802001953125, "global_step": 85001, "epoch": 505} {"train_loss": -9.257431030273438, "global_step": 85002, "epoch": 505} {"train_loss": -9.39070987701416, "global_step": 85003, "epoch": 505} {"train_loss": -9.242212295532227, "global_step": 85004, "epoch": 505} {"train_loss": -9.280075073242188, "global_step": 85005, "epoch": 505} {"train_loss": -9.083909034729004, "global_step": 85006, "epoch": 505} {"train_loss": -9.277326481682914, "global_step": 85007, "epoch": 505, "val_loss": 199010.015625, "train_action_mse_error": 6.810710430145264} {"train_loss": -8.840513229370117, "global_step": 85008, "epoch": 506} {"train_loss": -9.297002792358398, "global_step": 85009, "epoch": 506} {"train_loss": -9.45711898803711, "global_step": 85010, "epoch": 506} {"train_loss": -8.977644920349121, "global_step": 85011, "epoch": 506} {"train_loss": -9.321563720703125, "global_step": 85012, "epoch": 506} {"train_loss": -9.19788932800293, "global_step": 85013, "epoch": 506} {"train_loss": -9.07686710357666, "global_step": 85014, "epoch": 506} {"train_loss": -9.267455101013184, "global_step": 85015, "epoch": 506} {"train_loss": -8.962212562561035, "global_step": 85016, "epoch": 506} {"train_loss": -8.980113983154297, "global_step": 85017, "epoch": 506} {"train_loss": -8.862127304077148, "global_step": 85018, "epoch": 506} {"train_loss": -8.937925338745117, "global_step": 85019, "epoch": 506} {"train_loss": -8.795256614685059, "global_step": 85020, "epoch": 506} {"train_loss": -9.216944694519043, "global_step": 85021, "epoch": 506} {"train_loss": -9.198766708374023, "global_step": 85022, "epoch": 506} {"train_loss": -8.8934326171875, "global_step": 85023, "epoch": 506} {"train_loss": -9.327893257141113, "global_step": 85024, "epoch": 506} {"train_loss": -9.154194831848145, "global_step": 85025, "epoch": 506} {"train_loss": -9.110037803649902, "global_step": 85026, "epoch": 506} {"train_loss": -9.06104850769043, "global_step": 85027, "epoch": 506} {"train_loss": -9.356792449951172, "global_step": 85028, "epoch": 506} {"train_loss": -9.363300323486328, "global_step": 85029, "epoch": 506} {"train_loss": -9.345218658447266, "global_step": 85030, "epoch": 506} {"train_loss": -9.461297988891602, "global_step": 85031, "epoch": 506} {"train_loss": -9.376827239990234, "global_step": 85032, "epoch": 506} {"train_loss": -9.414045333862305, "global_step": 85033, "epoch": 506} {"train_loss": -9.31324577331543, "global_step": 85034, "epoch": 506} {"train_loss": -9.41225528717041, "global_step": 85035, "epoch": 506} {"train_loss": -9.332093238830566, "global_step": 85036, "epoch": 506} {"train_loss": -9.450154304504395, "global_step": 85037, "epoch": 506} {"train_loss": -9.269267082214355, "global_step": 85038, "epoch": 506} {"train_loss": -9.550376892089844, "global_step": 85039, "epoch": 506} {"train_loss": -9.490870475769043, "global_step": 85040, "epoch": 506} {"train_loss": -9.27413558959961, "global_step": 85041, "epoch": 506} {"train_loss": -9.694070816040039, "global_step": 85042, "epoch": 506} {"train_loss": -9.435827255249023, "global_step": 85043, "epoch": 506} {"train_loss": -9.580581665039062, "global_step": 85044, "epoch": 506} {"train_loss": -9.508418083190918, "global_step": 85045, "epoch": 506} {"train_loss": -9.30722713470459, "global_step": 85046, "epoch": 506} {"train_loss": -9.6707763671875, "global_step": 85047, "epoch": 506} {"train_loss": -9.135217666625977, "global_step": 85048, "epoch": 506} {"train_loss": -9.546338081359863, "global_step": 85049, "epoch": 506} {"train_loss": -8.906206130981445, "global_step": 85050, "epoch": 506} {"train_loss": -9.35031795501709, "global_step": 85051, "epoch": 506} {"train_loss": -9.34583854675293, "global_step": 85052, "epoch": 506} {"train_loss": -9.615913391113281, "global_step": 85053, "epoch": 506} {"train_loss": -9.07918930053711, "global_step": 85054, "epoch": 506} {"train_loss": -9.608270645141602, "global_step": 85055, "epoch": 506} {"train_loss": -9.526938438415527, "global_step": 85056, "epoch": 506} {"train_loss": -9.277853012084961, "global_step": 85057, "epoch": 506} {"train_loss": -9.29921817779541, "global_step": 85058, "epoch": 506} {"train_loss": -9.521442413330078, "global_step": 85059, "epoch": 506} {"train_loss": -9.454681396484375, "global_step": 85060, "epoch": 506} {"train_loss": -9.613749504089355, "global_step": 85061, "epoch": 506} {"train_loss": -9.251469612121582, "global_step": 85062, "epoch": 506} {"train_loss": -9.342727661132812, "global_step": 85063, "epoch": 506} {"train_loss": -9.298404693603516, "global_step": 85064, "epoch": 506} {"train_loss": -9.186624526977539, "global_step": 85065, "epoch": 506} {"train_loss": -9.336603164672852, "global_step": 85066, "epoch": 506} {"train_loss": -8.90469741821289, "global_step": 85067, "epoch": 506} {"train_loss": -9.199871063232422, "global_step": 85068, "epoch": 506} {"train_loss": -9.16961669921875, "global_step": 85069, "epoch": 506} {"train_loss": -9.069080352783203, "global_step": 85070, "epoch": 506} {"train_loss": -9.20667839050293, "global_step": 85071, "epoch": 506} {"train_loss": -9.280200958251953, "global_step": 85072, "epoch": 506} {"train_loss": -9.456842422485352, "global_step": 85073, "epoch": 506} {"train_loss": -9.447319984436035, "global_step": 85074, "epoch": 506} {"train_loss": -9.281072616577148, "global_step": 85075, "epoch": 506} {"train_loss": -9.340557098388672, "global_step": 85076, "epoch": 506} {"train_loss": -9.24504280090332, "global_step": 85077, "epoch": 506} {"train_loss": -9.351005554199219, "global_step": 85078, "epoch": 506} {"train_loss": -9.448854446411133, "global_step": 85079, "epoch": 506} {"train_loss": -9.458881378173828, "global_step": 85080, "epoch": 506} {"train_loss": -9.482084274291992, "global_step": 85081, "epoch": 506} {"train_loss": -9.238401412963867, "global_step": 85082, "epoch": 506} {"train_loss": -9.586387634277344, "global_step": 85083, "epoch": 506} {"train_loss": -9.50714111328125, "global_step": 85084, "epoch": 506} {"train_loss": -9.365367889404297, "global_step": 85085, "epoch": 506} {"train_loss": -9.389228820800781, "global_step": 85086, "epoch": 506} {"train_loss": -8.939897537231445, "global_step": 85087, "epoch": 506} {"train_loss": -9.241971969604492, "global_step": 85088, "epoch": 506} {"train_loss": -9.24262809753418, "global_step": 85089, "epoch": 506} {"train_loss": -9.305779457092285, "global_step": 85090, "epoch": 506} {"train_loss": -9.170108795166016, "global_step": 85091, "epoch": 506} {"train_loss": -9.049671173095703, "global_step": 85092, "epoch": 506} {"train_loss": -9.21803092956543, "global_step": 85093, "epoch": 506} {"train_loss": -9.29137134552002, "global_step": 85094, "epoch": 506} {"train_loss": -9.006964683532715, "global_step": 85095, "epoch": 506} {"train_loss": -9.457931518554688, "global_step": 85096, "epoch": 506} {"train_loss": -9.23310375213623, "global_step": 85097, "epoch": 506} {"train_loss": -9.31840705871582, "global_step": 85098, "epoch": 506} {"train_loss": -9.335671424865723, "global_step": 85099, "epoch": 506} {"train_loss": -9.284423828125, "global_step": 85100, "epoch": 506} {"train_loss": -9.220455169677734, "global_step": 85101, "epoch": 506} {"train_loss": -9.400609970092773, "global_step": 85102, "epoch": 506} {"train_loss": -9.292774200439453, "global_step": 85103, "epoch": 506} {"train_loss": -9.402881622314453, "global_step": 85104, "epoch": 506} {"train_loss": -9.402502059936523, "global_step": 85105, "epoch": 506} {"train_loss": -9.433426856994629, "global_step": 85106, "epoch": 506} {"train_loss": -9.361984252929688, "global_step": 85107, "epoch": 506} {"train_loss": -9.520970344543457, "global_step": 85108, "epoch": 506} {"train_loss": -9.371703147888184, "global_step": 85109, "epoch": 506} {"train_loss": -9.513175964355469, "global_step": 85110, "epoch": 506} {"train_loss": -9.387005805969238, "global_step": 85111, "epoch": 506} {"train_loss": -9.414203643798828, "global_step": 85112, "epoch": 506} {"train_loss": -9.108692169189453, "global_step": 85113, "epoch": 506} {"train_loss": -9.386311531066895, "global_step": 85114, "epoch": 506} {"train_loss": -9.173179626464844, "global_step": 85115, "epoch": 506} {"train_loss": -9.390811920166016, "global_step": 85116, "epoch": 506} {"train_loss": -9.382362365722656, "global_step": 85117, "epoch": 506} {"train_loss": -9.475643157958984, "global_step": 85118, "epoch": 506} {"train_loss": -9.322781562805176, "global_step": 85119, "epoch": 506} {"train_loss": -9.168798446655273, "global_step": 85120, "epoch": 506} {"train_loss": -9.405533790588379, "global_step": 85121, "epoch": 506} {"train_loss": -9.442550659179688, "global_step": 85122, "epoch": 506} {"train_loss": -9.305824279785156, "global_step": 85123, "epoch": 506} {"train_loss": -9.128955841064453, "global_step": 85124, "epoch": 506} {"train_loss": -9.172112464904785, "global_step": 85125, "epoch": 506} {"train_loss": -9.499471664428711, "global_step": 85126, "epoch": 506} {"train_loss": -9.196133613586426, "global_step": 85127, "epoch": 506} {"train_loss": -9.457799911499023, "global_step": 85128, "epoch": 506} {"train_loss": -9.256978034973145, "global_step": 85129, "epoch": 506} {"train_loss": -9.382197380065918, "global_step": 85130, "epoch": 506} {"train_loss": -9.297039031982422, "global_step": 85131, "epoch": 506} {"train_loss": -9.317878723144531, "global_step": 85132, "epoch": 506} {"train_loss": -9.334657669067383, "global_step": 85133, "epoch": 506} {"train_loss": -9.490974426269531, "global_step": 85134, "epoch": 506} {"train_loss": -9.189070701599121, "global_step": 85135, "epoch": 506} {"train_loss": -9.419351577758789, "global_step": 85136, "epoch": 506} {"train_loss": -9.257997512817383, "global_step": 85137, "epoch": 506} {"train_loss": -8.826826095581055, "global_step": 85138, "epoch": 506} {"train_loss": -9.389521598815918, "global_step": 85139, "epoch": 506} {"train_loss": -8.781778335571289, "global_step": 85140, "epoch": 506} {"train_loss": -9.323572158813477, "global_step": 85141, "epoch": 506} {"train_loss": -8.626049041748047, "global_step": 85142, "epoch": 506} {"train_loss": -8.733083724975586, "global_step": 85143, "epoch": 506} {"train_loss": -9.257521629333496, "global_step": 85144, "epoch": 506} {"train_loss": -9.142047882080078, "global_step": 85145, "epoch": 506} {"train_loss": -8.963134765625, "global_step": 85146, "epoch": 506} {"train_loss": -8.944623947143555, "global_step": 85147, "epoch": 506} {"train_loss": -8.955718994140625, "global_step": 85148, "epoch": 506} {"train_loss": -9.09909725189209, "global_step": 85149, "epoch": 506} {"train_loss": -9.022443771362305, "global_step": 85150, "epoch": 506} {"train_loss": -9.122978210449219, "global_step": 85151, "epoch": 506} {"train_loss": -9.318647384643555, "global_step": 85152, "epoch": 506} {"train_loss": -9.238637924194336, "global_step": 85153, "epoch": 506} {"train_loss": -9.102021217346191, "global_step": 85154, "epoch": 506} {"train_loss": -9.230560302734375, "global_step": 85155, "epoch": 506} {"train_loss": -9.243614196777344, "global_step": 85156, "epoch": 506} {"train_loss": -9.370622634887695, "global_step": 85157, "epoch": 506} {"train_loss": -9.311761856079102, "global_step": 85158, "epoch": 506} {"train_loss": -9.419971466064453, "global_step": 85159, "epoch": 506} {"train_loss": -9.418865203857422, "global_step": 85160, "epoch": 506} {"train_loss": -9.420576095581055, "global_step": 85161, "epoch": 506} {"train_loss": -9.532081604003906, "global_step": 85162, "epoch": 506} {"train_loss": -9.433018684387207, "global_step": 85163, "epoch": 506} {"train_loss": -9.437200546264648, "global_step": 85164, "epoch": 506} {"train_loss": -9.316584587097168, "global_step": 85165, "epoch": 506} {"train_loss": -9.386821746826172, "global_step": 85166, "epoch": 506} {"train_loss": -9.447396278381348, "global_step": 85167, "epoch": 506} {"train_loss": -9.360795974731445, "global_step": 85168, "epoch": 506} {"train_loss": -9.416482925415039, "global_step": 85169, "epoch": 506} {"train_loss": -9.668627738952637, "global_step": 85170, "epoch": 506} {"train_loss": -9.461477279663086, "global_step": 85171, "epoch": 506} {"train_loss": -9.478464126586914, "global_step": 85172, "epoch": 506} {"train_loss": -9.158859252929688, "global_step": 85173, "epoch": 506} {"train_loss": -9.323392868041992, "global_step": 85174, "epoch": 506} {"train_loss": -9.286919156710306, "global_step": 85175, "epoch": 506, "val_loss": 201049.03125} {"train_loss": -9.532891273498535, "global_step": 85176, "epoch": 507} {"train_loss": -9.313694953918457, "global_step": 85177, "epoch": 507} {"train_loss": -9.289546966552734, "global_step": 85178, "epoch": 507} {"train_loss": -9.284882545471191, "global_step": 85179, "epoch": 507} {"train_loss": -9.310257911682129, "global_step": 85180, "epoch": 507} {"train_loss": -9.384418487548828, "global_step": 85181, "epoch": 507} {"train_loss": -9.382307052612305, "global_step": 85182, "epoch": 507} {"train_loss": -9.43315315246582, "global_step": 85183, "epoch": 507} {"train_loss": -9.374053001403809, "global_step": 85184, "epoch": 507} {"train_loss": -9.409377098083496, "global_step": 85185, "epoch": 507} {"train_loss": -9.276349067687988, "global_step": 85186, "epoch": 507} {"train_loss": -9.55647087097168, "global_step": 85187, "epoch": 507} {"train_loss": -9.352743148803711, "global_step": 85188, "epoch": 507} {"train_loss": -9.216897010803223, "global_step": 85189, "epoch": 507} {"train_loss": -9.331033706665039, "global_step": 85190, "epoch": 507} {"train_loss": -9.324697494506836, "global_step": 85191, "epoch": 507} {"train_loss": -9.563587188720703, "global_step": 85192, "epoch": 507} {"train_loss": -9.318338394165039, "global_step": 85193, "epoch": 507} {"train_loss": -9.281621932983398, "global_step": 85194, "epoch": 507} {"train_loss": -9.385090827941895, "global_step": 85195, "epoch": 507} {"train_loss": -9.28546142578125, "global_step": 85196, "epoch": 507} {"train_loss": -9.299684524536133, "global_step": 85197, "epoch": 507} {"train_loss": -9.208410263061523, "global_step": 85198, "epoch": 507} {"train_loss": -9.019810676574707, "global_step": 85199, "epoch": 507} {"train_loss": -9.280998229980469, "global_step": 85200, "epoch": 507} {"train_loss": -9.09085750579834, "global_step": 85201, "epoch": 507} {"train_loss": -9.275924682617188, "global_step": 85202, "epoch": 507} {"train_loss": -9.356487274169922, "global_step": 85203, "epoch": 507} {"train_loss": -9.348653793334961, "global_step": 85204, "epoch": 507} {"train_loss": -9.144935607910156, "global_step": 85205, "epoch": 507} {"train_loss": -9.16978645324707, "global_step": 85206, "epoch": 507} {"train_loss": -9.371994972229004, "global_step": 85207, "epoch": 507} {"train_loss": -9.138916015625, "global_step": 85208, "epoch": 507} {"train_loss": -9.543843269348145, "global_step": 85209, "epoch": 507} {"train_loss": -9.18045425415039, "global_step": 85210, "epoch": 507} {"train_loss": -9.39213752746582, "global_step": 85211, "epoch": 507} {"train_loss": -9.27391242980957, "global_step": 85212, "epoch": 507} {"train_loss": -9.464265823364258, "global_step": 85213, "epoch": 507} {"train_loss": -8.980327606201172, "global_step": 85214, "epoch": 507} {"train_loss": -9.277166366577148, "global_step": 85215, "epoch": 507} {"train_loss": -8.957513809204102, "global_step": 85216, "epoch": 507} {"train_loss": -9.057348251342773, "global_step": 85217, "epoch": 507} {"train_loss": -9.261003494262695, "global_step": 85218, "epoch": 507} {"train_loss": -9.312752723693848, "global_step": 85219, "epoch": 507} {"train_loss": -9.08514404296875, "global_step": 85220, "epoch": 507} {"train_loss": -9.438222885131836, "global_step": 85221, "epoch": 507} {"train_loss": -9.177587509155273, "global_step": 85222, "epoch": 507} {"train_loss": -9.012114524841309, "global_step": 85223, "epoch": 507} {"train_loss": -9.259248733520508, "global_step": 85224, "epoch": 507} {"train_loss": -9.395861625671387, "global_step": 85225, "epoch": 507} {"train_loss": -9.282204627990723, "global_step": 85226, "epoch": 507} {"train_loss": -9.17601203918457, "global_step": 85227, "epoch": 507} {"train_loss": -8.890626907348633, "global_step": 85228, "epoch": 507} {"train_loss": -9.509071350097656, "global_step": 85229, "epoch": 507} {"train_loss": -9.151506423950195, "global_step": 85230, "epoch": 507} {"train_loss": -9.070158004760742, "global_step": 85231, "epoch": 507} {"train_loss": -9.320650100708008, "global_step": 85232, "epoch": 507} {"train_loss": -9.131790161132812, "global_step": 85233, "epoch": 507} {"train_loss": -9.274275779724121, "global_step": 85234, "epoch": 507} {"train_loss": -9.329095840454102, "global_step": 85235, "epoch": 507} {"train_loss": -9.816564559936523, "global_step": 85236, "epoch": 507} {"train_loss": -9.20760726928711, "global_step": 85237, "epoch": 507} {"train_loss": -9.254743576049805, "global_step": 85238, "epoch": 507} {"train_loss": -9.597477912902832, "global_step": 85239, "epoch": 507} {"train_loss": -9.274065971374512, "global_step": 85240, "epoch": 507} {"train_loss": -9.370108604431152, "global_step": 85241, "epoch": 507} {"train_loss": -9.151453971862793, "global_step": 85242, "epoch": 507} {"train_loss": -9.607970237731934, "global_step": 85243, "epoch": 507} {"train_loss": -9.463208198547363, "global_step": 85244, "epoch": 507} {"train_loss": -9.295820236206055, "global_step": 85245, "epoch": 507} {"train_loss": -9.203157424926758, "global_step": 85246, "epoch": 507} {"train_loss": -9.567776679992676, "global_step": 85247, "epoch": 507} {"train_loss": -9.374284744262695, "global_step": 85248, "epoch": 507} {"train_loss": -9.381814956665039, "global_step": 85249, "epoch": 507} {"train_loss": -9.220263481140137, "global_step": 85250, "epoch": 507} {"train_loss": -9.362188339233398, "global_step": 85251, "epoch": 507} {"train_loss": -9.42839241027832, "global_step": 85252, "epoch": 507} {"train_loss": -9.439436912536621, "global_step": 85253, "epoch": 507} {"train_loss": -9.396724700927734, "global_step": 85254, "epoch": 507} {"train_loss": -9.249275207519531, "global_step": 85255, "epoch": 507} {"train_loss": -9.493682861328125, "global_step": 85256, "epoch": 507} {"train_loss": -9.288528442382812, "global_step": 85257, "epoch": 507} {"train_loss": -9.479456901550293, "global_step": 85258, "epoch": 507} {"train_loss": -9.29132080078125, "global_step": 85259, "epoch": 507} {"train_loss": -9.497398376464844, "global_step": 85260, "epoch": 507} {"train_loss": -9.56013298034668, "global_step": 85261, "epoch": 507} {"train_loss": -9.411870956420898, "global_step": 85262, "epoch": 507} {"train_loss": -9.294673919677734, "global_step": 85263, "epoch": 507} {"train_loss": -9.175372123718262, "global_step": 85264, "epoch": 507} {"train_loss": -9.246477127075195, "global_step": 85265, "epoch": 507} {"train_loss": -9.366826057434082, "global_step": 85266, "epoch": 507} {"train_loss": -9.229328155517578, "global_step": 85267, "epoch": 507} {"train_loss": -9.561986923217773, "global_step": 85268, "epoch": 507} {"train_loss": -9.298080444335938, "global_step": 85269, "epoch": 507} {"train_loss": -9.378213882446289, "global_step": 85270, "epoch": 507} {"train_loss": -9.353265762329102, "global_step": 85271, "epoch": 507} {"train_loss": -9.311832427978516, "global_step": 85272, "epoch": 507} {"train_loss": -9.16048812866211, "global_step": 85273, "epoch": 507} {"train_loss": -9.174307823181152, "global_step": 85274, "epoch": 507} {"train_loss": -9.378284454345703, "global_step": 85275, "epoch": 507} {"train_loss": -9.07101058959961, "global_step": 85276, "epoch": 507} {"train_loss": -8.737116813659668, "global_step": 85277, "epoch": 507} {"train_loss": -9.232915878295898, "global_step": 85278, "epoch": 507} {"train_loss": -9.204633712768555, "global_step": 85279, "epoch": 507} {"train_loss": -9.065321922302246, "global_step": 85280, "epoch": 507} {"train_loss": -9.325214385986328, "global_step": 85281, "epoch": 507} {"train_loss": -9.21941089630127, "global_step": 85282, "epoch": 507} {"train_loss": -9.109302520751953, "global_step": 85283, "epoch": 507} {"train_loss": -9.332942962646484, "global_step": 85284, "epoch": 507} {"train_loss": -9.543708801269531, "global_step": 85285, "epoch": 507} {"train_loss": -9.272480010986328, "global_step": 85286, "epoch": 507} {"train_loss": -9.446535110473633, "global_step": 85287, "epoch": 507} {"train_loss": -9.204052925109863, "global_step": 85288, "epoch": 507} {"train_loss": -9.327794075012207, "global_step": 85289, "epoch": 507} {"train_loss": -9.290935516357422, "global_step": 85290, "epoch": 507} {"train_loss": -9.281692504882812, "global_step": 85291, "epoch": 507} {"train_loss": -9.567626953125, "global_step": 85292, "epoch": 507} {"train_loss": -9.321344375610352, "global_step": 85293, "epoch": 507} {"train_loss": -9.28739070892334, "global_step": 85294, "epoch": 507} {"train_loss": -9.120059967041016, "global_step": 85295, "epoch": 507} {"train_loss": -9.144538879394531, "global_step": 85296, "epoch": 507} {"train_loss": -9.498074531555176, "global_step": 85297, "epoch": 507} {"train_loss": -9.309586524963379, "global_step": 85298, "epoch": 507} {"train_loss": -9.364694595336914, "global_step": 85299, "epoch": 507} {"train_loss": -9.540475845336914, "global_step": 85300, "epoch": 507} {"train_loss": -9.367874145507812, "global_step": 85301, "epoch": 507} {"train_loss": -9.210920333862305, "global_step": 85302, "epoch": 507} {"train_loss": -9.29342269897461, "global_step": 85303, "epoch": 507} {"train_loss": -9.067063331604004, "global_step": 85304, "epoch": 507} {"train_loss": -9.180967330932617, "global_step": 85305, "epoch": 507} {"train_loss": -9.274311065673828, "global_step": 85306, "epoch": 507} {"train_loss": -9.491325378417969, "global_step": 85307, "epoch": 507} {"train_loss": -9.136167526245117, "global_step": 85308, "epoch": 507} {"train_loss": -9.34434986114502, "global_step": 85309, "epoch": 507} {"train_loss": -9.071675300598145, "global_step": 85310, "epoch": 507} {"train_loss": -9.164323806762695, "global_step": 85311, "epoch": 507} {"train_loss": -9.016277313232422, "global_step": 85312, "epoch": 507} {"train_loss": -9.381190299987793, "global_step": 85313, "epoch": 507} {"train_loss": -9.253000259399414, "global_step": 85314, "epoch": 507} {"train_loss": -9.13568115234375, "global_step": 85315, "epoch": 507} {"train_loss": -9.281882286071777, "global_step": 85316, "epoch": 507} {"train_loss": -9.148815155029297, "global_step": 85317, "epoch": 507} {"train_loss": -9.005699157714844, "global_step": 85318, "epoch": 507} {"train_loss": -8.942781448364258, "global_step": 85319, "epoch": 507} {"train_loss": -9.060995101928711, "global_step": 85320, "epoch": 507} {"train_loss": -9.127610206604004, "global_step": 85321, "epoch": 507} {"train_loss": -9.243204116821289, "global_step": 85322, "epoch": 507} {"train_loss": -9.108729362487793, "global_step": 85323, "epoch": 507} {"train_loss": -9.033440589904785, "global_step": 85324, "epoch": 507} {"train_loss": -9.30251693725586, "global_step": 85325, "epoch": 507} {"train_loss": -9.041706085205078, "global_step": 85326, "epoch": 507} {"train_loss": -9.24482536315918, "global_step": 85327, "epoch": 507} {"train_loss": -9.246834754943848, "global_step": 85328, "epoch": 507} {"train_loss": -9.232680320739746, "global_step": 85329, "epoch": 507} {"train_loss": -9.267072677612305, "global_step": 85330, "epoch": 507} {"train_loss": -9.2237548828125, "global_step": 85331, "epoch": 507} {"train_loss": -9.004718780517578, "global_step": 85332, "epoch": 507} {"train_loss": -9.163055419921875, "global_step": 85333, "epoch": 507} {"train_loss": -9.240509033203125, "global_step": 85334, "epoch": 507} {"train_loss": -9.333035469055176, "global_step": 85335, "epoch": 507} {"train_loss": -9.20564079284668, "global_step": 85336, "epoch": 507} {"train_loss": -9.331268310546875, "global_step": 85337, "epoch": 507} {"train_loss": -9.040361404418945, "global_step": 85338, "epoch": 507} {"train_loss": -9.396224975585938, "global_step": 85339, "epoch": 507} {"train_loss": -8.873845100402832, "global_step": 85340, "epoch": 507} {"train_loss": -8.941557884216309, "global_step": 85341, "epoch": 507} {"train_loss": -9.26491928100586, "global_step": 85342, "epoch": 507} {"train_loss": -9.27273964881897, "global_step": 85343, "epoch": 507, "val_loss": 201366.90625} {"train_loss": -9.177581787109375, "global_step": 85344, "epoch": 508} {"train_loss": -8.96030044555664, "global_step": 85345, "epoch": 508} {"train_loss": -8.868412017822266, "global_step": 85346, "epoch": 508} {"train_loss": -9.377784729003906, "global_step": 85347, "epoch": 508} {"train_loss": -8.791250228881836, "global_step": 85348, "epoch": 508} {"train_loss": -9.186117172241211, "global_step": 85349, "epoch": 508} {"train_loss": -8.728293418884277, "global_step": 85350, "epoch": 508} {"train_loss": -9.113091468811035, "global_step": 85351, "epoch": 508} {"train_loss": -8.969292640686035, "global_step": 85352, "epoch": 508} {"train_loss": -9.128519058227539, "global_step": 85353, "epoch": 508} {"train_loss": -9.083746910095215, "global_step": 85354, "epoch": 508} {"train_loss": -9.21733570098877, "global_step": 85355, "epoch": 508} {"train_loss": -9.193228721618652, "global_step": 85356, "epoch": 508} {"train_loss": -8.934911727905273, "global_step": 85357, "epoch": 508} {"train_loss": -8.936569213867188, "global_step": 85358, "epoch": 508} {"train_loss": -9.230125427246094, "global_step": 85359, "epoch": 508} {"train_loss": -9.17221450805664, "global_step": 85360, "epoch": 508} {"train_loss": -9.05301284790039, "global_step": 85361, "epoch": 508} {"train_loss": -9.233774185180664, "global_step": 85362, "epoch": 508} {"train_loss": -9.069986343383789, "global_step": 85363, "epoch": 508} {"train_loss": -9.127534866333008, "global_step": 85364, "epoch": 508} {"train_loss": -9.120007514953613, "global_step": 85365, "epoch": 508} {"train_loss": -9.27324104309082, "global_step": 85366, "epoch": 508} {"train_loss": -9.040781021118164, "global_step": 85367, "epoch": 508} {"train_loss": -9.420302391052246, "global_step": 85368, "epoch": 508} {"train_loss": -9.066934585571289, "global_step": 85369, "epoch": 508} {"train_loss": -9.137680053710938, "global_step": 85370, "epoch": 508} {"train_loss": -9.301206588745117, "global_step": 85371, "epoch": 508} {"train_loss": -8.911060333251953, "global_step": 85372, "epoch": 508} {"train_loss": -9.011054039001465, "global_step": 85373, "epoch": 508} {"train_loss": -9.363027572631836, "global_step": 85374, "epoch": 508} {"train_loss": -9.186834335327148, "global_step": 85375, "epoch": 508} {"train_loss": -9.366177558898926, "global_step": 85376, "epoch": 508} {"train_loss": -9.374626159667969, "global_step": 85377, "epoch": 508} {"train_loss": -9.152754783630371, "global_step": 85378, "epoch": 508} {"train_loss": -9.462924003601074, "global_step": 85379, "epoch": 508} {"train_loss": -9.30558967590332, "global_step": 85380, "epoch": 508} {"train_loss": -9.334243774414062, "global_step": 85381, "epoch": 508} {"train_loss": -9.432703018188477, "global_step": 85382, "epoch": 508} {"train_loss": -9.213374137878418, "global_step": 85383, "epoch": 508} {"train_loss": -9.58789348602295, "global_step": 85384, "epoch": 508} {"train_loss": -9.27530288696289, "global_step": 85385, "epoch": 508} {"train_loss": -9.246589660644531, "global_step": 85386, "epoch": 508} {"train_loss": -9.297304153442383, "global_step": 85387, "epoch": 508} {"train_loss": -9.405637741088867, "global_step": 85388, "epoch": 508} {"train_loss": -9.462102890014648, "global_step": 85389, "epoch": 508} {"train_loss": -9.699944496154785, "global_step": 85390, "epoch": 508} {"train_loss": -9.437131881713867, "global_step": 85391, "epoch": 508} {"train_loss": -9.406936645507812, "global_step": 85392, "epoch": 508} {"train_loss": -9.712516784667969, "global_step": 85393, "epoch": 508} {"train_loss": -9.490659713745117, "global_step": 85394, "epoch": 508} {"train_loss": -9.545610427856445, "global_step": 85395, "epoch": 508} {"train_loss": -9.417661666870117, "global_step": 85396, "epoch": 508} {"train_loss": -9.405867576599121, "global_step": 85397, "epoch": 508} {"train_loss": -9.269575119018555, "global_step": 85398, "epoch": 508} {"train_loss": -9.335917472839355, "global_step": 85399, "epoch": 508} {"train_loss": -9.162952423095703, "global_step": 85400, "epoch": 508} {"train_loss": -8.437171936035156, "global_step": 85401, "epoch": 508} {"train_loss": -9.301206588745117, "global_step": 85402, "epoch": 508} {"train_loss": -8.590758323669434, "global_step": 85403, "epoch": 508} {"train_loss": -8.906793594360352, "global_step": 85404, "epoch": 508} {"train_loss": -9.342401504516602, "global_step": 85405, "epoch": 508} {"train_loss": -9.087936401367188, "global_step": 85406, "epoch": 508} {"train_loss": -9.166221618652344, "global_step": 85407, "epoch": 508} {"train_loss": -9.343164443969727, "global_step": 85408, "epoch": 508} {"train_loss": -8.911163330078125, "global_step": 85409, "epoch": 508} {"train_loss": -9.259026527404785, "global_step": 85410, "epoch": 508} {"train_loss": -9.179508209228516, "global_step": 85411, "epoch": 508} {"train_loss": -9.327916145324707, "global_step": 85412, "epoch": 508} {"train_loss": -9.126380920410156, "global_step": 85413, "epoch": 508} {"train_loss": -9.26470947265625, "global_step": 85414, "epoch": 508} {"train_loss": -9.167593002319336, "global_step": 85415, "epoch": 508} {"train_loss": -9.064361572265625, "global_step": 85416, "epoch": 508} {"train_loss": -9.144392013549805, "global_step": 85417, "epoch": 508} {"train_loss": -9.04355239868164, "global_step": 85418, "epoch": 508} {"train_loss": -8.629251480102539, "global_step": 85419, "epoch": 508} {"train_loss": -9.356142044067383, "global_step": 85420, "epoch": 508} {"train_loss": -8.854714393615723, "global_step": 85421, "epoch": 508} {"train_loss": -9.330924987792969, "global_step": 85422, "epoch": 508} {"train_loss": -9.23204231262207, "global_step": 85423, "epoch": 508} {"train_loss": -9.16842269897461, "global_step": 85424, "epoch": 508} {"train_loss": -9.166509628295898, "global_step": 85425, "epoch": 508} {"train_loss": -9.294845581054688, "global_step": 85426, "epoch": 508} {"train_loss": -9.245749473571777, "global_step": 85427, "epoch": 508} {"train_loss": -9.090314865112305, "global_step": 85428, "epoch": 508} {"train_loss": -9.202997207641602, "global_step": 85429, "epoch": 508} {"train_loss": -9.539719581604004, "global_step": 85430, "epoch": 508} {"train_loss": -9.297271728515625, "global_step": 85431, "epoch": 508} {"train_loss": -9.370013236999512, "global_step": 85432, "epoch": 508} {"train_loss": -9.264083862304688, "global_step": 85433, "epoch": 508} {"train_loss": -9.36900520324707, "global_step": 85434, "epoch": 508} {"train_loss": -9.228164672851562, "global_step": 85435, "epoch": 508} {"train_loss": -9.501680374145508, "global_step": 85436, "epoch": 508} {"train_loss": -9.515202522277832, "global_step": 85437, "epoch": 508} {"train_loss": -9.551131248474121, "global_step": 85438, "epoch": 508} {"train_loss": -9.42697525024414, "global_step": 85439, "epoch": 508} {"train_loss": -9.560554504394531, "global_step": 85440, "epoch": 508} {"train_loss": -9.503179550170898, "global_step": 85441, "epoch": 508} {"train_loss": -9.532371520996094, "global_step": 85442, "epoch": 508} {"train_loss": -9.418496131896973, "global_step": 85443, "epoch": 508} {"train_loss": -9.233543395996094, "global_step": 85444, "epoch": 508} {"train_loss": -9.587800979614258, "global_step": 85445, "epoch": 508} {"train_loss": -9.150437355041504, "global_step": 85446, "epoch": 508} {"train_loss": -9.449520111083984, "global_step": 85447, "epoch": 508} {"train_loss": -9.578357696533203, "global_step": 85448, "epoch": 508} {"train_loss": -9.213113784790039, "global_step": 85449, "epoch": 508} {"train_loss": -9.47337818145752, "global_step": 85450, "epoch": 508} {"train_loss": -9.266519546508789, "global_step": 85451, "epoch": 508} {"train_loss": -9.54723834991455, "global_step": 85452, "epoch": 508} {"train_loss": -9.368281364440918, "global_step": 85453, "epoch": 508} {"train_loss": -9.443683624267578, "global_step": 85454, "epoch": 508} {"train_loss": -9.42919635772705, "global_step": 85455, "epoch": 508} {"train_loss": -9.328044891357422, "global_step": 85456, "epoch": 508} {"train_loss": -8.859566688537598, "global_step": 85457, "epoch": 508} {"train_loss": -9.585319519042969, "global_step": 85458, "epoch": 508} {"train_loss": -9.095795631408691, "global_step": 85459, "epoch": 508} {"train_loss": -9.33404541015625, "global_step": 85460, "epoch": 508} {"train_loss": -9.161723136901855, "global_step": 85461, "epoch": 508} {"train_loss": -8.74522590637207, "global_step": 85462, "epoch": 508} {"train_loss": -9.149428367614746, "global_step": 85463, "epoch": 508} {"train_loss": -8.95146656036377, "global_step": 85464, "epoch": 508} {"train_loss": -9.032787322998047, "global_step": 85465, "epoch": 508} {"train_loss": -9.055948257446289, "global_step": 85466, "epoch": 508} {"train_loss": -9.112000465393066, "global_step": 85467, "epoch": 508} {"train_loss": -8.993827819824219, "global_step": 85468, "epoch": 508} {"train_loss": -9.014909744262695, "global_step": 85469, "epoch": 508} {"train_loss": -9.185951232910156, "global_step": 85470, "epoch": 508} {"train_loss": -9.432046890258789, "global_step": 85471, "epoch": 508} {"train_loss": -9.269634246826172, "global_step": 85472, "epoch": 508} {"train_loss": -9.399218559265137, "global_step": 85473, "epoch": 508} {"train_loss": -9.17341136932373, "global_step": 85474, "epoch": 508} {"train_loss": -9.269889831542969, "global_step": 85475, "epoch": 508} {"train_loss": -9.177996635437012, "global_step": 85476, "epoch": 508} {"train_loss": -9.352235794067383, "global_step": 85477, "epoch": 508} {"train_loss": -9.339072227478027, "global_step": 85478, "epoch": 508} {"train_loss": -9.360658645629883, "global_step": 85479, "epoch": 508} {"train_loss": -9.415909767150879, "global_step": 85480, "epoch": 508} {"train_loss": -9.401087760925293, "global_step": 85481, "epoch": 508} {"train_loss": -9.367268562316895, "global_step": 85482, "epoch": 508} {"train_loss": -9.439733505249023, "global_step": 85483, "epoch": 508} {"train_loss": -9.495519638061523, "global_step": 85484, "epoch": 508} {"train_loss": -9.200443267822266, "global_step": 85485, "epoch": 508} {"train_loss": -9.346261978149414, "global_step": 85486, "epoch": 508} {"train_loss": -9.46592903137207, "global_step": 85487, "epoch": 508} {"train_loss": -9.26938533782959, "global_step": 85488, "epoch": 508} {"train_loss": -9.291507720947266, "global_step": 85489, "epoch": 508} {"train_loss": -9.289852142333984, "global_step": 85490, "epoch": 508} {"train_loss": -9.452661514282227, "global_step": 85491, "epoch": 508} {"train_loss": -9.277095794677734, "global_step": 85492, "epoch": 508} {"train_loss": -9.413751602172852, "global_step": 85493, "epoch": 508} {"train_loss": -9.419240951538086, "global_step": 85494, "epoch": 508} {"train_loss": -9.282750129699707, "global_step": 85495, "epoch": 508} {"train_loss": -9.15577507019043, "global_step": 85496, "epoch": 508} {"train_loss": -9.651496887207031, "global_step": 85497, "epoch": 508} {"train_loss": -9.348459243774414, "global_step": 85498, "epoch": 508} {"train_loss": -9.329690933227539, "global_step": 85499, "epoch": 508} {"train_loss": -9.448759078979492, "global_step": 85500, "epoch": 508} {"train_loss": -9.530658721923828, "global_step": 85501, "epoch": 508} {"train_loss": -9.378751754760742, "global_step": 85502, "epoch": 508} {"train_loss": -9.440654754638672, "global_step": 85503, "epoch": 508} {"train_loss": -9.312738418579102, "global_step": 85504, "epoch": 508} {"train_loss": -9.30375862121582, "global_step": 85505, "epoch": 508} {"train_loss": -9.665328979492188, "global_step": 85506, "epoch": 508} {"train_loss": -9.431405067443848, "global_step": 85507, "epoch": 508} {"train_loss": -9.41537857055664, "global_step": 85508, "epoch": 508} {"train_loss": -9.380340576171875, "global_step": 85509, "epoch": 508} {"train_loss": -9.406145095825195, "global_step": 85510, "epoch": 508} {"train_loss": -9.263578942843846, "global_step": 85511, "epoch": 508, "val_loss": 198046.28125} {"train_loss": -9.407817840576172, "global_step": 85512, "epoch": 509} {"train_loss": -9.289661407470703, "global_step": 85513, "epoch": 509} {"train_loss": -9.494231224060059, "global_step": 85514, "epoch": 509} {"train_loss": -9.340444564819336, "global_step": 85515, "epoch": 509} {"train_loss": -9.667999267578125, "global_step": 85516, "epoch": 509} {"train_loss": -9.531272888183594, "global_step": 85517, "epoch": 509} {"train_loss": -9.197586059570312, "global_step": 85518, "epoch": 509} {"train_loss": -9.32434368133545, "global_step": 85519, "epoch": 509} {"train_loss": -9.47531509399414, "global_step": 85520, "epoch": 509} {"train_loss": -9.505367279052734, "global_step": 85521, "epoch": 509} {"train_loss": -9.529848098754883, "global_step": 85522, "epoch": 509} {"train_loss": -9.544194221496582, "global_step": 85523, "epoch": 509} {"train_loss": -9.445789337158203, "global_step": 85524, "epoch": 509} {"train_loss": -9.110726356506348, "global_step": 85525, "epoch": 509} {"train_loss": -9.282523155212402, "global_step": 85526, "epoch": 509} {"train_loss": -9.563819885253906, "global_step": 85527, "epoch": 509} {"train_loss": -9.358734130859375, "global_step": 85528, "epoch": 509} {"train_loss": -9.53853988647461, "global_step": 85529, "epoch": 509} {"train_loss": -9.164345741271973, "global_step": 85530, "epoch": 509} {"train_loss": -9.476409912109375, "global_step": 85531, "epoch": 509} {"train_loss": -8.971473693847656, "global_step": 85532, "epoch": 509} {"train_loss": -9.326108932495117, "global_step": 85533, "epoch": 509} {"train_loss": -8.839858055114746, "global_step": 85534, "epoch": 509} {"train_loss": -8.969889640808105, "global_step": 85535, "epoch": 509} {"train_loss": -9.01350212097168, "global_step": 85536, "epoch": 509} {"train_loss": -9.095490455627441, "global_step": 85537, "epoch": 509} {"train_loss": -8.902298927307129, "global_step": 85538, "epoch": 509} {"train_loss": -9.307999610900879, "global_step": 85539, "epoch": 509} {"train_loss": -9.227707862854004, "global_step": 85540, "epoch": 509} {"train_loss": -9.158279418945312, "global_step": 85541, "epoch": 509} {"train_loss": -9.264547348022461, "global_step": 85542, "epoch": 509} {"train_loss": -8.995830535888672, "global_step": 85543, "epoch": 509} {"train_loss": -9.375900268554688, "global_step": 85544, "epoch": 509} {"train_loss": -9.233593940734863, "global_step": 85545, "epoch": 509} {"train_loss": -9.051813125610352, "global_step": 85546, "epoch": 509} {"train_loss": -9.0322847366333, "global_step": 85547, "epoch": 509} {"train_loss": -9.172094345092773, "global_step": 85548, "epoch": 509} {"train_loss": -9.27006721496582, "global_step": 85549, "epoch": 509} {"train_loss": -9.12944221496582, "global_step": 85550, "epoch": 509} {"train_loss": -9.122146606445312, "global_step": 85551, "epoch": 509} {"train_loss": -9.454541206359863, "global_step": 85552, "epoch": 509} {"train_loss": -9.003162384033203, "global_step": 85553, "epoch": 509} {"train_loss": -9.39168643951416, "global_step": 85554, "epoch": 509} {"train_loss": -9.309976577758789, "global_step": 85555, "epoch": 509} {"train_loss": -9.335861206054688, "global_step": 85556, "epoch": 509} {"train_loss": -9.453838348388672, "global_step": 85557, "epoch": 509} {"train_loss": -9.462348937988281, "global_step": 85558, "epoch": 509} {"train_loss": -9.277735710144043, "global_step": 85559, "epoch": 509} {"train_loss": -9.416213035583496, "global_step": 85560, "epoch": 509} {"train_loss": -9.211174011230469, "global_step": 85561, "epoch": 509} {"train_loss": -9.409324645996094, "global_step": 85562, "epoch": 509} {"train_loss": -9.413593292236328, "global_step": 85563, "epoch": 509} {"train_loss": -9.20114803314209, "global_step": 85564, "epoch": 509} {"train_loss": -9.424765586853027, "global_step": 85565, "epoch": 509} {"train_loss": -9.396369934082031, "global_step": 85566, "epoch": 509} {"train_loss": -9.521160125732422, "global_step": 85567, "epoch": 509} {"train_loss": -9.250767707824707, "global_step": 85568, "epoch": 509} {"train_loss": -9.332332611083984, "global_step": 85569, "epoch": 509} {"train_loss": -9.538795471191406, "global_step": 85570, "epoch": 509} {"train_loss": -9.446150779724121, "global_step": 85571, "epoch": 509} {"train_loss": -9.602156639099121, "global_step": 85572, "epoch": 509} {"train_loss": -9.384779930114746, "global_step": 85573, "epoch": 509} {"train_loss": -9.357916831970215, "global_step": 85574, "epoch": 509} {"train_loss": -9.429913520812988, "global_step": 85575, "epoch": 509} {"train_loss": -9.390371322631836, "global_step": 85576, "epoch": 509} {"train_loss": -9.429316520690918, "global_step": 85577, "epoch": 509} {"train_loss": -9.30221939086914, "global_step": 85578, "epoch": 509} {"train_loss": -9.132771492004395, "global_step": 85579, "epoch": 509} {"train_loss": -9.274706840515137, "global_step": 85580, "epoch": 509} {"train_loss": -9.307069778442383, "global_step": 85581, "epoch": 509} {"train_loss": -9.333946228027344, "global_step": 85582, "epoch": 509} {"train_loss": -9.315132141113281, "global_step": 85583, "epoch": 509} {"train_loss": -9.499133110046387, "global_step": 85584, "epoch": 509} {"train_loss": -8.904170036315918, "global_step": 85585, "epoch": 509} {"train_loss": -9.466808319091797, "global_step": 85586, "epoch": 509} {"train_loss": -9.324563980102539, "global_step": 85587, "epoch": 509} {"train_loss": -9.374631881713867, "global_step": 85588, "epoch": 509} {"train_loss": -9.280884742736816, "global_step": 85589, "epoch": 509} {"train_loss": -9.329913139343262, "global_step": 85590, "epoch": 509} {"train_loss": -9.253337860107422, "global_step": 85591, "epoch": 509} {"train_loss": -8.875850677490234, "global_step": 85592, "epoch": 509} {"train_loss": -9.229026794433594, "global_step": 85593, "epoch": 509} {"train_loss": -9.109395027160645, "global_step": 85594, "epoch": 509} {"train_loss": -9.545173645019531, "global_step": 85595, "epoch": 509} {"train_loss": -8.680822372436523, "global_step": 85596, "epoch": 509} {"train_loss": -9.116616249084473, "global_step": 85597, "epoch": 509} {"train_loss": -8.641191482543945, "global_step": 85598, "epoch": 509} {"train_loss": -8.759369850158691, "global_step": 85599, "epoch": 509} {"train_loss": -8.340644836425781, "global_step": 85600, "epoch": 509} {"train_loss": -8.913930892944336, "global_step": 85601, "epoch": 509} {"train_loss": -9.18086051940918, "global_step": 85602, "epoch": 509} {"train_loss": -8.932865142822266, "global_step": 85603, "epoch": 509} {"train_loss": -8.936466217041016, "global_step": 85604, "epoch": 509} {"train_loss": -9.194921493530273, "global_step": 85605, "epoch": 509} {"train_loss": -9.038408279418945, "global_step": 85606, "epoch": 509} {"train_loss": -8.807878494262695, "global_step": 85607, "epoch": 509} {"train_loss": -8.911981582641602, "global_step": 85608, "epoch": 509} {"train_loss": -9.063172340393066, "global_step": 85609, "epoch": 509} {"train_loss": -9.040027618408203, "global_step": 85610, "epoch": 509} {"train_loss": -9.231407165527344, "global_step": 85611, "epoch": 509} {"train_loss": -9.478256225585938, "global_step": 85612, "epoch": 509} {"train_loss": -9.188762664794922, "global_step": 85613, "epoch": 509} {"train_loss": -9.486912727355957, "global_step": 85614, "epoch": 509} {"train_loss": -8.981945037841797, "global_step": 85615, "epoch": 509} {"train_loss": -9.159709930419922, "global_step": 85616, "epoch": 509} {"train_loss": -9.379934310913086, "global_step": 85617, "epoch": 509} {"train_loss": -9.363988876342773, "global_step": 85618, "epoch": 509} {"train_loss": -9.427030563354492, "global_step": 85619, "epoch": 509} {"train_loss": -9.443567276000977, "global_step": 85620, "epoch": 509} {"train_loss": -9.441059112548828, "global_step": 85621, "epoch": 509} {"train_loss": -9.053644180297852, "global_step": 85622, "epoch": 509} {"train_loss": -9.25385570526123, "global_step": 85623, "epoch": 509} {"train_loss": -9.52840805053711, "global_step": 85624, "epoch": 509} {"train_loss": -9.423850059509277, "global_step": 85625, "epoch": 509} {"train_loss": -9.487297058105469, "global_step": 85626, "epoch": 509} {"train_loss": -9.130257606506348, "global_step": 85627, "epoch": 509} {"train_loss": -9.589820861816406, "global_step": 85628, "epoch": 509} {"train_loss": -9.20694637298584, "global_step": 85629, "epoch": 509} {"train_loss": -9.324087142944336, "global_step": 85630, "epoch": 509} {"train_loss": -9.310672760009766, "global_step": 85631, "epoch": 509} {"train_loss": -9.438436508178711, "global_step": 85632, "epoch": 509} {"train_loss": -9.38326644897461, "global_step": 85633, "epoch": 509} {"train_loss": -9.437201499938965, "global_step": 85634, "epoch": 509} {"train_loss": -9.251401901245117, "global_step": 85635, "epoch": 509} {"train_loss": -9.308707237243652, "global_step": 85636, "epoch": 509} {"train_loss": -9.096738815307617, "global_step": 85637, "epoch": 509} {"train_loss": -9.425542831420898, "global_step": 85638, "epoch": 509} {"train_loss": -9.287315368652344, "global_step": 85639, "epoch": 509} {"train_loss": -9.473823547363281, "global_step": 85640, "epoch": 509} {"train_loss": -9.399726867675781, "global_step": 85641, "epoch": 509} {"train_loss": -9.174287796020508, "global_step": 85642, "epoch": 509} {"train_loss": -9.332975387573242, "global_step": 85643, "epoch": 509} {"train_loss": -9.597550392150879, "global_step": 85644, "epoch": 509} {"train_loss": -9.599310874938965, "global_step": 85645, "epoch": 509} {"train_loss": -9.517688751220703, "global_step": 85646, "epoch": 509} {"train_loss": -9.361011505126953, "global_step": 85647, "epoch": 509} {"train_loss": -9.606685638427734, "global_step": 85648, "epoch": 509} {"train_loss": -9.531198501586914, "global_step": 85649, "epoch": 509} {"train_loss": -8.990375518798828, "global_step": 85650, "epoch": 509} {"train_loss": -9.487809181213379, "global_step": 85651, "epoch": 509} {"train_loss": -9.445830345153809, "global_step": 85652, "epoch": 509} {"train_loss": -9.331066131591797, "global_step": 85653, "epoch": 509} {"train_loss": -9.434812545776367, "global_step": 85654, "epoch": 509} {"train_loss": -9.31097412109375, "global_step": 85655, "epoch": 509} {"train_loss": -9.560966491699219, "global_step": 85656, "epoch": 509} {"train_loss": -9.283690452575684, "global_step": 85657, "epoch": 509} {"train_loss": -9.327911376953125, "global_step": 85658, "epoch": 509} {"train_loss": -9.243772506713867, "global_step": 85659, "epoch": 509} {"train_loss": -9.369892120361328, "global_step": 85660, "epoch": 509} {"train_loss": -9.623434066772461, "global_step": 85661, "epoch": 509} {"train_loss": -9.325357437133789, "global_step": 85662, "epoch": 509} {"train_loss": -9.400659561157227, "global_step": 85663, "epoch": 509} {"train_loss": -9.534128189086914, "global_step": 85664, "epoch": 509} {"train_loss": -9.314794540405273, "global_step": 85665, "epoch": 509} {"train_loss": -9.372791290283203, "global_step": 85666, "epoch": 509} {"train_loss": -9.39993667602539, "global_step": 85667, "epoch": 509} {"train_loss": -9.352962493896484, "global_step": 85668, "epoch": 509} {"train_loss": -9.413125991821289, "global_step": 85669, "epoch": 509} {"train_loss": -9.491971969604492, "global_step": 85670, "epoch": 509} {"train_loss": -9.602191925048828, "global_step": 85671, "epoch": 509} {"train_loss": -9.543187141418457, "global_step": 85672, "epoch": 509} {"train_loss": -9.339153289794922, "global_step": 85673, "epoch": 509} {"train_loss": -9.503748893737793, "global_step": 85674, "epoch": 509} {"train_loss": -9.489522933959961, "global_step": 85675, "epoch": 509} {"train_loss": -9.682600021362305, "global_step": 85676, "epoch": 509} {"train_loss": -9.609249114990234, "global_step": 85677, "epoch": 509} {"train_loss": -9.432767868041992, "global_step": 85678, "epoch": 509} {"train_loss": -9.30241827170054, "global_step": 85679, "epoch": 509, "val_loss": 198718.453125} {"train_loss": -9.135229110717773, "global_step": 85680, "epoch": 510} {"train_loss": -9.596162796020508, "global_step": 85681, "epoch": 510} {"train_loss": -9.346368789672852, "global_step": 85682, "epoch": 510} {"train_loss": -9.495525360107422, "global_step": 85683, "epoch": 510} {"train_loss": -9.367910385131836, "global_step": 85684, "epoch": 510} {"train_loss": -9.338695526123047, "global_step": 85685, "epoch": 510} {"train_loss": -9.386968612670898, "global_step": 85686, "epoch": 510} {"train_loss": -9.219110488891602, "global_step": 85687, "epoch": 510} {"train_loss": -9.240372657775879, "global_step": 85688, "epoch": 510} {"train_loss": -9.294769287109375, "global_step": 85689, "epoch": 510} {"train_loss": -9.21540641784668, "global_step": 85690, "epoch": 510} {"train_loss": -8.856863021850586, "global_step": 85691, "epoch": 510} {"train_loss": -9.453292846679688, "global_step": 85692, "epoch": 510} {"train_loss": -8.89452075958252, "global_step": 85693, "epoch": 510} {"train_loss": -9.27532958984375, "global_step": 85694, "epoch": 510} {"train_loss": -9.123592376708984, "global_step": 85695, "epoch": 510} {"train_loss": -8.949209213256836, "global_step": 85696, "epoch": 510} {"train_loss": -9.146328926086426, "global_step": 85697, "epoch": 510} {"train_loss": -9.236652374267578, "global_step": 85698, "epoch": 510} {"train_loss": -8.979215621948242, "global_step": 85699, "epoch": 510} {"train_loss": -9.188962936401367, "global_step": 85700, "epoch": 510} {"train_loss": -8.923013687133789, "global_step": 85701, "epoch": 510} {"train_loss": -9.154802322387695, "global_step": 85702, "epoch": 510} {"train_loss": -9.121688842773438, "global_step": 85703, "epoch": 510} {"train_loss": -9.098613739013672, "global_step": 85704, "epoch": 510} {"train_loss": -9.091337203979492, "global_step": 85705, "epoch": 510} {"train_loss": -9.355142593383789, "global_step": 85706, "epoch": 510} {"train_loss": -9.294178009033203, "global_step": 85707, "epoch": 510} {"train_loss": -9.196318626403809, "global_step": 85708, "epoch": 510} {"train_loss": -9.361544609069824, "global_step": 85709, "epoch": 510} {"train_loss": -9.249846458435059, "global_step": 85710, "epoch": 510} {"train_loss": -9.281156539916992, "global_step": 85711, "epoch": 510} {"train_loss": -9.319015502929688, "global_step": 85712, "epoch": 510} {"train_loss": -9.428199768066406, "global_step": 85713, "epoch": 510} {"train_loss": -9.216403007507324, "global_step": 85714, "epoch": 510} {"train_loss": -9.335765838623047, "global_step": 85715, "epoch": 510} {"train_loss": -9.047246932983398, "global_step": 85716, "epoch": 510} {"train_loss": -9.430649757385254, "global_step": 85717, "epoch": 510} {"train_loss": -9.264509201049805, "global_step": 85718, "epoch": 510} {"train_loss": -9.36367130279541, "global_step": 85719, "epoch": 510} {"train_loss": -9.537538528442383, "global_step": 85720, "epoch": 510} {"train_loss": -9.496585845947266, "global_step": 85721, "epoch": 510} {"train_loss": -9.446720123291016, "global_step": 85722, "epoch": 510} {"train_loss": -9.374747276306152, "global_step": 85723, "epoch": 510} {"train_loss": -9.545875549316406, "global_step": 85724, "epoch": 510} {"train_loss": -9.382322311401367, "global_step": 85725, "epoch": 510} {"train_loss": -9.42935562133789, "global_step": 85726, "epoch": 510} {"train_loss": -9.394340515136719, "global_step": 85727, "epoch": 510} {"train_loss": -9.373753547668457, "global_step": 85728, "epoch": 510} {"train_loss": -9.606745719909668, "global_step": 85729, "epoch": 510} {"train_loss": -9.47976303100586, "global_step": 85730, "epoch": 510} {"train_loss": -9.190254211425781, "global_step": 85731, "epoch": 510} {"train_loss": -9.414970397949219, "global_step": 85732, "epoch": 510} {"train_loss": -9.549142837524414, "global_step": 85733, "epoch": 510} {"train_loss": -9.037971496582031, "global_step": 85734, "epoch": 510} {"train_loss": -9.427656173706055, "global_step": 85735, "epoch": 510} {"train_loss": -9.390586853027344, "global_step": 85736, "epoch": 510} {"train_loss": -9.507709503173828, "global_step": 85737, "epoch": 510} {"train_loss": -9.435593605041504, "global_step": 85738, "epoch": 510} {"train_loss": -9.468626022338867, "global_step": 85739, "epoch": 510} {"train_loss": -9.223220825195312, "global_step": 85740, "epoch": 510} {"train_loss": -9.692917823791504, "global_step": 85741, "epoch": 510} {"train_loss": -9.19715690612793, "global_step": 85742, "epoch": 510} {"train_loss": -9.293088912963867, "global_step": 85743, "epoch": 510} {"train_loss": -9.288459777832031, "global_step": 85744, "epoch": 510} {"train_loss": -9.648159980773926, "global_step": 85745, "epoch": 510} {"train_loss": -9.287900924682617, "global_step": 85746, "epoch": 510} {"train_loss": -9.50223445892334, "global_step": 85747, "epoch": 510} {"train_loss": -9.564699172973633, "global_step": 85748, "epoch": 510} {"train_loss": -9.265501022338867, "global_step": 85749, "epoch": 510} {"train_loss": -9.596677780151367, "global_step": 85750, "epoch": 510} {"train_loss": -9.00208568572998, "global_step": 85751, "epoch": 510} {"train_loss": -9.362964630126953, "global_step": 85752, "epoch": 510} {"train_loss": -9.060486793518066, "global_step": 85753, "epoch": 510} {"train_loss": -9.436138153076172, "global_step": 85754, "epoch": 510} {"train_loss": -9.318729400634766, "global_step": 85755, "epoch": 510} {"train_loss": -9.30217170715332, "global_step": 85756, "epoch": 510} {"train_loss": -9.21898365020752, "global_step": 85757, "epoch": 510} {"train_loss": -9.323272705078125, "global_step": 85758, "epoch": 510} {"train_loss": -9.152704238891602, "global_step": 85759, "epoch": 510} {"train_loss": -9.182395935058594, "global_step": 85760, "epoch": 510} {"train_loss": -9.374065399169922, "global_step": 85761, "epoch": 510} {"train_loss": -9.053691864013672, "global_step": 85762, "epoch": 510} {"train_loss": -8.950529098510742, "global_step": 85763, "epoch": 510} {"train_loss": -9.161406517028809, "global_step": 85764, "epoch": 510} {"train_loss": -9.394469261169434, "global_step": 85765, "epoch": 510} {"train_loss": -9.233243942260742, "global_step": 85766, "epoch": 510} {"train_loss": -9.334062576293945, "global_step": 85767, "epoch": 510} {"train_loss": -9.411589622497559, "global_step": 85768, "epoch": 510} {"train_loss": -9.123296737670898, "global_step": 85769, "epoch": 510} {"train_loss": -9.198854446411133, "global_step": 85770, "epoch": 510} {"train_loss": -9.434294700622559, "global_step": 85771, "epoch": 510} {"train_loss": -9.551559448242188, "global_step": 85772, "epoch": 510} {"train_loss": -9.328420639038086, "global_step": 85773, "epoch": 510} {"train_loss": -9.203594207763672, "global_step": 85774, "epoch": 510} {"train_loss": -9.193459510803223, "global_step": 85775, "epoch": 510} {"train_loss": -9.266311645507812, "global_step": 85776, "epoch": 510} {"train_loss": -9.372390747070312, "global_step": 85777, "epoch": 510} {"train_loss": -9.403773307800293, "global_step": 85778, "epoch": 510} {"train_loss": -9.391286849975586, "global_step": 85779, "epoch": 510} {"train_loss": -9.427416801452637, "global_step": 85780, "epoch": 510} {"train_loss": -9.296570777893066, "global_step": 85781, "epoch": 510} {"train_loss": -9.606154441833496, "global_step": 85782, "epoch": 510} {"train_loss": -9.427184104919434, "global_step": 85783, "epoch": 510} {"train_loss": -9.514875411987305, "global_step": 85784, "epoch": 510} {"train_loss": -9.22776985168457, "global_step": 85785, "epoch": 510} {"train_loss": -9.652763366699219, "global_step": 85786, "epoch": 510} {"train_loss": -9.402948379516602, "global_step": 85787, "epoch": 510} {"train_loss": -9.31978988647461, "global_step": 85788, "epoch": 510} {"train_loss": -9.36384391784668, "global_step": 85789, "epoch": 510} {"train_loss": -9.151183128356934, "global_step": 85790, "epoch": 510} {"train_loss": -9.538697242736816, "global_step": 85791, "epoch": 510} {"train_loss": -9.157110214233398, "global_step": 85792, "epoch": 510} {"train_loss": -9.2819242477417, "global_step": 85793, "epoch": 510} {"train_loss": -9.359452247619629, "global_step": 85794, "epoch": 510} {"train_loss": -9.211490631103516, "global_step": 85795, "epoch": 510} {"train_loss": -9.36777114868164, "global_step": 85796, "epoch": 510} {"train_loss": -9.08047103881836, "global_step": 85797, "epoch": 510} {"train_loss": -9.413387298583984, "global_step": 85798, "epoch": 510} {"train_loss": -9.233325004577637, "global_step": 85799, "epoch": 510} {"train_loss": -9.439474105834961, "global_step": 85800, "epoch": 510} {"train_loss": -8.819011688232422, "global_step": 85801, "epoch": 510} {"train_loss": -8.919750213623047, "global_step": 85802, "epoch": 510} {"train_loss": -8.990553855895996, "global_step": 85803, "epoch": 510} {"train_loss": -9.168404579162598, "global_step": 85804, "epoch": 510} {"train_loss": -9.107440948486328, "global_step": 85805, "epoch": 510} {"train_loss": -8.822336196899414, "global_step": 85806, "epoch": 510} {"train_loss": -9.149686813354492, "global_step": 85807, "epoch": 510} {"train_loss": -9.003120422363281, "global_step": 85808, "epoch": 510} {"train_loss": -9.029911041259766, "global_step": 85809, "epoch": 510} {"train_loss": -9.3475341796875, "global_step": 85810, "epoch": 510} {"train_loss": -9.164703369140625, "global_step": 85811, "epoch": 510} {"train_loss": -9.16026782989502, "global_step": 85812, "epoch": 510} {"train_loss": -9.229732513427734, "global_step": 85813, "epoch": 510} {"train_loss": -9.2730712890625, "global_step": 85814, "epoch": 510} {"train_loss": -9.176027297973633, "global_step": 85815, "epoch": 510} {"train_loss": -9.342713356018066, "global_step": 85816, "epoch": 510} {"train_loss": -9.127042770385742, "global_step": 85817, "epoch": 510} {"train_loss": -9.208108901977539, "global_step": 85818, "epoch": 510} {"train_loss": -9.225982666015625, "global_step": 85819, "epoch": 510} {"train_loss": -9.398931503295898, "global_step": 85820, "epoch": 510} {"train_loss": -9.155664443969727, "global_step": 85821, "epoch": 510} {"train_loss": -9.128795623779297, "global_step": 85822, "epoch": 510} {"train_loss": -9.488396644592285, "global_step": 85823, "epoch": 510} {"train_loss": -9.32038688659668, "global_step": 85824, "epoch": 510} {"train_loss": -9.343546867370605, "global_step": 85825, "epoch": 510} {"train_loss": -9.123493194580078, "global_step": 85826, "epoch": 510} {"train_loss": -9.41292953491211, "global_step": 85827, "epoch": 510} {"train_loss": -9.227054595947266, "global_step": 85828, "epoch": 510} {"train_loss": -9.194092750549316, "global_step": 85829, "epoch": 510} {"train_loss": -9.262100219726562, "global_step": 85830, "epoch": 510} {"train_loss": -9.180790901184082, "global_step": 85831, "epoch": 510} {"train_loss": -9.252159118652344, "global_step": 85832, "epoch": 510} {"train_loss": -9.487715721130371, "global_step": 85833, "epoch": 510} {"train_loss": -9.450891494750977, "global_step": 85834, "epoch": 510} {"train_loss": -9.239048957824707, "global_step": 85835, "epoch": 510} {"train_loss": -9.199732780456543, "global_step": 85836, "epoch": 510} {"train_loss": -9.420755386352539, "global_step": 85837, "epoch": 510} {"train_loss": -9.41874885559082, "global_step": 85838, "epoch": 510} {"train_loss": -9.478132247924805, "global_step": 85839, "epoch": 510} {"train_loss": -9.277961730957031, "global_step": 85840, "epoch": 510} {"train_loss": -9.446125030517578, "global_step": 85841, "epoch": 510} {"train_loss": -9.413761138916016, "global_step": 85842, "epoch": 510} {"train_loss": -9.253040313720703, "global_step": 85843, "epoch": 510} {"train_loss": -9.49428939819336, "global_step": 85844, "epoch": 510} {"train_loss": -9.222593307495117, "global_step": 85845, "epoch": 510} {"train_loss": -9.422449111938477, "global_step": 85846, "epoch": 510} {"train_loss": -9.28903457664308, "global_step": 85847, "epoch": 510, "val_loss": 201440.890625, "train_action_mse_error": 5.280429363250732} {"train_loss": -8.953778266906738, "global_step": 85848, "epoch": 511} {"train_loss": -9.33315658569336, "global_step": 85849, "epoch": 511} {"train_loss": -8.997781753540039, "global_step": 85850, "epoch": 511} {"train_loss": -9.391706466674805, "global_step": 85851, "epoch": 511} {"train_loss": -8.876321792602539, "global_step": 85852, "epoch": 511} {"train_loss": -9.155461311340332, "global_step": 85853, "epoch": 511} {"train_loss": -9.280211448669434, "global_step": 85854, "epoch": 511} {"train_loss": -9.045829772949219, "global_step": 85855, "epoch": 511} {"train_loss": -9.29841136932373, "global_step": 85856, "epoch": 511} {"train_loss": -9.260607719421387, "global_step": 85857, "epoch": 511} {"train_loss": -9.021717071533203, "global_step": 85858, "epoch": 511} {"train_loss": -9.14842414855957, "global_step": 85859, "epoch": 511} {"train_loss": -9.17527961730957, "global_step": 85860, "epoch": 511} {"train_loss": -8.999421119689941, "global_step": 85861, "epoch": 511} {"train_loss": -9.188075065612793, "global_step": 85862, "epoch": 511} {"train_loss": -9.098531723022461, "global_step": 85863, "epoch": 511} {"train_loss": -8.968311309814453, "global_step": 85864, "epoch": 511} {"train_loss": -9.404640197753906, "global_step": 85865, "epoch": 511} {"train_loss": -8.953987121582031, "global_step": 85866, "epoch": 511} {"train_loss": -9.57185173034668, "global_step": 85867, "epoch": 511} {"train_loss": -9.225739479064941, "global_step": 85868, "epoch": 511} {"train_loss": -9.128417015075684, "global_step": 85869, "epoch": 511} {"train_loss": -9.282106399536133, "global_step": 85870, "epoch": 511} {"train_loss": -9.2849760055542, "global_step": 85871, "epoch": 511} {"train_loss": -9.453731536865234, "global_step": 85872, "epoch": 511} {"train_loss": -9.583396911621094, "global_step": 85873, "epoch": 511} {"train_loss": -9.299407958984375, "global_step": 85874, "epoch": 511} {"train_loss": -9.579449653625488, "global_step": 85875, "epoch": 511} {"train_loss": -9.34553050994873, "global_step": 85876, "epoch": 511} {"train_loss": -9.298669815063477, "global_step": 85877, "epoch": 511} {"train_loss": -9.051675796508789, "global_step": 85878, "epoch": 511} {"train_loss": -9.28327751159668, "global_step": 85879, "epoch": 511} {"train_loss": -9.276651382446289, "global_step": 85880, "epoch": 511} {"train_loss": -9.323484420776367, "global_step": 85881, "epoch": 511} {"train_loss": -9.529762268066406, "global_step": 85882, "epoch": 511} {"train_loss": -9.212995529174805, "global_step": 85883, "epoch": 511} {"train_loss": -9.529661178588867, "global_step": 85884, "epoch": 511} {"train_loss": -9.384084701538086, "global_step": 85885, "epoch": 511} {"train_loss": -9.405693054199219, "global_step": 85886, "epoch": 511} {"train_loss": -9.515241622924805, "global_step": 85887, "epoch": 511} {"train_loss": -9.566694259643555, "global_step": 85888, "epoch": 511} {"train_loss": -9.45764446258545, "global_step": 85889, "epoch": 511} {"train_loss": -9.419811248779297, "global_step": 85890, "epoch": 511} {"train_loss": -9.42074966430664, "global_step": 85891, "epoch": 511} {"train_loss": -9.687711715698242, "global_step": 85892, "epoch": 511} {"train_loss": -9.084237098693848, "global_step": 85893, "epoch": 511} {"train_loss": -9.44138240814209, "global_step": 85894, "epoch": 511} {"train_loss": -9.250497817993164, "global_step": 85895, "epoch": 511} {"train_loss": -9.442278861999512, "global_step": 85896, "epoch": 511} {"train_loss": -8.850411415100098, "global_step": 85897, "epoch": 511} {"train_loss": -9.311500549316406, "global_step": 85898, "epoch": 511} {"train_loss": -9.114995002746582, "global_step": 85899, "epoch": 511} {"train_loss": -9.307534217834473, "global_step": 85900, "epoch": 511} {"train_loss": -9.160479545593262, "global_step": 85901, "epoch": 511} {"train_loss": -9.001221656799316, "global_step": 85902, "epoch": 511} {"train_loss": -9.269129753112793, "global_step": 85903, "epoch": 511} {"train_loss": -9.266495704650879, "global_step": 85904, "epoch": 511} {"train_loss": -9.228742599487305, "global_step": 85905, "epoch": 511} {"train_loss": -9.106017112731934, "global_step": 85906, "epoch": 511} {"train_loss": -9.313095092773438, "global_step": 85907, "epoch": 511} {"train_loss": -8.888404846191406, "global_step": 85908, "epoch": 511} {"train_loss": -9.424610137939453, "global_step": 85909, "epoch": 511} {"train_loss": -8.972585678100586, "global_step": 85910, "epoch": 511} {"train_loss": -9.125833511352539, "global_step": 85911, "epoch": 511} {"train_loss": -9.067419052124023, "global_step": 85912, "epoch": 511} {"train_loss": -9.075550079345703, "global_step": 85913, "epoch": 511} {"train_loss": -8.97982406616211, "global_step": 85914, "epoch": 511} {"train_loss": -9.08115005493164, "global_step": 85915, "epoch": 511} {"train_loss": -9.198116302490234, "global_step": 85916, "epoch": 511} {"train_loss": -9.039971351623535, "global_step": 85917, "epoch": 511} {"train_loss": -9.119215965270996, "global_step": 85918, "epoch": 511} {"train_loss": -9.388906478881836, "global_step": 85919, "epoch": 511} {"train_loss": -9.07192611694336, "global_step": 85920, "epoch": 511} {"train_loss": -9.027019500732422, "global_step": 85921, "epoch": 511} {"train_loss": -9.130411148071289, "global_step": 85922, "epoch": 511} {"train_loss": -9.245247840881348, "global_step": 85923, "epoch": 511} {"train_loss": -9.259973526000977, "global_step": 85924, "epoch": 511} {"train_loss": -9.216156959533691, "global_step": 85925, "epoch": 511} {"train_loss": -9.218067169189453, "global_step": 85926, "epoch": 511} {"train_loss": -9.259840965270996, "global_step": 85927, "epoch": 511} {"train_loss": -9.23323917388916, "global_step": 85928, "epoch": 511} {"train_loss": -9.12234115600586, "global_step": 85929, "epoch": 511} {"train_loss": -9.37271499633789, "global_step": 85930, "epoch": 511} {"train_loss": -9.00712776184082, "global_step": 85931, "epoch": 511} {"train_loss": -9.288885116577148, "global_step": 85932, "epoch": 511} {"train_loss": -9.332544326782227, "global_step": 85933, "epoch": 511} {"train_loss": -9.417915344238281, "global_step": 85934, "epoch": 511} {"train_loss": -9.328276634216309, "global_step": 85935, "epoch": 511} {"train_loss": -9.08626651763916, "global_step": 85936, "epoch": 511} {"train_loss": -9.46410846710205, "global_step": 85937, "epoch": 511} {"train_loss": -9.317717552185059, "global_step": 85938, "epoch": 511} {"train_loss": -9.298656463623047, "global_step": 85939, "epoch": 511} {"train_loss": -9.578328132629395, "global_step": 85940, "epoch": 511} {"train_loss": -9.375198364257812, "global_step": 85941, "epoch": 511} {"train_loss": -9.380973815917969, "global_step": 85942, "epoch": 511} {"train_loss": -9.530075073242188, "global_step": 85943, "epoch": 511} {"train_loss": -9.18016242980957, "global_step": 85944, "epoch": 511} {"train_loss": -9.476807594299316, "global_step": 85945, "epoch": 511} {"train_loss": -9.459697723388672, "global_step": 85946, "epoch": 511} {"train_loss": -9.552994728088379, "global_step": 85947, "epoch": 511} {"train_loss": -9.587400436401367, "global_step": 85948, "epoch": 511} {"train_loss": -9.396025657653809, "global_step": 85949, "epoch": 511} {"train_loss": -9.749595642089844, "global_step": 85950, "epoch": 511} {"train_loss": -8.998804092407227, "global_step": 85951, "epoch": 511} {"train_loss": -9.182016372680664, "global_step": 85952, "epoch": 511} {"train_loss": -9.438455581665039, "global_step": 85953, "epoch": 511} {"train_loss": -9.451841354370117, "global_step": 85954, "epoch": 511} {"train_loss": -9.500541687011719, "global_step": 85955, "epoch": 511} {"train_loss": -9.431182861328125, "global_step": 85956, "epoch": 511} {"train_loss": -9.292154312133789, "global_step": 85957, "epoch": 511} {"train_loss": -9.379539489746094, "global_step": 85958, "epoch": 511} {"train_loss": -9.163236618041992, "global_step": 85959, "epoch": 511} {"train_loss": -8.99072551727295, "global_step": 85960, "epoch": 511} {"train_loss": -9.542430877685547, "global_step": 85961, "epoch": 511} {"train_loss": -8.935647964477539, "global_step": 85962, "epoch": 511} {"train_loss": -9.096037864685059, "global_step": 85963, "epoch": 511} {"train_loss": -8.995294570922852, "global_step": 85964, "epoch": 511} {"train_loss": -8.872068405151367, "global_step": 85965, "epoch": 511} {"train_loss": -8.815971374511719, "global_step": 85966, "epoch": 511} {"train_loss": -8.825311660766602, "global_step": 85967, "epoch": 511} {"train_loss": -9.25314712524414, "global_step": 85968, "epoch": 511} {"train_loss": -8.760705947875977, "global_step": 85969, "epoch": 511} {"train_loss": -9.208860397338867, "global_step": 85970, "epoch": 511} {"train_loss": -9.178339004516602, "global_step": 85971, "epoch": 511} {"train_loss": -9.362743377685547, "global_step": 85972, "epoch": 511} {"train_loss": -8.986017227172852, "global_step": 85973, "epoch": 511} {"train_loss": -9.251520156860352, "global_step": 85974, "epoch": 511} {"train_loss": -8.736433029174805, "global_step": 85975, "epoch": 511} {"train_loss": -9.256573677062988, "global_step": 85976, "epoch": 511} {"train_loss": -9.231280326843262, "global_step": 85977, "epoch": 511} {"train_loss": -8.935964584350586, "global_step": 85978, "epoch": 511} {"train_loss": -9.233881950378418, "global_step": 85979, "epoch": 511} {"train_loss": -9.173673629760742, "global_step": 85980, "epoch": 511} {"train_loss": -9.000593185424805, "global_step": 85981, "epoch": 511} {"train_loss": -9.200202941894531, "global_step": 85982, "epoch": 511} {"train_loss": -9.187216758728027, "global_step": 85983, "epoch": 511} {"train_loss": -9.540565490722656, "global_step": 85984, "epoch": 511} {"train_loss": -8.986257553100586, "global_step": 85985, "epoch": 511} {"train_loss": -9.402566909790039, "global_step": 85986, "epoch": 511} {"train_loss": -9.26390266418457, "global_step": 85987, "epoch": 511} {"train_loss": -9.176145553588867, "global_step": 85988, "epoch": 511} {"train_loss": -9.186992645263672, "global_step": 85989, "epoch": 511} {"train_loss": -9.262543678283691, "global_step": 85990, "epoch": 511} {"train_loss": -9.400762557983398, "global_step": 85991, "epoch": 511} {"train_loss": -9.436382293701172, "global_step": 85992, "epoch": 511} {"train_loss": -9.388716697692871, "global_step": 85993, "epoch": 511} {"train_loss": -9.271800994873047, "global_step": 85994, "epoch": 511} {"train_loss": -9.422162055969238, "global_step": 85995, "epoch": 511} {"train_loss": -8.855297088623047, "global_step": 85996, "epoch": 511} {"train_loss": -9.583829879760742, "global_step": 85997, "epoch": 511} {"train_loss": -9.290766716003418, "global_step": 85998, "epoch": 511} {"train_loss": -9.441289901733398, "global_step": 85999, "epoch": 511} {"train_loss": -9.463621139526367, "global_step": 86000, "epoch": 511} {"train_loss": -9.365368843078613, "global_step": 86001, "epoch": 511} {"train_loss": -9.467357635498047, "global_step": 86002, "epoch": 511} {"train_loss": -9.460165023803711, "global_step": 86003, "epoch": 511} {"train_loss": -9.242259979248047, "global_step": 86004, "epoch": 511} {"train_loss": -9.458711624145508, "global_step": 86005, "epoch": 511} {"train_loss": -9.394001007080078, "global_step": 86006, "epoch": 511} {"train_loss": -9.589486122131348, "global_step": 86007, "epoch": 511} {"train_loss": -9.547863960266113, "global_step": 86008, "epoch": 511} {"train_loss": -9.404691696166992, "global_step": 86009, "epoch": 511} {"train_loss": -9.666132926940918, "global_step": 86010, "epoch": 511} {"train_loss": -9.446464538574219, "global_step": 86011, "epoch": 511} {"train_loss": -9.733932495117188, "global_step": 86012, "epoch": 511} {"train_loss": -9.286293029785156, "global_step": 86013, "epoch": 511} {"train_loss": -9.54831600189209, "global_step": 86014, "epoch": 511} {"train_loss": -9.265181830951146, "global_step": 86015, "epoch": 511, "val_loss": 202307.8125} {"train_loss": -9.504115104675293, "global_step": 86016, "epoch": 512} {"train_loss": -9.241987228393555, "global_step": 86017, "epoch": 512} {"train_loss": -9.266040802001953, "global_step": 86018, "epoch": 512} {"train_loss": -9.411127090454102, "global_step": 86019, "epoch": 512} {"train_loss": -9.242801666259766, "global_step": 86020, "epoch": 512} {"train_loss": -9.040372848510742, "global_step": 86021, "epoch": 512} {"train_loss": -9.570266723632812, "global_step": 86022, "epoch": 512} {"train_loss": -9.466705322265625, "global_step": 86023, "epoch": 512} {"train_loss": -9.529964447021484, "global_step": 86024, "epoch": 512} {"train_loss": -9.395872116088867, "global_step": 86025, "epoch": 512} {"train_loss": -9.31728744506836, "global_step": 86026, "epoch": 512} {"train_loss": -9.683204650878906, "global_step": 86027, "epoch": 512} {"train_loss": -9.579498291015625, "global_step": 86028, "epoch": 512} {"train_loss": -9.457345962524414, "global_step": 86029, "epoch": 512} {"train_loss": -9.533127784729004, "global_step": 86030, "epoch": 512} {"train_loss": -9.514535903930664, "global_step": 86031, "epoch": 512} {"train_loss": -9.483174324035645, "global_step": 86032, "epoch": 512} {"train_loss": -9.615337371826172, "global_step": 86033, "epoch": 512} {"train_loss": -9.119342803955078, "global_step": 86034, "epoch": 512} {"train_loss": -9.35441780090332, "global_step": 86035, "epoch": 512} {"train_loss": -9.471365928649902, "global_step": 86036, "epoch": 512} {"train_loss": -9.349139213562012, "global_step": 86037, "epoch": 512} {"train_loss": -9.399550437927246, "global_step": 86038, "epoch": 512} {"train_loss": -8.822094917297363, "global_step": 86039, "epoch": 512} {"train_loss": -9.390382766723633, "global_step": 86040, "epoch": 512} {"train_loss": -9.42819595336914, "global_step": 86041, "epoch": 512} {"train_loss": -9.34138011932373, "global_step": 86042, "epoch": 512} {"train_loss": -9.405675888061523, "global_step": 86043, "epoch": 512} {"train_loss": -9.407614707946777, "global_step": 86044, "epoch": 512} {"train_loss": -9.402131080627441, "global_step": 86045, "epoch": 512} {"train_loss": -9.14034652709961, "global_step": 86046, "epoch": 512} {"train_loss": -9.572399139404297, "global_step": 86047, "epoch": 512} {"train_loss": -9.43989372253418, "global_step": 86048, "epoch": 512} {"train_loss": -9.233098030090332, "global_step": 86049, "epoch": 512} {"train_loss": -9.45280647277832, "global_step": 86050, "epoch": 512} {"train_loss": -9.243707656860352, "global_step": 86051, "epoch": 512} {"train_loss": -9.319744110107422, "global_step": 86052, "epoch": 512} {"train_loss": -9.282062530517578, "global_step": 86053, "epoch": 512} {"train_loss": -9.035747528076172, "global_step": 86054, "epoch": 512} {"train_loss": -9.406993865966797, "global_step": 86055, "epoch": 512} {"train_loss": -9.311338424682617, "global_step": 86056, "epoch": 512} {"train_loss": -9.19265079498291, "global_step": 86057, "epoch": 512} {"train_loss": -9.462746620178223, "global_step": 86058, "epoch": 512} {"train_loss": -9.38558292388916, "global_step": 86059, "epoch": 512} {"train_loss": -9.383241653442383, "global_step": 86060, "epoch": 512} {"train_loss": -9.544676780700684, "global_step": 86061, "epoch": 512} {"train_loss": -9.488340377807617, "global_step": 86062, "epoch": 512} {"train_loss": -9.27864933013916, "global_step": 86063, "epoch": 512} {"train_loss": -9.340301513671875, "global_step": 86064, "epoch": 512} {"train_loss": -9.090182304382324, "global_step": 86065, "epoch": 512} {"train_loss": -9.471746444702148, "global_step": 86066, "epoch": 512} {"train_loss": -9.384235382080078, "global_step": 86067, "epoch": 512} {"train_loss": -9.370233535766602, "global_step": 86068, "epoch": 512} {"train_loss": -9.127470016479492, "global_step": 86069, "epoch": 512} {"train_loss": -9.169229507446289, "global_step": 86070, "epoch": 512} {"train_loss": -9.323781967163086, "global_step": 86071, "epoch": 512} {"train_loss": -9.605941772460938, "global_step": 86072, "epoch": 512} {"train_loss": -9.22816276550293, "global_step": 86073, "epoch": 512} {"train_loss": -9.290178298950195, "global_step": 86074, "epoch": 512} {"train_loss": -9.40639591217041, "global_step": 86075, "epoch": 512} {"train_loss": -9.371770858764648, "global_step": 86076, "epoch": 512} {"train_loss": -9.615720748901367, "global_step": 86077, "epoch": 512} {"train_loss": -9.089777946472168, "global_step": 86078, "epoch": 512} {"train_loss": -9.380817413330078, "global_step": 86079, "epoch": 512} {"train_loss": -9.287653923034668, "global_step": 86080, "epoch": 512} {"train_loss": -9.490482330322266, "global_step": 86081, "epoch": 512} {"train_loss": -9.425613403320312, "global_step": 86082, "epoch": 512} {"train_loss": -9.423094749450684, "global_step": 86083, "epoch": 512} {"train_loss": -9.355354309082031, "global_step": 86084, "epoch": 512} {"train_loss": -9.271108627319336, "global_step": 86085, "epoch": 512} {"train_loss": -9.488990783691406, "global_step": 86086, "epoch": 512} {"train_loss": -9.389702796936035, "global_step": 86087, "epoch": 512} {"train_loss": -9.546937942504883, "global_step": 86088, "epoch": 512} {"train_loss": -9.320063591003418, "global_step": 86089, "epoch": 512} {"train_loss": -9.170323371887207, "global_step": 86090, "epoch": 512} {"train_loss": -9.227200508117676, "global_step": 86091, "epoch": 512} {"train_loss": -9.173458099365234, "global_step": 86092, "epoch": 512} {"train_loss": -9.32080078125, "global_step": 86093, "epoch": 512} {"train_loss": -9.387731552124023, "global_step": 86094, "epoch": 512} {"train_loss": -9.470365524291992, "global_step": 86095, "epoch": 512} {"train_loss": -9.33792781829834, "global_step": 86096, "epoch": 512} {"train_loss": -9.469476699829102, "global_step": 86097, "epoch": 512} {"train_loss": -9.527244567871094, "global_step": 86098, "epoch": 512} {"train_loss": -9.343788146972656, "global_step": 86099, "epoch": 512} {"train_loss": -9.434873580932617, "global_step": 86100, "epoch": 512} {"train_loss": -9.346613883972168, "global_step": 86101, "epoch": 512} {"train_loss": -9.600601196289062, "global_step": 86102, "epoch": 512} {"train_loss": -9.595643043518066, "global_step": 86103, "epoch": 512} {"train_loss": -9.410557746887207, "global_step": 86104, "epoch": 512} {"train_loss": -9.346542358398438, "global_step": 86105, "epoch": 512} {"train_loss": -9.447450637817383, "global_step": 86106, "epoch": 512} {"train_loss": -9.541048049926758, "global_step": 86107, "epoch": 512} {"train_loss": -9.459243774414062, "global_step": 86108, "epoch": 512} {"train_loss": -9.259883880615234, "global_step": 86109, "epoch": 512} {"train_loss": -9.40957260131836, "global_step": 86110, "epoch": 512} {"train_loss": -9.142681121826172, "global_step": 86111, "epoch": 512} {"train_loss": -9.105461120605469, "global_step": 86112, "epoch": 512} {"train_loss": -9.650042533874512, "global_step": 86113, "epoch": 512} {"train_loss": -9.187610626220703, "global_step": 86114, "epoch": 512} {"train_loss": -9.178428649902344, "global_step": 86115, "epoch": 512} {"train_loss": -9.218484878540039, "global_step": 86116, "epoch": 512} {"train_loss": -9.226487159729004, "global_step": 86117, "epoch": 512} {"train_loss": -9.393377304077148, "global_step": 86118, "epoch": 512} {"train_loss": -8.858505249023438, "global_step": 86119, "epoch": 512} {"train_loss": -9.22041130065918, "global_step": 86120, "epoch": 512} {"train_loss": -9.557195663452148, "global_step": 86121, "epoch": 512} {"train_loss": -9.120271682739258, "global_step": 86122, "epoch": 512} {"train_loss": -9.26071834564209, "global_step": 86123, "epoch": 512} {"train_loss": -9.43678092956543, "global_step": 86124, "epoch": 512} {"train_loss": -9.404804229736328, "global_step": 86125, "epoch": 512} {"train_loss": -9.56191635131836, "global_step": 86126, "epoch": 512} {"train_loss": -9.344143867492676, "global_step": 86127, "epoch": 512} {"train_loss": -9.506251335144043, "global_step": 86128, "epoch": 512} {"train_loss": -9.420660018920898, "global_step": 86129, "epoch": 512} {"train_loss": -9.476114273071289, "global_step": 86130, "epoch": 512} {"train_loss": -9.47569465637207, "global_step": 86131, "epoch": 512} {"train_loss": -9.383036613464355, "global_step": 86132, "epoch": 512} {"train_loss": -9.511441230773926, "global_step": 86133, "epoch": 512} {"train_loss": -9.377195358276367, "global_step": 86134, "epoch": 512} {"train_loss": -9.510237693786621, "global_step": 86135, "epoch": 512} {"train_loss": -9.430490493774414, "global_step": 86136, "epoch": 512} {"train_loss": -9.40456771850586, "global_step": 86137, "epoch": 512} {"train_loss": -9.445554733276367, "global_step": 86138, "epoch": 512} {"train_loss": -9.30118179321289, "global_step": 86139, "epoch": 512} {"train_loss": -9.195169448852539, "global_step": 86140, "epoch": 512} {"train_loss": -9.411466598510742, "global_step": 86141, "epoch": 512} {"train_loss": -9.313577651977539, "global_step": 86142, "epoch": 512} {"train_loss": -9.302262306213379, "global_step": 86143, "epoch": 512} {"train_loss": -9.504936218261719, "global_step": 86144, "epoch": 512} {"train_loss": -9.218596458435059, "global_step": 86145, "epoch": 512} {"train_loss": -9.32436752319336, "global_step": 86146, "epoch": 512} {"train_loss": -9.495994567871094, "global_step": 86147, "epoch": 512} {"train_loss": -9.300294876098633, "global_step": 86148, "epoch": 512} {"train_loss": -9.342769622802734, "global_step": 86149, "epoch": 512} {"train_loss": -9.46914291381836, "global_step": 86150, "epoch": 512} {"train_loss": -9.039080619812012, "global_step": 86151, "epoch": 512} {"train_loss": -9.331887245178223, "global_step": 86152, "epoch": 512} {"train_loss": -9.1234769821167, "global_step": 86153, "epoch": 512} {"train_loss": -9.452433586120605, "global_step": 86154, "epoch": 512} {"train_loss": -9.063302040100098, "global_step": 86155, "epoch": 512} {"train_loss": -9.328474044799805, "global_step": 86156, "epoch": 512} {"train_loss": -9.319348335266113, "global_step": 86157, "epoch": 512} {"train_loss": -9.201241493225098, "global_step": 86158, "epoch": 512} {"train_loss": -9.145999908447266, "global_step": 86159, "epoch": 512} {"train_loss": -9.11825180053711, "global_step": 86160, "epoch": 512} {"train_loss": -9.290268898010254, "global_step": 86161, "epoch": 512} {"train_loss": -9.317869186401367, "global_step": 86162, "epoch": 512} {"train_loss": -9.256134033203125, "global_step": 86163, "epoch": 512} {"train_loss": -8.996492385864258, "global_step": 86164, "epoch": 512} {"train_loss": -9.310482025146484, "global_step": 86165, "epoch": 512} {"train_loss": -9.218812942504883, "global_step": 86166, "epoch": 512} {"train_loss": -8.812992095947266, "global_step": 86167, "epoch": 512} {"train_loss": -8.88530445098877, "global_step": 86168, "epoch": 512} {"train_loss": -8.804855346679688, "global_step": 86169, "epoch": 512} {"train_loss": -9.11417007446289, "global_step": 86170, "epoch": 512} {"train_loss": -8.931140899658203, "global_step": 86171, "epoch": 512} {"train_loss": -9.066610336303711, "global_step": 86172, "epoch": 512} {"train_loss": -9.316999435424805, "global_step": 86173, "epoch": 512} {"train_loss": -8.974591255187988, "global_step": 86174, "epoch": 512} {"train_loss": -9.234766960144043, "global_step": 86175, "epoch": 512} {"train_loss": -9.009710311889648, "global_step": 86176, "epoch": 512} {"train_loss": -8.884204864501953, "global_step": 86177, "epoch": 512} {"train_loss": -8.764823913574219, "global_step": 86178, "epoch": 512} {"train_loss": -9.305599212646484, "global_step": 86179, "epoch": 512} {"train_loss": -9.083578109741211, "global_step": 86180, "epoch": 512} {"train_loss": -9.013290405273438, "global_step": 86181, "epoch": 512} {"train_loss": -9.358207702636719, "global_step": 86182, "epoch": 512} {"train_loss": -9.317358181590127, "global_step": 86183, "epoch": 512, "val_loss": 199933.140625} {"train_loss": -9.333303451538086, "global_step": 86184, "epoch": 513} {"train_loss": -8.820422172546387, "global_step": 86185, "epoch": 513} {"train_loss": -8.952418327331543, "global_step": 86186, "epoch": 513} {"train_loss": -8.653801918029785, "global_step": 86187, "epoch": 513} {"train_loss": -9.232741355895996, "global_step": 86188, "epoch": 513} {"train_loss": -8.988903045654297, "global_step": 86189, "epoch": 513} {"train_loss": -9.182973861694336, "global_step": 86190, "epoch": 513} {"train_loss": -9.137887001037598, "global_step": 86191, "epoch": 513} {"train_loss": -9.246040344238281, "global_step": 86192, "epoch": 513} {"train_loss": -9.143580436706543, "global_step": 86193, "epoch": 513} {"train_loss": -9.254615783691406, "global_step": 86194, "epoch": 513} {"train_loss": -9.535356521606445, "global_step": 86195, "epoch": 513} {"train_loss": -9.484481811523438, "global_step": 86196, "epoch": 513} {"train_loss": -9.365087509155273, "global_step": 86197, "epoch": 513} {"train_loss": -9.332809448242188, "global_step": 86198, "epoch": 513} {"train_loss": -9.592108726501465, "global_step": 86199, "epoch": 513} {"train_loss": -9.482909202575684, "global_step": 86200, "epoch": 513} {"train_loss": -9.439215660095215, "global_step": 86201, "epoch": 513} {"train_loss": -9.45825481414795, "global_step": 86202, "epoch": 513} {"train_loss": -9.64543628692627, "global_step": 86203, "epoch": 513} {"train_loss": -9.268632888793945, "global_step": 86204, "epoch": 513} {"train_loss": -9.43696403503418, "global_step": 86205, "epoch": 513} {"train_loss": -9.075019836425781, "global_step": 86206, "epoch": 513} {"train_loss": -9.58977222442627, "global_step": 86207, "epoch": 513} {"train_loss": -9.440858840942383, "global_step": 86208, "epoch": 513} {"train_loss": -9.461902618408203, "global_step": 86209, "epoch": 513} {"train_loss": -9.586713790893555, "global_step": 86210, "epoch": 513} {"train_loss": -9.464452743530273, "global_step": 86211, "epoch": 513} {"train_loss": -9.484598159790039, "global_step": 86212, "epoch": 513} {"train_loss": -9.493085861206055, "global_step": 86213, "epoch": 513} {"train_loss": -9.456328392028809, "global_step": 86214, "epoch": 513} {"train_loss": -9.431673049926758, "global_step": 86215, "epoch": 513} {"train_loss": -9.27239990234375, "global_step": 86216, "epoch": 513} {"train_loss": -9.371503829956055, "global_step": 86217, "epoch": 513} {"train_loss": -9.438810348510742, "global_step": 86218, "epoch": 513} {"train_loss": -9.329706192016602, "global_step": 86219, "epoch": 513} {"train_loss": -9.44749641418457, "global_step": 86220, "epoch": 513} {"train_loss": -9.598487854003906, "global_step": 86221, "epoch": 513} {"train_loss": -9.217288970947266, "global_step": 86222, "epoch": 513} {"train_loss": -9.2877836227417, "global_step": 86223, "epoch": 513} {"train_loss": -9.232940673828125, "global_step": 86224, "epoch": 513} {"train_loss": -9.136998176574707, "global_step": 86225, "epoch": 513} {"train_loss": -9.61545181274414, "global_step": 86226, "epoch": 513} {"train_loss": -9.541366577148438, "global_step": 86227, "epoch": 513} {"train_loss": -9.127647399902344, "global_step": 86228, "epoch": 513} {"train_loss": -9.490276336669922, "global_step": 86229, "epoch": 513} {"train_loss": -8.870121955871582, "global_step": 86230, "epoch": 513} {"train_loss": -9.337328910827637, "global_step": 86231, "epoch": 513} {"train_loss": -9.294071197509766, "global_step": 86232, "epoch": 513} {"train_loss": -9.174174308776855, "global_step": 86233, "epoch": 513} {"train_loss": -9.13125991821289, "global_step": 86234, "epoch": 513} {"train_loss": -9.355957984924316, "global_step": 86235, "epoch": 513} {"train_loss": -9.449756622314453, "global_step": 86236, "epoch": 513} {"train_loss": -9.144487380981445, "global_step": 86237, "epoch": 513} {"train_loss": -9.275617599487305, "global_step": 86238, "epoch": 513} {"train_loss": -9.131811141967773, "global_step": 86239, "epoch": 513} {"train_loss": -9.186298370361328, "global_step": 86240, "epoch": 513} {"train_loss": -9.269502639770508, "global_step": 86241, "epoch": 513} {"train_loss": -9.397269248962402, "global_step": 86242, "epoch": 513} {"train_loss": -9.06617546081543, "global_step": 86243, "epoch": 513} {"train_loss": -9.384016036987305, "global_step": 86244, "epoch": 513} {"train_loss": -9.337303161621094, "global_step": 86245, "epoch": 513} {"train_loss": -8.868897438049316, "global_step": 86246, "epoch": 513} {"train_loss": -9.042741775512695, "global_step": 86247, "epoch": 513} {"train_loss": -9.437265396118164, "global_step": 86248, "epoch": 513} {"train_loss": -8.919391632080078, "global_step": 86249, "epoch": 513} {"train_loss": -9.255805969238281, "global_step": 86250, "epoch": 513} {"train_loss": -9.304937362670898, "global_step": 86251, "epoch": 513} {"train_loss": -9.32723617553711, "global_step": 86252, "epoch": 513} {"train_loss": -9.152799606323242, "global_step": 86253, "epoch": 513} {"train_loss": -9.272268295288086, "global_step": 86254, "epoch": 513} {"train_loss": -9.325075149536133, "global_step": 86255, "epoch": 513} {"train_loss": -9.165313720703125, "global_step": 86256, "epoch": 513} {"train_loss": -9.215206146240234, "global_step": 86257, "epoch": 513} {"train_loss": -9.339735984802246, "global_step": 86258, "epoch": 513} {"train_loss": -9.1826810836792, "global_step": 86259, "epoch": 513} {"train_loss": -9.319904327392578, "global_step": 86260, "epoch": 513} {"train_loss": -9.280508041381836, "global_step": 86261, "epoch": 513} {"train_loss": -9.249931335449219, "global_step": 86262, "epoch": 513} {"train_loss": -9.352730751037598, "global_step": 86263, "epoch": 513} {"train_loss": -9.144983291625977, "global_step": 86264, "epoch": 513} {"train_loss": -9.38287353515625, "global_step": 86265, "epoch": 513} {"train_loss": -8.932503700256348, "global_step": 86266, "epoch": 513} {"train_loss": -9.321887969970703, "global_step": 86267, "epoch": 513} {"train_loss": -9.247329711914062, "global_step": 86268, "epoch": 513} {"train_loss": -9.174930572509766, "global_step": 86269, "epoch": 513} {"train_loss": -9.031246185302734, "global_step": 86270, "epoch": 513} {"train_loss": -9.280701637268066, "global_step": 86271, "epoch": 513} {"train_loss": -9.336135864257812, "global_step": 86272, "epoch": 513} {"train_loss": -9.149797439575195, "global_step": 86273, "epoch": 513} {"train_loss": -9.252033233642578, "global_step": 86274, "epoch": 513} {"train_loss": -8.945682525634766, "global_step": 86275, "epoch": 513} {"train_loss": -9.588079452514648, "global_step": 86276, "epoch": 513} {"train_loss": -8.78215217590332, "global_step": 86277, "epoch": 513} {"train_loss": -9.337579727172852, "global_step": 86278, "epoch": 513} {"train_loss": -9.225095748901367, "global_step": 86279, "epoch": 513} {"train_loss": -9.132575988769531, "global_step": 86280, "epoch": 513} {"train_loss": -9.215873718261719, "global_step": 86281, "epoch": 513} {"train_loss": -9.180124282836914, "global_step": 86282, "epoch": 513} {"train_loss": -9.371221542358398, "global_step": 86283, "epoch": 513} {"train_loss": -9.148797035217285, "global_step": 86284, "epoch": 513} {"train_loss": -9.41663932800293, "global_step": 86285, "epoch": 513} {"train_loss": -9.319380760192871, "global_step": 86286, "epoch": 513} {"train_loss": -9.057319641113281, "global_step": 86287, "epoch": 513} {"train_loss": -9.302031517028809, "global_step": 86288, "epoch": 513} {"train_loss": -9.116819381713867, "global_step": 86289, "epoch": 513} {"train_loss": -8.927000045776367, "global_step": 86290, "epoch": 513} {"train_loss": -8.896814346313477, "global_step": 86291, "epoch": 513} {"train_loss": -9.24305534362793, "global_step": 86292, "epoch": 513} {"train_loss": -9.133768081665039, "global_step": 86293, "epoch": 513} {"train_loss": -9.242959976196289, "global_step": 86294, "epoch": 513} {"train_loss": -9.050821304321289, "global_step": 86295, "epoch": 513} {"train_loss": -9.233097076416016, "global_step": 86296, "epoch": 513} {"train_loss": -9.199427604675293, "global_step": 86297, "epoch": 513} {"train_loss": -9.198830604553223, "global_step": 86298, "epoch": 513} {"train_loss": -9.52814769744873, "global_step": 86299, "epoch": 513} {"train_loss": -9.319744110107422, "global_step": 86300, "epoch": 513} {"train_loss": -9.071075439453125, "global_step": 86301, "epoch": 513} {"train_loss": -9.451691627502441, "global_step": 86302, "epoch": 513} {"train_loss": -9.152250289916992, "global_step": 86303, "epoch": 513} {"train_loss": -9.25256633758545, "global_step": 86304, "epoch": 513} {"train_loss": -9.345166206359863, "global_step": 86305, "epoch": 513} {"train_loss": -9.198368072509766, "global_step": 86306, "epoch": 513} {"train_loss": -9.019363403320312, "global_step": 86307, "epoch": 513} {"train_loss": -9.362621307373047, "global_step": 86308, "epoch": 513} {"train_loss": -8.971288681030273, "global_step": 86309, "epoch": 513} {"train_loss": -9.171802520751953, "global_step": 86310, "epoch": 513} {"train_loss": -9.353341102600098, "global_step": 86311, "epoch": 513} {"train_loss": -9.461959838867188, "global_step": 86312, "epoch": 513} {"train_loss": -9.176636695861816, "global_step": 86313, "epoch": 513} {"train_loss": -9.35340690612793, "global_step": 86314, "epoch": 513} {"train_loss": -9.432125091552734, "global_step": 86315, "epoch": 513} {"train_loss": -9.446624755859375, "global_step": 86316, "epoch": 513} {"train_loss": -9.000032424926758, "global_step": 86317, "epoch": 513} {"train_loss": -9.287031173706055, "global_step": 86318, "epoch": 513} {"train_loss": -9.157086372375488, "global_step": 86319, "epoch": 513} {"train_loss": -9.297197341918945, "global_step": 86320, "epoch": 513} {"train_loss": -9.217733383178711, "global_step": 86321, "epoch": 513} {"train_loss": -9.192278861999512, "global_step": 86322, "epoch": 513} {"train_loss": -9.167281150817871, "global_step": 86323, "epoch": 513} {"train_loss": -9.31533432006836, "global_step": 86324, "epoch": 513} {"train_loss": -9.223527908325195, "global_step": 86325, "epoch": 513} {"train_loss": -9.064687728881836, "global_step": 86326, "epoch": 513} {"train_loss": -9.185808181762695, "global_step": 86327, "epoch": 513} {"train_loss": -9.081453323364258, "global_step": 86328, "epoch": 513} {"train_loss": -9.175010681152344, "global_step": 86329, "epoch": 513} {"train_loss": -9.111932754516602, "global_step": 86330, "epoch": 513} {"train_loss": -9.343074798583984, "global_step": 86331, "epoch": 513} {"train_loss": -9.426321029663086, "global_step": 86332, "epoch": 513} {"train_loss": -9.432241439819336, "global_step": 86333, "epoch": 513} {"train_loss": -9.34924030303955, "global_step": 86334, "epoch": 513} {"train_loss": -9.259744644165039, "global_step": 86335, "epoch": 513} {"train_loss": -9.518207550048828, "global_step": 86336, "epoch": 513} {"train_loss": -9.32646369934082, "global_step": 86337, "epoch": 513} {"train_loss": -9.219420433044434, "global_step": 86338, "epoch": 513} {"train_loss": -9.377754211425781, "global_step": 86339, "epoch": 513} {"train_loss": -9.303966522216797, "global_step": 86340, "epoch": 513} {"train_loss": -9.591212272644043, "global_step": 86341, "epoch": 513} {"train_loss": -9.610604286193848, "global_step": 86342, "epoch": 513} {"train_loss": -9.500616073608398, "global_step": 86343, "epoch": 513} {"train_loss": -9.636642456054688, "global_step": 86344, "epoch": 513} {"train_loss": -9.345495223999023, "global_step": 86345, "epoch": 513} {"train_loss": -9.265859603881836, "global_step": 86346, "epoch": 513} {"train_loss": -9.306546211242676, "global_step": 86347, "epoch": 513} {"train_loss": -9.390687942504883, "global_step": 86348, "epoch": 513} {"train_loss": -9.276437759399414, "global_step": 86349, "epoch": 513} {"train_loss": -9.692588806152344, "global_step": 86350, "epoch": 513} {"train_loss": -9.272772431373596, "global_step": 86351, "epoch": 513, "val_loss": 199350.84375} {"train_loss": -9.245346069335938, "global_step": 86352, "epoch": 514} {"train_loss": -9.199411392211914, "global_step": 86353, "epoch": 514} {"train_loss": -9.140581130981445, "global_step": 86354, "epoch": 514} {"train_loss": -9.324783325195312, "global_step": 86355, "epoch": 514} {"train_loss": -9.263492584228516, "global_step": 86356, "epoch": 514} {"train_loss": -8.997201919555664, "global_step": 86357, "epoch": 514} {"train_loss": -9.063529014587402, "global_step": 86358, "epoch": 514} {"train_loss": -9.377326011657715, "global_step": 86359, "epoch": 514} {"train_loss": -9.089909553527832, "global_step": 86360, "epoch": 514} {"train_loss": -9.465455055236816, "global_step": 86361, "epoch": 514} {"train_loss": -9.389509201049805, "global_step": 86362, "epoch": 514} {"train_loss": -9.090782165527344, "global_step": 86363, "epoch": 514} {"train_loss": -9.512670516967773, "global_step": 86364, "epoch": 514} {"train_loss": -9.141742706298828, "global_step": 86365, "epoch": 514} {"train_loss": -9.585827827453613, "global_step": 86366, "epoch": 514} {"train_loss": -9.598051071166992, "global_step": 86367, "epoch": 514} {"train_loss": -9.405231475830078, "global_step": 86368, "epoch": 514} {"train_loss": -9.416585922241211, "global_step": 86369, "epoch": 514} {"train_loss": -9.381624221801758, "global_step": 86370, "epoch": 514} {"train_loss": -9.41842269897461, "global_step": 86371, "epoch": 514} {"train_loss": -9.524474143981934, "global_step": 86372, "epoch": 514} {"train_loss": -9.079656600952148, "global_step": 86373, "epoch": 514} {"train_loss": -9.09967041015625, "global_step": 86374, "epoch": 514} {"train_loss": -9.393697738647461, "global_step": 86375, "epoch": 514} {"train_loss": -9.08881950378418, "global_step": 86376, "epoch": 514} {"train_loss": -9.3152437210083, "global_step": 86377, "epoch": 514} {"train_loss": -9.230925559997559, "global_step": 86378, "epoch": 514} {"train_loss": -9.162626266479492, "global_step": 86379, "epoch": 514} {"train_loss": -9.563716888427734, "global_step": 86380, "epoch": 514} {"train_loss": -9.071721076965332, "global_step": 86381, "epoch": 514} {"train_loss": -9.276686668395996, "global_step": 86382, "epoch": 514} {"train_loss": -9.560705184936523, "global_step": 86383, "epoch": 514} {"train_loss": -9.27169132232666, "global_step": 86384, "epoch": 514} {"train_loss": -9.275065422058105, "global_step": 86385, "epoch": 514} {"train_loss": -9.401288986206055, "global_step": 86386, "epoch": 514} {"train_loss": -9.089010238647461, "global_step": 86387, "epoch": 514} {"train_loss": -9.367252349853516, "global_step": 86388, "epoch": 514} {"train_loss": -9.35455322265625, "global_step": 86389, "epoch": 514} {"train_loss": -9.363455772399902, "global_step": 86390, "epoch": 514} {"train_loss": -9.304463386535645, "global_step": 86391, "epoch": 514} {"train_loss": -9.467462539672852, "global_step": 86392, "epoch": 514} {"train_loss": -9.479448318481445, "global_step": 86393, "epoch": 514} {"train_loss": -9.319530487060547, "global_step": 86394, "epoch": 514} {"train_loss": -9.455751419067383, "global_step": 86395, "epoch": 514} {"train_loss": -9.56573486328125, "global_step": 86396, "epoch": 514} {"train_loss": -9.211528778076172, "global_step": 86397, "epoch": 514} {"train_loss": -9.335227966308594, "global_step": 86398, "epoch": 514} {"train_loss": -9.536357879638672, "global_step": 86399, "epoch": 514} {"train_loss": -9.314501762390137, "global_step": 86400, "epoch": 514} {"train_loss": -9.413819313049316, "global_step": 86401, "epoch": 514} {"train_loss": -9.351354598999023, "global_step": 86402, "epoch": 514} {"train_loss": -9.316184043884277, "global_step": 86403, "epoch": 514} {"train_loss": -9.325239181518555, "global_step": 86404, "epoch": 514} {"train_loss": -9.229482650756836, "global_step": 86405, "epoch": 514} {"train_loss": -9.22126579284668, "global_step": 86406, "epoch": 514} {"train_loss": -9.448212623596191, "global_step": 86407, "epoch": 514} {"train_loss": -9.222330093383789, "global_step": 86408, "epoch": 514} {"train_loss": -9.636147499084473, "global_step": 86409, "epoch": 514} {"train_loss": -9.558094024658203, "global_step": 86410, "epoch": 514} {"train_loss": -9.221808433532715, "global_step": 86411, "epoch": 514} {"train_loss": -9.500840187072754, "global_step": 86412, "epoch": 514} {"train_loss": -9.255839347839355, "global_step": 86413, "epoch": 514} {"train_loss": -9.340633392333984, "global_step": 86414, "epoch": 514} {"train_loss": -9.39179801940918, "global_step": 86415, "epoch": 514} {"train_loss": -9.257723808288574, "global_step": 86416, "epoch": 514} {"train_loss": -9.454225540161133, "global_step": 86417, "epoch": 514} {"train_loss": -9.447547912597656, "global_step": 86418, "epoch": 514} {"train_loss": -9.413374900817871, "global_step": 86419, "epoch": 514} {"train_loss": -9.644950866699219, "global_step": 86420, "epoch": 514} {"train_loss": -9.437646865844727, "global_step": 86421, "epoch": 514} {"train_loss": -9.417825698852539, "global_step": 86422, "epoch": 514} {"train_loss": -9.322561264038086, "global_step": 86423, "epoch": 514} {"train_loss": -9.173645973205566, "global_step": 86424, "epoch": 514} {"train_loss": -9.39915657043457, "global_step": 86425, "epoch": 514} {"train_loss": -9.415349960327148, "global_step": 86426, "epoch": 514} {"train_loss": -9.461553573608398, "global_step": 86427, "epoch": 514} {"train_loss": -9.307350158691406, "global_step": 86428, "epoch": 514} {"train_loss": -9.423501968383789, "global_step": 86429, "epoch": 514} {"train_loss": -9.300411224365234, "global_step": 86430, "epoch": 514} {"train_loss": -9.546785354614258, "global_step": 86431, "epoch": 514} {"train_loss": -9.322425842285156, "global_step": 86432, "epoch": 514} {"train_loss": -9.141425132751465, "global_step": 86433, "epoch": 514} {"train_loss": -9.461170196533203, "global_step": 86434, "epoch": 514} {"train_loss": -9.233074188232422, "global_step": 86435, "epoch": 514} {"train_loss": -9.195291519165039, "global_step": 86436, "epoch": 514} {"train_loss": -9.31216812133789, "global_step": 86437, "epoch": 514} {"train_loss": -9.227922439575195, "global_step": 86438, "epoch": 514} {"train_loss": -9.409183502197266, "global_step": 86439, "epoch": 514} {"train_loss": -8.624273300170898, "global_step": 86440, "epoch": 514} {"train_loss": -9.148724555969238, "global_step": 86441, "epoch": 514} {"train_loss": -8.869344711303711, "global_step": 86442, "epoch": 514} {"train_loss": -8.906639099121094, "global_step": 86443, "epoch": 514} {"train_loss": -9.157121658325195, "global_step": 86444, "epoch": 514} {"train_loss": -8.903890609741211, "global_step": 86445, "epoch": 514} {"train_loss": -9.371482849121094, "global_step": 86446, "epoch": 514} {"train_loss": -9.140554428100586, "global_step": 86447, "epoch": 514} {"train_loss": -9.283737182617188, "global_step": 86448, "epoch": 514} {"train_loss": -9.07234001159668, "global_step": 86449, "epoch": 514} {"train_loss": -9.161355972290039, "global_step": 86450, "epoch": 514} {"train_loss": -9.284689903259277, "global_step": 86451, "epoch": 514} {"train_loss": -9.5478515625, "global_step": 86452, "epoch": 514} {"train_loss": -9.10628604888916, "global_step": 86453, "epoch": 514} {"train_loss": -9.439393043518066, "global_step": 86454, "epoch": 514} {"train_loss": -9.02077865600586, "global_step": 86455, "epoch": 514} {"train_loss": -9.354764938354492, "global_step": 86456, "epoch": 514} {"train_loss": -9.145319938659668, "global_step": 86457, "epoch": 514} {"train_loss": -9.044750213623047, "global_step": 86458, "epoch": 514} {"train_loss": -9.552301406860352, "global_step": 86459, "epoch": 514} {"train_loss": -9.356910705566406, "global_step": 86460, "epoch": 514} {"train_loss": -9.344888687133789, "global_step": 86461, "epoch": 514} {"train_loss": -9.331144332885742, "global_step": 86462, "epoch": 514} {"train_loss": -9.466894149780273, "global_step": 86463, "epoch": 514} {"train_loss": -9.197277069091797, "global_step": 86464, "epoch": 514} {"train_loss": -9.108724594116211, "global_step": 86465, "epoch": 514} {"train_loss": -9.537017822265625, "global_step": 86466, "epoch": 514} {"train_loss": -9.381117820739746, "global_step": 86467, "epoch": 514} {"train_loss": -9.30150032043457, "global_step": 86468, "epoch": 514} {"train_loss": -9.488348007202148, "global_step": 86469, "epoch": 514} {"train_loss": -9.468851089477539, "global_step": 86470, "epoch": 514} {"train_loss": -9.492856979370117, "global_step": 86471, "epoch": 514} {"train_loss": -9.44051742553711, "global_step": 86472, "epoch": 514} {"train_loss": -9.070884704589844, "global_step": 86473, "epoch": 514} {"train_loss": -9.390748977661133, "global_step": 86474, "epoch": 514} {"train_loss": -9.257253646850586, "global_step": 86475, "epoch": 514} {"train_loss": -9.594770431518555, "global_step": 86476, "epoch": 514} {"train_loss": -9.416227340698242, "global_step": 86477, "epoch": 514} {"train_loss": -9.350320816040039, "global_step": 86478, "epoch": 514} {"train_loss": -9.345178604125977, "global_step": 86479, "epoch": 514} {"train_loss": -9.518415451049805, "global_step": 86480, "epoch": 514} {"train_loss": -9.3819580078125, "global_step": 86481, "epoch": 514} {"train_loss": -9.366722106933594, "global_step": 86482, "epoch": 514} {"train_loss": -9.430675506591797, "global_step": 86483, "epoch": 514} {"train_loss": -9.50772762298584, "global_step": 86484, "epoch": 514} {"train_loss": -9.52791976928711, "global_step": 86485, "epoch": 514} {"train_loss": -9.569879531860352, "global_step": 86486, "epoch": 514} {"train_loss": -9.324502944946289, "global_step": 86487, "epoch": 514} {"train_loss": -9.273578643798828, "global_step": 86488, "epoch": 514} {"train_loss": -9.493865966796875, "global_step": 86489, "epoch": 514} {"train_loss": -9.47548770904541, "global_step": 86490, "epoch": 514} {"train_loss": -9.352071762084961, "global_step": 86491, "epoch": 514} {"train_loss": -9.720464706420898, "global_step": 86492, "epoch": 514} {"train_loss": -9.352028846740723, "global_step": 86493, "epoch": 514} {"train_loss": -9.18582534790039, "global_step": 86494, "epoch": 514} {"train_loss": -9.285898208618164, "global_step": 86495, "epoch": 514} {"train_loss": -9.067203521728516, "global_step": 86496, "epoch": 514} {"train_loss": -8.680940628051758, "global_step": 86497, "epoch": 514} {"train_loss": -9.196325302124023, "global_step": 86498, "epoch": 514} {"train_loss": -8.822746276855469, "global_step": 86499, "epoch": 514} {"train_loss": -8.880759239196777, "global_step": 86500, "epoch": 514} {"train_loss": -8.838615417480469, "global_step": 86501, "epoch": 514} {"train_loss": -9.048257827758789, "global_step": 86502, "epoch": 514} {"train_loss": -8.889471054077148, "global_step": 86503, "epoch": 514} {"train_loss": -8.834016799926758, "global_step": 86504, "epoch": 514} {"train_loss": -9.031054496765137, "global_step": 86505, "epoch": 514} {"train_loss": -9.266359329223633, "global_step": 86506, "epoch": 514} {"train_loss": -9.278697967529297, "global_step": 86507, "epoch": 514} {"train_loss": -8.999031066894531, "global_step": 86508, "epoch": 514} {"train_loss": -9.136591911315918, "global_step": 86509, "epoch": 514} {"train_loss": -9.15898323059082, "global_step": 86510, "epoch": 514} {"train_loss": -9.027891159057617, "global_step": 86511, "epoch": 514} {"train_loss": -9.217093467712402, "global_step": 86512, "epoch": 514} {"train_loss": -9.355228424072266, "global_step": 86513, "epoch": 514} {"train_loss": -9.063356399536133, "global_step": 86514, "epoch": 514} {"train_loss": -9.268843650817871, "global_step": 86515, "epoch": 514} {"train_loss": -9.392274856567383, "global_step": 86516, "epoch": 514} {"train_loss": -9.181514739990234, "global_step": 86517, "epoch": 514} {"train_loss": -9.171615600585938, "global_step": 86518, "epoch": 514} {"train_loss": -9.293268146969023, "global_step": 86519, "epoch": 514, "val_loss": 202080.90625} {"train_loss": -9.397638320922852, "global_step": 86520, "epoch": 515} {"train_loss": -9.412984848022461, "global_step": 86521, "epoch": 515} {"train_loss": -9.203277587890625, "global_step": 86522, "epoch": 515} {"train_loss": -9.251245498657227, "global_step": 86523, "epoch": 515} {"train_loss": -9.516194343566895, "global_step": 86524, "epoch": 515} {"train_loss": -9.125507354736328, "global_step": 86525, "epoch": 515} {"train_loss": -9.250635147094727, "global_step": 86526, "epoch": 515} {"train_loss": -9.30773639678955, "global_step": 86527, "epoch": 515} {"train_loss": -9.394938468933105, "global_step": 86528, "epoch": 515} {"train_loss": -9.405874252319336, "global_step": 86529, "epoch": 515} {"train_loss": -9.279203414916992, "global_step": 86530, "epoch": 515} {"train_loss": -9.420122146606445, "global_step": 86531, "epoch": 515} {"train_loss": -9.553838729858398, "global_step": 86532, "epoch": 515} {"train_loss": -9.526468276977539, "global_step": 86533, "epoch": 515} {"train_loss": -9.474498748779297, "global_step": 86534, "epoch": 515} {"train_loss": -9.754619598388672, "global_step": 86535, "epoch": 515} {"train_loss": -9.360940933227539, "global_step": 86536, "epoch": 515} {"train_loss": -9.530052185058594, "global_step": 86537, "epoch": 515} {"train_loss": -9.480743408203125, "global_step": 86538, "epoch": 515} {"train_loss": -9.644735336303711, "global_step": 86539, "epoch": 515} {"train_loss": -9.40259838104248, "global_step": 86540, "epoch": 515} {"train_loss": -9.612773895263672, "global_step": 86541, "epoch": 515} {"train_loss": -9.561670303344727, "global_step": 86542, "epoch": 515} {"train_loss": -9.389833450317383, "global_step": 86543, "epoch": 515} {"train_loss": -9.332633972167969, "global_step": 86544, "epoch": 515} {"train_loss": -9.643596649169922, "global_step": 86545, "epoch": 515} {"train_loss": -9.645965576171875, "global_step": 86546, "epoch": 515} {"train_loss": -9.458733558654785, "global_step": 86547, "epoch": 515} {"train_loss": -9.612427711486816, "global_step": 86548, "epoch": 515} {"train_loss": -9.723396301269531, "global_step": 86549, "epoch": 515} {"train_loss": -9.151698112487793, "global_step": 86550, "epoch": 515} {"train_loss": -9.571146965026855, "global_step": 86551, "epoch": 515} {"train_loss": -8.369210243225098, "global_step": 86552, "epoch": 515} {"train_loss": -9.532333374023438, "global_step": 86553, "epoch": 515} {"train_loss": -8.665679931640625, "global_step": 86554, "epoch": 515} {"train_loss": -9.227036476135254, "global_step": 86555, "epoch": 515} {"train_loss": -9.16061782836914, "global_step": 86556, "epoch": 515} {"train_loss": -9.032764434814453, "global_step": 86557, "epoch": 515} {"train_loss": -8.91681957244873, "global_step": 86558, "epoch": 515} {"train_loss": -8.984959602355957, "global_step": 86559, "epoch": 515} {"train_loss": -9.021955490112305, "global_step": 86560, "epoch": 515} {"train_loss": -9.02039909362793, "global_step": 86561, "epoch": 515} {"train_loss": -9.257522583007812, "global_step": 86562, "epoch": 515} {"train_loss": -9.270111083984375, "global_step": 86563, "epoch": 515} {"train_loss": -9.341103553771973, "global_step": 86564, "epoch": 515} {"train_loss": -9.436372756958008, "global_step": 86565, "epoch": 515} {"train_loss": -9.452779769897461, "global_step": 86566, "epoch": 515} {"train_loss": -9.007896423339844, "global_step": 86567, "epoch": 515} {"train_loss": -9.138069152832031, "global_step": 86568, "epoch": 515} {"train_loss": -9.29800796508789, "global_step": 86569, "epoch": 515} {"train_loss": -9.340736389160156, "global_step": 86570, "epoch": 515} {"train_loss": -9.257606506347656, "global_step": 86571, "epoch": 515} {"train_loss": -9.327929496765137, "global_step": 86572, "epoch": 515} {"train_loss": -9.279510498046875, "global_step": 86573, "epoch": 515} {"train_loss": -9.45030403137207, "global_step": 86574, "epoch": 515} {"train_loss": -9.131572723388672, "global_step": 86575, "epoch": 515} {"train_loss": -9.49368953704834, "global_step": 86576, "epoch": 515} {"train_loss": -9.520515441894531, "global_step": 86577, "epoch": 515} {"train_loss": -9.361979484558105, "global_step": 86578, "epoch": 515} {"train_loss": -9.5189790725708, "global_step": 86579, "epoch": 515} {"train_loss": -9.616570472717285, "global_step": 86580, "epoch": 515} {"train_loss": -9.364906311035156, "global_step": 86581, "epoch": 515} {"train_loss": -9.580280303955078, "global_step": 86582, "epoch": 515} {"train_loss": -9.751501083374023, "global_step": 86583, "epoch": 515} {"train_loss": -9.51419448852539, "global_step": 86584, "epoch": 515} {"train_loss": -9.698452949523926, "global_step": 86585, "epoch": 515} {"train_loss": -9.357770919799805, "global_step": 86586, "epoch": 515} {"train_loss": -9.612499237060547, "global_step": 86587, "epoch": 515} {"train_loss": -9.466853141784668, "global_step": 86588, "epoch": 515} {"train_loss": -9.474428176879883, "global_step": 86589, "epoch": 515} {"train_loss": -9.520183563232422, "global_step": 86590, "epoch": 515} {"train_loss": -9.71169376373291, "global_step": 86591, "epoch": 515} {"train_loss": -9.662566184997559, "global_step": 86592, "epoch": 515} {"train_loss": -9.48081111907959, "global_step": 86593, "epoch": 515} {"train_loss": -9.499595642089844, "global_step": 86594, "epoch": 515} {"train_loss": -9.160299301147461, "global_step": 86595, "epoch": 515} {"train_loss": -9.025981903076172, "global_step": 86596, "epoch": 515} {"train_loss": -9.17111587524414, "global_step": 86597, "epoch": 515} {"train_loss": -9.453166961669922, "global_step": 86598, "epoch": 515} {"train_loss": -8.650165557861328, "global_step": 86599, "epoch": 515} {"train_loss": -9.275156021118164, "global_step": 86600, "epoch": 515} {"train_loss": -8.85491943359375, "global_step": 86601, "epoch": 515} {"train_loss": -8.912492752075195, "global_step": 86602, "epoch": 515} {"train_loss": -9.079619407653809, "global_step": 86603, "epoch": 515} {"train_loss": -8.849369049072266, "global_step": 86604, "epoch": 515} {"train_loss": -8.82525634765625, "global_step": 86605, "epoch": 515} {"train_loss": -8.926921844482422, "global_step": 86606, "epoch": 515} {"train_loss": -8.567072868347168, "global_step": 86607, "epoch": 515} {"train_loss": -9.167451858520508, "global_step": 86608, "epoch": 515} {"train_loss": -9.191085815429688, "global_step": 86609, "epoch": 515} {"train_loss": -8.955724716186523, "global_step": 86610, "epoch": 515} {"train_loss": -9.19892692565918, "global_step": 86611, "epoch": 515} {"train_loss": -8.786579132080078, "global_step": 86612, "epoch": 515} {"train_loss": -9.057876586914062, "global_step": 86613, "epoch": 515} {"train_loss": -8.917757034301758, "global_step": 86614, "epoch": 515} {"train_loss": -9.073554039001465, "global_step": 86615, "epoch": 515} {"train_loss": -8.874639511108398, "global_step": 86616, "epoch": 515} {"train_loss": -9.416491508483887, "global_step": 86617, "epoch": 515} {"train_loss": -9.079520225524902, "global_step": 86618, "epoch": 515} {"train_loss": -9.007250785827637, "global_step": 86619, "epoch": 515} {"train_loss": -9.17693042755127, "global_step": 86620, "epoch": 515} {"train_loss": -9.119025230407715, "global_step": 86621, "epoch": 515} {"train_loss": -9.344526290893555, "global_step": 86622, "epoch": 515} {"train_loss": -9.246158599853516, "global_step": 86623, "epoch": 515} {"train_loss": -9.33686637878418, "global_step": 86624, "epoch": 515} {"train_loss": -8.928958892822266, "global_step": 86625, "epoch": 515} {"train_loss": -9.23971176147461, "global_step": 86626, "epoch": 515} {"train_loss": -9.333450317382812, "global_step": 86627, "epoch": 515} {"train_loss": -9.455326080322266, "global_step": 86628, "epoch": 515} {"train_loss": -9.294675827026367, "global_step": 86629, "epoch": 515} {"train_loss": -9.345779418945312, "global_step": 86630, "epoch": 515} {"train_loss": -9.346635818481445, "global_step": 86631, "epoch": 515} {"train_loss": -9.519594192504883, "global_step": 86632, "epoch": 515} {"train_loss": -9.480198860168457, "global_step": 86633, "epoch": 515} {"train_loss": -9.474908828735352, "global_step": 86634, "epoch": 515} {"train_loss": -9.47240924835205, "global_step": 86635, "epoch": 515} {"train_loss": -9.518867492675781, "global_step": 86636, "epoch": 515} {"train_loss": -9.667118072509766, "global_step": 86637, "epoch": 515} {"train_loss": -9.545211791992188, "global_step": 86638, "epoch": 515} {"train_loss": -9.493677139282227, "global_step": 86639, "epoch": 515} {"train_loss": -9.672574996948242, "global_step": 86640, "epoch": 515} {"train_loss": -9.383634567260742, "global_step": 86641, "epoch": 515} {"train_loss": -9.565133094787598, "global_step": 86642, "epoch": 515} {"train_loss": -9.347168922424316, "global_step": 86643, "epoch": 515} {"train_loss": -9.532660484313965, "global_step": 86644, "epoch": 515} {"train_loss": -9.525510787963867, "global_step": 86645, "epoch": 515} {"train_loss": -9.12738037109375, "global_step": 86646, "epoch": 515} {"train_loss": -9.0774564743042, "global_step": 86647, "epoch": 515} {"train_loss": -9.233689308166504, "global_step": 86648, "epoch": 515} {"train_loss": -8.941667556762695, "global_step": 86649, "epoch": 515} {"train_loss": -9.094918251037598, "global_step": 86650, "epoch": 515} {"train_loss": -9.094714164733887, "global_step": 86651, "epoch": 515} {"train_loss": -9.03408432006836, "global_step": 86652, "epoch": 515} {"train_loss": -9.015106201171875, "global_step": 86653, "epoch": 515} {"train_loss": -8.90434741973877, "global_step": 86654, "epoch": 515} {"train_loss": -9.28156852722168, "global_step": 86655, "epoch": 515} {"train_loss": -9.041997909545898, "global_step": 86656, "epoch": 515} {"train_loss": -9.241947174072266, "global_step": 86657, "epoch": 515} {"train_loss": -9.1220064163208, "global_step": 86658, "epoch": 515} {"train_loss": -8.814340591430664, "global_step": 86659, "epoch": 515} {"train_loss": -9.107809066772461, "global_step": 86660, "epoch": 515} {"train_loss": -9.317536354064941, "global_step": 86661, "epoch": 515} {"train_loss": -9.230501174926758, "global_step": 86662, "epoch": 515} {"train_loss": -8.925039291381836, "global_step": 86663, "epoch": 515} {"train_loss": -9.382431030273438, "global_step": 86664, "epoch": 515} {"train_loss": -9.450845718383789, "global_step": 86665, "epoch": 515} {"train_loss": -9.350662231445312, "global_step": 86666, "epoch": 515} {"train_loss": -9.354867935180664, "global_step": 86667, "epoch": 515} {"train_loss": -9.55626106262207, "global_step": 86668, "epoch": 515} {"train_loss": -9.428304672241211, "global_step": 86669, "epoch": 515} {"train_loss": -9.450105667114258, "global_step": 86670, "epoch": 515} {"train_loss": -9.339272499084473, "global_step": 86671, "epoch": 515} {"train_loss": -9.443353652954102, "global_step": 86672, "epoch": 515} {"train_loss": -9.242443084716797, "global_step": 86673, "epoch": 515} {"train_loss": -9.50457763671875, "global_step": 86674, "epoch": 515} {"train_loss": -9.519342422485352, "global_step": 86675, "epoch": 515} {"train_loss": -9.50052261352539, "global_step": 86676, "epoch": 515} {"train_loss": -9.614095687866211, "global_step": 86677, "epoch": 515} {"train_loss": -9.63039779663086, "global_step": 86678, "epoch": 515} {"train_loss": -9.257881164550781, "global_step": 86679, "epoch": 515} {"train_loss": -9.428125381469727, "global_step": 86680, "epoch": 515} {"train_loss": -9.595827102661133, "global_step": 86681, "epoch": 515} {"train_loss": -9.447773933410645, "global_step": 86682, "epoch": 515} {"train_loss": -9.502262115478516, "global_step": 86683, "epoch": 515} {"train_loss": -9.372066497802734, "global_step": 86684, "epoch": 515} {"train_loss": -9.460836410522461, "global_step": 86685, "epoch": 515} {"train_loss": -9.650632858276367, "global_step": 86686, "epoch": 515} {"train_loss": -9.309136765343803, "global_step": 86687, "epoch": 515, "val_loss": 201339.21875, "train_action_mse_error": 3.1948816776275635} {"train_loss": -9.579885482788086, "global_step": 86688, "epoch": 516} {"train_loss": -9.441659927368164, "global_step": 86689, "epoch": 516} {"train_loss": -9.250478744506836, "global_step": 86690, "epoch": 516} {"train_loss": -9.727625846862793, "global_step": 86691, "epoch": 516} {"train_loss": -9.30156421661377, "global_step": 86692, "epoch": 516} {"train_loss": -9.38779067993164, "global_step": 86693, "epoch": 516} {"train_loss": -9.320840835571289, "global_step": 86694, "epoch": 516} {"train_loss": -9.371585845947266, "global_step": 86695, "epoch": 516} {"train_loss": -9.346017837524414, "global_step": 86696, "epoch": 516} {"train_loss": -9.171358108520508, "global_step": 86697, "epoch": 516} {"train_loss": -9.122496604919434, "global_step": 86698, "epoch": 516} {"train_loss": -9.49286937713623, "global_step": 86699, "epoch": 516} {"train_loss": -9.213616371154785, "global_step": 86700, "epoch": 516} {"train_loss": -9.243480682373047, "global_step": 86701, "epoch": 516} {"train_loss": -9.454056739807129, "global_step": 86702, "epoch": 516} {"train_loss": -9.207069396972656, "global_step": 86703, "epoch": 516} {"train_loss": -9.353264808654785, "global_step": 86704, "epoch": 516} {"train_loss": -9.35618782043457, "global_step": 86705, "epoch": 516} {"train_loss": -9.16693115234375, "global_step": 86706, "epoch": 516} {"train_loss": -9.201669692993164, "global_step": 86707, "epoch": 516} {"train_loss": -9.247913360595703, "global_step": 86708, "epoch": 516} {"train_loss": -9.12106704711914, "global_step": 86709, "epoch": 516} {"train_loss": -9.226122856140137, "global_step": 86710, "epoch": 516} {"train_loss": -9.149003028869629, "global_step": 86711, "epoch": 516} {"train_loss": -9.28782844543457, "global_step": 86712, "epoch": 516} {"train_loss": -9.056750297546387, "global_step": 86713, "epoch": 516} {"train_loss": -9.32807445526123, "global_step": 86714, "epoch": 516} {"train_loss": -9.483654022216797, "global_step": 86715, "epoch": 516} {"train_loss": -9.1995849609375, "global_step": 86716, "epoch": 516} {"train_loss": -9.259289741516113, "global_step": 86717, "epoch": 516} {"train_loss": -9.255810737609863, "global_step": 86718, "epoch": 516} {"train_loss": -9.587726593017578, "global_step": 86719, "epoch": 516} {"train_loss": -9.383140563964844, "global_step": 86720, "epoch": 516} {"train_loss": -9.324213027954102, "global_step": 86721, "epoch": 516} {"train_loss": -9.369577407836914, "global_step": 86722, "epoch": 516} {"train_loss": -9.392086029052734, "global_step": 86723, "epoch": 516} {"train_loss": -9.568254470825195, "global_step": 86724, "epoch": 516} {"train_loss": -9.205591201782227, "global_step": 86725, "epoch": 516} {"train_loss": -9.111351013183594, "global_step": 86726, "epoch": 516} {"train_loss": -9.316940307617188, "global_step": 86727, "epoch": 516} {"train_loss": -9.332441329956055, "global_step": 86728, "epoch": 516} {"train_loss": -9.606748580932617, "global_step": 86729, "epoch": 516} {"train_loss": -9.255407333374023, "global_step": 86730, "epoch": 516} {"train_loss": -9.40690803527832, "global_step": 86731, "epoch": 516} {"train_loss": -9.227095603942871, "global_step": 86732, "epoch": 516} {"train_loss": -9.507085800170898, "global_step": 86733, "epoch": 516} {"train_loss": -9.1841459274292, "global_step": 86734, "epoch": 516} {"train_loss": -9.272978782653809, "global_step": 86735, "epoch": 516} {"train_loss": -9.431205749511719, "global_step": 86736, "epoch": 516} {"train_loss": -9.505507469177246, "global_step": 86737, "epoch": 516} {"train_loss": -9.172760009765625, "global_step": 86738, "epoch": 516} {"train_loss": -9.535754203796387, "global_step": 86739, "epoch": 516} {"train_loss": -9.416296005249023, "global_step": 86740, "epoch": 516} {"train_loss": -9.4452543258667, "global_step": 86741, "epoch": 516} {"train_loss": -9.578756332397461, "global_step": 86742, "epoch": 516} {"train_loss": -9.406177520751953, "global_step": 86743, "epoch": 516} {"train_loss": -9.560972213745117, "global_step": 86744, "epoch": 516} {"train_loss": -9.367478370666504, "global_step": 86745, "epoch": 516} {"train_loss": -9.61203384399414, "global_step": 86746, "epoch": 516} {"train_loss": -9.322429656982422, "global_step": 86747, "epoch": 516} {"train_loss": -9.484689712524414, "global_step": 86748, "epoch": 516} {"train_loss": -9.15366268157959, "global_step": 86749, "epoch": 516} {"train_loss": -9.135398864746094, "global_step": 86750, "epoch": 516} {"train_loss": -9.458612442016602, "global_step": 86751, "epoch": 516} {"train_loss": -9.38604736328125, "global_step": 86752, "epoch": 516} {"train_loss": -9.69471549987793, "global_step": 86753, "epoch": 516} {"train_loss": -9.212182998657227, "global_step": 86754, "epoch": 516} {"train_loss": -9.436968803405762, "global_step": 86755, "epoch": 516} {"train_loss": -9.354863166809082, "global_step": 86756, "epoch": 516} {"train_loss": -9.264314651489258, "global_step": 86757, "epoch": 516} {"train_loss": -9.256052017211914, "global_step": 86758, "epoch": 516} {"train_loss": -9.19561767578125, "global_step": 86759, "epoch": 516} {"train_loss": -9.555038452148438, "global_step": 86760, "epoch": 516} {"train_loss": -9.41513729095459, "global_step": 86761, "epoch": 516} {"train_loss": -9.364293098449707, "global_step": 86762, "epoch": 516} {"train_loss": -9.373313903808594, "global_step": 86763, "epoch": 516} {"train_loss": -8.966350555419922, "global_step": 86764, "epoch": 516} {"train_loss": -9.405445098876953, "global_step": 86765, "epoch": 516} {"train_loss": -8.859505653381348, "global_step": 86766, "epoch": 516} {"train_loss": -9.582722663879395, "global_step": 86767, "epoch": 516} {"train_loss": -9.298144340515137, "global_step": 86768, "epoch": 516} {"train_loss": -9.464893341064453, "global_step": 86769, "epoch": 516} {"train_loss": -9.287178039550781, "global_step": 86770, "epoch": 516} {"train_loss": -9.346992492675781, "global_step": 86771, "epoch": 516} {"train_loss": -9.321863174438477, "global_step": 86772, "epoch": 516} {"train_loss": -9.347742080688477, "global_step": 86773, "epoch": 516} {"train_loss": -9.413414001464844, "global_step": 86774, "epoch": 516} {"train_loss": -9.315393447875977, "global_step": 86775, "epoch": 516} {"train_loss": -9.481582641601562, "global_step": 86776, "epoch": 516} {"train_loss": -9.308216094970703, "global_step": 86777, "epoch": 516} {"train_loss": -9.353221893310547, "global_step": 86778, "epoch": 516} {"train_loss": -9.374282836914062, "global_step": 86779, "epoch": 516} {"train_loss": -9.329057693481445, "global_step": 86780, "epoch": 516} {"train_loss": -9.27951431274414, "global_step": 86781, "epoch": 516} {"train_loss": -9.604174613952637, "global_step": 86782, "epoch": 516} {"train_loss": -9.625133514404297, "global_step": 86783, "epoch": 516} {"train_loss": -9.540767669677734, "global_step": 86784, "epoch": 516} {"train_loss": -9.586105346679688, "global_step": 86785, "epoch": 516} {"train_loss": -9.315068244934082, "global_step": 86786, "epoch": 516} {"train_loss": -9.327939987182617, "global_step": 86787, "epoch": 516} {"train_loss": -9.448583602905273, "global_step": 86788, "epoch": 516} {"train_loss": -9.697684288024902, "global_step": 86789, "epoch": 516} {"train_loss": -9.626636505126953, "global_step": 86790, "epoch": 516} {"train_loss": -9.38846492767334, "global_step": 86791, "epoch": 516} {"train_loss": -9.468780517578125, "global_step": 86792, "epoch": 516} {"train_loss": -9.560373306274414, "global_step": 86793, "epoch": 516} {"train_loss": -9.530740737915039, "global_step": 86794, "epoch": 516} {"train_loss": -9.390968322753906, "global_step": 86795, "epoch": 516} {"train_loss": -9.415273666381836, "global_step": 86796, "epoch": 516} {"train_loss": -9.54376220703125, "global_step": 86797, "epoch": 516} {"train_loss": -9.499391555786133, "global_step": 86798, "epoch": 516} {"train_loss": -9.60413932800293, "global_step": 86799, "epoch": 516} {"train_loss": -9.214923858642578, "global_step": 86800, "epoch": 516} {"train_loss": -9.316280364990234, "global_step": 86801, "epoch": 516} {"train_loss": -9.145393371582031, "global_step": 86802, "epoch": 516} {"train_loss": -9.437820434570312, "global_step": 86803, "epoch": 516} {"train_loss": -9.395663261413574, "global_step": 86804, "epoch": 516} {"train_loss": -9.43820858001709, "global_step": 86805, "epoch": 516} {"train_loss": -9.424335479736328, "global_step": 86806, "epoch": 516} {"train_loss": -9.411608695983887, "global_step": 86807, "epoch": 516} {"train_loss": -9.277996063232422, "global_step": 86808, "epoch": 516} {"train_loss": -9.396368026733398, "global_step": 86809, "epoch": 516} {"train_loss": -9.439369201660156, "global_step": 86810, "epoch": 516} {"train_loss": -9.409688949584961, "global_step": 86811, "epoch": 516} {"train_loss": -9.562551498413086, "global_step": 86812, "epoch": 516} {"train_loss": -9.510826110839844, "global_step": 86813, "epoch": 516} {"train_loss": -9.632933616638184, "global_step": 86814, "epoch": 516} {"train_loss": -9.351058959960938, "global_step": 86815, "epoch": 516} {"train_loss": -9.33827018737793, "global_step": 86816, "epoch": 516} {"train_loss": -9.55144214630127, "global_step": 86817, "epoch": 516} {"train_loss": -9.57165241241455, "global_step": 86818, "epoch": 516} {"train_loss": -9.469987869262695, "global_step": 86819, "epoch": 516} {"train_loss": -9.66482925415039, "global_step": 86820, "epoch": 516} {"train_loss": -9.235721588134766, "global_step": 86821, "epoch": 516} {"train_loss": -9.59402084350586, "global_step": 86822, "epoch": 516} {"train_loss": -9.434955596923828, "global_step": 86823, "epoch": 516} {"train_loss": -9.43018913269043, "global_step": 86824, "epoch": 516} {"train_loss": -9.301185607910156, "global_step": 86825, "epoch": 516} {"train_loss": -8.966599464416504, "global_step": 86826, "epoch": 516} {"train_loss": -9.590476989746094, "global_step": 86827, "epoch": 516} {"train_loss": -9.438375473022461, "global_step": 86828, "epoch": 516} {"train_loss": -9.406671524047852, "global_step": 86829, "epoch": 516} {"train_loss": -9.546649932861328, "global_step": 86830, "epoch": 516} {"train_loss": -9.368921279907227, "global_step": 86831, "epoch": 516} {"train_loss": -9.34691047668457, "global_step": 86832, "epoch": 516} {"train_loss": -9.640510559082031, "global_step": 86833, "epoch": 516} {"train_loss": -9.456599235534668, "global_step": 86834, "epoch": 516} {"train_loss": -9.580037117004395, "global_step": 86835, "epoch": 516} {"train_loss": -9.522753715515137, "global_step": 86836, "epoch": 516} {"train_loss": -9.244665145874023, "global_step": 86837, "epoch": 516} {"train_loss": -9.393452644348145, "global_step": 86838, "epoch": 516} {"train_loss": -9.561112403869629, "global_step": 86839, "epoch": 516} {"train_loss": -9.351530075073242, "global_step": 86840, "epoch": 516} {"train_loss": -9.431562423706055, "global_step": 86841, "epoch": 516} {"train_loss": -9.382890701293945, "global_step": 86842, "epoch": 516} {"train_loss": -9.219389915466309, "global_step": 86843, "epoch": 516} {"train_loss": -9.51068115234375, "global_step": 86844, "epoch": 516} {"train_loss": -8.898003578186035, "global_step": 86845, "epoch": 516} {"train_loss": -9.215360641479492, "global_step": 86846, "epoch": 516} {"train_loss": -9.282190322875977, "global_step": 86847, "epoch": 516} {"train_loss": -9.338279724121094, "global_step": 86848, "epoch": 516} {"train_loss": -9.1131591796875, "global_step": 86849, "epoch": 516} {"train_loss": -9.128765106201172, "global_step": 86850, "epoch": 516} {"train_loss": -9.191646575927734, "global_step": 86851, "epoch": 516} {"train_loss": -9.26538372039795, "global_step": 86852, "epoch": 516} {"train_loss": -9.326797485351562, "global_step": 86853, "epoch": 516} {"train_loss": -9.101044654846191, "global_step": 86854, "epoch": 516} {"train_loss": -9.372182539531163, "global_step": 86855, "epoch": 516, "val_loss": 200593.890625} {"train_loss": -9.145484924316406, "global_step": 86856, "epoch": 517} {"train_loss": -9.384586334228516, "global_step": 86857, "epoch": 517} {"train_loss": -9.295825958251953, "global_step": 86858, "epoch": 517} {"train_loss": -9.377758026123047, "global_step": 86859, "epoch": 517} {"train_loss": -9.176231384277344, "global_step": 86860, "epoch": 517} {"train_loss": -9.273012161254883, "global_step": 86861, "epoch": 517} {"train_loss": -9.448156356811523, "global_step": 86862, "epoch": 517} {"train_loss": -9.43687629699707, "global_step": 86863, "epoch": 517} {"train_loss": -9.130474090576172, "global_step": 86864, "epoch": 517} {"train_loss": -9.302692413330078, "global_step": 86865, "epoch": 517} {"train_loss": -9.381052017211914, "global_step": 86866, "epoch": 517} {"train_loss": -9.08763313293457, "global_step": 86867, "epoch": 517} {"train_loss": -9.530357360839844, "global_step": 86868, "epoch": 517} {"train_loss": -9.323265075683594, "global_step": 86869, "epoch": 517} {"train_loss": -9.327483177185059, "global_step": 86870, "epoch": 517} {"train_loss": -9.367181777954102, "global_step": 86871, "epoch": 517} {"train_loss": -9.393329620361328, "global_step": 86872, "epoch": 517} {"train_loss": -9.047082901000977, "global_step": 86873, "epoch": 517} {"train_loss": -9.227992057800293, "global_step": 86874, "epoch": 517} {"train_loss": -9.510866165161133, "global_step": 86875, "epoch": 517} {"train_loss": -9.502279281616211, "global_step": 86876, "epoch": 517} {"train_loss": -9.092798233032227, "global_step": 86877, "epoch": 517} {"train_loss": -9.527201652526855, "global_step": 86878, "epoch": 517} {"train_loss": -9.402956008911133, "global_step": 86879, "epoch": 517} {"train_loss": -9.550821304321289, "global_step": 86880, "epoch": 517} {"train_loss": -9.293034553527832, "global_step": 86881, "epoch": 517} {"train_loss": -9.370386123657227, "global_step": 86882, "epoch": 517} {"train_loss": -9.331111907958984, "global_step": 86883, "epoch": 517} {"train_loss": -9.366215705871582, "global_step": 86884, "epoch": 517} {"train_loss": -9.140307426452637, "global_step": 86885, "epoch": 517} {"train_loss": -9.452876091003418, "global_step": 86886, "epoch": 517} {"train_loss": -9.590633392333984, "global_step": 86887, "epoch": 517} {"train_loss": -9.437252044677734, "global_step": 86888, "epoch": 517} {"train_loss": -9.3841552734375, "global_step": 86889, "epoch": 517} {"train_loss": -9.421245574951172, "global_step": 86890, "epoch": 517} {"train_loss": -9.163642883300781, "global_step": 86891, "epoch": 517} {"train_loss": -9.562360763549805, "global_step": 86892, "epoch": 517} {"train_loss": -9.274772644042969, "global_step": 86893, "epoch": 517} {"train_loss": -9.31989574432373, "global_step": 86894, "epoch": 517} {"train_loss": -9.665933609008789, "global_step": 86895, "epoch": 517} {"train_loss": -9.308917999267578, "global_step": 86896, "epoch": 517} {"train_loss": -9.601265907287598, "global_step": 86897, "epoch": 517} {"train_loss": -9.61345100402832, "global_step": 86898, "epoch": 517} {"train_loss": -9.526598930358887, "global_step": 86899, "epoch": 517} {"train_loss": -9.53101921081543, "global_step": 86900, "epoch": 517} {"train_loss": -9.362258911132812, "global_step": 86901, "epoch": 517} {"train_loss": -9.724945068359375, "global_step": 86902, "epoch": 517} {"train_loss": -9.32177734375, "global_step": 86903, "epoch": 517} {"train_loss": -9.601059913635254, "global_step": 86904, "epoch": 517} {"train_loss": -9.678372383117676, "global_step": 86905, "epoch": 517} {"train_loss": -9.289824485778809, "global_step": 86906, "epoch": 517} {"train_loss": -9.536469459533691, "global_step": 86907, "epoch": 517} {"train_loss": -9.818519592285156, "global_step": 86908, "epoch": 517} {"train_loss": -9.34681510925293, "global_step": 86909, "epoch": 517} {"train_loss": -9.348695755004883, "global_step": 86910, "epoch": 517} {"train_loss": -9.563619613647461, "global_step": 86911, "epoch": 517} {"train_loss": -9.1983003616333, "global_step": 86912, "epoch": 517} {"train_loss": -9.625777244567871, "global_step": 86913, "epoch": 517} {"train_loss": -9.38005256652832, "global_step": 86914, "epoch": 517} {"train_loss": -9.28138542175293, "global_step": 86915, "epoch": 517} {"train_loss": -9.34698486328125, "global_step": 86916, "epoch": 517} {"train_loss": -9.099397659301758, "global_step": 86917, "epoch": 517} {"train_loss": -9.50436019897461, "global_step": 86918, "epoch": 517} {"train_loss": -9.211472511291504, "global_step": 86919, "epoch": 517} {"train_loss": -9.454700469970703, "global_step": 86920, "epoch": 517} {"train_loss": -9.567205429077148, "global_step": 86921, "epoch": 517} {"train_loss": -9.185332298278809, "global_step": 86922, "epoch": 517} {"train_loss": -9.44393539428711, "global_step": 86923, "epoch": 517} {"train_loss": -9.420045852661133, "global_step": 86924, "epoch": 517} {"train_loss": -9.228497505187988, "global_step": 86925, "epoch": 517} {"train_loss": -9.358658790588379, "global_step": 86926, "epoch": 517} {"train_loss": -9.521801948547363, "global_step": 86927, "epoch": 517} {"train_loss": -9.247516632080078, "global_step": 86928, "epoch": 517} {"train_loss": -9.519851684570312, "global_step": 86929, "epoch": 517} {"train_loss": -9.543840408325195, "global_step": 86930, "epoch": 517} {"train_loss": -9.67514419555664, "global_step": 86931, "epoch": 517} {"train_loss": -9.230958938598633, "global_step": 86932, "epoch": 517} {"train_loss": -9.351192474365234, "global_step": 86933, "epoch": 517} {"train_loss": -9.12473201751709, "global_step": 86934, "epoch": 517} {"train_loss": -9.319375991821289, "global_step": 86935, "epoch": 517} {"train_loss": -9.046896934509277, "global_step": 86936, "epoch": 517} {"train_loss": -9.169790267944336, "global_step": 86937, "epoch": 517} {"train_loss": -9.234213829040527, "global_step": 86938, "epoch": 517} {"train_loss": -9.019817352294922, "global_step": 86939, "epoch": 517} {"train_loss": -9.274669647216797, "global_step": 86940, "epoch": 517} {"train_loss": -8.922689437866211, "global_step": 86941, "epoch": 517} {"train_loss": -9.2689847946167, "global_step": 86942, "epoch": 517} {"train_loss": -8.996232032775879, "global_step": 86943, "epoch": 517} {"train_loss": -9.300617218017578, "global_step": 86944, "epoch": 517} {"train_loss": -9.291189193725586, "global_step": 86945, "epoch": 517} {"train_loss": -9.325368881225586, "global_step": 86946, "epoch": 517} {"train_loss": -9.203387260437012, "global_step": 86947, "epoch": 517} {"train_loss": -9.407909393310547, "global_step": 86948, "epoch": 517} {"train_loss": -9.08619213104248, "global_step": 86949, "epoch": 517} {"train_loss": -9.195489883422852, "global_step": 86950, "epoch": 517} {"train_loss": -9.277472496032715, "global_step": 86951, "epoch": 517} {"train_loss": -8.888996124267578, "global_step": 86952, "epoch": 517} {"train_loss": -9.390316009521484, "global_step": 86953, "epoch": 517} {"train_loss": -8.918497085571289, "global_step": 86954, "epoch": 517} {"train_loss": -9.374290466308594, "global_step": 86955, "epoch": 517} {"train_loss": -9.13774299621582, "global_step": 86956, "epoch": 517} {"train_loss": -9.354446411132812, "global_step": 86957, "epoch": 517} {"train_loss": -9.165811538696289, "global_step": 86958, "epoch": 517} {"train_loss": -9.381227493286133, "global_step": 86959, "epoch": 517} {"train_loss": -8.979976654052734, "global_step": 86960, "epoch": 517} {"train_loss": -9.139226913452148, "global_step": 86961, "epoch": 517} {"train_loss": -9.2428617477417, "global_step": 86962, "epoch": 517} {"train_loss": -9.298312187194824, "global_step": 86963, "epoch": 517} {"train_loss": -9.032472610473633, "global_step": 86964, "epoch": 517} {"train_loss": -9.402776718139648, "global_step": 86965, "epoch": 517} {"train_loss": -9.108833312988281, "global_step": 86966, "epoch": 517} {"train_loss": -9.399742126464844, "global_step": 86967, "epoch": 517} {"train_loss": -9.31332778930664, "global_step": 86968, "epoch": 517} {"train_loss": -9.37677001953125, "global_step": 86969, "epoch": 517} {"train_loss": -9.054344177246094, "global_step": 86970, "epoch": 517} {"train_loss": -9.351280212402344, "global_step": 86971, "epoch": 517} {"train_loss": -9.300835609436035, "global_step": 86972, "epoch": 517} {"train_loss": -9.446328163146973, "global_step": 86973, "epoch": 517} {"train_loss": -9.348071098327637, "global_step": 86974, "epoch": 517} {"train_loss": -9.453857421875, "global_step": 86975, "epoch": 517} {"train_loss": -9.323230743408203, "global_step": 86976, "epoch": 517} {"train_loss": -9.576300621032715, "global_step": 86977, "epoch": 517} {"train_loss": -9.314645767211914, "global_step": 86978, "epoch": 517} {"train_loss": -9.341269493103027, "global_step": 86979, "epoch": 517} {"train_loss": -9.404967308044434, "global_step": 86980, "epoch": 517} {"train_loss": -9.44847583770752, "global_step": 86981, "epoch": 517} {"train_loss": -9.551603317260742, "global_step": 86982, "epoch": 517} {"train_loss": -9.360749244689941, "global_step": 86983, "epoch": 517} {"train_loss": -9.305343627929688, "global_step": 86984, "epoch": 517} {"train_loss": -9.496917724609375, "global_step": 86985, "epoch": 517} {"train_loss": -9.309985160827637, "global_step": 86986, "epoch": 517} {"train_loss": -9.380504608154297, "global_step": 86987, "epoch": 517} {"train_loss": -9.023998260498047, "global_step": 86988, "epoch": 517} {"train_loss": -9.167292594909668, "global_step": 86989, "epoch": 517} {"train_loss": -9.279129028320312, "global_step": 86990, "epoch": 517} {"train_loss": -9.181562423706055, "global_step": 86991, "epoch": 517} {"train_loss": -9.389503479003906, "global_step": 86992, "epoch": 517} {"train_loss": -9.280980110168457, "global_step": 86993, "epoch": 517} {"train_loss": -9.11619758605957, "global_step": 86994, "epoch": 517} {"train_loss": -9.127359390258789, "global_step": 86995, "epoch": 517} {"train_loss": -9.241823196411133, "global_step": 86996, "epoch": 517} {"train_loss": -9.326364517211914, "global_step": 86997, "epoch": 517} {"train_loss": -9.245844841003418, "global_step": 86998, "epoch": 517} {"train_loss": -9.387838363647461, "global_step": 86999, "epoch": 517} {"train_loss": -9.07583236694336, "global_step": 87000, "epoch": 517} {"train_loss": -9.52421760559082, "global_step": 87001, "epoch": 517} {"train_loss": -9.135793685913086, "global_step": 87002, "epoch": 517} {"train_loss": -9.069904327392578, "global_step": 87003, "epoch": 517} {"train_loss": -9.341196060180664, "global_step": 87004, "epoch": 517} {"train_loss": -9.017202377319336, "global_step": 87005, "epoch": 517} {"train_loss": -9.412787437438965, "global_step": 87006, "epoch": 517} {"train_loss": -9.271625518798828, "global_step": 87007, "epoch": 517} {"train_loss": -9.295944213867188, "global_step": 87008, "epoch": 517} {"train_loss": -9.326126098632812, "global_step": 87009, "epoch": 517} {"train_loss": -9.370906829833984, "global_step": 87010, "epoch": 517} {"train_loss": -9.43875503540039, "global_step": 87011, "epoch": 517} {"train_loss": -9.267364501953125, "global_step": 87012, "epoch": 517} {"train_loss": -9.225751876831055, "global_step": 87013, "epoch": 517} {"train_loss": -9.460872650146484, "global_step": 87014, "epoch": 517} {"train_loss": -9.133879661560059, "global_step": 87015, "epoch": 517} {"train_loss": -9.344544410705566, "global_step": 87016, "epoch": 517} {"train_loss": -9.246591567993164, "global_step": 87017, "epoch": 517} {"train_loss": -9.176673889160156, "global_step": 87018, "epoch": 517} {"train_loss": -9.179075241088867, "global_step": 87019, "epoch": 517} {"train_loss": -9.287007331848145, "global_step": 87020, "epoch": 517} {"train_loss": -9.406839370727539, "global_step": 87021, "epoch": 517} {"train_loss": -9.326201438903809, "global_step": 87022, "epoch": 517} {"train_loss": -9.323014168512254, "global_step": 87023, "epoch": 517, "val_loss": 199491.9375} {"train_loss": -9.26070499420166, "global_step": 87024, "epoch": 518} {"train_loss": -8.761065483093262, "global_step": 87025, "epoch": 518} {"train_loss": -9.269879341125488, "global_step": 87026, "epoch": 518} {"train_loss": -9.147375106811523, "global_step": 87027, "epoch": 518} {"train_loss": -9.101882934570312, "global_step": 87028, "epoch": 518} {"train_loss": -9.23236083984375, "global_step": 87029, "epoch": 518} {"train_loss": -9.14479923248291, "global_step": 87030, "epoch": 518} {"train_loss": -9.30140495300293, "global_step": 87031, "epoch": 518} {"train_loss": -9.410039901733398, "global_step": 87032, "epoch": 518} {"train_loss": -9.194230079650879, "global_step": 87033, "epoch": 518} {"train_loss": -9.256689071655273, "global_step": 87034, "epoch": 518} {"train_loss": -9.36428165435791, "global_step": 87035, "epoch": 518} {"train_loss": -9.399011611938477, "global_step": 87036, "epoch": 518} {"train_loss": -9.305055618286133, "global_step": 87037, "epoch": 518} {"train_loss": -8.916402816772461, "global_step": 87038, "epoch": 518} {"train_loss": -9.299745559692383, "global_step": 87039, "epoch": 518} {"train_loss": -9.19102668762207, "global_step": 87040, "epoch": 518} {"train_loss": -9.45523452758789, "global_step": 87041, "epoch": 518} {"train_loss": -9.130961418151855, "global_step": 87042, "epoch": 518} {"train_loss": -9.361763000488281, "global_step": 87043, "epoch": 518} {"train_loss": -8.976578712463379, "global_step": 87044, "epoch": 518} {"train_loss": -9.3607177734375, "global_step": 87045, "epoch": 518} {"train_loss": -9.560935974121094, "global_step": 87046, "epoch": 518} {"train_loss": -8.952960968017578, "global_step": 87047, "epoch": 518} {"train_loss": -9.4952392578125, "global_step": 87048, "epoch": 518} {"train_loss": -9.197579383850098, "global_step": 87049, "epoch": 518} {"train_loss": -9.293500900268555, "global_step": 87050, "epoch": 518} {"train_loss": -9.264199256896973, "global_step": 87051, "epoch": 518} {"train_loss": -9.604448318481445, "global_step": 87052, "epoch": 518} {"train_loss": -9.031675338745117, "global_step": 87053, "epoch": 518} {"train_loss": -9.221845626831055, "global_step": 87054, "epoch": 518} {"train_loss": -9.189956665039062, "global_step": 87055, "epoch": 518} {"train_loss": -9.343473434448242, "global_step": 87056, "epoch": 518} {"train_loss": -9.157352447509766, "global_step": 87057, "epoch": 518} {"train_loss": -9.080337524414062, "global_step": 87058, "epoch": 518} {"train_loss": -9.383810997009277, "global_step": 87059, "epoch": 518} {"train_loss": -9.037817001342773, "global_step": 87060, "epoch": 518} {"train_loss": -9.366975784301758, "global_step": 87061, "epoch": 518} {"train_loss": -9.125283241271973, "global_step": 87062, "epoch": 518} {"train_loss": -9.305854797363281, "global_step": 87063, "epoch": 518} {"train_loss": -9.188970565795898, "global_step": 87064, "epoch": 518} {"train_loss": -9.474072456359863, "global_step": 87065, "epoch": 518} {"train_loss": -9.42221450805664, "global_step": 87066, "epoch": 518} {"train_loss": -9.242860794067383, "global_step": 87067, "epoch": 518} {"train_loss": -9.362707138061523, "global_step": 87068, "epoch": 518} {"train_loss": -9.081612586975098, "global_step": 87069, "epoch": 518} {"train_loss": -9.083211898803711, "global_step": 87070, "epoch": 518} {"train_loss": -9.148649215698242, "global_step": 87071, "epoch": 518} {"train_loss": -9.466733932495117, "global_step": 87072, "epoch": 518} {"train_loss": -9.476773262023926, "global_step": 87073, "epoch": 518} {"train_loss": -9.307816505432129, "global_step": 87074, "epoch": 518} {"train_loss": -9.373159408569336, "global_step": 87075, "epoch": 518} {"train_loss": -9.704072952270508, "global_step": 87076, "epoch": 518} {"train_loss": -9.40250015258789, "global_step": 87077, "epoch": 518} {"train_loss": -9.437798500061035, "global_step": 87078, "epoch": 518} {"train_loss": -9.528852462768555, "global_step": 87079, "epoch": 518} {"train_loss": -9.550169944763184, "global_step": 87080, "epoch": 518} {"train_loss": -9.365333557128906, "global_step": 87081, "epoch": 518} {"train_loss": -9.726858139038086, "global_step": 87082, "epoch": 518} {"train_loss": -9.203131675720215, "global_step": 87083, "epoch": 518} {"train_loss": -9.743494987487793, "global_step": 87084, "epoch": 518} {"train_loss": -9.551902770996094, "global_step": 87085, "epoch": 518} {"train_loss": -9.441060066223145, "global_step": 87086, "epoch": 518} {"train_loss": -9.424777030944824, "global_step": 87087, "epoch": 518} {"train_loss": -9.407898902893066, "global_step": 87088, "epoch": 518} {"train_loss": -9.354373931884766, "global_step": 87089, "epoch": 518} {"train_loss": -9.614725112915039, "global_step": 87090, "epoch": 518} {"train_loss": -9.458751678466797, "global_step": 87091, "epoch": 518} {"train_loss": -9.358905792236328, "global_step": 87092, "epoch": 518} {"train_loss": -9.451874732971191, "global_step": 87093, "epoch": 518} {"train_loss": -9.424528121948242, "global_step": 87094, "epoch": 518} {"train_loss": -9.509126663208008, "global_step": 87095, "epoch": 518} {"train_loss": -9.117288589477539, "global_step": 87096, "epoch": 518} {"train_loss": -9.399683952331543, "global_step": 87097, "epoch": 518} {"train_loss": -9.137548446655273, "global_step": 87098, "epoch": 518} {"train_loss": -9.572670936584473, "global_step": 87099, "epoch": 518} {"train_loss": -9.358550071716309, "global_step": 87100, "epoch": 518} {"train_loss": -9.362618446350098, "global_step": 87101, "epoch": 518} {"train_loss": -9.287732124328613, "global_step": 87102, "epoch": 518} {"train_loss": -9.03492259979248, "global_step": 87103, "epoch": 518} {"train_loss": -9.339790344238281, "global_step": 87104, "epoch": 518} {"train_loss": -9.129315376281738, "global_step": 87105, "epoch": 518} {"train_loss": -9.367904663085938, "global_step": 87106, "epoch": 518} {"train_loss": -9.178960800170898, "global_step": 87107, "epoch": 518} {"train_loss": -9.472028732299805, "global_step": 87108, "epoch": 518} {"train_loss": -9.42670726776123, "global_step": 87109, "epoch": 518} {"train_loss": -9.365928649902344, "global_step": 87110, "epoch": 518} {"train_loss": -9.5486478805542, "global_step": 87111, "epoch": 518} {"train_loss": -9.272268295288086, "global_step": 87112, "epoch": 518} {"train_loss": -9.2142333984375, "global_step": 87113, "epoch": 518} {"train_loss": -9.25168514251709, "global_step": 87114, "epoch": 518} {"train_loss": -9.24227523803711, "global_step": 87115, "epoch": 518} {"train_loss": -9.278223037719727, "global_step": 87116, "epoch": 518} {"train_loss": -9.323150634765625, "global_step": 87117, "epoch": 518} {"train_loss": -9.108661651611328, "global_step": 87118, "epoch": 518} {"train_loss": -9.626771926879883, "global_step": 87119, "epoch": 518} {"train_loss": -9.361756324768066, "global_step": 87120, "epoch": 518} {"train_loss": -9.375164031982422, "global_step": 87121, "epoch": 518} {"train_loss": -9.496389389038086, "global_step": 87122, "epoch": 518} {"train_loss": -9.400069236755371, "global_step": 87123, "epoch": 518} {"train_loss": -9.259363174438477, "global_step": 87124, "epoch": 518} {"train_loss": -9.494479179382324, "global_step": 87125, "epoch": 518} {"train_loss": -9.286802291870117, "global_step": 87126, "epoch": 518} {"train_loss": -9.559006690979004, "global_step": 87127, "epoch": 518} {"train_loss": -9.261241912841797, "global_step": 87128, "epoch": 518} {"train_loss": -9.360215187072754, "global_step": 87129, "epoch": 518} {"train_loss": -9.418743133544922, "global_step": 87130, "epoch": 518} {"train_loss": -9.32319164276123, "global_step": 87131, "epoch": 518} {"train_loss": -9.419529914855957, "global_step": 87132, "epoch": 518} {"train_loss": -9.431018829345703, "global_step": 87133, "epoch": 518} {"train_loss": -9.36496353149414, "global_step": 87134, "epoch": 518} {"train_loss": -9.378717422485352, "global_step": 87135, "epoch": 518} {"train_loss": -9.301337242126465, "global_step": 87136, "epoch": 518} {"train_loss": -9.564718246459961, "global_step": 87137, "epoch": 518} {"train_loss": -9.488324165344238, "global_step": 87138, "epoch": 518} {"train_loss": -9.382840156555176, "global_step": 87139, "epoch": 518} {"train_loss": -9.408001899719238, "global_step": 87140, "epoch": 518} {"train_loss": -9.42961311340332, "global_step": 87141, "epoch": 518} {"train_loss": -9.57735824584961, "global_step": 87142, "epoch": 518} {"train_loss": -9.6478271484375, "global_step": 87143, "epoch": 518} {"train_loss": -9.301093101501465, "global_step": 87144, "epoch": 518} {"train_loss": -9.722623825073242, "global_step": 87145, "epoch": 518} {"train_loss": -9.095314025878906, "global_step": 87146, "epoch": 518} {"train_loss": -9.621700286865234, "global_step": 87147, "epoch": 518} {"train_loss": -9.492902755737305, "global_step": 87148, "epoch": 518} {"train_loss": -9.47480583190918, "global_step": 87149, "epoch": 518} {"train_loss": -9.582792282104492, "global_step": 87150, "epoch": 518} {"train_loss": -9.136178970336914, "global_step": 87151, "epoch": 518} {"train_loss": -9.552464485168457, "global_step": 87152, "epoch": 518} {"train_loss": -9.658805847167969, "global_step": 87153, "epoch": 518} {"train_loss": -9.671982765197754, "global_step": 87154, "epoch": 518} {"train_loss": -9.539568901062012, "global_step": 87155, "epoch": 518} {"train_loss": -9.829994201660156, "global_step": 87156, "epoch": 518} {"train_loss": -9.509077072143555, "global_step": 87157, "epoch": 518} {"train_loss": -9.703147888183594, "global_step": 87158, "epoch": 518} {"train_loss": -9.579813003540039, "global_step": 87159, "epoch": 518} {"train_loss": -9.688541412353516, "global_step": 87160, "epoch": 518} {"train_loss": -9.377593040466309, "global_step": 87161, "epoch": 518} {"train_loss": -9.315295219421387, "global_step": 87162, "epoch": 518} {"train_loss": -9.475701332092285, "global_step": 87163, "epoch": 518} {"train_loss": -9.007932662963867, "global_step": 87164, "epoch": 518} {"train_loss": -9.564935684204102, "global_step": 87165, "epoch": 518} {"train_loss": -9.378593444824219, "global_step": 87166, "epoch": 518} {"train_loss": -9.26798152923584, "global_step": 87167, "epoch": 518} {"train_loss": -9.455320358276367, "global_step": 87168, "epoch": 518} {"train_loss": -9.375401496887207, "global_step": 87169, "epoch": 518} {"train_loss": -9.438608169555664, "global_step": 87170, "epoch": 518} {"train_loss": -9.488229751586914, "global_step": 87171, "epoch": 518} {"train_loss": -9.327608108520508, "global_step": 87172, "epoch": 518} {"train_loss": -9.49869441986084, "global_step": 87173, "epoch": 518} {"train_loss": -9.517644882202148, "global_step": 87174, "epoch": 518} {"train_loss": -9.335066795349121, "global_step": 87175, "epoch": 518} {"train_loss": -9.209680557250977, "global_step": 87176, "epoch": 518} {"train_loss": -9.358370780944824, "global_step": 87177, "epoch": 518} {"train_loss": -9.396215438842773, "global_step": 87178, "epoch": 518} {"train_loss": -9.541568756103516, "global_step": 87179, "epoch": 518} {"train_loss": -9.335314750671387, "global_step": 87180, "epoch": 518} {"train_loss": -9.283799171447754, "global_step": 87181, "epoch": 518} {"train_loss": -9.270341873168945, "global_step": 87182, "epoch": 518} {"train_loss": -9.265213012695312, "global_step": 87183, "epoch": 518} {"train_loss": -9.047574996948242, "global_step": 87184, "epoch": 518} {"train_loss": -9.351651191711426, "global_step": 87185, "epoch": 518} {"train_loss": -9.426735877990723, "global_step": 87186, "epoch": 518} {"train_loss": -9.309953689575195, "global_step": 87187, "epoch": 518} {"train_loss": -9.372488021850586, "global_step": 87188, "epoch": 518} {"train_loss": -9.370086669921875, "global_step": 87189, "epoch": 518} {"train_loss": -9.402572631835938, "global_step": 87190, "epoch": 518} {"train_loss": -9.358940130188351, "global_step": 87191, "epoch": 518, "val_loss": 199014.15625} {"train_loss": -9.208216667175293, "global_step": 87192, "epoch": 519} {"train_loss": -9.279581069946289, "global_step": 87193, "epoch": 519} {"train_loss": -9.198160171508789, "global_step": 87194, "epoch": 519} {"train_loss": -9.128761291503906, "global_step": 87195, "epoch": 519} {"train_loss": -8.763833999633789, "global_step": 87196, "epoch": 519} {"train_loss": -8.841288566589355, "global_step": 87197, "epoch": 519} {"train_loss": -8.23501968383789, "global_step": 87198, "epoch": 519} {"train_loss": -8.685625076293945, "global_step": 87199, "epoch": 519} {"train_loss": -8.33829116821289, "global_step": 87200, "epoch": 519} {"train_loss": -8.217899322509766, "global_step": 87201, "epoch": 519} {"train_loss": -8.65025520324707, "global_step": 87202, "epoch": 519} {"train_loss": -8.799670219421387, "global_step": 87203, "epoch": 519} {"train_loss": -8.66642951965332, "global_step": 87204, "epoch": 519} {"train_loss": -8.874792098999023, "global_step": 87205, "epoch": 519} {"train_loss": -8.985967636108398, "global_step": 87206, "epoch": 519} {"train_loss": -8.679080963134766, "global_step": 87207, "epoch": 519} {"train_loss": -8.462133407592773, "global_step": 87208, "epoch": 519} {"train_loss": -8.971895217895508, "global_step": 87209, "epoch": 519} {"train_loss": -8.813495635986328, "global_step": 87210, "epoch": 519} {"train_loss": -9.057899475097656, "global_step": 87211, "epoch": 519} {"train_loss": -8.821824073791504, "global_step": 87212, "epoch": 519} {"train_loss": -8.960049629211426, "global_step": 87213, "epoch": 519} {"train_loss": -9.037906646728516, "global_step": 87214, "epoch": 519} {"train_loss": -9.082443237304688, "global_step": 87215, "epoch": 519} {"train_loss": -9.07333755493164, "global_step": 87216, "epoch": 519} {"train_loss": -9.174690246582031, "global_step": 87217, "epoch": 519} {"train_loss": -9.143638610839844, "global_step": 87218, "epoch": 519} {"train_loss": -9.132038116455078, "global_step": 87219, "epoch": 519} {"train_loss": -9.193513870239258, "global_step": 87220, "epoch": 519} {"train_loss": -9.305185317993164, "global_step": 87221, "epoch": 519} {"train_loss": -9.272768020629883, "global_step": 87222, "epoch": 519} {"train_loss": -9.366716384887695, "global_step": 87223, "epoch": 519} {"train_loss": -9.23432445526123, "global_step": 87224, "epoch": 519} {"train_loss": -9.511518478393555, "global_step": 87225, "epoch": 519} {"train_loss": -9.246564865112305, "global_step": 87226, "epoch": 519} {"train_loss": -9.179464340209961, "global_step": 87227, "epoch": 519} {"train_loss": -9.367862701416016, "global_step": 87228, "epoch": 519} {"train_loss": -9.518351554870605, "global_step": 87229, "epoch": 519} {"train_loss": -9.596397399902344, "global_step": 87230, "epoch": 519} {"train_loss": -9.50627326965332, "global_step": 87231, "epoch": 519} {"train_loss": -9.579513549804688, "global_step": 87232, "epoch": 519} {"train_loss": -9.824904441833496, "global_step": 87233, "epoch": 519} {"train_loss": -9.505097389221191, "global_step": 87234, "epoch": 519} {"train_loss": -9.550943374633789, "global_step": 87235, "epoch": 519} {"train_loss": -9.668049812316895, "global_step": 87236, "epoch": 519} {"train_loss": -9.75646686553955, "global_step": 87237, "epoch": 519} {"train_loss": -9.901944160461426, "global_step": 87238, "epoch": 519} {"train_loss": -9.776957511901855, "global_step": 87239, "epoch": 519} {"train_loss": -9.718771934509277, "global_step": 87240, "epoch": 519} {"train_loss": -9.669601440429688, "global_step": 87241, "epoch": 519} {"train_loss": -9.569154739379883, "global_step": 87242, "epoch": 519} {"train_loss": -9.611083030700684, "global_step": 87243, "epoch": 519} {"train_loss": -9.520546913146973, "global_step": 87244, "epoch": 519} {"train_loss": -9.485702514648438, "global_step": 87245, "epoch": 519} {"train_loss": -9.420453071594238, "global_step": 87246, "epoch": 519} {"train_loss": -9.048454284667969, "global_step": 87247, "epoch": 519} {"train_loss": -9.704745292663574, "global_step": 87248, "epoch": 519} {"train_loss": -9.309724807739258, "global_step": 87249, "epoch": 519} {"train_loss": -9.492502212524414, "global_step": 87250, "epoch": 519} {"train_loss": -9.588916778564453, "global_step": 87251, "epoch": 519} {"train_loss": -9.270139694213867, "global_step": 87252, "epoch": 519} {"train_loss": -9.499509811401367, "global_step": 87253, "epoch": 519} {"train_loss": -9.341501235961914, "global_step": 87254, "epoch": 519} {"train_loss": -9.458677291870117, "global_step": 87255, "epoch": 519} {"train_loss": -9.375, "global_step": 87256, "epoch": 519} {"train_loss": -9.049391746520996, "global_step": 87257, "epoch": 519} {"train_loss": -9.240150451660156, "global_step": 87258, "epoch": 519} {"train_loss": -9.32687759399414, "global_step": 87259, "epoch": 519} {"train_loss": -9.125152587890625, "global_step": 87260, "epoch": 519} {"train_loss": -9.241125106811523, "global_step": 87261, "epoch": 519} {"train_loss": -9.167667388916016, "global_step": 87262, "epoch": 519} {"train_loss": -9.405529022216797, "global_step": 87263, "epoch": 519} {"train_loss": -9.233711242675781, "global_step": 87264, "epoch": 519} {"train_loss": -8.903027534484863, "global_step": 87265, "epoch": 519} {"train_loss": -9.224143981933594, "global_step": 87266, "epoch": 519} {"train_loss": -9.109068870544434, "global_step": 87267, "epoch": 519} {"train_loss": -9.34739875793457, "global_step": 87268, "epoch": 519} {"train_loss": -9.367788314819336, "global_step": 87269, "epoch": 519} {"train_loss": -9.327699661254883, "global_step": 87270, "epoch": 519} {"train_loss": -9.204588890075684, "global_step": 87271, "epoch": 519} {"train_loss": -9.362262725830078, "global_step": 87272, "epoch": 519} {"train_loss": -9.190742492675781, "global_step": 87273, "epoch": 519} {"train_loss": -9.279037475585938, "global_step": 87274, "epoch": 519} {"train_loss": -9.311775207519531, "global_step": 87275, "epoch": 519} {"train_loss": -9.171772003173828, "global_step": 87276, "epoch": 519} {"train_loss": -9.042966842651367, "global_step": 87277, "epoch": 519} {"train_loss": -9.567780494689941, "global_step": 87278, "epoch": 519} {"train_loss": -9.54334831237793, "global_step": 87279, "epoch": 519} {"train_loss": -9.476035118103027, "global_step": 87280, "epoch": 519} {"train_loss": -9.272615432739258, "global_step": 87281, "epoch": 519} {"train_loss": -9.382863998413086, "global_step": 87282, "epoch": 519} {"train_loss": -9.497739791870117, "global_step": 87283, "epoch": 519} {"train_loss": -9.357111930847168, "global_step": 87284, "epoch": 519} {"train_loss": -9.2742280960083, "global_step": 87285, "epoch": 519} {"train_loss": -9.398056983947754, "global_step": 87286, "epoch": 519} {"train_loss": -9.255029678344727, "global_step": 87287, "epoch": 519} {"train_loss": -9.232867240905762, "global_step": 87288, "epoch": 519} {"train_loss": -9.36532974243164, "global_step": 87289, "epoch": 519} {"train_loss": -9.326532363891602, "global_step": 87290, "epoch": 519} {"train_loss": -9.176522254943848, "global_step": 87291, "epoch": 519} {"train_loss": -9.43283462524414, "global_step": 87292, "epoch": 519} {"train_loss": -9.431489944458008, "global_step": 87293, "epoch": 519} {"train_loss": -9.435674667358398, "global_step": 87294, "epoch": 519} {"train_loss": -9.663717269897461, "global_step": 87295, "epoch": 519} {"train_loss": -9.221023559570312, "global_step": 87296, "epoch": 519} {"train_loss": -9.551765441894531, "global_step": 87297, "epoch": 519} {"train_loss": -9.389998435974121, "global_step": 87298, "epoch": 519} {"train_loss": -9.207529067993164, "global_step": 87299, "epoch": 519} {"train_loss": -9.455299377441406, "global_step": 87300, "epoch": 519} {"train_loss": -9.406913757324219, "global_step": 87301, "epoch": 519} {"train_loss": -9.514418601989746, "global_step": 87302, "epoch": 519} {"train_loss": -9.4405517578125, "global_step": 87303, "epoch": 519} {"train_loss": -9.417839050292969, "global_step": 87304, "epoch": 519} {"train_loss": -9.436861038208008, "global_step": 87305, "epoch": 519} {"train_loss": -9.375418663024902, "global_step": 87306, "epoch": 519} {"train_loss": -9.62519645690918, "global_step": 87307, "epoch": 519} {"train_loss": -9.480936050415039, "global_step": 87308, "epoch": 519} {"train_loss": -9.362166404724121, "global_step": 87309, "epoch": 519} {"train_loss": -9.641040802001953, "global_step": 87310, "epoch": 519} {"train_loss": -9.591403007507324, "global_step": 87311, "epoch": 519} {"train_loss": -9.412006378173828, "global_step": 87312, "epoch": 519} {"train_loss": -9.654905319213867, "global_step": 87313, "epoch": 519} {"train_loss": -9.306172370910645, "global_step": 87314, "epoch": 519} {"train_loss": -9.749587059020996, "global_step": 87315, "epoch": 519} {"train_loss": -9.611968994140625, "global_step": 87316, "epoch": 519} {"train_loss": -9.288434982299805, "global_step": 87317, "epoch": 519} {"train_loss": -9.23589038848877, "global_step": 87318, "epoch": 519} {"train_loss": -9.476584434509277, "global_step": 87319, "epoch": 519} {"train_loss": -9.467950820922852, "global_step": 87320, "epoch": 519} {"train_loss": -9.625570297241211, "global_step": 87321, "epoch": 519} {"train_loss": -9.346946716308594, "global_step": 87322, "epoch": 519} {"train_loss": -9.416312217712402, "global_step": 87323, "epoch": 519} {"train_loss": -9.468408584594727, "global_step": 87324, "epoch": 519} {"train_loss": -9.455608367919922, "global_step": 87325, "epoch": 519} {"train_loss": -9.386438369750977, "global_step": 87326, "epoch": 519} {"train_loss": -9.27408218383789, "global_step": 87327, "epoch": 519} {"train_loss": -9.40156364440918, "global_step": 87328, "epoch": 519} {"train_loss": -9.252594947814941, "global_step": 87329, "epoch": 519} {"train_loss": -9.439367294311523, "global_step": 87330, "epoch": 519} {"train_loss": -9.176338195800781, "global_step": 87331, "epoch": 519} {"train_loss": -9.22889232635498, "global_step": 87332, "epoch": 519} {"train_loss": -8.987995147705078, "global_step": 87333, "epoch": 519} {"train_loss": -8.904542922973633, "global_step": 87334, "epoch": 519} {"train_loss": -9.276830673217773, "global_step": 87335, "epoch": 519} {"train_loss": -8.794939041137695, "global_step": 87336, "epoch": 519} {"train_loss": -9.118518829345703, "global_step": 87337, "epoch": 519} {"train_loss": -8.868672370910645, "global_step": 87338, "epoch": 519} {"train_loss": -9.041677474975586, "global_step": 87339, "epoch": 519} {"train_loss": -8.846689224243164, "global_step": 87340, "epoch": 519} {"train_loss": -9.043255805969238, "global_step": 87341, "epoch": 519} {"train_loss": -9.135127067565918, "global_step": 87342, "epoch": 519} {"train_loss": -9.051412582397461, "global_step": 87343, "epoch": 519} {"train_loss": -9.213784217834473, "global_step": 87344, "epoch": 519} {"train_loss": -9.295429229736328, "global_step": 87345, "epoch": 519} {"train_loss": -9.103072166442871, "global_step": 87346, "epoch": 519} {"train_loss": -9.222959518432617, "global_step": 87347, "epoch": 519} {"train_loss": -9.332073211669922, "global_step": 87348, "epoch": 519} {"train_loss": -9.372225761413574, "global_step": 87349, "epoch": 519} {"train_loss": -9.32779312133789, "global_step": 87350, "epoch": 519} {"train_loss": -9.078373908996582, "global_step": 87351, "epoch": 519} {"train_loss": -9.418140411376953, "global_step": 87352, "epoch": 519} {"train_loss": -9.404729843139648, "global_step": 87353, "epoch": 519} {"train_loss": -9.329463958740234, "global_step": 87354, "epoch": 519} {"train_loss": -9.298056602478027, "global_step": 87355, "epoch": 519} {"train_loss": -9.452054023742676, "global_step": 87356, "epoch": 519} {"train_loss": -9.260129928588867, "global_step": 87357, "epoch": 519} {"train_loss": -9.475847244262695, "global_step": 87358, "epoch": 519} {"train_loss": -9.279191851615906, "global_step": 87359, "epoch": 519, "val_loss": 201267.875} {"train_loss": -9.155054092407227, "global_step": 87360, "epoch": 520} {"train_loss": -9.460489273071289, "global_step": 87361, "epoch": 520} {"train_loss": -9.171405792236328, "global_step": 87362, "epoch": 520} {"train_loss": -9.119302749633789, "global_step": 87363, "epoch": 520} {"train_loss": -9.315436363220215, "global_step": 87364, "epoch": 520} {"train_loss": -9.546283721923828, "global_step": 87365, "epoch": 520} {"train_loss": -9.379386901855469, "global_step": 87366, "epoch": 520} {"train_loss": -9.311920166015625, "global_step": 87367, "epoch": 520} {"train_loss": -9.399686813354492, "global_step": 87368, "epoch": 520} {"train_loss": -9.593600273132324, "global_step": 87369, "epoch": 520} {"train_loss": -9.332012176513672, "global_step": 87370, "epoch": 520} {"train_loss": -9.547126770019531, "global_step": 87371, "epoch": 520} {"train_loss": -9.161022186279297, "global_step": 87372, "epoch": 520} {"train_loss": -9.623473167419434, "global_step": 87373, "epoch": 520} {"train_loss": -9.318209648132324, "global_step": 87374, "epoch": 520} {"train_loss": -9.585922241210938, "global_step": 87375, "epoch": 520} {"train_loss": -9.614500999450684, "global_step": 87376, "epoch": 520} {"train_loss": -9.332147598266602, "global_step": 87377, "epoch": 520} {"train_loss": -9.577173233032227, "global_step": 87378, "epoch": 520} {"train_loss": -9.48908805847168, "global_step": 87379, "epoch": 520} {"train_loss": -9.620521545410156, "global_step": 87380, "epoch": 520} {"train_loss": -9.620903015136719, "global_step": 87381, "epoch": 520} {"train_loss": -9.4848051071167, "global_step": 87382, "epoch": 520} {"train_loss": -9.640759468078613, "global_step": 87383, "epoch": 520} {"train_loss": -9.470480918884277, "global_step": 87384, "epoch": 520} {"train_loss": -9.542654037475586, "global_step": 87385, "epoch": 520} {"train_loss": -9.554910659790039, "global_step": 87386, "epoch": 520} {"train_loss": -9.545351028442383, "global_step": 87387, "epoch": 520} {"train_loss": -9.462468147277832, "global_step": 87388, "epoch": 520} {"train_loss": -9.444613456726074, "global_step": 87389, "epoch": 520} {"train_loss": -9.824629783630371, "global_step": 87390, "epoch": 520} {"train_loss": -9.39484977722168, "global_step": 87391, "epoch": 520} {"train_loss": -9.079549789428711, "global_step": 87392, "epoch": 520} {"train_loss": -9.654495239257812, "global_step": 87393, "epoch": 520} {"train_loss": -9.293790817260742, "global_step": 87394, "epoch": 520} {"train_loss": -9.35589599609375, "global_step": 87395, "epoch": 520} {"train_loss": -9.378798484802246, "global_step": 87396, "epoch": 520} {"train_loss": -9.570404052734375, "global_step": 87397, "epoch": 520} {"train_loss": -9.508481979370117, "global_step": 87398, "epoch": 520} {"train_loss": -9.426212310791016, "global_step": 87399, "epoch": 520} {"train_loss": -9.533350944519043, "global_step": 87400, "epoch": 520} {"train_loss": -9.45094108581543, "global_step": 87401, "epoch": 520} {"train_loss": -9.272964477539062, "global_step": 87402, "epoch": 520} {"train_loss": -9.550642013549805, "global_step": 87403, "epoch": 520} {"train_loss": -9.413335800170898, "global_step": 87404, "epoch": 520} {"train_loss": -9.724233627319336, "global_step": 87405, "epoch": 520} {"train_loss": -9.392690658569336, "global_step": 87406, "epoch": 520} {"train_loss": -9.46209716796875, "global_step": 87407, "epoch": 520} {"train_loss": -9.579202651977539, "global_step": 87408, "epoch": 520} {"train_loss": -9.503422737121582, "global_step": 87409, "epoch": 520} {"train_loss": -9.30571174621582, "global_step": 87410, "epoch": 520} {"train_loss": -9.569814682006836, "global_step": 87411, "epoch": 520} {"train_loss": -9.624091148376465, "global_step": 87412, "epoch": 520} {"train_loss": -9.258039474487305, "global_step": 87413, "epoch": 520} {"train_loss": -9.296957969665527, "global_step": 87414, "epoch": 520} {"train_loss": -9.445499420166016, "global_step": 87415, "epoch": 520} {"train_loss": -9.293760299682617, "global_step": 87416, "epoch": 520} {"train_loss": -9.243804931640625, "global_step": 87417, "epoch": 520} {"train_loss": -9.364299774169922, "global_step": 87418, "epoch": 520} {"train_loss": -8.969884872436523, "global_step": 87419, "epoch": 520} {"train_loss": -9.435518264770508, "global_step": 87420, "epoch": 520} {"train_loss": -9.325766563415527, "global_step": 87421, "epoch": 520} {"train_loss": -8.287788391113281, "global_step": 87422, "epoch": 520} {"train_loss": -9.387535095214844, "global_step": 87423, "epoch": 520} {"train_loss": -9.091104507446289, "global_step": 87424, "epoch": 520} {"train_loss": -9.211837768554688, "global_step": 87425, "epoch": 520} {"train_loss": -8.749396324157715, "global_step": 87426, "epoch": 520} {"train_loss": -9.169170379638672, "global_step": 87427, "epoch": 520} {"train_loss": -8.880559921264648, "global_step": 87428, "epoch": 520} {"train_loss": -9.180719375610352, "global_step": 87429, "epoch": 520} {"train_loss": -9.070016860961914, "global_step": 87430, "epoch": 520} {"train_loss": -9.313838958740234, "global_step": 87431, "epoch": 520} {"train_loss": -9.04394817352295, "global_step": 87432, "epoch": 520} {"train_loss": -9.25408935546875, "global_step": 87433, "epoch": 520} {"train_loss": -8.930885314941406, "global_step": 87434, "epoch": 520} {"train_loss": -9.5872220993042, "global_step": 87435, "epoch": 520} {"train_loss": -9.274919509887695, "global_step": 87436, "epoch": 520} {"train_loss": -9.274161338806152, "global_step": 87437, "epoch": 520} {"train_loss": -9.15478801727295, "global_step": 87438, "epoch": 520} {"train_loss": -9.169212341308594, "global_step": 87439, "epoch": 520} {"train_loss": -9.021663665771484, "global_step": 87440, "epoch": 520} {"train_loss": -9.423090934753418, "global_step": 87441, "epoch": 520} {"train_loss": -9.242008209228516, "global_step": 87442, "epoch": 520} {"train_loss": -9.047819137573242, "global_step": 87443, "epoch": 520} {"train_loss": -9.385594367980957, "global_step": 87444, "epoch": 520} {"train_loss": -9.254171371459961, "global_step": 87445, "epoch": 520} {"train_loss": -9.389039993286133, "global_step": 87446, "epoch": 520} {"train_loss": -9.282647132873535, "global_step": 87447, "epoch": 520} {"train_loss": -9.521814346313477, "global_step": 87448, "epoch": 520} {"train_loss": -9.387811660766602, "global_step": 87449, "epoch": 520} {"train_loss": -9.499258041381836, "global_step": 87450, "epoch": 520} {"train_loss": -9.600686073303223, "global_step": 87451, "epoch": 520} {"train_loss": -9.50880241394043, "global_step": 87452, "epoch": 520} {"train_loss": -9.27859878540039, "global_step": 87453, "epoch": 520} {"train_loss": -9.639656066894531, "global_step": 87454, "epoch": 520} {"train_loss": -9.377754211425781, "global_step": 87455, "epoch": 520} {"train_loss": -9.423072814941406, "global_step": 87456, "epoch": 520} {"train_loss": -9.550248146057129, "global_step": 87457, "epoch": 520} {"train_loss": -9.308563232421875, "global_step": 87458, "epoch": 520} {"train_loss": -9.557456970214844, "global_step": 87459, "epoch": 520} {"train_loss": -9.238808631896973, "global_step": 87460, "epoch": 520} {"train_loss": -9.692834854125977, "global_step": 87461, "epoch": 520} {"train_loss": -9.36499309539795, "global_step": 87462, "epoch": 520} {"train_loss": -9.56654167175293, "global_step": 87463, "epoch": 520} {"train_loss": -9.488426208496094, "global_step": 87464, "epoch": 520} {"train_loss": -9.50637435913086, "global_step": 87465, "epoch": 520} {"train_loss": -9.197980880737305, "global_step": 87466, "epoch": 520} {"train_loss": -9.6974515914917, "global_step": 87467, "epoch": 520} {"train_loss": -9.469415664672852, "global_step": 87468, "epoch": 520} {"train_loss": -9.428632736206055, "global_step": 87469, "epoch": 520} {"train_loss": -9.433233261108398, "global_step": 87470, "epoch": 520} {"train_loss": -9.205005645751953, "global_step": 87471, "epoch": 520} {"train_loss": -9.45601749420166, "global_step": 87472, "epoch": 520} {"train_loss": -9.505302429199219, "global_step": 87473, "epoch": 520} {"train_loss": -9.397451400756836, "global_step": 87474, "epoch": 520} {"train_loss": -9.253138542175293, "global_step": 87475, "epoch": 520} {"train_loss": -9.612228393554688, "global_step": 87476, "epoch": 520} {"train_loss": -9.283735275268555, "global_step": 87477, "epoch": 520} {"train_loss": -9.542734146118164, "global_step": 87478, "epoch": 520} {"train_loss": -9.403438568115234, "global_step": 87479, "epoch": 520} {"train_loss": -9.599184036254883, "global_step": 87480, "epoch": 520} {"train_loss": -9.592975616455078, "global_step": 87481, "epoch": 520} {"train_loss": -9.533965110778809, "global_step": 87482, "epoch": 520} {"train_loss": -9.402538299560547, "global_step": 87483, "epoch": 520} {"train_loss": -9.603473663330078, "global_step": 87484, "epoch": 520} {"train_loss": -9.672002792358398, "global_step": 87485, "epoch": 520} {"train_loss": -9.61154556274414, "global_step": 87486, "epoch": 520} {"train_loss": -9.615352630615234, "global_step": 87487, "epoch": 520} {"train_loss": -9.715720176696777, "global_step": 87488, "epoch": 520} {"train_loss": -9.504860877990723, "global_step": 87489, "epoch": 520} {"train_loss": -9.764957427978516, "global_step": 87490, "epoch": 520} {"train_loss": -9.488922119140625, "global_step": 87491, "epoch": 520} {"train_loss": -9.70524787902832, "global_step": 87492, "epoch": 520} {"train_loss": -9.550466537475586, "global_step": 87493, "epoch": 520} {"train_loss": -9.424271583557129, "global_step": 87494, "epoch": 520} {"train_loss": -9.602270126342773, "global_step": 87495, "epoch": 520} {"train_loss": -9.625428199768066, "global_step": 87496, "epoch": 520} {"train_loss": -9.695831298828125, "global_step": 87497, "epoch": 520} {"train_loss": -9.305389404296875, "global_step": 87498, "epoch": 520} {"train_loss": -9.391135215759277, "global_step": 87499, "epoch": 520} {"train_loss": -9.300134658813477, "global_step": 87500, "epoch": 520} {"train_loss": -9.344085693359375, "global_step": 87501, "epoch": 520} {"train_loss": -9.282626152038574, "global_step": 87502, "epoch": 520} {"train_loss": -9.388282775878906, "global_step": 87503, "epoch": 520} {"train_loss": -9.463910102844238, "global_step": 87504, "epoch": 520} {"train_loss": -9.427961349487305, "global_step": 87505, "epoch": 520} {"train_loss": -9.607661247253418, "global_step": 87506, "epoch": 520} {"train_loss": -9.539131164550781, "global_step": 87507, "epoch": 520} {"train_loss": -9.018925666809082, "global_step": 87508, "epoch": 520} {"train_loss": -9.419513702392578, "global_step": 87509, "epoch": 520} {"train_loss": -9.360664367675781, "global_step": 87510, "epoch": 520} {"train_loss": -9.145574569702148, "global_step": 87511, "epoch": 520} {"train_loss": -9.399731636047363, "global_step": 87512, "epoch": 520} {"train_loss": -9.385286331176758, "global_step": 87513, "epoch": 520} {"train_loss": -9.440995216369629, "global_step": 87514, "epoch": 520} {"train_loss": -9.384960174560547, "global_step": 87515, "epoch": 520} {"train_loss": -9.496683120727539, "global_step": 87516, "epoch": 520} {"train_loss": -9.188858032226562, "global_step": 87517, "epoch": 520} {"train_loss": -9.480669021606445, "global_step": 87518, "epoch": 520} {"train_loss": -9.18277645111084, "global_step": 87519, "epoch": 520} {"train_loss": -9.335350036621094, "global_step": 87520, "epoch": 520} {"train_loss": -9.201972961425781, "global_step": 87521, "epoch": 520} {"train_loss": -9.196266174316406, "global_step": 87522, "epoch": 520} {"train_loss": -9.507220268249512, "global_step": 87523, "epoch": 520} {"train_loss": -9.393856048583984, "global_step": 87524, "epoch": 520} {"train_loss": -9.554758071899414, "global_step": 87525, "epoch": 520} {"train_loss": -9.174468040466309, "global_step": 87526, "epoch": 520} {"train_loss": -9.398792306582132, "global_step": 87527, "epoch": 520, "val_loss": 202137.5, "train_action_mse_error": 8.54265308380127} {"train_loss": -9.153495788574219, "global_step": 87528, "epoch": 521} {"train_loss": -9.713519096374512, "global_step": 87529, "epoch": 521} {"train_loss": -9.312999725341797, "global_step": 87530, "epoch": 521} {"train_loss": -9.653236389160156, "global_step": 87531, "epoch": 521} {"train_loss": -9.144050598144531, "global_step": 87532, "epoch": 521} {"train_loss": -9.515406608581543, "global_step": 87533, "epoch": 521} {"train_loss": -9.497150421142578, "global_step": 87534, "epoch": 521} {"train_loss": -9.624753952026367, "global_step": 87535, "epoch": 521} {"train_loss": -9.519817352294922, "global_step": 87536, "epoch": 521} {"train_loss": -9.527743339538574, "global_step": 87537, "epoch": 521} {"train_loss": -9.401626586914062, "global_step": 87538, "epoch": 521} {"train_loss": -9.524497985839844, "global_step": 87539, "epoch": 521} {"train_loss": -9.080549240112305, "global_step": 87540, "epoch": 521} {"train_loss": -9.360458374023438, "global_step": 87541, "epoch": 521} {"train_loss": -9.59819507598877, "global_step": 87542, "epoch": 521} {"train_loss": -9.285408020019531, "global_step": 87543, "epoch": 521} {"train_loss": -9.453149795532227, "global_step": 87544, "epoch": 521} {"train_loss": -9.188980102539062, "global_step": 87545, "epoch": 521} {"train_loss": -9.404096603393555, "global_step": 87546, "epoch": 521} {"train_loss": -9.49143123626709, "global_step": 87547, "epoch": 521} {"train_loss": -9.250438690185547, "global_step": 87548, "epoch": 521} {"train_loss": -9.570047378540039, "global_step": 87549, "epoch": 521} {"train_loss": -9.438475608825684, "global_step": 87550, "epoch": 521} {"train_loss": -9.542472839355469, "global_step": 87551, "epoch": 521} {"train_loss": -9.367660522460938, "global_step": 87552, "epoch": 521} {"train_loss": -9.251867294311523, "global_step": 87553, "epoch": 521} {"train_loss": -9.184444427490234, "global_step": 87554, "epoch": 521} {"train_loss": -9.443286895751953, "global_step": 87555, "epoch": 521} {"train_loss": -9.44342041015625, "global_step": 87556, "epoch": 521} {"train_loss": -9.447243690490723, "global_step": 87557, "epoch": 521} {"train_loss": -9.486700057983398, "global_step": 87558, "epoch": 521} {"train_loss": -9.28844928741455, "global_step": 87559, "epoch": 521} {"train_loss": -9.327062606811523, "global_step": 87560, "epoch": 521} {"train_loss": -9.418943405151367, "global_step": 87561, "epoch": 521} {"train_loss": -9.150611877441406, "global_step": 87562, "epoch": 521} {"train_loss": -9.625289916992188, "global_step": 87563, "epoch": 521} {"train_loss": -9.397024154663086, "global_step": 87564, "epoch": 521} {"train_loss": -9.218873977661133, "global_step": 87565, "epoch": 521} {"train_loss": -9.318142890930176, "global_step": 87566, "epoch": 521} {"train_loss": -9.418537139892578, "global_step": 87567, "epoch": 521} {"train_loss": -9.176925659179688, "global_step": 87568, "epoch": 521} {"train_loss": -9.358570098876953, "global_step": 87569, "epoch": 521} {"train_loss": -9.364227294921875, "global_step": 87570, "epoch": 521} {"train_loss": -9.207447052001953, "global_step": 87571, "epoch": 521} {"train_loss": -9.23481273651123, "global_step": 87572, "epoch": 521} {"train_loss": -9.151233673095703, "global_step": 87573, "epoch": 521} {"train_loss": -9.419267654418945, "global_step": 87574, "epoch": 521} {"train_loss": -9.266261100769043, "global_step": 87575, "epoch": 521} {"train_loss": -9.053950309753418, "global_step": 87576, "epoch": 521} {"train_loss": -9.252042770385742, "global_step": 87577, "epoch": 521} {"train_loss": -9.331135749816895, "global_step": 87578, "epoch": 521} {"train_loss": -8.922656059265137, "global_step": 87579, "epoch": 521} {"train_loss": -9.307310104370117, "global_step": 87580, "epoch": 521} {"train_loss": -9.181774139404297, "global_step": 87581, "epoch": 521} {"train_loss": -9.426189422607422, "global_step": 87582, "epoch": 521} {"train_loss": -9.067482948303223, "global_step": 87583, "epoch": 521} {"train_loss": -9.524759292602539, "global_step": 87584, "epoch": 521} {"train_loss": -8.976119995117188, "global_step": 87585, "epoch": 521} {"train_loss": -9.043990135192871, "global_step": 87586, "epoch": 521} {"train_loss": -9.393031120300293, "global_step": 87587, "epoch": 521} {"train_loss": -9.393144607543945, "global_step": 87588, "epoch": 521} {"train_loss": -9.183778762817383, "global_step": 87589, "epoch": 521} {"train_loss": -9.15457534790039, "global_step": 87590, "epoch": 521} {"train_loss": -9.552592277526855, "global_step": 87591, "epoch": 521} {"train_loss": -9.162654876708984, "global_step": 87592, "epoch": 521} {"train_loss": -8.961008071899414, "global_step": 87593, "epoch": 521} {"train_loss": -9.339128494262695, "global_step": 87594, "epoch": 521} {"train_loss": -9.373882293701172, "global_step": 87595, "epoch": 521} {"train_loss": -9.072742462158203, "global_step": 87596, "epoch": 521} {"train_loss": -9.44809627532959, "global_step": 87597, "epoch": 521} {"train_loss": -9.224599838256836, "global_step": 87598, "epoch": 521} {"train_loss": -9.513057708740234, "global_step": 87599, "epoch": 521} {"train_loss": -9.331673622131348, "global_step": 87600, "epoch": 521} {"train_loss": -9.332365036010742, "global_step": 87601, "epoch": 521} {"train_loss": -9.592472076416016, "global_step": 87602, "epoch": 521} {"train_loss": -9.462055206298828, "global_step": 87603, "epoch": 521} {"train_loss": -9.423375129699707, "global_step": 87604, "epoch": 521} {"train_loss": -9.390031814575195, "global_step": 87605, "epoch": 521} {"train_loss": -9.661230087280273, "global_step": 87606, "epoch": 521} {"train_loss": -9.128979682922363, "global_step": 87607, "epoch": 521} {"train_loss": -9.496498107910156, "global_step": 87608, "epoch": 521} {"train_loss": -9.38121223449707, "global_step": 87609, "epoch": 521} {"train_loss": -9.325960159301758, "global_step": 87610, "epoch": 521} {"train_loss": -9.263699531555176, "global_step": 87611, "epoch": 521} {"train_loss": -9.226150512695312, "global_step": 87612, "epoch": 521} {"train_loss": -9.298429489135742, "global_step": 87613, "epoch": 521} {"train_loss": -9.417753219604492, "global_step": 87614, "epoch": 521} {"train_loss": -9.535964965820312, "global_step": 87615, "epoch": 521} {"train_loss": -9.507993698120117, "global_step": 87616, "epoch": 521} {"train_loss": -9.282506942749023, "global_step": 87617, "epoch": 521} {"train_loss": -9.348501205444336, "global_step": 87618, "epoch": 521} {"train_loss": -9.435918807983398, "global_step": 87619, "epoch": 521} {"train_loss": -9.27627182006836, "global_step": 87620, "epoch": 521} {"train_loss": -9.377914428710938, "global_step": 87621, "epoch": 521} {"train_loss": -9.172436714172363, "global_step": 87622, "epoch": 521} {"train_loss": -9.49316120147705, "global_step": 87623, "epoch": 521} {"train_loss": -9.373885154724121, "global_step": 87624, "epoch": 521} {"train_loss": -9.027843475341797, "global_step": 87625, "epoch": 521} {"train_loss": -9.186883926391602, "global_step": 87626, "epoch": 521} {"train_loss": -9.422447204589844, "global_step": 87627, "epoch": 521} {"train_loss": -9.212364196777344, "global_step": 87628, "epoch": 521} {"train_loss": -9.490781784057617, "global_step": 87629, "epoch": 521} {"train_loss": -9.445333480834961, "global_step": 87630, "epoch": 521} {"train_loss": -9.372440338134766, "global_step": 87631, "epoch": 521} {"train_loss": -9.53924560546875, "global_step": 87632, "epoch": 521} {"train_loss": -9.128253936767578, "global_step": 87633, "epoch": 521} {"train_loss": -9.491640090942383, "global_step": 87634, "epoch": 521} {"train_loss": -8.911264419555664, "global_step": 87635, "epoch": 521} {"train_loss": -9.313394546508789, "global_step": 87636, "epoch": 521} {"train_loss": -9.380133628845215, "global_step": 87637, "epoch": 521} {"train_loss": -9.202714920043945, "global_step": 87638, "epoch": 521} {"train_loss": -9.541970252990723, "global_step": 87639, "epoch": 521} {"train_loss": -9.255348205566406, "global_step": 87640, "epoch": 521} {"train_loss": -9.589534759521484, "global_step": 87641, "epoch": 521} {"train_loss": -9.618378639221191, "global_step": 87642, "epoch": 521} {"train_loss": -9.180789947509766, "global_step": 87643, "epoch": 521} {"train_loss": -9.553567886352539, "global_step": 87644, "epoch": 521} {"train_loss": -9.167984008789062, "global_step": 87645, "epoch": 521} {"train_loss": -9.39222240447998, "global_step": 87646, "epoch": 521} {"train_loss": -9.363490104675293, "global_step": 87647, "epoch": 521} {"train_loss": -9.116209030151367, "global_step": 87648, "epoch": 521} {"train_loss": -9.277166366577148, "global_step": 87649, "epoch": 521} {"train_loss": -8.791156768798828, "global_step": 87650, "epoch": 521} {"train_loss": -9.374760627746582, "global_step": 87651, "epoch": 521} {"train_loss": -8.947181701660156, "global_step": 87652, "epoch": 521} {"train_loss": -9.144765853881836, "global_step": 87653, "epoch": 521} {"train_loss": -9.318763732910156, "global_step": 87654, "epoch": 521} {"train_loss": -9.090664863586426, "global_step": 87655, "epoch": 521} {"train_loss": -9.008282661437988, "global_step": 87656, "epoch": 521} {"train_loss": -9.285276412963867, "global_step": 87657, "epoch": 521} {"train_loss": -9.416299819946289, "global_step": 87658, "epoch": 521} {"train_loss": -9.101283073425293, "global_step": 87659, "epoch": 521} {"train_loss": -9.190717697143555, "global_step": 87660, "epoch": 521} {"train_loss": -9.334187507629395, "global_step": 87661, "epoch": 521} {"train_loss": -9.289210319519043, "global_step": 87662, "epoch": 521} {"train_loss": -9.130552291870117, "global_step": 87663, "epoch": 521} {"train_loss": -9.440572738647461, "global_step": 87664, "epoch": 521} {"train_loss": -9.144763946533203, "global_step": 87665, "epoch": 521} {"train_loss": -9.175461769104004, "global_step": 87666, "epoch": 521} {"train_loss": -9.31204605102539, "global_step": 87667, "epoch": 521} {"train_loss": -9.480932235717773, "global_step": 87668, "epoch": 521} {"train_loss": -9.46193790435791, "global_step": 87669, "epoch": 521} {"train_loss": -9.179849624633789, "global_step": 87670, "epoch": 521} {"train_loss": -9.359002113342285, "global_step": 87671, "epoch": 521} {"train_loss": -9.22700309753418, "global_step": 87672, "epoch": 521} {"train_loss": -9.380973815917969, "global_step": 87673, "epoch": 521} {"train_loss": -9.390880584716797, "global_step": 87674, "epoch": 521} {"train_loss": -9.371810913085938, "global_step": 87675, "epoch": 521} {"train_loss": -9.558391571044922, "global_step": 87676, "epoch": 521} {"train_loss": -9.254400253295898, "global_step": 87677, "epoch": 521} {"train_loss": -9.538735389709473, "global_step": 87678, "epoch": 521} {"train_loss": -9.672961235046387, "global_step": 87679, "epoch": 521} {"train_loss": -9.322244644165039, "global_step": 87680, "epoch": 521} {"train_loss": -9.434416770935059, "global_step": 87681, "epoch": 521} {"train_loss": -9.547836303710938, "global_step": 87682, "epoch": 521} {"train_loss": -9.2528076171875, "global_step": 87683, "epoch": 521} {"train_loss": -9.603250503540039, "global_step": 87684, "epoch": 521} {"train_loss": -9.424949645996094, "global_step": 87685, "epoch": 521} {"train_loss": -9.667623519897461, "global_step": 87686, "epoch": 521} {"train_loss": -9.488151550292969, "global_step": 87687, "epoch": 521} {"train_loss": -9.728260040283203, "global_step": 87688, "epoch": 521} {"train_loss": -9.362744331359863, "global_step": 87689, "epoch": 521} {"train_loss": -9.697099685668945, "global_step": 87690, "epoch": 521} {"train_loss": -9.488788604736328, "global_step": 87691, "epoch": 521} {"train_loss": -9.594794273376465, "global_step": 87692, "epoch": 521} {"train_loss": -9.722667694091797, "global_step": 87693, "epoch": 521} {"train_loss": -9.683725357055664, "global_step": 87694, "epoch": 521} {"train_loss": -9.34874579452333, "global_step": 87695, "epoch": 521, "val_loss": 203548.703125} {"train_loss": -9.62864875793457, "global_step": 87696, "epoch": 522} {"train_loss": -9.302757263183594, "global_step": 87697, "epoch": 522} {"train_loss": -9.500740051269531, "global_step": 87698, "epoch": 522} {"train_loss": -9.463762283325195, "global_step": 87699, "epoch": 522} {"train_loss": -9.505706787109375, "global_step": 87700, "epoch": 522} {"train_loss": -9.433855056762695, "global_step": 87701, "epoch": 522} {"train_loss": -9.43666934967041, "global_step": 87702, "epoch": 522} {"train_loss": -9.411528587341309, "global_step": 87703, "epoch": 522} {"train_loss": -9.375434875488281, "global_step": 87704, "epoch": 522} {"train_loss": -9.727615356445312, "global_step": 87705, "epoch": 522} {"train_loss": -9.641340255737305, "global_step": 87706, "epoch": 522} {"train_loss": -9.414789199829102, "global_step": 87707, "epoch": 522} {"train_loss": -9.393171310424805, "global_step": 87708, "epoch": 522} {"train_loss": -9.215574264526367, "global_step": 87709, "epoch": 522} {"train_loss": -9.461700439453125, "global_step": 87710, "epoch": 522} {"train_loss": -9.409723281860352, "global_step": 87711, "epoch": 522} {"train_loss": -9.564887046813965, "global_step": 87712, "epoch": 522} {"train_loss": -9.491081237792969, "global_step": 87713, "epoch": 522} {"train_loss": -9.554662704467773, "global_step": 87714, "epoch": 522} {"train_loss": -9.039215087890625, "global_step": 87715, "epoch": 522} {"train_loss": -9.37147045135498, "global_step": 87716, "epoch": 522} {"train_loss": -9.160588264465332, "global_step": 87717, "epoch": 522} {"train_loss": -9.237007141113281, "global_step": 87718, "epoch": 522} {"train_loss": -9.050407409667969, "global_step": 87719, "epoch": 522} {"train_loss": -9.181970596313477, "global_step": 87720, "epoch": 522} {"train_loss": -8.73457145690918, "global_step": 87721, "epoch": 522} {"train_loss": -8.985494613647461, "global_step": 87722, "epoch": 522} {"train_loss": -9.226457595825195, "global_step": 87723, "epoch": 522} {"train_loss": -9.081331253051758, "global_step": 87724, "epoch": 522} {"train_loss": -9.001672744750977, "global_step": 87725, "epoch": 522} {"train_loss": -9.075431823730469, "global_step": 87726, "epoch": 522} {"train_loss": -9.259429931640625, "global_step": 87727, "epoch": 522} {"train_loss": -9.42941665649414, "global_step": 87728, "epoch": 522} {"train_loss": -9.07858657836914, "global_step": 87729, "epoch": 522} {"train_loss": -9.345712661743164, "global_step": 87730, "epoch": 522} {"train_loss": -9.266899108886719, "global_step": 87731, "epoch": 522} {"train_loss": -8.904008865356445, "global_step": 87732, "epoch": 522} {"train_loss": -9.21095085144043, "global_step": 87733, "epoch": 522} {"train_loss": -9.070883750915527, "global_step": 87734, "epoch": 522} {"train_loss": -9.287837982177734, "global_step": 87735, "epoch": 522} {"train_loss": -9.044244766235352, "global_step": 87736, "epoch": 522} {"train_loss": -9.092733383178711, "global_step": 87737, "epoch": 522} {"train_loss": -9.373519897460938, "global_step": 87738, "epoch": 522} {"train_loss": -9.501348495483398, "global_step": 87739, "epoch": 522} {"train_loss": -9.22127914428711, "global_step": 87740, "epoch": 522} {"train_loss": -9.27107048034668, "global_step": 87741, "epoch": 522} {"train_loss": -9.26237678527832, "global_step": 87742, "epoch": 522} {"train_loss": -9.37073802947998, "global_step": 87743, "epoch": 522} {"train_loss": -9.138107299804688, "global_step": 87744, "epoch": 522} {"train_loss": -9.335641860961914, "global_step": 87745, "epoch": 522} {"train_loss": -9.496719360351562, "global_step": 87746, "epoch": 522} {"train_loss": -9.32480525970459, "global_step": 87747, "epoch": 522} {"train_loss": -9.320150375366211, "global_step": 87748, "epoch": 522} {"train_loss": -9.539119720458984, "global_step": 87749, "epoch": 522} {"train_loss": -9.411273956298828, "global_step": 87750, "epoch": 522} {"train_loss": -9.353307723999023, "global_step": 87751, "epoch": 522} {"train_loss": -9.517154693603516, "global_step": 87752, "epoch": 522} {"train_loss": -9.476995468139648, "global_step": 87753, "epoch": 522} {"train_loss": -9.649045944213867, "global_step": 87754, "epoch": 522} {"train_loss": -9.385396957397461, "global_step": 87755, "epoch": 522} {"train_loss": -9.275141716003418, "global_step": 87756, "epoch": 522} {"train_loss": -9.450180053710938, "global_step": 87757, "epoch": 522} {"train_loss": -9.196311950683594, "global_step": 87758, "epoch": 522} {"train_loss": -9.497146606445312, "global_step": 87759, "epoch": 522} {"train_loss": -9.64453411102295, "global_step": 87760, "epoch": 522} {"train_loss": -9.51685619354248, "global_step": 87761, "epoch": 522} {"train_loss": -9.572229385375977, "global_step": 87762, "epoch": 522} {"train_loss": -9.499977111816406, "global_step": 87763, "epoch": 522} {"train_loss": -9.430354118347168, "global_step": 87764, "epoch": 522} {"train_loss": -9.58823013305664, "global_step": 87765, "epoch": 522} {"train_loss": -9.422548294067383, "global_step": 87766, "epoch": 522} {"train_loss": -9.257708549499512, "global_step": 87767, "epoch": 522} {"train_loss": -9.506117820739746, "global_step": 87768, "epoch": 522} {"train_loss": -9.593196868896484, "global_step": 87769, "epoch": 522} {"train_loss": -9.332181930541992, "global_step": 87770, "epoch": 522} {"train_loss": -9.260866165161133, "global_step": 87771, "epoch": 522} {"train_loss": -9.245475769042969, "global_step": 87772, "epoch": 522} {"train_loss": -9.402973175048828, "global_step": 87773, "epoch": 522} {"train_loss": -9.651800155639648, "global_step": 87774, "epoch": 522} {"train_loss": -9.478882789611816, "global_step": 87775, "epoch": 522} {"train_loss": -9.281770706176758, "global_step": 87776, "epoch": 522} {"train_loss": -9.302606582641602, "global_step": 87777, "epoch": 522} {"train_loss": -9.322687149047852, "global_step": 87778, "epoch": 522} {"train_loss": -9.333730697631836, "global_step": 87779, "epoch": 522} {"train_loss": -9.408792495727539, "global_step": 87780, "epoch": 522} {"train_loss": -9.399728775024414, "global_step": 87781, "epoch": 522} {"train_loss": -9.325700759887695, "global_step": 87782, "epoch": 522} {"train_loss": -9.439730644226074, "global_step": 87783, "epoch": 522} {"train_loss": -9.359774589538574, "global_step": 87784, "epoch": 522} {"train_loss": -9.350074768066406, "global_step": 87785, "epoch": 522} {"train_loss": -9.328803062438965, "global_step": 87786, "epoch": 522} {"train_loss": -9.566370964050293, "global_step": 87787, "epoch": 522} {"train_loss": -9.542949676513672, "global_step": 87788, "epoch": 522} {"train_loss": -9.647144317626953, "global_step": 87789, "epoch": 522} {"train_loss": -9.508172988891602, "global_step": 87790, "epoch": 522} {"train_loss": -9.6462984085083, "global_step": 87791, "epoch": 522} {"train_loss": -9.439009666442871, "global_step": 87792, "epoch": 522} {"train_loss": -9.247672080993652, "global_step": 87793, "epoch": 522} {"train_loss": -9.397552490234375, "global_step": 87794, "epoch": 522} {"train_loss": -9.155197143554688, "global_step": 87795, "epoch": 522} {"train_loss": -9.129414558410645, "global_step": 87796, "epoch": 522} {"train_loss": -9.298225402832031, "global_step": 87797, "epoch": 522} {"train_loss": -9.095773696899414, "global_step": 87798, "epoch": 522} {"train_loss": -9.101638793945312, "global_step": 87799, "epoch": 522} {"train_loss": -9.127756118774414, "global_step": 87800, "epoch": 522} {"train_loss": -9.143685340881348, "global_step": 87801, "epoch": 522} {"train_loss": -9.130114555358887, "global_step": 87802, "epoch": 522} {"train_loss": -9.158111572265625, "global_step": 87803, "epoch": 522} {"train_loss": -9.2569580078125, "global_step": 87804, "epoch": 522} {"train_loss": -9.209729194641113, "global_step": 87805, "epoch": 522} {"train_loss": -9.272106170654297, "global_step": 87806, "epoch": 522} {"train_loss": -9.214096069335938, "global_step": 87807, "epoch": 522} {"train_loss": -9.356319427490234, "global_step": 87808, "epoch": 522} {"train_loss": -9.322553634643555, "global_step": 87809, "epoch": 522} {"train_loss": -9.231517791748047, "global_step": 87810, "epoch": 522} {"train_loss": -9.521029472351074, "global_step": 87811, "epoch": 522} {"train_loss": -9.290630340576172, "global_step": 87812, "epoch": 522} {"train_loss": -9.376056671142578, "global_step": 87813, "epoch": 522} {"train_loss": -9.274381637573242, "global_step": 87814, "epoch": 522} {"train_loss": -9.41695785522461, "global_step": 87815, "epoch": 522} {"train_loss": -9.371540069580078, "global_step": 87816, "epoch": 522} {"train_loss": -9.387706756591797, "global_step": 87817, "epoch": 522} {"train_loss": -9.508766174316406, "global_step": 87818, "epoch": 522} {"train_loss": -9.502280235290527, "global_step": 87819, "epoch": 522} {"train_loss": -9.229496002197266, "global_step": 87820, "epoch": 522} {"train_loss": -9.488897323608398, "global_step": 87821, "epoch": 522} {"train_loss": -9.570915222167969, "global_step": 87822, "epoch": 522} {"train_loss": -9.363767623901367, "global_step": 87823, "epoch": 522} {"train_loss": -9.673851013183594, "global_step": 87824, "epoch": 522} {"train_loss": -9.229860305786133, "global_step": 87825, "epoch": 522} {"train_loss": -9.398305892944336, "global_step": 87826, "epoch": 522} {"train_loss": -9.049850463867188, "global_step": 87827, "epoch": 522} {"train_loss": -9.31967830657959, "global_step": 87828, "epoch": 522} {"train_loss": -9.229239463806152, "global_step": 87829, "epoch": 522} {"train_loss": -9.525566101074219, "global_step": 87830, "epoch": 522} {"train_loss": -9.438847541809082, "global_step": 87831, "epoch": 522} {"train_loss": -9.263978958129883, "global_step": 87832, "epoch": 522} {"train_loss": -9.659791946411133, "global_step": 87833, "epoch": 522} {"train_loss": -9.677555084228516, "global_step": 87834, "epoch": 522} {"train_loss": -9.402385711669922, "global_step": 87835, "epoch": 522} {"train_loss": -9.479159355163574, "global_step": 87836, "epoch": 522} {"train_loss": -9.47110366821289, "global_step": 87837, "epoch": 522} {"train_loss": -9.403343200683594, "global_step": 87838, "epoch": 522} {"train_loss": -9.607421875, "global_step": 87839, "epoch": 522} {"train_loss": -9.638285636901855, "global_step": 87840, "epoch": 522} {"train_loss": -9.08636474609375, "global_step": 87841, "epoch": 522} {"train_loss": -9.528127670288086, "global_step": 87842, "epoch": 522} {"train_loss": -9.113055229187012, "global_step": 87843, "epoch": 522} {"train_loss": -9.340668678283691, "global_step": 87844, "epoch": 522} {"train_loss": -9.272109985351562, "global_step": 87845, "epoch": 522} {"train_loss": -8.987995147705078, "global_step": 87846, "epoch": 522} {"train_loss": -9.258310317993164, "global_step": 87847, "epoch": 522} {"train_loss": -9.040215492248535, "global_step": 87848, "epoch": 522} {"train_loss": -9.357569694519043, "global_step": 87849, "epoch": 522} {"train_loss": -8.678839683532715, "global_step": 87850, "epoch": 522} {"train_loss": -9.05194091796875, "global_step": 87851, "epoch": 522} {"train_loss": -8.691308975219727, "global_step": 87852, "epoch": 522} {"train_loss": -8.96940803527832, "global_step": 87853, "epoch": 522} {"train_loss": -9.292171478271484, "global_step": 87854, "epoch": 522} {"train_loss": -9.10664176940918, "global_step": 87855, "epoch": 522} {"train_loss": -9.059925079345703, "global_step": 87856, "epoch": 522} {"train_loss": -9.283575057983398, "global_step": 87857, "epoch": 522} {"train_loss": -9.37326717376709, "global_step": 87858, "epoch": 522} {"train_loss": -9.340734481811523, "global_step": 87859, "epoch": 522} {"train_loss": -9.270044326782227, "global_step": 87860, "epoch": 522} {"train_loss": -9.191993713378906, "global_step": 87861, "epoch": 522} {"train_loss": -9.49901008605957, "global_step": 87862, "epoch": 522} {"train_loss": -9.331644796189808, "global_step": 87863, "epoch": 522, "val_loss": 201984.015625} {"train_loss": -9.383466720581055, "global_step": 87864, "epoch": 523} {"train_loss": -9.321138381958008, "global_step": 87865, "epoch": 523} {"train_loss": -9.371070861816406, "global_step": 87866, "epoch": 523} {"train_loss": -9.361162185668945, "global_step": 87867, "epoch": 523} {"train_loss": -9.28482437133789, "global_step": 87868, "epoch": 523} {"train_loss": -9.631422996520996, "global_step": 87869, "epoch": 523} {"train_loss": -9.278670310974121, "global_step": 87870, "epoch": 523} {"train_loss": -9.469703674316406, "global_step": 87871, "epoch": 523} {"train_loss": -9.298164367675781, "global_step": 87872, "epoch": 523} {"train_loss": -9.62306022644043, "global_step": 87873, "epoch": 523} {"train_loss": -9.570755004882812, "global_step": 87874, "epoch": 523} {"train_loss": -9.511930465698242, "global_step": 87875, "epoch": 523} {"train_loss": -9.39303970336914, "global_step": 87876, "epoch": 523} {"train_loss": -9.326972961425781, "global_step": 87877, "epoch": 523} {"train_loss": -9.487144470214844, "global_step": 87878, "epoch": 523} {"train_loss": -9.202434539794922, "global_step": 87879, "epoch": 523} {"train_loss": -9.421361923217773, "global_step": 87880, "epoch": 523} {"train_loss": -9.524053573608398, "global_step": 87881, "epoch": 523} {"train_loss": -9.629673957824707, "global_step": 87882, "epoch": 523} {"train_loss": -9.528303146362305, "global_step": 87883, "epoch": 523} {"train_loss": -9.51102066040039, "global_step": 87884, "epoch": 523} {"train_loss": -9.290633201599121, "global_step": 87885, "epoch": 523} {"train_loss": -9.399438858032227, "global_step": 87886, "epoch": 523} {"train_loss": -9.378084182739258, "global_step": 87887, "epoch": 523} {"train_loss": -9.481130599975586, "global_step": 87888, "epoch": 523} {"train_loss": -9.032892227172852, "global_step": 87889, "epoch": 523} {"train_loss": -9.667243957519531, "global_step": 87890, "epoch": 523} {"train_loss": -9.161066055297852, "global_step": 87891, "epoch": 523} {"train_loss": -9.400468826293945, "global_step": 87892, "epoch": 523} {"train_loss": -9.597088813781738, "global_step": 87893, "epoch": 523} {"train_loss": -9.404396057128906, "global_step": 87894, "epoch": 523} {"train_loss": -9.483464241027832, "global_step": 87895, "epoch": 523} {"train_loss": -9.472248077392578, "global_step": 87896, "epoch": 523} {"train_loss": -9.434449195861816, "global_step": 87897, "epoch": 523} {"train_loss": -9.402195930480957, "global_step": 87898, "epoch": 523} {"train_loss": -9.310287475585938, "global_step": 87899, "epoch": 523} {"train_loss": -9.281190872192383, "global_step": 87900, "epoch": 523} {"train_loss": -9.314166069030762, "global_step": 87901, "epoch": 523} {"train_loss": -9.53454875946045, "global_step": 87902, "epoch": 523} {"train_loss": -9.327619552612305, "global_step": 87903, "epoch": 523} {"train_loss": -9.378158569335938, "global_step": 87904, "epoch": 523} {"train_loss": -9.574951171875, "global_step": 87905, "epoch": 523} {"train_loss": -9.431624412536621, "global_step": 87906, "epoch": 523} {"train_loss": -9.123054504394531, "global_step": 87907, "epoch": 523} {"train_loss": -9.438472747802734, "global_step": 87908, "epoch": 523} {"train_loss": -9.127945899963379, "global_step": 87909, "epoch": 523} {"train_loss": -8.909160614013672, "global_step": 87910, "epoch": 523} {"train_loss": -9.377347946166992, "global_step": 87911, "epoch": 523} {"train_loss": -9.040091514587402, "global_step": 87912, "epoch": 523} {"train_loss": -9.300676345825195, "global_step": 87913, "epoch": 523} {"train_loss": -9.299728393554688, "global_step": 87914, "epoch": 523} {"train_loss": -9.213258743286133, "global_step": 87915, "epoch": 523} {"train_loss": -8.983560562133789, "global_step": 87916, "epoch": 523} {"train_loss": -9.3735990524292, "global_step": 87917, "epoch": 523} {"train_loss": -9.055768966674805, "global_step": 87918, "epoch": 523} {"train_loss": -9.179733276367188, "global_step": 87919, "epoch": 523} {"train_loss": -9.074560165405273, "global_step": 87920, "epoch": 523} {"train_loss": -9.334151268005371, "global_step": 87921, "epoch": 523} {"train_loss": -9.471290588378906, "global_step": 87922, "epoch": 523} {"train_loss": -9.254222869873047, "global_step": 87923, "epoch": 523} {"train_loss": -9.317416191101074, "global_step": 87924, "epoch": 523} {"train_loss": -9.345163345336914, "global_step": 87925, "epoch": 523} {"train_loss": -9.401782035827637, "global_step": 87926, "epoch": 523} {"train_loss": -9.345101356506348, "global_step": 87927, "epoch": 523} {"train_loss": -9.102240562438965, "global_step": 87928, "epoch": 523} {"train_loss": -8.932111740112305, "global_step": 87929, "epoch": 523} {"train_loss": -9.126958847045898, "global_step": 87930, "epoch": 523} {"train_loss": -9.235373497009277, "global_step": 87931, "epoch": 523} {"train_loss": -9.288116455078125, "global_step": 87932, "epoch": 523} {"train_loss": -9.401467323303223, "global_step": 87933, "epoch": 523} {"train_loss": -9.4595365524292, "global_step": 87934, "epoch": 523} {"train_loss": -9.466731071472168, "global_step": 87935, "epoch": 523} {"train_loss": -9.239187240600586, "global_step": 87936, "epoch": 523} {"train_loss": -9.50764274597168, "global_step": 87937, "epoch": 523} {"train_loss": -9.222426414489746, "global_step": 87938, "epoch": 523} {"train_loss": -9.581939697265625, "global_step": 87939, "epoch": 523} {"train_loss": -9.53924560546875, "global_step": 87940, "epoch": 523} {"train_loss": -9.551488876342773, "global_step": 87941, "epoch": 523} {"train_loss": -9.356986999511719, "global_step": 87942, "epoch": 523} {"train_loss": -9.572428703308105, "global_step": 87943, "epoch": 523} {"train_loss": -9.422540664672852, "global_step": 87944, "epoch": 523} {"train_loss": -9.301546096801758, "global_step": 87945, "epoch": 523} {"train_loss": -9.680135726928711, "global_step": 87946, "epoch": 523} {"train_loss": -9.480439186096191, "global_step": 87947, "epoch": 523} {"train_loss": -9.409908294677734, "global_step": 87948, "epoch": 523} {"train_loss": -9.464512825012207, "global_step": 87949, "epoch": 523} {"train_loss": -9.397516250610352, "global_step": 87950, "epoch": 523} {"train_loss": -9.562106132507324, "global_step": 87951, "epoch": 523} {"train_loss": -9.458332061767578, "global_step": 87952, "epoch": 523} {"train_loss": -9.572188377380371, "global_step": 87953, "epoch": 523} {"train_loss": -9.511180877685547, "global_step": 87954, "epoch": 523} {"train_loss": -9.41357421875, "global_step": 87955, "epoch": 523} {"train_loss": -9.517904281616211, "global_step": 87956, "epoch": 523} {"train_loss": -9.426277160644531, "global_step": 87957, "epoch": 523} {"train_loss": -9.262084007263184, "global_step": 87958, "epoch": 523} {"train_loss": -9.41663932800293, "global_step": 87959, "epoch": 523} {"train_loss": -9.288239479064941, "global_step": 87960, "epoch": 523} {"train_loss": -9.38008975982666, "global_step": 87961, "epoch": 523} {"train_loss": -9.39909553527832, "global_step": 87962, "epoch": 523} {"train_loss": -9.355745315551758, "global_step": 87963, "epoch": 523} {"train_loss": -9.342748641967773, "global_step": 87964, "epoch": 523} {"train_loss": -9.503087997436523, "global_step": 87965, "epoch": 523} {"train_loss": -9.421001434326172, "global_step": 87966, "epoch": 523} {"train_loss": -9.483932495117188, "global_step": 87967, "epoch": 523} {"train_loss": -9.327653884887695, "global_step": 87968, "epoch": 523} {"train_loss": -9.46438217163086, "global_step": 87969, "epoch": 523} {"train_loss": -9.755099296569824, "global_step": 87970, "epoch": 523} {"train_loss": -9.413901329040527, "global_step": 87971, "epoch": 523} {"train_loss": -9.23194694519043, "global_step": 87972, "epoch": 523} {"train_loss": -9.374207496643066, "global_step": 87973, "epoch": 523} {"train_loss": -9.514217376708984, "global_step": 87974, "epoch": 523} {"train_loss": -9.26568603515625, "global_step": 87975, "epoch": 523} {"train_loss": -9.297252655029297, "global_step": 87976, "epoch": 523} {"train_loss": -9.207267761230469, "global_step": 87977, "epoch": 523} {"train_loss": -9.416051864624023, "global_step": 87978, "epoch": 523} {"train_loss": -9.437278747558594, "global_step": 87979, "epoch": 523} {"train_loss": -9.394347190856934, "global_step": 87980, "epoch": 523} {"train_loss": -9.311075210571289, "global_step": 87981, "epoch": 523} {"train_loss": -9.485491752624512, "global_step": 87982, "epoch": 523} {"train_loss": -9.338990211486816, "global_step": 87983, "epoch": 523} {"train_loss": -9.325749397277832, "global_step": 87984, "epoch": 523} {"train_loss": -9.1886568069458, "global_step": 87985, "epoch": 523} {"train_loss": -9.385393142700195, "global_step": 87986, "epoch": 523} {"train_loss": -9.491800308227539, "global_step": 87987, "epoch": 523} {"train_loss": -9.285566329956055, "global_step": 87988, "epoch": 523} {"train_loss": -9.54513168334961, "global_step": 87989, "epoch": 523} {"train_loss": -9.166570663452148, "global_step": 87990, "epoch": 523} {"train_loss": -9.513232231140137, "global_step": 87991, "epoch": 523} {"train_loss": -9.211142539978027, "global_step": 87992, "epoch": 523} {"train_loss": -9.074951171875, "global_step": 87993, "epoch": 523} {"train_loss": -9.598478317260742, "global_step": 87994, "epoch": 523} {"train_loss": -8.987804412841797, "global_step": 87995, "epoch": 523} {"train_loss": -9.599536895751953, "global_step": 87996, "epoch": 523} {"train_loss": -9.304206848144531, "global_step": 87997, "epoch": 523} {"train_loss": -9.086841583251953, "global_step": 87998, "epoch": 523} {"train_loss": -9.398835182189941, "global_step": 87999, "epoch": 523} {"train_loss": -9.246912002563477, "global_step": 88000, "epoch": 523} {"train_loss": -9.182027816772461, "global_step": 88001, "epoch": 523} {"train_loss": -9.423318862915039, "global_step": 88002, "epoch": 523} {"train_loss": -9.314979553222656, "global_step": 88003, "epoch": 523} {"train_loss": -9.345867156982422, "global_step": 88004, "epoch": 523} {"train_loss": -9.373170852661133, "global_step": 88005, "epoch": 523} {"train_loss": -9.530509948730469, "global_step": 88006, "epoch": 523} {"train_loss": -9.451765060424805, "global_step": 88007, "epoch": 523} {"train_loss": -9.698713302612305, "global_step": 88008, "epoch": 523} {"train_loss": -9.521303176879883, "global_step": 88009, "epoch": 523} {"train_loss": -9.49730396270752, "global_step": 88010, "epoch": 523} {"train_loss": -9.29885196685791, "global_step": 88011, "epoch": 523} {"train_loss": -9.460485458374023, "global_step": 88012, "epoch": 523} {"train_loss": -9.550430297851562, "global_step": 88013, "epoch": 523} {"train_loss": -9.438518524169922, "global_step": 88014, "epoch": 523} {"train_loss": -9.61843490600586, "global_step": 88015, "epoch": 523} {"train_loss": -9.397473335266113, "global_step": 88016, "epoch": 523} {"train_loss": -9.420560836791992, "global_step": 88017, "epoch": 523} {"train_loss": -9.391307830810547, "global_step": 88018, "epoch": 523} {"train_loss": -9.304767608642578, "global_step": 88019, "epoch": 523} {"train_loss": -9.354440689086914, "global_step": 88020, "epoch": 523} {"train_loss": -9.178548812866211, "global_step": 88021, "epoch": 523} {"train_loss": -9.716669082641602, "global_step": 88022, "epoch": 523} {"train_loss": -9.40681266784668, "global_step": 88023, "epoch": 523} {"train_loss": -9.227155685424805, "global_step": 88024, "epoch": 523} {"train_loss": -9.391268730163574, "global_step": 88025, "epoch": 523} {"train_loss": -9.30636978149414, "global_step": 88026, "epoch": 523} {"train_loss": -9.633321762084961, "global_step": 88027, "epoch": 523} {"train_loss": -9.335607528686523, "global_step": 88028, "epoch": 523} {"train_loss": -9.458808898925781, "global_step": 88029, "epoch": 523} {"train_loss": -9.636496543884277, "global_step": 88030, "epoch": 523} {"train_loss": -9.379181413423447, "global_step": 88031, "epoch": 523, "val_loss": 201418.609375} {"train_loss": -9.538267135620117, "global_step": 88032, "epoch": 524} {"train_loss": -9.391861915588379, "global_step": 88033, "epoch": 524} {"train_loss": -9.525793075561523, "global_step": 88034, "epoch": 524} {"train_loss": -9.383869171142578, "global_step": 88035, "epoch": 524} {"train_loss": -9.44955825805664, "global_step": 88036, "epoch": 524} {"train_loss": -9.667073249816895, "global_step": 88037, "epoch": 524} {"train_loss": -9.628364562988281, "global_step": 88038, "epoch": 524} {"train_loss": -9.56561279296875, "global_step": 88039, "epoch": 524} {"train_loss": -9.669323921203613, "global_step": 88040, "epoch": 524} {"train_loss": -9.527381896972656, "global_step": 88041, "epoch": 524} {"train_loss": -9.609563827514648, "global_step": 88042, "epoch": 524} {"train_loss": -9.660902976989746, "global_step": 88043, "epoch": 524} {"train_loss": -9.366795539855957, "global_step": 88044, "epoch": 524} {"train_loss": -9.461429595947266, "global_step": 88045, "epoch": 524} {"train_loss": -9.675138473510742, "global_step": 88046, "epoch": 524} {"train_loss": -9.474702835083008, "global_step": 88047, "epoch": 524} {"train_loss": -9.497313499450684, "global_step": 88048, "epoch": 524} {"train_loss": -9.411107063293457, "global_step": 88049, "epoch": 524} {"train_loss": -9.587859153747559, "global_step": 88050, "epoch": 524} {"train_loss": -9.40246295928955, "global_step": 88051, "epoch": 524} {"train_loss": -9.323099136352539, "global_step": 88052, "epoch": 524} {"train_loss": -9.532697677612305, "global_step": 88053, "epoch": 524} {"train_loss": -9.4290771484375, "global_step": 88054, "epoch": 524} {"train_loss": -9.541019439697266, "global_step": 88055, "epoch": 524} {"train_loss": -9.403453826904297, "global_step": 88056, "epoch": 524} {"train_loss": -9.4424409866333, "global_step": 88057, "epoch": 524} {"train_loss": -9.144124984741211, "global_step": 88058, "epoch": 524} {"train_loss": -9.329082489013672, "global_step": 88059, "epoch": 524} {"train_loss": -9.542484283447266, "global_step": 88060, "epoch": 524} {"train_loss": -9.517568588256836, "global_step": 88061, "epoch": 524} {"train_loss": -9.18519401550293, "global_step": 88062, "epoch": 524} {"train_loss": -9.373147010803223, "global_step": 88063, "epoch": 524} {"train_loss": -9.800901412963867, "global_step": 88064, "epoch": 524} {"train_loss": -9.290645599365234, "global_step": 88065, "epoch": 524} {"train_loss": -9.438867568969727, "global_step": 88066, "epoch": 524} {"train_loss": -9.129472732543945, "global_step": 88067, "epoch": 524} {"train_loss": -9.135030746459961, "global_step": 88068, "epoch": 524} {"train_loss": -9.411981582641602, "global_step": 88069, "epoch": 524} {"train_loss": -9.153387069702148, "global_step": 88070, "epoch": 524} {"train_loss": -9.378538131713867, "global_step": 88071, "epoch": 524} {"train_loss": -9.456708908081055, "global_step": 88072, "epoch": 524} {"train_loss": -8.914705276489258, "global_step": 88073, "epoch": 524} {"train_loss": -9.356714248657227, "global_step": 88074, "epoch": 524} {"train_loss": -9.415690422058105, "global_step": 88075, "epoch": 524} {"train_loss": -9.449679374694824, "global_step": 88076, "epoch": 524} {"train_loss": -9.388294219970703, "global_step": 88077, "epoch": 524} {"train_loss": -9.208019256591797, "global_step": 88078, "epoch": 524} {"train_loss": -9.41933536529541, "global_step": 88079, "epoch": 524} {"train_loss": -9.436057090759277, "global_step": 88080, "epoch": 524} {"train_loss": -9.346357345581055, "global_step": 88081, "epoch": 524} {"train_loss": -9.478899002075195, "global_step": 88082, "epoch": 524} {"train_loss": -9.246221542358398, "global_step": 88083, "epoch": 524} {"train_loss": -9.597192764282227, "global_step": 88084, "epoch": 524} {"train_loss": -9.49325180053711, "global_step": 88085, "epoch": 524} {"train_loss": -9.157999038696289, "global_step": 88086, "epoch": 524} {"train_loss": -9.348438262939453, "global_step": 88087, "epoch": 524} {"train_loss": -9.558853149414062, "global_step": 88088, "epoch": 524} {"train_loss": -9.55583381652832, "global_step": 88089, "epoch": 524} {"train_loss": -9.551910400390625, "global_step": 88090, "epoch": 524} {"train_loss": -8.950868606567383, "global_step": 88091, "epoch": 524} {"train_loss": -9.380033493041992, "global_step": 88092, "epoch": 524} {"train_loss": -8.788856506347656, "global_step": 88093, "epoch": 524} {"train_loss": -8.926248550415039, "global_step": 88094, "epoch": 524} {"train_loss": -9.012433052062988, "global_step": 88095, "epoch": 524} {"train_loss": -9.275843620300293, "global_step": 88096, "epoch": 524} {"train_loss": -9.082101821899414, "global_step": 88097, "epoch": 524} {"train_loss": -8.864646911621094, "global_step": 88098, "epoch": 524} {"train_loss": -8.800854682922363, "global_step": 88099, "epoch": 524} {"train_loss": -9.259187698364258, "global_step": 88100, "epoch": 524} {"train_loss": -9.185611724853516, "global_step": 88101, "epoch": 524} {"train_loss": -9.452278137207031, "global_step": 88102, "epoch": 524} {"train_loss": -9.361852645874023, "global_step": 88103, "epoch": 524} {"train_loss": -9.3811674118042, "global_step": 88104, "epoch": 524} {"train_loss": -9.274600982666016, "global_step": 88105, "epoch": 524} {"train_loss": -9.176149368286133, "global_step": 88106, "epoch": 524} {"train_loss": -9.222145080566406, "global_step": 88107, "epoch": 524} {"train_loss": -9.258811950683594, "global_step": 88108, "epoch": 524} {"train_loss": -9.385726928710938, "global_step": 88109, "epoch": 524} {"train_loss": -9.072244644165039, "global_step": 88110, "epoch": 524} {"train_loss": -9.524419784545898, "global_step": 88111, "epoch": 524} {"train_loss": -9.219148635864258, "global_step": 88112, "epoch": 524} {"train_loss": -9.402776718139648, "global_step": 88113, "epoch": 524} {"train_loss": -9.506402015686035, "global_step": 88114, "epoch": 524} {"train_loss": -9.222476959228516, "global_step": 88115, "epoch": 524} {"train_loss": -9.429255485534668, "global_step": 88116, "epoch": 524} {"train_loss": -9.550992965698242, "global_step": 88117, "epoch": 524} {"train_loss": -9.67733383178711, "global_step": 88118, "epoch": 524} {"train_loss": -9.593642234802246, "global_step": 88119, "epoch": 524} {"train_loss": -9.51080322265625, "global_step": 88120, "epoch": 524} {"train_loss": -9.610498428344727, "global_step": 88121, "epoch": 524} {"train_loss": -9.357687950134277, "global_step": 88122, "epoch": 524} {"train_loss": -9.296478271484375, "global_step": 88123, "epoch": 524} {"train_loss": -9.44498062133789, "global_step": 88124, "epoch": 524} {"train_loss": -9.840402603149414, "global_step": 88125, "epoch": 524} {"train_loss": -9.479448318481445, "global_step": 88126, "epoch": 524} {"train_loss": -9.478653907775879, "global_step": 88127, "epoch": 524} {"train_loss": -9.58765983581543, "global_step": 88128, "epoch": 524} {"train_loss": -9.494461059570312, "global_step": 88129, "epoch": 524} {"train_loss": -9.639896392822266, "global_step": 88130, "epoch": 524} {"train_loss": -9.572035789489746, "global_step": 88131, "epoch": 524} {"train_loss": -9.685144424438477, "global_step": 88132, "epoch": 524} {"train_loss": -9.513141632080078, "global_step": 88133, "epoch": 524} {"train_loss": -9.314105987548828, "global_step": 88134, "epoch": 524} {"train_loss": -9.511850357055664, "global_step": 88135, "epoch": 524} {"train_loss": -9.528839111328125, "global_step": 88136, "epoch": 524} {"train_loss": -9.354719161987305, "global_step": 88137, "epoch": 524} {"train_loss": -9.562198638916016, "global_step": 88138, "epoch": 524} {"train_loss": -9.523612976074219, "global_step": 88139, "epoch": 524} {"train_loss": -9.75436782836914, "global_step": 88140, "epoch": 524} {"train_loss": -9.592041969299316, "global_step": 88141, "epoch": 524} {"train_loss": -9.66708755493164, "global_step": 88142, "epoch": 524} {"train_loss": -9.25150203704834, "global_step": 88143, "epoch": 524} {"train_loss": -9.333669662475586, "global_step": 88144, "epoch": 524} {"train_loss": -9.637187004089355, "global_step": 88145, "epoch": 524} {"train_loss": -9.178030014038086, "global_step": 88146, "epoch": 524} {"train_loss": -9.581531524658203, "global_step": 88147, "epoch": 524} {"train_loss": -9.401073455810547, "global_step": 88148, "epoch": 524} {"train_loss": -9.666613578796387, "global_step": 88149, "epoch": 524} {"train_loss": -9.437305450439453, "global_step": 88150, "epoch": 524} {"train_loss": -9.400979995727539, "global_step": 88151, "epoch": 524} {"train_loss": -9.488161087036133, "global_step": 88152, "epoch": 524} {"train_loss": -9.299335479736328, "global_step": 88153, "epoch": 524} {"train_loss": -9.420045852661133, "global_step": 88154, "epoch": 524} {"train_loss": -9.559152603149414, "global_step": 88155, "epoch": 524} {"train_loss": -9.296087265014648, "global_step": 88156, "epoch": 524} {"train_loss": -9.536266326904297, "global_step": 88157, "epoch": 524} {"train_loss": -9.32738208770752, "global_step": 88158, "epoch": 524} {"train_loss": -9.152936935424805, "global_step": 88159, "epoch": 524} {"train_loss": -9.618204116821289, "global_step": 88160, "epoch": 524} {"train_loss": -9.478593826293945, "global_step": 88161, "epoch": 524} {"train_loss": -9.110563278198242, "global_step": 88162, "epoch": 524} {"train_loss": -9.588004112243652, "global_step": 88163, "epoch": 524} {"train_loss": -9.389419555664062, "global_step": 88164, "epoch": 524} {"train_loss": -9.154624938964844, "global_step": 88165, "epoch": 524} {"train_loss": -9.205873489379883, "global_step": 88166, "epoch": 524} {"train_loss": -9.013991355895996, "global_step": 88167, "epoch": 524} {"train_loss": -9.16178035736084, "global_step": 88168, "epoch": 524} {"train_loss": -8.863847732543945, "global_step": 88169, "epoch": 524} {"train_loss": -9.31479549407959, "global_step": 88170, "epoch": 524} {"train_loss": -9.389519691467285, "global_step": 88171, "epoch": 524} {"train_loss": -9.547379493713379, "global_step": 88172, "epoch": 524} {"train_loss": -9.10757064819336, "global_step": 88173, "epoch": 524} {"train_loss": -9.183262825012207, "global_step": 88174, "epoch": 524} {"train_loss": -9.266836166381836, "global_step": 88175, "epoch": 524} {"train_loss": -8.891196250915527, "global_step": 88176, "epoch": 524} {"train_loss": -9.31596565246582, "global_step": 88177, "epoch": 524} {"train_loss": -9.026877403259277, "global_step": 88178, "epoch": 524} {"train_loss": -9.473531723022461, "global_step": 88179, "epoch": 524} {"train_loss": -9.310604095458984, "global_step": 88180, "epoch": 524} {"train_loss": -9.281806945800781, "global_step": 88181, "epoch": 524} {"train_loss": -9.518804550170898, "global_step": 88182, "epoch": 524} {"train_loss": -9.548273086547852, "global_step": 88183, "epoch": 524} {"train_loss": -9.454825401306152, "global_step": 88184, "epoch": 524} {"train_loss": -9.397867202758789, "global_step": 88185, "epoch": 524} {"train_loss": -9.338130950927734, "global_step": 88186, "epoch": 524} {"train_loss": -9.629764556884766, "global_step": 88187, "epoch": 524} {"train_loss": -9.59521484375, "global_step": 88188, "epoch": 524} {"train_loss": -9.513711929321289, "global_step": 88189, "epoch": 524} {"train_loss": -9.183035850524902, "global_step": 88190, "epoch": 524} {"train_loss": -9.554546356201172, "global_step": 88191, "epoch": 524} {"train_loss": -9.654603958129883, "global_step": 88192, "epoch": 524} {"train_loss": -9.714032173156738, "global_step": 88193, "epoch": 524} {"train_loss": -9.537562370300293, "global_step": 88194, "epoch": 524} {"train_loss": -9.543569564819336, "global_step": 88195, "epoch": 524} {"train_loss": -9.56709098815918, "global_step": 88196, "epoch": 524} {"train_loss": -9.599534034729004, "global_step": 88197, "epoch": 524} {"train_loss": -9.131186485290527, "global_step": 88198, "epoch": 524} {"train_loss": -9.394873902911232, "global_step": 88199, "epoch": 524, "val_loss": 203197.921875} {"train_loss": -9.535928726196289, "global_step": 88200, "epoch": 525} {"train_loss": -9.351359367370605, "global_step": 88201, "epoch": 525} {"train_loss": -9.448259353637695, "global_step": 88202, "epoch": 525} {"train_loss": -9.564094543457031, "global_step": 88203, "epoch": 525} {"train_loss": -9.533546447753906, "global_step": 88204, "epoch": 525} {"train_loss": -9.440888404846191, "global_step": 88205, "epoch": 525} {"train_loss": -9.503381729125977, "global_step": 88206, "epoch": 525} {"train_loss": -9.439497947692871, "global_step": 88207, "epoch": 525} {"train_loss": -9.357738494873047, "global_step": 88208, "epoch": 525} {"train_loss": -9.468454360961914, "global_step": 88209, "epoch": 525} {"train_loss": -9.314908981323242, "global_step": 88210, "epoch": 525} {"train_loss": -9.335639953613281, "global_step": 88211, "epoch": 525} {"train_loss": -9.453733444213867, "global_step": 88212, "epoch": 525} {"train_loss": -9.482358932495117, "global_step": 88213, "epoch": 525} {"train_loss": -9.4427490234375, "global_step": 88214, "epoch": 525} {"train_loss": -9.722600936889648, "global_step": 88215, "epoch": 525} {"train_loss": -9.475732803344727, "global_step": 88216, "epoch": 525} {"train_loss": -9.578275680541992, "global_step": 88217, "epoch": 525} {"train_loss": -9.197565078735352, "global_step": 88218, "epoch": 525} {"train_loss": -9.040677070617676, "global_step": 88219, "epoch": 525} {"train_loss": -9.110452651977539, "global_step": 88220, "epoch": 525} {"train_loss": -9.116003036499023, "global_step": 88221, "epoch": 525} {"train_loss": -9.42807388305664, "global_step": 88222, "epoch": 525} {"train_loss": -9.071019172668457, "global_step": 88223, "epoch": 525} {"train_loss": -9.52351188659668, "global_step": 88224, "epoch": 525} {"train_loss": -9.380128860473633, "global_step": 88225, "epoch": 525} {"train_loss": -9.400959014892578, "global_step": 88226, "epoch": 525} {"train_loss": -9.435407638549805, "global_step": 88227, "epoch": 525} {"train_loss": -9.324708938598633, "global_step": 88228, "epoch": 525} {"train_loss": -9.299909591674805, "global_step": 88229, "epoch": 525} {"train_loss": -9.354110717773438, "global_step": 88230, "epoch": 525} {"train_loss": -9.19095230102539, "global_step": 88231, "epoch": 525} {"train_loss": -9.56203556060791, "global_step": 88232, "epoch": 525} {"train_loss": -9.416717529296875, "global_step": 88233, "epoch": 525} {"train_loss": -9.375513076782227, "global_step": 88234, "epoch": 525} {"train_loss": -9.375418663024902, "global_step": 88235, "epoch": 525} {"train_loss": -9.161741256713867, "global_step": 88236, "epoch": 525} {"train_loss": -9.193490028381348, "global_step": 88237, "epoch": 525} {"train_loss": -9.56962776184082, "global_step": 88238, "epoch": 525} {"train_loss": -8.958179473876953, "global_step": 88239, "epoch": 525} {"train_loss": -9.295754432678223, "global_step": 88240, "epoch": 525} {"train_loss": -9.186384201049805, "global_step": 88241, "epoch": 525} {"train_loss": -9.192776679992676, "global_step": 88242, "epoch": 525} {"train_loss": -9.09766960144043, "global_step": 88243, "epoch": 525} {"train_loss": -9.269026756286621, "global_step": 88244, "epoch": 525} {"train_loss": -9.545732498168945, "global_step": 88245, "epoch": 525} {"train_loss": -8.879352569580078, "global_step": 88246, "epoch": 525} {"train_loss": -9.4506254196167, "global_step": 88247, "epoch": 525} {"train_loss": -9.343379020690918, "global_step": 88248, "epoch": 525} {"train_loss": -9.26765251159668, "global_step": 88249, "epoch": 525} {"train_loss": -9.380109786987305, "global_step": 88250, "epoch": 525} {"train_loss": -9.40018081665039, "global_step": 88251, "epoch": 525} {"train_loss": -9.250019073486328, "global_step": 88252, "epoch": 525} {"train_loss": -9.405878067016602, "global_step": 88253, "epoch": 525} {"train_loss": -8.88302230834961, "global_step": 88254, "epoch": 525} {"train_loss": -9.517021179199219, "global_step": 88255, "epoch": 525} {"train_loss": -9.337383270263672, "global_step": 88256, "epoch": 525} {"train_loss": -9.51462173461914, "global_step": 88257, "epoch": 525} {"train_loss": -9.097440719604492, "global_step": 88258, "epoch": 525} {"train_loss": -9.281816482543945, "global_step": 88259, "epoch": 525} {"train_loss": -9.628681182861328, "global_step": 88260, "epoch": 525} {"train_loss": -9.488758087158203, "global_step": 88261, "epoch": 525} {"train_loss": -9.440464973449707, "global_step": 88262, "epoch": 525} {"train_loss": -9.537943840026855, "global_step": 88263, "epoch": 525} {"train_loss": -9.310234069824219, "global_step": 88264, "epoch": 525} {"train_loss": -9.53138542175293, "global_step": 88265, "epoch": 525} {"train_loss": -9.518312454223633, "global_step": 88266, "epoch": 525} {"train_loss": -9.278453826904297, "global_step": 88267, "epoch": 525} {"train_loss": -9.500269889831543, "global_step": 88268, "epoch": 525} {"train_loss": -9.393915176391602, "global_step": 88269, "epoch": 525} {"train_loss": -9.284926414489746, "global_step": 88270, "epoch": 525} {"train_loss": -9.693574905395508, "global_step": 88271, "epoch": 525} {"train_loss": -9.767630577087402, "global_step": 88272, "epoch": 525} {"train_loss": -9.456653594970703, "global_step": 88273, "epoch": 525} {"train_loss": -9.424247741699219, "global_step": 88274, "epoch": 525} {"train_loss": -9.389445304870605, "global_step": 88275, "epoch": 525} {"train_loss": -9.601594924926758, "global_step": 88276, "epoch": 525} {"train_loss": -9.190074920654297, "global_step": 88277, "epoch": 525} {"train_loss": -9.458148002624512, "global_step": 88278, "epoch": 525} {"train_loss": -9.466721534729004, "global_step": 88279, "epoch": 525} {"train_loss": -9.210315704345703, "global_step": 88280, "epoch": 525} {"train_loss": -9.459022521972656, "global_step": 88281, "epoch": 525} {"train_loss": -9.306058883666992, "global_step": 88282, "epoch": 525} {"train_loss": -9.452009201049805, "global_step": 88283, "epoch": 525} {"train_loss": -9.554666519165039, "global_step": 88284, "epoch": 525} {"train_loss": -9.40781307220459, "global_step": 88285, "epoch": 525} {"train_loss": -9.637903213500977, "global_step": 88286, "epoch": 525} {"train_loss": -9.532304763793945, "global_step": 88287, "epoch": 525} {"train_loss": -9.262123107910156, "global_step": 88288, "epoch": 525} {"train_loss": -9.430240631103516, "global_step": 88289, "epoch": 525} {"train_loss": -9.393423080444336, "global_step": 88290, "epoch": 525} {"train_loss": -9.460498809814453, "global_step": 88291, "epoch": 525} {"train_loss": -9.59707260131836, "global_step": 88292, "epoch": 525} {"train_loss": -9.246953964233398, "global_step": 88293, "epoch": 525} {"train_loss": -9.446943283081055, "global_step": 88294, "epoch": 525} {"train_loss": -9.331048965454102, "global_step": 88295, "epoch": 525} {"train_loss": -9.206409454345703, "global_step": 88296, "epoch": 525} {"train_loss": -9.327094078063965, "global_step": 88297, "epoch": 525} {"train_loss": -9.43521499633789, "global_step": 88298, "epoch": 525} {"train_loss": -9.386543273925781, "global_step": 88299, "epoch": 525} {"train_loss": -9.502779006958008, "global_step": 88300, "epoch": 525} {"train_loss": -9.259241104125977, "global_step": 88301, "epoch": 525} {"train_loss": -9.489182472229004, "global_step": 88302, "epoch": 525} {"train_loss": -9.273921966552734, "global_step": 88303, "epoch": 525} {"train_loss": -9.194587707519531, "global_step": 88304, "epoch": 525} {"train_loss": -9.383401870727539, "global_step": 88305, "epoch": 525} {"train_loss": -9.221319198608398, "global_step": 88306, "epoch": 525} {"train_loss": -9.484844207763672, "global_step": 88307, "epoch": 525} {"train_loss": -9.582317352294922, "global_step": 88308, "epoch": 525} {"train_loss": -9.263851165771484, "global_step": 88309, "epoch": 525} {"train_loss": -9.441922187805176, "global_step": 88310, "epoch": 525} {"train_loss": -9.643363952636719, "global_step": 88311, "epoch": 525} {"train_loss": -9.154600143432617, "global_step": 88312, "epoch": 525} {"train_loss": -9.218561172485352, "global_step": 88313, "epoch": 525} {"train_loss": -9.346220016479492, "global_step": 88314, "epoch": 525} {"train_loss": -9.613672256469727, "global_step": 88315, "epoch": 525} {"train_loss": -9.556392669677734, "global_step": 88316, "epoch": 525} {"train_loss": -9.356287956237793, "global_step": 88317, "epoch": 525} {"train_loss": -9.27245807647705, "global_step": 88318, "epoch": 525} {"train_loss": -9.241769790649414, "global_step": 88319, "epoch": 525} {"train_loss": -9.262063980102539, "global_step": 88320, "epoch": 525} {"train_loss": -9.325480461120605, "global_step": 88321, "epoch": 525} {"train_loss": -9.453550338745117, "global_step": 88322, "epoch": 525} {"train_loss": -9.438790321350098, "global_step": 88323, "epoch": 525} {"train_loss": -9.410469055175781, "global_step": 88324, "epoch": 525} {"train_loss": -9.491683959960938, "global_step": 88325, "epoch": 525} {"train_loss": -9.754384994506836, "global_step": 88326, "epoch": 525} {"train_loss": -9.231607437133789, "global_step": 88327, "epoch": 525} {"train_loss": -9.462182998657227, "global_step": 88328, "epoch": 525} {"train_loss": -9.47993278503418, "global_step": 88329, "epoch": 525} {"train_loss": -9.633987426757812, "global_step": 88330, "epoch": 525} {"train_loss": -9.527976989746094, "global_step": 88331, "epoch": 525} {"train_loss": -9.60831356048584, "global_step": 88332, "epoch": 525} {"train_loss": -9.267135620117188, "global_step": 88333, "epoch": 525} {"train_loss": -9.358110427856445, "global_step": 88334, "epoch": 525} {"train_loss": -9.73917293548584, "global_step": 88335, "epoch": 525} {"train_loss": -9.429849624633789, "global_step": 88336, "epoch": 525} {"train_loss": -9.417672157287598, "global_step": 88337, "epoch": 525} {"train_loss": -9.473451614379883, "global_step": 88338, "epoch": 525} {"train_loss": -9.561269760131836, "global_step": 88339, "epoch": 525} {"train_loss": -9.450299263000488, "global_step": 88340, "epoch": 525} {"train_loss": -9.378658294677734, "global_step": 88341, "epoch": 525} {"train_loss": -9.200943946838379, "global_step": 88342, "epoch": 525} {"train_loss": -9.471882820129395, "global_step": 88343, "epoch": 525} {"train_loss": -9.149459838867188, "global_step": 88344, "epoch": 525} {"train_loss": -9.449987411499023, "global_step": 88345, "epoch": 525} {"train_loss": -9.319665908813477, "global_step": 88346, "epoch": 525} {"train_loss": -9.402219772338867, "global_step": 88347, "epoch": 525} {"train_loss": -9.645103454589844, "global_step": 88348, "epoch": 525} {"train_loss": -9.608052253723145, "global_step": 88349, "epoch": 525} {"train_loss": -9.496383666992188, "global_step": 88350, "epoch": 525} {"train_loss": -9.455028533935547, "global_step": 88351, "epoch": 525} {"train_loss": -9.72680377960205, "global_step": 88352, "epoch": 525} {"train_loss": -9.2899751663208, "global_step": 88353, "epoch": 525} {"train_loss": -9.690805435180664, "global_step": 88354, "epoch": 525} {"train_loss": -9.440464973449707, "global_step": 88355, "epoch": 525} {"train_loss": -9.416170120239258, "global_step": 88356, "epoch": 525} {"train_loss": -9.69584846496582, "global_step": 88357, "epoch": 525} {"train_loss": -9.177428245544434, "global_step": 88358, "epoch": 525} {"train_loss": -9.586532592773438, "global_step": 88359, "epoch": 525} {"train_loss": -9.196876525878906, "global_step": 88360, "epoch": 525} {"train_loss": -9.15355110168457, "global_step": 88361, "epoch": 525} {"train_loss": -9.269303321838379, "global_step": 88362, "epoch": 525} {"train_loss": -9.386682510375977, "global_step": 88363, "epoch": 525} {"train_loss": -9.380653381347656, "global_step": 88364, "epoch": 525} {"train_loss": -9.364312171936035, "global_step": 88365, "epoch": 525} {"train_loss": -9.410293579101562, "global_step": 88366, "epoch": 525} {"train_loss": -9.395376829873948, "global_step": 88367, "epoch": 525, "val_loss": 200872.90625, "train_action_mse_error": 1.560846209526062} {"train_loss": -8.80237102508545, "global_step": 88368, "epoch": 526} {"train_loss": -9.426078796386719, "global_step": 88369, "epoch": 526} {"train_loss": -9.06326675415039, "global_step": 88370, "epoch": 526} {"train_loss": -9.643884658813477, "global_step": 88371, "epoch": 526} {"train_loss": -9.059673309326172, "global_step": 88372, "epoch": 526} {"train_loss": -9.43779182434082, "global_step": 88373, "epoch": 526} {"train_loss": -9.230311393737793, "global_step": 88374, "epoch": 526} {"train_loss": -9.119620323181152, "global_step": 88375, "epoch": 526} {"train_loss": -9.090795516967773, "global_step": 88376, "epoch": 526} {"train_loss": -9.281661987304688, "global_step": 88377, "epoch": 526} {"train_loss": -9.14517879486084, "global_step": 88378, "epoch": 526} {"train_loss": -9.212499618530273, "global_step": 88379, "epoch": 526} {"train_loss": -9.016647338867188, "global_step": 88380, "epoch": 526} {"train_loss": -9.516326904296875, "global_step": 88381, "epoch": 526} {"train_loss": -9.348442077636719, "global_step": 88382, "epoch": 526} {"train_loss": -9.35279655456543, "global_step": 88383, "epoch": 526} {"train_loss": -9.458179473876953, "global_step": 88384, "epoch": 526} {"train_loss": -9.335456848144531, "global_step": 88385, "epoch": 526} {"train_loss": -9.378671646118164, "global_step": 88386, "epoch": 526} {"train_loss": -9.228256225585938, "global_step": 88387, "epoch": 526} {"train_loss": -9.35278034210205, "global_step": 88388, "epoch": 526} {"train_loss": -9.487709045410156, "global_step": 88389, "epoch": 526} {"train_loss": -9.35824966430664, "global_step": 88390, "epoch": 526} {"train_loss": -9.397127151489258, "global_step": 88391, "epoch": 526} {"train_loss": -9.303003311157227, "global_step": 88392, "epoch": 526} {"train_loss": -9.314228057861328, "global_step": 88393, "epoch": 526} {"train_loss": -9.456304550170898, "global_step": 88394, "epoch": 526} {"train_loss": -9.42361068725586, "global_step": 88395, "epoch": 526} {"train_loss": -9.55341911315918, "global_step": 88396, "epoch": 526} {"train_loss": -9.601494789123535, "global_step": 88397, "epoch": 526} {"train_loss": -9.387693405151367, "global_step": 88398, "epoch": 526} {"train_loss": -9.620952606201172, "global_step": 88399, "epoch": 526} {"train_loss": -9.409849166870117, "global_step": 88400, "epoch": 526} {"train_loss": -9.502182006835938, "global_step": 88401, "epoch": 526} {"train_loss": -9.55129623413086, "global_step": 88402, "epoch": 526} {"train_loss": -9.193711280822754, "global_step": 88403, "epoch": 526} {"train_loss": -9.538246154785156, "global_step": 88404, "epoch": 526} {"train_loss": -9.414628982543945, "global_step": 88405, "epoch": 526} {"train_loss": -9.519972801208496, "global_step": 88406, "epoch": 526} {"train_loss": -9.146326065063477, "global_step": 88407, "epoch": 526} {"train_loss": -9.409852981567383, "global_step": 88408, "epoch": 526} {"train_loss": -9.494114875793457, "global_step": 88409, "epoch": 526} {"train_loss": -9.518085479736328, "global_step": 88410, "epoch": 526} {"train_loss": -9.311423301696777, "global_step": 88411, "epoch": 526} {"train_loss": -9.162152290344238, "global_step": 88412, "epoch": 526} {"train_loss": -9.57217788696289, "global_step": 88413, "epoch": 526} {"train_loss": -9.295631408691406, "global_step": 88414, "epoch": 526} {"train_loss": -9.047696113586426, "global_step": 88415, "epoch": 526} {"train_loss": -9.376994132995605, "global_step": 88416, "epoch": 526} {"train_loss": -9.265705108642578, "global_step": 88417, "epoch": 526} {"train_loss": -9.210598945617676, "global_step": 88418, "epoch": 526} {"train_loss": -9.244840621948242, "global_step": 88419, "epoch": 526} {"train_loss": -9.62890625, "global_step": 88420, "epoch": 526} {"train_loss": -9.398092269897461, "global_step": 88421, "epoch": 526} {"train_loss": -9.41252613067627, "global_step": 88422, "epoch": 526} {"train_loss": -9.220109939575195, "global_step": 88423, "epoch": 526} {"train_loss": -9.337384223937988, "global_step": 88424, "epoch": 526} {"train_loss": -9.208379745483398, "global_step": 88425, "epoch": 526} {"train_loss": -9.4981050491333, "global_step": 88426, "epoch": 526} {"train_loss": -9.489978790283203, "global_step": 88427, "epoch": 526} {"train_loss": -9.488421440124512, "global_step": 88428, "epoch": 526} {"train_loss": -9.467851638793945, "global_step": 88429, "epoch": 526} {"train_loss": -9.38288688659668, "global_step": 88430, "epoch": 526} {"train_loss": -9.446653366088867, "global_step": 88431, "epoch": 526} {"train_loss": -9.521517753601074, "global_step": 88432, "epoch": 526} {"train_loss": -9.343815803527832, "global_step": 88433, "epoch": 526} {"train_loss": -9.583206176757812, "global_step": 88434, "epoch": 526} {"train_loss": -9.528238296508789, "global_step": 88435, "epoch": 526} {"train_loss": -9.37869644165039, "global_step": 88436, "epoch": 526} {"train_loss": -9.475478172302246, "global_step": 88437, "epoch": 526} {"train_loss": -9.505698204040527, "global_step": 88438, "epoch": 526} {"train_loss": -9.54530143737793, "global_step": 88439, "epoch": 526} {"train_loss": -9.541772842407227, "global_step": 88440, "epoch": 526} {"train_loss": -9.356348037719727, "global_step": 88441, "epoch": 526} {"train_loss": -9.554686546325684, "global_step": 88442, "epoch": 526} {"train_loss": -9.698577880859375, "global_step": 88443, "epoch": 526} {"train_loss": -9.6648588180542, "global_step": 88444, "epoch": 526} {"train_loss": -9.46265983581543, "global_step": 88445, "epoch": 526} {"train_loss": -9.642227172851562, "global_step": 88446, "epoch": 526} {"train_loss": -9.57345962524414, "global_step": 88447, "epoch": 526} {"train_loss": -9.133014678955078, "global_step": 88448, "epoch": 526} {"train_loss": -9.22514533996582, "global_step": 88449, "epoch": 526} {"train_loss": -9.369379997253418, "global_step": 88450, "epoch": 526} {"train_loss": -9.269574165344238, "global_step": 88451, "epoch": 526} {"train_loss": -9.200569152832031, "global_step": 88452, "epoch": 526} {"train_loss": -9.406112670898438, "global_step": 88453, "epoch": 526} {"train_loss": -9.321568489074707, "global_step": 88454, "epoch": 526} {"train_loss": -9.35409164428711, "global_step": 88455, "epoch": 526} {"train_loss": -9.607683181762695, "global_step": 88456, "epoch": 526} {"train_loss": -9.160280227661133, "global_step": 88457, "epoch": 526} {"train_loss": -9.854814529418945, "global_step": 88458, "epoch": 526} {"train_loss": -9.434856414794922, "global_step": 88459, "epoch": 526} {"train_loss": -9.338627815246582, "global_step": 88460, "epoch": 526} {"train_loss": -9.200216293334961, "global_step": 88461, "epoch": 526} {"train_loss": -9.615880012512207, "global_step": 88462, "epoch": 526} {"train_loss": -9.358970642089844, "global_step": 88463, "epoch": 526} {"train_loss": -9.299407005310059, "global_step": 88464, "epoch": 526} {"train_loss": -9.140100479125977, "global_step": 88465, "epoch": 526} {"train_loss": -9.18391227722168, "global_step": 88466, "epoch": 526} {"train_loss": -9.302326202392578, "global_step": 88467, "epoch": 526} {"train_loss": -9.150933265686035, "global_step": 88468, "epoch": 526} {"train_loss": -9.200742721557617, "global_step": 88469, "epoch": 526} {"train_loss": -9.328885078430176, "global_step": 88470, "epoch": 526} {"train_loss": -9.414539337158203, "global_step": 88471, "epoch": 526} {"train_loss": -9.500993728637695, "global_step": 88472, "epoch": 526} {"train_loss": -9.572196960449219, "global_step": 88473, "epoch": 526} {"train_loss": -9.34018325805664, "global_step": 88474, "epoch": 526} {"train_loss": -9.283257484436035, "global_step": 88475, "epoch": 526} {"train_loss": -9.605953216552734, "global_step": 88476, "epoch": 526} {"train_loss": -9.585248947143555, "global_step": 88477, "epoch": 526} {"train_loss": -9.566217422485352, "global_step": 88478, "epoch": 526} {"train_loss": -9.439787864685059, "global_step": 88479, "epoch": 526} {"train_loss": -9.487693786621094, "global_step": 88480, "epoch": 526} {"train_loss": -9.470970153808594, "global_step": 88481, "epoch": 526} {"train_loss": -9.27090835571289, "global_step": 88482, "epoch": 526} {"train_loss": -9.511192321777344, "global_step": 88483, "epoch": 526} {"train_loss": -9.547319412231445, "global_step": 88484, "epoch": 526} {"train_loss": -9.24588394165039, "global_step": 88485, "epoch": 526} {"train_loss": -9.603033065795898, "global_step": 88486, "epoch": 526} {"train_loss": -9.391989707946777, "global_step": 88487, "epoch": 526} {"train_loss": -9.624214172363281, "global_step": 88488, "epoch": 526} {"train_loss": -9.29557991027832, "global_step": 88489, "epoch": 526} {"train_loss": -9.491961479187012, "global_step": 88490, "epoch": 526} {"train_loss": -9.305803298950195, "global_step": 88491, "epoch": 526} {"train_loss": -9.505722999572754, "global_step": 88492, "epoch": 526} {"train_loss": -9.109397888183594, "global_step": 88493, "epoch": 526} {"train_loss": -9.464288711547852, "global_step": 88494, "epoch": 526} {"train_loss": -9.536168098449707, "global_step": 88495, "epoch": 526} {"train_loss": -9.379009246826172, "global_step": 88496, "epoch": 526} {"train_loss": -9.442381858825684, "global_step": 88497, "epoch": 526} {"train_loss": -9.39052963256836, "global_step": 88498, "epoch": 526} {"train_loss": -9.549470901489258, "global_step": 88499, "epoch": 526} {"train_loss": -9.374086380004883, "global_step": 88500, "epoch": 526} {"train_loss": -9.285950660705566, "global_step": 88501, "epoch": 526} {"train_loss": -9.341104507446289, "global_step": 88502, "epoch": 526} {"train_loss": -9.226364135742188, "global_step": 88503, "epoch": 526} {"train_loss": -9.437068939208984, "global_step": 88504, "epoch": 526} {"train_loss": -9.288362503051758, "global_step": 88505, "epoch": 526} {"train_loss": -9.483327865600586, "global_step": 88506, "epoch": 526} {"train_loss": -9.351543426513672, "global_step": 88507, "epoch": 526} {"train_loss": -9.345267295837402, "global_step": 88508, "epoch": 526} {"train_loss": -8.908869743347168, "global_step": 88509, "epoch": 526} {"train_loss": -9.39716911315918, "global_step": 88510, "epoch": 526} {"train_loss": -9.233102798461914, "global_step": 88511, "epoch": 526} {"train_loss": -9.218639373779297, "global_step": 88512, "epoch": 526} {"train_loss": -9.12270736694336, "global_step": 88513, "epoch": 526} {"train_loss": -9.507914543151855, "global_step": 88514, "epoch": 526} {"train_loss": -9.224077224731445, "global_step": 88515, "epoch": 526} {"train_loss": -9.474857330322266, "global_step": 88516, "epoch": 526} {"train_loss": -9.054916381835938, "global_step": 88517, "epoch": 526} {"train_loss": -9.156193733215332, "global_step": 88518, "epoch": 526} {"train_loss": -9.335561752319336, "global_step": 88519, "epoch": 526} {"train_loss": -9.472779273986816, "global_step": 88520, "epoch": 526} {"train_loss": -9.15298843383789, "global_step": 88521, "epoch": 526} {"train_loss": -9.539125442504883, "global_step": 88522, "epoch": 526} {"train_loss": -9.31918716430664, "global_step": 88523, "epoch": 526} {"train_loss": -9.5467529296875, "global_step": 88524, "epoch": 526} {"train_loss": -9.265753746032715, "global_step": 88525, "epoch": 526} {"train_loss": -9.3375825881958, "global_step": 88526, "epoch": 526} {"train_loss": -9.296674728393555, "global_step": 88527, "epoch": 526} {"train_loss": -9.211524963378906, "global_step": 88528, "epoch": 526} {"train_loss": -9.543150901794434, "global_step": 88529, "epoch": 526} {"train_loss": -9.396121978759766, "global_step": 88530, "epoch": 526} {"train_loss": -9.413078308105469, "global_step": 88531, "epoch": 526} {"train_loss": -9.320894241333008, "global_step": 88532, "epoch": 526} {"train_loss": -9.333810806274414, "global_step": 88533, "epoch": 526} {"train_loss": -9.447450637817383, "global_step": 88534, "epoch": 526} {"train_loss": -9.375934754099164, "global_step": 88535, "epoch": 526, "val_loss": 202743.65625} {"train_loss": -8.958707809448242, "global_step": 88536, "epoch": 527} {"train_loss": -9.47772216796875, "global_step": 88537, "epoch": 527} {"train_loss": -8.849348068237305, "global_step": 88538, "epoch": 527} {"train_loss": -9.383617401123047, "global_step": 88539, "epoch": 527} {"train_loss": -9.102302551269531, "global_step": 88540, "epoch": 527} {"train_loss": -8.827260971069336, "global_step": 88541, "epoch": 527} {"train_loss": -9.227996826171875, "global_step": 88542, "epoch": 527} {"train_loss": -9.2423095703125, "global_step": 88543, "epoch": 527} {"train_loss": -9.45216178894043, "global_step": 88544, "epoch": 527} {"train_loss": -9.302035331726074, "global_step": 88545, "epoch": 527} {"train_loss": -9.514654159545898, "global_step": 88546, "epoch": 527} {"train_loss": -9.21356201171875, "global_step": 88547, "epoch": 527} {"train_loss": -9.227094650268555, "global_step": 88548, "epoch": 527} {"train_loss": -9.207967758178711, "global_step": 88549, "epoch": 527} {"train_loss": -9.261168479919434, "global_step": 88550, "epoch": 527} {"train_loss": -9.005578994750977, "global_step": 88551, "epoch": 527} {"train_loss": -9.27813720703125, "global_step": 88552, "epoch": 527} {"train_loss": -9.156387329101562, "global_step": 88553, "epoch": 527} {"train_loss": -9.485140800476074, "global_step": 88554, "epoch": 527} {"train_loss": -9.120254516601562, "global_step": 88555, "epoch": 527} {"train_loss": -9.451863288879395, "global_step": 88556, "epoch": 527} {"train_loss": -9.384255409240723, "global_step": 88557, "epoch": 527} {"train_loss": -9.289512634277344, "global_step": 88558, "epoch": 527} {"train_loss": -9.412718772888184, "global_step": 88559, "epoch": 527} {"train_loss": -9.25277328491211, "global_step": 88560, "epoch": 527} {"train_loss": -9.520662307739258, "global_step": 88561, "epoch": 527} {"train_loss": -9.173471450805664, "global_step": 88562, "epoch": 527} {"train_loss": -9.287900924682617, "global_step": 88563, "epoch": 527} {"train_loss": -9.141056060791016, "global_step": 88564, "epoch": 527} {"train_loss": -9.297150611877441, "global_step": 88565, "epoch": 527} {"train_loss": -9.40672492980957, "global_step": 88566, "epoch": 527} {"train_loss": -9.21408748626709, "global_step": 88567, "epoch": 527} {"train_loss": -9.295352935791016, "global_step": 88568, "epoch": 527} {"train_loss": -9.257108688354492, "global_step": 88569, "epoch": 527} {"train_loss": -9.557523727416992, "global_step": 88570, "epoch": 527} {"train_loss": -9.452764511108398, "global_step": 88571, "epoch": 527} {"train_loss": -9.32193660736084, "global_step": 88572, "epoch": 527} {"train_loss": -9.30246353149414, "global_step": 88573, "epoch": 527} {"train_loss": -9.444296836853027, "global_step": 88574, "epoch": 527} {"train_loss": -9.326932907104492, "global_step": 88575, "epoch": 527} {"train_loss": -9.139004707336426, "global_step": 88576, "epoch": 527} {"train_loss": -9.51567268371582, "global_step": 88577, "epoch": 527} {"train_loss": -9.404390335083008, "global_step": 88578, "epoch": 527} {"train_loss": -9.549388885498047, "global_step": 88579, "epoch": 527} {"train_loss": -9.498272895812988, "global_step": 88580, "epoch": 527} {"train_loss": -9.47579574584961, "global_step": 88581, "epoch": 527} {"train_loss": -9.206750869750977, "global_step": 88582, "epoch": 527} {"train_loss": -9.25411605834961, "global_step": 88583, "epoch": 527} {"train_loss": -9.425609588623047, "global_step": 88584, "epoch": 527} {"train_loss": -9.527416229248047, "global_step": 88585, "epoch": 527} {"train_loss": -8.907814025878906, "global_step": 88586, "epoch": 527} {"train_loss": -9.403812408447266, "global_step": 88587, "epoch": 527} {"train_loss": -9.12049674987793, "global_step": 88588, "epoch": 527} {"train_loss": -9.173208236694336, "global_step": 88589, "epoch": 527} {"train_loss": -9.029345512390137, "global_step": 88590, "epoch": 527} {"train_loss": -9.319976806640625, "global_step": 88591, "epoch": 527} {"train_loss": -9.010574340820312, "global_step": 88592, "epoch": 527} {"train_loss": -9.376730918884277, "global_step": 88593, "epoch": 527} {"train_loss": -9.150068283081055, "global_step": 88594, "epoch": 527} {"train_loss": -9.243754386901855, "global_step": 88595, "epoch": 527} {"train_loss": -9.160019874572754, "global_step": 88596, "epoch": 527} {"train_loss": -9.429634094238281, "global_step": 88597, "epoch": 527} {"train_loss": -9.385940551757812, "global_step": 88598, "epoch": 527} {"train_loss": -9.54583740234375, "global_step": 88599, "epoch": 527} {"train_loss": -9.305187225341797, "global_step": 88600, "epoch": 527} {"train_loss": -9.285614967346191, "global_step": 88601, "epoch": 527} {"train_loss": -9.31332778930664, "global_step": 88602, "epoch": 527} {"train_loss": -9.67220687866211, "global_step": 88603, "epoch": 527} {"train_loss": -9.331398010253906, "global_step": 88604, "epoch": 527} {"train_loss": -9.343866348266602, "global_step": 88605, "epoch": 527} {"train_loss": -9.481404304504395, "global_step": 88606, "epoch": 527} {"train_loss": -9.366697311401367, "global_step": 88607, "epoch": 527} {"train_loss": -9.5000581741333, "global_step": 88608, "epoch": 527} {"train_loss": -9.494377136230469, "global_step": 88609, "epoch": 527} {"train_loss": -9.449195861816406, "global_step": 88610, "epoch": 527} {"train_loss": -9.604888916015625, "global_step": 88611, "epoch": 527} {"train_loss": -9.502470970153809, "global_step": 88612, "epoch": 527} {"train_loss": -9.431053161621094, "global_step": 88613, "epoch": 527} {"train_loss": -9.736143112182617, "global_step": 88614, "epoch": 527} {"train_loss": -9.436366081237793, "global_step": 88615, "epoch": 527} {"train_loss": -9.496267318725586, "global_step": 88616, "epoch": 527} {"train_loss": -9.420379638671875, "global_step": 88617, "epoch": 527} {"train_loss": -9.453190803527832, "global_step": 88618, "epoch": 527} {"train_loss": -9.477100372314453, "global_step": 88619, "epoch": 527} {"train_loss": -9.50729751586914, "global_step": 88620, "epoch": 527} {"train_loss": -9.383638381958008, "global_step": 88621, "epoch": 527} {"train_loss": -9.187190055847168, "global_step": 88622, "epoch": 527} {"train_loss": -9.512382507324219, "global_step": 88623, "epoch": 527} {"train_loss": -9.467324256896973, "global_step": 88624, "epoch": 527} {"train_loss": -9.362218856811523, "global_step": 88625, "epoch": 527} {"train_loss": -9.632159233093262, "global_step": 88626, "epoch": 527} {"train_loss": -9.376241683959961, "global_step": 88627, "epoch": 527} {"train_loss": -9.460214614868164, "global_step": 88628, "epoch": 527} {"train_loss": -9.646280288696289, "global_step": 88629, "epoch": 527} {"train_loss": -9.594279289245605, "global_step": 88630, "epoch": 527} {"train_loss": -9.609437942504883, "global_step": 88631, "epoch": 527} {"train_loss": -9.387253761291504, "global_step": 88632, "epoch": 527} {"train_loss": -9.573299407958984, "global_step": 88633, "epoch": 527} {"train_loss": -9.140012741088867, "global_step": 88634, "epoch": 527} {"train_loss": -8.937295913696289, "global_step": 88635, "epoch": 527} {"train_loss": -8.833475112915039, "global_step": 88636, "epoch": 527} {"train_loss": -8.774490356445312, "global_step": 88637, "epoch": 527} {"train_loss": -8.196590423583984, "global_step": 88638, "epoch": 527} {"train_loss": -8.854961395263672, "global_step": 88639, "epoch": 527} {"train_loss": -8.482672691345215, "global_step": 88640, "epoch": 527} {"train_loss": -9.070194244384766, "global_step": 88641, "epoch": 527} {"train_loss": -8.587160110473633, "global_step": 88642, "epoch": 527} {"train_loss": -8.601393699645996, "global_step": 88643, "epoch": 527} {"train_loss": -8.687370300292969, "global_step": 88644, "epoch": 527} {"train_loss": -8.726749420166016, "global_step": 88645, "epoch": 527} {"train_loss": -8.823691368103027, "global_step": 88646, "epoch": 527} {"train_loss": -8.916312217712402, "global_step": 88647, "epoch": 527} {"train_loss": -9.10223388671875, "global_step": 88648, "epoch": 527} {"train_loss": -8.951955795288086, "global_step": 88649, "epoch": 527} {"train_loss": -9.05234146118164, "global_step": 88650, "epoch": 527} {"train_loss": -9.053915023803711, "global_step": 88651, "epoch": 527} {"train_loss": -9.264225006103516, "global_step": 88652, "epoch": 527} {"train_loss": -9.086164474487305, "global_step": 88653, "epoch": 527} {"train_loss": -9.068365097045898, "global_step": 88654, "epoch": 527} {"train_loss": -9.200618743896484, "global_step": 88655, "epoch": 527} {"train_loss": -9.251441955566406, "global_step": 88656, "epoch": 527} {"train_loss": -9.208019256591797, "global_step": 88657, "epoch": 527} {"train_loss": -9.126718521118164, "global_step": 88658, "epoch": 527} {"train_loss": -9.161495208740234, "global_step": 88659, "epoch": 527} {"train_loss": -9.462108612060547, "global_step": 88660, "epoch": 527} {"train_loss": -9.083562850952148, "global_step": 88661, "epoch": 527} {"train_loss": -9.195212364196777, "global_step": 88662, "epoch": 527} {"train_loss": -9.427519798278809, "global_step": 88663, "epoch": 527} {"train_loss": -9.336902618408203, "global_step": 88664, "epoch": 527} {"train_loss": -9.53478717803955, "global_step": 88665, "epoch": 527} {"train_loss": -9.211602210998535, "global_step": 88666, "epoch": 527} {"train_loss": -9.171128273010254, "global_step": 88667, "epoch": 527} {"train_loss": -9.437843322753906, "global_step": 88668, "epoch": 527} {"train_loss": -9.447213172912598, "global_step": 88669, "epoch": 527} {"train_loss": -9.361350059509277, "global_step": 88670, "epoch": 527} {"train_loss": -9.394964218139648, "global_step": 88671, "epoch": 527} {"train_loss": -9.323921203613281, "global_step": 88672, "epoch": 527} {"train_loss": -9.445243835449219, "global_step": 88673, "epoch": 527} {"train_loss": -9.467647552490234, "global_step": 88674, "epoch": 527} {"train_loss": -9.411333084106445, "global_step": 88675, "epoch": 527} {"train_loss": -9.509319305419922, "global_step": 88676, "epoch": 527} {"train_loss": -9.716541290283203, "global_step": 88677, "epoch": 527} {"train_loss": -9.37054443359375, "global_step": 88678, "epoch": 527} {"train_loss": -9.438993453979492, "global_step": 88679, "epoch": 527} {"train_loss": -9.557802200317383, "global_step": 88680, "epoch": 527} {"train_loss": -9.464035034179688, "global_step": 88681, "epoch": 527} {"train_loss": -9.190641403198242, "global_step": 88682, "epoch": 527} {"train_loss": -9.557734489440918, "global_step": 88683, "epoch": 527} {"train_loss": -9.464942932128906, "global_step": 88684, "epoch": 527} {"train_loss": -9.434602737426758, "global_step": 88685, "epoch": 527} {"train_loss": -9.801942825317383, "global_step": 88686, "epoch": 527} {"train_loss": -9.156795501708984, "global_step": 88687, "epoch": 527} {"train_loss": -9.537272453308105, "global_step": 88688, "epoch": 527} {"train_loss": -9.496723175048828, "global_step": 88689, "epoch": 527} {"train_loss": -9.44196891784668, "global_step": 88690, "epoch": 527} {"train_loss": -9.132436752319336, "global_step": 88691, "epoch": 527} {"train_loss": -9.42000961303711, "global_step": 88692, "epoch": 527} {"train_loss": -9.141926765441895, "global_step": 88693, "epoch": 527} {"train_loss": -9.659393310546875, "global_step": 88694, "epoch": 527} {"train_loss": -9.541109085083008, "global_step": 88695, "epoch": 527} {"train_loss": -9.59874153137207, "global_step": 88696, "epoch": 527} {"train_loss": -9.394176483154297, "global_step": 88697, "epoch": 527} {"train_loss": -9.588395118713379, "global_step": 88698, "epoch": 527} {"train_loss": -9.410496711730957, "global_step": 88699, "epoch": 527} {"train_loss": -9.726096153259277, "global_step": 88700, "epoch": 527} {"train_loss": -9.60698127746582, "global_step": 88701, "epoch": 527} {"train_loss": -9.330934524536133, "global_step": 88702, "epoch": 527} {"train_loss": -9.303710273333959, "global_step": 88703, "epoch": 527, "val_loss": 201936.65625} {"train_loss": -9.538352966308594, "global_step": 88704, "epoch": 528} {"train_loss": -9.612971305847168, "global_step": 88705, "epoch": 528} {"train_loss": -9.737726211547852, "global_step": 88706, "epoch": 528} {"train_loss": -9.394247055053711, "global_step": 88707, "epoch": 528} {"train_loss": -9.682210922241211, "global_step": 88708, "epoch": 528} {"train_loss": -9.418891906738281, "global_step": 88709, "epoch": 528} {"train_loss": -9.574882507324219, "global_step": 88710, "epoch": 528} {"train_loss": -9.442697525024414, "global_step": 88711, "epoch": 528} {"train_loss": -9.454565048217773, "global_step": 88712, "epoch": 528} {"train_loss": -9.45482349395752, "global_step": 88713, "epoch": 528} {"train_loss": -9.203243255615234, "global_step": 88714, "epoch": 528} {"train_loss": -9.573741912841797, "global_step": 88715, "epoch": 528} {"train_loss": -9.243874549865723, "global_step": 88716, "epoch": 528} {"train_loss": -9.342182159423828, "global_step": 88717, "epoch": 528} {"train_loss": -9.4228515625, "global_step": 88718, "epoch": 528} {"train_loss": -9.4296875, "global_step": 88719, "epoch": 528} {"train_loss": -9.154958724975586, "global_step": 88720, "epoch": 528} {"train_loss": -9.618682861328125, "global_step": 88721, "epoch": 528} {"train_loss": -9.331670761108398, "global_step": 88722, "epoch": 528} {"train_loss": -9.397439956665039, "global_step": 88723, "epoch": 528} {"train_loss": -9.206918716430664, "global_step": 88724, "epoch": 528} {"train_loss": -9.395787239074707, "global_step": 88725, "epoch": 528} {"train_loss": -9.560127258300781, "global_step": 88726, "epoch": 528} {"train_loss": -9.43353271484375, "global_step": 88727, "epoch": 528} {"train_loss": -9.17076301574707, "global_step": 88728, "epoch": 528} {"train_loss": -9.572991371154785, "global_step": 88729, "epoch": 528} {"train_loss": -9.220754623413086, "global_step": 88730, "epoch": 528} {"train_loss": -9.24624252319336, "global_step": 88731, "epoch": 528} {"train_loss": -9.256217956542969, "global_step": 88732, "epoch": 528} {"train_loss": -9.037968635559082, "global_step": 88733, "epoch": 528} {"train_loss": -9.488677978515625, "global_step": 88734, "epoch": 528} {"train_loss": -9.336981773376465, "global_step": 88735, "epoch": 528} {"train_loss": -9.504812240600586, "global_step": 88736, "epoch": 528} {"train_loss": -9.295713424682617, "global_step": 88737, "epoch": 528} {"train_loss": -9.35342788696289, "global_step": 88738, "epoch": 528} {"train_loss": -9.40189266204834, "global_step": 88739, "epoch": 528} {"train_loss": -9.066970825195312, "global_step": 88740, "epoch": 528} {"train_loss": -9.496213912963867, "global_step": 88741, "epoch": 528} {"train_loss": -9.389896392822266, "global_step": 88742, "epoch": 528} {"train_loss": -9.393120765686035, "global_step": 88743, "epoch": 528} {"train_loss": -9.293472290039062, "global_step": 88744, "epoch": 528} {"train_loss": -9.244894981384277, "global_step": 88745, "epoch": 528} {"train_loss": -9.31148624420166, "global_step": 88746, "epoch": 528} {"train_loss": -9.211910247802734, "global_step": 88747, "epoch": 528} {"train_loss": -9.755512237548828, "global_step": 88748, "epoch": 528} {"train_loss": -9.201114654541016, "global_step": 88749, "epoch": 528} {"train_loss": -9.547290802001953, "global_step": 88750, "epoch": 528} {"train_loss": -9.322141647338867, "global_step": 88751, "epoch": 528} {"train_loss": -9.49573040008545, "global_step": 88752, "epoch": 528} {"train_loss": -9.512044906616211, "global_step": 88753, "epoch": 528} {"train_loss": -9.406497955322266, "global_step": 88754, "epoch": 528} {"train_loss": -9.180715560913086, "global_step": 88755, "epoch": 528} {"train_loss": -9.290115356445312, "global_step": 88756, "epoch": 528} {"train_loss": -9.379891395568848, "global_step": 88757, "epoch": 528} {"train_loss": -9.359512329101562, "global_step": 88758, "epoch": 528} {"train_loss": -9.309818267822266, "global_step": 88759, "epoch": 528} {"train_loss": -9.22859001159668, "global_step": 88760, "epoch": 528} {"train_loss": -9.17977523803711, "global_step": 88761, "epoch": 528} {"train_loss": -9.260213851928711, "global_step": 88762, "epoch": 528} {"train_loss": -9.264979362487793, "global_step": 88763, "epoch": 528} {"train_loss": -9.458683013916016, "global_step": 88764, "epoch": 528} {"train_loss": -9.58836555480957, "global_step": 88765, "epoch": 528} {"train_loss": -9.539876937866211, "global_step": 88766, "epoch": 528} {"train_loss": -9.41492748260498, "global_step": 88767, "epoch": 528} {"train_loss": -9.496448516845703, "global_step": 88768, "epoch": 528} {"train_loss": -9.491483688354492, "global_step": 88769, "epoch": 528} {"train_loss": -9.384622573852539, "global_step": 88770, "epoch": 528} {"train_loss": -9.361827850341797, "global_step": 88771, "epoch": 528} {"train_loss": -9.414013862609863, "global_step": 88772, "epoch": 528} {"train_loss": -9.549787521362305, "global_step": 88773, "epoch": 528} {"train_loss": -9.382183074951172, "global_step": 88774, "epoch": 528} {"train_loss": -9.695270538330078, "global_step": 88775, "epoch": 528} {"train_loss": -9.563810348510742, "global_step": 88776, "epoch": 528} {"train_loss": -9.522665977478027, "global_step": 88777, "epoch": 528} {"train_loss": -9.565465927124023, "global_step": 88778, "epoch": 528} {"train_loss": -9.434576034545898, "global_step": 88779, "epoch": 528} {"train_loss": -9.45982837677002, "global_step": 88780, "epoch": 528} {"train_loss": -9.126832962036133, "global_step": 88781, "epoch": 528} {"train_loss": -9.613521575927734, "global_step": 88782, "epoch": 528} {"train_loss": -9.352149963378906, "global_step": 88783, "epoch": 528} {"train_loss": -9.222591400146484, "global_step": 88784, "epoch": 528} {"train_loss": -9.139986991882324, "global_step": 88785, "epoch": 528} {"train_loss": -9.442981719970703, "global_step": 88786, "epoch": 528} {"train_loss": -9.60835075378418, "global_step": 88787, "epoch": 528} {"train_loss": -9.079565048217773, "global_step": 88788, "epoch": 528} {"train_loss": -9.452242851257324, "global_step": 88789, "epoch": 528} {"train_loss": -8.898880004882812, "global_step": 88790, "epoch": 528} {"train_loss": -9.336935043334961, "global_step": 88791, "epoch": 528} {"train_loss": -9.382713317871094, "global_step": 88792, "epoch": 528} {"train_loss": -9.322360038757324, "global_step": 88793, "epoch": 528} {"train_loss": -9.167925834655762, "global_step": 88794, "epoch": 528} {"train_loss": -9.239315032958984, "global_step": 88795, "epoch": 528} {"train_loss": -9.277251243591309, "global_step": 88796, "epoch": 528} {"train_loss": -9.280651092529297, "global_step": 88797, "epoch": 528} {"train_loss": -9.13514518737793, "global_step": 88798, "epoch": 528} {"train_loss": -9.336223602294922, "global_step": 88799, "epoch": 528} {"train_loss": -9.403918266296387, "global_step": 88800, "epoch": 528} {"train_loss": -9.403512954711914, "global_step": 88801, "epoch": 528} {"train_loss": -9.48533821105957, "global_step": 88802, "epoch": 528} {"train_loss": -9.28421401977539, "global_step": 88803, "epoch": 528} {"train_loss": -9.381131172180176, "global_step": 88804, "epoch": 528} {"train_loss": -9.29673957824707, "global_step": 88805, "epoch": 528} {"train_loss": -9.01372241973877, "global_step": 88806, "epoch": 528} {"train_loss": -9.15534782409668, "global_step": 88807, "epoch": 528} {"train_loss": -9.320700645446777, "global_step": 88808, "epoch": 528} {"train_loss": -9.432107925415039, "global_step": 88809, "epoch": 528} {"train_loss": -8.847925186157227, "global_step": 88810, "epoch": 528} {"train_loss": -9.610355377197266, "global_step": 88811, "epoch": 528} {"train_loss": -9.083264350891113, "global_step": 88812, "epoch": 528} {"train_loss": -9.12093734741211, "global_step": 88813, "epoch": 528} {"train_loss": -9.213542938232422, "global_step": 88814, "epoch": 528} {"train_loss": -9.529138565063477, "global_step": 88815, "epoch": 528} {"train_loss": -9.368227005004883, "global_step": 88816, "epoch": 528} {"train_loss": -9.661686897277832, "global_step": 88817, "epoch": 528} {"train_loss": -9.365467071533203, "global_step": 88818, "epoch": 528} {"train_loss": -9.40544319152832, "global_step": 88819, "epoch": 528} {"train_loss": -9.472070693969727, "global_step": 88820, "epoch": 528} {"train_loss": -9.41071891784668, "global_step": 88821, "epoch": 528} {"train_loss": -9.548660278320312, "global_step": 88822, "epoch": 528} {"train_loss": -9.36881160736084, "global_step": 88823, "epoch": 528} {"train_loss": -9.467216491699219, "global_step": 88824, "epoch": 528} {"train_loss": -9.4690523147583, "global_step": 88825, "epoch": 528} {"train_loss": -9.497039794921875, "global_step": 88826, "epoch": 528} {"train_loss": -9.451311111450195, "global_step": 88827, "epoch": 528} {"train_loss": -9.566514015197754, "global_step": 88828, "epoch": 528} {"train_loss": -9.55707836151123, "global_step": 88829, "epoch": 528} {"train_loss": -9.520511627197266, "global_step": 88830, "epoch": 528} {"train_loss": -9.628990173339844, "global_step": 88831, "epoch": 528} {"train_loss": -9.445205688476562, "global_step": 88832, "epoch": 528} {"train_loss": -9.546058654785156, "global_step": 88833, "epoch": 528} {"train_loss": -9.638708114624023, "global_step": 88834, "epoch": 528} {"train_loss": -9.599836349487305, "global_step": 88835, "epoch": 528} {"train_loss": -9.505154609680176, "global_step": 88836, "epoch": 528} {"train_loss": -9.262150764465332, "global_step": 88837, "epoch": 528} {"train_loss": -9.760713577270508, "global_step": 88838, "epoch": 528} {"train_loss": -9.176717758178711, "global_step": 88839, "epoch": 528} {"train_loss": -9.348311424255371, "global_step": 88840, "epoch": 528} {"train_loss": -9.473590850830078, "global_step": 88841, "epoch": 528} {"train_loss": -9.333029747009277, "global_step": 88842, "epoch": 528} {"train_loss": -9.784309387207031, "global_step": 88843, "epoch": 528} {"train_loss": -9.258001327514648, "global_step": 88844, "epoch": 528} {"train_loss": -9.477947235107422, "global_step": 88845, "epoch": 528} {"train_loss": -9.386999130249023, "global_step": 88846, "epoch": 528} {"train_loss": -9.525134086608887, "global_step": 88847, "epoch": 528} {"train_loss": -9.712015151977539, "global_step": 88848, "epoch": 528} {"train_loss": -9.553852081298828, "global_step": 88849, "epoch": 528} {"train_loss": -9.578904151916504, "global_step": 88850, "epoch": 528} {"train_loss": -9.552032470703125, "global_step": 88851, "epoch": 528} {"train_loss": -9.56948184967041, "global_step": 88852, "epoch": 528} {"train_loss": -9.716133117675781, "global_step": 88853, "epoch": 528} {"train_loss": -9.106487274169922, "global_step": 88854, "epoch": 528} {"train_loss": -9.585899353027344, "global_step": 88855, "epoch": 528} {"train_loss": -9.546541213989258, "global_step": 88856, "epoch": 528} {"train_loss": -9.401656150817871, "global_step": 88857, "epoch": 528} {"train_loss": -9.669105529785156, "global_step": 88858, "epoch": 528} {"train_loss": -9.352965354919434, "global_step": 88859, "epoch": 528} {"train_loss": -9.237192153930664, "global_step": 88860, "epoch": 528} {"train_loss": -9.528493881225586, "global_step": 88861, "epoch": 528} {"train_loss": -9.448554992675781, "global_step": 88862, "epoch": 528} {"train_loss": -9.098743438720703, "global_step": 88863, "epoch": 528} {"train_loss": -9.312231063842773, "global_step": 88864, "epoch": 528} {"train_loss": -9.565244674682617, "global_step": 88865, "epoch": 528} {"train_loss": -9.130899429321289, "global_step": 88866, "epoch": 528} {"train_loss": -9.416915893554688, "global_step": 88867, "epoch": 528} {"train_loss": -9.231240272521973, "global_step": 88868, "epoch": 528} {"train_loss": -9.401802062988281, "global_step": 88869, "epoch": 528} {"train_loss": -9.196100234985352, "global_step": 88870, "epoch": 528} {"train_loss": -9.395734031995138, "global_step": 88871, "epoch": 528, "val_loss": 200588.421875} {"train_loss": -9.134824752807617, "global_step": 88872, "epoch": 529} {"train_loss": -9.078821182250977, "global_step": 88873, "epoch": 529} {"train_loss": -9.16008186340332, "global_step": 88874, "epoch": 529} {"train_loss": -9.399596214294434, "global_step": 88875, "epoch": 529} {"train_loss": -9.353104591369629, "global_step": 88876, "epoch": 529} {"train_loss": -9.59361457824707, "global_step": 88877, "epoch": 529} {"train_loss": -9.53530216217041, "global_step": 88878, "epoch": 529} {"train_loss": -9.212248802185059, "global_step": 88879, "epoch": 529} {"train_loss": -9.55313491821289, "global_step": 88880, "epoch": 529} {"train_loss": -9.403192520141602, "global_step": 88881, "epoch": 529} {"train_loss": -9.435931205749512, "global_step": 88882, "epoch": 529} {"train_loss": -9.492488861083984, "global_step": 88883, "epoch": 529} {"train_loss": -9.42647933959961, "global_step": 88884, "epoch": 529} {"train_loss": -9.456867218017578, "global_step": 88885, "epoch": 529} {"train_loss": -9.758391380310059, "global_step": 88886, "epoch": 529} {"train_loss": -9.62717056274414, "global_step": 88887, "epoch": 529} {"train_loss": -9.443724632263184, "global_step": 88888, "epoch": 529} {"train_loss": -9.532732009887695, "global_step": 88889, "epoch": 529} {"train_loss": -9.355013847351074, "global_step": 88890, "epoch": 529} {"train_loss": -9.654632568359375, "global_step": 88891, "epoch": 529} {"train_loss": -9.281248092651367, "global_step": 88892, "epoch": 529} {"train_loss": -9.303061485290527, "global_step": 88893, "epoch": 529} {"train_loss": -9.262038230895996, "global_step": 88894, "epoch": 529} {"train_loss": -9.22989273071289, "global_step": 88895, "epoch": 529} {"train_loss": -9.392663955688477, "global_step": 88896, "epoch": 529} {"train_loss": -9.332524299621582, "global_step": 88897, "epoch": 529} {"train_loss": -9.512750625610352, "global_step": 88898, "epoch": 529} {"train_loss": -9.289469718933105, "global_step": 88899, "epoch": 529} {"train_loss": -9.40939998626709, "global_step": 88900, "epoch": 529} {"train_loss": -9.39586353302002, "global_step": 88901, "epoch": 529} {"train_loss": -9.389534950256348, "global_step": 88902, "epoch": 529} {"train_loss": -9.545327186584473, "global_step": 88903, "epoch": 529} {"train_loss": -9.446900367736816, "global_step": 88904, "epoch": 529} {"train_loss": -9.47122573852539, "global_step": 88905, "epoch": 529} {"train_loss": -9.440756797790527, "global_step": 88906, "epoch": 529} {"train_loss": -9.563907623291016, "global_step": 88907, "epoch": 529} {"train_loss": -9.700484275817871, "global_step": 88908, "epoch": 529} {"train_loss": -9.395551681518555, "global_step": 88909, "epoch": 529} {"train_loss": -9.512306213378906, "global_step": 88910, "epoch": 529} {"train_loss": -9.487725257873535, "global_step": 88911, "epoch": 529} {"train_loss": -9.250823020935059, "global_step": 88912, "epoch": 529} {"train_loss": -9.557785034179688, "global_step": 88913, "epoch": 529} {"train_loss": -8.759841918945312, "global_step": 88914, "epoch": 529} {"train_loss": -9.5350923538208, "global_step": 88915, "epoch": 529} {"train_loss": -9.403661727905273, "global_step": 88916, "epoch": 529} {"train_loss": -9.282556533813477, "global_step": 88917, "epoch": 529} {"train_loss": -9.502028465270996, "global_step": 88918, "epoch": 529} {"train_loss": -9.220319747924805, "global_step": 88919, "epoch": 529} {"train_loss": -9.256645202636719, "global_step": 88920, "epoch": 529} {"train_loss": -9.664030075073242, "global_step": 88921, "epoch": 529} {"train_loss": -9.109800338745117, "global_step": 88922, "epoch": 529} {"train_loss": -9.527301788330078, "global_step": 88923, "epoch": 529} {"train_loss": -9.079692840576172, "global_step": 88924, "epoch": 529} {"train_loss": -9.331219673156738, "global_step": 88925, "epoch": 529} {"train_loss": -9.184600830078125, "global_step": 88926, "epoch": 529} {"train_loss": -9.36286449432373, "global_step": 88927, "epoch": 529} {"train_loss": -9.189874649047852, "global_step": 88928, "epoch": 529} {"train_loss": -9.385251998901367, "global_step": 88929, "epoch": 529} {"train_loss": -9.132124900817871, "global_step": 88930, "epoch": 529} {"train_loss": -9.17051887512207, "global_step": 88931, "epoch": 529} {"train_loss": -9.443020820617676, "global_step": 88932, "epoch": 529} {"train_loss": -9.27639389038086, "global_step": 88933, "epoch": 529} {"train_loss": -9.14963150024414, "global_step": 88934, "epoch": 529} {"train_loss": -9.51046371459961, "global_step": 88935, "epoch": 529} {"train_loss": -9.361897468566895, "global_step": 88936, "epoch": 529} {"train_loss": -9.448042869567871, "global_step": 88937, "epoch": 529} {"train_loss": -9.61114501953125, "global_step": 88938, "epoch": 529} {"train_loss": -9.583318710327148, "global_step": 88939, "epoch": 529} {"train_loss": -9.582496643066406, "global_step": 88940, "epoch": 529} {"train_loss": -9.283182144165039, "global_step": 88941, "epoch": 529} {"train_loss": -9.344257354736328, "global_step": 88942, "epoch": 529} {"train_loss": -9.668598175048828, "global_step": 88943, "epoch": 529} {"train_loss": -9.518141746520996, "global_step": 88944, "epoch": 529} {"train_loss": -9.337766647338867, "global_step": 88945, "epoch": 529} {"train_loss": -9.084339141845703, "global_step": 88946, "epoch": 529} {"train_loss": -9.407075881958008, "global_step": 88947, "epoch": 529} {"train_loss": -9.650715827941895, "global_step": 88948, "epoch": 529} {"train_loss": -9.491289138793945, "global_step": 88949, "epoch": 529} {"train_loss": -9.591870307922363, "global_step": 88950, "epoch": 529} {"train_loss": -9.480138778686523, "global_step": 88951, "epoch": 529} {"train_loss": -9.438949584960938, "global_step": 88952, "epoch": 529} {"train_loss": -9.27081298828125, "global_step": 88953, "epoch": 529} {"train_loss": -9.508633613586426, "global_step": 88954, "epoch": 529} {"train_loss": -9.678964614868164, "global_step": 88955, "epoch": 529} {"train_loss": -9.378683090209961, "global_step": 88956, "epoch": 529} {"train_loss": -9.627424240112305, "global_step": 88957, "epoch": 529} {"train_loss": -9.526180267333984, "global_step": 88958, "epoch": 529} {"train_loss": -9.229368209838867, "global_step": 88959, "epoch": 529} {"train_loss": -9.583359718322754, "global_step": 88960, "epoch": 529} {"train_loss": -9.408599853515625, "global_step": 88961, "epoch": 529} {"train_loss": -9.377388000488281, "global_step": 88962, "epoch": 529} {"train_loss": -9.65670394897461, "global_step": 88963, "epoch": 529} {"train_loss": -9.604028701782227, "global_step": 88964, "epoch": 529} {"train_loss": -9.397705078125, "global_step": 88965, "epoch": 529} {"train_loss": -9.624334335327148, "global_step": 88966, "epoch": 529} {"train_loss": -9.176254272460938, "global_step": 88967, "epoch": 529} {"train_loss": -9.545426368713379, "global_step": 88968, "epoch": 529} {"train_loss": -9.432939529418945, "global_step": 88969, "epoch": 529} {"train_loss": -9.230088233947754, "global_step": 88970, "epoch": 529} {"train_loss": -9.486503601074219, "global_step": 88971, "epoch": 529} {"train_loss": -9.535469055175781, "global_step": 88972, "epoch": 529} {"train_loss": -9.662538528442383, "global_step": 88973, "epoch": 529} {"train_loss": -9.391178131103516, "global_step": 88974, "epoch": 529} {"train_loss": -9.563063621520996, "global_step": 88975, "epoch": 529} {"train_loss": -9.542747497558594, "global_step": 88976, "epoch": 529} {"train_loss": -9.565208435058594, "global_step": 88977, "epoch": 529} {"train_loss": -9.679937362670898, "global_step": 88978, "epoch": 529} {"train_loss": -9.60204792022705, "global_step": 88979, "epoch": 529} {"train_loss": -9.797943115234375, "global_step": 88980, "epoch": 529} {"train_loss": -9.713608741760254, "global_step": 88981, "epoch": 529} {"train_loss": -9.40383529663086, "global_step": 88982, "epoch": 529} {"train_loss": -9.709321975708008, "global_step": 88983, "epoch": 529} {"train_loss": -9.688671112060547, "global_step": 88984, "epoch": 529} {"train_loss": -9.799137115478516, "global_step": 88985, "epoch": 529} {"train_loss": -9.54963493347168, "global_step": 88986, "epoch": 529} {"train_loss": -9.69493293762207, "global_step": 88987, "epoch": 529} {"train_loss": -9.259516716003418, "global_step": 88988, "epoch": 529} {"train_loss": -8.882438659667969, "global_step": 88989, "epoch": 529} {"train_loss": -9.382453918457031, "global_step": 88990, "epoch": 529} {"train_loss": -8.861154556274414, "global_step": 88991, "epoch": 529} {"train_loss": -9.30616569519043, "global_step": 88992, "epoch": 529} {"train_loss": -9.28302001953125, "global_step": 88993, "epoch": 529} {"train_loss": -9.272031784057617, "global_step": 88994, "epoch": 529} {"train_loss": -9.413092613220215, "global_step": 88995, "epoch": 529} {"train_loss": -9.414844512939453, "global_step": 88996, "epoch": 529} {"train_loss": -9.232763290405273, "global_step": 88997, "epoch": 529} {"train_loss": -9.298515319824219, "global_step": 88998, "epoch": 529} {"train_loss": -9.414109230041504, "global_step": 88999, "epoch": 529} {"train_loss": -9.3228178024292, "global_step": 89000, "epoch": 529} {"train_loss": -9.209748268127441, "global_step": 89001, "epoch": 529} {"train_loss": -9.64230728149414, "global_step": 89002, "epoch": 529} {"train_loss": -9.403501510620117, "global_step": 89003, "epoch": 529} {"train_loss": -9.343480110168457, "global_step": 89004, "epoch": 529} {"train_loss": -9.582283020019531, "global_step": 89005, "epoch": 529} {"train_loss": -9.677160263061523, "global_step": 89006, "epoch": 529} {"train_loss": -9.309720993041992, "global_step": 89007, "epoch": 529} {"train_loss": -9.493196487426758, "global_step": 89008, "epoch": 529} {"train_loss": -9.486860275268555, "global_step": 89009, "epoch": 529} {"train_loss": -9.37073802947998, "global_step": 89010, "epoch": 529} {"train_loss": -9.734838485717773, "global_step": 89011, "epoch": 529} {"train_loss": -9.668827056884766, "global_step": 89012, "epoch": 529} {"train_loss": -9.688631057739258, "global_step": 89013, "epoch": 529} {"train_loss": -9.710761070251465, "global_step": 89014, "epoch": 529} {"train_loss": -9.35975170135498, "global_step": 89015, "epoch": 529} {"train_loss": -9.725689888000488, "global_step": 89016, "epoch": 529} {"train_loss": -9.323436737060547, "global_step": 89017, "epoch": 529} {"train_loss": -9.691572189331055, "global_step": 89018, "epoch": 529} {"train_loss": -9.44561767578125, "global_step": 89019, "epoch": 529} {"train_loss": -9.274561882019043, "global_step": 89020, "epoch": 529} {"train_loss": -9.419600486755371, "global_step": 89021, "epoch": 529} {"train_loss": -8.34666633605957, "global_step": 89022, "epoch": 529} {"train_loss": -9.566740036010742, "global_step": 89023, "epoch": 529} {"train_loss": -8.756148338317871, "global_step": 89024, "epoch": 529} {"train_loss": -9.047918319702148, "global_step": 89025, "epoch": 529} {"train_loss": -8.930899620056152, "global_step": 89026, "epoch": 529} {"train_loss": -9.088552474975586, "global_step": 89027, "epoch": 529} {"train_loss": -9.196393966674805, "global_step": 89028, "epoch": 529} {"train_loss": -9.057884216308594, "global_step": 89029, "epoch": 529} {"train_loss": -9.375556945800781, "global_step": 89030, "epoch": 529} {"train_loss": -9.131009101867676, "global_step": 89031, "epoch": 529} {"train_loss": -9.358663558959961, "global_step": 89032, "epoch": 529} {"train_loss": -9.168115615844727, "global_step": 89033, "epoch": 529} {"train_loss": -9.307565689086914, "global_step": 89034, "epoch": 529} {"train_loss": -9.25362491607666, "global_step": 89035, "epoch": 529} {"train_loss": -9.418844223022461, "global_step": 89036, "epoch": 529} {"train_loss": -9.350982666015625, "global_step": 89037, "epoch": 529} {"train_loss": -9.23547077178955, "global_step": 89038, "epoch": 529} {"train_loss": -9.402372672444297, "global_step": 89039, "epoch": 529, "val_loss": 198420.59375} {"train_loss": -9.113317489624023, "global_step": 89040, "epoch": 530} {"train_loss": -9.48499870300293, "global_step": 89041, "epoch": 530} {"train_loss": -9.44984245300293, "global_step": 89042, "epoch": 530} {"train_loss": -9.338714599609375, "global_step": 89043, "epoch": 530} {"train_loss": -9.481149673461914, "global_step": 89044, "epoch": 530} {"train_loss": -9.66090202331543, "global_step": 89045, "epoch": 530} {"train_loss": -9.59206771850586, "global_step": 89046, "epoch": 530} {"train_loss": -9.436203002929688, "global_step": 89047, "epoch": 530} {"train_loss": -9.52830982208252, "global_step": 89048, "epoch": 530} {"train_loss": -9.459440231323242, "global_step": 89049, "epoch": 530} {"train_loss": -9.476491928100586, "global_step": 89050, "epoch": 530} {"train_loss": -9.508659362792969, "global_step": 89051, "epoch": 530} {"train_loss": -9.65093994140625, "global_step": 89052, "epoch": 530} {"train_loss": -9.61091136932373, "global_step": 89053, "epoch": 530} {"train_loss": -9.543476104736328, "global_step": 89054, "epoch": 530} {"train_loss": -9.55688762664795, "global_step": 89055, "epoch": 530} {"train_loss": -9.446011543273926, "global_step": 89056, "epoch": 530} {"train_loss": -9.386343002319336, "global_step": 89057, "epoch": 530} {"train_loss": -9.440902709960938, "global_step": 89058, "epoch": 530} {"train_loss": -9.488100051879883, "global_step": 89059, "epoch": 530} {"train_loss": -9.544301986694336, "global_step": 89060, "epoch": 530} {"train_loss": -9.462727546691895, "global_step": 89061, "epoch": 530} {"train_loss": -9.440407752990723, "global_step": 89062, "epoch": 530} {"train_loss": -9.061651229858398, "global_step": 89063, "epoch": 530} {"train_loss": -9.430506706237793, "global_step": 89064, "epoch": 530} {"train_loss": -8.557568550109863, "global_step": 89065, "epoch": 530} {"train_loss": -9.512738227844238, "global_step": 89066, "epoch": 530} {"train_loss": -8.949708938598633, "global_step": 89067, "epoch": 530} {"train_loss": -9.22874641418457, "global_step": 89068, "epoch": 530} {"train_loss": -9.099566459655762, "global_step": 89069, "epoch": 530} {"train_loss": -9.160781860351562, "global_step": 89070, "epoch": 530} {"train_loss": -8.638704299926758, "global_step": 89071, "epoch": 530} {"train_loss": -9.161127090454102, "global_step": 89072, "epoch": 530} {"train_loss": -8.860681533813477, "global_step": 89073, "epoch": 530} {"train_loss": -9.04865837097168, "global_step": 89074, "epoch": 530} {"train_loss": -9.0072603225708, "global_step": 89075, "epoch": 530} {"train_loss": -9.204452514648438, "global_step": 89076, "epoch": 530} {"train_loss": -8.986909866333008, "global_step": 89077, "epoch": 530} {"train_loss": -9.33740234375, "global_step": 89078, "epoch": 530} {"train_loss": -9.236422538757324, "global_step": 89079, "epoch": 530} {"train_loss": -9.318939208984375, "global_step": 89080, "epoch": 530} {"train_loss": -9.642070770263672, "global_step": 89081, "epoch": 530} {"train_loss": -9.364826202392578, "global_step": 89082, "epoch": 530} {"train_loss": -9.097172737121582, "global_step": 89083, "epoch": 530} {"train_loss": -9.361349105834961, "global_step": 89084, "epoch": 530} {"train_loss": -9.525216102600098, "global_step": 89085, "epoch": 530} {"train_loss": -9.166662216186523, "global_step": 89086, "epoch": 530} {"train_loss": -9.508027076721191, "global_step": 89087, "epoch": 530} {"train_loss": -9.270421981811523, "global_step": 89088, "epoch": 530} {"train_loss": -9.048458099365234, "global_step": 89089, "epoch": 530} {"train_loss": -9.338467597961426, "global_step": 89090, "epoch": 530} {"train_loss": -9.273016929626465, "global_step": 89091, "epoch": 530} {"train_loss": -9.223161697387695, "global_step": 89092, "epoch": 530} {"train_loss": -9.369815826416016, "global_step": 89093, "epoch": 530} {"train_loss": -9.314279556274414, "global_step": 89094, "epoch": 530} {"train_loss": -9.598501205444336, "global_step": 89095, "epoch": 530} {"train_loss": -9.328330993652344, "global_step": 89096, "epoch": 530} {"train_loss": -9.358612060546875, "global_step": 89097, "epoch": 530} {"train_loss": -9.533519744873047, "global_step": 89098, "epoch": 530} {"train_loss": -9.665146827697754, "global_step": 89099, "epoch": 530} {"train_loss": -9.657379150390625, "global_step": 89100, "epoch": 530} {"train_loss": -9.345527648925781, "global_step": 89101, "epoch": 530} {"train_loss": -9.65447998046875, "global_step": 89102, "epoch": 530} {"train_loss": -9.475890159606934, "global_step": 89103, "epoch": 530} {"train_loss": -9.519420623779297, "global_step": 89104, "epoch": 530} {"train_loss": -9.595056533813477, "global_step": 89105, "epoch": 530} {"train_loss": -9.408299446105957, "global_step": 89106, "epoch": 530} {"train_loss": -9.67800521850586, "global_step": 89107, "epoch": 530} {"train_loss": -9.645988464355469, "global_step": 89108, "epoch": 530} {"train_loss": -9.517093658447266, "global_step": 89109, "epoch": 530} {"train_loss": -9.562127113342285, "global_step": 89110, "epoch": 530} {"train_loss": -9.444477081298828, "global_step": 89111, "epoch": 530} {"train_loss": -9.895957946777344, "global_step": 89112, "epoch": 530} {"train_loss": -9.621045112609863, "global_step": 89113, "epoch": 530} {"train_loss": -9.475208282470703, "global_step": 89114, "epoch": 530} {"train_loss": -9.620073318481445, "global_step": 89115, "epoch": 530} {"train_loss": -9.478395462036133, "global_step": 89116, "epoch": 530} {"train_loss": -9.516642570495605, "global_step": 89117, "epoch": 530} {"train_loss": -9.429100036621094, "global_step": 89118, "epoch": 530} {"train_loss": -9.463663101196289, "global_step": 89119, "epoch": 530} {"train_loss": -9.320524215698242, "global_step": 89120, "epoch": 530} {"train_loss": -9.748805046081543, "global_step": 89121, "epoch": 530} {"train_loss": -9.432229042053223, "global_step": 89122, "epoch": 530} {"train_loss": -9.606843948364258, "global_step": 89123, "epoch": 530} {"train_loss": -9.713035583496094, "global_step": 89124, "epoch": 530} {"train_loss": -9.380447387695312, "global_step": 89125, "epoch": 530} {"train_loss": -9.439094543457031, "global_step": 89126, "epoch": 530} {"train_loss": -9.322929382324219, "global_step": 89127, "epoch": 530} {"train_loss": -9.402074813842773, "global_step": 89128, "epoch": 530} {"train_loss": -9.205368041992188, "global_step": 89129, "epoch": 530} {"train_loss": -9.359050750732422, "global_step": 89130, "epoch": 530} {"train_loss": -9.363641738891602, "global_step": 89131, "epoch": 530} {"train_loss": -9.374902725219727, "global_step": 89132, "epoch": 530} {"train_loss": -8.996129989624023, "global_step": 89133, "epoch": 530} {"train_loss": -9.425458908081055, "global_step": 89134, "epoch": 530} {"train_loss": -9.448530197143555, "global_step": 89135, "epoch": 530} {"train_loss": -8.845086097717285, "global_step": 89136, "epoch": 530} {"train_loss": -9.112366676330566, "global_step": 89137, "epoch": 530} {"train_loss": -9.204715728759766, "global_step": 89138, "epoch": 530} {"train_loss": -9.413030624389648, "global_step": 89139, "epoch": 530} {"train_loss": -8.915996551513672, "global_step": 89140, "epoch": 530} {"train_loss": -8.983379364013672, "global_step": 89141, "epoch": 530} {"train_loss": -8.898934364318848, "global_step": 89142, "epoch": 530} {"train_loss": -8.7874116897583, "global_step": 89143, "epoch": 530} {"train_loss": -9.270602226257324, "global_step": 89144, "epoch": 530} {"train_loss": -9.123558044433594, "global_step": 89145, "epoch": 530} {"train_loss": -9.104073524475098, "global_step": 89146, "epoch": 530} {"train_loss": -9.472662925720215, "global_step": 89147, "epoch": 530} {"train_loss": -9.265321731567383, "global_step": 89148, "epoch": 530} {"train_loss": -9.123851776123047, "global_step": 89149, "epoch": 530} {"train_loss": -9.075579643249512, "global_step": 89150, "epoch": 530} {"train_loss": -9.196008682250977, "global_step": 89151, "epoch": 530} {"train_loss": -9.181790351867676, "global_step": 89152, "epoch": 530} {"train_loss": -9.207005500793457, "global_step": 89153, "epoch": 530} {"train_loss": -9.174200057983398, "global_step": 89154, "epoch": 530} {"train_loss": -9.294479370117188, "global_step": 89155, "epoch": 530} {"train_loss": -8.959488868713379, "global_step": 89156, "epoch": 530} {"train_loss": -9.26753044128418, "global_step": 89157, "epoch": 530} {"train_loss": -9.337068557739258, "global_step": 89158, "epoch": 530} {"train_loss": -9.30999755859375, "global_step": 89159, "epoch": 530} {"train_loss": -9.669466972351074, "global_step": 89160, "epoch": 530} {"train_loss": -9.076343536376953, "global_step": 89161, "epoch": 530} {"train_loss": -9.422640800476074, "global_step": 89162, "epoch": 530} {"train_loss": -9.40157699584961, "global_step": 89163, "epoch": 530} {"train_loss": -9.351451873779297, "global_step": 89164, "epoch": 530} {"train_loss": -9.425600051879883, "global_step": 89165, "epoch": 530} {"train_loss": -9.320660591125488, "global_step": 89166, "epoch": 530} {"train_loss": -9.436290740966797, "global_step": 89167, "epoch": 530} {"train_loss": -9.298158645629883, "global_step": 89168, "epoch": 530} {"train_loss": -9.736714363098145, "global_step": 89169, "epoch": 530} {"train_loss": -9.553715705871582, "global_step": 89170, "epoch": 530} {"train_loss": -9.457887649536133, "global_step": 89171, "epoch": 530} {"train_loss": -9.731877326965332, "global_step": 89172, "epoch": 530} {"train_loss": -9.337285995483398, "global_step": 89173, "epoch": 530} {"train_loss": -9.421173095703125, "global_step": 89174, "epoch": 530} {"train_loss": -9.676036834716797, "global_step": 89175, "epoch": 530} {"train_loss": -9.556591987609863, "global_step": 89176, "epoch": 530} {"train_loss": -9.3382568359375, "global_step": 89177, "epoch": 530} {"train_loss": -9.405351638793945, "global_step": 89178, "epoch": 530} {"train_loss": -9.57079792022705, "global_step": 89179, "epoch": 530} {"train_loss": -9.456214904785156, "global_step": 89180, "epoch": 530} {"train_loss": -9.420894622802734, "global_step": 89181, "epoch": 530} {"train_loss": -9.163701057434082, "global_step": 89182, "epoch": 530} {"train_loss": -9.423368453979492, "global_step": 89183, "epoch": 530} {"train_loss": -9.116259574890137, "global_step": 89184, "epoch": 530} {"train_loss": -9.763923645019531, "global_step": 89185, "epoch": 530} {"train_loss": -9.287385940551758, "global_step": 89186, "epoch": 530} {"train_loss": -9.31126594543457, "global_step": 89187, "epoch": 530} {"train_loss": -9.399259567260742, "global_step": 89188, "epoch": 530} {"train_loss": -9.504602432250977, "global_step": 89189, "epoch": 530} {"train_loss": -9.285982131958008, "global_step": 89190, "epoch": 530} {"train_loss": -9.346506118774414, "global_step": 89191, "epoch": 530} {"train_loss": -9.193082809448242, "global_step": 89192, "epoch": 530} {"train_loss": -9.283756256103516, "global_step": 89193, "epoch": 530} {"train_loss": -9.461931228637695, "global_step": 89194, "epoch": 530} {"train_loss": -9.064188003540039, "global_step": 89195, "epoch": 530} {"train_loss": -9.461341857910156, "global_step": 89196, "epoch": 530} {"train_loss": -9.535728454589844, "global_step": 89197, "epoch": 530} {"train_loss": -9.42839241027832, "global_step": 89198, "epoch": 530} {"train_loss": -9.453733444213867, "global_step": 89199, "epoch": 530} {"train_loss": -9.309042930603027, "global_step": 89200, "epoch": 530} {"train_loss": -9.168343544006348, "global_step": 89201, "epoch": 530} {"train_loss": -9.653841972351074, "global_step": 89202, "epoch": 530} {"train_loss": -9.373725891113281, "global_step": 89203, "epoch": 530} {"train_loss": -9.544055938720703, "global_step": 89204, "epoch": 530} {"train_loss": -9.238222122192383, "global_step": 89205, "epoch": 530} {"train_loss": -9.609272956848145, "global_step": 89206, "epoch": 530} {"train_loss": -9.362594661258516, "global_step": 89207, "epoch": 530, "val_loss": 201664.078125, "train_action_mse_error": 2.1461422443389893} {"train_loss": -9.50832748413086, "global_step": 89208, "epoch": 531} {"train_loss": -9.459630966186523, "global_step": 89209, "epoch": 531} {"train_loss": -9.625360488891602, "global_step": 89210, "epoch": 531} {"train_loss": -9.52182388305664, "global_step": 89211, "epoch": 531} {"train_loss": -9.688619613647461, "global_step": 89212, "epoch": 531} {"train_loss": -9.479269027709961, "global_step": 89213, "epoch": 531} {"train_loss": -9.635843276977539, "global_step": 89214, "epoch": 531} {"train_loss": -9.451136589050293, "global_step": 89215, "epoch": 531} {"train_loss": -9.462350845336914, "global_step": 89216, "epoch": 531} {"train_loss": -9.500495910644531, "global_step": 89217, "epoch": 531} {"train_loss": -9.225790977478027, "global_step": 89218, "epoch": 531} {"train_loss": -9.200617790222168, "global_step": 89219, "epoch": 531} {"train_loss": -9.464406967163086, "global_step": 89220, "epoch": 531} {"train_loss": -9.300350189208984, "global_step": 89221, "epoch": 531} {"train_loss": -9.759725570678711, "global_step": 89222, "epoch": 531} {"train_loss": -8.973384857177734, "global_step": 89223, "epoch": 531} {"train_loss": -9.363554000854492, "global_step": 89224, "epoch": 531} {"train_loss": -9.054559707641602, "global_step": 89225, "epoch": 531} {"train_loss": -9.057271957397461, "global_step": 89226, "epoch": 531} {"train_loss": -9.17502212524414, "global_step": 89227, "epoch": 531} {"train_loss": -9.379672050476074, "global_step": 89228, "epoch": 531} {"train_loss": -9.354817390441895, "global_step": 89229, "epoch": 531} {"train_loss": -9.027749061584473, "global_step": 89230, "epoch": 531} {"train_loss": -9.650253295898438, "global_step": 89231, "epoch": 531} {"train_loss": -9.34197998046875, "global_step": 89232, "epoch": 531} {"train_loss": -8.99837875366211, "global_step": 89233, "epoch": 531} {"train_loss": -8.89797306060791, "global_step": 89234, "epoch": 531} {"train_loss": -9.22468376159668, "global_step": 89235, "epoch": 531} {"train_loss": -9.056325912475586, "global_step": 89236, "epoch": 531} {"train_loss": -9.113511085510254, "global_step": 89237, "epoch": 531} {"train_loss": -9.117368698120117, "global_step": 89238, "epoch": 531} {"train_loss": -9.389543533325195, "global_step": 89239, "epoch": 531} {"train_loss": -9.370148658752441, "global_step": 89240, "epoch": 531} {"train_loss": -9.340065956115723, "global_step": 89241, "epoch": 531} {"train_loss": -9.406927108764648, "global_step": 89242, "epoch": 531} {"train_loss": -9.382194519042969, "global_step": 89243, "epoch": 531} {"train_loss": -9.552305221557617, "global_step": 89244, "epoch": 531} {"train_loss": -9.504255294799805, "global_step": 89245, "epoch": 531} {"train_loss": -9.28990364074707, "global_step": 89246, "epoch": 531} {"train_loss": -9.514094352722168, "global_step": 89247, "epoch": 531} {"train_loss": -9.280754089355469, "global_step": 89248, "epoch": 531} {"train_loss": -9.535984992980957, "global_step": 89249, "epoch": 531} {"train_loss": -9.28261947631836, "global_step": 89250, "epoch": 531} {"train_loss": -9.401641845703125, "global_step": 89251, "epoch": 531} {"train_loss": -9.128389358520508, "global_step": 89252, "epoch": 531} {"train_loss": -9.41145133972168, "global_step": 89253, "epoch": 531} {"train_loss": -9.410669326782227, "global_step": 89254, "epoch": 531} {"train_loss": -9.351154327392578, "global_step": 89255, "epoch": 531} {"train_loss": -9.37880802154541, "global_step": 89256, "epoch": 531} {"train_loss": -9.404556274414062, "global_step": 89257, "epoch": 531} {"train_loss": -9.249309539794922, "global_step": 89258, "epoch": 531} {"train_loss": -9.454211235046387, "global_step": 89259, "epoch": 531} {"train_loss": -9.111984252929688, "global_step": 89260, "epoch": 531} {"train_loss": -9.262688636779785, "global_step": 89261, "epoch": 531} {"train_loss": -9.208248138427734, "global_step": 89262, "epoch": 531} {"train_loss": -9.39187240600586, "global_step": 89263, "epoch": 531} {"train_loss": -9.010478973388672, "global_step": 89264, "epoch": 531} {"train_loss": -9.467079162597656, "global_step": 89265, "epoch": 531} {"train_loss": -9.163917541503906, "global_step": 89266, "epoch": 531} {"train_loss": -9.413515090942383, "global_step": 89267, "epoch": 531} {"train_loss": -9.315449714660645, "global_step": 89268, "epoch": 531} {"train_loss": -9.003110885620117, "global_step": 89269, "epoch": 531} {"train_loss": -9.676122665405273, "global_step": 89270, "epoch": 531} {"train_loss": -9.375410079956055, "global_step": 89271, "epoch": 531} {"train_loss": -9.414593696594238, "global_step": 89272, "epoch": 531} {"train_loss": -9.761614799499512, "global_step": 89273, "epoch": 531} {"train_loss": -9.709840774536133, "global_step": 89274, "epoch": 531} {"train_loss": -9.577065467834473, "global_step": 89275, "epoch": 531} {"train_loss": -9.49741268157959, "global_step": 89276, "epoch": 531} {"train_loss": -9.450187683105469, "global_step": 89277, "epoch": 531} {"train_loss": -9.567211151123047, "global_step": 89278, "epoch": 531} {"train_loss": -9.623973846435547, "global_step": 89279, "epoch": 531} {"train_loss": -9.648698806762695, "global_step": 89280, "epoch": 531} {"train_loss": -9.533203125, "global_step": 89281, "epoch": 531} {"train_loss": -9.493194580078125, "global_step": 89282, "epoch": 531} {"train_loss": -9.65264892578125, "global_step": 89283, "epoch": 531} {"train_loss": -9.400044441223145, "global_step": 89284, "epoch": 531} {"train_loss": -9.712798118591309, "global_step": 89285, "epoch": 531} {"train_loss": -9.65742301940918, "global_step": 89286, "epoch": 531} {"train_loss": -9.563292503356934, "global_step": 89287, "epoch": 531} {"train_loss": -9.560565948486328, "global_step": 89288, "epoch": 531} {"train_loss": -9.400568962097168, "global_step": 89289, "epoch": 531} {"train_loss": -9.45018196105957, "global_step": 89290, "epoch": 531} {"train_loss": -9.55306625366211, "global_step": 89291, "epoch": 531} {"train_loss": -9.642452239990234, "global_step": 89292, "epoch": 531} {"train_loss": -9.042057991027832, "global_step": 89293, "epoch": 531} {"train_loss": -9.293331146240234, "global_step": 89294, "epoch": 531} {"train_loss": -9.343865394592285, "global_step": 89295, "epoch": 531} {"train_loss": -9.237781524658203, "global_step": 89296, "epoch": 531} {"train_loss": -9.116880416870117, "global_step": 89297, "epoch": 531} {"train_loss": -9.352584838867188, "global_step": 89298, "epoch": 531} {"train_loss": -9.056802749633789, "global_step": 89299, "epoch": 531} {"train_loss": -9.22561264038086, "global_step": 89300, "epoch": 531} {"train_loss": -9.213241577148438, "global_step": 89301, "epoch": 531} {"train_loss": -9.64837646484375, "global_step": 89302, "epoch": 531} {"train_loss": -9.114168167114258, "global_step": 89303, "epoch": 531} {"train_loss": -9.50786018371582, "global_step": 89304, "epoch": 531} {"train_loss": -9.140121459960938, "global_step": 89305, "epoch": 531} {"train_loss": -9.311620712280273, "global_step": 89306, "epoch": 531} {"train_loss": -8.866125106811523, "global_step": 89307, "epoch": 531} {"train_loss": -9.13397216796875, "global_step": 89308, "epoch": 531} {"train_loss": -9.211995124816895, "global_step": 89309, "epoch": 531} {"train_loss": -9.178829193115234, "global_step": 89310, "epoch": 531} {"train_loss": -9.377242088317871, "global_step": 89311, "epoch": 531} {"train_loss": -8.922472953796387, "global_step": 89312, "epoch": 531} {"train_loss": -9.29854679107666, "global_step": 89313, "epoch": 531} {"train_loss": -9.328872680664062, "global_step": 89314, "epoch": 531} {"train_loss": -9.437646865844727, "global_step": 89315, "epoch": 531} {"train_loss": -9.371261596679688, "global_step": 89316, "epoch": 531} {"train_loss": -9.303181648254395, "global_step": 89317, "epoch": 531} {"train_loss": -9.43010139465332, "global_step": 89318, "epoch": 531} {"train_loss": -9.283273696899414, "global_step": 89319, "epoch": 531} {"train_loss": -9.530888557434082, "global_step": 89320, "epoch": 531} {"train_loss": -9.377144813537598, "global_step": 89321, "epoch": 531} {"train_loss": -9.401632308959961, "global_step": 89322, "epoch": 531} {"train_loss": -9.337373733520508, "global_step": 89323, "epoch": 531} {"train_loss": -9.577218055725098, "global_step": 89324, "epoch": 531} {"train_loss": -9.397226333618164, "global_step": 89325, "epoch": 531} {"train_loss": -9.621253967285156, "global_step": 89326, "epoch": 531} {"train_loss": -9.318793296813965, "global_step": 89327, "epoch": 531} {"train_loss": -9.14258098602295, "global_step": 89328, "epoch": 531} {"train_loss": -9.422998428344727, "global_step": 89329, "epoch": 531} {"train_loss": -9.379912376403809, "global_step": 89330, "epoch": 531} {"train_loss": -9.475699424743652, "global_step": 89331, "epoch": 531} {"train_loss": -9.333948135375977, "global_step": 89332, "epoch": 531} {"train_loss": -9.005423545837402, "global_step": 89333, "epoch": 531} {"train_loss": -9.22136402130127, "global_step": 89334, "epoch": 531} {"train_loss": -9.150337219238281, "global_step": 89335, "epoch": 531} {"train_loss": -9.388362884521484, "global_step": 89336, "epoch": 531} {"train_loss": -9.224748611450195, "global_step": 89337, "epoch": 531} {"train_loss": -9.416940689086914, "global_step": 89338, "epoch": 531} {"train_loss": -9.52177619934082, "global_step": 89339, "epoch": 531} {"train_loss": -9.36947250366211, "global_step": 89340, "epoch": 531} {"train_loss": -9.57395076751709, "global_step": 89341, "epoch": 531} {"train_loss": -9.501983642578125, "global_step": 89342, "epoch": 531} {"train_loss": -9.26259708404541, "global_step": 89343, "epoch": 531} {"train_loss": -9.518712997436523, "global_step": 89344, "epoch": 531} {"train_loss": -9.674999237060547, "global_step": 89345, "epoch": 531} {"train_loss": -9.497201919555664, "global_step": 89346, "epoch": 531} {"train_loss": -9.493473052978516, "global_step": 89347, "epoch": 531} {"train_loss": -9.486044883728027, "global_step": 89348, "epoch": 531} {"train_loss": -9.790610313415527, "global_step": 89349, "epoch": 531} {"train_loss": -9.514089584350586, "global_step": 89350, "epoch": 531} {"train_loss": -9.699535369873047, "global_step": 89351, "epoch": 531} {"train_loss": -9.599964141845703, "global_step": 89352, "epoch": 531} {"train_loss": -9.6539306640625, "global_step": 89353, "epoch": 531} {"train_loss": -9.553919792175293, "global_step": 89354, "epoch": 531} {"train_loss": -9.684857368469238, "global_step": 89355, "epoch": 531} {"train_loss": -9.279449462890625, "global_step": 89356, "epoch": 531} {"train_loss": -9.3601713180542, "global_step": 89357, "epoch": 531} {"train_loss": -9.382392883300781, "global_step": 89358, "epoch": 531} {"train_loss": -9.666915893554688, "global_step": 89359, "epoch": 531} {"train_loss": -9.500360488891602, "global_step": 89360, "epoch": 531} {"train_loss": -9.418988227844238, "global_step": 89361, "epoch": 531} {"train_loss": -9.506616592407227, "global_step": 89362, "epoch": 531} {"train_loss": -9.54971981048584, "global_step": 89363, "epoch": 531} {"train_loss": -9.464441299438477, "global_step": 89364, "epoch": 531} {"train_loss": -9.4856595993042, "global_step": 89365, "epoch": 531} {"train_loss": -9.567681312561035, "global_step": 89366, "epoch": 531} {"train_loss": -9.550315856933594, "global_step": 89367, "epoch": 531} {"train_loss": -9.160852432250977, "global_step": 89368, "epoch": 531} {"train_loss": -9.65943717956543, "global_step": 89369, "epoch": 531} {"train_loss": -9.469011306762695, "global_step": 89370, "epoch": 531} {"train_loss": -9.378910064697266, "global_step": 89371, "epoch": 531} {"train_loss": -9.604340553283691, "global_step": 89372, "epoch": 531} {"train_loss": -9.357229232788086, "global_step": 89373, "epoch": 531} {"train_loss": -9.611907958984375, "global_step": 89374, "epoch": 531} {"train_loss": -9.390521742048717, "global_step": 89375, "epoch": 531, "val_loss": 202290.671875} {"train_loss": -9.460846900939941, "global_step": 89376, "epoch": 532} {"train_loss": -9.627245903015137, "global_step": 89377, "epoch": 532} {"train_loss": -9.531259536743164, "global_step": 89378, "epoch": 532} {"train_loss": -9.696551322937012, "global_step": 89379, "epoch": 532} {"train_loss": -9.57522201538086, "global_step": 89380, "epoch": 532} {"train_loss": -9.372511863708496, "global_step": 89381, "epoch": 532} {"train_loss": -9.502752304077148, "global_step": 89382, "epoch": 532} {"train_loss": -9.651759147644043, "global_step": 89383, "epoch": 532} {"train_loss": -9.44792366027832, "global_step": 89384, "epoch": 532} {"train_loss": -9.512245178222656, "global_step": 89385, "epoch": 532} {"train_loss": -9.488986015319824, "global_step": 89386, "epoch": 532} {"train_loss": -9.65395736694336, "global_step": 89387, "epoch": 532} {"train_loss": -9.486827850341797, "global_step": 89388, "epoch": 532} {"train_loss": -9.372625350952148, "global_step": 89389, "epoch": 532} {"train_loss": -9.55872917175293, "global_step": 89390, "epoch": 532} {"train_loss": -9.638296127319336, "global_step": 89391, "epoch": 532} {"train_loss": -9.586771965026855, "global_step": 89392, "epoch": 532} {"train_loss": -9.467156410217285, "global_step": 89393, "epoch": 532} {"train_loss": -9.51022720336914, "global_step": 89394, "epoch": 532} {"train_loss": -9.560991287231445, "global_step": 89395, "epoch": 532} {"train_loss": -9.162928581237793, "global_step": 89396, "epoch": 532} {"train_loss": -9.645572662353516, "global_step": 89397, "epoch": 532} {"train_loss": -9.391037940979004, "global_step": 89398, "epoch": 532} {"train_loss": -9.479174613952637, "global_step": 89399, "epoch": 532} {"train_loss": -9.48559856414795, "global_step": 89400, "epoch": 532} {"train_loss": -9.360546112060547, "global_step": 89401, "epoch": 532} {"train_loss": -9.44521713256836, "global_step": 89402, "epoch": 532} {"train_loss": -9.58890438079834, "global_step": 89403, "epoch": 532} {"train_loss": -8.996841430664062, "global_step": 89404, "epoch": 532} {"train_loss": -9.457199096679688, "global_step": 89405, "epoch": 532} {"train_loss": -9.41270637512207, "global_step": 89406, "epoch": 532} {"train_loss": -8.932101249694824, "global_step": 89407, "epoch": 532} {"train_loss": -9.573025703430176, "global_step": 89408, "epoch": 532} {"train_loss": -8.817645072937012, "global_step": 89409, "epoch": 532} {"train_loss": -9.313947677612305, "global_step": 89410, "epoch": 532} {"train_loss": -8.729472160339355, "global_step": 89411, "epoch": 532} {"train_loss": -9.420612335205078, "global_step": 89412, "epoch": 532} {"train_loss": -8.79133129119873, "global_step": 89413, "epoch": 532} {"train_loss": -8.967390060424805, "global_step": 89414, "epoch": 532} {"train_loss": -9.12615966796875, "global_step": 89415, "epoch": 532} {"train_loss": -9.121713638305664, "global_step": 89416, "epoch": 532} {"train_loss": -9.024182319641113, "global_step": 89417, "epoch": 532} {"train_loss": -9.357654571533203, "global_step": 89418, "epoch": 532} {"train_loss": -9.537978172302246, "global_step": 89419, "epoch": 532} {"train_loss": -9.244935035705566, "global_step": 89420, "epoch": 532} {"train_loss": -9.088031768798828, "global_step": 89421, "epoch": 532} {"train_loss": -9.400835037231445, "global_step": 89422, "epoch": 532} {"train_loss": -9.239641189575195, "global_step": 89423, "epoch": 532} {"train_loss": -9.252405166625977, "global_step": 89424, "epoch": 532} {"train_loss": -9.309690475463867, "global_step": 89425, "epoch": 532} {"train_loss": -9.504955291748047, "global_step": 89426, "epoch": 532} {"train_loss": -9.250097274780273, "global_step": 89427, "epoch": 532} {"train_loss": -9.499141693115234, "global_step": 89428, "epoch": 532} {"train_loss": -9.648761749267578, "global_step": 89429, "epoch": 532} {"train_loss": -9.511741638183594, "global_step": 89430, "epoch": 532} {"train_loss": -9.369375228881836, "global_step": 89431, "epoch": 532} {"train_loss": -9.43891429901123, "global_step": 89432, "epoch": 532} {"train_loss": -9.473137855529785, "global_step": 89433, "epoch": 532} {"train_loss": -9.527515411376953, "global_step": 89434, "epoch": 532} {"train_loss": -9.71113395690918, "global_step": 89435, "epoch": 532} {"train_loss": -9.552316665649414, "global_step": 89436, "epoch": 532} {"train_loss": -9.503083229064941, "global_step": 89437, "epoch": 532} {"train_loss": -9.482173919677734, "global_step": 89438, "epoch": 532} {"train_loss": -9.631086349487305, "global_step": 89439, "epoch": 532} {"train_loss": -9.498289108276367, "global_step": 89440, "epoch": 532} {"train_loss": -9.465485572814941, "global_step": 89441, "epoch": 532} {"train_loss": -9.858512878417969, "global_step": 89442, "epoch": 532} {"train_loss": -9.550028800964355, "global_step": 89443, "epoch": 532} {"train_loss": -9.723930358886719, "global_step": 89444, "epoch": 532} {"train_loss": -9.422030448913574, "global_step": 89445, "epoch": 532} {"train_loss": -9.537485122680664, "global_step": 89446, "epoch": 532} {"train_loss": -9.551551818847656, "global_step": 89447, "epoch": 532} {"train_loss": -9.799400329589844, "global_step": 89448, "epoch": 532} {"train_loss": -9.56749153137207, "global_step": 89449, "epoch": 532} {"train_loss": -9.573755264282227, "global_step": 89450, "epoch": 532} {"train_loss": -9.615564346313477, "global_step": 89451, "epoch": 532} {"train_loss": -9.792635917663574, "global_step": 89452, "epoch": 532} {"train_loss": -9.697134017944336, "global_step": 89453, "epoch": 532} {"train_loss": -9.488344192504883, "global_step": 89454, "epoch": 532} {"train_loss": -9.760242462158203, "global_step": 89455, "epoch": 532} {"train_loss": -9.711241722106934, "global_step": 89456, "epoch": 532} {"train_loss": -9.740459442138672, "global_step": 89457, "epoch": 532} {"train_loss": -9.845915794372559, "global_step": 89458, "epoch": 532} {"train_loss": -9.815484046936035, "global_step": 89459, "epoch": 532} {"train_loss": -9.482736587524414, "global_step": 89460, "epoch": 532} {"train_loss": -9.531635284423828, "global_step": 89461, "epoch": 532} {"train_loss": -9.494293212890625, "global_step": 89462, "epoch": 532} {"train_loss": -9.3270845413208, "global_step": 89463, "epoch": 532} {"train_loss": -9.394732475280762, "global_step": 89464, "epoch": 532} {"train_loss": -9.432003021240234, "global_step": 89465, "epoch": 532} {"train_loss": -9.491853713989258, "global_step": 89466, "epoch": 532} {"train_loss": -9.388448715209961, "global_step": 89467, "epoch": 532} {"train_loss": -9.232797622680664, "global_step": 89468, "epoch": 532} {"train_loss": -9.272239685058594, "global_step": 89469, "epoch": 532} {"train_loss": -9.405333518981934, "global_step": 89470, "epoch": 532} {"train_loss": -9.172447204589844, "global_step": 89471, "epoch": 532} {"train_loss": -9.268158912658691, "global_step": 89472, "epoch": 532} {"train_loss": -9.156597137451172, "global_step": 89473, "epoch": 532} {"train_loss": -9.305736541748047, "global_step": 89474, "epoch": 532} {"train_loss": -9.57693862915039, "global_step": 89475, "epoch": 532} {"train_loss": -9.108646392822266, "global_step": 89476, "epoch": 532} {"train_loss": -9.699151992797852, "global_step": 89477, "epoch": 532} {"train_loss": -9.292793273925781, "global_step": 89478, "epoch": 532} {"train_loss": -9.123499870300293, "global_step": 89479, "epoch": 532} {"train_loss": -9.140278816223145, "global_step": 89480, "epoch": 532} {"train_loss": -9.394063949584961, "global_step": 89481, "epoch": 532} {"train_loss": -8.852218627929688, "global_step": 89482, "epoch": 532} {"train_loss": -9.336484909057617, "global_step": 89483, "epoch": 532} {"train_loss": -9.039081573486328, "global_step": 89484, "epoch": 532} {"train_loss": -9.329460144042969, "global_step": 89485, "epoch": 532} {"train_loss": -9.252997398376465, "global_step": 89486, "epoch": 532} {"train_loss": -9.179539680480957, "global_step": 89487, "epoch": 532} {"train_loss": -9.293257713317871, "global_step": 89488, "epoch": 532} {"train_loss": -9.303461074829102, "global_step": 89489, "epoch": 532} {"train_loss": -9.242376327514648, "global_step": 89490, "epoch": 532} {"train_loss": -9.1572847366333, "global_step": 89491, "epoch": 532} {"train_loss": -9.363611221313477, "global_step": 89492, "epoch": 532} {"train_loss": -9.3179931640625, "global_step": 89493, "epoch": 532} {"train_loss": -9.212077140808105, "global_step": 89494, "epoch": 532} {"train_loss": -9.340716361999512, "global_step": 89495, "epoch": 532} {"train_loss": -9.335161209106445, "global_step": 89496, "epoch": 532} {"train_loss": -9.43271255493164, "global_step": 89497, "epoch": 532} {"train_loss": -9.452692031860352, "global_step": 89498, "epoch": 532} {"train_loss": -9.250088691711426, "global_step": 89499, "epoch": 532} {"train_loss": -9.35081672668457, "global_step": 89500, "epoch": 532} {"train_loss": -9.50908374786377, "global_step": 89501, "epoch": 532} {"train_loss": -9.318802833557129, "global_step": 89502, "epoch": 532} {"train_loss": -9.730951309204102, "global_step": 89503, "epoch": 532} {"train_loss": -9.463922500610352, "global_step": 89504, "epoch": 532} {"train_loss": -9.546599388122559, "global_step": 89505, "epoch": 532} {"train_loss": -9.156627655029297, "global_step": 89506, "epoch": 532} {"train_loss": -9.599752426147461, "global_step": 89507, "epoch": 532} {"train_loss": -9.248785018920898, "global_step": 89508, "epoch": 532} {"train_loss": -9.50881576538086, "global_step": 89509, "epoch": 532} {"train_loss": -9.128357887268066, "global_step": 89510, "epoch": 532} {"train_loss": -9.399444580078125, "global_step": 89511, "epoch": 532} {"train_loss": -9.207477569580078, "global_step": 89512, "epoch": 532} {"train_loss": -9.20021915435791, "global_step": 89513, "epoch": 532} {"train_loss": -9.133689880371094, "global_step": 89514, "epoch": 532} {"train_loss": -9.355256080627441, "global_step": 89515, "epoch": 532} {"train_loss": -9.284689903259277, "global_step": 89516, "epoch": 532} {"train_loss": -9.094684600830078, "global_step": 89517, "epoch": 532} {"train_loss": -9.302801132202148, "global_step": 89518, "epoch": 532} {"train_loss": -9.306184768676758, "global_step": 89519, "epoch": 532} {"train_loss": -9.27674674987793, "global_step": 89520, "epoch": 532} {"train_loss": -9.406596183776855, "global_step": 89521, "epoch": 532} {"train_loss": -9.178238868713379, "global_step": 89522, "epoch": 532} {"train_loss": -9.255714416503906, "global_step": 89523, "epoch": 532} {"train_loss": -9.443334579467773, "global_step": 89524, "epoch": 532} {"train_loss": -8.915397644042969, "global_step": 89525, "epoch": 532} {"train_loss": -9.336090087890625, "global_step": 89526, "epoch": 532} {"train_loss": -9.178682327270508, "global_step": 89527, "epoch": 532} {"train_loss": -9.359930992126465, "global_step": 89528, "epoch": 532} {"train_loss": -9.377348899841309, "global_step": 89529, "epoch": 532} {"train_loss": -9.545110702514648, "global_step": 89530, "epoch": 532} {"train_loss": -9.452400207519531, "global_step": 89531, "epoch": 532} {"train_loss": -9.361370086669922, "global_step": 89532, "epoch": 532} {"train_loss": -9.291276931762695, "global_step": 89533, "epoch": 532} {"train_loss": -9.147150039672852, "global_step": 89534, "epoch": 532} {"train_loss": -9.064840316772461, "global_step": 89535, "epoch": 532} {"train_loss": -9.215259552001953, "global_step": 89536, "epoch": 532} {"train_loss": -9.144745826721191, "global_step": 89537, "epoch": 532} {"train_loss": -9.189422607421875, "global_step": 89538, "epoch": 532} {"train_loss": -9.31620979309082, "global_step": 89539, "epoch": 532} {"train_loss": -9.242680549621582, "global_step": 89540, "epoch": 532} {"train_loss": -9.51215934753418, "global_step": 89541, "epoch": 532} {"train_loss": -9.269309997558594, "global_step": 89542, "epoch": 532} {"train_loss": -9.383822435424442, "global_step": 89543, "epoch": 532, "val_loss": 204603.484375} {"train_loss": -9.292425155639648, "global_step": 89544, "epoch": 533} {"train_loss": -9.367776870727539, "global_step": 89545, "epoch": 533} {"train_loss": -9.383861541748047, "global_step": 89546, "epoch": 533} {"train_loss": -9.251947402954102, "global_step": 89547, "epoch": 533} {"train_loss": -9.307571411132812, "global_step": 89548, "epoch": 533} {"train_loss": -9.377656936645508, "global_step": 89549, "epoch": 533} {"train_loss": -9.226922988891602, "global_step": 89550, "epoch": 533} {"train_loss": -9.331974029541016, "global_step": 89551, "epoch": 533} {"train_loss": -9.719401359558105, "global_step": 89552, "epoch": 533} {"train_loss": -9.512103080749512, "global_step": 89553, "epoch": 533} {"train_loss": -9.566177368164062, "global_step": 89554, "epoch": 533} {"train_loss": -9.322137832641602, "global_step": 89555, "epoch": 533} {"train_loss": -9.598756790161133, "global_step": 89556, "epoch": 533} {"train_loss": -9.619857788085938, "global_step": 89557, "epoch": 533} {"train_loss": -9.499942779541016, "global_step": 89558, "epoch": 533} {"train_loss": -9.72205924987793, "global_step": 89559, "epoch": 533} {"train_loss": -9.342884063720703, "global_step": 89560, "epoch": 533} {"train_loss": -9.685802459716797, "global_step": 89561, "epoch": 533} {"train_loss": -9.495110511779785, "global_step": 89562, "epoch": 533} {"train_loss": -9.323860168457031, "global_step": 89563, "epoch": 533} {"train_loss": -9.482168197631836, "global_step": 89564, "epoch": 533} {"train_loss": -9.67370319366455, "global_step": 89565, "epoch": 533} {"train_loss": -9.67003059387207, "global_step": 89566, "epoch": 533} {"train_loss": -9.559704780578613, "global_step": 89567, "epoch": 533} {"train_loss": -9.334463119506836, "global_step": 89568, "epoch": 533} {"train_loss": -9.539641380310059, "global_step": 89569, "epoch": 533} {"train_loss": -9.49813461303711, "global_step": 89570, "epoch": 533} {"train_loss": -9.1719970703125, "global_step": 89571, "epoch": 533} {"train_loss": -9.295257568359375, "global_step": 89572, "epoch": 533} {"train_loss": -9.777403831481934, "global_step": 89573, "epoch": 533} {"train_loss": -9.449357032775879, "global_step": 89574, "epoch": 533} {"train_loss": -9.461187362670898, "global_step": 89575, "epoch": 533} {"train_loss": -9.53333568572998, "global_step": 89576, "epoch": 533} {"train_loss": -9.498125076293945, "global_step": 89577, "epoch": 533} {"train_loss": -9.506836891174316, "global_step": 89578, "epoch": 533} {"train_loss": -9.460162162780762, "global_step": 89579, "epoch": 533} {"train_loss": -9.417937278747559, "global_step": 89580, "epoch": 533} {"train_loss": -9.517224311828613, "global_step": 89581, "epoch": 533} {"train_loss": -9.659675598144531, "global_step": 89582, "epoch": 533} {"train_loss": -9.401885986328125, "global_step": 89583, "epoch": 533} {"train_loss": -9.513242721557617, "global_step": 89584, "epoch": 533} {"train_loss": -9.553420066833496, "global_step": 89585, "epoch": 533} {"train_loss": -9.477741241455078, "global_step": 89586, "epoch": 533} {"train_loss": -9.56221866607666, "global_step": 89587, "epoch": 533} {"train_loss": -9.590084075927734, "global_step": 89588, "epoch": 533} {"train_loss": -9.40463638305664, "global_step": 89589, "epoch": 533} {"train_loss": -9.505813598632812, "global_step": 89590, "epoch": 533} {"train_loss": -9.306270599365234, "global_step": 89591, "epoch": 533} {"train_loss": -9.797826766967773, "global_step": 89592, "epoch": 533} {"train_loss": -9.667683601379395, "global_step": 89593, "epoch": 533} {"train_loss": -9.538931846618652, "global_step": 89594, "epoch": 533} {"train_loss": -9.453897476196289, "global_step": 89595, "epoch": 533} {"train_loss": -9.77953815460205, "global_step": 89596, "epoch": 533} {"train_loss": -9.576481819152832, "global_step": 89597, "epoch": 533} {"train_loss": -9.762842178344727, "global_step": 89598, "epoch": 533} {"train_loss": -9.43169116973877, "global_step": 89599, "epoch": 533} {"train_loss": -9.624715805053711, "global_step": 89600, "epoch": 533} {"train_loss": -9.714936256408691, "global_step": 89601, "epoch": 533} {"train_loss": -9.56905746459961, "global_step": 89602, "epoch": 533} {"train_loss": -9.1071195602417, "global_step": 89603, "epoch": 533} {"train_loss": -9.226953506469727, "global_step": 89604, "epoch": 533} {"train_loss": -9.546555519104004, "global_step": 89605, "epoch": 533} {"train_loss": -9.364301681518555, "global_step": 89606, "epoch": 533} {"train_loss": -9.368856430053711, "global_step": 89607, "epoch": 533} {"train_loss": -9.462536811828613, "global_step": 89608, "epoch": 533} {"train_loss": -9.451298713684082, "global_step": 89609, "epoch": 533} {"train_loss": -9.610584259033203, "global_step": 89610, "epoch": 533} {"train_loss": -9.292661666870117, "global_step": 89611, "epoch": 533} {"train_loss": -9.241929054260254, "global_step": 89612, "epoch": 533} {"train_loss": -9.440071105957031, "global_step": 89613, "epoch": 533} {"train_loss": -9.603352546691895, "global_step": 89614, "epoch": 533} {"train_loss": -9.55774974822998, "global_step": 89615, "epoch": 533} {"train_loss": -9.586036682128906, "global_step": 89616, "epoch": 533} {"train_loss": -9.42849349975586, "global_step": 89617, "epoch": 533} {"train_loss": -9.421806335449219, "global_step": 89618, "epoch": 533} {"train_loss": -9.628301620483398, "global_step": 89619, "epoch": 533} {"train_loss": -9.47238540649414, "global_step": 89620, "epoch": 533} {"train_loss": -9.348837852478027, "global_step": 89621, "epoch": 533} {"train_loss": -9.505475997924805, "global_step": 89622, "epoch": 533} {"train_loss": -9.338081359863281, "global_step": 89623, "epoch": 533} {"train_loss": -9.587860107421875, "global_step": 89624, "epoch": 533} {"train_loss": -9.577596664428711, "global_step": 89625, "epoch": 533} {"train_loss": -9.230571746826172, "global_step": 89626, "epoch": 533} {"train_loss": -9.433478355407715, "global_step": 89627, "epoch": 533} {"train_loss": -9.300161361694336, "global_step": 89628, "epoch": 533} {"train_loss": -9.288406372070312, "global_step": 89629, "epoch": 533} {"train_loss": -9.704647064208984, "global_step": 89630, "epoch": 533} {"train_loss": -9.421516418457031, "global_step": 89631, "epoch": 533} {"train_loss": -9.544584274291992, "global_step": 89632, "epoch": 533} {"train_loss": -9.288476943969727, "global_step": 89633, "epoch": 533} {"train_loss": -8.95594310760498, "global_step": 89634, "epoch": 533} {"train_loss": -9.749813079833984, "global_step": 89635, "epoch": 533} {"train_loss": -9.002967834472656, "global_step": 89636, "epoch": 533} {"train_loss": -9.343528747558594, "global_step": 89637, "epoch": 533} {"train_loss": -9.258537292480469, "global_step": 89638, "epoch": 533} {"train_loss": -9.221811294555664, "global_step": 89639, "epoch": 533} {"train_loss": -9.053333282470703, "global_step": 89640, "epoch": 533} {"train_loss": -9.275839805603027, "global_step": 89641, "epoch": 533} {"train_loss": -9.2298583984375, "global_step": 89642, "epoch": 533} {"train_loss": -9.369295120239258, "global_step": 89643, "epoch": 533} {"train_loss": -9.420559883117676, "global_step": 89644, "epoch": 533} {"train_loss": -8.93934154510498, "global_step": 89645, "epoch": 533} {"train_loss": -9.164137840270996, "global_step": 89646, "epoch": 533} {"train_loss": -9.044260025024414, "global_step": 89647, "epoch": 533} {"train_loss": -9.081830978393555, "global_step": 89648, "epoch": 533} {"train_loss": -9.179574012756348, "global_step": 89649, "epoch": 533} {"train_loss": -9.52593994140625, "global_step": 89650, "epoch": 533} {"train_loss": -9.053438186645508, "global_step": 89651, "epoch": 533} {"train_loss": -9.36717414855957, "global_step": 89652, "epoch": 533} {"train_loss": -9.460968017578125, "global_step": 89653, "epoch": 533} {"train_loss": -9.55092716217041, "global_step": 89654, "epoch": 533} {"train_loss": -9.145254135131836, "global_step": 89655, "epoch": 533} {"train_loss": -9.461526870727539, "global_step": 89656, "epoch": 533} {"train_loss": -9.33175277709961, "global_step": 89657, "epoch": 533} {"train_loss": -9.20252799987793, "global_step": 89658, "epoch": 533} {"train_loss": -9.316650390625, "global_step": 89659, "epoch": 533} {"train_loss": -9.434122085571289, "global_step": 89660, "epoch": 533} {"train_loss": -9.526830673217773, "global_step": 89661, "epoch": 533} {"train_loss": -9.177978515625, "global_step": 89662, "epoch": 533} {"train_loss": -9.580180168151855, "global_step": 89663, "epoch": 533} {"train_loss": -9.309446334838867, "global_step": 89664, "epoch": 533} {"train_loss": -9.510644912719727, "global_step": 89665, "epoch": 533} {"train_loss": -9.179815292358398, "global_step": 89666, "epoch": 533} {"train_loss": -9.35579776763916, "global_step": 89667, "epoch": 533} {"train_loss": -9.264382362365723, "global_step": 89668, "epoch": 533} {"train_loss": -9.196213722229004, "global_step": 89669, "epoch": 533} {"train_loss": -9.273219108581543, "global_step": 89670, "epoch": 533} {"train_loss": -9.383209228515625, "global_step": 89671, "epoch": 533} {"train_loss": -9.257978439331055, "global_step": 89672, "epoch": 533} {"train_loss": -9.428199768066406, "global_step": 89673, "epoch": 533} {"train_loss": -9.317521095275879, "global_step": 89674, "epoch": 533} {"train_loss": -9.249946594238281, "global_step": 89675, "epoch": 533} {"train_loss": -9.63345718383789, "global_step": 89676, "epoch": 533} {"train_loss": -9.136199951171875, "global_step": 89677, "epoch": 533} {"train_loss": -9.15052604675293, "global_step": 89678, "epoch": 533} {"train_loss": -9.2955322265625, "global_step": 89679, "epoch": 533} {"train_loss": -9.381622314453125, "global_step": 89680, "epoch": 533} {"train_loss": -9.057693481445312, "global_step": 89681, "epoch": 533} {"train_loss": -9.02381706237793, "global_step": 89682, "epoch": 533} {"train_loss": -9.025880813598633, "global_step": 89683, "epoch": 533} {"train_loss": -9.424074172973633, "global_step": 89684, "epoch": 533} {"train_loss": -9.192405700683594, "global_step": 89685, "epoch": 533} {"train_loss": -9.132577896118164, "global_step": 89686, "epoch": 533} {"train_loss": -9.270331382751465, "global_step": 89687, "epoch": 533} {"train_loss": -8.891751289367676, "global_step": 89688, "epoch": 533} {"train_loss": -9.320943832397461, "global_step": 89689, "epoch": 533} {"train_loss": -9.137052536010742, "global_step": 89690, "epoch": 533} {"train_loss": -9.408393859863281, "global_step": 89691, "epoch": 533} {"train_loss": -9.214799880981445, "global_step": 89692, "epoch": 533} {"train_loss": -9.532697677612305, "global_step": 89693, "epoch": 533} {"train_loss": -9.65835952758789, "global_step": 89694, "epoch": 533} {"train_loss": -9.566377639770508, "global_step": 89695, "epoch": 533} {"train_loss": -9.304811477661133, "global_step": 89696, "epoch": 533} {"train_loss": -9.553766250610352, "global_step": 89697, "epoch": 533} {"train_loss": -9.48739242553711, "global_step": 89698, "epoch": 533} {"train_loss": -9.458589553833008, "global_step": 89699, "epoch": 533} {"train_loss": -9.645343780517578, "global_step": 89700, "epoch": 533} {"train_loss": -9.663509368896484, "global_step": 89701, "epoch": 533} {"train_loss": -9.645047187805176, "global_step": 89702, "epoch": 533} {"train_loss": -9.62923526763916, "global_step": 89703, "epoch": 533} {"train_loss": -9.501639366149902, "global_step": 89704, "epoch": 533} {"train_loss": -9.541779518127441, "global_step": 89705, "epoch": 533} {"train_loss": -9.455255508422852, "global_step": 89706, "epoch": 533} {"train_loss": -9.427309036254883, "global_step": 89707, "epoch": 533} {"train_loss": -9.412063598632812, "global_step": 89708, "epoch": 533} {"train_loss": -9.43233871459961, "global_step": 89709, "epoch": 533} {"train_loss": -9.378776550292969, "global_step": 89710, "epoch": 533} {"train_loss": -9.407723301932926, "global_step": 89711, "epoch": 533, "val_loss": 202787.46875} {"train_loss": -9.311273574829102, "global_step": 89712, "epoch": 534} {"train_loss": -9.599328994750977, "global_step": 89713, "epoch": 534} {"train_loss": -8.972002029418945, "global_step": 89714, "epoch": 534} {"train_loss": -9.414430618286133, "global_step": 89715, "epoch": 534} {"train_loss": -9.267470359802246, "global_step": 89716, "epoch": 534} {"train_loss": -9.026578903198242, "global_step": 89717, "epoch": 534} {"train_loss": -8.988917350769043, "global_step": 89718, "epoch": 534} {"train_loss": -9.014552116394043, "global_step": 89719, "epoch": 534} {"train_loss": -8.740636825561523, "global_step": 89720, "epoch": 534} {"train_loss": -9.084091186523438, "global_step": 89721, "epoch": 534} {"train_loss": -8.981742858886719, "global_step": 89722, "epoch": 534} {"train_loss": -8.564048767089844, "global_step": 89723, "epoch": 534} {"train_loss": -8.655052185058594, "global_step": 89724, "epoch": 534} {"train_loss": -8.760072708129883, "global_step": 89725, "epoch": 534} {"train_loss": -9.022821426391602, "global_step": 89726, "epoch": 534} {"train_loss": -8.988119125366211, "global_step": 89727, "epoch": 534} {"train_loss": -8.888357162475586, "global_step": 89728, "epoch": 534} {"train_loss": -9.23777961730957, "global_step": 89729, "epoch": 534} {"train_loss": -9.164587020874023, "global_step": 89730, "epoch": 534} {"train_loss": -9.203458786010742, "global_step": 89731, "epoch": 534} {"train_loss": -9.194671630859375, "global_step": 89732, "epoch": 534} {"train_loss": -9.35683536529541, "global_step": 89733, "epoch": 534} {"train_loss": -9.036458015441895, "global_step": 89734, "epoch": 534} {"train_loss": -9.295713424682617, "global_step": 89735, "epoch": 534} {"train_loss": -9.269776344299316, "global_step": 89736, "epoch": 534} {"train_loss": -9.307016372680664, "global_step": 89737, "epoch": 534} {"train_loss": -9.399822235107422, "global_step": 89738, "epoch": 534} {"train_loss": -9.426681518554688, "global_step": 89739, "epoch": 534} {"train_loss": -9.378995895385742, "global_step": 89740, "epoch": 534} {"train_loss": -9.377786636352539, "global_step": 89741, "epoch": 534} {"train_loss": -9.548369407653809, "global_step": 89742, "epoch": 534} {"train_loss": -9.389154434204102, "global_step": 89743, "epoch": 534} {"train_loss": -9.666184425354004, "global_step": 89744, "epoch": 534} {"train_loss": -9.59556770324707, "global_step": 89745, "epoch": 534} {"train_loss": -9.51145076751709, "global_step": 89746, "epoch": 534} {"train_loss": -9.353593826293945, "global_step": 89747, "epoch": 534} {"train_loss": -9.522253036499023, "global_step": 89748, "epoch": 534} {"train_loss": -9.639554977416992, "global_step": 89749, "epoch": 534} {"train_loss": -9.729635238647461, "global_step": 89750, "epoch": 534} {"train_loss": -9.822210311889648, "global_step": 89751, "epoch": 534} {"train_loss": -9.607725143432617, "global_step": 89752, "epoch": 534} {"train_loss": -9.532573699951172, "global_step": 89753, "epoch": 534} {"train_loss": -9.40165901184082, "global_step": 89754, "epoch": 534} {"train_loss": -9.5260591506958, "global_step": 89755, "epoch": 534} {"train_loss": -9.403751373291016, "global_step": 89756, "epoch": 534} {"train_loss": -8.954856872558594, "global_step": 89757, "epoch": 534} {"train_loss": -9.40760326385498, "global_step": 89758, "epoch": 534} {"train_loss": -9.290618896484375, "global_step": 89759, "epoch": 534} {"train_loss": -9.108388900756836, "global_step": 89760, "epoch": 534} {"train_loss": -9.262943267822266, "global_step": 89761, "epoch": 534} {"train_loss": -9.291492462158203, "global_step": 89762, "epoch": 534} {"train_loss": -9.288800239562988, "global_step": 89763, "epoch": 534} {"train_loss": -9.426225662231445, "global_step": 89764, "epoch": 534} {"train_loss": -9.005237579345703, "global_step": 89765, "epoch": 534} {"train_loss": -9.57776927947998, "global_step": 89766, "epoch": 534} {"train_loss": -9.514058113098145, "global_step": 89767, "epoch": 534} {"train_loss": -9.358587265014648, "global_step": 89768, "epoch": 534} {"train_loss": -9.237075805664062, "global_step": 89769, "epoch": 534} {"train_loss": -9.295565605163574, "global_step": 89770, "epoch": 534} {"train_loss": -9.325882911682129, "global_step": 89771, "epoch": 534} {"train_loss": -9.182531356811523, "global_step": 89772, "epoch": 534} {"train_loss": -9.471951484680176, "global_step": 89773, "epoch": 534} {"train_loss": -9.27775764465332, "global_step": 89774, "epoch": 534} {"train_loss": -9.325571060180664, "global_step": 89775, "epoch": 534} {"train_loss": -8.947376251220703, "global_step": 89776, "epoch": 534} {"train_loss": -9.239462852478027, "global_step": 89777, "epoch": 534} {"train_loss": -9.09190559387207, "global_step": 89778, "epoch": 534} {"train_loss": -9.704785346984863, "global_step": 89779, "epoch": 534} {"train_loss": -9.357118606567383, "global_step": 89780, "epoch": 534} {"train_loss": -9.544227600097656, "global_step": 89781, "epoch": 534} {"train_loss": -9.286579132080078, "global_step": 89782, "epoch": 534} {"train_loss": -9.378507614135742, "global_step": 89783, "epoch": 534} {"train_loss": -9.39288330078125, "global_step": 89784, "epoch": 534} {"train_loss": -9.383037567138672, "global_step": 89785, "epoch": 534} {"train_loss": -9.419899940490723, "global_step": 89786, "epoch": 534} {"train_loss": -9.412348747253418, "global_step": 89787, "epoch": 534} {"train_loss": -9.479604721069336, "global_step": 89788, "epoch": 534} {"train_loss": -9.47547721862793, "global_step": 89789, "epoch": 534} {"train_loss": -9.155975341796875, "global_step": 89790, "epoch": 534} {"train_loss": -9.407483100891113, "global_step": 89791, "epoch": 534} {"train_loss": -8.884666442871094, "global_step": 89792, "epoch": 534} {"train_loss": -9.347527503967285, "global_step": 89793, "epoch": 534} {"train_loss": -9.281761169433594, "global_step": 89794, "epoch": 534} {"train_loss": -9.364046096801758, "global_step": 89795, "epoch": 534} {"train_loss": -9.160232543945312, "global_step": 89796, "epoch": 534} {"train_loss": -9.077495574951172, "global_step": 89797, "epoch": 534} {"train_loss": -9.499171257019043, "global_step": 89798, "epoch": 534} {"train_loss": -9.19460391998291, "global_step": 89799, "epoch": 534} {"train_loss": -9.180076599121094, "global_step": 89800, "epoch": 534} {"train_loss": -9.466775894165039, "global_step": 89801, "epoch": 534} {"train_loss": -9.55034065246582, "global_step": 89802, "epoch": 534} {"train_loss": -9.220151901245117, "global_step": 89803, "epoch": 534} {"train_loss": -9.285604476928711, "global_step": 89804, "epoch": 534} {"train_loss": -9.521299362182617, "global_step": 89805, "epoch": 534} {"train_loss": -9.62014389038086, "global_step": 89806, "epoch": 534} {"train_loss": -9.62141227722168, "global_step": 89807, "epoch": 534} {"train_loss": -9.69072437286377, "global_step": 89808, "epoch": 534} {"train_loss": -9.549349784851074, "global_step": 89809, "epoch": 534} {"train_loss": -9.516292572021484, "global_step": 89810, "epoch": 534} {"train_loss": -9.202736854553223, "global_step": 89811, "epoch": 534} {"train_loss": -9.590816497802734, "global_step": 89812, "epoch": 534} {"train_loss": -9.560900688171387, "global_step": 89813, "epoch": 534} {"train_loss": -9.420245170593262, "global_step": 89814, "epoch": 534} {"train_loss": -9.396415710449219, "global_step": 89815, "epoch": 534} {"train_loss": -9.287243843078613, "global_step": 89816, "epoch": 534} {"train_loss": -9.355731964111328, "global_step": 89817, "epoch": 534} {"train_loss": -9.231340408325195, "global_step": 89818, "epoch": 534} {"train_loss": -9.396628379821777, "global_step": 89819, "epoch": 534} {"train_loss": -8.972709655761719, "global_step": 89820, "epoch": 534} {"train_loss": -9.378877639770508, "global_step": 89821, "epoch": 534} {"train_loss": -9.19998550415039, "global_step": 89822, "epoch": 534} {"train_loss": -9.39512825012207, "global_step": 89823, "epoch": 534} {"train_loss": -9.32706069946289, "global_step": 89824, "epoch": 534} {"train_loss": -9.03520393371582, "global_step": 89825, "epoch": 534} {"train_loss": -9.461124420166016, "global_step": 89826, "epoch": 534} {"train_loss": -9.24359130859375, "global_step": 89827, "epoch": 534} {"train_loss": -9.2166166305542, "global_step": 89828, "epoch": 534} {"train_loss": -9.375308990478516, "global_step": 89829, "epoch": 534} {"train_loss": -9.208091735839844, "global_step": 89830, "epoch": 534} {"train_loss": -8.982148170471191, "global_step": 89831, "epoch": 534} {"train_loss": -9.682470321655273, "global_step": 89832, "epoch": 534} {"train_loss": -9.246070861816406, "global_step": 89833, "epoch": 534} {"train_loss": -9.27871322631836, "global_step": 89834, "epoch": 534} {"train_loss": -9.56562328338623, "global_step": 89835, "epoch": 534} {"train_loss": -9.548242568969727, "global_step": 89836, "epoch": 534} {"train_loss": -9.249027252197266, "global_step": 89837, "epoch": 534} {"train_loss": -9.820438385009766, "global_step": 89838, "epoch": 534} {"train_loss": -9.253393173217773, "global_step": 89839, "epoch": 534} {"train_loss": -9.65096664428711, "global_step": 89840, "epoch": 534} {"train_loss": -9.344966888427734, "global_step": 89841, "epoch": 534} {"train_loss": -9.694818496704102, "global_step": 89842, "epoch": 534} {"train_loss": -9.524335861206055, "global_step": 89843, "epoch": 534} {"train_loss": -9.7447509765625, "global_step": 89844, "epoch": 534} {"train_loss": -9.370733261108398, "global_step": 89845, "epoch": 534} {"train_loss": -9.809364318847656, "global_step": 89846, "epoch": 534} {"train_loss": -9.580083847045898, "global_step": 89847, "epoch": 534} {"train_loss": -9.39403247833252, "global_step": 89848, "epoch": 534} {"train_loss": -9.282072067260742, "global_step": 89849, "epoch": 534} {"train_loss": -9.587451934814453, "global_step": 89850, "epoch": 534} {"train_loss": -9.471379280090332, "global_step": 89851, "epoch": 534} {"train_loss": -9.726594924926758, "global_step": 89852, "epoch": 534} {"train_loss": -9.257467269897461, "global_step": 89853, "epoch": 534} {"train_loss": -9.700112342834473, "global_step": 89854, "epoch": 534} {"train_loss": -9.582023620605469, "global_step": 89855, "epoch": 534} {"train_loss": -9.33953857421875, "global_step": 89856, "epoch": 534} {"train_loss": -9.603257179260254, "global_step": 89857, "epoch": 534} {"train_loss": -9.579976081848145, "global_step": 89858, "epoch": 534} {"train_loss": -9.398992538452148, "global_step": 89859, "epoch": 534} {"train_loss": -9.206599235534668, "global_step": 89860, "epoch": 534} {"train_loss": -9.227378845214844, "global_step": 89861, "epoch": 534} {"train_loss": -9.707262992858887, "global_step": 89862, "epoch": 534} {"train_loss": -9.451217651367188, "global_step": 89863, "epoch": 534} {"train_loss": -9.304662704467773, "global_step": 89864, "epoch": 534} {"train_loss": -9.585744857788086, "global_step": 89865, "epoch": 534} {"train_loss": -9.29697036743164, "global_step": 89866, "epoch": 534} {"train_loss": -9.325071334838867, "global_step": 89867, "epoch": 534} {"train_loss": -9.48373031616211, "global_step": 89868, "epoch": 534} {"train_loss": -9.365450859069824, "global_step": 89869, "epoch": 534} {"train_loss": -9.46023941040039, "global_step": 89870, "epoch": 534} {"train_loss": -9.260676383972168, "global_step": 89871, "epoch": 534} {"train_loss": -9.116352081298828, "global_step": 89872, "epoch": 534} {"train_loss": -9.194284439086914, "global_step": 89873, "epoch": 534} {"train_loss": -9.051714897155762, "global_step": 89874, "epoch": 534} {"train_loss": -9.183530807495117, "global_step": 89875, "epoch": 534} {"train_loss": -8.995169639587402, "global_step": 89876, "epoch": 534} {"train_loss": -9.014486312866211, "global_step": 89877, "epoch": 534} {"train_loss": -9.218067169189453, "global_step": 89878, "epoch": 534} {"train_loss": -9.335695936566307, "global_step": 89879, "epoch": 534, "val_loss": 200584.34375} {"train_loss": -9.325267791748047, "global_step": 89880, "epoch": 535} {"train_loss": -9.399505615234375, "global_step": 89881, "epoch": 535} {"train_loss": -9.19959831237793, "global_step": 89882, "epoch": 535} {"train_loss": -9.208425521850586, "global_step": 89883, "epoch": 535} {"train_loss": -9.155900955200195, "global_step": 89884, "epoch": 535} {"train_loss": -9.4215087890625, "global_step": 89885, "epoch": 535} {"train_loss": -9.308277130126953, "global_step": 89886, "epoch": 535} {"train_loss": -9.27748966217041, "global_step": 89887, "epoch": 535} {"train_loss": -9.33909797668457, "global_step": 89888, "epoch": 535} {"train_loss": -9.342337608337402, "global_step": 89889, "epoch": 535} {"train_loss": -9.386093139648438, "global_step": 89890, "epoch": 535} {"train_loss": -9.23076057434082, "global_step": 89891, "epoch": 535} {"train_loss": -9.526081085205078, "global_step": 89892, "epoch": 535} {"train_loss": -9.362565994262695, "global_step": 89893, "epoch": 535} {"train_loss": -9.385547637939453, "global_step": 89894, "epoch": 535} {"train_loss": -9.460878372192383, "global_step": 89895, "epoch": 535} {"train_loss": -9.500247955322266, "global_step": 89896, "epoch": 535} {"train_loss": -9.41597843170166, "global_step": 89897, "epoch": 535} {"train_loss": -9.681337356567383, "global_step": 89898, "epoch": 535} {"train_loss": -9.39603328704834, "global_step": 89899, "epoch": 535} {"train_loss": -9.74766731262207, "global_step": 89900, "epoch": 535} {"train_loss": -9.51272201538086, "global_step": 89901, "epoch": 535} {"train_loss": -9.667764663696289, "global_step": 89902, "epoch": 535} {"train_loss": -9.439334869384766, "global_step": 89903, "epoch": 535} {"train_loss": -9.754476547241211, "global_step": 89904, "epoch": 535} {"train_loss": -9.713716506958008, "global_step": 89905, "epoch": 535} {"train_loss": -9.533547401428223, "global_step": 89906, "epoch": 535} {"train_loss": -9.695568084716797, "global_step": 89907, "epoch": 535} {"train_loss": -9.776593208312988, "global_step": 89908, "epoch": 535} {"train_loss": -9.475247383117676, "global_step": 89909, "epoch": 535} {"train_loss": -9.596720695495605, "global_step": 89910, "epoch": 535} {"train_loss": -9.449935913085938, "global_step": 89911, "epoch": 535} {"train_loss": -9.391514778137207, "global_step": 89912, "epoch": 535} {"train_loss": -9.53203010559082, "global_step": 89913, "epoch": 535} {"train_loss": -9.592619895935059, "global_step": 89914, "epoch": 535} {"train_loss": -9.694759368896484, "global_step": 89915, "epoch": 535} {"train_loss": -9.290035247802734, "global_step": 89916, "epoch": 535} {"train_loss": -9.747459411621094, "global_step": 89917, "epoch": 535} {"train_loss": -9.627033233642578, "global_step": 89918, "epoch": 535} {"train_loss": -9.39436149597168, "global_step": 89919, "epoch": 535} {"train_loss": -9.447578430175781, "global_step": 89920, "epoch": 535} {"train_loss": -9.206433296203613, "global_step": 89921, "epoch": 535} {"train_loss": -9.59304428100586, "global_step": 89922, "epoch": 535} {"train_loss": -9.486042022705078, "global_step": 89923, "epoch": 535} {"train_loss": -9.52419376373291, "global_step": 89924, "epoch": 535} {"train_loss": -9.497533798217773, "global_step": 89925, "epoch": 535} {"train_loss": -9.64119815826416, "global_step": 89926, "epoch": 535} {"train_loss": -9.578575134277344, "global_step": 89927, "epoch": 535} {"train_loss": -9.548155784606934, "global_step": 89928, "epoch": 535} {"train_loss": -9.5564546585083, "global_step": 89929, "epoch": 535} {"train_loss": -9.539375305175781, "global_step": 89930, "epoch": 535} {"train_loss": -9.556514739990234, "global_step": 89931, "epoch": 535} {"train_loss": -9.646028518676758, "global_step": 89932, "epoch": 535} {"train_loss": -9.608939170837402, "global_step": 89933, "epoch": 535} {"train_loss": -9.287665367126465, "global_step": 89934, "epoch": 535} {"train_loss": -9.50261116027832, "global_step": 89935, "epoch": 535} {"train_loss": -9.513612747192383, "global_step": 89936, "epoch": 535} {"train_loss": -9.629412651062012, "global_step": 89937, "epoch": 535} {"train_loss": -9.448028564453125, "global_step": 89938, "epoch": 535} {"train_loss": -9.495685577392578, "global_step": 89939, "epoch": 535} {"train_loss": -9.493142127990723, "global_step": 89940, "epoch": 535} {"train_loss": -9.593828201293945, "global_step": 89941, "epoch": 535} {"train_loss": -9.414134979248047, "global_step": 89942, "epoch": 535} {"train_loss": -9.547147750854492, "global_step": 89943, "epoch": 535} {"train_loss": -9.195117950439453, "global_step": 89944, "epoch": 535} {"train_loss": -9.49008560180664, "global_step": 89945, "epoch": 535} {"train_loss": -9.130514144897461, "global_step": 89946, "epoch": 535} {"train_loss": -9.276541709899902, "global_step": 89947, "epoch": 535} {"train_loss": -9.074880599975586, "global_step": 89948, "epoch": 535} {"train_loss": -9.026243209838867, "global_step": 89949, "epoch": 535} {"train_loss": -9.027463912963867, "global_step": 89950, "epoch": 535} {"train_loss": -9.345569610595703, "global_step": 89951, "epoch": 535} {"train_loss": -9.180255889892578, "global_step": 89952, "epoch": 535} {"train_loss": -8.945259094238281, "global_step": 89953, "epoch": 535} {"train_loss": -9.443164825439453, "global_step": 89954, "epoch": 535} {"train_loss": -8.926065444946289, "global_step": 89955, "epoch": 535} {"train_loss": -9.371795654296875, "global_step": 89956, "epoch": 535} {"train_loss": -9.253644943237305, "global_step": 89957, "epoch": 535} {"train_loss": -9.143245697021484, "global_step": 89958, "epoch": 535} {"train_loss": -9.094963073730469, "global_step": 89959, "epoch": 535} {"train_loss": -9.29025936126709, "global_step": 89960, "epoch": 535} {"train_loss": -9.017473220825195, "global_step": 89961, "epoch": 535} {"train_loss": -9.116777420043945, "global_step": 89962, "epoch": 535} {"train_loss": -9.08942699432373, "global_step": 89963, "epoch": 535} {"train_loss": -9.130603790283203, "global_step": 89964, "epoch": 535} {"train_loss": -8.919479370117188, "global_step": 89965, "epoch": 535} {"train_loss": -9.20276927947998, "global_step": 89966, "epoch": 535} {"train_loss": -9.144133567810059, "global_step": 89967, "epoch": 535} {"train_loss": -9.502795219421387, "global_step": 89968, "epoch": 535} {"train_loss": -8.898086547851562, "global_step": 89969, "epoch": 535} {"train_loss": -9.317850112915039, "global_step": 89970, "epoch": 535} {"train_loss": -9.279499053955078, "global_step": 89971, "epoch": 535} {"train_loss": -9.274592399597168, "global_step": 89972, "epoch": 535} {"train_loss": -9.012617111206055, "global_step": 89973, "epoch": 535} {"train_loss": -9.17062759399414, "global_step": 89974, "epoch": 535} {"train_loss": -9.15890121459961, "global_step": 89975, "epoch": 535} {"train_loss": -9.19099235534668, "global_step": 89976, "epoch": 535} {"train_loss": -9.060223579406738, "global_step": 89977, "epoch": 535} {"train_loss": -9.20334243774414, "global_step": 89978, "epoch": 535} {"train_loss": -9.361549377441406, "global_step": 89979, "epoch": 535} {"train_loss": -9.362897872924805, "global_step": 89980, "epoch": 535} {"train_loss": -9.168996810913086, "global_step": 89981, "epoch": 535} {"train_loss": -9.158012390136719, "global_step": 89982, "epoch": 535} {"train_loss": -9.3765869140625, "global_step": 89983, "epoch": 535} {"train_loss": -9.315851211547852, "global_step": 89984, "epoch": 535} {"train_loss": -9.556007385253906, "global_step": 89985, "epoch": 535} {"train_loss": -9.361102104187012, "global_step": 89986, "epoch": 535} {"train_loss": -9.608526229858398, "global_step": 89987, "epoch": 535} {"train_loss": -9.434980392456055, "global_step": 89988, "epoch": 535} {"train_loss": -9.545488357543945, "global_step": 89989, "epoch": 535} {"train_loss": -9.532078742980957, "global_step": 89990, "epoch": 535} {"train_loss": -9.510366439819336, "global_step": 89991, "epoch": 535} {"train_loss": -9.654715538024902, "global_step": 89992, "epoch": 535} {"train_loss": -9.568866729736328, "global_step": 89993, "epoch": 535} {"train_loss": -9.704198837280273, "global_step": 89994, "epoch": 535} {"train_loss": -9.488821029663086, "global_step": 89995, "epoch": 535} {"train_loss": -9.480629920959473, "global_step": 89996, "epoch": 535} {"train_loss": -9.516840934753418, "global_step": 89997, "epoch": 535} {"train_loss": -9.507867813110352, "global_step": 89998, "epoch": 535} {"train_loss": -9.81580924987793, "global_step": 89999, "epoch": 535} {"train_loss": -9.667612075805664, "global_step": 90000, "epoch": 535} {"train_loss": -9.8333101272583, "global_step": 90001, "epoch": 535} {"train_loss": -9.726083755493164, "global_step": 90002, "epoch": 535} {"train_loss": -9.575750350952148, "global_step": 90003, "epoch": 535} {"train_loss": -9.762022018432617, "global_step": 90004, "epoch": 535} {"train_loss": -9.485381126403809, "global_step": 90005, "epoch": 535} {"train_loss": -10.002710342407227, "global_step": 90006, "epoch": 535} {"train_loss": -9.207100868225098, "global_step": 90007, "epoch": 535} {"train_loss": -9.663459777832031, "global_step": 90008, "epoch": 535} {"train_loss": -9.579209327697754, "global_step": 90009, "epoch": 535} {"train_loss": -9.246769905090332, "global_step": 90010, "epoch": 535} {"train_loss": -9.569379806518555, "global_step": 90011, "epoch": 535} {"train_loss": -9.335186958312988, "global_step": 90012, "epoch": 535} {"train_loss": -9.312186241149902, "global_step": 90013, "epoch": 535} {"train_loss": -9.716512680053711, "global_step": 90014, "epoch": 535} {"train_loss": -9.366996765136719, "global_step": 90015, "epoch": 535} {"train_loss": -9.41042709350586, "global_step": 90016, "epoch": 535} {"train_loss": -9.331092834472656, "global_step": 90017, "epoch": 535} {"train_loss": -9.362887382507324, "global_step": 90018, "epoch": 535} {"train_loss": -9.451910972595215, "global_step": 90019, "epoch": 535} {"train_loss": -9.507534980773926, "global_step": 90020, "epoch": 535} {"train_loss": -9.472806930541992, "global_step": 90021, "epoch": 535} {"train_loss": -9.416704177856445, "global_step": 90022, "epoch": 535} {"train_loss": -9.5599365234375, "global_step": 90023, "epoch": 535} {"train_loss": -9.536635398864746, "global_step": 90024, "epoch": 535} {"train_loss": -9.432086944580078, "global_step": 90025, "epoch": 535} {"train_loss": -9.708487510681152, "global_step": 90026, "epoch": 535} {"train_loss": -9.19393539428711, "global_step": 90027, "epoch": 535} {"train_loss": -9.606679916381836, "global_step": 90028, "epoch": 535} {"train_loss": -9.609926223754883, "global_step": 90029, "epoch": 535} {"train_loss": -9.37873363494873, "global_step": 90030, "epoch": 535} {"train_loss": -9.62680435180664, "global_step": 90031, "epoch": 535} {"train_loss": -9.606010437011719, "global_step": 90032, "epoch": 535} {"train_loss": -9.76830005645752, "global_step": 90033, "epoch": 535} {"train_loss": -9.588422775268555, "global_step": 90034, "epoch": 535} {"train_loss": -9.630914688110352, "global_step": 90035, "epoch": 535} {"train_loss": -9.68686580657959, "global_step": 90036, "epoch": 535} {"train_loss": -9.48559284210205, "global_step": 90037, "epoch": 535} {"train_loss": -9.485495567321777, "global_step": 90038, "epoch": 535} {"train_loss": -9.566473007202148, "global_step": 90039, "epoch": 535} {"train_loss": -9.088529586791992, "global_step": 90040, "epoch": 535} {"train_loss": -9.517265319824219, "global_step": 90041, "epoch": 535} {"train_loss": -9.499679565429688, "global_step": 90042, "epoch": 535} {"train_loss": -9.132810592651367, "global_step": 90043, "epoch": 535} {"train_loss": -9.48093032836914, "global_step": 90044, "epoch": 535} {"train_loss": -8.806458473205566, "global_step": 90045, "epoch": 535} {"train_loss": -9.152759552001953, "global_step": 90046, "epoch": 535} {"train_loss": -9.420167094185238, "global_step": 90047, "epoch": 535, "val_loss": 202662.671875, "train_action_mse_error": 5.875053882598877} {"train_loss": -9.207839965820312, "global_step": 90048, "epoch": 536} {"train_loss": -9.21708869934082, "global_step": 90049, "epoch": 536} {"train_loss": -9.05797004699707, "global_step": 90050, "epoch": 536} {"train_loss": -9.339910507202148, "global_step": 90051, "epoch": 536} {"train_loss": -8.833473205566406, "global_step": 90052, "epoch": 536} {"train_loss": -9.271241188049316, "global_step": 90053, "epoch": 536} {"train_loss": -9.442429542541504, "global_step": 90054, "epoch": 536} {"train_loss": -9.129802703857422, "global_step": 90055, "epoch": 536} {"train_loss": -9.300196647644043, "global_step": 90056, "epoch": 536} {"train_loss": -9.41765022277832, "global_step": 90057, "epoch": 536} {"train_loss": -9.231975555419922, "global_step": 90058, "epoch": 536} {"train_loss": -9.589330673217773, "global_step": 90059, "epoch": 536} {"train_loss": -8.929450988769531, "global_step": 90060, "epoch": 536} {"train_loss": -9.52161979675293, "global_step": 90061, "epoch": 536} {"train_loss": -9.21788501739502, "global_step": 90062, "epoch": 536} {"train_loss": -9.372781753540039, "global_step": 90063, "epoch": 536} {"train_loss": -9.120506286621094, "global_step": 90064, "epoch": 536} {"train_loss": -9.466650009155273, "global_step": 90065, "epoch": 536} {"train_loss": -9.184431076049805, "global_step": 90066, "epoch": 536} {"train_loss": -9.504170417785645, "global_step": 90067, "epoch": 536} {"train_loss": -9.429738998413086, "global_step": 90068, "epoch": 536} {"train_loss": -9.254656791687012, "global_step": 90069, "epoch": 536} {"train_loss": -9.3818941116333, "global_step": 90070, "epoch": 536} {"train_loss": -9.468778610229492, "global_step": 90071, "epoch": 536} {"train_loss": -9.127763748168945, "global_step": 90072, "epoch": 536} {"train_loss": -9.663774490356445, "global_step": 90073, "epoch": 536} {"train_loss": -9.432724952697754, "global_step": 90074, "epoch": 536} {"train_loss": -9.687651634216309, "global_step": 90075, "epoch": 536} {"train_loss": -9.371715545654297, "global_step": 90076, "epoch": 536} {"train_loss": -9.475142478942871, "global_step": 90077, "epoch": 536} {"train_loss": -9.371185302734375, "global_step": 90078, "epoch": 536} {"train_loss": -9.57032299041748, "global_step": 90079, "epoch": 536} {"train_loss": -9.570892333984375, "global_step": 90080, "epoch": 536} {"train_loss": -9.62881851196289, "global_step": 90081, "epoch": 536} {"train_loss": -9.650341033935547, "global_step": 90082, "epoch": 536} {"train_loss": -9.696250915527344, "global_step": 90083, "epoch": 536} {"train_loss": -9.818382263183594, "global_step": 90084, "epoch": 536} {"train_loss": -9.595548629760742, "global_step": 90085, "epoch": 536} {"train_loss": -9.78984260559082, "global_step": 90086, "epoch": 536} {"train_loss": -9.721683502197266, "global_step": 90087, "epoch": 536} {"train_loss": -9.756969451904297, "global_step": 90088, "epoch": 536} {"train_loss": -9.709346771240234, "global_step": 90089, "epoch": 536} {"train_loss": -9.673095703125, "global_step": 90090, "epoch": 536} {"train_loss": -9.56442642211914, "global_step": 90091, "epoch": 536} {"train_loss": -9.302454948425293, "global_step": 90092, "epoch": 536} {"train_loss": -9.786372184753418, "global_step": 90093, "epoch": 536} {"train_loss": -9.61316204071045, "global_step": 90094, "epoch": 536} {"train_loss": -9.584955215454102, "global_step": 90095, "epoch": 536} {"train_loss": -9.473682403564453, "global_step": 90096, "epoch": 536} {"train_loss": -9.508182525634766, "global_step": 90097, "epoch": 536} {"train_loss": -9.68722915649414, "global_step": 90098, "epoch": 536} {"train_loss": -9.748459815979004, "global_step": 90099, "epoch": 536} {"train_loss": -9.513591766357422, "global_step": 90100, "epoch": 536} {"train_loss": -9.543262481689453, "global_step": 90101, "epoch": 536} {"train_loss": -9.68756103515625, "global_step": 90102, "epoch": 536} {"train_loss": -9.749992370605469, "global_step": 90103, "epoch": 536} {"train_loss": -9.492291450500488, "global_step": 90104, "epoch": 536} {"train_loss": -9.97515869140625, "global_step": 90105, "epoch": 536} {"train_loss": -9.460001945495605, "global_step": 90106, "epoch": 536} {"train_loss": -8.98533821105957, "global_step": 90107, "epoch": 536} {"train_loss": -9.41804313659668, "global_step": 90108, "epoch": 536} {"train_loss": -9.593710899353027, "global_step": 90109, "epoch": 536} {"train_loss": -9.343280792236328, "global_step": 90110, "epoch": 536} {"train_loss": -9.590879440307617, "global_step": 90111, "epoch": 536} {"train_loss": -9.386148452758789, "global_step": 90112, "epoch": 536} {"train_loss": -9.552751541137695, "global_step": 90113, "epoch": 536} {"train_loss": -9.401293754577637, "global_step": 90114, "epoch": 536} {"train_loss": -9.594168663024902, "global_step": 90115, "epoch": 536} {"train_loss": -9.27173137664795, "global_step": 90116, "epoch": 536} {"train_loss": -9.299148559570312, "global_step": 90117, "epoch": 536} {"train_loss": -9.473091125488281, "global_step": 90118, "epoch": 536} {"train_loss": -9.113303184509277, "global_step": 90119, "epoch": 536} {"train_loss": -9.322830200195312, "global_step": 90120, "epoch": 536} {"train_loss": -9.434100151062012, "global_step": 90121, "epoch": 536} {"train_loss": -9.486082077026367, "global_step": 90122, "epoch": 536} {"train_loss": -9.422880172729492, "global_step": 90123, "epoch": 536} {"train_loss": -9.37442684173584, "global_step": 90124, "epoch": 536} {"train_loss": -9.717986106872559, "global_step": 90125, "epoch": 536} {"train_loss": -9.211984634399414, "global_step": 90126, "epoch": 536} {"train_loss": -9.374282836914062, "global_step": 90127, "epoch": 536} {"train_loss": -9.700231552124023, "global_step": 90128, "epoch": 536} {"train_loss": -9.493078231811523, "global_step": 90129, "epoch": 536} {"train_loss": -9.57056999206543, "global_step": 90130, "epoch": 536} {"train_loss": -9.42288589477539, "global_step": 90131, "epoch": 536} {"train_loss": -9.473733901977539, "global_step": 90132, "epoch": 536} {"train_loss": -9.517273902893066, "global_step": 90133, "epoch": 536} {"train_loss": -9.312360763549805, "global_step": 90134, "epoch": 536} {"train_loss": -9.566732406616211, "global_step": 90135, "epoch": 536} {"train_loss": -9.263262748718262, "global_step": 90136, "epoch": 536} {"train_loss": -9.558792114257812, "global_step": 90137, "epoch": 536} {"train_loss": -9.327096939086914, "global_step": 90138, "epoch": 536} {"train_loss": -9.227030754089355, "global_step": 90139, "epoch": 536} {"train_loss": -9.164846420288086, "global_step": 90140, "epoch": 536} {"train_loss": -9.074782371520996, "global_step": 90141, "epoch": 536} {"train_loss": -9.100878715515137, "global_step": 90142, "epoch": 536} {"train_loss": -9.119487762451172, "global_step": 90143, "epoch": 536} {"train_loss": -9.292031288146973, "global_step": 90144, "epoch": 536} {"train_loss": -9.406174659729004, "global_step": 90145, "epoch": 536} {"train_loss": -9.053093910217285, "global_step": 90146, "epoch": 536} {"train_loss": -9.471543312072754, "global_step": 90147, "epoch": 536} {"train_loss": -8.854248046875, "global_step": 90148, "epoch": 536} {"train_loss": -9.087610244750977, "global_step": 90149, "epoch": 536} {"train_loss": -9.400999069213867, "global_step": 90150, "epoch": 536} {"train_loss": -9.152551651000977, "global_step": 90151, "epoch": 536} {"train_loss": -9.070772171020508, "global_step": 90152, "epoch": 536} {"train_loss": -9.102958679199219, "global_step": 90153, "epoch": 536} {"train_loss": -9.210184097290039, "global_step": 90154, "epoch": 536} {"train_loss": -9.087263107299805, "global_step": 90155, "epoch": 536} {"train_loss": -9.326027870178223, "global_step": 90156, "epoch": 536} {"train_loss": -9.177371978759766, "global_step": 90157, "epoch": 536} {"train_loss": -9.397823333740234, "global_step": 90158, "epoch": 536} {"train_loss": -9.407387733459473, "global_step": 90159, "epoch": 536} {"train_loss": -9.389537811279297, "global_step": 90160, "epoch": 536} {"train_loss": -9.423739433288574, "global_step": 90161, "epoch": 536} {"train_loss": -9.393240928649902, "global_step": 90162, "epoch": 536} {"train_loss": -9.497978210449219, "global_step": 90163, "epoch": 536} {"train_loss": -9.416510581970215, "global_step": 90164, "epoch": 536} {"train_loss": -9.277615547180176, "global_step": 90165, "epoch": 536} {"train_loss": -9.646051406860352, "global_step": 90166, "epoch": 536} {"train_loss": -9.480669975280762, "global_step": 90167, "epoch": 536} {"train_loss": -9.463912963867188, "global_step": 90168, "epoch": 536} {"train_loss": -9.593725204467773, "global_step": 90169, "epoch": 536} {"train_loss": -9.60434341430664, "global_step": 90170, "epoch": 536} {"train_loss": -9.467373847961426, "global_step": 90171, "epoch": 536} {"train_loss": -9.49407958984375, "global_step": 90172, "epoch": 536} {"train_loss": -9.56259822845459, "global_step": 90173, "epoch": 536} {"train_loss": -9.80112075805664, "global_step": 90174, "epoch": 536} {"train_loss": -9.56308364868164, "global_step": 90175, "epoch": 536} {"train_loss": -9.433847427368164, "global_step": 90176, "epoch": 536} {"train_loss": -9.46290397644043, "global_step": 90177, "epoch": 536} {"train_loss": -9.44481086730957, "global_step": 90178, "epoch": 536} {"train_loss": -9.552610397338867, "global_step": 90179, "epoch": 536} {"train_loss": -9.504094123840332, "global_step": 90180, "epoch": 536} {"train_loss": -9.681946754455566, "global_step": 90181, "epoch": 536} {"train_loss": -9.617727279663086, "global_step": 90182, "epoch": 536} {"train_loss": -9.62539291381836, "global_step": 90183, "epoch": 536} {"train_loss": -9.806320190429688, "global_step": 90184, "epoch": 536} {"train_loss": -9.720782279968262, "global_step": 90185, "epoch": 536} {"train_loss": -9.624194145202637, "global_step": 90186, "epoch": 536} {"train_loss": -9.561134338378906, "global_step": 90187, "epoch": 536} {"train_loss": -9.694657325744629, "global_step": 90188, "epoch": 536} {"train_loss": -9.622502326965332, "global_step": 90189, "epoch": 536} {"train_loss": -9.448270797729492, "global_step": 90190, "epoch": 536} {"train_loss": -9.417207717895508, "global_step": 90191, "epoch": 536} {"train_loss": -9.532195091247559, "global_step": 90192, "epoch": 536} {"train_loss": -9.702142715454102, "global_step": 90193, "epoch": 536} {"train_loss": -9.501557350158691, "global_step": 90194, "epoch": 536} {"train_loss": -9.622098922729492, "global_step": 90195, "epoch": 536} {"train_loss": -9.491168975830078, "global_step": 90196, "epoch": 536} {"train_loss": -9.446414947509766, "global_step": 90197, "epoch": 536} {"train_loss": -9.709905624389648, "global_step": 90198, "epoch": 536} {"train_loss": -9.54547119140625, "global_step": 90199, "epoch": 536} {"train_loss": -9.497279167175293, "global_step": 90200, "epoch": 536} {"train_loss": -9.558709144592285, "global_step": 90201, "epoch": 536} {"train_loss": -9.526298522949219, "global_step": 90202, "epoch": 536} {"train_loss": -9.39468765258789, "global_step": 90203, "epoch": 536} {"train_loss": -9.434013366699219, "global_step": 90204, "epoch": 536} {"train_loss": -9.707283973693848, "global_step": 90205, "epoch": 536} {"train_loss": -9.553473472595215, "global_step": 90206, "epoch": 536} {"train_loss": -9.29361343383789, "global_step": 90207, "epoch": 536} {"train_loss": -9.296266555786133, "global_step": 90208, "epoch": 536} {"train_loss": -9.08808422088623, "global_step": 90209, "epoch": 536} {"train_loss": -9.430642127990723, "global_step": 90210, "epoch": 536} {"train_loss": -9.140803337097168, "global_step": 90211, "epoch": 536} {"train_loss": -9.336111068725586, "global_step": 90212, "epoch": 536} {"train_loss": -9.411659240722656, "global_step": 90213, "epoch": 536} {"train_loss": -9.288046836853027, "global_step": 90214, "epoch": 536} {"train_loss": -9.438955630574908, "global_step": 90215, "epoch": 536, "val_loss": 201866.203125} {"train_loss": -9.136496543884277, "global_step": 90216, "epoch": 537} {"train_loss": -9.413267135620117, "global_step": 90217, "epoch": 537} {"train_loss": -9.38764762878418, "global_step": 90218, "epoch": 537} {"train_loss": -9.059991836547852, "global_step": 90219, "epoch": 537} {"train_loss": -9.401374816894531, "global_step": 90220, "epoch": 537} {"train_loss": -9.467310905456543, "global_step": 90221, "epoch": 537} {"train_loss": -9.332764625549316, "global_step": 90222, "epoch": 537} {"train_loss": -9.139720916748047, "global_step": 90223, "epoch": 537} {"train_loss": -9.375823974609375, "global_step": 90224, "epoch": 537} {"train_loss": -9.296086311340332, "global_step": 90225, "epoch": 537} {"train_loss": -9.410430908203125, "global_step": 90226, "epoch": 537} {"train_loss": -9.5275297164917, "global_step": 90227, "epoch": 537} {"train_loss": -9.268640518188477, "global_step": 90228, "epoch": 537} {"train_loss": -9.477067947387695, "global_step": 90229, "epoch": 537} {"train_loss": -9.229569435119629, "global_step": 90230, "epoch": 537} {"train_loss": -9.142663955688477, "global_step": 90231, "epoch": 537} {"train_loss": -9.18189811706543, "global_step": 90232, "epoch": 537} {"train_loss": -9.38012981414795, "global_step": 90233, "epoch": 537} {"train_loss": -9.317554473876953, "global_step": 90234, "epoch": 537} {"train_loss": -9.495943069458008, "global_step": 90235, "epoch": 537} {"train_loss": -9.199775695800781, "global_step": 90236, "epoch": 537} {"train_loss": -9.505823135375977, "global_step": 90237, "epoch": 537} {"train_loss": -9.425138473510742, "global_step": 90238, "epoch": 537} {"train_loss": -9.381715774536133, "global_step": 90239, "epoch": 537} {"train_loss": -9.38827133178711, "global_step": 90240, "epoch": 537} {"train_loss": -9.395198822021484, "global_step": 90241, "epoch": 537} {"train_loss": -9.543301582336426, "global_step": 90242, "epoch": 537} {"train_loss": -9.372515678405762, "global_step": 90243, "epoch": 537} {"train_loss": -9.767698287963867, "global_step": 90244, "epoch": 537} {"train_loss": -9.522680282592773, "global_step": 90245, "epoch": 537} {"train_loss": -9.495841026306152, "global_step": 90246, "epoch": 537} {"train_loss": -9.281436920166016, "global_step": 90247, "epoch": 537} {"train_loss": -9.484151840209961, "global_step": 90248, "epoch": 537} {"train_loss": -9.636958122253418, "global_step": 90249, "epoch": 537} {"train_loss": -9.749343872070312, "global_step": 90250, "epoch": 537} {"train_loss": -9.561920166015625, "global_step": 90251, "epoch": 537} {"train_loss": -9.584382057189941, "global_step": 90252, "epoch": 537} {"train_loss": -9.666059494018555, "global_step": 90253, "epoch": 537} {"train_loss": -9.367206573486328, "global_step": 90254, "epoch": 537} {"train_loss": -9.635313034057617, "global_step": 90255, "epoch": 537} {"train_loss": -9.629663467407227, "global_step": 90256, "epoch": 537} {"train_loss": -9.772403717041016, "global_step": 90257, "epoch": 537} {"train_loss": -9.635744094848633, "global_step": 90258, "epoch": 537} {"train_loss": -9.561731338500977, "global_step": 90259, "epoch": 537} {"train_loss": -9.512322425842285, "global_step": 90260, "epoch": 537} {"train_loss": -9.72528076171875, "global_step": 90261, "epoch": 537} {"train_loss": -9.460994720458984, "global_step": 90262, "epoch": 537} {"train_loss": -9.554755210876465, "global_step": 90263, "epoch": 537} {"train_loss": -9.659551620483398, "global_step": 90264, "epoch": 537} {"train_loss": -9.394623756408691, "global_step": 90265, "epoch": 537} {"train_loss": -9.436604499816895, "global_step": 90266, "epoch": 537} {"train_loss": -9.540407180786133, "global_step": 90267, "epoch": 537} {"train_loss": -9.565937995910645, "global_step": 90268, "epoch": 537} {"train_loss": -9.526187896728516, "global_step": 90269, "epoch": 537} {"train_loss": -9.442461013793945, "global_step": 90270, "epoch": 537} {"train_loss": -9.731721878051758, "global_step": 90271, "epoch": 537} {"train_loss": -9.598284721374512, "global_step": 90272, "epoch": 537} {"train_loss": -9.691337585449219, "global_step": 90273, "epoch": 537} {"train_loss": -9.478263854980469, "global_step": 90274, "epoch": 537} {"train_loss": -9.614248275756836, "global_step": 90275, "epoch": 537} {"train_loss": -9.637979507446289, "global_step": 90276, "epoch": 537} {"train_loss": -9.702420234680176, "global_step": 90277, "epoch": 537} {"train_loss": -9.520124435424805, "global_step": 90278, "epoch": 537} {"train_loss": -9.532672882080078, "global_step": 90279, "epoch": 537} {"train_loss": -9.43874740600586, "global_step": 90280, "epoch": 537} {"train_loss": -9.361761093139648, "global_step": 90281, "epoch": 537} {"train_loss": -9.304887771606445, "global_step": 90282, "epoch": 537} {"train_loss": -9.45511531829834, "global_step": 90283, "epoch": 537} {"train_loss": -9.395115852355957, "global_step": 90284, "epoch": 537} {"train_loss": -9.464664459228516, "global_step": 90285, "epoch": 537} {"train_loss": -9.110349655151367, "global_step": 90286, "epoch": 537} {"train_loss": -8.973062515258789, "global_step": 90287, "epoch": 537} {"train_loss": -8.769524574279785, "global_step": 90288, "epoch": 537} {"train_loss": -9.194853782653809, "global_step": 90289, "epoch": 537} {"train_loss": -9.179773330688477, "global_step": 90290, "epoch": 537} {"train_loss": -8.794429779052734, "global_step": 90291, "epoch": 537} {"train_loss": -8.863323211669922, "global_step": 90292, "epoch": 537} {"train_loss": -9.329329490661621, "global_step": 90293, "epoch": 537} {"train_loss": -8.653491973876953, "global_step": 90294, "epoch": 537} {"train_loss": -9.121795654296875, "global_step": 90295, "epoch": 537} {"train_loss": -9.034843444824219, "global_step": 90296, "epoch": 537} {"train_loss": -9.199836730957031, "global_step": 90297, "epoch": 537} {"train_loss": -8.535964965820312, "global_step": 90298, "epoch": 537} {"train_loss": -9.016542434692383, "global_step": 90299, "epoch": 537} {"train_loss": -9.079451560974121, "global_step": 90300, "epoch": 537} {"train_loss": -8.902442932128906, "global_step": 90301, "epoch": 537} {"train_loss": -9.014195442199707, "global_step": 90302, "epoch": 537} {"train_loss": -9.098209381103516, "global_step": 90303, "epoch": 537} {"train_loss": -8.711847305297852, "global_step": 90304, "epoch": 537} {"train_loss": -9.001117706298828, "global_step": 90305, "epoch": 537} {"train_loss": -9.067680358886719, "global_step": 90306, "epoch": 537} {"train_loss": -8.902936935424805, "global_step": 90307, "epoch": 537} {"train_loss": -9.060868263244629, "global_step": 90308, "epoch": 537} {"train_loss": -9.11158561706543, "global_step": 90309, "epoch": 537} {"train_loss": -9.319818496704102, "global_step": 90310, "epoch": 537} {"train_loss": -9.358933448791504, "global_step": 90311, "epoch": 537} {"train_loss": -9.088329315185547, "global_step": 90312, "epoch": 537} {"train_loss": -9.305784225463867, "global_step": 90313, "epoch": 537} {"train_loss": -9.237773895263672, "global_step": 90314, "epoch": 537} {"train_loss": -9.37729263305664, "global_step": 90315, "epoch": 537} {"train_loss": -9.485641479492188, "global_step": 90316, "epoch": 537} {"train_loss": -9.331747055053711, "global_step": 90317, "epoch": 537} {"train_loss": -9.38000202178955, "global_step": 90318, "epoch": 537} {"train_loss": -9.326183319091797, "global_step": 90319, "epoch": 537} {"train_loss": -9.581928253173828, "global_step": 90320, "epoch": 537} {"train_loss": -9.36018180847168, "global_step": 90321, "epoch": 537} {"train_loss": -9.45427417755127, "global_step": 90322, "epoch": 537} {"train_loss": -9.56688117980957, "global_step": 90323, "epoch": 537} {"train_loss": -9.578023910522461, "global_step": 90324, "epoch": 537} {"train_loss": -9.49906063079834, "global_step": 90325, "epoch": 537} {"train_loss": -9.57655143737793, "global_step": 90326, "epoch": 537} {"train_loss": -9.603693962097168, "global_step": 90327, "epoch": 537} {"train_loss": -9.718692779541016, "global_step": 90328, "epoch": 537} {"train_loss": -9.684588432312012, "global_step": 90329, "epoch": 537} {"train_loss": -9.83263874053955, "global_step": 90330, "epoch": 537} {"train_loss": -9.413318634033203, "global_step": 90331, "epoch": 537} {"train_loss": -9.57778549194336, "global_step": 90332, "epoch": 537} {"train_loss": -9.49455451965332, "global_step": 90333, "epoch": 537} {"train_loss": -9.832399368286133, "global_step": 90334, "epoch": 537} {"train_loss": -9.700311660766602, "global_step": 90335, "epoch": 537} {"train_loss": -9.803709983825684, "global_step": 90336, "epoch": 537} {"train_loss": -9.667160034179688, "global_step": 90337, "epoch": 537} {"train_loss": -9.542027473449707, "global_step": 90338, "epoch": 537} {"train_loss": -9.734546661376953, "global_step": 90339, "epoch": 537} {"train_loss": -9.398209571838379, "global_step": 90340, "epoch": 537} {"train_loss": -9.804764747619629, "global_step": 90341, "epoch": 537} {"train_loss": -9.644454956054688, "global_step": 90342, "epoch": 537} {"train_loss": -9.769932746887207, "global_step": 90343, "epoch": 537} {"train_loss": -9.430904388427734, "global_step": 90344, "epoch": 537} {"train_loss": -9.627473831176758, "global_step": 90345, "epoch": 537} {"train_loss": -9.744311332702637, "global_step": 90346, "epoch": 537} {"train_loss": -9.704309463500977, "global_step": 90347, "epoch": 537} {"train_loss": -9.645837783813477, "global_step": 90348, "epoch": 537} {"train_loss": -9.6234130859375, "global_step": 90349, "epoch": 537} {"train_loss": -9.441577911376953, "global_step": 90350, "epoch": 537} {"train_loss": -9.571341514587402, "global_step": 90351, "epoch": 537} {"train_loss": -9.194816589355469, "global_step": 90352, "epoch": 537} {"train_loss": -9.613322257995605, "global_step": 90353, "epoch": 537} {"train_loss": -9.140522003173828, "global_step": 90354, "epoch": 537} {"train_loss": -9.605091094970703, "global_step": 90355, "epoch": 537} {"train_loss": -8.98017406463623, "global_step": 90356, "epoch": 537} {"train_loss": -9.168435096740723, "global_step": 90357, "epoch": 537} {"train_loss": -9.141395568847656, "global_step": 90358, "epoch": 537} {"train_loss": -9.558502197265625, "global_step": 90359, "epoch": 537} {"train_loss": -9.37449836730957, "global_step": 90360, "epoch": 537} {"train_loss": -9.23175048828125, "global_step": 90361, "epoch": 537} {"train_loss": -9.504080772399902, "global_step": 90362, "epoch": 537} {"train_loss": -9.269109725952148, "global_step": 90363, "epoch": 537} {"train_loss": -9.263603210449219, "global_step": 90364, "epoch": 537} {"train_loss": -9.411441802978516, "global_step": 90365, "epoch": 537} {"train_loss": -9.668008804321289, "global_step": 90366, "epoch": 537} {"train_loss": -9.479619979858398, "global_step": 90367, "epoch": 537} {"train_loss": -9.617600440979004, "global_step": 90368, "epoch": 537} {"train_loss": -9.462896347045898, "global_step": 90369, "epoch": 537} {"train_loss": -9.407819747924805, "global_step": 90370, "epoch": 537} {"train_loss": -9.4014310836792, "global_step": 90371, "epoch": 537} {"train_loss": -9.367286682128906, "global_step": 90372, "epoch": 537} {"train_loss": -9.584187507629395, "global_step": 90373, "epoch": 537} {"train_loss": -9.178180694580078, "global_step": 90374, "epoch": 537} {"train_loss": -9.574772834777832, "global_step": 90375, "epoch": 537} {"train_loss": -9.234469413757324, "global_step": 90376, "epoch": 537} {"train_loss": -9.499568939208984, "global_step": 90377, "epoch": 537} {"train_loss": -9.004281997680664, "global_step": 90378, "epoch": 537} {"train_loss": -9.502864837646484, "global_step": 90379, "epoch": 537} {"train_loss": -8.94249153137207, "global_step": 90380, "epoch": 537} {"train_loss": -9.075450897216797, "global_step": 90381, "epoch": 537} {"train_loss": -9.165637969970703, "global_step": 90382, "epoch": 537} {"train_loss": -9.39452888852074, "global_step": 90383, "epoch": 537, "val_loss": 203826.40625} {"train_loss": -8.949014663696289, "global_step": 90384, "epoch": 538} {"train_loss": -9.235555648803711, "global_step": 90385, "epoch": 538} {"train_loss": -9.164745330810547, "global_step": 90386, "epoch": 538} {"train_loss": -9.261266708374023, "global_step": 90387, "epoch": 538} {"train_loss": -8.94495964050293, "global_step": 90388, "epoch": 538} {"train_loss": -8.990594863891602, "global_step": 90389, "epoch": 538} {"train_loss": -9.245725631713867, "global_step": 90390, "epoch": 538} {"train_loss": -9.222721099853516, "global_step": 90391, "epoch": 538} {"train_loss": -9.337029457092285, "global_step": 90392, "epoch": 538} {"train_loss": -9.194103240966797, "global_step": 90393, "epoch": 538} {"train_loss": -9.262068748474121, "global_step": 90394, "epoch": 538} {"train_loss": -9.288373947143555, "global_step": 90395, "epoch": 538} {"train_loss": -9.37736701965332, "global_step": 90396, "epoch": 538} {"train_loss": -9.430489540100098, "global_step": 90397, "epoch": 538} {"train_loss": -9.364421844482422, "global_step": 90398, "epoch": 538} {"train_loss": -9.597024917602539, "global_step": 90399, "epoch": 538} {"train_loss": -9.413986206054688, "global_step": 90400, "epoch": 538} {"train_loss": -9.32319450378418, "global_step": 90401, "epoch": 538} {"train_loss": -9.63687515258789, "global_step": 90402, "epoch": 538} {"train_loss": -9.45452880859375, "global_step": 90403, "epoch": 538} {"train_loss": -9.267362594604492, "global_step": 90404, "epoch": 538} {"train_loss": -9.479893684387207, "global_step": 90405, "epoch": 538} {"train_loss": -9.324766159057617, "global_step": 90406, "epoch": 538} {"train_loss": -9.696962356567383, "global_step": 90407, "epoch": 538} {"train_loss": -9.41331672668457, "global_step": 90408, "epoch": 538} {"train_loss": -9.498994827270508, "global_step": 90409, "epoch": 538} {"train_loss": -9.112957000732422, "global_step": 90410, "epoch": 538} {"train_loss": -9.687503814697266, "global_step": 90411, "epoch": 538} {"train_loss": -9.034473419189453, "global_step": 90412, "epoch": 538} {"train_loss": -9.230026245117188, "global_step": 90413, "epoch": 538} {"train_loss": -9.459156036376953, "global_step": 90414, "epoch": 538} {"train_loss": -9.060897827148438, "global_step": 90415, "epoch": 538} {"train_loss": -9.506632804870605, "global_step": 90416, "epoch": 538} {"train_loss": -9.385820388793945, "global_step": 90417, "epoch": 538} {"train_loss": -9.466377258300781, "global_step": 90418, "epoch": 538} {"train_loss": -9.040729522705078, "global_step": 90419, "epoch": 538} {"train_loss": -9.15039348602295, "global_step": 90420, "epoch": 538} {"train_loss": -9.104745864868164, "global_step": 90421, "epoch": 538} {"train_loss": -9.13873291015625, "global_step": 90422, "epoch": 538} {"train_loss": -9.164044380187988, "global_step": 90423, "epoch": 538} {"train_loss": -9.282928466796875, "global_step": 90424, "epoch": 538} {"train_loss": -9.036401748657227, "global_step": 90425, "epoch": 538} {"train_loss": -9.281827926635742, "global_step": 90426, "epoch": 538} {"train_loss": -9.285100936889648, "global_step": 90427, "epoch": 538} {"train_loss": -9.263517379760742, "global_step": 90428, "epoch": 538} {"train_loss": -9.302718162536621, "global_step": 90429, "epoch": 538} {"train_loss": -9.307685852050781, "global_step": 90430, "epoch": 538} {"train_loss": -9.26953411102295, "global_step": 90431, "epoch": 538} {"train_loss": -9.302574157714844, "global_step": 90432, "epoch": 538} {"train_loss": -9.213582992553711, "global_step": 90433, "epoch": 538} {"train_loss": -9.437073707580566, "global_step": 90434, "epoch": 538} {"train_loss": -9.470165252685547, "global_step": 90435, "epoch": 538} {"train_loss": -9.459981918334961, "global_step": 90436, "epoch": 538} {"train_loss": -9.404598236083984, "global_step": 90437, "epoch": 538} {"train_loss": -9.45982551574707, "global_step": 90438, "epoch": 538} {"train_loss": -9.220928192138672, "global_step": 90439, "epoch": 538} {"train_loss": -9.564213752746582, "global_step": 90440, "epoch": 538} {"train_loss": -9.197093963623047, "global_step": 90441, "epoch": 538} {"train_loss": -8.993627548217773, "global_step": 90442, "epoch": 538} {"train_loss": -8.91938591003418, "global_step": 90443, "epoch": 538} {"train_loss": -9.387569427490234, "global_step": 90444, "epoch": 538} {"train_loss": -9.169323921203613, "global_step": 90445, "epoch": 538} {"train_loss": -9.252150535583496, "global_step": 90446, "epoch": 538} {"train_loss": -9.418294906616211, "global_step": 90447, "epoch": 538} {"train_loss": -9.280834197998047, "global_step": 90448, "epoch": 538} {"train_loss": -9.426074981689453, "global_step": 90449, "epoch": 538} {"train_loss": -9.566670417785645, "global_step": 90450, "epoch": 538} {"train_loss": -9.540471076965332, "global_step": 90451, "epoch": 538} {"train_loss": -9.358510971069336, "global_step": 90452, "epoch": 538} {"train_loss": -9.32699966430664, "global_step": 90453, "epoch": 538} {"train_loss": -9.54872989654541, "global_step": 90454, "epoch": 538} {"train_loss": -9.395910263061523, "global_step": 90455, "epoch": 538} {"train_loss": -9.404507637023926, "global_step": 90456, "epoch": 538} {"train_loss": -9.638391494750977, "global_step": 90457, "epoch": 538} {"train_loss": -9.442548751831055, "global_step": 90458, "epoch": 538} {"train_loss": -9.472347259521484, "global_step": 90459, "epoch": 538} {"train_loss": -9.42587661743164, "global_step": 90460, "epoch": 538} {"train_loss": -9.403426170349121, "global_step": 90461, "epoch": 538} {"train_loss": -9.687535285949707, "global_step": 90462, "epoch": 538} {"train_loss": -9.476715087890625, "global_step": 90463, "epoch": 538} {"train_loss": -9.563613891601562, "global_step": 90464, "epoch": 538} {"train_loss": -9.276958465576172, "global_step": 90465, "epoch": 538} {"train_loss": -9.736726760864258, "global_step": 90466, "epoch": 538} {"train_loss": -9.499601364135742, "global_step": 90467, "epoch": 538} {"train_loss": -9.400033950805664, "global_step": 90468, "epoch": 538} {"train_loss": -9.47590446472168, "global_step": 90469, "epoch": 538} {"train_loss": -9.561298370361328, "global_step": 90470, "epoch": 538} {"train_loss": -9.232820510864258, "global_step": 90471, "epoch": 538} {"train_loss": -9.330175399780273, "global_step": 90472, "epoch": 538} {"train_loss": -9.552923202514648, "global_step": 90473, "epoch": 538} {"train_loss": -9.061260223388672, "global_step": 90474, "epoch": 538} {"train_loss": -9.417654037475586, "global_step": 90475, "epoch": 538} {"train_loss": -8.784042358398438, "global_step": 90476, "epoch": 538} {"train_loss": -9.506233215332031, "global_step": 90477, "epoch": 538} {"train_loss": -8.96291446685791, "global_step": 90478, "epoch": 538} {"train_loss": -9.24592399597168, "global_step": 90479, "epoch": 538} {"train_loss": -9.220052719116211, "global_step": 90480, "epoch": 538} {"train_loss": -8.656330108642578, "global_step": 90481, "epoch": 538} {"train_loss": -9.452815055847168, "global_step": 90482, "epoch": 538} {"train_loss": -9.28304672241211, "global_step": 90483, "epoch": 538} {"train_loss": -9.372172355651855, "global_step": 90484, "epoch": 538} {"train_loss": -9.195463180541992, "global_step": 90485, "epoch": 538} {"train_loss": -9.23306655883789, "global_step": 90486, "epoch": 538} {"train_loss": -9.11485767364502, "global_step": 90487, "epoch": 538} {"train_loss": -9.23812484741211, "global_step": 90488, "epoch": 538} {"train_loss": -9.078592300415039, "global_step": 90489, "epoch": 538} {"train_loss": -9.380914688110352, "global_step": 90490, "epoch": 538} {"train_loss": -9.344379425048828, "global_step": 90491, "epoch": 538} {"train_loss": -9.049317359924316, "global_step": 90492, "epoch": 538} {"train_loss": -9.434181213378906, "global_step": 90493, "epoch": 538} {"train_loss": -9.557220458984375, "global_step": 90494, "epoch": 538} {"train_loss": -9.219584465026855, "global_step": 90495, "epoch": 538} {"train_loss": -9.26913070678711, "global_step": 90496, "epoch": 538} {"train_loss": -9.665754318237305, "global_step": 90497, "epoch": 538} {"train_loss": -9.032317161560059, "global_step": 90498, "epoch": 538} {"train_loss": -9.505757331848145, "global_step": 90499, "epoch": 538} {"train_loss": -9.410714149475098, "global_step": 90500, "epoch": 538} {"train_loss": -9.207597732543945, "global_step": 90501, "epoch": 538} {"train_loss": -9.539663314819336, "global_step": 90502, "epoch": 538} {"train_loss": -9.518360137939453, "global_step": 90503, "epoch": 538} {"train_loss": -9.498222351074219, "global_step": 90504, "epoch": 538} {"train_loss": -9.256084442138672, "global_step": 90505, "epoch": 538} {"train_loss": -9.491339683532715, "global_step": 90506, "epoch": 538} {"train_loss": -9.33388900756836, "global_step": 90507, "epoch": 538} {"train_loss": -9.684968948364258, "global_step": 90508, "epoch": 538} {"train_loss": -9.653642654418945, "global_step": 90509, "epoch": 538} {"train_loss": -9.214170455932617, "global_step": 90510, "epoch": 538} {"train_loss": -9.568185806274414, "global_step": 90511, "epoch": 538} {"train_loss": -9.496076583862305, "global_step": 90512, "epoch": 538} {"train_loss": -9.511249542236328, "global_step": 90513, "epoch": 538} {"train_loss": -9.257488250732422, "global_step": 90514, "epoch": 538} {"train_loss": -9.525918960571289, "global_step": 90515, "epoch": 538} {"train_loss": -9.41362476348877, "global_step": 90516, "epoch": 538} {"train_loss": -9.301746368408203, "global_step": 90517, "epoch": 538} {"train_loss": -9.301286697387695, "global_step": 90518, "epoch": 538} {"train_loss": -9.607158660888672, "global_step": 90519, "epoch": 538} {"train_loss": -9.395030975341797, "global_step": 90520, "epoch": 538} {"train_loss": -9.232351303100586, "global_step": 90521, "epoch": 538} {"train_loss": -9.566272735595703, "global_step": 90522, "epoch": 538} {"train_loss": -9.50810432434082, "global_step": 90523, "epoch": 538} {"train_loss": -8.720958709716797, "global_step": 90524, "epoch": 538} {"train_loss": -9.605531692504883, "global_step": 90525, "epoch": 538} {"train_loss": -9.316807746887207, "global_step": 90526, "epoch": 538} {"train_loss": -9.335798263549805, "global_step": 90527, "epoch": 538} {"train_loss": -9.350582122802734, "global_step": 90528, "epoch": 538} {"train_loss": -9.259035110473633, "global_step": 90529, "epoch": 538} {"train_loss": -9.603004455566406, "global_step": 90530, "epoch": 538} {"train_loss": -9.524125099182129, "global_step": 90531, "epoch": 538} {"train_loss": -9.422409057617188, "global_step": 90532, "epoch": 538} {"train_loss": -9.215717315673828, "global_step": 90533, "epoch": 538} {"train_loss": -9.354314804077148, "global_step": 90534, "epoch": 538} {"train_loss": -9.639098167419434, "global_step": 90535, "epoch": 538} {"train_loss": -9.551496505737305, "global_step": 90536, "epoch": 538} {"train_loss": -9.488877296447754, "global_step": 90537, "epoch": 538} {"train_loss": -9.715921401977539, "global_step": 90538, "epoch": 538} {"train_loss": -9.601875305175781, "global_step": 90539, "epoch": 538} {"train_loss": -9.501279830932617, "global_step": 90540, "epoch": 538} {"train_loss": -9.606345176696777, "global_step": 90541, "epoch": 538} {"train_loss": -9.310501098632812, "global_step": 90542, "epoch": 538} {"train_loss": -9.640571594238281, "global_step": 90543, "epoch": 538} {"train_loss": -9.177648544311523, "global_step": 90544, "epoch": 538} {"train_loss": -9.694669723510742, "global_step": 90545, "epoch": 538} {"train_loss": -9.073190689086914, "global_step": 90546, "epoch": 538} {"train_loss": -9.580863952636719, "global_step": 90547, "epoch": 538} {"train_loss": -9.544939041137695, "global_step": 90548, "epoch": 538} {"train_loss": -9.502655982971191, "global_step": 90549, "epoch": 538} {"train_loss": -9.383003234863281, "global_step": 90550, "epoch": 538} {"train_loss": -9.355734745661417, "global_step": 90551, "epoch": 538, "val_loss": 202211.453125} {"train_loss": -9.660536766052246, "global_step": 90552, "epoch": 539} {"train_loss": -9.647452354431152, "global_step": 90553, "epoch": 539} {"train_loss": -9.776968955993652, "global_step": 90554, "epoch": 539} {"train_loss": -9.558513641357422, "global_step": 90555, "epoch": 539} {"train_loss": -9.541573524475098, "global_step": 90556, "epoch": 539} {"train_loss": -9.471089363098145, "global_step": 90557, "epoch": 539} {"train_loss": -9.50925064086914, "global_step": 90558, "epoch": 539} {"train_loss": -9.801513671875, "global_step": 90559, "epoch": 539} {"train_loss": -9.517256736755371, "global_step": 90560, "epoch": 539} {"train_loss": -9.417342185974121, "global_step": 90561, "epoch": 539} {"train_loss": -9.487649917602539, "global_step": 90562, "epoch": 539} {"train_loss": -9.313810348510742, "global_step": 90563, "epoch": 539} {"train_loss": -9.514968872070312, "global_step": 90564, "epoch": 539} {"train_loss": -9.675278663635254, "global_step": 90565, "epoch": 539} {"train_loss": -9.526569366455078, "global_step": 90566, "epoch": 539} {"train_loss": -9.70947265625, "global_step": 90567, "epoch": 539} {"train_loss": -9.703533172607422, "global_step": 90568, "epoch": 539} {"train_loss": -9.823537826538086, "global_step": 90569, "epoch": 539} {"train_loss": -9.747787475585938, "global_step": 90570, "epoch": 539} {"train_loss": -9.418317794799805, "global_step": 90571, "epoch": 539} {"train_loss": -9.733821868896484, "global_step": 90572, "epoch": 539} {"train_loss": -9.39986515045166, "global_step": 90573, "epoch": 539} {"train_loss": -9.372048377990723, "global_step": 90574, "epoch": 539} {"train_loss": -9.52584457397461, "global_step": 90575, "epoch": 539} {"train_loss": -9.25819206237793, "global_step": 90576, "epoch": 539} {"train_loss": -9.57640266418457, "global_step": 90577, "epoch": 539} {"train_loss": -9.52391242980957, "global_step": 90578, "epoch": 539} {"train_loss": -9.43148136138916, "global_step": 90579, "epoch": 539} {"train_loss": -9.629794120788574, "global_step": 90580, "epoch": 539} {"train_loss": -9.184879302978516, "global_step": 90581, "epoch": 539} {"train_loss": -9.333022117614746, "global_step": 90582, "epoch": 539} {"train_loss": -9.477129936218262, "global_step": 90583, "epoch": 539} {"train_loss": -9.369977951049805, "global_step": 90584, "epoch": 539} {"train_loss": -9.467334747314453, "global_step": 90585, "epoch": 539} {"train_loss": -9.416489601135254, "global_step": 90586, "epoch": 539} {"train_loss": -9.020647048950195, "global_step": 90587, "epoch": 539} {"train_loss": -9.753681182861328, "global_step": 90588, "epoch": 539} {"train_loss": -9.277135848999023, "global_step": 90589, "epoch": 539} {"train_loss": -9.577548027038574, "global_step": 90590, "epoch": 539} {"train_loss": -9.412209510803223, "global_step": 90591, "epoch": 539} {"train_loss": -9.375155448913574, "global_step": 90592, "epoch": 539} {"train_loss": -9.124238014221191, "global_step": 90593, "epoch": 539} {"train_loss": -9.459319114685059, "global_step": 90594, "epoch": 539} {"train_loss": -9.385475158691406, "global_step": 90595, "epoch": 539} {"train_loss": -9.310978889465332, "global_step": 90596, "epoch": 539} {"train_loss": -9.341534614562988, "global_step": 90597, "epoch": 539} {"train_loss": -9.31934642791748, "global_step": 90598, "epoch": 539} {"train_loss": -9.396806716918945, "global_step": 90599, "epoch": 539} {"train_loss": -9.419164657592773, "global_step": 90600, "epoch": 539} {"train_loss": -9.276121139526367, "global_step": 90601, "epoch": 539} {"train_loss": -9.252957344055176, "global_step": 90602, "epoch": 539} {"train_loss": -9.377416610717773, "global_step": 90603, "epoch": 539} {"train_loss": -9.245165824890137, "global_step": 90604, "epoch": 539} {"train_loss": -9.368439674377441, "global_step": 90605, "epoch": 539} {"train_loss": -9.45046615600586, "global_step": 90606, "epoch": 539} {"train_loss": -9.472108840942383, "global_step": 90607, "epoch": 539} {"train_loss": -9.318534851074219, "global_step": 90608, "epoch": 539} {"train_loss": -9.490127563476562, "global_step": 90609, "epoch": 539} {"train_loss": -9.1875, "global_step": 90610, "epoch": 539} {"train_loss": -9.562337875366211, "global_step": 90611, "epoch": 539} {"train_loss": -9.372949600219727, "global_step": 90612, "epoch": 539} {"train_loss": -9.424453735351562, "global_step": 90613, "epoch": 539} {"train_loss": -9.365751266479492, "global_step": 90614, "epoch": 539} {"train_loss": -9.48367977142334, "global_step": 90615, "epoch": 539} {"train_loss": -9.471704483032227, "global_step": 90616, "epoch": 539} {"train_loss": -9.477109909057617, "global_step": 90617, "epoch": 539} {"train_loss": -9.445960998535156, "global_step": 90618, "epoch": 539} {"train_loss": -9.391551971435547, "global_step": 90619, "epoch": 539} {"train_loss": -9.266142845153809, "global_step": 90620, "epoch": 539} {"train_loss": -9.30717658996582, "global_step": 90621, "epoch": 539} {"train_loss": -9.606770515441895, "global_step": 90622, "epoch": 539} {"train_loss": -9.29959487915039, "global_step": 90623, "epoch": 539} {"train_loss": -9.349549293518066, "global_step": 90624, "epoch": 539} {"train_loss": -9.499391555786133, "global_step": 90625, "epoch": 539} {"train_loss": -9.144808769226074, "global_step": 90626, "epoch": 539} {"train_loss": -9.636737823486328, "global_step": 90627, "epoch": 539} {"train_loss": -9.298088073730469, "global_step": 90628, "epoch": 539} {"train_loss": -9.437050819396973, "global_step": 90629, "epoch": 539} {"train_loss": -9.369397163391113, "global_step": 90630, "epoch": 539} {"train_loss": -9.385692596435547, "global_step": 90631, "epoch": 539} {"train_loss": -9.467000961303711, "global_step": 90632, "epoch": 539} {"train_loss": -9.264406204223633, "global_step": 90633, "epoch": 539} {"train_loss": -9.095645904541016, "global_step": 90634, "epoch": 539} {"train_loss": -9.37894058227539, "global_step": 90635, "epoch": 539} {"train_loss": -9.292003631591797, "global_step": 90636, "epoch": 539} {"train_loss": -9.270347595214844, "global_step": 90637, "epoch": 539} {"train_loss": -9.428117752075195, "global_step": 90638, "epoch": 539} {"train_loss": -9.607366561889648, "global_step": 90639, "epoch": 539} {"train_loss": -9.596739768981934, "global_step": 90640, "epoch": 539} {"train_loss": -9.663579940795898, "global_step": 90641, "epoch": 539} {"train_loss": -9.818696022033691, "global_step": 90642, "epoch": 539} {"train_loss": -9.5971097946167, "global_step": 90643, "epoch": 539} {"train_loss": -9.759147644042969, "global_step": 90644, "epoch": 539} {"train_loss": -9.637503623962402, "global_step": 90645, "epoch": 539} {"train_loss": -9.504495620727539, "global_step": 90646, "epoch": 539} {"train_loss": -9.47411823272705, "global_step": 90647, "epoch": 539} {"train_loss": -9.54908275604248, "global_step": 90648, "epoch": 539} {"train_loss": -9.586227416992188, "global_step": 90649, "epoch": 539} {"train_loss": -9.354568481445312, "global_step": 90650, "epoch": 539} {"train_loss": -9.598540306091309, "global_step": 90651, "epoch": 539} {"train_loss": -9.383807182312012, "global_step": 90652, "epoch": 539} {"train_loss": -9.63565731048584, "global_step": 90653, "epoch": 539} {"train_loss": -9.536399841308594, "global_step": 90654, "epoch": 539} {"train_loss": -9.382942199707031, "global_step": 90655, "epoch": 539} {"train_loss": -9.60425090789795, "global_step": 90656, "epoch": 539} {"train_loss": -9.105273246765137, "global_step": 90657, "epoch": 539} {"train_loss": -9.206807136535645, "global_step": 90658, "epoch": 539} {"train_loss": -9.224752426147461, "global_step": 90659, "epoch": 539} {"train_loss": -9.055307388305664, "global_step": 90660, "epoch": 539} {"train_loss": -8.80111312866211, "global_step": 90661, "epoch": 539} {"train_loss": -9.071834564208984, "global_step": 90662, "epoch": 539} {"train_loss": -9.181390762329102, "global_step": 90663, "epoch": 539} {"train_loss": -9.480079650878906, "global_step": 90664, "epoch": 539} {"train_loss": -8.940256118774414, "global_step": 90665, "epoch": 539} {"train_loss": -9.071494102478027, "global_step": 90666, "epoch": 539} {"train_loss": -8.905135154724121, "global_step": 90667, "epoch": 539} {"train_loss": -9.228729248046875, "global_step": 90668, "epoch": 539} {"train_loss": -9.23451042175293, "global_step": 90669, "epoch": 539} {"train_loss": -9.255887031555176, "global_step": 90670, "epoch": 539} {"train_loss": -9.08593463897705, "global_step": 90671, "epoch": 539} {"train_loss": -9.321691513061523, "global_step": 90672, "epoch": 539} {"train_loss": -9.020793914794922, "global_step": 90673, "epoch": 539} {"train_loss": -9.168342590332031, "global_step": 90674, "epoch": 539} {"train_loss": -8.861989974975586, "global_step": 90675, "epoch": 539} {"train_loss": -9.180492401123047, "global_step": 90676, "epoch": 539} {"train_loss": -9.40505599975586, "global_step": 90677, "epoch": 539} {"train_loss": -9.02956771850586, "global_step": 90678, "epoch": 539} {"train_loss": -9.485300064086914, "global_step": 90679, "epoch": 539} {"train_loss": -9.082449913024902, "global_step": 90680, "epoch": 539} {"train_loss": -9.240558624267578, "global_step": 90681, "epoch": 539} {"train_loss": -9.112771987915039, "global_step": 90682, "epoch": 539} {"train_loss": -9.373339653015137, "global_step": 90683, "epoch": 539} {"train_loss": -9.37557601928711, "global_step": 90684, "epoch": 539} {"train_loss": -9.469717025756836, "global_step": 90685, "epoch": 539} {"train_loss": -9.150821685791016, "global_step": 90686, "epoch": 539} {"train_loss": -9.321823120117188, "global_step": 90687, "epoch": 539} {"train_loss": -9.452707290649414, "global_step": 90688, "epoch": 539} {"train_loss": -9.327079772949219, "global_step": 90689, "epoch": 539} {"train_loss": -9.610626220703125, "global_step": 90690, "epoch": 539} {"train_loss": -9.367206573486328, "global_step": 90691, "epoch": 539} {"train_loss": -9.424077987670898, "global_step": 90692, "epoch": 539} {"train_loss": -9.433185577392578, "global_step": 90693, "epoch": 539} {"train_loss": -9.40262222290039, "global_step": 90694, "epoch": 539} {"train_loss": -9.632454872131348, "global_step": 90695, "epoch": 539} {"train_loss": -9.362616539001465, "global_step": 90696, "epoch": 539} {"train_loss": -9.517067909240723, "global_step": 90697, "epoch": 539} {"train_loss": -9.664909362792969, "global_step": 90698, "epoch": 539} {"train_loss": -9.455263137817383, "global_step": 90699, "epoch": 539} {"train_loss": -9.616840362548828, "global_step": 90700, "epoch": 539} {"train_loss": -9.45359992980957, "global_step": 90701, "epoch": 539} {"train_loss": -9.727432250976562, "global_step": 90702, "epoch": 539} {"train_loss": -9.625282287597656, "global_step": 90703, "epoch": 539} {"train_loss": -9.570383071899414, "global_step": 90704, "epoch": 539} {"train_loss": -9.697755813598633, "global_step": 90705, "epoch": 539} {"train_loss": -9.63026237487793, "global_step": 90706, "epoch": 539} {"train_loss": -9.703041076660156, "global_step": 90707, "epoch": 539} {"train_loss": -9.566425323486328, "global_step": 90708, "epoch": 539} {"train_loss": -9.504826545715332, "global_step": 90709, "epoch": 539} {"train_loss": -9.59581184387207, "global_step": 90710, "epoch": 539} {"train_loss": -9.313490867614746, "global_step": 90711, "epoch": 539} {"train_loss": -9.399566650390625, "global_step": 90712, "epoch": 539} {"train_loss": -9.439964294433594, "global_step": 90713, "epoch": 539} {"train_loss": -9.48244857788086, "global_step": 90714, "epoch": 539} {"train_loss": -9.025779724121094, "global_step": 90715, "epoch": 539} {"train_loss": -9.148200035095215, "global_step": 90716, "epoch": 539} {"train_loss": -9.635726928710938, "global_step": 90717, "epoch": 539} {"train_loss": -9.167943954467773, "global_step": 90718, "epoch": 539} {"train_loss": -9.409464353606815, "global_step": 90719, "epoch": 539, "val_loss": 201695.3125} {"train_loss": -9.44933795928955, "global_step": 90720, "epoch": 540} {"train_loss": -9.269905090332031, "global_step": 90721, "epoch": 540} {"train_loss": -9.445161819458008, "global_step": 90722, "epoch": 540} {"train_loss": -9.41265869140625, "global_step": 90723, "epoch": 540} {"train_loss": -9.339210510253906, "global_step": 90724, "epoch": 540} {"train_loss": -9.459977149963379, "global_step": 90725, "epoch": 540} {"train_loss": -9.13890266418457, "global_step": 90726, "epoch": 540} {"train_loss": -9.308491706848145, "global_step": 90727, "epoch": 540} {"train_loss": -9.438623428344727, "global_step": 90728, "epoch": 540} {"train_loss": -9.233050346374512, "global_step": 90729, "epoch": 540} {"train_loss": -9.427325248718262, "global_step": 90730, "epoch": 540} {"train_loss": -9.197429656982422, "global_step": 90731, "epoch": 540} {"train_loss": -9.434257507324219, "global_step": 90732, "epoch": 540} {"train_loss": -9.252765655517578, "global_step": 90733, "epoch": 540} {"train_loss": -9.3756742477417, "global_step": 90734, "epoch": 540} {"train_loss": -9.316082000732422, "global_step": 90735, "epoch": 540} {"train_loss": -9.343095779418945, "global_step": 90736, "epoch": 540} {"train_loss": -9.449182510375977, "global_step": 90737, "epoch": 540} {"train_loss": -9.412615776062012, "global_step": 90738, "epoch": 540} {"train_loss": -9.388822555541992, "global_step": 90739, "epoch": 540} {"train_loss": -9.42936897277832, "global_step": 90740, "epoch": 540} {"train_loss": -9.313232421875, "global_step": 90741, "epoch": 540} {"train_loss": -9.56132984161377, "global_step": 90742, "epoch": 540} {"train_loss": -9.456567764282227, "global_step": 90743, "epoch": 540} {"train_loss": -9.550148010253906, "global_step": 90744, "epoch": 540} {"train_loss": -9.43912124633789, "global_step": 90745, "epoch": 540} {"train_loss": -9.719879150390625, "global_step": 90746, "epoch": 540} {"train_loss": -9.520598411560059, "global_step": 90747, "epoch": 540} {"train_loss": -9.476709365844727, "global_step": 90748, "epoch": 540} {"train_loss": -9.668082237243652, "global_step": 90749, "epoch": 540} {"train_loss": -9.683422088623047, "global_step": 90750, "epoch": 540} {"train_loss": -9.50721549987793, "global_step": 90751, "epoch": 540} {"train_loss": -9.651312828063965, "global_step": 90752, "epoch": 540} {"train_loss": -9.49880599975586, "global_step": 90753, "epoch": 540} {"train_loss": -9.546085357666016, "global_step": 90754, "epoch": 540} {"train_loss": -9.776339530944824, "global_step": 90755, "epoch": 540} {"train_loss": -9.210715293884277, "global_step": 90756, "epoch": 540} {"train_loss": -9.414340019226074, "global_step": 90757, "epoch": 540} {"train_loss": -9.651278495788574, "global_step": 90758, "epoch": 540} {"train_loss": -9.562444686889648, "global_step": 90759, "epoch": 540} {"train_loss": -9.60860824584961, "global_step": 90760, "epoch": 540} {"train_loss": -9.413468360900879, "global_step": 90761, "epoch": 540} {"train_loss": -9.551591873168945, "global_step": 90762, "epoch": 540} {"train_loss": -9.798189163208008, "global_step": 90763, "epoch": 540} {"train_loss": -9.562905311584473, "global_step": 90764, "epoch": 540} {"train_loss": -9.452911376953125, "global_step": 90765, "epoch": 540} {"train_loss": -9.557517051696777, "global_step": 90766, "epoch": 540} {"train_loss": -9.380132675170898, "global_step": 90767, "epoch": 540} {"train_loss": -9.65217113494873, "global_step": 90768, "epoch": 540} {"train_loss": -9.140689849853516, "global_step": 90769, "epoch": 540} {"train_loss": -9.178967475891113, "global_step": 90770, "epoch": 540} {"train_loss": -9.35873794555664, "global_step": 90771, "epoch": 540} {"train_loss": -9.409478187561035, "global_step": 90772, "epoch": 540} {"train_loss": -9.298575401306152, "global_step": 90773, "epoch": 540} {"train_loss": -9.223875045776367, "global_step": 90774, "epoch": 540} {"train_loss": -9.394744873046875, "global_step": 90775, "epoch": 540} {"train_loss": -9.300256729125977, "global_step": 90776, "epoch": 540} {"train_loss": -9.39501953125, "global_step": 90777, "epoch": 540} {"train_loss": -9.22254753112793, "global_step": 90778, "epoch": 540} {"train_loss": -9.444928169250488, "global_step": 90779, "epoch": 540} {"train_loss": -9.48055648803711, "global_step": 90780, "epoch": 540} {"train_loss": -9.412834167480469, "global_step": 90781, "epoch": 540} {"train_loss": -9.582088470458984, "global_step": 90782, "epoch": 540} {"train_loss": -9.525114059448242, "global_step": 90783, "epoch": 540} {"train_loss": -9.531075477600098, "global_step": 90784, "epoch": 540} {"train_loss": -9.238845825195312, "global_step": 90785, "epoch": 540} {"train_loss": -9.425516128540039, "global_step": 90786, "epoch": 540} {"train_loss": -9.496710777282715, "global_step": 90787, "epoch": 540} {"train_loss": -9.4302978515625, "global_step": 90788, "epoch": 540} {"train_loss": -9.380849838256836, "global_step": 90789, "epoch": 540} {"train_loss": -9.505971908569336, "global_step": 90790, "epoch": 540} {"train_loss": -9.329712867736816, "global_step": 90791, "epoch": 540} {"train_loss": -9.443880081176758, "global_step": 90792, "epoch": 540} {"train_loss": -9.517712593078613, "global_step": 90793, "epoch": 540} {"train_loss": -9.334136962890625, "global_step": 90794, "epoch": 540} {"train_loss": -9.68701171875, "global_step": 90795, "epoch": 540} {"train_loss": -9.311161041259766, "global_step": 90796, "epoch": 540} {"train_loss": -9.758565902709961, "global_step": 90797, "epoch": 540} {"train_loss": -9.224438667297363, "global_step": 90798, "epoch": 540} {"train_loss": -9.494492530822754, "global_step": 90799, "epoch": 540} {"train_loss": -9.38071060180664, "global_step": 90800, "epoch": 540} {"train_loss": -9.616328239440918, "global_step": 90801, "epoch": 540} {"train_loss": -9.474446296691895, "global_step": 90802, "epoch": 540} {"train_loss": -9.541032791137695, "global_step": 90803, "epoch": 540} {"train_loss": -9.535511016845703, "global_step": 90804, "epoch": 540} {"train_loss": -9.633570671081543, "global_step": 90805, "epoch": 540} {"train_loss": -9.615350723266602, "global_step": 90806, "epoch": 540} {"train_loss": -9.567903518676758, "global_step": 90807, "epoch": 540} {"train_loss": -9.310104370117188, "global_step": 90808, "epoch": 540} {"train_loss": -9.576860427856445, "global_step": 90809, "epoch": 540} {"train_loss": -9.522162437438965, "global_step": 90810, "epoch": 540} {"train_loss": -9.653644561767578, "global_step": 90811, "epoch": 540} {"train_loss": -9.489564895629883, "global_step": 90812, "epoch": 540} {"train_loss": -9.171368598937988, "global_step": 90813, "epoch": 540} {"train_loss": -9.326387405395508, "global_step": 90814, "epoch": 540} {"train_loss": -9.289721488952637, "global_step": 90815, "epoch": 540} {"train_loss": -9.13833236694336, "global_step": 90816, "epoch": 540} {"train_loss": -9.084272384643555, "global_step": 90817, "epoch": 540} {"train_loss": -9.23907470703125, "global_step": 90818, "epoch": 540} {"train_loss": -9.495817184448242, "global_step": 90819, "epoch": 540} {"train_loss": -9.306947708129883, "global_step": 90820, "epoch": 540} {"train_loss": -9.346672058105469, "global_step": 90821, "epoch": 540} {"train_loss": -9.449206352233887, "global_step": 90822, "epoch": 540} {"train_loss": -9.122274398803711, "global_step": 90823, "epoch": 540} {"train_loss": -9.444639205932617, "global_step": 90824, "epoch": 540} {"train_loss": -9.122610092163086, "global_step": 90825, "epoch": 540} {"train_loss": -9.468502044677734, "global_step": 90826, "epoch": 540} {"train_loss": -9.171424865722656, "global_step": 90827, "epoch": 540} {"train_loss": -9.302034378051758, "global_step": 90828, "epoch": 540} {"train_loss": -9.194921493530273, "global_step": 90829, "epoch": 540} {"train_loss": -9.354388236999512, "global_step": 90830, "epoch": 540} {"train_loss": -9.33397102355957, "global_step": 90831, "epoch": 540} {"train_loss": -9.252267837524414, "global_step": 90832, "epoch": 540} {"train_loss": -9.415104866027832, "global_step": 90833, "epoch": 540} {"train_loss": -9.690540313720703, "global_step": 90834, "epoch": 540} {"train_loss": -9.348296165466309, "global_step": 90835, "epoch": 540} {"train_loss": -9.468469619750977, "global_step": 90836, "epoch": 540} {"train_loss": -9.281076431274414, "global_step": 90837, "epoch": 540} {"train_loss": -9.577672958374023, "global_step": 90838, "epoch": 540} {"train_loss": -9.369619369506836, "global_step": 90839, "epoch": 540} {"train_loss": -9.560070991516113, "global_step": 90840, "epoch": 540} {"train_loss": -9.512059211730957, "global_step": 90841, "epoch": 540} {"train_loss": -9.307401657104492, "global_step": 90842, "epoch": 540} {"train_loss": -9.546316146850586, "global_step": 90843, "epoch": 540} {"train_loss": -9.613504409790039, "global_step": 90844, "epoch": 540} {"train_loss": -9.456564903259277, "global_step": 90845, "epoch": 540} {"train_loss": -9.420799255371094, "global_step": 90846, "epoch": 540} {"train_loss": -9.49354362487793, "global_step": 90847, "epoch": 540} {"train_loss": -9.299908638000488, "global_step": 90848, "epoch": 540} {"train_loss": -9.591117858886719, "global_step": 90849, "epoch": 540} {"train_loss": -9.46651840209961, "global_step": 90850, "epoch": 540} {"train_loss": -9.399242401123047, "global_step": 90851, "epoch": 540} {"train_loss": -9.672301292419434, "global_step": 90852, "epoch": 540} {"train_loss": -9.582904815673828, "global_step": 90853, "epoch": 540} {"train_loss": -9.520556449890137, "global_step": 90854, "epoch": 540} {"train_loss": -9.749857902526855, "global_step": 90855, "epoch": 540} {"train_loss": -9.375494956970215, "global_step": 90856, "epoch": 540} {"train_loss": -9.609554290771484, "global_step": 90857, "epoch": 540} {"train_loss": -9.380725860595703, "global_step": 90858, "epoch": 540} {"train_loss": -9.228641510009766, "global_step": 90859, "epoch": 540} {"train_loss": -9.677785873413086, "global_step": 90860, "epoch": 540} {"train_loss": -9.370400428771973, "global_step": 90861, "epoch": 540} {"train_loss": -9.390313148498535, "global_step": 90862, "epoch": 540} {"train_loss": -9.46347713470459, "global_step": 90863, "epoch": 540} {"train_loss": -9.560441970825195, "global_step": 90864, "epoch": 540} {"train_loss": -9.565756797790527, "global_step": 90865, "epoch": 540} {"train_loss": -9.46029281616211, "global_step": 90866, "epoch": 540} {"train_loss": -9.513460159301758, "global_step": 90867, "epoch": 540} {"train_loss": -9.138524055480957, "global_step": 90868, "epoch": 540} {"train_loss": -9.538057327270508, "global_step": 90869, "epoch": 540} {"train_loss": -9.525128364562988, "global_step": 90870, "epoch": 540} {"train_loss": -9.43543815612793, "global_step": 90871, "epoch": 540} {"train_loss": -9.31716537475586, "global_step": 90872, "epoch": 540} {"train_loss": -9.200961112976074, "global_step": 90873, "epoch": 540} {"train_loss": -9.380563735961914, "global_step": 90874, "epoch": 540} {"train_loss": -9.227147102355957, "global_step": 90875, "epoch": 540} {"train_loss": -9.416266441345215, "global_step": 90876, "epoch": 540} {"train_loss": -9.35336685180664, "global_step": 90877, "epoch": 540} {"train_loss": -9.499982833862305, "global_step": 90878, "epoch": 540} {"train_loss": -9.384170532226562, "global_step": 90879, "epoch": 540} {"train_loss": -9.247834205627441, "global_step": 90880, "epoch": 540} {"train_loss": -9.338529586791992, "global_step": 90881, "epoch": 540} {"train_loss": -9.302705764770508, "global_step": 90882, "epoch": 540} {"train_loss": -9.346631050109863, "global_step": 90883, "epoch": 540} {"train_loss": -9.68282699584961, "global_step": 90884, "epoch": 540} {"train_loss": -9.470481872558594, "global_step": 90885, "epoch": 540} {"train_loss": -9.427356719970703, "global_step": 90886, "epoch": 540} {"train_loss": -9.43068756375994, "global_step": 90887, "epoch": 540, "val_loss": 203718.78125, "train_action_mse_error": 2.8136706352233887} {"train_loss": -9.47864818572998, "global_step": 90888, "epoch": 541} {"train_loss": -9.278592109680176, "global_step": 90889, "epoch": 541} {"train_loss": -9.32844066619873, "global_step": 90890, "epoch": 541} {"train_loss": -9.752976417541504, "global_step": 90891, "epoch": 541} {"train_loss": -9.474152565002441, "global_step": 90892, "epoch": 541} {"train_loss": -9.512571334838867, "global_step": 90893, "epoch": 541} {"train_loss": -9.435678482055664, "global_step": 90894, "epoch": 541} {"train_loss": -9.605559349060059, "global_step": 90895, "epoch": 541} {"train_loss": -9.418926239013672, "global_step": 90896, "epoch": 541} {"train_loss": -9.458539009094238, "global_step": 90897, "epoch": 541} {"train_loss": -9.698760986328125, "global_step": 90898, "epoch": 541} {"train_loss": -9.59029769897461, "global_step": 90899, "epoch": 541} {"train_loss": -9.512555122375488, "global_step": 90900, "epoch": 541} {"train_loss": -9.58755111694336, "global_step": 90901, "epoch": 541} {"train_loss": -9.544876098632812, "global_step": 90902, "epoch": 541} {"train_loss": -9.415813446044922, "global_step": 90903, "epoch": 541} {"train_loss": -9.242202758789062, "global_step": 90904, "epoch": 541} {"train_loss": -9.129941940307617, "global_step": 90905, "epoch": 541} {"train_loss": -9.113450050354004, "global_step": 90906, "epoch": 541} {"train_loss": -8.94627571105957, "global_step": 90907, "epoch": 541} {"train_loss": -9.184354782104492, "global_step": 90908, "epoch": 541} {"train_loss": -9.356766700744629, "global_step": 90909, "epoch": 541} {"train_loss": -8.324609756469727, "global_step": 90910, "epoch": 541} {"train_loss": -9.237112045288086, "global_step": 90911, "epoch": 541} {"train_loss": -8.836638450622559, "global_step": 90912, "epoch": 541} {"train_loss": -9.22143268585205, "global_step": 90913, "epoch": 541} {"train_loss": -9.252683639526367, "global_step": 90914, "epoch": 541} {"train_loss": -9.185111045837402, "global_step": 90915, "epoch": 541} {"train_loss": -9.084909439086914, "global_step": 90916, "epoch": 541} {"train_loss": -9.558847427368164, "global_step": 90917, "epoch": 541} {"train_loss": -9.449061393737793, "global_step": 90918, "epoch": 541} {"train_loss": -8.978556632995605, "global_step": 90919, "epoch": 541} {"train_loss": -9.304122924804688, "global_step": 90920, "epoch": 541} {"train_loss": -9.156035423278809, "global_step": 90921, "epoch": 541} {"train_loss": -9.492176055908203, "global_step": 90922, "epoch": 541} {"train_loss": -9.22810173034668, "global_step": 90923, "epoch": 541} {"train_loss": -9.49020004272461, "global_step": 90924, "epoch": 541} {"train_loss": -9.42888355255127, "global_step": 90925, "epoch": 541} {"train_loss": -9.361265182495117, "global_step": 90926, "epoch": 541} {"train_loss": -9.665781021118164, "global_step": 90927, "epoch": 541} {"train_loss": -9.454549789428711, "global_step": 90928, "epoch": 541} {"train_loss": -9.61874008178711, "global_step": 90929, "epoch": 541} {"train_loss": -9.562149047851562, "global_step": 90930, "epoch": 541} {"train_loss": -9.348916053771973, "global_step": 90931, "epoch": 541} {"train_loss": -9.480319023132324, "global_step": 90932, "epoch": 541} {"train_loss": -9.42906665802002, "global_step": 90933, "epoch": 541} {"train_loss": -9.45199203491211, "global_step": 90934, "epoch": 541} {"train_loss": -9.707599639892578, "global_step": 90935, "epoch": 541} {"train_loss": -9.560096740722656, "global_step": 90936, "epoch": 541} {"train_loss": -9.700576782226562, "global_step": 90937, "epoch": 541} {"train_loss": -9.503379821777344, "global_step": 90938, "epoch": 541} {"train_loss": -9.403119087219238, "global_step": 90939, "epoch": 541} {"train_loss": -9.353391647338867, "global_step": 90940, "epoch": 541} {"train_loss": -9.55328369140625, "global_step": 90941, "epoch": 541} {"train_loss": -9.487815856933594, "global_step": 90942, "epoch": 541} {"train_loss": -9.37654972076416, "global_step": 90943, "epoch": 541} {"train_loss": -9.687271118164062, "global_step": 90944, "epoch": 541} {"train_loss": -9.596967697143555, "global_step": 90945, "epoch": 541} {"train_loss": -9.274784088134766, "global_step": 90946, "epoch": 541} {"train_loss": -9.480815887451172, "global_step": 90947, "epoch": 541} {"train_loss": -9.581787109375, "global_step": 90948, "epoch": 541} {"train_loss": -9.784465789794922, "global_step": 90949, "epoch": 541} {"train_loss": -9.575885772705078, "global_step": 90950, "epoch": 541} {"train_loss": -9.566984176635742, "global_step": 90951, "epoch": 541} {"train_loss": -9.817415237426758, "global_step": 90952, "epoch": 541} {"train_loss": -9.664623260498047, "global_step": 90953, "epoch": 541} {"train_loss": -9.7244873046875, "global_step": 90954, "epoch": 541} {"train_loss": -9.627273559570312, "global_step": 90955, "epoch": 541} {"train_loss": -9.54172134399414, "global_step": 90956, "epoch": 541} {"train_loss": -9.312294960021973, "global_step": 90957, "epoch": 541} {"train_loss": -9.433330535888672, "global_step": 90958, "epoch": 541} {"train_loss": -9.28957748413086, "global_step": 90959, "epoch": 541} {"train_loss": -8.765668869018555, "global_step": 90960, "epoch": 541} {"train_loss": -9.506136894226074, "global_step": 90961, "epoch": 541} {"train_loss": -9.08614730834961, "global_step": 90962, "epoch": 541} {"train_loss": -9.466862678527832, "global_step": 90963, "epoch": 541} {"train_loss": -9.045149803161621, "global_step": 90964, "epoch": 541} {"train_loss": -9.386457443237305, "global_step": 90965, "epoch": 541} {"train_loss": -9.07618522644043, "global_step": 90966, "epoch": 541} {"train_loss": -9.338338851928711, "global_step": 90967, "epoch": 541} {"train_loss": -9.525237083435059, "global_step": 90968, "epoch": 541} {"train_loss": -9.377584457397461, "global_step": 90969, "epoch": 541} {"train_loss": -9.235508918762207, "global_step": 90970, "epoch": 541} {"train_loss": -9.307966232299805, "global_step": 90971, "epoch": 541} {"train_loss": -9.292888641357422, "global_step": 90972, "epoch": 541} {"train_loss": -9.600737571716309, "global_step": 90973, "epoch": 541} {"train_loss": -9.315967559814453, "global_step": 90974, "epoch": 541} {"train_loss": -9.406608581542969, "global_step": 90975, "epoch": 541} {"train_loss": -9.64077091217041, "global_step": 90976, "epoch": 541} {"train_loss": -9.419061660766602, "global_step": 90977, "epoch": 541} {"train_loss": -9.34803295135498, "global_step": 90978, "epoch": 541} {"train_loss": -9.248868942260742, "global_step": 90979, "epoch": 541} {"train_loss": -9.373191833496094, "global_step": 90980, "epoch": 541} {"train_loss": -9.266498565673828, "global_step": 90981, "epoch": 541} {"train_loss": -9.234783172607422, "global_step": 90982, "epoch": 541} {"train_loss": -9.935218811035156, "global_step": 90983, "epoch": 541} {"train_loss": -9.394548416137695, "global_step": 90984, "epoch": 541} {"train_loss": -9.63387680053711, "global_step": 90985, "epoch": 541} {"train_loss": -9.74464225769043, "global_step": 90986, "epoch": 541} {"train_loss": -9.383708000183105, "global_step": 90987, "epoch": 541} {"train_loss": -9.429752349853516, "global_step": 90988, "epoch": 541} {"train_loss": -9.48464584350586, "global_step": 90989, "epoch": 541} {"train_loss": -9.596817970275879, "global_step": 90990, "epoch": 541} {"train_loss": -9.593039512634277, "global_step": 90991, "epoch": 541} {"train_loss": -9.61259651184082, "global_step": 90992, "epoch": 541} {"train_loss": -9.571877479553223, "global_step": 90993, "epoch": 541} {"train_loss": -9.535058975219727, "global_step": 90994, "epoch": 541} {"train_loss": -9.635929107666016, "global_step": 90995, "epoch": 541} {"train_loss": -9.333694458007812, "global_step": 90996, "epoch": 541} {"train_loss": -9.517744064331055, "global_step": 90997, "epoch": 541} {"train_loss": -9.611551284790039, "global_step": 90998, "epoch": 541} {"train_loss": -9.699624061584473, "global_step": 90999, "epoch": 541} {"train_loss": -9.582504272460938, "global_step": 91000, "epoch": 541} {"train_loss": -9.681038856506348, "global_step": 91001, "epoch": 541} {"train_loss": -9.487616539001465, "global_step": 91002, "epoch": 541} {"train_loss": -9.591997146606445, "global_step": 91003, "epoch": 541} {"train_loss": -9.758630752563477, "global_step": 91004, "epoch": 541} {"train_loss": -9.305841445922852, "global_step": 91005, "epoch": 541} {"train_loss": -9.47430419921875, "global_step": 91006, "epoch": 541} {"train_loss": -9.458602905273438, "global_step": 91007, "epoch": 541} {"train_loss": -9.343648910522461, "global_step": 91008, "epoch": 541} {"train_loss": -9.701929092407227, "global_step": 91009, "epoch": 541} {"train_loss": -9.544754981994629, "global_step": 91010, "epoch": 541} {"train_loss": -9.425668716430664, "global_step": 91011, "epoch": 541} {"train_loss": -9.518218040466309, "global_step": 91012, "epoch": 541} {"train_loss": -9.511117935180664, "global_step": 91013, "epoch": 541} {"train_loss": -9.699670791625977, "global_step": 91014, "epoch": 541} {"train_loss": -9.387187957763672, "global_step": 91015, "epoch": 541} {"train_loss": -9.373785018920898, "global_step": 91016, "epoch": 541} {"train_loss": -9.583580017089844, "global_step": 91017, "epoch": 541} {"train_loss": -9.560039520263672, "global_step": 91018, "epoch": 541} {"train_loss": -9.15561294555664, "global_step": 91019, "epoch": 541} {"train_loss": -9.415546417236328, "global_step": 91020, "epoch": 541} {"train_loss": -9.448086738586426, "global_step": 91021, "epoch": 541} {"train_loss": -9.806368827819824, "global_step": 91022, "epoch": 541} {"train_loss": -9.679521560668945, "global_step": 91023, "epoch": 541} {"train_loss": -9.56871223449707, "global_step": 91024, "epoch": 541} {"train_loss": -9.652900695800781, "global_step": 91025, "epoch": 541} {"train_loss": -9.562952041625977, "global_step": 91026, "epoch": 541} {"train_loss": -9.345754623413086, "global_step": 91027, "epoch": 541} {"train_loss": -9.519002914428711, "global_step": 91028, "epoch": 541} {"train_loss": -9.511322021484375, "global_step": 91029, "epoch": 541} {"train_loss": -9.164127349853516, "global_step": 91030, "epoch": 541} {"train_loss": -9.399642944335938, "global_step": 91031, "epoch": 541} {"train_loss": -9.613672256469727, "global_step": 91032, "epoch": 541} {"train_loss": -9.201065063476562, "global_step": 91033, "epoch": 541} {"train_loss": -9.422950744628906, "global_step": 91034, "epoch": 541} {"train_loss": -9.337072372436523, "global_step": 91035, "epoch": 541} {"train_loss": -9.452231407165527, "global_step": 91036, "epoch": 541} {"train_loss": -9.466184616088867, "global_step": 91037, "epoch": 541} {"train_loss": -9.47627067565918, "global_step": 91038, "epoch": 541} {"train_loss": -9.290996551513672, "global_step": 91039, "epoch": 541} {"train_loss": -9.0940523147583, "global_step": 91040, "epoch": 541} {"train_loss": -9.368816375732422, "global_step": 91041, "epoch": 541} {"train_loss": -9.385814666748047, "global_step": 91042, "epoch": 541} {"train_loss": -9.56303596496582, "global_step": 91043, "epoch": 541} {"train_loss": -9.396543502807617, "global_step": 91044, "epoch": 541} {"train_loss": -9.439510345458984, "global_step": 91045, "epoch": 541} {"train_loss": -9.260249137878418, "global_step": 91046, "epoch": 541} {"train_loss": -9.560237884521484, "global_step": 91047, "epoch": 541} {"train_loss": -9.326421737670898, "global_step": 91048, "epoch": 541} {"train_loss": -9.521574020385742, "global_step": 91049, "epoch": 541} {"train_loss": -9.499082565307617, "global_step": 91050, "epoch": 541} {"train_loss": -9.514671325683594, "global_step": 91051, "epoch": 541} {"train_loss": -9.406577110290527, "global_step": 91052, "epoch": 541} {"train_loss": -9.454014778137207, "global_step": 91053, "epoch": 541} {"train_loss": -9.601760864257812, "global_step": 91054, "epoch": 541} {"train_loss": -9.438215340886797, "global_step": 91055, "epoch": 541, "val_loss": 200831.734375} {"train_loss": -9.638525009155273, "global_step": 91056, "epoch": 542} {"train_loss": -9.574249267578125, "global_step": 91057, "epoch": 542} {"train_loss": -9.493581771850586, "global_step": 91058, "epoch": 542} {"train_loss": -9.681449890136719, "global_step": 91059, "epoch": 542} {"train_loss": -9.341115951538086, "global_step": 91060, "epoch": 542} {"train_loss": -9.102373123168945, "global_step": 91061, "epoch": 542} {"train_loss": -9.628504753112793, "global_step": 91062, "epoch": 542} {"train_loss": -9.140294075012207, "global_step": 91063, "epoch": 542} {"train_loss": -9.503673553466797, "global_step": 91064, "epoch": 542} {"train_loss": -9.36799430847168, "global_step": 91065, "epoch": 542} {"train_loss": -9.48133659362793, "global_step": 91066, "epoch": 542} {"train_loss": -9.496014595031738, "global_step": 91067, "epoch": 542} {"train_loss": -9.47745132446289, "global_step": 91068, "epoch": 542} {"train_loss": -9.44609260559082, "global_step": 91069, "epoch": 542} {"train_loss": -9.54186725616455, "global_step": 91070, "epoch": 542} {"train_loss": -9.541955947875977, "global_step": 91071, "epoch": 542} {"train_loss": -9.457170486450195, "global_step": 91072, "epoch": 542} {"train_loss": -9.481414794921875, "global_step": 91073, "epoch": 542} {"train_loss": -9.702573776245117, "global_step": 91074, "epoch": 542} {"train_loss": -9.329719543457031, "global_step": 91075, "epoch": 542} {"train_loss": -9.321504592895508, "global_step": 91076, "epoch": 542} {"train_loss": -9.388065338134766, "global_step": 91077, "epoch": 542} {"train_loss": -9.327744483947754, "global_step": 91078, "epoch": 542} {"train_loss": -9.413018226623535, "global_step": 91079, "epoch": 542} {"train_loss": -9.636232376098633, "global_step": 91080, "epoch": 542} {"train_loss": -9.406192779541016, "global_step": 91081, "epoch": 542} {"train_loss": -9.134696960449219, "global_step": 91082, "epoch": 542} {"train_loss": -9.351905822753906, "global_step": 91083, "epoch": 542} {"train_loss": -9.146767616271973, "global_step": 91084, "epoch": 542} {"train_loss": -9.346158981323242, "global_step": 91085, "epoch": 542} {"train_loss": -8.929468154907227, "global_step": 91086, "epoch": 542} {"train_loss": -9.443151473999023, "global_step": 91087, "epoch": 542} {"train_loss": -9.047933578491211, "global_step": 91088, "epoch": 542} {"train_loss": -9.44896125793457, "global_step": 91089, "epoch": 542} {"train_loss": -9.173055648803711, "global_step": 91090, "epoch": 542} {"train_loss": -9.390079498291016, "global_step": 91091, "epoch": 542} {"train_loss": -9.039548873901367, "global_step": 91092, "epoch": 542} {"train_loss": -9.370382308959961, "global_step": 91093, "epoch": 542} {"train_loss": -9.160192489624023, "global_step": 91094, "epoch": 542} {"train_loss": -9.228267669677734, "global_step": 91095, "epoch": 542} {"train_loss": -8.99783706665039, "global_step": 91096, "epoch": 542} {"train_loss": -9.270376205444336, "global_step": 91097, "epoch": 542} {"train_loss": -9.123979568481445, "global_step": 91098, "epoch": 542} {"train_loss": -9.432872772216797, "global_step": 91099, "epoch": 542} {"train_loss": -9.369194030761719, "global_step": 91100, "epoch": 542} {"train_loss": -9.481505393981934, "global_step": 91101, "epoch": 542} {"train_loss": -9.464466094970703, "global_step": 91102, "epoch": 542} {"train_loss": -9.37990951538086, "global_step": 91103, "epoch": 542} {"train_loss": -9.503536224365234, "global_step": 91104, "epoch": 542} {"train_loss": -9.279735565185547, "global_step": 91105, "epoch": 542} {"train_loss": -9.6379976272583, "global_step": 91106, "epoch": 542} {"train_loss": -9.597980499267578, "global_step": 91107, "epoch": 542} {"train_loss": -9.557676315307617, "global_step": 91108, "epoch": 542} {"train_loss": -9.610212326049805, "global_step": 91109, "epoch": 542} {"train_loss": -9.437261581420898, "global_step": 91110, "epoch": 542} {"train_loss": -9.416082382202148, "global_step": 91111, "epoch": 542} {"train_loss": -9.564458847045898, "global_step": 91112, "epoch": 542} {"train_loss": -9.44747543334961, "global_step": 91113, "epoch": 542} {"train_loss": -9.746674537658691, "global_step": 91114, "epoch": 542} {"train_loss": -9.680503845214844, "global_step": 91115, "epoch": 542} {"train_loss": -9.697559356689453, "global_step": 91116, "epoch": 542} {"train_loss": -9.665327072143555, "global_step": 91117, "epoch": 542} {"train_loss": -9.509243965148926, "global_step": 91118, "epoch": 542} {"train_loss": -9.820075035095215, "global_step": 91119, "epoch": 542} {"train_loss": -9.493154525756836, "global_step": 91120, "epoch": 542} {"train_loss": -9.468925476074219, "global_step": 91121, "epoch": 542} {"train_loss": -9.527244567871094, "global_step": 91122, "epoch": 542} {"train_loss": -9.074738502502441, "global_step": 91123, "epoch": 542} {"train_loss": -9.539426803588867, "global_step": 91124, "epoch": 542} {"train_loss": -9.309234619140625, "global_step": 91125, "epoch": 542} {"train_loss": -9.27518081665039, "global_step": 91126, "epoch": 542} {"train_loss": -9.543123245239258, "global_step": 91127, "epoch": 542} {"train_loss": -9.279474258422852, "global_step": 91128, "epoch": 542} {"train_loss": -9.538763046264648, "global_step": 91129, "epoch": 542} {"train_loss": -9.420289993286133, "global_step": 91130, "epoch": 542} {"train_loss": -9.193368911743164, "global_step": 91131, "epoch": 542} {"train_loss": -9.614553451538086, "global_step": 91132, "epoch": 542} {"train_loss": -9.638108253479004, "global_step": 91133, "epoch": 542} {"train_loss": -9.413593292236328, "global_step": 91134, "epoch": 542} {"train_loss": -9.193435668945312, "global_step": 91135, "epoch": 542} {"train_loss": -9.333386421203613, "global_step": 91136, "epoch": 542} {"train_loss": -9.140544891357422, "global_step": 91137, "epoch": 542} {"train_loss": -9.451879501342773, "global_step": 91138, "epoch": 542} {"train_loss": -9.38633918762207, "global_step": 91139, "epoch": 542} {"train_loss": -9.458131790161133, "global_step": 91140, "epoch": 542} {"train_loss": -9.296931266784668, "global_step": 91141, "epoch": 542} {"train_loss": -9.282590866088867, "global_step": 91142, "epoch": 542} {"train_loss": -9.020252227783203, "global_step": 91143, "epoch": 542} {"train_loss": -9.565631866455078, "global_step": 91144, "epoch": 542} {"train_loss": -9.311308860778809, "global_step": 91145, "epoch": 542} {"train_loss": -9.514795303344727, "global_step": 91146, "epoch": 542} {"train_loss": -9.486313819885254, "global_step": 91147, "epoch": 542} {"train_loss": -9.579856872558594, "global_step": 91148, "epoch": 542} {"train_loss": -9.402375221252441, "global_step": 91149, "epoch": 542} {"train_loss": -9.551471710205078, "global_step": 91150, "epoch": 542} {"train_loss": -9.57204818725586, "global_step": 91151, "epoch": 542} {"train_loss": -9.393534660339355, "global_step": 91152, "epoch": 542} {"train_loss": -9.420886993408203, "global_step": 91153, "epoch": 542} {"train_loss": -9.419532775878906, "global_step": 91154, "epoch": 542} {"train_loss": -9.14209270477295, "global_step": 91155, "epoch": 542} {"train_loss": -9.441530227661133, "global_step": 91156, "epoch": 542} {"train_loss": -9.360307693481445, "global_step": 91157, "epoch": 542} {"train_loss": -9.611202239990234, "global_step": 91158, "epoch": 542} {"train_loss": -9.288101196289062, "global_step": 91159, "epoch": 542} {"train_loss": -9.431428909301758, "global_step": 91160, "epoch": 542} {"train_loss": -9.616472244262695, "global_step": 91161, "epoch": 542} {"train_loss": -9.419902801513672, "global_step": 91162, "epoch": 542} {"train_loss": -9.35639762878418, "global_step": 91163, "epoch": 542} {"train_loss": -9.246356010437012, "global_step": 91164, "epoch": 542} {"train_loss": -9.182104110717773, "global_step": 91165, "epoch": 542} {"train_loss": -9.283915519714355, "global_step": 91166, "epoch": 542} {"train_loss": -9.272859573364258, "global_step": 91167, "epoch": 542} {"train_loss": -9.393035888671875, "global_step": 91168, "epoch": 542} {"train_loss": -9.808608055114746, "global_step": 91169, "epoch": 542} {"train_loss": -9.488399505615234, "global_step": 91170, "epoch": 542} {"train_loss": -9.639663696289062, "global_step": 91171, "epoch": 542} {"train_loss": -9.486577987670898, "global_step": 91172, "epoch": 542} {"train_loss": -9.711164474487305, "global_step": 91173, "epoch": 542} {"train_loss": -9.49520492553711, "global_step": 91174, "epoch": 542} {"train_loss": -9.706961631774902, "global_step": 91175, "epoch": 542} {"train_loss": -9.455875396728516, "global_step": 91176, "epoch": 542} {"train_loss": -9.663900375366211, "global_step": 91177, "epoch": 542} {"train_loss": -9.423904418945312, "global_step": 91178, "epoch": 542} {"train_loss": -9.502087593078613, "global_step": 91179, "epoch": 542} {"train_loss": -9.476615905761719, "global_step": 91180, "epoch": 542} {"train_loss": -9.582072257995605, "global_step": 91181, "epoch": 542} {"train_loss": -9.36466121673584, "global_step": 91182, "epoch": 542} {"train_loss": -9.479253768920898, "global_step": 91183, "epoch": 542} {"train_loss": -9.799052238464355, "global_step": 91184, "epoch": 542} {"train_loss": -9.663604736328125, "global_step": 91185, "epoch": 542} {"train_loss": -9.644512176513672, "global_step": 91186, "epoch": 542} {"train_loss": -9.613064765930176, "global_step": 91187, "epoch": 542} {"train_loss": -9.332149505615234, "global_step": 91188, "epoch": 542} {"train_loss": -9.538673400878906, "global_step": 91189, "epoch": 542} {"train_loss": -9.623714447021484, "global_step": 91190, "epoch": 542} {"train_loss": -9.479708671569824, "global_step": 91191, "epoch": 542} {"train_loss": -9.553247451782227, "global_step": 91192, "epoch": 542} {"train_loss": -9.78626537322998, "global_step": 91193, "epoch": 542} {"train_loss": -9.48119831085205, "global_step": 91194, "epoch": 542} {"train_loss": -9.910510063171387, "global_step": 91195, "epoch": 542} {"train_loss": -9.533554077148438, "global_step": 91196, "epoch": 542} {"train_loss": -9.502412796020508, "global_step": 91197, "epoch": 542} {"train_loss": -9.639835357666016, "global_step": 91198, "epoch": 542} {"train_loss": -9.467597961425781, "global_step": 91199, "epoch": 542} {"train_loss": -9.566322326660156, "global_step": 91200, "epoch": 542} {"train_loss": -9.358442306518555, "global_step": 91201, "epoch": 542} {"train_loss": -9.049156188964844, "global_step": 91202, "epoch": 542} {"train_loss": -9.661277770996094, "global_step": 91203, "epoch": 542} {"train_loss": -9.544790267944336, "global_step": 91204, "epoch": 542} {"train_loss": -9.484647750854492, "global_step": 91205, "epoch": 542} {"train_loss": -9.366628646850586, "global_step": 91206, "epoch": 542} {"train_loss": -9.775545120239258, "global_step": 91207, "epoch": 542} {"train_loss": -9.221637725830078, "global_step": 91208, "epoch": 542} {"train_loss": -9.550945281982422, "global_step": 91209, "epoch": 542} {"train_loss": -9.483765602111816, "global_step": 91210, "epoch": 542} {"train_loss": -9.326675415039062, "global_step": 91211, "epoch": 542} {"train_loss": -9.411272048950195, "global_step": 91212, "epoch": 542} {"train_loss": -9.54500961303711, "global_step": 91213, "epoch": 542} {"train_loss": -9.387639999389648, "global_step": 91214, "epoch": 542} {"train_loss": -9.630205154418945, "global_step": 91215, "epoch": 542} {"train_loss": -9.510845184326172, "global_step": 91216, "epoch": 542} {"train_loss": -9.379441261291504, "global_step": 91217, "epoch": 542} {"train_loss": -9.337690353393555, "global_step": 91218, "epoch": 542} {"train_loss": -9.389724731445312, "global_step": 91219, "epoch": 542} {"train_loss": -9.188015937805176, "global_step": 91220, "epoch": 542} {"train_loss": -9.287208557128906, "global_step": 91221, "epoch": 542} {"train_loss": -9.257339477539062, "global_step": 91222, "epoch": 542} {"train_loss": -9.438002223060245, "global_step": 91223, "epoch": 542, "val_loss": 202623.0} {"train_loss": -9.490182876586914, "global_step": 91224, "epoch": 543} {"train_loss": -9.63049030303955, "global_step": 91225, "epoch": 543} {"train_loss": -9.495159149169922, "global_step": 91226, "epoch": 543} {"train_loss": -9.738744735717773, "global_step": 91227, "epoch": 543} {"train_loss": -9.360902786254883, "global_step": 91228, "epoch": 543} {"train_loss": -9.25650405883789, "global_step": 91229, "epoch": 543} {"train_loss": -9.432247161865234, "global_step": 91230, "epoch": 543} {"train_loss": -8.783448219299316, "global_step": 91231, "epoch": 543} {"train_loss": -9.517461776733398, "global_step": 91232, "epoch": 543} {"train_loss": -9.305375099182129, "global_step": 91233, "epoch": 543} {"train_loss": -9.3302583694458, "global_step": 91234, "epoch": 543} {"train_loss": -9.360027313232422, "global_step": 91235, "epoch": 543} {"train_loss": -9.299152374267578, "global_step": 91236, "epoch": 543} {"train_loss": -9.118009567260742, "global_step": 91237, "epoch": 543} {"train_loss": -9.331350326538086, "global_step": 91238, "epoch": 543} {"train_loss": -9.368572235107422, "global_step": 91239, "epoch": 543} {"train_loss": -9.338296890258789, "global_step": 91240, "epoch": 543} {"train_loss": -9.528343200683594, "global_step": 91241, "epoch": 543} {"train_loss": -9.308284759521484, "global_step": 91242, "epoch": 543} {"train_loss": -9.292160034179688, "global_step": 91243, "epoch": 543} {"train_loss": -9.438180923461914, "global_step": 91244, "epoch": 543} {"train_loss": -8.589192390441895, "global_step": 91245, "epoch": 543} {"train_loss": -9.385246276855469, "global_step": 91246, "epoch": 543} {"train_loss": -8.614940643310547, "global_step": 91247, "epoch": 543} {"train_loss": -9.555242538452148, "global_step": 91248, "epoch": 543} {"train_loss": -9.057170867919922, "global_step": 91249, "epoch": 543} {"train_loss": -9.181827545166016, "global_step": 91250, "epoch": 543} {"train_loss": -9.022544860839844, "global_step": 91251, "epoch": 543} {"train_loss": -9.339598655700684, "global_step": 91252, "epoch": 543} {"train_loss": -9.190333366394043, "global_step": 91253, "epoch": 543} {"train_loss": -9.203774452209473, "global_step": 91254, "epoch": 543} {"train_loss": -9.369885444641113, "global_step": 91255, "epoch": 543} {"train_loss": -9.223209381103516, "global_step": 91256, "epoch": 543} {"train_loss": -9.284461975097656, "global_step": 91257, "epoch": 543} {"train_loss": -9.10533332824707, "global_step": 91258, "epoch": 543} {"train_loss": -9.201122283935547, "global_step": 91259, "epoch": 543} {"train_loss": -9.110710144042969, "global_step": 91260, "epoch": 543} {"train_loss": -9.34294319152832, "global_step": 91261, "epoch": 543} {"train_loss": -9.404494285583496, "global_step": 91262, "epoch": 543} {"train_loss": -9.569164276123047, "global_step": 91263, "epoch": 543} {"train_loss": -9.368902206420898, "global_step": 91264, "epoch": 543} {"train_loss": -9.640134811401367, "global_step": 91265, "epoch": 543} {"train_loss": -9.474058151245117, "global_step": 91266, "epoch": 543} {"train_loss": -9.599088668823242, "global_step": 91267, "epoch": 543} {"train_loss": -9.569397926330566, "global_step": 91268, "epoch": 543} {"train_loss": -9.645185470581055, "global_step": 91269, "epoch": 543} {"train_loss": -9.216180801391602, "global_step": 91270, "epoch": 543} {"train_loss": -9.481504440307617, "global_step": 91271, "epoch": 543} {"train_loss": -9.642175674438477, "global_step": 91272, "epoch": 543} {"train_loss": -9.389997482299805, "global_step": 91273, "epoch": 543} {"train_loss": -9.271195411682129, "global_step": 91274, "epoch": 543} {"train_loss": -9.481205940246582, "global_step": 91275, "epoch": 543} {"train_loss": -9.254298210144043, "global_step": 91276, "epoch": 543} {"train_loss": -9.54001235961914, "global_step": 91277, "epoch": 543} {"train_loss": -9.743379592895508, "global_step": 91278, "epoch": 543} {"train_loss": -9.583686828613281, "global_step": 91279, "epoch": 543} {"train_loss": -9.475713729858398, "global_step": 91280, "epoch": 543} {"train_loss": -9.678449630737305, "global_step": 91281, "epoch": 543} {"train_loss": -9.498889923095703, "global_step": 91282, "epoch": 543} {"train_loss": -9.693709373474121, "global_step": 91283, "epoch": 543} {"train_loss": -9.718037605285645, "global_step": 91284, "epoch": 543} {"train_loss": -9.59241008758545, "global_step": 91285, "epoch": 543} {"train_loss": -9.745262145996094, "global_step": 91286, "epoch": 543} {"train_loss": -9.788573265075684, "global_step": 91287, "epoch": 543} {"train_loss": -9.25827407836914, "global_step": 91288, "epoch": 543} {"train_loss": -9.618532180786133, "global_step": 91289, "epoch": 543} {"train_loss": -9.495962142944336, "global_step": 91290, "epoch": 543} {"train_loss": -9.808100700378418, "global_step": 91291, "epoch": 543} {"train_loss": -9.210836410522461, "global_step": 91292, "epoch": 543} {"train_loss": -8.939773559570312, "global_step": 91293, "epoch": 543} {"train_loss": -9.441656112670898, "global_step": 91294, "epoch": 543} {"train_loss": -9.271476745605469, "global_step": 91295, "epoch": 543} {"train_loss": -9.144956588745117, "global_step": 91296, "epoch": 543} {"train_loss": -9.322704315185547, "global_step": 91297, "epoch": 543} {"train_loss": -9.448958396911621, "global_step": 91298, "epoch": 543} {"train_loss": -9.414863586425781, "global_step": 91299, "epoch": 543} {"train_loss": -9.340188980102539, "global_step": 91300, "epoch": 543} {"train_loss": -9.660943031311035, "global_step": 91301, "epoch": 543} {"train_loss": -9.314952850341797, "global_step": 91302, "epoch": 543} {"train_loss": -9.653014183044434, "global_step": 91303, "epoch": 543} {"train_loss": -9.537195205688477, "global_step": 91304, "epoch": 543} {"train_loss": -9.660823822021484, "global_step": 91305, "epoch": 543} {"train_loss": -9.440372467041016, "global_step": 91306, "epoch": 543} {"train_loss": -9.561224937438965, "global_step": 91307, "epoch": 543} {"train_loss": -9.283744812011719, "global_step": 91308, "epoch": 543} {"train_loss": -9.304019927978516, "global_step": 91309, "epoch": 543} {"train_loss": -9.591835021972656, "global_step": 91310, "epoch": 543} {"train_loss": -9.583918571472168, "global_step": 91311, "epoch": 543} {"train_loss": -9.405008316040039, "global_step": 91312, "epoch": 543} {"train_loss": -9.412081718444824, "global_step": 91313, "epoch": 543} {"train_loss": -8.901487350463867, "global_step": 91314, "epoch": 543} {"train_loss": -9.175710678100586, "global_step": 91315, "epoch": 543} {"train_loss": -9.205087661743164, "global_step": 91316, "epoch": 543} {"train_loss": -9.307968139648438, "global_step": 91317, "epoch": 543} {"train_loss": -9.391512870788574, "global_step": 91318, "epoch": 543} {"train_loss": -8.80830192565918, "global_step": 91319, "epoch": 543} {"train_loss": -9.493106842041016, "global_step": 91320, "epoch": 543} {"train_loss": -9.077967643737793, "global_step": 91321, "epoch": 543} {"train_loss": -9.458293914794922, "global_step": 91322, "epoch": 543} {"train_loss": -9.273628234863281, "global_step": 91323, "epoch": 543} {"train_loss": -9.592832565307617, "global_step": 91324, "epoch": 543} {"train_loss": -9.348163604736328, "global_step": 91325, "epoch": 543} {"train_loss": -9.41370677947998, "global_step": 91326, "epoch": 543} {"train_loss": -9.584244728088379, "global_step": 91327, "epoch": 543} {"train_loss": -9.489867210388184, "global_step": 91328, "epoch": 543} {"train_loss": -9.358024597167969, "global_step": 91329, "epoch": 543} {"train_loss": -9.446574211120605, "global_step": 91330, "epoch": 543} {"train_loss": -9.3975830078125, "global_step": 91331, "epoch": 543} {"train_loss": -9.609712600708008, "global_step": 91332, "epoch": 543} {"train_loss": -9.585566520690918, "global_step": 91333, "epoch": 543} {"train_loss": -9.519904136657715, "global_step": 91334, "epoch": 543} {"train_loss": -9.523921966552734, "global_step": 91335, "epoch": 543} {"train_loss": -9.498132705688477, "global_step": 91336, "epoch": 543} {"train_loss": -9.355571746826172, "global_step": 91337, "epoch": 543} {"train_loss": -9.350695610046387, "global_step": 91338, "epoch": 543} {"train_loss": -9.357816696166992, "global_step": 91339, "epoch": 543} {"train_loss": -9.584833145141602, "global_step": 91340, "epoch": 543} {"train_loss": -9.564006805419922, "global_step": 91341, "epoch": 543} {"train_loss": -9.531635284423828, "global_step": 91342, "epoch": 543} {"train_loss": -9.67910385131836, "global_step": 91343, "epoch": 543} {"train_loss": -9.455971717834473, "global_step": 91344, "epoch": 543} {"train_loss": -9.658458709716797, "global_step": 91345, "epoch": 543} {"train_loss": -9.34823226928711, "global_step": 91346, "epoch": 543} {"train_loss": -9.786507606506348, "global_step": 91347, "epoch": 543} {"train_loss": -9.628419876098633, "global_step": 91348, "epoch": 543} {"train_loss": -9.542646408081055, "global_step": 91349, "epoch": 543} {"train_loss": -9.56812572479248, "global_step": 91350, "epoch": 543} {"train_loss": -9.600844383239746, "global_step": 91351, "epoch": 543} {"train_loss": -9.592487335205078, "global_step": 91352, "epoch": 543} {"train_loss": -9.538400650024414, "global_step": 91353, "epoch": 543} {"train_loss": -9.71367073059082, "global_step": 91354, "epoch": 543} {"train_loss": -9.533162117004395, "global_step": 91355, "epoch": 543} {"train_loss": -9.131601333618164, "global_step": 91356, "epoch": 543} {"train_loss": -9.235307693481445, "global_step": 91357, "epoch": 543} {"train_loss": -9.196349143981934, "global_step": 91358, "epoch": 543} {"train_loss": -9.243295669555664, "global_step": 91359, "epoch": 543} {"train_loss": -9.139741897583008, "global_step": 91360, "epoch": 543} {"train_loss": -9.161384582519531, "global_step": 91361, "epoch": 543} {"train_loss": -9.234055519104004, "global_step": 91362, "epoch": 543} {"train_loss": -9.303057670593262, "global_step": 91363, "epoch": 543} {"train_loss": -9.218629837036133, "global_step": 91364, "epoch": 543} {"train_loss": -9.017730712890625, "global_step": 91365, "epoch": 543} {"train_loss": -9.032203674316406, "global_step": 91366, "epoch": 543} {"train_loss": -9.249078750610352, "global_step": 91367, "epoch": 543} {"train_loss": -9.176589965820312, "global_step": 91368, "epoch": 543} {"train_loss": -9.1495361328125, "global_step": 91369, "epoch": 543} {"train_loss": -9.198344230651855, "global_step": 91370, "epoch": 543} {"train_loss": -9.115211486816406, "global_step": 91371, "epoch": 543} {"train_loss": -9.406278610229492, "global_step": 91372, "epoch": 543} {"train_loss": -9.234033584594727, "global_step": 91373, "epoch": 543} {"train_loss": -9.649650573730469, "global_step": 91374, "epoch": 543} {"train_loss": -9.460322380065918, "global_step": 91375, "epoch": 543} {"train_loss": -9.501750946044922, "global_step": 91376, "epoch": 543} {"train_loss": -9.575488090515137, "global_step": 91377, "epoch": 543} {"train_loss": -9.518192291259766, "global_step": 91378, "epoch": 543} {"train_loss": -9.44788646697998, "global_step": 91379, "epoch": 543} {"train_loss": -9.708868026733398, "global_step": 91380, "epoch": 543} {"train_loss": -9.297246932983398, "global_step": 91381, "epoch": 543} {"train_loss": -9.682315826416016, "global_step": 91382, "epoch": 543} {"train_loss": -9.81607437133789, "global_step": 91383, "epoch": 543} {"train_loss": -9.463264465332031, "global_step": 91384, "epoch": 543} {"train_loss": -9.726696014404297, "global_step": 91385, "epoch": 543} {"train_loss": -9.62095832824707, "global_step": 91386, "epoch": 543} {"train_loss": -9.499471664428711, "global_step": 91387, "epoch": 543} {"train_loss": -9.60501480102539, "global_step": 91388, "epoch": 543} {"train_loss": -9.62165641784668, "global_step": 91389, "epoch": 543} {"train_loss": -9.612190246582031, "global_step": 91390, "epoch": 543} {"train_loss": -9.407929000400362, "global_step": 91391, "epoch": 543, "val_loss": 202168.609375} {"train_loss": -9.625377655029297, "global_step": 91392, "epoch": 544} {"train_loss": -9.781652450561523, "global_step": 91393, "epoch": 544} {"train_loss": -9.401748657226562, "global_step": 91394, "epoch": 544} {"train_loss": -9.340063095092773, "global_step": 91395, "epoch": 544} {"train_loss": -9.697803497314453, "global_step": 91396, "epoch": 544} {"train_loss": -9.454277038574219, "global_step": 91397, "epoch": 544} {"train_loss": -9.541753768920898, "global_step": 91398, "epoch": 544} {"train_loss": -9.540435791015625, "global_step": 91399, "epoch": 544} {"train_loss": -9.352148056030273, "global_step": 91400, "epoch": 544} {"train_loss": -9.629788398742676, "global_step": 91401, "epoch": 544} {"train_loss": -9.398088455200195, "global_step": 91402, "epoch": 544} {"train_loss": -9.136283874511719, "global_step": 91403, "epoch": 544} {"train_loss": -9.419838905334473, "global_step": 91404, "epoch": 544} {"train_loss": -9.232172012329102, "global_step": 91405, "epoch": 544} {"train_loss": -9.206669807434082, "global_step": 91406, "epoch": 544} {"train_loss": -9.228687286376953, "global_step": 91407, "epoch": 544} {"train_loss": -8.835790634155273, "global_step": 91408, "epoch": 544} {"train_loss": -8.58746337890625, "global_step": 91409, "epoch": 544} {"train_loss": -9.112276077270508, "global_step": 91410, "epoch": 544} {"train_loss": -8.437966346740723, "global_step": 91411, "epoch": 544} {"train_loss": -8.552032470703125, "global_step": 91412, "epoch": 544} {"train_loss": -8.929128646850586, "global_step": 91413, "epoch": 544} {"train_loss": -8.628290176391602, "global_step": 91414, "epoch": 544} {"train_loss": -8.642194747924805, "global_step": 91415, "epoch": 544} {"train_loss": -9.128129959106445, "global_step": 91416, "epoch": 544} {"train_loss": -8.778092384338379, "global_step": 91417, "epoch": 544} {"train_loss": -9.107696533203125, "global_step": 91418, "epoch": 544} {"train_loss": -8.882457733154297, "global_step": 91419, "epoch": 544} {"train_loss": -8.941194534301758, "global_step": 91420, "epoch": 544} {"train_loss": -9.25598430633545, "global_step": 91421, "epoch": 544} {"train_loss": -8.983346939086914, "global_step": 91422, "epoch": 544} {"train_loss": -8.730880737304688, "global_step": 91423, "epoch": 544} {"train_loss": -9.143861770629883, "global_step": 91424, "epoch": 544} {"train_loss": -8.988224029541016, "global_step": 91425, "epoch": 544} {"train_loss": -9.21503734588623, "global_step": 91426, "epoch": 544} {"train_loss": -9.091012954711914, "global_step": 91427, "epoch": 544} {"train_loss": -8.93520450592041, "global_step": 91428, "epoch": 544} {"train_loss": -9.095091819763184, "global_step": 91429, "epoch": 544} {"train_loss": -9.371232986450195, "global_step": 91430, "epoch": 544} {"train_loss": -9.37038803100586, "global_step": 91431, "epoch": 544} {"train_loss": -9.229301452636719, "global_step": 91432, "epoch": 544} {"train_loss": -9.3301420211792, "global_step": 91433, "epoch": 544} {"train_loss": -9.208126068115234, "global_step": 91434, "epoch": 544} {"train_loss": -9.198844909667969, "global_step": 91435, "epoch": 544} {"train_loss": -9.584878921508789, "global_step": 91436, "epoch": 544} {"train_loss": -9.243436813354492, "global_step": 91437, "epoch": 544} {"train_loss": -9.289287567138672, "global_step": 91438, "epoch": 544} {"train_loss": -9.611486434936523, "global_step": 91439, "epoch": 544} {"train_loss": -9.458553314208984, "global_step": 91440, "epoch": 544} {"train_loss": -9.375301361083984, "global_step": 91441, "epoch": 544} {"train_loss": -9.55418872833252, "global_step": 91442, "epoch": 544} {"train_loss": -9.544906616210938, "global_step": 91443, "epoch": 544} {"train_loss": -9.644736289978027, "global_step": 91444, "epoch": 544} {"train_loss": -9.773637771606445, "global_step": 91445, "epoch": 544} {"train_loss": -9.57126235961914, "global_step": 91446, "epoch": 544} {"train_loss": -9.522665023803711, "global_step": 91447, "epoch": 544} {"train_loss": -9.708353042602539, "global_step": 91448, "epoch": 544} {"train_loss": -9.736273765563965, "global_step": 91449, "epoch": 544} {"train_loss": -9.640949249267578, "global_step": 91450, "epoch": 544} {"train_loss": -9.673998832702637, "global_step": 91451, "epoch": 544} {"train_loss": -9.554277420043945, "global_step": 91452, "epoch": 544} {"train_loss": -9.216407775878906, "global_step": 91453, "epoch": 544} {"train_loss": -9.611178398132324, "global_step": 91454, "epoch": 544} {"train_loss": -9.489383697509766, "global_step": 91455, "epoch": 544} {"train_loss": -9.660618782043457, "global_step": 91456, "epoch": 544} {"train_loss": -9.587881088256836, "global_step": 91457, "epoch": 544} {"train_loss": -9.461770057678223, "global_step": 91458, "epoch": 544} {"train_loss": -9.8285551071167, "global_step": 91459, "epoch": 544} {"train_loss": -9.443066596984863, "global_step": 91460, "epoch": 544} {"train_loss": -9.487455368041992, "global_step": 91461, "epoch": 544} {"train_loss": -9.514093399047852, "global_step": 91462, "epoch": 544} {"train_loss": -9.69562816619873, "global_step": 91463, "epoch": 544} {"train_loss": -9.557646751403809, "global_step": 91464, "epoch": 544} {"train_loss": -9.375696182250977, "global_step": 91465, "epoch": 544} {"train_loss": -9.429208755493164, "global_step": 91466, "epoch": 544} {"train_loss": -9.436531066894531, "global_step": 91467, "epoch": 544} {"train_loss": -9.012418746948242, "global_step": 91468, "epoch": 544} {"train_loss": -9.662564277648926, "global_step": 91469, "epoch": 544} {"train_loss": -9.435474395751953, "global_step": 91470, "epoch": 544} {"train_loss": -9.374359130859375, "global_step": 91471, "epoch": 544} {"train_loss": -9.612255096435547, "global_step": 91472, "epoch": 544} {"train_loss": -9.615026473999023, "global_step": 91473, "epoch": 544} {"train_loss": -9.494438171386719, "global_step": 91474, "epoch": 544} {"train_loss": -9.372626304626465, "global_step": 91475, "epoch": 544} {"train_loss": -9.505155563354492, "global_step": 91476, "epoch": 544} {"train_loss": -9.51703929901123, "global_step": 91477, "epoch": 544} {"train_loss": -9.591691970825195, "global_step": 91478, "epoch": 544} {"train_loss": -9.654071807861328, "global_step": 91479, "epoch": 544} {"train_loss": -9.580024719238281, "global_step": 91480, "epoch": 544} {"train_loss": -9.64686393737793, "global_step": 91481, "epoch": 544} {"train_loss": -9.710868835449219, "global_step": 91482, "epoch": 544} {"train_loss": -9.705495834350586, "global_step": 91483, "epoch": 544} {"train_loss": -9.162301063537598, "global_step": 91484, "epoch": 544} {"train_loss": -9.181310653686523, "global_step": 91485, "epoch": 544} {"train_loss": -9.486028671264648, "global_step": 91486, "epoch": 544} {"train_loss": -9.379493713378906, "global_step": 91487, "epoch": 544} {"train_loss": -9.303071975708008, "global_step": 91488, "epoch": 544} {"train_loss": -9.334981918334961, "global_step": 91489, "epoch": 544} {"train_loss": -9.452911376953125, "global_step": 91490, "epoch": 544} {"train_loss": -9.220365524291992, "global_step": 91491, "epoch": 544} {"train_loss": -9.2058744430542, "global_step": 91492, "epoch": 544} {"train_loss": -9.272836685180664, "global_step": 91493, "epoch": 544} {"train_loss": -9.138349533081055, "global_step": 91494, "epoch": 544} {"train_loss": -9.482856750488281, "global_step": 91495, "epoch": 544} {"train_loss": -9.085457801818848, "global_step": 91496, "epoch": 544} {"train_loss": -9.266976356506348, "global_step": 91497, "epoch": 544} {"train_loss": -9.316632270812988, "global_step": 91498, "epoch": 544} {"train_loss": -9.1483154296875, "global_step": 91499, "epoch": 544} {"train_loss": -9.167160987854004, "global_step": 91500, "epoch": 544} {"train_loss": -9.292179107666016, "global_step": 91501, "epoch": 544} {"train_loss": -9.356329917907715, "global_step": 91502, "epoch": 544} {"train_loss": -9.414045333862305, "global_step": 91503, "epoch": 544} {"train_loss": -9.467596054077148, "global_step": 91504, "epoch": 544} {"train_loss": -9.324057579040527, "global_step": 91505, "epoch": 544} {"train_loss": -9.373918533325195, "global_step": 91506, "epoch": 544} {"train_loss": -9.445268630981445, "global_step": 91507, "epoch": 544} {"train_loss": -9.600244522094727, "global_step": 91508, "epoch": 544} {"train_loss": -9.410524368286133, "global_step": 91509, "epoch": 544} {"train_loss": -9.628461837768555, "global_step": 91510, "epoch": 544} {"train_loss": -9.652853965759277, "global_step": 91511, "epoch": 544} {"train_loss": -9.529090881347656, "global_step": 91512, "epoch": 544} {"train_loss": -9.543652534484863, "global_step": 91513, "epoch": 544} {"train_loss": -9.453115463256836, "global_step": 91514, "epoch": 544} {"train_loss": -9.703226089477539, "global_step": 91515, "epoch": 544} {"train_loss": -9.698465347290039, "global_step": 91516, "epoch": 544} {"train_loss": -9.697513580322266, "global_step": 91517, "epoch": 544} {"train_loss": -9.503369331359863, "global_step": 91518, "epoch": 544} {"train_loss": -9.551514625549316, "global_step": 91519, "epoch": 544} {"train_loss": -9.671367645263672, "global_step": 91520, "epoch": 544} {"train_loss": -9.659994125366211, "global_step": 91521, "epoch": 544} {"train_loss": -9.255739212036133, "global_step": 91522, "epoch": 544} {"train_loss": -9.495796203613281, "global_step": 91523, "epoch": 544} {"train_loss": -9.387613296508789, "global_step": 91524, "epoch": 544} {"train_loss": -9.432181358337402, "global_step": 91525, "epoch": 544} {"train_loss": -9.48938274383545, "global_step": 91526, "epoch": 544} {"train_loss": -9.491281509399414, "global_step": 91527, "epoch": 544} {"train_loss": -9.499811172485352, "global_step": 91528, "epoch": 544} {"train_loss": -9.587084770202637, "global_step": 91529, "epoch": 544} {"train_loss": -9.296168327331543, "global_step": 91530, "epoch": 544} {"train_loss": -9.347092628479004, "global_step": 91531, "epoch": 544} {"train_loss": -9.300893783569336, "global_step": 91532, "epoch": 544} {"train_loss": -9.36202621459961, "global_step": 91533, "epoch": 544} {"train_loss": -9.425539016723633, "global_step": 91534, "epoch": 544} {"train_loss": -9.547750473022461, "global_step": 91535, "epoch": 544} {"train_loss": -9.397369384765625, "global_step": 91536, "epoch": 544} {"train_loss": -9.546113014221191, "global_step": 91537, "epoch": 544} {"train_loss": -9.611991882324219, "global_step": 91538, "epoch": 544} {"train_loss": -9.598638534545898, "global_step": 91539, "epoch": 544} {"train_loss": -9.59184455871582, "global_step": 91540, "epoch": 544} {"train_loss": -9.687559127807617, "global_step": 91541, "epoch": 544} {"train_loss": -9.389341354370117, "global_step": 91542, "epoch": 544} {"train_loss": -9.614029884338379, "global_step": 91543, "epoch": 544} {"train_loss": -9.600810050964355, "global_step": 91544, "epoch": 544} {"train_loss": -9.705883026123047, "global_step": 91545, "epoch": 544} {"train_loss": -9.658018112182617, "global_step": 91546, "epoch": 544} {"train_loss": -9.457379341125488, "global_step": 91547, "epoch": 544} {"train_loss": -9.758649826049805, "global_step": 91548, "epoch": 544} {"train_loss": -9.584793090820312, "global_step": 91549, "epoch": 544} {"train_loss": -9.661958694458008, "global_step": 91550, "epoch": 544} {"train_loss": -9.776070594787598, "global_step": 91551, "epoch": 544} {"train_loss": -9.758905410766602, "global_step": 91552, "epoch": 544} {"train_loss": -9.689931869506836, "global_step": 91553, "epoch": 544} {"train_loss": -9.63787841796875, "global_step": 91554, "epoch": 544} {"train_loss": -9.653156280517578, "global_step": 91555, "epoch": 544} {"train_loss": -9.556937217712402, "global_step": 91556, "epoch": 544} {"train_loss": -9.294431686401367, "global_step": 91557, "epoch": 544} {"train_loss": -9.519248962402344, "global_step": 91558, "epoch": 544} {"train_loss": -9.40253372419448, "global_step": 91559, "epoch": 544, "val_loss": 203372.359375} {"train_loss": -8.949178695678711, "global_step": 91560, "epoch": 545} {"train_loss": -8.74848747253418, "global_step": 91561, "epoch": 545} {"train_loss": -9.041574478149414, "global_step": 91562, "epoch": 545} {"train_loss": -9.362324714660645, "global_step": 91563, "epoch": 545} {"train_loss": -9.009854316711426, "global_step": 91564, "epoch": 545} {"train_loss": -9.19735336303711, "global_step": 91565, "epoch": 545} {"train_loss": -8.87813663482666, "global_step": 91566, "epoch": 545} {"train_loss": -9.093473434448242, "global_step": 91567, "epoch": 545} {"train_loss": -8.78053092956543, "global_step": 91568, "epoch": 545} {"train_loss": -9.160277366638184, "global_step": 91569, "epoch": 545} {"train_loss": -8.707660675048828, "global_step": 91570, "epoch": 545} {"train_loss": -9.456146240234375, "global_step": 91571, "epoch": 545} {"train_loss": -9.154565811157227, "global_step": 91572, "epoch": 545} {"train_loss": -8.829402923583984, "global_step": 91573, "epoch": 545} {"train_loss": -8.849655151367188, "global_step": 91574, "epoch": 545} {"train_loss": -8.939010620117188, "global_step": 91575, "epoch": 545} {"train_loss": -9.041253089904785, "global_step": 91576, "epoch": 545} {"train_loss": -9.059686660766602, "global_step": 91577, "epoch": 545} {"train_loss": -9.120981216430664, "global_step": 91578, "epoch": 545} {"train_loss": -9.027074813842773, "global_step": 91579, "epoch": 545} {"train_loss": -9.218019485473633, "global_step": 91580, "epoch": 545} {"train_loss": -9.353452682495117, "global_step": 91581, "epoch": 545} {"train_loss": -9.178421974182129, "global_step": 91582, "epoch": 545} {"train_loss": -9.262308120727539, "global_step": 91583, "epoch": 545} {"train_loss": -9.438947677612305, "global_step": 91584, "epoch": 545} {"train_loss": -9.061064720153809, "global_step": 91585, "epoch": 545} {"train_loss": -9.493505477905273, "global_step": 91586, "epoch": 545} {"train_loss": -9.348747253417969, "global_step": 91587, "epoch": 545} {"train_loss": -9.364364624023438, "global_step": 91588, "epoch": 545} {"train_loss": -9.16286849975586, "global_step": 91589, "epoch": 545} {"train_loss": -8.938142776489258, "global_step": 91590, "epoch": 545} {"train_loss": -9.551589012145996, "global_step": 91591, "epoch": 545} {"train_loss": -9.178064346313477, "global_step": 91592, "epoch": 545} {"train_loss": -9.390563011169434, "global_step": 91593, "epoch": 545} {"train_loss": -9.438764572143555, "global_step": 91594, "epoch": 545} {"train_loss": -9.250061988830566, "global_step": 91595, "epoch": 545} {"train_loss": -9.493730545043945, "global_step": 91596, "epoch": 545} {"train_loss": -9.5394287109375, "global_step": 91597, "epoch": 545} {"train_loss": -9.523351669311523, "global_step": 91598, "epoch": 545} {"train_loss": -9.43147087097168, "global_step": 91599, "epoch": 545} {"train_loss": -9.386253356933594, "global_step": 91600, "epoch": 545} {"train_loss": -9.691421508789062, "global_step": 91601, "epoch": 545} {"train_loss": -9.402833938598633, "global_step": 91602, "epoch": 545} {"train_loss": -9.444820404052734, "global_step": 91603, "epoch": 545} {"train_loss": -9.549698829650879, "global_step": 91604, "epoch": 545} {"train_loss": -9.4979248046875, "global_step": 91605, "epoch": 545} {"train_loss": -9.65648078918457, "global_step": 91606, "epoch": 545} {"train_loss": -9.244840621948242, "global_step": 91607, "epoch": 545} {"train_loss": -9.385625839233398, "global_step": 91608, "epoch": 545} {"train_loss": -9.613004684448242, "global_step": 91609, "epoch": 545} {"train_loss": -9.652257919311523, "global_step": 91610, "epoch": 545} {"train_loss": -9.352548599243164, "global_step": 91611, "epoch": 545} {"train_loss": -9.254595756530762, "global_step": 91612, "epoch": 545} {"train_loss": -9.391212463378906, "global_step": 91613, "epoch": 545} {"train_loss": -9.63127326965332, "global_step": 91614, "epoch": 545} {"train_loss": -9.54285717010498, "global_step": 91615, "epoch": 545} {"train_loss": -9.358603477478027, "global_step": 91616, "epoch": 545} {"train_loss": -9.617554664611816, "global_step": 91617, "epoch": 545} {"train_loss": -9.32693099975586, "global_step": 91618, "epoch": 545} {"train_loss": -9.22645092010498, "global_step": 91619, "epoch": 545} {"train_loss": -9.374588012695312, "global_step": 91620, "epoch": 545} {"train_loss": -9.251615524291992, "global_step": 91621, "epoch": 545} {"train_loss": -9.489217758178711, "global_step": 91622, "epoch": 545} {"train_loss": -9.414066314697266, "global_step": 91623, "epoch": 545} {"train_loss": -9.507099151611328, "global_step": 91624, "epoch": 545} {"train_loss": -9.538818359375, "global_step": 91625, "epoch": 545} {"train_loss": -9.527400970458984, "global_step": 91626, "epoch": 545} {"train_loss": -9.599300384521484, "global_step": 91627, "epoch": 545} {"train_loss": -9.440202713012695, "global_step": 91628, "epoch": 545} {"train_loss": -9.60360050201416, "global_step": 91629, "epoch": 545} {"train_loss": -9.470590591430664, "global_step": 91630, "epoch": 545} {"train_loss": -9.627274513244629, "global_step": 91631, "epoch": 545} {"train_loss": -9.530482292175293, "global_step": 91632, "epoch": 545} {"train_loss": -9.642086029052734, "global_step": 91633, "epoch": 545} {"train_loss": -9.438995361328125, "global_step": 91634, "epoch": 545} {"train_loss": -9.609979629516602, "global_step": 91635, "epoch": 545} {"train_loss": -9.736461639404297, "global_step": 91636, "epoch": 545} {"train_loss": -9.359938621520996, "global_step": 91637, "epoch": 545} {"train_loss": -9.645402908325195, "global_step": 91638, "epoch": 545} {"train_loss": -9.534656524658203, "global_step": 91639, "epoch": 545} {"train_loss": -9.57691764831543, "global_step": 91640, "epoch": 545} {"train_loss": -9.19957160949707, "global_step": 91641, "epoch": 545} {"train_loss": -9.348722457885742, "global_step": 91642, "epoch": 545} {"train_loss": -9.485747337341309, "global_step": 91643, "epoch": 545} {"train_loss": -9.205676078796387, "global_step": 91644, "epoch": 545} {"train_loss": -9.645559310913086, "global_step": 91645, "epoch": 545} {"train_loss": -9.497347831726074, "global_step": 91646, "epoch": 545} {"train_loss": -9.605976104736328, "global_step": 91647, "epoch": 545} {"train_loss": -9.761077880859375, "global_step": 91648, "epoch": 545} {"train_loss": -9.699231147766113, "global_step": 91649, "epoch": 545} {"train_loss": -9.49437427520752, "global_step": 91650, "epoch": 545} {"train_loss": -9.657867431640625, "global_step": 91651, "epoch": 545} {"train_loss": -9.441333770751953, "global_step": 91652, "epoch": 545} {"train_loss": -9.562820434570312, "global_step": 91653, "epoch": 545} {"train_loss": -9.566783905029297, "global_step": 91654, "epoch": 545} {"train_loss": -9.676708221435547, "global_step": 91655, "epoch": 545} {"train_loss": -9.667774200439453, "global_step": 91656, "epoch": 545} {"train_loss": -9.939909934997559, "global_step": 91657, "epoch": 545} {"train_loss": -9.649727821350098, "global_step": 91658, "epoch": 545} {"train_loss": -9.578413009643555, "global_step": 91659, "epoch": 545} {"train_loss": -10.038068771362305, "global_step": 91660, "epoch": 545} {"train_loss": -9.561988830566406, "global_step": 91661, "epoch": 545} {"train_loss": -9.651456832885742, "global_step": 91662, "epoch": 545} {"train_loss": -9.860540390014648, "global_step": 91663, "epoch": 545} {"train_loss": -9.932271957397461, "global_step": 91664, "epoch": 545} {"train_loss": -9.695690155029297, "global_step": 91665, "epoch": 545} {"train_loss": -9.418999671936035, "global_step": 91666, "epoch": 545} {"train_loss": -9.770373344421387, "global_step": 91667, "epoch": 545} {"train_loss": -9.622393608093262, "global_step": 91668, "epoch": 545} {"train_loss": -9.558887481689453, "global_step": 91669, "epoch": 545} {"train_loss": -9.364225387573242, "global_step": 91670, "epoch": 545} {"train_loss": -9.568603515625, "global_step": 91671, "epoch": 545} {"train_loss": -9.307619094848633, "global_step": 91672, "epoch": 545} {"train_loss": -9.59426498413086, "global_step": 91673, "epoch": 545} {"train_loss": -9.394210815429688, "global_step": 91674, "epoch": 545} {"train_loss": -9.530364990234375, "global_step": 91675, "epoch": 545} {"train_loss": -9.50344467163086, "global_step": 91676, "epoch": 545} {"train_loss": -9.737546920776367, "global_step": 91677, "epoch": 545} {"train_loss": -9.500494003295898, "global_step": 91678, "epoch": 545} {"train_loss": -9.489873886108398, "global_step": 91679, "epoch": 545} {"train_loss": -9.68885612487793, "global_step": 91680, "epoch": 545} {"train_loss": -9.172797203063965, "global_step": 91681, "epoch": 545} {"train_loss": -9.351387023925781, "global_step": 91682, "epoch": 545} {"train_loss": -9.520280838012695, "global_step": 91683, "epoch": 545} {"train_loss": -9.463634490966797, "global_step": 91684, "epoch": 545} {"train_loss": -9.407337188720703, "global_step": 91685, "epoch": 545} {"train_loss": -9.44751262664795, "global_step": 91686, "epoch": 545} {"train_loss": -9.583375930786133, "global_step": 91687, "epoch": 545} {"train_loss": -9.552690505981445, "global_step": 91688, "epoch": 545} {"train_loss": -9.75346565246582, "global_step": 91689, "epoch": 545} {"train_loss": -9.562685012817383, "global_step": 91690, "epoch": 545} {"train_loss": -9.672311782836914, "global_step": 91691, "epoch": 545} {"train_loss": -9.818840026855469, "global_step": 91692, "epoch": 545} {"train_loss": -9.680313110351562, "global_step": 91693, "epoch": 545} {"train_loss": -9.646703720092773, "global_step": 91694, "epoch": 545} {"train_loss": -9.309745788574219, "global_step": 91695, "epoch": 545} {"train_loss": -9.421062469482422, "global_step": 91696, "epoch": 545} {"train_loss": -9.48835563659668, "global_step": 91697, "epoch": 545} {"train_loss": -9.554622650146484, "global_step": 91698, "epoch": 545} {"train_loss": -9.788505554199219, "global_step": 91699, "epoch": 545} {"train_loss": -9.567487716674805, "global_step": 91700, "epoch": 545} {"train_loss": -9.596169471740723, "global_step": 91701, "epoch": 545} {"train_loss": -9.754874229431152, "global_step": 91702, "epoch": 545} {"train_loss": -9.17108154296875, "global_step": 91703, "epoch": 545} {"train_loss": -9.750029563903809, "global_step": 91704, "epoch": 545} {"train_loss": -9.217958450317383, "global_step": 91705, "epoch": 545} {"train_loss": -9.231428146362305, "global_step": 91706, "epoch": 545} {"train_loss": -9.393905639648438, "global_step": 91707, "epoch": 545} {"train_loss": -9.27938461303711, "global_step": 91708, "epoch": 545} {"train_loss": -9.602904319763184, "global_step": 91709, "epoch": 545} {"train_loss": -9.58763313293457, "global_step": 91710, "epoch": 545} {"train_loss": -9.590272903442383, "global_step": 91711, "epoch": 545} {"train_loss": -9.458791732788086, "global_step": 91712, "epoch": 545} {"train_loss": -9.706620216369629, "global_step": 91713, "epoch": 545} {"train_loss": -9.324867248535156, "global_step": 91714, "epoch": 545} {"train_loss": -9.202878952026367, "global_step": 91715, "epoch": 545} {"train_loss": -9.47054672241211, "global_step": 91716, "epoch": 545} {"train_loss": -9.375787734985352, "global_step": 91717, "epoch": 545} {"train_loss": -9.45855712890625, "global_step": 91718, "epoch": 545} {"train_loss": -9.339143753051758, "global_step": 91719, "epoch": 545} {"train_loss": -9.48372745513916, "global_step": 91720, "epoch": 545} {"train_loss": -9.555599212646484, "global_step": 91721, "epoch": 545} {"train_loss": -9.38665771484375, "global_step": 91722, "epoch": 545} {"train_loss": -9.657184600830078, "global_step": 91723, "epoch": 545} {"train_loss": -9.55677604675293, "global_step": 91724, "epoch": 545} {"train_loss": -9.488422393798828, "global_step": 91725, "epoch": 545} {"train_loss": -9.310416221618652, "global_step": 91726, "epoch": 545} {"train_loss": -9.439107117198763, "global_step": 91727, "epoch": 545, "val_loss": 202835.265625, "train_action_mse_error": 3.0188052654266357} {"train_loss": -9.312487602233887, "global_step": 91728, "epoch": 546} {"train_loss": -9.577692985534668, "global_step": 91729, "epoch": 546} {"train_loss": -9.370979309082031, "global_step": 91730, "epoch": 546} {"train_loss": -9.736384391784668, "global_step": 91731, "epoch": 546} {"train_loss": -9.236096382141113, "global_step": 91732, "epoch": 546} {"train_loss": -9.544578552246094, "global_step": 91733, "epoch": 546} {"train_loss": -9.266899108886719, "global_step": 91734, "epoch": 546} {"train_loss": -9.364500999450684, "global_step": 91735, "epoch": 546} {"train_loss": -9.675863265991211, "global_step": 91736, "epoch": 546} {"train_loss": -9.247852325439453, "global_step": 91737, "epoch": 546} {"train_loss": -9.497028350830078, "global_step": 91738, "epoch": 546} {"train_loss": -9.680492401123047, "global_step": 91739, "epoch": 546} {"train_loss": -9.598267555236816, "global_step": 91740, "epoch": 546} {"train_loss": -9.717447280883789, "global_step": 91741, "epoch": 546} {"train_loss": -9.578338623046875, "global_step": 91742, "epoch": 546} {"train_loss": -9.645471572875977, "global_step": 91743, "epoch": 546} {"train_loss": -9.715518951416016, "global_step": 91744, "epoch": 546} {"train_loss": -9.39059829711914, "global_step": 91745, "epoch": 546} {"train_loss": -9.452144622802734, "global_step": 91746, "epoch": 546} {"train_loss": -9.345060348510742, "global_step": 91747, "epoch": 546} {"train_loss": -9.579715728759766, "global_step": 91748, "epoch": 546} {"train_loss": -9.516416549682617, "global_step": 91749, "epoch": 546} {"train_loss": -9.494170188903809, "global_step": 91750, "epoch": 546} {"train_loss": -9.486187934875488, "global_step": 91751, "epoch": 546} {"train_loss": -9.662506103515625, "global_step": 91752, "epoch": 546} {"train_loss": -9.339897155761719, "global_step": 91753, "epoch": 546} {"train_loss": -9.523202896118164, "global_step": 91754, "epoch": 546} {"train_loss": -9.703654289245605, "global_step": 91755, "epoch": 546} {"train_loss": -9.281492233276367, "global_step": 91756, "epoch": 546} {"train_loss": -9.754172325134277, "global_step": 91757, "epoch": 546} {"train_loss": -9.065896987915039, "global_step": 91758, "epoch": 546} {"train_loss": -9.426389694213867, "global_step": 91759, "epoch": 546} {"train_loss": -9.353318214416504, "global_step": 91760, "epoch": 546} {"train_loss": -9.399801254272461, "global_step": 91761, "epoch": 546} {"train_loss": -9.075995445251465, "global_step": 91762, "epoch": 546} {"train_loss": -9.007097244262695, "global_step": 91763, "epoch": 546} {"train_loss": -9.30935287475586, "global_step": 91764, "epoch": 546} {"train_loss": -9.430610656738281, "global_step": 91765, "epoch": 546} {"train_loss": -8.879222869873047, "global_step": 91766, "epoch": 546} {"train_loss": -9.148846626281738, "global_step": 91767, "epoch": 546} {"train_loss": -9.378379821777344, "global_step": 91768, "epoch": 546} {"train_loss": -9.287376403808594, "global_step": 91769, "epoch": 546} {"train_loss": -9.279308319091797, "global_step": 91770, "epoch": 546} {"train_loss": -9.263008117675781, "global_step": 91771, "epoch": 546} {"train_loss": -9.420835494995117, "global_step": 91772, "epoch": 546} {"train_loss": -9.40916633605957, "global_step": 91773, "epoch": 546} {"train_loss": -9.423961639404297, "global_step": 91774, "epoch": 546} {"train_loss": -9.533194541931152, "global_step": 91775, "epoch": 546} {"train_loss": -9.616613388061523, "global_step": 91776, "epoch": 546} {"train_loss": -9.463033676147461, "global_step": 91777, "epoch": 546} {"train_loss": -9.463789939880371, "global_step": 91778, "epoch": 546} {"train_loss": -9.574074745178223, "global_step": 91779, "epoch": 546} {"train_loss": -9.63975715637207, "global_step": 91780, "epoch": 546} {"train_loss": -9.524633407592773, "global_step": 91781, "epoch": 546} {"train_loss": -9.485508918762207, "global_step": 91782, "epoch": 546} {"train_loss": -9.673221588134766, "global_step": 91783, "epoch": 546} {"train_loss": -9.354781150817871, "global_step": 91784, "epoch": 546} {"train_loss": -9.508633613586426, "global_step": 91785, "epoch": 546} {"train_loss": -9.502874374389648, "global_step": 91786, "epoch": 546} {"train_loss": -9.69245719909668, "global_step": 91787, "epoch": 546} {"train_loss": -9.674564361572266, "global_step": 91788, "epoch": 546} {"train_loss": -9.654319763183594, "global_step": 91789, "epoch": 546} {"train_loss": -9.633573532104492, "global_step": 91790, "epoch": 546} {"train_loss": -9.539822578430176, "global_step": 91791, "epoch": 546} {"train_loss": -9.740787506103516, "global_step": 91792, "epoch": 546} {"train_loss": -9.730653762817383, "global_step": 91793, "epoch": 546} {"train_loss": -9.756772994995117, "global_step": 91794, "epoch": 546} {"train_loss": -9.457554817199707, "global_step": 91795, "epoch": 546} {"train_loss": -9.59805965423584, "global_step": 91796, "epoch": 546} {"train_loss": -9.678723335266113, "global_step": 91797, "epoch": 546} {"train_loss": -9.603717803955078, "global_step": 91798, "epoch": 546} {"train_loss": -9.677352905273438, "global_step": 91799, "epoch": 546} {"train_loss": -9.759986877441406, "global_step": 91800, "epoch": 546} {"train_loss": -9.391940116882324, "global_step": 91801, "epoch": 546} {"train_loss": -9.561614990234375, "global_step": 91802, "epoch": 546} {"train_loss": -9.489492416381836, "global_step": 91803, "epoch": 546} {"train_loss": -9.557794570922852, "global_step": 91804, "epoch": 546} {"train_loss": -9.055020332336426, "global_step": 91805, "epoch": 546} {"train_loss": -9.796340942382812, "global_step": 91806, "epoch": 546} {"train_loss": -9.236672401428223, "global_step": 91807, "epoch": 546} {"train_loss": -9.255606651306152, "global_step": 91808, "epoch": 546} {"train_loss": -9.51345157623291, "global_step": 91809, "epoch": 546} {"train_loss": -9.313800811767578, "global_step": 91810, "epoch": 546} {"train_loss": -9.293500900268555, "global_step": 91811, "epoch": 546} {"train_loss": -9.596658706665039, "global_step": 91812, "epoch": 546} {"train_loss": -9.410382270812988, "global_step": 91813, "epoch": 546} {"train_loss": -9.564912796020508, "global_step": 91814, "epoch": 546} {"train_loss": -9.456097602844238, "global_step": 91815, "epoch": 546} {"train_loss": -8.908391952514648, "global_step": 91816, "epoch": 546} {"train_loss": -9.579863548278809, "global_step": 91817, "epoch": 546} {"train_loss": -8.587705612182617, "global_step": 91818, "epoch": 546} {"train_loss": -9.282242774963379, "global_step": 91819, "epoch": 546} {"train_loss": -9.100797653198242, "global_step": 91820, "epoch": 546} {"train_loss": -9.439637184143066, "global_step": 91821, "epoch": 546} {"train_loss": -9.254156112670898, "global_step": 91822, "epoch": 546} {"train_loss": -9.309656143188477, "global_step": 91823, "epoch": 546} {"train_loss": -9.091562271118164, "global_step": 91824, "epoch": 546} {"train_loss": -9.529102325439453, "global_step": 91825, "epoch": 546} {"train_loss": -8.933053970336914, "global_step": 91826, "epoch": 546} {"train_loss": -9.064088821411133, "global_step": 91827, "epoch": 546} {"train_loss": -9.083484649658203, "global_step": 91828, "epoch": 546} {"train_loss": -9.108112335205078, "global_step": 91829, "epoch": 546} {"train_loss": -8.862516403198242, "global_step": 91830, "epoch": 546} {"train_loss": -9.204296112060547, "global_step": 91831, "epoch": 546} {"train_loss": -9.055718421936035, "global_step": 91832, "epoch": 546} {"train_loss": -9.231401443481445, "global_step": 91833, "epoch": 546} {"train_loss": -9.374448776245117, "global_step": 91834, "epoch": 546} {"train_loss": -9.233314514160156, "global_step": 91835, "epoch": 546} {"train_loss": -9.147172927856445, "global_step": 91836, "epoch": 546} {"train_loss": -9.29560375213623, "global_step": 91837, "epoch": 546} {"train_loss": -9.434687614440918, "global_step": 91838, "epoch": 546} {"train_loss": -9.347274780273438, "global_step": 91839, "epoch": 546} {"train_loss": -9.421097755432129, "global_step": 91840, "epoch": 546} {"train_loss": -9.525552749633789, "global_step": 91841, "epoch": 546} {"train_loss": -9.469409942626953, "global_step": 91842, "epoch": 546} {"train_loss": -9.44739055633545, "global_step": 91843, "epoch": 546} {"train_loss": -9.507943153381348, "global_step": 91844, "epoch": 546} {"train_loss": -9.462148666381836, "global_step": 91845, "epoch": 546} {"train_loss": -9.551498413085938, "global_step": 91846, "epoch": 546} {"train_loss": -9.498865127563477, "global_step": 91847, "epoch": 546} {"train_loss": -9.499139785766602, "global_step": 91848, "epoch": 546} {"train_loss": -9.464271545410156, "global_step": 91849, "epoch": 546} {"train_loss": -9.675020217895508, "global_step": 91850, "epoch": 546} {"train_loss": -9.315431594848633, "global_step": 91851, "epoch": 546} {"train_loss": -9.5661039352417, "global_step": 91852, "epoch": 546} {"train_loss": -9.678979873657227, "global_step": 91853, "epoch": 546} {"train_loss": -9.495586395263672, "global_step": 91854, "epoch": 546} {"train_loss": -9.755597114562988, "global_step": 91855, "epoch": 546} {"train_loss": -9.62083625793457, "global_step": 91856, "epoch": 546} {"train_loss": -9.474040985107422, "global_step": 91857, "epoch": 546} {"train_loss": -9.144094467163086, "global_step": 91858, "epoch": 546} {"train_loss": -9.595653533935547, "global_step": 91859, "epoch": 546} {"train_loss": -9.485821723937988, "global_step": 91860, "epoch": 546} {"train_loss": -9.739618301391602, "global_step": 91861, "epoch": 546} {"train_loss": -9.682910919189453, "global_step": 91862, "epoch": 546} {"train_loss": -9.6549711227417, "global_step": 91863, "epoch": 546} {"train_loss": -9.44863510131836, "global_step": 91864, "epoch": 546} {"train_loss": -9.707444190979004, "global_step": 91865, "epoch": 546} {"train_loss": -9.456951141357422, "global_step": 91866, "epoch": 546} {"train_loss": -9.929231643676758, "global_step": 91867, "epoch": 546} {"train_loss": -9.667434692382812, "global_step": 91868, "epoch": 546} {"train_loss": -9.552240371704102, "global_step": 91869, "epoch": 546} {"train_loss": -9.747934341430664, "global_step": 91870, "epoch": 546} {"train_loss": -9.34189224243164, "global_step": 91871, "epoch": 546} {"train_loss": -9.666138648986816, "global_step": 91872, "epoch": 546} {"train_loss": -9.31010627746582, "global_step": 91873, "epoch": 546} {"train_loss": -9.308540344238281, "global_step": 91874, "epoch": 546} {"train_loss": -9.31680679321289, "global_step": 91875, "epoch": 546} {"train_loss": -9.578690528869629, "global_step": 91876, "epoch": 546} {"train_loss": -9.39742660522461, "global_step": 91877, "epoch": 546} {"train_loss": -9.281222343444824, "global_step": 91878, "epoch": 546} {"train_loss": -9.558126449584961, "global_step": 91879, "epoch": 546} {"train_loss": -9.450582504272461, "global_step": 91880, "epoch": 546} {"train_loss": -9.544220924377441, "global_step": 91881, "epoch": 546} {"train_loss": -9.414308547973633, "global_step": 91882, "epoch": 546} {"train_loss": -9.570348739624023, "global_step": 91883, "epoch": 546} {"train_loss": -9.404336929321289, "global_step": 91884, "epoch": 546} {"train_loss": -9.468812942504883, "global_step": 91885, "epoch": 546} {"train_loss": -9.295297622680664, "global_step": 91886, "epoch": 546} {"train_loss": -9.465012550354004, "global_step": 91887, "epoch": 546} {"train_loss": -9.309188842773438, "global_step": 91888, "epoch": 546} {"train_loss": -9.154401779174805, "global_step": 91889, "epoch": 546} {"train_loss": -9.550058364868164, "global_step": 91890, "epoch": 546} {"train_loss": -9.317615509033203, "global_step": 91891, "epoch": 546} {"train_loss": -9.129571914672852, "global_step": 91892, "epoch": 546} {"train_loss": -9.194690704345703, "global_step": 91893, "epoch": 546} {"train_loss": -9.313825607299805, "global_step": 91894, "epoch": 546} {"train_loss": -9.43587559177762, "global_step": 91895, "epoch": 546, "val_loss": 203170.8125} {"train_loss": -9.161724090576172, "global_step": 91896, "epoch": 547} {"train_loss": -9.491832733154297, "global_step": 91897, "epoch": 547} {"train_loss": -9.207903861999512, "global_step": 91898, "epoch": 547} {"train_loss": -9.387336730957031, "global_step": 91899, "epoch": 547} {"train_loss": -9.360804557800293, "global_step": 91900, "epoch": 547} {"train_loss": -9.275385856628418, "global_step": 91901, "epoch": 547} {"train_loss": -9.316226959228516, "global_step": 91902, "epoch": 547} {"train_loss": -9.538106918334961, "global_step": 91903, "epoch": 547} {"train_loss": -9.124561309814453, "global_step": 91904, "epoch": 547} {"train_loss": -9.363286972045898, "global_step": 91905, "epoch": 547} {"train_loss": -9.415647506713867, "global_step": 91906, "epoch": 547} {"train_loss": -9.302473068237305, "global_step": 91907, "epoch": 547} {"train_loss": -9.190452575683594, "global_step": 91908, "epoch": 547} {"train_loss": -9.325311660766602, "global_step": 91909, "epoch": 547} {"train_loss": -9.455129623413086, "global_step": 91910, "epoch": 547} {"train_loss": -9.386703491210938, "global_step": 91911, "epoch": 547} {"train_loss": -9.45513916015625, "global_step": 91912, "epoch": 547} {"train_loss": -9.426721572875977, "global_step": 91913, "epoch": 547} {"train_loss": -9.486981391906738, "global_step": 91914, "epoch": 547} {"train_loss": -9.41025447845459, "global_step": 91915, "epoch": 547} {"train_loss": -9.457877159118652, "global_step": 91916, "epoch": 547} {"train_loss": -9.515948295593262, "global_step": 91917, "epoch": 547} {"train_loss": -9.523670196533203, "global_step": 91918, "epoch": 547} {"train_loss": -9.324445724487305, "global_step": 91919, "epoch": 547} {"train_loss": -9.724494934082031, "global_step": 91920, "epoch": 547} {"train_loss": -9.143409729003906, "global_step": 91921, "epoch": 547} {"train_loss": -9.45538330078125, "global_step": 91922, "epoch": 547} {"train_loss": -9.562238693237305, "global_step": 91923, "epoch": 547} {"train_loss": -9.557403564453125, "global_step": 91924, "epoch": 547} {"train_loss": -9.45233154296875, "global_step": 91925, "epoch": 547} {"train_loss": -9.53078842163086, "global_step": 91926, "epoch": 547} {"train_loss": -9.304492950439453, "global_step": 91927, "epoch": 547} {"train_loss": -9.342005729675293, "global_step": 91928, "epoch": 547} {"train_loss": -9.209610939025879, "global_step": 91929, "epoch": 547} {"train_loss": -9.147682189941406, "global_step": 91930, "epoch": 547} {"train_loss": -9.618794441223145, "global_step": 91931, "epoch": 547} {"train_loss": -9.496464729309082, "global_step": 91932, "epoch": 547} {"train_loss": -9.345476150512695, "global_step": 91933, "epoch": 547} {"train_loss": -9.479277610778809, "global_step": 91934, "epoch": 547} {"train_loss": -9.466523170471191, "global_step": 91935, "epoch": 547} {"train_loss": -9.575369834899902, "global_step": 91936, "epoch": 547} {"train_loss": -9.515883445739746, "global_step": 91937, "epoch": 547} {"train_loss": -9.454263687133789, "global_step": 91938, "epoch": 547} {"train_loss": -9.92376708984375, "global_step": 91939, "epoch": 547} {"train_loss": -9.047614097595215, "global_step": 91940, "epoch": 547} {"train_loss": -9.581267356872559, "global_step": 91941, "epoch": 547} {"train_loss": -9.533902168273926, "global_step": 91942, "epoch": 547} {"train_loss": -9.401485443115234, "global_step": 91943, "epoch": 547} {"train_loss": -9.644749641418457, "global_step": 91944, "epoch": 547} {"train_loss": -9.145339965820312, "global_step": 91945, "epoch": 547} {"train_loss": -9.434122085571289, "global_step": 91946, "epoch": 547} {"train_loss": -9.420263290405273, "global_step": 91947, "epoch": 547} {"train_loss": -9.529316902160645, "global_step": 91948, "epoch": 547} {"train_loss": -9.66964340209961, "global_step": 91949, "epoch": 547} {"train_loss": -9.646835327148438, "global_step": 91950, "epoch": 547} {"train_loss": -9.373922348022461, "global_step": 91951, "epoch": 547} {"train_loss": -9.669248580932617, "global_step": 91952, "epoch": 547} {"train_loss": -9.641400337219238, "global_step": 91953, "epoch": 547} {"train_loss": -9.599621772766113, "global_step": 91954, "epoch": 547} {"train_loss": -9.654277801513672, "global_step": 91955, "epoch": 547} {"train_loss": -9.627279281616211, "global_step": 91956, "epoch": 547} {"train_loss": -9.52166748046875, "global_step": 91957, "epoch": 547} {"train_loss": -9.695663452148438, "global_step": 91958, "epoch": 547} {"train_loss": -9.617639541625977, "global_step": 91959, "epoch": 547} {"train_loss": -9.73483657836914, "global_step": 91960, "epoch": 547} {"train_loss": -9.68682861328125, "global_step": 91961, "epoch": 547} {"train_loss": -9.668481826782227, "global_step": 91962, "epoch": 547} {"train_loss": -9.490964889526367, "global_step": 91963, "epoch": 547} {"train_loss": -9.5967378616333, "global_step": 91964, "epoch": 547} {"train_loss": -9.49893856048584, "global_step": 91965, "epoch": 547} {"train_loss": -9.621603012084961, "global_step": 91966, "epoch": 547} {"train_loss": -9.574162483215332, "global_step": 91967, "epoch": 547} {"train_loss": -9.681746482849121, "global_step": 91968, "epoch": 547} {"train_loss": -9.758255004882812, "global_step": 91969, "epoch": 547} {"train_loss": -9.440984725952148, "global_step": 91970, "epoch": 547} {"train_loss": -9.620854377746582, "global_step": 91971, "epoch": 547} {"train_loss": -9.511829376220703, "global_step": 91972, "epoch": 547} {"train_loss": -9.910566329956055, "global_step": 91973, "epoch": 547} {"train_loss": -9.356348037719727, "global_step": 91974, "epoch": 547} {"train_loss": -9.389289855957031, "global_step": 91975, "epoch": 547} {"train_loss": -9.720620155334473, "global_step": 91976, "epoch": 547} {"train_loss": -9.339238166809082, "global_step": 91977, "epoch": 547} {"train_loss": -9.475048065185547, "global_step": 91978, "epoch": 547} {"train_loss": -9.695816993713379, "global_step": 91979, "epoch": 547} {"train_loss": -9.234756469726562, "global_step": 91980, "epoch": 547} {"train_loss": -9.886926651000977, "global_step": 91981, "epoch": 547} {"train_loss": -9.17570686340332, "global_step": 91982, "epoch": 547} {"train_loss": -9.036996841430664, "global_step": 91983, "epoch": 547} {"train_loss": -9.757970809936523, "global_step": 91984, "epoch": 547} {"train_loss": -9.815171241760254, "global_step": 91985, "epoch": 547} {"train_loss": -9.540548324584961, "global_step": 91986, "epoch": 547} {"train_loss": -9.64863395690918, "global_step": 91987, "epoch": 547} {"train_loss": -9.823814392089844, "global_step": 91988, "epoch": 547} {"train_loss": -9.578909873962402, "global_step": 91989, "epoch": 547} {"train_loss": -9.679143905639648, "global_step": 91990, "epoch": 547} {"train_loss": -9.603097915649414, "global_step": 91991, "epoch": 547} {"train_loss": -9.745216369628906, "global_step": 91992, "epoch": 547} {"train_loss": -9.723868370056152, "global_step": 91993, "epoch": 547} {"train_loss": -9.33049201965332, "global_step": 91994, "epoch": 547} {"train_loss": -9.584134101867676, "global_step": 91995, "epoch": 547} {"train_loss": -9.615250587463379, "global_step": 91996, "epoch": 547} {"train_loss": -9.487961769104004, "global_step": 91997, "epoch": 547} {"train_loss": -9.562660217285156, "global_step": 91998, "epoch": 547} {"train_loss": -8.813268661499023, "global_step": 91999, "epoch": 547} {"train_loss": -9.335530281066895, "global_step": 92000, "epoch": 547} {"train_loss": -9.173691749572754, "global_step": 92001, "epoch": 547} {"train_loss": -8.632089614868164, "global_step": 92002, "epoch": 547} {"train_loss": -8.573445320129395, "global_step": 92003, "epoch": 547} {"train_loss": -9.009021759033203, "global_step": 92004, "epoch": 547} {"train_loss": -8.749380111694336, "global_step": 92005, "epoch": 547} {"train_loss": -8.858931541442871, "global_step": 92006, "epoch": 547} {"train_loss": -8.801163673400879, "global_step": 92007, "epoch": 547} {"train_loss": -8.698951721191406, "global_step": 92008, "epoch": 547} {"train_loss": -8.94791030883789, "global_step": 92009, "epoch": 547} {"train_loss": -8.86001205444336, "global_step": 92010, "epoch": 547} {"train_loss": -9.054045677185059, "global_step": 92011, "epoch": 547} {"train_loss": -8.906684875488281, "global_step": 92012, "epoch": 547} {"train_loss": -8.940635681152344, "global_step": 92013, "epoch": 547} {"train_loss": -9.327116012573242, "global_step": 92014, "epoch": 547} {"train_loss": -9.188423156738281, "global_step": 92015, "epoch": 547} {"train_loss": -9.199687957763672, "global_step": 92016, "epoch": 547} {"train_loss": -9.100281715393066, "global_step": 92017, "epoch": 547} {"train_loss": -9.312623977661133, "global_step": 92018, "epoch": 547} {"train_loss": -9.309932708740234, "global_step": 92019, "epoch": 547} {"train_loss": -9.266712188720703, "global_step": 92020, "epoch": 547} {"train_loss": -9.394694328308105, "global_step": 92021, "epoch": 547} {"train_loss": -9.208723068237305, "global_step": 92022, "epoch": 547} {"train_loss": -9.478273391723633, "global_step": 92023, "epoch": 547} {"train_loss": -9.471846580505371, "global_step": 92024, "epoch": 547} {"train_loss": -9.575241088867188, "global_step": 92025, "epoch": 547} {"train_loss": -9.427587509155273, "global_step": 92026, "epoch": 547} {"train_loss": -9.759664535522461, "global_step": 92027, "epoch": 547} {"train_loss": -9.580495834350586, "global_step": 92028, "epoch": 547} {"train_loss": -9.400162696838379, "global_step": 92029, "epoch": 547} {"train_loss": -9.481904983520508, "global_step": 92030, "epoch": 547} {"train_loss": -9.35097885131836, "global_step": 92031, "epoch": 547} {"train_loss": -9.539936065673828, "global_step": 92032, "epoch": 547} {"train_loss": -9.678990364074707, "global_step": 92033, "epoch": 547} {"train_loss": -9.44424057006836, "global_step": 92034, "epoch": 547} {"train_loss": -9.54646110534668, "global_step": 92035, "epoch": 547} {"train_loss": -9.516298294067383, "global_step": 92036, "epoch": 547} {"train_loss": -9.39559555053711, "global_step": 92037, "epoch": 547} {"train_loss": -9.403646469116211, "global_step": 92038, "epoch": 547} {"train_loss": -9.429830551147461, "global_step": 92039, "epoch": 547} {"train_loss": -9.394062042236328, "global_step": 92040, "epoch": 547} {"train_loss": -9.202831268310547, "global_step": 92041, "epoch": 547} {"train_loss": -9.56512451171875, "global_step": 92042, "epoch": 547} {"train_loss": -9.581058502197266, "global_step": 92043, "epoch": 547} {"train_loss": -9.581718444824219, "global_step": 92044, "epoch": 547} {"train_loss": -9.654031753540039, "global_step": 92045, "epoch": 547} {"train_loss": -9.61923885345459, "global_step": 92046, "epoch": 547} {"train_loss": -9.408201217651367, "global_step": 92047, "epoch": 547} {"train_loss": -9.717761993408203, "global_step": 92048, "epoch": 547} {"train_loss": -9.639968872070312, "global_step": 92049, "epoch": 547} {"train_loss": -9.373887062072754, "global_step": 92050, "epoch": 547} {"train_loss": -9.804349899291992, "global_step": 92051, "epoch": 547} {"train_loss": -9.424175262451172, "global_step": 92052, "epoch": 547} {"train_loss": -9.567682266235352, "global_step": 92053, "epoch": 547} {"train_loss": -9.555225372314453, "global_step": 92054, "epoch": 547} {"train_loss": -9.545133590698242, "global_step": 92055, "epoch": 547} {"train_loss": -9.65780258178711, "global_step": 92056, "epoch": 547} {"train_loss": -9.477075576782227, "global_step": 92057, "epoch": 547} {"train_loss": -9.675885200500488, "global_step": 92058, "epoch": 547} {"train_loss": -9.587882995605469, "global_step": 92059, "epoch": 547} {"train_loss": -9.429876327514648, "global_step": 92060, "epoch": 547} {"train_loss": -9.36878776550293, "global_step": 92061, "epoch": 547} {"train_loss": -9.563421249389648, "global_step": 92062, "epoch": 547} {"train_loss": -9.435773735954648, "global_step": 92063, "epoch": 547, "val_loss": 204812.890625} {"train_loss": -9.342338562011719, "global_step": 92064, "epoch": 548} {"train_loss": -9.549896240234375, "global_step": 92065, "epoch": 548} {"train_loss": -9.366043090820312, "global_step": 92066, "epoch": 548} {"train_loss": -9.467950820922852, "global_step": 92067, "epoch": 548} {"train_loss": -8.850770950317383, "global_step": 92068, "epoch": 548} {"train_loss": -9.38033390045166, "global_step": 92069, "epoch": 548} {"train_loss": -9.049962997436523, "global_step": 92070, "epoch": 548} {"train_loss": -9.30404281616211, "global_step": 92071, "epoch": 548} {"train_loss": -9.099910736083984, "global_step": 92072, "epoch": 548} {"train_loss": -9.108122825622559, "global_step": 92073, "epoch": 548} {"train_loss": -9.440710067749023, "global_step": 92074, "epoch": 548} {"train_loss": -9.208677291870117, "global_step": 92075, "epoch": 548} {"train_loss": -9.307250022888184, "global_step": 92076, "epoch": 548} {"train_loss": -9.305261611938477, "global_step": 92077, "epoch": 548} {"train_loss": -9.24896240234375, "global_step": 92078, "epoch": 548} {"train_loss": -9.256696701049805, "global_step": 92079, "epoch": 548} {"train_loss": -8.974705696105957, "global_step": 92080, "epoch": 548} {"train_loss": -9.232632637023926, "global_step": 92081, "epoch": 548} {"train_loss": -8.991081237792969, "global_step": 92082, "epoch": 548} {"train_loss": -9.263675689697266, "global_step": 92083, "epoch": 548} {"train_loss": -9.276796340942383, "global_step": 92084, "epoch": 548} {"train_loss": -9.150603294372559, "global_step": 92085, "epoch": 548} {"train_loss": -9.304746627807617, "global_step": 92086, "epoch": 548} {"train_loss": -9.156181335449219, "global_step": 92087, "epoch": 548} {"train_loss": -9.439300537109375, "global_step": 92088, "epoch": 548} {"train_loss": -9.60671329498291, "global_step": 92089, "epoch": 548} {"train_loss": -9.5197172164917, "global_step": 92090, "epoch": 548} {"train_loss": -9.382123947143555, "global_step": 92091, "epoch": 548} {"train_loss": -9.64652156829834, "global_step": 92092, "epoch": 548} {"train_loss": -9.122865676879883, "global_step": 92093, "epoch": 548} {"train_loss": -9.454962730407715, "global_step": 92094, "epoch": 548} {"train_loss": -9.65213394165039, "global_step": 92095, "epoch": 548} {"train_loss": -9.417289733886719, "global_step": 92096, "epoch": 548} {"train_loss": -9.515396118164062, "global_step": 92097, "epoch": 548} {"train_loss": -9.655927658081055, "global_step": 92098, "epoch": 548} {"train_loss": -9.226312637329102, "global_step": 92099, "epoch": 548} {"train_loss": -9.312746047973633, "global_step": 92100, "epoch": 548} {"train_loss": -9.406722068786621, "global_step": 92101, "epoch": 548} {"train_loss": -9.494704246520996, "global_step": 92102, "epoch": 548} {"train_loss": -9.607383728027344, "global_step": 92103, "epoch": 548} {"train_loss": -9.388519287109375, "global_step": 92104, "epoch": 548} {"train_loss": -9.59566879272461, "global_step": 92105, "epoch": 548} {"train_loss": -9.311501502990723, "global_step": 92106, "epoch": 548} {"train_loss": -9.615242958068848, "global_step": 92107, "epoch": 548} {"train_loss": -9.426353454589844, "global_step": 92108, "epoch": 548} {"train_loss": -9.292800903320312, "global_step": 92109, "epoch": 548} {"train_loss": -9.684233665466309, "global_step": 92110, "epoch": 548} {"train_loss": -9.355146408081055, "global_step": 92111, "epoch": 548} {"train_loss": -9.576604843139648, "global_step": 92112, "epoch": 548} {"train_loss": -9.569318771362305, "global_step": 92113, "epoch": 548} {"train_loss": -9.301630020141602, "global_step": 92114, "epoch": 548} {"train_loss": -9.644386291503906, "global_step": 92115, "epoch": 548} {"train_loss": -9.648979187011719, "global_step": 92116, "epoch": 548} {"train_loss": -9.640142440795898, "global_step": 92117, "epoch": 548} {"train_loss": -9.646121978759766, "global_step": 92118, "epoch": 548} {"train_loss": -9.759110450744629, "global_step": 92119, "epoch": 548} {"train_loss": -9.527682304382324, "global_step": 92120, "epoch": 548} {"train_loss": -9.740350723266602, "global_step": 92121, "epoch": 548} {"train_loss": -9.593894958496094, "global_step": 92122, "epoch": 548} {"train_loss": -9.896035194396973, "global_step": 92123, "epoch": 548} {"train_loss": -9.050034523010254, "global_step": 92124, "epoch": 548} {"train_loss": -9.690118789672852, "global_step": 92125, "epoch": 548} {"train_loss": -9.409398078918457, "global_step": 92126, "epoch": 548} {"train_loss": -9.088289260864258, "global_step": 92127, "epoch": 548} {"train_loss": -9.030728340148926, "global_step": 92128, "epoch": 548} {"train_loss": -9.356710433959961, "global_step": 92129, "epoch": 548} {"train_loss": -8.833730697631836, "global_step": 92130, "epoch": 548} {"train_loss": -9.417998313903809, "global_step": 92131, "epoch": 548} {"train_loss": -9.29802131652832, "global_step": 92132, "epoch": 548} {"train_loss": -9.282733917236328, "global_step": 92133, "epoch": 548} {"train_loss": -9.664741516113281, "global_step": 92134, "epoch": 548} {"train_loss": -9.549779891967773, "global_step": 92135, "epoch": 548} {"train_loss": -9.34200668334961, "global_step": 92136, "epoch": 548} {"train_loss": -9.529465675354004, "global_step": 92137, "epoch": 548} {"train_loss": -9.303262710571289, "global_step": 92138, "epoch": 548} {"train_loss": -9.418445587158203, "global_step": 92139, "epoch": 548} {"train_loss": -9.40483283996582, "global_step": 92140, "epoch": 548} {"train_loss": -9.477819442749023, "global_step": 92141, "epoch": 548} {"train_loss": -9.586211204528809, "global_step": 92142, "epoch": 548} {"train_loss": -9.33217716217041, "global_step": 92143, "epoch": 548} {"train_loss": -9.332554817199707, "global_step": 92144, "epoch": 548} {"train_loss": -9.029546737670898, "global_step": 92145, "epoch": 548} {"train_loss": -9.633135795593262, "global_step": 92146, "epoch": 548} {"train_loss": -9.333263397216797, "global_step": 92147, "epoch": 548} {"train_loss": -9.598560333251953, "global_step": 92148, "epoch": 548} {"train_loss": -9.536848068237305, "global_step": 92149, "epoch": 548} {"train_loss": -9.331932067871094, "global_step": 92150, "epoch": 548} {"train_loss": -9.466093063354492, "global_step": 92151, "epoch": 548} {"train_loss": -9.626331329345703, "global_step": 92152, "epoch": 548} {"train_loss": -9.459033966064453, "global_step": 92153, "epoch": 548} {"train_loss": -9.5523681640625, "global_step": 92154, "epoch": 548} {"train_loss": -9.257006645202637, "global_step": 92155, "epoch": 548} {"train_loss": -9.621318817138672, "global_step": 92156, "epoch": 548} {"train_loss": -9.296545028686523, "global_step": 92157, "epoch": 548} {"train_loss": -9.252912521362305, "global_step": 92158, "epoch": 548} {"train_loss": -9.36083984375, "global_step": 92159, "epoch": 548} {"train_loss": -9.56406021118164, "global_step": 92160, "epoch": 548} {"train_loss": -9.33902359008789, "global_step": 92161, "epoch": 548} {"train_loss": -9.704659461975098, "global_step": 92162, "epoch": 548} {"train_loss": -9.393863677978516, "global_step": 92163, "epoch": 548} {"train_loss": -9.81625747680664, "global_step": 92164, "epoch": 548} {"train_loss": -9.4198637008667, "global_step": 92165, "epoch": 548} {"train_loss": -9.584199905395508, "global_step": 92166, "epoch": 548} {"train_loss": -9.662849426269531, "global_step": 92167, "epoch": 548} {"train_loss": -9.661543846130371, "global_step": 92168, "epoch": 548} {"train_loss": -9.668940544128418, "global_step": 92169, "epoch": 548} {"train_loss": -9.824661254882812, "global_step": 92170, "epoch": 548} {"train_loss": -9.714570999145508, "global_step": 92171, "epoch": 548} {"train_loss": -9.462398529052734, "global_step": 92172, "epoch": 548} {"train_loss": -9.500701904296875, "global_step": 92173, "epoch": 548} {"train_loss": -9.52983283996582, "global_step": 92174, "epoch": 548} {"train_loss": -9.674924850463867, "global_step": 92175, "epoch": 548} {"train_loss": -9.523612976074219, "global_step": 92176, "epoch": 548} {"train_loss": -9.400874137878418, "global_step": 92177, "epoch": 548} {"train_loss": -9.482135772705078, "global_step": 92178, "epoch": 548} {"train_loss": -9.435325622558594, "global_step": 92179, "epoch": 548} {"train_loss": -9.350242614746094, "global_step": 92180, "epoch": 548} {"train_loss": -9.498863220214844, "global_step": 92181, "epoch": 548} {"train_loss": -9.049665451049805, "global_step": 92182, "epoch": 548} {"train_loss": -9.09040641784668, "global_step": 92183, "epoch": 548} {"train_loss": -8.962532997131348, "global_step": 92184, "epoch": 548} {"train_loss": -9.021629333496094, "global_step": 92185, "epoch": 548} {"train_loss": -8.917686462402344, "global_step": 92186, "epoch": 548} {"train_loss": -9.321700096130371, "global_step": 92187, "epoch": 548} {"train_loss": -9.5957612991333, "global_step": 92188, "epoch": 548} {"train_loss": -9.324217796325684, "global_step": 92189, "epoch": 548} {"train_loss": -8.944385528564453, "global_step": 92190, "epoch": 548} {"train_loss": -9.421468734741211, "global_step": 92191, "epoch": 548} {"train_loss": -9.378608703613281, "global_step": 92192, "epoch": 548} {"train_loss": -9.26934814453125, "global_step": 92193, "epoch": 548} {"train_loss": -9.25820541381836, "global_step": 92194, "epoch": 548} {"train_loss": -9.669105529785156, "global_step": 92195, "epoch": 548} {"train_loss": -9.602136611938477, "global_step": 92196, "epoch": 548} {"train_loss": -9.442192077636719, "global_step": 92197, "epoch": 548} {"train_loss": -9.534137725830078, "global_step": 92198, "epoch": 548} {"train_loss": -9.461874961853027, "global_step": 92199, "epoch": 548} {"train_loss": -9.523401260375977, "global_step": 92200, "epoch": 548} {"train_loss": -9.506896018981934, "global_step": 92201, "epoch": 548} {"train_loss": -9.612205505371094, "global_step": 92202, "epoch": 548} {"train_loss": -9.626293182373047, "global_step": 92203, "epoch": 548} {"train_loss": -9.517677307128906, "global_step": 92204, "epoch": 548} {"train_loss": -9.828136444091797, "global_step": 92205, "epoch": 548} {"train_loss": -9.642000198364258, "global_step": 92206, "epoch": 548} {"train_loss": -9.606951713562012, "global_step": 92207, "epoch": 548} {"train_loss": -9.644617080688477, "global_step": 92208, "epoch": 548} {"train_loss": -9.657333374023438, "global_step": 92209, "epoch": 548} {"train_loss": -9.586387634277344, "global_step": 92210, "epoch": 548} {"train_loss": -9.634956359863281, "global_step": 92211, "epoch": 548} {"train_loss": -9.561328887939453, "global_step": 92212, "epoch": 548} {"train_loss": -9.499120712280273, "global_step": 92213, "epoch": 548} {"train_loss": -9.531305313110352, "global_step": 92214, "epoch": 548} {"train_loss": -9.542407989501953, "global_step": 92215, "epoch": 548} {"train_loss": -9.663307189941406, "global_step": 92216, "epoch": 548} {"train_loss": -9.663226127624512, "global_step": 92217, "epoch": 548} {"train_loss": -9.73576545715332, "global_step": 92218, "epoch": 548} {"train_loss": -9.746289253234863, "global_step": 92219, "epoch": 548} {"train_loss": -9.658862113952637, "global_step": 92220, "epoch": 548} {"train_loss": -9.585014343261719, "global_step": 92221, "epoch": 548} {"train_loss": -9.649802207946777, "global_step": 92222, "epoch": 548} {"train_loss": -9.695545196533203, "global_step": 92223, "epoch": 548} {"train_loss": -9.238019943237305, "global_step": 92224, "epoch": 548} {"train_loss": -9.31581974029541, "global_step": 92225, "epoch": 548} {"train_loss": -9.370681762695312, "global_step": 92226, "epoch": 548} {"train_loss": -9.443925857543945, "global_step": 92227, "epoch": 548} {"train_loss": -9.431037902832031, "global_step": 92228, "epoch": 548} {"train_loss": -9.058706283569336, "global_step": 92229, "epoch": 548} {"train_loss": -9.20180892944336, "global_step": 92230, "epoch": 548} {"train_loss": -9.43189365523202, "global_step": 92231, "epoch": 548, "val_loss": 201684.640625} {"train_loss": -9.316851615905762, "global_step": 92232, "epoch": 549} {"train_loss": -8.78602123260498, "global_step": 92233, "epoch": 549} {"train_loss": -9.480363845825195, "global_step": 92234, "epoch": 549} {"train_loss": -8.944560050964355, "global_step": 92235, "epoch": 549} {"train_loss": -9.232223510742188, "global_step": 92236, "epoch": 549} {"train_loss": -9.392268180847168, "global_step": 92237, "epoch": 549} {"train_loss": -9.155633926391602, "global_step": 92238, "epoch": 549} {"train_loss": -9.18260383605957, "global_step": 92239, "epoch": 549} {"train_loss": -9.010099411010742, "global_step": 92240, "epoch": 549} {"train_loss": -9.230353355407715, "global_step": 92241, "epoch": 549} {"train_loss": -9.207052230834961, "global_step": 92242, "epoch": 549} {"train_loss": -9.498400688171387, "global_step": 92243, "epoch": 549} {"train_loss": -9.104257583618164, "global_step": 92244, "epoch": 549} {"train_loss": -9.299898147583008, "global_step": 92245, "epoch": 549} {"train_loss": -9.36492919921875, "global_step": 92246, "epoch": 549} {"train_loss": -9.107786178588867, "global_step": 92247, "epoch": 549} {"train_loss": -9.331934928894043, "global_step": 92248, "epoch": 549} {"train_loss": -9.125033378601074, "global_step": 92249, "epoch": 549} {"train_loss": -9.35135555267334, "global_step": 92250, "epoch": 549} {"train_loss": -9.281111717224121, "global_step": 92251, "epoch": 549} {"train_loss": -9.434440612792969, "global_step": 92252, "epoch": 549} {"train_loss": -9.419475555419922, "global_step": 92253, "epoch": 549} {"train_loss": -9.420154571533203, "global_step": 92254, "epoch": 549} {"train_loss": -9.437167167663574, "global_step": 92255, "epoch": 549} {"train_loss": -9.160256385803223, "global_step": 92256, "epoch": 549} {"train_loss": -9.567499160766602, "global_step": 92257, "epoch": 549} {"train_loss": -9.333791732788086, "global_step": 92258, "epoch": 549} {"train_loss": -9.123663902282715, "global_step": 92259, "epoch": 549} {"train_loss": -9.544974327087402, "global_step": 92260, "epoch": 549} {"train_loss": -9.194683074951172, "global_step": 92261, "epoch": 549} {"train_loss": -9.473726272583008, "global_step": 92262, "epoch": 549} {"train_loss": -9.218584060668945, "global_step": 92263, "epoch": 549} {"train_loss": -9.349722862243652, "global_step": 92264, "epoch": 549} {"train_loss": -9.143186569213867, "global_step": 92265, "epoch": 549} {"train_loss": -9.419492721557617, "global_step": 92266, "epoch": 549} {"train_loss": -9.495462417602539, "global_step": 92267, "epoch": 549} {"train_loss": -9.340328216552734, "global_step": 92268, "epoch": 549} {"train_loss": -9.38131332397461, "global_step": 92269, "epoch": 549} {"train_loss": -9.359436988830566, "global_step": 92270, "epoch": 549} {"train_loss": -9.588141441345215, "global_step": 92271, "epoch": 549} {"train_loss": -9.322123527526855, "global_step": 92272, "epoch": 549} {"train_loss": -9.522300720214844, "global_step": 92273, "epoch": 549} {"train_loss": -9.486988067626953, "global_step": 92274, "epoch": 549} {"train_loss": -9.363893508911133, "global_step": 92275, "epoch": 549} {"train_loss": -9.118125915527344, "global_step": 92276, "epoch": 549} {"train_loss": -9.393648147583008, "global_step": 92277, "epoch": 549} {"train_loss": -9.502986907958984, "global_step": 92278, "epoch": 549} {"train_loss": -9.657901763916016, "global_step": 92279, "epoch": 549} {"train_loss": -9.564678192138672, "global_step": 92280, "epoch": 549} {"train_loss": -9.729869842529297, "global_step": 92281, "epoch": 549} {"train_loss": -9.660465240478516, "global_step": 92282, "epoch": 549} {"train_loss": -9.423531532287598, "global_step": 92283, "epoch": 549} {"train_loss": -9.546077728271484, "global_step": 92284, "epoch": 549} {"train_loss": -9.669843673706055, "global_step": 92285, "epoch": 549} {"train_loss": -9.76611614227295, "global_step": 92286, "epoch": 549} {"train_loss": -9.511629104614258, "global_step": 92287, "epoch": 549} {"train_loss": -9.531072616577148, "global_step": 92288, "epoch": 549} {"train_loss": -9.495613098144531, "global_step": 92289, "epoch": 549} {"train_loss": -9.55778694152832, "global_step": 92290, "epoch": 549} {"train_loss": -9.491589546203613, "global_step": 92291, "epoch": 549} {"train_loss": -9.608139991760254, "global_step": 92292, "epoch": 549} {"train_loss": -9.52365493774414, "global_step": 92293, "epoch": 549} {"train_loss": -9.23000717163086, "global_step": 92294, "epoch": 549} {"train_loss": -9.362913131713867, "global_step": 92295, "epoch": 549} {"train_loss": -9.39208984375, "global_step": 92296, "epoch": 549} {"train_loss": -9.066232681274414, "global_step": 92297, "epoch": 549} {"train_loss": -8.958053588867188, "global_step": 92298, "epoch": 549} {"train_loss": -9.227241516113281, "global_step": 92299, "epoch": 549} {"train_loss": -8.808595657348633, "global_step": 92300, "epoch": 549} {"train_loss": -9.046554565429688, "global_step": 92301, "epoch": 549} {"train_loss": -9.219501495361328, "global_step": 92302, "epoch": 549} {"train_loss": -9.247587203979492, "global_step": 92303, "epoch": 549} {"train_loss": -9.083395004272461, "global_step": 92304, "epoch": 549} {"train_loss": -9.036395072937012, "global_step": 92305, "epoch": 549} {"train_loss": -9.01608657836914, "global_step": 92306, "epoch": 549} {"train_loss": -9.233667373657227, "global_step": 92307, "epoch": 549} {"train_loss": -9.152142524719238, "global_step": 92308, "epoch": 549} {"train_loss": -9.171767234802246, "global_step": 92309, "epoch": 549} {"train_loss": -9.158223152160645, "global_step": 92310, "epoch": 549} {"train_loss": -9.290268898010254, "global_step": 92311, "epoch": 549} {"train_loss": -8.996206283569336, "global_step": 92312, "epoch": 549} {"train_loss": -9.369897842407227, "global_step": 92313, "epoch": 549} {"train_loss": -8.87975788116455, "global_step": 92314, "epoch": 549} {"train_loss": -9.357782363891602, "global_step": 92315, "epoch": 549} {"train_loss": -9.143682479858398, "global_step": 92316, "epoch": 549} {"train_loss": -9.189872741699219, "global_step": 92317, "epoch": 549} {"train_loss": -9.313579559326172, "global_step": 92318, "epoch": 549} {"train_loss": -9.380908966064453, "global_step": 92319, "epoch": 549} {"train_loss": -9.403304100036621, "global_step": 92320, "epoch": 549} {"train_loss": -9.366271018981934, "global_step": 92321, "epoch": 549} {"train_loss": -9.435943603515625, "global_step": 92322, "epoch": 549} {"train_loss": -9.45926570892334, "global_step": 92323, "epoch": 549} {"train_loss": -9.488822937011719, "global_step": 92324, "epoch": 549} {"train_loss": -9.670486450195312, "global_step": 92325, "epoch": 549} {"train_loss": -9.633527755737305, "global_step": 92326, "epoch": 549} {"train_loss": -9.530720710754395, "global_step": 92327, "epoch": 549} {"train_loss": -9.698373794555664, "global_step": 92328, "epoch": 549} {"train_loss": -9.549222946166992, "global_step": 92329, "epoch": 549} {"train_loss": -9.518295288085938, "global_step": 92330, "epoch": 549} {"train_loss": -9.524784088134766, "global_step": 92331, "epoch": 549} {"train_loss": -9.638604164123535, "global_step": 92332, "epoch": 549} {"train_loss": -9.505611419677734, "global_step": 92333, "epoch": 549} {"train_loss": -9.311710357666016, "global_step": 92334, "epoch": 549} {"train_loss": -9.56958293914795, "global_step": 92335, "epoch": 549} {"train_loss": -9.654909133911133, "global_step": 92336, "epoch": 549} {"train_loss": -9.696746826171875, "global_step": 92337, "epoch": 549} {"train_loss": -9.807720184326172, "global_step": 92338, "epoch": 549} {"train_loss": -9.413093566894531, "global_step": 92339, "epoch": 549} {"train_loss": -9.593013763427734, "global_step": 92340, "epoch": 549} {"train_loss": -9.665231704711914, "global_step": 92341, "epoch": 549} {"train_loss": -9.8649320602417, "global_step": 92342, "epoch": 549} {"train_loss": -9.695011138916016, "global_step": 92343, "epoch": 549} {"train_loss": -9.720205307006836, "global_step": 92344, "epoch": 549} {"train_loss": -9.920511245727539, "global_step": 92345, "epoch": 549} {"train_loss": -9.584196090698242, "global_step": 92346, "epoch": 549} {"train_loss": -9.706766128540039, "global_step": 92347, "epoch": 549} {"train_loss": -9.891380310058594, "global_step": 92348, "epoch": 549} {"train_loss": -9.567593574523926, "global_step": 92349, "epoch": 549} {"train_loss": -9.72045612335205, "global_step": 92350, "epoch": 549} {"train_loss": -9.609994888305664, "global_step": 92351, "epoch": 549} {"train_loss": -9.677573204040527, "global_step": 92352, "epoch": 549} {"train_loss": -9.59914779663086, "global_step": 92353, "epoch": 549} {"train_loss": -9.5485200881958, "global_step": 92354, "epoch": 549} {"train_loss": -9.697013854980469, "global_step": 92355, "epoch": 549} {"train_loss": -9.632345199584961, "global_step": 92356, "epoch": 549} {"train_loss": -9.436613082885742, "global_step": 92357, "epoch": 549} {"train_loss": -9.543556213378906, "global_step": 92358, "epoch": 549} {"train_loss": -9.429463386535645, "global_step": 92359, "epoch": 549} {"train_loss": -9.276992797851562, "global_step": 92360, "epoch": 549} {"train_loss": -9.715686798095703, "global_step": 92361, "epoch": 549} {"train_loss": -9.430273056030273, "global_step": 92362, "epoch": 549} {"train_loss": -9.309922218322754, "global_step": 92363, "epoch": 549} {"train_loss": -9.385271072387695, "global_step": 92364, "epoch": 549} {"train_loss": -9.44302749633789, "global_step": 92365, "epoch": 549} {"train_loss": -9.533323287963867, "global_step": 92366, "epoch": 549} {"train_loss": -9.320390701293945, "global_step": 92367, "epoch": 549} {"train_loss": -9.70548152923584, "global_step": 92368, "epoch": 549} {"train_loss": -9.534562110900879, "global_step": 92369, "epoch": 549} {"train_loss": -9.613726615905762, "global_step": 92370, "epoch": 549} {"train_loss": -9.317462921142578, "global_step": 92371, "epoch": 549} {"train_loss": -9.651674270629883, "global_step": 92372, "epoch": 549} {"train_loss": -9.530061721801758, "global_step": 92373, "epoch": 549} {"train_loss": -9.42009449005127, "global_step": 92374, "epoch": 549} {"train_loss": -9.491698265075684, "global_step": 92375, "epoch": 549} {"train_loss": -9.301678657531738, "global_step": 92376, "epoch": 549} {"train_loss": -9.082391738891602, "global_step": 92377, "epoch": 549} {"train_loss": -9.465692520141602, "global_step": 92378, "epoch": 549} {"train_loss": -9.003679275512695, "global_step": 92379, "epoch": 549} {"train_loss": -9.399613380432129, "global_step": 92380, "epoch": 549} {"train_loss": -9.176491737365723, "global_step": 92381, "epoch": 549} {"train_loss": -9.263269424438477, "global_step": 92382, "epoch": 549} {"train_loss": -9.382574081420898, "global_step": 92383, "epoch": 549} {"train_loss": -9.39393424987793, "global_step": 92384, "epoch": 549} {"train_loss": -9.357715606689453, "global_step": 92385, "epoch": 549} {"train_loss": -9.348581314086914, "global_step": 92386, "epoch": 549} {"train_loss": -8.932268142700195, "global_step": 92387, "epoch": 549} {"train_loss": -9.43099308013916, "global_step": 92388, "epoch": 549} {"train_loss": -9.395849227905273, "global_step": 92389, "epoch": 549} {"train_loss": -9.229839324951172, "global_step": 92390, "epoch": 549} {"train_loss": -9.435524940490723, "global_step": 92391, "epoch": 549} {"train_loss": -9.266353607177734, "global_step": 92392, "epoch": 549} {"train_loss": -9.32162094116211, "global_step": 92393, "epoch": 549} {"train_loss": -9.450254440307617, "global_step": 92394, "epoch": 549} {"train_loss": -9.613602638244629, "global_step": 92395, "epoch": 549} {"train_loss": -9.407686233520508, "global_step": 92396, "epoch": 549} {"train_loss": -9.519815444946289, "global_step": 92397, "epoch": 549} {"train_loss": -9.461006164550781, "global_step": 92398, "epoch": 549} {"train_loss": -9.400178154309591, "global_step": 92399, "epoch": 549, "val_loss": 203580.734375} {"train_loss": -9.1048002243042, "global_step": 92400, "epoch": 550} {"train_loss": -9.486886978149414, "global_step": 92401, "epoch": 550} {"train_loss": -9.29210376739502, "global_step": 92402, "epoch": 550} {"train_loss": -9.27369213104248, "global_step": 92403, "epoch": 550} {"train_loss": -9.698372840881348, "global_step": 92404, "epoch": 550} {"train_loss": -9.495973587036133, "global_step": 92405, "epoch": 550} {"train_loss": -9.516519546508789, "global_step": 92406, "epoch": 550} {"train_loss": -9.4652099609375, "global_step": 92407, "epoch": 550} {"train_loss": -9.5377836227417, "global_step": 92408, "epoch": 550} {"train_loss": -9.596975326538086, "global_step": 92409, "epoch": 550} {"train_loss": -9.539909362792969, "global_step": 92410, "epoch": 550} {"train_loss": -9.368630409240723, "global_step": 92411, "epoch": 550} {"train_loss": -9.657342910766602, "global_step": 92412, "epoch": 550} {"train_loss": -9.276098251342773, "global_step": 92413, "epoch": 550} {"train_loss": -9.656335830688477, "global_step": 92414, "epoch": 550} {"train_loss": -9.387727737426758, "global_step": 92415, "epoch": 550} {"train_loss": -9.534977912902832, "global_step": 92416, "epoch": 550} {"train_loss": -9.635527610778809, "global_step": 92417, "epoch": 550} {"train_loss": -9.36129093170166, "global_step": 92418, "epoch": 550} {"train_loss": -9.609312057495117, "global_step": 92419, "epoch": 550} {"train_loss": -9.469549179077148, "global_step": 92420, "epoch": 550} {"train_loss": -9.215274810791016, "global_step": 92421, "epoch": 550} {"train_loss": -9.497942924499512, "global_step": 92422, "epoch": 550} {"train_loss": -9.401995658874512, "global_step": 92423, "epoch": 550} {"train_loss": -9.467864036560059, "global_step": 92424, "epoch": 550} {"train_loss": -9.55636978149414, "global_step": 92425, "epoch": 550} {"train_loss": -9.525200843811035, "global_step": 92426, "epoch": 550} {"train_loss": -9.583317756652832, "global_step": 92427, "epoch": 550} {"train_loss": -9.657329559326172, "global_step": 92428, "epoch": 550} {"train_loss": -9.781379699707031, "global_step": 92429, "epoch": 550} {"train_loss": -9.758800506591797, "global_step": 92430, "epoch": 550} {"train_loss": -9.679290771484375, "global_step": 92431, "epoch": 550} {"train_loss": -9.518343925476074, "global_step": 92432, "epoch": 550} {"train_loss": -9.665544509887695, "global_step": 92433, "epoch": 550} {"train_loss": -9.585722923278809, "global_step": 92434, "epoch": 550} {"train_loss": -9.621906280517578, "global_step": 92435, "epoch": 550} {"train_loss": -9.776660919189453, "global_step": 92436, "epoch": 550} {"train_loss": -9.41258430480957, "global_step": 92437, "epoch": 550} {"train_loss": -9.291618347167969, "global_step": 92438, "epoch": 550} {"train_loss": -9.39539909362793, "global_step": 92439, "epoch": 550} {"train_loss": -9.390190124511719, "global_step": 92440, "epoch": 550} {"train_loss": -9.643423080444336, "global_step": 92441, "epoch": 550} {"train_loss": -9.635946273803711, "global_step": 92442, "epoch": 550} {"train_loss": -9.340781211853027, "global_step": 92443, "epoch": 550} {"train_loss": -9.38817310333252, "global_step": 92444, "epoch": 550} {"train_loss": -9.749690055847168, "global_step": 92445, "epoch": 550} {"train_loss": -9.50622844696045, "global_step": 92446, "epoch": 550} {"train_loss": -9.423954010009766, "global_step": 92447, "epoch": 550} {"train_loss": -9.183850288391113, "global_step": 92448, "epoch": 550} {"train_loss": -9.5012845993042, "global_step": 92449, "epoch": 550} {"train_loss": -9.539192199707031, "global_step": 92450, "epoch": 550} {"train_loss": -9.396198272705078, "global_step": 92451, "epoch": 550} {"train_loss": -9.415887832641602, "global_step": 92452, "epoch": 550} {"train_loss": -9.725401878356934, "global_step": 92453, "epoch": 550} {"train_loss": -9.609465599060059, "global_step": 92454, "epoch": 550} {"train_loss": -9.494134902954102, "global_step": 92455, "epoch": 550} {"train_loss": -9.204167366027832, "global_step": 92456, "epoch": 550} {"train_loss": -9.528493881225586, "global_step": 92457, "epoch": 550} {"train_loss": -9.405753135681152, "global_step": 92458, "epoch": 550} {"train_loss": -9.382930755615234, "global_step": 92459, "epoch": 550} {"train_loss": -9.67974853515625, "global_step": 92460, "epoch": 550} {"train_loss": -9.037494659423828, "global_step": 92461, "epoch": 550} {"train_loss": -9.49962329864502, "global_step": 92462, "epoch": 550} {"train_loss": -9.324259757995605, "global_step": 92463, "epoch": 550} {"train_loss": -9.302587509155273, "global_step": 92464, "epoch": 550} {"train_loss": -9.151297569274902, "global_step": 92465, "epoch": 550} {"train_loss": -9.467366218566895, "global_step": 92466, "epoch": 550} {"train_loss": -9.365453720092773, "global_step": 92467, "epoch": 550} {"train_loss": -9.385467529296875, "global_step": 92468, "epoch": 550} {"train_loss": -9.436698913574219, "global_step": 92469, "epoch": 550} {"train_loss": -9.663045883178711, "global_step": 92470, "epoch": 550} {"train_loss": -9.293523788452148, "global_step": 92471, "epoch": 550} {"train_loss": -9.608699798583984, "global_step": 92472, "epoch": 550} {"train_loss": -9.39851188659668, "global_step": 92473, "epoch": 550} {"train_loss": -9.529465675354004, "global_step": 92474, "epoch": 550} {"train_loss": -9.509505271911621, "global_step": 92475, "epoch": 550} {"train_loss": -9.522438049316406, "global_step": 92476, "epoch": 550} {"train_loss": -9.433021545410156, "global_step": 92477, "epoch": 550} {"train_loss": -9.510986328125, "global_step": 92478, "epoch": 550} {"train_loss": -9.354249000549316, "global_step": 92479, "epoch": 550} {"train_loss": -9.462791442871094, "global_step": 92480, "epoch": 550} {"train_loss": -9.348973274230957, "global_step": 92481, "epoch": 550} {"train_loss": -9.620550155639648, "global_step": 92482, "epoch": 550} {"train_loss": -9.521503448486328, "global_step": 92483, "epoch": 550} {"train_loss": -9.551082611083984, "global_step": 92484, "epoch": 550} {"train_loss": -9.446012496948242, "global_step": 92485, "epoch": 550} {"train_loss": -9.74849796295166, "global_step": 92486, "epoch": 550} {"train_loss": -9.780122756958008, "global_step": 92487, "epoch": 550} {"train_loss": -9.714977264404297, "global_step": 92488, "epoch": 550} {"train_loss": -9.756269454956055, "global_step": 92489, "epoch": 550} {"train_loss": -9.636476516723633, "global_step": 92490, "epoch": 550} {"train_loss": -9.806851387023926, "global_step": 92491, "epoch": 550} {"train_loss": -9.545029640197754, "global_step": 92492, "epoch": 550} {"train_loss": -9.641536712646484, "global_step": 92493, "epoch": 550} {"train_loss": -9.69129467010498, "global_step": 92494, "epoch": 550} {"train_loss": -9.692073822021484, "global_step": 92495, "epoch": 550} {"train_loss": -9.565526962280273, "global_step": 92496, "epoch": 550} {"train_loss": -9.878406524658203, "global_step": 92497, "epoch": 550} {"train_loss": -9.585759162902832, "global_step": 92498, "epoch": 550} {"train_loss": -9.710193634033203, "global_step": 92499, "epoch": 550} {"train_loss": -9.542922973632812, "global_step": 92500, "epoch": 550} {"train_loss": -9.897578239440918, "global_step": 92501, "epoch": 550} {"train_loss": -9.756200790405273, "global_step": 92502, "epoch": 550} {"train_loss": -9.833002090454102, "global_step": 92503, "epoch": 550} {"train_loss": -9.375320434570312, "global_step": 92504, "epoch": 550} {"train_loss": -9.590638160705566, "global_step": 92505, "epoch": 550} {"train_loss": -9.744064331054688, "global_step": 92506, "epoch": 550} {"train_loss": -9.652664184570312, "global_step": 92507, "epoch": 550} {"train_loss": -9.4169921875, "global_step": 92508, "epoch": 550} {"train_loss": -9.708723068237305, "global_step": 92509, "epoch": 550} {"train_loss": -9.455095291137695, "global_step": 92510, "epoch": 550} {"train_loss": -9.864175796508789, "global_step": 92511, "epoch": 550} {"train_loss": -9.841425895690918, "global_step": 92512, "epoch": 550} {"train_loss": -9.462484359741211, "global_step": 92513, "epoch": 550} {"train_loss": -9.671197891235352, "global_step": 92514, "epoch": 550} {"train_loss": -9.460762977600098, "global_step": 92515, "epoch": 550} {"train_loss": -9.708708763122559, "global_step": 92516, "epoch": 550} {"train_loss": -9.64329719543457, "global_step": 92517, "epoch": 550} {"train_loss": -9.358322143554688, "global_step": 92518, "epoch": 550} {"train_loss": -9.484879493713379, "global_step": 92519, "epoch": 550} {"train_loss": -9.272558212280273, "global_step": 92520, "epoch": 550} {"train_loss": -9.473580360412598, "global_step": 92521, "epoch": 550} {"train_loss": -9.102149963378906, "global_step": 92522, "epoch": 550} {"train_loss": -9.35060977935791, "global_step": 92523, "epoch": 550} {"train_loss": -9.556143760681152, "global_step": 92524, "epoch": 550} {"train_loss": -9.512235641479492, "global_step": 92525, "epoch": 550} {"train_loss": -9.336932182312012, "global_step": 92526, "epoch": 550} {"train_loss": -9.69414234161377, "global_step": 92527, "epoch": 550} {"train_loss": -9.442327499389648, "global_step": 92528, "epoch": 550} {"train_loss": -9.705648422241211, "global_step": 92529, "epoch": 550} {"train_loss": -9.374750137329102, "global_step": 92530, "epoch": 550} {"train_loss": -9.16905403137207, "global_step": 92531, "epoch": 550} {"train_loss": -9.590514183044434, "global_step": 92532, "epoch": 550} {"train_loss": -9.142223358154297, "global_step": 92533, "epoch": 550} {"train_loss": -9.195953369140625, "global_step": 92534, "epoch": 550} {"train_loss": -8.974969863891602, "global_step": 92535, "epoch": 550} {"train_loss": -9.07632827758789, "global_step": 92536, "epoch": 550} {"train_loss": -8.988500595092773, "global_step": 92537, "epoch": 550} {"train_loss": -9.14164924621582, "global_step": 92538, "epoch": 550} {"train_loss": -8.939014434814453, "global_step": 92539, "epoch": 550} {"train_loss": -9.281342506408691, "global_step": 92540, "epoch": 550} {"train_loss": -9.308120727539062, "global_step": 92541, "epoch": 550} {"train_loss": -9.399812698364258, "global_step": 92542, "epoch": 550} {"train_loss": -9.510730743408203, "global_step": 92543, "epoch": 550} {"train_loss": -9.168901443481445, "global_step": 92544, "epoch": 550} {"train_loss": -9.143543243408203, "global_step": 92545, "epoch": 550} {"train_loss": -9.265398979187012, "global_step": 92546, "epoch": 550} {"train_loss": -9.314529418945312, "global_step": 92547, "epoch": 550} {"train_loss": -9.343828201293945, "global_step": 92548, "epoch": 550} {"train_loss": -9.299605369567871, "global_step": 92549, "epoch": 550} {"train_loss": -9.609888076782227, "global_step": 92550, "epoch": 550} {"train_loss": -9.256837844848633, "global_step": 92551, "epoch": 550} {"train_loss": -9.431818962097168, "global_step": 92552, "epoch": 550} {"train_loss": -9.399618148803711, "global_step": 92553, "epoch": 550} {"train_loss": -9.707403182983398, "global_step": 92554, "epoch": 550} {"train_loss": -9.623390197753906, "global_step": 92555, "epoch": 550} {"train_loss": -9.663639068603516, "global_step": 92556, "epoch": 550} {"train_loss": -9.475896835327148, "global_step": 92557, "epoch": 550} {"train_loss": -9.568723678588867, "global_step": 92558, "epoch": 550} {"train_loss": -9.496661186218262, "global_step": 92559, "epoch": 550} {"train_loss": -9.420933723449707, "global_step": 92560, "epoch": 550} {"train_loss": -9.390481948852539, "global_step": 92561, "epoch": 550} {"train_loss": -9.655414581298828, "global_step": 92562, "epoch": 550} {"train_loss": -9.057558059692383, "global_step": 92563, "epoch": 550} {"train_loss": -9.487306594848633, "global_step": 92564, "epoch": 550} {"train_loss": -9.438421249389648, "global_step": 92565, "epoch": 550} {"train_loss": -9.505846977233887, "global_step": 92566, "epoch": 550} {"train_loss": -9.481520130520774, "global_step": 92567, "epoch": 550, "train/sim_max_reward_0": 0.5174501379187403, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.01595400000718132, "train/sim_max_reward_3": 0.1836673990436183, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 0.24783674189122737, "test/sim_max_reward_4400001": 0.33634685985778984, "test/sim_max_reward_4400002": 0.963480883282799, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.4040720192794284, "test/sim_max_reward_4400005": 0.9668355370451202, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.9713285043329407, "test/sim_max_reward_4400008": 0.5542572995375145, "test/sim_max_reward_4400009": 0.4443247466936078, "test/sim_max_reward_4400010": 0.9998796545628408, "test/sim_max_reward_4400011": 0.9589433525576659, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.5435880445132136, "test/sim_max_reward_4400015": 0.9862806211563652, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 0.2062019177555356, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.663922997322572, "test/sim_max_reward_4400022": 0.972538175199556, "test/sim_max_reward_4400023": 0.9510281530991576, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.6223638264542628, "test/sim_max_reward_4400026": 0.9865368333944938, "test/sim_max_reward_4400027": 1.0, "test/sim_max_reward_4400028": 0.6858752458805584, "test/sim_max_reward_4400029": 1.0, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.7123312240549838, "test/sim_max_reward_4400034": 0.4815087972843059, "test/sim_max_reward_4400035": 0.9674277773905009, "test/sim_max_reward_4400036": 0.3763540650093049, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.9791078172703198, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.43096458462286386, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.99610073561027, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.3844992752997752, "test/sim_max_reward_4400046": 0.29395639601664625, "test/sim_max_reward_4400047": 0.9841437851150455, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6195119228282566, "test/mean_score": 0.6296758107068944, "val_loss": 203566.21875, "train_action_mse_error": 3.1949691772460938} {"train_loss": -9.483561515808105, "global_step": 92568, "epoch": 551} {"train_loss": -9.278589248657227, "global_step": 92569, "epoch": 551} {"train_loss": -9.495954513549805, "global_step": 92570, "epoch": 551} {"train_loss": -9.393508911132812, "global_step": 92571, "epoch": 551} {"train_loss": -9.495437622070312, "global_step": 92572, "epoch": 551} {"train_loss": -9.64498519897461, "global_step": 92573, "epoch": 551} {"train_loss": -9.487732887268066, "global_step": 92574, "epoch": 551} {"train_loss": -9.486604690551758, "global_step": 92575, "epoch": 551} {"train_loss": -9.338717460632324, "global_step": 92576, "epoch": 551} {"train_loss": -9.493579864501953, "global_step": 92577, "epoch": 551} {"train_loss": -9.12377643585205, "global_step": 92578, "epoch": 551} {"train_loss": -9.266119003295898, "global_step": 92579, "epoch": 551} {"train_loss": -9.696760177612305, "global_step": 92580, "epoch": 551} {"train_loss": -9.445751190185547, "global_step": 92581, "epoch": 551} {"train_loss": -9.512411117553711, "global_step": 92582, "epoch": 551} {"train_loss": -9.709113121032715, "global_step": 92583, "epoch": 551} {"train_loss": -9.566108703613281, "global_step": 92584, "epoch": 551} {"train_loss": -9.479793548583984, "global_step": 92585, "epoch": 551} {"train_loss": -9.373658180236816, "global_step": 92586, "epoch": 551} {"train_loss": -9.324211120605469, "global_step": 92587, "epoch": 551} {"train_loss": -9.518411636352539, "global_step": 92588, "epoch": 551} {"train_loss": -9.568255424499512, "global_step": 92589, "epoch": 551} {"train_loss": -9.719329833984375, "global_step": 92590, "epoch": 551} {"train_loss": -9.669305801391602, "global_step": 92591, "epoch": 551} {"train_loss": -9.522666931152344, "global_step": 92592, "epoch": 551} {"train_loss": -9.567560195922852, "global_step": 92593, "epoch": 551} {"train_loss": -9.653509140014648, "global_step": 92594, "epoch": 551} {"train_loss": -9.37968635559082, "global_step": 92595, "epoch": 551} {"train_loss": -9.298440933227539, "global_step": 92596, "epoch": 551} {"train_loss": -9.460650444030762, "global_step": 92597, "epoch": 551} {"train_loss": -8.949539184570312, "global_step": 92598, "epoch": 551} {"train_loss": -9.682061195373535, "global_step": 92599, "epoch": 551} {"train_loss": -9.167594909667969, "global_step": 92600, "epoch": 551} {"train_loss": -9.60012149810791, "global_step": 92601, "epoch": 551} {"train_loss": -8.937776565551758, "global_step": 92602, "epoch": 551} {"train_loss": -9.226173400878906, "global_step": 92603, "epoch": 551} {"train_loss": -9.07098388671875, "global_step": 92604, "epoch": 551} {"train_loss": -9.299763679504395, "global_step": 92605, "epoch": 551} {"train_loss": -9.200541496276855, "global_step": 92606, "epoch": 551} {"train_loss": -9.087837219238281, "global_step": 92607, "epoch": 551} {"train_loss": -9.338945388793945, "global_step": 92608, "epoch": 551} {"train_loss": -9.164081573486328, "global_step": 92609, "epoch": 551} {"train_loss": -9.53684139251709, "global_step": 92610, "epoch": 551} {"train_loss": -9.341888427734375, "global_step": 92611, "epoch": 551} {"train_loss": -9.364870071411133, "global_step": 92612, "epoch": 551} {"train_loss": -9.102310180664062, "global_step": 92613, "epoch": 551} {"train_loss": -9.657919883728027, "global_step": 92614, "epoch": 551} {"train_loss": -9.478460311889648, "global_step": 92615, "epoch": 551} {"train_loss": -9.491250991821289, "global_step": 92616, "epoch": 551} {"train_loss": -9.320338249206543, "global_step": 92617, "epoch": 551} {"train_loss": -9.353446960449219, "global_step": 92618, "epoch": 551} {"train_loss": -9.348001480102539, "global_step": 92619, "epoch": 551} {"train_loss": -8.94089412689209, "global_step": 92620, "epoch": 551} {"train_loss": -9.29261589050293, "global_step": 92621, "epoch": 551} {"train_loss": -9.451574325561523, "global_step": 92622, "epoch": 551} {"train_loss": -9.05745792388916, "global_step": 92623, "epoch": 551} {"train_loss": -9.57080364227295, "global_step": 92624, "epoch": 551} {"train_loss": -9.404542922973633, "global_step": 92625, "epoch": 551} {"train_loss": -9.439451217651367, "global_step": 92626, "epoch": 551} {"train_loss": -9.414929389953613, "global_step": 92627, "epoch": 551} {"train_loss": -9.663301467895508, "global_step": 92628, "epoch": 551} {"train_loss": -9.46989631652832, "global_step": 92629, "epoch": 551} {"train_loss": -9.552566528320312, "global_step": 92630, "epoch": 551} {"train_loss": -9.391971588134766, "global_step": 92631, "epoch": 551} {"train_loss": -9.781209945678711, "global_step": 92632, "epoch": 551} {"train_loss": -9.5481595993042, "global_step": 92633, "epoch": 551} {"train_loss": -9.738310813903809, "global_step": 92634, "epoch": 551} {"train_loss": -9.278791427612305, "global_step": 92635, "epoch": 551} {"train_loss": -9.567682266235352, "global_step": 92636, "epoch": 551} {"train_loss": -9.601652145385742, "global_step": 92637, "epoch": 551} {"train_loss": -9.618430137634277, "global_step": 92638, "epoch": 551} {"train_loss": -9.468017578125, "global_step": 92639, "epoch": 551} {"train_loss": -9.512924194335938, "global_step": 92640, "epoch": 551} {"train_loss": -9.466873168945312, "global_step": 92641, "epoch": 551} {"train_loss": -9.469036102294922, "global_step": 92642, "epoch": 551} {"train_loss": -9.436426162719727, "global_step": 92643, "epoch": 551} {"train_loss": -9.637163162231445, "global_step": 92644, "epoch": 551} {"train_loss": -9.364126205444336, "global_step": 92645, "epoch": 551} {"train_loss": -9.67148494720459, "global_step": 92646, "epoch": 551} {"train_loss": -9.367530822753906, "global_step": 92647, "epoch": 551} {"train_loss": -9.315120697021484, "global_step": 92648, "epoch": 551} {"train_loss": -9.393665313720703, "global_step": 92649, "epoch": 551} {"train_loss": -9.471824645996094, "global_step": 92650, "epoch": 551} {"train_loss": -9.418368339538574, "global_step": 92651, "epoch": 551} {"train_loss": -9.699369430541992, "global_step": 92652, "epoch": 551} {"train_loss": -9.378299713134766, "global_step": 92653, "epoch": 551} {"train_loss": -9.527267456054688, "global_step": 92654, "epoch": 551} {"train_loss": -9.541385650634766, "global_step": 92655, "epoch": 551} {"train_loss": -9.30010986328125, "global_step": 92656, "epoch": 551} {"train_loss": -9.907691955566406, "global_step": 92657, "epoch": 551} {"train_loss": -9.410164833068848, "global_step": 92658, "epoch": 551} {"train_loss": -9.666749954223633, "global_step": 92659, "epoch": 551} {"train_loss": -9.552123069763184, "global_step": 92660, "epoch": 551} {"train_loss": -9.639787673950195, "global_step": 92661, "epoch": 551} {"train_loss": -9.33746337890625, "global_step": 92662, "epoch": 551} {"train_loss": -9.795103073120117, "global_step": 92663, "epoch": 551} {"train_loss": -9.368374824523926, "global_step": 92664, "epoch": 551} {"train_loss": -9.58224105834961, "global_step": 92665, "epoch": 551} {"train_loss": -9.275615692138672, "global_step": 92666, "epoch": 551} {"train_loss": -9.571967124938965, "global_step": 92667, "epoch": 551} {"train_loss": -9.44549560546875, "global_step": 92668, "epoch": 551} {"train_loss": -9.319526672363281, "global_step": 92669, "epoch": 551} {"train_loss": -9.712902069091797, "global_step": 92670, "epoch": 551} {"train_loss": -9.040136337280273, "global_step": 92671, "epoch": 551} {"train_loss": -9.18189811706543, "global_step": 92672, "epoch": 551} {"train_loss": -9.619096755981445, "global_step": 92673, "epoch": 551} {"train_loss": -9.505416870117188, "global_step": 92674, "epoch": 551} {"train_loss": -9.496488571166992, "global_step": 92675, "epoch": 551} {"train_loss": -9.669873237609863, "global_step": 92676, "epoch": 551} {"train_loss": -9.425962448120117, "global_step": 92677, "epoch": 551} {"train_loss": -9.839454650878906, "global_step": 92678, "epoch": 551} {"train_loss": -9.543153762817383, "global_step": 92679, "epoch": 551} {"train_loss": -9.69906234741211, "global_step": 92680, "epoch": 551} {"train_loss": -9.629555702209473, "global_step": 92681, "epoch": 551} {"train_loss": -9.352651596069336, "global_step": 92682, "epoch": 551} {"train_loss": -9.697818756103516, "global_step": 92683, "epoch": 551} {"train_loss": -9.736903190612793, "global_step": 92684, "epoch": 551} {"train_loss": -9.634106636047363, "global_step": 92685, "epoch": 551} {"train_loss": -9.661527633666992, "global_step": 92686, "epoch": 551} {"train_loss": -9.664749145507812, "global_step": 92687, "epoch": 551} {"train_loss": -9.528833389282227, "global_step": 92688, "epoch": 551} {"train_loss": -9.623577117919922, "global_step": 92689, "epoch": 551} {"train_loss": -9.615620613098145, "global_step": 92690, "epoch": 551} {"train_loss": -9.470998764038086, "global_step": 92691, "epoch": 551} {"train_loss": -9.659370422363281, "global_step": 92692, "epoch": 551} {"train_loss": -9.657560348510742, "global_step": 92693, "epoch": 551} {"train_loss": -9.5556640625, "global_step": 92694, "epoch": 551} {"train_loss": -9.6768217086792, "global_step": 92695, "epoch": 551} {"train_loss": -9.536161422729492, "global_step": 92696, "epoch": 551} {"train_loss": -9.824579238891602, "global_step": 92697, "epoch": 551} {"train_loss": -9.636308670043945, "global_step": 92698, "epoch": 551} {"train_loss": -9.678627014160156, "global_step": 92699, "epoch": 551} {"train_loss": -9.671147346496582, "global_step": 92700, "epoch": 551} {"train_loss": -9.580376625061035, "global_step": 92701, "epoch": 551} {"train_loss": -9.59581470489502, "global_step": 92702, "epoch": 551} {"train_loss": -9.398199081420898, "global_step": 92703, "epoch": 551} {"train_loss": -9.460866928100586, "global_step": 92704, "epoch": 551} {"train_loss": -9.503633499145508, "global_step": 92705, "epoch": 551} {"train_loss": -9.25982666015625, "global_step": 92706, "epoch": 551} {"train_loss": -9.230960845947266, "global_step": 92707, "epoch": 551} {"train_loss": -9.315744400024414, "global_step": 92708, "epoch": 551} {"train_loss": -9.47555923461914, "global_step": 92709, "epoch": 551} {"train_loss": -9.569650650024414, "global_step": 92710, "epoch": 551} {"train_loss": -9.47634506225586, "global_step": 92711, "epoch": 551} {"train_loss": -9.412189483642578, "global_step": 92712, "epoch": 551} {"train_loss": -9.486604690551758, "global_step": 92713, "epoch": 551} {"train_loss": -9.351316452026367, "global_step": 92714, "epoch": 551} {"train_loss": -9.289892196655273, "global_step": 92715, "epoch": 551} {"train_loss": -9.56678581237793, "global_step": 92716, "epoch": 551} {"train_loss": -9.606216430664062, "global_step": 92717, "epoch": 551} {"train_loss": -9.270362854003906, "global_step": 92718, "epoch": 551} {"train_loss": -9.454164505004883, "global_step": 92719, "epoch": 551} {"train_loss": -9.616525650024414, "global_step": 92720, "epoch": 551} {"train_loss": -9.218789100646973, "global_step": 92721, "epoch": 551} {"train_loss": -9.219742774963379, "global_step": 92722, "epoch": 551} {"train_loss": -9.468860626220703, "global_step": 92723, "epoch": 551} {"train_loss": -9.31768798828125, "global_step": 92724, "epoch": 551} {"train_loss": -9.092020988464355, "global_step": 92725, "epoch": 551} {"train_loss": -9.67713451385498, "global_step": 92726, "epoch": 551} {"train_loss": -9.379737854003906, "global_step": 92727, "epoch": 551} {"train_loss": -9.319672584533691, "global_step": 92728, "epoch": 551} {"train_loss": -9.477899551391602, "global_step": 92729, "epoch": 551} {"train_loss": -9.264739036560059, "global_step": 92730, "epoch": 551} {"train_loss": -9.277795791625977, "global_step": 92731, "epoch": 551} {"train_loss": -9.408978462219238, "global_step": 92732, "epoch": 551} {"train_loss": -9.45042896270752, "global_step": 92733, "epoch": 551} {"train_loss": -9.345163345336914, "global_step": 92734, "epoch": 551} {"train_loss": -9.463707946595692, "global_step": 92735, "epoch": 551, "val_loss": 204501.390625} {"train_loss": -9.531083106994629, "global_step": 92736, "epoch": 552} {"train_loss": -9.550045013427734, "global_step": 92737, "epoch": 552} {"train_loss": -9.463953018188477, "global_step": 92738, "epoch": 552} {"train_loss": -9.600768089294434, "global_step": 92739, "epoch": 552} {"train_loss": -9.413373947143555, "global_step": 92740, "epoch": 552} {"train_loss": -9.41867733001709, "global_step": 92741, "epoch": 552} {"train_loss": -9.516996383666992, "global_step": 92742, "epoch": 552} {"train_loss": -9.592131614685059, "global_step": 92743, "epoch": 552} {"train_loss": -9.418630599975586, "global_step": 92744, "epoch": 552} {"train_loss": -9.631877899169922, "global_step": 92745, "epoch": 552} {"train_loss": -9.56725788116455, "global_step": 92746, "epoch": 552} {"train_loss": -9.679779052734375, "global_step": 92747, "epoch": 552} {"train_loss": -9.712971687316895, "global_step": 92748, "epoch": 552} {"train_loss": -9.30556869506836, "global_step": 92749, "epoch": 552} {"train_loss": -9.559694290161133, "global_step": 92750, "epoch": 552} {"train_loss": -9.426382064819336, "global_step": 92751, "epoch": 552} {"train_loss": -9.334115982055664, "global_step": 92752, "epoch": 552} {"train_loss": -9.533990859985352, "global_step": 92753, "epoch": 552} {"train_loss": -9.428486824035645, "global_step": 92754, "epoch": 552} {"train_loss": -9.47469711303711, "global_step": 92755, "epoch": 552} {"train_loss": -9.378072738647461, "global_step": 92756, "epoch": 552} {"train_loss": -9.405080795288086, "global_step": 92757, "epoch": 552} {"train_loss": -9.238582611083984, "global_step": 92758, "epoch": 552} {"train_loss": -9.633232116699219, "global_step": 92759, "epoch": 552} {"train_loss": -9.006505012512207, "global_step": 92760, "epoch": 552} {"train_loss": -9.036713600158691, "global_step": 92761, "epoch": 552} {"train_loss": -9.533220291137695, "global_step": 92762, "epoch": 552} {"train_loss": -8.896475791931152, "global_step": 92763, "epoch": 552} {"train_loss": -9.561582565307617, "global_step": 92764, "epoch": 552} {"train_loss": -9.194726943969727, "global_step": 92765, "epoch": 552} {"train_loss": -9.299562454223633, "global_step": 92766, "epoch": 552} {"train_loss": -9.303359985351562, "global_step": 92767, "epoch": 552} {"train_loss": -9.485101699829102, "global_step": 92768, "epoch": 552} {"train_loss": -9.155972480773926, "global_step": 92769, "epoch": 552} {"train_loss": -9.169527053833008, "global_step": 92770, "epoch": 552} {"train_loss": -9.48622989654541, "global_step": 92771, "epoch": 552} {"train_loss": -9.269165992736816, "global_step": 92772, "epoch": 552} {"train_loss": -9.306012153625488, "global_step": 92773, "epoch": 552} {"train_loss": -9.348477363586426, "global_step": 92774, "epoch": 552} {"train_loss": -9.352107048034668, "global_step": 92775, "epoch": 552} {"train_loss": -9.400733947753906, "global_step": 92776, "epoch": 552} {"train_loss": -9.301663398742676, "global_step": 92777, "epoch": 552} {"train_loss": -9.503622055053711, "global_step": 92778, "epoch": 552} {"train_loss": -9.530694007873535, "global_step": 92779, "epoch": 552} {"train_loss": -9.577917098999023, "global_step": 92780, "epoch": 552} {"train_loss": -9.483240127563477, "global_step": 92781, "epoch": 552} {"train_loss": -9.251212120056152, "global_step": 92782, "epoch": 552} {"train_loss": -9.69550895690918, "global_step": 92783, "epoch": 552} {"train_loss": -9.664817810058594, "global_step": 92784, "epoch": 552} {"train_loss": -9.483993530273438, "global_step": 92785, "epoch": 552} {"train_loss": -9.448690414428711, "global_step": 92786, "epoch": 552} {"train_loss": -9.485453605651855, "global_step": 92787, "epoch": 552} {"train_loss": -9.496232986450195, "global_step": 92788, "epoch": 552} {"train_loss": -9.757205963134766, "global_step": 92789, "epoch": 552} {"train_loss": -9.684656143188477, "global_step": 92790, "epoch": 552} {"train_loss": -9.746496200561523, "global_step": 92791, "epoch": 552} {"train_loss": -9.786060333251953, "global_step": 92792, "epoch": 552} {"train_loss": -9.802302360534668, "global_step": 92793, "epoch": 552} {"train_loss": -9.628150939941406, "global_step": 92794, "epoch": 552} {"train_loss": -9.718912124633789, "global_step": 92795, "epoch": 552} {"train_loss": -9.899876594543457, "global_step": 92796, "epoch": 552} {"train_loss": -9.511484146118164, "global_step": 92797, "epoch": 552} {"train_loss": -9.67041301727295, "global_step": 92798, "epoch": 552} {"train_loss": -9.753507614135742, "global_step": 92799, "epoch": 552} {"train_loss": -9.564334869384766, "global_step": 92800, "epoch": 552} {"train_loss": -9.63128662109375, "global_step": 92801, "epoch": 552} {"train_loss": -9.405475616455078, "global_step": 92802, "epoch": 552} {"train_loss": -9.462753295898438, "global_step": 92803, "epoch": 552} {"train_loss": -9.677218437194824, "global_step": 92804, "epoch": 552} {"train_loss": -9.653280258178711, "global_step": 92805, "epoch": 552} {"train_loss": -9.629293441772461, "global_step": 92806, "epoch": 552} {"train_loss": -9.522781372070312, "global_step": 92807, "epoch": 552} {"train_loss": -9.559422492980957, "global_step": 92808, "epoch": 552} {"train_loss": -9.460423469543457, "global_step": 92809, "epoch": 552} {"train_loss": -9.490425109863281, "global_step": 92810, "epoch": 552} {"train_loss": -9.712297439575195, "global_step": 92811, "epoch": 552} {"train_loss": -9.739025115966797, "global_step": 92812, "epoch": 552} {"train_loss": -9.574432373046875, "global_step": 92813, "epoch": 552} {"train_loss": -9.592588424682617, "global_step": 92814, "epoch": 552} {"train_loss": -9.572330474853516, "global_step": 92815, "epoch": 552} {"train_loss": -9.266399383544922, "global_step": 92816, "epoch": 552} {"train_loss": -9.623847961425781, "global_step": 92817, "epoch": 552} {"train_loss": -9.509651184082031, "global_step": 92818, "epoch": 552} {"train_loss": -9.58041000366211, "global_step": 92819, "epoch": 552} {"train_loss": -9.552858352661133, "global_step": 92820, "epoch": 552} {"train_loss": -9.632772445678711, "global_step": 92821, "epoch": 552} {"train_loss": -9.81428337097168, "global_step": 92822, "epoch": 552} {"train_loss": -9.568197250366211, "global_step": 92823, "epoch": 552} {"train_loss": -9.725693702697754, "global_step": 92824, "epoch": 552} {"train_loss": -9.695588111877441, "global_step": 92825, "epoch": 552} {"train_loss": -9.725656509399414, "global_step": 92826, "epoch": 552} {"train_loss": -9.889829635620117, "global_step": 92827, "epoch": 552} {"train_loss": -9.513710021972656, "global_step": 92828, "epoch": 552} {"train_loss": -9.179022789001465, "global_step": 92829, "epoch": 552} {"train_loss": -9.395048141479492, "global_step": 92830, "epoch": 552} {"train_loss": -8.840465545654297, "global_step": 92831, "epoch": 552} {"train_loss": -9.228981018066406, "global_step": 92832, "epoch": 552} {"train_loss": -9.509317398071289, "global_step": 92833, "epoch": 552} {"train_loss": -9.426726341247559, "global_step": 92834, "epoch": 552} {"train_loss": -9.46348762512207, "global_step": 92835, "epoch": 552} {"train_loss": -9.265779495239258, "global_step": 92836, "epoch": 552} {"train_loss": -9.40909194946289, "global_step": 92837, "epoch": 552} {"train_loss": -9.41454029083252, "global_step": 92838, "epoch": 552} {"train_loss": -9.335103988647461, "global_step": 92839, "epoch": 552} {"train_loss": -9.404550552368164, "global_step": 92840, "epoch": 552} {"train_loss": -9.29935073852539, "global_step": 92841, "epoch": 552} {"train_loss": -9.65351676940918, "global_step": 92842, "epoch": 552} {"train_loss": -9.581524848937988, "global_step": 92843, "epoch": 552} {"train_loss": -9.5961275100708, "global_step": 92844, "epoch": 552} {"train_loss": -9.5286865234375, "global_step": 92845, "epoch": 552} {"train_loss": -9.661718368530273, "global_step": 92846, "epoch": 552} {"train_loss": -9.422800064086914, "global_step": 92847, "epoch": 552} {"train_loss": -9.472089767456055, "global_step": 92848, "epoch": 552} {"train_loss": -9.615653991699219, "global_step": 92849, "epoch": 552} {"train_loss": -9.561700820922852, "global_step": 92850, "epoch": 552} {"train_loss": -9.723220825195312, "global_step": 92851, "epoch": 552} {"train_loss": -9.770490646362305, "global_step": 92852, "epoch": 552} {"train_loss": -9.544523239135742, "global_step": 92853, "epoch": 552} {"train_loss": -9.86009693145752, "global_step": 92854, "epoch": 552} {"train_loss": -9.719841003417969, "global_step": 92855, "epoch": 552} {"train_loss": -9.531940460205078, "global_step": 92856, "epoch": 552} {"train_loss": -9.461212158203125, "global_step": 92857, "epoch": 552} {"train_loss": -9.467432975769043, "global_step": 92858, "epoch": 552} {"train_loss": -9.685393333435059, "global_step": 92859, "epoch": 552} {"train_loss": -9.567388534545898, "global_step": 92860, "epoch": 552} {"train_loss": -9.524564743041992, "global_step": 92861, "epoch": 552} {"train_loss": -9.539874076843262, "global_step": 92862, "epoch": 552} {"train_loss": -9.687962532043457, "global_step": 92863, "epoch": 552} {"train_loss": -9.412374496459961, "global_step": 92864, "epoch": 552} {"train_loss": -9.66695499420166, "global_step": 92865, "epoch": 552} {"train_loss": -9.651809692382812, "global_step": 92866, "epoch": 552} {"train_loss": -9.616645812988281, "global_step": 92867, "epoch": 552} {"train_loss": -9.596014022827148, "global_step": 92868, "epoch": 552} {"train_loss": -9.460552215576172, "global_step": 92869, "epoch": 552} {"train_loss": -9.886502265930176, "global_step": 92870, "epoch": 552} {"train_loss": -9.696874618530273, "global_step": 92871, "epoch": 552} {"train_loss": -9.732137680053711, "global_step": 92872, "epoch": 552} {"train_loss": -9.627679824829102, "global_step": 92873, "epoch": 552} {"train_loss": -9.576920509338379, "global_step": 92874, "epoch": 552} {"train_loss": -9.420623779296875, "global_step": 92875, "epoch": 552} {"train_loss": -9.67629623413086, "global_step": 92876, "epoch": 552} {"train_loss": -9.616765975952148, "global_step": 92877, "epoch": 552} {"train_loss": -9.465301513671875, "global_step": 92878, "epoch": 552} {"train_loss": -9.427006721496582, "global_step": 92879, "epoch": 552} {"train_loss": -9.637410163879395, "global_step": 92880, "epoch": 552} {"train_loss": -9.294214248657227, "global_step": 92881, "epoch": 552} {"train_loss": -9.496917724609375, "global_step": 92882, "epoch": 552} {"train_loss": -9.279810905456543, "global_step": 92883, "epoch": 552} {"train_loss": -9.448558807373047, "global_step": 92884, "epoch": 552} {"train_loss": -9.192093849182129, "global_step": 92885, "epoch": 552} {"train_loss": -9.22862720489502, "global_step": 92886, "epoch": 552} {"train_loss": -9.298686981201172, "global_step": 92887, "epoch": 552} {"train_loss": -9.05312728881836, "global_step": 92888, "epoch": 552} {"train_loss": -9.33585262298584, "global_step": 92889, "epoch": 552} {"train_loss": -9.122589111328125, "global_step": 92890, "epoch": 552} {"train_loss": -9.29531478881836, "global_step": 92891, "epoch": 552} {"train_loss": -9.01220703125, "global_step": 92892, "epoch": 552} {"train_loss": -9.084200859069824, "global_step": 92893, "epoch": 552} {"train_loss": -8.980074882507324, "global_step": 92894, "epoch": 552} {"train_loss": -9.125212669372559, "global_step": 92895, "epoch": 552} {"train_loss": -8.805683135986328, "global_step": 92896, "epoch": 552} {"train_loss": -9.307350158691406, "global_step": 92897, "epoch": 552} {"train_loss": -9.41036605834961, "global_step": 92898, "epoch": 552} {"train_loss": -9.320261001586914, "global_step": 92899, "epoch": 552} {"train_loss": -9.481071472167969, "global_step": 92900, "epoch": 552} {"train_loss": -9.324462890625, "global_step": 92901, "epoch": 552} {"train_loss": -9.409329414367676, "global_step": 92902, "epoch": 552} {"train_loss": -9.483895801362538, "global_step": 92903, "epoch": 552, "val_loss": 203884.90625} {"train_loss": -9.216657638549805, "global_step": 92904, "epoch": 553} {"train_loss": -9.52135944366455, "global_step": 92905, "epoch": 553} {"train_loss": -9.262394905090332, "global_step": 92906, "epoch": 553} {"train_loss": -9.662278175354004, "global_step": 92907, "epoch": 553} {"train_loss": -9.350680351257324, "global_step": 92908, "epoch": 553} {"train_loss": -9.241825103759766, "global_step": 92909, "epoch": 553} {"train_loss": -9.541074752807617, "global_step": 92910, "epoch": 553} {"train_loss": -9.444231033325195, "global_step": 92911, "epoch": 553} {"train_loss": -9.645933151245117, "global_step": 92912, "epoch": 553} {"train_loss": -9.561120986938477, "global_step": 92913, "epoch": 553} {"train_loss": -9.575176239013672, "global_step": 92914, "epoch": 553} {"train_loss": -9.677868843078613, "global_step": 92915, "epoch": 553} {"train_loss": -9.329120635986328, "global_step": 92916, "epoch": 553} {"train_loss": -9.566722869873047, "global_step": 92917, "epoch": 553} {"train_loss": -9.535755157470703, "global_step": 92918, "epoch": 553} {"train_loss": -9.440755844116211, "global_step": 92919, "epoch": 553} {"train_loss": -9.311525344848633, "global_step": 92920, "epoch": 553} {"train_loss": -9.64088249206543, "global_step": 92921, "epoch": 553} {"train_loss": -9.423576354980469, "global_step": 92922, "epoch": 553} {"train_loss": -9.544290542602539, "global_step": 92923, "epoch": 553} {"train_loss": -9.63361644744873, "global_step": 92924, "epoch": 553} {"train_loss": -9.37462043762207, "global_step": 92925, "epoch": 553} {"train_loss": -9.592914581298828, "global_step": 92926, "epoch": 553} {"train_loss": -9.873579025268555, "global_step": 92927, "epoch": 553} {"train_loss": -9.557292938232422, "global_step": 92928, "epoch": 553} {"train_loss": -9.466873168945312, "global_step": 92929, "epoch": 553} {"train_loss": -9.421207427978516, "global_step": 92930, "epoch": 553} {"train_loss": -9.519336700439453, "global_step": 92931, "epoch": 553} {"train_loss": -9.568066596984863, "global_step": 92932, "epoch": 553} {"train_loss": -9.49798583984375, "global_step": 92933, "epoch": 553} {"train_loss": -9.342806816101074, "global_step": 92934, "epoch": 553} {"train_loss": -9.815672874450684, "global_step": 92935, "epoch": 553} {"train_loss": -9.551298141479492, "global_step": 92936, "epoch": 553} {"train_loss": -9.62794017791748, "global_step": 92937, "epoch": 553} {"train_loss": -9.640165328979492, "global_step": 92938, "epoch": 553} {"train_loss": -9.775102615356445, "global_step": 92939, "epoch": 553} {"train_loss": -9.805506706237793, "global_step": 92940, "epoch": 553} {"train_loss": -9.584792137145996, "global_step": 92941, "epoch": 553} {"train_loss": -9.850875854492188, "global_step": 92942, "epoch": 553} {"train_loss": -9.618078231811523, "global_step": 92943, "epoch": 553} {"train_loss": -9.906862258911133, "global_step": 92944, "epoch": 553} {"train_loss": -9.810866355895996, "global_step": 92945, "epoch": 553} {"train_loss": -9.485657691955566, "global_step": 92946, "epoch": 553} {"train_loss": -10.042724609375, "global_step": 92947, "epoch": 553} {"train_loss": -9.6038818359375, "global_step": 92948, "epoch": 553} {"train_loss": -9.752677917480469, "global_step": 92949, "epoch": 553} {"train_loss": -9.592838287353516, "global_step": 92950, "epoch": 553} {"train_loss": -9.681446075439453, "global_step": 92951, "epoch": 553} {"train_loss": -9.793036460876465, "global_step": 92952, "epoch": 553} {"train_loss": -9.77605152130127, "global_step": 92953, "epoch": 553} {"train_loss": -9.630953788757324, "global_step": 92954, "epoch": 553} {"train_loss": -9.600381851196289, "global_step": 92955, "epoch": 553} {"train_loss": -9.662290573120117, "global_step": 92956, "epoch": 553} {"train_loss": -9.402753829956055, "global_step": 92957, "epoch": 553} {"train_loss": -9.668628692626953, "global_step": 92958, "epoch": 553} {"train_loss": -9.45736026763916, "global_step": 92959, "epoch": 553} {"train_loss": -9.393777847290039, "global_step": 92960, "epoch": 553} {"train_loss": -9.279613494873047, "global_step": 92961, "epoch": 553} {"train_loss": -9.642642974853516, "global_step": 92962, "epoch": 553} {"train_loss": -8.972678184509277, "global_step": 92963, "epoch": 553} {"train_loss": -8.994924545288086, "global_step": 92964, "epoch": 553} {"train_loss": -9.260754585266113, "global_step": 92965, "epoch": 553} {"train_loss": -9.423116683959961, "global_step": 92966, "epoch": 553} {"train_loss": -9.021343231201172, "global_step": 92967, "epoch": 553} {"train_loss": -9.32243537902832, "global_step": 92968, "epoch": 553} {"train_loss": -9.460145950317383, "global_step": 92969, "epoch": 553} {"train_loss": -9.14246654510498, "global_step": 92970, "epoch": 553} {"train_loss": -9.513643264770508, "global_step": 92971, "epoch": 553} {"train_loss": -9.275469779968262, "global_step": 92972, "epoch": 553} {"train_loss": -9.481279373168945, "global_step": 92973, "epoch": 553} {"train_loss": -9.401841163635254, "global_step": 92974, "epoch": 553} {"train_loss": -9.09390640258789, "global_step": 92975, "epoch": 553} {"train_loss": -9.471137046813965, "global_step": 92976, "epoch": 553} {"train_loss": -9.292771339416504, "global_step": 92977, "epoch": 553} {"train_loss": -9.366619110107422, "global_step": 92978, "epoch": 553} {"train_loss": -9.423989295959473, "global_step": 92979, "epoch": 553} {"train_loss": -9.210550308227539, "global_step": 92980, "epoch": 553} {"train_loss": -9.466409683227539, "global_step": 92981, "epoch": 553} {"train_loss": -9.30610179901123, "global_step": 92982, "epoch": 553} {"train_loss": -9.445103645324707, "global_step": 92983, "epoch": 553} {"train_loss": -9.188953399658203, "global_step": 92984, "epoch": 553} {"train_loss": -9.2781982421875, "global_step": 92985, "epoch": 553} {"train_loss": -9.312451362609863, "global_step": 92986, "epoch": 553} {"train_loss": -9.169822692871094, "global_step": 92987, "epoch": 553} {"train_loss": -9.253618240356445, "global_step": 92988, "epoch": 553} {"train_loss": -9.500659942626953, "global_step": 92989, "epoch": 553} {"train_loss": -9.21766471862793, "global_step": 92990, "epoch": 553} {"train_loss": -9.198227882385254, "global_step": 92991, "epoch": 553} {"train_loss": -9.14089584350586, "global_step": 92992, "epoch": 553} {"train_loss": -9.47143840789795, "global_step": 92993, "epoch": 553} {"train_loss": -9.453523635864258, "global_step": 92994, "epoch": 553} {"train_loss": -9.40066909790039, "global_step": 92995, "epoch": 553} {"train_loss": -9.479866027832031, "global_step": 92996, "epoch": 553} {"train_loss": -9.566367149353027, "global_step": 92997, "epoch": 553} {"train_loss": -9.649402618408203, "global_step": 92998, "epoch": 553} {"train_loss": -9.633663177490234, "global_step": 92999, "epoch": 553} {"train_loss": -9.674074172973633, "global_step": 93000, "epoch": 553} {"train_loss": -9.757439613342285, "global_step": 93001, "epoch": 553} {"train_loss": -9.736616134643555, "global_step": 93002, "epoch": 553} {"train_loss": -9.633749008178711, "global_step": 93003, "epoch": 553} {"train_loss": -9.629826545715332, "global_step": 93004, "epoch": 553} {"train_loss": -9.408679962158203, "global_step": 93005, "epoch": 553} {"train_loss": -9.592637062072754, "global_step": 93006, "epoch": 553} {"train_loss": -9.846210479736328, "global_step": 93007, "epoch": 553} {"train_loss": -9.840214729309082, "global_step": 93008, "epoch": 553} {"train_loss": -9.806061744689941, "global_step": 93009, "epoch": 553} {"train_loss": -9.930411338806152, "global_step": 93010, "epoch": 553} {"train_loss": -9.67269515991211, "global_step": 93011, "epoch": 553} {"train_loss": -9.748798370361328, "global_step": 93012, "epoch": 553} {"train_loss": -9.752424240112305, "global_step": 93013, "epoch": 553} {"train_loss": -9.623692512512207, "global_step": 93014, "epoch": 553} {"train_loss": -9.581387519836426, "global_step": 93015, "epoch": 553} {"train_loss": -9.219213485717773, "global_step": 93016, "epoch": 553} {"train_loss": -9.55111312866211, "global_step": 93017, "epoch": 553} {"train_loss": -9.032426834106445, "global_step": 93018, "epoch": 553} {"train_loss": -9.541715621948242, "global_step": 93019, "epoch": 553} {"train_loss": -9.220415115356445, "global_step": 93020, "epoch": 553} {"train_loss": -9.195318222045898, "global_step": 93021, "epoch": 553} {"train_loss": -9.237412452697754, "global_step": 93022, "epoch": 553} {"train_loss": -9.492256164550781, "global_step": 93023, "epoch": 553} {"train_loss": -9.297701835632324, "global_step": 93024, "epoch": 553} {"train_loss": -9.363560676574707, "global_step": 93025, "epoch": 553} {"train_loss": -9.527236938476562, "global_step": 93026, "epoch": 553} {"train_loss": -9.568766593933105, "global_step": 93027, "epoch": 553} {"train_loss": -9.62738037109375, "global_step": 93028, "epoch": 553} {"train_loss": -9.556034088134766, "global_step": 93029, "epoch": 553} {"train_loss": -9.474176406860352, "global_step": 93030, "epoch": 553} {"train_loss": -9.555695533752441, "global_step": 93031, "epoch": 553} {"train_loss": -9.608301162719727, "global_step": 93032, "epoch": 553} {"train_loss": -9.321876525878906, "global_step": 93033, "epoch": 553} {"train_loss": -9.527385711669922, "global_step": 93034, "epoch": 553} {"train_loss": -9.28455924987793, "global_step": 93035, "epoch": 553} {"train_loss": -9.349056243896484, "global_step": 93036, "epoch": 553} {"train_loss": -9.612529754638672, "global_step": 93037, "epoch": 553} {"train_loss": -9.297039985656738, "global_step": 93038, "epoch": 553} {"train_loss": -9.495149612426758, "global_step": 93039, "epoch": 553} {"train_loss": -9.667840003967285, "global_step": 93040, "epoch": 553} {"train_loss": -9.51359748840332, "global_step": 93041, "epoch": 553} {"train_loss": -9.571165084838867, "global_step": 93042, "epoch": 553} {"train_loss": -9.615827560424805, "global_step": 93043, "epoch": 553} {"train_loss": -9.688675880432129, "global_step": 93044, "epoch": 553} {"train_loss": -9.56109619140625, "global_step": 93045, "epoch": 553} {"train_loss": -9.462337493896484, "global_step": 93046, "epoch": 553} {"train_loss": -9.452499389648438, "global_step": 93047, "epoch": 553} {"train_loss": -9.744949340820312, "global_step": 93048, "epoch": 553} {"train_loss": -9.700453758239746, "global_step": 93049, "epoch": 553} {"train_loss": -9.591543197631836, "global_step": 93050, "epoch": 553} {"train_loss": -9.485369682312012, "global_step": 93051, "epoch": 553} {"train_loss": -9.624990463256836, "global_step": 93052, "epoch": 553} {"train_loss": -9.580699920654297, "global_step": 93053, "epoch": 553} {"train_loss": -9.29464340209961, "global_step": 93054, "epoch": 553} {"train_loss": -9.39812183380127, "global_step": 93055, "epoch": 553} {"train_loss": -9.595352172851562, "global_step": 93056, "epoch": 553} {"train_loss": -9.662809371948242, "global_step": 93057, "epoch": 553} {"train_loss": -9.531509399414062, "global_step": 93058, "epoch": 553} {"train_loss": -9.553016662597656, "global_step": 93059, "epoch": 553} {"train_loss": -9.526595115661621, "global_step": 93060, "epoch": 553} {"train_loss": -9.562980651855469, "global_step": 93061, "epoch": 553} {"train_loss": -9.560311317443848, "global_step": 93062, "epoch": 553} {"train_loss": -9.52678394317627, "global_step": 93063, "epoch": 553} {"train_loss": -9.671379089355469, "global_step": 93064, "epoch": 553} {"train_loss": -9.18271255493164, "global_step": 93065, "epoch": 553} {"train_loss": -9.469968795776367, "global_step": 93066, "epoch": 553} {"train_loss": -9.432695388793945, "global_step": 93067, "epoch": 553} {"train_loss": -9.505643844604492, "global_step": 93068, "epoch": 553} {"train_loss": -9.829297065734863, "global_step": 93069, "epoch": 553} {"train_loss": -9.477715492248535, "global_step": 93070, "epoch": 553} {"train_loss": -9.505199063391913, "global_step": 93071, "epoch": 553, "val_loss": 209833.296875} {"train_loss": -9.536787033081055, "global_step": 93072, "epoch": 554} {"train_loss": -9.30482292175293, "global_step": 93073, "epoch": 554} {"train_loss": -9.417277336120605, "global_step": 93074, "epoch": 554} {"train_loss": -9.572442054748535, "global_step": 93075, "epoch": 554} {"train_loss": -9.215263366699219, "global_step": 93076, "epoch": 554} {"train_loss": -9.483377456665039, "global_step": 93077, "epoch": 554} {"train_loss": -9.341045379638672, "global_step": 93078, "epoch": 554} {"train_loss": -9.226713180541992, "global_step": 93079, "epoch": 554} {"train_loss": -9.50870132446289, "global_step": 93080, "epoch": 554} {"train_loss": -9.564226150512695, "global_step": 93081, "epoch": 554} {"train_loss": -9.281258583068848, "global_step": 93082, "epoch": 554} {"train_loss": -9.43438720703125, "global_step": 93083, "epoch": 554} {"train_loss": -9.431119918823242, "global_step": 93084, "epoch": 554} {"train_loss": -9.373285293579102, "global_step": 93085, "epoch": 554} {"train_loss": -9.55072021484375, "global_step": 93086, "epoch": 554} {"train_loss": -9.274665832519531, "global_step": 93087, "epoch": 554} {"train_loss": -9.337879180908203, "global_step": 93088, "epoch": 554} {"train_loss": -8.983292579650879, "global_step": 93089, "epoch": 554} {"train_loss": -9.205924987792969, "global_step": 93090, "epoch": 554} {"train_loss": -9.198383331298828, "global_step": 93091, "epoch": 554} {"train_loss": -9.30008316040039, "global_step": 93092, "epoch": 554} {"train_loss": -9.305316925048828, "global_step": 93093, "epoch": 554} {"train_loss": -9.150066375732422, "global_step": 93094, "epoch": 554} {"train_loss": -9.10701847076416, "global_step": 93095, "epoch": 554} {"train_loss": -9.223630905151367, "global_step": 93096, "epoch": 554} {"train_loss": -9.080866813659668, "global_step": 93097, "epoch": 554} {"train_loss": -9.043878555297852, "global_step": 93098, "epoch": 554} {"train_loss": -9.343032836914062, "global_step": 93099, "epoch": 554} {"train_loss": -9.339195251464844, "global_step": 93100, "epoch": 554} {"train_loss": -8.91698932647705, "global_step": 93101, "epoch": 554} {"train_loss": -9.433256149291992, "global_step": 93102, "epoch": 554} {"train_loss": -9.228788375854492, "global_step": 93103, "epoch": 554} {"train_loss": -9.317850112915039, "global_step": 93104, "epoch": 554} {"train_loss": -9.484703063964844, "global_step": 93105, "epoch": 554} {"train_loss": -9.676284790039062, "global_step": 93106, "epoch": 554} {"train_loss": -9.329607009887695, "global_step": 93107, "epoch": 554} {"train_loss": -9.404701232910156, "global_step": 93108, "epoch": 554} {"train_loss": -9.277450561523438, "global_step": 93109, "epoch": 554} {"train_loss": -9.256964683532715, "global_step": 93110, "epoch": 554} {"train_loss": -9.437840461730957, "global_step": 93111, "epoch": 554} {"train_loss": -9.49746036529541, "global_step": 93112, "epoch": 554} {"train_loss": -9.162454605102539, "global_step": 93113, "epoch": 554} {"train_loss": -9.608174324035645, "global_step": 93114, "epoch": 554} {"train_loss": -9.482409477233887, "global_step": 93115, "epoch": 554} {"train_loss": -9.626445770263672, "global_step": 93116, "epoch": 554} {"train_loss": -9.311965942382812, "global_step": 93117, "epoch": 554} {"train_loss": -9.389644622802734, "global_step": 93118, "epoch": 554} {"train_loss": -9.435063362121582, "global_step": 93119, "epoch": 554} {"train_loss": -9.342135429382324, "global_step": 93120, "epoch": 554} {"train_loss": -9.696879386901855, "global_step": 93121, "epoch": 554} {"train_loss": -9.466449737548828, "global_step": 93122, "epoch": 554} {"train_loss": -9.54440689086914, "global_step": 93123, "epoch": 554} {"train_loss": -9.56533432006836, "global_step": 93124, "epoch": 554} {"train_loss": -9.6357421875, "global_step": 93125, "epoch": 554} {"train_loss": -9.641075134277344, "global_step": 93126, "epoch": 554} {"train_loss": -9.460250854492188, "global_step": 93127, "epoch": 554} {"train_loss": -9.661250114440918, "global_step": 93128, "epoch": 554} {"train_loss": -9.20966911315918, "global_step": 93129, "epoch": 554} {"train_loss": -9.483025550842285, "global_step": 93130, "epoch": 554} {"train_loss": -9.451942443847656, "global_step": 93131, "epoch": 554} {"train_loss": -9.66923713684082, "global_step": 93132, "epoch": 554} {"train_loss": -9.621926307678223, "global_step": 93133, "epoch": 554} {"train_loss": -9.47010612487793, "global_step": 93134, "epoch": 554} {"train_loss": -9.42249870300293, "global_step": 93135, "epoch": 554} {"train_loss": -9.323675155639648, "global_step": 93136, "epoch": 554} {"train_loss": -9.273124694824219, "global_step": 93137, "epoch": 554} {"train_loss": -9.408470153808594, "global_step": 93138, "epoch": 554} {"train_loss": -9.334220886230469, "global_step": 93139, "epoch": 554} {"train_loss": -9.458868026733398, "global_step": 93140, "epoch": 554} {"train_loss": -9.076330184936523, "global_step": 93141, "epoch": 554} {"train_loss": -9.449113845825195, "global_step": 93142, "epoch": 554} {"train_loss": -9.08386516571045, "global_step": 93143, "epoch": 554} {"train_loss": -9.274169921875, "global_step": 93144, "epoch": 554} {"train_loss": -9.702153205871582, "global_step": 93145, "epoch": 554} {"train_loss": -9.539158821105957, "global_step": 93146, "epoch": 554} {"train_loss": -9.613468170166016, "global_step": 93147, "epoch": 554} {"train_loss": -9.734428405761719, "global_step": 93148, "epoch": 554} {"train_loss": -9.460002899169922, "global_step": 93149, "epoch": 554} {"train_loss": -9.588749885559082, "global_step": 93150, "epoch": 554} {"train_loss": -9.633169174194336, "global_step": 93151, "epoch": 554} {"train_loss": -9.405594825744629, "global_step": 93152, "epoch": 554} {"train_loss": -9.551675796508789, "global_step": 93153, "epoch": 554} {"train_loss": -9.380733489990234, "global_step": 93154, "epoch": 554} {"train_loss": -9.707900047302246, "global_step": 93155, "epoch": 554} {"train_loss": -9.623140335083008, "global_step": 93156, "epoch": 554} {"train_loss": -9.482826232910156, "global_step": 93157, "epoch": 554} {"train_loss": -9.652650833129883, "global_step": 93158, "epoch": 554} {"train_loss": -9.605823516845703, "global_step": 93159, "epoch": 554} {"train_loss": -9.523154258728027, "global_step": 93160, "epoch": 554} {"train_loss": -9.822271347045898, "global_step": 93161, "epoch": 554} {"train_loss": -9.317523002624512, "global_step": 93162, "epoch": 554} {"train_loss": -9.515657424926758, "global_step": 93163, "epoch": 554} {"train_loss": -9.684754371643066, "global_step": 93164, "epoch": 554} {"train_loss": -9.683743476867676, "global_step": 93165, "epoch": 554} {"train_loss": -9.897968292236328, "global_step": 93166, "epoch": 554} {"train_loss": -9.657907485961914, "global_step": 93167, "epoch": 554} {"train_loss": -9.768510818481445, "global_step": 93168, "epoch": 554} {"train_loss": -9.949071884155273, "global_step": 93169, "epoch": 554} {"train_loss": -9.638984680175781, "global_step": 93170, "epoch": 554} {"train_loss": -9.742826461791992, "global_step": 93171, "epoch": 554} {"train_loss": -9.640501976013184, "global_step": 93172, "epoch": 554} {"train_loss": -9.701709747314453, "global_step": 93173, "epoch": 554} {"train_loss": -9.633660316467285, "global_step": 93174, "epoch": 554} {"train_loss": -9.399652481079102, "global_step": 93175, "epoch": 554} {"train_loss": -9.373205184936523, "global_step": 93176, "epoch": 554} {"train_loss": -9.390279769897461, "global_step": 93177, "epoch": 554} {"train_loss": -9.703798294067383, "global_step": 93178, "epoch": 554} {"train_loss": -9.21827507019043, "global_step": 93179, "epoch": 554} {"train_loss": -9.687931060791016, "global_step": 93180, "epoch": 554} {"train_loss": -9.427452087402344, "global_step": 93181, "epoch": 554} {"train_loss": -9.516721725463867, "global_step": 93182, "epoch": 554} {"train_loss": -9.722960472106934, "global_step": 93183, "epoch": 554} {"train_loss": -9.451827049255371, "global_step": 93184, "epoch": 554} {"train_loss": -9.593811988830566, "global_step": 93185, "epoch": 554} {"train_loss": -9.796370506286621, "global_step": 93186, "epoch": 554} {"train_loss": -9.614508628845215, "global_step": 93187, "epoch": 554} {"train_loss": -9.609302520751953, "global_step": 93188, "epoch": 554} {"train_loss": -9.594207763671875, "global_step": 93189, "epoch": 554} {"train_loss": -9.566551208496094, "global_step": 93190, "epoch": 554} {"train_loss": -9.462240219116211, "global_step": 93191, "epoch": 554} {"train_loss": -9.40379524230957, "global_step": 93192, "epoch": 554} {"train_loss": -9.511701583862305, "global_step": 93193, "epoch": 554} {"train_loss": -9.64892578125, "global_step": 93194, "epoch": 554} {"train_loss": -9.66585922241211, "global_step": 93195, "epoch": 554} {"train_loss": -9.427356719970703, "global_step": 93196, "epoch": 554} {"train_loss": -9.060440063476562, "global_step": 93197, "epoch": 554} {"train_loss": -9.418964385986328, "global_step": 93198, "epoch": 554} {"train_loss": -9.113134384155273, "global_step": 93199, "epoch": 554} {"train_loss": -9.091839790344238, "global_step": 93200, "epoch": 554} {"train_loss": -9.278676986694336, "global_step": 93201, "epoch": 554} {"train_loss": -8.86279296875, "global_step": 93202, "epoch": 554} {"train_loss": -9.139222145080566, "global_step": 93203, "epoch": 554} {"train_loss": -9.350044250488281, "global_step": 93204, "epoch": 554} {"train_loss": -9.23822021484375, "global_step": 93205, "epoch": 554} {"train_loss": -9.096927642822266, "global_step": 93206, "epoch": 554} {"train_loss": -9.483271598815918, "global_step": 93207, "epoch": 554} {"train_loss": -9.527779579162598, "global_step": 93208, "epoch": 554} {"train_loss": -9.436038970947266, "global_step": 93209, "epoch": 554} {"train_loss": -9.295417785644531, "global_step": 93210, "epoch": 554} {"train_loss": -9.331483840942383, "global_step": 93211, "epoch": 554} {"train_loss": -9.31035041809082, "global_step": 93212, "epoch": 554} {"train_loss": -9.278486251831055, "global_step": 93213, "epoch": 554} {"train_loss": -9.451170921325684, "global_step": 93214, "epoch": 554} {"train_loss": -9.316722869873047, "global_step": 93215, "epoch": 554} {"train_loss": -9.506766319274902, "global_step": 93216, "epoch": 554} {"train_loss": -9.31677532196045, "global_step": 93217, "epoch": 554} {"train_loss": -9.378471374511719, "global_step": 93218, "epoch": 554} {"train_loss": -9.365331649780273, "global_step": 93219, "epoch": 554} {"train_loss": -9.46243667602539, "global_step": 93220, "epoch": 554} {"train_loss": -9.225563049316406, "global_step": 93221, "epoch": 554} {"train_loss": -9.517542839050293, "global_step": 93222, "epoch": 554} {"train_loss": -9.331842422485352, "global_step": 93223, "epoch": 554} {"train_loss": -9.419929504394531, "global_step": 93224, "epoch": 554} {"train_loss": -9.305868148803711, "global_step": 93225, "epoch": 554} {"train_loss": -9.806111335754395, "global_step": 93226, "epoch": 554} {"train_loss": -9.307924270629883, "global_step": 93227, "epoch": 554} {"train_loss": -9.614326477050781, "global_step": 93228, "epoch": 554} {"train_loss": -9.424356460571289, "global_step": 93229, "epoch": 554} {"train_loss": -9.557619094848633, "global_step": 93230, "epoch": 554} {"train_loss": -9.641878128051758, "global_step": 93231, "epoch": 554} {"train_loss": -9.668977737426758, "global_step": 93232, "epoch": 554} {"train_loss": -9.465024948120117, "global_step": 93233, "epoch": 554} {"train_loss": -9.617085456848145, "global_step": 93234, "epoch": 554} {"train_loss": -9.29029369354248, "global_step": 93235, "epoch": 554} {"train_loss": -9.488007545471191, "global_step": 93236, "epoch": 554} {"train_loss": -9.505617141723633, "global_step": 93237, "epoch": 554} {"train_loss": -9.467670440673828, "global_step": 93238, "epoch": 554} {"train_loss": -9.442561768350147, "global_step": 93239, "epoch": 554, "val_loss": 205264.546875} {"train_loss": -9.410577774047852, "global_step": 93240, "epoch": 555} {"train_loss": -9.717910766601562, "global_step": 93241, "epoch": 555} {"train_loss": -9.74532413482666, "global_step": 93242, "epoch": 555} {"train_loss": -9.651362419128418, "global_step": 93243, "epoch": 555} {"train_loss": -9.602095603942871, "global_step": 93244, "epoch": 555} {"train_loss": -9.252480506896973, "global_step": 93245, "epoch": 555} {"train_loss": -9.625940322875977, "global_step": 93246, "epoch": 555} {"train_loss": -9.36041259765625, "global_step": 93247, "epoch": 555} {"train_loss": -9.763461112976074, "global_step": 93248, "epoch": 555} {"train_loss": -9.486143112182617, "global_step": 93249, "epoch": 555} {"train_loss": -9.426429748535156, "global_step": 93250, "epoch": 555} {"train_loss": -9.528936386108398, "global_step": 93251, "epoch": 555} {"train_loss": -9.392557144165039, "global_step": 93252, "epoch": 555} {"train_loss": -9.73705005645752, "global_step": 93253, "epoch": 555} {"train_loss": -9.362386703491211, "global_step": 93254, "epoch": 555} {"train_loss": -9.774099349975586, "global_step": 93255, "epoch": 555} {"train_loss": -9.601900100708008, "global_step": 93256, "epoch": 555} {"train_loss": -9.798970222473145, "global_step": 93257, "epoch": 555} {"train_loss": -9.529671669006348, "global_step": 93258, "epoch": 555} {"train_loss": -9.772570610046387, "global_step": 93259, "epoch": 555} {"train_loss": -9.586567878723145, "global_step": 93260, "epoch": 555} {"train_loss": -9.389606475830078, "global_step": 93261, "epoch": 555} {"train_loss": -9.399370193481445, "global_step": 93262, "epoch": 555} {"train_loss": -9.324745178222656, "global_step": 93263, "epoch": 555} {"train_loss": -9.456926345825195, "global_step": 93264, "epoch": 555} {"train_loss": -9.398364067077637, "global_step": 93265, "epoch": 555} {"train_loss": -9.392601013183594, "global_step": 93266, "epoch": 555} {"train_loss": -9.476386070251465, "global_step": 93267, "epoch": 555} {"train_loss": -9.372474670410156, "global_step": 93268, "epoch": 555} {"train_loss": -9.347488403320312, "global_step": 93269, "epoch": 555} {"train_loss": -9.257781982421875, "global_step": 93270, "epoch": 555} {"train_loss": -9.519963264465332, "global_step": 93271, "epoch": 555} {"train_loss": -9.37814998626709, "global_step": 93272, "epoch": 555} {"train_loss": -9.4414701461792, "global_step": 93273, "epoch": 555} {"train_loss": -9.512945175170898, "global_step": 93274, "epoch": 555} {"train_loss": -9.14963436126709, "global_step": 93275, "epoch": 555} {"train_loss": -9.545523643493652, "global_step": 93276, "epoch": 555} {"train_loss": -9.378442764282227, "global_step": 93277, "epoch": 555} {"train_loss": -9.644671440124512, "global_step": 93278, "epoch": 555} {"train_loss": -9.454527854919434, "global_step": 93279, "epoch": 555} {"train_loss": -9.331674575805664, "global_step": 93280, "epoch": 555} {"train_loss": -9.785626411437988, "global_step": 93281, "epoch": 555} {"train_loss": -9.539094924926758, "global_step": 93282, "epoch": 555} {"train_loss": -9.58867359161377, "global_step": 93283, "epoch": 555} {"train_loss": -9.325691223144531, "global_step": 93284, "epoch": 555} {"train_loss": -9.401000022888184, "global_step": 93285, "epoch": 555} {"train_loss": -9.501629829406738, "global_step": 93286, "epoch": 555} {"train_loss": -9.285548210144043, "global_step": 93287, "epoch": 555} {"train_loss": -9.533744812011719, "global_step": 93288, "epoch": 555} {"train_loss": -9.685018539428711, "global_step": 93289, "epoch": 555} {"train_loss": -9.515045166015625, "global_step": 93290, "epoch": 555} {"train_loss": -9.632820129394531, "global_step": 93291, "epoch": 555} {"train_loss": -9.620849609375, "global_step": 93292, "epoch": 555} {"train_loss": -9.729028701782227, "global_step": 93293, "epoch": 555} {"train_loss": -9.61518669128418, "global_step": 93294, "epoch": 555} {"train_loss": -9.28724479675293, "global_step": 93295, "epoch": 555} {"train_loss": -9.58493423461914, "global_step": 93296, "epoch": 555} {"train_loss": -9.47243881225586, "global_step": 93297, "epoch": 555} {"train_loss": -9.332801818847656, "global_step": 93298, "epoch": 555} {"train_loss": -9.345191955566406, "global_step": 93299, "epoch": 555} {"train_loss": -9.616453170776367, "global_step": 93300, "epoch": 555} {"train_loss": -9.538909912109375, "global_step": 93301, "epoch": 555} {"train_loss": -9.741085052490234, "global_step": 93302, "epoch": 555} {"train_loss": -9.721305847167969, "global_step": 93303, "epoch": 555} {"train_loss": -9.847955703735352, "global_step": 93304, "epoch": 555} {"train_loss": -9.645466804504395, "global_step": 93305, "epoch": 555} {"train_loss": -9.213608741760254, "global_step": 93306, "epoch": 555} {"train_loss": -9.751022338867188, "global_step": 93307, "epoch": 555} {"train_loss": -9.245613098144531, "global_step": 93308, "epoch": 555} {"train_loss": -9.474701881408691, "global_step": 93309, "epoch": 555} {"train_loss": -9.156188011169434, "global_step": 93310, "epoch": 555} {"train_loss": -9.099573135375977, "global_step": 93311, "epoch": 555} {"train_loss": -9.442109107971191, "global_step": 93312, "epoch": 555} {"train_loss": -9.149052619934082, "global_step": 93313, "epoch": 555} {"train_loss": -9.468788146972656, "global_step": 93314, "epoch": 555} {"train_loss": -8.996237754821777, "global_step": 93315, "epoch": 555} {"train_loss": -9.589303970336914, "global_step": 93316, "epoch": 555} {"train_loss": -8.959758758544922, "global_step": 93317, "epoch": 555} {"train_loss": -9.09840202331543, "global_step": 93318, "epoch": 555} {"train_loss": -9.409774780273438, "global_step": 93319, "epoch": 555} {"train_loss": -8.991647720336914, "global_step": 93320, "epoch": 555} {"train_loss": -9.247129440307617, "global_step": 93321, "epoch": 555} {"train_loss": -9.328320503234863, "global_step": 93322, "epoch": 555} {"train_loss": -9.199223518371582, "global_step": 93323, "epoch": 555} {"train_loss": -9.062801361083984, "global_step": 93324, "epoch": 555} {"train_loss": -9.467884063720703, "global_step": 93325, "epoch": 555} {"train_loss": -9.597233772277832, "global_step": 93326, "epoch": 555} {"train_loss": -9.315011978149414, "global_step": 93327, "epoch": 555} {"train_loss": -9.343157768249512, "global_step": 93328, "epoch": 555} {"train_loss": -9.403358459472656, "global_step": 93329, "epoch": 555} {"train_loss": -9.429445266723633, "global_step": 93330, "epoch": 555} {"train_loss": -9.237939834594727, "global_step": 93331, "epoch": 555} {"train_loss": -9.820928573608398, "global_step": 93332, "epoch": 555} {"train_loss": -9.266777992248535, "global_step": 93333, "epoch": 555} {"train_loss": -9.342954635620117, "global_step": 93334, "epoch": 555} {"train_loss": -9.327301025390625, "global_step": 93335, "epoch": 555} {"train_loss": -9.224712371826172, "global_step": 93336, "epoch": 555} {"train_loss": -9.370583534240723, "global_step": 93337, "epoch": 555} {"train_loss": -9.326702117919922, "global_step": 93338, "epoch": 555} {"train_loss": -9.499589920043945, "global_step": 93339, "epoch": 555} {"train_loss": -9.148263931274414, "global_step": 93340, "epoch": 555} {"train_loss": -9.671684265136719, "global_step": 93341, "epoch": 555} {"train_loss": -9.045969009399414, "global_step": 93342, "epoch": 555} {"train_loss": -9.368295669555664, "global_step": 93343, "epoch": 555} {"train_loss": -9.523397445678711, "global_step": 93344, "epoch": 555} {"train_loss": -8.980241775512695, "global_step": 93345, "epoch": 555} {"train_loss": -9.79646110534668, "global_step": 93346, "epoch": 555} {"train_loss": -9.239917755126953, "global_step": 93347, "epoch": 555} {"train_loss": -9.183916091918945, "global_step": 93348, "epoch": 555} {"train_loss": -9.436821937561035, "global_step": 93349, "epoch": 555} {"train_loss": -9.558016777038574, "global_step": 93350, "epoch": 555} {"train_loss": -9.419713973999023, "global_step": 93351, "epoch": 555} {"train_loss": -9.3863525390625, "global_step": 93352, "epoch": 555} {"train_loss": -9.452523231506348, "global_step": 93353, "epoch": 555} {"train_loss": -9.601675033569336, "global_step": 93354, "epoch": 555} {"train_loss": -9.455328941345215, "global_step": 93355, "epoch": 555} {"train_loss": -9.478370666503906, "global_step": 93356, "epoch": 555} {"train_loss": -9.658401489257812, "global_step": 93357, "epoch": 555} {"train_loss": -9.470691680908203, "global_step": 93358, "epoch": 555} {"train_loss": -9.581991195678711, "global_step": 93359, "epoch": 555} {"train_loss": -9.475913047790527, "global_step": 93360, "epoch": 555} {"train_loss": -9.69466781616211, "global_step": 93361, "epoch": 555} {"train_loss": -9.211469650268555, "global_step": 93362, "epoch": 555} {"train_loss": -9.440147399902344, "global_step": 93363, "epoch": 555} {"train_loss": -9.569604873657227, "global_step": 93364, "epoch": 555} {"train_loss": -9.421892166137695, "global_step": 93365, "epoch": 555} {"train_loss": -9.56593132019043, "global_step": 93366, "epoch": 555} {"train_loss": -9.508317947387695, "global_step": 93367, "epoch": 555} {"train_loss": -9.501276016235352, "global_step": 93368, "epoch": 555} {"train_loss": -9.510063171386719, "global_step": 93369, "epoch": 555} {"train_loss": -9.436614036560059, "global_step": 93370, "epoch": 555} {"train_loss": -9.447441101074219, "global_step": 93371, "epoch": 555} {"train_loss": -9.611465454101562, "global_step": 93372, "epoch": 555} {"train_loss": -9.63977336883545, "global_step": 93373, "epoch": 555} {"train_loss": -9.631728172302246, "global_step": 93374, "epoch": 555} {"train_loss": -9.601095199584961, "global_step": 93375, "epoch": 555} {"train_loss": -9.669147491455078, "global_step": 93376, "epoch": 555} {"train_loss": -9.86452865600586, "global_step": 93377, "epoch": 555} {"train_loss": -9.615158081054688, "global_step": 93378, "epoch": 555} {"train_loss": -9.616674423217773, "global_step": 93379, "epoch": 555} {"train_loss": -9.641386032104492, "global_step": 93380, "epoch": 555} {"train_loss": -9.673134803771973, "global_step": 93381, "epoch": 555} {"train_loss": -9.784561157226562, "global_step": 93382, "epoch": 555} {"train_loss": -9.595633506774902, "global_step": 93383, "epoch": 555} {"train_loss": -9.445537567138672, "global_step": 93384, "epoch": 555} {"train_loss": -9.482613563537598, "global_step": 93385, "epoch": 555} {"train_loss": -9.671528816223145, "global_step": 93386, "epoch": 555} {"train_loss": -9.910677909851074, "global_step": 93387, "epoch": 555} {"train_loss": -9.587308883666992, "global_step": 93388, "epoch": 555} {"train_loss": -9.63982105255127, "global_step": 93389, "epoch": 555} {"train_loss": -9.66500473022461, "global_step": 93390, "epoch": 555} {"train_loss": -9.507610321044922, "global_step": 93391, "epoch": 555} {"train_loss": -9.643638610839844, "global_step": 93392, "epoch": 555} {"train_loss": -9.524731636047363, "global_step": 93393, "epoch": 555} {"train_loss": -9.509105682373047, "global_step": 93394, "epoch": 555} {"train_loss": -9.819948196411133, "global_step": 93395, "epoch": 555} {"train_loss": -9.461067199707031, "global_step": 93396, "epoch": 555} {"train_loss": -9.506678581237793, "global_step": 93397, "epoch": 555} {"train_loss": -9.601980209350586, "global_step": 93398, "epoch": 555} {"train_loss": -9.59869384765625, "global_step": 93399, "epoch": 555} {"train_loss": -9.33584213256836, "global_step": 93400, "epoch": 555} {"train_loss": -9.379049301147461, "global_step": 93401, "epoch": 555} {"train_loss": -9.458271980285645, "global_step": 93402, "epoch": 555} {"train_loss": -9.139925003051758, "global_step": 93403, "epoch": 555} {"train_loss": -9.457746505737305, "global_step": 93404, "epoch": 555} {"train_loss": -9.474418640136719, "global_step": 93405, "epoch": 555} {"train_loss": -9.478435516357422, "global_step": 93406, "epoch": 555} {"train_loss": -9.47556833993821, "global_step": 93407, "epoch": 555, "val_loss": 204222.25, "train_action_mse_error": 7.195193767547607} {"train_loss": -9.34459400177002, "global_step": 93408, "epoch": 556} {"train_loss": -9.358055114746094, "global_step": 93409, "epoch": 556} {"train_loss": -9.631431579589844, "global_step": 93410, "epoch": 556} {"train_loss": -9.259201049804688, "global_step": 93411, "epoch": 556} {"train_loss": -9.631067276000977, "global_step": 93412, "epoch": 556} {"train_loss": -9.420602798461914, "global_step": 93413, "epoch": 556} {"train_loss": -9.604408264160156, "global_step": 93414, "epoch": 556} {"train_loss": -9.500844955444336, "global_step": 93415, "epoch": 556} {"train_loss": -9.492115020751953, "global_step": 93416, "epoch": 556} {"train_loss": -9.369152069091797, "global_step": 93417, "epoch": 556} {"train_loss": -9.536996841430664, "global_step": 93418, "epoch": 556} {"train_loss": -9.690448760986328, "global_step": 93419, "epoch": 556} {"train_loss": -9.408975601196289, "global_step": 93420, "epoch": 556} {"train_loss": -9.428694725036621, "global_step": 93421, "epoch": 556} {"train_loss": -9.149961471557617, "global_step": 93422, "epoch": 556} {"train_loss": -9.253210067749023, "global_step": 93423, "epoch": 556} {"train_loss": -9.181865692138672, "global_step": 93424, "epoch": 556} {"train_loss": -9.617366790771484, "global_step": 93425, "epoch": 556} {"train_loss": -9.351190567016602, "global_step": 93426, "epoch": 556} {"train_loss": -9.465677261352539, "global_step": 93427, "epoch": 556} {"train_loss": -9.46939468383789, "global_step": 93428, "epoch": 556} {"train_loss": -9.433423042297363, "global_step": 93429, "epoch": 556} {"train_loss": -9.29074478149414, "global_step": 93430, "epoch": 556} {"train_loss": -9.561681747436523, "global_step": 93431, "epoch": 556} {"train_loss": -9.595857620239258, "global_step": 93432, "epoch": 556} {"train_loss": -9.464397430419922, "global_step": 93433, "epoch": 556} {"train_loss": -9.64439582824707, "global_step": 93434, "epoch": 556} {"train_loss": -9.69287395477295, "global_step": 93435, "epoch": 556} {"train_loss": -9.597431182861328, "global_step": 93436, "epoch": 556} {"train_loss": -9.589725494384766, "global_step": 93437, "epoch": 556} {"train_loss": -9.625259399414062, "global_step": 93438, "epoch": 556} {"train_loss": -9.520048141479492, "global_step": 93439, "epoch": 556} {"train_loss": -9.446293830871582, "global_step": 93440, "epoch": 556} {"train_loss": -9.562501907348633, "global_step": 93441, "epoch": 556} {"train_loss": -9.545032501220703, "global_step": 93442, "epoch": 556} {"train_loss": -9.503734588623047, "global_step": 93443, "epoch": 556} {"train_loss": -9.821741104125977, "global_step": 93444, "epoch": 556} {"train_loss": -9.24165153503418, "global_step": 93445, "epoch": 556} {"train_loss": -9.712658882141113, "global_step": 93446, "epoch": 556} {"train_loss": -9.494709014892578, "global_step": 93447, "epoch": 556} {"train_loss": -9.244905471801758, "global_step": 93448, "epoch": 556} {"train_loss": -9.200421333312988, "global_step": 93449, "epoch": 556} {"train_loss": -9.498224258422852, "global_step": 93450, "epoch": 556} {"train_loss": -9.341312408447266, "global_step": 93451, "epoch": 556} {"train_loss": -9.243928909301758, "global_step": 93452, "epoch": 556} {"train_loss": -9.578351974487305, "global_step": 93453, "epoch": 556} {"train_loss": -8.997715950012207, "global_step": 93454, "epoch": 556} {"train_loss": -9.394723892211914, "global_step": 93455, "epoch": 556} {"train_loss": -9.41160774230957, "global_step": 93456, "epoch": 556} {"train_loss": -9.554452896118164, "global_step": 93457, "epoch": 556} {"train_loss": -9.33791732788086, "global_step": 93458, "epoch": 556} {"train_loss": -9.341959953308105, "global_step": 93459, "epoch": 556} {"train_loss": -9.31387996673584, "global_step": 93460, "epoch": 556} {"train_loss": -9.236281394958496, "global_step": 93461, "epoch": 556} {"train_loss": -9.514293670654297, "global_step": 93462, "epoch": 556} {"train_loss": -9.162105560302734, "global_step": 93463, "epoch": 556} {"train_loss": -9.404397010803223, "global_step": 93464, "epoch": 556} {"train_loss": -9.208645820617676, "global_step": 93465, "epoch": 556} {"train_loss": -9.3406982421875, "global_step": 93466, "epoch": 556} {"train_loss": -9.235798835754395, "global_step": 93467, "epoch": 556} {"train_loss": -9.168973922729492, "global_step": 93468, "epoch": 556} {"train_loss": -9.147268295288086, "global_step": 93469, "epoch": 556} {"train_loss": -9.40718936920166, "global_step": 93470, "epoch": 556} {"train_loss": -8.79029655456543, "global_step": 93471, "epoch": 556} {"train_loss": -9.399687767028809, "global_step": 93472, "epoch": 556} {"train_loss": -9.148618698120117, "global_step": 93473, "epoch": 556} {"train_loss": -9.514631271362305, "global_step": 93474, "epoch": 556} {"train_loss": -8.879997253417969, "global_step": 93475, "epoch": 556} {"train_loss": -9.278929710388184, "global_step": 93476, "epoch": 556} {"train_loss": -9.164731979370117, "global_step": 93477, "epoch": 556} {"train_loss": -9.289483070373535, "global_step": 93478, "epoch": 556} {"train_loss": -9.487178802490234, "global_step": 93479, "epoch": 556} {"train_loss": -9.539119720458984, "global_step": 93480, "epoch": 556} {"train_loss": -9.370776176452637, "global_step": 93481, "epoch": 556} {"train_loss": -9.573387145996094, "global_step": 93482, "epoch": 556} {"train_loss": -9.308462142944336, "global_step": 93483, "epoch": 556} {"train_loss": -9.430171966552734, "global_step": 93484, "epoch": 556} {"train_loss": -9.511935234069824, "global_step": 93485, "epoch": 556} {"train_loss": -9.462029457092285, "global_step": 93486, "epoch": 556} {"train_loss": -9.651199340820312, "global_step": 93487, "epoch": 556} {"train_loss": -9.68522834777832, "global_step": 93488, "epoch": 556} {"train_loss": -9.683140754699707, "global_step": 93489, "epoch": 556} {"train_loss": -9.576257705688477, "global_step": 93490, "epoch": 556} {"train_loss": -9.691173553466797, "global_step": 93491, "epoch": 556} {"train_loss": -9.733559608459473, "global_step": 93492, "epoch": 556} {"train_loss": -9.914417266845703, "global_step": 93493, "epoch": 556} {"train_loss": -9.735669136047363, "global_step": 93494, "epoch": 556} {"train_loss": -9.813562393188477, "global_step": 93495, "epoch": 556} {"train_loss": -9.526398658752441, "global_step": 93496, "epoch": 556} {"train_loss": -9.698013305664062, "global_step": 93497, "epoch": 556} {"train_loss": -9.634915351867676, "global_step": 93498, "epoch": 556} {"train_loss": -9.795193672180176, "global_step": 93499, "epoch": 556} {"train_loss": -9.801814079284668, "global_step": 93500, "epoch": 556} {"train_loss": -9.550739288330078, "global_step": 93501, "epoch": 556} {"train_loss": -9.58720588684082, "global_step": 93502, "epoch": 556} {"train_loss": -9.555631637573242, "global_step": 93503, "epoch": 556} {"train_loss": -9.774303436279297, "global_step": 93504, "epoch": 556} {"train_loss": -9.748064041137695, "global_step": 93505, "epoch": 556} {"train_loss": -9.67844009399414, "global_step": 93506, "epoch": 556} {"train_loss": -9.689233779907227, "global_step": 93507, "epoch": 556} {"train_loss": -9.696916580200195, "global_step": 93508, "epoch": 556} {"train_loss": -9.356624603271484, "global_step": 93509, "epoch": 556} {"train_loss": -9.88701057434082, "global_step": 93510, "epoch": 556} {"train_loss": -9.599711418151855, "global_step": 93511, "epoch": 556} {"train_loss": -9.459877014160156, "global_step": 93512, "epoch": 556} {"train_loss": -9.528755187988281, "global_step": 93513, "epoch": 556} {"train_loss": -9.695099830627441, "global_step": 93514, "epoch": 556} {"train_loss": -9.611150741577148, "global_step": 93515, "epoch": 556} {"train_loss": -9.474971771240234, "global_step": 93516, "epoch": 556} {"train_loss": -9.478363990783691, "global_step": 93517, "epoch": 556} {"train_loss": -9.348236083984375, "global_step": 93518, "epoch": 556} {"train_loss": -9.354787826538086, "global_step": 93519, "epoch": 556} {"train_loss": -9.268172264099121, "global_step": 93520, "epoch": 556} {"train_loss": -9.68321418762207, "global_step": 93521, "epoch": 556} {"train_loss": -9.129859924316406, "global_step": 93522, "epoch": 556} {"train_loss": -9.110595703125, "global_step": 93523, "epoch": 556} {"train_loss": -9.528417587280273, "global_step": 93524, "epoch": 556} {"train_loss": -9.346078872680664, "global_step": 93525, "epoch": 556} {"train_loss": -9.472694396972656, "global_step": 93526, "epoch": 556} {"train_loss": -9.398137092590332, "global_step": 93527, "epoch": 556} {"train_loss": -9.219539642333984, "global_step": 93528, "epoch": 556} {"train_loss": -9.091230392456055, "global_step": 93529, "epoch": 556} {"train_loss": -9.693310737609863, "global_step": 93530, "epoch": 556} {"train_loss": -9.449191093444824, "global_step": 93531, "epoch": 556} {"train_loss": -9.484716415405273, "global_step": 93532, "epoch": 556} {"train_loss": -9.70747184753418, "global_step": 93533, "epoch": 556} {"train_loss": -9.565000534057617, "global_step": 93534, "epoch": 556} {"train_loss": -9.414361953735352, "global_step": 93535, "epoch": 556} {"train_loss": -9.761724472045898, "global_step": 93536, "epoch": 556} {"train_loss": -9.686042785644531, "global_step": 93537, "epoch": 556} {"train_loss": -9.348978042602539, "global_step": 93538, "epoch": 556} {"train_loss": -9.61272144317627, "global_step": 93539, "epoch": 556} {"train_loss": -9.629663467407227, "global_step": 93540, "epoch": 556} {"train_loss": -9.412165641784668, "global_step": 93541, "epoch": 556} {"train_loss": -9.506723403930664, "global_step": 93542, "epoch": 556} {"train_loss": -9.331395149230957, "global_step": 93543, "epoch": 556} {"train_loss": -9.440046310424805, "global_step": 93544, "epoch": 556} {"train_loss": -9.46163558959961, "global_step": 93545, "epoch": 556} {"train_loss": -9.296557426452637, "global_step": 93546, "epoch": 556} {"train_loss": -9.58792495727539, "global_step": 93547, "epoch": 556} {"train_loss": -9.454757690429688, "global_step": 93548, "epoch": 556} {"train_loss": -9.41008186340332, "global_step": 93549, "epoch": 556} {"train_loss": -9.398645401000977, "global_step": 93550, "epoch": 556} {"train_loss": -9.348713874816895, "global_step": 93551, "epoch": 556} {"train_loss": -9.71490478515625, "global_step": 93552, "epoch": 556} {"train_loss": -9.36844253540039, "global_step": 93553, "epoch": 556} {"train_loss": -9.553716659545898, "global_step": 93554, "epoch": 556} {"train_loss": -9.611778259277344, "global_step": 93555, "epoch": 556} {"train_loss": -9.39720630645752, "global_step": 93556, "epoch": 556} {"train_loss": -9.423599243164062, "global_step": 93557, "epoch": 556} {"train_loss": -9.06994342803955, "global_step": 93558, "epoch": 556} {"train_loss": -9.262992858886719, "global_step": 93559, "epoch": 556} {"train_loss": -9.608417510986328, "global_step": 93560, "epoch": 556} {"train_loss": -9.437834739685059, "global_step": 93561, "epoch": 556} {"train_loss": -9.556276321411133, "global_step": 93562, "epoch": 556} {"train_loss": -9.286255836486816, "global_step": 93563, "epoch": 556} {"train_loss": -9.501521110534668, "global_step": 93564, "epoch": 556} {"train_loss": -9.344682693481445, "global_step": 93565, "epoch": 556} {"train_loss": -9.50014877319336, "global_step": 93566, "epoch": 556} {"train_loss": -9.294163703918457, "global_step": 93567, "epoch": 556} {"train_loss": -9.38909912109375, "global_step": 93568, "epoch": 556} {"train_loss": -9.341215133666992, "global_step": 93569, "epoch": 556} {"train_loss": -8.876371383666992, "global_step": 93570, "epoch": 556} {"train_loss": -9.307710647583008, "global_step": 93571, "epoch": 556} {"train_loss": -9.200857162475586, "global_step": 93572, "epoch": 556} {"train_loss": -9.318902015686035, "global_step": 93573, "epoch": 556} {"train_loss": -9.090503692626953, "global_step": 93574, "epoch": 556} {"train_loss": -9.453479517073859, "global_step": 93575, "epoch": 556, "val_loss": 203664.078125} {"train_loss": -9.228201866149902, "global_step": 93576, "epoch": 557} {"train_loss": -9.246964454650879, "global_step": 93577, "epoch": 557} {"train_loss": -9.273702621459961, "global_step": 93578, "epoch": 557} {"train_loss": -9.386222839355469, "global_step": 93579, "epoch": 557} {"train_loss": -9.567358016967773, "global_step": 93580, "epoch": 557} {"train_loss": -9.023698806762695, "global_step": 93581, "epoch": 557} {"train_loss": -9.521665573120117, "global_step": 93582, "epoch": 557} {"train_loss": -9.380189895629883, "global_step": 93583, "epoch": 557} {"train_loss": -9.36276626586914, "global_step": 93584, "epoch": 557} {"train_loss": -9.509757041931152, "global_step": 93585, "epoch": 557} {"train_loss": -9.542337417602539, "global_step": 93586, "epoch": 557} {"train_loss": -9.585994720458984, "global_step": 93587, "epoch": 557} {"train_loss": -9.539213180541992, "global_step": 93588, "epoch": 557} {"train_loss": -9.530309677124023, "global_step": 93589, "epoch": 557} {"train_loss": -9.75120735168457, "global_step": 93590, "epoch": 557} {"train_loss": -9.5228853225708, "global_step": 93591, "epoch": 557} {"train_loss": -9.752921104431152, "global_step": 93592, "epoch": 557} {"train_loss": -9.736262321472168, "global_step": 93593, "epoch": 557} {"train_loss": -9.477771759033203, "global_step": 93594, "epoch": 557} {"train_loss": -9.609825134277344, "global_step": 93595, "epoch": 557} {"train_loss": -9.591621398925781, "global_step": 93596, "epoch": 557} {"train_loss": -9.733346939086914, "global_step": 93597, "epoch": 557} {"train_loss": -9.681222915649414, "global_step": 93598, "epoch": 557} {"train_loss": -9.788406372070312, "global_step": 93599, "epoch": 557} {"train_loss": -9.731000900268555, "global_step": 93600, "epoch": 557} {"train_loss": -9.897344589233398, "global_step": 93601, "epoch": 557} {"train_loss": -9.38245677947998, "global_step": 93602, "epoch": 557} {"train_loss": -9.912559509277344, "global_step": 93603, "epoch": 557} {"train_loss": -9.753162384033203, "global_step": 93604, "epoch": 557} {"train_loss": -9.904844284057617, "global_step": 93605, "epoch": 557} {"train_loss": -9.407279014587402, "global_step": 93606, "epoch": 557} {"train_loss": -9.581338882446289, "global_step": 93607, "epoch": 557} {"train_loss": -9.694135665893555, "global_step": 93608, "epoch": 557} {"train_loss": -9.336849212646484, "global_step": 93609, "epoch": 557} {"train_loss": -9.834856986999512, "global_step": 93610, "epoch": 557} {"train_loss": -9.224251747131348, "global_step": 93611, "epoch": 557} {"train_loss": -9.484725952148438, "global_step": 93612, "epoch": 557} {"train_loss": -9.283036231994629, "global_step": 93613, "epoch": 557} {"train_loss": -9.498416900634766, "global_step": 93614, "epoch": 557} {"train_loss": -9.39259147644043, "global_step": 93615, "epoch": 557} {"train_loss": -9.513330459594727, "global_step": 93616, "epoch": 557} {"train_loss": -9.355168342590332, "global_step": 93617, "epoch": 557} {"train_loss": -9.2823486328125, "global_step": 93618, "epoch": 557} {"train_loss": -9.504352569580078, "global_step": 93619, "epoch": 557} {"train_loss": -9.36562728881836, "global_step": 93620, "epoch": 557} {"train_loss": -9.440729141235352, "global_step": 93621, "epoch": 557} {"train_loss": -9.564229011535645, "global_step": 93622, "epoch": 557} {"train_loss": -9.48062515258789, "global_step": 93623, "epoch": 557} {"train_loss": -9.70738697052002, "global_step": 93624, "epoch": 557} {"train_loss": -9.437602996826172, "global_step": 93625, "epoch": 557} {"train_loss": -9.509438514709473, "global_step": 93626, "epoch": 557} {"train_loss": -9.405628204345703, "global_step": 93627, "epoch": 557} {"train_loss": -9.614243507385254, "global_step": 93628, "epoch": 557} {"train_loss": -9.433073043823242, "global_step": 93629, "epoch": 557} {"train_loss": -9.829642295837402, "global_step": 93630, "epoch": 557} {"train_loss": -9.19005298614502, "global_step": 93631, "epoch": 557} {"train_loss": -9.537834167480469, "global_step": 93632, "epoch": 557} {"train_loss": -9.363893508911133, "global_step": 93633, "epoch": 557} {"train_loss": -9.417156219482422, "global_step": 93634, "epoch": 557} {"train_loss": -9.403661727905273, "global_step": 93635, "epoch": 557} {"train_loss": -9.478353500366211, "global_step": 93636, "epoch": 557} {"train_loss": -9.538764953613281, "global_step": 93637, "epoch": 557} {"train_loss": -9.64907455444336, "global_step": 93638, "epoch": 557} {"train_loss": -9.402600288391113, "global_step": 93639, "epoch": 557} {"train_loss": -9.599197387695312, "global_step": 93640, "epoch": 557} {"train_loss": -9.462998390197754, "global_step": 93641, "epoch": 557} {"train_loss": -9.542819023132324, "global_step": 93642, "epoch": 557} {"train_loss": -9.626333236694336, "global_step": 93643, "epoch": 557} {"train_loss": -9.671507835388184, "global_step": 93644, "epoch": 557} {"train_loss": -9.371767044067383, "global_step": 93645, "epoch": 557} {"train_loss": -9.574785232543945, "global_step": 93646, "epoch": 557} {"train_loss": -9.631110191345215, "global_step": 93647, "epoch": 557} {"train_loss": -9.593252182006836, "global_step": 93648, "epoch": 557} {"train_loss": -9.70697021484375, "global_step": 93649, "epoch": 557} {"train_loss": -9.471914291381836, "global_step": 93650, "epoch": 557} {"train_loss": -9.832527160644531, "global_step": 93651, "epoch": 557} {"train_loss": -9.456602096557617, "global_step": 93652, "epoch": 557} {"train_loss": -9.088363647460938, "global_step": 93653, "epoch": 557} {"train_loss": -9.615328788757324, "global_step": 93654, "epoch": 557} {"train_loss": -9.259315490722656, "global_step": 93655, "epoch": 557} {"train_loss": -9.740509986877441, "global_step": 93656, "epoch": 557} {"train_loss": -9.537100791931152, "global_step": 93657, "epoch": 557} {"train_loss": -9.485920906066895, "global_step": 93658, "epoch": 557} {"train_loss": -9.389366149902344, "global_step": 93659, "epoch": 557} {"train_loss": -9.414165496826172, "global_step": 93660, "epoch": 557} {"train_loss": -9.42958927154541, "global_step": 93661, "epoch": 557} {"train_loss": -9.540216445922852, "global_step": 93662, "epoch": 557} {"train_loss": -9.56960678100586, "global_step": 93663, "epoch": 557} {"train_loss": -9.158772468566895, "global_step": 93664, "epoch": 557} {"train_loss": -9.554140090942383, "global_step": 93665, "epoch": 557} {"train_loss": -9.458626747131348, "global_step": 93666, "epoch": 557} {"train_loss": -9.532659530639648, "global_step": 93667, "epoch": 557} {"train_loss": -9.307106018066406, "global_step": 93668, "epoch": 557} {"train_loss": -9.795659065246582, "global_step": 93669, "epoch": 557} {"train_loss": -9.583526611328125, "global_step": 93670, "epoch": 557} {"train_loss": -9.181859016418457, "global_step": 93671, "epoch": 557} {"train_loss": -9.479607582092285, "global_step": 93672, "epoch": 557} {"train_loss": -9.180780410766602, "global_step": 93673, "epoch": 557} {"train_loss": -9.424798965454102, "global_step": 93674, "epoch": 557} {"train_loss": -9.671829223632812, "global_step": 93675, "epoch": 557} {"train_loss": -9.537368774414062, "global_step": 93676, "epoch": 557} {"train_loss": -9.473299026489258, "global_step": 93677, "epoch": 557} {"train_loss": -9.50561237335205, "global_step": 93678, "epoch": 557} {"train_loss": -9.35594367980957, "global_step": 93679, "epoch": 557} {"train_loss": -9.231820106506348, "global_step": 93680, "epoch": 557} {"train_loss": -9.342915534973145, "global_step": 93681, "epoch": 557} {"train_loss": -9.720673561096191, "global_step": 93682, "epoch": 557} {"train_loss": -9.439075469970703, "global_step": 93683, "epoch": 557} {"train_loss": -9.647088050842285, "global_step": 93684, "epoch": 557} {"train_loss": -9.427658081054688, "global_step": 93685, "epoch": 557} {"train_loss": -9.35881233215332, "global_step": 93686, "epoch": 557} {"train_loss": -9.162415504455566, "global_step": 93687, "epoch": 557} {"train_loss": -9.29203987121582, "global_step": 93688, "epoch": 557} {"train_loss": -9.228525161743164, "global_step": 93689, "epoch": 557} {"train_loss": -9.338379859924316, "global_step": 93690, "epoch": 557} {"train_loss": -9.494152069091797, "global_step": 93691, "epoch": 557} {"train_loss": -9.121845245361328, "global_step": 93692, "epoch": 557} {"train_loss": -9.266432762145996, "global_step": 93693, "epoch": 557} {"train_loss": -9.223653793334961, "global_step": 93694, "epoch": 557} {"train_loss": -9.418377876281738, "global_step": 93695, "epoch": 557} {"train_loss": -9.322696685791016, "global_step": 93696, "epoch": 557} {"train_loss": -9.526972770690918, "global_step": 93697, "epoch": 557} {"train_loss": -9.645866394042969, "global_step": 93698, "epoch": 557} {"train_loss": -9.547550201416016, "global_step": 93699, "epoch": 557} {"train_loss": -9.337333679199219, "global_step": 93700, "epoch": 557} {"train_loss": -9.194948196411133, "global_step": 93701, "epoch": 557} {"train_loss": -9.518316268920898, "global_step": 93702, "epoch": 557} {"train_loss": -9.117334365844727, "global_step": 93703, "epoch": 557} {"train_loss": -9.885406494140625, "global_step": 93704, "epoch": 557} {"train_loss": -9.267890930175781, "global_step": 93705, "epoch": 557} {"train_loss": -9.670185089111328, "global_step": 93706, "epoch": 557} {"train_loss": -9.324670791625977, "global_step": 93707, "epoch": 557} {"train_loss": -9.42379379272461, "global_step": 93708, "epoch": 557} {"train_loss": -9.549420356750488, "global_step": 93709, "epoch": 557} {"train_loss": -9.434852600097656, "global_step": 93710, "epoch": 557} {"train_loss": -9.602155685424805, "global_step": 93711, "epoch": 557} {"train_loss": -9.555782318115234, "global_step": 93712, "epoch": 557} {"train_loss": -9.260944366455078, "global_step": 93713, "epoch": 557} {"train_loss": -9.6233491897583, "global_step": 93714, "epoch": 557} {"train_loss": -9.60578727722168, "global_step": 93715, "epoch": 557} {"train_loss": -9.277734756469727, "global_step": 93716, "epoch": 557} {"train_loss": -9.624618530273438, "global_step": 93717, "epoch": 557} {"train_loss": -9.661783218383789, "global_step": 93718, "epoch": 557} {"train_loss": -9.3795166015625, "global_step": 93719, "epoch": 557} {"train_loss": -9.536864280700684, "global_step": 93720, "epoch": 557} {"train_loss": -9.586465835571289, "global_step": 93721, "epoch": 557} {"train_loss": -9.383328437805176, "global_step": 93722, "epoch": 557} {"train_loss": -9.619148254394531, "global_step": 93723, "epoch": 557} {"train_loss": -9.73449420928955, "global_step": 93724, "epoch": 557} {"train_loss": -9.938597679138184, "global_step": 93725, "epoch": 557} {"train_loss": -9.47498893737793, "global_step": 93726, "epoch": 557} {"train_loss": -9.57059097290039, "global_step": 93727, "epoch": 557} {"train_loss": -9.545892715454102, "global_step": 93728, "epoch": 557} {"train_loss": -9.279614448547363, "global_step": 93729, "epoch": 557} {"train_loss": -9.546188354492188, "global_step": 93730, "epoch": 557} {"train_loss": -9.426804542541504, "global_step": 93731, "epoch": 557} {"train_loss": -9.366966247558594, "global_step": 93732, "epoch": 557} {"train_loss": -9.260421752929688, "global_step": 93733, "epoch": 557} {"train_loss": -9.227496147155762, "global_step": 93734, "epoch": 557} {"train_loss": -9.477620124816895, "global_step": 93735, "epoch": 557} {"train_loss": -9.486207962036133, "global_step": 93736, "epoch": 557} {"train_loss": -9.42837142944336, "global_step": 93737, "epoch": 557} {"train_loss": -9.408622741699219, "global_step": 93738, "epoch": 557} {"train_loss": -9.481727600097656, "global_step": 93739, "epoch": 557} {"train_loss": -9.24814224243164, "global_step": 93740, "epoch": 557} {"train_loss": -9.510225296020508, "global_step": 93741, "epoch": 557} {"train_loss": -9.409690856933594, "global_step": 93742, "epoch": 557} {"train_loss": -9.479970773061117, "global_step": 93743, "epoch": 557, "val_loss": 204104.03125} {"train_loss": -9.63637924194336, "global_step": 93744, "epoch": 558} {"train_loss": -9.310848236083984, "global_step": 93745, "epoch": 558} {"train_loss": -9.133724212646484, "global_step": 93746, "epoch": 558} {"train_loss": -9.34170913696289, "global_step": 93747, "epoch": 558} {"train_loss": -9.350746154785156, "global_step": 93748, "epoch": 558} {"train_loss": -9.399848937988281, "global_step": 93749, "epoch": 558} {"train_loss": -9.587398529052734, "global_step": 93750, "epoch": 558} {"train_loss": -9.523353576660156, "global_step": 93751, "epoch": 558} {"train_loss": -9.340431213378906, "global_step": 93752, "epoch": 558} {"train_loss": -9.704777717590332, "global_step": 93753, "epoch": 558} {"train_loss": -9.504911422729492, "global_step": 93754, "epoch": 558} {"train_loss": -9.637252807617188, "global_step": 93755, "epoch": 558} {"train_loss": -9.278948783874512, "global_step": 93756, "epoch": 558} {"train_loss": -9.420713424682617, "global_step": 93757, "epoch": 558} {"train_loss": -9.587203979492188, "global_step": 93758, "epoch": 558} {"train_loss": -9.59103775024414, "global_step": 93759, "epoch": 558} {"train_loss": -9.583390235900879, "global_step": 93760, "epoch": 558} {"train_loss": -9.557318687438965, "global_step": 93761, "epoch": 558} {"train_loss": -9.679333686828613, "global_step": 93762, "epoch": 558} {"train_loss": -9.624479293823242, "global_step": 93763, "epoch": 558} {"train_loss": -9.44890022277832, "global_step": 93764, "epoch": 558} {"train_loss": -9.680986404418945, "global_step": 93765, "epoch": 558} {"train_loss": -9.591657638549805, "global_step": 93766, "epoch": 558} {"train_loss": -9.304015159606934, "global_step": 93767, "epoch": 558} {"train_loss": -9.621484756469727, "global_step": 93768, "epoch": 558} {"train_loss": -9.360757827758789, "global_step": 93769, "epoch": 558} {"train_loss": -9.461201667785645, "global_step": 93770, "epoch": 558} {"train_loss": -9.71565055847168, "global_step": 93771, "epoch": 558} {"train_loss": -9.513270378112793, "global_step": 93772, "epoch": 558} {"train_loss": -9.730642318725586, "global_step": 93773, "epoch": 558} {"train_loss": -9.634361267089844, "global_step": 93774, "epoch": 558} {"train_loss": -9.787271499633789, "global_step": 93775, "epoch": 558} {"train_loss": -9.437807083129883, "global_step": 93776, "epoch": 558} {"train_loss": -9.724763870239258, "global_step": 93777, "epoch": 558} {"train_loss": -9.523998260498047, "global_step": 93778, "epoch": 558} {"train_loss": -9.493204116821289, "global_step": 93779, "epoch": 558} {"train_loss": -9.512578964233398, "global_step": 93780, "epoch": 558} {"train_loss": -9.632572174072266, "global_step": 93781, "epoch": 558} {"train_loss": -9.432746887207031, "global_step": 93782, "epoch": 558} {"train_loss": -9.489304542541504, "global_step": 93783, "epoch": 558} {"train_loss": -9.4990234375, "global_step": 93784, "epoch": 558} {"train_loss": -9.341062545776367, "global_step": 93785, "epoch": 558} {"train_loss": -9.396980285644531, "global_step": 93786, "epoch": 558} {"train_loss": -9.473641395568848, "global_step": 93787, "epoch": 558} {"train_loss": -9.413681983947754, "global_step": 93788, "epoch": 558} {"train_loss": -9.20589542388916, "global_step": 93789, "epoch": 558} {"train_loss": -9.281045913696289, "global_step": 93790, "epoch": 558} {"train_loss": -9.470182418823242, "global_step": 93791, "epoch": 558} {"train_loss": -9.60396957397461, "global_step": 93792, "epoch": 558} {"train_loss": -9.573667526245117, "global_step": 93793, "epoch": 558} {"train_loss": -9.62036418914795, "global_step": 93794, "epoch": 558} {"train_loss": -9.575506210327148, "global_step": 93795, "epoch": 558} {"train_loss": -9.581709861755371, "global_step": 93796, "epoch": 558} {"train_loss": -9.35055160522461, "global_step": 93797, "epoch": 558} {"train_loss": -9.522151947021484, "global_step": 93798, "epoch": 558} {"train_loss": -9.696340560913086, "global_step": 93799, "epoch": 558} {"train_loss": -9.644227027893066, "global_step": 93800, "epoch": 558} {"train_loss": -9.7813720703125, "global_step": 93801, "epoch": 558} {"train_loss": -9.764856338500977, "global_step": 93802, "epoch": 558} {"train_loss": -9.837821006774902, "global_step": 93803, "epoch": 558} {"train_loss": -9.675862312316895, "global_step": 93804, "epoch": 558} {"train_loss": -9.709529876708984, "global_step": 93805, "epoch": 558} {"train_loss": -9.56654167175293, "global_step": 93806, "epoch": 558} {"train_loss": -9.76318359375, "global_step": 93807, "epoch": 558} {"train_loss": -10.056015014648438, "global_step": 93808, "epoch": 558} {"train_loss": -9.311503410339355, "global_step": 93809, "epoch": 558} {"train_loss": -9.468582153320312, "global_step": 93810, "epoch": 558} {"train_loss": -9.767641067504883, "global_step": 93811, "epoch": 558} {"train_loss": -9.218071937561035, "global_step": 93812, "epoch": 558} {"train_loss": -9.64906120300293, "global_step": 93813, "epoch": 558} {"train_loss": -9.62346076965332, "global_step": 93814, "epoch": 558} {"train_loss": -9.228057861328125, "global_step": 93815, "epoch": 558} {"train_loss": -9.323395729064941, "global_step": 93816, "epoch": 558} {"train_loss": -9.729767799377441, "global_step": 93817, "epoch": 558} {"train_loss": -9.984946250915527, "global_step": 93818, "epoch": 558} {"train_loss": -9.372225761413574, "global_step": 93819, "epoch": 558} {"train_loss": -9.406291007995605, "global_step": 93820, "epoch": 558} {"train_loss": -9.195924758911133, "global_step": 93821, "epoch": 558} {"train_loss": -9.39353084564209, "global_step": 93822, "epoch": 558} {"train_loss": -9.546574592590332, "global_step": 93823, "epoch": 558} {"train_loss": -9.208130836486816, "global_step": 93824, "epoch": 558} {"train_loss": -9.653942108154297, "global_step": 93825, "epoch": 558} {"train_loss": -9.061697006225586, "global_step": 93826, "epoch": 558} {"train_loss": -9.45050048828125, "global_step": 93827, "epoch": 558} {"train_loss": -9.197673797607422, "global_step": 93828, "epoch": 558} {"train_loss": -9.455577850341797, "global_step": 93829, "epoch": 558} {"train_loss": -9.003851890563965, "global_step": 93830, "epoch": 558} {"train_loss": -9.286754608154297, "global_step": 93831, "epoch": 558} {"train_loss": -9.154440879821777, "global_step": 93832, "epoch": 558} {"train_loss": -9.215563774108887, "global_step": 93833, "epoch": 558} {"train_loss": -9.219322204589844, "global_step": 93834, "epoch": 558} {"train_loss": -9.49389934539795, "global_step": 93835, "epoch": 558} {"train_loss": -9.332167625427246, "global_step": 93836, "epoch": 558} {"train_loss": -9.51170825958252, "global_step": 93837, "epoch": 558} {"train_loss": -9.482532501220703, "global_step": 93838, "epoch": 558} {"train_loss": -9.892822265625, "global_step": 93839, "epoch": 558} {"train_loss": -9.507564544677734, "global_step": 93840, "epoch": 558} {"train_loss": -9.59201431274414, "global_step": 93841, "epoch": 558} {"train_loss": -9.62563705444336, "global_step": 93842, "epoch": 558} {"train_loss": -9.598295211791992, "global_step": 93843, "epoch": 558} {"train_loss": -9.702339172363281, "global_step": 93844, "epoch": 558} {"train_loss": -9.48276424407959, "global_step": 93845, "epoch": 558} {"train_loss": -9.195451736450195, "global_step": 93846, "epoch": 558} {"train_loss": -9.675615310668945, "global_step": 93847, "epoch": 558} {"train_loss": -9.654666900634766, "global_step": 93848, "epoch": 558} {"train_loss": -9.49951171875, "global_step": 93849, "epoch": 558} {"train_loss": -9.409872055053711, "global_step": 93850, "epoch": 558} {"train_loss": -9.614280700683594, "global_step": 93851, "epoch": 558} {"train_loss": -9.625997543334961, "global_step": 93852, "epoch": 558} {"train_loss": -9.529495239257812, "global_step": 93853, "epoch": 558} {"train_loss": -9.347356796264648, "global_step": 93854, "epoch": 558} {"train_loss": -9.526470184326172, "global_step": 93855, "epoch": 558} {"train_loss": -9.345271110534668, "global_step": 93856, "epoch": 558} {"train_loss": -9.359415054321289, "global_step": 93857, "epoch": 558} {"train_loss": -9.327923774719238, "global_step": 93858, "epoch": 558} {"train_loss": -9.199149131774902, "global_step": 93859, "epoch": 558} {"train_loss": -9.288783073425293, "global_step": 93860, "epoch": 558} {"train_loss": -9.273174285888672, "global_step": 93861, "epoch": 558} {"train_loss": -9.426115036010742, "global_step": 93862, "epoch": 558} {"train_loss": -9.507429122924805, "global_step": 93863, "epoch": 558} {"train_loss": -9.447052001953125, "global_step": 93864, "epoch": 558} {"train_loss": -9.338516235351562, "global_step": 93865, "epoch": 558} {"train_loss": -9.609442710876465, "global_step": 93866, "epoch": 558} {"train_loss": -9.32127571105957, "global_step": 93867, "epoch": 558} {"train_loss": -9.752212524414062, "global_step": 93868, "epoch": 558} {"train_loss": -9.495132446289062, "global_step": 93869, "epoch": 558} {"train_loss": -9.315972328186035, "global_step": 93870, "epoch": 558} {"train_loss": -9.630880355834961, "global_step": 93871, "epoch": 558} {"train_loss": -9.658382415771484, "global_step": 93872, "epoch": 558} {"train_loss": -9.596673965454102, "global_step": 93873, "epoch": 558} {"train_loss": -9.512097358703613, "global_step": 93874, "epoch": 558} {"train_loss": -9.455429077148438, "global_step": 93875, "epoch": 558} {"train_loss": -9.793949127197266, "global_step": 93876, "epoch": 558} {"train_loss": -9.532014846801758, "global_step": 93877, "epoch": 558} {"train_loss": -9.697607040405273, "global_step": 93878, "epoch": 558} {"train_loss": -9.781065940856934, "global_step": 93879, "epoch": 558} {"train_loss": -9.80683708190918, "global_step": 93880, "epoch": 558} {"train_loss": -9.891525268554688, "global_step": 93881, "epoch": 558} {"train_loss": -9.751279830932617, "global_step": 93882, "epoch": 558} {"train_loss": -9.58473014831543, "global_step": 93883, "epoch": 558} {"train_loss": -9.816286087036133, "global_step": 93884, "epoch": 558} {"train_loss": -9.730079650878906, "global_step": 93885, "epoch": 558} {"train_loss": -9.773669242858887, "global_step": 93886, "epoch": 558} {"train_loss": -9.828468322753906, "global_step": 93887, "epoch": 558} {"train_loss": -9.731316566467285, "global_step": 93888, "epoch": 558} {"train_loss": -9.543169021606445, "global_step": 93889, "epoch": 558} {"train_loss": -9.801637649536133, "global_step": 93890, "epoch": 558} {"train_loss": -9.644676208496094, "global_step": 93891, "epoch": 558} {"train_loss": -9.594062805175781, "global_step": 93892, "epoch": 558} {"train_loss": -9.572929382324219, "global_step": 93893, "epoch": 558} {"train_loss": -9.894247055053711, "global_step": 93894, "epoch": 558} {"train_loss": -9.544105529785156, "global_step": 93895, "epoch": 558} {"train_loss": -9.678348541259766, "global_step": 93896, "epoch": 558} {"train_loss": -9.911649703979492, "global_step": 93897, "epoch": 558} {"train_loss": -9.282883644104004, "global_step": 93898, "epoch": 558} {"train_loss": -9.49406623840332, "global_step": 93899, "epoch": 558} {"train_loss": -8.997781753540039, "global_step": 93900, "epoch": 558} {"train_loss": -9.487333297729492, "global_step": 93901, "epoch": 558} {"train_loss": -9.871492385864258, "global_step": 93902, "epoch": 558} {"train_loss": -9.224690437316895, "global_step": 93903, "epoch": 558} {"train_loss": -9.29345703125, "global_step": 93904, "epoch": 558} {"train_loss": -9.179380416870117, "global_step": 93905, "epoch": 558} {"train_loss": -9.285562515258789, "global_step": 93906, "epoch": 558} {"train_loss": -8.963118553161621, "global_step": 93907, "epoch": 558} {"train_loss": -9.054220199584961, "global_step": 93908, "epoch": 558} {"train_loss": -9.278596878051758, "global_step": 93909, "epoch": 558} {"train_loss": -8.54963493347168, "global_step": 93910, "epoch": 558} {"train_loss": -9.504030239014398, "global_step": 93911, "epoch": 558, "val_loss": 202054.1875} {"train_loss": -8.79842758178711, "global_step": 93912, "epoch": 559} {"train_loss": -8.920571327209473, "global_step": 93913, "epoch": 559} {"train_loss": -9.385875701904297, "global_step": 93914, "epoch": 559} {"train_loss": -8.858745574951172, "global_step": 93915, "epoch": 559} {"train_loss": -9.204671859741211, "global_step": 93916, "epoch": 559} {"train_loss": -8.941993713378906, "global_step": 93917, "epoch": 559} {"train_loss": -9.035467147827148, "global_step": 93918, "epoch": 559} {"train_loss": -9.196929931640625, "global_step": 93919, "epoch": 559} {"train_loss": -9.181604385375977, "global_step": 93920, "epoch": 559} {"train_loss": -9.411174774169922, "global_step": 93921, "epoch": 559} {"train_loss": -9.136336326599121, "global_step": 93922, "epoch": 559} {"train_loss": -9.25474739074707, "global_step": 93923, "epoch": 559} {"train_loss": -9.324464797973633, "global_step": 93924, "epoch": 559} {"train_loss": -9.161545753479004, "global_step": 93925, "epoch": 559} {"train_loss": -9.319929122924805, "global_step": 93926, "epoch": 559} {"train_loss": -9.356866836547852, "global_step": 93927, "epoch": 559} {"train_loss": -9.370044708251953, "global_step": 93928, "epoch": 559} {"train_loss": -9.55093765258789, "global_step": 93929, "epoch": 559} {"train_loss": -9.5660400390625, "global_step": 93930, "epoch": 559} {"train_loss": -9.444738388061523, "global_step": 93931, "epoch": 559} {"train_loss": -9.485010147094727, "global_step": 93932, "epoch": 559} {"train_loss": -9.297868728637695, "global_step": 93933, "epoch": 559} {"train_loss": -9.334637641906738, "global_step": 93934, "epoch": 559} {"train_loss": -8.97749137878418, "global_step": 93935, "epoch": 559} {"train_loss": -9.523723602294922, "global_step": 93936, "epoch": 559} {"train_loss": -9.140901565551758, "global_step": 93937, "epoch": 559} {"train_loss": -9.36744213104248, "global_step": 93938, "epoch": 559} {"train_loss": -9.253093719482422, "global_step": 93939, "epoch": 559} {"train_loss": -9.14625358581543, "global_step": 93940, "epoch": 559} {"train_loss": -8.884748458862305, "global_step": 93941, "epoch": 559} {"train_loss": -9.146531105041504, "global_step": 93942, "epoch": 559} {"train_loss": -9.165367126464844, "global_step": 93943, "epoch": 559} {"train_loss": -9.359796524047852, "global_step": 93944, "epoch": 559} {"train_loss": -8.8763427734375, "global_step": 93945, "epoch": 559} {"train_loss": -9.367269515991211, "global_step": 93946, "epoch": 559} {"train_loss": -8.78221321105957, "global_step": 93947, "epoch": 559} {"train_loss": -9.1959228515625, "global_step": 93948, "epoch": 559} {"train_loss": -8.808647155761719, "global_step": 93949, "epoch": 559} {"train_loss": -9.149587631225586, "global_step": 93950, "epoch": 559} {"train_loss": -9.20111083984375, "global_step": 93951, "epoch": 559} {"train_loss": -9.210725784301758, "global_step": 93952, "epoch": 559} {"train_loss": -9.411262512207031, "global_step": 93953, "epoch": 559} {"train_loss": -9.355146408081055, "global_step": 93954, "epoch": 559} {"train_loss": -9.074212074279785, "global_step": 93955, "epoch": 559} {"train_loss": -9.315428733825684, "global_step": 93956, "epoch": 559} {"train_loss": -9.488018035888672, "global_step": 93957, "epoch": 559} {"train_loss": -9.415719985961914, "global_step": 93958, "epoch": 559} {"train_loss": -9.315122604370117, "global_step": 93959, "epoch": 559} {"train_loss": -9.342933654785156, "global_step": 93960, "epoch": 559} {"train_loss": -9.461312294006348, "global_step": 93961, "epoch": 559} {"train_loss": -9.633089065551758, "global_step": 93962, "epoch": 559} {"train_loss": -9.638723373413086, "global_step": 93963, "epoch": 559} {"train_loss": -9.74533462524414, "global_step": 93964, "epoch": 559} {"train_loss": -9.671365737915039, "global_step": 93965, "epoch": 559} {"train_loss": -9.504898071289062, "global_step": 93966, "epoch": 559} {"train_loss": -9.5020170211792, "global_step": 93967, "epoch": 559} {"train_loss": -9.535980224609375, "global_step": 93968, "epoch": 559} {"train_loss": -9.24991226196289, "global_step": 93969, "epoch": 559} {"train_loss": -9.930452346801758, "global_step": 93970, "epoch": 559} {"train_loss": -9.190423011779785, "global_step": 93971, "epoch": 559} {"train_loss": -9.456106185913086, "global_step": 93972, "epoch": 559} {"train_loss": -9.640836715698242, "global_step": 93973, "epoch": 559} {"train_loss": -9.74789047241211, "global_step": 93974, "epoch": 559} {"train_loss": -9.61752700805664, "global_step": 93975, "epoch": 559} {"train_loss": -9.5354642868042, "global_step": 93976, "epoch": 559} {"train_loss": -9.662428855895996, "global_step": 93977, "epoch": 559} {"train_loss": -9.707937240600586, "global_step": 93978, "epoch": 559} {"train_loss": -9.75243854522705, "global_step": 93979, "epoch": 559} {"train_loss": -9.989396095275879, "global_step": 93980, "epoch": 559} {"train_loss": -9.574906349182129, "global_step": 93981, "epoch": 559} {"train_loss": -9.632003784179688, "global_step": 93982, "epoch": 559} {"train_loss": -9.649803161621094, "global_step": 93983, "epoch": 559} {"train_loss": -9.515235900878906, "global_step": 93984, "epoch": 559} {"train_loss": -9.604450225830078, "global_step": 93985, "epoch": 559} {"train_loss": -9.583269119262695, "global_step": 93986, "epoch": 559} {"train_loss": -9.60953140258789, "global_step": 93987, "epoch": 559} {"train_loss": -9.328714370727539, "global_step": 93988, "epoch": 559} {"train_loss": -9.512921333312988, "global_step": 93989, "epoch": 559} {"train_loss": -9.416816711425781, "global_step": 93990, "epoch": 559} {"train_loss": -9.561717987060547, "global_step": 93991, "epoch": 559} {"train_loss": -9.564824104309082, "global_step": 93992, "epoch": 559} {"train_loss": -9.086280822753906, "global_step": 93993, "epoch": 559} {"train_loss": -9.124030113220215, "global_step": 93994, "epoch": 559} {"train_loss": -9.473689079284668, "global_step": 93995, "epoch": 559} {"train_loss": -9.437845230102539, "global_step": 93996, "epoch": 559} {"train_loss": -9.046368598937988, "global_step": 93997, "epoch": 559} {"train_loss": -9.224788665771484, "global_step": 93998, "epoch": 559} {"train_loss": -9.164163589477539, "global_step": 93999, "epoch": 559} {"train_loss": -9.236068725585938, "global_step": 94000, "epoch": 559} {"train_loss": -9.365203857421875, "global_step": 94001, "epoch": 559} {"train_loss": -9.235984802246094, "global_step": 94002, "epoch": 559} {"train_loss": -9.022357940673828, "global_step": 94003, "epoch": 559} {"train_loss": -8.863530158996582, "global_step": 94004, "epoch": 559} {"train_loss": -9.452071189880371, "global_step": 94005, "epoch": 559} {"train_loss": -9.536386489868164, "global_step": 94006, "epoch": 559} {"train_loss": -9.053915023803711, "global_step": 94007, "epoch": 559} {"train_loss": -9.404563903808594, "global_step": 94008, "epoch": 559} {"train_loss": -9.393949508666992, "global_step": 94009, "epoch": 559} {"train_loss": -9.653083801269531, "global_step": 94010, "epoch": 559} {"train_loss": -9.505207061767578, "global_step": 94011, "epoch": 559} {"train_loss": -8.967168807983398, "global_step": 94012, "epoch": 559} {"train_loss": -9.32772445678711, "global_step": 94013, "epoch": 559} {"train_loss": -9.347991943359375, "global_step": 94014, "epoch": 559} {"train_loss": -9.59280014038086, "global_step": 94015, "epoch": 559} {"train_loss": -9.604841232299805, "global_step": 94016, "epoch": 559} {"train_loss": -9.449796676635742, "global_step": 94017, "epoch": 559} {"train_loss": -9.479652404785156, "global_step": 94018, "epoch": 559} {"train_loss": -9.709304809570312, "global_step": 94019, "epoch": 559} {"train_loss": -9.320980072021484, "global_step": 94020, "epoch": 559} {"train_loss": -9.59372329711914, "global_step": 94021, "epoch": 559} {"train_loss": -9.73519229888916, "global_step": 94022, "epoch": 559} {"train_loss": -9.558042526245117, "global_step": 94023, "epoch": 559} {"train_loss": -9.533292770385742, "global_step": 94024, "epoch": 559} {"train_loss": -9.604917526245117, "global_step": 94025, "epoch": 559} {"train_loss": -9.608604431152344, "global_step": 94026, "epoch": 559} {"train_loss": -9.852720260620117, "global_step": 94027, "epoch": 559} {"train_loss": -9.464691162109375, "global_step": 94028, "epoch": 559} {"train_loss": -9.398393630981445, "global_step": 94029, "epoch": 559} {"train_loss": -9.670873641967773, "global_step": 94030, "epoch": 559} {"train_loss": -9.62884521484375, "global_step": 94031, "epoch": 559} {"train_loss": -9.449762344360352, "global_step": 94032, "epoch": 559} {"train_loss": -9.372810363769531, "global_step": 94033, "epoch": 559} {"train_loss": -9.381388664245605, "global_step": 94034, "epoch": 559} {"train_loss": -9.36802864074707, "global_step": 94035, "epoch": 559} {"train_loss": -9.39543342590332, "global_step": 94036, "epoch": 559} {"train_loss": -9.541203498840332, "global_step": 94037, "epoch": 559} {"train_loss": -9.261028289794922, "global_step": 94038, "epoch": 559} {"train_loss": -9.626802444458008, "global_step": 94039, "epoch": 559} {"train_loss": -9.377288818359375, "global_step": 94040, "epoch": 559} {"train_loss": -9.417773246765137, "global_step": 94041, "epoch": 559} {"train_loss": -9.674640655517578, "global_step": 94042, "epoch": 559} {"train_loss": -9.189172744750977, "global_step": 94043, "epoch": 559} {"train_loss": -9.488317489624023, "global_step": 94044, "epoch": 559} {"train_loss": -9.340967178344727, "global_step": 94045, "epoch": 559} {"train_loss": -9.400276184082031, "global_step": 94046, "epoch": 559} {"train_loss": -9.561867713928223, "global_step": 94047, "epoch": 559} {"train_loss": -9.580801010131836, "global_step": 94048, "epoch": 559} {"train_loss": -9.45333480834961, "global_step": 94049, "epoch": 559} {"train_loss": -9.493223190307617, "global_step": 94050, "epoch": 559} {"train_loss": -9.525676727294922, "global_step": 94051, "epoch": 559} {"train_loss": -9.659347534179688, "global_step": 94052, "epoch": 559} {"train_loss": -9.419946670532227, "global_step": 94053, "epoch": 559} {"train_loss": -9.248495101928711, "global_step": 94054, "epoch": 559} {"train_loss": -9.43157958984375, "global_step": 94055, "epoch": 559} {"train_loss": -9.3897705078125, "global_step": 94056, "epoch": 559} {"train_loss": -9.272976875305176, "global_step": 94057, "epoch": 559} {"train_loss": -9.639171600341797, "global_step": 94058, "epoch": 559} {"train_loss": -9.683560371398926, "global_step": 94059, "epoch": 559} {"train_loss": -9.477163314819336, "global_step": 94060, "epoch": 559} {"train_loss": -9.653854370117188, "global_step": 94061, "epoch": 559} {"train_loss": -9.405284881591797, "global_step": 94062, "epoch": 559} {"train_loss": -9.553155899047852, "global_step": 94063, "epoch": 559} {"train_loss": -9.698444366455078, "global_step": 94064, "epoch": 559} {"train_loss": -9.561988830566406, "global_step": 94065, "epoch": 559} {"train_loss": -9.659971237182617, "global_step": 94066, "epoch": 559} {"train_loss": -9.58975601196289, "global_step": 94067, "epoch": 559} {"train_loss": -9.767053604125977, "global_step": 94068, "epoch": 559} {"train_loss": -9.570528030395508, "global_step": 94069, "epoch": 559} {"train_loss": -9.761251449584961, "global_step": 94070, "epoch": 559} {"train_loss": -9.522714614868164, "global_step": 94071, "epoch": 559} {"train_loss": -9.45853042602539, "global_step": 94072, "epoch": 559} {"train_loss": -9.510564804077148, "global_step": 94073, "epoch": 559} {"train_loss": -9.457776069641113, "global_step": 94074, "epoch": 559} {"train_loss": -9.418998718261719, "global_step": 94075, "epoch": 559} {"train_loss": -9.390273094177246, "global_step": 94076, "epoch": 559} {"train_loss": -9.409866333007812, "global_step": 94077, "epoch": 559} {"train_loss": -9.466218948364258, "global_step": 94078, "epoch": 559} {"train_loss": -9.409372959818159, "global_step": 94079, "epoch": 559, "val_loss": 204528.421875} {"train_loss": -9.463528633117676, "global_step": 94080, "epoch": 560} {"train_loss": -9.123779296875, "global_step": 94081, "epoch": 560} {"train_loss": -9.441286087036133, "global_step": 94082, "epoch": 560} {"train_loss": -8.931539535522461, "global_step": 94083, "epoch": 560} {"train_loss": -9.151609420776367, "global_step": 94084, "epoch": 560} {"train_loss": -9.46165657043457, "global_step": 94085, "epoch": 560} {"train_loss": -9.310843467712402, "global_step": 94086, "epoch": 560} {"train_loss": -9.552130699157715, "global_step": 94087, "epoch": 560} {"train_loss": -9.409594535827637, "global_step": 94088, "epoch": 560} {"train_loss": -9.512819290161133, "global_step": 94089, "epoch": 560} {"train_loss": -9.226930618286133, "global_step": 94090, "epoch": 560} {"train_loss": -9.456531524658203, "global_step": 94091, "epoch": 560} {"train_loss": -9.44981575012207, "global_step": 94092, "epoch": 560} {"train_loss": -9.644554138183594, "global_step": 94093, "epoch": 560} {"train_loss": -9.396278381347656, "global_step": 94094, "epoch": 560} {"train_loss": -9.68587589263916, "global_step": 94095, "epoch": 560} {"train_loss": -9.676609992980957, "global_step": 94096, "epoch": 560} {"train_loss": -9.510395050048828, "global_step": 94097, "epoch": 560} {"train_loss": -9.304381370544434, "global_step": 94098, "epoch": 560} {"train_loss": -9.434232711791992, "global_step": 94099, "epoch": 560} {"train_loss": -9.84765338897705, "global_step": 94100, "epoch": 560} {"train_loss": -9.84683609008789, "global_step": 94101, "epoch": 560} {"train_loss": -9.72933578491211, "global_step": 94102, "epoch": 560} {"train_loss": -9.799938201904297, "global_step": 94103, "epoch": 560} {"train_loss": -9.685640335083008, "global_step": 94104, "epoch": 560} {"train_loss": -9.853014945983887, "global_step": 94105, "epoch": 560} {"train_loss": -9.622962951660156, "global_step": 94106, "epoch": 560} {"train_loss": -9.682697296142578, "global_step": 94107, "epoch": 560} {"train_loss": -9.883333206176758, "global_step": 94108, "epoch": 560} {"train_loss": -9.693687438964844, "global_step": 94109, "epoch": 560} {"train_loss": -9.848796844482422, "global_step": 94110, "epoch": 560} {"train_loss": -9.625929832458496, "global_step": 94111, "epoch": 560} {"train_loss": -9.135169982910156, "global_step": 94112, "epoch": 560} {"train_loss": -9.568537712097168, "global_step": 94113, "epoch": 560} {"train_loss": -9.393763542175293, "global_step": 94114, "epoch": 560} {"train_loss": -9.548431396484375, "global_step": 94115, "epoch": 560} {"train_loss": -9.286214828491211, "global_step": 94116, "epoch": 560} {"train_loss": -9.592290878295898, "global_step": 94117, "epoch": 560} {"train_loss": -9.397552490234375, "global_step": 94118, "epoch": 560} {"train_loss": -9.524542808532715, "global_step": 94119, "epoch": 560} {"train_loss": -9.719470977783203, "global_step": 94120, "epoch": 560} {"train_loss": -9.460660934448242, "global_step": 94121, "epoch": 560} {"train_loss": -9.741080284118652, "global_step": 94122, "epoch": 560} {"train_loss": -9.598881721496582, "global_step": 94123, "epoch": 560} {"train_loss": -9.493398666381836, "global_step": 94124, "epoch": 560} {"train_loss": -9.656818389892578, "global_step": 94125, "epoch": 560} {"train_loss": -9.614688873291016, "global_step": 94126, "epoch": 560} {"train_loss": -9.513823509216309, "global_step": 94127, "epoch": 560} {"train_loss": -9.42373275756836, "global_step": 94128, "epoch": 560} {"train_loss": -9.660552978515625, "global_step": 94129, "epoch": 560} {"train_loss": -9.985406875610352, "global_step": 94130, "epoch": 560} {"train_loss": -9.747888565063477, "global_step": 94131, "epoch": 560} {"train_loss": -9.75403881072998, "global_step": 94132, "epoch": 560} {"train_loss": -9.52469253540039, "global_step": 94133, "epoch": 560} {"train_loss": -9.750676155090332, "global_step": 94134, "epoch": 560} {"train_loss": -10.085674285888672, "global_step": 94135, "epoch": 560} {"train_loss": -9.663490295410156, "global_step": 94136, "epoch": 560} {"train_loss": -9.753307342529297, "global_step": 94137, "epoch": 560} {"train_loss": -9.72968578338623, "global_step": 94138, "epoch": 560} {"train_loss": -9.155839920043945, "global_step": 94139, "epoch": 560} {"train_loss": -9.63589096069336, "global_step": 94140, "epoch": 560} {"train_loss": -9.5430326461792, "global_step": 94141, "epoch": 560} {"train_loss": -9.83777141571045, "global_step": 94142, "epoch": 560} {"train_loss": -9.429553985595703, "global_step": 94143, "epoch": 560} {"train_loss": -9.56491470336914, "global_step": 94144, "epoch": 560} {"train_loss": -9.428537368774414, "global_step": 94145, "epoch": 560} {"train_loss": -9.308368682861328, "global_step": 94146, "epoch": 560} {"train_loss": -9.736342430114746, "global_step": 94147, "epoch": 560} {"train_loss": -9.640510559082031, "global_step": 94148, "epoch": 560} {"train_loss": -9.529841423034668, "global_step": 94149, "epoch": 560} {"train_loss": -9.512210845947266, "global_step": 94150, "epoch": 560} {"train_loss": -9.287296295166016, "global_step": 94151, "epoch": 560} {"train_loss": -9.398712158203125, "global_step": 94152, "epoch": 560} {"train_loss": -9.518505096435547, "global_step": 94153, "epoch": 560} {"train_loss": -9.789993286132812, "global_step": 94154, "epoch": 560} {"train_loss": -9.39659309387207, "global_step": 94155, "epoch": 560} {"train_loss": -9.61034870147705, "global_step": 94156, "epoch": 560} {"train_loss": -9.258636474609375, "global_step": 94157, "epoch": 560} {"train_loss": -9.46898078918457, "global_step": 94158, "epoch": 560} {"train_loss": -9.479974746704102, "global_step": 94159, "epoch": 560} {"train_loss": -9.522624969482422, "global_step": 94160, "epoch": 560} {"train_loss": -9.545454978942871, "global_step": 94161, "epoch": 560} {"train_loss": -9.699599266052246, "global_step": 94162, "epoch": 560} {"train_loss": -9.67329216003418, "global_step": 94163, "epoch": 560} {"train_loss": -9.537689208984375, "global_step": 94164, "epoch": 560} {"train_loss": -9.616968154907227, "global_step": 94165, "epoch": 560} {"train_loss": -9.310855865478516, "global_step": 94166, "epoch": 560} {"train_loss": -9.620095252990723, "global_step": 94167, "epoch": 560} {"train_loss": -9.46581745147705, "global_step": 94168, "epoch": 560} {"train_loss": -9.405843734741211, "global_step": 94169, "epoch": 560} {"train_loss": -9.331854820251465, "global_step": 94170, "epoch": 560} {"train_loss": -9.493292808532715, "global_step": 94171, "epoch": 560} {"train_loss": -9.370321273803711, "global_step": 94172, "epoch": 560} {"train_loss": -9.72872543334961, "global_step": 94173, "epoch": 560} {"train_loss": -9.642232894897461, "global_step": 94174, "epoch": 560} {"train_loss": -9.739551544189453, "global_step": 94175, "epoch": 560} {"train_loss": -9.774977684020996, "global_step": 94176, "epoch": 560} {"train_loss": -9.665304183959961, "global_step": 94177, "epoch": 560} {"train_loss": -9.586074829101562, "global_step": 94178, "epoch": 560} {"train_loss": -9.957818984985352, "global_step": 94179, "epoch": 560} {"train_loss": -9.721641540527344, "global_step": 94180, "epoch": 560} {"train_loss": -9.773588180541992, "global_step": 94181, "epoch": 560} {"train_loss": -9.583828926086426, "global_step": 94182, "epoch": 560} {"train_loss": -9.66009521484375, "global_step": 94183, "epoch": 560} {"train_loss": -9.553426742553711, "global_step": 94184, "epoch": 560} {"train_loss": -9.687232971191406, "global_step": 94185, "epoch": 560} {"train_loss": -9.827486038208008, "global_step": 94186, "epoch": 560} {"train_loss": -9.689188003540039, "global_step": 94187, "epoch": 560} {"train_loss": -9.836906433105469, "global_step": 94188, "epoch": 560} {"train_loss": -9.770231246948242, "global_step": 94189, "epoch": 560} {"train_loss": -9.88996410369873, "global_step": 94190, "epoch": 560} {"train_loss": -9.786459922790527, "global_step": 94191, "epoch": 560} {"train_loss": -9.573991775512695, "global_step": 94192, "epoch": 560} {"train_loss": -9.527260780334473, "global_step": 94193, "epoch": 560} {"train_loss": -9.400369644165039, "global_step": 94194, "epoch": 560} {"train_loss": -9.608572006225586, "global_step": 94195, "epoch": 560} {"train_loss": -9.77712631225586, "global_step": 94196, "epoch": 560} {"train_loss": -9.609245300292969, "global_step": 94197, "epoch": 560} {"train_loss": -9.592504501342773, "global_step": 94198, "epoch": 560} {"train_loss": -9.551962852478027, "global_step": 94199, "epoch": 560} {"train_loss": -9.809659957885742, "global_step": 94200, "epoch": 560} {"train_loss": -9.377248764038086, "global_step": 94201, "epoch": 560} {"train_loss": -9.358159065246582, "global_step": 94202, "epoch": 560} {"train_loss": -9.196636199951172, "global_step": 94203, "epoch": 560} {"train_loss": -9.358939170837402, "global_step": 94204, "epoch": 560} {"train_loss": -9.464225769042969, "global_step": 94205, "epoch": 560} {"train_loss": -9.359699249267578, "global_step": 94206, "epoch": 560} {"train_loss": -9.56039047241211, "global_step": 94207, "epoch": 560} {"train_loss": -9.220352172851562, "global_step": 94208, "epoch": 560} {"train_loss": -9.668253898620605, "global_step": 94209, "epoch": 560} {"train_loss": -9.444145202636719, "global_step": 94210, "epoch": 560} {"train_loss": -9.333420753479004, "global_step": 94211, "epoch": 560} {"train_loss": -9.536552429199219, "global_step": 94212, "epoch": 560} {"train_loss": -9.478546142578125, "global_step": 94213, "epoch": 560} {"train_loss": -9.629663467407227, "global_step": 94214, "epoch": 560} {"train_loss": -9.551136016845703, "global_step": 94215, "epoch": 560} {"train_loss": -9.660493850708008, "global_step": 94216, "epoch": 560} {"train_loss": -9.792654037475586, "global_step": 94217, "epoch": 560} {"train_loss": -9.409589767456055, "global_step": 94218, "epoch": 560} {"train_loss": -9.544965744018555, "global_step": 94219, "epoch": 560} {"train_loss": -9.910000801086426, "global_step": 94220, "epoch": 560} {"train_loss": -9.612059593200684, "global_step": 94221, "epoch": 560} {"train_loss": -9.817243576049805, "global_step": 94222, "epoch": 560} {"train_loss": -9.624634742736816, "global_step": 94223, "epoch": 560} {"train_loss": -9.472339630126953, "global_step": 94224, "epoch": 560} {"train_loss": -9.670639038085938, "global_step": 94225, "epoch": 560} {"train_loss": -9.27669620513916, "global_step": 94226, "epoch": 560} {"train_loss": -9.588785171508789, "global_step": 94227, "epoch": 560} {"train_loss": -9.798052787780762, "global_step": 94228, "epoch": 560} {"train_loss": -9.613811492919922, "global_step": 94229, "epoch": 560} {"train_loss": -9.652429580688477, "global_step": 94230, "epoch": 560} {"train_loss": -9.712617874145508, "global_step": 94231, "epoch": 560} {"train_loss": -9.530767440795898, "global_step": 94232, "epoch": 560} {"train_loss": -9.812535285949707, "global_step": 94233, "epoch": 560} {"train_loss": -9.617663383483887, "global_step": 94234, "epoch": 560} {"train_loss": -9.986486434936523, "global_step": 94235, "epoch": 560} {"train_loss": -9.614990234375, "global_step": 94236, "epoch": 560} {"train_loss": -9.989876747131348, "global_step": 94237, "epoch": 560} {"train_loss": -9.730058670043945, "global_step": 94238, "epoch": 560} {"train_loss": -9.721702575683594, "global_step": 94239, "epoch": 560} {"train_loss": -9.748576164245605, "global_step": 94240, "epoch": 560} {"train_loss": -9.666139602661133, "global_step": 94241, "epoch": 560} {"train_loss": -9.614080429077148, "global_step": 94242, "epoch": 560} {"train_loss": -9.436298370361328, "global_step": 94243, "epoch": 560} {"train_loss": -9.540706634521484, "global_step": 94244, "epoch": 560} {"train_loss": -9.518627166748047, "global_step": 94245, "epoch": 560} {"train_loss": -9.439634323120117, "global_step": 94246, "epoch": 560} {"train_loss": -9.57828354267847, "global_step": 94247, "epoch": 560, "val_loss": 203017.96875, "train_action_mse_error": 4.1769304275512695} {"train_loss": -9.373128890991211, "global_step": 94248, "epoch": 561} {"train_loss": -9.287736892700195, "global_step": 94249, "epoch": 561} {"train_loss": -9.349570274353027, "global_step": 94250, "epoch": 561} {"train_loss": -9.317734718322754, "global_step": 94251, "epoch": 561} {"train_loss": -9.225862503051758, "global_step": 94252, "epoch": 561} {"train_loss": -9.770971298217773, "global_step": 94253, "epoch": 561} {"train_loss": -9.420385360717773, "global_step": 94254, "epoch": 561} {"train_loss": -9.311354637145996, "global_step": 94255, "epoch": 561} {"train_loss": -9.551434516906738, "global_step": 94256, "epoch": 561} {"train_loss": -9.358905792236328, "global_step": 94257, "epoch": 561} {"train_loss": -9.152996063232422, "global_step": 94258, "epoch": 561} {"train_loss": -9.350982666015625, "global_step": 94259, "epoch": 561} {"train_loss": -9.475988388061523, "global_step": 94260, "epoch": 561} {"train_loss": -9.282173156738281, "global_step": 94261, "epoch": 561} {"train_loss": -9.458538055419922, "global_step": 94262, "epoch": 561} {"train_loss": -9.226943969726562, "global_step": 94263, "epoch": 561} {"train_loss": -9.45423698425293, "global_step": 94264, "epoch": 561} {"train_loss": -9.65278434753418, "global_step": 94265, "epoch": 561} {"train_loss": -9.66683578491211, "global_step": 94266, "epoch": 561} {"train_loss": -9.519701957702637, "global_step": 94267, "epoch": 561} {"train_loss": -9.58803653717041, "global_step": 94268, "epoch": 561} {"train_loss": -9.43229866027832, "global_step": 94269, "epoch": 561} {"train_loss": -9.496030807495117, "global_step": 94270, "epoch": 561} {"train_loss": -9.28554630279541, "global_step": 94271, "epoch": 561} {"train_loss": -9.56633186340332, "global_step": 94272, "epoch": 561} {"train_loss": -9.667037963867188, "global_step": 94273, "epoch": 561} {"train_loss": -9.514436721801758, "global_step": 94274, "epoch": 561} {"train_loss": -9.744665145874023, "global_step": 94275, "epoch": 561} {"train_loss": -9.42275619506836, "global_step": 94276, "epoch": 561} {"train_loss": -9.613277435302734, "global_step": 94277, "epoch": 561} {"train_loss": -9.517556190490723, "global_step": 94278, "epoch": 561} {"train_loss": -9.663846969604492, "global_step": 94279, "epoch": 561} {"train_loss": -9.735176086425781, "global_step": 94280, "epoch": 561} {"train_loss": -9.66202163696289, "global_step": 94281, "epoch": 561} {"train_loss": -9.677495002746582, "global_step": 94282, "epoch": 561} {"train_loss": -9.63741683959961, "global_step": 94283, "epoch": 561} {"train_loss": -9.5810546875, "global_step": 94284, "epoch": 561} {"train_loss": -9.423543930053711, "global_step": 94285, "epoch": 561} {"train_loss": -9.34278392791748, "global_step": 94286, "epoch": 561} {"train_loss": -9.49262809753418, "global_step": 94287, "epoch": 561} {"train_loss": -9.846624374389648, "global_step": 94288, "epoch": 561} {"train_loss": -9.617317199707031, "global_step": 94289, "epoch": 561} {"train_loss": -9.669336318969727, "global_step": 94290, "epoch": 561} {"train_loss": -9.647700309753418, "global_step": 94291, "epoch": 561} {"train_loss": -9.731413841247559, "global_step": 94292, "epoch": 561} {"train_loss": -9.73541259765625, "global_step": 94293, "epoch": 561} {"train_loss": -9.710289001464844, "global_step": 94294, "epoch": 561} {"train_loss": -9.5593843460083, "global_step": 94295, "epoch": 561} {"train_loss": -9.615767478942871, "global_step": 94296, "epoch": 561} {"train_loss": -9.570880889892578, "global_step": 94297, "epoch": 561} {"train_loss": -9.187618255615234, "global_step": 94298, "epoch": 561} {"train_loss": -9.628280639648438, "global_step": 94299, "epoch": 561} {"train_loss": -9.5029878616333, "global_step": 94300, "epoch": 561} {"train_loss": -9.445613861083984, "global_step": 94301, "epoch": 561} {"train_loss": -9.609809875488281, "global_step": 94302, "epoch": 561} {"train_loss": -9.770687103271484, "global_step": 94303, "epoch": 561} {"train_loss": -9.602006912231445, "global_step": 94304, "epoch": 561} {"train_loss": -9.37755012512207, "global_step": 94305, "epoch": 561} {"train_loss": -9.59728717803955, "global_step": 94306, "epoch": 561} {"train_loss": -9.64047908782959, "global_step": 94307, "epoch": 561} {"train_loss": -9.6943941116333, "global_step": 94308, "epoch": 561} {"train_loss": -9.721407890319824, "global_step": 94309, "epoch": 561} {"train_loss": -9.613729476928711, "global_step": 94310, "epoch": 561} {"train_loss": -9.776632308959961, "global_step": 94311, "epoch": 561} {"train_loss": -9.55160903930664, "global_step": 94312, "epoch": 561} {"train_loss": -9.528766632080078, "global_step": 94313, "epoch": 561} {"train_loss": -9.84600830078125, "global_step": 94314, "epoch": 561} {"train_loss": -9.28250789642334, "global_step": 94315, "epoch": 561} {"train_loss": -9.673762321472168, "global_step": 94316, "epoch": 561} {"train_loss": -9.79413890838623, "global_step": 94317, "epoch": 561} {"train_loss": -9.307785034179688, "global_step": 94318, "epoch": 561} {"train_loss": -9.099163055419922, "global_step": 94319, "epoch": 561} {"train_loss": -9.4276762008667, "global_step": 94320, "epoch": 561} {"train_loss": -9.156794548034668, "global_step": 94321, "epoch": 561} {"train_loss": -9.242297172546387, "global_step": 94322, "epoch": 561} {"train_loss": -9.530256271362305, "global_step": 94323, "epoch": 561} {"train_loss": -9.590907096862793, "global_step": 94324, "epoch": 561} {"train_loss": -9.543275833129883, "global_step": 94325, "epoch": 561} {"train_loss": -9.401557922363281, "global_step": 94326, "epoch": 561} {"train_loss": -9.516519546508789, "global_step": 94327, "epoch": 561} {"train_loss": -9.603192329406738, "global_step": 94328, "epoch": 561} {"train_loss": -9.464092254638672, "global_step": 94329, "epoch": 561} {"train_loss": -9.439888954162598, "global_step": 94330, "epoch": 561} {"train_loss": -9.763982772827148, "global_step": 94331, "epoch": 561} {"train_loss": -9.223691940307617, "global_step": 94332, "epoch": 561} {"train_loss": -9.150859832763672, "global_step": 94333, "epoch": 561} {"train_loss": -9.403079986572266, "global_step": 94334, "epoch": 561} {"train_loss": -9.12095832824707, "global_step": 94335, "epoch": 561} {"train_loss": -9.83450698852539, "global_step": 94336, "epoch": 561} {"train_loss": -9.148662567138672, "global_step": 94337, "epoch": 561} {"train_loss": -9.442398071289062, "global_step": 94338, "epoch": 561} {"train_loss": -9.659692764282227, "global_step": 94339, "epoch": 561} {"train_loss": -9.473047256469727, "global_step": 94340, "epoch": 561} {"train_loss": -9.523775100708008, "global_step": 94341, "epoch": 561} {"train_loss": -9.708623886108398, "global_step": 94342, "epoch": 561} {"train_loss": -9.622903823852539, "global_step": 94343, "epoch": 561} {"train_loss": -9.412355422973633, "global_step": 94344, "epoch": 561} {"train_loss": -9.668902397155762, "global_step": 94345, "epoch": 561} {"train_loss": -9.368630409240723, "global_step": 94346, "epoch": 561} {"train_loss": -9.364696502685547, "global_step": 94347, "epoch": 561} {"train_loss": -9.458364486694336, "global_step": 94348, "epoch": 561} {"train_loss": -9.770580291748047, "global_step": 94349, "epoch": 561} {"train_loss": -9.499101638793945, "global_step": 94350, "epoch": 561} {"train_loss": -9.742851257324219, "global_step": 94351, "epoch": 561} {"train_loss": -9.73681640625, "global_step": 94352, "epoch": 561} {"train_loss": -9.678009033203125, "global_step": 94353, "epoch": 561} {"train_loss": -9.710823059082031, "global_step": 94354, "epoch": 561} {"train_loss": -9.580568313598633, "global_step": 94355, "epoch": 561} {"train_loss": -9.32253360748291, "global_step": 94356, "epoch": 561} {"train_loss": -9.746295928955078, "global_step": 94357, "epoch": 561} {"train_loss": -9.473109245300293, "global_step": 94358, "epoch": 561} {"train_loss": -9.450443267822266, "global_step": 94359, "epoch": 561} {"train_loss": -9.691725730895996, "global_step": 94360, "epoch": 561} {"train_loss": -9.10689640045166, "global_step": 94361, "epoch": 561} {"train_loss": -9.648416519165039, "global_step": 94362, "epoch": 561} {"train_loss": -9.51558780670166, "global_step": 94363, "epoch": 561} {"train_loss": -9.317113876342773, "global_step": 94364, "epoch": 561} {"train_loss": -9.25522518157959, "global_step": 94365, "epoch": 561} {"train_loss": -9.526060104370117, "global_step": 94366, "epoch": 561} {"train_loss": -9.602100372314453, "global_step": 94367, "epoch": 561} {"train_loss": -9.527074813842773, "global_step": 94368, "epoch": 561} {"train_loss": -9.662455558776855, "global_step": 94369, "epoch": 561} {"train_loss": -9.662210464477539, "global_step": 94370, "epoch": 561} {"train_loss": -9.509919166564941, "global_step": 94371, "epoch": 561} {"train_loss": -9.46701717376709, "global_step": 94372, "epoch": 561} {"train_loss": -9.574922561645508, "global_step": 94373, "epoch": 561} {"train_loss": -9.463018417358398, "global_step": 94374, "epoch": 561} {"train_loss": -9.68493366241455, "global_step": 94375, "epoch": 561} {"train_loss": -9.613245010375977, "global_step": 94376, "epoch": 561} {"train_loss": -9.64621353149414, "global_step": 94377, "epoch": 561} {"train_loss": -9.511597633361816, "global_step": 94378, "epoch": 561} {"train_loss": -9.625683784484863, "global_step": 94379, "epoch": 561} {"train_loss": -9.502908706665039, "global_step": 94380, "epoch": 561} {"train_loss": -9.533084869384766, "global_step": 94381, "epoch": 561} {"train_loss": -9.332610130310059, "global_step": 94382, "epoch": 561} {"train_loss": -8.660198211669922, "global_step": 94383, "epoch": 561} {"train_loss": -9.540133476257324, "global_step": 94384, "epoch": 561} {"train_loss": -9.346428871154785, "global_step": 94385, "epoch": 561} {"train_loss": -9.007411003112793, "global_step": 94386, "epoch": 561} {"train_loss": -9.293554306030273, "global_step": 94387, "epoch": 561} {"train_loss": -8.775249481201172, "global_step": 94388, "epoch": 561} {"train_loss": -9.283538818359375, "global_step": 94389, "epoch": 561} {"train_loss": -9.340688705444336, "global_step": 94390, "epoch": 561} {"train_loss": -9.172865867614746, "global_step": 94391, "epoch": 561} {"train_loss": -9.467050552368164, "global_step": 94392, "epoch": 561} {"train_loss": -9.312026023864746, "global_step": 94393, "epoch": 561} {"train_loss": -9.334737777709961, "global_step": 94394, "epoch": 561} {"train_loss": -9.351003646850586, "global_step": 94395, "epoch": 561} {"train_loss": -9.155013084411621, "global_step": 94396, "epoch": 561} {"train_loss": -9.206274032592773, "global_step": 94397, "epoch": 561} {"train_loss": -8.923929214477539, "global_step": 94398, "epoch": 561} {"train_loss": -9.360719680786133, "global_step": 94399, "epoch": 561} {"train_loss": -9.09227466583252, "global_step": 94400, "epoch": 561} {"train_loss": -9.443010330200195, "global_step": 94401, "epoch": 561} {"train_loss": -8.873125076293945, "global_step": 94402, "epoch": 561} {"train_loss": -9.153656005859375, "global_step": 94403, "epoch": 561} {"train_loss": -9.33922004699707, "global_step": 94404, "epoch": 561} {"train_loss": -9.192527770996094, "global_step": 94405, "epoch": 561} {"train_loss": -9.322328567504883, "global_step": 94406, "epoch": 561} {"train_loss": -9.45012378692627, "global_step": 94407, "epoch": 561} {"train_loss": -9.520712852478027, "global_step": 94408, "epoch": 561} {"train_loss": -9.303232192993164, "global_step": 94409, "epoch": 561} {"train_loss": -9.405829429626465, "global_step": 94410, "epoch": 561} {"train_loss": -9.576303482055664, "global_step": 94411, "epoch": 561} {"train_loss": -9.631401062011719, "global_step": 94412, "epoch": 561} {"train_loss": -9.555692672729492, "global_step": 94413, "epoch": 561} {"train_loss": -9.39716625213623, "global_step": 94414, "epoch": 561} {"train_loss": -9.473960059029716, "global_step": 94415, "epoch": 561, "val_loss": 205831.359375} {"train_loss": -9.610954284667969, "global_step": 94416, "epoch": 562} {"train_loss": -9.610794067382812, "global_step": 94417, "epoch": 562} {"train_loss": -9.557700157165527, "global_step": 94418, "epoch": 562} {"train_loss": -9.64138412475586, "global_step": 94419, "epoch": 562} {"train_loss": -9.639204025268555, "global_step": 94420, "epoch": 562} {"train_loss": -9.873939514160156, "global_step": 94421, "epoch": 562} {"train_loss": -9.743122100830078, "global_step": 94422, "epoch": 562} {"train_loss": -9.51090145111084, "global_step": 94423, "epoch": 562} {"train_loss": -9.870086669921875, "global_step": 94424, "epoch": 562} {"train_loss": -9.965337753295898, "global_step": 94425, "epoch": 562} {"train_loss": -9.801603317260742, "global_step": 94426, "epoch": 562} {"train_loss": -9.878042221069336, "global_step": 94427, "epoch": 562} {"train_loss": -9.938344955444336, "global_step": 94428, "epoch": 562} {"train_loss": -9.746551513671875, "global_step": 94429, "epoch": 562} {"train_loss": -9.682012557983398, "global_step": 94430, "epoch": 562} {"train_loss": -9.51435661315918, "global_step": 94431, "epoch": 562} {"train_loss": -9.786836624145508, "global_step": 94432, "epoch": 562} {"train_loss": -9.668075561523438, "global_step": 94433, "epoch": 562} {"train_loss": -9.883113861083984, "global_step": 94434, "epoch": 562} {"train_loss": -9.101123809814453, "global_step": 94435, "epoch": 562} {"train_loss": -9.60107421875, "global_step": 94436, "epoch": 562} {"train_loss": -9.505342483520508, "global_step": 94437, "epoch": 562} {"train_loss": -8.860869407653809, "global_step": 94438, "epoch": 562} {"train_loss": -9.204864501953125, "global_step": 94439, "epoch": 562} {"train_loss": -8.670379638671875, "global_step": 94440, "epoch": 562} {"train_loss": -9.16089153289795, "global_step": 94441, "epoch": 562} {"train_loss": -8.481647491455078, "global_step": 94442, "epoch": 562} {"train_loss": -9.30593490600586, "global_step": 94443, "epoch": 562} {"train_loss": -8.697659492492676, "global_step": 94444, "epoch": 562} {"train_loss": -9.538955688476562, "global_step": 94445, "epoch": 562} {"train_loss": -9.204560279846191, "global_step": 94446, "epoch": 562} {"train_loss": -9.4457426071167, "global_step": 94447, "epoch": 562} {"train_loss": -9.481184005737305, "global_step": 94448, "epoch": 562} {"train_loss": -9.527068138122559, "global_step": 94449, "epoch": 562} {"train_loss": -9.423593521118164, "global_step": 94450, "epoch": 562} {"train_loss": -9.324060440063477, "global_step": 94451, "epoch": 562} {"train_loss": -9.520336151123047, "global_step": 94452, "epoch": 562} {"train_loss": -9.55611515045166, "global_step": 94453, "epoch": 562} {"train_loss": -9.641542434692383, "global_step": 94454, "epoch": 562} {"train_loss": -9.437204360961914, "global_step": 94455, "epoch": 562} {"train_loss": -9.577350616455078, "global_step": 94456, "epoch": 562} {"train_loss": -9.472420692443848, "global_step": 94457, "epoch": 562} {"train_loss": -9.603154182434082, "global_step": 94458, "epoch": 562} {"train_loss": -9.531614303588867, "global_step": 94459, "epoch": 562} {"train_loss": -9.602033615112305, "global_step": 94460, "epoch": 562} {"train_loss": -9.54236888885498, "global_step": 94461, "epoch": 562} {"train_loss": -9.486557960510254, "global_step": 94462, "epoch": 562} {"train_loss": -9.645179748535156, "global_step": 94463, "epoch": 562} {"train_loss": -9.407064437866211, "global_step": 94464, "epoch": 562} {"train_loss": -9.482447624206543, "global_step": 94465, "epoch": 562} {"train_loss": -9.580196380615234, "global_step": 94466, "epoch": 562} {"train_loss": -9.614694595336914, "global_step": 94467, "epoch": 562} {"train_loss": -9.610604286193848, "global_step": 94468, "epoch": 562} {"train_loss": -9.687454223632812, "global_step": 94469, "epoch": 562} {"train_loss": -9.612557411193848, "global_step": 94470, "epoch": 562} {"train_loss": -9.804733276367188, "global_step": 94471, "epoch": 562} {"train_loss": -9.425363540649414, "global_step": 94472, "epoch": 562} {"train_loss": -9.663434028625488, "global_step": 94473, "epoch": 562} {"train_loss": -9.693414688110352, "global_step": 94474, "epoch": 562} {"train_loss": -9.59592342376709, "global_step": 94475, "epoch": 562} {"train_loss": -9.651717185974121, "global_step": 94476, "epoch": 562} {"train_loss": -9.838019371032715, "global_step": 94477, "epoch": 562} {"train_loss": -9.651792526245117, "global_step": 94478, "epoch": 562} {"train_loss": -9.699546813964844, "global_step": 94479, "epoch": 562} {"train_loss": -9.62864875793457, "global_step": 94480, "epoch": 562} {"train_loss": -9.911750793457031, "global_step": 94481, "epoch": 562} {"train_loss": -9.380853652954102, "global_step": 94482, "epoch": 562} {"train_loss": -9.357056617736816, "global_step": 94483, "epoch": 562} {"train_loss": -9.820032119750977, "global_step": 94484, "epoch": 562} {"train_loss": -9.764644622802734, "global_step": 94485, "epoch": 562} {"train_loss": -9.657236099243164, "global_step": 94486, "epoch": 562} {"train_loss": -9.43215560913086, "global_step": 94487, "epoch": 562} {"train_loss": -9.80064868927002, "global_step": 94488, "epoch": 562} {"train_loss": -9.436320304870605, "global_step": 94489, "epoch": 562} {"train_loss": -9.671564102172852, "global_step": 94490, "epoch": 562} {"train_loss": -9.603233337402344, "global_step": 94491, "epoch": 562} {"train_loss": -9.756799697875977, "global_step": 94492, "epoch": 562} {"train_loss": -9.79035758972168, "global_step": 94493, "epoch": 562} {"train_loss": -9.849860191345215, "global_step": 94494, "epoch": 562} {"train_loss": -9.822673797607422, "global_step": 94495, "epoch": 562} {"train_loss": -9.67111587524414, "global_step": 94496, "epoch": 562} {"train_loss": -9.676467895507812, "global_step": 94497, "epoch": 562} {"train_loss": -9.760721206665039, "global_step": 94498, "epoch": 562} {"train_loss": -9.652070999145508, "global_step": 94499, "epoch": 562} {"train_loss": -9.440604209899902, "global_step": 94500, "epoch": 562} {"train_loss": -9.450199127197266, "global_step": 94501, "epoch": 562} {"train_loss": -9.621862411499023, "global_step": 94502, "epoch": 562} {"train_loss": -9.481999397277832, "global_step": 94503, "epoch": 562} {"train_loss": -9.381926536560059, "global_step": 94504, "epoch": 562} {"train_loss": -9.752474784851074, "global_step": 94505, "epoch": 562} {"train_loss": -9.60733413696289, "global_step": 94506, "epoch": 562} {"train_loss": -9.669666290283203, "global_step": 94507, "epoch": 562} {"train_loss": -9.463165283203125, "global_step": 94508, "epoch": 562} {"train_loss": -9.857902526855469, "global_step": 94509, "epoch": 562} {"train_loss": -9.650970458984375, "global_step": 94510, "epoch": 562} {"train_loss": -9.611151695251465, "global_step": 94511, "epoch": 562} {"train_loss": -9.49276065826416, "global_step": 94512, "epoch": 562} {"train_loss": -9.567736625671387, "global_step": 94513, "epoch": 562} {"train_loss": -9.661089897155762, "global_step": 94514, "epoch": 562} {"train_loss": -9.847620010375977, "global_step": 94515, "epoch": 562} {"train_loss": -9.721565246582031, "global_step": 94516, "epoch": 562} {"train_loss": -9.70081901550293, "global_step": 94517, "epoch": 562} {"train_loss": -9.764741897583008, "global_step": 94518, "epoch": 562} {"train_loss": -9.577478408813477, "global_step": 94519, "epoch": 562} {"train_loss": -9.41903305053711, "global_step": 94520, "epoch": 562} {"train_loss": -9.80096435546875, "global_step": 94521, "epoch": 562} {"train_loss": -9.558155059814453, "global_step": 94522, "epoch": 562} {"train_loss": -9.823400497436523, "global_step": 94523, "epoch": 562} {"train_loss": -9.835851669311523, "global_step": 94524, "epoch": 562} {"train_loss": -9.504961013793945, "global_step": 94525, "epoch": 562} {"train_loss": -9.764762878417969, "global_step": 94526, "epoch": 562} {"train_loss": -9.761184692382812, "global_step": 94527, "epoch": 562} {"train_loss": -9.861442565917969, "global_step": 94528, "epoch": 562} {"train_loss": -9.425455093383789, "global_step": 94529, "epoch": 562} {"train_loss": -9.796432495117188, "global_step": 94530, "epoch": 562} {"train_loss": -9.823543548583984, "global_step": 94531, "epoch": 562} {"train_loss": -9.79654312133789, "global_step": 94532, "epoch": 562} {"train_loss": -9.77485179901123, "global_step": 94533, "epoch": 562} {"train_loss": -9.617752075195312, "global_step": 94534, "epoch": 562} {"train_loss": -9.463842391967773, "global_step": 94535, "epoch": 562} {"train_loss": -9.527223587036133, "global_step": 94536, "epoch": 562} {"train_loss": -9.384693145751953, "global_step": 94537, "epoch": 562} {"train_loss": -9.228379249572754, "global_step": 94538, "epoch": 562} {"train_loss": -9.193668365478516, "global_step": 94539, "epoch": 562} {"train_loss": -9.397846221923828, "global_step": 94540, "epoch": 562} {"train_loss": -9.533592224121094, "global_step": 94541, "epoch": 562} {"train_loss": -9.288707733154297, "global_step": 94542, "epoch": 562} {"train_loss": -9.484439849853516, "global_step": 94543, "epoch": 562} {"train_loss": -9.557239532470703, "global_step": 94544, "epoch": 562} {"train_loss": -9.634420394897461, "global_step": 94545, "epoch": 562} {"train_loss": -9.522198677062988, "global_step": 94546, "epoch": 562} {"train_loss": -9.469999313354492, "global_step": 94547, "epoch": 562} {"train_loss": -9.715723037719727, "global_step": 94548, "epoch": 562} {"train_loss": -9.71700668334961, "global_step": 94549, "epoch": 562} {"train_loss": -9.728326797485352, "global_step": 94550, "epoch": 562} {"train_loss": -9.565227508544922, "global_step": 94551, "epoch": 562} {"train_loss": -9.464941024780273, "global_step": 94552, "epoch": 562} {"train_loss": -9.563140869140625, "global_step": 94553, "epoch": 562} {"train_loss": -9.142881393432617, "global_step": 94554, "epoch": 562} {"train_loss": -9.52894115447998, "global_step": 94555, "epoch": 562} {"train_loss": -9.428851127624512, "global_step": 94556, "epoch": 562} {"train_loss": -9.842430114746094, "global_step": 94557, "epoch": 562} {"train_loss": -9.488249778747559, "global_step": 94558, "epoch": 562} {"train_loss": -9.66335391998291, "global_step": 94559, "epoch": 562} {"train_loss": -9.74958610534668, "global_step": 94560, "epoch": 562} {"train_loss": -9.612771987915039, "global_step": 94561, "epoch": 562} {"train_loss": -9.378576278686523, "global_step": 94562, "epoch": 562} {"train_loss": -9.489505767822266, "global_step": 94563, "epoch": 562} {"train_loss": -9.235234260559082, "global_step": 94564, "epoch": 562} {"train_loss": -9.599397659301758, "global_step": 94565, "epoch": 562} {"train_loss": -9.223215103149414, "global_step": 94566, "epoch": 562} {"train_loss": -9.52713394165039, "global_step": 94567, "epoch": 562} {"train_loss": -9.442289352416992, "global_step": 94568, "epoch": 562} {"train_loss": -9.6470308303833, "global_step": 94569, "epoch": 562} {"train_loss": -9.434608459472656, "global_step": 94570, "epoch": 562} {"train_loss": -9.299321174621582, "global_step": 94571, "epoch": 562} {"train_loss": -9.266447067260742, "global_step": 94572, "epoch": 562} {"train_loss": -9.66738510131836, "global_step": 94573, "epoch": 562} {"train_loss": -9.18874740600586, "global_step": 94574, "epoch": 562} {"train_loss": -9.62662124633789, "global_step": 94575, "epoch": 562} {"train_loss": -9.758796691894531, "global_step": 94576, "epoch": 562} {"train_loss": -9.441219329833984, "global_step": 94577, "epoch": 562} {"train_loss": -9.479907035827637, "global_step": 94578, "epoch": 562} {"train_loss": -9.736257553100586, "global_step": 94579, "epoch": 562} {"train_loss": -9.550148010253906, "global_step": 94580, "epoch": 562} {"train_loss": -9.498494148254395, "global_step": 94581, "epoch": 562} {"train_loss": -9.427143096923828, "global_step": 94582, "epoch": 562} {"train_loss": -9.562124570210775, "global_step": 94583, "epoch": 562, "val_loss": 203568.921875} {"train_loss": -9.498626708984375, "global_step": 94584, "epoch": 563} {"train_loss": -9.638711929321289, "global_step": 94585, "epoch": 563} {"train_loss": -9.30775260925293, "global_step": 94586, "epoch": 563} {"train_loss": -9.591005325317383, "global_step": 94587, "epoch": 563} {"train_loss": -9.676979064941406, "global_step": 94588, "epoch": 563} {"train_loss": -9.205875396728516, "global_step": 94589, "epoch": 563} {"train_loss": -9.50742244720459, "global_step": 94590, "epoch": 563} {"train_loss": -9.33620548248291, "global_step": 94591, "epoch": 563} {"train_loss": -9.382078170776367, "global_step": 94592, "epoch": 563} {"train_loss": -9.423307418823242, "global_step": 94593, "epoch": 563} {"train_loss": -9.321017265319824, "global_step": 94594, "epoch": 563} {"train_loss": -9.495783805847168, "global_step": 94595, "epoch": 563} {"train_loss": -9.178730964660645, "global_step": 94596, "epoch": 563} {"train_loss": -9.236062049865723, "global_step": 94597, "epoch": 563} {"train_loss": -9.340509414672852, "global_step": 94598, "epoch": 563} {"train_loss": -9.459428787231445, "global_step": 94599, "epoch": 563} {"train_loss": -9.436090469360352, "global_step": 94600, "epoch": 563} {"train_loss": -9.481393814086914, "global_step": 94601, "epoch": 563} {"train_loss": -9.713799476623535, "global_step": 94602, "epoch": 563} {"train_loss": -9.466453552246094, "global_step": 94603, "epoch": 563} {"train_loss": -9.466678619384766, "global_step": 94604, "epoch": 563} {"train_loss": -9.682395935058594, "global_step": 94605, "epoch": 563} {"train_loss": -9.602327346801758, "global_step": 94606, "epoch": 563} {"train_loss": -9.72463607788086, "global_step": 94607, "epoch": 563} {"train_loss": -9.672874450683594, "global_step": 94608, "epoch": 563} {"train_loss": -9.72643756866455, "global_step": 94609, "epoch": 563} {"train_loss": -9.597770690917969, "global_step": 94610, "epoch": 563} {"train_loss": -9.563095092773438, "global_step": 94611, "epoch": 563} {"train_loss": -9.735572814941406, "global_step": 94612, "epoch": 563} {"train_loss": -9.537424087524414, "global_step": 94613, "epoch": 563} {"train_loss": -9.643287658691406, "global_step": 94614, "epoch": 563} {"train_loss": -9.497182846069336, "global_step": 94615, "epoch": 563} {"train_loss": -9.75211238861084, "global_step": 94616, "epoch": 563} {"train_loss": -9.755348205566406, "global_step": 94617, "epoch": 563} {"train_loss": -9.495285034179688, "global_step": 94618, "epoch": 563} {"train_loss": -9.606414794921875, "global_step": 94619, "epoch": 563} {"train_loss": -9.869772911071777, "global_step": 94620, "epoch": 563} {"train_loss": -9.661279678344727, "global_step": 94621, "epoch": 563} {"train_loss": -9.681947708129883, "global_step": 94622, "epoch": 563} {"train_loss": -9.689017295837402, "global_step": 94623, "epoch": 563} {"train_loss": -9.878679275512695, "global_step": 94624, "epoch": 563} {"train_loss": -9.689634323120117, "global_step": 94625, "epoch": 563} {"train_loss": -9.690290451049805, "global_step": 94626, "epoch": 563} {"train_loss": -9.802316665649414, "global_step": 94627, "epoch": 563} {"train_loss": -9.635265350341797, "global_step": 94628, "epoch": 563} {"train_loss": -9.726378440856934, "global_step": 94629, "epoch": 563} {"train_loss": -9.754988670349121, "global_step": 94630, "epoch": 563} {"train_loss": -9.691446304321289, "global_step": 94631, "epoch": 563} {"train_loss": -9.507259368896484, "global_step": 94632, "epoch": 563} {"train_loss": -9.592948913574219, "global_step": 94633, "epoch": 563} {"train_loss": -9.914773941040039, "global_step": 94634, "epoch": 563} {"train_loss": -9.796701431274414, "global_step": 94635, "epoch": 563} {"train_loss": -9.817154884338379, "global_step": 94636, "epoch": 563} {"train_loss": -9.17398452758789, "global_step": 94637, "epoch": 563} {"train_loss": -9.152828216552734, "global_step": 94638, "epoch": 563} {"train_loss": -9.340285301208496, "global_step": 94639, "epoch": 563} {"train_loss": -9.34446907043457, "global_step": 94640, "epoch": 563} {"train_loss": -9.328292846679688, "global_step": 94641, "epoch": 563} {"train_loss": -9.40580940246582, "global_step": 94642, "epoch": 563} {"train_loss": -9.096000671386719, "global_step": 94643, "epoch": 563} {"train_loss": -9.134971618652344, "global_step": 94644, "epoch": 563} {"train_loss": -9.49356746673584, "global_step": 94645, "epoch": 563} {"train_loss": -9.518699645996094, "global_step": 94646, "epoch": 563} {"train_loss": -9.553976058959961, "global_step": 94647, "epoch": 563} {"train_loss": -9.678808212280273, "global_step": 94648, "epoch": 563} {"train_loss": -9.552410125732422, "global_step": 94649, "epoch": 563} {"train_loss": -9.356451988220215, "global_step": 94650, "epoch": 563} {"train_loss": -9.48063850402832, "global_step": 94651, "epoch": 563} {"train_loss": -9.571972846984863, "global_step": 94652, "epoch": 563} {"train_loss": -9.553424835205078, "global_step": 94653, "epoch": 563} {"train_loss": -9.575499534606934, "global_step": 94654, "epoch": 563} {"train_loss": -9.72048568725586, "global_step": 94655, "epoch": 563} {"train_loss": -9.766136169433594, "global_step": 94656, "epoch": 563} {"train_loss": -9.81950569152832, "global_step": 94657, "epoch": 563} {"train_loss": -9.650367736816406, "global_step": 94658, "epoch": 563} {"train_loss": -9.67146110534668, "global_step": 94659, "epoch": 563} {"train_loss": -9.80126667022705, "global_step": 94660, "epoch": 563} {"train_loss": -9.6041898727417, "global_step": 94661, "epoch": 563} {"train_loss": -9.663970947265625, "global_step": 94662, "epoch": 563} {"train_loss": -10.009925842285156, "global_step": 94663, "epoch": 563} {"train_loss": -9.779672622680664, "global_step": 94664, "epoch": 563} {"train_loss": -9.440849304199219, "global_step": 94665, "epoch": 563} {"train_loss": -9.774547576904297, "global_step": 94666, "epoch": 563} {"train_loss": -9.628204345703125, "global_step": 94667, "epoch": 563} {"train_loss": -9.685016632080078, "global_step": 94668, "epoch": 563} {"train_loss": -9.65805435180664, "global_step": 94669, "epoch": 563} {"train_loss": -9.578205108642578, "global_step": 94670, "epoch": 563} {"train_loss": -9.734886169433594, "global_step": 94671, "epoch": 563} {"train_loss": -9.494791030883789, "global_step": 94672, "epoch": 563} {"train_loss": -9.53952693939209, "global_step": 94673, "epoch": 563} {"train_loss": -9.596940994262695, "global_step": 94674, "epoch": 563} {"train_loss": -9.33443832397461, "global_step": 94675, "epoch": 563} {"train_loss": -9.547656059265137, "global_step": 94676, "epoch": 563} {"train_loss": -9.21432876586914, "global_step": 94677, "epoch": 563} {"train_loss": -9.610219955444336, "global_step": 94678, "epoch": 563} {"train_loss": -9.354568481445312, "global_step": 94679, "epoch": 563} {"train_loss": -9.442061424255371, "global_step": 94680, "epoch": 563} {"train_loss": -9.51736068725586, "global_step": 94681, "epoch": 563} {"train_loss": -9.455819129943848, "global_step": 94682, "epoch": 563} {"train_loss": -9.274565696716309, "global_step": 94683, "epoch": 563} {"train_loss": -9.544137954711914, "global_step": 94684, "epoch": 563} {"train_loss": -9.44466781616211, "global_step": 94685, "epoch": 563} {"train_loss": -9.668978691101074, "global_step": 94686, "epoch": 563} {"train_loss": -9.541704177856445, "global_step": 94687, "epoch": 563} {"train_loss": -9.66035270690918, "global_step": 94688, "epoch": 563} {"train_loss": -9.721295356750488, "global_step": 94689, "epoch": 563} {"train_loss": -9.426645278930664, "global_step": 94690, "epoch": 563} {"train_loss": -9.734821319580078, "global_step": 94691, "epoch": 563} {"train_loss": -9.6351318359375, "global_step": 94692, "epoch": 563} {"train_loss": -9.5908842086792, "global_step": 94693, "epoch": 563} {"train_loss": -9.457599639892578, "global_step": 94694, "epoch": 563} {"train_loss": -9.816906929016113, "global_step": 94695, "epoch": 563} {"train_loss": -9.494810104370117, "global_step": 94696, "epoch": 563} {"train_loss": -9.7940092086792, "global_step": 94697, "epoch": 563} {"train_loss": -9.53631591796875, "global_step": 94698, "epoch": 563} {"train_loss": -9.73346996307373, "global_step": 94699, "epoch": 563} {"train_loss": -9.408035278320312, "global_step": 94700, "epoch": 563} {"train_loss": -9.780862808227539, "global_step": 94701, "epoch": 563} {"train_loss": -9.531808853149414, "global_step": 94702, "epoch": 563} {"train_loss": -9.737264633178711, "global_step": 94703, "epoch": 563} {"train_loss": -9.685348510742188, "global_step": 94704, "epoch": 563} {"train_loss": -9.42931079864502, "global_step": 94705, "epoch": 563} {"train_loss": -9.733808517456055, "global_step": 94706, "epoch": 563} {"train_loss": -9.423189163208008, "global_step": 94707, "epoch": 563} {"train_loss": -9.509747505187988, "global_step": 94708, "epoch": 563} {"train_loss": -9.597175598144531, "global_step": 94709, "epoch": 563} {"train_loss": -9.736738204956055, "global_step": 94710, "epoch": 563} {"train_loss": -9.177377700805664, "global_step": 94711, "epoch": 563} {"train_loss": -9.583353042602539, "global_step": 94712, "epoch": 563} {"train_loss": -9.624414443969727, "global_step": 94713, "epoch": 563} {"train_loss": -9.297876358032227, "global_step": 94714, "epoch": 563} {"train_loss": -9.610430717468262, "global_step": 94715, "epoch": 563} {"train_loss": -9.432826042175293, "global_step": 94716, "epoch": 563} {"train_loss": -9.76537036895752, "global_step": 94717, "epoch": 563} {"train_loss": -9.343795776367188, "global_step": 94718, "epoch": 563} {"train_loss": -9.653192520141602, "global_step": 94719, "epoch": 563} {"train_loss": -9.703367233276367, "global_step": 94720, "epoch": 563} {"train_loss": -9.292999267578125, "global_step": 94721, "epoch": 563} {"train_loss": -8.864782333374023, "global_step": 94722, "epoch": 563} {"train_loss": -9.552247047424316, "global_step": 94723, "epoch": 563} {"train_loss": -9.208866119384766, "global_step": 94724, "epoch": 563} {"train_loss": -8.988266944885254, "global_step": 94725, "epoch": 563} {"train_loss": -9.432854652404785, "global_step": 94726, "epoch": 563} {"train_loss": -9.285179138183594, "global_step": 94727, "epoch": 563} {"train_loss": -9.212614059448242, "global_step": 94728, "epoch": 563} {"train_loss": -9.69510269165039, "global_step": 94729, "epoch": 563} {"train_loss": -9.419822692871094, "global_step": 94730, "epoch": 563} {"train_loss": -9.295244216918945, "global_step": 94731, "epoch": 563} {"train_loss": -9.423199653625488, "global_step": 94732, "epoch": 563} {"train_loss": -9.086182594299316, "global_step": 94733, "epoch": 563} {"train_loss": -9.411767959594727, "global_step": 94734, "epoch": 563} {"train_loss": -9.522295951843262, "global_step": 94735, "epoch": 563} {"train_loss": -9.250970840454102, "global_step": 94736, "epoch": 563} {"train_loss": -9.478038787841797, "global_step": 94737, "epoch": 563} {"train_loss": -9.508459091186523, "global_step": 94738, "epoch": 563} {"train_loss": -9.347345352172852, "global_step": 94739, "epoch": 563} {"train_loss": -9.452493667602539, "global_step": 94740, "epoch": 563} {"train_loss": -9.42515754699707, "global_step": 94741, "epoch": 563} {"train_loss": -9.553367614746094, "global_step": 94742, "epoch": 563} {"train_loss": -9.091790199279785, "global_step": 94743, "epoch": 563} {"train_loss": -9.490336418151855, "global_step": 94744, "epoch": 563} {"train_loss": -9.45115852355957, "global_step": 94745, "epoch": 563} {"train_loss": -9.73035717010498, "global_step": 94746, "epoch": 563} {"train_loss": -9.467416763305664, "global_step": 94747, "epoch": 563} {"train_loss": -9.429780960083008, "global_step": 94748, "epoch": 563} {"train_loss": -9.218982696533203, "global_step": 94749, "epoch": 563} {"train_loss": -9.231332778930664, "global_step": 94750, "epoch": 563} {"train_loss": -9.527431913784572, "global_step": 94751, "epoch": 563, "val_loss": 205106.515625} {"train_loss": -9.414352416992188, "global_step": 94752, "epoch": 564} {"train_loss": -9.312141418457031, "global_step": 94753, "epoch": 564} {"train_loss": -9.644466400146484, "global_step": 94754, "epoch": 564} {"train_loss": -9.698326110839844, "global_step": 94755, "epoch": 564} {"train_loss": -9.415046691894531, "global_step": 94756, "epoch": 564} {"train_loss": -9.585188865661621, "global_step": 94757, "epoch": 564} {"train_loss": -9.565591812133789, "global_step": 94758, "epoch": 564} {"train_loss": -9.742218017578125, "global_step": 94759, "epoch": 564} {"train_loss": -9.797266960144043, "global_step": 94760, "epoch": 564} {"train_loss": -9.71577262878418, "global_step": 94761, "epoch": 564} {"train_loss": -9.560715675354004, "global_step": 94762, "epoch": 564} {"train_loss": -9.764484405517578, "global_step": 94763, "epoch": 564} {"train_loss": -9.607046127319336, "global_step": 94764, "epoch": 564} {"train_loss": -9.656596183776855, "global_step": 94765, "epoch": 564} {"train_loss": -9.609816551208496, "global_step": 94766, "epoch": 564} {"train_loss": -9.602415084838867, "global_step": 94767, "epoch": 564} {"train_loss": -9.894550323486328, "global_step": 94768, "epoch": 564} {"train_loss": -9.73746395111084, "global_step": 94769, "epoch": 564} {"train_loss": -9.656557083129883, "global_step": 94770, "epoch": 564} {"train_loss": -9.567617416381836, "global_step": 94771, "epoch": 564} {"train_loss": -9.903491973876953, "global_step": 94772, "epoch": 564} {"train_loss": -9.804609298706055, "global_step": 94773, "epoch": 564} {"train_loss": -9.67251968383789, "global_step": 94774, "epoch": 564} {"train_loss": -9.653069496154785, "global_step": 94775, "epoch": 564} {"train_loss": -9.425108909606934, "global_step": 94776, "epoch": 564} {"train_loss": -9.613275527954102, "global_step": 94777, "epoch": 564} {"train_loss": -9.783561706542969, "global_step": 94778, "epoch": 564} {"train_loss": -9.843082427978516, "global_step": 94779, "epoch": 564} {"train_loss": -10.010467529296875, "global_step": 94780, "epoch": 564} {"train_loss": -9.650192260742188, "global_step": 94781, "epoch": 564} {"train_loss": -9.295707702636719, "global_step": 94782, "epoch": 564} {"train_loss": -9.600001335144043, "global_step": 94783, "epoch": 564} {"train_loss": -9.757322311401367, "global_step": 94784, "epoch": 564} {"train_loss": -9.542903900146484, "global_step": 94785, "epoch": 564} {"train_loss": -9.553808212280273, "global_step": 94786, "epoch": 564} {"train_loss": -9.826383590698242, "global_step": 94787, "epoch": 564} {"train_loss": -9.512767791748047, "global_step": 94788, "epoch": 564} {"train_loss": -9.743518829345703, "global_step": 94789, "epoch": 564} {"train_loss": -9.518808364868164, "global_step": 94790, "epoch": 564} {"train_loss": -9.51113510131836, "global_step": 94791, "epoch": 564} {"train_loss": -9.511235237121582, "global_step": 94792, "epoch": 564} {"train_loss": -9.093746185302734, "global_step": 94793, "epoch": 564} {"train_loss": -9.189155578613281, "global_step": 94794, "epoch": 564} {"train_loss": -9.487011909484863, "global_step": 94795, "epoch": 564} {"train_loss": -9.31010627746582, "global_step": 94796, "epoch": 564} {"train_loss": -9.41169548034668, "global_step": 94797, "epoch": 564} {"train_loss": -9.52070140838623, "global_step": 94798, "epoch": 564} {"train_loss": -9.045333862304688, "global_step": 94799, "epoch": 564} {"train_loss": -9.496432304382324, "global_step": 94800, "epoch": 564} {"train_loss": -9.503686904907227, "global_step": 94801, "epoch": 564} {"train_loss": -9.350340843200684, "global_step": 94802, "epoch": 564} {"train_loss": -9.562028884887695, "global_step": 94803, "epoch": 564} {"train_loss": -9.377344131469727, "global_step": 94804, "epoch": 564} {"train_loss": -9.613445281982422, "global_step": 94805, "epoch": 564} {"train_loss": -9.453428268432617, "global_step": 94806, "epoch": 564} {"train_loss": -9.391395568847656, "global_step": 94807, "epoch": 564} {"train_loss": -9.429301261901855, "global_step": 94808, "epoch": 564} {"train_loss": -9.595855712890625, "global_step": 94809, "epoch": 564} {"train_loss": -9.391510963439941, "global_step": 94810, "epoch": 564} {"train_loss": -9.33299446105957, "global_step": 94811, "epoch": 564} {"train_loss": -9.365484237670898, "global_step": 94812, "epoch": 564} {"train_loss": -9.344268798828125, "global_step": 94813, "epoch": 564} {"train_loss": -9.57236385345459, "global_step": 94814, "epoch": 564} {"train_loss": -9.528295516967773, "global_step": 94815, "epoch": 564} {"train_loss": -9.486444473266602, "global_step": 94816, "epoch": 564} {"train_loss": -9.215597152709961, "global_step": 94817, "epoch": 564} {"train_loss": -9.54098129272461, "global_step": 94818, "epoch": 564} {"train_loss": -9.552539825439453, "global_step": 94819, "epoch": 564} {"train_loss": -9.617879867553711, "global_step": 94820, "epoch": 564} {"train_loss": -9.454647064208984, "global_step": 94821, "epoch": 564} {"train_loss": -9.716971397399902, "global_step": 94822, "epoch": 564} {"train_loss": -9.626070022583008, "global_step": 94823, "epoch": 564} {"train_loss": -9.78585433959961, "global_step": 94824, "epoch": 564} {"train_loss": -9.70271110534668, "global_step": 94825, "epoch": 564} {"train_loss": -9.81118106842041, "global_step": 94826, "epoch": 564} {"train_loss": -9.84597396850586, "global_step": 94827, "epoch": 564} {"train_loss": -9.585195541381836, "global_step": 94828, "epoch": 564} {"train_loss": -9.692658424377441, "global_step": 94829, "epoch": 564} {"train_loss": -9.487655639648438, "global_step": 94830, "epoch": 564} {"train_loss": -9.709354400634766, "global_step": 94831, "epoch": 564} {"train_loss": -9.718835830688477, "global_step": 94832, "epoch": 564} {"train_loss": -9.587135314941406, "global_step": 94833, "epoch": 564} {"train_loss": -9.953031539916992, "global_step": 94834, "epoch": 564} {"train_loss": -9.684755325317383, "global_step": 94835, "epoch": 564} {"train_loss": -9.644701957702637, "global_step": 94836, "epoch": 564} {"train_loss": -9.523515701293945, "global_step": 94837, "epoch": 564} {"train_loss": -9.701323509216309, "global_step": 94838, "epoch": 564} {"train_loss": -9.795496940612793, "global_step": 94839, "epoch": 564} {"train_loss": -9.723235130310059, "global_step": 94840, "epoch": 564} {"train_loss": -9.868330955505371, "global_step": 94841, "epoch": 564} {"train_loss": -9.594758033752441, "global_step": 94842, "epoch": 564} {"train_loss": -9.601351737976074, "global_step": 94843, "epoch": 564} {"train_loss": -9.329065322875977, "global_step": 94844, "epoch": 564} {"train_loss": -8.91126537322998, "global_step": 94845, "epoch": 564} {"train_loss": -9.437965393066406, "global_step": 94846, "epoch": 564} {"train_loss": -9.4381685256958, "global_step": 94847, "epoch": 564} {"train_loss": -9.560054779052734, "global_step": 94848, "epoch": 564} {"train_loss": -9.352943420410156, "global_step": 94849, "epoch": 564} {"train_loss": -9.530317306518555, "global_step": 94850, "epoch": 564} {"train_loss": -9.335201263427734, "global_step": 94851, "epoch": 564} {"train_loss": -9.596412658691406, "global_step": 94852, "epoch": 564} {"train_loss": -9.665557861328125, "global_step": 94853, "epoch": 564} {"train_loss": -9.610929489135742, "global_step": 94854, "epoch": 564} {"train_loss": -9.521371841430664, "global_step": 94855, "epoch": 564} {"train_loss": -9.303232192993164, "global_step": 94856, "epoch": 564} {"train_loss": -9.424495697021484, "global_step": 94857, "epoch": 564} {"train_loss": -9.105416297912598, "global_step": 94858, "epoch": 564} {"train_loss": -9.573080062866211, "global_step": 94859, "epoch": 564} {"train_loss": -9.270336151123047, "global_step": 94860, "epoch": 564} {"train_loss": -9.489486694335938, "global_step": 94861, "epoch": 564} {"train_loss": -9.557106018066406, "global_step": 94862, "epoch": 564} {"train_loss": -9.59298324584961, "global_step": 94863, "epoch": 564} {"train_loss": -9.518442153930664, "global_step": 94864, "epoch": 564} {"train_loss": -9.129314422607422, "global_step": 94865, "epoch": 564} {"train_loss": -9.673770904541016, "global_step": 94866, "epoch": 564} {"train_loss": -9.363068580627441, "global_step": 94867, "epoch": 564} {"train_loss": -9.39120864868164, "global_step": 94868, "epoch": 564} {"train_loss": -9.47140884399414, "global_step": 94869, "epoch": 564} {"train_loss": -9.462165832519531, "global_step": 94870, "epoch": 564} {"train_loss": -9.240296363830566, "global_step": 94871, "epoch": 564} {"train_loss": -9.52491569519043, "global_step": 94872, "epoch": 564} {"train_loss": -9.583799362182617, "global_step": 94873, "epoch": 564} {"train_loss": -9.391081809997559, "global_step": 94874, "epoch": 564} {"train_loss": -9.708215713500977, "global_step": 94875, "epoch": 564} {"train_loss": -9.183563232421875, "global_step": 94876, "epoch": 564} {"train_loss": -9.693267822265625, "global_step": 94877, "epoch": 564} {"train_loss": -9.548212051391602, "global_step": 94878, "epoch": 564} {"train_loss": -9.50248908996582, "global_step": 94879, "epoch": 564} {"train_loss": -9.557239532470703, "global_step": 94880, "epoch": 564} {"train_loss": -9.584860801696777, "global_step": 94881, "epoch": 564} {"train_loss": -9.663375854492188, "global_step": 94882, "epoch": 564} {"train_loss": -9.405561447143555, "global_step": 94883, "epoch": 564} {"train_loss": -9.74323844909668, "global_step": 94884, "epoch": 564} {"train_loss": -9.594991683959961, "global_step": 94885, "epoch": 564} {"train_loss": -9.57939338684082, "global_step": 94886, "epoch": 564} {"train_loss": -9.667356491088867, "global_step": 94887, "epoch": 564} {"train_loss": -9.760822296142578, "global_step": 94888, "epoch": 564} {"train_loss": -9.547760009765625, "global_step": 94889, "epoch": 564} {"train_loss": -9.779823303222656, "global_step": 94890, "epoch": 564} {"train_loss": -9.766095161437988, "global_step": 94891, "epoch": 564} {"train_loss": -9.645727157592773, "global_step": 94892, "epoch": 564} {"train_loss": -9.618858337402344, "global_step": 94893, "epoch": 564} {"train_loss": -9.728282928466797, "global_step": 94894, "epoch": 564} {"train_loss": -9.623677253723145, "global_step": 94895, "epoch": 564} {"train_loss": -9.68355941772461, "global_step": 94896, "epoch": 564} {"train_loss": -9.896533966064453, "global_step": 94897, "epoch": 564} {"train_loss": -9.798900604248047, "global_step": 94898, "epoch": 564} {"train_loss": -9.610671043395996, "global_step": 94899, "epoch": 564} {"train_loss": -9.576482772827148, "global_step": 94900, "epoch": 564} {"train_loss": -9.574496269226074, "global_step": 94901, "epoch": 564} {"train_loss": -9.418686866760254, "global_step": 94902, "epoch": 564} {"train_loss": -9.619951248168945, "global_step": 94903, "epoch": 564} {"train_loss": -9.628608703613281, "global_step": 94904, "epoch": 564} {"train_loss": -9.371002197265625, "global_step": 94905, "epoch": 564} {"train_loss": -9.772041320800781, "global_step": 94906, "epoch": 564} {"train_loss": -9.648870468139648, "global_step": 94907, "epoch": 564} {"train_loss": -9.492494583129883, "global_step": 94908, "epoch": 564} {"train_loss": -9.583208084106445, "global_step": 94909, "epoch": 564} {"train_loss": -9.734489440917969, "global_step": 94910, "epoch": 564} {"train_loss": -9.540781021118164, "global_step": 94911, "epoch": 564} {"train_loss": -9.497188568115234, "global_step": 94912, "epoch": 564} {"train_loss": -9.494745254516602, "global_step": 94913, "epoch": 564} {"train_loss": -9.600732803344727, "global_step": 94914, "epoch": 564} {"train_loss": -9.500995635986328, "global_step": 94915, "epoch": 564} {"train_loss": -9.628870010375977, "global_step": 94916, "epoch": 564} {"train_loss": -9.493169784545898, "global_step": 94917, "epoch": 564} {"train_loss": -9.359349250793457, "global_step": 94918, "epoch": 564} {"train_loss": -9.559436139606294, "global_step": 94919, "epoch": 564, "val_loss": 202738.125} {"train_loss": -9.12769889831543, "global_step": 94920, "epoch": 565} {"train_loss": -9.458322525024414, "global_step": 94921, "epoch": 565} {"train_loss": -9.098690032958984, "global_step": 94922, "epoch": 565} {"train_loss": -8.813837051391602, "global_step": 94923, "epoch": 565} {"train_loss": -9.31105899810791, "global_step": 94924, "epoch": 565} {"train_loss": -9.05809211730957, "global_step": 94925, "epoch": 565} {"train_loss": -9.416231155395508, "global_step": 94926, "epoch": 565} {"train_loss": -9.172565460205078, "global_step": 94927, "epoch": 565} {"train_loss": -9.124578475952148, "global_step": 94928, "epoch": 565} {"train_loss": -9.261136054992676, "global_step": 94929, "epoch": 565} {"train_loss": -9.10024356842041, "global_step": 94930, "epoch": 565} {"train_loss": -9.214720726013184, "global_step": 94931, "epoch": 565} {"train_loss": -9.180883407592773, "global_step": 94932, "epoch": 565} {"train_loss": -9.374787330627441, "global_step": 94933, "epoch": 565} {"train_loss": -9.305195808410645, "global_step": 94934, "epoch": 565} {"train_loss": -9.296365737915039, "global_step": 94935, "epoch": 565} {"train_loss": -9.422386169433594, "global_step": 94936, "epoch": 565} {"train_loss": -9.53256607055664, "global_step": 94937, "epoch": 565} {"train_loss": -9.361297607421875, "global_step": 94938, "epoch": 565} {"train_loss": -9.534467697143555, "global_step": 94939, "epoch": 565} {"train_loss": -9.422404289245605, "global_step": 94940, "epoch": 565} {"train_loss": -9.43516731262207, "global_step": 94941, "epoch": 565} {"train_loss": -9.48824691772461, "global_step": 94942, "epoch": 565} {"train_loss": -9.436042785644531, "global_step": 94943, "epoch": 565} {"train_loss": -9.575161933898926, "global_step": 94944, "epoch": 565} {"train_loss": -9.446991920471191, "global_step": 94945, "epoch": 565} {"train_loss": -9.569522857666016, "global_step": 94946, "epoch": 565} {"train_loss": -9.65302562713623, "global_step": 94947, "epoch": 565} {"train_loss": -9.386006355285645, "global_step": 94948, "epoch": 565} {"train_loss": -9.2953462600708, "global_step": 94949, "epoch": 565} {"train_loss": -9.15744400024414, "global_step": 94950, "epoch": 565} {"train_loss": -9.52532958984375, "global_step": 94951, "epoch": 565} {"train_loss": -9.618109703063965, "global_step": 94952, "epoch": 565} {"train_loss": -9.439305305480957, "global_step": 94953, "epoch": 565} {"train_loss": -9.153047561645508, "global_step": 94954, "epoch": 565} {"train_loss": -9.679218292236328, "global_step": 94955, "epoch": 565} {"train_loss": -9.372084617614746, "global_step": 94956, "epoch": 565} {"train_loss": -9.24106216430664, "global_step": 94957, "epoch": 565} {"train_loss": -9.068609237670898, "global_step": 94958, "epoch": 565} {"train_loss": -9.329023361206055, "global_step": 94959, "epoch": 565} {"train_loss": -9.11063003540039, "global_step": 94960, "epoch": 565} {"train_loss": -9.438802719116211, "global_step": 94961, "epoch": 565} {"train_loss": -9.441390037536621, "global_step": 94962, "epoch": 565} {"train_loss": -9.074507713317871, "global_step": 94963, "epoch": 565} {"train_loss": -9.18714427947998, "global_step": 94964, "epoch": 565} {"train_loss": -8.929750442504883, "global_step": 94965, "epoch": 565} {"train_loss": -9.552302360534668, "global_step": 94966, "epoch": 565} {"train_loss": -9.305257797241211, "global_step": 94967, "epoch": 565} {"train_loss": -9.157249450683594, "global_step": 94968, "epoch": 565} {"train_loss": -9.182746887207031, "global_step": 94969, "epoch": 565} {"train_loss": -9.250877380371094, "global_step": 94970, "epoch": 565} {"train_loss": -9.167144775390625, "global_step": 94971, "epoch": 565} {"train_loss": -9.19013786315918, "global_step": 94972, "epoch": 565} {"train_loss": -9.587459564208984, "global_step": 94973, "epoch": 565} {"train_loss": -9.573866844177246, "global_step": 94974, "epoch": 565} {"train_loss": -9.533116340637207, "global_step": 94975, "epoch": 565} {"train_loss": -9.483647346496582, "global_step": 94976, "epoch": 565} {"train_loss": -9.357306480407715, "global_step": 94977, "epoch": 565} {"train_loss": -9.703888893127441, "global_step": 94978, "epoch": 565} {"train_loss": -9.588863372802734, "global_step": 94979, "epoch": 565} {"train_loss": -9.588706016540527, "global_step": 94980, "epoch": 565} {"train_loss": -9.705012321472168, "global_step": 94981, "epoch": 565} {"train_loss": -9.600584030151367, "global_step": 94982, "epoch": 565} {"train_loss": -9.671566009521484, "global_step": 94983, "epoch": 565} {"train_loss": -9.830490112304688, "global_step": 94984, "epoch": 565} {"train_loss": -9.661306381225586, "global_step": 94985, "epoch": 565} {"train_loss": -9.89055061340332, "global_step": 94986, "epoch": 565} {"train_loss": -9.565221786499023, "global_step": 94987, "epoch": 565} {"train_loss": -9.846001625061035, "global_step": 94988, "epoch": 565} {"train_loss": -9.56189250946045, "global_step": 94989, "epoch": 565} {"train_loss": -9.910938262939453, "global_step": 94990, "epoch": 565} {"train_loss": -9.758228302001953, "global_step": 94991, "epoch": 565} {"train_loss": -9.633952140808105, "global_step": 94992, "epoch": 565} {"train_loss": -9.611085891723633, "global_step": 94993, "epoch": 565} {"train_loss": -9.863759994506836, "global_step": 94994, "epoch": 565} {"train_loss": -9.275379180908203, "global_step": 94995, "epoch": 565} {"train_loss": -9.422883033752441, "global_step": 94996, "epoch": 565} {"train_loss": -9.853137969970703, "global_step": 94997, "epoch": 565} {"train_loss": -9.62777042388916, "global_step": 94998, "epoch": 565} {"train_loss": -9.2515287399292, "global_step": 94999, "epoch": 565} {"train_loss": -9.392012596130371, "global_step": 95000, "epoch": 565} {"train_loss": -9.525304794311523, "global_step": 95001, "epoch": 565} {"train_loss": -9.486572265625, "global_step": 95002, "epoch": 565} {"train_loss": -9.700410842895508, "global_step": 95003, "epoch": 565} {"train_loss": -9.661822319030762, "global_step": 95004, "epoch": 565} {"train_loss": -9.547439575195312, "global_step": 95005, "epoch": 565} {"train_loss": -9.703999519348145, "global_step": 95006, "epoch": 565} {"train_loss": -9.597846031188965, "global_step": 95007, "epoch": 565} {"train_loss": -9.535564422607422, "global_step": 95008, "epoch": 565} {"train_loss": -9.813018798828125, "global_step": 95009, "epoch": 565} {"train_loss": -9.529607772827148, "global_step": 95010, "epoch": 565} {"train_loss": -9.686144828796387, "global_step": 95011, "epoch": 565} {"train_loss": -9.491479873657227, "global_step": 95012, "epoch": 565} {"train_loss": -9.595829963684082, "global_step": 95013, "epoch": 565} {"train_loss": -9.647978782653809, "global_step": 95014, "epoch": 565} {"train_loss": -9.666614532470703, "global_step": 95015, "epoch": 565} {"train_loss": -9.775075912475586, "global_step": 95016, "epoch": 565} {"train_loss": -9.549759864807129, "global_step": 95017, "epoch": 565} {"train_loss": -9.636075973510742, "global_step": 95018, "epoch": 565} {"train_loss": -9.524310111999512, "global_step": 95019, "epoch": 565} {"train_loss": -9.457202911376953, "global_step": 95020, "epoch": 565} {"train_loss": -9.7008056640625, "global_step": 95021, "epoch": 565} {"train_loss": -9.712244033813477, "global_step": 95022, "epoch": 565} {"train_loss": -9.678104400634766, "global_step": 95023, "epoch": 565} {"train_loss": -9.569499969482422, "global_step": 95024, "epoch": 565} {"train_loss": -9.734569549560547, "global_step": 95025, "epoch": 565} {"train_loss": -9.606128692626953, "global_step": 95026, "epoch": 565} {"train_loss": -9.768440246582031, "global_step": 95027, "epoch": 565} {"train_loss": -9.803730010986328, "global_step": 95028, "epoch": 565} {"train_loss": -9.592000007629395, "global_step": 95029, "epoch": 565} {"train_loss": -9.781681060791016, "global_step": 95030, "epoch": 565} {"train_loss": -9.734493255615234, "global_step": 95031, "epoch": 565} {"train_loss": -9.678439140319824, "global_step": 95032, "epoch": 565} {"train_loss": -9.613506317138672, "global_step": 95033, "epoch": 565} {"train_loss": -9.291464805603027, "global_step": 95034, "epoch": 565} {"train_loss": -9.472480773925781, "global_step": 95035, "epoch": 565} {"train_loss": -9.692744255065918, "global_step": 95036, "epoch": 565} {"train_loss": -9.580617904663086, "global_step": 95037, "epoch": 565} {"train_loss": -9.335658073425293, "global_step": 95038, "epoch": 565} {"train_loss": -9.802638053894043, "global_step": 95039, "epoch": 565} {"train_loss": -9.602048873901367, "global_step": 95040, "epoch": 565} {"train_loss": -9.539852142333984, "global_step": 95041, "epoch": 565} {"train_loss": -9.738870620727539, "global_step": 95042, "epoch": 565} {"train_loss": -9.992668151855469, "global_step": 95043, "epoch": 565} {"train_loss": -9.900602340698242, "global_step": 95044, "epoch": 565} {"train_loss": -9.824552536010742, "global_step": 95045, "epoch": 565} {"train_loss": -9.62597942352295, "global_step": 95046, "epoch": 565} {"train_loss": -9.588890075683594, "global_step": 95047, "epoch": 565} {"train_loss": -9.578750610351562, "global_step": 95048, "epoch": 565} {"train_loss": -9.98938274383545, "global_step": 95049, "epoch": 565} {"train_loss": -9.921976089477539, "global_step": 95050, "epoch": 565} {"train_loss": -9.854232788085938, "global_step": 95051, "epoch": 565} {"train_loss": -9.5592041015625, "global_step": 95052, "epoch": 565} {"train_loss": -9.636098861694336, "global_step": 95053, "epoch": 565} {"train_loss": -9.378746032714844, "global_step": 95054, "epoch": 565} {"train_loss": -9.450300216674805, "global_step": 95055, "epoch": 565} {"train_loss": -9.61644172668457, "global_step": 95056, "epoch": 565} {"train_loss": -9.479385375976562, "global_step": 95057, "epoch": 565} {"train_loss": -9.621548652648926, "global_step": 95058, "epoch": 565} {"train_loss": -9.289412498474121, "global_step": 95059, "epoch": 565} {"train_loss": -9.510828018188477, "global_step": 95060, "epoch": 565} {"train_loss": -9.701255798339844, "global_step": 95061, "epoch": 565} {"train_loss": -9.676855087280273, "global_step": 95062, "epoch": 565} {"train_loss": -9.442625999450684, "global_step": 95063, "epoch": 565} {"train_loss": -9.416584014892578, "global_step": 95064, "epoch": 565} {"train_loss": -9.260699272155762, "global_step": 95065, "epoch": 565} {"train_loss": -9.471637725830078, "global_step": 95066, "epoch": 565} {"train_loss": -9.00961685180664, "global_step": 95067, "epoch": 565} {"train_loss": -9.54180908203125, "global_step": 95068, "epoch": 565} {"train_loss": -8.93690299987793, "global_step": 95069, "epoch": 565} {"train_loss": -9.46035385131836, "global_step": 95070, "epoch": 565} {"train_loss": -9.203649520874023, "global_step": 95071, "epoch": 565} {"train_loss": -9.229673385620117, "global_step": 95072, "epoch": 565} {"train_loss": -9.539647102355957, "global_step": 95073, "epoch": 565} {"train_loss": -9.148294448852539, "global_step": 95074, "epoch": 565} {"train_loss": -9.334627151489258, "global_step": 95075, "epoch": 565} {"train_loss": -9.140480995178223, "global_step": 95076, "epoch": 565} {"train_loss": -9.340648651123047, "global_step": 95077, "epoch": 565} {"train_loss": -9.41926383972168, "global_step": 95078, "epoch": 565} {"train_loss": -9.275632858276367, "global_step": 95079, "epoch": 565} {"train_loss": -9.600555419921875, "global_step": 95080, "epoch": 565} {"train_loss": -9.382383346557617, "global_step": 95081, "epoch": 565} {"train_loss": -9.489276885986328, "global_step": 95082, "epoch": 565} {"train_loss": -9.619425773620605, "global_step": 95083, "epoch": 565} {"train_loss": -9.418188095092773, "global_step": 95084, "epoch": 565} {"train_loss": -9.614168167114258, "global_step": 95085, "epoch": 565} {"train_loss": -9.357540130615234, "global_step": 95086, "epoch": 565} {"train_loss": -9.489219001361302, "global_step": 95087, "epoch": 565, "val_loss": 204633.890625, "train_action_mse_error": 1.7102398872375488} {"train_loss": -9.059982299804688, "global_step": 95088, "epoch": 566} {"train_loss": -9.595911026000977, "global_step": 95089, "epoch": 566} {"train_loss": -9.751249313354492, "global_step": 95090, "epoch": 566} {"train_loss": -9.54892349243164, "global_step": 95091, "epoch": 566} {"train_loss": -9.620047569274902, "global_step": 95092, "epoch": 566} {"train_loss": -9.58457088470459, "global_step": 95093, "epoch": 566} {"train_loss": -9.527994155883789, "global_step": 95094, "epoch": 566} {"train_loss": -9.155057907104492, "global_step": 95095, "epoch": 566} {"train_loss": -9.356966972351074, "global_step": 95096, "epoch": 566} {"train_loss": -9.46580696105957, "global_step": 95097, "epoch": 566} {"train_loss": -9.546518325805664, "global_step": 95098, "epoch": 566} {"train_loss": -9.507389068603516, "global_step": 95099, "epoch": 566} {"train_loss": -9.423375129699707, "global_step": 95100, "epoch": 566} {"train_loss": -9.395431518554688, "global_step": 95101, "epoch": 566} {"train_loss": -9.388677597045898, "global_step": 95102, "epoch": 566} {"train_loss": -9.57598876953125, "global_step": 95103, "epoch": 566} {"train_loss": -9.703546524047852, "global_step": 95104, "epoch": 566} {"train_loss": -9.674555778503418, "global_step": 95105, "epoch": 566} {"train_loss": -9.376896858215332, "global_step": 95106, "epoch": 566} {"train_loss": -9.67314624786377, "global_step": 95107, "epoch": 566} {"train_loss": -9.658077239990234, "global_step": 95108, "epoch": 566} {"train_loss": -9.900432586669922, "global_step": 95109, "epoch": 566} {"train_loss": -9.628154754638672, "global_step": 95110, "epoch": 566} {"train_loss": -9.364770889282227, "global_step": 95111, "epoch": 566} {"train_loss": -9.661467552185059, "global_step": 95112, "epoch": 566} {"train_loss": -9.692853927612305, "global_step": 95113, "epoch": 566} {"train_loss": -9.802766799926758, "global_step": 95114, "epoch": 566} {"train_loss": -9.626285552978516, "global_step": 95115, "epoch": 566} {"train_loss": -9.68116569519043, "global_step": 95116, "epoch": 566} {"train_loss": -9.659189224243164, "global_step": 95117, "epoch": 566} {"train_loss": -9.574633598327637, "global_step": 95118, "epoch": 566} {"train_loss": -9.569912910461426, "global_step": 95119, "epoch": 566} {"train_loss": -9.421987533569336, "global_step": 95120, "epoch": 566} {"train_loss": -9.501479148864746, "global_step": 95121, "epoch": 566} {"train_loss": -9.449847221374512, "global_step": 95122, "epoch": 566} {"train_loss": -9.427909851074219, "global_step": 95123, "epoch": 566} {"train_loss": -9.376029014587402, "global_step": 95124, "epoch": 566} {"train_loss": -9.42640495300293, "global_step": 95125, "epoch": 566} {"train_loss": -9.781744003295898, "global_step": 95126, "epoch": 566} {"train_loss": -9.515509605407715, "global_step": 95127, "epoch": 566} {"train_loss": -9.597538948059082, "global_step": 95128, "epoch": 566} {"train_loss": -9.59426498413086, "global_step": 95129, "epoch": 566} {"train_loss": -8.991533279418945, "global_step": 95130, "epoch": 566} {"train_loss": -9.96426773071289, "global_step": 95131, "epoch": 566} {"train_loss": -9.45506477355957, "global_step": 95132, "epoch": 566} {"train_loss": -9.540119171142578, "global_step": 95133, "epoch": 566} {"train_loss": -9.352110862731934, "global_step": 95134, "epoch": 566} {"train_loss": -9.56965446472168, "global_step": 95135, "epoch": 566} {"train_loss": -9.539802551269531, "global_step": 95136, "epoch": 566} {"train_loss": -9.735292434692383, "global_step": 95137, "epoch": 566} {"train_loss": -9.751692771911621, "global_step": 95138, "epoch": 566} {"train_loss": -9.800117492675781, "global_step": 95139, "epoch": 566} {"train_loss": -9.855730056762695, "global_step": 95140, "epoch": 566} {"train_loss": -9.86361312866211, "global_step": 95141, "epoch": 566} {"train_loss": -9.697864532470703, "global_step": 95142, "epoch": 566} {"train_loss": -9.477859497070312, "global_step": 95143, "epoch": 566} {"train_loss": -9.562536239624023, "global_step": 95144, "epoch": 566} {"train_loss": -9.714960098266602, "global_step": 95145, "epoch": 566} {"train_loss": -9.79826831817627, "global_step": 95146, "epoch": 566} {"train_loss": -9.6621675491333, "global_step": 95147, "epoch": 566} {"train_loss": -9.487377166748047, "global_step": 95148, "epoch": 566} {"train_loss": -9.78516960144043, "global_step": 95149, "epoch": 566} {"train_loss": -9.878271102905273, "global_step": 95150, "epoch": 566} {"train_loss": -9.6083984375, "global_step": 95151, "epoch": 566} {"train_loss": -9.856122970581055, "global_step": 95152, "epoch": 566} {"train_loss": -9.536540031433105, "global_step": 95153, "epoch": 566} {"train_loss": -9.729549407958984, "global_step": 95154, "epoch": 566} {"train_loss": -9.809724807739258, "global_step": 95155, "epoch": 566} {"train_loss": -9.602008819580078, "global_step": 95156, "epoch": 566} {"train_loss": -9.20806884765625, "global_step": 95157, "epoch": 566} {"train_loss": -9.462003707885742, "global_step": 95158, "epoch": 566} {"train_loss": -9.363847732543945, "global_step": 95159, "epoch": 566} {"train_loss": -9.35076904296875, "global_step": 95160, "epoch": 566} {"train_loss": -9.390214920043945, "global_step": 95161, "epoch": 566} {"train_loss": -9.399147033691406, "global_step": 95162, "epoch": 566} {"train_loss": -9.407114028930664, "global_step": 95163, "epoch": 566} {"train_loss": -9.34099292755127, "global_step": 95164, "epoch": 566} {"train_loss": -8.994152069091797, "global_step": 95165, "epoch": 566} {"train_loss": -9.198936462402344, "global_step": 95166, "epoch": 566} {"train_loss": -9.362250328063965, "global_step": 95167, "epoch": 566} {"train_loss": -9.511009216308594, "global_step": 95168, "epoch": 566} {"train_loss": -9.407330513000488, "global_step": 95169, "epoch": 566} {"train_loss": -9.46863842010498, "global_step": 95170, "epoch": 566} {"train_loss": -9.41915512084961, "global_step": 95171, "epoch": 566} {"train_loss": -9.574843406677246, "global_step": 95172, "epoch": 566} {"train_loss": -9.327576637268066, "global_step": 95173, "epoch": 566} {"train_loss": -9.359901428222656, "global_step": 95174, "epoch": 566} {"train_loss": -9.510419845581055, "global_step": 95175, "epoch": 566} {"train_loss": -9.233247756958008, "global_step": 95176, "epoch": 566} {"train_loss": -9.539497375488281, "global_step": 95177, "epoch": 566} {"train_loss": -9.36001205444336, "global_step": 95178, "epoch": 566} {"train_loss": -9.618724822998047, "global_step": 95179, "epoch": 566} {"train_loss": -9.298503875732422, "global_step": 95180, "epoch": 566} {"train_loss": -9.574357986450195, "global_step": 95181, "epoch": 566} {"train_loss": -9.378765106201172, "global_step": 95182, "epoch": 566} {"train_loss": -9.384467124938965, "global_step": 95183, "epoch": 566} {"train_loss": -9.685291290283203, "global_step": 95184, "epoch": 566} {"train_loss": -9.525354385375977, "global_step": 95185, "epoch": 566} {"train_loss": -9.454909324645996, "global_step": 95186, "epoch": 566} {"train_loss": -9.670175552368164, "global_step": 95187, "epoch": 566} {"train_loss": -9.30984878540039, "global_step": 95188, "epoch": 566} {"train_loss": -9.703962326049805, "global_step": 95189, "epoch": 566} {"train_loss": -9.511343955993652, "global_step": 95190, "epoch": 566} {"train_loss": -9.33000659942627, "global_step": 95191, "epoch": 566} {"train_loss": -9.720081329345703, "global_step": 95192, "epoch": 566} {"train_loss": -9.241630554199219, "global_step": 95193, "epoch": 566} {"train_loss": -9.119382858276367, "global_step": 95194, "epoch": 566} {"train_loss": -9.343788146972656, "global_step": 95195, "epoch": 566} {"train_loss": -8.991738319396973, "global_step": 95196, "epoch": 566} {"train_loss": -9.625200271606445, "global_step": 95197, "epoch": 566} {"train_loss": -9.122552871704102, "global_step": 95198, "epoch": 566} {"train_loss": -9.458870887756348, "global_step": 95199, "epoch": 566} {"train_loss": -9.20781135559082, "global_step": 95200, "epoch": 566} {"train_loss": -9.118106842041016, "global_step": 95201, "epoch": 566} {"train_loss": -8.29046630859375, "global_step": 95202, "epoch": 566} {"train_loss": -9.20568561553955, "global_step": 95203, "epoch": 566} {"train_loss": -9.200382232666016, "global_step": 95204, "epoch": 566} {"train_loss": -8.942039489746094, "global_step": 95205, "epoch": 566} {"train_loss": -8.80501651763916, "global_step": 95206, "epoch": 566} {"train_loss": -8.839969635009766, "global_step": 95207, "epoch": 566} {"train_loss": -8.675697326660156, "global_step": 95208, "epoch": 566} {"train_loss": -8.912843704223633, "global_step": 95209, "epoch": 566} {"train_loss": -9.09524917602539, "global_step": 95210, "epoch": 566} {"train_loss": -9.336864471435547, "global_step": 95211, "epoch": 566} {"train_loss": -8.798752784729004, "global_step": 95212, "epoch": 566} {"train_loss": -9.247958183288574, "global_step": 95213, "epoch": 566} {"train_loss": -9.221641540527344, "global_step": 95214, "epoch": 566} {"train_loss": -9.239002227783203, "global_step": 95215, "epoch": 566} {"train_loss": -9.325946807861328, "global_step": 95216, "epoch": 566} {"train_loss": -9.433710098266602, "global_step": 95217, "epoch": 566} {"train_loss": -9.392414093017578, "global_step": 95218, "epoch": 566} {"train_loss": -9.290620803833008, "global_step": 95219, "epoch": 566} {"train_loss": -9.572993278503418, "global_step": 95220, "epoch": 566} {"train_loss": -9.399785041809082, "global_step": 95221, "epoch": 566} {"train_loss": -9.350419998168945, "global_step": 95222, "epoch": 566} {"train_loss": -9.370044708251953, "global_step": 95223, "epoch": 566} {"train_loss": -9.416329383850098, "global_step": 95224, "epoch": 566} {"train_loss": -9.432985305786133, "global_step": 95225, "epoch": 566} {"train_loss": -9.518868446350098, "global_step": 95226, "epoch": 566} {"train_loss": -9.398584365844727, "global_step": 95227, "epoch": 566} {"train_loss": -9.374746322631836, "global_step": 95228, "epoch": 566} {"train_loss": -9.44059944152832, "global_step": 95229, "epoch": 566} {"train_loss": -9.68899917602539, "global_step": 95230, "epoch": 566} {"train_loss": -9.826001167297363, "global_step": 95231, "epoch": 566} {"train_loss": -9.483760833740234, "global_step": 95232, "epoch": 566} {"train_loss": -9.755792617797852, "global_step": 95233, "epoch": 566} {"train_loss": -9.772930145263672, "global_step": 95234, "epoch": 566} {"train_loss": -9.429957389831543, "global_step": 95235, "epoch": 566} {"train_loss": -9.721230506896973, "global_step": 95236, "epoch": 566} {"train_loss": -9.774834632873535, "global_step": 95237, "epoch": 566} {"train_loss": -9.551714897155762, "global_step": 95238, "epoch": 566} {"train_loss": -9.790258407592773, "global_step": 95239, "epoch": 566} {"train_loss": -9.608406066894531, "global_step": 95240, "epoch": 566} {"train_loss": -9.672816276550293, "global_step": 95241, "epoch": 566} {"train_loss": -9.808158874511719, "global_step": 95242, "epoch": 566} {"train_loss": -9.692808151245117, "global_step": 95243, "epoch": 566} {"train_loss": -9.509666442871094, "global_step": 95244, "epoch": 566} {"train_loss": -9.8095064163208, "global_step": 95245, "epoch": 566} {"train_loss": -9.787059783935547, "global_step": 95246, "epoch": 566} {"train_loss": -9.640405654907227, "global_step": 95247, "epoch": 566} {"train_loss": -9.88180923461914, "global_step": 95248, "epoch": 566} {"train_loss": -9.377192497253418, "global_step": 95249, "epoch": 566} {"train_loss": -9.100399017333984, "global_step": 95250, "epoch": 566} {"train_loss": -9.612345695495605, "global_step": 95251, "epoch": 566} {"train_loss": -9.6384916305542, "global_step": 95252, "epoch": 566} {"train_loss": -9.432918548583984, "global_step": 95253, "epoch": 566} {"train_loss": -9.71590805053711, "global_step": 95254, "epoch": 566} {"train_loss": -9.478440500441051, "global_step": 95255, "epoch": 566, "val_loss": 205413.171875} {"train_loss": -9.294390678405762, "global_step": 95256, "epoch": 567} {"train_loss": -9.42393684387207, "global_step": 95257, "epoch": 567} {"train_loss": -9.530797958374023, "global_step": 95258, "epoch": 567} {"train_loss": -9.076509475708008, "global_step": 95259, "epoch": 567} {"train_loss": -9.215873718261719, "global_step": 95260, "epoch": 567} {"train_loss": -9.558175086975098, "global_step": 95261, "epoch": 567} {"train_loss": -9.220704078674316, "global_step": 95262, "epoch": 567} {"train_loss": -9.18259048461914, "global_step": 95263, "epoch": 567} {"train_loss": -9.386017799377441, "global_step": 95264, "epoch": 567} {"train_loss": -9.072492599487305, "global_step": 95265, "epoch": 567} {"train_loss": -9.463729858398438, "global_step": 95266, "epoch": 567} {"train_loss": -9.210129737854004, "global_step": 95267, "epoch": 567} {"train_loss": -9.41723918914795, "global_step": 95268, "epoch": 567} {"train_loss": -9.234450340270996, "global_step": 95269, "epoch": 567} {"train_loss": -9.005451202392578, "global_step": 95270, "epoch": 567} {"train_loss": -9.317046165466309, "global_step": 95271, "epoch": 567} {"train_loss": -9.209444999694824, "global_step": 95272, "epoch": 567} {"train_loss": -9.344793319702148, "global_step": 95273, "epoch": 567} {"train_loss": -9.210135459899902, "global_step": 95274, "epoch": 567} {"train_loss": -9.416485786437988, "global_step": 95275, "epoch": 567} {"train_loss": -9.342729568481445, "global_step": 95276, "epoch": 567} {"train_loss": -9.302739143371582, "global_step": 95277, "epoch": 567} {"train_loss": -9.153402328491211, "global_step": 95278, "epoch": 567} {"train_loss": -9.434649467468262, "global_step": 95279, "epoch": 567} {"train_loss": -9.398442268371582, "global_step": 95280, "epoch": 567} {"train_loss": -9.25019645690918, "global_step": 95281, "epoch": 567} {"train_loss": -9.489702224731445, "global_step": 95282, "epoch": 567} {"train_loss": -9.618450164794922, "global_step": 95283, "epoch": 567} {"train_loss": -9.611213684082031, "global_step": 95284, "epoch": 567} {"train_loss": -9.51620101928711, "global_step": 95285, "epoch": 567} {"train_loss": -9.275447845458984, "global_step": 95286, "epoch": 567} {"train_loss": -9.555870056152344, "global_step": 95287, "epoch": 567} {"train_loss": -9.680391311645508, "global_step": 95288, "epoch": 567} {"train_loss": -9.585147857666016, "global_step": 95289, "epoch": 567} {"train_loss": -9.767223358154297, "global_step": 95290, "epoch": 567} {"train_loss": -9.599453926086426, "global_step": 95291, "epoch": 567} {"train_loss": -9.667652130126953, "global_step": 95292, "epoch": 567} {"train_loss": -9.525148391723633, "global_step": 95293, "epoch": 567} {"train_loss": -9.859477996826172, "global_step": 95294, "epoch": 567} {"train_loss": -9.862283706665039, "global_step": 95295, "epoch": 567} {"train_loss": -9.62405014038086, "global_step": 95296, "epoch": 567} {"train_loss": -9.666271209716797, "global_step": 95297, "epoch": 567} {"train_loss": -9.645500183105469, "global_step": 95298, "epoch": 567} {"train_loss": -9.58267879486084, "global_step": 95299, "epoch": 567} {"train_loss": -9.687856674194336, "global_step": 95300, "epoch": 567} {"train_loss": -9.314916610717773, "global_step": 95301, "epoch": 567} {"train_loss": -9.623111724853516, "global_step": 95302, "epoch": 567} {"train_loss": -9.534409523010254, "global_step": 95303, "epoch": 567} {"train_loss": -9.519943237304688, "global_step": 95304, "epoch": 567} {"train_loss": -9.526811599731445, "global_step": 95305, "epoch": 567} {"train_loss": -9.65912914276123, "global_step": 95306, "epoch": 567} {"train_loss": -9.783990859985352, "global_step": 95307, "epoch": 567} {"train_loss": -9.494994163513184, "global_step": 95308, "epoch": 567} {"train_loss": -9.480833053588867, "global_step": 95309, "epoch": 567} {"train_loss": -9.274087905883789, "global_step": 95310, "epoch": 567} {"train_loss": -9.636526107788086, "global_step": 95311, "epoch": 567} {"train_loss": -9.685203552246094, "global_step": 95312, "epoch": 567} {"train_loss": -9.419036865234375, "global_step": 95313, "epoch": 567} {"train_loss": -9.540051460266113, "global_step": 95314, "epoch": 567} {"train_loss": -9.45964241027832, "global_step": 95315, "epoch": 567} {"train_loss": -9.397079467773438, "global_step": 95316, "epoch": 567} {"train_loss": -9.644632339477539, "global_step": 95317, "epoch": 567} {"train_loss": -9.652173042297363, "global_step": 95318, "epoch": 567} {"train_loss": -9.347140312194824, "global_step": 95319, "epoch": 567} {"train_loss": -9.298198699951172, "global_step": 95320, "epoch": 567} {"train_loss": -9.402837753295898, "global_step": 95321, "epoch": 567} {"train_loss": -9.424910545349121, "global_step": 95322, "epoch": 567} {"train_loss": -9.518218994140625, "global_step": 95323, "epoch": 567} {"train_loss": -9.49851131439209, "global_step": 95324, "epoch": 567} {"train_loss": -9.618204116821289, "global_step": 95325, "epoch": 567} {"train_loss": -9.357468605041504, "global_step": 95326, "epoch": 567} {"train_loss": -9.628807067871094, "global_step": 95327, "epoch": 567} {"train_loss": -9.342843055725098, "global_step": 95328, "epoch": 567} {"train_loss": -9.611072540283203, "global_step": 95329, "epoch": 567} {"train_loss": -9.48493766784668, "global_step": 95330, "epoch": 567} {"train_loss": -9.711642265319824, "global_step": 95331, "epoch": 567} {"train_loss": -9.601814270019531, "global_step": 95332, "epoch": 567} {"train_loss": -9.55301570892334, "global_step": 95333, "epoch": 567} {"train_loss": -9.708772659301758, "global_step": 95334, "epoch": 567} {"train_loss": -9.573478698730469, "global_step": 95335, "epoch": 567} {"train_loss": -9.561530113220215, "global_step": 95336, "epoch": 567} {"train_loss": -9.745542526245117, "global_step": 95337, "epoch": 567} {"train_loss": -9.730040550231934, "global_step": 95338, "epoch": 567} {"train_loss": -9.784072875976562, "global_step": 95339, "epoch": 567} {"train_loss": -9.281960487365723, "global_step": 95340, "epoch": 567} {"train_loss": -9.038562774658203, "global_step": 95341, "epoch": 567} {"train_loss": -9.300397872924805, "global_step": 95342, "epoch": 567} {"train_loss": -8.80014419555664, "global_step": 95343, "epoch": 567} {"train_loss": -9.661382675170898, "global_step": 95344, "epoch": 567} {"train_loss": -9.146638870239258, "global_step": 95345, "epoch": 567} {"train_loss": -9.160086631774902, "global_step": 95346, "epoch": 567} {"train_loss": -9.509332656860352, "global_step": 95347, "epoch": 567} {"train_loss": -9.501947402954102, "global_step": 95348, "epoch": 567} {"train_loss": -9.129630088806152, "global_step": 95349, "epoch": 567} {"train_loss": -9.414828300476074, "global_step": 95350, "epoch": 567} {"train_loss": -9.444544792175293, "global_step": 95351, "epoch": 567} {"train_loss": -9.369174003601074, "global_step": 95352, "epoch": 567} {"train_loss": -9.375248908996582, "global_step": 95353, "epoch": 567} {"train_loss": -9.427539825439453, "global_step": 95354, "epoch": 567} {"train_loss": -9.527015686035156, "global_step": 95355, "epoch": 567} {"train_loss": -9.759952545166016, "global_step": 95356, "epoch": 567} {"train_loss": -9.66596508026123, "global_step": 95357, "epoch": 567} {"train_loss": -9.634069442749023, "global_step": 95358, "epoch": 567} {"train_loss": -9.521627426147461, "global_step": 95359, "epoch": 567} {"train_loss": -9.591816902160645, "global_step": 95360, "epoch": 567} {"train_loss": -9.641729354858398, "global_step": 95361, "epoch": 567} {"train_loss": -9.330416679382324, "global_step": 95362, "epoch": 567} {"train_loss": -9.610968589782715, "global_step": 95363, "epoch": 567} {"train_loss": -9.73149585723877, "global_step": 95364, "epoch": 567} {"train_loss": -9.7177734375, "global_step": 95365, "epoch": 567} {"train_loss": -9.63669204711914, "global_step": 95366, "epoch": 567} {"train_loss": -9.514143943786621, "global_step": 95367, "epoch": 567} {"train_loss": -9.612716674804688, "global_step": 95368, "epoch": 567} {"train_loss": -9.548498153686523, "global_step": 95369, "epoch": 567} {"train_loss": -9.842848777770996, "global_step": 95370, "epoch": 567} {"train_loss": -9.684903144836426, "global_step": 95371, "epoch": 567} {"train_loss": -9.697760581970215, "global_step": 95372, "epoch": 567} {"train_loss": -9.753215789794922, "global_step": 95373, "epoch": 567} {"train_loss": -9.377362251281738, "global_step": 95374, "epoch": 567} {"train_loss": -9.663679122924805, "global_step": 95375, "epoch": 567} {"train_loss": -9.738504409790039, "global_step": 95376, "epoch": 567} {"train_loss": -9.781314849853516, "global_step": 95377, "epoch": 567} {"train_loss": -9.73244857788086, "global_step": 95378, "epoch": 567} {"train_loss": -9.780385971069336, "global_step": 95379, "epoch": 567} {"train_loss": -9.608530044555664, "global_step": 95380, "epoch": 567} {"train_loss": -9.660079956054688, "global_step": 95381, "epoch": 567} {"train_loss": -9.811063766479492, "global_step": 95382, "epoch": 567} {"train_loss": -9.582655906677246, "global_step": 95383, "epoch": 567} {"train_loss": -9.506346702575684, "global_step": 95384, "epoch": 567} {"train_loss": -9.607470512390137, "global_step": 95385, "epoch": 567} {"train_loss": -9.678169250488281, "global_step": 95386, "epoch": 567} {"train_loss": -9.78033447265625, "global_step": 95387, "epoch": 567} {"train_loss": -9.691460609436035, "global_step": 95388, "epoch": 567} {"train_loss": -9.689103126525879, "global_step": 95389, "epoch": 567} {"train_loss": -9.455339431762695, "global_step": 95390, "epoch": 567} {"train_loss": -9.45334243774414, "global_step": 95391, "epoch": 567} {"train_loss": -9.761630058288574, "global_step": 95392, "epoch": 567} {"train_loss": -9.524866104125977, "global_step": 95393, "epoch": 567} {"train_loss": -9.661654472351074, "global_step": 95394, "epoch": 567} {"train_loss": -9.525981903076172, "global_step": 95395, "epoch": 567} {"train_loss": -9.817535400390625, "global_step": 95396, "epoch": 567} {"train_loss": -9.429876327514648, "global_step": 95397, "epoch": 567} {"train_loss": -8.970352172851562, "global_step": 95398, "epoch": 567} {"train_loss": -9.501909255981445, "global_step": 95399, "epoch": 567} {"train_loss": -9.372053146362305, "global_step": 95400, "epoch": 567} {"train_loss": -9.359476089477539, "global_step": 95401, "epoch": 567} {"train_loss": -9.345261573791504, "global_step": 95402, "epoch": 567} {"train_loss": -9.115942001342773, "global_step": 95403, "epoch": 567} {"train_loss": -9.241358757019043, "global_step": 95404, "epoch": 567} {"train_loss": -9.290895462036133, "global_step": 95405, "epoch": 567} {"train_loss": -9.351395606994629, "global_step": 95406, "epoch": 567} {"train_loss": -9.305402755737305, "global_step": 95407, "epoch": 567} {"train_loss": -9.359759330749512, "global_step": 95408, "epoch": 567} {"train_loss": -9.344243049621582, "global_step": 95409, "epoch": 567} {"train_loss": -9.36136531829834, "global_step": 95410, "epoch": 567} {"train_loss": -9.313335418701172, "global_step": 95411, "epoch": 567} {"train_loss": -9.665059089660645, "global_step": 95412, "epoch": 567} {"train_loss": -9.03408432006836, "global_step": 95413, "epoch": 567} {"train_loss": -9.541254043579102, "global_step": 95414, "epoch": 567} {"train_loss": -9.061049461364746, "global_step": 95415, "epoch": 567} {"train_loss": -9.22269058227539, "global_step": 95416, "epoch": 567} {"train_loss": -9.274847984313965, "global_step": 95417, "epoch": 567} {"train_loss": -9.314898490905762, "global_step": 95418, "epoch": 567} {"train_loss": -9.173765182495117, "global_step": 95419, "epoch": 567} {"train_loss": -9.142165184020996, "global_step": 95420, "epoch": 567} {"train_loss": -9.45988655090332, "global_step": 95421, "epoch": 567} {"train_loss": -9.320087432861328, "global_step": 95422, "epoch": 567} {"train_loss": -9.47883371512095, "global_step": 95423, "epoch": 567, "val_loss": 204592.1875} {"train_loss": -9.553722381591797, "global_step": 95424, "epoch": 568} {"train_loss": -9.429868698120117, "global_step": 95425, "epoch": 568} {"train_loss": -9.380718231201172, "global_step": 95426, "epoch": 568} {"train_loss": -9.493162155151367, "global_step": 95427, "epoch": 568} {"train_loss": -9.409285545349121, "global_step": 95428, "epoch": 568} {"train_loss": -9.460359573364258, "global_step": 95429, "epoch": 568} {"train_loss": -9.56924819946289, "global_step": 95430, "epoch": 568} {"train_loss": -9.545469284057617, "global_step": 95431, "epoch": 568} {"train_loss": -9.440908432006836, "global_step": 95432, "epoch": 568} {"train_loss": -9.490049362182617, "global_step": 95433, "epoch": 568} {"train_loss": -9.441411018371582, "global_step": 95434, "epoch": 568} {"train_loss": -9.403694152832031, "global_step": 95435, "epoch": 568} {"train_loss": -9.373454093933105, "global_step": 95436, "epoch": 568} {"train_loss": -9.525700569152832, "global_step": 95437, "epoch": 568} {"train_loss": -9.471480369567871, "global_step": 95438, "epoch": 568} {"train_loss": -9.318592071533203, "global_step": 95439, "epoch": 568} {"train_loss": -9.341489791870117, "global_step": 95440, "epoch": 568} {"train_loss": -9.466084480285645, "global_step": 95441, "epoch": 568} {"train_loss": -9.42926025390625, "global_step": 95442, "epoch": 568} {"train_loss": -9.581350326538086, "global_step": 95443, "epoch": 568} {"train_loss": -9.690956115722656, "global_step": 95444, "epoch": 568} {"train_loss": -9.447917938232422, "global_step": 95445, "epoch": 568} {"train_loss": -9.703664779663086, "global_step": 95446, "epoch": 568} {"train_loss": -9.442752838134766, "global_step": 95447, "epoch": 568} {"train_loss": -9.407215118408203, "global_step": 95448, "epoch": 568} {"train_loss": -9.77705192565918, "global_step": 95449, "epoch": 568} {"train_loss": -9.384993553161621, "global_step": 95450, "epoch": 568} {"train_loss": -9.284566879272461, "global_step": 95451, "epoch": 568} {"train_loss": -9.731931686401367, "global_step": 95452, "epoch": 568} {"train_loss": -9.574600219726562, "global_step": 95453, "epoch": 568} {"train_loss": -9.570096969604492, "global_step": 95454, "epoch": 568} {"train_loss": -9.533402442932129, "global_step": 95455, "epoch": 568} {"train_loss": -9.523158073425293, "global_step": 95456, "epoch": 568} {"train_loss": -9.498894691467285, "global_step": 95457, "epoch": 568} {"train_loss": -9.35208797454834, "global_step": 95458, "epoch": 568} {"train_loss": -9.689709663391113, "global_step": 95459, "epoch": 568} {"train_loss": -9.337905883789062, "global_step": 95460, "epoch": 568} {"train_loss": -9.62160873413086, "global_step": 95461, "epoch": 568} {"train_loss": -9.114853858947754, "global_step": 95462, "epoch": 568} {"train_loss": -9.524055480957031, "global_step": 95463, "epoch": 568} {"train_loss": -9.45042610168457, "global_step": 95464, "epoch": 568} {"train_loss": -9.48764705657959, "global_step": 95465, "epoch": 568} {"train_loss": -9.787042617797852, "global_step": 95466, "epoch": 568} {"train_loss": -9.52420425415039, "global_step": 95467, "epoch": 568} {"train_loss": -9.566521644592285, "global_step": 95468, "epoch": 568} {"train_loss": -9.326863288879395, "global_step": 95469, "epoch": 568} {"train_loss": -9.699514389038086, "global_step": 95470, "epoch": 568} {"train_loss": -9.502535820007324, "global_step": 95471, "epoch": 568} {"train_loss": -9.537965774536133, "global_step": 95472, "epoch": 568} {"train_loss": -9.458698272705078, "global_step": 95473, "epoch": 568} {"train_loss": -9.722658157348633, "global_step": 95474, "epoch": 568} {"train_loss": -9.09366226196289, "global_step": 95475, "epoch": 568} {"train_loss": -9.706567764282227, "global_step": 95476, "epoch": 568} {"train_loss": -9.644979476928711, "global_step": 95477, "epoch": 568} {"train_loss": -9.301427841186523, "global_step": 95478, "epoch": 568} {"train_loss": -9.802891731262207, "global_step": 95479, "epoch": 568} {"train_loss": -9.622690200805664, "global_step": 95480, "epoch": 568} {"train_loss": -9.865398406982422, "global_step": 95481, "epoch": 568} {"train_loss": -9.47396469116211, "global_step": 95482, "epoch": 568} {"train_loss": -9.508508682250977, "global_step": 95483, "epoch": 568} {"train_loss": -9.552933692932129, "global_step": 95484, "epoch": 568} {"train_loss": -9.677567481994629, "global_step": 95485, "epoch": 568} {"train_loss": -9.366384506225586, "global_step": 95486, "epoch": 568} {"train_loss": -9.375019073486328, "global_step": 95487, "epoch": 568} {"train_loss": -9.834056854248047, "global_step": 95488, "epoch": 568} {"train_loss": -8.973405838012695, "global_step": 95489, "epoch": 568} {"train_loss": -9.65245246887207, "global_step": 95490, "epoch": 568} {"train_loss": -9.310702323913574, "global_step": 95491, "epoch": 568} {"train_loss": -9.594982147216797, "global_step": 95492, "epoch": 568} {"train_loss": -9.225528717041016, "global_step": 95493, "epoch": 568} {"train_loss": -9.293407440185547, "global_step": 95494, "epoch": 568} {"train_loss": -9.575254440307617, "global_step": 95495, "epoch": 568} {"train_loss": -9.240957260131836, "global_step": 95496, "epoch": 568} {"train_loss": -9.585933685302734, "global_step": 95497, "epoch": 568} {"train_loss": -9.721342086791992, "global_step": 95498, "epoch": 568} {"train_loss": -9.60047721862793, "global_step": 95499, "epoch": 568} {"train_loss": -9.494382858276367, "global_step": 95500, "epoch": 568} {"train_loss": -9.776283264160156, "global_step": 95501, "epoch": 568} {"train_loss": -9.734208106994629, "global_step": 95502, "epoch": 568} {"train_loss": -9.381340980529785, "global_step": 95503, "epoch": 568} {"train_loss": -9.640531539916992, "global_step": 95504, "epoch": 568} {"train_loss": -9.722105979919434, "global_step": 95505, "epoch": 568} {"train_loss": -9.544347763061523, "global_step": 95506, "epoch": 568} {"train_loss": -9.62493896484375, "global_step": 95507, "epoch": 568} {"train_loss": -9.734855651855469, "global_step": 95508, "epoch": 568} {"train_loss": -9.744293212890625, "global_step": 95509, "epoch": 568} {"train_loss": -9.661396026611328, "global_step": 95510, "epoch": 568} {"train_loss": -9.468811988830566, "global_step": 95511, "epoch": 568} {"train_loss": -9.551190376281738, "global_step": 95512, "epoch": 568} {"train_loss": -9.577522277832031, "global_step": 95513, "epoch": 568} {"train_loss": -9.688392639160156, "global_step": 95514, "epoch": 568} {"train_loss": -9.523748397827148, "global_step": 95515, "epoch": 568} {"train_loss": -9.696404457092285, "global_step": 95516, "epoch": 568} {"train_loss": -9.635822296142578, "global_step": 95517, "epoch": 568} {"train_loss": -9.653643608093262, "global_step": 95518, "epoch": 568} {"train_loss": -9.838329315185547, "global_step": 95519, "epoch": 568} {"train_loss": -9.645957946777344, "global_step": 95520, "epoch": 568} {"train_loss": -9.609285354614258, "global_step": 95521, "epoch": 568} {"train_loss": -9.750411987304688, "global_step": 95522, "epoch": 568} {"train_loss": -9.666069030761719, "global_step": 95523, "epoch": 568} {"train_loss": -9.82780647277832, "global_step": 95524, "epoch": 568} {"train_loss": -9.51284408569336, "global_step": 95525, "epoch": 568} {"train_loss": -9.866918563842773, "global_step": 95526, "epoch": 568} {"train_loss": -9.48878002166748, "global_step": 95527, "epoch": 568} {"train_loss": -9.51800537109375, "global_step": 95528, "epoch": 568} {"train_loss": -9.854536056518555, "global_step": 95529, "epoch": 568} {"train_loss": -9.762216567993164, "global_step": 95530, "epoch": 568} {"train_loss": -9.662590026855469, "global_step": 95531, "epoch": 568} {"train_loss": -9.446944236755371, "global_step": 95532, "epoch": 568} {"train_loss": -9.574419021606445, "global_step": 95533, "epoch": 568} {"train_loss": -9.103109359741211, "global_step": 95534, "epoch": 568} {"train_loss": -9.750425338745117, "global_step": 95535, "epoch": 568} {"train_loss": -9.35638427734375, "global_step": 95536, "epoch": 568} {"train_loss": -8.979490280151367, "global_step": 95537, "epoch": 568} {"train_loss": -9.331270217895508, "global_step": 95538, "epoch": 568} {"train_loss": -9.500341415405273, "global_step": 95539, "epoch": 568} {"train_loss": -9.479893684387207, "global_step": 95540, "epoch": 568} {"train_loss": -9.766145706176758, "global_step": 95541, "epoch": 568} {"train_loss": -9.151419639587402, "global_step": 95542, "epoch": 568} {"train_loss": -9.282312393188477, "global_step": 95543, "epoch": 568} {"train_loss": -9.503036499023438, "global_step": 95544, "epoch": 568} {"train_loss": -9.08380126953125, "global_step": 95545, "epoch": 568} {"train_loss": -9.539897918701172, "global_step": 95546, "epoch": 568} {"train_loss": -9.191733360290527, "global_step": 95547, "epoch": 568} {"train_loss": -9.38162899017334, "global_step": 95548, "epoch": 568} {"train_loss": -9.051689147949219, "global_step": 95549, "epoch": 568} {"train_loss": -9.254054069519043, "global_step": 95550, "epoch": 568} {"train_loss": -9.143354415893555, "global_step": 95551, "epoch": 568} {"train_loss": -9.757156372070312, "global_step": 95552, "epoch": 568} {"train_loss": -9.460564613342285, "global_step": 95553, "epoch": 568} {"train_loss": -9.643295288085938, "global_step": 95554, "epoch": 568} {"train_loss": -9.537484169006348, "global_step": 95555, "epoch": 568} {"train_loss": -9.762954711914062, "global_step": 95556, "epoch": 568} {"train_loss": -9.717671394348145, "global_step": 95557, "epoch": 568} {"train_loss": -9.699974060058594, "global_step": 95558, "epoch": 568} {"train_loss": -9.648934364318848, "global_step": 95559, "epoch": 568} {"train_loss": -9.893455505371094, "global_step": 95560, "epoch": 568} {"train_loss": -9.650535583496094, "global_step": 95561, "epoch": 568} {"train_loss": -9.833938598632812, "global_step": 95562, "epoch": 568} {"train_loss": -9.358760833740234, "global_step": 95563, "epoch": 568} {"train_loss": -9.580124855041504, "global_step": 95564, "epoch": 568} {"train_loss": -9.526714324951172, "global_step": 95565, "epoch": 568} {"train_loss": -9.680181503295898, "global_step": 95566, "epoch": 568} {"train_loss": -9.804947853088379, "global_step": 95567, "epoch": 568} {"train_loss": -9.569469451904297, "global_step": 95568, "epoch": 568} {"train_loss": -9.657842636108398, "global_step": 95569, "epoch": 568} {"train_loss": -9.52800178527832, "global_step": 95570, "epoch": 568} {"train_loss": -9.265558242797852, "global_step": 95571, "epoch": 568} {"train_loss": -9.731239318847656, "global_step": 95572, "epoch": 568} {"train_loss": -9.468356132507324, "global_step": 95573, "epoch": 568} {"train_loss": -9.50732421875, "global_step": 95574, "epoch": 568} {"train_loss": -9.627155303955078, "global_step": 95575, "epoch": 568} {"train_loss": -9.545722961425781, "global_step": 95576, "epoch": 568} {"train_loss": -9.447118759155273, "global_step": 95577, "epoch": 568} {"train_loss": -9.555473327636719, "global_step": 95578, "epoch": 568} {"train_loss": -9.403030395507812, "global_step": 95579, "epoch": 568} {"train_loss": -9.908475875854492, "global_step": 95580, "epoch": 568} {"train_loss": -9.526081085205078, "global_step": 95581, "epoch": 568} {"train_loss": -9.595848083496094, "global_step": 95582, "epoch": 568} {"train_loss": -9.427573204040527, "global_step": 95583, "epoch": 568} {"train_loss": -9.41359806060791, "global_step": 95584, "epoch": 568} {"train_loss": -9.5021333694458, "global_step": 95585, "epoch": 568} {"train_loss": -9.509565353393555, "global_step": 95586, "epoch": 568} {"train_loss": -9.728675842285156, "global_step": 95587, "epoch": 568} {"train_loss": -9.625926971435547, "global_step": 95588, "epoch": 568} {"train_loss": -9.805349349975586, "global_step": 95589, "epoch": 568} {"train_loss": -9.564591407775879, "global_step": 95590, "epoch": 568} {"train_loss": -9.533320302054996, "global_step": 95591, "epoch": 568, "val_loss": 205276.46875} {"train_loss": -9.499311447143555, "global_step": 95592, "epoch": 569} {"train_loss": -9.38784122467041, "global_step": 95593, "epoch": 569} {"train_loss": -9.290899276733398, "global_step": 95594, "epoch": 569} {"train_loss": -9.395393371582031, "global_step": 95595, "epoch": 569} {"train_loss": -9.607856750488281, "global_step": 95596, "epoch": 569} {"train_loss": -9.585247039794922, "global_step": 95597, "epoch": 569} {"train_loss": -9.129541397094727, "global_step": 95598, "epoch": 569} {"train_loss": -9.353623390197754, "global_step": 95599, "epoch": 569} {"train_loss": -9.335678100585938, "global_step": 95600, "epoch": 569} {"train_loss": -9.535745620727539, "global_step": 95601, "epoch": 569} {"train_loss": -9.228240966796875, "global_step": 95602, "epoch": 569} {"train_loss": -9.262027740478516, "global_step": 95603, "epoch": 569} {"train_loss": -9.534843444824219, "global_step": 95604, "epoch": 569} {"train_loss": -9.386263847351074, "global_step": 95605, "epoch": 569} {"train_loss": -9.213854789733887, "global_step": 95606, "epoch": 569} {"train_loss": -9.671483039855957, "global_step": 95607, "epoch": 569} {"train_loss": -9.381089210510254, "global_step": 95608, "epoch": 569} {"train_loss": -9.715855598449707, "global_step": 95609, "epoch": 569} {"train_loss": -9.678149223327637, "global_step": 95610, "epoch": 569} {"train_loss": -9.323012351989746, "global_step": 95611, "epoch": 569} {"train_loss": -9.527167320251465, "global_step": 95612, "epoch": 569} {"train_loss": -9.643136978149414, "global_step": 95613, "epoch": 569} {"train_loss": -9.683271408081055, "global_step": 95614, "epoch": 569} {"train_loss": -9.548360824584961, "global_step": 95615, "epoch": 569} {"train_loss": -9.374608993530273, "global_step": 95616, "epoch": 569} {"train_loss": -9.742727279663086, "global_step": 95617, "epoch": 569} {"train_loss": -9.596463203430176, "global_step": 95618, "epoch": 569} {"train_loss": -9.467733383178711, "global_step": 95619, "epoch": 569} {"train_loss": -9.633941650390625, "global_step": 95620, "epoch": 569} {"train_loss": -9.478809356689453, "global_step": 95621, "epoch": 569} {"train_loss": -9.136638641357422, "global_step": 95622, "epoch": 569} {"train_loss": -9.753747940063477, "global_step": 95623, "epoch": 569} {"train_loss": -9.281865119934082, "global_step": 95624, "epoch": 569} {"train_loss": -9.305496215820312, "global_step": 95625, "epoch": 569} {"train_loss": -9.118485450744629, "global_step": 95626, "epoch": 569} {"train_loss": -9.835994720458984, "global_step": 95627, "epoch": 569} {"train_loss": -9.487091064453125, "global_step": 95628, "epoch": 569} {"train_loss": -9.805778503417969, "global_step": 95629, "epoch": 569} {"train_loss": -9.743871688842773, "global_step": 95630, "epoch": 569} {"train_loss": -9.703851699829102, "global_step": 95631, "epoch": 569} {"train_loss": -9.519573211669922, "global_step": 95632, "epoch": 569} {"train_loss": -9.40341854095459, "global_step": 95633, "epoch": 569} {"train_loss": -10.03885269165039, "global_step": 95634, "epoch": 569} {"train_loss": -9.623260498046875, "global_step": 95635, "epoch": 569} {"train_loss": -9.842195510864258, "global_step": 95636, "epoch": 569} {"train_loss": -9.67542839050293, "global_step": 95637, "epoch": 569} {"train_loss": -9.663778305053711, "global_step": 95638, "epoch": 569} {"train_loss": -9.659418106079102, "global_step": 95639, "epoch": 569} {"train_loss": -9.713276863098145, "global_step": 95640, "epoch": 569} {"train_loss": -9.463356018066406, "global_step": 95641, "epoch": 569} {"train_loss": -9.506775856018066, "global_step": 95642, "epoch": 569} {"train_loss": -9.755470275878906, "global_step": 95643, "epoch": 569} {"train_loss": -9.752445220947266, "global_step": 95644, "epoch": 569} {"train_loss": -9.794486999511719, "global_step": 95645, "epoch": 569} {"train_loss": -9.393056869506836, "global_step": 95646, "epoch": 569} {"train_loss": -9.726533889770508, "global_step": 95647, "epoch": 569} {"train_loss": -9.658119201660156, "global_step": 95648, "epoch": 569} {"train_loss": -9.502620697021484, "global_step": 95649, "epoch": 569} {"train_loss": -9.666927337646484, "global_step": 95650, "epoch": 569} {"train_loss": -9.615165710449219, "global_step": 95651, "epoch": 569} {"train_loss": -9.802399635314941, "global_step": 95652, "epoch": 569} {"train_loss": -9.536582946777344, "global_step": 95653, "epoch": 569} {"train_loss": -9.59384536743164, "global_step": 95654, "epoch": 569} {"train_loss": -9.267230987548828, "global_step": 95655, "epoch": 569} {"train_loss": -9.76203727722168, "global_step": 95656, "epoch": 569} {"train_loss": -9.189249038696289, "global_step": 95657, "epoch": 569} {"train_loss": -9.769018173217773, "global_step": 95658, "epoch": 569} {"train_loss": -9.648538589477539, "global_step": 95659, "epoch": 569} {"train_loss": -9.443359375, "global_step": 95660, "epoch": 569} {"train_loss": -9.626103401184082, "global_step": 95661, "epoch": 569} {"train_loss": -9.413010597229004, "global_step": 95662, "epoch": 569} {"train_loss": -9.596601486206055, "global_step": 95663, "epoch": 569} {"train_loss": -9.37705135345459, "global_step": 95664, "epoch": 569} {"train_loss": -9.438148498535156, "global_step": 95665, "epoch": 569} {"train_loss": -9.534614562988281, "global_step": 95666, "epoch": 569} {"train_loss": -9.758465766906738, "global_step": 95667, "epoch": 569} {"train_loss": -9.625764846801758, "global_step": 95668, "epoch": 569} {"train_loss": -9.578160285949707, "global_step": 95669, "epoch": 569} {"train_loss": -9.483524322509766, "global_step": 95670, "epoch": 569} {"train_loss": -9.431087493896484, "global_step": 95671, "epoch": 569} {"train_loss": -9.091032028198242, "global_step": 95672, "epoch": 569} {"train_loss": -9.578902244567871, "global_step": 95673, "epoch": 569} {"train_loss": -9.216814994812012, "global_step": 95674, "epoch": 569} {"train_loss": -9.4581937789917, "global_step": 95675, "epoch": 569} {"train_loss": -9.450657844543457, "global_step": 95676, "epoch": 569} {"train_loss": -9.169319152832031, "global_step": 95677, "epoch": 569} {"train_loss": -9.590795516967773, "global_step": 95678, "epoch": 569} {"train_loss": -9.43539810180664, "global_step": 95679, "epoch": 569} {"train_loss": -9.485635757446289, "global_step": 95680, "epoch": 569} {"train_loss": -9.393983840942383, "global_step": 95681, "epoch": 569} {"train_loss": -9.236438751220703, "global_step": 95682, "epoch": 569} {"train_loss": -9.536407470703125, "global_step": 95683, "epoch": 569} {"train_loss": -9.29585075378418, "global_step": 95684, "epoch": 569} {"train_loss": -9.52379035949707, "global_step": 95685, "epoch": 569} {"train_loss": -9.097824096679688, "global_step": 95686, "epoch": 569} {"train_loss": -9.663989067077637, "global_step": 95687, "epoch": 569} {"train_loss": -9.142227172851562, "global_step": 95688, "epoch": 569} {"train_loss": -9.7500581741333, "global_step": 95689, "epoch": 569} {"train_loss": -9.225221633911133, "global_step": 95690, "epoch": 569} {"train_loss": -9.617618560791016, "global_step": 95691, "epoch": 569} {"train_loss": -9.320964813232422, "global_step": 95692, "epoch": 569} {"train_loss": -9.600690841674805, "global_step": 95693, "epoch": 569} {"train_loss": -9.486700057983398, "global_step": 95694, "epoch": 569} {"train_loss": -9.500109672546387, "global_step": 95695, "epoch": 569} {"train_loss": -9.8587007522583, "global_step": 95696, "epoch": 569} {"train_loss": -9.479036331176758, "global_step": 95697, "epoch": 569} {"train_loss": -9.646750450134277, "global_step": 95698, "epoch": 569} {"train_loss": -9.633977890014648, "global_step": 95699, "epoch": 569} {"train_loss": -9.627742767333984, "global_step": 95700, "epoch": 569} {"train_loss": -9.675260543823242, "global_step": 95701, "epoch": 569} {"train_loss": -9.626296043395996, "global_step": 95702, "epoch": 569} {"train_loss": -9.682380676269531, "global_step": 95703, "epoch": 569} {"train_loss": -9.36048698425293, "global_step": 95704, "epoch": 569} {"train_loss": -9.420520782470703, "global_step": 95705, "epoch": 569} {"train_loss": -9.382484436035156, "global_step": 95706, "epoch": 569} {"train_loss": -9.852145195007324, "global_step": 95707, "epoch": 569} {"train_loss": -9.417657852172852, "global_step": 95708, "epoch": 569} {"train_loss": -9.587236404418945, "global_step": 95709, "epoch": 569} {"train_loss": -9.623649597167969, "global_step": 95710, "epoch": 569} {"train_loss": -9.821807861328125, "global_step": 95711, "epoch": 569} {"train_loss": -9.860511779785156, "global_step": 95712, "epoch": 569} {"train_loss": -9.566391944885254, "global_step": 95713, "epoch": 569} {"train_loss": -9.747920989990234, "global_step": 95714, "epoch": 569} {"train_loss": -9.707786560058594, "global_step": 95715, "epoch": 569} {"train_loss": -9.321561813354492, "global_step": 95716, "epoch": 569} {"train_loss": -9.568490982055664, "global_step": 95717, "epoch": 569} {"train_loss": -9.531135559082031, "global_step": 95718, "epoch": 569} {"train_loss": -9.614141464233398, "global_step": 95719, "epoch": 569} {"train_loss": -9.74770736694336, "global_step": 95720, "epoch": 569} {"train_loss": -9.75285530090332, "global_step": 95721, "epoch": 569} {"train_loss": -9.738943099975586, "global_step": 95722, "epoch": 569} {"train_loss": -9.773879051208496, "global_step": 95723, "epoch": 569} {"train_loss": -9.749411582946777, "global_step": 95724, "epoch": 569} {"train_loss": -9.674996376037598, "global_step": 95725, "epoch": 569} {"train_loss": -9.790031433105469, "global_step": 95726, "epoch": 569} {"train_loss": -9.445489883422852, "global_step": 95727, "epoch": 569} {"train_loss": -9.785652160644531, "global_step": 95728, "epoch": 569} {"train_loss": -9.089665412902832, "global_step": 95729, "epoch": 569} {"train_loss": -9.317808151245117, "global_step": 95730, "epoch": 569} {"train_loss": -9.614602088928223, "global_step": 95731, "epoch": 569} {"train_loss": -9.083107948303223, "global_step": 95732, "epoch": 569} {"train_loss": -9.543144226074219, "global_step": 95733, "epoch": 569} {"train_loss": -9.222541809082031, "global_step": 95734, "epoch": 569} {"train_loss": -9.397981643676758, "global_step": 95735, "epoch": 569} {"train_loss": -9.579379081726074, "global_step": 95736, "epoch": 569} {"train_loss": -9.499788284301758, "global_step": 95737, "epoch": 569} {"train_loss": -9.59558391571045, "global_step": 95738, "epoch": 569} {"train_loss": -9.76065444946289, "global_step": 95739, "epoch": 569} {"train_loss": -9.742254257202148, "global_step": 95740, "epoch": 569} {"train_loss": -9.770315170288086, "global_step": 95741, "epoch": 569} {"train_loss": -9.696967124938965, "global_step": 95742, "epoch": 569} {"train_loss": -9.655423164367676, "global_step": 95743, "epoch": 569} {"train_loss": -9.346452713012695, "global_step": 95744, "epoch": 569} {"train_loss": -9.600257873535156, "global_step": 95745, "epoch": 569} {"train_loss": -9.906326293945312, "global_step": 95746, "epoch": 569} {"train_loss": -9.553960800170898, "global_step": 95747, "epoch": 569} {"train_loss": -9.700159072875977, "global_step": 95748, "epoch": 569} {"train_loss": -9.506037712097168, "global_step": 95749, "epoch": 569} {"train_loss": -9.57255744934082, "global_step": 95750, "epoch": 569} {"train_loss": -9.267642974853516, "global_step": 95751, "epoch": 569} {"train_loss": -9.534399032592773, "global_step": 95752, "epoch": 569} {"train_loss": -9.151721954345703, "global_step": 95753, "epoch": 569} {"train_loss": -9.578573226928711, "global_step": 95754, "epoch": 569} {"train_loss": -9.170928955078125, "global_step": 95755, "epoch": 569} {"train_loss": -9.588773727416992, "global_step": 95756, "epoch": 569} {"train_loss": -9.413147926330566, "global_step": 95757, "epoch": 569} {"train_loss": -9.567142486572266, "global_step": 95758, "epoch": 569} {"train_loss": -9.532144336473374, "global_step": 95759, "epoch": 569, "val_loss": 205305.796875} {"train_loss": -9.142328262329102, "global_step": 95760, "epoch": 570} {"train_loss": -9.300333976745605, "global_step": 95761, "epoch": 570} {"train_loss": -9.366591453552246, "global_step": 95762, "epoch": 570} {"train_loss": -9.301950454711914, "global_step": 95763, "epoch": 570} {"train_loss": -9.54461669921875, "global_step": 95764, "epoch": 570} {"train_loss": -9.422531127929688, "global_step": 95765, "epoch": 570} {"train_loss": -9.421723365783691, "global_step": 95766, "epoch": 570} {"train_loss": -9.514497756958008, "global_step": 95767, "epoch": 570} {"train_loss": -9.234399795532227, "global_step": 95768, "epoch": 570} {"train_loss": -9.395999908447266, "global_step": 95769, "epoch": 570} {"train_loss": -9.518135070800781, "global_step": 95770, "epoch": 570} {"train_loss": -9.355512619018555, "global_step": 95771, "epoch": 570} {"train_loss": -9.480924606323242, "global_step": 95772, "epoch": 570} {"train_loss": -9.457204818725586, "global_step": 95773, "epoch": 570} {"train_loss": -9.427350997924805, "global_step": 95774, "epoch": 570} {"train_loss": -9.514899253845215, "global_step": 95775, "epoch": 570} {"train_loss": -9.501550674438477, "global_step": 95776, "epoch": 570} {"train_loss": -9.47637939453125, "global_step": 95777, "epoch": 570} {"train_loss": -9.421319007873535, "global_step": 95778, "epoch": 570} {"train_loss": -9.361186027526855, "global_step": 95779, "epoch": 570} {"train_loss": -9.682382583618164, "global_step": 95780, "epoch": 570} {"train_loss": -9.587477684020996, "global_step": 95781, "epoch": 570} {"train_loss": -9.728271484375, "global_step": 95782, "epoch": 570} {"train_loss": -9.616888046264648, "global_step": 95783, "epoch": 570} {"train_loss": -9.456808090209961, "global_step": 95784, "epoch": 570} {"train_loss": -9.595863342285156, "global_step": 95785, "epoch": 570} {"train_loss": -9.765440940856934, "global_step": 95786, "epoch": 570} {"train_loss": -9.625015258789062, "global_step": 95787, "epoch": 570} {"train_loss": -9.462873458862305, "global_step": 95788, "epoch": 570} {"train_loss": -9.740924835205078, "global_step": 95789, "epoch": 570} {"train_loss": -9.480391502380371, "global_step": 95790, "epoch": 570} {"train_loss": -9.614126205444336, "global_step": 95791, "epoch": 570} {"train_loss": -9.80559253692627, "global_step": 95792, "epoch": 570} {"train_loss": -9.677069664001465, "global_step": 95793, "epoch": 570} {"train_loss": -9.7747802734375, "global_step": 95794, "epoch": 570} {"train_loss": -9.630406379699707, "global_step": 95795, "epoch": 570} {"train_loss": -9.737207412719727, "global_step": 95796, "epoch": 570} {"train_loss": -9.626826286315918, "global_step": 95797, "epoch": 570} {"train_loss": -9.68239974975586, "global_step": 95798, "epoch": 570} {"train_loss": -9.576532363891602, "global_step": 95799, "epoch": 570} {"train_loss": -9.657424926757812, "global_step": 95800, "epoch": 570} {"train_loss": -9.694686889648438, "global_step": 95801, "epoch": 570} {"train_loss": -9.55151081085205, "global_step": 95802, "epoch": 570} {"train_loss": -9.90279769897461, "global_step": 95803, "epoch": 570} {"train_loss": -9.598907470703125, "global_step": 95804, "epoch": 570} {"train_loss": -9.1227445602417, "global_step": 95805, "epoch": 570} {"train_loss": -9.432674407958984, "global_step": 95806, "epoch": 570} {"train_loss": -9.366071701049805, "global_step": 95807, "epoch": 570} {"train_loss": -9.433101654052734, "global_step": 95808, "epoch": 570} {"train_loss": -9.485815048217773, "global_step": 95809, "epoch": 570} {"train_loss": -9.629806518554688, "global_step": 95810, "epoch": 570} {"train_loss": -9.036470413208008, "global_step": 95811, "epoch": 570} {"train_loss": -9.485260009765625, "global_step": 95812, "epoch": 570} {"train_loss": -9.357194900512695, "global_step": 95813, "epoch": 570} {"train_loss": -9.54486083984375, "global_step": 95814, "epoch": 570} {"train_loss": -9.324782371520996, "global_step": 95815, "epoch": 570} {"train_loss": -9.782630920410156, "global_step": 95816, "epoch": 570} {"train_loss": -9.675873756408691, "global_step": 95817, "epoch": 570} {"train_loss": -9.749536514282227, "global_step": 95818, "epoch": 570} {"train_loss": -9.721861839294434, "global_step": 95819, "epoch": 570} {"train_loss": -9.612173080444336, "global_step": 95820, "epoch": 570} {"train_loss": -9.774561882019043, "global_step": 95821, "epoch": 570} {"train_loss": -9.395211219787598, "global_step": 95822, "epoch": 570} {"train_loss": -9.335840225219727, "global_step": 95823, "epoch": 570} {"train_loss": -9.727346420288086, "global_step": 95824, "epoch": 570} {"train_loss": -9.621294021606445, "global_step": 95825, "epoch": 570} {"train_loss": -9.864335060119629, "global_step": 95826, "epoch": 570} {"train_loss": -9.415304183959961, "global_step": 95827, "epoch": 570} {"train_loss": -9.469877243041992, "global_step": 95828, "epoch": 570} {"train_loss": -9.662260055541992, "global_step": 95829, "epoch": 570} {"train_loss": -9.863517761230469, "global_step": 95830, "epoch": 570} {"train_loss": -9.65633773803711, "global_step": 95831, "epoch": 570} {"train_loss": -9.84333324432373, "global_step": 95832, "epoch": 570} {"train_loss": -9.802011489868164, "global_step": 95833, "epoch": 570} {"train_loss": -9.768845558166504, "global_step": 95834, "epoch": 570} {"train_loss": -9.889851570129395, "global_step": 95835, "epoch": 570} {"train_loss": -9.767601013183594, "global_step": 95836, "epoch": 570} {"train_loss": -9.85632038116455, "global_step": 95837, "epoch": 570} {"train_loss": -9.54340934753418, "global_step": 95838, "epoch": 570} {"train_loss": -9.642030715942383, "global_step": 95839, "epoch": 570} {"train_loss": -9.42535400390625, "global_step": 95840, "epoch": 570} {"train_loss": -9.668450355529785, "global_step": 95841, "epoch": 570} {"train_loss": -9.740571975708008, "global_step": 95842, "epoch": 570} {"train_loss": -9.623054504394531, "global_step": 95843, "epoch": 570} {"train_loss": -9.582585334777832, "global_step": 95844, "epoch": 570} {"train_loss": -9.9837064743042, "global_step": 95845, "epoch": 570} {"train_loss": -9.745741844177246, "global_step": 95846, "epoch": 570} {"train_loss": -9.732354164123535, "global_step": 95847, "epoch": 570} {"train_loss": -9.586959838867188, "global_step": 95848, "epoch": 570} {"train_loss": -9.89684009552002, "global_step": 95849, "epoch": 570} {"train_loss": -9.522603988647461, "global_step": 95850, "epoch": 570} {"train_loss": -10.104692459106445, "global_step": 95851, "epoch": 570} {"train_loss": -9.686920166015625, "global_step": 95852, "epoch": 570} {"train_loss": -9.769742012023926, "global_step": 95853, "epoch": 570} {"train_loss": -9.635625839233398, "global_step": 95854, "epoch": 570} {"train_loss": -9.623222351074219, "global_step": 95855, "epoch": 570} {"train_loss": -9.472230911254883, "global_step": 95856, "epoch": 570} {"train_loss": -9.685700416564941, "global_step": 95857, "epoch": 570} {"train_loss": -8.99946403503418, "global_step": 95858, "epoch": 570} {"train_loss": -9.498786926269531, "global_step": 95859, "epoch": 570} {"train_loss": -8.83697509765625, "global_step": 95860, "epoch": 570} {"train_loss": -9.190570831298828, "global_step": 95861, "epoch": 570} {"train_loss": -8.948182106018066, "global_step": 95862, "epoch": 570} {"train_loss": -9.384685516357422, "global_step": 95863, "epoch": 570} {"train_loss": -9.170215606689453, "global_step": 95864, "epoch": 570} {"train_loss": -9.271310806274414, "global_step": 95865, "epoch": 570} {"train_loss": -9.106581687927246, "global_step": 95866, "epoch": 570} {"train_loss": -9.220712661743164, "global_step": 95867, "epoch": 570} {"train_loss": -8.927379608154297, "global_step": 95868, "epoch": 570} {"train_loss": -9.322534561157227, "global_step": 95869, "epoch": 570} {"train_loss": -9.29511833190918, "global_step": 95870, "epoch": 570} {"train_loss": -9.0077543258667, "global_step": 95871, "epoch": 570} {"train_loss": -9.321327209472656, "global_step": 95872, "epoch": 570} {"train_loss": -9.147224426269531, "global_step": 95873, "epoch": 570} {"train_loss": -9.41142749786377, "global_step": 95874, "epoch": 570} {"train_loss": -9.33669662475586, "global_step": 95875, "epoch": 570} {"train_loss": -9.36977767944336, "global_step": 95876, "epoch": 570} {"train_loss": -9.488668441772461, "global_step": 95877, "epoch": 570} {"train_loss": -9.319656372070312, "global_step": 95878, "epoch": 570} {"train_loss": -9.233541488647461, "global_step": 95879, "epoch": 570} {"train_loss": -9.284420013427734, "global_step": 95880, "epoch": 570} {"train_loss": -9.554113388061523, "global_step": 95881, "epoch": 570} {"train_loss": -9.647869110107422, "global_step": 95882, "epoch": 570} {"train_loss": -9.57368278503418, "global_step": 95883, "epoch": 570} {"train_loss": -9.685336112976074, "global_step": 95884, "epoch": 570} {"train_loss": -9.676332473754883, "global_step": 95885, "epoch": 570} {"train_loss": -9.76789665222168, "global_step": 95886, "epoch": 570} {"train_loss": -9.6827974319458, "global_step": 95887, "epoch": 570} {"train_loss": -9.634114265441895, "global_step": 95888, "epoch": 570} {"train_loss": -9.771097183227539, "global_step": 95889, "epoch": 570} {"train_loss": -9.770184516906738, "global_step": 95890, "epoch": 570} {"train_loss": -9.773454666137695, "global_step": 95891, "epoch": 570} {"train_loss": -9.87740707397461, "global_step": 95892, "epoch": 570} {"train_loss": -9.806111335754395, "global_step": 95893, "epoch": 570} {"train_loss": -9.650259971618652, "global_step": 95894, "epoch": 570} {"train_loss": -9.83951187133789, "global_step": 95895, "epoch": 570} {"train_loss": -9.484796524047852, "global_step": 95896, "epoch": 570} {"train_loss": -9.845304489135742, "global_step": 95897, "epoch": 570} {"train_loss": -9.383255004882812, "global_step": 95898, "epoch": 570} {"train_loss": -9.822896957397461, "global_step": 95899, "epoch": 570} {"train_loss": -9.30789566040039, "global_step": 95900, "epoch": 570} {"train_loss": -9.274614334106445, "global_step": 95901, "epoch": 570} {"train_loss": -9.486845016479492, "global_step": 95902, "epoch": 570} {"train_loss": -9.300352096557617, "global_step": 95903, "epoch": 570} {"train_loss": -9.26839828491211, "global_step": 95904, "epoch": 570} {"train_loss": -9.659263610839844, "global_step": 95905, "epoch": 570} {"train_loss": -9.246219635009766, "global_step": 95906, "epoch": 570} {"train_loss": -9.79256820678711, "global_step": 95907, "epoch": 570} {"train_loss": -9.275054931640625, "global_step": 95908, "epoch": 570} {"train_loss": -9.690218925476074, "global_step": 95909, "epoch": 570} {"train_loss": -9.479454040527344, "global_step": 95910, "epoch": 570} {"train_loss": -9.702113151550293, "global_step": 95911, "epoch": 570} {"train_loss": -9.48143482208252, "global_step": 95912, "epoch": 570} {"train_loss": -9.437356948852539, "global_step": 95913, "epoch": 570} {"train_loss": -9.33114242553711, "global_step": 95914, "epoch": 570} {"train_loss": -9.427755355834961, "global_step": 95915, "epoch": 570} {"train_loss": -9.30308723449707, "global_step": 95916, "epoch": 570} {"train_loss": -9.560051918029785, "global_step": 95917, "epoch": 570} {"train_loss": -9.556413650512695, "global_step": 95918, "epoch": 570} {"train_loss": -9.332489013671875, "global_step": 95919, "epoch": 570} {"train_loss": -9.509359359741211, "global_step": 95920, "epoch": 570} {"train_loss": -9.584799766540527, "global_step": 95921, "epoch": 570} {"train_loss": -9.733678817749023, "global_step": 95922, "epoch": 570} {"train_loss": -9.699398040771484, "global_step": 95923, "epoch": 570} {"train_loss": -9.504694938659668, "global_step": 95924, "epoch": 570} {"train_loss": -9.64463996887207, "global_step": 95925, "epoch": 570} {"train_loss": -9.72181224822998, "global_step": 95926, "epoch": 570} {"train_loss": -9.53577819324675, "global_step": 95927, "epoch": 570, "val_loss": 203512.15625, "train_action_mse_error": 4.148360252380371} {"train_loss": -9.647689819335938, "global_step": 95928, "epoch": 571} {"train_loss": -9.765853881835938, "global_step": 95929, "epoch": 571} {"train_loss": -9.75509262084961, "global_step": 95930, "epoch": 571} {"train_loss": -9.750279426574707, "global_step": 95931, "epoch": 571} {"train_loss": -9.552618026733398, "global_step": 95932, "epoch": 571} {"train_loss": -9.421934127807617, "global_step": 95933, "epoch": 571} {"train_loss": -9.424922943115234, "global_step": 95934, "epoch": 571} {"train_loss": -9.629629135131836, "global_step": 95935, "epoch": 571} {"train_loss": -9.151520729064941, "global_step": 95936, "epoch": 571} {"train_loss": -9.813440322875977, "global_step": 95937, "epoch": 571} {"train_loss": -9.532381057739258, "global_step": 95938, "epoch": 571} {"train_loss": -9.46571159362793, "global_step": 95939, "epoch": 571} {"train_loss": -9.20820426940918, "global_step": 95940, "epoch": 571} {"train_loss": -9.411023139953613, "global_step": 95941, "epoch": 571} {"train_loss": -9.273916244506836, "global_step": 95942, "epoch": 571} {"train_loss": -9.568864822387695, "global_step": 95943, "epoch": 571} {"train_loss": -9.233221054077148, "global_step": 95944, "epoch": 571} {"train_loss": -9.410351753234863, "global_step": 95945, "epoch": 571} {"train_loss": -9.304344177246094, "global_step": 95946, "epoch": 571} {"train_loss": -9.211977005004883, "global_step": 95947, "epoch": 571} {"train_loss": -9.292142868041992, "global_step": 95948, "epoch": 571} {"train_loss": -9.256996154785156, "global_step": 95949, "epoch": 571} {"train_loss": -9.448568344116211, "global_step": 95950, "epoch": 571} {"train_loss": -9.599109649658203, "global_step": 95951, "epoch": 571} {"train_loss": -9.102682113647461, "global_step": 95952, "epoch": 571} {"train_loss": -9.345259666442871, "global_step": 95953, "epoch": 571} {"train_loss": -9.343978881835938, "global_step": 95954, "epoch": 571} {"train_loss": -9.338488578796387, "global_step": 95955, "epoch": 571} {"train_loss": -9.417501449584961, "global_step": 95956, "epoch": 571} {"train_loss": -9.690601348876953, "global_step": 95957, "epoch": 571} {"train_loss": -9.362117767333984, "global_step": 95958, "epoch": 571} {"train_loss": -9.750372886657715, "global_step": 95959, "epoch": 571} {"train_loss": -9.307733535766602, "global_step": 95960, "epoch": 571} {"train_loss": -9.31948471069336, "global_step": 95961, "epoch": 571} {"train_loss": -9.23328971862793, "global_step": 95962, "epoch": 571} {"train_loss": -9.81654167175293, "global_step": 95963, "epoch": 571} {"train_loss": -9.70004653930664, "global_step": 95964, "epoch": 571} {"train_loss": -9.567656517028809, "global_step": 95965, "epoch": 571} {"train_loss": -9.719511032104492, "global_step": 95966, "epoch": 571} {"train_loss": -9.534067153930664, "global_step": 95967, "epoch": 571} {"train_loss": -9.680683135986328, "global_step": 95968, "epoch": 571} {"train_loss": -9.452795028686523, "global_step": 95969, "epoch": 571} {"train_loss": -9.616387367248535, "global_step": 95970, "epoch": 571} {"train_loss": -9.715211868286133, "global_step": 95971, "epoch": 571} {"train_loss": -9.750425338745117, "global_step": 95972, "epoch": 571} {"train_loss": -9.363627433776855, "global_step": 95973, "epoch": 571} {"train_loss": -9.526357650756836, "global_step": 95974, "epoch": 571} {"train_loss": -9.557546615600586, "global_step": 95975, "epoch": 571} {"train_loss": -9.489892959594727, "global_step": 95976, "epoch": 571} {"train_loss": -9.769165992736816, "global_step": 95977, "epoch": 571} {"train_loss": -9.271724700927734, "global_step": 95978, "epoch": 571} {"train_loss": -9.913782119750977, "global_step": 95979, "epoch": 571} {"train_loss": -9.558883666992188, "global_step": 95980, "epoch": 571} {"train_loss": -9.551366806030273, "global_step": 95981, "epoch": 571} {"train_loss": -9.681377410888672, "global_step": 95982, "epoch": 571} {"train_loss": -9.635299682617188, "global_step": 95983, "epoch": 571} {"train_loss": -9.42269515991211, "global_step": 95984, "epoch": 571} {"train_loss": -9.545845031738281, "global_step": 95985, "epoch": 571} {"train_loss": -9.851405143737793, "global_step": 95986, "epoch": 571} {"train_loss": -9.591896057128906, "global_step": 95987, "epoch": 571} {"train_loss": -9.82178020477295, "global_step": 95988, "epoch": 571} {"train_loss": -9.652486801147461, "global_step": 95989, "epoch": 571} {"train_loss": -9.529646873474121, "global_step": 95990, "epoch": 571} {"train_loss": -9.894408226013184, "global_step": 95991, "epoch": 571} {"train_loss": -9.513155937194824, "global_step": 95992, "epoch": 571} {"train_loss": -9.372527122497559, "global_step": 95993, "epoch": 571} {"train_loss": -9.507007598876953, "global_step": 95994, "epoch": 571} {"train_loss": -9.389776229858398, "global_step": 95995, "epoch": 571} {"train_loss": -9.692928314208984, "global_step": 95996, "epoch": 571} {"train_loss": -9.702879905700684, "global_step": 95997, "epoch": 571} {"train_loss": -9.619927406311035, "global_step": 95998, "epoch": 571} {"train_loss": -9.66353988647461, "global_step": 95999, "epoch": 571} {"train_loss": -9.550436973571777, "global_step": 96000, "epoch": 571} {"train_loss": -9.657875061035156, "global_step": 96001, "epoch": 571} {"train_loss": -9.514474868774414, "global_step": 96002, "epoch": 571} {"train_loss": -9.706620216369629, "global_step": 96003, "epoch": 571} {"train_loss": -9.462942123413086, "global_step": 96004, "epoch": 571} {"train_loss": -9.603894233703613, "global_step": 96005, "epoch": 571} {"train_loss": -9.419652938842773, "global_step": 96006, "epoch": 571} {"train_loss": -9.717148780822754, "global_step": 96007, "epoch": 571} {"train_loss": -9.468657493591309, "global_step": 96008, "epoch": 571} {"train_loss": -9.329317092895508, "global_step": 96009, "epoch": 571} {"train_loss": -9.461729049682617, "global_step": 96010, "epoch": 571} {"train_loss": -9.446479797363281, "global_step": 96011, "epoch": 571} {"train_loss": -9.512383460998535, "global_step": 96012, "epoch": 571} {"train_loss": -8.820987701416016, "global_step": 96013, "epoch": 571} {"train_loss": -9.468406677246094, "global_step": 96014, "epoch": 571} {"train_loss": -9.06947135925293, "global_step": 96015, "epoch": 571} {"train_loss": -9.474712371826172, "global_step": 96016, "epoch": 571} {"train_loss": -9.392059326171875, "global_step": 96017, "epoch": 571} {"train_loss": -9.464290618896484, "global_step": 96018, "epoch": 571} {"train_loss": -9.560760498046875, "global_step": 96019, "epoch": 571} {"train_loss": -9.162062644958496, "global_step": 96020, "epoch": 571} {"train_loss": -9.562838554382324, "global_step": 96021, "epoch": 571} {"train_loss": -9.108975410461426, "global_step": 96022, "epoch": 571} {"train_loss": -9.423759460449219, "global_step": 96023, "epoch": 571} {"train_loss": -9.61966323852539, "global_step": 96024, "epoch": 571} {"train_loss": -9.154200553894043, "global_step": 96025, "epoch": 571} {"train_loss": -9.5148344039917, "global_step": 96026, "epoch": 571} {"train_loss": -9.317743301391602, "global_step": 96027, "epoch": 571} {"train_loss": -9.485200881958008, "global_step": 96028, "epoch": 571} {"train_loss": -9.35837173461914, "global_step": 96029, "epoch": 571} {"train_loss": -9.260958671569824, "global_step": 96030, "epoch": 571} {"train_loss": -9.401376724243164, "global_step": 96031, "epoch": 571} {"train_loss": -9.556873321533203, "global_step": 96032, "epoch": 571} {"train_loss": -9.548297882080078, "global_step": 96033, "epoch": 571} {"train_loss": -9.488143920898438, "global_step": 96034, "epoch": 571} {"train_loss": -9.53696060180664, "global_step": 96035, "epoch": 571} {"train_loss": -9.461383819580078, "global_step": 96036, "epoch": 571} {"train_loss": -9.650055885314941, "global_step": 96037, "epoch": 571} {"train_loss": -9.377607345581055, "global_step": 96038, "epoch": 571} {"train_loss": -9.625452041625977, "global_step": 96039, "epoch": 571} {"train_loss": -9.525762557983398, "global_step": 96040, "epoch": 571} {"train_loss": -9.34837532043457, "global_step": 96041, "epoch": 571} {"train_loss": -9.719301223754883, "global_step": 96042, "epoch": 571} {"train_loss": -9.484957695007324, "global_step": 96043, "epoch": 571} {"train_loss": -9.703351974487305, "global_step": 96044, "epoch": 571} {"train_loss": -9.724348068237305, "global_step": 96045, "epoch": 571} {"train_loss": -9.733553886413574, "global_step": 96046, "epoch": 571} {"train_loss": -9.740835189819336, "global_step": 96047, "epoch": 571} {"train_loss": -9.612141609191895, "global_step": 96048, "epoch": 571} {"train_loss": -9.765384674072266, "global_step": 96049, "epoch": 571} {"train_loss": -9.395466804504395, "global_step": 96050, "epoch": 571} {"train_loss": -9.786367416381836, "global_step": 96051, "epoch": 571} {"train_loss": -9.554485321044922, "global_step": 96052, "epoch": 571} {"train_loss": -9.76638126373291, "global_step": 96053, "epoch": 571} {"train_loss": -9.431851387023926, "global_step": 96054, "epoch": 571} {"train_loss": -9.929702758789062, "global_step": 96055, "epoch": 571} {"train_loss": -9.379355430603027, "global_step": 96056, "epoch": 571} {"train_loss": -9.867284774780273, "global_step": 96057, "epoch": 571} {"train_loss": -9.653024673461914, "global_step": 96058, "epoch": 571} {"train_loss": -9.869827270507812, "global_step": 96059, "epoch": 571} {"train_loss": -9.806550979614258, "global_step": 96060, "epoch": 571} {"train_loss": -9.415176391601562, "global_step": 96061, "epoch": 571} {"train_loss": -9.84548568725586, "global_step": 96062, "epoch": 571} {"train_loss": -9.548877716064453, "global_step": 96063, "epoch": 571} {"train_loss": -9.612366676330566, "global_step": 96064, "epoch": 571} {"train_loss": -9.45769214630127, "global_step": 96065, "epoch": 571} {"train_loss": -9.523435592651367, "global_step": 96066, "epoch": 571} {"train_loss": -9.582528114318848, "global_step": 96067, "epoch": 571} {"train_loss": -8.933578491210938, "global_step": 96068, "epoch": 571} {"train_loss": -9.327829360961914, "global_step": 96069, "epoch": 571} {"train_loss": -9.527755737304688, "global_step": 96070, "epoch": 571} {"train_loss": -9.005265235900879, "global_step": 96071, "epoch": 571} {"train_loss": -9.632280349731445, "global_step": 96072, "epoch": 571} {"train_loss": -9.364944458007812, "global_step": 96073, "epoch": 571} {"train_loss": -9.226110458374023, "global_step": 96074, "epoch": 571} {"train_loss": -8.901352882385254, "global_step": 96075, "epoch": 571} {"train_loss": -9.425739288330078, "global_step": 96076, "epoch": 571} {"train_loss": -9.514297485351562, "global_step": 96077, "epoch": 571} {"train_loss": -9.311761856079102, "global_step": 96078, "epoch": 571} {"train_loss": -9.342479705810547, "global_step": 96079, "epoch": 571} {"train_loss": -9.512633323669434, "global_step": 96080, "epoch": 571} {"train_loss": -9.2227783203125, "global_step": 96081, "epoch": 571} {"train_loss": -9.499213218688965, "global_step": 96082, "epoch": 571} {"train_loss": -9.312559127807617, "global_step": 96083, "epoch": 571} {"train_loss": -9.428670883178711, "global_step": 96084, "epoch": 571} {"train_loss": -9.61897087097168, "global_step": 96085, "epoch": 571} {"train_loss": -9.636733055114746, "global_step": 96086, "epoch": 571} {"train_loss": -9.421243667602539, "global_step": 96087, "epoch": 571} {"train_loss": -9.409734725952148, "global_step": 96088, "epoch": 571} {"train_loss": -9.602375030517578, "global_step": 96089, "epoch": 571} {"train_loss": -9.458251953125, "global_step": 96090, "epoch": 571} {"train_loss": -9.59067153930664, "global_step": 96091, "epoch": 571} {"train_loss": -9.614409446716309, "global_step": 96092, "epoch": 571} {"train_loss": -9.447633743286133, "global_step": 96093, "epoch": 571} {"train_loss": -9.618896484375, "global_step": 96094, "epoch": 571} {"train_loss": -9.50582035950252, "global_step": 96095, "epoch": 571, "val_loss": 205221.984375} {"train_loss": -9.727832794189453, "global_step": 96096, "epoch": 572} {"train_loss": -9.770148277282715, "global_step": 96097, "epoch": 572} {"train_loss": -9.514860153198242, "global_step": 96098, "epoch": 572} {"train_loss": -9.525758743286133, "global_step": 96099, "epoch": 572} {"train_loss": -9.478697776794434, "global_step": 96100, "epoch": 572} {"train_loss": -9.76656436920166, "global_step": 96101, "epoch": 572} {"train_loss": -9.389719009399414, "global_step": 96102, "epoch": 572} {"train_loss": -9.717693328857422, "global_step": 96103, "epoch": 572} {"train_loss": -9.45219612121582, "global_step": 96104, "epoch": 572} {"train_loss": -9.564221382141113, "global_step": 96105, "epoch": 572} {"train_loss": -9.653956413269043, "global_step": 96106, "epoch": 572} {"train_loss": -9.690984725952148, "global_step": 96107, "epoch": 572} {"train_loss": -9.560670852661133, "global_step": 96108, "epoch": 572} {"train_loss": -9.737300872802734, "global_step": 96109, "epoch": 572} {"train_loss": -9.741013526916504, "global_step": 96110, "epoch": 572} {"train_loss": -9.810126304626465, "global_step": 96111, "epoch": 572} {"train_loss": -9.653387069702148, "global_step": 96112, "epoch": 572} {"train_loss": -9.797502517700195, "global_step": 96113, "epoch": 572} {"train_loss": -9.781621932983398, "global_step": 96114, "epoch": 572} {"train_loss": -9.834312438964844, "global_step": 96115, "epoch": 572} {"train_loss": -9.74627685546875, "global_step": 96116, "epoch": 572} {"train_loss": -9.676087379455566, "global_step": 96117, "epoch": 572} {"train_loss": -9.534746170043945, "global_step": 96118, "epoch": 572} {"train_loss": -9.778020858764648, "global_step": 96119, "epoch": 572} {"train_loss": -9.667548179626465, "global_step": 96120, "epoch": 572} {"train_loss": -9.501863479614258, "global_step": 96121, "epoch": 572} {"train_loss": -9.373401641845703, "global_step": 96122, "epoch": 572} {"train_loss": -9.748172760009766, "global_step": 96123, "epoch": 572} {"train_loss": -9.571457862854004, "global_step": 96124, "epoch": 572} {"train_loss": -9.931113243103027, "global_step": 96125, "epoch": 572} {"train_loss": -9.714052200317383, "global_step": 96126, "epoch": 572} {"train_loss": -9.818658828735352, "global_step": 96127, "epoch": 572} {"train_loss": -9.728445053100586, "global_step": 96128, "epoch": 572} {"train_loss": -9.755563735961914, "global_step": 96129, "epoch": 572} {"train_loss": -9.582597732543945, "global_step": 96130, "epoch": 572} {"train_loss": -9.451870918273926, "global_step": 96131, "epoch": 572} {"train_loss": -9.565611839294434, "global_step": 96132, "epoch": 572} {"train_loss": -9.512313842773438, "global_step": 96133, "epoch": 572} {"train_loss": -9.635868072509766, "global_step": 96134, "epoch": 572} {"train_loss": -9.50516128540039, "global_step": 96135, "epoch": 572} {"train_loss": -9.713844299316406, "global_step": 96136, "epoch": 572} {"train_loss": -9.220259666442871, "global_step": 96137, "epoch": 572} {"train_loss": -9.414787292480469, "global_step": 96138, "epoch": 572} {"train_loss": -9.689972877502441, "global_step": 96139, "epoch": 572} {"train_loss": -9.219171524047852, "global_step": 96140, "epoch": 572} {"train_loss": -9.60699462890625, "global_step": 96141, "epoch": 572} {"train_loss": -9.657711029052734, "global_step": 96142, "epoch": 572} {"train_loss": -9.502274513244629, "global_step": 96143, "epoch": 572} {"train_loss": -9.493505477905273, "global_step": 96144, "epoch": 572} {"train_loss": -9.18803596496582, "global_step": 96145, "epoch": 572} {"train_loss": -9.563803672790527, "global_step": 96146, "epoch": 572} {"train_loss": -9.342655181884766, "global_step": 96147, "epoch": 572} {"train_loss": -9.024903297424316, "global_step": 96148, "epoch": 572} {"train_loss": -9.558727264404297, "global_step": 96149, "epoch": 572} {"train_loss": -9.369598388671875, "global_step": 96150, "epoch": 572} {"train_loss": -9.523171424865723, "global_step": 96151, "epoch": 572} {"train_loss": -9.40654182434082, "global_step": 96152, "epoch": 572} {"train_loss": -9.68539810180664, "global_step": 96153, "epoch": 572} {"train_loss": -9.598861694335938, "global_step": 96154, "epoch": 572} {"train_loss": -9.331193923950195, "global_step": 96155, "epoch": 572} {"train_loss": -9.554827690124512, "global_step": 96156, "epoch": 572} {"train_loss": -9.687074661254883, "global_step": 96157, "epoch": 572} {"train_loss": -9.55457592010498, "global_step": 96158, "epoch": 572} {"train_loss": -9.664520263671875, "global_step": 96159, "epoch": 572} {"train_loss": -9.551658630371094, "global_step": 96160, "epoch": 572} {"train_loss": -9.688108444213867, "global_step": 96161, "epoch": 572} {"train_loss": -9.69581413269043, "global_step": 96162, "epoch": 572} {"train_loss": -9.70559310913086, "global_step": 96163, "epoch": 572} {"train_loss": -9.649471282958984, "global_step": 96164, "epoch": 572} {"train_loss": -9.67862606048584, "global_step": 96165, "epoch": 572} {"train_loss": -9.607357025146484, "global_step": 96166, "epoch": 572} {"train_loss": -9.79161262512207, "global_step": 96167, "epoch": 572} {"train_loss": -9.600582122802734, "global_step": 96168, "epoch": 572} {"train_loss": -9.763500213623047, "global_step": 96169, "epoch": 572} {"train_loss": -9.976512908935547, "global_step": 96170, "epoch": 572} {"train_loss": -9.80234146118164, "global_step": 96171, "epoch": 572} {"train_loss": -9.555073738098145, "global_step": 96172, "epoch": 572} {"train_loss": -9.86812973022461, "global_step": 96173, "epoch": 572} {"train_loss": -9.789873123168945, "global_step": 96174, "epoch": 572} {"train_loss": -9.695940017700195, "global_step": 96175, "epoch": 572} {"train_loss": -9.611446380615234, "global_step": 96176, "epoch": 572} {"train_loss": -9.501367568969727, "global_step": 96177, "epoch": 572} {"train_loss": -9.891164779663086, "global_step": 96178, "epoch": 572} {"train_loss": -9.215911865234375, "global_step": 96179, "epoch": 572} {"train_loss": -9.29079818725586, "global_step": 96180, "epoch": 572} {"train_loss": -8.950607299804688, "global_step": 96181, "epoch": 572} {"train_loss": -9.125619888305664, "global_step": 96182, "epoch": 572} {"train_loss": -9.669604301452637, "global_step": 96183, "epoch": 572} {"train_loss": -8.95337200164795, "global_step": 96184, "epoch": 572} {"train_loss": -9.696735382080078, "global_step": 96185, "epoch": 572} {"train_loss": -9.191818237304688, "global_step": 96186, "epoch": 572} {"train_loss": -9.54510498046875, "global_step": 96187, "epoch": 572} {"train_loss": -9.016317367553711, "global_step": 96188, "epoch": 572} {"train_loss": -9.418663024902344, "global_step": 96189, "epoch": 572} {"train_loss": -9.011165618896484, "global_step": 96190, "epoch": 572} {"train_loss": -9.465160369873047, "global_step": 96191, "epoch": 572} {"train_loss": -9.364095687866211, "global_step": 96192, "epoch": 572} {"train_loss": -9.413724899291992, "global_step": 96193, "epoch": 572} {"train_loss": -9.645425796508789, "global_step": 96194, "epoch": 572} {"train_loss": -9.45602035522461, "global_step": 96195, "epoch": 572} {"train_loss": -9.600460052490234, "global_step": 96196, "epoch": 572} {"train_loss": -9.44878101348877, "global_step": 96197, "epoch": 572} {"train_loss": -9.697259902954102, "global_step": 96198, "epoch": 572} {"train_loss": -9.50429916381836, "global_step": 96199, "epoch": 572} {"train_loss": -9.64145278930664, "global_step": 96200, "epoch": 572} {"train_loss": -9.719427108764648, "global_step": 96201, "epoch": 572} {"train_loss": -9.553716659545898, "global_step": 96202, "epoch": 572} {"train_loss": -9.396010398864746, "global_step": 96203, "epoch": 572} {"train_loss": -9.523658752441406, "global_step": 96204, "epoch": 572} {"train_loss": -9.560050964355469, "global_step": 96205, "epoch": 572} {"train_loss": -9.908376693725586, "global_step": 96206, "epoch": 572} {"train_loss": -9.490143775939941, "global_step": 96207, "epoch": 572} {"train_loss": -9.466994285583496, "global_step": 96208, "epoch": 572} {"train_loss": -9.675004959106445, "global_step": 96209, "epoch": 572} {"train_loss": -9.52681827545166, "global_step": 96210, "epoch": 572} {"train_loss": -9.675146102905273, "global_step": 96211, "epoch": 572} {"train_loss": -9.688926696777344, "global_step": 96212, "epoch": 572} {"train_loss": -9.759076118469238, "global_step": 96213, "epoch": 572} {"train_loss": -9.803613662719727, "global_step": 96214, "epoch": 572} {"train_loss": -9.648956298828125, "global_step": 96215, "epoch": 572} {"train_loss": -9.438838005065918, "global_step": 96216, "epoch": 572} {"train_loss": -9.722970962524414, "global_step": 96217, "epoch": 572} {"train_loss": -9.45151424407959, "global_step": 96218, "epoch": 572} {"train_loss": -9.71894359588623, "global_step": 96219, "epoch": 572} {"train_loss": -9.852636337280273, "global_step": 96220, "epoch": 572} {"train_loss": -9.70121955871582, "global_step": 96221, "epoch": 572} {"train_loss": -9.561025619506836, "global_step": 96222, "epoch": 572} {"train_loss": -9.748702049255371, "global_step": 96223, "epoch": 572} {"train_loss": -9.767029762268066, "global_step": 96224, "epoch": 572} {"train_loss": -9.833919525146484, "global_step": 96225, "epoch": 572} {"train_loss": -9.631336212158203, "global_step": 96226, "epoch": 572} {"train_loss": -9.88369369506836, "global_step": 96227, "epoch": 572} {"train_loss": -9.677206993103027, "global_step": 96228, "epoch": 572} {"train_loss": -9.78663444519043, "global_step": 96229, "epoch": 572} {"train_loss": -9.436500549316406, "global_step": 96230, "epoch": 572} {"train_loss": -9.759270668029785, "global_step": 96231, "epoch": 572} {"train_loss": -9.725327491760254, "global_step": 96232, "epoch": 572} {"train_loss": -9.750152587890625, "global_step": 96233, "epoch": 572} {"train_loss": -9.856678009033203, "global_step": 96234, "epoch": 572} {"train_loss": -10.027921676635742, "global_step": 96235, "epoch": 572} {"train_loss": -9.660820007324219, "global_step": 96236, "epoch": 572} {"train_loss": -9.744665145874023, "global_step": 96237, "epoch": 572} {"train_loss": -9.394366264343262, "global_step": 96238, "epoch": 572} {"train_loss": -9.57111930847168, "global_step": 96239, "epoch": 572} {"train_loss": -9.433671951293945, "global_step": 96240, "epoch": 572} {"train_loss": -9.551352500915527, "global_step": 96241, "epoch": 572} {"train_loss": -9.476795196533203, "global_step": 96242, "epoch": 572} {"train_loss": -9.644659042358398, "global_step": 96243, "epoch": 572} {"train_loss": -9.418519973754883, "global_step": 96244, "epoch": 572} {"train_loss": -9.744674682617188, "global_step": 96245, "epoch": 572} {"train_loss": -9.636556625366211, "global_step": 96246, "epoch": 572} {"train_loss": -9.762138366699219, "global_step": 96247, "epoch": 572} {"train_loss": -9.545251846313477, "global_step": 96248, "epoch": 572} {"train_loss": -9.462312698364258, "global_step": 96249, "epoch": 572} {"train_loss": -9.668815612792969, "global_step": 96250, "epoch": 572} {"train_loss": -9.292016983032227, "global_step": 96251, "epoch": 572} {"train_loss": -9.736214637756348, "global_step": 96252, "epoch": 572} {"train_loss": -9.496053695678711, "global_step": 96253, "epoch": 572} {"train_loss": -9.290461540222168, "global_step": 96254, "epoch": 572} {"train_loss": -9.355850219726562, "global_step": 96255, "epoch": 572} {"train_loss": -9.415447235107422, "global_step": 96256, "epoch": 572} {"train_loss": -9.382352828979492, "global_step": 96257, "epoch": 572} {"train_loss": -9.654668807983398, "global_step": 96258, "epoch": 572} {"train_loss": -9.57807445526123, "global_step": 96259, "epoch": 572} {"train_loss": -9.563385009765625, "global_step": 96260, "epoch": 572} {"train_loss": -9.709789276123047, "global_step": 96261, "epoch": 572} {"train_loss": -9.791948318481445, "global_step": 96262, "epoch": 572} {"train_loss": -9.586794648851667, "global_step": 96263, "epoch": 572, "val_loss": 204205.6875} {"train_loss": -9.684117317199707, "global_step": 96264, "epoch": 573} {"train_loss": -9.655513763427734, "global_step": 96265, "epoch": 573} {"train_loss": -9.90354061126709, "global_step": 96266, "epoch": 573} {"train_loss": -9.545774459838867, "global_step": 96267, "epoch": 573} {"train_loss": -9.879512786865234, "global_step": 96268, "epoch": 573} {"train_loss": -9.759481430053711, "global_step": 96269, "epoch": 573} {"train_loss": -9.65915298461914, "global_step": 96270, "epoch": 573} {"train_loss": -9.688323974609375, "global_step": 96271, "epoch": 573} {"train_loss": -9.5750732421875, "global_step": 96272, "epoch": 573} {"train_loss": -9.846479415893555, "global_step": 96273, "epoch": 573} {"train_loss": -9.768665313720703, "global_step": 96274, "epoch": 573} {"train_loss": -9.803886413574219, "global_step": 96275, "epoch": 573} {"train_loss": -9.686285018920898, "global_step": 96276, "epoch": 573} {"train_loss": -9.747945785522461, "global_step": 96277, "epoch": 573} {"train_loss": -9.734319686889648, "global_step": 96278, "epoch": 573} {"train_loss": -9.62928581237793, "global_step": 96279, "epoch": 573} {"train_loss": -9.903341293334961, "global_step": 96280, "epoch": 573} {"train_loss": -9.60617446899414, "global_step": 96281, "epoch": 573} {"train_loss": -9.49598503112793, "global_step": 96282, "epoch": 573} {"train_loss": -9.7501859664917, "global_step": 96283, "epoch": 573} {"train_loss": -9.822854995727539, "global_step": 96284, "epoch": 573} {"train_loss": -9.428873062133789, "global_step": 96285, "epoch": 573} {"train_loss": -9.886835098266602, "global_step": 96286, "epoch": 573} {"train_loss": -9.502707481384277, "global_step": 96287, "epoch": 573} {"train_loss": -9.63825798034668, "global_step": 96288, "epoch": 573} {"train_loss": -9.52147102355957, "global_step": 96289, "epoch": 573} {"train_loss": -9.380350112915039, "global_step": 96290, "epoch": 573} {"train_loss": -9.662761688232422, "global_step": 96291, "epoch": 573} {"train_loss": -9.678650856018066, "global_step": 96292, "epoch": 573} {"train_loss": -9.519951820373535, "global_step": 96293, "epoch": 573} {"train_loss": -9.252374649047852, "global_step": 96294, "epoch": 573} {"train_loss": -9.74155044555664, "global_step": 96295, "epoch": 573} {"train_loss": -9.549091339111328, "global_step": 96296, "epoch": 573} {"train_loss": -9.390809059143066, "global_step": 96297, "epoch": 573} {"train_loss": -9.486513137817383, "global_step": 96298, "epoch": 573} {"train_loss": -9.378963470458984, "global_step": 96299, "epoch": 573} {"train_loss": -9.737817764282227, "global_step": 96300, "epoch": 573} {"train_loss": -9.179117202758789, "global_step": 96301, "epoch": 573} {"train_loss": -9.506129264831543, "global_step": 96302, "epoch": 573} {"train_loss": -9.48611068725586, "global_step": 96303, "epoch": 573} {"train_loss": -9.473400115966797, "global_step": 96304, "epoch": 573} {"train_loss": -9.573647499084473, "global_step": 96305, "epoch": 573} {"train_loss": -9.639459609985352, "global_step": 96306, "epoch": 573} {"train_loss": -9.745927810668945, "global_step": 96307, "epoch": 573} {"train_loss": -9.866734504699707, "global_step": 96308, "epoch": 573} {"train_loss": -9.471038818359375, "global_step": 96309, "epoch": 573} {"train_loss": -9.52734661102295, "global_step": 96310, "epoch": 573} {"train_loss": -9.660347938537598, "global_step": 96311, "epoch": 573} {"train_loss": -9.629026412963867, "global_step": 96312, "epoch": 573} {"train_loss": -9.51307487487793, "global_step": 96313, "epoch": 573} {"train_loss": -9.860193252563477, "global_step": 96314, "epoch": 573} {"train_loss": -9.487354278564453, "global_step": 96315, "epoch": 573} {"train_loss": -9.750968933105469, "global_step": 96316, "epoch": 573} {"train_loss": -9.686508178710938, "global_step": 96317, "epoch": 573} {"train_loss": -9.753202438354492, "global_step": 96318, "epoch": 573} {"train_loss": -9.472028732299805, "global_step": 96319, "epoch": 573} {"train_loss": -9.274871826171875, "global_step": 96320, "epoch": 573} {"train_loss": -9.176485061645508, "global_step": 96321, "epoch": 573} {"train_loss": -9.620482444763184, "global_step": 96322, "epoch": 573} {"train_loss": -9.595710754394531, "global_step": 96323, "epoch": 573} {"train_loss": -9.602887153625488, "global_step": 96324, "epoch": 573} {"train_loss": -9.349319458007812, "global_step": 96325, "epoch": 573} {"train_loss": -9.564105033874512, "global_step": 96326, "epoch": 573} {"train_loss": -9.42133903503418, "global_step": 96327, "epoch": 573} {"train_loss": -9.680445671081543, "global_step": 96328, "epoch": 573} {"train_loss": -9.287069320678711, "global_step": 96329, "epoch": 573} {"train_loss": -9.591503143310547, "global_step": 96330, "epoch": 573} {"train_loss": -9.622961044311523, "global_step": 96331, "epoch": 573} {"train_loss": -9.393843650817871, "global_step": 96332, "epoch": 573} {"train_loss": -9.644161224365234, "global_step": 96333, "epoch": 573} {"train_loss": -9.358757019042969, "global_step": 96334, "epoch": 573} {"train_loss": -9.600465774536133, "global_step": 96335, "epoch": 573} {"train_loss": -9.30289077758789, "global_step": 96336, "epoch": 573} {"train_loss": -9.699594497680664, "global_step": 96337, "epoch": 573} {"train_loss": -9.404206275939941, "global_step": 96338, "epoch": 573} {"train_loss": -9.436448097229004, "global_step": 96339, "epoch": 573} {"train_loss": -9.394293785095215, "global_step": 96340, "epoch": 573} {"train_loss": -9.496682167053223, "global_step": 96341, "epoch": 573} {"train_loss": -9.563459396362305, "global_step": 96342, "epoch": 573} {"train_loss": -9.300516128540039, "global_step": 96343, "epoch": 573} {"train_loss": -9.46622371673584, "global_step": 96344, "epoch": 573} {"train_loss": -9.554634094238281, "global_step": 96345, "epoch": 573} {"train_loss": -9.61314582824707, "global_step": 96346, "epoch": 573} {"train_loss": -9.455009460449219, "global_step": 96347, "epoch": 573} {"train_loss": -9.666452407836914, "global_step": 96348, "epoch": 573} {"train_loss": -9.175344467163086, "global_step": 96349, "epoch": 573} {"train_loss": -9.700063705444336, "global_step": 96350, "epoch": 573} {"train_loss": -9.554475784301758, "global_step": 96351, "epoch": 573} {"train_loss": -9.440671920776367, "global_step": 96352, "epoch": 573} {"train_loss": -9.506311416625977, "global_step": 96353, "epoch": 573} {"train_loss": -9.489105224609375, "global_step": 96354, "epoch": 573} {"train_loss": -9.418407440185547, "global_step": 96355, "epoch": 573} {"train_loss": -9.546488761901855, "global_step": 96356, "epoch": 573} {"train_loss": -9.538263320922852, "global_step": 96357, "epoch": 573} {"train_loss": -9.286577224731445, "global_step": 96358, "epoch": 573} {"train_loss": -9.656713485717773, "global_step": 96359, "epoch": 573} {"train_loss": -9.282254219055176, "global_step": 96360, "epoch": 573} {"train_loss": -9.54654312133789, "global_step": 96361, "epoch": 573} {"train_loss": -9.641845703125, "global_step": 96362, "epoch": 573} {"train_loss": -9.288676261901855, "global_step": 96363, "epoch": 573} {"train_loss": -9.516944885253906, "global_step": 96364, "epoch": 573} {"train_loss": -9.623828887939453, "global_step": 96365, "epoch": 573} {"train_loss": -9.407289505004883, "global_step": 96366, "epoch": 573} {"train_loss": -9.770120620727539, "global_step": 96367, "epoch": 573} {"train_loss": -9.625715255737305, "global_step": 96368, "epoch": 573} {"train_loss": -9.552892684936523, "global_step": 96369, "epoch": 573} {"train_loss": -9.812000274658203, "global_step": 96370, "epoch": 573} {"train_loss": -9.495359420776367, "global_step": 96371, "epoch": 573} {"train_loss": -9.321882247924805, "global_step": 96372, "epoch": 573} {"train_loss": -9.815312385559082, "global_step": 96373, "epoch": 573} {"train_loss": -9.49050235748291, "global_step": 96374, "epoch": 573} {"train_loss": -9.635503768920898, "global_step": 96375, "epoch": 573} {"train_loss": -9.661968231201172, "global_step": 96376, "epoch": 573} {"train_loss": -9.586702346801758, "global_step": 96377, "epoch": 573} {"train_loss": -9.58590030670166, "global_step": 96378, "epoch": 573} {"train_loss": -9.951629638671875, "global_step": 96379, "epoch": 573} {"train_loss": -9.942485809326172, "global_step": 96380, "epoch": 573} {"train_loss": -9.669368743896484, "global_step": 96381, "epoch": 573} {"train_loss": -9.781278610229492, "global_step": 96382, "epoch": 573} {"train_loss": -9.513838768005371, "global_step": 96383, "epoch": 573} {"train_loss": -9.56045150756836, "global_step": 96384, "epoch": 573} {"train_loss": -9.520444869995117, "global_step": 96385, "epoch": 573} {"train_loss": -9.598207473754883, "global_step": 96386, "epoch": 573} {"train_loss": -9.342620849609375, "global_step": 96387, "epoch": 573} {"train_loss": -9.782144546508789, "global_step": 96388, "epoch": 573} {"train_loss": -9.80363941192627, "global_step": 96389, "epoch": 573} {"train_loss": -9.509740829467773, "global_step": 96390, "epoch": 573} {"train_loss": -9.767443656921387, "global_step": 96391, "epoch": 573} {"train_loss": -9.76905345916748, "global_step": 96392, "epoch": 573} {"train_loss": -9.743244171142578, "global_step": 96393, "epoch": 573} {"train_loss": -9.679864883422852, "global_step": 96394, "epoch": 573} {"train_loss": -9.654537200927734, "global_step": 96395, "epoch": 573} {"train_loss": -9.807266235351562, "global_step": 96396, "epoch": 573} {"train_loss": -9.868112564086914, "global_step": 96397, "epoch": 573} {"train_loss": -9.583639144897461, "global_step": 96398, "epoch": 573} {"train_loss": -9.973974227905273, "global_step": 96399, "epoch": 573} {"train_loss": -9.653724670410156, "global_step": 96400, "epoch": 573} {"train_loss": -9.835517883300781, "global_step": 96401, "epoch": 573} {"train_loss": -9.79809856414795, "global_step": 96402, "epoch": 573} {"train_loss": -9.7841157913208, "global_step": 96403, "epoch": 573} {"train_loss": -9.947763442993164, "global_step": 96404, "epoch": 573} {"train_loss": -9.825870513916016, "global_step": 96405, "epoch": 573} {"train_loss": -9.644818305969238, "global_step": 96406, "epoch": 573} {"train_loss": -9.643645286560059, "global_step": 96407, "epoch": 573} {"train_loss": -9.685674667358398, "global_step": 96408, "epoch": 573} {"train_loss": -9.843179702758789, "global_step": 96409, "epoch": 573} {"train_loss": -9.60989761352539, "global_step": 96410, "epoch": 573} {"train_loss": -9.625380516052246, "global_step": 96411, "epoch": 573} {"train_loss": -9.446285247802734, "global_step": 96412, "epoch": 573} {"train_loss": -9.83827018737793, "global_step": 96413, "epoch": 573} {"train_loss": -9.611724853515625, "global_step": 96414, "epoch": 573} {"train_loss": -9.540315628051758, "global_step": 96415, "epoch": 573} {"train_loss": -9.556022644042969, "global_step": 96416, "epoch": 573} {"train_loss": -9.757394790649414, "global_step": 96417, "epoch": 573} {"train_loss": -9.754058837890625, "global_step": 96418, "epoch": 573} {"train_loss": -9.214670181274414, "global_step": 96419, "epoch": 573} {"train_loss": -9.762028694152832, "global_step": 96420, "epoch": 573} {"train_loss": -9.326981544494629, "global_step": 96421, "epoch": 573} {"train_loss": -9.525833129882812, "global_step": 96422, "epoch": 573} {"train_loss": -9.338458061218262, "global_step": 96423, "epoch": 573} {"train_loss": -9.141042709350586, "global_step": 96424, "epoch": 573} {"train_loss": -9.6444091796875, "global_step": 96425, "epoch": 573} {"train_loss": -9.461012840270996, "global_step": 96426, "epoch": 573} {"train_loss": -9.518814086914062, "global_step": 96427, "epoch": 573} {"train_loss": -9.430570602416992, "global_step": 96428, "epoch": 573} {"train_loss": -9.213207244873047, "global_step": 96429, "epoch": 573} {"train_loss": -9.115263938903809, "global_step": 96430, "epoch": 573} {"train_loss": -9.585219587598528, "global_step": 96431, "epoch": 573, "val_loss": 204893.390625} {"train_loss": -9.377681732177734, "global_step": 96432, "epoch": 574} {"train_loss": -9.395241737365723, "global_step": 96433, "epoch": 574} {"train_loss": -9.456473350524902, "global_step": 96434, "epoch": 574} {"train_loss": -9.445623397827148, "global_step": 96435, "epoch": 574} {"train_loss": -9.215710639953613, "global_step": 96436, "epoch": 574} {"train_loss": -9.37002182006836, "global_step": 96437, "epoch": 574} {"train_loss": -9.195182800292969, "global_step": 96438, "epoch": 574} {"train_loss": -9.372549057006836, "global_step": 96439, "epoch": 574} {"train_loss": -9.220968246459961, "global_step": 96440, "epoch": 574} {"train_loss": -9.283140182495117, "global_step": 96441, "epoch": 574} {"train_loss": -9.27413272857666, "global_step": 96442, "epoch": 574} {"train_loss": -9.341915130615234, "global_step": 96443, "epoch": 574} {"train_loss": -9.378629684448242, "global_step": 96444, "epoch": 574} {"train_loss": -9.505051612854004, "global_step": 96445, "epoch": 574} {"train_loss": -9.6263427734375, "global_step": 96446, "epoch": 574} {"train_loss": -9.38248062133789, "global_step": 96447, "epoch": 574} {"train_loss": -9.519804000854492, "global_step": 96448, "epoch": 574} {"train_loss": -9.415519714355469, "global_step": 96449, "epoch": 574} {"train_loss": -9.410539627075195, "global_step": 96450, "epoch": 574} {"train_loss": -9.608478546142578, "global_step": 96451, "epoch": 574} {"train_loss": -9.569113731384277, "global_step": 96452, "epoch": 574} {"train_loss": -9.643360137939453, "global_step": 96453, "epoch": 574} {"train_loss": -9.527444839477539, "global_step": 96454, "epoch": 574} {"train_loss": -9.565359115600586, "global_step": 96455, "epoch": 574} {"train_loss": -9.765730857849121, "global_step": 96456, "epoch": 574} {"train_loss": -9.674190521240234, "global_step": 96457, "epoch": 574} {"train_loss": -9.694862365722656, "global_step": 96458, "epoch": 574} {"train_loss": -9.324256896972656, "global_step": 96459, "epoch": 574} {"train_loss": -9.788339614868164, "global_step": 96460, "epoch": 574} {"train_loss": -9.817300796508789, "global_step": 96461, "epoch": 574} {"train_loss": -9.708911895751953, "global_step": 96462, "epoch": 574} {"train_loss": -9.652966499328613, "global_step": 96463, "epoch": 574} {"train_loss": -9.70619010925293, "global_step": 96464, "epoch": 574} {"train_loss": -9.890501976013184, "global_step": 96465, "epoch": 574} {"train_loss": -9.518322944641113, "global_step": 96466, "epoch": 574} {"train_loss": -9.565239906311035, "global_step": 96467, "epoch": 574} {"train_loss": -9.62172794342041, "global_step": 96468, "epoch": 574} {"train_loss": -9.406543731689453, "global_step": 96469, "epoch": 574} {"train_loss": -9.679020881652832, "global_step": 96470, "epoch": 574} {"train_loss": -9.51345443725586, "global_step": 96471, "epoch": 574} {"train_loss": -9.562429428100586, "global_step": 96472, "epoch": 574} {"train_loss": -9.45973014831543, "global_step": 96473, "epoch": 574} {"train_loss": -9.777639389038086, "global_step": 96474, "epoch": 574} {"train_loss": -9.549736022949219, "global_step": 96475, "epoch": 574} {"train_loss": -9.476238250732422, "global_step": 96476, "epoch": 574} {"train_loss": -9.670820236206055, "global_step": 96477, "epoch": 574} {"train_loss": -9.759246826171875, "global_step": 96478, "epoch": 574} {"train_loss": -9.252381324768066, "global_step": 96479, "epoch": 574} {"train_loss": -8.762840270996094, "global_step": 96480, "epoch": 574} {"train_loss": -9.671987533569336, "global_step": 96481, "epoch": 574} {"train_loss": -9.33679485321045, "global_step": 96482, "epoch": 574} {"train_loss": -9.501388549804688, "global_step": 96483, "epoch": 574} {"train_loss": -9.498835563659668, "global_step": 96484, "epoch": 574} {"train_loss": -9.405439376831055, "global_step": 96485, "epoch": 574} {"train_loss": -9.511041641235352, "global_step": 96486, "epoch": 574} {"train_loss": -9.378349304199219, "global_step": 96487, "epoch": 574} {"train_loss": -9.550361633300781, "global_step": 96488, "epoch": 574} {"train_loss": -9.77619743347168, "global_step": 96489, "epoch": 574} {"train_loss": -9.745597839355469, "global_step": 96490, "epoch": 574} {"train_loss": -9.698948860168457, "global_step": 96491, "epoch": 574} {"train_loss": -9.659406661987305, "global_step": 96492, "epoch": 574} {"train_loss": -9.642452239990234, "global_step": 96493, "epoch": 574} {"train_loss": -9.651476860046387, "global_step": 96494, "epoch": 574} {"train_loss": -9.753292083740234, "global_step": 96495, "epoch": 574} {"train_loss": -9.535120964050293, "global_step": 96496, "epoch": 574} {"train_loss": -9.670553207397461, "global_step": 96497, "epoch": 574} {"train_loss": -9.632817268371582, "global_step": 96498, "epoch": 574} {"train_loss": -9.280725479125977, "global_step": 96499, "epoch": 574} {"train_loss": -9.668399810791016, "global_step": 96500, "epoch": 574} {"train_loss": -9.720020294189453, "global_step": 96501, "epoch": 574} {"train_loss": -9.727090835571289, "global_step": 96502, "epoch": 574} {"train_loss": -9.737672805786133, "global_step": 96503, "epoch": 574} {"train_loss": -9.748119354248047, "global_step": 96504, "epoch": 574} {"train_loss": -9.467333793640137, "global_step": 96505, "epoch": 574} {"train_loss": -9.85958480834961, "global_step": 96506, "epoch": 574} {"train_loss": -9.661699295043945, "global_step": 96507, "epoch": 574} {"train_loss": -9.983879089355469, "global_step": 96508, "epoch": 574} {"train_loss": -9.69973373413086, "global_step": 96509, "epoch": 574} {"train_loss": -9.798542022705078, "global_step": 96510, "epoch": 574} {"train_loss": -9.6845703125, "global_step": 96511, "epoch": 574} {"train_loss": -9.24073600769043, "global_step": 96512, "epoch": 574} {"train_loss": -9.332357406616211, "global_step": 96513, "epoch": 574} {"train_loss": -9.280538558959961, "global_step": 96514, "epoch": 574} {"train_loss": -9.519021987915039, "global_step": 96515, "epoch": 574} {"train_loss": -9.51766300201416, "global_step": 96516, "epoch": 574} {"train_loss": -9.453590393066406, "global_step": 96517, "epoch": 574} {"train_loss": -9.669617652893066, "global_step": 96518, "epoch": 574} {"train_loss": -9.521112442016602, "global_step": 96519, "epoch": 574} {"train_loss": -9.353791236877441, "global_step": 96520, "epoch": 574} {"train_loss": -9.687347412109375, "global_step": 96521, "epoch": 574} {"train_loss": -9.285554885864258, "global_step": 96522, "epoch": 574} {"train_loss": -9.65762996673584, "global_step": 96523, "epoch": 574} {"train_loss": -9.702751159667969, "global_step": 96524, "epoch": 574} {"train_loss": -9.447299003601074, "global_step": 96525, "epoch": 574} {"train_loss": -9.540980339050293, "global_step": 96526, "epoch": 574} {"train_loss": -9.658798217773438, "global_step": 96527, "epoch": 574} {"train_loss": -9.368524551391602, "global_step": 96528, "epoch": 574} {"train_loss": -9.792867660522461, "global_step": 96529, "epoch": 574} {"train_loss": -9.740394592285156, "global_step": 96530, "epoch": 574} {"train_loss": -9.474006652832031, "global_step": 96531, "epoch": 574} {"train_loss": -9.998451232910156, "global_step": 96532, "epoch": 574} {"train_loss": -9.664471626281738, "global_step": 96533, "epoch": 574} {"train_loss": -9.706650733947754, "global_step": 96534, "epoch": 574} {"train_loss": -9.540790557861328, "global_step": 96535, "epoch": 574} {"train_loss": -9.680169105529785, "global_step": 96536, "epoch": 574} {"train_loss": -9.564214706420898, "global_step": 96537, "epoch": 574} {"train_loss": -9.546035766601562, "global_step": 96538, "epoch": 574} {"train_loss": -9.548072814941406, "global_step": 96539, "epoch": 574} {"train_loss": -9.543561935424805, "global_step": 96540, "epoch": 574} {"train_loss": -9.63565444946289, "global_step": 96541, "epoch": 574} {"train_loss": -9.35096549987793, "global_step": 96542, "epoch": 574} {"train_loss": -9.48000431060791, "global_step": 96543, "epoch": 574} {"train_loss": -9.223334312438965, "global_step": 96544, "epoch": 574} {"train_loss": -9.160367012023926, "global_step": 96545, "epoch": 574} {"train_loss": -9.359837532043457, "global_step": 96546, "epoch": 574} {"train_loss": -9.260417938232422, "global_step": 96547, "epoch": 574} {"train_loss": -9.596736907958984, "global_step": 96548, "epoch": 574} {"train_loss": -9.439558029174805, "global_step": 96549, "epoch": 574} {"train_loss": -9.111627578735352, "global_step": 96550, "epoch": 574} {"train_loss": -9.431924819946289, "global_step": 96551, "epoch": 574} {"train_loss": -9.294573783874512, "global_step": 96552, "epoch": 574} {"train_loss": -9.469551086425781, "global_step": 96553, "epoch": 574} {"train_loss": -9.081459999084473, "global_step": 96554, "epoch": 574} {"train_loss": -9.697193145751953, "global_step": 96555, "epoch": 574} {"train_loss": -9.425883293151855, "global_step": 96556, "epoch": 574} {"train_loss": -9.505716323852539, "global_step": 96557, "epoch": 574} {"train_loss": -9.411624908447266, "global_step": 96558, "epoch": 574} {"train_loss": -9.545889854431152, "global_step": 96559, "epoch": 574} {"train_loss": -9.582366943359375, "global_step": 96560, "epoch": 574} {"train_loss": -9.838838577270508, "global_step": 96561, "epoch": 574} {"train_loss": -9.618144989013672, "global_step": 96562, "epoch": 574} {"train_loss": -9.522733688354492, "global_step": 96563, "epoch": 574} {"train_loss": -9.674555778503418, "global_step": 96564, "epoch": 574} {"train_loss": -9.601419448852539, "global_step": 96565, "epoch": 574} {"train_loss": -9.552460670471191, "global_step": 96566, "epoch": 574} {"train_loss": -9.678304672241211, "global_step": 96567, "epoch": 574} {"train_loss": -9.958334922790527, "global_step": 96568, "epoch": 574} {"train_loss": -9.55199909210205, "global_step": 96569, "epoch": 574} {"train_loss": -9.822582244873047, "global_step": 96570, "epoch": 574} {"train_loss": -9.835155487060547, "global_step": 96571, "epoch": 574} {"train_loss": -9.934147834777832, "global_step": 96572, "epoch": 574} {"train_loss": -9.518582344055176, "global_step": 96573, "epoch": 574} {"train_loss": -9.682306289672852, "global_step": 96574, "epoch": 574} {"train_loss": -9.476248741149902, "global_step": 96575, "epoch": 574} {"train_loss": -9.821046829223633, "global_step": 96576, "epoch": 574} {"train_loss": -9.8209810256958, "global_step": 96577, "epoch": 574} {"train_loss": -9.906183242797852, "global_step": 96578, "epoch": 574} {"train_loss": -9.607707023620605, "global_step": 96579, "epoch": 574} {"train_loss": -9.881505966186523, "global_step": 96580, "epoch": 574} {"train_loss": -9.4725341796875, "global_step": 96581, "epoch": 574} {"train_loss": -9.714356422424316, "global_step": 96582, "epoch": 574} {"train_loss": -9.502899169921875, "global_step": 96583, "epoch": 574} {"train_loss": -9.501256942749023, "global_step": 96584, "epoch": 574} {"train_loss": -9.740561485290527, "global_step": 96585, "epoch": 574} {"train_loss": -9.324111938476562, "global_step": 96586, "epoch": 574} {"train_loss": -9.390756607055664, "global_step": 96587, "epoch": 574} {"train_loss": -9.48582649230957, "global_step": 96588, "epoch": 574} {"train_loss": -9.551372528076172, "global_step": 96589, "epoch": 574} {"train_loss": -9.86954116821289, "global_step": 96590, "epoch": 574} {"train_loss": -9.424955368041992, "global_step": 96591, "epoch": 574} {"train_loss": -9.559930801391602, "global_step": 96592, "epoch": 574} {"train_loss": -9.769950866699219, "global_step": 96593, "epoch": 574} {"train_loss": -9.325090408325195, "global_step": 96594, "epoch": 574} {"train_loss": -9.622579574584961, "global_step": 96595, "epoch": 574} {"train_loss": -9.631592750549316, "global_step": 96596, "epoch": 574} {"train_loss": -9.739306449890137, "global_step": 96597, "epoch": 574} {"train_loss": -9.488533020019531, "global_step": 96598, "epoch": 574} {"train_loss": -9.557515167054676, "global_step": 96599, "epoch": 574, "val_loss": 205322.6875} {"train_loss": -9.311418533325195, "global_step": 96600, "epoch": 575} {"train_loss": -9.144335746765137, "global_step": 96601, "epoch": 575} {"train_loss": -9.16291332244873, "global_step": 96602, "epoch": 575} {"train_loss": -9.408895492553711, "global_step": 96603, "epoch": 575} {"train_loss": -9.265061378479004, "global_step": 96604, "epoch": 575} {"train_loss": -9.474803924560547, "global_step": 96605, "epoch": 575} {"train_loss": -8.9634370803833, "global_step": 96606, "epoch": 575} {"train_loss": -9.081060409545898, "global_step": 96607, "epoch": 575} {"train_loss": -8.735858917236328, "global_step": 96608, "epoch": 575} {"train_loss": -9.221978187561035, "global_step": 96609, "epoch": 575} {"train_loss": -9.396352767944336, "global_step": 96610, "epoch": 575} {"train_loss": -9.022043228149414, "global_step": 96611, "epoch": 575} {"train_loss": -9.309890747070312, "global_step": 96612, "epoch": 575} {"train_loss": -8.927602767944336, "global_step": 96613, "epoch": 575} {"train_loss": -9.381775856018066, "global_step": 96614, "epoch": 575} {"train_loss": -9.138898849487305, "global_step": 96615, "epoch": 575} {"train_loss": -9.099443435668945, "global_step": 96616, "epoch": 575} {"train_loss": -9.208890914916992, "global_step": 96617, "epoch": 575} {"train_loss": -9.01246452331543, "global_step": 96618, "epoch": 575} {"train_loss": -9.390769958496094, "global_step": 96619, "epoch": 575} {"train_loss": -9.516738891601562, "global_step": 96620, "epoch": 575} {"train_loss": -9.15589714050293, "global_step": 96621, "epoch": 575} {"train_loss": -9.707342147827148, "global_step": 96622, "epoch": 575} {"train_loss": -9.482942581176758, "global_step": 96623, "epoch": 575} {"train_loss": -9.503805160522461, "global_step": 96624, "epoch": 575} {"train_loss": -9.367507934570312, "global_step": 96625, "epoch": 575} {"train_loss": -9.400045394897461, "global_step": 96626, "epoch": 575} {"train_loss": -9.260251998901367, "global_step": 96627, "epoch": 575} {"train_loss": -9.467714309692383, "global_step": 96628, "epoch": 575} {"train_loss": -9.43940544128418, "global_step": 96629, "epoch": 575} {"train_loss": -9.33006477355957, "global_step": 96630, "epoch": 575} {"train_loss": -9.606905937194824, "global_step": 96631, "epoch": 575} {"train_loss": -9.763700485229492, "global_step": 96632, "epoch": 575} {"train_loss": -9.465190887451172, "global_step": 96633, "epoch": 575} {"train_loss": -9.484723091125488, "global_step": 96634, "epoch": 575} {"train_loss": -9.612194061279297, "global_step": 96635, "epoch": 575} {"train_loss": -9.535325050354004, "global_step": 96636, "epoch": 575} {"train_loss": -9.703693389892578, "global_step": 96637, "epoch": 575} {"train_loss": -9.899702072143555, "global_step": 96638, "epoch": 575} {"train_loss": -9.666179656982422, "global_step": 96639, "epoch": 575} {"train_loss": -9.77208423614502, "global_step": 96640, "epoch": 575} {"train_loss": -9.804605484008789, "global_step": 96641, "epoch": 575} {"train_loss": -9.710664749145508, "global_step": 96642, "epoch": 575} {"train_loss": -9.641005516052246, "global_step": 96643, "epoch": 575} {"train_loss": -9.82934856414795, "global_step": 96644, "epoch": 575} {"train_loss": -9.824960708618164, "global_step": 96645, "epoch": 575} {"train_loss": -9.894808769226074, "global_step": 96646, "epoch": 575} {"train_loss": -9.775120735168457, "global_step": 96647, "epoch": 575} {"train_loss": -9.727901458740234, "global_step": 96648, "epoch": 575} {"train_loss": -9.700249671936035, "global_step": 96649, "epoch": 575} {"train_loss": -9.860005378723145, "global_step": 96650, "epoch": 575} {"train_loss": -9.922529220581055, "global_step": 96651, "epoch": 575} {"train_loss": -9.664413452148438, "global_step": 96652, "epoch": 575} {"train_loss": -9.853910446166992, "global_step": 96653, "epoch": 575} {"train_loss": -9.645145416259766, "global_step": 96654, "epoch": 575} {"train_loss": -9.616949081420898, "global_step": 96655, "epoch": 575} {"train_loss": -9.282318115234375, "global_step": 96656, "epoch": 575} {"train_loss": -9.503087043762207, "global_step": 96657, "epoch": 575} {"train_loss": -9.490869522094727, "global_step": 96658, "epoch": 575} {"train_loss": -8.949445724487305, "global_step": 96659, "epoch": 575} {"train_loss": -9.414728164672852, "global_step": 96660, "epoch": 575} {"train_loss": -9.728719711303711, "global_step": 96661, "epoch": 575} {"train_loss": -9.192230224609375, "global_step": 96662, "epoch": 575} {"train_loss": -9.29454231262207, "global_step": 96663, "epoch": 575} {"train_loss": -9.294037818908691, "global_step": 96664, "epoch": 575} {"train_loss": -8.974449157714844, "global_step": 96665, "epoch": 575} {"train_loss": -9.362363815307617, "global_step": 96666, "epoch": 575} {"train_loss": -9.373055458068848, "global_step": 96667, "epoch": 575} {"train_loss": -9.644790649414062, "global_step": 96668, "epoch": 575} {"train_loss": -9.046220779418945, "global_step": 96669, "epoch": 575} {"train_loss": -9.421879768371582, "global_step": 96670, "epoch": 575} {"train_loss": -9.520825386047363, "global_step": 96671, "epoch": 575} {"train_loss": -9.437702178955078, "global_step": 96672, "epoch": 575} {"train_loss": -9.207769393920898, "global_step": 96673, "epoch": 575} {"train_loss": -9.644709587097168, "global_step": 96674, "epoch": 575} {"train_loss": -9.43326473236084, "global_step": 96675, "epoch": 575} {"train_loss": -9.726759910583496, "global_step": 96676, "epoch": 575} {"train_loss": -9.595481872558594, "global_step": 96677, "epoch": 575} {"train_loss": -9.695731163024902, "global_step": 96678, "epoch": 575} {"train_loss": -9.57284164428711, "global_step": 96679, "epoch": 575} {"train_loss": -9.685606002807617, "global_step": 96680, "epoch": 575} {"train_loss": -9.579404830932617, "global_step": 96681, "epoch": 575} {"train_loss": -9.57608413696289, "global_step": 96682, "epoch": 575} {"train_loss": -9.562132835388184, "global_step": 96683, "epoch": 575} {"train_loss": -9.55664348602295, "global_step": 96684, "epoch": 575} {"train_loss": -9.729686737060547, "global_step": 96685, "epoch": 575} {"train_loss": -9.677544593811035, "global_step": 96686, "epoch": 575} {"train_loss": -9.649954795837402, "global_step": 96687, "epoch": 575} {"train_loss": -9.584474563598633, "global_step": 96688, "epoch": 575} {"train_loss": -9.793813705444336, "global_step": 96689, "epoch": 575} {"train_loss": -9.799232482910156, "global_step": 96690, "epoch": 575} {"train_loss": -9.790945053100586, "global_step": 96691, "epoch": 575} {"train_loss": -9.797008514404297, "global_step": 96692, "epoch": 575} {"train_loss": -9.666959762573242, "global_step": 96693, "epoch": 575} {"train_loss": -9.80191707611084, "global_step": 96694, "epoch": 575} {"train_loss": -9.502748489379883, "global_step": 96695, "epoch": 575} {"train_loss": -9.80777359008789, "global_step": 96696, "epoch": 575} {"train_loss": -9.713115692138672, "global_step": 96697, "epoch": 575} {"train_loss": -9.442306518554688, "global_step": 96698, "epoch": 575} {"train_loss": -9.710779190063477, "global_step": 96699, "epoch": 575} {"train_loss": -9.73122501373291, "global_step": 96700, "epoch": 575} {"train_loss": -9.579920768737793, "global_step": 96701, "epoch": 575} {"train_loss": -9.576486587524414, "global_step": 96702, "epoch": 575} {"train_loss": -9.855409622192383, "global_step": 96703, "epoch": 575} {"train_loss": -9.827875137329102, "global_step": 96704, "epoch": 575} {"train_loss": -9.64359188079834, "global_step": 96705, "epoch": 575} {"train_loss": -9.518770217895508, "global_step": 96706, "epoch": 575} {"train_loss": -9.976898193359375, "global_step": 96707, "epoch": 575} {"train_loss": -9.823796272277832, "global_step": 96708, "epoch": 575} {"train_loss": -9.597478866577148, "global_step": 96709, "epoch": 575} {"train_loss": -9.854488372802734, "global_step": 96710, "epoch": 575} {"train_loss": -9.568403244018555, "global_step": 96711, "epoch": 575} {"train_loss": -9.592582702636719, "global_step": 96712, "epoch": 575} {"train_loss": -9.856505393981934, "global_step": 96713, "epoch": 575} {"train_loss": -9.186868667602539, "global_step": 96714, "epoch": 575} {"train_loss": -9.904104232788086, "global_step": 96715, "epoch": 575} {"train_loss": -9.612653732299805, "global_step": 96716, "epoch": 575} {"train_loss": -9.27591323852539, "global_step": 96717, "epoch": 575} {"train_loss": -9.662125587463379, "global_step": 96718, "epoch": 575} {"train_loss": -9.198801040649414, "global_step": 96719, "epoch": 575} {"train_loss": -9.304217338562012, "global_step": 96720, "epoch": 575} {"train_loss": -9.485929489135742, "global_step": 96721, "epoch": 575} {"train_loss": -9.311769485473633, "global_step": 96722, "epoch": 575} {"train_loss": -9.759536743164062, "global_step": 96723, "epoch": 575} {"train_loss": -9.46479606628418, "global_step": 96724, "epoch": 575} {"train_loss": -9.586029052734375, "global_step": 96725, "epoch": 575} {"train_loss": -9.263821601867676, "global_step": 96726, "epoch": 575} {"train_loss": -9.71357536315918, "global_step": 96727, "epoch": 575} {"train_loss": -9.30644416809082, "global_step": 96728, "epoch": 575} {"train_loss": -9.491090774536133, "global_step": 96729, "epoch": 575} {"train_loss": -9.30168342590332, "global_step": 96730, "epoch": 575} {"train_loss": -9.428282737731934, "global_step": 96731, "epoch": 575} {"train_loss": -9.504151344299316, "global_step": 96732, "epoch": 575} {"train_loss": -9.675432205200195, "global_step": 96733, "epoch": 575} {"train_loss": -9.58498764038086, "global_step": 96734, "epoch": 575} {"train_loss": -9.805581092834473, "global_step": 96735, "epoch": 575} {"train_loss": -9.204678535461426, "global_step": 96736, "epoch": 575} {"train_loss": -9.552556991577148, "global_step": 96737, "epoch": 575} {"train_loss": -9.153637886047363, "global_step": 96738, "epoch": 575} {"train_loss": -9.57319450378418, "global_step": 96739, "epoch": 575} {"train_loss": -9.343954086303711, "global_step": 96740, "epoch": 575} {"train_loss": -9.531095504760742, "global_step": 96741, "epoch": 575} {"train_loss": -9.515946388244629, "global_step": 96742, "epoch": 575} {"train_loss": -9.649681091308594, "global_step": 96743, "epoch": 575} {"train_loss": -9.61213493347168, "global_step": 96744, "epoch": 575} {"train_loss": -9.632721900939941, "global_step": 96745, "epoch": 575} {"train_loss": -9.233312606811523, "global_step": 96746, "epoch": 575} {"train_loss": -9.54173469543457, "global_step": 96747, "epoch": 575} {"train_loss": -9.544416427612305, "global_step": 96748, "epoch": 575} {"train_loss": -9.888678550720215, "global_step": 96749, "epoch": 575} {"train_loss": -9.436233520507812, "global_step": 96750, "epoch": 575} {"train_loss": -9.919720649719238, "global_step": 96751, "epoch": 575} {"train_loss": -9.590980529785156, "global_step": 96752, "epoch": 575} {"train_loss": -9.80222225189209, "global_step": 96753, "epoch": 575} {"train_loss": -9.704675674438477, "global_step": 96754, "epoch": 575} {"train_loss": -9.479532241821289, "global_step": 96755, "epoch": 575} {"train_loss": -9.88871955871582, "global_step": 96756, "epoch": 575} {"train_loss": -9.655122756958008, "global_step": 96757, "epoch": 575} {"train_loss": -9.675273895263672, "global_step": 96758, "epoch": 575} {"train_loss": -9.657431602478027, "global_step": 96759, "epoch": 575} {"train_loss": -9.72543716430664, "global_step": 96760, "epoch": 575} {"train_loss": -9.65766716003418, "global_step": 96761, "epoch": 575} {"train_loss": -9.720405578613281, "global_step": 96762, "epoch": 575} {"train_loss": -9.628303527832031, "global_step": 96763, "epoch": 575} {"train_loss": -9.763184547424316, "global_step": 96764, "epoch": 575} {"train_loss": -9.623486518859863, "global_step": 96765, "epoch": 575} {"train_loss": -9.663433074951172, "global_step": 96766, "epoch": 575} {"train_loss": -9.533993164698282, "global_step": 96767, "epoch": 575, "val_loss": 205605.78125, "train_action_mse_error": 2.1384153366088867} {"train_loss": -9.524406433105469, "global_step": 96768, "epoch": 576} {"train_loss": -9.735306739807129, "global_step": 96769, "epoch": 576} {"train_loss": -9.505189895629883, "global_step": 96770, "epoch": 576} {"train_loss": -9.713637351989746, "global_step": 96771, "epoch": 576} {"train_loss": -9.46489143371582, "global_step": 96772, "epoch": 576} {"train_loss": -9.310893058776855, "global_step": 96773, "epoch": 576} {"train_loss": -9.745121002197266, "global_step": 96774, "epoch": 576} {"train_loss": -9.512458801269531, "global_step": 96775, "epoch": 576} {"train_loss": -9.520086288452148, "global_step": 96776, "epoch": 576} {"train_loss": -9.396261215209961, "global_step": 96777, "epoch": 576} {"train_loss": -9.180424690246582, "global_step": 96778, "epoch": 576} {"train_loss": -9.531916618347168, "global_step": 96779, "epoch": 576} {"train_loss": -9.158645629882812, "global_step": 96780, "epoch": 576} {"train_loss": -9.538509368896484, "global_step": 96781, "epoch": 576} {"train_loss": -9.300383567810059, "global_step": 96782, "epoch": 576} {"train_loss": -9.41925048828125, "global_step": 96783, "epoch": 576} {"train_loss": -9.18913459777832, "global_step": 96784, "epoch": 576} {"train_loss": -9.251983642578125, "global_step": 96785, "epoch": 576} {"train_loss": -9.255807876586914, "global_step": 96786, "epoch": 576} {"train_loss": -9.433126449584961, "global_step": 96787, "epoch": 576} {"train_loss": -9.60064697265625, "global_step": 96788, "epoch": 576} {"train_loss": -9.464643478393555, "global_step": 96789, "epoch": 576} {"train_loss": -9.422689437866211, "global_step": 96790, "epoch": 576} {"train_loss": -9.355975151062012, "global_step": 96791, "epoch": 576} {"train_loss": -9.605740547180176, "global_step": 96792, "epoch": 576} {"train_loss": -9.59605598449707, "global_step": 96793, "epoch": 576} {"train_loss": -9.59857177734375, "global_step": 96794, "epoch": 576} {"train_loss": -9.704244613647461, "global_step": 96795, "epoch": 576} {"train_loss": -9.316856384277344, "global_step": 96796, "epoch": 576} {"train_loss": -9.422080993652344, "global_step": 96797, "epoch": 576} {"train_loss": -9.72030258178711, "global_step": 96798, "epoch": 576} {"train_loss": -9.276514053344727, "global_step": 96799, "epoch": 576} {"train_loss": -9.506206512451172, "global_step": 96800, "epoch": 576} {"train_loss": -9.71835708618164, "global_step": 96801, "epoch": 576} {"train_loss": -9.565641403198242, "global_step": 96802, "epoch": 576} {"train_loss": -9.474902153015137, "global_step": 96803, "epoch": 576} {"train_loss": -9.440343856811523, "global_step": 96804, "epoch": 576} {"train_loss": -9.559946060180664, "global_step": 96805, "epoch": 576} {"train_loss": -9.580900192260742, "global_step": 96806, "epoch": 576} {"train_loss": -9.713106155395508, "global_step": 96807, "epoch": 576} {"train_loss": -9.715538024902344, "global_step": 96808, "epoch": 576} {"train_loss": -9.947839736938477, "global_step": 96809, "epoch": 576} {"train_loss": -9.654224395751953, "global_step": 96810, "epoch": 576} {"train_loss": -9.745506286621094, "global_step": 96811, "epoch": 576} {"train_loss": -9.655184745788574, "global_step": 96812, "epoch": 576} {"train_loss": -9.827032089233398, "global_step": 96813, "epoch": 576} {"train_loss": -9.637916564941406, "global_step": 96814, "epoch": 576} {"train_loss": -9.729737281799316, "global_step": 96815, "epoch": 576} {"train_loss": -9.836551666259766, "global_step": 96816, "epoch": 576} {"train_loss": -9.871593475341797, "global_step": 96817, "epoch": 576} {"train_loss": -9.935405731201172, "global_step": 96818, "epoch": 576} {"train_loss": -9.916213035583496, "global_step": 96819, "epoch": 576} {"train_loss": -9.874443054199219, "global_step": 96820, "epoch": 576} {"train_loss": -9.68288516998291, "global_step": 96821, "epoch": 576} {"train_loss": -9.7743558883667, "global_step": 96822, "epoch": 576} {"train_loss": -9.815942764282227, "global_step": 96823, "epoch": 576} {"train_loss": -9.954727172851562, "global_step": 96824, "epoch": 576} {"train_loss": -9.668128967285156, "global_step": 96825, "epoch": 576} {"train_loss": -9.32174301147461, "global_step": 96826, "epoch": 576} {"train_loss": -9.450698852539062, "global_step": 96827, "epoch": 576} {"train_loss": -9.892033576965332, "global_step": 96828, "epoch": 576} {"train_loss": -9.40129280090332, "global_step": 96829, "epoch": 576} {"train_loss": -10.001178741455078, "global_step": 96830, "epoch": 576} {"train_loss": -9.761903762817383, "global_step": 96831, "epoch": 576} {"train_loss": -9.632119178771973, "global_step": 96832, "epoch": 576} {"train_loss": -9.67760181427002, "global_step": 96833, "epoch": 576} {"train_loss": -9.395952224731445, "global_step": 96834, "epoch": 576} {"train_loss": -9.50007152557373, "global_step": 96835, "epoch": 576} {"train_loss": -9.971807479858398, "global_step": 96836, "epoch": 576} {"train_loss": -9.302864074707031, "global_step": 96837, "epoch": 576} {"train_loss": -9.534646987915039, "global_step": 96838, "epoch": 576} {"train_loss": -9.374198913574219, "global_step": 96839, "epoch": 576} {"train_loss": -9.679389953613281, "global_step": 96840, "epoch": 576} {"train_loss": -9.58409309387207, "global_step": 96841, "epoch": 576} {"train_loss": -9.677616119384766, "global_step": 96842, "epoch": 576} {"train_loss": -9.590502738952637, "global_step": 96843, "epoch": 576} {"train_loss": -9.58713436126709, "global_step": 96844, "epoch": 576} {"train_loss": -9.454916000366211, "global_step": 96845, "epoch": 576} {"train_loss": -9.474066734313965, "global_step": 96846, "epoch": 576} {"train_loss": -9.482046127319336, "global_step": 96847, "epoch": 576} {"train_loss": -9.320679664611816, "global_step": 96848, "epoch": 576} {"train_loss": -9.54538345336914, "global_step": 96849, "epoch": 576} {"train_loss": -9.617053985595703, "global_step": 96850, "epoch": 576} {"train_loss": -9.603967666625977, "global_step": 96851, "epoch": 576} {"train_loss": -9.171934127807617, "global_step": 96852, "epoch": 576} {"train_loss": -9.399480819702148, "global_step": 96853, "epoch": 576} {"train_loss": -9.487805366516113, "global_step": 96854, "epoch": 576} {"train_loss": -9.430830001831055, "global_step": 96855, "epoch": 576} {"train_loss": -9.691964149475098, "global_step": 96856, "epoch": 576} {"train_loss": -9.514945983886719, "global_step": 96857, "epoch": 576} {"train_loss": -9.763976097106934, "global_step": 96858, "epoch": 576} {"train_loss": -9.98826789855957, "global_step": 96859, "epoch": 576} {"train_loss": -9.662786483764648, "global_step": 96860, "epoch": 576} {"train_loss": -9.643571853637695, "global_step": 96861, "epoch": 576} {"train_loss": -9.513675689697266, "global_step": 96862, "epoch": 576} {"train_loss": -9.643070220947266, "global_step": 96863, "epoch": 576} {"train_loss": -9.686595916748047, "global_step": 96864, "epoch": 576} {"train_loss": -9.573517799377441, "global_step": 96865, "epoch": 576} {"train_loss": -9.63502025604248, "global_step": 96866, "epoch": 576} {"train_loss": -9.627724647521973, "global_step": 96867, "epoch": 576} {"train_loss": -9.8222074508667, "global_step": 96868, "epoch": 576} {"train_loss": -9.732239723205566, "global_step": 96869, "epoch": 576} {"train_loss": -9.75920295715332, "global_step": 96870, "epoch": 576} {"train_loss": -9.69890022277832, "global_step": 96871, "epoch": 576} {"train_loss": -9.773804664611816, "global_step": 96872, "epoch": 576} {"train_loss": -9.6984224319458, "global_step": 96873, "epoch": 576} {"train_loss": -9.937128067016602, "global_step": 96874, "epoch": 576} {"train_loss": -9.98084831237793, "global_step": 96875, "epoch": 576} {"train_loss": -9.651495933532715, "global_step": 96876, "epoch": 576} {"train_loss": -9.67216968536377, "global_step": 96877, "epoch": 576} {"train_loss": -9.3859224319458, "global_step": 96878, "epoch": 576} {"train_loss": -9.336931228637695, "global_step": 96879, "epoch": 576} {"train_loss": -9.796228408813477, "global_step": 96880, "epoch": 576} {"train_loss": -9.540082931518555, "global_step": 96881, "epoch": 576} {"train_loss": -9.436017990112305, "global_step": 96882, "epoch": 576} {"train_loss": -9.738265991210938, "global_step": 96883, "epoch": 576} {"train_loss": -9.865823745727539, "global_step": 96884, "epoch": 576} {"train_loss": -9.592029571533203, "global_step": 96885, "epoch": 576} {"train_loss": -9.434114456176758, "global_step": 96886, "epoch": 576} {"train_loss": -9.540510177612305, "global_step": 96887, "epoch": 576} {"train_loss": -9.383865356445312, "global_step": 96888, "epoch": 576} {"train_loss": -9.437435150146484, "global_step": 96889, "epoch": 576} {"train_loss": -9.758613586425781, "global_step": 96890, "epoch": 576} {"train_loss": -9.607656478881836, "global_step": 96891, "epoch": 576} {"train_loss": -9.47785758972168, "global_step": 96892, "epoch": 576} {"train_loss": -9.711015701293945, "global_step": 96893, "epoch": 576} {"train_loss": -9.523122787475586, "global_step": 96894, "epoch": 576} {"train_loss": -9.787429809570312, "global_step": 96895, "epoch": 576} {"train_loss": -9.623027801513672, "global_step": 96896, "epoch": 576} {"train_loss": -9.812224388122559, "global_step": 96897, "epoch": 576} {"train_loss": -9.581769943237305, "global_step": 96898, "epoch": 576} {"train_loss": -9.831530570983887, "global_step": 96899, "epoch": 576} {"train_loss": -9.770650863647461, "global_step": 96900, "epoch": 576} {"train_loss": -9.746796607971191, "global_step": 96901, "epoch": 576} {"train_loss": -9.844865798950195, "global_step": 96902, "epoch": 576} {"train_loss": -9.869504928588867, "global_step": 96903, "epoch": 576} {"train_loss": -9.715489387512207, "global_step": 96904, "epoch": 576} {"train_loss": -9.675092697143555, "global_step": 96905, "epoch": 576} {"train_loss": -9.777963638305664, "global_step": 96906, "epoch": 576} {"train_loss": -9.721473693847656, "global_step": 96907, "epoch": 576} {"train_loss": -9.494413375854492, "global_step": 96908, "epoch": 576} {"train_loss": -9.744440078735352, "global_step": 96909, "epoch": 576} {"train_loss": -9.74930477142334, "global_step": 96910, "epoch": 576} {"train_loss": -9.584953308105469, "global_step": 96911, "epoch": 576} {"train_loss": -9.6661958694458, "global_step": 96912, "epoch": 576} {"train_loss": -9.60913372039795, "global_step": 96913, "epoch": 576} {"train_loss": -9.758719444274902, "global_step": 96914, "epoch": 576} {"train_loss": -9.637819290161133, "global_step": 96915, "epoch": 576} {"train_loss": -9.348642349243164, "global_step": 96916, "epoch": 576} {"train_loss": -9.937239646911621, "global_step": 96917, "epoch": 576} {"train_loss": -9.39474868774414, "global_step": 96918, "epoch": 576} {"train_loss": -9.628376007080078, "global_step": 96919, "epoch": 576} {"train_loss": -9.6220703125, "global_step": 96920, "epoch": 576} {"train_loss": -9.372011184692383, "global_step": 96921, "epoch": 576} {"train_loss": -9.814577102661133, "global_step": 96922, "epoch": 576} {"train_loss": -9.53466510772705, "global_step": 96923, "epoch": 576} {"train_loss": -9.490659713745117, "global_step": 96924, "epoch": 576} {"train_loss": -9.347976684570312, "global_step": 96925, "epoch": 576} {"train_loss": -9.334214210510254, "global_step": 96926, "epoch": 576} {"train_loss": -9.831436157226562, "global_step": 96927, "epoch": 576} {"train_loss": -9.494019508361816, "global_step": 96928, "epoch": 576} {"train_loss": -9.472301483154297, "global_step": 96929, "epoch": 576} {"train_loss": -9.58993911743164, "global_step": 96930, "epoch": 576} {"train_loss": -9.254182815551758, "global_step": 96931, "epoch": 576} {"train_loss": -9.705718040466309, "global_step": 96932, "epoch": 576} {"train_loss": -9.49135971069336, "global_step": 96933, "epoch": 576} {"train_loss": -9.784137725830078, "global_step": 96934, "epoch": 576} {"train_loss": -9.601641779854184, "global_step": 96935, "epoch": 576, "val_loss": 207280.515625} {"train_loss": -9.621185302734375, "global_step": 96936, "epoch": 577} {"train_loss": -9.412660598754883, "global_step": 96937, "epoch": 577} {"train_loss": -9.891839981079102, "global_step": 96938, "epoch": 577} {"train_loss": -9.676301002502441, "global_step": 96939, "epoch": 577} {"train_loss": -9.756637573242188, "global_step": 96940, "epoch": 577} {"train_loss": -9.594078063964844, "global_step": 96941, "epoch": 577} {"train_loss": -9.667323112487793, "global_step": 96942, "epoch": 577} {"train_loss": -9.595745086669922, "global_step": 96943, "epoch": 577} {"train_loss": -9.643148422241211, "global_step": 96944, "epoch": 577} {"train_loss": -9.573027610778809, "global_step": 96945, "epoch": 577} {"train_loss": -9.311223983764648, "global_step": 96946, "epoch": 577} {"train_loss": -9.62076473236084, "global_step": 96947, "epoch": 577} {"train_loss": -8.885066032409668, "global_step": 96948, "epoch": 577} {"train_loss": -9.584105491638184, "global_step": 96949, "epoch": 577} {"train_loss": -9.404770851135254, "global_step": 96950, "epoch": 577} {"train_loss": -9.46546745300293, "global_step": 96951, "epoch": 577} {"train_loss": -9.444786071777344, "global_step": 96952, "epoch": 577} {"train_loss": -9.58702564239502, "global_step": 96953, "epoch": 577} {"train_loss": -9.532968521118164, "global_step": 96954, "epoch": 577} {"train_loss": -9.641314506530762, "global_step": 96955, "epoch": 577} {"train_loss": -9.590851783752441, "global_step": 96956, "epoch": 577} {"train_loss": -9.524795532226562, "global_step": 96957, "epoch": 577} {"train_loss": -9.642614364624023, "global_step": 96958, "epoch": 577} {"train_loss": -9.904829025268555, "global_step": 96959, "epoch": 577} {"train_loss": -9.492191314697266, "global_step": 96960, "epoch": 577} {"train_loss": -9.397781372070312, "global_step": 96961, "epoch": 577} {"train_loss": -9.656429290771484, "global_step": 96962, "epoch": 577} {"train_loss": -9.370762825012207, "global_step": 96963, "epoch": 577} {"train_loss": -9.756200790405273, "global_step": 96964, "epoch": 577} {"train_loss": -9.595821380615234, "global_step": 96965, "epoch": 577} {"train_loss": -9.610211372375488, "global_step": 96966, "epoch": 577} {"train_loss": -9.861207962036133, "global_step": 96967, "epoch": 577} {"train_loss": -9.61962890625, "global_step": 96968, "epoch": 577} {"train_loss": -9.393575668334961, "global_step": 96969, "epoch": 577} {"train_loss": -9.656116485595703, "global_step": 96970, "epoch": 577} {"train_loss": -9.700468063354492, "global_step": 96971, "epoch": 577} {"train_loss": -9.478063583374023, "global_step": 96972, "epoch": 577} {"train_loss": -9.891084671020508, "global_step": 96973, "epoch": 577} {"train_loss": -9.587318420410156, "global_step": 96974, "epoch": 577} {"train_loss": -9.515769958496094, "global_step": 96975, "epoch": 577} {"train_loss": -9.825998306274414, "global_step": 96976, "epoch": 577} {"train_loss": -9.418198585510254, "global_step": 96977, "epoch": 577} {"train_loss": -9.558006286621094, "global_step": 96978, "epoch": 577} {"train_loss": -9.781267166137695, "global_step": 96979, "epoch": 577} {"train_loss": -9.291963577270508, "global_step": 96980, "epoch": 577} {"train_loss": -9.525117874145508, "global_step": 96981, "epoch": 577} {"train_loss": -9.377859115600586, "global_step": 96982, "epoch": 577} {"train_loss": -9.481328964233398, "global_step": 96983, "epoch": 577} {"train_loss": -9.19748592376709, "global_step": 96984, "epoch": 577} {"train_loss": -9.684061050415039, "global_step": 96985, "epoch": 577} {"train_loss": -9.572425842285156, "global_step": 96986, "epoch": 577} {"train_loss": -9.151409149169922, "global_step": 96987, "epoch": 577} {"train_loss": -9.504871368408203, "global_step": 96988, "epoch": 577} {"train_loss": -9.396797180175781, "global_step": 96989, "epoch": 577} {"train_loss": -9.409477233886719, "global_step": 96990, "epoch": 577} {"train_loss": -9.644051551818848, "global_step": 96991, "epoch": 577} {"train_loss": -9.272012710571289, "global_step": 96992, "epoch": 577} {"train_loss": -9.928167343139648, "global_step": 96993, "epoch": 577} {"train_loss": -9.138533592224121, "global_step": 96994, "epoch": 577} {"train_loss": -9.559501647949219, "global_step": 96995, "epoch": 577} {"train_loss": -9.315109252929688, "global_step": 96996, "epoch": 577} {"train_loss": -9.56982421875, "global_step": 96997, "epoch": 577} {"train_loss": -9.542701721191406, "global_step": 96998, "epoch": 577} {"train_loss": -9.733566284179688, "global_step": 96999, "epoch": 577} {"train_loss": -9.410346031188965, "global_step": 97000, "epoch": 577} {"train_loss": -9.57908821105957, "global_step": 97001, "epoch": 577} {"train_loss": -9.4541015625, "global_step": 97002, "epoch": 577} {"train_loss": -9.432945251464844, "global_step": 97003, "epoch": 577} {"train_loss": -9.30265998840332, "global_step": 97004, "epoch": 577} {"train_loss": -9.881872177124023, "global_step": 97005, "epoch": 577} {"train_loss": -9.569613456726074, "global_step": 97006, "epoch": 577} {"train_loss": -9.425848007202148, "global_step": 97007, "epoch": 577} {"train_loss": -9.343799591064453, "global_step": 97008, "epoch": 577} {"train_loss": -9.572388648986816, "global_step": 97009, "epoch": 577} {"train_loss": -9.35809326171875, "global_step": 97010, "epoch": 577} {"train_loss": -9.636314392089844, "global_step": 97011, "epoch": 577} {"train_loss": -9.688848495483398, "global_step": 97012, "epoch": 577} {"train_loss": -9.019131660461426, "global_step": 97013, "epoch": 577} {"train_loss": -9.425708770751953, "global_step": 97014, "epoch": 577} {"train_loss": -9.362926483154297, "global_step": 97015, "epoch": 577} {"train_loss": -9.3753662109375, "global_step": 97016, "epoch": 577} {"train_loss": -9.68212890625, "global_step": 97017, "epoch": 577} {"train_loss": -9.591205596923828, "global_step": 97018, "epoch": 577} {"train_loss": -9.614847183227539, "global_step": 97019, "epoch": 577} {"train_loss": -9.569021224975586, "global_step": 97020, "epoch": 577} {"train_loss": -9.765277862548828, "global_step": 97021, "epoch": 577} {"train_loss": -9.527875900268555, "global_step": 97022, "epoch": 577} {"train_loss": -9.529050827026367, "global_step": 97023, "epoch": 577} {"train_loss": -9.573721885681152, "global_step": 97024, "epoch": 577} {"train_loss": -9.81872272491455, "global_step": 97025, "epoch": 577} {"train_loss": -9.641393661499023, "global_step": 97026, "epoch": 577} {"train_loss": -9.83529281616211, "global_step": 97027, "epoch": 577} {"train_loss": -9.757352828979492, "global_step": 97028, "epoch": 577} {"train_loss": -9.426673889160156, "global_step": 97029, "epoch": 577} {"train_loss": -9.860946655273438, "global_step": 97030, "epoch": 577} {"train_loss": -9.661006927490234, "global_step": 97031, "epoch": 577} {"train_loss": -9.737066268920898, "global_step": 97032, "epoch": 577} {"train_loss": -9.484857559204102, "global_step": 97033, "epoch": 577} {"train_loss": -9.588492393493652, "global_step": 97034, "epoch": 577} {"train_loss": -9.440814018249512, "global_step": 97035, "epoch": 577} {"train_loss": -9.521259307861328, "global_step": 97036, "epoch": 577} {"train_loss": -9.43698501586914, "global_step": 97037, "epoch": 577} {"train_loss": -9.651433944702148, "global_step": 97038, "epoch": 577} {"train_loss": -9.293863296508789, "global_step": 97039, "epoch": 577} {"train_loss": -9.641626358032227, "global_step": 97040, "epoch": 577} {"train_loss": -9.110437393188477, "global_step": 97041, "epoch": 577} {"train_loss": -9.561765670776367, "global_step": 97042, "epoch": 577} {"train_loss": -9.36752986907959, "global_step": 97043, "epoch": 577} {"train_loss": -9.225746154785156, "global_step": 97044, "epoch": 577} {"train_loss": -9.173768997192383, "global_step": 97045, "epoch": 577} {"train_loss": -9.498213768005371, "global_step": 97046, "epoch": 577} {"train_loss": -9.489269256591797, "global_step": 97047, "epoch": 577} {"train_loss": -9.288534164428711, "global_step": 97048, "epoch": 577} {"train_loss": -9.698396682739258, "global_step": 97049, "epoch": 577} {"train_loss": -9.454130172729492, "global_step": 97050, "epoch": 577} {"train_loss": -9.617565155029297, "global_step": 97051, "epoch": 577} {"train_loss": -9.572959899902344, "global_step": 97052, "epoch": 577} {"train_loss": -9.609956741333008, "global_step": 97053, "epoch": 577} {"train_loss": -9.46918773651123, "global_step": 97054, "epoch": 577} {"train_loss": -9.479055404663086, "global_step": 97055, "epoch": 577} {"train_loss": -9.444742202758789, "global_step": 97056, "epoch": 577} {"train_loss": -9.80816650390625, "global_step": 97057, "epoch": 577} {"train_loss": -9.671241760253906, "global_step": 97058, "epoch": 577} {"train_loss": -9.512659072875977, "global_step": 97059, "epoch": 577} {"train_loss": -9.893794059753418, "global_step": 97060, "epoch": 577} {"train_loss": -9.647560119628906, "global_step": 97061, "epoch": 577} {"train_loss": -9.565107345581055, "global_step": 97062, "epoch": 577} {"train_loss": -9.557022094726562, "global_step": 97063, "epoch": 577} {"train_loss": -9.710416793823242, "global_step": 97064, "epoch": 577} {"train_loss": -9.69973373413086, "global_step": 97065, "epoch": 577} {"train_loss": -9.840744972229004, "global_step": 97066, "epoch": 577} {"train_loss": -9.762715339660645, "global_step": 97067, "epoch": 577} {"train_loss": -9.71008014678955, "global_step": 97068, "epoch": 577} {"train_loss": -9.817620277404785, "global_step": 97069, "epoch": 577} {"train_loss": -9.678142547607422, "global_step": 97070, "epoch": 577} {"train_loss": -9.805732727050781, "global_step": 97071, "epoch": 577} {"train_loss": -9.803583145141602, "global_step": 97072, "epoch": 577} {"train_loss": -9.537687301635742, "global_step": 97073, "epoch": 577} {"train_loss": -9.38636589050293, "global_step": 97074, "epoch": 577} {"train_loss": -9.415960311889648, "global_step": 97075, "epoch": 577} {"train_loss": -9.548470497131348, "global_step": 97076, "epoch": 577} {"train_loss": -9.60256576538086, "global_step": 97077, "epoch": 577} {"train_loss": -9.548942565917969, "global_step": 97078, "epoch": 577} {"train_loss": -9.44117546081543, "global_step": 97079, "epoch": 577} {"train_loss": -9.463937759399414, "global_step": 97080, "epoch": 577} {"train_loss": -9.828104019165039, "global_step": 97081, "epoch": 577} {"train_loss": -9.694818496704102, "global_step": 97082, "epoch": 577} {"train_loss": -9.519372940063477, "global_step": 97083, "epoch": 577} {"train_loss": -9.412633895874023, "global_step": 97084, "epoch": 577} {"train_loss": -9.319487571716309, "global_step": 97085, "epoch": 577} {"train_loss": -9.316787719726562, "global_step": 97086, "epoch": 577} {"train_loss": -9.378280639648438, "global_step": 97087, "epoch": 577} {"train_loss": -9.395461082458496, "global_step": 97088, "epoch": 577} {"train_loss": -8.992924690246582, "global_step": 97089, "epoch": 577} {"train_loss": -9.53787612915039, "global_step": 97090, "epoch": 577} {"train_loss": -9.303059577941895, "global_step": 97091, "epoch": 577} {"train_loss": -9.32038402557373, "global_step": 97092, "epoch": 577} {"train_loss": -9.45145034790039, "global_step": 97093, "epoch": 577} {"train_loss": -9.321354866027832, "global_step": 97094, "epoch": 577} {"train_loss": -9.263114929199219, "global_step": 97095, "epoch": 577} {"train_loss": -9.50728988647461, "global_step": 97096, "epoch": 577} {"train_loss": -9.296792984008789, "global_step": 97097, "epoch": 577} {"train_loss": -9.268937110900879, "global_step": 97098, "epoch": 577} {"train_loss": -9.78693962097168, "global_step": 97099, "epoch": 577} {"train_loss": -9.518621444702148, "global_step": 97100, "epoch": 577} {"train_loss": -9.567566871643066, "global_step": 97101, "epoch": 577} {"train_loss": -9.601505279541016, "global_step": 97102, "epoch": 577} {"train_loss": -9.537716570354643, "global_step": 97103, "epoch": 577, "val_loss": 205597.75} {"train_loss": -9.655171394348145, "global_step": 97104, "epoch": 578} {"train_loss": -9.447906494140625, "global_step": 97105, "epoch": 578} {"train_loss": -9.712039947509766, "global_step": 97106, "epoch": 578} {"train_loss": -9.560311317443848, "global_step": 97107, "epoch": 578} {"train_loss": -9.669947624206543, "global_step": 97108, "epoch": 578} {"train_loss": -9.813800811767578, "global_step": 97109, "epoch": 578} {"train_loss": -9.518377304077148, "global_step": 97110, "epoch": 578} {"train_loss": -9.511531829833984, "global_step": 97111, "epoch": 578} {"train_loss": -9.899887084960938, "global_step": 97112, "epoch": 578} {"train_loss": -9.717634201049805, "global_step": 97113, "epoch": 578} {"train_loss": -9.894309997558594, "global_step": 97114, "epoch": 578} {"train_loss": -9.840373992919922, "global_step": 97115, "epoch": 578} {"train_loss": -9.509048461914062, "global_step": 97116, "epoch": 578} {"train_loss": -9.556200981140137, "global_step": 97117, "epoch": 578} {"train_loss": -9.865743637084961, "global_step": 97118, "epoch": 578} {"train_loss": -9.56946849822998, "global_step": 97119, "epoch": 578} {"train_loss": -9.758200645446777, "global_step": 97120, "epoch": 578} {"train_loss": -9.71010971069336, "global_step": 97121, "epoch": 578} {"train_loss": -9.58659839630127, "global_step": 97122, "epoch": 578} {"train_loss": -9.65306282043457, "global_step": 97123, "epoch": 578} {"train_loss": -9.533315658569336, "global_step": 97124, "epoch": 578} {"train_loss": -9.652509689331055, "global_step": 97125, "epoch": 578} {"train_loss": -9.529787063598633, "global_step": 97126, "epoch": 578} {"train_loss": -9.482243537902832, "global_step": 97127, "epoch": 578} {"train_loss": -9.946595191955566, "global_step": 97128, "epoch": 578} {"train_loss": -9.739526748657227, "global_step": 97129, "epoch": 578} {"train_loss": -9.925898551940918, "global_step": 97130, "epoch": 578} {"train_loss": -9.715215682983398, "global_step": 97131, "epoch": 578} {"train_loss": -10.120681762695312, "global_step": 97132, "epoch": 578} {"train_loss": -9.822908401489258, "global_step": 97133, "epoch": 578} {"train_loss": -9.902562141418457, "global_step": 97134, "epoch": 578} {"train_loss": -9.944077491760254, "global_step": 97135, "epoch": 578} {"train_loss": -9.957745552062988, "global_step": 97136, "epoch": 578} {"train_loss": -9.646453857421875, "global_step": 97137, "epoch": 578} {"train_loss": -9.97589111328125, "global_step": 97138, "epoch": 578} {"train_loss": -9.914791107177734, "global_step": 97139, "epoch": 578} {"train_loss": -9.949183464050293, "global_step": 97140, "epoch": 578} {"train_loss": -10.067791938781738, "global_step": 97141, "epoch": 578} {"train_loss": -9.513537406921387, "global_step": 97142, "epoch": 578} {"train_loss": -9.209711074829102, "global_step": 97143, "epoch": 578} {"train_loss": -9.492504119873047, "global_step": 97144, "epoch": 578} {"train_loss": -9.330436706542969, "global_step": 97145, "epoch": 578} {"train_loss": -9.183902740478516, "global_step": 97146, "epoch": 578} {"train_loss": -9.534214973449707, "global_step": 97147, "epoch": 578} {"train_loss": -9.575369834899902, "global_step": 97148, "epoch": 578} {"train_loss": -8.917482376098633, "global_step": 97149, "epoch": 578} {"train_loss": -9.55859661102295, "global_step": 97150, "epoch": 578} {"train_loss": -9.145359992980957, "global_step": 97151, "epoch": 578} {"train_loss": -9.198195457458496, "global_step": 97152, "epoch": 578} {"train_loss": -9.610727310180664, "global_step": 97153, "epoch": 578} {"train_loss": -9.080297470092773, "global_step": 97154, "epoch": 578} {"train_loss": -9.260024070739746, "global_step": 97155, "epoch": 578} {"train_loss": -9.163677215576172, "global_step": 97156, "epoch": 578} {"train_loss": -9.493829727172852, "global_step": 97157, "epoch": 578} {"train_loss": -9.46200942993164, "global_step": 97158, "epoch": 578} {"train_loss": -9.46368408203125, "global_step": 97159, "epoch": 578} {"train_loss": -9.532022476196289, "global_step": 97160, "epoch": 578} {"train_loss": -9.688499450683594, "global_step": 97161, "epoch": 578} {"train_loss": -9.363472938537598, "global_step": 97162, "epoch": 578} {"train_loss": -9.477147102355957, "global_step": 97163, "epoch": 578} {"train_loss": -9.510136604309082, "global_step": 97164, "epoch": 578} {"train_loss": -9.343335151672363, "global_step": 97165, "epoch": 578} {"train_loss": -9.447929382324219, "global_step": 97166, "epoch": 578} {"train_loss": -9.349618911743164, "global_step": 97167, "epoch": 578} {"train_loss": -9.448473930358887, "global_step": 97168, "epoch": 578} {"train_loss": -9.525274276733398, "global_step": 97169, "epoch": 578} {"train_loss": -9.2814302444458, "global_step": 97170, "epoch": 578} {"train_loss": -9.729324340820312, "global_step": 97171, "epoch": 578} {"train_loss": -9.196688652038574, "global_step": 97172, "epoch": 578} {"train_loss": -9.726264953613281, "global_step": 97173, "epoch": 578} {"train_loss": -9.485971450805664, "global_step": 97174, "epoch": 578} {"train_loss": -9.771238327026367, "global_step": 97175, "epoch": 578} {"train_loss": -9.416242599487305, "global_step": 97176, "epoch": 578} {"train_loss": -10.012999534606934, "global_step": 97177, "epoch": 578} {"train_loss": -9.390137672424316, "global_step": 97178, "epoch": 578} {"train_loss": -9.386890411376953, "global_step": 97179, "epoch": 578} {"train_loss": -9.501188278198242, "global_step": 97180, "epoch": 578} {"train_loss": -9.61828327178955, "global_step": 97181, "epoch": 578} {"train_loss": -9.598325729370117, "global_step": 97182, "epoch": 578} {"train_loss": -9.7670316696167, "global_step": 97183, "epoch": 578} {"train_loss": -9.70356559753418, "global_step": 97184, "epoch": 578} {"train_loss": -9.607619285583496, "global_step": 97185, "epoch": 578} {"train_loss": -9.870025634765625, "global_step": 97186, "epoch": 578} {"train_loss": -9.877195358276367, "global_step": 97187, "epoch": 578} {"train_loss": -9.655618667602539, "global_step": 97188, "epoch": 578} {"train_loss": -9.832250595092773, "global_step": 97189, "epoch": 578} {"train_loss": -9.740421295166016, "global_step": 97190, "epoch": 578} {"train_loss": -9.845417976379395, "global_step": 97191, "epoch": 578} {"train_loss": -9.939157485961914, "global_step": 97192, "epoch": 578} {"train_loss": -9.538164138793945, "global_step": 97193, "epoch": 578} {"train_loss": -9.637147903442383, "global_step": 97194, "epoch": 578} {"train_loss": -9.937562942504883, "global_step": 97195, "epoch": 578} {"train_loss": -9.589374542236328, "global_step": 97196, "epoch": 578} {"train_loss": -9.545220375061035, "global_step": 97197, "epoch": 578} {"train_loss": -9.777566909790039, "global_step": 97198, "epoch": 578} {"train_loss": -9.836095809936523, "global_step": 97199, "epoch": 578} {"train_loss": -9.706499099731445, "global_step": 97200, "epoch": 578} {"train_loss": -9.818060874938965, "global_step": 97201, "epoch": 578} {"train_loss": -9.572805404663086, "global_step": 97202, "epoch": 578} {"train_loss": -9.74583911895752, "global_step": 97203, "epoch": 578} {"train_loss": -9.63278865814209, "global_step": 97204, "epoch": 578} {"train_loss": -9.732176780700684, "global_step": 97205, "epoch": 578} {"train_loss": -9.593791961669922, "global_step": 97206, "epoch": 578} {"train_loss": -9.36790943145752, "global_step": 97207, "epoch": 578} {"train_loss": -9.779556274414062, "global_step": 97208, "epoch": 578} {"train_loss": -9.368600845336914, "global_step": 97209, "epoch": 578} {"train_loss": -9.338582038879395, "global_step": 97210, "epoch": 578} {"train_loss": -9.722655296325684, "global_step": 97211, "epoch": 578} {"train_loss": -9.45011043548584, "global_step": 97212, "epoch": 578} {"train_loss": -9.728558540344238, "global_step": 97213, "epoch": 578} {"train_loss": -9.826821327209473, "global_step": 97214, "epoch": 578} {"train_loss": -9.362435340881348, "global_step": 97215, "epoch": 578} {"train_loss": -9.664434432983398, "global_step": 97216, "epoch": 578} {"train_loss": -9.517473220825195, "global_step": 97217, "epoch": 578} {"train_loss": -9.374961853027344, "global_step": 97218, "epoch": 578} {"train_loss": -9.788911819458008, "global_step": 97219, "epoch": 578} {"train_loss": -9.422208786010742, "global_step": 97220, "epoch": 578} {"train_loss": -9.625676155090332, "global_step": 97221, "epoch": 578} {"train_loss": -9.667318344116211, "global_step": 97222, "epoch": 578} {"train_loss": -9.784794807434082, "global_step": 97223, "epoch": 578} {"train_loss": -9.590518951416016, "global_step": 97224, "epoch": 578} {"train_loss": -9.649908065795898, "global_step": 97225, "epoch": 578} {"train_loss": -9.63680648803711, "global_step": 97226, "epoch": 578} {"train_loss": -9.970998764038086, "global_step": 97227, "epoch": 578} {"train_loss": -9.89295768737793, "global_step": 97228, "epoch": 578} {"train_loss": -9.594498634338379, "global_step": 97229, "epoch": 578} {"train_loss": -9.826507568359375, "global_step": 97230, "epoch": 578} {"train_loss": -9.771110534667969, "global_step": 97231, "epoch": 578} {"train_loss": -9.895866394042969, "global_step": 97232, "epoch": 578} {"train_loss": -9.600883483886719, "global_step": 97233, "epoch": 578} {"train_loss": -9.925832748413086, "global_step": 97234, "epoch": 578} {"train_loss": -9.532917022705078, "global_step": 97235, "epoch": 578} {"train_loss": -9.745018005371094, "global_step": 97236, "epoch": 578} {"train_loss": -9.643655776977539, "global_step": 97237, "epoch": 578} {"train_loss": -9.713632583618164, "global_step": 97238, "epoch": 578} {"train_loss": -9.612508773803711, "global_step": 97239, "epoch": 578} {"train_loss": -9.60598373413086, "global_step": 97240, "epoch": 578} {"train_loss": -9.799224853515625, "global_step": 97241, "epoch": 578} {"train_loss": -9.628170013427734, "global_step": 97242, "epoch": 578} {"train_loss": -9.87571907043457, "global_step": 97243, "epoch": 578} {"train_loss": -9.712738990783691, "global_step": 97244, "epoch": 578} {"train_loss": -9.743894577026367, "global_step": 97245, "epoch": 578} {"train_loss": -9.973700523376465, "global_step": 97246, "epoch": 578} {"train_loss": -9.710949897766113, "global_step": 97247, "epoch": 578} {"train_loss": -9.613703727722168, "global_step": 97248, "epoch": 578} {"train_loss": -9.695642471313477, "global_step": 97249, "epoch": 578} {"train_loss": -9.859517097473145, "global_step": 97250, "epoch": 578} {"train_loss": -9.758342742919922, "global_step": 97251, "epoch": 578} {"train_loss": -9.768718719482422, "global_step": 97252, "epoch": 578} {"train_loss": -9.858261108398438, "global_step": 97253, "epoch": 578} {"train_loss": -9.257312774658203, "global_step": 97254, "epoch": 578} {"train_loss": -9.408032417297363, "global_step": 97255, "epoch": 578} {"train_loss": -8.966657638549805, "global_step": 97256, "epoch": 578} {"train_loss": -9.773049354553223, "global_step": 97257, "epoch": 578} {"train_loss": -9.307453155517578, "global_step": 97258, "epoch": 578} {"train_loss": -9.449963569641113, "global_step": 97259, "epoch": 578} {"train_loss": -9.510723114013672, "global_step": 97260, "epoch": 578} {"train_loss": -9.298259735107422, "global_step": 97261, "epoch": 578} {"train_loss": -9.62472915649414, "global_step": 97262, "epoch": 578} {"train_loss": -9.243388175964355, "global_step": 97263, "epoch": 578} {"train_loss": -9.470315933227539, "global_step": 97264, "epoch": 578} {"train_loss": -9.314363479614258, "global_step": 97265, "epoch": 578} {"train_loss": -9.660537719726562, "global_step": 97266, "epoch": 578} {"train_loss": -9.342342376708984, "global_step": 97267, "epoch": 578} {"train_loss": -9.332601547241211, "global_step": 97268, "epoch": 578} {"train_loss": -9.403146743774414, "global_step": 97269, "epoch": 578} {"train_loss": -9.487970352172852, "global_step": 97270, "epoch": 578} {"train_loss": -9.613547069685799, "global_step": 97271, "epoch": 578, "val_loss": 203434.34375} {"train_loss": -9.390403747558594, "global_step": 97272, "epoch": 579} {"train_loss": -9.539512634277344, "global_step": 97273, "epoch": 579} {"train_loss": -9.525350570678711, "global_step": 97274, "epoch": 579} {"train_loss": -9.61172103881836, "global_step": 97275, "epoch": 579} {"train_loss": -9.640594482421875, "global_step": 97276, "epoch": 579} {"train_loss": -9.786989212036133, "global_step": 97277, "epoch": 579} {"train_loss": -9.404167175292969, "global_step": 97278, "epoch": 579} {"train_loss": -9.608282089233398, "global_step": 97279, "epoch": 579} {"train_loss": -9.720033645629883, "global_step": 97280, "epoch": 579} {"train_loss": -9.551217079162598, "global_step": 97281, "epoch": 579} {"train_loss": -9.683390617370605, "global_step": 97282, "epoch": 579} {"train_loss": -9.624210357666016, "global_step": 97283, "epoch": 579} {"train_loss": -9.813419342041016, "global_step": 97284, "epoch": 579} {"train_loss": -9.794126510620117, "global_step": 97285, "epoch": 579} {"train_loss": -9.667276382446289, "global_step": 97286, "epoch": 579} {"train_loss": -9.586546897888184, "global_step": 97287, "epoch": 579} {"train_loss": -9.871715545654297, "global_step": 97288, "epoch": 579} {"train_loss": -9.736252784729004, "global_step": 97289, "epoch": 579} {"train_loss": -9.6507568359375, "global_step": 97290, "epoch": 579} {"train_loss": -9.815534591674805, "global_step": 97291, "epoch": 579} {"train_loss": -9.561930656433105, "global_step": 97292, "epoch": 579} {"train_loss": -9.575222969055176, "global_step": 97293, "epoch": 579} {"train_loss": -9.470480918884277, "global_step": 97294, "epoch": 579} {"train_loss": -9.629386901855469, "global_step": 97295, "epoch": 579} {"train_loss": -9.71729564666748, "global_step": 97296, "epoch": 579} {"train_loss": -9.700927734375, "global_step": 97297, "epoch": 579} {"train_loss": -9.541519165039062, "global_step": 97298, "epoch": 579} {"train_loss": -9.771943092346191, "global_step": 97299, "epoch": 579} {"train_loss": -9.497568130493164, "global_step": 97300, "epoch": 579} {"train_loss": -9.655224800109863, "global_step": 97301, "epoch": 579} {"train_loss": -9.542640686035156, "global_step": 97302, "epoch": 579} {"train_loss": -9.7425537109375, "global_step": 97303, "epoch": 579} {"train_loss": -9.668620109558105, "global_step": 97304, "epoch": 579} {"train_loss": -9.626184463500977, "global_step": 97305, "epoch": 579} {"train_loss": -9.730203628540039, "global_step": 97306, "epoch": 579} {"train_loss": -9.724639892578125, "global_step": 97307, "epoch": 579} {"train_loss": -9.743890762329102, "global_step": 97308, "epoch": 579} {"train_loss": -9.929546356201172, "global_step": 97309, "epoch": 579} {"train_loss": -9.553455352783203, "global_step": 97310, "epoch": 579} {"train_loss": -9.580791473388672, "global_step": 97311, "epoch": 579} {"train_loss": -9.523199081420898, "global_step": 97312, "epoch": 579} {"train_loss": -9.44777774810791, "global_step": 97313, "epoch": 579} {"train_loss": -9.476799011230469, "global_step": 97314, "epoch": 579} {"train_loss": -9.538263320922852, "global_step": 97315, "epoch": 579} {"train_loss": -9.679590225219727, "global_step": 97316, "epoch": 579} {"train_loss": -9.569802284240723, "global_step": 97317, "epoch": 579} {"train_loss": -9.83991813659668, "global_step": 97318, "epoch": 579} {"train_loss": -9.400129318237305, "global_step": 97319, "epoch": 579} {"train_loss": -9.548928260803223, "global_step": 97320, "epoch": 579} {"train_loss": -9.264425277709961, "global_step": 97321, "epoch": 579} {"train_loss": -9.560928344726562, "global_step": 97322, "epoch": 579} {"train_loss": -9.211315155029297, "global_step": 97323, "epoch": 579} {"train_loss": -9.379096984863281, "global_step": 97324, "epoch": 579} {"train_loss": -8.999698638916016, "global_step": 97325, "epoch": 579} {"train_loss": -9.440422058105469, "global_step": 97326, "epoch": 579} {"train_loss": -9.100675582885742, "global_step": 97327, "epoch": 579} {"train_loss": -9.505615234375, "global_step": 97328, "epoch": 579} {"train_loss": -9.417470932006836, "global_step": 97329, "epoch": 579} {"train_loss": -9.169214248657227, "global_step": 97330, "epoch": 579} {"train_loss": -9.682286262512207, "global_step": 97331, "epoch": 579} {"train_loss": -9.455321311950684, "global_step": 97332, "epoch": 579} {"train_loss": -9.387012481689453, "global_step": 97333, "epoch": 579} {"train_loss": -9.547473907470703, "global_step": 97334, "epoch": 579} {"train_loss": -9.614883422851562, "global_step": 97335, "epoch": 579} {"train_loss": -9.563003540039062, "global_step": 97336, "epoch": 579} {"train_loss": -9.743620872497559, "global_step": 97337, "epoch": 579} {"train_loss": -9.696454048156738, "global_step": 97338, "epoch": 579} {"train_loss": -9.74972152709961, "global_step": 97339, "epoch": 579} {"train_loss": -9.746112823486328, "global_step": 97340, "epoch": 579} {"train_loss": -9.226789474487305, "global_step": 97341, "epoch": 579} {"train_loss": -9.60938549041748, "global_step": 97342, "epoch": 579} {"train_loss": -9.547069549560547, "global_step": 97343, "epoch": 579} {"train_loss": -9.726611137390137, "global_step": 97344, "epoch": 579} {"train_loss": -9.905068397521973, "global_step": 97345, "epoch": 579} {"train_loss": -9.819765090942383, "global_step": 97346, "epoch": 579} {"train_loss": -9.7640380859375, "global_step": 97347, "epoch": 579} {"train_loss": -9.584813117980957, "global_step": 97348, "epoch": 579} {"train_loss": -9.736677169799805, "global_step": 97349, "epoch": 579} {"train_loss": -9.77049732208252, "global_step": 97350, "epoch": 579} {"train_loss": -9.749765396118164, "global_step": 97351, "epoch": 579} {"train_loss": -9.572208404541016, "global_step": 97352, "epoch": 579} {"train_loss": -9.69863224029541, "global_step": 97353, "epoch": 579} {"train_loss": -9.61935043334961, "global_step": 97354, "epoch": 579} {"train_loss": -9.668630599975586, "global_step": 97355, "epoch": 579} {"train_loss": -9.797430038452148, "global_step": 97356, "epoch": 579} {"train_loss": -9.680096626281738, "global_step": 97357, "epoch": 579} {"train_loss": -9.8958101272583, "global_step": 97358, "epoch": 579} {"train_loss": -9.862698554992676, "global_step": 97359, "epoch": 579} {"train_loss": -9.750886917114258, "global_step": 97360, "epoch": 579} {"train_loss": -9.893251419067383, "global_step": 97361, "epoch": 579} {"train_loss": -9.499479293823242, "global_step": 97362, "epoch": 579} {"train_loss": -9.541074752807617, "global_step": 97363, "epoch": 579} {"train_loss": -9.944704055786133, "global_step": 97364, "epoch": 579} {"train_loss": -9.747655868530273, "global_step": 97365, "epoch": 579} {"train_loss": -9.90555191040039, "global_step": 97366, "epoch": 579} {"train_loss": -9.678171157836914, "global_step": 97367, "epoch": 579} {"train_loss": -9.792409896850586, "global_step": 97368, "epoch": 579} {"train_loss": -9.695514678955078, "global_step": 97369, "epoch": 579} {"train_loss": -9.657732963562012, "global_step": 97370, "epoch": 579} {"train_loss": -9.748394966125488, "global_step": 97371, "epoch": 579} {"train_loss": -9.419645309448242, "global_step": 97372, "epoch": 579} {"train_loss": -9.556557655334473, "global_step": 97373, "epoch": 579} {"train_loss": -9.590062141418457, "global_step": 97374, "epoch": 579} {"train_loss": -9.689319610595703, "global_step": 97375, "epoch": 579} {"train_loss": -9.802236557006836, "global_step": 97376, "epoch": 579} {"train_loss": -9.717408180236816, "global_step": 97377, "epoch": 579} {"train_loss": -9.767781257629395, "global_step": 97378, "epoch": 579} {"train_loss": -9.730947494506836, "global_step": 97379, "epoch": 579} {"train_loss": -9.645798683166504, "global_step": 97380, "epoch": 579} {"train_loss": -9.640218734741211, "global_step": 97381, "epoch": 579} {"train_loss": -9.685070037841797, "global_step": 97382, "epoch": 579} {"train_loss": -9.663022994995117, "global_step": 97383, "epoch": 579} {"train_loss": -9.781107902526855, "global_step": 97384, "epoch": 579} {"train_loss": -9.647974967956543, "global_step": 97385, "epoch": 579} {"train_loss": -9.696371078491211, "global_step": 97386, "epoch": 579} {"train_loss": -9.646053314208984, "global_step": 97387, "epoch": 579} {"train_loss": -9.746118545532227, "global_step": 97388, "epoch": 579} {"train_loss": -9.715726852416992, "global_step": 97389, "epoch": 579} {"train_loss": -9.41762924194336, "global_step": 97390, "epoch": 579} {"train_loss": -9.39593505859375, "global_step": 97391, "epoch": 579} {"train_loss": -9.799446105957031, "global_step": 97392, "epoch": 579} {"train_loss": -9.647834777832031, "global_step": 97393, "epoch": 579} {"train_loss": -9.17393684387207, "global_step": 97394, "epoch": 579} {"train_loss": -9.660741806030273, "global_step": 97395, "epoch": 579} {"train_loss": -9.603700637817383, "global_step": 97396, "epoch": 579} {"train_loss": -9.267351150512695, "global_step": 97397, "epoch": 579} {"train_loss": -9.358846664428711, "global_step": 97398, "epoch": 579} {"train_loss": -9.288475036621094, "global_step": 97399, "epoch": 579} {"train_loss": -9.342191696166992, "global_step": 97400, "epoch": 579} {"train_loss": -9.092462539672852, "global_step": 97401, "epoch": 579} {"train_loss": -9.405197143554688, "global_step": 97402, "epoch": 579} {"train_loss": -9.41341781616211, "global_step": 97403, "epoch": 579} {"train_loss": -9.273881912231445, "global_step": 97404, "epoch": 579} {"train_loss": -9.34839916229248, "global_step": 97405, "epoch": 579} {"train_loss": -9.539772033691406, "global_step": 97406, "epoch": 579} {"train_loss": -9.34987735748291, "global_step": 97407, "epoch": 579} {"train_loss": -9.5195951461792, "global_step": 97408, "epoch": 579} {"train_loss": -9.49860668182373, "global_step": 97409, "epoch": 579} {"train_loss": -9.582176208496094, "global_step": 97410, "epoch": 579} {"train_loss": -9.277392387390137, "global_step": 97411, "epoch": 579} {"train_loss": -9.32351303100586, "global_step": 97412, "epoch": 579} {"train_loss": -9.50813102722168, "global_step": 97413, "epoch": 579} {"train_loss": -9.486391067504883, "global_step": 97414, "epoch": 579} {"train_loss": -9.509392738342285, "global_step": 97415, "epoch": 579} {"train_loss": -9.53176498413086, "global_step": 97416, "epoch": 579} {"train_loss": -9.586681365966797, "global_step": 97417, "epoch": 579} {"train_loss": -9.574017524719238, "global_step": 97418, "epoch": 579} {"train_loss": -9.793730735778809, "global_step": 97419, "epoch": 579} {"train_loss": -9.606657028198242, "global_step": 97420, "epoch": 579} {"train_loss": -9.87840461730957, "global_step": 97421, "epoch": 579} {"train_loss": -9.657442092895508, "global_step": 97422, "epoch": 579} {"train_loss": -9.60644245147705, "global_step": 97423, "epoch": 579} {"train_loss": -9.683462142944336, "global_step": 97424, "epoch": 579} {"train_loss": -9.40145206451416, "global_step": 97425, "epoch": 579} {"train_loss": -9.524486541748047, "global_step": 97426, "epoch": 579} {"train_loss": -9.309782981872559, "global_step": 97427, "epoch": 579} {"train_loss": -9.449285507202148, "global_step": 97428, "epoch": 579} {"train_loss": -9.481608390808105, "global_step": 97429, "epoch": 579} {"train_loss": -9.543039321899414, "global_step": 97430, "epoch": 579} {"train_loss": -9.759117126464844, "global_step": 97431, "epoch": 579} {"train_loss": -9.391117095947266, "global_step": 97432, "epoch": 579} {"train_loss": -9.839512825012207, "global_step": 97433, "epoch": 579} {"train_loss": -9.778678894042969, "global_step": 97434, "epoch": 579} {"train_loss": -9.75111198425293, "global_step": 97435, "epoch": 579} {"train_loss": -9.419998168945312, "global_step": 97436, "epoch": 579} {"train_loss": -9.713827133178711, "global_step": 97437, "epoch": 579} {"train_loss": -9.711026191711426, "global_step": 97438, "epoch": 579} {"train_loss": -9.595942213421775, "global_step": 97439, "epoch": 579, "val_loss": 204366.015625} {"train_loss": -9.066712379455566, "global_step": 97440, "epoch": 580} {"train_loss": -9.61584758758545, "global_step": 97441, "epoch": 580} {"train_loss": -9.343494415283203, "global_step": 97442, "epoch": 580} {"train_loss": -9.373847961425781, "global_step": 97443, "epoch": 580} {"train_loss": -9.406047821044922, "global_step": 97444, "epoch": 580} {"train_loss": -9.521706581115723, "global_step": 97445, "epoch": 580} {"train_loss": -9.61625862121582, "global_step": 97446, "epoch": 580} {"train_loss": -9.958566665649414, "global_step": 97447, "epoch": 580} {"train_loss": -9.310822486877441, "global_step": 97448, "epoch": 580} {"train_loss": -9.382353782653809, "global_step": 97449, "epoch": 580} {"train_loss": -8.992456436157227, "global_step": 97450, "epoch": 580} {"train_loss": -9.291095733642578, "global_step": 97451, "epoch": 580} {"train_loss": -8.384495735168457, "global_step": 97452, "epoch": 580} {"train_loss": -9.438135147094727, "global_step": 97453, "epoch": 580} {"train_loss": -9.099710464477539, "global_step": 97454, "epoch": 580} {"train_loss": -8.948617935180664, "global_step": 97455, "epoch": 580} {"train_loss": -8.889228820800781, "global_step": 97456, "epoch": 580} {"train_loss": -8.981462478637695, "global_step": 97457, "epoch": 580} {"train_loss": -9.165380477905273, "global_step": 97458, "epoch": 580} {"train_loss": -9.171863555908203, "global_step": 97459, "epoch": 580} {"train_loss": -9.348095893859863, "global_step": 97460, "epoch": 580} {"train_loss": -9.007722854614258, "global_step": 97461, "epoch": 580} {"train_loss": -9.03972053527832, "global_step": 97462, "epoch": 580} {"train_loss": -8.839609146118164, "global_step": 97463, "epoch": 580} {"train_loss": -9.414772033691406, "global_step": 97464, "epoch": 580} {"train_loss": -8.864818572998047, "global_step": 97465, "epoch": 580} {"train_loss": -9.37698745727539, "global_step": 97466, "epoch": 580} {"train_loss": -9.084096908569336, "global_step": 97467, "epoch": 580} {"train_loss": -9.287750244140625, "global_step": 97468, "epoch": 580} {"train_loss": -9.095001220703125, "global_step": 97469, "epoch": 580} {"train_loss": -9.34981918334961, "global_step": 97470, "epoch": 580} {"train_loss": -9.1917724609375, "global_step": 97471, "epoch": 580} {"train_loss": -9.271753311157227, "global_step": 97472, "epoch": 580} {"train_loss": -9.2975435256958, "global_step": 97473, "epoch": 580} {"train_loss": -9.390447616577148, "global_step": 97474, "epoch": 580} {"train_loss": -9.203869819641113, "global_step": 97475, "epoch": 580} {"train_loss": -8.927543640136719, "global_step": 97476, "epoch": 580} {"train_loss": -9.356941223144531, "global_step": 97477, "epoch": 580} {"train_loss": -9.419843673706055, "global_step": 97478, "epoch": 580} {"train_loss": -9.479494094848633, "global_step": 97479, "epoch": 580} {"train_loss": -9.393223762512207, "global_step": 97480, "epoch": 580} {"train_loss": -9.571651458740234, "global_step": 97481, "epoch": 580} {"train_loss": -9.642786026000977, "global_step": 97482, "epoch": 580} {"train_loss": -9.447738647460938, "global_step": 97483, "epoch": 580} {"train_loss": -9.735296249389648, "global_step": 97484, "epoch": 580} {"train_loss": -9.57376480102539, "global_step": 97485, "epoch": 580} {"train_loss": -9.576053619384766, "global_step": 97486, "epoch": 580} {"train_loss": -9.65592098236084, "global_step": 97487, "epoch": 580} {"train_loss": -9.75291633605957, "global_step": 97488, "epoch": 580} {"train_loss": -9.667661666870117, "global_step": 97489, "epoch": 580} {"train_loss": -9.806161880493164, "global_step": 97490, "epoch": 580} {"train_loss": -9.638015747070312, "global_step": 97491, "epoch": 580} {"train_loss": -9.847064018249512, "global_step": 97492, "epoch": 580} {"train_loss": -9.674606323242188, "global_step": 97493, "epoch": 580} {"train_loss": -9.776395797729492, "global_step": 97494, "epoch": 580} {"train_loss": -9.972244262695312, "global_step": 97495, "epoch": 580} {"train_loss": -9.72081184387207, "global_step": 97496, "epoch": 580} {"train_loss": -9.814748764038086, "global_step": 97497, "epoch": 580} {"train_loss": -9.477079391479492, "global_step": 97498, "epoch": 580} {"train_loss": -9.496466636657715, "global_step": 97499, "epoch": 580} {"train_loss": -9.53957462310791, "global_step": 97500, "epoch": 580} {"train_loss": -9.672443389892578, "global_step": 97501, "epoch": 580} {"train_loss": -9.682923316955566, "global_step": 97502, "epoch": 580} {"train_loss": -9.518170356750488, "global_step": 97503, "epoch": 580} {"train_loss": -9.69931697845459, "global_step": 97504, "epoch": 580} {"train_loss": -9.258271217346191, "global_step": 97505, "epoch": 580} {"train_loss": -9.732645988464355, "global_step": 97506, "epoch": 580} {"train_loss": -9.458215713500977, "global_step": 97507, "epoch": 580} {"train_loss": -9.76363754272461, "global_step": 97508, "epoch": 580} {"train_loss": -9.557596206665039, "global_step": 97509, "epoch": 580} {"train_loss": -9.694009780883789, "global_step": 97510, "epoch": 580} {"train_loss": -9.784534454345703, "global_step": 97511, "epoch": 580} {"train_loss": -9.437328338623047, "global_step": 97512, "epoch": 580} {"train_loss": -9.62498950958252, "global_step": 97513, "epoch": 580} {"train_loss": -9.664709091186523, "global_step": 97514, "epoch": 580} {"train_loss": -9.594422340393066, "global_step": 97515, "epoch": 580} {"train_loss": -9.683610916137695, "global_step": 97516, "epoch": 580} {"train_loss": -9.613290786743164, "global_step": 97517, "epoch": 580} {"train_loss": -9.855936050415039, "global_step": 97518, "epoch": 580} {"train_loss": -9.789692878723145, "global_step": 97519, "epoch": 580} {"train_loss": -9.551825523376465, "global_step": 97520, "epoch": 580} {"train_loss": -9.55822467803955, "global_step": 97521, "epoch": 580} {"train_loss": -9.48790168762207, "global_step": 97522, "epoch": 580} {"train_loss": -9.799325942993164, "global_step": 97523, "epoch": 580} {"train_loss": -9.617725372314453, "global_step": 97524, "epoch": 580} {"train_loss": -9.545458793640137, "global_step": 97525, "epoch": 580} {"train_loss": -9.716540336608887, "global_step": 97526, "epoch": 580} {"train_loss": -9.694149017333984, "global_step": 97527, "epoch": 580} {"train_loss": -9.487258911132812, "global_step": 97528, "epoch": 580} {"train_loss": -9.707500457763672, "global_step": 97529, "epoch": 580} {"train_loss": -9.34477710723877, "global_step": 97530, "epoch": 580} {"train_loss": -9.78311538696289, "global_step": 97531, "epoch": 580} {"train_loss": -9.60521125793457, "global_step": 97532, "epoch": 580} {"train_loss": -9.315258026123047, "global_step": 97533, "epoch": 580} {"train_loss": -9.32110595703125, "global_step": 97534, "epoch": 580} {"train_loss": -9.830423355102539, "global_step": 97535, "epoch": 580} {"train_loss": -9.603179931640625, "global_step": 97536, "epoch": 580} {"train_loss": -9.757668495178223, "global_step": 97537, "epoch": 580} {"train_loss": -9.613308906555176, "global_step": 97538, "epoch": 580} {"train_loss": -9.39545726776123, "global_step": 97539, "epoch": 580} {"train_loss": -9.477365493774414, "global_step": 97540, "epoch": 580} {"train_loss": -9.316442489624023, "global_step": 97541, "epoch": 580} {"train_loss": -9.428771018981934, "global_step": 97542, "epoch": 580} {"train_loss": -9.502307891845703, "global_step": 97543, "epoch": 580} {"train_loss": -9.42357063293457, "global_step": 97544, "epoch": 580} {"train_loss": -9.496365547180176, "global_step": 97545, "epoch": 580} {"train_loss": -9.269298553466797, "global_step": 97546, "epoch": 580} {"train_loss": -9.717060089111328, "global_step": 97547, "epoch": 580} {"train_loss": -9.596145629882812, "global_step": 97548, "epoch": 580} {"train_loss": -9.594898223876953, "global_step": 97549, "epoch": 580} {"train_loss": -9.642473220825195, "global_step": 97550, "epoch": 580} {"train_loss": -9.464038848876953, "global_step": 97551, "epoch": 580} {"train_loss": -9.333779335021973, "global_step": 97552, "epoch": 580} {"train_loss": -9.774860382080078, "global_step": 97553, "epoch": 580} {"train_loss": -9.655604362487793, "global_step": 97554, "epoch": 580} {"train_loss": -9.926137924194336, "global_step": 97555, "epoch": 580} {"train_loss": -9.607882499694824, "global_step": 97556, "epoch": 580} {"train_loss": -9.688467025756836, "global_step": 97557, "epoch": 580} {"train_loss": -9.755441665649414, "global_step": 97558, "epoch": 580} {"train_loss": -9.762435913085938, "global_step": 97559, "epoch": 580} {"train_loss": -9.721551895141602, "global_step": 97560, "epoch": 580} {"train_loss": -9.881865501403809, "global_step": 97561, "epoch": 580} {"train_loss": -9.663511276245117, "global_step": 97562, "epoch": 580} {"train_loss": -9.701215744018555, "global_step": 97563, "epoch": 580} {"train_loss": -9.635007858276367, "global_step": 97564, "epoch": 580} {"train_loss": -9.585176467895508, "global_step": 97565, "epoch": 580} {"train_loss": -9.87017822265625, "global_step": 97566, "epoch": 580} {"train_loss": -9.445035934448242, "global_step": 97567, "epoch": 580} {"train_loss": -9.664495468139648, "global_step": 97568, "epoch": 580} {"train_loss": -9.55270767211914, "global_step": 97569, "epoch": 580} {"train_loss": -9.396658897399902, "global_step": 97570, "epoch": 580} {"train_loss": -9.361858367919922, "global_step": 97571, "epoch": 580} {"train_loss": -9.887316703796387, "global_step": 97572, "epoch": 580} {"train_loss": -9.583700180053711, "global_step": 97573, "epoch": 580} {"train_loss": -9.55850601196289, "global_step": 97574, "epoch": 580} {"train_loss": -9.274045944213867, "global_step": 97575, "epoch": 580} {"train_loss": -9.637548446655273, "global_step": 97576, "epoch": 580} {"train_loss": -9.852937698364258, "global_step": 97577, "epoch": 580} {"train_loss": -9.639541625976562, "global_step": 97578, "epoch": 580} {"train_loss": -9.62800407409668, "global_step": 97579, "epoch": 580} {"train_loss": -9.684833526611328, "global_step": 97580, "epoch": 580} {"train_loss": -9.208196640014648, "global_step": 97581, "epoch": 580} {"train_loss": -9.545056343078613, "global_step": 97582, "epoch": 580} {"train_loss": -9.47778034210205, "global_step": 97583, "epoch": 580} {"train_loss": -9.355119705200195, "global_step": 97584, "epoch": 580} {"train_loss": -9.146086692810059, "global_step": 97585, "epoch": 580} {"train_loss": -9.676445960998535, "global_step": 97586, "epoch": 580} {"train_loss": -9.283331871032715, "global_step": 97587, "epoch": 580} {"train_loss": -9.340363502502441, "global_step": 97588, "epoch": 580} {"train_loss": -9.448020935058594, "global_step": 97589, "epoch": 580} {"train_loss": -9.238359451293945, "global_step": 97590, "epoch": 580} {"train_loss": -9.266181945800781, "global_step": 97591, "epoch": 580} {"train_loss": -9.346824645996094, "global_step": 97592, "epoch": 580} {"train_loss": -9.616839408874512, "global_step": 97593, "epoch": 580} {"train_loss": -9.04046630859375, "global_step": 97594, "epoch": 580} {"train_loss": -9.720937728881836, "global_step": 97595, "epoch": 580} {"train_loss": -9.363525390625, "global_step": 97596, "epoch": 580} {"train_loss": -9.522523880004883, "global_step": 97597, "epoch": 580} {"train_loss": -9.490094184875488, "global_step": 97598, "epoch": 580} {"train_loss": -9.262260437011719, "global_step": 97599, "epoch": 580} {"train_loss": -9.416720390319824, "global_step": 97600, "epoch": 580} {"train_loss": -9.464517593383789, "global_step": 97601, "epoch": 580} {"train_loss": -9.118047714233398, "global_step": 97602, "epoch": 580} {"train_loss": -9.000679969787598, "global_step": 97603, "epoch": 580} {"train_loss": -9.633668899536133, "global_step": 97604, "epoch": 580} {"train_loss": -9.062156677246094, "global_step": 97605, "epoch": 580} {"train_loss": -9.811963081359863, "global_step": 97606, "epoch": 580} {"train_loss": -9.484258651733398, "global_step": 97607, "epoch": 580, "val_loss": 203821.140625, "train_action_mse_error": 6.82203483581543} {"train_loss": -9.614733695983887, "global_step": 97608, "epoch": 581} {"train_loss": -9.337658882141113, "global_step": 97609, "epoch": 581} {"train_loss": -9.125537872314453, "global_step": 97610, "epoch": 581} {"train_loss": -9.405757904052734, "global_step": 97611, "epoch": 581} {"train_loss": -9.484359741210938, "global_step": 97612, "epoch": 581} {"train_loss": -9.553292274475098, "global_step": 97613, "epoch": 581} {"train_loss": -9.223207473754883, "global_step": 97614, "epoch": 581} {"train_loss": -9.535146713256836, "global_step": 97615, "epoch": 581} {"train_loss": -9.439291000366211, "global_step": 97616, "epoch": 581} {"train_loss": -9.6935453414917, "global_step": 97617, "epoch": 581} {"train_loss": -9.511137008666992, "global_step": 97618, "epoch": 581} {"train_loss": -9.91868782043457, "global_step": 97619, "epoch": 581} {"train_loss": -9.593280792236328, "global_step": 97620, "epoch": 581} {"train_loss": -9.535858154296875, "global_step": 97621, "epoch": 581} {"train_loss": -9.670071601867676, "global_step": 97622, "epoch": 581} {"train_loss": -9.630064010620117, "global_step": 97623, "epoch": 581} {"train_loss": -9.557548522949219, "global_step": 97624, "epoch": 581} {"train_loss": -9.671684265136719, "global_step": 97625, "epoch": 581} {"train_loss": -9.772921562194824, "global_step": 97626, "epoch": 581} {"train_loss": -9.791399002075195, "global_step": 97627, "epoch": 581} {"train_loss": -9.78422737121582, "global_step": 97628, "epoch": 581} {"train_loss": -9.821907997131348, "global_step": 97629, "epoch": 581} {"train_loss": -9.81837272644043, "global_step": 97630, "epoch": 581} {"train_loss": -9.853203773498535, "global_step": 97631, "epoch": 581} {"train_loss": -9.743936538696289, "global_step": 97632, "epoch": 581} {"train_loss": -9.917871475219727, "global_step": 97633, "epoch": 581} {"train_loss": -9.992497444152832, "global_step": 97634, "epoch": 581} {"train_loss": -9.721816062927246, "global_step": 97635, "epoch": 581} {"train_loss": -9.809606552124023, "global_step": 97636, "epoch": 581} {"train_loss": -10.001382827758789, "global_step": 97637, "epoch": 581} {"train_loss": -9.757820129394531, "global_step": 97638, "epoch": 581} {"train_loss": -9.937153816223145, "global_step": 97639, "epoch": 581} {"train_loss": -9.643421173095703, "global_step": 97640, "epoch": 581} {"train_loss": -9.740901947021484, "global_step": 97641, "epoch": 581} {"train_loss": -9.955578804016113, "global_step": 97642, "epoch": 581} {"train_loss": -9.708236694335938, "global_step": 97643, "epoch": 581} {"train_loss": -9.750787734985352, "global_step": 97644, "epoch": 581} {"train_loss": -9.676285743713379, "global_step": 97645, "epoch": 581} {"train_loss": -9.69391918182373, "global_step": 97646, "epoch": 581} {"train_loss": -10.009956359863281, "global_step": 97647, "epoch": 581} {"train_loss": -9.579818725585938, "global_step": 97648, "epoch": 581} {"train_loss": -9.632955551147461, "global_step": 97649, "epoch": 581} {"train_loss": -9.793437957763672, "global_step": 97650, "epoch": 581} {"train_loss": -9.356985092163086, "global_step": 97651, "epoch": 581} {"train_loss": -9.652528762817383, "global_step": 97652, "epoch": 581} {"train_loss": -10.049717903137207, "global_step": 97653, "epoch": 581} {"train_loss": -10.073989868164062, "global_step": 97654, "epoch": 581} {"train_loss": -9.513771057128906, "global_step": 97655, "epoch": 581} {"train_loss": -9.388460159301758, "global_step": 97656, "epoch": 581} {"train_loss": -9.714417457580566, "global_step": 97657, "epoch": 581} {"train_loss": -9.655179977416992, "global_step": 97658, "epoch": 581} {"train_loss": -9.83642292022705, "global_step": 97659, "epoch": 581} {"train_loss": -9.820929527282715, "global_step": 97660, "epoch": 581} {"train_loss": -9.887474060058594, "global_step": 97661, "epoch": 581} {"train_loss": -9.472625732421875, "global_step": 97662, "epoch": 581} {"train_loss": -9.606728553771973, "global_step": 97663, "epoch": 581} {"train_loss": -9.451103210449219, "global_step": 97664, "epoch": 581} {"train_loss": -9.499011039733887, "global_step": 97665, "epoch": 581} {"train_loss": -9.340425491333008, "global_step": 97666, "epoch": 581} {"train_loss": -9.593633651733398, "global_step": 97667, "epoch": 581} {"train_loss": -9.502495765686035, "global_step": 97668, "epoch": 581} {"train_loss": -9.690362930297852, "global_step": 97669, "epoch": 581} {"train_loss": -9.631265640258789, "global_step": 97670, "epoch": 581} {"train_loss": -9.428709030151367, "global_step": 97671, "epoch": 581} {"train_loss": -9.545766830444336, "global_step": 97672, "epoch": 581} {"train_loss": -9.07052230834961, "global_step": 97673, "epoch": 581} {"train_loss": -9.51054573059082, "global_step": 97674, "epoch": 581} {"train_loss": -9.407425880432129, "global_step": 97675, "epoch": 581} {"train_loss": -9.704999923706055, "global_step": 97676, "epoch": 581} {"train_loss": -9.645748138427734, "global_step": 97677, "epoch": 581} {"train_loss": -9.695791244506836, "global_step": 97678, "epoch": 581} {"train_loss": -9.393096923828125, "global_step": 97679, "epoch": 581} {"train_loss": -9.641342163085938, "global_step": 97680, "epoch": 581} {"train_loss": -9.605578422546387, "global_step": 97681, "epoch": 581} {"train_loss": -9.743669509887695, "global_step": 97682, "epoch": 581} {"train_loss": -9.702047348022461, "global_step": 97683, "epoch": 581} {"train_loss": -9.553848266601562, "global_step": 97684, "epoch": 581} {"train_loss": -9.384986877441406, "global_step": 97685, "epoch": 581} {"train_loss": -9.729508399963379, "global_step": 97686, "epoch": 581} {"train_loss": -9.712380409240723, "global_step": 97687, "epoch": 581} {"train_loss": -9.571718215942383, "global_step": 97688, "epoch": 581} {"train_loss": -9.639825820922852, "global_step": 97689, "epoch": 581} {"train_loss": -9.83297348022461, "global_step": 97690, "epoch": 581} {"train_loss": -9.731172561645508, "global_step": 97691, "epoch": 581} {"train_loss": -9.491762161254883, "global_step": 97692, "epoch": 581} {"train_loss": -9.791471481323242, "global_step": 97693, "epoch": 581} {"train_loss": -9.908945083618164, "global_step": 97694, "epoch": 581} {"train_loss": -9.585332870483398, "global_step": 97695, "epoch": 581} {"train_loss": -9.768357276916504, "global_step": 97696, "epoch": 581} {"train_loss": -9.88884162902832, "global_step": 97697, "epoch": 581} {"train_loss": -9.557210922241211, "global_step": 97698, "epoch": 581} {"train_loss": -9.89006233215332, "global_step": 97699, "epoch": 581} {"train_loss": -9.663583755493164, "global_step": 97700, "epoch": 581} {"train_loss": -9.73093032836914, "global_step": 97701, "epoch": 581} {"train_loss": -9.845998764038086, "global_step": 97702, "epoch": 581} {"train_loss": -9.601893424987793, "global_step": 97703, "epoch": 581} {"train_loss": -9.624812126159668, "global_step": 97704, "epoch": 581} {"train_loss": -9.277616500854492, "global_step": 97705, "epoch": 581} {"train_loss": -9.648843765258789, "global_step": 97706, "epoch": 581} {"train_loss": -9.760242462158203, "global_step": 97707, "epoch": 581} {"train_loss": -9.874214172363281, "global_step": 97708, "epoch": 581} {"train_loss": -9.831581115722656, "global_step": 97709, "epoch": 581} {"train_loss": -9.926566123962402, "global_step": 97710, "epoch": 581} {"train_loss": -9.847679138183594, "global_step": 97711, "epoch": 581} {"train_loss": -9.690400123596191, "global_step": 97712, "epoch": 581} {"train_loss": -9.739740371704102, "global_step": 97713, "epoch": 581} {"train_loss": -9.978740692138672, "global_step": 97714, "epoch": 581} {"train_loss": -9.343517303466797, "global_step": 97715, "epoch": 581} {"train_loss": -9.739324569702148, "global_step": 97716, "epoch": 581} {"train_loss": -9.7467622756958, "global_step": 97717, "epoch": 581} {"train_loss": -9.6695556640625, "global_step": 97718, "epoch": 581} {"train_loss": -9.663338661193848, "global_step": 97719, "epoch": 581} {"train_loss": -9.780029296875, "global_step": 97720, "epoch": 581} {"train_loss": -9.821365356445312, "global_step": 97721, "epoch": 581} {"train_loss": -9.949213027954102, "global_step": 97722, "epoch": 581} {"train_loss": -9.774978637695312, "global_step": 97723, "epoch": 581} {"train_loss": -9.585423469543457, "global_step": 97724, "epoch": 581} {"train_loss": -9.804267883300781, "global_step": 97725, "epoch": 581} {"train_loss": -9.645137786865234, "global_step": 97726, "epoch": 581} {"train_loss": -9.677653312683105, "global_step": 97727, "epoch": 581} {"train_loss": -9.834640502929688, "global_step": 97728, "epoch": 581} {"train_loss": -9.834676742553711, "global_step": 97729, "epoch": 581} {"train_loss": -9.940442085266113, "global_step": 97730, "epoch": 581} {"train_loss": -9.98568344116211, "global_step": 97731, "epoch": 581} {"train_loss": -9.794655799865723, "global_step": 97732, "epoch": 581} {"train_loss": -9.61839771270752, "global_step": 97733, "epoch": 581} {"train_loss": -9.740362167358398, "global_step": 97734, "epoch": 581} {"train_loss": -9.54607105255127, "global_step": 97735, "epoch": 581} {"train_loss": -9.635232925415039, "global_step": 97736, "epoch": 581} {"train_loss": -9.656148910522461, "global_step": 97737, "epoch": 581} {"train_loss": -9.367152214050293, "global_step": 97738, "epoch": 581} {"train_loss": -9.791446685791016, "global_step": 97739, "epoch": 581} {"train_loss": -8.906434059143066, "global_step": 97740, "epoch": 581} {"train_loss": -9.453790664672852, "global_step": 97741, "epoch": 581} {"train_loss": -9.187591552734375, "global_step": 97742, "epoch": 581} {"train_loss": -9.514810562133789, "global_step": 97743, "epoch": 581} {"train_loss": -9.61851692199707, "global_step": 97744, "epoch": 581} {"train_loss": -9.395211219787598, "global_step": 97745, "epoch": 581} {"train_loss": -9.348881721496582, "global_step": 97746, "epoch": 581} {"train_loss": -9.312403678894043, "global_step": 97747, "epoch": 581} {"train_loss": -9.548179626464844, "global_step": 97748, "epoch": 581} {"train_loss": -9.351353645324707, "global_step": 97749, "epoch": 581} {"train_loss": -9.486845016479492, "global_step": 97750, "epoch": 581} {"train_loss": -9.300867080688477, "global_step": 97751, "epoch": 581} {"train_loss": -9.153889656066895, "global_step": 97752, "epoch": 581} {"train_loss": -9.47195053100586, "global_step": 97753, "epoch": 581} {"train_loss": -9.629742622375488, "global_step": 97754, "epoch": 581} {"train_loss": -9.216952323913574, "global_step": 97755, "epoch": 581} {"train_loss": -9.557283401489258, "global_step": 97756, "epoch": 581} {"train_loss": -9.482156753540039, "global_step": 97757, "epoch": 581} {"train_loss": -9.4592866897583, "global_step": 97758, "epoch": 581} {"train_loss": -9.42061996459961, "global_step": 97759, "epoch": 581} {"train_loss": -9.743144989013672, "global_step": 97760, "epoch": 581} {"train_loss": -9.814408302307129, "global_step": 97761, "epoch": 581} {"train_loss": -9.720970153808594, "global_step": 97762, "epoch": 581} {"train_loss": -9.811052322387695, "global_step": 97763, "epoch": 581} {"train_loss": -9.871014595031738, "global_step": 97764, "epoch": 581} {"train_loss": -9.691540718078613, "global_step": 97765, "epoch": 581} {"train_loss": -9.834855079650879, "global_step": 97766, "epoch": 581} {"train_loss": -9.655206680297852, "global_step": 97767, "epoch": 581} {"train_loss": -9.642251968383789, "global_step": 97768, "epoch": 581} {"train_loss": -9.698148727416992, "global_step": 97769, "epoch": 581} {"train_loss": -9.873178482055664, "global_step": 97770, "epoch": 581} {"train_loss": -9.565961837768555, "global_step": 97771, "epoch": 581} {"train_loss": -9.761271476745605, "global_step": 97772, "epoch": 581} {"train_loss": -9.89981746673584, "global_step": 97773, "epoch": 581} {"train_loss": -9.720643997192383, "global_step": 97774, "epoch": 581} {"train_loss": -9.648781424476987, "global_step": 97775, "epoch": 581, "val_loss": 205416.6875} {"train_loss": -9.385954856872559, "global_step": 97776, "epoch": 582} {"train_loss": -9.62798023223877, "global_step": 97777, "epoch": 582} {"train_loss": -9.650863647460938, "global_step": 97778, "epoch": 582} {"train_loss": -9.427674293518066, "global_step": 97779, "epoch": 582} {"train_loss": -9.604812622070312, "global_step": 97780, "epoch": 582} {"train_loss": -9.706819534301758, "global_step": 97781, "epoch": 582} {"train_loss": -9.589509963989258, "global_step": 97782, "epoch": 582} {"train_loss": -9.573421478271484, "global_step": 97783, "epoch": 582} {"train_loss": -9.815641403198242, "global_step": 97784, "epoch": 582} {"train_loss": -9.89309024810791, "global_step": 97785, "epoch": 582} {"train_loss": -9.413732528686523, "global_step": 97786, "epoch": 582} {"train_loss": -9.375628471374512, "global_step": 97787, "epoch": 582} {"train_loss": -9.297359466552734, "global_step": 97788, "epoch": 582} {"train_loss": -9.141671180725098, "global_step": 97789, "epoch": 582} {"train_loss": -9.389608383178711, "global_step": 97790, "epoch": 582} {"train_loss": -9.40377426147461, "global_step": 97791, "epoch": 582} {"train_loss": -9.318520545959473, "global_step": 97792, "epoch": 582} {"train_loss": -9.287665367126465, "global_step": 97793, "epoch": 582} {"train_loss": -9.501471519470215, "global_step": 97794, "epoch": 582} {"train_loss": -9.530166625976562, "global_step": 97795, "epoch": 582} {"train_loss": -9.403096199035645, "global_step": 97796, "epoch": 582} {"train_loss": -9.31912899017334, "global_step": 97797, "epoch": 582} {"train_loss": -9.399145126342773, "global_step": 97798, "epoch": 582} {"train_loss": -9.364175796508789, "global_step": 97799, "epoch": 582} {"train_loss": -9.370019912719727, "global_step": 97800, "epoch": 582} {"train_loss": -9.259597778320312, "global_step": 97801, "epoch": 582} {"train_loss": -9.597358703613281, "global_step": 97802, "epoch": 582} {"train_loss": -9.262065887451172, "global_step": 97803, "epoch": 582} {"train_loss": -9.278517723083496, "global_step": 97804, "epoch": 582} {"train_loss": -9.635797500610352, "global_step": 97805, "epoch": 582} {"train_loss": -9.339537620544434, "global_step": 97806, "epoch": 582} {"train_loss": -9.58046817779541, "global_step": 97807, "epoch": 582} {"train_loss": -9.696189880371094, "global_step": 97808, "epoch": 582} {"train_loss": -9.417597770690918, "global_step": 97809, "epoch": 582} {"train_loss": -9.494837760925293, "global_step": 97810, "epoch": 582} {"train_loss": -9.45741081237793, "global_step": 97811, "epoch": 582} {"train_loss": -9.611089706420898, "global_step": 97812, "epoch": 582} {"train_loss": -9.665695190429688, "global_step": 97813, "epoch": 582} {"train_loss": -9.535184860229492, "global_step": 97814, "epoch": 582} {"train_loss": -9.1290864944458, "global_step": 97815, "epoch": 582} {"train_loss": -9.758455276489258, "global_step": 97816, "epoch": 582} {"train_loss": -9.743000030517578, "global_step": 97817, "epoch": 582} {"train_loss": -9.650527954101562, "global_step": 97818, "epoch": 582} {"train_loss": -9.955633163452148, "global_step": 97819, "epoch": 582} {"train_loss": -9.433429718017578, "global_step": 97820, "epoch": 582} {"train_loss": -9.69035530090332, "global_step": 97821, "epoch": 582} {"train_loss": -9.723275184631348, "global_step": 97822, "epoch": 582} {"train_loss": -9.660369873046875, "global_step": 97823, "epoch": 582} {"train_loss": -9.694499969482422, "global_step": 97824, "epoch": 582} {"train_loss": -9.806856155395508, "global_step": 97825, "epoch": 582} {"train_loss": -9.703241348266602, "global_step": 97826, "epoch": 582} {"train_loss": -9.808915138244629, "global_step": 97827, "epoch": 582} {"train_loss": -9.703605651855469, "global_step": 97828, "epoch": 582} {"train_loss": -9.623539924621582, "global_step": 97829, "epoch": 582} {"train_loss": -9.91239070892334, "global_step": 97830, "epoch": 582} {"train_loss": -9.643301010131836, "global_step": 97831, "epoch": 582} {"train_loss": -9.787422180175781, "global_step": 97832, "epoch": 582} {"train_loss": -9.865020751953125, "global_step": 97833, "epoch": 582} {"train_loss": -10.009014129638672, "global_step": 97834, "epoch": 582} {"train_loss": -9.732139587402344, "global_step": 97835, "epoch": 582} {"train_loss": -9.724791526794434, "global_step": 97836, "epoch": 582} {"train_loss": -9.75522232055664, "global_step": 97837, "epoch": 582} {"train_loss": -9.99946403503418, "global_step": 97838, "epoch": 582} {"train_loss": -9.834051132202148, "global_step": 97839, "epoch": 582} {"train_loss": -9.61003303527832, "global_step": 97840, "epoch": 582} {"train_loss": -9.435285568237305, "global_step": 97841, "epoch": 582} {"train_loss": -9.831815719604492, "global_step": 97842, "epoch": 582} {"train_loss": -9.619596481323242, "global_step": 97843, "epoch": 582} {"train_loss": -9.8151216506958, "global_step": 97844, "epoch": 582} {"train_loss": -9.642158508300781, "global_step": 97845, "epoch": 582} {"train_loss": -9.68718433380127, "global_step": 97846, "epoch": 582} {"train_loss": -9.747694969177246, "global_step": 97847, "epoch": 582} {"train_loss": -9.749260902404785, "global_step": 97848, "epoch": 582} {"train_loss": -9.934057235717773, "global_step": 97849, "epoch": 582} {"train_loss": -9.70553970336914, "global_step": 97850, "epoch": 582} {"train_loss": -9.812026977539062, "global_step": 97851, "epoch": 582} {"train_loss": -9.64241886138916, "global_step": 97852, "epoch": 582} {"train_loss": -9.486859321594238, "global_step": 97853, "epoch": 582} {"train_loss": -9.794946670532227, "global_step": 97854, "epoch": 582} {"train_loss": -9.711711883544922, "global_step": 97855, "epoch": 582} {"train_loss": -9.436903953552246, "global_step": 97856, "epoch": 582} {"train_loss": -9.803366661071777, "global_step": 97857, "epoch": 582} {"train_loss": -9.50567626953125, "global_step": 97858, "epoch": 582} {"train_loss": -9.269094467163086, "global_step": 97859, "epoch": 582} {"train_loss": -9.236211776733398, "global_step": 97860, "epoch": 582} {"train_loss": -8.526309967041016, "global_step": 97861, "epoch": 582} {"train_loss": -9.531661987304688, "global_step": 97862, "epoch": 582} {"train_loss": -9.240180015563965, "global_step": 97863, "epoch": 582} {"train_loss": -9.445276260375977, "global_step": 97864, "epoch": 582} {"train_loss": -9.358710289001465, "global_step": 97865, "epoch": 582} {"train_loss": -9.551435470581055, "global_step": 97866, "epoch": 582} {"train_loss": -9.425834655761719, "global_step": 97867, "epoch": 582} {"train_loss": -9.617583274841309, "global_step": 97868, "epoch": 582} {"train_loss": -9.400074005126953, "global_step": 97869, "epoch": 582} {"train_loss": -8.927835464477539, "global_step": 97870, "epoch": 582} {"train_loss": -9.523947715759277, "global_step": 97871, "epoch": 582} {"train_loss": -9.360769271850586, "global_step": 97872, "epoch": 582} {"train_loss": -9.478744506835938, "global_step": 97873, "epoch": 582} {"train_loss": -9.382866859436035, "global_step": 97874, "epoch": 582} {"train_loss": -9.640825271606445, "global_step": 97875, "epoch": 582} {"train_loss": -9.544811248779297, "global_step": 97876, "epoch": 582} {"train_loss": -9.816361427307129, "global_step": 97877, "epoch": 582} {"train_loss": -9.481069564819336, "global_step": 97878, "epoch": 582} {"train_loss": -9.566682815551758, "global_step": 97879, "epoch": 582} {"train_loss": -9.564491271972656, "global_step": 97880, "epoch": 582} {"train_loss": -9.822090148925781, "global_step": 97881, "epoch": 582} {"train_loss": -9.567548751831055, "global_step": 97882, "epoch": 582} {"train_loss": -9.4840087890625, "global_step": 97883, "epoch": 582} {"train_loss": -9.686033248901367, "global_step": 97884, "epoch": 582} {"train_loss": -9.58222770690918, "global_step": 97885, "epoch": 582} {"train_loss": -9.699239730834961, "global_step": 97886, "epoch": 582} {"train_loss": -9.692171096801758, "global_step": 97887, "epoch": 582} {"train_loss": -9.315621376037598, "global_step": 97888, "epoch": 582} {"train_loss": -9.785948753356934, "global_step": 97889, "epoch": 582} {"train_loss": -9.37823486328125, "global_step": 97890, "epoch": 582} {"train_loss": -9.627798080444336, "global_step": 97891, "epoch": 582} {"train_loss": -9.450368881225586, "global_step": 97892, "epoch": 582} {"train_loss": -9.687993049621582, "global_step": 97893, "epoch": 582} {"train_loss": -9.099411010742188, "global_step": 97894, "epoch": 582} {"train_loss": -9.573641777038574, "global_step": 97895, "epoch": 582} {"train_loss": -9.636106491088867, "global_step": 97896, "epoch": 582} {"train_loss": -9.520057678222656, "global_step": 97897, "epoch": 582} {"train_loss": -9.727248191833496, "global_step": 97898, "epoch": 582} {"train_loss": -9.596148490905762, "global_step": 97899, "epoch": 582} {"train_loss": -9.414323806762695, "global_step": 97900, "epoch": 582} {"train_loss": -9.36196517944336, "global_step": 97901, "epoch": 582} {"train_loss": -9.610176086425781, "global_step": 97902, "epoch": 582} {"train_loss": -9.320598602294922, "global_step": 97903, "epoch": 582} {"train_loss": -9.85973072052002, "global_step": 97904, "epoch": 582} {"train_loss": -9.344808578491211, "global_step": 97905, "epoch": 582} {"train_loss": -9.803704261779785, "global_step": 97906, "epoch": 582} {"train_loss": -9.795778274536133, "global_step": 97907, "epoch": 582} {"train_loss": -9.619815826416016, "global_step": 97908, "epoch": 582} {"train_loss": -9.669347763061523, "global_step": 97909, "epoch": 582} {"train_loss": -9.75917911529541, "global_step": 97910, "epoch": 582} {"train_loss": -9.638900756835938, "global_step": 97911, "epoch": 582} {"train_loss": -9.657524108886719, "global_step": 97912, "epoch": 582} {"train_loss": -9.607715606689453, "global_step": 97913, "epoch": 582} {"train_loss": -9.764759063720703, "global_step": 97914, "epoch": 582} {"train_loss": -9.543323516845703, "global_step": 97915, "epoch": 582} {"train_loss": -9.585428237915039, "global_step": 97916, "epoch": 582} {"train_loss": -9.543567657470703, "global_step": 97917, "epoch": 582} {"train_loss": -9.713427543640137, "global_step": 97918, "epoch": 582} {"train_loss": -9.564784049987793, "global_step": 97919, "epoch": 582} {"train_loss": -9.785074234008789, "global_step": 97920, "epoch": 582} {"train_loss": -9.63066291809082, "global_step": 97921, "epoch": 582} {"train_loss": -9.765607833862305, "global_step": 97922, "epoch": 582} {"train_loss": -9.586915016174316, "global_step": 97923, "epoch": 582} {"train_loss": -9.550737380981445, "global_step": 97924, "epoch": 582} {"train_loss": -9.572961807250977, "global_step": 97925, "epoch": 582} {"train_loss": -9.365428924560547, "global_step": 97926, "epoch": 582} {"train_loss": -9.55880355834961, "global_step": 97927, "epoch": 582} {"train_loss": -9.32254409790039, "global_step": 97928, "epoch": 582} {"train_loss": -9.385027885437012, "global_step": 97929, "epoch": 582} {"train_loss": -9.262956619262695, "global_step": 97930, "epoch": 582} {"train_loss": -9.60727596282959, "global_step": 97931, "epoch": 582} {"train_loss": -9.352987289428711, "global_step": 97932, "epoch": 582} {"train_loss": -9.670745849609375, "global_step": 97933, "epoch": 582} {"train_loss": -9.316141128540039, "global_step": 97934, "epoch": 582} {"train_loss": -9.268355369567871, "global_step": 97935, "epoch": 582} {"train_loss": -9.642302513122559, "global_step": 97936, "epoch": 582} {"train_loss": -9.505546569824219, "global_step": 97937, "epoch": 582} {"train_loss": -9.747941970825195, "global_step": 97938, "epoch": 582} {"train_loss": -9.64185905456543, "global_step": 97939, "epoch": 582} {"train_loss": -9.634407997131348, "global_step": 97940, "epoch": 582} {"train_loss": -9.561806678771973, "global_step": 97941, "epoch": 582} {"train_loss": -9.868824005126953, "global_step": 97942, "epoch": 582} {"train_loss": -9.564907891409737, "global_step": 97943, "epoch": 582, "val_loss": 207324.203125} {"train_loss": -9.778570175170898, "global_step": 97944, "epoch": 583} {"train_loss": -9.552803039550781, "global_step": 97945, "epoch": 583} {"train_loss": -9.562089920043945, "global_step": 97946, "epoch": 583} {"train_loss": -9.734546661376953, "global_step": 97947, "epoch": 583} {"train_loss": -9.879171371459961, "global_step": 97948, "epoch": 583} {"train_loss": -9.64702033996582, "global_step": 97949, "epoch": 583} {"train_loss": -9.630054473876953, "global_step": 97950, "epoch": 583} {"train_loss": -9.605646133422852, "global_step": 97951, "epoch": 583} {"train_loss": -9.659902572631836, "global_step": 97952, "epoch": 583} {"train_loss": -9.998985290527344, "global_step": 97953, "epoch": 583} {"train_loss": -9.695211410522461, "global_step": 97954, "epoch": 583} {"train_loss": -9.781607627868652, "global_step": 97955, "epoch": 583} {"train_loss": -10.027761459350586, "global_step": 97956, "epoch": 583} {"train_loss": -9.516634941101074, "global_step": 97957, "epoch": 583} {"train_loss": -9.861810684204102, "global_step": 97958, "epoch": 583} {"train_loss": -9.851874351501465, "global_step": 97959, "epoch": 583} {"train_loss": -9.539913177490234, "global_step": 97960, "epoch": 583} {"train_loss": -9.972867965698242, "global_step": 97961, "epoch": 583} {"train_loss": -9.567323684692383, "global_step": 97962, "epoch": 583} {"train_loss": -9.590002059936523, "global_step": 97963, "epoch": 583} {"train_loss": -9.896869659423828, "global_step": 97964, "epoch": 583} {"train_loss": -9.136656761169434, "global_step": 97965, "epoch": 583} {"train_loss": -9.566036224365234, "global_step": 97966, "epoch": 583} {"train_loss": -9.52710247039795, "global_step": 97967, "epoch": 583} {"train_loss": -9.613718032836914, "global_step": 97968, "epoch": 583} {"train_loss": -9.661598205566406, "global_step": 97969, "epoch": 583} {"train_loss": -9.807038307189941, "global_step": 97970, "epoch": 583} {"train_loss": -9.397429466247559, "global_step": 97971, "epoch": 583} {"train_loss": -9.952224731445312, "global_step": 97972, "epoch": 583} {"train_loss": -9.231325149536133, "global_step": 97973, "epoch": 583} {"train_loss": -9.74847412109375, "global_step": 97974, "epoch": 583} {"train_loss": -9.597513198852539, "global_step": 97975, "epoch": 583} {"train_loss": -9.723989486694336, "global_step": 97976, "epoch": 583} {"train_loss": -9.629853248596191, "global_step": 97977, "epoch": 583} {"train_loss": -9.351455688476562, "global_step": 97978, "epoch": 583} {"train_loss": -9.549503326416016, "global_step": 97979, "epoch": 583} {"train_loss": -9.479080200195312, "global_step": 97980, "epoch": 583} {"train_loss": -9.549983978271484, "global_step": 97981, "epoch": 583} {"train_loss": -9.367953300476074, "global_step": 97982, "epoch": 583} {"train_loss": -9.673965454101562, "global_step": 97983, "epoch": 583} {"train_loss": -9.308605194091797, "global_step": 97984, "epoch": 583} {"train_loss": -9.551496505737305, "global_step": 97985, "epoch": 583} {"train_loss": -9.537383079528809, "global_step": 97986, "epoch": 583} {"train_loss": -9.693166732788086, "global_step": 97987, "epoch": 583} {"train_loss": -9.537374496459961, "global_step": 97988, "epoch": 583} {"train_loss": -9.59030532836914, "global_step": 97989, "epoch": 583} {"train_loss": -9.793315887451172, "global_step": 97990, "epoch": 583} {"train_loss": -9.817570686340332, "global_step": 97991, "epoch": 583} {"train_loss": -9.751885414123535, "global_step": 97992, "epoch": 583} {"train_loss": -9.8541898727417, "global_step": 97993, "epoch": 583} {"train_loss": -9.405712127685547, "global_step": 97994, "epoch": 583} {"train_loss": -9.816518783569336, "global_step": 97995, "epoch": 583} {"train_loss": -9.790595054626465, "global_step": 97996, "epoch": 583} {"train_loss": -9.550130844116211, "global_step": 97997, "epoch": 583} {"train_loss": -9.645257949829102, "global_step": 97998, "epoch": 583} {"train_loss": -9.653271675109863, "global_step": 97999, "epoch": 583} {"train_loss": -9.802234649658203, "global_step": 98000, "epoch": 583} {"train_loss": -9.767450332641602, "global_step": 98001, "epoch": 583} {"train_loss": -9.767786026000977, "global_step": 98002, "epoch": 583} {"train_loss": -9.685434341430664, "global_step": 98003, "epoch": 583} {"train_loss": -9.880464553833008, "global_step": 98004, "epoch": 583} {"train_loss": -9.620346069335938, "global_step": 98005, "epoch": 583} {"train_loss": -9.78127670288086, "global_step": 98006, "epoch": 583} {"train_loss": -9.488861083984375, "global_step": 98007, "epoch": 583} {"train_loss": -9.848112106323242, "global_step": 98008, "epoch": 583} {"train_loss": -10.04957389831543, "global_step": 98009, "epoch": 583} {"train_loss": -9.576534271240234, "global_step": 98010, "epoch": 583} {"train_loss": -9.791919708251953, "global_step": 98011, "epoch": 583} {"train_loss": -9.803988456726074, "global_step": 98012, "epoch": 583} {"train_loss": -9.829059600830078, "global_step": 98013, "epoch": 583} {"train_loss": -9.763154983520508, "global_step": 98014, "epoch": 583} {"train_loss": -10.042471885681152, "global_step": 98015, "epoch": 583} {"train_loss": -9.685627937316895, "global_step": 98016, "epoch": 583} {"train_loss": -9.73420238494873, "global_step": 98017, "epoch": 583} {"train_loss": -9.617080688476562, "global_step": 98018, "epoch": 583} {"train_loss": -9.508548736572266, "global_step": 98019, "epoch": 583} {"train_loss": -9.486274719238281, "global_step": 98020, "epoch": 583} {"train_loss": -9.459932327270508, "global_step": 98021, "epoch": 583} {"train_loss": -9.236721992492676, "global_step": 98022, "epoch": 583} {"train_loss": -9.115293502807617, "global_step": 98023, "epoch": 583} {"train_loss": -9.631824493408203, "global_step": 98024, "epoch": 583} {"train_loss": -9.417659759521484, "global_step": 98025, "epoch": 583} {"train_loss": -9.52925968170166, "global_step": 98026, "epoch": 583} {"train_loss": -9.49930191040039, "global_step": 98027, "epoch": 583} {"train_loss": -9.37925910949707, "global_step": 98028, "epoch": 583} {"train_loss": -9.425071716308594, "global_step": 98029, "epoch": 583} {"train_loss": -9.30233383178711, "global_step": 98030, "epoch": 583} {"train_loss": -9.226094245910645, "global_step": 98031, "epoch": 583} {"train_loss": -9.555707931518555, "global_step": 98032, "epoch": 583} {"train_loss": -9.487140655517578, "global_step": 98033, "epoch": 583} {"train_loss": -9.255484580993652, "global_step": 98034, "epoch": 583} {"train_loss": -9.22303581237793, "global_step": 98035, "epoch": 583} {"train_loss": -9.577465057373047, "global_step": 98036, "epoch": 583} {"train_loss": -9.392080307006836, "global_step": 98037, "epoch": 583} {"train_loss": -9.447731018066406, "global_step": 98038, "epoch": 583} {"train_loss": -9.601692199707031, "global_step": 98039, "epoch": 583} {"train_loss": -9.526811599731445, "global_step": 98040, "epoch": 583} {"train_loss": -9.419644355773926, "global_step": 98041, "epoch": 583} {"train_loss": -9.762748718261719, "global_step": 98042, "epoch": 583} {"train_loss": -9.415648460388184, "global_step": 98043, "epoch": 583} {"train_loss": -9.496515274047852, "global_step": 98044, "epoch": 583} {"train_loss": -9.586316108703613, "global_step": 98045, "epoch": 583} {"train_loss": -9.851238250732422, "global_step": 98046, "epoch": 583} {"train_loss": -9.377918243408203, "global_step": 98047, "epoch": 583} {"train_loss": -9.755937576293945, "global_step": 98048, "epoch": 583} {"train_loss": -9.66939640045166, "global_step": 98049, "epoch": 583} {"train_loss": -9.651272773742676, "global_step": 98050, "epoch": 583} {"train_loss": -9.512843132019043, "global_step": 98051, "epoch": 583} {"train_loss": -9.450779914855957, "global_step": 98052, "epoch": 583} {"train_loss": -9.790460586547852, "global_step": 98053, "epoch": 583} {"train_loss": -9.510586738586426, "global_step": 98054, "epoch": 583} {"train_loss": -9.616720199584961, "global_step": 98055, "epoch": 583} {"train_loss": -9.605966567993164, "global_step": 98056, "epoch": 583} {"train_loss": -9.745454788208008, "global_step": 98057, "epoch": 583} {"train_loss": -9.477376937866211, "global_step": 98058, "epoch": 583} {"train_loss": -9.757186889648438, "global_step": 98059, "epoch": 583} {"train_loss": -9.704402923583984, "global_step": 98060, "epoch": 583} {"train_loss": -9.834417343139648, "global_step": 98061, "epoch": 583} {"train_loss": -9.509306907653809, "global_step": 98062, "epoch": 583} {"train_loss": -9.64723014831543, "global_step": 98063, "epoch": 583} {"train_loss": -9.317676544189453, "global_step": 98064, "epoch": 583} {"train_loss": -9.365760803222656, "global_step": 98065, "epoch": 583} {"train_loss": -9.495031356811523, "global_step": 98066, "epoch": 583} {"train_loss": -9.616836547851562, "global_step": 98067, "epoch": 583} {"train_loss": -9.487449645996094, "global_step": 98068, "epoch": 583} {"train_loss": -9.515196800231934, "global_step": 98069, "epoch": 583} {"train_loss": -8.892435073852539, "global_step": 98070, "epoch": 583} {"train_loss": -9.192474365234375, "global_step": 98071, "epoch": 583} {"train_loss": -9.384867668151855, "global_step": 98072, "epoch": 583} {"train_loss": -8.659948348999023, "global_step": 98073, "epoch": 583} {"train_loss": -9.417842864990234, "global_step": 98074, "epoch": 583} {"train_loss": -8.753547668457031, "global_step": 98075, "epoch": 583} {"train_loss": -9.135623931884766, "global_step": 98076, "epoch": 583} {"train_loss": -9.199382781982422, "global_step": 98077, "epoch": 583} {"train_loss": -9.070542335510254, "global_step": 98078, "epoch": 583} {"train_loss": -9.269697189331055, "global_step": 98079, "epoch": 583} {"train_loss": -9.022403717041016, "global_step": 98080, "epoch": 583} {"train_loss": -9.260289192199707, "global_step": 98081, "epoch": 583} {"train_loss": -9.329180717468262, "global_step": 98082, "epoch": 583} {"train_loss": -9.30501651763916, "global_step": 98083, "epoch": 583} {"train_loss": -9.376367568969727, "global_step": 98084, "epoch": 583} {"train_loss": -9.53181266784668, "global_step": 98085, "epoch": 583} {"train_loss": -9.428496360778809, "global_step": 98086, "epoch": 583} {"train_loss": -9.304468154907227, "global_step": 98087, "epoch": 583} {"train_loss": -9.26218032836914, "global_step": 98088, "epoch": 583} {"train_loss": -9.469620704650879, "global_step": 98089, "epoch": 583} {"train_loss": -9.35481071472168, "global_step": 98090, "epoch": 583} {"train_loss": -9.294239044189453, "global_step": 98091, "epoch": 583} {"train_loss": -9.059635162353516, "global_step": 98092, "epoch": 583} {"train_loss": -9.415159225463867, "global_step": 98093, "epoch": 583} {"train_loss": -9.136775016784668, "global_step": 98094, "epoch": 583} {"train_loss": -9.085220336914062, "global_step": 98095, "epoch": 583} {"train_loss": -9.372047424316406, "global_step": 98096, "epoch": 583} {"train_loss": -9.216712951660156, "global_step": 98097, "epoch": 583} {"train_loss": -9.406306266784668, "global_step": 98098, "epoch": 583} {"train_loss": -9.595159530639648, "global_step": 98099, "epoch": 583} {"train_loss": -9.31067180633545, "global_step": 98100, "epoch": 583} {"train_loss": -9.447637557983398, "global_step": 98101, "epoch": 583} {"train_loss": -9.58293342590332, "global_step": 98102, "epoch": 583} {"train_loss": -9.408958435058594, "global_step": 98103, "epoch": 583} {"train_loss": -9.451026916503906, "global_step": 98104, "epoch": 583} {"train_loss": -9.657073974609375, "global_step": 98105, "epoch": 583} {"train_loss": -9.61077880859375, "global_step": 98106, "epoch": 583} {"train_loss": -9.755752563476562, "global_step": 98107, "epoch": 583} {"train_loss": -9.747207641601562, "global_step": 98108, "epoch": 583} {"train_loss": -9.85820198059082, "global_step": 98109, "epoch": 583} {"train_loss": -9.708223342895508, "global_step": 98110, "epoch": 583} {"train_loss": -9.543119759786697, "global_step": 98111, "epoch": 583, "val_loss": 205716.890625} {"train_loss": -9.786173820495605, "global_step": 98112, "epoch": 584} {"train_loss": -9.734315872192383, "global_step": 98113, "epoch": 584} {"train_loss": -9.600249290466309, "global_step": 98114, "epoch": 584} {"train_loss": -9.641191482543945, "global_step": 98115, "epoch": 584} {"train_loss": -9.720181465148926, "global_step": 98116, "epoch": 584} {"train_loss": -9.860918998718262, "global_step": 98117, "epoch": 584} {"train_loss": -9.808172225952148, "global_step": 98118, "epoch": 584} {"train_loss": -9.59577751159668, "global_step": 98119, "epoch": 584} {"train_loss": -9.565156936645508, "global_step": 98120, "epoch": 584} {"train_loss": -9.344923973083496, "global_step": 98121, "epoch": 584} {"train_loss": -9.510612487792969, "global_step": 98122, "epoch": 584} {"train_loss": -9.492145538330078, "global_step": 98123, "epoch": 584} {"train_loss": -9.805164337158203, "global_step": 98124, "epoch": 584} {"train_loss": -9.4366455078125, "global_step": 98125, "epoch": 584} {"train_loss": -9.784469604492188, "global_step": 98126, "epoch": 584} {"train_loss": -9.596899032592773, "global_step": 98127, "epoch": 584} {"train_loss": -9.913187026977539, "global_step": 98128, "epoch": 584} {"train_loss": -9.713374137878418, "global_step": 98129, "epoch": 584} {"train_loss": -9.650020599365234, "global_step": 98130, "epoch": 584} {"train_loss": -9.672712326049805, "global_step": 98131, "epoch": 584} {"train_loss": -9.84000015258789, "global_step": 98132, "epoch": 584} {"train_loss": -9.655736923217773, "global_step": 98133, "epoch": 584} {"train_loss": -9.761495590209961, "global_step": 98134, "epoch": 584} {"train_loss": -9.763581275939941, "global_step": 98135, "epoch": 584} {"train_loss": -9.483234405517578, "global_step": 98136, "epoch": 584} {"train_loss": -9.681713104248047, "global_step": 98137, "epoch": 584} {"train_loss": -9.693794250488281, "global_step": 98138, "epoch": 584} {"train_loss": -9.676711082458496, "global_step": 98139, "epoch": 584} {"train_loss": -9.931707382202148, "global_step": 98140, "epoch": 584} {"train_loss": -9.698064804077148, "global_step": 98141, "epoch": 584} {"train_loss": -9.742622375488281, "global_step": 98142, "epoch": 584} {"train_loss": -9.865234375, "global_step": 98143, "epoch": 584} {"train_loss": -9.599757194519043, "global_step": 98144, "epoch": 584} {"train_loss": -9.76340389251709, "global_step": 98145, "epoch": 584} {"train_loss": -9.466062545776367, "global_step": 98146, "epoch": 584} {"train_loss": -9.67885971069336, "global_step": 98147, "epoch": 584} {"train_loss": -9.505487442016602, "global_step": 98148, "epoch": 584} {"train_loss": -9.79196548461914, "global_step": 98149, "epoch": 584} {"train_loss": -9.503039360046387, "global_step": 98150, "epoch": 584} {"train_loss": -9.736665725708008, "global_step": 98151, "epoch": 584} {"train_loss": -9.45309829711914, "global_step": 98152, "epoch": 584} {"train_loss": -9.806001663208008, "global_step": 98153, "epoch": 584} {"train_loss": -9.537906646728516, "global_step": 98154, "epoch": 584} {"train_loss": -9.583074569702148, "global_step": 98155, "epoch": 584} {"train_loss": -9.647639274597168, "global_step": 98156, "epoch": 584} {"train_loss": -9.488239288330078, "global_step": 98157, "epoch": 584} {"train_loss": -9.660310745239258, "global_step": 98158, "epoch": 584} {"train_loss": -9.541460037231445, "global_step": 98159, "epoch": 584} {"train_loss": -9.717462539672852, "global_step": 98160, "epoch": 584} {"train_loss": -9.526840209960938, "global_step": 98161, "epoch": 584} {"train_loss": -9.872001647949219, "global_step": 98162, "epoch": 584} {"train_loss": -9.722578048706055, "global_step": 98163, "epoch": 584} {"train_loss": -9.505239486694336, "global_step": 98164, "epoch": 584} {"train_loss": -9.522743225097656, "global_step": 98165, "epoch": 584} {"train_loss": -9.188844680786133, "global_step": 98166, "epoch": 584} {"train_loss": -9.70679759979248, "global_step": 98167, "epoch": 584} {"train_loss": -9.273478507995605, "global_step": 98168, "epoch": 584} {"train_loss": -9.190324783325195, "global_step": 98169, "epoch": 584} {"train_loss": -9.602975845336914, "global_step": 98170, "epoch": 584} {"train_loss": -9.383021354675293, "global_step": 98171, "epoch": 584} {"train_loss": -9.777655601501465, "global_step": 98172, "epoch": 584} {"train_loss": -9.81384563446045, "global_step": 98173, "epoch": 584} {"train_loss": -9.365339279174805, "global_step": 98174, "epoch": 584} {"train_loss": -9.461971282958984, "global_step": 98175, "epoch": 584} {"train_loss": -9.491471290588379, "global_step": 98176, "epoch": 584} {"train_loss": -9.463767051696777, "global_step": 98177, "epoch": 584} {"train_loss": -9.672861099243164, "global_step": 98178, "epoch": 584} {"train_loss": -9.234521865844727, "global_step": 98179, "epoch": 584} {"train_loss": -9.624860763549805, "global_step": 98180, "epoch": 584} {"train_loss": -9.079804420471191, "global_step": 98181, "epoch": 584} {"train_loss": -9.682334899902344, "global_step": 98182, "epoch": 584} {"train_loss": -9.746222496032715, "global_step": 98183, "epoch": 584} {"train_loss": -9.7445068359375, "global_step": 98184, "epoch": 584} {"train_loss": -9.511758804321289, "global_step": 98185, "epoch": 584} {"train_loss": -9.592398643493652, "global_step": 98186, "epoch": 584} {"train_loss": -9.637550354003906, "global_step": 98187, "epoch": 584} {"train_loss": -9.707056999206543, "global_step": 98188, "epoch": 584} {"train_loss": -9.618324279785156, "global_step": 98189, "epoch": 584} {"train_loss": -9.489456176757812, "global_step": 98190, "epoch": 584} {"train_loss": -10.0158052444458, "global_step": 98191, "epoch": 584} {"train_loss": -9.499269485473633, "global_step": 98192, "epoch": 584} {"train_loss": -9.521782875061035, "global_step": 98193, "epoch": 584} {"train_loss": -9.72769546508789, "global_step": 98194, "epoch": 584} {"train_loss": -9.560798645019531, "global_step": 98195, "epoch": 584} {"train_loss": -9.967855453491211, "global_step": 98196, "epoch": 584} {"train_loss": -9.70132064819336, "global_step": 98197, "epoch": 584} {"train_loss": -9.648786544799805, "global_step": 98198, "epoch": 584} {"train_loss": -9.577346801757812, "global_step": 98199, "epoch": 584} {"train_loss": -9.452939987182617, "global_step": 98200, "epoch": 584} {"train_loss": -9.965307235717773, "global_step": 98201, "epoch": 584} {"train_loss": -9.484445571899414, "global_step": 98202, "epoch": 584} {"train_loss": -9.781463623046875, "global_step": 98203, "epoch": 584} {"train_loss": -9.50783920288086, "global_step": 98204, "epoch": 584} {"train_loss": -9.848530769348145, "global_step": 98205, "epoch": 584} {"train_loss": -9.895772933959961, "global_step": 98206, "epoch": 584} {"train_loss": -9.986286163330078, "global_step": 98207, "epoch": 584} {"train_loss": -9.205570220947266, "global_step": 98208, "epoch": 584} {"train_loss": -9.438053131103516, "global_step": 98209, "epoch": 584} {"train_loss": -8.628185272216797, "global_step": 98210, "epoch": 584} {"train_loss": -9.315434455871582, "global_step": 98211, "epoch": 584} {"train_loss": -8.520328521728516, "global_step": 98212, "epoch": 584} {"train_loss": -9.1652250289917, "global_step": 98213, "epoch": 584} {"train_loss": -9.068307876586914, "global_step": 98214, "epoch": 584} {"train_loss": -9.142029762268066, "global_step": 98215, "epoch": 584} {"train_loss": -8.750802993774414, "global_step": 98216, "epoch": 584} {"train_loss": -9.542946815490723, "global_step": 98217, "epoch": 584} {"train_loss": -9.3794527053833, "global_step": 98218, "epoch": 584} {"train_loss": -9.359689712524414, "global_step": 98219, "epoch": 584} {"train_loss": -9.401664733886719, "global_step": 98220, "epoch": 584} {"train_loss": -9.466634750366211, "global_step": 98221, "epoch": 584} {"train_loss": -9.35551643371582, "global_step": 98222, "epoch": 584} {"train_loss": -9.394706726074219, "global_step": 98223, "epoch": 584} {"train_loss": -9.64140510559082, "global_step": 98224, "epoch": 584} {"train_loss": -9.347423553466797, "global_step": 98225, "epoch": 584} {"train_loss": -9.343636512756348, "global_step": 98226, "epoch": 584} {"train_loss": -9.561765670776367, "global_step": 98227, "epoch": 584} {"train_loss": -9.651365280151367, "global_step": 98228, "epoch": 584} {"train_loss": -9.620484352111816, "global_step": 98229, "epoch": 584} {"train_loss": -9.622762680053711, "global_step": 98230, "epoch": 584} {"train_loss": -9.708120346069336, "global_step": 98231, "epoch": 584} {"train_loss": -9.325489044189453, "global_step": 98232, "epoch": 584} {"train_loss": -9.66689682006836, "global_step": 98233, "epoch": 584} {"train_loss": -9.53024959564209, "global_step": 98234, "epoch": 584} {"train_loss": -9.536062240600586, "global_step": 98235, "epoch": 584} {"train_loss": -9.195892333984375, "global_step": 98236, "epoch": 584} {"train_loss": -9.649165153503418, "global_step": 98237, "epoch": 584} {"train_loss": -9.28797721862793, "global_step": 98238, "epoch": 584} {"train_loss": -9.407553672790527, "global_step": 98239, "epoch": 584} {"train_loss": -9.536100387573242, "global_step": 98240, "epoch": 584} {"train_loss": -9.376728057861328, "global_step": 98241, "epoch": 584} {"train_loss": -9.62164306640625, "global_step": 98242, "epoch": 584} {"train_loss": -9.80816650390625, "global_step": 98243, "epoch": 584} {"train_loss": -9.822502136230469, "global_step": 98244, "epoch": 584} {"train_loss": -9.653386116027832, "global_step": 98245, "epoch": 584} {"train_loss": -9.848220825195312, "global_step": 98246, "epoch": 584} {"train_loss": -9.903413772583008, "global_step": 98247, "epoch": 584} {"train_loss": -9.821700096130371, "global_step": 98248, "epoch": 584} {"train_loss": -9.453802108764648, "global_step": 98249, "epoch": 584} {"train_loss": -9.788006782531738, "global_step": 98250, "epoch": 584} {"train_loss": -9.647284507751465, "global_step": 98251, "epoch": 584} {"train_loss": -9.462844848632812, "global_step": 98252, "epoch": 584} {"train_loss": -9.632848739624023, "global_step": 98253, "epoch": 584} {"train_loss": -9.734095573425293, "global_step": 98254, "epoch": 584} {"train_loss": -9.658549308776855, "global_step": 98255, "epoch": 584} {"train_loss": -9.598403930664062, "global_step": 98256, "epoch": 584} {"train_loss": -9.549856185913086, "global_step": 98257, "epoch": 584} {"train_loss": -9.592148780822754, "global_step": 98258, "epoch": 584} {"train_loss": -9.631595611572266, "global_step": 98259, "epoch": 584} {"train_loss": -9.641912460327148, "global_step": 98260, "epoch": 584} {"train_loss": -9.56704330444336, "global_step": 98261, "epoch": 584} {"train_loss": -9.665855407714844, "global_step": 98262, "epoch": 584} {"train_loss": -9.540950775146484, "global_step": 98263, "epoch": 584} {"train_loss": -9.380289077758789, "global_step": 98264, "epoch": 584} {"train_loss": -9.453535079956055, "global_step": 98265, "epoch": 584} {"train_loss": -9.268585205078125, "global_step": 98266, "epoch": 584} {"train_loss": -9.48095703125, "global_step": 98267, "epoch": 584} {"train_loss": -9.460216522216797, "global_step": 98268, "epoch": 584} {"train_loss": -9.613798141479492, "global_step": 98269, "epoch": 584} {"train_loss": -9.417840957641602, "global_step": 98270, "epoch": 584} {"train_loss": -9.37272834777832, "global_step": 98271, "epoch": 584} {"train_loss": -9.379459381103516, "global_step": 98272, "epoch": 584} {"train_loss": -9.751178741455078, "global_step": 98273, "epoch": 584} {"train_loss": -9.613486289978027, "global_step": 98274, "epoch": 584} {"train_loss": -9.45849323272705, "global_step": 98275, "epoch": 584} {"train_loss": -9.553346633911133, "global_step": 98276, "epoch": 584} {"train_loss": -9.123788833618164, "global_step": 98277, "epoch": 584} {"train_loss": -9.597808837890625, "global_step": 98278, "epoch": 584} {"train_loss": -9.566022435824076, "global_step": 98279, "epoch": 584, "val_loss": 206503.453125} {"train_loss": -9.676675796508789, "global_step": 98280, "epoch": 585} {"train_loss": -9.722007751464844, "global_step": 98281, "epoch": 585} {"train_loss": -9.69179916381836, "global_step": 98282, "epoch": 585} {"train_loss": -9.558253288269043, "global_step": 98283, "epoch": 585} {"train_loss": -9.58953857421875, "global_step": 98284, "epoch": 585} {"train_loss": -9.569504737854004, "global_step": 98285, "epoch": 585} {"train_loss": -9.429666519165039, "global_step": 98286, "epoch": 585} {"train_loss": -9.557165145874023, "global_step": 98287, "epoch": 585} {"train_loss": -9.451652526855469, "global_step": 98288, "epoch": 585} {"train_loss": -9.510461807250977, "global_step": 98289, "epoch": 585} {"train_loss": -9.494169235229492, "global_step": 98290, "epoch": 585} {"train_loss": -9.720121383666992, "global_step": 98291, "epoch": 585} {"train_loss": -9.604738235473633, "global_step": 98292, "epoch": 585} {"train_loss": -9.59748649597168, "global_step": 98293, "epoch": 585} {"train_loss": -9.613746643066406, "global_step": 98294, "epoch": 585} {"train_loss": -9.643049240112305, "global_step": 98295, "epoch": 585} {"train_loss": -9.87007999420166, "global_step": 98296, "epoch": 585} {"train_loss": -9.629084587097168, "global_step": 98297, "epoch": 585} {"train_loss": -9.8195161819458, "global_step": 98298, "epoch": 585} {"train_loss": -9.570886611938477, "global_step": 98299, "epoch": 585} {"train_loss": -9.578670501708984, "global_step": 98300, "epoch": 585} {"train_loss": -9.37276554107666, "global_step": 98301, "epoch": 585} {"train_loss": -9.707544326782227, "global_step": 98302, "epoch": 585} {"train_loss": -9.990995407104492, "global_step": 98303, "epoch": 585} {"train_loss": -9.824602127075195, "global_step": 98304, "epoch": 585} {"train_loss": -9.798971176147461, "global_step": 98305, "epoch": 585} {"train_loss": -9.675370216369629, "global_step": 98306, "epoch": 585} {"train_loss": -10.008894920349121, "global_step": 98307, "epoch": 585} {"train_loss": -9.678747177124023, "global_step": 98308, "epoch": 585} {"train_loss": -9.651154518127441, "global_step": 98309, "epoch": 585} {"train_loss": -9.757730484008789, "global_step": 98310, "epoch": 585} {"train_loss": -9.496408462524414, "global_step": 98311, "epoch": 585} {"train_loss": -9.76909065246582, "global_step": 98312, "epoch": 585} {"train_loss": -9.473587036132812, "global_step": 98313, "epoch": 585} {"train_loss": -9.256914138793945, "global_step": 98314, "epoch": 585} {"train_loss": -9.649662017822266, "global_step": 98315, "epoch": 585} {"train_loss": -9.71650505065918, "global_step": 98316, "epoch": 585} {"train_loss": -9.34321403503418, "global_step": 98317, "epoch": 585} {"train_loss": -9.624567985534668, "global_step": 98318, "epoch": 585} {"train_loss": -9.607616424560547, "global_step": 98319, "epoch": 585} {"train_loss": -9.811984062194824, "global_step": 98320, "epoch": 585} {"train_loss": -9.495466232299805, "global_step": 98321, "epoch": 585} {"train_loss": -9.700252532958984, "global_step": 98322, "epoch": 585} {"train_loss": -9.649085998535156, "global_step": 98323, "epoch": 585} {"train_loss": -10.003092765808105, "global_step": 98324, "epoch": 585} {"train_loss": -9.51661491394043, "global_step": 98325, "epoch": 585} {"train_loss": -9.860025405883789, "global_step": 98326, "epoch": 585} {"train_loss": -9.085878372192383, "global_step": 98327, "epoch": 585} {"train_loss": -9.626254081726074, "global_step": 98328, "epoch": 585} {"train_loss": -9.347423553466797, "global_step": 98329, "epoch": 585} {"train_loss": -9.195919036865234, "global_step": 98330, "epoch": 585} {"train_loss": -8.906819343566895, "global_step": 98331, "epoch": 585} {"train_loss": -9.607196807861328, "global_step": 98332, "epoch": 585} {"train_loss": -8.603811264038086, "global_step": 98333, "epoch": 585} {"train_loss": -9.456514358520508, "global_step": 98334, "epoch": 585} {"train_loss": -9.115195274353027, "global_step": 98335, "epoch": 585} {"train_loss": -9.314032554626465, "global_step": 98336, "epoch": 585} {"train_loss": -9.415048599243164, "global_step": 98337, "epoch": 585} {"train_loss": -9.3561429977417, "global_step": 98338, "epoch": 585} {"train_loss": -9.269842147827148, "global_step": 98339, "epoch": 585} {"train_loss": -9.391067504882812, "global_step": 98340, "epoch": 585} {"train_loss": -9.43781566619873, "global_step": 98341, "epoch": 585} {"train_loss": -9.54126262664795, "global_step": 98342, "epoch": 585} {"train_loss": -9.239542007446289, "global_step": 98343, "epoch": 585} {"train_loss": -9.535567283630371, "global_step": 98344, "epoch": 585} {"train_loss": -9.198741912841797, "global_step": 98345, "epoch": 585} {"train_loss": -9.316781997680664, "global_step": 98346, "epoch": 585} {"train_loss": -9.28845500946045, "global_step": 98347, "epoch": 585} {"train_loss": -9.3907470703125, "global_step": 98348, "epoch": 585} {"train_loss": -9.538287162780762, "global_step": 98349, "epoch": 585} {"train_loss": -9.415468215942383, "global_step": 98350, "epoch": 585} {"train_loss": -9.592995643615723, "global_step": 98351, "epoch": 585} {"train_loss": -9.447172164916992, "global_step": 98352, "epoch": 585} {"train_loss": -9.577515602111816, "global_step": 98353, "epoch": 585} {"train_loss": -9.403976440429688, "global_step": 98354, "epoch": 585} {"train_loss": -9.471320152282715, "global_step": 98355, "epoch": 585} {"train_loss": -9.476016998291016, "global_step": 98356, "epoch": 585} {"train_loss": -9.396907806396484, "global_step": 98357, "epoch": 585} {"train_loss": -9.74090576171875, "global_step": 98358, "epoch": 585} {"train_loss": -9.704290390014648, "global_step": 98359, "epoch": 585} {"train_loss": -9.691608428955078, "global_step": 98360, "epoch": 585} {"train_loss": -9.664362907409668, "global_step": 98361, "epoch": 585} {"train_loss": -9.714042663574219, "global_step": 98362, "epoch": 585} {"train_loss": -9.496003150939941, "global_step": 98363, "epoch": 585} {"train_loss": -9.789205551147461, "global_step": 98364, "epoch": 585} {"train_loss": -9.720291137695312, "global_step": 98365, "epoch": 585} {"train_loss": -9.790716171264648, "global_step": 98366, "epoch": 585} {"train_loss": -9.301713943481445, "global_step": 98367, "epoch": 585} {"train_loss": -9.925230979919434, "global_step": 98368, "epoch": 585} {"train_loss": -9.607086181640625, "global_step": 98369, "epoch": 585} {"train_loss": -9.707540512084961, "global_step": 98370, "epoch": 585} {"train_loss": -9.766820907592773, "global_step": 98371, "epoch": 585} {"train_loss": -9.804268836975098, "global_step": 98372, "epoch": 585} {"train_loss": -9.77414321899414, "global_step": 98373, "epoch": 585} {"train_loss": -9.868267059326172, "global_step": 98374, "epoch": 585} {"train_loss": -9.860121726989746, "global_step": 98375, "epoch": 585} {"train_loss": -9.514822006225586, "global_step": 98376, "epoch": 585} {"train_loss": -9.694132804870605, "global_step": 98377, "epoch": 585} {"train_loss": -9.63400936126709, "global_step": 98378, "epoch": 585} {"train_loss": -9.988526344299316, "global_step": 98379, "epoch": 585} {"train_loss": -9.494616508483887, "global_step": 98380, "epoch": 585} {"train_loss": -10.106608390808105, "global_step": 98381, "epoch": 585} {"train_loss": -9.617119789123535, "global_step": 98382, "epoch": 585} {"train_loss": -9.803117752075195, "global_step": 98383, "epoch": 585} {"train_loss": -9.384340286254883, "global_step": 98384, "epoch": 585} {"train_loss": -9.535232543945312, "global_step": 98385, "epoch": 585} {"train_loss": -9.741886138916016, "global_step": 98386, "epoch": 585} {"train_loss": -9.89214038848877, "global_step": 98387, "epoch": 585} {"train_loss": -9.175052642822266, "global_step": 98388, "epoch": 585} {"train_loss": -9.531898498535156, "global_step": 98389, "epoch": 585} {"train_loss": -9.69064998626709, "global_step": 98390, "epoch": 585} {"train_loss": -9.549148559570312, "global_step": 98391, "epoch": 585} {"train_loss": -9.738420486450195, "global_step": 98392, "epoch": 585} {"train_loss": -9.463102340698242, "global_step": 98393, "epoch": 585} {"train_loss": -9.903451919555664, "global_step": 98394, "epoch": 585} {"train_loss": -9.496541023254395, "global_step": 98395, "epoch": 585} {"train_loss": -9.814311981201172, "global_step": 98396, "epoch": 585} {"train_loss": -9.644500732421875, "global_step": 98397, "epoch": 585} {"train_loss": -9.751002311706543, "global_step": 98398, "epoch": 585} {"train_loss": -9.549339294433594, "global_step": 98399, "epoch": 585} {"train_loss": -9.825254440307617, "global_step": 98400, "epoch": 585} {"train_loss": -9.805375099182129, "global_step": 98401, "epoch": 585} {"train_loss": -9.972253799438477, "global_step": 98402, "epoch": 585} {"train_loss": -9.595775604248047, "global_step": 98403, "epoch": 585} {"train_loss": -9.811097145080566, "global_step": 98404, "epoch": 585} {"train_loss": -9.870128631591797, "global_step": 98405, "epoch": 585} {"train_loss": -9.671409606933594, "global_step": 98406, "epoch": 585} {"train_loss": -9.856535911560059, "global_step": 98407, "epoch": 585} {"train_loss": -9.650239944458008, "global_step": 98408, "epoch": 585} {"train_loss": -9.50585651397705, "global_step": 98409, "epoch": 585} {"train_loss": -9.694862365722656, "global_step": 98410, "epoch": 585} {"train_loss": -9.416481971740723, "global_step": 98411, "epoch": 585} {"train_loss": -9.84002685546875, "global_step": 98412, "epoch": 585} {"train_loss": -9.136828422546387, "global_step": 98413, "epoch": 585} {"train_loss": -9.65816879272461, "global_step": 98414, "epoch": 585} {"train_loss": -9.631221771240234, "global_step": 98415, "epoch": 585} {"train_loss": -9.31070327758789, "global_step": 98416, "epoch": 585} {"train_loss": -9.726238250732422, "global_step": 98417, "epoch": 585} {"train_loss": -9.513448715209961, "global_step": 98418, "epoch": 585} {"train_loss": -9.785085678100586, "global_step": 98419, "epoch": 585} {"train_loss": -9.684310913085938, "global_step": 98420, "epoch": 585} {"train_loss": -9.24556827545166, "global_step": 98421, "epoch": 585} {"train_loss": -9.546442031860352, "global_step": 98422, "epoch": 585} {"train_loss": -9.507617950439453, "global_step": 98423, "epoch": 585} {"train_loss": -9.698169708251953, "global_step": 98424, "epoch": 585} {"train_loss": -9.52842903137207, "global_step": 98425, "epoch": 585} {"train_loss": -9.355352401733398, "global_step": 98426, "epoch": 585} {"train_loss": -9.50539493560791, "global_step": 98427, "epoch": 585} {"train_loss": -9.605340957641602, "global_step": 98428, "epoch": 585} {"train_loss": -9.184433937072754, "global_step": 98429, "epoch": 585} {"train_loss": -9.531720161437988, "global_step": 98430, "epoch": 585} {"train_loss": -9.075102806091309, "global_step": 98431, "epoch": 585} {"train_loss": -9.445480346679688, "global_step": 98432, "epoch": 585} {"train_loss": -9.617241859436035, "global_step": 98433, "epoch": 585} {"train_loss": -9.579297065734863, "global_step": 98434, "epoch": 585} {"train_loss": -9.707168579101562, "global_step": 98435, "epoch": 585} {"train_loss": -9.57880973815918, "global_step": 98436, "epoch": 585} {"train_loss": -9.597414016723633, "global_step": 98437, "epoch": 585} {"train_loss": -9.445478439331055, "global_step": 98438, "epoch": 585} {"train_loss": -9.580549240112305, "global_step": 98439, "epoch": 585} {"train_loss": -9.701797485351562, "global_step": 98440, "epoch": 585} {"train_loss": -9.578096389770508, "global_step": 98441, "epoch": 585} {"train_loss": -9.845544815063477, "global_step": 98442, "epoch": 585} {"train_loss": -9.741565704345703, "global_step": 98443, "epoch": 585} {"train_loss": -9.786508560180664, "global_step": 98444, "epoch": 585} {"train_loss": -9.709100723266602, "global_step": 98445, "epoch": 585} {"train_loss": -9.661214828491211, "global_step": 98446, "epoch": 585} {"train_loss": -9.589093702180046, "global_step": 98447, "epoch": 585, "val_loss": 206808.90625, "train_action_mse_error": 4.662440299987793} {"train_loss": -9.766874313354492, "global_step": 98448, "epoch": 586} {"train_loss": -9.830772399902344, "global_step": 98449, "epoch": 586} {"train_loss": -9.789578437805176, "global_step": 98450, "epoch": 586} {"train_loss": -9.741523742675781, "global_step": 98451, "epoch": 586} {"train_loss": -9.530172348022461, "global_step": 98452, "epoch": 586} {"train_loss": -9.887372970581055, "global_step": 98453, "epoch": 586} {"train_loss": -9.679374694824219, "global_step": 98454, "epoch": 586} {"train_loss": -9.778341293334961, "global_step": 98455, "epoch": 586} {"train_loss": -9.614046096801758, "global_step": 98456, "epoch": 586} {"train_loss": -9.485692024230957, "global_step": 98457, "epoch": 586} {"train_loss": -9.848158836364746, "global_step": 98458, "epoch": 586} {"train_loss": -9.674602508544922, "global_step": 98459, "epoch": 586} {"train_loss": -10.071660995483398, "global_step": 98460, "epoch": 586} {"train_loss": -9.609524726867676, "global_step": 98461, "epoch": 586} {"train_loss": -9.699751853942871, "global_step": 98462, "epoch": 586} {"train_loss": -9.432950973510742, "global_step": 98463, "epoch": 586} {"train_loss": -9.59632682800293, "global_step": 98464, "epoch": 586} {"train_loss": -9.699167251586914, "global_step": 98465, "epoch": 586} {"train_loss": -9.539146423339844, "global_step": 98466, "epoch": 586} {"train_loss": -9.772951126098633, "global_step": 98467, "epoch": 586} {"train_loss": -9.675674438476562, "global_step": 98468, "epoch": 586} {"train_loss": -9.633684158325195, "global_step": 98469, "epoch": 586} {"train_loss": -9.764034271240234, "global_step": 98470, "epoch": 586} {"train_loss": -9.668037414550781, "global_step": 98471, "epoch": 586} {"train_loss": -9.929425239562988, "global_step": 98472, "epoch": 586} {"train_loss": -9.725460052490234, "global_step": 98473, "epoch": 586} {"train_loss": -9.652471542358398, "global_step": 98474, "epoch": 586} {"train_loss": -9.596972465515137, "global_step": 98475, "epoch": 586} {"train_loss": -9.764892578125, "global_step": 98476, "epoch": 586} {"train_loss": -9.675800323486328, "global_step": 98477, "epoch": 586} {"train_loss": -9.497727394104004, "global_step": 98478, "epoch": 586} {"train_loss": -9.875290870666504, "global_step": 98479, "epoch": 586} {"train_loss": -9.521224975585938, "global_step": 98480, "epoch": 586} {"train_loss": -9.854022979736328, "global_step": 98481, "epoch": 586} {"train_loss": -9.51541519165039, "global_step": 98482, "epoch": 586} {"train_loss": -9.528799057006836, "global_step": 98483, "epoch": 586} {"train_loss": -9.692740440368652, "global_step": 98484, "epoch": 586} {"train_loss": -9.628591537475586, "global_step": 98485, "epoch": 586} {"train_loss": -9.786932945251465, "global_step": 98486, "epoch": 586} {"train_loss": -9.244359970092773, "global_step": 98487, "epoch": 586} {"train_loss": -9.677712440490723, "global_step": 98488, "epoch": 586} {"train_loss": -9.513463973999023, "global_step": 98489, "epoch": 586} {"train_loss": -9.454643249511719, "global_step": 98490, "epoch": 586} {"train_loss": -9.599605560302734, "global_step": 98491, "epoch": 586} {"train_loss": -9.143877983093262, "global_step": 98492, "epoch": 586} {"train_loss": -9.463767051696777, "global_step": 98493, "epoch": 586} {"train_loss": -9.48212718963623, "global_step": 98494, "epoch": 586} {"train_loss": -9.482072830200195, "global_step": 98495, "epoch": 586} {"train_loss": -9.560001373291016, "global_step": 98496, "epoch": 586} {"train_loss": -9.607629776000977, "global_step": 98497, "epoch": 586} {"train_loss": -9.34560489654541, "global_step": 98498, "epoch": 586} {"train_loss": -9.718862533569336, "global_step": 98499, "epoch": 586} {"train_loss": -9.71249771118164, "global_step": 98500, "epoch": 586} {"train_loss": -9.61290168762207, "global_step": 98501, "epoch": 586} {"train_loss": -9.458948135375977, "global_step": 98502, "epoch": 586} {"train_loss": -9.743488311767578, "global_step": 98503, "epoch": 586} {"train_loss": -9.759356498718262, "global_step": 98504, "epoch": 586} {"train_loss": -9.660402297973633, "global_step": 98505, "epoch": 586} {"train_loss": -9.571316719055176, "global_step": 98506, "epoch": 586} {"train_loss": -9.547361373901367, "global_step": 98507, "epoch": 586} {"train_loss": -9.807380676269531, "global_step": 98508, "epoch": 586} {"train_loss": -9.717690467834473, "global_step": 98509, "epoch": 586} {"train_loss": -9.692736625671387, "global_step": 98510, "epoch": 586} {"train_loss": -9.640464782714844, "global_step": 98511, "epoch": 586} {"train_loss": -9.750433921813965, "global_step": 98512, "epoch": 586} {"train_loss": -9.800097465515137, "global_step": 98513, "epoch": 586} {"train_loss": -9.761343002319336, "global_step": 98514, "epoch": 586} {"train_loss": -9.619848251342773, "global_step": 98515, "epoch": 586} {"train_loss": -9.856487274169922, "global_step": 98516, "epoch": 586} {"train_loss": -9.830461502075195, "global_step": 98517, "epoch": 586} {"train_loss": -9.84765625, "global_step": 98518, "epoch": 586} {"train_loss": -9.621557235717773, "global_step": 98519, "epoch": 586} {"train_loss": -9.880918502807617, "global_step": 98520, "epoch": 586} {"train_loss": -9.813294410705566, "global_step": 98521, "epoch": 586} {"train_loss": -9.672015190124512, "global_step": 98522, "epoch": 586} {"train_loss": -9.765201568603516, "global_step": 98523, "epoch": 586} {"train_loss": -9.469804763793945, "global_step": 98524, "epoch": 586} {"train_loss": -9.177436828613281, "global_step": 98525, "epoch": 586} {"train_loss": -9.6900634765625, "global_step": 98526, "epoch": 586} {"train_loss": -9.56389045715332, "global_step": 98527, "epoch": 586} {"train_loss": -9.4317626953125, "global_step": 98528, "epoch": 586} {"train_loss": -9.693890571594238, "global_step": 98529, "epoch": 586} {"train_loss": -9.667404174804688, "global_step": 98530, "epoch": 586} {"train_loss": -9.451805114746094, "global_step": 98531, "epoch": 586} {"train_loss": -9.831781387329102, "global_step": 98532, "epoch": 586} {"train_loss": -9.54877758026123, "global_step": 98533, "epoch": 586} {"train_loss": -9.527863502502441, "global_step": 98534, "epoch": 586} {"train_loss": -9.732566833496094, "global_step": 98535, "epoch": 586} {"train_loss": -9.288422584533691, "global_step": 98536, "epoch": 586} {"train_loss": -9.847599983215332, "global_step": 98537, "epoch": 586} {"train_loss": -9.343671798706055, "global_step": 98538, "epoch": 586} {"train_loss": -9.638090133666992, "global_step": 98539, "epoch": 586} {"train_loss": -9.621648788452148, "global_step": 98540, "epoch": 586} {"train_loss": -9.643150329589844, "global_step": 98541, "epoch": 586} {"train_loss": -9.789179801940918, "global_step": 98542, "epoch": 586} {"train_loss": -9.281543731689453, "global_step": 98543, "epoch": 586} {"train_loss": -9.677433967590332, "global_step": 98544, "epoch": 586} {"train_loss": -9.431209564208984, "global_step": 98545, "epoch": 586} {"train_loss": -9.635052680969238, "global_step": 98546, "epoch": 586} {"train_loss": -9.264653205871582, "global_step": 98547, "epoch": 586} {"train_loss": -9.798440933227539, "global_step": 98548, "epoch": 586} {"train_loss": -9.3781156539917, "global_step": 98549, "epoch": 586} {"train_loss": -9.601696014404297, "global_step": 98550, "epoch": 586} {"train_loss": -9.67132568359375, "global_step": 98551, "epoch": 586} {"train_loss": -9.684873580932617, "global_step": 98552, "epoch": 586} {"train_loss": -9.636763572692871, "global_step": 98553, "epoch": 586} {"train_loss": -9.880069732666016, "global_step": 98554, "epoch": 586} {"train_loss": -9.833966255187988, "global_step": 98555, "epoch": 586} {"train_loss": -9.8511962890625, "global_step": 98556, "epoch": 586} {"train_loss": -9.73105239868164, "global_step": 98557, "epoch": 586} {"train_loss": -9.580013275146484, "global_step": 98558, "epoch": 586} {"train_loss": -9.922861099243164, "global_step": 98559, "epoch": 586} {"train_loss": -9.821968078613281, "global_step": 98560, "epoch": 586} {"train_loss": -9.77507209777832, "global_step": 98561, "epoch": 586} {"train_loss": -9.649197578430176, "global_step": 98562, "epoch": 586} {"train_loss": -9.635847091674805, "global_step": 98563, "epoch": 586} {"train_loss": -9.800783157348633, "global_step": 98564, "epoch": 586} {"train_loss": -9.910125732421875, "global_step": 98565, "epoch": 586} {"train_loss": -9.699259757995605, "global_step": 98566, "epoch": 586} {"train_loss": -9.807106018066406, "global_step": 98567, "epoch": 586} {"train_loss": -9.523122787475586, "global_step": 98568, "epoch": 586} {"train_loss": -9.903542518615723, "global_step": 98569, "epoch": 586} {"train_loss": -9.90432071685791, "global_step": 98570, "epoch": 586} {"train_loss": -9.448594093322754, "global_step": 98571, "epoch": 586} {"train_loss": -9.643562316894531, "global_step": 98572, "epoch": 586} {"train_loss": -9.481805801391602, "global_step": 98573, "epoch": 586} {"train_loss": -9.211896896362305, "global_step": 98574, "epoch": 586} {"train_loss": -9.571235656738281, "global_step": 98575, "epoch": 586} {"train_loss": -9.483057975769043, "global_step": 98576, "epoch": 586} {"train_loss": -9.000778198242188, "global_step": 98577, "epoch": 586} {"train_loss": -9.474822998046875, "global_step": 98578, "epoch": 586} {"train_loss": -9.157527923583984, "global_step": 98579, "epoch": 586} {"train_loss": -9.203393936157227, "global_step": 98580, "epoch": 586} {"train_loss": -9.77189826965332, "global_step": 98581, "epoch": 586} {"train_loss": -9.057857513427734, "global_step": 98582, "epoch": 586} {"train_loss": -9.658931732177734, "global_step": 98583, "epoch": 586} {"train_loss": -9.260040283203125, "global_step": 98584, "epoch": 586} {"train_loss": -9.559491157531738, "global_step": 98585, "epoch": 586} {"train_loss": -9.281293869018555, "global_step": 98586, "epoch": 586} {"train_loss": -9.794307708740234, "global_step": 98587, "epoch": 586} {"train_loss": -9.33991527557373, "global_step": 98588, "epoch": 586} {"train_loss": -9.394936561584473, "global_step": 98589, "epoch": 586} {"train_loss": -9.623496055603027, "global_step": 98590, "epoch": 586} {"train_loss": -9.250909805297852, "global_step": 98591, "epoch": 586} {"train_loss": -9.578675270080566, "global_step": 98592, "epoch": 586} {"train_loss": -9.658705711364746, "global_step": 98593, "epoch": 586} {"train_loss": -9.491085052490234, "global_step": 98594, "epoch": 586} {"train_loss": -9.431615829467773, "global_step": 98595, "epoch": 586} {"train_loss": -9.410429954528809, "global_step": 98596, "epoch": 586} {"train_loss": -9.580114364624023, "global_step": 98597, "epoch": 586} {"train_loss": -9.309713363647461, "global_step": 98598, "epoch": 586} {"train_loss": -9.62500286102295, "global_step": 98599, "epoch": 586} {"train_loss": -9.640573501586914, "global_step": 98600, "epoch": 586} {"train_loss": -9.667732238769531, "global_step": 98601, "epoch": 586} {"train_loss": -9.584149360656738, "global_step": 98602, "epoch": 586} {"train_loss": -9.73366928100586, "global_step": 98603, "epoch": 586} {"train_loss": -9.679450035095215, "global_step": 98604, "epoch": 586} {"train_loss": -9.782161712646484, "global_step": 98605, "epoch": 586} {"train_loss": -9.659439086914062, "global_step": 98606, "epoch": 586} {"train_loss": -9.950765609741211, "global_step": 98607, "epoch": 586} {"train_loss": -9.66673469543457, "global_step": 98608, "epoch": 586} {"train_loss": -9.732234954833984, "global_step": 98609, "epoch": 586} {"train_loss": -9.7503023147583, "global_step": 98610, "epoch": 586} {"train_loss": -9.830377578735352, "global_step": 98611, "epoch": 586} {"train_loss": -9.596303939819336, "global_step": 98612, "epoch": 586} {"train_loss": -9.788305282592773, "global_step": 98613, "epoch": 586} {"train_loss": -9.646450996398926, "global_step": 98614, "epoch": 586} {"train_loss": -9.622046402522496, "global_step": 98615, "epoch": 586, "val_loss": 208729.40625} {"train_loss": -9.449874877929688, "global_step": 98616, "epoch": 587} {"train_loss": -9.716156959533691, "global_step": 98617, "epoch": 587} {"train_loss": -9.75606918334961, "global_step": 98618, "epoch": 587} {"train_loss": -9.818902969360352, "global_step": 98619, "epoch": 587} {"train_loss": -9.578149795532227, "global_step": 98620, "epoch": 587} {"train_loss": -9.838465690612793, "global_step": 98621, "epoch": 587} {"train_loss": -9.719558715820312, "global_step": 98622, "epoch": 587} {"train_loss": -9.994653701782227, "global_step": 98623, "epoch": 587} {"train_loss": -9.777639389038086, "global_step": 98624, "epoch": 587} {"train_loss": -9.845317840576172, "global_step": 98625, "epoch": 587} {"train_loss": -9.910531044006348, "global_step": 98626, "epoch": 587} {"train_loss": -9.707929611206055, "global_step": 98627, "epoch": 587} {"train_loss": -9.935523986816406, "global_step": 98628, "epoch": 587} {"train_loss": -9.779562950134277, "global_step": 98629, "epoch": 587} {"train_loss": -9.617977142333984, "global_step": 98630, "epoch": 587} {"train_loss": -9.4949951171875, "global_step": 98631, "epoch": 587} {"train_loss": -9.514965057373047, "global_step": 98632, "epoch": 587} {"train_loss": -9.75654125213623, "global_step": 98633, "epoch": 587} {"train_loss": -9.82410717010498, "global_step": 98634, "epoch": 587} {"train_loss": -9.615488052368164, "global_step": 98635, "epoch": 587} {"train_loss": -9.623062133789062, "global_step": 98636, "epoch": 587} {"train_loss": -9.63659381866455, "global_step": 98637, "epoch": 587} {"train_loss": -9.655638694763184, "global_step": 98638, "epoch": 587} {"train_loss": -9.577170372009277, "global_step": 98639, "epoch": 587} {"train_loss": -9.458699226379395, "global_step": 98640, "epoch": 587} {"train_loss": -9.592597961425781, "global_step": 98641, "epoch": 587} {"train_loss": -9.622299194335938, "global_step": 98642, "epoch": 587} {"train_loss": -9.810806274414062, "global_step": 98643, "epoch": 587} {"train_loss": -9.552717208862305, "global_step": 98644, "epoch": 587} {"train_loss": -9.840998649597168, "global_step": 98645, "epoch": 587} {"train_loss": -9.74787425994873, "global_step": 98646, "epoch": 587} {"train_loss": -9.66433334350586, "global_step": 98647, "epoch": 587} {"train_loss": -9.612266540527344, "global_step": 98648, "epoch": 587} {"train_loss": -9.491218566894531, "global_step": 98649, "epoch": 587} {"train_loss": -9.441707611083984, "global_step": 98650, "epoch": 587} {"train_loss": -9.28141975402832, "global_step": 98651, "epoch": 587} {"train_loss": -9.509116172790527, "global_step": 98652, "epoch": 587} {"train_loss": -9.515928268432617, "global_step": 98653, "epoch": 587} {"train_loss": -9.753145217895508, "global_step": 98654, "epoch": 587} {"train_loss": -9.722723007202148, "global_step": 98655, "epoch": 587} {"train_loss": -9.925488471984863, "global_step": 98656, "epoch": 587} {"train_loss": -9.634088516235352, "global_step": 98657, "epoch": 587} {"train_loss": -9.285030364990234, "global_step": 98658, "epoch": 587} {"train_loss": -9.569286346435547, "global_step": 98659, "epoch": 587} {"train_loss": -9.753589630126953, "global_step": 98660, "epoch": 587} {"train_loss": -9.49864387512207, "global_step": 98661, "epoch": 587} {"train_loss": -9.758698463439941, "global_step": 98662, "epoch": 587} {"train_loss": -9.755022048950195, "global_step": 98663, "epoch": 587} {"train_loss": -9.47659969329834, "global_step": 98664, "epoch": 587} {"train_loss": -9.196321487426758, "global_step": 98665, "epoch": 587} {"train_loss": -9.723114013671875, "global_step": 98666, "epoch": 587} {"train_loss": -9.83719539642334, "global_step": 98667, "epoch": 587} {"train_loss": -9.432714462280273, "global_step": 98668, "epoch": 587} {"train_loss": -9.651232719421387, "global_step": 98669, "epoch": 587} {"train_loss": -9.013019561767578, "global_step": 98670, "epoch": 587} {"train_loss": -9.447397232055664, "global_step": 98671, "epoch": 587} {"train_loss": -9.554036140441895, "global_step": 98672, "epoch": 587} {"train_loss": -9.392875671386719, "global_step": 98673, "epoch": 587} {"train_loss": -9.6307373046875, "global_step": 98674, "epoch": 587} {"train_loss": -9.84428882598877, "global_step": 98675, "epoch": 587} {"train_loss": -9.653919219970703, "global_step": 98676, "epoch": 587} {"train_loss": -9.551149368286133, "global_step": 98677, "epoch": 587} {"train_loss": -9.815451622009277, "global_step": 98678, "epoch": 587} {"train_loss": -9.581876754760742, "global_step": 98679, "epoch": 587} {"train_loss": -9.69168472290039, "global_step": 98680, "epoch": 587} {"train_loss": -9.702371597290039, "global_step": 98681, "epoch": 587} {"train_loss": -9.656394004821777, "global_step": 98682, "epoch": 587} {"train_loss": -9.635870933532715, "global_step": 98683, "epoch": 587} {"train_loss": -9.612183570861816, "global_step": 98684, "epoch": 587} {"train_loss": -9.64826488494873, "global_step": 98685, "epoch": 587} {"train_loss": -9.558122634887695, "global_step": 98686, "epoch": 587} {"train_loss": -9.47258472442627, "global_step": 98687, "epoch": 587} {"train_loss": -9.86572551727295, "global_step": 98688, "epoch": 587} {"train_loss": -9.395933151245117, "global_step": 98689, "epoch": 587} {"train_loss": -9.822805404663086, "global_step": 98690, "epoch": 587} {"train_loss": -9.708778381347656, "global_step": 98691, "epoch": 587} {"train_loss": -9.803146362304688, "global_step": 98692, "epoch": 587} {"train_loss": -10.099206924438477, "global_step": 98693, "epoch": 587} {"train_loss": -9.539390563964844, "global_step": 98694, "epoch": 587} {"train_loss": -9.908609390258789, "global_step": 98695, "epoch": 587} {"train_loss": -9.869543075561523, "global_step": 98696, "epoch": 587} {"train_loss": -9.938918113708496, "global_step": 98697, "epoch": 587} {"train_loss": -9.864400863647461, "global_step": 98698, "epoch": 587} {"train_loss": -9.82965087890625, "global_step": 98699, "epoch": 587} {"train_loss": -9.798782348632812, "global_step": 98700, "epoch": 587} {"train_loss": -9.934835433959961, "global_step": 98701, "epoch": 587} {"train_loss": -9.456720352172852, "global_step": 98702, "epoch": 587} {"train_loss": -9.965677261352539, "global_step": 98703, "epoch": 587} {"train_loss": -9.628966331481934, "global_step": 98704, "epoch": 587} {"train_loss": -9.92192268371582, "global_step": 98705, "epoch": 587} {"train_loss": -9.920516014099121, "global_step": 98706, "epoch": 587} {"train_loss": -10.115650177001953, "global_step": 98707, "epoch": 587} {"train_loss": -10.024784088134766, "global_step": 98708, "epoch": 587} {"train_loss": -9.599586486816406, "global_step": 98709, "epoch": 587} {"train_loss": -9.758016586303711, "global_step": 98710, "epoch": 587} {"train_loss": -9.593999862670898, "global_step": 98711, "epoch": 587} {"train_loss": -9.886470794677734, "global_step": 98712, "epoch": 587} {"train_loss": -9.651777267456055, "global_step": 98713, "epoch": 587} {"train_loss": -9.61863899230957, "global_step": 98714, "epoch": 587} {"train_loss": -10.074056625366211, "global_step": 98715, "epoch": 587} {"train_loss": -9.596643447875977, "global_step": 98716, "epoch": 587} {"train_loss": -9.905990600585938, "global_step": 98717, "epoch": 587} {"train_loss": -9.931619644165039, "global_step": 98718, "epoch": 587} {"train_loss": -9.267119407653809, "global_step": 98719, "epoch": 587} {"train_loss": -9.461841583251953, "global_step": 98720, "epoch": 587} {"train_loss": -9.922148704528809, "global_step": 98721, "epoch": 587} {"train_loss": -9.561023712158203, "global_step": 98722, "epoch": 587} {"train_loss": -9.420119285583496, "global_step": 98723, "epoch": 587} {"train_loss": -9.26655387878418, "global_step": 98724, "epoch": 587} {"train_loss": -9.141318321228027, "global_step": 98725, "epoch": 587} {"train_loss": -8.745835304260254, "global_step": 98726, "epoch": 587} {"train_loss": -8.504206657409668, "global_step": 98727, "epoch": 587} {"train_loss": -8.781500816345215, "global_step": 98728, "epoch": 587} {"train_loss": -8.761510848999023, "global_step": 98729, "epoch": 587} {"train_loss": -8.374249458312988, "global_step": 98730, "epoch": 587} {"train_loss": -9.013816833496094, "global_step": 98731, "epoch": 587} {"train_loss": -8.98025894165039, "global_step": 98732, "epoch": 587} {"train_loss": -8.464624404907227, "global_step": 98733, "epoch": 587} {"train_loss": -8.871347427368164, "global_step": 98734, "epoch": 587} {"train_loss": -8.990654945373535, "global_step": 98735, "epoch": 587} {"train_loss": -9.131255149841309, "global_step": 98736, "epoch": 587} {"train_loss": -8.827383041381836, "global_step": 98737, "epoch": 587} {"train_loss": -9.139654159545898, "global_step": 98738, "epoch": 587} {"train_loss": -9.41148567199707, "global_step": 98739, "epoch": 587} {"train_loss": -8.932945251464844, "global_step": 98740, "epoch": 587} {"train_loss": -9.131637573242188, "global_step": 98741, "epoch": 587} {"train_loss": -9.189001083374023, "global_step": 98742, "epoch": 587} {"train_loss": -9.017095565795898, "global_step": 98743, "epoch": 587} {"train_loss": -9.344087600708008, "global_step": 98744, "epoch": 587} {"train_loss": -9.243146896362305, "global_step": 98745, "epoch": 587} {"train_loss": -9.013826370239258, "global_step": 98746, "epoch": 587} {"train_loss": -8.983600616455078, "global_step": 98747, "epoch": 587} {"train_loss": -9.204778671264648, "global_step": 98748, "epoch": 587} {"train_loss": -9.067688941955566, "global_step": 98749, "epoch": 587} {"train_loss": -9.243785858154297, "global_step": 98750, "epoch": 587} {"train_loss": -9.208724975585938, "global_step": 98751, "epoch": 587} {"train_loss": -9.459365844726562, "global_step": 98752, "epoch": 587} {"train_loss": -9.484537124633789, "global_step": 98753, "epoch": 587} {"train_loss": -9.417247772216797, "global_step": 98754, "epoch": 587} {"train_loss": -9.265771865844727, "global_step": 98755, "epoch": 587} {"train_loss": -9.486835479736328, "global_step": 98756, "epoch": 587} {"train_loss": -9.512264251708984, "global_step": 98757, "epoch": 587} {"train_loss": -9.47722053527832, "global_step": 98758, "epoch": 587} {"train_loss": -9.501712799072266, "global_step": 98759, "epoch": 587} {"train_loss": -9.927677154541016, "global_step": 98760, "epoch": 587} {"train_loss": -9.538678169250488, "global_step": 98761, "epoch": 587} {"train_loss": -9.563802719116211, "global_step": 98762, "epoch": 587} {"train_loss": -9.581859588623047, "global_step": 98763, "epoch": 587} {"train_loss": -9.5924072265625, "global_step": 98764, "epoch": 587} {"train_loss": -9.576741218566895, "global_step": 98765, "epoch": 587} {"train_loss": -9.618614196777344, "global_step": 98766, "epoch": 587} {"train_loss": -9.605283737182617, "global_step": 98767, "epoch": 587} {"train_loss": -9.841007232666016, "global_step": 98768, "epoch": 587} {"train_loss": -9.48961067199707, "global_step": 98769, "epoch": 587} {"train_loss": -9.69455337524414, "global_step": 98770, "epoch": 587} {"train_loss": -9.616777420043945, "global_step": 98771, "epoch": 587} {"train_loss": -10.03939437866211, "global_step": 98772, "epoch": 587} {"train_loss": -9.956184387207031, "global_step": 98773, "epoch": 587} {"train_loss": -9.43563461303711, "global_step": 98774, "epoch": 587} {"train_loss": -9.85912036895752, "global_step": 98775, "epoch": 587} {"train_loss": -9.835700988769531, "global_step": 98776, "epoch": 587} {"train_loss": -9.530725479125977, "global_step": 98777, "epoch": 587} {"train_loss": -9.475780487060547, "global_step": 98778, "epoch": 587} {"train_loss": -9.601411819458008, "global_step": 98779, "epoch": 587} {"train_loss": -9.384306907653809, "global_step": 98780, "epoch": 587} {"train_loss": -9.790993690490723, "global_step": 98781, "epoch": 587} {"train_loss": -9.483765602111816, "global_step": 98782, "epoch": 587} {"train_loss": -9.549016015870231, "global_step": 98783, "epoch": 587, "val_loss": 207786.96875} {"train_loss": -9.573332786560059, "global_step": 98784, "epoch": 588} {"train_loss": -8.567774772644043, "global_step": 98785, "epoch": 588} {"train_loss": -9.518078804016113, "global_step": 98786, "epoch": 588} {"train_loss": -8.953412055969238, "global_step": 98787, "epoch": 588} {"train_loss": -8.843732833862305, "global_step": 98788, "epoch": 588} {"train_loss": -9.360109329223633, "global_step": 98789, "epoch": 588} {"train_loss": -9.56185531616211, "global_step": 98790, "epoch": 588} {"train_loss": -8.941057205200195, "global_step": 98791, "epoch": 588} {"train_loss": -9.128335952758789, "global_step": 98792, "epoch": 588} {"train_loss": -9.280624389648438, "global_step": 98793, "epoch": 588} {"train_loss": -9.067232131958008, "global_step": 98794, "epoch": 588} {"train_loss": -9.43044376373291, "global_step": 98795, "epoch": 588} {"train_loss": -8.92112922668457, "global_step": 98796, "epoch": 588} {"train_loss": -9.653229713439941, "global_step": 98797, "epoch": 588} {"train_loss": -8.993898391723633, "global_step": 98798, "epoch": 588} {"train_loss": -9.126774787902832, "global_step": 98799, "epoch": 588} {"train_loss": -9.337321281433105, "global_step": 98800, "epoch": 588} {"train_loss": -9.259136199951172, "global_step": 98801, "epoch": 588} {"train_loss": -9.534929275512695, "global_step": 98802, "epoch": 588} {"train_loss": -9.463407516479492, "global_step": 98803, "epoch": 588} {"train_loss": -9.538183212280273, "global_step": 98804, "epoch": 588} {"train_loss": -9.331984519958496, "global_step": 98805, "epoch": 588} {"train_loss": -9.5299654006958, "global_step": 98806, "epoch": 588} {"train_loss": -9.60616397857666, "global_step": 98807, "epoch": 588} {"train_loss": -9.368656158447266, "global_step": 98808, "epoch": 588} {"train_loss": -9.766526222229004, "global_step": 98809, "epoch": 588} {"train_loss": -9.411886215209961, "global_step": 98810, "epoch": 588} {"train_loss": -9.661362648010254, "global_step": 98811, "epoch": 588} {"train_loss": -9.658604621887207, "global_step": 98812, "epoch": 588} {"train_loss": -9.55079460144043, "global_step": 98813, "epoch": 588} {"train_loss": -9.536382675170898, "global_step": 98814, "epoch": 588} {"train_loss": -9.755732536315918, "global_step": 98815, "epoch": 588} {"train_loss": -9.646406173706055, "global_step": 98816, "epoch": 588} {"train_loss": -9.515738487243652, "global_step": 98817, "epoch": 588} {"train_loss": -9.814010620117188, "global_step": 98818, "epoch": 588} {"train_loss": -9.791487693786621, "global_step": 98819, "epoch": 588} {"train_loss": -9.828388214111328, "global_step": 98820, "epoch": 588} {"train_loss": -9.766490936279297, "global_step": 98821, "epoch": 588} {"train_loss": -9.829795837402344, "global_step": 98822, "epoch": 588} {"train_loss": -9.819825172424316, "global_step": 98823, "epoch": 588} {"train_loss": -9.949649810791016, "global_step": 98824, "epoch": 588} {"train_loss": -9.731322288513184, "global_step": 98825, "epoch": 588} {"train_loss": -9.679056167602539, "global_step": 98826, "epoch": 588} {"train_loss": -9.906007766723633, "global_step": 98827, "epoch": 588} {"train_loss": -9.556381225585938, "global_step": 98828, "epoch": 588} {"train_loss": -9.850486755371094, "global_step": 98829, "epoch": 588} {"train_loss": -9.813599586486816, "global_step": 98830, "epoch": 588} {"train_loss": -9.865859985351562, "global_step": 98831, "epoch": 588} {"train_loss": -9.827919006347656, "global_step": 98832, "epoch": 588} {"train_loss": -9.717329025268555, "global_step": 98833, "epoch": 588} {"train_loss": -9.603508949279785, "global_step": 98834, "epoch": 588} {"train_loss": -9.683391571044922, "global_step": 98835, "epoch": 588} {"train_loss": -9.692720413208008, "global_step": 98836, "epoch": 588} {"train_loss": -9.525186538696289, "global_step": 98837, "epoch": 588} {"train_loss": -9.929957389831543, "global_step": 98838, "epoch": 588} {"train_loss": -9.697742462158203, "global_step": 98839, "epoch": 588} {"train_loss": -9.98601245880127, "global_step": 98840, "epoch": 588} {"train_loss": -9.391952514648438, "global_step": 98841, "epoch": 588} {"train_loss": -9.742692947387695, "global_step": 98842, "epoch": 588} {"train_loss": -9.67419147491455, "global_step": 98843, "epoch": 588} {"train_loss": -9.865493774414062, "global_step": 98844, "epoch": 588} {"train_loss": -9.630043029785156, "global_step": 98845, "epoch": 588} {"train_loss": -9.814233779907227, "global_step": 98846, "epoch": 588} {"train_loss": -9.7750244140625, "global_step": 98847, "epoch": 588} {"train_loss": -9.770257949829102, "global_step": 98848, "epoch": 588} {"train_loss": -9.664215087890625, "global_step": 98849, "epoch": 588} {"train_loss": -9.755983352661133, "global_step": 98850, "epoch": 588} {"train_loss": -9.295774459838867, "global_step": 98851, "epoch": 588} {"train_loss": -9.443471908569336, "global_step": 98852, "epoch": 588} {"train_loss": -9.729320526123047, "global_step": 98853, "epoch": 588} {"train_loss": -9.477325439453125, "global_step": 98854, "epoch": 588} {"train_loss": -9.571624755859375, "global_step": 98855, "epoch": 588} {"train_loss": -9.499444961547852, "global_step": 98856, "epoch": 588} {"train_loss": -9.604619026184082, "global_step": 98857, "epoch": 588} {"train_loss": -9.733720779418945, "global_step": 98858, "epoch": 588} {"train_loss": -9.4564790725708, "global_step": 98859, "epoch": 588} {"train_loss": -9.848859786987305, "global_step": 98860, "epoch": 588} {"train_loss": -9.546073913574219, "global_step": 98861, "epoch": 588} {"train_loss": -9.684846878051758, "global_step": 98862, "epoch": 588} {"train_loss": -9.450763702392578, "global_step": 98863, "epoch": 588} {"train_loss": -9.571733474731445, "global_step": 98864, "epoch": 588} {"train_loss": -9.69516372680664, "global_step": 98865, "epoch": 588} {"train_loss": -9.73939323425293, "global_step": 98866, "epoch": 588} {"train_loss": -9.794940948486328, "global_step": 98867, "epoch": 588} {"train_loss": -9.790096282958984, "global_step": 98868, "epoch": 588} {"train_loss": -9.868419647216797, "global_step": 98869, "epoch": 588} {"train_loss": -9.789117813110352, "global_step": 98870, "epoch": 588} {"train_loss": -9.741948127746582, "global_step": 98871, "epoch": 588} {"train_loss": -9.836124420166016, "global_step": 98872, "epoch": 588} {"train_loss": -9.849259376525879, "global_step": 98873, "epoch": 588} {"train_loss": -9.693309783935547, "global_step": 98874, "epoch": 588} {"train_loss": -9.874032974243164, "global_step": 98875, "epoch": 588} {"train_loss": -9.731948852539062, "global_step": 98876, "epoch": 588} {"train_loss": -9.68631362915039, "global_step": 98877, "epoch": 588} {"train_loss": -9.577390670776367, "global_step": 98878, "epoch": 588} {"train_loss": -9.78544807434082, "global_step": 98879, "epoch": 588} {"train_loss": -9.58502197265625, "global_step": 98880, "epoch": 588} {"train_loss": -9.259745597839355, "global_step": 98881, "epoch": 588} {"train_loss": -9.5594482421875, "global_step": 98882, "epoch": 588} {"train_loss": -9.585742950439453, "global_step": 98883, "epoch": 588} {"train_loss": -9.949159622192383, "global_step": 98884, "epoch": 588} {"train_loss": -9.686832427978516, "global_step": 98885, "epoch": 588} {"train_loss": -9.698894500732422, "global_step": 98886, "epoch": 588} {"train_loss": -9.443815231323242, "global_step": 98887, "epoch": 588} {"train_loss": -9.934530258178711, "global_step": 98888, "epoch": 588} {"train_loss": -9.744840621948242, "global_step": 98889, "epoch": 588} {"train_loss": -9.726788520812988, "global_step": 98890, "epoch": 588} {"train_loss": -9.641105651855469, "global_step": 98891, "epoch": 588} {"train_loss": -9.779348373413086, "global_step": 98892, "epoch": 588} {"train_loss": -9.87946891784668, "global_step": 98893, "epoch": 588} {"train_loss": -10.00338363647461, "global_step": 98894, "epoch": 588} {"train_loss": -9.63604736328125, "global_step": 98895, "epoch": 588} {"train_loss": -10.010176658630371, "global_step": 98896, "epoch": 588} {"train_loss": -9.520954132080078, "global_step": 98897, "epoch": 588} {"train_loss": -9.453289031982422, "global_step": 98898, "epoch": 588} {"train_loss": -9.911608695983887, "global_step": 98899, "epoch": 588} {"train_loss": -9.394515991210938, "global_step": 98900, "epoch": 588} {"train_loss": -9.481796264648438, "global_step": 98901, "epoch": 588} {"train_loss": -9.76119327545166, "global_step": 98902, "epoch": 588} {"train_loss": -9.515188217163086, "global_step": 98903, "epoch": 588} {"train_loss": -9.219435691833496, "global_step": 98904, "epoch": 588} {"train_loss": -9.400737762451172, "global_step": 98905, "epoch": 588} {"train_loss": -9.461567878723145, "global_step": 98906, "epoch": 588} {"train_loss": -9.638898849487305, "global_step": 98907, "epoch": 588} {"train_loss": -9.613029479980469, "global_step": 98908, "epoch": 588} {"train_loss": -9.631223678588867, "global_step": 98909, "epoch": 588} {"train_loss": -9.493741989135742, "global_step": 98910, "epoch": 588} {"train_loss": -9.531356811523438, "global_step": 98911, "epoch": 588} {"train_loss": -9.6037015914917, "global_step": 98912, "epoch": 588} {"train_loss": -9.726577758789062, "global_step": 98913, "epoch": 588} {"train_loss": -9.817115783691406, "global_step": 98914, "epoch": 588} {"train_loss": -9.423356056213379, "global_step": 98915, "epoch": 588} {"train_loss": -9.739824295043945, "global_step": 98916, "epoch": 588} {"train_loss": -9.640737533569336, "global_step": 98917, "epoch": 588} {"train_loss": -9.650228500366211, "global_step": 98918, "epoch": 588} {"train_loss": -9.757610321044922, "global_step": 98919, "epoch": 588} {"train_loss": -9.673445701599121, "global_step": 98920, "epoch": 588} {"train_loss": -9.693902969360352, "global_step": 98921, "epoch": 588} {"train_loss": -9.437978744506836, "global_step": 98922, "epoch": 588} {"train_loss": -9.086888313293457, "global_step": 98923, "epoch": 588} {"train_loss": -9.362298965454102, "global_step": 98924, "epoch": 588} {"train_loss": -9.104581832885742, "global_step": 98925, "epoch": 588} {"train_loss": -9.387258529663086, "global_step": 98926, "epoch": 588} {"train_loss": -9.208978652954102, "global_step": 98927, "epoch": 588} {"train_loss": -9.63988208770752, "global_step": 98928, "epoch": 588} {"train_loss": -9.465457916259766, "global_step": 98929, "epoch": 588} {"train_loss": -9.84382438659668, "global_step": 98930, "epoch": 588} {"train_loss": -9.401786804199219, "global_step": 98931, "epoch": 588} {"train_loss": -9.578184127807617, "global_step": 98932, "epoch": 588} {"train_loss": -9.705989837646484, "global_step": 98933, "epoch": 588} {"train_loss": -9.516592025756836, "global_step": 98934, "epoch": 588} {"train_loss": -9.723211288452148, "global_step": 98935, "epoch": 588} {"train_loss": -9.562811851501465, "global_step": 98936, "epoch": 588} {"train_loss": -9.634637832641602, "global_step": 98937, "epoch": 588} {"train_loss": -9.583314895629883, "global_step": 98938, "epoch": 588} {"train_loss": -9.584417343139648, "global_step": 98939, "epoch": 588} {"train_loss": -9.63923168182373, "global_step": 98940, "epoch": 588} {"train_loss": -9.587759017944336, "global_step": 98941, "epoch": 588} {"train_loss": -9.881338119506836, "global_step": 98942, "epoch": 588} {"train_loss": -9.75204086303711, "global_step": 98943, "epoch": 588} {"train_loss": -9.691547393798828, "global_step": 98944, "epoch": 588} {"train_loss": -9.669851303100586, "global_step": 98945, "epoch": 588} {"train_loss": -9.78221321105957, "global_step": 98946, "epoch": 588} {"train_loss": -9.679829597473145, "global_step": 98947, "epoch": 588} {"train_loss": -9.746849060058594, "global_step": 98948, "epoch": 588} {"train_loss": -9.595151901245117, "global_step": 98949, "epoch": 588} {"train_loss": -9.802178382873535, "global_step": 98950, "epoch": 588} {"train_loss": -9.60267718633016, "global_step": 98951, "epoch": 588, "val_loss": 205124.171875} {"train_loss": -9.526169776916504, "global_step": 98952, "epoch": 589} {"train_loss": -9.404191017150879, "global_step": 98953, "epoch": 589} {"train_loss": -9.685508728027344, "global_step": 98954, "epoch": 589} {"train_loss": -9.649019241333008, "global_step": 98955, "epoch": 589} {"train_loss": -9.766622543334961, "global_step": 98956, "epoch": 589} {"train_loss": -9.891498565673828, "global_step": 98957, "epoch": 589} {"train_loss": -9.929981231689453, "global_step": 98958, "epoch": 589} {"train_loss": -9.62005615234375, "global_step": 98959, "epoch": 589} {"train_loss": -9.885420799255371, "global_step": 98960, "epoch": 589} {"train_loss": -9.800615310668945, "global_step": 98961, "epoch": 589} {"train_loss": -9.778799057006836, "global_step": 98962, "epoch": 589} {"train_loss": -9.91415786743164, "global_step": 98963, "epoch": 589} {"train_loss": -9.993894577026367, "global_step": 98964, "epoch": 589} {"train_loss": -9.820250511169434, "global_step": 98965, "epoch": 589} {"train_loss": -9.819612503051758, "global_step": 98966, "epoch": 589} {"train_loss": -10.159708023071289, "global_step": 98967, "epoch": 589} {"train_loss": -9.647934913635254, "global_step": 98968, "epoch": 589} {"train_loss": -9.83204460144043, "global_step": 98969, "epoch": 589} {"train_loss": -9.792778015136719, "global_step": 98970, "epoch": 589} {"train_loss": -9.879356384277344, "global_step": 98971, "epoch": 589} {"train_loss": -9.89350700378418, "global_step": 98972, "epoch": 589} {"train_loss": -9.984294891357422, "global_step": 98973, "epoch": 589} {"train_loss": -9.74074935913086, "global_step": 98974, "epoch": 589} {"train_loss": -9.886465072631836, "global_step": 98975, "epoch": 589} {"train_loss": -9.755870819091797, "global_step": 98976, "epoch": 589} {"train_loss": -9.881595611572266, "global_step": 98977, "epoch": 589} {"train_loss": -9.90746021270752, "global_step": 98978, "epoch": 589} {"train_loss": -9.487892150878906, "global_step": 98979, "epoch": 589} {"train_loss": -9.801531791687012, "global_step": 98980, "epoch": 589} {"train_loss": -9.737664222717285, "global_step": 98981, "epoch": 589} {"train_loss": -9.708701133728027, "global_step": 98982, "epoch": 589} {"train_loss": -9.44028377532959, "global_step": 98983, "epoch": 589} {"train_loss": -9.777782440185547, "global_step": 98984, "epoch": 589} {"train_loss": -9.792564392089844, "global_step": 98985, "epoch": 589} {"train_loss": -9.80729866027832, "global_step": 98986, "epoch": 589} {"train_loss": -9.797648429870605, "global_step": 98987, "epoch": 589} {"train_loss": -9.599201202392578, "global_step": 98988, "epoch": 589} {"train_loss": -10.045405387878418, "global_step": 98989, "epoch": 589} {"train_loss": -9.506665229797363, "global_step": 98990, "epoch": 589} {"train_loss": -9.794866561889648, "global_step": 98991, "epoch": 589} {"train_loss": -9.636598587036133, "global_step": 98992, "epoch": 589} {"train_loss": -9.908575057983398, "global_step": 98993, "epoch": 589} {"train_loss": -9.531930923461914, "global_step": 98994, "epoch": 589} {"train_loss": -9.825902938842773, "global_step": 98995, "epoch": 589} {"train_loss": -9.748418807983398, "global_step": 98996, "epoch": 589} {"train_loss": -9.685157775878906, "global_step": 98997, "epoch": 589} {"train_loss": -9.545260429382324, "global_step": 98998, "epoch": 589} {"train_loss": -9.740690231323242, "global_step": 98999, "epoch": 589} {"train_loss": -9.742107391357422, "global_step": 99000, "epoch": 589} {"train_loss": -9.563070297241211, "global_step": 99001, "epoch": 589} {"train_loss": -9.529040336608887, "global_step": 99002, "epoch": 589} {"train_loss": -9.756603240966797, "global_step": 99003, "epoch": 589} {"train_loss": -9.386834144592285, "global_step": 99004, "epoch": 589} {"train_loss": -9.609088897705078, "global_step": 99005, "epoch": 589} {"train_loss": -9.655299186706543, "global_step": 99006, "epoch": 589} {"train_loss": -9.49543571472168, "global_step": 99007, "epoch": 589} {"train_loss": -9.691667556762695, "global_step": 99008, "epoch": 589} {"train_loss": -9.429866790771484, "global_step": 99009, "epoch": 589} {"train_loss": -9.476444244384766, "global_step": 99010, "epoch": 589} {"train_loss": -9.526168823242188, "global_step": 99011, "epoch": 589} {"train_loss": -9.53133773803711, "global_step": 99012, "epoch": 589} {"train_loss": -9.519560813903809, "global_step": 99013, "epoch": 589} {"train_loss": -9.672083854675293, "global_step": 99014, "epoch": 589} {"train_loss": -9.703409194946289, "global_step": 99015, "epoch": 589} {"train_loss": -9.634679794311523, "global_step": 99016, "epoch": 589} {"train_loss": -9.392709732055664, "global_step": 99017, "epoch": 589} {"train_loss": -9.698307037353516, "global_step": 99018, "epoch": 589} {"train_loss": -9.26087760925293, "global_step": 99019, "epoch": 589} {"train_loss": -9.648262023925781, "global_step": 99020, "epoch": 589} {"train_loss": -9.566475868225098, "global_step": 99021, "epoch": 589} {"train_loss": -9.74921989440918, "global_step": 99022, "epoch": 589} {"train_loss": -9.704817771911621, "global_step": 99023, "epoch": 589} {"train_loss": -9.783456802368164, "global_step": 99024, "epoch": 589} {"train_loss": -9.474372863769531, "global_step": 99025, "epoch": 589} {"train_loss": -9.570072174072266, "global_step": 99026, "epoch": 589} {"train_loss": -9.30398941040039, "global_step": 99027, "epoch": 589} {"train_loss": -9.557685852050781, "global_step": 99028, "epoch": 589} {"train_loss": -9.338624000549316, "global_step": 99029, "epoch": 589} {"train_loss": -8.888603210449219, "global_step": 99030, "epoch": 589} {"train_loss": -9.44023323059082, "global_step": 99031, "epoch": 589} {"train_loss": -9.357416152954102, "global_step": 99032, "epoch": 589} {"train_loss": -9.120170593261719, "global_step": 99033, "epoch": 589} {"train_loss": -9.534087181091309, "global_step": 99034, "epoch": 589} {"train_loss": -9.230731964111328, "global_step": 99035, "epoch": 589} {"train_loss": -9.644986152648926, "global_step": 99036, "epoch": 589} {"train_loss": -8.8255615234375, "global_step": 99037, "epoch": 589} {"train_loss": -9.512924194335938, "global_step": 99038, "epoch": 589} {"train_loss": -9.35994815826416, "global_step": 99039, "epoch": 589} {"train_loss": -9.582732200622559, "global_step": 99040, "epoch": 589} {"train_loss": -9.461711883544922, "global_step": 99041, "epoch": 589} {"train_loss": -9.255937576293945, "global_step": 99042, "epoch": 589} {"train_loss": -9.56381607055664, "global_step": 99043, "epoch": 589} {"train_loss": -9.77882194519043, "global_step": 99044, "epoch": 589} {"train_loss": -9.456932067871094, "global_step": 99045, "epoch": 589} {"train_loss": -9.595565795898438, "global_step": 99046, "epoch": 589} {"train_loss": -9.594217300415039, "global_step": 99047, "epoch": 589} {"train_loss": -9.392576217651367, "global_step": 99048, "epoch": 589} {"train_loss": -9.550824165344238, "global_step": 99049, "epoch": 589} {"train_loss": -9.808816909790039, "global_step": 99050, "epoch": 589} {"train_loss": -9.69310188293457, "global_step": 99051, "epoch": 589} {"train_loss": -9.68265151977539, "global_step": 99052, "epoch": 589} {"train_loss": -9.611757278442383, "global_step": 99053, "epoch": 589} {"train_loss": -9.743051528930664, "global_step": 99054, "epoch": 589} {"train_loss": -9.689178466796875, "global_step": 99055, "epoch": 589} {"train_loss": -9.957968711853027, "global_step": 99056, "epoch": 589} {"train_loss": -9.668227195739746, "global_step": 99057, "epoch": 589} {"train_loss": -9.758353233337402, "global_step": 99058, "epoch": 589} {"train_loss": -9.845157623291016, "global_step": 99059, "epoch": 589} {"train_loss": -9.896034240722656, "global_step": 99060, "epoch": 589} {"train_loss": -10.001810073852539, "global_step": 99061, "epoch": 589} {"train_loss": -9.884498596191406, "global_step": 99062, "epoch": 589} {"train_loss": -10.036873817443848, "global_step": 99063, "epoch": 589} {"train_loss": -9.937644958496094, "global_step": 99064, "epoch": 589} {"train_loss": -9.795536041259766, "global_step": 99065, "epoch": 589} {"train_loss": -9.949831008911133, "global_step": 99066, "epoch": 589} {"train_loss": -9.840311050415039, "global_step": 99067, "epoch": 589} {"train_loss": -9.597269058227539, "global_step": 99068, "epoch": 589} {"train_loss": -9.782388687133789, "global_step": 99069, "epoch": 589} {"train_loss": -9.565546035766602, "global_step": 99070, "epoch": 589} {"train_loss": -9.820764541625977, "global_step": 99071, "epoch": 589} {"train_loss": -9.627191543579102, "global_step": 99072, "epoch": 589} {"train_loss": -9.604068756103516, "global_step": 99073, "epoch": 589} {"train_loss": -9.944302558898926, "global_step": 99074, "epoch": 589} {"train_loss": -9.611268997192383, "global_step": 99075, "epoch": 589} {"train_loss": -9.652617454528809, "global_step": 99076, "epoch": 589} {"train_loss": -9.796257972717285, "global_step": 99077, "epoch": 589} {"train_loss": -9.328971862792969, "global_step": 99078, "epoch": 589} {"train_loss": -9.739213943481445, "global_step": 99079, "epoch": 589} {"train_loss": -9.431876182556152, "global_step": 99080, "epoch": 589} {"train_loss": -9.648528099060059, "global_step": 99081, "epoch": 589} {"train_loss": -9.729141235351562, "global_step": 99082, "epoch": 589} {"train_loss": -9.681001663208008, "global_step": 99083, "epoch": 589} {"train_loss": -9.711335182189941, "global_step": 99084, "epoch": 589} {"train_loss": -9.50992488861084, "global_step": 99085, "epoch": 589} {"train_loss": -9.620241165161133, "global_step": 99086, "epoch": 589} {"train_loss": -9.243093490600586, "global_step": 99087, "epoch": 589} {"train_loss": -9.885686874389648, "global_step": 99088, "epoch": 589} {"train_loss": -9.651934623718262, "global_step": 99089, "epoch": 589} {"train_loss": -9.839043617248535, "global_step": 99090, "epoch": 589} {"train_loss": -9.677919387817383, "global_step": 99091, "epoch": 589} {"train_loss": -9.845966339111328, "global_step": 99092, "epoch": 589} {"train_loss": -9.579140663146973, "global_step": 99093, "epoch": 589} {"train_loss": -9.830880165100098, "global_step": 99094, "epoch": 589} {"train_loss": -9.518421173095703, "global_step": 99095, "epoch": 589} {"train_loss": -9.539044380187988, "global_step": 99096, "epoch": 589} {"train_loss": -9.827104568481445, "global_step": 99097, "epoch": 589} {"train_loss": -9.718344688415527, "global_step": 99098, "epoch": 589} {"train_loss": -9.61827278137207, "global_step": 99099, "epoch": 589} {"train_loss": -9.802624702453613, "global_step": 99100, "epoch": 589} {"train_loss": -9.630184173583984, "global_step": 99101, "epoch": 589} {"train_loss": -9.832525253295898, "global_step": 99102, "epoch": 589} {"train_loss": -9.786681175231934, "global_step": 99103, "epoch": 589} {"train_loss": -9.432841300964355, "global_step": 99104, "epoch": 589} {"train_loss": -9.564764976501465, "global_step": 99105, "epoch": 589} {"train_loss": -9.724077224731445, "global_step": 99106, "epoch": 589} {"train_loss": -9.852736473083496, "global_step": 99107, "epoch": 589} {"train_loss": -9.603717803955078, "global_step": 99108, "epoch": 589} {"train_loss": -9.857084274291992, "global_step": 99109, "epoch": 589} {"train_loss": -9.620453834533691, "global_step": 99110, "epoch": 589} {"train_loss": -9.482881546020508, "global_step": 99111, "epoch": 589} {"train_loss": -9.750052452087402, "global_step": 99112, "epoch": 589} {"train_loss": -9.783549308776855, "global_step": 99113, "epoch": 589} {"train_loss": -9.902154922485352, "global_step": 99114, "epoch": 589} {"train_loss": -9.81953239440918, "global_step": 99115, "epoch": 589} {"train_loss": -9.642857551574707, "global_step": 99116, "epoch": 589} {"train_loss": -9.811450004577637, "global_step": 99117, "epoch": 589} {"train_loss": -10.058723449707031, "global_step": 99118, "epoch": 589} {"train_loss": -9.668845119930449, "global_step": 99119, "epoch": 589, "val_loss": 207422.546875} {"train_loss": -9.793669700622559, "global_step": 99120, "epoch": 590} {"train_loss": -9.855905532836914, "global_step": 99121, "epoch": 590} {"train_loss": -9.758872985839844, "global_step": 99122, "epoch": 590} {"train_loss": -9.875138282775879, "global_step": 99123, "epoch": 590} {"train_loss": -9.799468040466309, "global_step": 99124, "epoch": 590} {"train_loss": -9.625677108764648, "global_step": 99125, "epoch": 590} {"train_loss": -9.723979949951172, "global_step": 99126, "epoch": 590} {"train_loss": -9.513643264770508, "global_step": 99127, "epoch": 590} {"train_loss": -9.778258323669434, "global_step": 99128, "epoch": 590} {"train_loss": -9.643324851989746, "global_step": 99129, "epoch": 590} {"train_loss": -9.982603073120117, "global_step": 99130, "epoch": 590} {"train_loss": -9.38935375213623, "global_step": 99131, "epoch": 590} {"train_loss": -9.70571517944336, "global_step": 99132, "epoch": 590} {"train_loss": -9.891763687133789, "global_step": 99133, "epoch": 590} {"train_loss": -9.586183547973633, "global_step": 99134, "epoch": 590} {"train_loss": -9.81320571899414, "global_step": 99135, "epoch": 590} {"train_loss": -9.892515182495117, "global_step": 99136, "epoch": 590} {"train_loss": -9.861059188842773, "global_step": 99137, "epoch": 590} {"train_loss": -9.839022636413574, "global_step": 99138, "epoch": 590} {"train_loss": -9.717531204223633, "global_step": 99139, "epoch": 590} {"train_loss": -9.696796417236328, "global_step": 99140, "epoch": 590} {"train_loss": -9.785280227661133, "global_step": 99141, "epoch": 590} {"train_loss": -9.630208969116211, "global_step": 99142, "epoch": 590} {"train_loss": -9.93399429321289, "global_step": 99143, "epoch": 590} {"train_loss": -9.86288070678711, "global_step": 99144, "epoch": 590} {"train_loss": -9.813230514526367, "global_step": 99145, "epoch": 590} {"train_loss": -9.73165512084961, "global_step": 99146, "epoch": 590} {"train_loss": -9.843177795410156, "global_step": 99147, "epoch": 590} {"train_loss": -9.379449844360352, "global_step": 99148, "epoch": 590} {"train_loss": -9.532384872436523, "global_step": 99149, "epoch": 590} {"train_loss": -9.763702392578125, "global_step": 99150, "epoch": 590} {"train_loss": -9.642515182495117, "global_step": 99151, "epoch": 590} {"train_loss": -9.792594909667969, "global_step": 99152, "epoch": 590} {"train_loss": -9.275362968444824, "global_step": 99153, "epoch": 590} {"train_loss": -9.913986206054688, "global_step": 99154, "epoch": 590} {"train_loss": -9.718286514282227, "global_step": 99155, "epoch": 590} {"train_loss": -9.644914627075195, "global_step": 99156, "epoch": 590} {"train_loss": -9.649581909179688, "global_step": 99157, "epoch": 590} {"train_loss": -9.446636199951172, "global_step": 99158, "epoch": 590} {"train_loss": -9.667984008789062, "global_step": 99159, "epoch": 590} {"train_loss": -9.785568237304688, "global_step": 99160, "epoch": 590} {"train_loss": -9.580059051513672, "global_step": 99161, "epoch": 590} {"train_loss": -9.752649307250977, "global_step": 99162, "epoch": 590} {"train_loss": -9.278059959411621, "global_step": 99163, "epoch": 590} {"train_loss": -9.558509826660156, "global_step": 99164, "epoch": 590} {"train_loss": -9.458245277404785, "global_step": 99165, "epoch": 590} {"train_loss": -9.551088333129883, "global_step": 99166, "epoch": 590} {"train_loss": -9.543706893920898, "global_step": 99167, "epoch": 590} {"train_loss": -9.624801635742188, "global_step": 99168, "epoch": 590} {"train_loss": -9.160679817199707, "global_step": 99169, "epoch": 590} {"train_loss": -9.682489395141602, "global_step": 99170, "epoch": 590} {"train_loss": -9.498773574829102, "global_step": 99171, "epoch": 590} {"train_loss": -9.451025009155273, "global_step": 99172, "epoch": 590} {"train_loss": -9.51917552947998, "global_step": 99173, "epoch": 590} {"train_loss": -9.587281227111816, "global_step": 99174, "epoch": 590} {"train_loss": -9.653091430664062, "global_step": 99175, "epoch": 590} {"train_loss": -9.719330787658691, "global_step": 99176, "epoch": 590} {"train_loss": -9.440511703491211, "global_step": 99177, "epoch": 590} {"train_loss": -9.69238567352295, "global_step": 99178, "epoch": 590} {"train_loss": -9.551370620727539, "global_step": 99179, "epoch": 590} {"train_loss": -9.424392700195312, "global_step": 99180, "epoch": 590} {"train_loss": -9.50590991973877, "global_step": 99181, "epoch": 590} {"train_loss": -9.738468170166016, "global_step": 99182, "epoch": 590} {"train_loss": -9.703243255615234, "global_step": 99183, "epoch": 590} {"train_loss": -9.625421524047852, "global_step": 99184, "epoch": 590} {"train_loss": -9.631628036499023, "global_step": 99185, "epoch": 590} {"train_loss": -9.688994407653809, "global_step": 99186, "epoch": 590} {"train_loss": -9.947437286376953, "global_step": 99187, "epoch": 590} {"train_loss": -9.656038284301758, "global_step": 99188, "epoch": 590} {"train_loss": -9.788464546203613, "global_step": 99189, "epoch": 590} {"train_loss": -9.539482116699219, "global_step": 99190, "epoch": 590} {"train_loss": -9.93372631072998, "global_step": 99191, "epoch": 590} {"train_loss": -9.81951904296875, "global_step": 99192, "epoch": 590} {"train_loss": -9.582762718200684, "global_step": 99193, "epoch": 590} {"train_loss": -9.82365894317627, "global_step": 99194, "epoch": 590} {"train_loss": -9.705187797546387, "global_step": 99195, "epoch": 590} {"train_loss": -9.686971664428711, "global_step": 99196, "epoch": 590} {"train_loss": -9.708904266357422, "global_step": 99197, "epoch": 590} {"train_loss": -9.871152877807617, "global_step": 99198, "epoch": 590} {"train_loss": -9.672919273376465, "global_step": 99199, "epoch": 590} {"train_loss": -9.398321151733398, "global_step": 99200, "epoch": 590} {"train_loss": -9.672858238220215, "global_step": 99201, "epoch": 590} {"train_loss": -9.272541046142578, "global_step": 99202, "epoch": 590} {"train_loss": -9.42630386352539, "global_step": 99203, "epoch": 590} {"train_loss": -9.856046676635742, "global_step": 99204, "epoch": 590} {"train_loss": -9.563760757446289, "global_step": 99205, "epoch": 590} {"train_loss": -9.826242446899414, "global_step": 99206, "epoch": 590} {"train_loss": -9.781084060668945, "global_step": 99207, "epoch": 590} {"train_loss": -9.679551124572754, "global_step": 99208, "epoch": 590} {"train_loss": -9.56022834777832, "global_step": 99209, "epoch": 590} {"train_loss": -9.780442237854004, "global_step": 99210, "epoch": 590} {"train_loss": -9.236824035644531, "global_step": 99211, "epoch": 590} {"train_loss": -9.509889602661133, "global_step": 99212, "epoch": 590} {"train_loss": -9.3575439453125, "global_step": 99213, "epoch": 590} {"train_loss": -9.688702583312988, "global_step": 99214, "epoch": 590} {"train_loss": -9.394174575805664, "global_step": 99215, "epoch": 590} {"train_loss": -9.83363151550293, "global_step": 99216, "epoch": 590} {"train_loss": -9.588573455810547, "global_step": 99217, "epoch": 590} {"train_loss": -9.772897720336914, "global_step": 99218, "epoch": 590} {"train_loss": -9.871047973632812, "global_step": 99219, "epoch": 590} {"train_loss": -9.761887550354004, "global_step": 99220, "epoch": 590} {"train_loss": -9.701620101928711, "global_step": 99221, "epoch": 590} {"train_loss": -9.787705421447754, "global_step": 99222, "epoch": 590} {"train_loss": -9.84055233001709, "global_step": 99223, "epoch": 590} {"train_loss": -9.781953811645508, "global_step": 99224, "epoch": 590} {"train_loss": -9.759970664978027, "global_step": 99225, "epoch": 590} {"train_loss": -9.863523483276367, "global_step": 99226, "epoch": 590} {"train_loss": -9.794001579284668, "global_step": 99227, "epoch": 590} {"train_loss": -9.793466567993164, "global_step": 99228, "epoch": 590} {"train_loss": -9.723419189453125, "global_step": 99229, "epoch": 590} {"train_loss": -9.503009796142578, "global_step": 99230, "epoch": 590} {"train_loss": -9.71259593963623, "global_step": 99231, "epoch": 590} {"train_loss": -9.995548248291016, "global_step": 99232, "epoch": 590} {"train_loss": -9.677787780761719, "global_step": 99233, "epoch": 590} {"train_loss": -9.928433418273926, "global_step": 99234, "epoch": 590} {"train_loss": -9.732853889465332, "global_step": 99235, "epoch": 590} {"train_loss": -9.585403442382812, "global_step": 99236, "epoch": 590} {"train_loss": -10.064369201660156, "global_step": 99237, "epoch": 590} {"train_loss": -9.705615997314453, "global_step": 99238, "epoch": 590} {"train_loss": -10.001901626586914, "global_step": 99239, "epoch": 590} {"train_loss": -9.707442283630371, "global_step": 99240, "epoch": 590} {"train_loss": -9.877934455871582, "global_step": 99241, "epoch": 590} {"train_loss": -9.905553817749023, "global_step": 99242, "epoch": 590} {"train_loss": -9.618419647216797, "global_step": 99243, "epoch": 590} {"train_loss": -9.836735725402832, "global_step": 99244, "epoch": 590} {"train_loss": -9.814018249511719, "global_step": 99245, "epoch": 590} {"train_loss": -10.013660430908203, "global_step": 99246, "epoch": 590} {"train_loss": -9.637045860290527, "global_step": 99247, "epoch": 590} {"train_loss": -9.918681144714355, "global_step": 99248, "epoch": 590} {"train_loss": -9.960227012634277, "global_step": 99249, "epoch": 590} {"train_loss": -9.778079986572266, "global_step": 99250, "epoch": 590} {"train_loss": -9.894935607910156, "global_step": 99251, "epoch": 590} {"train_loss": -9.917242050170898, "global_step": 99252, "epoch": 590} {"train_loss": -9.758559226989746, "global_step": 99253, "epoch": 590} {"train_loss": -9.905009269714355, "global_step": 99254, "epoch": 590} {"train_loss": -9.770317077636719, "global_step": 99255, "epoch": 590} {"train_loss": -9.794038772583008, "global_step": 99256, "epoch": 590} {"train_loss": -9.987588882446289, "global_step": 99257, "epoch": 590} {"train_loss": -9.850870132446289, "global_step": 99258, "epoch": 590} {"train_loss": -9.451557159423828, "global_step": 99259, "epoch": 590} {"train_loss": -9.551025390625, "global_step": 99260, "epoch": 590} {"train_loss": -9.83290958404541, "global_step": 99261, "epoch": 590} {"train_loss": -9.641731262207031, "global_step": 99262, "epoch": 590} {"train_loss": -9.464645385742188, "global_step": 99263, "epoch": 590} {"train_loss": -9.463835716247559, "global_step": 99264, "epoch": 590} {"train_loss": -9.69566822052002, "global_step": 99265, "epoch": 590} {"train_loss": -9.766040802001953, "global_step": 99266, "epoch": 590} {"train_loss": -9.710373878479004, "global_step": 99267, "epoch": 590} {"train_loss": -9.458108901977539, "global_step": 99268, "epoch": 590} {"train_loss": -9.85359001159668, "global_step": 99269, "epoch": 590} {"train_loss": -9.704839706420898, "global_step": 99270, "epoch": 590} {"train_loss": -9.070237159729004, "global_step": 99271, "epoch": 590} {"train_loss": -9.908926010131836, "global_step": 99272, "epoch": 590} {"train_loss": -9.298049926757812, "global_step": 99273, "epoch": 590} {"train_loss": -9.68308162689209, "global_step": 99274, "epoch": 590} {"train_loss": -9.675176620483398, "global_step": 99275, "epoch": 590} {"train_loss": -8.8885498046875, "global_step": 99276, "epoch": 590} {"train_loss": -9.386091232299805, "global_step": 99277, "epoch": 590} {"train_loss": -9.448779106140137, "global_step": 99278, "epoch": 590} {"train_loss": -9.50976276397705, "global_step": 99279, "epoch": 590} {"train_loss": -9.57502555847168, "global_step": 99280, "epoch": 590} {"train_loss": -9.51205825805664, "global_step": 99281, "epoch": 590} {"train_loss": -9.583826065063477, "global_step": 99282, "epoch": 590} {"train_loss": -9.708585739135742, "global_step": 99283, "epoch": 590} {"train_loss": -9.739171981811523, "global_step": 99284, "epoch": 590} {"train_loss": -9.491024017333984, "global_step": 99285, "epoch": 590} {"train_loss": -9.600306510925293, "global_step": 99286, "epoch": 590} {"train_loss": -9.678832956722804, "global_step": 99287, "epoch": 590, "val_loss": 206537.21875, "train_action_mse_error": 3.7592101097106934} {"train_loss": -9.594736099243164, "global_step": 99288, "epoch": 591} {"train_loss": -9.591167449951172, "global_step": 99289, "epoch": 591} {"train_loss": -9.535451889038086, "global_step": 99290, "epoch": 591} {"train_loss": -9.634689331054688, "global_step": 99291, "epoch": 591} {"train_loss": -9.596686363220215, "global_step": 99292, "epoch": 591} {"train_loss": -9.81219482421875, "global_step": 99293, "epoch": 591} {"train_loss": -9.59672737121582, "global_step": 99294, "epoch": 591} {"train_loss": -9.606853485107422, "global_step": 99295, "epoch": 591} {"train_loss": -9.707603454589844, "global_step": 99296, "epoch": 591} {"train_loss": -9.702427864074707, "global_step": 99297, "epoch": 591} {"train_loss": -9.936408996582031, "global_step": 99298, "epoch": 591} {"train_loss": -9.684222221374512, "global_step": 99299, "epoch": 591} {"train_loss": -9.634387969970703, "global_step": 99300, "epoch": 591} {"train_loss": -9.571443557739258, "global_step": 99301, "epoch": 591} {"train_loss": -9.86870002746582, "global_step": 99302, "epoch": 591} {"train_loss": -9.818119049072266, "global_step": 99303, "epoch": 591} {"train_loss": -9.773591995239258, "global_step": 99304, "epoch": 591} {"train_loss": -9.521247863769531, "global_step": 99305, "epoch": 591} {"train_loss": -9.714454650878906, "global_step": 99306, "epoch": 591} {"train_loss": -9.91633129119873, "global_step": 99307, "epoch": 591} {"train_loss": -9.752300262451172, "global_step": 99308, "epoch": 591} {"train_loss": -9.777190208435059, "global_step": 99309, "epoch": 591} {"train_loss": -9.545747756958008, "global_step": 99310, "epoch": 591} {"train_loss": -9.64370059967041, "global_step": 99311, "epoch": 591} {"train_loss": -9.739778518676758, "global_step": 99312, "epoch": 591} {"train_loss": -9.677255630493164, "global_step": 99313, "epoch": 591} {"train_loss": -9.612525939941406, "global_step": 99314, "epoch": 591} {"train_loss": -9.709217071533203, "global_step": 99315, "epoch": 591} {"train_loss": -9.832633972167969, "global_step": 99316, "epoch": 591} {"train_loss": -9.96562385559082, "global_step": 99317, "epoch": 591} {"train_loss": -9.684747695922852, "global_step": 99318, "epoch": 591} {"train_loss": -9.935009002685547, "global_step": 99319, "epoch": 591} {"train_loss": -10.125240325927734, "global_step": 99320, "epoch": 591} {"train_loss": -9.761377334594727, "global_step": 99321, "epoch": 591} {"train_loss": -9.817581176757812, "global_step": 99322, "epoch": 591} {"train_loss": -9.992982864379883, "global_step": 99323, "epoch": 591} {"train_loss": -9.927836418151855, "global_step": 99324, "epoch": 591} {"train_loss": -9.708633422851562, "global_step": 99325, "epoch": 591} {"train_loss": -9.925003051757812, "global_step": 99326, "epoch": 591} {"train_loss": -10.161815643310547, "global_step": 99327, "epoch": 591} {"train_loss": -10.04046630859375, "global_step": 99328, "epoch": 591} {"train_loss": -9.871421813964844, "global_step": 99329, "epoch": 591} {"train_loss": -9.966545104980469, "global_step": 99330, "epoch": 591} {"train_loss": -9.938145637512207, "global_step": 99331, "epoch": 591} {"train_loss": -10.032605171203613, "global_step": 99332, "epoch": 591} {"train_loss": -9.840544700622559, "global_step": 99333, "epoch": 591} {"train_loss": -9.167989730834961, "global_step": 99334, "epoch": 591} {"train_loss": -9.749662399291992, "global_step": 99335, "epoch": 591} {"train_loss": -9.630345344543457, "global_step": 99336, "epoch": 591} {"train_loss": -9.642524719238281, "global_step": 99337, "epoch": 591} {"train_loss": -9.545210838317871, "global_step": 99338, "epoch": 591} {"train_loss": -9.514888763427734, "global_step": 99339, "epoch": 591} {"train_loss": -9.744039535522461, "global_step": 99340, "epoch": 591} {"train_loss": -9.310327529907227, "global_step": 99341, "epoch": 591} {"train_loss": -9.246706008911133, "global_step": 99342, "epoch": 591} {"train_loss": -9.623273849487305, "global_step": 99343, "epoch": 591} {"train_loss": -8.963798522949219, "global_step": 99344, "epoch": 591} {"train_loss": -9.59614086151123, "global_step": 99345, "epoch": 591} {"train_loss": -9.267853736877441, "global_step": 99346, "epoch": 591} {"train_loss": -9.75405502319336, "global_step": 99347, "epoch": 591} {"train_loss": -9.346999168395996, "global_step": 99348, "epoch": 591} {"train_loss": -9.642354011535645, "global_step": 99349, "epoch": 591} {"train_loss": -9.45705795288086, "global_step": 99350, "epoch": 591} {"train_loss": -9.7218017578125, "global_step": 99351, "epoch": 591} {"train_loss": -9.452765464782715, "global_step": 99352, "epoch": 591} {"train_loss": -9.600893020629883, "global_step": 99353, "epoch": 591} {"train_loss": -9.488598823547363, "global_step": 99354, "epoch": 591} {"train_loss": -9.60322093963623, "global_step": 99355, "epoch": 591} {"train_loss": -9.536933898925781, "global_step": 99356, "epoch": 591} {"train_loss": -9.587750434875488, "global_step": 99357, "epoch": 591} {"train_loss": -9.535957336425781, "global_step": 99358, "epoch": 591} {"train_loss": -9.737163543701172, "global_step": 99359, "epoch": 591} {"train_loss": -9.562573432922363, "global_step": 99360, "epoch": 591} {"train_loss": -9.48925495147705, "global_step": 99361, "epoch": 591} {"train_loss": -9.374486923217773, "global_step": 99362, "epoch": 591} {"train_loss": -9.642926216125488, "global_step": 99363, "epoch": 591} {"train_loss": -9.536297798156738, "global_step": 99364, "epoch": 591} {"train_loss": -9.47990608215332, "global_step": 99365, "epoch": 591} {"train_loss": -9.2781343460083, "global_step": 99366, "epoch": 591} {"train_loss": -9.623613357543945, "global_step": 99367, "epoch": 591} {"train_loss": -8.989898681640625, "global_step": 99368, "epoch": 591} {"train_loss": -9.438000679016113, "global_step": 99369, "epoch": 591} {"train_loss": -9.37254524230957, "global_step": 99370, "epoch": 591} {"train_loss": -9.257160186767578, "global_step": 99371, "epoch": 591} {"train_loss": -9.243430137634277, "global_step": 99372, "epoch": 591} {"train_loss": -9.705142974853516, "global_step": 99373, "epoch": 591} {"train_loss": -9.061790466308594, "global_step": 99374, "epoch": 591} {"train_loss": -9.250767707824707, "global_step": 99375, "epoch": 591} {"train_loss": -9.35456657409668, "global_step": 99376, "epoch": 591} {"train_loss": -9.289688110351562, "global_step": 99377, "epoch": 591} {"train_loss": -9.274904251098633, "global_step": 99378, "epoch": 591} {"train_loss": -9.341806411743164, "global_step": 99379, "epoch": 591} {"train_loss": -9.536166191101074, "global_step": 99380, "epoch": 591} {"train_loss": -9.253325462341309, "global_step": 99381, "epoch": 591} {"train_loss": -9.363783836364746, "global_step": 99382, "epoch": 591} {"train_loss": -9.453632354736328, "global_step": 99383, "epoch": 591} {"train_loss": -9.638540267944336, "global_step": 99384, "epoch": 591} {"train_loss": -9.626731872558594, "global_step": 99385, "epoch": 591} {"train_loss": -9.68425464630127, "global_step": 99386, "epoch": 591} {"train_loss": -9.434633255004883, "global_step": 99387, "epoch": 591} {"train_loss": -9.735931396484375, "global_step": 99388, "epoch": 591} {"train_loss": -9.449910163879395, "global_step": 99389, "epoch": 591} {"train_loss": -9.528423309326172, "global_step": 99390, "epoch": 591} {"train_loss": -9.706684112548828, "global_step": 99391, "epoch": 591} {"train_loss": -9.643152236938477, "global_step": 99392, "epoch": 591} {"train_loss": -9.962125778198242, "global_step": 99393, "epoch": 591} {"train_loss": -9.742349624633789, "global_step": 99394, "epoch": 591} {"train_loss": -9.783714294433594, "global_step": 99395, "epoch": 591} {"train_loss": -9.55246353149414, "global_step": 99396, "epoch": 591} {"train_loss": -9.630126953125, "global_step": 99397, "epoch": 591} {"train_loss": -9.832412719726562, "global_step": 99398, "epoch": 591} {"train_loss": -9.664804458618164, "global_step": 99399, "epoch": 591} {"train_loss": -9.7530517578125, "global_step": 99400, "epoch": 591} {"train_loss": -9.791055679321289, "global_step": 99401, "epoch": 591} {"train_loss": -9.496070861816406, "global_step": 99402, "epoch": 591} {"train_loss": -9.918031692504883, "global_step": 99403, "epoch": 591} {"train_loss": -9.89665699005127, "global_step": 99404, "epoch": 591} {"train_loss": -9.36468505859375, "global_step": 99405, "epoch": 591} {"train_loss": -9.432428359985352, "global_step": 99406, "epoch": 591} {"train_loss": -9.499839782714844, "global_step": 99407, "epoch": 591} {"train_loss": -9.14089584350586, "global_step": 99408, "epoch": 591} {"train_loss": -9.467386245727539, "global_step": 99409, "epoch": 591} {"train_loss": -9.271187782287598, "global_step": 99410, "epoch": 591} {"train_loss": -9.381346702575684, "global_step": 99411, "epoch": 591} {"train_loss": -9.55015754699707, "global_step": 99412, "epoch": 591} {"train_loss": -9.024068832397461, "global_step": 99413, "epoch": 591} {"train_loss": -9.356391906738281, "global_step": 99414, "epoch": 591} {"train_loss": -9.359049797058105, "global_step": 99415, "epoch": 591} {"train_loss": -9.434837341308594, "global_step": 99416, "epoch": 591} {"train_loss": -9.422240257263184, "global_step": 99417, "epoch": 591} {"train_loss": -9.414810180664062, "global_step": 99418, "epoch": 591} {"train_loss": -9.676329612731934, "global_step": 99419, "epoch": 591} {"train_loss": -9.440244674682617, "global_step": 99420, "epoch": 591} {"train_loss": -9.630029678344727, "global_step": 99421, "epoch": 591} {"train_loss": -9.272390365600586, "global_step": 99422, "epoch": 591} {"train_loss": -9.651910781860352, "global_step": 99423, "epoch": 591} {"train_loss": -9.164602279663086, "global_step": 99424, "epoch": 591} {"train_loss": -9.506641387939453, "global_step": 99425, "epoch": 591} {"train_loss": -9.50727653503418, "global_step": 99426, "epoch": 591} {"train_loss": -9.605875015258789, "global_step": 99427, "epoch": 591} {"train_loss": -9.378318786621094, "global_step": 99428, "epoch": 591} {"train_loss": -9.785045623779297, "global_step": 99429, "epoch": 591} {"train_loss": -9.637121200561523, "global_step": 99430, "epoch": 591} {"train_loss": -9.51628303527832, "global_step": 99431, "epoch": 591} {"train_loss": -9.440034866333008, "global_step": 99432, "epoch": 591} {"train_loss": -9.743768692016602, "global_step": 99433, "epoch": 591} {"train_loss": -9.681768417358398, "global_step": 99434, "epoch": 591} {"train_loss": -9.300768852233887, "global_step": 99435, "epoch": 591} {"train_loss": -9.53266429901123, "global_step": 99436, "epoch": 591} {"train_loss": -9.354039192199707, "global_step": 99437, "epoch": 591} {"train_loss": -9.512968063354492, "global_step": 99438, "epoch": 591} {"train_loss": -9.359172821044922, "global_step": 99439, "epoch": 591} {"train_loss": -9.814212799072266, "global_step": 99440, "epoch": 591} {"train_loss": -9.462644577026367, "global_step": 99441, "epoch": 591} {"train_loss": -9.449501037597656, "global_step": 99442, "epoch": 591} {"train_loss": -9.794463157653809, "global_step": 99443, "epoch": 591} {"train_loss": -9.449808120727539, "global_step": 99444, "epoch": 591} {"train_loss": -9.765426635742188, "global_step": 99445, "epoch": 591} {"train_loss": -9.589507102966309, "global_step": 99446, "epoch": 591} {"train_loss": -9.582686424255371, "global_step": 99447, "epoch": 591} {"train_loss": -9.56542682647705, "global_step": 99448, "epoch": 591} {"train_loss": -9.627277374267578, "global_step": 99449, "epoch": 591} {"train_loss": -9.520288467407227, "global_step": 99450, "epoch": 591} {"train_loss": -9.765789985656738, "global_step": 99451, "epoch": 591} {"train_loss": -9.467061042785645, "global_step": 99452, "epoch": 591} {"train_loss": -9.612494468688965, "global_step": 99453, "epoch": 591} {"train_loss": -9.648481369018555, "global_step": 99454, "epoch": 591} {"train_loss": -9.586515137127467, "global_step": 99455, "epoch": 591, "val_loss": 205908.734375} {"train_loss": -9.72788143157959, "global_step": 99456, "epoch": 592} {"train_loss": -9.650399208068848, "global_step": 99457, "epoch": 592} {"train_loss": -9.682092666625977, "global_step": 99458, "epoch": 592} {"train_loss": -9.541736602783203, "global_step": 99459, "epoch": 592} {"train_loss": -9.558202743530273, "global_step": 99460, "epoch": 592} {"train_loss": -9.583905220031738, "global_step": 99461, "epoch": 592} {"train_loss": -9.804912567138672, "global_step": 99462, "epoch": 592} {"train_loss": -9.40700912475586, "global_step": 99463, "epoch": 592} {"train_loss": -9.756049156188965, "global_step": 99464, "epoch": 592} {"train_loss": -9.504554748535156, "global_step": 99465, "epoch": 592} {"train_loss": -9.616764068603516, "global_step": 99466, "epoch": 592} {"train_loss": -9.915853500366211, "global_step": 99467, "epoch": 592} {"train_loss": -9.890539169311523, "global_step": 99468, "epoch": 592} {"train_loss": -9.45324420928955, "global_step": 99469, "epoch": 592} {"train_loss": -9.840740203857422, "global_step": 99470, "epoch": 592} {"train_loss": -9.695779800415039, "global_step": 99471, "epoch": 592} {"train_loss": -9.73398494720459, "global_step": 99472, "epoch": 592} {"train_loss": -9.681048393249512, "global_step": 99473, "epoch": 592} {"train_loss": -9.304871559143066, "global_step": 99474, "epoch": 592} {"train_loss": -9.99099063873291, "global_step": 99475, "epoch": 592} {"train_loss": -9.451485633850098, "global_step": 99476, "epoch": 592} {"train_loss": -9.694116592407227, "global_step": 99477, "epoch": 592} {"train_loss": -9.817926406860352, "global_step": 99478, "epoch": 592} {"train_loss": -9.639893531799316, "global_step": 99479, "epoch": 592} {"train_loss": -9.432601928710938, "global_step": 99480, "epoch": 592} {"train_loss": -9.743727684020996, "global_step": 99481, "epoch": 592} {"train_loss": -9.670039176940918, "global_step": 99482, "epoch": 592} {"train_loss": -9.606878280639648, "global_step": 99483, "epoch": 592} {"train_loss": -9.631694793701172, "global_step": 99484, "epoch": 592} {"train_loss": -9.76405143737793, "global_step": 99485, "epoch": 592} {"train_loss": -9.428560256958008, "global_step": 99486, "epoch": 592} {"train_loss": -9.67257022857666, "global_step": 99487, "epoch": 592} {"train_loss": -9.627972602844238, "global_step": 99488, "epoch": 592} {"train_loss": -9.734176635742188, "global_step": 99489, "epoch": 592} {"train_loss": -9.633642196655273, "global_step": 99490, "epoch": 592} {"train_loss": -9.807580947875977, "global_step": 99491, "epoch": 592} {"train_loss": -9.613245010375977, "global_step": 99492, "epoch": 592} {"train_loss": -9.57560920715332, "global_step": 99493, "epoch": 592} {"train_loss": -9.675008773803711, "global_step": 99494, "epoch": 592} {"train_loss": -9.53096866607666, "global_step": 99495, "epoch": 592} {"train_loss": -9.783984184265137, "global_step": 99496, "epoch": 592} {"train_loss": -9.65986156463623, "global_step": 99497, "epoch": 592} {"train_loss": -9.86314868927002, "global_step": 99498, "epoch": 592} {"train_loss": -9.903038024902344, "global_step": 99499, "epoch": 592} {"train_loss": -9.599974632263184, "global_step": 99500, "epoch": 592} {"train_loss": -9.892319679260254, "global_step": 99501, "epoch": 592} {"train_loss": -9.772077560424805, "global_step": 99502, "epoch": 592} {"train_loss": -9.738218307495117, "global_step": 99503, "epoch": 592} {"train_loss": -9.756242752075195, "global_step": 99504, "epoch": 592} {"train_loss": -9.874951362609863, "global_step": 99505, "epoch": 592} {"train_loss": -9.614214897155762, "global_step": 99506, "epoch": 592} {"train_loss": -9.83662223815918, "global_step": 99507, "epoch": 592} {"train_loss": -9.800812721252441, "global_step": 99508, "epoch": 592} {"train_loss": -9.767705917358398, "global_step": 99509, "epoch": 592} {"train_loss": -9.998808860778809, "global_step": 99510, "epoch": 592} {"train_loss": -9.712043762207031, "global_step": 99511, "epoch": 592} {"train_loss": -9.723384857177734, "global_step": 99512, "epoch": 592} {"train_loss": -9.7210054397583, "global_step": 99513, "epoch": 592} {"train_loss": -9.673056602478027, "global_step": 99514, "epoch": 592} {"train_loss": -9.616705894470215, "global_step": 99515, "epoch": 592} {"train_loss": -9.698958396911621, "global_step": 99516, "epoch": 592} {"train_loss": -9.598796844482422, "global_step": 99517, "epoch": 592} {"train_loss": -9.774683952331543, "global_step": 99518, "epoch": 592} {"train_loss": -9.331904411315918, "global_step": 99519, "epoch": 592} {"train_loss": -9.896566390991211, "global_step": 99520, "epoch": 592} {"train_loss": -9.612653732299805, "global_step": 99521, "epoch": 592} {"train_loss": -9.354981422424316, "global_step": 99522, "epoch": 592} {"train_loss": -9.656087875366211, "global_step": 99523, "epoch": 592} {"train_loss": -9.171860694885254, "global_step": 99524, "epoch": 592} {"train_loss": -9.358476638793945, "global_step": 99525, "epoch": 592} {"train_loss": -9.278857231140137, "global_step": 99526, "epoch": 592} {"train_loss": -8.976852416992188, "global_step": 99527, "epoch": 592} {"train_loss": -9.094476699829102, "global_step": 99528, "epoch": 592} {"train_loss": -9.412410736083984, "global_step": 99529, "epoch": 592} {"train_loss": -9.051694869995117, "global_step": 99530, "epoch": 592} {"train_loss": -9.139800071716309, "global_step": 99531, "epoch": 592} {"train_loss": -8.868955612182617, "global_step": 99532, "epoch": 592} {"train_loss": -8.81776237487793, "global_step": 99533, "epoch": 592} {"train_loss": -8.753867149353027, "global_step": 99534, "epoch": 592} {"train_loss": -9.123887062072754, "global_step": 99535, "epoch": 592} {"train_loss": -9.23968505859375, "global_step": 99536, "epoch": 592} {"train_loss": -9.11427116394043, "global_step": 99537, "epoch": 592} {"train_loss": -9.461372375488281, "global_step": 99538, "epoch": 592} {"train_loss": -9.068020820617676, "global_step": 99539, "epoch": 592} {"train_loss": -9.534347534179688, "global_step": 99540, "epoch": 592} {"train_loss": -9.29279899597168, "global_step": 99541, "epoch": 592} {"train_loss": -9.467684745788574, "global_step": 99542, "epoch": 592} {"train_loss": -9.486968994140625, "global_step": 99543, "epoch": 592} {"train_loss": -9.39542007446289, "global_step": 99544, "epoch": 592} {"train_loss": -9.540395736694336, "global_step": 99545, "epoch": 592} {"train_loss": -9.106195449829102, "global_step": 99546, "epoch": 592} {"train_loss": -9.550331115722656, "global_step": 99547, "epoch": 592} {"train_loss": -9.475580215454102, "global_step": 99548, "epoch": 592} {"train_loss": -9.567499160766602, "global_step": 99549, "epoch": 592} {"train_loss": -9.595237731933594, "global_step": 99550, "epoch": 592} {"train_loss": -9.522466659545898, "global_step": 99551, "epoch": 592} {"train_loss": -9.60250186920166, "global_step": 99552, "epoch": 592} {"train_loss": -9.532403945922852, "global_step": 99553, "epoch": 592} {"train_loss": -9.770318984985352, "global_step": 99554, "epoch": 592} {"train_loss": -9.728281021118164, "global_step": 99555, "epoch": 592} {"train_loss": -9.87661075592041, "global_step": 99556, "epoch": 592} {"train_loss": -9.731571197509766, "global_step": 99557, "epoch": 592} {"train_loss": -9.841083526611328, "global_step": 99558, "epoch": 592} {"train_loss": -9.921219825744629, "global_step": 99559, "epoch": 592} {"train_loss": -9.786746978759766, "global_step": 99560, "epoch": 592} {"train_loss": -9.611599922180176, "global_step": 99561, "epoch": 592} {"train_loss": -9.850726127624512, "global_step": 99562, "epoch": 592} {"train_loss": -9.872018814086914, "global_step": 99563, "epoch": 592} {"train_loss": -9.901079177856445, "global_step": 99564, "epoch": 592} {"train_loss": -9.717122077941895, "global_step": 99565, "epoch": 592} {"train_loss": -9.881429672241211, "global_step": 99566, "epoch": 592} {"train_loss": -9.83203411102295, "global_step": 99567, "epoch": 592} {"train_loss": -10.08118724822998, "global_step": 99568, "epoch": 592} {"train_loss": -9.874303817749023, "global_step": 99569, "epoch": 592} {"train_loss": -9.756095886230469, "global_step": 99570, "epoch": 592} {"train_loss": -9.67752742767334, "global_step": 99571, "epoch": 592} {"train_loss": -9.695900917053223, "global_step": 99572, "epoch": 592} {"train_loss": -9.595085144042969, "global_step": 99573, "epoch": 592} {"train_loss": -9.174992561340332, "global_step": 99574, "epoch": 592} {"train_loss": -9.739090919494629, "global_step": 99575, "epoch": 592} {"train_loss": -9.253150939941406, "global_step": 99576, "epoch": 592} {"train_loss": -9.446039199829102, "global_step": 99577, "epoch": 592} {"train_loss": -9.983087539672852, "global_step": 99578, "epoch": 592} {"train_loss": -9.274035453796387, "global_step": 99579, "epoch": 592} {"train_loss": -9.489397048950195, "global_step": 99580, "epoch": 592} {"train_loss": -9.440513610839844, "global_step": 99581, "epoch": 592} {"train_loss": -9.50282096862793, "global_step": 99582, "epoch": 592} {"train_loss": -9.266118049621582, "global_step": 99583, "epoch": 592} {"train_loss": -9.665144920349121, "global_step": 99584, "epoch": 592} {"train_loss": -9.723371505737305, "global_step": 99585, "epoch": 592} {"train_loss": -9.416851043701172, "global_step": 99586, "epoch": 592} {"train_loss": -9.76962947845459, "global_step": 99587, "epoch": 592} {"train_loss": -9.62109375, "global_step": 99588, "epoch": 592} {"train_loss": -9.735218048095703, "global_step": 99589, "epoch": 592} {"train_loss": -9.76011848449707, "global_step": 99590, "epoch": 592} {"train_loss": -9.489978790283203, "global_step": 99591, "epoch": 592} {"train_loss": -9.689901351928711, "global_step": 99592, "epoch": 592} {"train_loss": -9.652289390563965, "global_step": 99593, "epoch": 592} {"train_loss": -9.748698234558105, "global_step": 99594, "epoch": 592} {"train_loss": -9.575569152832031, "global_step": 99595, "epoch": 592} {"train_loss": -9.819110870361328, "global_step": 99596, "epoch": 592} {"train_loss": -9.55859375, "global_step": 99597, "epoch": 592} {"train_loss": -9.68034839630127, "global_step": 99598, "epoch": 592} {"train_loss": -9.589529037475586, "global_step": 99599, "epoch": 592} {"train_loss": -9.805065155029297, "global_step": 99600, "epoch": 592} {"train_loss": -9.638490676879883, "global_step": 99601, "epoch": 592} {"train_loss": -9.793810844421387, "global_step": 99602, "epoch": 592} {"train_loss": -9.747685432434082, "global_step": 99603, "epoch": 592} {"train_loss": -9.701547622680664, "global_step": 99604, "epoch": 592} {"train_loss": -9.697729110717773, "global_step": 99605, "epoch": 592} {"train_loss": -9.610488891601562, "global_step": 99606, "epoch": 592} {"train_loss": -9.676730155944824, "global_step": 99607, "epoch": 592} {"train_loss": -9.376331329345703, "global_step": 99608, "epoch": 592} {"train_loss": -9.55654525756836, "global_step": 99609, "epoch": 592} {"train_loss": -9.331897735595703, "global_step": 99610, "epoch": 592} {"train_loss": -9.772457122802734, "global_step": 99611, "epoch": 592} {"train_loss": -9.351802825927734, "global_step": 99612, "epoch": 592} {"train_loss": -9.474936485290527, "global_step": 99613, "epoch": 592} {"train_loss": -9.660297393798828, "global_step": 99614, "epoch": 592} {"train_loss": -9.525169372558594, "global_step": 99615, "epoch": 592} {"train_loss": -9.578327178955078, "global_step": 99616, "epoch": 592} {"train_loss": -9.60430908203125, "global_step": 99617, "epoch": 592} {"train_loss": -9.633079528808594, "global_step": 99618, "epoch": 592} {"train_loss": -9.829726219177246, "global_step": 99619, "epoch": 592} {"train_loss": -9.84292221069336, "global_step": 99620, "epoch": 592} {"train_loss": -9.657037734985352, "global_step": 99621, "epoch": 592} {"train_loss": -9.611612319946289, "global_step": 99622, "epoch": 592} {"train_loss": -9.601609241394769, "global_step": 99623, "epoch": 592, "val_loss": 206670.15625} {"train_loss": -9.751480102539062, "global_step": 99624, "epoch": 593} {"train_loss": -9.801389694213867, "global_step": 99625, "epoch": 593} {"train_loss": -9.837804794311523, "global_step": 99626, "epoch": 593} {"train_loss": -9.739083290100098, "global_step": 99627, "epoch": 593} {"train_loss": -9.65555477142334, "global_step": 99628, "epoch": 593} {"train_loss": -9.798145294189453, "global_step": 99629, "epoch": 593} {"train_loss": -9.539981842041016, "global_step": 99630, "epoch": 593} {"train_loss": -9.663467407226562, "global_step": 99631, "epoch": 593} {"train_loss": -9.654773712158203, "global_step": 99632, "epoch": 593} {"train_loss": -9.824670791625977, "global_step": 99633, "epoch": 593} {"train_loss": -9.55975341796875, "global_step": 99634, "epoch": 593} {"train_loss": -9.788567543029785, "global_step": 99635, "epoch": 593} {"train_loss": -9.657283782958984, "global_step": 99636, "epoch": 593} {"train_loss": -9.621316909790039, "global_step": 99637, "epoch": 593} {"train_loss": -9.66377067565918, "global_step": 99638, "epoch": 593} {"train_loss": -9.669535636901855, "global_step": 99639, "epoch": 593} {"train_loss": -9.483064651489258, "global_step": 99640, "epoch": 593} {"train_loss": -9.689866065979004, "global_step": 99641, "epoch": 593} {"train_loss": -9.679738998413086, "global_step": 99642, "epoch": 593} {"train_loss": -9.583505630493164, "global_step": 99643, "epoch": 593} {"train_loss": -9.764232635498047, "global_step": 99644, "epoch": 593} {"train_loss": -9.46225643157959, "global_step": 99645, "epoch": 593} {"train_loss": -9.759407997131348, "global_step": 99646, "epoch": 593} {"train_loss": -9.476800918579102, "global_step": 99647, "epoch": 593} {"train_loss": -9.676993370056152, "global_step": 99648, "epoch": 593} {"train_loss": -9.242706298828125, "global_step": 99649, "epoch": 593} {"train_loss": -9.096055030822754, "global_step": 99650, "epoch": 593} {"train_loss": -9.325240135192871, "global_step": 99651, "epoch": 593} {"train_loss": -9.260767936706543, "global_step": 99652, "epoch": 593} {"train_loss": -9.35399055480957, "global_step": 99653, "epoch": 593} {"train_loss": -9.510507583618164, "global_step": 99654, "epoch": 593} {"train_loss": -9.081620216369629, "global_step": 99655, "epoch": 593} {"train_loss": -9.882509231567383, "global_step": 99656, "epoch": 593} {"train_loss": -9.529559135437012, "global_step": 99657, "epoch": 593} {"train_loss": -9.497823715209961, "global_step": 99658, "epoch": 593} {"train_loss": -9.487051010131836, "global_step": 99659, "epoch": 593} {"train_loss": -9.630291938781738, "global_step": 99660, "epoch": 593} {"train_loss": -9.625396728515625, "global_step": 99661, "epoch": 593} {"train_loss": -9.872883796691895, "global_step": 99662, "epoch": 593} {"train_loss": -9.580276489257812, "global_step": 99663, "epoch": 593} {"train_loss": -9.792887687683105, "global_step": 99664, "epoch": 593} {"train_loss": -9.679849624633789, "global_step": 99665, "epoch": 593} {"train_loss": -9.814861297607422, "global_step": 99666, "epoch": 593} {"train_loss": -9.779929161071777, "global_step": 99667, "epoch": 593} {"train_loss": -9.606664657592773, "global_step": 99668, "epoch": 593} {"train_loss": -9.70957088470459, "global_step": 99669, "epoch": 593} {"train_loss": -9.625222206115723, "global_step": 99670, "epoch": 593} {"train_loss": -9.644304275512695, "global_step": 99671, "epoch": 593} {"train_loss": -9.802650451660156, "global_step": 99672, "epoch": 593} {"train_loss": -9.65037727355957, "global_step": 99673, "epoch": 593} {"train_loss": -9.751272201538086, "global_step": 99674, "epoch": 593} {"train_loss": -9.657062530517578, "global_step": 99675, "epoch": 593} {"train_loss": -9.825225830078125, "global_step": 99676, "epoch": 593} {"train_loss": -9.716909408569336, "global_step": 99677, "epoch": 593} {"train_loss": -9.70592975616455, "global_step": 99678, "epoch": 593} {"train_loss": -9.752955436706543, "global_step": 99679, "epoch": 593} {"train_loss": -9.701541900634766, "global_step": 99680, "epoch": 593} {"train_loss": -9.482988357543945, "global_step": 99681, "epoch": 593} {"train_loss": -9.920607566833496, "global_step": 99682, "epoch": 593} {"train_loss": -9.736988067626953, "global_step": 99683, "epoch": 593} {"train_loss": -9.855046272277832, "global_step": 99684, "epoch": 593} {"train_loss": -9.691753387451172, "global_step": 99685, "epoch": 593} {"train_loss": -9.76724910736084, "global_step": 99686, "epoch": 593} {"train_loss": -9.76364517211914, "global_step": 99687, "epoch": 593} {"train_loss": -9.75907039642334, "global_step": 99688, "epoch": 593} {"train_loss": -9.64868450164795, "global_step": 99689, "epoch": 593} {"train_loss": -9.38012981414795, "global_step": 99690, "epoch": 593} {"train_loss": -9.735596656799316, "global_step": 99691, "epoch": 593} {"train_loss": -9.837876319885254, "global_step": 99692, "epoch": 593} {"train_loss": -9.25586223602295, "global_step": 99693, "epoch": 593} {"train_loss": -9.427119255065918, "global_step": 99694, "epoch": 593} {"train_loss": -9.81495475769043, "global_step": 99695, "epoch": 593} {"train_loss": -9.486501693725586, "global_step": 99696, "epoch": 593} {"train_loss": -9.518220901489258, "global_step": 99697, "epoch": 593} {"train_loss": -9.754281997680664, "global_step": 99698, "epoch": 593} {"train_loss": -9.56485366821289, "global_step": 99699, "epoch": 593} {"train_loss": -9.40091323852539, "global_step": 99700, "epoch": 593} {"train_loss": -9.645157814025879, "global_step": 99701, "epoch": 593} {"train_loss": -9.216176986694336, "global_step": 99702, "epoch": 593} {"train_loss": -9.863423347473145, "global_step": 99703, "epoch": 593} {"train_loss": -9.539430618286133, "global_step": 99704, "epoch": 593} {"train_loss": -9.731874465942383, "global_step": 99705, "epoch": 593} {"train_loss": -9.710975646972656, "global_step": 99706, "epoch": 593} {"train_loss": -9.60932731628418, "global_step": 99707, "epoch": 593} {"train_loss": -9.56294059753418, "global_step": 99708, "epoch": 593} {"train_loss": -9.859149932861328, "global_step": 99709, "epoch": 593} {"train_loss": -9.919283866882324, "global_step": 99710, "epoch": 593} {"train_loss": -9.737918853759766, "global_step": 99711, "epoch": 593} {"train_loss": -9.76692008972168, "global_step": 99712, "epoch": 593} {"train_loss": -9.563365936279297, "global_step": 99713, "epoch": 593} {"train_loss": -9.802106857299805, "global_step": 99714, "epoch": 593} {"train_loss": -9.759033203125, "global_step": 99715, "epoch": 593} {"train_loss": -9.914176940917969, "global_step": 99716, "epoch": 593} {"train_loss": -9.8176851272583, "global_step": 99717, "epoch": 593} {"train_loss": -9.820512771606445, "global_step": 99718, "epoch": 593} {"train_loss": -9.76000690460205, "global_step": 99719, "epoch": 593} {"train_loss": -9.807486534118652, "global_step": 99720, "epoch": 593} {"train_loss": -9.581408500671387, "global_step": 99721, "epoch": 593} {"train_loss": -10.008769989013672, "global_step": 99722, "epoch": 593} {"train_loss": -9.632427215576172, "global_step": 99723, "epoch": 593} {"train_loss": -9.954030990600586, "global_step": 99724, "epoch": 593} {"train_loss": -9.778393745422363, "global_step": 99725, "epoch": 593} {"train_loss": -9.927994728088379, "global_step": 99726, "epoch": 593} {"train_loss": -10.094684600830078, "global_step": 99727, "epoch": 593} {"train_loss": -9.660192489624023, "global_step": 99728, "epoch": 593} {"train_loss": -9.983922958374023, "global_step": 99729, "epoch": 593} {"train_loss": -9.841242790222168, "global_step": 99730, "epoch": 593} {"train_loss": -9.59150218963623, "global_step": 99731, "epoch": 593} {"train_loss": -9.845419883728027, "global_step": 99732, "epoch": 593} {"train_loss": -9.837806701660156, "global_step": 99733, "epoch": 593} {"train_loss": -9.488306045532227, "global_step": 99734, "epoch": 593} {"train_loss": -9.933172225952148, "global_step": 99735, "epoch": 593} {"train_loss": -9.442220687866211, "global_step": 99736, "epoch": 593} {"train_loss": -9.406753540039062, "global_step": 99737, "epoch": 593} {"train_loss": -9.293282508850098, "global_step": 99738, "epoch": 593} {"train_loss": -9.382532119750977, "global_step": 99739, "epoch": 593} {"train_loss": -9.017364501953125, "global_step": 99740, "epoch": 593} {"train_loss": -9.866451263427734, "global_step": 99741, "epoch": 593} {"train_loss": -9.452559471130371, "global_step": 99742, "epoch": 593} {"train_loss": -9.689332962036133, "global_step": 99743, "epoch": 593} {"train_loss": -9.707287788391113, "global_step": 99744, "epoch": 593} {"train_loss": -9.295028686523438, "global_step": 99745, "epoch": 593} {"train_loss": -9.53139877319336, "global_step": 99746, "epoch": 593} {"train_loss": -9.325334548950195, "global_step": 99747, "epoch": 593} {"train_loss": -9.64596939086914, "global_step": 99748, "epoch": 593} {"train_loss": -9.712066650390625, "global_step": 99749, "epoch": 593} {"train_loss": -9.5720853805542, "global_step": 99750, "epoch": 593} {"train_loss": -9.598381042480469, "global_step": 99751, "epoch": 593} {"train_loss": -9.63076114654541, "global_step": 99752, "epoch": 593} {"train_loss": -9.867015838623047, "global_step": 99753, "epoch": 593} {"train_loss": -9.639627456665039, "global_step": 99754, "epoch": 593} {"train_loss": -9.678669929504395, "global_step": 99755, "epoch": 593} {"train_loss": -9.595527648925781, "global_step": 99756, "epoch": 593} {"train_loss": -9.835981369018555, "global_step": 99757, "epoch": 593} {"train_loss": -9.684654235839844, "global_step": 99758, "epoch": 593} {"train_loss": -9.860530853271484, "global_step": 99759, "epoch": 593} {"train_loss": -9.763527870178223, "global_step": 99760, "epoch": 593} {"train_loss": -9.81321907043457, "global_step": 99761, "epoch": 593} {"train_loss": -9.772218704223633, "global_step": 99762, "epoch": 593} {"train_loss": -9.786327362060547, "global_step": 99763, "epoch": 593} {"train_loss": -9.772378921508789, "global_step": 99764, "epoch": 593} {"train_loss": -10.017499923706055, "global_step": 99765, "epoch": 593} {"train_loss": -9.698129653930664, "global_step": 99766, "epoch": 593} {"train_loss": -9.911296844482422, "global_step": 99767, "epoch": 593} {"train_loss": -9.75006103515625, "global_step": 99768, "epoch": 593} {"train_loss": -9.603737831115723, "global_step": 99769, "epoch": 593} {"train_loss": -9.865493774414062, "global_step": 99770, "epoch": 593} {"train_loss": -9.747950553894043, "global_step": 99771, "epoch": 593} {"train_loss": -9.737571716308594, "global_step": 99772, "epoch": 593} {"train_loss": -9.864898681640625, "global_step": 99773, "epoch": 593} {"train_loss": -9.87501335144043, "global_step": 99774, "epoch": 593} {"train_loss": -9.741090774536133, "global_step": 99775, "epoch": 593} {"train_loss": -10.019244194030762, "global_step": 99776, "epoch": 593} {"train_loss": -9.587096214294434, "global_step": 99777, "epoch": 593} {"train_loss": -9.979605674743652, "global_step": 99778, "epoch": 593} {"train_loss": -10.096071243286133, "global_step": 99779, "epoch": 593} {"train_loss": -9.823978424072266, "global_step": 99780, "epoch": 593} {"train_loss": -9.751994132995605, "global_step": 99781, "epoch": 593} {"train_loss": -9.53957748413086, "global_step": 99782, "epoch": 593} {"train_loss": -9.930347442626953, "global_step": 99783, "epoch": 593} {"train_loss": -9.677847862243652, "global_step": 99784, "epoch": 593} {"train_loss": -9.383649826049805, "global_step": 99785, "epoch": 593} {"train_loss": -9.749058723449707, "global_step": 99786, "epoch": 593} {"train_loss": -9.682415008544922, "global_step": 99787, "epoch": 593} {"train_loss": -9.760744094848633, "global_step": 99788, "epoch": 593} {"train_loss": -9.464676856994629, "global_step": 99789, "epoch": 593} {"train_loss": -9.398103713989258, "global_step": 99790, "epoch": 593} {"train_loss": -9.674862106641134, "global_step": 99791, "epoch": 593, "val_loss": 207297.8125} {"train_loss": -9.6825532913208, "global_step": 99792, "epoch": 594} {"train_loss": -9.938804626464844, "global_step": 99793, "epoch": 594} {"train_loss": -9.578764915466309, "global_step": 99794, "epoch": 594} {"train_loss": -9.67312240600586, "global_step": 99795, "epoch": 594} {"train_loss": -9.259462356567383, "global_step": 99796, "epoch": 594} {"train_loss": -9.862346649169922, "global_step": 99797, "epoch": 594} {"train_loss": -9.710165977478027, "global_step": 99798, "epoch": 594} {"train_loss": -9.652615547180176, "global_step": 99799, "epoch": 594} {"train_loss": -9.727581024169922, "global_step": 99800, "epoch": 594} {"train_loss": -9.341232299804688, "global_step": 99801, "epoch": 594} {"train_loss": -9.490863800048828, "global_step": 99802, "epoch": 594} {"train_loss": -9.430200576782227, "global_step": 99803, "epoch": 594} {"train_loss": -9.621238708496094, "global_step": 99804, "epoch": 594} {"train_loss": -9.66860294342041, "global_step": 99805, "epoch": 594} {"train_loss": -9.45622444152832, "global_step": 99806, "epoch": 594} {"train_loss": -9.400922775268555, "global_step": 99807, "epoch": 594} {"train_loss": -9.524105072021484, "global_step": 99808, "epoch": 594} {"train_loss": -9.289104461669922, "global_step": 99809, "epoch": 594} {"train_loss": -9.747966766357422, "global_step": 99810, "epoch": 594} {"train_loss": -9.488554954528809, "global_step": 99811, "epoch": 594} {"train_loss": -9.773531913757324, "global_step": 99812, "epoch": 594} {"train_loss": -9.63364028930664, "global_step": 99813, "epoch": 594} {"train_loss": -9.542633056640625, "global_step": 99814, "epoch": 594} {"train_loss": -9.725555419921875, "global_step": 99815, "epoch": 594} {"train_loss": -9.941102981567383, "global_step": 99816, "epoch": 594} {"train_loss": -9.498950958251953, "global_step": 99817, "epoch": 594} {"train_loss": -9.94851303100586, "global_step": 99818, "epoch": 594} {"train_loss": -9.773574829101562, "global_step": 99819, "epoch": 594} {"train_loss": -9.405384063720703, "global_step": 99820, "epoch": 594} {"train_loss": -9.616555213928223, "global_step": 99821, "epoch": 594} {"train_loss": -9.479225158691406, "global_step": 99822, "epoch": 594} {"train_loss": -9.659972190856934, "global_step": 99823, "epoch": 594} {"train_loss": -9.481220245361328, "global_step": 99824, "epoch": 594} {"train_loss": -9.67402458190918, "global_step": 99825, "epoch": 594} {"train_loss": -9.958927154541016, "global_step": 99826, "epoch": 594} {"train_loss": -9.53702449798584, "global_step": 99827, "epoch": 594} {"train_loss": -9.687309265136719, "global_step": 99828, "epoch": 594} {"train_loss": -9.664192199707031, "global_step": 99829, "epoch": 594} {"train_loss": -9.516480445861816, "global_step": 99830, "epoch": 594} {"train_loss": -9.937049865722656, "global_step": 99831, "epoch": 594} {"train_loss": -9.755884170532227, "global_step": 99832, "epoch": 594} {"train_loss": -9.845337867736816, "global_step": 99833, "epoch": 594} {"train_loss": -9.575363159179688, "global_step": 99834, "epoch": 594} {"train_loss": -9.869670867919922, "global_step": 99835, "epoch": 594} {"train_loss": -9.537353515625, "global_step": 99836, "epoch": 594} {"train_loss": -9.448667526245117, "global_step": 99837, "epoch": 594} {"train_loss": -9.646062850952148, "global_step": 99838, "epoch": 594} {"train_loss": -9.768936157226562, "global_step": 99839, "epoch": 594} {"train_loss": -9.314006805419922, "global_step": 99840, "epoch": 594} {"train_loss": -9.767781257629395, "global_step": 99841, "epoch": 594} {"train_loss": -9.344715118408203, "global_step": 99842, "epoch": 594} {"train_loss": -9.592436790466309, "global_step": 99843, "epoch": 594} {"train_loss": -9.450626373291016, "global_step": 99844, "epoch": 594} {"train_loss": -9.749728202819824, "global_step": 99845, "epoch": 594} {"train_loss": -9.42668342590332, "global_step": 99846, "epoch": 594} {"train_loss": -9.791817665100098, "global_step": 99847, "epoch": 594} {"train_loss": -9.439102172851562, "global_step": 99848, "epoch": 594} {"train_loss": -9.704002380371094, "global_step": 99849, "epoch": 594} {"train_loss": -9.258241653442383, "global_step": 99850, "epoch": 594} {"train_loss": -9.648599624633789, "global_step": 99851, "epoch": 594} {"train_loss": -9.050774574279785, "global_step": 99852, "epoch": 594} {"train_loss": -9.530723571777344, "global_step": 99853, "epoch": 594} {"train_loss": -9.031408309936523, "global_step": 99854, "epoch": 594} {"train_loss": -9.475921630859375, "global_step": 99855, "epoch": 594} {"train_loss": -9.374160766601562, "global_step": 99856, "epoch": 594} {"train_loss": -9.633291244506836, "global_step": 99857, "epoch": 594} {"train_loss": -9.331125259399414, "global_step": 99858, "epoch": 594} {"train_loss": -9.189779281616211, "global_step": 99859, "epoch": 594} {"train_loss": -9.631916999816895, "global_step": 99860, "epoch": 594} {"train_loss": -9.505475997924805, "global_step": 99861, "epoch": 594} {"train_loss": -9.494876861572266, "global_step": 99862, "epoch": 594} {"train_loss": -9.513465881347656, "global_step": 99863, "epoch": 594} {"train_loss": -9.511760711669922, "global_step": 99864, "epoch": 594} {"train_loss": -9.499554634094238, "global_step": 99865, "epoch": 594} {"train_loss": -9.53815746307373, "global_step": 99866, "epoch": 594} {"train_loss": -9.530076026916504, "global_step": 99867, "epoch": 594} {"train_loss": -9.315742492675781, "global_step": 99868, "epoch": 594} {"train_loss": -9.529335975646973, "global_step": 99869, "epoch": 594} {"train_loss": -9.44858169555664, "global_step": 99870, "epoch": 594} {"train_loss": -9.228089332580566, "global_step": 99871, "epoch": 594} {"train_loss": -9.72265911102295, "global_step": 99872, "epoch": 594} {"train_loss": -9.41917610168457, "global_step": 99873, "epoch": 594} {"train_loss": -9.546106338500977, "global_step": 99874, "epoch": 594} {"train_loss": -9.641874313354492, "global_step": 99875, "epoch": 594} {"train_loss": -9.744775772094727, "global_step": 99876, "epoch": 594} {"train_loss": -9.645540237426758, "global_step": 99877, "epoch": 594} {"train_loss": -9.487194061279297, "global_step": 99878, "epoch": 594} {"train_loss": -9.660331726074219, "global_step": 99879, "epoch": 594} {"train_loss": -9.585521697998047, "global_step": 99880, "epoch": 594} {"train_loss": -9.476996421813965, "global_step": 99881, "epoch": 594} {"train_loss": -9.493074417114258, "global_step": 99882, "epoch": 594} {"train_loss": -9.550920486450195, "global_step": 99883, "epoch": 594} {"train_loss": -9.320114135742188, "global_step": 99884, "epoch": 594} {"train_loss": -9.504236221313477, "global_step": 99885, "epoch": 594} {"train_loss": -9.381606101989746, "global_step": 99886, "epoch": 594} {"train_loss": -9.797538757324219, "global_step": 99887, "epoch": 594} {"train_loss": -9.554977416992188, "global_step": 99888, "epoch": 594} {"train_loss": -9.778871536254883, "global_step": 99889, "epoch": 594} {"train_loss": -9.401415824890137, "global_step": 99890, "epoch": 594} {"train_loss": -9.883241653442383, "global_step": 99891, "epoch": 594} {"train_loss": -9.534448623657227, "global_step": 99892, "epoch": 594} {"train_loss": -10.095478057861328, "global_step": 99893, "epoch": 594} {"train_loss": -9.511966705322266, "global_step": 99894, "epoch": 594} {"train_loss": -9.850125312805176, "global_step": 99895, "epoch": 594} {"train_loss": -9.560076713562012, "global_step": 99896, "epoch": 594} {"train_loss": -9.738594055175781, "global_step": 99897, "epoch": 594} {"train_loss": -9.81474494934082, "global_step": 99898, "epoch": 594} {"train_loss": -9.714559555053711, "global_step": 99899, "epoch": 594} {"train_loss": -9.822509765625, "global_step": 99900, "epoch": 594} {"train_loss": -9.985214233398438, "global_step": 99901, "epoch": 594} {"train_loss": -9.948844909667969, "global_step": 99902, "epoch": 594} {"train_loss": -9.82807731628418, "global_step": 99903, "epoch": 594} {"train_loss": -9.80468463897705, "global_step": 99904, "epoch": 594} {"train_loss": -9.920906066894531, "global_step": 99905, "epoch": 594} {"train_loss": -9.82516860961914, "global_step": 99906, "epoch": 594} {"train_loss": -9.919401168823242, "global_step": 99907, "epoch": 594} {"train_loss": -9.642680168151855, "global_step": 99908, "epoch": 594} {"train_loss": -9.600885391235352, "global_step": 99909, "epoch": 594} {"train_loss": -9.694189071655273, "global_step": 99910, "epoch": 594} {"train_loss": -9.852724075317383, "global_step": 99911, "epoch": 594} {"train_loss": -9.591970443725586, "global_step": 99912, "epoch": 594} {"train_loss": -9.913056373596191, "global_step": 99913, "epoch": 594} {"train_loss": -9.817869186401367, "global_step": 99914, "epoch": 594} {"train_loss": -9.699480056762695, "global_step": 99915, "epoch": 594} {"train_loss": -9.999146461486816, "global_step": 99916, "epoch": 594} {"train_loss": -9.855825424194336, "global_step": 99917, "epoch": 594} {"train_loss": -9.758163452148438, "global_step": 99918, "epoch": 594} {"train_loss": -9.737762451171875, "global_step": 99919, "epoch": 594} {"train_loss": -9.73680305480957, "global_step": 99920, "epoch": 594} {"train_loss": -9.720633506774902, "global_step": 99921, "epoch": 594} {"train_loss": -10.102758407592773, "global_step": 99922, "epoch": 594} {"train_loss": -9.875556945800781, "global_step": 99923, "epoch": 594} {"train_loss": -9.667383193969727, "global_step": 99924, "epoch": 594} {"train_loss": -9.605819702148438, "global_step": 99925, "epoch": 594} {"train_loss": -10.011198043823242, "global_step": 99926, "epoch": 594} {"train_loss": -9.722301483154297, "global_step": 99927, "epoch": 594} {"train_loss": -9.89745044708252, "global_step": 99928, "epoch": 594} {"train_loss": -10.001005172729492, "global_step": 99929, "epoch": 594} {"train_loss": -9.757099151611328, "global_step": 99930, "epoch": 594} {"train_loss": -9.884292602539062, "global_step": 99931, "epoch": 594} {"train_loss": -9.966959953308105, "global_step": 99932, "epoch": 594} {"train_loss": -9.779143333435059, "global_step": 99933, "epoch": 594} {"train_loss": -9.825886726379395, "global_step": 99934, "epoch": 594} {"train_loss": -9.798702239990234, "global_step": 99935, "epoch": 594} {"train_loss": -10.033241271972656, "global_step": 99936, "epoch": 594} {"train_loss": -9.834352493286133, "global_step": 99937, "epoch": 594} {"train_loss": -9.556665420532227, "global_step": 99938, "epoch": 594} {"train_loss": -9.701825141906738, "global_step": 99939, "epoch": 594} {"train_loss": -9.883768081665039, "global_step": 99940, "epoch": 594} {"train_loss": -9.037432670593262, "global_step": 99941, "epoch": 594} {"train_loss": -9.851913452148438, "global_step": 99942, "epoch": 594} {"train_loss": -8.357650756835938, "global_step": 99943, "epoch": 594} {"train_loss": -8.576194763183594, "global_step": 99944, "epoch": 594} {"train_loss": -8.161432266235352, "global_step": 99945, "epoch": 594} {"train_loss": -8.936346054077148, "global_step": 99946, "epoch": 594} {"train_loss": -9.146011352539062, "global_step": 99947, "epoch": 594} {"train_loss": -8.494307518005371, "global_step": 99948, "epoch": 594} {"train_loss": -9.220191955566406, "global_step": 99949, "epoch": 594} {"train_loss": -8.688823699951172, "global_step": 99950, "epoch": 594} {"train_loss": -8.694096565246582, "global_step": 99951, "epoch": 594} {"train_loss": -9.134157180786133, "global_step": 99952, "epoch": 594} {"train_loss": -8.852524757385254, "global_step": 99953, "epoch": 594} {"train_loss": -8.509264945983887, "global_step": 99954, "epoch": 594} {"train_loss": -8.643729209899902, "global_step": 99955, "epoch": 594} {"train_loss": -8.930170059204102, "global_step": 99956, "epoch": 594} {"train_loss": -8.962371826171875, "global_step": 99957, "epoch": 594} {"train_loss": -8.863673210144043, "global_step": 99958, "epoch": 594} {"train_loss": -9.553575907434736, "global_step": 99959, "epoch": 594, "val_loss": 200540.859375} {"train_loss": -9.03158950805664, "global_step": 99960, "epoch": 595} {"train_loss": -8.872051239013672, "global_step": 99961, "epoch": 595} {"train_loss": -9.080482482910156, "global_step": 99962, "epoch": 595} {"train_loss": -8.96468734741211, "global_step": 99963, "epoch": 595} {"train_loss": -8.896810531616211, "global_step": 99964, "epoch": 595} {"train_loss": -9.055127143859863, "global_step": 99965, "epoch": 595} {"train_loss": -9.044422149658203, "global_step": 99966, "epoch": 595} {"train_loss": -8.897900581359863, "global_step": 99967, "epoch": 595} {"train_loss": -9.093526840209961, "global_step": 99968, "epoch": 595} {"train_loss": -9.34973430633545, "global_step": 99969, "epoch": 595} {"train_loss": -9.277338027954102, "global_step": 99970, "epoch": 595} {"train_loss": -9.19449234008789, "global_step": 99971, "epoch": 595} {"train_loss": -9.335561752319336, "global_step": 99972, "epoch": 595} {"train_loss": -9.233675003051758, "global_step": 99973, "epoch": 595} {"train_loss": -9.271415710449219, "global_step": 99974, "epoch": 595} {"train_loss": -9.228507995605469, "global_step": 99975, "epoch": 595} {"train_loss": -9.305442810058594, "global_step": 99976, "epoch": 595} {"train_loss": -9.101713180541992, "global_step": 99977, "epoch": 595} {"train_loss": -9.489774703979492, "global_step": 99978, "epoch": 595} {"train_loss": -9.3607816696167, "global_step": 99979, "epoch": 595} {"train_loss": -9.585784912109375, "global_step": 99980, "epoch": 595} {"train_loss": -9.494659423828125, "global_step": 99981, "epoch": 595} {"train_loss": -9.543238639831543, "global_step": 99982, "epoch": 595} {"train_loss": -9.781850814819336, "global_step": 99983, "epoch": 595} {"train_loss": -9.380181312561035, "global_step": 99984, "epoch": 595} {"train_loss": -9.781396865844727, "global_step": 99985, "epoch": 595} {"train_loss": -9.688909530639648, "global_step": 99986, "epoch": 595} {"train_loss": -9.703506469726562, "global_step": 99987, "epoch": 595} {"train_loss": -9.628833770751953, "global_step": 99988, "epoch": 595} {"train_loss": -9.930980682373047, "global_step": 99989, "epoch": 595} {"train_loss": -9.734878540039062, "global_step": 99990, "epoch": 595} {"train_loss": -9.704880714416504, "global_step": 99991, "epoch": 595} {"train_loss": -9.641576766967773, "global_step": 99992, "epoch": 595} {"train_loss": -9.863786697387695, "global_step": 99993, "epoch": 595} {"train_loss": -9.836578369140625, "global_step": 99994, "epoch": 595} {"train_loss": -9.818451881408691, "global_step": 99995, "epoch": 595} {"train_loss": -10.050821304321289, "global_step": 99996, "epoch": 595} {"train_loss": -9.868003845214844, "global_step": 99997, "epoch": 595} {"train_loss": -9.968530654907227, "global_step": 99998, "epoch": 595} {"train_loss": -9.958325386047363, "global_step": 99999, "epoch": 595} {"train_loss": -9.695853233337402, "global_step": 100000, "epoch": 595} {"train_loss": -9.989420890808105, "global_step": 100001, "epoch": 595} {"train_loss": -9.933928489685059, "global_step": 100002, "epoch": 595} {"train_loss": -9.887723922729492, "global_step": 100003, "epoch": 595} {"train_loss": -10.19882869720459, "global_step": 100004, "epoch": 595} {"train_loss": -9.786591529846191, "global_step": 100005, "epoch": 595} {"train_loss": -9.930787086486816, "global_step": 100006, "epoch": 595} {"train_loss": -9.91451358795166, "global_step": 100007, "epoch": 595} {"train_loss": -9.617074012756348, "global_step": 100008, "epoch": 595} {"train_loss": -9.802081108093262, "global_step": 100009, "epoch": 595} {"train_loss": -9.817495346069336, "global_step": 100010, "epoch": 595} {"train_loss": -9.835769653320312, "global_step": 100011, "epoch": 595} {"train_loss": -9.86955451965332, "global_step": 100012, "epoch": 595} {"train_loss": -9.746304512023926, "global_step": 100013, "epoch": 595} {"train_loss": -9.634003639221191, "global_step": 100014, "epoch": 595} {"train_loss": -9.48448371887207, "global_step": 100015, "epoch": 595} {"train_loss": -10.11330795288086, "global_step": 100016, "epoch": 595} {"train_loss": -9.859936714172363, "global_step": 100017, "epoch": 595} {"train_loss": -9.856796264648438, "global_step": 100018, "epoch": 595} {"train_loss": -9.716513633728027, "global_step": 100019, "epoch": 595} {"train_loss": -9.583710670471191, "global_step": 100020, "epoch": 595} {"train_loss": -9.763815879821777, "global_step": 100021, "epoch": 595} {"train_loss": -9.537111282348633, "global_step": 100022, "epoch": 595} {"train_loss": -9.923312187194824, "global_step": 100023, "epoch": 595} {"train_loss": -9.756853103637695, "global_step": 100024, "epoch": 595} {"train_loss": -9.611227035522461, "global_step": 100025, "epoch": 595} {"train_loss": -9.713025093078613, "global_step": 100026, "epoch": 595} {"train_loss": -9.402840614318848, "global_step": 100027, "epoch": 595} {"train_loss": -8.947181701660156, "global_step": 100028, "epoch": 595} {"train_loss": -9.843305587768555, "global_step": 100029, "epoch": 595} {"train_loss": -9.356216430664062, "global_step": 100030, "epoch": 595} {"train_loss": -9.680356979370117, "global_step": 100031, "epoch": 595} {"train_loss": -9.48170280456543, "global_step": 100032, "epoch": 595} {"train_loss": -9.49130630493164, "global_step": 100033, "epoch": 595} {"train_loss": -9.655922889709473, "global_step": 100034, "epoch": 595} {"train_loss": -9.38305950164795, "global_step": 100035, "epoch": 595} {"train_loss": -9.754752159118652, "global_step": 100036, "epoch": 595} {"train_loss": -9.521417617797852, "global_step": 100037, "epoch": 595} {"train_loss": -9.530920028686523, "global_step": 100038, "epoch": 595} {"train_loss": -9.775754928588867, "global_step": 100039, "epoch": 595} {"train_loss": -9.746084213256836, "global_step": 100040, "epoch": 595} {"train_loss": -9.759096145629883, "global_step": 100041, "epoch": 595} {"train_loss": -9.631376266479492, "global_step": 100042, "epoch": 595} {"train_loss": -9.538999557495117, "global_step": 100043, "epoch": 595} {"train_loss": -9.3045015335083, "global_step": 100044, "epoch": 595} {"train_loss": -9.366931915283203, "global_step": 100045, "epoch": 595} {"train_loss": -9.79341983795166, "global_step": 100046, "epoch": 595} {"train_loss": -9.487631797790527, "global_step": 100047, "epoch": 595} {"train_loss": -9.810792922973633, "global_step": 100048, "epoch": 595} {"train_loss": -9.873941421508789, "global_step": 100049, "epoch": 595} {"train_loss": -9.612079620361328, "global_step": 100050, "epoch": 595} {"train_loss": -9.923583030700684, "global_step": 100051, "epoch": 595} {"train_loss": -9.646524429321289, "global_step": 100052, "epoch": 595} {"train_loss": -9.402442932128906, "global_step": 100053, "epoch": 595} {"train_loss": -9.74891471862793, "global_step": 100054, "epoch": 595} {"train_loss": -9.769296646118164, "global_step": 100055, "epoch": 595} {"train_loss": -9.565979957580566, "global_step": 100056, "epoch": 595} {"train_loss": -9.871747970581055, "global_step": 100057, "epoch": 595} {"train_loss": -9.437772750854492, "global_step": 100058, "epoch": 595} {"train_loss": -9.751941680908203, "global_step": 100059, "epoch": 595} {"train_loss": -9.934197425842285, "global_step": 100060, "epoch": 595} {"train_loss": -9.445945739746094, "global_step": 100061, "epoch": 595} {"train_loss": -9.453828811645508, "global_step": 100062, "epoch": 595} {"train_loss": -9.475521087646484, "global_step": 100063, "epoch": 595} {"train_loss": -9.467334747314453, "global_step": 100064, "epoch": 595} {"train_loss": -9.597750663757324, "global_step": 100065, "epoch": 595} {"train_loss": -9.671965599060059, "global_step": 100066, "epoch": 595} {"train_loss": -9.350298881530762, "global_step": 100067, "epoch": 595} {"train_loss": -9.240360260009766, "global_step": 100068, "epoch": 595} {"train_loss": -9.657941818237305, "global_step": 100069, "epoch": 595} {"train_loss": -9.180933952331543, "global_step": 100070, "epoch": 595} {"train_loss": -9.682861328125, "global_step": 100071, "epoch": 595} {"train_loss": -9.616117477416992, "global_step": 100072, "epoch": 595} {"train_loss": -9.351848602294922, "global_step": 100073, "epoch": 595} {"train_loss": -9.602348327636719, "global_step": 100074, "epoch": 595} {"train_loss": -9.707193374633789, "global_step": 100075, "epoch": 595} {"train_loss": -9.382493019104004, "global_step": 100076, "epoch": 595} {"train_loss": -9.189401626586914, "global_step": 100077, "epoch": 595} {"train_loss": -9.728151321411133, "global_step": 100078, "epoch": 595} {"train_loss": -9.063684463500977, "global_step": 100079, "epoch": 595} {"train_loss": -9.537578582763672, "global_step": 100080, "epoch": 595} {"train_loss": -9.180338859558105, "global_step": 100081, "epoch": 595} {"train_loss": -9.55129623413086, "global_step": 100082, "epoch": 595} {"train_loss": -9.62660026550293, "global_step": 100083, "epoch": 595} {"train_loss": -9.357792854309082, "global_step": 100084, "epoch": 595} {"train_loss": -9.582741737365723, "global_step": 100085, "epoch": 595} {"train_loss": -9.66714859008789, "global_step": 100086, "epoch": 595} {"train_loss": -9.531942367553711, "global_step": 100087, "epoch": 595} {"train_loss": -9.653589248657227, "global_step": 100088, "epoch": 595} {"train_loss": -9.524965286254883, "global_step": 100089, "epoch": 595} {"train_loss": -9.648855209350586, "global_step": 100090, "epoch": 595} {"train_loss": -9.633261680603027, "global_step": 100091, "epoch": 595} {"train_loss": -9.764183044433594, "global_step": 100092, "epoch": 595} {"train_loss": -9.531615257263184, "global_step": 100093, "epoch": 595} {"train_loss": -9.630852699279785, "global_step": 100094, "epoch": 595} {"train_loss": -9.810644149780273, "global_step": 100095, "epoch": 595} {"train_loss": -9.519976615905762, "global_step": 100096, "epoch": 595} {"train_loss": -9.906706809997559, "global_step": 100097, "epoch": 595} {"train_loss": -9.733083724975586, "global_step": 100098, "epoch": 595} {"train_loss": -9.781454086303711, "global_step": 100099, "epoch": 595} {"train_loss": -9.850055694580078, "global_step": 100100, "epoch": 595} {"train_loss": -9.934624671936035, "global_step": 100101, "epoch": 595} {"train_loss": -9.85342025756836, "global_step": 100102, "epoch": 595} {"train_loss": -9.801212310791016, "global_step": 100103, "epoch": 595} {"train_loss": -9.665022850036621, "global_step": 100104, "epoch": 595} {"train_loss": -9.399736404418945, "global_step": 100105, "epoch": 595} {"train_loss": -9.558115005493164, "global_step": 100106, "epoch": 595} {"train_loss": -9.895602226257324, "global_step": 100107, "epoch": 595} {"train_loss": -9.804774284362793, "global_step": 100108, "epoch": 595} {"train_loss": -10.00890827178955, "global_step": 100109, "epoch": 595} {"train_loss": -9.694886207580566, "global_step": 100110, "epoch": 595} {"train_loss": -9.722772598266602, "global_step": 100111, "epoch": 595} {"train_loss": -9.901782989501953, "global_step": 100112, "epoch": 595} {"train_loss": -9.602901458740234, "global_step": 100113, "epoch": 595} {"train_loss": -9.799762725830078, "global_step": 100114, "epoch": 595} {"train_loss": -9.912220001220703, "global_step": 100115, "epoch": 595} {"train_loss": -9.292991638183594, "global_step": 100116, "epoch": 595} {"train_loss": -9.617849349975586, "global_step": 100117, "epoch": 595} {"train_loss": -9.404657363891602, "global_step": 100118, "epoch": 595} {"train_loss": -9.4576416015625, "global_step": 100119, "epoch": 595} {"train_loss": -9.5025053024292, "global_step": 100120, "epoch": 595} {"train_loss": -10.051050186157227, "global_step": 100121, "epoch": 595} {"train_loss": -9.547396659851074, "global_step": 100122, "epoch": 595} {"train_loss": -9.911102294921875, "global_step": 100123, "epoch": 595} {"train_loss": -9.549478530883789, "global_step": 100124, "epoch": 595} {"train_loss": -9.418418884277344, "global_step": 100125, "epoch": 595} {"train_loss": -9.815153121948242, "global_step": 100126, "epoch": 595} {"train_loss": -9.602806897390456, "global_step": 100127, "epoch": 595, "val_loss": 206038.03125, "train_action_mse_error": 2.489795207977295} {"train_loss": -9.860857009887695, "global_step": 100128, "epoch": 596} {"train_loss": -9.601705551147461, "global_step": 100129, "epoch": 596} {"train_loss": -9.802536010742188, "global_step": 100130, "epoch": 596} {"train_loss": -9.605103492736816, "global_step": 100131, "epoch": 596} {"train_loss": -9.50615119934082, "global_step": 100132, "epoch": 596} {"train_loss": -9.511238098144531, "global_step": 100133, "epoch": 596} {"train_loss": -9.423362731933594, "global_step": 100134, "epoch": 596} {"train_loss": -9.529450416564941, "global_step": 100135, "epoch": 596} {"train_loss": -9.851475715637207, "global_step": 100136, "epoch": 596} {"train_loss": -9.442926406860352, "global_step": 100137, "epoch": 596} {"train_loss": -9.627153396606445, "global_step": 100138, "epoch": 596} {"train_loss": -9.735618591308594, "global_step": 100139, "epoch": 596} {"train_loss": -9.197542190551758, "global_step": 100140, "epoch": 596} {"train_loss": -9.813142776489258, "global_step": 100141, "epoch": 596} {"train_loss": -9.187671661376953, "global_step": 100142, "epoch": 596} {"train_loss": -9.601396560668945, "global_step": 100143, "epoch": 596} {"train_loss": -9.58845329284668, "global_step": 100144, "epoch": 596} {"train_loss": -10.009510040283203, "global_step": 100145, "epoch": 596} {"train_loss": -9.68100357055664, "global_step": 100146, "epoch": 596} {"train_loss": -9.872528076171875, "global_step": 100147, "epoch": 596} {"train_loss": -9.553643226623535, "global_step": 100148, "epoch": 596} {"train_loss": -9.678956031799316, "global_step": 100149, "epoch": 596} {"train_loss": -9.911946296691895, "global_step": 100150, "epoch": 596} {"train_loss": -9.739423751831055, "global_step": 100151, "epoch": 596} {"train_loss": -9.524352073669434, "global_step": 100152, "epoch": 596} {"train_loss": -9.675569534301758, "global_step": 100153, "epoch": 596} {"train_loss": -9.94778823852539, "global_step": 100154, "epoch": 596} {"train_loss": -9.669050216674805, "global_step": 100155, "epoch": 596} {"train_loss": -9.881997108459473, "global_step": 100156, "epoch": 596} {"train_loss": -9.676397323608398, "global_step": 100157, "epoch": 596} {"train_loss": -9.806243896484375, "global_step": 100158, "epoch": 596} {"train_loss": -9.962067604064941, "global_step": 100159, "epoch": 596} {"train_loss": -9.881402015686035, "global_step": 100160, "epoch": 596} {"train_loss": -9.806474685668945, "global_step": 100161, "epoch": 596} {"train_loss": -9.975987434387207, "global_step": 100162, "epoch": 596} {"train_loss": -9.761286735534668, "global_step": 100163, "epoch": 596} {"train_loss": -9.890511512756348, "global_step": 100164, "epoch": 596} {"train_loss": -9.672761917114258, "global_step": 100165, "epoch": 596} {"train_loss": -9.825761795043945, "global_step": 100166, "epoch": 596} {"train_loss": -9.53154182434082, "global_step": 100167, "epoch": 596} {"train_loss": -9.719449996948242, "global_step": 100168, "epoch": 596} {"train_loss": -9.74492073059082, "global_step": 100169, "epoch": 596} {"train_loss": -9.911630630493164, "global_step": 100170, "epoch": 596} {"train_loss": -9.686260223388672, "global_step": 100171, "epoch": 596} {"train_loss": -9.87344741821289, "global_step": 100172, "epoch": 596} {"train_loss": -9.408149719238281, "global_step": 100173, "epoch": 596} {"train_loss": -9.518900871276855, "global_step": 100174, "epoch": 596} {"train_loss": -9.618106842041016, "global_step": 100175, "epoch": 596} {"train_loss": -9.483930587768555, "global_step": 100176, "epoch": 596} {"train_loss": -9.70058536529541, "global_step": 100177, "epoch": 596} {"train_loss": -9.399709701538086, "global_step": 100178, "epoch": 596} {"train_loss": -9.783370971679688, "global_step": 100179, "epoch": 596} {"train_loss": -9.384026527404785, "global_step": 100180, "epoch": 596} {"train_loss": -9.628395080566406, "global_step": 100181, "epoch": 596} {"train_loss": -9.222000122070312, "global_step": 100182, "epoch": 596} {"train_loss": -9.820716857910156, "global_step": 100183, "epoch": 596} {"train_loss": -9.274192810058594, "global_step": 100184, "epoch": 596} {"train_loss": -9.689517974853516, "global_step": 100185, "epoch": 596} {"train_loss": -9.365974426269531, "global_step": 100186, "epoch": 596} {"train_loss": -9.681660652160645, "global_step": 100187, "epoch": 596} {"train_loss": -9.731948852539062, "global_step": 100188, "epoch": 596} {"train_loss": -9.52955436706543, "global_step": 100189, "epoch": 596} {"train_loss": -9.734272956848145, "global_step": 100190, "epoch": 596} {"train_loss": -9.896075248718262, "global_step": 100191, "epoch": 596} {"train_loss": -9.609073638916016, "global_step": 100192, "epoch": 596} {"train_loss": -9.926226615905762, "global_step": 100193, "epoch": 596} {"train_loss": -9.787337303161621, "global_step": 100194, "epoch": 596} {"train_loss": -9.64525318145752, "global_step": 100195, "epoch": 596} {"train_loss": -9.670076370239258, "global_step": 100196, "epoch": 596} {"train_loss": -9.552650451660156, "global_step": 100197, "epoch": 596} {"train_loss": -9.761899948120117, "global_step": 100198, "epoch": 596} {"train_loss": -9.643476486206055, "global_step": 100199, "epoch": 596} {"train_loss": -9.751900672912598, "global_step": 100200, "epoch": 596} {"train_loss": -9.899666786193848, "global_step": 100201, "epoch": 596} {"train_loss": -9.950272560119629, "global_step": 100202, "epoch": 596} {"train_loss": -9.695262908935547, "global_step": 100203, "epoch": 596} {"train_loss": -9.853462219238281, "global_step": 100204, "epoch": 596} {"train_loss": -9.6768217086792, "global_step": 100205, "epoch": 596} {"train_loss": -9.820980072021484, "global_step": 100206, "epoch": 596} {"train_loss": -9.581424713134766, "global_step": 100207, "epoch": 596} {"train_loss": -9.611141204833984, "global_step": 100208, "epoch": 596} {"train_loss": -9.274847030639648, "global_step": 100209, "epoch": 596} {"train_loss": -9.75770092010498, "global_step": 100210, "epoch": 596} {"train_loss": -9.408401489257812, "global_step": 100211, "epoch": 596} {"train_loss": -9.301931381225586, "global_step": 100212, "epoch": 596} {"train_loss": -9.252605438232422, "global_step": 100213, "epoch": 596} {"train_loss": -9.217863082885742, "global_step": 100214, "epoch": 596} {"train_loss": -9.592130661010742, "global_step": 100215, "epoch": 596} {"train_loss": -8.894606590270996, "global_step": 100216, "epoch": 596} {"train_loss": -9.056519508361816, "global_step": 100217, "epoch": 596} {"train_loss": -9.360157012939453, "global_step": 100218, "epoch": 596} {"train_loss": -9.493865013122559, "global_step": 100219, "epoch": 596} {"train_loss": -9.426895141601562, "global_step": 100220, "epoch": 596} {"train_loss": -9.47828197479248, "global_step": 100221, "epoch": 596} {"train_loss": -9.91666030883789, "global_step": 100222, "epoch": 596} {"train_loss": -9.42739486694336, "global_step": 100223, "epoch": 596} {"train_loss": -9.79902458190918, "global_step": 100224, "epoch": 596} {"train_loss": -9.263961791992188, "global_step": 100225, "epoch": 596} {"train_loss": -9.876618385314941, "global_step": 100226, "epoch": 596} {"train_loss": -9.636707305908203, "global_step": 100227, "epoch": 596} {"train_loss": -9.473179817199707, "global_step": 100228, "epoch": 596} {"train_loss": -9.598519325256348, "global_step": 100229, "epoch": 596} {"train_loss": -9.552753448486328, "global_step": 100230, "epoch": 596} {"train_loss": -9.71546459197998, "global_step": 100231, "epoch": 596} {"train_loss": -9.578875541687012, "global_step": 100232, "epoch": 596} {"train_loss": -9.671098709106445, "global_step": 100233, "epoch": 596} {"train_loss": -9.670215606689453, "global_step": 100234, "epoch": 596} {"train_loss": -9.681007385253906, "global_step": 100235, "epoch": 596} {"train_loss": -9.744954109191895, "global_step": 100236, "epoch": 596} {"train_loss": -9.726892471313477, "global_step": 100237, "epoch": 596} {"train_loss": -9.819952011108398, "global_step": 100238, "epoch": 596} {"train_loss": -9.634510040283203, "global_step": 100239, "epoch": 596} {"train_loss": -9.849525451660156, "global_step": 100240, "epoch": 596} {"train_loss": -9.886873245239258, "global_step": 100241, "epoch": 596} {"train_loss": -9.67313003540039, "global_step": 100242, "epoch": 596} {"train_loss": -9.721435546875, "global_step": 100243, "epoch": 596} {"train_loss": -9.915135383605957, "global_step": 100244, "epoch": 596} {"train_loss": -9.757997512817383, "global_step": 100245, "epoch": 596} {"train_loss": -9.922809600830078, "global_step": 100246, "epoch": 596} {"train_loss": -9.91190242767334, "global_step": 100247, "epoch": 596} {"train_loss": -10.005578994750977, "global_step": 100248, "epoch": 596} {"train_loss": -9.81112289428711, "global_step": 100249, "epoch": 596} {"train_loss": -9.770612716674805, "global_step": 100250, "epoch": 596} {"train_loss": -9.716279983520508, "global_step": 100251, "epoch": 596} {"train_loss": -9.873929977416992, "global_step": 100252, "epoch": 596} {"train_loss": -9.677314758300781, "global_step": 100253, "epoch": 596} {"train_loss": -9.611496925354004, "global_step": 100254, "epoch": 596} {"train_loss": -9.37852668762207, "global_step": 100255, "epoch": 596} {"train_loss": -9.487981796264648, "global_step": 100256, "epoch": 596} {"train_loss": -9.741949081420898, "global_step": 100257, "epoch": 596} {"train_loss": -9.471380233764648, "global_step": 100258, "epoch": 596} {"train_loss": -9.509479522705078, "global_step": 100259, "epoch": 596} {"train_loss": -9.155214309692383, "global_step": 100260, "epoch": 596} {"train_loss": -9.729576110839844, "global_step": 100261, "epoch": 596} {"train_loss": -9.554570198059082, "global_step": 100262, "epoch": 596} {"train_loss": -9.32337760925293, "global_step": 100263, "epoch": 596} {"train_loss": -9.46406364440918, "global_step": 100264, "epoch": 596} {"train_loss": -9.284961700439453, "global_step": 100265, "epoch": 596} {"train_loss": -9.337846755981445, "global_step": 100266, "epoch": 596} {"train_loss": -9.27753734588623, "global_step": 100267, "epoch": 596} {"train_loss": -9.367910385131836, "global_step": 100268, "epoch": 596} {"train_loss": -9.572200775146484, "global_step": 100269, "epoch": 596} {"train_loss": -9.592121124267578, "global_step": 100270, "epoch": 596} {"train_loss": -9.626322746276855, "global_step": 100271, "epoch": 596} {"train_loss": -9.472623825073242, "global_step": 100272, "epoch": 596} {"train_loss": -9.585328102111816, "global_step": 100273, "epoch": 596} {"train_loss": -9.520025253295898, "global_step": 100274, "epoch": 596} {"train_loss": -9.701972961425781, "global_step": 100275, "epoch": 596} {"train_loss": -9.569503784179688, "global_step": 100276, "epoch": 596} {"train_loss": -9.913664817810059, "global_step": 100277, "epoch": 596} {"train_loss": -9.812376022338867, "global_step": 100278, "epoch": 596} {"train_loss": -9.687650680541992, "global_step": 100279, "epoch": 596} {"train_loss": -9.675626754760742, "global_step": 100280, "epoch": 596} {"train_loss": -9.648689270019531, "global_step": 100281, "epoch": 596} {"train_loss": -9.714034080505371, "global_step": 100282, "epoch": 596} {"train_loss": -9.645015716552734, "global_step": 100283, "epoch": 596} {"train_loss": -9.80567741394043, "global_step": 100284, "epoch": 596} {"train_loss": -9.71388053894043, "global_step": 100285, "epoch": 596} {"train_loss": -9.81128215789795, "global_step": 100286, "epoch": 596} {"train_loss": -9.602781295776367, "global_step": 100287, "epoch": 596} {"train_loss": -9.731382369995117, "global_step": 100288, "epoch": 596} {"train_loss": -9.704765319824219, "global_step": 100289, "epoch": 596} {"train_loss": -9.776060104370117, "global_step": 100290, "epoch": 596} {"train_loss": -9.701268196105957, "global_step": 100291, "epoch": 596} {"train_loss": -9.54686164855957, "global_step": 100292, "epoch": 596} {"train_loss": -9.773971557617188, "global_step": 100293, "epoch": 596} {"train_loss": -9.75942611694336, "global_step": 100294, "epoch": 596} {"train_loss": -9.64341138090406, "global_step": 100295, "epoch": 596, "val_loss": 206243.171875} {"train_loss": -9.618532180786133, "global_step": 100296, "epoch": 597} {"train_loss": -9.683637619018555, "global_step": 100297, "epoch": 597} {"train_loss": -9.7628755569458, "global_step": 100298, "epoch": 597} {"train_loss": -9.418333053588867, "global_step": 100299, "epoch": 597} {"train_loss": -9.213215827941895, "global_step": 100300, "epoch": 597} {"train_loss": -9.814318656921387, "global_step": 100301, "epoch": 597} {"train_loss": -9.55429458618164, "global_step": 100302, "epoch": 597} {"train_loss": -9.423664093017578, "global_step": 100303, "epoch": 597} {"train_loss": -9.66181468963623, "global_step": 100304, "epoch": 597} {"train_loss": -9.367918014526367, "global_step": 100305, "epoch": 597} {"train_loss": -9.677574157714844, "global_step": 100306, "epoch": 597} {"train_loss": -9.795633316040039, "global_step": 100307, "epoch": 597} {"train_loss": -9.881887435913086, "global_step": 100308, "epoch": 597} {"train_loss": -9.61491584777832, "global_step": 100309, "epoch": 597} {"train_loss": -9.707082748413086, "global_step": 100310, "epoch": 597} {"train_loss": -9.64972972869873, "global_step": 100311, "epoch": 597} {"train_loss": -9.275339126586914, "global_step": 100312, "epoch": 597} {"train_loss": -9.848260879516602, "global_step": 100313, "epoch": 597} {"train_loss": -9.764233589172363, "global_step": 100314, "epoch": 597} {"train_loss": -9.61252498626709, "global_step": 100315, "epoch": 597} {"train_loss": -9.59941577911377, "global_step": 100316, "epoch": 597} {"train_loss": -9.690042495727539, "global_step": 100317, "epoch": 597} {"train_loss": -9.686610221862793, "global_step": 100318, "epoch": 597} {"train_loss": -9.819133758544922, "global_step": 100319, "epoch": 597} {"train_loss": -9.79887580871582, "global_step": 100320, "epoch": 597} {"train_loss": -9.705831527709961, "global_step": 100321, "epoch": 597} {"train_loss": -9.882807731628418, "global_step": 100322, "epoch": 597} {"train_loss": -9.525991439819336, "global_step": 100323, "epoch": 597} {"train_loss": -9.558106422424316, "global_step": 100324, "epoch": 597} {"train_loss": -9.979394912719727, "global_step": 100325, "epoch": 597} {"train_loss": -9.436728477478027, "global_step": 100326, "epoch": 597} {"train_loss": -9.517108917236328, "global_step": 100327, "epoch": 597} {"train_loss": -9.765472412109375, "global_step": 100328, "epoch": 597} {"train_loss": -9.552188873291016, "global_step": 100329, "epoch": 597} {"train_loss": -9.8011474609375, "global_step": 100330, "epoch": 597} {"train_loss": -9.739619255065918, "global_step": 100331, "epoch": 597} {"train_loss": -9.90890121459961, "global_step": 100332, "epoch": 597} {"train_loss": -9.752344131469727, "global_step": 100333, "epoch": 597} {"train_loss": -9.906675338745117, "global_step": 100334, "epoch": 597} {"train_loss": -10.038627624511719, "global_step": 100335, "epoch": 597} {"train_loss": -9.913825988769531, "global_step": 100336, "epoch": 597} {"train_loss": -10.035154342651367, "global_step": 100337, "epoch": 597} {"train_loss": -9.912723541259766, "global_step": 100338, "epoch": 597} {"train_loss": -9.481168746948242, "global_step": 100339, "epoch": 597} {"train_loss": -9.938404083251953, "global_step": 100340, "epoch": 597} {"train_loss": -9.759218215942383, "global_step": 100341, "epoch": 597} {"train_loss": -10.028264999389648, "global_step": 100342, "epoch": 597} {"train_loss": -9.798937797546387, "global_step": 100343, "epoch": 597} {"train_loss": -9.87586784362793, "global_step": 100344, "epoch": 597} {"train_loss": -10.096574783325195, "global_step": 100345, "epoch": 597} {"train_loss": -9.97204303741455, "global_step": 100346, "epoch": 597} {"train_loss": -9.668074607849121, "global_step": 100347, "epoch": 597} {"train_loss": -9.638171195983887, "global_step": 100348, "epoch": 597} {"train_loss": -9.82016372680664, "global_step": 100349, "epoch": 597} {"train_loss": -9.756539344787598, "global_step": 100350, "epoch": 597} {"train_loss": -9.96911334991455, "global_step": 100351, "epoch": 597} {"train_loss": -9.551508903503418, "global_step": 100352, "epoch": 597} {"train_loss": -9.635641098022461, "global_step": 100353, "epoch": 597} {"train_loss": -9.819482803344727, "global_step": 100354, "epoch": 597} {"train_loss": -9.594011306762695, "global_step": 100355, "epoch": 597} {"train_loss": -9.581902503967285, "global_step": 100356, "epoch": 597} {"train_loss": -9.97813606262207, "global_step": 100357, "epoch": 597} {"train_loss": -9.610422134399414, "global_step": 100358, "epoch": 597} {"train_loss": -9.817875862121582, "global_step": 100359, "epoch": 597} {"train_loss": -9.765727996826172, "global_step": 100360, "epoch": 597} {"train_loss": -9.37076187133789, "global_step": 100361, "epoch": 597} {"train_loss": -9.645262718200684, "global_step": 100362, "epoch": 597} {"train_loss": -9.639412879943848, "global_step": 100363, "epoch": 597} {"train_loss": -9.426395416259766, "global_step": 100364, "epoch": 597} {"train_loss": -9.614004135131836, "global_step": 100365, "epoch": 597} {"train_loss": -9.339134216308594, "global_step": 100366, "epoch": 597} {"train_loss": -9.226846694946289, "global_step": 100367, "epoch": 597} {"train_loss": -9.662284851074219, "global_step": 100368, "epoch": 597} {"train_loss": -9.219321250915527, "global_step": 100369, "epoch": 597} {"train_loss": -9.482759475708008, "global_step": 100370, "epoch": 597} {"train_loss": -9.468088150024414, "global_step": 100371, "epoch": 597} {"train_loss": -9.238374710083008, "global_step": 100372, "epoch": 597} {"train_loss": -9.799448013305664, "global_step": 100373, "epoch": 597} {"train_loss": -9.397409439086914, "global_step": 100374, "epoch": 597} {"train_loss": -9.54939079284668, "global_step": 100375, "epoch": 597} {"train_loss": -9.693601608276367, "global_step": 100376, "epoch": 597} {"train_loss": -9.722282409667969, "global_step": 100377, "epoch": 597} {"train_loss": -9.588705062866211, "global_step": 100378, "epoch": 597} {"train_loss": -9.679533958435059, "global_step": 100379, "epoch": 597} {"train_loss": -9.582510948181152, "global_step": 100380, "epoch": 597} {"train_loss": -9.734481811523438, "global_step": 100381, "epoch": 597} {"train_loss": -9.706851959228516, "global_step": 100382, "epoch": 597} {"train_loss": -10.063523292541504, "global_step": 100383, "epoch": 597} {"train_loss": -9.463722229003906, "global_step": 100384, "epoch": 597} {"train_loss": -9.817222595214844, "global_step": 100385, "epoch": 597} {"train_loss": -9.739737510681152, "global_step": 100386, "epoch": 597} {"train_loss": -9.683273315429688, "global_step": 100387, "epoch": 597} {"train_loss": -9.864463806152344, "global_step": 100388, "epoch": 597} {"train_loss": -9.431535720825195, "global_step": 100389, "epoch": 597} {"train_loss": -9.794299125671387, "global_step": 100390, "epoch": 597} {"train_loss": -9.713229179382324, "global_step": 100391, "epoch": 597} {"train_loss": -9.727094650268555, "global_step": 100392, "epoch": 597} {"train_loss": -9.673507690429688, "global_step": 100393, "epoch": 597} {"train_loss": -9.503860473632812, "global_step": 100394, "epoch": 597} {"train_loss": -9.754780769348145, "global_step": 100395, "epoch": 597} {"train_loss": -9.57132339477539, "global_step": 100396, "epoch": 597} {"train_loss": -9.775163650512695, "global_step": 100397, "epoch": 597} {"train_loss": -9.52243423461914, "global_step": 100398, "epoch": 597} {"train_loss": -9.538905143737793, "global_step": 100399, "epoch": 597} {"train_loss": -9.565471649169922, "global_step": 100400, "epoch": 597} {"train_loss": -9.573729515075684, "global_step": 100401, "epoch": 597} {"train_loss": -9.654613494873047, "global_step": 100402, "epoch": 597} {"train_loss": -9.750008583068848, "global_step": 100403, "epoch": 597} {"train_loss": -9.36990737915039, "global_step": 100404, "epoch": 597} {"train_loss": -9.686237335205078, "global_step": 100405, "epoch": 597} {"train_loss": -9.957569122314453, "global_step": 100406, "epoch": 597} {"train_loss": -9.59414005279541, "global_step": 100407, "epoch": 597} {"train_loss": -9.85169792175293, "global_step": 100408, "epoch": 597} {"train_loss": -9.550262451171875, "global_step": 100409, "epoch": 597} {"train_loss": -9.620567321777344, "global_step": 100410, "epoch": 597} {"train_loss": -9.487531661987305, "global_step": 100411, "epoch": 597} {"train_loss": -9.641430854797363, "global_step": 100412, "epoch": 597} {"train_loss": -9.84823989868164, "global_step": 100413, "epoch": 597} {"train_loss": -9.517791748046875, "global_step": 100414, "epoch": 597} {"train_loss": -9.5296630859375, "global_step": 100415, "epoch": 597} {"train_loss": -9.989303588867188, "global_step": 100416, "epoch": 597} {"train_loss": -9.387245178222656, "global_step": 100417, "epoch": 597} {"train_loss": -9.82638168334961, "global_step": 100418, "epoch": 597} {"train_loss": -9.778735160827637, "global_step": 100419, "epoch": 597} {"train_loss": -9.716377258300781, "global_step": 100420, "epoch": 597} {"train_loss": -9.611481666564941, "global_step": 100421, "epoch": 597} {"train_loss": -9.66474723815918, "global_step": 100422, "epoch": 597} {"train_loss": -9.847516059875488, "global_step": 100423, "epoch": 597} {"train_loss": -9.632291793823242, "global_step": 100424, "epoch": 597} {"train_loss": -10.008047103881836, "global_step": 100425, "epoch": 597} {"train_loss": -9.687146186828613, "global_step": 100426, "epoch": 597} {"train_loss": -9.86819076538086, "global_step": 100427, "epoch": 597} {"train_loss": -9.486068725585938, "global_step": 100428, "epoch": 597} {"train_loss": -9.708958625793457, "global_step": 100429, "epoch": 597} {"train_loss": -9.754398345947266, "global_step": 100430, "epoch": 597} {"train_loss": -9.832630157470703, "global_step": 100431, "epoch": 597} {"train_loss": -9.799060821533203, "global_step": 100432, "epoch": 597} {"train_loss": -9.962469100952148, "global_step": 100433, "epoch": 597} {"train_loss": -9.787227630615234, "global_step": 100434, "epoch": 597} {"train_loss": -10.16092300415039, "global_step": 100435, "epoch": 597} {"train_loss": -9.847173690795898, "global_step": 100436, "epoch": 597} {"train_loss": -9.776100158691406, "global_step": 100437, "epoch": 597} {"train_loss": -9.840287208557129, "global_step": 100438, "epoch": 597} {"train_loss": -9.905717849731445, "global_step": 100439, "epoch": 597} {"train_loss": -9.872627258300781, "global_step": 100440, "epoch": 597} {"train_loss": -9.95380687713623, "global_step": 100441, "epoch": 597} {"train_loss": -9.750251770019531, "global_step": 100442, "epoch": 597} {"train_loss": -10.032217979431152, "global_step": 100443, "epoch": 597} {"train_loss": -9.546368598937988, "global_step": 100444, "epoch": 597} {"train_loss": -9.89277458190918, "global_step": 100445, "epoch": 597} {"train_loss": -9.628091812133789, "global_step": 100446, "epoch": 597} {"train_loss": -9.48508071899414, "global_step": 100447, "epoch": 597} {"train_loss": -10.074913024902344, "global_step": 100448, "epoch": 597} {"train_loss": -9.577482223510742, "global_step": 100449, "epoch": 597} {"train_loss": -9.703466415405273, "global_step": 100450, "epoch": 597} {"train_loss": -9.59119987487793, "global_step": 100451, "epoch": 597} {"train_loss": -9.770362854003906, "global_step": 100452, "epoch": 597} {"train_loss": -9.722356796264648, "global_step": 100453, "epoch": 597} {"train_loss": -9.586511611938477, "global_step": 100454, "epoch": 597} {"train_loss": -9.954046249389648, "global_step": 100455, "epoch": 597} {"train_loss": -9.500051498413086, "global_step": 100456, "epoch": 597} {"train_loss": -9.528703689575195, "global_step": 100457, "epoch": 597} {"train_loss": -9.427657127380371, "global_step": 100458, "epoch": 597} {"train_loss": -9.708198547363281, "global_step": 100459, "epoch": 597} {"train_loss": -9.648859024047852, "global_step": 100460, "epoch": 597} {"train_loss": -9.78221607208252, "global_step": 100461, "epoch": 597} {"train_loss": -9.613128662109375, "global_step": 100462, "epoch": 597} {"train_loss": -9.69383694444384, "global_step": 100463, "epoch": 597, "val_loss": 207752.703125} {"train_loss": -9.455005645751953, "global_step": 100464, "epoch": 598} {"train_loss": -9.817215919494629, "global_step": 100465, "epoch": 598} {"train_loss": -9.309947967529297, "global_step": 100466, "epoch": 598} {"train_loss": -9.641256332397461, "global_step": 100467, "epoch": 598} {"train_loss": -9.765249252319336, "global_step": 100468, "epoch": 598} {"train_loss": -9.432694435119629, "global_step": 100469, "epoch": 598} {"train_loss": -9.581562995910645, "global_step": 100470, "epoch": 598} {"train_loss": -9.517463684082031, "global_step": 100471, "epoch": 598} {"train_loss": -9.692085266113281, "global_step": 100472, "epoch": 598} {"train_loss": -9.6578369140625, "global_step": 100473, "epoch": 598} {"train_loss": -9.56542682647705, "global_step": 100474, "epoch": 598} {"train_loss": -9.584981918334961, "global_step": 100475, "epoch": 598} {"train_loss": -9.513197898864746, "global_step": 100476, "epoch": 598} {"train_loss": -9.656267166137695, "global_step": 100477, "epoch": 598} {"train_loss": -9.8629150390625, "global_step": 100478, "epoch": 598} {"train_loss": -9.381549835205078, "global_step": 100479, "epoch": 598} {"train_loss": -9.433319091796875, "global_step": 100480, "epoch": 598} {"train_loss": -9.625689506530762, "global_step": 100481, "epoch": 598} {"train_loss": -9.75547981262207, "global_step": 100482, "epoch": 598} {"train_loss": -9.981815338134766, "global_step": 100483, "epoch": 598} {"train_loss": -9.52924633026123, "global_step": 100484, "epoch": 598} {"train_loss": -9.68894100189209, "global_step": 100485, "epoch": 598} {"train_loss": -9.672675132751465, "global_step": 100486, "epoch": 598} {"train_loss": -9.726544380187988, "global_step": 100487, "epoch": 598} {"train_loss": -9.642133712768555, "global_step": 100488, "epoch": 598} {"train_loss": -9.752664566040039, "global_step": 100489, "epoch": 598} {"train_loss": -9.842203140258789, "global_step": 100490, "epoch": 598} {"train_loss": -9.868317604064941, "global_step": 100491, "epoch": 598} {"train_loss": -9.581205368041992, "global_step": 100492, "epoch": 598} {"train_loss": -9.649003028869629, "global_step": 100493, "epoch": 598} {"train_loss": -9.667481422424316, "global_step": 100494, "epoch": 598} {"train_loss": -9.875310897827148, "global_step": 100495, "epoch": 598} {"train_loss": -9.684818267822266, "global_step": 100496, "epoch": 598} {"train_loss": -9.863500595092773, "global_step": 100497, "epoch": 598} {"train_loss": -9.832582473754883, "global_step": 100498, "epoch": 598} {"train_loss": -9.83466911315918, "global_step": 100499, "epoch": 598} {"train_loss": -10.039709091186523, "global_step": 100500, "epoch": 598} {"train_loss": -10.000216484069824, "global_step": 100501, "epoch": 598} {"train_loss": -10.024435043334961, "global_step": 100502, "epoch": 598} {"train_loss": -9.936226844787598, "global_step": 100503, "epoch": 598} {"train_loss": -9.679826736450195, "global_step": 100504, "epoch": 598} {"train_loss": -9.758267402648926, "global_step": 100505, "epoch": 598} {"train_loss": -9.804034233093262, "global_step": 100506, "epoch": 598} {"train_loss": -9.94403076171875, "global_step": 100507, "epoch": 598} {"train_loss": -9.717491149902344, "global_step": 100508, "epoch": 598} {"train_loss": -9.586104393005371, "global_step": 100509, "epoch": 598} {"train_loss": -9.804790496826172, "global_step": 100510, "epoch": 598} {"train_loss": -9.213600158691406, "global_step": 100511, "epoch": 598} {"train_loss": -9.809242248535156, "global_step": 100512, "epoch": 598} {"train_loss": -9.469588279724121, "global_step": 100513, "epoch": 598} {"train_loss": -9.848575592041016, "global_step": 100514, "epoch": 598} {"train_loss": -9.614113807678223, "global_step": 100515, "epoch": 598} {"train_loss": -9.560873985290527, "global_step": 100516, "epoch": 598} {"train_loss": -9.959554672241211, "global_step": 100517, "epoch": 598} {"train_loss": -9.89760971069336, "global_step": 100518, "epoch": 598} {"train_loss": -9.504484176635742, "global_step": 100519, "epoch": 598} {"train_loss": -9.63561725616455, "global_step": 100520, "epoch": 598} {"train_loss": -9.759963989257812, "global_step": 100521, "epoch": 598} {"train_loss": -9.510953903198242, "global_step": 100522, "epoch": 598} {"train_loss": -9.530109405517578, "global_step": 100523, "epoch": 598} {"train_loss": -9.618181228637695, "global_step": 100524, "epoch": 598} {"train_loss": -9.411497116088867, "global_step": 100525, "epoch": 598} {"train_loss": -9.736940383911133, "global_step": 100526, "epoch": 598} {"train_loss": -9.417984962463379, "global_step": 100527, "epoch": 598} {"train_loss": -9.514815330505371, "global_step": 100528, "epoch": 598} {"train_loss": -9.30398941040039, "global_step": 100529, "epoch": 598} {"train_loss": -9.61971378326416, "global_step": 100530, "epoch": 598} {"train_loss": -8.829557418823242, "global_step": 100531, "epoch": 598} {"train_loss": -9.63606071472168, "global_step": 100532, "epoch": 598} {"train_loss": -9.222561836242676, "global_step": 100533, "epoch": 598} {"train_loss": -9.19708251953125, "global_step": 100534, "epoch": 598} {"train_loss": -9.540645599365234, "global_step": 100535, "epoch": 598} {"train_loss": -9.234743118286133, "global_step": 100536, "epoch": 598} {"train_loss": -9.321252822875977, "global_step": 100537, "epoch": 598} {"train_loss": -9.647872924804688, "global_step": 100538, "epoch": 598} {"train_loss": -9.52523422241211, "global_step": 100539, "epoch": 598} {"train_loss": -9.468547821044922, "global_step": 100540, "epoch": 598} {"train_loss": -9.381295204162598, "global_step": 100541, "epoch": 598} {"train_loss": -9.401758193969727, "global_step": 100542, "epoch": 598} {"train_loss": -9.551944732666016, "global_step": 100543, "epoch": 598} {"train_loss": -9.452692031860352, "global_step": 100544, "epoch": 598} {"train_loss": -9.60855484008789, "global_step": 100545, "epoch": 598} {"train_loss": -9.729564666748047, "global_step": 100546, "epoch": 598} {"train_loss": -9.580217361450195, "global_step": 100547, "epoch": 598} {"train_loss": -9.857582092285156, "global_step": 100548, "epoch": 598} {"train_loss": -9.684579849243164, "global_step": 100549, "epoch": 598} {"train_loss": -9.475906372070312, "global_step": 100550, "epoch": 598} {"train_loss": -9.907039642333984, "global_step": 100551, "epoch": 598} {"train_loss": -9.39095401763916, "global_step": 100552, "epoch": 598} {"train_loss": -9.870511054992676, "global_step": 100553, "epoch": 598} {"train_loss": -9.659730911254883, "global_step": 100554, "epoch": 598} {"train_loss": -9.399510383605957, "global_step": 100555, "epoch": 598} {"train_loss": -9.535733222961426, "global_step": 100556, "epoch": 598} {"train_loss": -9.577495574951172, "global_step": 100557, "epoch": 598} {"train_loss": -9.614656448364258, "global_step": 100558, "epoch": 598} {"train_loss": -9.872810363769531, "global_step": 100559, "epoch": 598} {"train_loss": -9.798334121704102, "global_step": 100560, "epoch": 598} {"train_loss": -9.784027099609375, "global_step": 100561, "epoch": 598} {"train_loss": -9.805010795593262, "global_step": 100562, "epoch": 598} {"train_loss": -9.750858306884766, "global_step": 100563, "epoch": 598} {"train_loss": -9.780741691589355, "global_step": 100564, "epoch": 598} {"train_loss": -10.013526916503906, "global_step": 100565, "epoch": 598} {"train_loss": -9.675323486328125, "global_step": 100566, "epoch": 598} {"train_loss": -9.836149215698242, "global_step": 100567, "epoch": 598} {"train_loss": -10.00365161895752, "global_step": 100568, "epoch": 598} {"train_loss": -9.611873626708984, "global_step": 100569, "epoch": 598} {"train_loss": -9.612926483154297, "global_step": 100570, "epoch": 598} {"train_loss": -9.827672004699707, "global_step": 100571, "epoch": 598} {"train_loss": -9.679618835449219, "global_step": 100572, "epoch": 598} {"train_loss": -10.021869659423828, "global_step": 100573, "epoch": 598} {"train_loss": -9.83659839630127, "global_step": 100574, "epoch": 598} {"train_loss": -9.575105667114258, "global_step": 100575, "epoch": 598} {"train_loss": -9.933013916015625, "global_step": 100576, "epoch": 598} {"train_loss": -9.718609809875488, "global_step": 100577, "epoch": 598} {"train_loss": -9.759079933166504, "global_step": 100578, "epoch": 598} {"train_loss": -9.738815307617188, "global_step": 100579, "epoch": 598} {"train_loss": -9.760787963867188, "global_step": 100580, "epoch": 598} {"train_loss": -10.112752914428711, "global_step": 100581, "epoch": 598} {"train_loss": -9.830621719360352, "global_step": 100582, "epoch": 598} {"train_loss": -9.956604957580566, "global_step": 100583, "epoch": 598} {"train_loss": -9.910545349121094, "global_step": 100584, "epoch": 598} {"train_loss": -9.882841110229492, "global_step": 100585, "epoch": 598} {"train_loss": -9.849929809570312, "global_step": 100586, "epoch": 598} {"train_loss": -9.576518058776855, "global_step": 100587, "epoch": 598} {"train_loss": -10.053762435913086, "global_step": 100588, "epoch": 598} {"train_loss": -9.766395568847656, "global_step": 100589, "epoch": 598} {"train_loss": -10.132546424865723, "global_step": 100590, "epoch": 598} {"train_loss": -9.614336967468262, "global_step": 100591, "epoch": 598} {"train_loss": -10.089944839477539, "global_step": 100592, "epoch": 598} {"train_loss": -9.942649841308594, "global_step": 100593, "epoch": 598} {"train_loss": -9.961568832397461, "global_step": 100594, "epoch": 598} {"train_loss": -9.699097633361816, "global_step": 100595, "epoch": 598} {"train_loss": -10.070252418518066, "global_step": 100596, "epoch": 598} {"train_loss": -9.784679412841797, "global_step": 100597, "epoch": 598} {"train_loss": -9.73196792602539, "global_step": 100598, "epoch": 598} {"train_loss": -9.836738586425781, "global_step": 100599, "epoch": 598} {"train_loss": -9.628511428833008, "global_step": 100600, "epoch": 598} {"train_loss": -9.32668685913086, "global_step": 100601, "epoch": 598} {"train_loss": -9.659040451049805, "global_step": 100602, "epoch": 598} {"train_loss": -9.0421142578125, "global_step": 100603, "epoch": 598} {"train_loss": -9.643026351928711, "global_step": 100604, "epoch": 598} {"train_loss": -9.467569351196289, "global_step": 100605, "epoch": 598} {"train_loss": -9.665992736816406, "global_step": 100606, "epoch": 598} {"train_loss": -9.873405456542969, "global_step": 100607, "epoch": 598} {"train_loss": -9.653826713562012, "global_step": 100608, "epoch": 598} {"train_loss": -9.657743453979492, "global_step": 100609, "epoch": 598} {"train_loss": -9.512849807739258, "global_step": 100610, "epoch": 598} {"train_loss": -9.560807228088379, "global_step": 100611, "epoch": 598} {"train_loss": -9.617816925048828, "global_step": 100612, "epoch": 598} {"train_loss": -9.749469757080078, "global_step": 100613, "epoch": 598} {"train_loss": -9.761813163757324, "global_step": 100614, "epoch": 598} {"train_loss": -9.397577285766602, "global_step": 100615, "epoch": 598} {"train_loss": -9.844263076782227, "global_step": 100616, "epoch": 598} {"train_loss": -9.826374053955078, "global_step": 100617, "epoch": 598} {"train_loss": -9.755393981933594, "global_step": 100618, "epoch": 598} {"train_loss": -9.930766105651855, "global_step": 100619, "epoch": 598} {"train_loss": -9.66015338897705, "global_step": 100620, "epoch": 598} {"train_loss": -10.020130157470703, "global_step": 100621, "epoch": 598} {"train_loss": -10.018525123596191, "global_step": 100622, "epoch": 598} {"train_loss": -9.88283920288086, "global_step": 100623, "epoch": 598} {"train_loss": -9.868645668029785, "global_step": 100624, "epoch": 598} {"train_loss": -9.951396942138672, "global_step": 100625, "epoch": 598} {"train_loss": -9.916339874267578, "global_step": 100626, "epoch": 598} {"train_loss": -10.173904418945312, "global_step": 100627, "epoch": 598} {"train_loss": -9.643098831176758, "global_step": 100628, "epoch": 598} {"train_loss": -9.821401596069336, "global_step": 100629, "epoch": 598} {"train_loss": -9.684577941894531, "global_step": 100630, "epoch": 598} {"train_loss": -9.694810123670669, "global_step": 100631, "epoch": 598, "val_loss": 208496.734375} {"train_loss": -9.78290843963623, "global_step": 100632, "epoch": 599} {"train_loss": -9.699848175048828, "global_step": 100633, "epoch": 599} {"train_loss": -9.745306015014648, "global_step": 100634, "epoch": 599} {"train_loss": -9.978015899658203, "global_step": 100635, "epoch": 599} {"train_loss": -9.875734329223633, "global_step": 100636, "epoch": 599} {"train_loss": -9.957315444946289, "global_step": 100637, "epoch": 599} {"train_loss": -9.755460739135742, "global_step": 100638, "epoch": 599} {"train_loss": -9.469036102294922, "global_step": 100639, "epoch": 599} {"train_loss": -9.891899108886719, "global_step": 100640, "epoch": 599} {"train_loss": -9.504136085510254, "global_step": 100641, "epoch": 599} {"train_loss": -9.701972961425781, "global_step": 100642, "epoch": 599} {"train_loss": -9.873894691467285, "global_step": 100643, "epoch": 599} {"train_loss": -9.285037994384766, "global_step": 100644, "epoch": 599} {"train_loss": -9.801886558532715, "global_step": 100645, "epoch": 599} {"train_loss": -9.709917068481445, "global_step": 100646, "epoch": 599} {"train_loss": -9.579977989196777, "global_step": 100647, "epoch": 599} {"train_loss": -9.935691833496094, "global_step": 100648, "epoch": 599} {"train_loss": -9.68950366973877, "global_step": 100649, "epoch": 599} {"train_loss": -9.8274564743042, "global_step": 100650, "epoch": 599} {"train_loss": -9.893932342529297, "global_step": 100651, "epoch": 599} {"train_loss": -9.533645629882812, "global_step": 100652, "epoch": 599} {"train_loss": -9.852025985717773, "global_step": 100653, "epoch": 599} {"train_loss": -9.274199485778809, "global_step": 100654, "epoch": 599} {"train_loss": -9.726900100708008, "global_step": 100655, "epoch": 599} {"train_loss": -9.610837936401367, "global_step": 100656, "epoch": 599} {"train_loss": -9.580406188964844, "global_step": 100657, "epoch": 599} {"train_loss": -9.429180145263672, "global_step": 100658, "epoch": 599} {"train_loss": -9.709278106689453, "global_step": 100659, "epoch": 599} {"train_loss": -9.51541519165039, "global_step": 100660, "epoch": 599} {"train_loss": -9.74453353881836, "global_step": 100661, "epoch": 599} {"train_loss": -9.629117012023926, "global_step": 100662, "epoch": 599} {"train_loss": -9.33021354675293, "global_step": 100663, "epoch": 599} {"train_loss": -9.757959365844727, "global_step": 100664, "epoch": 599} {"train_loss": -9.509498596191406, "global_step": 100665, "epoch": 599} {"train_loss": -9.561820983886719, "global_step": 100666, "epoch": 599} {"train_loss": -9.502323150634766, "global_step": 100667, "epoch": 599} {"train_loss": -9.819401741027832, "global_step": 100668, "epoch": 599} {"train_loss": -9.794167518615723, "global_step": 100669, "epoch": 599} {"train_loss": -9.597594261169434, "global_step": 100670, "epoch": 599} {"train_loss": -9.555879592895508, "global_step": 100671, "epoch": 599} {"train_loss": -9.774356842041016, "global_step": 100672, "epoch": 599} {"train_loss": -9.620756149291992, "global_step": 100673, "epoch": 599} {"train_loss": -9.76840591430664, "global_step": 100674, "epoch": 599} {"train_loss": -9.823787689208984, "global_step": 100675, "epoch": 599} {"train_loss": -9.477493286132812, "global_step": 100676, "epoch": 599} {"train_loss": -9.441266059875488, "global_step": 100677, "epoch": 599} {"train_loss": -9.643526077270508, "global_step": 100678, "epoch": 599} {"train_loss": -10.006542205810547, "global_step": 100679, "epoch": 599} {"train_loss": -9.476655960083008, "global_step": 100680, "epoch": 599} {"train_loss": -9.581060409545898, "global_step": 100681, "epoch": 599} {"train_loss": -9.441112518310547, "global_step": 100682, "epoch": 599} {"train_loss": -9.667501449584961, "global_step": 100683, "epoch": 599} {"train_loss": -9.715108871459961, "global_step": 100684, "epoch": 599} {"train_loss": -9.38698959350586, "global_step": 100685, "epoch": 599} {"train_loss": -9.643766403198242, "global_step": 100686, "epoch": 599} {"train_loss": -9.716438293457031, "global_step": 100687, "epoch": 599} {"train_loss": -9.947685241699219, "global_step": 100688, "epoch": 599} {"train_loss": -9.696151733398438, "global_step": 100689, "epoch": 599} {"train_loss": -9.463983535766602, "global_step": 100690, "epoch": 599} {"train_loss": -9.77960205078125, "global_step": 100691, "epoch": 599} {"train_loss": -9.388935089111328, "global_step": 100692, "epoch": 599} {"train_loss": -9.767346382141113, "global_step": 100693, "epoch": 599} {"train_loss": -9.968635559082031, "global_step": 100694, "epoch": 599} {"train_loss": -9.757984161376953, "global_step": 100695, "epoch": 599} {"train_loss": -9.76492691040039, "global_step": 100696, "epoch": 599} {"train_loss": -9.901947021484375, "global_step": 100697, "epoch": 599} {"train_loss": -9.622097969055176, "global_step": 100698, "epoch": 599} {"train_loss": -9.810155868530273, "global_step": 100699, "epoch": 599} {"train_loss": -9.951126098632812, "global_step": 100700, "epoch": 599} {"train_loss": -9.631185531616211, "global_step": 100701, "epoch": 599} {"train_loss": -10.031774520874023, "global_step": 100702, "epoch": 599} {"train_loss": -9.872579574584961, "global_step": 100703, "epoch": 599} {"train_loss": -10.011811256408691, "global_step": 100704, "epoch": 599} {"train_loss": -10.024857521057129, "global_step": 100705, "epoch": 599} {"train_loss": -9.85732650756836, "global_step": 100706, "epoch": 599} {"train_loss": -10.032417297363281, "global_step": 100707, "epoch": 599} {"train_loss": -10.003637313842773, "global_step": 100708, "epoch": 599} {"train_loss": -9.866936683654785, "global_step": 100709, "epoch": 599} {"train_loss": -9.924722671508789, "global_step": 100710, "epoch": 599} {"train_loss": -9.884016036987305, "global_step": 100711, "epoch": 599} {"train_loss": -9.979207992553711, "global_step": 100712, "epoch": 599} {"train_loss": -10.092992782592773, "global_step": 100713, "epoch": 599} {"train_loss": -9.893654823303223, "global_step": 100714, "epoch": 599} {"train_loss": -9.915544509887695, "global_step": 100715, "epoch": 599} {"train_loss": -10.044378280639648, "global_step": 100716, "epoch": 599} {"train_loss": -9.70284366607666, "global_step": 100717, "epoch": 599} {"train_loss": -9.479764938354492, "global_step": 100718, "epoch": 599} {"train_loss": -9.728578567504883, "global_step": 100719, "epoch": 599} {"train_loss": -10.02127456665039, "global_step": 100720, "epoch": 599} {"train_loss": -9.6740083694458, "global_step": 100721, "epoch": 599} {"train_loss": -9.606012344360352, "global_step": 100722, "epoch": 599} {"train_loss": -9.930641174316406, "global_step": 100723, "epoch": 599} {"train_loss": -9.726018905639648, "global_step": 100724, "epoch": 599} {"train_loss": -9.83602237701416, "global_step": 100725, "epoch": 599} {"train_loss": -9.8970308303833, "global_step": 100726, "epoch": 599} {"train_loss": -9.825872421264648, "global_step": 100727, "epoch": 599} {"train_loss": -9.915903091430664, "global_step": 100728, "epoch": 599} {"train_loss": -9.81910514831543, "global_step": 100729, "epoch": 599} {"train_loss": -9.887690544128418, "global_step": 100730, "epoch": 599} {"train_loss": -9.923360824584961, "global_step": 100731, "epoch": 599} {"train_loss": -9.851821899414062, "global_step": 100732, "epoch": 599} {"train_loss": -10.03496265411377, "global_step": 100733, "epoch": 599} {"train_loss": -9.759862899780273, "global_step": 100734, "epoch": 599} {"train_loss": -9.557989120483398, "global_step": 100735, "epoch": 599} {"train_loss": -9.898391723632812, "global_step": 100736, "epoch": 599} {"train_loss": -9.961407661437988, "global_step": 100737, "epoch": 599} {"train_loss": -9.56694221496582, "global_step": 100738, "epoch": 599} {"train_loss": -9.70060920715332, "global_step": 100739, "epoch": 599} {"train_loss": -9.326573371887207, "global_step": 100740, "epoch": 599} {"train_loss": -9.330497741699219, "global_step": 100741, "epoch": 599} {"train_loss": -9.51957893371582, "global_step": 100742, "epoch": 599} {"train_loss": -9.378536224365234, "global_step": 100743, "epoch": 599} {"train_loss": -9.247895240783691, "global_step": 100744, "epoch": 599} {"train_loss": -9.282899856567383, "global_step": 100745, "epoch": 599} {"train_loss": -9.304428100585938, "global_step": 100746, "epoch": 599} {"train_loss": -9.414501190185547, "global_step": 100747, "epoch": 599} {"train_loss": -9.314340591430664, "global_step": 100748, "epoch": 599} {"train_loss": -9.659000396728516, "global_step": 100749, "epoch": 599} {"train_loss": -9.482367515563965, "global_step": 100750, "epoch": 599} {"train_loss": -9.530038833618164, "global_step": 100751, "epoch": 599} {"train_loss": -9.695404052734375, "global_step": 100752, "epoch": 599} {"train_loss": -9.417247772216797, "global_step": 100753, "epoch": 599} {"train_loss": -9.70163631439209, "global_step": 100754, "epoch": 599} {"train_loss": -9.596407890319824, "global_step": 100755, "epoch": 599} {"train_loss": -9.425145149230957, "global_step": 100756, "epoch": 599} {"train_loss": -9.735321044921875, "global_step": 100757, "epoch": 599} {"train_loss": -9.722219467163086, "global_step": 100758, "epoch": 599} {"train_loss": -9.899465560913086, "global_step": 100759, "epoch": 599} {"train_loss": -9.583401679992676, "global_step": 100760, "epoch": 599} {"train_loss": -9.522088050842285, "global_step": 100761, "epoch": 599} {"train_loss": -9.289955139160156, "global_step": 100762, "epoch": 599} {"train_loss": -9.942953109741211, "global_step": 100763, "epoch": 599} {"train_loss": -9.27371597290039, "global_step": 100764, "epoch": 599} {"train_loss": -9.637154579162598, "global_step": 100765, "epoch": 599} {"train_loss": -9.999591827392578, "global_step": 100766, "epoch": 599} {"train_loss": -9.6727294921875, "global_step": 100767, "epoch": 599} {"train_loss": -9.68012809753418, "global_step": 100768, "epoch": 599} {"train_loss": -9.940916061401367, "global_step": 100769, "epoch": 599} {"train_loss": -9.500211715698242, "global_step": 100770, "epoch": 599} {"train_loss": -9.593921661376953, "global_step": 100771, "epoch": 599} {"train_loss": -9.337746620178223, "global_step": 100772, "epoch": 599} {"train_loss": -9.88304615020752, "global_step": 100773, "epoch": 599} {"train_loss": -9.655889511108398, "global_step": 100774, "epoch": 599} {"train_loss": -9.544424057006836, "global_step": 100775, "epoch": 599} {"train_loss": -9.708982467651367, "global_step": 100776, "epoch": 599} {"train_loss": -9.818840026855469, "global_step": 100777, "epoch": 599} {"train_loss": -9.620553970336914, "global_step": 100778, "epoch": 599} {"train_loss": -9.877304077148438, "global_step": 100779, "epoch": 599} {"train_loss": -9.552898406982422, "global_step": 100780, "epoch": 599} {"train_loss": -9.799114227294922, "global_step": 100781, "epoch": 599} {"train_loss": -9.76156997680664, "global_step": 100782, "epoch": 599} {"train_loss": -9.911478042602539, "global_step": 100783, "epoch": 599} {"train_loss": -9.801277160644531, "global_step": 100784, "epoch": 599} {"train_loss": -9.870376586914062, "global_step": 100785, "epoch": 599} {"train_loss": -9.7047119140625, "global_step": 100786, "epoch": 599} {"train_loss": -9.791155815124512, "global_step": 100787, "epoch": 599} {"train_loss": -9.282691955566406, "global_step": 100788, "epoch": 599} {"train_loss": -9.9622163772583, "global_step": 100789, "epoch": 599} {"train_loss": -8.913508415222168, "global_step": 100790, "epoch": 599} {"train_loss": -9.308324813842773, "global_step": 100791, "epoch": 599} {"train_loss": -9.438661575317383, "global_step": 100792, "epoch": 599} {"train_loss": -9.484334945678711, "global_step": 100793, "epoch": 599} {"train_loss": -9.260147094726562, "global_step": 100794, "epoch": 599} {"train_loss": -9.755743980407715, "global_step": 100795, "epoch": 599} {"train_loss": -9.231765747070312, "global_step": 100796, "epoch": 599} {"train_loss": -9.533269882202148, "global_step": 100797, "epoch": 599} {"train_loss": -9.270720481872559, "global_step": 100798, "epoch": 599} {"train_loss": -9.681375128882271, "global_step": 100799, "epoch": 599, "val_loss": 206061.515625} {"train_loss": -9.636895179748535, "global_step": 100800, "epoch": 600} {"train_loss": -9.64048957824707, "global_step": 100801, "epoch": 600} {"train_loss": -9.425613403320312, "global_step": 100802, "epoch": 600} {"train_loss": -9.506704330444336, "global_step": 100803, "epoch": 600} {"train_loss": -9.680839538574219, "global_step": 100804, "epoch": 600} {"train_loss": -9.643136978149414, "global_step": 100805, "epoch": 600} {"train_loss": -9.626408576965332, "global_step": 100806, "epoch": 600} {"train_loss": -9.547468185424805, "global_step": 100807, "epoch": 600} {"train_loss": -9.62444019317627, "global_step": 100808, "epoch": 600} {"train_loss": -9.654542922973633, "global_step": 100809, "epoch": 600} {"train_loss": -9.690237045288086, "global_step": 100810, "epoch": 600} {"train_loss": -9.656259536743164, "global_step": 100811, "epoch": 600} {"train_loss": -9.704026222229004, "global_step": 100812, "epoch": 600} {"train_loss": -9.737964630126953, "global_step": 100813, "epoch": 600} {"train_loss": -10.03611946105957, "global_step": 100814, "epoch": 600} {"train_loss": -9.827991485595703, "global_step": 100815, "epoch": 600} {"train_loss": -9.73176383972168, "global_step": 100816, "epoch": 600} {"train_loss": -9.77962875366211, "global_step": 100817, "epoch": 600} {"train_loss": -9.9798002243042, "global_step": 100818, "epoch": 600} {"train_loss": -9.680824279785156, "global_step": 100819, "epoch": 600} {"train_loss": -9.878681182861328, "global_step": 100820, "epoch": 600} {"train_loss": -9.803024291992188, "global_step": 100821, "epoch": 600} {"train_loss": -9.54145336151123, "global_step": 100822, "epoch": 600} {"train_loss": -9.685653686523438, "global_step": 100823, "epoch": 600} {"train_loss": -9.783097267150879, "global_step": 100824, "epoch": 600} {"train_loss": -9.990307807922363, "global_step": 100825, "epoch": 600} {"train_loss": -10.051267623901367, "global_step": 100826, "epoch": 600} {"train_loss": -9.86989974975586, "global_step": 100827, "epoch": 600} {"train_loss": -9.92388916015625, "global_step": 100828, "epoch": 600} {"train_loss": -9.553895950317383, "global_step": 100829, "epoch": 600} {"train_loss": -9.962250709533691, "global_step": 100830, "epoch": 600} {"train_loss": -9.38044261932373, "global_step": 100831, "epoch": 600} {"train_loss": -9.804669380187988, "global_step": 100832, "epoch": 600} {"train_loss": -9.694708824157715, "global_step": 100833, "epoch": 600} {"train_loss": -9.683671951293945, "global_step": 100834, "epoch": 600} {"train_loss": -9.206741333007812, "global_step": 100835, "epoch": 600} {"train_loss": -9.168689727783203, "global_step": 100836, "epoch": 600} {"train_loss": -9.867975234985352, "global_step": 100837, "epoch": 600} {"train_loss": -9.403846740722656, "global_step": 100838, "epoch": 600} {"train_loss": -9.638696670532227, "global_step": 100839, "epoch": 600} {"train_loss": -9.449628829956055, "global_step": 100840, "epoch": 600} {"train_loss": -9.516905784606934, "global_step": 100841, "epoch": 600} {"train_loss": -9.591960906982422, "global_step": 100842, "epoch": 600} {"train_loss": -9.600427627563477, "global_step": 100843, "epoch": 600} {"train_loss": -9.071168899536133, "global_step": 100844, "epoch": 600} {"train_loss": -9.406787872314453, "global_step": 100845, "epoch": 600} {"train_loss": -9.504035949707031, "global_step": 100846, "epoch": 600} {"train_loss": -9.273879051208496, "global_step": 100847, "epoch": 600} {"train_loss": -9.537418365478516, "global_step": 100848, "epoch": 600} {"train_loss": -9.2384672164917, "global_step": 100849, "epoch": 600} {"train_loss": -9.316977500915527, "global_step": 100850, "epoch": 600} {"train_loss": -9.657629013061523, "global_step": 100851, "epoch": 600} {"train_loss": -9.192035675048828, "global_step": 100852, "epoch": 600} {"train_loss": -9.712158203125, "global_step": 100853, "epoch": 600} {"train_loss": -9.148516654968262, "global_step": 100854, "epoch": 600} {"train_loss": -9.900289535522461, "global_step": 100855, "epoch": 600} {"train_loss": -9.468080520629883, "global_step": 100856, "epoch": 600} {"train_loss": -9.699888229370117, "global_step": 100857, "epoch": 600} {"train_loss": -9.461666107177734, "global_step": 100858, "epoch": 600} {"train_loss": -9.751507759094238, "global_step": 100859, "epoch": 600} {"train_loss": -9.699114799499512, "global_step": 100860, "epoch": 600} {"train_loss": -9.721378326416016, "global_step": 100861, "epoch": 600} {"train_loss": -9.747262954711914, "global_step": 100862, "epoch": 600} {"train_loss": -9.649789810180664, "global_step": 100863, "epoch": 600} {"train_loss": -9.523134231567383, "global_step": 100864, "epoch": 600} {"train_loss": -9.747312545776367, "global_step": 100865, "epoch": 600} {"train_loss": -9.607544898986816, "global_step": 100866, "epoch": 600} {"train_loss": -9.706170082092285, "global_step": 100867, "epoch": 600} {"train_loss": -9.778057098388672, "global_step": 100868, "epoch": 600} {"train_loss": -9.684228897094727, "global_step": 100869, "epoch": 600} {"train_loss": -9.603078842163086, "global_step": 100870, "epoch": 600} {"train_loss": -9.881942749023438, "global_step": 100871, "epoch": 600} {"train_loss": -9.718189239501953, "global_step": 100872, "epoch": 600} {"train_loss": -9.679028511047363, "global_step": 100873, "epoch": 600} {"train_loss": -9.84710693359375, "global_step": 100874, "epoch": 600} {"train_loss": -9.886470794677734, "global_step": 100875, "epoch": 600} {"train_loss": -9.908926010131836, "global_step": 100876, "epoch": 600} {"train_loss": -9.832450866699219, "global_step": 100877, "epoch": 600} {"train_loss": -9.94692611694336, "global_step": 100878, "epoch": 600} {"train_loss": -9.917564392089844, "global_step": 100879, "epoch": 600} {"train_loss": -9.922039031982422, "global_step": 100880, "epoch": 600} {"train_loss": -9.838079452514648, "global_step": 100881, "epoch": 600} {"train_loss": -9.939208984375, "global_step": 100882, "epoch": 600} {"train_loss": -10.169220924377441, "global_step": 100883, "epoch": 600} {"train_loss": -9.908613204956055, "global_step": 100884, "epoch": 600} {"train_loss": -9.894634246826172, "global_step": 100885, "epoch": 600} {"train_loss": -9.974258422851562, "global_step": 100886, "epoch": 600} {"train_loss": -9.963521957397461, "global_step": 100887, "epoch": 600} {"train_loss": -9.592155456542969, "global_step": 100888, "epoch": 600} {"train_loss": -9.48917007446289, "global_step": 100889, "epoch": 600} {"train_loss": -9.886821746826172, "global_step": 100890, "epoch": 600} {"train_loss": -9.720755577087402, "global_step": 100891, "epoch": 600} {"train_loss": -9.88729190826416, "global_step": 100892, "epoch": 600} {"train_loss": -9.770183563232422, "global_step": 100893, "epoch": 600} {"train_loss": -9.71889877319336, "global_step": 100894, "epoch": 600} {"train_loss": -10.124648094177246, "global_step": 100895, "epoch": 600} {"train_loss": -9.700907707214355, "global_step": 100896, "epoch": 600} {"train_loss": -9.9722900390625, "global_step": 100897, "epoch": 600} {"train_loss": -9.723665237426758, "global_step": 100898, "epoch": 600} {"train_loss": -9.85644245147705, "global_step": 100899, "epoch": 600} {"train_loss": -10.05201244354248, "global_step": 100900, "epoch": 600} {"train_loss": -9.700416564941406, "global_step": 100901, "epoch": 600} {"train_loss": -9.385374069213867, "global_step": 100902, "epoch": 600} {"train_loss": -10.06838607788086, "global_step": 100903, "epoch": 600} {"train_loss": -9.7386474609375, "global_step": 100904, "epoch": 600} {"train_loss": -9.951738357543945, "global_step": 100905, "epoch": 600} {"train_loss": -9.942354202270508, "global_step": 100906, "epoch": 600} {"train_loss": -9.533756256103516, "global_step": 100907, "epoch": 600} {"train_loss": -9.826129913330078, "global_step": 100908, "epoch": 600} {"train_loss": -9.868619918823242, "global_step": 100909, "epoch": 600} {"train_loss": -9.813446044921875, "global_step": 100910, "epoch": 600} {"train_loss": -9.89829158782959, "global_step": 100911, "epoch": 600} {"train_loss": -9.600591659545898, "global_step": 100912, "epoch": 600} {"train_loss": -9.621386528015137, "global_step": 100913, "epoch": 600} {"train_loss": -9.404168128967285, "global_step": 100914, "epoch": 600} {"train_loss": -9.587794303894043, "global_step": 100915, "epoch": 600} {"train_loss": -9.422868728637695, "global_step": 100916, "epoch": 600} {"train_loss": -9.539502143859863, "global_step": 100917, "epoch": 600} {"train_loss": -9.193397521972656, "global_step": 100918, "epoch": 600} {"train_loss": -9.501335144042969, "global_step": 100919, "epoch": 600} {"train_loss": -9.657663345336914, "global_step": 100920, "epoch": 600} {"train_loss": -9.62813949584961, "global_step": 100921, "epoch": 600} {"train_loss": -9.61212158203125, "global_step": 100922, "epoch": 600} {"train_loss": -9.493766784667969, "global_step": 100923, "epoch": 600} {"train_loss": -9.748790740966797, "global_step": 100924, "epoch": 600} {"train_loss": -9.606219291687012, "global_step": 100925, "epoch": 600} {"train_loss": -9.855623245239258, "global_step": 100926, "epoch": 600} {"train_loss": -9.77102279663086, "global_step": 100927, "epoch": 600} {"train_loss": -9.886242866516113, "global_step": 100928, "epoch": 600} {"train_loss": -9.686479568481445, "global_step": 100929, "epoch": 600} {"train_loss": -10.025981903076172, "global_step": 100930, "epoch": 600} {"train_loss": -9.733880043029785, "global_step": 100931, "epoch": 600} {"train_loss": -9.431626319885254, "global_step": 100932, "epoch": 600} {"train_loss": -9.670479774475098, "global_step": 100933, "epoch": 600} {"train_loss": -9.439523696899414, "global_step": 100934, "epoch": 600} {"train_loss": -9.848280906677246, "global_step": 100935, "epoch": 600} {"train_loss": -9.614023208618164, "global_step": 100936, "epoch": 600} {"train_loss": -9.716574668884277, "global_step": 100937, "epoch": 600} {"train_loss": -9.879549980163574, "global_step": 100938, "epoch": 600} {"train_loss": -9.65865707397461, "global_step": 100939, "epoch": 600} {"train_loss": -9.848747253417969, "global_step": 100940, "epoch": 600} {"train_loss": -9.766449928283691, "global_step": 100941, "epoch": 600} {"train_loss": -9.85515022277832, "global_step": 100942, "epoch": 600} {"train_loss": -9.748722076416016, "global_step": 100943, "epoch": 600} {"train_loss": -9.74824047088623, "global_step": 100944, "epoch": 600} {"train_loss": -9.915494918823242, "global_step": 100945, "epoch": 600} {"train_loss": -9.29003620147705, "global_step": 100946, "epoch": 600} {"train_loss": -9.76951789855957, "global_step": 100947, "epoch": 600} {"train_loss": -9.572056770324707, "global_step": 100948, "epoch": 600} {"train_loss": -9.436498641967773, "global_step": 100949, "epoch": 600} {"train_loss": -9.61085319519043, "global_step": 100950, "epoch": 600} {"train_loss": -9.58951187133789, "global_step": 100951, "epoch": 600} {"train_loss": -9.538061141967773, "global_step": 100952, "epoch": 600} {"train_loss": -9.559168815612793, "global_step": 100953, "epoch": 600} {"train_loss": -9.742412567138672, "global_step": 100954, "epoch": 600} {"train_loss": -9.474828720092773, "global_step": 100955, "epoch": 600} {"train_loss": -9.786420822143555, "global_step": 100956, "epoch": 600} {"train_loss": -9.472222328186035, "global_step": 100957, "epoch": 600} {"train_loss": -9.847996711730957, "global_step": 100958, "epoch": 600} {"train_loss": -9.791362762451172, "global_step": 100959, "epoch": 600} {"train_loss": -9.680317878723145, "global_step": 100960, "epoch": 600} {"train_loss": -9.509452819824219, "global_step": 100961, "epoch": 600} {"train_loss": -9.848876953125, "global_step": 100962, "epoch": 600} {"train_loss": -9.714502334594727, "global_step": 100963, "epoch": 600} {"train_loss": -9.531457901000977, "global_step": 100964, "epoch": 600} {"train_loss": -9.46194076538086, "global_step": 100965, "epoch": 600} {"train_loss": -9.355567932128906, "global_step": 100966, "epoch": 600} {"train_loss": -9.682147911616735, "global_step": 100967, "epoch": 600, "train/sim_max_reward_0": 0.3522054999493143, "train/sim_max_reward_1": 0.9881817586253582, "train/sim_max_reward_2": 0.6303880554497321, "train/sim_max_reward_3": 0.6662650092352842, "train/sim_max_reward_4": 0.96392273770438, "train/sim_max_reward_5": 0.5623642323978444, "test/sim_max_reward_4400000": 0.24677777049544505, "test/sim_max_reward_4400001": 0.4595768049812558, "test/sim_max_reward_4400002": 0.06178782399342734, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 0.8063497117097552, "test/sim_max_reward_4400007": 0.8690145766305962, "test/sim_max_reward_4400008": 0.5596416276371099, "test/sim_max_reward_4400009": 0.38457224364740306, "test/sim_max_reward_4400010": 0.4496060718962145, "test/sim_max_reward_4400011": 0.8824503703751598, "test/sim_max_reward_4400012": 0.984865097403823, "test/sim_max_reward_4400013": 0.9857861259562859, "test/sim_max_reward_4400014": 0.5253398619236779, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.12466241082965675, "test/sim_max_reward_4400018": 0.8549918759224713, "test/sim_max_reward_4400019": 0.46465837486729045, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.6705458899297988, "test/sim_max_reward_4400022": 0.9791339006965581, "test/sim_max_reward_4400023": 1.0, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.6740327487539489, "test/sim_max_reward_4400026": 0.9698972056398667, "test/sim_max_reward_4400027": 0.47434094011668565, "test/sim_max_reward_4400028": 0.6959299018815316, "test/sim_max_reward_4400029": 0.5047509561920369, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.1747965011916499, "test/sim_max_reward_4400033": 0.16271188240470108, "test/sim_max_reward_4400034": 0.9707856459091243, "test/sim_max_reward_4400035": 0.31715140189094254, "test/sim_max_reward_4400036": 0.377312717610469, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9537569425564427, "test/sim_max_reward_4400042": 0.9929339477604823, "test/sim_max_reward_4400043": 0.9983363096466706, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.4243422483747976, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6938878822269855, "test/mean_score": 0.6082518910535866, "val_loss": 206778.453125, "train_action_mse_error": 1.388688087463379} {"train_loss": -9.564737319946289, "global_step": 100968, "epoch": 601} {"train_loss": -9.304557800292969, "global_step": 100969, "epoch": 601} {"train_loss": -9.295720100402832, "global_step": 100970, "epoch": 601} {"train_loss": -9.697101593017578, "global_step": 100971, "epoch": 601} {"train_loss": -9.094353675842285, "global_step": 100972, "epoch": 601} {"train_loss": -9.402263641357422, "global_step": 100973, "epoch": 601} {"train_loss": -9.051618576049805, "global_step": 100974, "epoch": 601} {"train_loss": -9.283371925354004, "global_step": 100975, "epoch": 601} {"train_loss": -9.237628936767578, "global_step": 100976, "epoch": 601} {"train_loss": -8.665647506713867, "global_step": 100977, "epoch": 601} {"train_loss": -9.267723083496094, "global_step": 100978, "epoch": 601} {"train_loss": -8.943733215332031, "global_step": 100979, "epoch": 601} {"train_loss": -9.230981826782227, "global_step": 100980, "epoch": 601} {"train_loss": -8.930107116699219, "global_step": 100981, "epoch": 601} {"train_loss": -9.587104797363281, "global_step": 100982, "epoch": 601} {"train_loss": -9.097402572631836, "global_step": 100983, "epoch": 601} {"train_loss": -9.3472900390625, "global_step": 100984, "epoch": 601} {"train_loss": -9.367364883422852, "global_step": 100985, "epoch": 601} {"train_loss": -9.187572479248047, "global_step": 100986, "epoch": 601} {"train_loss": -9.464472770690918, "global_step": 100987, "epoch": 601} {"train_loss": -9.262046813964844, "global_step": 100988, "epoch": 601} {"train_loss": -9.343539237976074, "global_step": 100989, "epoch": 601} {"train_loss": -9.6160306930542, "global_step": 100990, "epoch": 601} {"train_loss": -9.323124885559082, "global_step": 100991, "epoch": 601} {"train_loss": -9.524774551391602, "global_step": 100992, "epoch": 601} {"train_loss": -9.42703628540039, "global_step": 100993, "epoch": 601} {"train_loss": -9.611817359924316, "global_step": 100994, "epoch": 601} {"train_loss": -9.44603443145752, "global_step": 100995, "epoch": 601} {"train_loss": -9.509775161743164, "global_step": 100996, "epoch": 601} {"train_loss": -9.749759674072266, "global_step": 100997, "epoch": 601} {"train_loss": -9.635794639587402, "global_step": 100998, "epoch": 601} {"train_loss": -9.663097381591797, "global_step": 100999, "epoch": 601} {"train_loss": -9.58416748046875, "global_step": 101000, "epoch": 601} {"train_loss": -9.553871154785156, "global_step": 101001, "epoch": 601} {"train_loss": -9.645263671875, "global_step": 101002, "epoch": 601} {"train_loss": -9.639863967895508, "global_step": 101003, "epoch": 601} {"train_loss": -9.617209434509277, "global_step": 101004, "epoch": 601} {"train_loss": -9.900247573852539, "global_step": 101005, "epoch": 601} {"train_loss": -9.728462219238281, "global_step": 101006, "epoch": 601} {"train_loss": -9.808309555053711, "global_step": 101007, "epoch": 601} {"train_loss": -9.624855041503906, "global_step": 101008, "epoch": 601} {"train_loss": -9.820638656616211, "global_step": 101009, "epoch": 601} {"train_loss": -9.658571243286133, "global_step": 101010, "epoch": 601} {"train_loss": -9.677331924438477, "global_step": 101011, "epoch": 601} {"train_loss": -9.753978729248047, "global_step": 101012, "epoch": 601} {"train_loss": -9.77321720123291, "global_step": 101013, "epoch": 601} {"train_loss": -9.737425804138184, "global_step": 101014, "epoch": 601} {"train_loss": -9.928199768066406, "global_step": 101015, "epoch": 601} {"train_loss": -9.912938117980957, "global_step": 101016, "epoch": 601} {"train_loss": -9.935157775878906, "global_step": 101017, "epoch": 601} {"train_loss": -9.486285209655762, "global_step": 101018, "epoch": 601} {"train_loss": -9.906667709350586, "global_step": 101019, "epoch": 601} {"train_loss": -9.382389068603516, "global_step": 101020, "epoch": 601} {"train_loss": -9.981038093566895, "global_step": 101021, "epoch": 601} {"train_loss": -9.87370491027832, "global_step": 101022, "epoch": 601} {"train_loss": -9.519783020019531, "global_step": 101023, "epoch": 601} {"train_loss": -9.76137638092041, "global_step": 101024, "epoch": 601} {"train_loss": -10.052852630615234, "global_step": 101025, "epoch": 601} {"train_loss": -9.238545417785645, "global_step": 101026, "epoch": 601} {"train_loss": -9.279644012451172, "global_step": 101027, "epoch": 601} {"train_loss": -9.420989990234375, "global_step": 101028, "epoch": 601} {"train_loss": -8.721900939941406, "global_step": 101029, "epoch": 601} {"train_loss": -9.934810638427734, "global_step": 101030, "epoch": 601} {"train_loss": -9.277202606201172, "global_step": 101031, "epoch": 601} {"train_loss": -9.738992691040039, "global_step": 101032, "epoch": 601} {"train_loss": -9.528040885925293, "global_step": 101033, "epoch": 601} {"train_loss": -9.509232521057129, "global_step": 101034, "epoch": 601} {"train_loss": -9.412102699279785, "global_step": 101035, "epoch": 601} {"train_loss": -9.265751838684082, "global_step": 101036, "epoch": 601} {"train_loss": -9.554647445678711, "global_step": 101037, "epoch": 601} {"train_loss": -9.722970008850098, "global_step": 101038, "epoch": 601} {"train_loss": -9.105646133422852, "global_step": 101039, "epoch": 601} {"train_loss": -9.767470359802246, "global_step": 101040, "epoch": 601} {"train_loss": -9.176698684692383, "global_step": 101041, "epoch": 601} {"train_loss": -9.498492240905762, "global_step": 101042, "epoch": 601} {"train_loss": -9.344892501831055, "global_step": 101043, "epoch": 601} {"train_loss": -9.439290046691895, "global_step": 101044, "epoch": 601} {"train_loss": -9.671022415161133, "global_step": 101045, "epoch": 601} {"train_loss": -9.795053482055664, "global_step": 101046, "epoch": 601} {"train_loss": -9.341631889343262, "global_step": 101047, "epoch": 601} {"train_loss": -9.858513832092285, "global_step": 101048, "epoch": 601} {"train_loss": -9.788004875183105, "global_step": 101049, "epoch": 601} {"train_loss": -9.808113098144531, "global_step": 101050, "epoch": 601} {"train_loss": -9.689799308776855, "global_step": 101051, "epoch": 601} {"train_loss": -9.807358741760254, "global_step": 101052, "epoch": 601} {"train_loss": -9.822651863098145, "global_step": 101053, "epoch": 601} {"train_loss": -9.700782775878906, "global_step": 101054, "epoch": 601} {"train_loss": -9.61468505859375, "global_step": 101055, "epoch": 601} {"train_loss": -9.710406303405762, "global_step": 101056, "epoch": 601} {"train_loss": -9.390470504760742, "global_step": 101057, "epoch": 601} {"train_loss": -9.749261856079102, "global_step": 101058, "epoch": 601} {"train_loss": -9.496235847473145, "global_step": 101059, "epoch": 601} {"train_loss": -9.857748985290527, "global_step": 101060, "epoch": 601} {"train_loss": -9.639286041259766, "global_step": 101061, "epoch": 601} {"train_loss": -9.989099502563477, "global_step": 101062, "epoch": 601} {"train_loss": -9.73259162902832, "global_step": 101063, "epoch": 601} {"train_loss": -9.913612365722656, "global_step": 101064, "epoch": 601} {"train_loss": -9.774274826049805, "global_step": 101065, "epoch": 601} {"train_loss": -9.805904388427734, "global_step": 101066, "epoch": 601} {"train_loss": -9.729949951171875, "global_step": 101067, "epoch": 601} {"train_loss": -9.754510879516602, "global_step": 101068, "epoch": 601} {"train_loss": -9.549031257629395, "global_step": 101069, "epoch": 601} {"train_loss": -9.836980819702148, "global_step": 101070, "epoch": 601} {"train_loss": -9.487530708312988, "global_step": 101071, "epoch": 601} {"train_loss": -9.712906837463379, "global_step": 101072, "epoch": 601} {"train_loss": -9.669240951538086, "global_step": 101073, "epoch": 601} {"train_loss": -9.779036521911621, "global_step": 101074, "epoch": 601} {"train_loss": -9.684019088745117, "global_step": 101075, "epoch": 601} {"train_loss": -9.899322509765625, "global_step": 101076, "epoch": 601} {"train_loss": -9.573833465576172, "global_step": 101077, "epoch": 601} {"train_loss": -9.494991302490234, "global_step": 101078, "epoch": 601} {"train_loss": -9.518360137939453, "global_step": 101079, "epoch": 601} {"train_loss": -9.89941120147705, "global_step": 101080, "epoch": 601} {"train_loss": -9.492852210998535, "global_step": 101081, "epoch": 601} {"train_loss": -9.34842586517334, "global_step": 101082, "epoch": 601} {"train_loss": -9.474567413330078, "global_step": 101083, "epoch": 601} {"train_loss": -9.692289352416992, "global_step": 101084, "epoch": 601} {"train_loss": -9.31831169128418, "global_step": 101085, "epoch": 601} {"train_loss": -9.75599479675293, "global_step": 101086, "epoch": 601} {"train_loss": -9.283082962036133, "global_step": 101087, "epoch": 601} {"train_loss": -9.505327224731445, "global_step": 101088, "epoch": 601} {"train_loss": -9.84400463104248, "global_step": 101089, "epoch": 601} {"train_loss": -9.54245376586914, "global_step": 101090, "epoch": 601} {"train_loss": -9.84518814086914, "global_step": 101091, "epoch": 601} {"train_loss": -9.674410820007324, "global_step": 101092, "epoch": 601} {"train_loss": -9.474696159362793, "global_step": 101093, "epoch": 601} {"train_loss": -9.620538711547852, "global_step": 101094, "epoch": 601} {"train_loss": -9.701369285583496, "global_step": 101095, "epoch": 601} {"train_loss": -9.806771278381348, "global_step": 101096, "epoch": 601} {"train_loss": -9.727109909057617, "global_step": 101097, "epoch": 601} {"train_loss": -9.57138442993164, "global_step": 101098, "epoch": 601} {"train_loss": -9.906137466430664, "global_step": 101099, "epoch": 601} {"train_loss": -9.88032054901123, "global_step": 101100, "epoch": 601} {"train_loss": -9.294862747192383, "global_step": 101101, "epoch": 601} {"train_loss": -9.842082023620605, "global_step": 101102, "epoch": 601} {"train_loss": -9.639486312866211, "global_step": 101103, "epoch": 601} {"train_loss": -9.564501762390137, "global_step": 101104, "epoch": 601} {"train_loss": -9.814288139343262, "global_step": 101105, "epoch": 601} {"train_loss": -9.273584365844727, "global_step": 101106, "epoch": 601} {"train_loss": -9.275678634643555, "global_step": 101107, "epoch": 601} {"train_loss": -9.405345916748047, "global_step": 101108, "epoch": 601} {"train_loss": -9.627284049987793, "global_step": 101109, "epoch": 601} {"train_loss": -9.817560195922852, "global_step": 101110, "epoch": 601} {"train_loss": -9.499760627746582, "global_step": 101111, "epoch": 601} {"train_loss": -9.752401351928711, "global_step": 101112, "epoch": 601} {"train_loss": -9.772001266479492, "global_step": 101113, "epoch": 601} {"train_loss": -9.735710144042969, "global_step": 101114, "epoch": 601} {"train_loss": -9.999174118041992, "global_step": 101115, "epoch": 601} {"train_loss": -9.809064865112305, "global_step": 101116, "epoch": 601} {"train_loss": -9.87962532043457, "global_step": 101117, "epoch": 601} {"train_loss": -9.843910217285156, "global_step": 101118, "epoch": 601} {"train_loss": -9.830399513244629, "global_step": 101119, "epoch": 601} {"train_loss": -9.748628616333008, "global_step": 101120, "epoch": 601} {"train_loss": -10.005731582641602, "global_step": 101121, "epoch": 601} {"train_loss": -9.995401382446289, "global_step": 101122, "epoch": 601} {"train_loss": -9.934759140014648, "global_step": 101123, "epoch": 601} {"train_loss": -9.659745216369629, "global_step": 101124, "epoch": 601} {"train_loss": -9.522533416748047, "global_step": 101125, "epoch": 601} {"train_loss": -9.82325553894043, "global_step": 101126, "epoch": 601} {"train_loss": -10.106003761291504, "global_step": 101127, "epoch": 601} {"train_loss": -9.756711959838867, "global_step": 101128, "epoch": 601} {"train_loss": -10.155303001403809, "global_step": 101129, "epoch": 601} {"train_loss": -9.695438385009766, "global_step": 101130, "epoch": 601} {"train_loss": -9.645650863647461, "global_step": 101131, "epoch": 601} {"train_loss": -9.356155395507812, "global_step": 101132, "epoch": 601} {"train_loss": -9.884929656982422, "global_step": 101133, "epoch": 601} {"train_loss": -8.975534439086914, "global_step": 101134, "epoch": 601} {"train_loss": -9.599382797876993, "global_step": 101135, "epoch": 601, "val_loss": 204683.359375} {"train_loss": -9.31808853149414, "global_step": 101136, "epoch": 602} {"train_loss": -9.215361595153809, "global_step": 101137, "epoch": 602} {"train_loss": -9.30715560913086, "global_step": 101138, "epoch": 602} {"train_loss": -9.608720779418945, "global_step": 101139, "epoch": 602} {"train_loss": -9.362166404724121, "global_step": 101140, "epoch": 602} {"train_loss": -9.61583423614502, "global_step": 101141, "epoch": 602} {"train_loss": -9.480978012084961, "global_step": 101142, "epoch": 602} {"train_loss": -9.566829681396484, "global_step": 101143, "epoch": 602} {"train_loss": -9.324058532714844, "global_step": 101144, "epoch": 602} {"train_loss": -9.61489486694336, "global_step": 101145, "epoch": 602} {"train_loss": -9.508810043334961, "global_step": 101146, "epoch": 602} {"train_loss": -9.121648788452148, "global_step": 101147, "epoch": 602} {"train_loss": -9.293725967407227, "global_step": 101148, "epoch": 602} {"train_loss": -9.200675964355469, "global_step": 101149, "epoch": 602} {"train_loss": -9.618378639221191, "global_step": 101150, "epoch": 602} {"train_loss": -9.34458065032959, "global_step": 101151, "epoch": 602} {"train_loss": -9.429758071899414, "global_step": 101152, "epoch": 602} {"train_loss": -9.663066864013672, "global_step": 101153, "epoch": 602} {"train_loss": -9.519668579101562, "global_step": 101154, "epoch": 602} {"train_loss": -9.640460014343262, "global_step": 101155, "epoch": 602} {"train_loss": -9.3609037399292, "global_step": 101156, "epoch": 602} {"train_loss": -9.5859375, "global_step": 101157, "epoch": 602} {"train_loss": -9.207944869995117, "global_step": 101158, "epoch": 602} {"train_loss": -9.621322631835938, "global_step": 101159, "epoch": 602} {"train_loss": -9.596044540405273, "global_step": 101160, "epoch": 602} {"train_loss": -9.378493309020996, "global_step": 101161, "epoch": 602} {"train_loss": -9.72018051147461, "global_step": 101162, "epoch": 602} {"train_loss": -9.69485855102539, "global_step": 101163, "epoch": 602} {"train_loss": -9.790107727050781, "global_step": 101164, "epoch": 602} {"train_loss": -9.541841506958008, "global_step": 101165, "epoch": 602} {"train_loss": -9.523225784301758, "global_step": 101166, "epoch": 602} {"train_loss": -9.651047706604004, "global_step": 101167, "epoch": 602} {"train_loss": -9.595767974853516, "global_step": 101168, "epoch": 602} {"train_loss": -9.884805679321289, "global_step": 101169, "epoch": 602} {"train_loss": -9.493242263793945, "global_step": 101170, "epoch": 602} {"train_loss": -9.791768074035645, "global_step": 101171, "epoch": 602} {"train_loss": -9.860393524169922, "global_step": 101172, "epoch": 602} {"train_loss": -9.708039283752441, "global_step": 101173, "epoch": 602} {"train_loss": -9.792760848999023, "global_step": 101174, "epoch": 602} {"train_loss": -9.750679016113281, "global_step": 101175, "epoch": 602} {"train_loss": -9.760265350341797, "global_step": 101176, "epoch": 602} {"train_loss": -9.88230037689209, "global_step": 101177, "epoch": 602} {"train_loss": -9.811986923217773, "global_step": 101178, "epoch": 602} {"train_loss": -9.972973823547363, "global_step": 101179, "epoch": 602} {"train_loss": -9.673747062683105, "global_step": 101180, "epoch": 602} {"train_loss": -9.847423553466797, "global_step": 101181, "epoch": 602} {"train_loss": -9.58591365814209, "global_step": 101182, "epoch": 602} {"train_loss": -9.908350944519043, "global_step": 101183, "epoch": 602} {"train_loss": -10.071077346801758, "global_step": 101184, "epoch": 602} {"train_loss": -9.919693946838379, "global_step": 101185, "epoch": 602} {"train_loss": -9.961175918579102, "global_step": 101186, "epoch": 602} {"train_loss": -9.537649154663086, "global_step": 101187, "epoch": 602} {"train_loss": -9.88956069946289, "global_step": 101188, "epoch": 602} {"train_loss": -9.771242141723633, "global_step": 101189, "epoch": 602} {"train_loss": -10.015945434570312, "global_step": 101190, "epoch": 602} {"train_loss": -9.746772766113281, "global_step": 101191, "epoch": 602} {"train_loss": -9.36623764038086, "global_step": 101192, "epoch": 602} {"train_loss": -9.697957992553711, "global_step": 101193, "epoch": 602} {"train_loss": -9.371040344238281, "global_step": 101194, "epoch": 602} {"train_loss": -9.98080825805664, "global_step": 101195, "epoch": 602} {"train_loss": -9.586770057678223, "global_step": 101196, "epoch": 602} {"train_loss": -9.87304973602295, "global_step": 101197, "epoch": 602} {"train_loss": -9.792306900024414, "global_step": 101198, "epoch": 602} {"train_loss": -9.41308879852295, "global_step": 101199, "epoch": 602} {"train_loss": -9.911779403686523, "global_step": 101200, "epoch": 602} {"train_loss": -9.58755111694336, "global_step": 101201, "epoch": 602} {"train_loss": -9.480230331420898, "global_step": 101202, "epoch": 602} {"train_loss": -9.605988502502441, "global_step": 101203, "epoch": 602} {"train_loss": -9.445364952087402, "global_step": 101204, "epoch": 602} {"train_loss": -9.5596342086792, "global_step": 101205, "epoch": 602} {"train_loss": -9.779403686523438, "global_step": 101206, "epoch": 602} {"train_loss": -9.567142486572266, "global_step": 101207, "epoch": 602} {"train_loss": -9.593111991882324, "global_step": 101208, "epoch": 602} {"train_loss": -9.794798851013184, "global_step": 101209, "epoch": 602} {"train_loss": -9.657548904418945, "global_step": 101210, "epoch": 602} {"train_loss": -9.870023727416992, "global_step": 101211, "epoch": 602} {"train_loss": -9.818984031677246, "global_step": 101212, "epoch": 602} {"train_loss": -9.897096633911133, "global_step": 101213, "epoch": 602} {"train_loss": -9.781230926513672, "global_step": 101214, "epoch": 602} {"train_loss": -9.881650924682617, "global_step": 101215, "epoch": 602} {"train_loss": -9.733892440795898, "global_step": 101216, "epoch": 602} {"train_loss": -9.46939754486084, "global_step": 101217, "epoch": 602} {"train_loss": -9.518808364868164, "global_step": 101218, "epoch": 602} {"train_loss": -9.918564796447754, "global_step": 101219, "epoch": 602} {"train_loss": -9.677416801452637, "global_step": 101220, "epoch": 602} {"train_loss": -9.64034652709961, "global_step": 101221, "epoch": 602} {"train_loss": -9.84738540649414, "global_step": 101222, "epoch": 602} {"train_loss": -9.792621612548828, "global_step": 101223, "epoch": 602} {"train_loss": -9.51137924194336, "global_step": 101224, "epoch": 602} {"train_loss": -9.768096923828125, "global_step": 101225, "epoch": 602} {"train_loss": -9.84642219543457, "global_step": 101226, "epoch": 602} {"train_loss": -9.720490455627441, "global_step": 101227, "epoch": 602} {"train_loss": -9.838054656982422, "global_step": 101228, "epoch": 602} {"train_loss": -9.897653579711914, "global_step": 101229, "epoch": 602} {"train_loss": -9.577367782592773, "global_step": 101230, "epoch": 602} {"train_loss": -9.741554260253906, "global_step": 101231, "epoch": 602} {"train_loss": -9.905394554138184, "global_step": 101232, "epoch": 602} {"train_loss": -9.843551635742188, "global_step": 101233, "epoch": 602} {"train_loss": -9.942853927612305, "global_step": 101234, "epoch": 602} {"train_loss": -9.971940994262695, "global_step": 101235, "epoch": 602} {"train_loss": -10.10002326965332, "global_step": 101236, "epoch": 602} {"train_loss": -9.93450927734375, "global_step": 101237, "epoch": 602} {"train_loss": -9.76522159576416, "global_step": 101238, "epoch": 602} {"train_loss": -9.951007843017578, "global_step": 101239, "epoch": 602} {"train_loss": -9.676713943481445, "global_step": 101240, "epoch": 602} {"train_loss": -10.143570899963379, "global_step": 101241, "epoch": 602} {"train_loss": -9.941000938415527, "global_step": 101242, "epoch": 602} {"train_loss": -9.92237377166748, "global_step": 101243, "epoch": 602} {"train_loss": -9.9194917678833, "global_step": 101244, "epoch": 602} {"train_loss": -9.352865219116211, "global_step": 101245, "epoch": 602} {"train_loss": -9.478559494018555, "global_step": 101246, "epoch": 602} {"train_loss": -9.611274719238281, "global_step": 101247, "epoch": 602} {"train_loss": -9.381138801574707, "global_step": 101248, "epoch": 602} {"train_loss": -9.7532320022583, "global_step": 101249, "epoch": 602} {"train_loss": -9.78518295288086, "global_step": 101250, "epoch": 602} {"train_loss": -9.391538619995117, "global_step": 101251, "epoch": 602} {"train_loss": -9.705007553100586, "global_step": 101252, "epoch": 602} {"train_loss": -9.609621047973633, "global_step": 101253, "epoch": 602} {"train_loss": -9.5219087600708, "global_step": 101254, "epoch": 602} {"train_loss": -9.784858703613281, "global_step": 101255, "epoch": 602} {"train_loss": -9.474620819091797, "global_step": 101256, "epoch": 602} {"train_loss": -9.636249542236328, "global_step": 101257, "epoch": 602} {"train_loss": -9.827753067016602, "global_step": 101258, "epoch": 602} {"train_loss": -9.471774101257324, "global_step": 101259, "epoch": 602} {"train_loss": -9.856657028198242, "global_step": 101260, "epoch": 602} {"train_loss": -9.735363960266113, "global_step": 101261, "epoch": 602} {"train_loss": -9.658788681030273, "global_step": 101262, "epoch": 602} {"train_loss": -9.758024215698242, "global_step": 101263, "epoch": 602} {"train_loss": -9.539816856384277, "global_step": 101264, "epoch": 602} {"train_loss": -9.687515258789062, "global_step": 101265, "epoch": 602} {"train_loss": -9.442695617675781, "global_step": 101266, "epoch": 602} {"train_loss": -9.718667984008789, "global_step": 101267, "epoch": 602} {"train_loss": -9.751789093017578, "global_step": 101268, "epoch": 602} {"train_loss": -9.664344787597656, "global_step": 101269, "epoch": 602} {"train_loss": -9.830011367797852, "global_step": 101270, "epoch": 602} {"train_loss": -9.774717330932617, "global_step": 101271, "epoch": 602} {"train_loss": -9.748617172241211, "global_step": 101272, "epoch": 602} {"train_loss": -9.673307418823242, "global_step": 101273, "epoch": 602} {"train_loss": -9.65211296081543, "global_step": 101274, "epoch": 602} {"train_loss": -9.849842071533203, "global_step": 101275, "epoch": 602} {"train_loss": -9.78404426574707, "global_step": 101276, "epoch": 602} {"train_loss": -9.740224838256836, "global_step": 101277, "epoch": 602} {"train_loss": -9.777652740478516, "global_step": 101278, "epoch": 602} {"train_loss": -9.710741996765137, "global_step": 101279, "epoch": 602} {"train_loss": -9.265274047851562, "global_step": 101280, "epoch": 602} {"train_loss": -9.557991027832031, "global_step": 101281, "epoch": 602} {"train_loss": -9.82625961303711, "global_step": 101282, "epoch": 602} {"train_loss": -9.658387184143066, "global_step": 101283, "epoch": 602} {"train_loss": -9.952093124389648, "global_step": 101284, "epoch": 602} {"train_loss": -9.869020462036133, "global_step": 101285, "epoch": 602} {"train_loss": -9.84044075012207, "global_step": 101286, "epoch": 602} {"train_loss": -9.82647705078125, "global_step": 101287, "epoch": 602} {"train_loss": -9.393433570861816, "global_step": 101288, "epoch": 602} {"train_loss": -9.925012588500977, "global_step": 101289, "epoch": 602} {"train_loss": -9.901002883911133, "global_step": 101290, "epoch": 602} {"train_loss": -10.052351951599121, "global_step": 101291, "epoch": 602} {"train_loss": -10.003780364990234, "global_step": 101292, "epoch": 602} {"train_loss": -9.856300354003906, "global_step": 101293, "epoch": 602} {"train_loss": -9.88377571105957, "global_step": 101294, "epoch": 602} {"train_loss": -9.827451705932617, "global_step": 101295, "epoch": 602} {"train_loss": -9.646064758300781, "global_step": 101296, "epoch": 602} {"train_loss": -9.71794605255127, "global_step": 101297, "epoch": 602} {"train_loss": -9.780384063720703, "global_step": 101298, "epoch": 602} {"train_loss": -9.749871253967285, "global_step": 101299, "epoch": 602} {"train_loss": -9.769177436828613, "global_step": 101300, "epoch": 602} {"train_loss": -9.868108749389648, "global_step": 101301, "epoch": 602} {"train_loss": -9.819398880004883, "global_step": 101302, "epoch": 602} {"train_loss": -9.688129583994547, "global_step": 101303, "epoch": 602, "val_loss": 205771.390625} {"train_loss": -8.679975509643555, "global_step": 101304, "epoch": 603} {"train_loss": -9.29216194152832, "global_step": 101305, "epoch": 603} {"train_loss": -8.166818618774414, "global_step": 101306, "epoch": 603} {"train_loss": -8.62911605834961, "global_step": 101307, "epoch": 603} {"train_loss": -9.254167556762695, "global_step": 101308, "epoch": 603} {"train_loss": -8.923900604248047, "global_step": 101309, "epoch": 603} {"train_loss": -9.523876190185547, "global_step": 101310, "epoch": 603} {"train_loss": -8.775581359863281, "global_step": 101311, "epoch": 603} {"train_loss": -9.12458610534668, "global_step": 101312, "epoch": 603} {"train_loss": -8.925307273864746, "global_step": 101313, "epoch": 603} {"train_loss": -9.369632720947266, "global_step": 101314, "epoch": 603} {"train_loss": -8.993148803710938, "global_step": 101315, "epoch": 603} {"train_loss": -8.83962345123291, "global_step": 101316, "epoch": 603} {"train_loss": -9.485713005065918, "global_step": 101317, "epoch": 603} {"train_loss": -9.045479774475098, "global_step": 101318, "epoch": 603} {"train_loss": -9.209634780883789, "global_step": 101319, "epoch": 603} {"train_loss": -8.900243759155273, "global_step": 101320, "epoch": 603} {"train_loss": -8.905323028564453, "global_step": 101321, "epoch": 603} {"train_loss": -9.311125755310059, "global_step": 101322, "epoch": 603} {"train_loss": -8.94692325592041, "global_step": 101323, "epoch": 603} {"train_loss": -9.551727294921875, "global_step": 101324, "epoch": 603} {"train_loss": -9.590517044067383, "global_step": 101325, "epoch": 603} {"train_loss": -9.242897033691406, "global_step": 101326, "epoch": 603} {"train_loss": -9.475988388061523, "global_step": 101327, "epoch": 603} {"train_loss": -9.719156265258789, "global_step": 101328, "epoch": 603} {"train_loss": -9.453239440917969, "global_step": 101329, "epoch": 603} {"train_loss": -9.44874382019043, "global_step": 101330, "epoch": 603} {"train_loss": -9.390851974487305, "global_step": 101331, "epoch": 603} {"train_loss": -9.444245338439941, "global_step": 101332, "epoch": 603} {"train_loss": -9.722136497497559, "global_step": 101333, "epoch": 603} {"train_loss": -9.497169494628906, "global_step": 101334, "epoch": 603} {"train_loss": -9.665664672851562, "global_step": 101335, "epoch": 603} {"train_loss": -9.452704429626465, "global_step": 101336, "epoch": 603} {"train_loss": -9.597843170166016, "global_step": 101337, "epoch": 603} {"train_loss": -9.559133529663086, "global_step": 101338, "epoch": 603} {"train_loss": -9.692682266235352, "global_step": 101339, "epoch": 603} {"train_loss": -9.579414367675781, "global_step": 101340, "epoch": 603} {"train_loss": -9.808639526367188, "global_step": 101341, "epoch": 603} {"train_loss": -9.753236770629883, "global_step": 101342, "epoch": 603} {"train_loss": -9.799514770507812, "global_step": 101343, "epoch": 603} {"train_loss": -9.768136978149414, "global_step": 101344, "epoch": 603} {"train_loss": -9.744377136230469, "global_step": 101345, "epoch": 603} {"train_loss": -9.935384750366211, "global_step": 101346, "epoch": 603} {"train_loss": -9.829225540161133, "global_step": 101347, "epoch": 603} {"train_loss": -9.933109283447266, "global_step": 101348, "epoch": 603} {"train_loss": -9.866755485534668, "global_step": 101349, "epoch": 603} {"train_loss": -9.881217956542969, "global_step": 101350, "epoch": 603} {"train_loss": -9.933341026306152, "global_step": 101351, "epoch": 603} {"train_loss": -10.069368362426758, "global_step": 101352, "epoch": 603} {"train_loss": -9.804954528808594, "global_step": 101353, "epoch": 603} {"train_loss": -9.877949714660645, "global_step": 101354, "epoch": 603} {"train_loss": -9.995460510253906, "global_step": 101355, "epoch": 603} {"train_loss": -9.870948791503906, "global_step": 101356, "epoch": 603} {"train_loss": -10.224811553955078, "global_step": 101357, "epoch": 603} {"train_loss": -9.965145111083984, "global_step": 101358, "epoch": 603} {"train_loss": -9.838674545288086, "global_step": 101359, "epoch": 603} {"train_loss": -10.237642288208008, "global_step": 101360, "epoch": 603} {"train_loss": -9.969029426574707, "global_step": 101361, "epoch": 603} {"train_loss": -9.981435775756836, "global_step": 101362, "epoch": 603} {"train_loss": -9.68001937866211, "global_step": 101363, "epoch": 603} {"train_loss": -9.494138717651367, "global_step": 101364, "epoch": 603} {"train_loss": -9.922017097473145, "global_step": 101365, "epoch": 603} {"train_loss": -9.906347274780273, "global_step": 101366, "epoch": 603} {"train_loss": -9.644440650939941, "global_step": 101367, "epoch": 603} {"train_loss": -9.850138664245605, "global_step": 101368, "epoch": 603} {"train_loss": -9.924436569213867, "global_step": 101369, "epoch": 603} {"train_loss": -9.850793838500977, "global_step": 101370, "epoch": 603} {"train_loss": -9.862658500671387, "global_step": 101371, "epoch": 603} {"train_loss": -9.816341400146484, "global_step": 101372, "epoch": 603} {"train_loss": -9.647768020629883, "global_step": 101373, "epoch": 603} {"train_loss": -9.959169387817383, "global_step": 101374, "epoch": 603} {"train_loss": -9.77816390991211, "global_step": 101375, "epoch": 603} {"train_loss": -9.926942825317383, "global_step": 101376, "epoch": 603} {"train_loss": -10.004491806030273, "global_step": 101377, "epoch": 603} {"train_loss": -10.05322551727295, "global_step": 101378, "epoch": 603} {"train_loss": -9.222146987915039, "global_step": 101379, "epoch": 603} {"train_loss": -9.68073844909668, "global_step": 101380, "epoch": 603} {"train_loss": -9.483011245727539, "global_step": 101381, "epoch": 603} {"train_loss": -9.541343688964844, "global_step": 101382, "epoch": 603} {"train_loss": -9.854455947875977, "global_step": 101383, "epoch": 603} {"train_loss": -9.574909210205078, "global_step": 101384, "epoch": 603} {"train_loss": -9.505361557006836, "global_step": 101385, "epoch": 603} {"train_loss": -9.433342933654785, "global_step": 101386, "epoch": 603} {"train_loss": -9.815092086791992, "global_step": 101387, "epoch": 603} {"train_loss": -9.6298189163208, "global_step": 101388, "epoch": 603} {"train_loss": -9.959966659545898, "global_step": 101389, "epoch": 603} {"train_loss": -9.308293342590332, "global_step": 101390, "epoch": 603} {"train_loss": -9.634328842163086, "global_step": 101391, "epoch": 603} {"train_loss": -9.482820510864258, "global_step": 101392, "epoch": 603} {"train_loss": -9.440165519714355, "global_step": 101393, "epoch": 603} {"train_loss": -9.546016693115234, "global_step": 101394, "epoch": 603} {"train_loss": -9.603912353515625, "global_step": 101395, "epoch": 603} {"train_loss": -9.229927062988281, "global_step": 101396, "epoch": 603} {"train_loss": -9.564863204956055, "global_step": 101397, "epoch": 603} {"train_loss": -9.567024230957031, "global_step": 101398, "epoch": 603} {"train_loss": -9.128480911254883, "global_step": 101399, "epoch": 603} {"train_loss": -9.508988380432129, "global_step": 101400, "epoch": 603} {"train_loss": -9.512439727783203, "global_step": 101401, "epoch": 603} {"train_loss": -9.645700454711914, "global_step": 101402, "epoch": 603} {"train_loss": -9.521302223205566, "global_step": 101403, "epoch": 603} {"train_loss": -9.571712493896484, "global_step": 101404, "epoch": 603} {"train_loss": -9.387142181396484, "global_step": 101405, "epoch": 603} {"train_loss": -9.38559341430664, "global_step": 101406, "epoch": 603} {"train_loss": -9.481550216674805, "global_step": 101407, "epoch": 603} {"train_loss": -9.375962257385254, "global_step": 101408, "epoch": 603} {"train_loss": -9.67912483215332, "global_step": 101409, "epoch": 603} {"train_loss": -9.763620376586914, "global_step": 101410, "epoch": 603} {"train_loss": -9.590435981750488, "global_step": 101411, "epoch": 603} {"train_loss": -9.527267456054688, "global_step": 101412, "epoch": 603} {"train_loss": -9.761699676513672, "global_step": 101413, "epoch": 603} {"train_loss": -9.641240119934082, "global_step": 101414, "epoch": 603} {"train_loss": -9.757933616638184, "global_step": 101415, "epoch": 603} {"train_loss": -9.842288970947266, "global_step": 101416, "epoch": 603} {"train_loss": -9.800207138061523, "global_step": 101417, "epoch": 603} {"train_loss": -9.989230155944824, "global_step": 101418, "epoch": 603} {"train_loss": -9.805717468261719, "global_step": 101419, "epoch": 603} {"train_loss": -9.842728614807129, "global_step": 101420, "epoch": 603} {"train_loss": -9.941682815551758, "global_step": 101421, "epoch": 603} {"train_loss": -9.703664779663086, "global_step": 101422, "epoch": 603} {"train_loss": -9.988862037658691, "global_step": 101423, "epoch": 603} {"train_loss": -9.549240112304688, "global_step": 101424, "epoch": 603} {"train_loss": -9.954130172729492, "global_step": 101425, "epoch": 603} {"train_loss": -9.960359573364258, "global_step": 101426, "epoch": 603} {"train_loss": -9.873297691345215, "global_step": 101427, "epoch": 603} {"train_loss": -9.753141403198242, "global_step": 101428, "epoch": 603} {"train_loss": -9.730695724487305, "global_step": 101429, "epoch": 603} {"train_loss": -9.553348541259766, "global_step": 101430, "epoch": 603} {"train_loss": -9.563621520996094, "global_step": 101431, "epoch": 603} {"train_loss": -9.969746589660645, "global_step": 101432, "epoch": 603} {"train_loss": -9.425012588500977, "global_step": 101433, "epoch": 603} {"train_loss": -9.980681419372559, "global_step": 101434, "epoch": 603} {"train_loss": -9.873129844665527, "global_step": 101435, "epoch": 603} {"train_loss": -9.858827590942383, "global_step": 101436, "epoch": 603} {"train_loss": -9.813106536865234, "global_step": 101437, "epoch": 603} {"train_loss": -9.660772323608398, "global_step": 101438, "epoch": 603} {"train_loss": -9.973901748657227, "global_step": 101439, "epoch": 603} {"train_loss": -9.91917610168457, "global_step": 101440, "epoch": 603} {"train_loss": -9.86479377746582, "global_step": 101441, "epoch": 603} {"train_loss": -9.870429039001465, "global_step": 101442, "epoch": 603} {"train_loss": -9.762534141540527, "global_step": 101443, "epoch": 603} {"train_loss": -9.646284103393555, "global_step": 101444, "epoch": 603} {"train_loss": -9.831440925598145, "global_step": 101445, "epoch": 603} {"train_loss": -9.365226745605469, "global_step": 101446, "epoch": 603} {"train_loss": -9.715291023254395, "global_step": 101447, "epoch": 603} {"train_loss": -9.622065544128418, "global_step": 101448, "epoch": 603} {"train_loss": -9.115692138671875, "global_step": 101449, "epoch": 603} {"train_loss": -9.826916694641113, "global_step": 101450, "epoch": 603} {"train_loss": -9.560142517089844, "global_step": 101451, "epoch": 603} {"train_loss": -9.678932189941406, "global_step": 101452, "epoch": 603} {"train_loss": -9.501689910888672, "global_step": 101453, "epoch": 603} {"train_loss": -9.565128326416016, "global_step": 101454, "epoch": 603} {"train_loss": -9.909374237060547, "global_step": 101455, "epoch": 603} {"train_loss": -9.649507522583008, "global_step": 101456, "epoch": 603} {"train_loss": -9.736095428466797, "global_step": 101457, "epoch": 603} {"train_loss": -9.625608444213867, "global_step": 101458, "epoch": 603} {"train_loss": -9.544515609741211, "global_step": 101459, "epoch": 603} {"train_loss": -9.652928352355957, "global_step": 101460, "epoch": 603} {"train_loss": -9.218378067016602, "global_step": 101461, "epoch": 603} {"train_loss": -9.672683715820312, "global_step": 101462, "epoch": 603} {"train_loss": -9.468622207641602, "global_step": 101463, "epoch": 603} {"train_loss": -9.617691040039062, "global_step": 101464, "epoch": 603} {"train_loss": -9.511205673217773, "global_step": 101465, "epoch": 603} {"train_loss": -9.650206565856934, "global_step": 101466, "epoch": 603} {"train_loss": -9.365355491638184, "global_step": 101467, "epoch": 603} {"train_loss": -9.949978828430176, "global_step": 101468, "epoch": 603} {"train_loss": -9.555170059204102, "global_step": 101469, "epoch": 603} {"train_loss": -9.599359512329102, "global_step": 101470, "epoch": 603} {"train_loss": -9.6120685509273, "global_step": 101471, "epoch": 603, "val_loss": 205995.265625} {"train_loss": -9.57461929321289, "global_step": 101472, "epoch": 604} {"train_loss": -9.561922073364258, "global_step": 101473, "epoch": 604} {"train_loss": -9.797553062438965, "global_step": 101474, "epoch": 604} {"train_loss": -9.769705772399902, "global_step": 101475, "epoch": 604} {"train_loss": -9.562313079833984, "global_step": 101476, "epoch": 604} {"train_loss": -9.676311492919922, "global_step": 101477, "epoch": 604} {"train_loss": -9.5709810256958, "global_step": 101478, "epoch": 604} {"train_loss": -9.718864440917969, "global_step": 101479, "epoch": 604} {"train_loss": -9.84373664855957, "global_step": 101480, "epoch": 604} {"train_loss": -9.461111068725586, "global_step": 101481, "epoch": 604} {"train_loss": -10.009278297424316, "global_step": 101482, "epoch": 604} {"train_loss": -9.740497589111328, "global_step": 101483, "epoch": 604} {"train_loss": -9.785843849182129, "global_step": 101484, "epoch": 604} {"train_loss": -9.427107810974121, "global_step": 101485, "epoch": 604} {"train_loss": -9.635480880737305, "global_step": 101486, "epoch": 604} {"train_loss": -9.66872787475586, "global_step": 101487, "epoch": 604} {"train_loss": -9.743646621704102, "global_step": 101488, "epoch": 604} {"train_loss": -9.978824615478516, "global_step": 101489, "epoch": 604} {"train_loss": -9.896634101867676, "global_step": 101490, "epoch": 604} {"train_loss": -9.931411743164062, "global_step": 101491, "epoch": 604} {"train_loss": -10.12109661102295, "global_step": 101492, "epoch": 604} {"train_loss": -9.909416198730469, "global_step": 101493, "epoch": 604} {"train_loss": -9.829041481018066, "global_step": 101494, "epoch": 604} {"train_loss": -9.747663497924805, "global_step": 101495, "epoch": 604} {"train_loss": -9.854846954345703, "global_step": 101496, "epoch": 604} {"train_loss": -9.946182250976562, "global_step": 101497, "epoch": 604} {"train_loss": -9.806809425354004, "global_step": 101498, "epoch": 604} {"train_loss": -9.663124084472656, "global_step": 101499, "epoch": 604} {"train_loss": -9.931336402893066, "global_step": 101500, "epoch": 604} {"train_loss": -9.5903959274292, "global_step": 101501, "epoch": 604} {"train_loss": -9.737521171569824, "global_step": 101502, "epoch": 604} {"train_loss": -9.587936401367188, "global_step": 101503, "epoch": 604} {"train_loss": -9.64323616027832, "global_step": 101504, "epoch": 604} {"train_loss": -9.810617446899414, "global_step": 101505, "epoch": 604} {"train_loss": -9.531085968017578, "global_step": 101506, "epoch": 604} {"train_loss": -9.710126876831055, "global_step": 101507, "epoch": 604} {"train_loss": -9.890373229980469, "global_step": 101508, "epoch": 604} {"train_loss": -9.810160636901855, "global_step": 101509, "epoch": 604} {"train_loss": -9.73017692565918, "global_step": 101510, "epoch": 604} {"train_loss": -9.757858276367188, "global_step": 101511, "epoch": 604} {"train_loss": -10.05352783203125, "global_step": 101512, "epoch": 604} {"train_loss": -9.467512130737305, "global_step": 101513, "epoch": 604} {"train_loss": -9.888772010803223, "global_step": 101514, "epoch": 604} {"train_loss": -9.75289249420166, "global_step": 101515, "epoch": 604} {"train_loss": -9.81546688079834, "global_step": 101516, "epoch": 604} {"train_loss": -9.808828353881836, "global_step": 101517, "epoch": 604} {"train_loss": -9.859065055847168, "global_step": 101518, "epoch": 604} {"train_loss": -9.63199234008789, "global_step": 101519, "epoch": 604} {"train_loss": -9.820290565490723, "global_step": 101520, "epoch": 604} {"train_loss": -10.00482177734375, "global_step": 101521, "epoch": 604} {"train_loss": -10.05739974975586, "global_step": 101522, "epoch": 604} {"train_loss": -9.76732063293457, "global_step": 101523, "epoch": 604} {"train_loss": -10.032018661499023, "global_step": 101524, "epoch": 604} {"train_loss": -9.713136672973633, "global_step": 101525, "epoch": 604} {"train_loss": -9.60963249206543, "global_step": 101526, "epoch": 604} {"train_loss": -9.693113327026367, "global_step": 101527, "epoch": 604} {"train_loss": -9.406152725219727, "global_step": 101528, "epoch": 604} {"train_loss": -9.939004898071289, "global_step": 101529, "epoch": 604} {"train_loss": -9.545084953308105, "global_step": 101530, "epoch": 604} {"train_loss": -9.666841506958008, "global_step": 101531, "epoch": 604} {"train_loss": -9.728140830993652, "global_step": 101532, "epoch": 604} {"train_loss": -9.591217994689941, "global_step": 101533, "epoch": 604} {"train_loss": -9.925827026367188, "global_step": 101534, "epoch": 604} {"train_loss": -9.632084846496582, "global_step": 101535, "epoch": 604} {"train_loss": -9.98924446105957, "global_step": 101536, "epoch": 604} {"train_loss": -9.723708152770996, "global_step": 101537, "epoch": 604} {"train_loss": -9.920246124267578, "global_step": 101538, "epoch": 604} {"train_loss": -9.762275695800781, "global_step": 101539, "epoch": 604} {"train_loss": -9.859678268432617, "global_step": 101540, "epoch": 604} {"train_loss": -10.063325881958008, "global_step": 101541, "epoch": 604} {"train_loss": -9.966264724731445, "global_step": 101542, "epoch": 604} {"train_loss": -9.995429039001465, "global_step": 101543, "epoch": 604} {"train_loss": -9.866369247436523, "global_step": 101544, "epoch": 604} {"train_loss": -9.754608154296875, "global_step": 101545, "epoch": 604} {"train_loss": -9.89837646484375, "global_step": 101546, "epoch": 604} {"train_loss": -9.79655647277832, "global_step": 101547, "epoch": 604} {"train_loss": -9.990750312805176, "global_step": 101548, "epoch": 604} {"train_loss": -9.918813705444336, "global_step": 101549, "epoch": 604} {"train_loss": -10.052892684936523, "global_step": 101550, "epoch": 604} {"train_loss": -9.874908447265625, "global_step": 101551, "epoch": 604} {"train_loss": -9.777244567871094, "global_step": 101552, "epoch": 604} {"train_loss": -9.960546493530273, "global_step": 101553, "epoch": 604} {"train_loss": -9.634897232055664, "global_step": 101554, "epoch": 604} {"train_loss": -9.686769485473633, "global_step": 101555, "epoch": 604} {"train_loss": -9.645500183105469, "global_step": 101556, "epoch": 604} {"train_loss": -9.574094772338867, "global_step": 101557, "epoch": 604} {"train_loss": -9.930008888244629, "global_step": 101558, "epoch": 604} {"train_loss": -9.535909652709961, "global_step": 101559, "epoch": 604} {"train_loss": -9.333610534667969, "global_step": 101560, "epoch": 604} {"train_loss": -9.528302192687988, "global_step": 101561, "epoch": 604} {"train_loss": -9.189163208007812, "global_step": 101562, "epoch": 604} {"train_loss": -9.809953689575195, "global_step": 101563, "epoch": 604} {"train_loss": -9.171205520629883, "global_step": 101564, "epoch": 604} {"train_loss": -9.696009635925293, "global_step": 101565, "epoch": 604} {"train_loss": -9.560632705688477, "global_step": 101566, "epoch": 604} {"train_loss": -9.76158332824707, "global_step": 101567, "epoch": 604} {"train_loss": -9.854873657226562, "global_step": 101568, "epoch": 604} {"train_loss": -9.225320816040039, "global_step": 101569, "epoch": 604} {"train_loss": -9.806363105773926, "global_step": 101570, "epoch": 604} {"train_loss": -9.175397872924805, "global_step": 101571, "epoch": 604} {"train_loss": -9.781110763549805, "global_step": 101572, "epoch": 604} {"train_loss": -9.309032440185547, "global_step": 101573, "epoch": 604} {"train_loss": -9.927136421203613, "global_step": 101574, "epoch": 604} {"train_loss": -9.365132331848145, "global_step": 101575, "epoch": 604} {"train_loss": -9.542140007019043, "global_step": 101576, "epoch": 604} {"train_loss": -9.473488807678223, "global_step": 101577, "epoch": 604} {"train_loss": -9.613282203674316, "global_step": 101578, "epoch": 604} {"train_loss": -9.433195114135742, "global_step": 101579, "epoch": 604} {"train_loss": -9.597259521484375, "global_step": 101580, "epoch": 604} {"train_loss": -9.682490348815918, "global_step": 101581, "epoch": 604} {"train_loss": -9.751180648803711, "global_step": 101582, "epoch": 604} {"train_loss": -9.547782897949219, "global_step": 101583, "epoch": 604} {"train_loss": -9.711984634399414, "global_step": 101584, "epoch": 604} {"train_loss": -9.900569915771484, "global_step": 101585, "epoch": 604} {"train_loss": -9.798158645629883, "global_step": 101586, "epoch": 604} {"train_loss": -9.820865631103516, "global_step": 101587, "epoch": 604} {"train_loss": -9.986221313476562, "global_step": 101588, "epoch": 604} {"train_loss": -9.85228157043457, "global_step": 101589, "epoch": 604} {"train_loss": -9.902947425842285, "global_step": 101590, "epoch": 604} {"train_loss": -9.927913665771484, "global_step": 101591, "epoch": 604} {"train_loss": -9.944978713989258, "global_step": 101592, "epoch": 604} {"train_loss": -9.82528305053711, "global_step": 101593, "epoch": 604} {"train_loss": -9.876258850097656, "global_step": 101594, "epoch": 604} {"train_loss": -9.836320877075195, "global_step": 101595, "epoch": 604} {"train_loss": -9.72535514831543, "global_step": 101596, "epoch": 604} {"train_loss": -10.071647644042969, "global_step": 101597, "epoch": 604} {"train_loss": -9.670143127441406, "global_step": 101598, "epoch": 604} {"train_loss": -9.893131256103516, "global_step": 101599, "epoch": 604} {"train_loss": -9.919231414794922, "global_step": 101600, "epoch": 604} {"train_loss": -9.805813789367676, "global_step": 101601, "epoch": 604} {"train_loss": -9.892333984375, "global_step": 101602, "epoch": 604} {"train_loss": -9.850871086120605, "global_step": 101603, "epoch": 604} {"train_loss": -9.694124221801758, "global_step": 101604, "epoch": 604} {"train_loss": -9.718390464782715, "global_step": 101605, "epoch": 604} {"train_loss": -9.653398513793945, "global_step": 101606, "epoch": 604} {"train_loss": -9.522326469421387, "global_step": 101607, "epoch": 604} {"train_loss": -9.90693473815918, "global_step": 101608, "epoch": 604} {"train_loss": -9.73475456237793, "global_step": 101609, "epoch": 604} {"train_loss": -9.823202133178711, "global_step": 101610, "epoch": 604} {"train_loss": -9.772644996643066, "global_step": 101611, "epoch": 604} {"train_loss": -9.762453079223633, "global_step": 101612, "epoch": 604} {"train_loss": -9.880319595336914, "global_step": 101613, "epoch": 604} {"train_loss": -9.875105857849121, "global_step": 101614, "epoch": 604} {"train_loss": -9.690028190612793, "global_step": 101615, "epoch": 604} {"train_loss": -10.028482437133789, "global_step": 101616, "epoch": 604} {"train_loss": -9.350303649902344, "global_step": 101617, "epoch": 604} {"train_loss": -9.644914627075195, "global_step": 101618, "epoch": 604} {"train_loss": -9.586372375488281, "global_step": 101619, "epoch": 604} {"train_loss": -9.458073616027832, "global_step": 101620, "epoch": 604} {"train_loss": -9.482340812683105, "global_step": 101621, "epoch": 604} {"train_loss": -9.745448112487793, "global_step": 101622, "epoch": 604} {"train_loss": -9.258994102478027, "global_step": 101623, "epoch": 604} {"train_loss": -9.291121482849121, "global_step": 101624, "epoch": 604} {"train_loss": -9.459358215332031, "global_step": 101625, "epoch": 604} {"train_loss": -9.224876403808594, "global_step": 101626, "epoch": 604} {"train_loss": -9.75515365600586, "global_step": 101627, "epoch": 604} {"train_loss": -9.326525688171387, "global_step": 101628, "epoch": 604} {"train_loss": -9.806967735290527, "global_step": 101629, "epoch": 604} {"train_loss": -9.50156021118164, "global_step": 101630, "epoch": 604} {"train_loss": -9.693709373474121, "global_step": 101631, "epoch": 604} {"train_loss": -9.63379192352295, "global_step": 101632, "epoch": 604} {"train_loss": -9.781224250793457, "global_step": 101633, "epoch": 604} {"train_loss": -9.626049041748047, "global_step": 101634, "epoch": 604} {"train_loss": -9.65131950378418, "global_step": 101635, "epoch": 604} {"train_loss": -9.161761283874512, "global_step": 101636, "epoch": 604} {"train_loss": -9.755908966064453, "global_step": 101637, "epoch": 604} {"train_loss": -9.417657852172852, "global_step": 101638, "epoch": 604} {"train_loss": -9.721489293234688, "global_step": 101639, "epoch": 604, "val_loss": 206397.703125} {"train_loss": -9.387176513671875, "global_step": 101640, "epoch": 605} {"train_loss": -9.578371047973633, "global_step": 101641, "epoch": 605} {"train_loss": -9.233570098876953, "global_step": 101642, "epoch": 605} {"train_loss": -9.572519302368164, "global_step": 101643, "epoch": 605} {"train_loss": -9.333892822265625, "global_step": 101644, "epoch": 605} {"train_loss": -9.564027786254883, "global_step": 101645, "epoch": 605} {"train_loss": -9.662198066711426, "global_step": 101646, "epoch": 605} {"train_loss": -9.446218490600586, "global_step": 101647, "epoch": 605} {"train_loss": -9.868561744689941, "global_step": 101648, "epoch": 605} {"train_loss": -9.65134048461914, "global_step": 101649, "epoch": 605} {"train_loss": -9.765792846679688, "global_step": 101650, "epoch": 605} {"train_loss": -9.626408576965332, "global_step": 101651, "epoch": 605} {"train_loss": -9.697954177856445, "global_step": 101652, "epoch": 605} {"train_loss": -9.67592716217041, "global_step": 101653, "epoch": 605} {"train_loss": -9.634953498840332, "global_step": 101654, "epoch": 605} {"train_loss": -9.819620132446289, "global_step": 101655, "epoch": 605} {"train_loss": -9.596672058105469, "global_step": 101656, "epoch": 605} {"train_loss": -9.906686782836914, "global_step": 101657, "epoch": 605} {"train_loss": -9.684610366821289, "global_step": 101658, "epoch": 605} {"train_loss": -9.871349334716797, "global_step": 101659, "epoch": 605} {"train_loss": -9.834776878356934, "global_step": 101660, "epoch": 605} {"train_loss": -9.863340377807617, "global_step": 101661, "epoch": 605} {"train_loss": -9.97938346862793, "global_step": 101662, "epoch": 605} {"train_loss": -9.948724746704102, "global_step": 101663, "epoch": 605} {"train_loss": -10.023250579833984, "global_step": 101664, "epoch": 605} {"train_loss": -9.815452575683594, "global_step": 101665, "epoch": 605} {"train_loss": -9.932045936584473, "global_step": 101666, "epoch": 605} {"train_loss": -10.054040908813477, "global_step": 101667, "epoch": 605} {"train_loss": -9.867437362670898, "global_step": 101668, "epoch": 605} {"train_loss": -9.757425308227539, "global_step": 101669, "epoch": 605} {"train_loss": -9.995222091674805, "global_step": 101670, "epoch": 605} {"train_loss": -10.095354080200195, "global_step": 101671, "epoch": 605} {"train_loss": -9.718433380126953, "global_step": 101672, "epoch": 605} {"train_loss": -10.049701690673828, "global_step": 101673, "epoch": 605} {"train_loss": -9.80843734741211, "global_step": 101674, "epoch": 605} {"train_loss": -9.793584823608398, "global_step": 101675, "epoch": 605} {"train_loss": -9.69017219543457, "global_step": 101676, "epoch": 605} {"train_loss": -9.562519073486328, "global_step": 101677, "epoch": 605} {"train_loss": -9.947637557983398, "global_step": 101678, "epoch": 605} {"train_loss": -9.870186805725098, "global_step": 101679, "epoch": 605} {"train_loss": -9.751806259155273, "global_step": 101680, "epoch": 605} {"train_loss": -9.849235534667969, "global_step": 101681, "epoch": 605} {"train_loss": -9.974238395690918, "global_step": 101682, "epoch": 605} {"train_loss": -9.621208190917969, "global_step": 101683, "epoch": 605} {"train_loss": -9.793464660644531, "global_step": 101684, "epoch": 605} {"train_loss": -9.810237884521484, "global_step": 101685, "epoch": 605} {"train_loss": -9.812104225158691, "global_step": 101686, "epoch": 605} {"train_loss": -9.629064559936523, "global_step": 101687, "epoch": 605} {"train_loss": -9.678897857666016, "global_step": 101688, "epoch": 605} {"train_loss": -9.859567642211914, "global_step": 101689, "epoch": 605} {"train_loss": -9.506674766540527, "global_step": 101690, "epoch": 605} {"train_loss": -9.53386402130127, "global_step": 101691, "epoch": 605} {"train_loss": -9.686667442321777, "global_step": 101692, "epoch": 605} {"train_loss": -9.612317085266113, "global_step": 101693, "epoch": 605} {"train_loss": -9.892157554626465, "global_step": 101694, "epoch": 605} {"train_loss": -9.616460800170898, "global_step": 101695, "epoch": 605} {"train_loss": -9.643224716186523, "global_step": 101696, "epoch": 605} {"train_loss": -9.489221572875977, "global_step": 101697, "epoch": 605} {"train_loss": -9.55544662475586, "global_step": 101698, "epoch": 605} {"train_loss": -9.550552368164062, "global_step": 101699, "epoch": 605} {"train_loss": -9.884650230407715, "global_step": 101700, "epoch": 605} {"train_loss": -9.349945068359375, "global_step": 101701, "epoch": 605} {"train_loss": -9.28229808807373, "global_step": 101702, "epoch": 605} {"train_loss": -9.342227935791016, "global_step": 101703, "epoch": 605} {"train_loss": -9.642053604125977, "global_step": 101704, "epoch": 605} {"train_loss": -9.235624313354492, "global_step": 101705, "epoch": 605} {"train_loss": -9.586820602416992, "global_step": 101706, "epoch": 605} {"train_loss": -9.564547538757324, "global_step": 101707, "epoch": 605} {"train_loss": -9.696809768676758, "global_step": 101708, "epoch": 605} {"train_loss": -9.99229621887207, "global_step": 101709, "epoch": 605} {"train_loss": -9.658021926879883, "global_step": 101710, "epoch": 605} {"train_loss": -9.548783302307129, "global_step": 101711, "epoch": 605} {"train_loss": -9.747570037841797, "global_step": 101712, "epoch": 605} {"train_loss": -9.77706527709961, "global_step": 101713, "epoch": 605} {"train_loss": -9.48344612121582, "global_step": 101714, "epoch": 605} {"train_loss": -9.667230606079102, "global_step": 101715, "epoch": 605} {"train_loss": -9.867870330810547, "global_step": 101716, "epoch": 605} {"train_loss": -9.611067771911621, "global_step": 101717, "epoch": 605} {"train_loss": -9.782588005065918, "global_step": 101718, "epoch": 605} {"train_loss": -9.968165397644043, "global_step": 101719, "epoch": 605} {"train_loss": -9.649507522583008, "global_step": 101720, "epoch": 605} {"train_loss": -9.706926345825195, "global_step": 101721, "epoch": 605} {"train_loss": -9.848556518554688, "global_step": 101722, "epoch": 605} {"train_loss": -9.539477348327637, "global_step": 101723, "epoch": 605} {"train_loss": -9.696414947509766, "global_step": 101724, "epoch": 605} {"train_loss": -9.770652770996094, "global_step": 101725, "epoch": 605} {"train_loss": -9.943403244018555, "global_step": 101726, "epoch": 605} {"train_loss": -9.842463493347168, "global_step": 101727, "epoch": 605} {"train_loss": -9.472305297851562, "global_step": 101728, "epoch": 605} {"train_loss": -9.787287712097168, "global_step": 101729, "epoch": 605} {"train_loss": -9.743770599365234, "global_step": 101730, "epoch": 605} {"train_loss": -9.850625038146973, "global_step": 101731, "epoch": 605} {"train_loss": -9.766081809997559, "global_step": 101732, "epoch": 605} {"train_loss": -9.502431869506836, "global_step": 101733, "epoch": 605} {"train_loss": -9.816658020019531, "global_step": 101734, "epoch": 605} {"train_loss": -9.832572937011719, "global_step": 101735, "epoch": 605} {"train_loss": -9.805259704589844, "global_step": 101736, "epoch": 605} {"train_loss": -9.847400665283203, "global_step": 101737, "epoch": 605} {"train_loss": -9.575738906860352, "global_step": 101738, "epoch": 605} {"train_loss": -9.854259490966797, "global_step": 101739, "epoch": 605} {"train_loss": -9.629406929016113, "global_step": 101740, "epoch": 605} {"train_loss": -9.188520431518555, "global_step": 101741, "epoch": 605} {"train_loss": -9.82978630065918, "global_step": 101742, "epoch": 605} {"train_loss": -9.631414413452148, "global_step": 101743, "epoch": 605} {"train_loss": -9.761201858520508, "global_step": 101744, "epoch": 605} {"train_loss": -9.650396347045898, "global_step": 101745, "epoch": 605} {"train_loss": -9.320167541503906, "global_step": 101746, "epoch": 605} {"train_loss": -9.749664306640625, "global_step": 101747, "epoch": 605} {"train_loss": -9.788039207458496, "global_step": 101748, "epoch": 605} {"train_loss": -9.825586318969727, "global_step": 101749, "epoch": 605} {"train_loss": -9.787004470825195, "global_step": 101750, "epoch": 605} {"train_loss": -9.709968566894531, "global_step": 101751, "epoch": 605} {"train_loss": -9.697901725769043, "global_step": 101752, "epoch": 605} {"train_loss": -10.030435562133789, "global_step": 101753, "epoch": 605} {"train_loss": -9.62827205657959, "global_step": 101754, "epoch": 605} {"train_loss": -9.69825553894043, "global_step": 101755, "epoch": 605} {"train_loss": -9.783763885498047, "global_step": 101756, "epoch": 605} {"train_loss": -9.678464889526367, "global_step": 101757, "epoch": 605} {"train_loss": -9.931026458740234, "global_step": 101758, "epoch": 605} {"train_loss": -9.840646743774414, "global_step": 101759, "epoch": 605} {"train_loss": -9.619125366210938, "global_step": 101760, "epoch": 605} {"train_loss": -9.940180778503418, "global_step": 101761, "epoch": 605} {"train_loss": -9.529796600341797, "global_step": 101762, "epoch": 605} {"train_loss": -10.03118896484375, "global_step": 101763, "epoch": 605} {"train_loss": -9.937782287597656, "global_step": 101764, "epoch": 605} {"train_loss": -9.896551132202148, "global_step": 101765, "epoch": 605} {"train_loss": -9.777946472167969, "global_step": 101766, "epoch": 605} {"train_loss": -9.413131713867188, "global_step": 101767, "epoch": 605} {"train_loss": -9.544891357421875, "global_step": 101768, "epoch": 605} {"train_loss": -9.910048484802246, "global_step": 101769, "epoch": 605} {"train_loss": -9.819502830505371, "global_step": 101770, "epoch": 605} {"train_loss": -9.72182846069336, "global_step": 101771, "epoch": 605} {"train_loss": -9.836082458496094, "global_step": 101772, "epoch": 605} {"train_loss": -9.582928657531738, "global_step": 101773, "epoch": 605} {"train_loss": -9.986215591430664, "global_step": 101774, "epoch": 605} {"train_loss": -9.51568603515625, "global_step": 101775, "epoch": 605} {"train_loss": -9.701005935668945, "global_step": 101776, "epoch": 605} {"train_loss": -9.955562591552734, "global_step": 101777, "epoch": 605} {"train_loss": -9.383785247802734, "global_step": 101778, "epoch": 605} {"train_loss": -10.070058822631836, "global_step": 101779, "epoch": 605} {"train_loss": -8.938932418823242, "global_step": 101780, "epoch": 605} {"train_loss": -9.4737548828125, "global_step": 101781, "epoch": 605} {"train_loss": -9.419214248657227, "global_step": 101782, "epoch": 605} {"train_loss": -9.564065933227539, "global_step": 101783, "epoch": 605} {"train_loss": -9.400995254516602, "global_step": 101784, "epoch": 605} {"train_loss": -9.557966232299805, "global_step": 101785, "epoch": 605} {"train_loss": -9.66364860534668, "global_step": 101786, "epoch": 605} {"train_loss": -9.637075424194336, "global_step": 101787, "epoch": 605} {"train_loss": -9.482803344726562, "global_step": 101788, "epoch": 605} {"train_loss": -9.727025985717773, "global_step": 101789, "epoch": 605} {"train_loss": -9.40959358215332, "global_step": 101790, "epoch": 605} {"train_loss": -9.679343223571777, "global_step": 101791, "epoch": 605} {"train_loss": -9.607643127441406, "global_step": 101792, "epoch": 605} {"train_loss": -9.775529861450195, "global_step": 101793, "epoch": 605} {"train_loss": -9.704319953918457, "global_step": 101794, "epoch": 605} {"train_loss": -9.732747077941895, "global_step": 101795, "epoch": 605} {"train_loss": -9.656055450439453, "global_step": 101796, "epoch": 605} {"train_loss": -9.580429077148438, "global_step": 101797, "epoch": 605} {"train_loss": -9.618326187133789, "global_step": 101798, "epoch": 605} {"train_loss": -9.72658634185791, "global_step": 101799, "epoch": 605} {"train_loss": -9.56809139251709, "global_step": 101800, "epoch": 605} {"train_loss": -9.463510513305664, "global_step": 101801, "epoch": 605} {"train_loss": -9.835500717163086, "global_step": 101802, "epoch": 605} {"train_loss": -9.597776412963867, "global_step": 101803, "epoch": 605} {"train_loss": -9.606470108032227, "global_step": 101804, "epoch": 605} {"train_loss": -9.84217357635498, "global_step": 101805, "epoch": 605} {"train_loss": -9.721550941467285, "global_step": 101806, "epoch": 605} {"train_loss": -9.700567500931877, "global_step": 101807, "epoch": 605, "val_loss": 206986.140625, "train_action_mse_error": 3.5371007919311523} {"train_loss": -9.758638381958008, "global_step": 101808, "epoch": 606} {"train_loss": -9.82031536102295, "global_step": 101809, "epoch": 606} {"train_loss": -9.369112014770508, "global_step": 101810, "epoch": 606} {"train_loss": -9.940231323242188, "global_step": 101811, "epoch": 606} {"train_loss": -9.23513412475586, "global_step": 101812, "epoch": 606} {"train_loss": -9.233659744262695, "global_step": 101813, "epoch": 606} {"train_loss": -9.341019630432129, "global_step": 101814, "epoch": 606} {"train_loss": -9.516434669494629, "global_step": 101815, "epoch": 606} {"train_loss": -9.811782836914062, "global_step": 101816, "epoch": 606} {"train_loss": -9.41051959991455, "global_step": 101817, "epoch": 606} {"train_loss": -9.575773239135742, "global_step": 101818, "epoch": 606} {"train_loss": -9.404844284057617, "global_step": 101819, "epoch": 606} {"train_loss": -9.556394577026367, "global_step": 101820, "epoch": 606} {"train_loss": -9.454994201660156, "global_step": 101821, "epoch": 606} {"train_loss": -9.398161888122559, "global_step": 101822, "epoch": 606} {"train_loss": -9.459092140197754, "global_step": 101823, "epoch": 606} {"train_loss": -9.632652282714844, "global_step": 101824, "epoch": 606} {"train_loss": -9.749370574951172, "global_step": 101825, "epoch": 606} {"train_loss": -9.685404777526855, "global_step": 101826, "epoch": 606} {"train_loss": -9.588369369506836, "global_step": 101827, "epoch": 606} {"train_loss": -9.763381958007812, "global_step": 101828, "epoch": 606} {"train_loss": -9.371830940246582, "global_step": 101829, "epoch": 606} {"train_loss": -9.547825813293457, "global_step": 101830, "epoch": 606} {"train_loss": -9.326869010925293, "global_step": 101831, "epoch": 606} {"train_loss": -9.799633026123047, "global_step": 101832, "epoch": 606} {"train_loss": -9.644086837768555, "global_step": 101833, "epoch": 606} {"train_loss": -9.699935913085938, "global_step": 101834, "epoch": 606} {"train_loss": -9.724737167358398, "global_step": 101835, "epoch": 606} {"train_loss": -9.629108428955078, "global_step": 101836, "epoch": 606} {"train_loss": -9.648930549621582, "global_step": 101837, "epoch": 606} {"train_loss": -9.685851097106934, "global_step": 101838, "epoch": 606} {"train_loss": -9.678699493408203, "global_step": 101839, "epoch": 606} {"train_loss": -9.788832664489746, "global_step": 101840, "epoch": 606} {"train_loss": -9.766668319702148, "global_step": 101841, "epoch": 606} {"train_loss": -9.690328598022461, "global_step": 101842, "epoch": 606} {"train_loss": -9.727079391479492, "global_step": 101843, "epoch": 606} {"train_loss": -9.832488059997559, "global_step": 101844, "epoch": 606} {"train_loss": -9.766214370727539, "global_step": 101845, "epoch": 606} {"train_loss": -9.810966491699219, "global_step": 101846, "epoch": 606} {"train_loss": -9.766558647155762, "global_step": 101847, "epoch": 606} {"train_loss": -9.717265129089355, "global_step": 101848, "epoch": 606} {"train_loss": -9.921454429626465, "global_step": 101849, "epoch": 606} {"train_loss": -9.947546005249023, "global_step": 101850, "epoch": 606} {"train_loss": -9.826805114746094, "global_step": 101851, "epoch": 606} {"train_loss": -9.784626960754395, "global_step": 101852, "epoch": 606} {"train_loss": -9.731889724731445, "global_step": 101853, "epoch": 606} {"train_loss": -9.743986129760742, "global_step": 101854, "epoch": 606} {"train_loss": -9.787077903747559, "global_step": 101855, "epoch": 606} {"train_loss": -9.637596130371094, "global_step": 101856, "epoch": 606} {"train_loss": -9.942069053649902, "global_step": 101857, "epoch": 606} {"train_loss": -9.870051383972168, "global_step": 101858, "epoch": 606} {"train_loss": -9.755338668823242, "global_step": 101859, "epoch": 606} {"train_loss": -9.930980682373047, "global_step": 101860, "epoch": 606} {"train_loss": -9.710707664489746, "global_step": 101861, "epoch": 606} {"train_loss": -9.548727035522461, "global_step": 101862, "epoch": 606} {"train_loss": -9.713451385498047, "global_step": 101863, "epoch": 606} {"train_loss": -10.249515533447266, "global_step": 101864, "epoch": 606} {"train_loss": -9.609655380249023, "global_step": 101865, "epoch": 606} {"train_loss": -9.871095657348633, "global_step": 101866, "epoch": 606} {"train_loss": -9.905319213867188, "global_step": 101867, "epoch": 606} {"train_loss": -9.750433921813965, "global_step": 101868, "epoch": 606} {"train_loss": -9.755714416503906, "global_step": 101869, "epoch": 606} {"train_loss": -10.014030456542969, "global_step": 101870, "epoch": 606} {"train_loss": -9.690869331359863, "global_step": 101871, "epoch": 606} {"train_loss": -10.06271743774414, "global_step": 101872, "epoch": 606} {"train_loss": -9.841483116149902, "global_step": 101873, "epoch": 606} {"train_loss": -9.896154403686523, "global_step": 101874, "epoch": 606} {"train_loss": -9.774618148803711, "global_step": 101875, "epoch": 606} {"train_loss": -9.686662673950195, "global_step": 101876, "epoch": 606} {"train_loss": -10.107244491577148, "global_step": 101877, "epoch": 606} {"train_loss": -9.809974670410156, "global_step": 101878, "epoch": 606} {"train_loss": -9.859796524047852, "global_step": 101879, "epoch": 606} {"train_loss": -9.706541061401367, "global_step": 101880, "epoch": 606} {"train_loss": -9.659936904907227, "global_step": 101881, "epoch": 606} {"train_loss": -9.56568431854248, "global_step": 101882, "epoch": 606} {"train_loss": -9.470396041870117, "global_step": 101883, "epoch": 606} {"train_loss": -9.596696853637695, "global_step": 101884, "epoch": 606} {"train_loss": -9.738110542297363, "global_step": 101885, "epoch": 606} {"train_loss": -8.864446640014648, "global_step": 101886, "epoch": 606} {"train_loss": -9.927095413208008, "global_step": 101887, "epoch": 606} {"train_loss": -9.018505096435547, "global_step": 101888, "epoch": 606} {"train_loss": -9.32109260559082, "global_step": 101889, "epoch": 606} {"train_loss": -9.544665336608887, "global_step": 101890, "epoch": 606} {"train_loss": -9.530824661254883, "global_step": 101891, "epoch": 606} {"train_loss": -9.444918632507324, "global_step": 101892, "epoch": 606} {"train_loss": -9.23797607421875, "global_step": 101893, "epoch": 606} {"train_loss": -9.455472946166992, "global_step": 101894, "epoch": 606} {"train_loss": -9.213329315185547, "global_step": 101895, "epoch": 606} {"train_loss": -9.598395347595215, "global_step": 101896, "epoch": 606} {"train_loss": -9.181957244873047, "global_step": 101897, "epoch": 606} {"train_loss": -9.374112129211426, "global_step": 101898, "epoch": 606} {"train_loss": -9.47850227355957, "global_step": 101899, "epoch": 606} {"train_loss": -9.27244758605957, "global_step": 101900, "epoch": 606} {"train_loss": -9.379098892211914, "global_step": 101901, "epoch": 606} {"train_loss": -9.29381275177002, "global_step": 101902, "epoch": 606} {"train_loss": -9.360910415649414, "global_step": 101903, "epoch": 606} {"train_loss": -9.14313793182373, "global_step": 101904, "epoch": 606} {"train_loss": -9.737070083618164, "global_step": 101905, "epoch": 606} {"train_loss": -9.741351127624512, "global_step": 101906, "epoch": 606} {"train_loss": -9.401416778564453, "global_step": 101907, "epoch": 606} {"train_loss": -9.733011245727539, "global_step": 101908, "epoch": 606} {"train_loss": -9.693001747131348, "global_step": 101909, "epoch": 606} {"train_loss": -9.480636596679688, "global_step": 101910, "epoch": 606} {"train_loss": -9.523054122924805, "global_step": 101911, "epoch": 606} {"train_loss": -9.575837135314941, "global_step": 101912, "epoch": 606} {"train_loss": -9.722677230834961, "global_step": 101913, "epoch": 606} {"train_loss": -9.677350997924805, "global_step": 101914, "epoch": 606} {"train_loss": -9.77347183227539, "global_step": 101915, "epoch": 606} {"train_loss": -9.721487045288086, "global_step": 101916, "epoch": 606} {"train_loss": -9.573291778564453, "global_step": 101917, "epoch": 606} {"train_loss": -9.591836929321289, "global_step": 101918, "epoch": 606} {"train_loss": -9.768152236938477, "global_step": 101919, "epoch": 606} {"train_loss": -9.838628768920898, "global_step": 101920, "epoch": 606} {"train_loss": -9.754011154174805, "global_step": 101921, "epoch": 606} {"train_loss": -9.697608947753906, "global_step": 101922, "epoch": 606} {"train_loss": -9.78553295135498, "global_step": 101923, "epoch": 606} {"train_loss": -9.613116264343262, "global_step": 101924, "epoch": 606} {"train_loss": -9.927387237548828, "global_step": 101925, "epoch": 606} {"train_loss": -9.728784561157227, "global_step": 101926, "epoch": 606} {"train_loss": -9.819084167480469, "global_step": 101927, "epoch": 606} {"train_loss": -9.920254707336426, "global_step": 101928, "epoch": 606} {"train_loss": -9.861613273620605, "global_step": 101929, "epoch": 606} {"train_loss": -9.824056625366211, "global_step": 101930, "epoch": 606} {"train_loss": -9.756330490112305, "global_step": 101931, "epoch": 606} {"train_loss": -9.640226364135742, "global_step": 101932, "epoch": 606} {"train_loss": -9.828584671020508, "global_step": 101933, "epoch": 606} {"train_loss": -9.856245040893555, "global_step": 101934, "epoch": 606} {"train_loss": -9.85080623626709, "global_step": 101935, "epoch": 606} {"train_loss": -9.858619689941406, "global_step": 101936, "epoch": 606} {"train_loss": -9.861638069152832, "global_step": 101937, "epoch": 606} {"train_loss": -9.938100814819336, "global_step": 101938, "epoch": 606} {"train_loss": -9.92319393157959, "global_step": 101939, "epoch": 606} {"train_loss": -9.54050064086914, "global_step": 101940, "epoch": 606} {"train_loss": -10.123037338256836, "global_step": 101941, "epoch": 606} {"train_loss": -9.69327163696289, "global_step": 101942, "epoch": 606} {"train_loss": -9.802290916442871, "global_step": 101943, "epoch": 606} {"train_loss": -9.888964653015137, "global_step": 101944, "epoch": 606} {"train_loss": -9.928691864013672, "global_step": 101945, "epoch": 606} {"train_loss": -9.942865371704102, "global_step": 101946, "epoch": 606} {"train_loss": -9.952688217163086, "global_step": 101947, "epoch": 606} {"train_loss": -9.779794692993164, "global_step": 101948, "epoch": 606} {"train_loss": -9.820297241210938, "global_step": 101949, "epoch": 606} {"train_loss": -9.581779479980469, "global_step": 101950, "epoch": 606} {"train_loss": -9.556109428405762, "global_step": 101951, "epoch": 606} {"train_loss": -9.689286231994629, "global_step": 101952, "epoch": 606} {"train_loss": -9.567961692810059, "global_step": 101953, "epoch": 606} {"train_loss": -9.803874969482422, "global_step": 101954, "epoch": 606} {"train_loss": -9.605080604553223, "global_step": 101955, "epoch": 606} {"train_loss": -9.82528305053711, "global_step": 101956, "epoch": 606} {"train_loss": -9.448532104492188, "global_step": 101957, "epoch": 606} {"train_loss": -9.680562973022461, "global_step": 101958, "epoch": 606} {"train_loss": -9.558483123779297, "global_step": 101959, "epoch": 606} {"train_loss": -9.87885856628418, "global_step": 101960, "epoch": 606} {"train_loss": -9.771951675415039, "global_step": 101961, "epoch": 606} {"train_loss": -9.651567459106445, "global_step": 101962, "epoch": 606} {"train_loss": -9.752212524414062, "global_step": 101963, "epoch": 606} {"train_loss": -9.643050193786621, "global_step": 101964, "epoch": 606} {"train_loss": -9.90585994720459, "global_step": 101965, "epoch": 606} {"train_loss": -9.8125, "global_step": 101966, "epoch": 606} {"train_loss": -9.69662857055664, "global_step": 101967, "epoch": 606} {"train_loss": -9.794458389282227, "global_step": 101968, "epoch": 606} {"train_loss": -9.794841766357422, "global_step": 101969, "epoch": 606} {"train_loss": -9.842414855957031, "global_step": 101970, "epoch": 606} {"train_loss": -9.94662094116211, "global_step": 101971, "epoch": 606} {"train_loss": -9.831958770751953, "global_step": 101972, "epoch": 606} {"train_loss": -9.8058443069458, "global_step": 101973, "epoch": 606} {"train_loss": -9.887170791625977, "global_step": 101974, "epoch": 606} {"train_loss": -9.685841605776833, "global_step": 101975, "epoch": 606, "val_loss": 206329.9375} {"train_loss": -9.931448936462402, "global_step": 101976, "epoch": 607} {"train_loss": -9.856992721557617, "global_step": 101977, "epoch": 607} {"train_loss": -9.876609802246094, "global_step": 101978, "epoch": 607} {"train_loss": -9.648239135742188, "global_step": 101979, "epoch": 607} {"train_loss": -9.780595779418945, "global_step": 101980, "epoch": 607} {"train_loss": -9.921929359436035, "global_step": 101981, "epoch": 607} {"train_loss": -9.67901611328125, "global_step": 101982, "epoch": 607} {"train_loss": -9.648855209350586, "global_step": 101983, "epoch": 607} {"train_loss": -9.561073303222656, "global_step": 101984, "epoch": 607} {"train_loss": -9.803715705871582, "global_step": 101985, "epoch": 607} {"train_loss": -9.387155532836914, "global_step": 101986, "epoch": 607} {"train_loss": -10.032690048217773, "global_step": 101987, "epoch": 607} {"train_loss": -9.612164497375488, "global_step": 101988, "epoch": 607} {"train_loss": -9.640380859375, "global_step": 101989, "epoch": 607} {"train_loss": -9.720836639404297, "global_step": 101990, "epoch": 607} {"train_loss": -9.55026626586914, "global_step": 101991, "epoch": 607} {"train_loss": -9.608627319335938, "global_step": 101992, "epoch": 607} {"train_loss": -9.68402099609375, "global_step": 101993, "epoch": 607} {"train_loss": -9.737417221069336, "global_step": 101994, "epoch": 607} {"train_loss": -9.894967079162598, "global_step": 101995, "epoch": 607} {"train_loss": -9.730597496032715, "global_step": 101996, "epoch": 607} {"train_loss": -9.773794174194336, "global_step": 101997, "epoch": 607} {"train_loss": -9.910120010375977, "global_step": 101998, "epoch": 607} {"train_loss": -9.791160583496094, "global_step": 101999, "epoch": 607} {"train_loss": -9.757586479187012, "global_step": 102000, "epoch": 607} {"train_loss": -9.966102600097656, "global_step": 102001, "epoch": 607} {"train_loss": -9.918159484863281, "global_step": 102002, "epoch": 607} {"train_loss": -9.461832046508789, "global_step": 102003, "epoch": 607} {"train_loss": -9.921128273010254, "global_step": 102004, "epoch": 607} {"train_loss": -9.825553894042969, "global_step": 102005, "epoch": 607} {"train_loss": -9.961810111999512, "global_step": 102006, "epoch": 607} {"train_loss": -9.69133186340332, "global_step": 102007, "epoch": 607} {"train_loss": -9.910041809082031, "global_step": 102008, "epoch": 607} {"train_loss": -9.753055572509766, "global_step": 102009, "epoch": 607} {"train_loss": -9.741510391235352, "global_step": 102010, "epoch": 607} {"train_loss": -9.871339797973633, "global_step": 102011, "epoch": 607} {"train_loss": -10.043695449829102, "global_step": 102012, "epoch": 607} {"train_loss": -9.723451614379883, "global_step": 102013, "epoch": 607} {"train_loss": -10.165349006652832, "global_step": 102014, "epoch": 607} {"train_loss": -9.70517349243164, "global_step": 102015, "epoch": 607} {"train_loss": -10.008406639099121, "global_step": 102016, "epoch": 607} {"train_loss": -9.871683120727539, "global_step": 102017, "epoch": 607} {"train_loss": -10.10966968536377, "global_step": 102018, "epoch": 607} {"train_loss": -10.025169372558594, "global_step": 102019, "epoch": 607} {"train_loss": -9.834121704101562, "global_step": 102020, "epoch": 607} {"train_loss": -9.978107452392578, "global_step": 102021, "epoch": 607} {"train_loss": -9.995891571044922, "global_step": 102022, "epoch": 607} {"train_loss": -9.767326354980469, "global_step": 102023, "epoch": 607} {"train_loss": -9.962114334106445, "global_step": 102024, "epoch": 607} {"train_loss": -9.84274673461914, "global_step": 102025, "epoch": 607} {"train_loss": -9.82138442993164, "global_step": 102026, "epoch": 607} {"train_loss": -9.906002044677734, "global_step": 102027, "epoch": 607} {"train_loss": -10.023334503173828, "global_step": 102028, "epoch": 607} {"train_loss": -9.948383331298828, "global_step": 102029, "epoch": 607} {"train_loss": -10.09385871887207, "global_step": 102030, "epoch": 607} {"train_loss": -9.97602653503418, "global_step": 102031, "epoch": 607} {"train_loss": -9.787169456481934, "global_step": 102032, "epoch": 607} {"train_loss": -10.04863452911377, "global_step": 102033, "epoch": 607} {"train_loss": -10.020634651184082, "global_step": 102034, "epoch": 607} {"train_loss": -10.009950637817383, "global_step": 102035, "epoch": 607} {"train_loss": -9.733335494995117, "global_step": 102036, "epoch": 607} {"train_loss": -10.056476593017578, "global_step": 102037, "epoch": 607} {"train_loss": -9.862276077270508, "global_step": 102038, "epoch": 607} {"train_loss": -10.054264068603516, "global_step": 102039, "epoch": 607} {"train_loss": -9.932683944702148, "global_step": 102040, "epoch": 607} {"train_loss": -9.640459060668945, "global_step": 102041, "epoch": 607} {"train_loss": -10.114011764526367, "global_step": 102042, "epoch": 607} {"train_loss": -9.850566864013672, "global_step": 102043, "epoch": 607} {"train_loss": -9.778799057006836, "global_step": 102044, "epoch": 607} {"train_loss": -9.84365177154541, "global_step": 102045, "epoch": 607} {"train_loss": -9.640304565429688, "global_step": 102046, "epoch": 607} {"train_loss": -9.713226318359375, "global_step": 102047, "epoch": 607} {"train_loss": -9.555154800415039, "global_step": 102048, "epoch": 607} {"train_loss": -9.872304916381836, "global_step": 102049, "epoch": 607} {"train_loss": -9.687727928161621, "global_step": 102050, "epoch": 607} {"train_loss": -9.699810981750488, "global_step": 102051, "epoch": 607} {"train_loss": -10.053205490112305, "global_step": 102052, "epoch": 607} {"train_loss": -10.012069702148438, "global_step": 102053, "epoch": 607} {"train_loss": -9.953056335449219, "global_step": 102054, "epoch": 607} {"train_loss": -9.998574256896973, "global_step": 102055, "epoch": 607} {"train_loss": -9.408090591430664, "global_step": 102056, "epoch": 607} {"train_loss": -9.511947631835938, "global_step": 102057, "epoch": 607} {"train_loss": -9.82767105102539, "global_step": 102058, "epoch": 607} {"train_loss": -9.320159912109375, "global_step": 102059, "epoch": 607} {"train_loss": -9.836837768554688, "global_step": 102060, "epoch": 607} {"train_loss": -9.678861618041992, "global_step": 102061, "epoch": 607} {"train_loss": -9.41314697265625, "global_step": 102062, "epoch": 607} {"train_loss": -9.959331512451172, "global_step": 102063, "epoch": 607} {"train_loss": -9.511336326599121, "global_step": 102064, "epoch": 607} {"train_loss": -9.692983627319336, "global_step": 102065, "epoch": 607} {"train_loss": -9.603050231933594, "global_step": 102066, "epoch": 607} {"train_loss": -9.445402145385742, "global_step": 102067, "epoch": 607} {"train_loss": -9.449764251708984, "global_step": 102068, "epoch": 607} {"train_loss": -9.529960632324219, "global_step": 102069, "epoch": 607} {"train_loss": -9.359683990478516, "global_step": 102070, "epoch": 607} {"train_loss": -9.602592468261719, "global_step": 102071, "epoch": 607} {"train_loss": -9.474855422973633, "global_step": 102072, "epoch": 607} {"train_loss": -9.571329116821289, "global_step": 102073, "epoch": 607} {"train_loss": -9.383074760437012, "global_step": 102074, "epoch": 607} {"train_loss": -9.314763069152832, "global_step": 102075, "epoch": 607} {"train_loss": -9.473774909973145, "global_step": 102076, "epoch": 607} {"train_loss": -9.782794952392578, "global_step": 102077, "epoch": 607} {"train_loss": -9.469529151916504, "global_step": 102078, "epoch": 607} {"train_loss": -9.880796432495117, "global_step": 102079, "epoch": 607} {"train_loss": -9.89956283569336, "global_step": 102080, "epoch": 607} {"train_loss": -9.912744522094727, "global_step": 102081, "epoch": 607} {"train_loss": -9.646129608154297, "global_step": 102082, "epoch": 607} {"train_loss": -9.904987335205078, "global_step": 102083, "epoch": 607} {"train_loss": -9.816444396972656, "global_step": 102084, "epoch": 607} {"train_loss": -9.769978523254395, "global_step": 102085, "epoch": 607} {"train_loss": -9.617032051086426, "global_step": 102086, "epoch": 607} {"train_loss": -10.012737274169922, "global_step": 102087, "epoch": 607} {"train_loss": -9.869393348693848, "global_step": 102088, "epoch": 607} {"train_loss": -9.990655899047852, "global_step": 102089, "epoch": 607} {"train_loss": -9.834259033203125, "global_step": 102090, "epoch": 607} {"train_loss": -10.02536392211914, "global_step": 102091, "epoch": 607} {"train_loss": -9.9818115234375, "global_step": 102092, "epoch": 607} {"train_loss": -9.941877365112305, "global_step": 102093, "epoch": 607} {"train_loss": -9.588166236877441, "global_step": 102094, "epoch": 607} {"train_loss": -9.64567756652832, "global_step": 102095, "epoch": 607} {"train_loss": -9.823243141174316, "global_step": 102096, "epoch": 607} {"train_loss": -9.843238830566406, "global_step": 102097, "epoch": 607} {"train_loss": -9.632120132446289, "global_step": 102098, "epoch": 607} {"train_loss": -9.822879791259766, "global_step": 102099, "epoch": 607} {"train_loss": -9.74298095703125, "global_step": 102100, "epoch": 607} {"train_loss": -9.707073211669922, "global_step": 102101, "epoch": 607} {"train_loss": -9.789299964904785, "global_step": 102102, "epoch": 607} {"train_loss": -9.824506759643555, "global_step": 102103, "epoch": 607} {"train_loss": -9.734962463378906, "global_step": 102104, "epoch": 607} {"train_loss": -9.646520614624023, "global_step": 102105, "epoch": 607} {"train_loss": -9.77035903930664, "global_step": 102106, "epoch": 607} {"train_loss": -9.281715393066406, "global_step": 102107, "epoch": 607} {"train_loss": -9.482912063598633, "global_step": 102108, "epoch": 607} {"train_loss": -9.75481128692627, "global_step": 102109, "epoch": 607} {"train_loss": -9.434832572937012, "global_step": 102110, "epoch": 607} {"train_loss": -9.590373039245605, "global_step": 102111, "epoch": 607} {"train_loss": -9.417106628417969, "global_step": 102112, "epoch": 607} {"train_loss": -9.822649002075195, "global_step": 102113, "epoch": 607} {"train_loss": -9.558137893676758, "global_step": 102114, "epoch": 607} {"train_loss": -9.66566276550293, "global_step": 102115, "epoch": 607} {"train_loss": -9.769243240356445, "global_step": 102116, "epoch": 607} {"train_loss": -9.526962280273438, "global_step": 102117, "epoch": 607} {"train_loss": -9.403436660766602, "global_step": 102118, "epoch": 607} {"train_loss": -9.548368453979492, "global_step": 102119, "epoch": 607} {"train_loss": -9.273534774780273, "global_step": 102120, "epoch": 607} {"train_loss": -9.466758728027344, "global_step": 102121, "epoch": 607} {"train_loss": -9.400123596191406, "global_step": 102122, "epoch": 607} {"train_loss": -9.348325729370117, "global_step": 102123, "epoch": 607} {"train_loss": -9.598701477050781, "global_step": 102124, "epoch": 607} {"train_loss": -9.22393798828125, "global_step": 102125, "epoch": 607} {"train_loss": -9.602190017700195, "global_step": 102126, "epoch": 607} {"train_loss": -9.677377700805664, "global_step": 102127, "epoch": 607} {"train_loss": -9.442352294921875, "global_step": 102128, "epoch": 607} {"train_loss": -9.404305458068848, "global_step": 102129, "epoch": 607} {"train_loss": -9.760528564453125, "global_step": 102130, "epoch": 607} {"train_loss": -9.545862197875977, "global_step": 102131, "epoch": 607} {"train_loss": -9.854354858398438, "global_step": 102132, "epoch": 607} {"train_loss": -9.732671737670898, "global_step": 102133, "epoch": 607} {"train_loss": -9.83473014831543, "global_step": 102134, "epoch": 607} {"train_loss": -9.854333877563477, "global_step": 102135, "epoch": 607} {"train_loss": -9.81938362121582, "global_step": 102136, "epoch": 607} {"train_loss": -9.793197631835938, "global_step": 102137, "epoch": 607} {"train_loss": -9.686803817749023, "global_step": 102138, "epoch": 607} {"train_loss": -9.773324012756348, "global_step": 102139, "epoch": 607} {"train_loss": -9.919772148132324, "global_step": 102140, "epoch": 607} {"train_loss": -9.704055786132812, "global_step": 102141, "epoch": 607} {"train_loss": -9.878877639770508, "global_step": 102142, "epoch": 607} {"train_loss": -9.746384416307722, "global_step": 102143, "epoch": 607, "val_loss": 206467.28125} {"train_loss": -9.664304733276367, "global_step": 102144, "epoch": 608} {"train_loss": -9.767799377441406, "global_step": 102145, "epoch": 608} {"train_loss": -9.825031280517578, "global_step": 102146, "epoch": 608} {"train_loss": -9.879085540771484, "global_step": 102147, "epoch": 608} {"train_loss": -10.05456829071045, "global_step": 102148, "epoch": 608} {"train_loss": -9.84592056274414, "global_step": 102149, "epoch": 608} {"train_loss": -9.959062576293945, "global_step": 102150, "epoch": 608} {"train_loss": -9.828787803649902, "global_step": 102151, "epoch": 608} {"train_loss": -9.89992904663086, "global_step": 102152, "epoch": 608} {"train_loss": -10.021753311157227, "global_step": 102153, "epoch": 608} {"train_loss": -9.987756729125977, "global_step": 102154, "epoch": 608} {"train_loss": -9.917757034301758, "global_step": 102155, "epoch": 608} {"train_loss": -9.954513549804688, "global_step": 102156, "epoch": 608} {"train_loss": -9.817136764526367, "global_step": 102157, "epoch": 608} {"train_loss": -9.803314208984375, "global_step": 102158, "epoch": 608} {"train_loss": -10.169867515563965, "global_step": 102159, "epoch": 608} {"train_loss": -9.762760162353516, "global_step": 102160, "epoch": 608} {"train_loss": -10.031272888183594, "global_step": 102161, "epoch": 608} {"train_loss": -9.982410430908203, "global_step": 102162, "epoch": 608} {"train_loss": -9.874713897705078, "global_step": 102163, "epoch": 608} {"train_loss": -9.97852897644043, "global_step": 102164, "epoch": 608} {"train_loss": -9.869792938232422, "global_step": 102165, "epoch": 608} {"train_loss": -9.573904037475586, "global_step": 102166, "epoch": 608} {"train_loss": -9.783266067504883, "global_step": 102167, "epoch": 608} {"train_loss": -9.859054565429688, "global_step": 102168, "epoch": 608} {"train_loss": -9.26445484161377, "global_step": 102169, "epoch": 608} {"train_loss": -9.53683853149414, "global_step": 102170, "epoch": 608} {"train_loss": -9.523029327392578, "global_step": 102171, "epoch": 608} {"train_loss": -9.745893478393555, "global_step": 102172, "epoch": 608} {"train_loss": -9.38217544555664, "global_step": 102173, "epoch": 608} {"train_loss": -9.212639808654785, "global_step": 102174, "epoch": 608} {"train_loss": -9.636104583740234, "global_step": 102175, "epoch": 608} {"train_loss": -9.50361442565918, "global_step": 102176, "epoch": 608} {"train_loss": -9.588709831237793, "global_step": 102177, "epoch": 608} {"train_loss": -9.468523025512695, "global_step": 102178, "epoch": 608} {"train_loss": -9.37913990020752, "global_step": 102179, "epoch": 608} {"train_loss": -9.692523956298828, "global_step": 102180, "epoch": 608} {"train_loss": -9.465980529785156, "global_step": 102181, "epoch": 608} {"train_loss": -9.586322784423828, "global_step": 102182, "epoch": 608} {"train_loss": -9.881231307983398, "global_step": 102183, "epoch": 608} {"train_loss": -9.422882080078125, "global_step": 102184, "epoch": 608} {"train_loss": -9.810761451721191, "global_step": 102185, "epoch": 608} {"train_loss": -9.48959732055664, "global_step": 102186, "epoch": 608} {"train_loss": -9.58266830444336, "global_step": 102187, "epoch": 608} {"train_loss": -9.77126407623291, "global_step": 102188, "epoch": 608} {"train_loss": -9.492857933044434, "global_step": 102189, "epoch": 608} {"train_loss": -9.72455883026123, "global_step": 102190, "epoch": 608} {"train_loss": -9.824034690856934, "global_step": 102191, "epoch": 608} {"train_loss": -9.767210006713867, "global_step": 102192, "epoch": 608} {"train_loss": -10.002748489379883, "global_step": 102193, "epoch": 608} {"train_loss": -9.698768615722656, "global_step": 102194, "epoch": 608} {"train_loss": -9.996383666992188, "global_step": 102195, "epoch": 608} {"train_loss": -9.844552993774414, "global_step": 102196, "epoch": 608} {"train_loss": -9.67020034790039, "global_step": 102197, "epoch": 608} {"train_loss": -9.521175384521484, "global_step": 102198, "epoch": 608} {"train_loss": -9.78856086730957, "global_step": 102199, "epoch": 608} {"train_loss": -9.900660514831543, "global_step": 102200, "epoch": 608} {"train_loss": -9.752846717834473, "global_step": 102201, "epoch": 608} {"train_loss": -9.838383674621582, "global_step": 102202, "epoch": 608} {"train_loss": -9.788778305053711, "global_step": 102203, "epoch": 608} {"train_loss": -9.72735595703125, "global_step": 102204, "epoch": 608} {"train_loss": -9.635152816772461, "global_step": 102205, "epoch": 608} {"train_loss": -9.606219291687012, "global_step": 102206, "epoch": 608} {"train_loss": -9.542106628417969, "global_step": 102207, "epoch": 608} {"train_loss": -9.935688972473145, "global_step": 102208, "epoch": 608} {"train_loss": -9.769719123840332, "global_step": 102209, "epoch": 608} {"train_loss": -9.92648983001709, "global_step": 102210, "epoch": 608} {"train_loss": -10.152342796325684, "global_step": 102211, "epoch": 608} {"train_loss": -9.793903350830078, "global_step": 102212, "epoch": 608} {"train_loss": -9.717665672302246, "global_step": 102213, "epoch": 608} {"train_loss": -10.104435920715332, "global_step": 102214, "epoch": 608} {"train_loss": -9.798192024230957, "global_step": 102215, "epoch": 608} {"train_loss": -9.786579132080078, "global_step": 102216, "epoch": 608} {"train_loss": -9.432043075561523, "global_step": 102217, "epoch": 608} {"train_loss": -9.711905479431152, "global_step": 102218, "epoch": 608} {"train_loss": -9.177932739257812, "global_step": 102219, "epoch": 608} {"train_loss": -9.45293140411377, "global_step": 102220, "epoch": 608} {"train_loss": -9.41139030456543, "global_step": 102221, "epoch": 608} {"train_loss": -9.798866271972656, "global_step": 102222, "epoch": 608} {"train_loss": -9.323356628417969, "global_step": 102223, "epoch": 608} {"train_loss": -9.198248863220215, "global_step": 102224, "epoch": 608} {"train_loss": -9.635053634643555, "global_step": 102225, "epoch": 608} {"train_loss": -9.529912948608398, "global_step": 102226, "epoch": 608} {"train_loss": -9.694028854370117, "global_step": 102227, "epoch": 608} {"train_loss": -9.613897323608398, "global_step": 102228, "epoch": 608} {"train_loss": -9.791576385498047, "global_step": 102229, "epoch": 608} {"train_loss": -9.693521499633789, "global_step": 102230, "epoch": 608} {"train_loss": -9.84019660949707, "global_step": 102231, "epoch": 608} {"train_loss": -9.691930770874023, "global_step": 102232, "epoch": 608} {"train_loss": -9.614629745483398, "global_step": 102233, "epoch": 608} {"train_loss": -9.739311218261719, "global_step": 102234, "epoch": 608} {"train_loss": -9.522537231445312, "global_step": 102235, "epoch": 608} {"train_loss": -9.741607666015625, "global_step": 102236, "epoch": 608} {"train_loss": -9.857864379882812, "global_step": 102237, "epoch": 608} {"train_loss": -9.541313171386719, "global_step": 102238, "epoch": 608} {"train_loss": -9.920343399047852, "global_step": 102239, "epoch": 608} {"train_loss": -9.886423110961914, "global_step": 102240, "epoch": 608} {"train_loss": -9.764976501464844, "global_step": 102241, "epoch": 608} {"train_loss": -10.03149127960205, "global_step": 102242, "epoch": 608} {"train_loss": -9.69986343383789, "global_step": 102243, "epoch": 608} {"train_loss": -9.808767318725586, "global_step": 102244, "epoch": 608} {"train_loss": -9.975386619567871, "global_step": 102245, "epoch": 608} {"train_loss": -9.70266342163086, "global_step": 102246, "epoch": 608} {"train_loss": -9.998590469360352, "global_step": 102247, "epoch": 608} {"train_loss": -9.849388122558594, "global_step": 102248, "epoch": 608} {"train_loss": -10.028472900390625, "global_step": 102249, "epoch": 608} {"train_loss": -9.944912910461426, "global_step": 102250, "epoch": 608} {"train_loss": -10.026498794555664, "global_step": 102251, "epoch": 608} {"train_loss": -9.664648056030273, "global_step": 102252, "epoch": 608} {"train_loss": -10.039085388183594, "global_step": 102253, "epoch": 608} {"train_loss": -9.833307266235352, "global_step": 102254, "epoch": 608} {"train_loss": -9.636449813842773, "global_step": 102255, "epoch": 608} {"train_loss": -9.974455833435059, "global_step": 102256, "epoch": 608} {"train_loss": -9.618021011352539, "global_step": 102257, "epoch": 608} {"train_loss": -10.033706665039062, "global_step": 102258, "epoch": 608} {"train_loss": -9.732711791992188, "global_step": 102259, "epoch": 608} {"train_loss": -9.759929656982422, "global_step": 102260, "epoch": 608} {"train_loss": -9.825180053710938, "global_step": 102261, "epoch": 608} {"train_loss": -9.616205215454102, "global_step": 102262, "epoch": 608} {"train_loss": -9.883289337158203, "global_step": 102263, "epoch": 608} {"train_loss": -9.812973022460938, "global_step": 102264, "epoch": 608} {"train_loss": -10.100424766540527, "global_step": 102265, "epoch": 608} {"train_loss": -10.086453437805176, "global_step": 102266, "epoch": 608} {"train_loss": -9.887279510498047, "global_step": 102267, "epoch": 608} {"train_loss": -9.916343688964844, "global_step": 102268, "epoch": 608} {"train_loss": -9.79896354675293, "global_step": 102269, "epoch": 608} {"train_loss": -9.910672187805176, "global_step": 102270, "epoch": 608} {"train_loss": -9.654820442199707, "global_step": 102271, "epoch": 608} {"train_loss": -9.755102157592773, "global_step": 102272, "epoch": 608} {"train_loss": -9.537693977355957, "global_step": 102273, "epoch": 608} {"train_loss": -9.965097427368164, "global_step": 102274, "epoch": 608} {"train_loss": -9.770009994506836, "global_step": 102275, "epoch": 608} {"train_loss": -9.344993591308594, "global_step": 102276, "epoch": 608} {"train_loss": -9.846580505371094, "global_step": 102277, "epoch": 608} {"train_loss": -9.416641235351562, "global_step": 102278, "epoch": 608} {"train_loss": -9.91435432434082, "global_step": 102279, "epoch": 608} {"train_loss": -9.525247573852539, "global_step": 102280, "epoch": 608} {"train_loss": -9.909725189208984, "global_step": 102281, "epoch": 608} {"train_loss": -9.736396789550781, "global_step": 102282, "epoch": 608} {"train_loss": -9.82418441772461, "global_step": 102283, "epoch": 608} {"train_loss": -9.942909240722656, "global_step": 102284, "epoch": 608} {"train_loss": -9.767712593078613, "global_step": 102285, "epoch": 608} {"train_loss": -9.779916763305664, "global_step": 102286, "epoch": 608} {"train_loss": -10.175861358642578, "global_step": 102287, "epoch": 608} {"train_loss": -9.595609664916992, "global_step": 102288, "epoch": 608} {"train_loss": -9.59360408782959, "global_step": 102289, "epoch": 608} {"train_loss": -9.472436904907227, "global_step": 102290, "epoch": 608} {"train_loss": -9.298107147216797, "global_step": 102291, "epoch": 608} {"train_loss": -9.494300842285156, "global_step": 102292, "epoch": 608} {"train_loss": -8.83871078491211, "global_step": 102293, "epoch": 608} {"train_loss": -8.856756210327148, "global_step": 102294, "epoch": 608} {"train_loss": -8.747777938842773, "global_step": 102295, "epoch": 608} {"train_loss": -9.007547378540039, "global_step": 102296, "epoch": 608} {"train_loss": -8.978012084960938, "global_step": 102297, "epoch": 608} {"train_loss": -9.131325721740723, "global_step": 102298, "epoch": 608} {"train_loss": -9.081924438476562, "global_step": 102299, "epoch": 608} {"train_loss": -9.069517135620117, "global_step": 102300, "epoch": 608} {"train_loss": -9.30412483215332, "global_step": 102301, "epoch": 608} {"train_loss": -9.176037788391113, "global_step": 102302, "epoch": 608} {"train_loss": -9.540352821350098, "global_step": 102303, "epoch": 608} {"train_loss": -9.420284271240234, "global_step": 102304, "epoch": 608} {"train_loss": -9.59363842010498, "global_step": 102305, "epoch": 608} {"train_loss": -9.65726375579834, "global_step": 102306, "epoch": 608} {"train_loss": -9.311956405639648, "global_step": 102307, "epoch": 608} {"train_loss": -9.564000129699707, "global_step": 102308, "epoch": 608} {"train_loss": -9.53969955444336, "global_step": 102309, "epoch": 608} {"train_loss": -9.532620429992676, "global_step": 102310, "epoch": 608} {"train_loss": -9.691282113393148, "global_step": 102311, "epoch": 608, "val_loss": 205684.828125} {"train_loss": -9.793615341186523, "global_step": 102312, "epoch": 609} {"train_loss": -9.550689697265625, "global_step": 102313, "epoch": 609} {"train_loss": -9.484596252441406, "global_step": 102314, "epoch": 609} {"train_loss": -9.719531059265137, "global_step": 102315, "epoch": 609} {"train_loss": -9.564680099487305, "global_step": 102316, "epoch": 609} {"train_loss": -9.598549842834473, "global_step": 102317, "epoch": 609} {"train_loss": -9.580232620239258, "global_step": 102318, "epoch": 609} {"train_loss": -9.840887069702148, "global_step": 102319, "epoch": 609} {"train_loss": -9.843241691589355, "global_step": 102320, "epoch": 609} {"train_loss": -9.834226608276367, "global_step": 102321, "epoch": 609} {"train_loss": -9.722829818725586, "global_step": 102322, "epoch": 609} {"train_loss": -9.71446418762207, "global_step": 102323, "epoch": 609} {"train_loss": -9.847328186035156, "global_step": 102324, "epoch": 609} {"train_loss": -9.709766387939453, "global_step": 102325, "epoch": 609} {"train_loss": -9.788843154907227, "global_step": 102326, "epoch": 609} {"train_loss": -9.700777053833008, "global_step": 102327, "epoch": 609} {"train_loss": -9.964271545410156, "global_step": 102328, "epoch": 609} {"train_loss": -9.797517776489258, "global_step": 102329, "epoch": 609} {"train_loss": -9.94179630279541, "global_step": 102330, "epoch": 609} {"train_loss": -9.879048347473145, "global_step": 102331, "epoch": 609} {"train_loss": -9.95950984954834, "global_step": 102332, "epoch": 609} {"train_loss": -10.011238098144531, "global_step": 102333, "epoch": 609} {"train_loss": -10.085071563720703, "global_step": 102334, "epoch": 609} {"train_loss": -9.762271881103516, "global_step": 102335, "epoch": 609} {"train_loss": -10.096744537353516, "global_step": 102336, "epoch": 609} {"train_loss": -10.029075622558594, "global_step": 102337, "epoch": 609} {"train_loss": -10.043697357177734, "global_step": 102338, "epoch": 609} {"train_loss": -9.92839527130127, "global_step": 102339, "epoch": 609} {"train_loss": -10.056625366210938, "global_step": 102340, "epoch": 609} {"train_loss": -9.814924240112305, "global_step": 102341, "epoch": 609} {"train_loss": -9.46147346496582, "global_step": 102342, "epoch": 609} {"train_loss": -9.911846160888672, "global_step": 102343, "epoch": 609} {"train_loss": -9.923181533813477, "global_step": 102344, "epoch": 609} {"train_loss": -9.713570594787598, "global_step": 102345, "epoch": 609} {"train_loss": -9.956273078918457, "global_step": 102346, "epoch": 609} {"train_loss": -9.950793266296387, "global_step": 102347, "epoch": 609} {"train_loss": -9.855956077575684, "global_step": 102348, "epoch": 609} {"train_loss": -8.844441413879395, "global_step": 102349, "epoch": 609} {"train_loss": -8.942144393920898, "global_step": 102350, "epoch": 609} {"train_loss": -9.407763481140137, "global_step": 102351, "epoch": 609} {"train_loss": -8.40986442565918, "global_step": 102352, "epoch": 609} {"train_loss": -9.402341842651367, "global_step": 102353, "epoch": 609} {"train_loss": -8.560153007507324, "global_step": 102354, "epoch": 609} {"train_loss": -9.140946388244629, "global_step": 102355, "epoch": 609} {"train_loss": -8.98973274230957, "global_step": 102356, "epoch": 609} {"train_loss": -8.813443183898926, "global_step": 102357, "epoch": 609} {"train_loss": -9.243160247802734, "global_step": 102358, "epoch": 609} {"train_loss": -8.721220970153809, "global_step": 102359, "epoch": 609} {"train_loss": -9.06088924407959, "global_step": 102360, "epoch": 609} {"train_loss": -9.186676025390625, "global_step": 102361, "epoch": 609} {"train_loss": -9.365509033203125, "global_step": 102362, "epoch": 609} {"train_loss": -9.443257331848145, "global_step": 102363, "epoch": 609} {"train_loss": -9.136695861816406, "global_step": 102364, "epoch": 609} {"train_loss": -9.45164680480957, "global_step": 102365, "epoch": 609} {"train_loss": -9.355141639709473, "global_step": 102366, "epoch": 609} {"train_loss": -9.043558120727539, "global_step": 102367, "epoch": 609} {"train_loss": -8.983297348022461, "global_step": 102368, "epoch": 609} {"train_loss": -9.361822128295898, "global_step": 102369, "epoch": 609} {"train_loss": -9.385812759399414, "global_step": 102370, "epoch": 609} {"train_loss": -9.233880996704102, "global_step": 102371, "epoch": 609} {"train_loss": -9.261093139648438, "global_step": 102372, "epoch": 609} {"train_loss": -9.48714542388916, "global_step": 102373, "epoch": 609} {"train_loss": -9.583025932312012, "global_step": 102374, "epoch": 609} {"train_loss": -9.416032791137695, "global_step": 102375, "epoch": 609} {"train_loss": -9.422362327575684, "global_step": 102376, "epoch": 609} {"train_loss": -9.625617980957031, "global_step": 102377, "epoch": 609} {"train_loss": -9.567988395690918, "global_step": 102378, "epoch": 609} {"train_loss": -9.326714515686035, "global_step": 102379, "epoch": 609} {"train_loss": -9.676952362060547, "global_step": 102380, "epoch": 609} {"train_loss": -9.666742324829102, "global_step": 102381, "epoch": 609} {"train_loss": -9.605608940124512, "global_step": 102382, "epoch": 609} {"train_loss": -9.793229103088379, "global_step": 102383, "epoch": 609} {"train_loss": -9.620723724365234, "global_step": 102384, "epoch": 609} {"train_loss": -9.696786880493164, "global_step": 102385, "epoch": 609} {"train_loss": -9.689964294433594, "global_step": 102386, "epoch": 609} {"train_loss": -9.624672889709473, "global_step": 102387, "epoch": 609} {"train_loss": -9.721349716186523, "global_step": 102388, "epoch": 609} {"train_loss": -9.678979873657227, "global_step": 102389, "epoch": 609} {"train_loss": -9.691011428833008, "global_step": 102390, "epoch": 609} {"train_loss": -9.859415054321289, "global_step": 102391, "epoch": 609} {"train_loss": -9.414701461791992, "global_step": 102392, "epoch": 609} {"train_loss": -9.67872142791748, "global_step": 102393, "epoch": 609} {"train_loss": -9.54201602935791, "global_step": 102394, "epoch": 609} {"train_loss": -9.676728248596191, "global_step": 102395, "epoch": 609} {"train_loss": -10.020746231079102, "global_step": 102396, "epoch": 609} {"train_loss": -9.5358304977417, "global_step": 102397, "epoch": 609} {"train_loss": -9.643560409545898, "global_step": 102398, "epoch": 609} {"train_loss": -9.743438720703125, "global_step": 102399, "epoch": 609} {"train_loss": -9.691774368286133, "global_step": 102400, "epoch": 609} {"train_loss": -9.753881454467773, "global_step": 102401, "epoch": 609} {"train_loss": -9.715295791625977, "global_step": 102402, "epoch": 609} {"train_loss": -9.85546588897705, "global_step": 102403, "epoch": 609} {"train_loss": -9.98483657836914, "global_step": 102404, "epoch": 609} {"train_loss": -9.922416687011719, "global_step": 102405, "epoch": 609} {"train_loss": -9.63339614868164, "global_step": 102406, "epoch": 609} {"train_loss": -9.995140075683594, "global_step": 102407, "epoch": 609} {"train_loss": -9.645584106445312, "global_step": 102408, "epoch": 609} {"train_loss": -9.933952331542969, "global_step": 102409, "epoch": 609} {"train_loss": -9.767004013061523, "global_step": 102410, "epoch": 609} {"train_loss": -9.182684898376465, "global_step": 102411, "epoch": 609} {"train_loss": -9.85365104675293, "global_step": 102412, "epoch": 609} {"train_loss": -9.51120376586914, "global_step": 102413, "epoch": 609} {"train_loss": -9.857471466064453, "global_step": 102414, "epoch": 609} {"train_loss": -9.71706485748291, "global_step": 102415, "epoch": 609} {"train_loss": -9.975767135620117, "global_step": 102416, "epoch": 609} {"train_loss": -9.961864471435547, "global_step": 102417, "epoch": 609} {"train_loss": -9.796427726745605, "global_step": 102418, "epoch": 609} {"train_loss": -9.748271942138672, "global_step": 102419, "epoch": 609} {"train_loss": -9.945439338684082, "global_step": 102420, "epoch": 609} {"train_loss": -9.554611206054688, "global_step": 102421, "epoch": 609} {"train_loss": -9.752388954162598, "global_step": 102422, "epoch": 609} {"train_loss": -9.905227661132812, "global_step": 102423, "epoch": 609} {"train_loss": -9.372518539428711, "global_step": 102424, "epoch": 609} {"train_loss": -10.041631698608398, "global_step": 102425, "epoch": 609} {"train_loss": -9.568624496459961, "global_step": 102426, "epoch": 609} {"train_loss": -9.847147941589355, "global_step": 102427, "epoch": 609} {"train_loss": -9.496649742126465, "global_step": 102428, "epoch": 609} {"train_loss": -9.68977165222168, "global_step": 102429, "epoch": 609} {"train_loss": -10.000082015991211, "global_step": 102430, "epoch": 609} {"train_loss": -9.69462776184082, "global_step": 102431, "epoch": 609} {"train_loss": -9.787246704101562, "global_step": 102432, "epoch": 609} {"train_loss": -9.557896614074707, "global_step": 102433, "epoch": 609} {"train_loss": -9.659721374511719, "global_step": 102434, "epoch": 609} {"train_loss": -9.955486297607422, "global_step": 102435, "epoch": 609} {"train_loss": -9.867076873779297, "global_step": 102436, "epoch": 609} {"train_loss": -9.786907196044922, "global_step": 102437, "epoch": 609} {"train_loss": -9.703882217407227, "global_step": 102438, "epoch": 609} {"train_loss": -10.160589218139648, "global_step": 102439, "epoch": 609} {"train_loss": -9.880443572998047, "global_step": 102440, "epoch": 609} {"train_loss": -10.161605834960938, "global_step": 102441, "epoch": 609} {"train_loss": -9.978168487548828, "global_step": 102442, "epoch": 609} {"train_loss": -9.635669708251953, "global_step": 102443, "epoch": 609} {"train_loss": -9.678022384643555, "global_step": 102444, "epoch": 609} {"train_loss": -9.983850479125977, "global_step": 102445, "epoch": 609} {"train_loss": -9.937677383422852, "global_step": 102446, "epoch": 609} {"train_loss": -9.939173698425293, "global_step": 102447, "epoch": 609} {"train_loss": -9.72212028503418, "global_step": 102448, "epoch": 609} {"train_loss": -10.010438919067383, "global_step": 102449, "epoch": 609} {"train_loss": -9.66224479675293, "global_step": 102450, "epoch": 609} {"train_loss": -9.67158317565918, "global_step": 102451, "epoch": 609} {"train_loss": -10.262722969055176, "global_step": 102452, "epoch": 609} {"train_loss": -9.965179443359375, "global_step": 102453, "epoch": 609} {"train_loss": -9.930130004882812, "global_step": 102454, "epoch": 609} {"train_loss": -9.798916816711426, "global_step": 102455, "epoch": 609} {"train_loss": -9.713441848754883, "global_step": 102456, "epoch": 609} {"train_loss": -9.580060958862305, "global_step": 102457, "epoch": 609} {"train_loss": -9.432906150817871, "global_step": 102458, "epoch": 609} {"train_loss": -9.83338737487793, "global_step": 102459, "epoch": 609} {"train_loss": -9.582358360290527, "global_step": 102460, "epoch": 609} {"train_loss": -9.65298843383789, "global_step": 102461, "epoch": 609} {"train_loss": -9.605353355407715, "global_step": 102462, "epoch": 609} {"train_loss": -9.794576644897461, "global_step": 102463, "epoch": 609} {"train_loss": -9.199463844299316, "global_step": 102464, "epoch": 609} {"train_loss": -9.204215049743652, "global_step": 102465, "epoch": 609} {"train_loss": -9.856800079345703, "global_step": 102466, "epoch": 609} {"train_loss": -9.284586906433105, "global_step": 102467, "epoch": 609} {"train_loss": -9.905023574829102, "global_step": 102468, "epoch": 609} {"train_loss": -9.355666160583496, "global_step": 102469, "epoch": 609} {"train_loss": -9.568885803222656, "global_step": 102470, "epoch": 609} {"train_loss": -9.74567985534668, "global_step": 102471, "epoch": 609} {"train_loss": -9.4371976852417, "global_step": 102472, "epoch": 609} {"train_loss": -9.407565116882324, "global_step": 102473, "epoch": 609} {"train_loss": -9.569171905517578, "global_step": 102474, "epoch": 609} {"train_loss": -9.491711616516113, "global_step": 102475, "epoch": 609} {"train_loss": -9.61009407043457, "global_step": 102476, "epoch": 609} {"train_loss": -9.530957221984863, "global_step": 102477, "epoch": 609} {"train_loss": -9.732144355773926, "global_step": 102478, "epoch": 609} {"train_loss": -9.645492695626759, "global_step": 102479, "epoch": 609, "val_loss": 208380.609375} {"train_loss": -9.685747146606445, "global_step": 102480, "epoch": 610} {"train_loss": -9.575459480285645, "global_step": 102481, "epoch": 610} {"train_loss": -9.487686157226562, "global_step": 102482, "epoch": 610} {"train_loss": -9.415973663330078, "global_step": 102483, "epoch": 610} {"train_loss": -9.362447738647461, "global_step": 102484, "epoch": 610} {"train_loss": -9.659149169921875, "global_step": 102485, "epoch": 610} {"train_loss": -9.381669998168945, "global_step": 102486, "epoch": 610} {"train_loss": -9.621617317199707, "global_step": 102487, "epoch": 610} {"train_loss": -9.484746932983398, "global_step": 102488, "epoch": 610} {"train_loss": -9.791104316711426, "global_step": 102489, "epoch": 610} {"train_loss": -9.594059944152832, "global_step": 102490, "epoch": 610} {"train_loss": -9.66316032409668, "global_step": 102491, "epoch": 610} {"train_loss": -9.526290893554688, "global_step": 102492, "epoch": 610} {"train_loss": -9.590374946594238, "global_step": 102493, "epoch": 610} {"train_loss": -9.837430953979492, "global_step": 102494, "epoch": 610} {"train_loss": -9.709531784057617, "global_step": 102495, "epoch": 610} {"train_loss": -9.684837341308594, "global_step": 102496, "epoch": 610} {"train_loss": -9.84630012512207, "global_step": 102497, "epoch": 610} {"train_loss": -9.904430389404297, "global_step": 102498, "epoch": 610} {"train_loss": -9.857054710388184, "global_step": 102499, "epoch": 610} {"train_loss": -10.072641372680664, "global_step": 102500, "epoch": 610} {"train_loss": -9.79968547821045, "global_step": 102501, "epoch": 610} {"train_loss": -10.024209022521973, "global_step": 102502, "epoch": 610} {"train_loss": -9.767768859863281, "global_step": 102503, "epoch": 610} {"train_loss": -9.543142318725586, "global_step": 102504, "epoch": 610} {"train_loss": -10.034258842468262, "global_step": 102505, "epoch": 610} {"train_loss": -9.706165313720703, "global_step": 102506, "epoch": 610} {"train_loss": -9.903759956359863, "global_step": 102507, "epoch": 610} {"train_loss": -9.919190406799316, "global_step": 102508, "epoch": 610} {"train_loss": -9.921186447143555, "global_step": 102509, "epoch": 610} {"train_loss": -9.965219497680664, "global_step": 102510, "epoch": 610} {"train_loss": -9.71182918548584, "global_step": 102511, "epoch": 610} {"train_loss": -9.817514419555664, "global_step": 102512, "epoch": 610} {"train_loss": -9.887567520141602, "global_step": 102513, "epoch": 610} {"train_loss": -9.905029296875, "global_step": 102514, "epoch": 610} {"train_loss": -9.971866607666016, "global_step": 102515, "epoch": 610} {"train_loss": -10.090028762817383, "global_step": 102516, "epoch": 610} {"train_loss": -9.936452865600586, "global_step": 102517, "epoch": 610} {"train_loss": -9.831913948059082, "global_step": 102518, "epoch": 610} {"train_loss": -9.78022575378418, "global_step": 102519, "epoch": 610} {"train_loss": -9.71187973022461, "global_step": 102520, "epoch": 610} {"train_loss": -9.746746063232422, "global_step": 102521, "epoch": 610} {"train_loss": -9.760945320129395, "global_step": 102522, "epoch": 610} {"train_loss": -9.747888565063477, "global_step": 102523, "epoch": 610} {"train_loss": -9.380327224731445, "global_step": 102524, "epoch": 610} {"train_loss": -10.122894287109375, "global_step": 102525, "epoch": 610} {"train_loss": -9.442619323730469, "global_step": 102526, "epoch": 610} {"train_loss": -9.734203338623047, "global_step": 102527, "epoch": 610} {"train_loss": -9.683645248413086, "global_step": 102528, "epoch": 610} {"train_loss": -9.566788673400879, "global_step": 102529, "epoch": 610} {"train_loss": -9.639699935913086, "global_step": 102530, "epoch": 610} {"train_loss": -9.544170379638672, "global_step": 102531, "epoch": 610} {"train_loss": -9.698253631591797, "global_step": 102532, "epoch": 610} {"train_loss": -9.937761306762695, "global_step": 102533, "epoch": 610} {"train_loss": -9.628242492675781, "global_step": 102534, "epoch": 610} {"train_loss": -9.805551528930664, "global_step": 102535, "epoch": 610} {"train_loss": -9.826486587524414, "global_step": 102536, "epoch": 610} {"train_loss": -9.920180320739746, "global_step": 102537, "epoch": 610} {"train_loss": -9.549768447875977, "global_step": 102538, "epoch": 610} {"train_loss": -9.572172164916992, "global_step": 102539, "epoch": 610} {"train_loss": -9.506111145019531, "global_step": 102540, "epoch": 610} {"train_loss": -9.739727020263672, "global_step": 102541, "epoch": 610} {"train_loss": -9.369047164916992, "global_step": 102542, "epoch": 610} {"train_loss": -9.418197631835938, "global_step": 102543, "epoch": 610} {"train_loss": -9.72550106048584, "global_step": 102544, "epoch": 610} {"train_loss": -9.574483871459961, "global_step": 102545, "epoch": 610} {"train_loss": -9.620867729187012, "global_step": 102546, "epoch": 610} {"train_loss": -10.007078170776367, "global_step": 102547, "epoch": 610} {"train_loss": -9.811471939086914, "global_step": 102548, "epoch": 610} {"train_loss": -9.806391716003418, "global_step": 102549, "epoch": 610} {"train_loss": -9.780425071716309, "global_step": 102550, "epoch": 610} {"train_loss": -9.85495376586914, "global_step": 102551, "epoch": 610} {"train_loss": -10.020655632019043, "global_step": 102552, "epoch": 610} {"train_loss": -9.851421356201172, "global_step": 102553, "epoch": 610} {"train_loss": -9.429337501525879, "global_step": 102554, "epoch": 610} {"train_loss": -9.765332221984863, "global_step": 102555, "epoch": 610} {"train_loss": -9.701740264892578, "global_step": 102556, "epoch": 610} {"train_loss": -10.040348052978516, "global_step": 102557, "epoch": 610} {"train_loss": -9.741169929504395, "global_step": 102558, "epoch": 610} {"train_loss": -9.59260082244873, "global_step": 102559, "epoch": 610} {"train_loss": -9.794652938842773, "global_step": 102560, "epoch": 610} {"train_loss": -9.756189346313477, "global_step": 102561, "epoch": 610} {"train_loss": -9.83443832397461, "global_step": 102562, "epoch": 610} {"train_loss": -9.84153938293457, "global_step": 102563, "epoch": 610} {"train_loss": -9.624454498291016, "global_step": 102564, "epoch": 610} {"train_loss": -10.101261138916016, "global_step": 102565, "epoch": 610} {"train_loss": -9.520780563354492, "global_step": 102566, "epoch": 610} {"train_loss": -9.488393783569336, "global_step": 102567, "epoch": 610} {"train_loss": -9.687614440917969, "global_step": 102568, "epoch": 610} {"train_loss": -9.564473152160645, "global_step": 102569, "epoch": 610} {"train_loss": -9.537129402160645, "global_step": 102570, "epoch": 610} {"train_loss": -9.628253936767578, "global_step": 102571, "epoch": 610} {"train_loss": -9.905497550964355, "global_step": 102572, "epoch": 610} {"train_loss": -9.522239685058594, "global_step": 102573, "epoch": 610} {"train_loss": -9.920429229736328, "global_step": 102574, "epoch": 610} {"train_loss": -9.413965225219727, "global_step": 102575, "epoch": 610} {"train_loss": -9.919736862182617, "global_step": 102576, "epoch": 610} {"train_loss": -9.570691108703613, "global_step": 102577, "epoch": 610} {"train_loss": -9.91227912902832, "global_step": 102578, "epoch": 610} {"train_loss": -9.769287109375, "global_step": 102579, "epoch": 610} {"train_loss": -9.552627563476562, "global_step": 102580, "epoch": 610} {"train_loss": -9.910826683044434, "global_step": 102581, "epoch": 610} {"train_loss": -9.55790901184082, "global_step": 102582, "epoch": 610} {"train_loss": -9.844258308410645, "global_step": 102583, "epoch": 610} {"train_loss": -9.757329940795898, "global_step": 102584, "epoch": 610} {"train_loss": -9.69642448425293, "global_step": 102585, "epoch": 610} {"train_loss": -9.732178688049316, "global_step": 102586, "epoch": 610} {"train_loss": -9.582154273986816, "global_step": 102587, "epoch": 610} {"train_loss": -9.638322830200195, "global_step": 102588, "epoch": 610} {"train_loss": -9.69968032836914, "global_step": 102589, "epoch": 610} {"train_loss": -9.771932601928711, "global_step": 102590, "epoch": 610} {"train_loss": -9.472360610961914, "global_step": 102591, "epoch": 610} {"train_loss": -9.829282760620117, "global_step": 102592, "epoch": 610} {"train_loss": -9.686163902282715, "global_step": 102593, "epoch": 610} {"train_loss": -9.74993896484375, "global_step": 102594, "epoch": 610} {"train_loss": -9.657844543457031, "global_step": 102595, "epoch": 610} {"train_loss": -9.576515197753906, "global_step": 102596, "epoch": 610} {"train_loss": -9.582504272460938, "global_step": 102597, "epoch": 610} {"train_loss": -9.637530326843262, "global_step": 102598, "epoch": 610} {"train_loss": -9.87921142578125, "global_step": 102599, "epoch": 610} {"train_loss": -9.742822647094727, "global_step": 102600, "epoch": 610} {"train_loss": -9.894330024719238, "global_step": 102601, "epoch": 610} {"train_loss": -9.618518829345703, "global_step": 102602, "epoch": 610} {"train_loss": -9.907112121582031, "global_step": 102603, "epoch": 610} {"train_loss": -9.734375, "global_step": 102604, "epoch": 610} {"train_loss": -9.909049034118652, "global_step": 102605, "epoch": 610} {"train_loss": -9.767048835754395, "global_step": 102606, "epoch": 610} {"train_loss": -9.97913646697998, "global_step": 102607, "epoch": 610} {"train_loss": -9.662944793701172, "global_step": 102608, "epoch": 610} {"train_loss": -10.063617706298828, "global_step": 102609, "epoch": 610} {"train_loss": -9.94171142578125, "global_step": 102610, "epoch": 610} {"train_loss": -9.862421035766602, "global_step": 102611, "epoch": 610} {"train_loss": -9.925373077392578, "global_step": 102612, "epoch": 610} {"train_loss": -9.953142166137695, "global_step": 102613, "epoch": 610} {"train_loss": -9.977790832519531, "global_step": 102614, "epoch": 610} {"train_loss": -9.919928550720215, "global_step": 102615, "epoch": 610} {"train_loss": -9.998046875, "global_step": 102616, "epoch": 610} {"train_loss": -9.60757827758789, "global_step": 102617, "epoch": 610} {"train_loss": -9.955028533935547, "global_step": 102618, "epoch": 610} {"train_loss": -9.865193367004395, "global_step": 102619, "epoch": 610} {"train_loss": -10.106681823730469, "global_step": 102620, "epoch": 610} {"train_loss": -9.942719459533691, "global_step": 102621, "epoch": 610} {"train_loss": -10.177995681762695, "global_step": 102622, "epoch": 610} {"train_loss": -9.974149703979492, "global_step": 102623, "epoch": 610} {"train_loss": -9.969903945922852, "global_step": 102624, "epoch": 610} {"train_loss": -9.974313735961914, "global_step": 102625, "epoch": 610} {"train_loss": -9.76445198059082, "global_step": 102626, "epoch": 610} {"train_loss": -9.941344261169434, "global_step": 102627, "epoch": 610} {"train_loss": -9.60108757019043, "global_step": 102628, "epoch": 610} {"train_loss": -9.780067443847656, "global_step": 102629, "epoch": 610} {"train_loss": -9.961507797241211, "global_step": 102630, "epoch": 610} {"train_loss": -9.636791229248047, "global_step": 102631, "epoch": 610} {"train_loss": -9.8489408493042, "global_step": 102632, "epoch": 610} {"train_loss": -10.013866424560547, "global_step": 102633, "epoch": 610} {"train_loss": -9.644780158996582, "global_step": 102634, "epoch": 610} {"train_loss": -9.848404884338379, "global_step": 102635, "epoch": 610} {"train_loss": -9.811323165893555, "global_step": 102636, "epoch": 610} {"train_loss": -9.79786491394043, "global_step": 102637, "epoch": 610} {"train_loss": -9.671916007995605, "global_step": 102638, "epoch": 610} {"train_loss": -9.77049446105957, "global_step": 102639, "epoch": 610} {"train_loss": -9.65488052368164, "global_step": 102640, "epoch": 610} {"train_loss": -9.096555709838867, "global_step": 102641, "epoch": 610} {"train_loss": -9.961087226867676, "global_step": 102642, "epoch": 610} {"train_loss": -9.352749824523926, "global_step": 102643, "epoch": 610} {"train_loss": -9.224302291870117, "global_step": 102644, "epoch": 610} {"train_loss": -9.732522964477539, "global_step": 102645, "epoch": 610} {"train_loss": -8.831676483154297, "global_step": 102646, "epoch": 610} {"train_loss": -9.741728708857583, "global_step": 102647, "epoch": 610, "val_loss": 208195.34375, "train_action_mse_error": 2.9677839279174805} {"train_loss": -9.398027420043945, "global_step": 102648, "epoch": 611} {"train_loss": -9.464218139648438, "global_step": 102649, "epoch": 611} {"train_loss": -9.58511734008789, "global_step": 102650, "epoch": 611} {"train_loss": -9.4760103225708, "global_step": 102651, "epoch": 611} {"train_loss": -9.699689865112305, "global_step": 102652, "epoch": 611} {"train_loss": -9.669235229492188, "global_step": 102653, "epoch": 611} {"train_loss": -9.571863174438477, "global_step": 102654, "epoch": 611} {"train_loss": -9.701786041259766, "global_step": 102655, "epoch": 611} {"train_loss": -9.406681060791016, "global_step": 102656, "epoch": 611} {"train_loss": -9.57558822631836, "global_step": 102657, "epoch": 611} {"train_loss": -9.641847610473633, "global_step": 102658, "epoch": 611} {"train_loss": -9.537790298461914, "global_step": 102659, "epoch": 611} {"train_loss": -9.953651428222656, "global_step": 102660, "epoch": 611} {"train_loss": -9.625856399536133, "global_step": 102661, "epoch": 611} {"train_loss": -9.426139831542969, "global_step": 102662, "epoch": 611} {"train_loss": -9.906949996948242, "global_step": 102663, "epoch": 611} {"train_loss": -9.481953620910645, "global_step": 102664, "epoch": 611} {"train_loss": -9.793713569641113, "global_step": 102665, "epoch": 611} {"train_loss": -9.617842674255371, "global_step": 102666, "epoch": 611} {"train_loss": -9.461607933044434, "global_step": 102667, "epoch": 611} {"train_loss": -9.928964614868164, "global_step": 102668, "epoch": 611} {"train_loss": -9.702011108398438, "global_step": 102669, "epoch": 611} {"train_loss": -9.80815315246582, "global_step": 102670, "epoch": 611} {"train_loss": -9.709470748901367, "global_step": 102671, "epoch": 611} {"train_loss": -9.915664672851562, "global_step": 102672, "epoch": 611} {"train_loss": -9.796918869018555, "global_step": 102673, "epoch": 611} {"train_loss": -9.507375717163086, "global_step": 102674, "epoch": 611} {"train_loss": -9.931205749511719, "global_step": 102675, "epoch": 611} {"train_loss": -9.636514663696289, "global_step": 102676, "epoch": 611} {"train_loss": -9.842191696166992, "global_step": 102677, "epoch": 611} {"train_loss": -9.653474807739258, "global_step": 102678, "epoch": 611} {"train_loss": -9.760866165161133, "global_step": 102679, "epoch": 611} {"train_loss": -9.809313774108887, "global_step": 102680, "epoch": 611} {"train_loss": -10.003098487854004, "global_step": 102681, "epoch": 611} {"train_loss": -9.673473358154297, "global_step": 102682, "epoch": 611} {"train_loss": -9.800498008728027, "global_step": 102683, "epoch": 611} {"train_loss": -9.898153305053711, "global_step": 102684, "epoch": 611} {"train_loss": -9.977184295654297, "global_step": 102685, "epoch": 611} {"train_loss": -10.048524856567383, "global_step": 102686, "epoch": 611} {"train_loss": -9.916618347167969, "global_step": 102687, "epoch": 611} {"train_loss": -10.070352554321289, "global_step": 102688, "epoch": 611} {"train_loss": -10.069093704223633, "global_step": 102689, "epoch": 611} {"train_loss": -9.821281433105469, "global_step": 102690, "epoch": 611} {"train_loss": -9.983854293823242, "global_step": 102691, "epoch": 611} {"train_loss": -9.918497085571289, "global_step": 102692, "epoch": 611} {"train_loss": -9.700239181518555, "global_step": 102693, "epoch": 611} {"train_loss": -9.930805206298828, "global_step": 102694, "epoch": 611} {"train_loss": -9.387406349182129, "global_step": 102695, "epoch": 611} {"train_loss": -9.839425086975098, "global_step": 102696, "epoch": 611} {"train_loss": -9.891042709350586, "global_step": 102697, "epoch": 611} {"train_loss": -9.111194610595703, "global_step": 102698, "epoch": 611} {"train_loss": -9.890647888183594, "global_step": 102699, "epoch": 611} {"train_loss": -9.625528335571289, "global_step": 102700, "epoch": 611} {"train_loss": -9.497164726257324, "global_step": 102701, "epoch": 611} {"train_loss": -10.031797409057617, "global_step": 102702, "epoch": 611} {"train_loss": -9.305169105529785, "global_step": 102703, "epoch": 611} {"train_loss": -9.416923522949219, "global_step": 102704, "epoch": 611} {"train_loss": -9.471567153930664, "global_step": 102705, "epoch": 611} {"train_loss": -9.273296356201172, "global_step": 102706, "epoch": 611} {"train_loss": -9.54703426361084, "global_step": 102707, "epoch": 611} {"train_loss": -9.131422996520996, "global_step": 102708, "epoch": 611} {"train_loss": -9.333412170410156, "global_step": 102709, "epoch": 611} {"train_loss": -9.568788528442383, "global_step": 102710, "epoch": 611} {"train_loss": -9.360967636108398, "global_step": 102711, "epoch": 611} {"train_loss": -9.264333724975586, "global_step": 102712, "epoch": 611} {"train_loss": -9.368913650512695, "global_step": 102713, "epoch": 611} {"train_loss": -9.447135925292969, "global_step": 102714, "epoch": 611} {"train_loss": -9.278923034667969, "global_step": 102715, "epoch": 611} {"train_loss": -9.461801528930664, "global_step": 102716, "epoch": 611} {"train_loss": -9.522364616394043, "global_step": 102717, "epoch": 611} {"train_loss": -9.566417694091797, "global_step": 102718, "epoch": 611} {"train_loss": -9.47886848449707, "global_step": 102719, "epoch": 611} {"train_loss": -9.821091651916504, "global_step": 102720, "epoch": 611} {"train_loss": -9.40826416015625, "global_step": 102721, "epoch": 611} {"train_loss": -9.689837455749512, "global_step": 102722, "epoch": 611} {"train_loss": -9.676143646240234, "global_step": 102723, "epoch": 611} {"train_loss": -9.292821884155273, "global_step": 102724, "epoch": 611} {"train_loss": -9.777880668640137, "global_step": 102725, "epoch": 611} {"train_loss": -9.416423797607422, "global_step": 102726, "epoch": 611} {"train_loss": -9.629379272460938, "global_step": 102727, "epoch": 611} {"train_loss": -9.577144622802734, "global_step": 102728, "epoch": 611} {"train_loss": -9.648702621459961, "global_step": 102729, "epoch": 611} {"train_loss": -9.431600570678711, "global_step": 102730, "epoch": 611} {"train_loss": -9.879354476928711, "global_step": 102731, "epoch": 611} {"train_loss": -9.7791109085083, "global_step": 102732, "epoch": 611} {"train_loss": -9.812280654907227, "global_step": 102733, "epoch": 611} {"train_loss": -9.696399688720703, "global_step": 102734, "epoch": 611} {"train_loss": -9.957611083984375, "global_step": 102735, "epoch": 611} {"train_loss": -9.730801582336426, "global_step": 102736, "epoch": 611} {"train_loss": -9.766010284423828, "global_step": 102737, "epoch": 611} {"train_loss": -9.735062599182129, "global_step": 102738, "epoch": 611} {"train_loss": -9.662940979003906, "global_step": 102739, "epoch": 611} {"train_loss": -9.660740852355957, "global_step": 102740, "epoch": 611} {"train_loss": -10.045797348022461, "global_step": 102741, "epoch": 611} {"train_loss": -9.755573272705078, "global_step": 102742, "epoch": 611} {"train_loss": -9.668465614318848, "global_step": 102743, "epoch": 611} {"train_loss": -9.479268074035645, "global_step": 102744, "epoch": 611} {"train_loss": -9.58734130859375, "global_step": 102745, "epoch": 611} {"train_loss": -9.611130714416504, "global_step": 102746, "epoch": 611} {"train_loss": -9.578227043151855, "global_step": 102747, "epoch": 611} {"train_loss": -9.777505874633789, "global_step": 102748, "epoch": 611} {"train_loss": -9.503255844116211, "global_step": 102749, "epoch": 611} {"train_loss": -9.91531753540039, "global_step": 102750, "epoch": 611} {"train_loss": -9.400943756103516, "global_step": 102751, "epoch": 611} {"train_loss": -9.72625732421875, "global_step": 102752, "epoch": 611} {"train_loss": -9.41738510131836, "global_step": 102753, "epoch": 611} {"train_loss": -9.707389831542969, "global_step": 102754, "epoch": 611} {"train_loss": -9.738554000854492, "global_step": 102755, "epoch": 611} {"train_loss": -9.581432342529297, "global_step": 102756, "epoch": 611} {"train_loss": -9.606403350830078, "global_step": 102757, "epoch": 611} {"train_loss": -9.779434204101562, "global_step": 102758, "epoch": 611} {"train_loss": -9.459209442138672, "global_step": 102759, "epoch": 611} {"train_loss": -9.713046073913574, "global_step": 102760, "epoch": 611} {"train_loss": -9.613771438598633, "global_step": 102761, "epoch": 611} {"train_loss": -9.867481231689453, "global_step": 102762, "epoch": 611} {"train_loss": -9.953446388244629, "global_step": 102763, "epoch": 611} {"train_loss": -9.705476760864258, "global_step": 102764, "epoch": 611} {"train_loss": -9.74370002746582, "global_step": 102765, "epoch": 611} {"train_loss": -9.652900695800781, "global_step": 102766, "epoch": 611} {"train_loss": -9.783526420593262, "global_step": 102767, "epoch": 611} {"train_loss": -9.896665573120117, "global_step": 102768, "epoch": 611} {"train_loss": -9.746859550476074, "global_step": 102769, "epoch": 611} {"train_loss": -9.753500938415527, "global_step": 102770, "epoch": 611} {"train_loss": -9.49776840209961, "global_step": 102771, "epoch": 611} {"train_loss": -9.668766021728516, "global_step": 102772, "epoch": 611} {"train_loss": -9.563499450683594, "global_step": 102773, "epoch": 611} {"train_loss": -9.93901252746582, "global_step": 102774, "epoch": 611} {"train_loss": -9.486373901367188, "global_step": 102775, "epoch": 611} {"train_loss": -9.65618896484375, "global_step": 102776, "epoch": 611} {"train_loss": -9.513510704040527, "global_step": 102777, "epoch": 611} {"train_loss": -9.294530868530273, "global_step": 102778, "epoch": 611} {"train_loss": -9.61929702758789, "global_step": 102779, "epoch": 611} {"train_loss": -9.717742919921875, "global_step": 102780, "epoch": 611} {"train_loss": -9.569073677062988, "global_step": 102781, "epoch": 611} {"train_loss": -9.356966018676758, "global_step": 102782, "epoch": 611} {"train_loss": -9.494668960571289, "global_step": 102783, "epoch": 611} {"train_loss": -9.38414192199707, "global_step": 102784, "epoch": 611} {"train_loss": -9.928230285644531, "global_step": 102785, "epoch": 611} {"train_loss": -9.384612083435059, "global_step": 102786, "epoch": 611} {"train_loss": -9.636907577514648, "global_step": 102787, "epoch": 611} {"train_loss": -9.902403831481934, "global_step": 102788, "epoch": 611} {"train_loss": -9.565773010253906, "global_step": 102789, "epoch": 611} {"train_loss": -9.784660339355469, "global_step": 102790, "epoch": 611} {"train_loss": -9.858447074890137, "global_step": 102791, "epoch": 611} {"train_loss": -9.601729393005371, "global_step": 102792, "epoch": 611} {"train_loss": -9.984130859375, "global_step": 102793, "epoch": 611} {"train_loss": -9.901448249816895, "global_step": 102794, "epoch": 611} {"train_loss": -9.869315147399902, "global_step": 102795, "epoch": 611} {"train_loss": -9.936686515808105, "global_step": 102796, "epoch": 611} {"train_loss": -9.682504653930664, "global_step": 102797, "epoch": 611} {"train_loss": -9.909293174743652, "global_step": 102798, "epoch": 611} {"train_loss": -9.914970397949219, "global_step": 102799, "epoch": 611} {"train_loss": -9.953773498535156, "global_step": 102800, "epoch": 611} {"train_loss": -9.909151077270508, "global_step": 102801, "epoch": 611} {"train_loss": -9.8736572265625, "global_step": 102802, "epoch": 611} {"train_loss": -9.980127334594727, "global_step": 102803, "epoch": 611} {"train_loss": -9.797492980957031, "global_step": 102804, "epoch": 611} {"train_loss": -10.051986694335938, "global_step": 102805, "epoch": 611} {"train_loss": -9.872923851013184, "global_step": 102806, "epoch": 611} {"train_loss": -9.805426597595215, "global_step": 102807, "epoch": 611} {"train_loss": -10.178478240966797, "global_step": 102808, "epoch": 611} {"train_loss": -9.715181350708008, "global_step": 102809, "epoch": 611} {"train_loss": -9.924980163574219, "global_step": 102810, "epoch": 611} {"train_loss": -9.920143127441406, "global_step": 102811, "epoch": 611} {"train_loss": -9.801115036010742, "global_step": 102812, "epoch": 611} {"train_loss": -9.745450973510742, "global_step": 102813, "epoch": 611} {"train_loss": -9.855542182922363, "global_step": 102814, "epoch": 611} {"train_loss": -9.689070048786345, "global_step": 102815, "epoch": 611, "val_loss": 206767.203125} {"train_loss": -9.542047500610352, "global_step": 102816, "epoch": 612} {"train_loss": -9.714313507080078, "global_step": 102817, "epoch": 612} {"train_loss": -9.588397979736328, "global_step": 102818, "epoch": 612} {"train_loss": -9.642574310302734, "global_step": 102819, "epoch": 612} {"train_loss": -9.713665962219238, "global_step": 102820, "epoch": 612} {"train_loss": -9.510313034057617, "global_step": 102821, "epoch": 612} {"train_loss": -9.590486526489258, "global_step": 102822, "epoch": 612} {"train_loss": -9.558534622192383, "global_step": 102823, "epoch": 612} {"train_loss": -9.46820068359375, "global_step": 102824, "epoch": 612} {"train_loss": -9.587675094604492, "global_step": 102825, "epoch": 612} {"train_loss": -9.688638687133789, "global_step": 102826, "epoch": 612} {"train_loss": -9.594027519226074, "global_step": 102827, "epoch": 612} {"train_loss": -9.951713562011719, "global_step": 102828, "epoch": 612} {"train_loss": -9.644023895263672, "global_step": 102829, "epoch": 612} {"train_loss": -9.515191078186035, "global_step": 102830, "epoch": 612} {"train_loss": -9.784823417663574, "global_step": 102831, "epoch": 612} {"train_loss": -9.250043869018555, "global_step": 102832, "epoch": 612} {"train_loss": -9.707193374633789, "global_step": 102833, "epoch": 612} {"train_loss": -9.196846008300781, "global_step": 102834, "epoch": 612} {"train_loss": -9.826375007629395, "global_step": 102835, "epoch": 612} {"train_loss": -9.34521770477295, "global_step": 102836, "epoch": 612} {"train_loss": -9.728257179260254, "global_step": 102837, "epoch": 612} {"train_loss": -9.346004486083984, "global_step": 102838, "epoch": 612} {"train_loss": -9.732362747192383, "global_step": 102839, "epoch": 612} {"train_loss": -9.658306121826172, "global_step": 102840, "epoch": 612} {"train_loss": -9.589411735534668, "global_step": 102841, "epoch": 612} {"train_loss": -9.89353084564209, "global_step": 102842, "epoch": 612} {"train_loss": -9.613999366760254, "global_step": 102843, "epoch": 612} {"train_loss": -9.895337104797363, "global_step": 102844, "epoch": 612} {"train_loss": -9.869604110717773, "global_step": 102845, "epoch": 612} {"train_loss": -9.819435119628906, "global_step": 102846, "epoch": 612} {"train_loss": -9.678689956665039, "global_step": 102847, "epoch": 612} {"train_loss": -9.937907218933105, "global_step": 102848, "epoch": 612} {"train_loss": -9.678324699401855, "global_step": 102849, "epoch": 612} {"train_loss": -9.758646011352539, "global_step": 102850, "epoch": 612} {"train_loss": -9.843975067138672, "global_step": 102851, "epoch": 612} {"train_loss": -9.709266662597656, "global_step": 102852, "epoch": 612} {"train_loss": -9.845010757446289, "global_step": 102853, "epoch": 612} {"train_loss": -9.612841606140137, "global_step": 102854, "epoch": 612} {"train_loss": -9.914502143859863, "global_step": 102855, "epoch": 612} {"train_loss": -9.852607727050781, "global_step": 102856, "epoch": 612} {"train_loss": -9.875555038452148, "global_step": 102857, "epoch": 612} {"train_loss": -9.908004760742188, "global_step": 102858, "epoch": 612} {"train_loss": -9.847389221191406, "global_step": 102859, "epoch": 612} {"train_loss": -9.978750228881836, "global_step": 102860, "epoch": 612} {"train_loss": -9.934589385986328, "global_step": 102861, "epoch": 612} {"train_loss": -10.028560638427734, "global_step": 102862, "epoch": 612} {"train_loss": -9.771175384521484, "global_step": 102863, "epoch": 612} {"train_loss": -9.74577522277832, "global_step": 102864, "epoch": 612} {"train_loss": -9.862427711486816, "global_step": 102865, "epoch": 612} {"train_loss": -10.00303840637207, "global_step": 102866, "epoch": 612} {"train_loss": -9.883173942565918, "global_step": 102867, "epoch": 612} {"train_loss": -9.84903335571289, "global_step": 102868, "epoch": 612} {"train_loss": -10.040148735046387, "global_step": 102869, "epoch": 612} {"train_loss": -10.021760940551758, "global_step": 102870, "epoch": 612} {"train_loss": -9.950212478637695, "global_step": 102871, "epoch": 612} {"train_loss": -9.923738479614258, "global_step": 102872, "epoch": 612} {"train_loss": -9.813840866088867, "global_step": 102873, "epoch": 612} {"train_loss": -9.716279029846191, "global_step": 102874, "epoch": 612} {"train_loss": -9.703567504882812, "global_step": 102875, "epoch": 612} {"train_loss": -9.726938247680664, "global_step": 102876, "epoch": 612} {"train_loss": -10.211763381958008, "global_step": 102877, "epoch": 612} {"train_loss": -9.876266479492188, "global_step": 102878, "epoch": 612} {"train_loss": -9.670629501342773, "global_step": 102879, "epoch": 612} {"train_loss": -9.335386276245117, "global_step": 102880, "epoch": 612} {"train_loss": -9.765783309936523, "global_step": 102881, "epoch": 612} {"train_loss": -9.546316146850586, "global_step": 102882, "epoch": 612} {"train_loss": -9.455558776855469, "global_step": 102883, "epoch": 612} {"train_loss": -9.734357833862305, "global_step": 102884, "epoch": 612} {"train_loss": -9.372056007385254, "global_step": 102885, "epoch": 612} {"train_loss": -9.991436004638672, "global_step": 102886, "epoch": 612} {"train_loss": -9.439682006835938, "global_step": 102887, "epoch": 612} {"train_loss": -9.660365104675293, "global_step": 102888, "epoch": 612} {"train_loss": -9.98869800567627, "global_step": 102889, "epoch": 612} {"train_loss": -9.505132675170898, "global_step": 102890, "epoch": 612} {"train_loss": -9.806800842285156, "global_step": 102891, "epoch": 612} {"train_loss": -9.61909294128418, "global_step": 102892, "epoch": 612} {"train_loss": -9.496633529663086, "global_step": 102893, "epoch": 612} {"train_loss": -9.667608261108398, "global_step": 102894, "epoch": 612} {"train_loss": -9.486949920654297, "global_step": 102895, "epoch": 612} {"train_loss": -9.600388526916504, "global_step": 102896, "epoch": 612} {"train_loss": -9.593334197998047, "global_step": 102897, "epoch": 612} {"train_loss": -9.422341346740723, "global_step": 102898, "epoch": 612} {"train_loss": -9.55993938446045, "global_step": 102899, "epoch": 612} {"train_loss": -9.277627944946289, "global_step": 102900, "epoch": 612} {"train_loss": -9.32075309753418, "global_step": 102901, "epoch": 612} {"train_loss": -9.235757827758789, "global_step": 102902, "epoch": 612} {"train_loss": -9.542518615722656, "global_step": 102903, "epoch": 612} {"train_loss": -9.46546745300293, "global_step": 102904, "epoch": 612} {"train_loss": -9.701014518737793, "global_step": 102905, "epoch": 612} {"train_loss": -9.529132843017578, "global_step": 102906, "epoch": 612} {"train_loss": -9.586092948913574, "global_step": 102907, "epoch": 612} {"train_loss": -9.714457511901855, "global_step": 102908, "epoch": 612} {"train_loss": -9.457710266113281, "global_step": 102909, "epoch": 612} {"train_loss": -9.722579002380371, "global_step": 102910, "epoch": 612} {"train_loss": -9.507010459899902, "global_step": 102911, "epoch": 612} {"train_loss": -9.411930084228516, "global_step": 102912, "epoch": 612} {"train_loss": -9.851279258728027, "global_step": 102913, "epoch": 612} {"train_loss": -9.800278663635254, "global_step": 102914, "epoch": 612} {"train_loss": -9.823479652404785, "global_step": 102915, "epoch": 612} {"train_loss": -9.945886611938477, "global_step": 102916, "epoch": 612} {"train_loss": -9.851104736328125, "global_step": 102917, "epoch": 612} {"train_loss": -9.726605415344238, "global_step": 102918, "epoch": 612} {"train_loss": -9.9368314743042, "global_step": 102919, "epoch": 612} {"train_loss": -9.834638595581055, "global_step": 102920, "epoch": 612} {"train_loss": -9.587717056274414, "global_step": 102921, "epoch": 612} {"train_loss": -9.835677146911621, "global_step": 102922, "epoch": 612} {"train_loss": -9.734923362731934, "global_step": 102923, "epoch": 612} {"train_loss": -9.821406364440918, "global_step": 102924, "epoch": 612} {"train_loss": -10.006258964538574, "global_step": 102925, "epoch": 612} {"train_loss": -9.827886581420898, "global_step": 102926, "epoch": 612} {"train_loss": -10.096092224121094, "global_step": 102927, "epoch": 612} {"train_loss": -9.74563217163086, "global_step": 102928, "epoch": 612} {"train_loss": -10.028947830200195, "global_step": 102929, "epoch": 612} {"train_loss": -9.93486213684082, "global_step": 102930, "epoch": 612} {"train_loss": -10.17453670501709, "global_step": 102931, "epoch": 612} {"train_loss": -10.154247283935547, "global_step": 102932, "epoch": 612} {"train_loss": -10.022782325744629, "global_step": 102933, "epoch": 612} {"train_loss": -9.9478759765625, "global_step": 102934, "epoch": 612} {"train_loss": -10.028544425964355, "global_step": 102935, "epoch": 612} {"train_loss": -9.79110336303711, "global_step": 102936, "epoch": 612} {"train_loss": -9.979774475097656, "global_step": 102937, "epoch": 612} {"train_loss": -10.08759880065918, "global_step": 102938, "epoch": 612} {"train_loss": -9.979621887207031, "global_step": 102939, "epoch": 612} {"train_loss": -10.098968505859375, "global_step": 102940, "epoch": 612} {"train_loss": -9.906545639038086, "global_step": 102941, "epoch": 612} {"train_loss": -9.824430465698242, "global_step": 102942, "epoch": 612} {"train_loss": -10.177286148071289, "global_step": 102943, "epoch": 612} {"train_loss": -10.013681411743164, "global_step": 102944, "epoch": 612} {"train_loss": -9.950618743896484, "global_step": 102945, "epoch": 612} {"train_loss": -10.151533126831055, "global_step": 102946, "epoch": 612} {"train_loss": -10.21328353881836, "global_step": 102947, "epoch": 612} {"train_loss": -9.980469703674316, "global_step": 102948, "epoch": 612} {"train_loss": -9.712766647338867, "global_step": 102949, "epoch": 612} {"train_loss": -10.209434509277344, "global_step": 102950, "epoch": 612} {"train_loss": -9.476325035095215, "global_step": 102951, "epoch": 612} {"train_loss": -9.681428909301758, "global_step": 102952, "epoch": 612} {"train_loss": -9.95089340209961, "global_step": 102953, "epoch": 612} {"train_loss": -8.974815368652344, "global_step": 102954, "epoch": 612} {"train_loss": -9.658904075622559, "global_step": 102955, "epoch": 612} {"train_loss": -9.626716613769531, "global_step": 102956, "epoch": 612} {"train_loss": -9.538743019104004, "global_step": 102957, "epoch": 612} {"train_loss": -10.142215728759766, "global_step": 102958, "epoch": 612} {"train_loss": -9.266550064086914, "global_step": 102959, "epoch": 612} {"train_loss": -10.035918235778809, "global_step": 102960, "epoch": 612} {"train_loss": -9.25773811340332, "global_step": 102961, "epoch": 612} {"train_loss": -9.71420669555664, "global_step": 102962, "epoch": 612} {"train_loss": -9.489875793457031, "global_step": 102963, "epoch": 612} {"train_loss": -9.491823196411133, "global_step": 102964, "epoch": 612} {"train_loss": -9.386879920959473, "global_step": 102965, "epoch": 612} {"train_loss": -9.638899803161621, "global_step": 102966, "epoch": 612} {"train_loss": -9.386070251464844, "global_step": 102967, "epoch": 612} {"train_loss": -9.778388977050781, "global_step": 102968, "epoch": 612} {"train_loss": -9.297602653503418, "global_step": 102969, "epoch": 612} {"train_loss": -9.511104583740234, "global_step": 102970, "epoch": 612} {"train_loss": -9.093690872192383, "global_step": 102971, "epoch": 612} {"train_loss": -9.579581260681152, "global_step": 102972, "epoch": 612} {"train_loss": -9.278240203857422, "global_step": 102973, "epoch": 612} {"train_loss": -9.659543991088867, "global_step": 102974, "epoch": 612} {"train_loss": -9.612995147705078, "global_step": 102975, "epoch": 612} {"train_loss": -9.661277770996094, "global_step": 102976, "epoch": 612} {"train_loss": -9.602258682250977, "global_step": 102977, "epoch": 612} {"train_loss": -9.524796485900879, "global_step": 102978, "epoch": 612} {"train_loss": -9.503532409667969, "global_step": 102979, "epoch": 612} {"train_loss": -9.60551929473877, "global_step": 102980, "epoch": 612} {"train_loss": -9.567808151245117, "global_step": 102981, "epoch": 612} {"train_loss": -9.664381980895996, "global_step": 102982, "epoch": 612} {"train_loss": -9.714665850003561, "global_step": 102983, "epoch": 612, "val_loss": 206799.40625} {"train_loss": -9.889298439025879, "global_step": 102984, "epoch": 613} {"train_loss": -9.435150146484375, "global_step": 102985, "epoch": 613} {"train_loss": -9.650883674621582, "global_step": 102986, "epoch": 613} {"train_loss": -9.075298309326172, "global_step": 102987, "epoch": 613} {"train_loss": -9.300844192504883, "global_step": 102988, "epoch": 613} {"train_loss": -9.787367820739746, "global_step": 102989, "epoch": 613} {"train_loss": -9.45803451538086, "global_step": 102990, "epoch": 613} {"train_loss": -9.674381256103516, "global_step": 102991, "epoch": 613} {"train_loss": -9.604642868041992, "global_step": 102992, "epoch": 613} {"train_loss": -9.521218299865723, "global_step": 102993, "epoch": 613} {"train_loss": -9.838933944702148, "global_step": 102994, "epoch": 613} {"train_loss": -9.6631498336792, "global_step": 102995, "epoch": 613} {"train_loss": -10.016316413879395, "global_step": 102996, "epoch": 613} {"train_loss": -9.718417167663574, "global_step": 102997, "epoch": 613} {"train_loss": -9.90208625793457, "global_step": 102998, "epoch": 613} {"train_loss": -9.800239562988281, "global_step": 102999, "epoch": 613} {"train_loss": -9.944034576416016, "global_step": 103000, "epoch": 613} {"train_loss": -9.727206230163574, "global_step": 103001, "epoch": 613} {"train_loss": -9.824967384338379, "global_step": 103002, "epoch": 613} {"train_loss": -10.009689331054688, "global_step": 103003, "epoch": 613} {"train_loss": -9.619807243347168, "global_step": 103004, "epoch": 613} {"train_loss": -9.896211624145508, "global_step": 103005, "epoch": 613} {"train_loss": -9.877174377441406, "global_step": 103006, "epoch": 613} {"train_loss": -9.940486907958984, "global_step": 103007, "epoch": 613} {"train_loss": -10.064498901367188, "global_step": 103008, "epoch": 613} {"train_loss": -9.926179885864258, "global_step": 103009, "epoch": 613} {"train_loss": -9.86799144744873, "global_step": 103010, "epoch": 613} {"train_loss": -9.797447204589844, "global_step": 103011, "epoch": 613} {"train_loss": -10.042192459106445, "global_step": 103012, "epoch": 613} {"train_loss": -9.993120193481445, "global_step": 103013, "epoch": 613} {"train_loss": -10.25448989868164, "global_step": 103014, "epoch": 613} {"train_loss": -10.104608535766602, "global_step": 103015, "epoch": 613} {"train_loss": -10.127480506896973, "global_step": 103016, "epoch": 613} {"train_loss": -10.066999435424805, "global_step": 103017, "epoch": 613} {"train_loss": -10.028108596801758, "global_step": 103018, "epoch": 613} {"train_loss": -9.78677749633789, "global_step": 103019, "epoch": 613} {"train_loss": -10.184256553649902, "global_step": 103020, "epoch": 613} {"train_loss": -10.062419891357422, "global_step": 103021, "epoch": 613} {"train_loss": -10.128780364990234, "global_step": 103022, "epoch": 613} {"train_loss": -10.2556734085083, "global_step": 103023, "epoch": 613} {"train_loss": -10.017623901367188, "global_step": 103024, "epoch": 613} {"train_loss": -10.166403770446777, "global_step": 103025, "epoch": 613} {"train_loss": -9.887152671813965, "global_step": 103026, "epoch": 613} {"train_loss": -9.739461898803711, "global_step": 103027, "epoch": 613} {"train_loss": -9.821874618530273, "global_step": 103028, "epoch": 613} {"train_loss": -9.81439208984375, "global_step": 103029, "epoch": 613} {"train_loss": -9.819807052612305, "global_step": 103030, "epoch": 613} {"train_loss": -9.819565773010254, "global_step": 103031, "epoch": 613} {"train_loss": -9.791496276855469, "global_step": 103032, "epoch": 613} {"train_loss": -9.612480163574219, "global_step": 103033, "epoch": 613} {"train_loss": -9.197164535522461, "global_step": 103034, "epoch": 613} {"train_loss": -9.858566284179688, "global_step": 103035, "epoch": 613} {"train_loss": -9.163235664367676, "global_step": 103036, "epoch": 613} {"train_loss": -9.345052719116211, "global_step": 103037, "epoch": 613} {"train_loss": -9.747318267822266, "global_step": 103038, "epoch": 613} {"train_loss": -9.049747467041016, "global_step": 103039, "epoch": 613} {"train_loss": -9.944990158081055, "global_step": 103040, "epoch": 613} {"train_loss": -9.451793670654297, "global_step": 103041, "epoch": 613} {"train_loss": -9.681875228881836, "global_step": 103042, "epoch": 613} {"train_loss": -9.554590225219727, "global_step": 103043, "epoch": 613} {"train_loss": -9.504703521728516, "global_step": 103044, "epoch": 613} {"train_loss": -9.767312049865723, "global_step": 103045, "epoch": 613} {"train_loss": -9.961885452270508, "global_step": 103046, "epoch": 613} {"train_loss": -9.61596965789795, "global_step": 103047, "epoch": 613} {"train_loss": -9.666095733642578, "global_step": 103048, "epoch": 613} {"train_loss": -9.576665878295898, "global_step": 103049, "epoch": 613} {"train_loss": -9.882518768310547, "global_step": 103050, "epoch": 613} {"train_loss": -9.787901878356934, "global_step": 103051, "epoch": 613} {"train_loss": -9.732715606689453, "global_step": 103052, "epoch": 613} {"train_loss": -9.859875679016113, "global_step": 103053, "epoch": 613} {"train_loss": -9.829999923706055, "global_step": 103054, "epoch": 613} {"train_loss": -9.904441833496094, "global_step": 103055, "epoch": 613} {"train_loss": -9.60488510131836, "global_step": 103056, "epoch": 613} {"train_loss": -9.810722351074219, "global_step": 103057, "epoch": 613} {"train_loss": -9.696842193603516, "global_step": 103058, "epoch": 613} {"train_loss": -9.784305572509766, "global_step": 103059, "epoch": 613} {"train_loss": -9.483602523803711, "global_step": 103060, "epoch": 613} {"train_loss": -9.683149337768555, "global_step": 103061, "epoch": 613} {"train_loss": -9.402865409851074, "global_step": 103062, "epoch": 613} {"train_loss": -9.749279975891113, "global_step": 103063, "epoch": 613} {"train_loss": -9.38546371459961, "global_step": 103064, "epoch": 613} {"train_loss": -9.874471664428711, "global_step": 103065, "epoch": 613} {"train_loss": -9.721504211425781, "global_step": 103066, "epoch": 613} {"train_loss": -9.76165771484375, "global_step": 103067, "epoch": 613} {"train_loss": -9.67310619354248, "global_step": 103068, "epoch": 613} {"train_loss": -10.023310661315918, "global_step": 103069, "epoch": 613} {"train_loss": -9.4881591796875, "global_step": 103070, "epoch": 613} {"train_loss": -9.74449348449707, "global_step": 103071, "epoch": 613} {"train_loss": -9.576343536376953, "global_step": 103072, "epoch": 613} {"train_loss": -9.701131820678711, "global_step": 103073, "epoch": 613} {"train_loss": -9.773807525634766, "global_step": 103074, "epoch": 613} {"train_loss": -9.757576942443848, "global_step": 103075, "epoch": 613} {"train_loss": -9.730751037597656, "global_step": 103076, "epoch": 613} {"train_loss": -9.671958923339844, "global_step": 103077, "epoch": 613} {"train_loss": -9.735183715820312, "global_step": 103078, "epoch": 613} {"train_loss": -9.539596557617188, "global_step": 103079, "epoch": 613} {"train_loss": -9.906001091003418, "global_step": 103080, "epoch": 613} {"train_loss": -9.60484790802002, "global_step": 103081, "epoch": 613} {"train_loss": -9.710599899291992, "global_step": 103082, "epoch": 613} {"train_loss": -9.923761367797852, "global_step": 103083, "epoch": 613} {"train_loss": -9.587594985961914, "global_step": 103084, "epoch": 613} {"train_loss": -9.737772941589355, "global_step": 103085, "epoch": 613} {"train_loss": -9.8464994430542, "global_step": 103086, "epoch": 613} {"train_loss": -9.83675479888916, "global_step": 103087, "epoch": 613} {"train_loss": -9.801074981689453, "global_step": 103088, "epoch": 613} {"train_loss": -9.970439910888672, "global_step": 103089, "epoch": 613} {"train_loss": -9.744842529296875, "global_step": 103090, "epoch": 613} {"train_loss": -9.568063735961914, "global_step": 103091, "epoch": 613} {"train_loss": -9.834793090820312, "global_step": 103092, "epoch": 613} {"train_loss": -9.421527862548828, "global_step": 103093, "epoch": 613} {"train_loss": -9.466739654541016, "global_step": 103094, "epoch": 613} {"train_loss": -9.140218734741211, "global_step": 103095, "epoch": 613} {"train_loss": -9.157079696655273, "global_step": 103096, "epoch": 613} {"train_loss": -8.945476531982422, "global_step": 103097, "epoch": 613} {"train_loss": -9.332420349121094, "global_step": 103098, "epoch": 613} {"train_loss": -9.060312271118164, "global_step": 103099, "epoch": 613} {"train_loss": -8.559530258178711, "global_step": 103100, "epoch": 613} {"train_loss": -9.317097663879395, "global_step": 103101, "epoch": 613} {"train_loss": -9.152233123779297, "global_step": 103102, "epoch": 613} {"train_loss": -9.462632179260254, "global_step": 103103, "epoch": 613} {"train_loss": -9.54823112487793, "global_step": 103104, "epoch": 613} {"train_loss": -9.393945693969727, "global_step": 103105, "epoch": 613} {"train_loss": -9.164385795593262, "global_step": 103106, "epoch": 613} {"train_loss": -9.540288925170898, "global_step": 103107, "epoch": 613} {"train_loss": -9.050536155700684, "global_step": 103108, "epoch": 613} {"train_loss": -9.66252326965332, "global_step": 103109, "epoch": 613} {"train_loss": -9.268781661987305, "global_step": 103110, "epoch": 613} {"train_loss": -9.643059730529785, "global_step": 103111, "epoch": 613} {"train_loss": -9.234687805175781, "global_step": 103112, "epoch": 613} {"train_loss": -9.376482009887695, "global_step": 103113, "epoch": 613} {"train_loss": -9.495689392089844, "global_step": 103114, "epoch": 613} {"train_loss": -9.291996002197266, "global_step": 103115, "epoch": 613} {"train_loss": -9.671514511108398, "global_step": 103116, "epoch": 613} {"train_loss": -9.557905197143555, "global_step": 103117, "epoch": 613} {"train_loss": -9.713823318481445, "global_step": 103118, "epoch": 613} {"train_loss": -9.85438346862793, "global_step": 103119, "epoch": 613} {"train_loss": -9.529271125793457, "global_step": 103120, "epoch": 613} {"train_loss": -9.665643692016602, "global_step": 103121, "epoch": 613} {"train_loss": -9.557905197143555, "global_step": 103122, "epoch": 613} {"train_loss": -9.82214641571045, "global_step": 103123, "epoch": 613} {"train_loss": -9.718648910522461, "global_step": 103124, "epoch": 613} {"train_loss": -9.631662368774414, "global_step": 103125, "epoch": 613} {"train_loss": -9.620439529418945, "global_step": 103126, "epoch": 613} {"train_loss": -9.976985931396484, "global_step": 103127, "epoch": 613} {"train_loss": -9.59883975982666, "global_step": 103128, "epoch": 613} {"train_loss": -9.847716331481934, "global_step": 103129, "epoch": 613} {"train_loss": -9.97083568572998, "global_step": 103130, "epoch": 613} {"train_loss": -10.08457088470459, "global_step": 103131, "epoch": 613} {"train_loss": -9.911483764648438, "global_step": 103132, "epoch": 613} {"train_loss": -9.921212196350098, "global_step": 103133, "epoch": 613} {"train_loss": -9.777626037597656, "global_step": 103134, "epoch": 613} {"train_loss": -9.818708419799805, "global_step": 103135, "epoch": 613} {"train_loss": -9.908571243286133, "global_step": 103136, "epoch": 613} {"train_loss": -9.872172355651855, "global_step": 103137, "epoch": 613} {"train_loss": -10.033374786376953, "global_step": 103138, "epoch": 613} {"train_loss": -9.902734756469727, "global_step": 103139, "epoch": 613} {"train_loss": -9.55712604522705, "global_step": 103140, "epoch": 613} {"train_loss": -9.74327278137207, "global_step": 103141, "epoch": 613} {"train_loss": -9.870055198669434, "global_step": 103142, "epoch": 613} {"train_loss": -9.421576499938965, "global_step": 103143, "epoch": 613} {"train_loss": -9.776649475097656, "global_step": 103144, "epoch": 613} {"train_loss": -9.496926307678223, "global_step": 103145, "epoch": 613} {"train_loss": -9.242660522460938, "global_step": 103146, "epoch": 613} {"train_loss": -9.83911418914795, "global_step": 103147, "epoch": 613} {"train_loss": -8.934412002563477, "global_step": 103148, "epoch": 613} {"train_loss": -9.658357620239258, "global_step": 103149, "epoch": 613} {"train_loss": -9.255383491516113, "global_step": 103150, "epoch": 613} {"train_loss": -9.685152672585987, "global_step": 103151, "epoch": 613, "val_loss": 205980.984375} {"train_loss": -9.25777816772461, "global_step": 103152, "epoch": 614} {"train_loss": -9.385310173034668, "global_step": 103153, "epoch": 614} {"train_loss": -9.452911376953125, "global_step": 103154, "epoch": 614} {"train_loss": -9.503808975219727, "global_step": 103155, "epoch": 614} {"train_loss": -9.542083740234375, "global_step": 103156, "epoch": 614} {"train_loss": -9.552988052368164, "global_step": 103157, "epoch": 614} {"train_loss": -9.3468017578125, "global_step": 103158, "epoch": 614} {"train_loss": -9.629114151000977, "global_step": 103159, "epoch": 614} {"train_loss": -9.345815658569336, "global_step": 103160, "epoch": 614} {"train_loss": -9.600801467895508, "global_step": 103161, "epoch": 614} {"train_loss": -9.04592514038086, "global_step": 103162, "epoch": 614} {"train_loss": -9.3854398727417, "global_step": 103163, "epoch": 614} {"train_loss": -9.483268737792969, "global_step": 103164, "epoch": 614} {"train_loss": -9.529153823852539, "global_step": 103165, "epoch": 614} {"train_loss": -9.642988204956055, "global_step": 103166, "epoch": 614} {"train_loss": -9.513087272644043, "global_step": 103167, "epoch": 614} {"train_loss": -9.522924423217773, "global_step": 103168, "epoch": 614} {"train_loss": -9.40497875213623, "global_step": 103169, "epoch": 614} {"train_loss": -9.3091459274292, "global_step": 103170, "epoch": 614} {"train_loss": -9.725114822387695, "global_step": 103171, "epoch": 614} {"train_loss": -9.648467063903809, "global_step": 103172, "epoch": 614} {"train_loss": -9.765546798706055, "global_step": 103173, "epoch": 614} {"train_loss": -9.659074783325195, "global_step": 103174, "epoch": 614} {"train_loss": -9.747231483459473, "global_step": 103175, "epoch": 614} {"train_loss": -9.901498794555664, "global_step": 103176, "epoch": 614} {"train_loss": -9.650699615478516, "global_step": 103177, "epoch": 614} {"train_loss": -9.726935386657715, "global_step": 103178, "epoch": 614} {"train_loss": -9.799506187438965, "global_step": 103179, "epoch": 614} {"train_loss": -9.891531944274902, "global_step": 103180, "epoch": 614} {"train_loss": -9.6617431640625, "global_step": 103181, "epoch": 614} {"train_loss": -10.061441421508789, "global_step": 103182, "epoch": 614} {"train_loss": -9.827329635620117, "global_step": 103183, "epoch": 614} {"train_loss": -9.824344635009766, "global_step": 103184, "epoch": 614} {"train_loss": -9.991683006286621, "global_step": 103185, "epoch": 614} {"train_loss": -9.959217071533203, "global_step": 103186, "epoch": 614} {"train_loss": -9.869131088256836, "global_step": 103187, "epoch": 614} {"train_loss": -9.984086990356445, "global_step": 103188, "epoch": 614} {"train_loss": -10.05617904663086, "global_step": 103189, "epoch": 614} {"train_loss": -9.826980590820312, "global_step": 103190, "epoch": 614} {"train_loss": -10.113309860229492, "global_step": 103191, "epoch": 614} {"train_loss": -9.862081527709961, "global_step": 103192, "epoch": 614} {"train_loss": -9.899843215942383, "global_step": 103193, "epoch": 614} {"train_loss": -9.736470222473145, "global_step": 103194, "epoch": 614} {"train_loss": -10.022217750549316, "global_step": 103195, "epoch": 614} {"train_loss": -9.943660736083984, "global_step": 103196, "epoch": 614} {"train_loss": -10.159682273864746, "global_step": 103197, "epoch": 614} {"train_loss": -10.204994201660156, "global_step": 103198, "epoch": 614} {"train_loss": -9.905303001403809, "global_step": 103199, "epoch": 614} {"train_loss": -9.859262466430664, "global_step": 103200, "epoch": 614} {"train_loss": -10.072263717651367, "global_step": 103201, "epoch": 614} {"train_loss": -9.749637603759766, "global_step": 103202, "epoch": 614} {"train_loss": -9.797027587890625, "global_step": 103203, "epoch": 614} {"train_loss": -9.840211868286133, "global_step": 103204, "epoch": 614} {"train_loss": -9.645794868469238, "global_step": 103205, "epoch": 614} {"train_loss": -10.106067657470703, "global_step": 103206, "epoch": 614} {"train_loss": -10.036542892456055, "global_step": 103207, "epoch": 614} {"train_loss": -9.97341537475586, "global_step": 103208, "epoch": 614} {"train_loss": -9.794990539550781, "global_step": 103209, "epoch": 614} {"train_loss": -9.945476531982422, "global_step": 103210, "epoch": 614} {"train_loss": -9.926167488098145, "global_step": 103211, "epoch": 614} {"train_loss": -10.013198852539062, "global_step": 103212, "epoch": 614} {"train_loss": -10.020862579345703, "global_step": 103213, "epoch": 614} {"train_loss": -9.735176086425781, "global_step": 103214, "epoch": 614} {"train_loss": -9.943582534790039, "global_step": 103215, "epoch": 614} {"train_loss": -9.481316566467285, "global_step": 103216, "epoch": 614} {"train_loss": -9.844308853149414, "global_step": 103217, "epoch": 614} {"train_loss": -9.747215270996094, "global_step": 103218, "epoch": 614} {"train_loss": -9.804353713989258, "global_step": 103219, "epoch": 614} {"train_loss": -10.019911766052246, "global_step": 103220, "epoch": 614} {"train_loss": -9.932979583740234, "global_step": 103221, "epoch": 614} {"train_loss": -9.952264785766602, "global_step": 103222, "epoch": 614} {"train_loss": -9.989399909973145, "global_step": 103223, "epoch": 614} {"train_loss": -9.75393295288086, "global_step": 103224, "epoch": 614} {"train_loss": -9.620441436767578, "global_step": 103225, "epoch": 614} {"train_loss": -9.927490234375, "global_step": 103226, "epoch": 614} {"train_loss": -9.841955184936523, "global_step": 103227, "epoch": 614} {"train_loss": -10.026126861572266, "global_step": 103228, "epoch": 614} {"train_loss": -9.951750755310059, "global_step": 103229, "epoch": 614} {"train_loss": -10.097192764282227, "global_step": 103230, "epoch": 614} {"train_loss": -10.029494285583496, "global_step": 103231, "epoch": 614} {"train_loss": -9.951997756958008, "global_step": 103232, "epoch": 614} {"train_loss": -9.923497200012207, "global_step": 103233, "epoch": 614} {"train_loss": -10.061153411865234, "global_step": 103234, "epoch": 614} {"train_loss": -9.796358108520508, "global_step": 103235, "epoch": 614} {"train_loss": -10.058279037475586, "global_step": 103236, "epoch": 614} {"train_loss": -9.830205917358398, "global_step": 103237, "epoch": 614} {"train_loss": -9.86369800567627, "global_step": 103238, "epoch": 614} {"train_loss": -9.869939804077148, "global_step": 103239, "epoch": 614} {"train_loss": -9.88691520690918, "global_step": 103240, "epoch": 614} {"train_loss": -9.881017684936523, "global_step": 103241, "epoch": 614} {"train_loss": -9.590071678161621, "global_step": 103242, "epoch": 614} {"train_loss": -9.728598594665527, "global_step": 103243, "epoch": 614} {"train_loss": -9.77038860321045, "global_step": 103244, "epoch": 614} {"train_loss": -10.012039184570312, "global_step": 103245, "epoch": 614} {"train_loss": -9.906573295593262, "global_step": 103246, "epoch": 614} {"train_loss": -9.84684944152832, "global_step": 103247, "epoch": 614} {"train_loss": -10.084343910217285, "global_step": 103248, "epoch": 614} {"train_loss": -9.783711433410645, "global_step": 103249, "epoch": 614} {"train_loss": -9.98797607421875, "global_step": 103250, "epoch": 614} {"train_loss": -9.65971851348877, "global_step": 103251, "epoch": 614} {"train_loss": -9.74041748046875, "global_step": 103252, "epoch": 614} {"train_loss": -10.018064498901367, "global_step": 103253, "epoch": 614} {"train_loss": -9.857318878173828, "global_step": 103254, "epoch": 614} {"train_loss": -10.012557029724121, "global_step": 103255, "epoch": 614} {"train_loss": -9.773681640625, "global_step": 103256, "epoch": 614} {"train_loss": -9.746652603149414, "global_step": 103257, "epoch": 614} {"train_loss": -10.014225006103516, "global_step": 103258, "epoch": 614} {"train_loss": -9.788981437683105, "global_step": 103259, "epoch": 614} {"train_loss": -9.812623977661133, "global_step": 103260, "epoch": 614} {"train_loss": -9.745336532592773, "global_step": 103261, "epoch": 614} {"train_loss": -10.004430770874023, "global_step": 103262, "epoch": 614} {"train_loss": -9.915870666503906, "global_step": 103263, "epoch": 614} {"train_loss": -9.734070777893066, "global_step": 103264, "epoch": 614} {"train_loss": -9.970926284790039, "global_step": 103265, "epoch": 614} {"train_loss": -9.767890930175781, "global_step": 103266, "epoch": 614} {"train_loss": -9.489151000976562, "global_step": 103267, "epoch": 614} {"train_loss": -9.69112777709961, "global_step": 103268, "epoch": 614} {"train_loss": -9.023335456848145, "global_step": 103269, "epoch": 614} {"train_loss": -9.739419937133789, "global_step": 103270, "epoch": 614} {"train_loss": -9.240182876586914, "global_step": 103271, "epoch": 614} {"train_loss": -9.84010124206543, "global_step": 103272, "epoch": 614} {"train_loss": -9.189435958862305, "global_step": 103273, "epoch": 614} {"train_loss": -10.000431060791016, "global_step": 103274, "epoch": 614} {"train_loss": -9.735594749450684, "global_step": 103275, "epoch": 614} {"train_loss": -9.657295227050781, "global_step": 103276, "epoch": 614} {"train_loss": -9.823968887329102, "global_step": 103277, "epoch": 614} {"train_loss": -9.473845481872559, "global_step": 103278, "epoch": 614} {"train_loss": -9.535318374633789, "global_step": 103279, "epoch": 614} {"train_loss": -9.555265426635742, "global_step": 103280, "epoch": 614} {"train_loss": -9.611112594604492, "global_step": 103281, "epoch": 614} {"train_loss": -9.581775665283203, "global_step": 103282, "epoch": 614} {"train_loss": -9.714727401733398, "global_step": 103283, "epoch": 614} {"train_loss": -9.744731903076172, "global_step": 103284, "epoch": 614} {"train_loss": -9.432411193847656, "global_step": 103285, "epoch": 614} {"train_loss": -9.79141616821289, "global_step": 103286, "epoch": 614} {"train_loss": -9.755319595336914, "global_step": 103287, "epoch": 614} {"train_loss": -9.765959739685059, "global_step": 103288, "epoch": 614} {"train_loss": -9.805060386657715, "global_step": 103289, "epoch": 614} {"train_loss": -9.876205444335938, "global_step": 103290, "epoch": 614} {"train_loss": -10.066797256469727, "global_step": 103291, "epoch": 614} {"train_loss": -9.768896102905273, "global_step": 103292, "epoch": 614} {"train_loss": -9.978058815002441, "global_step": 103293, "epoch": 614} {"train_loss": -9.750755310058594, "global_step": 103294, "epoch": 614} {"train_loss": -10.048402786254883, "global_step": 103295, "epoch": 614} {"train_loss": -9.630918502807617, "global_step": 103296, "epoch": 614} {"train_loss": -9.983907699584961, "global_step": 103297, "epoch": 614} {"train_loss": -9.734480857849121, "global_step": 103298, "epoch": 614} {"train_loss": -9.985990524291992, "global_step": 103299, "epoch": 614} {"train_loss": -9.980611801147461, "global_step": 103300, "epoch": 614} {"train_loss": -9.839377403259277, "global_step": 103301, "epoch": 614} {"train_loss": -9.842273712158203, "global_step": 103302, "epoch": 614} {"train_loss": -9.885010719299316, "global_step": 103303, "epoch": 614} {"train_loss": -9.848076820373535, "global_step": 103304, "epoch": 614} {"train_loss": -9.774969100952148, "global_step": 103305, "epoch": 614} {"train_loss": -9.76268196105957, "global_step": 103306, "epoch": 614} {"train_loss": -9.900018692016602, "global_step": 103307, "epoch": 614} {"train_loss": -9.390371322631836, "global_step": 103308, "epoch": 614} {"train_loss": -9.472617149353027, "global_step": 103309, "epoch": 614} {"train_loss": -9.468925476074219, "global_step": 103310, "epoch": 614} {"train_loss": -9.770186424255371, "global_step": 103311, "epoch": 614} {"train_loss": -9.887100219726562, "global_step": 103312, "epoch": 614} {"train_loss": -9.835850715637207, "global_step": 103313, "epoch": 614} {"train_loss": -9.735686302185059, "global_step": 103314, "epoch": 614} {"train_loss": -9.783303260803223, "global_step": 103315, "epoch": 614} {"train_loss": -9.719282150268555, "global_step": 103316, "epoch": 614} {"train_loss": -9.64055061340332, "global_step": 103317, "epoch": 614} {"train_loss": -9.582376480102539, "global_step": 103318, "epoch": 614} {"train_loss": -9.779489063081288, "global_step": 103319, "epoch": 614, "val_loss": 209295.5} {"train_loss": -9.892827987670898, "global_step": 103320, "epoch": 615} {"train_loss": -9.842174530029297, "global_step": 103321, "epoch": 615} {"train_loss": -10.012447357177734, "global_step": 103322, "epoch": 615} {"train_loss": -9.692767143249512, "global_step": 103323, "epoch": 615} {"train_loss": -9.721399307250977, "global_step": 103324, "epoch": 615} {"train_loss": -9.626565933227539, "global_step": 103325, "epoch": 615} {"train_loss": -9.569931030273438, "global_step": 103326, "epoch": 615} {"train_loss": -9.76412582397461, "global_step": 103327, "epoch": 615} {"train_loss": -9.818319320678711, "global_step": 103328, "epoch": 615} {"train_loss": -9.847253799438477, "global_step": 103329, "epoch": 615} {"train_loss": -9.323343276977539, "global_step": 103330, "epoch": 615} {"train_loss": -9.725580215454102, "global_step": 103331, "epoch": 615} {"train_loss": -9.606548309326172, "global_step": 103332, "epoch": 615} {"train_loss": -9.725654602050781, "global_step": 103333, "epoch": 615} {"train_loss": -9.699750900268555, "global_step": 103334, "epoch": 615} {"train_loss": -9.552101135253906, "global_step": 103335, "epoch": 615} {"train_loss": -9.74319076538086, "global_step": 103336, "epoch": 615} {"train_loss": -9.944282531738281, "global_step": 103337, "epoch": 615} {"train_loss": -9.68807315826416, "global_step": 103338, "epoch": 615} {"train_loss": -9.577352523803711, "global_step": 103339, "epoch": 615} {"train_loss": -9.805307388305664, "global_step": 103340, "epoch": 615} {"train_loss": -9.55753231048584, "global_step": 103341, "epoch": 615} {"train_loss": -9.876208305358887, "global_step": 103342, "epoch": 615} {"train_loss": -10.021530151367188, "global_step": 103343, "epoch": 615} {"train_loss": -9.691661834716797, "global_step": 103344, "epoch": 615} {"train_loss": -9.929730415344238, "global_step": 103345, "epoch": 615} {"train_loss": -9.9053316116333, "global_step": 103346, "epoch": 615} {"train_loss": -9.820353507995605, "global_step": 103347, "epoch": 615} {"train_loss": -9.916254043579102, "global_step": 103348, "epoch": 615} {"train_loss": -9.961640357971191, "global_step": 103349, "epoch": 615} {"train_loss": -9.973068237304688, "global_step": 103350, "epoch": 615} {"train_loss": -10.018893241882324, "global_step": 103351, "epoch": 615} {"train_loss": -9.727234840393066, "global_step": 103352, "epoch": 615} {"train_loss": -9.86184310913086, "global_step": 103353, "epoch": 615} {"train_loss": -9.863834381103516, "global_step": 103354, "epoch": 615} {"train_loss": -10.021834373474121, "global_step": 103355, "epoch": 615} {"train_loss": -9.584159851074219, "global_step": 103356, "epoch": 615} {"train_loss": -9.771324157714844, "global_step": 103357, "epoch": 615} {"train_loss": -10.079057693481445, "global_step": 103358, "epoch": 615} {"train_loss": -9.854677200317383, "global_step": 103359, "epoch": 615} {"train_loss": -10.007251739501953, "global_step": 103360, "epoch": 615} {"train_loss": -9.976318359375, "global_step": 103361, "epoch": 615} {"train_loss": -9.970844268798828, "global_step": 103362, "epoch": 615} {"train_loss": -9.885278701782227, "global_step": 103363, "epoch": 615} {"train_loss": -9.960575103759766, "global_step": 103364, "epoch": 615} {"train_loss": -9.912805557250977, "global_step": 103365, "epoch": 615} {"train_loss": -9.786685943603516, "global_step": 103366, "epoch": 615} {"train_loss": -9.779155731201172, "global_step": 103367, "epoch": 615} {"train_loss": -9.781375885009766, "global_step": 103368, "epoch": 615} {"train_loss": -9.791667938232422, "global_step": 103369, "epoch": 615} {"train_loss": -9.972293853759766, "global_step": 103370, "epoch": 615} {"train_loss": -9.729228973388672, "global_step": 103371, "epoch": 615} {"train_loss": -9.92630386352539, "global_step": 103372, "epoch": 615} {"train_loss": -9.821392059326172, "global_step": 103373, "epoch": 615} {"train_loss": -9.772871017456055, "global_step": 103374, "epoch": 615} {"train_loss": -9.754478454589844, "global_step": 103375, "epoch": 615} {"train_loss": -9.733291625976562, "global_step": 103376, "epoch": 615} {"train_loss": -9.891332626342773, "global_step": 103377, "epoch": 615} {"train_loss": -9.919238090515137, "global_step": 103378, "epoch": 615} {"train_loss": -9.849363327026367, "global_step": 103379, "epoch": 615} {"train_loss": -9.755500793457031, "global_step": 103380, "epoch": 615} {"train_loss": -9.552478790283203, "global_step": 103381, "epoch": 615} {"train_loss": -9.65802001953125, "global_step": 103382, "epoch": 615} {"train_loss": -9.863863945007324, "global_step": 103383, "epoch": 615} {"train_loss": -9.833295822143555, "global_step": 103384, "epoch": 615} {"train_loss": -9.612024307250977, "global_step": 103385, "epoch": 615} {"train_loss": -9.840265274047852, "global_step": 103386, "epoch": 615} {"train_loss": -9.58686637878418, "global_step": 103387, "epoch": 615} {"train_loss": -9.71202278137207, "global_step": 103388, "epoch": 615} {"train_loss": -9.03918170928955, "global_step": 103389, "epoch": 615} {"train_loss": -9.711745262145996, "global_step": 103390, "epoch": 615} {"train_loss": -9.523826599121094, "global_step": 103391, "epoch": 615} {"train_loss": -9.808526992797852, "global_step": 103392, "epoch": 615} {"train_loss": -9.624016761779785, "global_step": 103393, "epoch": 615} {"train_loss": -9.583564758300781, "global_step": 103394, "epoch": 615} {"train_loss": -9.696456909179688, "global_step": 103395, "epoch": 615} {"train_loss": -9.097217559814453, "global_step": 103396, "epoch": 615} {"train_loss": -9.968025207519531, "global_step": 103397, "epoch": 615} {"train_loss": -9.292579650878906, "global_step": 103398, "epoch": 615} {"train_loss": -9.81479263305664, "global_step": 103399, "epoch": 615} {"train_loss": -9.525848388671875, "global_step": 103400, "epoch": 615} {"train_loss": -9.736021041870117, "global_step": 103401, "epoch": 615} {"train_loss": -9.569448471069336, "global_step": 103402, "epoch": 615} {"train_loss": -9.897457122802734, "global_step": 103403, "epoch": 615} {"train_loss": -9.66313362121582, "global_step": 103404, "epoch": 615} {"train_loss": -9.863232612609863, "global_step": 103405, "epoch": 615} {"train_loss": -9.56584358215332, "global_step": 103406, "epoch": 615} {"train_loss": -9.853023529052734, "global_step": 103407, "epoch": 615} {"train_loss": -9.641061782836914, "global_step": 103408, "epoch": 615} {"train_loss": -9.763641357421875, "global_step": 103409, "epoch": 615} {"train_loss": -9.871872901916504, "global_step": 103410, "epoch": 615} {"train_loss": -9.658422470092773, "global_step": 103411, "epoch": 615} {"train_loss": -9.628154754638672, "global_step": 103412, "epoch": 615} {"train_loss": -9.89428424835205, "global_step": 103413, "epoch": 615} {"train_loss": -9.642417907714844, "global_step": 103414, "epoch": 615} {"train_loss": -10.103647232055664, "global_step": 103415, "epoch": 615} {"train_loss": -9.636751174926758, "global_step": 103416, "epoch": 615} {"train_loss": -9.672040939331055, "global_step": 103417, "epoch": 615} {"train_loss": -9.815128326416016, "global_step": 103418, "epoch": 615} {"train_loss": -9.763901710510254, "global_step": 103419, "epoch": 615} {"train_loss": -9.903482437133789, "global_step": 103420, "epoch": 615} {"train_loss": -9.58674144744873, "global_step": 103421, "epoch": 615} {"train_loss": -9.576193809509277, "global_step": 103422, "epoch": 615} {"train_loss": -9.21188735961914, "global_step": 103423, "epoch": 615} {"train_loss": -9.68766975402832, "global_step": 103424, "epoch": 615} {"train_loss": -9.475645065307617, "global_step": 103425, "epoch": 615} {"train_loss": -9.949455261230469, "global_step": 103426, "epoch": 615} {"train_loss": -9.518953323364258, "global_step": 103427, "epoch": 615} {"train_loss": -9.749008178710938, "global_step": 103428, "epoch": 615} {"train_loss": -9.262537002563477, "global_step": 103429, "epoch": 615} {"train_loss": -9.739141464233398, "global_step": 103430, "epoch": 615} {"train_loss": -9.422690391540527, "global_step": 103431, "epoch": 615} {"train_loss": -9.606677055358887, "global_step": 103432, "epoch": 615} {"train_loss": -9.648820877075195, "global_step": 103433, "epoch": 615} {"train_loss": -9.60771369934082, "global_step": 103434, "epoch": 615} {"train_loss": -9.628717422485352, "global_step": 103435, "epoch": 615} {"train_loss": -9.402395248413086, "global_step": 103436, "epoch": 615} {"train_loss": -9.574880599975586, "global_step": 103437, "epoch": 615} {"train_loss": -9.607036590576172, "global_step": 103438, "epoch": 615} {"train_loss": -9.709309577941895, "global_step": 103439, "epoch": 615} {"train_loss": -9.683737754821777, "global_step": 103440, "epoch": 615} {"train_loss": -9.708002090454102, "global_step": 103441, "epoch": 615} {"train_loss": -9.787328720092773, "global_step": 103442, "epoch": 615} {"train_loss": -9.905454635620117, "global_step": 103443, "epoch": 615} {"train_loss": -9.661184310913086, "global_step": 103444, "epoch": 615} {"train_loss": -9.729758262634277, "global_step": 103445, "epoch": 615} {"train_loss": -9.39261245727539, "global_step": 103446, "epoch": 615} {"train_loss": -10.023494720458984, "global_step": 103447, "epoch": 615} {"train_loss": -9.590091705322266, "global_step": 103448, "epoch": 615} {"train_loss": -9.698410987854004, "global_step": 103449, "epoch": 615} {"train_loss": -9.672639846801758, "global_step": 103450, "epoch": 615} {"train_loss": -9.828863143920898, "global_step": 103451, "epoch": 615} {"train_loss": -9.769041061401367, "global_step": 103452, "epoch": 615} {"train_loss": -9.532892227172852, "global_step": 103453, "epoch": 615} {"train_loss": -9.544418334960938, "global_step": 103454, "epoch": 615} {"train_loss": -9.795604705810547, "global_step": 103455, "epoch": 615} {"train_loss": -9.852285385131836, "global_step": 103456, "epoch": 615} {"train_loss": -9.787130355834961, "global_step": 103457, "epoch": 615} {"train_loss": -9.82012939453125, "global_step": 103458, "epoch": 615} {"train_loss": -9.792402267456055, "global_step": 103459, "epoch": 615} {"train_loss": -9.936370849609375, "global_step": 103460, "epoch": 615} {"train_loss": -9.721935272216797, "global_step": 103461, "epoch": 615} {"train_loss": -10.073354721069336, "global_step": 103462, "epoch": 615} {"train_loss": -9.66735553741455, "global_step": 103463, "epoch": 615} {"train_loss": -10.076762199401855, "global_step": 103464, "epoch": 615} {"train_loss": -9.883035659790039, "global_step": 103465, "epoch": 615} {"train_loss": -9.865591049194336, "global_step": 103466, "epoch": 615} {"train_loss": -10.090312957763672, "global_step": 103467, "epoch": 615} {"train_loss": -10.01232624053955, "global_step": 103468, "epoch": 615} {"train_loss": -10.037723541259766, "global_step": 103469, "epoch": 615} {"train_loss": -10.00676155090332, "global_step": 103470, "epoch": 615} {"train_loss": -10.057538986206055, "global_step": 103471, "epoch": 615} {"train_loss": -9.939727783203125, "global_step": 103472, "epoch": 615} {"train_loss": -9.659579277038574, "global_step": 103473, "epoch": 615} {"train_loss": -9.713654518127441, "global_step": 103474, "epoch": 615} {"train_loss": -9.777804374694824, "global_step": 103475, "epoch": 615} {"train_loss": -9.710427284240723, "global_step": 103476, "epoch": 615} {"train_loss": -9.597628593444824, "global_step": 103477, "epoch": 615} {"train_loss": -9.286312103271484, "global_step": 103478, "epoch": 615} {"train_loss": -9.892304420471191, "global_step": 103479, "epoch": 615} {"train_loss": -9.623465538024902, "global_step": 103480, "epoch": 615} {"train_loss": -9.883598327636719, "global_step": 103481, "epoch": 615} {"train_loss": -9.911523818969727, "global_step": 103482, "epoch": 615} {"train_loss": -9.746896743774414, "global_step": 103483, "epoch": 615} {"train_loss": -9.894314765930176, "global_step": 103484, "epoch": 615} {"train_loss": -9.926105499267578, "global_step": 103485, "epoch": 615} {"train_loss": -9.80681037902832, "global_step": 103486, "epoch": 615} {"train_loss": -9.751438986687432, "global_step": 103487, "epoch": 615, "val_loss": 205382.6875, "train_action_mse_error": 3.891542911529541} {"train_loss": -9.77586841583252, "global_step": 103488, "epoch": 616} {"train_loss": -9.874540328979492, "global_step": 103489, "epoch": 616} {"train_loss": -9.776748657226562, "global_step": 103490, "epoch": 616} {"train_loss": -9.7355318069458, "global_step": 103491, "epoch": 616} {"train_loss": -9.507322311401367, "global_step": 103492, "epoch": 616} {"train_loss": -9.578068733215332, "global_step": 103493, "epoch": 616} {"train_loss": -9.470949172973633, "global_step": 103494, "epoch": 616} {"train_loss": -9.811275482177734, "global_step": 103495, "epoch": 616} {"train_loss": -9.33660888671875, "global_step": 103496, "epoch": 616} {"train_loss": -9.734953880310059, "global_step": 103497, "epoch": 616} {"train_loss": -9.340091705322266, "global_step": 103498, "epoch": 616} {"train_loss": -9.640430450439453, "global_step": 103499, "epoch": 616} {"train_loss": -9.647695541381836, "global_step": 103500, "epoch": 616} {"train_loss": -9.930371284484863, "global_step": 103501, "epoch": 616} {"train_loss": -9.911310195922852, "global_step": 103502, "epoch": 616} {"train_loss": -9.854411125183105, "global_step": 103503, "epoch": 616} {"train_loss": -9.876566886901855, "global_step": 103504, "epoch": 616} {"train_loss": -9.785482406616211, "global_step": 103505, "epoch": 616} {"train_loss": -9.881860733032227, "global_step": 103506, "epoch": 616} {"train_loss": -9.845808029174805, "global_step": 103507, "epoch": 616} {"train_loss": -9.73685359954834, "global_step": 103508, "epoch": 616} {"train_loss": -9.756160736083984, "global_step": 103509, "epoch": 616} {"train_loss": -9.90591049194336, "global_step": 103510, "epoch": 616} {"train_loss": -9.935869216918945, "global_step": 103511, "epoch": 616} {"train_loss": -9.885875701904297, "global_step": 103512, "epoch": 616} {"train_loss": -9.968592643737793, "global_step": 103513, "epoch": 616} {"train_loss": -9.88713550567627, "global_step": 103514, "epoch": 616} {"train_loss": -9.796466827392578, "global_step": 103515, "epoch": 616} {"train_loss": -10.033992767333984, "global_step": 103516, "epoch": 616} {"train_loss": -9.872737884521484, "global_step": 103517, "epoch": 616} {"train_loss": -9.935331344604492, "global_step": 103518, "epoch": 616} {"train_loss": -9.852816581726074, "global_step": 103519, "epoch": 616} {"train_loss": -9.707547187805176, "global_step": 103520, "epoch": 616} {"train_loss": -9.858640670776367, "global_step": 103521, "epoch": 616} {"train_loss": -10.037311553955078, "global_step": 103522, "epoch": 616} {"train_loss": -9.737746238708496, "global_step": 103523, "epoch": 616} {"train_loss": -10.238615989685059, "global_step": 103524, "epoch": 616} {"train_loss": -9.721402168273926, "global_step": 103525, "epoch": 616} {"train_loss": -9.980332374572754, "global_step": 103526, "epoch": 616} {"train_loss": -9.913755416870117, "global_step": 103527, "epoch": 616} {"train_loss": -9.606354713439941, "global_step": 103528, "epoch": 616} {"train_loss": -9.623966217041016, "global_step": 103529, "epoch": 616} {"train_loss": -9.523205757141113, "global_step": 103530, "epoch": 616} {"train_loss": -9.143705368041992, "global_step": 103531, "epoch": 616} {"train_loss": -9.774360656738281, "global_step": 103532, "epoch": 616} {"train_loss": -9.669724464416504, "global_step": 103533, "epoch": 616} {"train_loss": -9.648634910583496, "global_step": 103534, "epoch": 616} {"train_loss": -9.9951171875, "global_step": 103535, "epoch": 616} {"train_loss": -9.818093299865723, "global_step": 103536, "epoch": 616} {"train_loss": -9.836271286010742, "global_step": 103537, "epoch": 616} {"train_loss": -9.793624877929688, "global_step": 103538, "epoch": 616} {"train_loss": -9.793892860412598, "global_step": 103539, "epoch": 616} {"train_loss": -9.868661880493164, "global_step": 103540, "epoch": 616} {"train_loss": -9.606958389282227, "global_step": 103541, "epoch": 616} {"train_loss": -10.081907272338867, "global_step": 103542, "epoch": 616} {"train_loss": -9.802483558654785, "global_step": 103543, "epoch": 616} {"train_loss": -9.63484001159668, "global_step": 103544, "epoch": 616} {"train_loss": -9.602636337280273, "global_step": 103545, "epoch": 616} {"train_loss": -9.986053466796875, "global_step": 103546, "epoch": 616} {"train_loss": -9.51309585571289, "global_step": 103547, "epoch": 616} {"train_loss": -9.937499046325684, "global_step": 103548, "epoch": 616} {"train_loss": -9.388925552368164, "global_step": 103549, "epoch": 616} {"train_loss": -9.834572792053223, "global_step": 103550, "epoch": 616} {"train_loss": -9.295222282409668, "global_step": 103551, "epoch": 616} {"train_loss": -9.45106315612793, "global_step": 103552, "epoch": 616} {"train_loss": -9.611413955688477, "global_step": 103553, "epoch": 616} {"train_loss": -9.80120849609375, "global_step": 103554, "epoch": 616} {"train_loss": -9.519489288330078, "global_step": 103555, "epoch": 616} {"train_loss": -9.956815719604492, "global_step": 103556, "epoch": 616} {"train_loss": -9.671485900878906, "global_step": 103557, "epoch": 616} {"train_loss": -9.819059371948242, "global_step": 103558, "epoch": 616} {"train_loss": -9.674013137817383, "global_step": 103559, "epoch": 616} {"train_loss": -9.714818954467773, "global_step": 103560, "epoch": 616} {"train_loss": -9.911467552185059, "global_step": 103561, "epoch": 616} {"train_loss": -9.751346588134766, "global_step": 103562, "epoch": 616} {"train_loss": -9.68722152709961, "global_step": 103563, "epoch": 616} {"train_loss": -9.781787872314453, "global_step": 103564, "epoch": 616} {"train_loss": -9.826613426208496, "global_step": 103565, "epoch": 616} {"train_loss": -9.865394592285156, "global_step": 103566, "epoch": 616} {"train_loss": -9.855794906616211, "global_step": 103567, "epoch": 616} {"train_loss": -9.976810455322266, "global_step": 103568, "epoch": 616} {"train_loss": -9.72863483428955, "global_step": 103569, "epoch": 616} {"train_loss": -10.030706405639648, "global_step": 103570, "epoch": 616} {"train_loss": -10.006852149963379, "global_step": 103571, "epoch": 616} {"train_loss": -10.09541130065918, "global_step": 103572, "epoch": 616} {"train_loss": -9.906042098999023, "global_step": 103573, "epoch": 616} {"train_loss": -9.803459167480469, "global_step": 103574, "epoch": 616} {"train_loss": -9.978168487548828, "global_step": 103575, "epoch": 616} {"train_loss": -9.82791805267334, "global_step": 103576, "epoch": 616} {"train_loss": -9.962955474853516, "global_step": 103577, "epoch": 616} {"train_loss": -9.944944381713867, "global_step": 103578, "epoch": 616} {"train_loss": -9.685752868652344, "global_step": 103579, "epoch": 616} {"train_loss": -9.880247116088867, "global_step": 103580, "epoch": 616} {"train_loss": -9.866044998168945, "global_step": 103581, "epoch": 616} {"train_loss": -10.0006742477417, "global_step": 103582, "epoch": 616} {"train_loss": -10.037055969238281, "global_step": 103583, "epoch": 616} {"train_loss": -10.264030456542969, "global_step": 103584, "epoch": 616} {"train_loss": -10.306639671325684, "global_step": 103585, "epoch": 616} {"train_loss": -9.811458587646484, "global_step": 103586, "epoch": 616} {"train_loss": -9.959376335144043, "global_step": 103587, "epoch": 616} {"train_loss": -9.459545135498047, "global_step": 103588, "epoch": 616} {"train_loss": -10.068025588989258, "global_step": 103589, "epoch": 616} {"train_loss": -9.328546524047852, "global_step": 103590, "epoch": 616} {"train_loss": -9.451964378356934, "global_step": 103591, "epoch": 616} {"train_loss": -10.129193305969238, "global_step": 103592, "epoch": 616} {"train_loss": -9.214177131652832, "global_step": 103593, "epoch": 616} {"train_loss": -9.69443130493164, "global_step": 103594, "epoch": 616} {"train_loss": -9.596528053283691, "global_step": 103595, "epoch": 616} {"train_loss": -9.512624740600586, "global_step": 103596, "epoch": 616} {"train_loss": -9.581692695617676, "global_step": 103597, "epoch": 616} {"train_loss": -9.184928894042969, "global_step": 103598, "epoch": 616} {"train_loss": -9.469358444213867, "global_step": 103599, "epoch": 616} {"train_loss": -9.791353225708008, "global_step": 103600, "epoch": 616} {"train_loss": -9.320038795471191, "global_step": 103601, "epoch": 616} {"train_loss": -9.812407493591309, "global_step": 103602, "epoch": 616} {"train_loss": -9.783413887023926, "global_step": 103603, "epoch": 616} {"train_loss": -9.673530578613281, "global_step": 103604, "epoch": 616} {"train_loss": -9.612008094787598, "global_step": 103605, "epoch": 616} {"train_loss": -9.830381393432617, "global_step": 103606, "epoch": 616} {"train_loss": -9.450331687927246, "global_step": 103607, "epoch": 616} {"train_loss": -9.946052551269531, "global_step": 103608, "epoch": 616} {"train_loss": -9.710952758789062, "global_step": 103609, "epoch": 616} {"train_loss": -9.552915573120117, "global_step": 103610, "epoch": 616} {"train_loss": -9.817830085754395, "global_step": 103611, "epoch": 616} {"train_loss": -9.768695831298828, "global_step": 103612, "epoch": 616} {"train_loss": -9.752668380737305, "global_step": 103613, "epoch": 616} {"train_loss": -9.929119110107422, "global_step": 103614, "epoch": 616} {"train_loss": -9.761819839477539, "global_step": 103615, "epoch": 616} {"train_loss": -9.8950834274292, "global_step": 103616, "epoch": 616} {"train_loss": -9.77707576751709, "global_step": 103617, "epoch": 616} {"train_loss": -9.716329574584961, "global_step": 103618, "epoch": 616} {"train_loss": -10.020444869995117, "global_step": 103619, "epoch": 616} {"train_loss": -9.965163230895996, "global_step": 103620, "epoch": 616} {"train_loss": -9.918194770812988, "global_step": 103621, "epoch": 616} {"train_loss": -9.912960052490234, "global_step": 103622, "epoch": 616} {"train_loss": -9.807710647583008, "global_step": 103623, "epoch": 616} {"train_loss": -9.849076271057129, "global_step": 103624, "epoch": 616} {"train_loss": -9.803905487060547, "global_step": 103625, "epoch": 616} {"train_loss": -9.873309135437012, "global_step": 103626, "epoch": 616} {"train_loss": -9.651222229003906, "global_step": 103627, "epoch": 616} {"train_loss": -9.95068073272705, "global_step": 103628, "epoch": 616} {"train_loss": -9.8545560836792, "global_step": 103629, "epoch": 616} {"train_loss": -10.120542526245117, "global_step": 103630, "epoch": 616} {"train_loss": -9.655665397644043, "global_step": 103631, "epoch": 616} {"train_loss": -9.870708465576172, "global_step": 103632, "epoch": 616} {"train_loss": -9.910895347595215, "global_step": 103633, "epoch": 616} {"train_loss": -9.879461288452148, "global_step": 103634, "epoch": 616} {"train_loss": -9.7610445022583, "global_step": 103635, "epoch": 616} {"train_loss": -9.920827865600586, "global_step": 103636, "epoch": 616} {"train_loss": -10.054194450378418, "global_step": 103637, "epoch": 616} {"train_loss": -10.086353302001953, "global_step": 103638, "epoch": 616} {"train_loss": -10.176922798156738, "global_step": 103639, "epoch": 616} {"train_loss": -9.972784042358398, "global_step": 103640, "epoch": 616} {"train_loss": -9.942331314086914, "global_step": 103641, "epoch": 616} {"train_loss": -9.961124420166016, "global_step": 103642, "epoch": 616} {"train_loss": -10.03676986694336, "global_step": 103643, "epoch": 616} {"train_loss": -10.050914764404297, "global_step": 103644, "epoch": 616} {"train_loss": -9.753423690795898, "global_step": 103645, "epoch": 616} {"train_loss": -9.932465553283691, "global_step": 103646, "epoch": 616} {"train_loss": -9.732934951782227, "global_step": 103647, "epoch": 616} {"train_loss": -9.88187026977539, "global_step": 103648, "epoch": 616} {"train_loss": -10.076025009155273, "global_step": 103649, "epoch": 616} {"train_loss": -9.56873607635498, "global_step": 103650, "epoch": 616} {"train_loss": -10.079051971435547, "global_step": 103651, "epoch": 616} {"train_loss": -9.899385452270508, "global_step": 103652, "epoch": 616} {"train_loss": -9.418502807617188, "global_step": 103653, "epoch": 616} {"train_loss": -9.55614185333252, "global_step": 103654, "epoch": 616} {"train_loss": -9.789254233950661, "global_step": 103655, "epoch": 616, "val_loss": 208397.65625} {"train_loss": -8.38165283203125, "global_step": 103656, "epoch": 617} {"train_loss": -9.532869338989258, "global_step": 103657, "epoch": 617} {"train_loss": -9.369324684143066, "global_step": 103658, "epoch": 617} {"train_loss": -9.42656135559082, "global_step": 103659, "epoch": 617} {"train_loss": -9.225740432739258, "global_step": 103660, "epoch": 617} {"train_loss": -9.403441429138184, "global_step": 103661, "epoch": 617} {"train_loss": -9.458717346191406, "global_step": 103662, "epoch": 617} {"train_loss": -9.341400146484375, "global_step": 103663, "epoch": 617} {"train_loss": -9.58627700805664, "global_step": 103664, "epoch": 617} {"train_loss": -9.26453971862793, "global_step": 103665, "epoch": 617} {"train_loss": -9.576952934265137, "global_step": 103666, "epoch": 617} {"train_loss": -9.765915870666504, "global_step": 103667, "epoch": 617} {"train_loss": -9.603157043457031, "global_step": 103668, "epoch": 617} {"train_loss": -9.484750747680664, "global_step": 103669, "epoch": 617} {"train_loss": -9.416333198547363, "global_step": 103670, "epoch": 617} {"train_loss": -9.53189754486084, "global_step": 103671, "epoch": 617} {"train_loss": -9.516868591308594, "global_step": 103672, "epoch": 617} {"train_loss": -9.735347747802734, "global_step": 103673, "epoch": 617} {"train_loss": -9.421327590942383, "global_step": 103674, "epoch": 617} {"train_loss": -9.624629974365234, "global_step": 103675, "epoch": 617} {"train_loss": -9.717548370361328, "global_step": 103676, "epoch": 617} {"train_loss": -9.333782196044922, "global_step": 103677, "epoch": 617} {"train_loss": -9.564266204833984, "global_step": 103678, "epoch": 617} {"train_loss": -9.366342544555664, "global_step": 103679, "epoch": 617} {"train_loss": -9.76152515411377, "global_step": 103680, "epoch": 617} {"train_loss": -9.528606414794922, "global_step": 103681, "epoch": 617} {"train_loss": -9.895774841308594, "global_step": 103682, "epoch": 617} {"train_loss": -9.837553024291992, "global_step": 103683, "epoch": 617} {"train_loss": -9.672857284545898, "global_step": 103684, "epoch": 617} {"train_loss": -9.83127212524414, "global_step": 103685, "epoch": 617} {"train_loss": -9.944841384887695, "global_step": 103686, "epoch": 617} {"train_loss": -9.69900894165039, "global_step": 103687, "epoch": 617} {"train_loss": -9.643643379211426, "global_step": 103688, "epoch": 617} {"train_loss": -9.97464370727539, "global_step": 103689, "epoch": 617} {"train_loss": -10.087382316589355, "global_step": 103690, "epoch": 617} {"train_loss": -9.547231674194336, "global_step": 103691, "epoch": 617} {"train_loss": -9.881089210510254, "global_step": 103692, "epoch": 617} {"train_loss": -9.675107955932617, "global_step": 103693, "epoch": 617} {"train_loss": -9.823575019836426, "global_step": 103694, "epoch": 617} {"train_loss": -9.668766975402832, "global_step": 103695, "epoch": 617} {"train_loss": -9.682059288024902, "global_step": 103696, "epoch": 617} {"train_loss": -9.869783401489258, "global_step": 103697, "epoch": 617} {"train_loss": -9.20829963684082, "global_step": 103698, "epoch": 617} {"train_loss": -9.972892761230469, "global_step": 103699, "epoch": 617} {"train_loss": -9.698989868164062, "global_step": 103700, "epoch": 617} {"train_loss": -9.897876739501953, "global_step": 103701, "epoch": 617} {"train_loss": -9.887152671813965, "global_step": 103702, "epoch": 617} {"train_loss": -9.603100776672363, "global_step": 103703, "epoch": 617} {"train_loss": -9.68666934967041, "global_step": 103704, "epoch": 617} {"train_loss": -9.591556549072266, "global_step": 103705, "epoch": 617} {"train_loss": -9.885765075683594, "global_step": 103706, "epoch": 617} {"train_loss": -9.444053649902344, "global_step": 103707, "epoch": 617} {"train_loss": -9.708696365356445, "global_step": 103708, "epoch": 617} {"train_loss": -9.456740379333496, "global_step": 103709, "epoch": 617} {"train_loss": -9.723647117614746, "global_step": 103710, "epoch": 617} {"train_loss": -9.643623352050781, "global_step": 103711, "epoch": 617} {"train_loss": -9.360933303833008, "global_step": 103712, "epoch": 617} {"train_loss": -9.762046813964844, "global_step": 103713, "epoch": 617} {"train_loss": -9.70589828491211, "global_step": 103714, "epoch": 617} {"train_loss": -9.430418014526367, "global_step": 103715, "epoch": 617} {"train_loss": -9.891947746276855, "global_step": 103716, "epoch": 617} {"train_loss": -9.489053726196289, "global_step": 103717, "epoch": 617} {"train_loss": -9.616159439086914, "global_step": 103718, "epoch": 617} {"train_loss": -9.530783653259277, "global_step": 103719, "epoch": 617} {"train_loss": -9.519367218017578, "global_step": 103720, "epoch": 617} {"train_loss": -9.522706985473633, "global_step": 103721, "epoch": 617} {"train_loss": -9.670389175415039, "global_step": 103722, "epoch": 617} {"train_loss": -9.494539260864258, "global_step": 103723, "epoch": 617} {"train_loss": -9.894224166870117, "global_step": 103724, "epoch": 617} {"train_loss": -9.751461029052734, "global_step": 103725, "epoch": 617} {"train_loss": -9.810628890991211, "global_step": 103726, "epoch": 617} {"train_loss": -9.401143074035645, "global_step": 103727, "epoch": 617} {"train_loss": -9.84013557434082, "global_step": 103728, "epoch": 617} {"train_loss": -9.389730453491211, "global_step": 103729, "epoch": 617} {"train_loss": -9.745866775512695, "global_step": 103730, "epoch": 617} {"train_loss": -9.784195899963379, "global_step": 103731, "epoch": 617} {"train_loss": -9.537558555603027, "global_step": 103732, "epoch": 617} {"train_loss": -9.573915481567383, "global_step": 103733, "epoch": 617} {"train_loss": -9.620260238647461, "global_step": 103734, "epoch": 617} {"train_loss": -9.294288635253906, "global_step": 103735, "epoch": 617} {"train_loss": -9.396065711975098, "global_step": 103736, "epoch": 617} {"train_loss": -9.595488548278809, "global_step": 103737, "epoch": 617} {"train_loss": -9.199170112609863, "global_step": 103738, "epoch": 617} {"train_loss": -9.679442405700684, "global_step": 103739, "epoch": 617} {"train_loss": -9.62208366394043, "global_step": 103740, "epoch": 617} {"train_loss": -9.464868545532227, "global_step": 103741, "epoch": 617} {"train_loss": -9.292366027832031, "global_step": 103742, "epoch": 617} {"train_loss": -9.736534118652344, "global_step": 103743, "epoch": 617} {"train_loss": -9.561636924743652, "global_step": 103744, "epoch": 617} {"train_loss": -9.35783576965332, "global_step": 103745, "epoch": 617} {"train_loss": -9.356039047241211, "global_step": 103746, "epoch": 617} {"train_loss": -9.218364715576172, "global_step": 103747, "epoch": 617} {"train_loss": -9.266222953796387, "global_step": 103748, "epoch": 617} {"train_loss": -9.694892883300781, "global_step": 103749, "epoch": 617} {"train_loss": -9.2785005569458, "global_step": 103750, "epoch": 617} {"train_loss": -9.199657440185547, "global_step": 103751, "epoch": 617} {"train_loss": -9.682615280151367, "global_step": 103752, "epoch": 617} {"train_loss": -9.371257781982422, "global_step": 103753, "epoch": 617} {"train_loss": -9.335578918457031, "global_step": 103754, "epoch": 617} {"train_loss": -9.762368202209473, "global_step": 103755, "epoch": 617} {"train_loss": -9.501816749572754, "global_step": 103756, "epoch": 617} {"train_loss": -9.485477447509766, "global_step": 103757, "epoch": 617} {"train_loss": -9.62098503112793, "global_step": 103758, "epoch": 617} {"train_loss": -9.717488288879395, "global_step": 103759, "epoch": 617} {"train_loss": -9.584965705871582, "global_step": 103760, "epoch": 617} {"train_loss": -9.919447898864746, "global_step": 103761, "epoch": 617} {"train_loss": -9.717971801757812, "global_step": 103762, "epoch": 617} {"train_loss": -9.67747974395752, "global_step": 103763, "epoch": 617} {"train_loss": -9.8231201171875, "global_step": 103764, "epoch": 617} {"train_loss": -9.885818481445312, "global_step": 103765, "epoch": 617} {"train_loss": -9.823775291442871, "global_step": 103766, "epoch": 617} {"train_loss": -9.902181625366211, "global_step": 103767, "epoch": 617} {"train_loss": -9.793350219726562, "global_step": 103768, "epoch": 617} {"train_loss": -9.808876037597656, "global_step": 103769, "epoch": 617} {"train_loss": -9.851825714111328, "global_step": 103770, "epoch": 617} {"train_loss": -9.984561920166016, "global_step": 103771, "epoch": 617} {"train_loss": -9.824935913085938, "global_step": 103772, "epoch": 617} {"train_loss": -9.926799774169922, "global_step": 103773, "epoch": 617} {"train_loss": -10.029565811157227, "global_step": 103774, "epoch": 617} {"train_loss": -9.896584510803223, "global_step": 103775, "epoch": 617} {"train_loss": -9.917506217956543, "global_step": 103776, "epoch": 617} {"train_loss": -10.096696853637695, "global_step": 103777, "epoch": 617} {"train_loss": -10.013839721679688, "global_step": 103778, "epoch": 617} {"train_loss": -10.019262313842773, "global_step": 103779, "epoch": 617} {"train_loss": -10.211517333984375, "global_step": 103780, "epoch": 617} {"train_loss": -10.018245697021484, "global_step": 103781, "epoch": 617} {"train_loss": -10.098188400268555, "global_step": 103782, "epoch": 617} {"train_loss": -10.075704574584961, "global_step": 103783, "epoch": 617} {"train_loss": -10.17123031616211, "global_step": 103784, "epoch": 617} {"train_loss": -10.007326126098633, "global_step": 103785, "epoch": 617} {"train_loss": -10.026134490966797, "global_step": 103786, "epoch": 617} {"train_loss": -10.076812744140625, "global_step": 103787, "epoch": 617} {"train_loss": -9.93688678741455, "global_step": 103788, "epoch": 617} {"train_loss": -10.05691146850586, "global_step": 103789, "epoch": 617} {"train_loss": -9.98306655883789, "global_step": 103790, "epoch": 617} {"train_loss": -9.711395263671875, "global_step": 103791, "epoch": 617} {"train_loss": -9.879302024841309, "global_step": 103792, "epoch": 617} {"train_loss": -10.086933135986328, "global_step": 103793, "epoch": 617} {"train_loss": -10.056602478027344, "global_step": 103794, "epoch": 617} {"train_loss": -10.29238510131836, "global_step": 103795, "epoch": 617} {"train_loss": -10.119832992553711, "global_step": 103796, "epoch": 617} {"train_loss": -10.092020034790039, "global_step": 103797, "epoch": 617} {"train_loss": -9.935848236083984, "global_step": 103798, "epoch": 617} {"train_loss": -10.126134872436523, "global_step": 103799, "epoch": 617} {"train_loss": -9.562963485717773, "global_step": 103800, "epoch": 617} {"train_loss": -9.843816757202148, "global_step": 103801, "epoch": 617} {"train_loss": -10.144205093383789, "global_step": 103802, "epoch": 617} {"train_loss": -9.938050270080566, "global_step": 103803, "epoch": 617} {"train_loss": -9.977360725402832, "global_step": 103804, "epoch": 617} {"train_loss": -9.898964881896973, "global_step": 103805, "epoch": 617} {"train_loss": -9.849588394165039, "global_step": 103806, "epoch": 617} {"train_loss": -10.094062805175781, "global_step": 103807, "epoch": 617} {"train_loss": -10.13958740234375, "global_step": 103808, "epoch": 617} {"train_loss": -9.96749496459961, "global_step": 103809, "epoch": 617} {"train_loss": -10.208308219909668, "global_step": 103810, "epoch": 617} {"train_loss": -9.88619613647461, "global_step": 103811, "epoch": 617} {"train_loss": -9.92425537109375, "global_step": 103812, "epoch": 617} {"train_loss": -9.9108247756958, "global_step": 103813, "epoch": 617} {"train_loss": -9.882211685180664, "global_step": 103814, "epoch": 617} {"train_loss": -9.884448051452637, "global_step": 103815, "epoch": 617} {"train_loss": -9.880712509155273, "global_step": 103816, "epoch": 617} {"train_loss": -9.809772491455078, "global_step": 103817, "epoch": 617} {"train_loss": -10.018575668334961, "global_step": 103818, "epoch": 617} {"train_loss": -9.789644241333008, "global_step": 103819, "epoch": 617} {"train_loss": -9.713048934936523, "global_step": 103820, "epoch": 617} {"train_loss": -9.264995574951172, "global_step": 103821, "epoch": 617} {"train_loss": -9.567547798156738, "global_step": 103822, "epoch": 617} {"train_loss": -9.71189870720818, "global_step": 103823, "epoch": 617, "val_loss": 208026.6875} {"train_loss": -9.743490219116211, "global_step": 103824, "epoch": 618} {"train_loss": -9.728416442871094, "global_step": 103825, "epoch": 618} {"train_loss": -9.90544319152832, "global_step": 103826, "epoch": 618} {"train_loss": -9.866551399230957, "global_step": 103827, "epoch": 618} {"train_loss": -9.915985107421875, "global_step": 103828, "epoch": 618} {"train_loss": -9.723867416381836, "global_step": 103829, "epoch": 618} {"train_loss": -9.764345169067383, "global_step": 103830, "epoch": 618} {"train_loss": -9.775988578796387, "global_step": 103831, "epoch": 618} {"train_loss": -9.381196975708008, "global_step": 103832, "epoch": 618} {"train_loss": -9.825387954711914, "global_step": 103833, "epoch": 618} {"train_loss": -9.671991348266602, "global_step": 103834, "epoch": 618} {"train_loss": -9.765420913696289, "global_step": 103835, "epoch": 618} {"train_loss": -9.618814468383789, "global_step": 103836, "epoch": 618} {"train_loss": -9.885465621948242, "global_step": 103837, "epoch": 618} {"train_loss": -9.790857315063477, "global_step": 103838, "epoch": 618} {"train_loss": -9.810859680175781, "global_step": 103839, "epoch": 618} {"train_loss": -9.82789421081543, "global_step": 103840, "epoch": 618} {"train_loss": -9.868057250976562, "global_step": 103841, "epoch": 618} {"train_loss": -9.800060272216797, "global_step": 103842, "epoch": 618} {"train_loss": -9.95501708984375, "global_step": 103843, "epoch": 618} {"train_loss": -9.603412628173828, "global_step": 103844, "epoch": 618} {"train_loss": -9.75898265838623, "global_step": 103845, "epoch": 618} {"train_loss": -9.819894790649414, "global_step": 103846, "epoch": 618} {"train_loss": -9.928983688354492, "global_step": 103847, "epoch": 618} {"train_loss": -9.902959823608398, "global_step": 103848, "epoch": 618} {"train_loss": -9.558372497558594, "global_step": 103849, "epoch": 618} {"train_loss": -9.794939041137695, "global_step": 103850, "epoch": 618} {"train_loss": -9.851705551147461, "global_step": 103851, "epoch": 618} {"train_loss": -9.623205184936523, "global_step": 103852, "epoch": 618} {"train_loss": -9.723146438598633, "global_step": 103853, "epoch": 618} {"train_loss": -9.852483749389648, "global_step": 103854, "epoch": 618} {"train_loss": -9.855792045593262, "global_step": 103855, "epoch": 618} {"train_loss": -9.863584518432617, "global_step": 103856, "epoch": 618} {"train_loss": -9.72336196899414, "global_step": 103857, "epoch": 618} {"train_loss": -9.689159393310547, "global_step": 103858, "epoch": 618} {"train_loss": -9.78445816040039, "global_step": 103859, "epoch": 618} {"train_loss": -9.826803207397461, "global_step": 103860, "epoch": 618} {"train_loss": -9.900413513183594, "global_step": 103861, "epoch": 618} {"train_loss": -9.665488243103027, "global_step": 103862, "epoch": 618} {"train_loss": -9.787211418151855, "global_step": 103863, "epoch": 618} {"train_loss": -9.538236618041992, "global_step": 103864, "epoch": 618} {"train_loss": -9.570301055908203, "global_step": 103865, "epoch": 618} {"train_loss": -9.786503791809082, "global_step": 103866, "epoch": 618} {"train_loss": -9.449508666992188, "global_step": 103867, "epoch": 618} {"train_loss": -9.76632022857666, "global_step": 103868, "epoch": 618} {"train_loss": -9.435550689697266, "global_step": 103869, "epoch": 618} {"train_loss": -9.48836612701416, "global_step": 103870, "epoch": 618} {"train_loss": -9.804288864135742, "global_step": 103871, "epoch": 618} {"train_loss": -9.264144897460938, "global_step": 103872, "epoch": 618} {"train_loss": -9.51082706451416, "global_step": 103873, "epoch": 618} {"train_loss": -9.206512451171875, "global_step": 103874, "epoch": 618} {"train_loss": -9.780061721801758, "global_step": 103875, "epoch": 618} {"train_loss": -9.542587280273438, "global_step": 103876, "epoch": 618} {"train_loss": -9.448436737060547, "global_step": 103877, "epoch": 618} {"train_loss": -9.538473129272461, "global_step": 103878, "epoch": 618} {"train_loss": -9.161979675292969, "global_step": 103879, "epoch": 618} {"train_loss": -9.792985916137695, "global_step": 103880, "epoch": 618} {"train_loss": -9.449426651000977, "global_step": 103881, "epoch": 618} {"train_loss": -9.688091278076172, "global_step": 103882, "epoch": 618} {"train_loss": -9.172030448913574, "global_step": 103883, "epoch": 618} {"train_loss": -9.85880184173584, "global_step": 103884, "epoch": 618} {"train_loss": -9.353202819824219, "global_step": 103885, "epoch": 618} {"train_loss": -9.207308769226074, "global_step": 103886, "epoch": 618} {"train_loss": -9.276762962341309, "global_step": 103887, "epoch": 618} {"train_loss": -9.679133415222168, "global_step": 103888, "epoch": 618} {"train_loss": -9.293405532836914, "global_step": 103889, "epoch": 618} {"train_loss": -9.448848724365234, "global_step": 103890, "epoch": 618} {"train_loss": -9.334997177124023, "global_step": 103891, "epoch": 618} {"train_loss": -9.50881576538086, "global_step": 103892, "epoch": 618} {"train_loss": -9.445645332336426, "global_step": 103893, "epoch": 618} {"train_loss": -9.32232666015625, "global_step": 103894, "epoch": 618} {"train_loss": -9.742441177368164, "global_step": 103895, "epoch": 618} {"train_loss": -9.242742538452148, "global_step": 103896, "epoch": 618} {"train_loss": -9.471543312072754, "global_step": 103897, "epoch": 618} {"train_loss": -9.8311767578125, "global_step": 103898, "epoch": 618} {"train_loss": -9.663609504699707, "global_step": 103899, "epoch": 618} {"train_loss": -9.569765090942383, "global_step": 103900, "epoch": 618} {"train_loss": -9.69894027709961, "global_step": 103901, "epoch": 618} {"train_loss": -10.008441925048828, "global_step": 103902, "epoch": 618} {"train_loss": -9.855788230895996, "global_step": 103903, "epoch": 618} {"train_loss": -9.532329559326172, "global_step": 103904, "epoch": 618} {"train_loss": -9.827127456665039, "global_step": 103905, "epoch": 618} {"train_loss": -10.100574493408203, "global_step": 103906, "epoch": 618} {"train_loss": -9.773221015930176, "global_step": 103907, "epoch": 618} {"train_loss": -9.674728393554688, "global_step": 103908, "epoch": 618} {"train_loss": -9.903802871704102, "global_step": 103909, "epoch": 618} {"train_loss": -9.904932022094727, "global_step": 103910, "epoch": 618} {"train_loss": -9.69943618774414, "global_step": 103911, "epoch": 618} {"train_loss": -9.672271728515625, "global_step": 103912, "epoch": 618} {"train_loss": -9.769113540649414, "global_step": 103913, "epoch": 618} {"train_loss": -9.928665161132812, "global_step": 103914, "epoch": 618} {"train_loss": -9.722246170043945, "global_step": 103915, "epoch": 618} {"train_loss": -9.820076942443848, "global_step": 103916, "epoch": 618} {"train_loss": -9.869034767150879, "global_step": 103917, "epoch": 618} {"train_loss": -9.800814628601074, "global_step": 103918, "epoch": 618} {"train_loss": -9.791488647460938, "global_step": 103919, "epoch": 618} {"train_loss": -9.966737747192383, "global_step": 103920, "epoch": 618} {"train_loss": -9.771663665771484, "global_step": 103921, "epoch": 618} {"train_loss": -9.84682846069336, "global_step": 103922, "epoch": 618} {"train_loss": -9.992347717285156, "global_step": 103923, "epoch": 618} {"train_loss": -9.93734073638916, "global_step": 103924, "epoch": 618} {"train_loss": -9.819711685180664, "global_step": 103925, "epoch": 618} {"train_loss": -9.980512619018555, "global_step": 103926, "epoch": 618} {"train_loss": -9.664175033569336, "global_step": 103927, "epoch": 618} {"train_loss": -9.897506713867188, "global_step": 103928, "epoch": 618} {"train_loss": -9.57638931274414, "global_step": 103929, "epoch": 618} {"train_loss": -9.715313911437988, "global_step": 103930, "epoch": 618} {"train_loss": -9.45798397064209, "global_step": 103931, "epoch": 618} {"train_loss": -9.920623779296875, "global_step": 103932, "epoch": 618} {"train_loss": -9.344141006469727, "global_step": 103933, "epoch": 618} {"train_loss": -9.342296600341797, "global_step": 103934, "epoch": 618} {"train_loss": -9.724669456481934, "global_step": 103935, "epoch": 618} {"train_loss": -9.618616104125977, "global_step": 103936, "epoch": 618} {"train_loss": -9.262331008911133, "global_step": 103937, "epoch": 618} {"train_loss": -9.495247840881348, "global_step": 103938, "epoch": 618} {"train_loss": -9.277181625366211, "global_step": 103939, "epoch": 618} {"train_loss": -9.339183807373047, "global_step": 103940, "epoch": 618} {"train_loss": -9.417213439941406, "global_step": 103941, "epoch": 618} {"train_loss": -9.559271812438965, "global_step": 103942, "epoch": 618} {"train_loss": -9.31056022644043, "global_step": 103943, "epoch": 618} {"train_loss": -9.423465728759766, "global_step": 103944, "epoch": 618} {"train_loss": -9.646121978759766, "global_step": 103945, "epoch": 618} {"train_loss": -9.366630554199219, "global_step": 103946, "epoch": 618} {"train_loss": -9.612674713134766, "global_step": 103947, "epoch": 618} {"train_loss": -9.412620544433594, "global_step": 103948, "epoch": 618} {"train_loss": -9.754486083984375, "global_step": 103949, "epoch": 618} {"train_loss": -9.696380615234375, "global_step": 103950, "epoch": 618} {"train_loss": -9.857626914978027, "global_step": 103951, "epoch": 618} {"train_loss": -9.650456428527832, "global_step": 103952, "epoch": 618} {"train_loss": -9.805828094482422, "global_step": 103953, "epoch": 618} {"train_loss": -9.861078262329102, "global_step": 103954, "epoch": 618} {"train_loss": -9.630882263183594, "global_step": 103955, "epoch": 618} {"train_loss": -9.965166091918945, "global_step": 103956, "epoch": 618} {"train_loss": -9.6856050491333, "global_step": 103957, "epoch": 618} {"train_loss": -9.95676040649414, "global_step": 103958, "epoch": 618} {"train_loss": -9.573741912841797, "global_step": 103959, "epoch": 618} {"train_loss": -9.80720329284668, "global_step": 103960, "epoch": 618} {"train_loss": -9.828737258911133, "global_step": 103961, "epoch": 618} {"train_loss": -9.949201583862305, "global_step": 103962, "epoch": 618} {"train_loss": -9.96762466430664, "global_step": 103963, "epoch": 618} {"train_loss": -9.79423999786377, "global_step": 103964, "epoch": 618} {"train_loss": -9.928024291992188, "global_step": 103965, "epoch": 618} {"train_loss": -10.136844635009766, "global_step": 103966, "epoch": 618} {"train_loss": -9.914571762084961, "global_step": 103967, "epoch": 618} {"train_loss": -10.048735618591309, "global_step": 103968, "epoch": 618} {"train_loss": -9.96462345123291, "global_step": 103969, "epoch": 618} {"train_loss": -9.755243301391602, "global_step": 103970, "epoch": 618} {"train_loss": -10.205628395080566, "global_step": 103971, "epoch": 618} {"train_loss": -9.504976272583008, "global_step": 103972, "epoch": 618} {"train_loss": -9.807116508483887, "global_step": 103973, "epoch": 618} {"train_loss": -9.900552749633789, "global_step": 103974, "epoch": 618} {"train_loss": -9.783921241760254, "global_step": 103975, "epoch": 618} {"train_loss": -9.848711013793945, "global_step": 103976, "epoch": 618} {"train_loss": -9.620950698852539, "global_step": 103977, "epoch": 618} {"train_loss": -9.44953727722168, "global_step": 103978, "epoch": 618} {"train_loss": -9.908349990844727, "global_step": 103979, "epoch": 618} {"train_loss": -9.519704818725586, "global_step": 103980, "epoch": 618} {"train_loss": -9.663683891296387, "global_step": 103981, "epoch": 618} {"train_loss": -9.620942115783691, "global_step": 103982, "epoch": 618} {"train_loss": -9.743616104125977, "global_step": 103983, "epoch": 618} {"train_loss": -9.919763565063477, "global_step": 103984, "epoch": 618} {"train_loss": -9.829776763916016, "global_step": 103985, "epoch": 618} {"train_loss": -9.75711441040039, "global_step": 103986, "epoch": 618} {"train_loss": -9.284892082214355, "global_step": 103987, "epoch": 618} {"train_loss": -9.78145980834961, "global_step": 103988, "epoch": 618} {"train_loss": -9.628596305847168, "global_step": 103989, "epoch": 618} {"train_loss": -9.631298065185547, "global_step": 103990, "epoch": 618} {"train_loss": -9.692037633487157, "global_step": 103991, "epoch": 618, "val_loss": 206827.546875} {"train_loss": -9.379240989685059, "global_step": 103992, "epoch": 619} {"train_loss": -9.685281753540039, "global_step": 103993, "epoch": 619} {"train_loss": -9.180791854858398, "global_step": 103994, "epoch": 619} {"train_loss": -9.500078201293945, "global_step": 103995, "epoch": 619} {"train_loss": -9.667110443115234, "global_step": 103996, "epoch": 619} {"train_loss": -9.225486755371094, "global_step": 103997, "epoch": 619} {"train_loss": -9.6144380569458, "global_step": 103998, "epoch": 619} {"train_loss": -9.52883243560791, "global_step": 103999, "epoch": 619} {"train_loss": -9.297369956970215, "global_step": 104000, "epoch": 619} {"train_loss": -9.826803207397461, "global_step": 104001, "epoch": 619} {"train_loss": -9.389429092407227, "global_step": 104002, "epoch": 619} {"train_loss": -9.600323677062988, "global_step": 104003, "epoch": 619} {"train_loss": -9.788911819458008, "global_step": 104004, "epoch": 619} {"train_loss": -9.694499015808105, "global_step": 104005, "epoch": 619} {"train_loss": -9.541936874389648, "global_step": 104006, "epoch": 619} {"train_loss": -9.65660285949707, "global_step": 104007, "epoch": 619} {"train_loss": -9.65648365020752, "global_step": 104008, "epoch": 619} {"train_loss": -9.774552345275879, "global_step": 104009, "epoch": 619} {"train_loss": -9.569412231445312, "global_step": 104010, "epoch": 619} {"train_loss": -9.749138832092285, "global_step": 104011, "epoch": 619} {"train_loss": -9.871739387512207, "global_step": 104012, "epoch": 619} {"train_loss": -9.793732643127441, "global_step": 104013, "epoch": 619} {"train_loss": -9.976423263549805, "global_step": 104014, "epoch": 619} {"train_loss": -9.94613265991211, "global_step": 104015, "epoch": 619} {"train_loss": -10.038339614868164, "global_step": 104016, "epoch": 619} {"train_loss": -9.938783645629883, "global_step": 104017, "epoch": 619} {"train_loss": -9.818108558654785, "global_step": 104018, "epoch": 619} {"train_loss": -9.786205291748047, "global_step": 104019, "epoch": 619} {"train_loss": -9.911792755126953, "global_step": 104020, "epoch": 619} {"train_loss": -9.995655059814453, "global_step": 104021, "epoch": 619} {"train_loss": -10.0557279586792, "global_step": 104022, "epoch": 619} {"train_loss": -9.828824996948242, "global_step": 104023, "epoch": 619} {"train_loss": -9.985544204711914, "global_step": 104024, "epoch": 619} {"train_loss": -9.833198547363281, "global_step": 104025, "epoch": 619} {"train_loss": -10.053126335144043, "global_step": 104026, "epoch": 619} {"train_loss": -9.699548721313477, "global_step": 104027, "epoch": 619} {"train_loss": -10.03226375579834, "global_step": 104028, "epoch": 619} {"train_loss": -9.802846908569336, "global_step": 104029, "epoch": 619} {"train_loss": -9.68657112121582, "global_step": 104030, "epoch": 619} {"train_loss": -9.664592742919922, "global_step": 104031, "epoch": 619} {"train_loss": -9.845684051513672, "global_step": 104032, "epoch": 619} {"train_loss": -9.8812255859375, "global_step": 104033, "epoch": 619} {"train_loss": -9.99379825592041, "global_step": 104034, "epoch": 619} {"train_loss": -9.873960494995117, "global_step": 104035, "epoch": 619} {"train_loss": -9.97181224822998, "global_step": 104036, "epoch": 619} {"train_loss": -9.8223295211792, "global_step": 104037, "epoch": 619} {"train_loss": -10.068345069885254, "global_step": 104038, "epoch": 619} {"train_loss": -10.026214599609375, "global_step": 104039, "epoch": 619} {"train_loss": -9.952698707580566, "global_step": 104040, "epoch": 619} {"train_loss": -9.994701385498047, "global_step": 104041, "epoch": 619} {"train_loss": -10.130638122558594, "global_step": 104042, "epoch": 619} {"train_loss": -9.933387756347656, "global_step": 104043, "epoch": 619} {"train_loss": -10.135845184326172, "global_step": 104044, "epoch": 619} {"train_loss": -9.889358520507812, "global_step": 104045, "epoch": 619} {"train_loss": -10.187143325805664, "global_step": 104046, "epoch": 619} {"train_loss": -9.920082092285156, "global_step": 104047, "epoch": 619} {"train_loss": -9.880354881286621, "global_step": 104048, "epoch": 619} {"train_loss": -9.975847244262695, "global_step": 104049, "epoch": 619} {"train_loss": -9.781732559204102, "global_step": 104050, "epoch": 619} {"train_loss": -10.110511779785156, "global_step": 104051, "epoch": 619} {"train_loss": -9.654047012329102, "global_step": 104052, "epoch": 619} {"train_loss": -10.145801544189453, "global_step": 104053, "epoch": 619} {"train_loss": -10.198602676391602, "global_step": 104054, "epoch": 619} {"train_loss": -9.685575485229492, "global_step": 104055, "epoch": 619} {"train_loss": -10.001676559448242, "global_step": 104056, "epoch": 619} {"train_loss": -9.631805419921875, "global_step": 104057, "epoch": 619} {"train_loss": -9.531759262084961, "global_step": 104058, "epoch": 619} {"train_loss": -9.794371604919434, "global_step": 104059, "epoch": 619} {"train_loss": -9.259445190429688, "global_step": 104060, "epoch": 619} {"train_loss": -9.317121505737305, "global_step": 104061, "epoch": 619} {"train_loss": -9.370649337768555, "global_step": 104062, "epoch": 619} {"train_loss": -9.152052879333496, "global_step": 104063, "epoch": 619} {"train_loss": -9.677999496459961, "global_step": 104064, "epoch": 619} {"train_loss": -9.268562316894531, "global_step": 104065, "epoch": 619} {"train_loss": -9.710411071777344, "global_step": 104066, "epoch": 619} {"train_loss": -9.546980857849121, "global_step": 104067, "epoch": 619} {"train_loss": -9.380094528198242, "global_step": 104068, "epoch": 619} {"train_loss": -9.631105422973633, "global_step": 104069, "epoch": 619} {"train_loss": -9.822956085205078, "global_step": 104070, "epoch": 619} {"train_loss": -9.610586166381836, "global_step": 104071, "epoch": 619} {"train_loss": -9.729438781738281, "global_step": 104072, "epoch": 619} {"train_loss": -9.383190155029297, "global_step": 104073, "epoch": 619} {"train_loss": -9.814289093017578, "global_step": 104074, "epoch": 619} {"train_loss": -9.480033874511719, "global_step": 104075, "epoch": 619} {"train_loss": -9.484453201293945, "global_step": 104076, "epoch": 619} {"train_loss": -9.713141441345215, "global_step": 104077, "epoch": 619} {"train_loss": -9.709456443786621, "global_step": 104078, "epoch": 619} {"train_loss": -9.896416664123535, "global_step": 104079, "epoch": 619} {"train_loss": -9.7296781539917, "global_step": 104080, "epoch": 619} {"train_loss": -9.654672622680664, "global_step": 104081, "epoch": 619} {"train_loss": -9.709099769592285, "global_step": 104082, "epoch": 619} {"train_loss": -9.982013702392578, "global_step": 104083, "epoch": 619} {"train_loss": -9.746871948242188, "global_step": 104084, "epoch": 619} {"train_loss": -9.940696716308594, "global_step": 104085, "epoch": 619} {"train_loss": -9.660470962524414, "global_step": 104086, "epoch": 619} {"train_loss": -9.952820777893066, "global_step": 104087, "epoch": 619} {"train_loss": -9.98546028137207, "global_step": 104088, "epoch": 619} {"train_loss": -9.721395492553711, "global_step": 104089, "epoch": 619} {"train_loss": -9.826952934265137, "global_step": 104090, "epoch": 619} {"train_loss": -9.627620697021484, "global_step": 104091, "epoch": 619} {"train_loss": -9.987122535705566, "global_step": 104092, "epoch": 619} {"train_loss": -9.92435073852539, "global_step": 104093, "epoch": 619} {"train_loss": -9.839178085327148, "global_step": 104094, "epoch": 619} {"train_loss": -9.708332061767578, "global_step": 104095, "epoch": 619} {"train_loss": -9.997014999389648, "global_step": 104096, "epoch": 619} {"train_loss": -9.993934631347656, "global_step": 104097, "epoch": 619} {"train_loss": -10.017946243286133, "global_step": 104098, "epoch": 619} {"train_loss": -10.122849464416504, "global_step": 104099, "epoch": 619} {"train_loss": -9.960538864135742, "global_step": 104100, "epoch": 619} {"train_loss": -10.034132957458496, "global_step": 104101, "epoch": 619} {"train_loss": -9.863171577453613, "global_step": 104102, "epoch": 619} {"train_loss": -10.11984920501709, "global_step": 104103, "epoch": 619} {"train_loss": -10.189899444580078, "global_step": 104104, "epoch": 619} {"train_loss": -9.979297637939453, "global_step": 104105, "epoch": 619} {"train_loss": -10.187828063964844, "global_step": 104106, "epoch": 619} {"train_loss": -10.12440299987793, "global_step": 104107, "epoch": 619} {"train_loss": -9.962919235229492, "global_step": 104108, "epoch": 619} {"train_loss": -9.980644226074219, "global_step": 104109, "epoch": 619} {"train_loss": -10.288331985473633, "global_step": 104110, "epoch": 619} {"train_loss": -10.245758056640625, "global_step": 104111, "epoch": 619} {"train_loss": -9.732773780822754, "global_step": 104112, "epoch": 619} {"train_loss": -10.030983924865723, "global_step": 104113, "epoch": 619} {"train_loss": -9.925090789794922, "global_step": 104114, "epoch": 619} {"train_loss": -10.10239028930664, "global_step": 104115, "epoch": 619} {"train_loss": -9.80856704711914, "global_step": 104116, "epoch": 619} {"train_loss": -9.958497047424316, "global_step": 104117, "epoch": 619} {"train_loss": -9.866029739379883, "global_step": 104118, "epoch": 619} {"train_loss": -9.565434455871582, "global_step": 104119, "epoch": 619} {"train_loss": -9.823698043823242, "global_step": 104120, "epoch": 619} {"train_loss": -10.01913833618164, "global_step": 104121, "epoch": 619} {"train_loss": -9.794157028198242, "global_step": 104122, "epoch": 619} {"train_loss": -10.12241268157959, "global_step": 104123, "epoch": 619} {"train_loss": -10.181253433227539, "global_step": 104124, "epoch": 619} {"train_loss": -10.215645790100098, "global_step": 104125, "epoch": 619} {"train_loss": -9.972545623779297, "global_step": 104126, "epoch": 619} {"train_loss": -10.225713729858398, "global_step": 104127, "epoch": 619} {"train_loss": -9.959691047668457, "global_step": 104128, "epoch": 619} {"train_loss": -9.96328353881836, "global_step": 104129, "epoch": 619} {"train_loss": -9.665716171264648, "global_step": 104130, "epoch": 619} {"train_loss": -9.829544067382812, "global_step": 104131, "epoch": 619} {"train_loss": -10.024369239807129, "global_step": 104132, "epoch": 619} {"train_loss": -9.252767562866211, "global_step": 104133, "epoch": 619} {"train_loss": -9.263997077941895, "global_step": 104134, "epoch": 619} {"train_loss": -9.64132308959961, "global_step": 104135, "epoch": 619} {"train_loss": -9.229472160339355, "global_step": 104136, "epoch": 619} {"train_loss": -9.476728439331055, "global_step": 104137, "epoch": 619} {"train_loss": -9.538116455078125, "global_step": 104138, "epoch": 619} {"train_loss": -9.357584953308105, "global_step": 104139, "epoch": 619} {"train_loss": -9.418962478637695, "global_step": 104140, "epoch": 619} {"train_loss": -9.407883644104004, "global_step": 104141, "epoch": 619} {"train_loss": -9.538326263427734, "global_step": 104142, "epoch": 619} {"train_loss": -9.720235824584961, "global_step": 104143, "epoch": 619} {"train_loss": -9.330024719238281, "global_step": 104144, "epoch": 619} {"train_loss": -9.443561553955078, "global_step": 104145, "epoch": 619} {"train_loss": -9.489543914794922, "global_step": 104146, "epoch": 619} {"train_loss": -9.651836395263672, "global_step": 104147, "epoch": 619} {"train_loss": -9.09908676147461, "global_step": 104148, "epoch": 619} {"train_loss": -9.8577241897583, "global_step": 104149, "epoch": 619} {"train_loss": -9.214499473571777, "global_step": 104150, "epoch": 619} {"train_loss": -9.519692420959473, "global_step": 104151, "epoch": 619} {"train_loss": -9.54953384399414, "global_step": 104152, "epoch": 619} {"train_loss": -9.572026252746582, "global_step": 104153, "epoch": 619} {"train_loss": -9.56645679473877, "global_step": 104154, "epoch": 619} {"train_loss": -9.363948822021484, "global_step": 104155, "epoch": 619} {"train_loss": -9.320619583129883, "global_step": 104156, "epoch": 619} {"train_loss": -9.536952018737793, "global_step": 104157, "epoch": 619} {"train_loss": -9.707204818725586, "global_step": 104158, "epoch": 619} {"train_loss": -9.764942918504987, "global_step": 104159, "epoch": 619, "val_loss": 205608.515625} {"train_loss": -9.836477279663086, "global_step": 104160, "epoch": 620} {"train_loss": -9.473031997680664, "global_step": 104161, "epoch": 620} {"train_loss": -9.713094711303711, "global_step": 104162, "epoch": 620} {"train_loss": -9.849040985107422, "global_step": 104163, "epoch": 620} {"train_loss": -9.603341102600098, "global_step": 104164, "epoch": 620} {"train_loss": -9.838014602661133, "global_step": 104165, "epoch": 620} {"train_loss": -9.655893325805664, "global_step": 104166, "epoch": 620} {"train_loss": -9.605366706848145, "global_step": 104167, "epoch": 620} {"train_loss": -9.87048053741455, "global_step": 104168, "epoch": 620} {"train_loss": -9.814559936523438, "global_step": 104169, "epoch": 620} {"train_loss": -9.768935203552246, "global_step": 104170, "epoch": 620} {"train_loss": -9.946723937988281, "global_step": 104171, "epoch": 620} {"train_loss": -9.600260734558105, "global_step": 104172, "epoch": 620} {"train_loss": -10.004793167114258, "global_step": 104173, "epoch": 620} {"train_loss": -9.930233001708984, "global_step": 104174, "epoch": 620} {"train_loss": -9.913209915161133, "global_step": 104175, "epoch": 620} {"train_loss": -10.033872604370117, "global_step": 104176, "epoch": 620} {"train_loss": -9.890130996704102, "global_step": 104177, "epoch": 620} {"train_loss": -9.952722549438477, "global_step": 104178, "epoch": 620} {"train_loss": -9.942916870117188, "global_step": 104179, "epoch": 620} {"train_loss": -9.765426635742188, "global_step": 104180, "epoch": 620} {"train_loss": -10.212478637695312, "global_step": 104181, "epoch": 620} {"train_loss": -10.142984390258789, "global_step": 104182, "epoch": 620} {"train_loss": -10.166229248046875, "global_step": 104183, "epoch": 620} {"train_loss": -9.970002174377441, "global_step": 104184, "epoch": 620} {"train_loss": -10.187955856323242, "global_step": 104185, "epoch": 620} {"train_loss": -10.24073600769043, "global_step": 104186, "epoch": 620} {"train_loss": -9.992462158203125, "global_step": 104187, "epoch": 620} {"train_loss": -10.240341186523438, "global_step": 104188, "epoch": 620} {"train_loss": -10.065764427185059, "global_step": 104189, "epoch": 620} {"train_loss": -9.94286823272705, "global_step": 104190, "epoch": 620} {"train_loss": -10.04938793182373, "global_step": 104191, "epoch": 620} {"train_loss": -10.004493713378906, "global_step": 104192, "epoch": 620} {"train_loss": -10.125286102294922, "global_step": 104193, "epoch": 620} {"train_loss": -10.162079811096191, "global_step": 104194, "epoch": 620} {"train_loss": -10.061145782470703, "global_step": 104195, "epoch": 620} {"train_loss": -10.071792602539062, "global_step": 104196, "epoch": 620} {"train_loss": -10.057302474975586, "global_step": 104197, "epoch": 620} {"train_loss": -9.806215286254883, "global_step": 104198, "epoch": 620} {"train_loss": -10.068893432617188, "global_step": 104199, "epoch": 620} {"train_loss": -10.176994323730469, "global_step": 104200, "epoch": 620} {"train_loss": -9.723775863647461, "global_step": 104201, "epoch": 620} {"train_loss": -9.348791122436523, "global_step": 104202, "epoch": 620} {"train_loss": -9.651988983154297, "global_step": 104203, "epoch": 620} {"train_loss": -9.981391906738281, "global_step": 104204, "epoch": 620} {"train_loss": -9.29813289642334, "global_step": 104205, "epoch": 620} {"train_loss": -9.63673210144043, "global_step": 104206, "epoch": 620} {"train_loss": -9.287822723388672, "global_step": 104207, "epoch": 620} {"train_loss": -9.024295806884766, "global_step": 104208, "epoch": 620} {"train_loss": -8.03878402709961, "global_step": 104209, "epoch": 620} {"train_loss": -8.949136734008789, "global_step": 104210, "epoch": 620} {"train_loss": -7.882451057434082, "global_step": 104211, "epoch": 620} {"train_loss": -9.09160041809082, "global_step": 104212, "epoch": 620} {"train_loss": -8.377750396728516, "global_step": 104213, "epoch": 620} {"train_loss": -8.177245140075684, "global_step": 104214, "epoch": 620} {"train_loss": -8.786913871765137, "global_step": 104215, "epoch": 620} {"train_loss": -8.373808860778809, "global_step": 104216, "epoch": 620} {"train_loss": -8.78445053100586, "global_step": 104217, "epoch": 620} {"train_loss": -9.124581336975098, "global_step": 104218, "epoch": 620} {"train_loss": -9.088578224182129, "global_step": 104219, "epoch": 620} {"train_loss": -9.3064546585083, "global_step": 104220, "epoch": 620} {"train_loss": -9.121467590332031, "global_step": 104221, "epoch": 620} {"train_loss": -9.43081283569336, "global_step": 104222, "epoch": 620} {"train_loss": -9.526557922363281, "global_step": 104223, "epoch": 620} {"train_loss": -9.135330200195312, "global_step": 104224, "epoch": 620} {"train_loss": -9.313089370727539, "global_step": 104225, "epoch": 620} {"train_loss": -9.477148056030273, "global_step": 104226, "epoch": 620} {"train_loss": -9.318275451660156, "global_step": 104227, "epoch": 620} {"train_loss": -9.397454261779785, "global_step": 104228, "epoch": 620} {"train_loss": -9.505087852478027, "global_step": 104229, "epoch": 620} {"train_loss": -9.443477630615234, "global_step": 104230, "epoch": 620} {"train_loss": -9.36393928527832, "global_step": 104231, "epoch": 620} {"train_loss": -9.533502578735352, "global_step": 104232, "epoch": 620} {"train_loss": -9.600576400756836, "global_step": 104233, "epoch": 620} {"train_loss": -9.495498657226562, "global_step": 104234, "epoch": 620} {"train_loss": -9.59353256225586, "global_step": 104235, "epoch": 620} {"train_loss": -9.795811653137207, "global_step": 104236, "epoch": 620} {"train_loss": -9.581610679626465, "global_step": 104237, "epoch": 620} {"train_loss": -9.94880199432373, "global_step": 104238, "epoch": 620} {"train_loss": -9.624412536621094, "global_step": 104239, "epoch": 620} {"train_loss": -9.845169067382812, "global_step": 104240, "epoch": 620} {"train_loss": -9.835561752319336, "global_step": 104241, "epoch": 620} {"train_loss": -9.776725769042969, "global_step": 104242, "epoch": 620} {"train_loss": -9.97153091430664, "global_step": 104243, "epoch": 620} {"train_loss": -10.002178192138672, "global_step": 104244, "epoch": 620} {"train_loss": -9.731270790100098, "global_step": 104245, "epoch": 620} {"train_loss": -9.80695915222168, "global_step": 104246, "epoch": 620} {"train_loss": -9.851396560668945, "global_step": 104247, "epoch": 620} {"train_loss": -9.994848251342773, "global_step": 104248, "epoch": 620} {"train_loss": -9.695326805114746, "global_step": 104249, "epoch": 620} {"train_loss": -9.870153427124023, "global_step": 104250, "epoch": 620} {"train_loss": -9.657073974609375, "global_step": 104251, "epoch": 620} {"train_loss": -9.920059204101562, "global_step": 104252, "epoch": 620} {"train_loss": -9.96657943725586, "global_step": 104253, "epoch": 620} {"train_loss": -9.565774917602539, "global_step": 104254, "epoch": 620} {"train_loss": -9.7455472946167, "global_step": 104255, "epoch": 620} {"train_loss": -10.043319702148438, "global_step": 104256, "epoch": 620} {"train_loss": -9.869112968444824, "global_step": 104257, "epoch": 620} {"train_loss": -9.879796028137207, "global_step": 104258, "epoch": 620} {"train_loss": -9.983511924743652, "global_step": 104259, "epoch": 620} {"train_loss": -10.043440818786621, "global_step": 104260, "epoch": 620} {"train_loss": -9.938636779785156, "global_step": 104261, "epoch": 620} {"train_loss": -9.803378105163574, "global_step": 104262, "epoch": 620} {"train_loss": -9.86777400970459, "global_step": 104263, "epoch": 620} {"train_loss": -9.815589904785156, "global_step": 104264, "epoch": 620} {"train_loss": -9.881620407104492, "global_step": 104265, "epoch": 620} {"train_loss": -9.914663314819336, "global_step": 104266, "epoch": 620} {"train_loss": -9.928529739379883, "global_step": 104267, "epoch": 620} {"train_loss": -9.592592239379883, "global_step": 104268, "epoch": 620} {"train_loss": -9.80553913116455, "global_step": 104269, "epoch": 620} {"train_loss": -9.315388679504395, "global_step": 104270, "epoch": 620} {"train_loss": -10.016395568847656, "global_step": 104271, "epoch": 620} {"train_loss": -9.597684860229492, "global_step": 104272, "epoch": 620} {"train_loss": -10.005428314208984, "global_step": 104273, "epoch": 620} {"train_loss": -9.685976028442383, "global_step": 104274, "epoch": 620} {"train_loss": -9.597881317138672, "global_step": 104275, "epoch": 620} {"train_loss": -9.829193115234375, "global_step": 104276, "epoch": 620} {"train_loss": -9.934048652648926, "global_step": 104277, "epoch": 620} {"train_loss": -9.894564628601074, "global_step": 104278, "epoch": 620} {"train_loss": -9.678430557250977, "global_step": 104279, "epoch": 620} {"train_loss": -10.058282852172852, "global_step": 104280, "epoch": 620} {"train_loss": -9.860854148864746, "global_step": 104281, "epoch": 620} {"train_loss": -9.91351318359375, "global_step": 104282, "epoch": 620} {"train_loss": -9.398423194885254, "global_step": 104283, "epoch": 620} {"train_loss": -9.721172332763672, "global_step": 104284, "epoch": 620} {"train_loss": -9.546854019165039, "global_step": 104285, "epoch": 620} {"train_loss": -8.926551818847656, "global_step": 104286, "epoch": 620} {"train_loss": -9.885229110717773, "global_step": 104287, "epoch": 620} {"train_loss": -9.50255298614502, "global_step": 104288, "epoch": 620} {"train_loss": -9.486251831054688, "global_step": 104289, "epoch": 620} {"train_loss": -9.69620132446289, "global_step": 104290, "epoch": 620} {"train_loss": -9.470526695251465, "global_step": 104291, "epoch": 620} {"train_loss": -9.766831398010254, "global_step": 104292, "epoch": 620} {"train_loss": -9.499964714050293, "global_step": 104293, "epoch": 620} {"train_loss": -9.79104995727539, "global_step": 104294, "epoch": 620} {"train_loss": -9.727773666381836, "global_step": 104295, "epoch": 620} {"train_loss": -9.65460205078125, "global_step": 104296, "epoch": 620} {"train_loss": -9.60605525970459, "global_step": 104297, "epoch": 620} {"train_loss": -9.824390411376953, "global_step": 104298, "epoch": 620} {"train_loss": -9.814406394958496, "global_step": 104299, "epoch": 620} {"train_loss": -9.842243194580078, "global_step": 104300, "epoch": 620} {"train_loss": -9.753913879394531, "global_step": 104301, "epoch": 620} {"train_loss": -9.837616920471191, "global_step": 104302, "epoch": 620} {"train_loss": -9.854525566101074, "global_step": 104303, "epoch": 620} {"train_loss": -9.803976058959961, "global_step": 104304, "epoch": 620} {"train_loss": -9.869729042053223, "global_step": 104305, "epoch": 620} {"train_loss": -10.002155303955078, "global_step": 104306, "epoch": 620} {"train_loss": -9.768054962158203, "global_step": 104307, "epoch": 620} {"train_loss": -9.864645004272461, "global_step": 104308, "epoch": 620} {"train_loss": -10.053544998168945, "global_step": 104309, "epoch": 620} {"train_loss": -9.94906234741211, "global_step": 104310, "epoch": 620} {"train_loss": -10.114748001098633, "global_step": 104311, "epoch": 620} {"train_loss": -9.951006889343262, "global_step": 104312, "epoch": 620} {"train_loss": -10.046810150146484, "global_step": 104313, "epoch": 620} {"train_loss": -10.145331382751465, "global_step": 104314, "epoch": 620} {"train_loss": -9.913910865783691, "global_step": 104315, "epoch": 620} {"train_loss": -10.006484031677246, "global_step": 104316, "epoch": 620} {"train_loss": -9.995562553405762, "global_step": 104317, "epoch": 620} {"train_loss": -10.049628257751465, "global_step": 104318, "epoch": 620} {"train_loss": -9.943443298339844, "global_step": 104319, "epoch": 620} {"train_loss": -10.213227272033691, "global_step": 104320, "epoch": 620} {"train_loss": -9.952004432678223, "global_step": 104321, "epoch": 620} {"train_loss": -9.951070785522461, "global_step": 104322, "epoch": 620} {"train_loss": -9.979059219360352, "global_step": 104323, "epoch": 620} {"train_loss": -9.971540451049805, "global_step": 104324, "epoch": 620} {"train_loss": -10.31140422821045, "global_step": 104325, "epoch": 620} {"train_loss": -9.852227210998535, "global_step": 104326, "epoch": 620} {"train_loss": -9.719905296961466, "global_step": 104327, "epoch": 620, "val_loss": 208587.75, "train_action_mse_error": 6.585391521453857} {"train_loss": -9.384442329406738, "global_step": 104328, "epoch": 621} {"train_loss": -9.938066482543945, "global_step": 104329, "epoch": 621} {"train_loss": -9.32707405090332, "global_step": 104330, "epoch": 621} {"train_loss": -9.468073844909668, "global_step": 104331, "epoch": 621} {"train_loss": -9.647558212280273, "global_step": 104332, "epoch": 621} {"train_loss": -9.226326942443848, "global_step": 104333, "epoch": 621} {"train_loss": -9.674723625183105, "global_step": 104334, "epoch": 621} {"train_loss": -9.195775985717773, "global_step": 104335, "epoch": 621} {"train_loss": -9.508956909179688, "global_step": 104336, "epoch": 621} {"train_loss": -9.54637336730957, "global_step": 104337, "epoch": 621} {"train_loss": -9.24046516418457, "global_step": 104338, "epoch": 621} {"train_loss": -9.580923080444336, "global_step": 104339, "epoch": 621} {"train_loss": -9.67297649383545, "global_step": 104340, "epoch": 621} {"train_loss": -9.162971496582031, "global_step": 104341, "epoch": 621} {"train_loss": -9.318077087402344, "global_step": 104342, "epoch": 621} {"train_loss": -9.42422866821289, "global_step": 104343, "epoch": 621} {"train_loss": -9.441587448120117, "global_step": 104344, "epoch": 621} {"train_loss": -9.333086013793945, "global_step": 104345, "epoch": 621} {"train_loss": -9.523160934448242, "global_step": 104346, "epoch": 621} {"train_loss": -9.387998580932617, "global_step": 104347, "epoch": 621} {"train_loss": -9.314620971679688, "global_step": 104348, "epoch": 621} {"train_loss": -9.444278717041016, "global_step": 104349, "epoch": 621} {"train_loss": -9.546485900878906, "global_step": 104350, "epoch": 621} {"train_loss": -9.310235023498535, "global_step": 104351, "epoch": 621} {"train_loss": -9.19786262512207, "global_step": 104352, "epoch": 621} {"train_loss": -9.508705139160156, "global_step": 104353, "epoch": 621} {"train_loss": -9.010160446166992, "global_step": 104354, "epoch": 621} {"train_loss": -9.584300994873047, "global_step": 104355, "epoch": 621} {"train_loss": -9.375320434570312, "global_step": 104356, "epoch": 621} {"train_loss": -9.611392974853516, "global_step": 104357, "epoch": 621} {"train_loss": -9.535688400268555, "global_step": 104358, "epoch": 621} {"train_loss": -9.392742156982422, "global_step": 104359, "epoch": 621} {"train_loss": -9.720345497131348, "global_step": 104360, "epoch": 621} {"train_loss": -9.125722885131836, "global_step": 104361, "epoch": 621} {"train_loss": -9.302882194519043, "global_step": 104362, "epoch": 621} {"train_loss": -9.233721733093262, "global_step": 104363, "epoch": 621} {"train_loss": -9.600212097167969, "global_step": 104364, "epoch": 621} {"train_loss": -9.50898551940918, "global_step": 104365, "epoch": 621} {"train_loss": -9.71385669708252, "global_step": 104366, "epoch": 621} {"train_loss": -9.904753684997559, "global_step": 104367, "epoch": 621} {"train_loss": -9.771960258483887, "global_step": 104368, "epoch": 621} {"train_loss": -9.622024536132812, "global_step": 104369, "epoch": 621} {"train_loss": -9.879756927490234, "global_step": 104370, "epoch": 621} {"train_loss": -9.571307182312012, "global_step": 104371, "epoch": 621} {"train_loss": -9.66221809387207, "global_step": 104372, "epoch": 621} {"train_loss": -9.899435043334961, "global_step": 104373, "epoch": 621} {"train_loss": -9.824398040771484, "global_step": 104374, "epoch": 621} {"train_loss": -9.844058990478516, "global_step": 104375, "epoch": 621} {"train_loss": -9.922243118286133, "global_step": 104376, "epoch": 621} {"train_loss": -9.971465110778809, "global_step": 104377, "epoch": 621} {"train_loss": -9.793298721313477, "global_step": 104378, "epoch": 621} {"train_loss": -10.098869323730469, "global_step": 104379, "epoch": 621} {"train_loss": -9.903966903686523, "global_step": 104380, "epoch": 621} {"train_loss": -9.85711669921875, "global_step": 104381, "epoch": 621} {"train_loss": -9.912322998046875, "global_step": 104382, "epoch": 621} {"train_loss": -9.978608131408691, "global_step": 104383, "epoch": 621} {"train_loss": -10.025654792785645, "global_step": 104384, "epoch": 621} {"train_loss": -9.685128211975098, "global_step": 104385, "epoch": 621} {"train_loss": -9.395990371704102, "global_step": 104386, "epoch": 621} {"train_loss": -9.65894603729248, "global_step": 104387, "epoch": 621} {"train_loss": -9.609378814697266, "global_step": 104388, "epoch": 621} {"train_loss": -8.961358070373535, "global_step": 104389, "epoch": 621} {"train_loss": -9.344412803649902, "global_step": 104390, "epoch": 621} {"train_loss": -9.873634338378906, "global_step": 104391, "epoch": 621} {"train_loss": -9.875716209411621, "global_step": 104392, "epoch": 621} {"train_loss": -9.590917587280273, "global_step": 104393, "epoch": 621} {"train_loss": -9.883834838867188, "global_step": 104394, "epoch": 621} {"train_loss": -9.846017837524414, "global_step": 104395, "epoch": 621} {"train_loss": -9.86062240600586, "global_step": 104396, "epoch": 621} {"train_loss": -9.851678848266602, "global_step": 104397, "epoch": 621} {"train_loss": -9.50759506225586, "global_step": 104398, "epoch": 621} {"train_loss": -9.833858489990234, "global_step": 104399, "epoch": 621} {"train_loss": -9.711288452148438, "global_step": 104400, "epoch": 621} {"train_loss": -9.75694465637207, "global_step": 104401, "epoch": 621} {"train_loss": -9.819986343383789, "global_step": 104402, "epoch": 621} {"train_loss": -9.744427680969238, "global_step": 104403, "epoch": 621} {"train_loss": -9.865514755249023, "global_step": 104404, "epoch": 621} {"train_loss": -9.764325141906738, "global_step": 104405, "epoch": 621} {"train_loss": -9.352272033691406, "global_step": 104406, "epoch": 621} {"train_loss": -9.646493911743164, "global_step": 104407, "epoch": 621} {"train_loss": -10.00566291809082, "global_step": 104408, "epoch": 621} {"train_loss": -9.490650177001953, "global_step": 104409, "epoch": 621} {"train_loss": -9.946511268615723, "global_step": 104410, "epoch": 621} {"train_loss": -9.664011001586914, "global_step": 104411, "epoch": 621} {"train_loss": -9.795449256896973, "global_step": 104412, "epoch": 621} {"train_loss": -9.610148429870605, "global_step": 104413, "epoch": 621} {"train_loss": -9.76689338684082, "global_step": 104414, "epoch": 621} {"train_loss": -9.740036010742188, "global_step": 104415, "epoch": 621} {"train_loss": -9.60885238647461, "global_step": 104416, "epoch": 621} {"train_loss": -9.580026626586914, "global_step": 104417, "epoch": 621} {"train_loss": -9.895058631896973, "global_step": 104418, "epoch": 621} {"train_loss": -9.640759468078613, "global_step": 104419, "epoch": 621} {"train_loss": -9.961915969848633, "global_step": 104420, "epoch": 621} {"train_loss": -9.645584106445312, "global_step": 104421, "epoch": 621} {"train_loss": -9.791847229003906, "global_step": 104422, "epoch": 621} {"train_loss": -9.899762153625488, "global_step": 104423, "epoch": 621} {"train_loss": -9.59941577911377, "global_step": 104424, "epoch": 621} {"train_loss": -9.854312896728516, "global_step": 104425, "epoch": 621} {"train_loss": -9.770450592041016, "global_step": 104426, "epoch": 621} {"train_loss": -9.739154815673828, "global_step": 104427, "epoch": 621} {"train_loss": -9.831647872924805, "global_step": 104428, "epoch": 621} {"train_loss": -9.843217849731445, "global_step": 104429, "epoch": 621} {"train_loss": -9.85276985168457, "global_step": 104430, "epoch": 621} {"train_loss": -10.107963562011719, "global_step": 104431, "epoch": 621} {"train_loss": -9.856603622436523, "global_step": 104432, "epoch": 621} {"train_loss": -9.77640151977539, "global_step": 104433, "epoch": 621} {"train_loss": -9.946406364440918, "global_step": 104434, "epoch": 621} {"train_loss": -10.062362670898438, "global_step": 104435, "epoch": 621} {"train_loss": -9.730555534362793, "global_step": 104436, "epoch": 621} {"train_loss": -10.095518112182617, "global_step": 104437, "epoch": 621} {"train_loss": -9.736175537109375, "global_step": 104438, "epoch": 621} {"train_loss": -10.055391311645508, "global_step": 104439, "epoch": 621} {"train_loss": -9.827590942382812, "global_step": 104440, "epoch": 621} {"train_loss": -9.640861511230469, "global_step": 104441, "epoch": 621} {"train_loss": -10.023213386535645, "global_step": 104442, "epoch": 621} {"train_loss": -9.583230972290039, "global_step": 104443, "epoch": 621} {"train_loss": -9.741043090820312, "global_step": 104444, "epoch": 621} {"train_loss": -9.368474006652832, "global_step": 104445, "epoch": 621} {"train_loss": -9.611948013305664, "global_step": 104446, "epoch": 621} {"train_loss": -9.717889785766602, "global_step": 104447, "epoch": 621} {"train_loss": -9.643345832824707, "global_step": 104448, "epoch": 621} {"train_loss": -9.490071296691895, "global_step": 104449, "epoch": 621} {"train_loss": -9.678451538085938, "global_step": 104450, "epoch": 621} {"train_loss": -9.64454460144043, "global_step": 104451, "epoch": 621} {"train_loss": -9.656902313232422, "global_step": 104452, "epoch": 621} {"train_loss": -9.25347900390625, "global_step": 104453, "epoch": 621} {"train_loss": -9.785686492919922, "global_step": 104454, "epoch": 621} {"train_loss": -9.371770858764648, "global_step": 104455, "epoch": 621} {"train_loss": -9.784062385559082, "global_step": 104456, "epoch": 621} {"train_loss": -9.705667495727539, "global_step": 104457, "epoch": 621} {"train_loss": -9.689796447753906, "global_step": 104458, "epoch": 621} {"train_loss": -9.513814926147461, "global_step": 104459, "epoch": 621} {"train_loss": -9.8632230758667, "global_step": 104460, "epoch": 621} {"train_loss": -9.627571105957031, "global_step": 104461, "epoch": 621} {"train_loss": -9.76427173614502, "global_step": 104462, "epoch": 621} {"train_loss": -9.648435592651367, "global_step": 104463, "epoch": 621} {"train_loss": -9.756237030029297, "global_step": 104464, "epoch": 621} {"train_loss": -9.643659591674805, "global_step": 104465, "epoch": 621} {"train_loss": -9.735506057739258, "global_step": 104466, "epoch": 621} {"train_loss": -9.913579940795898, "global_step": 104467, "epoch": 621} {"train_loss": -9.596919059753418, "global_step": 104468, "epoch": 621} {"train_loss": -9.713977813720703, "global_step": 104469, "epoch": 621} {"train_loss": -9.54332160949707, "global_step": 104470, "epoch": 621} {"train_loss": -9.96799087524414, "global_step": 104471, "epoch": 621} {"train_loss": -9.542801856994629, "global_step": 104472, "epoch": 621} {"train_loss": -9.896848678588867, "global_step": 104473, "epoch": 621} {"train_loss": -9.800727844238281, "global_step": 104474, "epoch": 621} {"train_loss": -9.982622146606445, "global_step": 104475, "epoch": 621} {"train_loss": -9.78565502166748, "global_step": 104476, "epoch": 621} {"train_loss": -9.6934175491333, "global_step": 104477, "epoch": 621} {"train_loss": -9.6629638671875, "global_step": 104478, "epoch": 621} {"train_loss": -9.629895210266113, "global_step": 104479, "epoch": 621} {"train_loss": -9.642072677612305, "global_step": 104480, "epoch": 621} {"train_loss": -9.678045272827148, "global_step": 104481, "epoch": 621} {"train_loss": -9.932928085327148, "global_step": 104482, "epoch": 621} {"train_loss": -9.655180931091309, "global_step": 104483, "epoch": 621} {"train_loss": -9.901670455932617, "global_step": 104484, "epoch": 621} {"train_loss": -9.543449401855469, "global_step": 104485, "epoch": 621} {"train_loss": -9.743768692016602, "global_step": 104486, "epoch": 621} {"train_loss": -9.469942092895508, "global_step": 104487, "epoch": 621} {"train_loss": -9.912179946899414, "global_step": 104488, "epoch": 621} {"train_loss": -9.702415466308594, "global_step": 104489, "epoch": 621} {"train_loss": -9.841776847839355, "global_step": 104490, "epoch": 621} {"train_loss": -9.697075843811035, "global_step": 104491, "epoch": 621} {"train_loss": -9.685256958007812, "global_step": 104492, "epoch": 621} {"train_loss": -9.422176361083984, "global_step": 104493, "epoch": 621} {"train_loss": -9.861287117004395, "global_step": 104494, "epoch": 621} {"train_loss": -9.669516007105509, "global_step": 104495, "epoch": 621, "val_loss": 208819.578125} {"train_loss": -9.624124526977539, "global_step": 104496, "epoch": 622} {"train_loss": -9.83018684387207, "global_step": 104497, "epoch": 622} {"train_loss": -9.597732543945312, "global_step": 104498, "epoch": 622} {"train_loss": -9.753180503845215, "global_step": 104499, "epoch": 622} {"train_loss": -9.426925659179688, "global_step": 104500, "epoch": 622} {"train_loss": -9.643576622009277, "global_step": 104501, "epoch": 622} {"train_loss": -9.581546783447266, "global_step": 104502, "epoch": 622} {"train_loss": -9.944427490234375, "global_step": 104503, "epoch": 622} {"train_loss": -9.70826530456543, "global_step": 104504, "epoch": 622} {"train_loss": -9.866156578063965, "global_step": 104505, "epoch": 622} {"train_loss": -9.729524612426758, "global_step": 104506, "epoch": 622} {"train_loss": -9.793603897094727, "global_step": 104507, "epoch": 622} {"train_loss": -10.024224281311035, "global_step": 104508, "epoch": 622} {"train_loss": -10.190001487731934, "global_step": 104509, "epoch": 622} {"train_loss": -9.916633605957031, "global_step": 104510, "epoch": 622} {"train_loss": -9.908658027648926, "global_step": 104511, "epoch": 622} {"train_loss": -9.989448547363281, "global_step": 104512, "epoch": 622} {"train_loss": -9.829458236694336, "global_step": 104513, "epoch": 622} {"train_loss": -9.777522087097168, "global_step": 104514, "epoch": 622} {"train_loss": -9.984949111938477, "global_step": 104515, "epoch": 622} {"train_loss": -9.415606498718262, "global_step": 104516, "epoch": 622} {"train_loss": -10.033302307128906, "global_step": 104517, "epoch": 622} {"train_loss": -9.537630081176758, "global_step": 104518, "epoch": 622} {"train_loss": -9.35063362121582, "global_step": 104519, "epoch": 622} {"train_loss": -9.786636352539062, "global_step": 104520, "epoch": 622} {"train_loss": -9.348093032836914, "global_step": 104521, "epoch": 622} {"train_loss": -9.514719009399414, "global_step": 104522, "epoch": 622} {"train_loss": -9.596110343933105, "global_step": 104523, "epoch": 622} {"train_loss": -9.559497833251953, "global_step": 104524, "epoch": 622} {"train_loss": -9.708039283752441, "global_step": 104525, "epoch": 622} {"train_loss": -9.71689224243164, "global_step": 104526, "epoch": 622} {"train_loss": -9.724111557006836, "global_step": 104527, "epoch": 622} {"train_loss": -9.851774215698242, "global_step": 104528, "epoch": 622} {"train_loss": -9.986648559570312, "global_step": 104529, "epoch": 622} {"train_loss": -9.240524291992188, "global_step": 104530, "epoch": 622} {"train_loss": -9.900699615478516, "global_step": 104531, "epoch": 622} {"train_loss": -9.633512496948242, "global_step": 104532, "epoch": 622} {"train_loss": -9.926811218261719, "global_step": 104533, "epoch": 622} {"train_loss": -9.300179481506348, "global_step": 104534, "epoch": 622} {"train_loss": -9.69894790649414, "global_step": 104535, "epoch": 622} {"train_loss": -9.747822761535645, "global_step": 104536, "epoch": 622} {"train_loss": -9.73090934753418, "global_step": 104537, "epoch": 622} {"train_loss": -9.736483573913574, "global_step": 104538, "epoch": 622} {"train_loss": -9.812311172485352, "global_step": 104539, "epoch": 622} {"train_loss": -9.848670959472656, "global_step": 104540, "epoch": 622} {"train_loss": -9.842007637023926, "global_step": 104541, "epoch": 622} {"train_loss": -9.785896301269531, "global_step": 104542, "epoch": 622} {"train_loss": -9.957277297973633, "global_step": 104543, "epoch": 622} {"train_loss": -9.82120132446289, "global_step": 104544, "epoch": 622} {"train_loss": -10.004327774047852, "global_step": 104545, "epoch": 622} {"train_loss": -10.091315269470215, "global_step": 104546, "epoch": 622} {"train_loss": -10.022737503051758, "global_step": 104547, "epoch": 622} {"train_loss": -9.83993148803711, "global_step": 104548, "epoch": 622} {"train_loss": -9.881673812866211, "global_step": 104549, "epoch": 622} {"train_loss": -9.715087890625, "global_step": 104550, "epoch": 622} {"train_loss": -9.931716918945312, "global_step": 104551, "epoch": 622} {"train_loss": -10.02785873413086, "global_step": 104552, "epoch": 622} {"train_loss": -10.09384536743164, "global_step": 104553, "epoch": 622} {"train_loss": -9.94479751586914, "global_step": 104554, "epoch": 622} {"train_loss": -9.950155258178711, "global_step": 104555, "epoch": 622} {"train_loss": -9.936785697937012, "global_step": 104556, "epoch": 622} {"train_loss": -9.665542602539062, "global_step": 104557, "epoch": 622} {"train_loss": -10.011457443237305, "global_step": 104558, "epoch": 622} {"train_loss": -9.372353553771973, "global_step": 104559, "epoch": 622} {"train_loss": -9.728011131286621, "global_step": 104560, "epoch": 622} {"train_loss": -9.606285095214844, "global_step": 104561, "epoch": 622} {"train_loss": -10.176494598388672, "global_step": 104562, "epoch": 622} {"train_loss": -9.068500518798828, "global_step": 104563, "epoch": 622} {"train_loss": -9.82119083404541, "global_step": 104564, "epoch": 622} {"train_loss": -9.50582504272461, "global_step": 104565, "epoch": 622} {"train_loss": -10.021270751953125, "global_step": 104566, "epoch": 622} {"train_loss": -9.835426330566406, "global_step": 104567, "epoch": 622} {"train_loss": -9.812797546386719, "global_step": 104568, "epoch": 622} {"train_loss": -9.856740951538086, "global_step": 104569, "epoch": 622} {"train_loss": -9.836709022521973, "global_step": 104570, "epoch": 622} {"train_loss": -9.83824348449707, "global_step": 104571, "epoch": 622} {"train_loss": -9.786577224731445, "global_step": 104572, "epoch": 622} {"train_loss": -10.199116706848145, "global_step": 104573, "epoch": 622} {"train_loss": -9.28476333618164, "global_step": 104574, "epoch": 622} {"train_loss": -9.714599609375, "global_step": 104575, "epoch": 622} {"train_loss": -8.96365737915039, "global_step": 104576, "epoch": 622} {"train_loss": -9.834710121154785, "global_step": 104577, "epoch": 622} {"train_loss": -9.604593276977539, "global_step": 104578, "epoch": 622} {"train_loss": -9.679131507873535, "global_step": 104579, "epoch": 622} {"train_loss": -9.198923110961914, "global_step": 104580, "epoch": 622} {"train_loss": -9.495460510253906, "global_step": 104581, "epoch": 622} {"train_loss": -9.704951286315918, "global_step": 104582, "epoch": 622} {"train_loss": -9.487825393676758, "global_step": 104583, "epoch": 622} {"train_loss": -9.442194938659668, "global_step": 104584, "epoch": 622} {"train_loss": -9.605830192565918, "global_step": 104585, "epoch": 622} {"train_loss": -9.499971389770508, "global_step": 104586, "epoch": 622} {"train_loss": -9.752941131591797, "global_step": 104587, "epoch": 622} {"train_loss": -9.810041427612305, "global_step": 104588, "epoch": 622} {"train_loss": -9.622396469116211, "global_step": 104589, "epoch": 622} {"train_loss": -9.787752151489258, "global_step": 104590, "epoch": 622} {"train_loss": -9.89373779296875, "global_step": 104591, "epoch": 622} {"train_loss": -9.849246978759766, "global_step": 104592, "epoch": 622} {"train_loss": -9.856215476989746, "global_step": 104593, "epoch": 622} {"train_loss": -9.846399307250977, "global_step": 104594, "epoch": 622} {"train_loss": -9.989153861999512, "global_step": 104595, "epoch": 622} {"train_loss": -9.889552116394043, "global_step": 104596, "epoch": 622} {"train_loss": -9.847256660461426, "global_step": 104597, "epoch": 622} {"train_loss": -9.881195068359375, "global_step": 104598, "epoch": 622} {"train_loss": -10.114034652709961, "global_step": 104599, "epoch": 622} {"train_loss": -10.07028865814209, "global_step": 104600, "epoch": 622} {"train_loss": -9.957368850708008, "global_step": 104601, "epoch": 622} {"train_loss": -9.869638442993164, "global_step": 104602, "epoch": 622} {"train_loss": -10.062782287597656, "global_step": 104603, "epoch": 622} {"train_loss": -10.091534614562988, "global_step": 104604, "epoch": 622} {"train_loss": -9.864667892456055, "global_step": 104605, "epoch": 622} {"train_loss": -9.931089401245117, "global_step": 104606, "epoch": 622} {"train_loss": -10.064253807067871, "global_step": 104607, "epoch": 622} {"train_loss": -9.804983139038086, "global_step": 104608, "epoch": 622} {"train_loss": -9.796708106994629, "global_step": 104609, "epoch": 622} {"train_loss": -10.025467872619629, "global_step": 104610, "epoch": 622} {"train_loss": -9.919280052185059, "global_step": 104611, "epoch": 622} {"train_loss": -10.019340515136719, "global_step": 104612, "epoch": 622} {"train_loss": -9.99398422241211, "global_step": 104613, "epoch": 622} {"train_loss": -10.076964378356934, "global_step": 104614, "epoch": 622} {"train_loss": -9.903181076049805, "global_step": 104615, "epoch": 622} {"train_loss": -9.94156265258789, "global_step": 104616, "epoch": 622} {"train_loss": -9.806221008300781, "global_step": 104617, "epoch": 622} {"train_loss": -9.864029884338379, "global_step": 104618, "epoch": 622} {"train_loss": -10.084699630737305, "global_step": 104619, "epoch": 622} {"train_loss": -9.685394287109375, "global_step": 104620, "epoch": 622} {"train_loss": -9.736360549926758, "global_step": 104621, "epoch": 622} {"train_loss": -9.895049095153809, "global_step": 104622, "epoch": 622} {"train_loss": -10.02761173248291, "global_step": 104623, "epoch": 622} {"train_loss": -9.97041130065918, "global_step": 104624, "epoch": 622} {"train_loss": -9.765176773071289, "global_step": 104625, "epoch": 622} {"train_loss": -9.86411190032959, "global_step": 104626, "epoch": 622} {"train_loss": -9.94284439086914, "global_step": 104627, "epoch": 622} {"train_loss": -9.84469985961914, "global_step": 104628, "epoch": 622} {"train_loss": -9.957571029663086, "global_step": 104629, "epoch": 622} {"train_loss": -9.542374610900879, "global_step": 104630, "epoch": 622} {"train_loss": -9.802427291870117, "global_step": 104631, "epoch": 622} {"train_loss": -9.3189115524292, "global_step": 104632, "epoch": 622} {"train_loss": -9.681897163391113, "global_step": 104633, "epoch": 622} {"train_loss": -10.018556594848633, "global_step": 104634, "epoch": 622} {"train_loss": -9.576931953430176, "global_step": 104635, "epoch": 622} {"train_loss": -9.700582504272461, "global_step": 104636, "epoch": 622} {"train_loss": -9.80887222290039, "global_step": 104637, "epoch": 622} {"train_loss": -9.514963150024414, "global_step": 104638, "epoch": 622} {"train_loss": -9.757854461669922, "global_step": 104639, "epoch": 622} {"train_loss": -9.639408111572266, "global_step": 104640, "epoch": 622} {"train_loss": -9.467260360717773, "global_step": 104641, "epoch": 622} {"train_loss": -9.490653991699219, "global_step": 104642, "epoch": 622} {"train_loss": -9.280119895935059, "global_step": 104643, "epoch": 622} {"train_loss": -9.679510116577148, "global_step": 104644, "epoch": 622} {"train_loss": -9.640796661376953, "global_step": 104645, "epoch": 622} {"train_loss": -9.890702247619629, "global_step": 104646, "epoch": 622} {"train_loss": -9.310894966125488, "global_step": 104647, "epoch": 622} {"train_loss": -9.921907424926758, "global_step": 104648, "epoch": 622} {"train_loss": -9.38749885559082, "global_step": 104649, "epoch": 622} {"train_loss": -9.80970287322998, "global_step": 104650, "epoch": 622} {"train_loss": -9.37171459197998, "global_step": 104651, "epoch": 622} {"train_loss": -9.771726608276367, "global_step": 104652, "epoch": 622} {"train_loss": -9.898415565490723, "global_step": 104653, "epoch": 622} {"train_loss": -9.70399284362793, "global_step": 104654, "epoch": 622} {"train_loss": -9.66847038269043, "global_step": 104655, "epoch": 622} {"train_loss": -9.832052230834961, "global_step": 104656, "epoch": 622} {"train_loss": -9.390228271484375, "global_step": 104657, "epoch": 622} {"train_loss": -9.551295280456543, "global_step": 104658, "epoch": 622} {"train_loss": -9.858081817626953, "global_step": 104659, "epoch": 622} {"train_loss": -9.57819652557373, "global_step": 104660, "epoch": 622} {"train_loss": -9.840827941894531, "global_step": 104661, "epoch": 622} {"train_loss": -9.379537582397461, "global_step": 104662, "epoch": 622} {"train_loss": -9.761865059534708, "global_step": 104663, "epoch": 622, "val_loss": 211070.234375} {"train_loss": -9.524070739746094, "global_step": 104664, "epoch": 623} {"train_loss": -9.660429954528809, "global_step": 104665, "epoch": 623} {"train_loss": -9.413604736328125, "global_step": 104666, "epoch": 623} {"train_loss": -9.75070571899414, "global_step": 104667, "epoch": 623} {"train_loss": -9.540752410888672, "global_step": 104668, "epoch": 623} {"train_loss": -9.618733406066895, "global_step": 104669, "epoch": 623} {"train_loss": -9.501757621765137, "global_step": 104670, "epoch": 623} {"train_loss": -9.474784851074219, "global_step": 104671, "epoch": 623} {"train_loss": -9.892791748046875, "global_step": 104672, "epoch": 623} {"train_loss": -9.798822402954102, "global_step": 104673, "epoch": 623} {"train_loss": -9.50505256652832, "global_step": 104674, "epoch": 623} {"train_loss": -9.596028327941895, "global_step": 104675, "epoch": 623} {"train_loss": -9.992586135864258, "global_step": 104676, "epoch": 623} {"train_loss": -9.63755989074707, "global_step": 104677, "epoch": 623} {"train_loss": -9.569327354431152, "global_step": 104678, "epoch": 623} {"train_loss": -10.035076141357422, "global_step": 104679, "epoch": 623} {"train_loss": -9.723796844482422, "global_step": 104680, "epoch": 623} {"train_loss": -9.897872924804688, "global_step": 104681, "epoch": 623} {"train_loss": -9.863542556762695, "global_step": 104682, "epoch": 623} {"train_loss": -9.961698532104492, "global_step": 104683, "epoch": 623} {"train_loss": -9.79627799987793, "global_step": 104684, "epoch": 623} {"train_loss": -9.576132774353027, "global_step": 104685, "epoch": 623} {"train_loss": -9.785099983215332, "global_step": 104686, "epoch": 623} {"train_loss": -9.856201171875, "global_step": 104687, "epoch": 623} {"train_loss": -9.79315185546875, "global_step": 104688, "epoch": 623} {"train_loss": -9.927533149719238, "global_step": 104689, "epoch": 623} {"train_loss": -9.663942337036133, "global_step": 104690, "epoch": 623} {"train_loss": -9.879720687866211, "global_step": 104691, "epoch": 623} {"train_loss": -9.558853149414062, "global_step": 104692, "epoch": 623} {"train_loss": -9.64116096496582, "global_step": 104693, "epoch": 623} {"train_loss": -9.730117797851562, "global_step": 104694, "epoch": 623} {"train_loss": -9.764394760131836, "global_step": 104695, "epoch": 623} {"train_loss": -9.538236618041992, "global_step": 104696, "epoch": 623} {"train_loss": -9.648419380187988, "global_step": 104697, "epoch": 623} {"train_loss": -9.957662582397461, "global_step": 104698, "epoch": 623} {"train_loss": -9.64820671081543, "global_step": 104699, "epoch": 623} {"train_loss": -9.815844535827637, "global_step": 104700, "epoch": 623} {"train_loss": -9.921439170837402, "global_step": 104701, "epoch": 623} {"train_loss": -9.997735977172852, "global_step": 104702, "epoch": 623} {"train_loss": -9.657927513122559, "global_step": 104703, "epoch": 623} {"train_loss": -9.937081336975098, "global_step": 104704, "epoch": 623} {"train_loss": -9.532144546508789, "global_step": 104705, "epoch": 623} {"train_loss": -9.749871253967285, "global_step": 104706, "epoch": 623} {"train_loss": -9.49775505065918, "global_step": 104707, "epoch": 623} {"train_loss": -9.312176704406738, "global_step": 104708, "epoch": 623} {"train_loss": -9.642885208129883, "global_step": 104709, "epoch": 623} {"train_loss": -9.617393493652344, "global_step": 104710, "epoch": 623} {"train_loss": -9.337240219116211, "global_step": 104711, "epoch": 623} {"train_loss": -9.470100402832031, "global_step": 104712, "epoch": 623} {"train_loss": -9.46011734008789, "global_step": 104713, "epoch": 623} {"train_loss": -8.877388000488281, "global_step": 104714, "epoch": 623} {"train_loss": -9.640851974487305, "global_step": 104715, "epoch": 623} {"train_loss": -9.119186401367188, "global_step": 104716, "epoch": 623} {"train_loss": -9.691764831542969, "global_step": 104717, "epoch": 623} {"train_loss": -9.517309188842773, "global_step": 104718, "epoch": 623} {"train_loss": -9.896724700927734, "global_step": 104719, "epoch": 623} {"train_loss": -9.555185317993164, "global_step": 104720, "epoch": 623} {"train_loss": -9.658053398132324, "global_step": 104721, "epoch": 623} {"train_loss": -9.412403106689453, "global_step": 104722, "epoch": 623} {"train_loss": -9.402950286865234, "global_step": 104723, "epoch": 623} {"train_loss": -9.6790771484375, "global_step": 104724, "epoch": 623} {"train_loss": -9.476751327514648, "global_step": 104725, "epoch": 623} {"train_loss": -9.909902572631836, "global_step": 104726, "epoch": 623} {"train_loss": -9.640380859375, "global_step": 104727, "epoch": 623} {"train_loss": -9.799795150756836, "global_step": 104728, "epoch": 623} {"train_loss": -9.891057968139648, "global_step": 104729, "epoch": 623} {"train_loss": -9.768860816955566, "global_step": 104730, "epoch": 623} {"train_loss": -9.771913528442383, "global_step": 104731, "epoch": 623} {"train_loss": -9.887627601623535, "global_step": 104732, "epoch": 623} {"train_loss": -9.893539428710938, "global_step": 104733, "epoch": 623} {"train_loss": -9.842689514160156, "global_step": 104734, "epoch": 623} {"train_loss": -9.738441467285156, "global_step": 104735, "epoch": 623} {"train_loss": -9.6322660446167, "global_step": 104736, "epoch": 623} {"train_loss": -9.727821350097656, "global_step": 104737, "epoch": 623} {"train_loss": -10.03795337677002, "global_step": 104738, "epoch": 623} {"train_loss": -9.9212646484375, "global_step": 104739, "epoch": 623} {"train_loss": -10.030662536621094, "global_step": 104740, "epoch": 623} {"train_loss": -10.088886260986328, "global_step": 104741, "epoch": 623} {"train_loss": -9.879308700561523, "global_step": 104742, "epoch": 623} {"train_loss": -9.832141876220703, "global_step": 104743, "epoch": 623} {"train_loss": -10.266656875610352, "global_step": 104744, "epoch": 623} {"train_loss": -10.142919540405273, "global_step": 104745, "epoch": 623} {"train_loss": -9.96641731262207, "global_step": 104746, "epoch": 623} {"train_loss": -10.010828018188477, "global_step": 104747, "epoch": 623} {"train_loss": -9.92510986328125, "global_step": 104748, "epoch": 623} {"train_loss": -9.801105499267578, "global_step": 104749, "epoch": 623} {"train_loss": -9.914260864257812, "global_step": 104750, "epoch": 623} {"train_loss": -9.934185028076172, "global_step": 104751, "epoch": 623} {"train_loss": -10.045537948608398, "global_step": 104752, "epoch": 623} {"train_loss": -9.605086326599121, "global_step": 104753, "epoch": 623} {"train_loss": -9.950782775878906, "global_step": 104754, "epoch": 623} {"train_loss": -9.879318237304688, "global_step": 104755, "epoch": 623} {"train_loss": -10.119444847106934, "global_step": 104756, "epoch": 623} {"train_loss": -9.889179229736328, "global_step": 104757, "epoch": 623} {"train_loss": -9.976554870605469, "global_step": 104758, "epoch": 623} {"train_loss": -10.070587158203125, "global_step": 104759, "epoch": 623} {"train_loss": -9.896236419677734, "global_step": 104760, "epoch": 623} {"train_loss": -9.750772476196289, "global_step": 104761, "epoch": 623} {"train_loss": -9.980114936828613, "global_step": 104762, "epoch": 623} {"train_loss": -9.57494068145752, "global_step": 104763, "epoch": 623} {"train_loss": -9.97036361694336, "global_step": 104764, "epoch": 623} {"train_loss": -9.827777862548828, "global_step": 104765, "epoch": 623} {"train_loss": -10.040145874023438, "global_step": 104766, "epoch": 623} {"train_loss": -9.928704261779785, "global_step": 104767, "epoch": 623} {"train_loss": -10.166101455688477, "global_step": 104768, "epoch": 623} {"train_loss": -9.877214431762695, "global_step": 104769, "epoch": 623} {"train_loss": -9.696958541870117, "global_step": 104770, "epoch": 623} {"train_loss": -9.812291145324707, "global_step": 104771, "epoch": 623} {"train_loss": -9.88486099243164, "global_step": 104772, "epoch": 623} {"train_loss": -9.909899711608887, "global_step": 104773, "epoch": 623} {"train_loss": -9.568479537963867, "global_step": 104774, "epoch": 623} {"train_loss": -9.813232421875, "global_step": 104775, "epoch": 623} {"train_loss": -9.498324394226074, "global_step": 104776, "epoch": 623} {"train_loss": -9.831198692321777, "global_step": 104777, "epoch": 623} {"train_loss": -9.986553192138672, "global_step": 104778, "epoch": 623} {"train_loss": -9.40419864654541, "global_step": 104779, "epoch": 623} {"train_loss": -9.950946807861328, "global_step": 104780, "epoch": 623} {"train_loss": -9.588512420654297, "global_step": 104781, "epoch": 623} {"train_loss": -9.84264087677002, "global_step": 104782, "epoch": 623} {"train_loss": -9.624700546264648, "global_step": 104783, "epoch": 623} {"train_loss": -9.581464767456055, "global_step": 104784, "epoch": 623} {"train_loss": -9.617116928100586, "global_step": 104785, "epoch": 623} {"train_loss": -9.695777893066406, "global_step": 104786, "epoch": 623} {"train_loss": -9.671527862548828, "global_step": 104787, "epoch": 623} {"train_loss": -10.034560203552246, "global_step": 104788, "epoch": 623} {"train_loss": -9.491288185119629, "global_step": 104789, "epoch": 623} {"train_loss": -9.729944229125977, "global_step": 104790, "epoch": 623} {"train_loss": -9.846319198608398, "global_step": 104791, "epoch": 623} {"train_loss": -9.627256393432617, "global_step": 104792, "epoch": 623} {"train_loss": -9.747401237487793, "global_step": 104793, "epoch": 623} {"train_loss": -9.75604248046875, "global_step": 104794, "epoch": 623} {"train_loss": -9.585931777954102, "global_step": 104795, "epoch": 623} {"train_loss": -9.763559341430664, "global_step": 104796, "epoch": 623} {"train_loss": -9.622909545898438, "global_step": 104797, "epoch": 623} {"train_loss": -9.956496238708496, "global_step": 104798, "epoch": 623} {"train_loss": -10.038082122802734, "global_step": 104799, "epoch": 623} {"train_loss": -9.874801635742188, "global_step": 104800, "epoch": 623} {"train_loss": -9.779630661010742, "global_step": 104801, "epoch": 623} {"train_loss": -9.89625358581543, "global_step": 104802, "epoch": 623} {"train_loss": -9.911721229553223, "global_step": 104803, "epoch": 623} {"train_loss": -9.916086196899414, "global_step": 104804, "epoch": 623} {"train_loss": -9.911079406738281, "global_step": 104805, "epoch": 623} {"train_loss": -9.859807968139648, "global_step": 104806, "epoch": 623} {"train_loss": -9.966434478759766, "global_step": 104807, "epoch": 623} {"train_loss": -9.757123947143555, "global_step": 104808, "epoch": 623} {"train_loss": -9.718484878540039, "global_step": 104809, "epoch": 623} {"train_loss": -10.020195960998535, "global_step": 104810, "epoch": 623} {"train_loss": -9.572062492370605, "global_step": 104811, "epoch": 623} {"train_loss": -9.965072631835938, "global_step": 104812, "epoch": 623} {"train_loss": -9.901716232299805, "global_step": 104813, "epoch": 623} {"train_loss": -10.131542205810547, "global_step": 104814, "epoch": 623} {"train_loss": -9.980768203735352, "global_step": 104815, "epoch": 623} {"train_loss": -10.047840118408203, "global_step": 104816, "epoch": 623} {"train_loss": -10.14246940612793, "global_step": 104817, "epoch": 623} {"train_loss": -9.947792053222656, "global_step": 104818, "epoch": 623} {"train_loss": -9.857588768005371, "global_step": 104819, "epoch": 623} {"train_loss": -10.019725799560547, "global_step": 104820, "epoch": 623} {"train_loss": -9.959165573120117, "global_step": 104821, "epoch": 623} {"train_loss": -10.229952812194824, "global_step": 104822, "epoch": 623} {"train_loss": -9.90908432006836, "global_step": 104823, "epoch": 623} {"train_loss": -10.236539840698242, "global_step": 104824, "epoch": 623} {"train_loss": -9.721311569213867, "global_step": 104825, "epoch": 623} {"train_loss": -9.911369323730469, "global_step": 104826, "epoch": 623} {"train_loss": -10.078857421875, "global_step": 104827, "epoch": 623} {"train_loss": -9.930316925048828, "global_step": 104828, "epoch": 623} {"train_loss": -9.869348526000977, "global_step": 104829, "epoch": 623} {"train_loss": -9.89239501953125, "global_step": 104830, "epoch": 623} {"train_loss": -9.787856839952015, "global_step": 104831, "epoch": 623, "val_loss": 209310.734375} {"train_loss": -9.797691345214844, "global_step": 104832, "epoch": 624} {"train_loss": -9.899670600891113, "global_step": 104833, "epoch": 624} {"train_loss": -9.847978591918945, "global_step": 104834, "epoch": 624} {"train_loss": -10.016136169433594, "global_step": 104835, "epoch": 624} {"train_loss": -10.199637413024902, "global_step": 104836, "epoch": 624} {"train_loss": -9.763681411743164, "global_step": 104837, "epoch": 624} {"train_loss": -9.827610969543457, "global_step": 104838, "epoch": 624} {"train_loss": -9.770586013793945, "global_step": 104839, "epoch": 624} {"train_loss": -9.669462203979492, "global_step": 104840, "epoch": 624} {"train_loss": -9.909599304199219, "global_step": 104841, "epoch": 624} {"train_loss": -9.429790496826172, "global_step": 104842, "epoch": 624} {"train_loss": -9.725349426269531, "global_step": 104843, "epoch": 624} {"train_loss": -9.703299522399902, "global_step": 104844, "epoch": 624} {"train_loss": -9.759883880615234, "global_step": 104845, "epoch": 624} {"train_loss": -9.855069160461426, "global_step": 104846, "epoch": 624} {"train_loss": -9.665910720825195, "global_step": 104847, "epoch": 624} {"train_loss": -9.751092910766602, "global_step": 104848, "epoch": 624} {"train_loss": -9.853560447692871, "global_step": 104849, "epoch": 624} {"train_loss": -9.601507186889648, "global_step": 104850, "epoch": 624} {"train_loss": -9.935088157653809, "global_step": 104851, "epoch": 624} {"train_loss": -9.660961151123047, "global_step": 104852, "epoch": 624} {"train_loss": -9.848884582519531, "global_step": 104853, "epoch": 624} {"train_loss": -9.679049491882324, "global_step": 104854, "epoch": 624} {"train_loss": -9.871440887451172, "global_step": 104855, "epoch": 624} {"train_loss": -9.720624923706055, "global_step": 104856, "epoch": 624} {"train_loss": -9.971636772155762, "global_step": 104857, "epoch": 624} {"train_loss": -9.71711540222168, "global_step": 104858, "epoch": 624} {"train_loss": -9.99443244934082, "global_step": 104859, "epoch": 624} {"train_loss": -9.791413307189941, "global_step": 104860, "epoch": 624} {"train_loss": -10.02830696105957, "global_step": 104861, "epoch": 624} {"train_loss": -9.581442832946777, "global_step": 104862, "epoch": 624} {"train_loss": -9.815651893615723, "global_step": 104863, "epoch": 624} {"train_loss": -9.64303207397461, "global_step": 104864, "epoch": 624} {"train_loss": -9.566987991333008, "global_step": 104865, "epoch": 624} {"train_loss": -9.921137809753418, "global_step": 104866, "epoch": 624} {"train_loss": -9.690642356872559, "global_step": 104867, "epoch": 624} {"train_loss": -10.026039123535156, "global_step": 104868, "epoch": 624} {"train_loss": -9.601251602172852, "global_step": 104869, "epoch": 624} {"train_loss": -9.735013961791992, "global_step": 104870, "epoch": 624} {"train_loss": -9.693897247314453, "global_step": 104871, "epoch": 624} {"train_loss": -9.627473831176758, "global_step": 104872, "epoch": 624} {"train_loss": -10.005379676818848, "global_step": 104873, "epoch": 624} {"train_loss": -9.84639835357666, "global_step": 104874, "epoch": 624} {"train_loss": -9.82925796508789, "global_step": 104875, "epoch": 624} {"train_loss": -9.87397575378418, "global_step": 104876, "epoch": 624} {"train_loss": -9.74094009399414, "global_step": 104877, "epoch": 624} {"train_loss": -9.744370460510254, "global_step": 104878, "epoch": 624} {"train_loss": -9.979652404785156, "global_step": 104879, "epoch": 624} {"train_loss": -9.360055923461914, "global_step": 104880, "epoch": 624} {"train_loss": -10.02783203125, "global_step": 104881, "epoch": 624} {"train_loss": -9.92492389678955, "global_step": 104882, "epoch": 624} {"train_loss": -9.689424514770508, "global_step": 104883, "epoch": 624} {"train_loss": -9.891630172729492, "global_step": 104884, "epoch": 624} {"train_loss": -9.526554107666016, "global_step": 104885, "epoch": 624} {"train_loss": -9.500752449035645, "global_step": 104886, "epoch": 624} {"train_loss": -9.620267868041992, "global_step": 104887, "epoch": 624} {"train_loss": -9.780020713806152, "global_step": 104888, "epoch": 624} {"train_loss": -9.82394027709961, "global_step": 104889, "epoch": 624} {"train_loss": -9.852447509765625, "global_step": 104890, "epoch": 624} {"train_loss": -9.724525451660156, "global_step": 104891, "epoch": 624} {"train_loss": -9.900615692138672, "global_step": 104892, "epoch": 624} {"train_loss": -9.675003051757812, "global_step": 104893, "epoch": 624} {"train_loss": -9.892592430114746, "global_step": 104894, "epoch": 624} {"train_loss": -9.915220260620117, "global_step": 104895, "epoch": 624} {"train_loss": -9.719968795776367, "global_step": 104896, "epoch": 624} {"train_loss": -9.743934631347656, "global_step": 104897, "epoch": 624} {"train_loss": -10.15036392211914, "global_step": 104898, "epoch": 624} {"train_loss": -9.698457717895508, "global_step": 104899, "epoch": 624} {"train_loss": -9.985088348388672, "global_step": 104900, "epoch": 624} {"train_loss": -9.766950607299805, "global_step": 104901, "epoch": 624} {"train_loss": -9.407156944274902, "global_step": 104902, "epoch": 624} {"train_loss": -9.940457344055176, "global_step": 104903, "epoch": 624} {"train_loss": -9.606466293334961, "global_step": 104904, "epoch": 624} {"train_loss": -9.548523902893066, "global_step": 104905, "epoch": 624} {"train_loss": -9.815134048461914, "global_step": 104906, "epoch": 624} {"train_loss": -9.697282791137695, "global_step": 104907, "epoch": 624} {"train_loss": -9.865558624267578, "global_step": 104908, "epoch": 624} {"train_loss": -9.91542911529541, "global_step": 104909, "epoch": 624} {"train_loss": -9.621553421020508, "global_step": 104910, "epoch": 624} {"train_loss": -9.951254844665527, "global_step": 104911, "epoch": 624} {"train_loss": -9.855499267578125, "global_step": 104912, "epoch": 624} {"train_loss": -9.595466613769531, "global_step": 104913, "epoch": 624} {"train_loss": -9.898394584655762, "global_step": 104914, "epoch": 624} {"train_loss": -9.954423904418945, "global_step": 104915, "epoch": 624} {"train_loss": -9.640451431274414, "global_step": 104916, "epoch": 624} {"train_loss": -9.748215675354004, "global_step": 104917, "epoch": 624} {"train_loss": -10.075091361999512, "global_step": 104918, "epoch": 624} {"train_loss": -9.653202056884766, "global_step": 104919, "epoch": 624} {"train_loss": -9.882196426391602, "global_step": 104920, "epoch": 624} {"train_loss": -9.767684936523438, "global_step": 104921, "epoch": 624} {"train_loss": -9.80916976928711, "global_step": 104922, "epoch": 624} {"train_loss": -9.931925773620605, "global_step": 104923, "epoch": 624} {"train_loss": -9.851886749267578, "global_step": 104924, "epoch": 624} {"train_loss": -9.695648193359375, "global_step": 104925, "epoch": 624} {"train_loss": -9.836421966552734, "global_step": 104926, "epoch": 624} {"train_loss": -9.812641143798828, "global_step": 104927, "epoch": 624} {"train_loss": -9.437474250793457, "global_step": 104928, "epoch": 624} {"train_loss": -9.983135223388672, "global_step": 104929, "epoch": 624} {"train_loss": -9.600715637207031, "global_step": 104930, "epoch": 624} {"train_loss": -9.91290283203125, "global_step": 104931, "epoch": 624} {"train_loss": -9.746800422668457, "global_step": 104932, "epoch": 624} {"train_loss": -9.506925582885742, "global_step": 104933, "epoch": 624} {"train_loss": -9.870199203491211, "global_step": 104934, "epoch": 624} {"train_loss": -9.709460258483887, "global_step": 104935, "epoch": 624} {"train_loss": -9.612383842468262, "global_step": 104936, "epoch": 624} {"train_loss": -9.640002250671387, "global_step": 104937, "epoch": 624} {"train_loss": -9.545145988464355, "global_step": 104938, "epoch": 624} {"train_loss": -9.594362258911133, "global_step": 104939, "epoch": 624} {"train_loss": -9.784942626953125, "global_step": 104940, "epoch": 624} {"train_loss": -9.377609252929688, "global_step": 104941, "epoch": 624} {"train_loss": -9.505125045776367, "global_step": 104942, "epoch": 624} {"train_loss": -9.539239883422852, "global_step": 104943, "epoch": 624} {"train_loss": -9.312677383422852, "global_step": 104944, "epoch": 624} {"train_loss": -9.693448066711426, "global_step": 104945, "epoch": 624} {"train_loss": -9.642335891723633, "global_step": 104946, "epoch": 624} {"train_loss": -9.575919151306152, "global_step": 104947, "epoch": 624} {"train_loss": -9.797796249389648, "global_step": 104948, "epoch": 624} {"train_loss": -9.759419441223145, "global_step": 104949, "epoch": 624} {"train_loss": -9.852181434631348, "global_step": 104950, "epoch": 624} {"train_loss": -9.791570663452148, "global_step": 104951, "epoch": 624} {"train_loss": -9.572739601135254, "global_step": 104952, "epoch": 624} {"train_loss": -9.82079792022705, "global_step": 104953, "epoch": 624} {"train_loss": -9.805143356323242, "global_step": 104954, "epoch": 624} {"train_loss": -9.690345764160156, "global_step": 104955, "epoch": 624} {"train_loss": -9.763632774353027, "global_step": 104956, "epoch": 624} {"train_loss": -9.687326431274414, "global_step": 104957, "epoch": 624} {"train_loss": -9.614302635192871, "global_step": 104958, "epoch": 624} {"train_loss": -9.871400833129883, "global_step": 104959, "epoch": 624} {"train_loss": -9.86734390258789, "global_step": 104960, "epoch": 624} {"train_loss": -9.506507873535156, "global_step": 104961, "epoch": 624} {"train_loss": -9.961738586425781, "global_step": 104962, "epoch": 624} {"train_loss": -9.823920249938965, "global_step": 104963, "epoch": 624} {"train_loss": -9.958719253540039, "global_step": 104964, "epoch": 624} {"train_loss": -9.382732391357422, "global_step": 104965, "epoch": 624} {"train_loss": -9.988027572631836, "global_step": 104966, "epoch": 624} {"train_loss": -9.423373222351074, "global_step": 104967, "epoch": 624} {"train_loss": -9.785161018371582, "global_step": 104968, "epoch": 624} {"train_loss": -9.658100128173828, "global_step": 104969, "epoch": 624} {"train_loss": -9.857746124267578, "global_step": 104970, "epoch": 624} {"train_loss": -9.80893325805664, "global_step": 104971, "epoch": 624} {"train_loss": -10.08293342590332, "global_step": 104972, "epoch": 624} {"train_loss": -9.977476119995117, "global_step": 104973, "epoch": 624} {"train_loss": -9.92719554901123, "global_step": 104974, "epoch": 624} {"train_loss": -9.837271690368652, "global_step": 104975, "epoch": 624} {"train_loss": -9.844267845153809, "global_step": 104976, "epoch": 624} {"train_loss": -9.955657958984375, "global_step": 104977, "epoch": 624} {"train_loss": -10.029273986816406, "global_step": 104978, "epoch": 624} {"train_loss": -10.00910758972168, "global_step": 104979, "epoch": 624} {"train_loss": -9.954479217529297, "global_step": 104980, "epoch": 624} {"train_loss": -9.814533233642578, "global_step": 104981, "epoch": 624} {"train_loss": -9.980560302734375, "global_step": 104982, "epoch": 624} {"train_loss": -9.878579139709473, "global_step": 104983, "epoch": 624} {"train_loss": -10.070053100585938, "global_step": 104984, "epoch": 624} {"train_loss": -10.162346839904785, "global_step": 104985, "epoch": 624} {"train_loss": -9.984527587890625, "global_step": 104986, "epoch": 624} {"train_loss": -9.99454116821289, "global_step": 104987, "epoch": 624} {"train_loss": -10.01673412322998, "global_step": 104988, "epoch": 624} {"train_loss": -9.973443031311035, "global_step": 104989, "epoch": 624} {"train_loss": -9.698867797851562, "global_step": 104990, "epoch": 624} {"train_loss": -9.917133331298828, "global_step": 104991, "epoch": 624} {"train_loss": -9.809886932373047, "global_step": 104992, "epoch": 624} {"train_loss": -9.971819877624512, "global_step": 104993, "epoch": 624} {"train_loss": -9.519598007202148, "global_step": 104994, "epoch": 624} {"train_loss": -9.924928665161133, "global_step": 104995, "epoch": 624} {"train_loss": -9.109505653381348, "global_step": 104996, "epoch": 624} {"train_loss": -9.438844680786133, "global_step": 104997, "epoch": 624} {"train_loss": -9.40267276763916, "global_step": 104998, "epoch": 624} {"train_loss": -9.77639869848887, "global_step": 104999, "epoch": 624, "val_loss": 207221.34375} {"train_loss": -9.571944236755371, "global_step": 105000, "epoch": 625} {"train_loss": -9.93172550201416, "global_step": 105001, "epoch": 625} {"train_loss": -9.713568687438965, "global_step": 105002, "epoch": 625} {"train_loss": -9.464313507080078, "global_step": 105003, "epoch": 625} {"train_loss": -9.562047958374023, "global_step": 105004, "epoch": 625} {"train_loss": -9.763167381286621, "global_step": 105005, "epoch": 625} {"train_loss": -9.799253463745117, "global_step": 105006, "epoch": 625} {"train_loss": -9.6790771484375, "global_step": 105007, "epoch": 625} {"train_loss": -9.721968650817871, "global_step": 105008, "epoch": 625} {"train_loss": -9.699698448181152, "global_step": 105009, "epoch": 625} {"train_loss": -9.663963317871094, "global_step": 105010, "epoch": 625} {"train_loss": -9.68028450012207, "global_step": 105011, "epoch": 625} {"train_loss": -9.858478546142578, "global_step": 105012, "epoch": 625} {"train_loss": -9.833110809326172, "global_step": 105013, "epoch": 625} {"train_loss": -9.690479278564453, "global_step": 105014, "epoch": 625} {"train_loss": -9.621232032775879, "global_step": 105015, "epoch": 625} {"train_loss": -9.850506782531738, "global_step": 105016, "epoch": 625} {"train_loss": -9.599769592285156, "global_step": 105017, "epoch": 625} {"train_loss": -9.790854454040527, "global_step": 105018, "epoch": 625} {"train_loss": -9.679494857788086, "global_step": 105019, "epoch": 625} {"train_loss": -9.616937637329102, "global_step": 105020, "epoch": 625} {"train_loss": -9.671388626098633, "global_step": 105021, "epoch": 625} {"train_loss": -9.87095832824707, "global_step": 105022, "epoch": 625} {"train_loss": -9.918617248535156, "global_step": 105023, "epoch": 625} {"train_loss": -9.82400131225586, "global_step": 105024, "epoch": 625} {"train_loss": -10.092601776123047, "global_step": 105025, "epoch": 625} {"train_loss": -9.901261329650879, "global_step": 105026, "epoch": 625} {"train_loss": -9.803680419921875, "global_step": 105027, "epoch": 625} {"train_loss": -9.867511749267578, "global_step": 105028, "epoch": 625} {"train_loss": -10.132406234741211, "global_step": 105029, "epoch": 625} {"train_loss": -10.01659870147705, "global_step": 105030, "epoch": 625} {"train_loss": -9.920211791992188, "global_step": 105031, "epoch": 625} {"train_loss": -10.015626907348633, "global_step": 105032, "epoch": 625} {"train_loss": -9.808481216430664, "global_step": 105033, "epoch": 625} {"train_loss": -9.814217567443848, "global_step": 105034, "epoch": 625} {"train_loss": -9.682851791381836, "global_step": 105035, "epoch": 625} {"train_loss": -10.048044204711914, "global_step": 105036, "epoch": 625} {"train_loss": -9.116435050964355, "global_step": 105037, "epoch": 625} {"train_loss": -9.908018112182617, "global_step": 105038, "epoch": 625} {"train_loss": -9.487701416015625, "global_step": 105039, "epoch": 625} {"train_loss": -9.175045013427734, "global_step": 105040, "epoch": 625} {"train_loss": -9.776436805725098, "global_step": 105041, "epoch": 625} {"train_loss": -9.081367492675781, "global_step": 105042, "epoch": 625} {"train_loss": -9.38691520690918, "global_step": 105043, "epoch": 625} {"train_loss": -9.43030071258545, "global_step": 105044, "epoch": 625} {"train_loss": -9.627351760864258, "global_step": 105045, "epoch": 625} {"train_loss": -9.259906768798828, "global_step": 105046, "epoch": 625} {"train_loss": -9.51835823059082, "global_step": 105047, "epoch": 625} {"train_loss": -9.755229949951172, "global_step": 105048, "epoch": 625} {"train_loss": -9.607621192932129, "global_step": 105049, "epoch": 625} {"train_loss": -9.745594024658203, "global_step": 105050, "epoch": 625} {"train_loss": -9.741214752197266, "global_step": 105051, "epoch": 625} {"train_loss": -9.65235424041748, "global_step": 105052, "epoch": 625} {"train_loss": -9.792041778564453, "global_step": 105053, "epoch": 625} {"train_loss": -9.837946891784668, "global_step": 105054, "epoch": 625} {"train_loss": -9.729462623596191, "global_step": 105055, "epoch": 625} {"train_loss": -9.596929550170898, "global_step": 105056, "epoch": 625} {"train_loss": -9.724709510803223, "global_step": 105057, "epoch": 625} {"train_loss": -9.938233375549316, "global_step": 105058, "epoch": 625} {"train_loss": -9.594520568847656, "global_step": 105059, "epoch": 625} {"train_loss": -9.976211547851562, "global_step": 105060, "epoch": 625} {"train_loss": -10.064519882202148, "global_step": 105061, "epoch": 625} {"train_loss": -9.79368782043457, "global_step": 105062, "epoch": 625} {"train_loss": -9.82468318939209, "global_step": 105063, "epoch": 625} {"train_loss": -10.069642066955566, "global_step": 105064, "epoch": 625} {"train_loss": -9.984794616699219, "global_step": 105065, "epoch": 625} {"train_loss": -9.939815521240234, "global_step": 105066, "epoch": 625} {"train_loss": -9.962657928466797, "global_step": 105067, "epoch": 625} {"train_loss": -10.073015213012695, "global_step": 105068, "epoch": 625} {"train_loss": -10.066446304321289, "global_step": 105069, "epoch": 625} {"train_loss": -9.862405776977539, "global_step": 105070, "epoch": 625} {"train_loss": -9.990450859069824, "global_step": 105071, "epoch": 625} {"train_loss": -10.045855522155762, "global_step": 105072, "epoch": 625} {"train_loss": -10.095312118530273, "global_step": 105073, "epoch": 625} {"train_loss": -9.880901336669922, "global_step": 105074, "epoch": 625} {"train_loss": -9.971179962158203, "global_step": 105075, "epoch": 625} {"train_loss": -9.930599212646484, "global_step": 105076, "epoch": 625} {"train_loss": -9.891487121582031, "global_step": 105077, "epoch": 625} {"train_loss": -10.12270450592041, "global_step": 105078, "epoch": 625} {"train_loss": -9.897204399108887, "global_step": 105079, "epoch": 625} {"train_loss": -10.244306564331055, "global_step": 105080, "epoch": 625} {"train_loss": -10.21627426147461, "global_step": 105081, "epoch": 625} {"train_loss": -10.036845207214355, "global_step": 105082, "epoch": 625} {"train_loss": -9.854927062988281, "global_step": 105083, "epoch": 625} {"train_loss": -10.199857711791992, "global_step": 105084, "epoch": 625} {"train_loss": -9.878280639648438, "global_step": 105085, "epoch": 625} {"train_loss": -10.105201721191406, "global_step": 105086, "epoch": 625} {"train_loss": -9.96586799621582, "global_step": 105087, "epoch": 625} {"train_loss": -9.495811462402344, "global_step": 105088, "epoch": 625} {"train_loss": -9.687077522277832, "global_step": 105089, "epoch": 625} {"train_loss": -9.588508605957031, "global_step": 105090, "epoch": 625} {"train_loss": -9.425195693969727, "global_step": 105091, "epoch": 625} {"train_loss": -9.525557518005371, "global_step": 105092, "epoch": 625} {"train_loss": -9.107328414916992, "global_step": 105093, "epoch": 625} {"train_loss": -10.027467727661133, "global_step": 105094, "epoch": 625} {"train_loss": -8.633895874023438, "global_step": 105095, "epoch": 625} {"train_loss": -8.941490173339844, "global_step": 105096, "epoch": 625} {"train_loss": -8.980688095092773, "global_step": 105097, "epoch": 625} {"train_loss": -9.442120552062988, "global_step": 105098, "epoch": 625} {"train_loss": -9.202457427978516, "global_step": 105099, "epoch": 625} {"train_loss": -9.861244201660156, "global_step": 105100, "epoch": 625} {"train_loss": -9.242770195007324, "global_step": 105101, "epoch": 625} {"train_loss": -9.359395027160645, "global_step": 105102, "epoch": 625} {"train_loss": -9.61860466003418, "global_step": 105103, "epoch": 625} {"train_loss": -9.6383056640625, "global_step": 105104, "epoch": 625} {"train_loss": -9.57994270324707, "global_step": 105105, "epoch": 625} {"train_loss": -9.764838218688965, "global_step": 105106, "epoch": 625} {"train_loss": -9.504980087280273, "global_step": 105107, "epoch": 625} {"train_loss": -9.490053176879883, "global_step": 105108, "epoch": 625} {"train_loss": -9.694795608520508, "global_step": 105109, "epoch": 625} {"train_loss": -9.367044448852539, "global_step": 105110, "epoch": 625} {"train_loss": -9.661455154418945, "global_step": 105111, "epoch": 625} {"train_loss": -9.531848907470703, "global_step": 105112, "epoch": 625} {"train_loss": -9.547768592834473, "global_step": 105113, "epoch": 625} {"train_loss": -9.77127742767334, "global_step": 105114, "epoch": 625} {"train_loss": -9.663082122802734, "global_step": 105115, "epoch": 625} {"train_loss": -9.69942855834961, "global_step": 105116, "epoch": 625} {"train_loss": -9.75774097442627, "global_step": 105117, "epoch": 625} {"train_loss": -9.426900863647461, "global_step": 105118, "epoch": 625} {"train_loss": -9.74835205078125, "global_step": 105119, "epoch": 625} {"train_loss": -9.521602630615234, "global_step": 105120, "epoch": 625} {"train_loss": -9.820049285888672, "global_step": 105121, "epoch": 625} {"train_loss": -9.904561996459961, "global_step": 105122, "epoch": 625} {"train_loss": -9.862131118774414, "global_step": 105123, "epoch": 625} {"train_loss": -9.766393661499023, "global_step": 105124, "epoch": 625} {"train_loss": -9.797685623168945, "global_step": 105125, "epoch": 625} {"train_loss": -9.887323379516602, "global_step": 105126, "epoch": 625} {"train_loss": -9.34875202178955, "global_step": 105127, "epoch": 625} {"train_loss": -9.800394058227539, "global_step": 105128, "epoch": 625} {"train_loss": -9.867490768432617, "global_step": 105129, "epoch": 625} {"train_loss": -9.858108520507812, "global_step": 105130, "epoch": 625} {"train_loss": -9.87982177734375, "global_step": 105131, "epoch": 625} {"train_loss": -9.864884376525879, "global_step": 105132, "epoch": 625} {"train_loss": -9.898300170898438, "global_step": 105133, "epoch": 625} {"train_loss": -9.94721794128418, "global_step": 105134, "epoch": 625} {"train_loss": -9.668567657470703, "global_step": 105135, "epoch": 625} {"train_loss": -9.912786483764648, "global_step": 105136, "epoch": 625} {"train_loss": -9.859426498413086, "global_step": 105137, "epoch": 625} {"train_loss": -9.932538986206055, "global_step": 105138, "epoch": 625} {"train_loss": -9.733423233032227, "global_step": 105139, "epoch": 625} {"train_loss": -9.961153030395508, "global_step": 105140, "epoch": 625} {"train_loss": -10.071617126464844, "global_step": 105141, "epoch": 625} {"train_loss": -10.008593559265137, "global_step": 105142, "epoch": 625} {"train_loss": -9.976240158081055, "global_step": 105143, "epoch": 625} {"train_loss": -9.884973526000977, "global_step": 105144, "epoch": 625} {"train_loss": -9.934015274047852, "global_step": 105145, "epoch": 625} {"train_loss": -9.91136360168457, "global_step": 105146, "epoch": 625} {"train_loss": -9.759529113769531, "global_step": 105147, "epoch": 625} {"train_loss": -10.086997985839844, "global_step": 105148, "epoch": 625} {"train_loss": -10.026514053344727, "global_step": 105149, "epoch": 625} {"train_loss": -9.840801239013672, "global_step": 105150, "epoch": 625} {"train_loss": -10.028916358947754, "global_step": 105151, "epoch": 625} {"train_loss": -9.927505493164062, "global_step": 105152, "epoch": 625} {"train_loss": -9.859075546264648, "global_step": 105153, "epoch": 625} {"train_loss": -9.90182113647461, "global_step": 105154, "epoch": 625} {"train_loss": -9.718536376953125, "global_step": 105155, "epoch": 625} {"train_loss": -9.88382625579834, "global_step": 105156, "epoch": 625} {"train_loss": -9.643915176391602, "global_step": 105157, "epoch": 625} {"train_loss": -9.974483489990234, "global_step": 105158, "epoch": 625} {"train_loss": -9.341976165771484, "global_step": 105159, "epoch": 625} {"train_loss": -9.63876724243164, "global_step": 105160, "epoch": 625} {"train_loss": -9.972234725952148, "global_step": 105161, "epoch": 625} {"train_loss": -9.567584991455078, "global_step": 105162, "epoch": 625} {"train_loss": -9.913162231445312, "global_step": 105163, "epoch": 625} {"train_loss": -9.777091979980469, "global_step": 105164, "epoch": 625} {"train_loss": -9.977575302124023, "global_step": 105165, "epoch": 625} {"train_loss": -9.793959617614746, "global_step": 105166, "epoch": 625} {"train_loss": -9.752645089512779, "global_step": 105167, "epoch": 625, "val_loss": 205872.71875, "train_action_mse_error": 2.543576240539551} {"train_loss": -9.969959259033203, "global_step": 105168, "epoch": 626} {"train_loss": -9.46644401550293, "global_step": 105169, "epoch": 626} {"train_loss": -9.879618644714355, "global_step": 105170, "epoch": 626} {"train_loss": -9.55058765411377, "global_step": 105171, "epoch": 626} {"train_loss": -10.011007308959961, "global_step": 105172, "epoch": 626} {"train_loss": -9.550331115722656, "global_step": 105173, "epoch": 626} {"train_loss": -9.742324829101562, "global_step": 105174, "epoch": 626} {"train_loss": -9.877201080322266, "global_step": 105175, "epoch": 626} {"train_loss": -9.769343376159668, "global_step": 105176, "epoch": 626} {"train_loss": -9.698704719543457, "global_step": 105177, "epoch": 626} {"train_loss": -9.923685073852539, "global_step": 105178, "epoch": 626} {"train_loss": -9.807741165161133, "global_step": 105179, "epoch": 626} {"train_loss": -9.887140274047852, "global_step": 105180, "epoch": 626} {"train_loss": -9.673713684082031, "global_step": 105181, "epoch": 626} {"train_loss": -9.887893676757812, "global_step": 105182, "epoch": 626} {"train_loss": -9.846772193908691, "global_step": 105183, "epoch": 626} {"train_loss": -9.684085845947266, "global_step": 105184, "epoch": 626} {"train_loss": -9.846799850463867, "global_step": 105185, "epoch": 626} {"train_loss": -9.535377502441406, "global_step": 105186, "epoch": 626} {"train_loss": -9.832489013671875, "global_step": 105187, "epoch": 626} {"train_loss": -10.074604034423828, "global_step": 105188, "epoch": 626} {"train_loss": -9.689014434814453, "global_step": 105189, "epoch": 626} {"train_loss": -9.940101623535156, "global_step": 105190, "epoch": 626} {"train_loss": -9.844837188720703, "global_step": 105191, "epoch": 626} {"train_loss": -9.56039047241211, "global_step": 105192, "epoch": 626} {"train_loss": -9.85818862915039, "global_step": 105193, "epoch": 626} {"train_loss": -10.013666152954102, "global_step": 105194, "epoch": 626} {"train_loss": -9.917702674865723, "global_step": 105195, "epoch": 626} {"train_loss": -9.877756118774414, "global_step": 105196, "epoch": 626} {"train_loss": -9.895614624023438, "global_step": 105197, "epoch": 626} {"train_loss": -9.76563835144043, "global_step": 105198, "epoch": 626} {"train_loss": -10.122671127319336, "global_step": 105199, "epoch": 626} {"train_loss": -9.97366714477539, "global_step": 105200, "epoch": 626} {"train_loss": -9.77196979522705, "global_step": 105201, "epoch": 626} {"train_loss": -9.98508071899414, "global_step": 105202, "epoch": 626} {"train_loss": -9.909086227416992, "global_step": 105203, "epoch": 626} {"train_loss": -9.7184476852417, "global_step": 105204, "epoch": 626} {"train_loss": -10.016155242919922, "global_step": 105205, "epoch": 626} {"train_loss": -9.666102409362793, "global_step": 105206, "epoch": 626} {"train_loss": -9.824167251586914, "global_step": 105207, "epoch": 626} {"train_loss": -9.707998275756836, "global_step": 105208, "epoch": 626} {"train_loss": -9.90411376953125, "global_step": 105209, "epoch": 626} {"train_loss": -9.659399032592773, "global_step": 105210, "epoch": 626} {"train_loss": -9.740274429321289, "global_step": 105211, "epoch": 626} {"train_loss": -9.768722534179688, "global_step": 105212, "epoch": 626} {"train_loss": -10.006176948547363, "global_step": 105213, "epoch": 626} {"train_loss": -9.517120361328125, "global_step": 105214, "epoch": 626} {"train_loss": -9.947138786315918, "global_step": 105215, "epoch": 626} {"train_loss": -9.900814056396484, "global_step": 105216, "epoch": 626} {"train_loss": -9.36326789855957, "global_step": 105217, "epoch": 626} {"train_loss": -9.748703002929688, "global_step": 105218, "epoch": 626} {"train_loss": -9.702746391296387, "global_step": 105219, "epoch": 626} {"train_loss": -9.303915977478027, "global_step": 105220, "epoch": 626} {"train_loss": -9.77445125579834, "global_step": 105221, "epoch": 626} {"train_loss": -9.382292747497559, "global_step": 105222, "epoch": 626} {"train_loss": -9.272798538208008, "global_step": 105223, "epoch": 626} {"train_loss": -9.719446182250977, "global_step": 105224, "epoch": 626} {"train_loss": -9.462427139282227, "global_step": 105225, "epoch": 626} {"train_loss": -9.602898597717285, "global_step": 105226, "epoch": 626} {"train_loss": -9.952699661254883, "global_step": 105227, "epoch": 626} {"train_loss": -9.820877075195312, "global_step": 105228, "epoch": 626} {"train_loss": -9.89738655090332, "global_step": 105229, "epoch": 626} {"train_loss": -9.822236061096191, "global_step": 105230, "epoch": 626} {"train_loss": -9.325313568115234, "global_step": 105231, "epoch": 626} {"train_loss": -9.803340911865234, "global_step": 105232, "epoch": 626} {"train_loss": -9.579692840576172, "global_step": 105233, "epoch": 626} {"train_loss": -9.759557723999023, "global_step": 105234, "epoch": 626} {"train_loss": -9.959285736083984, "global_step": 105235, "epoch": 626} {"train_loss": -9.817537307739258, "global_step": 105236, "epoch": 626} {"train_loss": -9.84492301940918, "global_step": 105237, "epoch": 626} {"train_loss": -9.777944564819336, "global_step": 105238, "epoch": 626} {"train_loss": -9.663028717041016, "global_step": 105239, "epoch": 626} {"train_loss": -9.514762878417969, "global_step": 105240, "epoch": 626} {"train_loss": -9.729934692382812, "global_step": 105241, "epoch": 626} {"train_loss": -9.556252479553223, "global_step": 105242, "epoch": 626} {"train_loss": -9.844499588012695, "global_step": 105243, "epoch": 626} {"train_loss": -9.713085174560547, "global_step": 105244, "epoch": 626} {"train_loss": -9.855499267578125, "global_step": 105245, "epoch": 626} {"train_loss": -9.89792251586914, "global_step": 105246, "epoch": 626} {"train_loss": -9.518653869628906, "global_step": 105247, "epoch": 626} {"train_loss": -9.56060791015625, "global_step": 105248, "epoch": 626} {"train_loss": -9.416658401489258, "global_step": 105249, "epoch": 626} {"train_loss": -9.641385078430176, "global_step": 105250, "epoch": 626} {"train_loss": -9.38104248046875, "global_step": 105251, "epoch": 626} {"train_loss": -9.60820198059082, "global_step": 105252, "epoch": 626} {"train_loss": -9.098366737365723, "global_step": 105253, "epoch": 626} {"train_loss": -9.716577529907227, "global_step": 105254, "epoch": 626} {"train_loss": -9.284343719482422, "global_step": 105255, "epoch": 626} {"train_loss": -9.953397750854492, "global_step": 105256, "epoch": 626} {"train_loss": -9.578839302062988, "global_step": 105257, "epoch": 626} {"train_loss": -9.706700325012207, "global_step": 105258, "epoch": 626} {"train_loss": -9.816365242004395, "global_step": 105259, "epoch": 626} {"train_loss": -9.500044822692871, "global_step": 105260, "epoch": 626} {"train_loss": -9.808116912841797, "global_step": 105261, "epoch": 626} {"train_loss": -9.655428886413574, "global_step": 105262, "epoch": 626} {"train_loss": -9.891042709350586, "global_step": 105263, "epoch": 626} {"train_loss": -9.925914764404297, "global_step": 105264, "epoch": 626} {"train_loss": -9.954170227050781, "global_step": 105265, "epoch": 626} {"train_loss": -9.901993751525879, "global_step": 105266, "epoch": 626} {"train_loss": -9.639217376708984, "global_step": 105267, "epoch": 626} {"train_loss": -9.625860214233398, "global_step": 105268, "epoch": 626} {"train_loss": -9.609121322631836, "global_step": 105269, "epoch": 626} {"train_loss": -10.10319995880127, "global_step": 105270, "epoch": 626} {"train_loss": -9.939781188964844, "global_step": 105271, "epoch": 626} {"train_loss": -9.765625, "global_step": 105272, "epoch": 626} {"train_loss": -9.869373321533203, "global_step": 105273, "epoch": 626} {"train_loss": -10.007692337036133, "global_step": 105274, "epoch": 626} {"train_loss": -10.076476097106934, "global_step": 105275, "epoch": 626} {"train_loss": -10.126585006713867, "global_step": 105276, "epoch": 626} {"train_loss": -10.158882141113281, "global_step": 105277, "epoch": 626} {"train_loss": -10.025472640991211, "global_step": 105278, "epoch": 626} {"train_loss": -10.12200927734375, "global_step": 105279, "epoch": 626} {"train_loss": -10.027430534362793, "global_step": 105280, "epoch": 626} {"train_loss": -10.113895416259766, "global_step": 105281, "epoch": 626} {"train_loss": -9.9776029586792, "global_step": 105282, "epoch": 626} {"train_loss": -9.981147766113281, "global_step": 105283, "epoch": 626} {"train_loss": -10.014081001281738, "global_step": 105284, "epoch": 626} {"train_loss": -10.042272567749023, "global_step": 105285, "epoch": 626} {"train_loss": -10.161308288574219, "global_step": 105286, "epoch": 626} {"train_loss": -9.881893157958984, "global_step": 105287, "epoch": 626} {"train_loss": -9.754226684570312, "global_step": 105288, "epoch": 626} {"train_loss": -9.907243728637695, "global_step": 105289, "epoch": 626} {"train_loss": -9.716650009155273, "global_step": 105290, "epoch": 626} {"train_loss": -10.07913875579834, "global_step": 105291, "epoch": 626} {"train_loss": -10.16081428527832, "global_step": 105292, "epoch": 626} {"train_loss": -9.900945663452148, "global_step": 105293, "epoch": 626} {"train_loss": -10.320395469665527, "global_step": 105294, "epoch": 626} {"train_loss": -10.035423278808594, "global_step": 105295, "epoch": 626} {"train_loss": -9.806700706481934, "global_step": 105296, "epoch": 626} {"train_loss": -10.20057201385498, "global_step": 105297, "epoch": 626} {"train_loss": -10.157349586486816, "global_step": 105298, "epoch": 626} {"train_loss": -10.054588317871094, "global_step": 105299, "epoch": 626} {"train_loss": -10.045791625976562, "global_step": 105300, "epoch": 626} {"train_loss": -10.094121932983398, "global_step": 105301, "epoch": 626} {"train_loss": -10.015937805175781, "global_step": 105302, "epoch": 626} {"train_loss": -10.300185203552246, "global_step": 105303, "epoch": 626} {"train_loss": -9.870792388916016, "global_step": 105304, "epoch": 626} {"train_loss": -10.065262794494629, "global_step": 105305, "epoch": 626} {"train_loss": -9.87454605102539, "global_step": 105306, "epoch": 626} {"train_loss": -10.063825607299805, "global_step": 105307, "epoch": 626} {"train_loss": -10.130256652832031, "global_step": 105308, "epoch": 626} {"train_loss": -10.002300262451172, "global_step": 105309, "epoch": 626} {"train_loss": -9.663431167602539, "global_step": 105310, "epoch": 626} {"train_loss": -10.04380989074707, "global_step": 105311, "epoch": 626} {"train_loss": -10.227558135986328, "global_step": 105312, "epoch": 626} {"train_loss": -10.105443954467773, "global_step": 105313, "epoch": 626} {"train_loss": -10.113054275512695, "global_step": 105314, "epoch": 626} {"train_loss": -10.123998641967773, "global_step": 105315, "epoch": 626} {"train_loss": -10.045927047729492, "global_step": 105316, "epoch": 626} {"train_loss": -9.99649715423584, "global_step": 105317, "epoch": 626} {"train_loss": -9.720806121826172, "global_step": 105318, "epoch": 626} {"train_loss": -10.065220832824707, "global_step": 105319, "epoch": 626} {"train_loss": -9.421525955200195, "global_step": 105320, "epoch": 626} {"train_loss": -9.470390319824219, "global_step": 105321, "epoch": 626} {"train_loss": -9.9927978515625, "global_step": 105322, "epoch": 626} {"train_loss": -8.972142219543457, "global_step": 105323, "epoch": 626} {"train_loss": -9.722216606140137, "global_step": 105324, "epoch": 626} {"train_loss": -9.600528717041016, "global_step": 105325, "epoch": 626} {"train_loss": -8.940141677856445, "global_step": 105326, "epoch": 626} {"train_loss": -10.06348705291748, "global_step": 105327, "epoch": 626} {"train_loss": -9.734716415405273, "global_step": 105328, "epoch": 626} {"train_loss": -9.437795639038086, "global_step": 105329, "epoch": 626} {"train_loss": -9.745527267456055, "global_step": 105330, "epoch": 626} {"train_loss": -9.586280822753906, "global_step": 105331, "epoch": 626} {"train_loss": -9.437360763549805, "global_step": 105332, "epoch": 626} {"train_loss": -9.773860931396484, "global_step": 105333, "epoch": 626} {"train_loss": -9.501677513122559, "global_step": 105334, "epoch": 626} {"train_loss": -9.805615743001303, "global_step": 105335, "epoch": 626, "val_loss": 208850.234375} {"train_loss": -9.678122520446777, "global_step": 105336, "epoch": 627} {"train_loss": -9.431285858154297, "global_step": 105337, "epoch": 627} {"train_loss": -9.594855308532715, "global_step": 105338, "epoch": 627} {"train_loss": -9.760160446166992, "global_step": 105339, "epoch": 627} {"train_loss": -9.337069511413574, "global_step": 105340, "epoch": 627} {"train_loss": -9.882237434387207, "global_step": 105341, "epoch": 627} {"train_loss": -9.304983139038086, "global_step": 105342, "epoch": 627} {"train_loss": -9.19178581237793, "global_step": 105343, "epoch": 627} {"train_loss": -9.680512428283691, "global_step": 105344, "epoch": 627} {"train_loss": -9.571891784667969, "global_step": 105345, "epoch": 627} {"train_loss": -9.677729606628418, "global_step": 105346, "epoch": 627} {"train_loss": -9.62734317779541, "global_step": 105347, "epoch": 627} {"train_loss": -9.693032264709473, "global_step": 105348, "epoch": 627} {"train_loss": -9.493768692016602, "global_step": 105349, "epoch": 627} {"train_loss": -9.898931503295898, "global_step": 105350, "epoch": 627} {"train_loss": -9.841644287109375, "global_step": 105351, "epoch": 627} {"train_loss": -9.790331840515137, "global_step": 105352, "epoch": 627} {"train_loss": -9.880412101745605, "global_step": 105353, "epoch": 627} {"train_loss": -10.016473770141602, "global_step": 105354, "epoch": 627} {"train_loss": -9.832534790039062, "global_step": 105355, "epoch": 627} {"train_loss": -9.769651412963867, "global_step": 105356, "epoch": 627} {"train_loss": -9.506399154663086, "global_step": 105357, "epoch": 627} {"train_loss": -9.799372673034668, "global_step": 105358, "epoch": 627} {"train_loss": -9.742691993713379, "global_step": 105359, "epoch": 627} {"train_loss": -9.839944839477539, "global_step": 105360, "epoch": 627} {"train_loss": -9.980759620666504, "global_step": 105361, "epoch": 627} {"train_loss": -9.498820304870605, "global_step": 105362, "epoch": 627} {"train_loss": -10.072711944580078, "global_step": 105363, "epoch": 627} {"train_loss": -9.569276809692383, "global_step": 105364, "epoch": 627} {"train_loss": -9.760238647460938, "global_step": 105365, "epoch": 627} {"train_loss": -9.67249870300293, "global_step": 105366, "epoch": 627} {"train_loss": -9.990785598754883, "global_step": 105367, "epoch": 627} {"train_loss": -9.540281295776367, "global_step": 105368, "epoch": 627} {"train_loss": -9.884048461914062, "global_step": 105369, "epoch": 627} {"train_loss": -9.732172966003418, "global_step": 105370, "epoch": 627} {"train_loss": -9.670766830444336, "global_step": 105371, "epoch": 627} {"train_loss": -9.58713436126709, "global_step": 105372, "epoch": 627} {"train_loss": -9.620645523071289, "global_step": 105373, "epoch": 627} {"train_loss": -9.527872085571289, "global_step": 105374, "epoch": 627} {"train_loss": -9.78554916381836, "global_step": 105375, "epoch": 627} {"train_loss": -9.711322784423828, "global_step": 105376, "epoch": 627} {"train_loss": -9.899307250976562, "global_step": 105377, "epoch": 627} {"train_loss": -9.80477237701416, "global_step": 105378, "epoch": 627} {"train_loss": -9.691843032836914, "global_step": 105379, "epoch": 627} {"train_loss": -9.844611167907715, "global_step": 105380, "epoch": 627} {"train_loss": -9.706534385681152, "global_step": 105381, "epoch": 627} {"train_loss": -9.854114532470703, "global_step": 105382, "epoch": 627} {"train_loss": -9.50582504272461, "global_step": 105383, "epoch": 627} {"train_loss": -9.787637710571289, "global_step": 105384, "epoch": 627} {"train_loss": -9.553474426269531, "global_step": 105385, "epoch": 627} {"train_loss": -9.410276412963867, "global_step": 105386, "epoch": 627} {"train_loss": -9.529410362243652, "global_step": 105387, "epoch": 627} {"train_loss": -9.939958572387695, "global_step": 105388, "epoch": 627} {"train_loss": -9.885625839233398, "global_step": 105389, "epoch": 627} {"train_loss": -9.579108238220215, "global_step": 105390, "epoch": 627} {"train_loss": -9.691863059997559, "global_step": 105391, "epoch": 627} {"train_loss": -9.911558151245117, "global_step": 105392, "epoch": 627} {"train_loss": -9.8569917678833, "global_step": 105393, "epoch": 627} {"train_loss": -9.87864875793457, "global_step": 105394, "epoch": 627} {"train_loss": -9.5936918258667, "global_step": 105395, "epoch": 627} {"train_loss": -9.850606918334961, "global_step": 105396, "epoch": 627} {"train_loss": -9.916545867919922, "global_step": 105397, "epoch": 627} {"train_loss": -9.804597854614258, "global_step": 105398, "epoch": 627} {"train_loss": -9.770312309265137, "global_step": 105399, "epoch": 627} {"train_loss": -9.950566291809082, "global_step": 105400, "epoch": 627} {"train_loss": -9.59516716003418, "global_step": 105401, "epoch": 627} {"train_loss": -9.79922103881836, "global_step": 105402, "epoch": 627} {"train_loss": -9.827248573303223, "global_step": 105403, "epoch": 627} {"train_loss": -9.95823860168457, "global_step": 105404, "epoch": 627} {"train_loss": -9.725969314575195, "global_step": 105405, "epoch": 627} {"train_loss": -9.549385070800781, "global_step": 105406, "epoch": 627} {"train_loss": -9.768390655517578, "global_step": 105407, "epoch": 627} {"train_loss": -9.557985305786133, "global_step": 105408, "epoch": 627} {"train_loss": -9.696325302124023, "global_step": 105409, "epoch": 627} {"train_loss": -9.985860824584961, "global_step": 105410, "epoch": 627} {"train_loss": -9.504508018493652, "global_step": 105411, "epoch": 627} {"train_loss": -9.725410461425781, "global_step": 105412, "epoch": 627} {"train_loss": -9.416658401489258, "global_step": 105413, "epoch": 627} {"train_loss": -9.932807922363281, "global_step": 105414, "epoch": 627} {"train_loss": -9.893256187438965, "global_step": 105415, "epoch": 627} {"train_loss": -9.80447006225586, "global_step": 105416, "epoch": 627} {"train_loss": -10.01665210723877, "global_step": 105417, "epoch": 627} {"train_loss": -9.738750457763672, "global_step": 105418, "epoch": 627} {"train_loss": -9.643165588378906, "global_step": 105419, "epoch": 627} {"train_loss": -9.643156051635742, "global_step": 105420, "epoch": 627} {"train_loss": -9.629273414611816, "global_step": 105421, "epoch": 627} {"train_loss": -9.493138313293457, "global_step": 105422, "epoch": 627} {"train_loss": -9.91336727142334, "global_step": 105423, "epoch": 627} {"train_loss": -9.774436950683594, "global_step": 105424, "epoch": 627} {"train_loss": -10.00715446472168, "global_step": 105425, "epoch": 627} {"train_loss": -9.539935111999512, "global_step": 105426, "epoch": 627} {"train_loss": -10.069571495056152, "global_step": 105427, "epoch": 627} {"train_loss": -9.75245189666748, "global_step": 105428, "epoch": 627} {"train_loss": -9.90336799621582, "global_step": 105429, "epoch": 627} {"train_loss": -9.598438262939453, "global_step": 105430, "epoch": 627} {"train_loss": -9.773462295532227, "global_step": 105431, "epoch": 627} {"train_loss": -9.7767333984375, "global_step": 105432, "epoch": 627} {"train_loss": -10.051673889160156, "global_step": 105433, "epoch": 627} {"train_loss": -9.861356735229492, "global_step": 105434, "epoch": 627} {"train_loss": -9.96426010131836, "global_step": 105435, "epoch": 627} {"train_loss": -9.725071907043457, "global_step": 105436, "epoch": 627} {"train_loss": -9.951492309570312, "global_step": 105437, "epoch": 627} {"train_loss": -9.936664581298828, "global_step": 105438, "epoch": 627} {"train_loss": -9.839601516723633, "global_step": 105439, "epoch": 627} {"train_loss": -9.951244354248047, "global_step": 105440, "epoch": 627} {"train_loss": -9.923744201660156, "global_step": 105441, "epoch": 627} {"train_loss": -10.000431060791016, "global_step": 105442, "epoch": 627} {"train_loss": -9.718050956726074, "global_step": 105443, "epoch": 627} {"train_loss": -9.946349143981934, "global_step": 105444, "epoch": 627} {"train_loss": -9.788339614868164, "global_step": 105445, "epoch": 627} {"train_loss": -9.49128532409668, "global_step": 105446, "epoch": 627} {"train_loss": -9.757140159606934, "global_step": 105447, "epoch": 627} {"train_loss": -10.11191177368164, "global_step": 105448, "epoch": 627} {"train_loss": -9.371797561645508, "global_step": 105449, "epoch": 627} {"train_loss": -9.727054595947266, "global_step": 105450, "epoch": 627} {"train_loss": -9.792261123657227, "global_step": 105451, "epoch": 627} {"train_loss": -9.73993968963623, "global_step": 105452, "epoch": 627} {"train_loss": -9.725982666015625, "global_step": 105453, "epoch": 627} {"train_loss": -9.56215763092041, "global_step": 105454, "epoch": 627} {"train_loss": -9.964289665222168, "global_step": 105455, "epoch": 627} {"train_loss": -9.570695877075195, "global_step": 105456, "epoch": 627} {"train_loss": -9.411565780639648, "global_step": 105457, "epoch": 627} {"train_loss": -10.131876945495605, "global_step": 105458, "epoch": 627} {"train_loss": -9.683109283447266, "global_step": 105459, "epoch": 627} {"train_loss": -9.850968360900879, "global_step": 105460, "epoch": 627} {"train_loss": -9.922595024108887, "global_step": 105461, "epoch": 627} {"train_loss": -9.701166152954102, "global_step": 105462, "epoch": 627} {"train_loss": -9.977860450744629, "global_step": 105463, "epoch": 627} {"train_loss": -9.573692321777344, "global_step": 105464, "epoch": 627} {"train_loss": -9.932430267333984, "global_step": 105465, "epoch": 627} {"train_loss": -10.081417083740234, "global_step": 105466, "epoch": 627} {"train_loss": -9.779441833496094, "global_step": 105467, "epoch": 627} {"train_loss": -9.912822723388672, "global_step": 105468, "epoch": 627} {"train_loss": -9.938155174255371, "global_step": 105469, "epoch": 627} {"train_loss": -9.793952941894531, "global_step": 105470, "epoch": 627} {"train_loss": -9.984370231628418, "global_step": 105471, "epoch": 627} {"train_loss": -10.03615951538086, "global_step": 105472, "epoch": 627} {"train_loss": -9.709391593933105, "global_step": 105473, "epoch": 627} {"train_loss": -9.886622428894043, "global_step": 105474, "epoch": 627} {"train_loss": -9.791460037231445, "global_step": 105475, "epoch": 627} {"train_loss": -10.011978149414062, "global_step": 105476, "epoch": 627} {"train_loss": -9.651555061340332, "global_step": 105477, "epoch": 627} {"train_loss": -9.987354278564453, "global_step": 105478, "epoch": 627} {"train_loss": -9.585329055786133, "global_step": 105479, "epoch": 627} {"train_loss": -9.92704963684082, "global_step": 105480, "epoch": 627} {"train_loss": -9.892755508422852, "global_step": 105481, "epoch": 627} {"train_loss": -9.551429748535156, "global_step": 105482, "epoch": 627} {"train_loss": -9.959278106689453, "global_step": 105483, "epoch": 627} {"train_loss": -10.039822578430176, "global_step": 105484, "epoch": 627} {"train_loss": -9.463895797729492, "global_step": 105485, "epoch": 627} {"train_loss": -9.968425750732422, "global_step": 105486, "epoch": 627} {"train_loss": -9.917671203613281, "global_step": 105487, "epoch": 627} {"train_loss": -9.548727035522461, "global_step": 105488, "epoch": 627} {"train_loss": -9.736211776733398, "global_step": 105489, "epoch": 627} {"train_loss": -9.559646606445312, "global_step": 105490, "epoch": 627} {"train_loss": -9.91904354095459, "global_step": 105491, "epoch": 627} {"train_loss": -9.808283805847168, "global_step": 105492, "epoch": 627} {"train_loss": -9.74630355834961, "global_step": 105493, "epoch": 627} {"train_loss": -9.958054542541504, "global_step": 105494, "epoch": 627} {"train_loss": -10.004799842834473, "global_step": 105495, "epoch": 627} {"train_loss": -9.880285263061523, "global_step": 105496, "epoch": 627} {"train_loss": -9.823665618896484, "global_step": 105497, "epoch": 627} {"train_loss": -9.947324752807617, "global_step": 105498, "epoch": 627} {"train_loss": -9.883575439453125, "global_step": 105499, "epoch": 627} {"train_loss": -9.761064529418945, "global_step": 105500, "epoch": 627} {"train_loss": -9.617392539978027, "global_step": 105501, "epoch": 627} {"train_loss": -9.825491905212402, "global_step": 105502, "epoch": 627} {"train_loss": -9.766544886997767, "global_step": 105503, "epoch": 627, "val_loss": 207284.0625} {"train_loss": -9.810752868652344, "global_step": 105504, "epoch": 628} {"train_loss": -9.662933349609375, "global_step": 105505, "epoch": 628} {"train_loss": -9.794572830200195, "global_step": 105506, "epoch": 628} {"train_loss": -9.822552680969238, "global_step": 105507, "epoch": 628} {"train_loss": -9.663063049316406, "global_step": 105508, "epoch": 628} {"train_loss": -9.639178276062012, "global_step": 105509, "epoch": 628} {"train_loss": -9.580384254455566, "global_step": 105510, "epoch": 628} {"train_loss": -9.69014835357666, "global_step": 105511, "epoch": 628} {"train_loss": -9.494080543518066, "global_step": 105512, "epoch": 628} {"train_loss": -9.765933990478516, "global_step": 105513, "epoch": 628} {"train_loss": -9.757675170898438, "global_step": 105514, "epoch": 628} {"train_loss": -9.669203758239746, "global_step": 105515, "epoch": 628} {"train_loss": -9.669637680053711, "global_step": 105516, "epoch": 628} {"train_loss": -9.451332092285156, "global_step": 105517, "epoch": 628} {"train_loss": -9.801631927490234, "global_step": 105518, "epoch": 628} {"train_loss": -9.78482723236084, "global_step": 105519, "epoch": 628} {"train_loss": -9.80408763885498, "global_step": 105520, "epoch": 628} {"train_loss": -9.6227388381958, "global_step": 105521, "epoch": 628} {"train_loss": -9.698545455932617, "global_step": 105522, "epoch": 628} {"train_loss": -9.762584686279297, "global_step": 105523, "epoch": 628} {"train_loss": -9.709783554077148, "global_step": 105524, "epoch": 628} {"train_loss": -10.086549758911133, "global_step": 105525, "epoch": 628} {"train_loss": -9.814764976501465, "global_step": 105526, "epoch": 628} {"train_loss": -10.142364501953125, "global_step": 105527, "epoch": 628} {"train_loss": -9.868865966796875, "global_step": 105528, "epoch": 628} {"train_loss": -10.067354202270508, "global_step": 105529, "epoch": 628} {"train_loss": -9.880672454833984, "global_step": 105530, "epoch": 628} {"train_loss": -10.105278968811035, "global_step": 105531, "epoch": 628} {"train_loss": -9.939550399780273, "global_step": 105532, "epoch": 628} {"train_loss": -9.853790283203125, "global_step": 105533, "epoch": 628} {"train_loss": -9.837279319763184, "global_step": 105534, "epoch": 628} {"train_loss": -9.597942352294922, "global_step": 105535, "epoch": 628} {"train_loss": -9.728521347045898, "global_step": 105536, "epoch": 628} {"train_loss": -9.717049598693848, "global_step": 105537, "epoch": 628} {"train_loss": -9.921812057495117, "global_step": 105538, "epoch": 628} {"train_loss": -9.882999420166016, "global_step": 105539, "epoch": 628} {"train_loss": -9.842482566833496, "global_step": 105540, "epoch": 628} {"train_loss": -9.701643943786621, "global_step": 105541, "epoch": 628} {"train_loss": -10.162290573120117, "global_step": 105542, "epoch": 628} {"train_loss": -9.642147064208984, "global_step": 105543, "epoch": 628} {"train_loss": -9.988692283630371, "global_step": 105544, "epoch": 628} {"train_loss": -9.862457275390625, "global_step": 105545, "epoch": 628} {"train_loss": -10.124876022338867, "global_step": 105546, "epoch": 628} {"train_loss": -9.827198028564453, "global_step": 105547, "epoch": 628} {"train_loss": -10.059008598327637, "global_step": 105548, "epoch": 628} {"train_loss": -10.039377212524414, "global_step": 105549, "epoch": 628} {"train_loss": -9.706904411315918, "global_step": 105550, "epoch": 628} {"train_loss": -10.05359172821045, "global_step": 105551, "epoch": 628} {"train_loss": -9.65835952758789, "global_step": 105552, "epoch": 628} {"train_loss": -9.946233749389648, "global_step": 105553, "epoch": 628} {"train_loss": -9.835205078125, "global_step": 105554, "epoch": 628} {"train_loss": -9.4856538772583, "global_step": 105555, "epoch": 628} {"train_loss": -10.023326873779297, "global_step": 105556, "epoch": 628} {"train_loss": -9.814751625061035, "global_step": 105557, "epoch": 628} {"train_loss": -9.71387004852295, "global_step": 105558, "epoch": 628} {"train_loss": -9.616531372070312, "global_step": 105559, "epoch": 628} {"train_loss": -9.611006736755371, "global_step": 105560, "epoch": 628} {"train_loss": -10.037605285644531, "global_step": 105561, "epoch": 628} {"train_loss": -9.84321403503418, "global_step": 105562, "epoch": 628} {"train_loss": -9.973257064819336, "global_step": 105563, "epoch": 628} {"train_loss": -9.624568939208984, "global_step": 105564, "epoch": 628} {"train_loss": -9.90893268585205, "global_step": 105565, "epoch": 628} {"train_loss": -10.145944595336914, "global_step": 105566, "epoch": 628} {"train_loss": -9.844842910766602, "global_step": 105567, "epoch": 628} {"train_loss": -9.6539306640625, "global_step": 105568, "epoch": 628} {"train_loss": -9.890369415283203, "global_step": 105569, "epoch": 628} {"train_loss": -9.439451217651367, "global_step": 105570, "epoch": 628} {"train_loss": -9.896919250488281, "global_step": 105571, "epoch": 628} {"train_loss": -9.276391983032227, "global_step": 105572, "epoch": 628} {"train_loss": -10.021464347839355, "global_step": 105573, "epoch": 628} {"train_loss": -9.614084243774414, "global_step": 105574, "epoch": 628} {"train_loss": -10.12082576751709, "global_step": 105575, "epoch": 628} {"train_loss": -9.448362350463867, "global_step": 105576, "epoch": 628} {"train_loss": -9.948165893554688, "global_step": 105577, "epoch": 628} {"train_loss": -9.71260929107666, "global_step": 105578, "epoch": 628} {"train_loss": -9.921627044677734, "global_step": 105579, "epoch": 628} {"train_loss": -9.62930965423584, "global_step": 105580, "epoch": 628} {"train_loss": -9.704303741455078, "global_step": 105581, "epoch": 628} {"train_loss": -9.833898544311523, "global_step": 105582, "epoch": 628} {"train_loss": -9.770040512084961, "global_step": 105583, "epoch": 628} {"train_loss": -9.519453048706055, "global_step": 105584, "epoch": 628} {"train_loss": -9.878315925598145, "global_step": 105585, "epoch": 628} {"train_loss": -9.642513275146484, "global_step": 105586, "epoch": 628} {"train_loss": -9.606330871582031, "global_step": 105587, "epoch": 628} {"train_loss": -9.93086051940918, "global_step": 105588, "epoch": 628} {"train_loss": -9.688117980957031, "global_step": 105589, "epoch": 628} {"train_loss": -9.769002914428711, "global_step": 105590, "epoch": 628} {"train_loss": -9.8995361328125, "global_step": 105591, "epoch": 628} {"train_loss": -9.52310848236084, "global_step": 105592, "epoch": 628} {"train_loss": -9.951337814331055, "global_step": 105593, "epoch": 628} {"train_loss": -9.56234073638916, "global_step": 105594, "epoch": 628} {"train_loss": -9.772546768188477, "global_step": 105595, "epoch": 628} {"train_loss": -9.789770126342773, "global_step": 105596, "epoch": 628} {"train_loss": -9.758639335632324, "global_step": 105597, "epoch": 628} {"train_loss": -10.10141658782959, "global_step": 105598, "epoch": 628} {"train_loss": -9.781982421875, "global_step": 105599, "epoch": 628} {"train_loss": -9.826803207397461, "global_step": 105600, "epoch": 628} {"train_loss": -9.930778503417969, "global_step": 105601, "epoch": 628} {"train_loss": -9.899335861206055, "global_step": 105602, "epoch": 628} {"train_loss": -9.826746940612793, "global_step": 105603, "epoch": 628} {"train_loss": -9.547889709472656, "global_step": 105604, "epoch": 628} {"train_loss": -9.861173629760742, "global_step": 105605, "epoch": 628} {"train_loss": -9.867035865783691, "global_step": 105606, "epoch": 628} {"train_loss": -10.193603515625, "global_step": 105607, "epoch": 628} {"train_loss": -9.673462867736816, "global_step": 105608, "epoch": 628} {"train_loss": -10.007413864135742, "global_step": 105609, "epoch": 628} {"train_loss": -9.41079044342041, "global_step": 105610, "epoch": 628} {"train_loss": -9.672672271728516, "global_step": 105611, "epoch": 628} {"train_loss": -9.741398811340332, "global_step": 105612, "epoch": 628} {"train_loss": -9.851219177246094, "global_step": 105613, "epoch": 628} {"train_loss": -9.771035194396973, "global_step": 105614, "epoch": 628} {"train_loss": -10.00901985168457, "global_step": 105615, "epoch": 628} {"train_loss": -9.851109504699707, "global_step": 105616, "epoch": 628} {"train_loss": -9.418586730957031, "global_step": 105617, "epoch": 628} {"train_loss": -9.463750839233398, "global_step": 105618, "epoch": 628} {"train_loss": -9.56875991821289, "global_step": 105619, "epoch": 628} {"train_loss": -9.828596115112305, "global_step": 105620, "epoch": 628} {"train_loss": -10.04745864868164, "global_step": 105621, "epoch": 628} {"train_loss": -9.859527587890625, "global_step": 105622, "epoch": 628} {"train_loss": -9.759449005126953, "global_step": 105623, "epoch": 628} {"train_loss": -9.649345397949219, "global_step": 105624, "epoch": 628} {"train_loss": -9.686866760253906, "global_step": 105625, "epoch": 628} {"train_loss": -9.715153694152832, "global_step": 105626, "epoch": 628} {"train_loss": -9.707239151000977, "global_step": 105627, "epoch": 628} {"train_loss": -9.535028457641602, "global_step": 105628, "epoch": 628} {"train_loss": -9.52157974243164, "global_step": 105629, "epoch": 628} {"train_loss": -9.688506126403809, "global_step": 105630, "epoch": 628} {"train_loss": -9.682899475097656, "global_step": 105631, "epoch": 628} {"train_loss": -9.700353622436523, "global_step": 105632, "epoch": 628} {"train_loss": -9.919574737548828, "global_step": 105633, "epoch": 628} {"train_loss": -9.320639610290527, "global_step": 105634, "epoch": 628} {"train_loss": -9.83586597442627, "global_step": 105635, "epoch": 628} {"train_loss": -9.602437973022461, "global_step": 105636, "epoch": 628} {"train_loss": -9.694501876831055, "global_step": 105637, "epoch": 628} {"train_loss": -9.854279518127441, "global_step": 105638, "epoch": 628} {"train_loss": -9.616415023803711, "global_step": 105639, "epoch": 628} {"train_loss": -9.936773300170898, "global_step": 105640, "epoch": 628} {"train_loss": -9.753894805908203, "global_step": 105641, "epoch": 628} {"train_loss": -9.847567558288574, "global_step": 105642, "epoch": 628} {"train_loss": -9.425664901733398, "global_step": 105643, "epoch": 628} {"train_loss": -9.919872283935547, "global_step": 105644, "epoch": 628} {"train_loss": -9.728221893310547, "global_step": 105645, "epoch": 628} {"train_loss": -10.03342056274414, "global_step": 105646, "epoch": 628} {"train_loss": -9.76097297668457, "global_step": 105647, "epoch": 628} {"train_loss": -9.768898010253906, "global_step": 105648, "epoch": 628} {"train_loss": -9.817740440368652, "global_step": 105649, "epoch": 628} {"train_loss": -9.858158111572266, "global_step": 105650, "epoch": 628} {"train_loss": -9.83056640625, "global_step": 105651, "epoch": 628} {"train_loss": -9.624311447143555, "global_step": 105652, "epoch": 628} {"train_loss": -9.993045806884766, "global_step": 105653, "epoch": 628} {"train_loss": -9.728744506835938, "global_step": 105654, "epoch": 628} {"train_loss": -9.882902145385742, "global_step": 105655, "epoch": 628} {"train_loss": -9.663728713989258, "global_step": 105656, "epoch": 628} {"train_loss": -9.858732223510742, "global_step": 105657, "epoch": 628} {"train_loss": -10.050728797912598, "global_step": 105658, "epoch": 628} {"train_loss": -9.861968994140625, "global_step": 105659, "epoch": 628} {"train_loss": -9.95445728302002, "global_step": 105660, "epoch": 628} {"train_loss": -10.066885948181152, "global_step": 105661, "epoch": 628} {"train_loss": -9.847024917602539, "global_step": 105662, "epoch": 628} {"train_loss": -10.01976203918457, "global_step": 105663, "epoch": 628} {"train_loss": -9.784927368164062, "global_step": 105664, "epoch": 628} {"train_loss": -9.891582489013672, "global_step": 105665, "epoch": 628} {"train_loss": -9.75401782989502, "global_step": 105666, "epoch": 628} {"train_loss": -9.702569961547852, "global_step": 105667, "epoch": 628} {"train_loss": -9.962223052978516, "global_step": 105668, "epoch": 628} {"train_loss": -10.027811050415039, "global_step": 105669, "epoch": 628} {"train_loss": -9.61439323425293, "global_step": 105670, "epoch": 628} {"train_loss": -9.79085141704196, "global_step": 105671, "epoch": 628, "val_loss": 208140.90625} {"train_loss": -9.712890625, "global_step": 105672, "epoch": 629} {"train_loss": -10.104394912719727, "global_step": 105673, "epoch": 629} {"train_loss": -9.944559097290039, "global_step": 105674, "epoch": 629} {"train_loss": -9.82548999786377, "global_step": 105675, "epoch": 629} {"train_loss": -9.71270751953125, "global_step": 105676, "epoch": 629} {"train_loss": -9.934267044067383, "global_step": 105677, "epoch": 629} {"train_loss": -9.987968444824219, "global_step": 105678, "epoch": 629} {"train_loss": -9.855314254760742, "global_step": 105679, "epoch": 629} {"train_loss": -9.7501802444458, "global_step": 105680, "epoch": 629} {"train_loss": -9.917497634887695, "global_step": 105681, "epoch": 629} {"train_loss": -9.877391815185547, "global_step": 105682, "epoch": 629} {"train_loss": -10.082159042358398, "global_step": 105683, "epoch": 629} {"train_loss": -9.702356338500977, "global_step": 105684, "epoch": 629} {"train_loss": -10.000490188598633, "global_step": 105685, "epoch": 629} {"train_loss": -9.947442054748535, "global_step": 105686, "epoch": 629} {"train_loss": -10.247369766235352, "global_step": 105687, "epoch": 629} {"train_loss": -9.642071723937988, "global_step": 105688, "epoch": 629} {"train_loss": -9.8938627243042, "global_step": 105689, "epoch": 629} {"train_loss": -10.096933364868164, "global_step": 105690, "epoch": 629} {"train_loss": -9.527446746826172, "global_step": 105691, "epoch": 629} {"train_loss": -9.774235725402832, "global_step": 105692, "epoch": 629} {"train_loss": -9.863231658935547, "global_step": 105693, "epoch": 629} {"train_loss": -9.553736686706543, "global_step": 105694, "epoch": 629} {"train_loss": -9.979866027832031, "global_step": 105695, "epoch": 629} {"train_loss": -9.91225528717041, "global_step": 105696, "epoch": 629} {"train_loss": -10.16253662109375, "global_step": 105697, "epoch": 629} {"train_loss": -9.78865909576416, "global_step": 105698, "epoch": 629} {"train_loss": -9.869176864624023, "global_step": 105699, "epoch": 629} {"train_loss": -9.656606674194336, "global_step": 105700, "epoch": 629} {"train_loss": -9.806988716125488, "global_step": 105701, "epoch": 629} {"train_loss": -9.7754545211792, "global_step": 105702, "epoch": 629} {"train_loss": -9.790192604064941, "global_step": 105703, "epoch": 629} {"train_loss": -9.84323501586914, "global_step": 105704, "epoch": 629} {"train_loss": -9.977681159973145, "global_step": 105705, "epoch": 629} {"train_loss": -9.577142715454102, "global_step": 105706, "epoch": 629} {"train_loss": -9.644819259643555, "global_step": 105707, "epoch": 629} {"train_loss": -9.512144088745117, "global_step": 105708, "epoch": 629} {"train_loss": -9.31308364868164, "global_step": 105709, "epoch": 629} {"train_loss": -9.621709823608398, "global_step": 105710, "epoch": 629} {"train_loss": -9.52682876586914, "global_step": 105711, "epoch": 629} {"train_loss": -9.656322479248047, "global_step": 105712, "epoch": 629} {"train_loss": -9.612253189086914, "global_step": 105713, "epoch": 629} {"train_loss": -9.877439498901367, "global_step": 105714, "epoch": 629} {"train_loss": -9.548685073852539, "global_step": 105715, "epoch": 629} {"train_loss": -9.823993682861328, "global_step": 105716, "epoch": 629} {"train_loss": -9.817522048950195, "global_step": 105717, "epoch": 629} {"train_loss": -9.286046981811523, "global_step": 105718, "epoch": 629} {"train_loss": -9.864992141723633, "global_step": 105719, "epoch": 629} {"train_loss": -9.749054908752441, "global_step": 105720, "epoch": 629} {"train_loss": -9.870269775390625, "global_step": 105721, "epoch": 629} {"train_loss": -9.761306762695312, "global_step": 105722, "epoch": 629} {"train_loss": -9.953058242797852, "global_step": 105723, "epoch": 629} {"train_loss": -9.83694839477539, "global_step": 105724, "epoch": 629} {"train_loss": -9.902313232421875, "global_step": 105725, "epoch": 629} {"train_loss": -9.886529922485352, "global_step": 105726, "epoch": 629} {"train_loss": -9.617912292480469, "global_step": 105727, "epoch": 629} {"train_loss": -9.961771011352539, "global_step": 105728, "epoch": 629} {"train_loss": -9.935132026672363, "global_step": 105729, "epoch": 629} {"train_loss": -10.02825927734375, "global_step": 105730, "epoch": 629} {"train_loss": -9.765620231628418, "global_step": 105731, "epoch": 629} {"train_loss": -10.02252197265625, "global_step": 105732, "epoch": 629} {"train_loss": -9.800924301147461, "global_step": 105733, "epoch": 629} {"train_loss": -10.002237319946289, "global_step": 105734, "epoch": 629} {"train_loss": -10.067777633666992, "global_step": 105735, "epoch": 629} {"train_loss": -9.96664047241211, "global_step": 105736, "epoch": 629} {"train_loss": -10.229362487792969, "global_step": 105737, "epoch": 629} {"train_loss": -10.205771446228027, "global_step": 105738, "epoch": 629} {"train_loss": -10.064096450805664, "global_step": 105739, "epoch": 629} {"train_loss": -9.877593994140625, "global_step": 105740, "epoch": 629} {"train_loss": -9.985662460327148, "global_step": 105741, "epoch": 629} {"train_loss": -10.060442924499512, "global_step": 105742, "epoch": 629} {"train_loss": -9.912827491760254, "global_step": 105743, "epoch": 629} {"train_loss": -9.602749824523926, "global_step": 105744, "epoch": 629} {"train_loss": -9.582143783569336, "global_step": 105745, "epoch": 629} {"train_loss": -9.891854286193848, "global_step": 105746, "epoch": 629} {"train_loss": -9.255766868591309, "global_step": 105747, "epoch": 629} {"train_loss": -9.608777046203613, "global_step": 105748, "epoch": 629} {"train_loss": -9.471205711364746, "global_step": 105749, "epoch": 629} {"train_loss": -9.790884971618652, "global_step": 105750, "epoch": 629} {"train_loss": -9.596600532531738, "global_step": 105751, "epoch": 629} {"train_loss": -9.83898639678955, "global_step": 105752, "epoch": 629} {"train_loss": -9.643976211547852, "global_step": 105753, "epoch": 629} {"train_loss": -9.915804862976074, "global_step": 105754, "epoch": 629} {"train_loss": -9.778383255004883, "global_step": 105755, "epoch": 629} {"train_loss": -9.967964172363281, "global_step": 105756, "epoch": 629} {"train_loss": -9.677639961242676, "global_step": 105757, "epoch": 629} {"train_loss": -9.8668851852417, "global_step": 105758, "epoch": 629} {"train_loss": -9.662495613098145, "global_step": 105759, "epoch": 629} {"train_loss": -10.081913948059082, "global_step": 105760, "epoch": 629} {"train_loss": -9.564095497131348, "global_step": 105761, "epoch": 629} {"train_loss": -10.106315612792969, "global_step": 105762, "epoch": 629} {"train_loss": -9.824050903320312, "global_step": 105763, "epoch": 629} {"train_loss": -9.974630355834961, "global_step": 105764, "epoch": 629} {"train_loss": -9.664897918701172, "global_step": 105765, "epoch": 629} {"train_loss": -9.675546646118164, "global_step": 105766, "epoch": 629} {"train_loss": -10.04437255859375, "global_step": 105767, "epoch": 629} {"train_loss": -10.172740936279297, "global_step": 105768, "epoch": 629} {"train_loss": -9.958276748657227, "global_step": 105769, "epoch": 629} {"train_loss": -9.581156730651855, "global_step": 105770, "epoch": 629} {"train_loss": -9.948555946350098, "global_step": 105771, "epoch": 629} {"train_loss": -9.627341270446777, "global_step": 105772, "epoch": 629} {"train_loss": -9.877581596374512, "global_step": 105773, "epoch": 629} {"train_loss": -9.926546096801758, "global_step": 105774, "epoch": 629} {"train_loss": -9.74838924407959, "global_step": 105775, "epoch": 629} {"train_loss": -10.169742584228516, "global_step": 105776, "epoch": 629} {"train_loss": -9.728948593139648, "global_step": 105777, "epoch": 629} {"train_loss": -9.776371955871582, "global_step": 105778, "epoch": 629} {"train_loss": -9.953808784484863, "global_step": 105779, "epoch": 629} {"train_loss": -9.481730461120605, "global_step": 105780, "epoch": 629} {"train_loss": -9.708871841430664, "global_step": 105781, "epoch": 629} {"train_loss": -9.364452362060547, "global_step": 105782, "epoch": 629} {"train_loss": -9.896453857421875, "global_step": 105783, "epoch": 629} {"train_loss": -9.037904739379883, "global_step": 105784, "epoch": 629} {"train_loss": -9.90450382232666, "global_step": 105785, "epoch": 629} {"train_loss": -9.577054977416992, "global_step": 105786, "epoch": 629} {"train_loss": -9.691343307495117, "global_step": 105787, "epoch": 629} {"train_loss": -9.625638961791992, "global_step": 105788, "epoch": 629} {"train_loss": -9.553709030151367, "global_step": 105789, "epoch": 629} {"train_loss": -10.082651138305664, "global_step": 105790, "epoch": 629} {"train_loss": -9.85964584350586, "global_step": 105791, "epoch": 629} {"train_loss": -10.03508186340332, "global_step": 105792, "epoch": 629} {"train_loss": -9.63326644897461, "global_step": 105793, "epoch": 629} {"train_loss": -9.718648910522461, "global_step": 105794, "epoch": 629} {"train_loss": -9.493494987487793, "global_step": 105795, "epoch": 629} {"train_loss": -9.763540267944336, "global_step": 105796, "epoch": 629} {"train_loss": -9.572187423706055, "global_step": 105797, "epoch": 629} {"train_loss": -9.838350296020508, "global_step": 105798, "epoch": 629} {"train_loss": -9.611465454101562, "global_step": 105799, "epoch": 629} {"train_loss": -9.669078826904297, "global_step": 105800, "epoch": 629} {"train_loss": -9.929216384887695, "global_step": 105801, "epoch": 629} {"train_loss": -9.749958038330078, "global_step": 105802, "epoch": 629} {"train_loss": -9.717647552490234, "global_step": 105803, "epoch": 629} {"train_loss": -9.806801795959473, "global_step": 105804, "epoch": 629} {"train_loss": -9.734518051147461, "global_step": 105805, "epoch": 629} {"train_loss": -9.682706832885742, "global_step": 105806, "epoch": 629} {"train_loss": -9.99839973449707, "global_step": 105807, "epoch": 629} {"train_loss": -9.710484504699707, "global_step": 105808, "epoch": 629} {"train_loss": -9.538164138793945, "global_step": 105809, "epoch": 629} {"train_loss": -9.736734390258789, "global_step": 105810, "epoch": 629} {"train_loss": -9.82693099975586, "global_step": 105811, "epoch": 629} {"train_loss": -9.683613777160645, "global_step": 105812, "epoch": 629} {"train_loss": -9.916388511657715, "global_step": 105813, "epoch": 629} {"train_loss": -10.059778213500977, "global_step": 105814, "epoch": 629} {"train_loss": -9.734164237976074, "global_step": 105815, "epoch": 629} {"train_loss": -9.795726776123047, "global_step": 105816, "epoch": 629} {"train_loss": -9.86880111694336, "global_step": 105817, "epoch": 629} {"train_loss": -9.755897521972656, "global_step": 105818, "epoch": 629} {"train_loss": -9.31964111328125, "global_step": 105819, "epoch": 629} {"train_loss": -9.899751663208008, "global_step": 105820, "epoch": 629} {"train_loss": -9.408080101013184, "global_step": 105821, "epoch": 629} {"train_loss": -9.862451553344727, "global_step": 105822, "epoch": 629} {"train_loss": -9.79813003540039, "global_step": 105823, "epoch": 629} {"train_loss": -9.46252155303955, "global_step": 105824, "epoch": 629} {"train_loss": -9.706514358520508, "global_step": 105825, "epoch": 629} {"train_loss": -9.368941307067871, "global_step": 105826, "epoch": 629} {"train_loss": -9.983081817626953, "global_step": 105827, "epoch": 629} {"train_loss": -8.773725509643555, "global_step": 105828, "epoch": 629} {"train_loss": -9.94204044342041, "global_step": 105829, "epoch": 629} {"train_loss": -9.417501449584961, "global_step": 105830, "epoch": 629} {"train_loss": -9.733041763305664, "global_step": 105831, "epoch": 629} {"train_loss": -9.439984321594238, "global_step": 105832, "epoch": 629} {"train_loss": -9.262088775634766, "global_step": 105833, "epoch": 629} {"train_loss": -9.7221040725708, "global_step": 105834, "epoch": 629} {"train_loss": -9.634146690368652, "global_step": 105835, "epoch": 629} {"train_loss": -9.707688331604004, "global_step": 105836, "epoch": 629} {"train_loss": -9.970016479492188, "global_step": 105837, "epoch": 629} {"train_loss": -9.738344192504883, "global_step": 105838, "epoch": 629} {"train_loss": -9.775789777437845, "global_step": 105839, "epoch": 629, "val_loss": 208198.9375} {"train_loss": -9.677288055419922, "global_step": 105840, "epoch": 630} {"train_loss": -9.762977600097656, "global_step": 105841, "epoch": 630} {"train_loss": -9.735443115234375, "global_step": 105842, "epoch": 630} {"train_loss": -9.850189208984375, "global_step": 105843, "epoch": 630} {"train_loss": -9.984037399291992, "global_step": 105844, "epoch": 630} {"train_loss": -9.893866539001465, "global_step": 105845, "epoch": 630} {"train_loss": -9.962992668151855, "global_step": 105846, "epoch": 630} {"train_loss": -9.672775268554688, "global_step": 105847, "epoch": 630} {"train_loss": -10.061357498168945, "global_step": 105848, "epoch": 630} {"train_loss": -9.695283889770508, "global_step": 105849, "epoch": 630} {"train_loss": -10.139934539794922, "global_step": 105850, "epoch": 630} {"train_loss": -9.98325252532959, "global_step": 105851, "epoch": 630} {"train_loss": -9.858497619628906, "global_step": 105852, "epoch": 630} {"train_loss": -9.742269515991211, "global_step": 105853, "epoch": 630} {"train_loss": -9.940757751464844, "global_step": 105854, "epoch": 630} {"train_loss": -9.980165481567383, "global_step": 105855, "epoch": 630} {"train_loss": -9.968639373779297, "global_step": 105856, "epoch": 630} {"train_loss": -10.010037422180176, "global_step": 105857, "epoch": 630} {"train_loss": -9.922403335571289, "global_step": 105858, "epoch": 630} {"train_loss": -9.903450965881348, "global_step": 105859, "epoch": 630} {"train_loss": -10.026389122009277, "global_step": 105860, "epoch": 630} {"train_loss": -9.701601028442383, "global_step": 105861, "epoch": 630} {"train_loss": -9.96293830871582, "global_step": 105862, "epoch": 630} {"train_loss": -10.095379829406738, "global_step": 105863, "epoch": 630} {"train_loss": -9.817843437194824, "global_step": 105864, "epoch": 630} {"train_loss": -9.866432189941406, "global_step": 105865, "epoch": 630} {"train_loss": -10.058137893676758, "global_step": 105866, "epoch": 630} {"train_loss": -10.023908615112305, "global_step": 105867, "epoch": 630} {"train_loss": -9.851804733276367, "global_step": 105868, "epoch": 630} {"train_loss": -9.847478866577148, "global_step": 105869, "epoch": 630} {"train_loss": -9.78662395477295, "global_step": 105870, "epoch": 630} {"train_loss": -10.132209777832031, "global_step": 105871, "epoch": 630} {"train_loss": -9.65252685546875, "global_step": 105872, "epoch": 630} {"train_loss": -10.019134521484375, "global_step": 105873, "epoch": 630} {"train_loss": -9.573226928710938, "global_step": 105874, "epoch": 630} {"train_loss": -10.096735000610352, "global_step": 105875, "epoch": 630} {"train_loss": -10.014053344726562, "global_step": 105876, "epoch": 630} {"train_loss": -9.683318138122559, "global_step": 105877, "epoch": 630} {"train_loss": -9.409987449645996, "global_step": 105878, "epoch": 630} {"train_loss": -9.801578521728516, "global_step": 105879, "epoch": 630} {"train_loss": -9.419729232788086, "global_step": 105880, "epoch": 630} {"train_loss": -9.754534721374512, "global_step": 105881, "epoch": 630} {"train_loss": -9.937910079956055, "global_step": 105882, "epoch": 630} {"train_loss": -9.75172233581543, "global_step": 105883, "epoch": 630} {"train_loss": -9.857638359069824, "global_step": 105884, "epoch": 630} {"train_loss": -9.887100219726562, "global_step": 105885, "epoch": 630} {"train_loss": -10.067508697509766, "global_step": 105886, "epoch": 630} {"train_loss": -9.956087112426758, "global_step": 105887, "epoch": 630} {"train_loss": -9.830684661865234, "global_step": 105888, "epoch": 630} {"train_loss": -10.22897720336914, "global_step": 105889, "epoch": 630} {"train_loss": -9.772769927978516, "global_step": 105890, "epoch": 630} {"train_loss": -10.10871696472168, "global_step": 105891, "epoch": 630} {"train_loss": -9.929969787597656, "global_step": 105892, "epoch": 630} {"train_loss": -9.972397804260254, "global_step": 105893, "epoch": 630} {"train_loss": -9.974580764770508, "global_step": 105894, "epoch": 630} {"train_loss": -9.795552253723145, "global_step": 105895, "epoch": 630} {"train_loss": -10.201017379760742, "global_step": 105896, "epoch": 630} {"train_loss": -9.775896072387695, "global_step": 105897, "epoch": 630} {"train_loss": -9.738531112670898, "global_step": 105898, "epoch": 630} {"train_loss": -9.982333183288574, "global_step": 105899, "epoch": 630} {"train_loss": -10.095041275024414, "global_step": 105900, "epoch": 630} {"train_loss": -9.50054931640625, "global_step": 105901, "epoch": 630} {"train_loss": -9.727729797363281, "global_step": 105902, "epoch": 630} {"train_loss": -9.854455947875977, "global_step": 105903, "epoch": 630} {"train_loss": -10.14999008178711, "global_step": 105904, "epoch": 630} {"train_loss": -10.108345031738281, "global_step": 105905, "epoch": 630} {"train_loss": -9.928796768188477, "global_step": 105906, "epoch": 630} {"train_loss": -9.936983108520508, "global_step": 105907, "epoch": 630} {"train_loss": -9.385116577148438, "global_step": 105908, "epoch": 630} {"train_loss": -10.110088348388672, "global_step": 105909, "epoch": 630} {"train_loss": -9.476484298706055, "global_step": 105910, "epoch": 630} {"train_loss": -9.976534843444824, "global_step": 105911, "epoch": 630} {"train_loss": -9.85501766204834, "global_step": 105912, "epoch": 630} {"train_loss": -9.938034057617188, "global_step": 105913, "epoch": 630} {"train_loss": -9.557101249694824, "global_step": 105914, "epoch": 630} {"train_loss": -9.73049545288086, "global_step": 105915, "epoch": 630} {"train_loss": -10.030457496643066, "global_step": 105916, "epoch": 630} {"train_loss": -9.614774703979492, "global_step": 105917, "epoch": 630} {"train_loss": -9.84150218963623, "global_step": 105918, "epoch": 630} {"train_loss": -9.739013671875, "global_step": 105919, "epoch": 630} {"train_loss": -9.9252290725708, "global_step": 105920, "epoch": 630} {"train_loss": -9.882345199584961, "global_step": 105921, "epoch": 630} {"train_loss": -10.067363739013672, "global_step": 105922, "epoch": 630} {"train_loss": -9.614861488342285, "global_step": 105923, "epoch": 630} {"train_loss": -10.142372131347656, "global_step": 105924, "epoch": 630} {"train_loss": -9.973556518554688, "global_step": 105925, "epoch": 630} {"train_loss": -9.658320426940918, "global_step": 105926, "epoch": 630} {"train_loss": -10.128264427185059, "global_step": 105927, "epoch": 630} {"train_loss": -10.063191413879395, "global_step": 105928, "epoch": 630} {"train_loss": -9.99477767944336, "global_step": 105929, "epoch": 630} {"train_loss": -9.720497131347656, "global_step": 105930, "epoch": 630} {"train_loss": -10.006986618041992, "global_step": 105931, "epoch": 630} {"train_loss": -9.852924346923828, "global_step": 105932, "epoch": 630} {"train_loss": -9.503342628479004, "global_step": 105933, "epoch": 630} {"train_loss": -10.00895881652832, "global_step": 105934, "epoch": 630} {"train_loss": -9.776031494140625, "global_step": 105935, "epoch": 630} {"train_loss": -9.899654388427734, "global_step": 105936, "epoch": 630} {"train_loss": -9.711084365844727, "global_step": 105937, "epoch": 630} {"train_loss": -9.993452072143555, "global_step": 105938, "epoch": 630} {"train_loss": -9.785140991210938, "global_step": 105939, "epoch": 630} {"train_loss": -9.516176223754883, "global_step": 105940, "epoch": 630} {"train_loss": -10.038346290588379, "global_step": 105941, "epoch": 630} {"train_loss": -9.651413917541504, "global_step": 105942, "epoch": 630} {"train_loss": -9.922390937805176, "global_step": 105943, "epoch": 630} {"train_loss": -9.628393173217773, "global_step": 105944, "epoch": 630} {"train_loss": -9.854270935058594, "global_step": 105945, "epoch": 630} {"train_loss": -10.052135467529297, "global_step": 105946, "epoch": 630} {"train_loss": -9.502645492553711, "global_step": 105947, "epoch": 630} {"train_loss": -9.777131080627441, "global_step": 105948, "epoch": 630} {"train_loss": -9.54197883605957, "global_step": 105949, "epoch": 630} {"train_loss": -9.732152938842773, "global_step": 105950, "epoch": 630} {"train_loss": -9.624643325805664, "global_step": 105951, "epoch": 630} {"train_loss": -9.64028263092041, "global_step": 105952, "epoch": 630} {"train_loss": -9.636280059814453, "global_step": 105953, "epoch": 630} {"train_loss": -9.581887245178223, "global_step": 105954, "epoch": 630} {"train_loss": -9.759557723999023, "global_step": 105955, "epoch": 630} {"train_loss": -9.652802467346191, "global_step": 105956, "epoch": 630} {"train_loss": -9.836593627929688, "global_step": 105957, "epoch": 630} {"train_loss": -9.775731086730957, "global_step": 105958, "epoch": 630} {"train_loss": -10.04379940032959, "global_step": 105959, "epoch": 630} {"train_loss": -9.684008598327637, "global_step": 105960, "epoch": 630} {"train_loss": -10.07217788696289, "global_step": 105961, "epoch": 630} {"train_loss": -9.675724029541016, "global_step": 105962, "epoch": 630} {"train_loss": -9.780248641967773, "global_step": 105963, "epoch": 630} {"train_loss": -9.931279182434082, "global_step": 105964, "epoch": 630} {"train_loss": -9.899105072021484, "global_step": 105965, "epoch": 630} {"train_loss": -9.437868118286133, "global_step": 105966, "epoch": 630} {"train_loss": -10.146384239196777, "global_step": 105967, "epoch": 630} {"train_loss": -9.416830062866211, "global_step": 105968, "epoch": 630} {"train_loss": -9.710039138793945, "global_step": 105969, "epoch": 630} {"train_loss": -9.598801612854004, "global_step": 105970, "epoch": 630} {"train_loss": -9.833306312561035, "global_step": 105971, "epoch": 630} {"train_loss": -9.628107070922852, "global_step": 105972, "epoch": 630} {"train_loss": -9.642692565917969, "global_step": 105973, "epoch": 630} {"train_loss": -9.822994232177734, "global_step": 105974, "epoch": 630} {"train_loss": -9.613121032714844, "global_step": 105975, "epoch": 630} {"train_loss": -9.69922924041748, "global_step": 105976, "epoch": 630} {"train_loss": -9.995012283325195, "global_step": 105977, "epoch": 630} {"train_loss": -10.034024238586426, "global_step": 105978, "epoch": 630} {"train_loss": -9.97462272644043, "global_step": 105979, "epoch": 630} {"train_loss": -10.047861099243164, "global_step": 105980, "epoch": 630} {"train_loss": -10.008018493652344, "global_step": 105981, "epoch": 630} {"train_loss": -9.71033763885498, "global_step": 105982, "epoch": 630} {"train_loss": -9.938525199890137, "global_step": 105983, "epoch": 630} {"train_loss": -9.759101867675781, "global_step": 105984, "epoch": 630} {"train_loss": -9.810215950012207, "global_step": 105985, "epoch": 630} {"train_loss": -10.0960693359375, "global_step": 105986, "epoch": 630} {"train_loss": -9.984914779663086, "global_step": 105987, "epoch": 630} {"train_loss": -10.145726203918457, "global_step": 105988, "epoch": 630} {"train_loss": -9.590871810913086, "global_step": 105989, "epoch": 630} {"train_loss": -10.064332008361816, "global_step": 105990, "epoch": 630} {"train_loss": -9.460472106933594, "global_step": 105991, "epoch": 630} {"train_loss": -10.073172569274902, "global_step": 105992, "epoch": 630} {"train_loss": -9.594512939453125, "global_step": 105993, "epoch": 630} {"train_loss": -10.133593559265137, "global_step": 105994, "epoch": 630} {"train_loss": -9.587993621826172, "global_step": 105995, "epoch": 630} {"train_loss": -10.081130981445312, "global_step": 105996, "epoch": 630} {"train_loss": -9.532143592834473, "global_step": 105997, "epoch": 630} {"train_loss": -9.999561309814453, "global_step": 105998, "epoch": 630} {"train_loss": -9.798585891723633, "global_step": 105999, "epoch": 630} {"train_loss": -9.759403228759766, "global_step": 106000, "epoch": 630} {"train_loss": -9.478368759155273, "global_step": 106001, "epoch": 630} {"train_loss": -9.855659484863281, "global_step": 106002, "epoch": 630} {"train_loss": -9.524542808532715, "global_step": 106003, "epoch": 630} {"train_loss": -9.846142768859863, "global_step": 106004, "epoch": 630} {"train_loss": -9.771352767944336, "global_step": 106005, "epoch": 630} {"train_loss": -9.446891784667969, "global_step": 106006, "epoch": 630} {"train_loss": -9.838239232699076, "global_step": 106007, "epoch": 630, "val_loss": 208753.59375, "train_action_mse_error": 4.359128952026367} {"train_loss": -9.626152992248535, "global_step": 106008, "epoch": 631} {"train_loss": -9.868989944458008, "global_step": 106009, "epoch": 631} {"train_loss": -9.581987380981445, "global_step": 106010, "epoch": 631} {"train_loss": -9.775688171386719, "global_step": 106011, "epoch": 631} {"train_loss": -9.701238632202148, "global_step": 106012, "epoch": 631} {"train_loss": -9.842667579650879, "global_step": 106013, "epoch": 631} {"train_loss": -9.95498275756836, "global_step": 106014, "epoch": 631} {"train_loss": -10.19085693359375, "global_step": 106015, "epoch": 631} {"train_loss": -9.927903175354004, "global_step": 106016, "epoch": 631} {"train_loss": -9.855524063110352, "global_step": 106017, "epoch": 631} {"train_loss": -10.008328437805176, "global_step": 106018, "epoch": 631} {"train_loss": -10.022418975830078, "global_step": 106019, "epoch": 631} {"train_loss": -9.99394416809082, "global_step": 106020, "epoch": 631} {"train_loss": -9.96235466003418, "global_step": 106021, "epoch": 631} {"train_loss": -10.07418441772461, "global_step": 106022, "epoch": 631} {"train_loss": -10.010226249694824, "global_step": 106023, "epoch": 631} {"train_loss": -10.168756484985352, "global_step": 106024, "epoch": 631} {"train_loss": -10.061118125915527, "global_step": 106025, "epoch": 631} {"train_loss": -9.606918334960938, "global_step": 106026, "epoch": 631} {"train_loss": -10.071950912475586, "global_step": 106027, "epoch": 631} {"train_loss": -9.655524253845215, "global_step": 106028, "epoch": 631} {"train_loss": -9.835421562194824, "global_step": 106029, "epoch": 631} {"train_loss": -10.10245418548584, "global_step": 106030, "epoch": 631} {"train_loss": -9.799125671386719, "global_step": 106031, "epoch": 631} {"train_loss": -10.043905258178711, "global_step": 106032, "epoch": 631} {"train_loss": -9.927789688110352, "global_step": 106033, "epoch": 631} {"train_loss": -9.971692085266113, "global_step": 106034, "epoch": 631} {"train_loss": -9.899981498718262, "global_step": 106035, "epoch": 631} {"train_loss": -9.813457489013672, "global_step": 106036, "epoch": 631} {"train_loss": -10.108417510986328, "global_step": 106037, "epoch": 631} {"train_loss": -9.735193252563477, "global_step": 106038, "epoch": 631} {"train_loss": -10.194229125976562, "global_step": 106039, "epoch": 631} {"train_loss": -9.977689743041992, "global_step": 106040, "epoch": 631} {"train_loss": -9.923836708068848, "global_step": 106041, "epoch": 631} {"train_loss": -9.86546516418457, "global_step": 106042, "epoch": 631} {"train_loss": -10.000499725341797, "global_step": 106043, "epoch": 631} {"train_loss": -9.907953262329102, "global_step": 106044, "epoch": 631} {"train_loss": -9.963875770568848, "global_step": 106045, "epoch": 631} {"train_loss": -9.741618156433105, "global_step": 106046, "epoch": 631} {"train_loss": -9.473465919494629, "global_step": 106047, "epoch": 631} {"train_loss": -9.342737197875977, "global_step": 106048, "epoch": 631} {"train_loss": -9.65367317199707, "global_step": 106049, "epoch": 631} {"train_loss": -9.716452598571777, "global_step": 106050, "epoch": 631} {"train_loss": -9.647872924804688, "global_step": 106051, "epoch": 631} {"train_loss": -9.61657428741455, "global_step": 106052, "epoch": 631} {"train_loss": -9.430730819702148, "global_step": 106053, "epoch": 631} {"train_loss": -9.446057319641113, "global_step": 106054, "epoch": 631} {"train_loss": -9.433952331542969, "global_step": 106055, "epoch": 631} {"train_loss": -9.427175521850586, "global_step": 106056, "epoch": 631} {"train_loss": -9.107381820678711, "global_step": 106057, "epoch": 631} {"train_loss": -9.680451393127441, "global_step": 106058, "epoch": 631} {"train_loss": -9.597314834594727, "global_step": 106059, "epoch": 631} {"train_loss": -9.920278549194336, "global_step": 106060, "epoch": 631} {"train_loss": -9.718725204467773, "global_step": 106061, "epoch": 631} {"train_loss": -9.408452987670898, "global_step": 106062, "epoch": 631} {"train_loss": -9.860635757446289, "global_step": 106063, "epoch": 631} {"train_loss": -9.399813652038574, "global_step": 106064, "epoch": 631} {"train_loss": -9.851000785827637, "global_step": 106065, "epoch": 631} {"train_loss": -9.522613525390625, "global_step": 106066, "epoch": 631} {"train_loss": -9.766180038452148, "global_step": 106067, "epoch": 631} {"train_loss": -9.535605430603027, "global_step": 106068, "epoch": 631} {"train_loss": -9.794417381286621, "global_step": 106069, "epoch": 631} {"train_loss": -9.405835151672363, "global_step": 106070, "epoch": 631} {"train_loss": -9.971996307373047, "global_step": 106071, "epoch": 631} {"train_loss": -9.883686065673828, "global_step": 106072, "epoch": 631} {"train_loss": -9.804954528808594, "global_step": 106073, "epoch": 631} {"train_loss": -9.809349060058594, "global_step": 106074, "epoch": 631} {"train_loss": -9.767311096191406, "global_step": 106075, "epoch": 631} {"train_loss": -9.783215522766113, "global_step": 106076, "epoch": 631} {"train_loss": -9.953312873840332, "global_step": 106077, "epoch": 631} {"train_loss": -9.698942184448242, "global_step": 106078, "epoch": 631} {"train_loss": -9.869808197021484, "global_step": 106079, "epoch": 631} {"train_loss": -9.851375579833984, "global_step": 106080, "epoch": 631} {"train_loss": -9.819456100463867, "global_step": 106081, "epoch": 631} {"train_loss": -9.67500114440918, "global_step": 106082, "epoch": 631} {"train_loss": -10.009698867797852, "global_step": 106083, "epoch": 631} {"train_loss": -9.807059288024902, "global_step": 106084, "epoch": 631} {"train_loss": -9.923185348510742, "global_step": 106085, "epoch": 631} {"train_loss": -9.695930480957031, "global_step": 106086, "epoch": 631} {"train_loss": -9.762086868286133, "global_step": 106087, "epoch": 631} {"train_loss": -9.638781547546387, "global_step": 106088, "epoch": 631} {"train_loss": -9.488754272460938, "global_step": 106089, "epoch": 631} {"train_loss": -9.578039169311523, "global_step": 106090, "epoch": 631} {"train_loss": -9.434452056884766, "global_step": 106091, "epoch": 631} {"train_loss": -9.659399032592773, "global_step": 106092, "epoch": 631} {"train_loss": -9.784364700317383, "global_step": 106093, "epoch": 631} {"train_loss": -9.502748489379883, "global_step": 106094, "epoch": 631} {"train_loss": -9.576156616210938, "global_step": 106095, "epoch": 631} {"train_loss": -9.839942932128906, "global_step": 106096, "epoch": 631} {"train_loss": -9.66980266571045, "global_step": 106097, "epoch": 631} {"train_loss": -9.890657424926758, "global_step": 106098, "epoch": 631} {"train_loss": -9.907405853271484, "global_step": 106099, "epoch": 631} {"train_loss": -9.524134635925293, "global_step": 106100, "epoch": 631} {"train_loss": -9.912407875061035, "global_step": 106101, "epoch": 631} {"train_loss": -9.593057632446289, "global_step": 106102, "epoch": 631} {"train_loss": -9.613868713378906, "global_step": 106103, "epoch": 631} {"train_loss": -9.913737297058105, "global_step": 106104, "epoch": 631} {"train_loss": -9.562580108642578, "global_step": 106105, "epoch": 631} {"train_loss": -9.806968688964844, "global_step": 106106, "epoch": 631} {"train_loss": -9.786693572998047, "global_step": 106107, "epoch": 631} {"train_loss": -9.895051956176758, "global_step": 106108, "epoch": 631} {"train_loss": -9.880756378173828, "global_step": 106109, "epoch": 631} {"train_loss": -10.043220520019531, "global_step": 106110, "epoch": 631} {"train_loss": -10.10173511505127, "global_step": 106111, "epoch": 631} {"train_loss": -9.965682029724121, "global_step": 106112, "epoch": 631} {"train_loss": -9.966619491577148, "global_step": 106113, "epoch": 631} {"train_loss": -9.980957984924316, "global_step": 106114, "epoch": 631} {"train_loss": -10.037487983703613, "global_step": 106115, "epoch": 631} {"train_loss": -9.982551574707031, "global_step": 106116, "epoch": 631} {"train_loss": -9.86531925201416, "global_step": 106117, "epoch": 631} {"train_loss": -10.232827186584473, "global_step": 106118, "epoch": 631} {"train_loss": -9.974058151245117, "global_step": 106119, "epoch": 631} {"train_loss": -9.9583740234375, "global_step": 106120, "epoch": 631} {"train_loss": -10.016343116760254, "global_step": 106121, "epoch": 631} {"train_loss": -10.148519515991211, "global_step": 106122, "epoch": 631} {"train_loss": -10.098847389221191, "global_step": 106123, "epoch": 631} {"train_loss": -9.755899429321289, "global_step": 106124, "epoch": 631} {"train_loss": -10.02249813079834, "global_step": 106125, "epoch": 631} {"train_loss": -9.559770584106445, "global_step": 106126, "epoch": 631} {"train_loss": -9.786174774169922, "global_step": 106127, "epoch": 631} {"train_loss": -9.59681224822998, "global_step": 106128, "epoch": 631} {"train_loss": -9.451081275939941, "global_step": 106129, "epoch": 631} {"train_loss": -9.614523887634277, "global_step": 106130, "epoch": 631} {"train_loss": -9.363670349121094, "global_step": 106131, "epoch": 631} {"train_loss": -9.577064514160156, "global_step": 106132, "epoch": 631} {"train_loss": -9.50990104675293, "global_step": 106133, "epoch": 631} {"train_loss": -9.74169921875, "global_step": 106134, "epoch": 631} {"train_loss": -9.50584888458252, "global_step": 106135, "epoch": 631} {"train_loss": -9.882160186767578, "global_step": 106136, "epoch": 631} {"train_loss": -9.768350601196289, "global_step": 106137, "epoch": 631} {"train_loss": -9.812762260437012, "global_step": 106138, "epoch": 631} {"train_loss": -9.603349685668945, "global_step": 106139, "epoch": 631} {"train_loss": -9.791688919067383, "global_step": 106140, "epoch": 631} {"train_loss": -9.525304794311523, "global_step": 106141, "epoch": 631} {"train_loss": -9.484811782836914, "global_step": 106142, "epoch": 631} {"train_loss": -9.569177627563477, "global_step": 106143, "epoch": 631} {"train_loss": -9.701057434082031, "global_step": 106144, "epoch": 631} {"train_loss": -9.557825088500977, "global_step": 106145, "epoch": 631} {"train_loss": -9.636603355407715, "global_step": 106146, "epoch": 631} {"train_loss": -9.924371719360352, "global_step": 106147, "epoch": 631} {"train_loss": -9.683067321777344, "global_step": 106148, "epoch": 631} {"train_loss": -9.912016868591309, "global_step": 106149, "epoch": 631} {"train_loss": -9.857004165649414, "global_step": 106150, "epoch": 631} {"train_loss": -9.958063125610352, "global_step": 106151, "epoch": 631} {"train_loss": -9.832809448242188, "global_step": 106152, "epoch": 631} {"train_loss": -9.906038284301758, "global_step": 106153, "epoch": 631} {"train_loss": -9.911514282226562, "global_step": 106154, "epoch": 631} {"train_loss": -9.954968452453613, "global_step": 106155, "epoch": 631} {"train_loss": -9.859803199768066, "global_step": 106156, "epoch": 631} {"train_loss": -9.985137939453125, "global_step": 106157, "epoch": 631} {"train_loss": -9.935638427734375, "global_step": 106158, "epoch": 631} {"train_loss": -10.312055587768555, "global_step": 106159, "epoch": 631} {"train_loss": -9.899147033691406, "global_step": 106160, "epoch": 631} {"train_loss": -10.058842658996582, "global_step": 106161, "epoch": 631} {"train_loss": -9.841180801391602, "global_step": 106162, "epoch": 631} {"train_loss": -9.945919036865234, "global_step": 106163, "epoch": 631} {"train_loss": -9.919696807861328, "global_step": 106164, "epoch": 631} {"train_loss": -9.848184585571289, "global_step": 106165, "epoch": 631} {"train_loss": -9.911225318908691, "global_step": 106166, "epoch": 631} {"train_loss": -9.75894832611084, "global_step": 106167, "epoch": 631} {"train_loss": -9.912178039550781, "global_step": 106168, "epoch": 631} {"train_loss": -9.893190383911133, "global_step": 106169, "epoch": 631} {"train_loss": -9.742958068847656, "global_step": 106170, "epoch": 631} {"train_loss": -9.867950439453125, "global_step": 106171, "epoch": 631} {"train_loss": -9.895440101623535, "global_step": 106172, "epoch": 631} {"train_loss": -9.682910919189453, "global_step": 106173, "epoch": 631} {"train_loss": -10.070724487304688, "global_step": 106174, "epoch": 631} {"train_loss": -9.797534914243789, "global_step": 106175, "epoch": 631, "val_loss": 207526.8125} {"train_loss": -9.623956680297852, "global_step": 106176, "epoch": 632} {"train_loss": -9.771141052246094, "global_step": 106177, "epoch": 632} {"train_loss": -9.482401847839355, "global_step": 106178, "epoch": 632} {"train_loss": -9.993016242980957, "global_step": 106179, "epoch": 632} {"train_loss": -9.939840316772461, "global_step": 106180, "epoch": 632} {"train_loss": -9.877639770507812, "global_step": 106181, "epoch": 632} {"train_loss": -9.650154113769531, "global_step": 106182, "epoch": 632} {"train_loss": -9.87501335144043, "global_step": 106183, "epoch": 632} {"train_loss": -9.878843307495117, "global_step": 106184, "epoch": 632} {"train_loss": -9.592483520507812, "global_step": 106185, "epoch": 632} {"train_loss": -9.63040828704834, "global_step": 106186, "epoch": 632} {"train_loss": -9.835748672485352, "global_step": 106187, "epoch": 632} {"train_loss": -9.697972297668457, "global_step": 106188, "epoch": 632} {"train_loss": -9.85571575164795, "global_step": 106189, "epoch": 632} {"train_loss": -10.05813980102539, "global_step": 106190, "epoch": 632} {"train_loss": -9.913328170776367, "global_step": 106191, "epoch": 632} {"train_loss": -9.870108604431152, "global_step": 106192, "epoch": 632} {"train_loss": -9.966653823852539, "global_step": 106193, "epoch": 632} {"train_loss": -9.997166633605957, "global_step": 106194, "epoch": 632} {"train_loss": -9.907590866088867, "global_step": 106195, "epoch": 632} {"train_loss": -9.56975269317627, "global_step": 106196, "epoch": 632} {"train_loss": -9.849493026733398, "global_step": 106197, "epoch": 632} {"train_loss": -9.884909629821777, "global_step": 106198, "epoch": 632} {"train_loss": -9.905430793762207, "global_step": 106199, "epoch": 632} {"train_loss": -9.41262149810791, "global_step": 106200, "epoch": 632} {"train_loss": -9.89295768737793, "global_step": 106201, "epoch": 632} {"train_loss": -9.719978332519531, "global_step": 106202, "epoch": 632} {"train_loss": -9.874813079833984, "global_step": 106203, "epoch": 632} {"train_loss": -9.445879936218262, "global_step": 106204, "epoch": 632} {"train_loss": -10.16904067993164, "global_step": 106205, "epoch": 632} {"train_loss": -9.707778930664062, "global_step": 106206, "epoch": 632} {"train_loss": -9.88060188293457, "global_step": 106207, "epoch": 632} {"train_loss": -9.783897399902344, "global_step": 106208, "epoch": 632} {"train_loss": -9.91425895690918, "global_step": 106209, "epoch": 632} {"train_loss": -9.871622085571289, "global_step": 106210, "epoch": 632} {"train_loss": -9.84689998626709, "global_step": 106211, "epoch": 632} {"train_loss": -9.789063453674316, "global_step": 106212, "epoch": 632} {"train_loss": -9.752771377563477, "global_step": 106213, "epoch": 632} {"train_loss": -9.85843276977539, "global_step": 106214, "epoch": 632} {"train_loss": -9.970588684082031, "global_step": 106215, "epoch": 632} {"train_loss": -10.024173736572266, "global_step": 106216, "epoch": 632} {"train_loss": -9.436271667480469, "global_step": 106217, "epoch": 632} {"train_loss": -9.866936683654785, "global_step": 106218, "epoch": 632} {"train_loss": -9.917257308959961, "global_step": 106219, "epoch": 632} {"train_loss": -9.843560218811035, "global_step": 106220, "epoch": 632} {"train_loss": -9.823267936706543, "global_step": 106221, "epoch": 632} {"train_loss": -9.925886154174805, "global_step": 106222, "epoch": 632} {"train_loss": -9.838315963745117, "global_step": 106223, "epoch": 632} {"train_loss": -9.619678497314453, "global_step": 106224, "epoch": 632} {"train_loss": -9.704690933227539, "global_step": 106225, "epoch": 632} {"train_loss": -9.652311325073242, "global_step": 106226, "epoch": 632} {"train_loss": -9.814939498901367, "global_step": 106227, "epoch": 632} {"train_loss": -9.934429168701172, "global_step": 106228, "epoch": 632} {"train_loss": -9.203384399414062, "global_step": 106229, "epoch": 632} {"train_loss": -9.990363121032715, "global_step": 106230, "epoch": 632} {"train_loss": -9.675100326538086, "global_step": 106231, "epoch": 632} {"train_loss": -9.78708267211914, "global_step": 106232, "epoch": 632} {"train_loss": -9.572307586669922, "global_step": 106233, "epoch": 632} {"train_loss": -9.668251037597656, "global_step": 106234, "epoch": 632} {"train_loss": -9.646927833557129, "global_step": 106235, "epoch": 632} {"train_loss": -9.922807693481445, "global_step": 106236, "epoch": 632} {"train_loss": -9.605775833129883, "global_step": 106237, "epoch": 632} {"train_loss": -9.91169548034668, "global_step": 106238, "epoch": 632} {"train_loss": -9.679221153259277, "global_step": 106239, "epoch": 632} {"train_loss": -10.047296524047852, "global_step": 106240, "epoch": 632} {"train_loss": -9.86741828918457, "global_step": 106241, "epoch": 632} {"train_loss": -9.884767532348633, "global_step": 106242, "epoch": 632} {"train_loss": -9.717236518859863, "global_step": 106243, "epoch": 632} {"train_loss": -9.675081253051758, "global_step": 106244, "epoch": 632} {"train_loss": -9.975479125976562, "global_step": 106245, "epoch": 632} {"train_loss": -10.072461128234863, "global_step": 106246, "epoch": 632} {"train_loss": -9.741283416748047, "global_step": 106247, "epoch": 632} {"train_loss": -9.82040786743164, "global_step": 106248, "epoch": 632} {"train_loss": -9.919580459594727, "global_step": 106249, "epoch": 632} {"train_loss": -9.812755584716797, "global_step": 106250, "epoch": 632} {"train_loss": -9.991631507873535, "global_step": 106251, "epoch": 632} {"train_loss": -9.906299591064453, "global_step": 106252, "epoch": 632} {"train_loss": -9.66193962097168, "global_step": 106253, "epoch": 632} {"train_loss": -9.9186429977417, "global_step": 106254, "epoch": 632} {"train_loss": -9.831306457519531, "global_step": 106255, "epoch": 632} {"train_loss": -9.859973907470703, "global_step": 106256, "epoch": 632} {"train_loss": -10.047719955444336, "global_step": 106257, "epoch": 632} {"train_loss": -9.834295272827148, "global_step": 106258, "epoch": 632} {"train_loss": -10.02415657043457, "global_step": 106259, "epoch": 632} {"train_loss": -10.068735122680664, "global_step": 106260, "epoch": 632} {"train_loss": -10.064606666564941, "global_step": 106261, "epoch": 632} {"train_loss": -9.981689453125, "global_step": 106262, "epoch": 632} {"train_loss": -9.997529983520508, "global_step": 106263, "epoch": 632} {"train_loss": -9.755783081054688, "global_step": 106264, "epoch": 632} {"train_loss": -10.121803283691406, "global_step": 106265, "epoch": 632} {"train_loss": -10.045602798461914, "global_step": 106266, "epoch": 632} {"train_loss": -9.830289840698242, "global_step": 106267, "epoch": 632} {"train_loss": -9.936976432800293, "global_step": 106268, "epoch": 632} {"train_loss": -9.912307739257812, "global_step": 106269, "epoch": 632} {"train_loss": -9.943939208984375, "global_step": 106270, "epoch": 632} {"train_loss": -9.94935417175293, "global_step": 106271, "epoch": 632} {"train_loss": -9.79642105102539, "global_step": 106272, "epoch": 632} {"train_loss": -9.90064811706543, "global_step": 106273, "epoch": 632} {"train_loss": -9.72333812713623, "global_step": 106274, "epoch": 632} {"train_loss": -9.985234260559082, "global_step": 106275, "epoch": 632} {"train_loss": -10.165879249572754, "global_step": 106276, "epoch": 632} {"train_loss": -9.468976974487305, "global_step": 106277, "epoch": 632} {"train_loss": -9.908770561218262, "global_step": 106278, "epoch": 632} {"train_loss": -9.862224578857422, "global_step": 106279, "epoch": 632} {"train_loss": -9.897956848144531, "global_step": 106280, "epoch": 632} {"train_loss": -10.094820976257324, "global_step": 106281, "epoch": 632} {"train_loss": -9.926427841186523, "global_step": 106282, "epoch": 632} {"train_loss": -10.001252174377441, "global_step": 106283, "epoch": 632} {"train_loss": -9.948705673217773, "global_step": 106284, "epoch": 632} {"train_loss": -9.818065643310547, "global_step": 106285, "epoch": 632} {"train_loss": -9.886014938354492, "global_step": 106286, "epoch": 632} {"train_loss": -10.036147117614746, "global_step": 106287, "epoch": 632} {"train_loss": -9.848926544189453, "global_step": 106288, "epoch": 632} {"train_loss": -10.080998420715332, "global_step": 106289, "epoch": 632} {"train_loss": -9.859649658203125, "global_step": 106290, "epoch": 632} {"train_loss": -9.790107727050781, "global_step": 106291, "epoch": 632} {"train_loss": -9.896705627441406, "global_step": 106292, "epoch": 632} {"train_loss": -9.380126953125, "global_step": 106293, "epoch": 632} {"train_loss": -10.071527481079102, "global_step": 106294, "epoch": 632} {"train_loss": -9.752013206481934, "global_step": 106295, "epoch": 632} {"train_loss": -9.945457458496094, "global_step": 106296, "epoch": 632} {"train_loss": -9.632367134094238, "global_step": 106297, "epoch": 632} {"train_loss": -10.046409606933594, "global_step": 106298, "epoch": 632} {"train_loss": -9.125907897949219, "global_step": 106299, "epoch": 632} {"train_loss": -10.046198844909668, "global_step": 106300, "epoch": 632} {"train_loss": -9.508438110351562, "global_step": 106301, "epoch": 632} {"train_loss": -10.160558700561523, "global_step": 106302, "epoch": 632} {"train_loss": -9.627424240112305, "global_step": 106303, "epoch": 632} {"train_loss": -9.9989595413208, "global_step": 106304, "epoch": 632} {"train_loss": -9.921830177307129, "global_step": 106305, "epoch": 632} {"train_loss": -10.026820182800293, "global_step": 106306, "epoch": 632} {"train_loss": -9.683456420898438, "global_step": 106307, "epoch": 632} {"train_loss": -9.998675346374512, "global_step": 106308, "epoch": 632} {"train_loss": -9.53890323638916, "global_step": 106309, "epoch": 632} {"train_loss": -9.850667953491211, "global_step": 106310, "epoch": 632} {"train_loss": -9.573984146118164, "global_step": 106311, "epoch": 632} {"train_loss": -9.816031455993652, "global_step": 106312, "epoch": 632} {"train_loss": -9.766557693481445, "global_step": 106313, "epoch": 632} {"train_loss": -9.589086532592773, "global_step": 106314, "epoch": 632} {"train_loss": -9.980667114257812, "global_step": 106315, "epoch": 632} {"train_loss": -9.634149551391602, "global_step": 106316, "epoch": 632} {"train_loss": -9.812251091003418, "global_step": 106317, "epoch": 632} {"train_loss": -9.842782974243164, "global_step": 106318, "epoch": 632} {"train_loss": -9.420225143432617, "global_step": 106319, "epoch": 632} {"train_loss": -9.59931468963623, "global_step": 106320, "epoch": 632} {"train_loss": -9.837562561035156, "global_step": 106321, "epoch": 632} {"train_loss": -9.860841751098633, "global_step": 106322, "epoch": 632} {"train_loss": -9.590473175048828, "global_step": 106323, "epoch": 632} {"train_loss": -9.601919174194336, "global_step": 106324, "epoch": 632} {"train_loss": -9.7962646484375, "global_step": 106325, "epoch": 632} {"train_loss": -9.664529800415039, "global_step": 106326, "epoch": 632} {"train_loss": -9.662406921386719, "global_step": 106327, "epoch": 632} {"train_loss": -9.574012756347656, "global_step": 106328, "epoch": 632} {"train_loss": -9.955333709716797, "global_step": 106329, "epoch": 632} {"train_loss": -9.480199813842773, "global_step": 106330, "epoch": 632} {"train_loss": -9.632589340209961, "global_step": 106331, "epoch": 632} {"train_loss": -9.817750930786133, "global_step": 106332, "epoch": 632} {"train_loss": -9.820249557495117, "global_step": 106333, "epoch": 632} {"train_loss": -9.764892578125, "global_step": 106334, "epoch": 632} {"train_loss": -9.990373611450195, "global_step": 106335, "epoch": 632} {"train_loss": -9.958808898925781, "global_step": 106336, "epoch": 632} {"train_loss": -10.052785873413086, "global_step": 106337, "epoch": 632} {"train_loss": -9.558160781860352, "global_step": 106338, "epoch": 632} {"train_loss": -9.975723266601562, "global_step": 106339, "epoch": 632} {"train_loss": -9.583274841308594, "global_step": 106340, "epoch": 632} {"train_loss": -9.843866348266602, "global_step": 106341, "epoch": 632} {"train_loss": -9.912954330444336, "global_step": 106342, "epoch": 632} {"train_loss": -9.821153368268694, "global_step": 106343, "epoch": 632, "val_loss": 207462.25} {"train_loss": -9.819160461425781, "global_step": 106344, "epoch": 633} {"train_loss": -10.030647277832031, "global_step": 106345, "epoch": 633} {"train_loss": -9.941855430603027, "global_step": 106346, "epoch": 633} {"train_loss": -9.777891159057617, "global_step": 106347, "epoch": 633} {"train_loss": -9.860044479370117, "global_step": 106348, "epoch": 633} {"train_loss": -9.897392272949219, "global_step": 106349, "epoch": 633} {"train_loss": -10.011205673217773, "global_step": 106350, "epoch": 633} {"train_loss": -9.825533866882324, "global_step": 106351, "epoch": 633} {"train_loss": -9.920282363891602, "global_step": 106352, "epoch": 633} {"train_loss": -9.751697540283203, "global_step": 106353, "epoch": 633} {"train_loss": -9.859675407409668, "global_step": 106354, "epoch": 633} {"train_loss": -9.77647590637207, "global_step": 106355, "epoch": 633} {"train_loss": -10.033491134643555, "global_step": 106356, "epoch": 633} {"train_loss": -9.866935729980469, "global_step": 106357, "epoch": 633} {"train_loss": -9.930181503295898, "global_step": 106358, "epoch": 633} {"train_loss": -9.778398513793945, "global_step": 106359, "epoch": 633} {"train_loss": -10.244365692138672, "global_step": 106360, "epoch": 633} {"train_loss": -9.75054931640625, "global_step": 106361, "epoch": 633} {"train_loss": -9.861568450927734, "global_step": 106362, "epoch": 633} {"train_loss": -10.112781524658203, "global_step": 106363, "epoch": 633} {"train_loss": -9.976028442382812, "global_step": 106364, "epoch": 633} {"train_loss": -10.054872512817383, "global_step": 106365, "epoch": 633} {"train_loss": -9.995010375976562, "global_step": 106366, "epoch": 633} {"train_loss": -9.645174026489258, "global_step": 106367, "epoch": 633} {"train_loss": -9.926525115966797, "global_step": 106368, "epoch": 633} {"train_loss": -9.712850570678711, "global_step": 106369, "epoch": 633} {"train_loss": -9.963451385498047, "global_step": 106370, "epoch": 633} {"train_loss": -9.877554893493652, "global_step": 106371, "epoch": 633} {"train_loss": -9.918502807617188, "global_step": 106372, "epoch": 633} {"train_loss": -10.025293350219727, "global_step": 106373, "epoch": 633} {"train_loss": -9.996386528015137, "global_step": 106374, "epoch": 633} {"train_loss": -10.045215606689453, "global_step": 106375, "epoch": 633} {"train_loss": -10.045928001403809, "global_step": 106376, "epoch": 633} {"train_loss": -9.921871185302734, "global_step": 106377, "epoch": 633} {"train_loss": -9.950239181518555, "global_step": 106378, "epoch": 633} {"train_loss": -9.794364929199219, "global_step": 106379, "epoch": 633} {"train_loss": -10.235661506652832, "global_step": 106380, "epoch": 633} {"train_loss": -9.977136611938477, "global_step": 106381, "epoch": 633} {"train_loss": -10.003424644470215, "global_step": 106382, "epoch": 633} {"train_loss": -10.070372581481934, "global_step": 106383, "epoch": 633} {"train_loss": -9.835394859313965, "global_step": 106384, "epoch": 633} {"train_loss": -10.191463470458984, "global_step": 106385, "epoch": 633} {"train_loss": -10.014457702636719, "global_step": 106386, "epoch": 633} {"train_loss": -9.977630615234375, "global_step": 106387, "epoch": 633} {"train_loss": -10.176114082336426, "global_step": 106388, "epoch": 633} {"train_loss": -10.029045104980469, "global_step": 106389, "epoch": 633} {"train_loss": -10.139039993286133, "global_step": 106390, "epoch": 633} {"train_loss": -10.094573974609375, "global_step": 106391, "epoch": 633} {"train_loss": -9.481371879577637, "global_step": 106392, "epoch": 633} {"train_loss": -9.894155502319336, "global_step": 106393, "epoch": 633} {"train_loss": -9.834518432617188, "global_step": 106394, "epoch": 633} {"train_loss": -9.683887481689453, "global_step": 106395, "epoch": 633} {"train_loss": -9.878801345825195, "global_step": 106396, "epoch": 633} {"train_loss": -9.927995681762695, "global_step": 106397, "epoch": 633} {"train_loss": -9.907654762268066, "global_step": 106398, "epoch": 633} {"train_loss": -10.042969703674316, "global_step": 106399, "epoch": 633} {"train_loss": -9.742164611816406, "global_step": 106400, "epoch": 633} {"train_loss": -10.076654434204102, "global_step": 106401, "epoch": 633} {"train_loss": -9.668537139892578, "global_step": 106402, "epoch": 633} {"train_loss": -9.816609382629395, "global_step": 106403, "epoch": 633} {"train_loss": -9.873823165893555, "global_step": 106404, "epoch": 633} {"train_loss": -9.848114013671875, "global_step": 106405, "epoch": 633} {"train_loss": -9.660648345947266, "global_step": 106406, "epoch": 633} {"train_loss": -9.578776359558105, "global_step": 106407, "epoch": 633} {"train_loss": -10.012349128723145, "global_step": 106408, "epoch": 633} {"train_loss": -9.864860534667969, "global_step": 106409, "epoch": 633} {"train_loss": -9.777313232421875, "global_step": 106410, "epoch": 633} {"train_loss": -9.94881820678711, "global_step": 106411, "epoch": 633} {"train_loss": -9.770349502563477, "global_step": 106412, "epoch": 633} {"train_loss": -9.715688705444336, "global_step": 106413, "epoch": 633} {"train_loss": -9.892288208007812, "global_step": 106414, "epoch": 633} {"train_loss": -9.993183135986328, "global_step": 106415, "epoch": 633} {"train_loss": -9.922561645507812, "global_step": 106416, "epoch": 633} {"train_loss": -10.146943092346191, "global_step": 106417, "epoch": 633} {"train_loss": -10.079349517822266, "global_step": 106418, "epoch": 633} {"train_loss": -9.754958152770996, "global_step": 106419, "epoch": 633} {"train_loss": -10.027718544006348, "global_step": 106420, "epoch": 633} {"train_loss": -10.016658782958984, "global_step": 106421, "epoch": 633} {"train_loss": -10.03361701965332, "global_step": 106422, "epoch": 633} {"train_loss": -10.131957054138184, "global_step": 106423, "epoch": 633} {"train_loss": -10.008613586425781, "global_step": 106424, "epoch": 633} {"train_loss": -10.040511131286621, "global_step": 106425, "epoch": 633} {"train_loss": -9.738913536071777, "global_step": 106426, "epoch": 633} {"train_loss": -10.094656944274902, "global_step": 106427, "epoch": 633} {"train_loss": -9.695484161376953, "global_step": 106428, "epoch": 633} {"train_loss": -9.795259475708008, "global_step": 106429, "epoch": 633} {"train_loss": -9.842312812805176, "global_step": 106430, "epoch": 633} {"train_loss": -9.409852027893066, "global_step": 106431, "epoch": 633} {"train_loss": -9.71668815612793, "global_step": 106432, "epoch": 633} {"train_loss": -9.782356262207031, "global_step": 106433, "epoch": 633} {"train_loss": -9.27518367767334, "global_step": 106434, "epoch": 633} {"train_loss": -9.704338073730469, "global_step": 106435, "epoch": 633} {"train_loss": -9.463401794433594, "global_step": 106436, "epoch": 633} {"train_loss": -9.034211158752441, "global_step": 106437, "epoch": 633} {"train_loss": -10.074458122253418, "global_step": 106438, "epoch": 633} {"train_loss": -9.51123046875, "global_step": 106439, "epoch": 633} {"train_loss": -9.712858200073242, "global_step": 106440, "epoch": 633} {"train_loss": -9.371235847473145, "global_step": 106441, "epoch": 633} {"train_loss": -9.516843795776367, "global_step": 106442, "epoch": 633} {"train_loss": -8.956157684326172, "global_step": 106443, "epoch": 633} {"train_loss": -9.8206148147583, "global_step": 106444, "epoch": 633} {"train_loss": -9.169206619262695, "global_step": 106445, "epoch": 633} {"train_loss": -9.262250900268555, "global_step": 106446, "epoch": 633} {"train_loss": -9.192895889282227, "global_step": 106447, "epoch": 633} {"train_loss": -9.243623733520508, "global_step": 106448, "epoch": 633} {"train_loss": -9.570886611938477, "global_step": 106449, "epoch": 633} {"train_loss": -9.258386611938477, "global_step": 106450, "epoch": 633} {"train_loss": -9.50160026550293, "global_step": 106451, "epoch": 633} {"train_loss": -9.26909351348877, "global_step": 106452, "epoch": 633} {"train_loss": -9.712308883666992, "global_step": 106453, "epoch": 633} {"train_loss": -9.609862327575684, "global_step": 106454, "epoch": 633} {"train_loss": -9.533914566040039, "global_step": 106455, "epoch": 633} {"train_loss": -9.746323585510254, "global_step": 106456, "epoch": 633} {"train_loss": -9.603445053100586, "global_step": 106457, "epoch": 633} {"train_loss": -9.864974975585938, "global_step": 106458, "epoch": 633} {"train_loss": -9.727457046508789, "global_step": 106459, "epoch": 633} {"train_loss": -9.73276138305664, "global_step": 106460, "epoch": 633} {"train_loss": -9.870945930480957, "global_step": 106461, "epoch": 633} {"train_loss": -9.507590293884277, "global_step": 106462, "epoch": 633} {"train_loss": -9.835966110229492, "global_step": 106463, "epoch": 633} {"train_loss": -9.682098388671875, "global_step": 106464, "epoch": 633} {"train_loss": -9.718257904052734, "global_step": 106465, "epoch": 633} {"train_loss": -9.757484436035156, "global_step": 106466, "epoch": 633} {"train_loss": -9.864218711853027, "global_step": 106467, "epoch": 633} {"train_loss": -9.843111038208008, "global_step": 106468, "epoch": 633} {"train_loss": -9.706206321716309, "global_step": 106469, "epoch": 633} {"train_loss": -10.015667915344238, "global_step": 106470, "epoch": 633} {"train_loss": -9.887687683105469, "global_step": 106471, "epoch": 633} {"train_loss": -10.019673347473145, "global_step": 106472, "epoch": 633} {"train_loss": -9.711187362670898, "global_step": 106473, "epoch": 633} {"train_loss": -9.883777618408203, "global_step": 106474, "epoch": 633} {"train_loss": -10.012528419494629, "global_step": 106475, "epoch": 633} {"train_loss": -10.051177024841309, "global_step": 106476, "epoch": 633} {"train_loss": -10.059937477111816, "global_step": 106477, "epoch": 633} {"train_loss": -10.095869064331055, "global_step": 106478, "epoch": 633} {"train_loss": -10.04995346069336, "global_step": 106479, "epoch": 633} {"train_loss": -9.979507446289062, "global_step": 106480, "epoch": 633} {"train_loss": -10.199129104614258, "global_step": 106481, "epoch": 633} {"train_loss": -10.263263702392578, "global_step": 106482, "epoch": 633} {"train_loss": -10.202266693115234, "global_step": 106483, "epoch": 633} {"train_loss": -10.192329406738281, "global_step": 106484, "epoch": 633} {"train_loss": -10.072701454162598, "global_step": 106485, "epoch": 633} {"train_loss": -10.152469635009766, "global_step": 106486, "epoch": 633} {"train_loss": -10.257352828979492, "global_step": 106487, "epoch": 633} {"train_loss": -9.935067176818848, "global_step": 106488, "epoch": 633} {"train_loss": -10.037087440490723, "global_step": 106489, "epoch": 633} {"train_loss": -10.051265716552734, "global_step": 106490, "epoch": 633} {"train_loss": -9.98639965057373, "global_step": 106491, "epoch": 633} {"train_loss": -9.445531845092773, "global_step": 106492, "epoch": 633} {"train_loss": -9.291810989379883, "global_step": 106493, "epoch": 633} {"train_loss": -9.707317352294922, "global_step": 106494, "epoch": 633} {"train_loss": -9.159650802612305, "global_step": 106495, "epoch": 633} {"train_loss": -9.490869522094727, "global_step": 106496, "epoch": 633} {"train_loss": -9.242033958435059, "global_step": 106497, "epoch": 633} {"train_loss": -8.454588890075684, "global_step": 106498, "epoch": 633} {"train_loss": -9.431922912597656, "global_step": 106499, "epoch": 633} {"train_loss": -7.90578031539917, "global_step": 106500, "epoch": 633} {"train_loss": -8.752498626708984, "global_step": 106501, "epoch": 633} {"train_loss": -8.849020004272461, "global_step": 106502, "epoch": 633} {"train_loss": -9.4680814743042, "global_step": 106503, "epoch": 633} {"train_loss": -9.296894073486328, "global_step": 106504, "epoch": 633} {"train_loss": -8.807710647583008, "global_step": 106505, "epoch": 633} {"train_loss": -9.571674346923828, "global_step": 106506, "epoch": 633} {"train_loss": -9.464509963989258, "global_step": 106507, "epoch": 633} {"train_loss": -9.111640930175781, "global_step": 106508, "epoch": 633} {"train_loss": -9.568806648254395, "global_step": 106509, "epoch": 633} {"train_loss": -9.111608505249023, "global_step": 106510, "epoch": 633} {"train_loss": -9.766963927518754, "global_step": 106511, "epoch": 633, "val_loss": 209552.125} {"train_loss": -9.28732681274414, "global_step": 106512, "epoch": 634} {"train_loss": -9.228200912475586, "global_step": 106513, "epoch": 634} {"train_loss": -9.5992431640625, "global_step": 106514, "epoch": 634} {"train_loss": -9.362683296203613, "global_step": 106515, "epoch": 634} {"train_loss": -9.239702224731445, "global_step": 106516, "epoch": 634} {"train_loss": -9.622842788696289, "global_step": 106517, "epoch": 634} {"train_loss": -9.526416778564453, "global_step": 106518, "epoch": 634} {"train_loss": -9.590492248535156, "global_step": 106519, "epoch": 634} {"train_loss": -9.569633483886719, "global_step": 106520, "epoch": 634} {"train_loss": -9.509252548217773, "global_step": 106521, "epoch": 634} {"train_loss": -9.523422241210938, "global_step": 106522, "epoch": 634} {"train_loss": -9.407065391540527, "global_step": 106523, "epoch": 634} {"train_loss": -9.658702850341797, "global_step": 106524, "epoch": 634} {"train_loss": -9.468809127807617, "global_step": 106525, "epoch": 634} {"train_loss": -9.5414400100708, "global_step": 106526, "epoch": 634} {"train_loss": -9.801568031311035, "global_step": 106527, "epoch": 634} {"train_loss": -9.544151306152344, "global_step": 106528, "epoch": 634} {"train_loss": -9.78305435180664, "global_step": 106529, "epoch": 634} {"train_loss": -9.741791725158691, "global_step": 106530, "epoch": 634} {"train_loss": -9.70040225982666, "global_step": 106531, "epoch": 634} {"train_loss": -9.376249313354492, "global_step": 106532, "epoch": 634} {"train_loss": -9.59071159362793, "global_step": 106533, "epoch": 634} {"train_loss": -9.368751525878906, "global_step": 106534, "epoch": 634} {"train_loss": -9.533720016479492, "global_step": 106535, "epoch": 634} {"train_loss": -9.718647956848145, "global_step": 106536, "epoch": 634} {"train_loss": -9.825587272644043, "global_step": 106537, "epoch": 634} {"train_loss": -9.736665725708008, "global_step": 106538, "epoch": 634} {"train_loss": -9.384998321533203, "global_step": 106539, "epoch": 634} {"train_loss": -9.72100830078125, "global_step": 106540, "epoch": 634} {"train_loss": -9.64752197265625, "global_step": 106541, "epoch": 634} {"train_loss": -9.695094108581543, "global_step": 106542, "epoch": 634} {"train_loss": -9.622383117675781, "global_step": 106543, "epoch": 634} {"train_loss": -9.560367584228516, "global_step": 106544, "epoch": 634} {"train_loss": -9.753863334655762, "global_step": 106545, "epoch": 634} {"train_loss": -9.237274169921875, "global_step": 106546, "epoch": 634} {"train_loss": -9.60940170288086, "global_step": 106547, "epoch": 634} {"train_loss": -9.802206993103027, "global_step": 106548, "epoch": 634} {"train_loss": -9.503210067749023, "global_step": 106549, "epoch": 634} {"train_loss": -9.56982135772705, "global_step": 106550, "epoch": 634} {"train_loss": -9.834738731384277, "global_step": 106551, "epoch": 634} {"train_loss": -9.743155479431152, "global_step": 106552, "epoch": 634} {"train_loss": -9.73115062713623, "global_step": 106553, "epoch": 634} {"train_loss": -9.876060485839844, "global_step": 106554, "epoch": 634} {"train_loss": -9.606447219848633, "global_step": 106555, "epoch": 634} {"train_loss": -9.968266487121582, "global_step": 106556, "epoch": 634} {"train_loss": -9.742979049682617, "global_step": 106557, "epoch": 634} {"train_loss": -9.77341079711914, "global_step": 106558, "epoch": 634} {"train_loss": -9.827533721923828, "global_step": 106559, "epoch": 634} {"train_loss": -10.038997650146484, "global_step": 106560, "epoch": 634} {"train_loss": -9.560161590576172, "global_step": 106561, "epoch": 634} {"train_loss": -9.924464225769043, "global_step": 106562, "epoch": 634} {"train_loss": -9.33328628540039, "global_step": 106563, "epoch": 634} {"train_loss": -9.944668769836426, "global_step": 106564, "epoch": 634} {"train_loss": -9.619991302490234, "global_step": 106565, "epoch": 634} {"train_loss": -10.028326988220215, "global_step": 106566, "epoch": 634} {"train_loss": -9.6248140335083, "global_step": 106567, "epoch": 634} {"train_loss": -9.904108047485352, "global_step": 106568, "epoch": 634} {"train_loss": -9.458598136901855, "global_step": 106569, "epoch": 634} {"train_loss": -9.844728469848633, "global_step": 106570, "epoch": 634} {"train_loss": -9.715147018432617, "global_step": 106571, "epoch": 634} {"train_loss": -10.106401443481445, "global_step": 106572, "epoch": 634} {"train_loss": -9.93641471862793, "global_step": 106573, "epoch": 634} {"train_loss": -9.967803955078125, "global_step": 106574, "epoch": 634} {"train_loss": -10.038006782531738, "global_step": 106575, "epoch": 634} {"train_loss": -10.076041221618652, "global_step": 106576, "epoch": 634} {"train_loss": -10.132465362548828, "global_step": 106577, "epoch": 634} {"train_loss": -10.049474716186523, "global_step": 106578, "epoch": 634} {"train_loss": -9.881166458129883, "global_step": 106579, "epoch": 634} {"train_loss": -10.234413146972656, "global_step": 106580, "epoch": 634} {"train_loss": -10.15695858001709, "global_step": 106581, "epoch": 634} {"train_loss": -9.983596801757812, "global_step": 106582, "epoch": 634} {"train_loss": -10.311989784240723, "global_step": 106583, "epoch": 634} {"train_loss": -9.613763809204102, "global_step": 106584, "epoch": 634} {"train_loss": -9.599899291992188, "global_step": 106585, "epoch": 634} {"train_loss": -10.037141799926758, "global_step": 106586, "epoch": 634} {"train_loss": -9.608314514160156, "global_step": 106587, "epoch": 634} {"train_loss": -9.788020133972168, "global_step": 106588, "epoch": 634} {"train_loss": -9.64232349395752, "global_step": 106589, "epoch": 634} {"train_loss": -9.963647842407227, "global_step": 106590, "epoch": 634} {"train_loss": -9.877796173095703, "global_step": 106591, "epoch": 634} {"train_loss": -9.9710693359375, "global_step": 106592, "epoch": 634} {"train_loss": -10.036588668823242, "global_step": 106593, "epoch": 634} {"train_loss": -9.780433654785156, "global_step": 106594, "epoch": 634} {"train_loss": -9.889398574829102, "global_step": 106595, "epoch": 634} {"train_loss": -9.862375259399414, "global_step": 106596, "epoch": 634} {"train_loss": -9.812939643859863, "global_step": 106597, "epoch": 634} {"train_loss": -9.892136573791504, "global_step": 106598, "epoch": 634} {"train_loss": -9.716214179992676, "global_step": 106599, "epoch": 634} {"train_loss": -9.915176391601562, "global_step": 106600, "epoch": 634} {"train_loss": -9.939624786376953, "global_step": 106601, "epoch": 634} {"train_loss": -9.722963333129883, "global_step": 106602, "epoch": 634} {"train_loss": -10.079659461975098, "global_step": 106603, "epoch": 634} {"train_loss": -9.832525253295898, "global_step": 106604, "epoch": 634} {"train_loss": -10.028010368347168, "global_step": 106605, "epoch": 634} {"train_loss": -10.1104736328125, "global_step": 106606, "epoch": 634} {"train_loss": -9.97555160522461, "global_step": 106607, "epoch": 634} {"train_loss": -10.08431625366211, "global_step": 106608, "epoch": 634} {"train_loss": -10.045684814453125, "global_step": 106609, "epoch": 634} {"train_loss": -9.910968780517578, "global_step": 106610, "epoch": 634} {"train_loss": -10.159253120422363, "global_step": 106611, "epoch": 634} {"train_loss": -9.925355911254883, "global_step": 106612, "epoch": 634} {"train_loss": -9.664342880249023, "global_step": 106613, "epoch": 634} {"train_loss": -9.858952522277832, "global_step": 106614, "epoch": 634} {"train_loss": -9.74307632446289, "global_step": 106615, "epoch": 634} {"train_loss": -9.756290435791016, "global_step": 106616, "epoch": 634} {"train_loss": -9.834775924682617, "global_step": 106617, "epoch": 634} {"train_loss": -10.013537406921387, "global_step": 106618, "epoch": 634} {"train_loss": -10.137859344482422, "global_step": 106619, "epoch": 634} {"train_loss": -9.951810836791992, "global_step": 106620, "epoch": 634} {"train_loss": -9.959486961364746, "global_step": 106621, "epoch": 634} {"train_loss": -9.751155853271484, "global_step": 106622, "epoch": 634} {"train_loss": -9.895048141479492, "global_step": 106623, "epoch": 634} {"train_loss": -9.890114784240723, "global_step": 106624, "epoch": 634} {"train_loss": -9.874274253845215, "global_step": 106625, "epoch": 634} {"train_loss": -10.068751335144043, "global_step": 106626, "epoch": 634} {"train_loss": -9.83538818359375, "global_step": 106627, "epoch": 634} {"train_loss": -10.052430152893066, "global_step": 106628, "epoch": 634} {"train_loss": -10.055971145629883, "global_step": 106629, "epoch": 634} {"train_loss": -9.894988059997559, "global_step": 106630, "epoch": 634} {"train_loss": -9.991174697875977, "global_step": 106631, "epoch": 634} {"train_loss": -10.239334106445312, "global_step": 106632, "epoch": 634} {"train_loss": -10.123334884643555, "global_step": 106633, "epoch": 634} {"train_loss": -9.934015274047852, "global_step": 106634, "epoch": 634} {"train_loss": -9.63653564453125, "global_step": 106635, "epoch": 634} {"train_loss": -9.950885772705078, "global_step": 106636, "epoch": 634} {"train_loss": -9.742096900939941, "global_step": 106637, "epoch": 634} {"train_loss": -9.989645957946777, "global_step": 106638, "epoch": 634} {"train_loss": -10.14126968383789, "global_step": 106639, "epoch": 634} {"train_loss": -10.163320541381836, "global_step": 106640, "epoch": 634} {"train_loss": -10.079763412475586, "global_step": 106641, "epoch": 634} {"train_loss": -10.090702056884766, "global_step": 106642, "epoch": 634} {"train_loss": -9.666914939880371, "global_step": 106643, "epoch": 634} {"train_loss": -9.910614013671875, "global_step": 106644, "epoch": 634} {"train_loss": -9.89758586883545, "global_step": 106645, "epoch": 634} {"train_loss": -9.891578674316406, "global_step": 106646, "epoch": 634} {"train_loss": -10.011190414428711, "global_step": 106647, "epoch": 634} {"train_loss": -9.977002143859863, "global_step": 106648, "epoch": 634} {"train_loss": -10.022716522216797, "global_step": 106649, "epoch": 634} {"train_loss": -10.129329681396484, "global_step": 106650, "epoch": 634} {"train_loss": -9.958847045898438, "global_step": 106651, "epoch": 634} {"train_loss": -10.157164573669434, "global_step": 106652, "epoch": 634} {"train_loss": -10.021768569946289, "global_step": 106653, "epoch": 634} {"train_loss": -10.153777122497559, "global_step": 106654, "epoch": 634} {"train_loss": -9.894062042236328, "global_step": 106655, "epoch": 634} {"train_loss": -9.56402587890625, "global_step": 106656, "epoch": 634} {"train_loss": -10.132949829101562, "global_step": 106657, "epoch": 634} {"train_loss": -9.696846961975098, "global_step": 106658, "epoch": 634} {"train_loss": -9.897340774536133, "global_step": 106659, "epoch": 634} {"train_loss": -9.712308883666992, "global_step": 106660, "epoch": 634} {"train_loss": -10.245769500732422, "global_step": 106661, "epoch": 634} {"train_loss": -9.98036003112793, "global_step": 106662, "epoch": 634} {"train_loss": -9.430327415466309, "global_step": 106663, "epoch": 634} {"train_loss": -9.715215682983398, "global_step": 106664, "epoch": 634} {"train_loss": -9.722663879394531, "global_step": 106665, "epoch": 634} {"train_loss": -9.47148323059082, "global_step": 106666, "epoch": 634} {"train_loss": -9.429351806640625, "global_step": 106667, "epoch": 634} {"train_loss": -9.305547714233398, "global_step": 106668, "epoch": 634} {"train_loss": -9.70840072631836, "global_step": 106669, "epoch": 634} {"train_loss": -9.205781936645508, "global_step": 106670, "epoch": 634} {"train_loss": -9.669201850891113, "global_step": 106671, "epoch": 634} {"train_loss": -9.37264633178711, "global_step": 106672, "epoch": 634} {"train_loss": -9.995760917663574, "global_step": 106673, "epoch": 634} {"train_loss": -9.468616485595703, "global_step": 106674, "epoch": 634} {"train_loss": -9.717256546020508, "global_step": 106675, "epoch": 634} {"train_loss": -9.610280990600586, "global_step": 106676, "epoch": 634} {"train_loss": -9.959122657775879, "global_step": 106677, "epoch": 634} {"train_loss": -9.591789245605469, "global_step": 106678, "epoch": 634} {"train_loss": -9.798161075228737, "global_step": 106679, "epoch": 634, "val_loss": 207639.5625} {"train_loss": -9.58326244354248, "global_step": 106680, "epoch": 635} {"train_loss": -9.686361312866211, "global_step": 106681, "epoch": 635} {"train_loss": -9.702366828918457, "global_step": 106682, "epoch": 635} {"train_loss": -9.239595413208008, "global_step": 106683, "epoch": 635} {"train_loss": -9.706399917602539, "global_step": 106684, "epoch": 635} {"train_loss": -9.65270709991455, "global_step": 106685, "epoch": 635} {"train_loss": -9.768001556396484, "global_step": 106686, "epoch": 635} {"train_loss": -9.607662200927734, "global_step": 106687, "epoch": 635} {"train_loss": -9.787176132202148, "global_step": 106688, "epoch": 635} {"train_loss": -9.694746017456055, "global_step": 106689, "epoch": 635} {"train_loss": -9.798345565795898, "global_step": 106690, "epoch": 635} {"train_loss": -9.913885116577148, "global_step": 106691, "epoch": 635} {"train_loss": -9.83633041381836, "global_step": 106692, "epoch": 635} {"train_loss": -10.006559371948242, "global_step": 106693, "epoch": 635} {"train_loss": -9.638461112976074, "global_step": 106694, "epoch": 635} {"train_loss": -10.117655754089355, "global_step": 106695, "epoch": 635} {"train_loss": -9.662642478942871, "global_step": 106696, "epoch": 635} {"train_loss": -9.771743774414062, "global_step": 106697, "epoch": 635} {"train_loss": -9.672200202941895, "global_step": 106698, "epoch": 635} {"train_loss": -9.862974166870117, "global_step": 106699, "epoch": 635} {"train_loss": -9.79966926574707, "global_step": 106700, "epoch": 635} {"train_loss": -9.961864471435547, "global_step": 106701, "epoch": 635} {"train_loss": -10.109429359436035, "global_step": 106702, "epoch": 635} {"train_loss": -10.02928352355957, "global_step": 106703, "epoch": 635} {"train_loss": -9.775894165039062, "global_step": 106704, "epoch": 635} {"train_loss": -9.752681732177734, "global_step": 106705, "epoch": 635} {"train_loss": -9.716632843017578, "global_step": 106706, "epoch": 635} {"train_loss": -9.91143798828125, "global_step": 106707, "epoch": 635} {"train_loss": -9.670174598693848, "global_step": 106708, "epoch": 635} {"train_loss": -10.122563362121582, "global_step": 106709, "epoch": 635} {"train_loss": -9.808955192565918, "global_step": 106710, "epoch": 635} {"train_loss": -9.736946105957031, "global_step": 106711, "epoch": 635} {"train_loss": -9.901853561401367, "global_step": 106712, "epoch": 635} {"train_loss": -9.941335678100586, "global_step": 106713, "epoch": 635} {"train_loss": -10.227729797363281, "global_step": 106714, "epoch": 635} {"train_loss": -10.277599334716797, "global_step": 106715, "epoch": 635} {"train_loss": -10.113395690917969, "global_step": 106716, "epoch": 635} {"train_loss": -10.030733108520508, "global_step": 106717, "epoch": 635} {"train_loss": -10.12618350982666, "global_step": 106718, "epoch": 635} {"train_loss": -10.12681770324707, "global_step": 106719, "epoch": 635} {"train_loss": -9.820306777954102, "global_step": 106720, "epoch": 635} {"train_loss": -10.113189697265625, "global_step": 106721, "epoch": 635} {"train_loss": -10.069995880126953, "global_step": 106722, "epoch": 635} {"train_loss": -10.179698944091797, "global_step": 106723, "epoch": 635} {"train_loss": -10.131385803222656, "global_step": 106724, "epoch": 635} {"train_loss": -10.214893341064453, "global_step": 106725, "epoch": 635} {"train_loss": -9.997628211975098, "global_step": 106726, "epoch": 635} {"train_loss": -10.033223152160645, "global_step": 106727, "epoch": 635} {"train_loss": -10.081783294677734, "global_step": 106728, "epoch": 635} {"train_loss": -10.126581192016602, "global_step": 106729, "epoch": 635} {"train_loss": -10.116483688354492, "global_step": 106730, "epoch": 635} {"train_loss": -10.181326866149902, "global_step": 106731, "epoch": 635} {"train_loss": -10.131175994873047, "global_step": 106732, "epoch": 635} {"train_loss": -10.023980140686035, "global_step": 106733, "epoch": 635} {"train_loss": -9.907940864562988, "global_step": 106734, "epoch": 635} {"train_loss": -9.903331756591797, "global_step": 106735, "epoch": 635} {"train_loss": -9.971529960632324, "global_step": 106736, "epoch": 635} {"train_loss": -9.673723220825195, "global_step": 106737, "epoch": 635} {"train_loss": -10.241593360900879, "global_step": 106738, "epoch": 635} {"train_loss": -9.695005416870117, "global_step": 106739, "epoch": 635} {"train_loss": -10.014322280883789, "global_step": 106740, "epoch": 635} {"train_loss": -9.718496322631836, "global_step": 106741, "epoch": 635} {"train_loss": -9.822931289672852, "global_step": 106742, "epoch": 635} {"train_loss": -9.651712417602539, "global_step": 106743, "epoch": 635} {"train_loss": -9.752631187438965, "global_step": 106744, "epoch": 635} {"train_loss": -9.697650909423828, "global_step": 106745, "epoch": 635} {"train_loss": -10.125687599182129, "global_step": 106746, "epoch": 635} {"train_loss": -9.613211631774902, "global_step": 106747, "epoch": 635} {"train_loss": -9.658135414123535, "global_step": 106748, "epoch": 635} {"train_loss": -9.804401397705078, "global_step": 106749, "epoch": 635} {"train_loss": -9.894083023071289, "global_step": 106750, "epoch": 635} {"train_loss": -9.663461685180664, "global_step": 106751, "epoch": 635} {"train_loss": -9.173480987548828, "global_step": 106752, "epoch": 635} {"train_loss": -9.867846488952637, "global_step": 106753, "epoch": 635} {"train_loss": -9.816407203674316, "global_step": 106754, "epoch": 635} {"train_loss": -9.609288215637207, "global_step": 106755, "epoch": 635} {"train_loss": -9.650794982910156, "global_step": 106756, "epoch": 635} {"train_loss": -9.367979049682617, "global_step": 106757, "epoch": 635} {"train_loss": -9.417594909667969, "global_step": 106758, "epoch": 635} {"train_loss": -9.473621368408203, "global_step": 106759, "epoch": 635} {"train_loss": -9.98439884185791, "global_step": 106760, "epoch": 635} {"train_loss": -9.157611846923828, "global_step": 106761, "epoch": 635} {"train_loss": -9.43440055847168, "global_step": 106762, "epoch": 635} {"train_loss": -9.46495246887207, "global_step": 106763, "epoch": 635} {"train_loss": -9.411684036254883, "global_step": 106764, "epoch": 635} {"train_loss": -9.38473892211914, "global_step": 106765, "epoch": 635} {"train_loss": -9.837345123291016, "global_step": 106766, "epoch": 635} {"train_loss": -9.46403980255127, "global_step": 106767, "epoch": 635} {"train_loss": -9.66059398651123, "global_step": 106768, "epoch": 635} {"train_loss": -9.818503379821777, "global_step": 106769, "epoch": 635} {"train_loss": -9.328272819519043, "global_step": 106770, "epoch": 635} {"train_loss": -9.647636413574219, "global_step": 106771, "epoch": 635} {"train_loss": -9.925490379333496, "global_step": 106772, "epoch": 635} {"train_loss": -9.575069427490234, "global_step": 106773, "epoch": 635} {"train_loss": -9.574172973632812, "global_step": 106774, "epoch": 635} {"train_loss": -9.555049896240234, "global_step": 106775, "epoch": 635} {"train_loss": -10.001249313354492, "global_step": 106776, "epoch": 635} {"train_loss": -9.504853248596191, "global_step": 106777, "epoch": 635} {"train_loss": -9.905014991760254, "global_step": 106778, "epoch": 635} {"train_loss": -9.791303634643555, "global_step": 106779, "epoch": 635} {"train_loss": -9.872745513916016, "global_step": 106780, "epoch": 635} {"train_loss": -9.916555404663086, "global_step": 106781, "epoch": 635} {"train_loss": -9.72801399230957, "global_step": 106782, "epoch": 635} {"train_loss": -10.016395568847656, "global_step": 106783, "epoch": 635} {"train_loss": -9.852627754211426, "global_step": 106784, "epoch": 635} {"train_loss": -9.845542907714844, "global_step": 106785, "epoch": 635} {"train_loss": -9.728256225585938, "global_step": 106786, "epoch": 635} {"train_loss": -10.009967803955078, "global_step": 106787, "epoch": 635} {"train_loss": -9.95058822631836, "global_step": 106788, "epoch": 635} {"train_loss": -9.871248245239258, "global_step": 106789, "epoch": 635} {"train_loss": -10.003543853759766, "global_step": 106790, "epoch": 635} {"train_loss": -10.00847339630127, "global_step": 106791, "epoch": 635} {"train_loss": -9.917021751403809, "global_step": 106792, "epoch": 635} {"train_loss": -10.219579696655273, "global_step": 106793, "epoch": 635} {"train_loss": -10.123412132263184, "global_step": 106794, "epoch": 635} {"train_loss": -9.984918594360352, "global_step": 106795, "epoch": 635} {"train_loss": -10.066524505615234, "global_step": 106796, "epoch": 635} {"train_loss": -9.866039276123047, "global_step": 106797, "epoch": 635} {"train_loss": -10.093113899230957, "global_step": 106798, "epoch": 635} {"train_loss": -10.303215026855469, "global_step": 106799, "epoch": 635} {"train_loss": -9.948086738586426, "global_step": 106800, "epoch": 635} {"train_loss": -9.559049606323242, "global_step": 106801, "epoch": 635} {"train_loss": -9.99773120880127, "global_step": 106802, "epoch": 635} {"train_loss": -9.837495803833008, "global_step": 106803, "epoch": 635} {"train_loss": -9.383222579956055, "global_step": 106804, "epoch": 635} {"train_loss": -9.996452331542969, "global_step": 106805, "epoch": 635} {"train_loss": -8.980159759521484, "global_step": 106806, "epoch": 635} {"train_loss": -9.68668270111084, "global_step": 106807, "epoch": 635} {"train_loss": -9.896910667419434, "global_step": 106808, "epoch": 635} {"train_loss": -9.587767601013184, "global_step": 106809, "epoch": 635} {"train_loss": -9.737942695617676, "global_step": 106810, "epoch": 635} {"train_loss": -9.822236061096191, "global_step": 106811, "epoch": 635} {"train_loss": -9.589847564697266, "global_step": 106812, "epoch": 635} {"train_loss": -9.735345840454102, "global_step": 106813, "epoch": 635} {"train_loss": -9.770158767700195, "global_step": 106814, "epoch": 635} {"train_loss": -9.54938793182373, "global_step": 106815, "epoch": 635} {"train_loss": -9.613920211791992, "global_step": 106816, "epoch": 635} {"train_loss": -9.761159896850586, "global_step": 106817, "epoch": 635} {"train_loss": -9.483418464660645, "global_step": 106818, "epoch": 635} {"train_loss": -9.874763488769531, "global_step": 106819, "epoch": 635} {"train_loss": -9.742316246032715, "global_step": 106820, "epoch": 635} {"train_loss": -9.57883071899414, "global_step": 106821, "epoch": 635} {"train_loss": -9.647967338562012, "global_step": 106822, "epoch": 635} {"train_loss": -9.506525993347168, "global_step": 106823, "epoch": 635} {"train_loss": -9.513257026672363, "global_step": 106824, "epoch": 635} {"train_loss": -9.890159606933594, "global_step": 106825, "epoch": 635} {"train_loss": -9.826529502868652, "global_step": 106826, "epoch": 635} {"train_loss": -9.75893783569336, "global_step": 106827, "epoch": 635} {"train_loss": -9.784904479980469, "global_step": 106828, "epoch": 635} {"train_loss": -9.595970153808594, "global_step": 106829, "epoch": 635} {"train_loss": -9.898646354675293, "global_step": 106830, "epoch": 635} {"train_loss": -9.967580795288086, "global_step": 106831, "epoch": 635} {"train_loss": -9.750340461730957, "global_step": 106832, "epoch": 635} {"train_loss": -9.861342430114746, "global_step": 106833, "epoch": 635} {"train_loss": -9.649889945983887, "global_step": 106834, "epoch": 635} {"train_loss": -9.732536315917969, "global_step": 106835, "epoch": 635} {"train_loss": -9.975269317626953, "global_step": 106836, "epoch": 635} {"train_loss": -9.8846435546875, "global_step": 106837, "epoch": 635} {"train_loss": -9.842048645019531, "global_step": 106838, "epoch": 635} {"train_loss": -9.964427947998047, "global_step": 106839, "epoch": 635} {"train_loss": -9.965568542480469, "global_step": 106840, "epoch": 635} {"train_loss": -9.807737350463867, "global_step": 106841, "epoch": 635} {"train_loss": -9.85198974609375, "global_step": 106842, "epoch": 635} {"train_loss": -9.91614818572998, "global_step": 106843, "epoch": 635} {"train_loss": -9.807315826416016, "global_step": 106844, "epoch": 635} {"train_loss": -9.968384742736816, "global_step": 106845, "epoch": 635} {"train_loss": -9.645572662353516, "global_step": 106846, "epoch": 635} {"train_loss": -9.809569903782435, "global_step": 106847, "epoch": 635, "val_loss": 208493.15625, "train_action_mse_error": 6.556380748748779} {"train_loss": -9.506572723388672, "global_step": 106848, "epoch": 636} {"train_loss": -9.404829025268555, "global_step": 106849, "epoch": 636} {"train_loss": -9.824018478393555, "global_step": 106850, "epoch": 636} {"train_loss": -8.927193641662598, "global_step": 106851, "epoch": 636} {"train_loss": -9.760963439941406, "global_step": 106852, "epoch": 636} {"train_loss": -8.29472541809082, "global_step": 106853, "epoch": 636} {"train_loss": -9.393007278442383, "global_step": 106854, "epoch": 636} {"train_loss": -8.94468879699707, "global_step": 106855, "epoch": 636} {"train_loss": -9.409202575683594, "global_step": 106856, "epoch": 636} {"train_loss": -8.974538803100586, "global_step": 106857, "epoch": 636} {"train_loss": -9.666630744934082, "global_step": 106858, "epoch": 636} {"train_loss": -9.188872337341309, "global_step": 106859, "epoch": 636} {"train_loss": -9.089498519897461, "global_step": 106860, "epoch": 636} {"train_loss": -9.227156639099121, "global_step": 106861, "epoch": 636} {"train_loss": -9.127798080444336, "global_step": 106862, "epoch": 636} {"train_loss": -9.315694808959961, "global_step": 106863, "epoch": 636} {"train_loss": -8.46617603302002, "global_step": 106864, "epoch": 636} {"train_loss": -9.293838500976562, "global_step": 106865, "epoch": 636} {"train_loss": -9.40967082977295, "global_step": 106866, "epoch": 636} {"train_loss": -8.655815124511719, "global_step": 106867, "epoch": 636} {"train_loss": -9.275988578796387, "global_step": 106868, "epoch": 636} {"train_loss": -9.441473007202148, "global_step": 106869, "epoch": 636} {"train_loss": -8.824445724487305, "global_step": 106870, "epoch": 636} {"train_loss": -9.075035095214844, "global_step": 106871, "epoch": 636} {"train_loss": -9.219606399536133, "global_step": 106872, "epoch": 636} {"train_loss": -8.8711576461792, "global_step": 106873, "epoch": 636} {"train_loss": -9.256534576416016, "global_step": 106874, "epoch": 636} {"train_loss": -9.409933090209961, "global_step": 106875, "epoch": 636} {"train_loss": -8.802664756774902, "global_step": 106876, "epoch": 636} {"train_loss": -9.116982460021973, "global_step": 106877, "epoch": 636} {"train_loss": -9.62837028503418, "global_step": 106878, "epoch": 636} {"train_loss": -9.413300514221191, "global_step": 106879, "epoch": 636} {"train_loss": -9.39811897277832, "global_step": 106880, "epoch": 636} {"train_loss": -9.401378631591797, "global_step": 106881, "epoch": 636} {"train_loss": -9.690193176269531, "global_step": 106882, "epoch": 636} {"train_loss": -9.515535354614258, "global_step": 106883, "epoch": 636} {"train_loss": -9.507218360900879, "global_step": 106884, "epoch": 636} {"train_loss": -9.517772674560547, "global_step": 106885, "epoch": 636} {"train_loss": -9.655980110168457, "global_step": 106886, "epoch": 636} {"train_loss": -9.506637573242188, "global_step": 106887, "epoch": 636} {"train_loss": -9.679229736328125, "global_step": 106888, "epoch": 636} {"train_loss": -9.691824913024902, "global_step": 106889, "epoch": 636} {"train_loss": -9.690114974975586, "global_step": 106890, "epoch": 636} {"train_loss": -9.697163581848145, "global_step": 106891, "epoch": 636} {"train_loss": -9.90124797821045, "global_step": 106892, "epoch": 636} {"train_loss": -9.564117431640625, "global_step": 106893, "epoch": 636} {"train_loss": -9.69941520690918, "global_step": 106894, "epoch": 636} {"train_loss": -9.896844863891602, "global_step": 106895, "epoch": 636} {"train_loss": -9.663961410522461, "global_step": 106896, "epoch": 636} {"train_loss": -9.805129051208496, "global_step": 106897, "epoch": 636} {"train_loss": -9.961908340454102, "global_step": 106898, "epoch": 636} {"train_loss": -9.803773880004883, "global_step": 106899, "epoch": 636} {"train_loss": -10.020038604736328, "global_step": 106900, "epoch": 636} {"train_loss": -10.156951904296875, "global_step": 106901, "epoch": 636} {"train_loss": -10.111244201660156, "global_step": 106902, "epoch": 636} {"train_loss": -10.175376892089844, "global_step": 106903, "epoch": 636} {"train_loss": -10.001681327819824, "global_step": 106904, "epoch": 636} {"train_loss": -10.33273696899414, "global_step": 106905, "epoch": 636} {"train_loss": -10.178592681884766, "global_step": 106906, "epoch": 636} {"train_loss": -9.944413185119629, "global_step": 106907, "epoch": 636} {"train_loss": -10.001344680786133, "global_step": 106908, "epoch": 636} {"train_loss": -10.070876121520996, "global_step": 106909, "epoch": 636} {"train_loss": -10.039758682250977, "global_step": 106910, "epoch": 636} {"train_loss": -10.089115142822266, "global_step": 106911, "epoch": 636} {"train_loss": -10.145454406738281, "global_step": 106912, "epoch": 636} {"train_loss": -9.760116577148438, "global_step": 106913, "epoch": 636} {"train_loss": -9.991764068603516, "global_step": 106914, "epoch": 636} {"train_loss": -9.445926666259766, "global_step": 106915, "epoch": 636} {"train_loss": -9.417221069335938, "global_step": 106916, "epoch": 636} {"train_loss": -10.078593254089355, "global_step": 106917, "epoch": 636} {"train_loss": -9.761691093444824, "global_step": 106918, "epoch": 636} {"train_loss": -9.583978652954102, "global_step": 106919, "epoch": 636} {"train_loss": -9.917282104492188, "global_step": 106920, "epoch": 636} {"train_loss": -9.652020454406738, "global_step": 106921, "epoch": 636} {"train_loss": -9.870240211486816, "global_step": 106922, "epoch": 636} {"train_loss": -10.189037322998047, "global_step": 106923, "epoch": 636} {"train_loss": -9.993581771850586, "global_step": 106924, "epoch": 636} {"train_loss": -9.869437217712402, "global_step": 106925, "epoch": 636} {"train_loss": -9.700130462646484, "global_step": 106926, "epoch": 636} {"train_loss": -9.878150939941406, "global_step": 106927, "epoch": 636} {"train_loss": -9.82874870300293, "global_step": 106928, "epoch": 636} {"train_loss": -9.973847389221191, "global_step": 106929, "epoch": 636} {"train_loss": -9.905841827392578, "global_step": 106930, "epoch": 636} {"train_loss": -9.96493911743164, "global_step": 106931, "epoch": 636} {"train_loss": -9.83700942993164, "global_step": 106932, "epoch": 636} {"train_loss": -9.575153350830078, "global_step": 106933, "epoch": 636} {"train_loss": -9.492183685302734, "global_step": 106934, "epoch": 636} {"train_loss": -9.707165718078613, "global_step": 106935, "epoch": 636} {"train_loss": -9.788331031799316, "global_step": 106936, "epoch": 636} {"train_loss": -9.71825885772705, "global_step": 106937, "epoch": 636} {"train_loss": -9.816572189331055, "global_step": 106938, "epoch": 636} {"train_loss": -9.466324806213379, "global_step": 106939, "epoch": 636} {"train_loss": -9.372381210327148, "global_step": 106940, "epoch": 636} {"train_loss": -9.639856338500977, "global_step": 106941, "epoch": 636} {"train_loss": -9.672924041748047, "global_step": 106942, "epoch": 636} {"train_loss": -8.705845832824707, "global_step": 106943, "epoch": 636} {"train_loss": -9.410832405090332, "global_step": 106944, "epoch": 636} {"train_loss": -9.000936508178711, "global_step": 106945, "epoch": 636} {"train_loss": -9.427238464355469, "global_step": 106946, "epoch": 636} {"train_loss": -9.728059768676758, "global_step": 106947, "epoch": 636} {"train_loss": -9.395055770874023, "global_step": 106948, "epoch": 636} {"train_loss": -9.665058135986328, "global_step": 106949, "epoch": 636} {"train_loss": -9.595947265625, "global_step": 106950, "epoch": 636} {"train_loss": -9.165559768676758, "global_step": 106951, "epoch": 636} {"train_loss": -9.428162574768066, "global_step": 106952, "epoch": 636} {"train_loss": -9.701925277709961, "global_step": 106953, "epoch": 636} {"train_loss": -9.219289779663086, "global_step": 106954, "epoch": 636} {"train_loss": -9.803197860717773, "global_step": 106955, "epoch": 636} {"train_loss": -9.51650619506836, "global_step": 106956, "epoch": 636} {"train_loss": -9.331634521484375, "global_step": 106957, "epoch": 636} {"train_loss": -9.489736557006836, "global_step": 106958, "epoch": 636} {"train_loss": -9.622516632080078, "global_step": 106959, "epoch": 636} {"train_loss": -9.244802474975586, "global_step": 106960, "epoch": 636} {"train_loss": -9.447898864746094, "global_step": 106961, "epoch": 636} {"train_loss": -9.439596176147461, "global_step": 106962, "epoch": 636} {"train_loss": -9.404306411743164, "global_step": 106963, "epoch": 636} {"train_loss": -9.465532302856445, "global_step": 106964, "epoch": 636} {"train_loss": -9.597345352172852, "global_step": 106965, "epoch": 636} {"train_loss": -9.413246154785156, "global_step": 106966, "epoch": 636} {"train_loss": -9.547355651855469, "global_step": 106967, "epoch": 636} {"train_loss": -9.6353759765625, "global_step": 106968, "epoch": 636} {"train_loss": -9.446147918701172, "global_step": 106969, "epoch": 636} {"train_loss": -9.43873405456543, "global_step": 106970, "epoch": 636} {"train_loss": -9.785612106323242, "global_step": 106971, "epoch": 636} {"train_loss": -9.373762130737305, "global_step": 106972, "epoch": 636} {"train_loss": -9.664000511169434, "global_step": 106973, "epoch": 636} {"train_loss": -9.682760238647461, "global_step": 106974, "epoch": 636} {"train_loss": -9.850833892822266, "global_step": 106975, "epoch": 636} {"train_loss": -9.659404754638672, "global_step": 106976, "epoch": 636} {"train_loss": -9.899187088012695, "global_step": 106977, "epoch": 636} {"train_loss": -9.823600769042969, "global_step": 106978, "epoch": 636} {"train_loss": -9.671110153198242, "global_step": 106979, "epoch": 636} {"train_loss": -9.95369815826416, "global_step": 106980, "epoch": 636} {"train_loss": -9.726183891296387, "global_step": 106981, "epoch": 636} {"train_loss": -10.007949829101562, "global_step": 106982, "epoch": 636} {"train_loss": -10.016706466674805, "global_step": 106983, "epoch": 636} {"train_loss": -10.009786605834961, "global_step": 106984, "epoch": 636} {"train_loss": -10.131211280822754, "global_step": 106985, "epoch": 636} {"train_loss": -9.66341781616211, "global_step": 106986, "epoch": 636} {"train_loss": -9.963356018066406, "global_step": 106987, "epoch": 636} {"train_loss": -9.888459205627441, "global_step": 106988, "epoch": 636} {"train_loss": -10.087644577026367, "global_step": 106989, "epoch": 636} {"train_loss": -9.964391708374023, "global_step": 106990, "epoch": 636} {"train_loss": -9.886436462402344, "global_step": 106991, "epoch": 636} {"train_loss": -9.957640647888184, "global_step": 106992, "epoch": 636} {"train_loss": -9.908967971801758, "global_step": 106993, "epoch": 636} {"train_loss": -10.075810432434082, "global_step": 106994, "epoch": 636} {"train_loss": -9.995443344116211, "global_step": 106995, "epoch": 636} {"train_loss": -10.152840614318848, "global_step": 106996, "epoch": 636} {"train_loss": -9.910843849182129, "global_step": 106997, "epoch": 636} {"train_loss": -10.118097305297852, "global_step": 106998, "epoch": 636} {"train_loss": -9.774324417114258, "global_step": 106999, "epoch": 636} {"train_loss": -10.212896347045898, "global_step": 107000, "epoch": 636} {"train_loss": -9.859023094177246, "global_step": 107001, "epoch": 636} {"train_loss": -10.042490005493164, "global_step": 107002, "epoch": 636} {"train_loss": -10.082080841064453, "global_step": 107003, "epoch": 636} {"train_loss": -9.975858688354492, "global_step": 107004, "epoch": 636} {"train_loss": -9.930741310119629, "global_step": 107005, "epoch": 636} {"train_loss": -10.149993896484375, "global_step": 107006, "epoch": 636} {"train_loss": -9.413127899169922, "global_step": 107007, "epoch": 636} {"train_loss": -10.057148933410645, "global_step": 107008, "epoch": 636} {"train_loss": -9.889508247375488, "global_step": 107009, "epoch": 636} {"train_loss": -9.868667602539062, "global_step": 107010, "epoch": 636} {"train_loss": -10.068914413452148, "global_step": 107011, "epoch": 636} {"train_loss": -9.595221519470215, "global_step": 107012, "epoch": 636} {"train_loss": -10.112615585327148, "global_step": 107013, "epoch": 636} {"train_loss": -9.55542278289795, "global_step": 107014, "epoch": 636} {"train_loss": -9.647519588470459, "global_step": 107015, "epoch": 636, "val_loss": 207944.984375} {"train_loss": -9.58072566986084, "global_step": 107016, "epoch": 637} {"train_loss": -9.486669540405273, "global_step": 107017, "epoch": 637} {"train_loss": -9.359899520874023, "global_step": 107018, "epoch": 637} {"train_loss": -9.644072532653809, "global_step": 107019, "epoch": 637} {"train_loss": -9.46287727355957, "global_step": 107020, "epoch": 637} {"train_loss": -9.430171966552734, "global_step": 107021, "epoch": 637} {"train_loss": -10.123933792114258, "global_step": 107022, "epoch": 637} {"train_loss": -9.239835739135742, "global_step": 107023, "epoch": 637} {"train_loss": -9.97248363494873, "global_step": 107024, "epoch": 637} {"train_loss": -9.563000679016113, "global_step": 107025, "epoch": 637} {"train_loss": -9.694543838500977, "global_step": 107026, "epoch": 637} {"train_loss": -9.462505340576172, "global_step": 107027, "epoch": 637} {"train_loss": -9.915332794189453, "global_step": 107028, "epoch": 637} {"train_loss": -9.263586044311523, "global_step": 107029, "epoch": 637} {"train_loss": -10.015445709228516, "global_step": 107030, "epoch": 637} {"train_loss": -9.51756477355957, "global_step": 107031, "epoch": 637} {"train_loss": -9.818363189697266, "global_step": 107032, "epoch": 637} {"train_loss": -9.543424606323242, "global_step": 107033, "epoch": 637} {"train_loss": -9.998499870300293, "global_step": 107034, "epoch": 637} {"train_loss": -9.456893920898438, "global_step": 107035, "epoch": 637} {"train_loss": -9.863336563110352, "global_step": 107036, "epoch": 637} {"train_loss": -9.780701637268066, "global_step": 107037, "epoch": 637} {"train_loss": -9.71519660949707, "global_step": 107038, "epoch": 637} {"train_loss": -9.745141983032227, "global_step": 107039, "epoch": 637} {"train_loss": -9.807056427001953, "global_step": 107040, "epoch": 637} {"train_loss": -9.948010444641113, "global_step": 107041, "epoch": 637} {"train_loss": -9.797115325927734, "global_step": 107042, "epoch": 637} {"train_loss": -9.925186157226562, "global_step": 107043, "epoch": 637} {"train_loss": -9.827902793884277, "global_step": 107044, "epoch": 637} {"train_loss": -9.998336791992188, "global_step": 107045, "epoch": 637} {"train_loss": -9.74190902709961, "global_step": 107046, "epoch": 637} {"train_loss": -10.239117622375488, "global_step": 107047, "epoch": 637} {"train_loss": -10.073711395263672, "global_step": 107048, "epoch": 637} {"train_loss": -9.927130699157715, "global_step": 107049, "epoch": 637} {"train_loss": -10.002685546875, "global_step": 107050, "epoch": 637} {"train_loss": -10.044315338134766, "global_step": 107051, "epoch": 637} {"train_loss": -10.143665313720703, "global_step": 107052, "epoch": 637} {"train_loss": -9.856709480285645, "global_step": 107053, "epoch": 637} {"train_loss": -10.012617111206055, "global_step": 107054, "epoch": 637} {"train_loss": -10.004507064819336, "global_step": 107055, "epoch": 637} {"train_loss": -9.979315757751465, "global_step": 107056, "epoch": 637} {"train_loss": -9.942314147949219, "global_step": 107057, "epoch": 637} {"train_loss": -10.000740051269531, "global_step": 107058, "epoch": 637} {"train_loss": -10.1260986328125, "global_step": 107059, "epoch": 637} {"train_loss": -10.146892547607422, "global_step": 107060, "epoch": 637} {"train_loss": -9.77701187133789, "global_step": 107061, "epoch": 637} {"train_loss": -10.297624588012695, "global_step": 107062, "epoch": 637} {"train_loss": -9.603060722351074, "global_step": 107063, "epoch": 637} {"train_loss": -9.60529899597168, "global_step": 107064, "epoch": 637} {"train_loss": -10.187137603759766, "global_step": 107065, "epoch": 637} {"train_loss": -9.656858444213867, "global_step": 107066, "epoch": 637} {"train_loss": -10.156661987304688, "global_step": 107067, "epoch": 637} {"train_loss": -9.720087051391602, "global_step": 107068, "epoch": 637} {"train_loss": -10.074384689331055, "global_step": 107069, "epoch": 637} {"train_loss": -9.744546890258789, "global_step": 107070, "epoch": 637} {"train_loss": -10.196626663208008, "global_step": 107071, "epoch": 637} {"train_loss": -9.804998397827148, "global_step": 107072, "epoch": 637} {"train_loss": -10.194165229797363, "global_step": 107073, "epoch": 637} {"train_loss": -9.958985328674316, "global_step": 107074, "epoch": 637} {"train_loss": -10.012324333190918, "global_step": 107075, "epoch": 637} {"train_loss": -10.01699447631836, "global_step": 107076, "epoch": 637} {"train_loss": -9.879923820495605, "global_step": 107077, "epoch": 637} {"train_loss": -10.275640487670898, "global_step": 107078, "epoch": 637} {"train_loss": -9.795592308044434, "global_step": 107079, "epoch": 637} {"train_loss": -9.7991943359375, "global_step": 107080, "epoch": 637} {"train_loss": -10.10844612121582, "global_step": 107081, "epoch": 637} {"train_loss": -10.165766716003418, "global_step": 107082, "epoch": 637} {"train_loss": -9.703524589538574, "global_step": 107083, "epoch": 637} {"train_loss": -9.919639587402344, "global_step": 107084, "epoch": 637} {"train_loss": -10.112665176391602, "global_step": 107085, "epoch": 637} {"train_loss": -9.819473266601562, "global_step": 107086, "epoch": 637} {"train_loss": -9.424577713012695, "global_step": 107087, "epoch": 637} {"train_loss": -9.785882949829102, "global_step": 107088, "epoch": 637} {"train_loss": -9.83856201171875, "global_step": 107089, "epoch": 637} {"train_loss": -9.526962280273438, "global_step": 107090, "epoch": 637} {"train_loss": -9.610055923461914, "global_step": 107091, "epoch": 637} {"train_loss": -9.657809257507324, "global_step": 107092, "epoch": 637} {"train_loss": -9.412050247192383, "global_step": 107093, "epoch": 637} {"train_loss": -9.891441345214844, "global_step": 107094, "epoch": 637} {"train_loss": -9.425027847290039, "global_step": 107095, "epoch": 637} {"train_loss": -9.263642311096191, "global_step": 107096, "epoch": 637} {"train_loss": -9.449579238891602, "global_step": 107097, "epoch": 637} {"train_loss": -8.99990177154541, "global_step": 107098, "epoch": 637} {"train_loss": -9.298158645629883, "global_step": 107099, "epoch": 637} {"train_loss": -9.216611862182617, "global_step": 107100, "epoch": 637} {"train_loss": -9.658263206481934, "global_step": 107101, "epoch": 637} {"train_loss": -9.385942459106445, "global_step": 107102, "epoch": 637} {"train_loss": -9.41340160369873, "global_step": 107103, "epoch": 637} {"train_loss": -9.501384735107422, "global_step": 107104, "epoch": 637} {"train_loss": -9.706274032592773, "global_step": 107105, "epoch": 637} {"train_loss": -9.440803527832031, "global_step": 107106, "epoch": 637} {"train_loss": -9.407135009765625, "global_step": 107107, "epoch": 637} {"train_loss": -9.909671783447266, "global_step": 107108, "epoch": 637} {"train_loss": -9.812155723571777, "global_step": 107109, "epoch": 637} {"train_loss": -9.291528701782227, "global_step": 107110, "epoch": 637} {"train_loss": -9.565715789794922, "global_step": 107111, "epoch": 637} {"train_loss": -9.353517532348633, "global_step": 107112, "epoch": 637} {"train_loss": -9.558860778808594, "global_step": 107113, "epoch": 637} {"train_loss": -9.380781173706055, "global_step": 107114, "epoch": 637} {"train_loss": -9.568086624145508, "global_step": 107115, "epoch": 637} {"train_loss": -9.746374130249023, "global_step": 107116, "epoch": 637} {"train_loss": -9.522405624389648, "global_step": 107117, "epoch": 637} {"train_loss": -9.913458824157715, "global_step": 107118, "epoch": 637} {"train_loss": -9.622483253479004, "global_step": 107119, "epoch": 637} {"train_loss": -9.824722290039062, "global_step": 107120, "epoch": 637} {"train_loss": -9.740999221801758, "global_step": 107121, "epoch": 637} {"train_loss": -9.755624771118164, "global_step": 107122, "epoch": 637} {"train_loss": -9.678483963012695, "global_step": 107123, "epoch": 637} {"train_loss": -9.633070945739746, "global_step": 107124, "epoch": 637} {"train_loss": -9.72047233581543, "global_step": 107125, "epoch": 637} {"train_loss": -9.673195838928223, "global_step": 107126, "epoch": 637} {"train_loss": -9.987086296081543, "global_step": 107127, "epoch": 637} {"train_loss": -9.657499313354492, "global_step": 107128, "epoch": 637} {"train_loss": -9.74968147277832, "global_step": 107129, "epoch": 637} {"train_loss": -9.994062423706055, "global_step": 107130, "epoch": 637} {"train_loss": -9.857864379882812, "global_step": 107131, "epoch": 637} {"train_loss": -9.837446212768555, "global_step": 107132, "epoch": 637} {"train_loss": -9.943412780761719, "global_step": 107133, "epoch": 637} {"train_loss": -9.728839874267578, "global_step": 107134, "epoch": 637} {"train_loss": -10.051602363586426, "global_step": 107135, "epoch": 637} {"train_loss": -9.959829330444336, "global_step": 107136, "epoch": 637} {"train_loss": -9.840580940246582, "global_step": 107137, "epoch": 637} {"train_loss": -10.132196426391602, "global_step": 107138, "epoch": 637} {"train_loss": -9.757976531982422, "global_step": 107139, "epoch": 637} {"train_loss": -10.166635513305664, "global_step": 107140, "epoch": 637} {"train_loss": -9.78592300415039, "global_step": 107141, "epoch": 637} {"train_loss": -10.205745697021484, "global_step": 107142, "epoch": 637} {"train_loss": -9.865402221679688, "global_step": 107143, "epoch": 637} {"train_loss": -9.832000732421875, "global_step": 107144, "epoch": 637} {"train_loss": -10.002044677734375, "global_step": 107145, "epoch": 637} {"train_loss": -10.06353759765625, "global_step": 107146, "epoch": 637} {"train_loss": -9.991924285888672, "global_step": 107147, "epoch": 637} {"train_loss": -9.994770050048828, "global_step": 107148, "epoch": 637} {"train_loss": -10.139678001403809, "global_step": 107149, "epoch": 637} {"train_loss": -10.050247192382812, "global_step": 107150, "epoch": 637} {"train_loss": -10.059465408325195, "global_step": 107151, "epoch": 637} {"train_loss": -9.84383487701416, "global_step": 107152, "epoch": 637} {"train_loss": -9.965676307678223, "global_step": 107153, "epoch": 637} {"train_loss": -9.925167083740234, "global_step": 107154, "epoch": 637} {"train_loss": -9.972188949584961, "global_step": 107155, "epoch": 637} {"train_loss": -9.924283981323242, "global_step": 107156, "epoch": 637} {"train_loss": -10.185835838317871, "global_step": 107157, "epoch": 637} {"train_loss": -9.830333709716797, "global_step": 107158, "epoch": 637} {"train_loss": -9.88622760772705, "global_step": 107159, "epoch": 637} {"train_loss": -9.994213104248047, "global_step": 107160, "epoch": 637} {"train_loss": -9.979894638061523, "global_step": 107161, "epoch": 637} {"train_loss": -10.124433517456055, "global_step": 107162, "epoch": 637} {"train_loss": -9.8937349319458, "global_step": 107163, "epoch": 637} {"train_loss": -9.676080703735352, "global_step": 107164, "epoch": 637} {"train_loss": -9.516485214233398, "global_step": 107165, "epoch": 637} {"train_loss": -10.051884651184082, "global_step": 107166, "epoch": 637} {"train_loss": -8.969929695129395, "global_step": 107167, "epoch": 637} {"train_loss": -9.799644470214844, "global_step": 107168, "epoch": 637} {"train_loss": -9.682716369628906, "global_step": 107169, "epoch": 637} {"train_loss": -9.672662734985352, "global_step": 107170, "epoch": 637} {"train_loss": -10.007230758666992, "global_step": 107171, "epoch": 637} {"train_loss": -9.796390533447266, "global_step": 107172, "epoch": 637} {"train_loss": -9.727666854858398, "global_step": 107173, "epoch": 637} {"train_loss": -9.841533660888672, "global_step": 107174, "epoch": 637} {"train_loss": -9.701004028320312, "global_step": 107175, "epoch": 637} {"train_loss": -9.630514144897461, "global_step": 107176, "epoch": 637} {"train_loss": -9.683242797851562, "global_step": 107177, "epoch": 637} {"train_loss": -9.87582015991211, "global_step": 107178, "epoch": 637} {"train_loss": -9.720940589904785, "global_step": 107179, "epoch": 637} {"train_loss": -10.082975387573242, "global_step": 107180, "epoch": 637} {"train_loss": -9.86739730834961, "global_step": 107181, "epoch": 637} {"train_loss": -10.048148155212402, "global_step": 107182, "epoch": 637} {"train_loss": -9.796998898188273, "global_step": 107183, "epoch": 637, "val_loss": 207773.96875} {"train_loss": -9.969549179077148, "global_step": 107184, "epoch": 638} {"train_loss": -9.681465148925781, "global_step": 107185, "epoch": 638} {"train_loss": -10.102115631103516, "global_step": 107186, "epoch": 638} {"train_loss": -10.02185344696045, "global_step": 107187, "epoch": 638} {"train_loss": -9.99288558959961, "global_step": 107188, "epoch": 638} {"train_loss": -10.003082275390625, "global_step": 107189, "epoch": 638} {"train_loss": -10.017430305480957, "global_step": 107190, "epoch": 638} {"train_loss": -10.04610538482666, "global_step": 107191, "epoch": 638} {"train_loss": -9.959794998168945, "global_step": 107192, "epoch": 638} {"train_loss": -10.0357666015625, "global_step": 107193, "epoch": 638} {"train_loss": -9.856571197509766, "global_step": 107194, "epoch": 638} {"train_loss": -9.877869606018066, "global_step": 107195, "epoch": 638} {"train_loss": -9.833352088928223, "global_step": 107196, "epoch": 638} {"train_loss": -9.991926193237305, "global_step": 107197, "epoch": 638} {"train_loss": -9.687419891357422, "global_step": 107198, "epoch": 638} {"train_loss": -9.767586708068848, "global_step": 107199, "epoch": 638} {"train_loss": -9.999996185302734, "global_step": 107200, "epoch": 638} {"train_loss": -10.157156944274902, "global_step": 107201, "epoch": 638} {"train_loss": -9.605069160461426, "global_step": 107202, "epoch": 638} {"train_loss": -10.197879791259766, "global_step": 107203, "epoch": 638} {"train_loss": -9.936590194702148, "global_step": 107204, "epoch": 638} {"train_loss": -10.022124290466309, "global_step": 107205, "epoch": 638} {"train_loss": -10.214742660522461, "global_step": 107206, "epoch": 638} {"train_loss": -10.027941703796387, "global_step": 107207, "epoch": 638} {"train_loss": -10.039604187011719, "global_step": 107208, "epoch": 638} {"train_loss": -9.68575668334961, "global_step": 107209, "epoch": 638} {"train_loss": -9.585071563720703, "global_step": 107210, "epoch": 638} {"train_loss": -9.973299026489258, "global_step": 107211, "epoch": 638} {"train_loss": -9.608999252319336, "global_step": 107212, "epoch": 638} {"train_loss": -9.968473434448242, "global_step": 107213, "epoch": 638} {"train_loss": -9.646020889282227, "global_step": 107214, "epoch": 638} {"train_loss": -9.612783432006836, "global_step": 107215, "epoch": 638} {"train_loss": -9.678634643554688, "global_step": 107216, "epoch": 638} {"train_loss": -9.84421157836914, "global_step": 107217, "epoch": 638} {"train_loss": -9.751399993896484, "global_step": 107218, "epoch": 638} {"train_loss": -10.0874662399292, "global_step": 107219, "epoch": 638} {"train_loss": -10.105051040649414, "global_step": 107220, "epoch": 638} {"train_loss": -9.933893203735352, "global_step": 107221, "epoch": 638} {"train_loss": -9.973973274230957, "global_step": 107222, "epoch": 638} {"train_loss": -9.800477027893066, "global_step": 107223, "epoch": 638} {"train_loss": -9.565754890441895, "global_step": 107224, "epoch": 638} {"train_loss": -9.718839645385742, "global_step": 107225, "epoch": 638} {"train_loss": -10.06583309173584, "global_step": 107226, "epoch": 638} {"train_loss": -9.912556648254395, "global_step": 107227, "epoch": 638} {"train_loss": -9.988954544067383, "global_step": 107228, "epoch": 638} {"train_loss": -10.159126281738281, "global_step": 107229, "epoch": 638} {"train_loss": -9.740198135375977, "global_step": 107230, "epoch": 638} {"train_loss": -9.93901538848877, "global_step": 107231, "epoch": 638} {"train_loss": -9.715816497802734, "global_step": 107232, "epoch": 638} {"train_loss": -9.775760650634766, "global_step": 107233, "epoch": 638} {"train_loss": -9.740992546081543, "global_step": 107234, "epoch": 638} {"train_loss": -9.63911247253418, "global_step": 107235, "epoch": 638} {"train_loss": -9.868293762207031, "global_step": 107236, "epoch": 638} {"train_loss": -9.7857027053833, "global_step": 107237, "epoch": 638} {"train_loss": -9.663064956665039, "global_step": 107238, "epoch": 638} {"train_loss": -9.689536094665527, "global_step": 107239, "epoch": 638} {"train_loss": -9.206062316894531, "global_step": 107240, "epoch": 638} {"train_loss": -10.069231033325195, "global_step": 107241, "epoch": 638} {"train_loss": -9.715115547180176, "global_step": 107242, "epoch": 638} {"train_loss": -9.950501441955566, "global_step": 107243, "epoch": 638} {"train_loss": -9.859349250793457, "global_step": 107244, "epoch": 638} {"train_loss": -9.693378448486328, "global_step": 107245, "epoch": 638} {"train_loss": -9.714160919189453, "global_step": 107246, "epoch": 638} {"train_loss": -9.524005889892578, "global_step": 107247, "epoch": 638} {"train_loss": -9.743952751159668, "global_step": 107248, "epoch": 638} {"train_loss": -9.696758270263672, "global_step": 107249, "epoch": 638} {"train_loss": -9.912673950195312, "global_step": 107250, "epoch": 638} {"train_loss": -9.323958396911621, "global_step": 107251, "epoch": 638} {"train_loss": -9.98346996307373, "global_step": 107252, "epoch": 638} {"train_loss": -9.44578742980957, "global_step": 107253, "epoch": 638} {"train_loss": -9.711057662963867, "global_step": 107254, "epoch": 638} {"train_loss": -9.541450500488281, "global_step": 107255, "epoch": 638} {"train_loss": -9.654349327087402, "global_step": 107256, "epoch": 638} {"train_loss": -9.417045593261719, "global_step": 107257, "epoch": 638} {"train_loss": -9.848091125488281, "global_step": 107258, "epoch": 638} {"train_loss": -9.457927703857422, "global_step": 107259, "epoch": 638} {"train_loss": -9.476631164550781, "global_step": 107260, "epoch": 638} {"train_loss": -9.527924537658691, "global_step": 107261, "epoch": 638} {"train_loss": -9.31483268737793, "global_step": 107262, "epoch": 638} {"train_loss": -9.549263000488281, "global_step": 107263, "epoch": 638} {"train_loss": -9.740499496459961, "global_step": 107264, "epoch": 638} {"train_loss": -9.499610900878906, "global_step": 107265, "epoch": 638} {"train_loss": -9.682929992675781, "global_step": 107266, "epoch": 638} {"train_loss": -9.773431777954102, "global_step": 107267, "epoch": 638} {"train_loss": -9.924568176269531, "global_step": 107268, "epoch": 638} {"train_loss": -9.65650463104248, "global_step": 107269, "epoch": 638} {"train_loss": -9.745657920837402, "global_step": 107270, "epoch": 638} {"train_loss": -9.425958633422852, "global_step": 107271, "epoch": 638} {"train_loss": -9.983389854431152, "global_step": 107272, "epoch": 638} {"train_loss": -9.556411743164062, "global_step": 107273, "epoch": 638} {"train_loss": -10.08899211883545, "global_step": 107274, "epoch": 638} {"train_loss": -9.632135391235352, "global_step": 107275, "epoch": 638} {"train_loss": -9.840197563171387, "global_step": 107276, "epoch": 638} {"train_loss": -9.695892333984375, "global_step": 107277, "epoch": 638} {"train_loss": -9.825789451599121, "global_step": 107278, "epoch": 638} {"train_loss": -9.660928726196289, "global_step": 107279, "epoch": 638} {"train_loss": -9.417791366577148, "global_step": 107280, "epoch": 638} {"train_loss": -10.127365112304688, "global_step": 107281, "epoch": 638} {"train_loss": -9.906145095825195, "global_step": 107282, "epoch": 638} {"train_loss": -9.836888313293457, "global_step": 107283, "epoch": 638} {"train_loss": -9.463510513305664, "global_step": 107284, "epoch": 638} {"train_loss": -9.83542537689209, "global_step": 107285, "epoch": 638} {"train_loss": -9.81224250793457, "global_step": 107286, "epoch": 638} {"train_loss": -9.847599029541016, "global_step": 107287, "epoch": 638} {"train_loss": -9.853590965270996, "global_step": 107288, "epoch": 638} {"train_loss": -9.740362167358398, "global_step": 107289, "epoch": 638} {"train_loss": -10.106949806213379, "global_step": 107290, "epoch": 638} {"train_loss": -9.742673873901367, "global_step": 107291, "epoch": 638} {"train_loss": -9.741646766662598, "global_step": 107292, "epoch": 638} {"train_loss": -9.682148933410645, "global_step": 107293, "epoch": 638} {"train_loss": -9.704570770263672, "global_step": 107294, "epoch": 638} {"train_loss": -9.9454984664917, "global_step": 107295, "epoch": 638} {"train_loss": -9.907085418701172, "global_step": 107296, "epoch": 638} {"train_loss": -10.084659576416016, "global_step": 107297, "epoch": 638} {"train_loss": -9.795553207397461, "global_step": 107298, "epoch": 638} {"train_loss": -10.103198051452637, "global_step": 107299, "epoch": 638} {"train_loss": -9.564157485961914, "global_step": 107300, "epoch": 638} {"train_loss": -9.74479866027832, "global_step": 107301, "epoch": 638} {"train_loss": -9.896232604980469, "global_step": 107302, "epoch": 638} {"train_loss": -9.931347846984863, "global_step": 107303, "epoch": 638} {"train_loss": -9.87374496459961, "global_step": 107304, "epoch": 638} {"train_loss": -9.915706634521484, "global_step": 107305, "epoch": 638} {"train_loss": -9.973976135253906, "global_step": 107306, "epoch": 638} {"train_loss": -10.012516021728516, "global_step": 107307, "epoch": 638} {"train_loss": -9.618042945861816, "global_step": 107308, "epoch": 638} {"train_loss": -10.001924514770508, "global_step": 107309, "epoch": 638} {"train_loss": -9.761040687561035, "global_step": 107310, "epoch": 638} {"train_loss": -10.298933029174805, "global_step": 107311, "epoch": 638} {"train_loss": -9.633323669433594, "global_step": 107312, "epoch": 638} {"train_loss": -9.929128646850586, "global_step": 107313, "epoch": 638} {"train_loss": -9.920797348022461, "global_step": 107314, "epoch": 638} {"train_loss": -9.795177459716797, "global_step": 107315, "epoch": 638} {"train_loss": -9.945934295654297, "global_step": 107316, "epoch": 638} {"train_loss": -9.626333236694336, "global_step": 107317, "epoch": 638} {"train_loss": -9.891109466552734, "global_step": 107318, "epoch": 638} {"train_loss": -9.580083847045898, "global_step": 107319, "epoch": 638} {"train_loss": -9.774856567382812, "global_step": 107320, "epoch": 638} {"train_loss": -9.910518646240234, "global_step": 107321, "epoch": 638} {"train_loss": -9.869501113891602, "global_step": 107322, "epoch": 638} {"train_loss": -9.900887489318848, "global_step": 107323, "epoch": 638} {"train_loss": -9.83306884765625, "global_step": 107324, "epoch": 638} {"train_loss": -9.960592269897461, "global_step": 107325, "epoch": 638} {"train_loss": -10.134193420410156, "global_step": 107326, "epoch": 638} {"train_loss": -9.842390060424805, "global_step": 107327, "epoch": 638} {"train_loss": -9.865559577941895, "global_step": 107328, "epoch": 638} {"train_loss": -10.15268611907959, "global_step": 107329, "epoch": 638} {"train_loss": -9.820021629333496, "global_step": 107330, "epoch": 638} {"train_loss": -10.01484489440918, "global_step": 107331, "epoch": 638} {"train_loss": -10.247825622558594, "global_step": 107332, "epoch": 638} {"train_loss": -9.897798538208008, "global_step": 107333, "epoch": 638} {"train_loss": -9.774778366088867, "global_step": 107334, "epoch": 638} {"train_loss": -9.949018478393555, "global_step": 107335, "epoch": 638} {"train_loss": -9.806110382080078, "global_step": 107336, "epoch": 638} {"train_loss": -9.617706298828125, "global_step": 107337, "epoch": 638} {"train_loss": -10.004039764404297, "global_step": 107338, "epoch": 638} {"train_loss": -9.909149169921875, "global_step": 107339, "epoch": 638} {"train_loss": -9.632177352905273, "global_step": 107340, "epoch": 638} {"train_loss": -10.069826126098633, "global_step": 107341, "epoch": 638} {"train_loss": -9.76171875, "global_step": 107342, "epoch": 638} {"train_loss": -10.13599681854248, "global_step": 107343, "epoch": 638} {"train_loss": -9.825862884521484, "global_step": 107344, "epoch": 638} {"train_loss": -9.809324264526367, "global_step": 107345, "epoch": 638} {"train_loss": -9.847650527954102, "global_step": 107346, "epoch": 638} {"train_loss": -9.850178718566895, "global_step": 107347, "epoch": 638} {"train_loss": -9.829524040222168, "global_step": 107348, "epoch": 638} {"train_loss": -10.09156322479248, "global_step": 107349, "epoch": 638} {"train_loss": -9.705907821655273, "global_step": 107350, "epoch": 638} {"train_loss": -9.826495380628677, "global_step": 107351, "epoch": 638, "val_loss": 209691.625} {"train_loss": -9.916414260864258, "global_step": 107352, "epoch": 639} {"train_loss": -9.829166412353516, "global_step": 107353, "epoch": 639} {"train_loss": -9.769474029541016, "global_step": 107354, "epoch": 639} {"train_loss": -10.170073509216309, "global_step": 107355, "epoch": 639} {"train_loss": -9.740312576293945, "global_step": 107356, "epoch": 639} {"train_loss": -9.931079864501953, "global_step": 107357, "epoch": 639} {"train_loss": -9.965574264526367, "global_step": 107358, "epoch": 639} {"train_loss": -9.643186569213867, "global_step": 107359, "epoch": 639} {"train_loss": -9.945767402648926, "global_step": 107360, "epoch": 639} {"train_loss": -10.091480255126953, "global_step": 107361, "epoch": 639} {"train_loss": -10.015642166137695, "global_step": 107362, "epoch": 639} {"train_loss": -10.031326293945312, "global_step": 107363, "epoch": 639} {"train_loss": -9.905313491821289, "global_step": 107364, "epoch": 639} {"train_loss": -10.116104125976562, "global_step": 107365, "epoch": 639} {"train_loss": -9.900055885314941, "global_step": 107366, "epoch": 639} {"train_loss": -9.939604759216309, "global_step": 107367, "epoch": 639} {"train_loss": -9.549585342407227, "global_step": 107368, "epoch": 639} {"train_loss": -10.01683235168457, "global_step": 107369, "epoch": 639} {"train_loss": -9.666181564331055, "global_step": 107370, "epoch": 639} {"train_loss": -10.142339706420898, "global_step": 107371, "epoch": 639} {"train_loss": -10.053339004516602, "global_step": 107372, "epoch": 639} {"train_loss": -9.611644744873047, "global_step": 107373, "epoch": 639} {"train_loss": -10.075946807861328, "global_step": 107374, "epoch": 639} {"train_loss": -10.026769638061523, "global_step": 107375, "epoch": 639} {"train_loss": -9.661412239074707, "global_step": 107376, "epoch": 639} {"train_loss": -10.101318359375, "global_step": 107377, "epoch": 639} {"train_loss": -9.866290092468262, "global_step": 107378, "epoch": 639} {"train_loss": -10.044282913208008, "global_step": 107379, "epoch": 639} {"train_loss": -10.02691650390625, "global_step": 107380, "epoch": 639} {"train_loss": -10.095969200134277, "global_step": 107381, "epoch": 639} {"train_loss": -9.87263298034668, "global_step": 107382, "epoch": 639} {"train_loss": -10.073436737060547, "global_step": 107383, "epoch": 639} {"train_loss": -10.035971641540527, "global_step": 107384, "epoch": 639} {"train_loss": -10.100746154785156, "global_step": 107385, "epoch": 639} {"train_loss": -10.007229804992676, "global_step": 107386, "epoch": 639} {"train_loss": -9.848259925842285, "global_step": 107387, "epoch": 639} {"train_loss": -10.02524185180664, "global_step": 107388, "epoch": 639} {"train_loss": -10.016196250915527, "global_step": 107389, "epoch": 639} {"train_loss": -9.907182693481445, "global_step": 107390, "epoch": 639} {"train_loss": -10.226639747619629, "global_step": 107391, "epoch": 639} {"train_loss": -10.387968063354492, "global_step": 107392, "epoch": 639} {"train_loss": -10.186910629272461, "global_step": 107393, "epoch": 639} {"train_loss": -10.050638198852539, "global_step": 107394, "epoch": 639} {"train_loss": -9.656981468200684, "global_step": 107395, "epoch": 639} {"train_loss": -10.056570053100586, "global_step": 107396, "epoch": 639} {"train_loss": -9.66673469543457, "global_step": 107397, "epoch": 639} {"train_loss": -9.359960556030273, "global_step": 107398, "epoch": 639} {"train_loss": -9.635677337646484, "global_step": 107399, "epoch": 639} {"train_loss": -9.600618362426758, "global_step": 107400, "epoch": 639} {"train_loss": -9.6986722946167, "global_step": 107401, "epoch": 639} {"train_loss": -10.028589248657227, "global_step": 107402, "epoch": 639} {"train_loss": -9.617472648620605, "global_step": 107403, "epoch": 639} {"train_loss": -9.650345802307129, "global_step": 107404, "epoch": 639} {"train_loss": -9.950925827026367, "global_step": 107405, "epoch": 639} {"train_loss": -9.835914611816406, "global_step": 107406, "epoch": 639} {"train_loss": -9.747495651245117, "global_step": 107407, "epoch": 639} {"train_loss": -9.854467391967773, "global_step": 107408, "epoch": 639} {"train_loss": -9.983207702636719, "global_step": 107409, "epoch": 639} {"train_loss": -9.808380126953125, "global_step": 107410, "epoch": 639} {"train_loss": -9.896369934082031, "global_step": 107411, "epoch": 639} {"train_loss": -10.065616607666016, "global_step": 107412, "epoch": 639} {"train_loss": -9.71755313873291, "global_step": 107413, "epoch": 639} {"train_loss": -9.92819595336914, "global_step": 107414, "epoch": 639} {"train_loss": -9.932445526123047, "global_step": 107415, "epoch": 639} {"train_loss": -10.07640266418457, "global_step": 107416, "epoch": 639} {"train_loss": -9.50870132446289, "global_step": 107417, "epoch": 639} {"train_loss": -9.804601669311523, "global_step": 107418, "epoch": 639} {"train_loss": -9.472960472106934, "global_step": 107419, "epoch": 639} {"train_loss": -9.96851634979248, "global_step": 107420, "epoch": 639} {"train_loss": -9.606176376342773, "global_step": 107421, "epoch": 639} {"train_loss": -9.694547653198242, "global_step": 107422, "epoch": 639} {"train_loss": -9.468551635742188, "global_step": 107423, "epoch": 639} {"train_loss": -9.57160472869873, "global_step": 107424, "epoch": 639} {"train_loss": -9.390836715698242, "global_step": 107425, "epoch": 639} {"train_loss": -9.484041213989258, "global_step": 107426, "epoch": 639} {"train_loss": -9.48959732055664, "global_step": 107427, "epoch": 639} {"train_loss": -9.629484176635742, "global_step": 107428, "epoch": 639} {"train_loss": -9.526327133178711, "global_step": 107429, "epoch": 639} {"train_loss": -9.768671989440918, "global_step": 107430, "epoch": 639} {"train_loss": -9.848697662353516, "global_step": 107431, "epoch": 639} {"train_loss": -9.975578308105469, "global_step": 107432, "epoch": 639} {"train_loss": -9.692253112792969, "global_step": 107433, "epoch": 639} {"train_loss": -9.940179824829102, "global_step": 107434, "epoch": 639} {"train_loss": -9.617795944213867, "global_step": 107435, "epoch": 639} {"train_loss": -9.699453353881836, "global_step": 107436, "epoch": 639} {"train_loss": -9.737279891967773, "global_step": 107437, "epoch": 639} {"train_loss": -9.848865509033203, "global_step": 107438, "epoch": 639} {"train_loss": -9.681230545043945, "global_step": 107439, "epoch": 639} {"train_loss": -10.060685157775879, "global_step": 107440, "epoch": 639} {"train_loss": -9.587672233581543, "global_step": 107441, "epoch": 639} {"train_loss": -9.89882755279541, "global_step": 107442, "epoch": 639} {"train_loss": -9.691832542419434, "global_step": 107443, "epoch": 639} {"train_loss": -9.83470344543457, "global_step": 107444, "epoch": 639} {"train_loss": -9.622441291809082, "global_step": 107445, "epoch": 639} {"train_loss": -9.945590019226074, "global_step": 107446, "epoch": 639} {"train_loss": -9.509807586669922, "global_step": 107447, "epoch": 639} {"train_loss": -9.885970115661621, "global_step": 107448, "epoch": 639} {"train_loss": -9.797952651977539, "global_step": 107449, "epoch": 639} {"train_loss": -9.55002212524414, "global_step": 107450, "epoch": 639} {"train_loss": -9.7576904296875, "global_step": 107451, "epoch": 639} {"train_loss": -10.126096725463867, "global_step": 107452, "epoch": 639} {"train_loss": -9.87511157989502, "global_step": 107453, "epoch": 639} {"train_loss": -9.655285835266113, "global_step": 107454, "epoch": 639} {"train_loss": -9.793997764587402, "global_step": 107455, "epoch": 639} {"train_loss": -10.06014633178711, "global_step": 107456, "epoch": 639} {"train_loss": -9.97880744934082, "global_step": 107457, "epoch": 639} {"train_loss": -9.999357223510742, "global_step": 107458, "epoch": 639} {"train_loss": -9.919720649719238, "global_step": 107459, "epoch": 639} {"train_loss": -9.734615325927734, "global_step": 107460, "epoch": 639} {"train_loss": -9.9371337890625, "global_step": 107461, "epoch": 639} {"train_loss": -9.737360000610352, "global_step": 107462, "epoch": 639} {"train_loss": -9.978193283081055, "global_step": 107463, "epoch": 639} {"train_loss": -9.761951446533203, "global_step": 107464, "epoch": 639} {"train_loss": -9.962624549865723, "global_step": 107465, "epoch": 639} {"train_loss": -9.689212799072266, "global_step": 107466, "epoch": 639} {"train_loss": -10.065831184387207, "global_step": 107467, "epoch": 639} {"train_loss": -9.735576629638672, "global_step": 107468, "epoch": 639} {"train_loss": -9.188633918762207, "global_step": 107469, "epoch": 639} {"train_loss": -9.838449478149414, "global_step": 107470, "epoch": 639} {"train_loss": -9.380329132080078, "global_step": 107471, "epoch": 639} {"train_loss": -9.6729154586792, "global_step": 107472, "epoch": 639} {"train_loss": -9.456600189208984, "global_step": 107473, "epoch": 639} {"train_loss": -9.905858993530273, "global_step": 107474, "epoch": 639} {"train_loss": -9.483656883239746, "global_step": 107475, "epoch": 639} {"train_loss": -9.952657699584961, "global_step": 107476, "epoch": 639} {"train_loss": -9.085871696472168, "global_step": 107477, "epoch": 639} {"train_loss": -9.732170104980469, "global_step": 107478, "epoch": 639} {"train_loss": -9.40748405456543, "global_step": 107479, "epoch": 639} {"train_loss": -9.71395492553711, "global_step": 107480, "epoch": 639} {"train_loss": -9.619674682617188, "global_step": 107481, "epoch": 639} {"train_loss": -9.6563138961792, "global_step": 107482, "epoch": 639} {"train_loss": -9.655373573303223, "global_step": 107483, "epoch": 639} {"train_loss": -9.808601379394531, "global_step": 107484, "epoch": 639} {"train_loss": -9.687843322753906, "global_step": 107485, "epoch": 639} {"train_loss": -9.383835792541504, "global_step": 107486, "epoch": 639} {"train_loss": -9.814408302307129, "global_step": 107487, "epoch": 639} {"train_loss": -9.982561111450195, "global_step": 107488, "epoch": 639} {"train_loss": -9.483598709106445, "global_step": 107489, "epoch": 639} {"train_loss": -9.794281959533691, "global_step": 107490, "epoch": 639} {"train_loss": -9.55831527709961, "global_step": 107491, "epoch": 639} {"train_loss": -9.823502540588379, "global_step": 107492, "epoch": 639} {"train_loss": -9.785001754760742, "global_step": 107493, "epoch": 639} {"train_loss": -9.721562385559082, "global_step": 107494, "epoch": 639} {"train_loss": -9.958481788635254, "global_step": 107495, "epoch": 639} {"train_loss": -9.987540245056152, "global_step": 107496, "epoch": 639} {"train_loss": -9.830488204956055, "global_step": 107497, "epoch": 639} {"train_loss": -10.057435989379883, "global_step": 107498, "epoch": 639} {"train_loss": -9.9181547164917, "global_step": 107499, "epoch": 639} {"train_loss": -9.444464683532715, "global_step": 107500, "epoch": 639} {"train_loss": -9.904272079467773, "global_step": 107501, "epoch": 639} {"train_loss": -9.565479278564453, "global_step": 107502, "epoch": 639} {"train_loss": -10.133268356323242, "global_step": 107503, "epoch": 639} {"train_loss": -9.775113105773926, "global_step": 107504, "epoch": 639} {"train_loss": -9.858231544494629, "global_step": 107505, "epoch": 639} {"train_loss": -10.077835083007812, "global_step": 107506, "epoch": 639} {"train_loss": -9.996735572814941, "global_step": 107507, "epoch": 639} {"train_loss": -9.961055755615234, "global_step": 107508, "epoch": 639} {"train_loss": -9.768217086791992, "global_step": 107509, "epoch": 639} {"train_loss": -10.062599182128906, "global_step": 107510, "epoch": 639} {"train_loss": -9.962172508239746, "global_step": 107511, "epoch": 639} {"train_loss": -10.141266822814941, "global_step": 107512, "epoch": 639} {"train_loss": -10.038331985473633, "global_step": 107513, "epoch": 639} {"train_loss": -10.178089141845703, "global_step": 107514, "epoch": 639} {"train_loss": -10.10078239440918, "global_step": 107515, "epoch": 639} {"train_loss": -9.964942932128906, "global_step": 107516, "epoch": 639} {"train_loss": -10.361599922180176, "global_step": 107517, "epoch": 639} {"train_loss": -10.270715713500977, "global_step": 107518, "epoch": 639} {"train_loss": -9.83447497799283, "global_step": 107519, "epoch": 639, "val_loss": 208547.171875} {"train_loss": -10.266143798828125, "global_step": 107520, "epoch": 640} {"train_loss": -9.914749145507812, "global_step": 107521, "epoch": 640} {"train_loss": -10.214095115661621, "global_step": 107522, "epoch": 640} {"train_loss": -9.769489288330078, "global_step": 107523, "epoch": 640} {"train_loss": -9.741373062133789, "global_step": 107524, "epoch": 640} {"train_loss": -9.922812461853027, "global_step": 107525, "epoch": 640} {"train_loss": -9.74531364440918, "global_step": 107526, "epoch": 640} {"train_loss": -10.054208755493164, "global_step": 107527, "epoch": 640} {"train_loss": -9.877939224243164, "global_step": 107528, "epoch": 640} {"train_loss": -9.757280349731445, "global_step": 107529, "epoch": 640} {"train_loss": -10.063592910766602, "global_step": 107530, "epoch": 640} {"train_loss": -9.560993194580078, "global_step": 107531, "epoch": 640} {"train_loss": -9.23500919342041, "global_step": 107532, "epoch": 640} {"train_loss": -9.676778793334961, "global_step": 107533, "epoch": 640} {"train_loss": -9.375358581542969, "global_step": 107534, "epoch": 640} {"train_loss": -9.952842712402344, "global_step": 107535, "epoch": 640} {"train_loss": -8.756026268005371, "global_step": 107536, "epoch": 640} {"train_loss": -9.502274513244629, "global_step": 107537, "epoch": 640} {"train_loss": -8.797130584716797, "global_step": 107538, "epoch": 640} {"train_loss": -9.748634338378906, "global_step": 107539, "epoch": 640} {"train_loss": -8.752784729003906, "global_step": 107540, "epoch": 640} {"train_loss": -9.686360359191895, "global_step": 107541, "epoch": 640} {"train_loss": -9.160625457763672, "global_step": 107542, "epoch": 640} {"train_loss": -9.169309616088867, "global_step": 107543, "epoch": 640} {"train_loss": -9.64059066772461, "global_step": 107544, "epoch": 640} {"train_loss": -9.287759780883789, "global_step": 107545, "epoch": 640} {"train_loss": -9.479183197021484, "global_step": 107546, "epoch": 640} {"train_loss": -8.775753021240234, "global_step": 107547, "epoch": 640} {"train_loss": -9.357446670532227, "global_step": 107548, "epoch": 640} {"train_loss": -9.486335754394531, "global_step": 107549, "epoch": 640} {"train_loss": -9.017984390258789, "global_step": 107550, "epoch": 640} {"train_loss": -9.28274917602539, "global_step": 107551, "epoch": 640} {"train_loss": -9.354982376098633, "global_step": 107552, "epoch": 640} {"train_loss": -9.00394344329834, "global_step": 107553, "epoch": 640} {"train_loss": -9.761200904846191, "global_step": 107554, "epoch": 640} {"train_loss": -9.131404876708984, "global_step": 107555, "epoch": 640} {"train_loss": -9.250178337097168, "global_step": 107556, "epoch": 640} {"train_loss": -9.561777114868164, "global_step": 107557, "epoch": 640} {"train_loss": -9.604841232299805, "global_step": 107558, "epoch": 640} {"train_loss": -9.442304611206055, "global_step": 107559, "epoch": 640} {"train_loss": -9.476815223693848, "global_step": 107560, "epoch": 640} {"train_loss": -9.55387020111084, "global_step": 107561, "epoch": 640} {"train_loss": -9.37938404083252, "global_step": 107562, "epoch": 640} {"train_loss": -9.582359313964844, "global_step": 107563, "epoch": 640} {"train_loss": -9.233200073242188, "global_step": 107564, "epoch": 640} {"train_loss": -9.524606704711914, "global_step": 107565, "epoch": 640} {"train_loss": -9.591588973999023, "global_step": 107566, "epoch": 640} {"train_loss": -9.361288070678711, "global_step": 107567, "epoch": 640} {"train_loss": -9.587190628051758, "global_step": 107568, "epoch": 640} {"train_loss": -9.5787353515625, "global_step": 107569, "epoch": 640} {"train_loss": -9.699913024902344, "global_step": 107570, "epoch": 640} {"train_loss": -9.728411674499512, "global_step": 107571, "epoch": 640} {"train_loss": -9.608194351196289, "global_step": 107572, "epoch": 640} {"train_loss": -9.821931838989258, "global_step": 107573, "epoch": 640} {"train_loss": -9.976187705993652, "global_step": 107574, "epoch": 640} {"train_loss": -9.647001266479492, "global_step": 107575, "epoch": 640} {"train_loss": -9.798744201660156, "global_step": 107576, "epoch": 640} {"train_loss": -9.784841537475586, "global_step": 107577, "epoch": 640} {"train_loss": -9.714970588684082, "global_step": 107578, "epoch": 640} {"train_loss": -9.818077087402344, "global_step": 107579, "epoch": 640} {"train_loss": -9.61665153503418, "global_step": 107580, "epoch": 640} {"train_loss": -9.998111724853516, "global_step": 107581, "epoch": 640} {"train_loss": -9.931526184082031, "global_step": 107582, "epoch": 640} {"train_loss": -9.960819244384766, "global_step": 107583, "epoch": 640} {"train_loss": -10.123170852661133, "global_step": 107584, "epoch": 640} {"train_loss": -9.91008186340332, "global_step": 107585, "epoch": 640} {"train_loss": -10.14645767211914, "global_step": 107586, "epoch": 640} {"train_loss": -9.787435531616211, "global_step": 107587, "epoch": 640} {"train_loss": -9.879140853881836, "global_step": 107588, "epoch": 640} {"train_loss": -9.993721008300781, "global_step": 107589, "epoch": 640} {"train_loss": -10.008535385131836, "global_step": 107590, "epoch": 640} {"train_loss": -10.12840747833252, "global_step": 107591, "epoch": 640} {"train_loss": -9.997814178466797, "global_step": 107592, "epoch": 640} {"train_loss": -10.081531524658203, "global_step": 107593, "epoch": 640} {"train_loss": -10.267007827758789, "global_step": 107594, "epoch": 640} {"train_loss": -10.16062068939209, "global_step": 107595, "epoch": 640} {"train_loss": -9.949621200561523, "global_step": 107596, "epoch": 640} {"train_loss": -10.236400604248047, "global_step": 107597, "epoch": 640} {"train_loss": -10.22158432006836, "global_step": 107598, "epoch": 640} {"train_loss": -10.03464126586914, "global_step": 107599, "epoch": 640} {"train_loss": -9.880315780639648, "global_step": 107600, "epoch": 640} {"train_loss": -10.109073638916016, "global_step": 107601, "epoch": 640} {"train_loss": -9.894987106323242, "global_step": 107602, "epoch": 640} {"train_loss": -9.50543212890625, "global_step": 107603, "epoch": 640} {"train_loss": -9.243073463439941, "global_step": 107604, "epoch": 640} {"train_loss": -9.82165813446045, "global_step": 107605, "epoch": 640} {"train_loss": -8.980928421020508, "global_step": 107606, "epoch": 640} {"train_loss": -9.522499084472656, "global_step": 107607, "epoch": 640} {"train_loss": -9.471680641174316, "global_step": 107608, "epoch": 640} {"train_loss": -9.741717338562012, "global_step": 107609, "epoch": 640} {"train_loss": -9.476383209228516, "global_step": 107610, "epoch": 640} {"train_loss": -9.059236526489258, "global_step": 107611, "epoch": 640} {"train_loss": -9.570256233215332, "global_step": 107612, "epoch": 640} {"train_loss": -9.38489818572998, "global_step": 107613, "epoch": 640} {"train_loss": -9.58359432220459, "global_step": 107614, "epoch": 640} {"train_loss": -9.602012634277344, "global_step": 107615, "epoch": 640} {"train_loss": -9.640844345092773, "global_step": 107616, "epoch": 640} {"train_loss": -9.40414810180664, "global_step": 107617, "epoch": 640} {"train_loss": -9.834716796875, "global_step": 107618, "epoch": 640} {"train_loss": -9.35875415802002, "global_step": 107619, "epoch": 640} {"train_loss": -9.692937850952148, "global_step": 107620, "epoch": 640} {"train_loss": -9.499750137329102, "global_step": 107621, "epoch": 640} {"train_loss": -9.659278869628906, "global_step": 107622, "epoch": 640} {"train_loss": -9.374765396118164, "global_step": 107623, "epoch": 640} {"train_loss": -9.81395435333252, "global_step": 107624, "epoch": 640} {"train_loss": -9.63371467590332, "global_step": 107625, "epoch": 640} {"train_loss": -9.673910140991211, "global_step": 107626, "epoch": 640} {"train_loss": -9.713516235351562, "global_step": 107627, "epoch": 640} {"train_loss": -9.824350357055664, "global_step": 107628, "epoch": 640} {"train_loss": -9.744675636291504, "global_step": 107629, "epoch": 640} {"train_loss": -9.75475025177002, "global_step": 107630, "epoch": 640} {"train_loss": -9.992488861083984, "global_step": 107631, "epoch": 640} {"train_loss": -9.81163215637207, "global_step": 107632, "epoch": 640} {"train_loss": -9.630500793457031, "global_step": 107633, "epoch": 640} {"train_loss": -9.63984203338623, "global_step": 107634, "epoch": 640} {"train_loss": -9.757135391235352, "global_step": 107635, "epoch": 640} {"train_loss": -9.589588165283203, "global_step": 107636, "epoch": 640} {"train_loss": -9.915014266967773, "global_step": 107637, "epoch": 640} {"train_loss": -9.914589881896973, "global_step": 107638, "epoch": 640} {"train_loss": -9.73031997680664, "global_step": 107639, "epoch": 640} {"train_loss": -9.948602676391602, "global_step": 107640, "epoch": 640} {"train_loss": -9.924002647399902, "global_step": 107641, "epoch": 640} {"train_loss": -9.904444694519043, "global_step": 107642, "epoch": 640} {"train_loss": -9.792218208312988, "global_step": 107643, "epoch": 640} {"train_loss": -10.156529426574707, "global_step": 107644, "epoch": 640} {"train_loss": -9.92084789276123, "global_step": 107645, "epoch": 640} {"train_loss": -9.849979400634766, "global_step": 107646, "epoch": 640} {"train_loss": -10.076464653015137, "global_step": 107647, "epoch": 640} {"train_loss": -9.967496871948242, "global_step": 107648, "epoch": 640} {"train_loss": -10.312803268432617, "global_step": 107649, "epoch": 640} {"train_loss": -10.04777717590332, "global_step": 107650, "epoch": 640} {"train_loss": -9.997295379638672, "global_step": 107651, "epoch": 640} {"train_loss": -9.933506965637207, "global_step": 107652, "epoch": 640} {"train_loss": -10.04047966003418, "global_step": 107653, "epoch": 640} {"train_loss": -10.158700942993164, "global_step": 107654, "epoch": 640} {"train_loss": -10.282247543334961, "global_step": 107655, "epoch": 640} {"train_loss": -9.935641288757324, "global_step": 107656, "epoch": 640} {"train_loss": -10.0935697555542, "global_step": 107657, "epoch": 640} {"train_loss": -10.105480194091797, "global_step": 107658, "epoch": 640} {"train_loss": -10.061845779418945, "global_step": 107659, "epoch": 640} {"train_loss": -10.173563003540039, "global_step": 107660, "epoch": 640} {"train_loss": -9.855218887329102, "global_step": 107661, "epoch": 640} {"train_loss": -10.130739212036133, "global_step": 107662, "epoch": 640} {"train_loss": -10.002443313598633, "global_step": 107663, "epoch": 640} {"train_loss": -10.395674705505371, "global_step": 107664, "epoch": 640} {"train_loss": -10.280874252319336, "global_step": 107665, "epoch": 640} {"train_loss": -9.739360809326172, "global_step": 107666, "epoch": 640} {"train_loss": -9.952534675598145, "global_step": 107667, "epoch": 640} {"train_loss": -10.068758010864258, "global_step": 107668, "epoch": 640} {"train_loss": -9.274538040161133, "global_step": 107669, "epoch": 640} {"train_loss": -9.944886207580566, "global_step": 107670, "epoch": 640} {"train_loss": -10.200020790100098, "global_step": 107671, "epoch": 640} {"train_loss": -9.758869171142578, "global_step": 107672, "epoch": 640} {"train_loss": -10.164854049682617, "global_step": 107673, "epoch": 640} {"train_loss": -9.553293228149414, "global_step": 107674, "epoch": 640} {"train_loss": -10.15633773803711, "global_step": 107675, "epoch": 640} {"train_loss": -9.607636451721191, "global_step": 107676, "epoch": 640} {"train_loss": -9.975370407104492, "global_step": 107677, "epoch": 640} {"train_loss": -9.685127258300781, "global_step": 107678, "epoch": 640} {"train_loss": -9.600637435913086, "global_step": 107679, "epoch": 640} {"train_loss": -9.850517272949219, "global_step": 107680, "epoch": 640} {"train_loss": -9.760540008544922, "global_step": 107681, "epoch": 640} {"train_loss": -10.023508071899414, "global_step": 107682, "epoch": 640} {"train_loss": -9.555231094360352, "global_step": 107683, "epoch": 640} {"train_loss": -9.881598472595215, "global_step": 107684, "epoch": 640} {"train_loss": -9.893658638000488, "global_step": 107685, "epoch": 640} {"train_loss": -9.918030738830566, "global_step": 107686, "epoch": 640} {"train_loss": -9.737740533692497, "global_step": 107687, "epoch": 640, "val_loss": 209627.40625, "train_action_mse_error": 2.043252468109131} {"train_loss": -9.866141319274902, "global_step": 107688, "epoch": 641} {"train_loss": -9.62092399597168, "global_step": 107689, "epoch": 641} {"train_loss": -9.518531799316406, "global_step": 107690, "epoch": 641} {"train_loss": -9.623876571655273, "global_step": 107691, "epoch": 641} {"train_loss": -9.763999938964844, "global_step": 107692, "epoch": 641} {"train_loss": -9.59840202331543, "global_step": 107693, "epoch": 641} {"train_loss": -9.707742691040039, "global_step": 107694, "epoch": 641} {"train_loss": -9.723088264465332, "global_step": 107695, "epoch": 641} {"train_loss": -9.57457160949707, "global_step": 107696, "epoch": 641} {"train_loss": -9.888030052185059, "global_step": 107697, "epoch": 641} {"train_loss": -9.817564964294434, "global_step": 107698, "epoch": 641} {"train_loss": -9.848228454589844, "global_step": 107699, "epoch": 641} {"train_loss": -9.8662109375, "global_step": 107700, "epoch": 641} {"train_loss": -9.855323791503906, "global_step": 107701, "epoch": 641} {"train_loss": -9.6209716796875, "global_step": 107702, "epoch": 641} {"train_loss": -9.707113265991211, "global_step": 107703, "epoch": 641} {"train_loss": -9.86655044555664, "global_step": 107704, "epoch": 641} {"train_loss": -10.136066436767578, "global_step": 107705, "epoch": 641} {"train_loss": -9.80337142944336, "global_step": 107706, "epoch": 641} {"train_loss": -9.853230476379395, "global_step": 107707, "epoch": 641} {"train_loss": -9.57364273071289, "global_step": 107708, "epoch": 641} {"train_loss": -10.006216049194336, "global_step": 107709, "epoch": 641} {"train_loss": -9.956421852111816, "global_step": 107710, "epoch": 641} {"train_loss": -9.942394256591797, "global_step": 107711, "epoch": 641} {"train_loss": -10.024563789367676, "global_step": 107712, "epoch": 641} {"train_loss": -9.727664947509766, "global_step": 107713, "epoch": 641} {"train_loss": -9.99927043914795, "global_step": 107714, "epoch": 641} {"train_loss": -9.878555297851562, "global_step": 107715, "epoch": 641} {"train_loss": -10.051328659057617, "global_step": 107716, "epoch": 641} {"train_loss": -10.011238098144531, "global_step": 107717, "epoch": 641} {"train_loss": -9.931821823120117, "global_step": 107718, "epoch": 641} {"train_loss": -9.875232696533203, "global_step": 107719, "epoch": 641} {"train_loss": -10.037759780883789, "global_step": 107720, "epoch": 641} {"train_loss": -10.180135726928711, "global_step": 107721, "epoch": 641} {"train_loss": -10.26137924194336, "global_step": 107722, "epoch": 641} {"train_loss": -10.016023635864258, "global_step": 107723, "epoch": 641} {"train_loss": -10.093901634216309, "global_step": 107724, "epoch": 641} {"train_loss": -10.193609237670898, "global_step": 107725, "epoch": 641} {"train_loss": -10.142072677612305, "global_step": 107726, "epoch": 641} {"train_loss": -9.74134635925293, "global_step": 107727, "epoch": 641} {"train_loss": -10.15603256225586, "global_step": 107728, "epoch": 641} {"train_loss": -9.872776985168457, "global_step": 107729, "epoch": 641} {"train_loss": -10.110664367675781, "global_step": 107730, "epoch": 641} {"train_loss": -10.08248233795166, "global_step": 107731, "epoch": 641} {"train_loss": -9.825056076049805, "global_step": 107732, "epoch": 641} {"train_loss": -10.067630767822266, "global_step": 107733, "epoch": 641} {"train_loss": -10.017803192138672, "global_step": 107734, "epoch": 641} {"train_loss": -9.670157432556152, "global_step": 107735, "epoch": 641} {"train_loss": -9.42514419555664, "global_step": 107736, "epoch": 641} {"train_loss": -10.150310516357422, "global_step": 107737, "epoch": 641} {"train_loss": -9.586156845092773, "global_step": 107738, "epoch": 641} {"train_loss": -9.918843269348145, "global_step": 107739, "epoch": 641} {"train_loss": -9.54227352142334, "global_step": 107740, "epoch": 641} {"train_loss": -9.484437942504883, "global_step": 107741, "epoch": 641} {"train_loss": -9.830196380615234, "global_step": 107742, "epoch": 641} {"train_loss": -9.783939361572266, "global_step": 107743, "epoch": 641} {"train_loss": -9.921966552734375, "global_step": 107744, "epoch": 641} {"train_loss": -9.694449424743652, "global_step": 107745, "epoch": 641} {"train_loss": -9.748245239257812, "global_step": 107746, "epoch": 641} {"train_loss": -9.768388748168945, "global_step": 107747, "epoch": 641} {"train_loss": -9.935501098632812, "global_step": 107748, "epoch": 641} {"train_loss": -9.345855712890625, "global_step": 107749, "epoch": 641} {"train_loss": -9.613119125366211, "global_step": 107750, "epoch": 641} {"train_loss": -10.086454391479492, "global_step": 107751, "epoch": 641} {"train_loss": -9.665501594543457, "global_step": 107752, "epoch": 641} {"train_loss": -9.931134223937988, "global_step": 107753, "epoch": 641} {"train_loss": -9.687408447265625, "global_step": 107754, "epoch": 641} {"train_loss": -9.857028007507324, "global_step": 107755, "epoch": 641} {"train_loss": -9.809226989746094, "global_step": 107756, "epoch": 641} {"train_loss": -9.770891189575195, "global_step": 107757, "epoch": 641} {"train_loss": -9.85529899597168, "global_step": 107758, "epoch": 641} {"train_loss": -9.965456008911133, "global_step": 107759, "epoch": 641} {"train_loss": -9.80754566192627, "global_step": 107760, "epoch": 641} {"train_loss": -9.877769470214844, "global_step": 107761, "epoch": 641} {"train_loss": -9.956913948059082, "global_step": 107762, "epoch": 641} {"train_loss": -10.07541275024414, "global_step": 107763, "epoch": 641} {"train_loss": -9.85589599609375, "global_step": 107764, "epoch": 641} {"train_loss": -9.993949890136719, "global_step": 107765, "epoch": 641} {"train_loss": -9.84670639038086, "global_step": 107766, "epoch": 641} {"train_loss": -9.842912673950195, "global_step": 107767, "epoch": 641} {"train_loss": -9.878591537475586, "global_step": 107768, "epoch": 641} {"train_loss": -9.5582914352417, "global_step": 107769, "epoch": 641} {"train_loss": -9.900108337402344, "global_step": 107770, "epoch": 641} {"train_loss": -9.512596130371094, "global_step": 107771, "epoch": 641} {"train_loss": -9.81527328491211, "global_step": 107772, "epoch": 641} {"train_loss": -9.831808090209961, "global_step": 107773, "epoch": 641} {"train_loss": -9.894231796264648, "global_step": 107774, "epoch": 641} {"train_loss": -9.731372833251953, "global_step": 107775, "epoch": 641} {"train_loss": -9.790313720703125, "global_step": 107776, "epoch": 641} {"train_loss": -9.57269287109375, "global_step": 107777, "epoch": 641} {"train_loss": -9.885108947753906, "global_step": 107778, "epoch": 641} {"train_loss": -9.620180130004883, "global_step": 107779, "epoch": 641} {"train_loss": -9.80350399017334, "global_step": 107780, "epoch": 641} {"train_loss": -10.039775848388672, "global_step": 107781, "epoch": 641} {"train_loss": -9.869135856628418, "global_step": 107782, "epoch": 641} {"train_loss": -9.96510124206543, "global_step": 107783, "epoch": 641} {"train_loss": -10.135293960571289, "global_step": 107784, "epoch": 641} {"train_loss": -9.934855461120605, "global_step": 107785, "epoch": 641} {"train_loss": -9.837181091308594, "global_step": 107786, "epoch": 641} {"train_loss": -10.008840560913086, "global_step": 107787, "epoch": 641} {"train_loss": -10.0463228225708, "global_step": 107788, "epoch": 641} {"train_loss": -10.083833694458008, "global_step": 107789, "epoch": 641} {"train_loss": -9.956099510192871, "global_step": 107790, "epoch": 641} {"train_loss": -10.279510498046875, "global_step": 107791, "epoch": 641} {"train_loss": -9.898795127868652, "global_step": 107792, "epoch": 641} {"train_loss": -9.897842407226562, "global_step": 107793, "epoch": 641} {"train_loss": -9.904256820678711, "global_step": 107794, "epoch": 641} {"train_loss": -10.084772109985352, "global_step": 107795, "epoch": 641} {"train_loss": -9.94930362701416, "global_step": 107796, "epoch": 641} {"train_loss": -9.996511459350586, "global_step": 107797, "epoch": 641} {"train_loss": -10.046915054321289, "global_step": 107798, "epoch": 641} {"train_loss": -9.651674270629883, "global_step": 107799, "epoch": 641} {"train_loss": -10.047019004821777, "global_step": 107800, "epoch": 641} {"train_loss": -9.82508659362793, "global_step": 107801, "epoch": 641} {"train_loss": -10.061861038208008, "global_step": 107802, "epoch": 641} {"train_loss": -9.884260177612305, "global_step": 107803, "epoch": 641} {"train_loss": -9.942825317382812, "global_step": 107804, "epoch": 641} {"train_loss": -10.157097816467285, "global_step": 107805, "epoch": 641} {"train_loss": -9.633134841918945, "global_step": 107806, "epoch": 641} {"train_loss": -10.13086223602295, "global_step": 107807, "epoch": 641} {"train_loss": -9.06527042388916, "global_step": 107808, "epoch": 641} {"train_loss": -9.579235076904297, "global_step": 107809, "epoch": 641} {"train_loss": -9.135766983032227, "global_step": 107810, "epoch": 641} {"train_loss": -9.67790412902832, "global_step": 107811, "epoch": 641} {"train_loss": -9.538366317749023, "global_step": 107812, "epoch": 641} {"train_loss": -9.802933692932129, "global_step": 107813, "epoch": 641} {"train_loss": -9.794469833374023, "global_step": 107814, "epoch": 641} {"train_loss": -9.531621932983398, "global_step": 107815, "epoch": 641} {"train_loss": -9.986494064331055, "global_step": 107816, "epoch": 641} {"train_loss": -9.72575855255127, "global_step": 107817, "epoch": 641} {"train_loss": -9.872804641723633, "global_step": 107818, "epoch": 641} {"train_loss": -9.685906410217285, "global_step": 107819, "epoch": 641} {"train_loss": -9.442055702209473, "global_step": 107820, "epoch": 641} {"train_loss": -9.285261154174805, "global_step": 107821, "epoch": 641} {"train_loss": -9.436164855957031, "global_step": 107822, "epoch": 641} {"train_loss": -9.351691246032715, "global_step": 107823, "epoch": 641} {"train_loss": -9.766833305358887, "global_step": 107824, "epoch": 641} {"train_loss": -9.622661590576172, "global_step": 107825, "epoch": 641} {"train_loss": -9.360641479492188, "global_step": 107826, "epoch": 641} {"train_loss": -9.738128662109375, "global_step": 107827, "epoch": 641} {"train_loss": -9.329658508300781, "global_step": 107828, "epoch": 641} {"train_loss": -9.317644119262695, "global_step": 107829, "epoch": 641} {"train_loss": -9.597545623779297, "global_step": 107830, "epoch": 641} {"train_loss": -9.644189834594727, "global_step": 107831, "epoch": 641} {"train_loss": -9.384239196777344, "global_step": 107832, "epoch": 641} {"train_loss": -9.612404823303223, "global_step": 107833, "epoch": 641} {"train_loss": -9.753817558288574, "global_step": 107834, "epoch": 641} {"train_loss": -9.706266403198242, "global_step": 107835, "epoch": 641} {"train_loss": -9.719148635864258, "global_step": 107836, "epoch": 641} {"train_loss": -9.845893859863281, "global_step": 107837, "epoch": 641} {"train_loss": -10.117864608764648, "global_step": 107838, "epoch": 641} {"train_loss": -9.756305694580078, "global_step": 107839, "epoch": 641} {"train_loss": -9.903982162475586, "global_step": 107840, "epoch": 641} {"train_loss": -9.909802436828613, "global_step": 107841, "epoch": 641} {"train_loss": -9.717570304870605, "global_step": 107842, "epoch": 641} {"train_loss": -9.842046737670898, "global_step": 107843, "epoch": 641} {"train_loss": -9.812332153320312, "global_step": 107844, "epoch": 641} {"train_loss": -9.895989418029785, "global_step": 107845, "epoch": 641} {"train_loss": -9.916618347167969, "global_step": 107846, "epoch": 641} {"train_loss": -10.085745811462402, "global_step": 107847, "epoch": 641} {"train_loss": -9.907475471496582, "global_step": 107848, "epoch": 641} {"train_loss": -9.84901237487793, "global_step": 107849, "epoch": 641} {"train_loss": -9.872617721557617, "global_step": 107850, "epoch": 641} {"train_loss": -9.697728157043457, "global_step": 107851, "epoch": 641} {"train_loss": -9.7457857131958, "global_step": 107852, "epoch": 641} {"train_loss": -9.594998359680176, "global_step": 107853, "epoch": 641} {"train_loss": -9.73017406463623, "global_step": 107854, "epoch": 641} {"train_loss": -9.81605427038102, "global_step": 107855, "epoch": 641, "val_loss": 208032.546875} {"train_loss": -9.972455978393555, "global_step": 107856, "epoch": 642} {"train_loss": -9.818460464477539, "global_step": 107857, "epoch": 642} {"train_loss": -9.754730224609375, "global_step": 107858, "epoch": 642} {"train_loss": -9.865636825561523, "global_step": 107859, "epoch": 642} {"train_loss": -9.752067565917969, "global_step": 107860, "epoch": 642} {"train_loss": -9.931100845336914, "global_step": 107861, "epoch": 642} {"train_loss": -9.659370422363281, "global_step": 107862, "epoch": 642} {"train_loss": -9.581591606140137, "global_step": 107863, "epoch": 642} {"train_loss": -9.605108261108398, "global_step": 107864, "epoch": 642} {"train_loss": -9.718716621398926, "global_step": 107865, "epoch": 642} {"train_loss": -9.59775161743164, "global_step": 107866, "epoch": 642} {"train_loss": -9.754295349121094, "global_step": 107867, "epoch": 642} {"train_loss": -9.971908569335938, "global_step": 107868, "epoch": 642} {"train_loss": -9.784370422363281, "global_step": 107869, "epoch": 642} {"train_loss": -9.964158058166504, "global_step": 107870, "epoch": 642} {"train_loss": -9.735458374023438, "global_step": 107871, "epoch": 642} {"train_loss": -9.757132530212402, "global_step": 107872, "epoch": 642} {"train_loss": -9.944107055664062, "global_step": 107873, "epoch": 642} {"train_loss": -9.576986312866211, "global_step": 107874, "epoch": 642} {"train_loss": -9.260908126831055, "global_step": 107875, "epoch": 642} {"train_loss": -9.903563499450684, "global_step": 107876, "epoch": 642} {"train_loss": -9.805931091308594, "global_step": 107877, "epoch": 642} {"train_loss": -9.736112594604492, "global_step": 107878, "epoch": 642} {"train_loss": -10.043357849121094, "global_step": 107879, "epoch": 642} {"train_loss": -9.888484954833984, "global_step": 107880, "epoch": 642} {"train_loss": -10.189477920532227, "global_step": 107881, "epoch": 642} {"train_loss": -9.767578125, "global_step": 107882, "epoch": 642} {"train_loss": -9.892351150512695, "global_step": 107883, "epoch": 642} {"train_loss": -10.091684341430664, "global_step": 107884, "epoch": 642} {"train_loss": -9.797828674316406, "global_step": 107885, "epoch": 642} {"train_loss": -10.026248931884766, "global_step": 107886, "epoch": 642} {"train_loss": -9.876148223876953, "global_step": 107887, "epoch": 642} {"train_loss": -9.890315055847168, "global_step": 107888, "epoch": 642} {"train_loss": -10.142433166503906, "global_step": 107889, "epoch": 642} {"train_loss": -9.691466331481934, "global_step": 107890, "epoch": 642} {"train_loss": -10.02552604675293, "global_step": 107891, "epoch": 642} {"train_loss": -9.805659294128418, "global_step": 107892, "epoch": 642} {"train_loss": -9.870433807373047, "global_step": 107893, "epoch": 642} {"train_loss": -9.72882080078125, "global_step": 107894, "epoch": 642} {"train_loss": -9.841662406921387, "global_step": 107895, "epoch": 642} {"train_loss": -9.6631498336792, "global_step": 107896, "epoch": 642} {"train_loss": -9.594407081604004, "global_step": 107897, "epoch": 642} {"train_loss": -9.928349494934082, "global_step": 107898, "epoch": 642} {"train_loss": -9.837159156799316, "global_step": 107899, "epoch": 642} {"train_loss": -10.04102897644043, "global_step": 107900, "epoch": 642} {"train_loss": -9.940705299377441, "global_step": 107901, "epoch": 642} {"train_loss": -9.887964248657227, "global_step": 107902, "epoch": 642} {"train_loss": -9.867950439453125, "global_step": 107903, "epoch": 642} {"train_loss": -9.656600952148438, "global_step": 107904, "epoch": 642} {"train_loss": -10.00078010559082, "global_step": 107905, "epoch": 642} {"train_loss": -9.87061882019043, "global_step": 107906, "epoch": 642} {"train_loss": -9.961060523986816, "global_step": 107907, "epoch": 642} {"train_loss": -9.90740966796875, "global_step": 107908, "epoch": 642} {"train_loss": -10.100936889648438, "global_step": 107909, "epoch": 642} {"train_loss": -10.110776901245117, "global_step": 107910, "epoch": 642} {"train_loss": -10.069194793701172, "global_step": 107911, "epoch": 642} {"train_loss": -10.14350700378418, "global_step": 107912, "epoch": 642} {"train_loss": -9.968267440795898, "global_step": 107913, "epoch": 642} {"train_loss": -9.994009971618652, "global_step": 107914, "epoch": 642} {"train_loss": -10.139104843139648, "global_step": 107915, "epoch": 642} {"train_loss": -10.25391960144043, "global_step": 107916, "epoch": 642} {"train_loss": -10.012590408325195, "global_step": 107917, "epoch": 642} {"train_loss": -10.240628242492676, "global_step": 107918, "epoch": 642} {"train_loss": -9.872221946716309, "global_step": 107919, "epoch": 642} {"train_loss": -9.972001075744629, "global_step": 107920, "epoch": 642} {"train_loss": -10.039612770080566, "global_step": 107921, "epoch": 642} {"train_loss": -10.083864212036133, "global_step": 107922, "epoch": 642} {"train_loss": -9.886157989501953, "global_step": 107923, "epoch": 642} {"train_loss": -9.938129425048828, "global_step": 107924, "epoch": 642} {"train_loss": -10.04837417602539, "global_step": 107925, "epoch": 642} {"train_loss": -9.598038673400879, "global_step": 107926, "epoch": 642} {"train_loss": -10.068973541259766, "global_step": 107927, "epoch": 642} {"train_loss": -9.691675186157227, "global_step": 107928, "epoch": 642} {"train_loss": -9.515663146972656, "global_step": 107929, "epoch": 642} {"train_loss": -9.953295707702637, "global_step": 107930, "epoch": 642} {"train_loss": -9.157898902893066, "global_step": 107931, "epoch": 642} {"train_loss": -10.035842895507812, "global_step": 107932, "epoch": 642} {"train_loss": -9.78098201751709, "global_step": 107933, "epoch": 642} {"train_loss": -9.440156936645508, "global_step": 107934, "epoch": 642} {"train_loss": -9.783171653747559, "global_step": 107935, "epoch": 642} {"train_loss": -9.376094818115234, "global_step": 107936, "epoch": 642} {"train_loss": -9.867327690124512, "global_step": 107937, "epoch": 642} {"train_loss": -9.505609512329102, "global_step": 107938, "epoch": 642} {"train_loss": -9.638628959655762, "global_step": 107939, "epoch": 642} {"train_loss": -9.895401000976562, "global_step": 107940, "epoch": 642} {"train_loss": -9.561595916748047, "global_step": 107941, "epoch": 642} {"train_loss": -9.564979553222656, "global_step": 107942, "epoch": 642} {"train_loss": -9.370584487915039, "global_step": 107943, "epoch": 642} {"train_loss": -9.726296424865723, "global_step": 107944, "epoch": 642} {"train_loss": -9.768220901489258, "global_step": 107945, "epoch": 642} {"train_loss": -9.566845893859863, "global_step": 107946, "epoch": 642} {"train_loss": -9.558700561523438, "global_step": 107947, "epoch": 642} {"train_loss": -9.292160987854004, "global_step": 107948, "epoch": 642} {"train_loss": -9.524312019348145, "global_step": 107949, "epoch": 642} {"train_loss": -9.656540870666504, "global_step": 107950, "epoch": 642} {"train_loss": -9.919620513916016, "global_step": 107951, "epoch": 642} {"train_loss": -9.445259094238281, "global_step": 107952, "epoch": 642} {"train_loss": -9.808719635009766, "global_step": 107953, "epoch": 642} {"train_loss": -9.738221168518066, "global_step": 107954, "epoch": 642} {"train_loss": -9.519424438476562, "global_step": 107955, "epoch": 642} {"train_loss": -9.495542526245117, "global_step": 107956, "epoch": 642} {"train_loss": -9.607837677001953, "global_step": 107957, "epoch": 642} {"train_loss": -9.724526405334473, "global_step": 107958, "epoch": 642} {"train_loss": -9.669927597045898, "global_step": 107959, "epoch": 642} {"train_loss": -9.811668395996094, "global_step": 107960, "epoch": 642} {"train_loss": -9.47817611694336, "global_step": 107961, "epoch": 642} {"train_loss": -9.68500804901123, "global_step": 107962, "epoch": 642} {"train_loss": -9.23974609375, "global_step": 107963, "epoch": 642} {"train_loss": -10.047175407409668, "global_step": 107964, "epoch": 642} {"train_loss": -9.504560470581055, "global_step": 107965, "epoch": 642} {"train_loss": -9.65411376953125, "global_step": 107966, "epoch": 642} {"train_loss": -9.430805206298828, "global_step": 107967, "epoch": 642} {"train_loss": -9.597192764282227, "global_step": 107968, "epoch": 642} {"train_loss": -9.651949882507324, "global_step": 107969, "epoch": 642} {"train_loss": -9.418612480163574, "global_step": 107970, "epoch": 642} {"train_loss": -9.947038650512695, "global_step": 107971, "epoch": 642} {"train_loss": -9.54008960723877, "global_step": 107972, "epoch": 642} {"train_loss": -9.977169036865234, "global_step": 107973, "epoch": 642} {"train_loss": -9.574945449829102, "global_step": 107974, "epoch": 642} {"train_loss": -9.713335037231445, "global_step": 107975, "epoch": 642} {"train_loss": -9.973691940307617, "global_step": 107976, "epoch": 642} {"train_loss": -9.679960250854492, "global_step": 107977, "epoch": 642} {"train_loss": -9.870321273803711, "global_step": 107978, "epoch": 642} {"train_loss": -9.759515762329102, "global_step": 107979, "epoch": 642} {"train_loss": -9.93529224395752, "global_step": 107980, "epoch": 642} {"train_loss": -9.87969970703125, "global_step": 107981, "epoch": 642} {"train_loss": -9.874366760253906, "global_step": 107982, "epoch": 642} {"train_loss": -9.885828018188477, "global_step": 107983, "epoch": 642} {"train_loss": -9.870933532714844, "global_step": 107984, "epoch": 642} {"train_loss": -9.96579360961914, "global_step": 107985, "epoch": 642} {"train_loss": -10.036290168762207, "global_step": 107986, "epoch": 642} {"train_loss": -9.792489051818848, "global_step": 107987, "epoch": 642} {"train_loss": -9.987784385681152, "global_step": 107988, "epoch": 642} {"train_loss": -9.97900390625, "global_step": 107989, "epoch": 642} {"train_loss": -9.992929458618164, "global_step": 107990, "epoch": 642} {"train_loss": -9.998750686645508, "global_step": 107991, "epoch": 642} {"train_loss": -10.060955047607422, "global_step": 107992, "epoch": 642} {"train_loss": -9.991667747497559, "global_step": 107993, "epoch": 642} {"train_loss": -10.093053817749023, "global_step": 107994, "epoch": 642} {"train_loss": -10.140942573547363, "global_step": 107995, "epoch": 642} {"train_loss": -10.111686706542969, "global_step": 107996, "epoch": 642} {"train_loss": -10.108174324035645, "global_step": 107997, "epoch": 642} {"train_loss": -10.082977294921875, "global_step": 107998, "epoch": 642} {"train_loss": -9.95059871673584, "global_step": 107999, "epoch": 642} {"train_loss": -9.439504623413086, "global_step": 108000, "epoch": 642} {"train_loss": -10.248917579650879, "global_step": 108001, "epoch": 642} {"train_loss": -9.476176261901855, "global_step": 108002, "epoch": 642} {"train_loss": -9.627325057983398, "global_step": 108003, "epoch": 642} {"train_loss": -9.832723617553711, "global_step": 108004, "epoch": 642} {"train_loss": -9.301931381225586, "global_step": 108005, "epoch": 642} {"train_loss": -9.77696418762207, "global_step": 108006, "epoch": 642} {"train_loss": -9.987983703613281, "global_step": 108007, "epoch": 642} {"train_loss": -9.385123252868652, "global_step": 108008, "epoch": 642} {"train_loss": -10.116250991821289, "global_step": 108009, "epoch": 642} {"train_loss": -9.511358261108398, "global_step": 108010, "epoch": 642} {"train_loss": -9.052896499633789, "global_step": 108011, "epoch": 642} {"train_loss": -9.458702087402344, "global_step": 108012, "epoch": 642} {"train_loss": -9.807891845703125, "global_step": 108013, "epoch": 642} {"train_loss": -9.579833030700684, "global_step": 108014, "epoch": 642} {"train_loss": -9.403757095336914, "global_step": 108015, "epoch": 642} {"train_loss": -9.454887390136719, "global_step": 108016, "epoch": 642} {"train_loss": -9.704462051391602, "global_step": 108017, "epoch": 642} {"train_loss": -9.19605827331543, "global_step": 108018, "epoch": 642} {"train_loss": -9.616228103637695, "global_step": 108019, "epoch": 642} {"train_loss": -9.42845344543457, "global_step": 108020, "epoch": 642} {"train_loss": -9.144844055175781, "global_step": 108021, "epoch": 642} {"train_loss": -9.759737014770508, "global_step": 108022, "epoch": 642} {"train_loss": -9.780543088912964, "global_step": 108023, "epoch": 642, "val_loss": 209305.8125} {"train_loss": -9.706474304199219, "global_step": 108024, "epoch": 643} {"train_loss": -9.632767677307129, "global_step": 108025, "epoch": 643} {"train_loss": -9.861289024353027, "global_step": 108026, "epoch": 643} {"train_loss": -9.56280517578125, "global_step": 108027, "epoch": 643} {"train_loss": -10.023252487182617, "global_step": 108028, "epoch": 643} {"train_loss": -9.899353981018066, "global_step": 108029, "epoch": 643} {"train_loss": -9.733720779418945, "global_step": 108030, "epoch": 643} {"train_loss": -9.943028450012207, "global_step": 108031, "epoch": 643} {"train_loss": -9.937788963317871, "global_step": 108032, "epoch": 643} {"train_loss": -9.742300033569336, "global_step": 108033, "epoch": 643} {"train_loss": -9.946881294250488, "global_step": 108034, "epoch": 643} {"train_loss": -9.776264190673828, "global_step": 108035, "epoch": 643} {"train_loss": -9.961978912353516, "global_step": 108036, "epoch": 643} {"train_loss": -9.786712646484375, "global_step": 108037, "epoch": 643} {"train_loss": -9.937065124511719, "global_step": 108038, "epoch": 643} {"train_loss": -9.834468841552734, "global_step": 108039, "epoch": 643} {"train_loss": -9.979799270629883, "global_step": 108040, "epoch": 643} {"train_loss": -9.929380416870117, "global_step": 108041, "epoch": 643} {"train_loss": -10.131267547607422, "global_step": 108042, "epoch": 643} {"train_loss": -9.991186141967773, "global_step": 108043, "epoch": 643} {"train_loss": -9.78795051574707, "global_step": 108044, "epoch": 643} {"train_loss": -10.000782012939453, "global_step": 108045, "epoch": 643} {"train_loss": -10.020973205566406, "global_step": 108046, "epoch": 643} {"train_loss": -10.074544906616211, "global_step": 108047, "epoch": 643} {"train_loss": -9.60579776763916, "global_step": 108048, "epoch": 643} {"train_loss": -9.931687355041504, "global_step": 108049, "epoch": 643} {"train_loss": -9.518343925476074, "global_step": 108050, "epoch": 643} {"train_loss": -9.653192520141602, "global_step": 108051, "epoch": 643} {"train_loss": -9.965202331542969, "global_step": 108052, "epoch": 643} {"train_loss": -9.560318946838379, "global_step": 108053, "epoch": 643} {"train_loss": -9.93041706085205, "global_step": 108054, "epoch": 643} {"train_loss": -9.601566314697266, "global_step": 108055, "epoch": 643} {"train_loss": -10.15293025970459, "global_step": 108056, "epoch": 643} {"train_loss": -9.698175430297852, "global_step": 108057, "epoch": 643} {"train_loss": -10.018928527832031, "global_step": 108058, "epoch": 643} {"train_loss": -9.76759147644043, "global_step": 108059, "epoch": 643} {"train_loss": -9.998917579650879, "global_step": 108060, "epoch": 643} {"train_loss": -9.733556747436523, "global_step": 108061, "epoch": 643} {"train_loss": -10.276750564575195, "global_step": 108062, "epoch": 643} {"train_loss": -9.860631942749023, "global_step": 108063, "epoch": 643} {"train_loss": -9.9507474899292, "global_step": 108064, "epoch": 643} {"train_loss": -9.501311302185059, "global_step": 108065, "epoch": 643} {"train_loss": -9.993483543395996, "global_step": 108066, "epoch": 643} {"train_loss": -9.931756019592285, "global_step": 108067, "epoch": 643} {"train_loss": -9.767687797546387, "global_step": 108068, "epoch": 643} {"train_loss": -9.709417343139648, "global_step": 108069, "epoch": 643} {"train_loss": -9.659966468811035, "global_step": 108070, "epoch": 643} {"train_loss": -9.706042289733887, "global_step": 108071, "epoch": 643} {"train_loss": -9.834207534790039, "global_step": 108072, "epoch": 643} {"train_loss": -10.073892593383789, "global_step": 108073, "epoch": 643} {"train_loss": -9.807197570800781, "global_step": 108074, "epoch": 643} {"train_loss": -9.906549453735352, "global_step": 108075, "epoch": 643} {"train_loss": -9.883071899414062, "global_step": 108076, "epoch": 643} {"train_loss": -10.067168235778809, "global_step": 108077, "epoch": 643} {"train_loss": -9.959794998168945, "global_step": 108078, "epoch": 643} {"train_loss": -9.707273483276367, "global_step": 108079, "epoch": 643} {"train_loss": -9.835384368896484, "global_step": 108080, "epoch": 643} {"train_loss": -9.865121841430664, "global_step": 108081, "epoch": 643} {"train_loss": -10.078516006469727, "global_step": 108082, "epoch": 643} {"train_loss": -10.010835647583008, "global_step": 108083, "epoch": 643} {"train_loss": -10.283123016357422, "global_step": 108084, "epoch": 643} {"train_loss": -9.787187576293945, "global_step": 108085, "epoch": 643} {"train_loss": -10.087728500366211, "global_step": 108086, "epoch": 643} {"train_loss": -9.938020706176758, "global_step": 108087, "epoch": 643} {"train_loss": -9.956695556640625, "global_step": 108088, "epoch": 643} {"train_loss": -10.184229850769043, "global_step": 108089, "epoch": 643} {"train_loss": -9.968429565429688, "global_step": 108090, "epoch": 643} {"train_loss": -9.989873886108398, "global_step": 108091, "epoch": 643} {"train_loss": -9.967557907104492, "global_step": 108092, "epoch": 643} {"train_loss": -9.789738655090332, "global_step": 108093, "epoch": 643} {"train_loss": -9.866377830505371, "global_step": 108094, "epoch": 643} {"train_loss": -9.700523376464844, "global_step": 108095, "epoch": 643} {"train_loss": -10.201263427734375, "global_step": 108096, "epoch": 643} {"train_loss": -9.347747802734375, "global_step": 108097, "epoch": 643} {"train_loss": -9.6521635055542, "global_step": 108098, "epoch": 643} {"train_loss": -10.015985488891602, "global_step": 108099, "epoch": 643} {"train_loss": -9.09022331237793, "global_step": 108100, "epoch": 643} {"train_loss": -10.262870788574219, "global_step": 108101, "epoch": 643} {"train_loss": -9.435506820678711, "global_step": 108102, "epoch": 643} {"train_loss": -9.33905029296875, "global_step": 108103, "epoch": 643} {"train_loss": -9.279152870178223, "global_step": 108104, "epoch": 643} {"train_loss": -9.734406471252441, "global_step": 108105, "epoch": 643} {"train_loss": -9.221738815307617, "global_step": 108106, "epoch": 643} {"train_loss": -9.028316497802734, "global_step": 108107, "epoch": 643} {"train_loss": -8.695175170898438, "global_step": 108108, "epoch": 643} {"train_loss": -9.661834716796875, "global_step": 108109, "epoch": 643} {"train_loss": -8.921241760253906, "global_step": 108110, "epoch": 643} {"train_loss": -9.702628135681152, "global_step": 108111, "epoch": 643} {"train_loss": -9.077030181884766, "global_step": 108112, "epoch": 643} {"train_loss": -9.699231147766113, "global_step": 108113, "epoch": 643} {"train_loss": -9.215578079223633, "global_step": 108114, "epoch": 643} {"train_loss": -9.235450744628906, "global_step": 108115, "epoch": 643} {"train_loss": -9.610980987548828, "global_step": 108116, "epoch": 643} {"train_loss": -9.503499031066895, "global_step": 108117, "epoch": 643} {"train_loss": -9.721456527709961, "global_step": 108118, "epoch": 643} {"train_loss": -9.66413688659668, "global_step": 108119, "epoch": 643} {"train_loss": -9.643141746520996, "global_step": 108120, "epoch": 643} {"train_loss": -9.597823143005371, "global_step": 108121, "epoch": 643} {"train_loss": -9.523481369018555, "global_step": 108122, "epoch": 643} {"train_loss": -9.627317428588867, "global_step": 108123, "epoch": 643} {"train_loss": -9.476778984069824, "global_step": 108124, "epoch": 643} {"train_loss": -9.292217254638672, "global_step": 108125, "epoch": 643} {"train_loss": -9.542529106140137, "global_step": 108126, "epoch": 643} {"train_loss": -9.741020202636719, "global_step": 108127, "epoch": 643} {"train_loss": -9.557065963745117, "global_step": 108128, "epoch": 643} {"train_loss": -9.456779479980469, "global_step": 108129, "epoch": 643} {"train_loss": -9.585725784301758, "global_step": 108130, "epoch": 643} {"train_loss": -9.455187797546387, "global_step": 108131, "epoch": 643} {"train_loss": -9.196439743041992, "global_step": 108132, "epoch": 643} {"train_loss": -9.351710319519043, "global_step": 108133, "epoch": 643} {"train_loss": -9.637552261352539, "global_step": 108134, "epoch": 643} {"train_loss": -9.688244819641113, "global_step": 108135, "epoch": 643} {"train_loss": -9.301368713378906, "global_step": 108136, "epoch": 643} {"train_loss": -9.615352630615234, "global_step": 108137, "epoch": 643} {"train_loss": -9.774124145507812, "global_step": 108138, "epoch": 643} {"train_loss": -9.178230285644531, "global_step": 108139, "epoch": 643} {"train_loss": -9.804814338684082, "global_step": 108140, "epoch": 643} {"train_loss": -9.955429077148438, "global_step": 108141, "epoch": 643} {"train_loss": -9.726521492004395, "global_step": 108142, "epoch": 643} {"train_loss": -9.838920593261719, "global_step": 108143, "epoch": 643} {"train_loss": -9.683884620666504, "global_step": 108144, "epoch": 643} {"train_loss": -9.703631401062012, "global_step": 108145, "epoch": 643} {"train_loss": -9.82365894317627, "global_step": 108146, "epoch": 643} {"train_loss": -9.658063888549805, "global_step": 108147, "epoch": 643} {"train_loss": -9.5096435546875, "global_step": 108148, "epoch": 643} {"train_loss": -9.942541122436523, "global_step": 108149, "epoch": 643} {"train_loss": -9.670969009399414, "global_step": 108150, "epoch": 643} {"train_loss": -10.030366897583008, "global_step": 108151, "epoch": 643} {"train_loss": -10.065065383911133, "global_step": 108152, "epoch": 643} {"train_loss": -10.11178970336914, "global_step": 108153, "epoch": 643} {"train_loss": -9.95486831665039, "global_step": 108154, "epoch": 643} {"train_loss": -10.039405822753906, "global_step": 108155, "epoch": 643} {"train_loss": -10.051273345947266, "global_step": 108156, "epoch": 643} {"train_loss": -9.756784439086914, "global_step": 108157, "epoch": 643} {"train_loss": -10.179779052734375, "global_step": 108158, "epoch": 643} {"train_loss": -10.021631240844727, "global_step": 108159, "epoch": 643} {"train_loss": -10.016012191772461, "global_step": 108160, "epoch": 643} {"train_loss": -10.007376670837402, "global_step": 108161, "epoch": 643} {"train_loss": -10.071544647216797, "global_step": 108162, "epoch": 643} {"train_loss": -10.057012557983398, "global_step": 108163, "epoch": 643} {"train_loss": -10.158845901489258, "global_step": 108164, "epoch": 643} {"train_loss": -9.640989303588867, "global_step": 108165, "epoch": 643} {"train_loss": -9.994510650634766, "global_step": 108166, "epoch": 643} {"train_loss": -9.658049583435059, "global_step": 108167, "epoch": 643} {"train_loss": -9.733628273010254, "global_step": 108168, "epoch": 643} {"train_loss": -10.010651588439941, "global_step": 108169, "epoch": 643} {"train_loss": -9.326761245727539, "global_step": 108170, "epoch": 643} {"train_loss": -10.139518737792969, "global_step": 108171, "epoch": 643} {"train_loss": -9.065400123596191, "global_step": 108172, "epoch": 643} {"train_loss": -9.81635570526123, "global_step": 108173, "epoch": 643} {"train_loss": -9.82913589477539, "global_step": 108174, "epoch": 643} {"train_loss": -9.648513793945312, "global_step": 108175, "epoch": 643} {"train_loss": -9.729270935058594, "global_step": 108176, "epoch": 643} {"train_loss": -9.645156860351562, "global_step": 108177, "epoch": 643} {"train_loss": -9.932289123535156, "global_step": 108178, "epoch": 643} {"train_loss": -9.960050582885742, "global_step": 108179, "epoch": 643} {"train_loss": -9.923856735229492, "global_step": 108180, "epoch": 643} {"train_loss": -9.927413940429688, "global_step": 108181, "epoch": 643} {"train_loss": -9.795286178588867, "global_step": 108182, "epoch": 643} {"train_loss": -9.893229484558105, "global_step": 108183, "epoch": 643} {"train_loss": -9.983109474182129, "global_step": 108184, "epoch": 643} {"train_loss": -9.900629043579102, "global_step": 108185, "epoch": 643} {"train_loss": -9.857475280761719, "global_step": 108186, "epoch": 643} {"train_loss": -9.84260368347168, "global_step": 108187, "epoch": 643} {"train_loss": -10.240609169006348, "global_step": 108188, "epoch": 643} {"train_loss": -10.078041076660156, "global_step": 108189, "epoch": 643} {"train_loss": -10.01705551147461, "global_step": 108190, "epoch": 643} {"train_loss": -9.775617082913717, "global_step": 108191, "epoch": 643, "val_loss": 208106.921875} {"train_loss": -10.004288673400879, "global_step": 108192, "epoch": 644} {"train_loss": -9.65150260925293, "global_step": 108193, "epoch": 644} {"train_loss": -9.895696640014648, "global_step": 108194, "epoch": 644} {"train_loss": -9.968009948730469, "global_step": 108195, "epoch": 644} {"train_loss": -10.012100219726562, "global_step": 108196, "epoch": 644} {"train_loss": -9.86737060546875, "global_step": 108197, "epoch": 644} {"train_loss": -9.948355674743652, "global_step": 108198, "epoch": 644} {"train_loss": -9.552848815917969, "global_step": 108199, "epoch": 644} {"train_loss": -9.834343910217285, "global_step": 108200, "epoch": 644} {"train_loss": -9.689270973205566, "global_step": 108201, "epoch": 644} {"train_loss": -9.727336883544922, "global_step": 108202, "epoch": 644} {"train_loss": -9.954248428344727, "global_step": 108203, "epoch": 644} {"train_loss": -9.595636367797852, "global_step": 108204, "epoch": 644} {"train_loss": -9.930826187133789, "global_step": 108205, "epoch": 644} {"train_loss": -9.846689224243164, "global_step": 108206, "epoch": 644} {"train_loss": -9.8848876953125, "global_step": 108207, "epoch": 644} {"train_loss": -9.972259521484375, "global_step": 108208, "epoch": 644} {"train_loss": -9.826072692871094, "global_step": 108209, "epoch": 644} {"train_loss": -10.104362487792969, "global_step": 108210, "epoch": 644} {"train_loss": -9.830704689025879, "global_step": 108211, "epoch": 644} {"train_loss": -9.880885124206543, "global_step": 108212, "epoch": 644} {"train_loss": -10.159674644470215, "global_step": 108213, "epoch": 644} {"train_loss": -9.891544342041016, "global_step": 108214, "epoch": 644} {"train_loss": -9.905318260192871, "global_step": 108215, "epoch": 644} {"train_loss": -10.027402877807617, "global_step": 108216, "epoch": 644} {"train_loss": -9.909147262573242, "global_step": 108217, "epoch": 644} {"train_loss": -10.132911682128906, "global_step": 108218, "epoch": 644} {"train_loss": -9.869304656982422, "global_step": 108219, "epoch": 644} {"train_loss": -10.199702262878418, "global_step": 108220, "epoch": 644} {"train_loss": -9.914146423339844, "global_step": 108221, "epoch": 644} {"train_loss": -10.142202377319336, "global_step": 108222, "epoch": 644} {"train_loss": -10.153558731079102, "global_step": 108223, "epoch": 644} {"train_loss": -9.78978443145752, "global_step": 108224, "epoch": 644} {"train_loss": -9.997282028198242, "global_step": 108225, "epoch": 644} {"train_loss": -9.804676055908203, "global_step": 108226, "epoch": 644} {"train_loss": -9.940771102905273, "global_step": 108227, "epoch": 644} {"train_loss": -9.75657844543457, "global_step": 108228, "epoch": 644} {"train_loss": -9.596046447753906, "global_step": 108229, "epoch": 644} {"train_loss": -10.42628288269043, "global_step": 108230, "epoch": 644} {"train_loss": -9.761438369750977, "global_step": 108231, "epoch": 644} {"train_loss": -9.748149871826172, "global_step": 108232, "epoch": 644} {"train_loss": -10.015514373779297, "global_step": 108233, "epoch": 644} {"train_loss": -9.637796401977539, "global_step": 108234, "epoch": 644} {"train_loss": -10.327356338500977, "global_step": 108235, "epoch": 644} {"train_loss": -9.520164489746094, "global_step": 108236, "epoch": 644} {"train_loss": -9.65311050415039, "global_step": 108237, "epoch": 644} {"train_loss": -9.994880676269531, "global_step": 108238, "epoch": 644} {"train_loss": -9.645813941955566, "global_step": 108239, "epoch": 644} {"train_loss": -9.94404411315918, "global_step": 108240, "epoch": 644} {"train_loss": -10.015438079833984, "global_step": 108241, "epoch": 644} {"train_loss": -9.847217559814453, "global_step": 108242, "epoch": 644} {"train_loss": -10.131440162658691, "global_step": 108243, "epoch": 644} {"train_loss": -9.744403839111328, "global_step": 108244, "epoch": 644} {"train_loss": -10.066703796386719, "global_step": 108245, "epoch": 644} {"train_loss": -9.848644256591797, "global_step": 108246, "epoch": 644} {"train_loss": -9.827216148376465, "global_step": 108247, "epoch": 644} {"train_loss": -9.940696716308594, "global_step": 108248, "epoch": 644} {"train_loss": -9.509986877441406, "global_step": 108249, "epoch": 644} {"train_loss": -9.640883445739746, "global_step": 108250, "epoch": 644} {"train_loss": -9.577371597290039, "global_step": 108251, "epoch": 644} {"train_loss": -9.925721168518066, "global_step": 108252, "epoch": 644} {"train_loss": -9.773595809936523, "global_step": 108253, "epoch": 644} {"train_loss": -9.830047607421875, "global_step": 108254, "epoch": 644} {"train_loss": -10.005159378051758, "global_step": 108255, "epoch": 644} {"train_loss": -9.567916870117188, "global_step": 108256, "epoch": 644} {"train_loss": -9.983952522277832, "global_step": 108257, "epoch": 644} {"train_loss": -9.977455139160156, "global_step": 108258, "epoch": 644} {"train_loss": -9.396224975585938, "global_step": 108259, "epoch": 644} {"train_loss": -9.48912239074707, "global_step": 108260, "epoch": 644} {"train_loss": -9.780975341796875, "global_step": 108261, "epoch": 644} {"train_loss": -9.530484199523926, "global_step": 108262, "epoch": 644} {"train_loss": -9.787367820739746, "global_step": 108263, "epoch": 644} {"train_loss": -9.518893241882324, "global_step": 108264, "epoch": 644} {"train_loss": -9.981281280517578, "global_step": 108265, "epoch": 644} {"train_loss": -9.838336944580078, "global_step": 108266, "epoch": 644} {"train_loss": -9.829584121704102, "global_step": 108267, "epoch": 644} {"train_loss": -9.658951759338379, "global_step": 108268, "epoch": 644} {"train_loss": -9.949280738830566, "global_step": 108269, "epoch": 644} {"train_loss": -9.70438003540039, "global_step": 108270, "epoch": 644} {"train_loss": -9.96737003326416, "global_step": 108271, "epoch": 644} {"train_loss": -9.797368049621582, "global_step": 108272, "epoch": 644} {"train_loss": -10.00124740600586, "global_step": 108273, "epoch": 644} {"train_loss": -9.88325309753418, "global_step": 108274, "epoch": 644} {"train_loss": -9.98592758178711, "global_step": 108275, "epoch": 644} {"train_loss": -10.031805992126465, "global_step": 108276, "epoch": 644} {"train_loss": -9.957489013671875, "global_step": 108277, "epoch": 644} {"train_loss": -9.843408584594727, "global_step": 108278, "epoch": 644} {"train_loss": -9.96929931640625, "global_step": 108279, "epoch": 644} {"train_loss": -9.89720344543457, "global_step": 108280, "epoch": 644} {"train_loss": -9.860143661499023, "global_step": 108281, "epoch": 644} {"train_loss": -9.916044235229492, "global_step": 108282, "epoch": 644} {"train_loss": -9.89876937866211, "global_step": 108283, "epoch": 644} {"train_loss": -9.853625297546387, "global_step": 108284, "epoch": 644} {"train_loss": -9.954736709594727, "global_step": 108285, "epoch": 644} {"train_loss": -10.089083671569824, "global_step": 108286, "epoch": 644} {"train_loss": -10.155397415161133, "global_step": 108287, "epoch": 644} {"train_loss": -9.849313735961914, "global_step": 108288, "epoch": 644} {"train_loss": -10.184791564941406, "global_step": 108289, "epoch": 644} {"train_loss": -10.176111221313477, "global_step": 108290, "epoch": 644} {"train_loss": -10.157768249511719, "global_step": 108291, "epoch": 644} {"train_loss": -10.080240249633789, "global_step": 108292, "epoch": 644} {"train_loss": -10.018342971801758, "global_step": 108293, "epoch": 644} {"train_loss": -10.084798812866211, "global_step": 108294, "epoch": 644} {"train_loss": -10.03073501586914, "global_step": 108295, "epoch": 644} {"train_loss": -10.07846450805664, "global_step": 108296, "epoch": 644} {"train_loss": -9.98110294342041, "global_step": 108297, "epoch": 644} {"train_loss": -10.103616714477539, "global_step": 108298, "epoch": 644} {"train_loss": -10.315113067626953, "global_step": 108299, "epoch": 644} {"train_loss": -10.321032524108887, "global_step": 108300, "epoch": 644} {"train_loss": -10.012170791625977, "global_step": 108301, "epoch": 644} {"train_loss": -10.042333602905273, "global_step": 108302, "epoch": 644} {"train_loss": -9.8826265335083, "global_step": 108303, "epoch": 644} {"train_loss": -10.210165023803711, "global_step": 108304, "epoch": 644} {"train_loss": -9.953100204467773, "global_step": 108305, "epoch": 644} {"train_loss": -10.016068458557129, "global_step": 108306, "epoch": 644} {"train_loss": -9.915362358093262, "global_step": 108307, "epoch": 644} {"train_loss": -10.120189666748047, "global_step": 108308, "epoch": 644} {"train_loss": -9.837596893310547, "global_step": 108309, "epoch": 644} {"train_loss": -10.038673400878906, "global_step": 108310, "epoch": 644} {"train_loss": -9.918834686279297, "global_step": 108311, "epoch": 644} {"train_loss": -9.755965232849121, "global_step": 108312, "epoch": 644} {"train_loss": -9.892637252807617, "global_step": 108313, "epoch": 644} {"train_loss": -10.003517150878906, "global_step": 108314, "epoch": 644} {"train_loss": -9.834233283996582, "global_step": 108315, "epoch": 644} {"train_loss": -9.564146995544434, "global_step": 108316, "epoch": 644} {"train_loss": -9.863800048828125, "global_step": 108317, "epoch": 644} {"train_loss": -9.809799194335938, "global_step": 108318, "epoch": 644} {"train_loss": -9.927131652832031, "global_step": 108319, "epoch": 644} {"train_loss": -9.880340576171875, "global_step": 108320, "epoch": 644} {"train_loss": -9.832819938659668, "global_step": 108321, "epoch": 644} {"train_loss": -10.038501739501953, "global_step": 108322, "epoch": 644} {"train_loss": -9.63385009765625, "global_step": 108323, "epoch": 644} {"train_loss": -9.763897895812988, "global_step": 108324, "epoch": 644} {"train_loss": -9.814821243286133, "global_step": 108325, "epoch": 644} {"train_loss": -9.792601585388184, "global_step": 108326, "epoch": 644} {"train_loss": -9.708537101745605, "global_step": 108327, "epoch": 644} {"train_loss": -9.356847763061523, "global_step": 108328, "epoch": 644} {"train_loss": -10.118937492370605, "global_step": 108329, "epoch": 644} {"train_loss": -9.584552764892578, "global_step": 108330, "epoch": 644} {"train_loss": -10.041343688964844, "global_step": 108331, "epoch": 644} {"train_loss": -9.832945823669434, "global_step": 108332, "epoch": 644} {"train_loss": -9.850495338439941, "global_step": 108333, "epoch": 644} {"train_loss": -9.913314819335938, "global_step": 108334, "epoch": 644} {"train_loss": -9.72411823272705, "global_step": 108335, "epoch": 644} {"train_loss": -9.832658767700195, "global_step": 108336, "epoch": 644} {"train_loss": -9.930845260620117, "global_step": 108337, "epoch": 644} {"train_loss": -9.865486145019531, "global_step": 108338, "epoch": 644} {"train_loss": -10.048398971557617, "global_step": 108339, "epoch": 644} {"train_loss": -9.905685424804688, "global_step": 108340, "epoch": 644} {"train_loss": -10.014785766601562, "global_step": 108341, "epoch": 644} {"train_loss": -9.85354232788086, "global_step": 108342, "epoch": 644} {"train_loss": -9.958120346069336, "global_step": 108343, "epoch": 644} {"train_loss": -9.525857925415039, "global_step": 108344, "epoch": 644} {"train_loss": -9.66615104675293, "global_step": 108345, "epoch": 644} {"train_loss": -9.767406463623047, "global_step": 108346, "epoch": 644} {"train_loss": -9.476667404174805, "global_step": 108347, "epoch": 644} {"train_loss": -9.700000762939453, "global_step": 108348, "epoch": 644} {"train_loss": -9.565531730651855, "global_step": 108349, "epoch": 644} {"train_loss": -9.852604866027832, "global_step": 108350, "epoch": 644} {"train_loss": -9.79356861114502, "global_step": 108351, "epoch": 644} {"train_loss": -9.962678909301758, "global_step": 108352, "epoch": 644} {"train_loss": -10.093536376953125, "global_step": 108353, "epoch": 644} {"train_loss": -9.799115180969238, "global_step": 108354, "epoch": 644} {"train_loss": -9.960285186767578, "global_step": 108355, "epoch": 644} {"train_loss": -9.778230667114258, "global_step": 108356, "epoch": 644} {"train_loss": -9.924753189086914, "global_step": 108357, "epoch": 644} {"train_loss": -10.066934585571289, "global_step": 108358, "epoch": 644} {"train_loss": -9.88460920538221, "global_step": 108359, "epoch": 644, "val_loss": 208319.65625} {"train_loss": -9.781482696533203, "global_step": 108360, "epoch": 645} {"train_loss": -10.168298721313477, "global_step": 108361, "epoch": 645} {"train_loss": -9.796878814697266, "global_step": 108362, "epoch": 645} {"train_loss": -9.95857048034668, "global_step": 108363, "epoch": 645} {"train_loss": -9.897235870361328, "global_step": 108364, "epoch": 645} {"train_loss": -9.965341567993164, "global_step": 108365, "epoch": 645} {"train_loss": -10.070653915405273, "global_step": 108366, "epoch": 645} {"train_loss": -9.940606117248535, "global_step": 108367, "epoch": 645} {"train_loss": -10.104040145874023, "global_step": 108368, "epoch": 645} {"train_loss": -9.96817398071289, "global_step": 108369, "epoch": 645} {"train_loss": -9.983284950256348, "global_step": 108370, "epoch": 645} {"train_loss": -10.13180160522461, "global_step": 108371, "epoch": 645} {"train_loss": -9.980001449584961, "global_step": 108372, "epoch": 645} {"train_loss": -9.991888046264648, "global_step": 108373, "epoch": 645} {"train_loss": -10.084805488586426, "global_step": 108374, "epoch": 645} {"train_loss": -10.101114273071289, "global_step": 108375, "epoch": 645} {"train_loss": -9.958301544189453, "global_step": 108376, "epoch": 645} {"train_loss": -9.90274715423584, "global_step": 108377, "epoch": 645} {"train_loss": -10.121402740478516, "global_step": 108378, "epoch": 645} {"train_loss": -9.809686660766602, "global_step": 108379, "epoch": 645} {"train_loss": -9.912078857421875, "global_step": 108380, "epoch": 645} {"train_loss": -10.154988288879395, "global_step": 108381, "epoch": 645} {"train_loss": -9.755196571350098, "global_step": 108382, "epoch": 645} {"train_loss": -9.965835571289062, "global_step": 108383, "epoch": 645} {"train_loss": -9.904146194458008, "global_step": 108384, "epoch": 645} {"train_loss": -10.265409469604492, "global_step": 108385, "epoch": 645} {"train_loss": -10.272760391235352, "global_step": 108386, "epoch": 645} {"train_loss": -9.358604431152344, "global_step": 108387, "epoch": 645} {"train_loss": -9.711180686950684, "global_step": 108388, "epoch": 645} {"train_loss": -9.286380767822266, "global_step": 108389, "epoch": 645} {"train_loss": -9.379110336303711, "global_step": 108390, "epoch": 645} {"train_loss": -9.772951126098633, "global_step": 108391, "epoch": 645} {"train_loss": -9.492403984069824, "global_step": 108392, "epoch": 645} {"train_loss": -9.692596435546875, "global_step": 108393, "epoch": 645} {"train_loss": -9.528797149658203, "global_step": 108394, "epoch": 645} {"train_loss": -10.141438484191895, "global_step": 108395, "epoch": 645} {"train_loss": -9.754319190979004, "global_step": 108396, "epoch": 645} {"train_loss": -9.683030128479004, "global_step": 108397, "epoch": 645} {"train_loss": -9.507467269897461, "global_step": 108398, "epoch": 645} {"train_loss": -9.643091201782227, "global_step": 108399, "epoch": 645} {"train_loss": -9.738353729248047, "global_step": 108400, "epoch": 645} {"train_loss": -9.83711051940918, "global_step": 108401, "epoch": 645} {"train_loss": -9.46328353881836, "global_step": 108402, "epoch": 645} {"train_loss": -9.907991409301758, "global_step": 108403, "epoch": 645} {"train_loss": -9.94268798828125, "global_step": 108404, "epoch": 645} {"train_loss": -9.880240440368652, "global_step": 108405, "epoch": 645} {"train_loss": -9.974987030029297, "global_step": 108406, "epoch": 645} {"train_loss": -9.678411483764648, "global_step": 108407, "epoch": 645} {"train_loss": -10.133848190307617, "global_step": 108408, "epoch": 645} {"train_loss": -9.89553451538086, "global_step": 108409, "epoch": 645} {"train_loss": -9.875038146972656, "global_step": 108410, "epoch": 645} {"train_loss": -9.739602088928223, "global_step": 108411, "epoch": 645} {"train_loss": -9.967334747314453, "global_step": 108412, "epoch": 645} {"train_loss": -9.716222763061523, "global_step": 108413, "epoch": 645} {"train_loss": -10.028350830078125, "global_step": 108414, "epoch": 645} {"train_loss": -10.073797225952148, "global_step": 108415, "epoch": 645} {"train_loss": -10.101465225219727, "global_step": 108416, "epoch": 645} {"train_loss": -9.905616760253906, "global_step": 108417, "epoch": 645} {"train_loss": -9.904325485229492, "global_step": 108418, "epoch": 645} {"train_loss": -10.086738586425781, "global_step": 108419, "epoch": 645} {"train_loss": -9.763510704040527, "global_step": 108420, "epoch": 645} {"train_loss": -10.202905654907227, "global_step": 108421, "epoch": 645} {"train_loss": -9.898073196411133, "global_step": 108422, "epoch": 645} {"train_loss": -9.908095359802246, "global_step": 108423, "epoch": 645} {"train_loss": -9.98604965209961, "global_step": 108424, "epoch": 645} {"train_loss": -10.004531860351562, "global_step": 108425, "epoch": 645} {"train_loss": -10.162595748901367, "global_step": 108426, "epoch": 645} {"train_loss": -9.966917037963867, "global_step": 108427, "epoch": 645} {"train_loss": -9.728303909301758, "global_step": 108428, "epoch": 645} {"train_loss": -9.89565372467041, "global_step": 108429, "epoch": 645} {"train_loss": -9.99063491821289, "global_step": 108430, "epoch": 645} {"train_loss": -9.965444564819336, "global_step": 108431, "epoch": 645} {"train_loss": -10.054914474487305, "global_step": 108432, "epoch": 645} {"train_loss": -10.004507064819336, "global_step": 108433, "epoch": 645} {"train_loss": -10.020774841308594, "global_step": 108434, "epoch": 645} {"train_loss": -9.85858154296875, "global_step": 108435, "epoch": 645} {"train_loss": -10.009867668151855, "global_step": 108436, "epoch": 645} {"train_loss": -9.542051315307617, "global_step": 108437, "epoch": 645} {"train_loss": -9.669663429260254, "global_step": 108438, "epoch": 645} {"train_loss": -10.083455085754395, "global_step": 108439, "epoch": 645} {"train_loss": -9.78849983215332, "global_step": 108440, "epoch": 645} {"train_loss": -9.97567367553711, "global_step": 108441, "epoch": 645} {"train_loss": -9.863157272338867, "global_step": 108442, "epoch": 645} {"train_loss": -9.973838806152344, "global_step": 108443, "epoch": 645} {"train_loss": -10.062793731689453, "global_step": 108444, "epoch": 645} {"train_loss": -9.95057487487793, "global_step": 108445, "epoch": 645} {"train_loss": -9.834997177124023, "global_step": 108446, "epoch": 645} {"train_loss": -10.13687515258789, "global_step": 108447, "epoch": 645} {"train_loss": -9.880845069885254, "global_step": 108448, "epoch": 645} {"train_loss": -9.759611129760742, "global_step": 108449, "epoch": 645} {"train_loss": -9.831466674804688, "global_step": 108450, "epoch": 645} {"train_loss": -9.557755470275879, "global_step": 108451, "epoch": 645} {"train_loss": -9.881370544433594, "global_step": 108452, "epoch": 645} {"train_loss": -10.141386032104492, "global_step": 108453, "epoch": 645} {"train_loss": -9.669967651367188, "global_step": 108454, "epoch": 645} {"train_loss": -9.968836784362793, "global_step": 108455, "epoch": 645} {"train_loss": -9.900566101074219, "global_step": 108456, "epoch": 645} {"train_loss": -9.800580978393555, "global_step": 108457, "epoch": 645} {"train_loss": -9.681061744689941, "global_step": 108458, "epoch": 645} {"train_loss": -9.591197967529297, "global_step": 108459, "epoch": 645} {"train_loss": -9.604578018188477, "global_step": 108460, "epoch": 645} {"train_loss": -9.707857131958008, "global_step": 108461, "epoch": 645} {"train_loss": -9.655720710754395, "global_step": 108462, "epoch": 645} {"train_loss": -9.56286907196045, "global_step": 108463, "epoch": 645} {"train_loss": -9.541510581970215, "global_step": 108464, "epoch": 645} {"train_loss": -9.032286643981934, "global_step": 108465, "epoch": 645} {"train_loss": -9.998411178588867, "global_step": 108466, "epoch": 645} {"train_loss": -9.507555961608887, "global_step": 108467, "epoch": 645} {"train_loss": -9.94217300415039, "global_step": 108468, "epoch": 645} {"train_loss": -9.714338302612305, "global_step": 108469, "epoch": 645} {"train_loss": -9.459165573120117, "global_step": 108470, "epoch": 645} {"train_loss": -9.665128707885742, "global_step": 108471, "epoch": 645} {"train_loss": -9.59327220916748, "global_step": 108472, "epoch": 645} {"train_loss": -9.771421432495117, "global_step": 108473, "epoch": 645} {"train_loss": -9.512523651123047, "global_step": 108474, "epoch": 645} {"train_loss": -9.435089111328125, "global_step": 108475, "epoch": 645} {"train_loss": -9.87509536743164, "global_step": 108476, "epoch": 645} {"train_loss": -9.846232414245605, "global_step": 108477, "epoch": 645} {"train_loss": -9.58908748626709, "global_step": 108478, "epoch": 645} {"train_loss": -9.851892471313477, "global_step": 108479, "epoch": 645} {"train_loss": -9.9608793258667, "global_step": 108480, "epoch": 645} {"train_loss": -9.30785083770752, "global_step": 108481, "epoch": 645} {"train_loss": -9.673336029052734, "global_step": 108482, "epoch": 645} {"train_loss": -9.524673461914062, "global_step": 108483, "epoch": 645} {"train_loss": -9.748420715332031, "global_step": 108484, "epoch": 645} {"train_loss": -9.48065185546875, "global_step": 108485, "epoch": 645} {"train_loss": -9.930390357971191, "global_step": 108486, "epoch": 645} {"train_loss": -9.519412994384766, "global_step": 108487, "epoch": 645} {"train_loss": -9.856474876403809, "global_step": 108488, "epoch": 645} {"train_loss": -9.65070915222168, "global_step": 108489, "epoch": 645} {"train_loss": -9.64167594909668, "global_step": 108490, "epoch": 645} {"train_loss": -9.59850025177002, "global_step": 108491, "epoch": 645} {"train_loss": -9.832176208496094, "global_step": 108492, "epoch": 645} {"train_loss": -9.69906997680664, "global_step": 108493, "epoch": 645} {"train_loss": -9.740524291992188, "global_step": 108494, "epoch": 645} {"train_loss": -9.903631210327148, "global_step": 108495, "epoch": 645} {"train_loss": -9.934019088745117, "global_step": 108496, "epoch": 645} {"train_loss": -9.923139572143555, "global_step": 108497, "epoch": 645} {"train_loss": -9.964149475097656, "global_step": 108498, "epoch": 645} {"train_loss": -9.853769302368164, "global_step": 108499, "epoch": 645} {"train_loss": -10.120984077453613, "global_step": 108500, "epoch": 645} {"train_loss": -9.889447212219238, "global_step": 108501, "epoch": 645} {"train_loss": -9.870102882385254, "global_step": 108502, "epoch": 645} {"train_loss": -9.995193481445312, "global_step": 108503, "epoch": 645} {"train_loss": -9.968999862670898, "global_step": 108504, "epoch": 645} {"train_loss": -9.927047729492188, "global_step": 108505, "epoch": 645} {"train_loss": -9.909042358398438, "global_step": 108506, "epoch": 645} {"train_loss": -10.190887451171875, "global_step": 108507, "epoch": 645} {"train_loss": -10.024742126464844, "global_step": 108508, "epoch": 645} {"train_loss": -10.146615028381348, "global_step": 108509, "epoch": 645} {"train_loss": -9.908913612365723, "global_step": 108510, "epoch": 645} {"train_loss": -9.898896217346191, "global_step": 108511, "epoch": 645} {"train_loss": -10.102211952209473, "global_step": 108512, "epoch": 645} {"train_loss": -9.9208345413208, "global_step": 108513, "epoch": 645} {"train_loss": -10.145322799682617, "global_step": 108514, "epoch": 645} {"train_loss": -9.682709693908691, "global_step": 108515, "epoch": 645} {"train_loss": -9.929676055908203, "global_step": 108516, "epoch": 645} {"train_loss": -9.989875793457031, "global_step": 108517, "epoch": 645} {"train_loss": -10.028854370117188, "global_step": 108518, "epoch": 645} {"train_loss": -10.088632583618164, "global_step": 108519, "epoch": 645} {"train_loss": -10.103100776672363, "global_step": 108520, "epoch": 645} {"train_loss": -10.122695922851562, "global_step": 108521, "epoch": 645} {"train_loss": -9.98519515991211, "global_step": 108522, "epoch": 645} {"train_loss": -9.910066604614258, "global_step": 108523, "epoch": 645} {"train_loss": -10.12496280670166, "global_step": 108524, "epoch": 645} {"train_loss": -10.053388595581055, "global_step": 108525, "epoch": 645} {"train_loss": -10.261322975158691, "global_step": 108526, "epoch": 645} {"train_loss": -9.861549956457955, "global_step": 108527, "epoch": 645, "val_loss": 210203.671875, "train_action_mse_error": 1.358452320098877} {"train_loss": -10.048552513122559, "global_step": 108528, "epoch": 646} {"train_loss": -10.274701118469238, "global_step": 108529, "epoch": 646} {"train_loss": -10.329484939575195, "global_step": 108530, "epoch": 646} {"train_loss": -9.86520767211914, "global_step": 108531, "epoch": 646} {"train_loss": -9.856940269470215, "global_step": 108532, "epoch": 646} {"train_loss": -10.235343933105469, "global_step": 108533, "epoch": 646} {"train_loss": -9.717403411865234, "global_step": 108534, "epoch": 646} {"train_loss": -9.814262390136719, "global_step": 108535, "epoch": 646} {"train_loss": -9.930607795715332, "global_step": 108536, "epoch": 646} {"train_loss": -9.669761657714844, "global_step": 108537, "epoch": 646} {"train_loss": -10.038920402526855, "global_step": 108538, "epoch": 646} {"train_loss": -9.71652603149414, "global_step": 108539, "epoch": 646} {"train_loss": -9.667333602905273, "global_step": 108540, "epoch": 646} {"train_loss": -10.016149520874023, "global_step": 108541, "epoch": 646} {"train_loss": -9.555900573730469, "global_step": 108542, "epoch": 646} {"train_loss": -9.555723190307617, "global_step": 108543, "epoch": 646} {"train_loss": -9.337166786193848, "global_step": 108544, "epoch": 646} {"train_loss": -9.801340103149414, "global_step": 108545, "epoch": 646} {"train_loss": -9.386640548706055, "global_step": 108546, "epoch": 646} {"train_loss": -9.376672744750977, "global_step": 108547, "epoch": 646} {"train_loss": -9.798019409179688, "global_step": 108548, "epoch": 646} {"train_loss": -9.531081199645996, "global_step": 108549, "epoch": 646} {"train_loss": -9.542930603027344, "global_step": 108550, "epoch": 646} {"train_loss": -9.80221176147461, "global_step": 108551, "epoch": 646} {"train_loss": -9.836621284484863, "global_step": 108552, "epoch": 646} {"train_loss": -9.473470687866211, "global_step": 108553, "epoch": 646} {"train_loss": -9.715755462646484, "global_step": 108554, "epoch": 646} {"train_loss": -9.197259902954102, "global_step": 108555, "epoch": 646} {"train_loss": -9.598934173583984, "global_step": 108556, "epoch": 646} {"train_loss": -9.488524436950684, "global_step": 108557, "epoch": 646} {"train_loss": -9.619331359863281, "global_step": 108558, "epoch": 646} {"train_loss": -9.765413284301758, "global_step": 108559, "epoch": 646} {"train_loss": -9.840402603149414, "global_step": 108560, "epoch": 646} {"train_loss": -9.383539199829102, "global_step": 108561, "epoch": 646} {"train_loss": -9.295772552490234, "global_step": 108562, "epoch": 646} {"train_loss": -9.638792037963867, "global_step": 108563, "epoch": 646} {"train_loss": -9.3572998046875, "global_step": 108564, "epoch": 646} {"train_loss": -9.569672584533691, "global_step": 108565, "epoch": 646} {"train_loss": -9.638859748840332, "global_step": 108566, "epoch": 646} {"train_loss": -9.782920837402344, "global_step": 108567, "epoch": 646} {"train_loss": -9.692527770996094, "global_step": 108568, "epoch": 646} {"train_loss": -9.83169174194336, "global_step": 108569, "epoch": 646} {"train_loss": -9.848342895507812, "global_step": 108570, "epoch": 646} {"train_loss": -9.898828506469727, "global_step": 108571, "epoch": 646} {"train_loss": -9.761495590209961, "global_step": 108572, "epoch": 646} {"train_loss": -9.759788513183594, "global_step": 108573, "epoch": 646} {"train_loss": -9.941083908081055, "global_step": 108574, "epoch": 646} {"train_loss": -9.868326187133789, "global_step": 108575, "epoch": 646} {"train_loss": -9.659178733825684, "global_step": 108576, "epoch": 646} {"train_loss": -9.876734733581543, "global_step": 108577, "epoch": 646} {"train_loss": -9.988823890686035, "global_step": 108578, "epoch": 646} {"train_loss": -10.049079895019531, "global_step": 108579, "epoch": 646} {"train_loss": -9.92902946472168, "global_step": 108580, "epoch": 646} {"train_loss": -9.901018142700195, "global_step": 108581, "epoch": 646} {"train_loss": -9.920392990112305, "global_step": 108582, "epoch": 646} {"train_loss": -9.957948684692383, "global_step": 108583, "epoch": 646} {"train_loss": -10.037322044372559, "global_step": 108584, "epoch": 646} {"train_loss": -10.178704261779785, "global_step": 108585, "epoch": 646} {"train_loss": -10.01742935180664, "global_step": 108586, "epoch": 646} {"train_loss": -10.094891548156738, "global_step": 108587, "epoch": 646} {"train_loss": -10.046600341796875, "global_step": 108588, "epoch": 646} {"train_loss": -9.846457481384277, "global_step": 108589, "epoch": 646} {"train_loss": -9.964390754699707, "global_step": 108590, "epoch": 646} {"train_loss": -10.171260833740234, "global_step": 108591, "epoch": 646} {"train_loss": -9.954891204833984, "global_step": 108592, "epoch": 646} {"train_loss": -10.052925109863281, "global_step": 108593, "epoch": 646} {"train_loss": -10.13325023651123, "global_step": 108594, "epoch": 646} {"train_loss": -10.080985069274902, "global_step": 108595, "epoch": 646} {"train_loss": -10.222290992736816, "global_step": 108596, "epoch": 646} {"train_loss": -10.035240173339844, "global_step": 108597, "epoch": 646} {"train_loss": -9.908554077148438, "global_step": 108598, "epoch": 646} {"train_loss": -9.722871780395508, "global_step": 108599, "epoch": 646} {"train_loss": -10.293854713439941, "global_step": 108600, "epoch": 646} {"train_loss": -10.174898147583008, "global_step": 108601, "epoch": 646} {"train_loss": -10.102378845214844, "global_step": 108602, "epoch": 646} {"train_loss": -10.11771297454834, "global_step": 108603, "epoch": 646} {"train_loss": -10.128683090209961, "global_step": 108604, "epoch": 646} {"train_loss": -10.151473999023438, "global_step": 108605, "epoch": 646} {"train_loss": -10.256689071655273, "global_step": 108606, "epoch": 646} {"train_loss": -9.968616485595703, "global_step": 108607, "epoch": 646} {"train_loss": -10.073948860168457, "global_step": 108608, "epoch": 646} {"train_loss": -9.921262741088867, "global_step": 108609, "epoch": 646} {"train_loss": -10.017671585083008, "global_step": 108610, "epoch": 646} {"train_loss": -9.851841926574707, "global_step": 108611, "epoch": 646} {"train_loss": -9.89045524597168, "global_step": 108612, "epoch": 646} {"train_loss": -9.664886474609375, "global_step": 108613, "epoch": 646} {"train_loss": -10.167555809020996, "global_step": 108614, "epoch": 646} {"train_loss": -9.618671417236328, "global_step": 108615, "epoch": 646} {"train_loss": -10.156798362731934, "global_step": 108616, "epoch": 646} {"train_loss": -10.029106140136719, "global_step": 108617, "epoch": 646} {"train_loss": -9.950525283813477, "global_step": 108618, "epoch": 646} {"train_loss": -9.87359619140625, "global_step": 108619, "epoch": 646} {"train_loss": -10.11691665649414, "global_step": 108620, "epoch": 646} {"train_loss": -9.70124340057373, "global_step": 108621, "epoch": 646} {"train_loss": -9.886646270751953, "global_step": 108622, "epoch": 646} {"train_loss": -9.746142387390137, "global_step": 108623, "epoch": 646} {"train_loss": -9.554045677185059, "global_step": 108624, "epoch": 646} {"train_loss": -10.045368194580078, "global_step": 108625, "epoch": 646} {"train_loss": -9.819711685180664, "global_step": 108626, "epoch": 646} {"train_loss": -9.498661994934082, "global_step": 108627, "epoch": 646} {"train_loss": -10.060661315917969, "global_step": 108628, "epoch": 646} {"train_loss": -9.307409286499023, "global_step": 108629, "epoch": 646} {"train_loss": -9.804094314575195, "global_step": 108630, "epoch": 646} {"train_loss": -9.526226043701172, "global_step": 108631, "epoch": 646} {"train_loss": -9.833707809448242, "global_step": 108632, "epoch": 646} {"train_loss": -9.200550079345703, "global_step": 108633, "epoch": 646} {"train_loss": -9.585651397705078, "global_step": 108634, "epoch": 646} {"train_loss": -9.661083221435547, "global_step": 108635, "epoch": 646} {"train_loss": -9.68618392944336, "global_step": 108636, "epoch": 646} {"train_loss": -9.386764526367188, "global_step": 108637, "epoch": 646} {"train_loss": -9.731704711914062, "global_step": 108638, "epoch": 646} {"train_loss": -9.372138977050781, "global_step": 108639, "epoch": 646} {"train_loss": -9.988118171691895, "global_step": 108640, "epoch": 646} {"train_loss": -9.496855735778809, "global_step": 108641, "epoch": 646} {"train_loss": -10.004500389099121, "global_step": 108642, "epoch": 646} {"train_loss": -9.749299049377441, "global_step": 108643, "epoch": 646} {"train_loss": -9.83260726928711, "global_step": 108644, "epoch": 646} {"train_loss": -9.66292953491211, "global_step": 108645, "epoch": 646} {"train_loss": -9.828372955322266, "global_step": 108646, "epoch": 646} {"train_loss": -9.818272590637207, "global_step": 108647, "epoch": 646} {"train_loss": -9.822412490844727, "global_step": 108648, "epoch": 646} {"train_loss": -9.776309967041016, "global_step": 108649, "epoch": 646} {"train_loss": -9.914958000183105, "global_step": 108650, "epoch": 646} {"train_loss": -10.041358947753906, "global_step": 108651, "epoch": 646} {"train_loss": -9.803018569946289, "global_step": 108652, "epoch": 646} {"train_loss": -9.990389823913574, "global_step": 108653, "epoch": 646} {"train_loss": -9.898941040039062, "global_step": 108654, "epoch": 646} {"train_loss": -10.073840141296387, "global_step": 108655, "epoch": 646} {"train_loss": -10.019954681396484, "global_step": 108656, "epoch": 646} {"train_loss": -10.097978591918945, "global_step": 108657, "epoch": 646} {"train_loss": -10.01053237915039, "global_step": 108658, "epoch": 646} {"train_loss": -10.10822868347168, "global_step": 108659, "epoch": 646} {"train_loss": -9.813150405883789, "global_step": 108660, "epoch": 646} {"train_loss": -10.166386604309082, "global_step": 108661, "epoch": 646} {"train_loss": -10.042316436767578, "global_step": 108662, "epoch": 646} {"train_loss": -9.89957046508789, "global_step": 108663, "epoch": 646} {"train_loss": -10.118768692016602, "global_step": 108664, "epoch": 646} {"train_loss": -10.006117820739746, "global_step": 108665, "epoch": 646} {"train_loss": -10.07608413696289, "global_step": 108666, "epoch": 646} {"train_loss": -10.065165519714355, "global_step": 108667, "epoch": 646} {"train_loss": -10.14205265045166, "global_step": 108668, "epoch": 646} {"train_loss": -10.080961227416992, "global_step": 108669, "epoch": 646} {"train_loss": -10.152252197265625, "global_step": 108670, "epoch": 646} {"train_loss": -10.081993103027344, "global_step": 108671, "epoch": 646} {"train_loss": -10.154208183288574, "global_step": 108672, "epoch": 646} {"train_loss": -10.27009105682373, "global_step": 108673, "epoch": 646} {"train_loss": -10.093952178955078, "global_step": 108674, "epoch": 646} {"train_loss": -10.0543212890625, "global_step": 108675, "epoch": 646} {"train_loss": -10.115367889404297, "global_step": 108676, "epoch": 646} {"train_loss": -9.855409622192383, "global_step": 108677, "epoch": 646} {"train_loss": -9.986204147338867, "global_step": 108678, "epoch": 646} {"train_loss": -9.919443130493164, "global_step": 108679, "epoch": 646} {"train_loss": -9.92666244506836, "global_step": 108680, "epoch": 646} {"train_loss": -10.05020523071289, "global_step": 108681, "epoch": 646} {"train_loss": -9.830028533935547, "global_step": 108682, "epoch": 646} {"train_loss": -10.18252944946289, "global_step": 108683, "epoch": 646} {"train_loss": -9.925684928894043, "global_step": 108684, "epoch": 646} {"train_loss": -9.993755340576172, "global_step": 108685, "epoch": 646} {"train_loss": -9.191787719726562, "global_step": 108686, "epoch": 646} {"train_loss": -9.897741317749023, "global_step": 108687, "epoch": 646} {"train_loss": -10.13858413696289, "global_step": 108688, "epoch": 646} {"train_loss": -8.924215316772461, "global_step": 108689, "epoch": 646} {"train_loss": -9.576723098754883, "global_step": 108690, "epoch": 646} {"train_loss": -9.519149780273438, "global_step": 108691, "epoch": 646} {"train_loss": -8.650428771972656, "global_step": 108692, "epoch": 646} {"train_loss": -10.010062217712402, "global_step": 108693, "epoch": 646} {"train_loss": -8.760415077209473, "global_step": 108694, "epoch": 646} {"train_loss": -9.840934566089086, "global_step": 108695, "epoch": 646, "val_loss": 208155.8125} {"train_loss": -8.845115661621094, "global_step": 108696, "epoch": 647} {"train_loss": -8.986637115478516, "global_step": 108697, "epoch": 647} {"train_loss": -9.229564666748047, "global_step": 108698, "epoch": 647} {"train_loss": -8.654073715209961, "global_step": 108699, "epoch": 647} {"train_loss": -9.429765701293945, "global_step": 108700, "epoch": 647} {"train_loss": -9.26535701751709, "global_step": 108701, "epoch": 647} {"train_loss": -9.68645191192627, "global_step": 108702, "epoch": 647} {"train_loss": -9.507171630859375, "global_step": 108703, "epoch": 647} {"train_loss": -9.320130348205566, "global_step": 108704, "epoch": 647} {"train_loss": -10.01925277709961, "global_step": 108705, "epoch": 647} {"train_loss": -9.650655746459961, "global_step": 108706, "epoch": 647} {"train_loss": -9.608901977539062, "global_step": 108707, "epoch": 647} {"train_loss": -9.820352554321289, "global_step": 108708, "epoch": 647} {"train_loss": -9.508630752563477, "global_step": 108709, "epoch": 647} {"train_loss": -9.638526916503906, "global_step": 108710, "epoch": 647} {"train_loss": -9.686643600463867, "global_step": 108711, "epoch": 647} {"train_loss": -9.68606948852539, "global_step": 108712, "epoch": 647} {"train_loss": -9.780397415161133, "global_step": 108713, "epoch": 647} {"train_loss": -9.730081558227539, "global_step": 108714, "epoch": 647} {"train_loss": -9.77731704711914, "global_step": 108715, "epoch": 647} {"train_loss": -9.79334831237793, "global_step": 108716, "epoch": 647} {"train_loss": -10.009387016296387, "global_step": 108717, "epoch": 647} {"train_loss": -10.023956298828125, "global_step": 108718, "epoch": 647} {"train_loss": -9.948806762695312, "global_step": 108719, "epoch": 647} {"train_loss": -9.841516494750977, "global_step": 108720, "epoch": 647} {"train_loss": -9.800376892089844, "global_step": 108721, "epoch": 647} {"train_loss": -9.785776138305664, "global_step": 108722, "epoch": 647} {"train_loss": -9.944428443908691, "global_step": 108723, "epoch": 647} {"train_loss": -10.032691955566406, "global_step": 108724, "epoch": 647} {"train_loss": -9.953609466552734, "global_step": 108725, "epoch": 647} {"train_loss": -9.77313232421875, "global_step": 108726, "epoch": 647} {"train_loss": -10.131584167480469, "global_step": 108727, "epoch": 647} {"train_loss": -10.102945327758789, "global_step": 108728, "epoch": 647} {"train_loss": -10.003084182739258, "global_step": 108729, "epoch": 647} {"train_loss": -9.890298843383789, "global_step": 108730, "epoch": 647} {"train_loss": -9.900554656982422, "global_step": 108731, "epoch": 647} {"train_loss": -9.714774131774902, "global_step": 108732, "epoch": 647} {"train_loss": -10.006706237792969, "global_step": 108733, "epoch": 647} {"train_loss": -9.896842002868652, "global_step": 108734, "epoch": 647} {"train_loss": -10.065500259399414, "global_step": 108735, "epoch": 647} {"train_loss": -9.938884735107422, "global_step": 108736, "epoch": 647} {"train_loss": -10.091227531433105, "global_step": 108737, "epoch": 647} {"train_loss": -10.085236549377441, "global_step": 108738, "epoch": 647} {"train_loss": -10.122663497924805, "global_step": 108739, "epoch": 647} {"train_loss": -10.204789161682129, "global_step": 108740, "epoch": 647} {"train_loss": -10.21713638305664, "global_step": 108741, "epoch": 647} {"train_loss": -10.366153717041016, "global_step": 108742, "epoch": 647} {"train_loss": -10.043073654174805, "global_step": 108743, "epoch": 647} {"train_loss": -9.94719123840332, "global_step": 108744, "epoch": 647} {"train_loss": -10.020605087280273, "global_step": 108745, "epoch": 647} {"train_loss": -10.093582153320312, "global_step": 108746, "epoch": 647} {"train_loss": -10.097148895263672, "global_step": 108747, "epoch": 647} {"train_loss": -9.905137062072754, "global_step": 108748, "epoch": 647} {"train_loss": -10.159507751464844, "global_step": 108749, "epoch": 647} {"train_loss": -10.136833190917969, "global_step": 108750, "epoch": 647} {"train_loss": -10.065366744995117, "global_step": 108751, "epoch": 647} {"train_loss": -10.092926025390625, "global_step": 108752, "epoch": 647} {"train_loss": -9.952651023864746, "global_step": 108753, "epoch": 647} {"train_loss": -9.89156723022461, "global_step": 108754, "epoch": 647} {"train_loss": -10.130133628845215, "global_step": 108755, "epoch": 647} {"train_loss": -10.230313301086426, "global_step": 108756, "epoch": 647} {"train_loss": -10.170159339904785, "global_step": 108757, "epoch": 647} {"train_loss": -10.116388320922852, "global_step": 108758, "epoch": 647} {"train_loss": -9.936670303344727, "global_step": 108759, "epoch": 647} {"train_loss": -10.021382331848145, "global_step": 108760, "epoch": 647} {"train_loss": -9.636459350585938, "global_step": 108761, "epoch": 647} {"train_loss": -9.795228958129883, "global_step": 108762, "epoch": 647} {"train_loss": -10.172858238220215, "global_step": 108763, "epoch": 647} {"train_loss": -9.396712303161621, "global_step": 108764, "epoch": 647} {"train_loss": -10.095367431640625, "global_step": 108765, "epoch": 647} {"train_loss": -9.862268447875977, "global_step": 108766, "epoch": 647} {"train_loss": -9.565021514892578, "global_step": 108767, "epoch": 647} {"train_loss": -9.839035034179688, "global_step": 108768, "epoch": 647} {"train_loss": -9.571205139160156, "global_step": 108769, "epoch": 647} {"train_loss": -9.858163833618164, "global_step": 108770, "epoch": 647} {"train_loss": -9.702832221984863, "global_step": 108771, "epoch": 647} {"train_loss": -9.80019760131836, "global_step": 108772, "epoch": 647} {"train_loss": -9.679473876953125, "global_step": 108773, "epoch": 647} {"train_loss": -10.022320747375488, "global_step": 108774, "epoch": 647} {"train_loss": -9.688125610351562, "global_step": 108775, "epoch": 647} {"train_loss": -9.453394889831543, "global_step": 108776, "epoch": 647} {"train_loss": -9.843036651611328, "global_step": 108777, "epoch": 647} {"train_loss": -9.938167572021484, "global_step": 108778, "epoch": 647} {"train_loss": -9.762168884277344, "global_step": 108779, "epoch": 647} {"train_loss": -9.203134536743164, "global_step": 108780, "epoch": 647} {"train_loss": -9.89133358001709, "global_step": 108781, "epoch": 647} {"train_loss": -9.152984619140625, "global_step": 108782, "epoch": 647} {"train_loss": -9.542669296264648, "global_step": 108783, "epoch": 647} {"train_loss": -9.359739303588867, "global_step": 108784, "epoch": 647} {"train_loss": -9.710550308227539, "global_step": 108785, "epoch": 647} {"train_loss": -9.20938491821289, "global_step": 108786, "epoch": 647} {"train_loss": -9.699316024780273, "global_step": 108787, "epoch": 647} {"train_loss": -9.276172637939453, "global_step": 108788, "epoch": 647} {"train_loss": -9.311274528503418, "global_step": 108789, "epoch": 647} {"train_loss": -9.504685401916504, "global_step": 108790, "epoch": 647} {"train_loss": -9.871757507324219, "global_step": 108791, "epoch": 647} {"train_loss": -9.583304405212402, "global_step": 108792, "epoch": 647} {"train_loss": -9.581457138061523, "global_step": 108793, "epoch": 647} {"train_loss": -9.649173736572266, "global_step": 108794, "epoch": 647} {"train_loss": -9.41280460357666, "global_step": 108795, "epoch": 647} {"train_loss": -9.969286918640137, "global_step": 108796, "epoch": 647} {"train_loss": -9.575567245483398, "global_step": 108797, "epoch": 647} {"train_loss": -9.684244155883789, "global_step": 108798, "epoch": 647} {"train_loss": -9.842918395996094, "global_step": 108799, "epoch": 647} {"train_loss": -9.717276573181152, "global_step": 108800, "epoch": 647} {"train_loss": -9.728006362915039, "global_step": 108801, "epoch": 647} {"train_loss": -9.911237716674805, "global_step": 108802, "epoch": 647} {"train_loss": -9.948753356933594, "global_step": 108803, "epoch": 647} {"train_loss": -9.83523178100586, "global_step": 108804, "epoch": 647} {"train_loss": -9.73507308959961, "global_step": 108805, "epoch": 647} {"train_loss": -9.652436256408691, "global_step": 108806, "epoch": 647} {"train_loss": -9.754683494567871, "global_step": 108807, "epoch": 647} {"train_loss": -9.744361877441406, "global_step": 108808, "epoch": 647} {"train_loss": -10.104780197143555, "global_step": 108809, "epoch": 647} {"train_loss": -9.826589584350586, "global_step": 108810, "epoch": 647} {"train_loss": -10.118053436279297, "global_step": 108811, "epoch": 647} {"train_loss": -10.172420501708984, "global_step": 108812, "epoch": 647} {"train_loss": -9.85525131225586, "global_step": 108813, "epoch": 647} {"train_loss": -10.1203031539917, "global_step": 108814, "epoch": 647} {"train_loss": -10.171335220336914, "global_step": 108815, "epoch": 647} {"train_loss": -9.887239456176758, "global_step": 108816, "epoch": 647} {"train_loss": -10.206120491027832, "global_step": 108817, "epoch": 647} {"train_loss": -9.905954360961914, "global_step": 108818, "epoch": 647} {"train_loss": -10.118488311767578, "global_step": 108819, "epoch": 647} {"train_loss": -10.085624694824219, "global_step": 108820, "epoch": 647} {"train_loss": -9.824312210083008, "global_step": 108821, "epoch": 647} {"train_loss": -9.813628196716309, "global_step": 108822, "epoch": 647} {"train_loss": -10.18958854675293, "global_step": 108823, "epoch": 647} {"train_loss": -9.812945365905762, "global_step": 108824, "epoch": 647} {"train_loss": -10.005258560180664, "global_step": 108825, "epoch": 647} {"train_loss": -10.228431701660156, "global_step": 108826, "epoch": 647} {"train_loss": -10.009262084960938, "global_step": 108827, "epoch": 647} {"train_loss": -10.199613571166992, "global_step": 108828, "epoch": 647} {"train_loss": -10.076013565063477, "global_step": 108829, "epoch": 647} {"train_loss": -10.138076782226562, "global_step": 108830, "epoch": 647} {"train_loss": -10.042525291442871, "global_step": 108831, "epoch": 647} {"train_loss": -10.312150955200195, "global_step": 108832, "epoch": 647} {"train_loss": -9.850608825683594, "global_step": 108833, "epoch": 647} {"train_loss": -10.122050285339355, "global_step": 108834, "epoch": 647} {"train_loss": -10.154315948486328, "global_step": 108835, "epoch": 647} {"train_loss": -10.085443496704102, "global_step": 108836, "epoch": 647} {"train_loss": -10.220552444458008, "global_step": 108837, "epoch": 647} {"train_loss": -10.051247596740723, "global_step": 108838, "epoch": 647} {"train_loss": -10.381461143493652, "global_step": 108839, "epoch": 647} {"train_loss": -10.160398483276367, "global_step": 108840, "epoch": 647} {"train_loss": -10.101205825805664, "global_step": 108841, "epoch": 647} {"train_loss": -10.357474327087402, "global_step": 108842, "epoch": 647} {"train_loss": -10.250191688537598, "global_step": 108843, "epoch": 647} {"train_loss": -10.25045394897461, "global_step": 108844, "epoch": 647} {"train_loss": -10.08177375793457, "global_step": 108845, "epoch": 647} {"train_loss": -9.712565422058105, "global_step": 108846, "epoch": 647} {"train_loss": -9.831562042236328, "global_step": 108847, "epoch": 647} {"train_loss": -10.015731811523438, "global_step": 108848, "epoch": 647} {"train_loss": -10.177925109863281, "global_step": 108849, "epoch": 647} {"train_loss": -10.067266464233398, "global_step": 108850, "epoch": 647} {"train_loss": -9.652235984802246, "global_step": 108851, "epoch": 647} {"train_loss": -10.298470497131348, "global_step": 108852, "epoch": 647} {"train_loss": -9.99812126159668, "global_step": 108853, "epoch": 647} {"train_loss": -10.03886604309082, "global_step": 108854, "epoch": 647} {"train_loss": -10.24642276763916, "global_step": 108855, "epoch": 647} {"train_loss": -10.05233383178711, "global_step": 108856, "epoch": 647} {"train_loss": -9.361671447753906, "global_step": 108857, "epoch": 647} {"train_loss": -9.00313949584961, "global_step": 108858, "epoch": 647} {"train_loss": -10.233049392700195, "global_step": 108859, "epoch": 647} {"train_loss": -9.477620124816895, "global_step": 108860, "epoch": 647} {"train_loss": -8.874671936035156, "global_step": 108861, "epoch": 647} {"train_loss": -8.84358024597168, "global_step": 108862, "epoch": 647} {"train_loss": -9.844203818412055, "global_step": 108863, "epoch": 647, "val_loss": 209662.296875} {"train_loss": -9.022388458251953, "global_step": 108864, "epoch": 648} {"train_loss": -9.415236473083496, "global_step": 108865, "epoch": 648} {"train_loss": -9.027200698852539, "global_step": 108866, "epoch": 648} {"train_loss": -9.92626953125, "global_step": 108867, "epoch": 648} {"train_loss": -9.134838104248047, "global_step": 108868, "epoch": 648} {"train_loss": -9.434785842895508, "global_step": 108869, "epoch": 648} {"train_loss": -9.691086769104004, "global_step": 108870, "epoch": 648} {"train_loss": -9.264440536499023, "global_step": 108871, "epoch": 648} {"train_loss": -9.65258502960205, "global_step": 108872, "epoch": 648} {"train_loss": -9.700777053833008, "global_step": 108873, "epoch": 648} {"train_loss": -9.461785316467285, "global_step": 108874, "epoch": 648} {"train_loss": -9.711935997009277, "global_step": 108875, "epoch": 648} {"train_loss": -9.61381721496582, "global_step": 108876, "epoch": 648} {"train_loss": -9.592567443847656, "global_step": 108877, "epoch": 648} {"train_loss": -9.664087295532227, "global_step": 108878, "epoch": 648} {"train_loss": -9.483675003051758, "global_step": 108879, "epoch": 648} {"train_loss": -9.711016654968262, "global_step": 108880, "epoch": 648} {"train_loss": -9.7274169921875, "global_step": 108881, "epoch": 648} {"train_loss": -9.99502182006836, "global_step": 108882, "epoch": 648} {"train_loss": -9.921476364135742, "global_step": 108883, "epoch": 648} {"train_loss": -9.886162757873535, "global_step": 108884, "epoch": 648} {"train_loss": -9.826175689697266, "global_step": 108885, "epoch": 648} {"train_loss": -9.7799654006958, "global_step": 108886, "epoch": 648} {"train_loss": -9.961387634277344, "global_step": 108887, "epoch": 648} {"train_loss": -9.912046432495117, "global_step": 108888, "epoch": 648} {"train_loss": -9.908710479736328, "global_step": 108889, "epoch": 648} {"train_loss": -10.06093692779541, "global_step": 108890, "epoch": 648} {"train_loss": -9.909103393554688, "global_step": 108891, "epoch": 648} {"train_loss": -10.116889953613281, "global_step": 108892, "epoch": 648} {"train_loss": -10.0155611038208, "global_step": 108893, "epoch": 648} {"train_loss": -9.782533645629883, "global_step": 108894, "epoch": 648} {"train_loss": -9.947033882141113, "global_step": 108895, "epoch": 648} {"train_loss": -10.004379272460938, "global_step": 108896, "epoch": 648} {"train_loss": -9.931550025939941, "global_step": 108897, "epoch": 648} {"train_loss": -10.040738105773926, "global_step": 108898, "epoch": 648} {"train_loss": -10.105681419372559, "global_step": 108899, "epoch": 648} {"train_loss": -10.186810493469238, "global_step": 108900, "epoch": 648} {"train_loss": -9.854888916015625, "global_step": 108901, "epoch": 648} {"train_loss": -10.01336669921875, "global_step": 108902, "epoch": 648} {"train_loss": -10.105806350708008, "global_step": 108903, "epoch": 648} {"train_loss": -9.810379028320312, "global_step": 108904, "epoch": 648} {"train_loss": -10.145687103271484, "global_step": 108905, "epoch": 648} {"train_loss": -10.170150756835938, "global_step": 108906, "epoch": 648} {"train_loss": -10.061753273010254, "global_step": 108907, "epoch": 648} {"train_loss": -10.236698150634766, "global_step": 108908, "epoch": 648} {"train_loss": -10.273773193359375, "global_step": 108909, "epoch": 648} {"train_loss": -10.077707290649414, "global_step": 108910, "epoch": 648} {"train_loss": -10.156841278076172, "global_step": 108911, "epoch": 648} {"train_loss": -10.182300567626953, "global_step": 108912, "epoch": 648} {"train_loss": -10.083471298217773, "global_step": 108913, "epoch": 648} {"train_loss": -10.242990493774414, "global_step": 108914, "epoch": 648} {"train_loss": -10.049918174743652, "global_step": 108915, "epoch": 648} {"train_loss": -10.15114974975586, "global_step": 108916, "epoch": 648} {"train_loss": -9.306081771850586, "global_step": 108917, "epoch": 648} {"train_loss": -9.229040145874023, "global_step": 108918, "epoch": 648} {"train_loss": -9.549263000488281, "global_step": 108919, "epoch": 648} {"train_loss": -10.0421142578125, "global_step": 108920, "epoch": 648} {"train_loss": -9.749967575073242, "global_step": 108921, "epoch": 648} {"train_loss": -9.82259464263916, "global_step": 108922, "epoch": 648} {"train_loss": -9.9231538772583, "global_step": 108923, "epoch": 648} {"train_loss": -9.70394515991211, "global_step": 108924, "epoch": 648} {"train_loss": -9.89984130859375, "global_step": 108925, "epoch": 648} {"train_loss": -9.3720703125, "global_step": 108926, "epoch": 648} {"train_loss": -9.868945121765137, "global_step": 108927, "epoch": 648} {"train_loss": -9.602255821228027, "global_step": 108928, "epoch": 648} {"train_loss": -9.250080108642578, "global_step": 108929, "epoch": 648} {"train_loss": -10.111763000488281, "global_step": 108930, "epoch": 648} {"train_loss": -9.38236141204834, "global_step": 108931, "epoch": 648} {"train_loss": -9.78264045715332, "global_step": 108932, "epoch": 648} {"train_loss": -9.900789260864258, "global_step": 108933, "epoch": 648} {"train_loss": -9.347528457641602, "global_step": 108934, "epoch": 648} {"train_loss": -9.934547424316406, "global_step": 108935, "epoch": 648} {"train_loss": -9.951841354370117, "global_step": 108936, "epoch": 648} {"train_loss": -9.615163803100586, "global_step": 108937, "epoch": 648} {"train_loss": -9.961954116821289, "global_step": 108938, "epoch": 648} {"train_loss": -9.77143383026123, "global_step": 108939, "epoch": 648} {"train_loss": -9.993621826171875, "global_step": 108940, "epoch": 648} {"train_loss": -9.713704109191895, "global_step": 108941, "epoch": 648} {"train_loss": -9.855487823486328, "global_step": 108942, "epoch": 648} {"train_loss": -9.681612014770508, "global_step": 108943, "epoch": 648} {"train_loss": -9.809320449829102, "global_step": 108944, "epoch": 648} {"train_loss": -9.916351318359375, "global_step": 108945, "epoch": 648} {"train_loss": -9.864313125610352, "global_step": 108946, "epoch": 648} {"train_loss": -9.53990364074707, "global_step": 108947, "epoch": 648} {"train_loss": -9.969888687133789, "global_step": 108948, "epoch": 648} {"train_loss": -9.532022476196289, "global_step": 108949, "epoch": 648} {"train_loss": -9.698497772216797, "global_step": 108950, "epoch": 648} {"train_loss": -9.973272323608398, "global_step": 108951, "epoch": 648} {"train_loss": -9.773538589477539, "global_step": 108952, "epoch": 648} {"train_loss": -9.556747436523438, "global_step": 108953, "epoch": 648} {"train_loss": -9.724071502685547, "global_step": 108954, "epoch": 648} {"train_loss": -9.757875442504883, "global_step": 108955, "epoch": 648} {"train_loss": -9.573492050170898, "global_step": 108956, "epoch": 648} {"train_loss": -10.127113342285156, "global_step": 108957, "epoch": 648} {"train_loss": -9.745760917663574, "global_step": 108958, "epoch": 648} {"train_loss": -9.714406967163086, "global_step": 108959, "epoch": 648} {"train_loss": -9.876487731933594, "global_step": 108960, "epoch": 648} {"train_loss": -10.02699089050293, "global_step": 108961, "epoch": 648} {"train_loss": -9.850896835327148, "global_step": 108962, "epoch": 648} {"train_loss": -10.037193298339844, "global_step": 108963, "epoch": 648} {"train_loss": -10.02046012878418, "global_step": 108964, "epoch": 648} {"train_loss": -9.935667037963867, "global_step": 108965, "epoch": 648} {"train_loss": -10.02595043182373, "global_step": 108966, "epoch": 648} {"train_loss": -9.894973754882812, "global_step": 108967, "epoch": 648} {"train_loss": -10.017427444458008, "global_step": 108968, "epoch": 648} {"train_loss": -9.750001907348633, "global_step": 108969, "epoch": 648} {"train_loss": -10.0972900390625, "global_step": 108970, "epoch": 648} {"train_loss": -9.797094345092773, "global_step": 108971, "epoch": 648} {"train_loss": -9.864270210266113, "global_step": 108972, "epoch": 648} {"train_loss": -9.861547470092773, "global_step": 108973, "epoch": 648} {"train_loss": -9.972135543823242, "global_step": 108974, "epoch": 648} {"train_loss": -9.817758560180664, "global_step": 108975, "epoch": 648} {"train_loss": -10.17676067352295, "global_step": 108976, "epoch": 648} {"train_loss": -9.783515930175781, "global_step": 108977, "epoch": 648} {"train_loss": -9.768980026245117, "global_step": 108978, "epoch": 648} {"train_loss": -10.149081230163574, "global_step": 108979, "epoch": 648} {"train_loss": -10.230056762695312, "global_step": 108980, "epoch": 648} {"train_loss": -9.986856460571289, "global_step": 108981, "epoch": 648} {"train_loss": -10.052099227905273, "global_step": 108982, "epoch": 648} {"train_loss": -9.988981246948242, "global_step": 108983, "epoch": 648} {"train_loss": -9.803339004516602, "global_step": 108984, "epoch": 648} {"train_loss": -9.912528991699219, "global_step": 108985, "epoch": 648} {"train_loss": -9.806089401245117, "global_step": 108986, "epoch": 648} {"train_loss": -9.963092803955078, "global_step": 108987, "epoch": 648} {"train_loss": -9.850372314453125, "global_step": 108988, "epoch": 648} {"train_loss": -9.850125312805176, "global_step": 108989, "epoch": 648} {"train_loss": -9.868936538696289, "global_step": 108990, "epoch": 648} {"train_loss": -9.774248123168945, "global_step": 108991, "epoch": 648} {"train_loss": -9.729511260986328, "global_step": 108992, "epoch": 648} {"train_loss": -9.75788688659668, "global_step": 108993, "epoch": 648} {"train_loss": -9.543458938598633, "global_step": 108994, "epoch": 648} {"train_loss": -9.96802806854248, "global_step": 108995, "epoch": 648} {"train_loss": -9.623148918151855, "global_step": 108996, "epoch": 648} {"train_loss": -9.671599388122559, "global_step": 108997, "epoch": 648} {"train_loss": -9.968185424804688, "global_step": 108998, "epoch": 648} {"train_loss": -9.792926788330078, "global_step": 108999, "epoch": 648} {"train_loss": -9.973945617675781, "global_step": 109000, "epoch": 648} {"train_loss": -9.719053268432617, "global_step": 109001, "epoch": 648} {"train_loss": -9.957855224609375, "global_step": 109002, "epoch": 648} {"train_loss": -9.954615592956543, "global_step": 109003, "epoch": 648} {"train_loss": -9.929354667663574, "global_step": 109004, "epoch": 648} {"train_loss": -10.087347030639648, "global_step": 109005, "epoch": 648} {"train_loss": -10.123804092407227, "global_step": 109006, "epoch": 648} {"train_loss": -9.880891799926758, "global_step": 109007, "epoch": 648} {"train_loss": -9.878357887268066, "global_step": 109008, "epoch": 648} {"train_loss": -9.870565414428711, "global_step": 109009, "epoch": 648} {"train_loss": -9.913676261901855, "global_step": 109010, "epoch": 648} {"train_loss": -10.115795135498047, "global_step": 109011, "epoch": 648} {"train_loss": -9.800618171691895, "global_step": 109012, "epoch": 648} {"train_loss": -9.89171028137207, "global_step": 109013, "epoch": 648} {"train_loss": -9.740945816040039, "global_step": 109014, "epoch": 648} {"train_loss": -9.651124954223633, "global_step": 109015, "epoch": 648} {"train_loss": -10.03887939453125, "global_step": 109016, "epoch": 648} {"train_loss": -9.811267852783203, "global_step": 109017, "epoch": 648} {"train_loss": -9.874595642089844, "global_step": 109018, "epoch": 648} {"train_loss": -9.89321517944336, "global_step": 109019, "epoch": 648} {"train_loss": -9.9642972946167, "global_step": 109020, "epoch": 648} {"train_loss": -10.124943733215332, "global_step": 109021, "epoch": 648} {"train_loss": -9.900810241699219, "global_step": 109022, "epoch": 648} {"train_loss": -10.117267608642578, "global_step": 109023, "epoch": 648} {"train_loss": -9.915464401245117, "global_step": 109024, "epoch": 648} {"train_loss": -9.955266952514648, "global_step": 109025, "epoch": 648} {"train_loss": -10.21511459350586, "global_step": 109026, "epoch": 648} {"train_loss": -9.810420989990234, "global_step": 109027, "epoch": 648} {"train_loss": -9.872058868408203, "global_step": 109028, "epoch": 648} {"train_loss": -10.004380226135254, "global_step": 109029, "epoch": 648} {"train_loss": -9.983903884887695, "global_step": 109030, "epoch": 648} {"train_loss": -9.848518666766939, "global_step": 109031, "epoch": 648, "val_loss": 208734.96875} {"train_loss": -10.026704788208008, "global_step": 109032, "epoch": 649} {"train_loss": -9.98842716217041, "global_step": 109033, "epoch": 649} {"train_loss": -9.905729293823242, "global_step": 109034, "epoch": 649} {"train_loss": -10.028227806091309, "global_step": 109035, "epoch": 649} {"train_loss": -9.946898460388184, "global_step": 109036, "epoch": 649} {"train_loss": -10.045144081115723, "global_step": 109037, "epoch": 649} {"train_loss": -10.028307914733887, "global_step": 109038, "epoch": 649} {"train_loss": -9.900474548339844, "global_step": 109039, "epoch": 649} {"train_loss": -10.16458797454834, "global_step": 109040, "epoch": 649} {"train_loss": -9.998651504516602, "global_step": 109041, "epoch": 649} {"train_loss": -10.069365501403809, "global_step": 109042, "epoch": 649} {"train_loss": -10.20756721496582, "global_step": 109043, "epoch": 649} {"train_loss": -9.783329963684082, "global_step": 109044, "epoch": 649} {"train_loss": -10.236886978149414, "global_step": 109045, "epoch": 649} {"train_loss": -10.064373016357422, "global_step": 109046, "epoch": 649} {"train_loss": -9.832603454589844, "global_step": 109047, "epoch": 649} {"train_loss": -9.929064750671387, "global_step": 109048, "epoch": 649} {"train_loss": -10.054327011108398, "global_step": 109049, "epoch": 649} {"train_loss": -9.792019844055176, "global_step": 109050, "epoch": 649} {"train_loss": -9.74915885925293, "global_step": 109051, "epoch": 649} {"train_loss": -9.731990814208984, "global_step": 109052, "epoch": 649} {"train_loss": -9.60291862487793, "global_step": 109053, "epoch": 649} {"train_loss": -9.287793159484863, "global_step": 109054, "epoch": 649} {"train_loss": -10.051909446716309, "global_step": 109055, "epoch": 649} {"train_loss": -9.481481552124023, "global_step": 109056, "epoch": 649} {"train_loss": -9.849931716918945, "global_step": 109057, "epoch": 649} {"train_loss": -9.937898635864258, "global_step": 109058, "epoch": 649} {"train_loss": -9.484981536865234, "global_step": 109059, "epoch": 649} {"train_loss": -9.709147453308105, "global_step": 109060, "epoch": 649} {"train_loss": -9.810966491699219, "global_step": 109061, "epoch": 649} {"train_loss": -10.025649070739746, "global_step": 109062, "epoch": 649} {"train_loss": -9.80713176727295, "global_step": 109063, "epoch": 649} {"train_loss": -9.966075897216797, "global_step": 109064, "epoch": 649} {"train_loss": -9.969255447387695, "global_step": 109065, "epoch": 649} {"train_loss": -9.876051902770996, "global_step": 109066, "epoch": 649} {"train_loss": -9.912166595458984, "global_step": 109067, "epoch": 649} {"train_loss": -10.129255294799805, "global_step": 109068, "epoch": 649} {"train_loss": -9.65744400024414, "global_step": 109069, "epoch": 649} {"train_loss": -9.881831169128418, "global_step": 109070, "epoch": 649} {"train_loss": -9.698783874511719, "global_step": 109071, "epoch": 649} {"train_loss": -9.872889518737793, "global_step": 109072, "epoch": 649} {"train_loss": -9.740559577941895, "global_step": 109073, "epoch": 649} {"train_loss": -10.006385803222656, "global_step": 109074, "epoch": 649} {"train_loss": -10.15713119506836, "global_step": 109075, "epoch": 649} {"train_loss": -10.1437406539917, "global_step": 109076, "epoch": 649} {"train_loss": -9.986001968383789, "global_step": 109077, "epoch": 649} {"train_loss": -9.74972152709961, "global_step": 109078, "epoch": 649} {"train_loss": -10.250716209411621, "global_step": 109079, "epoch": 649} {"train_loss": -10.02475357055664, "global_step": 109080, "epoch": 649} {"train_loss": -10.212443351745605, "global_step": 109081, "epoch": 649} {"train_loss": -9.97779655456543, "global_step": 109082, "epoch": 649} {"train_loss": -10.09425163269043, "global_step": 109083, "epoch": 649} {"train_loss": -10.11197280883789, "global_step": 109084, "epoch": 649} {"train_loss": -10.195981979370117, "global_step": 109085, "epoch": 649} {"train_loss": -9.817785263061523, "global_step": 109086, "epoch": 649} {"train_loss": -10.000567436218262, "global_step": 109087, "epoch": 649} {"train_loss": -9.9187593460083, "global_step": 109088, "epoch": 649} {"train_loss": -10.23836898803711, "global_step": 109089, "epoch": 649} {"train_loss": -9.970399856567383, "global_step": 109090, "epoch": 649} {"train_loss": -10.085906982421875, "global_step": 109091, "epoch": 649} {"train_loss": -9.946056365966797, "global_step": 109092, "epoch": 649} {"train_loss": -10.319060325622559, "global_step": 109093, "epoch": 649} {"train_loss": -10.142274856567383, "global_step": 109094, "epoch": 649} {"train_loss": -10.086640357971191, "global_step": 109095, "epoch": 649} {"train_loss": -10.043115615844727, "global_step": 109096, "epoch": 649} {"train_loss": -10.159083366394043, "global_step": 109097, "epoch": 649} {"train_loss": -10.089620590209961, "global_step": 109098, "epoch": 649} {"train_loss": -10.178597450256348, "global_step": 109099, "epoch": 649} {"train_loss": -9.987704277038574, "global_step": 109100, "epoch": 649} {"train_loss": -9.971078872680664, "global_step": 109101, "epoch": 649} {"train_loss": -9.871248245239258, "global_step": 109102, "epoch": 649} {"train_loss": -9.987762451171875, "global_step": 109103, "epoch": 649} {"train_loss": -10.154693603515625, "global_step": 109104, "epoch": 649} {"train_loss": -9.907034873962402, "global_step": 109105, "epoch": 649} {"train_loss": -10.183849334716797, "global_step": 109106, "epoch": 649} {"train_loss": -9.784994125366211, "global_step": 109107, "epoch": 649} {"train_loss": -9.736600875854492, "global_step": 109108, "epoch": 649} {"train_loss": -10.075779914855957, "global_step": 109109, "epoch": 649} {"train_loss": -9.175697326660156, "global_step": 109110, "epoch": 649} {"train_loss": -9.776598930358887, "global_step": 109111, "epoch": 649} {"train_loss": -9.665936470031738, "global_step": 109112, "epoch": 649} {"train_loss": -9.507101058959961, "global_step": 109113, "epoch": 649} {"train_loss": -9.817569732666016, "global_step": 109114, "epoch": 649} {"train_loss": -9.40742301940918, "global_step": 109115, "epoch": 649} {"train_loss": -9.521867752075195, "global_step": 109116, "epoch": 649} {"train_loss": -9.533020973205566, "global_step": 109117, "epoch": 649} {"train_loss": -9.729759216308594, "global_step": 109118, "epoch": 649} {"train_loss": -9.783269882202148, "global_step": 109119, "epoch": 649} {"train_loss": -9.636543273925781, "global_step": 109120, "epoch": 649} {"train_loss": -9.505691528320312, "global_step": 109121, "epoch": 649} {"train_loss": -9.814081192016602, "global_step": 109122, "epoch": 649} {"train_loss": -9.708294868469238, "global_step": 109123, "epoch": 649} {"train_loss": -9.934067726135254, "global_step": 109124, "epoch": 649} {"train_loss": -9.681941986083984, "global_step": 109125, "epoch": 649} {"train_loss": -9.751653671264648, "global_step": 109126, "epoch": 649} {"train_loss": -9.811800956726074, "global_step": 109127, "epoch": 649} {"train_loss": -9.758606910705566, "global_step": 109128, "epoch": 649} {"train_loss": -9.533100128173828, "global_step": 109129, "epoch": 649} {"train_loss": -9.804250717163086, "global_step": 109130, "epoch": 649} {"train_loss": -10.000243186950684, "global_step": 109131, "epoch": 649} {"train_loss": -9.763399124145508, "global_step": 109132, "epoch": 649} {"train_loss": -9.705522537231445, "global_step": 109133, "epoch": 649} {"train_loss": -9.98190689086914, "global_step": 109134, "epoch": 649} {"train_loss": -9.841598510742188, "global_step": 109135, "epoch": 649} {"train_loss": -9.953104972839355, "global_step": 109136, "epoch": 649} {"train_loss": -10.033937454223633, "global_step": 109137, "epoch": 649} {"train_loss": -9.97850227355957, "global_step": 109138, "epoch": 649} {"train_loss": -10.023721694946289, "global_step": 109139, "epoch": 649} {"train_loss": -9.99039077758789, "global_step": 109140, "epoch": 649} {"train_loss": -9.960606575012207, "global_step": 109141, "epoch": 649} {"train_loss": -9.87051010131836, "global_step": 109142, "epoch": 649} {"train_loss": -9.99261474609375, "global_step": 109143, "epoch": 649} {"train_loss": -10.167482376098633, "global_step": 109144, "epoch": 649} {"train_loss": -10.186424255371094, "global_step": 109145, "epoch": 649} {"train_loss": -9.871405601501465, "global_step": 109146, "epoch": 649} {"train_loss": -9.872804641723633, "global_step": 109147, "epoch": 649} {"train_loss": -10.057764053344727, "global_step": 109148, "epoch": 649} {"train_loss": -9.596030235290527, "global_step": 109149, "epoch": 649} {"train_loss": -10.085397720336914, "global_step": 109150, "epoch": 649} {"train_loss": -9.839004516601562, "global_step": 109151, "epoch": 649} {"train_loss": -9.825709342956543, "global_step": 109152, "epoch": 649} {"train_loss": -10.080488204956055, "global_step": 109153, "epoch": 649} {"train_loss": -9.84379768371582, "global_step": 109154, "epoch": 649} {"train_loss": -10.028972625732422, "global_step": 109155, "epoch": 649} {"train_loss": -9.953923225402832, "global_step": 109156, "epoch": 649} {"train_loss": -9.79001235961914, "global_step": 109157, "epoch": 649} {"train_loss": -9.989543914794922, "global_step": 109158, "epoch": 649} {"train_loss": -9.944798469543457, "global_step": 109159, "epoch": 649} {"train_loss": -10.009045600891113, "global_step": 109160, "epoch": 649} {"train_loss": -10.14822769165039, "global_step": 109161, "epoch": 649} {"train_loss": -9.592482566833496, "global_step": 109162, "epoch": 649} {"train_loss": -9.90147876739502, "global_step": 109163, "epoch": 649} {"train_loss": -10.104098320007324, "global_step": 109164, "epoch": 649} {"train_loss": -9.641592025756836, "global_step": 109165, "epoch": 649} {"train_loss": -10.065095901489258, "global_step": 109166, "epoch": 649} {"train_loss": -9.330814361572266, "global_step": 109167, "epoch": 649} {"train_loss": -9.900798797607422, "global_step": 109168, "epoch": 649} {"train_loss": -9.833000183105469, "global_step": 109169, "epoch": 649} {"train_loss": -10.137286186218262, "global_step": 109170, "epoch": 649} {"train_loss": -10.121362686157227, "global_step": 109171, "epoch": 649} {"train_loss": -9.905330657958984, "global_step": 109172, "epoch": 649} {"train_loss": -10.103248596191406, "global_step": 109173, "epoch": 649} {"train_loss": -9.981236457824707, "global_step": 109174, "epoch": 649} {"train_loss": -10.018595695495605, "global_step": 109175, "epoch": 649} {"train_loss": -10.019067764282227, "global_step": 109176, "epoch": 649} {"train_loss": -10.0615873336792, "global_step": 109177, "epoch": 649} {"train_loss": -10.19241714477539, "global_step": 109178, "epoch": 649} {"train_loss": -9.968055725097656, "global_step": 109179, "epoch": 649} {"train_loss": -9.956121444702148, "global_step": 109180, "epoch": 649} {"train_loss": -9.915735244750977, "global_step": 109181, "epoch": 649} {"train_loss": -9.909625053405762, "global_step": 109182, "epoch": 649} {"train_loss": -10.250787734985352, "global_step": 109183, "epoch": 649} {"train_loss": -10.0129976272583, "global_step": 109184, "epoch": 649} {"train_loss": -10.077123641967773, "global_step": 109185, "epoch": 649} {"train_loss": -9.781953811645508, "global_step": 109186, "epoch": 649} {"train_loss": -10.0891695022583, "global_step": 109187, "epoch": 649} {"train_loss": -10.195968627929688, "global_step": 109188, "epoch": 649} {"train_loss": -9.593088150024414, "global_step": 109189, "epoch": 649} {"train_loss": -10.316121101379395, "global_step": 109190, "epoch": 649} {"train_loss": -9.706459045410156, "global_step": 109191, "epoch": 649} {"train_loss": -9.976327896118164, "global_step": 109192, "epoch": 649} {"train_loss": -9.930383682250977, "global_step": 109193, "epoch": 649} {"train_loss": -9.80473518371582, "global_step": 109194, "epoch": 649} {"train_loss": -10.099081039428711, "global_step": 109195, "epoch": 649} {"train_loss": -9.713529586791992, "global_step": 109196, "epoch": 649} {"train_loss": -10.056777954101562, "global_step": 109197, "epoch": 649} {"train_loss": -9.710738182067871, "global_step": 109198, "epoch": 649} {"train_loss": -9.915621286346799, "global_step": 109199, "epoch": 649, "val_loss": 208630.90625} {"train_loss": -9.814682006835938, "global_step": 109200, "epoch": 650} {"train_loss": -9.7608642578125, "global_step": 109201, "epoch": 650} {"train_loss": -9.817403793334961, "global_step": 109202, "epoch": 650} {"train_loss": -9.928707122802734, "global_step": 109203, "epoch": 650} {"train_loss": -9.946195602416992, "global_step": 109204, "epoch": 650} {"train_loss": -10.029401779174805, "global_step": 109205, "epoch": 650} {"train_loss": -9.89938735961914, "global_step": 109206, "epoch": 650} {"train_loss": -10.04818058013916, "global_step": 109207, "epoch": 650} {"train_loss": -10.017776489257812, "global_step": 109208, "epoch": 650} {"train_loss": -9.79112720489502, "global_step": 109209, "epoch": 650} {"train_loss": -9.75474739074707, "global_step": 109210, "epoch": 650} {"train_loss": -9.78799819946289, "global_step": 109211, "epoch": 650} {"train_loss": -9.9490966796875, "global_step": 109212, "epoch": 650} {"train_loss": -9.887557029724121, "global_step": 109213, "epoch": 650} {"train_loss": -9.828866958618164, "global_step": 109214, "epoch": 650} {"train_loss": -9.937788009643555, "global_step": 109215, "epoch": 650} {"train_loss": -9.684404373168945, "global_step": 109216, "epoch": 650} {"train_loss": -9.703182220458984, "global_step": 109217, "epoch": 650} {"train_loss": -9.853229522705078, "global_step": 109218, "epoch": 650} {"train_loss": -9.786910057067871, "global_step": 109219, "epoch": 650} {"train_loss": -9.68140983581543, "global_step": 109220, "epoch": 650} {"train_loss": -9.92069149017334, "global_step": 109221, "epoch": 650} {"train_loss": -9.771313667297363, "global_step": 109222, "epoch": 650} {"train_loss": -9.834173202514648, "global_step": 109223, "epoch": 650} {"train_loss": -9.793230056762695, "global_step": 109224, "epoch": 650} {"train_loss": -9.769876480102539, "global_step": 109225, "epoch": 650} {"train_loss": -10.08458423614502, "global_step": 109226, "epoch": 650} {"train_loss": -9.747653007507324, "global_step": 109227, "epoch": 650} {"train_loss": -10.092182159423828, "global_step": 109228, "epoch": 650} {"train_loss": -9.855899810791016, "global_step": 109229, "epoch": 650} {"train_loss": -10.035786628723145, "global_step": 109230, "epoch": 650} {"train_loss": -9.706218719482422, "global_step": 109231, "epoch": 650} {"train_loss": -9.73281478881836, "global_step": 109232, "epoch": 650} {"train_loss": -9.784210205078125, "global_step": 109233, "epoch": 650} {"train_loss": -10.134754180908203, "global_step": 109234, "epoch": 650} {"train_loss": -9.773889541625977, "global_step": 109235, "epoch": 650} {"train_loss": -10.382164001464844, "global_step": 109236, "epoch": 650} {"train_loss": -9.372259140014648, "global_step": 109237, "epoch": 650} {"train_loss": -9.879842758178711, "global_step": 109238, "epoch": 650} {"train_loss": -9.946784973144531, "global_step": 109239, "epoch": 650} {"train_loss": -9.76863956451416, "global_step": 109240, "epoch": 650} {"train_loss": -9.919870376586914, "global_step": 109241, "epoch": 650} {"train_loss": -10.167051315307617, "global_step": 109242, "epoch": 650} {"train_loss": -9.817670822143555, "global_step": 109243, "epoch": 650} {"train_loss": -10.068584442138672, "global_step": 109244, "epoch": 650} {"train_loss": -9.945337295532227, "global_step": 109245, "epoch": 650} {"train_loss": -9.836041450500488, "global_step": 109246, "epoch": 650} {"train_loss": -9.959016799926758, "global_step": 109247, "epoch": 650} {"train_loss": -9.96985149383545, "global_step": 109248, "epoch": 650} {"train_loss": -9.98635196685791, "global_step": 109249, "epoch": 650} {"train_loss": -9.761177062988281, "global_step": 109250, "epoch": 650} {"train_loss": -9.75448226928711, "global_step": 109251, "epoch": 650} {"train_loss": -9.859415054321289, "global_step": 109252, "epoch": 650} {"train_loss": -9.914896965026855, "global_step": 109253, "epoch": 650} {"train_loss": -9.721905708312988, "global_step": 109254, "epoch": 650} {"train_loss": -9.430828094482422, "global_step": 109255, "epoch": 650} {"train_loss": -10.144912719726562, "global_step": 109256, "epoch": 650} {"train_loss": -9.14220142364502, "global_step": 109257, "epoch": 650} {"train_loss": -9.755472183227539, "global_step": 109258, "epoch": 650} {"train_loss": -9.13475513458252, "global_step": 109259, "epoch": 650} {"train_loss": -9.640670776367188, "global_step": 109260, "epoch": 650} {"train_loss": -9.209665298461914, "global_step": 109261, "epoch": 650} {"train_loss": -9.60838508605957, "global_step": 109262, "epoch": 650} {"train_loss": -9.499073028564453, "global_step": 109263, "epoch": 650} {"train_loss": -9.518472671508789, "global_step": 109264, "epoch": 650} {"train_loss": -9.895133972167969, "global_step": 109265, "epoch": 650} {"train_loss": -9.753633499145508, "global_step": 109266, "epoch": 650} {"train_loss": -9.655265808105469, "global_step": 109267, "epoch": 650} {"train_loss": -9.77197265625, "global_step": 109268, "epoch": 650} {"train_loss": -9.687259674072266, "global_step": 109269, "epoch": 650} {"train_loss": -9.508238792419434, "global_step": 109270, "epoch": 650} {"train_loss": -9.830652236938477, "global_step": 109271, "epoch": 650} {"train_loss": -9.717395782470703, "global_step": 109272, "epoch": 650} {"train_loss": -9.662323951721191, "global_step": 109273, "epoch": 650} {"train_loss": -9.808284759521484, "global_step": 109274, "epoch": 650} {"train_loss": -9.613560676574707, "global_step": 109275, "epoch": 650} {"train_loss": -9.981618881225586, "global_step": 109276, "epoch": 650} {"train_loss": -9.783044815063477, "global_step": 109277, "epoch": 650} {"train_loss": -10.019515991210938, "global_step": 109278, "epoch": 650} {"train_loss": -9.668427467346191, "global_step": 109279, "epoch": 650} {"train_loss": -9.992452621459961, "global_step": 109280, "epoch": 650} {"train_loss": -9.883855819702148, "global_step": 109281, "epoch": 650} {"train_loss": -9.592611312866211, "global_step": 109282, "epoch": 650} {"train_loss": -9.964302062988281, "global_step": 109283, "epoch": 650} {"train_loss": -9.834388732910156, "global_step": 109284, "epoch": 650} {"train_loss": -9.854812622070312, "global_step": 109285, "epoch": 650} {"train_loss": -9.8628568649292, "global_step": 109286, "epoch": 650} {"train_loss": -9.727346420288086, "global_step": 109287, "epoch": 650} {"train_loss": -9.753467559814453, "global_step": 109288, "epoch": 650} {"train_loss": -9.833839416503906, "global_step": 109289, "epoch": 650} {"train_loss": -9.862541198730469, "global_step": 109290, "epoch": 650} {"train_loss": -10.111369132995605, "global_step": 109291, "epoch": 650} {"train_loss": -9.70400619506836, "global_step": 109292, "epoch": 650} {"train_loss": -9.601792335510254, "global_step": 109293, "epoch": 650} {"train_loss": -9.946036338806152, "global_step": 109294, "epoch": 650} {"train_loss": -9.852341651916504, "global_step": 109295, "epoch": 650} {"train_loss": -9.889951705932617, "global_step": 109296, "epoch": 650} {"train_loss": -9.910551071166992, "global_step": 109297, "epoch": 650} {"train_loss": -10.27192497253418, "global_step": 109298, "epoch": 650} {"train_loss": -9.593194961547852, "global_step": 109299, "epoch": 650} {"train_loss": -10.066015243530273, "global_step": 109300, "epoch": 650} {"train_loss": -9.682624816894531, "global_step": 109301, "epoch": 650} {"train_loss": -9.929341316223145, "global_step": 109302, "epoch": 650} {"train_loss": -9.695257186889648, "global_step": 109303, "epoch": 650} {"train_loss": -9.90673542022705, "global_step": 109304, "epoch": 650} {"train_loss": -10.020264625549316, "global_step": 109305, "epoch": 650} {"train_loss": -10.113558769226074, "global_step": 109306, "epoch": 650} {"train_loss": -9.904464721679688, "global_step": 109307, "epoch": 650} {"train_loss": -9.706403732299805, "global_step": 109308, "epoch": 650} {"train_loss": -9.987321853637695, "global_step": 109309, "epoch": 650} {"train_loss": -10.003092765808105, "global_step": 109310, "epoch": 650} {"train_loss": -9.960861206054688, "global_step": 109311, "epoch": 650} {"train_loss": -9.962642669677734, "global_step": 109312, "epoch": 650} {"train_loss": -9.966960906982422, "global_step": 109313, "epoch": 650} {"train_loss": -9.939343452453613, "global_step": 109314, "epoch": 650} {"train_loss": -10.025199890136719, "global_step": 109315, "epoch": 650} {"train_loss": -10.199304580688477, "global_step": 109316, "epoch": 650} {"train_loss": -10.017292976379395, "global_step": 109317, "epoch": 650} {"train_loss": -10.135331153869629, "global_step": 109318, "epoch": 650} {"train_loss": -10.005221366882324, "global_step": 109319, "epoch": 650} {"train_loss": -9.861519813537598, "global_step": 109320, "epoch": 650} {"train_loss": -9.902950286865234, "global_step": 109321, "epoch": 650} {"train_loss": -9.994779586791992, "global_step": 109322, "epoch": 650} {"train_loss": -9.891307830810547, "global_step": 109323, "epoch": 650} {"train_loss": -10.241827964782715, "global_step": 109324, "epoch": 650} {"train_loss": -9.914283752441406, "global_step": 109325, "epoch": 650} {"train_loss": -9.951593399047852, "global_step": 109326, "epoch": 650} {"train_loss": -9.861146926879883, "global_step": 109327, "epoch": 650} {"train_loss": -9.988212585449219, "global_step": 109328, "epoch": 650} {"train_loss": -10.084321975708008, "global_step": 109329, "epoch": 650} {"train_loss": -9.911460876464844, "global_step": 109330, "epoch": 650} {"train_loss": -10.065646171569824, "global_step": 109331, "epoch": 650} {"train_loss": -9.961244583129883, "global_step": 109332, "epoch": 650} {"train_loss": -10.072160720825195, "global_step": 109333, "epoch": 650} {"train_loss": -10.184659957885742, "global_step": 109334, "epoch": 650} {"train_loss": -9.924821853637695, "global_step": 109335, "epoch": 650} {"train_loss": -9.587374687194824, "global_step": 109336, "epoch": 650} {"train_loss": -10.141741752624512, "global_step": 109337, "epoch": 650} {"train_loss": -9.833917617797852, "global_step": 109338, "epoch": 650} {"train_loss": -10.088644027709961, "global_step": 109339, "epoch": 650} {"train_loss": -9.318812370300293, "global_step": 109340, "epoch": 650} {"train_loss": -10.031925201416016, "global_step": 109341, "epoch": 650} {"train_loss": -9.890199661254883, "global_step": 109342, "epoch": 650} {"train_loss": -10.102157592773438, "global_step": 109343, "epoch": 650} {"train_loss": -9.620162010192871, "global_step": 109344, "epoch": 650} {"train_loss": -10.091277122497559, "global_step": 109345, "epoch": 650} {"train_loss": -9.923016548156738, "global_step": 109346, "epoch": 650} {"train_loss": -9.689679145812988, "global_step": 109347, "epoch": 650} {"train_loss": -9.808577537536621, "global_step": 109348, "epoch": 650} {"train_loss": -9.57339859008789, "global_step": 109349, "epoch": 650} {"train_loss": -9.896817207336426, "global_step": 109350, "epoch": 650} {"train_loss": -9.664647102355957, "global_step": 109351, "epoch": 650} {"train_loss": -9.650381088256836, "global_step": 109352, "epoch": 650} {"train_loss": -9.717981338500977, "global_step": 109353, "epoch": 650} {"train_loss": -9.512688636779785, "global_step": 109354, "epoch": 650} {"train_loss": -9.569622039794922, "global_step": 109355, "epoch": 650} {"train_loss": -9.314310073852539, "global_step": 109356, "epoch": 650} {"train_loss": -9.849711418151855, "global_step": 109357, "epoch": 650} {"train_loss": -9.511382102966309, "global_step": 109358, "epoch": 650} {"train_loss": -9.40166187286377, "global_step": 109359, "epoch": 650} {"train_loss": -9.8152437210083, "global_step": 109360, "epoch": 650} {"train_loss": -9.574142456054688, "global_step": 109361, "epoch": 650} {"train_loss": -10.039952278137207, "global_step": 109362, "epoch": 650} {"train_loss": -9.687747955322266, "global_step": 109363, "epoch": 650} {"train_loss": -9.846799850463867, "global_step": 109364, "epoch": 650} {"train_loss": -9.41778564453125, "global_step": 109365, "epoch": 650} {"train_loss": -9.839149475097656, "global_step": 109366, "epoch": 650} {"train_loss": -9.833981417474293, "global_step": 109367, "epoch": 650, "train/sim_max_reward_0": 0.440029486524949, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.006679449111793195, "train/sim_max_reward_3": 0.6213802237013631, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.5062623839873658, "test/sim_max_reward_4400000": 0.2783347627479508, "test/sim_max_reward_4400001": 0.3598310866967035, "test/sim_max_reward_4400002": 0.5118681887565469, "test/sim_max_reward_4400003": 0.3267023627986985, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 0.9757881672807215, "test/sim_max_reward_4400006": 0.4025502470610227, "test/sim_max_reward_4400007": 0.9803797148095572, "test/sim_max_reward_4400008": 0.7227441478125345, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 0.23792081236994736, "test/sim_max_reward_4400011": 0.8896315893201134, "test/sim_max_reward_4400012": 0.9895138387958022, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.6442112294667752, "test/sim_max_reward_4400015": 0.9803123580930755, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9644512478009889, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9916854235251605, "test/sim_max_reward_4400023": 0.14412286948624708, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6199318423207238, "test/sim_max_reward_4400026": 0.6236396827419782, "test/sim_max_reward_4400027": 0.45312708844516725, "test/sim_max_reward_4400028": 0.7073696890997878, "test/sim_max_reward_4400029": 1.0, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9900345947997612, "test/sim_max_reward_4400034": 0.9814766597411438, "test/sim_max_reward_4400035": 0.8293544750124653, "test/sim_max_reward_4400036": 0.37421961767721207, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.721714869185234, "test/sim_max_reward_4400042": 0.9985557078031563, "test/sim_max_reward_4400043": 0.9510371066697154, "test/sim_max_reward_4400044": 0.9459865149173932, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.5957252572209119, "test/mean_score": 0.6399419028563451, "val_loss": 208644.8125, "train_action_mse_error": 2.9301652908325195} {"train_loss": -10.029062271118164, "global_step": 109368, "epoch": 651} {"train_loss": -9.872154235839844, "global_step": 109369, "epoch": 651} {"train_loss": -9.631455421447754, "global_step": 109370, "epoch": 651} {"train_loss": -9.76747989654541, "global_step": 109371, "epoch": 651} {"train_loss": -9.400341033935547, "global_step": 109372, "epoch": 651} {"train_loss": -9.852640151977539, "global_step": 109373, "epoch": 651} {"train_loss": -9.206035614013672, "global_step": 109374, "epoch": 651} {"train_loss": -9.909379005432129, "global_step": 109375, "epoch": 651} {"train_loss": -9.456185340881348, "global_step": 109376, "epoch": 651} {"train_loss": -9.82245922088623, "global_step": 109377, "epoch": 651} {"train_loss": -9.763208389282227, "global_step": 109378, "epoch": 651} {"train_loss": -9.993709564208984, "global_step": 109379, "epoch": 651} {"train_loss": -9.811710357666016, "global_step": 109380, "epoch": 651} {"train_loss": -9.879959106445312, "global_step": 109381, "epoch": 651} {"train_loss": -9.52639389038086, "global_step": 109382, "epoch": 651} {"train_loss": -9.894265174865723, "global_step": 109383, "epoch": 651} {"train_loss": -9.8408203125, "global_step": 109384, "epoch": 651} {"train_loss": -9.996458053588867, "global_step": 109385, "epoch": 651} {"train_loss": -9.680343627929688, "global_step": 109386, "epoch": 651} {"train_loss": -9.822933197021484, "global_step": 109387, "epoch": 651} {"train_loss": -10.130393981933594, "global_step": 109388, "epoch": 651} {"train_loss": -9.677412033081055, "global_step": 109389, "epoch": 651} {"train_loss": -9.778875350952148, "global_step": 109390, "epoch": 651} {"train_loss": -9.909636497497559, "global_step": 109391, "epoch": 651} {"train_loss": -9.930498123168945, "global_step": 109392, "epoch": 651} {"train_loss": -10.062068939208984, "global_step": 109393, "epoch": 651} {"train_loss": -10.209096908569336, "global_step": 109394, "epoch": 651} {"train_loss": -10.118997573852539, "global_step": 109395, "epoch": 651} {"train_loss": -9.913352966308594, "global_step": 109396, "epoch": 651} {"train_loss": -10.029532432556152, "global_step": 109397, "epoch": 651} {"train_loss": -9.690574645996094, "global_step": 109398, "epoch": 651} {"train_loss": -10.093554496765137, "global_step": 109399, "epoch": 651} {"train_loss": -9.863773345947266, "global_step": 109400, "epoch": 651} {"train_loss": -9.81234073638916, "global_step": 109401, "epoch": 651} {"train_loss": -10.09678840637207, "global_step": 109402, "epoch": 651} {"train_loss": -10.065685272216797, "global_step": 109403, "epoch": 651} {"train_loss": -10.28915023803711, "global_step": 109404, "epoch": 651} {"train_loss": -10.096563339233398, "global_step": 109405, "epoch": 651} {"train_loss": -10.221630096435547, "global_step": 109406, "epoch": 651} {"train_loss": -10.231283187866211, "global_step": 109407, "epoch": 651} {"train_loss": -10.10040283203125, "global_step": 109408, "epoch": 651} {"train_loss": -10.223697662353516, "global_step": 109409, "epoch": 651} {"train_loss": -10.237311363220215, "global_step": 109410, "epoch": 651} {"train_loss": -10.216124534606934, "global_step": 109411, "epoch": 651} {"train_loss": -10.042928695678711, "global_step": 109412, "epoch": 651} {"train_loss": -10.039522171020508, "global_step": 109413, "epoch": 651} {"train_loss": -10.224000930786133, "global_step": 109414, "epoch": 651} {"train_loss": -9.915912628173828, "global_step": 109415, "epoch": 651} {"train_loss": -10.290088653564453, "global_step": 109416, "epoch": 651} {"train_loss": -9.903097152709961, "global_step": 109417, "epoch": 651} {"train_loss": -10.01087760925293, "global_step": 109418, "epoch": 651} {"train_loss": -10.175771713256836, "global_step": 109419, "epoch": 651} {"train_loss": -10.044591903686523, "global_step": 109420, "epoch": 651} {"train_loss": -9.824127197265625, "global_step": 109421, "epoch": 651} {"train_loss": -9.705854415893555, "global_step": 109422, "epoch": 651} {"train_loss": -9.671749114990234, "global_step": 109423, "epoch": 651} {"train_loss": -9.72642993927002, "global_step": 109424, "epoch": 651} {"train_loss": -10.010822296142578, "global_step": 109425, "epoch": 651} {"train_loss": -9.817237854003906, "global_step": 109426, "epoch": 651} {"train_loss": -9.553308486938477, "global_step": 109427, "epoch": 651} {"train_loss": -10.044979095458984, "global_step": 109428, "epoch": 651} {"train_loss": -9.369094848632812, "global_step": 109429, "epoch": 651} {"train_loss": -9.30760383605957, "global_step": 109430, "epoch": 651} {"train_loss": -9.654294967651367, "global_step": 109431, "epoch": 651} {"train_loss": -9.393163681030273, "global_step": 109432, "epoch": 651} {"train_loss": -9.34528636932373, "global_step": 109433, "epoch": 651} {"train_loss": -10.069159507751465, "global_step": 109434, "epoch": 651} {"train_loss": -9.578683853149414, "global_step": 109435, "epoch": 651} {"train_loss": -9.740447998046875, "global_step": 109436, "epoch": 651} {"train_loss": -9.705852508544922, "global_step": 109437, "epoch": 651} {"train_loss": -9.669113159179688, "global_step": 109438, "epoch": 651} {"train_loss": -9.625404357910156, "global_step": 109439, "epoch": 651} {"train_loss": -9.777244567871094, "global_step": 109440, "epoch": 651} {"train_loss": -9.905834197998047, "global_step": 109441, "epoch": 651} {"train_loss": -9.665136337280273, "global_step": 109442, "epoch": 651} {"train_loss": -9.743308067321777, "global_step": 109443, "epoch": 651} {"train_loss": -9.976175308227539, "global_step": 109444, "epoch": 651} {"train_loss": -9.748432159423828, "global_step": 109445, "epoch": 651} {"train_loss": -9.713726043701172, "global_step": 109446, "epoch": 651} {"train_loss": -9.943448066711426, "global_step": 109447, "epoch": 651} {"train_loss": -9.70029067993164, "global_step": 109448, "epoch": 651} {"train_loss": -9.653369903564453, "global_step": 109449, "epoch": 651} {"train_loss": -9.735862731933594, "global_step": 109450, "epoch": 651} {"train_loss": -9.711897850036621, "global_step": 109451, "epoch": 651} {"train_loss": -9.98638916015625, "global_step": 109452, "epoch": 651} {"train_loss": -9.769159317016602, "global_step": 109453, "epoch": 651} {"train_loss": -9.942646026611328, "global_step": 109454, "epoch": 651} {"train_loss": -9.833224296569824, "global_step": 109455, "epoch": 651} {"train_loss": -10.210371017456055, "global_step": 109456, "epoch": 651} {"train_loss": -9.766087532043457, "global_step": 109457, "epoch": 651} {"train_loss": -9.87162971496582, "global_step": 109458, "epoch": 651} {"train_loss": -9.920641899108887, "global_step": 109459, "epoch": 651} {"train_loss": -10.016429901123047, "global_step": 109460, "epoch": 651} {"train_loss": -9.920270919799805, "global_step": 109461, "epoch": 651} {"train_loss": -10.09397029876709, "global_step": 109462, "epoch": 651} {"train_loss": -10.082715034484863, "global_step": 109463, "epoch": 651} {"train_loss": -9.821802139282227, "global_step": 109464, "epoch": 651} {"train_loss": -10.128410339355469, "global_step": 109465, "epoch": 651} {"train_loss": -10.069377899169922, "global_step": 109466, "epoch": 651} {"train_loss": -9.983511924743652, "global_step": 109467, "epoch": 651} {"train_loss": -10.13272762298584, "global_step": 109468, "epoch": 651} {"train_loss": -10.045440673828125, "global_step": 109469, "epoch": 651} {"train_loss": -9.876289367675781, "global_step": 109470, "epoch": 651} {"train_loss": -10.062127113342285, "global_step": 109471, "epoch": 651} {"train_loss": -9.911069869995117, "global_step": 109472, "epoch": 651} {"train_loss": -10.000619888305664, "global_step": 109473, "epoch": 651} {"train_loss": -9.53921890258789, "global_step": 109474, "epoch": 651} {"train_loss": -9.966629981994629, "global_step": 109475, "epoch": 651} {"train_loss": -9.850743293762207, "global_step": 109476, "epoch": 651} {"train_loss": -9.880905151367188, "global_step": 109477, "epoch": 651} {"train_loss": -9.693485260009766, "global_step": 109478, "epoch": 651} {"train_loss": -10.058582305908203, "global_step": 109479, "epoch": 651} {"train_loss": -10.055683135986328, "global_step": 109480, "epoch": 651} {"train_loss": -10.21528148651123, "global_step": 109481, "epoch": 651} {"train_loss": -10.092914581298828, "global_step": 109482, "epoch": 651} {"train_loss": -10.054576873779297, "global_step": 109483, "epoch": 651} {"train_loss": -10.23787784576416, "global_step": 109484, "epoch": 651} {"train_loss": -10.044910430908203, "global_step": 109485, "epoch": 651} {"train_loss": -10.05844497680664, "global_step": 109486, "epoch": 651} {"train_loss": -10.037785530090332, "global_step": 109487, "epoch": 651} {"train_loss": -9.972818374633789, "global_step": 109488, "epoch": 651} {"train_loss": -10.084297180175781, "global_step": 109489, "epoch": 651} {"train_loss": -9.994771957397461, "global_step": 109490, "epoch": 651} {"train_loss": -10.008398056030273, "global_step": 109491, "epoch": 651} {"train_loss": -10.03032112121582, "global_step": 109492, "epoch": 651} {"train_loss": -10.152345657348633, "global_step": 109493, "epoch": 651} {"train_loss": -10.058472633361816, "global_step": 109494, "epoch": 651} {"train_loss": -9.997161865234375, "global_step": 109495, "epoch": 651} {"train_loss": -9.807890892028809, "global_step": 109496, "epoch": 651} {"train_loss": -10.125871658325195, "global_step": 109497, "epoch": 651} {"train_loss": -10.213958740234375, "global_step": 109498, "epoch": 651} {"train_loss": -9.916595458984375, "global_step": 109499, "epoch": 651} {"train_loss": -10.124780654907227, "global_step": 109500, "epoch": 651} {"train_loss": -10.109780311584473, "global_step": 109501, "epoch": 651} {"train_loss": -10.14126205444336, "global_step": 109502, "epoch": 651} {"train_loss": -9.924633026123047, "global_step": 109503, "epoch": 651} {"train_loss": -10.034770965576172, "global_step": 109504, "epoch": 651} {"train_loss": -9.693693161010742, "global_step": 109505, "epoch": 651} {"train_loss": -10.116015434265137, "global_step": 109506, "epoch": 651} {"train_loss": -9.82625961303711, "global_step": 109507, "epoch": 651} {"train_loss": -10.027111053466797, "global_step": 109508, "epoch": 651} {"train_loss": -9.984870910644531, "global_step": 109509, "epoch": 651} {"train_loss": -9.944353103637695, "global_step": 109510, "epoch": 651} {"train_loss": -10.061318397521973, "global_step": 109511, "epoch": 651} {"train_loss": -9.96465015411377, "global_step": 109512, "epoch": 651} {"train_loss": -10.201055526733398, "global_step": 109513, "epoch": 651} {"train_loss": -10.017991065979004, "global_step": 109514, "epoch": 651} {"train_loss": -10.04542350769043, "global_step": 109515, "epoch": 651} {"train_loss": -10.024827003479004, "global_step": 109516, "epoch": 651} {"train_loss": -9.886911392211914, "global_step": 109517, "epoch": 651} {"train_loss": -9.94087028503418, "global_step": 109518, "epoch": 651} {"train_loss": -9.954263687133789, "global_step": 109519, "epoch": 651} {"train_loss": -10.196747779846191, "global_step": 109520, "epoch": 651} {"train_loss": -10.127607345581055, "global_step": 109521, "epoch": 651} {"train_loss": -9.793047904968262, "global_step": 109522, "epoch": 651} {"train_loss": -10.075052261352539, "global_step": 109523, "epoch": 651} {"train_loss": -10.172739028930664, "global_step": 109524, "epoch": 651} {"train_loss": -10.102405548095703, "global_step": 109525, "epoch": 651} {"train_loss": -10.17715835571289, "global_step": 109526, "epoch": 651} {"train_loss": -10.00253677368164, "global_step": 109527, "epoch": 651} {"train_loss": -9.997598648071289, "global_step": 109528, "epoch": 651} {"train_loss": -10.147634506225586, "global_step": 109529, "epoch": 651} {"train_loss": -10.31656551361084, "global_step": 109530, "epoch": 651} {"train_loss": -9.990602493286133, "global_step": 109531, "epoch": 651} {"train_loss": -9.865813255310059, "global_step": 109532, "epoch": 651} {"train_loss": -9.698920249938965, "global_step": 109533, "epoch": 651} {"train_loss": -9.86327075958252, "global_step": 109534, "epoch": 651} {"train_loss": -9.928423592022487, "global_step": 109535, "epoch": 651, "val_loss": 207800.875} {"train_loss": -9.75003433227539, "global_step": 109536, "epoch": 652} {"train_loss": -9.742510795593262, "global_step": 109537, "epoch": 652} {"train_loss": -9.393560409545898, "global_step": 109538, "epoch": 652} {"train_loss": -9.784479141235352, "global_step": 109539, "epoch": 652} {"train_loss": -9.498641014099121, "global_step": 109540, "epoch": 652} {"train_loss": -9.970662117004395, "global_step": 109541, "epoch": 652} {"train_loss": -9.964560508728027, "global_step": 109542, "epoch": 652} {"train_loss": -9.725954055786133, "global_step": 109543, "epoch": 652} {"train_loss": -9.941853523254395, "global_step": 109544, "epoch": 652} {"train_loss": -9.49428939819336, "global_step": 109545, "epoch": 652} {"train_loss": -9.970848083496094, "global_step": 109546, "epoch": 652} {"train_loss": -9.845409393310547, "global_step": 109547, "epoch": 652} {"train_loss": -9.915945053100586, "global_step": 109548, "epoch": 652} {"train_loss": -10.033422470092773, "global_step": 109549, "epoch": 652} {"train_loss": -9.636371612548828, "global_step": 109550, "epoch": 652} {"train_loss": -10.038623809814453, "global_step": 109551, "epoch": 652} {"train_loss": -9.941693305969238, "global_step": 109552, "epoch": 652} {"train_loss": -10.014694213867188, "global_step": 109553, "epoch": 652} {"train_loss": -10.004535675048828, "global_step": 109554, "epoch": 652} {"train_loss": -9.617671012878418, "global_step": 109555, "epoch": 652} {"train_loss": -9.79626750946045, "global_step": 109556, "epoch": 652} {"train_loss": -10.100961685180664, "global_step": 109557, "epoch": 652} {"train_loss": -9.94291877746582, "global_step": 109558, "epoch": 652} {"train_loss": -9.868156433105469, "global_step": 109559, "epoch": 652} {"train_loss": -10.012012481689453, "global_step": 109560, "epoch": 652} {"train_loss": -10.10690689086914, "global_step": 109561, "epoch": 652} {"train_loss": -9.890324592590332, "global_step": 109562, "epoch": 652} {"train_loss": -9.748880386352539, "global_step": 109563, "epoch": 652} {"train_loss": -10.128676414489746, "global_step": 109564, "epoch": 652} {"train_loss": -9.797002792358398, "global_step": 109565, "epoch": 652} {"train_loss": -10.166500091552734, "global_step": 109566, "epoch": 652} {"train_loss": -10.057647705078125, "global_step": 109567, "epoch": 652} {"train_loss": -9.902868270874023, "global_step": 109568, "epoch": 652} {"train_loss": -9.954025268554688, "global_step": 109569, "epoch": 652} {"train_loss": -10.161478042602539, "global_step": 109570, "epoch": 652} {"train_loss": -10.097236633300781, "global_step": 109571, "epoch": 652} {"train_loss": -9.823180198669434, "global_step": 109572, "epoch": 652} {"train_loss": -9.845990180969238, "global_step": 109573, "epoch": 652} {"train_loss": -9.702727317810059, "global_step": 109574, "epoch": 652} {"train_loss": -10.025949478149414, "global_step": 109575, "epoch": 652} {"train_loss": -9.719220161437988, "global_step": 109576, "epoch": 652} {"train_loss": -9.815813064575195, "global_step": 109577, "epoch": 652} {"train_loss": -9.909433364868164, "global_step": 109578, "epoch": 652} {"train_loss": -9.713274002075195, "global_step": 109579, "epoch": 652} {"train_loss": -9.991704940795898, "global_step": 109580, "epoch": 652} {"train_loss": -9.424121856689453, "global_step": 109581, "epoch": 652} {"train_loss": -9.980236053466797, "global_step": 109582, "epoch": 652} {"train_loss": -9.741660118103027, "global_step": 109583, "epoch": 652} {"train_loss": -9.653031349182129, "global_step": 109584, "epoch": 652} {"train_loss": -9.924605369567871, "global_step": 109585, "epoch": 652} {"train_loss": -9.909093856811523, "global_step": 109586, "epoch": 652} {"train_loss": -9.54017448425293, "global_step": 109587, "epoch": 652} {"train_loss": -9.857269287109375, "global_step": 109588, "epoch": 652} {"train_loss": -9.942850112915039, "global_step": 109589, "epoch": 652} {"train_loss": -9.113950729370117, "global_step": 109590, "epoch": 652} {"train_loss": -9.509843826293945, "global_step": 109591, "epoch": 652} {"train_loss": -8.994818687438965, "global_step": 109592, "epoch": 652} {"train_loss": -9.303014755249023, "global_step": 109593, "epoch": 652} {"train_loss": -9.572000503540039, "global_step": 109594, "epoch": 652} {"train_loss": -9.851829528808594, "global_step": 109595, "epoch": 652} {"train_loss": -9.505220413208008, "global_step": 109596, "epoch": 652} {"train_loss": -9.849103927612305, "global_step": 109597, "epoch": 652} {"train_loss": -9.25766372680664, "global_step": 109598, "epoch": 652} {"train_loss": -9.905791282653809, "global_step": 109599, "epoch": 652} {"train_loss": -9.511054992675781, "global_step": 109600, "epoch": 652} {"train_loss": -9.796278953552246, "global_step": 109601, "epoch": 652} {"train_loss": -9.421874046325684, "global_step": 109602, "epoch": 652} {"train_loss": -9.669886589050293, "global_step": 109603, "epoch": 652} {"train_loss": -9.680120468139648, "global_step": 109604, "epoch": 652} {"train_loss": -9.925920486450195, "global_step": 109605, "epoch": 652} {"train_loss": -9.538728713989258, "global_step": 109606, "epoch": 652} {"train_loss": -10.04647445678711, "global_step": 109607, "epoch": 652} {"train_loss": -9.7171049118042, "global_step": 109608, "epoch": 652} {"train_loss": -9.809879302978516, "global_step": 109609, "epoch": 652} {"train_loss": -9.960412979125977, "global_step": 109610, "epoch": 652} {"train_loss": -9.978231430053711, "global_step": 109611, "epoch": 652} {"train_loss": -9.924589157104492, "global_step": 109612, "epoch": 652} {"train_loss": -9.908580780029297, "global_step": 109613, "epoch": 652} {"train_loss": -9.908767700195312, "global_step": 109614, "epoch": 652} {"train_loss": -9.933094024658203, "global_step": 109615, "epoch": 652} {"train_loss": -9.871148109436035, "global_step": 109616, "epoch": 652} {"train_loss": -9.749287605285645, "global_step": 109617, "epoch": 652} {"train_loss": -9.902841567993164, "global_step": 109618, "epoch": 652} {"train_loss": -10.006038665771484, "global_step": 109619, "epoch": 652} {"train_loss": -10.017784118652344, "global_step": 109620, "epoch": 652} {"train_loss": -9.227354049682617, "global_step": 109621, "epoch": 652} {"train_loss": -9.65331745147705, "global_step": 109622, "epoch": 652} {"train_loss": -9.426753044128418, "global_step": 109623, "epoch": 652} {"train_loss": -9.606422424316406, "global_step": 109624, "epoch": 652} {"train_loss": -9.401987075805664, "global_step": 109625, "epoch": 652} {"train_loss": -9.494606971740723, "global_step": 109626, "epoch": 652} {"train_loss": -9.90837287902832, "global_step": 109627, "epoch": 652} {"train_loss": -9.587244033813477, "global_step": 109628, "epoch": 652} {"train_loss": -9.73558521270752, "global_step": 109629, "epoch": 652} {"train_loss": -9.72743034362793, "global_step": 109630, "epoch": 652} {"train_loss": -9.781225204467773, "global_step": 109631, "epoch": 652} {"train_loss": -9.584939956665039, "global_step": 109632, "epoch": 652} {"train_loss": -9.747295379638672, "global_step": 109633, "epoch": 652} {"train_loss": -9.755733489990234, "global_step": 109634, "epoch": 652} {"train_loss": -9.701946258544922, "global_step": 109635, "epoch": 652} {"train_loss": -9.687607765197754, "global_step": 109636, "epoch": 652} {"train_loss": -9.88014030456543, "global_step": 109637, "epoch": 652} {"train_loss": -9.878965377807617, "global_step": 109638, "epoch": 652} {"train_loss": -10.002299308776855, "global_step": 109639, "epoch": 652} {"train_loss": -9.74524211883545, "global_step": 109640, "epoch": 652} {"train_loss": -9.629583358764648, "global_step": 109641, "epoch": 652} {"train_loss": -9.997193336486816, "global_step": 109642, "epoch": 652} {"train_loss": -9.436620712280273, "global_step": 109643, "epoch": 652} {"train_loss": -10.112110137939453, "global_step": 109644, "epoch": 652} {"train_loss": -9.847549438476562, "global_step": 109645, "epoch": 652} {"train_loss": -9.939181327819824, "global_step": 109646, "epoch": 652} {"train_loss": -9.490100860595703, "global_step": 109647, "epoch": 652} {"train_loss": -9.758430480957031, "global_step": 109648, "epoch": 652} {"train_loss": -9.109092712402344, "global_step": 109649, "epoch": 652} {"train_loss": -10.010103225708008, "global_step": 109650, "epoch": 652} {"train_loss": -9.204469680786133, "global_step": 109651, "epoch": 652} {"train_loss": -10.210027694702148, "global_step": 109652, "epoch": 652} {"train_loss": -9.656017303466797, "global_step": 109653, "epoch": 652} {"train_loss": -10.047368049621582, "global_step": 109654, "epoch": 652} {"train_loss": -9.530163764953613, "global_step": 109655, "epoch": 652} {"train_loss": -9.778560638427734, "global_step": 109656, "epoch": 652} {"train_loss": -9.772907257080078, "global_step": 109657, "epoch": 652} {"train_loss": -10.095940589904785, "global_step": 109658, "epoch": 652} {"train_loss": -9.669820785522461, "global_step": 109659, "epoch": 652} {"train_loss": -9.948137283325195, "global_step": 109660, "epoch": 652} {"train_loss": -9.706498146057129, "global_step": 109661, "epoch": 652} {"train_loss": -9.622589111328125, "global_step": 109662, "epoch": 652} {"train_loss": -9.947042465209961, "global_step": 109663, "epoch": 652} {"train_loss": -9.805414199829102, "global_step": 109664, "epoch": 652} {"train_loss": -9.72032356262207, "global_step": 109665, "epoch": 652} {"train_loss": -9.964624404907227, "global_step": 109666, "epoch": 652} {"train_loss": -9.761190414428711, "global_step": 109667, "epoch": 652} {"train_loss": -9.854117393493652, "global_step": 109668, "epoch": 652} {"train_loss": -10.05700397491455, "global_step": 109669, "epoch": 652} {"train_loss": -9.947826385498047, "global_step": 109670, "epoch": 652} {"train_loss": -9.896139144897461, "global_step": 109671, "epoch": 652} {"train_loss": -10.079980850219727, "global_step": 109672, "epoch": 652} {"train_loss": -9.936287879943848, "global_step": 109673, "epoch": 652} {"train_loss": -9.893099784851074, "global_step": 109674, "epoch": 652} {"train_loss": -10.079870223999023, "global_step": 109675, "epoch": 652} {"train_loss": -10.028003692626953, "global_step": 109676, "epoch": 652} {"train_loss": -10.006523132324219, "global_step": 109677, "epoch": 652} {"train_loss": -9.546930313110352, "global_step": 109678, "epoch": 652} {"train_loss": -9.974528312683105, "global_step": 109679, "epoch": 652} {"train_loss": -9.76019287109375, "global_step": 109680, "epoch": 652} {"train_loss": -10.10658073425293, "global_step": 109681, "epoch": 652} {"train_loss": -9.816030502319336, "global_step": 109682, "epoch": 652} {"train_loss": -10.027673721313477, "global_step": 109683, "epoch": 652} {"train_loss": -10.013971328735352, "global_step": 109684, "epoch": 652} {"train_loss": -9.978879928588867, "global_step": 109685, "epoch": 652} {"train_loss": -9.892379760742188, "global_step": 109686, "epoch": 652} {"train_loss": -9.695781707763672, "global_step": 109687, "epoch": 652} {"train_loss": -10.299793243408203, "global_step": 109688, "epoch": 652} {"train_loss": -10.341024398803711, "global_step": 109689, "epoch": 652} {"train_loss": -10.14781665802002, "global_step": 109690, "epoch": 652} {"train_loss": -9.84337329864502, "global_step": 109691, "epoch": 652} {"train_loss": -10.296557426452637, "global_step": 109692, "epoch": 652} {"train_loss": -9.984671592712402, "global_step": 109693, "epoch": 652} {"train_loss": -9.643943786621094, "global_step": 109694, "epoch": 652} {"train_loss": -10.36003303527832, "global_step": 109695, "epoch": 652} {"train_loss": -9.85730266571045, "global_step": 109696, "epoch": 652} {"train_loss": -10.070444107055664, "global_step": 109697, "epoch": 652} {"train_loss": -9.978997230529785, "global_step": 109698, "epoch": 652} {"train_loss": -9.785292625427246, "global_step": 109699, "epoch": 652} {"train_loss": -10.205709457397461, "global_step": 109700, "epoch": 652} {"train_loss": -9.554985046386719, "global_step": 109701, "epoch": 652} {"train_loss": -9.346549987792969, "global_step": 109702, "epoch": 652} {"train_loss": -9.815371712048849, "global_step": 109703, "epoch": 652, "val_loss": 211550.75} {"train_loss": -9.865646362304688, "global_step": 109704, "epoch": 653} {"train_loss": -9.651156425476074, "global_step": 109705, "epoch": 653} {"train_loss": -9.648591995239258, "global_step": 109706, "epoch": 653} {"train_loss": -10.074528694152832, "global_step": 109707, "epoch": 653} {"train_loss": -9.69180965423584, "global_step": 109708, "epoch": 653} {"train_loss": -9.595773696899414, "global_step": 109709, "epoch": 653} {"train_loss": -10.092899322509766, "global_step": 109710, "epoch": 653} {"train_loss": -9.098480224609375, "global_step": 109711, "epoch": 653} {"train_loss": -9.973841667175293, "global_step": 109712, "epoch": 653} {"train_loss": -9.492565155029297, "global_step": 109713, "epoch": 653} {"train_loss": -9.750875473022461, "global_step": 109714, "epoch": 653} {"train_loss": -9.72746753692627, "global_step": 109715, "epoch": 653} {"train_loss": -9.695320129394531, "global_step": 109716, "epoch": 653} {"train_loss": -9.772493362426758, "global_step": 109717, "epoch": 653} {"train_loss": -10.007735252380371, "global_step": 109718, "epoch": 653} {"train_loss": -9.965824127197266, "global_step": 109719, "epoch": 653} {"train_loss": -9.686659812927246, "global_step": 109720, "epoch": 653} {"train_loss": -9.851058959960938, "global_step": 109721, "epoch": 653} {"train_loss": -9.771085739135742, "global_step": 109722, "epoch": 653} {"train_loss": -10.09542179107666, "global_step": 109723, "epoch": 653} {"train_loss": -9.657378196716309, "global_step": 109724, "epoch": 653} {"train_loss": -10.013958930969238, "global_step": 109725, "epoch": 653} {"train_loss": -9.620452880859375, "global_step": 109726, "epoch": 653} {"train_loss": -9.77849006652832, "global_step": 109727, "epoch": 653} {"train_loss": -9.849309921264648, "global_step": 109728, "epoch": 653} {"train_loss": -9.697550773620605, "global_step": 109729, "epoch": 653} {"train_loss": -9.965166091918945, "global_step": 109730, "epoch": 653} {"train_loss": -10.056831359863281, "global_step": 109731, "epoch": 653} {"train_loss": -9.888731002807617, "global_step": 109732, "epoch": 653} {"train_loss": -10.034137725830078, "global_step": 109733, "epoch": 653} {"train_loss": -9.944822311401367, "global_step": 109734, "epoch": 653} {"train_loss": -9.854982376098633, "global_step": 109735, "epoch": 653} {"train_loss": -10.196722030639648, "global_step": 109736, "epoch": 653} {"train_loss": -10.023908615112305, "global_step": 109737, "epoch": 653} {"train_loss": -9.996969223022461, "global_step": 109738, "epoch": 653} {"train_loss": -9.984447479248047, "global_step": 109739, "epoch": 653} {"train_loss": -9.80080795288086, "global_step": 109740, "epoch": 653} {"train_loss": -10.131826400756836, "global_step": 109741, "epoch": 653} {"train_loss": -10.004963874816895, "global_step": 109742, "epoch": 653} {"train_loss": -10.021730422973633, "global_step": 109743, "epoch": 653} {"train_loss": -10.014581680297852, "global_step": 109744, "epoch": 653} {"train_loss": -9.2938814163208, "global_step": 109745, "epoch": 653} {"train_loss": -10.337867736816406, "global_step": 109746, "epoch": 653} {"train_loss": -9.431636810302734, "global_step": 109747, "epoch": 653} {"train_loss": -9.850008010864258, "global_step": 109748, "epoch": 653} {"train_loss": -9.77437686920166, "global_step": 109749, "epoch": 653} {"train_loss": -9.398177146911621, "global_step": 109750, "epoch": 653} {"train_loss": -9.942449569702148, "global_step": 109751, "epoch": 653} {"train_loss": -9.812721252441406, "global_step": 109752, "epoch": 653} {"train_loss": -9.845842361450195, "global_step": 109753, "epoch": 653} {"train_loss": -10.385459899902344, "global_step": 109754, "epoch": 653} {"train_loss": -9.881324768066406, "global_step": 109755, "epoch": 653} {"train_loss": -10.251961708068848, "global_step": 109756, "epoch": 653} {"train_loss": -10.043054580688477, "global_step": 109757, "epoch": 653} {"train_loss": -10.115592002868652, "global_step": 109758, "epoch": 653} {"train_loss": -9.878775596618652, "global_step": 109759, "epoch": 653} {"train_loss": -10.173175811767578, "global_step": 109760, "epoch": 653} {"train_loss": -9.990253448486328, "global_step": 109761, "epoch": 653} {"train_loss": -10.063594818115234, "global_step": 109762, "epoch": 653} {"train_loss": -10.291141510009766, "global_step": 109763, "epoch": 653} {"train_loss": -10.125141143798828, "global_step": 109764, "epoch": 653} {"train_loss": -10.29196834564209, "global_step": 109765, "epoch": 653} {"train_loss": -10.012031555175781, "global_step": 109766, "epoch": 653} {"train_loss": -10.200650215148926, "global_step": 109767, "epoch": 653} {"train_loss": -10.044839859008789, "global_step": 109768, "epoch": 653} {"train_loss": -10.061332702636719, "global_step": 109769, "epoch": 653} {"train_loss": -9.788481712341309, "global_step": 109770, "epoch": 653} {"train_loss": -10.039302825927734, "global_step": 109771, "epoch": 653} {"train_loss": -9.725223541259766, "global_step": 109772, "epoch": 653} {"train_loss": -9.098090171813965, "global_step": 109773, "epoch": 653} {"train_loss": -10.013398170471191, "global_step": 109774, "epoch": 653} {"train_loss": -9.331911087036133, "global_step": 109775, "epoch": 653} {"train_loss": -9.608799934387207, "global_step": 109776, "epoch": 653} {"train_loss": -9.09543514251709, "global_step": 109777, "epoch": 653} {"train_loss": -9.182069778442383, "global_step": 109778, "epoch": 653} {"train_loss": -9.770360946655273, "global_step": 109779, "epoch": 653} {"train_loss": -9.146668434143066, "global_step": 109780, "epoch": 653} {"train_loss": -9.511346817016602, "global_step": 109781, "epoch": 653} {"train_loss": -8.821039199829102, "global_step": 109782, "epoch": 653} {"train_loss": -9.417073249816895, "global_step": 109783, "epoch": 653} {"train_loss": -8.943546295166016, "global_step": 109784, "epoch": 653} {"train_loss": -9.35873031616211, "global_step": 109785, "epoch": 653} {"train_loss": -9.009462356567383, "global_step": 109786, "epoch": 653} {"train_loss": -9.282440185546875, "global_step": 109787, "epoch": 653} {"train_loss": -9.369738578796387, "global_step": 109788, "epoch": 653} {"train_loss": -8.885822296142578, "global_step": 109789, "epoch": 653} {"train_loss": -9.417423248291016, "global_step": 109790, "epoch": 653} {"train_loss": -9.743673324584961, "global_step": 109791, "epoch": 653} {"train_loss": -9.135595321655273, "global_step": 109792, "epoch": 653} {"train_loss": -9.417060852050781, "global_step": 109793, "epoch": 653} {"train_loss": -9.568872451782227, "global_step": 109794, "epoch": 653} {"train_loss": -9.491605758666992, "global_step": 109795, "epoch": 653} {"train_loss": -9.51605224609375, "global_step": 109796, "epoch": 653} {"train_loss": -9.286968231201172, "global_step": 109797, "epoch": 653} {"train_loss": -9.735811233520508, "global_step": 109798, "epoch": 653} {"train_loss": -9.494768142700195, "global_step": 109799, "epoch": 653} {"train_loss": -9.659395217895508, "global_step": 109800, "epoch": 653} {"train_loss": -9.615592956542969, "global_step": 109801, "epoch": 653} {"train_loss": -9.72995662689209, "global_step": 109802, "epoch": 653} {"train_loss": -9.6331148147583, "global_step": 109803, "epoch": 653} {"train_loss": -8.842422485351562, "global_step": 109804, "epoch": 653} {"train_loss": -9.974231719970703, "global_step": 109805, "epoch": 653} {"train_loss": -9.539009094238281, "global_step": 109806, "epoch": 653} {"train_loss": -9.795206069946289, "global_step": 109807, "epoch": 653} {"train_loss": -9.783535957336426, "global_step": 109808, "epoch": 653} {"train_loss": -9.789135932922363, "global_step": 109809, "epoch": 653} {"train_loss": -9.886224746704102, "global_step": 109810, "epoch": 653} {"train_loss": -9.921871185302734, "global_step": 109811, "epoch": 653} {"train_loss": -9.812427520751953, "global_step": 109812, "epoch": 653} {"train_loss": -10.073050498962402, "global_step": 109813, "epoch": 653} {"train_loss": -10.092121124267578, "global_step": 109814, "epoch": 653} {"train_loss": -9.786009788513184, "global_step": 109815, "epoch": 653} {"train_loss": -9.939704895019531, "global_step": 109816, "epoch": 653} {"train_loss": -9.896537780761719, "global_step": 109817, "epoch": 653} {"train_loss": -9.908011436462402, "global_step": 109818, "epoch": 653} {"train_loss": -9.952249526977539, "global_step": 109819, "epoch": 653} {"train_loss": -9.837750434875488, "global_step": 109820, "epoch": 653} {"train_loss": -10.052125930786133, "global_step": 109821, "epoch": 653} {"train_loss": -9.98609447479248, "global_step": 109822, "epoch": 653} {"train_loss": -9.980606079101562, "global_step": 109823, "epoch": 653} {"train_loss": -10.280450820922852, "global_step": 109824, "epoch": 653} {"train_loss": -9.789101600646973, "global_step": 109825, "epoch": 653} {"train_loss": -9.728367805480957, "global_step": 109826, "epoch": 653} {"train_loss": -10.070568084716797, "global_step": 109827, "epoch": 653} {"train_loss": -9.629966735839844, "global_step": 109828, "epoch": 653} {"train_loss": -9.978083610534668, "global_step": 109829, "epoch": 653} {"train_loss": -10.049373626708984, "global_step": 109830, "epoch": 653} {"train_loss": -9.97187328338623, "global_step": 109831, "epoch": 653} {"train_loss": -10.160537719726562, "global_step": 109832, "epoch": 653} {"train_loss": -10.030799865722656, "global_step": 109833, "epoch": 653} {"train_loss": -10.022859573364258, "global_step": 109834, "epoch": 653} {"train_loss": -10.108779907226562, "global_step": 109835, "epoch": 653} {"train_loss": -10.099702835083008, "global_step": 109836, "epoch": 653} {"train_loss": -9.993467330932617, "global_step": 109837, "epoch": 653} {"train_loss": -9.980152130126953, "global_step": 109838, "epoch": 653} {"train_loss": -10.259575843811035, "global_step": 109839, "epoch": 653} {"train_loss": -10.075809478759766, "global_step": 109840, "epoch": 653} {"train_loss": -10.022747039794922, "global_step": 109841, "epoch": 653} {"train_loss": -10.101228713989258, "global_step": 109842, "epoch": 653} {"train_loss": -10.05838394165039, "global_step": 109843, "epoch": 653} {"train_loss": -10.007450103759766, "global_step": 109844, "epoch": 653} {"train_loss": -9.704121589660645, "global_step": 109845, "epoch": 653} {"train_loss": -9.969724655151367, "global_step": 109846, "epoch": 653} {"train_loss": -9.878501892089844, "global_step": 109847, "epoch": 653} {"train_loss": -9.661046981811523, "global_step": 109848, "epoch": 653} {"train_loss": -9.118867874145508, "global_step": 109849, "epoch": 653} {"train_loss": -10.024040222167969, "global_step": 109850, "epoch": 653} {"train_loss": -9.024068832397461, "global_step": 109851, "epoch": 653} {"train_loss": -9.875582695007324, "global_step": 109852, "epoch": 653} {"train_loss": -9.913766860961914, "global_step": 109853, "epoch": 653} {"train_loss": -9.516937255859375, "global_step": 109854, "epoch": 653} {"train_loss": -9.4047212600708, "global_step": 109855, "epoch": 653} {"train_loss": -8.965778350830078, "global_step": 109856, "epoch": 653} {"train_loss": -9.708442687988281, "global_step": 109857, "epoch": 653} {"train_loss": -9.78157901763916, "global_step": 109858, "epoch": 653} {"train_loss": -9.504725456237793, "global_step": 109859, "epoch": 653} {"train_loss": -9.578857421875, "global_step": 109860, "epoch": 653} {"train_loss": -9.871698379516602, "global_step": 109861, "epoch": 653} {"train_loss": -9.8006010055542, "global_step": 109862, "epoch": 653} {"train_loss": -9.917278289794922, "global_step": 109863, "epoch": 653} {"train_loss": -9.915029525756836, "global_step": 109864, "epoch": 653} {"train_loss": -9.761163711547852, "global_step": 109865, "epoch": 653} {"train_loss": -10.126035690307617, "global_step": 109866, "epoch": 653} {"train_loss": -9.60851001739502, "global_step": 109867, "epoch": 653} {"train_loss": -9.953073501586914, "global_step": 109868, "epoch": 653} {"train_loss": -9.849931716918945, "global_step": 109869, "epoch": 653} {"train_loss": -9.974611282348633, "global_step": 109870, "epoch": 653} {"train_loss": -9.785753340948196, "global_step": 109871, "epoch": 653, "val_loss": 210620.171875} {"train_loss": -9.860801696777344, "global_step": 109872, "epoch": 654} {"train_loss": -9.796582221984863, "global_step": 109873, "epoch": 654} {"train_loss": -10.160406112670898, "global_step": 109874, "epoch": 654} {"train_loss": -9.909098625183105, "global_step": 109875, "epoch": 654} {"train_loss": -10.251861572265625, "global_step": 109876, "epoch": 654} {"train_loss": -10.026208877563477, "global_step": 109877, "epoch": 654} {"train_loss": -10.076891899108887, "global_step": 109878, "epoch": 654} {"train_loss": -9.960515975952148, "global_step": 109879, "epoch": 654} {"train_loss": -10.044380187988281, "global_step": 109880, "epoch": 654} {"train_loss": -10.182321548461914, "global_step": 109881, "epoch": 654} {"train_loss": -9.795984268188477, "global_step": 109882, "epoch": 654} {"train_loss": -10.078590393066406, "global_step": 109883, "epoch": 654} {"train_loss": -10.13949966430664, "global_step": 109884, "epoch": 654} {"train_loss": -9.974895477294922, "global_step": 109885, "epoch": 654} {"train_loss": -9.955161094665527, "global_step": 109886, "epoch": 654} {"train_loss": -10.0117826461792, "global_step": 109887, "epoch": 654} {"train_loss": -10.072786331176758, "global_step": 109888, "epoch": 654} {"train_loss": -10.012208938598633, "global_step": 109889, "epoch": 654} {"train_loss": -10.280317306518555, "global_step": 109890, "epoch": 654} {"train_loss": -9.870372772216797, "global_step": 109891, "epoch": 654} {"train_loss": -10.145425796508789, "global_step": 109892, "epoch": 654} {"train_loss": -10.047811508178711, "global_step": 109893, "epoch": 654} {"train_loss": -9.991340637207031, "global_step": 109894, "epoch": 654} {"train_loss": -9.947948455810547, "global_step": 109895, "epoch": 654} {"train_loss": -10.180435180664062, "global_step": 109896, "epoch": 654} {"train_loss": -9.874288558959961, "global_step": 109897, "epoch": 654} {"train_loss": -9.893793106079102, "global_step": 109898, "epoch": 654} {"train_loss": -9.798341751098633, "global_step": 109899, "epoch": 654} {"train_loss": -9.726933479309082, "global_step": 109900, "epoch": 654} {"train_loss": -9.324714660644531, "global_step": 109901, "epoch": 654} {"train_loss": -9.969090461730957, "global_step": 109902, "epoch": 654} {"train_loss": -9.687284469604492, "global_step": 109903, "epoch": 654} {"train_loss": -9.66851806640625, "global_step": 109904, "epoch": 654} {"train_loss": -9.289087295532227, "global_step": 109905, "epoch": 654} {"train_loss": -9.469788551330566, "global_step": 109906, "epoch": 654} {"train_loss": -8.860651969909668, "global_step": 109907, "epoch": 654} {"train_loss": -9.233959197998047, "global_step": 109908, "epoch": 654} {"train_loss": -9.361576080322266, "global_step": 109909, "epoch": 654} {"train_loss": -9.308039665222168, "global_step": 109910, "epoch": 654} {"train_loss": -9.577985763549805, "global_step": 109911, "epoch": 654} {"train_loss": -9.811792373657227, "global_step": 109912, "epoch": 654} {"train_loss": -9.490339279174805, "global_step": 109913, "epoch": 654} {"train_loss": -9.846248626708984, "global_step": 109914, "epoch": 654} {"train_loss": -9.41285228729248, "global_step": 109915, "epoch": 654} {"train_loss": -9.605049133300781, "global_step": 109916, "epoch": 654} {"train_loss": -9.725662231445312, "global_step": 109917, "epoch": 654} {"train_loss": -9.737920761108398, "global_step": 109918, "epoch": 654} {"train_loss": -9.495317459106445, "global_step": 109919, "epoch": 654} {"train_loss": -9.916364669799805, "global_step": 109920, "epoch": 654} {"train_loss": -9.539468765258789, "global_step": 109921, "epoch": 654} {"train_loss": -9.443426132202148, "global_step": 109922, "epoch": 654} {"train_loss": -9.889814376831055, "global_step": 109923, "epoch": 654} {"train_loss": -9.772823333740234, "global_step": 109924, "epoch": 654} {"train_loss": -10.08430290222168, "global_step": 109925, "epoch": 654} {"train_loss": -9.998305320739746, "global_step": 109926, "epoch": 654} {"train_loss": -9.832511901855469, "global_step": 109927, "epoch": 654} {"train_loss": -9.774093627929688, "global_step": 109928, "epoch": 654} {"train_loss": -10.11910629272461, "global_step": 109929, "epoch": 654} {"train_loss": -9.70975112915039, "global_step": 109930, "epoch": 654} {"train_loss": -9.945978164672852, "global_step": 109931, "epoch": 654} {"train_loss": -9.86568546295166, "global_step": 109932, "epoch": 654} {"train_loss": -9.786160469055176, "global_step": 109933, "epoch": 654} {"train_loss": -10.122769355773926, "global_step": 109934, "epoch": 654} {"train_loss": -9.922723770141602, "global_step": 109935, "epoch": 654} {"train_loss": -10.066511154174805, "global_step": 109936, "epoch": 654} {"train_loss": -10.276788711547852, "global_step": 109937, "epoch": 654} {"train_loss": -10.102336883544922, "global_step": 109938, "epoch": 654} {"train_loss": -9.880559921264648, "global_step": 109939, "epoch": 654} {"train_loss": -9.945810317993164, "global_step": 109940, "epoch": 654} {"train_loss": -9.889566421508789, "global_step": 109941, "epoch": 654} {"train_loss": -9.947127342224121, "global_step": 109942, "epoch": 654} {"train_loss": -9.981961250305176, "global_step": 109943, "epoch": 654} {"train_loss": -10.030050277709961, "global_step": 109944, "epoch": 654} {"train_loss": -10.207554817199707, "global_step": 109945, "epoch": 654} {"train_loss": -10.045684814453125, "global_step": 109946, "epoch": 654} {"train_loss": -9.954381942749023, "global_step": 109947, "epoch": 654} {"train_loss": -10.080657005310059, "global_step": 109948, "epoch": 654} {"train_loss": -10.307910919189453, "global_step": 109949, "epoch": 654} {"train_loss": -9.56514835357666, "global_step": 109950, "epoch": 654} {"train_loss": -9.942212104797363, "global_step": 109951, "epoch": 654} {"train_loss": -9.764400482177734, "global_step": 109952, "epoch": 654} {"train_loss": -10.248826026916504, "global_step": 109953, "epoch": 654} {"train_loss": -9.874221801757812, "global_step": 109954, "epoch": 654} {"train_loss": -9.705564498901367, "global_step": 109955, "epoch": 654} {"train_loss": -10.121345520019531, "global_step": 109956, "epoch": 654} {"train_loss": -9.845146179199219, "global_step": 109957, "epoch": 654} {"train_loss": -10.013744354248047, "global_step": 109958, "epoch": 654} {"train_loss": -10.049230575561523, "global_step": 109959, "epoch": 654} {"train_loss": -9.92330551147461, "global_step": 109960, "epoch": 654} {"train_loss": -10.034244537353516, "global_step": 109961, "epoch": 654} {"train_loss": -9.694835662841797, "global_step": 109962, "epoch": 654} {"train_loss": -9.842695236206055, "global_step": 109963, "epoch": 654} {"train_loss": -9.713750839233398, "global_step": 109964, "epoch": 654} {"train_loss": -10.100960731506348, "global_step": 109965, "epoch": 654} {"train_loss": -9.802294731140137, "global_step": 109966, "epoch": 654} {"train_loss": -9.722770690917969, "global_step": 109967, "epoch": 654} {"train_loss": -9.716991424560547, "global_step": 109968, "epoch": 654} {"train_loss": -9.857455253601074, "global_step": 109969, "epoch": 654} {"train_loss": -9.611064910888672, "global_step": 109970, "epoch": 654} {"train_loss": -9.887547492980957, "global_step": 109971, "epoch": 654} {"train_loss": -9.498271942138672, "global_step": 109972, "epoch": 654} {"train_loss": -9.828595161437988, "global_step": 109973, "epoch": 654} {"train_loss": -9.569154739379883, "global_step": 109974, "epoch": 654} {"train_loss": -9.66923999786377, "global_step": 109975, "epoch": 654} {"train_loss": -9.873601913452148, "global_step": 109976, "epoch": 654} {"train_loss": -9.471576690673828, "global_step": 109977, "epoch": 654} {"train_loss": -10.114253044128418, "global_step": 109978, "epoch": 654} {"train_loss": -9.577981948852539, "global_step": 109979, "epoch": 654} {"train_loss": -9.9376859664917, "global_step": 109980, "epoch": 654} {"train_loss": -9.717936515808105, "global_step": 109981, "epoch": 654} {"train_loss": -9.934690475463867, "global_step": 109982, "epoch": 654} {"train_loss": -9.678178787231445, "global_step": 109983, "epoch": 654} {"train_loss": -9.961749076843262, "global_step": 109984, "epoch": 654} {"train_loss": -9.539300918579102, "global_step": 109985, "epoch": 654} {"train_loss": -9.841160774230957, "global_step": 109986, "epoch": 654} {"train_loss": -9.470443725585938, "global_step": 109987, "epoch": 654} {"train_loss": -9.903535842895508, "global_step": 109988, "epoch": 654} {"train_loss": -9.624307632446289, "global_step": 109989, "epoch": 654} {"train_loss": -9.64069652557373, "global_step": 109990, "epoch": 654} {"train_loss": -10.146438598632812, "global_step": 109991, "epoch": 654} {"train_loss": -9.649099349975586, "global_step": 109992, "epoch": 654} {"train_loss": -9.956388473510742, "global_step": 109993, "epoch": 654} {"train_loss": -9.77414321899414, "global_step": 109994, "epoch": 654} {"train_loss": -9.827207565307617, "global_step": 109995, "epoch": 654} {"train_loss": -9.881093978881836, "global_step": 109996, "epoch": 654} {"train_loss": -9.700508117675781, "global_step": 109997, "epoch": 654} {"train_loss": -9.969317436218262, "global_step": 109998, "epoch": 654} {"train_loss": -10.08969783782959, "global_step": 109999, "epoch": 654} {"train_loss": -10.087831497192383, "global_step": 110000, "epoch": 654} {"train_loss": -10.082759857177734, "global_step": 110001, "epoch": 654} {"train_loss": -9.976871490478516, "global_step": 110002, "epoch": 654} {"train_loss": -9.878887176513672, "global_step": 110003, "epoch": 654} {"train_loss": -9.864709854125977, "global_step": 110004, "epoch": 654} {"train_loss": -9.992608070373535, "global_step": 110005, "epoch": 654} {"train_loss": -10.025466918945312, "global_step": 110006, "epoch": 654} {"train_loss": -9.919609069824219, "global_step": 110007, "epoch": 654} {"train_loss": -9.956467628479004, "global_step": 110008, "epoch": 654} {"train_loss": -10.275910377502441, "global_step": 110009, "epoch": 654} {"train_loss": -9.974699974060059, "global_step": 110010, "epoch": 654} {"train_loss": -10.243460655212402, "global_step": 110011, "epoch": 654} {"train_loss": -10.124235153198242, "global_step": 110012, "epoch": 654} {"train_loss": -9.998101234436035, "global_step": 110013, "epoch": 654} {"train_loss": -10.044997215270996, "global_step": 110014, "epoch": 654} {"train_loss": -10.152205467224121, "global_step": 110015, "epoch": 654} {"train_loss": -10.007758140563965, "global_step": 110016, "epoch": 654} {"train_loss": -9.836727142333984, "global_step": 110017, "epoch": 654} {"train_loss": -10.110040664672852, "global_step": 110018, "epoch": 654} {"train_loss": -9.854723930358887, "global_step": 110019, "epoch": 654} {"train_loss": -10.143608093261719, "global_step": 110020, "epoch": 654} {"train_loss": -10.04387092590332, "global_step": 110021, "epoch": 654} {"train_loss": -10.26536750793457, "global_step": 110022, "epoch": 654} {"train_loss": -10.023898124694824, "global_step": 110023, "epoch": 654} {"train_loss": -10.164072036743164, "global_step": 110024, "epoch": 654} {"train_loss": -10.004111289978027, "global_step": 110025, "epoch": 654} {"train_loss": -10.24264907836914, "global_step": 110026, "epoch": 654} {"train_loss": -10.132949829101562, "global_step": 110027, "epoch": 654} {"train_loss": -10.009380340576172, "global_step": 110028, "epoch": 654} {"train_loss": -10.139704704284668, "global_step": 110029, "epoch": 654} {"train_loss": -10.083686828613281, "global_step": 110030, "epoch": 654} {"train_loss": -9.729007720947266, "global_step": 110031, "epoch": 654} {"train_loss": -10.108392715454102, "global_step": 110032, "epoch": 654} {"train_loss": -9.734946250915527, "global_step": 110033, "epoch": 654} {"train_loss": -10.07067584991455, "global_step": 110034, "epoch": 654} {"train_loss": -10.060710906982422, "global_step": 110035, "epoch": 654} {"train_loss": -9.899307250976562, "global_step": 110036, "epoch": 654} {"train_loss": -9.740690231323242, "global_step": 110037, "epoch": 654} {"train_loss": -9.993317604064941, "global_step": 110038, "epoch": 654} {"train_loss": -9.88544880208515, "global_step": 110039, "epoch": 654, "val_loss": 211044.765625} {"train_loss": -9.69931411743164, "global_step": 110040, "epoch": 655} {"train_loss": -10.067780494689941, "global_step": 110041, "epoch": 655} {"train_loss": -9.640735626220703, "global_step": 110042, "epoch": 655} {"train_loss": -9.722661018371582, "global_step": 110043, "epoch": 655} {"train_loss": -9.663701057434082, "global_step": 110044, "epoch": 655} {"train_loss": -9.849449157714844, "global_step": 110045, "epoch": 655} {"train_loss": -9.777824401855469, "global_step": 110046, "epoch": 655} {"train_loss": -9.647270202636719, "global_step": 110047, "epoch": 655} {"train_loss": -9.776213645935059, "global_step": 110048, "epoch": 655} {"train_loss": -9.616765975952148, "global_step": 110049, "epoch": 655} {"train_loss": -9.761383056640625, "global_step": 110050, "epoch": 655} {"train_loss": -9.755184173583984, "global_step": 110051, "epoch": 655} {"train_loss": -9.710186004638672, "global_step": 110052, "epoch": 655} {"train_loss": -9.962921142578125, "global_step": 110053, "epoch": 655} {"train_loss": -9.683059692382812, "global_step": 110054, "epoch": 655} {"train_loss": -9.814567565917969, "global_step": 110055, "epoch": 655} {"train_loss": -9.945838928222656, "global_step": 110056, "epoch": 655} {"train_loss": -9.511404991149902, "global_step": 110057, "epoch": 655} {"train_loss": -9.85130500793457, "global_step": 110058, "epoch": 655} {"train_loss": -9.887035369873047, "global_step": 110059, "epoch": 655} {"train_loss": -9.829937934875488, "global_step": 110060, "epoch": 655} {"train_loss": -9.886817932128906, "global_step": 110061, "epoch": 655} {"train_loss": -9.785148620605469, "global_step": 110062, "epoch": 655} {"train_loss": -10.033183097839355, "global_step": 110063, "epoch": 655} {"train_loss": -10.08818244934082, "global_step": 110064, "epoch": 655} {"train_loss": -10.040400505065918, "global_step": 110065, "epoch": 655} {"train_loss": -10.13264274597168, "global_step": 110066, "epoch": 655} {"train_loss": -9.777929306030273, "global_step": 110067, "epoch": 655} {"train_loss": -9.975854873657227, "global_step": 110068, "epoch": 655} {"train_loss": -10.101627349853516, "global_step": 110069, "epoch": 655} {"train_loss": -9.820980072021484, "global_step": 110070, "epoch": 655} {"train_loss": -9.890470504760742, "global_step": 110071, "epoch": 655} {"train_loss": -9.988245010375977, "global_step": 110072, "epoch": 655} {"train_loss": -9.769919395446777, "global_step": 110073, "epoch": 655} {"train_loss": -10.060291290283203, "global_step": 110074, "epoch": 655} {"train_loss": -9.770450592041016, "global_step": 110075, "epoch": 655} {"train_loss": -9.959358215332031, "global_step": 110076, "epoch": 655} {"train_loss": -9.84532356262207, "global_step": 110077, "epoch": 655} {"train_loss": -9.87727165222168, "global_step": 110078, "epoch": 655} {"train_loss": -10.034303665161133, "global_step": 110079, "epoch": 655} {"train_loss": -9.994397163391113, "global_step": 110080, "epoch": 655} {"train_loss": -10.25027847290039, "global_step": 110081, "epoch": 655} {"train_loss": -9.948147773742676, "global_step": 110082, "epoch": 655} {"train_loss": -10.195314407348633, "global_step": 110083, "epoch": 655} {"train_loss": -9.8115234375, "global_step": 110084, "epoch": 655} {"train_loss": -10.098061561584473, "global_step": 110085, "epoch": 655} {"train_loss": -10.068331718444824, "global_step": 110086, "epoch": 655} {"train_loss": -10.051534652709961, "global_step": 110087, "epoch": 655} {"train_loss": -10.079532623291016, "global_step": 110088, "epoch": 655} {"train_loss": -10.04983139038086, "global_step": 110089, "epoch": 655} {"train_loss": -9.805811882019043, "global_step": 110090, "epoch": 655} {"train_loss": -9.95306396484375, "global_step": 110091, "epoch": 655} {"train_loss": -9.988933563232422, "global_step": 110092, "epoch": 655} {"train_loss": -10.126361846923828, "global_step": 110093, "epoch": 655} {"train_loss": -10.017853736877441, "global_step": 110094, "epoch": 655} {"train_loss": -9.942954063415527, "global_step": 110095, "epoch": 655} {"train_loss": -9.991008758544922, "global_step": 110096, "epoch": 655} {"train_loss": -9.739686965942383, "global_step": 110097, "epoch": 655} {"train_loss": -9.546791076660156, "global_step": 110098, "epoch": 655} {"train_loss": -10.048583984375, "global_step": 110099, "epoch": 655} {"train_loss": -9.832517623901367, "global_step": 110100, "epoch": 655} {"train_loss": -9.666180610656738, "global_step": 110101, "epoch": 655} {"train_loss": -10.191568374633789, "global_step": 110102, "epoch": 655} {"train_loss": -9.920827865600586, "global_step": 110103, "epoch": 655} {"train_loss": -9.352203369140625, "global_step": 110104, "epoch": 655} {"train_loss": -9.388893127441406, "global_step": 110105, "epoch": 655} {"train_loss": -9.919086456298828, "global_step": 110106, "epoch": 655} {"train_loss": -9.666536331176758, "global_step": 110107, "epoch": 655} {"train_loss": -9.649819374084473, "global_step": 110108, "epoch": 655} {"train_loss": -9.695122718811035, "global_step": 110109, "epoch": 655} {"train_loss": -9.471012115478516, "global_step": 110110, "epoch": 655} {"train_loss": -9.803380966186523, "global_step": 110111, "epoch": 655} {"train_loss": -9.749856948852539, "global_step": 110112, "epoch": 655} {"train_loss": -9.96252155303955, "global_step": 110113, "epoch": 655} {"train_loss": -9.963705062866211, "global_step": 110114, "epoch": 655} {"train_loss": -9.458032608032227, "global_step": 110115, "epoch": 655} {"train_loss": -10.23993968963623, "global_step": 110116, "epoch": 655} {"train_loss": -9.828481674194336, "global_step": 110117, "epoch": 655} {"train_loss": -9.578771591186523, "global_step": 110118, "epoch": 655} {"train_loss": -9.77459716796875, "global_step": 110119, "epoch": 655} {"train_loss": -9.90235710144043, "global_step": 110120, "epoch": 655} {"train_loss": -9.513853073120117, "global_step": 110121, "epoch": 655} {"train_loss": -9.767024993896484, "global_step": 110122, "epoch": 655} {"train_loss": -9.86097526550293, "global_step": 110123, "epoch": 655} {"train_loss": -9.931795120239258, "global_step": 110124, "epoch": 655} {"train_loss": -9.736671447753906, "global_step": 110125, "epoch": 655} {"train_loss": -9.8990478515625, "global_step": 110126, "epoch": 655} {"train_loss": -9.826526641845703, "global_step": 110127, "epoch": 655} {"train_loss": -9.877996444702148, "global_step": 110128, "epoch": 655} {"train_loss": -9.704422950744629, "global_step": 110129, "epoch": 655} {"train_loss": -9.598725318908691, "global_step": 110130, "epoch": 655} {"train_loss": -9.421545028686523, "global_step": 110131, "epoch": 655} {"train_loss": -9.96052360534668, "global_step": 110132, "epoch": 655} {"train_loss": -9.939066886901855, "global_step": 110133, "epoch": 655} {"train_loss": -9.877889633178711, "global_step": 110134, "epoch": 655} {"train_loss": -9.629744529724121, "global_step": 110135, "epoch": 655} {"train_loss": -9.90914535522461, "global_step": 110136, "epoch": 655} {"train_loss": -10.0324068069458, "global_step": 110137, "epoch": 655} {"train_loss": -9.919878959655762, "global_step": 110138, "epoch": 655} {"train_loss": -9.597987174987793, "global_step": 110139, "epoch": 655} {"train_loss": -9.869091033935547, "global_step": 110140, "epoch": 655} {"train_loss": -9.404109954833984, "global_step": 110141, "epoch": 655} {"train_loss": -9.937616348266602, "global_step": 110142, "epoch": 655} {"train_loss": -9.618613243103027, "global_step": 110143, "epoch": 655} {"train_loss": -9.448917388916016, "global_step": 110144, "epoch": 655} {"train_loss": -9.854005813598633, "global_step": 110145, "epoch": 655} {"train_loss": -9.512063026428223, "global_step": 110146, "epoch": 655} {"train_loss": -10.090034484863281, "global_step": 110147, "epoch": 655} {"train_loss": -9.76196575164795, "global_step": 110148, "epoch": 655} {"train_loss": -9.973692893981934, "global_step": 110149, "epoch": 655} {"train_loss": -9.758045196533203, "global_step": 110150, "epoch": 655} {"train_loss": -10.16897201538086, "global_step": 110151, "epoch": 655} {"train_loss": -9.949722290039062, "global_step": 110152, "epoch": 655} {"train_loss": -10.124967575073242, "global_step": 110153, "epoch": 655} {"train_loss": -9.982795715332031, "global_step": 110154, "epoch": 655} {"train_loss": -9.927146911621094, "global_step": 110155, "epoch": 655} {"train_loss": -9.851905822753906, "global_step": 110156, "epoch": 655} {"train_loss": -9.995179176330566, "global_step": 110157, "epoch": 655} {"train_loss": -9.77630615234375, "global_step": 110158, "epoch": 655} {"train_loss": -9.999996185302734, "global_step": 110159, "epoch": 655} {"train_loss": -9.879615783691406, "global_step": 110160, "epoch": 655} {"train_loss": -9.96053695678711, "global_step": 110161, "epoch": 655} {"train_loss": -9.585846900939941, "global_step": 110162, "epoch": 655} {"train_loss": -9.845975875854492, "global_step": 110163, "epoch": 655} {"train_loss": -9.71623706817627, "global_step": 110164, "epoch": 655} {"train_loss": -9.867406845092773, "global_step": 110165, "epoch": 655} {"train_loss": -9.851837158203125, "global_step": 110166, "epoch": 655} {"train_loss": -10.14990234375, "global_step": 110167, "epoch": 655} {"train_loss": -9.906097412109375, "global_step": 110168, "epoch": 655} {"train_loss": -10.172067642211914, "global_step": 110169, "epoch": 655} {"train_loss": -10.027008056640625, "global_step": 110170, "epoch": 655} {"train_loss": -9.999650955200195, "global_step": 110171, "epoch": 655} {"train_loss": -9.871206283569336, "global_step": 110172, "epoch": 655} {"train_loss": -9.818451881408691, "global_step": 110173, "epoch": 655} {"train_loss": -9.842758178710938, "global_step": 110174, "epoch": 655} {"train_loss": -10.036355972290039, "global_step": 110175, "epoch": 655} {"train_loss": -10.03108024597168, "global_step": 110176, "epoch": 655} {"train_loss": -9.915495872497559, "global_step": 110177, "epoch": 655} {"train_loss": -10.055022239685059, "global_step": 110178, "epoch": 655} {"train_loss": -10.094220161437988, "global_step": 110179, "epoch": 655} {"train_loss": -9.957700729370117, "global_step": 110180, "epoch": 655} {"train_loss": -9.926511764526367, "global_step": 110181, "epoch": 655} {"train_loss": -10.040290832519531, "global_step": 110182, "epoch": 655} {"train_loss": -9.550987243652344, "global_step": 110183, "epoch": 655} {"train_loss": -10.12605094909668, "global_step": 110184, "epoch": 655} {"train_loss": -9.92340087890625, "global_step": 110185, "epoch": 655} {"train_loss": -9.967376708984375, "global_step": 110186, "epoch": 655} {"train_loss": -9.62788200378418, "global_step": 110187, "epoch": 655} {"train_loss": -10.124123573303223, "global_step": 110188, "epoch": 655} {"train_loss": -9.634092330932617, "global_step": 110189, "epoch": 655} {"train_loss": -9.984007835388184, "global_step": 110190, "epoch": 655} {"train_loss": -9.98228645324707, "global_step": 110191, "epoch": 655} {"train_loss": -10.086316108703613, "global_step": 110192, "epoch": 655} {"train_loss": -9.896366119384766, "global_step": 110193, "epoch": 655} {"train_loss": -9.97653579711914, "global_step": 110194, "epoch": 655} {"train_loss": -9.838898658752441, "global_step": 110195, "epoch": 655} {"train_loss": -10.286114692687988, "global_step": 110196, "epoch": 655} {"train_loss": -9.922463417053223, "global_step": 110197, "epoch": 655} {"train_loss": -10.135709762573242, "global_step": 110198, "epoch": 655} {"train_loss": -9.881599426269531, "global_step": 110199, "epoch": 655} {"train_loss": -10.002887725830078, "global_step": 110200, "epoch": 655} {"train_loss": -9.947854995727539, "global_step": 110201, "epoch": 655} {"train_loss": -10.142130851745605, "global_step": 110202, "epoch": 655} {"train_loss": -9.743917465209961, "global_step": 110203, "epoch": 655} {"train_loss": -10.058340072631836, "global_step": 110204, "epoch": 655} {"train_loss": -9.984495162963867, "global_step": 110205, "epoch": 655} {"train_loss": -9.941093444824219, "global_step": 110206, "epoch": 655} {"train_loss": -9.87613822732653, "global_step": 110207, "epoch": 655, "val_loss": 209278.234375, "train_action_mse_error": 5.748773574829102} {"train_loss": -10.023589134216309, "global_step": 110208, "epoch": 656} {"train_loss": -10.069210052490234, "global_step": 110209, "epoch": 656} {"train_loss": -10.24801254272461, "global_step": 110210, "epoch": 656} {"train_loss": -10.151580810546875, "global_step": 110211, "epoch": 656} {"train_loss": -10.009716033935547, "global_step": 110212, "epoch": 656} {"train_loss": -10.323628425598145, "global_step": 110213, "epoch": 656} {"train_loss": -10.094259262084961, "global_step": 110214, "epoch": 656} {"train_loss": -9.975915908813477, "global_step": 110215, "epoch": 656} {"train_loss": -10.294055938720703, "global_step": 110216, "epoch": 656} {"train_loss": -10.027100563049316, "global_step": 110217, "epoch": 656} {"train_loss": -9.639769554138184, "global_step": 110218, "epoch": 656} {"train_loss": -10.203441619873047, "global_step": 110219, "epoch": 656} {"train_loss": -9.447220802307129, "global_step": 110220, "epoch": 656} {"train_loss": -9.399369239807129, "global_step": 110221, "epoch": 656} {"train_loss": -9.668034553527832, "global_step": 110222, "epoch": 656} {"train_loss": -9.279902458190918, "global_step": 110223, "epoch": 656} {"train_loss": -9.808940887451172, "global_step": 110224, "epoch": 656} {"train_loss": -8.500877380371094, "global_step": 110225, "epoch": 656} {"train_loss": -9.406147003173828, "global_step": 110226, "epoch": 656} {"train_loss": -8.818063735961914, "global_step": 110227, "epoch": 656} {"train_loss": -9.565134048461914, "global_step": 110228, "epoch": 656} {"train_loss": -9.311918258666992, "global_step": 110229, "epoch": 656} {"train_loss": -9.547268867492676, "global_step": 110230, "epoch": 656} {"train_loss": -9.226095199584961, "global_step": 110231, "epoch": 656} {"train_loss": -9.161439895629883, "global_step": 110232, "epoch": 656} {"train_loss": -9.365954399108887, "global_step": 110233, "epoch": 656} {"train_loss": -9.538115501403809, "global_step": 110234, "epoch": 656} {"train_loss": -8.95144271850586, "global_step": 110235, "epoch": 656} {"train_loss": -9.67379093170166, "global_step": 110236, "epoch": 656} {"train_loss": -9.09235954284668, "global_step": 110237, "epoch": 656} {"train_loss": -9.468330383300781, "global_step": 110238, "epoch": 656} {"train_loss": -9.608661651611328, "global_step": 110239, "epoch": 656} {"train_loss": -9.645033836364746, "global_step": 110240, "epoch": 656} {"train_loss": -9.512661933898926, "global_step": 110241, "epoch": 656} {"train_loss": -9.855487823486328, "global_step": 110242, "epoch": 656} {"train_loss": -9.633515357971191, "global_step": 110243, "epoch": 656} {"train_loss": -9.491366386413574, "global_step": 110244, "epoch": 656} {"train_loss": -9.71621322631836, "global_step": 110245, "epoch": 656} {"train_loss": -9.762849807739258, "global_step": 110246, "epoch": 656} {"train_loss": -9.678889274597168, "global_step": 110247, "epoch": 656} {"train_loss": -9.762595176696777, "global_step": 110248, "epoch": 656} {"train_loss": -9.871232986450195, "global_step": 110249, "epoch": 656} {"train_loss": -9.552221298217773, "global_step": 110250, "epoch": 656} {"train_loss": -9.536388397216797, "global_step": 110251, "epoch": 656} {"train_loss": -9.761652946472168, "global_step": 110252, "epoch": 656} {"train_loss": -10.037590026855469, "global_step": 110253, "epoch": 656} {"train_loss": -9.863561630249023, "global_step": 110254, "epoch": 656} {"train_loss": -9.87011432647705, "global_step": 110255, "epoch": 656} {"train_loss": -9.917119979858398, "global_step": 110256, "epoch": 656} {"train_loss": -9.830766677856445, "global_step": 110257, "epoch": 656} {"train_loss": -10.031478881835938, "global_step": 110258, "epoch": 656} {"train_loss": -9.909687042236328, "global_step": 110259, "epoch": 656} {"train_loss": -10.026010513305664, "global_step": 110260, "epoch": 656} {"train_loss": -9.865309715270996, "global_step": 110261, "epoch": 656} {"train_loss": -9.836830139160156, "global_step": 110262, "epoch": 656} {"train_loss": -10.031518936157227, "global_step": 110263, "epoch": 656} {"train_loss": -9.845710754394531, "global_step": 110264, "epoch": 656} {"train_loss": -9.916885375976562, "global_step": 110265, "epoch": 656} {"train_loss": -9.766792297363281, "global_step": 110266, "epoch": 656} {"train_loss": -9.977947235107422, "global_step": 110267, "epoch": 656} {"train_loss": -10.021641731262207, "global_step": 110268, "epoch": 656} {"train_loss": -9.79300594329834, "global_step": 110269, "epoch": 656} {"train_loss": -9.859487533569336, "global_step": 110270, "epoch": 656} {"train_loss": -9.749324798583984, "global_step": 110271, "epoch": 656} {"train_loss": -9.811381340026855, "global_step": 110272, "epoch": 656} {"train_loss": -10.18608283996582, "global_step": 110273, "epoch": 656} {"train_loss": -9.605335235595703, "global_step": 110274, "epoch": 656} {"train_loss": -9.831899642944336, "global_step": 110275, "epoch": 656} {"train_loss": -10.212501525878906, "global_step": 110276, "epoch": 656} {"train_loss": -9.870655059814453, "global_step": 110277, "epoch": 656} {"train_loss": -9.796964645385742, "global_step": 110278, "epoch": 656} {"train_loss": -10.138338088989258, "global_step": 110279, "epoch": 656} {"train_loss": -10.177006721496582, "global_step": 110280, "epoch": 656} {"train_loss": -10.039346694946289, "global_step": 110281, "epoch": 656} {"train_loss": -10.02078628540039, "global_step": 110282, "epoch": 656} {"train_loss": -10.169292449951172, "global_step": 110283, "epoch": 656} {"train_loss": -9.867758750915527, "global_step": 110284, "epoch": 656} {"train_loss": -9.927284240722656, "global_step": 110285, "epoch": 656} {"train_loss": -9.94551944732666, "global_step": 110286, "epoch": 656} {"train_loss": -10.02625846862793, "global_step": 110287, "epoch": 656} {"train_loss": -10.207247734069824, "global_step": 110288, "epoch": 656} {"train_loss": -9.764427185058594, "global_step": 110289, "epoch": 656} {"train_loss": -9.717830657958984, "global_step": 110290, "epoch": 656} {"train_loss": -9.364484786987305, "global_step": 110291, "epoch": 656} {"train_loss": -9.485611915588379, "global_step": 110292, "epoch": 656} {"train_loss": -9.871210098266602, "global_step": 110293, "epoch": 656} {"train_loss": -9.272918701171875, "global_step": 110294, "epoch": 656} {"train_loss": -9.810887336730957, "global_step": 110295, "epoch": 656} {"train_loss": -9.787851333618164, "global_step": 110296, "epoch": 656} {"train_loss": -9.749053001403809, "global_step": 110297, "epoch": 656} {"train_loss": -9.671897888183594, "global_step": 110298, "epoch": 656} {"train_loss": -9.637863159179688, "global_step": 110299, "epoch": 656} {"train_loss": -9.630387306213379, "global_step": 110300, "epoch": 656} {"train_loss": -9.867990493774414, "global_step": 110301, "epoch": 656} {"train_loss": -9.814737319946289, "global_step": 110302, "epoch": 656} {"train_loss": -9.65497875213623, "global_step": 110303, "epoch": 656} {"train_loss": -10.118221282958984, "global_step": 110304, "epoch": 656} {"train_loss": -9.814741134643555, "global_step": 110305, "epoch": 656} {"train_loss": -9.650764465332031, "global_step": 110306, "epoch": 656} {"train_loss": -9.941488265991211, "global_step": 110307, "epoch": 656} {"train_loss": -9.787318229675293, "global_step": 110308, "epoch": 656} {"train_loss": -10.039300918579102, "global_step": 110309, "epoch": 656} {"train_loss": -9.934783935546875, "global_step": 110310, "epoch": 656} {"train_loss": -9.818623542785645, "global_step": 110311, "epoch": 656} {"train_loss": -10.001081466674805, "global_step": 110312, "epoch": 656} {"train_loss": -10.020484924316406, "global_step": 110313, "epoch": 656} {"train_loss": -9.939895629882812, "global_step": 110314, "epoch": 656} {"train_loss": -9.947021484375, "global_step": 110315, "epoch": 656} {"train_loss": -10.06015396118164, "global_step": 110316, "epoch": 656} {"train_loss": -10.168627738952637, "global_step": 110317, "epoch": 656} {"train_loss": -10.240583419799805, "global_step": 110318, "epoch": 656} {"train_loss": -10.063170433044434, "global_step": 110319, "epoch": 656} {"train_loss": -10.132026672363281, "global_step": 110320, "epoch": 656} {"train_loss": -10.203156471252441, "global_step": 110321, "epoch": 656} {"train_loss": -10.055084228515625, "global_step": 110322, "epoch": 656} {"train_loss": -10.047811508178711, "global_step": 110323, "epoch": 656} {"train_loss": -10.069181442260742, "global_step": 110324, "epoch": 656} {"train_loss": -10.124917030334473, "global_step": 110325, "epoch": 656} {"train_loss": -10.250757217407227, "global_step": 110326, "epoch": 656} {"train_loss": -10.124374389648438, "global_step": 110327, "epoch": 656} {"train_loss": -10.170293807983398, "global_step": 110328, "epoch": 656} {"train_loss": -9.889728546142578, "global_step": 110329, "epoch": 656} {"train_loss": -9.982407569885254, "global_step": 110330, "epoch": 656} {"train_loss": -10.034749984741211, "global_step": 110331, "epoch": 656} {"train_loss": -9.757356643676758, "global_step": 110332, "epoch": 656} {"train_loss": -9.92758846282959, "global_step": 110333, "epoch": 656} {"train_loss": -10.013803482055664, "global_step": 110334, "epoch": 656} {"train_loss": -9.634908676147461, "global_step": 110335, "epoch": 656} {"train_loss": -10.056809425354004, "global_step": 110336, "epoch": 656} {"train_loss": -9.704208374023438, "global_step": 110337, "epoch": 656} {"train_loss": -9.93856143951416, "global_step": 110338, "epoch": 656} {"train_loss": -9.963011741638184, "global_step": 110339, "epoch": 656} {"train_loss": -9.967470169067383, "global_step": 110340, "epoch": 656} {"train_loss": -9.684814453125, "global_step": 110341, "epoch": 656} {"train_loss": -9.863933563232422, "global_step": 110342, "epoch": 656} {"train_loss": -9.920583724975586, "global_step": 110343, "epoch": 656} {"train_loss": -9.826364517211914, "global_step": 110344, "epoch": 656} {"train_loss": -10.095109939575195, "global_step": 110345, "epoch": 656} {"train_loss": -9.957918167114258, "global_step": 110346, "epoch": 656} {"train_loss": -9.919517517089844, "global_step": 110347, "epoch": 656} {"train_loss": -9.918493270874023, "global_step": 110348, "epoch": 656} {"train_loss": -10.134689331054688, "global_step": 110349, "epoch": 656} {"train_loss": -9.670787811279297, "global_step": 110350, "epoch": 656} {"train_loss": -10.018928527832031, "global_step": 110351, "epoch": 656} {"train_loss": -10.163326263427734, "global_step": 110352, "epoch": 656} {"train_loss": -9.950325965881348, "global_step": 110353, "epoch": 656} {"train_loss": -10.143964767456055, "global_step": 110354, "epoch": 656} {"train_loss": -10.231062889099121, "global_step": 110355, "epoch": 656} {"train_loss": -9.904060363769531, "global_step": 110356, "epoch": 656} {"train_loss": -10.035747528076172, "global_step": 110357, "epoch": 656} {"train_loss": -9.88825511932373, "global_step": 110358, "epoch": 656} {"train_loss": -10.022889137268066, "global_step": 110359, "epoch": 656} {"train_loss": -10.004060745239258, "global_step": 110360, "epoch": 656} {"train_loss": -10.398036003112793, "global_step": 110361, "epoch": 656} {"train_loss": -9.92078685760498, "global_step": 110362, "epoch": 656} {"train_loss": -10.258028030395508, "global_step": 110363, "epoch": 656} {"train_loss": -9.71662712097168, "global_step": 110364, "epoch": 656} {"train_loss": -9.978221893310547, "global_step": 110365, "epoch": 656} {"train_loss": -9.575630187988281, "global_step": 110366, "epoch": 656} {"train_loss": -9.891948699951172, "global_step": 110367, "epoch": 656} {"train_loss": -9.695895195007324, "global_step": 110368, "epoch": 656} {"train_loss": -9.819936752319336, "global_step": 110369, "epoch": 656} {"train_loss": -9.962272644042969, "global_step": 110370, "epoch": 656} {"train_loss": -9.685995101928711, "global_step": 110371, "epoch": 656} {"train_loss": -9.8101224899292, "global_step": 110372, "epoch": 656} {"train_loss": -9.804651260375977, "global_step": 110373, "epoch": 656} {"train_loss": -9.579620361328125, "global_step": 110374, "epoch": 656} {"train_loss": -9.8425342241923, "global_step": 110375, "epoch": 656, "val_loss": 211545.4375} {"train_loss": -9.801597595214844, "global_step": 110376, "epoch": 657} {"train_loss": -9.333351135253906, "global_step": 110377, "epoch": 657} {"train_loss": -9.54419994354248, "global_step": 110378, "epoch": 657} {"train_loss": -9.369495391845703, "global_step": 110379, "epoch": 657} {"train_loss": -9.81450080871582, "global_step": 110380, "epoch": 657} {"train_loss": -9.431719779968262, "global_step": 110381, "epoch": 657} {"train_loss": -9.847000122070312, "global_step": 110382, "epoch": 657} {"train_loss": -9.450064659118652, "global_step": 110383, "epoch": 657} {"train_loss": -9.57617473602295, "global_step": 110384, "epoch": 657} {"train_loss": -9.876209259033203, "global_step": 110385, "epoch": 657} {"train_loss": -9.792838096618652, "global_step": 110386, "epoch": 657} {"train_loss": -9.98730182647705, "global_step": 110387, "epoch": 657} {"train_loss": -9.74047565460205, "global_step": 110388, "epoch": 657} {"train_loss": -9.931243896484375, "global_step": 110389, "epoch": 657} {"train_loss": -9.747041702270508, "global_step": 110390, "epoch": 657} {"train_loss": -10.130182266235352, "global_step": 110391, "epoch": 657} {"train_loss": -9.902902603149414, "global_step": 110392, "epoch": 657} {"train_loss": -10.238996505737305, "global_step": 110393, "epoch": 657} {"train_loss": -9.80428695678711, "global_step": 110394, "epoch": 657} {"train_loss": -9.942451477050781, "global_step": 110395, "epoch": 657} {"train_loss": -9.843734741210938, "global_step": 110396, "epoch": 657} {"train_loss": -9.880053520202637, "global_step": 110397, "epoch": 657} {"train_loss": -9.972814559936523, "global_step": 110398, "epoch": 657} {"train_loss": -9.934234619140625, "global_step": 110399, "epoch": 657} {"train_loss": -9.760160446166992, "global_step": 110400, "epoch": 657} {"train_loss": -9.832511901855469, "global_step": 110401, "epoch": 657} {"train_loss": -10.177080154418945, "global_step": 110402, "epoch": 657} {"train_loss": -9.7367582321167, "global_step": 110403, "epoch": 657} {"train_loss": -10.071998596191406, "global_step": 110404, "epoch": 657} {"train_loss": -10.159256935119629, "global_step": 110405, "epoch": 657} {"train_loss": -10.254864692687988, "global_step": 110406, "epoch": 657} {"train_loss": -10.0516939163208, "global_step": 110407, "epoch": 657} {"train_loss": -10.1635160446167, "global_step": 110408, "epoch": 657} {"train_loss": -10.039064407348633, "global_step": 110409, "epoch": 657} {"train_loss": -9.987449645996094, "global_step": 110410, "epoch": 657} {"train_loss": -10.060267448425293, "global_step": 110411, "epoch": 657} {"train_loss": -9.954687118530273, "global_step": 110412, "epoch": 657} {"train_loss": -10.052284240722656, "global_step": 110413, "epoch": 657} {"train_loss": -9.859539031982422, "global_step": 110414, "epoch": 657} {"train_loss": -9.797122955322266, "global_step": 110415, "epoch": 657} {"train_loss": -9.328153610229492, "global_step": 110416, "epoch": 657} {"train_loss": -9.537452697753906, "global_step": 110417, "epoch": 657} {"train_loss": -9.714702606201172, "global_step": 110418, "epoch": 657} {"train_loss": -9.617107391357422, "global_step": 110419, "epoch": 657} {"train_loss": -9.668315887451172, "global_step": 110420, "epoch": 657} {"train_loss": -9.861331939697266, "global_step": 110421, "epoch": 657} {"train_loss": -9.444067001342773, "global_step": 110422, "epoch": 657} {"train_loss": -9.813694953918457, "global_step": 110423, "epoch": 657} {"train_loss": -9.595922470092773, "global_step": 110424, "epoch": 657} {"train_loss": -9.900778770446777, "global_step": 110425, "epoch": 657} {"train_loss": -9.442098617553711, "global_step": 110426, "epoch": 657} {"train_loss": -10.0592679977417, "global_step": 110427, "epoch": 657} {"train_loss": -9.908392906188965, "global_step": 110428, "epoch": 657} {"train_loss": -9.733232498168945, "global_step": 110429, "epoch": 657} {"train_loss": -9.519426345825195, "global_step": 110430, "epoch": 657} {"train_loss": -9.840513229370117, "global_step": 110431, "epoch": 657} {"train_loss": -9.342551231384277, "global_step": 110432, "epoch": 657} {"train_loss": -9.895851135253906, "global_step": 110433, "epoch": 657} {"train_loss": -9.682696342468262, "global_step": 110434, "epoch": 657} {"train_loss": -9.632349967956543, "global_step": 110435, "epoch": 657} {"train_loss": -9.616741180419922, "global_step": 110436, "epoch": 657} {"train_loss": -9.554840087890625, "global_step": 110437, "epoch": 657} {"train_loss": -9.804771423339844, "global_step": 110438, "epoch": 657} {"train_loss": -9.760449409484863, "global_step": 110439, "epoch": 657} {"train_loss": -9.790081024169922, "global_step": 110440, "epoch": 657} {"train_loss": -9.775165557861328, "global_step": 110441, "epoch": 657} {"train_loss": -9.624139785766602, "global_step": 110442, "epoch": 657} {"train_loss": -9.849227905273438, "global_step": 110443, "epoch": 657} {"train_loss": -9.594175338745117, "global_step": 110444, "epoch": 657} {"train_loss": -9.668242454528809, "global_step": 110445, "epoch": 657} {"train_loss": -9.890931129455566, "global_step": 110446, "epoch": 657} {"train_loss": -9.878763198852539, "global_step": 110447, "epoch": 657} {"train_loss": -9.48535442352295, "global_step": 110448, "epoch": 657} {"train_loss": -10.012002944946289, "global_step": 110449, "epoch": 657} {"train_loss": -9.617936134338379, "global_step": 110450, "epoch": 657} {"train_loss": -10.085127830505371, "global_step": 110451, "epoch": 657} {"train_loss": -9.82965087890625, "global_step": 110452, "epoch": 657} {"train_loss": -9.992335319519043, "global_step": 110453, "epoch": 657} {"train_loss": -9.817058563232422, "global_step": 110454, "epoch": 657} {"train_loss": -9.948366165161133, "global_step": 110455, "epoch": 657} {"train_loss": -10.075825691223145, "global_step": 110456, "epoch": 657} {"train_loss": -10.074808120727539, "global_step": 110457, "epoch": 657} {"train_loss": -10.197613716125488, "global_step": 110458, "epoch": 657} {"train_loss": -9.942159652709961, "global_step": 110459, "epoch": 657} {"train_loss": -10.14674186706543, "global_step": 110460, "epoch": 657} {"train_loss": -10.080830574035645, "global_step": 110461, "epoch": 657} {"train_loss": -10.182107925415039, "global_step": 110462, "epoch": 657} {"train_loss": -9.89382553100586, "global_step": 110463, "epoch": 657} {"train_loss": -10.103260040283203, "global_step": 110464, "epoch": 657} {"train_loss": -10.12668228149414, "global_step": 110465, "epoch": 657} {"train_loss": -10.292871475219727, "global_step": 110466, "epoch": 657} {"train_loss": -10.130041122436523, "global_step": 110467, "epoch": 657} {"train_loss": -10.086124420166016, "global_step": 110468, "epoch": 657} {"train_loss": -10.365888595581055, "global_step": 110469, "epoch": 657} {"train_loss": -10.24061107635498, "global_step": 110470, "epoch": 657} {"train_loss": -10.248720169067383, "global_step": 110471, "epoch": 657} {"train_loss": -10.178179740905762, "global_step": 110472, "epoch": 657} {"train_loss": -9.933672904968262, "global_step": 110473, "epoch": 657} {"train_loss": -10.19560432434082, "global_step": 110474, "epoch": 657} {"train_loss": -9.937588691711426, "global_step": 110475, "epoch": 657} {"train_loss": -9.98680305480957, "global_step": 110476, "epoch": 657} {"train_loss": -9.918158531188965, "global_step": 110477, "epoch": 657} {"train_loss": -10.330940246582031, "global_step": 110478, "epoch": 657} {"train_loss": -10.019413948059082, "global_step": 110479, "epoch": 657} {"train_loss": -10.311954498291016, "global_step": 110480, "epoch": 657} {"train_loss": -9.795989036560059, "global_step": 110481, "epoch": 657} {"train_loss": -10.281271934509277, "global_step": 110482, "epoch": 657} {"train_loss": -9.862936019897461, "global_step": 110483, "epoch": 657} {"train_loss": -9.34166145324707, "global_step": 110484, "epoch": 657} {"train_loss": -9.528921127319336, "global_step": 110485, "epoch": 657} {"train_loss": -9.57525634765625, "global_step": 110486, "epoch": 657} {"train_loss": -10.028913497924805, "global_step": 110487, "epoch": 657} {"train_loss": -9.827033996582031, "global_step": 110488, "epoch": 657} {"train_loss": -9.933123588562012, "global_step": 110489, "epoch": 657} {"train_loss": -9.886371612548828, "global_step": 110490, "epoch": 657} {"train_loss": -10.065823554992676, "global_step": 110491, "epoch": 657} {"train_loss": -9.592218399047852, "global_step": 110492, "epoch": 657} {"train_loss": -10.131462097167969, "global_step": 110493, "epoch": 657} {"train_loss": -9.596808433532715, "global_step": 110494, "epoch": 657} {"train_loss": -10.204426765441895, "global_step": 110495, "epoch": 657} {"train_loss": -9.61805534362793, "global_step": 110496, "epoch": 657} {"train_loss": -9.71012020111084, "global_step": 110497, "epoch": 657} {"train_loss": -9.839028358459473, "global_step": 110498, "epoch": 657} {"train_loss": -9.853521347045898, "global_step": 110499, "epoch": 657} {"train_loss": -9.314751625061035, "global_step": 110500, "epoch": 657} {"train_loss": -9.708053588867188, "global_step": 110501, "epoch": 657} {"train_loss": -9.613508224487305, "global_step": 110502, "epoch": 657} {"train_loss": -10.02570629119873, "global_step": 110503, "epoch": 657} {"train_loss": -9.91402816772461, "global_step": 110504, "epoch": 657} {"train_loss": -9.402570724487305, "global_step": 110505, "epoch": 657} {"train_loss": -9.708501815795898, "global_step": 110506, "epoch": 657} {"train_loss": -10.176094055175781, "global_step": 110507, "epoch": 657} {"train_loss": -9.454293251037598, "global_step": 110508, "epoch": 657} {"train_loss": -10.072751998901367, "global_step": 110509, "epoch": 657} {"train_loss": -9.970544815063477, "global_step": 110510, "epoch": 657} {"train_loss": -9.940711975097656, "global_step": 110511, "epoch": 657} {"train_loss": -9.999251365661621, "global_step": 110512, "epoch": 657} {"train_loss": -9.703359603881836, "global_step": 110513, "epoch": 657} {"train_loss": -9.69521713256836, "global_step": 110514, "epoch": 657} {"train_loss": -9.679819107055664, "global_step": 110515, "epoch": 657} {"train_loss": -9.880328178405762, "global_step": 110516, "epoch": 657} {"train_loss": -9.814384460449219, "global_step": 110517, "epoch": 657} {"train_loss": -9.798965454101562, "global_step": 110518, "epoch": 657} {"train_loss": -10.010686874389648, "global_step": 110519, "epoch": 657} {"train_loss": -9.910429000854492, "global_step": 110520, "epoch": 657} {"train_loss": -9.920577049255371, "global_step": 110521, "epoch": 657} {"train_loss": -9.928179740905762, "global_step": 110522, "epoch": 657} {"train_loss": -10.150581359863281, "global_step": 110523, "epoch": 657} {"train_loss": -9.935626983642578, "global_step": 110524, "epoch": 657} {"train_loss": -9.78558349609375, "global_step": 110525, "epoch": 657} {"train_loss": -9.993025779724121, "global_step": 110526, "epoch": 657} {"train_loss": -10.016569137573242, "global_step": 110527, "epoch": 657} {"train_loss": -9.789751052856445, "global_step": 110528, "epoch": 657} {"train_loss": -10.07561206817627, "global_step": 110529, "epoch": 657} {"train_loss": -10.108978271484375, "global_step": 110530, "epoch": 657} {"train_loss": -10.093637466430664, "global_step": 110531, "epoch": 657} {"train_loss": -10.070289611816406, "global_step": 110532, "epoch": 657} {"train_loss": -10.1744384765625, "global_step": 110533, "epoch": 657} {"train_loss": -9.928152084350586, "global_step": 110534, "epoch": 657} {"train_loss": -10.14003849029541, "global_step": 110535, "epoch": 657} {"train_loss": -10.263566970825195, "global_step": 110536, "epoch": 657} {"train_loss": -10.17173957824707, "global_step": 110537, "epoch": 657} {"train_loss": -10.02199649810791, "global_step": 110538, "epoch": 657} {"train_loss": -10.125884056091309, "global_step": 110539, "epoch": 657} {"train_loss": -10.091662406921387, "global_step": 110540, "epoch": 657} {"train_loss": -9.458934783935547, "global_step": 110541, "epoch": 657} {"train_loss": -9.916404724121094, "global_step": 110542, "epoch": 657} {"train_loss": -9.879591760181246, "global_step": 110543, "epoch": 657, "val_loss": 211536.71875} {"train_loss": -9.554656982421875, "global_step": 110544, "epoch": 658} {"train_loss": -10.124454498291016, "global_step": 110545, "epoch": 658} {"train_loss": -8.663480758666992, "global_step": 110546, "epoch": 658} {"train_loss": -9.479534149169922, "global_step": 110547, "epoch": 658} {"train_loss": -9.265243530273438, "global_step": 110548, "epoch": 658} {"train_loss": -8.925270080566406, "global_step": 110549, "epoch": 658} {"train_loss": -9.021028518676758, "global_step": 110550, "epoch": 658} {"train_loss": -10.013063430786133, "global_step": 110551, "epoch": 658} {"train_loss": -9.072088241577148, "global_step": 110552, "epoch": 658} {"train_loss": -9.485346794128418, "global_step": 110553, "epoch": 658} {"train_loss": -9.503345489501953, "global_step": 110554, "epoch": 658} {"train_loss": -9.489892959594727, "global_step": 110555, "epoch": 658} {"train_loss": -8.87625503540039, "global_step": 110556, "epoch": 658} {"train_loss": -9.879287719726562, "global_step": 110557, "epoch": 658} {"train_loss": -8.567602157592773, "global_step": 110558, "epoch": 658} {"train_loss": -9.635232925415039, "global_step": 110559, "epoch": 658} {"train_loss": -9.285089492797852, "global_step": 110560, "epoch": 658} {"train_loss": -9.719523429870605, "global_step": 110561, "epoch": 658} {"train_loss": -9.478926658630371, "global_step": 110562, "epoch": 658} {"train_loss": -9.39657974243164, "global_step": 110563, "epoch": 658} {"train_loss": -9.670618057250977, "global_step": 110564, "epoch": 658} {"train_loss": -9.1698579788208, "global_step": 110565, "epoch": 658} {"train_loss": -9.4208984375, "global_step": 110566, "epoch": 658} {"train_loss": -9.583673477172852, "global_step": 110567, "epoch": 658} {"train_loss": -9.688440322875977, "global_step": 110568, "epoch": 658} {"train_loss": -9.514293670654297, "global_step": 110569, "epoch": 658} {"train_loss": -9.804437637329102, "global_step": 110570, "epoch": 658} {"train_loss": -9.63979434967041, "global_step": 110571, "epoch": 658} {"train_loss": -9.3504638671875, "global_step": 110572, "epoch": 658} {"train_loss": -9.654454231262207, "global_step": 110573, "epoch": 658} {"train_loss": -9.880033493041992, "global_step": 110574, "epoch": 658} {"train_loss": -9.750753402709961, "global_step": 110575, "epoch": 658} {"train_loss": -9.788189888000488, "global_step": 110576, "epoch": 658} {"train_loss": -10.01137924194336, "global_step": 110577, "epoch": 658} {"train_loss": -9.665969848632812, "global_step": 110578, "epoch": 658} {"train_loss": -9.67751693725586, "global_step": 110579, "epoch": 658} {"train_loss": -9.565950393676758, "global_step": 110580, "epoch": 658} {"train_loss": -9.903501510620117, "global_step": 110581, "epoch": 658} {"train_loss": -9.532093048095703, "global_step": 110582, "epoch": 658} {"train_loss": -9.93923568725586, "global_step": 110583, "epoch": 658} {"train_loss": -9.91600227355957, "global_step": 110584, "epoch": 658} {"train_loss": -9.74830436706543, "global_step": 110585, "epoch": 658} {"train_loss": -9.847529411315918, "global_step": 110586, "epoch": 658} {"train_loss": -9.793440818786621, "global_step": 110587, "epoch": 658} {"train_loss": -9.539593696594238, "global_step": 110588, "epoch": 658} {"train_loss": -9.882233619689941, "global_step": 110589, "epoch": 658} {"train_loss": -9.763975143432617, "global_step": 110590, "epoch": 658} {"train_loss": -9.947904586791992, "global_step": 110591, "epoch": 658} {"train_loss": -9.914453506469727, "global_step": 110592, "epoch": 658} {"train_loss": -9.706501960754395, "global_step": 110593, "epoch": 658} {"train_loss": -9.984313011169434, "global_step": 110594, "epoch": 658} {"train_loss": -10.149367332458496, "global_step": 110595, "epoch": 658} {"train_loss": -10.281380653381348, "global_step": 110596, "epoch": 658} {"train_loss": -9.99315071105957, "global_step": 110597, "epoch": 658} {"train_loss": -10.05830192565918, "global_step": 110598, "epoch": 658} {"train_loss": -10.10825252532959, "global_step": 110599, "epoch": 658} {"train_loss": -9.781563758850098, "global_step": 110600, "epoch": 658} {"train_loss": -9.785114288330078, "global_step": 110601, "epoch": 658} {"train_loss": -10.081796646118164, "global_step": 110602, "epoch": 658} {"train_loss": -10.161243438720703, "global_step": 110603, "epoch": 658} {"train_loss": -10.071382522583008, "global_step": 110604, "epoch": 658} {"train_loss": -9.937685012817383, "global_step": 110605, "epoch": 658} {"train_loss": -10.193344116210938, "global_step": 110606, "epoch": 658} {"train_loss": -9.994945526123047, "global_step": 110607, "epoch": 658} {"train_loss": -10.045852661132812, "global_step": 110608, "epoch": 658} {"train_loss": -9.996825218200684, "global_step": 110609, "epoch": 658} {"train_loss": -9.852306365966797, "global_step": 110610, "epoch": 658} {"train_loss": -9.839405059814453, "global_step": 110611, "epoch": 658} {"train_loss": -10.107731819152832, "global_step": 110612, "epoch": 658} {"train_loss": -9.775390625, "global_step": 110613, "epoch": 658} {"train_loss": -10.100010871887207, "global_step": 110614, "epoch": 658} {"train_loss": -9.980666160583496, "global_step": 110615, "epoch": 658} {"train_loss": -10.086463928222656, "global_step": 110616, "epoch": 658} {"train_loss": -9.792319297790527, "global_step": 110617, "epoch": 658} {"train_loss": -10.16235065460205, "global_step": 110618, "epoch": 658} {"train_loss": -9.814626693725586, "global_step": 110619, "epoch": 658} {"train_loss": -10.172452926635742, "global_step": 110620, "epoch": 658} {"train_loss": -9.990925788879395, "global_step": 110621, "epoch": 658} {"train_loss": -9.94008731842041, "global_step": 110622, "epoch": 658} {"train_loss": -10.050016403198242, "global_step": 110623, "epoch": 658} {"train_loss": -10.101522445678711, "global_step": 110624, "epoch": 658} {"train_loss": -10.00337028503418, "global_step": 110625, "epoch": 658} {"train_loss": -9.754146575927734, "global_step": 110626, "epoch": 658} {"train_loss": -10.074880599975586, "global_step": 110627, "epoch": 658} {"train_loss": -9.936554908752441, "global_step": 110628, "epoch": 658} {"train_loss": -10.018573760986328, "global_step": 110629, "epoch": 658} {"train_loss": -9.698047637939453, "global_step": 110630, "epoch": 658} {"train_loss": -10.083494186401367, "global_step": 110631, "epoch": 658} {"train_loss": -10.128739356994629, "global_step": 110632, "epoch": 658} {"train_loss": -9.931114196777344, "global_step": 110633, "epoch": 658} {"train_loss": -10.239723205566406, "global_step": 110634, "epoch": 658} {"train_loss": -10.003901481628418, "global_step": 110635, "epoch": 658} {"train_loss": -9.473821640014648, "global_step": 110636, "epoch": 658} {"train_loss": -9.872589111328125, "global_step": 110637, "epoch": 658} {"train_loss": -10.039714813232422, "global_step": 110638, "epoch": 658} {"train_loss": -9.912630081176758, "global_step": 110639, "epoch": 658} {"train_loss": -9.870497703552246, "global_step": 110640, "epoch": 658} {"train_loss": -9.99746322631836, "global_step": 110641, "epoch": 658} {"train_loss": -9.87437629699707, "global_step": 110642, "epoch": 658} {"train_loss": -9.854568481445312, "global_step": 110643, "epoch": 658} {"train_loss": -9.802732467651367, "global_step": 110644, "epoch": 658} {"train_loss": -9.436874389648438, "global_step": 110645, "epoch": 658} {"train_loss": -9.76102066040039, "global_step": 110646, "epoch": 658} {"train_loss": -9.68785285949707, "global_step": 110647, "epoch": 658} {"train_loss": -9.173385620117188, "global_step": 110648, "epoch": 658} {"train_loss": -10.209877967834473, "global_step": 110649, "epoch": 658} {"train_loss": -9.768962860107422, "global_step": 110650, "epoch": 658} {"train_loss": -9.732122421264648, "global_step": 110651, "epoch": 658} {"train_loss": -10.052580833435059, "global_step": 110652, "epoch": 658} {"train_loss": -9.915122032165527, "global_step": 110653, "epoch": 658} {"train_loss": -9.660480499267578, "global_step": 110654, "epoch": 658} {"train_loss": -9.855369567871094, "global_step": 110655, "epoch": 658} {"train_loss": -9.99053955078125, "global_step": 110656, "epoch": 658} {"train_loss": -9.684341430664062, "global_step": 110657, "epoch": 658} {"train_loss": -10.039471626281738, "global_step": 110658, "epoch": 658} {"train_loss": -10.07579231262207, "global_step": 110659, "epoch": 658} {"train_loss": -9.702232360839844, "global_step": 110660, "epoch": 658} {"train_loss": -9.74467658996582, "global_step": 110661, "epoch": 658} {"train_loss": -10.02750015258789, "global_step": 110662, "epoch": 658} {"train_loss": -9.914047241210938, "global_step": 110663, "epoch": 658} {"train_loss": -9.920066833496094, "global_step": 110664, "epoch": 658} {"train_loss": -10.024703979492188, "global_step": 110665, "epoch": 658} {"train_loss": -9.880483627319336, "global_step": 110666, "epoch": 658} {"train_loss": -9.715571403503418, "global_step": 110667, "epoch": 658} {"train_loss": -10.343564987182617, "global_step": 110668, "epoch": 658} {"train_loss": -10.124868392944336, "global_step": 110669, "epoch": 658} {"train_loss": -9.895025253295898, "global_step": 110670, "epoch": 658} {"train_loss": -9.905691146850586, "global_step": 110671, "epoch": 658} {"train_loss": -10.178950309753418, "global_step": 110672, "epoch": 658} {"train_loss": -10.116156578063965, "global_step": 110673, "epoch": 658} {"train_loss": -10.075305938720703, "global_step": 110674, "epoch": 658} {"train_loss": -10.060827255249023, "global_step": 110675, "epoch": 658} {"train_loss": -9.989776611328125, "global_step": 110676, "epoch": 658} {"train_loss": -10.11790943145752, "global_step": 110677, "epoch": 658} {"train_loss": -9.893592834472656, "global_step": 110678, "epoch": 658} {"train_loss": -9.990584373474121, "global_step": 110679, "epoch": 658} {"train_loss": -9.737621307373047, "global_step": 110680, "epoch": 658} {"train_loss": -10.141053199768066, "global_step": 110681, "epoch": 658} {"train_loss": -10.276083946228027, "global_step": 110682, "epoch": 658} {"train_loss": -9.871725082397461, "global_step": 110683, "epoch": 658} {"train_loss": -9.991556167602539, "global_step": 110684, "epoch": 658} {"train_loss": -10.180842399597168, "global_step": 110685, "epoch": 658} {"train_loss": -9.978170394897461, "global_step": 110686, "epoch": 658} {"train_loss": -9.992071151733398, "global_step": 110687, "epoch": 658} {"train_loss": -9.969902038574219, "global_step": 110688, "epoch": 658} {"train_loss": -9.902582168579102, "global_step": 110689, "epoch": 658} {"train_loss": -10.02593994140625, "global_step": 110690, "epoch": 658} {"train_loss": -9.514093399047852, "global_step": 110691, "epoch": 658} {"train_loss": -10.090986251831055, "global_step": 110692, "epoch": 658} {"train_loss": -9.395631790161133, "global_step": 110693, "epoch": 658} {"train_loss": -10.044808387756348, "global_step": 110694, "epoch": 658} {"train_loss": -9.806427955627441, "global_step": 110695, "epoch": 658} {"train_loss": -9.762195587158203, "global_step": 110696, "epoch": 658} {"train_loss": -9.748163223266602, "global_step": 110697, "epoch": 658} {"train_loss": -9.835458755493164, "global_step": 110698, "epoch": 658} {"train_loss": -9.777287483215332, "global_step": 110699, "epoch": 658} {"train_loss": -10.100133895874023, "global_step": 110700, "epoch": 658} {"train_loss": -9.907991409301758, "global_step": 110701, "epoch": 658} {"train_loss": -9.947774887084961, "global_step": 110702, "epoch": 658} {"train_loss": -9.924177169799805, "global_step": 110703, "epoch": 658} {"train_loss": -10.062206268310547, "global_step": 110704, "epoch": 658} {"train_loss": -10.28599739074707, "global_step": 110705, "epoch": 658} {"train_loss": -9.958535194396973, "global_step": 110706, "epoch": 658} {"train_loss": -10.027705192565918, "global_step": 110707, "epoch": 658} {"train_loss": -10.139755249023438, "global_step": 110708, "epoch": 658} {"train_loss": -10.227177619934082, "global_step": 110709, "epoch": 658} {"train_loss": -9.9617919921875, "global_step": 110710, "epoch": 658} {"train_loss": -9.838706652323404, "global_step": 110711, "epoch": 658, "val_loss": 211811.96875} {"train_loss": -10.048882484436035, "global_step": 110712, "epoch": 659} {"train_loss": -9.852394104003906, "global_step": 110713, "epoch": 659} {"train_loss": -9.780797958374023, "global_step": 110714, "epoch": 659} {"train_loss": -9.535655975341797, "global_step": 110715, "epoch": 659} {"train_loss": -10.141142845153809, "global_step": 110716, "epoch": 659} {"train_loss": -9.988202095031738, "global_step": 110717, "epoch": 659} {"train_loss": -9.916635513305664, "global_step": 110718, "epoch": 659} {"train_loss": -9.753198623657227, "global_step": 110719, "epoch": 659} {"train_loss": -9.950794219970703, "global_step": 110720, "epoch": 659} {"train_loss": -9.591233253479004, "global_step": 110721, "epoch": 659} {"train_loss": -9.70185375213623, "global_step": 110722, "epoch": 659} {"train_loss": -9.751265525817871, "global_step": 110723, "epoch": 659} {"train_loss": -9.548480033874512, "global_step": 110724, "epoch": 659} {"train_loss": -10.11572265625, "global_step": 110725, "epoch": 659} {"train_loss": -9.260396957397461, "global_step": 110726, "epoch": 659} {"train_loss": -9.827764511108398, "global_step": 110727, "epoch": 659} {"train_loss": -9.749223709106445, "global_step": 110728, "epoch": 659} {"train_loss": -9.834310531616211, "global_step": 110729, "epoch": 659} {"train_loss": -9.921957015991211, "global_step": 110730, "epoch": 659} {"train_loss": -9.86451530456543, "global_step": 110731, "epoch": 659} {"train_loss": -9.958349227905273, "global_step": 110732, "epoch": 659} {"train_loss": -9.94888973236084, "global_step": 110733, "epoch": 659} {"train_loss": -9.841286659240723, "global_step": 110734, "epoch": 659} {"train_loss": -10.09048843383789, "global_step": 110735, "epoch": 659} {"train_loss": -9.909751892089844, "global_step": 110736, "epoch": 659} {"train_loss": -9.911581039428711, "global_step": 110737, "epoch": 659} {"train_loss": -10.134751319885254, "global_step": 110738, "epoch": 659} {"train_loss": -9.861937522888184, "global_step": 110739, "epoch": 659} {"train_loss": -10.072454452514648, "global_step": 110740, "epoch": 659} {"train_loss": -9.877185821533203, "global_step": 110741, "epoch": 659} {"train_loss": -10.11404800415039, "global_step": 110742, "epoch": 659} {"train_loss": -9.892824172973633, "global_step": 110743, "epoch": 659} {"train_loss": -10.037395477294922, "global_step": 110744, "epoch": 659} {"train_loss": -10.174029350280762, "global_step": 110745, "epoch": 659} {"train_loss": -9.920068740844727, "global_step": 110746, "epoch": 659} {"train_loss": -10.080175399780273, "global_step": 110747, "epoch": 659} {"train_loss": -10.180989265441895, "global_step": 110748, "epoch": 659} {"train_loss": -9.951290130615234, "global_step": 110749, "epoch": 659} {"train_loss": -10.026535987854004, "global_step": 110750, "epoch": 659} {"train_loss": -10.219350814819336, "global_step": 110751, "epoch": 659} {"train_loss": -9.986082077026367, "global_step": 110752, "epoch": 659} {"train_loss": -9.973310470581055, "global_step": 110753, "epoch": 659} {"train_loss": -10.065093994140625, "global_step": 110754, "epoch": 659} {"train_loss": -10.1414213180542, "global_step": 110755, "epoch": 659} {"train_loss": -9.803898811340332, "global_step": 110756, "epoch": 659} {"train_loss": -9.775991439819336, "global_step": 110757, "epoch": 659} {"train_loss": -9.963305473327637, "global_step": 110758, "epoch": 659} {"train_loss": -9.712142944335938, "global_step": 110759, "epoch": 659} {"train_loss": -10.092775344848633, "global_step": 110760, "epoch": 659} {"train_loss": -10.138066291809082, "global_step": 110761, "epoch": 659} {"train_loss": -10.177326202392578, "global_step": 110762, "epoch": 659} {"train_loss": -10.025032043457031, "global_step": 110763, "epoch": 659} {"train_loss": -10.202811241149902, "global_step": 110764, "epoch": 659} {"train_loss": -9.837326049804688, "global_step": 110765, "epoch": 659} {"train_loss": -9.740053176879883, "global_step": 110766, "epoch": 659} {"train_loss": -9.955854415893555, "global_step": 110767, "epoch": 659} {"train_loss": -9.878396987915039, "global_step": 110768, "epoch": 659} {"train_loss": -9.823953628540039, "global_step": 110769, "epoch": 659} {"train_loss": -9.87819766998291, "global_step": 110770, "epoch": 659} {"train_loss": -9.9320068359375, "global_step": 110771, "epoch": 659} {"train_loss": -10.054442405700684, "global_step": 110772, "epoch": 659} {"train_loss": -9.723653793334961, "global_step": 110773, "epoch": 659} {"train_loss": -10.002646446228027, "global_step": 110774, "epoch": 659} {"train_loss": -10.007682800292969, "global_step": 110775, "epoch": 659} {"train_loss": -9.865781784057617, "global_step": 110776, "epoch": 659} {"train_loss": -9.961697578430176, "global_step": 110777, "epoch": 659} {"train_loss": -9.616373062133789, "global_step": 110778, "epoch": 659} {"train_loss": -9.822221755981445, "global_step": 110779, "epoch": 659} {"train_loss": -9.87053108215332, "global_step": 110780, "epoch": 659} {"train_loss": -9.811201095581055, "global_step": 110781, "epoch": 659} {"train_loss": -9.69752311706543, "global_step": 110782, "epoch": 659} {"train_loss": -10.065832138061523, "global_step": 110783, "epoch": 659} {"train_loss": -9.403096199035645, "global_step": 110784, "epoch": 659} {"train_loss": -9.63861083984375, "global_step": 110785, "epoch": 659} {"train_loss": -9.795740127563477, "global_step": 110786, "epoch": 659} {"train_loss": -9.696884155273438, "global_step": 110787, "epoch": 659} {"train_loss": -9.964251518249512, "global_step": 110788, "epoch": 659} {"train_loss": -10.066679000854492, "global_step": 110789, "epoch": 659} {"train_loss": -9.703512191772461, "global_step": 110790, "epoch": 659} {"train_loss": -9.827238082885742, "global_step": 110791, "epoch": 659} {"train_loss": -9.853759765625, "global_step": 110792, "epoch": 659} {"train_loss": -9.809853553771973, "global_step": 110793, "epoch": 659} {"train_loss": -9.718966484069824, "global_step": 110794, "epoch": 659} {"train_loss": -10.183082580566406, "global_step": 110795, "epoch": 659} {"train_loss": -9.977951049804688, "global_step": 110796, "epoch": 659} {"train_loss": -10.25084400177002, "global_step": 110797, "epoch": 659} {"train_loss": -9.856014251708984, "global_step": 110798, "epoch": 659} {"train_loss": -10.039044380187988, "global_step": 110799, "epoch": 659} {"train_loss": -9.89739990234375, "global_step": 110800, "epoch": 659} {"train_loss": -9.896489143371582, "global_step": 110801, "epoch": 659} {"train_loss": -9.925840377807617, "global_step": 110802, "epoch": 659} {"train_loss": -10.265981674194336, "global_step": 110803, "epoch": 659} {"train_loss": -10.081869125366211, "global_step": 110804, "epoch": 659} {"train_loss": -9.925291061401367, "global_step": 110805, "epoch": 659} {"train_loss": -10.216131210327148, "global_step": 110806, "epoch": 659} {"train_loss": -9.74642562866211, "global_step": 110807, "epoch": 659} {"train_loss": -9.78811264038086, "global_step": 110808, "epoch": 659} {"train_loss": -9.780677795410156, "global_step": 110809, "epoch": 659} {"train_loss": -10.065542221069336, "global_step": 110810, "epoch": 659} {"train_loss": -9.64600658416748, "global_step": 110811, "epoch": 659} {"train_loss": -9.873621940612793, "global_step": 110812, "epoch": 659} {"train_loss": -10.09343147277832, "global_step": 110813, "epoch": 659} {"train_loss": -9.955584526062012, "global_step": 110814, "epoch": 659} {"train_loss": -9.957620620727539, "global_step": 110815, "epoch": 659} {"train_loss": -9.911165237426758, "global_step": 110816, "epoch": 659} {"train_loss": -9.72492790222168, "global_step": 110817, "epoch": 659} {"train_loss": -10.003838539123535, "global_step": 110818, "epoch": 659} {"train_loss": -10.235363960266113, "global_step": 110819, "epoch": 659} {"train_loss": -9.710378646850586, "global_step": 110820, "epoch": 659} {"train_loss": -10.039204597473145, "global_step": 110821, "epoch": 659} {"train_loss": -9.954689025878906, "global_step": 110822, "epoch": 659} {"train_loss": -10.039730072021484, "global_step": 110823, "epoch": 659} {"train_loss": -9.910843849182129, "global_step": 110824, "epoch": 659} {"train_loss": -10.115053176879883, "global_step": 110825, "epoch": 659} {"train_loss": -10.037126541137695, "global_step": 110826, "epoch": 659} {"train_loss": -9.775679588317871, "global_step": 110827, "epoch": 659} {"train_loss": -9.987672805786133, "global_step": 110828, "epoch": 659} {"train_loss": -10.018120765686035, "global_step": 110829, "epoch": 659} {"train_loss": -10.041973114013672, "global_step": 110830, "epoch": 659} {"train_loss": -9.87732219696045, "global_step": 110831, "epoch": 659} {"train_loss": -10.098078727722168, "global_step": 110832, "epoch": 659} {"train_loss": -9.664121627807617, "global_step": 110833, "epoch": 659} {"train_loss": -10.07475471496582, "global_step": 110834, "epoch": 659} {"train_loss": -9.927179336547852, "global_step": 110835, "epoch": 659} {"train_loss": -9.97806167602539, "global_step": 110836, "epoch": 659} {"train_loss": -10.085783004760742, "global_step": 110837, "epoch": 659} {"train_loss": -9.885860443115234, "global_step": 110838, "epoch": 659} {"train_loss": -9.853343963623047, "global_step": 110839, "epoch": 659} {"train_loss": -9.60037612915039, "global_step": 110840, "epoch": 659} {"train_loss": -10.066783905029297, "global_step": 110841, "epoch": 659} {"train_loss": -9.45534896850586, "global_step": 110842, "epoch": 659} {"train_loss": -10.275020599365234, "global_step": 110843, "epoch": 659} {"train_loss": -9.608707427978516, "global_step": 110844, "epoch": 659} {"train_loss": -9.890115737915039, "global_step": 110845, "epoch": 659} {"train_loss": -9.793307304382324, "global_step": 110846, "epoch": 659} {"train_loss": -9.9491548538208, "global_step": 110847, "epoch": 659} {"train_loss": -9.977313995361328, "global_step": 110848, "epoch": 659} {"train_loss": -9.919197082519531, "global_step": 110849, "epoch": 659} {"train_loss": -9.980547904968262, "global_step": 110850, "epoch": 659} {"train_loss": -10.191783905029297, "global_step": 110851, "epoch": 659} {"train_loss": -10.27587890625, "global_step": 110852, "epoch": 659} {"train_loss": -10.172236442565918, "global_step": 110853, "epoch": 659} {"train_loss": -10.250215530395508, "global_step": 110854, "epoch": 659} {"train_loss": -10.099809646606445, "global_step": 110855, "epoch": 659} {"train_loss": -10.127652168273926, "global_step": 110856, "epoch": 659} {"train_loss": -10.263174057006836, "global_step": 110857, "epoch": 659} {"train_loss": -10.045494079589844, "global_step": 110858, "epoch": 659} {"train_loss": -10.05372428894043, "global_step": 110859, "epoch": 659} {"train_loss": -10.283224105834961, "global_step": 110860, "epoch": 659} {"train_loss": -10.09849739074707, "global_step": 110861, "epoch": 659} {"train_loss": -10.025603294372559, "global_step": 110862, "epoch": 659} {"train_loss": -10.263832092285156, "global_step": 110863, "epoch": 659} {"train_loss": -9.88125228881836, "global_step": 110864, "epoch": 659} {"train_loss": -10.200149536132812, "global_step": 110865, "epoch": 659} {"train_loss": -9.903331756591797, "global_step": 110866, "epoch": 659} {"train_loss": -9.817252159118652, "global_step": 110867, "epoch": 659} {"train_loss": -10.139680862426758, "global_step": 110868, "epoch": 659} {"train_loss": -9.834158897399902, "global_step": 110869, "epoch": 659} {"train_loss": -10.246731758117676, "global_step": 110870, "epoch": 659} {"train_loss": -9.708284378051758, "global_step": 110871, "epoch": 659} {"train_loss": -9.6546049118042, "global_step": 110872, "epoch": 659} {"train_loss": -10.211965560913086, "global_step": 110873, "epoch": 659} {"train_loss": -9.676901817321777, "global_step": 110874, "epoch": 659} {"train_loss": -10.297510147094727, "global_step": 110875, "epoch": 659} {"train_loss": -9.80624008178711, "global_step": 110876, "epoch": 659} {"train_loss": -9.915386199951172, "global_step": 110877, "epoch": 659} {"train_loss": -9.964287757873535, "global_step": 110878, "epoch": 659} {"train_loss": -9.9366504521597, "global_step": 110879, "epoch": 659, "val_loss": 210674.03125} {"train_loss": -9.948221206665039, "global_step": 110880, "epoch": 660} {"train_loss": -9.221548080444336, "global_step": 110881, "epoch": 660} {"train_loss": -10.236230850219727, "global_step": 110882, "epoch": 660} {"train_loss": -9.496411323547363, "global_step": 110883, "epoch": 660} {"train_loss": -9.728177070617676, "global_step": 110884, "epoch": 660} {"train_loss": -9.797555923461914, "global_step": 110885, "epoch": 660} {"train_loss": -9.839008331298828, "global_step": 110886, "epoch": 660} {"train_loss": -9.593236923217773, "global_step": 110887, "epoch": 660} {"train_loss": -9.926153182983398, "global_step": 110888, "epoch": 660} {"train_loss": -9.633283615112305, "global_step": 110889, "epoch": 660} {"train_loss": -9.409919738769531, "global_step": 110890, "epoch": 660} {"train_loss": -9.743772506713867, "global_step": 110891, "epoch": 660} {"train_loss": -9.357964515686035, "global_step": 110892, "epoch": 660} {"train_loss": -9.485163688659668, "global_step": 110893, "epoch": 660} {"train_loss": -9.88292121887207, "global_step": 110894, "epoch": 660} {"train_loss": -9.620706558227539, "global_step": 110895, "epoch": 660} {"train_loss": -9.845076560974121, "global_step": 110896, "epoch": 660} {"train_loss": -9.961824417114258, "global_step": 110897, "epoch": 660} {"train_loss": -9.838725090026855, "global_step": 110898, "epoch": 660} {"train_loss": -9.890121459960938, "global_step": 110899, "epoch": 660} {"train_loss": -10.426284790039062, "global_step": 110900, "epoch": 660} {"train_loss": -9.97221565246582, "global_step": 110901, "epoch": 660} {"train_loss": -10.00271224975586, "global_step": 110902, "epoch": 660} {"train_loss": -9.749205589294434, "global_step": 110903, "epoch": 660} {"train_loss": -9.77778434753418, "global_step": 110904, "epoch": 660} {"train_loss": -9.736520767211914, "global_step": 110905, "epoch": 660} {"train_loss": -9.591485977172852, "global_step": 110906, "epoch": 660} {"train_loss": -9.831392288208008, "global_step": 110907, "epoch": 660} {"train_loss": -9.46246337890625, "global_step": 110908, "epoch": 660} {"train_loss": -9.519998550415039, "global_step": 110909, "epoch": 660} {"train_loss": -9.933229446411133, "global_step": 110910, "epoch": 660} {"train_loss": -9.855788230895996, "global_step": 110911, "epoch": 660} {"train_loss": -9.570857048034668, "global_step": 110912, "epoch": 660} {"train_loss": -9.825664520263672, "global_step": 110913, "epoch": 660} {"train_loss": -9.9248046875, "global_step": 110914, "epoch": 660} {"train_loss": -9.446855545043945, "global_step": 110915, "epoch": 660} {"train_loss": -10.047733306884766, "global_step": 110916, "epoch": 660} {"train_loss": -9.775938034057617, "global_step": 110917, "epoch": 660} {"train_loss": -9.505345344543457, "global_step": 110918, "epoch": 660} {"train_loss": -9.868589401245117, "global_step": 110919, "epoch": 660} {"train_loss": -9.912202835083008, "global_step": 110920, "epoch": 660} {"train_loss": -10.043941497802734, "global_step": 110921, "epoch": 660} {"train_loss": -9.795714378356934, "global_step": 110922, "epoch": 660} {"train_loss": -9.888433456420898, "global_step": 110923, "epoch": 660} {"train_loss": -9.842220306396484, "global_step": 110924, "epoch": 660} {"train_loss": -9.884079933166504, "global_step": 110925, "epoch": 660} {"train_loss": -10.075544357299805, "global_step": 110926, "epoch": 660} {"train_loss": -9.9237642288208, "global_step": 110927, "epoch": 660} {"train_loss": -9.828651428222656, "global_step": 110928, "epoch": 660} {"train_loss": -10.018495559692383, "global_step": 110929, "epoch": 660} {"train_loss": -9.914270401000977, "global_step": 110930, "epoch": 660} {"train_loss": -9.935282707214355, "global_step": 110931, "epoch": 660} {"train_loss": -9.87183666229248, "global_step": 110932, "epoch": 660} {"train_loss": -10.1024751663208, "global_step": 110933, "epoch": 660} {"train_loss": -10.011171340942383, "global_step": 110934, "epoch": 660} {"train_loss": -10.017576217651367, "global_step": 110935, "epoch": 660} {"train_loss": -10.157511711120605, "global_step": 110936, "epoch": 660} {"train_loss": -10.092109680175781, "global_step": 110937, "epoch": 660} {"train_loss": -10.279027938842773, "global_step": 110938, "epoch": 660} {"train_loss": -10.031108856201172, "global_step": 110939, "epoch": 660} {"train_loss": -10.133665084838867, "global_step": 110940, "epoch": 660} {"train_loss": -10.355401992797852, "global_step": 110941, "epoch": 660} {"train_loss": -10.106724739074707, "global_step": 110942, "epoch": 660} {"train_loss": -10.425251007080078, "global_step": 110943, "epoch": 660} {"train_loss": -9.604447364807129, "global_step": 110944, "epoch": 660} {"train_loss": -9.710756301879883, "global_step": 110945, "epoch": 660} {"train_loss": -10.178420066833496, "global_step": 110946, "epoch": 660} {"train_loss": -9.964092254638672, "global_step": 110947, "epoch": 660} {"train_loss": -9.976164817810059, "global_step": 110948, "epoch": 660} {"train_loss": -9.936262130737305, "global_step": 110949, "epoch": 660} {"train_loss": -9.236066818237305, "global_step": 110950, "epoch": 660} {"train_loss": -10.24490737915039, "global_step": 110951, "epoch": 660} {"train_loss": -9.622028350830078, "global_step": 110952, "epoch": 660} {"train_loss": -9.629137992858887, "global_step": 110953, "epoch": 660} {"train_loss": -9.952342987060547, "global_step": 110954, "epoch": 660} {"train_loss": -9.19477367401123, "global_step": 110955, "epoch": 660} {"train_loss": -9.817201614379883, "global_step": 110956, "epoch": 660} {"train_loss": -9.68059253692627, "global_step": 110957, "epoch": 660} {"train_loss": -9.798913955688477, "global_step": 110958, "epoch": 660} {"train_loss": -9.95294189453125, "global_step": 110959, "epoch": 660} {"train_loss": -9.733044624328613, "global_step": 110960, "epoch": 660} {"train_loss": -9.676055908203125, "global_step": 110961, "epoch": 660} {"train_loss": -9.500267028808594, "global_step": 110962, "epoch": 660} {"train_loss": -9.845418930053711, "global_step": 110963, "epoch": 660} {"train_loss": -9.089122772216797, "global_step": 110964, "epoch": 660} {"train_loss": -9.595930099487305, "global_step": 110965, "epoch": 660} {"train_loss": -9.631895065307617, "global_step": 110966, "epoch": 660} {"train_loss": -9.873701095581055, "global_step": 110967, "epoch": 660} {"train_loss": -9.570913314819336, "global_step": 110968, "epoch": 660} {"train_loss": -9.953319549560547, "global_step": 110969, "epoch": 660} {"train_loss": -9.799806594848633, "global_step": 110970, "epoch": 660} {"train_loss": -10.037117958068848, "global_step": 110971, "epoch": 660} {"train_loss": -9.697122573852539, "global_step": 110972, "epoch": 660} {"train_loss": -9.882759094238281, "global_step": 110973, "epoch": 660} {"train_loss": -9.970830917358398, "global_step": 110974, "epoch": 660} {"train_loss": -9.65800666809082, "global_step": 110975, "epoch": 660} {"train_loss": -10.055603981018066, "global_step": 110976, "epoch": 660} {"train_loss": -10.007977485656738, "global_step": 110977, "epoch": 660} {"train_loss": -9.948328018188477, "global_step": 110978, "epoch": 660} {"train_loss": -9.761892318725586, "global_step": 110979, "epoch": 660} {"train_loss": -10.000955581665039, "global_step": 110980, "epoch": 660} {"train_loss": -9.855962753295898, "global_step": 110981, "epoch": 660} {"train_loss": -10.16836166381836, "global_step": 110982, "epoch": 660} {"train_loss": -10.098538398742676, "global_step": 110983, "epoch": 660} {"train_loss": -9.953924179077148, "global_step": 110984, "epoch": 660} {"train_loss": -10.09006118774414, "global_step": 110985, "epoch": 660} {"train_loss": -10.334602355957031, "global_step": 110986, "epoch": 660} {"train_loss": -10.186544418334961, "global_step": 110987, "epoch": 660} {"train_loss": -10.195981979370117, "global_step": 110988, "epoch": 660} {"train_loss": -10.239896774291992, "global_step": 110989, "epoch": 660} {"train_loss": -10.178423881530762, "global_step": 110990, "epoch": 660} {"train_loss": -10.164571762084961, "global_step": 110991, "epoch": 660} {"train_loss": -10.286422729492188, "global_step": 110992, "epoch": 660} {"train_loss": -10.069808959960938, "global_step": 110993, "epoch": 660} {"train_loss": -9.771974563598633, "global_step": 110994, "epoch": 660} {"train_loss": -10.101037979125977, "global_step": 110995, "epoch": 660} {"train_loss": -9.737615585327148, "global_step": 110996, "epoch": 660} {"train_loss": -10.076902389526367, "global_step": 110997, "epoch": 660} {"train_loss": -9.756586074829102, "global_step": 110998, "epoch": 660} {"train_loss": -10.10879898071289, "global_step": 110999, "epoch": 660} {"train_loss": -9.955938339233398, "global_step": 111000, "epoch": 660} {"train_loss": -10.129192352294922, "global_step": 111001, "epoch": 660} {"train_loss": -10.004598617553711, "global_step": 111002, "epoch": 660} {"train_loss": -10.201221466064453, "global_step": 111003, "epoch": 660} {"train_loss": -10.238800048828125, "global_step": 111004, "epoch": 660} {"train_loss": -10.083786010742188, "global_step": 111005, "epoch": 660} {"train_loss": -10.27383804321289, "global_step": 111006, "epoch": 660} {"train_loss": -10.390390396118164, "global_step": 111007, "epoch": 660} {"train_loss": -9.950636863708496, "global_step": 111008, "epoch": 660} {"train_loss": -10.168485641479492, "global_step": 111009, "epoch": 660} {"train_loss": -10.018533706665039, "global_step": 111010, "epoch": 660} {"train_loss": -9.954713821411133, "global_step": 111011, "epoch": 660} {"train_loss": -10.283467292785645, "global_step": 111012, "epoch": 660} {"train_loss": -9.897151947021484, "global_step": 111013, "epoch": 660} {"train_loss": -10.461539268493652, "global_step": 111014, "epoch": 660} {"train_loss": -9.920312881469727, "global_step": 111015, "epoch": 660} {"train_loss": -9.875896453857422, "global_step": 111016, "epoch": 660} {"train_loss": -9.762218475341797, "global_step": 111017, "epoch": 660} {"train_loss": -9.510555267333984, "global_step": 111018, "epoch": 660} {"train_loss": -9.800114631652832, "global_step": 111019, "epoch": 660} {"train_loss": -10.000532150268555, "global_step": 111020, "epoch": 660} {"train_loss": -9.225663185119629, "global_step": 111021, "epoch": 660} {"train_loss": -9.520121574401855, "global_step": 111022, "epoch": 660} {"train_loss": -9.772683143615723, "global_step": 111023, "epoch": 660} {"train_loss": -9.560853004455566, "global_step": 111024, "epoch": 660} {"train_loss": -9.623136520385742, "global_step": 111025, "epoch": 660} {"train_loss": -9.350486755371094, "global_step": 111026, "epoch": 660} {"train_loss": -9.606733322143555, "global_step": 111027, "epoch": 660} {"train_loss": -9.27077579498291, "global_step": 111028, "epoch": 660} {"train_loss": -9.381402969360352, "global_step": 111029, "epoch": 660} {"train_loss": -9.67045783996582, "global_step": 111030, "epoch": 660} {"train_loss": -9.500361442565918, "global_step": 111031, "epoch": 660} {"train_loss": -9.985315322875977, "global_step": 111032, "epoch": 660} {"train_loss": -9.866423606872559, "global_step": 111033, "epoch": 660} {"train_loss": -9.785823822021484, "global_step": 111034, "epoch": 660} {"train_loss": -9.848560333251953, "global_step": 111035, "epoch": 660} {"train_loss": -9.690759658813477, "global_step": 111036, "epoch": 660} {"train_loss": -9.685572624206543, "global_step": 111037, "epoch": 660} {"train_loss": -9.83377456665039, "global_step": 111038, "epoch": 660} {"train_loss": -9.943000793457031, "global_step": 111039, "epoch": 660} {"train_loss": -9.749004364013672, "global_step": 111040, "epoch": 660} {"train_loss": -9.987350463867188, "global_step": 111041, "epoch": 660} {"train_loss": -9.764619827270508, "global_step": 111042, "epoch": 660} {"train_loss": -9.777851104736328, "global_step": 111043, "epoch": 660} {"train_loss": -9.612537384033203, "global_step": 111044, "epoch": 660} {"train_loss": -10.188350677490234, "global_step": 111045, "epoch": 660} {"train_loss": -9.835609436035156, "global_step": 111046, "epoch": 660} {"train_loss": -9.861769227754502, "global_step": 111047, "epoch": 660, "val_loss": 211636.328125, "train_action_mse_error": 3.448490619659424} {"train_loss": -9.695554733276367, "global_step": 111048, "epoch": 661} {"train_loss": -9.688837051391602, "global_step": 111049, "epoch": 661} {"train_loss": -10.240745544433594, "global_step": 111050, "epoch": 661} {"train_loss": -10.00826358795166, "global_step": 111051, "epoch": 661} {"train_loss": -10.04901123046875, "global_step": 111052, "epoch": 661} {"train_loss": -10.004667282104492, "global_step": 111053, "epoch": 661} {"train_loss": -10.009414672851562, "global_step": 111054, "epoch": 661} {"train_loss": -10.108394622802734, "global_step": 111055, "epoch": 661} {"train_loss": -10.133766174316406, "global_step": 111056, "epoch": 661} {"train_loss": -10.038741111755371, "global_step": 111057, "epoch": 661} {"train_loss": -9.983619689941406, "global_step": 111058, "epoch": 661} {"train_loss": -10.150829315185547, "global_step": 111059, "epoch": 661} {"train_loss": -10.139667510986328, "global_step": 111060, "epoch": 661} {"train_loss": -10.162094116210938, "global_step": 111061, "epoch": 661} {"train_loss": -10.302825927734375, "global_step": 111062, "epoch": 661} {"train_loss": -10.175872802734375, "global_step": 111063, "epoch": 661} {"train_loss": -9.93429183959961, "global_step": 111064, "epoch": 661} {"train_loss": -10.348411560058594, "global_step": 111065, "epoch": 661} {"train_loss": -10.137048721313477, "global_step": 111066, "epoch": 661} {"train_loss": -9.99634075164795, "global_step": 111067, "epoch": 661} {"train_loss": -10.087947845458984, "global_step": 111068, "epoch": 661} {"train_loss": -10.176351547241211, "global_step": 111069, "epoch": 661} {"train_loss": -10.128440856933594, "global_step": 111070, "epoch": 661} {"train_loss": -9.929046630859375, "global_step": 111071, "epoch": 661} {"train_loss": -10.417625427246094, "global_step": 111072, "epoch": 661} {"train_loss": -9.965188980102539, "global_step": 111073, "epoch": 661} {"train_loss": -10.167915344238281, "global_step": 111074, "epoch": 661} {"train_loss": -10.32990837097168, "global_step": 111075, "epoch": 661} {"train_loss": -10.272947311401367, "global_step": 111076, "epoch": 661} {"train_loss": -10.079202651977539, "global_step": 111077, "epoch": 661} {"train_loss": -10.2935791015625, "global_step": 111078, "epoch": 661} {"train_loss": -9.985252380371094, "global_step": 111079, "epoch": 661} {"train_loss": -9.99867057800293, "global_step": 111080, "epoch": 661} {"train_loss": -10.162582397460938, "global_step": 111081, "epoch": 661} {"train_loss": -9.96599006652832, "global_step": 111082, "epoch": 661} {"train_loss": -9.87526798248291, "global_step": 111083, "epoch": 661} {"train_loss": -10.11705493927002, "global_step": 111084, "epoch": 661} {"train_loss": -10.117218017578125, "global_step": 111085, "epoch": 661} {"train_loss": -9.500250816345215, "global_step": 111086, "epoch": 661} {"train_loss": -10.127565383911133, "global_step": 111087, "epoch": 661} {"train_loss": -10.037569999694824, "global_step": 111088, "epoch": 661} {"train_loss": -9.818289756774902, "global_step": 111089, "epoch": 661} {"train_loss": -9.803794860839844, "global_step": 111090, "epoch": 661} {"train_loss": -9.794463157653809, "global_step": 111091, "epoch": 661} {"train_loss": -9.756084442138672, "global_step": 111092, "epoch": 661} {"train_loss": -9.78392219543457, "global_step": 111093, "epoch": 661} {"train_loss": -9.822362899780273, "global_step": 111094, "epoch": 661} {"train_loss": -9.347936630249023, "global_step": 111095, "epoch": 661} {"train_loss": -10.06049633026123, "global_step": 111096, "epoch": 661} {"train_loss": -9.523776054382324, "global_step": 111097, "epoch": 661} {"train_loss": -9.601890563964844, "global_step": 111098, "epoch": 661} {"train_loss": -9.759799003601074, "global_step": 111099, "epoch": 661} {"train_loss": -9.74591064453125, "global_step": 111100, "epoch": 661} {"train_loss": -9.946783065795898, "global_step": 111101, "epoch": 661} {"train_loss": -9.446931838989258, "global_step": 111102, "epoch": 661} {"train_loss": -9.883819580078125, "global_step": 111103, "epoch": 661} {"train_loss": -8.718457221984863, "global_step": 111104, "epoch": 661} {"train_loss": -9.884584426879883, "global_step": 111105, "epoch": 661} {"train_loss": -9.357897758483887, "global_step": 111106, "epoch": 661} {"train_loss": -10.096257209777832, "global_step": 111107, "epoch": 661} {"train_loss": -9.522281646728516, "global_step": 111108, "epoch": 661} {"train_loss": -9.945117950439453, "global_step": 111109, "epoch": 661} {"train_loss": -9.823163986206055, "global_step": 111110, "epoch": 661} {"train_loss": -9.416443824768066, "global_step": 111111, "epoch": 661} {"train_loss": -9.761696815490723, "global_step": 111112, "epoch": 661} {"train_loss": -9.447132110595703, "global_step": 111113, "epoch": 661} {"train_loss": -9.798089981079102, "global_step": 111114, "epoch": 661} {"train_loss": -9.725521087646484, "global_step": 111115, "epoch": 661} {"train_loss": -9.757781982421875, "global_step": 111116, "epoch": 661} {"train_loss": -9.862011909484863, "global_step": 111117, "epoch": 661} {"train_loss": -9.867743492126465, "global_step": 111118, "epoch": 661} {"train_loss": -10.171234130859375, "global_step": 111119, "epoch": 661} {"train_loss": -9.794257164001465, "global_step": 111120, "epoch": 661} {"train_loss": -9.696020126342773, "global_step": 111121, "epoch": 661} {"train_loss": -9.749788284301758, "global_step": 111122, "epoch": 661} {"train_loss": -9.548693656921387, "global_step": 111123, "epoch": 661} {"train_loss": -9.775790214538574, "global_step": 111124, "epoch": 661} {"train_loss": -9.796329498291016, "global_step": 111125, "epoch": 661} {"train_loss": -10.003660202026367, "global_step": 111126, "epoch": 661} {"train_loss": -9.994887351989746, "global_step": 111127, "epoch": 661} {"train_loss": -9.986696243286133, "global_step": 111128, "epoch": 661} {"train_loss": -9.904842376708984, "global_step": 111129, "epoch": 661} {"train_loss": -10.145485877990723, "global_step": 111130, "epoch": 661} {"train_loss": -10.052971839904785, "global_step": 111131, "epoch": 661} {"train_loss": -10.241290092468262, "global_step": 111132, "epoch": 661} {"train_loss": -10.056699752807617, "global_step": 111133, "epoch": 661} {"train_loss": -9.848590850830078, "global_step": 111134, "epoch": 661} {"train_loss": -9.874089241027832, "global_step": 111135, "epoch": 661} {"train_loss": -9.949539184570312, "global_step": 111136, "epoch": 661} {"train_loss": -9.815289497375488, "global_step": 111137, "epoch": 661} {"train_loss": -10.146259307861328, "global_step": 111138, "epoch": 661} {"train_loss": -10.015954971313477, "global_step": 111139, "epoch": 661} {"train_loss": -10.008939743041992, "global_step": 111140, "epoch": 661} {"train_loss": -9.995712280273438, "global_step": 111141, "epoch": 661} {"train_loss": -9.771427154541016, "global_step": 111142, "epoch": 661} {"train_loss": -10.236141204833984, "global_step": 111143, "epoch": 661} {"train_loss": -10.063167572021484, "global_step": 111144, "epoch": 661} {"train_loss": -10.149320602416992, "global_step": 111145, "epoch": 661} {"train_loss": -9.967089653015137, "global_step": 111146, "epoch": 661} {"train_loss": -9.784417152404785, "global_step": 111147, "epoch": 661} {"train_loss": -10.333627700805664, "global_step": 111148, "epoch": 661} {"train_loss": -9.860067367553711, "global_step": 111149, "epoch": 661} {"train_loss": -9.875724792480469, "global_step": 111150, "epoch": 661} {"train_loss": -10.076631546020508, "global_step": 111151, "epoch": 661} {"train_loss": -9.851373672485352, "global_step": 111152, "epoch": 661} {"train_loss": -10.185417175292969, "global_step": 111153, "epoch": 661} {"train_loss": -10.084236145019531, "global_step": 111154, "epoch": 661} {"train_loss": -9.772686004638672, "global_step": 111155, "epoch": 661} {"train_loss": -10.095634460449219, "global_step": 111156, "epoch": 661} {"train_loss": -9.817754745483398, "global_step": 111157, "epoch": 661} {"train_loss": -9.98143196105957, "global_step": 111158, "epoch": 661} {"train_loss": -10.166444778442383, "global_step": 111159, "epoch": 661} {"train_loss": -10.163819313049316, "global_step": 111160, "epoch": 661} {"train_loss": -10.21826457977295, "global_step": 111161, "epoch": 661} {"train_loss": -10.023658752441406, "global_step": 111162, "epoch": 661} {"train_loss": -10.19723892211914, "global_step": 111163, "epoch": 661} {"train_loss": -10.056234359741211, "global_step": 111164, "epoch": 661} {"train_loss": -10.115724563598633, "global_step": 111165, "epoch": 661} {"train_loss": -9.78469467163086, "global_step": 111166, "epoch": 661} {"train_loss": -10.046537399291992, "global_step": 111167, "epoch": 661} {"train_loss": -9.966907501220703, "global_step": 111168, "epoch": 661} {"train_loss": -10.070083618164062, "global_step": 111169, "epoch": 661} {"train_loss": -9.517005920410156, "global_step": 111170, "epoch": 661} {"train_loss": -10.097564697265625, "global_step": 111171, "epoch": 661} {"train_loss": -9.59295654296875, "global_step": 111172, "epoch": 661} {"train_loss": -10.242851257324219, "global_step": 111173, "epoch": 661} {"train_loss": -9.521770477294922, "global_step": 111174, "epoch": 661} {"train_loss": -9.870275497436523, "global_step": 111175, "epoch": 661} {"train_loss": -10.206758499145508, "global_step": 111176, "epoch": 661} {"train_loss": -9.665422439575195, "global_step": 111177, "epoch": 661} {"train_loss": -10.208663940429688, "global_step": 111178, "epoch": 661} {"train_loss": -9.619837760925293, "global_step": 111179, "epoch": 661} {"train_loss": -9.900404930114746, "global_step": 111180, "epoch": 661} {"train_loss": -10.160049438476562, "global_step": 111181, "epoch": 661} {"train_loss": -9.793656349182129, "global_step": 111182, "epoch": 661} {"train_loss": -9.75865364074707, "global_step": 111183, "epoch": 661} {"train_loss": -10.192180633544922, "global_step": 111184, "epoch": 661} {"train_loss": -9.833052635192871, "global_step": 111185, "epoch": 661} {"train_loss": -10.015998840332031, "global_step": 111186, "epoch": 661} {"train_loss": -9.938445091247559, "global_step": 111187, "epoch": 661} {"train_loss": -9.959810256958008, "global_step": 111188, "epoch": 661} {"train_loss": -9.94277572631836, "global_step": 111189, "epoch": 661} {"train_loss": -9.741189956665039, "global_step": 111190, "epoch": 661} {"train_loss": -10.070995330810547, "global_step": 111191, "epoch": 661} {"train_loss": -10.36617374420166, "global_step": 111192, "epoch": 661} {"train_loss": -10.066844940185547, "global_step": 111193, "epoch": 661} {"train_loss": -10.291374206542969, "global_step": 111194, "epoch": 661} {"train_loss": -10.361632347106934, "global_step": 111195, "epoch": 661} {"train_loss": -9.876708030700684, "global_step": 111196, "epoch": 661} {"train_loss": -10.020630836486816, "global_step": 111197, "epoch": 661} {"train_loss": -10.221054077148438, "global_step": 111198, "epoch": 661} {"train_loss": -9.955556869506836, "global_step": 111199, "epoch": 661} {"train_loss": -9.825790405273438, "global_step": 111200, "epoch": 661} {"train_loss": -10.140212059020996, "global_step": 111201, "epoch": 661} {"train_loss": -10.367149353027344, "global_step": 111202, "epoch": 661} {"train_loss": -9.947488784790039, "global_step": 111203, "epoch": 661} {"train_loss": -10.048944473266602, "global_step": 111204, "epoch": 661} {"train_loss": -10.270491600036621, "global_step": 111205, "epoch": 661} {"train_loss": -10.165245056152344, "global_step": 111206, "epoch": 661} {"train_loss": -10.119471549987793, "global_step": 111207, "epoch": 661} {"train_loss": -10.065217971801758, "global_step": 111208, "epoch": 661} {"train_loss": -10.214753150939941, "global_step": 111209, "epoch": 661} {"train_loss": -10.287393569946289, "global_step": 111210, "epoch": 661} {"train_loss": -10.113996505737305, "global_step": 111211, "epoch": 661} {"train_loss": -10.281490325927734, "global_step": 111212, "epoch": 661} {"train_loss": -9.992445945739746, "global_step": 111213, "epoch": 661} {"train_loss": -10.17654037475586, "global_step": 111214, "epoch": 661} {"train_loss": -9.966189038185846, "global_step": 111215, "epoch": 661, "val_loss": 211379.703125} {"train_loss": -9.838083267211914, "global_step": 111216, "epoch": 662} {"train_loss": -9.712955474853516, "global_step": 111217, "epoch": 662} {"train_loss": -10.288826942443848, "global_step": 111218, "epoch": 662} {"train_loss": -9.666277885437012, "global_step": 111219, "epoch": 662} {"train_loss": -10.097569465637207, "global_step": 111220, "epoch": 662} {"train_loss": -9.15101146697998, "global_step": 111221, "epoch": 662} {"train_loss": -9.798592567443848, "global_step": 111222, "epoch": 662} {"train_loss": -9.810094833374023, "global_step": 111223, "epoch": 662} {"train_loss": -9.769821166992188, "global_step": 111224, "epoch": 662} {"train_loss": -9.805734634399414, "global_step": 111225, "epoch": 662} {"train_loss": -9.571033477783203, "global_step": 111226, "epoch": 662} {"train_loss": -9.836318969726562, "global_step": 111227, "epoch": 662} {"train_loss": -9.827117919921875, "global_step": 111228, "epoch": 662} {"train_loss": -9.715208053588867, "global_step": 111229, "epoch": 662} {"train_loss": -9.766401290893555, "global_step": 111230, "epoch": 662} {"train_loss": -9.341294288635254, "global_step": 111231, "epoch": 662} {"train_loss": -9.967918395996094, "global_step": 111232, "epoch": 662} {"train_loss": -9.723543167114258, "global_step": 111233, "epoch": 662} {"train_loss": -9.672693252563477, "global_step": 111234, "epoch": 662} {"train_loss": -10.060234069824219, "global_step": 111235, "epoch": 662} {"train_loss": -9.476354598999023, "global_step": 111236, "epoch": 662} {"train_loss": -9.982359886169434, "global_step": 111237, "epoch": 662} {"train_loss": -9.667757034301758, "global_step": 111238, "epoch": 662} {"train_loss": -9.74991226196289, "global_step": 111239, "epoch": 662} {"train_loss": -9.867956161499023, "global_step": 111240, "epoch": 662} {"train_loss": -9.918984413146973, "global_step": 111241, "epoch": 662} {"train_loss": -9.853776931762695, "global_step": 111242, "epoch": 662} {"train_loss": -9.899711608886719, "global_step": 111243, "epoch": 662} {"train_loss": -9.88941764831543, "global_step": 111244, "epoch": 662} {"train_loss": -9.767425537109375, "global_step": 111245, "epoch": 662} {"train_loss": -9.603534698486328, "global_step": 111246, "epoch": 662} {"train_loss": -9.949092864990234, "global_step": 111247, "epoch": 662} {"train_loss": -9.961576461791992, "global_step": 111248, "epoch": 662} {"train_loss": -9.907815933227539, "global_step": 111249, "epoch": 662} {"train_loss": -10.12882137298584, "global_step": 111250, "epoch": 662} {"train_loss": -9.917768478393555, "global_step": 111251, "epoch": 662} {"train_loss": -10.026748657226562, "global_step": 111252, "epoch": 662} {"train_loss": -9.830432891845703, "global_step": 111253, "epoch": 662} {"train_loss": -9.95625114440918, "global_step": 111254, "epoch": 662} {"train_loss": -10.113945007324219, "global_step": 111255, "epoch": 662} {"train_loss": -9.864742279052734, "global_step": 111256, "epoch": 662} {"train_loss": -10.08737564086914, "global_step": 111257, "epoch": 662} {"train_loss": -10.148479461669922, "global_step": 111258, "epoch": 662} {"train_loss": -9.928699493408203, "global_step": 111259, "epoch": 662} {"train_loss": -10.281123161315918, "global_step": 111260, "epoch": 662} {"train_loss": -10.045097351074219, "global_step": 111261, "epoch": 662} {"train_loss": -9.866344451904297, "global_step": 111262, "epoch": 662} {"train_loss": -10.146236419677734, "global_step": 111263, "epoch": 662} {"train_loss": -10.153000831604004, "global_step": 111264, "epoch": 662} {"train_loss": -10.211799621582031, "global_step": 111265, "epoch": 662} {"train_loss": -10.220128059387207, "global_step": 111266, "epoch": 662} {"train_loss": -10.209698677062988, "global_step": 111267, "epoch": 662} {"train_loss": -10.170032501220703, "global_step": 111268, "epoch": 662} {"train_loss": -10.349170684814453, "global_step": 111269, "epoch": 662} {"train_loss": -10.080314636230469, "global_step": 111270, "epoch": 662} {"train_loss": -10.078651428222656, "global_step": 111271, "epoch": 662} {"train_loss": -10.062313079833984, "global_step": 111272, "epoch": 662} {"train_loss": -10.076162338256836, "global_step": 111273, "epoch": 662} {"train_loss": -10.20962905883789, "global_step": 111274, "epoch": 662} {"train_loss": -10.157522201538086, "global_step": 111275, "epoch": 662} {"train_loss": -10.100313186645508, "global_step": 111276, "epoch": 662} {"train_loss": -9.719682693481445, "global_step": 111277, "epoch": 662} {"train_loss": -9.906842231750488, "global_step": 111278, "epoch": 662} {"train_loss": -10.064637184143066, "global_step": 111279, "epoch": 662} {"train_loss": -9.75027084350586, "global_step": 111280, "epoch": 662} {"train_loss": -9.926187515258789, "global_step": 111281, "epoch": 662} {"train_loss": -9.984354972839355, "global_step": 111282, "epoch": 662} {"train_loss": -9.937969207763672, "global_step": 111283, "epoch": 662} {"train_loss": -9.511957168579102, "global_step": 111284, "epoch": 662} {"train_loss": -9.990392684936523, "global_step": 111285, "epoch": 662} {"train_loss": -9.72761058807373, "global_step": 111286, "epoch": 662} {"train_loss": -9.335350036621094, "global_step": 111287, "epoch": 662} {"train_loss": -9.570032119750977, "global_step": 111288, "epoch": 662} {"train_loss": -9.382866859436035, "global_step": 111289, "epoch": 662} {"train_loss": -9.840995788574219, "global_step": 111290, "epoch": 662} {"train_loss": -9.720948219299316, "global_step": 111291, "epoch": 662} {"train_loss": -9.43583869934082, "global_step": 111292, "epoch": 662} {"train_loss": -9.638761520385742, "global_step": 111293, "epoch": 662} {"train_loss": -9.294332504272461, "global_step": 111294, "epoch": 662} {"train_loss": -9.746715545654297, "global_step": 111295, "epoch": 662} {"train_loss": -9.509445190429688, "global_step": 111296, "epoch": 662} {"train_loss": -9.889358520507812, "global_step": 111297, "epoch": 662} {"train_loss": -9.459362030029297, "global_step": 111298, "epoch": 662} {"train_loss": -10.001253128051758, "global_step": 111299, "epoch": 662} {"train_loss": -9.95947265625, "global_step": 111300, "epoch": 662} {"train_loss": -9.927143096923828, "global_step": 111301, "epoch": 662} {"train_loss": -9.642024993896484, "global_step": 111302, "epoch": 662} {"train_loss": -9.783061981201172, "global_step": 111303, "epoch": 662} {"train_loss": -9.772686004638672, "global_step": 111304, "epoch": 662} {"train_loss": -10.144119262695312, "global_step": 111305, "epoch": 662} {"train_loss": -9.688867568969727, "global_step": 111306, "epoch": 662} {"train_loss": -9.742738723754883, "global_step": 111307, "epoch": 662} {"train_loss": -9.865083694458008, "global_step": 111308, "epoch": 662} {"train_loss": -9.901446342468262, "global_step": 111309, "epoch": 662} {"train_loss": -9.70697021484375, "global_step": 111310, "epoch": 662} {"train_loss": -10.021862983703613, "global_step": 111311, "epoch": 662} {"train_loss": -9.942573547363281, "global_step": 111312, "epoch": 662} {"train_loss": -10.035794258117676, "global_step": 111313, "epoch": 662} {"train_loss": -9.863202095031738, "global_step": 111314, "epoch": 662} {"train_loss": -10.134780883789062, "global_step": 111315, "epoch": 662} {"train_loss": -9.961089134216309, "global_step": 111316, "epoch": 662} {"train_loss": -10.08260440826416, "global_step": 111317, "epoch": 662} {"train_loss": -9.86370849609375, "global_step": 111318, "epoch": 662} {"train_loss": -9.725573539733887, "global_step": 111319, "epoch": 662} {"train_loss": -10.082714080810547, "global_step": 111320, "epoch": 662} {"train_loss": -9.960722923278809, "global_step": 111321, "epoch": 662} {"train_loss": -10.002264022827148, "global_step": 111322, "epoch": 662} {"train_loss": -10.127967834472656, "global_step": 111323, "epoch": 662} {"train_loss": -10.173524856567383, "global_step": 111324, "epoch": 662} {"train_loss": -9.955854415893555, "global_step": 111325, "epoch": 662} {"train_loss": -10.022859573364258, "global_step": 111326, "epoch": 662} {"train_loss": -9.89947509765625, "global_step": 111327, "epoch": 662} {"train_loss": -9.715249061584473, "global_step": 111328, "epoch": 662} {"train_loss": -9.760952949523926, "global_step": 111329, "epoch": 662} {"train_loss": -10.082606315612793, "global_step": 111330, "epoch": 662} {"train_loss": -9.57787036895752, "global_step": 111331, "epoch": 662} {"train_loss": -9.930471420288086, "global_step": 111332, "epoch": 662} {"train_loss": -10.012194633483887, "global_step": 111333, "epoch": 662} {"train_loss": -9.814224243164062, "global_step": 111334, "epoch": 662} {"train_loss": -10.105012893676758, "global_step": 111335, "epoch": 662} {"train_loss": -9.883479118347168, "global_step": 111336, "epoch": 662} {"train_loss": -10.276116371154785, "global_step": 111337, "epoch": 662} {"train_loss": -9.851966857910156, "global_step": 111338, "epoch": 662} {"train_loss": -10.003350257873535, "global_step": 111339, "epoch": 662} {"train_loss": -9.99706745147705, "global_step": 111340, "epoch": 662} {"train_loss": -10.001174926757812, "global_step": 111341, "epoch": 662} {"train_loss": -9.647905349731445, "global_step": 111342, "epoch": 662} {"train_loss": -9.681090354919434, "global_step": 111343, "epoch": 662} {"train_loss": -9.595968246459961, "global_step": 111344, "epoch": 662} {"train_loss": -9.762786865234375, "global_step": 111345, "epoch": 662} {"train_loss": -9.663688659667969, "global_step": 111346, "epoch": 662} {"train_loss": -9.731014251708984, "global_step": 111347, "epoch": 662} {"train_loss": -9.998283386230469, "global_step": 111348, "epoch": 662} {"train_loss": -9.716360092163086, "global_step": 111349, "epoch": 662} {"train_loss": -10.028817176818848, "global_step": 111350, "epoch": 662} {"train_loss": -9.689708709716797, "global_step": 111351, "epoch": 662} {"train_loss": -9.914278030395508, "global_step": 111352, "epoch": 662} {"train_loss": -9.38713550567627, "global_step": 111353, "epoch": 662} {"train_loss": -10.168143272399902, "global_step": 111354, "epoch": 662} {"train_loss": -9.8018217086792, "global_step": 111355, "epoch": 662} {"train_loss": -9.95767593383789, "global_step": 111356, "epoch": 662} {"train_loss": -9.910558700561523, "global_step": 111357, "epoch": 662} {"train_loss": -9.919069290161133, "global_step": 111358, "epoch": 662} {"train_loss": -9.93480110168457, "global_step": 111359, "epoch": 662} {"train_loss": -9.976336479187012, "global_step": 111360, "epoch": 662} {"train_loss": -10.10300064086914, "global_step": 111361, "epoch": 662} {"train_loss": -10.225139617919922, "global_step": 111362, "epoch": 662} {"train_loss": -10.121597290039062, "global_step": 111363, "epoch": 662} {"train_loss": -9.937047958374023, "global_step": 111364, "epoch": 662} {"train_loss": -10.05038833618164, "global_step": 111365, "epoch": 662} {"train_loss": -10.299602508544922, "global_step": 111366, "epoch": 662} {"train_loss": -10.340313911437988, "global_step": 111367, "epoch": 662} {"train_loss": -10.104986190795898, "global_step": 111368, "epoch": 662} {"train_loss": -10.170784950256348, "global_step": 111369, "epoch": 662} {"train_loss": -10.204174041748047, "global_step": 111370, "epoch": 662} {"train_loss": -10.127190589904785, "global_step": 111371, "epoch": 662} {"train_loss": -9.918033599853516, "global_step": 111372, "epoch": 662} {"train_loss": -10.261919021606445, "global_step": 111373, "epoch": 662} {"train_loss": -9.973968505859375, "global_step": 111374, "epoch": 662} {"train_loss": -10.177352905273438, "global_step": 111375, "epoch": 662} {"train_loss": -10.11017894744873, "global_step": 111376, "epoch": 662} {"train_loss": -10.060696601867676, "global_step": 111377, "epoch": 662} {"train_loss": -10.071367263793945, "global_step": 111378, "epoch": 662} {"train_loss": -9.921762466430664, "global_step": 111379, "epoch": 662} {"train_loss": -10.04594612121582, "global_step": 111380, "epoch": 662} {"train_loss": -9.813848495483398, "global_step": 111381, "epoch": 662} {"train_loss": -10.155474662780762, "global_step": 111382, "epoch": 662} {"train_loss": -9.906151913461231, "global_step": 111383, "epoch": 662, "val_loss": 210881.921875} {"train_loss": -9.893269538879395, "global_step": 111384, "epoch": 663} {"train_loss": -9.93761157989502, "global_step": 111385, "epoch": 663} {"train_loss": -10.017867088317871, "global_step": 111386, "epoch": 663} {"train_loss": -9.699082374572754, "global_step": 111387, "epoch": 663} {"train_loss": -10.232595443725586, "global_step": 111388, "epoch": 663} {"train_loss": -9.609321594238281, "global_step": 111389, "epoch": 663} {"train_loss": -10.100520133972168, "global_step": 111390, "epoch": 663} {"train_loss": -9.803727149963379, "global_step": 111391, "epoch": 663} {"train_loss": -9.986449241638184, "global_step": 111392, "epoch": 663} {"train_loss": -9.99393081665039, "global_step": 111393, "epoch": 663} {"train_loss": -9.735797882080078, "global_step": 111394, "epoch": 663} {"train_loss": -10.065191268920898, "global_step": 111395, "epoch": 663} {"train_loss": -10.016063690185547, "global_step": 111396, "epoch": 663} {"train_loss": -10.070070266723633, "global_step": 111397, "epoch": 663} {"train_loss": -9.92148208618164, "global_step": 111398, "epoch": 663} {"train_loss": -9.684391021728516, "global_step": 111399, "epoch": 663} {"train_loss": -9.87784481048584, "global_step": 111400, "epoch": 663} {"train_loss": -9.723343849182129, "global_step": 111401, "epoch": 663} {"train_loss": -9.765588760375977, "global_step": 111402, "epoch": 663} {"train_loss": -9.604279518127441, "global_step": 111403, "epoch": 663} {"train_loss": -9.867042541503906, "global_step": 111404, "epoch": 663} {"train_loss": -9.253450393676758, "global_step": 111405, "epoch": 663} {"train_loss": -9.897146224975586, "global_step": 111406, "epoch": 663} {"train_loss": -10.099889755249023, "global_step": 111407, "epoch": 663} {"train_loss": -9.680960655212402, "global_step": 111408, "epoch": 663} {"train_loss": -9.75722885131836, "global_step": 111409, "epoch": 663} {"train_loss": -10.056398391723633, "global_step": 111410, "epoch": 663} {"train_loss": -9.726845741271973, "global_step": 111411, "epoch": 663} {"train_loss": -9.864402770996094, "global_step": 111412, "epoch": 663} {"train_loss": -9.436113357543945, "global_step": 111413, "epoch": 663} {"train_loss": -9.852010726928711, "global_step": 111414, "epoch": 663} {"train_loss": -9.521883010864258, "global_step": 111415, "epoch": 663} {"train_loss": -9.93246841430664, "global_step": 111416, "epoch": 663} {"train_loss": -9.648372650146484, "global_step": 111417, "epoch": 663} {"train_loss": -9.746451377868652, "global_step": 111418, "epoch": 663} {"train_loss": -9.951030731201172, "global_step": 111419, "epoch": 663} {"train_loss": -9.880366325378418, "global_step": 111420, "epoch": 663} {"train_loss": -9.835862159729004, "global_step": 111421, "epoch": 663} {"train_loss": -9.654450416564941, "global_step": 111422, "epoch": 663} {"train_loss": -9.983621597290039, "global_step": 111423, "epoch": 663} {"train_loss": -9.428105354309082, "global_step": 111424, "epoch": 663} {"train_loss": -9.945280075073242, "global_step": 111425, "epoch": 663} {"train_loss": -9.478851318359375, "global_step": 111426, "epoch": 663} {"train_loss": -10.028118133544922, "global_step": 111427, "epoch": 663} {"train_loss": -9.487724304199219, "global_step": 111428, "epoch": 663} {"train_loss": -9.905985832214355, "global_step": 111429, "epoch": 663} {"train_loss": -8.734055519104004, "global_step": 111430, "epoch": 663} {"train_loss": -9.876949310302734, "global_step": 111431, "epoch": 663} {"train_loss": -9.651418685913086, "global_step": 111432, "epoch": 663} {"train_loss": -9.733426094055176, "global_step": 111433, "epoch": 663} {"train_loss": -9.578483581542969, "global_step": 111434, "epoch": 663} {"train_loss": -9.892881393432617, "global_step": 111435, "epoch": 663} {"train_loss": -9.773519515991211, "global_step": 111436, "epoch": 663} {"train_loss": -9.846197128295898, "global_step": 111437, "epoch": 663} {"train_loss": -9.953392028808594, "global_step": 111438, "epoch": 663} {"train_loss": -9.686734199523926, "global_step": 111439, "epoch": 663} {"train_loss": -9.742572784423828, "global_step": 111440, "epoch": 663} {"train_loss": -9.781501770019531, "global_step": 111441, "epoch": 663} {"train_loss": -10.030096054077148, "global_step": 111442, "epoch": 663} {"train_loss": -10.015592575073242, "global_step": 111443, "epoch": 663} {"train_loss": -10.08342170715332, "global_step": 111444, "epoch": 663} {"train_loss": -9.886557579040527, "global_step": 111445, "epoch": 663} {"train_loss": -9.943380355834961, "global_step": 111446, "epoch": 663} {"train_loss": -10.119710922241211, "global_step": 111447, "epoch": 663} {"train_loss": -9.940231323242188, "global_step": 111448, "epoch": 663} {"train_loss": -10.0267972946167, "global_step": 111449, "epoch": 663} {"train_loss": -10.218208312988281, "global_step": 111450, "epoch": 663} {"train_loss": -10.118682861328125, "global_step": 111451, "epoch": 663} {"train_loss": -10.1796875, "global_step": 111452, "epoch": 663} {"train_loss": -10.18470573425293, "global_step": 111453, "epoch": 663} {"train_loss": -10.100794792175293, "global_step": 111454, "epoch": 663} {"train_loss": -10.226448059082031, "global_step": 111455, "epoch": 663} {"train_loss": -9.983108520507812, "global_step": 111456, "epoch": 663} {"train_loss": -10.298778533935547, "global_step": 111457, "epoch": 663} {"train_loss": -9.966304779052734, "global_step": 111458, "epoch": 663} {"train_loss": -10.072336196899414, "global_step": 111459, "epoch": 663} {"train_loss": -10.204444885253906, "global_step": 111460, "epoch": 663} {"train_loss": -10.259681701660156, "global_step": 111461, "epoch": 663} {"train_loss": -10.408012390136719, "global_step": 111462, "epoch": 663} {"train_loss": -9.635866165161133, "global_step": 111463, "epoch": 663} {"train_loss": -10.060952186584473, "global_step": 111464, "epoch": 663} {"train_loss": -9.807205200195312, "global_step": 111465, "epoch": 663} {"train_loss": -9.947208404541016, "global_step": 111466, "epoch": 663} {"train_loss": -9.632471084594727, "global_step": 111467, "epoch": 663} {"train_loss": -9.837728500366211, "global_step": 111468, "epoch": 663} {"train_loss": -9.2437744140625, "global_step": 111469, "epoch": 663} {"train_loss": -9.470481872558594, "global_step": 111470, "epoch": 663} {"train_loss": -9.979555130004883, "global_step": 111471, "epoch": 663} {"train_loss": -9.777236938476562, "global_step": 111472, "epoch": 663} {"train_loss": -9.490843772888184, "global_step": 111473, "epoch": 663} {"train_loss": -9.94373893737793, "global_step": 111474, "epoch": 663} {"train_loss": -9.587671279907227, "global_step": 111475, "epoch": 663} {"train_loss": -9.39579963684082, "global_step": 111476, "epoch": 663} {"train_loss": -9.990997314453125, "global_step": 111477, "epoch": 663} {"train_loss": -9.280599594116211, "global_step": 111478, "epoch": 663} {"train_loss": -10.103482246398926, "global_step": 111479, "epoch": 663} {"train_loss": -9.28937816619873, "global_step": 111480, "epoch": 663} {"train_loss": -9.801827430725098, "global_step": 111481, "epoch": 663} {"train_loss": -9.640190124511719, "global_step": 111482, "epoch": 663} {"train_loss": -10.058534622192383, "global_step": 111483, "epoch": 663} {"train_loss": -9.590896606445312, "global_step": 111484, "epoch": 663} {"train_loss": -10.027466773986816, "global_step": 111485, "epoch": 663} {"train_loss": -9.598978042602539, "global_step": 111486, "epoch": 663} {"train_loss": -9.858972549438477, "global_step": 111487, "epoch": 663} {"train_loss": -9.738103866577148, "global_step": 111488, "epoch": 663} {"train_loss": -10.124171257019043, "global_step": 111489, "epoch": 663} {"train_loss": -9.694814682006836, "global_step": 111490, "epoch": 663} {"train_loss": -10.143985748291016, "global_step": 111491, "epoch": 663} {"train_loss": -9.841837882995605, "global_step": 111492, "epoch": 663} {"train_loss": -9.783148765563965, "global_step": 111493, "epoch": 663} {"train_loss": -9.97249984741211, "global_step": 111494, "epoch": 663} {"train_loss": -9.87812614440918, "global_step": 111495, "epoch": 663} {"train_loss": -10.048419952392578, "global_step": 111496, "epoch": 663} {"train_loss": -10.089366912841797, "global_step": 111497, "epoch": 663} {"train_loss": -10.016633987426758, "global_step": 111498, "epoch": 663} {"train_loss": -10.046125411987305, "global_step": 111499, "epoch": 663} {"train_loss": -9.956219673156738, "global_step": 111500, "epoch": 663} {"train_loss": -9.694270133972168, "global_step": 111501, "epoch": 663} {"train_loss": -10.144329071044922, "global_step": 111502, "epoch": 663} {"train_loss": -9.801279067993164, "global_step": 111503, "epoch": 663} {"train_loss": -9.825479507446289, "global_step": 111504, "epoch": 663} {"train_loss": -9.850442886352539, "global_step": 111505, "epoch": 663} {"train_loss": -10.047130584716797, "global_step": 111506, "epoch": 663} {"train_loss": -10.145366668701172, "global_step": 111507, "epoch": 663} {"train_loss": -9.853984832763672, "global_step": 111508, "epoch": 663} {"train_loss": -9.877618789672852, "global_step": 111509, "epoch": 663} {"train_loss": -9.850992202758789, "global_step": 111510, "epoch": 663} {"train_loss": -10.024062156677246, "global_step": 111511, "epoch": 663} {"train_loss": -10.101404190063477, "global_step": 111512, "epoch": 663} {"train_loss": -10.155790328979492, "global_step": 111513, "epoch": 663} {"train_loss": -9.844656944274902, "global_step": 111514, "epoch": 663} {"train_loss": -10.151056289672852, "global_step": 111515, "epoch": 663} {"train_loss": -9.986626625061035, "global_step": 111516, "epoch": 663} {"train_loss": -9.759990692138672, "global_step": 111517, "epoch": 663} {"train_loss": -9.845486640930176, "global_step": 111518, "epoch": 663} {"train_loss": -10.145179748535156, "global_step": 111519, "epoch": 663} {"train_loss": -9.90831470489502, "global_step": 111520, "epoch": 663} {"train_loss": -9.964399337768555, "global_step": 111521, "epoch": 663} {"train_loss": -10.105995178222656, "global_step": 111522, "epoch": 663} {"train_loss": -10.12012004852295, "global_step": 111523, "epoch": 663} {"train_loss": -10.474750518798828, "global_step": 111524, "epoch": 663} {"train_loss": -10.171245574951172, "global_step": 111525, "epoch": 663} {"train_loss": -10.005722045898438, "global_step": 111526, "epoch": 663} {"train_loss": -10.076276779174805, "global_step": 111527, "epoch": 663} {"train_loss": -10.119054794311523, "global_step": 111528, "epoch": 663} {"train_loss": -10.210542678833008, "global_step": 111529, "epoch": 663} {"train_loss": -10.088876724243164, "global_step": 111530, "epoch": 663} {"train_loss": -10.084320068359375, "global_step": 111531, "epoch": 663} {"train_loss": -9.966056823730469, "global_step": 111532, "epoch": 663} {"train_loss": -10.243958473205566, "global_step": 111533, "epoch": 663} {"train_loss": -9.841094970703125, "global_step": 111534, "epoch": 663} {"train_loss": -10.043672561645508, "global_step": 111535, "epoch": 663} {"train_loss": -10.028162956237793, "global_step": 111536, "epoch": 663} {"train_loss": -10.280200004577637, "global_step": 111537, "epoch": 663} {"train_loss": -9.99554443359375, "global_step": 111538, "epoch": 663} {"train_loss": -10.104341506958008, "global_step": 111539, "epoch": 663} {"train_loss": -9.964378356933594, "global_step": 111540, "epoch": 663} {"train_loss": -9.947949409484863, "global_step": 111541, "epoch": 663} {"train_loss": -10.198681831359863, "global_step": 111542, "epoch": 663} {"train_loss": -9.499381065368652, "global_step": 111543, "epoch": 663} {"train_loss": -9.863016128540039, "global_step": 111544, "epoch": 663} {"train_loss": -9.298470497131348, "global_step": 111545, "epoch": 663} {"train_loss": -9.865097999572754, "global_step": 111546, "epoch": 663} {"train_loss": -9.998579978942871, "global_step": 111547, "epoch": 663} {"train_loss": -9.276369094848633, "global_step": 111548, "epoch": 663} {"train_loss": -10.008554458618164, "global_step": 111549, "epoch": 663} {"train_loss": -9.560762405395508, "global_step": 111550, "epoch": 663} {"train_loss": -9.886596452622186, "global_step": 111551, "epoch": 663, "val_loss": 207893.34375} {"train_loss": -10.149755477905273, "global_step": 111552, "epoch": 664} {"train_loss": -9.505605697631836, "global_step": 111553, "epoch": 664} {"train_loss": -10.012310028076172, "global_step": 111554, "epoch": 664} {"train_loss": -9.789422988891602, "global_step": 111555, "epoch": 664} {"train_loss": -9.819284439086914, "global_step": 111556, "epoch": 664} {"train_loss": -10.149433135986328, "global_step": 111557, "epoch": 664} {"train_loss": -9.665593147277832, "global_step": 111558, "epoch": 664} {"train_loss": -9.842304229736328, "global_step": 111559, "epoch": 664} {"train_loss": -9.758594512939453, "global_step": 111560, "epoch": 664} {"train_loss": -9.79735279083252, "global_step": 111561, "epoch": 664} {"train_loss": -9.846070289611816, "global_step": 111562, "epoch": 664} {"train_loss": -9.769882202148438, "global_step": 111563, "epoch": 664} {"train_loss": -9.889528274536133, "global_step": 111564, "epoch": 664} {"train_loss": -10.027120590209961, "global_step": 111565, "epoch": 664} {"train_loss": -9.903017044067383, "global_step": 111566, "epoch": 664} {"train_loss": -9.835013389587402, "global_step": 111567, "epoch": 664} {"train_loss": -9.614341735839844, "global_step": 111568, "epoch": 664} {"train_loss": -9.806353569030762, "global_step": 111569, "epoch": 664} {"train_loss": -9.69906997680664, "global_step": 111570, "epoch": 664} {"train_loss": -9.93858814239502, "global_step": 111571, "epoch": 664} {"train_loss": -9.844988822937012, "global_step": 111572, "epoch": 664} {"train_loss": -9.966472625732422, "global_step": 111573, "epoch": 664} {"train_loss": -10.006734848022461, "global_step": 111574, "epoch": 664} {"train_loss": -9.806818962097168, "global_step": 111575, "epoch": 664} {"train_loss": -10.117448806762695, "global_step": 111576, "epoch": 664} {"train_loss": -9.998296737670898, "global_step": 111577, "epoch": 664} {"train_loss": -9.953065872192383, "global_step": 111578, "epoch": 664} {"train_loss": -9.980674743652344, "global_step": 111579, "epoch": 664} {"train_loss": -10.121146202087402, "global_step": 111580, "epoch": 664} {"train_loss": -9.991670608520508, "global_step": 111581, "epoch": 664} {"train_loss": -9.98991584777832, "global_step": 111582, "epoch": 664} {"train_loss": -9.815632820129395, "global_step": 111583, "epoch": 664} {"train_loss": -9.795793533325195, "global_step": 111584, "epoch": 664} {"train_loss": -10.25340461730957, "global_step": 111585, "epoch": 664} {"train_loss": -10.140812873840332, "global_step": 111586, "epoch": 664} {"train_loss": -9.866546630859375, "global_step": 111587, "epoch": 664} {"train_loss": -10.057535171508789, "global_step": 111588, "epoch": 664} {"train_loss": -10.028307914733887, "global_step": 111589, "epoch": 664} {"train_loss": -9.914539337158203, "global_step": 111590, "epoch": 664} {"train_loss": -9.78376293182373, "global_step": 111591, "epoch": 664} {"train_loss": -9.825325012207031, "global_step": 111592, "epoch": 664} {"train_loss": -9.99297046661377, "global_step": 111593, "epoch": 664} {"train_loss": -9.80493450164795, "global_step": 111594, "epoch": 664} {"train_loss": -9.762380599975586, "global_step": 111595, "epoch": 664} {"train_loss": -9.631053924560547, "global_step": 111596, "epoch": 664} {"train_loss": -9.820857048034668, "global_step": 111597, "epoch": 664} {"train_loss": -9.781402587890625, "global_step": 111598, "epoch": 664} {"train_loss": -9.7511568069458, "global_step": 111599, "epoch": 664} {"train_loss": -10.093557357788086, "global_step": 111600, "epoch": 664} {"train_loss": -9.909570693969727, "global_step": 111601, "epoch": 664} {"train_loss": -9.874088287353516, "global_step": 111602, "epoch": 664} {"train_loss": -9.663228988647461, "global_step": 111603, "epoch": 664} {"train_loss": -9.877514839172363, "global_step": 111604, "epoch": 664} {"train_loss": -10.134441375732422, "global_step": 111605, "epoch": 664} {"train_loss": -9.952674865722656, "global_step": 111606, "epoch": 664} {"train_loss": -9.667627334594727, "global_step": 111607, "epoch": 664} {"train_loss": -10.046269416809082, "global_step": 111608, "epoch": 664} {"train_loss": -9.727840423583984, "global_step": 111609, "epoch": 664} {"train_loss": -9.834405899047852, "global_step": 111610, "epoch": 664} {"train_loss": -9.66693115234375, "global_step": 111611, "epoch": 664} {"train_loss": -9.979019165039062, "global_step": 111612, "epoch": 664} {"train_loss": -9.41425895690918, "global_step": 111613, "epoch": 664} {"train_loss": -10.017593383789062, "global_step": 111614, "epoch": 664} {"train_loss": -9.673359870910645, "global_step": 111615, "epoch": 664} {"train_loss": -9.836962699890137, "global_step": 111616, "epoch": 664} {"train_loss": -9.514307022094727, "global_step": 111617, "epoch": 664} {"train_loss": -9.888654708862305, "global_step": 111618, "epoch": 664} {"train_loss": -9.320176124572754, "global_step": 111619, "epoch": 664} {"train_loss": -10.256946563720703, "global_step": 111620, "epoch": 664} {"train_loss": -9.9415922164917, "global_step": 111621, "epoch": 664} {"train_loss": -9.750287055969238, "global_step": 111622, "epoch": 664} {"train_loss": -10.136655807495117, "global_step": 111623, "epoch": 664} {"train_loss": -10.036510467529297, "global_step": 111624, "epoch": 664} {"train_loss": -10.080968856811523, "global_step": 111625, "epoch": 664} {"train_loss": -9.789815902709961, "global_step": 111626, "epoch": 664} {"train_loss": -10.095888137817383, "global_step": 111627, "epoch": 664} {"train_loss": -10.034207344055176, "global_step": 111628, "epoch": 664} {"train_loss": -10.151017189025879, "global_step": 111629, "epoch": 664} {"train_loss": -9.918333053588867, "global_step": 111630, "epoch": 664} {"train_loss": -10.069395065307617, "global_step": 111631, "epoch": 664} {"train_loss": -10.104902267456055, "global_step": 111632, "epoch": 664} {"train_loss": -10.042237281799316, "global_step": 111633, "epoch": 664} {"train_loss": -10.140064239501953, "global_step": 111634, "epoch": 664} {"train_loss": -10.299482345581055, "global_step": 111635, "epoch": 664} {"train_loss": -10.087032318115234, "global_step": 111636, "epoch": 664} {"train_loss": -10.429498672485352, "global_step": 111637, "epoch": 664} {"train_loss": -9.983071327209473, "global_step": 111638, "epoch": 664} {"train_loss": -9.753087043762207, "global_step": 111639, "epoch": 664} {"train_loss": -10.178986549377441, "global_step": 111640, "epoch": 664} {"train_loss": -9.879331588745117, "global_step": 111641, "epoch": 664} {"train_loss": -10.061090469360352, "global_step": 111642, "epoch": 664} {"train_loss": -10.198395729064941, "global_step": 111643, "epoch": 664} {"train_loss": -9.806488037109375, "global_step": 111644, "epoch": 664} {"train_loss": -10.306981086730957, "global_step": 111645, "epoch": 664} {"train_loss": -9.929434776306152, "global_step": 111646, "epoch": 664} {"train_loss": -10.123151779174805, "global_step": 111647, "epoch": 664} {"train_loss": -10.179019927978516, "global_step": 111648, "epoch": 664} {"train_loss": -10.085161209106445, "global_step": 111649, "epoch": 664} {"train_loss": -9.828941345214844, "global_step": 111650, "epoch": 664} {"train_loss": -10.301365852355957, "global_step": 111651, "epoch": 664} {"train_loss": -10.102128028869629, "global_step": 111652, "epoch": 664} {"train_loss": -10.225647926330566, "global_step": 111653, "epoch": 664} {"train_loss": -10.171409606933594, "global_step": 111654, "epoch": 664} {"train_loss": -9.826231002807617, "global_step": 111655, "epoch": 664} {"train_loss": -10.082867622375488, "global_step": 111656, "epoch": 664} {"train_loss": -10.196247100830078, "global_step": 111657, "epoch": 664} {"train_loss": -9.8717041015625, "global_step": 111658, "epoch": 664} {"train_loss": -10.21302318572998, "global_step": 111659, "epoch": 664} {"train_loss": -9.833640098571777, "global_step": 111660, "epoch": 664} {"train_loss": -10.136832237243652, "global_step": 111661, "epoch": 664} {"train_loss": -10.130169868469238, "global_step": 111662, "epoch": 664} {"train_loss": -9.936407089233398, "global_step": 111663, "epoch": 664} {"train_loss": -10.144270896911621, "global_step": 111664, "epoch": 664} {"train_loss": -9.966976165771484, "global_step": 111665, "epoch": 664} {"train_loss": -9.843356132507324, "global_step": 111666, "epoch": 664} {"train_loss": -10.220344543457031, "global_step": 111667, "epoch": 664} {"train_loss": -10.10049819946289, "global_step": 111668, "epoch": 664} {"train_loss": -10.364598274230957, "global_step": 111669, "epoch": 664} {"train_loss": -10.059492111206055, "global_step": 111670, "epoch": 664} {"train_loss": -9.917448997497559, "global_step": 111671, "epoch": 664} {"train_loss": -9.873241424560547, "global_step": 111672, "epoch": 664} {"train_loss": -9.84769058227539, "global_step": 111673, "epoch": 664} {"train_loss": -9.458208084106445, "global_step": 111674, "epoch": 664} {"train_loss": -9.380149841308594, "global_step": 111675, "epoch": 664} {"train_loss": -9.70773983001709, "global_step": 111676, "epoch": 664} {"train_loss": -9.869234085083008, "global_step": 111677, "epoch": 664} {"train_loss": -9.287683486938477, "global_step": 111678, "epoch": 664} {"train_loss": -9.893270492553711, "global_step": 111679, "epoch": 664} {"train_loss": -9.727462768554688, "global_step": 111680, "epoch": 664} {"train_loss": -9.654560089111328, "global_step": 111681, "epoch": 664} {"train_loss": -9.829841613769531, "global_step": 111682, "epoch": 664} {"train_loss": -9.504575729370117, "global_step": 111683, "epoch": 664} {"train_loss": -9.663190841674805, "global_step": 111684, "epoch": 664} {"train_loss": -9.521596908569336, "global_step": 111685, "epoch": 664} {"train_loss": -9.628814697265625, "global_step": 111686, "epoch": 664} {"train_loss": -9.694504737854004, "global_step": 111687, "epoch": 664} {"train_loss": -9.835762977600098, "global_step": 111688, "epoch": 664} {"train_loss": -9.710052490234375, "global_step": 111689, "epoch": 664} {"train_loss": -9.878360748291016, "global_step": 111690, "epoch": 664} {"train_loss": -9.784188270568848, "global_step": 111691, "epoch": 664} {"train_loss": -9.94023609161377, "global_step": 111692, "epoch": 664} {"train_loss": -9.694814682006836, "global_step": 111693, "epoch": 664} {"train_loss": -10.097146987915039, "global_step": 111694, "epoch": 664} {"train_loss": -9.897714614868164, "global_step": 111695, "epoch": 664} {"train_loss": -9.648992538452148, "global_step": 111696, "epoch": 664} {"train_loss": -9.657052993774414, "global_step": 111697, "epoch": 664} {"train_loss": -9.833442687988281, "global_step": 111698, "epoch": 664} {"train_loss": -9.383211135864258, "global_step": 111699, "epoch": 664} {"train_loss": -9.87226676940918, "global_step": 111700, "epoch": 664} {"train_loss": -9.580331802368164, "global_step": 111701, "epoch": 664} {"train_loss": -9.561566352844238, "global_step": 111702, "epoch": 664} {"train_loss": -9.443597793579102, "global_step": 111703, "epoch": 664} {"train_loss": -9.810441970825195, "global_step": 111704, "epoch": 664} {"train_loss": -9.645023345947266, "global_step": 111705, "epoch": 664} {"train_loss": -9.894603729248047, "global_step": 111706, "epoch": 664} {"train_loss": -9.938922882080078, "global_step": 111707, "epoch": 664} {"train_loss": -9.732820510864258, "global_step": 111708, "epoch": 664} {"train_loss": -9.884683609008789, "global_step": 111709, "epoch": 664} {"train_loss": -9.743057250976562, "global_step": 111710, "epoch": 664} {"train_loss": -9.949089050292969, "global_step": 111711, "epoch": 664} {"train_loss": -9.575343132019043, "global_step": 111712, "epoch": 664} {"train_loss": -9.854227066040039, "global_step": 111713, "epoch": 664} {"train_loss": -9.882723808288574, "global_step": 111714, "epoch": 664} {"train_loss": -9.843847274780273, "global_step": 111715, "epoch": 664} {"train_loss": -9.955131530761719, "global_step": 111716, "epoch": 664} {"train_loss": -10.10893440246582, "global_step": 111717, "epoch": 664} {"train_loss": -9.96371078491211, "global_step": 111718, "epoch": 664} {"train_loss": -9.89345858210609, "global_step": 111719, "epoch": 664, "val_loss": 213296.234375} {"train_loss": -10.08940315246582, "global_step": 111720, "epoch": 665} {"train_loss": -10.037153244018555, "global_step": 111721, "epoch": 665} {"train_loss": -10.010388374328613, "global_step": 111722, "epoch": 665} {"train_loss": -10.193613052368164, "global_step": 111723, "epoch": 665} {"train_loss": -9.970333099365234, "global_step": 111724, "epoch": 665} {"train_loss": -10.26473617553711, "global_step": 111725, "epoch": 665} {"train_loss": -10.328872680664062, "global_step": 111726, "epoch": 665} {"train_loss": -10.10901165008545, "global_step": 111727, "epoch": 665} {"train_loss": -10.143238067626953, "global_step": 111728, "epoch": 665} {"train_loss": -9.884779930114746, "global_step": 111729, "epoch": 665} {"train_loss": -10.29109001159668, "global_step": 111730, "epoch": 665} {"train_loss": -10.280464172363281, "global_step": 111731, "epoch": 665} {"train_loss": -9.986028671264648, "global_step": 111732, "epoch": 665} {"train_loss": -10.289928436279297, "global_step": 111733, "epoch": 665} {"train_loss": -9.887689590454102, "global_step": 111734, "epoch": 665} {"train_loss": -10.121774673461914, "global_step": 111735, "epoch": 665} {"train_loss": -10.006782531738281, "global_step": 111736, "epoch": 665} {"train_loss": -10.277120590209961, "global_step": 111737, "epoch": 665} {"train_loss": -9.959643363952637, "global_step": 111738, "epoch": 665} {"train_loss": -10.170488357543945, "global_step": 111739, "epoch": 665} {"train_loss": -10.081476211547852, "global_step": 111740, "epoch": 665} {"train_loss": -9.893028259277344, "global_step": 111741, "epoch": 665} {"train_loss": -9.833101272583008, "global_step": 111742, "epoch": 665} {"train_loss": -10.26312255859375, "global_step": 111743, "epoch": 665} {"train_loss": -10.084676742553711, "global_step": 111744, "epoch": 665} {"train_loss": -9.685131072998047, "global_step": 111745, "epoch": 665} {"train_loss": -10.10894775390625, "global_step": 111746, "epoch": 665} {"train_loss": -10.058123588562012, "global_step": 111747, "epoch": 665} {"train_loss": -10.22380256652832, "global_step": 111748, "epoch": 665} {"train_loss": -9.986427307128906, "global_step": 111749, "epoch": 665} {"train_loss": -9.976088523864746, "global_step": 111750, "epoch": 665} {"train_loss": -9.72317123413086, "global_step": 111751, "epoch": 665} {"train_loss": -9.427436828613281, "global_step": 111752, "epoch": 665} {"train_loss": -9.978607177734375, "global_step": 111753, "epoch": 665} {"train_loss": -9.10169792175293, "global_step": 111754, "epoch": 665} {"train_loss": -9.867650032043457, "global_step": 111755, "epoch": 665} {"train_loss": -9.361055374145508, "global_step": 111756, "epoch": 665} {"train_loss": -9.789863586425781, "global_step": 111757, "epoch": 665} {"train_loss": -9.765351295471191, "global_step": 111758, "epoch": 665} {"train_loss": -9.930681228637695, "global_step": 111759, "epoch": 665} {"train_loss": -10.016883850097656, "global_step": 111760, "epoch": 665} {"train_loss": -9.676702499389648, "global_step": 111761, "epoch": 665} {"train_loss": -10.165925979614258, "global_step": 111762, "epoch": 665} {"train_loss": -9.841182708740234, "global_step": 111763, "epoch": 665} {"train_loss": -9.889206886291504, "global_step": 111764, "epoch": 665} {"train_loss": -10.102697372436523, "global_step": 111765, "epoch": 665} {"train_loss": -10.061983108520508, "global_step": 111766, "epoch": 665} {"train_loss": -10.063187599182129, "global_step": 111767, "epoch": 665} {"train_loss": -10.169294357299805, "global_step": 111768, "epoch": 665} {"train_loss": -9.923221588134766, "global_step": 111769, "epoch": 665} {"train_loss": -10.068591117858887, "global_step": 111770, "epoch": 665} {"train_loss": -10.078922271728516, "global_step": 111771, "epoch": 665} {"train_loss": -10.007685661315918, "global_step": 111772, "epoch": 665} {"train_loss": -10.206298828125, "global_step": 111773, "epoch": 665} {"train_loss": -10.025489807128906, "global_step": 111774, "epoch": 665} {"train_loss": -10.092608451843262, "global_step": 111775, "epoch": 665} {"train_loss": -10.137035369873047, "global_step": 111776, "epoch": 665} {"train_loss": -9.787796020507812, "global_step": 111777, "epoch": 665} {"train_loss": -10.127435684204102, "global_step": 111778, "epoch": 665} {"train_loss": -10.085289001464844, "global_step": 111779, "epoch": 665} {"train_loss": -10.10867691040039, "global_step": 111780, "epoch": 665} {"train_loss": -9.917463302612305, "global_step": 111781, "epoch": 665} {"train_loss": -9.990348815917969, "global_step": 111782, "epoch": 665} {"train_loss": -10.056146621704102, "global_step": 111783, "epoch": 665} {"train_loss": -9.846818923950195, "global_step": 111784, "epoch": 665} {"train_loss": -10.130136489868164, "global_step": 111785, "epoch": 665} {"train_loss": -9.976617813110352, "global_step": 111786, "epoch": 665} {"train_loss": -10.183944702148438, "global_step": 111787, "epoch": 665} {"train_loss": -9.981096267700195, "global_step": 111788, "epoch": 665} {"train_loss": -10.229748725891113, "global_step": 111789, "epoch": 665} {"train_loss": -10.159740447998047, "global_step": 111790, "epoch": 665} {"train_loss": -10.170276641845703, "global_step": 111791, "epoch": 665} {"train_loss": -9.855146408081055, "global_step": 111792, "epoch": 665} {"train_loss": -9.785762786865234, "global_step": 111793, "epoch": 665} {"train_loss": -9.720483779907227, "global_step": 111794, "epoch": 665} {"train_loss": -9.612882614135742, "global_step": 111795, "epoch": 665} {"train_loss": -10.404047012329102, "global_step": 111796, "epoch": 665} {"train_loss": -9.799240112304688, "global_step": 111797, "epoch": 665} {"train_loss": -10.040270805358887, "global_step": 111798, "epoch": 665} {"train_loss": -10.293862342834473, "global_step": 111799, "epoch": 665} {"train_loss": -9.941457748413086, "global_step": 111800, "epoch": 665} {"train_loss": -10.033370971679688, "global_step": 111801, "epoch": 665} {"train_loss": -9.985507011413574, "global_step": 111802, "epoch": 665} {"train_loss": -9.761186599731445, "global_step": 111803, "epoch": 665} {"train_loss": -10.059557914733887, "global_step": 111804, "epoch": 665} {"train_loss": -10.221893310546875, "global_step": 111805, "epoch": 665} {"train_loss": -10.155380249023438, "global_step": 111806, "epoch": 665} {"train_loss": -10.33288860321045, "global_step": 111807, "epoch": 665} {"train_loss": -10.109006881713867, "global_step": 111808, "epoch": 665} {"train_loss": -10.023801803588867, "global_step": 111809, "epoch": 665} {"train_loss": -10.122232437133789, "global_step": 111810, "epoch": 665} {"train_loss": -10.368391036987305, "global_step": 111811, "epoch": 665} {"train_loss": -10.128599166870117, "global_step": 111812, "epoch": 665} {"train_loss": -10.241464614868164, "global_step": 111813, "epoch": 665} {"train_loss": -10.040091514587402, "global_step": 111814, "epoch": 665} {"train_loss": -10.01279354095459, "global_step": 111815, "epoch": 665} {"train_loss": -10.151811599731445, "global_step": 111816, "epoch": 665} {"train_loss": -10.060964584350586, "global_step": 111817, "epoch": 665} {"train_loss": -10.30797004699707, "global_step": 111818, "epoch": 665} {"train_loss": -10.08045768737793, "global_step": 111819, "epoch": 665} {"train_loss": -10.022209167480469, "global_step": 111820, "epoch": 665} {"train_loss": -10.002307891845703, "global_step": 111821, "epoch": 665} {"train_loss": -10.0360107421875, "global_step": 111822, "epoch": 665} {"train_loss": -10.041308403015137, "global_step": 111823, "epoch": 665} {"train_loss": -9.880643844604492, "global_step": 111824, "epoch": 665} {"train_loss": -9.94401741027832, "global_step": 111825, "epoch": 665} {"train_loss": -9.867536544799805, "global_step": 111826, "epoch": 665} {"train_loss": -9.870997428894043, "global_step": 111827, "epoch": 665} {"train_loss": -9.929253578186035, "global_step": 111828, "epoch": 665} {"train_loss": -9.725218772888184, "global_step": 111829, "epoch": 665} {"train_loss": -10.01915168762207, "global_step": 111830, "epoch": 665} {"train_loss": -9.870197296142578, "global_step": 111831, "epoch": 665} {"train_loss": -10.220096588134766, "global_step": 111832, "epoch": 665} {"train_loss": -9.988884925842285, "global_step": 111833, "epoch": 665} {"train_loss": -10.275223731994629, "global_step": 111834, "epoch": 665} {"train_loss": -9.834135055541992, "global_step": 111835, "epoch": 665} {"train_loss": -9.685981750488281, "global_step": 111836, "epoch": 665} {"train_loss": -9.952590942382812, "global_step": 111837, "epoch": 665} {"train_loss": -9.831328392028809, "global_step": 111838, "epoch": 665} {"train_loss": -10.038395881652832, "global_step": 111839, "epoch": 665} {"train_loss": -10.081643104553223, "global_step": 111840, "epoch": 665} {"train_loss": -9.712541580200195, "global_step": 111841, "epoch": 665} {"train_loss": -10.237942695617676, "global_step": 111842, "epoch": 665} {"train_loss": -9.781608581542969, "global_step": 111843, "epoch": 665} {"train_loss": -9.835212707519531, "global_step": 111844, "epoch": 665} {"train_loss": -9.906858444213867, "global_step": 111845, "epoch": 665} {"train_loss": -9.925788879394531, "global_step": 111846, "epoch": 665} {"train_loss": -9.592235565185547, "global_step": 111847, "epoch": 665} {"train_loss": -9.651702880859375, "global_step": 111848, "epoch": 665} {"train_loss": -9.920794486999512, "global_step": 111849, "epoch": 665} {"train_loss": -9.863245010375977, "global_step": 111850, "epoch": 665} {"train_loss": -9.898604393005371, "global_step": 111851, "epoch": 665} {"train_loss": -9.488609313964844, "global_step": 111852, "epoch": 665} {"train_loss": -10.134468078613281, "global_step": 111853, "epoch": 665} {"train_loss": -9.494539260864258, "global_step": 111854, "epoch": 665} {"train_loss": -9.938596725463867, "global_step": 111855, "epoch": 665} {"train_loss": -9.51726245880127, "global_step": 111856, "epoch": 665} {"train_loss": -9.718332290649414, "global_step": 111857, "epoch": 665} {"train_loss": -9.846226692199707, "global_step": 111858, "epoch": 665} {"train_loss": -9.921300888061523, "global_step": 111859, "epoch": 665} {"train_loss": -9.612068176269531, "global_step": 111860, "epoch": 665} {"train_loss": -9.700037956237793, "global_step": 111861, "epoch": 665} {"train_loss": -9.712445259094238, "global_step": 111862, "epoch": 665} {"train_loss": -9.880207061767578, "global_step": 111863, "epoch": 665} {"train_loss": -9.684626579284668, "global_step": 111864, "epoch": 665} {"train_loss": -9.790102005004883, "global_step": 111865, "epoch": 665} {"train_loss": -9.976101875305176, "global_step": 111866, "epoch": 665} {"train_loss": -9.563194274902344, "global_step": 111867, "epoch": 665} {"train_loss": -10.007913589477539, "global_step": 111868, "epoch": 665} {"train_loss": -9.87232780456543, "global_step": 111869, "epoch": 665} {"train_loss": -9.760108947753906, "global_step": 111870, "epoch": 665} {"train_loss": -9.65001392364502, "global_step": 111871, "epoch": 665} {"train_loss": -9.877233505249023, "global_step": 111872, "epoch": 665} {"train_loss": -9.948546409606934, "global_step": 111873, "epoch": 665} {"train_loss": -9.829338073730469, "global_step": 111874, "epoch": 665} {"train_loss": -9.763644218444824, "global_step": 111875, "epoch": 665} {"train_loss": -9.862136840820312, "global_step": 111876, "epoch": 665} {"train_loss": -9.95781421661377, "global_step": 111877, "epoch": 665} {"train_loss": -9.852757453918457, "global_step": 111878, "epoch": 665} {"train_loss": -9.864112854003906, "global_step": 111879, "epoch": 665} {"train_loss": -10.06959342956543, "global_step": 111880, "epoch": 665} {"train_loss": -9.768148422241211, "global_step": 111881, "epoch": 665} {"train_loss": -9.94576644897461, "global_step": 111882, "epoch": 665} {"train_loss": -10.111764907836914, "global_step": 111883, "epoch": 665} {"train_loss": -9.98946762084961, "global_step": 111884, "epoch": 665} {"train_loss": -9.98885726928711, "global_step": 111885, "epoch": 665} {"train_loss": -9.996232986450195, "global_step": 111886, "epoch": 665} {"train_loss": -9.96296645346142, "global_step": 111887, "epoch": 665, "val_loss": 211669.0625, "train_action_mse_error": 2.377131462097168} {"train_loss": -9.948101043701172, "global_step": 111888, "epoch": 666} {"train_loss": -10.016697883605957, "global_step": 111889, "epoch": 666} {"train_loss": -9.57796859741211, "global_step": 111890, "epoch": 666} {"train_loss": -10.024904251098633, "global_step": 111891, "epoch": 666} {"train_loss": -9.829455375671387, "global_step": 111892, "epoch": 666} {"train_loss": -10.023712158203125, "global_step": 111893, "epoch": 666} {"train_loss": -9.997953414916992, "global_step": 111894, "epoch": 666} {"train_loss": -9.616071701049805, "global_step": 111895, "epoch": 666} {"train_loss": -10.177959442138672, "global_step": 111896, "epoch": 666} {"train_loss": -9.79746150970459, "global_step": 111897, "epoch": 666} {"train_loss": -10.043304443359375, "global_step": 111898, "epoch": 666} {"train_loss": -9.85236930847168, "global_step": 111899, "epoch": 666} {"train_loss": -10.095085144042969, "global_step": 111900, "epoch": 666} {"train_loss": -9.654582977294922, "global_step": 111901, "epoch": 666} {"train_loss": -10.237417221069336, "global_step": 111902, "epoch": 666} {"train_loss": -9.499624252319336, "global_step": 111903, "epoch": 666} {"train_loss": -9.982583999633789, "global_step": 111904, "epoch": 666} {"train_loss": -9.50062370300293, "global_step": 111905, "epoch": 666} {"train_loss": -10.250903129577637, "global_step": 111906, "epoch": 666} {"train_loss": -9.909399032592773, "global_step": 111907, "epoch": 666} {"train_loss": -9.82863998413086, "global_step": 111908, "epoch": 666} {"train_loss": -9.760882377624512, "global_step": 111909, "epoch": 666} {"train_loss": -10.018087387084961, "global_step": 111910, "epoch": 666} {"train_loss": -9.818744659423828, "global_step": 111911, "epoch": 666} {"train_loss": -10.196003913879395, "global_step": 111912, "epoch": 666} {"train_loss": -9.528003692626953, "global_step": 111913, "epoch": 666} {"train_loss": -10.069978713989258, "global_step": 111914, "epoch": 666} {"train_loss": -9.565530776977539, "global_step": 111915, "epoch": 666} {"train_loss": -9.783614158630371, "global_step": 111916, "epoch": 666} {"train_loss": -9.85917854309082, "global_step": 111917, "epoch": 666} {"train_loss": -10.08035659790039, "global_step": 111918, "epoch": 666} {"train_loss": -10.167558670043945, "global_step": 111919, "epoch": 666} {"train_loss": -10.008136749267578, "global_step": 111920, "epoch": 666} {"train_loss": -10.026979446411133, "global_step": 111921, "epoch": 666} {"train_loss": -10.251713752746582, "global_step": 111922, "epoch": 666} {"train_loss": -9.835101127624512, "global_step": 111923, "epoch": 666} {"train_loss": -10.0325927734375, "global_step": 111924, "epoch": 666} {"train_loss": -10.06266975402832, "global_step": 111925, "epoch": 666} {"train_loss": -10.099576950073242, "global_step": 111926, "epoch": 666} {"train_loss": -9.992637634277344, "global_step": 111927, "epoch": 666} {"train_loss": -10.021689414978027, "global_step": 111928, "epoch": 666} {"train_loss": -10.028924942016602, "global_step": 111929, "epoch": 666} {"train_loss": -10.147759437561035, "global_step": 111930, "epoch": 666} {"train_loss": -10.159988403320312, "global_step": 111931, "epoch": 666} {"train_loss": -10.104582786560059, "global_step": 111932, "epoch": 666} {"train_loss": -9.84582805633545, "global_step": 111933, "epoch": 666} {"train_loss": -9.738862991333008, "global_step": 111934, "epoch": 666} {"train_loss": -9.932764053344727, "global_step": 111935, "epoch": 666} {"train_loss": -9.895528793334961, "global_step": 111936, "epoch": 666} {"train_loss": -9.94216537475586, "global_step": 111937, "epoch": 666} {"train_loss": -9.958576202392578, "global_step": 111938, "epoch": 666} {"train_loss": -10.088777542114258, "global_step": 111939, "epoch": 666} {"train_loss": -9.883522987365723, "global_step": 111940, "epoch": 666} {"train_loss": -9.88150691986084, "global_step": 111941, "epoch": 666} {"train_loss": -9.820991516113281, "global_step": 111942, "epoch": 666} {"train_loss": -10.081196784973145, "global_step": 111943, "epoch": 666} {"train_loss": -9.75435733795166, "global_step": 111944, "epoch": 666} {"train_loss": -10.110825538635254, "global_step": 111945, "epoch": 666} {"train_loss": -9.726103782653809, "global_step": 111946, "epoch": 666} {"train_loss": -10.219883918762207, "global_step": 111947, "epoch": 666} {"train_loss": -9.904745101928711, "global_step": 111948, "epoch": 666} {"train_loss": -10.1661376953125, "global_step": 111949, "epoch": 666} {"train_loss": -9.936553955078125, "global_step": 111950, "epoch": 666} {"train_loss": -10.201689720153809, "global_step": 111951, "epoch": 666} {"train_loss": -9.878215789794922, "global_step": 111952, "epoch": 666} {"train_loss": -9.980952262878418, "global_step": 111953, "epoch": 666} {"train_loss": -9.998948097229004, "global_step": 111954, "epoch": 666} {"train_loss": -9.994287490844727, "global_step": 111955, "epoch": 666} {"train_loss": -10.118354797363281, "global_step": 111956, "epoch": 666} {"train_loss": -9.884613990783691, "global_step": 111957, "epoch": 666} {"train_loss": -10.359432220458984, "global_step": 111958, "epoch": 666} {"train_loss": -10.015541076660156, "global_step": 111959, "epoch": 666} {"train_loss": -9.918460845947266, "global_step": 111960, "epoch": 666} {"train_loss": -10.081832885742188, "global_step": 111961, "epoch": 666} {"train_loss": -9.79018783569336, "global_step": 111962, "epoch": 666} {"train_loss": -10.2733793258667, "global_step": 111963, "epoch": 666} {"train_loss": -10.204316139221191, "global_step": 111964, "epoch": 666} {"train_loss": -9.698587417602539, "global_step": 111965, "epoch": 666} {"train_loss": -9.912737846374512, "global_step": 111966, "epoch": 666} {"train_loss": -9.579750061035156, "global_step": 111967, "epoch": 666} {"train_loss": -10.067671775817871, "global_step": 111968, "epoch": 666} {"train_loss": -9.996969223022461, "global_step": 111969, "epoch": 666} {"train_loss": -9.90045166015625, "global_step": 111970, "epoch": 666} {"train_loss": -9.919426918029785, "global_step": 111971, "epoch": 666} {"train_loss": -10.12961483001709, "global_step": 111972, "epoch": 666} {"train_loss": -9.906854629516602, "global_step": 111973, "epoch": 666} {"train_loss": -10.041205406188965, "global_step": 111974, "epoch": 666} {"train_loss": -10.067913055419922, "global_step": 111975, "epoch": 666} {"train_loss": -10.305561065673828, "global_step": 111976, "epoch": 666} {"train_loss": -9.745683670043945, "global_step": 111977, "epoch": 666} {"train_loss": -9.95937442779541, "global_step": 111978, "epoch": 666} {"train_loss": -9.962991714477539, "global_step": 111979, "epoch": 666} {"train_loss": -10.233318328857422, "global_step": 111980, "epoch": 666} {"train_loss": -10.090645790100098, "global_step": 111981, "epoch": 666} {"train_loss": -9.94059944152832, "global_step": 111982, "epoch": 666} {"train_loss": -10.055212020874023, "global_step": 111983, "epoch": 666} {"train_loss": -9.893095970153809, "global_step": 111984, "epoch": 666} {"train_loss": -10.309306144714355, "global_step": 111985, "epoch": 666} {"train_loss": -10.132152557373047, "global_step": 111986, "epoch": 666} {"train_loss": -10.096529960632324, "global_step": 111987, "epoch": 666} {"train_loss": -10.337018966674805, "global_step": 111988, "epoch": 666} {"train_loss": -10.058670043945312, "global_step": 111989, "epoch": 666} {"train_loss": -10.267617225646973, "global_step": 111990, "epoch": 666} {"train_loss": -10.168221473693848, "global_step": 111991, "epoch": 666} {"train_loss": -10.186136245727539, "global_step": 111992, "epoch": 666} {"train_loss": -10.179336547851562, "global_step": 111993, "epoch": 666} {"train_loss": -10.040657997131348, "global_step": 111994, "epoch": 666} {"train_loss": -10.177488327026367, "global_step": 111995, "epoch": 666} {"train_loss": -10.162158966064453, "global_step": 111996, "epoch": 666} {"train_loss": -10.050983428955078, "global_step": 111997, "epoch": 666} {"train_loss": -10.235060691833496, "global_step": 111998, "epoch": 666} {"train_loss": -10.151219367980957, "global_step": 111999, "epoch": 666} {"train_loss": -9.967057228088379, "global_step": 112000, "epoch": 666} {"train_loss": -10.333272933959961, "global_step": 112001, "epoch": 666} {"train_loss": -10.212021827697754, "global_step": 112002, "epoch": 666} {"train_loss": -10.029491424560547, "global_step": 112003, "epoch": 666} {"train_loss": -10.213028907775879, "global_step": 112004, "epoch": 666} {"train_loss": -10.351016998291016, "global_step": 112005, "epoch": 666} {"train_loss": -9.94365119934082, "global_step": 112006, "epoch": 666} {"train_loss": -9.974091529846191, "global_step": 112007, "epoch": 666} {"train_loss": -9.870414733886719, "global_step": 112008, "epoch": 666} {"train_loss": -9.975536346435547, "global_step": 112009, "epoch": 666} {"train_loss": -10.203516960144043, "global_step": 112010, "epoch": 666} {"train_loss": -9.94555377960205, "global_step": 112011, "epoch": 666} {"train_loss": -9.744359970092773, "global_step": 112012, "epoch": 666} {"train_loss": -9.910722732543945, "global_step": 112013, "epoch": 666} {"train_loss": -9.999982833862305, "global_step": 112014, "epoch": 666} {"train_loss": -9.628312110900879, "global_step": 112015, "epoch": 666} {"train_loss": -9.8951997756958, "global_step": 112016, "epoch": 666} {"train_loss": -9.866643905639648, "global_step": 112017, "epoch": 666} {"train_loss": -9.469582557678223, "global_step": 112018, "epoch": 666} {"train_loss": -10.239072799682617, "global_step": 112019, "epoch": 666} {"train_loss": -9.385604858398438, "global_step": 112020, "epoch": 666} {"train_loss": -9.860746383666992, "global_step": 112021, "epoch": 666} {"train_loss": -9.915958404541016, "global_step": 112022, "epoch": 666} {"train_loss": -9.98399543762207, "global_step": 112023, "epoch": 666} {"train_loss": -9.977134704589844, "global_step": 112024, "epoch": 666} {"train_loss": -10.074502944946289, "global_step": 112025, "epoch": 666} {"train_loss": -10.068745613098145, "global_step": 112026, "epoch": 666} {"train_loss": -10.067858695983887, "global_step": 112027, "epoch": 666} {"train_loss": -10.01024341583252, "global_step": 112028, "epoch": 666} {"train_loss": -10.134350776672363, "global_step": 112029, "epoch": 666} {"train_loss": -10.027409553527832, "global_step": 112030, "epoch": 666} {"train_loss": -9.943524360656738, "global_step": 112031, "epoch": 666} {"train_loss": -10.260505676269531, "global_step": 112032, "epoch": 666} {"train_loss": -9.660069465637207, "global_step": 112033, "epoch": 666} {"train_loss": -10.14053726196289, "global_step": 112034, "epoch": 666} {"train_loss": -10.028251647949219, "global_step": 112035, "epoch": 666} {"train_loss": -9.700555801391602, "global_step": 112036, "epoch": 666} {"train_loss": -10.092249870300293, "global_step": 112037, "epoch": 666} {"train_loss": -9.828225135803223, "global_step": 112038, "epoch": 666} {"train_loss": -10.040654182434082, "global_step": 112039, "epoch": 666} {"train_loss": -10.006049156188965, "global_step": 112040, "epoch": 666} {"train_loss": -10.00358772277832, "global_step": 112041, "epoch": 666} {"train_loss": -9.911494255065918, "global_step": 112042, "epoch": 666} {"train_loss": -9.872568130493164, "global_step": 112043, "epoch": 666} {"train_loss": -9.873571395874023, "global_step": 112044, "epoch": 666} {"train_loss": -9.813084602355957, "global_step": 112045, "epoch": 666} {"train_loss": -9.956399917602539, "global_step": 112046, "epoch": 666} {"train_loss": -9.774503707885742, "global_step": 112047, "epoch": 666} {"train_loss": -9.559056282043457, "global_step": 112048, "epoch": 666} {"train_loss": -9.869277954101562, "global_step": 112049, "epoch": 666} {"train_loss": -9.371256828308105, "global_step": 112050, "epoch": 666} {"train_loss": -9.76163101196289, "global_step": 112051, "epoch": 666} {"train_loss": -9.49188232421875, "global_step": 112052, "epoch": 666} {"train_loss": -9.623720169067383, "global_step": 112053, "epoch": 666} {"train_loss": -9.330066680908203, "global_step": 112054, "epoch": 666} {"train_loss": -9.963303032375517, "global_step": 112055, "epoch": 666, "val_loss": 211448.09375} {"train_loss": -9.15798282623291, "global_step": 112056, "epoch": 667} {"train_loss": -10.137049674987793, "global_step": 112057, "epoch": 667} {"train_loss": -8.611648559570312, "global_step": 112058, "epoch": 667} {"train_loss": -9.985084533691406, "global_step": 112059, "epoch": 667} {"train_loss": -8.966596603393555, "global_step": 112060, "epoch": 667} {"train_loss": -9.433904647827148, "global_step": 112061, "epoch": 667} {"train_loss": -9.475720405578613, "global_step": 112062, "epoch": 667} {"train_loss": -9.189866065979004, "global_step": 112063, "epoch": 667} {"train_loss": -9.875078201293945, "global_step": 112064, "epoch": 667} {"train_loss": -9.082099914550781, "global_step": 112065, "epoch": 667} {"train_loss": -9.572117805480957, "global_step": 112066, "epoch": 667} {"train_loss": -9.115245819091797, "global_step": 112067, "epoch": 667} {"train_loss": -9.458539962768555, "global_step": 112068, "epoch": 667} {"train_loss": -9.828574180603027, "global_step": 112069, "epoch": 667} {"train_loss": -9.495388984680176, "global_step": 112070, "epoch": 667} {"train_loss": -9.351821899414062, "global_step": 112071, "epoch": 667} {"train_loss": -9.76219654083252, "global_step": 112072, "epoch": 667} {"train_loss": -9.643397331237793, "global_step": 112073, "epoch": 667} {"train_loss": -9.79473876953125, "global_step": 112074, "epoch": 667} {"train_loss": -9.772351264953613, "global_step": 112075, "epoch": 667} {"train_loss": -9.828592300415039, "global_step": 112076, "epoch": 667} {"train_loss": -9.715153694152832, "global_step": 112077, "epoch": 667} {"train_loss": -9.51961898803711, "global_step": 112078, "epoch": 667} {"train_loss": -9.908055305480957, "global_step": 112079, "epoch": 667} {"train_loss": -9.57404899597168, "global_step": 112080, "epoch": 667} {"train_loss": -9.826290130615234, "global_step": 112081, "epoch": 667} {"train_loss": -9.809625625610352, "global_step": 112082, "epoch": 667} {"train_loss": -9.591578483581543, "global_step": 112083, "epoch": 667} {"train_loss": -9.858152389526367, "global_step": 112084, "epoch": 667} {"train_loss": -9.995221138000488, "global_step": 112085, "epoch": 667} {"train_loss": -10.227636337280273, "global_step": 112086, "epoch": 667} {"train_loss": -9.80524730682373, "global_step": 112087, "epoch": 667} {"train_loss": -9.988846778869629, "global_step": 112088, "epoch": 667} {"train_loss": -9.95808219909668, "global_step": 112089, "epoch": 667} {"train_loss": -9.969803810119629, "global_step": 112090, "epoch": 667} {"train_loss": -10.184626579284668, "global_step": 112091, "epoch": 667} {"train_loss": -9.855116844177246, "global_step": 112092, "epoch": 667} {"train_loss": -9.921762466430664, "global_step": 112093, "epoch": 667} {"train_loss": -9.83154296875, "global_step": 112094, "epoch": 667} {"train_loss": -9.984172821044922, "global_step": 112095, "epoch": 667} {"train_loss": -9.799741744995117, "global_step": 112096, "epoch": 667} {"train_loss": -10.060312271118164, "global_step": 112097, "epoch": 667} {"train_loss": -9.641633987426758, "global_step": 112098, "epoch": 667} {"train_loss": -9.961929321289062, "global_step": 112099, "epoch": 667} {"train_loss": -10.08458137512207, "global_step": 112100, "epoch": 667} {"train_loss": -9.835826873779297, "global_step": 112101, "epoch": 667} {"train_loss": -9.994637489318848, "global_step": 112102, "epoch": 667} {"train_loss": -9.826263427734375, "global_step": 112103, "epoch": 667} {"train_loss": -10.15210247039795, "global_step": 112104, "epoch": 667} {"train_loss": -9.91596794128418, "global_step": 112105, "epoch": 667} {"train_loss": -10.028846740722656, "global_step": 112106, "epoch": 667} {"train_loss": -9.943453788757324, "global_step": 112107, "epoch": 667} {"train_loss": -10.026573181152344, "global_step": 112108, "epoch": 667} {"train_loss": -9.6954927444458, "global_step": 112109, "epoch": 667} {"train_loss": -9.92398738861084, "global_step": 112110, "epoch": 667} {"train_loss": -9.824475288391113, "global_step": 112111, "epoch": 667} {"train_loss": -9.746763229370117, "global_step": 112112, "epoch": 667} {"train_loss": -10.037073135375977, "global_step": 112113, "epoch": 667} {"train_loss": -9.96976375579834, "global_step": 112114, "epoch": 667} {"train_loss": -9.875879287719727, "global_step": 112115, "epoch": 667} {"train_loss": -10.168277740478516, "global_step": 112116, "epoch": 667} {"train_loss": -10.05078125, "global_step": 112117, "epoch": 667} {"train_loss": -9.919397354125977, "global_step": 112118, "epoch": 667} {"train_loss": -9.839117050170898, "global_step": 112119, "epoch": 667} {"train_loss": -9.690577507019043, "global_step": 112120, "epoch": 667} {"train_loss": -9.633322715759277, "global_step": 112121, "epoch": 667} {"train_loss": -9.884411811828613, "global_step": 112122, "epoch": 667} {"train_loss": -9.576950073242188, "global_step": 112123, "epoch": 667} {"train_loss": -9.435914993286133, "global_step": 112124, "epoch": 667} {"train_loss": -9.960126876831055, "global_step": 112125, "epoch": 667} {"train_loss": -9.989681243896484, "global_step": 112126, "epoch": 667} {"train_loss": -9.22079086303711, "global_step": 112127, "epoch": 667} {"train_loss": -9.676164627075195, "global_step": 112128, "epoch": 667} {"train_loss": -9.674386978149414, "global_step": 112129, "epoch": 667} {"train_loss": -9.550386428833008, "global_step": 112130, "epoch": 667} {"train_loss": -9.956820487976074, "global_step": 112131, "epoch": 667} {"train_loss": -9.633373260498047, "global_step": 112132, "epoch": 667} {"train_loss": -10.047647476196289, "global_step": 112133, "epoch": 667} {"train_loss": -10.010393142700195, "global_step": 112134, "epoch": 667} {"train_loss": -9.77851390838623, "global_step": 112135, "epoch": 667} {"train_loss": -9.606014251708984, "global_step": 112136, "epoch": 667} {"train_loss": -9.94883918762207, "global_step": 112137, "epoch": 667} {"train_loss": -9.739203453063965, "global_step": 112138, "epoch": 667} {"train_loss": -9.821870803833008, "global_step": 112139, "epoch": 667} {"train_loss": -10.089057922363281, "global_step": 112140, "epoch": 667} {"train_loss": -9.337820053100586, "global_step": 112141, "epoch": 667} {"train_loss": -9.975187301635742, "global_step": 112142, "epoch": 667} {"train_loss": -9.738961219787598, "global_step": 112143, "epoch": 667} {"train_loss": -10.151721954345703, "global_step": 112144, "epoch": 667} {"train_loss": -9.917936325073242, "global_step": 112145, "epoch": 667} {"train_loss": -9.98031997680664, "global_step": 112146, "epoch": 667} {"train_loss": -10.0762939453125, "global_step": 112147, "epoch": 667} {"train_loss": -9.889802932739258, "global_step": 112148, "epoch": 667} {"train_loss": -9.981396675109863, "global_step": 112149, "epoch": 667} {"train_loss": -10.18364143371582, "global_step": 112150, "epoch": 667} {"train_loss": -10.200427055358887, "global_step": 112151, "epoch": 667} {"train_loss": -10.075485229492188, "global_step": 112152, "epoch": 667} {"train_loss": -10.14941120147705, "global_step": 112153, "epoch": 667} {"train_loss": -9.985541343688965, "global_step": 112154, "epoch": 667} {"train_loss": -10.126620292663574, "global_step": 112155, "epoch": 667} {"train_loss": -9.94375228881836, "global_step": 112156, "epoch": 667} {"train_loss": -10.154272079467773, "global_step": 112157, "epoch": 667} {"train_loss": -10.11465072631836, "global_step": 112158, "epoch": 667} {"train_loss": -10.222992897033691, "global_step": 112159, "epoch": 667} {"train_loss": -10.020133972167969, "global_step": 112160, "epoch": 667} {"train_loss": -10.19377613067627, "global_step": 112161, "epoch": 667} {"train_loss": -9.891841888427734, "global_step": 112162, "epoch": 667} {"train_loss": -10.086224555969238, "global_step": 112163, "epoch": 667} {"train_loss": -10.143051147460938, "global_step": 112164, "epoch": 667} {"train_loss": -10.152700424194336, "global_step": 112165, "epoch": 667} {"train_loss": -10.286890029907227, "global_step": 112166, "epoch": 667} {"train_loss": -10.13508415222168, "global_step": 112167, "epoch": 667} {"train_loss": -10.195014953613281, "global_step": 112168, "epoch": 667} {"train_loss": -10.058262825012207, "global_step": 112169, "epoch": 667} {"train_loss": -10.277263641357422, "global_step": 112170, "epoch": 667} {"train_loss": -10.326090812683105, "global_step": 112171, "epoch": 667} {"train_loss": -10.175820350646973, "global_step": 112172, "epoch": 667} {"train_loss": -10.11722183227539, "global_step": 112173, "epoch": 667} {"train_loss": -9.790047645568848, "global_step": 112174, "epoch": 667} {"train_loss": -10.162760734558105, "global_step": 112175, "epoch": 667} {"train_loss": -10.183643341064453, "global_step": 112176, "epoch": 667} {"train_loss": -10.18547534942627, "global_step": 112177, "epoch": 667} {"train_loss": -9.892048835754395, "global_step": 112178, "epoch": 667} {"train_loss": -10.239084243774414, "global_step": 112179, "epoch": 667} {"train_loss": -10.076899528503418, "global_step": 112180, "epoch": 667} {"train_loss": -10.303756713867188, "global_step": 112181, "epoch": 667} {"train_loss": -10.11552906036377, "global_step": 112182, "epoch": 667} {"train_loss": -10.077220916748047, "global_step": 112183, "epoch": 667} {"train_loss": -10.217214584350586, "global_step": 112184, "epoch": 667} {"train_loss": -10.061752319335938, "global_step": 112185, "epoch": 667} {"train_loss": -10.162836074829102, "global_step": 112186, "epoch": 667} {"train_loss": -10.35954475402832, "global_step": 112187, "epoch": 667} {"train_loss": -10.421917915344238, "global_step": 112188, "epoch": 667} {"train_loss": -10.156335830688477, "global_step": 112189, "epoch": 667} {"train_loss": -10.012672424316406, "global_step": 112190, "epoch": 667} {"train_loss": -10.177023887634277, "global_step": 112191, "epoch": 667} {"train_loss": -10.013930320739746, "global_step": 112192, "epoch": 667} {"train_loss": -9.911460876464844, "global_step": 112193, "epoch": 667} {"train_loss": -10.42708683013916, "global_step": 112194, "epoch": 667} {"train_loss": -10.076656341552734, "global_step": 112195, "epoch": 667} {"train_loss": -10.232145309448242, "global_step": 112196, "epoch": 667} {"train_loss": -10.056900024414062, "global_step": 112197, "epoch": 667} {"train_loss": -10.071903228759766, "global_step": 112198, "epoch": 667} {"train_loss": -10.298786163330078, "global_step": 112199, "epoch": 667} {"train_loss": -10.05526351928711, "global_step": 112200, "epoch": 667} {"train_loss": -10.144638061523438, "global_step": 112201, "epoch": 667} {"train_loss": -9.56309700012207, "global_step": 112202, "epoch": 667} {"train_loss": -9.880247116088867, "global_step": 112203, "epoch": 667} {"train_loss": -9.696107864379883, "global_step": 112204, "epoch": 667} {"train_loss": -9.684555053710938, "global_step": 112205, "epoch": 667} {"train_loss": -9.784162521362305, "global_step": 112206, "epoch": 667} {"train_loss": -9.92973518371582, "global_step": 112207, "epoch": 667} {"train_loss": -9.748590469360352, "global_step": 112208, "epoch": 667} {"train_loss": -9.279703140258789, "global_step": 112209, "epoch": 667} {"train_loss": -9.775442123413086, "global_step": 112210, "epoch": 667} {"train_loss": -9.791946411132812, "global_step": 112211, "epoch": 667} {"train_loss": -9.647195816040039, "global_step": 112212, "epoch": 667} {"train_loss": -10.072729110717773, "global_step": 112213, "epoch": 667} {"train_loss": -9.763264656066895, "global_step": 112214, "epoch": 667} {"train_loss": -10.015985488891602, "global_step": 112215, "epoch": 667} {"train_loss": -9.543855667114258, "global_step": 112216, "epoch": 667} {"train_loss": -9.582688331604004, "global_step": 112217, "epoch": 667} {"train_loss": -9.67390251159668, "global_step": 112218, "epoch": 667} {"train_loss": -9.945463180541992, "global_step": 112219, "epoch": 667} {"train_loss": -9.845390319824219, "global_step": 112220, "epoch": 667} {"train_loss": -9.987314224243164, "global_step": 112221, "epoch": 667} {"train_loss": -9.730056762695312, "global_step": 112222, "epoch": 667} {"train_loss": -9.885112779481071, "global_step": 112223, "epoch": 667, "val_loss": 211132.0} {"train_loss": -8.974649429321289, "global_step": 112224, "epoch": 668} {"train_loss": -9.803421974182129, "global_step": 112225, "epoch": 668} {"train_loss": -9.466418266296387, "global_step": 112226, "epoch": 668} {"train_loss": -9.548563003540039, "global_step": 112227, "epoch": 668} {"train_loss": -9.540426254272461, "global_step": 112228, "epoch": 668} {"train_loss": -9.654644012451172, "global_step": 112229, "epoch": 668} {"train_loss": -9.48746395111084, "global_step": 112230, "epoch": 668} {"train_loss": -9.76048469543457, "global_step": 112231, "epoch": 668} {"train_loss": -9.410310745239258, "global_step": 112232, "epoch": 668} {"train_loss": -9.631170272827148, "global_step": 112233, "epoch": 668} {"train_loss": -9.552896499633789, "global_step": 112234, "epoch": 668} {"train_loss": -9.527009010314941, "global_step": 112235, "epoch": 668} {"train_loss": -9.668017387390137, "global_step": 112236, "epoch": 668} {"train_loss": -9.645172119140625, "global_step": 112237, "epoch": 668} {"train_loss": -9.504392623901367, "global_step": 112238, "epoch": 668} {"train_loss": -9.456199645996094, "global_step": 112239, "epoch": 668} {"train_loss": -9.828910827636719, "global_step": 112240, "epoch": 668} {"train_loss": -9.558066368103027, "global_step": 112241, "epoch": 668} {"train_loss": -9.83561897277832, "global_step": 112242, "epoch": 668} {"train_loss": -9.725078582763672, "global_step": 112243, "epoch": 668} {"train_loss": -9.64254379272461, "global_step": 112244, "epoch": 668} {"train_loss": -9.904574394226074, "global_step": 112245, "epoch": 668} {"train_loss": -9.56543254852295, "global_step": 112246, "epoch": 668} {"train_loss": -9.832001686096191, "global_step": 112247, "epoch": 668} {"train_loss": -9.640711784362793, "global_step": 112248, "epoch": 668} {"train_loss": -9.923850059509277, "global_step": 112249, "epoch": 668} {"train_loss": -9.729446411132812, "global_step": 112250, "epoch": 668} {"train_loss": -9.752496719360352, "global_step": 112251, "epoch": 668} {"train_loss": -9.98430061340332, "global_step": 112252, "epoch": 668} {"train_loss": -9.660499572753906, "global_step": 112253, "epoch": 668} {"train_loss": -9.811634063720703, "global_step": 112254, "epoch": 668} {"train_loss": -9.479161262512207, "global_step": 112255, "epoch": 668} {"train_loss": -10.006017684936523, "global_step": 112256, "epoch": 668} {"train_loss": -9.815801620483398, "global_step": 112257, "epoch": 668} {"train_loss": -9.925420761108398, "global_step": 112258, "epoch": 668} {"train_loss": -9.736078262329102, "global_step": 112259, "epoch": 668} {"train_loss": -9.659826278686523, "global_step": 112260, "epoch": 668} {"train_loss": -9.978147506713867, "global_step": 112261, "epoch": 668} {"train_loss": -10.004749298095703, "global_step": 112262, "epoch": 668} {"train_loss": -9.917089462280273, "global_step": 112263, "epoch": 668} {"train_loss": -10.002606391906738, "global_step": 112264, "epoch": 668} {"train_loss": -10.071381568908691, "global_step": 112265, "epoch": 668} {"train_loss": -9.616691589355469, "global_step": 112266, "epoch": 668} {"train_loss": -10.190863609313965, "global_step": 112267, "epoch": 668} {"train_loss": -9.882828712463379, "global_step": 112268, "epoch": 668} {"train_loss": -10.080587387084961, "global_step": 112269, "epoch": 668} {"train_loss": -9.746253967285156, "global_step": 112270, "epoch": 668} {"train_loss": -10.092594146728516, "global_step": 112271, "epoch": 668} {"train_loss": -9.825267791748047, "global_step": 112272, "epoch": 668} {"train_loss": -10.092604637145996, "global_step": 112273, "epoch": 668} {"train_loss": -10.022438049316406, "global_step": 112274, "epoch": 668} {"train_loss": -10.018869400024414, "global_step": 112275, "epoch": 668} {"train_loss": -10.084239959716797, "global_step": 112276, "epoch": 668} {"train_loss": -10.088634490966797, "global_step": 112277, "epoch": 668} {"train_loss": -10.197250366210938, "global_step": 112278, "epoch": 668} {"train_loss": -10.231669425964355, "global_step": 112279, "epoch": 668} {"train_loss": -10.286016464233398, "global_step": 112280, "epoch": 668} {"train_loss": -10.163126945495605, "global_step": 112281, "epoch": 668} {"train_loss": -10.260810852050781, "global_step": 112282, "epoch": 668} {"train_loss": -10.287083625793457, "global_step": 112283, "epoch": 668} {"train_loss": -10.154918670654297, "global_step": 112284, "epoch": 668} {"train_loss": -10.062333106994629, "global_step": 112285, "epoch": 668} {"train_loss": -10.206705093383789, "global_step": 112286, "epoch": 668} {"train_loss": -9.902812957763672, "global_step": 112287, "epoch": 668} {"train_loss": -10.198219299316406, "global_step": 112288, "epoch": 668} {"train_loss": -9.913045883178711, "global_step": 112289, "epoch": 668} {"train_loss": -10.017950057983398, "global_step": 112290, "epoch": 668} {"train_loss": -9.729022026062012, "global_step": 112291, "epoch": 668} {"train_loss": -9.670877456665039, "global_step": 112292, "epoch": 668} {"train_loss": -9.929998397827148, "global_step": 112293, "epoch": 668} {"train_loss": -10.008330345153809, "global_step": 112294, "epoch": 668} {"train_loss": -9.8389253616333, "global_step": 112295, "epoch": 668} {"train_loss": -10.134696006774902, "global_step": 112296, "epoch": 668} {"train_loss": -9.807927131652832, "global_step": 112297, "epoch": 668} {"train_loss": -10.170215606689453, "global_step": 112298, "epoch": 668} {"train_loss": -9.881954193115234, "global_step": 112299, "epoch": 668} {"train_loss": -9.421463966369629, "global_step": 112300, "epoch": 668} {"train_loss": -10.143058776855469, "global_step": 112301, "epoch": 668} {"train_loss": -9.539458274841309, "global_step": 112302, "epoch": 668} {"train_loss": -10.237756729125977, "global_step": 112303, "epoch": 668} {"train_loss": -10.058697700500488, "global_step": 112304, "epoch": 668} {"train_loss": -9.814481735229492, "global_step": 112305, "epoch": 668} {"train_loss": -9.807167053222656, "global_step": 112306, "epoch": 668} {"train_loss": -10.005435943603516, "global_step": 112307, "epoch": 668} {"train_loss": -9.4091796875, "global_step": 112308, "epoch": 668} {"train_loss": -10.185422897338867, "global_step": 112309, "epoch": 668} {"train_loss": -9.860151290893555, "global_step": 112310, "epoch": 668} {"train_loss": -10.065403938293457, "global_step": 112311, "epoch": 668} {"train_loss": -10.10116958618164, "global_step": 112312, "epoch": 668} {"train_loss": -9.914596557617188, "global_step": 112313, "epoch": 668} {"train_loss": -9.97756576538086, "global_step": 112314, "epoch": 668} {"train_loss": -10.134984016418457, "global_step": 112315, "epoch": 668} {"train_loss": -10.28050422668457, "global_step": 112316, "epoch": 668} {"train_loss": -10.062249183654785, "global_step": 112317, "epoch": 668} {"train_loss": -10.181253433227539, "global_step": 112318, "epoch": 668} {"train_loss": -9.986358642578125, "global_step": 112319, "epoch": 668} {"train_loss": -10.164287567138672, "global_step": 112320, "epoch": 668} {"train_loss": -10.16966438293457, "global_step": 112321, "epoch": 668} {"train_loss": -10.15747356414795, "global_step": 112322, "epoch": 668} {"train_loss": -9.62862777709961, "global_step": 112323, "epoch": 668} {"train_loss": -10.05373764038086, "global_step": 112324, "epoch": 668} {"train_loss": -10.104803085327148, "global_step": 112325, "epoch": 668} {"train_loss": -9.692259788513184, "global_step": 112326, "epoch": 668} {"train_loss": -10.046652793884277, "global_step": 112327, "epoch": 668} {"train_loss": -9.778976440429688, "global_step": 112328, "epoch": 668} {"train_loss": -9.841592788696289, "global_step": 112329, "epoch": 668} {"train_loss": -9.87226676940918, "global_step": 112330, "epoch": 668} {"train_loss": -10.188434600830078, "global_step": 112331, "epoch": 668} {"train_loss": -10.101715087890625, "global_step": 112332, "epoch": 668} {"train_loss": -9.868667602539062, "global_step": 112333, "epoch": 668} {"train_loss": -10.304758071899414, "global_step": 112334, "epoch": 668} {"train_loss": -9.933521270751953, "global_step": 112335, "epoch": 668} {"train_loss": -9.907368659973145, "global_step": 112336, "epoch": 668} {"train_loss": -9.990055084228516, "global_step": 112337, "epoch": 668} {"train_loss": -10.040082931518555, "global_step": 112338, "epoch": 668} {"train_loss": -9.951288223266602, "global_step": 112339, "epoch": 668} {"train_loss": -10.134912490844727, "global_step": 112340, "epoch": 668} {"train_loss": -9.976858139038086, "global_step": 112341, "epoch": 668} {"train_loss": -10.228607177734375, "global_step": 112342, "epoch": 668} {"train_loss": -10.068120002746582, "global_step": 112343, "epoch": 668} {"train_loss": -10.07913589477539, "global_step": 112344, "epoch": 668} {"train_loss": -10.033658027648926, "global_step": 112345, "epoch": 668} {"train_loss": -10.27682876586914, "global_step": 112346, "epoch": 668} {"train_loss": -10.403122901916504, "global_step": 112347, "epoch": 668} {"train_loss": -10.03361701965332, "global_step": 112348, "epoch": 668} {"train_loss": -9.939926147460938, "global_step": 112349, "epoch": 668} {"train_loss": -10.253019332885742, "global_step": 112350, "epoch": 668} {"train_loss": -9.942893981933594, "global_step": 112351, "epoch": 668} {"train_loss": -9.499134063720703, "global_step": 112352, "epoch": 668} {"train_loss": -9.877172470092773, "global_step": 112353, "epoch": 668} {"train_loss": -10.008152961730957, "global_step": 112354, "epoch": 668} {"train_loss": -9.803019523620605, "global_step": 112355, "epoch": 668} {"train_loss": -9.635592460632324, "global_step": 112356, "epoch": 668} {"train_loss": -9.491711616516113, "global_step": 112357, "epoch": 668} {"train_loss": -9.41754150390625, "global_step": 112358, "epoch": 668} {"train_loss": -8.878783226013184, "global_step": 112359, "epoch": 668} {"train_loss": -10.090572357177734, "global_step": 112360, "epoch": 668} {"train_loss": -9.471526145935059, "global_step": 112361, "epoch": 668} {"train_loss": -9.753081321716309, "global_step": 112362, "epoch": 668} {"train_loss": -9.724874496459961, "global_step": 112363, "epoch": 668} {"train_loss": -9.732438087463379, "global_step": 112364, "epoch": 668} {"train_loss": -9.632331848144531, "global_step": 112365, "epoch": 668} {"train_loss": -9.697010040283203, "global_step": 112366, "epoch": 668} {"train_loss": -9.590047836303711, "global_step": 112367, "epoch": 668} {"train_loss": -9.665788650512695, "global_step": 112368, "epoch": 668} {"train_loss": -9.843334197998047, "global_step": 112369, "epoch": 668} {"train_loss": -9.707470893859863, "global_step": 112370, "epoch": 668} {"train_loss": -9.951702117919922, "global_step": 112371, "epoch": 668} {"train_loss": -9.801356315612793, "global_step": 112372, "epoch": 668} {"train_loss": -10.062555313110352, "global_step": 112373, "epoch": 668} {"train_loss": -9.848899841308594, "global_step": 112374, "epoch": 668} {"train_loss": -9.8773193359375, "global_step": 112375, "epoch": 668} {"train_loss": -9.911760330200195, "global_step": 112376, "epoch": 668} {"train_loss": -9.937509536743164, "global_step": 112377, "epoch": 668} {"train_loss": -9.98582935333252, "global_step": 112378, "epoch": 668} {"train_loss": -10.089237213134766, "global_step": 112379, "epoch": 668} {"train_loss": -10.018495559692383, "global_step": 112380, "epoch": 668} {"train_loss": -10.141236305236816, "global_step": 112381, "epoch": 668} {"train_loss": -10.112469673156738, "global_step": 112382, "epoch": 668} {"train_loss": -10.05646800994873, "global_step": 112383, "epoch": 668} {"train_loss": -9.761499404907227, "global_step": 112384, "epoch": 668} {"train_loss": -10.408960342407227, "global_step": 112385, "epoch": 668} {"train_loss": -10.077091217041016, "global_step": 112386, "epoch": 668} {"train_loss": -10.17995834350586, "global_step": 112387, "epoch": 668} {"train_loss": -9.536161422729492, "global_step": 112388, "epoch": 668} {"train_loss": -10.177267074584961, "global_step": 112389, "epoch": 668} {"train_loss": -10.117255210876465, "global_step": 112390, "epoch": 668} {"train_loss": -9.894257477351598, "global_step": 112391, "epoch": 668, "val_loss": 212166.78125} {"train_loss": -9.920791625976562, "global_step": 112392, "epoch": 669} {"train_loss": -10.007224082946777, "global_step": 112393, "epoch": 669} {"train_loss": -10.210179328918457, "global_step": 112394, "epoch": 669} {"train_loss": -10.304662704467773, "global_step": 112395, "epoch": 669} {"train_loss": -9.866958618164062, "global_step": 112396, "epoch": 669} {"train_loss": -10.14402961730957, "global_step": 112397, "epoch": 669} {"train_loss": -9.641840934753418, "global_step": 112398, "epoch": 669} {"train_loss": -10.089547157287598, "global_step": 112399, "epoch": 669} {"train_loss": -10.131558418273926, "global_step": 112400, "epoch": 669} {"train_loss": -9.868060111999512, "global_step": 112401, "epoch": 669} {"train_loss": -10.071457862854004, "global_step": 112402, "epoch": 669} {"train_loss": -9.747332572937012, "global_step": 112403, "epoch": 669} {"train_loss": -9.93647575378418, "global_step": 112404, "epoch": 669} {"train_loss": -9.791675567626953, "global_step": 112405, "epoch": 669} {"train_loss": -10.236385345458984, "global_step": 112406, "epoch": 669} {"train_loss": -10.072625160217285, "global_step": 112407, "epoch": 669} {"train_loss": -10.215078353881836, "global_step": 112408, "epoch": 669} {"train_loss": -10.2724609375, "global_step": 112409, "epoch": 669} {"train_loss": -9.910822868347168, "global_step": 112410, "epoch": 669} {"train_loss": -10.25861930847168, "global_step": 112411, "epoch": 669} {"train_loss": -10.004490852355957, "global_step": 112412, "epoch": 669} {"train_loss": -10.132460594177246, "global_step": 112413, "epoch": 669} {"train_loss": -10.18138313293457, "global_step": 112414, "epoch": 669} {"train_loss": -10.242121696472168, "global_step": 112415, "epoch": 669} {"train_loss": -10.14697265625, "global_step": 112416, "epoch": 669} {"train_loss": -10.21092700958252, "global_step": 112417, "epoch": 669} {"train_loss": -10.026905059814453, "global_step": 112418, "epoch": 669} {"train_loss": -10.202777862548828, "global_step": 112419, "epoch": 669} {"train_loss": -9.943145751953125, "global_step": 112420, "epoch": 669} {"train_loss": -10.113203048706055, "global_step": 112421, "epoch": 669} {"train_loss": -10.047901153564453, "global_step": 112422, "epoch": 669} {"train_loss": -10.20013427734375, "global_step": 112423, "epoch": 669} {"train_loss": -9.917623519897461, "global_step": 112424, "epoch": 669} {"train_loss": -10.349626541137695, "global_step": 112425, "epoch": 669} {"train_loss": -10.012310981750488, "global_step": 112426, "epoch": 669} {"train_loss": -10.174436569213867, "global_step": 112427, "epoch": 669} {"train_loss": -10.121993064880371, "global_step": 112428, "epoch": 669} {"train_loss": -10.294966697692871, "global_step": 112429, "epoch": 669} {"train_loss": -9.425407409667969, "global_step": 112430, "epoch": 669} {"train_loss": -10.017719268798828, "global_step": 112431, "epoch": 669} {"train_loss": -9.88505744934082, "global_step": 112432, "epoch": 669} {"train_loss": -10.204070091247559, "global_step": 112433, "epoch": 669} {"train_loss": -9.826451301574707, "global_step": 112434, "epoch": 669} {"train_loss": -9.915580749511719, "global_step": 112435, "epoch": 669} {"train_loss": -9.938253402709961, "global_step": 112436, "epoch": 669} {"train_loss": -10.081060409545898, "global_step": 112437, "epoch": 669} {"train_loss": -9.906925201416016, "global_step": 112438, "epoch": 669} {"train_loss": -9.876758575439453, "global_step": 112439, "epoch": 669} {"train_loss": -9.822166442871094, "global_step": 112440, "epoch": 669} {"train_loss": -9.995365142822266, "global_step": 112441, "epoch": 669} {"train_loss": -9.433080673217773, "global_step": 112442, "epoch": 669} {"train_loss": -9.847578048706055, "global_step": 112443, "epoch": 669} {"train_loss": -9.71749496459961, "global_step": 112444, "epoch": 669} {"train_loss": -9.552522659301758, "global_step": 112445, "epoch": 669} {"train_loss": -10.181009292602539, "global_step": 112446, "epoch": 669} {"train_loss": -9.753715515136719, "global_step": 112447, "epoch": 669} {"train_loss": -9.727518081665039, "global_step": 112448, "epoch": 669} {"train_loss": -10.100919723510742, "global_step": 112449, "epoch": 669} {"train_loss": -9.734079360961914, "global_step": 112450, "epoch": 669} {"train_loss": -10.133077621459961, "global_step": 112451, "epoch": 669} {"train_loss": -9.618706703186035, "global_step": 112452, "epoch": 669} {"train_loss": -10.05313491821289, "global_step": 112453, "epoch": 669} {"train_loss": -9.817987442016602, "global_step": 112454, "epoch": 669} {"train_loss": -10.044503211975098, "global_step": 112455, "epoch": 669} {"train_loss": -10.045324325561523, "global_step": 112456, "epoch": 669} {"train_loss": -10.152839660644531, "global_step": 112457, "epoch": 669} {"train_loss": -9.93398666381836, "global_step": 112458, "epoch": 669} {"train_loss": -10.081596374511719, "global_step": 112459, "epoch": 669} {"train_loss": -9.97022819519043, "global_step": 112460, "epoch": 669} {"train_loss": -10.085384368896484, "global_step": 112461, "epoch": 669} {"train_loss": -10.168509483337402, "global_step": 112462, "epoch": 669} {"train_loss": -10.040468215942383, "global_step": 112463, "epoch": 669} {"train_loss": -10.027588844299316, "global_step": 112464, "epoch": 669} {"train_loss": -10.026376724243164, "global_step": 112465, "epoch": 669} {"train_loss": -9.920883178710938, "global_step": 112466, "epoch": 669} {"train_loss": -9.725610733032227, "global_step": 112467, "epoch": 669} {"train_loss": -10.020023345947266, "global_step": 112468, "epoch": 669} {"train_loss": -9.089518547058105, "global_step": 112469, "epoch": 669} {"train_loss": -9.821868896484375, "global_step": 112470, "epoch": 669} {"train_loss": -9.814533233642578, "global_step": 112471, "epoch": 669} {"train_loss": -9.917537689208984, "global_step": 112472, "epoch": 669} {"train_loss": -9.74049186706543, "global_step": 112473, "epoch": 669} {"train_loss": -9.759208679199219, "global_step": 112474, "epoch": 669} {"train_loss": -9.988813400268555, "global_step": 112475, "epoch": 669} {"train_loss": -9.397525787353516, "global_step": 112476, "epoch": 669} {"train_loss": -10.212648391723633, "global_step": 112477, "epoch": 669} {"train_loss": -9.495977401733398, "global_step": 112478, "epoch": 669} {"train_loss": -9.968456268310547, "global_step": 112479, "epoch": 669} {"train_loss": -9.93033218383789, "global_step": 112480, "epoch": 669} {"train_loss": -9.902975082397461, "global_step": 112481, "epoch": 669} {"train_loss": -10.20666217803955, "global_step": 112482, "epoch": 669} {"train_loss": -9.642047882080078, "global_step": 112483, "epoch": 669} {"train_loss": -9.851119995117188, "global_step": 112484, "epoch": 669} {"train_loss": -10.151534080505371, "global_step": 112485, "epoch": 669} {"train_loss": -9.683614730834961, "global_step": 112486, "epoch": 669} {"train_loss": -9.896919250488281, "global_step": 112487, "epoch": 669} {"train_loss": -10.237991333007812, "global_step": 112488, "epoch": 669} {"train_loss": -9.935775756835938, "global_step": 112489, "epoch": 669} {"train_loss": -9.827875137329102, "global_step": 112490, "epoch": 669} {"train_loss": -9.980548858642578, "global_step": 112491, "epoch": 669} {"train_loss": -9.935018539428711, "global_step": 112492, "epoch": 669} {"train_loss": -10.238565444946289, "global_step": 112493, "epoch": 669} {"train_loss": -9.779584884643555, "global_step": 112494, "epoch": 669} {"train_loss": -10.274059295654297, "global_step": 112495, "epoch": 669} {"train_loss": -9.75006103515625, "global_step": 112496, "epoch": 669} {"train_loss": -10.049327850341797, "global_step": 112497, "epoch": 669} {"train_loss": -9.92981243133545, "global_step": 112498, "epoch": 669} {"train_loss": -10.196500778198242, "global_step": 112499, "epoch": 669} {"train_loss": -10.010651588439941, "global_step": 112500, "epoch": 669} {"train_loss": -10.032720565795898, "global_step": 112501, "epoch": 669} {"train_loss": -10.190267562866211, "global_step": 112502, "epoch": 669} {"train_loss": -10.017739295959473, "global_step": 112503, "epoch": 669} {"train_loss": -10.051167488098145, "global_step": 112504, "epoch": 669} {"train_loss": -10.356607437133789, "global_step": 112505, "epoch": 669} {"train_loss": -10.220855712890625, "global_step": 112506, "epoch": 669} {"train_loss": -10.205275535583496, "global_step": 112507, "epoch": 669} {"train_loss": -10.2161865234375, "global_step": 112508, "epoch": 669} {"train_loss": -9.995370864868164, "global_step": 112509, "epoch": 669} {"train_loss": -10.16633415222168, "global_step": 112510, "epoch": 669} {"train_loss": -9.833242416381836, "global_step": 112511, "epoch": 669} {"train_loss": -10.034196853637695, "global_step": 112512, "epoch": 669} {"train_loss": -10.12959098815918, "global_step": 112513, "epoch": 669} {"train_loss": -9.690109252929688, "global_step": 112514, "epoch": 669} {"train_loss": -10.354626655578613, "global_step": 112515, "epoch": 669} {"train_loss": -9.809443473815918, "global_step": 112516, "epoch": 669} {"train_loss": -9.914213180541992, "global_step": 112517, "epoch": 669} {"train_loss": -10.133611679077148, "global_step": 112518, "epoch": 669} {"train_loss": -9.766095161437988, "global_step": 112519, "epoch": 669} {"train_loss": -10.25859260559082, "global_step": 112520, "epoch": 669} {"train_loss": -9.58558464050293, "global_step": 112521, "epoch": 669} {"train_loss": -10.20730209350586, "global_step": 112522, "epoch": 669} {"train_loss": -9.960091590881348, "global_step": 112523, "epoch": 669} {"train_loss": -10.146634101867676, "global_step": 112524, "epoch": 669} {"train_loss": -10.036310195922852, "global_step": 112525, "epoch": 669} {"train_loss": -10.019400596618652, "global_step": 112526, "epoch": 669} {"train_loss": -9.985112190246582, "global_step": 112527, "epoch": 669} {"train_loss": -9.910365104675293, "global_step": 112528, "epoch": 669} {"train_loss": -9.9548921585083, "global_step": 112529, "epoch": 669} {"train_loss": -9.69757080078125, "global_step": 112530, "epoch": 669} {"train_loss": -10.152851104736328, "global_step": 112531, "epoch": 669} {"train_loss": -9.765012741088867, "global_step": 112532, "epoch": 669} {"train_loss": -10.253676414489746, "global_step": 112533, "epoch": 669} {"train_loss": -10.154294967651367, "global_step": 112534, "epoch": 669} {"train_loss": -10.035333633422852, "global_step": 112535, "epoch": 669} {"train_loss": -9.92982006072998, "global_step": 112536, "epoch": 669} {"train_loss": -10.094274520874023, "global_step": 112537, "epoch": 669} {"train_loss": -9.44505500793457, "global_step": 112538, "epoch": 669} {"train_loss": -9.882123947143555, "global_step": 112539, "epoch": 669} {"train_loss": -10.300724029541016, "global_step": 112540, "epoch": 669} {"train_loss": -9.862706184387207, "global_step": 112541, "epoch": 669} {"train_loss": -10.201440811157227, "global_step": 112542, "epoch": 669} {"train_loss": -9.977020263671875, "global_step": 112543, "epoch": 669} {"train_loss": -10.02660083770752, "global_step": 112544, "epoch": 669} {"train_loss": -9.918779373168945, "global_step": 112545, "epoch": 669} {"train_loss": -9.775259971618652, "global_step": 112546, "epoch": 669} {"train_loss": -10.072603225708008, "global_step": 112547, "epoch": 669} {"train_loss": -9.320475578308105, "global_step": 112548, "epoch": 669} {"train_loss": -10.07376766204834, "global_step": 112549, "epoch": 669} {"train_loss": -9.376628875732422, "global_step": 112550, "epoch": 669} {"train_loss": -8.772543907165527, "global_step": 112551, "epoch": 669} {"train_loss": -7.697932243347168, "global_step": 112552, "epoch": 669} {"train_loss": -8.078912734985352, "global_step": 112553, "epoch": 669} {"train_loss": -9.264715194702148, "global_step": 112554, "epoch": 669} {"train_loss": -8.56337833404541, "global_step": 112555, "epoch": 669} {"train_loss": -9.081358909606934, "global_step": 112556, "epoch": 669} {"train_loss": -8.453919410705566, "global_step": 112557, "epoch": 669} {"train_loss": -9.709768295288086, "global_step": 112558, "epoch": 669} {"train_loss": -9.905389229456583, "global_step": 112559, "epoch": 669, "val_loss": 206341.34375} {"train_loss": -9.593525886535645, "global_step": 112560, "epoch": 670} {"train_loss": -9.230751037597656, "global_step": 112561, "epoch": 670} {"train_loss": -9.326870918273926, "global_step": 112562, "epoch": 670} {"train_loss": -9.568406105041504, "global_step": 112563, "epoch": 670} {"train_loss": -9.358036041259766, "global_step": 112564, "epoch": 670} {"train_loss": -9.131248474121094, "global_step": 112565, "epoch": 670} {"train_loss": -9.174056053161621, "global_step": 112566, "epoch": 670} {"train_loss": -9.186511993408203, "global_step": 112567, "epoch": 670} {"train_loss": -9.421277046203613, "global_step": 112568, "epoch": 670} {"train_loss": -9.500056266784668, "global_step": 112569, "epoch": 670} {"train_loss": -9.522527694702148, "global_step": 112570, "epoch": 670} {"train_loss": -9.36447525024414, "global_step": 112571, "epoch": 670} {"train_loss": -9.380617141723633, "global_step": 112572, "epoch": 670} {"train_loss": -9.807550430297852, "global_step": 112573, "epoch": 670} {"train_loss": -9.701711654663086, "global_step": 112574, "epoch": 670} {"train_loss": -9.48727035522461, "global_step": 112575, "epoch": 670} {"train_loss": -9.384514808654785, "global_step": 112576, "epoch": 670} {"train_loss": -9.771276473999023, "global_step": 112577, "epoch": 670} {"train_loss": -9.581005096435547, "global_step": 112578, "epoch": 670} {"train_loss": -9.55074405670166, "global_step": 112579, "epoch": 670} {"train_loss": -9.912591934204102, "global_step": 112580, "epoch": 670} {"train_loss": -9.828009605407715, "global_step": 112581, "epoch": 670} {"train_loss": -9.824287414550781, "global_step": 112582, "epoch": 670} {"train_loss": -9.959989547729492, "global_step": 112583, "epoch": 670} {"train_loss": -9.815165519714355, "global_step": 112584, "epoch": 670} {"train_loss": -9.882513999938965, "global_step": 112585, "epoch": 670} {"train_loss": -9.769638061523438, "global_step": 112586, "epoch": 670} {"train_loss": -9.790661811828613, "global_step": 112587, "epoch": 670} {"train_loss": -10.182294845581055, "global_step": 112588, "epoch": 670} {"train_loss": -9.863687515258789, "global_step": 112589, "epoch": 670} {"train_loss": -9.974905014038086, "global_step": 112590, "epoch": 670} {"train_loss": -10.070602416992188, "global_step": 112591, "epoch": 670} {"train_loss": -9.930191040039062, "global_step": 112592, "epoch": 670} {"train_loss": -10.168331146240234, "global_step": 112593, "epoch": 670} {"train_loss": -10.042827606201172, "global_step": 112594, "epoch": 670} {"train_loss": -10.108732223510742, "global_step": 112595, "epoch": 670} {"train_loss": -10.082403182983398, "global_step": 112596, "epoch": 670} {"train_loss": -9.975082397460938, "global_step": 112597, "epoch": 670} {"train_loss": -10.225390434265137, "global_step": 112598, "epoch": 670} {"train_loss": -10.181674003601074, "global_step": 112599, "epoch": 670} {"train_loss": -10.188591003417969, "global_step": 112600, "epoch": 670} {"train_loss": -9.948049545288086, "global_step": 112601, "epoch": 670} {"train_loss": -10.145256042480469, "global_step": 112602, "epoch": 670} {"train_loss": -10.242254257202148, "global_step": 112603, "epoch": 670} {"train_loss": -10.186572074890137, "global_step": 112604, "epoch": 670} {"train_loss": -10.070915222167969, "global_step": 112605, "epoch": 670} {"train_loss": -10.142824172973633, "global_step": 112606, "epoch": 670} {"train_loss": -10.269903182983398, "global_step": 112607, "epoch": 670} {"train_loss": -10.112619400024414, "global_step": 112608, "epoch": 670} {"train_loss": -10.042009353637695, "global_step": 112609, "epoch": 670} {"train_loss": -10.183206558227539, "global_step": 112610, "epoch": 670} {"train_loss": -10.283650398254395, "global_step": 112611, "epoch": 670} {"train_loss": -9.972610473632812, "global_step": 112612, "epoch": 670} {"train_loss": -10.241411209106445, "global_step": 112613, "epoch": 670} {"train_loss": -10.008056640625, "global_step": 112614, "epoch": 670} {"train_loss": -10.312600135803223, "global_step": 112615, "epoch": 670} {"train_loss": -9.866034507751465, "global_step": 112616, "epoch": 670} {"train_loss": -9.160493850708008, "global_step": 112617, "epoch": 670} {"train_loss": -10.376927375793457, "global_step": 112618, "epoch": 670} {"train_loss": -9.10069465637207, "global_step": 112619, "epoch": 670} {"train_loss": -9.038423538208008, "global_step": 112620, "epoch": 670} {"train_loss": -8.409646987915039, "global_step": 112621, "epoch": 670} {"train_loss": -8.871021270751953, "global_step": 112622, "epoch": 670} {"train_loss": -9.11484146118164, "global_step": 112623, "epoch": 670} {"train_loss": -9.429924011230469, "global_step": 112624, "epoch": 670} {"train_loss": -9.290239334106445, "global_step": 112625, "epoch": 670} {"train_loss": -8.90595531463623, "global_step": 112626, "epoch": 670} {"train_loss": -9.950345993041992, "global_step": 112627, "epoch": 670} {"train_loss": -8.933795928955078, "global_step": 112628, "epoch": 670} {"train_loss": -9.600728988647461, "global_step": 112629, "epoch": 670} {"train_loss": -9.581438064575195, "global_step": 112630, "epoch": 670} {"train_loss": -9.629648208618164, "global_step": 112631, "epoch": 670} {"train_loss": -9.573980331420898, "global_step": 112632, "epoch": 670} {"train_loss": -9.72437858581543, "global_step": 112633, "epoch": 670} {"train_loss": -9.504392623901367, "global_step": 112634, "epoch": 670} {"train_loss": -9.76738166809082, "global_step": 112635, "epoch": 670} {"train_loss": -9.780611038208008, "global_step": 112636, "epoch": 670} {"train_loss": -9.577842712402344, "global_step": 112637, "epoch": 670} {"train_loss": -9.767487525939941, "global_step": 112638, "epoch": 670} {"train_loss": -9.845794677734375, "global_step": 112639, "epoch": 670} {"train_loss": -9.76318359375, "global_step": 112640, "epoch": 670} {"train_loss": -9.66984748840332, "global_step": 112641, "epoch": 670} {"train_loss": -9.73359489440918, "global_step": 112642, "epoch": 670} {"train_loss": -9.750776290893555, "global_step": 112643, "epoch": 670} {"train_loss": -9.423165321350098, "global_step": 112644, "epoch": 670} {"train_loss": -9.751455307006836, "global_step": 112645, "epoch": 670} {"train_loss": -9.803462028503418, "global_step": 112646, "epoch": 670} {"train_loss": -9.983044624328613, "global_step": 112647, "epoch": 670} {"train_loss": -9.661865234375, "global_step": 112648, "epoch": 670} {"train_loss": -9.95954418182373, "global_step": 112649, "epoch": 670} {"train_loss": -10.110902786254883, "global_step": 112650, "epoch": 670} {"train_loss": -9.934124946594238, "global_step": 112651, "epoch": 670} {"train_loss": -9.992172241210938, "global_step": 112652, "epoch": 670} {"train_loss": -9.88296890258789, "global_step": 112653, "epoch": 670} {"train_loss": -9.91769790649414, "global_step": 112654, "epoch": 670} {"train_loss": -10.112833023071289, "global_step": 112655, "epoch": 670} {"train_loss": -9.849294662475586, "global_step": 112656, "epoch": 670} {"train_loss": -9.957351684570312, "global_step": 112657, "epoch": 670} {"train_loss": -9.975561141967773, "global_step": 112658, "epoch": 670} {"train_loss": -9.907390594482422, "global_step": 112659, "epoch": 670} {"train_loss": -10.127065658569336, "global_step": 112660, "epoch": 670} {"train_loss": -10.056291580200195, "global_step": 112661, "epoch": 670} {"train_loss": -9.972386360168457, "global_step": 112662, "epoch": 670} {"train_loss": -10.031834602355957, "global_step": 112663, "epoch": 670} {"train_loss": -10.189102172851562, "global_step": 112664, "epoch": 670} {"train_loss": -10.048870086669922, "global_step": 112665, "epoch": 670} {"train_loss": -9.911776542663574, "global_step": 112666, "epoch": 670} {"train_loss": -9.703192710876465, "global_step": 112667, "epoch": 670} {"train_loss": -10.149059295654297, "global_step": 112668, "epoch": 670} {"train_loss": -9.70493221282959, "global_step": 112669, "epoch": 670} {"train_loss": -10.045580863952637, "global_step": 112670, "epoch": 670} {"train_loss": -10.0048828125, "global_step": 112671, "epoch": 670} {"train_loss": -10.082242965698242, "global_step": 112672, "epoch": 670} {"train_loss": -10.006776809692383, "global_step": 112673, "epoch": 670} {"train_loss": -10.119478225708008, "global_step": 112674, "epoch": 670} {"train_loss": -10.037370681762695, "global_step": 112675, "epoch": 670} {"train_loss": -10.085664749145508, "global_step": 112676, "epoch": 670} {"train_loss": -10.15575885772705, "global_step": 112677, "epoch": 670} {"train_loss": -9.98271369934082, "global_step": 112678, "epoch": 670} {"train_loss": -10.069209098815918, "global_step": 112679, "epoch": 670} {"train_loss": -10.045154571533203, "global_step": 112680, "epoch": 670} {"train_loss": -9.934947967529297, "global_step": 112681, "epoch": 670} {"train_loss": -9.841570854187012, "global_step": 112682, "epoch": 670} {"train_loss": -9.745266914367676, "global_step": 112683, "epoch": 670} {"train_loss": -9.66616153717041, "global_step": 112684, "epoch": 670} {"train_loss": -10.17386531829834, "global_step": 112685, "epoch": 670} {"train_loss": -9.98280143737793, "global_step": 112686, "epoch": 670} {"train_loss": -10.246237754821777, "global_step": 112687, "epoch": 670} {"train_loss": -10.363264083862305, "global_step": 112688, "epoch": 670} {"train_loss": -10.200701713562012, "global_step": 112689, "epoch": 670} {"train_loss": -10.164260864257812, "global_step": 112690, "epoch": 670} {"train_loss": -9.897974014282227, "global_step": 112691, "epoch": 670} {"train_loss": -9.849016189575195, "global_step": 112692, "epoch": 670} {"train_loss": -10.051353454589844, "global_step": 112693, "epoch": 670} {"train_loss": -9.982686042785645, "global_step": 112694, "epoch": 670} {"train_loss": -10.02131175994873, "global_step": 112695, "epoch": 670} {"train_loss": -9.9030179977417, "global_step": 112696, "epoch": 670} {"train_loss": -9.855016708374023, "global_step": 112697, "epoch": 670} {"train_loss": -10.009431838989258, "global_step": 112698, "epoch": 670} {"train_loss": -9.656427383422852, "global_step": 112699, "epoch": 670} {"train_loss": -10.076942443847656, "global_step": 112700, "epoch": 670} {"train_loss": -10.156262397766113, "global_step": 112701, "epoch": 670} {"train_loss": -9.979496002197266, "global_step": 112702, "epoch": 670} {"train_loss": -9.968974113464355, "global_step": 112703, "epoch": 670} {"train_loss": -10.036654472351074, "global_step": 112704, "epoch": 670} {"train_loss": -10.086593627929688, "global_step": 112705, "epoch": 670} {"train_loss": -9.805669784545898, "global_step": 112706, "epoch": 670} {"train_loss": -9.633594512939453, "global_step": 112707, "epoch": 670} {"train_loss": -10.00978946685791, "global_step": 112708, "epoch": 670} {"train_loss": -9.987213134765625, "global_step": 112709, "epoch": 670} {"train_loss": -9.718092918395996, "global_step": 112710, "epoch": 670} {"train_loss": -10.022475242614746, "global_step": 112711, "epoch": 670} {"train_loss": -9.953519821166992, "global_step": 112712, "epoch": 670} {"train_loss": -9.976037979125977, "global_step": 112713, "epoch": 670} {"train_loss": -10.190667152404785, "global_step": 112714, "epoch": 670} {"train_loss": -9.967184066772461, "global_step": 112715, "epoch": 670} {"train_loss": -10.032411575317383, "global_step": 112716, "epoch": 670} {"train_loss": -10.042919158935547, "global_step": 112717, "epoch": 670} {"train_loss": -9.932806968688965, "global_step": 112718, "epoch": 670} {"train_loss": -10.134578704833984, "global_step": 112719, "epoch": 670} {"train_loss": -9.933164596557617, "global_step": 112720, "epoch": 670} {"train_loss": -10.082738876342773, "global_step": 112721, "epoch": 670} {"train_loss": -10.059925079345703, "global_step": 112722, "epoch": 670} {"train_loss": -10.211892127990723, "global_step": 112723, "epoch": 670} {"train_loss": -10.065620422363281, "global_step": 112724, "epoch": 670} {"train_loss": -10.155904769897461, "global_step": 112725, "epoch": 670} {"train_loss": -10.007390022277832, "global_step": 112726, "epoch": 670} {"train_loss": -9.854297081629435, "global_step": 112727, "epoch": 670, "val_loss": 207175.21875, "train_action_mse_error": 3.2082858085632324} {"train_loss": -9.370058059692383, "global_step": 112728, "epoch": 671} {"train_loss": -9.689332962036133, "global_step": 112729, "epoch": 671} {"train_loss": -9.404425621032715, "global_step": 112730, "epoch": 671} {"train_loss": -10.154823303222656, "global_step": 112731, "epoch": 671} {"train_loss": -9.657876968383789, "global_step": 112732, "epoch": 671} {"train_loss": -9.608589172363281, "global_step": 112733, "epoch": 671} {"train_loss": -9.945793151855469, "global_step": 112734, "epoch": 671} {"train_loss": -9.532824516296387, "global_step": 112735, "epoch": 671} {"train_loss": -9.811280250549316, "global_step": 112736, "epoch": 671} {"train_loss": -9.863783836364746, "global_step": 112737, "epoch": 671} {"train_loss": -9.444587707519531, "global_step": 112738, "epoch": 671} {"train_loss": -9.813220977783203, "global_step": 112739, "epoch": 671} {"train_loss": -9.915152549743652, "global_step": 112740, "epoch": 671} {"train_loss": -9.757709503173828, "global_step": 112741, "epoch": 671} {"train_loss": -9.985459327697754, "global_step": 112742, "epoch": 671} {"train_loss": -9.754375457763672, "global_step": 112743, "epoch": 671} {"train_loss": -9.939901351928711, "global_step": 112744, "epoch": 671} {"train_loss": -9.726239204406738, "global_step": 112745, "epoch": 671} {"train_loss": -10.079967498779297, "global_step": 112746, "epoch": 671} {"train_loss": -9.795400619506836, "global_step": 112747, "epoch": 671} {"train_loss": -9.725772857666016, "global_step": 112748, "epoch": 671} {"train_loss": -9.679158210754395, "global_step": 112749, "epoch": 671} {"train_loss": -9.764107704162598, "global_step": 112750, "epoch": 671} {"train_loss": -9.661661148071289, "global_step": 112751, "epoch": 671} {"train_loss": -9.85745620727539, "global_step": 112752, "epoch": 671} {"train_loss": -9.501333236694336, "global_step": 112753, "epoch": 671} {"train_loss": -9.929539680480957, "global_step": 112754, "epoch": 671} {"train_loss": -9.70836067199707, "global_step": 112755, "epoch": 671} {"train_loss": -9.851118087768555, "global_step": 112756, "epoch": 671} {"train_loss": -9.755182266235352, "global_step": 112757, "epoch": 671} {"train_loss": -9.669198989868164, "global_step": 112758, "epoch": 671} {"train_loss": -9.442695617675781, "global_step": 112759, "epoch": 671} {"train_loss": -9.76164436340332, "global_step": 112760, "epoch": 671} {"train_loss": -9.440656661987305, "global_step": 112761, "epoch": 671} {"train_loss": -10.093158721923828, "global_step": 112762, "epoch": 671} {"train_loss": -9.377415657043457, "global_step": 112763, "epoch": 671} {"train_loss": -9.750656127929688, "global_step": 112764, "epoch": 671} {"train_loss": -9.81539535522461, "global_step": 112765, "epoch": 671} {"train_loss": -10.013579368591309, "global_step": 112766, "epoch": 671} {"train_loss": -9.798138618469238, "global_step": 112767, "epoch": 671} {"train_loss": -10.116519927978516, "global_step": 112768, "epoch": 671} {"train_loss": -9.736957550048828, "global_step": 112769, "epoch": 671} {"train_loss": -9.952033996582031, "global_step": 112770, "epoch": 671} {"train_loss": -9.99767780303955, "global_step": 112771, "epoch": 671} {"train_loss": -10.054461479187012, "global_step": 112772, "epoch": 671} {"train_loss": -9.868425369262695, "global_step": 112773, "epoch": 671} {"train_loss": -10.171903610229492, "global_step": 112774, "epoch": 671} {"train_loss": -9.977863311767578, "global_step": 112775, "epoch": 671} {"train_loss": -10.155600547790527, "global_step": 112776, "epoch": 671} {"train_loss": -10.100876808166504, "global_step": 112777, "epoch": 671} {"train_loss": -10.107852935791016, "global_step": 112778, "epoch": 671} {"train_loss": -9.878984451293945, "global_step": 112779, "epoch": 671} {"train_loss": -10.244538307189941, "global_step": 112780, "epoch": 671} {"train_loss": -10.06467056274414, "global_step": 112781, "epoch": 671} {"train_loss": -10.36288070678711, "global_step": 112782, "epoch": 671} {"train_loss": -10.003657341003418, "global_step": 112783, "epoch": 671} {"train_loss": -10.044636726379395, "global_step": 112784, "epoch": 671} {"train_loss": -10.0236177444458, "global_step": 112785, "epoch": 671} {"train_loss": -10.116926193237305, "global_step": 112786, "epoch": 671} {"train_loss": -10.293683052062988, "global_step": 112787, "epoch": 671} {"train_loss": -10.238180160522461, "global_step": 112788, "epoch": 671} {"train_loss": -10.151595115661621, "global_step": 112789, "epoch": 671} {"train_loss": -10.304376602172852, "global_step": 112790, "epoch": 671} {"train_loss": -10.224287033081055, "global_step": 112791, "epoch": 671} {"train_loss": -9.969032287597656, "global_step": 112792, "epoch": 671} {"train_loss": -10.361706733703613, "global_step": 112793, "epoch": 671} {"train_loss": -10.008182525634766, "global_step": 112794, "epoch": 671} {"train_loss": -10.315366744995117, "global_step": 112795, "epoch": 671} {"train_loss": -10.312883377075195, "global_step": 112796, "epoch": 671} {"train_loss": -9.647543907165527, "global_step": 112797, "epoch": 671} {"train_loss": -9.69448471069336, "global_step": 112798, "epoch": 671} {"train_loss": -10.019940376281738, "global_step": 112799, "epoch": 671} {"train_loss": -10.177131652832031, "global_step": 112800, "epoch": 671} {"train_loss": -9.700772285461426, "global_step": 112801, "epoch": 671} {"train_loss": -10.269079208374023, "global_step": 112802, "epoch": 671} {"train_loss": -9.586161613464355, "global_step": 112803, "epoch": 671} {"train_loss": -9.830994606018066, "global_step": 112804, "epoch": 671} {"train_loss": -9.883193016052246, "global_step": 112805, "epoch": 671} {"train_loss": -9.366863250732422, "global_step": 112806, "epoch": 671} {"train_loss": -9.858402252197266, "global_step": 112807, "epoch": 671} {"train_loss": -9.205999374389648, "global_step": 112808, "epoch": 671} {"train_loss": -9.667364120483398, "global_step": 112809, "epoch": 671} {"train_loss": -8.672849655151367, "global_step": 112810, "epoch": 671} {"train_loss": -10.029023170471191, "global_step": 112811, "epoch": 671} {"train_loss": -8.645657539367676, "global_step": 112812, "epoch": 671} {"train_loss": -9.683977127075195, "global_step": 112813, "epoch": 671} {"train_loss": -9.157513618469238, "global_step": 112814, "epoch": 671} {"train_loss": -9.826626777648926, "global_step": 112815, "epoch": 671} {"train_loss": -9.013710975646973, "global_step": 112816, "epoch": 671} {"train_loss": -9.340730667114258, "global_step": 112817, "epoch": 671} {"train_loss": -9.434710502624512, "global_step": 112818, "epoch": 671} {"train_loss": -9.092658042907715, "global_step": 112819, "epoch": 671} {"train_loss": -9.562061309814453, "global_step": 112820, "epoch": 671} {"train_loss": -9.203246116638184, "global_step": 112821, "epoch": 671} {"train_loss": -9.822388648986816, "global_step": 112822, "epoch": 671} {"train_loss": -9.437417984008789, "global_step": 112823, "epoch": 671} {"train_loss": -9.591004371643066, "global_step": 112824, "epoch": 671} {"train_loss": -9.890764236450195, "global_step": 112825, "epoch": 671} {"train_loss": -9.713971138000488, "global_step": 112826, "epoch": 671} {"train_loss": -9.795684814453125, "global_step": 112827, "epoch": 671} {"train_loss": -9.717446327209473, "global_step": 112828, "epoch": 671} {"train_loss": -9.865249633789062, "global_step": 112829, "epoch": 671} {"train_loss": -9.81435775756836, "global_step": 112830, "epoch": 671} {"train_loss": -9.613027572631836, "global_step": 112831, "epoch": 671} {"train_loss": -9.94981575012207, "global_step": 112832, "epoch": 671} {"train_loss": -9.682839393615723, "global_step": 112833, "epoch": 671} {"train_loss": -10.010407447814941, "global_step": 112834, "epoch": 671} {"train_loss": -10.151860237121582, "global_step": 112835, "epoch": 671} {"train_loss": -9.787368774414062, "global_step": 112836, "epoch": 671} {"train_loss": -9.938987731933594, "global_step": 112837, "epoch": 671} {"train_loss": -9.831816673278809, "global_step": 112838, "epoch": 671} {"train_loss": -9.997998237609863, "global_step": 112839, "epoch": 671} {"train_loss": -9.89610481262207, "global_step": 112840, "epoch": 671} {"train_loss": -9.591702461242676, "global_step": 112841, "epoch": 671} {"train_loss": -10.063295364379883, "global_step": 112842, "epoch": 671} {"train_loss": -9.64171028137207, "global_step": 112843, "epoch": 671} {"train_loss": -9.845882415771484, "global_step": 112844, "epoch": 671} {"train_loss": -9.860946655273438, "global_step": 112845, "epoch": 671} {"train_loss": -10.08568000793457, "global_step": 112846, "epoch": 671} {"train_loss": -9.987178802490234, "global_step": 112847, "epoch": 671} {"train_loss": -10.046516418457031, "global_step": 112848, "epoch": 671} {"train_loss": -10.273859024047852, "global_step": 112849, "epoch": 671} {"train_loss": -9.8837308883667, "global_step": 112850, "epoch": 671} {"train_loss": -10.394979476928711, "global_step": 112851, "epoch": 671} {"train_loss": -10.09389877319336, "global_step": 112852, "epoch": 671} {"train_loss": -10.178730010986328, "global_step": 112853, "epoch": 671} {"train_loss": -10.02570915222168, "global_step": 112854, "epoch": 671} {"train_loss": -10.156166076660156, "global_step": 112855, "epoch": 671} {"train_loss": -10.090890884399414, "global_step": 112856, "epoch": 671} {"train_loss": -10.221050262451172, "global_step": 112857, "epoch": 671} {"train_loss": -10.019481658935547, "global_step": 112858, "epoch": 671} {"train_loss": -10.175458908081055, "global_step": 112859, "epoch": 671} {"train_loss": -9.993314743041992, "global_step": 112860, "epoch": 671} {"train_loss": -9.894777297973633, "global_step": 112861, "epoch": 671} {"train_loss": -9.871006965637207, "global_step": 112862, "epoch": 671} {"train_loss": -10.098503112792969, "global_step": 112863, "epoch": 671} {"train_loss": -9.87611198425293, "global_step": 112864, "epoch": 671} {"train_loss": -10.09583854675293, "global_step": 112865, "epoch": 671} {"train_loss": -9.937244415283203, "global_step": 112866, "epoch": 671} {"train_loss": -10.283689498901367, "global_step": 112867, "epoch": 671} {"train_loss": -10.011335372924805, "global_step": 112868, "epoch": 671} {"train_loss": -9.958719253540039, "global_step": 112869, "epoch": 671} {"train_loss": -10.043989181518555, "global_step": 112870, "epoch": 671} {"train_loss": -9.940889358520508, "global_step": 112871, "epoch": 671} {"train_loss": -10.084637641906738, "global_step": 112872, "epoch": 671} {"train_loss": -9.989919662475586, "global_step": 112873, "epoch": 671} {"train_loss": -10.13625431060791, "global_step": 112874, "epoch": 671} {"train_loss": -10.070966720581055, "global_step": 112875, "epoch": 671} {"train_loss": -10.229999542236328, "global_step": 112876, "epoch": 671} {"train_loss": -9.842636108398438, "global_step": 112877, "epoch": 671} {"train_loss": -10.094879150390625, "global_step": 112878, "epoch": 671} {"train_loss": -10.09696102142334, "global_step": 112879, "epoch": 671} {"train_loss": -10.01207447052002, "global_step": 112880, "epoch": 671} {"train_loss": -10.048925399780273, "global_step": 112881, "epoch": 671} {"train_loss": -10.063539505004883, "global_step": 112882, "epoch": 671} {"train_loss": -10.320671081542969, "global_step": 112883, "epoch": 671} {"train_loss": -10.209582328796387, "global_step": 112884, "epoch": 671} {"train_loss": -10.092565536499023, "global_step": 112885, "epoch": 671} {"train_loss": -10.241900444030762, "global_step": 112886, "epoch": 671} {"train_loss": -10.081758499145508, "global_step": 112887, "epoch": 671} {"train_loss": -10.145435333251953, "global_step": 112888, "epoch": 671} {"train_loss": -9.902462005615234, "global_step": 112889, "epoch": 671} {"train_loss": -9.966531753540039, "global_step": 112890, "epoch": 671} {"train_loss": -10.1708345413208, "global_step": 112891, "epoch": 671} {"train_loss": -10.093772888183594, "global_step": 112892, "epoch": 671} {"train_loss": -10.154502868652344, "global_step": 112893, "epoch": 671} {"train_loss": -9.990727424621582, "global_step": 112894, "epoch": 671} {"train_loss": -9.884337510381426, "global_step": 112895, "epoch": 671, "val_loss": 212790.703125} {"train_loss": -9.793340682983398, "global_step": 112896, "epoch": 672} {"train_loss": -9.795419692993164, "global_step": 112897, "epoch": 672} {"train_loss": -9.821102142333984, "global_step": 112898, "epoch": 672} {"train_loss": -9.03879165649414, "global_step": 112899, "epoch": 672} {"train_loss": -9.999931335449219, "global_step": 112900, "epoch": 672} {"train_loss": -9.765634536743164, "global_step": 112901, "epoch": 672} {"train_loss": -9.423562049865723, "global_step": 112902, "epoch": 672} {"train_loss": -10.096030235290527, "global_step": 112903, "epoch": 672} {"train_loss": -9.61262321472168, "global_step": 112904, "epoch": 672} {"train_loss": -9.852901458740234, "global_step": 112905, "epoch": 672} {"train_loss": -9.977225303649902, "global_step": 112906, "epoch": 672} {"train_loss": -9.877413749694824, "global_step": 112907, "epoch": 672} {"train_loss": -10.107686996459961, "global_step": 112908, "epoch": 672} {"train_loss": -9.792970657348633, "global_step": 112909, "epoch": 672} {"train_loss": -10.022377014160156, "global_step": 112910, "epoch": 672} {"train_loss": -9.79871940612793, "global_step": 112911, "epoch": 672} {"train_loss": -9.963899612426758, "global_step": 112912, "epoch": 672} {"train_loss": -9.809853553771973, "global_step": 112913, "epoch": 672} {"train_loss": -9.727354049682617, "global_step": 112914, "epoch": 672} {"train_loss": -10.118953704833984, "global_step": 112915, "epoch": 672} {"train_loss": -9.739700317382812, "global_step": 112916, "epoch": 672} {"train_loss": -10.083976745605469, "global_step": 112917, "epoch": 672} {"train_loss": -10.169271469116211, "global_step": 112918, "epoch": 672} {"train_loss": -9.927656173706055, "global_step": 112919, "epoch": 672} {"train_loss": -10.013338088989258, "global_step": 112920, "epoch": 672} {"train_loss": -9.860457420349121, "global_step": 112921, "epoch": 672} {"train_loss": -9.57093620300293, "global_step": 112922, "epoch": 672} {"train_loss": -9.860511779785156, "global_step": 112923, "epoch": 672} {"train_loss": -10.003389358520508, "global_step": 112924, "epoch": 672} {"train_loss": -9.752145767211914, "global_step": 112925, "epoch": 672} {"train_loss": -9.986627578735352, "global_step": 112926, "epoch": 672} {"train_loss": -9.753708839416504, "global_step": 112927, "epoch": 672} {"train_loss": -10.133565902709961, "global_step": 112928, "epoch": 672} {"train_loss": -10.15009593963623, "global_step": 112929, "epoch": 672} {"train_loss": -9.98889446258545, "global_step": 112930, "epoch": 672} {"train_loss": -10.245264053344727, "global_step": 112931, "epoch": 672} {"train_loss": -10.024965286254883, "global_step": 112932, "epoch": 672} {"train_loss": -9.89527702331543, "global_step": 112933, "epoch": 672} {"train_loss": -10.173307418823242, "global_step": 112934, "epoch": 672} {"train_loss": -10.009446144104004, "global_step": 112935, "epoch": 672} {"train_loss": -9.857362747192383, "global_step": 112936, "epoch": 672} {"train_loss": -10.057469367980957, "global_step": 112937, "epoch": 672} {"train_loss": -9.571409225463867, "global_step": 112938, "epoch": 672} {"train_loss": -10.095649719238281, "global_step": 112939, "epoch": 672} {"train_loss": -9.551465034484863, "global_step": 112940, "epoch": 672} {"train_loss": -9.825862884521484, "global_step": 112941, "epoch": 672} {"train_loss": -9.778141021728516, "global_step": 112942, "epoch": 672} {"train_loss": -8.979373931884766, "global_step": 112943, "epoch": 672} {"train_loss": -9.779073715209961, "global_step": 112944, "epoch": 672} {"train_loss": -9.309659957885742, "global_step": 112945, "epoch": 672} {"train_loss": -9.565620422363281, "global_step": 112946, "epoch": 672} {"train_loss": -9.271048545837402, "global_step": 112947, "epoch": 672} {"train_loss": -9.761467933654785, "global_step": 112948, "epoch": 672} {"train_loss": -9.247491836547852, "global_step": 112949, "epoch": 672} {"train_loss": -9.655149459838867, "global_step": 112950, "epoch": 672} {"train_loss": -9.004919052124023, "global_step": 112951, "epoch": 672} {"train_loss": -9.454160690307617, "global_step": 112952, "epoch": 672} {"train_loss": -9.49942684173584, "global_step": 112953, "epoch": 672} {"train_loss": -9.677323341369629, "global_step": 112954, "epoch": 672} {"train_loss": -9.714273452758789, "global_step": 112955, "epoch": 672} {"train_loss": -9.636323928833008, "global_step": 112956, "epoch": 672} {"train_loss": -9.717266082763672, "global_step": 112957, "epoch": 672} {"train_loss": -9.653684616088867, "global_step": 112958, "epoch": 672} {"train_loss": -9.651344299316406, "global_step": 112959, "epoch": 672} {"train_loss": -9.58248519897461, "global_step": 112960, "epoch": 672} {"train_loss": -9.629989624023438, "global_step": 112961, "epoch": 672} {"train_loss": -9.867631912231445, "global_step": 112962, "epoch": 672} {"train_loss": -9.66317367553711, "global_step": 112963, "epoch": 672} {"train_loss": -9.935810089111328, "global_step": 112964, "epoch": 672} {"train_loss": -9.654510498046875, "global_step": 112965, "epoch": 672} {"train_loss": -9.863313674926758, "global_step": 112966, "epoch": 672} {"train_loss": -9.581504821777344, "global_step": 112967, "epoch": 672} {"train_loss": -9.93520450592041, "global_step": 112968, "epoch": 672} {"train_loss": -9.742496490478516, "global_step": 112969, "epoch": 672} {"train_loss": -9.878534317016602, "global_step": 112970, "epoch": 672} {"train_loss": -9.861701965332031, "global_step": 112971, "epoch": 672} {"train_loss": -9.432743072509766, "global_step": 112972, "epoch": 672} {"train_loss": -9.93643569946289, "global_step": 112973, "epoch": 672} {"train_loss": -10.047627449035645, "global_step": 112974, "epoch": 672} {"train_loss": -9.789047241210938, "global_step": 112975, "epoch": 672} {"train_loss": -9.59585952758789, "global_step": 112976, "epoch": 672} {"train_loss": -9.99077320098877, "global_step": 112977, "epoch": 672} {"train_loss": -9.874999046325684, "global_step": 112978, "epoch": 672} {"train_loss": -9.7054443359375, "global_step": 112979, "epoch": 672} {"train_loss": -10.090597152709961, "global_step": 112980, "epoch": 672} {"train_loss": -9.922233581542969, "global_step": 112981, "epoch": 672} {"train_loss": -9.88782024383545, "global_step": 112982, "epoch": 672} {"train_loss": -10.091056823730469, "global_step": 112983, "epoch": 672} {"train_loss": -10.063034057617188, "global_step": 112984, "epoch": 672} {"train_loss": -9.880660057067871, "global_step": 112985, "epoch": 672} {"train_loss": -10.266600608825684, "global_step": 112986, "epoch": 672} {"train_loss": -9.835012435913086, "global_step": 112987, "epoch": 672} {"train_loss": -10.154282569885254, "global_step": 112988, "epoch": 672} {"train_loss": -9.991188049316406, "global_step": 112989, "epoch": 672} {"train_loss": -10.346735000610352, "global_step": 112990, "epoch": 672} {"train_loss": -10.163281440734863, "global_step": 112991, "epoch": 672} {"train_loss": -10.150741577148438, "global_step": 112992, "epoch": 672} {"train_loss": -10.448126792907715, "global_step": 112993, "epoch": 672} {"train_loss": -10.035730361938477, "global_step": 112994, "epoch": 672} {"train_loss": -9.765203475952148, "global_step": 112995, "epoch": 672} {"train_loss": -10.2160005569458, "global_step": 112996, "epoch": 672} {"train_loss": -10.31333065032959, "global_step": 112997, "epoch": 672} {"train_loss": -9.850796699523926, "global_step": 112998, "epoch": 672} {"train_loss": -10.18678092956543, "global_step": 112999, "epoch": 672} {"train_loss": -9.360518455505371, "global_step": 113000, "epoch": 672} {"train_loss": -9.99233341217041, "global_step": 113001, "epoch": 672} {"train_loss": -10.25869083404541, "global_step": 113002, "epoch": 672} {"train_loss": -9.834903717041016, "global_step": 113003, "epoch": 672} {"train_loss": -10.068315505981445, "global_step": 113004, "epoch": 672} {"train_loss": -9.838981628417969, "global_step": 113005, "epoch": 672} {"train_loss": -10.182083129882812, "global_step": 113006, "epoch": 672} {"train_loss": -10.217941284179688, "global_step": 113007, "epoch": 672} {"train_loss": -9.93704605102539, "global_step": 113008, "epoch": 672} {"train_loss": -10.131893157958984, "global_step": 113009, "epoch": 672} {"train_loss": -10.26959228515625, "global_step": 113010, "epoch": 672} {"train_loss": -9.980890274047852, "global_step": 113011, "epoch": 672} {"train_loss": -10.076395988464355, "global_step": 113012, "epoch": 672} {"train_loss": -9.981422424316406, "global_step": 113013, "epoch": 672} {"train_loss": -10.164169311523438, "global_step": 113014, "epoch": 672} {"train_loss": -9.9244966506958, "global_step": 113015, "epoch": 672} {"train_loss": -10.020009994506836, "global_step": 113016, "epoch": 672} {"train_loss": -9.79230785369873, "global_step": 113017, "epoch": 672} {"train_loss": -10.07687759399414, "global_step": 113018, "epoch": 672} {"train_loss": -9.691512107849121, "global_step": 113019, "epoch": 672} {"train_loss": -10.19216537475586, "global_step": 113020, "epoch": 672} {"train_loss": -9.643272399902344, "global_step": 113021, "epoch": 672} {"train_loss": -10.078822135925293, "global_step": 113022, "epoch": 672} {"train_loss": -9.975624084472656, "global_step": 113023, "epoch": 672} {"train_loss": -9.51771354675293, "global_step": 113024, "epoch": 672} {"train_loss": -9.960748672485352, "global_step": 113025, "epoch": 672} {"train_loss": -9.176502227783203, "global_step": 113026, "epoch": 672} {"train_loss": -9.86115837097168, "global_step": 113027, "epoch": 672} {"train_loss": -9.882856369018555, "global_step": 113028, "epoch": 672} {"train_loss": -9.694282531738281, "global_step": 113029, "epoch": 672} {"train_loss": -9.866157531738281, "global_step": 113030, "epoch": 672} {"train_loss": -10.041662216186523, "global_step": 113031, "epoch": 672} {"train_loss": -9.75728988647461, "global_step": 113032, "epoch": 672} {"train_loss": -10.103824615478516, "global_step": 113033, "epoch": 672} {"train_loss": -9.95449447631836, "global_step": 113034, "epoch": 672} {"train_loss": -9.947131156921387, "global_step": 113035, "epoch": 672} {"train_loss": -9.787141799926758, "global_step": 113036, "epoch": 672} {"train_loss": -9.976289749145508, "global_step": 113037, "epoch": 672} {"train_loss": -10.01649284362793, "global_step": 113038, "epoch": 672} {"train_loss": -10.104923248291016, "global_step": 113039, "epoch": 672} {"train_loss": -9.93629264831543, "global_step": 113040, "epoch": 672} {"train_loss": -9.939777374267578, "global_step": 113041, "epoch": 672} {"train_loss": -10.08013916015625, "global_step": 113042, "epoch": 672} {"train_loss": -10.029510498046875, "global_step": 113043, "epoch": 672} {"train_loss": -9.944305419921875, "global_step": 113044, "epoch": 672} {"train_loss": -10.18354320526123, "global_step": 113045, "epoch": 672} {"train_loss": -10.094745635986328, "global_step": 113046, "epoch": 672} {"train_loss": -9.698991775512695, "global_step": 113047, "epoch": 672} {"train_loss": -10.047191619873047, "global_step": 113048, "epoch": 672} {"train_loss": -9.645234107971191, "global_step": 113049, "epoch": 672} {"train_loss": -9.937196731567383, "global_step": 113050, "epoch": 672} {"train_loss": -10.047595024108887, "global_step": 113051, "epoch": 672} {"train_loss": -10.128292083740234, "global_step": 113052, "epoch": 672} {"train_loss": -9.438077926635742, "global_step": 113053, "epoch": 672} {"train_loss": -10.08114242553711, "global_step": 113054, "epoch": 672} {"train_loss": -10.04647445678711, "global_step": 113055, "epoch": 672} {"train_loss": -10.106415748596191, "global_step": 113056, "epoch": 672} {"train_loss": -10.099903106689453, "global_step": 113057, "epoch": 672} {"train_loss": -10.035974502563477, "global_step": 113058, "epoch": 672} {"train_loss": -10.168672561645508, "global_step": 113059, "epoch": 672} {"train_loss": -10.073639869689941, "global_step": 113060, "epoch": 672} {"train_loss": -9.849569320678711, "global_step": 113061, "epoch": 672} {"train_loss": -10.149175643920898, "global_step": 113062, "epoch": 672} {"train_loss": -9.88131715002514, "global_step": 113063, "epoch": 672, "val_loss": 212961.703125} {"train_loss": -9.644132614135742, "global_step": 113064, "epoch": 673} {"train_loss": -9.866495132446289, "global_step": 113065, "epoch": 673} {"train_loss": -9.352834701538086, "global_step": 113066, "epoch": 673} {"train_loss": -10.15837287902832, "global_step": 113067, "epoch": 673} {"train_loss": -9.368185997009277, "global_step": 113068, "epoch": 673} {"train_loss": -10.190974235534668, "global_step": 113069, "epoch": 673} {"train_loss": -9.491315841674805, "global_step": 113070, "epoch": 673} {"train_loss": -9.833162307739258, "global_step": 113071, "epoch": 673} {"train_loss": -9.506824493408203, "global_step": 113072, "epoch": 673} {"train_loss": -9.828364372253418, "global_step": 113073, "epoch": 673} {"train_loss": -9.537307739257812, "global_step": 113074, "epoch": 673} {"train_loss": -9.76274299621582, "global_step": 113075, "epoch": 673} {"train_loss": -9.781545639038086, "global_step": 113076, "epoch": 673} {"train_loss": -9.88354778289795, "global_step": 113077, "epoch": 673} {"train_loss": -9.876530647277832, "global_step": 113078, "epoch": 673} {"train_loss": -9.882269859313965, "global_step": 113079, "epoch": 673} {"train_loss": -9.947225570678711, "global_step": 113080, "epoch": 673} {"train_loss": -10.024354934692383, "global_step": 113081, "epoch": 673} {"train_loss": -9.959104537963867, "global_step": 113082, "epoch": 673} {"train_loss": -9.990321159362793, "global_step": 113083, "epoch": 673} {"train_loss": -9.870426177978516, "global_step": 113084, "epoch": 673} {"train_loss": -10.170543670654297, "global_step": 113085, "epoch": 673} {"train_loss": -10.038331985473633, "global_step": 113086, "epoch": 673} {"train_loss": -10.102216720581055, "global_step": 113087, "epoch": 673} {"train_loss": -10.185503005981445, "global_step": 113088, "epoch": 673} {"train_loss": -9.89602279663086, "global_step": 113089, "epoch": 673} {"train_loss": -10.055785179138184, "global_step": 113090, "epoch": 673} {"train_loss": -10.062634468078613, "global_step": 113091, "epoch": 673} {"train_loss": -10.066824913024902, "global_step": 113092, "epoch": 673} {"train_loss": -9.876778602600098, "global_step": 113093, "epoch": 673} {"train_loss": -10.18578052520752, "global_step": 113094, "epoch": 673} {"train_loss": -9.93271541595459, "global_step": 113095, "epoch": 673} {"train_loss": -10.12527847290039, "global_step": 113096, "epoch": 673} {"train_loss": -9.925680160522461, "global_step": 113097, "epoch": 673} {"train_loss": -10.447864532470703, "global_step": 113098, "epoch": 673} {"train_loss": -10.009332656860352, "global_step": 113099, "epoch": 673} {"train_loss": -9.907801628112793, "global_step": 113100, "epoch": 673} {"train_loss": -10.102689743041992, "global_step": 113101, "epoch": 673} {"train_loss": -10.140178680419922, "global_step": 113102, "epoch": 673} {"train_loss": -10.097587585449219, "global_step": 113103, "epoch": 673} {"train_loss": -10.2728910446167, "global_step": 113104, "epoch": 673} {"train_loss": -10.246149063110352, "global_step": 113105, "epoch": 673} {"train_loss": -10.30928897857666, "global_step": 113106, "epoch": 673} {"train_loss": -10.326456069946289, "global_step": 113107, "epoch": 673} {"train_loss": -10.217755317687988, "global_step": 113108, "epoch": 673} {"train_loss": -10.131126403808594, "global_step": 113109, "epoch": 673} {"train_loss": -10.024572372436523, "global_step": 113110, "epoch": 673} {"train_loss": -10.464664459228516, "global_step": 113111, "epoch": 673} {"train_loss": -10.033075332641602, "global_step": 113112, "epoch": 673} {"train_loss": -9.732111930847168, "global_step": 113113, "epoch": 673} {"train_loss": -9.833246231079102, "global_step": 113114, "epoch": 673} {"train_loss": -9.658794403076172, "global_step": 113115, "epoch": 673} {"train_loss": -10.00522232055664, "global_step": 113116, "epoch": 673} {"train_loss": -9.783565521240234, "global_step": 113117, "epoch": 673} {"train_loss": -9.98775577545166, "global_step": 113118, "epoch": 673} {"train_loss": -9.691278457641602, "global_step": 113119, "epoch": 673} {"train_loss": -9.916547775268555, "global_step": 113120, "epoch": 673} {"train_loss": -10.04046630859375, "global_step": 113121, "epoch": 673} {"train_loss": -9.887626647949219, "global_step": 113122, "epoch": 673} {"train_loss": -10.059016227722168, "global_step": 113123, "epoch": 673} {"train_loss": -9.506948471069336, "global_step": 113124, "epoch": 673} {"train_loss": -9.777973175048828, "global_step": 113125, "epoch": 673} {"train_loss": -9.952409744262695, "global_step": 113126, "epoch": 673} {"train_loss": -9.436872482299805, "global_step": 113127, "epoch": 673} {"train_loss": -10.000163078308105, "global_step": 113128, "epoch": 673} {"train_loss": -9.84206771850586, "global_step": 113129, "epoch": 673} {"train_loss": -10.053102493286133, "global_step": 113130, "epoch": 673} {"train_loss": -9.743500709533691, "global_step": 113131, "epoch": 673} {"train_loss": -9.944099426269531, "global_step": 113132, "epoch": 673} {"train_loss": -10.03233528137207, "global_step": 113133, "epoch": 673} {"train_loss": -10.124933242797852, "global_step": 113134, "epoch": 673} {"train_loss": -9.755470275878906, "global_step": 113135, "epoch": 673} {"train_loss": -10.157282829284668, "global_step": 113136, "epoch": 673} {"train_loss": -9.746063232421875, "global_step": 113137, "epoch": 673} {"train_loss": -9.917614936828613, "global_step": 113138, "epoch": 673} {"train_loss": -9.537412643432617, "global_step": 113139, "epoch": 673} {"train_loss": -9.534761428833008, "global_step": 113140, "epoch": 673} {"train_loss": -9.74948501586914, "global_step": 113141, "epoch": 673} {"train_loss": -9.627270698547363, "global_step": 113142, "epoch": 673} {"train_loss": -9.717035293579102, "global_step": 113143, "epoch": 673} {"train_loss": -9.234014511108398, "global_step": 113144, "epoch": 673} {"train_loss": -9.891647338867188, "global_step": 113145, "epoch": 673} {"train_loss": -9.392230987548828, "global_step": 113146, "epoch": 673} {"train_loss": -9.737676620483398, "global_step": 113147, "epoch": 673} {"train_loss": -9.851103782653809, "global_step": 113148, "epoch": 673} {"train_loss": -9.760696411132812, "global_step": 113149, "epoch": 673} {"train_loss": -9.633040428161621, "global_step": 113150, "epoch": 673} {"train_loss": -10.025933265686035, "global_step": 113151, "epoch": 673} {"train_loss": -9.958512306213379, "global_step": 113152, "epoch": 673} {"train_loss": -9.907031059265137, "global_step": 113153, "epoch": 673} {"train_loss": -10.097539901733398, "global_step": 113154, "epoch": 673} {"train_loss": -9.914798736572266, "global_step": 113155, "epoch": 673} {"train_loss": -9.714757919311523, "global_step": 113156, "epoch": 673} {"train_loss": -10.035304069519043, "global_step": 113157, "epoch": 673} {"train_loss": -9.767826080322266, "global_step": 113158, "epoch": 673} {"train_loss": -9.939608573913574, "global_step": 113159, "epoch": 673} {"train_loss": -10.06075382232666, "global_step": 113160, "epoch": 673} {"train_loss": -9.940829277038574, "global_step": 113161, "epoch": 673} {"train_loss": -10.141502380371094, "global_step": 113162, "epoch": 673} {"train_loss": -10.111038208007812, "global_step": 113163, "epoch": 673} {"train_loss": -10.073705673217773, "global_step": 113164, "epoch": 673} {"train_loss": -10.082971572875977, "global_step": 113165, "epoch": 673} {"train_loss": -10.114367485046387, "global_step": 113166, "epoch": 673} {"train_loss": -10.054763793945312, "global_step": 113167, "epoch": 673} {"train_loss": -10.097148895263672, "global_step": 113168, "epoch": 673} {"train_loss": -10.227226257324219, "global_step": 113169, "epoch": 673} {"train_loss": -9.918630599975586, "global_step": 113170, "epoch": 673} {"train_loss": -10.074882507324219, "global_step": 113171, "epoch": 673} {"train_loss": -9.91448974609375, "global_step": 113172, "epoch": 673} {"train_loss": -9.996631622314453, "global_step": 113173, "epoch": 673} {"train_loss": -10.024473190307617, "global_step": 113174, "epoch": 673} {"train_loss": -9.953361511230469, "global_step": 113175, "epoch": 673} {"train_loss": -10.133588790893555, "global_step": 113176, "epoch": 673} {"train_loss": -9.502766609191895, "global_step": 113177, "epoch": 673} {"train_loss": -10.099987030029297, "global_step": 113178, "epoch": 673} {"train_loss": -9.727733612060547, "global_step": 113179, "epoch": 673} {"train_loss": -9.737117767333984, "global_step": 113180, "epoch": 673} {"train_loss": -9.623736381530762, "global_step": 113181, "epoch": 673} {"train_loss": -9.347535133361816, "global_step": 113182, "epoch": 673} {"train_loss": -9.2237548828125, "global_step": 113183, "epoch": 673} {"train_loss": -9.614034652709961, "global_step": 113184, "epoch": 673} {"train_loss": -9.311676979064941, "global_step": 113185, "epoch": 673} {"train_loss": -10.064468383789062, "global_step": 113186, "epoch": 673} {"train_loss": -9.522841453552246, "global_step": 113187, "epoch": 673} {"train_loss": -9.786676406860352, "global_step": 113188, "epoch": 673} {"train_loss": -9.708344459533691, "global_step": 113189, "epoch": 673} {"train_loss": -9.484868049621582, "global_step": 113190, "epoch": 673} {"train_loss": -9.38337516784668, "global_step": 113191, "epoch": 673} {"train_loss": -9.847576141357422, "global_step": 113192, "epoch": 673} {"train_loss": -9.271227836608887, "global_step": 113193, "epoch": 673} {"train_loss": -10.067994117736816, "global_step": 113194, "epoch": 673} {"train_loss": -9.76173210144043, "global_step": 113195, "epoch": 673} {"train_loss": -9.488505363464355, "global_step": 113196, "epoch": 673} {"train_loss": -9.840289115905762, "global_step": 113197, "epoch": 673} {"train_loss": -9.85593032836914, "global_step": 113198, "epoch": 673} {"train_loss": -9.8700532913208, "global_step": 113199, "epoch": 673} {"train_loss": -9.598633766174316, "global_step": 113200, "epoch": 673} {"train_loss": -9.903336524963379, "global_step": 113201, "epoch": 673} {"train_loss": -9.570226669311523, "global_step": 113202, "epoch": 673} {"train_loss": -9.850662231445312, "global_step": 113203, "epoch": 673} {"train_loss": -9.650091171264648, "global_step": 113204, "epoch": 673} {"train_loss": -9.89858627319336, "global_step": 113205, "epoch": 673} {"train_loss": -9.574331283569336, "global_step": 113206, "epoch": 673} {"train_loss": -9.775940895080566, "global_step": 113207, "epoch": 673} {"train_loss": -9.369874954223633, "global_step": 113208, "epoch": 673} {"train_loss": -9.984635353088379, "global_step": 113209, "epoch": 673} {"train_loss": -9.86695384979248, "global_step": 113210, "epoch": 673} {"train_loss": -9.719963073730469, "global_step": 113211, "epoch": 673} {"train_loss": -10.069303512573242, "global_step": 113212, "epoch": 673} {"train_loss": -10.002620697021484, "global_step": 113213, "epoch": 673} {"train_loss": -9.954018592834473, "global_step": 113214, "epoch": 673} {"train_loss": -9.952861785888672, "global_step": 113215, "epoch": 673} {"train_loss": -10.042091369628906, "global_step": 113216, "epoch": 673} {"train_loss": -9.959030151367188, "global_step": 113217, "epoch": 673} {"train_loss": -10.048355102539062, "global_step": 113218, "epoch": 673} {"train_loss": -9.79511833190918, "global_step": 113219, "epoch": 673} {"train_loss": -9.960967063903809, "global_step": 113220, "epoch": 673} {"train_loss": -9.910564422607422, "global_step": 113221, "epoch": 673} {"train_loss": -9.768954277038574, "global_step": 113222, "epoch": 673} {"train_loss": -10.270621299743652, "global_step": 113223, "epoch": 673} {"train_loss": -10.000783920288086, "global_step": 113224, "epoch": 673} {"train_loss": -10.07768440246582, "global_step": 113225, "epoch": 673} {"train_loss": -9.967024803161621, "global_step": 113226, "epoch": 673} {"train_loss": -10.304479598999023, "global_step": 113227, "epoch": 673} {"train_loss": -10.163997650146484, "global_step": 113228, "epoch": 673} {"train_loss": -10.48516845703125, "global_step": 113229, "epoch": 673} {"train_loss": -10.343287467956543, "global_step": 113230, "epoch": 673} {"train_loss": -9.893279563812982, "global_step": 113231, "epoch": 673, "val_loss": 212066.828125} {"train_loss": -10.274630546569824, "global_step": 113232, "epoch": 674} {"train_loss": -10.317525863647461, "global_step": 113233, "epoch": 674} {"train_loss": -10.179107666015625, "global_step": 113234, "epoch": 674} {"train_loss": -10.389198303222656, "global_step": 113235, "epoch": 674} {"train_loss": -10.389655113220215, "global_step": 113236, "epoch": 674} {"train_loss": -10.320413589477539, "global_step": 113237, "epoch": 674} {"train_loss": -10.355110168457031, "global_step": 113238, "epoch": 674} {"train_loss": -10.36242389678955, "global_step": 113239, "epoch": 674} {"train_loss": -10.357223510742188, "global_step": 113240, "epoch": 674} {"train_loss": -10.487654685974121, "global_step": 113241, "epoch": 674} {"train_loss": -10.119169235229492, "global_step": 113242, "epoch": 674} {"train_loss": -10.290875434875488, "global_step": 113243, "epoch": 674} {"train_loss": -10.45546817779541, "global_step": 113244, "epoch": 674} {"train_loss": -10.342411994934082, "global_step": 113245, "epoch": 674} {"train_loss": -10.260637283325195, "global_step": 113246, "epoch": 674} {"train_loss": -10.241873741149902, "global_step": 113247, "epoch": 674} {"train_loss": -10.182157516479492, "global_step": 113248, "epoch": 674} {"train_loss": -10.2562837600708, "global_step": 113249, "epoch": 674} {"train_loss": -10.125876426696777, "global_step": 113250, "epoch": 674} {"train_loss": -10.353693008422852, "global_step": 113251, "epoch": 674} {"train_loss": -10.00550651550293, "global_step": 113252, "epoch": 674} {"train_loss": -9.933040618896484, "global_step": 113253, "epoch": 674} {"train_loss": -10.130426406860352, "global_step": 113254, "epoch": 674} {"train_loss": -10.184768676757812, "global_step": 113255, "epoch": 674} {"train_loss": -10.13627815246582, "global_step": 113256, "epoch": 674} {"train_loss": -9.892343521118164, "global_step": 113257, "epoch": 674} {"train_loss": -9.972455978393555, "global_step": 113258, "epoch": 674} {"train_loss": -9.095035552978516, "global_step": 113259, "epoch": 674} {"train_loss": -9.837236404418945, "global_step": 113260, "epoch": 674} {"train_loss": -9.659975051879883, "global_step": 113261, "epoch": 674} {"train_loss": -8.810848236083984, "global_step": 113262, "epoch": 674} {"train_loss": -9.238346099853516, "global_step": 113263, "epoch": 674} {"train_loss": -8.30023193359375, "global_step": 113264, "epoch": 674} {"train_loss": -9.613326072692871, "global_step": 113265, "epoch": 674} {"train_loss": -9.577824592590332, "global_step": 113266, "epoch": 674} {"train_loss": -9.566287994384766, "global_step": 113267, "epoch": 674} {"train_loss": -8.574756622314453, "global_step": 113268, "epoch": 674} {"train_loss": -9.71064567565918, "global_step": 113269, "epoch": 674} {"train_loss": -9.099357604980469, "global_step": 113270, "epoch": 674} {"train_loss": -9.70531177520752, "global_step": 113271, "epoch": 674} {"train_loss": -9.421649932861328, "global_step": 113272, "epoch": 674} {"train_loss": -9.612225532531738, "global_step": 113273, "epoch": 674} {"train_loss": -9.458296775817871, "global_step": 113274, "epoch": 674} {"train_loss": -9.734439849853516, "global_step": 113275, "epoch": 674} {"train_loss": -9.537786483764648, "global_step": 113276, "epoch": 674} {"train_loss": -9.690572738647461, "global_step": 113277, "epoch": 674} {"train_loss": -9.599993705749512, "global_step": 113278, "epoch": 674} {"train_loss": -9.53430461883545, "global_step": 113279, "epoch": 674} {"train_loss": -9.791019439697266, "global_step": 113280, "epoch": 674} {"train_loss": -9.567573547363281, "global_step": 113281, "epoch": 674} {"train_loss": -9.515201568603516, "global_step": 113282, "epoch": 674} {"train_loss": -9.731254577636719, "global_step": 113283, "epoch": 674} {"train_loss": -9.69015884399414, "global_step": 113284, "epoch": 674} {"train_loss": -9.789408683776855, "global_step": 113285, "epoch": 674} {"train_loss": -9.94516372680664, "global_step": 113286, "epoch": 674} {"train_loss": -9.977925300598145, "global_step": 113287, "epoch": 674} {"train_loss": -9.780691146850586, "global_step": 113288, "epoch": 674} {"train_loss": -10.106636047363281, "global_step": 113289, "epoch": 674} {"train_loss": -10.167360305786133, "global_step": 113290, "epoch": 674} {"train_loss": -9.96337890625, "global_step": 113291, "epoch": 674} {"train_loss": -10.071927070617676, "global_step": 113292, "epoch": 674} {"train_loss": -10.153521537780762, "global_step": 113293, "epoch": 674} {"train_loss": -10.107036590576172, "global_step": 113294, "epoch": 674} {"train_loss": -9.959818840026855, "global_step": 113295, "epoch": 674} {"train_loss": -10.140199661254883, "global_step": 113296, "epoch": 674} {"train_loss": -9.618781089782715, "global_step": 113297, "epoch": 674} {"train_loss": -10.109098434448242, "global_step": 113298, "epoch": 674} {"train_loss": -9.776139259338379, "global_step": 113299, "epoch": 674} {"train_loss": -10.027417182922363, "global_step": 113300, "epoch": 674} {"train_loss": -10.023235321044922, "global_step": 113301, "epoch": 674} {"train_loss": -10.01367473602295, "global_step": 113302, "epoch": 674} {"train_loss": -10.086801528930664, "global_step": 113303, "epoch": 674} {"train_loss": -10.025364875793457, "global_step": 113304, "epoch": 674} {"train_loss": -10.137218475341797, "global_step": 113305, "epoch": 674} {"train_loss": -10.232036590576172, "global_step": 113306, "epoch": 674} {"train_loss": -10.034618377685547, "global_step": 113307, "epoch": 674} {"train_loss": -10.098094940185547, "global_step": 113308, "epoch": 674} {"train_loss": -9.9521484375, "global_step": 113309, "epoch": 674} {"train_loss": -10.06800651550293, "global_step": 113310, "epoch": 674} {"train_loss": -10.02321720123291, "global_step": 113311, "epoch": 674} {"train_loss": -10.020965576171875, "global_step": 113312, "epoch": 674} {"train_loss": -10.258453369140625, "global_step": 113313, "epoch": 674} {"train_loss": -9.871305465698242, "global_step": 113314, "epoch": 674} {"train_loss": -9.988612174987793, "global_step": 113315, "epoch": 674} {"train_loss": -10.01904582977295, "global_step": 113316, "epoch": 674} {"train_loss": -10.109259605407715, "global_step": 113317, "epoch": 674} {"train_loss": -10.146097183227539, "global_step": 113318, "epoch": 674} {"train_loss": -10.231427192687988, "global_step": 113319, "epoch": 674} {"train_loss": -10.23330307006836, "global_step": 113320, "epoch": 674} {"train_loss": -10.376819610595703, "global_step": 113321, "epoch": 674} {"train_loss": -10.385539054870605, "global_step": 113322, "epoch": 674} {"train_loss": -10.038991928100586, "global_step": 113323, "epoch": 674} {"train_loss": -10.111368179321289, "global_step": 113324, "epoch": 674} {"train_loss": -10.236808776855469, "global_step": 113325, "epoch": 674} {"train_loss": -10.206998825073242, "global_step": 113326, "epoch": 674} {"train_loss": -10.334365844726562, "global_step": 113327, "epoch": 674} {"train_loss": -10.15549087524414, "global_step": 113328, "epoch": 674} {"train_loss": -9.84465217590332, "global_step": 113329, "epoch": 674} {"train_loss": -9.828925132751465, "global_step": 113330, "epoch": 674} {"train_loss": -9.956989288330078, "global_step": 113331, "epoch": 674} {"train_loss": -9.617525100708008, "global_step": 113332, "epoch": 674} {"train_loss": -10.3251371383667, "global_step": 113333, "epoch": 674} {"train_loss": -9.562617301940918, "global_step": 113334, "epoch": 674} {"train_loss": -9.678328514099121, "global_step": 113335, "epoch": 674} {"train_loss": -9.689455032348633, "global_step": 113336, "epoch": 674} {"train_loss": -9.649368286132812, "global_step": 113337, "epoch": 674} {"train_loss": -9.736991882324219, "global_step": 113338, "epoch": 674} {"train_loss": -9.778963088989258, "global_step": 113339, "epoch": 674} {"train_loss": -10.000412940979004, "global_step": 113340, "epoch": 674} {"train_loss": -9.617594718933105, "global_step": 113341, "epoch": 674} {"train_loss": -9.973298072814941, "global_step": 113342, "epoch": 674} {"train_loss": -9.66951847076416, "global_step": 113343, "epoch": 674} {"train_loss": -9.926046371459961, "global_step": 113344, "epoch": 674} {"train_loss": -9.803390502929688, "global_step": 113345, "epoch": 674} {"train_loss": -9.583782196044922, "global_step": 113346, "epoch": 674} {"train_loss": -9.978616714477539, "global_step": 113347, "epoch": 674} {"train_loss": -9.803483963012695, "global_step": 113348, "epoch": 674} {"train_loss": -9.89856243133545, "global_step": 113349, "epoch": 674} {"train_loss": -9.632583618164062, "global_step": 113350, "epoch": 674} {"train_loss": -9.945633888244629, "global_step": 113351, "epoch": 674} {"train_loss": -9.451438903808594, "global_step": 113352, "epoch": 674} {"train_loss": -9.826343536376953, "global_step": 113353, "epoch": 674} {"train_loss": -9.582865715026855, "global_step": 113354, "epoch": 674} {"train_loss": -9.836523056030273, "global_step": 113355, "epoch": 674} {"train_loss": -9.642434120178223, "global_step": 113356, "epoch": 674} {"train_loss": -9.856359481811523, "global_step": 113357, "epoch": 674} {"train_loss": -9.490044593811035, "global_step": 113358, "epoch": 674} {"train_loss": -10.043140411376953, "global_step": 113359, "epoch": 674} {"train_loss": -9.743415832519531, "global_step": 113360, "epoch": 674} {"train_loss": -9.931577682495117, "global_step": 113361, "epoch": 674} {"train_loss": -9.840232849121094, "global_step": 113362, "epoch": 674} {"train_loss": -10.040313720703125, "global_step": 113363, "epoch": 674} {"train_loss": -9.591217041015625, "global_step": 113364, "epoch": 674} {"train_loss": -10.148453712463379, "global_step": 113365, "epoch": 674} {"train_loss": -9.96572494506836, "global_step": 113366, "epoch": 674} {"train_loss": -9.728507041931152, "global_step": 113367, "epoch": 674} {"train_loss": -9.932583808898926, "global_step": 113368, "epoch": 674} {"train_loss": -9.968310356140137, "global_step": 113369, "epoch": 674} {"train_loss": -10.141646385192871, "global_step": 113370, "epoch": 674} {"train_loss": -10.064352989196777, "global_step": 113371, "epoch": 674} {"train_loss": -9.956890106201172, "global_step": 113372, "epoch": 674} {"train_loss": -9.944111824035645, "global_step": 113373, "epoch": 674} {"train_loss": -9.953783988952637, "global_step": 113374, "epoch": 674} {"train_loss": -9.98520565032959, "global_step": 113375, "epoch": 674} {"train_loss": -9.993284225463867, "global_step": 113376, "epoch": 674} {"train_loss": -10.001968383789062, "global_step": 113377, "epoch": 674} {"train_loss": -10.014568328857422, "global_step": 113378, "epoch": 674} {"train_loss": -10.015472412109375, "global_step": 113379, "epoch": 674} {"train_loss": -10.15290355682373, "global_step": 113380, "epoch": 674} {"train_loss": -10.002857208251953, "global_step": 113381, "epoch": 674} {"train_loss": -10.38247013092041, "global_step": 113382, "epoch": 674} {"train_loss": -10.011463165283203, "global_step": 113383, "epoch": 674} {"train_loss": -10.061269760131836, "global_step": 113384, "epoch": 674} {"train_loss": -10.215983390808105, "global_step": 113385, "epoch": 674} {"train_loss": -10.033990859985352, "global_step": 113386, "epoch": 674} {"train_loss": -10.042337417602539, "global_step": 113387, "epoch": 674} {"train_loss": -10.096122741699219, "global_step": 113388, "epoch": 674} {"train_loss": -10.29270076751709, "global_step": 113389, "epoch": 674} {"train_loss": -10.29530143737793, "global_step": 113390, "epoch": 674} {"train_loss": -10.03917121887207, "global_step": 113391, "epoch": 674} {"train_loss": -10.259366989135742, "global_step": 113392, "epoch": 674} {"train_loss": -10.132132530212402, "global_step": 113393, "epoch": 674} {"train_loss": -10.049978256225586, "global_step": 113394, "epoch": 674} {"train_loss": -10.33414363861084, "global_step": 113395, "epoch": 674} {"train_loss": -9.963773727416992, "global_step": 113396, "epoch": 674} {"train_loss": -9.829389572143555, "global_step": 113397, "epoch": 674} {"train_loss": -10.272768020629883, "global_step": 113398, "epoch": 674} {"train_loss": -9.939914413860865, "global_step": 113399, "epoch": 674, "val_loss": 214223.921875} {"train_loss": -10.064002990722656, "global_step": 113400, "epoch": 675} {"train_loss": -10.298681259155273, "global_step": 113401, "epoch": 675} {"train_loss": -10.457128524780273, "global_step": 113402, "epoch": 675} {"train_loss": -9.996512413024902, "global_step": 113403, "epoch": 675} {"train_loss": -10.068601608276367, "global_step": 113404, "epoch": 675} {"train_loss": -10.245916366577148, "global_step": 113405, "epoch": 675} {"train_loss": -10.289457321166992, "global_step": 113406, "epoch": 675} {"train_loss": -9.876550674438477, "global_step": 113407, "epoch": 675} {"train_loss": -10.027772903442383, "global_step": 113408, "epoch": 675} {"train_loss": -10.040769577026367, "global_step": 113409, "epoch": 675} {"train_loss": -10.392192840576172, "global_step": 113410, "epoch": 675} {"train_loss": -9.870870590209961, "global_step": 113411, "epoch": 675} {"train_loss": -9.628727912902832, "global_step": 113412, "epoch": 675} {"train_loss": -9.705392837524414, "global_step": 113413, "epoch": 675} {"train_loss": -9.834661483764648, "global_step": 113414, "epoch": 675} {"train_loss": -10.122245788574219, "global_step": 113415, "epoch": 675} {"train_loss": -9.784428596496582, "global_step": 113416, "epoch": 675} {"train_loss": -10.029624938964844, "global_step": 113417, "epoch": 675} {"train_loss": -9.958635330200195, "global_step": 113418, "epoch": 675} {"train_loss": -10.076804161071777, "global_step": 113419, "epoch": 675} {"train_loss": -9.732845306396484, "global_step": 113420, "epoch": 675} {"train_loss": -9.93600845336914, "global_step": 113421, "epoch": 675} {"train_loss": -9.832466125488281, "global_step": 113422, "epoch": 675} {"train_loss": -9.916383743286133, "global_step": 113423, "epoch": 675} {"train_loss": -9.845451354980469, "global_step": 113424, "epoch": 675} {"train_loss": -9.852090835571289, "global_step": 113425, "epoch": 675} {"train_loss": -9.985706329345703, "global_step": 113426, "epoch": 675} {"train_loss": -10.120065689086914, "global_step": 113427, "epoch": 675} {"train_loss": -9.919979095458984, "global_step": 113428, "epoch": 675} {"train_loss": -9.723184585571289, "global_step": 113429, "epoch": 675} {"train_loss": -10.030492782592773, "global_step": 113430, "epoch": 675} {"train_loss": -10.069639205932617, "global_step": 113431, "epoch": 675} {"train_loss": -10.02083969116211, "global_step": 113432, "epoch": 675} {"train_loss": -10.133575439453125, "global_step": 113433, "epoch": 675} {"train_loss": -9.817391395568848, "global_step": 113434, "epoch": 675} {"train_loss": -10.187850952148438, "global_step": 113435, "epoch": 675} {"train_loss": -10.073482513427734, "global_step": 113436, "epoch": 675} {"train_loss": -10.101140975952148, "global_step": 113437, "epoch": 675} {"train_loss": -10.1233491897583, "global_step": 113438, "epoch": 675} {"train_loss": -10.234820365905762, "global_step": 113439, "epoch": 675} {"train_loss": -9.898741722106934, "global_step": 113440, "epoch": 675} {"train_loss": -10.161317825317383, "global_step": 113441, "epoch": 675} {"train_loss": -9.791610717773438, "global_step": 113442, "epoch": 675} {"train_loss": -10.065703392028809, "global_step": 113443, "epoch": 675} {"train_loss": -9.928409576416016, "global_step": 113444, "epoch": 675} {"train_loss": -10.00954532623291, "global_step": 113445, "epoch": 675} {"train_loss": -10.165582656860352, "global_step": 113446, "epoch": 675} {"train_loss": -10.177422523498535, "global_step": 113447, "epoch": 675} {"train_loss": -9.871781349182129, "global_step": 113448, "epoch": 675} {"train_loss": -9.86397933959961, "global_step": 113449, "epoch": 675} {"train_loss": -9.645528793334961, "global_step": 113450, "epoch": 675} {"train_loss": -10.155950546264648, "global_step": 113451, "epoch": 675} {"train_loss": -9.786796569824219, "global_step": 113452, "epoch": 675} {"train_loss": -10.13138198852539, "global_step": 113453, "epoch": 675} {"train_loss": -9.47004508972168, "global_step": 113454, "epoch": 675} {"train_loss": -9.873126983642578, "global_step": 113455, "epoch": 675} {"train_loss": -9.753225326538086, "global_step": 113456, "epoch": 675} {"train_loss": -10.118114471435547, "global_step": 113457, "epoch": 675} {"train_loss": -9.637126922607422, "global_step": 113458, "epoch": 675} {"train_loss": -10.187479019165039, "global_step": 113459, "epoch": 675} {"train_loss": -9.706319808959961, "global_step": 113460, "epoch": 675} {"train_loss": -9.818967819213867, "global_step": 113461, "epoch": 675} {"train_loss": -9.504924774169922, "global_step": 113462, "epoch": 675} {"train_loss": -9.974723815917969, "global_step": 113463, "epoch": 675} {"train_loss": -9.80852222442627, "global_step": 113464, "epoch": 675} {"train_loss": -10.119522094726562, "global_step": 113465, "epoch": 675} {"train_loss": -10.094002723693848, "global_step": 113466, "epoch": 675} {"train_loss": -10.030717849731445, "global_step": 113467, "epoch": 675} {"train_loss": -10.175710678100586, "global_step": 113468, "epoch": 675} {"train_loss": -10.004690170288086, "global_step": 113469, "epoch": 675} {"train_loss": -10.227388381958008, "global_step": 113470, "epoch": 675} {"train_loss": -9.898386001586914, "global_step": 113471, "epoch": 675} {"train_loss": -9.743124961853027, "global_step": 113472, "epoch": 675} {"train_loss": -9.763692855834961, "global_step": 113473, "epoch": 675} {"train_loss": -9.814783096313477, "global_step": 113474, "epoch": 675} {"train_loss": -9.663183212280273, "global_step": 113475, "epoch": 675} {"train_loss": -10.236717224121094, "global_step": 113476, "epoch": 675} {"train_loss": -9.942489624023438, "global_step": 113477, "epoch": 675} {"train_loss": -9.684455871582031, "global_step": 113478, "epoch": 675} {"train_loss": -10.07539176940918, "global_step": 113479, "epoch": 675} {"train_loss": -9.588418960571289, "global_step": 113480, "epoch": 675} {"train_loss": -10.040143966674805, "global_step": 113481, "epoch": 675} {"train_loss": -9.824349403381348, "global_step": 113482, "epoch": 675} {"train_loss": -9.844975471496582, "global_step": 113483, "epoch": 675} {"train_loss": -9.984039306640625, "global_step": 113484, "epoch": 675} {"train_loss": -9.972399711608887, "global_step": 113485, "epoch": 675} {"train_loss": -9.910818099975586, "global_step": 113486, "epoch": 675} {"train_loss": -10.00153636932373, "global_step": 113487, "epoch": 675} {"train_loss": -9.919957160949707, "global_step": 113488, "epoch": 675} {"train_loss": -9.823872566223145, "global_step": 113489, "epoch": 675} {"train_loss": -10.016834259033203, "global_step": 113490, "epoch": 675} {"train_loss": -9.902339935302734, "global_step": 113491, "epoch": 675} {"train_loss": -9.896728515625, "global_step": 113492, "epoch": 675} {"train_loss": -10.291234970092773, "global_step": 113493, "epoch": 675} {"train_loss": -9.927717208862305, "global_step": 113494, "epoch": 675} {"train_loss": -9.992995262145996, "global_step": 113495, "epoch": 675} {"train_loss": -10.047743797302246, "global_step": 113496, "epoch": 675} {"train_loss": -10.040143966674805, "global_step": 113497, "epoch": 675} {"train_loss": -10.012359619140625, "global_step": 113498, "epoch": 675} {"train_loss": -10.162925720214844, "global_step": 113499, "epoch": 675} {"train_loss": -9.95064926147461, "global_step": 113500, "epoch": 675} {"train_loss": -10.129653930664062, "global_step": 113501, "epoch": 675} {"train_loss": -10.145359992980957, "global_step": 113502, "epoch": 675} {"train_loss": -10.127243041992188, "global_step": 113503, "epoch": 675} {"train_loss": -9.984375953674316, "global_step": 113504, "epoch": 675} {"train_loss": -10.339892387390137, "global_step": 113505, "epoch": 675} {"train_loss": -10.053535461425781, "global_step": 113506, "epoch": 675} {"train_loss": -10.331745147705078, "global_step": 113507, "epoch": 675} {"train_loss": -10.323018074035645, "global_step": 113508, "epoch": 675} {"train_loss": -10.458954811096191, "global_step": 113509, "epoch": 675} {"train_loss": -10.07236385345459, "global_step": 113510, "epoch": 675} {"train_loss": -10.160978317260742, "global_step": 113511, "epoch": 675} {"train_loss": -9.967342376708984, "global_step": 113512, "epoch": 675} {"train_loss": -10.20803165435791, "global_step": 113513, "epoch": 675} {"train_loss": -10.202841758728027, "global_step": 113514, "epoch": 675} {"train_loss": -10.107669830322266, "global_step": 113515, "epoch": 675} {"train_loss": -10.071274757385254, "global_step": 113516, "epoch": 675} {"train_loss": -10.270730972290039, "global_step": 113517, "epoch": 675} {"train_loss": -10.061403274536133, "global_step": 113518, "epoch": 675} {"train_loss": -10.172989845275879, "global_step": 113519, "epoch": 675} {"train_loss": -10.296091079711914, "global_step": 113520, "epoch": 675} {"train_loss": -9.882079124450684, "global_step": 113521, "epoch": 675} {"train_loss": -9.651372909545898, "global_step": 113522, "epoch": 675} {"train_loss": -9.557589530944824, "global_step": 113523, "epoch": 675} {"train_loss": -10.203369140625, "global_step": 113524, "epoch": 675} {"train_loss": -9.68542766571045, "global_step": 113525, "epoch": 675} {"train_loss": -9.597569465637207, "global_step": 113526, "epoch": 675} {"train_loss": -10.107560157775879, "global_step": 113527, "epoch": 675} {"train_loss": -9.473340034484863, "global_step": 113528, "epoch": 675} {"train_loss": -9.773209571838379, "global_step": 113529, "epoch": 675} {"train_loss": -9.919870376586914, "global_step": 113530, "epoch": 675} {"train_loss": -9.526769638061523, "global_step": 113531, "epoch": 675} {"train_loss": -9.657393455505371, "global_step": 113532, "epoch": 675} {"train_loss": -9.044168472290039, "global_step": 113533, "epoch": 675} {"train_loss": -9.977447509765625, "global_step": 113534, "epoch": 675} {"train_loss": -9.522783279418945, "global_step": 113535, "epoch": 675} {"train_loss": -9.849273681640625, "global_step": 113536, "epoch": 675} {"train_loss": -9.766542434692383, "global_step": 113537, "epoch": 675} {"train_loss": -10.061726570129395, "global_step": 113538, "epoch": 675} {"train_loss": -9.810613632202148, "global_step": 113539, "epoch": 675} {"train_loss": -10.090551376342773, "global_step": 113540, "epoch": 675} {"train_loss": -9.73375415802002, "global_step": 113541, "epoch": 675} {"train_loss": -9.952679634094238, "global_step": 113542, "epoch": 675} {"train_loss": -9.734041213989258, "global_step": 113543, "epoch": 675} {"train_loss": -10.027076721191406, "global_step": 113544, "epoch": 675} {"train_loss": -9.912450790405273, "global_step": 113545, "epoch": 675} {"train_loss": -9.670053482055664, "global_step": 113546, "epoch": 675} {"train_loss": -10.193351745605469, "global_step": 113547, "epoch": 675} {"train_loss": -9.676154136657715, "global_step": 113548, "epoch": 675} {"train_loss": -9.801838874816895, "global_step": 113549, "epoch": 675} {"train_loss": -9.848740577697754, "global_step": 113550, "epoch": 675} {"train_loss": -10.154081344604492, "global_step": 113551, "epoch": 675} {"train_loss": -10.108573913574219, "global_step": 113552, "epoch": 675} {"train_loss": -10.083868026733398, "global_step": 113553, "epoch": 675} {"train_loss": -9.914251327514648, "global_step": 113554, "epoch": 675} {"train_loss": -9.942483901977539, "global_step": 113555, "epoch": 675} {"train_loss": -10.121800422668457, "global_step": 113556, "epoch": 675} {"train_loss": -9.810283660888672, "global_step": 113557, "epoch": 675} {"train_loss": -10.035542488098145, "global_step": 113558, "epoch": 675} {"train_loss": -10.000083923339844, "global_step": 113559, "epoch": 675} {"train_loss": -9.960247039794922, "global_step": 113560, "epoch": 675} {"train_loss": -9.900978088378906, "global_step": 113561, "epoch": 675} {"train_loss": -9.886222839355469, "global_step": 113562, "epoch": 675} {"train_loss": -10.00543212890625, "global_step": 113563, "epoch": 675} {"train_loss": -10.0154390335083, "global_step": 113564, "epoch": 675} {"train_loss": -9.820411682128906, "global_step": 113565, "epoch": 675} {"train_loss": -9.882814407348633, "global_step": 113566, "epoch": 675} {"train_loss": -9.960312519754682, "global_step": 113567, "epoch": 675, "val_loss": 213111.53125, "train_action_mse_error": 2.3029770851135254} {"train_loss": -9.65511417388916, "global_step": 113568, "epoch": 676} {"train_loss": -10.052213668823242, "global_step": 113569, "epoch": 676} {"train_loss": -9.690068244934082, "global_step": 113570, "epoch": 676} {"train_loss": -9.945898056030273, "global_step": 113571, "epoch": 676} {"train_loss": -9.550634384155273, "global_step": 113572, "epoch": 676} {"train_loss": -10.164894104003906, "global_step": 113573, "epoch": 676} {"train_loss": -9.069214820861816, "global_step": 113574, "epoch": 676} {"train_loss": -9.730369567871094, "global_step": 113575, "epoch": 676} {"train_loss": -9.336005210876465, "global_step": 113576, "epoch": 676} {"train_loss": -9.551054000854492, "global_step": 113577, "epoch": 676} {"train_loss": -9.355162620544434, "global_step": 113578, "epoch": 676} {"train_loss": -9.45728874206543, "global_step": 113579, "epoch": 676} {"train_loss": -9.917255401611328, "global_step": 113580, "epoch": 676} {"train_loss": -9.83509635925293, "global_step": 113581, "epoch": 676} {"train_loss": -9.911499977111816, "global_step": 113582, "epoch": 676} {"train_loss": -9.939054489135742, "global_step": 113583, "epoch": 676} {"train_loss": -9.869649887084961, "global_step": 113584, "epoch": 676} {"train_loss": -9.913423538208008, "global_step": 113585, "epoch": 676} {"train_loss": -9.940159797668457, "global_step": 113586, "epoch": 676} {"train_loss": -9.919873237609863, "global_step": 113587, "epoch": 676} {"train_loss": -9.804088592529297, "global_step": 113588, "epoch": 676} {"train_loss": -10.11252498626709, "global_step": 113589, "epoch": 676} {"train_loss": -9.938796043395996, "global_step": 113590, "epoch": 676} {"train_loss": -9.816173553466797, "global_step": 113591, "epoch": 676} {"train_loss": -10.166914939880371, "global_step": 113592, "epoch": 676} {"train_loss": -10.042632102966309, "global_step": 113593, "epoch": 676} {"train_loss": -9.89884090423584, "global_step": 113594, "epoch": 676} {"train_loss": -10.146114349365234, "global_step": 113595, "epoch": 676} {"train_loss": -10.21790885925293, "global_step": 113596, "epoch": 676} {"train_loss": -10.027504920959473, "global_step": 113597, "epoch": 676} {"train_loss": -10.071346282958984, "global_step": 113598, "epoch": 676} {"train_loss": -10.069320678710938, "global_step": 113599, "epoch": 676} {"train_loss": -9.996696472167969, "global_step": 113600, "epoch": 676} {"train_loss": -10.265727996826172, "global_step": 113601, "epoch": 676} {"train_loss": -10.251049041748047, "global_step": 113602, "epoch": 676} {"train_loss": -10.20959758758545, "global_step": 113603, "epoch": 676} {"train_loss": -10.447192192077637, "global_step": 113604, "epoch": 676} {"train_loss": -10.062013626098633, "global_step": 113605, "epoch": 676} {"train_loss": -10.29823112487793, "global_step": 113606, "epoch": 676} {"train_loss": -10.194421768188477, "global_step": 113607, "epoch": 676} {"train_loss": -10.267251014709473, "global_step": 113608, "epoch": 676} {"train_loss": -10.249992370605469, "global_step": 113609, "epoch": 676} {"train_loss": -10.144697189331055, "global_step": 113610, "epoch": 676} {"train_loss": -9.842120170593262, "global_step": 113611, "epoch": 676} {"train_loss": -9.819585800170898, "global_step": 113612, "epoch": 676} {"train_loss": -10.284801483154297, "global_step": 113613, "epoch": 676} {"train_loss": -9.751235961914062, "global_step": 113614, "epoch": 676} {"train_loss": -9.93313217163086, "global_step": 113615, "epoch": 676} {"train_loss": -9.618332862854004, "global_step": 113616, "epoch": 676} {"train_loss": -10.088752746582031, "global_step": 113617, "epoch": 676} {"train_loss": -9.737104415893555, "global_step": 113618, "epoch": 676} {"train_loss": -9.84450912475586, "global_step": 113619, "epoch": 676} {"train_loss": -10.308296203613281, "global_step": 113620, "epoch": 676} {"train_loss": -9.819726943969727, "global_step": 113621, "epoch": 676} {"train_loss": -9.940741539001465, "global_step": 113622, "epoch": 676} {"train_loss": -9.677207946777344, "global_step": 113623, "epoch": 676} {"train_loss": -9.810115814208984, "global_step": 113624, "epoch": 676} {"train_loss": -9.988832473754883, "global_step": 113625, "epoch": 676} {"train_loss": -10.047435760498047, "global_step": 113626, "epoch": 676} {"train_loss": -9.86674690246582, "global_step": 113627, "epoch": 676} {"train_loss": -9.85976791381836, "global_step": 113628, "epoch": 676} {"train_loss": -10.020849227905273, "global_step": 113629, "epoch": 676} {"train_loss": -9.679252624511719, "global_step": 113630, "epoch": 676} {"train_loss": -10.215709686279297, "global_step": 113631, "epoch": 676} {"train_loss": -9.941557884216309, "global_step": 113632, "epoch": 676} {"train_loss": -10.124582290649414, "global_step": 113633, "epoch": 676} {"train_loss": -10.194808959960938, "global_step": 113634, "epoch": 676} {"train_loss": -9.565741539001465, "global_step": 113635, "epoch": 676} {"train_loss": -10.138809204101562, "global_step": 113636, "epoch": 676} {"train_loss": -9.880840301513672, "global_step": 113637, "epoch": 676} {"train_loss": -10.095293998718262, "global_step": 113638, "epoch": 676} {"train_loss": -10.136099815368652, "global_step": 113639, "epoch": 676} {"train_loss": -10.085847854614258, "global_step": 113640, "epoch": 676} {"train_loss": -10.276582717895508, "global_step": 113641, "epoch": 676} {"train_loss": -10.06601333618164, "global_step": 113642, "epoch": 676} {"train_loss": -10.105623245239258, "global_step": 113643, "epoch": 676} {"train_loss": -9.802082061767578, "global_step": 113644, "epoch": 676} {"train_loss": -10.246545791625977, "global_step": 113645, "epoch": 676} {"train_loss": -10.00979995727539, "global_step": 113646, "epoch": 676} {"train_loss": -10.08096694946289, "global_step": 113647, "epoch": 676} {"train_loss": -10.193208694458008, "global_step": 113648, "epoch": 676} {"train_loss": -10.093358993530273, "global_step": 113649, "epoch": 676} {"train_loss": -10.193534851074219, "global_step": 113650, "epoch": 676} {"train_loss": -10.314546585083008, "global_step": 113651, "epoch": 676} {"train_loss": -10.15839958190918, "global_step": 113652, "epoch": 676} {"train_loss": -10.274883270263672, "global_step": 113653, "epoch": 676} {"train_loss": -9.879864692687988, "global_step": 113654, "epoch": 676} {"train_loss": -10.04340934753418, "global_step": 113655, "epoch": 676} {"train_loss": -10.08775806427002, "global_step": 113656, "epoch": 676} {"train_loss": -10.111213684082031, "global_step": 113657, "epoch": 676} {"train_loss": -10.111686706542969, "global_step": 113658, "epoch": 676} {"train_loss": -9.83689022064209, "global_step": 113659, "epoch": 676} {"train_loss": -10.114957809448242, "global_step": 113660, "epoch": 676} {"train_loss": -10.045001983642578, "global_step": 113661, "epoch": 676} {"train_loss": -9.860312461853027, "global_step": 113662, "epoch": 676} {"train_loss": -9.678766250610352, "global_step": 113663, "epoch": 676} {"train_loss": -9.325141906738281, "global_step": 113664, "epoch": 676} {"train_loss": -10.033578872680664, "global_step": 113665, "epoch": 676} {"train_loss": -9.967826843261719, "global_step": 113666, "epoch": 676} {"train_loss": -10.128780364990234, "global_step": 113667, "epoch": 676} {"train_loss": -10.334638595581055, "global_step": 113668, "epoch": 676} {"train_loss": -10.14179801940918, "global_step": 113669, "epoch": 676} {"train_loss": -10.056469917297363, "global_step": 113670, "epoch": 676} {"train_loss": -10.080621719360352, "global_step": 113671, "epoch": 676} {"train_loss": -10.179224014282227, "global_step": 113672, "epoch": 676} {"train_loss": -10.036510467529297, "global_step": 113673, "epoch": 676} {"train_loss": -10.098417282104492, "global_step": 113674, "epoch": 676} {"train_loss": -10.323554992675781, "global_step": 113675, "epoch": 676} {"train_loss": -10.336468696594238, "global_step": 113676, "epoch": 676} {"train_loss": -10.33944320678711, "global_step": 113677, "epoch": 676} {"train_loss": -9.978939056396484, "global_step": 113678, "epoch": 676} {"train_loss": -10.364046096801758, "global_step": 113679, "epoch": 676} {"train_loss": -9.897591590881348, "global_step": 113680, "epoch": 676} {"train_loss": -10.026402473449707, "global_step": 113681, "epoch": 676} {"train_loss": -10.146866798400879, "global_step": 113682, "epoch": 676} {"train_loss": -9.838845252990723, "global_step": 113683, "epoch": 676} {"train_loss": -10.111854553222656, "global_step": 113684, "epoch": 676} {"train_loss": -9.759506225585938, "global_step": 113685, "epoch": 676} {"train_loss": -9.902153015136719, "global_step": 113686, "epoch": 676} {"train_loss": -10.17641544342041, "global_step": 113687, "epoch": 676} {"train_loss": -10.028406143188477, "global_step": 113688, "epoch": 676} {"train_loss": -9.811760902404785, "global_step": 113689, "epoch": 676} {"train_loss": -9.641286849975586, "global_step": 113690, "epoch": 676} {"train_loss": -10.265962600708008, "global_step": 113691, "epoch": 676} {"train_loss": -9.857610702514648, "global_step": 113692, "epoch": 676} {"train_loss": -10.057470321655273, "global_step": 113693, "epoch": 676} {"train_loss": -10.284586906433105, "global_step": 113694, "epoch": 676} {"train_loss": -9.654607772827148, "global_step": 113695, "epoch": 676} {"train_loss": -9.850648880004883, "global_step": 113696, "epoch": 676} {"train_loss": -10.061145782470703, "global_step": 113697, "epoch": 676} {"train_loss": -10.051946640014648, "global_step": 113698, "epoch": 676} {"train_loss": -10.189743041992188, "global_step": 113699, "epoch": 676} {"train_loss": -10.293524742126465, "global_step": 113700, "epoch": 676} {"train_loss": -10.244760513305664, "global_step": 113701, "epoch": 676} {"train_loss": -10.318609237670898, "global_step": 113702, "epoch": 676} {"train_loss": -10.271854400634766, "global_step": 113703, "epoch": 676} {"train_loss": -10.385737419128418, "global_step": 113704, "epoch": 676} {"train_loss": -10.142871856689453, "global_step": 113705, "epoch": 676} {"train_loss": -10.301576614379883, "global_step": 113706, "epoch": 676} {"train_loss": -10.088778495788574, "global_step": 113707, "epoch": 676} {"train_loss": -10.278665542602539, "global_step": 113708, "epoch": 676} {"train_loss": -10.183734893798828, "global_step": 113709, "epoch": 676} {"train_loss": -10.085248947143555, "global_step": 113710, "epoch": 676} {"train_loss": -10.262467384338379, "global_step": 113711, "epoch": 676} {"train_loss": -10.257288932800293, "global_step": 113712, "epoch": 676} {"train_loss": -10.360517501831055, "global_step": 113713, "epoch": 676} {"train_loss": -10.177949905395508, "global_step": 113714, "epoch": 676} {"train_loss": -10.344636917114258, "global_step": 113715, "epoch": 676} {"train_loss": -10.300237655639648, "global_step": 113716, "epoch": 676} {"train_loss": -9.985941886901855, "global_step": 113717, "epoch": 676} {"train_loss": -10.100967407226562, "global_step": 113718, "epoch": 676} {"train_loss": -10.076345443725586, "global_step": 113719, "epoch": 676} {"train_loss": -9.910476684570312, "global_step": 113720, "epoch": 676} {"train_loss": -10.162755966186523, "global_step": 113721, "epoch": 676} {"train_loss": -10.240135192871094, "global_step": 113722, "epoch": 676} {"train_loss": -10.019752502441406, "global_step": 113723, "epoch": 676} {"train_loss": -10.211560249328613, "global_step": 113724, "epoch": 676} {"train_loss": -9.946531295776367, "global_step": 113725, "epoch": 676} {"train_loss": -9.838173866271973, "global_step": 113726, "epoch": 676} {"train_loss": -10.175718307495117, "global_step": 113727, "epoch": 676} {"train_loss": -9.782881736755371, "global_step": 113728, "epoch": 676} {"train_loss": -9.843746185302734, "global_step": 113729, "epoch": 676} {"train_loss": -10.105245590209961, "global_step": 113730, "epoch": 676} {"train_loss": -9.926519393920898, "global_step": 113731, "epoch": 676} {"train_loss": -10.16472053527832, "global_step": 113732, "epoch": 676} {"train_loss": -10.287822723388672, "global_step": 113733, "epoch": 676} {"train_loss": -9.996939659118652, "global_step": 113734, "epoch": 676} {"train_loss": -10.024171727044243, "global_step": 113735, "epoch": 676, "val_loss": 214792.953125} {"train_loss": -10.229080200195312, "global_step": 113736, "epoch": 677} {"train_loss": -9.949447631835938, "global_step": 113737, "epoch": 677} {"train_loss": -10.077359199523926, "global_step": 113738, "epoch": 677} {"train_loss": -10.212234497070312, "global_step": 113739, "epoch": 677} {"train_loss": -10.170428276062012, "global_step": 113740, "epoch": 677} {"train_loss": -9.893808364868164, "global_step": 113741, "epoch": 677} {"train_loss": -10.188041687011719, "global_step": 113742, "epoch": 677} {"train_loss": -10.064949035644531, "global_step": 113743, "epoch": 677} {"train_loss": -9.854551315307617, "global_step": 113744, "epoch": 677} {"train_loss": -10.175395965576172, "global_step": 113745, "epoch": 677} {"train_loss": -9.93354606628418, "global_step": 113746, "epoch": 677} {"train_loss": -9.577646255493164, "global_step": 113747, "epoch": 677} {"train_loss": -10.001346588134766, "global_step": 113748, "epoch": 677} {"train_loss": -9.598167419433594, "global_step": 113749, "epoch": 677} {"train_loss": -10.057136535644531, "global_step": 113750, "epoch": 677} {"train_loss": -9.461906433105469, "global_step": 113751, "epoch": 677} {"train_loss": -9.761112213134766, "global_step": 113752, "epoch": 677} {"train_loss": -9.075531959533691, "global_step": 113753, "epoch": 677} {"train_loss": -9.422317504882812, "global_step": 113754, "epoch": 677} {"train_loss": -9.689011573791504, "global_step": 113755, "epoch": 677} {"train_loss": -9.764373779296875, "global_step": 113756, "epoch": 677} {"train_loss": -10.003698348999023, "global_step": 113757, "epoch": 677} {"train_loss": -9.922630310058594, "global_step": 113758, "epoch": 677} {"train_loss": -9.551090240478516, "global_step": 113759, "epoch": 677} {"train_loss": -10.010246276855469, "global_step": 113760, "epoch": 677} {"train_loss": -9.64523696899414, "global_step": 113761, "epoch": 677} {"train_loss": -9.858907699584961, "global_step": 113762, "epoch": 677} {"train_loss": -9.729452133178711, "global_step": 113763, "epoch": 677} {"train_loss": -9.799461364746094, "global_step": 113764, "epoch": 677} {"train_loss": -9.668804168701172, "global_step": 113765, "epoch": 677} {"train_loss": -9.911094665527344, "global_step": 113766, "epoch": 677} {"train_loss": -9.672956466674805, "global_step": 113767, "epoch": 677} {"train_loss": -9.77256965637207, "global_step": 113768, "epoch": 677} {"train_loss": -9.620436668395996, "global_step": 113769, "epoch": 677} {"train_loss": -9.620075225830078, "global_step": 113770, "epoch": 677} {"train_loss": -10.043510437011719, "global_step": 113771, "epoch": 677} {"train_loss": -9.746031761169434, "global_step": 113772, "epoch": 677} {"train_loss": -10.11379337310791, "global_step": 113773, "epoch": 677} {"train_loss": -10.065450668334961, "global_step": 113774, "epoch": 677} {"train_loss": -9.917609214782715, "global_step": 113775, "epoch": 677} {"train_loss": -10.222267150878906, "global_step": 113776, "epoch": 677} {"train_loss": -9.850760459899902, "global_step": 113777, "epoch": 677} {"train_loss": -10.226348876953125, "global_step": 113778, "epoch": 677} {"train_loss": -10.079605102539062, "global_step": 113779, "epoch": 677} {"train_loss": -10.00139045715332, "global_step": 113780, "epoch": 677} {"train_loss": -10.090347290039062, "global_step": 113781, "epoch": 677} {"train_loss": -10.140169143676758, "global_step": 113782, "epoch": 677} {"train_loss": -10.042224884033203, "global_step": 113783, "epoch": 677} {"train_loss": -10.18875503540039, "global_step": 113784, "epoch": 677} {"train_loss": -10.087825775146484, "global_step": 113785, "epoch": 677} {"train_loss": -10.097620010375977, "global_step": 113786, "epoch": 677} {"train_loss": -10.273578643798828, "global_step": 113787, "epoch": 677} {"train_loss": -10.332620620727539, "global_step": 113788, "epoch": 677} {"train_loss": -10.538936614990234, "global_step": 113789, "epoch": 677} {"train_loss": -10.20553207397461, "global_step": 113790, "epoch": 677} {"train_loss": -10.221275329589844, "global_step": 113791, "epoch": 677} {"train_loss": -10.320358276367188, "global_step": 113792, "epoch": 677} {"train_loss": -10.178385734558105, "global_step": 113793, "epoch": 677} {"train_loss": -10.06370735168457, "global_step": 113794, "epoch": 677} {"train_loss": -10.327156066894531, "global_step": 113795, "epoch": 677} {"train_loss": -10.216642379760742, "global_step": 113796, "epoch": 677} {"train_loss": -10.293351173400879, "global_step": 113797, "epoch": 677} {"train_loss": -10.22113037109375, "global_step": 113798, "epoch": 677} {"train_loss": -10.45012092590332, "global_step": 113799, "epoch": 677} {"train_loss": -10.348711013793945, "global_step": 113800, "epoch": 677} {"train_loss": -10.425102233886719, "global_step": 113801, "epoch": 677} {"train_loss": -10.156912803649902, "global_step": 113802, "epoch": 677} {"train_loss": -10.346749305725098, "global_step": 113803, "epoch": 677} {"train_loss": -10.342448234558105, "global_step": 113804, "epoch": 677} {"train_loss": -10.316203117370605, "global_step": 113805, "epoch": 677} {"train_loss": -10.102216720581055, "global_step": 113806, "epoch": 677} {"train_loss": -10.152901649475098, "global_step": 113807, "epoch": 677} {"train_loss": -10.091571807861328, "global_step": 113808, "epoch": 677} {"train_loss": -9.664199829101562, "global_step": 113809, "epoch": 677} {"train_loss": -9.767471313476562, "global_step": 113810, "epoch": 677} {"train_loss": -9.951546669006348, "global_step": 113811, "epoch": 677} {"train_loss": -9.228545188903809, "global_step": 113812, "epoch": 677} {"train_loss": -9.598522186279297, "global_step": 113813, "epoch": 677} {"train_loss": -9.980539321899414, "global_step": 113814, "epoch": 677} {"train_loss": -10.101518630981445, "global_step": 113815, "epoch": 677} {"train_loss": -10.243316650390625, "global_step": 113816, "epoch": 677} {"train_loss": -9.9789457321167, "global_step": 113817, "epoch": 677} {"train_loss": -10.11744213104248, "global_step": 113818, "epoch": 677} {"train_loss": -10.147473335266113, "global_step": 113819, "epoch": 677} {"train_loss": -10.194936752319336, "global_step": 113820, "epoch": 677} {"train_loss": -10.103496551513672, "global_step": 113821, "epoch": 677} {"train_loss": -10.203054428100586, "global_step": 113822, "epoch": 677} {"train_loss": -10.189188003540039, "global_step": 113823, "epoch": 677} {"train_loss": -10.086536407470703, "global_step": 113824, "epoch": 677} {"train_loss": -10.057064056396484, "global_step": 113825, "epoch": 677} {"train_loss": -10.140152931213379, "global_step": 113826, "epoch": 677} {"train_loss": -10.09469985961914, "global_step": 113827, "epoch": 677} {"train_loss": -10.117181777954102, "global_step": 113828, "epoch": 677} {"train_loss": -10.198966979980469, "global_step": 113829, "epoch": 677} {"train_loss": -9.916833877563477, "global_step": 113830, "epoch": 677} {"train_loss": -9.944246292114258, "global_step": 113831, "epoch": 677} {"train_loss": -9.900825500488281, "global_step": 113832, "epoch": 677} {"train_loss": -9.774441719055176, "global_step": 113833, "epoch": 677} {"train_loss": -9.6220121383667, "global_step": 113834, "epoch": 677} {"train_loss": -10.360366821289062, "global_step": 113835, "epoch": 677} {"train_loss": -9.89474105834961, "global_step": 113836, "epoch": 677} {"train_loss": -10.095340728759766, "global_step": 113837, "epoch": 677} {"train_loss": -9.940905570983887, "global_step": 113838, "epoch": 677} {"train_loss": -10.37024211883545, "global_step": 113839, "epoch": 677} {"train_loss": -10.054389953613281, "global_step": 113840, "epoch": 677} {"train_loss": -10.082368850708008, "global_step": 113841, "epoch": 677} {"train_loss": -10.02117919921875, "global_step": 113842, "epoch": 677} {"train_loss": -10.245437622070312, "global_step": 113843, "epoch": 677} {"train_loss": -9.81772232055664, "global_step": 113844, "epoch": 677} {"train_loss": -10.1826810836792, "global_step": 113845, "epoch": 677} {"train_loss": -9.866918563842773, "global_step": 113846, "epoch": 677} {"train_loss": -9.558734893798828, "global_step": 113847, "epoch": 677} {"train_loss": -9.574467658996582, "global_step": 113848, "epoch": 677} {"train_loss": -9.617547988891602, "global_step": 113849, "epoch": 677} {"train_loss": -10.043113708496094, "global_step": 113850, "epoch": 677} {"train_loss": -9.460508346557617, "global_step": 113851, "epoch": 677} {"train_loss": -9.962017059326172, "global_step": 113852, "epoch": 677} {"train_loss": -9.566106796264648, "global_step": 113853, "epoch": 677} {"train_loss": -10.122064590454102, "global_step": 113854, "epoch": 677} {"train_loss": -9.595304489135742, "global_step": 113855, "epoch": 677} {"train_loss": -9.998361587524414, "global_step": 113856, "epoch": 677} {"train_loss": -9.739872932434082, "global_step": 113857, "epoch": 677} {"train_loss": -10.04958438873291, "global_step": 113858, "epoch": 677} {"train_loss": -9.782188415527344, "global_step": 113859, "epoch": 677} {"train_loss": -9.92574405670166, "global_step": 113860, "epoch": 677} {"train_loss": -10.008831024169922, "global_step": 113861, "epoch": 677} {"train_loss": -9.64901351928711, "global_step": 113862, "epoch": 677} {"train_loss": -9.905770301818848, "global_step": 113863, "epoch": 677} {"train_loss": -10.02381706237793, "global_step": 113864, "epoch": 677} {"train_loss": -9.836153984069824, "global_step": 113865, "epoch": 677} {"train_loss": -9.895889282226562, "global_step": 113866, "epoch": 677} {"train_loss": -10.005775451660156, "global_step": 113867, "epoch": 677} {"train_loss": -10.04586410522461, "global_step": 113868, "epoch": 677} {"train_loss": -9.724238395690918, "global_step": 113869, "epoch": 677} {"train_loss": -10.07223129272461, "global_step": 113870, "epoch": 677} {"train_loss": -9.834157943725586, "global_step": 113871, "epoch": 677} {"train_loss": -10.19499397277832, "global_step": 113872, "epoch": 677} {"train_loss": -9.96004581451416, "global_step": 113873, "epoch": 677} {"train_loss": -9.959281921386719, "global_step": 113874, "epoch": 677} {"train_loss": -10.086631774902344, "global_step": 113875, "epoch": 677} {"train_loss": -10.150411605834961, "global_step": 113876, "epoch": 677} {"train_loss": -9.835836410522461, "global_step": 113877, "epoch": 677} {"train_loss": -10.196586608886719, "global_step": 113878, "epoch": 677} {"train_loss": -10.08226203918457, "global_step": 113879, "epoch": 677} {"train_loss": -10.14710807800293, "global_step": 113880, "epoch": 677} {"train_loss": -10.145087242126465, "global_step": 113881, "epoch": 677} {"train_loss": -10.138333320617676, "global_step": 113882, "epoch": 677} {"train_loss": -9.852899551391602, "global_step": 113883, "epoch": 677} {"train_loss": -9.927526473999023, "global_step": 113884, "epoch": 677} {"train_loss": -10.140501022338867, "global_step": 113885, "epoch": 677} {"train_loss": -9.913784980773926, "global_step": 113886, "epoch": 677} {"train_loss": -10.168414115905762, "global_step": 113887, "epoch": 677} {"train_loss": -10.189970016479492, "global_step": 113888, "epoch": 677} {"train_loss": -10.060968399047852, "global_step": 113889, "epoch": 677} {"train_loss": -10.368888854980469, "global_step": 113890, "epoch": 677} {"train_loss": -10.216495513916016, "global_step": 113891, "epoch": 677} {"train_loss": -10.20145034790039, "global_step": 113892, "epoch": 677} {"train_loss": -10.231849670410156, "global_step": 113893, "epoch": 677} {"train_loss": -10.103001594543457, "global_step": 113894, "epoch": 677} {"train_loss": -10.167299270629883, "global_step": 113895, "epoch": 677} {"train_loss": -9.766288757324219, "global_step": 113896, "epoch": 677} {"train_loss": -9.893439292907715, "global_step": 113897, "epoch": 677} {"train_loss": -10.307090759277344, "global_step": 113898, "epoch": 677} {"train_loss": -10.112147331237793, "global_step": 113899, "epoch": 677} {"train_loss": -9.876002311706543, "global_step": 113900, "epoch": 677} {"train_loss": -10.194183349609375, "global_step": 113901, "epoch": 677} {"train_loss": -10.287531852722168, "global_step": 113902, "epoch": 677} {"train_loss": -10.001359786306109, "global_step": 113903, "epoch": 677, "val_loss": 210664.28125} {"train_loss": -10.184545516967773, "global_step": 113904, "epoch": 678} {"train_loss": -10.030706405639648, "global_step": 113905, "epoch": 678} {"train_loss": -10.054224014282227, "global_step": 113906, "epoch": 678} {"train_loss": -9.69782829284668, "global_step": 113907, "epoch": 678} {"train_loss": -9.98394775390625, "global_step": 113908, "epoch": 678} {"train_loss": -9.967483520507812, "global_step": 113909, "epoch": 678} {"train_loss": -9.145153045654297, "global_step": 113910, "epoch": 678} {"train_loss": -9.906623840332031, "global_step": 113911, "epoch": 678} {"train_loss": -9.39444351196289, "global_step": 113912, "epoch": 678} {"train_loss": -9.491521835327148, "global_step": 113913, "epoch": 678} {"train_loss": -9.358482360839844, "global_step": 113914, "epoch": 678} {"train_loss": -8.860795021057129, "global_step": 113915, "epoch": 678} {"train_loss": -9.703001022338867, "global_step": 113916, "epoch": 678} {"train_loss": -9.100893020629883, "global_step": 113917, "epoch": 678} {"train_loss": -9.816049575805664, "global_step": 113918, "epoch": 678} {"train_loss": -8.599583625793457, "global_step": 113919, "epoch": 678} {"train_loss": -9.57086181640625, "global_step": 113920, "epoch": 678} {"train_loss": -9.21139907836914, "global_step": 113921, "epoch": 678} {"train_loss": -9.687158584594727, "global_step": 113922, "epoch": 678} {"train_loss": -9.364067077636719, "global_step": 113923, "epoch": 678} {"train_loss": -9.236356735229492, "global_step": 113924, "epoch": 678} {"train_loss": -9.449312210083008, "global_step": 113925, "epoch": 678} {"train_loss": -9.174995422363281, "global_step": 113926, "epoch": 678} {"train_loss": -9.85899543762207, "global_step": 113927, "epoch": 678} {"train_loss": -9.64639663696289, "global_step": 113928, "epoch": 678} {"train_loss": -9.594911575317383, "global_step": 113929, "epoch": 678} {"train_loss": -9.675496101379395, "global_step": 113930, "epoch": 678} {"train_loss": -9.79444694519043, "global_step": 113931, "epoch": 678} {"train_loss": -9.511273384094238, "global_step": 113932, "epoch": 678} {"train_loss": -9.956387519836426, "global_step": 113933, "epoch": 678} {"train_loss": -9.388750076293945, "global_step": 113934, "epoch": 678} {"train_loss": -9.804084777832031, "global_step": 113935, "epoch": 678} {"train_loss": -9.714510917663574, "global_step": 113936, "epoch": 678} {"train_loss": -9.783110618591309, "global_step": 113937, "epoch": 678} {"train_loss": -9.935935974121094, "global_step": 113938, "epoch": 678} {"train_loss": -9.8019437789917, "global_step": 113939, "epoch": 678} {"train_loss": -9.905582427978516, "global_step": 113940, "epoch": 678} {"train_loss": -9.671335220336914, "global_step": 113941, "epoch": 678} {"train_loss": -9.776010513305664, "global_step": 113942, "epoch": 678} {"train_loss": -10.030021667480469, "global_step": 113943, "epoch": 678} {"train_loss": -9.745051383972168, "global_step": 113944, "epoch": 678} {"train_loss": -9.852235794067383, "global_step": 113945, "epoch": 678} {"train_loss": -10.052799224853516, "global_step": 113946, "epoch": 678} {"train_loss": -9.908550262451172, "global_step": 113947, "epoch": 678} {"train_loss": -10.111459732055664, "global_step": 113948, "epoch": 678} {"train_loss": -10.065947532653809, "global_step": 113949, "epoch": 678} {"train_loss": -10.25133228302002, "global_step": 113950, "epoch": 678} {"train_loss": -9.95069408416748, "global_step": 113951, "epoch": 678} {"train_loss": -9.95911979675293, "global_step": 113952, "epoch": 678} {"train_loss": -10.296124458312988, "global_step": 113953, "epoch": 678} {"train_loss": -9.958150863647461, "global_step": 113954, "epoch": 678} {"train_loss": -10.225976943969727, "global_step": 113955, "epoch": 678} {"train_loss": -9.870706558227539, "global_step": 113956, "epoch": 678} {"train_loss": -10.148247718811035, "global_step": 113957, "epoch": 678} {"train_loss": -10.399904251098633, "global_step": 113958, "epoch": 678} {"train_loss": -10.232813835144043, "global_step": 113959, "epoch": 678} {"train_loss": -10.193053245544434, "global_step": 113960, "epoch": 678} {"train_loss": -10.36857795715332, "global_step": 113961, "epoch": 678} {"train_loss": -10.168536186218262, "global_step": 113962, "epoch": 678} {"train_loss": -10.152486801147461, "global_step": 113963, "epoch": 678} {"train_loss": -10.193161010742188, "global_step": 113964, "epoch": 678} {"train_loss": -10.227922439575195, "global_step": 113965, "epoch": 678} {"train_loss": -10.456055641174316, "global_step": 113966, "epoch": 678} {"train_loss": -10.297323226928711, "global_step": 113967, "epoch": 678} {"train_loss": -10.377238273620605, "global_step": 113968, "epoch": 678} {"train_loss": -10.464781761169434, "global_step": 113969, "epoch": 678} {"train_loss": -10.294672966003418, "global_step": 113970, "epoch": 678} {"train_loss": -10.093062400817871, "global_step": 113971, "epoch": 678} {"train_loss": -10.055280685424805, "global_step": 113972, "epoch": 678} {"train_loss": -10.133338928222656, "global_step": 113973, "epoch": 678} {"train_loss": -9.374679565429688, "global_step": 113974, "epoch": 678} {"train_loss": -9.026374816894531, "global_step": 113975, "epoch": 678} {"train_loss": -10.006769180297852, "global_step": 113976, "epoch": 678} {"train_loss": -8.878181457519531, "global_step": 113977, "epoch": 678} {"train_loss": -9.76187515258789, "global_step": 113978, "epoch": 678} {"train_loss": -9.665122985839844, "global_step": 113979, "epoch": 678} {"train_loss": -9.562302589416504, "global_step": 113980, "epoch": 678} {"train_loss": -9.850414276123047, "global_step": 113981, "epoch": 678} {"train_loss": -9.501861572265625, "global_step": 113982, "epoch": 678} {"train_loss": -9.80968952178955, "global_step": 113983, "epoch": 678} {"train_loss": -9.494087219238281, "global_step": 113984, "epoch": 678} {"train_loss": -9.958639144897461, "global_step": 113985, "epoch": 678} {"train_loss": -9.974447250366211, "global_step": 113986, "epoch": 678} {"train_loss": -9.916618347167969, "global_step": 113987, "epoch": 678} {"train_loss": -9.274405479431152, "global_step": 113988, "epoch": 678} {"train_loss": -9.72437572479248, "global_step": 113989, "epoch": 678} {"train_loss": -9.261980056762695, "global_step": 113990, "epoch": 678} {"train_loss": -9.498842239379883, "global_step": 113991, "epoch": 678} {"train_loss": -9.339826583862305, "global_step": 113992, "epoch": 678} {"train_loss": -9.230684280395508, "global_step": 113993, "epoch": 678} {"train_loss": -8.757883071899414, "global_step": 113994, "epoch": 678} {"train_loss": -9.899055480957031, "global_step": 113995, "epoch": 678} {"train_loss": -9.311373710632324, "global_step": 113996, "epoch": 678} {"train_loss": -9.226667404174805, "global_step": 113997, "epoch": 678} {"train_loss": -9.581001281738281, "global_step": 113998, "epoch": 678} {"train_loss": -9.210064888000488, "global_step": 113999, "epoch": 678} {"train_loss": -9.390069007873535, "global_step": 114000, "epoch": 678} {"train_loss": -9.407327651977539, "global_step": 114001, "epoch": 678} {"train_loss": -9.433441162109375, "global_step": 114002, "epoch": 678} {"train_loss": -9.586090087890625, "global_step": 114003, "epoch": 678} {"train_loss": -9.39179801940918, "global_step": 114004, "epoch": 678} {"train_loss": -9.364655494689941, "global_step": 114005, "epoch": 678} {"train_loss": -10.019994735717773, "global_step": 114006, "epoch": 678} {"train_loss": -9.645502090454102, "global_step": 114007, "epoch": 678} {"train_loss": -9.675973892211914, "global_step": 114008, "epoch": 678} {"train_loss": -9.786076545715332, "global_step": 114009, "epoch": 678} {"train_loss": -9.532133102416992, "global_step": 114010, "epoch": 678} {"train_loss": -9.641454696655273, "global_step": 114011, "epoch": 678} {"train_loss": -9.753281593322754, "global_step": 114012, "epoch": 678} {"train_loss": -9.71310806274414, "global_step": 114013, "epoch": 678} {"train_loss": -10.004661560058594, "global_step": 114014, "epoch": 678} {"train_loss": -9.674318313598633, "global_step": 114015, "epoch": 678} {"train_loss": -9.527837753295898, "global_step": 114016, "epoch": 678} {"train_loss": -9.985973358154297, "global_step": 114017, "epoch": 678} {"train_loss": -9.601983070373535, "global_step": 114018, "epoch": 678} {"train_loss": -10.062795639038086, "global_step": 114019, "epoch": 678} {"train_loss": -9.853922843933105, "global_step": 114020, "epoch": 678} {"train_loss": -9.791101455688477, "global_step": 114021, "epoch": 678} {"train_loss": -10.088301658630371, "global_step": 114022, "epoch": 678} {"train_loss": -9.921571731567383, "global_step": 114023, "epoch": 678} {"train_loss": -9.951602935791016, "global_step": 114024, "epoch": 678} {"train_loss": -10.090816497802734, "global_step": 114025, "epoch": 678} {"train_loss": -10.136906623840332, "global_step": 114026, "epoch": 678} {"train_loss": -9.999639511108398, "global_step": 114027, "epoch": 678} {"train_loss": -10.177483558654785, "global_step": 114028, "epoch": 678} {"train_loss": -9.991581916809082, "global_step": 114029, "epoch": 678} {"train_loss": -10.146915435791016, "global_step": 114030, "epoch": 678} {"train_loss": -10.233179092407227, "global_step": 114031, "epoch": 678} {"train_loss": -10.291126251220703, "global_step": 114032, "epoch": 678} {"train_loss": -10.302590370178223, "global_step": 114033, "epoch": 678} {"train_loss": -10.143024444580078, "global_step": 114034, "epoch": 678} {"train_loss": -10.0181245803833, "global_step": 114035, "epoch": 678} {"train_loss": -10.233139038085938, "global_step": 114036, "epoch": 678} {"train_loss": -10.280647277832031, "global_step": 114037, "epoch": 678} {"train_loss": -10.366975784301758, "global_step": 114038, "epoch": 678} {"train_loss": -10.33251953125, "global_step": 114039, "epoch": 678} {"train_loss": -10.371711730957031, "global_step": 114040, "epoch": 678} {"train_loss": -10.227258682250977, "global_step": 114041, "epoch": 678} {"train_loss": -10.243213653564453, "global_step": 114042, "epoch": 678} {"train_loss": -10.392671585083008, "global_step": 114043, "epoch": 678} {"train_loss": -10.157343864440918, "global_step": 114044, "epoch": 678} {"train_loss": -10.255598068237305, "global_step": 114045, "epoch": 678} {"train_loss": -10.387502670288086, "global_step": 114046, "epoch": 678} {"train_loss": -10.486734390258789, "global_step": 114047, "epoch": 678} {"train_loss": -10.24648666381836, "global_step": 114048, "epoch": 678} {"train_loss": -10.190317153930664, "global_step": 114049, "epoch": 678} {"train_loss": -10.439229965209961, "global_step": 114050, "epoch": 678} {"train_loss": -10.321220397949219, "global_step": 114051, "epoch": 678} {"train_loss": -10.542043685913086, "global_step": 114052, "epoch": 678} {"train_loss": -9.890667915344238, "global_step": 114053, "epoch": 678} {"train_loss": -10.393510818481445, "global_step": 114054, "epoch": 678} {"train_loss": -10.132119178771973, "global_step": 114055, "epoch": 678} {"train_loss": -9.91865348815918, "global_step": 114056, "epoch": 678} {"train_loss": -9.762859344482422, "global_step": 114057, "epoch": 678} {"train_loss": -10.006681442260742, "global_step": 114058, "epoch": 678} {"train_loss": -9.875402450561523, "global_step": 114059, "epoch": 678} {"train_loss": -9.532913208007812, "global_step": 114060, "epoch": 678} {"train_loss": -9.054368019104004, "global_step": 114061, "epoch": 678} {"train_loss": -9.863723754882812, "global_step": 114062, "epoch": 678} {"train_loss": -9.485301971435547, "global_step": 114063, "epoch": 678} {"train_loss": -9.76323127746582, "global_step": 114064, "epoch": 678} {"train_loss": -9.80234432220459, "global_step": 114065, "epoch": 678} {"train_loss": -9.917206764221191, "global_step": 114066, "epoch": 678} {"train_loss": -9.79659652709961, "global_step": 114067, "epoch": 678} {"train_loss": -9.657050132751465, "global_step": 114068, "epoch": 678} {"train_loss": -9.844474792480469, "global_step": 114069, "epoch": 678} {"train_loss": -9.656225204467773, "global_step": 114070, "epoch": 678} {"train_loss": -9.83652500879197, "global_step": 114071, "epoch": 678, "val_loss": 210435.0} {"train_loss": -9.945858001708984, "global_step": 114072, "epoch": 679} {"train_loss": -9.97739028930664, "global_step": 114073, "epoch": 679} {"train_loss": -9.99223518371582, "global_step": 114074, "epoch": 679} {"train_loss": -9.998855590820312, "global_step": 114075, "epoch": 679} {"train_loss": -10.088201522827148, "global_step": 114076, "epoch": 679} {"train_loss": -9.979900360107422, "global_step": 114077, "epoch": 679} {"train_loss": -9.971895217895508, "global_step": 114078, "epoch": 679} {"train_loss": -9.974008560180664, "global_step": 114079, "epoch": 679} {"train_loss": -10.085190773010254, "global_step": 114080, "epoch": 679} {"train_loss": -9.660049438476562, "global_step": 114081, "epoch": 679} {"train_loss": -9.890357971191406, "global_step": 114082, "epoch": 679} {"train_loss": -10.012907028198242, "global_step": 114083, "epoch": 679} {"train_loss": -9.999457359313965, "global_step": 114084, "epoch": 679} {"train_loss": -10.18226146697998, "global_step": 114085, "epoch": 679} {"train_loss": -9.797674179077148, "global_step": 114086, "epoch": 679} {"train_loss": -9.843905448913574, "global_step": 114087, "epoch": 679} {"train_loss": -10.010111808776855, "global_step": 114088, "epoch": 679} {"train_loss": -9.782783508300781, "global_step": 114089, "epoch": 679} {"train_loss": -9.912107467651367, "global_step": 114090, "epoch": 679} {"train_loss": -10.04172420501709, "global_step": 114091, "epoch": 679} {"train_loss": -9.899164199829102, "global_step": 114092, "epoch": 679} {"train_loss": -10.166444778442383, "global_step": 114093, "epoch": 679} {"train_loss": -9.625635147094727, "global_step": 114094, "epoch": 679} {"train_loss": -9.918736457824707, "global_step": 114095, "epoch": 679} {"train_loss": -9.54773235321045, "global_step": 114096, "epoch": 679} {"train_loss": -9.932096481323242, "global_step": 114097, "epoch": 679} {"train_loss": -9.822840690612793, "global_step": 114098, "epoch": 679} {"train_loss": -10.240859985351562, "global_step": 114099, "epoch": 679} {"train_loss": -9.845255851745605, "global_step": 114100, "epoch": 679} {"train_loss": -9.911937713623047, "global_step": 114101, "epoch": 679} {"train_loss": -10.164658546447754, "global_step": 114102, "epoch": 679} {"train_loss": -10.268257141113281, "global_step": 114103, "epoch": 679} {"train_loss": -10.209925651550293, "global_step": 114104, "epoch": 679} {"train_loss": -9.986177444458008, "global_step": 114105, "epoch": 679} {"train_loss": -10.275846481323242, "global_step": 114106, "epoch": 679} {"train_loss": -10.011407852172852, "global_step": 114107, "epoch": 679} {"train_loss": -10.185602188110352, "global_step": 114108, "epoch": 679} {"train_loss": -10.040618896484375, "global_step": 114109, "epoch": 679} {"train_loss": -10.117155075073242, "global_step": 114110, "epoch": 679} {"train_loss": -10.296915054321289, "global_step": 114111, "epoch": 679} {"train_loss": -10.055560111999512, "global_step": 114112, "epoch": 679} {"train_loss": -9.843672752380371, "global_step": 114113, "epoch": 679} {"train_loss": -9.988494873046875, "global_step": 114114, "epoch": 679} {"train_loss": -9.967132568359375, "global_step": 114115, "epoch": 679} {"train_loss": -9.947355270385742, "global_step": 114116, "epoch": 679} {"train_loss": -10.271522521972656, "global_step": 114117, "epoch": 679} {"train_loss": -10.49350643157959, "global_step": 114118, "epoch": 679} {"train_loss": -10.089286804199219, "global_step": 114119, "epoch": 679} {"train_loss": -10.077598571777344, "global_step": 114120, "epoch": 679} {"train_loss": -10.21847915649414, "global_step": 114121, "epoch": 679} {"train_loss": -10.117728233337402, "global_step": 114122, "epoch": 679} {"train_loss": -10.268312454223633, "global_step": 114123, "epoch": 679} {"train_loss": -10.110048294067383, "global_step": 114124, "epoch": 679} {"train_loss": -9.748802185058594, "global_step": 114125, "epoch": 679} {"train_loss": -9.836037635803223, "global_step": 114126, "epoch": 679} {"train_loss": -9.961488723754883, "global_step": 114127, "epoch": 679} {"train_loss": -9.754903793334961, "global_step": 114128, "epoch": 679} {"train_loss": -10.08268928527832, "global_step": 114129, "epoch": 679} {"train_loss": -10.010804176330566, "global_step": 114130, "epoch": 679} {"train_loss": -9.993205070495605, "global_step": 114131, "epoch": 679} {"train_loss": -10.248788833618164, "global_step": 114132, "epoch": 679} {"train_loss": -10.114505767822266, "global_step": 114133, "epoch": 679} {"train_loss": -10.051539421081543, "global_step": 114134, "epoch": 679} {"train_loss": -9.819586753845215, "global_step": 114135, "epoch": 679} {"train_loss": -10.034811019897461, "global_step": 114136, "epoch": 679} {"train_loss": -10.165700912475586, "global_step": 114137, "epoch": 679} {"train_loss": -10.068009376525879, "global_step": 114138, "epoch": 679} {"train_loss": -10.44777774810791, "global_step": 114139, "epoch": 679} {"train_loss": -10.243602752685547, "global_step": 114140, "epoch": 679} {"train_loss": -10.205923080444336, "global_step": 114141, "epoch": 679} {"train_loss": -10.06229019165039, "global_step": 114142, "epoch": 679} {"train_loss": -10.049640655517578, "global_step": 114143, "epoch": 679} {"train_loss": -10.092232704162598, "global_step": 114144, "epoch": 679} {"train_loss": -10.015091896057129, "global_step": 114145, "epoch": 679} {"train_loss": -10.214082717895508, "global_step": 114146, "epoch": 679} {"train_loss": -10.170562744140625, "global_step": 114147, "epoch": 679} {"train_loss": -10.137649536132812, "global_step": 114148, "epoch": 679} {"train_loss": -10.26738166809082, "global_step": 114149, "epoch": 679} {"train_loss": -10.174530029296875, "global_step": 114150, "epoch": 679} {"train_loss": -10.027925491333008, "global_step": 114151, "epoch": 679} {"train_loss": -10.146326065063477, "global_step": 114152, "epoch": 679} {"train_loss": -10.429437637329102, "global_step": 114153, "epoch": 679} {"train_loss": -10.20260238647461, "global_step": 114154, "epoch": 679} {"train_loss": -10.226600646972656, "global_step": 114155, "epoch": 679} {"train_loss": -10.136231422424316, "global_step": 114156, "epoch": 679} {"train_loss": -9.954212188720703, "global_step": 114157, "epoch": 679} {"train_loss": -10.137615203857422, "global_step": 114158, "epoch": 679} {"train_loss": -10.140565872192383, "global_step": 114159, "epoch": 679} {"train_loss": -9.966730117797852, "global_step": 114160, "epoch": 679} {"train_loss": -10.230116844177246, "global_step": 114161, "epoch": 679} {"train_loss": -9.693622589111328, "global_step": 114162, "epoch": 679} {"train_loss": -9.88088607788086, "global_step": 114163, "epoch": 679} {"train_loss": -10.258304595947266, "global_step": 114164, "epoch": 679} {"train_loss": -9.859342575073242, "global_step": 114165, "epoch": 679} {"train_loss": -10.286487579345703, "global_step": 114166, "epoch": 679} {"train_loss": -9.864629745483398, "global_step": 114167, "epoch": 679} {"train_loss": -10.278894424438477, "global_step": 114168, "epoch": 679} {"train_loss": -9.953330993652344, "global_step": 114169, "epoch": 679} {"train_loss": -10.05537223815918, "global_step": 114170, "epoch": 679} {"train_loss": -10.336841583251953, "global_step": 114171, "epoch": 679} {"train_loss": -10.129789352416992, "global_step": 114172, "epoch": 679} {"train_loss": -9.967296600341797, "global_step": 114173, "epoch": 679} {"train_loss": -9.772436141967773, "global_step": 114174, "epoch": 679} {"train_loss": -10.063434600830078, "global_step": 114175, "epoch": 679} {"train_loss": -9.884202003479004, "global_step": 114176, "epoch": 679} {"train_loss": -9.82159423828125, "global_step": 114177, "epoch": 679} {"train_loss": -9.825850486755371, "global_step": 114178, "epoch": 679} {"train_loss": -9.876954078674316, "global_step": 114179, "epoch": 679} {"train_loss": -10.260719299316406, "global_step": 114180, "epoch": 679} {"train_loss": -10.34062671661377, "global_step": 114181, "epoch": 679} {"train_loss": -9.97606086730957, "global_step": 114182, "epoch": 679} {"train_loss": -10.091076850891113, "global_step": 114183, "epoch": 679} {"train_loss": -10.06818675994873, "global_step": 114184, "epoch": 679} {"train_loss": -9.574451446533203, "global_step": 114185, "epoch": 679} {"train_loss": -9.97701644897461, "global_step": 114186, "epoch": 679} {"train_loss": -10.113031387329102, "global_step": 114187, "epoch": 679} {"train_loss": -9.958038330078125, "global_step": 114188, "epoch": 679} {"train_loss": -9.844770431518555, "global_step": 114189, "epoch": 679} {"train_loss": -9.9241361618042, "global_step": 114190, "epoch": 679} {"train_loss": -9.970244407653809, "global_step": 114191, "epoch": 679} {"train_loss": -9.90100383758545, "global_step": 114192, "epoch": 679} {"train_loss": -9.758808135986328, "global_step": 114193, "epoch": 679} {"train_loss": -9.61731243133545, "global_step": 114194, "epoch": 679} {"train_loss": -9.821751594543457, "global_step": 114195, "epoch": 679} {"train_loss": -9.605269432067871, "global_step": 114196, "epoch": 679} {"train_loss": -9.811399459838867, "global_step": 114197, "epoch": 679} {"train_loss": -9.82510757446289, "global_step": 114198, "epoch": 679} {"train_loss": -9.779296875, "global_step": 114199, "epoch": 679} {"train_loss": -10.165848731994629, "global_step": 114200, "epoch": 679} {"train_loss": -9.577947616577148, "global_step": 114201, "epoch": 679} {"train_loss": -9.98778247833252, "global_step": 114202, "epoch": 679} {"train_loss": -10.012792587280273, "global_step": 114203, "epoch": 679} {"train_loss": -9.814985275268555, "global_step": 114204, "epoch": 679} {"train_loss": -10.232061386108398, "global_step": 114205, "epoch": 679} {"train_loss": -9.945259094238281, "global_step": 114206, "epoch": 679} {"train_loss": -9.993233680725098, "global_step": 114207, "epoch": 679} {"train_loss": -10.008987426757812, "global_step": 114208, "epoch": 679} {"train_loss": -10.043512344360352, "global_step": 114209, "epoch": 679} {"train_loss": -10.216733932495117, "global_step": 114210, "epoch": 679} {"train_loss": -10.141853332519531, "global_step": 114211, "epoch": 679} {"train_loss": -10.09271240234375, "global_step": 114212, "epoch": 679} {"train_loss": -10.170679092407227, "global_step": 114213, "epoch": 679} {"train_loss": -10.0809326171875, "global_step": 114214, "epoch": 679} {"train_loss": -9.853677749633789, "global_step": 114215, "epoch": 679} {"train_loss": -10.068559646606445, "global_step": 114216, "epoch": 679} {"train_loss": -9.991710662841797, "global_step": 114217, "epoch": 679} {"train_loss": -10.017887115478516, "global_step": 114218, "epoch": 679} {"train_loss": -10.145870208740234, "global_step": 114219, "epoch": 679} {"train_loss": -10.279144287109375, "global_step": 114220, "epoch": 679} {"train_loss": -10.21324348449707, "global_step": 114221, "epoch": 679} {"train_loss": -10.008075714111328, "global_step": 114222, "epoch": 679} {"train_loss": -10.222923278808594, "global_step": 114223, "epoch": 679} {"train_loss": -9.991960525512695, "global_step": 114224, "epoch": 679} {"train_loss": -9.915201187133789, "global_step": 114225, "epoch": 679} {"train_loss": -9.93785572052002, "global_step": 114226, "epoch": 679} {"train_loss": -9.83781623840332, "global_step": 114227, "epoch": 679} {"train_loss": -9.941232681274414, "global_step": 114228, "epoch": 679} {"train_loss": -10.157144546508789, "global_step": 114229, "epoch": 679} {"train_loss": -10.310077667236328, "global_step": 114230, "epoch": 679} {"train_loss": -10.156179428100586, "global_step": 114231, "epoch": 679} {"train_loss": -10.186673164367676, "global_step": 114232, "epoch": 679} {"train_loss": -10.19366455078125, "global_step": 114233, "epoch": 679} {"train_loss": -10.152195930480957, "global_step": 114234, "epoch": 679} {"train_loss": -10.313243865966797, "global_step": 114235, "epoch": 679} {"train_loss": -10.207048416137695, "global_step": 114236, "epoch": 679} {"train_loss": -10.347128868103027, "global_step": 114237, "epoch": 679} {"train_loss": -9.887441635131836, "global_step": 114238, "epoch": 679} {"train_loss": -10.031032970973424, "global_step": 114239, "epoch": 679, "val_loss": 213516.359375} {"train_loss": -9.865018844604492, "global_step": 114240, "epoch": 680} {"train_loss": -9.47915267944336, "global_step": 114241, "epoch": 680} {"train_loss": -9.998757362365723, "global_step": 114242, "epoch": 680} {"train_loss": -9.3325777053833, "global_step": 114243, "epoch": 680} {"train_loss": -9.553927421569824, "global_step": 114244, "epoch": 680} {"train_loss": -9.404376983642578, "global_step": 114245, "epoch": 680} {"train_loss": -9.592910766601562, "global_step": 114246, "epoch": 680} {"train_loss": -9.861740112304688, "global_step": 114247, "epoch": 680} {"train_loss": -9.469026565551758, "global_step": 114248, "epoch": 680} {"train_loss": -9.821428298950195, "global_step": 114249, "epoch": 680} {"train_loss": -9.815868377685547, "global_step": 114250, "epoch": 680} {"train_loss": -9.441847801208496, "global_step": 114251, "epoch": 680} {"train_loss": -10.039077758789062, "global_step": 114252, "epoch": 680} {"train_loss": -9.636140823364258, "global_step": 114253, "epoch": 680} {"train_loss": -9.82357120513916, "global_step": 114254, "epoch": 680} {"train_loss": -9.946123123168945, "global_step": 114255, "epoch": 680} {"train_loss": -9.696939468383789, "global_step": 114256, "epoch": 680} {"train_loss": -9.870222091674805, "global_step": 114257, "epoch": 680} {"train_loss": -9.618122100830078, "global_step": 114258, "epoch": 680} {"train_loss": -10.07861328125, "global_step": 114259, "epoch": 680} {"train_loss": -9.960662841796875, "global_step": 114260, "epoch": 680} {"train_loss": -9.748727798461914, "global_step": 114261, "epoch": 680} {"train_loss": -9.902655601501465, "global_step": 114262, "epoch": 680} {"train_loss": -9.917983055114746, "global_step": 114263, "epoch": 680} {"train_loss": -9.801952362060547, "global_step": 114264, "epoch": 680} {"train_loss": -10.19532585144043, "global_step": 114265, "epoch": 680} {"train_loss": -10.074833869934082, "global_step": 114266, "epoch": 680} {"train_loss": -9.6287841796875, "global_step": 114267, "epoch": 680} {"train_loss": -10.11407470703125, "global_step": 114268, "epoch": 680} {"train_loss": -9.674694061279297, "global_step": 114269, "epoch": 680} {"train_loss": -10.006555557250977, "global_step": 114270, "epoch": 680} {"train_loss": -10.056468963623047, "global_step": 114271, "epoch": 680} {"train_loss": -9.988648414611816, "global_step": 114272, "epoch": 680} {"train_loss": -9.980656623840332, "global_step": 114273, "epoch": 680} {"train_loss": -10.228231430053711, "global_step": 114274, "epoch": 680} {"train_loss": -9.793210983276367, "global_step": 114275, "epoch": 680} {"train_loss": -10.399576187133789, "global_step": 114276, "epoch": 680} {"train_loss": -9.94420051574707, "global_step": 114277, "epoch": 680} {"train_loss": -10.171957015991211, "global_step": 114278, "epoch": 680} {"train_loss": -10.313386917114258, "global_step": 114279, "epoch": 680} {"train_loss": -10.126532554626465, "global_step": 114280, "epoch": 680} {"train_loss": -10.12520980834961, "global_step": 114281, "epoch": 680} {"train_loss": -10.287836074829102, "global_step": 114282, "epoch": 680} {"train_loss": -10.09094524383545, "global_step": 114283, "epoch": 680} {"train_loss": -10.203556060791016, "global_step": 114284, "epoch": 680} {"train_loss": -10.121023178100586, "global_step": 114285, "epoch": 680} {"train_loss": -10.129329681396484, "global_step": 114286, "epoch": 680} {"train_loss": -10.077751159667969, "global_step": 114287, "epoch": 680} {"train_loss": -10.167986869812012, "global_step": 114288, "epoch": 680} {"train_loss": -10.070392608642578, "global_step": 114289, "epoch": 680} {"train_loss": -10.450027465820312, "global_step": 114290, "epoch": 680} {"train_loss": -9.960047721862793, "global_step": 114291, "epoch": 680} {"train_loss": -10.33657169342041, "global_step": 114292, "epoch": 680} {"train_loss": -10.426323890686035, "global_step": 114293, "epoch": 680} {"train_loss": -10.014516830444336, "global_step": 114294, "epoch": 680} {"train_loss": -10.158546447753906, "global_step": 114295, "epoch": 680} {"train_loss": -10.206864356994629, "global_step": 114296, "epoch": 680} {"train_loss": -10.318022727966309, "global_step": 114297, "epoch": 680} {"train_loss": -9.988600730895996, "global_step": 114298, "epoch": 680} {"train_loss": -10.328926086425781, "global_step": 114299, "epoch": 680} {"train_loss": -10.140819549560547, "global_step": 114300, "epoch": 680} {"train_loss": -10.025827407836914, "global_step": 114301, "epoch": 680} {"train_loss": -10.418152809143066, "global_step": 114302, "epoch": 680} {"train_loss": -9.756449699401855, "global_step": 114303, "epoch": 680} {"train_loss": -9.695402145385742, "global_step": 114304, "epoch": 680} {"train_loss": -10.443571090698242, "global_step": 114305, "epoch": 680} {"train_loss": -10.064118385314941, "global_step": 114306, "epoch": 680} {"train_loss": -10.078729629516602, "global_step": 114307, "epoch": 680} {"train_loss": -9.827556610107422, "global_step": 114308, "epoch": 680} {"train_loss": -9.969537734985352, "global_step": 114309, "epoch": 680} {"train_loss": -9.803277969360352, "global_step": 114310, "epoch": 680} {"train_loss": -10.011271476745605, "global_step": 114311, "epoch": 680} {"train_loss": -10.158636093139648, "global_step": 114312, "epoch": 680} {"train_loss": -10.258604049682617, "global_step": 114313, "epoch": 680} {"train_loss": -9.981743812561035, "global_step": 114314, "epoch": 680} {"train_loss": -10.116605758666992, "global_step": 114315, "epoch": 680} {"train_loss": -10.111236572265625, "global_step": 114316, "epoch": 680} {"train_loss": -10.097428321838379, "global_step": 114317, "epoch": 680} {"train_loss": -10.31732177734375, "global_step": 114318, "epoch": 680} {"train_loss": -9.581241607666016, "global_step": 114319, "epoch": 680} {"train_loss": -9.999930381774902, "global_step": 114320, "epoch": 680} {"train_loss": -9.78223705291748, "global_step": 114321, "epoch": 680} {"train_loss": -9.378454208374023, "global_step": 114322, "epoch": 680} {"train_loss": -10.013465881347656, "global_step": 114323, "epoch": 680} {"train_loss": -9.36518669128418, "global_step": 114324, "epoch": 680} {"train_loss": -10.028573989868164, "global_step": 114325, "epoch": 680} {"train_loss": -9.935495376586914, "global_step": 114326, "epoch": 680} {"train_loss": -9.984638214111328, "global_step": 114327, "epoch": 680} {"train_loss": -10.074017524719238, "global_step": 114328, "epoch": 680} {"train_loss": -10.169063568115234, "global_step": 114329, "epoch": 680} {"train_loss": -9.79940414428711, "global_step": 114330, "epoch": 680} {"train_loss": -9.9850492477417, "global_step": 114331, "epoch": 680} {"train_loss": -9.794733047485352, "global_step": 114332, "epoch": 680} {"train_loss": -9.941854476928711, "global_step": 114333, "epoch": 680} {"train_loss": -10.01579475402832, "global_step": 114334, "epoch": 680} {"train_loss": -10.113617897033691, "global_step": 114335, "epoch": 680} {"train_loss": -10.259286880493164, "global_step": 114336, "epoch": 680} {"train_loss": -10.057306289672852, "global_step": 114337, "epoch": 680} {"train_loss": -9.77859878540039, "global_step": 114338, "epoch": 680} {"train_loss": -10.101363182067871, "global_step": 114339, "epoch": 680} {"train_loss": -9.847579002380371, "global_step": 114340, "epoch": 680} {"train_loss": -10.123085021972656, "global_step": 114341, "epoch": 680} {"train_loss": -10.076047897338867, "global_step": 114342, "epoch": 680} {"train_loss": -9.742408752441406, "global_step": 114343, "epoch": 680} {"train_loss": -10.033401489257812, "global_step": 114344, "epoch": 680} {"train_loss": -9.700033187866211, "global_step": 114345, "epoch": 680} {"train_loss": -10.163278579711914, "global_step": 114346, "epoch": 680} {"train_loss": -10.01809310913086, "global_step": 114347, "epoch": 680} {"train_loss": -9.984786987304688, "global_step": 114348, "epoch": 680} {"train_loss": -9.923341751098633, "global_step": 114349, "epoch": 680} {"train_loss": -9.937345504760742, "global_step": 114350, "epoch": 680} {"train_loss": -9.93541431427002, "global_step": 114351, "epoch": 680} {"train_loss": -10.316471099853516, "global_step": 114352, "epoch": 680} {"train_loss": -10.056822776794434, "global_step": 114353, "epoch": 680} {"train_loss": -9.868386268615723, "global_step": 114354, "epoch": 680} {"train_loss": -9.941177368164062, "global_step": 114355, "epoch": 680} {"train_loss": -9.740211486816406, "global_step": 114356, "epoch": 680} {"train_loss": -9.966001510620117, "global_step": 114357, "epoch": 680} {"train_loss": -9.716154098510742, "global_step": 114358, "epoch": 680} {"train_loss": -9.558384895324707, "global_step": 114359, "epoch": 680} {"train_loss": -9.54656982421875, "global_step": 114360, "epoch": 680} {"train_loss": -10.039901733398438, "global_step": 114361, "epoch": 680} {"train_loss": -9.764317512512207, "global_step": 114362, "epoch": 680} {"train_loss": -9.93078899383545, "global_step": 114363, "epoch": 680} {"train_loss": -10.147674560546875, "global_step": 114364, "epoch": 680} {"train_loss": -9.271240234375, "global_step": 114365, "epoch": 680} {"train_loss": -10.14012622833252, "global_step": 114366, "epoch": 680} {"train_loss": -9.898015975952148, "global_step": 114367, "epoch": 680} {"train_loss": -10.225394248962402, "global_step": 114368, "epoch": 680} {"train_loss": -9.80966567993164, "global_step": 114369, "epoch": 680} {"train_loss": -9.55252742767334, "global_step": 114370, "epoch": 680} {"train_loss": -9.779516220092773, "global_step": 114371, "epoch": 680} {"train_loss": -9.692012786865234, "global_step": 114372, "epoch": 680} {"train_loss": -9.835506439208984, "global_step": 114373, "epoch": 680} {"train_loss": -9.7129487991333, "global_step": 114374, "epoch": 680} {"train_loss": -10.095808029174805, "global_step": 114375, "epoch": 680} {"train_loss": -9.855180740356445, "global_step": 114376, "epoch": 680} {"train_loss": -9.997339248657227, "global_step": 114377, "epoch": 680} {"train_loss": -9.895695686340332, "global_step": 114378, "epoch": 680} {"train_loss": -9.86214828491211, "global_step": 114379, "epoch": 680} {"train_loss": -9.957820892333984, "global_step": 114380, "epoch": 680} {"train_loss": -10.230865478515625, "global_step": 114381, "epoch": 680} {"train_loss": -9.924348831176758, "global_step": 114382, "epoch": 680} {"train_loss": -9.99695110321045, "global_step": 114383, "epoch": 680} {"train_loss": -10.100298881530762, "global_step": 114384, "epoch": 680} {"train_loss": -10.078801155090332, "global_step": 114385, "epoch": 680} {"train_loss": -10.058384895324707, "global_step": 114386, "epoch": 680} {"train_loss": -10.116385459899902, "global_step": 114387, "epoch": 680} {"train_loss": -10.149429321289062, "global_step": 114388, "epoch": 680} {"train_loss": -10.048940658569336, "global_step": 114389, "epoch": 680} {"train_loss": -10.228893280029297, "global_step": 114390, "epoch": 680} {"train_loss": -10.122430801391602, "global_step": 114391, "epoch": 680} {"train_loss": -10.140491485595703, "global_step": 114392, "epoch": 680} {"train_loss": -10.227765083312988, "global_step": 114393, "epoch": 680} {"train_loss": -10.071942329406738, "global_step": 114394, "epoch": 680} {"train_loss": -10.105158805847168, "global_step": 114395, "epoch": 680} {"train_loss": -10.230195045471191, "global_step": 114396, "epoch": 680} {"train_loss": -10.276249885559082, "global_step": 114397, "epoch": 680} {"train_loss": -9.69314193725586, "global_step": 114398, "epoch": 680} {"train_loss": -10.19206428527832, "global_step": 114399, "epoch": 680} {"train_loss": -9.887223243713379, "global_step": 114400, "epoch": 680} {"train_loss": -9.5543794631958, "global_step": 114401, "epoch": 680} {"train_loss": -9.863418579101562, "global_step": 114402, "epoch": 680} {"train_loss": -9.490066528320312, "global_step": 114403, "epoch": 680} {"train_loss": -9.623246192932129, "global_step": 114404, "epoch": 680} {"train_loss": -9.450540542602539, "global_step": 114405, "epoch": 680} {"train_loss": -9.167524337768555, "global_step": 114406, "epoch": 680} {"train_loss": -9.952853736423311, "global_step": 114407, "epoch": 680, "val_loss": 214259.1875, "train_action_mse_error": 9.979772567749023} {"train_loss": -9.389999389648438, "global_step": 114408, "epoch": 681} {"train_loss": -9.911476135253906, "global_step": 114409, "epoch": 681} {"train_loss": -8.869340896606445, "global_step": 114410, "epoch": 681} {"train_loss": -10.060474395751953, "global_step": 114411, "epoch": 681} {"train_loss": -9.300063133239746, "global_step": 114412, "epoch": 681} {"train_loss": -10.058411598205566, "global_step": 114413, "epoch": 681} {"train_loss": -9.321720123291016, "global_step": 114414, "epoch": 681} {"train_loss": -10.085456848144531, "global_step": 114415, "epoch": 681} {"train_loss": -9.781073570251465, "global_step": 114416, "epoch": 681} {"train_loss": -9.762046813964844, "global_step": 114417, "epoch": 681} {"train_loss": -9.83067512512207, "global_step": 114418, "epoch": 681} {"train_loss": -9.824173927307129, "global_step": 114419, "epoch": 681} {"train_loss": -10.141314506530762, "global_step": 114420, "epoch": 681} {"train_loss": -9.909683227539062, "global_step": 114421, "epoch": 681} {"train_loss": -10.174346923828125, "global_step": 114422, "epoch": 681} {"train_loss": -10.156974792480469, "global_step": 114423, "epoch": 681} {"train_loss": -9.964345932006836, "global_step": 114424, "epoch": 681} {"train_loss": -10.015134811401367, "global_step": 114425, "epoch": 681} {"train_loss": -9.89691162109375, "global_step": 114426, "epoch": 681} {"train_loss": -10.138367652893066, "global_step": 114427, "epoch": 681} {"train_loss": -9.90133285522461, "global_step": 114428, "epoch": 681} {"train_loss": -10.065430641174316, "global_step": 114429, "epoch": 681} {"train_loss": -9.98090934753418, "global_step": 114430, "epoch": 681} {"train_loss": -9.87261962890625, "global_step": 114431, "epoch": 681} {"train_loss": -9.794936180114746, "global_step": 114432, "epoch": 681} {"train_loss": -9.960554122924805, "global_step": 114433, "epoch": 681} {"train_loss": -9.920347213745117, "global_step": 114434, "epoch": 681} {"train_loss": -10.054464340209961, "global_step": 114435, "epoch": 681} {"train_loss": -10.090131759643555, "global_step": 114436, "epoch": 681} {"train_loss": -9.879034042358398, "global_step": 114437, "epoch": 681} {"train_loss": -10.331188201904297, "global_step": 114438, "epoch": 681} {"train_loss": -10.101401329040527, "global_step": 114439, "epoch": 681} {"train_loss": -10.240362167358398, "global_step": 114440, "epoch": 681} {"train_loss": -10.155345916748047, "global_step": 114441, "epoch": 681} {"train_loss": -10.297916412353516, "global_step": 114442, "epoch": 681} {"train_loss": -10.149803161621094, "global_step": 114443, "epoch": 681} {"train_loss": -9.771041870117188, "global_step": 114444, "epoch": 681} {"train_loss": -9.890978813171387, "global_step": 114445, "epoch": 681} {"train_loss": -10.071817398071289, "global_step": 114446, "epoch": 681} {"train_loss": -9.97224235534668, "global_step": 114447, "epoch": 681} {"train_loss": -10.15229320526123, "global_step": 114448, "epoch": 681} {"train_loss": -10.00216293334961, "global_step": 114449, "epoch": 681} {"train_loss": -10.01408576965332, "global_step": 114450, "epoch": 681} {"train_loss": -10.31620979309082, "global_step": 114451, "epoch": 681} {"train_loss": -10.18427848815918, "global_step": 114452, "epoch": 681} {"train_loss": -9.85735034942627, "global_step": 114453, "epoch": 681} {"train_loss": -9.958913803100586, "global_step": 114454, "epoch": 681} {"train_loss": -10.15151596069336, "global_step": 114455, "epoch": 681} {"train_loss": -10.139883995056152, "global_step": 114456, "epoch": 681} {"train_loss": -10.055693626403809, "global_step": 114457, "epoch": 681} {"train_loss": -10.183778762817383, "global_step": 114458, "epoch": 681} {"train_loss": -10.256631851196289, "global_step": 114459, "epoch": 681} {"train_loss": -9.962251663208008, "global_step": 114460, "epoch": 681} {"train_loss": -10.415231704711914, "global_step": 114461, "epoch": 681} {"train_loss": -10.107185363769531, "global_step": 114462, "epoch": 681} {"train_loss": -10.396154403686523, "global_step": 114463, "epoch": 681} {"train_loss": -10.178343772888184, "global_step": 114464, "epoch": 681} {"train_loss": -10.531106948852539, "global_step": 114465, "epoch": 681} {"train_loss": -10.078765869140625, "global_step": 114466, "epoch": 681} {"train_loss": -10.148687362670898, "global_step": 114467, "epoch": 681} {"train_loss": -10.260807991027832, "global_step": 114468, "epoch": 681} {"train_loss": -10.406185150146484, "global_step": 114469, "epoch": 681} {"train_loss": -10.174773216247559, "global_step": 114470, "epoch": 681} {"train_loss": -10.179065704345703, "global_step": 114471, "epoch": 681} {"train_loss": -9.978466033935547, "global_step": 114472, "epoch": 681} {"train_loss": -10.255331993103027, "global_step": 114473, "epoch": 681} {"train_loss": -10.138038635253906, "global_step": 114474, "epoch": 681} {"train_loss": -9.946609497070312, "global_step": 114475, "epoch": 681} {"train_loss": -10.05981731414795, "global_step": 114476, "epoch": 681} {"train_loss": -10.345283508300781, "global_step": 114477, "epoch": 681} {"train_loss": -9.909198760986328, "global_step": 114478, "epoch": 681} {"train_loss": -10.225972175598145, "global_step": 114479, "epoch": 681} {"train_loss": -9.949163436889648, "global_step": 114480, "epoch": 681} {"train_loss": -9.89175033569336, "global_step": 114481, "epoch": 681} {"train_loss": -10.348306655883789, "global_step": 114482, "epoch": 681} {"train_loss": -9.96293830871582, "global_step": 114483, "epoch": 681} {"train_loss": -10.235770225524902, "global_step": 114484, "epoch": 681} {"train_loss": -9.922832489013672, "global_step": 114485, "epoch": 681} {"train_loss": -10.197047233581543, "global_step": 114486, "epoch": 681} {"train_loss": -9.920965194702148, "global_step": 114487, "epoch": 681} {"train_loss": -10.164270401000977, "global_step": 114488, "epoch": 681} {"train_loss": -10.009414672851562, "global_step": 114489, "epoch": 681} {"train_loss": -10.551918029785156, "global_step": 114490, "epoch": 681} {"train_loss": -10.087163925170898, "global_step": 114491, "epoch": 681} {"train_loss": -10.02089786529541, "global_step": 114492, "epoch": 681} {"train_loss": -9.701112747192383, "global_step": 114493, "epoch": 681} {"train_loss": -9.155710220336914, "global_step": 114494, "epoch": 681} {"train_loss": -10.032466888427734, "global_step": 114495, "epoch": 681} {"train_loss": -9.330373764038086, "global_step": 114496, "epoch": 681} {"train_loss": -9.431388854980469, "global_step": 114497, "epoch": 681} {"train_loss": -9.721545219421387, "global_step": 114498, "epoch": 681} {"train_loss": -9.908124923706055, "global_step": 114499, "epoch": 681} {"train_loss": -9.9762544631958, "global_step": 114500, "epoch": 681} {"train_loss": -9.591618537902832, "global_step": 114501, "epoch": 681} {"train_loss": -9.82874870300293, "global_step": 114502, "epoch": 681} {"train_loss": -9.828322410583496, "global_step": 114503, "epoch": 681} {"train_loss": -10.310943603515625, "global_step": 114504, "epoch": 681} {"train_loss": -9.823308944702148, "global_step": 114505, "epoch": 681} {"train_loss": -9.880464553833008, "global_step": 114506, "epoch": 681} {"train_loss": -10.168013572692871, "global_step": 114507, "epoch": 681} {"train_loss": -10.053084373474121, "global_step": 114508, "epoch": 681} {"train_loss": -10.457104682922363, "global_step": 114509, "epoch": 681} {"train_loss": -9.982524871826172, "global_step": 114510, "epoch": 681} {"train_loss": -9.95987606048584, "global_step": 114511, "epoch": 681} {"train_loss": -9.983487129211426, "global_step": 114512, "epoch": 681} {"train_loss": -10.037131309509277, "global_step": 114513, "epoch": 681} {"train_loss": -10.138679504394531, "global_step": 114514, "epoch": 681} {"train_loss": -10.168789863586426, "global_step": 114515, "epoch": 681} {"train_loss": -10.305795669555664, "global_step": 114516, "epoch": 681} {"train_loss": -10.459192276000977, "global_step": 114517, "epoch": 681} {"train_loss": -10.241090774536133, "global_step": 114518, "epoch": 681} {"train_loss": -10.104146957397461, "global_step": 114519, "epoch": 681} {"train_loss": -10.337894439697266, "global_step": 114520, "epoch": 681} {"train_loss": -10.186497688293457, "global_step": 114521, "epoch": 681} {"train_loss": -10.253890991210938, "global_step": 114522, "epoch": 681} {"train_loss": -10.338768005371094, "global_step": 114523, "epoch": 681} {"train_loss": -10.402999877929688, "global_step": 114524, "epoch": 681} {"train_loss": -10.371684074401855, "global_step": 114525, "epoch": 681} {"train_loss": -10.268632888793945, "global_step": 114526, "epoch": 681} {"train_loss": -10.318050384521484, "global_step": 114527, "epoch": 681} {"train_loss": -10.337005615234375, "global_step": 114528, "epoch": 681} {"train_loss": -10.276933670043945, "global_step": 114529, "epoch": 681} {"train_loss": -10.197795867919922, "global_step": 114530, "epoch": 681} {"train_loss": -10.261841773986816, "global_step": 114531, "epoch": 681} {"train_loss": -10.157225608825684, "global_step": 114532, "epoch": 681} {"train_loss": -10.428033828735352, "global_step": 114533, "epoch": 681} {"train_loss": -10.099542617797852, "global_step": 114534, "epoch": 681} {"train_loss": -9.843011856079102, "global_step": 114535, "epoch": 681} {"train_loss": -10.058743476867676, "global_step": 114536, "epoch": 681} {"train_loss": -10.047403335571289, "global_step": 114537, "epoch": 681} {"train_loss": -10.264545440673828, "global_step": 114538, "epoch": 681} {"train_loss": -10.110956192016602, "global_step": 114539, "epoch": 681} {"train_loss": -10.417718887329102, "global_step": 114540, "epoch": 681} {"train_loss": -9.601303100585938, "global_step": 114541, "epoch": 681} {"train_loss": -10.176945686340332, "global_step": 114542, "epoch": 681} {"train_loss": -9.755946159362793, "global_step": 114543, "epoch": 681} {"train_loss": -10.023406982421875, "global_step": 114544, "epoch": 681} {"train_loss": -9.39883804321289, "global_step": 114545, "epoch": 681} {"train_loss": -9.741479873657227, "global_step": 114546, "epoch": 681} {"train_loss": -9.779130935668945, "global_step": 114547, "epoch": 681} {"train_loss": -9.930185317993164, "global_step": 114548, "epoch": 681} {"train_loss": -9.961220741271973, "global_step": 114549, "epoch": 681} {"train_loss": -10.124378204345703, "global_step": 114550, "epoch": 681} {"train_loss": -10.043875694274902, "global_step": 114551, "epoch": 681} {"train_loss": -9.768442153930664, "global_step": 114552, "epoch": 681} {"train_loss": -10.033761024475098, "global_step": 114553, "epoch": 681} {"train_loss": -9.801980972290039, "global_step": 114554, "epoch": 681} {"train_loss": -10.084214210510254, "global_step": 114555, "epoch": 681} {"train_loss": -9.896368980407715, "global_step": 114556, "epoch": 681} {"train_loss": -9.968120574951172, "global_step": 114557, "epoch": 681} {"train_loss": -10.07967472076416, "global_step": 114558, "epoch": 681} {"train_loss": -9.683435440063477, "global_step": 114559, "epoch": 681} {"train_loss": -10.247848510742188, "global_step": 114560, "epoch": 681} {"train_loss": -10.257369995117188, "global_step": 114561, "epoch": 681} {"train_loss": -10.078518867492676, "global_step": 114562, "epoch": 681} {"train_loss": -10.128911972045898, "global_step": 114563, "epoch": 681} {"train_loss": -9.865377426147461, "global_step": 114564, "epoch": 681} {"train_loss": -10.092557907104492, "global_step": 114565, "epoch": 681} {"train_loss": -10.057575225830078, "global_step": 114566, "epoch": 681} {"train_loss": -10.203697204589844, "global_step": 114567, "epoch": 681} {"train_loss": -9.432933807373047, "global_step": 114568, "epoch": 681} {"train_loss": -9.980792999267578, "global_step": 114569, "epoch": 681} {"train_loss": -10.257125854492188, "global_step": 114570, "epoch": 681} {"train_loss": -10.033220291137695, "global_step": 114571, "epoch": 681} {"train_loss": -9.880950927734375, "global_step": 114572, "epoch": 681} {"train_loss": -10.066458702087402, "global_step": 114573, "epoch": 681} {"train_loss": -10.269044876098633, "global_step": 114574, "epoch": 681} {"train_loss": -10.034235812368847, "global_step": 114575, "epoch": 681, "val_loss": 214538.65625} {"train_loss": -10.07995891571045, "global_step": 114576, "epoch": 682} {"train_loss": -10.118515968322754, "global_step": 114577, "epoch": 682} {"train_loss": -10.023274421691895, "global_step": 114578, "epoch": 682} {"train_loss": -9.969321250915527, "global_step": 114579, "epoch": 682} {"train_loss": -10.221359252929688, "global_step": 114580, "epoch": 682} {"train_loss": -10.24227523803711, "global_step": 114581, "epoch": 682} {"train_loss": -10.299102783203125, "global_step": 114582, "epoch": 682} {"train_loss": -10.246879577636719, "global_step": 114583, "epoch": 682} {"train_loss": -10.208168983459473, "global_step": 114584, "epoch": 682} {"train_loss": -10.269248962402344, "global_step": 114585, "epoch": 682} {"train_loss": -10.12575912475586, "global_step": 114586, "epoch": 682} {"train_loss": -10.151912689208984, "global_step": 114587, "epoch": 682} {"train_loss": -10.295042991638184, "global_step": 114588, "epoch": 682} {"train_loss": -10.208463668823242, "global_step": 114589, "epoch": 682} {"train_loss": -10.375726699829102, "global_step": 114590, "epoch": 682} {"train_loss": -10.397167205810547, "global_step": 114591, "epoch": 682} {"train_loss": -10.132747650146484, "global_step": 114592, "epoch": 682} {"train_loss": -9.844573974609375, "global_step": 114593, "epoch": 682} {"train_loss": -10.308889389038086, "global_step": 114594, "epoch": 682} {"train_loss": -10.317609786987305, "global_step": 114595, "epoch": 682} {"train_loss": -10.224714279174805, "global_step": 114596, "epoch": 682} {"train_loss": -10.491949081420898, "global_step": 114597, "epoch": 682} {"train_loss": -10.316787719726562, "global_step": 114598, "epoch": 682} {"train_loss": -10.226078987121582, "global_step": 114599, "epoch": 682} {"train_loss": -10.170907974243164, "global_step": 114600, "epoch": 682} {"train_loss": -10.339603424072266, "global_step": 114601, "epoch": 682} {"train_loss": -9.884234428405762, "global_step": 114602, "epoch": 682} {"train_loss": -9.719804763793945, "global_step": 114603, "epoch": 682} {"train_loss": -10.170808792114258, "global_step": 114604, "epoch": 682} {"train_loss": -9.813393592834473, "global_step": 114605, "epoch": 682} {"train_loss": -10.132991790771484, "global_step": 114606, "epoch": 682} {"train_loss": -9.49485969543457, "global_step": 114607, "epoch": 682} {"train_loss": -9.93222713470459, "global_step": 114608, "epoch": 682} {"train_loss": -9.771451950073242, "global_step": 114609, "epoch": 682} {"train_loss": -9.841346740722656, "global_step": 114610, "epoch": 682} {"train_loss": -10.010063171386719, "global_step": 114611, "epoch": 682} {"train_loss": -9.901844024658203, "global_step": 114612, "epoch": 682} {"train_loss": -9.731934547424316, "global_step": 114613, "epoch": 682} {"train_loss": -9.835586547851562, "global_step": 114614, "epoch": 682} {"train_loss": -10.044539451599121, "global_step": 114615, "epoch": 682} {"train_loss": -9.590983390808105, "global_step": 114616, "epoch": 682} {"train_loss": -10.093573570251465, "global_step": 114617, "epoch": 682} {"train_loss": -9.728421211242676, "global_step": 114618, "epoch": 682} {"train_loss": -9.686084747314453, "global_step": 114619, "epoch": 682} {"train_loss": -9.817310333251953, "global_step": 114620, "epoch": 682} {"train_loss": -9.718818664550781, "global_step": 114621, "epoch": 682} {"train_loss": -9.501379013061523, "global_step": 114622, "epoch": 682} {"train_loss": -9.808089256286621, "global_step": 114623, "epoch": 682} {"train_loss": -9.712240219116211, "global_step": 114624, "epoch": 682} {"train_loss": -9.97618579864502, "global_step": 114625, "epoch": 682} {"train_loss": -9.574203491210938, "global_step": 114626, "epoch": 682} {"train_loss": -9.891828536987305, "global_step": 114627, "epoch": 682} {"train_loss": -9.843134880065918, "global_step": 114628, "epoch": 682} {"train_loss": -9.755922317504883, "global_step": 114629, "epoch": 682} {"train_loss": -9.681965827941895, "global_step": 114630, "epoch": 682} {"train_loss": -9.719423294067383, "global_step": 114631, "epoch": 682} {"train_loss": -9.390950202941895, "global_step": 114632, "epoch": 682} {"train_loss": -10.086078643798828, "global_step": 114633, "epoch": 682} {"train_loss": -9.644862174987793, "global_step": 114634, "epoch": 682} {"train_loss": -9.78183650970459, "global_step": 114635, "epoch": 682} {"train_loss": -9.810306549072266, "global_step": 114636, "epoch": 682} {"train_loss": -10.127484321594238, "global_step": 114637, "epoch": 682} {"train_loss": -9.938163757324219, "global_step": 114638, "epoch": 682} {"train_loss": -10.039017677307129, "global_step": 114639, "epoch": 682} {"train_loss": -9.829811096191406, "global_step": 114640, "epoch": 682} {"train_loss": -9.758731842041016, "global_step": 114641, "epoch": 682} {"train_loss": -9.858171463012695, "global_step": 114642, "epoch": 682} {"train_loss": -10.071011543273926, "global_step": 114643, "epoch": 682} {"train_loss": -9.772784233093262, "global_step": 114644, "epoch": 682} {"train_loss": -10.172443389892578, "global_step": 114645, "epoch": 682} {"train_loss": -10.000133514404297, "global_step": 114646, "epoch": 682} {"train_loss": -10.276106834411621, "global_step": 114647, "epoch": 682} {"train_loss": -9.803200721740723, "global_step": 114648, "epoch": 682} {"train_loss": -10.205425262451172, "global_step": 114649, "epoch": 682} {"train_loss": -10.151971817016602, "global_step": 114650, "epoch": 682} {"train_loss": -10.273992538452148, "global_step": 114651, "epoch": 682} {"train_loss": -10.026586532592773, "global_step": 114652, "epoch": 682} {"train_loss": -10.224498748779297, "global_step": 114653, "epoch": 682} {"train_loss": -10.046182632446289, "global_step": 114654, "epoch": 682} {"train_loss": -10.167303085327148, "global_step": 114655, "epoch": 682} {"train_loss": -9.731136322021484, "global_step": 114656, "epoch": 682} {"train_loss": -10.112895965576172, "global_step": 114657, "epoch": 682} {"train_loss": -10.035810470581055, "global_step": 114658, "epoch": 682} {"train_loss": -10.01335620880127, "global_step": 114659, "epoch": 682} {"train_loss": -9.888344764709473, "global_step": 114660, "epoch": 682} {"train_loss": -10.083837509155273, "global_step": 114661, "epoch": 682} {"train_loss": -10.075773239135742, "global_step": 114662, "epoch": 682} {"train_loss": -10.236700057983398, "global_step": 114663, "epoch": 682} {"train_loss": -9.87557601928711, "global_step": 114664, "epoch": 682} {"train_loss": -10.108708381652832, "global_step": 114665, "epoch": 682} {"train_loss": -9.910073280334473, "global_step": 114666, "epoch": 682} {"train_loss": -10.191140174865723, "global_step": 114667, "epoch": 682} {"train_loss": -9.797794342041016, "global_step": 114668, "epoch": 682} {"train_loss": -10.223882675170898, "global_step": 114669, "epoch": 682} {"train_loss": -10.198491096496582, "global_step": 114670, "epoch": 682} {"train_loss": -9.77281379699707, "global_step": 114671, "epoch": 682} {"train_loss": -10.02486515045166, "global_step": 114672, "epoch": 682} {"train_loss": -10.049545288085938, "global_step": 114673, "epoch": 682} {"train_loss": -10.241896629333496, "global_step": 114674, "epoch": 682} {"train_loss": -9.844594955444336, "global_step": 114675, "epoch": 682} {"train_loss": -9.655128479003906, "global_step": 114676, "epoch": 682} {"train_loss": -9.814733505249023, "global_step": 114677, "epoch": 682} {"train_loss": -9.478324890136719, "global_step": 114678, "epoch": 682} {"train_loss": -9.630794525146484, "global_step": 114679, "epoch": 682} {"train_loss": -9.120513916015625, "global_step": 114680, "epoch": 682} {"train_loss": -8.554084777832031, "global_step": 114681, "epoch": 682} {"train_loss": -10.011970520019531, "global_step": 114682, "epoch": 682} {"train_loss": -8.954318046569824, "global_step": 114683, "epoch": 682} {"train_loss": -9.816045761108398, "global_step": 114684, "epoch": 682} {"train_loss": -9.272172927856445, "global_step": 114685, "epoch": 682} {"train_loss": -9.688943862915039, "global_step": 114686, "epoch": 682} {"train_loss": -9.166807174682617, "global_step": 114687, "epoch": 682} {"train_loss": -9.00428581237793, "global_step": 114688, "epoch": 682} {"train_loss": -9.736565589904785, "global_step": 114689, "epoch": 682} {"train_loss": -9.439496994018555, "global_step": 114690, "epoch": 682} {"train_loss": -9.698509216308594, "global_step": 114691, "epoch": 682} {"train_loss": -9.781695365905762, "global_step": 114692, "epoch": 682} {"train_loss": -9.857706069946289, "global_step": 114693, "epoch": 682} {"train_loss": -9.538747787475586, "global_step": 114694, "epoch": 682} {"train_loss": -9.48806095123291, "global_step": 114695, "epoch": 682} {"train_loss": -9.851640701293945, "global_step": 114696, "epoch": 682} {"train_loss": -9.491065979003906, "global_step": 114697, "epoch": 682} {"train_loss": -9.42180061340332, "global_step": 114698, "epoch": 682} {"train_loss": -9.847040176391602, "global_step": 114699, "epoch": 682} {"train_loss": -9.478790283203125, "global_step": 114700, "epoch": 682} {"train_loss": -9.869714736938477, "global_step": 114701, "epoch": 682} {"train_loss": -9.8877534866333, "global_step": 114702, "epoch": 682} {"train_loss": -10.093832015991211, "global_step": 114703, "epoch": 682} {"train_loss": -9.983894348144531, "global_step": 114704, "epoch": 682} {"train_loss": -9.98237419128418, "global_step": 114705, "epoch": 682} {"train_loss": -9.958706855773926, "global_step": 114706, "epoch": 682} {"train_loss": -10.000408172607422, "global_step": 114707, "epoch": 682} {"train_loss": -9.764965057373047, "global_step": 114708, "epoch": 682} {"train_loss": -10.09699821472168, "global_step": 114709, "epoch": 682} {"train_loss": -10.180586814880371, "global_step": 114710, "epoch": 682} {"train_loss": -10.074426651000977, "global_step": 114711, "epoch": 682} {"train_loss": -10.341388702392578, "global_step": 114712, "epoch": 682} {"train_loss": -10.33791732788086, "global_step": 114713, "epoch": 682} {"train_loss": -10.185892105102539, "global_step": 114714, "epoch": 682} {"train_loss": -10.111387252807617, "global_step": 114715, "epoch": 682} {"train_loss": -10.290072441101074, "global_step": 114716, "epoch": 682} {"train_loss": -10.171415328979492, "global_step": 114717, "epoch": 682} {"train_loss": -10.080788612365723, "global_step": 114718, "epoch": 682} {"train_loss": -10.230344772338867, "global_step": 114719, "epoch": 682} {"train_loss": -10.174023628234863, "global_step": 114720, "epoch": 682} {"train_loss": -10.137067794799805, "global_step": 114721, "epoch": 682} {"train_loss": -10.160362243652344, "global_step": 114722, "epoch": 682} {"train_loss": -10.161064147949219, "global_step": 114723, "epoch": 682} {"train_loss": -10.113044738769531, "global_step": 114724, "epoch": 682} {"train_loss": -10.231949806213379, "global_step": 114725, "epoch": 682} {"train_loss": -10.255790710449219, "global_step": 114726, "epoch": 682} {"train_loss": -10.42558479309082, "global_step": 114727, "epoch": 682} {"train_loss": -10.104140281677246, "global_step": 114728, "epoch": 682} {"train_loss": -10.160408973693848, "global_step": 114729, "epoch": 682} {"train_loss": -10.506718635559082, "global_step": 114730, "epoch": 682} {"train_loss": -10.439886093139648, "global_step": 114731, "epoch": 682} {"train_loss": -10.240826606750488, "global_step": 114732, "epoch": 682} {"train_loss": -10.386150360107422, "global_step": 114733, "epoch": 682} {"train_loss": -10.166152954101562, "global_step": 114734, "epoch": 682} {"train_loss": -10.269729614257812, "global_step": 114735, "epoch": 682} {"train_loss": -10.299057006835938, "global_step": 114736, "epoch": 682} {"train_loss": -10.246610641479492, "global_step": 114737, "epoch": 682} {"train_loss": -10.325017929077148, "global_step": 114738, "epoch": 682} {"train_loss": -10.295886039733887, "global_step": 114739, "epoch": 682} {"train_loss": -10.166189193725586, "global_step": 114740, "epoch": 682} {"train_loss": -9.794271469116211, "global_step": 114741, "epoch": 682} {"train_loss": -10.325944900512695, "global_step": 114742, "epoch": 682} {"train_loss": -9.969405696505593, "global_step": 114743, "epoch": 682, "val_loss": 211705.859375} {"train_loss": -10.27220344543457, "global_step": 114744, "epoch": 683} {"train_loss": -10.157951354980469, "global_step": 114745, "epoch": 683} {"train_loss": -10.11007308959961, "global_step": 114746, "epoch": 683} {"train_loss": -9.912158012390137, "global_step": 114747, "epoch": 683} {"train_loss": -9.794297218322754, "global_step": 114748, "epoch": 683} {"train_loss": -10.326020240783691, "global_step": 114749, "epoch": 683} {"train_loss": -10.087518692016602, "global_step": 114750, "epoch": 683} {"train_loss": -9.770085334777832, "global_step": 114751, "epoch": 683} {"train_loss": -10.080811500549316, "global_step": 114752, "epoch": 683} {"train_loss": -9.808982849121094, "global_step": 114753, "epoch": 683} {"train_loss": -10.069923400878906, "global_step": 114754, "epoch": 683} {"train_loss": -10.261465072631836, "global_step": 114755, "epoch": 683} {"train_loss": -10.240232467651367, "global_step": 114756, "epoch": 683} {"train_loss": -10.128656387329102, "global_step": 114757, "epoch": 683} {"train_loss": -9.956366539001465, "global_step": 114758, "epoch": 683} {"train_loss": -9.864635467529297, "global_step": 114759, "epoch": 683} {"train_loss": -10.004236221313477, "global_step": 114760, "epoch": 683} {"train_loss": -9.881677627563477, "global_step": 114761, "epoch": 683} {"train_loss": -9.826347351074219, "global_step": 114762, "epoch": 683} {"train_loss": -10.148236274719238, "global_step": 114763, "epoch": 683} {"train_loss": -10.012332916259766, "global_step": 114764, "epoch": 683} {"train_loss": -10.31783676147461, "global_step": 114765, "epoch": 683} {"train_loss": -9.944002151489258, "global_step": 114766, "epoch": 683} {"train_loss": -9.965289115905762, "global_step": 114767, "epoch": 683} {"train_loss": -9.770788192749023, "global_step": 114768, "epoch": 683} {"train_loss": -9.99333381652832, "global_step": 114769, "epoch": 683} {"train_loss": -10.014507293701172, "global_step": 114770, "epoch": 683} {"train_loss": -9.99352741241455, "global_step": 114771, "epoch": 683} {"train_loss": -10.06509017944336, "global_step": 114772, "epoch": 683} {"train_loss": -9.881072998046875, "global_step": 114773, "epoch": 683} {"train_loss": -10.252058029174805, "global_step": 114774, "epoch": 683} {"train_loss": -9.901859283447266, "global_step": 114775, "epoch": 683} {"train_loss": -10.085272789001465, "global_step": 114776, "epoch": 683} {"train_loss": -9.988459587097168, "global_step": 114777, "epoch": 683} {"train_loss": -10.200834274291992, "global_step": 114778, "epoch": 683} {"train_loss": -9.817502975463867, "global_step": 114779, "epoch": 683} {"train_loss": -10.243207931518555, "global_step": 114780, "epoch": 683} {"train_loss": -9.865392684936523, "global_step": 114781, "epoch": 683} {"train_loss": -10.187777519226074, "global_step": 114782, "epoch": 683} {"train_loss": -9.969090461730957, "global_step": 114783, "epoch": 683} {"train_loss": -9.994364738464355, "global_step": 114784, "epoch": 683} {"train_loss": -10.1165189743042, "global_step": 114785, "epoch": 683} {"train_loss": -10.010229110717773, "global_step": 114786, "epoch": 683} {"train_loss": -9.905827522277832, "global_step": 114787, "epoch": 683} {"train_loss": -10.153009414672852, "global_step": 114788, "epoch": 683} {"train_loss": -10.203215599060059, "global_step": 114789, "epoch": 683} {"train_loss": -10.13493824005127, "global_step": 114790, "epoch": 683} {"train_loss": -10.016142845153809, "global_step": 114791, "epoch": 683} {"train_loss": -10.293035507202148, "global_step": 114792, "epoch": 683} {"train_loss": -10.160715103149414, "global_step": 114793, "epoch": 683} {"train_loss": -10.156684875488281, "global_step": 114794, "epoch": 683} {"train_loss": -10.202900886535645, "global_step": 114795, "epoch": 683} {"train_loss": -10.138737678527832, "global_step": 114796, "epoch": 683} {"train_loss": -10.068730354309082, "global_step": 114797, "epoch": 683} {"train_loss": -10.285741806030273, "global_step": 114798, "epoch": 683} {"train_loss": -10.161139488220215, "global_step": 114799, "epoch": 683} {"train_loss": -10.221875190734863, "global_step": 114800, "epoch": 683} {"train_loss": -10.245810508728027, "global_step": 114801, "epoch": 683} {"train_loss": -10.107038497924805, "global_step": 114802, "epoch": 683} {"train_loss": -10.035476684570312, "global_step": 114803, "epoch": 683} {"train_loss": -10.382229804992676, "global_step": 114804, "epoch": 683} {"train_loss": -10.288043975830078, "global_step": 114805, "epoch": 683} {"train_loss": -10.153448104858398, "global_step": 114806, "epoch": 683} {"train_loss": -10.138147354125977, "global_step": 114807, "epoch": 683} {"train_loss": -10.22846794128418, "global_step": 114808, "epoch": 683} {"train_loss": -10.230314254760742, "global_step": 114809, "epoch": 683} {"train_loss": -10.30753231048584, "global_step": 114810, "epoch": 683} {"train_loss": -10.260695457458496, "global_step": 114811, "epoch": 683} {"train_loss": -9.975637435913086, "global_step": 114812, "epoch": 683} {"train_loss": -10.300378799438477, "global_step": 114813, "epoch": 683} {"train_loss": -10.241591453552246, "global_step": 114814, "epoch": 683} {"train_loss": -10.140552520751953, "global_step": 114815, "epoch": 683} {"train_loss": -10.28030776977539, "global_step": 114816, "epoch": 683} {"train_loss": -10.178611755371094, "global_step": 114817, "epoch": 683} {"train_loss": -10.050325393676758, "global_step": 114818, "epoch": 683} {"train_loss": -9.930452346801758, "global_step": 114819, "epoch": 683} {"train_loss": -9.77159595489502, "global_step": 114820, "epoch": 683} {"train_loss": -9.920188903808594, "global_step": 114821, "epoch": 683} {"train_loss": -10.293872833251953, "global_step": 114822, "epoch": 683} {"train_loss": -9.381375312805176, "global_step": 114823, "epoch": 683} {"train_loss": -10.023033142089844, "global_step": 114824, "epoch": 683} {"train_loss": -9.776198387145996, "global_step": 114825, "epoch": 683} {"train_loss": -9.4839448928833, "global_step": 114826, "epoch": 683} {"train_loss": -10.145228385925293, "global_step": 114827, "epoch": 683} {"train_loss": -8.32442855834961, "global_step": 114828, "epoch": 683} {"train_loss": -9.429178237915039, "global_step": 114829, "epoch": 683} {"train_loss": -9.618383407592773, "global_step": 114830, "epoch": 683} {"train_loss": -9.142918586730957, "global_step": 114831, "epoch": 683} {"train_loss": -9.976421356201172, "global_step": 114832, "epoch": 683} {"train_loss": -9.33531379699707, "global_step": 114833, "epoch": 683} {"train_loss": -9.982492446899414, "global_step": 114834, "epoch": 683} {"train_loss": -9.558788299560547, "global_step": 114835, "epoch": 683} {"train_loss": -9.791595458984375, "global_step": 114836, "epoch": 683} {"train_loss": -9.403120040893555, "global_step": 114837, "epoch": 683} {"train_loss": -9.713750839233398, "global_step": 114838, "epoch": 683} {"train_loss": -8.948027610778809, "global_step": 114839, "epoch": 683} {"train_loss": -9.653358459472656, "global_step": 114840, "epoch": 683} {"train_loss": -9.612876892089844, "global_step": 114841, "epoch": 683} {"train_loss": -9.515016555786133, "global_step": 114842, "epoch": 683} {"train_loss": -9.645055770874023, "global_step": 114843, "epoch": 683} {"train_loss": -9.670093536376953, "global_step": 114844, "epoch": 683} {"train_loss": -9.6065034866333, "global_step": 114845, "epoch": 683} {"train_loss": -9.451539039611816, "global_step": 114846, "epoch": 683} {"train_loss": -9.757020950317383, "global_step": 114847, "epoch": 683} {"train_loss": -9.576488494873047, "global_step": 114848, "epoch": 683} {"train_loss": -9.034536361694336, "global_step": 114849, "epoch": 683} {"train_loss": -9.623926162719727, "global_step": 114850, "epoch": 683} {"train_loss": -9.72978687286377, "global_step": 114851, "epoch": 683} {"train_loss": -9.088273048400879, "global_step": 114852, "epoch": 683} {"train_loss": -9.746044158935547, "global_step": 114853, "epoch": 683} {"train_loss": -9.88278579711914, "global_step": 114854, "epoch": 683} {"train_loss": -9.357538223266602, "global_step": 114855, "epoch": 683} {"train_loss": -9.864139556884766, "global_step": 114856, "epoch": 683} {"train_loss": -9.618550300598145, "global_step": 114857, "epoch": 683} {"train_loss": -10.109275817871094, "global_step": 114858, "epoch": 683} {"train_loss": -9.67280101776123, "global_step": 114859, "epoch": 683} {"train_loss": -9.814399719238281, "global_step": 114860, "epoch": 683} {"train_loss": -9.737822532653809, "global_step": 114861, "epoch": 683} {"train_loss": -9.981769561767578, "global_step": 114862, "epoch": 683} {"train_loss": -10.133224487304688, "global_step": 114863, "epoch": 683} {"train_loss": -9.759566307067871, "global_step": 114864, "epoch": 683} {"train_loss": -9.93376350402832, "global_step": 114865, "epoch": 683} {"train_loss": -9.96341323852539, "global_step": 114866, "epoch": 683} {"train_loss": -10.042770385742188, "global_step": 114867, "epoch": 683} {"train_loss": -10.097135543823242, "global_step": 114868, "epoch": 683} {"train_loss": -10.061670303344727, "global_step": 114869, "epoch": 683} {"train_loss": -9.967244148254395, "global_step": 114870, "epoch": 683} {"train_loss": -10.072090148925781, "global_step": 114871, "epoch": 683} {"train_loss": -9.8291015625, "global_step": 114872, "epoch": 683} {"train_loss": -10.030769348144531, "global_step": 114873, "epoch": 683} {"train_loss": -10.388181686401367, "global_step": 114874, "epoch": 683} {"train_loss": -10.155305862426758, "global_step": 114875, "epoch": 683} {"train_loss": -10.094383239746094, "global_step": 114876, "epoch": 683} {"train_loss": -10.191605567932129, "global_step": 114877, "epoch": 683} {"train_loss": -10.141127586364746, "global_step": 114878, "epoch": 683} {"train_loss": -10.131163597106934, "global_step": 114879, "epoch": 683} {"train_loss": -10.084760665893555, "global_step": 114880, "epoch": 683} {"train_loss": -10.074914932250977, "global_step": 114881, "epoch": 683} {"train_loss": -10.214057922363281, "global_step": 114882, "epoch": 683} {"train_loss": -9.881271362304688, "global_step": 114883, "epoch": 683} {"train_loss": -10.407308578491211, "global_step": 114884, "epoch": 683} {"train_loss": -10.145882606506348, "global_step": 114885, "epoch": 683} {"train_loss": -10.191643714904785, "global_step": 114886, "epoch": 683} {"train_loss": -10.379463195800781, "global_step": 114887, "epoch": 683} {"train_loss": -9.997537612915039, "global_step": 114888, "epoch": 683} {"train_loss": -10.340082168579102, "global_step": 114889, "epoch": 683} {"train_loss": -10.005514144897461, "global_step": 114890, "epoch": 683} {"train_loss": -10.32957649230957, "global_step": 114891, "epoch": 683} {"train_loss": -10.061895370483398, "global_step": 114892, "epoch": 683} {"train_loss": -10.170001029968262, "global_step": 114893, "epoch": 683} {"train_loss": -10.168593406677246, "global_step": 114894, "epoch": 683} {"train_loss": -10.129289627075195, "global_step": 114895, "epoch": 683} {"train_loss": -9.899477005004883, "global_step": 114896, "epoch": 683} {"train_loss": -9.44974422454834, "global_step": 114897, "epoch": 683} {"train_loss": -9.669424057006836, "global_step": 114898, "epoch": 683} {"train_loss": -9.976099014282227, "global_step": 114899, "epoch": 683} {"train_loss": -9.603959083557129, "global_step": 114900, "epoch": 683} {"train_loss": -10.161794662475586, "global_step": 114901, "epoch": 683} {"train_loss": -9.692761421203613, "global_step": 114902, "epoch": 683} {"train_loss": -10.217751502990723, "global_step": 114903, "epoch": 683} {"train_loss": -9.649417877197266, "global_step": 114904, "epoch": 683} {"train_loss": -9.971879959106445, "global_step": 114905, "epoch": 683} {"train_loss": -10.114534378051758, "global_step": 114906, "epoch": 683} {"train_loss": -9.943655967712402, "global_step": 114907, "epoch": 683} {"train_loss": -9.859077453613281, "global_step": 114908, "epoch": 683} {"train_loss": -10.197700500488281, "global_step": 114909, "epoch": 683} {"train_loss": -9.923203468322754, "global_step": 114910, "epoch": 683} {"train_loss": -9.953986701511202, "global_step": 114911, "epoch": 683, "val_loss": 212652.078125} {"train_loss": -9.973862648010254, "global_step": 114912, "epoch": 684} {"train_loss": -9.959442138671875, "global_step": 114913, "epoch": 684} {"train_loss": -9.929281234741211, "global_step": 114914, "epoch": 684} {"train_loss": -9.661596298217773, "global_step": 114915, "epoch": 684} {"train_loss": -10.049485206604004, "global_step": 114916, "epoch": 684} {"train_loss": -9.486886978149414, "global_step": 114917, "epoch": 684} {"train_loss": -9.76003646850586, "global_step": 114918, "epoch": 684} {"train_loss": -9.516874313354492, "global_step": 114919, "epoch": 684} {"train_loss": -10.000263214111328, "global_step": 114920, "epoch": 684} {"train_loss": -9.800163269042969, "global_step": 114921, "epoch": 684} {"train_loss": -9.91464614868164, "global_step": 114922, "epoch": 684} {"train_loss": -10.09925365447998, "global_step": 114923, "epoch": 684} {"train_loss": -9.807939529418945, "global_step": 114924, "epoch": 684} {"train_loss": -10.078393936157227, "global_step": 114925, "epoch": 684} {"train_loss": -9.801849365234375, "global_step": 114926, "epoch": 684} {"train_loss": -9.974855422973633, "global_step": 114927, "epoch": 684} {"train_loss": -10.004871368408203, "global_step": 114928, "epoch": 684} {"train_loss": -9.9474458694458, "global_step": 114929, "epoch": 684} {"train_loss": -10.297527313232422, "global_step": 114930, "epoch": 684} {"train_loss": -9.86221694946289, "global_step": 114931, "epoch": 684} {"train_loss": -10.113399505615234, "global_step": 114932, "epoch": 684} {"train_loss": -10.049356460571289, "global_step": 114933, "epoch": 684} {"train_loss": -9.902750015258789, "global_step": 114934, "epoch": 684} {"train_loss": -9.967925071716309, "global_step": 114935, "epoch": 684} {"train_loss": -9.763858795166016, "global_step": 114936, "epoch": 684} {"train_loss": -9.976972579956055, "global_step": 114937, "epoch": 684} {"train_loss": -9.983400344848633, "global_step": 114938, "epoch": 684} {"train_loss": -9.990835189819336, "global_step": 114939, "epoch": 684} {"train_loss": -9.91826057434082, "global_step": 114940, "epoch": 684} {"train_loss": -10.38499641418457, "global_step": 114941, "epoch": 684} {"train_loss": -10.136805534362793, "global_step": 114942, "epoch": 684} {"train_loss": -9.980184555053711, "global_step": 114943, "epoch": 684} {"train_loss": -10.096397399902344, "global_step": 114944, "epoch": 684} {"train_loss": -10.103939056396484, "global_step": 114945, "epoch": 684} {"train_loss": -10.13894271850586, "global_step": 114946, "epoch": 684} {"train_loss": -10.013359069824219, "global_step": 114947, "epoch": 684} {"train_loss": -10.313176155090332, "global_step": 114948, "epoch": 684} {"train_loss": -10.202259063720703, "global_step": 114949, "epoch": 684} {"train_loss": -9.921430587768555, "global_step": 114950, "epoch": 684} {"train_loss": -10.018179893493652, "global_step": 114951, "epoch": 684} {"train_loss": -10.027244567871094, "global_step": 114952, "epoch": 684} {"train_loss": -10.453186988830566, "global_step": 114953, "epoch": 684} {"train_loss": -10.182149887084961, "global_step": 114954, "epoch": 684} {"train_loss": -10.361272811889648, "global_step": 114955, "epoch": 684} {"train_loss": -10.165653228759766, "global_step": 114956, "epoch": 684} {"train_loss": -9.98638916015625, "global_step": 114957, "epoch": 684} {"train_loss": -10.128754615783691, "global_step": 114958, "epoch": 684} {"train_loss": -10.089774131774902, "global_step": 114959, "epoch": 684} {"train_loss": -10.267189979553223, "global_step": 114960, "epoch": 684} {"train_loss": -10.155218124389648, "global_step": 114961, "epoch": 684} {"train_loss": -10.150917053222656, "global_step": 114962, "epoch": 684} {"train_loss": -10.15510082244873, "global_step": 114963, "epoch": 684} {"train_loss": -10.028973579406738, "global_step": 114964, "epoch": 684} {"train_loss": -10.342185020446777, "global_step": 114965, "epoch": 684} {"train_loss": -10.063047409057617, "global_step": 114966, "epoch": 684} {"train_loss": -10.493603706359863, "global_step": 114967, "epoch": 684} {"train_loss": -10.496674537658691, "global_step": 114968, "epoch": 684} {"train_loss": -10.014469146728516, "global_step": 114969, "epoch": 684} {"train_loss": -10.244471549987793, "global_step": 114970, "epoch": 684} {"train_loss": -10.409139633178711, "global_step": 114971, "epoch": 684} {"train_loss": -10.294258117675781, "global_step": 114972, "epoch": 684} {"train_loss": -10.320755004882812, "global_step": 114973, "epoch": 684} {"train_loss": -10.323172569274902, "global_step": 114974, "epoch": 684} {"train_loss": -10.31501579284668, "global_step": 114975, "epoch": 684} {"train_loss": -10.331355094909668, "global_step": 114976, "epoch": 684} {"train_loss": -10.221521377563477, "global_step": 114977, "epoch": 684} {"train_loss": -10.06949520111084, "global_step": 114978, "epoch": 684} {"train_loss": -9.851648330688477, "global_step": 114979, "epoch": 684} {"train_loss": -10.264013290405273, "global_step": 114980, "epoch": 684} {"train_loss": -10.26891803741455, "global_step": 114981, "epoch": 684} {"train_loss": -9.960489273071289, "global_step": 114982, "epoch": 684} {"train_loss": -9.519937515258789, "global_step": 114983, "epoch": 684} {"train_loss": -10.155616760253906, "global_step": 114984, "epoch": 684} {"train_loss": -10.08728313446045, "global_step": 114985, "epoch": 684} {"train_loss": -9.561651229858398, "global_step": 114986, "epoch": 684} {"train_loss": -9.87089729309082, "global_step": 114987, "epoch": 684} {"train_loss": -9.257014274597168, "global_step": 114988, "epoch": 684} {"train_loss": -9.925477981567383, "global_step": 114989, "epoch": 684} {"train_loss": -8.916207313537598, "global_step": 114990, "epoch": 684} {"train_loss": -9.586624145507812, "global_step": 114991, "epoch": 684} {"train_loss": -9.52420425415039, "global_step": 114992, "epoch": 684} {"train_loss": -9.18825626373291, "global_step": 114993, "epoch": 684} {"train_loss": -9.419859886169434, "global_step": 114994, "epoch": 684} {"train_loss": -9.691669464111328, "global_step": 114995, "epoch": 684} {"train_loss": -9.543349266052246, "global_step": 114996, "epoch": 684} {"train_loss": -9.83868408203125, "global_step": 114997, "epoch": 684} {"train_loss": -9.656829833984375, "global_step": 114998, "epoch": 684} {"train_loss": -10.028560638427734, "global_step": 114999, "epoch": 684} {"train_loss": -10.01911449432373, "global_step": 115000, "epoch": 684} {"train_loss": -9.44253158569336, "global_step": 115001, "epoch": 684} {"train_loss": -9.953269958496094, "global_step": 115002, "epoch": 684} {"train_loss": -9.727972984313965, "global_step": 115003, "epoch": 684} {"train_loss": -9.929550170898438, "global_step": 115004, "epoch": 684} {"train_loss": -9.813072204589844, "global_step": 115005, "epoch": 684} {"train_loss": -9.808599472045898, "global_step": 115006, "epoch": 684} {"train_loss": -9.85369873046875, "global_step": 115007, "epoch": 684} {"train_loss": -9.985207557678223, "global_step": 115008, "epoch": 684} {"train_loss": -9.717146873474121, "global_step": 115009, "epoch": 684} {"train_loss": -9.960687637329102, "global_step": 115010, "epoch": 684} {"train_loss": -9.89271354675293, "global_step": 115011, "epoch": 684} {"train_loss": -9.593290328979492, "global_step": 115012, "epoch": 684} {"train_loss": -9.929096221923828, "global_step": 115013, "epoch": 684} {"train_loss": -9.636907577514648, "global_step": 115014, "epoch": 684} {"train_loss": -9.781013488769531, "global_step": 115015, "epoch": 684} {"train_loss": -9.870445251464844, "global_step": 115016, "epoch": 684} {"train_loss": -9.910335540771484, "global_step": 115017, "epoch": 684} {"train_loss": -9.697569847106934, "global_step": 115018, "epoch": 684} {"train_loss": -9.770084381103516, "global_step": 115019, "epoch": 684} {"train_loss": -9.836220741271973, "global_step": 115020, "epoch": 684} {"train_loss": -10.118342399597168, "global_step": 115021, "epoch": 684} {"train_loss": -9.563594818115234, "global_step": 115022, "epoch": 684} {"train_loss": -9.823585510253906, "global_step": 115023, "epoch": 684} {"train_loss": -9.678304672241211, "global_step": 115024, "epoch": 684} {"train_loss": -10.104005813598633, "global_step": 115025, "epoch": 684} {"train_loss": -9.588762283325195, "global_step": 115026, "epoch": 684} {"train_loss": -9.923643112182617, "global_step": 115027, "epoch": 684} {"train_loss": -9.930212020874023, "global_step": 115028, "epoch": 684} {"train_loss": -9.835037231445312, "global_step": 115029, "epoch": 684} {"train_loss": -10.014726638793945, "global_step": 115030, "epoch": 684} {"train_loss": -9.562349319458008, "global_step": 115031, "epoch": 684} {"train_loss": -10.087569236755371, "global_step": 115032, "epoch": 684} {"train_loss": -9.79923152923584, "global_step": 115033, "epoch": 684} {"train_loss": -9.95712661743164, "global_step": 115034, "epoch": 684} {"train_loss": -10.226261138916016, "global_step": 115035, "epoch": 684} {"train_loss": -10.29472541809082, "global_step": 115036, "epoch": 684} {"train_loss": -9.975227355957031, "global_step": 115037, "epoch": 684} {"train_loss": -9.982229232788086, "global_step": 115038, "epoch": 684} {"train_loss": -9.85644245147705, "global_step": 115039, "epoch": 684} {"train_loss": -10.07939338684082, "global_step": 115040, "epoch": 684} {"train_loss": -10.190288543701172, "global_step": 115041, "epoch": 684} {"train_loss": -10.075885772705078, "global_step": 115042, "epoch": 684} {"train_loss": -10.010562896728516, "global_step": 115043, "epoch": 684} {"train_loss": -10.194210052490234, "global_step": 115044, "epoch": 684} {"train_loss": -9.988752365112305, "global_step": 115045, "epoch": 684} {"train_loss": -10.209712982177734, "global_step": 115046, "epoch": 684} {"train_loss": -10.159269332885742, "global_step": 115047, "epoch": 684} {"train_loss": -9.901835441589355, "global_step": 115048, "epoch": 684} {"train_loss": -10.280029296875, "global_step": 115049, "epoch": 684} {"train_loss": -9.99819564819336, "global_step": 115050, "epoch": 684} {"train_loss": -10.295652389526367, "global_step": 115051, "epoch": 684} {"train_loss": -10.065292358398438, "global_step": 115052, "epoch": 684} {"train_loss": -9.929448127746582, "global_step": 115053, "epoch": 684} {"train_loss": -10.07322883605957, "global_step": 115054, "epoch": 684} {"train_loss": -10.188636779785156, "global_step": 115055, "epoch": 684} {"train_loss": -9.909250259399414, "global_step": 115056, "epoch": 684} {"train_loss": -10.136984825134277, "global_step": 115057, "epoch": 684} {"train_loss": -9.774871826171875, "global_step": 115058, "epoch": 684} {"train_loss": -10.01774787902832, "global_step": 115059, "epoch": 684} {"train_loss": -10.051445960998535, "global_step": 115060, "epoch": 684} {"train_loss": -9.918315887451172, "global_step": 115061, "epoch": 684} {"train_loss": -9.746817588806152, "global_step": 115062, "epoch": 684} {"train_loss": -10.220499038696289, "global_step": 115063, "epoch": 684} {"train_loss": -9.340652465820312, "global_step": 115064, "epoch": 684} {"train_loss": -10.258829116821289, "global_step": 115065, "epoch": 684} {"train_loss": -9.443281173706055, "global_step": 115066, "epoch": 684} {"train_loss": -10.091590881347656, "global_step": 115067, "epoch": 684} {"train_loss": -10.089917182922363, "global_step": 115068, "epoch": 684} {"train_loss": -9.436315536499023, "global_step": 115069, "epoch": 684} {"train_loss": -10.200799942016602, "global_step": 115070, "epoch": 684} {"train_loss": -9.644739151000977, "global_step": 115071, "epoch": 684} {"train_loss": -9.69184684753418, "global_step": 115072, "epoch": 684} {"train_loss": -9.229643821716309, "global_step": 115073, "epoch": 684} {"train_loss": -9.224164009094238, "global_step": 115074, "epoch": 684} {"train_loss": -9.08896255493164, "global_step": 115075, "epoch": 684} {"train_loss": -9.135207176208496, "global_step": 115076, "epoch": 684} {"train_loss": -9.99763298034668, "global_step": 115077, "epoch": 684} {"train_loss": -9.414092063903809, "global_step": 115078, "epoch": 684} {"train_loss": -9.93549380983625, "global_step": 115079, "epoch": 684, "val_loss": 213772.5625} {"train_loss": -9.517229080200195, "global_step": 115080, "epoch": 685} {"train_loss": -9.712850570678711, "global_step": 115081, "epoch": 685} {"train_loss": -9.659923553466797, "global_step": 115082, "epoch": 685} {"train_loss": -9.592456817626953, "global_step": 115083, "epoch": 685} {"train_loss": -9.648758888244629, "global_step": 115084, "epoch": 685} {"train_loss": -9.762744903564453, "global_step": 115085, "epoch": 685} {"train_loss": -9.597293853759766, "global_step": 115086, "epoch": 685} {"train_loss": -9.42959976196289, "global_step": 115087, "epoch": 685} {"train_loss": -9.792038917541504, "global_step": 115088, "epoch": 685} {"train_loss": -9.860429763793945, "global_step": 115089, "epoch": 685} {"train_loss": -9.304168701171875, "global_step": 115090, "epoch": 685} {"train_loss": -10.232317924499512, "global_step": 115091, "epoch": 685} {"train_loss": -9.646810531616211, "global_step": 115092, "epoch": 685} {"train_loss": -9.679590225219727, "global_step": 115093, "epoch": 685} {"train_loss": -9.957609176635742, "global_step": 115094, "epoch": 685} {"train_loss": -9.804571151733398, "global_step": 115095, "epoch": 685} {"train_loss": -9.889080047607422, "global_step": 115096, "epoch": 685} {"train_loss": -9.935125350952148, "global_step": 115097, "epoch": 685} {"train_loss": -9.795482635498047, "global_step": 115098, "epoch": 685} {"train_loss": -10.018848419189453, "global_step": 115099, "epoch": 685} {"train_loss": -10.02303695678711, "global_step": 115100, "epoch": 685} {"train_loss": -9.98237419128418, "global_step": 115101, "epoch": 685} {"train_loss": -9.869332313537598, "global_step": 115102, "epoch": 685} {"train_loss": -10.044635772705078, "global_step": 115103, "epoch": 685} {"train_loss": -10.064131736755371, "global_step": 115104, "epoch": 685} {"train_loss": -9.994576454162598, "global_step": 115105, "epoch": 685} {"train_loss": -9.70859146118164, "global_step": 115106, "epoch": 685} {"train_loss": -9.978158950805664, "global_step": 115107, "epoch": 685} {"train_loss": -9.911048889160156, "global_step": 115108, "epoch": 685} {"train_loss": -9.904473304748535, "global_step": 115109, "epoch": 685} {"train_loss": -9.94697380065918, "global_step": 115110, "epoch": 685} {"train_loss": -10.122968673706055, "global_step": 115111, "epoch": 685} {"train_loss": -10.218894958496094, "global_step": 115112, "epoch": 685} {"train_loss": -9.894647598266602, "global_step": 115113, "epoch": 685} {"train_loss": -10.199555397033691, "global_step": 115114, "epoch": 685} {"train_loss": -10.1542387008667, "global_step": 115115, "epoch": 685} {"train_loss": -10.204678535461426, "global_step": 115116, "epoch": 685} {"train_loss": -10.418015480041504, "global_step": 115117, "epoch": 685} {"train_loss": -10.154335021972656, "global_step": 115118, "epoch": 685} {"train_loss": -10.245756149291992, "global_step": 115119, "epoch": 685} {"train_loss": -10.240373611450195, "global_step": 115120, "epoch": 685} {"train_loss": -10.286312103271484, "global_step": 115121, "epoch": 685} {"train_loss": -10.283821105957031, "global_step": 115122, "epoch": 685} {"train_loss": -10.26229190826416, "global_step": 115123, "epoch": 685} {"train_loss": -10.086421966552734, "global_step": 115124, "epoch": 685} {"train_loss": -10.324536323547363, "global_step": 115125, "epoch": 685} {"train_loss": -10.169780731201172, "global_step": 115126, "epoch": 685} {"train_loss": -10.422344207763672, "global_step": 115127, "epoch": 685} {"train_loss": -10.140327453613281, "global_step": 115128, "epoch": 685} {"train_loss": -10.422199249267578, "global_step": 115129, "epoch": 685} {"train_loss": -10.241856575012207, "global_step": 115130, "epoch": 685} {"train_loss": -10.164695739746094, "global_step": 115131, "epoch": 685} {"train_loss": -10.211817741394043, "global_step": 115132, "epoch": 685} {"train_loss": -10.149471282958984, "global_step": 115133, "epoch": 685} {"train_loss": -9.913686752319336, "global_step": 115134, "epoch": 685} {"train_loss": -10.147014617919922, "global_step": 115135, "epoch": 685} {"train_loss": -10.326156616210938, "global_step": 115136, "epoch": 685} {"train_loss": -9.706737518310547, "global_step": 115137, "epoch": 685} {"train_loss": -10.082012176513672, "global_step": 115138, "epoch": 685} {"train_loss": -10.003008842468262, "global_step": 115139, "epoch": 685} {"train_loss": -9.679378509521484, "global_step": 115140, "epoch": 685} {"train_loss": -10.412007331848145, "global_step": 115141, "epoch": 685} {"train_loss": -10.021873474121094, "global_step": 115142, "epoch": 685} {"train_loss": -10.066086769104004, "global_step": 115143, "epoch": 685} {"train_loss": -10.292173385620117, "global_step": 115144, "epoch": 685} {"train_loss": -9.99048137664795, "global_step": 115145, "epoch": 685} {"train_loss": -10.26331901550293, "global_step": 115146, "epoch": 685} {"train_loss": -10.249927520751953, "global_step": 115147, "epoch": 685} {"train_loss": -10.056028366088867, "global_step": 115148, "epoch": 685} {"train_loss": -10.101248741149902, "global_step": 115149, "epoch": 685} {"train_loss": -10.395920753479004, "global_step": 115150, "epoch": 685} {"train_loss": -9.627829551696777, "global_step": 115151, "epoch": 685} {"train_loss": -9.938413619995117, "global_step": 115152, "epoch": 685} {"train_loss": -10.250007629394531, "global_step": 115153, "epoch": 685} {"train_loss": -10.007515907287598, "global_step": 115154, "epoch": 685} {"train_loss": -10.143226623535156, "global_step": 115155, "epoch": 685} {"train_loss": -9.532167434692383, "global_step": 115156, "epoch": 685} {"train_loss": -9.909686088562012, "global_step": 115157, "epoch": 685} {"train_loss": -10.02805233001709, "global_step": 115158, "epoch": 685} {"train_loss": -10.156219482421875, "global_step": 115159, "epoch": 685} {"train_loss": -10.351572036743164, "global_step": 115160, "epoch": 685} {"train_loss": -10.012609481811523, "global_step": 115161, "epoch": 685} {"train_loss": -10.100387573242188, "global_step": 115162, "epoch": 685} {"train_loss": -9.906744003295898, "global_step": 115163, "epoch": 685} {"train_loss": -9.144752502441406, "global_step": 115164, "epoch": 685} {"train_loss": -9.77333927154541, "global_step": 115165, "epoch": 685} {"train_loss": -9.30500602722168, "global_step": 115166, "epoch": 685} {"train_loss": -9.587907791137695, "global_step": 115167, "epoch": 685} {"train_loss": -9.58411979675293, "global_step": 115168, "epoch": 685} {"train_loss": -9.60888671875, "global_step": 115169, "epoch": 685} {"train_loss": -9.355389595031738, "global_step": 115170, "epoch": 685} {"train_loss": -9.587345123291016, "global_step": 115171, "epoch": 685} {"train_loss": -9.321833610534668, "global_step": 115172, "epoch": 685} {"train_loss": -9.757314682006836, "global_step": 115173, "epoch": 685} {"train_loss": -9.254074096679688, "global_step": 115174, "epoch": 685} {"train_loss": -9.494471549987793, "global_step": 115175, "epoch": 685} {"train_loss": -9.717931747436523, "global_step": 115176, "epoch": 685} {"train_loss": -9.46288013458252, "global_step": 115177, "epoch": 685} {"train_loss": -9.897039413452148, "global_step": 115178, "epoch": 685} {"train_loss": -9.608366012573242, "global_step": 115179, "epoch": 685} {"train_loss": -9.808553695678711, "global_step": 115180, "epoch": 685} {"train_loss": -9.878327369689941, "global_step": 115181, "epoch": 685} {"train_loss": -9.9857177734375, "global_step": 115182, "epoch": 685} {"train_loss": -9.805703163146973, "global_step": 115183, "epoch": 685} {"train_loss": -10.018454551696777, "global_step": 115184, "epoch": 685} {"train_loss": -9.866133689880371, "global_step": 115185, "epoch": 685} {"train_loss": -9.872424125671387, "global_step": 115186, "epoch": 685} {"train_loss": -10.160921096801758, "global_step": 115187, "epoch": 685} {"train_loss": -10.061903953552246, "global_step": 115188, "epoch": 685} {"train_loss": -10.197593688964844, "global_step": 115189, "epoch": 685} {"train_loss": -10.01365852355957, "global_step": 115190, "epoch": 685} {"train_loss": -9.959177017211914, "global_step": 115191, "epoch": 685} {"train_loss": -10.22707748413086, "global_step": 115192, "epoch": 685} {"train_loss": -10.012043952941895, "global_step": 115193, "epoch": 685} {"train_loss": -10.146956443786621, "global_step": 115194, "epoch": 685} {"train_loss": -9.99869155883789, "global_step": 115195, "epoch": 685} {"train_loss": -9.977134704589844, "global_step": 115196, "epoch": 685} {"train_loss": -10.273475646972656, "global_step": 115197, "epoch": 685} {"train_loss": -10.054567337036133, "global_step": 115198, "epoch": 685} {"train_loss": -10.00485610961914, "global_step": 115199, "epoch": 685} {"train_loss": -10.228704452514648, "global_step": 115200, "epoch": 685} {"train_loss": -10.086217880249023, "global_step": 115201, "epoch": 685} {"train_loss": -10.176462173461914, "global_step": 115202, "epoch": 685} {"train_loss": -10.028817176818848, "global_step": 115203, "epoch": 685} {"train_loss": -10.162732124328613, "global_step": 115204, "epoch": 685} {"train_loss": -10.132150650024414, "global_step": 115205, "epoch": 685} {"train_loss": -9.918425559997559, "global_step": 115206, "epoch": 685} {"train_loss": -10.158878326416016, "global_step": 115207, "epoch": 685} {"train_loss": -10.097942352294922, "global_step": 115208, "epoch": 685} {"train_loss": -10.0682373046875, "global_step": 115209, "epoch": 685} {"train_loss": -10.256351470947266, "global_step": 115210, "epoch": 685} {"train_loss": -10.317622184753418, "global_step": 115211, "epoch": 685} {"train_loss": -10.204753875732422, "global_step": 115212, "epoch": 685} {"train_loss": -10.215753555297852, "global_step": 115213, "epoch": 685} {"train_loss": -10.328644752502441, "global_step": 115214, "epoch": 685} {"train_loss": -10.169687271118164, "global_step": 115215, "epoch": 685} {"train_loss": -10.375454902648926, "global_step": 115216, "epoch": 685} {"train_loss": -10.111695289611816, "global_step": 115217, "epoch": 685} {"train_loss": -10.104616165161133, "global_step": 115218, "epoch": 685} {"train_loss": -10.318864822387695, "global_step": 115219, "epoch": 685} {"train_loss": -10.026761054992676, "global_step": 115220, "epoch": 685} {"train_loss": -10.170116424560547, "global_step": 115221, "epoch": 685} {"train_loss": -10.456005096435547, "global_step": 115222, "epoch": 685} {"train_loss": -10.110304832458496, "global_step": 115223, "epoch": 685} {"train_loss": -10.344974517822266, "global_step": 115224, "epoch": 685} {"train_loss": -10.042618751525879, "global_step": 115225, "epoch": 685} {"train_loss": -10.169675827026367, "global_step": 115226, "epoch": 685} {"train_loss": -10.289328575134277, "global_step": 115227, "epoch": 685} {"train_loss": -10.412577629089355, "global_step": 115228, "epoch": 685} {"train_loss": -10.337379455566406, "global_step": 115229, "epoch": 685} {"train_loss": -10.065231323242188, "global_step": 115230, "epoch": 685} {"train_loss": -10.173049926757812, "global_step": 115231, "epoch": 685} {"train_loss": -9.936393737792969, "global_step": 115232, "epoch": 685} {"train_loss": -10.105055809020996, "global_step": 115233, "epoch": 685} {"train_loss": -9.993587493896484, "global_step": 115234, "epoch": 685} {"train_loss": -10.184733390808105, "global_step": 115235, "epoch": 685} {"train_loss": -10.153736114501953, "global_step": 115236, "epoch": 685} {"train_loss": -10.00829029083252, "global_step": 115237, "epoch": 685} {"train_loss": -10.282959938049316, "global_step": 115238, "epoch": 685} {"train_loss": -10.217710494995117, "global_step": 115239, "epoch": 685} {"train_loss": -10.310335159301758, "global_step": 115240, "epoch": 685} {"train_loss": -10.190832138061523, "global_step": 115241, "epoch": 685} {"train_loss": -10.038436889648438, "global_step": 115242, "epoch": 685} {"train_loss": -10.219646453857422, "global_step": 115243, "epoch": 685} {"train_loss": -9.987541198730469, "global_step": 115244, "epoch": 685} {"train_loss": -10.062335968017578, "global_step": 115245, "epoch": 685} {"train_loss": -9.704268455505371, "global_step": 115246, "epoch": 685} {"train_loss": -10.00699900445484, "global_step": 115247, "epoch": 685, "val_loss": 213511.3125, "train_action_mse_error": 7.700716972351074} {"train_loss": -9.719192504882812, "global_step": 115248, "epoch": 686} {"train_loss": -9.510623931884766, "global_step": 115249, "epoch": 686} {"train_loss": -9.982686996459961, "global_step": 115250, "epoch": 686} {"train_loss": -9.647676467895508, "global_step": 115251, "epoch": 686} {"train_loss": -9.86760425567627, "global_step": 115252, "epoch": 686} {"train_loss": -9.986045837402344, "global_step": 115253, "epoch": 686} {"train_loss": -9.90538501739502, "global_step": 115254, "epoch": 686} {"train_loss": -9.593732833862305, "global_step": 115255, "epoch": 686} {"train_loss": -9.821006774902344, "global_step": 115256, "epoch": 686} {"train_loss": -9.281635284423828, "global_step": 115257, "epoch": 686} {"train_loss": -9.984432220458984, "global_step": 115258, "epoch": 686} {"train_loss": -9.637518882751465, "global_step": 115259, "epoch": 686} {"train_loss": -9.894697189331055, "global_step": 115260, "epoch": 686} {"train_loss": -10.005435943603516, "global_step": 115261, "epoch": 686} {"train_loss": -10.033071517944336, "global_step": 115262, "epoch": 686} {"train_loss": -9.89853286743164, "global_step": 115263, "epoch": 686} {"train_loss": -9.774551391601562, "global_step": 115264, "epoch": 686} {"train_loss": -9.864830017089844, "global_step": 115265, "epoch": 686} {"train_loss": -10.078849792480469, "global_step": 115266, "epoch": 686} {"train_loss": -9.831271171569824, "global_step": 115267, "epoch": 686} {"train_loss": -9.961532592773438, "global_step": 115268, "epoch": 686} {"train_loss": -9.933773040771484, "global_step": 115269, "epoch": 686} {"train_loss": -9.924488067626953, "global_step": 115270, "epoch": 686} {"train_loss": -10.056657791137695, "global_step": 115271, "epoch": 686} {"train_loss": -10.074283599853516, "global_step": 115272, "epoch": 686} {"train_loss": -9.642948150634766, "global_step": 115273, "epoch": 686} {"train_loss": -9.926048278808594, "global_step": 115274, "epoch": 686} {"train_loss": -9.773260116577148, "global_step": 115275, "epoch": 686} {"train_loss": -9.82763957977295, "global_step": 115276, "epoch": 686} {"train_loss": -10.163213729858398, "global_step": 115277, "epoch": 686} {"train_loss": -10.010939598083496, "global_step": 115278, "epoch": 686} {"train_loss": -10.013385772705078, "global_step": 115279, "epoch": 686} {"train_loss": -9.81344223022461, "global_step": 115280, "epoch": 686} {"train_loss": -9.887062072753906, "global_step": 115281, "epoch": 686} {"train_loss": -10.104238510131836, "global_step": 115282, "epoch": 686} {"train_loss": -10.234955787658691, "global_step": 115283, "epoch": 686} {"train_loss": -9.996248245239258, "global_step": 115284, "epoch": 686} {"train_loss": -10.015301704406738, "global_step": 115285, "epoch": 686} {"train_loss": -10.156882286071777, "global_step": 115286, "epoch": 686} {"train_loss": -9.938411712646484, "global_step": 115287, "epoch": 686} {"train_loss": -10.073068618774414, "global_step": 115288, "epoch": 686} {"train_loss": -10.204090118408203, "global_step": 115289, "epoch": 686} {"train_loss": -10.25045394897461, "global_step": 115290, "epoch": 686} {"train_loss": -9.980480194091797, "global_step": 115291, "epoch": 686} {"train_loss": -10.150200843811035, "global_step": 115292, "epoch": 686} {"train_loss": -9.958768844604492, "global_step": 115293, "epoch": 686} {"train_loss": -10.038318634033203, "global_step": 115294, "epoch": 686} {"train_loss": -9.813791275024414, "global_step": 115295, "epoch": 686} {"train_loss": -9.890965461730957, "global_step": 115296, "epoch": 686} {"train_loss": -10.196343421936035, "global_step": 115297, "epoch": 686} {"train_loss": -10.05613899230957, "global_step": 115298, "epoch": 686} {"train_loss": -10.124916076660156, "global_step": 115299, "epoch": 686} {"train_loss": -9.99367618560791, "global_step": 115300, "epoch": 686} {"train_loss": -9.609333992004395, "global_step": 115301, "epoch": 686} {"train_loss": -10.429180145263672, "global_step": 115302, "epoch": 686} {"train_loss": -9.491384506225586, "global_step": 115303, "epoch": 686} {"train_loss": -9.929232597351074, "global_step": 115304, "epoch": 686} {"train_loss": -9.759891510009766, "global_step": 115305, "epoch": 686} {"train_loss": -9.970562934875488, "global_step": 115306, "epoch": 686} {"train_loss": -9.83881950378418, "global_step": 115307, "epoch": 686} {"train_loss": -9.558233261108398, "global_step": 115308, "epoch": 686} {"train_loss": -10.012954711914062, "global_step": 115309, "epoch": 686} {"train_loss": -9.64676284790039, "global_step": 115310, "epoch": 686} {"train_loss": -9.605819702148438, "global_step": 115311, "epoch": 686} {"train_loss": -9.808404922485352, "global_step": 115312, "epoch": 686} {"train_loss": -9.880521774291992, "global_step": 115313, "epoch": 686} {"train_loss": -9.466124534606934, "global_step": 115314, "epoch": 686} {"train_loss": -9.923385620117188, "global_step": 115315, "epoch": 686} {"train_loss": -9.848798751831055, "global_step": 115316, "epoch": 686} {"train_loss": -9.827594757080078, "global_step": 115317, "epoch": 686} {"train_loss": -9.795555114746094, "global_step": 115318, "epoch": 686} {"train_loss": -9.745868682861328, "global_step": 115319, "epoch": 686} {"train_loss": -10.053657531738281, "global_step": 115320, "epoch": 686} {"train_loss": -9.288247108459473, "global_step": 115321, "epoch": 686} {"train_loss": -9.861444473266602, "global_step": 115322, "epoch": 686} {"train_loss": -9.995765686035156, "global_step": 115323, "epoch": 686} {"train_loss": -9.918485641479492, "global_step": 115324, "epoch": 686} {"train_loss": -10.037454605102539, "global_step": 115325, "epoch": 686} {"train_loss": -9.921249389648438, "global_step": 115326, "epoch": 686} {"train_loss": -9.884998321533203, "global_step": 115327, "epoch": 686} {"train_loss": -9.904836654663086, "global_step": 115328, "epoch": 686} {"train_loss": -10.020071029663086, "global_step": 115329, "epoch": 686} {"train_loss": -9.936847686767578, "global_step": 115330, "epoch": 686} {"train_loss": -9.853462219238281, "global_step": 115331, "epoch": 686} {"train_loss": -10.04005241394043, "global_step": 115332, "epoch": 686} {"train_loss": -9.924978256225586, "global_step": 115333, "epoch": 686} {"train_loss": -10.005104064941406, "global_step": 115334, "epoch": 686} {"train_loss": -10.166604042053223, "global_step": 115335, "epoch": 686} {"train_loss": -10.174470901489258, "global_step": 115336, "epoch": 686} {"train_loss": -9.995284080505371, "global_step": 115337, "epoch": 686} {"train_loss": -10.366315841674805, "global_step": 115338, "epoch": 686} {"train_loss": -10.10922908782959, "global_step": 115339, "epoch": 686} {"train_loss": -10.359331130981445, "global_step": 115340, "epoch": 686} {"train_loss": -10.053173065185547, "global_step": 115341, "epoch": 686} {"train_loss": -10.113572120666504, "global_step": 115342, "epoch": 686} {"train_loss": -10.11324691772461, "global_step": 115343, "epoch": 686} {"train_loss": -10.120476722717285, "global_step": 115344, "epoch": 686} {"train_loss": -10.392732620239258, "global_step": 115345, "epoch": 686} {"train_loss": -10.308089256286621, "global_step": 115346, "epoch": 686} {"train_loss": -9.978338241577148, "global_step": 115347, "epoch": 686} {"train_loss": -10.159948348999023, "global_step": 115348, "epoch": 686} {"train_loss": -10.156047821044922, "global_step": 115349, "epoch": 686} {"train_loss": -10.072744369506836, "global_step": 115350, "epoch": 686} {"train_loss": -10.457000732421875, "global_step": 115351, "epoch": 686} {"train_loss": -10.202832221984863, "global_step": 115352, "epoch": 686} {"train_loss": -10.115126609802246, "global_step": 115353, "epoch": 686} {"train_loss": -10.130149841308594, "global_step": 115354, "epoch": 686} {"train_loss": -10.208616256713867, "global_step": 115355, "epoch": 686} {"train_loss": -10.329792022705078, "global_step": 115356, "epoch": 686} {"train_loss": -10.23630428314209, "global_step": 115357, "epoch": 686} {"train_loss": -10.245306015014648, "global_step": 115358, "epoch": 686} {"train_loss": -10.202985763549805, "global_step": 115359, "epoch": 686} {"train_loss": -10.154163360595703, "global_step": 115360, "epoch": 686} {"train_loss": -10.438187599182129, "global_step": 115361, "epoch": 686} {"train_loss": -9.888758659362793, "global_step": 115362, "epoch": 686} {"train_loss": -10.317789077758789, "global_step": 115363, "epoch": 686} {"train_loss": -10.083074569702148, "global_step": 115364, "epoch": 686} {"train_loss": -9.962230682373047, "global_step": 115365, "epoch": 686} {"train_loss": -10.21422004699707, "global_step": 115366, "epoch": 686} {"train_loss": -10.056438446044922, "global_step": 115367, "epoch": 686} {"train_loss": -9.868738174438477, "global_step": 115368, "epoch": 686} {"train_loss": -9.993061065673828, "global_step": 115369, "epoch": 686} {"train_loss": -10.279176712036133, "global_step": 115370, "epoch": 686} {"train_loss": -10.239885330200195, "global_step": 115371, "epoch": 686} {"train_loss": -9.941980361938477, "global_step": 115372, "epoch": 686} {"train_loss": -10.334121704101562, "global_step": 115373, "epoch": 686} {"train_loss": -9.990961074829102, "global_step": 115374, "epoch": 686} {"train_loss": -10.26024341583252, "global_step": 115375, "epoch": 686} {"train_loss": -10.299829483032227, "global_step": 115376, "epoch": 686} {"train_loss": -10.124553680419922, "global_step": 115377, "epoch": 686} {"train_loss": -10.15041732788086, "global_step": 115378, "epoch": 686} {"train_loss": -9.876570701599121, "global_step": 115379, "epoch": 686} {"train_loss": -10.133666038513184, "global_step": 115380, "epoch": 686} {"train_loss": -10.008125305175781, "global_step": 115381, "epoch": 686} {"train_loss": -10.103468894958496, "global_step": 115382, "epoch": 686} {"train_loss": -9.974746704101562, "global_step": 115383, "epoch": 686} {"train_loss": -9.874797821044922, "global_step": 115384, "epoch": 686} {"train_loss": -9.990084648132324, "global_step": 115385, "epoch": 686} {"train_loss": -10.199432373046875, "global_step": 115386, "epoch": 686} {"train_loss": -10.19911003112793, "global_step": 115387, "epoch": 686} {"train_loss": -9.977551460266113, "global_step": 115388, "epoch": 686} {"train_loss": -9.933067321777344, "global_step": 115389, "epoch": 686} {"train_loss": -10.095475196838379, "global_step": 115390, "epoch": 686} {"train_loss": -9.87307357788086, "global_step": 115391, "epoch": 686} {"train_loss": -9.847654342651367, "global_step": 115392, "epoch": 686} {"train_loss": -9.852336883544922, "global_step": 115393, "epoch": 686} {"train_loss": -9.612020492553711, "global_step": 115394, "epoch": 686} {"train_loss": -9.981467247009277, "global_step": 115395, "epoch": 686} {"train_loss": -9.748481750488281, "global_step": 115396, "epoch": 686} {"train_loss": -10.119169235229492, "global_step": 115397, "epoch": 686} {"train_loss": -9.98147964477539, "global_step": 115398, "epoch": 686} {"train_loss": -9.883623123168945, "global_step": 115399, "epoch": 686} {"train_loss": -9.661582946777344, "global_step": 115400, "epoch": 686} {"train_loss": -9.87155532836914, "global_step": 115401, "epoch": 686} {"train_loss": -9.827656745910645, "global_step": 115402, "epoch": 686} {"train_loss": -10.042104721069336, "global_step": 115403, "epoch": 686} {"train_loss": -9.851335525512695, "global_step": 115404, "epoch": 686} {"train_loss": -9.950095176696777, "global_step": 115405, "epoch": 686} {"train_loss": -9.928045272827148, "global_step": 115406, "epoch": 686} {"train_loss": -9.033559799194336, "global_step": 115407, "epoch": 686} {"train_loss": -10.111013412475586, "global_step": 115408, "epoch": 686} {"train_loss": -9.308368682861328, "global_step": 115409, "epoch": 686} {"train_loss": -10.020805358886719, "global_step": 115410, "epoch": 686} {"train_loss": -9.251869201660156, "global_step": 115411, "epoch": 686} {"train_loss": -10.249699592590332, "global_step": 115412, "epoch": 686} {"train_loss": -9.51077651977539, "global_step": 115413, "epoch": 686} {"train_loss": -9.875123977661133, "global_step": 115414, "epoch": 686} {"train_loss": -9.966589836847215, "global_step": 115415, "epoch": 686, "val_loss": 215049.484375} {"train_loss": -9.876409530639648, "global_step": 115416, "epoch": 687} {"train_loss": -9.624347686767578, "global_step": 115417, "epoch": 687} {"train_loss": -9.9501314163208, "global_step": 115418, "epoch": 687} {"train_loss": -9.736204147338867, "global_step": 115419, "epoch": 687} {"train_loss": -10.01076602935791, "global_step": 115420, "epoch": 687} {"train_loss": -10.101673126220703, "global_step": 115421, "epoch": 687} {"train_loss": -9.844085693359375, "global_step": 115422, "epoch": 687} {"train_loss": -9.851210594177246, "global_step": 115423, "epoch": 687} {"train_loss": -9.898361206054688, "global_step": 115424, "epoch": 687} {"train_loss": -10.134319305419922, "global_step": 115425, "epoch": 687} {"train_loss": -10.075750350952148, "global_step": 115426, "epoch": 687} {"train_loss": -10.170053482055664, "global_step": 115427, "epoch": 687} {"train_loss": -9.945211410522461, "global_step": 115428, "epoch": 687} {"train_loss": -10.270718574523926, "global_step": 115429, "epoch": 687} {"train_loss": -9.806593894958496, "global_step": 115430, "epoch": 687} {"train_loss": -10.236234664916992, "global_step": 115431, "epoch": 687} {"train_loss": -9.820873260498047, "global_step": 115432, "epoch": 687} {"train_loss": -10.312385559082031, "global_step": 115433, "epoch": 687} {"train_loss": -9.83388900756836, "global_step": 115434, "epoch": 687} {"train_loss": -10.30573844909668, "global_step": 115435, "epoch": 687} {"train_loss": -9.863574981689453, "global_step": 115436, "epoch": 687} {"train_loss": -10.258888244628906, "global_step": 115437, "epoch": 687} {"train_loss": -9.98906135559082, "global_step": 115438, "epoch": 687} {"train_loss": -10.218735694885254, "global_step": 115439, "epoch": 687} {"train_loss": -9.942058563232422, "global_step": 115440, "epoch": 687} {"train_loss": -10.025634765625, "global_step": 115441, "epoch": 687} {"train_loss": -10.043632507324219, "global_step": 115442, "epoch": 687} {"train_loss": -9.957908630371094, "global_step": 115443, "epoch": 687} {"train_loss": -10.122093200683594, "global_step": 115444, "epoch": 687} {"train_loss": -9.911683082580566, "global_step": 115445, "epoch": 687} {"train_loss": -10.28289794921875, "global_step": 115446, "epoch": 687} {"train_loss": -10.117927551269531, "global_step": 115447, "epoch": 687} {"train_loss": -10.079444885253906, "global_step": 115448, "epoch": 687} {"train_loss": -10.34383773803711, "global_step": 115449, "epoch": 687} {"train_loss": -10.061902046203613, "global_step": 115450, "epoch": 687} {"train_loss": -10.293656349182129, "global_step": 115451, "epoch": 687} {"train_loss": -10.272647857666016, "global_step": 115452, "epoch": 687} {"train_loss": -10.09604263305664, "global_step": 115453, "epoch": 687} {"train_loss": -10.139442443847656, "global_step": 115454, "epoch": 687} {"train_loss": -9.94278621673584, "global_step": 115455, "epoch": 687} {"train_loss": -10.113944053649902, "global_step": 115456, "epoch": 687} {"train_loss": -10.383672714233398, "global_step": 115457, "epoch": 687} {"train_loss": -10.211200714111328, "global_step": 115458, "epoch": 687} {"train_loss": -10.442790985107422, "global_step": 115459, "epoch": 687} {"train_loss": -10.517091751098633, "global_step": 115460, "epoch": 687} {"train_loss": -10.318790435791016, "global_step": 115461, "epoch": 687} {"train_loss": -10.212736129760742, "global_step": 115462, "epoch": 687} {"train_loss": -10.186369895935059, "global_step": 115463, "epoch": 687} {"train_loss": -10.145103454589844, "global_step": 115464, "epoch": 687} {"train_loss": -9.938272476196289, "global_step": 115465, "epoch": 687} {"train_loss": -10.079546928405762, "global_step": 115466, "epoch": 687} {"train_loss": -10.4031982421875, "global_step": 115467, "epoch": 687} {"train_loss": -9.91024398803711, "global_step": 115468, "epoch": 687} {"train_loss": -9.780115127563477, "global_step": 115469, "epoch": 687} {"train_loss": -10.199594497680664, "global_step": 115470, "epoch": 687} {"train_loss": -10.108320236206055, "global_step": 115471, "epoch": 687} {"train_loss": -10.072423934936523, "global_step": 115472, "epoch": 687} {"train_loss": -9.582343101501465, "global_step": 115473, "epoch": 687} {"train_loss": -9.968849182128906, "global_step": 115474, "epoch": 687} {"train_loss": -9.926979064941406, "global_step": 115475, "epoch": 687} {"train_loss": -9.882665634155273, "global_step": 115476, "epoch": 687} {"train_loss": -10.042770385742188, "global_step": 115477, "epoch": 687} {"train_loss": -10.140851020812988, "global_step": 115478, "epoch": 687} {"train_loss": -9.897982597351074, "global_step": 115479, "epoch": 687} {"train_loss": -10.124320983886719, "global_step": 115480, "epoch": 687} {"train_loss": -9.910662651062012, "global_step": 115481, "epoch": 687} {"train_loss": -10.101070404052734, "global_step": 115482, "epoch": 687} {"train_loss": -9.770471572875977, "global_step": 115483, "epoch": 687} {"train_loss": -10.019052505493164, "global_step": 115484, "epoch": 687} {"train_loss": -9.684099197387695, "global_step": 115485, "epoch": 687} {"train_loss": -9.906440734863281, "global_step": 115486, "epoch": 687} {"train_loss": -9.768033981323242, "global_step": 115487, "epoch": 687} {"train_loss": -9.882585525512695, "global_step": 115488, "epoch": 687} {"train_loss": -10.118904113769531, "global_step": 115489, "epoch": 687} {"train_loss": -9.877847671508789, "global_step": 115490, "epoch": 687} {"train_loss": -10.088665008544922, "global_step": 115491, "epoch": 687} {"train_loss": -9.637996673583984, "global_step": 115492, "epoch": 687} {"train_loss": -9.932966232299805, "global_step": 115493, "epoch": 687} {"train_loss": -9.851581573486328, "global_step": 115494, "epoch": 687} {"train_loss": -9.871184349060059, "global_step": 115495, "epoch": 687} {"train_loss": -9.584174156188965, "global_step": 115496, "epoch": 687} {"train_loss": -9.865188598632812, "global_step": 115497, "epoch": 687} {"train_loss": -9.66912841796875, "global_step": 115498, "epoch": 687} {"train_loss": -9.927358627319336, "global_step": 115499, "epoch": 687} {"train_loss": -10.042312622070312, "global_step": 115500, "epoch": 687} {"train_loss": -9.964849472045898, "global_step": 115501, "epoch": 687} {"train_loss": -10.22323989868164, "global_step": 115502, "epoch": 687} {"train_loss": -10.236515045166016, "global_step": 115503, "epoch": 687} {"train_loss": -10.065267562866211, "global_step": 115504, "epoch": 687} {"train_loss": -10.052068710327148, "global_step": 115505, "epoch": 687} {"train_loss": -10.056417465209961, "global_step": 115506, "epoch": 687} {"train_loss": -10.175403594970703, "global_step": 115507, "epoch": 687} {"train_loss": -9.886486053466797, "global_step": 115508, "epoch": 687} {"train_loss": -10.355454444885254, "global_step": 115509, "epoch": 687} {"train_loss": -10.111896514892578, "global_step": 115510, "epoch": 687} {"train_loss": -10.081411361694336, "global_step": 115511, "epoch": 687} {"train_loss": -10.291046142578125, "global_step": 115512, "epoch": 687} {"train_loss": -10.120377540588379, "global_step": 115513, "epoch": 687} {"train_loss": -10.212636947631836, "global_step": 115514, "epoch": 687} {"train_loss": -9.766093254089355, "global_step": 115515, "epoch": 687} {"train_loss": -10.026788711547852, "global_step": 115516, "epoch": 687} {"train_loss": -9.99538803100586, "global_step": 115517, "epoch": 687} {"train_loss": -10.003974914550781, "global_step": 115518, "epoch": 687} {"train_loss": -9.875001907348633, "global_step": 115519, "epoch": 687} {"train_loss": -10.186241149902344, "global_step": 115520, "epoch": 687} {"train_loss": -10.242361068725586, "global_step": 115521, "epoch": 687} {"train_loss": -10.02078628540039, "global_step": 115522, "epoch": 687} {"train_loss": -10.137378692626953, "global_step": 115523, "epoch": 687} {"train_loss": -9.925714492797852, "global_step": 115524, "epoch": 687} {"train_loss": -10.057347297668457, "global_step": 115525, "epoch": 687} {"train_loss": -10.140172004699707, "global_step": 115526, "epoch": 687} {"train_loss": -10.316791534423828, "global_step": 115527, "epoch": 687} {"train_loss": -10.253625869750977, "global_step": 115528, "epoch": 687} {"train_loss": -10.084864616394043, "global_step": 115529, "epoch": 687} {"train_loss": -10.200721740722656, "global_step": 115530, "epoch": 687} {"train_loss": -10.180699348449707, "global_step": 115531, "epoch": 687} {"train_loss": -10.399160385131836, "global_step": 115532, "epoch": 687} {"train_loss": -10.190302848815918, "global_step": 115533, "epoch": 687} {"train_loss": -9.992000579833984, "global_step": 115534, "epoch": 687} {"train_loss": -9.676849365234375, "global_step": 115535, "epoch": 687} {"train_loss": -9.926932334899902, "global_step": 115536, "epoch": 687} {"train_loss": -9.908403396606445, "global_step": 115537, "epoch": 687} {"train_loss": -9.934830665588379, "global_step": 115538, "epoch": 687} {"train_loss": -9.531647682189941, "global_step": 115539, "epoch": 687} {"train_loss": -9.96088981628418, "global_step": 115540, "epoch": 687} {"train_loss": -9.677356719970703, "global_step": 115541, "epoch": 687} {"train_loss": -9.57013988494873, "global_step": 115542, "epoch": 687} {"train_loss": -10.2230224609375, "global_step": 115543, "epoch": 687} {"train_loss": -9.491780281066895, "global_step": 115544, "epoch": 687} {"train_loss": -10.069408416748047, "global_step": 115545, "epoch": 687} {"train_loss": -9.711567878723145, "global_step": 115546, "epoch": 687} {"train_loss": -9.73535442352295, "global_step": 115547, "epoch": 687} {"train_loss": -9.87716293334961, "global_step": 115548, "epoch": 687} {"train_loss": -9.469558715820312, "global_step": 115549, "epoch": 687} {"train_loss": -9.632972717285156, "global_step": 115550, "epoch": 687} {"train_loss": -9.63496208190918, "global_step": 115551, "epoch": 687} {"train_loss": -9.917594909667969, "global_step": 115552, "epoch": 687} {"train_loss": -9.545044898986816, "global_step": 115553, "epoch": 687} {"train_loss": -10.064895629882812, "global_step": 115554, "epoch": 687} {"train_loss": -9.612096786499023, "global_step": 115555, "epoch": 687} {"train_loss": -9.817460060119629, "global_step": 115556, "epoch": 687} {"train_loss": -9.761393547058105, "global_step": 115557, "epoch": 687} {"train_loss": -9.855195999145508, "global_step": 115558, "epoch": 687} {"train_loss": -9.96320629119873, "global_step": 115559, "epoch": 687} {"train_loss": -10.070013046264648, "global_step": 115560, "epoch": 687} {"train_loss": -9.820585250854492, "global_step": 115561, "epoch": 687} {"train_loss": -9.737524032592773, "global_step": 115562, "epoch": 687} {"train_loss": -9.805826187133789, "global_step": 115563, "epoch": 687} {"train_loss": -10.024974822998047, "global_step": 115564, "epoch": 687} {"train_loss": -9.881914138793945, "global_step": 115565, "epoch": 687} {"train_loss": -10.066131591796875, "global_step": 115566, "epoch": 687} {"train_loss": -9.658918380737305, "global_step": 115567, "epoch": 687} {"train_loss": -10.025032043457031, "global_step": 115568, "epoch": 687} {"train_loss": -9.627679824829102, "global_step": 115569, "epoch": 687} {"train_loss": -9.945099830627441, "global_step": 115570, "epoch": 687} {"train_loss": -9.717140197753906, "global_step": 115571, "epoch": 687} {"train_loss": -9.875448226928711, "global_step": 115572, "epoch": 687} {"train_loss": -9.664094924926758, "global_step": 115573, "epoch": 687} {"train_loss": -10.208402633666992, "global_step": 115574, "epoch": 687} {"train_loss": -9.878633499145508, "global_step": 115575, "epoch": 687} {"train_loss": -9.957963943481445, "global_step": 115576, "epoch": 687} {"train_loss": -10.04374885559082, "global_step": 115577, "epoch": 687} {"train_loss": -10.0105562210083, "global_step": 115578, "epoch": 687} {"train_loss": -10.170954704284668, "global_step": 115579, "epoch": 687} {"train_loss": -10.201726913452148, "global_step": 115580, "epoch": 687} {"train_loss": -10.101362228393555, "global_step": 115581, "epoch": 687} {"train_loss": -9.851700782775879, "global_step": 115582, "epoch": 687} {"train_loss": -9.992272223745074, "global_step": 115583, "epoch": 687, "val_loss": 214204.859375} {"train_loss": -10.309173583984375, "global_step": 115584, "epoch": 688} {"train_loss": -10.085926055908203, "global_step": 115585, "epoch": 688} {"train_loss": -10.069528579711914, "global_step": 115586, "epoch": 688} {"train_loss": -10.26064682006836, "global_step": 115587, "epoch": 688} {"train_loss": -10.276433944702148, "global_step": 115588, "epoch": 688} {"train_loss": -10.166500091552734, "global_step": 115589, "epoch": 688} {"train_loss": -10.22304916381836, "global_step": 115590, "epoch": 688} {"train_loss": -10.042154312133789, "global_step": 115591, "epoch": 688} {"train_loss": -10.231484413146973, "global_step": 115592, "epoch": 688} {"train_loss": -10.098577499389648, "global_step": 115593, "epoch": 688} {"train_loss": -10.375553131103516, "global_step": 115594, "epoch": 688} {"train_loss": -10.001996994018555, "global_step": 115595, "epoch": 688} {"train_loss": -10.256233215332031, "global_step": 115596, "epoch": 688} {"train_loss": -9.97580337524414, "global_step": 115597, "epoch": 688} {"train_loss": -10.233388900756836, "global_step": 115598, "epoch": 688} {"train_loss": -10.189149856567383, "global_step": 115599, "epoch": 688} {"train_loss": -9.829154014587402, "global_step": 115600, "epoch": 688} {"train_loss": -10.32423210144043, "global_step": 115601, "epoch": 688} {"train_loss": -10.249847412109375, "global_step": 115602, "epoch": 688} {"train_loss": -10.217156410217285, "global_step": 115603, "epoch": 688} {"train_loss": -10.065729141235352, "global_step": 115604, "epoch": 688} {"train_loss": -10.19269847869873, "global_step": 115605, "epoch": 688} {"train_loss": -10.318967819213867, "global_step": 115606, "epoch": 688} {"train_loss": -9.903545379638672, "global_step": 115607, "epoch": 688} {"train_loss": -10.397832870483398, "global_step": 115608, "epoch": 688} {"train_loss": -9.975963592529297, "global_step": 115609, "epoch": 688} {"train_loss": -10.317610740661621, "global_step": 115610, "epoch": 688} {"train_loss": -10.345812797546387, "global_step": 115611, "epoch": 688} {"train_loss": -10.14448356628418, "global_step": 115612, "epoch": 688} {"train_loss": -10.119864463806152, "global_step": 115613, "epoch": 688} {"train_loss": -10.348066329956055, "global_step": 115614, "epoch": 688} {"train_loss": -10.373750686645508, "global_step": 115615, "epoch": 688} {"train_loss": -10.352800369262695, "global_step": 115616, "epoch": 688} {"train_loss": -10.056340217590332, "global_step": 115617, "epoch": 688} {"train_loss": -10.23546028137207, "global_step": 115618, "epoch": 688} {"train_loss": -10.446382522583008, "global_step": 115619, "epoch": 688} {"train_loss": -10.315572738647461, "global_step": 115620, "epoch": 688} {"train_loss": -9.659875869750977, "global_step": 115621, "epoch": 688} {"train_loss": -10.101274490356445, "global_step": 115622, "epoch": 688} {"train_loss": -10.27983570098877, "global_step": 115623, "epoch": 688} {"train_loss": -9.528440475463867, "global_step": 115624, "epoch": 688} {"train_loss": -10.379106521606445, "global_step": 115625, "epoch": 688} {"train_loss": -9.619775772094727, "global_step": 115626, "epoch": 688} {"train_loss": -10.1674165725708, "global_step": 115627, "epoch": 688} {"train_loss": -9.92892837524414, "global_step": 115628, "epoch": 688} {"train_loss": -10.056390762329102, "global_step": 115629, "epoch": 688} {"train_loss": -10.280906677246094, "global_step": 115630, "epoch": 688} {"train_loss": -9.77591323852539, "global_step": 115631, "epoch": 688} {"train_loss": -9.859429359436035, "global_step": 115632, "epoch": 688} {"train_loss": -9.730047225952148, "global_step": 115633, "epoch": 688} {"train_loss": -10.379351615905762, "global_step": 115634, "epoch": 688} {"train_loss": -9.744562149047852, "global_step": 115635, "epoch": 688} {"train_loss": -10.091972351074219, "global_step": 115636, "epoch": 688} {"train_loss": -10.224102020263672, "global_step": 115637, "epoch": 688} {"train_loss": -9.948853492736816, "global_step": 115638, "epoch": 688} {"train_loss": -9.951601028442383, "global_step": 115639, "epoch": 688} {"train_loss": -9.884066581726074, "global_step": 115640, "epoch": 688} {"train_loss": -10.092214584350586, "global_step": 115641, "epoch": 688} {"train_loss": -9.983148574829102, "global_step": 115642, "epoch": 688} {"train_loss": -10.201723098754883, "global_step": 115643, "epoch": 688} {"train_loss": -10.250245094299316, "global_step": 115644, "epoch": 688} {"train_loss": -9.996318817138672, "global_step": 115645, "epoch": 688} {"train_loss": -9.91417407989502, "global_step": 115646, "epoch": 688} {"train_loss": -9.827817916870117, "global_step": 115647, "epoch": 688} {"train_loss": -10.016936302185059, "global_step": 115648, "epoch": 688} {"train_loss": -10.235450744628906, "global_step": 115649, "epoch": 688} {"train_loss": -9.34925365447998, "global_step": 115650, "epoch": 688} {"train_loss": -10.12559986114502, "global_step": 115651, "epoch": 688} {"train_loss": -9.938554763793945, "global_step": 115652, "epoch": 688} {"train_loss": -9.914852142333984, "global_step": 115653, "epoch": 688} {"train_loss": -10.040809631347656, "global_step": 115654, "epoch": 688} {"train_loss": -9.952022552490234, "global_step": 115655, "epoch": 688} {"train_loss": -10.292980194091797, "global_step": 115656, "epoch": 688} {"train_loss": -9.97395133972168, "global_step": 115657, "epoch": 688} {"train_loss": -10.273845672607422, "global_step": 115658, "epoch": 688} {"train_loss": -9.870721817016602, "global_step": 115659, "epoch": 688} {"train_loss": -10.202499389648438, "global_step": 115660, "epoch": 688} {"train_loss": -10.261449813842773, "global_step": 115661, "epoch": 688} {"train_loss": -10.247869491577148, "global_step": 115662, "epoch": 688} {"train_loss": -10.178718566894531, "global_step": 115663, "epoch": 688} {"train_loss": -10.196981430053711, "global_step": 115664, "epoch": 688} {"train_loss": -10.268593788146973, "global_step": 115665, "epoch": 688} {"train_loss": -10.082008361816406, "global_step": 115666, "epoch": 688} {"train_loss": -10.165992736816406, "global_step": 115667, "epoch": 688} {"train_loss": -10.070192337036133, "global_step": 115668, "epoch": 688} {"train_loss": -9.835355758666992, "global_step": 115669, "epoch": 688} {"train_loss": -10.16201114654541, "global_step": 115670, "epoch": 688} {"train_loss": -10.105331420898438, "global_step": 115671, "epoch": 688} {"train_loss": -10.110261917114258, "global_step": 115672, "epoch": 688} {"train_loss": -9.914860725402832, "global_step": 115673, "epoch": 688} {"train_loss": -10.222376823425293, "global_step": 115674, "epoch": 688} {"train_loss": -9.94703483581543, "global_step": 115675, "epoch": 688} {"train_loss": -9.873887062072754, "global_step": 115676, "epoch": 688} {"train_loss": -10.11104965209961, "global_step": 115677, "epoch": 688} {"train_loss": -9.47223949432373, "global_step": 115678, "epoch": 688} {"train_loss": -10.066129684448242, "global_step": 115679, "epoch": 688} {"train_loss": -9.948739051818848, "global_step": 115680, "epoch": 688} {"train_loss": -10.049905776977539, "global_step": 115681, "epoch": 688} {"train_loss": -10.179948806762695, "global_step": 115682, "epoch": 688} {"train_loss": -9.926048278808594, "global_step": 115683, "epoch": 688} {"train_loss": -10.188203811645508, "global_step": 115684, "epoch": 688} {"train_loss": -9.8701171875, "global_step": 115685, "epoch": 688} {"train_loss": -9.930635452270508, "global_step": 115686, "epoch": 688} {"train_loss": -9.6981782913208, "global_step": 115687, "epoch": 688} {"train_loss": -10.260366439819336, "global_step": 115688, "epoch": 688} {"train_loss": -10.276397705078125, "global_step": 115689, "epoch": 688} {"train_loss": -10.239252090454102, "global_step": 115690, "epoch": 688} {"train_loss": -10.191305160522461, "global_step": 115691, "epoch": 688} {"train_loss": -9.907722473144531, "global_step": 115692, "epoch": 688} {"train_loss": -10.063577651977539, "global_step": 115693, "epoch": 688} {"train_loss": -10.078805923461914, "global_step": 115694, "epoch": 688} {"train_loss": -10.1138277053833, "global_step": 115695, "epoch": 688} {"train_loss": -10.146268844604492, "global_step": 115696, "epoch": 688} {"train_loss": -10.05392074584961, "global_step": 115697, "epoch": 688} {"train_loss": -10.06203842163086, "global_step": 115698, "epoch": 688} {"train_loss": -9.964750289916992, "global_step": 115699, "epoch": 688} {"train_loss": -10.28898811340332, "global_step": 115700, "epoch": 688} {"train_loss": -9.865129470825195, "global_step": 115701, "epoch": 688} {"train_loss": -10.152458190917969, "global_step": 115702, "epoch": 688} {"train_loss": -10.142974853515625, "global_step": 115703, "epoch": 688} {"train_loss": -10.075614929199219, "global_step": 115704, "epoch": 688} {"train_loss": -10.305098533630371, "global_step": 115705, "epoch": 688} {"train_loss": -10.12239933013916, "global_step": 115706, "epoch": 688} {"train_loss": -10.00473403930664, "global_step": 115707, "epoch": 688} {"train_loss": -9.984880447387695, "global_step": 115708, "epoch": 688} {"train_loss": -10.167793273925781, "global_step": 115709, "epoch": 688} {"train_loss": -10.255936622619629, "global_step": 115710, "epoch": 688} {"train_loss": -10.20484733581543, "global_step": 115711, "epoch": 688} {"train_loss": -10.235897064208984, "global_step": 115712, "epoch": 688} {"train_loss": -9.962778091430664, "global_step": 115713, "epoch": 688} {"train_loss": -9.974834442138672, "global_step": 115714, "epoch": 688} {"train_loss": -9.993144989013672, "global_step": 115715, "epoch": 688} {"train_loss": -9.952964782714844, "global_step": 115716, "epoch": 688} {"train_loss": -9.987309455871582, "global_step": 115717, "epoch": 688} {"train_loss": -10.051694869995117, "global_step": 115718, "epoch": 688} {"train_loss": -9.790458679199219, "global_step": 115719, "epoch": 688} {"train_loss": -10.111547470092773, "global_step": 115720, "epoch": 688} {"train_loss": -9.818520545959473, "global_step": 115721, "epoch": 688} {"train_loss": -9.973143577575684, "global_step": 115722, "epoch": 688} {"train_loss": -9.765620231628418, "global_step": 115723, "epoch": 688} {"train_loss": -9.77953052520752, "global_step": 115724, "epoch": 688} {"train_loss": -10.038106918334961, "global_step": 115725, "epoch": 688} {"train_loss": -9.714714050292969, "global_step": 115726, "epoch": 688} {"train_loss": -10.001626968383789, "global_step": 115727, "epoch": 688} {"train_loss": -10.129650115966797, "global_step": 115728, "epoch": 688} {"train_loss": -9.898488998413086, "global_step": 115729, "epoch": 688} {"train_loss": -9.881170272827148, "global_step": 115730, "epoch": 688} {"train_loss": -9.959782600402832, "global_step": 115731, "epoch": 688} {"train_loss": -10.11499309539795, "global_step": 115732, "epoch": 688} {"train_loss": -10.033605575561523, "global_step": 115733, "epoch": 688} {"train_loss": -10.078219413757324, "global_step": 115734, "epoch": 688} {"train_loss": -9.874824523925781, "global_step": 115735, "epoch": 688} {"train_loss": -9.943164825439453, "global_step": 115736, "epoch": 688} {"train_loss": -9.962238311767578, "global_step": 115737, "epoch": 688} {"train_loss": -10.414009094238281, "global_step": 115738, "epoch": 688} {"train_loss": -10.03577709197998, "global_step": 115739, "epoch": 688} {"train_loss": -9.959589004516602, "global_step": 115740, "epoch": 688} {"train_loss": -9.952959060668945, "global_step": 115741, "epoch": 688} {"train_loss": -10.320927619934082, "global_step": 115742, "epoch": 688} {"train_loss": -10.083698272705078, "global_step": 115743, "epoch": 688} {"train_loss": -10.249106407165527, "global_step": 115744, "epoch": 688} {"train_loss": -10.046316146850586, "global_step": 115745, "epoch": 688} {"train_loss": -10.365068435668945, "global_step": 115746, "epoch": 688} {"train_loss": -10.224964141845703, "global_step": 115747, "epoch": 688} {"train_loss": -10.099766731262207, "global_step": 115748, "epoch": 688} {"train_loss": -10.158514022827148, "global_step": 115749, "epoch": 688} {"train_loss": -10.006019592285156, "global_step": 115750, "epoch": 688} {"train_loss": -10.072857510475885, "global_step": 115751, "epoch": 688, "val_loss": 214972.703125} {"train_loss": -9.677667617797852, "global_step": 115752, "epoch": 689} {"train_loss": -9.973751068115234, "global_step": 115753, "epoch": 689} {"train_loss": -9.94586181640625, "global_step": 115754, "epoch": 689} {"train_loss": -9.966629028320312, "global_step": 115755, "epoch": 689} {"train_loss": -10.091043472290039, "global_step": 115756, "epoch": 689} {"train_loss": -9.535301208496094, "global_step": 115757, "epoch": 689} {"train_loss": -9.719949722290039, "global_step": 115758, "epoch": 689} {"train_loss": -9.52841567993164, "global_step": 115759, "epoch": 689} {"train_loss": -9.857644081115723, "global_step": 115760, "epoch": 689} {"train_loss": -10.096365928649902, "global_step": 115761, "epoch": 689} {"train_loss": -9.641486167907715, "global_step": 115762, "epoch": 689} {"train_loss": -10.18935489654541, "global_step": 115763, "epoch": 689} {"train_loss": -9.493188858032227, "global_step": 115764, "epoch": 689} {"train_loss": -9.90240478515625, "global_step": 115765, "epoch": 689} {"train_loss": -10.088638305664062, "global_step": 115766, "epoch": 689} {"train_loss": -9.6651029586792, "global_step": 115767, "epoch": 689} {"train_loss": -9.97822380065918, "global_step": 115768, "epoch": 689} {"train_loss": -9.872220993041992, "global_step": 115769, "epoch": 689} {"train_loss": -9.600645065307617, "global_step": 115770, "epoch": 689} {"train_loss": -9.896130561828613, "global_step": 115771, "epoch": 689} {"train_loss": -9.987386703491211, "global_step": 115772, "epoch": 689} {"train_loss": -9.88638687133789, "global_step": 115773, "epoch": 689} {"train_loss": -10.080472946166992, "global_step": 115774, "epoch": 689} {"train_loss": -10.324492454528809, "global_step": 115775, "epoch": 689} {"train_loss": -9.907249450683594, "global_step": 115776, "epoch": 689} {"train_loss": -9.943811416625977, "global_step": 115777, "epoch": 689} {"train_loss": -10.073975563049316, "global_step": 115778, "epoch": 689} {"train_loss": -9.677790641784668, "global_step": 115779, "epoch": 689} {"train_loss": -10.059598922729492, "global_step": 115780, "epoch": 689} {"train_loss": -9.984909057617188, "global_step": 115781, "epoch": 689} {"train_loss": -9.899332046508789, "global_step": 115782, "epoch": 689} {"train_loss": -9.93616008758545, "global_step": 115783, "epoch": 689} {"train_loss": -10.156254768371582, "global_step": 115784, "epoch": 689} {"train_loss": -10.12139892578125, "global_step": 115785, "epoch": 689} {"train_loss": -9.958582878112793, "global_step": 115786, "epoch": 689} {"train_loss": -10.027637481689453, "global_step": 115787, "epoch": 689} {"train_loss": -9.996088981628418, "global_step": 115788, "epoch": 689} {"train_loss": -9.913579940795898, "global_step": 115789, "epoch": 689} {"train_loss": -10.27908992767334, "global_step": 115790, "epoch": 689} {"train_loss": -9.689498901367188, "global_step": 115791, "epoch": 689} {"train_loss": -10.22680950164795, "global_step": 115792, "epoch": 689} {"train_loss": -10.10609245300293, "global_step": 115793, "epoch": 689} {"train_loss": -9.774900436401367, "global_step": 115794, "epoch": 689} {"train_loss": -10.11927604675293, "global_step": 115795, "epoch": 689} {"train_loss": -9.539670944213867, "global_step": 115796, "epoch": 689} {"train_loss": -9.957828521728516, "global_step": 115797, "epoch": 689} {"train_loss": -9.741243362426758, "global_step": 115798, "epoch": 689} {"train_loss": -10.078010559082031, "global_step": 115799, "epoch": 689} {"train_loss": -10.245739936828613, "global_step": 115800, "epoch": 689} {"train_loss": -9.82441520690918, "global_step": 115801, "epoch": 689} {"train_loss": -10.007979393005371, "global_step": 115802, "epoch": 689} {"train_loss": -10.051872253417969, "global_step": 115803, "epoch": 689} {"train_loss": -9.942991256713867, "global_step": 115804, "epoch": 689} {"train_loss": -9.954839706420898, "global_step": 115805, "epoch": 689} {"train_loss": -9.916816711425781, "global_step": 115806, "epoch": 689} {"train_loss": -10.052007675170898, "global_step": 115807, "epoch": 689} {"train_loss": -10.367725372314453, "global_step": 115808, "epoch": 689} {"train_loss": -10.27810287475586, "global_step": 115809, "epoch": 689} {"train_loss": -9.942256927490234, "global_step": 115810, "epoch": 689} {"train_loss": -10.326557159423828, "global_step": 115811, "epoch": 689} {"train_loss": -10.079262733459473, "global_step": 115812, "epoch": 689} {"train_loss": -9.894131660461426, "global_step": 115813, "epoch": 689} {"train_loss": -10.322334289550781, "global_step": 115814, "epoch": 689} {"train_loss": -10.028412818908691, "global_step": 115815, "epoch": 689} {"train_loss": -9.84530258178711, "global_step": 115816, "epoch": 689} {"train_loss": -10.136817932128906, "global_step": 115817, "epoch": 689} {"train_loss": -9.97134780883789, "global_step": 115818, "epoch": 689} {"train_loss": -10.196306228637695, "global_step": 115819, "epoch": 689} {"train_loss": -10.077913284301758, "global_step": 115820, "epoch": 689} {"train_loss": -10.137045860290527, "global_step": 115821, "epoch": 689} {"train_loss": -10.243606567382812, "global_step": 115822, "epoch": 689} {"train_loss": -10.041158676147461, "global_step": 115823, "epoch": 689} {"train_loss": -10.398404121398926, "global_step": 115824, "epoch": 689} {"train_loss": -10.050477981567383, "global_step": 115825, "epoch": 689} {"train_loss": -10.102837562561035, "global_step": 115826, "epoch": 689} {"train_loss": -10.133709907531738, "global_step": 115827, "epoch": 689} {"train_loss": -9.960208892822266, "global_step": 115828, "epoch": 689} {"train_loss": -10.24494743347168, "global_step": 115829, "epoch": 689} {"train_loss": -9.91839599609375, "global_step": 115830, "epoch": 689} {"train_loss": -9.866493225097656, "global_step": 115831, "epoch": 689} {"train_loss": -10.061573028564453, "global_step": 115832, "epoch": 689} {"train_loss": -9.866661071777344, "global_step": 115833, "epoch": 689} {"train_loss": -9.937379837036133, "global_step": 115834, "epoch": 689} {"train_loss": -10.232684135437012, "global_step": 115835, "epoch": 689} {"train_loss": -9.684100151062012, "global_step": 115836, "epoch": 689} {"train_loss": -9.952520370483398, "global_step": 115837, "epoch": 689} {"train_loss": -9.63619613647461, "global_step": 115838, "epoch": 689} {"train_loss": -10.104283332824707, "global_step": 115839, "epoch": 689} {"train_loss": -9.460651397705078, "global_step": 115840, "epoch": 689} {"train_loss": -10.242441177368164, "global_step": 115841, "epoch": 689} {"train_loss": -9.906652450561523, "global_step": 115842, "epoch": 689} {"train_loss": -10.197742462158203, "global_step": 115843, "epoch": 689} {"train_loss": -9.761439323425293, "global_step": 115844, "epoch": 689} {"train_loss": -10.385843276977539, "global_step": 115845, "epoch": 689} {"train_loss": -10.018123626708984, "global_step": 115846, "epoch": 689} {"train_loss": -10.065149307250977, "global_step": 115847, "epoch": 689} {"train_loss": -10.304903984069824, "global_step": 115848, "epoch": 689} {"train_loss": -9.823118209838867, "global_step": 115849, "epoch": 689} {"train_loss": -10.33512020111084, "global_step": 115850, "epoch": 689} {"train_loss": -10.019821166992188, "global_step": 115851, "epoch": 689} {"train_loss": -10.046985626220703, "global_step": 115852, "epoch": 689} {"train_loss": -10.043621063232422, "global_step": 115853, "epoch": 689} {"train_loss": -10.007472038269043, "global_step": 115854, "epoch": 689} {"train_loss": -9.889104843139648, "global_step": 115855, "epoch": 689} {"train_loss": -9.695070266723633, "global_step": 115856, "epoch": 689} {"train_loss": -9.958349227905273, "global_step": 115857, "epoch": 689} {"train_loss": -9.498455047607422, "global_step": 115858, "epoch": 689} {"train_loss": -10.173299789428711, "global_step": 115859, "epoch": 689} {"train_loss": -9.744157791137695, "global_step": 115860, "epoch": 689} {"train_loss": -9.893356323242188, "global_step": 115861, "epoch": 689} {"train_loss": -9.212031364440918, "global_step": 115862, "epoch": 689} {"train_loss": -9.750066757202148, "global_step": 115863, "epoch": 689} {"train_loss": -9.877902030944824, "global_step": 115864, "epoch": 689} {"train_loss": -9.44072151184082, "global_step": 115865, "epoch": 689} {"train_loss": -9.623461723327637, "global_step": 115866, "epoch": 689} {"train_loss": -9.614627838134766, "global_step": 115867, "epoch": 689} {"train_loss": -9.753786087036133, "global_step": 115868, "epoch": 689} {"train_loss": -9.893265724182129, "global_step": 115869, "epoch": 689} {"train_loss": -9.852108001708984, "global_step": 115870, "epoch": 689} {"train_loss": -9.666902542114258, "global_step": 115871, "epoch": 689} {"train_loss": -10.00963020324707, "global_step": 115872, "epoch": 689} {"train_loss": -9.956037521362305, "global_step": 115873, "epoch": 689} {"train_loss": -9.761754035949707, "global_step": 115874, "epoch": 689} {"train_loss": -10.173198699951172, "global_step": 115875, "epoch": 689} {"train_loss": -10.032974243164062, "global_step": 115876, "epoch": 689} {"train_loss": -9.868436813354492, "global_step": 115877, "epoch": 689} {"train_loss": -10.041147232055664, "global_step": 115878, "epoch": 689} {"train_loss": -10.071782112121582, "global_step": 115879, "epoch": 689} {"train_loss": -9.992371559143066, "global_step": 115880, "epoch": 689} {"train_loss": -10.17623519897461, "global_step": 115881, "epoch": 689} {"train_loss": -10.162933349609375, "global_step": 115882, "epoch": 689} {"train_loss": -9.98624038696289, "global_step": 115883, "epoch": 689} {"train_loss": -10.215784072875977, "global_step": 115884, "epoch": 689} {"train_loss": -10.338991165161133, "global_step": 115885, "epoch": 689} {"train_loss": -9.942327499389648, "global_step": 115886, "epoch": 689} {"train_loss": -9.865522384643555, "global_step": 115887, "epoch": 689} {"train_loss": -9.93217945098877, "global_step": 115888, "epoch": 689} {"train_loss": -9.809978485107422, "global_step": 115889, "epoch": 689} {"train_loss": -10.315345764160156, "global_step": 115890, "epoch": 689} {"train_loss": -9.488702774047852, "global_step": 115891, "epoch": 689} {"train_loss": -9.999391555786133, "global_step": 115892, "epoch": 689} {"train_loss": -10.092631340026855, "global_step": 115893, "epoch": 689} {"train_loss": -10.164144515991211, "global_step": 115894, "epoch": 689} {"train_loss": -10.206192970275879, "global_step": 115895, "epoch": 689} {"train_loss": -9.836092948913574, "global_step": 115896, "epoch": 689} {"train_loss": -10.069382667541504, "global_step": 115897, "epoch": 689} {"train_loss": -9.933786392211914, "global_step": 115898, "epoch": 689} {"train_loss": -10.128715515136719, "global_step": 115899, "epoch": 689} {"train_loss": -10.147500991821289, "global_step": 115900, "epoch": 689} {"train_loss": -10.241255760192871, "global_step": 115901, "epoch": 689} {"train_loss": -10.319866180419922, "global_step": 115902, "epoch": 689} {"train_loss": -10.233158111572266, "global_step": 115903, "epoch": 689} {"train_loss": -10.198095321655273, "global_step": 115904, "epoch": 689} {"train_loss": -10.260139465332031, "global_step": 115905, "epoch": 689} {"train_loss": -10.129291534423828, "global_step": 115906, "epoch": 689} {"train_loss": -10.286550521850586, "global_step": 115907, "epoch": 689} {"train_loss": -10.116079330444336, "global_step": 115908, "epoch": 689} {"train_loss": -10.170761108398438, "global_step": 115909, "epoch": 689} {"train_loss": -10.268239974975586, "global_step": 115910, "epoch": 689} {"train_loss": -10.242046356201172, "global_step": 115911, "epoch": 689} {"train_loss": -10.307546615600586, "global_step": 115912, "epoch": 689} {"train_loss": -10.214009284973145, "global_step": 115913, "epoch": 689} {"train_loss": -10.427461624145508, "global_step": 115914, "epoch": 689} {"train_loss": -10.215518951416016, "global_step": 115915, "epoch": 689} {"train_loss": -10.328969955444336, "global_step": 115916, "epoch": 689} {"train_loss": -10.373380661010742, "global_step": 115917, "epoch": 689} {"train_loss": -10.232402801513672, "global_step": 115918, "epoch": 689} {"train_loss": -9.999074748584203, "global_step": 115919, "epoch": 689, "val_loss": 213051.828125} {"train_loss": -10.381980895996094, "global_step": 115920, "epoch": 690} {"train_loss": -10.296968460083008, "global_step": 115921, "epoch": 690} {"train_loss": -10.423602104187012, "global_step": 115922, "epoch": 690} {"train_loss": -10.105362892150879, "global_step": 115923, "epoch": 690} {"train_loss": -10.335036277770996, "global_step": 115924, "epoch": 690} {"train_loss": -10.306779861450195, "global_step": 115925, "epoch": 690} {"train_loss": -10.471924781799316, "global_step": 115926, "epoch": 690} {"train_loss": -10.152482986450195, "global_step": 115927, "epoch": 690} {"train_loss": -10.086345672607422, "global_step": 115928, "epoch": 690} {"train_loss": -10.299081802368164, "global_step": 115929, "epoch": 690} {"train_loss": -10.393558502197266, "global_step": 115930, "epoch": 690} {"train_loss": -10.14120101928711, "global_step": 115931, "epoch": 690} {"train_loss": -10.215705871582031, "global_step": 115932, "epoch": 690} {"train_loss": -10.249422073364258, "global_step": 115933, "epoch": 690} {"train_loss": -10.059393882751465, "global_step": 115934, "epoch": 690} {"train_loss": -9.141853332519531, "global_step": 115935, "epoch": 690} {"train_loss": -10.248342514038086, "global_step": 115936, "epoch": 690} {"train_loss": -9.111592292785645, "global_step": 115937, "epoch": 690} {"train_loss": -9.430688858032227, "global_step": 115938, "epoch": 690} {"train_loss": -9.700154304504395, "global_step": 115939, "epoch": 690} {"train_loss": -8.908053398132324, "global_step": 115940, "epoch": 690} {"train_loss": -9.882081985473633, "global_step": 115941, "epoch": 690} {"train_loss": -9.395785331726074, "global_step": 115942, "epoch": 690} {"train_loss": -10.146949768066406, "global_step": 115943, "epoch": 690} {"train_loss": -9.399538040161133, "global_step": 115944, "epoch": 690} {"train_loss": -10.100526809692383, "global_step": 115945, "epoch": 690} {"train_loss": -9.818990707397461, "global_step": 115946, "epoch": 690} {"train_loss": -10.035270690917969, "global_step": 115947, "epoch": 690} {"train_loss": -9.681647300720215, "global_step": 115948, "epoch": 690} {"train_loss": -10.09060287475586, "global_step": 115949, "epoch": 690} {"train_loss": -9.815126419067383, "global_step": 115950, "epoch": 690} {"train_loss": -10.100286483764648, "global_step": 115951, "epoch": 690} {"train_loss": -9.641141891479492, "global_step": 115952, "epoch": 690} {"train_loss": -9.94455337524414, "global_step": 115953, "epoch": 690} {"train_loss": -10.010915756225586, "global_step": 115954, "epoch": 690} {"train_loss": -10.17679214477539, "global_step": 115955, "epoch": 690} {"train_loss": -9.777336120605469, "global_step": 115956, "epoch": 690} {"train_loss": -10.143218040466309, "global_step": 115957, "epoch": 690} {"train_loss": -10.134584426879883, "global_step": 115958, "epoch": 690} {"train_loss": -9.917657852172852, "global_step": 115959, "epoch": 690} {"train_loss": -10.136300086975098, "global_step": 115960, "epoch": 690} {"train_loss": -9.987213134765625, "global_step": 115961, "epoch": 690} {"train_loss": -10.227502822875977, "global_step": 115962, "epoch": 690} {"train_loss": -10.039152145385742, "global_step": 115963, "epoch": 690} {"train_loss": -9.977706909179688, "global_step": 115964, "epoch": 690} {"train_loss": -10.140411376953125, "global_step": 115965, "epoch": 690} {"train_loss": -10.07385540008545, "global_step": 115966, "epoch": 690} {"train_loss": -10.02808666229248, "global_step": 115967, "epoch": 690} {"train_loss": -9.756877899169922, "global_step": 115968, "epoch": 690} {"train_loss": -10.16196060180664, "global_step": 115969, "epoch": 690} {"train_loss": -10.074424743652344, "global_step": 115970, "epoch": 690} {"train_loss": -10.114992141723633, "global_step": 115971, "epoch": 690} {"train_loss": -10.115145683288574, "global_step": 115972, "epoch": 690} {"train_loss": -10.19321346282959, "global_step": 115973, "epoch": 690} {"train_loss": -10.104633331298828, "global_step": 115974, "epoch": 690} {"train_loss": -10.06652545928955, "global_step": 115975, "epoch": 690} {"train_loss": -9.980266571044922, "global_step": 115976, "epoch": 690} {"train_loss": -10.095170021057129, "global_step": 115977, "epoch": 690} {"train_loss": -10.195792198181152, "global_step": 115978, "epoch": 690} {"train_loss": -10.155921936035156, "global_step": 115979, "epoch": 690} {"train_loss": -10.265819549560547, "global_step": 115980, "epoch": 690} {"train_loss": -10.00291633605957, "global_step": 115981, "epoch": 690} {"train_loss": -10.045818328857422, "global_step": 115982, "epoch": 690} {"train_loss": -10.130826950073242, "global_step": 115983, "epoch": 690} {"train_loss": -10.161590576171875, "global_step": 115984, "epoch": 690} {"train_loss": -10.224169731140137, "global_step": 115985, "epoch": 690} {"train_loss": -10.12087345123291, "global_step": 115986, "epoch": 690} {"train_loss": -10.172341346740723, "global_step": 115987, "epoch": 690} {"train_loss": -10.26507568359375, "global_step": 115988, "epoch": 690} {"train_loss": -10.39780044555664, "global_step": 115989, "epoch": 690} {"train_loss": -10.444869995117188, "global_step": 115990, "epoch": 690} {"train_loss": -10.290445327758789, "global_step": 115991, "epoch": 690} {"train_loss": -10.363465309143066, "global_step": 115992, "epoch": 690} {"train_loss": -10.203771591186523, "global_step": 115993, "epoch": 690} {"train_loss": -10.017986297607422, "global_step": 115994, "epoch": 690} {"train_loss": -10.448325157165527, "global_step": 115995, "epoch": 690} {"train_loss": -10.557366371154785, "global_step": 115996, "epoch": 690} {"train_loss": -9.972894668579102, "global_step": 115997, "epoch": 690} {"train_loss": -10.232401847839355, "global_step": 115998, "epoch": 690} {"train_loss": -10.362333297729492, "global_step": 115999, "epoch": 690} {"train_loss": -9.996732711791992, "global_step": 116000, "epoch": 690} {"train_loss": -10.421719551086426, "global_step": 116001, "epoch": 690} {"train_loss": -10.195228576660156, "global_step": 116002, "epoch": 690} {"train_loss": -10.122928619384766, "global_step": 116003, "epoch": 690} {"train_loss": -10.083196640014648, "global_step": 116004, "epoch": 690} {"train_loss": -10.293432235717773, "global_step": 116005, "epoch": 690} {"train_loss": -9.845534324645996, "global_step": 116006, "epoch": 690} {"train_loss": -10.041396141052246, "global_step": 116007, "epoch": 690} {"train_loss": -10.276573181152344, "global_step": 116008, "epoch": 690} {"train_loss": -9.910489082336426, "global_step": 116009, "epoch": 690} {"train_loss": -9.868906021118164, "global_step": 116010, "epoch": 690} {"train_loss": -10.16926383972168, "global_step": 116011, "epoch": 690} {"train_loss": -9.269495010375977, "global_step": 116012, "epoch": 690} {"train_loss": -9.91197395324707, "global_step": 116013, "epoch": 690} {"train_loss": -9.996946334838867, "global_step": 116014, "epoch": 690} {"train_loss": -9.738189697265625, "global_step": 116015, "epoch": 690} {"train_loss": -9.947290420532227, "global_step": 116016, "epoch": 690} {"train_loss": -9.807489395141602, "global_step": 116017, "epoch": 690} {"train_loss": -9.761856079101562, "global_step": 116018, "epoch": 690} {"train_loss": -9.87318229675293, "global_step": 116019, "epoch": 690} {"train_loss": -10.114662170410156, "global_step": 116020, "epoch": 690} {"train_loss": -9.799484252929688, "global_step": 116021, "epoch": 690} {"train_loss": -9.68498706817627, "global_step": 116022, "epoch": 690} {"train_loss": -9.956645965576172, "global_step": 116023, "epoch": 690} {"train_loss": -10.074441909790039, "global_step": 116024, "epoch": 690} {"train_loss": -9.60590934753418, "global_step": 116025, "epoch": 690} {"train_loss": -9.732303619384766, "global_step": 116026, "epoch": 690} {"train_loss": -9.787796974182129, "global_step": 116027, "epoch": 690} {"train_loss": -9.690391540527344, "global_step": 116028, "epoch": 690} {"train_loss": -9.538124084472656, "global_step": 116029, "epoch": 690} {"train_loss": -9.818259239196777, "global_step": 116030, "epoch": 690} {"train_loss": -9.697944641113281, "global_step": 116031, "epoch": 690} {"train_loss": -10.03693962097168, "global_step": 116032, "epoch": 690} {"train_loss": -10.099637985229492, "global_step": 116033, "epoch": 690} {"train_loss": -9.760372161865234, "global_step": 116034, "epoch": 690} {"train_loss": -9.95854377746582, "global_step": 116035, "epoch": 690} {"train_loss": -9.918936729431152, "global_step": 116036, "epoch": 690} {"train_loss": -9.983489036560059, "global_step": 116037, "epoch": 690} {"train_loss": -10.210094451904297, "global_step": 116038, "epoch": 690} {"train_loss": -10.021417617797852, "global_step": 116039, "epoch": 690} {"train_loss": -9.874698638916016, "global_step": 116040, "epoch": 690} {"train_loss": -9.996838569641113, "global_step": 116041, "epoch": 690} {"train_loss": -10.173269271850586, "global_step": 116042, "epoch": 690} {"train_loss": -10.253931045532227, "global_step": 116043, "epoch": 690} {"train_loss": -10.164159774780273, "global_step": 116044, "epoch": 690} {"train_loss": -10.205585479736328, "global_step": 116045, "epoch": 690} {"train_loss": -10.124734878540039, "global_step": 116046, "epoch": 690} {"train_loss": -10.164400100708008, "global_step": 116047, "epoch": 690} {"train_loss": -10.118372917175293, "global_step": 116048, "epoch": 690} {"train_loss": -10.094615936279297, "global_step": 116049, "epoch": 690} {"train_loss": -9.954221725463867, "global_step": 116050, "epoch": 690} {"train_loss": -10.329801559448242, "global_step": 116051, "epoch": 690} {"train_loss": -10.108606338500977, "global_step": 116052, "epoch": 690} {"train_loss": -10.063470840454102, "global_step": 116053, "epoch": 690} {"train_loss": -10.216436386108398, "global_step": 116054, "epoch": 690} {"train_loss": -9.838943481445312, "global_step": 116055, "epoch": 690} {"train_loss": -10.338757514953613, "global_step": 116056, "epoch": 690} {"train_loss": -10.109972953796387, "global_step": 116057, "epoch": 690} {"train_loss": -10.24527359008789, "global_step": 116058, "epoch": 690} {"train_loss": -10.332555770874023, "global_step": 116059, "epoch": 690} {"train_loss": -10.286754608154297, "global_step": 116060, "epoch": 690} {"train_loss": -10.088072776794434, "global_step": 116061, "epoch": 690} {"train_loss": -10.154195785522461, "global_step": 116062, "epoch": 690} {"train_loss": -10.186336517333984, "global_step": 116063, "epoch": 690} {"train_loss": -10.069683074951172, "global_step": 116064, "epoch": 690} {"train_loss": -10.124570846557617, "global_step": 116065, "epoch": 690} {"train_loss": -9.933601379394531, "global_step": 116066, "epoch": 690} {"train_loss": -10.037400245666504, "global_step": 116067, "epoch": 690} {"train_loss": -9.974172592163086, "global_step": 116068, "epoch": 690} {"train_loss": -10.271064758300781, "global_step": 116069, "epoch": 690} {"train_loss": -10.050700187683105, "global_step": 116070, "epoch": 690} {"train_loss": -10.199440956115723, "global_step": 116071, "epoch": 690} {"train_loss": -9.867406845092773, "global_step": 116072, "epoch": 690} {"train_loss": -10.111736297607422, "global_step": 116073, "epoch": 690} {"train_loss": -10.110010147094727, "global_step": 116074, "epoch": 690} {"train_loss": -9.639694213867188, "global_step": 116075, "epoch": 690} {"train_loss": -9.683941841125488, "global_step": 116076, "epoch": 690} {"train_loss": -9.710061073303223, "global_step": 116077, "epoch": 690} {"train_loss": -9.140007019042969, "global_step": 116078, "epoch": 690} {"train_loss": -9.54240608215332, "global_step": 116079, "epoch": 690} {"train_loss": -10.016509056091309, "global_step": 116080, "epoch": 690} {"train_loss": -8.946167945861816, "global_step": 116081, "epoch": 690} {"train_loss": -9.131132125854492, "global_step": 116082, "epoch": 690} {"train_loss": -8.514466285705566, "global_step": 116083, "epoch": 690} {"train_loss": -9.472990989685059, "global_step": 116084, "epoch": 690} {"train_loss": -9.564728736877441, "global_step": 116085, "epoch": 690} {"train_loss": -9.14646053314209, "global_step": 116086, "epoch": 690} {"train_loss": -9.990933037939525, "global_step": 116087, "epoch": 690, "val_loss": 209873.6875, "train_action_mse_error": 6.710464000701904} {"train_loss": -9.522796630859375, "global_step": 116088, "epoch": 691} {"train_loss": -9.511659622192383, "global_step": 116089, "epoch": 691} {"train_loss": -9.461579322814941, "global_step": 116090, "epoch": 691} {"train_loss": -9.936891555786133, "global_step": 116091, "epoch": 691} {"train_loss": -9.896745681762695, "global_step": 116092, "epoch": 691} {"train_loss": -9.765556335449219, "global_step": 116093, "epoch": 691} {"train_loss": -9.710912704467773, "global_step": 116094, "epoch": 691} {"train_loss": -9.629348754882812, "global_step": 116095, "epoch": 691} {"train_loss": -9.791440963745117, "global_step": 116096, "epoch": 691} {"train_loss": -9.748760223388672, "global_step": 116097, "epoch": 691} {"train_loss": -9.821662902832031, "global_step": 116098, "epoch": 691} {"train_loss": -9.796411514282227, "global_step": 116099, "epoch": 691} {"train_loss": -9.753704071044922, "global_step": 116100, "epoch": 691} {"train_loss": -10.227209091186523, "global_step": 116101, "epoch": 691} {"train_loss": -9.688034057617188, "global_step": 116102, "epoch": 691} {"train_loss": -9.941335678100586, "global_step": 116103, "epoch": 691} {"train_loss": -9.939085006713867, "global_step": 116104, "epoch": 691} {"train_loss": -9.825606346130371, "global_step": 116105, "epoch": 691} {"train_loss": -10.050849914550781, "global_step": 116106, "epoch": 691} {"train_loss": -9.89970588684082, "global_step": 116107, "epoch": 691} {"train_loss": -9.866765975952148, "global_step": 116108, "epoch": 691} {"train_loss": -9.876092910766602, "global_step": 116109, "epoch": 691} {"train_loss": -9.993585586547852, "global_step": 116110, "epoch": 691} {"train_loss": -9.919605255126953, "global_step": 116111, "epoch": 691} {"train_loss": -10.229890823364258, "global_step": 116112, "epoch": 691} {"train_loss": -9.875511169433594, "global_step": 116113, "epoch": 691} {"train_loss": -10.118996620178223, "global_step": 116114, "epoch": 691} {"train_loss": -10.09378433227539, "global_step": 116115, "epoch": 691} {"train_loss": -10.046546936035156, "global_step": 116116, "epoch": 691} {"train_loss": -10.18458080291748, "global_step": 116117, "epoch": 691} {"train_loss": -9.918662071228027, "global_step": 116118, "epoch": 691} {"train_loss": -10.058539390563965, "global_step": 116119, "epoch": 691} {"train_loss": -10.031123161315918, "global_step": 116120, "epoch": 691} {"train_loss": -10.137418746948242, "global_step": 116121, "epoch": 691} {"train_loss": -10.067456245422363, "global_step": 116122, "epoch": 691} {"train_loss": -10.280566215515137, "global_step": 116123, "epoch": 691} {"train_loss": -9.808948516845703, "global_step": 116124, "epoch": 691} {"train_loss": -10.180326461791992, "global_step": 116125, "epoch": 691} {"train_loss": -9.865839004516602, "global_step": 116126, "epoch": 691} {"train_loss": -10.240234375, "global_step": 116127, "epoch": 691} {"train_loss": -9.71225643157959, "global_step": 116128, "epoch": 691} {"train_loss": -10.140619277954102, "global_step": 116129, "epoch": 691} {"train_loss": -10.278985977172852, "global_step": 116130, "epoch": 691} {"train_loss": -9.955841064453125, "global_step": 116131, "epoch": 691} {"train_loss": -10.280929565429688, "global_step": 116132, "epoch": 691} {"train_loss": -9.965633392333984, "global_step": 116133, "epoch": 691} {"train_loss": -10.172210693359375, "global_step": 116134, "epoch": 691} {"train_loss": -10.083629608154297, "global_step": 116135, "epoch": 691} {"train_loss": -10.078422546386719, "global_step": 116136, "epoch": 691} {"train_loss": -10.190801620483398, "global_step": 116137, "epoch": 691} {"train_loss": -9.982967376708984, "global_step": 116138, "epoch": 691} {"train_loss": -10.162056922912598, "global_step": 116139, "epoch": 691} {"train_loss": -10.195899963378906, "global_step": 116140, "epoch": 691} {"train_loss": -10.101478576660156, "global_step": 116141, "epoch": 691} {"train_loss": -10.25355052947998, "global_step": 116142, "epoch": 691} {"train_loss": -10.151453018188477, "global_step": 116143, "epoch": 691} {"train_loss": -10.115518569946289, "global_step": 116144, "epoch": 691} {"train_loss": -10.412439346313477, "global_step": 116145, "epoch": 691} {"train_loss": -10.275421142578125, "global_step": 116146, "epoch": 691} {"train_loss": -10.193147659301758, "global_step": 116147, "epoch": 691} {"train_loss": -10.266948699951172, "global_step": 116148, "epoch": 691} {"train_loss": -10.195367813110352, "global_step": 116149, "epoch": 691} {"train_loss": -10.07468032836914, "global_step": 116150, "epoch": 691} {"train_loss": -10.106715202331543, "global_step": 116151, "epoch": 691} {"train_loss": -10.005513191223145, "global_step": 116152, "epoch": 691} {"train_loss": -10.147281646728516, "global_step": 116153, "epoch": 691} {"train_loss": -10.359664916992188, "global_step": 116154, "epoch": 691} {"train_loss": -10.115038871765137, "global_step": 116155, "epoch": 691} {"train_loss": -10.238090515136719, "global_step": 116156, "epoch": 691} {"train_loss": -10.073222160339355, "global_step": 116157, "epoch": 691} {"train_loss": -10.454395294189453, "global_step": 116158, "epoch": 691} {"train_loss": -10.10948657989502, "global_step": 116159, "epoch": 691} {"train_loss": -9.981551170349121, "global_step": 116160, "epoch": 691} {"train_loss": -9.92880630493164, "global_step": 116161, "epoch": 691} {"train_loss": -10.131682395935059, "global_step": 116162, "epoch": 691} {"train_loss": -9.866527557373047, "global_step": 116163, "epoch": 691} {"train_loss": -10.11153793334961, "global_step": 116164, "epoch": 691} {"train_loss": -9.7117919921875, "global_step": 116165, "epoch": 691} {"train_loss": -9.785234451293945, "global_step": 116166, "epoch": 691} {"train_loss": -10.001656532287598, "global_step": 116167, "epoch": 691} {"train_loss": -9.646690368652344, "global_step": 116168, "epoch": 691} {"train_loss": -9.492524147033691, "global_step": 116169, "epoch": 691} {"train_loss": -9.851935386657715, "global_step": 116170, "epoch": 691} {"train_loss": -9.812807083129883, "global_step": 116171, "epoch": 691} {"train_loss": -10.033136367797852, "global_step": 116172, "epoch": 691} {"train_loss": -9.855804443359375, "global_step": 116173, "epoch": 691} {"train_loss": -9.724084854125977, "global_step": 116174, "epoch": 691} {"train_loss": -9.783414840698242, "global_step": 116175, "epoch": 691} {"train_loss": -9.714797973632812, "global_step": 116176, "epoch": 691} {"train_loss": -9.83260726928711, "global_step": 116177, "epoch": 691} {"train_loss": -9.915996551513672, "global_step": 116178, "epoch": 691} {"train_loss": -9.646177291870117, "global_step": 116179, "epoch": 691} {"train_loss": -9.902397155761719, "global_step": 116180, "epoch": 691} {"train_loss": -9.658807754516602, "global_step": 116181, "epoch": 691} {"train_loss": -9.654108047485352, "global_step": 116182, "epoch": 691} {"train_loss": -9.74898624420166, "global_step": 116183, "epoch": 691} {"train_loss": -9.788236618041992, "global_step": 116184, "epoch": 691} {"train_loss": -9.89632511138916, "global_step": 116185, "epoch": 691} {"train_loss": -9.846808433532715, "global_step": 116186, "epoch": 691} {"train_loss": -9.598172187805176, "global_step": 116187, "epoch": 691} {"train_loss": -10.16073989868164, "global_step": 116188, "epoch": 691} {"train_loss": -9.779727935791016, "global_step": 116189, "epoch": 691} {"train_loss": -9.71166706085205, "global_step": 116190, "epoch": 691} {"train_loss": -10.038887977600098, "global_step": 116191, "epoch": 691} {"train_loss": -9.792129516601562, "global_step": 116192, "epoch": 691} {"train_loss": -9.875984191894531, "global_step": 116193, "epoch": 691} {"train_loss": -10.024026870727539, "global_step": 116194, "epoch": 691} {"train_loss": -10.003873825073242, "global_step": 116195, "epoch": 691} {"train_loss": -9.906041145324707, "global_step": 116196, "epoch": 691} {"train_loss": -10.001657485961914, "global_step": 116197, "epoch": 691} {"train_loss": -9.861995697021484, "global_step": 116198, "epoch": 691} {"train_loss": -10.168514251708984, "global_step": 116199, "epoch": 691} {"train_loss": -9.862955093383789, "global_step": 116200, "epoch": 691} {"train_loss": -10.01636028289795, "global_step": 116201, "epoch": 691} {"train_loss": -9.834550857543945, "global_step": 116202, "epoch": 691} {"train_loss": -9.999613761901855, "global_step": 116203, "epoch": 691} {"train_loss": -9.866315841674805, "global_step": 116204, "epoch": 691} {"train_loss": -10.151518821716309, "global_step": 116205, "epoch": 691} {"train_loss": -10.011024475097656, "global_step": 116206, "epoch": 691} {"train_loss": -9.766329765319824, "global_step": 116207, "epoch": 691} {"train_loss": -10.064496994018555, "global_step": 116208, "epoch": 691} {"train_loss": -10.062726020812988, "global_step": 116209, "epoch": 691} {"train_loss": -9.558998107910156, "global_step": 116210, "epoch": 691} {"train_loss": -10.059638977050781, "global_step": 116211, "epoch": 691} {"train_loss": -9.6524658203125, "global_step": 116212, "epoch": 691} {"train_loss": -9.843613624572754, "global_step": 116213, "epoch": 691} {"train_loss": -10.02705192565918, "global_step": 116214, "epoch": 691} {"train_loss": -9.877857208251953, "global_step": 116215, "epoch": 691} {"train_loss": -9.826868057250977, "global_step": 116216, "epoch": 691} {"train_loss": -10.222315788269043, "global_step": 116217, "epoch": 691} {"train_loss": -9.893899917602539, "global_step": 116218, "epoch": 691} {"train_loss": -9.972466468811035, "global_step": 116219, "epoch": 691} {"train_loss": -10.097753524780273, "global_step": 116220, "epoch": 691} {"train_loss": -10.17023754119873, "global_step": 116221, "epoch": 691} {"train_loss": -10.05073070526123, "global_step": 116222, "epoch": 691} {"train_loss": -10.110642433166504, "global_step": 116223, "epoch": 691} {"train_loss": -10.138670921325684, "global_step": 116224, "epoch": 691} {"train_loss": -9.710285186767578, "global_step": 116225, "epoch": 691} {"train_loss": -9.992263793945312, "global_step": 116226, "epoch": 691} {"train_loss": -9.939422607421875, "global_step": 116227, "epoch": 691} {"train_loss": -10.195560455322266, "global_step": 116228, "epoch": 691} {"train_loss": -9.599102973937988, "global_step": 116229, "epoch": 691} {"train_loss": -10.213312149047852, "global_step": 116230, "epoch": 691} {"train_loss": -9.734817504882812, "global_step": 116231, "epoch": 691} {"train_loss": -10.328145980834961, "global_step": 116232, "epoch": 691} {"train_loss": -9.940595626831055, "global_step": 116233, "epoch": 691} {"train_loss": -10.365044593811035, "global_step": 116234, "epoch": 691} {"train_loss": -9.890592575073242, "global_step": 116235, "epoch": 691} {"train_loss": -10.393094062805176, "global_step": 116236, "epoch": 691} {"train_loss": -9.848084449768066, "global_step": 116237, "epoch": 691} {"train_loss": -10.292634010314941, "global_step": 116238, "epoch": 691} {"train_loss": -10.012269973754883, "global_step": 116239, "epoch": 691} {"train_loss": -10.398153305053711, "global_step": 116240, "epoch": 691} {"train_loss": -10.097338676452637, "global_step": 116241, "epoch": 691} {"train_loss": -10.147406578063965, "global_step": 116242, "epoch": 691} {"train_loss": -10.253372192382812, "global_step": 116243, "epoch": 691} {"train_loss": -10.145735740661621, "global_step": 116244, "epoch": 691} {"train_loss": -10.056306838989258, "global_step": 116245, "epoch": 691} {"train_loss": -10.21162223815918, "global_step": 116246, "epoch": 691} {"train_loss": -10.075174331665039, "global_step": 116247, "epoch": 691} {"train_loss": -9.943306922912598, "global_step": 116248, "epoch": 691} {"train_loss": -10.338848114013672, "global_step": 116249, "epoch": 691} {"train_loss": -10.019206047058105, "global_step": 116250, "epoch": 691} {"train_loss": -10.246870994567871, "global_step": 116251, "epoch": 691} {"train_loss": -10.121335983276367, "global_step": 116252, "epoch": 691} {"train_loss": -10.076959609985352, "global_step": 116253, "epoch": 691} {"train_loss": -10.122008323669434, "global_step": 116254, "epoch": 691} {"train_loss": -9.98617570740836, "global_step": 116255, "epoch": 691, "val_loss": 212259.5625} {"train_loss": -10.182693481445312, "global_step": 116256, "epoch": 692} {"train_loss": -9.957091331481934, "global_step": 116257, "epoch": 692} {"train_loss": -10.136798858642578, "global_step": 116258, "epoch": 692} {"train_loss": -10.053321838378906, "global_step": 116259, "epoch": 692} {"train_loss": -10.127664566040039, "global_step": 116260, "epoch": 692} {"train_loss": -10.098424911499023, "global_step": 116261, "epoch": 692} {"train_loss": -10.05886173248291, "global_step": 116262, "epoch": 692} {"train_loss": -10.286515235900879, "global_step": 116263, "epoch": 692} {"train_loss": -10.118922233581543, "global_step": 116264, "epoch": 692} {"train_loss": -10.042461395263672, "global_step": 116265, "epoch": 692} {"train_loss": -10.255659103393555, "global_step": 116266, "epoch": 692} {"train_loss": -10.120199203491211, "global_step": 116267, "epoch": 692} {"train_loss": -10.082913398742676, "global_step": 116268, "epoch": 692} {"train_loss": -9.90664005279541, "global_step": 116269, "epoch": 692} {"train_loss": -9.989948272705078, "global_step": 116270, "epoch": 692} {"train_loss": -10.294567108154297, "global_step": 116271, "epoch": 692} {"train_loss": -9.949210166931152, "global_step": 116272, "epoch": 692} {"train_loss": -10.264429092407227, "global_step": 116273, "epoch": 692} {"train_loss": -10.156805992126465, "global_step": 116274, "epoch": 692} {"train_loss": -10.36795425415039, "global_step": 116275, "epoch": 692} {"train_loss": -10.31471061706543, "global_step": 116276, "epoch": 692} {"train_loss": -10.254220008850098, "global_step": 116277, "epoch": 692} {"train_loss": -10.176095962524414, "global_step": 116278, "epoch": 692} {"train_loss": -10.361530303955078, "global_step": 116279, "epoch": 692} {"train_loss": -10.040348052978516, "global_step": 116280, "epoch": 692} {"train_loss": -9.918914794921875, "global_step": 116281, "epoch": 692} {"train_loss": -10.254971504211426, "global_step": 116282, "epoch": 692} {"train_loss": -10.279240608215332, "global_step": 116283, "epoch": 692} {"train_loss": -10.378567695617676, "global_step": 116284, "epoch": 692} {"train_loss": -10.408721923828125, "global_step": 116285, "epoch": 692} {"train_loss": -10.212454795837402, "global_step": 116286, "epoch": 692} {"train_loss": -10.400121688842773, "global_step": 116287, "epoch": 692} {"train_loss": -10.061756134033203, "global_step": 116288, "epoch": 692} {"train_loss": -10.095645904541016, "global_step": 116289, "epoch": 692} {"train_loss": -9.936920166015625, "global_step": 116290, "epoch": 692} {"train_loss": -10.087756156921387, "global_step": 116291, "epoch": 692} {"train_loss": -10.208348274230957, "global_step": 116292, "epoch": 692} {"train_loss": -10.133733749389648, "global_step": 116293, "epoch": 692} {"train_loss": -9.757680892944336, "global_step": 116294, "epoch": 692} {"train_loss": -10.010830879211426, "global_step": 116295, "epoch": 692} {"train_loss": -10.202288627624512, "global_step": 116296, "epoch": 692} {"train_loss": -9.967597961425781, "global_step": 116297, "epoch": 692} {"train_loss": -10.089960098266602, "global_step": 116298, "epoch": 692} {"train_loss": -9.853242874145508, "global_step": 116299, "epoch": 692} {"train_loss": -10.062679290771484, "global_step": 116300, "epoch": 692} {"train_loss": -9.847028732299805, "global_step": 116301, "epoch": 692} {"train_loss": -9.730293273925781, "global_step": 116302, "epoch": 692} {"train_loss": -9.592910766601562, "global_step": 116303, "epoch": 692} {"train_loss": -10.310741424560547, "global_step": 116304, "epoch": 692} {"train_loss": -9.906850814819336, "global_step": 116305, "epoch": 692} {"train_loss": -9.871153831481934, "global_step": 116306, "epoch": 692} {"train_loss": -10.21345329284668, "global_step": 116307, "epoch": 692} {"train_loss": -9.941368103027344, "global_step": 116308, "epoch": 692} {"train_loss": -10.208478927612305, "global_step": 116309, "epoch": 692} {"train_loss": -10.250030517578125, "global_step": 116310, "epoch": 692} {"train_loss": -10.153339385986328, "global_step": 116311, "epoch": 692} {"train_loss": -10.148664474487305, "global_step": 116312, "epoch": 692} {"train_loss": -10.055368423461914, "global_step": 116313, "epoch": 692} {"train_loss": -9.826553344726562, "global_step": 116314, "epoch": 692} {"train_loss": -9.940092086791992, "global_step": 116315, "epoch": 692} {"train_loss": -9.535870552062988, "global_step": 116316, "epoch": 692} {"train_loss": -9.891077995300293, "global_step": 116317, "epoch": 692} {"train_loss": -9.642147064208984, "global_step": 116318, "epoch": 692} {"train_loss": -9.537518501281738, "global_step": 116319, "epoch": 692} {"train_loss": -10.171384811401367, "global_step": 116320, "epoch": 692} {"train_loss": -9.653305053710938, "global_step": 116321, "epoch": 692} {"train_loss": -9.610082626342773, "global_step": 116322, "epoch": 692} {"train_loss": -9.948131561279297, "global_step": 116323, "epoch": 692} {"train_loss": -9.357149124145508, "global_step": 116324, "epoch": 692} {"train_loss": -9.753860473632812, "global_step": 116325, "epoch": 692} {"train_loss": -10.165672302246094, "global_step": 116326, "epoch": 692} {"train_loss": -9.722221374511719, "global_step": 116327, "epoch": 692} {"train_loss": -10.006148338317871, "global_step": 116328, "epoch": 692} {"train_loss": -10.064943313598633, "global_step": 116329, "epoch": 692} {"train_loss": -9.987940788269043, "global_step": 116330, "epoch": 692} {"train_loss": -9.822225570678711, "global_step": 116331, "epoch": 692} {"train_loss": -10.177902221679688, "global_step": 116332, "epoch": 692} {"train_loss": -9.942742347717285, "global_step": 116333, "epoch": 692} {"train_loss": -9.76833724975586, "global_step": 116334, "epoch": 692} {"train_loss": -9.90304183959961, "global_step": 116335, "epoch": 692} {"train_loss": -9.876773834228516, "global_step": 116336, "epoch": 692} {"train_loss": -9.939004898071289, "global_step": 116337, "epoch": 692} {"train_loss": -9.847082138061523, "global_step": 116338, "epoch": 692} {"train_loss": -9.988493919372559, "global_step": 116339, "epoch": 692} {"train_loss": -9.616920471191406, "global_step": 116340, "epoch": 692} {"train_loss": -10.200519561767578, "global_step": 116341, "epoch": 692} {"train_loss": -10.048476219177246, "global_step": 116342, "epoch": 692} {"train_loss": -9.973551750183105, "global_step": 116343, "epoch": 692} {"train_loss": -10.225809097290039, "global_step": 116344, "epoch": 692} {"train_loss": -10.028345108032227, "global_step": 116345, "epoch": 692} {"train_loss": -10.040895462036133, "global_step": 116346, "epoch": 692} {"train_loss": -10.096839904785156, "global_step": 116347, "epoch": 692} {"train_loss": -9.924306869506836, "global_step": 116348, "epoch": 692} {"train_loss": -10.00589370727539, "global_step": 116349, "epoch": 692} {"train_loss": -10.35958480834961, "global_step": 116350, "epoch": 692} {"train_loss": -10.06816291809082, "global_step": 116351, "epoch": 692} {"train_loss": -10.252573013305664, "global_step": 116352, "epoch": 692} {"train_loss": -9.976043701171875, "global_step": 116353, "epoch": 692} {"train_loss": -10.159982681274414, "global_step": 116354, "epoch": 692} {"train_loss": -9.938150405883789, "global_step": 116355, "epoch": 692} {"train_loss": -10.179389953613281, "global_step": 116356, "epoch": 692} {"train_loss": -10.154036521911621, "global_step": 116357, "epoch": 692} {"train_loss": -10.210029602050781, "global_step": 116358, "epoch": 692} {"train_loss": -10.045156478881836, "global_step": 116359, "epoch": 692} {"train_loss": -10.173493385314941, "global_step": 116360, "epoch": 692} {"train_loss": -10.128629684448242, "global_step": 116361, "epoch": 692} {"train_loss": -10.070941925048828, "global_step": 116362, "epoch": 692} {"train_loss": -9.889753341674805, "global_step": 116363, "epoch": 692} {"train_loss": -9.756315231323242, "global_step": 116364, "epoch": 692} {"train_loss": -9.90678882598877, "global_step": 116365, "epoch": 692} {"train_loss": -9.881965637207031, "global_step": 116366, "epoch": 692} {"train_loss": -9.703743934631348, "global_step": 116367, "epoch": 692} {"train_loss": -10.175044059753418, "global_step": 116368, "epoch": 692} {"train_loss": -9.84317398071289, "global_step": 116369, "epoch": 692} {"train_loss": -10.136543273925781, "global_step": 116370, "epoch": 692} {"train_loss": -9.984663009643555, "global_step": 116371, "epoch": 692} {"train_loss": -10.044196128845215, "global_step": 116372, "epoch": 692} {"train_loss": -9.432594299316406, "global_step": 116373, "epoch": 692} {"train_loss": -9.780863761901855, "global_step": 116374, "epoch": 692} {"train_loss": -9.675543785095215, "global_step": 116375, "epoch": 692} {"train_loss": -9.470016479492188, "global_step": 116376, "epoch": 692} {"train_loss": -10.088418960571289, "global_step": 116377, "epoch": 692} {"train_loss": -9.275879859924316, "global_step": 116378, "epoch": 692} {"train_loss": -9.887165069580078, "global_step": 116379, "epoch": 692} {"train_loss": -9.26589584350586, "global_step": 116380, "epoch": 692} {"train_loss": -9.483962059020996, "global_step": 116381, "epoch": 692} {"train_loss": -9.59982681274414, "global_step": 116382, "epoch": 692} {"train_loss": -9.91685676574707, "global_step": 116383, "epoch": 692} {"train_loss": -9.741518020629883, "global_step": 116384, "epoch": 692} {"train_loss": -9.752670288085938, "global_step": 116385, "epoch": 692} {"train_loss": -10.139595031738281, "global_step": 116386, "epoch": 692} {"train_loss": -10.007211685180664, "global_step": 116387, "epoch": 692} {"train_loss": -9.871478080749512, "global_step": 116388, "epoch": 692} {"train_loss": -9.941380500793457, "global_step": 116389, "epoch": 692} {"train_loss": -9.92304801940918, "global_step": 116390, "epoch": 692} {"train_loss": -10.013062477111816, "global_step": 116391, "epoch": 692} {"train_loss": -10.090463638305664, "global_step": 116392, "epoch": 692} {"train_loss": -10.026296615600586, "global_step": 116393, "epoch": 692} {"train_loss": -10.017729759216309, "global_step": 116394, "epoch": 692} {"train_loss": -9.979911804199219, "global_step": 116395, "epoch": 692} {"train_loss": -10.102795600891113, "global_step": 116396, "epoch": 692} {"train_loss": -10.072346687316895, "global_step": 116397, "epoch": 692} {"train_loss": -9.990314483642578, "global_step": 116398, "epoch": 692} {"train_loss": -10.07113265991211, "global_step": 116399, "epoch": 692} {"train_loss": -10.145255088806152, "global_step": 116400, "epoch": 692} {"train_loss": -10.092500686645508, "global_step": 116401, "epoch": 692} {"train_loss": -10.142993927001953, "global_step": 116402, "epoch": 692} {"train_loss": -10.245457649230957, "global_step": 116403, "epoch": 692} {"train_loss": -10.364215850830078, "global_step": 116404, "epoch": 692} {"train_loss": -10.250158309936523, "global_step": 116405, "epoch": 692} {"train_loss": -10.284623146057129, "global_step": 116406, "epoch": 692} {"train_loss": -10.27526569366455, "global_step": 116407, "epoch": 692} {"train_loss": -10.29123592376709, "global_step": 116408, "epoch": 692} {"train_loss": -10.276865005493164, "global_step": 116409, "epoch": 692} {"train_loss": -10.062112808227539, "global_step": 116410, "epoch": 692} {"train_loss": -10.2722749710083, "global_step": 116411, "epoch": 692} {"train_loss": -10.244879722595215, "global_step": 116412, "epoch": 692} {"train_loss": -10.117658615112305, "global_step": 116413, "epoch": 692} {"train_loss": -9.989032745361328, "global_step": 116414, "epoch": 692} {"train_loss": -10.004329681396484, "global_step": 116415, "epoch": 692} {"train_loss": -9.96261215209961, "global_step": 116416, "epoch": 692} {"train_loss": -10.351709365844727, "global_step": 116417, "epoch": 692} {"train_loss": -9.811273574829102, "global_step": 116418, "epoch": 692} {"train_loss": -10.27472972869873, "global_step": 116419, "epoch": 692} {"train_loss": -10.092135429382324, "global_step": 116420, "epoch": 692} {"train_loss": -9.480975151062012, "global_step": 116421, "epoch": 692} {"train_loss": -10.003744125366211, "global_step": 116422, "epoch": 692} {"train_loss": -10.013309280077616, "global_step": 116423, "epoch": 692, "val_loss": 209518.6875} {"train_loss": -9.718774795532227, "global_step": 116424, "epoch": 693} {"train_loss": -10.076799392700195, "global_step": 116425, "epoch": 693} {"train_loss": -9.766175270080566, "global_step": 116426, "epoch": 693} {"train_loss": -10.088930130004883, "global_step": 116427, "epoch": 693} {"train_loss": -10.273517608642578, "global_step": 116428, "epoch": 693} {"train_loss": -9.702797889709473, "global_step": 116429, "epoch": 693} {"train_loss": -10.215564727783203, "global_step": 116430, "epoch": 693} {"train_loss": -10.163829803466797, "global_step": 116431, "epoch": 693} {"train_loss": -10.221637725830078, "global_step": 116432, "epoch": 693} {"train_loss": -10.165735244750977, "global_step": 116433, "epoch": 693} {"train_loss": -9.869711875915527, "global_step": 116434, "epoch": 693} {"train_loss": -10.149942398071289, "global_step": 116435, "epoch": 693} {"train_loss": -10.130316734313965, "global_step": 116436, "epoch": 693} {"train_loss": -10.00075912475586, "global_step": 116437, "epoch": 693} {"train_loss": -10.3302001953125, "global_step": 116438, "epoch": 693} {"train_loss": -10.136879920959473, "global_step": 116439, "epoch": 693} {"train_loss": -10.25416088104248, "global_step": 116440, "epoch": 693} {"train_loss": -10.11148452758789, "global_step": 116441, "epoch": 693} {"train_loss": -10.35368537902832, "global_step": 116442, "epoch": 693} {"train_loss": -9.825460433959961, "global_step": 116443, "epoch": 693} {"train_loss": -9.969791412353516, "global_step": 116444, "epoch": 693} {"train_loss": -10.167381286621094, "global_step": 116445, "epoch": 693} {"train_loss": -9.40155029296875, "global_step": 116446, "epoch": 693} {"train_loss": -10.203842163085938, "global_step": 116447, "epoch": 693} {"train_loss": -9.618597030639648, "global_step": 116448, "epoch": 693} {"train_loss": -9.777767181396484, "global_step": 116449, "epoch": 693} {"train_loss": -9.577064514160156, "global_step": 116450, "epoch": 693} {"train_loss": -9.602964401245117, "global_step": 116451, "epoch": 693} {"train_loss": -9.686542510986328, "global_step": 116452, "epoch": 693} {"train_loss": -9.798542022705078, "global_step": 116453, "epoch": 693} {"train_loss": -10.044839859008789, "global_step": 116454, "epoch": 693} {"train_loss": -9.737966537475586, "global_step": 116455, "epoch": 693} {"train_loss": -9.674090385437012, "global_step": 116456, "epoch": 693} {"train_loss": -9.91195297241211, "global_step": 116457, "epoch": 693} {"train_loss": -9.47659683227539, "global_step": 116458, "epoch": 693} {"train_loss": -9.942679405212402, "global_step": 116459, "epoch": 693} {"train_loss": -9.886646270751953, "global_step": 116460, "epoch": 693} {"train_loss": -9.50340461730957, "global_step": 116461, "epoch": 693} {"train_loss": -9.598344802856445, "global_step": 116462, "epoch": 693} {"train_loss": -9.988770484924316, "global_step": 116463, "epoch": 693} {"train_loss": -9.605062484741211, "global_step": 116464, "epoch": 693} {"train_loss": -9.782243728637695, "global_step": 116465, "epoch": 693} {"train_loss": -9.679306030273438, "global_step": 116466, "epoch": 693} {"train_loss": -9.934812545776367, "global_step": 116467, "epoch": 693} {"train_loss": -10.15290641784668, "global_step": 116468, "epoch": 693} {"train_loss": -9.833219528198242, "global_step": 116469, "epoch": 693} {"train_loss": -9.951611518859863, "global_step": 116470, "epoch": 693} {"train_loss": -9.893758773803711, "global_step": 116471, "epoch": 693} {"train_loss": -10.041153907775879, "global_step": 116472, "epoch": 693} {"train_loss": -10.140214920043945, "global_step": 116473, "epoch": 693} {"train_loss": -9.698164939880371, "global_step": 116474, "epoch": 693} {"train_loss": -10.275440216064453, "global_step": 116475, "epoch": 693} {"train_loss": -9.978950500488281, "global_step": 116476, "epoch": 693} {"train_loss": -10.106284141540527, "global_step": 116477, "epoch": 693} {"train_loss": -10.067768096923828, "global_step": 116478, "epoch": 693} {"train_loss": -9.911482810974121, "global_step": 116479, "epoch": 693} {"train_loss": -10.171126365661621, "global_step": 116480, "epoch": 693} {"train_loss": -10.121045112609863, "global_step": 116481, "epoch": 693} {"train_loss": -10.15099811553955, "global_step": 116482, "epoch": 693} {"train_loss": -10.101289749145508, "global_step": 116483, "epoch": 693} {"train_loss": -10.216787338256836, "global_step": 116484, "epoch": 693} {"train_loss": -10.344725608825684, "global_step": 116485, "epoch": 693} {"train_loss": -10.249810218811035, "global_step": 116486, "epoch": 693} {"train_loss": -10.234405517578125, "global_step": 116487, "epoch": 693} {"train_loss": -10.451056480407715, "global_step": 116488, "epoch": 693} {"train_loss": -10.337944030761719, "global_step": 116489, "epoch": 693} {"train_loss": -10.319792747497559, "global_step": 116490, "epoch": 693} {"train_loss": -10.197940826416016, "global_step": 116491, "epoch": 693} {"train_loss": -10.355489730834961, "global_step": 116492, "epoch": 693} {"train_loss": -10.32902717590332, "global_step": 116493, "epoch": 693} {"train_loss": -10.589338302612305, "global_step": 116494, "epoch": 693} {"train_loss": -10.3096284866333, "global_step": 116495, "epoch": 693} {"train_loss": -10.292622566223145, "global_step": 116496, "epoch": 693} {"train_loss": -10.253732681274414, "global_step": 116497, "epoch": 693} {"train_loss": -10.094633102416992, "global_step": 116498, "epoch": 693} {"train_loss": -10.512468338012695, "global_step": 116499, "epoch": 693} {"train_loss": -10.134198188781738, "global_step": 116500, "epoch": 693} {"train_loss": -10.4044189453125, "global_step": 116501, "epoch": 693} {"train_loss": -10.240968704223633, "global_step": 116502, "epoch": 693} {"train_loss": -10.600870132446289, "global_step": 116503, "epoch": 693} {"train_loss": -10.420625686645508, "global_step": 116504, "epoch": 693} {"train_loss": -10.460295677185059, "global_step": 116505, "epoch": 693} {"train_loss": -10.40474796295166, "global_step": 116506, "epoch": 693} {"train_loss": -10.425294876098633, "global_step": 116507, "epoch": 693} {"train_loss": -10.432184219360352, "global_step": 116508, "epoch": 693} {"train_loss": -10.368681907653809, "global_step": 116509, "epoch": 693} {"train_loss": -10.605031967163086, "global_step": 116510, "epoch": 693} {"train_loss": -10.08755111694336, "global_step": 116511, "epoch": 693} {"train_loss": -10.140833854675293, "global_step": 116512, "epoch": 693} {"train_loss": -10.045831680297852, "global_step": 116513, "epoch": 693} {"train_loss": -9.637629508972168, "global_step": 116514, "epoch": 693} {"train_loss": -9.427153587341309, "global_step": 116515, "epoch": 693} {"train_loss": -9.879007339477539, "global_step": 116516, "epoch": 693} {"train_loss": -9.44322395324707, "global_step": 116517, "epoch": 693} {"train_loss": -8.50912857055664, "global_step": 116518, "epoch": 693} {"train_loss": -9.5538969039917, "global_step": 116519, "epoch": 693} {"train_loss": -7.345682621002197, "global_step": 116520, "epoch": 693} {"train_loss": -9.929895401000977, "global_step": 116521, "epoch": 693} {"train_loss": -9.023266792297363, "global_step": 116522, "epoch": 693} {"train_loss": -9.776679992675781, "global_step": 116523, "epoch": 693} {"train_loss": -8.619186401367188, "global_step": 116524, "epoch": 693} {"train_loss": -9.65933609008789, "global_step": 116525, "epoch": 693} {"train_loss": -9.041688919067383, "global_step": 116526, "epoch": 693} {"train_loss": -9.478803634643555, "global_step": 116527, "epoch": 693} {"train_loss": -9.230596542358398, "global_step": 116528, "epoch": 693} {"train_loss": -9.798273086547852, "global_step": 116529, "epoch": 693} {"train_loss": -9.42238998413086, "global_step": 116530, "epoch": 693} {"train_loss": -9.436931610107422, "global_step": 116531, "epoch": 693} {"train_loss": -9.930309295654297, "global_step": 116532, "epoch": 693} {"train_loss": -9.445497512817383, "global_step": 116533, "epoch": 693} {"train_loss": -9.808411598205566, "global_step": 116534, "epoch": 693} {"train_loss": -9.75294303894043, "global_step": 116535, "epoch": 693} {"train_loss": -9.739234924316406, "global_step": 116536, "epoch": 693} {"train_loss": -9.659050941467285, "global_step": 116537, "epoch": 693} {"train_loss": -9.736825942993164, "global_step": 116538, "epoch": 693} {"train_loss": -9.936978340148926, "global_step": 116539, "epoch": 693} {"train_loss": -9.591115951538086, "global_step": 116540, "epoch": 693} {"train_loss": -9.797370910644531, "global_step": 116541, "epoch": 693} {"train_loss": -9.80221939086914, "global_step": 116542, "epoch": 693} {"train_loss": -9.766672134399414, "global_step": 116543, "epoch": 693} {"train_loss": -9.790674209594727, "global_step": 116544, "epoch": 693} {"train_loss": -9.972843170166016, "global_step": 116545, "epoch": 693} {"train_loss": -9.781810760498047, "global_step": 116546, "epoch": 693} {"train_loss": -9.983026504516602, "global_step": 116547, "epoch": 693} {"train_loss": -9.817604064941406, "global_step": 116548, "epoch": 693} {"train_loss": -9.877243995666504, "global_step": 116549, "epoch": 693} {"train_loss": -9.963787078857422, "global_step": 116550, "epoch": 693} {"train_loss": -10.024107933044434, "global_step": 116551, "epoch": 693} {"train_loss": -9.974630355834961, "global_step": 116552, "epoch": 693} {"train_loss": -9.977258682250977, "global_step": 116553, "epoch": 693} {"train_loss": -10.048928260803223, "global_step": 116554, "epoch": 693} {"train_loss": -10.246847152709961, "global_step": 116555, "epoch": 693} {"train_loss": -9.987006187438965, "global_step": 116556, "epoch": 693} {"train_loss": -10.074592590332031, "global_step": 116557, "epoch": 693} {"train_loss": -10.07727336883545, "global_step": 116558, "epoch": 693} {"train_loss": -10.278251647949219, "global_step": 116559, "epoch": 693} {"train_loss": -10.01755142211914, "global_step": 116560, "epoch": 693} {"train_loss": -10.185182571411133, "global_step": 116561, "epoch": 693} {"train_loss": -10.142091751098633, "global_step": 116562, "epoch": 693} {"train_loss": -10.029062271118164, "global_step": 116563, "epoch": 693} {"train_loss": -10.170838356018066, "global_step": 116564, "epoch": 693} {"train_loss": -10.18120002746582, "global_step": 116565, "epoch": 693} {"train_loss": -10.14707088470459, "global_step": 116566, "epoch": 693} {"train_loss": -10.08559799194336, "global_step": 116567, "epoch": 693} {"train_loss": -10.436514854431152, "global_step": 116568, "epoch": 693} {"train_loss": -10.341211318969727, "global_step": 116569, "epoch": 693} {"train_loss": -10.33405876159668, "global_step": 116570, "epoch": 693} {"train_loss": -10.281445503234863, "global_step": 116571, "epoch": 693} {"train_loss": -10.025168418884277, "global_step": 116572, "epoch": 693} {"train_loss": -10.540655136108398, "global_step": 116573, "epoch": 693} {"train_loss": -10.421121597290039, "global_step": 116574, "epoch": 693} {"train_loss": -10.386357307434082, "global_step": 116575, "epoch": 693} {"train_loss": -10.413158416748047, "global_step": 116576, "epoch": 693} {"train_loss": -10.32751750946045, "global_step": 116577, "epoch": 693} {"train_loss": -10.049882888793945, "global_step": 116578, "epoch": 693} {"train_loss": -10.526666641235352, "global_step": 116579, "epoch": 693} {"train_loss": -10.112628936767578, "global_step": 116580, "epoch": 693} {"train_loss": -10.244710922241211, "global_step": 116581, "epoch": 693} {"train_loss": -9.61668586730957, "global_step": 116582, "epoch": 693} {"train_loss": -9.573493957519531, "global_step": 116583, "epoch": 693} {"train_loss": -9.893512725830078, "global_step": 116584, "epoch": 693} {"train_loss": -9.357367515563965, "global_step": 116585, "epoch": 693} {"train_loss": -9.825199127197266, "global_step": 116586, "epoch": 693} {"train_loss": -9.856979370117188, "global_step": 116587, "epoch": 693} {"train_loss": -9.1300687789917, "global_step": 116588, "epoch": 693} {"train_loss": -10.122539520263672, "global_step": 116589, "epoch": 693} {"train_loss": -9.907571792602539, "global_step": 116590, "epoch": 693} {"train_loss": -9.959102446124668, "global_step": 116591, "epoch": 693, "val_loss": 212425.546875} {"train_loss": -9.882987976074219, "global_step": 116592, "epoch": 694} {"train_loss": -9.693276405334473, "global_step": 116593, "epoch": 694} {"train_loss": -9.780681610107422, "global_step": 116594, "epoch": 694} {"train_loss": -9.662927627563477, "global_step": 116595, "epoch": 694} {"train_loss": -9.783754348754883, "global_step": 116596, "epoch": 694} {"train_loss": -9.54909896850586, "global_step": 116597, "epoch": 694} {"train_loss": -9.904745101928711, "global_step": 116598, "epoch": 694} {"train_loss": -9.50875186920166, "global_step": 116599, "epoch": 694} {"train_loss": -9.213203430175781, "global_step": 116600, "epoch": 694} {"train_loss": -9.951090812683105, "global_step": 116601, "epoch": 694} {"train_loss": -9.405486106872559, "global_step": 116602, "epoch": 694} {"train_loss": -9.601170539855957, "global_step": 116603, "epoch": 694} {"train_loss": -9.560846328735352, "global_step": 116604, "epoch": 694} {"train_loss": -9.956110954284668, "global_step": 116605, "epoch": 694} {"train_loss": -9.412778854370117, "global_step": 116606, "epoch": 694} {"train_loss": -9.96501636505127, "global_step": 116607, "epoch": 694} {"train_loss": -9.778421401977539, "global_step": 116608, "epoch": 694} {"train_loss": -9.865766525268555, "global_step": 116609, "epoch": 694} {"train_loss": -9.586109161376953, "global_step": 116610, "epoch": 694} {"train_loss": -9.841060638427734, "global_step": 116611, "epoch": 694} {"train_loss": -9.694474220275879, "global_step": 116612, "epoch": 694} {"train_loss": -9.902328491210938, "global_step": 116613, "epoch": 694} {"train_loss": -10.009830474853516, "global_step": 116614, "epoch": 694} {"train_loss": -9.887569427490234, "global_step": 116615, "epoch": 694} {"train_loss": -9.983137130737305, "global_step": 116616, "epoch": 694} {"train_loss": -10.209114074707031, "global_step": 116617, "epoch": 694} {"train_loss": -9.798806190490723, "global_step": 116618, "epoch": 694} {"train_loss": -9.99458122253418, "global_step": 116619, "epoch": 694} {"train_loss": -9.959230422973633, "global_step": 116620, "epoch": 694} {"train_loss": -10.043150901794434, "global_step": 116621, "epoch": 694} {"train_loss": -10.08291244506836, "global_step": 116622, "epoch": 694} {"train_loss": -10.070867538452148, "global_step": 116623, "epoch": 694} {"train_loss": -9.786985397338867, "global_step": 116624, "epoch": 694} {"train_loss": -10.015889167785645, "global_step": 116625, "epoch": 694} {"train_loss": -10.187047958374023, "global_step": 116626, "epoch": 694} {"train_loss": -10.070756912231445, "global_step": 116627, "epoch": 694} {"train_loss": -10.00122356414795, "global_step": 116628, "epoch": 694} {"train_loss": -9.999923706054688, "global_step": 116629, "epoch": 694} {"train_loss": -10.00649642944336, "global_step": 116630, "epoch": 694} {"train_loss": -10.157655715942383, "global_step": 116631, "epoch": 694} {"train_loss": -10.122511863708496, "global_step": 116632, "epoch": 694} {"train_loss": -10.042506217956543, "global_step": 116633, "epoch": 694} {"train_loss": -9.828964233398438, "global_step": 116634, "epoch": 694} {"train_loss": -10.171656608581543, "global_step": 116635, "epoch": 694} {"train_loss": -10.341733932495117, "global_step": 116636, "epoch": 694} {"train_loss": -9.958839416503906, "global_step": 116637, "epoch": 694} {"train_loss": -10.133420944213867, "global_step": 116638, "epoch": 694} {"train_loss": -10.08348274230957, "global_step": 116639, "epoch": 694} {"train_loss": -10.227992057800293, "global_step": 116640, "epoch": 694} {"train_loss": -9.94999885559082, "global_step": 116641, "epoch": 694} {"train_loss": -10.271778106689453, "global_step": 116642, "epoch": 694} {"train_loss": -10.142154693603516, "global_step": 116643, "epoch": 694} {"train_loss": -10.263788223266602, "global_step": 116644, "epoch": 694} {"train_loss": -10.077369689941406, "global_step": 116645, "epoch": 694} {"train_loss": -9.869099617004395, "global_step": 116646, "epoch": 694} {"train_loss": -10.00493049621582, "global_step": 116647, "epoch": 694} {"train_loss": -9.80398178100586, "global_step": 116648, "epoch": 694} {"train_loss": -10.135717391967773, "global_step": 116649, "epoch": 694} {"train_loss": -10.223543167114258, "global_step": 116650, "epoch": 694} {"train_loss": -10.263137817382812, "global_step": 116651, "epoch": 694} {"train_loss": -10.324718475341797, "global_step": 116652, "epoch": 694} {"train_loss": -10.092402458190918, "global_step": 116653, "epoch": 694} {"train_loss": -10.071329116821289, "global_step": 116654, "epoch": 694} {"train_loss": -10.03726577758789, "global_step": 116655, "epoch": 694} {"train_loss": -10.067449569702148, "global_step": 116656, "epoch": 694} {"train_loss": -10.100824356079102, "global_step": 116657, "epoch": 694} {"train_loss": -10.123787879943848, "global_step": 116658, "epoch": 694} {"train_loss": -10.259434700012207, "global_step": 116659, "epoch": 694} {"train_loss": -10.049946784973145, "global_step": 116660, "epoch": 694} {"train_loss": -10.378110885620117, "global_step": 116661, "epoch": 694} {"train_loss": -10.162343978881836, "global_step": 116662, "epoch": 694} {"train_loss": -10.328706741333008, "global_step": 116663, "epoch": 694} {"train_loss": -10.094154357910156, "global_step": 116664, "epoch": 694} {"train_loss": -10.207411766052246, "global_step": 116665, "epoch": 694} {"train_loss": -10.274073600769043, "global_step": 116666, "epoch": 694} {"train_loss": -10.382336616516113, "global_step": 116667, "epoch": 694} {"train_loss": -10.161296844482422, "global_step": 116668, "epoch": 694} {"train_loss": -10.160444259643555, "global_step": 116669, "epoch": 694} {"train_loss": -10.019108772277832, "global_step": 116670, "epoch": 694} {"train_loss": -10.309541702270508, "global_step": 116671, "epoch": 694} {"train_loss": -9.839972496032715, "global_step": 116672, "epoch": 694} {"train_loss": -9.794405937194824, "global_step": 116673, "epoch": 694} {"train_loss": -10.144842147827148, "global_step": 116674, "epoch": 694} {"train_loss": -10.034219741821289, "global_step": 116675, "epoch": 694} {"train_loss": -10.383892059326172, "global_step": 116676, "epoch": 694} {"train_loss": -9.847111701965332, "global_step": 116677, "epoch": 694} {"train_loss": -10.139580726623535, "global_step": 116678, "epoch": 694} {"train_loss": -9.985389709472656, "global_step": 116679, "epoch": 694} {"train_loss": -10.114688873291016, "global_step": 116680, "epoch": 694} {"train_loss": -9.83456039428711, "global_step": 116681, "epoch": 694} {"train_loss": -9.787639617919922, "global_step": 116682, "epoch": 694} {"train_loss": -9.752446174621582, "global_step": 116683, "epoch": 694} {"train_loss": -10.069486618041992, "global_step": 116684, "epoch": 694} {"train_loss": -10.142373085021973, "global_step": 116685, "epoch": 694} {"train_loss": -10.339529037475586, "global_step": 116686, "epoch": 694} {"train_loss": -10.252326011657715, "global_step": 116687, "epoch": 694} {"train_loss": -9.94244384765625, "global_step": 116688, "epoch": 694} {"train_loss": -10.338371276855469, "global_step": 116689, "epoch": 694} {"train_loss": -9.956841468811035, "global_step": 116690, "epoch": 694} {"train_loss": -10.29234790802002, "global_step": 116691, "epoch": 694} {"train_loss": -10.112567901611328, "global_step": 116692, "epoch": 694} {"train_loss": -9.953266143798828, "global_step": 116693, "epoch": 694} {"train_loss": -10.111541748046875, "global_step": 116694, "epoch": 694} {"train_loss": -10.210046768188477, "global_step": 116695, "epoch": 694} {"train_loss": -10.13428020477295, "global_step": 116696, "epoch": 694} {"train_loss": -9.87529182434082, "global_step": 116697, "epoch": 694} {"train_loss": -10.35061264038086, "global_step": 116698, "epoch": 694} {"train_loss": -10.05124282836914, "global_step": 116699, "epoch": 694} {"train_loss": -10.459134101867676, "global_step": 116700, "epoch": 694} {"train_loss": -9.886699676513672, "global_step": 116701, "epoch": 694} {"train_loss": -10.170537948608398, "global_step": 116702, "epoch": 694} {"train_loss": -10.159236907958984, "global_step": 116703, "epoch": 694} {"train_loss": -9.922830581665039, "global_step": 116704, "epoch": 694} {"train_loss": -10.055216789245605, "global_step": 116705, "epoch": 694} {"train_loss": -10.05040168762207, "global_step": 116706, "epoch": 694} {"train_loss": -10.234140396118164, "global_step": 116707, "epoch": 694} {"train_loss": -9.76030158996582, "global_step": 116708, "epoch": 694} {"train_loss": -10.180509567260742, "global_step": 116709, "epoch": 694} {"train_loss": -10.151127815246582, "global_step": 116710, "epoch": 694} {"train_loss": -9.85860824584961, "global_step": 116711, "epoch": 694} {"train_loss": -9.98509407043457, "global_step": 116712, "epoch": 694} {"train_loss": -9.834526062011719, "global_step": 116713, "epoch": 694} {"train_loss": -9.917322158813477, "global_step": 116714, "epoch": 694} {"train_loss": -10.229177474975586, "global_step": 116715, "epoch": 694} {"train_loss": -9.739567756652832, "global_step": 116716, "epoch": 694} {"train_loss": -10.358322143554688, "global_step": 116717, "epoch": 694} {"train_loss": -10.13072395324707, "global_step": 116718, "epoch": 694} {"train_loss": -9.84527587890625, "global_step": 116719, "epoch": 694} {"train_loss": -10.327337265014648, "global_step": 116720, "epoch": 694} {"train_loss": -9.944284439086914, "global_step": 116721, "epoch": 694} {"train_loss": -10.348562240600586, "global_step": 116722, "epoch": 694} {"train_loss": -10.1483154296875, "global_step": 116723, "epoch": 694} {"train_loss": -10.0736083984375, "global_step": 116724, "epoch": 694} {"train_loss": -10.12625789642334, "global_step": 116725, "epoch": 694} {"train_loss": -10.398688316345215, "global_step": 116726, "epoch": 694} {"train_loss": -10.36494255065918, "global_step": 116727, "epoch": 694} {"train_loss": -10.222923278808594, "global_step": 116728, "epoch": 694} {"train_loss": -10.32174015045166, "global_step": 116729, "epoch": 694} {"train_loss": -10.14299488067627, "global_step": 116730, "epoch": 694} {"train_loss": -10.228776931762695, "global_step": 116731, "epoch": 694} {"train_loss": -10.087780952453613, "global_step": 116732, "epoch": 694} {"train_loss": -10.069845199584961, "global_step": 116733, "epoch": 694} {"train_loss": -9.85003662109375, "global_step": 116734, "epoch": 694} {"train_loss": -9.985492706298828, "global_step": 116735, "epoch": 694} {"train_loss": -10.085323333740234, "global_step": 116736, "epoch": 694} {"train_loss": -10.12272834777832, "global_step": 116737, "epoch": 694} {"train_loss": -10.060336112976074, "global_step": 116738, "epoch": 694} {"train_loss": -10.04393196105957, "global_step": 116739, "epoch": 694} {"train_loss": -10.225703239440918, "global_step": 116740, "epoch": 694} {"train_loss": -10.195657730102539, "global_step": 116741, "epoch": 694} {"train_loss": -10.09015941619873, "global_step": 116742, "epoch": 694} {"train_loss": -10.036176681518555, "global_step": 116743, "epoch": 694} {"train_loss": -10.204212188720703, "global_step": 116744, "epoch": 694} {"train_loss": -9.836092948913574, "global_step": 116745, "epoch": 694} {"train_loss": -10.309574127197266, "global_step": 116746, "epoch": 694} {"train_loss": -10.037607192993164, "global_step": 116747, "epoch": 694} {"train_loss": -10.121180534362793, "global_step": 116748, "epoch": 694} {"train_loss": -9.819755554199219, "global_step": 116749, "epoch": 694} {"train_loss": -9.966506958007812, "global_step": 116750, "epoch": 694} {"train_loss": -10.026158332824707, "global_step": 116751, "epoch": 694} {"train_loss": -9.959493637084961, "global_step": 116752, "epoch": 694} {"train_loss": -9.864461898803711, "global_step": 116753, "epoch": 694} {"train_loss": -10.004368782043457, "global_step": 116754, "epoch": 694} {"train_loss": -10.096891403198242, "global_step": 116755, "epoch": 694} {"train_loss": -10.081318855285645, "global_step": 116756, "epoch": 694} {"train_loss": -9.521592140197754, "global_step": 116757, "epoch": 694} {"train_loss": -10.095890045166016, "global_step": 116758, "epoch": 694} {"train_loss": -10.033863147099813, "global_step": 116759, "epoch": 694, "val_loss": 212742.34375} {"train_loss": -9.946329116821289, "global_step": 116760, "epoch": 695} {"train_loss": -10.167749404907227, "global_step": 116761, "epoch": 695} {"train_loss": -9.599915504455566, "global_step": 116762, "epoch": 695} {"train_loss": -9.951860427856445, "global_step": 116763, "epoch": 695} {"train_loss": -10.205528259277344, "global_step": 116764, "epoch": 695} {"train_loss": -9.996183395385742, "global_step": 116765, "epoch": 695} {"train_loss": -9.966913223266602, "global_step": 116766, "epoch": 695} {"train_loss": -10.17989444732666, "global_step": 116767, "epoch": 695} {"train_loss": -9.799681663513184, "global_step": 116768, "epoch": 695} {"train_loss": -9.93447208404541, "global_step": 116769, "epoch": 695} {"train_loss": -9.754720687866211, "global_step": 116770, "epoch": 695} {"train_loss": -9.805206298828125, "global_step": 116771, "epoch": 695} {"train_loss": -9.859151840209961, "global_step": 116772, "epoch": 695} {"train_loss": -9.983646392822266, "global_step": 116773, "epoch": 695} {"train_loss": -10.00722599029541, "global_step": 116774, "epoch": 695} {"train_loss": -10.048955917358398, "global_step": 116775, "epoch": 695} {"train_loss": -9.998297691345215, "global_step": 116776, "epoch": 695} {"train_loss": -9.967531204223633, "global_step": 116777, "epoch": 695} {"train_loss": -10.021661758422852, "global_step": 116778, "epoch": 695} {"train_loss": -9.972618103027344, "global_step": 116779, "epoch": 695} {"train_loss": -9.59428596496582, "global_step": 116780, "epoch": 695} {"train_loss": -10.076467514038086, "global_step": 116781, "epoch": 695} {"train_loss": -9.660781860351562, "global_step": 116782, "epoch": 695} {"train_loss": -10.168703079223633, "global_step": 116783, "epoch": 695} {"train_loss": -9.998761177062988, "global_step": 116784, "epoch": 695} {"train_loss": -9.833781242370605, "global_step": 116785, "epoch": 695} {"train_loss": -10.071325302124023, "global_step": 116786, "epoch": 695} {"train_loss": -10.012672424316406, "global_step": 116787, "epoch": 695} {"train_loss": -9.890298843383789, "global_step": 116788, "epoch": 695} {"train_loss": -9.846532821655273, "global_step": 116789, "epoch": 695} {"train_loss": -9.937686920166016, "global_step": 116790, "epoch": 695} {"train_loss": -10.057785034179688, "global_step": 116791, "epoch": 695} {"train_loss": -9.687017440795898, "global_step": 116792, "epoch": 695} {"train_loss": -9.78181266784668, "global_step": 116793, "epoch": 695} {"train_loss": -9.946876525878906, "global_step": 116794, "epoch": 695} {"train_loss": -9.496694564819336, "global_step": 116795, "epoch": 695} {"train_loss": -10.033744812011719, "global_step": 116796, "epoch": 695} {"train_loss": -9.599157333374023, "global_step": 116797, "epoch": 695} {"train_loss": -9.342873573303223, "global_step": 116798, "epoch": 695} {"train_loss": -10.034709930419922, "global_step": 116799, "epoch": 695} {"train_loss": -9.863166809082031, "global_step": 116800, "epoch": 695} {"train_loss": -9.838159561157227, "global_step": 116801, "epoch": 695} {"train_loss": -10.037391662597656, "global_step": 116802, "epoch": 695} {"train_loss": -9.73930549621582, "global_step": 116803, "epoch": 695} {"train_loss": -9.899396896362305, "global_step": 116804, "epoch": 695} {"train_loss": -9.922182083129883, "global_step": 116805, "epoch": 695} {"train_loss": -10.110565185546875, "global_step": 116806, "epoch": 695} {"train_loss": -9.779828071594238, "global_step": 116807, "epoch": 695} {"train_loss": -10.115080833435059, "global_step": 116808, "epoch": 695} {"train_loss": -9.518529891967773, "global_step": 116809, "epoch": 695} {"train_loss": -10.210926055908203, "global_step": 116810, "epoch": 695} {"train_loss": -9.799309730529785, "global_step": 116811, "epoch": 695} {"train_loss": -9.93290901184082, "global_step": 116812, "epoch": 695} {"train_loss": -9.763416290283203, "global_step": 116813, "epoch": 695} {"train_loss": -9.799964904785156, "global_step": 116814, "epoch": 695} {"train_loss": -9.630247116088867, "global_step": 116815, "epoch": 695} {"train_loss": -9.968348503112793, "global_step": 116816, "epoch": 695} {"train_loss": -9.891927719116211, "global_step": 116817, "epoch": 695} {"train_loss": -9.707524299621582, "global_step": 116818, "epoch": 695} {"train_loss": -10.121625900268555, "global_step": 116819, "epoch": 695} {"train_loss": -9.860177040100098, "global_step": 116820, "epoch": 695} {"train_loss": -9.974174499511719, "global_step": 116821, "epoch": 695} {"train_loss": -10.124310493469238, "global_step": 116822, "epoch": 695} {"train_loss": -9.825762748718262, "global_step": 116823, "epoch": 695} {"train_loss": -10.172262191772461, "global_step": 116824, "epoch": 695} {"train_loss": -10.099991798400879, "global_step": 116825, "epoch": 695} {"train_loss": -10.04571533203125, "global_step": 116826, "epoch": 695} {"train_loss": -10.180536270141602, "global_step": 116827, "epoch": 695} {"train_loss": -10.033378601074219, "global_step": 116828, "epoch": 695} {"train_loss": -10.320223808288574, "global_step": 116829, "epoch": 695} {"train_loss": -10.034444808959961, "global_step": 116830, "epoch": 695} {"train_loss": -10.327500343322754, "global_step": 116831, "epoch": 695} {"train_loss": -10.199110984802246, "global_step": 116832, "epoch": 695} {"train_loss": -10.104691505432129, "global_step": 116833, "epoch": 695} {"train_loss": -10.200862884521484, "global_step": 116834, "epoch": 695} {"train_loss": -10.177854537963867, "global_step": 116835, "epoch": 695} {"train_loss": -10.25387954711914, "global_step": 116836, "epoch": 695} {"train_loss": -10.134052276611328, "global_step": 116837, "epoch": 695} {"train_loss": -10.230842590332031, "global_step": 116838, "epoch": 695} {"train_loss": -10.081751823425293, "global_step": 116839, "epoch": 695} {"train_loss": -10.444330215454102, "global_step": 116840, "epoch": 695} {"train_loss": -10.205907821655273, "global_step": 116841, "epoch": 695} {"train_loss": -10.214780807495117, "global_step": 116842, "epoch": 695} {"train_loss": -10.119547843933105, "global_step": 116843, "epoch": 695} {"train_loss": -10.219904899597168, "global_step": 116844, "epoch": 695} {"train_loss": -10.365558624267578, "global_step": 116845, "epoch": 695} {"train_loss": -10.171709060668945, "global_step": 116846, "epoch": 695} {"train_loss": -9.983587265014648, "global_step": 116847, "epoch": 695} {"train_loss": -9.939260482788086, "global_step": 116848, "epoch": 695} {"train_loss": -9.802154541015625, "global_step": 116849, "epoch": 695} {"train_loss": -9.94400691986084, "global_step": 116850, "epoch": 695} {"train_loss": -10.07070255279541, "global_step": 116851, "epoch": 695} {"train_loss": -9.883811950683594, "global_step": 116852, "epoch": 695} {"train_loss": -9.754426956176758, "global_step": 116853, "epoch": 695} {"train_loss": -9.684858322143555, "global_step": 116854, "epoch": 695} {"train_loss": -10.20816707611084, "global_step": 116855, "epoch": 695} {"train_loss": -9.664290428161621, "global_step": 116856, "epoch": 695} {"train_loss": -10.241886138916016, "global_step": 116857, "epoch": 695} {"train_loss": -10.22760009765625, "global_step": 116858, "epoch": 695} {"train_loss": -9.677271842956543, "global_step": 116859, "epoch": 695} {"train_loss": -10.293455123901367, "global_step": 116860, "epoch": 695} {"train_loss": -9.782196044921875, "global_step": 116861, "epoch": 695} {"train_loss": -10.084001541137695, "global_step": 116862, "epoch": 695} {"train_loss": -10.032000541687012, "global_step": 116863, "epoch": 695} {"train_loss": -9.964641571044922, "global_step": 116864, "epoch": 695} {"train_loss": -10.192063331604004, "global_step": 116865, "epoch": 695} {"train_loss": -10.176230430603027, "global_step": 116866, "epoch": 695} {"train_loss": -10.092625617980957, "global_step": 116867, "epoch": 695} {"train_loss": -10.165048599243164, "global_step": 116868, "epoch": 695} {"train_loss": -10.160608291625977, "global_step": 116869, "epoch": 695} {"train_loss": -9.75108528137207, "global_step": 116870, "epoch": 695} {"train_loss": -9.934069633483887, "global_step": 116871, "epoch": 695} {"train_loss": -9.725325584411621, "global_step": 116872, "epoch": 695} {"train_loss": -10.122798919677734, "global_step": 116873, "epoch": 695} {"train_loss": -10.042520523071289, "global_step": 116874, "epoch": 695} {"train_loss": -9.982187271118164, "global_step": 116875, "epoch": 695} {"train_loss": -9.71096420288086, "global_step": 116876, "epoch": 695} {"train_loss": -9.845821380615234, "global_step": 116877, "epoch": 695} {"train_loss": -10.006254196166992, "global_step": 116878, "epoch": 695} {"train_loss": -9.698744773864746, "global_step": 116879, "epoch": 695} {"train_loss": -10.257040023803711, "global_step": 116880, "epoch": 695} {"train_loss": -9.795428276062012, "global_step": 116881, "epoch": 695} {"train_loss": -9.809713363647461, "global_step": 116882, "epoch": 695} {"train_loss": -9.917071342468262, "global_step": 116883, "epoch": 695} {"train_loss": -9.71492862701416, "global_step": 116884, "epoch": 695} {"train_loss": -10.114578247070312, "global_step": 116885, "epoch": 695} {"train_loss": -9.822271347045898, "global_step": 116886, "epoch": 695} {"train_loss": -9.896249771118164, "global_step": 116887, "epoch": 695} {"train_loss": -9.842844009399414, "global_step": 116888, "epoch": 695} {"train_loss": -9.902740478515625, "global_step": 116889, "epoch": 695} {"train_loss": -10.040536880493164, "global_step": 116890, "epoch": 695} {"train_loss": -9.737838745117188, "global_step": 116891, "epoch": 695} {"train_loss": -10.13193130493164, "global_step": 116892, "epoch": 695} {"train_loss": -10.010793685913086, "global_step": 116893, "epoch": 695} {"train_loss": -10.211475372314453, "global_step": 116894, "epoch": 695} {"train_loss": -10.18021011352539, "global_step": 116895, "epoch": 695} {"train_loss": -9.73719596862793, "global_step": 116896, "epoch": 695} {"train_loss": -10.127274513244629, "global_step": 116897, "epoch": 695} {"train_loss": -9.703868865966797, "global_step": 116898, "epoch": 695} {"train_loss": -9.96894645690918, "global_step": 116899, "epoch": 695} {"train_loss": -9.882121086120605, "global_step": 116900, "epoch": 695} {"train_loss": -9.865121841430664, "global_step": 116901, "epoch": 695} {"train_loss": -9.652360916137695, "global_step": 116902, "epoch": 695} {"train_loss": -10.081417083740234, "global_step": 116903, "epoch": 695} {"train_loss": -10.004491806030273, "global_step": 116904, "epoch": 695} {"train_loss": -10.04472541809082, "global_step": 116905, "epoch": 695} {"train_loss": -10.077656745910645, "global_step": 116906, "epoch": 695} {"train_loss": -9.997013092041016, "global_step": 116907, "epoch": 695} {"train_loss": -10.174436569213867, "global_step": 116908, "epoch": 695} {"train_loss": -10.25689697265625, "global_step": 116909, "epoch": 695} {"train_loss": -9.828672409057617, "global_step": 116910, "epoch": 695} {"train_loss": -10.245861053466797, "global_step": 116911, "epoch": 695} {"train_loss": -10.184816360473633, "global_step": 116912, "epoch": 695} {"train_loss": -10.268461227416992, "global_step": 116913, "epoch": 695} {"train_loss": -10.083065032958984, "global_step": 116914, "epoch": 695} {"train_loss": -10.475175857543945, "global_step": 116915, "epoch": 695} {"train_loss": -10.177599906921387, "global_step": 116916, "epoch": 695} {"train_loss": -10.34164810180664, "global_step": 116917, "epoch": 695} {"train_loss": -10.14244270324707, "global_step": 116918, "epoch": 695} {"train_loss": -10.189114570617676, "global_step": 116919, "epoch": 695} {"train_loss": -10.094714164733887, "global_step": 116920, "epoch": 695} {"train_loss": -10.307641983032227, "global_step": 116921, "epoch": 695} {"train_loss": -10.21455192565918, "global_step": 116922, "epoch": 695} {"train_loss": -10.129096984863281, "global_step": 116923, "epoch": 695} {"train_loss": -10.11451530456543, "global_step": 116924, "epoch": 695} {"train_loss": -10.353599548339844, "global_step": 116925, "epoch": 695} {"train_loss": -10.196441650390625, "global_step": 116926, "epoch": 695} {"train_loss": -9.993521781194778, "global_step": 116927, "epoch": 695, "val_loss": 213173.4375, "train_action_mse_error": 1.695832371711731} {"train_loss": -10.095529556274414, "global_step": 116928, "epoch": 696} {"train_loss": -10.443513870239258, "global_step": 116929, "epoch": 696} {"train_loss": -10.141977310180664, "global_step": 116930, "epoch": 696} {"train_loss": -10.57321548461914, "global_step": 116931, "epoch": 696} {"train_loss": -10.306974411010742, "global_step": 116932, "epoch": 696} {"train_loss": -10.322751998901367, "global_step": 116933, "epoch": 696} {"train_loss": -10.307594299316406, "global_step": 116934, "epoch": 696} {"train_loss": -10.282516479492188, "global_step": 116935, "epoch": 696} {"train_loss": -10.266336441040039, "global_step": 116936, "epoch": 696} {"train_loss": -10.403407096862793, "global_step": 116937, "epoch": 696} {"train_loss": -9.937517166137695, "global_step": 116938, "epoch": 696} {"train_loss": -10.37697696685791, "global_step": 116939, "epoch": 696} {"train_loss": -9.964919090270996, "global_step": 116940, "epoch": 696} {"train_loss": -10.29098892211914, "global_step": 116941, "epoch": 696} {"train_loss": -10.279624938964844, "global_step": 116942, "epoch": 696} {"train_loss": -10.307281494140625, "global_step": 116943, "epoch": 696} {"train_loss": -10.10556411743164, "global_step": 116944, "epoch": 696} {"train_loss": -10.318660736083984, "global_step": 116945, "epoch": 696} {"train_loss": -10.220976829528809, "global_step": 116946, "epoch": 696} {"train_loss": -10.135875701904297, "global_step": 116947, "epoch": 696} {"train_loss": -10.460536003112793, "global_step": 116948, "epoch": 696} {"train_loss": -10.253314018249512, "global_step": 116949, "epoch": 696} {"train_loss": -9.992668151855469, "global_step": 116950, "epoch": 696} {"train_loss": -10.008501052856445, "global_step": 116951, "epoch": 696} {"train_loss": -10.40207290649414, "global_step": 116952, "epoch": 696} {"train_loss": -9.630928039550781, "global_step": 116953, "epoch": 696} {"train_loss": -9.675178527832031, "global_step": 116954, "epoch": 696} {"train_loss": -10.321281433105469, "global_step": 116955, "epoch": 696} {"train_loss": -9.817927360534668, "global_step": 116956, "epoch": 696} {"train_loss": -9.322802543640137, "global_step": 116957, "epoch": 696} {"train_loss": -9.762232780456543, "global_step": 116958, "epoch": 696} {"train_loss": -8.740042686462402, "global_step": 116959, "epoch": 696} {"train_loss": -9.144248008728027, "global_step": 116960, "epoch": 696} {"train_loss": -9.24208927154541, "global_step": 116961, "epoch": 696} {"train_loss": -9.507730484008789, "global_step": 116962, "epoch": 696} {"train_loss": -9.224859237670898, "global_step": 116963, "epoch": 696} {"train_loss": -9.922340393066406, "global_step": 116964, "epoch": 696} {"train_loss": -9.329887390136719, "global_step": 116965, "epoch": 696} {"train_loss": -9.758838653564453, "global_step": 116966, "epoch": 696} {"train_loss": -9.733600616455078, "global_step": 116967, "epoch": 696} {"train_loss": -9.518791198730469, "global_step": 116968, "epoch": 696} {"train_loss": -9.716449737548828, "global_step": 116969, "epoch": 696} {"train_loss": -9.998966217041016, "global_step": 116970, "epoch": 696} {"train_loss": -9.504640579223633, "global_step": 116971, "epoch": 696} {"train_loss": -9.827529907226562, "global_step": 116972, "epoch": 696} {"train_loss": -9.911663055419922, "global_step": 116973, "epoch": 696} {"train_loss": -9.896625518798828, "global_step": 116974, "epoch": 696} {"train_loss": -9.78504753112793, "global_step": 116975, "epoch": 696} {"train_loss": -10.068050384521484, "global_step": 116976, "epoch": 696} {"train_loss": -9.95029067993164, "global_step": 116977, "epoch": 696} {"train_loss": -9.83609390258789, "global_step": 116978, "epoch": 696} {"train_loss": -9.880926132202148, "global_step": 116979, "epoch": 696} {"train_loss": -10.142179489135742, "global_step": 116980, "epoch": 696} {"train_loss": -9.943011283874512, "global_step": 116981, "epoch": 696} {"train_loss": -9.933975219726562, "global_step": 116982, "epoch": 696} {"train_loss": -10.015085220336914, "global_step": 116983, "epoch": 696} {"train_loss": -10.034404754638672, "global_step": 116984, "epoch": 696} {"train_loss": -10.175860404968262, "global_step": 116985, "epoch": 696} {"train_loss": -10.054301261901855, "global_step": 116986, "epoch": 696} {"train_loss": -9.87336540222168, "global_step": 116987, "epoch": 696} {"train_loss": -9.864339828491211, "global_step": 116988, "epoch": 696} {"train_loss": -10.034514427185059, "global_step": 116989, "epoch": 696} {"train_loss": -10.069157600402832, "global_step": 116990, "epoch": 696} {"train_loss": -9.977805137634277, "global_step": 116991, "epoch": 696} {"train_loss": -10.119853973388672, "global_step": 116992, "epoch": 696} {"train_loss": -10.13251781463623, "global_step": 116993, "epoch": 696} {"train_loss": -9.750940322875977, "global_step": 116994, "epoch": 696} {"train_loss": -10.348579406738281, "global_step": 116995, "epoch": 696} {"train_loss": -9.874321937561035, "global_step": 116996, "epoch": 696} {"train_loss": -10.194366455078125, "global_step": 116997, "epoch": 696} {"train_loss": -9.86833381652832, "global_step": 116998, "epoch": 696} {"train_loss": -10.288192749023438, "global_step": 116999, "epoch": 696} {"train_loss": -9.824918746948242, "global_step": 117000, "epoch": 696} {"train_loss": -10.356801986694336, "global_step": 117001, "epoch": 696} {"train_loss": -10.025609970092773, "global_step": 117002, "epoch": 696} {"train_loss": -10.078384399414062, "global_step": 117003, "epoch": 696} {"train_loss": -10.15802001953125, "global_step": 117004, "epoch": 696} {"train_loss": -9.66316032409668, "global_step": 117005, "epoch": 696} {"train_loss": -10.001615524291992, "global_step": 117006, "epoch": 696} {"train_loss": -10.017837524414062, "global_step": 117007, "epoch": 696} {"train_loss": -9.964962005615234, "global_step": 117008, "epoch": 696} {"train_loss": -9.913986206054688, "global_step": 117009, "epoch": 696} {"train_loss": -10.238537788391113, "global_step": 117010, "epoch": 696} {"train_loss": -9.982791900634766, "global_step": 117011, "epoch": 696} {"train_loss": -10.284156799316406, "global_step": 117012, "epoch": 696} {"train_loss": -9.880727767944336, "global_step": 117013, "epoch": 696} {"train_loss": -9.94414234161377, "global_step": 117014, "epoch": 696} {"train_loss": -10.040982246398926, "global_step": 117015, "epoch": 696} {"train_loss": -9.556617736816406, "global_step": 117016, "epoch": 696} {"train_loss": -9.940857887268066, "global_step": 117017, "epoch": 696} {"train_loss": -10.035989761352539, "global_step": 117018, "epoch": 696} {"train_loss": -9.454766273498535, "global_step": 117019, "epoch": 696} {"train_loss": -10.055004119873047, "global_step": 117020, "epoch": 696} {"train_loss": -9.518608093261719, "global_step": 117021, "epoch": 696} {"train_loss": -9.855023384094238, "global_step": 117022, "epoch": 696} {"train_loss": -9.636597633361816, "global_step": 117023, "epoch": 696} {"train_loss": -9.804987907409668, "global_step": 117024, "epoch": 696} {"train_loss": -9.68124008178711, "global_step": 117025, "epoch": 696} {"train_loss": -9.793052673339844, "global_step": 117026, "epoch": 696} {"train_loss": -9.884208679199219, "global_step": 117027, "epoch": 696} {"train_loss": -10.096059799194336, "global_step": 117028, "epoch": 696} {"train_loss": -10.026039123535156, "global_step": 117029, "epoch": 696} {"train_loss": -9.946693420410156, "global_step": 117030, "epoch": 696} {"train_loss": -9.945695877075195, "global_step": 117031, "epoch": 696} {"train_loss": -10.124347686767578, "global_step": 117032, "epoch": 696} {"train_loss": -9.99553108215332, "global_step": 117033, "epoch": 696} {"train_loss": -9.905021667480469, "global_step": 117034, "epoch": 696} {"train_loss": -9.892728805541992, "global_step": 117035, "epoch": 696} {"train_loss": -9.772927284240723, "global_step": 117036, "epoch": 696} {"train_loss": -10.178224563598633, "global_step": 117037, "epoch": 696} {"train_loss": -9.961509704589844, "global_step": 117038, "epoch": 696} {"train_loss": -9.902688980102539, "global_step": 117039, "epoch": 696} {"train_loss": -10.100362777709961, "global_step": 117040, "epoch": 696} {"train_loss": -9.92186164855957, "global_step": 117041, "epoch": 696} {"train_loss": -9.986190795898438, "global_step": 117042, "epoch": 696} {"train_loss": -9.938146591186523, "global_step": 117043, "epoch": 696} {"train_loss": -10.204524993896484, "global_step": 117044, "epoch": 696} {"train_loss": -10.078042984008789, "global_step": 117045, "epoch": 696} {"train_loss": -10.244001388549805, "global_step": 117046, "epoch": 696} {"train_loss": -10.055747985839844, "global_step": 117047, "epoch": 696} {"train_loss": -10.033655166625977, "global_step": 117048, "epoch": 696} {"train_loss": -10.13747501373291, "global_step": 117049, "epoch": 696} {"train_loss": -10.1174955368042, "global_step": 117050, "epoch": 696} {"train_loss": -10.211514472961426, "global_step": 117051, "epoch": 696} {"train_loss": -10.097606658935547, "global_step": 117052, "epoch": 696} {"train_loss": -10.435609817504883, "global_step": 117053, "epoch": 696} {"train_loss": -10.290548324584961, "global_step": 117054, "epoch": 696} {"train_loss": -10.332773208618164, "global_step": 117055, "epoch": 696} {"train_loss": -10.495752334594727, "global_step": 117056, "epoch": 696} {"train_loss": -10.388908386230469, "global_step": 117057, "epoch": 696} {"train_loss": -10.345048904418945, "global_step": 117058, "epoch": 696} {"train_loss": -10.177511215209961, "global_step": 117059, "epoch": 696} {"train_loss": -10.313674926757812, "global_step": 117060, "epoch": 696} {"train_loss": -10.396577835083008, "global_step": 117061, "epoch": 696} {"train_loss": -10.421159744262695, "global_step": 117062, "epoch": 696} {"train_loss": -10.309843063354492, "global_step": 117063, "epoch": 696} {"train_loss": -10.152762413024902, "global_step": 117064, "epoch": 696} {"train_loss": -10.419395446777344, "global_step": 117065, "epoch": 696} {"train_loss": -10.077274322509766, "global_step": 117066, "epoch": 696} {"train_loss": -10.211712837219238, "global_step": 117067, "epoch": 696} {"train_loss": -10.146324157714844, "global_step": 117068, "epoch": 696} {"train_loss": -9.293251991271973, "global_step": 117069, "epoch": 696} {"train_loss": -9.865972518920898, "global_step": 117070, "epoch": 696} {"train_loss": -10.211691856384277, "global_step": 117071, "epoch": 696} {"train_loss": -9.316947937011719, "global_step": 117072, "epoch": 696} {"train_loss": -9.788999557495117, "global_step": 117073, "epoch": 696} {"train_loss": -10.079564094543457, "global_step": 117074, "epoch": 696} {"train_loss": -10.102834701538086, "global_step": 117075, "epoch": 696} {"train_loss": -9.884393692016602, "global_step": 117076, "epoch": 696} {"train_loss": -10.055096626281738, "global_step": 117077, "epoch": 696} {"train_loss": -9.375802993774414, "global_step": 117078, "epoch": 696} {"train_loss": -9.905488967895508, "global_step": 117079, "epoch": 696} {"train_loss": -9.827729225158691, "global_step": 117080, "epoch": 696} {"train_loss": -9.477751731872559, "global_step": 117081, "epoch": 696} {"train_loss": -9.450782775878906, "global_step": 117082, "epoch": 696} {"train_loss": -9.857086181640625, "global_step": 117083, "epoch": 696} {"train_loss": -9.597883224487305, "global_step": 117084, "epoch": 696} {"train_loss": -9.6790132522583, "global_step": 117085, "epoch": 696} {"train_loss": -9.583733558654785, "global_step": 117086, "epoch": 696} {"train_loss": -9.822800636291504, "global_step": 117087, "epoch": 696} {"train_loss": -9.36629867553711, "global_step": 117088, "epoch": 696} {"train_loss": -9.978069305419922, "global_step": 117089, "epoch": 696} {"train_loss": -9.53563117980957, "global_step": 117090, "epoch": 696} {"train_loss": -9.565702438354492, "global_step": 117091, "epoch": 696} {"train_loss": -10.062484741210938, "global_step": 117092, "epoch": 696} {"train_loss": -9.514425277709961, "global_step": 117093, "epoch": 696} {"train_loss": -9.975869178771973, "global_step": 117094, "epoch": 696} {"train_loss": -9.966589683578128, "global_step": 117095, "epoch": 696, "val_loss": 212876.296875} {"train_loss": -9.896872520446777, "global_step": 117096, "epoch": 697} {"train_loss": -9.898694038391113, "global_step": 117097, "epoch": 697} {"train_loss": -9.792219161987305, "global_step": 117098, "epoch": 697} {"train_loss": -9.94102668762207, "global_step": 117099, "epoch": 697} {"train_loss": -9.881966590881348, "global_step": 117100, "epoch": 697} {"train_loss": -9.849576950073242, "global_step": 117101, "epoch": 697} {"train_loss": -10.101956367492676, "global_step": 117102, "epoch": 697} {"train_loss": -9.984930992126465, "global_step": 117103, "epoch": 697} {"train_loss": -10.063828468322754, "global_step": 117104, "epoch": 697} {"train_loss": -9.79127311706543, "global_step": 117105, "epoch": 697} {"train_loss": -9.976875305175781, "global_step": 117106, "epoch": 697} {"train_loss": -10.117863655090332, "global_step": 117107, "epoch": 697} {"train_loss": -9.770989418029785, "global_step": 117108, "epoch": 697} {"train_loss": -10.022890090942383, "global_step": 117109, "epoch": 697} {"train_loss": -10.089799880981445, "global_step": 117110, "epoch": 697} {"train_loss": -9.966110229492188, "global_step": 117111, "epoch": 697} {"train_loss": -9.998554229736328, "global_step": 117112, "epoch": 697} {"train_loss": -10.073493003845215, "global_step": 117113, "epoch": 697} {"train_loss": -9.960491180419922, "global_step": 117114, "epoch": 697} {"train_loss": -10.096049308776855, "global_step": 117115, "epoch": 697} {"train_loss": -10.102502822875977, "global_step": 117116, "epoch": 697} {"train_loss": -9.89328384399414, "global_step": 117117, "epoch": 697} {"train_loss": -10.27083969116211, "global_step": 117118, "epoch": 697} {"train_loss": -10.368427276611328, "global_step": 117119, "epoch": 697} {"train_loss": -10.056068420410156, "global_step": 117120, "epoch": 697} {"train_loss": -10.239635467529297, "global_step": 117121, "epoch": 697} {"train_loss": -10.235921859741211, "global_step": 117122, "epoch": 697} {"train_loss": -10.244388580322266, "global_step": 117123, "epoch": 697} {"train_loss": -10.261499404907227, "global_step": 117124, "epoch": 697} {"train_loss": -10.548959732055664, "global_step": 117125, "epoch": 697} {"train_loss": -10.288726806640625, "global_step": 117126, "epoch": 697} {"train_loss": -10.430322647094727, "global_step": 117127, "epoch": 697} {"train_loss": -10.391508102416992, "global_step": 117128, "epoch": 697} {"train_loss": -10.181123733520508, "global_step": 117129, "epoch": 697} {"train_loss": -10.295663833618164, "global_step": 117130, "epoch": 697} {"train_loss": -10.392224311828613, "global_step": 117131, "epoch": 697} {"train_loss": -10.055807113647461, "global_step": 117132, "epoch": 697} {"train_loss": -10.185073852539062, "global_step": 117133, "epoch": 697} {"train_loss": -10.3624849319458, "global_step": 117134, "epoch": 697} {"train_loss": -9.69847297668457, "global_step": 117135, "epoch": 697} {"train_loss": -9.739200592041016, "global_step": 117136, "epoch": 697} {"train_loss": -10.207443237304688, "global_step": 117137, "epoch": 697} {"train_loss": -10.120699882507324, "global_step": 117138, "epoch": 697} {"train_loss": -10.447966575622559, "global_step": 117139, "epoch": 697} {"train_loss": -10.076510429382324, "global_step": 117140, "epoch": 697} {"train_loss": -9.981843948364258, "global_step": 117141, "epoch": 697} {"train_loss": -10.07470989227295, "global_step": 117142, "epoch": 697} {"train_loss": -9.962366104125977, "global_step": 117143, "epoch": 697} {"train_loss": -10.12564468383789, "global_step": 117144, "epoch": 697} {"train_loss": -9.725969314575195, "global_step": 117145, "epoch": 697} {"train_loss": -9.705665588378906, "global_step": 117146, "epoch": 697} {"train_loss": -9.967437744140625, "global_step": 117147, "epoch": 697} {"train_loss": -9.390571594238281, "global_step": 117148, "epoch": 697} {"train_loss": -9.458561897277832, "global_step": 117149, "epoch": 697} {"train_loss": -9.603107452392578, "global_step": 117150, "epoch": 697} {"train_loss": -9.822244644165039, "global_step": 117151, "epoch": 697} {"train_loss": -9.789844512939453, "global_step": 117152, "epoch": 697} {"train_loss": -9.70306396484375, "global_step": 117153, "epoch": 697} {"train_loss": -9.963712692260742, "global_step": 117154, "epoch": 697} {"train_loss": -9.579292297363281, "global_step": 117155, "epoch": 697} {"train_loss": -9.469552993774414, "global_step": 117156, "epoch": 697} {"train_loss": -9.321582794189453, "global_step": 117157, "epoch": 697} {"train_loss": -9.542169570922852, "global_step": 117158, "epoch": 697} {"train_loss": -9.41984748840332, "global_step": 117159, "epoch": 697} {"train_loss": -9.830011367797852, "global_step": 117160, "epoch": 697} {"train_loss": -9.669736862182617, "global_step": 117161, "epoch": 697} {"train_loss": -9.516902923583984, "global_step": 117162, "epoch": 697} {"train_loss": -9.781221389770508, "global_step": 117163, "epoch": 697} {"train_loss": -9.904217720031738, "global_step": 117164, "epoch": 697} {"train_loss": -9.212093353271484, "global_step": 117165, "epoch": 697} {"train_loss": -9.94327163696289, "global_step": 117166, "epoch": 697} {"train_loss": -9.711697578430176, "global_step": 117167, "epoch": 697} {"train_loss": -9.664047241210938, "global_step": 117168, "epoch": 697} {"train_loss": -9.844382286071777, "global_step": 117169, "epoch": 697} {"train_loss": -9.672677040100098, "global_step": 117170, "epoch": 697} {"train_loss": -9.78536605834961, "global_step": 117171, "epoch": 697} {"train_loss": -9.9793701171875, "global_step": 117172, "epoch": 697} {"train_loss": -10.008118629455566, "global_step": 117173, "epoch": 697} {"train_loss": -9.972196578979492, "global_step": 117174, "epoch": 697} {"train_loss": -9.994599342346191, "global_step": 117175, "epoch": 697} {"train_loss": -9.754283905029297, "global_step": 117176, "epoch": 697} {"train_loss": -10.082012176513672, "global_step": 117177, "epoch": 697} {"train_loss": -10.065666198730469, "global_step": 117178, "epoch": 697} {"train_loss": -10.082494735717773, "global_step": 117179, "epoch": 697} {"train_loss": -10.02600383758545, "global_step": 117180, "epoch": 697} {"train_loss": -10.103233337402344, "global_step": 117181, "epoch": 697} {"train_loss": -10.070558547973633, "global_step": 117182, "epoch": 697} {"train_loss": -9.87006950378418, "global_step": 117183, "epoch": 697} {"train_loss": -10.1976318359375, "global_step": 117184, "epoch": 697} {"train_loss": -10.222400665283203, "global_step": 117185, "epoch": 697} {"train_loss": -10.26673412322998, "global_step": 117186, "epoch": 697} {"train_loss": -10.089778900146484, "global_step": 117187, "epoch": 697} {"train_loss": -10.255810737609863, "global_step": 117188, "epoch": 697} {"train_loss": -10.356656074523926, "global_step": 117189, "epoch": 697} {"train_loss": -10.238520622253418, "global_step": 117190, "epoch": 697} {"train_loss": -10.373659133911133, "global_step": 117191, "epoch": 697} {"train_loss": -10.430817604064941, "global_step": 117192, "epoch": 697} {"train_loss": -10.312101364135742, "global_step": 117193, "epoch": 697} {"train_loss": -10.373250961303711, "global_step": 117194, "epoch": 697} {"train_loss": -10.308028221130371, "global_step": 117195, "epoch": 697} {"train_loss": -10.269770622253418, "global_step": 117196, "epoch": 697} {"train_loss": -10.595385551452637, "global_step": 117197, "epoch": 697} {"train_loss": -10.224695205688477, "global_step": 117198, "epoch": 697} {"train_loss": -10.454038619995117, "global_step": 117199, "epoch": 697} {"train_loss": -10.167807579040527, "global_step": 117200, "epoch": 697} {"train_loss": -10.410423278808594, "global_step": 117201, "epoch": 697} {"train_loss": -10.231086730957031, "global_step": 117202, "epoch": 697} {"train_loss": -10.519832611083984, "global_step": 117203, "epoch": 697} {"train_loss": -10.16856861114502, "global_step": 117204, "epoch": 697} {"train_loss": -10.178783416748047, "global_step": 117205, "epoch": 697} {"train_loss": -10.325770378112793, "global_step": 117206, "epoch": 697} {"train_loss": -9.93558120727539, "global_step": 117207, "epoch": 697} {"train_loss": -10.384405136108398, "global_step": 117208, "epoch": 697} {"train_loss": -10.466495513916016, "global_step": 117209, "epoch": 697} {"train_loss": -10.35494327545166, "global_step": 117210, "epoch": 697} {"train_loss": -10.207418441772461, "global_step": 117211, "epoch": 697} {"train_loss": -10.23527717590332, "global_step": 117212, "epoch": 697} {"train_loss": -9.896028518676758, "global_step": 117213, "epoch": 697} {"train_loss": -9.914094924926758, "global_step": 117214, "epoch": 697} {"train_loss": -10.103415489196777, "global_step": 117215, "epoch": 697} {"train_loss": -9.693973541259766, "global_step": 117216, "epoch": 697} {"train_loss": -9.861653327941895, "global_step": 117217, "epoch": 697} {"train_loss": -9.668702125549316, "global_step": 117218, "epoch": 697} {"train_loss": -9.46112060546875, "global_step": 117219, "epoch": 697} {"train_loss": -9.567792892456055, "global_step": 117220, "epoch": 697} {"train_loss": -10.01609992980957, "global_step": 117221, "epoch": 697} {"train_loss": -9.75339126586914, "global_step": 117222, "epoch": 697} {"train_loss": -9.931066513061523, "global_step": 117223, "epoch": 697} {"train_loss": -9.70015811920166, "global_step": 117224, "epoch": 697} {"train_loss": -10.178245544433594, "global_step": 117225, "epoch": 697} {"train_loss": -9.784738540649414, "global_step": 117226, "epoch": 697} {"train_loss": -9.798505783081055, "global_step": 117227, "epoch": 697} {"train_loss": -9.700200080871582, "global_step": 117228, "epoch": 697} {"train_loss": -9.807514190673828, "global_step": 117229, "epoch": 697} {"train_loss": -9.65894889831543, "global_step": 117230, "epoch": 697} {"train_loss": -9.868901252746582, "global_step": 117231, "epoch": 697} {"train_loss": -9.793850898742676, "global_step": 117232, "epoch": 697} {"train_loss": -10.032197952270508, "global_step": 117233, "epoch": 697} {"train_loss": -10.005873680114746, "global_step": 117234, "epoch": 697} {"train_loss": -9.665541648864746, "global_step": 117235, "epoch": 697} {"train_loss": -10.083372116088867, "global_step": 117236, "epoch": 697} {"train_loss": -9.895265579223633, "global_step": 117237, "epoch": 697} {"train_loss": -9.842276573181152, "global_step": 117238, "epoch": 697} {"train_loss": -10.047148704528809, "global_step": 117239, "epoch": 697} {"train_loss": -9.689453125, "global_step": 117240, "epoch": 697} {"train_loss": -10.039600372314453, "global_step": 117241, "epoch": 697} {"train_loss": -10.046114921569824, "global_step": 117242, "epoch": 697} {"train_loss": -9.678085327148438, "global_step": 117243, "epoch": 697} {"train_loss": -10.067874908447266, "global_step": 117244, "epoch": 697} {"train_loss": -10.045797348022461, "global_step": 117245, "epoch": 697} {"train_loss": -9.81075382232666, "global_step": 117246, "epoch": 697} {"train_loss": -10.270700454711914, "global_step": 117247, "epoch": 697} {"train_loss": -9.993680000305176, "global_step": 117248, "epoch": 697} {"train_loss": -10.248469352722168, "global_step": 117249, "epoch": 697} {"train_loss": -10.140048027038574, "global_step": 117250, "epoch": 697} {"train_loss": -10.098846435546875, "global_step": 117251, "epoch": 697} {"train_loss": -10.187366485595703, "global_step": 117252, "epoch": 697} {"train_loss": -10.042766571044922, "global_step": 117253, "epoch": 697} {"train_loss": -10.063065528869629, "global_step": 117254, "epoch": 697} {"train_loss": -10.169973373413086, "global_step": 117255, "epoch": 697} {"train_loss": -9.955574035644531, "global_step": 117256, "epoch": 697} {"train_loss": -9.802042007446289, "global_step": 117257, "epoch": 697} {"train_loss": -10.136341094970703, "global_step": 117258, "epoch": 697} {"train_loss": -9.978994369506836, "global_step": 117259, "epoch": 697} {"train_loss": -10.16557502746582, "global_step": 117260, "epoch": 697} {"train_loss": -10.072891235351562, "global_step": 117261, "epoch": 697} {"train_loss": -10.134801864624023, "global_step": 117262, "epoch": 697} {"train_loss": -10.005173439071292, "global_step": 117263, "epoch": 697, "val_loss": 214998.671875} {"train_loss": -10.189590454101562, "global_step": 117264, "epoch": 698} {"train_loss": -10.178777694702148, "global_step": 117265, "epoch": 698} {"train_loss": -10.251017570495605, "global_step": 117266, "epoch": 698} {"train_loss": -10.313043594360352, "global_step": 117267, "epoch": 698} {"train_loss": -10.210363388061523, "global_step": 117268, "epoch": 698} {"train_loss": -10.158489227294922, "global_step": 117269, "epoch": 698} {"train_loss": -10.307577133178711, "global_step": 117270, "epoch": 698} {"train_loss": -10.344898223876953, "global_step": 117271, "epoch": 698} {"train_loss": -10.287976264953613, "global_step": 117272, "epoch": 698} {"train_loss": -10.402509689331055, "global_step": 117273, "epoch": 698} {"train_loss": -10.424232482910156, "global_step": 117274, "epoch": 698} {"train_loss": -10.363080978393555, "global_step": 117275, "epoch": 698} {"train_loss": -10.628459930419922, "global_step": 117276, "epoch": 698} {"train_loss": -10.407849311828613, "global_step": 117277, "epoch": 698} {"train_loss": -10.248387336730957, "global_step": 117278, "epoch": 698} {"train_loss": -10.296252250671387, "global_step": 117279, "epoch": 698} {"train_loss": -10.400262832641602, "global_step": 117280, "epoch": 698} {"train_loss": -10.383140563964844, "global_step": 117281, "epoch": 698} {"train_loss": -10.135151863098145, "global_step": 117282, "epoch": 698} {"train_loss": -10.37053108215332, "global_step": 117283, "epoch": 698} {"train_loss": -9.859066009521484, "global_step": 117284, "epoch": 698} {"train_loss": -10.252829551696777, "global_step": 117285, "epoch": 698} {"train_loss": -10.357295989990234, "global_step": 117286, "epoch": 698} {"train_loss": -9.819364547729492, "global_step": 117287, "epoch": 698} {"train_loss": -10.097541809082031, "global_step": 117288, "epoch": 698} {"train_loss": -9.999641418457031, "global_step": 117289, "epoch": 698} {"train_loss": -9.924394607543945, "global_step": 117290, "epoch": 698} {"train_loss": -9.814725875854492, "global_step": 117291, "epoch": 698} {"train_loss": -9.986732482910156, "global_step": 117292, "epoch": 698} {"train_loss": -9.724454879760742, "global_step": 117293, "epoch": 698} {"train_loss": -9.961319923400879, "global_step": 117294, "epoch": 698} {"train_loss": -9.59323501586914, "global_step": 117295, "epoch": 698} {"train_loss": -9.490592002868652, "global_step": 117296, "epoch": 698} {"train_loss": -9.89864730834961, "global_step": 117297, "epoch": 698} {"train_loss": -9.03220272064209, "global_step": 117298, "epoch": 698} {"train_loss": -9.352703094482422, "global_step": 117299, "epoch": 698} {"train_loss": -9.573984146118164, "global_step": 117300, "epoch": 698} {"train_loss": -9.817805290222168, "global_step": 117301, "epoch": 698} {"train_loss": -9.393575668334961, "global_step": 117302, "epoch": 698} {"train_loss": -9.486353874206543, "global_step": 117303, "epoch": 698} {"train_loss": -9.54638671875, "global_step": 117304, "epoch": 698} {"train_loss": -9.262760162353516, "global_step": 117305, "epoch": 698} {"train_loss": -9.954825401306152, "global_step": 117306, "epoch": 698} {"train_loss": -9.199542045593262, "global_step": 117307, "epoch": 698} {"train_loss": -9.881067276000977, "global_step": 117308, "epoch": 698} {"train_loss": -9.235679626464844, "global_step": 117309, "epoch": 698} {"train_loss": -9.664791107177734, "global_step": 117310, "epoch": 698} {"train_loss": -9.203699111938477, "global_step": 117311, "epoch": 698} {"train_loss": -9.369218826293945, "global_step": 117312, "epoch": 698} {"train_loss": -10.01644229888916, "global_step": 117313, "epoch": 698} {"train_loss": -9.497133255004883, "global_step": 117314, "epoch": 698} {"train_loss": -9.665830612182617, "global_step": 117315, "epoch": 698} {"train_loss": -9.829568862915039, "global_step": 117316, "epoch": 698} {"train_loss": -9.557126998901367, "global_step": 117317, "epoch": 698} {"train_loss": -9.590291976928711, "global_step": 117318, "epoch": 698} {"train_loss": -9.620813369750977, "global_step": 117319, "epoch": 698} {"train_loss": -9.774238586425781, "global_step": 117320, "epoch": 698} {"train_loss": -9.697151184082031, "global_step": 117321, "epoch": 698} {"train_loss": -9.776384353637695, "global_step": 117322, "epoch": 698} {"train_loss": -9.686589241027832, "global_step": 117323, "epoch": 698} {"train_loss": -9.847076416015625, "global_step": 117324, "epoch": 698} {"train_loss": -9.931705474853516, "global_step": 117325, "epoch": 698} {"train_loss": -9.887775421142578, "global_step": 117326, "epoch": 698} {"train_loss": -9.784575462341309, "global_step": 117327, "epoch": 698} {"train_loss": -9.979395866394043, "global_step": 117328, "epoch": 698} {"train_loss": -10.03628921508789, "global_step": 117329, "epoch": 698} {"train_loss": -9.951627731323242, "global_step": 117330, "epoch": 698} {"train_loss": -9.835576057434082, "global_step": 117331, "epoch": 698} {"train_loss": -9.966155052185059, "global_step": 117332, "epoch": 698} {"train_loss": -10.015179634094238, "global_step": 117333, "epoch": 698} {"train_loss": -9.95977783203125, "global_step": 117334, "epoch": 698} {"train_loss": -10.326130867004395, "global_step": 117335, "epoch": 698} {"train_loss": -10.261590003967285, "global_step": 117336, "epoch": 698} {"train_loss": -10.105386734008789, "global_step": 117337, "epoch": 698} {"train_loss": -9.998666763305664, "global_step": 117338, "epoch": 698} {"train_loss": -10.293764114379883, "global_step": 117339, "epoch": 698} {"train_loss": -10.208332061767578, "global_step": 117340, "epoch": 698} {"train_loss": -10.110845565795898, "global_step": 117341, "epoch": 698} {"train_loss": -10.291580200195312, "global_step": 117342, "epoch": 698} {"train_loss": -10.093174934387207, "global_step": 117343, "epoch": 698} {"train_loss": -10.288983345031738, "global_step": 117344, "epoch": 698} {"train_loss": -10.116823196411133, "global_step": 117345, "epoch": 698} {"train_loss": -10.112414360046387, "global_step": 117346, "epoch": 698} {"train_loss": -10.266843795776367, "global_step": 117347, "epoch": 698} {"train_loss": -10.426860809326172, "global_step": 117348, "epoch": 698} {"train_loss": -10.43067741394043, "global_step": 117349, "epoch": 698} {"train_loss": -10.357902526855469, "global_step": 117350, "epoch": 698} {"train_loss": -10.459610939025879, "global_step": 117351, "epoch": 698} {"train_loss": -9.841460227966309, "global_step": 117352, "epoch": 698} {"train_loss": -9.576744079589844, "global_step": 117353, "epoch": 698} {"train_loss": -9.848608016967773, "global_step": 117354, "epoch": 698} {"train_loss": -10.159200668334961, "global_step": 117355, "epoch": 698} {"train_loss": -10.227452278137207, "global_step": 117356, "epoch": 698} {"train_loss": -10.158439636230469, "global_step": 117357, "epoch": 698} {"train_loss": -10.134902000427246, "global_step": 117358, "epoch": 698} {"train_loss": -10.067248344421387, "global_step": 117359, "epoch": 698} {"train_loss": -9.261375427246094, "global_step": 117360, "epoch": 698} {"train_loss": -9.730012893676758, "global_step": 117361, "epoch": 698} {"train_loss": -10.054595947265625, "global_step": 117362, "epoch": 698} {"train_loss": -9.969627380371094, "global_step": 117363, "epoch": 698} {"train_loss": -9.839268684387207, "global_step": 117364, "epoch": 698} {"train_loss": -10.193204879760742, "global_step": 117365, "epoch": 698} {"train_loss": -10.001333236694336, "global_step": 117366, "epoch": 698} {"train_loss": -10.286952018737793, "global_step": 117367, "epoch": 698} {"train_loss": -10.20919418334961, "global_step": 117368, "epoch": 698} {"train_loss": -10.122783660888672, "global_step": 117369, "epoch": 698} {"train_loss": -10.141620635986328, "global_step": 117370, "epoch": 698} {"train_loss": -10.171449661254883, "global_step": 117371, "epoch": 698} {"train_loss": -9.834423065185547, "global_step": 117372, "epoch": 698} {"train_loss": -10.326555252075195, "global_step": 117373, "epoch": 698} {"train_loss": -9.895683288574219, "global_step": 117374, "epoch": 698} {"train_loss": -10.258171081542969, "global_step": 117375, "epoch": 698} {"train_loss": -10.017292976379395, "global_step": 117376, "epoch": 698} {"train_loss": -9.864355087280273, "global_step": 117377, "epoch": 698} {"train_loss": -10.315319061279297, "global_step": 117378, "epoch": 698} {"train_loss": -10.198318481445312, "global_step": 117379, "epoch": 698} {"train_loss": -10.005711555480957, "global_step": 117380, "epoch": 698} {"train_loss": -10.345769882202148, "global_step": 117381, "epoch": 698} {"train_loss": -10.040586471557617, "global_step": 117382, "epoch": 698} {"train_loss": -10.218883514404297, "global_step": 117383, "epoch": 698} {"train_loss": -9.875269889831543, "global_step": 117384, "epoch": 698} {"train_loss": -9.968839645385742, "global_step": 117385, "epoch": 698} {"train_loss": -9.955178260803223, "global_step": 117386, "epoch": 698} {"train_loss": -10.26986026763916, "global_step": 117387, "epoch": 698} {"train_loss": -9.789143562316895, "global_step": 117388, "epoch": 698} {"train_loss": -10.295695304870605, "global_step": 117389, "epoch": 698} {"train_loss": -10.066751480102539, "global_step": 117390, "epoch": 698} {"train_loss": -10.185234069824219, "global_step": 117391, "epoch": 698} {"train_loss": -10.280801773071289, "global_step": 117392, "epoch": 698} {"train_loss": -9.995089530944824, "global_step": 117393, "epoch": 698} {"train_loss": -9.891359329223633, "global_step": 117394, "epoch": 698} {"train_loss": -9.85059928894043, "global_step": 117395, "epoch": 698} {"train_loss": -10.272772789001465, "global_step": 117396, "epoch": 698} {"train_loss": -9.95418930053711, "global_step": 117397, "epoch": 698} {"train_loss": -10.07919692993164, "global_step": 117398, "epoch": 698} {"train_loss": -9.868288040161133, "global_step": 117399, "epoch": 698} {"train_loss": -10.086195945739746, "global_step": 117400, "epoch": 698} {"train_loss": -9.994110107421875, "global_step": 117401, "epoch": 698} {"train_loss": -10.138900756835938, "global_step": 117402, "epoch": 698} {"train_loss": -9.893684387207031, "global_step": 117403, "epoch": 698} {"train_loss": -10.132894515991211, "global_step": 117404, "epoch": 698} {"train_loss": -10.17475700378418, "global_step": 117405, "epoch": 698} {"train_loss": -10.03952693939209, "global_step": 117406, "epoch": 698} {"train_loss": -10.143688201904297, "global_step": 117407, "epoch": 698} {"train_loss": -10.392667770385742, "global_step": 117408, "epoch": 698} {"train_loss": -9.91550064086914, "global_step": 117409, "epoch": 698} {"train_loss": -10.333237648010254, "global_step": 117410, "epoch": 698} {"train_loss": -10.316619873046875, "global_step": 117411, "epoch": 698} {"train_loss": -10.262560844421387, "global_step": 117412, "epoch": 698} {"train_loss": -10.269383430480957, "global_step": 117413, "epoch": 698} {"train_loss": -10.163223266601562, "global_step": 117414, "epoch": 698} {"train_loss": -9.904928207397461, "global_step": 117415, "epoch": 698} {"train_loss": -10.383047103881836, "global_step": 117416, "epoch": 698} {"train_loss": -9.98327350616455, "global_step": 117417, "epoch": 698} {"train_loss": -9.885824203491211, "global_step": 117418, "epoch": 698} {"train_loss": -10.206513404846191, "global_step": 117419, "epoch": 698} {"train_loss": -9.556715965270996, "global_step": 117420, "epoch": 698} {"train_loss": -10.291374206542969, "global_step": 117421, "epoch": 698} {"train_loss": -9.983798027038574, "global_step": 117422, "epoch": 698} {"train_loss": -9.434738159179688, "global_step": 117423, "epoch": 698} {"train_loss": -10.14283275604248, "global_step": 117424, "epoch": 698} {"train_loss": -9.719870567321777, "global_step": 117425, "epoch": 698} {"train_loss": -9.819069862365723, "global_step": 117426, "epoch": 698} {"train_loss": -9.854981422424316, "global_step": 117427, "epoch": 698} {"train_loss": -9.633661270141602, "global_step": 117428, "epoch": 698} {"train_loss": -9.912882804870605, "global_step": 117429, "epoch": 698} {"train_loss": -9.584077835083008, "global_step": 117430, "epoch": 698} {"train_loss": -9.995424060594468, "global_step": 117431, "epoch": 698, "val_loss": 212311.625} {"train_loss": -9.8285493850708, "global_step": 117432, "epoch": 699} {"train_loss": -9.862838745117188, "global_step": 117433, "epoch": 699} {"train_loss": -9.607288360595703, "global_step": 117434, "epoch": 699} {"train_loss": -10.042951583862305, "global_step": 117435, "epoch": 699} {"train_loss": -9.82075309753418, "global_step": 117436, "epoch": 699} {"train_loss": -9.693134307861328, "global_step": 117437, "epoch": 699} {"train_loss": -9.963701248168945, "global_step": 117438, "epoch": 699} {"train_loss": -10.05305290222168, "global_step": 117439, "epoch": 699} {"train_loss": -9.701154708862305, "global_step": 117440, "epoch": 699} {"train_loss": -10.025203704833984, "global_step": 117441, "epoch": 699} {"train_loss": -9.848410606384277, "global_step": 117442, "epoch": 699} {"train_loss": -9.925029754638672, "global_step": 117443, "epoch": 699} {"train_loss": -10.008923530578613, "global_step": 117444, "epoch": 699} {"train_loss": -10.139801025390625, "global_step": 117445, "epoch": 699} {"train_loss": -9.780912399291992, "global_step": 117446, "epoch": 699} {"train_loss": -10.218711853027344, "global_step": 117447, "epoch": 699} {"train_loss": -9.71025276184082, "global_step": 117448, "epoch": 699} {"train_loss": -10.248095512390137, "global_step": 117449, "epoch": 699} {"train_loss": -9.97580337524414, "global_step": 117450, "epoch": 699} {"train_loss": -10.325772285461426, "global_step": 117451, "epoch": 699} {"train_loss": -10.084274291992188, "global_step": 117452, "epoch": 699} {"train_loss": -10.22148323059082, "global_step": 117453, "epoch": 699} {"train_loss": -10.196492195129395, "global_step": 117454, "epoch": 699} {"train_loss": -9.952067375183105, "global_step": 117455, "epoch": 699} {"train_loss": -10.113323211669922, "global_step": 117456, "epoch": 699} {"train_loss": -10.11634635925293, "global_step": 117457, "epoch": 699} {"train_loss": -10.27459716796875, "global_step": 117458, "epoch": 699} {"train_loss": -10.341449737548828, "global_step": 117459, "epoch": 699} {"train_loss": -9.98747444152832, "global_step": 117460, "epoch": 699} {"train_loss": -10.336990356445312, "global_step": 117461, "epoch": 699} {"train_loss": -10.089569091796875, "global_step": 117462, "epoch": 699} {"train_loss": -9.675736427307129, "global_step": 117463, "epoch": 699} {"train_loss": -10.330093383789062, "global_step": 117464, "epoch": 699} {"train_loss": -9.923357009887695, "global_step": 117465, "epoch": 699} {"train_loss": -10.291460037231445, "global_step": 117466, "epoch": 699} {"train_loss": -10.051225662231445, "global_step": 117467, "epoch": 699} {"train_loss": -10.273488998413086, "global_step": 117468, "epoch": 699} {"train_loss": -10.114309310913086, "global_step": 117469, "epoch": 699} {"train_loss": -10.296416282653809, "global_step": 117470, "epoch": 699} {"train_loss": -9.997298240661621, "global_step": 117471, "epoch": 699} {"train_loss": -10.239106178283691, "global_step": 117472, "epoch": 699} {"train_loss": -10.221381187438965, "global_step": 117473, "epoch": 699} {"train_loss": -10.264004707336426, "global_step": 117474, "epoch": 699} {"train_loss": -10.140621185302734, "global_step": 117475, "epoch": 699} {"train_loss": -10.424188613891602, "global_step": 117476, "epoch": 699} {"train_loss": -9.933270454406738, "global_step": 117477, "epoch": 699} {"train_loss": -10.493911743164062, "global_step": 117478, "epoch": 699} {"train_loss": -10.216020584106445, "global_step": 117479, "epoch": 699} {"train_loss": -10.120555877685547, "global_step": 117480, "epoch": 699} {"train_loss": -9.819462776184082, "global_step": 117481, "epoch": 699} {"train_loss": -9.875823974609375, "global_step": 117482, "epoch": 699} {"train_loss": -10.285883903503418, "global_step": 117483, "epoch": 699} {"train_loss": -10.168739318847656, "global_step": 117484, "epoch": 699} {"train_loss": -10.430397033691406, "global_step": 117485, "epoch": 699} {"train_loss": -10.298629760742188, "global_step": 117486, "epoch": 699} {"train_loss": -10.458871841430664, "global_step": 117487, "epoch": 699} {"train_loss": -10.253047943115234, "global_step": 117488, "epoch": 699} {"train_loss": -10.088446617126465, "global_step": 117489, "epoch": 699} {"train_loss": -10.212363243103027, "global_step": 117490, "epoch": 699} {"train_loss": -9.621696472167969, "global_step": 117491, "epoch": 699} {"train_loss": -10.036069869995117, "global_step": 117492, "epoch": 699} {"train_loss": -10.190813064575195, "global_step": 117493, "epoch": 699} {"train_loss": -9.755874633789062, "global_step": 117494, "epoch": 699} {"train_loss": -10.294419288635254, "global_step": 117495, "epoch": 699} {"train_loss": -10.100359916687012, "global_step": 117496, "epoch": 699} {"train_loss": -9.805849075317383, "global_step": 117497, "epoch": 699} {"train_loss": -10.213956832885742, "global_step": 117498, "epoch": 699} {"train_loss": -9.951766014099121, "global_step": 117499, "epoch": 699} {"train_loss": -9.474250793457031, "global_step": 117500, "epoch": 699} {"train_loss": -10.500631332397461, "global_step": 117501, "epoch": 699} {"train_loss": -9.654891014099121, "global_step": 117502, "epoch": 699} {"train_loss": -9.499990463256836, "global_step": 117503, "epoch": 699} {"train_loss": -10.014835357666016, "global_step": 117504, "epoch": 699} {"train_loss": -9.726340293884277, "global_step": 117505, "epoch": 699} {"train_loss": -9.902633666992188, "global_step": 117506, "epoch": 699} {"train_loss": -9.90988540649414, "global_step": 117507, "epoch": 699} {"train_loss": -9.795543670654297, "global_step": 117508, "epoch": 699} {"train_loss": -9.58750057220459, "global_step": 117509, "epoch": 699} {"train_loss": -9.775829315185547, "global_step": 117510, "epoch": 699} {"train_loss": -9.320093154907227, "global_step": 117511, "epoch": 699} {"train_loss": -9.556190490722656, "global_step": 117512, "epoch": 699} {"train_loss": -9.811870574951172, "global_step": 117513, "epoch": 699} {"train_loss": -9.862130165100098, "global_step": 117514, "epoch": 699} {"train_loss": -9.649760246276855, "global_step": 117515, "epoch": 699} {"train_loss": -10.197308540344238, "global_step": 117516, "epoch": 699} {"train_loss": -9.940126419067383, "global_step": 117517, "epoch": 699} {"train_loss": -10.110036849975586, "global_step": 117518, "epoch": 699} {"train_loss": -9.897782325744629, "global_step": 117519, "epoch": 699} {"train_loss": -10.161911010742188, "global_step": 117520, "epoch": 699} {"train_loss": -9.860074043273926, "global_step": 117521, "epoch": 699} {"train_loss": -10.123510360717773, "global_step": 117522, "epoch": 699} {"train_loss": -9.94005298614502, "global_step": 117523, "epoch": 699} {"train_loss": -9.97021198272705, "global_step": 117524, "epoch": 699} {"train_loss": -9.625459671020508, "global_step": 117525, "epoch": 699} {"train_loss": -10.058059692382812, "global_step": 117526, "epoch": 699} {"train_loss": -10.181758880615234, "global_step": 117527, "epoch": 699} {"train_loss": -9.597366333007812, "global_step": 117528, "epoch": 699} {"train_loss": -10.358261108398438, "global_step": 117529, "epoch": 699} {"train_loss": -9.869338989257812, "global_step": 117530, "epoch": 699} {"train_loss": -10.12807846069336, "global_step": 117531, "epoch": 699} {"train_loss": -10.007951736450195, "global_step": 117532, "epoch": 699} {"train_loss": -10.151844024658203, "global_step": 117533, "epoch": 699} {"train_loss": -9.755460739135742, "global_step": 117534, "epoch": 699} {"train_loss": -10.315671920776367, "global_step": 117535, "epoch": 699} {"train_loss": -10.035026550292969, "global_step": 117536, "epoch": 699} {"train_loss": -9.997373580932617, "global_step": 117537, "epoch": 699} {"train_loss": -10.139564514160156, "global_step": 117538, "epoch": 699} {"train_loss": -10.271852493286133, "global_step": 117539, "epoch": 699} {"train_loss": -9.925127029418945, "global_step": 117540, "epoch": 699} {"train_loss": -10.311975479125977, "global_step": 117541, "epoch": 699} {"train_loss": -10.282801628112793, "global_step": 117542, "epoch": 699} {"train_loss": -10.181235313415527, "global_step": 117543, "epoch": 699} {"train_loss": -10.255373001098633, "global_step": 117544, "epoch": 699} {"train_loss": -9.787138938903809, "global_step": 117545, "epoch": 699} {"train_loss": -10.14439582824707, "global_step": 117546, "epoch": 699} {"train_loss": -10.250438690185547, "global_step": 117547, "epoch": 699} {"train_loss": -10.272315979003906, "global_step": 117548, "epoch": 699} {"train_loss": -10.2570219039917, "global_step": 117549, "epoch": 699} {"train_loss": -10.349272727966309, "global_step": 117550, "epoch": 699} {"train_loss": -10.124967575073242, "global_step": 117551, "epoch": 699} {"train_loss": -10.351469993591309, "global_step": 117552, "epoch": 699} {"train_loss": -10.259759902954102, "global_step": 117553, "epoch": 699} {"train_loss": -10.089263916015625, "global_step": 117554, "epoch": 699} {"train_loss": -10.32317066192627, "global_step": 117555, "epoch": 699} {"train_loss": -10.271398544311523, "global_step": 117556, "epoch": 699} {"train_loss": -10.173730850219727, "global_step": 117557, "epoch": 699} {"train_loss": -10.138269424438477, "global_step": 117558, "epoch": 699} {"train_loss": -10.116032600402832, "global_step": 117559, "epoch": 699} {"train_loss": -10.589609146118164, "global_step": 117560, "epoch": 699} {"train_loss": -10.235477447509766, "global_step": 117561, "epoch": 699} {"train_loss": -10.232118606567383, "global_step": 117562, "epoch": 699} {"train_loss": -10.104743957519531, "global_step": 117563, "epoch": 699} {"train_loss": -10.402156829833984, "global_step": 117564, "epoch": 699} {"train_loss": -10.577089309692383, "global_step": 117565, "epoch": 699} {"train_loss": -10.32591438293457, "global_step": 117566, "epoch": 699} {"train_loss": -10.265541076660156, "global_step": 117567, "epoch": 699} {"train_loss": -10.158954620361328, "global_step": 117568, "epoch": 699} {"train_loss": -9.896095275878906, "global_step": 117569, "epoch": 699} {"train_loss": -10.399223327636719, "global_step": 117570, "epoch": 699} {"train_loss": -9.97916316986084, "global_step": 117571, "epoch": 699} {"train_loss": -10.183788299560547, "global_step": 117572, "epoch": 699} {"train_loss": -10.428866386413574, "global_step": 117573, "epoch": 699} {"train_loss": -10.242988586425781, "global_step": 117574, "epoch": 699} {"train_loss": -10.078293800354004, "global_step": 117575, "epoch": 699} {"train_loss": -10.445627212524414, "global_step": 117576, "epoch": 699} {"train_loss": -10.040992736816406, "global_step": 117577, "epoch": 699} {"train_loss": -10.093476295471191, "global_step": 117578, "epoch": 699} {"train_loss": -10.22437858581543, "global_step": 117579, "epoch": 699} {"train_loss": -10.074666023254395, "global_step": 117580, "epoch": 699} {"train_loss": -9.794755935668945, "global_step": 117581, "epoch": 699} {"train_loss": -10.343315124511719, "global_step": 117582, "epoch": 699} {"train_loss": -9.438604354858398, "global_step": 117583, "epoch": 699} {"train_loss": -10.13390064239502, "global_step": 117584, "epoch": 699} {"train_loss": -9.736917495727539, "global_step": 117585, "epoch": 699} {"train_loss": -9.603623390197754, "global_step": 117586, "epoch": 699} {"train_loss": -10.09404182434082, "global_step": 117587, "epoch": 699} {"train_loss": -9.524188995361328, "global_step": 117588, "epoch": 699} {"train_loss": -10.264524459838867, "global_step": 117589, "epoch": 699} {"train_loss": -9.72380542755127, "global_step": 117590, "epoch": 699} {"train_loss": -9.879347801208496, "global_step": 117591, "epoch": 699} {"train_loss": -10.209912300109863, "global_step": 117592, "epoch": 699} {"train_loss": -9.90360164642334, "global_step": 117593, "epoch": 699} {"train_loss": -10.11941909790039, "global_step": 117594, "epoch": 699} {"train_loss": -9.86004638671875, "global_step": 117595, "epoch": 699} {"train_loss": -9.989814758300781, "global_step": 117596, "epoch": 699} {"train_loss": -9.732518196105957, "global_step": 117597, "epoch": 699} {"train_loss": -10.227618217468262, "global_step": 117598, "epoch": 699} {"train_loss": -10.052977885518755, "global_step": 117599, "epoch": 699, "val_loss": 211455.484375} {"train_loss": -10.008171081542969, "global_step": 117600, "epoch": 700} {"train_loss": -10.0255126953125, "global_step": 117601, "epoch": 700} {"train_loss": -10.225770950317383, "global_step": 117602, "epoch": 700} {"train_loss": -9.75324821472168, "global_step": 117603, "epoch": 700} {"train_loss": -9.936094284057617, "global_step": 117604, "epoch": 700} {"train_loss": -9.928160667419434, "global_step": 117605, "epoch": 700} {"train_loss": -10.220874786376953, "global_step": 117606, "epoch": 700} {"train_loss": -10.053047180175781, "global_step": 117607, "epoch": 700} {"train_loss": -10.277543067932129, "global_step": 117608, "epoch": 700} {"train_loss": -9.981588363647461, "global_step": 117609, "epoch": 700} {"train_loss": -10.308420181274414, "global_step": 117610, "epoch": 700} {"train_loss": -9.987354278564453, "global_step": 117611, "epoch": 700} {"train_loss": -10.335229873657227, "global_step": 117612, "epoch": 700} {"train_loss": -10.233020782470703, "global_step": 117613, "epoch": 700} {"train_loss": -10.253436088562012, "global_step": 117614, "epoch": 700} {"train_loss": -10.397445678710938, "global_step": 117615, "epoch": 700} {"train_loss": -10.18298625946045, "global_step": 117616, "epoch": 700} {"train_loss": -10.078712463378906, "global_step": 117617, "epoch": 700} {"train_loss": -10.16274642944336, "global_step": 117618, "epoch": 700} {"train_loss": -10.120698928833008, "global_step": 117619, "epoch": 700} {"train_loss": -9.531901359558105, "global_step": 117620, "epoch": 700} {"train_loss": -9.84090805053711, "global_step": 117621, "epoch": 700} {"train_loss": -9.55146598815918, "global_step": 117622, "epoch": 700} {"train_loss": -9.912858963012695, "global_step": 117623, "epoch": 700} {"train_loss": -9.623912811279297, "global_step": 117624, "epoch": 700} {"train_loss": -9.855563163757324, "global_step": 117625, "epoch": 700} {"train_loss": -9.76262092590332, "global_step": 117626, "epoch": 700} {"train_loss": -10.070442199707031, "global_step": 117627, "epoch": 700} {"train_loss": -10.074015617370605, "global_step": 117628, "epoch": 700} {"train_loss": -10.021196365356445, "global_step": 117629, "epoch": 700} {"train_loss": -10.221948623657227, "global_step": 117630, "epoch": 700} {"train_loss": -10.08662223815918, "global_step": 117631, "epoch": 700} {"train_loss": -10.260198593139648, "global_step": 117632, "epoch": 700} {"train_loss": -10.275883674621582, "global_step": 117633, "epoch": 700} {"train_loss": -10.270965576171875, "global_step": 117634, "epoch": 700} {"train_loss": -10.307201385498047, "global_step": 117635, "epoch": 700} {"train_loss": -10.167223930358887, "global_step": 117636, "epoch": 700} {"train_loss": -10.391836166381836, "global_step": 117637, "epoch": 700} {"train_loss": -10.020366668701172, "global_step": 117638, "epoch": 700} {"train_loss": -10.173089981079102, "global_step": 117639, "epoch": 700} {"train_loss": -10.288983345031738, "global_step": 117640, "epoch": 700} {"train_loss": -10.385171890258789, "global_step": 117641, "epoch": 700} {"train_loss": -10.063023567199707, "global_step": 117642, "epoch": 700} {"train_loss": -10.1173095703125, "global_step": 117643, "epoch": 700} {"train_loss": -10.339561462402344, "global_step": 117644, "epoch": 700} {"train_loss": -10.363767623901367, "global_step": 117645, "epoch": 700} {"train_loss": -10.3363618850708, "global_step": 117646, "epoch": 700} {"train_loss": -10.295604705810547, "global_step": 117647, "epoch": 700} {"train_loss": -10.204527854919434, "global_step": 117648, "epoch": 700} {"train_loss": -10.041783332824707, "global_step": 117649, "epoch": 700} {"train_loss": -10.153083801269531, "global_step": 117650, "epoch": 700} {"train_loss": -9.927391052246094, "global_step": 117651, "epoch": 700} {"train_loss": -10.227066040039062, "global_step": 117652, "epoch": 700} {"train_loss": -10.254953384399414, "global_step": 117653, "epoch": 700} {"train_loss": -10.164987564086914, "global_step": 117654, "epoch": 700} {"train_loss": -10.303365707397461, "global_step": 117655, "epoch": 700} {"train_loss": -9.850809097290039, "global_step": 117656, "epoch": 700} {"train_loss": -10.505937576293945, "global_step": 117657, "epoch": 700} {"train_loss": -9.712409973144531, "global_step": 117658, "epoch": 700} {"train_loss": -10.000783920288086, "global_step": 117659, "epoch": 700} {"train_loss": -9.882047653198242, "global_step": 117660, "epoch": 700} {"train_loss": -9.452007293701172, "global_step": 117661, "epoch": 700} {"train_loss": -10.217635154724121, "global_step": 117662, "epoch": 700} {"train_loss": -9.713396072387695, "global_step": 117663, "epoch": 700} {"train_loss": -10.121131896972656, "global_step": 117664, "epoch": 700} {"train_loss": -9.750568389892578, "global_step": 117665, "epoch": 700} {"train_loss": -9.789177894592285, "global_step": 117666, "epoch": 700} {"train_loss": -10.260950088500977, "global_step": 117667, "epoch": 700} {"train_loss": -9.811534881591797, "global_step": 117668, "epoch": 700} {"train_loss": -9.950552940368652, "global_step": 117669, "epoch": 700} {"train_loss": -9.789350509643555, "global_step": 117670, "epoch": 700} {"train_loss": -10.080198287963867, "global_step": 117671, "epoch": 700} {"train_loss": -9.917226791381836, "global_step": 117672, "epoch": 700} {"train_loss": -9.929708480834961, "global_step": 117673, "epoch": 700} {"train_loss": -9.709685325622559, "global_step": 117674, "epoch": 700} {"train_loss": -10.117417335510254, "global_step": 117675, "epoch": 700} {"train_loss": -10.050888061523438, "global_step": 117676, "epoch": 700} {"train_loss": -9.955663681030273, "global_step": 117677, "epoch": 700} {"train_loss": -10.136589050292969, "global_step": 117678, "epoch": 700} {"train_loss": -10.256223678588867, "global_step": 117679, "epoch": 700} {"train_loss": -10.113887786865234, "global_step": 117680, "epoch": 700} {"train_loss": -10.09404468536377, "global_step": 117681, "epoch": 700} {"train_loss": -9.898272514343262, "global_step": 117682, "epoch": 700} {"train_loss": -10.241214752197266, "global_step": 117683, "epoch": 700} {"train_loss": -9.879563331604004, "global_step": 117684, "epoch": 700} {"train_loss": -10.254913330078125, "global_step": 117685, "epoch": 700} {"train_loss": -9.977023124694824, "global_step": 117686, "epoch": 700} {"train_loss": -10.189142227172852, "global_step": 117687, "epoch": 700} {"train_loss": -10.146380424499512, "global_step": 117688, "epoch": 700} {"train_loss": -10.141866683959961, "global_step": 117689, "epoch": 700} {"train_loss": -10.29853630065918, "global_step": 117690, "epoch": 700} {"train_loss": -10.270726203918457, "global_step": 117691, "epoch": 700} {"train_loss": -10.029062271118164, "global_step": 117692, "epoch": 700} {"train_loss": -10.162602424621582, "global_step": 117693, "epoch": 700} {"train_loss": -10.117254257202148, "global_step": 117694, "epoch": 700} {"train_loss": -10.086099624633789, "global_step": 117695, "epoch": 700} {"train_loss": -10.008810043334961, "global_step": 117696, "epoch": 700} {"train_loss": -10.23828125, "global_step": 117697, "epoch": 700} {"train_loss": -10.048417091369629, "global_step": 117698, "epoch": 700} {"train_loss": -10.275489807128906, "global_step": 117699, "epoch": 700} {"train_loss": -10.319640159606934, "global_step": 117700, "epoch": 700} {"train_loss": -10.195148468017578, "global_step": 117701, "epoch": 700} {"train_loss": -10.140077590942383, "global_step": 117702, "epoch": 700} {"train_loss": -10.098485946655273, "global_step": 117703, "epoch": 700} {"train_loss": -10.21746826171875, "global_step": 117704, "epoch": 700} {"train_loss": -10.360218048095703, "global_step": 117705, "epoch": 700} {"train_loss": -10.228893280029297, "global_step": 117706, "epoch": 700} {"train_loss": -10.200021743774414, "global_step": 117707, "epoch": 700} {"train_loss": -10.106115341186523, "global_step": 117708, "epoch": 700} {"train_loss": -10.026638984680176, "global_step": 117709, "epoch": 700} {"train_loss": -9.962846755981445, "global_step": 117710, "epoch": 700} {"train_loss": -10.145183563232422, "global_step": 117711, "epoch": 700} {"train_loss": -9.81814193725586, "global_step": 117712, "epoch": 700} {"train_loss": -10.162174224853516, "global_step": 117713, "epoch": 700} {"train_loss": -10.223608016967773, "global_step": 117714, "epoch": 700} {"train_loss": -9.942190170288086, "global_step": 117715, "epoch": 700} {"train_loss": -10.033882141113281, "global_step": 117716, "epoch": 700} {"train_loss": -9.839574813842773, "global_step": 117717, "epoch": 700} {"train_loss": -10.38519287109375, "global_step": 117718, "epoch": 700} {"train_loss": -10.207938194274902, "global_step": 117719, "epoch": 700} {"train_loss": -10.317550659179688, "global_step": 117720, "epoch": 700} {"train_loss": -10.225503921508789, "global_step": 117721, "epoch": 700} {"train_loss": -10.067222595214844, "global_step": 117722, "epoch": 700} {"train_loss": -10.066834449768066, "global_step": 117723, "epoch": 700} {"train_loss": -9.853423118591309, "global_step": 117724, "epoch": 700} {"train_loss": -10.040067672729492, "global_step": 117725, "epoch": 700} {"train_loss": -10.011210441589355, "global_step": 117726, "epoch": 700} {"train_loss": -10.220993995666504, "global_step": 117727, "epoch": 700} {"train_loss": -10.06771469116211, "global_step": 117728, "epoch": 700} {"train_loss": -10.006162643432617, "global_step": 117729, "epoch": 700} {"train_loss": -9.943174362182617, "global_step": 117730, "epoch": 700} {"train_loss": -9.676361083984375, "global_step": 117731, "epoch": 700} {"train_loss": -10.092119216918945, "global_step": 117732, "epoch": 700} {"train_loss": -10.27310848236084, "global_step": 117733, "epoch": 700} {"train_loss": -9.640351295471191, "global_step": 117734, "epoch": 700} {"train_loss": -10.132821083068848, "global_step": 117735, "epoch": 700} {"train_loss": -10.06049633026123, "global_step": 117736, "epoch": 700} {"train_loss": -10.236437797546387, "global_step": 117737, "epoch": 700} {"train_loss": -9.90223503112793, "global_step": 117738, "epoch": 700} {"train_loss": -10.179475784301758, "global_step": 117739, "epoch": 700} {"train_loss": -10.122331619262695, "global_step": 117740, "epoch": 700} {"train_loss": -10.259025573730469, "global_step": 117741, "epoch": 700} {"train_loss": -10.169534683227539, "global_step": 117742, "epoch": 700} {"train_loss": -10.148274421691895, "global_step": 117743, "epoch": 700} {"train_loss": -10.243452072143555, "global_step": 117744, "epoch": 700} {"train_loss": -10.198905944824219, "global_step": 117745, "epoch": 700} {"train_loss": -10.168493270874023, "global_step": 117746, "epoch": 700} {"train_loss": -10.315499305725098, "global_step": 117747, "epoch": 700} {"train_loss": -10.233837127685547, "global_step": 117748, "epoch": 700} {"train_loss": -10.202573776245117, "global_step": 117749, "epoch": 700} {"train_loss": -10.02929973602295, "global_step": 117750, "epoch": 700} {"train_loss": -10.346307754516602, "global_step": 117751, "epoch": 700} {"train_loss": -10.202835083007812, "global_step": 117752, "epoch": 700} {"train_loss": -10.207324981689453, "global_step": 117753, "epoch": 700} {"train_loss": -10.317591667175293, "global_step": 117754, "epoch": 700} {"train_loss": -10.219112396240234, "global_step": 117755, "epoch": 700} {"train_loss": -10.210923194885254, "global_step": 117756, "epoch": 700} {"train_loss": -10.354154586791992, "global_step": 117757, "epoch": 700} {"train_loss": -10.040538787841797, "global_step": 117758, "epoch": 700} {"train_loss": -10.331266403198242, "global_step": 117759, "epoch": 700} {"train_loss": -10.009261131286621, "global_step": 117760, "epoch": 700} {"train_loss": -9.919137954711914, "global_step": 117761, "epoch": 700} {"train_loss": -10.231463432312012, "global_step": 117762, "epoch": 700} {"train_loss": -9.940215110778809, "global_step": 117763, "epoch": 700} {"train_loss": -10.02716064453125, "global_step": 117764, "epoch": 700} {"train_loss": -10.322410583496094, "global_step": 117765, "epoch": 700} {"train_loss": -9.908300399780273, "global_step": 117766, "epoch": 700} {"train_loss": -10.096732128234137, "global_step": 117767, "epoch": 700, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.0024409500416016326, "train/sim_max_reward_3": 0.12950594823926406, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.9943826856754151, "test/sim_max_reward_4400000": 0.2683044559680594, "test/sim_max_reward_4400001": 0.5909060190527388, "test/sim_max_reward_4400002": 0.9998429645296651, "test/sim_max_reward_4400003": 0.4996414344092382, "test/sim_max_reward_4400004": 0.37387494095770324, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 0.6226979055589913, "test/sim_max_reward_4400007": 0.7851079086219415, "test/sim_max_reward_4400008": 0.540362263685363, "test/sim_max_reward_4400009": 0.4298633275642299, "test/sim_max_reward_4400010": 0.27626881765959566, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.6855758075424803, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 0.4399411922076705, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.9744690508361807, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.9843902511527118, "test/sim_max_reward_4400024": 0.700899353030437, "test/sim_max_reward_4400025": 0.5162650412212435, "test/sim_max_reward_4400026": 1.0, "test/sim_max_reward_4400027": 1.0, "test/sim_max_reward_4400028": 1.0, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9965221121054236, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.7206218461675049, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.37590315376351413, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.9935696821843074, "test/sim_max_reward_4400040": 0.11267991923207034, "test/sim_max_reward_4400041": 0.4897979329731858, "test/sim_max_reward_4400042": 0.08223554263307402, "test/sim_max_reward_4400043": 0.6788787980335047, "test/sim_max_reward_4400044": 0.9677007270755986, "test/sim_max_reward_4400045": 0.42728810971005543, "test/sim_max_reward_4400046": 0.9939910643037904, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6877215973260468, "test/mean_score": 0.6362385041310461, "val_loss": 214186.28125, "train_action_mse_error": 1.9098711013793945} {"train_loss": -10.145161628723145, "global_step": 117768, "epoch": 701} {"train_loss": -9.868253707885742, "global_step": 117769, "epoch": 701} {"train_loss": -10.458841323852539, "global_step": 117770, "epoch": 701} {"train_loss": -9.975512504577637, "global_step": 117771, "epoch": 701} {"train_loss": -10.335637092590332, "global_step": 117772, "epoch": 701} {"train_loss": -9.964338302612305, "global_step": 117773, "epoch": 701} {"train_loss": -9.974696159362793, "global_step": 117774, "epoch": 701} {"train_loss": -10.366495132446289, "global_step": 117775, "epoch": 701} {"train_loss": -9.778423309326172, "global_step": 117776, "epoch": 701} {"train_loss": -9.797006607055664, "global_step": 117777, "epoch": 701} {"train_loss": -10.235158920288086, "global_step": 117778, "epoch": 701} {"train_loss": -9.66300106048584, "global_step": 117779, "epoch": 701} {"train_loss": -10.204046249389648, "global_step": 117780, "epoch": 701} {"train_loss": -9.76986312866211, "global_step": 117781, "epoch": 701} {"train_loss": -9.92175579071045, "global_step": 117782, "epoch": 701} {"train_loss": -10.066617965698242, "global_step": 117783, "epoch": 701} {"train_loss": -9.865436553955078, "global_step": 117784, "epoch": 701} {"train_loss": -10.066850662231445, "global_step": 117785, "epoch": 701} {"train_loss": -10.189103126525879, "global_step": 117786, "epoch": 701} {"train_loss": -9.894134521484375, "global_step": 117787, "epoch": 701} {"train_loss": -10.1998872756958, "global_step": 117788, "epoch": 701} {"train_loss": -10.053556442260742, "global_step": 117789, "epoch": 701} {"train_loss": -10.336953163146973, "global_step": 117790, "epoch": 701} {"train_loss": -10.045501708984375, "global_step": 117791, "epoch": 701} {"train_loss": -10.246236801147461, "global_step": 117792, "epoch": 701} {"train_loss": -10.007980346679688, "global_step": 117793, "epoch": 701} {"train_loss": -9.860633850097656, "global_step": 117794, "epoch": 701} {"train_loss": -9.912641525268555, "global_step": 117795, "epoch": 701} {"train_loss": -10.1925048828125, "global_step": 117796, "epoch": 701} {"train_loss": -9.970545768737793, "global_step": 117797, "epoch": 701} {"train_loss": -10.220596313476562, "global_step": 117798, "epoch": 701} {"train_loss": -10.096444129943848, "global_step": 117799, "epoch": 701} {"train_loss": -10.20693588256836, "global_step": 117800, "epoch": 701} {"train_loss": -10.023103713989258, "global_step": 117801, "epoch": 701} {"train_loss": -10.222814559936523, "global_step": 117802, "epoch": 701} {"train_loss": -10.040328979492188, "global_step": 117803, "epoch": 701} {"train_loss": -10.162206649780273, "global_step": 117804, "epoch": 701} {"train_loss": -10.137088775634766, "global_step": 117805, "epoch": 701} {"train_loss": -10.268346786499023, "global_step": 117806, "epoch": 701} {"train_loss": -10.332775115966797, "global_step": 117807, "epoch": 701} {"train_loss": -10.30869197845459, "global_step": 117808, "epoch": 701} {"train_loss": -10.3248291015625, "global_step": 117809, "epoch": 701} {"train_loss": -10.138935089111328, "global_step": 117810, "epoch": 701} {"train_loss": -10.194043159484863, "global_step": 117811, "epoch": 701} {"train_loss": -10.345952033996582, "global_step": 117812, "epoch": 701} {"train_loss": -10.31796646118164, "global_step": 117813, "epoch": 701} {"train_loss": -10.566351890563965, "global_step": 117814, "epoch": 701} {"train_loss": -10.414342880249023, "global_step": 117815, "epoch": 701} {"train_loss": -10.484662055969238, "global_step": 117816, "epoch": 701} {"train_loss": -10.37632942199707, "global_step": 117817, "epoch": 701} {"train_loss": -10.22465991973877, "global_step": 117818, "epoch": 701} {"train_loss": -10.219528198242188, "global_step": 117819, "epoch": 701} {"train_loss": -10.6729736328125, "global_step": 117820, "epoch": 701} {"train_loss": -9.76767635345459, "global_step": 117821, "epoch": 701} {"train_loss": -9.987898826599121, "global_step": 117822, "epoch": 701} {"train_loss": -10.078279495239258, "global_step": 117823, "epoch": 701} {"train_loss": -10.373491287231445, "global_step": 117824, "epoch": 701} {"train_loss": -9.881365776062012, "global_step": 117825, "epoch": 701} {"train_loss": -10.25391674041748, "global_step": 117826, "epoch": 701} {"train_loss": -10.09299373626709, "global_step": 117827, "epoch": 701} {"train_loss": -9.74853515625, "global_step": 117828, "epoch": 701} {"train_loss": -9.94613265991211, "global_step": 117829, "epoch": 701} {"train_loss": -9.353141784667969, "global_step": 117830, "epoch": 701} {"train_loss": -10.226070404052734, "global_step": 117831, "epoch": 701} {"train_loss": -9.80578899383545, "global_step": 117832, "epoch": 701} {"train_loss": -10.037374496459961, "global_step": 117833, "epoch": 701} {"train_loss": -9.768020629882812, "global_step": 117834, "epoch": 701} {"train_loss": -10.140766143798828, "global_step": 117835, "epoch": 701} {"train_loss": -9.952062606811523, "global_step": 117836, "epoch": 701} {"train_loss": -9.917065620422363, "global_step": 117837, "epoch": 701} {"train_loss": -10.077044486999512, "global_step": 117838, "epoch": 701} {"train_loss": -10.159910202026367, "global_step": 117839, "epoch": 701} {"train_loss": -10.12829303741455, "global_step": 117840, "epoch": 701} {"train_loss": -10.04824447631836, "global_step": 117841, "epoch": 701} {"train_loss": -10.103710174560547, "global_step": 117842, "epoch": 701} {"train_loss": -10.257200241088867, "global_step": 117843, "epoch": 701} {"train_loss": -10.155252456665039, "global_step": 117844, "epoch": 701} {"train_loss": -9.935792922973633, "global_step": 117845, "epoch": 701} {"train_loss": -10.453014373779297, "global_step": 117846, "epoch": 701} {"train_loss": -10.074361801147461, "global_step": 117847, "epoch": 701} {"train_loss": -10.254905700683594, "global_step": 117848, "epoch": 701} {"train_loss": -10.327142715454102, "global_step": 117849, "epoch": 701} {"train_loss": -10.104608535766602, "global_step": 117850, "epoch": 701} {"train_loss": -10.195211410522461, "global_step": 117851, "epoch": 701} {"train_loss": -10.35683822631836, "global_step": 117852, "epoch": 701} {"train_loss": -10.130110740661621, "global_step": 117853, "epoch": 701} {"train_loss": -9.923990249633789, "global_step": 117854, "epoch": 701} {"train_loss": -10.01008415222168, "global_step": 117855, "epoch": 701} {"train_loss": -10.212689399719238, "global_step": 117856, "epoch": 701} {"train_loss": -10.177452087402344, "global_step": 117857, "epoch": 701} {"train_loss": -10.212438583374023, "global_step": 117858, "epoch": 701} {"train_loss": -10.036994934082031, "global_step": 117859, "epoch": 701} {"train_loss": -10.345544815063477, "global_step": 117860, "epoch": 701} {"train_loss": -9.770151138305664, "global_step": 117861, "epoch": 701} {"train_loss": -10.127470016479492, "global_step": 117862, "epoch": 701} {"train_loss": -9.867314338684082, "global_step": 117863, "epoch": 701} {"train_loss": -10.103838920593262, "global_step": 117864, "epoch": 701} {"train_loss": -10.407124519348145, "global_step": 117865, "epoch": 701} {"train_loss": -10.060277938842773, "global_step": 117866, "epoch": 701} {"train_loss": -10.409845352172852, "global_step": 117867, "epoch": 701} {"train_loss": -9.935335159301758, "global_step": 117868, "epoch": 701} {"train_loss": -10.13809871673584, "global_step": 117869, "epoch": 701} {"train_loss": -9.921947479248047, "global_step": 117870, "epoch": 701} {"train_loss": -10.21904182434082, "global_step": 117871, "epoch": 701} {"train_loss": -10.148576736450195, "global_step": 117872, "epoch": 701} {"train_loss": -10.105168342590332, "global_step": 117873, "epoch": 701} {"train_loss": -10.081353187561035, "global_step": 117874, "epoch": 701} {"train_loss": -10.095949172973633, "global_step": 117875, "epoch": 701} {"train_loss": -10.114890098571777, "global_step": 117876, "epoch": 701} {"train_loss": -10.073206901550293, "global_step": 117877, "epoch": 701} {"train_loss": -10.284929275512695, "global_step": 117878, "epoch": 701} {"train_loss": -9.958501815795898, "global_step": 117879, "epoch": 701} {"train_loss": -10.038055419921875, "global_step": 117880, "epoch": 701} {"train_loss": -10.159996032714844, "global_step": 117881, "epoch": 701} {"train_loss": -10.021953582763672, "global_step": 117882, "epoch": 701} {"train_loss": -10.47479248046875, "global_step": 117883, "epoch": 701} {"train_loss": -9.758750915527344, "global_step": 117884, "epoch": 701} {"train_loss": -10.169187545776367, "global_step": 117885, "epoch": 701} {"train_loss": -9.950952529907227, "global_step": 117886, "epoch": 701} {"train_loss": -10.021751403808594, "global_step": 117887, "epoch": 701} {"train_loss": -9.983810424804688, "global_step": 117888, "epoch": 701} {"train_loss": -9.812198638916016, "global_step": 117889, "epoch": 701} {"train_loss": -10.075655937194824, "global_step": 117890, "epoch": 701} {"train_loss": -9.786593437194824, "global_step": 117891, "epoch": 701} {"train_loss": -9.992485046386719, "global_step": 117892, "epoch": 701} {"train_loss": -9.834911346435547, "global_step": 117893, "epoch": 701} {"train_loss": -10.048646926879883, "global_step": 117894, "epoch": 701} {"train_loss": -10.295984268188477, "global_step": 117895, "epoch": 701} {"train_loss": -9.812553405761719, "global_step": 117896, "epoch": 701} {"train_loss": -10.119970321655273, "global_step": 117897, "epoch": 701} {"train_loss": -10.217957496643066, "global_step": 117898, "epoch": 701} {"train_loss": -10.009263038635254, "global_step": 117899, "epoch": 701} {"train_loss": -10.291175842285156, "global_step": 117900, "epoch": 701} {"train_loss": -9.879046440124512, "global_step": 117901, "epoch": 701} {"train_loss": -10.289701461791992, "global_step": 117902, "epoch": 701} {"train_loss": -10.094300270080566, "global_step": 117903, "epoch": 701} {"train_loss": -9.984073638916016, "global_step": 117904, "epoch": 701} {"train_loss": -10.184571266174316, "global_step": 117905, "epoch": 701} {"train_loss": -9.82634162902832, "global_step": 117906, "epoch": 701} {"train_loss": -9.936007499694824, "global_step": 117907, "epoch": 701} {"train_loss": -9.847127914428711, "global_step": 117908, "epoch": 701} {"train_loss": -10.047303199768066, "global_step": 117909, "epoch": 701} {"train_loss": -9.796060562133789, "global_step": 117910, "epoch": 701} {"train_loss": -9.882328033447266, "global_step": 117911, "epoch": 701} {"train_loss": -9.848021507263184, "global_step": 117912, "epoch": 701} {"train_loss": -9.711433410644531, "global_step": 117913, "epoch": 701} {"train_loss": -9.965230941772461, "global_step": 117914, "epoch": 701} {"train_loss": -9.553500175476074, "global_step": 117915, "epoch": 701} {"train_loss": -10.279191970825195, "global_step": 117916, "epoch": 701} {"train_loss": -9.715764999389648, "global_step": 117917, "epoch": 701} {"train_loss": -9.793304443359375, "global_step": 117918, "epoch": 701} {"train_loss": -10.338994026184082, "global_step": 117919, "epoch": 701} {"train_loss": -9.979421615600586, "global_step": 117920, "epoch": 701} {"train_loss": -10.018813133239746, "global_step": 117921, "epoch": 701} {"train_loss": -9.843914985656738, "global_step": 117922, "epoch": 701} {"train_loss": -10.092367172241211, "global_step": 117923, "epoch": 701} {"train_loss": -9.836236953735352, "global_step": 117924, "epoch": 701} {"train_loss": -10.28451156616211, "global_step": 117925, "epoch": 701} {"train_loss": -9.929778099060059, "global_step": 117926, "epoch": 701} {"train_loss": -10.267889022827148, "global_step": 117927, "epoch": 701} {"train_loss": -10.245080947875977, "global_step": 117928, "epoch": 701} {"train_loss": -10.148826599121094, "global_step": 117929, "epoch": 701} {"train_loss": -10.035399436950684, "global_step": 117930, "epoch": 701} {"train_loss": -10.172361373901367, "global_step": 117931, "epoch": 701} {"train_loss": -10.351648330688477, "global_step": 117932, "epoch": 701} {"train_loss": -10.233041763305664, "global_step": 117933, "epoch": 701} {"train_loss": -10.390390396118164, "global_step": 117934, "epoch": 701} {"train_loss": -10.084743953886486, "global_step": 117935, "epoch": 701, "val_loss": 212245.1875} {"train_loss": -10.387649536132812, "global_step": 117936, "epoch": 702} {"train_loss": -10.21210765838623, "global_step": 117937, "epoch": 702} {"train_loss": -10.314730644226074, "global_step": 117938, "epoch": 702} {"train_loss": -10.303659439086914, "global_step": 117939, "epoch": 702} {"train_loss": -10.123631477355957, "global_step": 117940, "epoch": 702} {"train_loss": -10.29239273071289, "global_step": 117941, "epoch": 702} {"train_loss": -10.28590202331543, "global_step": 117942, "epoch": 702} {"train_loss": -10.07304573059082, "global_step": 117943, "epoch": 702} {"train_loss": -10.256006240844727, "global_step": 117944, "epoch": 702} {"train_loss": -10.127456665039062, "global_step": 117945, "epoch": 702} {"train_loss": -10.2115478515625, "global_step": 117946, "epoch": 702} {"train_loss": -10.107101440429688, "global_step": 117947, "epoch": 702} {"train_loss": -10.128747940063477, "global_step": 117948, "epoch": 702} {"train_loss": -10.130189895629883, "global_step": 117949, "epoch": 702} {"train_loss": -10.211044311523438, "global_step": 117950, "epoch": 702} {"train_loss": -9.827142715454102, "global_step": 117951, "epoch": 702} {"train_loss": -9.67721176147461, "global_step": 117952, "epoch": 702} {"train_loss": -10.442270278930664, "global_step": 117953, "epoch": 702} {"train_loss": -10.202699661254883, "global_step": 117954, "epoch": 702} {"train_loss": -10.429729461669922, "global_step": 117955, "epoch": 702} {"train_loss": -10.356889724731445, "global_step": 117956, "epoch": 702} {"train_loss": -10.04068660736084, "global_step": 117957, "epoch": 702} {"train_loss": -10.160024642944336, "global_step": 117958, "epoch": 702} {"train_loss": -9.963117599487305, "global_step": 117959, "epoch": 702} {"train_loss": -10.499494552612305, "global_step": 117960, "epoch": 702} {"train_loss": -10.037052154541016, "global_step": 117961, "epoch": 702} {"train_loss": -10.338764190673828, "global_step": 117962, "epoch": 702} {"train_loss": -10.111799240112305, "global_step": 117963, "epoch": 702} {"train_loss": -9.998004913330078, "global_step": 117964, "epoch": 702} {"train_loss": -10.23419189453125, "global_step": 117965, "epoch": 702} {"train_loss": -10.109405517578125, "global_step": 117966, "epoch": 702} {"train_loss": -10.000468254089355, "global_step": 117967, "epoch": 702} {"train_loss": -10.02171516418457, "global_step": 117968, "epoch": 702} {"train_loss": -9.993067741394043, "global_step": 117969, "epoch": 702} {"train_loss": -10.124896049499512, "global_step": 117970, "epoch": 702} {"train_loss": -9.913566589355469, "global_step": 117971, "epoch": 702} {"train_loss": -10.099472045898438, "global_step": 117972, "epoch": 702} {"train_loss": -10.104470252990723, "global_step": 117973, "epoch": 702} {"train_loss": -9.998078346252441, "global_step": 117974, "epoch": 702} {"train_loss": -10.253271102905273, "global_step": 117975, "epoch": 702} {"train_loss": -10.350008010864258, "global_step": 117976, "epoch": 702} {"train_loss": -10.200479507446289, "global_step": 117977, "epoch": 702} {"train_loss": -9.955549240112305, "global_step": 117978, "epoch": 702} {"train_loss": -10.088356018066406, "global_step": 117979, "epoch": 702} {"train_loss": -10.200248718261719, "global_step": 117980, "epoch": 702} {"train_loss": -10.191999435424805, "global_step": 117981, "epoch": 702} {"train_loss": -10.229379653930664, "global_step": 117982, "epoch": 702} {"train_loss": -10.180290222167969, "global_step": 117983, "epoch": 702} {"train_loss": -9.82046890258789, "global_step": 117984, "epoch": 702} {"train_loss": -10.430133819580078, "global_step": 117985, "epoch": 702} {"train_loss": -9.976142883300781, "global_step": 117986, "epoch": 702} {"train_loss": -10.377325057983398, "global_step": 117987, "epoch": 702} {"train_loss": -10.28742790222168, "global_step": 117988, "epoch": 702} {"train_loss": -10.19011402130127, "global_step": 117989, "epoch": 702} {"train_loss": -9.95921516418457, "global_step": 117990, "epoch": 702} {"train_loss": -10.343847274780273, "global_step": 117991, "epoch": 702} {"train_loss": -10.205944061279297, "global_step": 117992, "epoch": 702} {"train_loss": -10.239110946655273, "global_step": 117993, "epoch": 702} {"train_loss": -10.369237899780273, "global_step": 117994, "epoch": 702} {"train_loss": -10.257546424865723, "global_step": 117995, "epoch": 702} {"train_loss": -10.28328800201416, "global_step": 117996, "epoch": 702} {"train_loss": -10.5037202835083, "global_step": 117997, "epoch": 702} {"train_loss": -10.277515411376953, "global_step": 117998, "epoch": 702} {"train_loss": -10.334478378295898, "global_step": 117999, "epoch": 702} {"train_loss": -10.270746231079102, "global_step": 118000, "epoch": 702} {"train_loss": -10.178354263305664, "global_step": 118001, "epoch": 702} {"train_loss": -10.348062515258789, "global_step": 118002, "epoch": 702} {"train_loss": -10.105669021606445, "global_step": 118003, "epoch": 702} {"train_loss": -10.284645080566406, "global_step": 118004, "epoch": 702} {"train_loss": -10.364452362060547, "global_step": 118005, "epoch": 702} {"train_loss": -10.266300201416016, "global_step": 118006, "epoch": 702} {"train_loss": -10.385046005249023, "global_step": 118007, "epoch": 702} {"train_loss": -10.174915313720703, "global_step": 118008, "epoch": 702} {"train_loss": -10.228931427001953, "global_step": 118009, "epoch": 702} {"train_loss": -10.056480407714844, "global_step": 118010, "epoch": 702} {"train_loss": -10.194385528564453, "global_step": 118011, "epoch": 702} {"train_loss": -10.200937271118164, "global_step": 118012, "epoch": 702} {"train_loss": -10.131990432739258, "global_step": 118013, "epoch": 702} {"train_loss": -10.326131820678711, "global_step": 118014, "epoch": 702} {"train_loss": -10.072395324707031, "global_step": 118015, "epoch": 702} {"train_loss": -9.994903564453125, "global_step": 118016, "epoch": 702} {"train_loss": -9.855997085571289, "global_step": 118017, "epoch": 702} {"train_loss": -9.488578796386719, "global_step": 118018, "epoch": 702} {"train_loss": -9.620269775390625, "global_step": 118019, "epoch": 702} {"train_loss": -8.783441543579102, "global_step": 118020, "epoch": 702} {"train_loss": -9.087837219238281, "global_step": 118021, "epoch": 702} {"train_loss": -9.325777053833008, "global_step": 118022, "epoch": 702} {"train_loss": -9.493576049804688, "global_step": 118023, "epoch": 702} {"train_loss": -9.39360523223877, "global_step": 118024, "epoch": 702} {"train_loss": -9.328389167785645, "global_step": 118025, "epoch": 702} {"train_loss": -9.69205379486084, "global_step": 118026, "epoch": 702} {"train_loss": -9.557342529296875, "global_step": 118027, "epoch": 702} {"train_loss": -9.935872077941895, "global_step": 118028, "epoch": 702} {"train_loss": -9.746949195861816, "global_step": 118029, "epoch": 702} {"train_loss": -9.808152198791504, "global_step": 118030, "epoch": 702} {"train_loss": -9.63302993774414, "global_step": 118031, "epoch": 702} {"train_loss": -9.391647338867188, "global_step": 118032, "epoch": 702} {"train_loss": -9.31103229522705, "global_step": 118033, "epoch": 702} {"train_loss": -9.544036865234375, "global_step": 118034, "epoch": 702} {"train_loss": -9.88729476928711, "global_step": 118035, "epoch": 702} {"train_loss": -9.361953735351562, "global_step": 118036, "epoch": 702} {"train_loss": -9.984392166137695, "global_step": 118037, "epoch": 702} {"train_loss": -9.4072904586792, "global_step": 118038, "epoch": 702} {"train_loss": -9.625639915466309, "global_step": 118039, "epoch": 702} {"train_loss": -9.830644607543945, "global_step": 118040, "epoch": 702} {"train_loss": -9.476936340332031, "global_step": 118041, "epoch": 702} {"train_loss": -9.730283737182617, "global_step": 118042, "epoch": 702} {"train_loss": -9.849621772766113, "global_step": 118043, "epoch": 702} {"train_loss": -9.862054824829102, "global_step": 118044, "epoch": 702} {"train_loss": -9.734748840332031, "global_step": 118045, "epoch": 702} {"train_loss": -9.878155708312988, "global_step": 118046, "epoch": 702} {"train_loss": -9.870241165161133, "global_step": 118047, "epoch": 702} {"train_loss": -9.798702239990234, "global_step": 118048, "epoch": 702} {"train_loss": -10.089734077453613, "global_step": 118049, "epoch": 702} {"train_loss": -9.845881462097168, "global_step": 118050, "epoch": 702} {"train_loss": -9.937417984008789, "global_step": 118051, "epoch": 702} {"train_loss": -9.957878112792969, "global_step": 118052, "epoch": 702} {"train_loss": -9.862936973571777, "global_step": 118053, "epoch": 702} {"train_loss": -10.129634857177734, "global_step": 118054, "epoch": 702} {"train_loss": -9.931053161621094, "global_step": 118055, "epoch": 702} {"train_loss": -9.949918746948242, "global_step": 118056, "epoch": 702} {"train_loss": -10.256392478942871, "global_step": 118057, "epoch": 702} {"train_loss": -9.81643009185791, "global_step": 118058, "epoch": 702} {"train_loss": -10.228409767150879, "global_step": 118059, "epoch": 702} {"train_loss": -10.136835098266602, "global_step": 118060, "epoch": 702} {"train_loss": -10.206462860107422, "global_step": 118061, "epoch": 702} {"train_loss": -10.085007667541504, "global_step": 118062, "epoch": 702} {"train_loss": -10.111855506896973, "global_step": 118063, "epoch": 702} {"train_loss": -10.253710746765137, "global_step": 118064, "epoch": 702} {"train_loss": -10.133749008178711, "global_step": 118065, "epoch": 702} {"train_loss": -10.112548828125, "global_step": 118066, "epoch": 702} {"train_loss": -10.267005920410156, "global_step": 118067, "epoch": 702} {"train_loss": -10.293307304382324, "global_step": 118068, "epoch": 702} {"train_loss": -10.243677139282227, "global_step": 118069, "epoch": 702} {"train_loss": -10.462095260620117, "global_step": 118070, "epoch": 702} {"train_loss": -10.241020202636719, "global_step": 118071, "epoch": 702} {"train_loss": -10.436110496520996, "global_step": 118072, "epoch": 702} {"train_loss": -10.327964782714844, "global_step": 118073, "epoch": 702} {"train_loss": -10.584049224853516, "global_step": 118074, "epoch": 702} {"train_loss": -10.162845611572266, "global_step": 118075, "epoch": 702} {"train_loss": -10.351067543029785, "global_step": 118076, "epoch": 702} {"train_loss": -10.268442153930664, "global_step": 118077, "epoch": 702} {"train_loss": -10.309294700622559, "global_step": 118078, "epoch": 702} {"train_loss": -9.883328437805176, "global_step": 118079, "epoch": 702} {"train_loss": -10.31432056427002, "global_step": 118080, "epoch": 702} {"train_loss": -10.375370025634766, "global_step": 118081, "epoch": 702} {"train_loss": -10.430025100708008, "global_step": 118082, "epoch": 702} {"train_loss": -10.114642143249512, "global_step": 118083, "epoch": 702} {"train_loss": -10.305591583251953, "global_step": 118084, "epoch": 702} {"train_loss": -10.182367324829102, "global_step": 118085, "epoch": 702} {"train_loss": -9.808065414428711, "global_step": 118086, "epoch": 702} {"train_loss": -10.34792423248291, "global_step": 118087, "epoch": 702} {"train_loss": -9.976217269897461, "global_step": 118088, "epoch": 702} {"train_loss": -9.822887420654297, "global_step": 118089, "epoch": 702} {"train_loss": -9.827975273132324, "global_step": 118090, "epoch": 702} {"train_loss": -10.132993698120117, "global_step": 118091, "epoch": 702} {"train_loss": -10.046216011047363, "global_step": 118092, "epoch": 702} {"train_loss": -10.225345611572266, "global_step": 118093, "epoch": 702} {"train_loss": -10.084534645080566, "global_step": 118094, "epoch": 702} {"train_loss": -10.235536575317383, "global_step": 118095, "epoch": 702} {"train_loss": -10.370466232299805, "global_step": 118096, "epoch": 702} {"train_loss": -10.153778076171875, "global_step": 118097, "epoch": 702} {"train_loss": -9.964157104492188, "global_step": 118098, "epoch": 702} {"train_loss": -10.213568687438965, "global_step": 118099, "epoch": 702} {"train_loss": -10.141416549682617, "global_step": 118100, "epoch": 702} {"train_loss": -10.128151893615723, "global_step": 118101, "epoch": 702} {"train_loss": -9.820791244506836, "global_step": 118102, "epoch": 702} {"train_loss": -10.060342277799334, "global_step": 118103, "epoch": 702, "val_loss": 211958.734375} {"train_loss": -10.079839706420898, "global_step": 118104, "epoch": 703} {"train_loss": -10.118789672851562, "global_step": 118105, "epoch": 703} {"train_loss": -10.02421760559082, "global_step": 118106, "epoch": 703} {"train_loss": -10.120203018188477, "global_step": 118107, "epoch": 703} {"train_loss": -10.086895942687988, "global_step": 118108, "epoch": 703} {"train_loss": -10.175506591796875, "global_step": 118109, "epoch": 703} {"train_loss": -10.168817520141602, "global_step": 118110, "epoch": 703} {"train_loss": -10.090883255004883, "global_step": 118111, "epoch": 703} {"train_loss": -9.79046630859375, "global_step": 118112, "epoch": 703} {"train_loss": -10.250076293945312, "global_step": 118113, "epoch": 703} {"train_loss": -9.687726020812988, "global_step": 118114, "epoch": 703} {"train_loss": -10.260191917419434, "global_step": 118115, "epoch": 703} {"train_loss": -9.816932678222656, "global_step": 118116, "epoch": 703} {"train_loss": -10.174985885620117, "global_step": 118117, "epoch": 703} {"train_loss": -9.954427719116211, "global_step": 118118, "epoch": 703} {"train_loss": -10.202284812927246, "global_step": 118119, "epoch": 703} {"train_loss": -9.918724060058594, "global_step": 118120, "epoch": 703} {"train_loss": -10.138368606567383, "global_step": 118121, "epoch": 703} {"train_loss": -10.00833511352539, "global_step": 118122, "epoch": 703} {"train_loss": -10.114416122436523, "global_step": 118123, "epoch": 703} {"train_loss": -9.96470832824707, "global_step": 118124, "epoch": 703} {"train_loss": -9.886527061462402, "global_step": 118125, "epoch": 703} {"train_loss": -9.912336349487305, "global_step": 118126, "epoch": 703} {"train_loss": -9.936668395996094, "global_step": 118127, "epoch": 703} {"train_loss": -9.579414367675781, "global_step": 118128, "epoch": 703} {"train_loss": -10.339496612548828, "global_step": 118129, "epoch": 703} {"train_loss": -9.728157043457031, "global_step": 118130, "epoch": 703} {"train_loss": -10.065872192382812, "global_step": 118131, "epoch": 703} {"train_loss": -9.976703643798828, "global_step": 118132, "epoch": 703} {"train_loss": -10.16219425201416, "global_step": 118133, "epoch": 703} {"train_loss": -9.922603607177734, "global_step": 118134, "epoch": 703} {"train_loss": -10.018330574035645, "global_step": 118135, "epoch": 703} {"train_loss": -9.698169708251953, "global_step": 118136, "epoch": 703} {"train_loss": -10.217523574829102, "global_step": 118137, "epoch": 703} {"train_loss": -9.852787017822266, "global_step": 118138, "epoch": 703} {"train_loss": -9.747736930847168, "global_step": 118139, "epoch": 703} {"train_loss": -9.840723037719727, "global_step": 118140, "epoch": 703} {"train_loss": -9.45473861694336, "global_step": 118141, "epoch": 703} {"train_loss": -9.960049629211426, "global_step": 118142, "epoch": 703} {"train_loss": -9.505946159362793, "global_step": 118143, "epoch": 703} {"train_loss": -9.770355224609375, "global_step": 118144, "epoch": 703} {"train_loss": -9.882716178894043, "global_step": 118145, "epoch": 703} {"train_loss": -9.430983543395996, "global_step": 118146, "epoch": 703} {"train_loss": -9.836960792541504, "global_step": 118147, "epoch": 703} {"train_loss": -9.364962577819824, "global_step": 118148, "epoch": 703} {"train_loss": -9.652240753173828, "global_step": 118149, "epoch": 703} {"train_loss": -9.523645401000977, "global_step": 118150, "epoch": 703} {"train_loss": -9.839787483215332, "global_step": 118151, "epoch": 703} {"train_loss": -9.67139720916748, "global_step": 118152, "epoch": 703} {"train_loss": -9.62573528289795, "global_step": 118153, "epoch": 703} {"train_loss": -10.24468994140625, "global_step": 118154, "epoch": 703} {"train_loss": -9.714558601379395, "global_step": 118155, "epoch": 703} {"train_loss": -9.843931198120117, "global_step": 118156, "epoch": 703} {"train_loss": -9.73554515838623, "global_step": 118157, "epoch": 703} {"train_loss": -10.105457305908203, "global_step": 118158, "epoch": 703} {"train_loss": -9.764203071594238, "global_step": 118159, "epoch": 703} {"train_loss": -10.019323348999023, "global_step": 118160, "epoch": 703} {"train_loss": -9.817452430725098, "global_step": 118161, "epoch": 703} {"train_loss": -9.952377319335938, "global_step": 118162, "epoch": 703} {"train_loss": -10.158143997192383, "global_step": 118163, "epoch": 703} {"train_loss": -10.052215576171875, "global_step": 118164, "epoch": 703} {"train_loss": -10.101807594299316, "global_step": 118165, "epoch": 703} {"train_loss": -10.133761405944824, "global_step": 118166, "epoch": 703} {"train_loss": -9.970183372497559, "global_step": 118167, "epoch": 703} {"train_loss": -10.01486587524414, "global_step": 118168, "epoch": 703} {"train_loss": -10.092965126037598, "global_step": 118169, "epoch": 703} {"train_loss": -10.198928833007812, "global_step": 118170, "epoch": 703} {"train_loss": -10.094022750854492, "global_step": 118171, "epoch": 703} {"train_loss": -10.083831787109375, "global_step": 118172, "epoch": 703} {"train_loss": -10.120466232299805, "global_step": 118173, "epoch": 703} {"train_loss": -10.148067474365234, "global_step": 118174, "epoch": 703} {"train_loss": -10.099916458129883, "global_step": 118175, "epoch": 703} {"train_loss": -10.220328330993652, "global_step": 118176, "epoch": 703} {"train_loss": -9.918216705322266, "global_step": 118177, "epoch": 703} {"train_loss": -10.429910659790039, "global_step": 118178, "epoch": 703} {"train_loss": -10.15147590637207, "global_step": 118179, "epoch": 703} {"train_loss": -10.096189498901367, "global_step": 118180, "epoch": 703} {"train_loss": -10.179211616516113, "global_step": 118181, "epoch": 703} {"train_loss": -10.014822959899902, "global_step": 118182, "epoch": 703} {"train_loss": -10.13657283782959, "global_step": 118183, "epoch": 703} {"train_loss": -10.064474105834961, "global_step": 118184, "epoch": 703} {"train_loss": -10.006168365478516, "global_step": 118185, "epoch": 703} {"train_loss": -10.249076843261719, "global_step": 118186, "epoch": 703} {"train_loss": -10.365392684936523, "global_step": 118187, "epoch": 703} {"train_loss": -10.302865982055664, "global_step": 118188, "epoch": 703} {"train_loss": -10.208444595336914, "global_step": 118189, "epoch": 703} {"train_loss": -10.080177307128906, "global_step": 118190, "epoch": 703} {"train_loss": -10.387898445129395, "global_step": 118191, "epoch": 703} {"train_loss": -10.279229164123535, "global_step": 118192, "epoch": 703} {"train_loss": -10.148599624633789, "global_step": 118193, "epoch": 703} {"train_loss": -10.134265899658203, "global_step": 118194, "epoch": 703} {"train_loss": -10.423364639282227, "global_step": 118195, "epoch": 703} {"train_loss": -10.292236328125, "global_step": 118196, "epoch": 703} {"train_loss": -10.15180492401123, "global_step": 118197, "epoch": 703} {"train_loss": -10.19675350189209, "global_step": 118198, "epoch": 703} {"train_loss": -10.272321701049805, "global_step": 118199, "epoch": 703} {"train_loss": -10.470759391784668, "global_step": 118200, "epoch": 703} {"train_loss": -10.450732231140137, "global_step": 118201, "epoch": 703} {"train_loss": -10.062932968139648, "global_step": 118202, "epoch": 703} {"train_loss": -10.246188163757324, "global_step": 118203, "epoch": 703} {"train_loss": -10.389798164367676, "global_step": 118204, "epoch": 703} {"train_loss": -10.36850357055664, "global_step": 118205, "epoch": 703} {"train_loss": -10.212518692016602, "global_step": 118206, "epoch": 703} {"train_loss": -10.373580932617188, "global_step": 118207, "epoch": 703} {"train_loss": -10.155728340148926, "global_step": 118208, "epoch": 703} {"train_loss": -10.080491065979004, "global_step": 118209, "epoch": 703} {"train_loss": -10.344063758850098, "global_step": 118210, "epoch": 703} {"train_loss": -10.237613677978516, "global_step": 118211, "epoch": 703} {"train_loss": -10.201275825500488, "global_step": 118212, "epoch": 703} {"train_loss": -10.302197456359863, "global_step": 118213, "epoch": 703} {"train_loss": -10.157543182373047, "global_step": 118214, "epoch": 703} {"train_loss": -10.094888687133789, "global_step": 118215, "epoch": 703} {"train_loss": -10.195352554321289, "global_step": 118216, "epoch": 703} {"train_loss": -10.26730728149414, "global_step": 118217, "epoch": 703} {"train_loss": -10.069753646850586, "global_step": 118218, "epoch": 703} {"train_loss": -9.842660903930664, "global_step": 118219, "epoch": 703} {"train_loss": -10.189420700073242, "global_step": 118220, "epoch": 703} {"train_loss": -9.968605041503906, "global_step": 118221, "epoch": 703} {"train_loss": -10.160506248474121, "global_step": 118222, "epoch": 703} {"train_loss": -10.09873104095459, "global_step": 118223, "epoch": 703} {"train_loss": -9.853752136230469, "global_step": 118224, "epoch": 703} {"train_loss": -10.270668983459473, "global_step": 118225, "epoch": 703} {"train_loss": -9.807046890258789, "global_step": 118226, "epoch": 703} {"train_loss": -10.421527862548828, "global_step": 118227, "epoch": 703} {"train_loss": -9.729902267456055, "global_step": 118228, "epoch": 703} {"train_loss": -10.043498992919922, "global_step": 118229, "epoch": 703} {"train_loss": -10.170438766479492, "global_step": 118230, "epoch": 703} {"train_loss": -9.921905517578125, "global_step": 118231, "epoch": 703} {"train_loss": -10.411861419677734, "global_step": 118232, "epoch": 703} {"train_loss": -10.240175247192383, "global_step": 118233, "epoch": 703} {"train_loss": -10.099709510803223, "global_step": 118234, "epoch": 703} {"train_loss": -10.23159122467041, "global_step": 118235, "epoch": 703} {"train_loss": -10.269575119018555, "global_step": 118236, "epoch": 703} {"train_loss": -10.110849380493164, "global_step": 118237, "epoch": 703} {"train_loss": -10.042839050292969, "global_step": 118238, "epoch": 703} {"train_loss": -9.725303649902344, "global_step": 118239, "epoch": 703} {"train_loss": -9.932670593261719, "global_step": 118240, "epoch": 703} {"train_loss": -10.07205581665039, "global_step": 118241, "epoch": 703} {"train_loss": -10.14244270324707, "global_step": 118242, "epoch": 703} {"train_loss": -10.195423126220703, "global_step": 118243, "epoch": 703} {"train_loss": -10.181049346923828, "global_step": 118244, "epoch": 703} {"train_loss": -9.934377670288086, "global_step": 118245, "epoch": 703} {"train_loss": -9.957084655761719, "global_step": 118246, "epoch": 703} {"train_loss": -10.085094451904297, "global_step": 118247, "epoch": 703} {"train_loss": -10.144810676574707, "global_step": 118248, "epoch": 703} {"train_loss": -10.38217544555664, "global_step": 118249, "epoch": 703} {"train_loss": -10.296039581298828, "global_step": 118250, "epoch": 703} {"train_loss": -10.241935729980469, "global_step": 118251, "epoch": 703} {"train_loss": -10.316373825073242, "global_step": 118252, "epoch": 703} {"train_loss": -10.235429763793945, "global_step": 118253, "epoch": 703} {"train_loss": -10.296868324279785, "global_step": 118254, "epoch": 703} {"train_loss": -10.262226104736328, "global_step": 118255, "epoch": 703} {"train_loss": -10.211822509765625, "global_step": 118256, "epoch": 703} {"train_loss": -10.215388298034668, "global_step": 118257, "epoch": 703} {"train_loss": -10.33875560760498, "global_step": 118258, "epoch": 703} {"train_loss": -10.037364959716797, "global_step": 118259, "epoch": 703} {"train_loss": -10.219079971313477, "global_step": 118260, "epoch": 703} {"train_loss": -10.427791595458984, "global_step": 118261, "epoch": 703} {"train_loss": -9.946470260620117, "global_step": 118262, "epoch": 703} {"train_loss": -10.178333282470703, "global_step": 118263, "epoch": 703} {"train_loss": -10.333026885986328, "global_step": 118264, "epoch": 703} {"train_loss": -10.245010375976562, "global_step": 118265, "epoch": 703} {"train_loss": -9.964759826660156, "global_step": 118266, "epoch": 703} {"train_loss": -10.272832870483398, "global_step": 118267, "epoch": 703} {"train_loss": -9.8145112991333, "global_step": 118268, "epoch": 703} {"train_loss": -10.099936485290527, "global_step": 118269, "epoch": 703} {"train_loss": -9.90353012084961, "global_step": 118270, "epoch": 703} {"train_loss": -10.06833665143876, "global_step": 118271, "epoch": 703, "val_loss": 213135.109375} {"train_loss": -10.033649444580078, "global_step": 118272, "epoch": 704} {"train_loss": -10.322782516479492, "global_step": 118273, "epoch": 704} {"train_loss": -10.050475120544434, "global_step": 118274, "epoch": 704} {"train_loss": -10.105901718139648, "global_step": 118275, "epoch": 704} {"train_loss": -9.846470832824707, "global_step": 118276, "epoch": 704} {"train_loss": -10.343406677246094, "global_step": 118277, "epoch": 704} {"train_loss": -9.828500747680664, "global_step": 118278, "epoch": 704} {"train_loss": -10.001912117004395, "global_step": 118279, "epoch": 704} {"train_loss": -10.075715065002441, "global_step": 118280, "epoch": 704} {"train_loss": -10.148019790649414, "global_step": 118281, "epoch": 704} {"train_loss": -10.434471130371094, "global_step": 118282, "epoch": 704} {"train_loss": -10.230856895446777, "global_step": 118283, "epoch": 704} {"train_loss": -10.420970916748047, "global_step": 118284, "epoch": 704} {"train_loss": -9.987659454345703, "global_step": 118285, "epoch": 704} {"train_loss": -10.240859985351562, "global_step": 118286, "epoch": 704} {"train_loss": -10.301551818847656, "global_step": 118287, "epoch": 704} {"train_loss": -10.068964004516602, "global_step": 118288, "epoch": 704} {"train_loss": -10.27651596069336, "global_step": 118289, "epoch": 704} {"train_loss": -10.255678176879883, "global_step": 118290, "epoch": 704} {"train_loss": -10.256597518920898, "global_step": 118291, "epoch": 704} {"train_loss": -10.511706352233887, "global_step": 118292, "epoch": 704} {"train_loss": -10.026130676269531, "global_step": 118293, "epoch": 704} {"train_loss": -10.406490325927734, "global_step": 118294, "epoch": 704} {"train_loss": -9.969606399536133, "global_step": 118295, "epoch": 704} {"train_loss": -10.230239868164062, "global_step": 118296, "epoch": 704} {"train_loss": -10.175056457519531, "global_step": 118297, "epoch": 704} {"train_loss": -10.327552795410156, "global_step": 118298, "epoch": 704} {"train_loss": -10.03719711303711, "global_step": 118299, "epoch": 704} {"train_loss": -9.992315292358398, "global_step": 118300, "epoch": 704} {"train_loss": -10.151268005371094, "global_step": 118301, "epoch": 704} {"train_loss": -10.07489013671875, "global_step": 118302, "epoch": 704} {"train_loss": -10.176738739013672, "global_step": 118303, "epoch": 704} {"train_loss": -9.996774673461914, "global_step": 118304, "epoch": 704} {"train_loss": -10.028522491455078, "global_step": 118305, "epoch": 704} {"train_loss": -9.40833854675293, "global_step": 118306, "epoch": 704} {"train_loss": -10.005115509033203, "global_step": 118307, "epoch": 704} {"train_loss": -9.733824729919434, "global_step": 118308, "epoch": 704} {"train_loss": -9.25912094116211, "global_step": 118309, "epoch": 704} {"train_loss": -10.057483673095703, "global_step": 118310, "epoch": 704} {"train_loss": -9.279029846191406, "global_step": 118311, "epoch": 704} {"train_loss": -10.199626922607422, "global_step": 118312, "epoch": 704} {"train_loss": -9.518436431884766, "global_step": 118313, "epoch": 704} {"train_loss": -10.020910263061523, "global_step": 118314, "epoch": 704} {"train_loss": -9.938477516174316, "global_step": 118315, "epoch": 704} {"train_loss": -9.516797065734863, "global_step": 118316, "epoch": 704} {"train_loss": -10.184967041015625, "global_step": 118317, "epoch": 704} {"train_loss": -9.851016998291016, "global_step": 118318, "epoch": 704} {"train_loss": -9.857621192932129, "global_step": 118319, "epoch": 704} {"train_loss": -9.759504318237305, "global_step": 118320, "epoch": 704} {"train_loss": -9.720970153808594, "global_step": 118321, "epoch": 704} {"train_loss": -9.822113037109375, "global_step": 118322, "epoch": 704} {"train_loss": -9.677644729614258, "global_step": 118323, "epoch": 704} {"train_loss": -9.770753860473633, "global_step": 118324, "epoch": 704} {"train_loss": -9.417570114135742, "global_step": 118325, "epoch": 704} {"train_loss": -9.597297668457031, "global_step": 118326, "epoch": 704} {"train_loss": -9.398829460144043, "global_step": 118327, "epoch": 704} {"train_loss": -9.97620964050293, "global_step": 118328, "epoch": 704} {"train_loss": -9.60239028930664, "global_step": 118329, "epoch": 704} {"train_loss": -10.004671096801758, "global_step": 118330, "epoch": 704} {"train_loss": -9.523346900939941, "global_step": 118331, "epoch": 704} {"train_loss": -9.748309135437012, "global_step": 118332, "epoch": 704} {"train_loss": -9.887198448181152, "global_step": 118333, "epoch": 704} {"train_loss": -9.964591979980469, "global_step": 118334, "epoch": 704} {"train_loss": -9.73464584350586, "global_step": 118335, "epoch": 704} {"train_loss": -9.998102188110352, "global_step": 118336, "epoch": 704} {"train_loss": -9.88082504272461, "global_step": 118337, "epoch": 704} {"train_loss": -10.02349853515625, "global_step": 118338, "epoch": 704} {"train_loss": -9.714424133300781, "global_step": 118339, "epoch": 704} {"train_loss": -10.047094345092773, "global_step": 118340, "epoch": 704} {"train_loss": -9.940006256103516, "global_step": 118341, "epoch": 704} {"train_loss": -10.02552604675293, "global_step": 118342, "epoch": 704} {"train_loss": -9.974522590637207, "global_step": 118343, "epoch": 704} {"train_loss": -10.124387741088867, "global_step": 118344, "epoch": 704} {"train_loss": -10.039907455444336, "global_step": 118345, "epoch": 704} {"train_loss": -10.075260162353516, "global_step": 118346, "epoch": 704} {"train_loss": -9.898209571838379, "global_step": 118347, "epoch": 704} {"train_loss": -10.208159446716309, "global_step": 118348, "epoch": 704} {"train_loss": -10.243468284606934, "global_step": 118349, "epoch": 704} {"train_loss": -10.355743408203125, "global_step": 118350, "epoch": 704} {"train_loss": -10.336130142211914, "global_step": 118351, "epoch": 704} {"train_loss": -10.100147247314453, "global_step": 118352, "epoch": 704} {"train_loss": -10.370227813720703, "global_step": 118353, "epoch": 704} {"train_loss": -10.256084442138672, "global_step": 118354, "epoch": 704} {"train_loss": -10.290700912475586, "global_step": 118355, "epoch": 704} {"train_loss": -10.405252456665039, "global_step": 118356, "epoch": 704} {"train_loss": -10.013171195983887, "global_step": 118357, "epoch": 704} {"train_loss": -10.228392601013184, "global_step": 118358, "epoch": 704} {"train_loss": -10.355958938598633, "global_step": 118359, "epoch": 704} {"train_loss": -10.508411407470703, "global_step": 118360, "epoch": 704} {"train_loss": -10.522890090942383, "global_step": 118361, "epoch": 704} {"train_loss": -10.281587600708008, "global_step": 118362, "epoch": 704} {"train_loss": -10.367572784423828, "global_step": 118363, "epoch": 704} {"train_loss": -10.277504920959473, "global_step": 118364, "epoch": 704} {"train_loss": -10.49321174621582, "global_step": 118365, "epoch": 704} {"train_loss": -10.360343933105469, "global_step": 118366, "epoch": 704} {"train_loss": -9.94751262664795, "global_step": 118367, "epoch": 704} {"train_loss": -10.497308731079102, "global_step": 118368, "epoch": 704} {"train_loss": -10.010897636413574, "global_step": 118369, "epoch": 704} {"train_loss": -10.419731140136719, "global_step": 118370, "epoch": 704} {"train_loss": -9.698261260986328, "global_step": 118371, "epoch": 704} {"train_loss": -9.736428260803223, "global_step": 118372, "epoch": 704} {"train_loss": -10.374689102172852, "global_step": 118373, "epoch": 704} {"train_loss": -9.278895378112793, "global_step": 118374, "epoch": 704} {"train_loss": -9.78774356842041, "global_step": 118375, "epoch": 704} {"train_loss": -10.084775924682617, "global_step": 118376, "epoch": 704} {"train_loss": -9.98533821105957, "global_step": 118377, "epoch": 704} {"train_loss": -10.094114303588867, "global_step": 118378, "epoch": 704} {"train_loss": -9.326786041259766, "global_step": 118379, "epoch": 704} {"train_loss": -10.291418075561523, "global_step": 118380, "epoch": 704} {"train_loss": -9.790570259094238, "global_step": 118381, "epoch": 704} {"train_loss": -10.018218994140625, "global_step": 118382, "epoch": 704} {"train_loss": -10.128491401672363, "global_step": 118383, "epoch": 704} {"train_loss": -9.960550308227539, "global_step": 118384, "epoch": 704} {"train_loss": -10.163717269897461, "global_step": 118385, "epoch": 704} {"train_loss": -10.214741706848145, "global_step": 118386, "epoch": 704} {"train_loss": -10.180554389953613, "global_step": 118387, "epoch": 704} {"train_loss": -10.105390548706055, "global_step": 118388, "epoch": 704} {"train_loss": -10.144577980041504, "global_step": 118389, "epoch": 704} {"train_loss": -10.31039047241211, "global_step": 118390, "epoch": 704} {"train_loss": -10.106501579284668, "global_step": 118391, "epoch": 704} {"train_loss": -10.224231719970703, "global_step": 118392, "epoch": 704} {"train_loss": -9.888957023620605, "global_step": 118393, "epoch": 704} {"train_loss": -10.035606384277344, "global_step": 118394, "epoch": 704} {"train_loss": -9.854220390319824, "global_step": 118395, "epoch": 704} {"train_loss": -10.32111644744873, "global_step": 118396, "epoch": 704} {"train_loss": -10.154805183410645, "global_step": 118397, "epoch": 704} {"train_loss": -10.159310340881348, "global_step": 118398, "epoch": 704} {"train_loss": -10.139023780822754, "global_step": 118399, "epoch": 704} {"train_loss": -10.062509536743164, "global_step": 118400, "epoch": 704} {"train_loss": -10.428339004516602, "global_step": 118401, "epoch": 704} {"train_loss": -10.108491897583008, "global_step": 118402, "epoch": 704} {"train_loss": -10.266733169555664, "global_step": 118403, "epoch": 704} {"train_loss": -10.030537605285645, "global_step": 118404, "epoch": 704} {"train_loss": -10.138761520385742, "global_step": 118405, "epoch": 704} {"train_loss": -10.18198299407959, "global_step": 118406, "epoch": 704} {"train_loss": -10.11953353881836, "global_step": 118407, "epoch": 704} {"train_loss": -10.320976257324219, "global_step": 118408, "epoch": 704} {"train_loss": -10.23373794555664, "global_step": 118409, "epoch": 704} {"train_loss": -9.780850410461426, "global_step": 118410, "epoch": 704} {"train_loss": -10.286331176757812, "global_step": 118411, "epoch": 704} {"train_loss": -9.639824867248535, "global_step": 118412, "epoch": 704} {"train_loss": -10.098078727722168, "global_step": 118413, "epoch": 704} {"train_loss": -9.732967376708984, "global_step": 118414, "epoch": 704} {"train_loss": -10.251152038574219, "global_step": 118415, "epoch": 704} {"train_loss": -9.875710487365723, "global_step": 118416, "epoch": 704} {"train_loss": -10.080591201782227, "global_step": 118417, "epoch": 704} {"train_loss": -10.159906387329102, "global_step": 118418, "epoch": 704} {"train_loss": -10.049603462219238, "global_step": 118419, "epoch": 704} {"train_loss": -10.20813274383545, "global_step": 118420, "epoch": 704} {"train_loss": -10.176702499389648, "global_step": 118421, "epoch": 704} {"train_loss": -10.302754402160645, "global_step": 118422, "epoch": 704} {"train_loss": -10.085088729858398, "global_step": 118423, "epoch": 704} {"train_loss": -10.198419570922852, "global_step": 118424, "epoch": 704} {"train_loss": -10.101152420043945, "global_step": 118425, "epoch": 704} {"train_loss": -10.353472709655762, "global_step": 118426, "epoch": 704} {"train_loss": -10.164926528930664, "global_step": 118427, "epoch": 704} {"train_loss": -10.342979431152344, "global_step": 118428, "epoch": 704} {"train_loss": -9.90172290802002, "global_step": 118429, "epoch": 704} {"train_loss": -9.692785263061523, "global_step": 118430, "epoch": 704} {"train_loss": -10.110496520996094, "global_step": 118431, "epoch": 704} {"train_loss": -9.998117446899414, "global_step": 118432, "epoch": 704} {"train_loss": -10.134742736816406, "global_step": 118433, "epoch": 704} {"train_loss": -9.970867156982422, "global_step": 118434, "epoch": 704} {"train_loss": -10.209044456481934, "global_step": 118435, "epoch": 704} {"train_loss": -9.717519760131836, "global_step": 118436, "epoch": 704} {"train_loss": -10.440486907958984, "global_step": 118437, "epoch": 704} {"train_loss": -9.785618782043457, "global_step": 118438, "epoch": 704} {"train_loss": -10.055122528757368, "global_step": 118439, "epoch": 704, "val_loss": 214238.3125} {"train_loss": -9.60566520690918, "global_step": 118440, "epoch": 705} {"train_loss": -10.098653793334961, "global_step": 118441, "epoch": 705} {"train_loss": -10.110013961791992, "global_step": 118442, "epoch": 705} {"train_loss": -10.111076354980469, "global_step": 118443, "epoch": 705} {"train_loss": -9.903139114379883, "global_step": 118444, "epoch": 705} {"train_loss": -10.168615341186523, "global_step": 118445, "epoch": 705} {"train_loss": -9.46169662475586, "global_step": 118446, "epoch": 705} {"train_loss": -9.770343780517578, "global_step": 118447, "epoch": 705} {"train_loss": -9.585393905639648, "global_step": 118448, "epoch": 705} {"train_loss": -9.717100143432617, "global_step": 118449, "epoch": 705} {"train_loss": -9.642180442810059, "global_step": 118450, "epoch": 705} {"train_loss": -10.030134201049805, "global_step": 118451, "epoch": 705} {"train_loss": -9.47028636932373, "global_step": 118452, "epoch": 705} {"train_loss": -9.903800964355469, "global_step": 118453, "epoch": 705} {"train_loss": -9.7597017288208, "global_step": 118454, "epoch": 705} {"train_loss": -9.569390296936035, "global_step": 118455, "epoch": 705} {"train_loss": -10.076251983642578, "global_step": 118456, "epoch": 705} {"train_loss": -9.906457901000977, "global_step": 118457, "epoch": 705} {"train_loss": -9.840566635131836, "global_step": 118458, "epoch": 705} {"train_loss": -10.23360824584961, "global_step": 118459, "epoch": 705} {"train_loss": -9.926130294799805, "global_step": 118460, "epoch": 705} {"train_loss": -10.02894401550293, "global_step": 118461, "epoch": 705} {"train_loss": -9.920514106750488, "global_step": 118462, "epoch": 705} {"train_loss": -10.162958145141602, "global_step": 118463, "epoch": 705} {"train_loss": -9.81521987915039, "global_step": 118464, "epoch": 705} {"train_loss": -9.955058097839355, "global_step": 118465, "epoch": 705} {"train_loss": -9.906818389892578, "global_step": 118466, "epoch": 705} {"train_loss": -9.929227828979492, "global_step": 118467, "epoch": 705} {"train_loss": -9.92393684387207, "global_step": 118468, "epoch": 705} {"train_loss": -9.873522758483887, "global_step": 118469, "epoch": 705} {"train_loss": -9.854239463806152, "global_step": 118470, "epoch": 705} {"train_loss": -10.283918380737305, "global_step": 118471, "epoch": 705} {"train_loss": -10.04201889038086, "global_step": 118472, "epoch": 705} {"train_loss": -9.768412590026855, "global_step": 118473, "epoch": 705} {"train_loss": -10.123482704162598, "global_step": 118474, "epoch": 705} {"train_loss": -10.062052726745605, "global_step": 118475, "epoch": 705} {"train_loss": -10.121356964111328, "global_step": 118476, "epoch": 705} {"train_loss": -9.891359329223633, "global_step": 118477, "epoch": 705} {"train_loss": -10.239341735839844, "global_step": 118478, "epoch": 705} {"train_loss": -10.087820053100586, "global_step": 118479, "epoch": 705} {"train_loss": -10.314475059509277, "global_step": 118480, "epoch": 705} {"train_loss": -10.319591522216797, "global_step": 118481, "epoch": 705} {"train_loss": -9.984578132629395, "global_step": 118482, "epoch": 705} {"train_loss": -10.331515312194824, "global_step": 118483, "epoch": 705} {"train_loss": -10.287887573242188, "global_step": 118484, "epoch": 705} {"train_loss": -10.192402839660645, "global_step": 118485, "epoch": 705} {"train_loss": -10.422626495361328, "global_step": 118486, "epoch": 705} {"train_loss": -10.203630447387695, "global_step": 118487, "epoch": 705} {"train_loss": -10.358665466308594, "global_step": 118488, "epoch": 705} {"train_loss": -10.341217041015625, "global_step": 118489, "epoch": 705} {"train_loss": -10.190391540527344, "global_step": 118490, "epoch": 705} {"train_loss": -10.083637237548828, "global_step": 118491, "epoch": 705} {"train_loss": -10.457013130187988, "global_step": 118492, "epoch": 705} {"train_loss": -10.205635070800781, "global_step": 118493, "epoch": 705} {"train_loss": -10.324386596679688, "global_step": 118494, "epoch": 705} {"train_loss": -10.284037590026855, "global_step": 118495, "epoch": 705} {"train_loss": -10.466327667236328, "global_step": 118496, "epoch": 705} {"train_loss": -10.190698623657227, "global_step": 118497, "epoch": 705} {"train_loss": -9.930486679077148, "global_step": 118498, "epoch": 705} {"train_loss": -10.218505859375, "global_step": 118499, "epoch": 705} {"train_loss": -10.292072296142578, "global_step": 118500, "epoch": 705} {"train_loss": -10.02015495300293, "global_step": 118501, "epoch": 705} {"train_loss": -9.918421745300293, "global_step": 118502, "epoch": 705} {"train_loss": -10.434416770935059, "global_step": 118503, "epoch": 705} {"train_loss": -10.172836303710938, "global_step": 118504, "epoch": 705} {"train_loss": -10.409536361694336, "global_step": 118505, "epoch": 705} {"train_loss": -10.124698638916016, "global_step": 118506, "epoch": 705} {"train_loss": -10.332733154296875, "global_step": 118507, "epoch": 705} {"train_loss": -9.84754753112793, "global_step": 118508, "epoch": 705} {"train_loss": -10.033966064453125, "global_step": 118509, "epoch": 705} {"train_loss": -9.879908561706543, "global_step": 118510, "epoch": 705} {"train_loss": -9.77192497253418, "global_step": 118511, "epoch": 705} {"train_loss": -10.077104568481445, "global_step": 118512, "epoch": 705} {"train_loss": -9.605155944824219, "global_step": 118513, "epoch": 705} {"train_loss": -9.75074291229248, "global_step": 118514, "epoch": 705} {"train_loss": -10.078888893127441, "global_step": 118515, "epoch": 705} {"train_loss": -9.997457504272461, "global_step": 118516, "epoch": 705} {"train_loss": -10.159881591796875, "global_step": 118517, "epoch": 705} {"train_loss": -10.159311294555664, "global_step": 118518, "epoch": 705} {"train_loss": -9.884543418884277, "global_step": 118519, "epoch": 705} {"train_loss": -9.94467544555664, "global_step": 118520, "epoch": 705} {"train_loss": -10.020543098449707, "global_step": 118521, "epoch": 705} {"train_loss": -9.921010971069336, "global_step": 118522, "epoch": 705} {"train_loss": -9.986642837524414, "global_step": 118523, "epoch": 705} {"train_loss": -9.61512565612793, "global_step": 118524, "epoch": 705} {"train_loss": -9.76677131652832, "global_step": 118525, "epoch": 705} {"train_loss": -9.776512145996094, "global_step": 118526, "epoch": 705} {"train_loss": -9.974267959594727, "global_step": 118527, "epoch": 705} {"train_loss": -10.044656753540039, "global_step": 118528, "epoch": 705} {"train_loss": -9.986328125, "global_step": 118529, "epoch": 705} {"train_loss": -9.902149200439453, "global_step": 118530, "epoch": 705} {"train_loss": -9.582967758178711, "global_step": 118531, "epoch": 705} {"train_loss": -10.072912216186523, "global_step": 118532, "epoch": 705} {"train_loss": -9.595135688781738, "global_step": 118533, "epoch": 705} {"train_loss": -9.7951021194458, "global_step": 118534, "epoch": 705} {"train_loss": -9.926968574523926, "global_step": 118535, "epoch": 705} {"train_loss": -10.297125816345215, "global_step": 118536, "epoch": 705} {"train_loss": -9.93527889251709, "global_step": 118537, "epoch": 705} {"train_loss": -10.114643096923828, "global_step": 118538, "epoch": 705} {"train_loss": -9.791269302368164, "global_step": 118539, "epoch": 705} {"train_loss": -9.794775009155273, "global_step": 118540, "epoch": 705} {"train_loss": -10.230025291442871, "global_step": 118541, "epoch": 705} {"train_loss": -9.948823928833008, "global_step": 118542, "epoch": 705} {"train_loss": -10.105104446411133, "global_step": 118543, "epoch": 705} {"train_loss": -10.202552795410156, "global_step": 118544, "epoch": 705} {"train_loss": -10.217337608337402, "global_step": 118545, "epoch": 705} {"train_loss": -10.022523880004883, "global_step": 118546, "epoch": 705} {"train_loss": -10.308225631713867, "global_step": 118547, "epoch": 705} {"train_loss": -10.103469848632812, "global_step": 118548, "epoch": 705} {"train_loss": -10.109365463256836, "global_step": 118549, "epoch": 705} {"train_loss": -10.13119125366211, "global_step": 118550, "epoch": 705} {"train_loss": -10.411629676818848, "global_step": 118551, "epoch": 705} {"train_loss": -10.107136726379395, "global_step": 118552, "epoch": 705} {"train_loss": -10.22502326965332, "global_step": 118553, "epoch": 705} {"train_loss": -10.364598274230957, "global_step": 118554, "epoch": 705} {"train_loss": -10.095539093017578, "global_step": 118555, "epoch": 705} {"train_loss": -9.947145462036133, "global_step": 118556, "epoch": 705} {"train_loss": -10.22205924987793, "global_step": 118557, "epoch": 705} {"train_loss": -10.20579719543457, "global_step": 118558, "epoch": 705} {"train_loss": -10.251811981201172, "global_step": 118559, "epoch": 705} {"train_loss": -10.266281127929688, "global_step": 118560, "epoch": 705} {"train_loss": -10.162322998046875, "global_step": 118561, "epoch": 705} {"train_loss": -10.27560806274414, "global_step": 118562, "epoch": 705} {"train_loss": -9.917484283447266, "global_step": 118563, "epoch": 705} {"train_loss": -10.049844741821289, "global_step": 118564, "epoch": 705} {"train_loss": -10.160773277282715, "global_step": 118565, "epoch": 705} {"train_loss": -10.124796867370605, "global_step": 118566, "epoch": 705} {"train_loss": -10.20657730102539, "global_step": 118567, "epoch": 705} {"train_loss": -9.996047973632812, "global_step": 118568, "epoch": 705} {"train_loss": -10.245030403137207, "global_step": 118569, "epoch": 705} {"train_loss": -10.233429908752441, "global_step": 118570, "epoch": 705} {"train_loss": -9.973587036132812, "global_step": 118571, "epoch": 705} {"train_loss": -10.160629272460938, "global_step": 118572, "epoch": 705} {"train_loss": -10.100057601928711, "global_step": 118573, "epoch": 705} {"train_loss": -10.120057106018066, "global_step": 118574, "epoch": 705} {"train_loss": -10.246784210205078, "global_step": 118575, "epoch": 705} {"train_loss": -10.297357559204102, "global_step": 118576, "epoch": 705} {"train_loss": -10.125351905822754, "global_step": 118577, "epoch": 705} {"train_loss": -10.322410583496094, "global_step": 118578, "epoch": 705} {"train_loss": -10.231511116027832, "global_step": 118579, "epoch": 705} {"train_loss": -10.239206314086914, "global_step": 118580, "epoch": 705} {"train_loss": -10.291282653808594, "global_step": 118581, "epoch": 705} {"train_loss": -10.505928039550781, "global_step": 118582, "epoch": 705} {"train_loss": -10.409248352050781, "global_step": 118583, "epoch": 705} {"train_loss": -10.077048301696777, "global_step": 118584, "epoch": 705} {"train_loss": -10.254293441772461, "global_step": 118585, "epoch": 705} {"train_loss": -10.228422164916992, "global_step": 118586, "epoch": 705} {"train_loss": -10.553925514221191, "global_step": 118587, "epoch": 705} {"train_loss": -10.156526565551758, "global_step": 118588, "epoch": 705} {"train_loss": -10.470239639282227, "global_step": 118589, "epoch": 705} {"train_loss": -9.949159622192383, "global_step": 118590, "epoch": 705} {"train_loss": -10.25699234008789, "global_step": 118591, "epoch": 705} {"train_loss": -10.091794967651367, "global_step": 118592, "epoch": 705} {"train_loss": -10.135507583618164, "global_step": 118593, "epoch": 705} {"train_loss": -10.013956069946289, "global_step": 118594, "epoch": 705} {"train_loss": -9.938838958740234, "global_step": 118595, "epoch": 705} {"train_loss": -10.131455421447754, "global_step": 118596, "epoch": 705} {"train_loss": -9.941021919250488, "global_step": 118597, "epoch": 705} {"train_loss": -10.16238021850586, "global_step": 118598, "epoch": 705} {"train_loss": -10.193693161010742, "global_step": 118599, "epoch": 705} {"train_loss": -10.247138977050781, "global_step": 118600, "epoch": 705} {"train_loss": -10.412888526916504, "global_step": 118601, "epoch": 705} {"train_loss": -10.173782348632812, "global_step": 118602, "epoch": 705} {"train_loss": -10.202200889587402, "global_step": 118603, "epoch": 705} {"train_loss": -10.316888809204102, "global_step": 118604, "epoch": 705} {"train_loss": -10.424511909484863, "global_step": 118605, "epoch": 705} {"train_loss": -10.182004928588867, "global_step": 118606, "epoch": 705} {"train_loss": -10.080086089315868, "global_step": 118607, "epoch": 705, "val_loss": 214926.453125, "train_action_mse_error": 3.688042640686035} {"train_loss": -10.304204940795898, "global_step": 118608, "epoch": 706} {"train_loss": -10.379486083984375, "global_step": 118609, "epoch": 706} {"train_loss": -10.399853706359863, "global_step": 118610, "epoch": 706} {"train_loss": -10.22354793548584, "global_step": 118611, "epoch": 706} {"train_loss": -10.528938293457031, "global_step": 118612, "epoch": 706} {"train_loss": -10.25019645690918, "global_step": 118613, "epoch": 706} {"train_loss": -10.101846694946289, "global_step": 118614, "epoch": 706} {"train_loss": -10.286301612854004, "global_step": 118615, "epoch": 706} {"train_loss": -10.28162956237793, "global_step": 118616, "epoch": 706} {"train_loss": -10.07844352722168, "global_step": 118617, "epoch": 706} {"train_loss": -10.288369178771973, "global_step": 118618, "epoch": 706} {"train_loss": -10.321599960327148, "global_step": 118619, "epoch": 706} {"train_loss": -10.244731903076172, "global_step": 118620, "epoch": 706} {"train_loss": -10.334769248962402, "global_step": 118621, "epoch": 706} {"train_loss": -10.326841354370117, "global_step": 118622, "epoch": 706} {"train_loss": -10.413867950439453, "global_step": 118623, "epoch": 706} {"train_loss": -10.218973159790039, "global_step": 118624, "epoch": 706} {"train_loss": -10.594720840454102, "global_step": 118625, "epoch": 706} {"train_loss": -10.252801895141602, "global_step": 118626, "epoch": 706} {"train_loss": -10.358297348022461, "global_step": 118627, "epoch": 706} {"train_loss": -10.324481010437012, "global_step": 118628, "epoch": 706} {"train_loss": -10.020415306091309, "global_step": 118629, "epoch": 706} {"train_loss": -10.314192771911621, "global_step": 118630, "epoch": 706} {"train_loss": -10.061386108398438, "global_step": 118631, "epoch": 706} {"train_loss": -10.355423927307129, "global_step": 118632, "epoch": 706} {"train_loss": -9.810770034790039, "global_step": 118633, "epoch": 706} {"train_loss": -10.049205780029297, "global_step": 118634, "epoch": 706} {"train_loss": -10.140127182006836, "global_step": 118635, "epoch": 706} {"train_loss": -10.12796688079834, "global_step": 118636, "epoch": 706} {"train_loss": -10.172937393188477, "global_step": 118637, "epoch": 706} {"train_loss": -10.153534889221191, "global_step": 118638, "epoch": 706} {"train_loss": -10.051766395568848, "global_step": 118639, "epoch": 706} {"train_loss": -9.961555480957031, "global_step": 118640, "epoch": 706} {"train_loss": -10.130891799926758, "global_step": 118641, "epoch": 706} {"train_loss": -9.98341178894043, "global_step": 118642, "epoch": 706} {"train_loss": -9.668222427368164, "global_step": 118643, "epoch": 706} {"train_loss": -10.275566101074219, "global_step": 118644, "epoch": 706} {"train_loss": -9.613637924194336, "global_step": 118645, "epoch": 706} {"train_loss": -10.211503028869629, "global_step": 118646, "epoch": 706} {"train_loss": -9.671415328979492, "global_step": 118647, "epoch": 706} {"train_loss": -9.73686408996582, "global_step": 118648, "epoch": 706} {"train_loss": -9.954448699951172, "global_step": 118649, "epoch": 706} {"train_loss": -9.533880233764648, "global_step": 118650, "epoch": 706} {"train_loss": -10.067642211914062, "global_step": 118651, "epoch": 706} {"train_loss": -8.680455207824707, "global_step": 118652, "epoch": 706} {"train_loss": -10.009819984436035, "global_step": 118653, "epoch": 706} {"train_loss": -9.766449928283691, "global_step": 118654, "epoch": 706} {"train_loss": -10.021284103393555, "global_step": 118655, "epoch": 706} {"train_loss": -10.011048316955566, "global_step": 118656, "epoch": 706} {"train_loss": -10.124485969543457, "global_step": 118657, "epoch": 706} {"train_loss": -10.184021949768066, "global_step": 118658, "epoch": 706} {"train_loss": -9.969671249389648, "global_step": 118659, "epoch": 706} {"train_loss": -10.110664367675781, "global_step": 118660, "epoch": 706} {"train_loss": -10.265886306762695, "global_step": 118661, "epoch": 706} {"train_loss": -10.106254577636719, "global_step": 118662, "epoch": 706} {"train_loss": -10.042993545532227, "global_step": 118663, "epoch": 706} {"train_loss": -10.327444076538086, "global_step": 118664, "epoch": 706} {"train_loss": -10.056939125061035, "global_step": 118665, "epoch": 706} {"train_loss": -10.185819625854492, "global_step": 118666, "epoch": 706} {"train_loss": -9.818418502807617, "global_step": 118667, "epoch": 706} {"train_loss": -10.182668685913086, "global_step": 118668, "epoch": 706} {"train_loss": -9.822921752929688, "global_step": 118669, "epoch": 706} {"train_loss": -10.041574478149414, "global_step": 118670, "epoch": 706} {"train_loss": -9.899114608764648, "global_step": 118671, "epoch": 706} {"train_loss": -10.087076187133789, "global_step": 118672, "epoch": 706} {"train_loss": -9.914535522460938, "global_step": 118673, "epoch": 706} {"train_loss": -10.06155014038086, "global_step": 118674, "epoch": 706} {"train_loss": -10.201530456542969, "global_step": 118675, "epoch": 706} {"train_loss": -10.293296813964844, "global_step": 118676, "epoch": 706} {"train_loss": -10.106693267822266, "global_step": 118677, "epoch": 706} {"train_loss": -9.949939727783203, "global_step": 118678, "epoch": 706} {"train_loss": -9.955543518066406, "global_step": 118679, "epoch": 706} {"train_loss": -9.903772354125977, "global_step": 118680, "epoch": 706} {"train_loss": -10.141019821166992, "global_step": 118681, "epoch": 706} {"train_loss": -10.148824691772461, "global_step": 118682, "epoch": 706} {"train_loss": -9.860590934753418, "global_step": 118683, "epoch": 706} {"train_loss": -9.703991889953613, "global_step": 118684, "epoch": 706} {"train_loss": -9.776369094848633, "global_step": 118685, "epoch": 706} {"train_loss": -10.226717948913574, "global_step": 118686, "epoch": 706} {"train_loss": -9.4769287109375, "global_step": 118687, "epoch": 706} {"train_loss": -10.156097412109375, "global_step": 118688, "epoch": 706} {"train_loss": -9.535074234008789, "global_step": 118689, "epoch": 706} {"train_loss": -10.223742485046387, "global_step": 118690, "epoch": 706} {"train_loss": -9.6904296875, "global_step": 118691, "epoch": 706} {"train_loss": -9.97384262084961, "global_step": 118692, "epoch": 706} {"train_loss": -9.959710121154785, "global_step": 118693, "epoch": 706} {"train_loss": -10.222132682800293, "global_step": 118694, "epoch": 706} {"train_loss": -10.133096694946289, "global_step": 118695, "epoch": 706} {"train_loss": -10.141197204589844, "global_step": 118696, "epoch": 706} {"train_loss": -10.217296600341797, "global_step": 118697, "epoch": 706} {"train_loss": -10.161725997924805, "global_step": 118698, "epoch": 706} {"train_loss": -9.985923767089844, "global_step": 118699, "epoch": 706} {"train_loss": -10.356636047363281, "global_step": 118700, "epoch": 706} {"train_loss": -10.121813774108887, "global_step": 118701, "epoch": 706} {"train_loss": -10.405820846557617, "global_step": 118702, "epoch": 706} {"train_loss": -10.300569534301758, "global_step": 118703, "epoch": 706} {"train_loss": -10.288423538208008, "global_step": 118704, "epoch": 706} {"train_loss": -10.22726058959961, "global_step": 118705, "epoch": 706} {"train_loss": -10.07255744934082, "global_step": 118706, "epoch": 706} {"train_loss": -10.19940185546875, "global_step": 118707, "epoch": 706} {"train_loss": -10.363184928894043, "global_step": 118708, "epoch": 706} {"train_loss": -9.864623069763184, "global_step": 118709, "epoch": 706} {"train_loss": -10.280603408813477, "global_step": 118710, "epoch": 706} {"train_loss": -10.402412414550781, "global_step": 118711, "epoch": 706} {"train_loss": -10.293174743652344, "global_step": 118712, "epoch": 706} {"train_loss": -10.222837448120117, "global_step": 118713, "epoch": 706} {"train_loss": -10.259695053100586, "global_step": 118714, "epoch": 706} {"train_loss": -10.285836219787598, "global_step": 118715, "epoch": 706} {"train_loss": -10.326591491699219, "global_step": 118716, "epoch": 706} {"train_loss": -10.378152847290039, "global_step": 118717, "epoch": 706} {"train_loss": -10.191919326782227, "global_step": 118718, "epoch": 706} {"train_loss": -10.183507919311523, "global_step": 118719, "epoch": 706} {"train_loss": -10.514612197875977, "global_step": 118720, "epoch": 706} {"train_loss": -10.148435592651367, "global_step": 118721, "epoch": 706} {"train_loss": -10.171833038330078, "global_step": 118722, "epoch": 706} {"train_loss": -10.28797721862793, "global_step": 118723, "epoch": 706} {"train_loss": -9.848451614379883, "global_step": 118724, "epoch": 706} {"train_loss": -10.423757553100586, "global_step": 118725, "epoch": 706} {"train_loss": -9.783060073852539, "global_step": 118726, "epoch": 706} {"train_loss": -10.602458953857422, "global_step": 118727, "epoch": 706} {"train_loss": -10.148019790649414, "global_step": 118728, "epoch": 706} {"train_loss": -10.28743839263916, "global_step": 118729, "epoch": 706} {"train_loss": -10.432384490966797, "global_step": 118730, "epoch": 706} {"train_loss": -10.086507797241211, "global_step": 118731, "epoch": 706} {"train_loss": -10.094954490661621, "global_step": 118732, "epoch": 706} {"train_loss": -10.472768783569336, "global_step": 118733, "epoch": 706} {"train_loss": -10.251733779907227, "global_step": 118734, "epoch": 706} {"train_loss": -10.040538787841797, "global_step": 118735, "epoch": 706} {"train_loss": -9.985880851745605, "global_step": 118736, "epoch": 706} {"train_loss": -10.026091575622559, "global_step": 118737, "epoch": 706} {"train_loss": -9.62748908996582, "global_step": 118738, "epoch": 706} {"train_loss": -9.926025390625, "global_step": 118739, "epoch": 706} {"train_loss": -9.776708602905273, "global_step": 118740, "epoch": 706} {"train_loss": -9.775717735290527, "global_step": 118741, "epoch": 706} {"train_loss": -10.106786727905273, "global_step": 118742, "epoch": 706} {"train_loss": -10.009435653686523, "global_step": 118743, "epoch": 706} {"train_loss": -9.64999008178711, "global_step": 118744, "epoch": 706} {"train_loss": -10.121901512145996, "global_step": 118745, "epoch": 706} {"train_loss": -9.846959114074707, "global_step": 118746, "epoch": 706} {"train_loss": -10.259208679199219, "global_step": 118747, "epoch": 706} {"train_loss": -9.803173065185547, "global_step": 118748, "epoch": 706} {"train_loss": -9.924625396728516, "global_step": 118749, "epoch": 706} {"train_loss": -9.790843963623047, "global_step": 118750, "epoch": 706} {"train_loss": -9.740607261657715, "global_step": 118751, "epoch": 706} {"train_loss": -10.030879020690918, "global_step": 118752, "epoch": 706} {"train_loss": -9.518138885498047, "global_step": 118753, "epoch": 706} {"train_loss": -9.859573364257812, "global_step": 118754, "epoch": 706} {"train_loss": -9.680220603942871, "global_step": 118755, "epoch": 706} {"train_loss": -9.761796951293945, "global_step": 118756, "epoch": 706} {"train_loss": -9.686809539794922, "global_step": 118757, "epoch": 706} {"train_loss": -9.643060684204102, "global_step": 118758, "epoch": 706} {"train_loss": -8.976102828979492, "global_step": 118759, "epoch": 706} {"train_loss": -9.589001655578613, "global_step": 118760, "epoch": 706} {"train_loss": -9.404386520385742, "global_step": 118761, "epoch": 706} {"train_loss": -9.622551918029785, "global_step": 118762, "epoch": 706} {"train_loss": -9.156488418579102, "global_step": 118763, "epoch": 706} {"train_loss": -9.849966049194336, "global_step": 118764, "epoch": 706} {"train_loss": -8.952238082885742, "global_step": 118765, "epoch": 706} {"train_loss": -10.151519775390625, "global_step": 118766, "epoch": 706} {"train_loss": -9.090736389160156, "global_step": 118767, "epoch": 706} {"train_loss": -9.677425384521484, "global_step": 118768, "epoch": 706} {"train_loss": -9.624969482421875, "global_step": 118769, "epoch": 706} {"train_loss": -9.095664024353027, "global_step": 118770, "epoch": 706} {"train_loss": -10.101303100585938, "global_step": 118771, "epoch": 706} {"train_loss": -9.4750394821167, "global_step": 118772, "epoch": 706} {"train_loss": -9.74592399597168, "global_step": 118773, "epoch": 706} {"train_loss": -10.077207565307617, "global_step": 118774, "epoch": 706} {"train_loss": -10.02357067948296, "global_step": 118775, "epoch": 706, "val_loss": 212876.09375} {"train_loss": -9.597505569458008, "global_step": 118776, "epoch": 707} {"train_loss": -9.523456573486328, "global_step": 118777, "epoch": 707} {"train_loss": -9.78387451171875, "global_step": 118778, "epoch": 707} {"train_loss": -9.47146987915039, "global_step": 118779, "epoch": 707} {"train_loss": -9.600730895996094, "global_step": 118780, "epoch": 707} {"train_loss": -9.531116485595703, "global_step": 118781, "epoch": 707} {"train_loss": -9.727982521057129, "global_step": 118782, "epoch": 707} {"train_loss": -10.025064468383789, "global_step": 118783, "epoch": 707} {"train_loss": -9.595111846923828, "global_step": 118784, "epoch": 707} {"train_loss": -9.87110424041748, "global_step": 118785, "epoch": 707} {"train_loss": -9.955862998962402, "global_step": 118786, "epoch": 707} {"train_loss": -9.769298553466797, "global_step": 118787, "epoch": 707} {"train_loss": -9.920188903808594, "global_step": 118788, "epoch": 707} {"train_loss": -10.057518005371094, "global_step": 118789, "epoch": 707} {"train_loss": -9.868809700012207, "global_step": 118790, "epoch": 707} {"train_loss": -10.00560474395752, "global_step": 118791, "epoch": 707} {"train_loss": -9.931407928466797, "global_step": 118792, "epoch": 707} {"train_loss": -10.07424259185791, "global_step": 118793, "epoch": 707} {"train_loss": -9.720769882202148, "global_step": 118794, "epoch": 707} {"train_loss": -10.12582778930664, "global_step": 118795, "epoch": 707} {"train_loss": -10.055755615234375, "global_step": 118796, "epoch": 707} {"train_loss": -10.127507209777832, "global_step": 118797, "epoch": 707} {"train_loss": -10.045223236083984, "global_step": 118798, "epoch": 707} {"train_loss": -10.304607391357422, "global_step": 118799, "epoch": 707} {"train_loss": -10.168842315673828, "global_step": 118800, "epoch": 707} {"train_loss": -9.867669105529785, "global_step": 118801, "epoch": 707} {"train_loss": -10.247611999511719, "global_step": 118802, "epoch": 707} {"train_loss": -10.174592018127441, "global_step": 118803, "epoch": 707} {"train_loss": -10.2130765914917, "global_step": 118804, "epoch": 707} {"train_loss": -10.353103637695312, "global_step": 118805, "epoch": 707} {"train_loss": -9.954388618469238, "global_step": 118806, "epoch": 707} {"train_loss": -9.848535537719727, "global_step": 118807, "epoch": 707} {"train_loss": -10.315044403076172, "global_step": 118808, "epoch": 707} {"train_loss": -9.952686309814453, "global_step": 118809, "epoch": 707} {"train_loss": -10.04216194152832, "global_step": 118810, "epoch": 707} {"train_loss": -9.965816497802734, "global_step": 118811, "epoch": 707} {"train_loss": -10.175292015075684, "global_step": 118812, "epoch": 707} {"train_loss": -10.206094741821289, "global_step": 118813, "epoch": 707} {"train_loss": -10.211523056030273, "global_step": 118814, "epoch": 707} {"train_loss": -9.945558547973633, "global_step": 118815, "epoch": 707} {"train_loss": -10.148612976074219, "global_step": 118816, "epoch": 707} {"train_loss": -10.199853897094727, "global_step": 118817, "epoch": 707} {"train_loss": -10.212024688720703, "global_step": 118818, "epoch": 707} {"train_loss": -10.206987380981445, "global_step": 118819, "epoch": 707} {"train_loss": -10.17391586303711, "global_step": 118820, "epoch": 707} {"train_loss": -10.194421768188477, "global_step": 118821, "epoch": 707} {"train_loss": -10.308469772338867, "global_step": 118822, "epoch": 707} {"train_loss": -9.871315002441406, "global_step": 118823, "epoch": 707} {"train_loss": -10.318689346313477, "global_step": 118824, "epoch": 707} {"train_loss": -10.205294609069824, "global_step": 118825, "epoch": 707} {"train_loss": -10.190248489379883, "global_step": 118826, "epoch": 707} {"train_loss": -10.337882995605469, "global_step": 118827, "epoch": 707} {"train_loss": -10.024253845214844, "global_step": 118828, "epoch": 707} {"train_loss": -10.122371673583984, "global_step": 118829, "epoch": 707} {"train_loss": -10.11419677734375, "global_step": 118830, "epoch": 707} {"train_loss": -9.884326934814453, "global_step": 118831, "epoch": 707} {"train_loss": -10.095067977905273, "global_step": 118832, "epoch": 707} {"train_loss": -10.12841796875, "global_step": 118833, "epoch": 707} {"train_loss": -9.907318115234375, "global_step": 118834, "epoch": 707} {"train_loss": -10.175901412963867, "global_step": 118835, "epoch": 707} {"train_loss": -10.07442855834961, "global_step": 118836, "epoch": 707} {"train_loss": -9.999261856079102, "global_step": 118837, "epoch": 707} {"train_loss": -10.312527656555176, "global_step": 118838, "epoch": 707} {"train_loss": -10.195480346679688, "global_step": 118839, "epoch": 707} {"train_loss": -10.100951194763184, "global_step": 118840, "epoch": 707} {"train_loss": -10.438726425170898, "global_step": 118841, "epoch": 707} {"train_loss": -9.721268653869629, "global_step": 118842, "epoch": 707} {"train_loss": -10.278499603271484, "global_step": 118843, "epoch": 707} {"train_loss": -9.9492826461792, "global_step": 118844, "epoch": 707} {"train_loss": -10.259828567504883, "global_step": 118845, "epoch": 707} {"train_loss": -10.150711059570312, "global_step": 118846, "epoch": 707} {"train_loss": -9.808891296386719, "global_step": 118847, "epoch": 707} {"train_loss": -9.945978164672852, "global_step": 118848, "epoch": 707} {"train_loss": -10.142836570739746, "global_step": 118849, "epoch": 707} {"train_loss": -10.329959869384766, "global_step": 118850, "epoch": 707} {"train_loss": -10.180131912231445, "global_step": 118851, "epoch": 707} {"train_loss": -10.0379638671875, "global_step": 118852, "epoch": 707} {"train_loss": -10.286523818969727, "global_step": 118853, "epoch": 707} {"train_loss": -10.12899398803711, "global_step": 118854, "epoch": 707} {"train_loss": -10.172128677368164, "global_step": 118855, "epoch": 707} {"train_loss": -9.857739448547363, "global_step": 118856, "epoch": 707} {"train_loss": -9.922243118286133, "global_step": 118857, "epoch": 707} {"train_loss": -10.092411041259766, "global_step": 118858, "epoch": 707} {"train_loss": -10.016751289367676, "global_step": 118859, "epoch": 707} {"train_loss": -10.212891578674316, "global_step": 118860, "epoch": 707} {"train_loss": -10.080242156982422, "global_step": 118861, "epoch": 707} {"train_loss": -10.067146301269531, "global_step": 118862, "epoch": 707} {"train_loss": -10.082491874694824, "global_step": 118863, "epoch": 707} {"train_loss": -10.481325149536133, "global_step": 118864, "epoch": 707} {"train_loss": -10.22258472442627, "global_step": 118865, "epoch": 707} {"train_loss": -10.330551147460938, "global_step": 118866, "epoch": 707} {"train_loss": -10.081900596618652, "global_step": 118867, "epoch": 707} {"train_loss": -10.097965240478516, "global_step": 118868, "epoch": 707} {"train_loss": -10.026314735412598, "global_step": 118869, "epoch": 707} {"train_loss": -10.252321243286133, "global_step": 118870, "epoch": 707} {"train_loss": -10.229079246520996, "global_step": 118871, "epoch": 707} {"train_loss": -10.478882789611816, "global_step": 118872, "epoch": 707} {"train_loss": -10.095585823059082, "global_step": 118873, "epoch": 707} {"train_loss": -10.199853897094727, "global_step": 118874, "epoch": 707} {"train_loss": -10.468438148498535, "global_step": 118875, "epoch": 707} {"train_loss": -10.126604080200195, "global_step": 118876, "epoch": 707} {"train_loss": -10.281937599182129, "global_step": 118877, "epoch": 707} {"train_loss": -9.633569717407227, "global_step": 118878, "epoch": 707} {"train_loss": -9.856605529785156, "global_step": 118879, "epoch": 707} {"train_loss": -10.006030082702637, "global_step": 118880, "epoch": 707} {"train_loss": -9.981147766113281, "global_step": 118881, "epoch": 707} {"train_loss": -10.113472938537598, "global_step": 118882, "epoch": 707} {"train_loss": -9.883222579956055, "global_step": 118883, "epoch": 707} {"train_loss": -9.884221076965332, "global_step": 118884, "epoch": 707} {"train_loss": -9.828812599182129, "global_step": 118885, "epoch": 707} {"train_loss": -9.86824893951416, "global_step": 118886, "epoch": 707} {"train_loss": -9.547496795654297, "global_step": 118887, "epoch": 707} {"train_loss": -10.087335586547852, "global_step": 118888, "epoch": 707} {"train_loss": -9.765929222106934, "global_step": 118889, "epoch": 707} {"train_loss": -10.107162475585938, "global_step": 118890, "epoch": 707} {"train_loss": -9.811590194702148, "global_step": 118891, "epoch": 707} {"train_loss": -10.108148574829102, "global_step": 118892, "epoch": 707} {"train_loss": -10.03320026397705, "global_step": 118893, "epoch": 707} {"train_loss": -9.927857398986816, "global_step": 118894, "epoch": 707} {"train_loss": -9.739663124084473, "global_step": 118895, "epoch": 707} {"train_loss": -10.085472106933594, "global_step": 118896, "epoch": 707} {"train_loss": -9.887290954589844, "global_step": 118897, "epoch": 707} {"train_loss": -9.86760139465332, "global_step": 118898, "epoch": 707} {"train_loss": -10.112922668457031, "global_step": 118899, "epoch": 707} {"train_loss": -9.878625869750977, "global_step": 118900, "epoch": 707} {"train_loss": -10.134313583374023, "global_step": 118901, "epoch": 707} {"train_loss": -9.965066909790039, "global_step": 118902, "epoch": 707} {"train_loss": -10.045716285705566, "global_step": 118903, "epoch": 707} {"train_loss": -9.796184539794922, "global_step": 118904, "epoch": 707} {"train_loss": -9.95683479309082, "global_step": 118905, "epoch": 707} {"train_loss": -10.020120620727539, "global_step": 118906, "epoch": 707} {"train_loss": -9.877753257751465, "global_step": 118907, "epoch": 707} {"train_loss": -9.957149505615234, "global_step": 118908, "epoch": 707} {"train_loss": -10.048364639282227, "global_step": 118909, "epoch": 707} {"train_loss": -9.889827728271484, "global_step": 118910, "epoch": 707} {"train_loss": -9.873254776000977, "global_step": 118911, "epoch": 707} {"train_loss": -10.193592071533203, "global_step": 118912, "epoch": 707} {"train_loss": -10.025188446044922, "global_step": 118913, "epoch": 707} {"train_loss": -9.912288665771484, "global_step": 118914, "epoch": 707} {"train_loss": -9.90120792388916, "global_step": 118915, "epoch": 707} {"train_loss": -9.75378704071045, "global_step": 118916, "epoch": 707} {"train_loss": -9.974319458007812, "global_step": 118917, "epoch": 707} {"train_loss": -9.828058242797852, "global_step": 118918, "epoch": 707} {"train_loss": -9.974056243896484, "global_step": 118919, "epoch": 707} {"train_loss": -10.036250114440918, "global_step": 118920, "epoch": 707} {"train_loss": -10.185272216796875, "global_step": 118921, "epoch": 707} {"train_loss": -9.924454689025879, "global_step": 118922, "epoch": 707} {"train_loss": -10.445481300354004, "global_step": 118923, "epoch": 707} {"train_loss": -9.796557426452637, "global_step": 118924, "epoch": 707} {"train_loss": -10.239449501037598, "global_step": 118925, "epoch": 707} {"train_loss": -9.979493141174316, "global_step": 118926, "epoch": 707} {"train_loss": -10.251947402954102, "global_step": 118927, "epoch": 707} {"train_loss": -9.897869110107422, "global_step": 118928, "epoch": 707} {"train_loss": -10.17261028289795, "global_step": 118929, "epoch": 707} {"train_loss": -10.026451110839844, "global_step": 118930, "epoch": 707} {"train_loss": -10.081570625305176, "global_step": 118931, "epoch": 707} {"train_loss": -10.067138671875, "global_step": 118932, "epoch": 707} {"train_loss": -10.331531524658203, "global_step": 118933, "epoch": 707} {"train_loss": -10.202062606811523, "global_step": 118934, "epoch": 707} {"train_loss": -10.461897850036621, "global_step": 118935, "epoch": 707} {"train_loss": -10.442239761352539, "global_step": 118936, "epoch": 707} {"train_loss": -10.48702621459961, "global_step": 118937, "epoch": 707} {"train_loss": -10.344583511352539, "global_step": 118938, "epoch": 707} {"train_loss": -10.204296112060547, "global_step": 118939, "epoch": 707} {"train_loss": -10.334196090698242, "global_step": 118940, "epoch": 707} {"train_loss": -10.26833724975586, "global_step": 118941, "epoch": 707} {"train_loss": -10.343304634094238, "global_step": 118942, "epoch": 707} {"train_loss": -10.054693818092346, "global_step": 118943, "epoch": 707, "val_loss": 214540.015625} {"train_loss": -10.415912628173828, "global_step": 118944, "epoch": 708} {"train_loss": -10.216043472290039, "global_step": 118945, "epoch": 708} {"train_loss": -10.2703275680542, "global_step": 118946, "epoch": 708} {"train_loss": -10.376361846923828, "global_step": 118947, "epoch": 708} {"train_loss": -9.986141204833984, "global_step": 118948, "epoch": 708} {"train_loss": -10.378334999084473, "global_step": 118949, "epoch": 708} {"train_loss": -10.10041618347168, "global_step": 118950, "epoch": 708} {"train_loss": -10.052618026733398, "global_step": 118951, "epoch": 708} {"train_loss": -10.19145393371582, "global_step": 118952, "epoch": 708} {"train_loss": -9.693202018737793, "global_step": 118953, "epoch": 708} {"train_loss": -10.132675170898438, "global_step": 118954, "epoch": 708} {"train_loss": -9.800573348999023, "global_step": 118955, "epoch": 708} {"train_loss": -9.666757583618164, "global_step": 118956, "epoch": 708} {"train_loss": -10.431364059448242, "global_step": 118957, "epoch": 708} {"train_loss": -9.548680305480957, "global_step": 118958, "epoch": 708} {"train_loss": -10.06797981262207, "global_step": 118959, "epoch": 708} {"train_loss": -10.290678024291992, "global_step": 118960, "epoch": 708} {"train_loss": -9.938697814941406, "global_step": 118961, "epoch": 708} {"train_loss": -10.178018569946289, "global_step": 118962, "epoch": 708} {"train_loss": -10.152740478515625, "global_step": 118963, "epoch": 708} {"train_loss": -10.033493041992188, "global_step": 118964, "epoch": 708} {"train_loss": -10.189664840698242, "global_step": 118965, "epoch": 708} {"train_loss": -10.030073165893555, "global_step": 118966, "epoch": 708} {"train_loss": -10.135400772094727, "global_step": 118967, "epoch": 708} {"train_loss": -9.938631057739258, "global_step": 118968, "epoch": 708} {"train_loss": -10.04515266418457, "global_step": 118969, "epoch": 708} {"train_loss": -10.10991382598877, "global_step": 118970, "epoch": 708} {"train_loss": -9.840188980102539, "global_step": 118971, "epoch": 708} {"train_loss": -9.959270477294922, "global_step": 118972, "epoch": 708} {"train_loss": -9.696571350097656, "global_step": 118973, "epoch": 708} {"train_loss": -10.102542877197266, "global_step": 118974, "epoch": 708} {"train_loss": -10.05521011352539, "global_step": 118975, "epoch": 708} {"train_loss": -9.82513427734375, "global_step": 118976, "epoch": 708} {"train_loss": -9.908825874328613, "global_step": 118977, "epoch": 708} {"train_loss": -10.047800064086914, "global_step": 118978, "epoch": 708} {"train_loss": -9.910551071166992, "global_step": 118979, "epoch": 708} {"train_loss": -9.954599380493164, "global_step": 118980, "epoch": 708} {"train_loss": -10.041149139404297, "global_step": 118981, "epoch": 708} {"train_loss": -9.874099731445312, "global_step": 118982, "epoch": 708} {"train_loss": -10.057838439941406, "global_step": 118983, "epoch": 708} {"train_loss": -10.17921257019043, "global_step": 118984, "epoch": 708} {"train_loss": -9.93050765991211, "global_step": 118985, "epoch": 708} {"train_loss": -10.318204879760742, "global_step": 118986, "epoch": 708} {"train_loss": -10.146512985229492, "global_step": 118987, "epoch": 708} {"train_loss": -10.242013931274414, "global_step": 118988, "epoch": 708} {"train_loss": -10.34615707397461, "global_step": 118989, "epoch": 708} {"train_loss": -10.224283218383789, "global_step": 118990, "epoch": 708} {"train_loss": -10.272218704223633, "global_step": 118991, "epoch": 708} {"train_loss": -10.148712158203125, "global_step": 118992, "epoch": 708} {"train_loss": -10.143425941467285, "global_step": 118993, "epoch": 708} {"train_loss": -10.264305114746094, "global_step": 118994, "epoch": 708} {"train_loss": -10.367837905883789, "global_step": 118995, "epoch": 708} {"train_loss": -10.177000045776367, "global_step": 118996, "epoch": 708} {"train_loss": -10.36013126373291, "global_step": 118997, "epoch": 708} {"train_loss": -10.56754207611084, "global_step": 118998, "epoch": 708} {"train_loss": -10.35096549987793, "global_step": 118999, "epoch": 708} {"train_loss": -10.384597778320312, "global_step": 119000, "epoch": 708} {"train_loss": -10.185226440429688, "global_step": 119001, "epoch": 708} {"train_loss": -10.336813926696777, "global_step": 119002, "epoch": 708} {"train_loss": -10.435463905334473, "global_step": 119003, "epoch": 708} {"train_loss": -10.469002723693848, "global_step": 119004, "epoch": 708} {"train_loss": -10.257623672485352, "global_step": 119005, "epoch": 708} {"train_loss": -10.359102249145508, "global_step": 119006, "epoch": 708} {"train_loss": -10.432425498962402, "global_step": 119007, "epoch": 708} {"train_loss": -10.370218276977539, "global_step": 119008, "epoch": 708} {"train_loss": -10.534366607666016, "global_step": 119009, "epoch": 708} {"train_loss": -10.340646743774414, "global_step": 119010, "epoch": 708} {"train_loss": -10.226676940917969, "global_step": 119011, "epoch": 708} {"train_loss": -10.209531784057617, "global_step": 119012, "epoch": 708} {"train_loss": -10.190359115600586, "global_step": 119013, "epoch": 708} {"train_loss": -10.398193359375, "global_step": 119014, "epoch": 708} {"train_loss": -9.944421768188477, "global_step": 119015, "epoch": 708} {"train_loss": -9.652551651000977, "global_step": 119016, "epoch": 708} {"train_loss": -9.848430633544922, "global_step": 119017, "epoch": 708} {"train_loss": -9.893427848815918, "global_step": 119018, "epoch": 708} {"train_loss": -9.983922958374023, "global_step": 119019, "epoch": 708} {"train_loss": -10.150379180908203, "global_step": 119020, "epoch": 708} {"train_loss": -10.275968551635742, "global_step": 119021, "epoch": 708} {"train_loss": -9.632848739624023, "global_step": 119022, "epoch": 708} {"train_loss": -10.406290054321289, "global_step": 119023, "epoch": 708} {"train_loss": -9.953306198120117, "global_step": 119024, "epoch": 708} {"train_loss": -9.817319869995117, "global_step": 119025, "epoch": 708} {"train_loss": -10.214457511901855, "global_step": 119026, "epoch": 708} {"train_loss": -10.013752937316895, "global_step": 119027, "epoch": 708} {"train_loss": -10.162446975708008, "global_step": 119028, "epoch": 708} {"train_loss": -9.97845458984375, "global_step": 119029, "epoch": 708} {"train_loss": -10.08487319946289, "global_step": 119030, "epoch": 708} {"train_loss": -9.966764450073242, "global_step": 119031, "epoch": 708} {"train_loss": -10.141197204589844, "global_step": 119032, "epoch": 708} {"train_loss": -9.990511894226074, "global_step": 119033, "epoch": 708} {"train_loss": -10.261283874511719, "global_step": 119034, "epoch": 708} {"train_loss": -10.060853958129883, "global_step": 119035, "epoch": 708} {"train_loss": -10.191865921020508, "global_step": 119036, "epoch": 708} {"train_loss": -10.311071395874023, "global_step": 119037, "epoch": 708} {"train_loss": -10.073341369628906, "global_step": 119038, "epoch": 708} {"train_loss": -10.329084396362305, "global_step": 119039, "epoch": 708} {"train_loss": -10.267143249511719, "global_step": 119040, "epoch": 708} {"train_loss": -10.18765640258789, "global_step": 119041, "epoch": 708} {"train_loss": -10.052480697631836, "global_step": 119042, "epoch": 708} {"train_loss": -10.054384231567383, "global_step": 119043, "epoch": 708} {"train_loss": -9.923340797424316, "global_step": 119044, "epoch": 708} {"train_loss": -9.927000999450684, "global_step": 119045, "epoch": 708} {"train_loss": -10.093252182006836, "global_step": 119046, "epoch": 708} {"train_loss": -9.563704490661621, "global_step": 119047, "epoch": 708} {"train_loss": -10.217350006103516, "global_step": 119048, "epoch": 708} {"train_loss": -10.057183265686035, "global_step": 119049, "epoch": 708} {"train_loss": -9.923601150512695, "global_step": 119050, "epoch": 708} {"train_loss": -10.144331932067871, "global_step": 119051, "epoch": 708} {"train_loss": -9.869750022888184, "global_step": 119052, "epoch": 708} {"train_loss": -10.426782608032227, "global_step": 119053, "epoch": 708} {"train_loss": -9.517006874084473, "global_step": 119054, "epoch": 708} {"train_loss": -9.948578834533691, "global_step": 119055, "epoch": 708} {"train_loss": -10.252405166625977, "global_step": 119056, "epoch": 708} {"train_loss": -9.784011840820312, "global_step": 119057, "epoch": 708} {"train_loss": -10.127994537353516, "global_step": 119058, "epoch": 708} {"train_loss": -9.735816955566406, "global_step": 119059, "epoch": 708} {"train_loss": -10.050332069396973, "global_step": 119060, "epoch": 708} {"train_loss": -9.718635559082031, "global_step": 119061, "epoch": 708} {"train_loss": -10.034608840942383, "global_step": 119062, "epoch": 708} {"train_loss": -9.9790620803833, "global_step": 119063, "epoch": 708} {"train_loss": -10.312664985656738, "global_step": 119064, "epoch": 708} {"train_loss": -9.981645584106445, "global_step": 119065, "epoch": 708} {"train_loss": -9.690738677978516, "global_step": 119066, "epoch": 708} {"train_loss": -10.095819473266602, "global_step": 119067, "epoch": 708} {"train_loss": -9.925167083740234, "global_step": 119068, "epoch": 708} {"train_loss": -10.119756698608398, "global_step": 119069, "epoch": 708} {"train_loss": -10.012384414672852, "global_step": 119070, "epoch": 708} {"train_loss": -10.091818809509277, "global_step": 119071, "epoch": 708} {"train_loss": -10.26877212524414, "global_step": 119072, "epoch": 708} {"train_loss": -9.836082458496094, "global_step": 119073, "epoch": 708} {"train_loss": -10.258462905883789, "global_step": 119074, "epoch": 708} {"train_loss": -10.072308540344238, "global_step": 119075, "epoch": 708} {"train_loss": -10.066585540771484, "global_step": 119076, "epoch": 708} {"train_loss": -10.228245735168457, "global_step": 119077, "epoch": 708} {"train_loss": -10.332999229431152, "global_step": 119078, "epoch": 708} {"train_loss": -9.803397178649902, "global_step": 119079, "epoch": 708} {"train_loss": -10.264744758605957, "global_step": 119080, "epoch": 708} {"train_loss": -10.073816299438477, "global_step": 119081, "epoch": 708} {"train_loss": -10.17411994934082, "global_step": 119082, "epoch": 708} {"train_loss": -10.302360534667969, "global_step": 119083, "epoch": 708} {"train_loss": -10.203676223754883, "global_step": 119084, "epoch": 708} {"train_loss": -10.18321704864502, "global_step": 119085, "epoch": 708} {"train_loss": -10.042832374572754, "global_step": 119086, "epoch": 708} {"train_loss": -10.271135330200195, "global_step": 119087, "epoch": 708} {"train_loss": -10.055145263671875, "global_step": 119088, "epoch": 708} {"train_loss": -10.289199829101562, "global_step": 119089, "epoch": 708} {"train_loss": -10.297504425048828, "global_step": 119090, "epoch": 708} {"train_loss": -10.347860336303711, "global_step": 119091, "epoch": 708} {"train_loss": -10.107600212097168, "global_step": 119092, "epoch": 708} {"train_loss": -10.153841018676758, "global_step": 119093, "epoch": 708} {"train_loss": -9.99561882019043, "global_step": 119094, "epoch": 708} {"train_loss": -10.18740177154541, "global_step": 119095, "epoch": 708} {"train_loss": -10.31077766418457, "global_step": 119096, "epoch": 708} {"train_loss": -10.334701538085938, "global_step": 119097, "epoch": 708} {"train_loss": -10.070175170898438, "global_step": 119098, "epoch": 708} {"train_loss": -10.039052963256836, "global_step": 119099, "epoch": 708} {"train_loss": -10.089142799377441, "global_step": 119100, "epoch": 708} {"train_loss": -9.74588394165039, "global_step": 119101, "epoch": 708} {"train_loss": -10.23898983001709, "global_step": 119102, "epoch": 708} {"train_loss": -10.427141189575195, "global_step": 119103, "epoch": 708} {"train_loss": -9.330500602722168, "global_step": 119104, "epoch": 708} {"train_loss": -10.320516586303711, "global_step": 119105, "epoch": 708} {"train_loss": -9.653470039367676, "global_step": 119106, "epoch": 708} {"train_loss": -9.141316413879395, "global_step": 119107, "epoch": 708} {"train_loss": -9.368154525756836, "global_step": 119108, "epoch": 708} {"train_loss": -9.17483901977539, "global_step": 119109, "epoch": 708} {"train_loss": -8.633662223815918, "global_step": 119110, "epoch": 708} {"train_loss": -10.07009938785008, "global_step": 119111, "epoch": 708, "val_loss": 214564.609375} {"train_loss": -8.226856231689453, "global_step": 119112, "epoch": 709} {"train_loss": -10.134815216064453, "global_step": 119113, "epoch": 709} {"train_loss": -8.687300682067871, "global_step": 119114, "epoch": 709} {"train_loss": -9.864351272583008, "global_step": 119115, "epoch": 709} {"train_loss": -9.709035873413086, "global_step": 119116, "epoch": 709} {"train_loss": -9.3340482711792, "global_step": 119117, "epoch": 709} {"train_loss": -10.053337097167969, "global_step": 119118, "epoch": 709} {"train_loss": -9.36922836303711, "global_step": 119119, "epoch": 709} {"train_loss": -9.824909210205078, "global_step": 119120, "epoch": 709} {"train_loss": -9.650969505310059, "global_step": 119121, "epoch": 709} {"train_loss": -9.613027572631836, "global_step": 119122, "epoch": 709} {"train_loss": -9.912874221801758, "global_step": 119123, "epoch": 709} {"train_loss": -9.729076385498047, "global_step": 119124, "epoch": 709} {"train_loss": -10.01557731628418, "global_step": 119125, "epoch": 709} {"train_loss": -10.14989185333252, "global_step": 119126, "epoch": 709} {"train_loss": -9.634685516357422, "global_step": 119127, "epoch": 709} {"train_loss": -10.145275115966797, "global_step": 119128, "epoch": 709} {"train_loss": -9.949136734008789, "global_step": 119129, "epoch": 709} {"train_loss": -9.843050003051758, "global_step": 119130, "epoch": 709} {"train_loss": -10.0309419631958, "global_step": 119131, "epoch": 709} {"train_loss": -10.066046714782715, "global_step": 119132, "epoch": 709} {"train_loss": -9.995677947998047, "global_step": 119133, "epoch": 709} {"train_loss": -9.925010681152344, "global_step": 119134, "epoch": 709} {"train_loss": -9.963193893432617, "global_step": 119135, "epoch": 709} {"train_loss": -9.965180397033691, "global_step": 119136, "epoch": 709} {"train_loss": -9.821617126464844, "global_step": 119137, "epoch": 709} {"train_loss": -10.008796691894531, "global_step": 119138, "epoch": 709} {"train_loss": -10.254039764404297, "global_step": 119139, "epoch": 709} {"train_loss": -9.878727912902832, "global_step": 119140, "epoch": 709} {"train_loss": -10.184401512145996, "global_step": 119141, "epoch": 709} {"train_loss": -10.034066200256348, "global_step": 119142, "epoch": 709} {"train_loss": -9.705551147460938, "global_step": 119143, "epoch": 709} {"train_loss": -10.351953506469727, "global_step": 119144, "epoch": 709} {"train_loss": -9.806633949279785, "global_step": 119145, "epoch": 709} {"train_loss": -9.816555976867676, "global_step": 119146, "epoch": 709} {"train_loss": -10.214286804199219, "global_step": 119147, "epoch": 709} {"train_loss": -10.152582168579102, "global_step": 119148, "epoch": 709} {"train_loss": -10.127518653869629, "global_step": 119149, "epoch": 709} {"train_loss": -10.142566680908203, "global_step": 119150, "epoch": 709} {"train_loss": -10.324576377868652, "global_step": 119151, "epoch": 709} {"train_loss": -10.064136505126953, "global_step": 119152, "epoch": 709} {"train_loss": -10.050037384033203, "global_step": 119153, "epoch": 709} {"train_loss": -9.805193901062012, "global_step": 119154, "epoch": 709} {"train_loss": -9.89517593383789, "global_step": 119155, "epoch": 709} {"train_loss": -9.941741943359375, "global_step": 119156, "epoch": 709} {"train_loss": -10.042994499206543, "global_step": 119157, "epoch": 709} {"train_loss": -9.707094192504883, "global_step": 119158, "epoch": 709} {"train_loss": -10.031686782836914, "global_step": 119159, "epoch": 709} {"train_loss": -10.04531478881836, "global_step": 119160, "epoch": 709} {"train_loss": -9.78441047668457, "global_step": 119161, "epoch": 709} {"train_loss": -9.973392486572266, "global_step": 119162, "epoch": 709} {"train_loss": -10.101982116699219, "global_step": 119163, "epoch": 709} {"train_loss": -9.67642593383789, "global_step": 119164, "epoch": 709} {"train_loss": -9.292461395263672, "global_step": 119165, "epoch": 709} {"train_loss": -9.689216613769531, "global_step": 119166, "epoch": 709} {"train_loss": -9.306386947631836, "global_step": 119167, "epoch": 709} {"train_loss": -9.675760269165039, "global_step": 119168, "epoch": 709} {"train_loss": -9.779870986938477, "global_step": 119169, "epoch": 709} {"train_loss": -9.490665435791016, "global_step": 119170, "epoch": 709} {"train_loss": -9.92155647277832, "global_step": 119171, "epoch": 709} {"train_loss": -9.744081497192383, "global_step": 119172, "epoch": 709} {"train_loss": -9.654446601867676, "global_step": 119173, "epoch": 709} {"train_loss": -9.653253555297852, "global_step": 119174, "epoch": 709} {"train_loss": -10.01165771484375, "global_step": 119175, "epoch": 709} {"train_loss": -9.815997123718262, "global_step": 119176, "epoch": 709} {"train_loss": -9.944252014160156, "global_step": 119177, "epoch": 709} {"train_loss": -9.955659866333008, "global_step": 119178, "epoch": 709} {"train_loss": -10.040568351745605, "global_step": 119179, "epoch": 709} {"train_loss": -9.684921264648438, "global_step": 119180, "epoch": 709} {"train_loss": -10.10742473602295, "global_step": 119181, "epoch": 709} {"train_loss": -10.094996452331543, "global_step": 119182, "epoch": 709} {"train_loss": -10.085759162902832, "global_step": 119183, "epoch": 709} {"train_loss": -10.029048919677734, "global_step": 119184, "epoch": 709} {"train_loss": -10.189945220947266, "global_step": 119185, "epoch": 709} {"train_loss": -10.261917114257812, "global_step": 119186, "epoch": 709} {"train_loss": -10.058426856994629, "global_step": 119187, "epoch": 709} {"train_loss": -10.197154998779297, "global_step": 119188, "epoch": 709} {"train_loss": -10.394527435302734, "global_step": 119189, "epoch": 709} {"train_loss": -10.272266387939453, "global_step": 119190, "epoch": 709} {"train_loss": -10.045164108276367, "global_step": 119191, "epoch": 709} {"train_loss": -10.317024230957031, "global_step": 119192, "epoch": 709} {"train_loss": -10.210689544677734, "global_step": 119193, "epoch": 709} {"train_loss": -10.099677085876465, "global_step": 119194, "epoch": 709} {"train_loss": -10.210350036621094, "global_step": 119195, "epoch": 709} {"train_loss": -10.11828899383545, "global_step": 119196, "epoch": 709} {"train_loss": -10.432287216186523, "global_step": 119197, "epoch": 709} {"train_loss": -10.296382904052734, "global_step": 119198, "epoch": 709} {"train_loss": -10.297710418701172, "global_step": 119199, "epoch": 709} {"train_loss": -10.259706497192383, "global_step": 119200, "epoch": 709} {"train_loss": -10.031716346740723, "global_step": 119201, "epoch": 709} {"train_loss": -10.191238403320312, "global_step": 119202, "epoch": 709} {"train_loss": -10.13748550415039, "global_step": 119203, "epoch": 709} {"train_loss": -10.38552188873291, "global_step": 119204, "epoch": 709} {"train_loss": -10.268411636352539, "global_step": 119205, "epoch": 709} {"train_loss": -10.347978591918945, "global_step": 119206, "epoch": 709} {"train_loss": -10.0857572555542, "global_step": 119207, "epoch": 709} {"train_loss": -10.475194931030273, "global_step": 119208, "epoch": 709} {"train_loss": -10.179094314575195, "global_step": 119209, "epoch": 709} {"train_loss": -10.36755657196045, "global_step": 119210, "epoch": 709} {"train_loss": -10.213455200195312, "global_step": 119211, "epoch": 709} {"train_loss": -10.048547744750977, "global_step": 119212, "epoch": 709} {"train_loss": -9.837930679321289, "global_step": 119213, "epoch": 709} {"train_loss": -9.992405891418457, "global_step": 119214, "epoch": 709} {"train_loss": -9.76264762878418, "global_step": 119215, "epoch": 709} {"train_loss": -10.12995719909668, "global_step": 119216, "epoch": 709} {"train_loss": -10.602392196655273, "global_step": 119217, "epoch": 709} {"train_loss": -10.002684593200684, "global_step": 119218, "epoch": 709} {"train_loss": -10.296137809753418, "global_step": 119219, "epoch": 709} {"train_loss": -10.466314315795898, "global_step": 119220, "epoch": 709} {"train_loss": -10.149118423461914, "global_step": 119221, "epoch": 709} {"train_loss": -10.229576110839844, "global_step": 119222, "epoch": 709} {"train_loss": -10.26196575164795, "global_step": 119223, "epoch": 709} {"train_loss": -10.257616996765137, "global_step": 119224, "epoch": 709} {"train_loss": -10.074230194091797, "global_step": 119225, "epoch": 709} {"train_loss": -10.107645034790039, "global_step": 119226, "epoch": 709} {"train_loss": -10.284564018249512, "global_step": 119227, "epoch": 709} {"train_loss": -10.074504852294922, "global_step": 119228, "epoch": 709} {"train_loss": -10.335289001464844, "global_step": 119229, "epoch": 709} {"train_loss": -10.137575149536133, "global_step": 119230, "epoch": 709} {"train_loss": -10.239526748657227, "global_step": 119231, "epoch": 709} {"train_loss": -10.213737487792969, "global_step": 119232, "epoch": 709} {"train_loss": -10.179094314575195, "global_step": 119233, "epoch": 709} {"train_loss": -10.29914665222168, "global_step": 119234, "epoch": 709} {"train_loss": -10.319524765014648, "global_step": 119235, "epoch": 709} {"train_loss": -10.27896499633789, "global_step": 119236, "epoch": 709} {"train_loss": -10.374481201171875, "global_step": 119237, "epoch": 709} {"train_loss": -10.445697784423828, "global_step": 119238, "epoch": 709} {"train_loss": -10.12618637084961, "global_step": 119239, "epoch": 709} {"train_loss": -10.070556640625, "global_step": 119240, "epoch": 709} {"train_loss": -10.154653549194336, "global_step": 119241, "epoch": 709} {"train_loss": -10.145066261291504, "global_step": 119242, "epoch": 709} {"train_loss": -10.41386604309082, "global_step": 119243, "epoch": 709} {"train_loss": -10.336310386657715, "global_step": 119244, "epoch": 709} {"train_loss": -10.125101089477539, "global_step": 119245, "epoch": 709} {"train_loss": -10.348807334899902, "global_step": 119246, "epoch": 709} {"train_loss": -10.238031387329102, "global_step": 119247, "epoch": 709} {"train_loss": -10.390559196472168, "global_step": 119248, "epoch": 709} {"train_loss": -10.196447372436523, "global_step": 119249, "epoch": 709} {"train_loss": -10.342321395874023, "global_step": 119250, "epoch": 709} {"train_loss": -10.547608375549316, "global_step": 119251, "epoch": 709} {"train_loss": -10.421318054199219, "global_step": 119252, "epoch": 709} {"train_loss": -10.441381454467773, "global_step": 119253, "epoch": 709} {"train_loss": -10.424489974975586, "global_step": 119254, "epoch": 709} {"train_loss": -10.17388916015625, "global_step": 119255, "epoch": 709} {"train_loss": -10.172388076782227, "global_step": 119256, "epoch": 709} {"train_loss": -10.257160186767578, "global_step": 119257, "epoch": 709} {"train_loss": -9.793588638305664, "global_step": 119258, "epoch": 709} {"train_loss": -10.4753999710083, "global_step": 119259, "epoch": 709} {"train_loss": -9.77492904663086, "global_step": 119260, "epoch": 709} {"train_loss": -10.091373443603516, "global_step": 119261, "epoch": 709} {"train_loss": -10.096212387084961, "global_step": 119262, "epoch": 709} {"train_loss": -9.965071678161621, "global_step": 119263, "epoch": 709} {"train_loss": -9.594462394714355, "global_step": 119264, "epoch": 709} {"train_loss": -9.585890769958496, "global_step": 119265, "epoch": 709} {"train_loss": -10.24805736541748, "global_step": 119266, "epoch": 709} {"train_loss": -9.542485237121582, "global_step": 119267, "epoch": 709} {"train_loss": -10.154006958007812, "global_step": 119268, "epoch": 709} {"train_loss": -10.015408515930176, "global_step": 119269, "epoch": 709} {"train_loss": -9.76529598236084, "global_step": 119270, "epoch": 709} {"train_loss": -9.85318374633789, "global_step": 119271, "epoch": 709} {"train_loss": -9.5736665725708, "global_step": 119272, "epoch": 709} {"train_loss": -10.087458610534668, "global_step": 119273, "epoch": 709} {"train_loss": -9.941452980041504, "global_step": 119274, "epoch": 709} {"train_loss": -9.972787857055664, "global_step": 119275, "epoch": 709} {"train_loss": -9.829989433288574, "global_step": 119276, "epoch": 709} {"train_loss": -9.877184867858887, "global_step": 119277, "epoch": 709} {"train_loss": -9.706754684448242, "global_step": 119278, "epoch": 709} {"train_loss": -10.025285993303571, "global_step": 119279, "epoch": 709, "val_loss": 213548.59375} {"train_loss": -10.113273620605469, "global_step": 119280, "epoch": 710} {"train_loss": -9.641950607299805, "global_step": 119281, "epoch": 710} {"train_loss": -10.177855491638184, "global_step": 119282, "epoch": 710} {"train_loss": -9.830619812011719, "global_step": 119283, "epoch": 710} {"train_loss": -10.15854263305664, "global_step": 119284, "epoch": 710} {"train_loss": -9.727676391601562, "global_step": 119285, "epoch": 710} {"train_loss": -10.201427459716797, "global_step": 119286, "epoch": 710} {"train_loss": -9.769205093383789, "global_step": 119287, "epoch": 710} {"train_loss": -10.206016540527344, "global_step": 119288, "epoch": 710} {"train_loss": -9.986284255981445, "global_step": 119289, "epoch": 710} {"train_loss": -10.006841659545898, "global_step": 119290, "epoch": 710} {"train_loss": -10.192527770996094, "global_step": 119291, "epoch": 710} {"train_loss": -9.956815719604492, "global_step": 119292, "epoch": 710} {"train_loss": -10.211877822875977, "global_step": 119293, "epoch": 710} {"train_loss": -10.144777297973633, "global_step": 119294, "epoch": 710} {"train_loss": -10.335306167602539, "global_step": 119295, "epoch": 710} {"train_loss": -10.177837371826172, "global_step": 119296, "epoch": 710} {"train_loss": -10.37352180480957, "global_step": 119297, "epoch": 710} {"train_loss": -10.145147323608398, "global_step": 119298, "epoch": 710} {"train_loss": -10.176719665527344, "global_step": 119299, "epoch": 710} {"train_loss": -10.291982650756836, "global_step": 119300, "epoch": 710} {"train_loss": -10.224828720092773, "global_step": 119301, "epoch": 710} {"train_loss": -10.36341667175293, "global_step": 119302, "epoch": 710} {"train_loss": -10.341611862182617, "global_step": 119303, "epoch": 710} {"train_loss": -10.403153419494629, "global_step": 119304, "epoch": 710} {"train_loss": -10.308121681213379, "global_step": 119305, "epoch": 710} {"train_loss": -10.581122398376465, "global_step": 119306, "epoch": 710} {"train_loss": -10.412328720092773, "global_step": 119307, "epoch": 710} {"train_loss": -10.462991714477539, "global_step": 119308, "epoch": 710} {"train_loss": -10.405508041381836, "global_step": 119309, "epoch": 710} {"train_loss": -10.334362030029297, "global_step": 119310, "epoch": 710} {"train_loss": -10.274213790893555, "global_step": 119311, "epoch": 710} {"train_loss": -10.265317916870117, "global_step": 119312, "epoch": 710} {"train_loss": -10.410959243774414, "global_step": 119313, "epoch": 710} {"train_loss": -10.338361740112305, "global_step": 119314, "epoch": 710} {"train_loss": -10.235601425170898, "global_step": 119315, "epoch": 710} {"train_loss": -10.484546661376953, "global_step": 119316, "epoch": 710} {"train_loss": -10.489611625671387, "global_step": 119317, "epoch": 710} {"train_loss": -10.400297164916992, "global_step": 119318, "epoch": 710} {"train_loss": -10.526527404785156, "global_step": 119319, "epoch": 710} {"train_loss": -10.417379379272461, "global_step": 119320, "epoch": 710} {"train_loss": -10.081716537475586, "global_step": 119321, "epoch": 710} {"train_loss": -9.97116470336914, "global_step": 119322, "epoch": 710} {"train_loss": -10.426820755004883, "global_step": 119323, "epoch": 710} {"train_loss": -9.871063232421875, "global_step": 119324, "epoch": 710} {"train_loss": -10.271961212158203, "global_step": 119325, "epoch": 710} {"train_loss": -10.01218032836914, "global_step": 119326, "epoch": 710} {"train_loss": -9.687515258789062, "global_step": 119327, "epoch": 710} {"train_loss": -10.112936973571777, "global_step": 119328, "epoch": 710} {"train_loss": -9.769159317016602, "global_step": 119329, "epoch": 710} {"train_loss": -9.909709930419922, "global_step": 119330, "epoch": 710} {"train_loss": -10.272989273071289, "global_step": 119331, "epoch": 710} {"train_loss": -10.16101360321045, "global_step": 119332, "epoch": 710} {"train_loss": -10.044811248779297, "global_step": 119333, "epoch": 710} {"train_loss": -9.870321273803711, "global_step": 119334, "epoch": 710} {"train_loss": -10.278617858886719, "global_step": 119335, "epoch": 710} {"train_loss": -9.901895523071289, "global_step": 119336, "epoch": 710} {"train_loss": -9.99146556854248, "global_step": 119337, "epoch": 710} {"train_loss": -10.103850364685059, "global_step": 119338, "epoch": 710} {"train_loss": -9.75514030456543, "global_step": 119339, "epoch": 710} {"train_loss": -10.244667053222656, "global_step": 119340, "epoch": 710} {"train_loss": -9.786828994750977, "global_step": 119341, "epoch": 710} {"train_loss": -10.06851577758789, "global_step": 119342, "epoch": 710} {"train_loss": -9.742868423461914, "global_step": 119343, "epoch": 710} {"train_loss": -10.115732192993164, "global_step": 119344, "epoch": 710} {"train_loss": -9.843839645385742, "global_step": 119345, "epoch": 710} {"train_loss": -10.082330703735352, "global_step": 119346, "epoch": 710} {"train_loss": -10.019149780273438, "global_step": 119347, "epoch": 710} {"train_loss": -10.263919830322266, "global_step": 119348, "epoch": 710} {"train_loss": -9.99618911743164, "global_step": 119349, "epoch": 710} {"train_loss": -9.645759582519531, "global_step": 119350, "epoch": 710} {"train_loss": -9.80057430267334, "global_step": 119351, "epoch": 710} {"train_loss": -9.824361801147461, "global_step": 119352, "epoch": 710} {"train_loss": -10.015565872192383, "global_step": 119353, "epoch": 710} {"train_loss": -9.841621398925781, "global_step": 119354, "epoch": 710} {"train_loss": -9.963338851928711, "global_step": 119355, "epoch": 710} {"train_loss": -9.972827911376953, "global_step": 119356, "epoch": 710} {"train_loss": -9.974992752075195, "global_step": 119357, "epoch": 710} {"train_loss": -10.307738304138184, "global_step": 119358, "epoch": 710} {"train_loss": -10.137361526489258, "global_step": 119359, "epoch": 710} {"train_loss": -10.047231674194336, "global_step": 119360, "epoch": 710} {"train_loss": -10.287873268127441, "global_step": 119361, "epoch": 710} {"train_loss": -10.120179176330566, "global_step": 119362, "epoch": 710} {"train_loss": -10.024635314941406, "global_step": 119363, "epoch": 710} {"train_loss": -10.150930404663086, "global_step": 119364, "epoch": 710} {"train_loss": -10.025484085083008, "global_step": 119365, "epoch": 710} {"train_loss": -10.320545196533203, "global_step": 119366, "epoch": 710} {"train_loss": -10.14348030090332, "global_step": 119367, "epoch": 710} {"train_loss": -10.083841323852539, "global_step": 119368, "epoch": 710} {"train_loss": -10.123984336853027, "global_step": 119369, "epoch": 710} {"train_loss": -10.087553024291992, "global_step": 119370, "epoch": 710} {"train_loss": -10.300064086914062, "global_step": 119371, "epoch": 710} {"train_loss": -10.117141723632812, "global_step": 119372, "epoch": 710} {"train_loss": -10.06116771697998, "global_step": 119373, "epoch": 710} {"train_loss": -10.141034126281738, "global_step": 119374, "epoch": 710} {"train_loss": -10.311013221740723, "global_step": 119375, "epoch": 710} {"train_loss": -10.139402389526367, "global_step": 119376, "epoch": 710} {"train_loss": -10.185216903686523, "global_step": 119377, "epoch": 710} {"train_loss": -10.259230613708496, "global_step": 119378, "epoch": 710} {"train_loss": -9.543601036071777, "global_step": 119379, "epoch": 710} {"train_loss": -10.366111755371094, "global_step": 119380, "epoch": 710} {"train_loss": -9.821050643920898, "global_step": 119381, "epoch": 710} {"train_loss": -9.827247619628906, "global_step": 119382, "epoch": 710} {"train_loss": -10.353959083557129, "global_step": 119383, "epoch": 710} {"train_loss": -9.705810546875, "global_step": 119384, "epoch": 710} {"train_loss": -10.069419860839844, "global_step": 119385, "epoch": 710} {"train_loss": -9.744060516357422, "global_step": 119386, "epoch": 710} {"train_loss": -9.74776840209961, "global_step": 119387, "epoch": 710} {"train_loss": -9.602995872497559, "global_step": 119388, "epoch": 710} {"train_loss": -9.663312911987305, "global_step": 119389, "epoch": 710} {"train_loss": -10.112226486206055, "global_step": 119390, "epoch": 710} {"train_loss": -9.868528366088867, "global_step": 119391, "epoch": 710} {"train_loss": -9.742000579833984, "global_step": 119392, "epoch": 710} {"train_loss": -9.942944526672363, "global_step": 119393, "epoch": 710} {"train_loss": -9.523728370666504, "global_step": 119394, "epoch": 710} {"train_loss": -10.222861289978027, "global_step": 119395, "epoch": 710} {"train_loss": -10.064281463623047, "global_step": 119396, "epoch": 710} {"train_loss": -9.859180450439453, "global_step": 119397, "epoch": 710} {"train_loss": -10.304400444030762, "global_step": 119398, "epoch": 710} {"train_loss": -10.105818748474121, "global_step": 119399, "epoch": 710} {"train_loss": -9.973230361938477, "global_step": 119400, "epoch": 710} {"train_loss": -9.86163330078125, "global_step": 119401, "epoch": 710} {"train_loss": -10.122963905334473, "global_step": 119402, "epoch": 710} {"train_loss": -10.086519241333008, "global_step": 119403, "epoch": 710} {"train_loss": -10.186161994934082, "global_step": 119404, "epoch": 710} {"train_loss": -10.229681968688965, "global_step": 119405, "epoch": 710} {"train_loss": -10.178301811218262, "global_step": 119406, "epoch": 710} {"train_loss": -10.096586227416992, "global_step": 119407, "epoch": 710} {"train_loss": -10.309433937072754, "global_step": 119408, "epoch": 710} {"train_loss": -10.497230529785156, "global_step": 119409, "epoch": 710} {"train_loss": -10.251605987548828, "global_step": 119410, "epoch": 710} {"train_loss": -10.308279037475586, "global_step": 119411, "epoch": 710} {"train_loss": -10.250336647033691, "global_step": 119412, "epoch": 710} {"train_loss": -10.125785827636719, "global_step": 119413, "epoch": 710} {"train_loss": -10.200762748718262, "global_step": 119414, "epoch": 710} {"train_loss": -10.421921730041504, "global_step": 119415, "epoch": 710} {"train_loss": -10.380091667175293, "global_step": 119416, "epoch": 710} {"train_loss": -10.297100067138672, "global_step": 119417, "epoch": 710} {"train_loss": -10.277334213256836, "global_step": 119418, "epoch": 710} {"train_loss": -10.262575149536133, "global_step": 119419, "epoch": 710} {"train_loss": -10.297464370727539, "global_step": 119420, "epoch": 710} {"train_loss": -10.25014877319336, "global_step": 119421, "epoch": 710} {"train_loss": -10.254606246948242, "global_step": 119422, "epoch": 710} {"train_loss": -10.251049041748047, "global_step": 119423, "epoch": 710} {"train_loss": -10.129776954650879, "global_step": 119424, "epoch": 710} {"train_loss": -10.117033004760742, "global_step": 119425, "epoch": 710} {"train_loss": -10.132833480834961, "global_step": 119426, "epoch": 710} {"train_loss": -9.795276641845703, "global_step": 119427, "epoch": 710} {"train_loss": -10.51795768737793, "global_step": 119428, "epoch": 710} {"train_loss": -10.14012336730957, "global_step": 119429, "epoch": 710} {"train_loss": -10.279899597167969, "global_step": 119430, "epoch": 710} {"train_loss": -10.258214950561523, "global_step": 119431, "epoch": 710} {"train_loss": -10.33384895324707, "global_step": 119432, "epoch": 710} {"train_loss": -10.166141510009766, "global_step": 119433, "epoch": 710} {"train_loss": -10.306388854980469, "global_step": 119434, "epoch": 710} {"train_loss": -10.057300567626953, "global_step": 119435, "epoch": 710} {"train_loss": -10.031012535095215, "global_step": 119436, "epoch": 710} {"train_loss": -9.986242294311523, "global_step": 119437, "epoch": 710} {"train_loss": -9.656171798706055, "global_step": 119438, "epoch": 710} {"train_loss": -10.19224739074707, "global_step": 119439, "epoch": 710} {"train_loss": -9.542255401611328, "global_step": 119440, "epoch": 710} {"train_loss": -10.247682571411133, "global_step": 119441, "epoch": 710} {"train_loss": -9.829957008361816, "global_step": 119442, "epoch": 710} {"train_loss": -10.183097839355469, "global_step": 119443, "epoch": 710} {"train_loss": -10.30286979675293, "global_step": 119444, "epoch": 710} {"train_loss": -9.833553314208984, "global_step": 119445, "epoch": 710} {"train_loss": -9.720873832702637, "global_step": 119446, "epoch": 710} {"train_loss": -10.107503981817336, "global_step": 119447, "epoch": 710, "val_loss": 213510.9375, "train_action_mse_error": 2.329102039337158} {"train_loss": -9.53079605102539, "global_step": 119448, "epoch": 711} {"train_loss": -9.550163269042969, "global_step": 119449, "epoch": 711} {"train_loss": -10.22800064086914, "global_step": 119450, "epoch": 711} {"train_loss": -9.490714073181152, "global_step": 119451, "epoch": 711} {"train_loss": -10.29489517211914, "global_step": 119452, "epoch": 711} {"train_loss": -9.652149200439453, "global_step": 119453, "epoch": 711} {"train_loss": -9.644255638122559, "global_step": 119454, "epoch": 711} {"train_loss": -10.10276985168457, "global_step": 119455, "epoch": 711} {"train_loss": -9.852313041687012, "global_step": 119456, "epoch": 711} {"train_loss": -9.943145751953125, "global_step": 119457, "epoch": 711} {"train_loss": -9.869890213012695, "global_step": 119458, "epoch": 711} {"train_loss": -10.073504447937012, "global_step": 119459, "epoch": 711} {"train_loss": -10.081055641174316, "global_step": 119460, "epoch": 711} {"train_loss": -9.912440299987793, "global_step": 119461, "epoch": 711} {"train_loss": -10.038925170898438, "global_step": 119462, "epoch": 711} {"train_loss": -10.157028198242188, "global_step": 119463, "epoch": 711} {"train_loss": -9.97502326965332, "global_step": 119464, "epoch": 711} {"train_loss": -10.103303909301758, "global_step": 119465, "epoch": 711} {"train_loss": -9.86193561553955, "global_step": 119466, "epoch": 711} {"train_loss": -10.272933006286621, "global_step": 119467, "epoch": 711} {"train_loss": -10.060714721679688, "global_step": 119468, "epoch": 711} {"train_loss": -10.098714828491211, "global_step": 119469, "epoch": 711} {"train_loss": -10.272363662719727, "global_step": 119470, "epoch": 711} {"train_loss": -10.340967178344727, "global_step": 119471, "epoch": 711} {"train_loss": -10.285163879394531, "global_step": 119472, "epoch": 711} {"train_loss": -10.080459594726562, "global_step": 119473, "epoch": 711} {"train_loss": -10.28795051574707, "global_step": 119474, "epoch": 711} {"train_loss": -10.286829948425293, "global_step": 119475, "epoch": 711} {"train_loss": -10.334970474243164, "global_step": 119476, "epoch": 711} {"train_loss": -10.20112419128418, "global_step": 119477, "epoch": 711} {"train_loss": -10.167668342590332, "global_step": 119478, "epoch": 711} {"train_loss": -10.230058670043945, "global_step": 119479, "epoch": 711} {"train_loss": -10.31292724609375, "global_step": 119480, "epoch": 711} {"train_loss": -10.17986011505127, "global_step": 119481, "epoch": 711} {"train_loss": -10.453947067260742, "global_step": 119482, "epoch": 711} {"train_loss": -10.263921737670898, "global_step": 119483, "epoch": 711} {"train_loss": -10.421594619750977, "global_step": 119484, "epoch": 711} {"train_loss": -10.379966735839844, "global_step": 119485, "epoch": 711} {"train_loss": -10.23035717010498, "global_step": 119486, "epoch": 711} {"train_loss": -10.418078422546387, "global_step": 119487, "epoch": 711} {"train_loss": -10.410693168640137, "global_step": 119488, "epoch": 711} {"train_loss": -10.320646286010742, "global_step": 119489, "epoch": 711} {"train_loss": -10.196863174438477, "global_step": 119490, "epoch": 711} {"train_loss": -10.209878921508789, "global_step": 119491, "epoch": 711} {"train_loss": -9.865880012512207, "global_step": 119492, "epoch": 711} {"train_loss": -10.33081340789795, "global_step": 119493, "epoch": 711} {"train_loss": -9.903909683227539, "global_step": 119494, "epoch": 711} {"train_loss": -10.173521041870117, "global_step": 119495, "epoch": 711} {"train_loss": -10.190404891967773, "global_step": 119496, "epoch": 711} {"train_loss": -9.93152904510498, "global_step": 119497, "epoch": 711} {"train_loss": -9.948135375976562, "global_step": 119498, "epoch": 711} {"train_loss": -10.233375549316406, "global_step": 119499, "epoch": 711} {"train_loss": -9.753252029418945, "global_step": 119500, "epoch": 711} {"train_loss": -9.818521499633789, "global_step": 119501, "epoch": 711} {"train_loss": -10.080148696899414, "global_step": 119502, "epoch": 711} {"train_loss": -9.616571426391602, "global_step": 119503, "epoch": 711} {"train_loss": -10.032441139221191, "global_step": 119504, "epoch": 711} {"train_loss": -9.740721702575684, "global_step": 119505, "epoch": 711} {"train_loss": -10.129186630249023, "global_step": 119506, "epoch": 711} {"train_loss": -9.97873306274414, "global_step": 119507, "epoch": 711} {"train_loss": -9.855627059936523, "global_step": 119508, "epoch": 711} {"train_loss": -9.912275314331055, "global_step": 119509, "epoch": 711} {"train_loss": -10.106239318847656, "global_step": 119510, "epoch": 711} {"train_loss": -9.49848747253418, "global_step": 119511, "epoch": 711} {"train_loss": -10.177020072937012, "global_step": 119512, "epoch": 711} {"train_loss": -9.67178726196289, "global_step": 119513, "epoch": 711} {"train_loss": -9.755013465881348, "global_step": 119514, "epoch": 711} {"train_loss": -9.548142433166504, "global_step": 119515, "epoch": 711} {"train_loss": -9.508898735046387, "global_step": 119516, "epoch": 711} {"train_loss": -9.692625045776367, "global_step": 119517, "epoch": 711} {"train_loss": -9.803121566772461, "global_step": 119518, "epoch": 711} {"train_loss": -9.876691818237305, "global_step": 119519, "epoch": 711} {"train_loss": -9.689279556274414, "global_step": 119520, "epoch": 711} {"train_loss": -10.019847869873047, "global_step": 119521, "epoch": 711} {"train_loss": -9.772943496704102, "global_step": 119522, "epoch": 711} {"train_loss": -10.166688919067383, "global_step": 119523, "epoch": 711} {"train_loss": -9.87952995300293, "global_step": 119524, "epoch": 711} {"train_loss": -9.944276809692383, "global_step": 119525, "epoch": 711} {"train_loss": -9.658873558044434, "global_step": 119526, "epoch": 711} {"train_loss": -10.213010787963867, "global_step": 119527, "epoch": 711} {"train_loss": -9.919404983520508, "global_step": 119528, "epoch": 711} {"train_loss": -9.81624984741211, "global_step": 119529, "epoch": 711} {"train_loss": -10.250286102294922, "global_step": 119530, "epoch": 711} {"train_loss": -9.976649284362793, "global_step": 119531, "epoch": 711} {"train_loss": -10.054670333862305, "global_step": 119532, "epoch": 711} {"train_loss": -10.155534744262695, "global_step": 119533, "epoch": 711} {"train_loss": -10.131179809570312, "global_step": 119534, "epoch": 711} {"train_loss": -9.77333927154541, "global_step": 119535, "epoch": 711} {"train_loss": -10.005443572998047, "global_step": 119536, "epoch": 711} {"train_loss": -9.9390869140625, "global_step": 119537, "epoch": 711} {"train_loss": -10.082467079162598, "global_step": 119538, "epoch": 711} {"train_loss": -10.090629577636719, "global_step": 119539, "epoch": 711} {"train_loss": -9.787294387817383, "global_step": 119540, "epoch": 711} {"train_loss": -10.19321060180664, "global_step": 119541, "epoch": 711} {"train_loss": -10.245150566101074, "global_step": 119542, "epoch": 711} {"train_loss": -10.284509658813477, "global_step": 119543, "epoch": 711} {"train_loss": -10.303750038146973, "global_step": 119544, "epoch": 711} {"train_loss": -10.33871078491211, "global_step": 119545, "epoch": 711} {"train_loss": -10.278656959533691, "global_step": 119546, "epoch": 711} {"train_loss": -10.341885566711426, "global_step": 119547, "epoch": 711} {"train_loss": -10.26889419555664, "global_step": 119548, "epoch": 711} {"train_loss": -10.23831558227539, "global_step": 119549, "epoch": 711} {"train_loss": -10.363960266113281, "global_step": 119550, "epoch": 711} {"train_loss": -10.266772270202637, "global_step": 119551, "epoch": 711} {"train_loss": -10.303430557250977, "global_step": 119552, "epoch": 711} {"train_loss": -10.348787307739258, "global_step": 119553, "epoch": 711} {"train_loss": -10.101531982421875, "global_step": 119554, "epoch": 711} {"train_loss": -10.239389419555664, "global_step": 119555, "epoch": 711} {"train_loss": -10.13136100769043, "global_step": 119556, "epoch": 711} {"train_loss": -10.276998519897461, "global_step": 119557, "epoch": 711} {"train_loss": -10.109538078308105, "global_step": 119558, "epoch": 711} {"train_loss": -10.57734203338623, "global_step": 119559, "epoch": 711} {"train_loss": -10.17477035522461, "global_step": 119560, "epoch": 711} {"train_loss": -10.46236515045166, "global_step": 119561, "epoch": 711} {"train_loss": -10.257701873779297, "global_step": 119562, "epoch": 711} {"train_loss": -10.40754508972168, "global_step": 119563, "epoch": 711} {"train_loss": -10.067317962646484, "global_step": 119564, "epoch": 711} {"train_loss": -10.320554733276367, "global_step": 119565, "epoch": 711} {"train_loss": -10.090494155883789, "global_step": 119566, "epoch": 711} {"train_loss": -9.209667205810547, "global_step": 119567, "epoch": 711} {"train_loss": -10.51217269897461, "global_step": 119568, "epoch": 711} {"train_loss": -8.623428344726562, "global_step": 119569, "epoch": 711} {"train_loss": -8.668107986450195, "global_step": 119570, "epoch": 711} {"train_loss": -8.317195892333984, "global_step": 119571, "epoch": 711} {"train_loss": -8.567466735839844, "global_step": 119572, "epoch": 711} {"train_loss": -8.146764755249023, "global_step": 119573, "epoch": 711} {"train_loss": -9.51309585571289, "global_step": 119574, "epoch": 711} {"train_loss": -8.447444915771484, "global_step": 119575, "epoch": 711} {"train_loss": -8.722126960754395, "global_step": 119576, "epoch": 711} {"train_loss": -9.043766021728516, "global_step": 119577, "epoch": 711} {"train_loss": -8.845054626464844, "global_step": 119578, "epoch": 711} {"train_loss": -8.987356185913086, "global_step": 119579, "epoch": 711} {"train_loss": -9.211706161499023, "global_step": 119580, "epoch": 711} {"train_loss": -9.457599639892578, "global_step": 119581, "epoch": 711} {"train_loss": -9.424640655517578, "global_step": 119582, "epoch": 711} {"train_loss": -9.450187683105469, "global_step": 119583, "epoch": 711} {"train_loss": -9.769925117492676, "global_step": 119584, "epoch": 711} {"train_loss": -9.280057907104492, "global_step": 119585, "epoch": 711} {"train_loss": -9.881142616271973, "global_step": 119586, "epoch": 711} {"train_loss": -9.736799240112305, "global_step": 119587, "epoch": 711} {"train_loss": -9.814231872558594, "global_step": 119588, "epoch": 711} {"train_loss": -9.834489822387695, "global_step": 119589, "epoch": 711} {"train_loss": -9.810306549072266, "global_step": 119590, "epoch": 711} {"train_loss": -9.698091506958008, "global_step": 119591, "epoch": 711} {"train_loss": -9.571893692016602, "global_step": 119592, "epoch": 711} {"train_loss": -9.767580032348633, "global_step": 119593, "epoch": 711} {"train_loss": -9.845048904418945, "global_step": 119594, "epoch": 711} {"train_loss": -9.904541969299316, "global_step": 119595, "epoch": 711} {"train_loss": -10.045494079589844, "global_step": 119596, "epoch": 711} {"train_loss": -9.804275512695312, "global_step": 119597, "epoch": 711} {"train_loss": -9.726358413696289, "global_step": 119598, "epoch": 711} {"train_loss": -9.910813331604004, "global_step": 119599, "epoch": 711} {"train_loss": -9.82645034790039, "global_step": 119600, "epoch": 711} {"train_loss": -10.076719284057617, "global_step": 119601, "epoch": 711} {"train_loss": -9.889640808105469, "global_step": 119602, "epoch": 711} {"train_loss": -10.01859188079834, "global_step": 119603, "epoch": 711} {"train_loss": -10.243227005004883, "global_step": 119604, "epoch": 711} {"train_loss": -9.799334526062012, "global_step": 119605, "epoch": 711} {"train_loss": -10.053476333618164, "global_step": 119606, "epoch": 711} {"train_loss": -10.186668395996094, "global_step": 119607, "epoch": 711} {"train_loss": -10.175037384033203, "global_step": 119608, "epoch": 711} {"train_loss": -10.165279388427734, "global_step": 119609, "epoch": 711} {"train_loss": -10.029909133911133, "global_step": 119610, "epoch": 711} {"train_loss": -10.163288116455078, "global_step": 119611, "epoch": 711} {"train_loss": -10.141008377075195, "global_step": 119612, "epoch": 711} {"train_loss": -10.179729461669922, "global_step": 119613, "epoch": 711} {"train_loss": -10.494237899780273, "global_step": 119614, "epoch": 711} {"train_loss": -9.937703950064522, "global_step": 119615, "epoch": 711, "val_loss": 202710.921875} {"train_loss": -10.099737167358398, "global_step": 119616, "epoch": 712} {"train_loss": -10.471177101135254, "global_step": 119617, "epoch": 712} {"train_loss": -10.047294616699219, "global_step": 119618, "epoch": 712} {"train_loss": -10.267648696899414, "global_step": 119619, "epoch": 712} {"train_loss": -10.223548889160156, "global_step": 119620, "epoch": 712} {"train_loss": -10.15073013305664, "global_step": 119621, "epoch": 712} {"train_loss": -10.226951599121094, "global_step": 119622, "epoch": 712} {"train_loss": -10.067401885986328, "global_step": 119623, "epoch": 712} {"train_loss": -9.821856498718262, "global_step": 119624, "epoch": 712} {"train_loss": -10.174975395202637, "global_step": 119625, "epoch": 712} {"train_loss": -10.153268814086914, "global_step": 119626, "epoch": 712} {"train_loss": -10.221489906311035, "global_step": 119627, "epoch": 712} {"train_loss": -10.208690643310547, "global_step": 119628, "epoch": 712} {"train_loss": -9.930685997009277, "global_step": 119629, "epoch": 712} {"train_loss": -9.975464820861816, "global_step": 119630, "epoch": 712} {"train_loss": -9.59417724609375, "global_step": 119631, "epoch": 712} {"train_loss": -9.016895294189453, "global_step": 119632, "epoch": 712} {"train_loss": -10.13669204711914, "global_step": 119633, "epoch": 712} {"train_loss": -9.128999710083008, "global_step": 119634, "epoch": 712} {"train_loss": -9.243818283081055, "global_step": 119635, "epoch": 712} {"train_loss": -9.873184204101562, "global_step": 119636, "epoch": 712} {"train_loss": -9.52963638305664, "global_step": 119637, "epoch": 712} {"train_loss": -10.045696258544922, "global_step": 119638, "epoch": 712} {"train_loss": -9.145833969116211, "global_step": 119639, "epoch": 712} {"train_loss": -9.746208190917969, "global_step": 119640, "epoch": 712} {"train_loss": -10.04334831237793, "global_step": 119641, "epoch": 712} {"train_loss": -9.750630378723145, "global_step": 119642, "epoch": 712} {"train_loss": -9.963046073913574, "global_step": 119643, "epoch": 712} {"train_loss": -10.057926177978516, "global_step": 119644, "epoch": 712} {"train_loss": -9.916202545166016, "global_step": 119645, "epoch": 712} {"train_loss": -9.834758758544922, "global_step": 119646, "epoch": 712} {"train_loss": -10.082679748535156, "global_step": 119647, "epoch": 712} {"train_loss": -10.099516868591309, "global_step": 119648, "epoch": 712} {"train_loss": -10.067244529724121, "global_step": 119649, "epoch": 712} {"train_loss": -9.754762649536133, "global_step": 119650, "epoch": 712} {"train_loss": -9.611474990844727, "global_step": 119651, "epoch": 712} {"train_loss": -9.97947883605957, "global_step": 119652, "epoch": 712} {"train_loss": -9.996708869934082, "global_step": 119653, "epoch": 712} {"train_loss": -10.101847648620605, "global_step": 119654, "epoch": 712} {"train_loss": -9.995842933654785, "global_step": 119655, "epoch": 712} {"train_loss": -9.972256660461426, "global_step": 119656, "epoch": 712} {"train_loss": -10.222766876220703, "global_step": 119657, "epoch": 712} {"train_loss": -10.131349563598633, "global_step": 119658, "epoch": 712} {"train_loss": -10.210378646850586, "global_step": 119659, "epoch": 712} {"train_loss": -10.286513328552246, "global_step": 119660, "epoch": 712} {"train_loss": -9.981707572937012, "global_step": 119661, "epoch": 712} {"train_loss": -10.022571563720703, "global_step": 119662, "epoch": 712} {"train_loss": -10.26390266418457, "global_step": 119663, "epoch": 712} {"train_loss": -9.738405227661133, "global_step": 119664, "epoch": 712} {"train_loss": -10.069005966186523, "global_step": 119665, "epoch": 712} {"train_loss": -9.946271896362305, "global_step": 119666, "epoch": 712} {"train_loss": -10.062368392944336, "global_step": 119667, "epoch": 712} {"train_loss": -9.918571472167969, "global_step": 119668, "epoch": 712} {"train_loss": -10.138794898986816, "global_step": 119669, "epoch": 712} {"train_loss": -10.084300994873047, "global_step": 119670, "epoch": 712} {"train_loss": -10.171113967895508, "global_step": 119671, "epoch": 712} {"train_loss": -10.154245376586914, "global_step": 119672, "epoch": 712} {"train_loss": -9.96733283996582, "global_step": 119673, "epoch": 712} {"train_loss": -9.985154151916504, "global_step": 119674, "epoch": 712} {"train_loss": -10.2135648727417, "global_step": 119675, "epoch": 712} {"train_loss": -9.909459114074707, "global_step": 119676, "epoch": 712} {"train_loss": -10.010655403137207, "global_step": 119677, "epoch": 712} {"train_loss": -10.235410690307617, "global_step": 119678, "epoch": 712} {"train_loss": -10.217798233032227, "global_step": 119679, "epoch": 712} {"train_loss": -10.12230110168457, "global_step": 119680, "epoch": 712} {"train_loss": -9.809137344360352, "global_step": 119681, "epoch": 712} {"train_loss": -10.490251541137695, "global_step": 119682, "epoch": 712} {"train_loss": -9.45309829711914, "global_step": 119683, "epoch": 712} {"train_loss": -9.992269515991211, "global_step": 119684, "epoch": 712} {"train_loss": -9.841238021850586, "global_step": 119685, "epoch": 712} {"train_loss": -9.490886688232422, "global_step": 119686, "epoch": 712} {"train_loss": -10.179204940795898, "global_step": 119687, "epoch": 712} {"train_loss": -9.964613914489746, "global_step": 119688, "epoch": 712} {"train_loss": -9.658803939819336, "global_step": 119689, "epoch": 712} {"train_loss": -10.168338775634766, "global_step": 119690, "epoch": 712} {"train_loss": -10.042597770690918, "global_step": 119691, "epoch": 712} {"train_loss": -10.190776824951172, "global_step": 119692, "epoch": 712} {"train_loss": -9.840789794921875, "global_step": 119693, "epoch": 712} {"train_loss": -9.925630569458008, "global_step": 119694, "epoch": 712} {"train_loss": -9.79050064086914, "global_step": 119695, "epoch": 712} {"train_loss": -9.916101455688477, "global_step": 119696, "epoch": 712} {"train_loss": -9.846600532531738, "global_step": 119697, "epoch": 712} {"train_loss": -10.12377643585205, "global_step": 119698, "epoch": 712} {"train_loss": -9.807300567626953, "global_step": 119699, "epoch": 712} {"train_loss": -10.276637077331543, "global_step": 119700, "epoch": 712} {"train_loss": -10.10975456237793, "global_step": 119701, "epoch": 712} {"train_loss": -10.115251541137695, "global_step": 119702, "epoch": 712} {"train_loss": -10.380819320678711, "global_step": 119703, "epoch": 712} {"train_loss": -9.813106536865234, "global_step": 119704, "epoch": 712} {"train_loss": -10.273050308227539, "global_step": 119705, "epoch": 712} {"train_loss": -9.877754211425781, "global_step": 119706, "epoch": 712} {"train_loss": -9.908638000488281, "global_step": 119707, "epoch": 712} {"train_loss": -10.164403915405273, "global_step": 119708, "epoch": 712} {"train_loss": -10.009336471557617, "global_step": 119709, "epoch": 712} {"train_loss": -10.273751258850098, "global_step": 119710, "epoch": 712} {"train_loss": -9.744024276733398, "global_step": 119711, "epoch": 712} {"train_loss": -10.258833885192871, "global_step": 119712, "epoch": 712} {"train_loss": -9.941875457763672, "global_step": 119713, "epoch": 712} {"train_loss": -10.233139991760254, "global_step": 119714, "epoch": 712} {"train_loss": -9.687690734863281, "global_step": 119715, "epoch": 712} {"train_loss": -10.120841979980469, "global_step": 119716, "epoch": 712} {"train_loss": -9.907007217407227, "global_step": 119717, "epoch": 712} {"train_loss": -9.948015213012695, "global_step": 119718, "epoch": 712} {"train_loss": -10.196191787719727, "global_step": 119719, "epoch": 712} {"train_loss": -10.324409484863281, "global_step": 119720, "epoch": 712} {"train_loss": -10.253019332885742, "global_step": 119721, "epoch": 712} {"train_loss": -10.075807571411133, "global_step": 119722, "epoch": 712} {"train_loss": -10.19232177734375, "global_step": 119723, "epoch": 712} {"train_loss": -10.060588836669922, "global_step": 119724, "epoch": 712} {"train_loss": -10.238759994506836, "global_step": 119725, "epoch": 712} {"train_loss": -10.084697723388672, "global_step": 119726, "epoch": 712} {"train_loss": -10.437173843383789, "global_step": 119727, "epoch": 712} {"train_loss": -9.764608383178711, "global_step": 119728, "epoch": 712} {"train_loss": -10.03680419921875, "global_step": 119729, "epoch": 712} {"train_loss": -9.9740629196167, "global_step": 119730, "epoch": 712} {"train_loss": -10.024354934692383, "global_step": 119731, "epoch": 712} {"train_loss": -10.399145126342773, "global_step": 119732, "epoch": 712} {"train_loss": -9.441070556640625, "global_step": 119733, "epoch": 712} {"train_loss": -9.904814720153809, "global_step": 119734, "epoch": 712} {"train_loss": -10.00310230255127, "global_step": 119735, "epoch": 712} {"train_loss": -10.110309600830078, "global_step": 119736, "epoch": 712} {"train_loss": -10.213214874267578, "global_step": 119737, "epoch": 712} {"train_loss": -9.503900527954102, "global_step": 119738, "epoch": 712} {"train_loss": -9.760523796081543, "global_step": 119739, "epoch": 712} {"train_loss": -9.819864273071289, "global_step": 119740, "epoch": 712} {"train_loss": -9.757840156555176, "global_step": 119741, "epoch": 712} {"train_loss": -9.695235252380371, "global_step": 119742, "epoch": 712} {"train_loss": -9.666252136230469, "global_step": 119743, "epoch": 712} {"train_loss": -9.874734878540039, "global_step": 119744, "epoch": 712} {"train_loss": -9.344873428344727, "global_step": 119745, "epoch": 712} {"train_loss": -9.899559020996094, "global_step": 119746, "epoch": 712} {"train_loss": -9.698010444641113, "global_step": 119747, "epoch": 712} {"train_loss": -9.417543411254883, "global_step": 119748, "epoch": 712} {"train_loss": -9.794483184814453, "global_step": 119749, "epoch": 712} {"train_loss": -9.844785690307617, "global_step": 119750, "epoch": 712} {"train_loss": -9.807016372680664, "global_step": 119751, "epoch": 712} {"train_loss": -9.745980262756348, "global_step": 119752, "epoch": 712} {"train_loss": -10.11749267578125, "global_step": 119753, "epoch": 712} {"train_loss": -9.738016128540039, "global_step": 119754, "epoch": 712} {"train_loss": -9.789957046508789, "global_step": 119755, "epoch": 712} {"train_loss": -10.067604064941406, "global_step": 119756, "epoch": 712} {"train_loss": -9.669198989868164, "global_step": 119757, "epoch": 712} {"train_loss": -10.106744766235352, "global_step": 119758, "epoch": 712} {"train_loss": -9.915478706359863, "global_step": 119759, "epoch": 712} {"train_loss": -9.843894958496094, "global_step": 119760, "epoch": 712} {"train_loss": -10.179737091064453, "global_step": 119761, "epoch": 712} {"train_loss": -9.738214492797852, "global_step": 119762, "epoch": 712} {"train_loss": -9.831666946411133, "global_step": 119763, "epoch": 712} {"train_loss": -10.247304916381836, "global_step": 119764, "epoch": 712} {"train_loss": -10.192560195922852, "global_step": 119765, "epoch": 712} {"train_loss": -9.852665901184082, "global_step": 119766, "epoch": 712} {"train_loss": -10.27307415008545, "global_step": 119767, "epoch": 712} {"train_loss": -10.125420570373535, "global_step": 119768, "epoch": 712} {"train_loss": -9.966104507446289, "global_step": 119769, "epoch": 712} {"train_loss": -10.089132308959961, "global_step": 119770, "epoch": 712} {"train_loss": -10.20566463470459, "global_step": 119771, "epoch": 712} {"train_loss": -10.23533821105957, "global_step": 119772, "epoch": 712} {"train_loss": -10.167346954345703, "global_step": 119773, "epoch": 712} {"train_loss": -10.266727447509766, "global_step": 119774, "epoch": 712} {"train_loss": -10.127412796020508, "global_step": 119775, "epoch": 712} {"train_loss": -10.259370803833008, "global_step": 119776, "epoch": 712} {"train_loss": -10.341865539550781, "global_step": 119777, "epoch": 712} {"train_loss": -10.260690689086914, "global_step": 119778, "epoch": 712} {"train_loss": -10.460441589355469, "global_step": 119779, "epoch": 712} {"train_loss": -10.133798599243164, "global_step": 119780, "epoch": 712} {"train_loss": -10.404372215270996, "global_step": 119781, "epoch": 712} {"train_loss": -10.185196876525879, "global_step": 119782, "epoch": 712} {"train_loss": -9.993107699212574, "global_step": 119783, "epoch": 712, "val_loss": 214074.921875} {"train_loss": -10.395116806030273, "global_step": 119784, "epoch": 713} {"train_loss": -10.226873397827148, "global_step": 119785, "epoch": 713} {"train_loss": -10.066648483276367, "global_step": 119786, "epoch": 713} {"train_loss": -10.417718887329102, "global_step": 119787, "epoch": 713} {"train_loss": -10.440120697021484, "global_step": 119788, "epoch": 713} {"train_loss": -10.334075927734375, "global_step": 119789, "epoch": 713} {"train_loss": -10.379857063293457, "global_step": 119790, "epoch": 713} {"train_loss": -10.452400207519531, "global_step": 119791, "epoch": 713} {"train_loss": -10.337849617004395, "global_step": 119792, "epoch": 713} {"train_loss": -10.329328536987305, "global_step": 119793, "epoch": 713} {"train_loss": -10.005559921264648, "global_step": 119794, "epoch": 713} {"train_loss": -9.914852142333984, "global_step": 119795, "epoch": 713} {"train_loss": -10.138579368591309, "global_step": 119796, "epoch": 713} {"train_loss": -9.838258743286133, "global_step": 119797, "epoch": 713} {"train_loss": -9.966574668884277, "global_step": 119798, "epoch": 713} {"train_loss": -10.003103256225586, "global_step": 119799, "epoch": 713} {"train_loss": -9.527717590332031, "global_step": 119800, "epoch": 713} {"train_loss": -10.01348876953125, "global_step": 119801, "epoch": 713} {"train_loss": -9.83731746673584, "global_step": 119802, "epoch": 713} {"train_loss": -9.980300903320312, "global_step": 119803, "epoch": 713} {"train_loss": -10.073565483093262, "global_step": 119804, "epoch": 713} {"train_loss": -9.818851470947266, "global_step": 119805, "epoch": 713} {"train_loss": -10.202859878540039, "global_step": 119806, "epoch": 713} {"train_loss": -9.99270248413086, "global_step": 119807, "epoch": 713} {"train_loss": -10.074271202087402, "global_step": 119808, "epoch": 713} {"train_loss": -10.239603042602539, "global_step": 119809, "epoch": 713} {"train_loss": -10.432476043701172, "global_step": 119810, "epoch": 713} {"train_loss": -9.718633651733398, "global_step": 119811, "epoch": 713} {"train_loss": -10.56635856628418, "global_step": 119812, "epoch": 713} {"train_loss": -9.991666793823242, "global_step": 119813, "epoch": 713} {"train_loss": -10.044561386108398, "global_step": 119814, "epoch": 713} {"train_loss": -9.927668571472168, "global_step": 119815, "epoch": 713} {"train_loss": -9.915081024169922, "global_step": 119816, "epoch": 713} {"train_loss": -10.11544418334961, "global_step": 119817, "epoch": 713} {"train_loss": -10.143136978149414, "global_step": 119818, "epoch": 713} {"train_loss": -10.233903884887695, "global_step": 119819, "epoch": 713} {"train_loss": -10.353346824645996, "global_step": 119820, "epoch": 713} {"train_loss": -10.429683685302734, "global_step": 119821, "epoch": 713} {"train_loss": -10.505006790161133, "global_step": 119822, "epoch": 713} {"train_loss": -10.261165618896484, "global_step": 119823, "epoch": 713} {"train_loss": -10.465667724609375, "global_step": 119824, "epoch": 713} {"train_loss": -10.322795867919922, "global_step": 119825, "epoch": 713} {"train_loss": -10.098627090454102, "global_step": 119826, "epoch": 713} {"train_loss": -10.387670516967773, "global_step": 119827, "epoch": 713} {"train_loss": -10.233269691467285, "global_step": 119828, "epoch": 713} {"train_loss": -10.373527526855469, "global_step": 119829, "epoch": 713} {"train_loss": -10.1005220413208, "global_step": 119830, "epoch": 713} {"train_loss": -10.351095199584961, "global_step": 119831, "epoch": 713} {"train_loss": -10.437054634094238, "global_step": 119832, "epoch": 713} {"train_loss": -10.158485412597656, "global_step": 119833, "epoch": 713} {"train_loss": -10.304449081420898, "global_step": 119834, "epoch": 713} {"train_loss": -10.069005966186523, "global_step": 119835, "epoch": 713} {"train_loss": -10.183280944824219, "global_step": 119836, "epoch": 713} {"train_loss": -10.096721649169922, "global_step": 119837, "epoch": 713} {"train_loss": -10.180212020874023, "global_step": 119838, "epoch": 713} {"train_loss": -9.898065567016602, "global_step": 119839, "epoch": 713} {"train_loss": -10.388038635253906, "global_step": 119840, "epoch": 713} {"train_loss": -10.005910873413086, "global_step": 119841, "epoch": 713} {"train_loss": -10.341583251953125, "global_step": 119842, "epoch": 713} {"train_loss": -10.137470245361328, "global_step": 119843, "epoch": 713} {"train_loss": -10.175994873046875, "global_step": 119844, "epoch": 713} {"train_loss": -10.214864730834961, "global_step": 119845, "epoch": 713} {"train_loss": -9.664179801940918, "global_step": 119846, "epoch": 713} {"train_loss": -10.37924575805664, "global_step": 119847, "epoch": 713} {"train_loss": -9.90444564819336, "global_step": 119848, "epoch": 713} {"train_loss": -10.316041946411133, "global_step": 119849, "epoch": 713} {"train_loss": -9.879814147949219, "global_step": 119850, "epoch": 713} {"train_loss": -10.379064559936523, "global_step": 119851, "epoch": 713} {"train_loss": -10.00227165222168, "global_step": 119852, "epoch": 713} {"train_loss": -10.15971565246582, "global_step": 119853, "epoch": 713} {"train_loss": -10.355724334716797, "global_step": 119854, "epoch": 713} {"train_loss": -10.465810775756836, "global_step": 119855, "epoch": 713} {"train_loss": -10.203798294067383, "global_step": 119856, "epoch": 713} {"train_loss": -10.259571075439453, "global_step": 119857, "epoch": 713} {"train_loss": -10.444683074951172, "global_step": 119858, "epoch": 713} {"train_loss": -10.055940628051758, "global_step": 119859, "epoch": 713} {"train_loss": -10.50373649597168, "global_step": 119860, "epoch": 713} {"train_loss": -10.265521049499512, "global_step": 119861, "epoch": 713} {"train_loss": -10.137035369873047, "global_step": 119862, "epoch": 713} {"train_loss": -10.106893539428711, "global_step": 119863, "epoch": 713} {"train_loss": -10.189294815063477, "global_step": 119864, "epoch": 713} {"train_loss": -10.131125450134277, "global_step": 119865, "epoch": 713} {"train_loss": -10.293012619018555, "global_step": 119866, "epoch": 713} {"train_loss": -10.363707542419434, "global_step": 119867, "epoch": 713} {"train_loss": -10.053792953491211, "global_step": 119868, "epoch": 713} {"train_loss": -10.290668487548828, "global_step": 119869, "epoch": 713} {"train_loss": -10.130297660827637, "global_step": 119870, "epoch": 713} {"train_loss": -10.20120906829834, "global_step": 119871, "epoch": 713} {"train_loss": -10.09737491607666, "global_step": 119872, "epoch": 713} {"train_loss": -9.68481731414795, "global_step": 119873, "epoch": 713} {"train_loss": -9.914791107177734, "global_step": 119874, "epoch": 713} {"train_loss": -10.35354232788086, "global_step": 119875, "epoch": 713} {"train_loss": -9.544533729553223, "global_step": 119876, "epoch": 713} {"train_loss": -10.170886993408203, "global_step": 119877, "epoch": 713} {"train_loss": -10.340058326721191, "global_step": 119878, "epoch": 713} {"train_loss": -10.122148513793945, "global_step": 119879, "epoch": 713} {"train_loss": -10.224021911621094, "global_step": 119880, "epoch": 713} {"train_loss": -9.843644142150879, "global_step": 119881, "epoch": 713} {"train_loss": -10.02682113647461, "global_step": 119882, "epoch": 713} {"train_loss": -10.00767707824707, "global_step": 119883, "epoch": 713} {"train_loss": -10.072481155395508, "global_step": 119884, "epoch": 713} {"train_loss": -10.240792274475098, "global_step": 119885, "epoch": 713} {"train_loss": -10.015491485595703, "global_step": 119886, "epoch": 713} {"train_loss": -10.287155151367188, "global_step": 119887, "epoch": 713} {"train_loss": -10.07236385345459, "global_step": 119888, "epoch": 713} {"train_loss": -10.345739364624023, "global_step": 119889, "epoch": 713} {"train_loss": -10.267831802368164, "global_step": 119890, "epoch": 713} {"train_loss": -9.92331314086914, "global_step": 119891, "epoch": 713} {"train_loss": -10.382534980773926, "global_step": 119892, "epoch": 713} {"train_loss": -9.997359275817871, "global_step": 119893, "epoch": 713} {"train_loss": -10.501541137695312, "global_step": 119894, "epoch": 713} {"train_loss": -10.254348754882812, "global_step": 119895, "epoch": 713} {"train_loss": -10.223865509033203, "global_step": 119896, "epoch": 713} {"train_loss": -9.7212495803833, "global_step": 119897, "epoch": 713} {"train_loss": -10.352041244506836, "global_step": 119898, "epoch": 713} {"train_loss": -10.096267700195312, "global_step": 119899, "epoch": 713} {"train_loss": -10.128767013549805, "global_step": 119900, "epoch": 713} {"train_loss": -10.262258529663086, "global_step": 119901, "epoch": 713} {"train_loss": -10.116571426391602, "global_step": 119902, "epoch": 713} {"train_loss": -9.869322776794434, "global_step": 119903, "epoch": 713} {"train_loss": -10.322930335998535, "global_step": 119904, "epoch": 713} {"train_loss": -10.353548049926758, "global_step": 119905, "epoch": 713} {"train_loss": -10.197905540466309, "global_step": 119906, "epoch": 713} {"train_loss": -10.337390899658203, "global_step": 119907, "epoch": 713} {"train_loss": -10.0423583984375, "global_step": 119908, "epoch": 713} {"train_loss": -10.077651023864746, "global_step": 119909, "epoch": 713} {"train_loss": -10.318381309509277, "global_step": 119910, "epoch": 713} {"train_loss": -10.109731674194336, "global_step": 119911, "epoch": 713} {"train_loss": -10.448980331420898, "global_step": 119912, "epoch": 713} {"train_loss": -9.978584289550781, "global_step": 119913, "epoch": 713} {"train_loss": -10.289590835571289, "global_step": 119914, "epoch": 713} {"train_loss": -10.039862632751465, "global_step": 119915, "epoch": 713} {"train_loss": -9.735916137695312, "global_step": 119916, "epoch": 713} {"train_loss": -9.897260665893555, "global_step": 119917, "epoch": 713} {"train_loss": -10.279035568237305, "global_step": 119918, "epoch": 713} {"train_loss": -9.753950119018555, "global_step": 119919, "epoch": 713} {"train_loss": -9.958972930908203, "global_step": 119920, "epoch": 713} {"train_loss": -10.258967399597168, "global_step": 119921, "epoch": 713} {"train_loss": -9.624090194702148, "global_step": 119922, "epoch": 713} {"train_loss": -10.108423233032227, "global_step": 119923, "epoch": 713} {"train_loss": -9.13797664642334, "global_step": 119924, "epoch": 713} {"train_loss": -10.099533081054688, "global_step": 119925, "epoch": 713} {"train_loss": -10.034611701965332, "global_step": 119926, "epoch": 713} {"train_loss": -9.98423957824707, "global_step": 119927, "epoch": 713} {"train_loss": -9.819892883300781, "global_step": 119928, "epoch": 713} {"train_loss": -9.982433319091797, "global_step": 119929, "epoch": 713} {"train_loss": -10.149818420410156, "global_step": 119930, "epoch": 713} {"train_loss": -9.866754531860352, "global_step": 119931, "epoch": 713} {"train_loss": -10.236055374145508, "global_step": 119932, "epoch": 713} {"train_loss": -10.055265426635742, "global_step": 119933, "epoch": 713} {"train_loss": -10.227006912231445, "global_step": 119934, "epoch": 713} {"train_loss": -10.416531562805176, "global_step": 119935, "epoch": 713} {"train_loss": -10.162208557128906, "global_step": 119936, "epoch": 713} {"train_loss": -10.40645694732666, "global_step": 119937, "epoch": 713} {"train_loss": -10.186424255371094, "global_step": 119938, "epoch": 713} {"train_loss": -10.149681091308594, "global_step": 119939, "epoch": 713} {"train_loss": -10.530029296875, "global_step": 119940, "epoch": 713} {"train_loss": -10.07751178741455, "global_step": 119941, "epoch": 713} {"train_loss": -10.272913932800293, "global_step": 119942, "epoch": 713} {"train_loss": -10.225500106811523, "global_step": 119943, "epoch": 713} {"train_loss": -10.142013549804688, "global_step": 119944, "epoch": 713} {"train_loss": -10.261659622192383, "global_step": 119945, "epoch": 713} {"train_loss": -10.346578598022461, "global_step": 119946, "epoch": 713} {"train_loss": -10.05301570892334, "global_step": 119947, "epoch": 713} {"train_loss": -10.315834045410156, "global_step": 119948, "epoch": 713} {"train_loss": -10.262852668762207, "global_step": 119949, "epoch": 713} {"train_loss": -10.222557067871094, "global_step": 119950, "epoch": 713} {"train_loss": -10.147708853085836, "global_step": 119951, "epoch": 713, "val_loss": 213816.296875} {"train_loss": -9.728261947631836, "global_step": 119952, "epoch": 714} {"train_loss": -10.21707534790039, "global_step": 119953, "epoch": 714} {"train_loss": -10.111719131469727, "global_step": 119954, "epoch": 714} {"train_loss": -10.223352432250977, "global_step": 119955, "epoch": 714} {"train_loss": -10.249101638793945, "global_step": 119956, "epoch": 714} {"train_loss": -10.268269538879395, "global_step": 119957, "epoch": 714} {"train_loss": -10.408210754394531, "global_step": 119958, "epoch": 714} {"train_loss": -10.474700927734375, "global_step": 119959, "epoch": 714} {"train_loss": -10.391618728637695, "global_step": 119960, "epoch": 714} {"train_loss": -10.306695938110352, "global_step": 119961, "epoch": 714} {"train_loss": -10.2095365524292, "global_step": 119962, "epoch": 714} {"train_loss": -10.225299835205078, "global_step": 119963, "epoch": 714} {"train_loss": -10.077817916870117, "global_step": 119964, "epoch": 714} {"train_loss": -10.257413864135742, "global_step": 119965, "epoch": 714} {"train_loss": -9.761251449584961, "global_step": 119966, "epoch": 714} {"train_loss": -10.364399909973145, "global_step": 119967, "epoch": 714} {"train_loss": -10.191197395324707, "global_step": 119968, "epoch": 714} {"train_loss": -9.951248168945312, "global_step": 119969, "epoch": 714} {"train_loss": -10.101471900939941, "global_step": 119970, "epoch": 714} {"train_loss": -10.036031723022461, "global_step": 119971, "epoch": 714} {"train_loss": -9.699102401733398, "global_step": 119972, "epoch": 714} {"train_loss": -9.80369758605957, "global_step": 119973, "epoch": 714} {"train_loss": -10.336305618286133, "global_step": 119974, "epoch": 714} {"train_loss": -10.140475273132324, "global_step": 119975, "epoch": 714} {"train_loss": -10.126821517944336, "global_step": 119976, "epoch": 714} {"train_loss": -9.790287017822266, "global_step": 119977, "epoch": 714} {"train_loss": -10.009531021118164, "global_step": 119978, "epoch": 714} {"train_loss": -9.90210247039795, "global_step": 119979, "epoch": 714} {"train_loss": -9.939984321594238, "global_step": 119980, "epoch": 714} {"train_loss": -10.162786483764648, "global_step": 119981, "epoch": 714} {"train_loss": -10.015005111694336, "global_step": 119982, "epoch": 714} {"train_loss": -10.266568183898926, "global_step": 119983, "epoch": 714} {"train_loss": -10.056304931640625, "global_step": 119984, "epoch": 714} {"train_loss": -10.210158348083496, "global_step": 119985, "epoch": 714} {"train_loss": -10.230524063110352, "global_step": 119986, "epoch": 714} {"train_loss": -9.847074508666992, "global_step": 119987, "epoch": 714} {"train_loss": -10.109334945678711, "global_step": 119988, "epoch": 714} {"train_loss": -10.054847717285156, "global_step": 119989, "epoch": 714} {"train_loss": -10.011377334594727, "global_step": 119990, "epoch": 714} {"train_loss": -10.10727310180664, "global_step": 119991, "epoch": 714} {"train_loss": -10.419578552246094, "global_step": 119992, "epoch": 714} {"train_loss": -10.018774032592773, "global_step": 119993, "epoch": 714} {"train_loss": -10.269777297973633, "global_step": 119994, "epoch": 714} {"train_loss": -10.124849319458008, "global_step": 119995, "epoch": 714} {"train_loss": -10.026535034179688, "global_step": 119996, "epoch": 714} {"train_loss": -10.345229148864746, "global_step": 119997, "epoch": 714} {"train_loss": -10.134875297546387, "global_step": 119998, "epoch": 714} {"train_loss": -10.455056190490723, "global_step": 119999, "epoch": 714} {"train_loss": -10.049386024475098, "global_step": 120000, "epoch": 714} {"train_loss": -10.281774520874023, "global_step": 120001, "epoch": 714} {"train_loss": -9.97125244140625, "global_step": 120002, "epoch": 714} {"train_loss": -10.249343872070312, "global_step": 120003, "epoch": 714} {"train_loss": -10.365142822265625, "global_step": 120004, "epoch": 714} {"train_loss": -9.78433895111084, "global_step": 120005, "epoch": 714} {"train_loss": -10.418612480163574, "global_step": 120006, "epoch": 714} {"train_loss": -10.074396133422852, "global_step": 120007, "epoch": 714} {"train_loss": -10.405776977539062, "global_step": 120008, "epoch": 714} {"train_loss": -10.022064208984375, "global_step": 120009, "epoch": 714} {"train_loss": -10.144608497619629, "global_step": 120010, "epoch": 714} {"train_loss": -10.065788269042969, "global_step": 120011, "epoch": 714} {"train_loss": -10.107177734375, "global_step": 120012, "epoch": 714} {"train_loss": -10.343629837036133, "global_step": 120013, "epoch": 714} {"train_loss": -9.974618911743164, "global_step": 120014, "epoch": 714} {"train_loss": -10.32258415222168, "global_step": 120015, "epoch": 714} {"train_loss": -10.075929641723633, "global_step": 120016, "epoch": 714} {"train_loss": -10.249185562133789, "global_step": 120017, "epoch": 714} {"train_loss": -10.239272117614746, "global_step": 120018, "epoch": 714} {"train_loss": -10.093584060668945, "global_step": 120019, "epoch": 714} {"train_loss": -10.3662691116333, "global_step": 120020, "epoch": 714} {"train_loss": -10.152052879333496, "global_step": 120021, "epoch": 714} {"train_loss": -10.268229484558105, "global_step": 120022, "epoch": 714} {"train_loss": -10.151176452636719, "global_step": 120023, "epoch": 714} {"train_loss": -10.103514671325684, "global_step": 120024, "epoch": 714} {"train_loss": -10.025346755981445, "global_step": 120025, "epoch": 714} {"train_loss": -10.321650505065918, "global_step": 120026, "epoch": 714} {"train_loss": -10.025968551635742, "global_step": 120027, "epoch": 714} {"train_loss": -9.941015243530273, "global_step": 120028, "epoch": 714} {"train_loss": -10.447697639465332, "global_step": 120029, "epoch": 714} {"train_loss": -9.867815017700195, "global_step": 120030, "epoch": 714} {"train_loss": -10.338414192199707, "global_step": 120031, "epoch": 714} {"train_loss": -10.000378608703613, "global_step": 120032, "epoch": 714} {"train_loss": -9.970430374145508, "global_step": 120033, "epoch": 714} {"train_loss": -10.308064460754395, "global_step": 120034, "epoch": 714} {"train_loss": -10.071362495422363, "global_step": 120035, "epoch": 714} {"train_loss": -10.265830039978027, "global_step": 120036, "epoch": 714} {"train_loss": -10.104982376098633, "global_step": 120037, "epoch": 714} {"train_loss": -10.21241569519043, "global_step": 120038, "epoch": 714} {"train_loss": -9.89700698852539, "global_step": 120039, "epoch": 714} {"train_loss": -9.850704193115234, "global_step": 120040, "epoch": 714} {"train_loss": -9.810776710510254, "global_step": 120041, "epoch": 714} {"train_loss": -9.481204986572266, "global_step": 120042, "epoch": 714} {"train_loss": -10.43423080444336, "global_step": 120043, "epoch": 714} {"train_loss": -9.400545120239258, "global_step": 120044, "epoch": 714} {"train_loss": -10.00031852722168, "global_step": 120045, "epoch": 714} {"train_loss": -9.698932647705078, "global_step": 120046, "epoch": 714} {"train_loss": -9.92241096496582, "global_step": 120047, "epoch": 714} {"train_loss": -9.499655723571777, "global_step": 120048, "epoch": 714} {"train_loss": -9.517858505249023, "global_step": 120049, "epoch": 714} {"train_loss": -9.507994651794434, "global_step": 120050, "epoch": 714} {"train_loss": -9.256590843200684, "global_step": 120051, "epoch": 714} {"train_loss": -9.135711669921875, "global_step": 120052, "epoch": 714} {"train_loss": -9.255587577819824, "global_step": 120053, "epoch": 714} {"train_loss": -9.590362548828125, "global_step": 120054, "epoch": 714} {"train_loss": -9.126432418823242, "global_step": 120055, "epoch": 714} {"train_loss": -9.608884811401367, "global_step": 120056, "epoch": 714} {"train_loss": -9.925514221191406, "global_step": 120057, "epoch": 714} {"train_loss": -9.694976806640625, "global_step": 120058, "epoch": 714} {"train_loss": -9.6470308303833, "global_step": 120059, "epoch": 714} {"train_loss": -10.282588958740234, "global_step": 120060, "epoch": 714} {"train_loss": -9.798247337341309, "global_step": 120061, "epoch": 714} {"train_loss": -9.741920471191406, "global_step": 120062, "epoch": 714} {"train_loss": -9.871367454528809, "global_step": 120063, "epoch": 714} {"train_loss": -9.975763320922852, "global_step": 120064, "epoch": 714} {"train_loss": -9.80880355834961, "global_step": 120065, "epoch": 714} {"train_loss": -9.801803588867188, "global_step": 120066, "epoch": 714} {"train_loss": -9.876067161560059, "global_step": 120067, "epoch": 714} {"train_loss": -10.136337280273438, "global_step": 120068, "epoch": 714} {"train_loss": -9.417824745178223, "global_step": 120069, "epoch": 714} {"train_loss": -10.116724967956543, "global_step": 120070, "epoch": 714} {"train_loss": -9.787376403808594, "global_step": 120071, "epoch": 714} {"train_loss": -9.577467918395996, "global_step": 120072, "epoch": 714} {"train_loss": -10.085538864135742, "global_step": 120073, "epoch": 714} {"train_loss": -9.913492202758789, "global_step": 120074, "epoch": 714} {"train_loss": -10.164013862609863, "global_step": 120075, "epoch": 714} {"train_loss": -10.012454986572266, "global_step": 120076, "epoch": 714} {"train_loss": -10.073930740356445, "global_step": 120077, "epoch": 714} {"train_loss": -10.143056869506836, "global_step": 120078, "epoch": 714} {"train_loss": -10.120271682739258, "global_step": 120079, "epoch": 714} {"train_loss": -10.00652027130127, "global_step": 120080, "epoch": 714} {"train_loss": -10.181775093078613, "global_step": 120081, "epoch": 714} {"train_loss": -9.993961334228516, "global_step": 120082, "epoch": 714} {"train_loss": -10.280464172363281, "global_step": 120083, "epoch": 714} {"train_loss": -10.072317123413086, "global_step": 120084, "epoch": 714} {"train_loss": -10.327566146850586, "global_step": 120085, "epoch": 714} {"train_loss": -10.487154960632324, "global_step": 120086, "epoch": 714} {"train_loss": -10.352039337158203, "global_step": 120087, "epoch": 714} {"train_loss": -10.47971248626709, "global_step": 120088, "epoch": 714} {"train_loss": -10.500713348388672, "global_step": 120089, "epoch": 714} {"train_loss": -10.303544998168945, "global_step": 120090, "epoch": 714} {"train_loss": -10.555612564086914, "global_step": 120091, "epoch": 714} {"train_loss": -10.414046287536621, "global_step": 120092, "epoch": 714} {"train_loss": -10.319778442382812, "global_step": 120093, "epoch": 714} {"train_loss": -10.640335083007812, "global_step": 120094, "epoch": 714} {"train_loss": -10.599867820739746, "global_step": 120095, "epoch": 714} {"train_loss": -10.429132461547852, "global_step": 120096, "epoch": 714} {"train_loss": -10.602046966552734, "global_step": 120097, "epoch": 714} {"train_loss": -10.44115161895752, "global_step": 120098, "epoch": 714} {"train_loss": -10.26443862915039, "global_step": 120099, "epoch": 714} {"train_loss": -10.505945205688477, "global_step": 120100, "epoch": 714} {"train_loss": -10.478107452392578, "global_step": 120101, "epoch": 714} {"train_loss": -10.488255500793457, "global_step": 120102, "epoch": 714} {"train_loss": -10.407907485961914, "global_step": 120103, "epoch": 714} {"train_loss": -10.657092094421387, "global_step": 120104, "epoch": 714} {"train_loss": -10.469348907470703, "global_step": 120105, "epoch": 714} {"train_loss": -10.23460578918457, "global_step": 120106, "epoch": 714} {"train_loss": -10.510083198547363, "global_step": 120107, "epoch": 714} {"train_loss": -10.309274673461914, "global_step": 120108, "epoch": 714} {"train_loss": -10.585351943969727, "global_step": 120109, "epoch": 714} {"train_loss": -9.889315605163574, "global_step": 120110, "epoch": 714} {"train_loss": -9.787751197814941, "global_step": 120111, "epoch": 714} {"train_loss": -9.797769546508789, "global_step": 120112, "epoch": 714} {"train_loss": -9.207113265991211, "global_step": 120113, "epoch": 714} {"train_loss": -9.813611030578613, "global_step": 120114, "epoch": 714} {"train_loss": -9.79425048828125, "global_step": 120115, "epoch": 714} {"train_loss": -9.018155097961426, "global_step": 120116, "epoch": 714} {"train_loss": -9.881490707397461, "global_step": 120117, "epoch": 714} {"train_loss": -9.215725898742676, "global_step": 120118, "epoch": 714} {"train_loss": -10.068818080992926, "global_step": 120119, "epoch": 714, "val_loss": 214052.78125} {"train_loss": -9.816665649414062, "global_step": 120120, "epoch": 715} {"train_loss": -9.900707244873047, "global_step": 120121, "epoch": 715} {"train_loss": -9.573387145996094, "global_step": 120122, "epoch": 715} {"train_loss": -10.078910827636719, "global_step": 120123, "epoch": 715} {"train_loss": -9.632108688354492, "global_step": 120124, "epoch": 715} {"train_loss": -9.961261749267578, "global_step": 120125, "epoch": 715} {"train_loss": -9.449758529663086, "global_step": 120126, "epoch": 715} {"train_loss": -9.872089385986328, "global_step": 120127, "epoch": 715} {"train_loss": -8.99512767791748, "global_step": 120128, "epoch": 715} {"train_loss": -9.764581680297852, "global_step": 120129, "epoch": 715} {"train_loss": -8.981576919555664, "global_step": 120130, "epoch": 715} {"train_loss": -9.563117980957031, "global_step": 120131, "epoch": 715} {"train_loss": -9.782703399658203, "global_step": 120132, "epoch": 715} {"train_loss": -9.582846641540527, "global_step": 120133, "epoch": 715} {"train_loss": -10.059812545776367, "global_step": 120134, "epoch": 715} {"train_loss": -10.121917724609375, "global_step": 120135, "epoch": 715} {"train_loss": -9.934940338134766, "global_step": 120136, "epoch": 715} {"train_loss": -9.778715133666992, "global_step": 120137, "epoch": 715} {"train_loss": -9.898028373718262, "global_step": 120138, "epoch": 715} {"train_loss": -9.731106758117676, "global_step": 120139, "epoch": 715} {"train_loss": -10.136950492858887, "global_step": 120140, "epoch": 715} {"train_loss": -9.993358612060547, "global_step": 120141, "epoch": 715} {"train_loss": -9.889869689941406, "global_step": 120142, "epoch": 715} {"train_loss": -9.745147705078125, "global_step": 120143, "epoch": 715} {"train_loss": -10.234980583190918, "global_step": 120144, "epoch": 715} {"train_loss": -9.9336576461792, "global_step": 120145, "epoch": 715} {"train_loss": -9.794729232788086, "global_step": 120146, "epoch": 715} {"train_loss": -9.845197677612305, "global_step": 120147, "epoch": 715} {"train_loss": -9.85597038269043, "global_step": 120148, "epoch": 715} {"train_loss": -9.889527320861816, "global_step": 120149, "epoch": 715} {"train_loss": -9.766571044921875, "global_step": 120150, "epoch": 715} {"train_loss": -9.921552658081055, "global_step": 120151, "epoch": 715} {"train_loss": -9.972524642944336, "global_step": 120152, "epoch": 715} {"train_loss": -10.108943939208984, "global_step": 120153, "epoch": 715} {"train_loss": -10.006036758422852, "global_step": 120154, "epoch": 715} {"train_loss": -10.108686447143555, "global_step": 120155, "epoch": 715} {"train_loss": -10.054834365844727, "global_step": 120156, "epoch": 715} {"train_loss": -9.880717277526855, "global_step": 120157, "epoch": 715} {"train_loss": -10.295036315917969, "global_step": 120158, "epoch": 715} {"train_loss": -10.032913208007812, "global_step": 120159, "epoch": 715} {"train_loss": -10.251045227050781, "global_step": 120160, "epoch": 715} {"train_loss": -10.356283187866211, "global_step": 120161, "epoch": 715} {"train_loss": -10.157997131347656, "global_step": 120162, "epoch": 715} {"train_loss": -10.196870803833008, "global_step": 120163, "epoch": 715} {"train_loss": -10.301825523376465, "global_step": 120164, "epoch": 715} {"train_loss": -10.050613403320312, "global_step": 120165, "epoch": 715} {"train_loss": -10.171476364135742, "global_step": 120166, "epoch": 715} {"train_loss": -10.046177864074707, "global_step": 120167, "epoch": 715} {"train_loss": -10.260660171508789, "global_step": 120168, "epoch": 715} {"train_loss": -10.309122085571289, "global_step": 120169, "epoch": 715} {"train_loss": -10.538565635681152, "global_step": 120170, "epoch": 715} {"train_loss": -10.335694313049316, "global_step": 120171, "epoch": 715} {"train_loss": -10.358417510986328, "global_step": 120172, "epoch": 715} {"train_loss": -10.293289184570312, "global_step": 120173, "epoch": 715} {"train_loss": -10.358012199401855, "global_step": 120174, "epoch": 715} {"train_loss": -10.19856071472168, "global_step": 120175, "epoch": 715} {"train_loss": -10.404439926147461, "global_step": 120176, "epoch": 715} {"train_loss": -10.094184875488281, "global_step": 120177, "epoch": 715} {"train_loss": -10.379249572753906, "global_step": 120178, "epoch": 715} {"train_loss": -10.391349792480469, "global_step": 120179, "epoch": 715} {"train_loss": -10.443870544433594, "global_step": 120180, "epoch": 715} {"train_loss": -10.471240997314453, "global_step": 120181, "epoch": 715} {"train_loss": -10.268362045288086, "global_step": 120182, "epoch": 715} {"train_loss": -10.235516548156738, "global_step": 120183, "epoch": 715} {"train_loss": -10.538670539855957, "global_step": 120184, "epoch": 715} {"train_loss": -10.137134552001953, "global_step": 120185, "epoch": 715} {"train_loss": -10.530990600585938, "global_step": 120186, "epoch": 715} {"train_loss": -10.436683654785156, "global_step": 120187, "epoch": 715} {"train_loss": -10.35091781616211, "global_step": 120188, "epoch": 715} {"train_loss": -10.237253189086914, "global_step": 120189, "epoch": 715} {"train_loss": -10.41248607635498, "global_step": 120190, "epoch": 715} {"train_loss": -10.056929588317871, "global_step": 120191, "epoch": 715} {"train_loss": -9.99416732788086, "global_step": 120192, "epoch": 715} {"train_loss": -10.273479461669922, "global_step": 120193, "epoch": 715} {"train_loss": -10.24526309967041, "global_step": 120194, "epoch": 715} {"train_loss": -9.779897689819336, "global_step": 120195, "epoch": 715} {"train_loss": -10.191169738769531, "global_step": 120196, "epoch": 715} {"train_loss": -10.16937255859375, "global_step": 120197, "epoch": 715} {"train_loss": -10.117964744567871, "global_step": 120198, "epoch": 715} {"train_loss": -10.26150894165039, "global_step": 120199, "epoch": 715} {"train_loss": -9.825078964233398, "global_step": 120200, "epoch": 715} {"train_loss": -10.359899520874023, "global_step": 120201, "epoch": 715} {"train_loss": -9.970444679260254, "global_step": 120202, "epoch": 715} {"train_loss": -9.62521743774414, "global_step": 120203, "epoch": 715} {"train_loss": -10.246585845947266, "global_step": 120204, "epoch": 715} {"train_loss": -9.765260696411133, "global_step": 120205, "epoch": 715} {"train_loss": -10.333162307739258, "global_step": 120206, "epoch": 715} {"train_loss": -10.162222862243652, "global_step": 120207, "epoch": 715} {"train_loss": -10.123976707458496, "global_step": 120208, "epoch": 715} {"train_loss": -9.912789344787598, "global_step": 120209, "epoch": 715} {"train_loss": -9.699413299560547, "global_step": 120210, "epoch": 715} {"train_loss": -10.096786499023438, "global_step": 120211, "epoch": 715} {"train_loss": -9.635769844055176, "global_step": 120212, "epoch": 715} {"train_loss": -10.23282527923584, "global_step": 120213, "epoch": 715} {"train_loss": -9.764493942260742, "global_step": 120214, "epoch": 715} {"train_loss": -10.343717575073242, "global_step": 120215, "epoch": 715} {"train_loss": -9.987534523010254, "global_step": 120216, "epoch": 715} {"train_loss": -10.281170845031738, "global_step": 120217, "epoch": 715} {"train_loss": -9.95076847076416, "global_step": 120218, "epoch": 715} {"train_loss": -10.23415756225586, "global_step": 120219, "epoch": 715} {"train_loss": -10.14003849029541, "global_step": 120220, "epoch": 715} {"train_loss": -10.022221565246582, "global_step": 120221, "epoch": 715} {"train_loss": -10.000782012939453, "global_step": 120222, "epoch": 715} {"train_loss": -10.00484848022461, "global_step": 120223, "epoch": 715} {"train_loss": -9.931722640991211, "global_step": 120224, "epoch": 715} {"train_loss": -10.11541748046875, "global_step": 120225, "epoch": 715} {"train_loss": -10.0294771194458, "global_step": 120226, "epoch": 715} {"train_loss": -10.08500862121582, "global_step": 120227, "epoch": 715} {"train_loss": -10.198328018188477, "global_step": 120228, "epoch": 715} {"train_loss": -10.235901832580566, "global_step": 120229, "epoch": 715} {"train_loss": -10.105430603027344, "global_step": 120230, "epoch": 715} {"train_loss": -10.226673126220703, "global_step": 120231, "epoch": 715} {"train_loss": -10.269132614135742, "global_step": 120232, "epoch": 715} {"train_loss": -10.086122512817383, "global_step": 120233, "epoch": 715} {"train_loss": -10.336725234985352, "global_step": 120234, "epoch": 715} {"train_loss": -10.158896446228027, "global_step": 120235, "epoch": 715} {"train_loss": -10.210415840148926, "global_step": 120236, "epoch": 715} {"train_loss": -10.190732955932617, "global_step": 120237, "epoch": 715} {"train_loss": -10.111968040466309, "global_step": 120238, "epoch": 715} {"train_loss": -10.061479568481445, "global_step": 120239, "epoch": 715} {"train_loss": -10.172100067138672, "global_step": 120240, "epoch": 715} {"train_loss": -10.164155960083008, "global_step": 120241, "epoch": 715} {"train_loss": -10.232156753540039, "global_step": 120242, "epoch": 715} {"train_loss": -9.961830139160156, "global_step": 120243, "epoch": 715} {"train_loss": -10.101244926452637, "global_step": 120244, "epoch": 715} {"train_loss": -10.014023780822754, "global_step": 120245, "epoch": 715} {"train_loss": -10.228704452514648, "global_step": 120246, "epoch": 715} {"train_loss": -10.169795989990234, "global_step": 120247, "epoch": 715} {"train_loss": -10.127705574035645, "global_step": 120248, "epoch": 715} {"train_loss": -10.412398338317871, "global_step": 120249, "epoch": 715} {"train_loss": -9.956659317016602, "global_step": 120250, "epoch": 715} {"train_loss": -10.381391525268555, "global_step": 120251, "epoch": 715} {"train_loss": -10.231122970581055, "global_step": 120252, "epoch": 715} {"train_loss": -10.334930419921875, "global_step": 120253, "epoch": 715} {"train_loss": -10.213687896728516, "global_step": 120254, "epoch": 715} {"train_loss": -10.267004013061523, "global_step": 120255, "epoch": 715} {"train_loss": -10.15230941772461, "global_step": 120256, "epoch": 715} {"train_loss": -10.251659393310547, "global_step": 120257, "epoch": 715} {"train_loss": -10.063949584960938, "global_step": 120258, "epoch": 715} {"train_loss": -10.190340042114258, "global_step": 120259, "epoch": 715} {"train_loss": -10.362752914428711, "global_step": 120260, "epoch": 715} {"train_loss": -9.959922790527344, "global_step": 120261, "epoch": 715} {"train_loss": -10.183842658996582, "global_step": 120262, "epoch": 715} {"train_loss": -10.244000434875488, "global_step": 120263, "epoch": 715} {"train_loss": -10.29935073852539, "global_step": 120264, "epoch": 715} {"train_loss": -10.184581756591797, "global_step": 120265, "epoch": 715} {"train_loss": -10.200364112854004, "global_step": 120266, "epoch": 715} {"train_loss": -10.271382331848145, "global_step": 120267, "epoch": 715} {"train_loss": -10.258590698242188, "global_step": 120268, "epoch": 715} {"train_loss": -10.153273582458496, "global_step": 120269, "epoch": 715} {"train_loss": -10.199054718017578, "global_step": 120270, "epoch": 715} {"train_loss": -10.050193786621094, "global_step": 120271, "epoch": 715} {"train_loss": -9.91175651550293, "global_step": 120272, "epoch": 715} {"train_loss": -10.290019035339355, "global_step": 120273, "epoch": 715} {"train_loss": -10.168044090270996, "global_step": 120274, "epoch": 715} {"train_loss": -9.958585739135742, "global_step": 120275, "epoch": 715} {"train_loss": -10.371631622314453, "global_step": 120276, "epoch": 715} {"train_loss": -10.230207443237305, "global_step": 120277, "epoch": 715} {"train_loss": -10.55129623413086, "global_step": 120278, "epoch": 715} {"train_loss": -10.567047119140625, "global_step": 120279, "epoch": 715} {"train_loss": -10.276407241821289, "global_step": 120280, "epoch": 715} {"train_loss": -10.38711929321289, "global_step": 120281, "epoch": 715} {"train_loss": -10.166879653930664, "global_step": 120282, "epoch": 715} {"train_loss": -10.303425788879395, "global_step": 120283, "epoch": 715} {"train_loss": -10.190637588500977, "global_step": 120284, "epoch": 715} {"train_loss": -10.361734390258789, "global_step": 120285, "epoch": 715} {"train_loss": -10.390689849853516, "global_step": 120286, "epoch": 715} {"train_loss": -10.107385124479022, "global_step": 120287, "epoch": 715, "val_loss": 214899.1875, "train_action_mse_error": 2.327949285507202} {"train_loss": -10.49651050567627, "global_step": 120288, "epoch": 716} {"train_loss": -10.222715377807617, "global_step": 120289, "epoch": 716} {"train_loss": -10.573396682739258, "global_step": 120290, "epoch": 716} {"train_loss": -10.459640502929688, "global_step": 120291, "epoch": 716} {"train_loss": -10.238994598388672, "global_step": 120292, "epoch": 716} {"train_loss": -10.441916465759277, "global_step": 120293, "epoch": 716} {"train_loss": -10.128820419311523, "global_step": 120294, "epoch": 716} {"train_loss": -10.295759201049805, "global_step": 120295, "epoch": 716} {"train_loss": -10.320589065551758, "global_step": 120296, "epoch": 716} {"train_loss": -10.024860382080078, "global_step": 120297, "epoch": 716} {"train_loss": -10.412428855895996, "global_step": 120298, "epoch": 716} {"train_loss": -10.086483001708984, "global_step": 120299, "epoch": 716} {"train_loss": -10.108797073364258, "global_step": 120300, "epoch": 716} {"train_loss": -10.3751220703125, "global_step": 120301, "epoch": 716} {"train_loss": -9.894416809082031, "global_step": 120302, "epoch": 716} {"train_loss": -10.2819185256958, "global_step": 120303, "epoch": 716} {"train_loss": -9.909043312072754, "global_step": 120304, "epoch": 716} {"train_loss": -10.180534362792969, "global_step": 120305, "epoch": 716} {"train_loss": -10.424514770507812, "global_step": 120306, "epoch": 716} {"train_loss": -9.846202850341797, "global_step": 120307, "epoch": 716} {"train_loss": -10.131778717041016, "global_step": 120308, "epoch": 716} {"train_loss": -10.103729248046875, "global_step": 120309, "epoch": 716} {"train_loss": -10.018378257751465, "global_step": 120310, "epoch": 716} {"train_loss": -9.992523193359375, "global_step": 120311, "epoch": 716} {"train_loss": -9.952079772949219, "global_step": 120312, "epoch": 716} {"train_loss": -9.898804664611816, "global_step": 120313, "epoch": 716} {"train_loss": -9.4404878616333, "global_step": 120314, "epoch": 716} {"train_loss": -9.969463348388672, "global_step": 120315, "epoch": 716} {"train_loss": -9.32602596282959, "global_step": 120316, "epoch": 716} {"train_loss": -10.163045883178711, "global_step": 120317, "epoch": 716} {"train_loss": -9.511232376098633, "global_step": 120318, "epoch": 716} {"train_loss": -9.75476360321045, "global_step": 120319, "epoch": 716} {"train_loss": -9.662866592407227, "global_step": 120320, "epoch": 716} {"train_loss": -9.672309875488281, "global_step": 120321, "epoch": 716} {"train_loss": -9.689321517944336, "global_step": 120322, "epoch": 716} {"train_loss": -9.981834411621094, "global_step": 120323, "epoch": 716} {"train_loss": -9.628843307495117, "global_step": 120324, "epoch": 716} {"train_loss": -9.887062072753906, "global_step": 120325, "epoch": 716} {"train_loss": -9.75729751586914, "global_step": 120326, "epoch": 716} {"train_loss": -9.355944633483887, "global_step": 120327, "epoch": 716} {"train_loss": -9.938028335571289, "global_step": 120328, "epoch": 716} {"train_loss": -9.716796875, "global_step": 120329, "epoch": 716} {"train_loss": -9.615644454956055, "global_step": 120330, "epoch": 716} {"train_loss": -10.044769287109375, "global_step": 120331, "epoch": 716} {"train_loss": -9.760231018066406, "global_step": 120332, "epoch": 716} {"train_loss": -10.077024459838867, "global_step": 120333, "epoch": 716} {"train_loss": -9.786081314086914, "global_step": 120334, "epoch": 716} {"train_loss": -10.164169311523438, "global_step": 120335, "epoch": 716} {"train_loss": -9.940978050231934, "global_step": 120336, "epoch": 716} {"train_loss": -10.103021621704102, "global_step": 120337, "epoch": 716} {"train_loss": -9.921961784362793, "global_step": 120338, "epoch": 716} {"train_loss": -10.073648452758789, "global_step": 120339, "epoch": 716} {"train_loss": -10.193780899047852, "global_step": 120340, "epoch": 716} {"train_loss": -10.11337661743164, "global_step": 120341, "epoch": 716} {"train_loss": -10.242950439453125, "global_step": 120342, "epoch": 716} {"train_loss": -10.081795692443848, "global_step": 120343, "epoch": 716} {"train_loss": -10.210153579711914, "global_step": 120344, "epoch": 716} {"train_loss": -10.199893951416016, "global_step": 120345, "epoch": 716} {"train_loss": -10.313151359558105, "global_step": 120346, "epoch": 716} {"train_loss": -10.294888496398926, "global_step": 120347, "epoch": 716} {"train_loss": -10.198200225830078, "global_step": 120348, "epoch": 716} {"train_loss": -10.393695831298828, "global_step": 120349, "epoch": 716} {"train_loss": -10.107033729553223, "global_step": 120350, "epoch": 716} {"train_loss": -10.265735626220703, "global_step": 120351, "epoch": 716} {"train_loss": -10.245699882507324, "global_step": 120352, "epoch": 716} {"train_loss": -10.34857177734375, "global_step": 120353, "epoch": 716} {"train_loss": -10.419994354248047, "global_step": 120354, "epoch": 716} {"train_loss": -10.278481483459473, "global_step": 120355, "epoch": 716} {"train_loss": -10.24488639831543, "global_step": 120356, "epoch": 716} {"train_loss": -10.443486213684082, "global_step": 120357, "epoch": 716} {"train_loss": -10.368715286254883, "global_step": 120358, "epoch": 716} {"train_loss": -10.54806900024414, "global_step": 120359, "epoch": 716} {"train_loss": -10.290899276733398, "global_step": 120360, "epoch": 716} {"train_loss": -10.42818832397461, "global_step": 120361, "epoch": 716} {"train_loss": -10.363862037658691, "global_step": 120362, "epoch": 716} {"train_loss": -10.327588081359863, "global_step": 120363, "epoch": 716} {"train_loss": -10.275350570678711, "global_step": 120364, "epoch": 716} {"train_loss": -10.394625663757324, "global_step": 120365, "epoch": 716} {"train_loss": -9.934645652770996, "global_step": 120366, "epoch": 716} {"train_loss": -10.05667495727539, "global_step": 120367, "epoch": 716} {"train_loss": -9.852527618408203, "global_step": 120368, "epoch": 716} {"train_loss": -10.162349700927734, "global_step": 120369, "epoch": 716} {"train_loss": -10.02193832397461, "global_step": 120370, "epoch": 716} {"train_loss": -10.31058120727539, "global_step": 120371, "epoch": 716} {"train_loss": -9.795280456542969, "global_step": 120372, "epoch": 716} {"train_loss": -9.42812728881836, "global_step": 120373, "epoch": 716} {"train_loss": -10.351019859313965, "global_step": 120374, "epoch": 716} {"train_loss": -9.669540405273438, "global_step": 120375, "epoch": 716} {"train_loss": -9.901912689208984, "global_step": 120376, "epoch": 716} {"train_loss": -9.627918243408203, "global_step": 120377, "epoch": 716} {"train_loss": -9.789998054504395, "global_step": 120378, "epoch": 716} {"train_loss": -9.518869400024414, "global_step": 120379, "epoch": 716} {"train_loss": -9.555490493774414, "global_step": 120380, "epoch": 716} {"train_loss": -9.792160987854004, "global_step": 120381, "epoch": 716} {"train_loss": -9.500556945800781, "global_step": 120382, "epoch": 716} {"train_loss": -9.506972312927246, "global_step": 120383, "epoch": 716} {"train_loss": -9.885348320007324, "global_step": 120384, "epoch": 716} {"train_loss": -9.787782669067383, "global_step": 120385, "epoch": 716} {"train_loss": -10.1753511428833, "global_step": 120386, "epoch": 716} {"train_loss": -9.854844093322754, "global_step": 120387, "epoch": 716} {"train_loss": -9.777231216430664, "global_step": 120388, "epoch": 716} {"train_loss": -9.736151695251465, "global_step": 120389, "epoch": 716} {"train_loss": -9.681482315063477, "global_step": 120390, "epoch": 716} {"train_loss": -9.726951599121094, "global_step": 120391, "epoch": 716} {"train_loss": -9.738410949707031, "global_step": 120392, "epoch": 716} {"train_loss": -9.92504596710205, "global_step": 120393, "epoch": 716} {"train_loss": -9.845270156860352, "global_step": 120394, "epoch": 716} {"train_loss": -9.998591423034668, "global_step": 120395, "epoch": 716} {"train_loss": -10.060166358947754, "global_step": 120396, "epoch": 716} {"train_loss": -9.881980895996094, "global_step": 120397, "epoch": 716} {"train_loss": -9.723365783691406, "global_step": 120398, "epoch": 716} {"train_loss": -9.962833404541016, "global_step": 120399, "epoch": 716} {"train_loss": -10.156290054321289, "global_step": 120400, "epoch": 716} {"train_loss": -10.215224266052246, "global_step": 120401, "epoch": 716} {"train_loss": -9.654138565063477, "global_step": 120402, "epoch": 716} {"train_loss": -9.95483684539795, "global_step": 120403, "epoch": 716} {"train_loss": -9.984868049621582, "global_step": 120404, "epoch": 716} {"train_loss": -9.780126571655273, "global_step": 120405, "epoch": 716} {"train_loss": -9.6632080078125, "global_step": 120406, "epoch": 716} {"train_loss": -10.020002365112305, "global_step": 120407, "epoch": 716} {"train_loss": -9.913634300231934, "global_step": 120408, "epoch": 716} {"train_loss": -10.009933471679688, "global_step": 120409, "epoch": 716} {"train_loss": -10.191136360168457, "global_step": 120410, "epoch": 716} {"train_loss": -10.026793479919434, "global_step": 120411, "epoch": 716} {"train_loss": -9.838479042053223, "global_step": 120412, "epoch": 716} {"train_loss": -10.113887786865234, "global_step": 120413, "epoch": 716} {"train_loss": -9.87700366973877, "global_step": 120414, "epoch": 716} {"train_loss": -9.796350479125977, "global_step": 120415, "epoch": 716} {"train_loss": -10.13953971862793, "global_step": 120416, "epoch": 716} {"train_loss": -10.042339324951172, "global_step": 120417, "epoch": 716} {"train_loss": -10.148300170898438, "global_step": 120418, "epoch": 716} {"train_loss": -10.188822746276855, "global_step": 120419, "epoch": 716} {"train_loss": -9.826606750488281, "global_step": 120420, "epoch": 716} {"train_loss": -10.184364318847656, "global_step": 120421, "epoch": 716} {"train_loss": -10.333162307739258, "global_step": 120422, "epoch": 716} {"train_loss": -10.113668441772461, "global_step": 120423, "epoch": 716} {"train_loss": -10.185111999511719, "global_step": 120424, "epoch": 716} {"train_loss": -10.175813674926758, "global_step": 120425, "epoch": 716} {"train_loss": -10.25190258026123, "global_step": 120426, "epoch": 716} {"train_loss": -10.061717987060547, "global_step": 120427, "epoch": 716} {"train_loss": -10.238725662231445, "global_step": 120428, "epoch": 716} {"train_loss": -9.760595321655273, "global_step": 120429, "epoch": 716} {"train_loss": -10.34433364868164, "global_step": 120430, "epoch": 716} {"train_loss": -9.908025741577148, "global_step": 120431, "epoch": 716} {"train_loss": -9.634584426879883, "global_step": 120432, "epoch": 716} {"train_loss": -10.322298049926758, "global_step": 120433, "epoch": 716} {"train_loss": -10.01626968383789, "global_step": 120434, "epoch": 716} {"train_loss": -10.205926895141602, "global_step": 120435, "epoch": 716} {"train_loss": -10.355123519897461, "global_step": 120436, "epoch": 716} {"train_loss": -10.07640552520752, "global_step": 120437, "epoch": 716} {"train_loss": -10.419991493225098, "global_step": 120438, "epoch": 716} {"train_loss": -10.309059143066406, "global_step": 120439, "epoch": 716} {"train_loss": -10.479543685913086, "global_step": 120440, "epoch": 716} {"train_loss": -9.870643615722656, "global_step": 120441, "epoch": 716} {"train_loss": -10.480046272277832, "global_step": 120442, "epoch": 716} {"train_loss": -10.064194679260254, "global_step": 120443, "epoch": 716} {"train_loss": -10.203193664550781, "global_step": 120444, "epoch": 716} {"train_loss": -10.049450874328613, "global_step": 120445, "epoch": 716} {"train_loss": -10.004201889038086, "global_step": 120446, "epoch": 716} {"train_loss": -10.20503044128418, "global_step": 120447, "epoch": 716} {"train_loss": -10.201589584350586, "global_step": 120448, "epoch": 716} {"train_loss": -10.145501136779785, "global_step": 120449, "epoch": 716} {"train_loss": -9.930237770080566, "global_step": 120450, "epoch": 716} {"train_loss": -10.339696884155273, "global_step": 120451, "epoch": 716} {"train_loss": -9.92091178894043, "global_step": 120452, "epoch": 716} {"train_loss": -9.889708518981934, "global_step": 120453, "epoch": 716} {"train_loss": -10.324188232421875, "global_step": 120454, "epoch": 716} {"train_loss": -10.03900366737729, "global_step": 120455, "epoch": 716, "val_loss": 216284.234375} {"train_loss": -10.119361877441406, "global_step": 120456, "epoch": 717} {"train_loss": -10.279441833496094, "global_step": 120457, "epoch": 717} {"train_loss": -10.319472312927246, "global_step": 120458, "epoch": 717} {"train_loss": -10.086849212646484, "global_step": 120459, "epoch": 717} {"train_loss": -10.314159393310547, "global_step": 120460, "epoch": 717} {"train_loss": -10.058772087097168, "global_step": 120461, "epoch": 717} {"train_loss": -10.336797714233398, "global_step": 120462, "epoch": 717} {"train_loss": -10.015003204345703, "global_step": 120463, "epoch": 717} {"train_loss": -10.214530944824219, "global_step": 120464, "epoch": 717} {"train_loss": -10.213752746582031, "global_step": 120465, "epoch": 717} {"train_loss": -9.98006820678711, "global_step": 120466, "epoch": 717} {"train_loss": -9.939449310302734, "global_step": 120467, "epoch": 717} {"train_loss": -10.107351303100586, "global_step": 120468, "epoch": 717} {"train_loss": -10.176334381103516, "global_step": 120469, "epoch": 717} {"train_loss": -10.125091552734375, "global_step": 120470, "epoch": 717} {"train_loss": -10.303476333618164, "global_step": 120471, "epoch": 717} {"train_loss": -9.917383193969727, "global_step": 120472, "epoch": 717} {"train_loss": -10.225654602050781, "global_step": 120473, "epoch": 717} {"train_loss": -10.037090301513672, "global_step": 120474, "epoch": 717} {"train_loss": -10.303050994873047, "global_step": 120475, "epoch": 717} {"train_loss": -10.084220886230469, "global_step": 120476, "epoch": 717} {"train_loss": -10.083155632019043, "global_step": 120477, "epoch": 717} {"train_loss": -10.340827941894531, "global_step": 120478, "epoch": 717} {"train_loss": -9.964386940002441, "global_step": 120479, "epoch": 717} {"train_loss": -10.411552429199219, "global_step": 120480, "epoch": 717} {"train_loss": -10.023361206054688, "global_step": 120481, "epoch": 717} {"train_loss": -10.219264030456543, "global_step": 120482, "epoch": 717} {"train_loss": -10.42827033996582, "global_step": 120483, "epoch": 717} {"train_loss": -10.162240982055664, "global_step": 120484, "epoch": 717} {"train_loss": -10.195785522460938, "global_step": 120485, "epoch": 717} {"train_loss": -10.19444751739502, "global_step": 120486, "epoch": 717} {"train_loss": -10.416244506835938, "global_step": 120487, "epoch": 717} {"train_loss": -10.340723037719727, "global_step": 120488, "epoch": 717} {"train_loss": -10.417085647583008, "global_step": 120489, "epoch": 717} {"train_loss": -10.267077445983887, "global_step": 120490, "epoch": 717} {"train_loss": -10.395700454711914, "global_step": 120491, "epoch": 717} {"train_loss": -10.081093788146973, "global_step": 120492, "epoch": 717} {"train_loss": -10.136253356933594, "global_step": 120493, "epoch": 717} {"train_loss": -9.76943588256836, "global_step": 120494, "epoch": 717} {"train_loss": -9.922330856323242, "global_step": 120495, "epoch": 717} {"train_loss": -10.146417617797852, "global_step": 120496, "epoch": 717} {"train_loss": -9.934412002563477, "global_step": 120497, "epoch": 717} {"train_loss": -10.204458236694336, "global_step": 120498, "epoch": 717} {"train_loss": -10.058438301086426, "global_step": 120499, "epoch": 717} {"train_loss": -10.292617797851562, "global_step": 120500, "epoch": 717} {"train_loss": -10.0860013961792, "global_step": 120501, "epoch": 717} {"train_loss": -10.416690826416016, "global_step": 120502, "epoch": 717} {"train_loss": -10.336616516113281, "global_step": 120503, "epoch": 717} {"train_loss": -10.208247184753418, "global_step": 120504, "epoch": 717} {"train_loss": -10.353023529052734, "global_step": 120505, "epoch": 717} {"train_loss": -9.634251594543457, "global_step": 120506, "epoch": 717} {"train_loss": -10.24828815460205, "global_step": 120507, "epoch": 717} {"train_loss": -9.48680591583252, "global_step": 120508, "epoch": 717} {"train_loss": -9.288581848144531, "global_step": 120509, "epoch": 717} {"train_loss": -10.194726943969727, "global_step": 120510, "epoch": 717} {"train_loss": -9.501136779785156, "global_step": 120511, "epoch": 717} {"train_loss": -9.683881759643555, "global_step": 120512, "epoch": 717} {"train_loss": -10.009777069091797, "global_step": 120513, "epoch": 717} {"train_loss": -9.36452865600586, "global_step": 120514, "epoch": 717} {"train_loss": -9.825178146362305, "global_step": 120515, "epoch": 717} {"train_loss": -9.720726013183594, "global_step": 120516, "epoch": 717} {"train_loss": -10.094061851501465, "global_step": 120517, "epoch": 717} {"train_loss": -9.822677612304688, "global_step": 120518, "epoch": 717} {"train_loss": -9.790157318115234, "global_step": 120519, "epoch": 717} {"train_loss": -10.047831535339355, "global_step": 120520, "epoch": 717} {"train_loss": -10.027203559875488, "global_step": 120521, "epoch": 717} {"train_loss": -10.045021057128906, "global_step": 120522, "epoch": 717} {"train_loss": -9.820636749267578, "global_step": 120523, "epoch": 717} {"train_loss": -10.10941219329834, "global_step": 120524, "epoch": 717} {"train_loss": -9.602937698364258, "global_step": 120525, "epoch": 717} {"train_loss": -10.07619857788086, "global_step": 120526, "epoch": 717} {"train_loss": -9.950101852416992, "global_step": 120527, "epoch": 717} {"train_loss": -9.825702667236328, "global_step": 120528, "epoch": 717} {"train_loss": -9.765022277832031, "global_step": 120529, "epoch": 717} {"train_loss": -9.830891609191895, "global_step": 120530, "epoch": 717} {"train_loss": -9.895975112915039, "global_step": 120531, "epoch": 717} {"train_loss": -9.793938636779785, "global_step": 120532, "epoch": 717} {"train_loss": -10.164894104003906, "global_step": 120533, "epoch": 717} {"train_loss": -9.99194622039795, "global_step": 120534, "epoch": 717} {"train_loss": -9.975421905517578, "global_step": 120535, "epoch": 717} {"train_loss": -10.082122802734375, "global_step": 120536, "epoch": 717} {"train_loss": -9.877340316772461, "global_step": 120537, "epoch": 717} {"train_loss": -10.139181137084961, "global_step": 120538, "epoch": 717} {"train_loss": -10.243054389953613, "global_step": 120539, "epoch": 717} {"train_loss": -10.188387870788574, "global_step": 120540, "epoch": 717} {"train_loss": -10.12222671508789, "global_step": 120541, "epoch": 717} {"train_loss": -10.197389602661133, "global_step": 120542, "epoch": 717} {"train_loss": -10.175567626953125, "global_step": 120543, "epoch": 717} {"train_loss": -10.189530372619629, "global_step": 120544, "epoch": 717} {"train_loss": -10.315784454345703, "global_step": 120545, "epoch": 717} {"train_loss": -10.18543815612793, "global_step": 120546, "epoch": 717} {"train_loss": -10.24079704284668, "global_step": 120547, "epoch": 717} {"train_loss": -10.17263412475586, "global_step": 120548, "epoch": 717} {"train_loss": -10.371302604675293, "global_step": 120549, "epoch": 717} {"train_loss": -10.151651382446289, "global_step": 120550, "epoch": 717} {"train_loss": -10.478134155273438, "global_step": 120551, "epoch": 717} {"train_loss": -10.231393814086914, "global_step": 120552, "epoch": 717} {"train_loss": -10.129814147949219, "global_step": 120553, "epoch": 717} {"train_loss": -10.231637954711914, "global_step": 120554, "epoch": 717} {"train_loss": -10.129562377929688, "global_step": 120555, "epoch": 717} {"train_loss": -10.313302993774414, "global_step": 120556, "epoch": 717} {"train_loss": -10.206103324890137, "global_step": 120557, "epoch": 717} {"train_loss": -10.048057556152344, "global_step": 120558, "epoch": 717} {"train_loss": -10.297820091247559, "global_step": 120559, "epoch": 717} {"train_loss": -9.949790954589844, "global_step": 120560, "epoch": 717} {"train_loss": -10.344280242919922, "global_step": 120561, "epoch": 717} {"train_loss": -10.485559463500977, "global_step": 120562, "epoch": 717} {"train_loss": -10.441900253295898, "global_step": 120563, "epoch": 717} {"train_loss": -10.51917839050293, "global_step": 120564, "epoch": 717} {"train_loss": -10.213813781738281, "global_step": 120565, "epoch": 717} {"train_loss": -10.33169937133789, "global_step": 120566, "epoch": 717} {"train_loss": -10.236181259155273, "global_step": 120567, "epoch": 717} {"train_loss": -10.449277877807617, "global_step": 120568, "epoch": 717} {"train_loss": -10.240032196044922, "global_step": 120569, "epoch": 717} {"train_loss": -10.400959014892578, "global_step": 120570, "epoch": 717} {"train_loss": -10.325602531433105, "global_step": 120571, "epoch": 717} {"train_loss": -10.411417007446289, "global_step": 120572, "epoch": 717} {"train_loss": -10.50222396850586, "global_step": 120573, "epoch": 717} {"train_loss": -10.352836608886719, "global_step": 120574, "epoch": 717} {"train_loss": -10.445110321044922, "global_step": 120575, "epoch": 717} {"train_loss": -10.367061614990234, "global_step": 120576, "epoch": 717} {"train_loss": -10.104921340942383, "global_step": 120577, "epoch": 717} {"train_loss": -10.215248107910156, "global_step": 120578, "epoch": 717} {"train_loss": -9.857012748718262, "global_step": 120579, "epoch": 717} {"train_loss": -10.203474998474121, "global_step": 120580, "epoch": 717} {"train_loss": -10.351336479187012, "global_step": 120581, "epoch": 717} {"train_loss": -10.503765106201172, "global_step": 120582, "epoch": 717} {"train_loss": -10.50766658782959, "global_step": 120583, "epoch": 717} {"train_loss": -10.247480392456055, "global_step": 120584, "epoch": 717} {"train_loss": -10.49204158782959, "global_step": 120585, "epoch": 717} {"train_loss": -9.926408767700195, "global_step": 120586, "epoch": 717} {"train_loss": -10.244501113891602, "global_step": 120587, "epoch": 717} {"train_loss": -10.315577507019043, "global_step": 120588, "epoch": 717} {"train_loss": -10.02954387664795, "global_step": 120589, "epoch": 717} {"train_loss": -10.158304214477539, "global_step": 120590, "epoch": 717} {"train_loss": -10.225406646728516, "global_step": 120591, "epoch": 717} {"train_loss": -9.987438201904297, "global_step": 120592, "epoch": 717} {"train_loss": -10.464762687683105, "global_step": 120593, "epoch": 717} {"train_loss": -9.983287811279297, "global_step": 120594, "epoch": 717} {"train_loss": -10.332870483398438, "global_step": 120595, "epoch": 717} {"train_loss": -10.088445663452148, "global_step": 120596, "epoch": 717} {"train_loss": -10.332429885864258, "global_step": 120597, "epoch": 717} {"train_loss": -10.176168441772461, "global_step": 120598, "epoch": 717} {"train_loss": -9.990615844726562, "global_step": 120599, "epoch": 717} {"train_loss": -10.406259536743164, "global_step": 120600, "epoch": 717} {"train_loss": -10.249378204345703, "global_step": 120601, "epoch": 717} {"train_loss": -10.407660484313965, "global_step": 120602, "epoch": 717} {"train_loss": -10.185545921325684, "global_step": 120603, "epoch": 717} {"train_loss": -10.044790267944336, "global_step": 120604, "epoch": 717} {"train_loss": -10.355168342590332, "global_step": 120605, "epoch": 717} {"train_loss": -9.865028381347656, "global_step": 120606, "epoch": 717} {"train_loss": -10.446792602539062, "global_step": 120607, "epoch": 717} {"train_loss": -10.461233139038086, "global_step": 120608, "epoch": 717} {"train_loss": -9.604507446289062, "global_step": 120609, "epoch": 717} {"train_loss": -10.283300399780273, "global_step": 120610, "epoch": 717} {"train_loss": -9.526143074035645, "global_step": 120611, "epoch": 717} {"train_loss": -10.112906455993652, "global_step": 120612, "epoch": 717} {"train_loss": -10.031766891479492, "global_step": 120613, "epoch": 717} {"train_loss": -9.617995262145996, "global_step": 120614, "epoch": 717} {"train_loss": -10.376346588134766, "global_step": 120615, "epoch": 717} {"train_loss": -9.952445030212402, "global_step": 120616, "epoch": 717} {"train_loss": -10.019035339355469, "global_step": 120617, "epoch": 717} {"train_loss": -10.167407035827637, "global_step": 120618, "epoch": 717} {"train_loss": -9.898035049438477, "global_step": 120619, "epoch": 717} {"train_loss": -10.138911247253418, "global_step": 120620, "epoch": 717} {"train_loss": -10.050545692443848, "global_step": 120621, "epoch": 717} {"train_loss": -10.156942367553711, "global_step": 120622, "epoch": 717} {"train_loss": -10.133038288071042, "global_step": 120623, "epoch": 717, "val_loss": 211589.296875} {"train_loss": -10.067642211914062, "global_step": 120624, "epoch": 718} {"train_loss": -9.966424942016602, "global_step": 120625, "epoch": 718} {"train_loss": -10.094902992248535, "global_step": 120626, "epoch": 718} {"train_loss": -9.846580505371094, "global_step": 120627, "epoch": 718} {"train_loss": -10.244089126586914, "global_step": 120628, "epoch": 718} {"train_loss": -10.163484573364258, "global_step": 120629, "epoch": 718} {"train_loss": -10.068416595458984, "global_step": 120630, "epoch": 718} {"train_loss": -9.837831497192383, "global_step": 120631, "epoch": 718} {"train_loss": -9.82634162902832, "global_step": 120632, "epoch": 718} {"train_loss": -10.224842071533203, "global_step": 120633, "epoch": 718} {"train_loss": -10.090691566467285, "global_step": 120634, "epoch": 718} {"train_loss": -10.1213960647583, "global_step": 120635, "epoch": 718} {"train_loss": -10.085878372192383, "global_step": 120636, "epoch": 718} {"train_loss": -10.146431922912598, "global_step": 120637, "epoch": 718} {"train_loss": -10.198179244995117, "global_step": 120638, "epoch": 718} {"train_loss": -10.221233367919922, "global_step": 120639, "epoch": 718} {"train_loss": -10.346510887145996, "global_step": 120640, "epoch": 718} {"train_loss": -9.872625350952148, "global_step": 120641, "epoch": 718} {"train_loss": -10.216718673706055, "global_step": 120642, "epoch": 718} {"train_loss": -10.289496421813965, "global_step": 120643, "epoch": 718} {"train_loss": -10.198877334594727, "global_step": 120644, "epoch": 718} {"train_loss": -10.365521430969238, "global_step": 120645, "epoch": 718} {"train_loss": -10.182841300964355, "global_step": 120646, "epoch": 718} {"train_loss": -10.338294982910156, "global_step": 120647, "epoch": 718} {"train_loss": -10.059954643249512, "global_step": 120648, "epoch": 718} {"train_loss": -10.35083293914795, "global_step": 120649, "epoch": 718} {"train_loss": -10.179595947265625, "global_step": 120650, "epoch": 718} {"train_loss": -10.452598571777344, "global_step": 120651, "epoch": 718} {"train_loss": -10.159486770629883, "global_step": 120652, "epoch": 718} {"train_loss": -10.459844589233398, "global_step": 120653, "epoch": 718} {"train_loss": -10.498860359191895, "global_step": 120654, "epoch": 718} {"train_loss": -10.38360595703125, "global_step": 120655, "epoch": 718} {"train_loss": -10.323089599609375, "global_step": 120656, "epoch": 718} {"train_loss": -10.462163925170898, "global_step": 120657, "epoch": 718} {"train_loss": -10.284547805786133, "global_step": 120658, "epoch": 718} {"train_loss": -10.19753646850586, "global_step": 120659, "epoch": 718} {"train_loss": -10.581626892089844, "global_step": 120660, "epoch": 718} {"train_loss": -10.212100982666016, "global_step": 120661, "epoch": 718} {"train_loss": -10.372200012207031, "global_step": 120662, "epoch": 718} {"train_loss": -10.302337646484375, "global_step": 120663, "epoch": 718} {"train_loss": -10.172159194946289, "global_step": 120664, "epoch": 718} {"train_loss": -10.179311752319336, "global_step": 120665, "epoch": 718} {"train_loss": -10.299654006958008, "global_step": 120666, "epoch": 718} {"train_loss": -10.29472541809082, "global_step": 120667, "epoch": 718} {"train_loss": -10.27239990234375, "global_step": 120668, "epoch": 718} {"train_loss": -9.994401931762695, "global_step": 120669, "epoch": 718} {"train_loss": -10.047809600830078, "global_step": 120670, "epoch": 718} {"train_loss": -9.691705703735352, "global_step": 120671, "epoch": 718} {"train_loss": -10.097270965576172, "global_step": 120672, "epoch": 718} {"train_loss": -9.549884796142578, "global_step": 120673, "epoch": 718} {"train_loss": -9.806683540344238, "global_step": 120674, "epoch": 718} {"train_loss": -9.932621002197266, "global_step": 120675, "epoch": 718} {"train_loss": -9.477816581726074, "global_step": 120676, "epoch": 718} {"train_loss": -10.115060806274414, "global_step": 120677, "epoch": 718} {"train_loss": -9.625490188598633, "global_step": 120678, "epoch": 718} {"train_loss": -9.970293998718262, "global_step": 120679, "epoch": 718} {"train_loss": -10.144704818725586, "global_step": 120680, "epoch": 718} {"train_loss": -10.063285827636719, "global_step": 120681, "epoch": 718} {"train_loss": -10.213508605957031, "global_step": 120682, "epoch": 718} {"train_loss": -9.7526273727417, "global_step": 120683, "epoch": 718} {"train_loss": -9.948101043701172, "global_step": 120684, "epoch": 718} {"train_loss": -9.826045989990234, "global_step": 120685, "epoch": 718} {"train_loss": -9.990734100341797, "global_step": 120686, "epoch": 718} {"train_loss": -9.901707649230957, "global_step": 120687, "epoch": 718} {"train_loss": -10.25772762298584, "global_step": 120688, "epoch": 718} {"train_loss": -10.005607604980469, "global_step": 120689, "epoch": 718} {"train_loss": -10.054997444152832, "global_step": 120690, "epoch": 718} {"train_loss": -10.224090576171875, "global_step": 120691, "epoch": 718} {"train_loss": -9.968399047851562, "global_step": 120692, "epoch": 718} {"train_loss": -10.297006607055664, "global_step": 120693, "epoch": 718} {"train_loss": -10.137990951538086, "global_step": 120694, "epoch": 718} {"train_loss": -9.950702667236328, "global_step": 120695, "epoch": 718} {"train_loss": -10.30511474609375, "global_step": 120696, "epoch": 718} {"train_loss": -10.163371086120605, "global_step": 120697, "epoch": 718} {"train_loss": -10.278103828430176, "global_step": 120698, "epoch": 718} {"train_loss": -10.325191497802734, "global_step": 120699, "epoch": 718} {"train_loss": -10.005085945129395, "global_step": 120700, "epoch": 718} {"train_loss": -10.392282485961914, "global_step": 120701, "epoch": 718} {"train_loss": -10.44716739654541, "global_step": 120702, "epoch": 718} {"train_loss": -9.879796028137207, "global_step": 120703, "epoch": 718} {"train_loss": -10.102416038513184, "global_step": 120704, "epoch": 718} {"train_loss": -10.440020561218262, "global_step": 120705, "epoch": 718} {"train_loss": -10.366415023803711, "global_step": 120706, "epoch": 718} {"train_loss": -10.326088905334473, "global_step": 120707, "epoch": 718} {"train_loss": -10.42096996307373, "global_step": 120708, "epoch": 718} {"train_loss": -10.247919082641602, "global_step": 120709, "epoch": 718} {"train_loss": -10.108150482177734, "global_step": 120710, "epoch": 718} {"train_loss": -10.314455032348633, "global_step": 120711, "epoch": 718} {"train_loss": -10.089151382446289, "global_step": 120712, "epoch": 718} {"train_loss": -10.181439399719238, "global_step": 120713, "epoch": 718} {"train_loss": -10.491740226745605, "global_step": 120714, "epoch": 718} {"train_loss": -9.887060165405273, "global_step": 120715, "epoch": 718} {"train_loss": -10.092673301696777, "global_step": 120716, "epoch": 718} {"train_loss": -10.10837459564209, "global_step": 120717, "epoch": 718} {"train_loss": -10.112298965454102, "global_step": 120718, "epoch": 718} {"train_loss": -10.066036224365234, "global_step": 120719, "epoch": 718} {"train_loss": -9.744820594787598, "global_step": 120720, "epoch": 718} {"train_loss": -10.56185531616211, "global_step": 120721, "epoch": 718} {"train_loss": -9.551363945007324, "global_step": 120722, "epoch": 718} {"train_loss": -10.406612396240234, "global_step": 120723, "epoch": 718} {"train_loss": -9.742518424987793, "global_step": 120724, "epoch": 718} {"train_loss": -9.97870922088623, "global_step": 120725, "epoch": 718} {"train_loss": -9.754019737243652, "global_step": 120726, "epoch": 718} {"train_loss": -10.099054336547852, "global_step": 120727, "epoch": 718} {"train_loss": -9.64328670501709, "global_step": 120728, "epoch": 718} {"train_loss": -10.037456512451172, "global_step": 120729, "epoch": 718} {"train_loss": -9.668338775634766, "global_step": 120730, "epoch": 718} {"train_loss": -10.033435821533203, "global_step": 120731, "epoch": 718} {"train_loss": -9.474169731140137, "global_step": 120732, "epoch": 718} {"train_loss": -9.651031494140625, "global_step": 120733, "epoch": 718} {"train_loss": -9.622947692871094, "global_step": 120734, "epoch": 718} {"train_loss": -10.114374160766602, "global_step": 120735, "epoch": 718} {"train_loss": -9.451663970947266, "global_step": 120736, "epoch": 718} {"train_loss": -9.990667343139648, "global_step": 120737, "epoch": 718} {"train_loss": -9.834022521972656, "global_step": 120738, "epoch": 718} {"train_loss": -9.83462905883789, "global_step": 120739, "epoch": 718} {"train_loss": -9.929374694824219, "global_step": 120740, "epoch": 718} {"train_loss": -9.939539909362793, "global_step": 120741, "epoch": 718} {"train_loss": -9.667964935302734, "global_step": 120742, "epoch": 718} {"train_loss": -10.087699890136719, "global_step": 120743, "epoch": 718} {"train_loss": -9.78131103515625, "global_step": 120744, "epoch": 718} {"train_loss": -10.123345375061035, "global_step": 120745, "epoch": 718} {"train_loss": -9.7745943069458, "global_step": 120746, "epoch": 718} {"train_loss": -10.069110870361328, "global_step": 120747, "epoch": 718} {"train_loss": -9.867728233337402, "global_step": 120748, "epoch": 718} {"train_loss": -10.414649963378906, "global_step": 120749, "epoch": 718} {"train_loss": -9.989774703979492, "global_step": 120750, "epoch": 718} {"train_loss": -10.206974029541016, "global_step": 120751, "epoch": 718} {"train_loss": -10.275239944458008, "global_step": 120752, "epoch": 718} {"train_loss": -10.218206405639648, "global_step": 120753, "epoch": 718} {"train_loss": -10.387715339660645, "global_step": 120754, "epoch": 718} {"train_loss": -10.290290832519531, "global_step": 120755, "epoch": 718} {"train_loss": -10.080329895019531, "global_step": 120756, "epoch": 718} {"train_loss": -10.208639144897461, "global_step": 120757, "epoch": 718} {"train_loss": -10.32546615600586, "global_step": 120758, "epoch": 718} {"train_loss": -10.1070556640625, "global_step": 120759, "epoch": 718} {"train_loss": -10.28903865814209, "global_step": 120760, "epoch": 718} {"train_loss": -10.280851364135742, "global_step": 120761, "epoch": 718} {"train_loss": -10.206905364990234, "global_step": 120762, "epoch": 718} {"train_loss": -10.463430404663086, "global_step": 120763, "epoch": 718} {"train_loss": -10.355846405029297, "global_step": 120764, "epoch": 718} {"train_loss": -10.475095748901367, "global_step": 120765, "epoch": 718} {"train_loss": -10.454721450805664, "global_step": 120766, "epoch": 718} {"train_loss": -10.504728317260742, "global_step": 120767, "epoch": 718} {"train_loss": -10.21855640411377, "global_step": 120768, "epoch": 718} {"train_loss": -10.092830657958984, "global_step": 120769, "epoch": 718} {"train_loss": -10.562508583068848, "global_step": 120770, "epoch": 718} {"train_loss": -10.394062042236328, "global_step": 120771, "epoch": 718} {"train_loss": -10.557905197143555, "global_step": 120772, "epoch": 718} {"train_loss": -10.366802215576172, "global_step": 120773, "epoch": 718} {"train_loss": -10.362215995788574, "global_step": 120774, "epoch": 718} {"train_loss": -10.314611434936523, "global_step": 120775, "epoch": 718} {"train_loss": -10.2234525680542, "global_step": 120776, "epoch": 718} {"train_loss": -10.310946464538574, "global_step": 120777, "epoch": 718} {"train_loss": -10.459798812866211, "global_step": 120778, "epoch": 718} {"train_loss": -10.392119407653809, "global_step": 120779, "epoch": 718} {"train_loss": -10.585600852966309, "global_step": 120780, "epoch": 718} {"train_loss": -10.368547439575195, "global_step": 120781, "epoch": 718} {"train_loss": -10.125471115112305, "global_step": 120782, "epoch": 718} {"train_loss": -10.524820327758789, "global_step": 120783, "epoch": 718} {"train_loss": -10.363460540771484, "global_step": 120784, "epoch": 718} {"train_loss": -10.207954406738281, "global_step": 120785, "epoch": 718} {"train_loss": -10.315502166748047, "global_step": 120786, "epoch": 718} {"train_loss": -10.263506889343262, "global_step": 120787, "epoch": 718} {"train_loss": -10.198573112487793, "global_step": 120788, "epoch": 718} {"train_loss": -10.463167190551758, "global_step": 120789, "epoch": 718} {"train_loss": -9.621246337890625, "global_step": 120790, "epoch": 718} {"train_loss": -10.139184134347099, "global_step": 120791, "epoch": 718, "val_loss": 216938.921875} {"train_loss": -9.930293083190918, "global_step": 120792, "epoch": 719} {"train_loss": -10.11846923828125, "global_step": 120793, "epoch": 719} {"train_loss": -10.10761833190918, "global_step": 120794, "epoch": 719} {"train_loss": -9.778238296508789, "global_step": 120795, "epoch": 719} {"train_loss": -10.113495826721191, "global_step": 120796, "epoch": 719} {"train_loss": -10.066156387329102, "global_step": 120797, "epoch": 719} {"train_loss": -9.68536376953125, "global_step": 120798, "epoch": 719} {"train_loss": -10.13783073425293, "global_step": 120799, "epoch": 719} {"train_loss": -9.960145950317383, "global_step": 120800, "epoch": 719} {"train_loss": -10.326761245727539, "global_step": 120801, "epoch": 719} {"train_loss": -10.176751136779785, "global_step": 120802, "epoch": 719} {"train_loss": -10.102644920349121, "global_step": 120803, "epoch": 719} {"train_loss": -10.06568717956543, "global_step": 120804, "epoch": 719} {"train_loss": -10.313680648803711, "global_step": 120805, "epoch": 719} {"train_loss": -10.225790023803711, "global_step": 120806, "epoch": 719} {"train_loss": -10.394070625305176, "global_step": 120807, "epoch": 719} {"train_loss": -10.227964401245117, "global_step": 120808, "epoch": 719} {"train_loss": -10.198585510253906, "global_step": 120809, "epoch": 719} {"train_loss": -10.351659774780273, "global_step": 120810, "epoch": 719} {"train_loss": -10.013328552246094, "global_step": 120811, "epoch": 719} {"train_loss": -10.09357738494873, "global_step": 120812, "epoch": 719} {"train_loss": -9.962587356567383, "global_step": 120813, "epoch": 719} {"train_loss": -9.638528823852539, "global_step": 120814, "epoch": 719} {"train_loss": -9.868820190429688, "global_step": 120815, "epoch": 719} {"train_loss": -9.887626647949219, "global_step": 120816, "epoch": 719} {"train_loss": -9.95226764678955, "global_step": 120817, "epoch": 719} {"train_loss": -9.77536392211914, "global_step": 120818, "epoch": 719} {"train_loss": -9.952335357666016, "global_step": 120819, "epoch": 719} {"train_loss": -10.312065124511719, "global_step": 120820, "epoch": 719} {"train_loss": -9.663773536682129, "global_step": 120821, "epoch": 719} {"train_loss": -10.09581184387207, "global_step": 120822, "epoch": 719} {"train_loss": -10.097980499267578, "global_step": 120823, "epoch": 719} {"train_loss": -9.8449125289917, "global_step": 120824, "epoch": 719} {"train_loss": -10.218128204345703, "global_step": 120825, "epoch": 719} {"train_loss": -9.903891563415527, "global_step": 120826, "epoch": 719} {"train_loss": -10.032218933105469, "global_step": 120827, "epoch": 719} {"train_loss": -10.184870719909668, "global_step": 120828, "epoch": 719} {"train_loss": -9.89150619506836, "global_step": 120829, "epoch": 719} {"train_loss": -9.96607780456543, "global_step": 120830, "epoch": 719} {"train_loss": -9.96013355255127, "global_step": 120831, "epoch": 719} {"train_loss": -10.148573875427246, "global_step": 120832, "epoch": 719} {"train_loss": -9.832561492919922, "global_step": 120833, "epoch": 719} {"train_loss": -9.870612144470215, "global_step": 120834, "epoch": 719} {"train_loss": -9.944314956665039, "global_step": 120835, "epoch": 719} {"train_loss": -9.552328109741211, "global_step": 120836, "epoch": 719} {"train_loss": -9.939827919006348, "global_step": 120837, "epoch": 719} {"train_loss": -9.995254516601562, "global_step": 120838, "epoch": 719} {"train_loss": -9.538030624389648, "global_step": 120839, "epoch": 719} {"train_loss": -10.26820182800293, "global_step": 120840, "epoch": 719} {"train_loss": -10.32929515838623, "global_step": 120841, "epoch": 719} {"train_loss": -9.928332328796387, "global_step": 120842, "epoch": 719} {"train_loss": -10.123669624328613, "global_step": 120843, "epoch": 719} {"train_loss": -10.205167770385742, "global_step": 120844, "epoch": 719} {"train_loss": -10.263771057128906, "global_step": 120845, "epoch": 719} {"train_loss": -9.902769088745117, "global_step": 120846, "epoch": 719} {"train_loss": -10.103514671325684, "global_step": 120847, "epoch": 719} {"train_loss": -10.101102828979492, "global_step": 120848, "epoch": 719} {"train_loss": -10.249460220336914, "global_step": 120849, "epoch": 719} {"train_loss": -10.079331398010254, "global_step": 120850, "epoch": 719} {"train_loss": -10.471717834472656, "global_step": 120851, "epoch": 719} {"train_loss": -10.118566513061523, "global_step": 120852, "epoch": 719} {"train_loss": -10.102804183959961, "global_step": 120853, "epoch": 719} {"train_loss": -9.979780197143555, "global_step": 120854, "epoch": 719} {"train_loss": -9.829109191894531, "global_step": 120855, "epoch": 719} {"train_loss": -10.312484741210938, "global_step": 120856, "epoch": 719} {"train_loss": -9.9244966506958, "global_step": 120857, "epoch": 719} {"train_loss": -10.245019912719727, "global_step": 120858, "epoch": 719} {"train_loss": -10.402637481689453, "global_step": 120859, "epoch": 719} {"train_loss": -9.987649917602539, "global_step": 120860, "epoch": 719} {"train_loss": -10.031487464904785, "global_step": 120861, "epoch": 719} {"train_loss": -9.685603141784668, "global_step": 120862, "epoch": 719} {"train_loss": -9.974584579467773, "global_step": 120863, "epoch": 719} {"train_loss": -9.679943084716797, "global_step": 120864, "epoch": 719} {"train_loss": -10.00296401977539, "global_step": 120865, "epoch": 719} {"train_loss": -10.143415451049805, "global_step": 120866, "epoch": 719} {"train_loss": -9.722345352172852, "global_step": 120867, "epoch": 719} {"train_loss": -10.180968284606934, "global_step": 120868, "epoch": 719} {"train_loss": -9.854533195495605, "global_step": 120869, "epoch": 719} {"train_loss": -10.103006362915039, "global_step": 120870, "epoch": 719} {"train_loss": -10.165470123291016, "global_step": 120871, "epoch": 719} {"train_loss": -10.188070297241211, "global_step": 120872, "epoch": 719} {"train_loss": -10.208357810974121, "global_step": 120873, "epoch": 719} {"train_loss": -9.442773818969727, "global_step": 120874, "epoch": 719} {"train_loss": -10.253097534179688, "global_step": 120875, "epoch": 719} {"train_loss": -9.75794506072998, "global_step": 120876, "epoch": 719} {"train_loss": -10.308928489685059, "global_step": 120877, "epoch": 719} {"train_loss": -10.115936279296875, "global_step": 120878, "epoch": 719} {"train_loss": -10.02186107635498, "global_step": 120879, "epoch": 719} {"train_loss": -10.341124534606934, "global_step": 120880, "epoch": 719} {"train_loss": -10.144464492797852, "global_step": 120881, "epoch": 719} {"train_loss": -10.155303001403809, "global_step": 120882, "epoch": 719} {"train_loss": -10.219837188720703, "global_step": 120883, "epoch": 719} {"train_loss": -10.086507797241211, "global_step": 120884, "epoch": 719} {"train_loss": -10.104493141174316, "global_step": 120885, "epoch": 719} {"train_loss": -10.431805610656738, "global_step": 120886, "epoch": 719} {"train_loss": -10.20870590209961, "global_step": 120887, "epoch": 719} {"train_loss": -10.173465728759766, "global_step": 120888, "epoch": 719} {"train_loss": -10.27242660522461, "global_step": 120889, "epoch": 719} {"train_loss": -10.375709533691406, "global_step": 120890, "epoch": 719} {"train_loss": -10.237900733947754, "global_step": 120891, "epoch": 719} {"train_loss": -10.176737785339355, "global_step": 120892, "epoch": 719} {"train_loss": -10.167116165161133, "global_step": 120893, "epoch": 719} {"train_loss": -10.32965087890625, "global_step": 120894, "epoch": 719} {"train_loss": -10.452262878417969, "global_step": 120895, "epoch": 719} {"train_loss": -10.200788497924805, "global_step": 120896, "epoch": 719} {"train_loss": -10.361068725585938, "global_step": 120897, "epoch": 719} {"train_loss": -10.489060401916504, "global_step": 120898, "epoch": 719} {"train_loss": -10.287128448486328, "global_step": 120899, "epoch": 719} {"train_loss": -10.587190628051758, "global_step": 120900, "epoch": 719} {"train_loss": -10.274641036987305, "global_step": 120901, "epoch": 719} {"train_loss": -10.286445617675781, "global_step": 120902, "epoch": 719} {"train_loss": -10.346742630004883, "global_step": 120903, "epoch": 719} {"train_loss": -10.287474632263184, "global_step": 120904, "epoch": 719} {"train_loss": -10.133722305297852, "global_step": 120905, "epoch": 719} {"train_loss": -10.167551040649414, "global_step": 120906, "epoch": 719} {"train_loss": -10.394247055053711, "global_step": 120907, "epoch": 719} {"train_loss": -10.37202262878418, "global_step": 120908, "epoch": 719} {"train_loss": -10.146150588989258, "global_step": 120909, "epoch": 719} {"train_loss": -10.42269515991211, "global_step": 120910, "epoch": 719} {"train_loss": -10.356918334960938, "global_step": 120911, "epoch": 719} {"train_loss": -10.225150108337402, "global_step": 120912, "epoch": 719} {"train_loss": -10.449546813964844, "global_step": 120913, "epoch": 719} {"train_loss": -10.2792387008667, "global_step": 120914, "epoch": 719} {"train_loss": -10.399478912353516, "global_step": 120915, "epoch": 719} {"train_loss": -10.328371047973633, "global_step": 120916, "epoch": 719} {"train_loss": -10.33709716796875, "global_step": 120917, "epoch": 719} {"train_loss": -10.215993881225586, "global_step": 120918, "epoch": 719} {"train_loss": -10.295753479003906, "global_step": 120919, "epoch": 719} {"train_loss": -10.273599624633789, "global_step": 120920, "epoch": 719} {"train_loss": -9.600881576538086, "global_step": 120921, "epoch": 719} {"train_loss": -9.375926971435547, "global_step": 120922, "epoch": 719} {"train_loss": -10.039359092712402, "global_step": 120923, "epoch": 719} {"train_loss": -7.9126434326171875, "global_step": 120924, "epoch": 719} {"train_loss": -9.960504531860352, "global_step": 120925, "epoch": 719} {"train_loss": -8.270515441894531, "global_step": 120926, "epoch": 719} {"train_loss": -9.430644989013672, "global_step": 120927, "epoch": 719} {"train_loss": -9.367815017700195, "global_step": 120928, "epoch": 719} {"train_loss": -9.47031021118164, "global_step": 120929, "epoch": 719} {"train_loss": -9.329913139343262, "global_step": 120930, "epoch": 719} {"train_loss": -8.954038619995117, "global_step": 120931, "epoch": 719} {"train_loss": -9.733291625976562, "global_step": 120932, "epoch": 719} {"train_loss": -9.20368766784668, "global_step": 120933, "epoch": 719} {"train_loss": -9.749380111694336, "global_step": 120934, "epoch": 719} {"train_loss": -9.370940208435059, "global_step": 120935, "epoch": 719} {"train_loss": -9.64604377746582, "global_step": 120936, "epoch": 719} {"train_loss": -9.615604400634766, "global_step": 120937, "epoch": 719} {"train_loss": -9.923208236694336, "global_step": 120938, "epoch": 719} {"train_loss": -9.787576675415039, "global_step": 120939, "epoch": 719} {"train_loss": -9.54922103881836, "global_step": 120940, "epoch": 719} {"train_loss": -9.84416389465332, "global_step": 120941, "epoch": 719} {"train_loss": -9.666881561279297, "global_step": 120942, "epoch": 719} {"train_loss": -9.99654483795166, "global_step": 120943, "epoch": 719} {"train_loss": -9.712644577026367, "global_step": 120944, "epoch": 719} {"train_loss": -9.826298713684082, "global_step": 120945, "epoch": 719} {"train_loss": -9.725775718688965, "global_step": 120946, "epoch": 719} {"train_loss": -10.032079696655273, "global_step": 120947, "epoch": 719} {"train_loss": -9.686147689819336, "global_step": 120948, "epoch": 719} {"train_loss": -9.97045612335205, "global_step": 120949, "epoch": 719} {"train_loss": -9.693560600280762, "global_step": 120950, "epoch": 719} {"train_loss": -10.132278442382812, "global_step": 120951, "epoch": 719} {"train_loss": -9.885002136230469, "global_step": 120952, "epoch": 719} {"train_loss": -10.147424697875977, "global_step": 120953, "epoch": 719} {"train_loss": -9.980761528015137, "global_step": 120954, "epoch": 719} {"train_loss": -9.791275024414062, "global_step": 120955, "epoch": 719} {"train_loss": -10.099319458007812, "global_step": 120956, "epoch": 719} {"train_loss": -9.95417594909668, "global_step": 120957, "epoch": 719} {"train_loss": -10.112221717834473, "global_step": 120958, "epoch": 719} {"train_loss": -10.007923404375711, "global_step": 120959, "epoch": 719, "val_loss": 210965.84375} {"train_loss": -10.186148643493652, "global_step": 120960, "epoch": 720} {"train_loss": -10.365324974060059, "global_step": 120961, "epoch": 720} {"train_loss": -10.099327087402344, "global_step": 120962, "epoch": 720} {"train_loss": -10.162443161010742, "global_step": 120963, "epoch": 720} {"train_loss": -10.265237808227539, "global_step": 120964, "epoch": 720} {"train_loss": -10.097280502319336, "global_step": 120965, "epoch": 720} {"train_loss": -10.384115219116211, "global_step": 120966, "epoch": 720} {"train_loss": -10.266769409179688, "global_step": 120967, "epoch": 720} {"train_loss": -10.11030101776123, "global_step": 120968, "epoch": 720} {"train_loss": -10.260747909545898, "global_step": 120969, "epoch": 720} {"train_loss": -10.137290954589844, "global_step": 120970, "epoch": 720} {"train_loss": -10.37851619720459, "global_step": 120971, "epoch": 720} {"train_loss": -10.204679489135742, "global_step": 120972, "epoch": 720} {"train_loss": -10.420783996582031, "global_step": 120973, "epoch": 720} {"train_loss": -10.411883354187012, "global_step": 120974, "epoch": 720} {"train_loss": -10.379097938537598, "global_step": 120975, "epoch": 720} {"train_loss": -10.352113723754883, "global_step": 120976, "epoch": 720} {"train_loss": -10.461491584777832, "global_step": 120977, "epoch": 720} {"train_loss": -10.165779113769531, "global_step": 120978, "epoch": 720} {"train_loss": -10.473386764526367, "global_step": 120979, "epoch": 720} {"train_loss": -10.42959213256836, "global_step": 120980, "epoch": 720} {"train_loss": -10.296903610229492, "global_step": 120981, "epoch": 720} {"train_loss": -10.497821807861328, "global_step": 120982, "epoch": 720} {"train_loss": -10.359371185302734, "global_step": 120983, "epoch": 720} {"train_loss": -10.4718599319458, "global_step": 120984, "epoch": 720} {"train_loss": -10.526651382446289, "global_step": 120985, "epoch": 720} {"train_loss": -10.176578521728516, "global_step": 120986, "epoch": 720} {"train_loss": -10.35978889465332, "global_step": 120987, "epoch": 720} {"train_loss": -10.21837329864502, "global_step": 120988, "epoch": 720} {"train_loss": -10.210395812988281, "global_step": 120989, "epoch": 720} {"train_loss": -10.159623146057129, "global_step": 120990, "epoch": 720} {"train_loss": -10.459857940673828, "global_step": 120991, "epoch": 720} {"train_loss": -10.169222831726074, "global_step": 120992, "epoch": 720} {"train_loss": -10.075887680053711, "global_step": 120993, "epoch": 720} {"train_loss": -10.174199104309082, "global_step": 120994, "epoch": 720} {"train_loss": -10.342702865600586, "global_step": 120995, "epoch": 720} {"train_loss": -9.457235336303711, "global_step": 120996, "epoch": 720} {"train_loss": -10.113079071044922, "global_step": 120997, "epoch": 720} {"train_loss": -10.421401977539062, "global_step": 120998, "epoch": 720} {"train_loss": -10.397658348083496, "global_step": 120999, "epoch": 720} {"train_loss": -10.140462875366211, "global_step": 121000, "epoch": 720} {"train_loss": -10.387945175170898, "global_step": 121001, "epoch": 720} {"train_loss": -10.555716514587402, "global_step": 121002, "epoch": 720} {"train_loss": -9.939165115356445, "global_step": 121003, "epoch": 720} {"train_loss": -10.502614974975586, "global_step": 121004, "epoch": 720} {"train_loss": -10.044917106628418, "global_step": 121005, "epoch": 720} {"train_loss": -10.039363861083984, "global_step": 121006, "epoch": 720} {"train_loss": -10.420539855957031, "global_step": 121007, "epoch": 720} {"train_loss": -10.450138092041016, "global_step": 121008, "epoch": 720} {"train_loss": -10.223931312561035, "global_step": 121009, "epoch": 720} {"train_loss": -10.271171569824219, "global_step": 121010, "epoch": 720} {"train_loss": -10.367843627929688, "global_step": 121011, "epoch": 720} {"train_loss": -10.126297950744629, "global_step": 121012, "epoch": 720} {"train_loss": -10.347551345825195, "global_step": 121013, "epoch": 720} {"train_loss": -9.953267097473145, "global_step": 121014, "epoch": 720} {"train_loss": -10.401360511779785, "global_step": 121015, "epoch": 720} {"train_loss": -9.946072578430176, "global_step": 121016, "epoch": 720} {"train_loss": -9.958982467651367, "global_step": 121017, "epoch": 720} {"train_loss": -10.121488571166992, "global_step": 121018, "epoch": 720} {"train_loss": -9.841377258300781, "global_step": 121019, "epoch": 720} {"train_loss": -10.096843719482422, "global_step": 121020, "epoch": 720} {"train_loss": -9.634963989257812, "global_step": 121021, "epoch": 720} {"train_loss": -10.319648742675781, "global_step": 121022, "epoch": 720} {"train_loss": -9.070618629455566, "global_step": 121023, "epoch": 720} {"train_loss": -9.95077896118164, "global_step": 121024, "epoch": 720} {"train_loss": -9.42431354522705, "global_step": 121025, "epoch": 720} {"train_loss": -9.76004409790039, "global_step": 121026, "epoch": 720} {"train_loss": -9.545398712158203, "global_step": 121027, "epoch": 720} {"train_loss": -9.779536247253418, "global_step": 121028, "epoch": 720} {"train_loss": -9.355628967285156, "global_step": 121029, "epoch": 720} {"train_loss": -9.618721961975098, "global_step": 121030, "epoch": 720} {"train_loss": -9.488666534423828, "global_step": 121031, "epoch": 720} {"train_loss": -9.850132942199707, "global_step": 121032, "epoch": 720} {"train_loss": -9.888016700744629, "global_step": 121033, "epoch": 720} {"train_loss": -9.722236633300781, "global_step": 121034, "epoch": 720} {"train_loss": -9.988686561584473, "global_step": 121035, "epoch": 720} {"train_loss": -9.669061660766602, "global_step": 121036, "epoch": 720} {"train_loss": -9.877484321594238, "global_step": 121037, "epoch": 720} {"train_loss": -9.75966739654541, "global_step": 121038, "epoch": 720} {"train_loss": -10.12249755859375, "global_step": 121039, "epoch": 720} {"train_loss": -9.409197807312012, "global_step": 121040, "epoch": 720} {"train_loss": -9.975301742553711, "global_step": 121041, "epoch": 720} {"train_loss": -9.945457458496094, "global_step": 121042, "epoch": 720} {"train_loss": -9.998960494995117, "global_step": 121043, "epoch": 720} {"train_loss": -10.018301963806152, "global_step": 121044, "epoch": 720} {"train_loss": -10.168652534484863, "global_step": 121045, "epoch": 720} {"train_loss": -9.930425643920898, "global_step": 121046, "epoch": 720} {"train_loss": -10.113824844360352, "global_step": 121047, "epoch": 720} {"train_loss": -10.249981880187988, "global_step": 121048, "epoch": 720} {"train_loss": -9.999656677246094, "global_step": 121049, "epoch": 720} {"train_loss": -10.26641845703125, "global_step": 121050, "epoch": 720} {"train_loss": -10.36087417602539, "global_step": 121051, "epoch": 720} {"train_loss": -10.091293334960938, "global_step": 121052, "epoch": 720} {"train_loss": -10.105188369750977, "global_step": 121053, "epoch": 720} {"train_loss": -10.229669570922852, "global_step": 121054, "epoch": 720} {"train_loss": -10.432010650634766, "global_step": 121055, "epoch": 720} {"train_loss": -10.087944030761719, "global_step": 121056, "epoch": 720} {"train_loss": -10.131362915039062, "global_step": 121057, "epoch": 720} {"train_loss": -10.096700668334961, "global_step": 121058, "epoch": 720} {"train_loss": -10.137330055236816, "global_step": 121059, "epoch": 720} {"train_loss": -10.101375579833984, "global_step": 121060, "epoch": 720} {"train_loss": -10.593766212463379, "global_step": 121061, "epoch": 720} {"train_loss": -10.130367279052734, "global_step": 121062, "epoch": 720} {"train_loss": -10.36913776397705, "global_step": 121063, "epoch": 720} {"train_loss": -10.272523880004883, "global_step": 121064, "epoch": 720} {"train_loss": -10.317765235900879, "global_step": 121065, "epoch": 720} {"train_loss": -10.631307601928711, "global_step": 121066, "epoch": 720} {"train_loss": -10.171425819396973, "global_step": 121067, "epoch": 720} {"train_loss": -10.272417068481445, "global_step": 121068, "epoch": 720} {"train_loss": -10.125349998474121, "global_step": 121069, "epoch": 720} {"train_loss": -10.248767852783203, "global_step": 121070, "epoch": 720} {"train_loss": -9.963957786560059, "global_step": 121071, "epoch": 720} {"train_loss": -10.23031234741211, "global_step": 121072, "epoch": 720} {"train_loss": -10.134499549865723, "global_step": 121073, "epoch": 720} {"train_loss": -10.294923782348633, "global_step": 121074, "epoch": 720} {"train_loss": -10.003193855285645, "global_step": 121075, "epoch": 720} {"train_loss": -10.120550155639648, "global_step": 121076, "epoch": 720} {"train_loss": -9.597883224487305, "global_step": 121077, "epoch": 720} {"train_loss": -8.866920471191406, "global_step": 121078, "epoch": 720} {"train_loss": -9.91070556640625, "global_step": 121079, "epoch": 720} {"train_loss": -8.72932243347168, "global_step": 121080, "epoch": 720} {"train_loss": -8.945966720581055, "global_step": 121081, "epoch": 720} {"train_loss": -8.631874084472656, "global_step": 121082, "epoch": 720} {"train_loss": -9.59145736694336, "global_step": 121083, "epoch": 720} {"train_loss": -8.572944641113281, "global_step": 121084, "epoch": 720} {"train_loss": -9.592645645141602, "global_step": 121085, "epoch": 720} {"train_loss": -8.885408401489258, "global_step": 121086, "epoch": 720} {"train_loss": -9.55771255493164, "global_step": 121087, "epoch": 720} {"train_loss": -9.146596908569336, "global_step": 121088, "epoch": 720} {"train_loss": -9.31784439086914, "global_step": 121089, "epoch": 720} {"train_loss": -9.477983474731445, "global_step": 121090, "epoch": 720} {"train_loss": -9.437515258789062, "global_step": 121091, "epoch": 720} {"train_loss": -9.354413986206055, "global_step": 121092, "epoch": 720} {"train_loss": -9.533273696899414, "global_step": 121093, "epoch": 720} {"train_loss": -9.605993270874023, "global_step": 121094, "epoch": 720} {"train_loss": -9.46705150604248, "global_step": 121095, "epoch": 720} {"train_loss": -9.829073905944824, "global_step": 121096, "epoch": 720} {"train_loss": -9.49319076538086, "global_step": 121097, "epoch": 720} {"train_loss": -9.20412826538086, "global_step": 121098, "epoch": 720} {"train_loss": -9.860188484191895, "global_step": 121099, "epoch": 720} {"train_loss": -9.593827247619629, "global_step": 121100, "epoch": 720} {"train_loss": -9.142051696777344, "global_step": 121101, "epoch": 720} {"train_loss": -9.443829536437988, "global_step": 121102, "epoch": 720} {"train_loss": -9.51329231262207, "global_step": 121103, "epoch": 720} {"train_loss": -9.638256072998047, "global_step": 121104, "epoch": 720} {"train_loss": -9.195448875427246, "global_step": 121105, "epoch": 720} {"train_loss": -9.477849960327148, "global_step": 121106, "epoch": 720} {"train_loss": -9.600921630859375, "global_step": 121107, "epoch": 720} {"train_loss": -9.62795352935791, "global_step": 121108, "epoch": 720} {"train_loss": -9.549431800842285, "global_step": 121109, "epoch": 720} {"train_loss": -9.616033554077148, "global_step": 121110, "epoch": 720} {"train_loss": -9.701129913330078, "global_step": 121111, "epoch": 720} {"train_loss": -9.802013397216797, "global_step": 121112, "epoch": 720} {"train_loss": -9.636431694030762, "global_step": 121113, "epoch": 720} {"train_loss": -9.753576278686523, "global_step": 121114, "epoch": 720} {"train_loss": -9.91229248046875, "global_step": 121115, "epoch": 720} {"train_loss": -9.74981689453125, "global_step": 121116, "epoch": 720} {"train_loss": -10.016497611999512, "global_step": 121117, "epoch": 720} {"train_loss": -9.560571670532227, "global_step": 121118, "epoch": 720} {"train_loss": -9.624183654785156, "global_step": 121119, "epoch": 720} {"train_loss": -9.912256240844727, "global_step": 121120, "epoch": 720} {"train_loss": -9.515172004699707, "global_step": 121121, "epoch": 720} {"train_loss": -9.981988906860352, "global_step": 121122, "epoch": 720} {"train_loss": -9.934648513793945, "global_step": 121123, "epoch": 720} {"train_loss": -9.862640380859375, "global_step": 121124, "epoch": 720} {"train_loss": -9.921279907226562, "global_step": 121125, "epoch": 720} {"train_loss": -9.899787902832031, "global_step": 121126, "epoch": 720} {"train_loss": -9.949128951345172, "global_step": 121127, "epoch": 720, "val_loss": 211992.0, "train_action_mse_error": 1.97072434425354} {"train_loss": -9.94122314453125, "global_step": 121128, "epoch": 721} {"train_loss": -10.090956687927246, "global_step": 121129, "epoch": 721} {"train_loss": -9.943937301635742, "global_step": 121130, "epoch": 721} {"train_loss": -10.453341484069824, "global_step": 121131, "epoch": 721} {"train_loss": -10.117639541625977, "global_step": 121132, "epoch": 721} {"train_loss": -10.127391815185547, "global_step": 121133, "epoch": 721} {"train_loss": -10.133737564086914, "global_step": 121134, "epoch": 721} {"train_loss": -10.008125305175781, "global_step": 121135, "epoch": 721} {"train_loss": -10.247448921203613, "global_step": 121136, "epoch": 721} {"train_loss": -10.138657569885254, "global_step": 121137, "epoch": 721} {"train_loss": -10.206376075744629, "global_step": 121138, "epoch": 721} {"train_loss": -10.347976684570312, "global_step": 121139, "epoch": 721} {"train_loss": -10.013209342956543, "global_step": 121140, "epoch": 721} {"train_loss": -10.231245994567871, "global_step": 121141, "epoch": 721} {"train_loss": -10.121490478515625, "global_step": 121142, "epoch": 721} {"train_loss": -10.258089065551758, "global_step": 121143, "epoch": 721} {"train_loss": -10.181692123413086, "global_step": 121144, "epoch": 721} {"train_loss": -10.16899299621582, "global_step": 121145, "epoch": 721} {"train_loss": -10.15256404876709, "global_step": 121146, "epoch": 721} {"train_loss": -10.341907501220703, "global_step": 121147, "epoch": 721} {"train_loss": -10.009206771850586, "global_step": 121148, "epoch": 721} {"train_loss": -10.262954711914062, "global_step": 121149, "epoch": 721} {"train_loss": -10.437629699707031, "global_step": 121150, "epoch": 721} {"train_loss": -10.116653442382812, "global_step": 121151, "epoch": 721} {"train_loss": -10.272722244262695, "global_step": 121152, "epoch": 721} {"train_loss": -10.14605712890625, "global_step": 121153, "epoch": 721} {"train_loss": -10.132125854492188, "global_step": 121154, "epoch": 721} {"train_loss": -10.194206237792969, "global_step": 121155, "epoch": 721} {"train_loss": -10.225204467773438, "global_step": 121156, "epoch": 721} {"train_loss": -10.355798721313477, "global_step": 121157, "epoch": 721} {"train_loss": -9.852643966674805, "global_step": 121158, "epoch": 721} {"train_loss": -10.439750671386719, "global_step": 121159, "epoch": 721} {"train_loss": -9.803203582763672, "global_step": 121160, "epoch": 721} {"train_loss": -9.972414016723633, "global_step": 121161, "epoch": 721} {"train_loss": -10.323726654052734, "global_step": 121162, "epoch": 721} {"train_loss": -9.889974594116211, "global_step": 121163, "epoch": 721} {"train_loss": -10.096978187561035, "global_step": 121164, "epoch": 721} {"train_loss": -10.256175994873047, "global_step": 121165, "epoch": 721} {"train_loss": -10.038991928100586, "global_step": 121166, "epoch": 721} {"train_loss": -10.414647102355957, "global_step": 121167, "epoch": 721} {"train_loss": -10.116668701171875, "global_step": 121168, "epoch": 721} {"train_loss": -10.054563522338867, "global_step": 121169, "epoch": 721} {"train_loss": -10.203908920288086, "global_step": 121170, "epoch": 721} {"train_loss": -9.736411094665527, "global_step": 121171, "epoch": 721} {"train_loss": -10.273943901062012, "global_step": 121172, "epoch": 721} {"train_loss": -9.752941131591797, "global_step": 121173, "epoch": 721} {"train_loss": -9.660772323608398, "global_step": 121174, "epoch": 721} {"train_loss": -10.069957733154297, "global_step": 121175, "epoch": 721} {"train_loss": -10.11012077331543, "global_step": 121176, "epoch": 721} {"train_loss": -10.256216049194336, "global_step": 121177, "epoch": 721} {"train_loss": -9.996641159057617, "global_step": 121178, "epoch": 721} {"train_loss": -10.227335929870605, "global_step": 121179, "epoch": 721} {"train_loss": -9.997169494628906, "global_step": 121180, "epoch": 721} {"train_loss": -10.223140716552734, "global_step": 121181, "epoch": 721} {"train_loss": -9.975274085998535, "global_step": 121182, "epoch": 721} {"train_loss": -10.270292282104492, "global_step": 121183, "epoch": 721} {"train_loss": -10.10570240020752, "global_step": 121184, "epoch": 721} {"train_loss": -10.302563667297363, "global_step": 121185, "epoch": 721} {"train_loss": -10.432358741760254, "global_step": 121186, "epoch": 721} {"train_loss": -10.274311065673828, "global_step": 121187, "epoch": 721} {"train_loss": -9.848981857299805, "global_step": 121188, "epoch": 721} {"train_loss": -10.24350357055664, "global_step": 121189, "epoch": 721} {"train_loss": -10.258506774902344, "global_step": 121190, "epoch": 721} {"train_loss": -10.041608810424805, "global_step": 121191, "epoch": 721} {"train_loss": -10.307449340820312, "global_step": 121192, "epoch": 721} {"train_loss": -10.078300476074219, "global_step": 121193, "epoch": 721} {"train_loss": -10.023754119873047, "global_step": 121194, "epoch": 721} {"train_loss": -10.355315208435059, "global_step": 121195, "epoch": 721} {"train_loss": -10.246986389160156, "global_step": 121196, "epoch": 721} {"train_loss": -10.425243377685547, "global_step": 121197, "epoch": 721} {"train_loss": -10.245566368103027, "global_step": 121198, "epoch": 721} {"train_loss": -10.107881546020508, "global_step": 121199, "epoch": 721} {"train_loss": -10.236530303955078, "global_step": 121200, "epoch": 721} {"train_loss": -9.808744430541992, "global_step": 121201, "epoch": 721} {"train_loss": -10.284709930419922, "global_step": 121202, "epoch": 721} {"train_loss": -9.891844749450684, "global_step": 121203, "epoch": 721} {"train_loss": -9.647296905517578, "global_step": 121204, "epoch": 721} {"train_loss": -9.163741111755371, "global_step": 121205, "epoch": 721} {"train_loss": -9.654569625854492, "global_step": 121206, "epoch": 721} {"train_loss": -9.772581100463867, "global_step": 121207, "epoch": 721} {"train_loss": -10.050312042236328, "global_step": 121208, "epoch": 721} {"train_loss": -9.67271614074707, "global_step": 121209, "epoch": 721} {"train_loss": -9.951957702636719, "global_step": 121210, "epoch": 721} {"train_loss": -10.081069946289062, "global_step": 121211, "epoch": 721} {"train_loss": -9.83125114440918, "global_step": 121212, "epoch": 721} {"train_loss": -9.956613540649414, "global_step": 121213, "epoch": 721} {"train_loss": -9.887006759643555, "global_step": 121214, "epoch": 721} {"train_loss": -10.121862411499023, "global_step": 121215, "epoch": 721} {"train_loss": -10.258131980895996, "global_step": 121216, "epoch": 721} {"train_loss": -10.093343734741211, "global_step": 121217, "epoch": 721} {"train_loss": -9.969874382019043, "global_step": 121218, "epoch": 721} {"train_loss": -10.164314270019531, "global_step": 121219, "epoch": 721} {"train_loss": -10.239294052124023, "global_step": 121220, "epoch": 721} {"train_loss": -10.229124069213867, "global_step": 121221, "epoch": 721} {"train_loss": -10.216816902160645, "global_step": 121222, "epoch": 721} {"train_loss": -10.033885955810547, "global_step": 121223, "epoch": 721} {"train_loss": -10.214176177978516, "global_step": 121224, "epoch": 721} {"train_loss": -10.306105613708496, "global_step": 121225, "epoch": 721} {"train_loss": -9.771652221679688, "global_step": 121226, "epoch": 721} {"train_loss": -10.24740219116211, "global_step": 121227, "epoch": 721} {"train_loss": -10.266094207763672, "global_step": 121228, "epoch": 721} {"train_loss": -10.074258804321289, "global_step": 121229, "epoch": 721} {"train_loss": -10.28624153137207, "global_step": 121230, "epoch": 721} {"train_loss": -10.28443717956543, "global_step": 121231, "epoch": 721} {"train_loss": -10.351554870605469, "global_step": 121232, "epoch": 721} {"train_loss": -10.265525817871094, "global_step": 121233, "epoch": 721} {"train_loss": -10.235183715820312, "global_step": 121234, "epoch": 721} {"train_loss": -10.25650691986084, "global_step": 121235, "epoch": 721} {"train_loss": -10.166876792907715, "global_step": 121236, "epoch": 721} {"train_loss": -10.050408363342285, "global_step": 121237, "epoch": 721} {"train_loss": -10.531002044677734, "global_step": 121238, "epoch": 721} {"train_loss": -10.081991195678711, "global_step": 121239, "epoch": 721} {"train_loss": -10.115732192993164, "global_step": 121240, "epoch": 721} {"train_loss": -10.24582290649414, "global_step": 121241, "epoch": 721} {"train_loss": -10.23228645324707, "global_step": 121242, "epoch": 721} {"train_loss": -10.170597076416016, "global_step": 121243, "epoch": 721} {"train_loss": -10.180231094360352, "global_step": 121244, "epoch": 721} {"train_loss": -10.051606178283691, "global_step": 121245, "epoch": 721} {"train_loss": -9.914152145385742, "global_step": 121246, "epoch": 721} {"train_loss": -10.197732925415039, "global_step": 121247, "epoch": 721} {"train_loss": -10.271900177001953, "global_step": 121248, "epoch": 721} {"train_loss": -10.280658721923828, "global_step": 121249, "epoch": 721} {"train_loss": -10.076663970947266, "global_step": 121250, "epoch": 721} {"train_loss": -10.407659530639648, "global_step": 121251, "epoch": 721} {"train_loss": -10.050477027893066, "global_step": 121252, "epoch": 721} {"train_loss": -10.184188842773438, "global_step": 121253, "epoch": 721} {"train_loss": -9.90922737121582, "global_step": 121254, "epoch": 721} {"train_loss": -10.283551216125488, "global_step": 121255, "epoch": 721} {"train_loss": -10.066211700439453, "global_step": 121256, "epoch": 721} {"train_loss": -10.332486152648926, "global_step": 121257, "epoch": 721} {"train_loss": -10.356220245361328, "global_step": 121258, "epoch": 721} {"train_loss": -10.135151863098145, "global_step": 121259, "epoch": 721} {"train_loss": -10.163561820983887, "global_step": 121260, "epoch": 721} {"train_loss": -10.277966499328613, "global_step": 121261, "epoch": 721} {"train_loss": -10.117752075195312, "global_step": 121262, "epoch": 721} {"train_loss": -10.272586822509766, "global_step": 121263, "epoch": 721} {"train_loss": -9.988388061523438, "global_step": 121264, "epoch": 721} {"train_loss": -10.202030181884766, "global_step": 121265, "epoch": 721} {"train_loss": -9.840693473815918, "global_step": 121266, "epoch": 721} {"train_loss": -10.378438949584961, "global_step": 121267, "epoch": 721} {"train_loss": -10.219071388244629, "global_step": 121268, "epoch": 721} {"train_loss": -10.219697952270508, "global_step": 121269, "epoch": 721} {"train_loss": -9.881854057312012, "global_step": 121270, "epoch": 721} {"train_loss": -10.1559476852417, "global_step": 121271, "epoch": 721} {"train_loss": -10.116067886352539, "global_step": 121272, "epoch": 721} {"train_loss": -10.034518241882324, "global_step": 121273, "epoch": 721} {"train_loss": -10.045055389404297, "global_step": 121274, "epoch": 721} {"train_loss": -10.207253456115723, "global_step": 121275, "epoch": 721} {"train_loss": -10.147218704223633, "global_step": 121276, "epoch": 721} {"train_loss": -10.069385528564453, "global_step": 121277, "epoch": 721} {"train_loss": -10.110936164855957, "global_step": 121278, "epoch": 721} {"train_loss": -10.048688888549805, "global_step": 121279, "epoch": 721} {"train_loss": -10.129987716674805, "global_step": 121280, "epoch": 721} {"train_loss": -10.034719467163086, "global_step": 121281, "epoch": 721} {"train_loss": -10.153600692749023, "global_step": 121282, "epoch": 721} {"train_loss": -10.06051254272461, "global_step": 121283, "epoch": 721} {"train_loss": -10.203991889953613, "global_step": 121284, "epoch": 721} {"train_loss": -10.132308006286621, "global_step": 121285, "epoch": 721} {"train_loss": -10.161545753479004, "global_step": 121286, "epoch": 721} {"train_loss": -9.843883514404297, "global_step": 121287, "epoch": 721} {"train_loss": -10.006114959716797, "global_step": 121288, "epoch": 721} {"train_loss": -10.348864555358887, "global_step": 121289, "epoch": 721} {"train_loss": -9.893375396728516, "global_step": 121290, "epoch": 721} {"train_loss": -10.170502662658691, "global_step": 121291, "epoch": 721} {"train_loss": -9.486687660217285, "global_step": 121292, "epoch": 721} {"train_loss": -10.138101577758789, "global_step": 121293, "epoch": 721} {"train_loss": -9.759590148925781, "global_step": 121294, "epoch": 721} {"train_loss": -10.112776722226824, "global_step": 121295, "epoch": 721, "val_loss": 216123.796875} {"train_loss": -9.968399047851562, "global_step": 121296, "epoch": 722} {"train_loss": -9.577651977539062, "global_step": 121297, "epoch": 722} {"train_loss": -10.214309692382812, "global_step": 121298, "epoch": 722} {"train_loss": -9.828204154968262, "global_step": 121299, "epoch": 722} {"train_loss": -9.527228355407715, "global_step": 121300, "epoch": 722} {"train_loss": -9.966530799865723, "global_step": 121301, "epoch": 722} {"train_loss": -9.969371795654297, "global_step": 121302, "epoch": 722} {"train_loss": -9.444070816040039, "global_step": 121303, "epoch": 722} {"train_loss": -10.214118003845215, "global_step": 121304, "epoch": 722} {"train_loss": -9.958735466003418, "global_step": 121305, "epoch": 722} {"train_loss": -9.828551292419434, "global_step": 121306, "epoch": 722} {"train_loss": -9.935565948486328, "global_step": 121307, "epoch": 722} {"train_loss": -10.181474685668945, "global_step": 121308, "epoch": 722} {"train_loss": -10.01402473449707, "global_step": 121309, "epoch": 722} {"train_loss": -10.228996276855469, "global_step": 121310, "epoch": 722} {"train_loss": -10.06014347076416, "global_step": 121311, "epoch": 722} {"train_loss": -10.28495979309082, "global_step": 121312, "epoch": 722} {"train_loss": -10.355728149414062, "global_step": 121313, "epoch": 722} {"train_loss": -10.116816520690918, "global_step": 121314, "epoch": 722} {"train_loss": -10.290010452270508, "global_step": 121315, "epoch": 722} {"train_loss": -10.22372817993164, "global_step": 121316, "epoch": 722} {"train_loss": -10.275348663330078, "global_step": 121317, "epoch": 722} {"train_loss": -10.457490921020508, "global_step": 121318, "epoch": 722} {"train_loss": -10.312562942504883, "global_step": 121319, "epoch": 722} {"train_loss": -10.313576698303223, "global_step": 121320, "epoch": 722} {"train_loss": -10.296011924743652, "global_step": 121321, "epoch": 722} {"train_loss": -10.150028228759766, "global_step": 121322, "epoch": 722} {"train_loss": -10.34592056274414, "global_step": 121323, "epoch": 722} {"train_loss": -10.354373931884766, "global_step": 121324, "epoch": 722} {"train_loss": -10.220976829528809, "global_step": 121325, "epoch": 722} {"train_loss": -10.317009925842285, "global_step": 121326, "epoch": 722} {"train_loss": -10.27457046508789, "global_step": 121327, "epoch": 722} {"train_loss": -10.448249816894531, "global_step": 121328, "epoch": 722} {"train_loss": -10.510481834411621, "global_step": 121329, "epoch": 722} {"train_loss": -10.266658782958984, "global_step": 121330, "epoch": 722} {"train_loss": -10.445504188537598, "global_step": 121331, "epoch": 722} {"train_loss": -10.203280448913574, "global_step": 121332, "epoch": 722} {"train_loss": -10.575603485107422, "global_step": 121333, "epoch": 722} {"train_loss": -10.24157428741455, "global_step": 121334, "epoch": 722} {"train_loss": -10.448923110961914, "global_step": 121335, "epoch": 722} {"train_loss": -10.464723587036133, "global_step": 121336, "epoch": 722} {"train_loss": -10.368669509887695, "global_step": 121337, "epoch": 722} {"train_loss": -10.546164512634277, "global_step": 121338, "epoch": 722} {"train_loss": -10.36799430847168, "global_step": 121339, "epoch": 722} {"train_loss": -10.362786293029785, "global_step": 121340, "epoch": 722} {"train_loss": -10.279119491577148, "global_step": 121341, "epoch": 722} {"train_loss": -10.528507232666016, "global_step": 121342, "epoch": 722} {"train_loss": -10.598705291748047, "global_step": 121343, "epoch": 722} {"train_loss": -10.440069198608398, "global_step": 121344, "epoch": 722} {"train_loss": -10.508282661437988, "global_step": 121345, "epoch": 722} {"train_loss": -10.297552108764648, "global_step": 121346, "epoch": 722} {"train_loss": -10.090599060058594, "global_step": 121347, "epoch": 722} {"train_loss": -10.531075477600098, "global_step": 121348, "epoch": 722} {"train_loss": -9.778545379638672, "global_step": 121349, "epoch": 722} {"train_loss": -10.546210289001465, "global_step": 121350, "epoch": 722} {"train_loss": -10.509160995483398, "global_step": 121351, "epoch": 722} {"train_loss": -10.430234909057617, "global_step": 121352, "epoch": 722} {"train_loss": -9.913661003112793, "global_step": 121353, "epoch": 722} {"train_loss": -10.560920715332031, "global_step": 121354, "epoch": 722} {"train_loss": -10.139900207519531, "global_step": 121355, "epoch": 722} {"train_loss": -9.898075103759766, "global_step": 121356, "epoch": 722} {"train_loss": -9.23377513885498, "global_step": 121357, "epoch": 722} {"train_loss": -9.48594856262207, "global_step": 121358, "epoch": 722} {"train_loss": -9.231801986694336, "global_step": 121359, "epoch": 722} {"train_loss": -9.6397705078125, "global_step": 121360, "epoch": 722} {"train_loss": -9.713272094726562, "global_step": 121361, "epoch": 722} {"train_loss": -9.277166366577148, "global_step": 121362, "epoch": 722} {"train_loss": -10.332256317138672, "global_step": 121363, "epoch": 722} {"train_loss": -9.087770462036133, "global_step": 121364, "epoch": 722} {"train_loss": -9.694392204284668, "global_step": 121365, "epoch": 722} {"train_loss": -9.02410888671875, "global_step": 121366, "epoch": 722} {"train_loss": -10.06611442565918, "global_step": 121367, "epoch": 722} {"train_loss": -9.054553031921387, "global_step": 121368, "epoch": 722} {"train_loss": -9.856438636779785, "global_step": 121369, "epoch": 722} {"train_loss": -9.120367050170898, "global_step": 121370, "epoch": 722} {"train_loss": -8.980218887329102, "global_step": 121371, "epoch": 722} {"train_loss": -9.508270263671875, "global_step": 121372, "epoch": 722} {"train_loss": -9.520944595336914, "global_step": 121373, "epoch": 722} {"train_loss": -9.64210319519043, "global_step": 121374, "epoch": 722} {"train_loss": -9.62606143951416, "global_step": 121375, "epoch": 722} {"train_loss": -9.397924423217773, "global_step": 121376, "epoch": 722} {"train_loss": -9.75197982788086, "global_step": 121377, "epoch": 722} {"train_loss": -9.64069938659668, "global_step": 121378, "epoch": 722} {"train_loss": -9.818888664245605, "global_step": 121379, "epoch": 722} {"train_loss": -9.519364356994629, "global_step": 121380, "epoch": 722} {"train_loss": -9.789194107055664, "global_step": 121381, "epoch": 722} {"train_loss": -9.683221817016602, "global_step": 121382, "epoch": 722} {"train_loss": -9.870174407958984, "global_step": 121383, "epoch": 722} {"train_loss": -10.074918746948242, "global_step": 121384, "epoch": 722} {"train_loss": -9.86392593383789, "global_step": 121385, "epoch": 722} {"train_loss": -9.877857208251953, "global_step": 121386, "epoch": 722} {"train_loss": -10.105411529541016, "global_step": 121387, "epoch": 722} {"train_loss": -10.040806770324707, "global_step": 121388, "epoch": 722} {"train_loss": -9.97669792175293, "global_step": 121389, "epoch": 722} {"train_loss": -10.134842872619629, "global_step": 121390, "epoch": 722} {"train_loss": -10.09764575958252, "global_step": 121391, "epoch": 722} {"train_loss": -10.2574462890625, "global_step": 121392, "epoch": 722} {"train_loss": -9.613723754882812, "global_step": 121393, "epoch": 722} {"train_loss": -9.897516250610352, "global_step": 121394, "epoch": 722} {"train_loss": -10.231829643249512, "global_step": 121395, "epoch": 722} {"train_loss": -10.130453109741211, "global_step": 121396, "epoch": 722} {"train_loss": -10.179847717285156, "global_step": 121397, "epoch": 722} {"train_loss": -10.394997596740723, "global_step": 121398, "epoch": 722} {"train_loss": -10.090719223022461, "global_step": 121399, "epoch": 722} {"train_loss": -9.997610092163086, "global_step": 121400, "epoch": 722} {"train_loss": -10.184881210327148, "global_step": 121401, "epoch": 722} {"train_loss": -10.21199893951416, "global_step": 121402, "epoch": 722} {"train_loss": -10.189379692077637, "global_step": 121403, "epoch": 722} {"train_loss": -10.219019889831543, "global_step": 121404, "epoch": 722} {"train_loss": -10.28685188293457, "global_step": 121405, "epoch": 722} {"train_loss": -9.980348587036133, "global_step": 121406, "epoch": 722} {"train_loss": -10.184804916381836, "global_step": 121407, "epoch": 722} {"train_loss": -10.187332153320312, "global_step": 121408, "epoch": 722} {"train_loss": -10.231239318847656, "global_step": 121409, "epoch": 722} {"train_loss": -10.401649475097656, "global_step": 121410, "epoch": 722} {"train_loss": -10.14516830444336, "global_step": 121411, "epoch": 722} {"train_loss": -10.104363441467285, "global_step": 121412, "epoch": 722} {"train_loss": -10.244937896728516, "global_step": 121413, "epoch": 722} {"train_loss": -9.970587730407715, "global_step": 121414, "epoch": 722} {"train_loss": -10.100757598876953, "global_step": 121415, "epoch": 722} {"train_loss": -10.21146297454834, "global_step": 121416, "epoch": 722} {"train_loss": -10.14492416381836, "global_step": 121417, "epoch": 722} {"train_loss": -10.004436492919922, "global_step": 121418, "epoch": 722} {"train_loss": -10.235782623291016, "global_step": 121419, "epoch": 722} {"train_loss": -10.058206558227539, "global_step": 121420, "epoch": 722} {"train_loss": -9.871114730834961, "global_step": 121421, "epoch": 722} {"train_loss": -9.960458755493164, "global_step": 121422, "epoch": 722} {"train_loss": -10.324326515197754, "global_step": 121423, "epoch": 722} {"train_loss": -10.077085494995117, "global_step": 121424, "epoch": 722} {"train_loss": -10.08504581451416, "global_step": 121425, "epoch": 722} {"train_loss": -10.180797576904297, "global_step": 121426, "epoch": 722} {"train_loss": -10.1548490524292, "global_step": 121427, "epoch": 722} {"train_loss": -10.18867301940918, "global_step": 121428, "epoch": 722} {"train_loss": -9.990116119384766, "global_step": 121429, "epoch": 722} {"train_loss": -10.513564109802246, "global_step": 121430, "epoch": 722} {"train_loss": -10.041162490844727, "global_step": 121431, "epoch": 722} {"train_loss": -10.258427619934082, "global_step": 121432, "epoch": 722} {"train_loss": -10.355424880981445, "global_step": 121433, "epoch": 722} {"train_loss": -10.247551918029785, "global_step": 121434, "epoch": 722} {"train_loss": -10.290064811706543, "global_step": 121435, "epoch": 722} {"train_loss": -10.292449951171875, "global_step": 121436, "epoch": 722} {"train_loss": -10.309403419494629, "global_step": 121437, "epoch": 722} {"train_loss": -10.087472915649414, "global_step": 121438, "epoch": 722} {"train_loss": -10.199365615844727, "global_step": 121439, "epoch": 722} {"train_loss": -9.73239517211914, "global_step": 121440, "epoch": 722} {"train_loss": -9.985505104064941, "global_step": 121441, "epoch": 722} {"train_loss": -10.13248062133789, "global_step": 121442, "epoch": 722} {"train_loss": -9.582408905029297, "global_step": 121443, "epoch": 722} {"train_loss": -10.09145736694336, "global_step": 121444, "epoch": 722} {"train_loss": -9.839967727661133, "global_step": 121445, "epoch": 722} {"train_loss": -9.686092376708984, "global_step": 121446, "epoch": 722} {"train_loss": -10.20366096496582, "global_step": 121447, "epoch": 722} {"train_loss": -9.877716064453125, "global_step": 121448, "epoch": 722} {"train_loss": -9.635722160339355, "global_step": 121449, "epoch": 722} {"train_loss": -10.32162094116211, "global_step": 121450, "epoch": 722} {"train_loss": -9.647378921508789, "global_step": 121451, "epoch": 722} {"train_loss": -9.727241516113281, "global_step": 121452, "epoch": 722} {"train_loss": -9.92121696472168, "global_step": 121453, "epoch": 722} {"train_loss": -9.945556640625, "global_step": 121454, "epoch": 722} {"train_loss": -9.859823226928711, "global_step": 121455, "epoch": 722} {"train_loss": -9.943822860717773, "global_step": 121456, "epoch": 722} {"train_loss": -9.880151748657227, "global_step": 121457, "epoch": 722} {"train_loss": -9.898944854736328, "global_step": 121458, "epoch": 722} {"train_loss": -9.695724487304688, "global_step": 121459, "epoch": 722} {"train_loss": -10.091190338134766, "global_step": 121460, "epoch": 722} {"train_loss": -10.176061630249023, "global_step": 121461, "epoch": 722} {"train_loss": -10.142929077148438, "global_step": 121462, "epoch": 722} {"train_loss": -10.042157553491139, "global_step": 121463, "epoch": 722, "val_loss": 214280.296875} {"train_loss": -9.977420806884766, "global_step": 121464, "epoch": 723} {"train_loss": -10.324026107788086, "global_step": 121465, "epoch": 723} {"train_loss": -10.400228500366211, "global_step": 121466, "epoch": 723} {"train_loss": -9.84600830078125, "global_step": 121467, "epoch": 723} {"train_loss": -10.182626724243164, "global_step": 121468, "epoch": 723} {"train_loss": -10.265251159667969, "global_step": 121469, "epoch": 723} {"train_loss": -10.271955490112305, "global_step": 121470, "epoch": 723} {"train_loss": -10.085466384887695, "global_step": 121471, "epoch": 723} {"train_loss": -10.168169021606445, "global_step": 121472, "epoch": 723} {"train_loss": -10.049968719482422, "global_step": 121473, "epoch": 723} {"train_loss": -10.439776420593262, "global_step": 121474, "epoch": 723} {"train_loss": -10.196504592895508, "global_step": 121475, "epoch": 723} {"train_loss": -10.29124641418457, "global_step": 121476, "epoch": 723} {"train_loss": -10.206123352050781, "global_step": 121477, "epoch": 723} {"train_loss": -10.410074234008789, "global_step": 121478, "epoch": 723} {"train_loss": -10.188910484313965, "global_step": 121479, "epoch": 723} {"train_loss": -10.276151657104492, "global_step": 121480, "epoch": 723} {"train_loss": -10.205829620361328, "global_step": 121481, "epoch": 723} {"train_loss": -10.00893783569336, "global_step": 121482, "epoch": 723} {"train_loss": -10.3192777633667, "global_step": 121483, "epoch": 723} {"train_loss": -10.426860809326172, "global_step": 121484, "epoch": 723} {"train_loss": -10.48033618927002, "global_step": 121485, "epoch": 723} {"train_loss": -10.29703140258789, "global_step": 121486, "epoch": 723} {"train_loss": -10.418182373046875, "global_step": 121487, "epoch": 723} {"train_loss": -10.330522537231445, "global_step": 121488, "epoch": 723} {"train_loss": -10.175519943237305, "global_step": 121489, "epoch": 723} {"train_loss": -10.081452369689941, "global_step": 121490, "epoch": 723} {"train_loss": -9.730488777160645, "global_step": 121491, "epoch": 723} {"train_loss": -10.465755462646484, "global_step": 121492, "epoch": 723} {"train_loss": -10.366497039794922, "global_step": 121493, "epoch": 723} {"train_loss": -10.207115173339844, "global_step": 121494, "epoch": 723} {"train_loss": -10.076457023620605, "global_step": 121495, "epoch": 723} {"train_loss": -10.172005653381348, "global_step": 121496, "epoch": 723} {"train_loss": -10.019277572631836, "global_step": 121497, "epoch": 723} {"train_loss": -10.081178665161133, "global_step": 121498, "epoch": 723} {"train_loss": -10.277894973754883, "global_step": 121499, "epoch": 723} {"train_loss": -9.99428939819336, "global_step": 121500, "epoch": 723} {"train_loss": -9.920745849609375, "global_step": 121501, "epoch": 723} {"train_loss": -10.287569046020508, "global_step": 121502, "epoch": 723} {"train_loss": -10.480993270874023, "global_step": 121503, "epoch": 723} {"train_loss": -10.551973342895508, "global_step": 121504, "epoch": 723} {"train_loss": -10.322668075561523, "global_step": 121505, "epoch": 723} {"train_loss": -10.415590286254883, "global_step": 121506, "epoch": 723} {"train_loss": -10.33430290222168, "global_step": 121507, "epoch": 723} {"train_loss": -10.61981201171875, "global_step": 121508, "epoch": 723} {"train_loss": -10.398566246032715, "global_step": 121509, "epoch": 723} {"train_loss": -10.529914855957031, "global_step": 121510, "epoch": 723} {"train_loss": -10.418121337890625, "global_step": 121511, "epoch": 723} {"train_loss": -9.996334075927734, "global_step": 121512, "epoch": 723} {"train_loss": -10.342578887939453, "global_step": 121513, "epoch": 723} {"train_loss": -10.21124267578125, "global_step": 121514, "epoch": 723} {"train_loss": -10.263312339782715, "global_step": 121515, "epoch": 723} {"train_loss": -10.478935241699219, "global_step": 121516, "epoch": 723} {"train_loss": -10.151630401611328, "global_step": 121517, "epoch": 723} {"train_loss": -9.993942260742188, "global_step": 121518, "epoch": 723} {"train_loss": -10.276729583740234, "global_step": 121519, "epoch": 723} {"train_loss": -10.245565414428711, "global_step": 121520, "epoch": 723} {"train_loss": -10.199899673461914, "global_step": 121521, "epoch": 723} {"train_loss": -10.062186241149902, "global_step": 121522, "epoch": 723} {"train_loss": -9.961073875427246, "global_step": 121523, "epoch": 723} {"train_loss": -10.141439437866211, "global_step": 121524, "epoch": 723} {"train_loss": -10.100637435913086, "global_step": 121525, "epoch": 723} {"train_loss": -10.05541706085205, "global_step": 121526, "epoch": 723} {"train_loss": -10.141559600830078, "global_step": 121527, "epoch": 723} {"train_loss": -10.07176399230957, "global_step": 121528, "epoch": 723} {"train_loss": -9.532212257385254, "global_step": 121529, "epoch": 723} {"train_loss": -10.222116470336914, "global_step": 121530, "epoch": 723} {"train_loss": -10.24901008605957, "global_step": 121531, "epoch": 723} {"train_loss": -9.563949584960938, "global_step": 121532, "epoch": 723} {"train_loss": -10.333229064941406, "global_step": 121533, "epoch": 723} {"train_loss": -9.30046558380127, "global_step": 121534, "epoch": 723} {"train_loss": -10.003633499145508, "global_step": 121535, "epoch": 723} {"train_loss": -10.18320083618164, "global_step": 121536, "epoch": 723} {"train_loss": -10.018871307373047, "global_step": 121537, "epoch": 723} {"train_loss": -10.153165817260742, "global_step": 121538, "epoch": 723} {"train_loss": -9.948420524597168, "global_step": 121539, "epoch": 723} {"train_loss": -10.010967254638672, "global_step": 121540, "epoch": 723} {"train_loss": -9.845381736755371, "global_step": 121541, "epoch": 723} {"train_loss": -9.879493713378906, "global_step": 121542, "epoch": 723} {"train_loss": -10.090426445007324, "global_step": 121543, "epoch": 723} {"train_loss": -9.890892028808594, "global_step": 121544, "epoch": 723} {"train_loss": -9.968931198120117, "global_step": 121545, "epoch": 723} {"train_loss": -9.956486701965332, "global_step": 121546, "epoch": 723} {"train_loss": -10.057218551635742, "global_step": 121547, "epoch": 723} {"train_loss": -10.188196182250977, "global_step": 121548, "epoch": 723} {"train_loss": -10.191018104553223, "global_step": 121549, "epoch": 723} {"train_loss": -9.795707702636719, "global_step": 121550, "epoch": 723} {"train_loss": -10.08781623840332, "global_step": 121551, "epoch": 723} {"train_loss": -9.685644149780273, "global_step": 121552, "epoch": 723} {"train_loss": -10.290670394897461, "global_step": 121553, "epoch": 723} {"train_loss": -9.879732131958008, "global_step": 121554, "epoch": 723} {"train_loss": -10.201913833618164, "global_step": 121555, "epoch": 723} {"train_loss": -9.717561721801758, "global_step": 121556, "epoch": 723} {"train_loss": -10.200480461120605, "global_step": 121557, "epoch": 723} {"train_loss": -10.03219223022461, "global_step": 121558, "epoch": 723} {"train_loss": -10.154993057250977, "global_step": 121559, "epoch": 723} {"train_loss": -9.852021217346191, "global_step": 121560, "epoch": 723} {"train_loss": -10.137290954589844, "global_step": 121561, "epoch": 723} {"train_loss": -10.081506729125977, "global_step": 121562, "epoch": 723} {"train_loss": -9.90677261352539, "global_step": 121563, "epoch": 723} {"train_loss": -10.272348403930664, "global_step": 121564, "epoch": 723} {"train_loss": -10.178487777709961, "global_step": 121565, "epoch": 723} {"train_loss": -10.30360221862793, "global_step": 121566, "epoch": 723} {"train_loss": -9.837458610534668, "global_step": 121567, "epoch": 723} {"train_loss": -10.375473976135254, "global_step": 121568, "epoch": 723} {"train_loss": -10.05446720123291, "global_step": 121569, "epoch": 723} {"train_loss": -10.09542179107666, "global_step": 121570, "epoch": 723} {"train_loss": -10.213187217712402, "global_step": 121571, "epoch": 723} {"train_loss": -10.120290756225586, "global_step": 121572, "epoch": 723} {"train_loss": -10.075830459594727, "global_step": 121573, "epoch": 723} {"train_loss": -10.18681526184082, "global_step": 121574, "epoch": 723} {"train_loss": -9.954621315002441, "global_step": 121575, "epoch": 723} {"train_loss": -10.415412902832031, "global_step": 121576, "epoch": 723} {"train_loss": -10.023062705993652, "global_step": 121577, "epoch": 723} {"train_loss": -10.4064359664917, "global_step": 121578, "epoch": 723} {"train_loss": -10.032764434814453, "global_step": 121579, "epoch": 723} {"train_loss": -10.001819610595703, "global_step": 121580, "epoch": 723} {"train_loss": -10.186655044555664, "global_step": 121581, "epoch": 723} {"train_loss": -9.799415588378906, "global_step": 121582, "epoch": 723} {"train_loss": -10.186332702636719, "global_step": 121583, "epoch": 723} {"train_loss": -10.234025955200195, "global_step": 121584, "epoch": 723} {"train_loss": -10.071680068969727, "global_step": 121585, "epoch": 723} {"train_loss": -10.124910354614258, "global_step": 121586, "epoch": 723} {"train_loss": -10.192544937133789, "global_step": 121587, "epoch": 723} {"train_loss": -10.153940200805664, "global_step": 121588, "epoch": 723} {"train_loss": -10.243545532226562, "global_step": 121589, "epoch": 723} {"train_loss": -10.064454078674316, "global_step": 121590, "epoch": 723} {"train_loss": -10.289595603942871, "global_step": 121591, "epoch": 723} {"train_loss": -10.016427993774414, "global_step": 121592, "epoch": 723} {"train_loss": -9.94776439666748, "global_step": 121593, "epoch": 723} {"train_loss": -10.4467134475708, "global_step": 121594, "epoch": 723} {"train_loss": -10.144665718078613, "global_step": 121595, "epoch": 723} {"train_loss": -10.053686141967773, "global_step": 121596, "epoch": 723} {"train_loss": -10.258524894714355, "global_step": 121597, "epoch": 723} {"train_loss": -10.08508586883545, "global_step": 121598, "epoch": 723} {"train_loss": -10.500764846801758, "global_step": 121599, "epoch": 723} {"train_loss": -10.180038452148438, "global_step": 121600, "epoch": 723} {"train_loss": -10.10336685180664, "global_step": 121601, "epoch": 723} {"train_loss": -9.843875885009766, "global_step": 121602, "epoch": 723} {"train_loss": -10.16191291809082, "global_step": 121603, "epoch": 723} {"train_loss": -10.357088088989258, "global_step": 121604, "epoch": 723} {"train_loss": -10.029372215270996, "global_step": 121605, "epoch": 723} {"train_loss": -10.30766487121582, "global_step": 121606, "epoch": 723} {"train_loss": -9.814976692199707, "global_step": 121607, "epoch": 723} {"train_loss": -9.976231575012207, "global_step": 121608, "epoch": 723} {"train_loss": -10.030921936035156, "global_step": 121609, "epoch": 723} {"train_loss": -9.9744291305542, "global_step": 121610, "epoch": 723} {"train_loss": -10.273059844970703, "global_step": 121611, "epoch": 723} {"train_loss": -9.631487846374512, "global_step": 121612, "epoch": 723} {"train_loss": -9.968278884887695, "global_step": 121613, "epoch": 723} {"train_loss": -9.82621955871582, "global_step": 121614, "epoch": 723} {"train_loss": -9.936774253845215, "global_step": 121615, "epoch": 723} {"train_loss": -10.22003173828125, "global_step": 121616, "epoch": 723} {"train_loss": -10.067508697509766, "global_step": 121617, "epoch": 723} {"train_loss": -10.367145538330078, "global_step": 121618, "epoch": 723} {"train_loss": -10.304386138916016, "global_step": 121619, "epoch": 723} {"train_loss": -10.463403701782227, "global_step": 121620, "epoch": 723} {"train_loss": -10.344376564025879, "global_step": 121621, "epoch": 723} {"train_loss": -10.305017471313477, "global_step": 121622, "epoch": 723} {"train_loss": -10.091053009033203, "global_step": 121623, "epoch": 723} {"train_loss": -10.43203067779541, "global_step": 121624, "epoch": 723} {"train_loss": -10.327778816223145, "global_step": 121625, "epoch": 723} {"train_loss": -10.274665832519531, "global_step": 121626, "epoch": 723} {"train_loss": -10.290596008300781, "global_step": 121627, "epoch": 723} {"train_loss": -10.480353355407715, "global_step": 121628, "epoch": 723} {"train_loss": -10.327753067016602, "global_step": 121629, "epoch": 723} {"train_loss": -10.152195930480957, "global_step": 121630, "epoch": 723} {"train_loss": -10.147977993601845, "global_step": 121631, "epoch": 723, "val_loss": 214989.84375} {"train_loss": -9.976062774658203, "global_step": 121632, "epoch": 724} {"train_loss": -10.512195587158203, "global_step": 121633, "epoch": 724} {"train_loss": -10.244385719299316, "global_step": 121634, "epoch": 724} {"train_loss": -10.229089736938477, "global_step": 121635, "epoch": 724} {"train_loss": -10.340225219726562, "global_step": 121636, "epoch": 724} {"train_loss": -9.66774845123291, "global_step": 121637, "epoch": 724} {"train_loss": -10.173583984375, "global_step": 121638, "epoch": 724} {"train_loss": -9.875253677368164, "global_step": 121639, "epoch": 724} {"train_loss": -9.828039169311523, "global_step": 121640, "epoch": 724} {"train_loss": -9.929282188415527, "global_step": 121641, "epoch": 724} {"train_loss": -10.109676361083984, "global_step": 121642, "epoch": 724} {"train_loss": -10.088224411010742, "global_step": 121643, "epoch": 724} {"train_loss": -9.925792694091797, "global_step": 121644, "epoch": 724} {"train_loss": -10.270917892456055, "global_step": 121645, "epoch": 724} {"train_loss": -10.323620796203613, "global_step": 121646, "epoch": 724} {"train_loss": -9.922910690307617, "global_step": 121647, "epoch": 724} {"train_loss": -10.198685646057129, "global_step": 121648, "epoch": 724} {"train_loss": -10.057125091552734, "global_step": 121649, "epoch": 724} {"train_loss": -10.23602294921875, "global_step": 121650, "epoch": 724} {"train_loss": -10.058819770812988, "global_step": 121651, "epoch": 724} {"train_loss": -10.139278411865234, "global_step": 121652, "epoch": 724} {"train_loss": -10.065643310546875, "global_step": 121653, "epoch": 724} {"train_loss": -9.94301986694336, "global_step": 121654, "epoch": 724} {"train_loss": -10.518388748168945, "global_step": 121655, "epoch": 724} {"train_loss": -9.878253936767578, "global_step": 121656, "epoch": 724} {"train_loss": -10.15905475616455, "global_step": 121657, "epoch": 724} {"train_loss": -9.995925903320312, "global_step": 121658, "epoch": 724} {"train_loss": -9.649532318115234, "global_step": 121659, "epoch": 724} {"train_loss": -10.226033210754395, "global_step": 121660, "epoch": 724} {"train_loss": -10.127012252807617, "global_step": 121661, "epoch": 724} {"train_loss": -10.329524993896484, "global_step": 121662, "epoch": 724} {"train_loss": -10.50700855255127, "global_step": 121663, "epoch": 724} {"train_loss": -10.257166862487793, "global_step": 121664, "epoch": 724} {"train_loss": -10.139507293701172, "global_step": 121665, "epoch": 724} {"train_loss": -10.326700210571289, "global_step": 121666, "epoch": 724} {"train_loss": -10.258539199829102, "global_step": 121667, "epoch": 724} {"train_loss": -9.959640502929688, "global_step": 121668, "epoch": 724} {"train_loss": -10.155843734741211, "global_step": 121669, "epoch": 724} {"train_loss": -10.143291473388672, "global_step": 121670, "epoch": 724} {"train_loss": -10.093058586120605, "global_step": 121671, "epoch": 724} {"train_loss": -10.128128051757812, "global_step": 121672, "epoch": 724} {"train_loss": -10.427395820617676, "global_step": 121673, "epoch": 724} {"train_loss": -10.151151657104492, "global_step": 121674, "epoch": 724} {"train_loss": -10.502386093139648, "global_step": 121675, "epoch": 724} {"train_loss": -10.337632179260254, "global_step": 121676, "epoch": 724} {"train_loss": -10.236303329467773, "global_step": 121677, "epoch": 724} {"train_loss": -10.343830108642578, "global_step": 121678, "epoch": 724} {"train_loss": -10.107473373413086, "global_step": 121679, "epoch": 724} {"train_loss": -10.339096069335938, "global_step": 121680, "epoch": 724} {"train_loss": -10.389236450195312, "global_step": 121681, "epoch": 724} {"train_loss": -10.368919372558594, "global_step": 121682, "epoch": 724} {"train_loss": -10.239606857299805, "global_step": 121683, "epoch": 724} {"train_loss": -10.077362060546875, "global_step": 121684, "epoch": 724} {"train_loss": -10.109260559082031, "global_step": 121685, "epoch": 724} {"train_loss": -10.191620826721191, "global_step": 121686, "epoch": 724} {"train_loss": -9.965930938720703, "global_step": 121687, "epoch": 724} {"train_loss": -10.42550277709961, "global_step": 121688, "epoch": 724} {"train_loss": -10.049514770507812, "global_step": 121689, "epoch": 724} {"train_loss": -10.364025115966797, "global_step": 121690, "epoch": 724} {"train_loss": -10.337549209594727, "global_step": 121691, "epoch": 724} {"train_loss": -10.334028244018555, "global_step": 121692, "epoch": 724} {"train_loss": -10.190168380737305, "global_step": 121693, "epoch": 724} {"train_loss": -9.849252700805664, "global_step": 121694, "epoch": 724} {"train_loss": -10.092874526977539, "global_step": 121695, "epoch": 724} {"train_loss": -10.25584602355957, "global_step": 121696, "epoch": 724} {"train_loss": -10.24927043914795, "global_step": 121697, "epoch": 724} {"train_loss": -10.254837989807129, "global_step": 121698, "epoch": 724} {"train_loss": -10.226146697998047, "global_step": 121699, "epoch": 724} {"train_loss": -10.283937454223633, "global_step": 121700, "epoch": 724} {"train_loss": -10.180425643920898, "global_step": 121701, "epoch": 724} {"train_loss": -9.95848274230957, "global_step": 121702, "epoch": 724} {"train_loss": -10.19659423828125, "global_step": 121703, "epoch": 724} {"train_loss": -9.992148399353027, "global_step": 121704, "epoch": 724} {"train_loss": -10.30210018157959, "global_step": 121705, "epoch": 724} {"train_loss": -9.928228378295898, "global_step": 121706, "epoch": 724} {"train_loss": -10.167289733886719, "global_step": 121707, "epoch": 724} {"train_loss": -10.271029472351074, "global_step": 121708, "epoch": 724} {"train_loss": -9.808384895324707, "global_step": 121709, "epoch": 724} {"train_loss": -10.33683967590332, "global_step": 121710, "epoch": 724} {"train_loss": -9.83521842956543, "global_step": 121711, "epoch": 724} {"train_loss": -10.047310829162598, "global_step": 121712, "epoch": 724} {"train_loss": -10.130156517028809, "global_step": 121713, "epoch": 724} {"train_loss": -10.065824508666992, "global_step": 121714, "epoch": 724} {"train_loss": -10.018563270568848, "global_step": 121715, "epoch": 724} {"train_loss": -10.171463966369629, "global_step": 121716, "epoch": 724} {"train_loss": -10.14654541015625, "global_step": 121717, "epoch": 724} {"train_loss": -10.042269706726074, "global_step": 121718, "epoch": 724} {"train_loss": -10.147575378417969, "global_step": 121719, "epoch": 724} {"train_loss": -10.112303733825684, "global_step": 121720, "epoch": 724} {"train_loss": -9.869942665100098, "global_step": 121721, "epoch": 724} {"train_loss": -9.8983793258667, "global_step": 121722, "epoch": 724} {"train_loss": -9.926885604858398, "global_step": 121723, "epoch": 724} {"train_loss": -10.178007125854492, "global_step": 121724, "epoch": 724} {"train_loss": -10.122868537902832, "global_step": 121725, "epoch": 724} {"train_loss": -10.138556480407715, "global_step": 121726, "epoch": 724} {"train_loss": -10.096349716186523, "global_step": 121727, "epoch": 724} {"train_loss": -9.964029312133789, "global_step": 121728, "epoch": 724} {"train_loss": -10.192678451538086, "global_step": 121729, "epoch": 724} {"train_loss": -10.172115325927734, "global_step": 121730, "epoch": 724} {"train_loss": -10.296426773071289, "global_step": 121731, "epoch": 724} {"train_loss": -10.12490463256836, "global_step": 121732, "epoch": 724} {"train_loss": -10.320592880249023, "global_step": 121733, "epoch": 724} {"train_loss": -9.675518035888672, "global_step": 121734, "epoch": 724} {"train_loss": -10.273530006408691, "global_step": 121735, "epoch": 724} {"train_loss": -9.990596771240234, "global_step": 121736, "epoch": 724} {"train_loss": -10.435674667358398, "global_step": 121737, "epoch": 724} {"train_loss": -9.748523712158203, "global_step": 121738, "epoch": 724} {"train_loss": -10.191383361816406, "global_step": 121739, "epoch": 724} {"train_loss": -9.821704864501953, "global_step": 121740, "epoch": 724} {"train_loss": -10.331918716430664, "global_step": 121741, "epoch": 724} {"train_loss": -10.201705932617188, "global_step": 121742, "epoch": 724} {"train_loss": -10.052490234375, "global_step": 121743, "epoch": 724} {"train_loss": -10.261672973632812, "global_step": 121744, "epoch": 724} {"train_loss": -10.330695152282715, "global_step": 121745, "epoch": 724} {"train_loss": -10.09288215637207, "global_step": 121746, "epoch": 724} {"train_loss": -10.352394104003906, "global_step": 121747, "epoch": 724} {"train_loss": -10.25082778930664, "global_step": 121748, "epoch": 724} {"train_loss": -10.173439979553223, "global_step": 121749, "epoch": 724} {"train_loss": -10.254323959350586, "global_step": 121750, "epoch": 724} {"train_loss": -9.971988677978516, "global_step": 121751, "epoch": 724} {"train_loss": -10.34388256072998, "global_step": 121752, "epoch": 724} {"train_loss": -10.300885200500488, "global_step": 121753, "epoch": 724} {"train_loss": -10.352743148803711, "global_step": 121754, "epoch": 724} {"train_loss": -10.374019622802734, "global_step": 121755, "epoch": 724} {"train_loss": -10.372509002685547, "global_step": 121756, "epoch": 724} {"train_loss": -10.405760765075684, "global_step": 121757, "epoch": 724} {"train_loss": -10.141483306884766, "global_step": 121758, "epoch": 724} {"train_loss": -10.102816581726074, "global_step": 121759, "epoch": 724} {"train_loss": -10.131623268127441, "global_step": 121760, "epoch": 724} {"train_loss": -10.526430130004883, "global_step": 121761, "epoch": 724} {"train_loss": -10.170061111450195, "global_step": 121762, "epoch": 724} {"train_loss": -10.487300872802734, "global_step": 121763, "epoch": 724} {"train_loss": -10.057534217834473, "global_step": 121764, "epoch": 724} {"train_loss": -10.416678428649902, "global_step": 121765, "epoch": 724} {"train_loss": -10.182906150817871, "global_step": 121766, "epoch": 724} {"train_loss": -10.222579956054688, "global_step": 121767, "epoch": 724} {"train_loss": -10.375356674194336, "global_step": 121768, "epoch": 724} {"train_loss": -10.098649978637695, "global_step": 121769, "epoch": 724} {"train_loss": -10.20545482635498, "global_step": 121770, "epoch": 724} {"train_loss": -10.36802864074707, "global_step": 121771, "epoch": 724} {"train_loss": -10.244832992553711, "global_step": 121772, "epoch": 724} {"train_loss": -10.242959022521973, "global_step": 121773, "epoch": 724} {"train_loss": -10.090131759643555, "global_step": 121774, "epoch": 724} {"train_loss": -10.311694145202637, "global_step": 121775, "epoch": 724} {"train_loss": -10.102945327758789, "global_step": 121776, "epoch": 724} {"train_loss": -10.389549255371094, "global_step": 121777, "epoch": 724} {"train_loss": -9.994187355041504, "global_step": 121778, "epoch": 724} {"train_loss": -10.143377304077148, "global_step": 121779, "epoch": 724} {"train_loss": -10.463676452636719, "global_step": 121780, "epoch": 724} {"train_loss": -10.521525382995605, "global_step": 121781, "epoch": 724} {"train_loss": -9.865341186523438, "global_step": 121782, "epoch": 724} {"train_loss": -10.458578109741211, "global_step": 121783, "epoch": 724} {"train_loss": -10.547285079956055, "global_step": 121784, "epoch": 724} {"train_loss": -10.168325424194336, "global_step": 121785, "epoch": 724} {"train_loss": -10.175392150878906, "global_step": 121786, "epoch": 724} {"train_loss": -9.072811126708984, "global_step": 121787, "epoch": 724} {"train_loss": -9.925580978393555, "global_step": 121788, "epoch": 724} {"train_loss": -9.659027099609375, "global_step": 121789, "epoch": 724} {"train_loss": -9.87765121459961, "global_step": 121790, "epoch": 724} {"train_loss": -9.785394668579102, "global_step": 121791, "epoch": 724} {"train_loss": -9.234713554382324, "global_step": 121792, "epoch": 724} {"train_loss": -9.961114883422852, "global_step": 121793, "epoch": 724} {"train_loss": -8.840166091918945, "global_step": 121794, "epoch": 724} {"train_loss": -9.846376419067383, "global_step": 121795, "epoch": 724} {"train_loss": -7.836273670196533, "global_step": 121796, "epoch": 724} {"train_loss": -8.798662185668945, "global_step": 121797, "epoch": 724} {"train_loss": -8.96091079711914, "global_step": 121798, "epoch": 724} {"train_loss": -10.103252561319442, "global_step": 121799, "epoch": 724, "val_loss": 209497.65625} {"train_loss": -9.532171249389648, "global_step": 121800, "epoch": 725} {"train_loss": -9.854480743408203, "global_step": 121801, "epoch": 725} {"train_loss": -9.740005493164062, "global_step": 121802, "epoch": 725} {"train_loss": -9.522436141967773, "global_step": 121803, "epoch": 725} {"train_loss": -9.626635551452637, "global_step": 121804, "epoch": 725} {"train_loss": -9.921217918395996, "global_step": 121805, "epoch": 725} {"train_loss": -9.755759239196777, "global_step": 121806, "epoch": 725} {"train_loss": -9.645963668823242, "global_step": 121807, "epoch": 725} {"train_loss": -9.735246658325195, "global_step": 121808, "epoch": 725} {"train_loss": -9.842592239379883, "global_step": 121809, "epoch": 725} {"train_loss": -9.814404487609863, "global_step": 121810, "epoch": 725} {"train_loss": -9.918573379516602, "global_step": 121811, "epoch": 725} {"train_loss": -10.050058364868164, "global_step": 121812, "epoch": 725} {"train_loss": -9.980417251586914, "global_step": 121813, "epoch": 725} {"train_loss": -9.923746109008789, "global_step": 121814, "epoch": 725} {"train_loss": -10.026698112487793, "global_step": 121815, "epoch": 725} {"train_loss": -9.984623908996582, "global_step": 121816, "epoch": 725} {"train_loss": -9.88348388671875, "global_step": 121817, "epoch": 725} {"train_loss": -9.968832969665527, "global_step": 121818, "epoch": 725} {"train_loss": -9.902929306030273, "global_step": 121819, "epoch": 725} {"train_loss": -10.096090316772461, "global_step": 121820, "epoch": 725} {"train_loss": -10.210282325744629, "global_step": 121821, "epoch": 725} {"train_loss": -9.973970413208008, "global_step": 121822, "epoch": 725} {"train_loss": -10.098796844482422, "global_step": 121823, "epoch": 725} {"train_loss": -10.113851547241211, "global_step": 121824, "epoch": 725} {"train_loss": -10.328261375427246, "global_step": 121825, "epoch": 725} {"train_loss": -10.407207489013672, "global_step": 121826, "epoch": 725} {"train_loss": -10.315529823303223, "global_step": 121827, "epoch": 725} {"train_loss": -10.154619216918945, "global_step": 121828, "epoch": 725} {"train_loss": -10.166886329650879, "global_step": 121829, "epoch": 725} {"train_loss": -9.972129821777344, "global_step": 121830, "epoch": 725} {"train_loss": -10.090580940246582, "global_step": 121831, "epoch": 725} {"train_loss": -10.374634742736816, "global_step": 121832, "epoch": 725} {"train_loss": -10.282941818237305, "global_step": 121833, "epoch": 725} {"train_loss": -10.248285293579102, "global_step": 121834, "epoch": 725} {"train_loss": -10.160490036010742, "global_step": 121835, "epoch": 725} {"train_loss": -10.58251667022705, "global_step": 121836, "epoch": 725} {"train_loss": -10.322299003601074, "global_step": 121837, "epoch": 725} {"train_loss": -10.123991012573242, "global_step": 121838, "epoch": 725} {"train_loss": -10.358627319335938, "global_step": 121839, "epoch": 725} {"train_loss": -10.071300506591797, "global_step": 121840, "epoch": 725} {"train_loss": -10.093036651611328, "global_step": 121841, "epoch": 725} {"train_loss": -10.334061622619629, "global_step": 121842, "epoch": 725} {"train_loss": -10.421989440917969, "global_step": 121843, "epoch": 725} {"train_loss": -10.436041831970215, "global_step": 121844, "epoch": 725} {"train_loss": -9.990968704223633, "global_step": 121845, "epoch": 725} {"train_loss": -10.313484191894531, "global_step": 121846, "epoch": 725} {"train_loss": -10.191375732421875, "global_step": 121847, "epoch": 725} {"train_loss": -10.431575775146484, "global_step": 121848, "epoch": 725} {"train_loss": -9.915107727050781, "global_step": 121849, "epoch": 725} {"train_loss": -10.41506576538086, "global_step": 121850, "epoch": 725} {"train_loss": -10.259653091430664, "global_step": 121851, "epoch": 725} {"train_loss": -9.936445236206055, "global_step": 121852, "epoch": 725} {"train_loss": -10.532724380493164, "global_step": 121853, "epoch": 725} {"train_loss": -10.378259658813477, "global_step": 121854, "epoch": 725} {"train_loss": -10.48505687713623, "global_step": 121855, "epoch": 725} {"train_loss": -10.348684310913086, "global_step": 121856, "epoch": 725} {"train_loss": -10.367648124694824, "global_step": 121857, "epoch": 725} {"train_loss": -10.479887962341309, "global_step": 121858, "epoch": 725} {"train_loss": -10.313155174255371, "global_step": 121859, "epoch": 725} {"train_loss": -10.46717643737793, "global_step": 121860, "epoch": 725} {"train_loss": -10.391288757324219, "global_step": 121861, "epoch": 725} {"train_loss": -10.227126121520996, "global_step": 121862, "epoch": 725} {"train_loss": -10.35639762878418, "global_step": 121863, "epoch": 725} {"train_loss": -10.467185974121094, "global_step": 121864, "epoch": 725} {"train_loss": -10.609941482543945, "global_step": 121865, "epoch": 725} {"train_loss": -9.952831268310547, "global_step": 121866, "epoch": 725} {"train_loss": -10.071044921875, "global_step": 121867, "epoch": 725} {"train_loss": -9.792924880981445, "global_step": 121868, "epoch": 725} {"train_loss": -10.132363319396973, "global_step": 121869, "epoch": 725} {"train_loss": -10.25811767578125, "global_step": 121870, "epoch": 725} {"train_loss": -10.31113052368164, "global_step": 121871, "epoch": 725} {"train_loss": -10.400803565979004, "global_step": 121872, "epoch": 725} {"train_loss": -9.944886207580566, "global_step": 121873, "epoch": 725} {"train_loss": -10.291024208068848, "global_step": 121874, "epoch": 725} {"train_loss": -10.354911804199219, "global_step": 121875, "epoch": 725} {"train_loss": -9.776065826416016, "global_step": 121876, "epoch": 725} {"train_loss": -10.016107559204102, "global_step": 121877, "epoch": 725} {"train_loss": -9.938056945800781, "global_step": 121878, "epoch": 725} {"train_loss": -9.247790336608887, "global_step": 121879, "epoch": 725} {"train_loss": -9.235713958740234, "global_step": 121880, "epoch": 725} {"train_loss": -9.838733673095703, "global_step": 121881, "epoch": 725} {"train_loss": -8.638471603393555, "global_step": 121882, "epoch": 725} {"train_loss": -9.978181838989258, "global_step": 121883, "epoch": 725} {"train_loss": -8.862388610839844, "global_step": 121884, "epoch": 725} {"train_loss": -10.09848403930664, "global_step": 121885, "epoch": 725} {"train_loss": -9.091060638427734, "global_step": 121886, "epoch": 725} {"train_loss": -10.209806442260742, "global_step": 121887, "epoch": 725} {"train_loss": -9.475004196166992, "global_step": 121888, "epoch": 725} {"train_loss": -9.697787284851074, "global_step": 121889, "epoch": 725} {"train_loss": -9.593931198120117, "global_step": 121890, "epoch": 725} {"train_loss": -9.905733108520508, "global_step": 121891, "epoch": 725} {"train_loss": -9.553357124328613, "global_step": 121892, "epoch": 725} {"train_loss": -9.706050872802734, "global_step": 121893, "epoch": 725} {"train_loss": -10.02187728881836, "global_step": 121894, "epoch": 725} {"train_loss": -9.35063362121582, "global_step": 121895, "epoch": 725} {"train_loss": -10.07367992401123, "global_step": 121896, "epoch": 725} {"train_loss": -9.44978141784668, "global_step": 121897, "epoch": 725} {"train_loss": -9.7828369140625, "global_step": 121898, "epoch": 725} {"train_loss": -9.35252571105957, "global_step": 121899, "epoch": 725} {"train_loss": -9.479362487792969, "global_step": 121900, "epoch": 725} {"train_loss": -9.845087051391602, "global_step": 121901, "epoch": 725} {"train_loss": -9.586750030517578, "global_step": 121902, "epoch": 725} {"train_loss": -10.059882164001465, "global_step": 121903, "epoch": 725} {"train_loss": -9.761298179626465, "global_step": 121904, "epoch": 725} {"train_loss": -9.831833839416504, "global_step": 121905, "epoch": 725} {"train_loss": -9.951173782348633, "global_step": 121906, "epoch": 725} {"train_loss": -9.79545783996582, "global_step": 121907, "epoch": 725} {"train_loss": -10.051714897155762, "global_step": 121908, "epoch": 725} {"train_loss": -9.952066421508789, "global_step": 121909, "epoch": 725} {"train_loss": -9.92683219909668, "global_step": 121910, "epoch": 725} {"train_loss": -9.807706832885742, "global_step": 121911, "epoch": 725} {"train_loss": -10.108612060546875, "global_step": 121912, "epoch": 725} {"train_loss": -10.13492488861084, "global_step": 121913, "epoch": 725} {"train_loss": -10.177783012390137, "global_step": 121914, "epoch": 725} {"train_loss": -10.297385215759277, "global_step": 121915, "epoch": 725} {"train_loss": -10.21979808807373, "global_step": 121916, "epoch": 725} {"train_loss": -10.20191764831543, "global_step": 121917, "epoch": 725} {"train_loss": -10.246063232421875, "global_step": 121918, "epoch": 725} {"train_loss": -10.199317932128906, "global_step": 121919, "epoch": 725} {"train_loss": -10.20837688446045, "global_step": 121920, "epoch": 725} {"train_loss": -10.213669776916504, "global_step": 121921, "epoch": 725} {"train_loss": -10.4528226852417, "global_step": 121922, "epoch": 725} {"train_loss": -10.240301132202148, "global_step": 121923, "epoch": 725} {"train_loss": -10.342453002929688, "global_step": 121924, "epoch": 725} {"train_loss": -10.020244598388672, "global_step": 121925, "epoch": 725} {"train_loss": -10.342750549316406, "global_step": 121926, "epoch": 725} {"train_loss": -10.321672439575195, "global_step": 121927, "epoch": 725} {"train_loss": -10.256270408630371, "global_step": 121928, "epoch": 725} {"train_loss": -10.326309204101562, "global_step": 121929, "epoch": 725} {"train_loss": -10.513410568237305, "global_step": 121930, "epoch": 725} {"train_loss": -10.314031600952148, "global_step": 121931, "epoch": 725} {"train_loss": -10.327411651611328, "global_step": 121932, "epoch": 725} {"train_loss": -10.623149871826172, "global_step": 121933, "epoch": 725} {"train_loss": -10.395950317382812, "global_step": 121934, "epoch": 725} {"train_loss": -10.282560348510742, "global_step": 121935, "epoch": 725} {"train_loss": -9.967721939086914, "global_step": 121936, "epoch": 725} {"train_loss": -10.446751594543457, "global_step": 121937, "epoch": 725} {"train_loss": -10.023336410522461, "global_step": 121938, "epoch": 725} {"train_loss": -10.240737915039062, "global_step": 121939, "epoch": 725} {"train_loss": -10.332376480102539, "global_step": 121940, "epoch": 725} {"train_loss": -10.443181037902832, "global_step": 121941, "epoch": 725} {"train_loss": -10.310710906982422, "global_step": 121942, "epoch": 725} {"train_loss": -10.069206237792969, "global_step": 121943, "epoch": 725} {"train_loss": -10.540300369262695, "global_step": 121944, "epoch": 725} {"train_loss": -10.097894668579102, "global_step": 121945, "epoch": 725} {"train_loss": -10.469780921936035, "global_step": 121946, "epoch": 725} {"train_loss": -9.954700469970703, "global_step": 121947, "epoch": 725} {"train_loss": -10.052021026611328, "global_step": 121948, "epoch": 725} {"train_loss": -9.732184410095215, "global_step": 121949, "epoch": 725} {"train_loss": -9.727505683898926, "global_step": 121950, "epoch": 725} {"train_loss": -10.142051696777344, "global_step": 121951, "epoch": 725} {"train_loss": -8.949991226196289, "global_step": 121952, "epoch": 725} {"train_loss": -9.648231506347656, "global_step": 121953, "epoch": 725} {"train_loss": -9.668081283569336, "global_step": 121954, "epoch": 725} {"train_loss": -10.10611343383789, "global_step": 121955, "epoch": 725} {"train_loss": -9.177687644958496, "global_step": 121956, "epoch": 725} {"train_loss": -9.9402437210083, "global_step": 121957, "epoch": 725} {"train_loss": -9.556819915771484, "global_step": 121958, "epoch": 725} {"train_loss": -9.989261627197266, "global_step": 121959, "epoch": 725} {"train_loss": -9.913288116455078, "global_step": 121960, "epoch": 725} {"train_loss": -9.790218353271484, "global_step": 121961, "epoch": 725} {"train_loss": -9.67618465423584, "global_step": 121962, "epoch": 725} {"train_loss": -10.073280334472656, "global_step": 121963, "epoch": 725} {"train_loss": -9.941530227661133, "global_step": 121964, "epoch": 725} {"train_loss": -10.191003799438477, "global_step": 121965, "epoch": 725} {"train_loss": -9.8778076171875, "global_step": 121966, "epoch": 725} {"train_loss": -10.035166706357684, "global_step": 121967, "epoch": 725, "val_loss": 212837.609375, "train_action_mse_error": 1.348681092262268} {"train_loss": -9.942522048950195, "global_step": 121968, "epoch": 726} {"train_loss": -10.108026504516602, "global_step": 121969, "epoch": 726} {"train_loss": -10.116825103759766, "global_step": 121970, "epoch": 726} {"train_loss": -10.16152572631836, "global_step": 121971, "epoch": 726} {"train_loss": -10.29642105102539, "global_step": 121972, "epoch": 726} {"train_loss": -10.334259033203125, "global_step": 121973, "epoch": 726} {"train_loss": -10.179300308227539, "global_step": 121974, "epoch": 726} {"train_loss": -9.844818115234375, "global_step": 121975, "epoch": 726} {"train_loss": -10.152727127075195, "global_step": 121976, "epoch": 726} {"train_loss": -9.852909088134766, "global_step": 121977, "epoch": 726} {"train_loss": -10.275678634643555, "global_step": 121978, "epoch": 726} {"train_loss": -10.047710418701172, "global_step": 121979, "epoch": 726} {"train_loss": -10.246448516845703, "global_step": 121980, "epoch": 726} {"train_loss": -10.110700607299805, "global_step": 121981, "epoch": 726} {"train_loss": -10.379072189331055, "global_step": 121982, "epoch": 726} {"train_loss": -10.082776069641113, "global_step": 121983, "epoch": 726} {"train_loss": -10.174751281738281, "global_step": 121984, "epoch": 726} {"train_loss": -10.327778816223145, "global_step": 121985, "epoch": 726} {"train_loss": -10.117570877075195, "global_step": 121986, "epoch": 726} {"train_loss": -9.975184440612793, "global_step": 121987, "epoch": 726} {"train_loss": -10.219741821289062, "global_step": 121988, "epoch": 726} {"train_loss": -10.216023445129395, "global_step": 121989, "epoch": 726} {"train_loss": -10.236411094665527, "global_step": 121990, "epoch": 726} {"train_loss": -10.352033615112305, "global_step": 121991, "epoch": 726} {"train_loss": -10.587530136108398, "global_step": 121992, "epoch": 726} {"train_loss": -10.52713680267334, "global_step": 121993, "epoch": 726} {"train_loss": -10.409811019897461, "global_step": 121994, "epoch": 726} {"train_loss": -10.401704788208008, "global_step": 121995, "epoch": 726} {"train_loss": -10.433515548706055, "global_step": 121996, "epoch": 726} {"train_loss": -10.302380561828613, "global_step": 121997, "epoch": 726} {"train_loss": -10.408807754516602, "global_step": 121998, "epoch": 726} {"train_loss": -10.121809959411621, "global_step": 121999, "epoch": 726} {"train_loss": -10.221893310546875, "global_step": 122000, "epoch": 726} {"train_loss": -10.293218612670898, "global_step": 122001, "epoch": 726} {"train_loss": -9.909891128540039, "global_step": 122002, "epoch": 726} {"train_loss": -10.436097145080566, "global_step": 122003, "epoch": 726} {"train_loss": -9.978246688842773, "global_step": 122004, "epoch": 726} {"train_loss": -9.972782135009766, "global_step": 122005, "epoch": 726} {"train_loss": -10.29119873046875, "global_step": 122006, "epoch": 726} {"train_loss": -9.908065795898438, "global_step": 122007, "epoch": 726} {"train_loss": -10.402384757995605, "global_step": 122008, "epoch": 726} {"train_loss": -10.314316749572754, "global_step": 122009, "epoch": 726} {"train_loss": -10.314355850219727, "global_step": 122010, "epoch": 726} {"train_loss": -10.094066619873047, "global_step": 122011, "epoch": 726} {"train_loss": -9.987064361572266, "global_step": 122012, "epoch": 726} {"train_loss": -10.002420425415039, "global_step": 122013, "epoch": 726} {"train_loss": -10.12350082397461, "global_step": 122014, "epoch": 726} {"train_loss": -10.322914123535156, "global_step": 122015, "epoch": 726} {"train_loss": -10.295333862304688, "global_step": 122016, "epoch": 726} {"train_loss": -10.273082733154297, "global_step": 122017, "epoch": 726} {"train_loss": -10.166869163513184, "global_step": 122018, "epoch": 726} {"train_loss": -10.221860885620117, "global_step": 122019, "epoch": 726} {"train_loss": -9.777095794677734, "global_step": 122020, "epoch": 726} {"train_loss": -10.377339363098145, "global_step": 122021, "epoch": 726} {"train_loss": -10.088754653930664, "global_step": 122022, "epoch": 726} {"train_loss": -10.311391830444336, "global_step": 122023, "epoch": 726} {"train_loss": -9.935403823852539, "global_step": 122024, "epoch": 726} {"train_loss": -10.221986770629883, "global_step": 122025, "epoch": 726} {"train_loss": -9.937463760375977, "global_step": 122026, "epoch": 726} {"train_loss": -10.11846923828125, "global_step": 122027, "epoch": 726} {"train_loss": -10.067974090576172, "global_step": 122028, "epoch": 726} {"train_loss": -10.247299194335938, "global_step": 122029, "epoch": 726} {"train_loss": -10.060522079467773, "global_step": 122030, "epoch": 726} {"train_loss": -10.341511726379395, "global_step": 122031, "epoch": 726} {"train_loss": -10.205702781677246, "global_step": 122032, "epoch": 726} {"train_loss": -10.300323486328125, "global_step": 122033, "epoch": 726} {"train_loss": -10.309100151062012, "global_step": 122034, "epoch": 726} {"train_loss": -10.458929061889648, "global_step": 122035, "epoch": 726} {"train_loss": -9.916815757751465, "global_step": 122036, "epoch": 726} {"train_loss": -10.28345012664795, "global_step": 122037, "epoch": 726} {"train_loss": -10.316909790039062, "global_step": 122038, "epoch": 726} {"train_loss": -10.176359176635742, "global_step": 122039, "epoch": 726} {"train_loss": -10.348937034606934, "global_step": 122040, "epoch": 726} {"train_loss": -10.035331726074219, "global_step": 122041, "epoch": 726} {"train_loss": -10.433554649353027, "global_step": 122042, "epoch": 726} {"train_loss": -10.156515121459961, "global_step": 122043, "epoch": 726} {"train_loss": -10.121964454650879, "global_step": 122044, "epoch": 726} {"train_loss": -10.199862480163574, "global_step": 122045, "epoch": 726} {"train_loss": -10.125870704650879, "global_step": 122046, "epoch": 726} {"train_loss": -10.338669776916504, "global_step": 122047, "epoch": 726} {"train_loss": -10.087297439575195, "global_step": 122048, "epoch": 726} {"train_loss": -10.005393981933594, "global_step": 122049, "epoch": 726} {"train_loss": -9.90555191040039, "global_step": 122050, "epoch": 726} {"train_loss": -9.850696563720703, "global_step": 122051, "epoch": 726} {"train_loss": -9.584425926208496, "global_step": 122052, "epoch": 726} {"train_loss": -9.888797760009766, "global_step": 122053, "epoch": 726} {"train_loss": -9.801250457763672, "global_step": 122054, "epoch": 726} {"train_loss": -9.862776756286621, "global_step": 122055, "epoch": 726} {"train_loss": -9.294661521911621, "global_step": 122056, "epoch": 726} {"train_loss": -10.004684448242188, "global_step": 122057, "epoch": 726} {"train_loss": -9.567667007446289, "global_step": 122058, "epoch": 726} {"train_loss": -9.637829780578613, "global_step": 122059, "epoch": 726} {"train_loss": -9.859293937683105, "global_step": 122060, "epoch": 726} {"train_loss": -9.727952003479004, "global_step": 122061, "epoch": 726} {"train_loss": -9.464048385620117, "global_step": 122062, "epoch": 726} {"train_loss": -10.303203582763672, "global_step": 122063, "epoch": 726} {"train_loss": -9.493776321411133, "global_step": 122064, "epoch": 726} {"train_loss": -9.839086532592773, "global_step": 122065, "epoch": 726} {"train_loss": -9.958406448364258, "global_step": 122066, "epoch": 726} {"train_loss": -9.75108528137207, "global_step": 122067, "epoch": 726} {"train_loss": -9.904205322265625, "global_step": 122068, "epoch": 726} {"train_loss": -10.200735092163086, "global_step": 122069, "epoch": 726} {"train_loss": -9.905202865600586, "global_step": 122070, "epoch": 726} {"train_loss": -10.006673812866211, "global_step": 122071, "epoch": 726} {"train_loss": -9.939454078674316, "global_step": 122072, "epoch": 726} {"train_loss": -10.061594009399414, "global_step": 122073, "epoch": 726} {"train_loss": -9.968297958374023, "global_step": 122074, "epoch": 726} {"train_loss": -9.828084945678711, "global_step": 122075, "epoch": 726} {"train_loss": -10.082208633422852, "global_step": 122076, "epoch": 726} {"train_loss": -10.04317855834961, "global_step": 122077, "epoch": 726} {"train_loss": -10.146528244018555, "global_step": 122078, "epoch": 726} {"train_loss": -9.980813980102539, "global_step": 122079, "epoch": 726} {"train_loss": -10.17951774597168, "global_step": 122080, "epoch": 726} {"train_loss": -10.266631126403809, "global_step": 122081, "epoch": 726} {"train_loss": -10.1880464553833, "global_step": 122082, "epoch": 726} {"train_loss": -10.145320892333984, "global_step": 122083, "epoch": 726} {"train_loss": -10.265453338623047, "global_step": 122084, "epoch": 726} {"train_loss": -10.253693580627441, "global_step": 122085, "epoch": 726} {"train_loss": -10.197341918945312, "global_step": 122086, "epoch": 726} {"train_loss": -10.241973876953125, "global_step": 122087, "epoch": 726} {"train_loss": -10.235387802124023, "global_step": 122088, "epoch": 726} {"train_loss": -10.634833335876465, "global_step": 122089, "epoch": 726} {"train_loss": -10.388324737548828, "global_step": 122090, "epoch": 726} {"train_loss": -10.362471580505371, "global_step": 122091, "epoch": 726} {"train_loss": -10.231710433959961, "global_step": 122092, "epoch": 726} {"train_loss": -10.340679168701172, "global_step": 122093, "epoch": 726} {"train_loss": -10.513874053955078, "global_step": 122094, "epoch": 726} {"train_loss": -10.3165864944458, "global_step": 122095, "epoch": 726} {"train_loss": -10.348775863647461, "global_step": 122096, "epoch": 726} {"train_loss": -10.347938537597656, "global_step": 122097, "epoch": 726} {"train_loss": -10.342814445495605, "global_step": 122098, "epoch": 726} {"train_loss": -10.167823791503906, "global_step": 122099, "epoch": 726} {"train_loss": -10.290849685668945, "global_step": 122100, "epoch": 726} {"train_loss": -10.548553466796875, "global_step": 122101, "epoch": 726} {"train_loss": -10.399433135986328, "global_step": 122102, "epoch": 726} {"train_loss": -10.236873626708984, "global_step": 122103, "epoch": 726} {"train_loss": -10.111700057983398, "global_step": 122104, "epoch": 726} {"train_loss": -10.329303741455078, "global_step": 122105, "epoch": 726} {"train_loss": -10.40034008026123, "global_step": 122106, "epoch": 726} {"train_loss": -10.514568328857422, "global_step": 122107, "epoch": 726} {"train_loss": -10.427170753479004, "global_step": 122108, "epoch": 726} {"train_loss": -10.362089157104492, "global_step": 122109, "epoch": 726} {"train_loss": -10.427851676940918, "global_step": 122110, "epoch": 726} {"train_loss": -10.045018196105957, "global_step": 122111, "epoch": 726} {"train_loss": -10.286433219909668, "global_step": 122112, "epoch": 726} {"train_loss": -10.255289077758789, "global_step": 122113, "epoch": 726} {"train_loss": -10.399145126342773, "global_step": 122114, "epoch": 726} {"train_loss": -9.604755401611328, "global_step": 122115, "epoch": 726} {"train_loss": -10.532323837280273, "global_step": 122116, "epoch": 726} {"train_loss": -10.216623306274414, "global_step": 122117, "epoch": 726} {"train_loss": -10.045778274536133, "global_step": 122118, "epoch": 726} {"train_loss": -10.426170349121094, "global_step": 122119, "epoch": 726} {"train_loss": -10.231285095214844, "global_step": 122120, "epoch": 726} {"train_loss": -10.130575180053711, "global_step": 122121, "epoch": 726} {"train_loss": -10.603883743286133, "global_step": 122122, "epoch": 726} {"train_loss": -10.47066879272461, "global_step": 122123, "epoch": 726} {"train_loss": -10.395523071289062, "global_step": 122124, "epoch": 726} {"train_loss": -10.248517990112305, "global_step": 122125, "epoch": 726} {"train_loss": -10.20562744140625, "global_step": 122126, "epoch": 726} {"train_loss": -10.480010032653809, "global_step": 122127, "epoch": 726} {"train_loss": -10.435150146484375, "global_step": 122128, "epoch": 726} {"train_loss": -10.561208724975586, "global_step": 122129, "epoch": 726} {"train_loss": -10.369457244873047, "global_step": 122130, "epoch": 726} {"train_loss": -10.369832038879395, "global_step": 122131, "epoch": 726} {"train_loss": -10.472615242004395, "global_step": 122132, "epoch": 726} {"train_loss": -10.309240341186523, "global_step": 122133, "epoch": 726} {"train_loss": -10.407818794250488, "global_step": 122134, "epoch": 726} {"train_loss": -10.175889798573085, "global_step": 122135, "epoch": 726, "val_loss": 215103.09375} {"train_loss": -10.302035331726074, "global_step": 122136, "epoch": 727} {"train_loss": -10.534942626953125, "global_step": 122137, "epoch": 727} {"train_loss": -10.261905670166016, "global_step": 122138, "epoch": 727} {"train_loss": -10.304760932922363, "global_step": 122139, "epoch": 727} {"train_loss": -10.545524597167969, "global_step": 122140, "epoch": 727} {"train_loss": -10.42627239227295, "global_step": 122141, "epoch": 727} {"train_loss": -10.327679634094238, "global_step": 122142, "epoch": 727} {"train_loss": -10.344108581542969, "global_step": 122143, "epoch": 727} {"train_loss": -10.42802906036377, "global_step": 122144, "epoch": 727} {"train_loss": -10.390883445739746, "global_step": 122145, "epoch": 727} {"train_loss": -10.269075393676758, "global_step": 122146, "epoch": 727} {"train_loss": -10.159971237182617, "global_step": 122147, "epoch": 727} {"train_loss": -10.232264518737793, "global_step": 122148, "epoch": 727} {"train_loss": -10.293256759643555, "global_step": 122149, "epoch": 727} {"train_loss": -10.404121398925781, "global_step": 122150, "epoch": 727} {"train_loss": -10.222923278808594, "global_step": 122151, "epoch": 727} {"train_loss": -9.976853370666504, "global_step": 122152, "epoch": 727} {"train_loss": -10.104246139526367, "global_step": 122153, "epoch": 727} {"train_loss": -10.364601135253906, "global_step": 122154, "epoch": 727} {"train_loss": -9.152088165283203, "global_step": 122155, "epoch": 727} {"train_loss": -10.187675476074219, "global_step": 122156, "epoch": 727} {"train_loss": -9.853755950927734, "global_step": 122157, "epoch": 727} {"train_loss": -9.366305351257324, "global_step": 122158, "epoch": 727} {"train_loss": -10.0850830078125, "global_step": 122159, "epoch": 727} {"train_loss": -9.17059326171875, "global_step": 122160, "epoch": 727} {"train_loss": -10.052753448486328, "global_step": 122161, "epoch": 727} {"train_loss": -9.964418411254883, "global_step": 122162, "epoch": 727} {"train_loss": -10.21512222290039, "global_step": 122163, "epoch": 727} {"train_loss": -9.707572937011719, "global_step": 122164, "epoch": 727} {"train_loss": -10.181214332580566, "global_step": 122165, "epoch": 727} {"train_loss": -9.820873260498047, "global_step": 122166, "epoch": 727} {"train_loss": -10.101524353027344, "global_step": 122167, "epoch": 727} {"train_loss": -9.797396659851074, "global_step": 122168, "epoch": 727} {"train_loss": -10.039615631103516, "global_step": 122169, "epoch": 727} {"train_loss": -9.938480377197266, "global_step": 122170, "epoch": 727} {"train_loss": -9.447344779968262, "global_step": 122171, "epoch": 727} {"train_loss": -9.711772918701172, "global_step": 122172, "epoch": 727} {"train_loss": -9.948476791381836, "global_step": 122173, "epoch": 727} {"train_loss": -9.981383323669434, "global_step": 122174, "epoch": 727} {"train_loss": -9.974066734313965, "global_step": 122175, "epoch": 727} {"train_loss": -10.001821517944336, "global_step": 122176, "epoch": 727} {"train_loss": -9.958702087402344, "global_step": 122177, "epoch": 727} {"train_loss": -9.913457870483398, "global_step": 122178, "epoch": 727} {"train_loss": -10.006717681884766, "global_step": 122179, "epoch": 727} {"train_loss": -9.840396881103516, "global_step": 122180, "epoch": 727} {"train_loss": -10.262578964233398, "global_step": 122181, "epoch": 727} {"train_loss": -10.179444313049316, "global_step": 122182, "epoch": 727} {"train_loss": -10.190576553344727, "global_step": 122183, "epoch": 727} {"train_loss": -9.782815933227539, "global_step": 122184, "epoch": 727} {"train_loss": -10.218032836914062, "global_step": 122185, "epoch": 727} {"train_loss": -10.038476943969727, "global_step": 122186, "epoch": 727} {"train_loss": -10.120816230773926, "global_step": 122187, "epoch": 727} {"train_loss": -10.291910171508789, "global_step": 122188, "epoch": 727} {"train_loss": -10.148321151733398, "global_step": 122189, "epoch": 727} {"train_loss": -10.229255676269531, "global_step": 122190, "epoch": 727} {"train_loss": -10.203638076782227, "global_step": 122191, "epoch": 727} {"train_loss": -10.387445449829102, "global_step": 122192, "epoch": 727} {"train_loss": -10.176704406738281, "global_step": 122193, "epoch": 727} {"train_loss": -10.004764556884766, "global_step": 122194, "epoch": 727} {"train_loss": -10.305720329284668, "global_step": 122195, "epoch": 727} {"train_loss": -10.110933303833008, "global_step": 122196, "epoch": 727} {"train_loss": -10.083524703979492, "global_step": 122197, "epoch": 727} {"train_loss": -10.37585735321045, "global_step": 122198, "epoch": 727} {"train_loss": -10.251740455627441, "global_step": 122199, "epoch": 727} {"train_loss": -10.03413200378418, "global_step": 122200, "epoch": 727} {"train_loss": -10.38754653930664, "global_step": 122201, "epoch": 727} {"train_loss": -10.336946487426758, "global_step": 122202, "epoch": 727} {"train_loss": -10.434611320495605, "global_step": 122203, "epoch": 727} {"train_loss": -10.65086841583252, "global_step": 122204, "epoch": 727} {"train_loss": -10.010799407958984, "global_step": 122205, "epoch": 727} {"train_loss": -10.424543380737305, "global_step": 122206, "epoch": 727} {"train_loss": -10.254127502441406, "global_step": 122207, "epoch": 727} {"train_loss": -10.267820358276367, "global_step": 122208, "epoch": 727} {"train_loss": -10.619369506835938, "global_step": 122209, "epoch": 727} {"train_loss": -10.324353218078613, "global_step": 122210, "epoch": 727} {"train_loss": -10.102458953857422, "global_step": 122211, "epoch": 727} {"train_loss": -10.476049423217773, "global_step": 122212, "epoch": 727} {"train_loss": -10.389412879943848, "global_step": 122213, "epoch": 727} {"train_loss": -9.422121047973633, "global_step": 122214, "epoch": 727} {"train_loss": -9.549943923950195, "global_step": 122215, "epoch": 727} {"train_loss": -10.304298400878906, "global_step": 122216, "epoch": 727} {"train_loss": -9.766829490661621, "global_step": 122217, "epoch": 727} {"train_loss": -9.835907936096191, "global_step": 122218, "epoch": 727} {"train_loss": -10.24755859375, "global_step": 122219, "epoch": 727} {"train_loss": -10.431180000305176, "global_step": 122220, "epoch": 727} {"train_loss": -9.836759567260742, "global_step": 122221, "epoch": 727} {"train_loss": -10.280487060546875, "global_step": 122222, "epoch": 727} {"train_loss": -10.226430892944336, "global_step": 122223, "epoch": 727} {"train_loss": -10.232820510864258, "global_step": 122224, "epoch": 727} {"train_loss": -10.418869972229004, "global_step": 122225, "epoch": 727} {"train_loss": -10.331930160522461, "global_step": 122226, "epoch": 727} {"train_loss": -10.490043640136719, "global_step": 122227, "epoch": 727} {"train_loss": -10.269916534423828, "global_step": 122228, "epoch": 727} {"train_loss": -10.243002891540527, "global_step": 122229, "epoch": 727} {"train_loss": -10.10573959350586, "global_step": 122230, "epoch": 727} {"train_loss": -10.329090118408203, "global_step": 122231, "epoch": 727} {"train_loss": -10.308723449707031, "global_step": 122232, "epoch": 727} {"train_loss": -10.428582191467285, "global_step": 122233, "epoch": 727} {"train_loss": -10.132434844970703, "global_step": 122234, "epoch": 727} {"train_loss": -10.373945236206055, "global_step": 122235, "epoch": 727} {"train_loss": -10.396272659301758, "global_step": 122236, "epoch": 727} {"train_loss": -10.28708267211914, "global_step": 122237, "epoch": 727} {"train_loss": -10.45938777923584, "global_step": 122238, "epoch": 727} {"train_loss": -10.335411071777344, "global_step": 122239, "epoch": 727} {"train_loss": -10.16204833984375, "global_step": 122240, "epoch": 727} {"train_loss": -10.470014572143555, "global_step": 122241, "epoch": 727} {"train_loss": -10.374624252319336, "global_step": 122242, "epoch": 727} {"train_loss": -10.529434204101562, "global_step": 122243, "epoch": 727} {"train_loss": -10.504801750183105, "global_step": 122244, "epoch": 727} {"train_loss": -10.282137870788574, "global_step": 122245, "epoch": 727} {"train_loss": -10.31747055053711, "global_step": 122246, "epoch": 727} {"train_loss": -10.271307945251465, "global_step": 122247, "epoch": 727} {"train_loss": -10.40580940246582, "global_step": 122248, "epoch": 727} {"train_loss": -10.189775466918945, "global_step": 122249, "epoch": 727} {"train_loss": -10.554012298583984, "global_step": 122250, "epoch": 727} {"train_loss": -10.324989318847656, "global_step": 122251, "epoch": 727} {"train_loss": -10.442502975463867, "global_step": 122252, "epoch": 727} {"train_loss": -10.390214920043945, "global_step": 122253, "epoch": 727} {"train_loss": -10.6611909866333, "global_step": 122254, "epoch": 727} {"train_loss": -10.528078079223633, "global_step": 122255, "epoch": 727} {"train_loss": -10.509567260742188, "global_step": 122256, "epoch": 727} {"train_loss": -10.345178604125977, "global_step": 122257, "epoch": 727} {"train_loss": -10.48298454284668, "global_step": 122258, "epoch": 727} {"train_loss": -10.351587295532227, "global_step": 122259, "epoch": 727} {"train_loss": -9.9658203125, "global_step": 122260, "epoch": 727} {"train_loss": -10.007143020629883, "global_step": 122261, "epoch": 727} {"train_loss": -10.370522499084473, "global_step": 122262, "epoch": 727} {"train_loss": -9.93080997467041, "global_step": 122263, "epoch": 727} {"train_loss": -10.113748550415039, "global_step": 122264, "epoch": 727} {"train_loss": -10.315252304077148, "global_step": 122265, "epoch": 727} {"train_loss": -10.378426551818848, "global_step": 122266, "epoch": 727} {"train_loss": -10.134797096252441, "global_step": 122267, "epoch": 727} {"train_loss": -10.337489128112793, "global_step": 122268, "epoch": 727} {"train_loss": -9.858711242675781, "global_step": 122269, "epoch": 727} {"train_loss": -10.161699295043945, "global_step": 122270, "epoch": 727} {"train_loss": -10.385735511779785, "global_step": 122271, "epoch": 727} {"train_loss": -9.939908027648926, "global_step": 122272, "epoch": 727} {"train_loss": -10.150060653686523, "global_step": 122273, "epoch": 727} {"train_loss": -10.167156219482422, "global_step": 122274, "epoch": 727} {"train_loss": -10.163952827453613, "global_step": 122275, "epoch": 727} {"train_loss": -10.182210922241211, "global_step": 122276, "epoch": 727} {"train_loss": -10.310073852539062, "global_step": 122277, "epoch": 727} {"train_loss": -10.246413230895996, "global_step": 122278, "epoch": 727} {"train_loss": -10.38500690460205, "global_step": 122279, "epoch": 727} {"train_loss": -10.299997329711914, "global_step": 122280, "epoch": 727} {"train_loss": -10.341028213500977, "global_step": 122281, "epoch": 727} {"train_loss": -9.948102951049805, "global_step": 122282, "epoch": 727} {"train_loss": -10.29863452911377, "global_step": 122283, "epoch": 727} {"train_loss": -10.179190635681152, "global_step": 122284, "epoch": 727} {"train_loss": -10.349504470825195, "global_step": 122285, "epoch": 727} {"train_loss": -10.059062004089355, "global_step": 122286, "epoch": 727} {"train_loss": -10.062505722045898, "global_step": 122287, "epoch": 727} {"train_loss": -10.120933532714844, "global_step": 122288, "epoch": 727} {"train_loss": -9.833412170410156, "global_step": 122289, "epoch": 727} {"train_loss": -9.836727142333984, "global_step": 122290, "epoch": 727} {"train_loss": -9.827960968017578, "global_step": 122291, "epoch": 727} {"train_loss": -9.593196868896484, "global_step": 122292, "epoch": 727} {"train_loss": -9.85598373413086, "global_step": 122293, "epoch": 727} {"train_loss": -9.905088424682617, "global_step": 122294, "epoch": 727} {"train_loss": -9.947959899902344, "global_step": 122295, "epoch": 727} {"train_loss": -9.941709518432617, "global_step": 122296, "epoch": 727} {"train_loss": -10.383159637451172, "global_step": 122297, "epoch": 727} {"train_loss": -9.87984848022461, "global_step": 122298, "epoch": 727} {"train_loss": -9.782317161560059, "global_step": 122299, "epoch": 727} {"train_loss": -10.13972282409668, "global_step": 122300, "epoch": 727} {"train_loss": -10.083345413208008, "global_step": 122301, "epoch": 727} {"train_loss": -10.082315444946289, "global_step": 122302, "epoch": 727} {"train_loss": -10.163456315086002, "global_step": 122303, "epoch": 727, "val_loss": 215164.921875} {"train_loss": -9.94862174987793, "global_step": 122304, "epoch": 728} {"train_loss": -10.17436408996582, "global_step": 122305, "epoch": 728} {"train_loss": -10.22701358795166, "global_step": 122306, "epoch": 728} {"train_loss": -10.038759231567383, "global_step": 122307, "epoch": 728} {"train_loss": -10.23921012878418, "global_step": 122308, "epoch": 728} {"train_loss": -10.201637268066406, "global_step": 122309, "epoch": 728} {"train_loss": -10.210245132446289, "global_step": 122310, "epoch": 728} {"train_loss": -10.06231689453125, "global_step": 122311, "epoch": 728} {"train_loss": -10.219074249267578, "global_step": 122312, "epoch": 728} {"train_loss": -10.196700096130371, "global_step": 122313, "epoch": 728} {"train_loss": -10.384391784667969, "global_step": 122314, "epoch": 728} {"train_loss": -10.300850868225098, "global_step": 122315, "epoch": 728} {"train_loss": -10.471617698669434, "global_step": 122316, "epoch": 728} {"train_loss": -10.2960786819458, "global_step": 122317, "epoch": 728} {"train_loss": -10.261666297912598, "global_step": 122318, "epoch": 728} {"train_loss": -10.469324111938477, "global_step": 122319, "epoch": 728} {"train_loss": -10.399721145629883, "global_step": 122320, "epoch": 728} {"train_loss": -10.27753734588623, "global_step": 122321, "epoch": 728} {"train_loss": -10.445493698120117, "global_step": 122322, "epoch": 728} {"train_loss": -10.313484191894531, "global_step": 122323, "epoch": 728} {"train_loss": -10.45484733581543, "global_step": 122324, "epoch": 728} {"train_loss": -10.412790298461914, "global_step": 122325, "epoch": 728} {"train_loss": -10.327367782592773, "global_step": 122326, "epoch": 728} {"train_loss": -10.505775451660156, "global_step": 122327, "epoch": 728} {"train_loss": -10.282886505126953, "global_step": 122328, "epoch": 728} {"train_loss": -10.421344757080078, "global_step": 122329, "epoch": 728} {"train_loss": -10.503389358520508, "global_step": 122330, "epoch": 728} {"train_loss": -10.39963436126709, "global_step": 122331, "epoch": 728} {"train_loss": -10.126699447631836, "global_step": 122332, "epoch": 728} {"train_loss": -10.415658950805664, "global_step": 122333, "epoch": 728} {"train_loss": -10.358505249023438, "global_step": 122334, "epoch": 728} {"train_loss": -9.907991409301758, "global_step": 122335, "epoch": 728} {"train_loss": -10.585112571716309, "global_step": 122336, "epoch": 728} {"train_loss": -9.31885814666748, "global_step": 122337, "epoch": 728} {"train_loss": -9.715509414672852, "global_step": 122338, "epoch": 728} {"train_loss": -10.370372772216797, "global_step": 122339, "epoch": 728} {"train_loss": -9.456082344055176, "global_step": 122340, "epoch": 728} {"train_loss": -10.332398414611816, "global_step": 122341, "epoch": 728} {"train_loss": -9.786676406860352, "global_step": 122342, "epoch": 728} {"train_loss": -10.077829360961914, "global_step": 122343, "epoch": 728} {"train_loss": -9.925813674926758, "global_step": 122344, "epoch": 728} {"train_loss": -10.187850952148438, "global_step": 122345, "epoch": 728} {"train_loss": -10.323831558227539, "global_step": 122346, "epoch": 728} {"train_loss": -10.354325294494629, "global_step": 122347, "epoch": 728} {"train_loss": -10.19910717010498, "global_step": 122348, "epoch": 728} {"train_loss": -10.219980239868164, "global_step": 122349, "epoch": 728} {"train_loss": -10.221451759338379, "global_step": 122350, "epoch": 728} {"train_loss": -10.408369064331055, "global_step": 122351, "epoch": 728} {"train_loss": -10.28475570678711, "global_step": 122352, "epoch": 728} {"train_loss": -10.464011192321777, "global_step": 122353, "epoch": 728} {"train_loss": -10.348287582397461, "global_step": 122354, "epoch": 728} {"train_loss": -10.198881149291992, "global_step": 122355, "epoch": 728} {"train_loss": -10.300201416015625, "global_step": 122356, "epoch": 728} {"train_loss": -10.150620460510254, "global_step": 122357, "epoch": 728} {"train_loss": -10.375242233276367, "global_step": 122358, "epoch": 728} {"train_loss": -10.263065338134766, "global_step": 122359, "epoch": 728} {"train_loss": -10.095715522766113, "global_step": 122360, "epoch": 728} {"train_loss": -10.199616432189941, "global_step": 122361, "epoch": 728} {"train_loss": -10.222878456115723, "global_step": 122362, "epoch": 728} {"train_loss": -10.425243377685547, "global_step": 122363, "epoch": 728} {"train_loss": -10.392655372619629, "global_step": 122364, "epoch": 728} {"train_loss": -10.42462158203125, "global_step": 122365, "epoch": 728} {"train_loss": -10.337284088134766, "global_step": 122366, "epoch": 728} {"train_loss": -10.368453979492188, "global_step": 122367, "epoch": 728} {"train_loss": -10.485755920410156, "global_step": 122368, "epoch": 728} {"train_loss": -10.284591674804688, "global_step": 122369, "epoch": 728} {"train_loss": -10.289889335632324, "global_step": 122370, "epoch": 728} {"train_loss": -10.182720184326172, "global_step": 122371, "epoch": 728} {"train_loss": -10.620553970336914, "global_step": 122372, "epoch": 728} {"train_loss": -10.378167152404785, "global_step": 122373, "epoch": 728} {"train_loss": -10.153231620788574, "global_step": 122374, "epoch": 728} {"train_loss": -10.334176063537598, "global_step": 122375, "epoch": 728} {"train_loss": -9.676965713500977, "global_step": 122376, "epoch": 728} {"train_loss": -10.277505874633789, "global_step": 122377, "epoch": 728} {"train_loss": -10.194494247436523, "global_step": 122378, "epoch": 728} {"train_loss": -10.189937591552734, "global_step": 122379, "epoch": 728} {"train_loss": -10.318351745605469, "global_step": 122380, "epoch": 728} {"train_loss": -10.434636116027832, "global_step": 122381, "epoch": 728} {"train_loss": -10.444625854492188, "global_step": 122382, "epoch": 728} {"train_loss": -10.23516845703125, "global_step": 122383, "epoch": 728} {"train_loss": -10.084365844726562, "global_step": 122384, "epoch": 728} {"train_loss": -10.218548774719238, "global_step": 122385, "epoch": 728} {"train_loss": -9.921793937683105, "global_step": 122386, "epoch": 728} {"train_loss": -10.149194717407227, "global_step": 122387, "epoch": 728} {"train_loss": -9.998744010925293, "global_step": 122388, "epoch": 728} {"train_loss": -10.412985801696777, "global_step": 122389, "epoch": 728} {"train_loss": -10.214803695678711, "global_step": 122390, "epoch": 728} {"train_loss": -10.379561424255371, "global_step": 122391, "epoch": 728} {"train_loss": -10.261348724365234, "global_step": 122392, "epoch": 728} {"train_loss": -10.372783660888672, "global_step": 122393, "epoch": 728} {"train_loss": -10.182591438293457, "global_step": 122394, "epoch": 728} {"train_loss": -10.252790451049805, "global_step": 122395, "epoch": 728} {"train_loss": -10.090841293334961, "global_step": 122396, "epoch": 728} {"train_loss": -10.307546615600586, "global_step": 122397, "epoch": 728} {"train_loss": -10.532790184020996, "global_step": 122398, "epoch": 728} {"train_loss": -10.287799835205078, "global_step": 122399, "epoch": 728} {"train_loss": -10.240942001342773, "global_step": 122400, "epoch": 728} {"train_loss": -10.331966400146484, "global_step": 122401, "epoch": 728} {"train_loss": -10.321611404418945, "global_step": 122402, "epoch": 728} {"train_loss": -10.40001106262207, "global_step": 122403, "epoch": 728} {"train_loss": -10.249329566955566, "global_step": 122404, "epoch": 728} {"train_loss": -10.236942291259766, "global_step": 122405, "epoch": 728} {"train_loss": -10.258626937866211, "global_step": 122406, "epoch": 728} {"train_loss": -10.325860977172852, "global_step": 122407, "epoch": 728} {"train_loss": -10.037980079650879, "global_step": 122408, "epoch": 728} {"train_loss": -10.350173950195312, "global_step": 122409, "epoch": 728} {"train_loss": -10.392372131347656, "global_step": 122410, "epoch": 728} {"train_loss": -10.206008911132812, "global_step": 122411, "epoch": 728} {"train_loss": -10.283803939819336, "global_step": 122412, "epoch": 728} {"train_loss": -10.06531047821045, "global_step": 122413, "epoch": 728} {"train_loss": -10.166885375976562, "global_step": 122414, "epoch": 728} {"train_loss": -9.948516845703125, "global_step": 122415, "epoch": 728} {"train_loss": -9.97677230834961, "global_step": 122416, "epoch": 728} {"train_loss": -9.984582901000977, "global_step": 122417, "epoch": 728} {"train_loss": -10.273910522460938, "global_step": 122418, "epoch": 728} {"train_loss": -10.138957023620605, "global_step": 122419, "epoch": 728} {"train_loss": -10.187289237976074, "global_step": 122420, "epoch": 728} {"train_loss": -10.311469078063965, "global_step": 122421, "epoch": 728} {"train_loss": -10.208942413330078, "global_step": 122422, "epoch": 728} {"train_loss": -10.255125045776367, "global_step": 122423, "epoch": 728} {"train_loss": -10.407596588134766, "global_step": 122424, "epoch": 728} {"train_loss": -10.197820663452148, "global_step": 122425, "epoch": 728} {"train_loss": -10.218045234680176, "global_step": 122426, "epoch": 728} {"train_loss": -10.456905364990234, "global_step": 122427, "epoch": 728} {"train_loss": -10.298261642456055, "global_step": 122428, "epoch": 728} {"train_loss": -10.471334457397461, "global_step": 122429, "epoch": 728} {"train_loss": -10.367594718933105, "global_step": 122430, "epoch": 728} {"train_loss": -10.35919189453125, "global_step": 122431, "epoch": 728} {"train_loss": -10.392729759216309, "global_step": 122432, "epoch": 728} {"train_loss": -10.299234390258789, "global_step": 122433, "epoch": 728} {"train_loss": -10.166631698608398, "global_step": 122434, "epoch": 728} {"train_loss": -10.473138809204102, "global_step": 122435, "epoch": 728} {"train_loss": -10.204415321350098, "global_step": 122436, "epoch": 728} {"train_loss": -10.165389060974121, "global_step": 122437, "epoch": 728} {"train_loss": -10.215983390808105, "global_step": 122438, "epoch": 728} {"train_loss": -10.504152297973633, "global_step": 122439, "epoch": 728} {"train_loss": -10.072409629821777, "global_step": 122440, "epoch": 728} {"train_loss": -10.189117431640625, "global_step": 122441, "epoch": 728} {"train_loss": -10.356632232666016, "global_step": 122442, "epoch": 728} {"train_loss": -9.99649429321289, "global_step": 122443, "epoch": 728} {"train_loss": -10.30282211303711, "global_step": 122444, "epoch": 728} {"train_loss": -10.159345626831055, "global_step": 122445, "epoch": 728} {"train_loss": -10.302513122558594, "global_step": 122446, "epoch": 728} {"train_loss": -10.330256462097168, "global_step": 122447, "epoch": 728} {"train_loss": -10.096919059753418, "global_step": 122448, "epoch": 728} {"train_loss": -10.438410758972168, "global_step": 122449, "epoch": 728} {"train_loss": -10.187803268432617, "global_step": 122450, "epoch": 728} {"train_loss": -10.092966079711914, "global_step": 122451, "epoch": 728} {"train_loss": -10.116297721862793, "global_step": 122452, "epoch": 728} {"train_loss": -10.138228416442871, "global_step": 122453, "epoch": 728} {"train_loss": -9.907541275024414, "global_step": 122454, "epoch": 728} {"train_loss": -10.130477905273438, "global_step": 122455, "epoch": 728} {"train_loss": -9.861343383789062, "global_step": 122456, "epoch": 728} {"train_loss": -10.252551078796387, "global_step": 122457, "epoch": 728} {"train_loss": -10.065654754638672, "global_step": 122458, "epoch": 728} {"train_loss": -10.212141036987305, "global_step": 122459, "epoch": 728} {"train_loss": -10.43669319152832, "global_step": 122460, "epoch": 728} {"train_loss": -10.085199356079102, "global_step": 122461, "epoch": 728} {"train_loss": -10.34617805480957, "global_step": 122462, "epoch": 728} {"train_loss": -9.865262031555176, "global_step": 122463, "epoch": 728} {"train_loss": -10.380378723144531, "global_step": 122464, "epoch": 728} {"train_loss": -9.861785888671875, "global_step": 122465, "epoch": 728} {"train_loss": -10.251548767089844, "global_step": 122466, "epoch": 728} {"train_loss": -9.93535327911377, "global_step": 122467, "epoch": 728} {"train_loss": -10.255175590515137, "global_step": 122468, "epoch": 728} {"train_loss": -10.180559158325195, "global_step": 122469, "epoch": 728} {"train_loss": -10.229116439819336, "global_step": 122470, "epoch": 728} {"train_loss": -10.235324768793015, "global_step": 122471, "epoch": 728, "val_loss": 215681.8125} {"train_loss": -10.40605354309082, "global_step": 122472, "epoch": 729} {"train_loss": -10.419618606567383, "global_step": 122473, "epoch": 729} {"train_loss": -10.46146011352539, "global_step": 122474, "epoch": 729} {"train_loss": -10.393293380737305, "global_step": 122475, "epoch": 729} {"train_loss": -10.345181465148926, "global_step": 122476, "epoch": 729} {"train_loss": -10.359983444213867, "global_step": 122477, "epoch": 729} {"train_loss": -10.130857467651367, "global_step": 122478, "epoch": 729} {"train_loss": -10.263007164001465, "global_step": 122479, "epoch": 729} {"train_loss": -9.972491264343262, "global_step": 122480, "epoch": 729} {"train_loss": -10.258163452148438, "global_step": 122481, "epoch": 729} {"train_loss": -10.079486846923828, "global_step": 122482, "epoch": 729} {"train_loss": -10.340545654296875, "global_step": 122483, "epoch": 729} {"train_loss": -10.36845874786377, "global_step": 122484, "epoch": 729} {"train_loss": -10.16596794128418, "global_step": 122485, "epoch": 729} {"train_loss": -10.31650161743164, "global_step": 122486, "epoch": 729} {"train_loss": -10.046144485473633, "global_step": 122487, "epoch": 729} {"train_loss": -10.231148719787598, "global_step": 122488, "epoch": 729} {"train_loss": -9.895578384399414, "global_step": 122489, "epoch": 729} {"train_loss": -10.21863079071045, "global_step": 122490, "epoch": 729} {"train_loss": -10.491630554199219, "global_step": 122491, "epoch": 729} {"train_loss": -10.048257827758789, "global_step": 122492, "epoch": 729} {"train_loss": -10.274264335632324, "global_step": 122493, "epoch": 729} {"train_loss": -10.095254898071289, "global_step": 122494, "epoch": 729} {"train_loss": -10.350539207458496, "global_step": 122495, "epoch": 729} {"train_loss": -10.43893814086914, "global_step": 122496, "epoch": 729} {"train_loss": -10.451423645019531, "global_step": 122497, "epoch": 729} {"train_loss": -10.423969268798828, "global_step": 122498, "epoch": 729} {"train_loss": -9.96650505065918, "global_step": 122499, "epoch": 729} {"train_loss": -10.425127029418945, "global_step": 122500, "epoch": 729} {"train_loss": -10.179262161254883, "global_step": 122501, "epoch": 729} {"train_loss": -10.004807472229004, "global_step": 122502, "epoch": 729} {"train_loss": -10.341870307922363, "global_step": 122503, "epoch": 729} {"train_loss": -10.327310562133789, "global_step": 122504, "epoch": 729} {"train_loss": -10.394309997558594, "global_step": 122505, "epoch": 729} {"train_loss": -10.206968307495117, "global_step": 122506, "epoch": 729} {"train_loss": -10.318483352661133, "global_step": 122507, "epoch": 729} {"train_loss": -10.158514976501465, "global_step": 122508, "epoch": 729} {"train_loss": -10.487096786499023, "global_step": 122509, "epoch": 729} {"train_loss": -10.259933471679688, "global_step": 122510, "epoch": 729} {"train_loss": -10.42563247680664, "global_step": 122511, "epoch": 729} {"train_loss": -10.146896362304688, "global_step": 122512, "epoch": 729} {"train_loss": -10.318294525146484, "global_step": 122513, "epoch": 729} {"train_loss": -9.9105224609375, "global_step": 122514, "epoch": 729} {"train_loss": -10.291743278503418, "global_step": 122515, "epoch": 729} {"train_loss": -10.309118270874023, "global_step": 122516, "epoch": 729} {"train_loss": -10.266841888427734, "global_step": 122517, "epoch": 729} {"train_loss": -9.914724349975586, "global_step": 122518, "epoch": 729} {"train_loss": -9.923006057739258, "global_step": 122519, "epoch": 729} {"train_loss": -10.0287446975708, "global_step": 122520, "epoch": 729} {"train_loss": -9.80009937286377, "global_step": 122521, "epoch": 729} {"train_loss": -10.010957717895508, "global_step": 122522, "epoch": 729} {"train_loss": -9.830123901367188, "global_step": 122523, "epoch": 729} {"train_loss": -9.735536575317383, "global_step": 122524, "epoch": 729} {"train_loss": -10.25094985961914, "global_step": 122525, "epoch": 729} {"train_loss": -10.027226448059082, "global_step": 122526, "epoch": 729} {"train_loss": -10.11591625213623, "global_step": 122527, "epoch": 729} {"train_loss": -9.95484733581543, "global_step": 122528, "epoch": 729} {"train_loss": -10.03087043762207, "global_step": 122529, "epoch": 729} {"train_loss": -9.851290702819824, "global_step": 122530, "epoch": 729} {"train_loss": -10.250467300415039, "global_step": 122531, "epoch": 729} {"train_loss": -10.285477638244629, "global_step": 122532, "epoch": 729} {"train_loss": -9.62834358215332, "global_step": 122533, "epoch": 729} {"train_loss": -10.018587112426758, "global_step": 122534, "epoch": 729} {"train_loss": -10.406523704528809, "global_step": 122535, "epoch": 729} {"train_loss": -9.949583053588867, "global_step": 122536, "epoch": 729} {"train_loss": -10.042285919189453, "global_step": 122537, "epoch": 729} {"train_loss": -10.186692237854004, "global_step": 122538, "epoch": 729} {"train_loss": -10.358802795410156, "global_step": 122539, "epoch": 729} {"train_loss": -10.039642333984375, "global_step": 122540, "epoch": 729} {"train_loss": -10.272011756896973, "global_step": 122541, "epoch": 729} {"train_loss": -9.880634307861328, "global_step": 122542, "epoch": 729} {"train_loss": -10.429048538208008, "global_step": 122543, "epoch": 729} {"train_loss": -9.89665699005127, "global_step": 122544, "epoch": 729} {"train_loss": -9.738869667053223, "global_step": 122545, "epoch": 729} {"train_loss": -10.112560272216797, "global_step": 122546, "epoch": 729} {"train_loss": -9.430710792541504, "global_step": 122547, "epoch": 729} {"train_loss": -10.562820434570312, "global_step": 122548, "epoch": 729} {"train_loss": -9.690653800964355, "global_step": 122549, "epoch": 729} {"train_loss": -10.200606346130371, "global_step": 122550, "epoch": 729} {"train_loss": -9.970685005187988, "global_step": 122551, "epoch": 729} {"train_loss": -10.095184326171875, "global_step": 122552, "epoch": 729} {"train_loss": -10.096811294555664, "global_step": 122553, "epoch": 729} {"train_loss": -10.147233963012695, "global_step": 122554, "epoch": 729} {"train_loss": -10.143739700317383, "global_step": 122555, "epoch": 729} {"train_loss": -10.280767440795898, "global_step": 122556, "epoch": 729} {"train_loss": -10.407504081726074, "global_step": 122557, "epoch": 729} {"train_loss": -10.093443870544434, "global_step": 122558, "epoch": 729} {"train_loss": -10.197277069091797, "global_step": 122559, "epoch": 729} {"train_loss": -10.260907173156738, "global_step": 122560, "epoch": 729} {"train_loss": -10.223067283630371, "global_step": 122561, "epoch": 729} {"train_loss": -10.304235458374023, "global_step": 122562, "epoch": 729} {"train_loss": -10.15825080871582, "global_step": 122563, "epoch": 729} {"train_loss": -10.178409576416016, "global_step": 122564, "epoch": 729} {"train_loss": -10.35063648223877, "global_step": 122565, "epoch": 729} {"train_loss": -9.895118713378906, "global_step": 122566, "epoch": 729} {"train_loss": -10.299723625183105, "global_step": 122567, "epoch": 729} {"train_loss": -10.231121063232422, "global_step": 122568, "epoch": 729} {"train_loss": -10.230825424194336, "global_step": 122569, "epoch": 729} {"train_loss": -10.180768966674805, "global_step": 122570, "epoch": 729} {"train_loss": -10.193265914916992, "global_step": 122571, "epoch": 729} {"train_loss": -9.9981107711792, "global_step": 122572, "epoch": 729} {"train_loss": -10.182064056396484, "global_step": 122573, "epoch": 729} {"train_loss": -10.179482460021973, "global_step": 122574, "epoch": 729} {"train_loss": -10.361519813537598, "global_step": 122575, "epoch": 729} {"train_loss": -10.204793930053711, "global_step": 122576, "epoch": 729} {"train_loss": -10.421588897705078, "global_step": 122577, "epoch": 729} {"train_loss": -10.14798355102539, "global_step": 122578, "epoch": 729} {"train_loss": -9.973127365112305, "global_step": 122579, "epoch": 729} {"train_loss": -10.3062105178833, "global_step": 122580, "epoch": 729} {"train_loss": -10.369210243225098, "global_step": 122581, "epoch": 729} {"train_loss": -10.21739387512207, "global_step": 122582, "epoch": 729} {"train_loss": -10.209169387817383, "global_step": 122583, "epoch": 729} {"train_loss": -9.808052062988281, "global_step": 122584, "epoch": 729} {"train_loss": -10.357690811157227, "global_step": 122585, "epoch": 729} {"train_loss": -10.293664932250977, "global_step": 122586, "epoch": 729} {"train_loss": -10.28154182434082, "global_step": 122587, "epoch": 729} {"train_loss": -10.382057189941406, "global_step": 122588, "epoch": 729} {"train_loss": -9.72918701171875, "global_step": 122589, "epoch": 729} {"train_loss": -10.315593719482422, "global_step": 122590, "epoch": 729} {"train_loss": -9.833088874816895, "global_step": 122591, "epoch": 729} {"train_loss": -10.176870346069336, "global_step": 122592, "epoch": 729} {"train_loss": -9.791001319885254, "global_step": 122593, "epoch": 729} {"train_loss": -9.151239395141602, "global_step": 122594, "epoch": 729} {"train_loss": -9.910343170166016, "global_step": 122595, "epoch": 729} {"train_loss": -9.840622901916504, "global_step": 122596, "epoch": 729} {"train_loss": -9.665729522705078, "global_step": 122597, "epoch": 729} {"train_loss": -9.690324783325195, "global_step": 122598, "epoch": 729} {"train_loss": -9.834970474243164, "global_step": 122599, "epoch": 729} {"train_loss": -9.627212524414062, "global_step": 122600, "epoch": 729} {"train_loss": -10.021684646606445, "global_step": 122601, "epoch": 729} {"train_loss": -9.291765213012695, "global_step": 122602, "epoch": 729} {"train_loss": -9.705907821655273, "global_step": 122603, "epoch": 729} {"train_loss": -10.028176307678223, "global_step": 122604, "epoch": 729} {"train_loss": -9.4142484664917, "global_step": 122605, "epoch": 729} {"train_loss": -9.632030487060547, "global_step": 122606, "epoch": 729} {"train_loss": -9.739683151245117, "global_step": 122607, "epoch": 729} {"train_loss": -9.66682243347168, "global_step": 122608, "epoch": 729} {"train_loss": -9.981626510620117, "global_step": 122609, "epoch": 729} {"train_loss": -9.881953239440918, "global_step": 122610, "epoch": 729} {"train_loss": -9.682559967041016, "global_step": 122611, "epoch": 729} {"train_loss": -10.028297424316406, "global_step": 122612, "epoch": 729} {"train_loss": -9.991230964660645, "global_step": 122613, "epoch": 729} {"train_loss": -9.926355361938477, "global_step": 122614, "epoch": 729} {"train_loss": -9.649446487426758, "global_step": 122615, "epoch": 729} {"train_loss": -10.282366752624512, "global_step": 122616, "epoch": 729} {"train_loss": -9.821743965148926, "global_step": 122617, "epoch": 729} {"train_loss": -9.92171859741211, "global_step": 122618, "epoch": 729} {"train_loss": -10.051776885986328, "global_step": 122619, "epoch": 729} {"train_loss": -10.117008209228516, "global_step": 122620, "epoch": 729} {"train_loss": -9.975456237792969, "global_step": 122621, "epoch": 729} {"train_loss": -10.122063636779785, "global_step": 122622, "epoch": 729} {"train_loss": -10.402141571044922, "global_step": 122623, "epoch": 729} {"train_loss": -10.04642105102539, "global_step": 122624, "epoch": 729} {"train_loss": -9.913484573364258, "global_step": 122625, "epoch": 729} {"train_loss": -10.127988815307617, "global_step": 122626, "epoch": 729} {"train_loss": -10.17861557006836, "global_step": 122627, "epoch": 729} {"train_loss": -10.089251518249512, "global_step": 122628, "epoch": 729} {"train_loss": -10.140401840209961, "global_step": 122629, "epoch": 729} {"train_loss": -10.208282470703125, "global_step": 122630, "epoch": 729} {"train_loss": -10.259773254394531, "global_step": 122631, "epoch": 729} {"train_loss": -10.377976417541504, "global_step": 122632, "epoch": 729} {"train_loss": -10.291996002197266, "global_step": 122633, "epoch": 729} {"train_loss": -10.264389038085938, "global_step": 122634, "epoch": 729} {"train_loss": -10.295361518859863, "global_step": 122635, "epoch": 729} {"train_loss": -10.341512680053711, "global_step": 122636, "epoch": 729} {"train_loss": -10.514023780822754, "global_step": 122637, "epoch": 729} {"train_loss": -10.548529624938965, "global_step": 122638, "epoch": 729} {"train_loss": -10.114919917924064, "global_step": 122639, "epoch": 729, "val_loss": 215330.203125} {"train_loss": -10.45237922668457, "global_step": 122640, "epoch": 730} {"train_loss": -10.4583101272583, "global_step": 122641, "epoch": 730} {"train_loss": -10.42669677734375, "global_step": 122642, "epoch": 730} {"train_loss": -10.498403549194336, "global_step": 122643, "epoch": 730} {"train_loss": -10.355123519897461, "global_step": 122644, "epoch": 730} {"train_loss": -10.50504207611084, "global_step": 122645, "epoch": 730} {"train_loss": -10.618293762207031, "global_step": 122646, "epoch": 730} {"train_loss": -10.333524703979492, "global_step": 122647, "epoch": 730} {"train_loss": -10.541894912719727, "global_step": 122648, "epoch": 730} {"train_loss": -10.444174766540527, "global_step": 122649, "epoch": 730} {"train_loss": -10.528841018676758, "global_step": 122650, "epoch": 730} {"train_loss": -10.304509162902832, "global_step": 122651, "epoch": 730} {"train_loss": -10.503003120422363, "global_step": 122652, "epoch": 730} {"train_loss": -10.389432907104492, "global_step": 122653, "epoch": 730} {"train_loss": -10.433048248291016, "global_step": 122654, "epoch": 730} {"train_loss": -10.617729187011719, "global_step": 122655, "epoch": 730} {"train_loss": -10.438995361328125, "global_step": 122656, "epoch": 730} {"train_loss": -9.948917388916016, "global_step": 122657, "epoch": 730} {"train_loss": -10.237960815429688, "global_step": 122658, "epoch": 730} {"train_loss": -9.564565658569336, "global_step": 122659, "epoch": 730} {"train_loss": -9.179391860961914, "global_step": 122660, "epoch": 730} {"train_loss": -10.102160453796387, "global_step": 122661, "epoch": 730} {"train_loss": -10.315763473510742, "global_step": 122662, "epoch": 730} {"train_loss": -9.959228515625, "global_step": 122663, "epoch": 730} {"train_loss": -10.49074935913086, "global_step": 122664, "epoch": 730} {"train_loss": -9.864557266235352, "global_step": 122665, "epoch": 730} {"train_loss": -9.85903549194336, "global_step": 122666, "epoch": 730} {"train_loss": -10.017751693725586, "global_step": 122667, "epoch": 730} {"train_loss": -9.377996444702148, "global_step": 122668, "epoch": 730} {"train_loss": -8.840645790100098, "global_step": 122669, "epoch": 730} {"train_loss": -9.972782135009766, "global_step": 122670, "epoch": 730} {"train_loss": -9.46423625946045, "global_step": 122671, "epoch": 730} {"train_loss": -9.535953521728516, "global_step": 122672, "epoch": 730} {"train_loss": -9.892217636108398, "global_step": 122673, "epoch": 730} {"train_loss": -9.624798774719238, "global_step": 122674, "epoch": 730} {"train_loss": -9.586528778076172, "global_step": 122675, "epoch": 730} {"train_loss": -9.841460227966309, "global_step": 122676, "epoch": 730} {"train_loss": -9.82115364074707, "global_step": 122677, "epoch": 730} {"train_loss": -9.6403169631958, "global_step": 122678, "epoch": 730} {"train_loss": -10.06352424621582, "global_step": 122679, "epoch": 730} {"train_loss": -9.843809127807617, "global_step": 122680, "epoch": 730} {"train_loss": -9.520994186401367, "global_step": 122681, "epoch": 730} {"train_loss": -10.056736946105957, "global_step": 122682, "epoch": 730} {"train_loss": -9.994388580322266, "global_step": 122683, "epoch": 730} {"train_loss": -9.758895874023438, "global_step": 122684, "epoch": 730} {"train_loss": -10.170679092407227, "global_step": 122685, "epoch": 730} {"train_loss": -9.579097747802734, "global_step": 122686, "epoch": 730} {"train_loss": -9.783792495727539, "global_step": 122687, "epoch": 730} {"train_loss": -10.163091659545898, "global_step": 122688, "epoch": 730} {"train_loss": -9.851432800292969, "global_step": 122689, "epoch": 730} {"train_loss": -9.99756908416748, "global_step": 122690, "epoch": 730} {"train_loss": -10.108386993408203, "global_step": 122691, "epoch": 730} {"train_loss": -9.681890487670898, "global_step": 122692, "epoch": 730} {"train_loss": -10.00149154663086, "global_step": 122693, "epoch": 730} {"train_loss": -10.024313926696777, "global_step": 122694, "epoch": 730} {"train_loss": -10.085378646850586, "global_step": 122695, "epoch": 730} {"train_loss": -10.041723251342773, "global_step": 122696, "epoch": 730} {"train_loss": -10.19373893737793, "global_step": 122697, "epoch": 730} {"train_loss": -10.015027046203613, "global_step": 122698, "epoch": 730} {"train_loss": -10.120041847229004, "global_step": 122699, "epoch": 730} {"train_loss": -10.246042251586914, "global_step": 122700, "epoch": 730} {"train_loss": -10.108226776123047, "global_step": 122701, "epoch": 730} {"train_loss": -10.1976957321167, "global_step": 122702, "epoch": 730} {"train_loss": -10.286428451538086, "global_step": 122703, "epoch": 730} {"train_loss": -10.173866271972656, "global_step": 122704, "epoch": 730} {"train_loss": -10.192054748535156, "global_step": 122705, "epoch": 730} {"train_loss": -10.221939086914062, "global_step": 122706, "epoch": 730} {"train_loss": -10.171725273132324, "global_step": 122707, "epoch": 730} {"train_loss": -10.182267189025879, "global_step": 122708, "epoch": 730} {"train_loss": -10.206186294555664, "global_step": 122709, "epoch": 730} {"train_loss": -10.184415817260742, "global_step": 122710, "epoch": 730} {"train_loss": -10.384886741638184, "global_step": 122711, "epoch": 730} {"train_loss": -10.09152603149414, "global_step": 122712, "epoch": 730} {"train_loss": -10.256940841674805, "global_step": 122713, "epoch": 730} {"train_loss": -10.450387954711914, "global_step": 122714, "epoch": 730} {"train_loss": -10.301342010498047, "global_step": 122715, "epoch": 730} {"train_loss": -10.38729476928711, "global_step": 122716, "epoch": 730} {"train_loss": -10.364425659179688, "global_step": 122717, "epoch": 730} {"train_loss": -10.215154647827148, "global_step": 122718, "epoch": 730} {"train_loss": -10.570466041564941, "global_step": 122719, "epoch": 730} {"train_loss": -10.303241729736328, "global_step": 122720, "epoch": 730} {"train_loss": -10.334556579589844, "global_step": 122721, "epoch": 730} {"train_loss": -10.42225456237793, "global_step": 122722, "epoch": 730} {"train_loss": -10.191312789916992, "global_step": 122723, "epoch": 730} {"train_loss": -10.433032989501953, "global_step": 122724, "epoch": 730} {"train_loss": -10.257562637329102, "global_step": 122725, "epoch": 730} {"train_loss": -10.443355560302734, "global_step": 122726, "epoch": 730} {"train_loss": -10.657089233398438, "global_step": 122727, "epoch": 730} {"train_loss": -10.166194915771484, "global_step": 122728, "epoch": 730} {"train_loss": -10.405159950256348, "global_step": 122729, "epoch": 730} {"train_loss": -10.559578895568848, "global_step": 122730, "epoch": 730} {"train_loss": -10.1468505859375, "global_step": 122731, "epoch": 730} {"train_loss": -10.073905944824219, "global_step": 122732, "epoch": 730} {"train_loss": -10.366891860961914, "global_step": 122733, "epoch": 730} {"train_loss": -10.312755584716797, "global_step": 122734, "epoch": 730} {"train_loss": -10.544599533081055, "global_step": 122735, "epoch": 730} {"train_loss": -10.409823417663574, "global_step": 122736, "epoch": 730} {"train_loss": -10.60420036315918, "global_step": 122737, "epoch": 730} {"train_loss": -10.08588981628418, "global_step": 122738, "epoch": 730} {"train_loss": -9.920998573303223, "global_step": 122739, "epoch": 730} {"train_loss": -10.425006866455078, "global_step": 122740, "epoch": 730} {"train_loss": -9.60346794128418, "global_step": 122741, "epoch": 730} {"train_loss": -9.864359855651855, "global_step": 122742, "epoch": 730} {"train_loss": -10.27945613861084, "global_step": 122743, "epoch": 730} {"train_loss": -9.663971900939941, "global_step": 122744, "epoch": 730} {"train_loss": -10.366325378417969, "global_step": 122745, "epoch": 730} {"train_loss": -10.078325271606445, "global_step": 122746, "epoch": 730} {"train_loss": -9.37515640258789, "global_step": 122747, "epoch": 730} {"train_loss": -10.505760192871094, "global_step": 122748, "epoch": 730} {"train_loss": -9.50751781463623, "global_step": 122749, "epoch": 730} {"train_loss": -10.14296817779541, "global_step": 122750, "epoch": 730} {"train_loss": -10.12750244140625, "global_step": 122751, "epoch": 730} {"train_loss": -9.767091751098633, "global_step": 122752, "epoch": 730} {"train_loss": -10.126797676086426, "global_step": 122753, "epoch": 730} {"train_loss": -9.73775577545166, "global_step": 122754, "epoch": 730} {"train_loss": -10.370845794677734, "global_step": 122755, "epoch": 730} {"train_loss": -9.681804656982422, "global_step": 122756, "epoch": 730} {"train_loss": -10.324466705322266, "global_step": 122757, "epoch": 730} {"train_loss": -9.644835472106934, "global_step": 122758, "epoch": 730} {"train_loss": -10.158184051513672, "global_step": 122759, "epoch": 730} {"train_loss": -10.058120727539062, "global_step": 122760, "epoch": 730} {"train_loss": -10.230755805969238, "global_step": 122761, "epoch": 730} {"train_loss": -9.66263484954834, "global_step": 122762, "epoch": 730} {"train_loss": -10.2680025100708, "global_step": 122763, "epoch": 730} {"train_loss": -9.886665344238281, "global_step": 122764, "epoch": 730} {"train_loss": -10.379676818847656, "global_step": 122765, "epoch": 730} {"train_loss": -9.822847366333008, "global_step": 122766, "epoch": 730} {"train_loss": -10.020330429077148, "global_step": 122767, "epoch": 730} {"train_loss": -10.082174301147461, "global_step": 122768, "epoch": 730} {"train_loss": -10.025585174560547, "global_step": 122769, "epoch": 730} {"train_loss": -9.753173828125, "global_step": 122770, "epoch": 730} {"train_loss": -10.288618087768555, "global_step": 122771, "epoch": 730} {"train_loss": -9.966904640197754, "global_step": 122772, "epoch": 730} {"train_loss": -10.3876953125, "global_step": 122773, "epoch": 730} {"train_loss": -9.974966049194336, "global_step": 122774, "epoch": 730} {"train_loss": -10.12086009979248, "global_step": 122775, "epoch": 730} {"train_loss": -10.120946884155273, "global_step": 122776, "epoch": 730} {"train_loss": -10.148113250732422, "global_step": 122777, "epoch": 730} {"train_loss": -9.969335556030273, "global_step": 122778, "epoch": 730} {"train_loss": -10.088700294494629, "global_step": 122779, "epoch": 730} {"train_loss": -9.992415428161621, "global_step": 122780, "epoch": 730} {"train_loss": -10.102933883666992, "global_step": 122781, "epoch": 730} {"train_loss": -10.417675018310547, "global_step": 122782, "epoch": 730} {"train_loss": -9.925637245178223, "global_step": 122783, "epoch": 730} {"train_loss": -10.206436157226562, "global_step": 122784, "epoch": 730} {"train_loss": -9.934507369995117, "global_step": 122785, "epoch": 730} {"train_loss": -9.953963279724121, "global_step": 122786, "epoch": 730} {"train_loss": -9.818988800048828, "global_step": 122787, "epoch": 730} {"train_loss": -10.208111763000488, "global_step": 122788, "epoch": 730} {"train_loss": -9.758929252624512, "global_step": 122789, "epoch": 730} {"train_loss": -9.790693283081055, "global_step": 122790, "epoch": 730} {"train_loss": -10.19178581237793, "global_step": 122791, "epoch": 730} {"train_loss": -9.619364738464355, "global_step": 122792, "epoch": 730} {"train_loss": -10.272623062133789, "global_step": 122793, "epoch": 730} {"train_loss": -10.074980735778809, "global_step": 122794, "epoch": 730} {"train_loss": -9.991460800170898, "global_step": 122795, "epoch": 730} {"train_loss": -9.885577201843262, "global_step": 122796, "epoch": 730} {"train_loss": -9.720277786254883, "global_step": 122797, "epoch": 730} {"train_loss": -9.08558464050293, "global_step": 122798, "epoch": 730} {"train_loss": -9.720525741577148, "global_step": 122799, "epoch": 730} {"train_loss": -9.621194839477539, "global_step": 122800, "epoch": 730} {"train_loss": -9.779756546020508, "global_step": 122801, "epoch": 730} {"train_loss": -9.789368629455566, "global_step": 122802, "epoch": 730} {"train_loss": -9.856693267822266, "global_step": 122803, "epoch": 730} {"train_loss": -9.914762496948242, "global_step": 122804, "epoch": 730} {"train_loss": -10.098459243774414, "global_step": 122805, "epoch": 730} {"train_loss": -9.763311386108398, "global_step": 122806, "epoch": 730} {"train_loss": -10.073687235514322, "global_step": 122807, "epoch": 730, "val_loss": 215532.5625, "train_action_mse_error": 5.858370780944824} {"train_loss": -10.039901733398438, "global_step": 122808, "epoch": 731} {"train_loss": -9.86634635925293, "global_step": 122809, "epoch": 731} {"train_loss": -10.15261459350586, "global_step": 122810, "epoch": 731} {"train_loss": -10.021276473999023, "global_step": 122811, "epoch": 731} {"train_loss": -9.717656135559082, "global_step": 122812, "epoch": 731} {"train_loss": -9.962838172912598, "global_step": 122813, "epoch": 731} {"train_loss": -10.113205909729004, "global_step": 122814, "epoch": 731} {"train_loss": -10.077479362487793, "global_step": 122815, "epoch": 731} {"train_loss": -10.201301574707031, "global_step": 122816, "epoch": 731} {"train_loss": -10.179400444030762, "global_step": 122817, "epoch": 731} {"train_loss": -10.0581693649292, "global_step": 122818, "epoch": 731} {"train_loss": -10.069801330566406, "global_step": 122819, "epoch": 731} {"train_loss": -10.283132553100586, "global_step": 122820, "epoch": 731} {"train_loss": -10.09521198272705, "global_step": 122821, "epoch": 731} {"train_loss": -10.183277130126953, "global_step": 122822, "epoch": 731} {"train_loss": -10.306617736816406, "global_step": 122823, "epoch": 731} {"train_loss": -10.25187873840332, "global_step": 122824, "epoch": 731} {"train_loss": -10.274552345275879, "global_step": 122825, "epoch": 731} {"train_loss": -10.02694320678711, "global_step": 122826, "epoch": 731} {"train_loss": -10.174875259399414, "global_step": 122827, "epoch": 731} {"train_loss": -9.848164558410645, "global_step": 122828, "epoch": 731} {"train_loss": -10.253266334533691, "global_step": 122829, "epoch": 731} {"train_loss": -10.00493049621582, "global_step": 122830, "epoch": 731} {"train_loss": -10.290407180786133, "global_step": 122831, "epoch": 731} {"train_loss": -9.970653533935547, "global_step": 122832, "epoch": 731} {"train_loss": -10.482840538024902, "global_step": 122833, "epoch": 731} {"train_loss": -10.211599349975586, "global_step": 122834, "epoch": 731} {"train_loss": -10.5120849609375, "global_step": 122835, "epoch": 731} {"train_loss": -10.284602165222168, "global_step": 122836, "epoch": 731} {"train_loss": -10.351914405822754, "global_step": 122837, "epoch": 731} {"train_loss": -10.275956153869629, "global_step": 122838, "epoch": 731} {"train_loss": -10.3771333694458, "global_step": 122839, "epoch": 731} {"train_loss": -10.306546211242676, "global_step": 122840, "epoch": 731} {"train_loss": -10.27621841430664, "global_step": 122841, "epoch": 731} {"train_loss": -10.051567077636719, "global_step": 122842, "epoch": 731} {"train_loss": -10.307685852050781, "global_step": 122843, "epoch": 731} {"train_loss": -10.395739555358887, "global_step": 122844, "epoch": 731} {"train_loss": -10.112665176391602, "global_step": 122845, "epoch": 731} {"train_loss": -10.384866714477539, "global_step": 122846, "epoch": 731} {"train_loss": -10.13320541381836, "global_step": 122847, "epoch": 731} {"train_loss": -10.369244575500488, "global_step": 122848, "epoch": 731} {"train_loss": -10.647284507751465, "global_step": 122849, "epoch": 731} {"train_loss": -10.322534561157227, "global_step": 122850, "epoch": 731} {"train_loss": -10.55905532836914, "global_step": 122851, "epoch": 731} {"train_loss": -10.361572265625, "global_step": 122852, "epoch": 731} {"train_loss": -10.438192367553711, "global_step": 122853, "epoch": 731} {"train_loss": -10.378927230834961, "global_step": 122854, "epoch": 731} {"train_loss": -10.169685363769531, "global_step": 122855, "epoch": 731} {"train_loss": -10.521275520324707, "global_step": 122856, "epoch": 731} {"train_loss": -10.325756072998047, "global_step": 122857, "epoch": 731} {"train_loss": -10.394399642944336, "global_step": 122858, "epoch": 731} {"train_loss": -10.63383960723877, "global_step": 122859, "epoch": 731} {"train_loss": -10.219995498657227, "global_step": 122860, "epoch": 731} {"train_loss": -10.350038528442383, "global_step": 122861, "epoch": 731} {"train_loss": -10.392776489257812, "global_step": 122862, "epoch": 731} {"train_loss": -10.476484298706055, "global_step": 122863, "epoch": 731} {"train_loss": -10.273119926452637, "global_step": 122864, "epoch": 731} {"train_loss": -10.37066650390625, "global_step": 122865, "epoch": 731} {"train_loss": -10.618157386779785, "global_step": 122866, "epoch": 731} {"train_loss": -9.774770736694336, "global_step": 122867, "epoch": 731} {"train_loss": -10.201834678649902, "global_step": 122868, "epoch": 731} {"train_loss": -10.398567199707031, "global_step": 122869, "epoch": 731} {"train_loss": -9.578807830810547, "global_step": 122870, "epoch": 731} {"train_loss": -9.495738983154297, "global_step": 122871, "epoch": 731} {"train_loss": -10.024591445922852, "global_step": 122872, "epoch": 731} {"train_loss": -9.811716079711914, "global_step": 122873, "epoch": 731} {"train_loss": -9.578450202941895, "global_step": 122874, "epoch": 731} {"train_loss": -10.357643127441406, "global_step": 122875, "epoch": 731} {"train_loss": -9.991600036621094, "global_step": 122876, "epoch": 731} {"train_loss": -9.912675857543945, "global_step": 122877, "epoch": 731} {"train_loss": -10.515655517578125, "global_step": 122878, "epoch": 731} {"train_loss": -10.092415809631348, "global_step": 122879, "epoch": 731} {"train_loss": -10.24388599395752, "global_step": 122880, "epoch": 731} {"train_loss": -10.352152824401855, "global_step": 122881, "epoch": 731} {"train_loss": -9.86351203918457, "global_step": 122882, "epoch": 731} {"train_loss": -10.310336112976074, "global_step": 122883, "epoch": 731} {"train_loss": -10.057546615600586, "global_step": 122884, "epoch": 731} {"train_loss": -9.97989273071289, "global_step": 122885, "epoch": 731} {"train_loss": -10.083803176879883, "global_step": 122886, "epoch": 731} {"train_loss": -10.461515426635742, "global_step": 122887, "epoch": 731} {"train_loss": -10.431525230407715, "global_step": 122888, "epoch": 731} {"train_loss": -10.108074188232422, "global_step": 122889, "epoch": 731} {"train_loss": -10.109095573425293, "global_step": 122890, "epoch": 731} {"train_loss": -10.379108428955078, "global_step": 122891, "epoch": 731} {"train_loss": -10.33903694152832, "global_step": 122892, "epoch": 731} {"train_loss": -10.468536376953125, "global_step": 122893, "epoch": 731} {"train_loss": -10.440670013427734, "global_step": 122894, "epoch": 731} {"train_loss": -10.412090301513672, "global_step": 122895, "epoch": 731} {"train_loss": -10.16224479675293, "global_step": 122896, "epoch": 731} {"train_loss": -10.374677658081055, "global_step": 122897, "epoch": 731} {"train_loss": -10.134733200073242, "global_step": 122898, "epoch": 731} {"train_loss": -10.3636474609375, "global_step": 122899, "epoch": 731} {"train_loss": -10.37077808380127, "global_step": 122900, "epoch": 731} {"train_loss": -10.013772964477539, "global_step": 122901, "epoch": 731} {"train_loss": -10.446802139282227, "global_step": 122902, "epoch": 731} {"train_loss": -10.181525230407715, "global_step": 122903, "epoch": 731} {"train_loss": -10.236881256103516, "global_step": 122904, "epoch": 731} {"train_loss": -10.303825378417969, "global_step": 122905, "epoch": 731} {"train_loss": -10.137277603149414, "global_step": 122906, "epoch": 731} {"train_loss": -10.431787490844727, "global_step": 122907, "epoch": 731} {"train_loss": -10.124351501464844, "global_step": 122908, "epoch": 731} {"train_loss": -10.354106903076172, "global_step": 122909, "epoch": 731} {"train_loss": -10.333359718322754, "global_step": 122910, "epoch": 731} {"train_loss": -10.406389236450195, "global_step": 122911, "epoch": 731} {"train_loss": -10.2381591796875, "global_step": 122912, "epoch": 731} {"train_loss": -10.440788269042969, "global_step": 122913, "epoch": 731} {"train_loss": -10.200027465820312, "global_step": 122914, "epoch": 731} {"train_loss": -10.094228744506836, "global_step": 122915, "epoch": 731} {"train_loss": -10.031448364257812, "global_step": 122916, "epoch": 731} {"train_loss": -9.991535186767578, "global_step": 122917, "epoch": 731} {"train_loss": -10.233001708984375, "global_step": 122918, "epoch": 731} {"train_loss": -10.332280158996582, "global_step": 122919, "epoch": 731} {"train_loss": -10.008672714233398, "global_step": 122920, "epoch": 731} {"train_loss": -10.157814025878906, "global_step": 122921, "epoch": 731} {"train_loss": -9.838558197021484, "global_step": 122922, "epoch": 731} {"train_loss": -10.299094200134277, "global_step": 122923, "epoch": 731} {"train_loss": -10.084003448486328, "global_step": 122924, "epoch": 731} {"train_loss": -10.075572967529297, "global_step": 122925, "epoch": 731} {"train_loss": -10.346982955932617, "global_step": 122926, "epoch": 731} {"train_loss": -9.543933868408203, "global_step": 122927, "epoch": 731} {"train_loss": -10.167356491088867, "global_step": 122928, "epoch": 731} {"train_loss": -9.663287162780762, "global_step": 122929, "epoch": 731} {"train_loss": -9.910454750061035, "global_step": 122930, "epoch": 731} {"train_loss": -9.50332260131836, "global_step": 122931, "epoch": 731} {"train_loss": -9.835857391357422, "global_step": 122932, "epoch": 731} {"train_loss": -9.718374252319336, "global_step": 122933, "epoch": 731} {"train_loss": -9.690750122070312, "global_step": 122934, "epoch": 731} {"train_loss": -9.483335494995117, "global_step": 122935, "epoch": 731} {"train_loss": -9.96253490447998, "global_step": 122936, "epoch": 731} {"train_loss": -9.998770713806152, "global_step": 122937, "epoch": 731} {"train_loss": -9.55776596069336, "global_step": 122938, "epoch": 731} {"train_loss": -9.600547790527344, "global_step": 122939, "epoch": 731} {"train_loss": -9.617133140563965, "global_step": 122940, "epoch": 731} {"train_loss": -9.803075790405273, "global_step": 122941, "epoch": 731} {"train_loss": -10.272603988647461, "global_step": 122942, "epoch": 731} {"train_loss": -9.529715538024902, "global_step": 122943, "epoch": 731} {"train_loss": -10.126331329345703, "global_step": 122944, "epoch": 731} {"train_loss": -10.121419906616211, "global_step": 122945, "epoch": 731} {"train_loss": -10.156784057617188, "global_step": 122946, "epoch": 731} {"train_loss": -10.019963264465332, "global_step": 122947, "epoch": 731} {"train_loss": -10.13677978515625, "global_step": 122948, "epoch": 731} {"train_loss": -10.200264930725098, "global_step": 122949, "epoch": 731} {"train_loss": -10.152019500732422, "global_step": 122950, "epoch": 731} {"train_loss": -10.261068344116211, "global_step": 122951, "epoch": 731} {"train_loss": -10.203634262084961, "global_step": 122952, "epoch": 731} {"train_loss": -10.323583602905273, "global_step": 122953, "epoch": 731} {"train_loss": -10.467649459838867, "global_step": 122954, "epoch": 731} {"train_loss": -10.237419128417969, "global_step": 122955, "epoch": 731} {"train_loss": -10.423421859741211, "global_step": 122956, "epoch": 731} {"train_loss": -10.198923110961914, "global_step": 122957, "epoch": 731} {"train_loss": -10.324138641357422, "global_step": 122958, "epoch": 731} {"train_loss": -10.152423858642578, "global_step": 122959, "epoch": 731} {"train_loss": -10.250250816345215, "global_step": 122960, "epoch": 731} {"train_loss": -10.176843643188477, "global_step": 122961, "epoch": 731} {"train_loss": -10.020023345947266, "global_step": 122962, "epoch": 731} {"train_loss": -10.345170974731445, "global_step": 122963, "epoch": 731} {"train_loss": -10.351916313171387, "global_step": 122964, "epoch": 731} {"train_loss": -10.496248245239258, "global_step": 122965, "epoch": 731} {"train_loss": -10.008064270019531, "global_step": 122966, "epoch": 731} {"train_loss": -10.542352676391602, "global_step": 122967, "epoch": 731} {"train_loss": -10.257793426513672, "global_step": 122968, "epoch": 731} {"train_loss": -10.134319305419922, "global_step": 122969, "epoch": 731} {"train_loss": -10.45440673828125, "global_step": 122970, "epoch": 731} {"train_loss": -10.179766654968262, "global_step": 122971, "epoch": 731} {"train_loss": -10.37002182006836, "global_step": 122972, "epoch": 731} {"train_loss": -10.405351638793945, "global_step": 122973, "epoch": 731} {"train_loss": -10.565174102783203, "global_step": 122974, "epoch": 731} {"train_loss": -10.17639592715672, "global_step": 122975, "epoch": 731, "val_loss": 214753.765625} {"train_loss": -10.414374351501465, "global_step": 122976, "epoch": 732} {"train_loss": -10.3397855758667, "global_step": 122977, "epoch": 732} {"train_loss": -10.22923469543457, "global_step": 122978, "epoch": 732} {"train_loss": -10.284543991088867, "global_step": 122979, "epoch": 732} {"train_loss": -10.536312103271484, "global_step": 122980, "epoch": 732} {"train_loss": -10.301239967346191, "global_step": 122981, "epoch": 732} {"train_loss": -10.582483291625977, "global_step": 122982, "epoch": 732} {"train_loss": -10.522933959960938, "global_step": 122983, "epoch": 732} {"train_loss": -10.609834671020508, "global_step": 122984, "epoch": 732} {"train_loss": -10.67767333984375, "global_step": 122985, "epoch": 732} {"train_loss": -10.492155075073242, "global_step": 122986, "epoch": 732} {"train_loss": -10.369503021240234, "global_step": 122987, "epoch": 732} {"train_loss": -10.512266159057617, "global_step": 122988, "epoch": 732} {"train_loss": -10.170388221740723, "global_step": 122989, "epoch": 732} {"train_loss": -10.309957504272461, "global_step": 122990, "epoch": 732} {"train_loss": -10.438943862915039, "global_step": 122991, "epoch": 732} {"train_loss": -10.505485534667969, "global_step": 122992, "epoch": 732} {"train_loss": -10.44367504119873, "global_step": 122993, "epoch": 732} {"train_loss": -10.38553524017334, "global_step": 122994, "epoch": 732} {"train_loss": -10.578887939453125, "global_step": 122995, "epoch": 732} {"train_loss": -10.257568359375, "global_step": 122996, "epoch": 732} {"train_loss": -10.45213794708252, "global_step": 122997, "epoch": 732} {"train_loss": -10.064009666442871, "global_step": 122998, "epoch": 732} {"train_loss": -10.088619232177734, "global_step": 122999, "epoch": 732} {"train_loss": -9.953664779663086, "global_step": 123000, "epoch": 732} {"train_loss": -10.247323989868164, "global_step": 123001, "epoch": 732} {"train_loss": -10.164003372192383, "global_step": 123002, "epoch": 732} {"train_loss": -10.0464506149292, "global_step": 123003, "epoch": 732} {"train_loss": -10.315441131591797, "global_step": 123004, "epoch": 732} {"train_loss": -10.065299987792969, "global_step": 123005, "epoch": 732} {"train_loss": -10.144421577453613, "global_step": 123006, "epoch": 732} {"train_loss": -9.81872272491455, "global_step": 123007, "epoch": 732} {"train_loss": -10.103105545043945, "global_step": 123008, "epoch": 732} {"train_loss": -9.365206718444824, "global_step": 123009, "epoch": 732} {"train_loss": -9.73376750946045, "global_step": 123010, "epoch": 732} {"train_loss": -9.561147689819336, "global_step": 123011, "epoch": 732} {"train_loss": -9.826275825500488, "global_step": 123012, "epoch": 732} {"train_loss": -9.676905632019043, "global_step": 123013, "epoch": 732} {"train_loss": -9.90758228302002, "global_step": 123014, "epoch": 732} {"train_loss": -9.512178421020508, "global_step": 123015, "epoch": 732} {"train_loss": -9.91739559173584, "global_step": 123016, "epoch": 732} {"train_loss": -9.08584976196289, "global_step": 123017, "epoch": 732} {"train_loss": -9.857831954956055, "global_step": 123018, "epoch": 732} {"train_loss": -9.067865371704102, "global_step": 123019, "epoch": 732} {"train_loss": -10.088545799255371, "global_step": 123020, "epoch": 732} {"train_loss": -9.267723083496094, "global_step": 123021, "epoch": 732} {"train_loss": -9.59458065032959, "global_step": 123022, "epoch": 732} {"train_loss": -9.740530014038086, "global_step": 123023, "epoch": 732} {"train_loss": -9.410238265991211, "global_step": 123024, "epoch": 732} {"train_loss": -9.32672119140625, "global_step": 123025, "epoch": 732} {"train_loss": -9.745096206665039, "global_step": 123026, "epoch": 732} {"train_loss": -9.816241264343262, "global_step": 123027, "epoch": 732} {"train_loss": -9.385286331176758, "global_step": 123028, "epoch": 732} {"train_loss": -10.007659912109375, "global_step": 123029, "epoch": 732} {"train_loss": -9.59034538269043, "global_step": 123030, "epoch": 732} {"train_loss": -9.706369400024414, "global_step": 123031, "epoch": 732} {"train_loss": -10.14933967590332, "global_step": 123032, "epoch": 732} {"train_loss": -9.585275650024414, "global_step": 123033, "epoch": 732} {"train_loss": -10.043367385864258, "global_step": 123034, "epoch": 732} {"train_loss": -9.604196548461914, "global_step": 123035, "epoch": 732} {"train_loss": -9.476422309875488, "global_step": 123036, "epoch": 732} {"train_loss": -10.104637145996094, "global_step": 123037, "epoch": 732} {"train_loss": -9.939264297485352, "global_step": 123038, "epoch": 732} {"train_loss": -9.906435012817383, "global_step": 123039, "epoch": 732} {"train_loss": -9.895297050476074, "global_step": 123040, "epoch": 732} {"train_loss": -9.880815505981445, "global_step": 123041, "epoch": 732} {"train_loss": -10.109578132629395, "global_step": 123042, "epoch": 732} {"train_loss": -10.094444274902344, "global_step": 123043, "epoch": 732} {"train_loss": -10.102924346923828, "global_step": 123044, "epoch": 732} {"train_loss": -9.978492736816406, "global_step": 123045, "epoch": 732} {"train_loss": -10.259634971618652, "global_step": 123046, "epoch": 732} {"train_loss": -10.231073379516602, "global_step": 123047, "epoch": 732} {"train_loss": -9.873910903930664, "global_step": 123048, "epoch": 732} {"train_loss": -10.219255447387695, "global_step": 123049, "epoch": 732} {"train_loss": -10.188247680664062, "global_step": 123050, "epoch": 732} {"train_loss": -10.11862564086914, "global_step": 123051, "epoch": 732} {"train_loss": -10.149690628051758, "global_step": 123052, "epoch": 732} {"train_loss": -10.339513778686523, "global_step": 123053, "epoch": 732} {"train_loss": -10.277881622314453, "global_step": 123054, "epoch": 732} {"train_loss": -10.098814010620117, "global_step": 123055, "epoch": 732} {"train_loss": -10.29908561706543, "global_step": 123056, "epoch": 732} {"train_loss": -10.189846992492676, "global_step": 123057, "epoch": 732} {"train_loss": -10.245277404785156, "global_step": 123058, "epoch": 732} {"train_loss": -10.29727554321289, "global_step": 123059, "epoch": 732} {"train_loss": -10.306930541992188, "global_step": 123060, "epoch": 732} {"train_loss": -10.1828031539917, "global_step": 123061, "epoch": 732} {"train_loss": -10.370859146118164, "global_step": 123062, "epoch": 732} {"train_loss": -10.029150009155273, "global_step": 123063, "epoch": 732} {"train_loss": -10.358685493469238, "global_step": 123064, "epoch": 732} {"train_loss": -10.3959321975708, "global_step": 123065, "epoch": 732} {"train_loss": -10.346721649169922, "global_step": 123066, "epoch": 732} {"train_loss": -10.533225059509277, "global_step": 123067, "epoch": 732} {"train_loss": -10.603700637817383, "global_step": 123068, "epoch": 732} {"train_loss": -10.482486724853516, "global_step": 123069, "epoch": 732} {"train_loss": -10.339356422424316, "global_step": 123070, "epoch": 732} {"train_loss": -10.464284896850586, "global_step": 123071, "epoch": 732} {"train_loss": -10.306360244750977, "global_step": 123072, "epoch": 732} {"train_loss": -10.31325912475586, "global_step": 123073, "epoch": 732} {"train_loss": -10.401346206665039, "global_step": 123074, "epoch": 732} {"train_loss": -10.146892547607422, "global_step": 123075, "epoch": 732} {"train_loss": -10.278114318847656, "global_step": 123076, "epoch": 732} {"train_loss": -9.984471321105957, "global_step": 123077, "epoch": 732} {"train_loss": -10.242115020751953, "global_step": 123078, "epoch": 732} {"train_loss": -10.338178634643555, "global_step": 123079, "epoch": 732} {"train_loss": -10.437780380249023, "global_step": 123080, "epoch": 732} {"train_loss": -9.922035217285156, "global_step": 123081, "epoch": 732} {"train_loss": -10.488229751586914, "global_step": 123082, "epoch": 732} {"train_loss": -10.109095573425293, "global_step": 123083, "epoch": 732} {"train_loss": -10.26150131225586, "global_step": 123084, "epoch": 732} {"train_loss": -10.296003341674805, "global_step": 123085, "epoch": 732} {"train_loss": -10.120647430419922, "global_step": 123086, "epoch": 732} {"train_loss": -10.407132148742676, "global_step": 123087, "epoch": 732} {"train_loss": -10.236563682556152, "global_step": 123088, "epoch": 732} {"train_loss": -10.619146347045898, "global_step": 123089, "epoch": 732} {"train_loss": -10.161462783813477, "global_step": 123090, "epoch": 732} {"train_loss": -10.262412071228027, "global_step": 123091, "epoch": 732} {"train_loss": -10.162059783935547, "global_step": 123092, "epoch": 732} {"train_loss": -10.165542602539062, "global_step": 123093, "epoch": 732} {"train_loss": -10.099145889282227, "global_step": 123094, "epoch": 732} {"train_loss": -10.076560974121094, "global_step": 123095, "epoch": 732} {"train_loss": -10.216312408447266, "global_step": 123096, "epoch": 732} {"train_loss": -10.211917877197266, "global_step": 123097, "epoch": 732} {"train_loss": -10.081489562988281, "global_step": 123098, "epoch": 732} {"train_loss": -10.141179084777832, "global_step": 123099, "epoch": 732} {"train_loss": -10.147279739379883, "global_step": 123100, "epoch": 732} {"train_loss": -9.946054458618164, "global_step": 123101, "epoch": 732} {"train_loss": -10.042986869812012, "global_step": 123102, "epoch": 732} {"train_loss": -9.992572784423828, "global_step": 123103, "epoch": 732} {"train_loss": -9.672918319702148, "global_step": 123104, "epoch": 732} {"train_loss": -9.820108413696289, "global_step": 123105, "epoch": 732} {"train_loss": -9.626119613647461, "global_step": 123106, "epoch": 732} {"train_loss": -9.549473762512207, "global_step": 123107, "epoch": 732} {"train_loss": -9.986473083496094, "global_step": 123108, "epoch": 732} {"train_loss": -10.015865325927734, "global_step": 123109, "epoch": 732} {"train_loss": -9.619234085083008, "global_step": 123110, "epoch": 732} {"train_loss": -9.880683898925781, "global_step": 123111, "epoch": 732} {"train_loss": -9.803128242492676, "global_step": 123112, "epoch": 732} {"train_loss": -9.705550193786621, "global_step": 123113, "epoch": 732} {"train_loss": -10.255468368530273, "global_step": 123114, "epoch": 732} {"train_loss": -9.457052230834961, "global_step": 123115, "epoch": 732} {"train_loss": -9.972347259521484, "global_step": 123116, "epoch": 732} {"train_loss": -10.031901359558105, "global_step": 123117, "epoch": 732} {"train_loss": -9.789873123168945, "global_step": 123118, "epoch": 732} {"train_loss": -10.145125389099121, "global_step": 123119, "epoch": 732} {"train_loss": -9.861326217651367, "global_step": 123120, "epoch": 732} {"train_loss": -9.841217041015625, "global_step": 123121, "epoch": 732} {"train_loss": -10.403688430786133, "global_step": 123122, "epoch": 732} {"train_loss": -9.793476104736328, "global_step": 123123, "epoch": 732} {"train_loss": -10.078362464904785, "global_step": 123124, "epoch": 732} {"train_loss": -10.249232292175293, "global_step": 123125, "epoch": 732} {"train_loss": -9.97944450378418, "global_step": 123126, "epoch": 732} {"train_loss": -10.096698760986328, "global_step": 123127, "epoch": 732} {"train_loss": -10.094438552856445, "global_step": 123128, "epoch": 732} {"train_loss": -10.184547424316406, "global_step": 123129, "epoch": 732} {"train_loss": -10.058843612670898, "global_step": 123130, "epoch": 732} {"train_loss": -10.309707641601562, "global_step": 123131, "epoch": 732} {"train_loss": -10.129958152770996, "global_step": 123132, "epoch": 732} {"train_loss": -10.226240158081055, "global_step": 123133, "epoch": 732} {"train_loss": -10.295190811157227, "global_step": 123134, "epoch": 732} {"train_loss": -10.290200233459473, "global_step": 123135, "epoch": 732} {"train_loss": -10.299503326416016, "global_step": 123136, "epoch": 732} {"train_loss": -10.16122055053711, "global_step": 123137, "epoch": 732} {"train_loss": -10.148336410522461, "global_step": 123138, "epoch": 732} {"train_loss": -10.075084686279297, "global_step": 123139, "epoch": 732} {"train_loss": -10.290716171264648, "global_step": 123140, "epoch": 732} {"train_loss": -10.353593826293945, "global_step": 123141, "epoch": 732} {"train_loss": -10.171043395996094, "global_step": 123142, "epoch": 732} {"train_loss": -10.091400186220804, "global_step": 123143, "epoch": 732, "val_loss": 214443.546875} {"train_loss": -9.973644256591797, "global_step": 123144, "epoch": 733} {"train_loss": -10.28598403930664, "global_step": 123145, "epoch": 733} {"train_loss": -10.305926322937012, "global_step": 123146, "epoch": 733} {"train_loss": -10.149552345275879, "global_step": 123147, "epoch": 733} {"train_loss": -10.239632606506348, "global_step": 123148, "epoch": 733} {"train_loss": -10.005090713500977, "global_step": 123149, "epoch": 733} {"train_loss": -10.36048698425293, "global_step": 123150, "epoch": 733} {"train_loss": -9.600534439086914, "global_step": 123151, "epoch": 733} {"train_loss": -9.883746147155762, "global_step": 123152, "epoch": 733} {"train_loss": -9.975101470947266, "global_step": 123153, "epoch": 733} {"train_loss": -10.084781646728516, "global_step": 123154, "epoch": 733} {"train_loss": -10.407512664794922, "global_step": 123155, "epoch": 733} {"train_loss": -10.019023895263672, "global_step": 123156, "epoch": 733} {"train_loss": -10.363012313842773, "global_step": 123157, "epoch": 733} {"train_loss": -10.316808700561523, "global_step": 123158, "epoch": 733} {"train_loss": -10.507628440856934, "global_step": 123159, "epoch": 733} {"train_loss": -10.362212181091309, "global_step": 123160, "epoch": 733} {"train_loss": -10.264312744140625, "global_step": 123161, "epoch": 733} {"train_loss": -10.332859992980957, "global_step": 123162, "epoch": 733} {"train_loss": -10.33804988861084, "global_step": 123163, "epoch": 733} {"train_loss": -10.446759223937988, "global_step": 123164, "epoch": 733} {"train_loss": -10.287092208862305, "global_step": 123165, "epoch": 733} {"train_loss": -10.145447731018066, "global_step": 123166, "epoch": 733} {"train_loss": -10.322235107421875, "global_step": 123167, "epoch": 733} {"train_loss": -10.476461410522461, "global_step": 123168, "epoch": 733} {"train_loss": -10.274874687194824, "global_step": 123169, "epoch": 733} {"train_loss": -10.486993789672852, "global_step": 123170, "epoch": 733} {"train_loss": -10.309505462646484, "global_step": 123171, "epoch": 733} {"train_loss": -10.355043411254883, "global_step": 123172, "epoch": 733} {"train_loss": -10.441515922546387, "global_step": 123173, "epoch": 733} {"train_loss": -10.414621353149414, "global_step": 123174, "epoch": 733} {"train_loss": -10.491209030151367, "global_step": 123175, "epoch": 733} {"train_loss": -10.634284973144531, "global_step": 123176, "epoch": 733} {"train_loss": -10.421384811401367, "global_step": 123177, "epoch": 733} {"train_loss": -10.582819938659668, "global_step": 123178, "epoch": 733} {"train_loss": -10.41359806060791, "global_step": 123179, "epoch": 733} {"train_loss": -10.591743469238281, "global_step": 123180, "epoch": 733} {"train_loss": -10.288873672485352, "global_step": 123181, "epoch": 733} {"train_loss": -10.41942024230957, "global_step": 123182, "epoch": 733} {"train_loss": -10.515689849853516, "global_step": 123183, "epoch": 733} {"train_loss": -10.395366668701172, "global_step": 123184, "epoch": 733} {"train_loss": -10.345333099365234, "global_step": 123185, "epoch": 733} {"train_loss": -10.22079086303711, "global_step": 123186, "epoch": 733} {"train_loss": -10.208169937133789, "global_step": 123187, "epoch": 733} {"train_loss": -10.307045936584473, "global_step": 123188, "epoch": 733} {"train_loss": -10.486455917358398, "global_step": 123189, "epoch": 733} {"train_loss": -10.284669876098633, "global_step": 123190, "epoch": 733} {"train_loss": -10.338436126708984, "global_step": 123191, "epoch": 733} {"train_loss": -9.95677661895752, "global_step": 123192, "epoch": 733} {"train_loss": -10.145040512084961, "global_step": 123193, "epoch": 733} {"train_loss": -10.43399715423584, "global_step": 123194, "epoch": 733} {"train_loss": -9.835420608520508, "global_step": 123195, "epoch": 733} {"train_loss": -9.783121109008789, "global_step": 123196, "epoch": 733} {"train_loss": -10.458456039428711, "global_step": 123197, "epoch": 733} {"train_loss": -9.084790229797363, "global_step": 123198, "epoch": 733} {"train_loss": -8.968421936035156, "global_step": 123199, "epoch": 733} {"train_loss": -10.0115966796875, "global_step": 123200, "epoch": 733} {"train_loss": -8.042412757873535, "global_step": 123201, "epoch": 733} {"train_loss": -10.44029712677002, "global_step": 123202, "epoch": 733} {"train_loss": -8.528450012207031, "global_step": 123203, "epoch": 733} {"train_loss": -9.819961547851562, "global_step": 123204, "epoch": 733} {"train_loss": -9.195589065551758, "global_step": 123205, "epoch": 733} {"train_loss": -9.535666465759277, "global_step": 123206, "epoch": 733} {"train_loss": -9.557371139526367, "global_step": 123207, "epoch": 733} {"train_loss": -9.976743698120117, "global_step": 123208, "epoch": 733} {"train_loss": -9.375423431396484, "global_step": 123209, "epoch": 733} {"train_loss": -10.140371322631836, "global_step": 123210, "epoch": 733} {"train_loss": -9.317184448242188, "global_step": 123211, "epoch": 733} {"train_loss": -10.007050514221191, "global_step": 123212, "epoch": 733} {"train_loss": -10.073424339294434, "global_step": 123213, "epoch": 733} {"train_loss": -9.655330657958984, "global_step": 123214, "epoch": 733} {"train_loss": -9.974838256835938, "global_step": 123215, "epoch": 733} {"train_loss": -9.866300582885742, "global_step": 123216, "epoch": 733} {"train_loss": -9.773719787597656, "global_step": 123217, "epoch": 733} {"train_loss": -9.690277099609375, "global_step": 123218, "epoch": 733} {"train_loss": -10.077714920043945, "global_step": 123219, "epoch": 733} {"train_loss": -9.726531982421875, "global_step": 123220, "epoch": 733} {"train_loss": -9.987095832824707, "global_step": 123221, "epoch": 733} {"train_loss": -10.03282642364502, "global_step": 123222, "epoch": 733} {"train_loss": -9.741384506225586, "global_step": 123223, "epoch": 733} {"train_loss": -10.206252098083496, "global_step": 123224, "epoch": 733} {"train_loss": -9.864777565002441, "global_step": 123225, "epoch": 733} {"train_loss": -10.267685890197754, "global_step": 123226, "epoch": 733} {"train_loss": -9.910533905029297, "global_step": 123227, "epoch": 733} {"train_loss": -10.015043258666992, "global_step": 123228, "epoch": 733} {"train_loss": -10.099952697753906, "global_step": 123229, "epoch": 733} {"train_loss": -10.041540145874023, "global_step": 123230, "epoch": 733} {"train_loss": -10.18572998046875, "global_step": 123231, "epoch": 733} {"train_loss": -10.246358871459961, "global_step": 123232, "epoch": 733} {"train_loss": -10.180682182312012, "global_step": 123233, "epoch": 733} {"train_loss": -10.073420524597168, "global_step": 123234, "epoch": 733} {"train_loss": -10.213768005371094, "global_step": 123235, "epoch": 733} {"train_loss": -10.455524444580078, "global_step": 123236, "epoch": 733} {"train_loss": -10.299833297729492, "global_step": 123237, "epoch": 733} {"train_loss": -10.450199127197266, "global_step": 123238, "epoch": 733} {"train_loss": -10.312396049499512, "global_step": 123239, "epoch": 733} {"train_loss": -10.295551300048828, "global_step": 123240, "epoch": 733} {"train_loss": -10.382902145385742, "global_step": 123241, "epoch": 733} {"train_loss": -10.225969314575195, "global_step": 123242, "epoch": 733} {"train_loss": -10.385040283203125, "global_step": 123243, "epoch": 733} {"train_loss": -10.350054740905762, "global_step": 123244, "epoch": 733} {"train_loss": -10.588001251220703, "global_step": 123245, "epoch": 733} {"train_loss": -10.61366081237793, "global_step": 123246, "epoch": 733} {"train_loss": -10.438211441040039, "global_step": 123247, "epoch": 733} {"train_loss": -10.398170471191406, "global_step": 123248, "epoch": 733} {"train_loss": -10.498527526855469, "global_step": 123249, "epoch": 733} {"train_loss": -10.524866104125977, "global_step": 123250, "epoch": 733} {"train_loss": -10.560892105102539, "global_step": 123251, "epoch": 733} {"train_loss": -10.74234390258789, "global_step": 123252, "epoch": 733} {"train_loss": -10.343992233276367, "global_step": 123253, "epoch": 733} {"train_loss": -10.256333351135254, "global_step": 123254, "epoch": 733} {"train_loss": -10.483778953552246, "global_step": 123255, "epoch": 733} {"train_loss": -10.357908248901367, "global_step": 123256, "epoch": 733} {"train_loss": -10.580425262451172, "global_step": 123257, "epoch": 733} {"train_loss": -10.596463203430176, "global_step": 123258, "epoch": 733} {"train_loss": -10.546182632446289, "global_step": 123259, "epoch": 733} {"train_loss": -10.502654075622559, "global_step": 123260, "epoch": 733} {"train_loss": -10.716625213623047, "global_step": 123261, "epoch": 733} {"train_loss": -10.64824104309082, "global_step": 123262, "epoch": 733} {"train_loss": -10.61276626586914, "global_step": 123263, "epoch": 733} {"train_loss": -10.397193908691406, "global_step": 123264, "epoch": 733} {"train_loss": -10.234099388122559, "global_step": 123265, "epoch": 733} {"train_loss": -10.464378356933594, "global_step": 123266, "epoch": 733} {"train_loss": -10.273231506347656, "global_step": 123267, "epoch": 733} {"train_loss": -9.734331130981445, "global_step": 123268, "epoch": 733} {"train_loss": -9.735681533813477, "global_step": 123269, "epoch": 733} {"train_loss": -9.163583755493164, "global_step": 123270, "epoch": 733} {"train_loss": -9.816476821899414, "global_step": 123271, "epoch": 733} {"train_loss": -9.201482772827148, "global_step": 123272, "epoch": 733} {"train_loss": -9.391596794128418, "global_step": 123273, "epoch": 733} {"train_loss": -9.80610466003418, "global_step": 123274, "epoch": 733} {"train_loss": -9.40485954284668, "global_step": 123275, "epoch": 733} {"train_loss": -9.603387832641602, "global_step": 123276, "epoch": 733} {"train_loss": -9.456558227539062, "global_step": 123277, "epoch": 733} {"train_loss": -8.920120239257812, "global_step": 123278, "epoch": 733} {"train_loss": -9.98661994934082, "global_step": 123279, "epoch": 733} {"train_loss": -9.471074104309082, "global_step": 123280, "epoch": 733} {"train_loss": -9.757716178894043, "global_step": 123281, "epoch": 733} {"train_loss": -9.172697067260742, "global_step": 123282, "epoch": 733} {"train_loss": -9.855939865112305, "global_step": 123283, "epoch": 733} {"train_loss": -9.247537612915039, "global_step": 123284, "epoch": 733} {"train_loss": -9.922616958618164, "global_step": 123285, "epoch": 733} {"train_loss": -9.612092971801758, "global_step": 123286, "epoch": 733} {"train_loss": -9.70661449432373, "global_step": 123287, "epoch": 733} {"train_loss": -9.872395515441895, "global_step": 123288, "epoch": 733} {"train_loss": -9.683642387390137, "global_step": 123289, "epoch": 733} {"train_loss": -10.16653823852539, "global_step": 123290, "epoch": 733} {"train_loss": -10.214536666870117, "global_step": 123291, "epoch": 733} {"train_loss": -10.288970947265625, "global_step": 123292, "epoch": 733} {"train_loss": -9.988983154296875, "global_step": 123293, "epoch": 733} {"train_loss": -9.890460968017578, "global_step": 123294, "epoch": 733} {"train_loss": -10.11255168914795, "global_step": 123295, "epoch": 733} {"train_loss": -9.938392639160156, "global_step": 123296, "epoch": 733} {"train_loss": -10.167579650878906, "global_step": 123297, "epoch": 733} {"train_loss": -10.064189910888672, "global_step": 123298, "epoch": 733} {"train_loss": -9.964359283447266, "global_step": 123299, "epoch": 733} {"train_loss": -9.930230140686035, "global_step": 123300, "epoch": 733} {"train_loss": -10.099738121032715, "global_step": 123301, "epoch": 733} {"train_loss": -10.185907363891602, "global_step": 123302, "epoch": 733} {"train_loss": -10.145309448242188, "global_step": 123303, "epoch": 733} {"train_loss": -10.035358428955078, "global_step": 123304, "epoch": 733} {"train_loss": -10.135567665100098, "global_step": 123305, "epoch": 733} {"train_loss": -10.133041381835938, "global_step": 123306, "epoch": 733} {"train_loss": -10.145386695861816, "global_step": 123307, "epoch": 733} {"train_loss": -10.128411293029785, "global_step": 123308, "epoch": 733} {"train_loss": -10.18161678314209, "global_step": 123309, "epoch": 733} {"train_loss": -10.212570190429688, "global_step": 123310, "epoch": 733} {"train_loss": -10.087214203107925, "global_step": 123311, "epoch": 733, "val_loss": 210880.546875} {"train_loss": -10.360233306884766, "global_step": 123312, "epoch": 734} {"train_loss": -10.20467472076416, "global_step": 123313, "epoch": 734} {"train_loss": -10.102598190307617, "global_step": 123314, "epoch": 734} {"train_loss": -10.40896987915039, "global_step": 123315, "epoch": 734} {"train_loss": -10.332368850708008, "global_step": 123316, "epoch": 734} {"train_loss": -10.50586223602295, "global_step": 123317, "epoch": 734} {"train_loss": -10.035469055175781, "global_step": 123318, "epoch": 734} {"train_loss": -10.621328353881836, "global_step": 123319, "epoch": 734} {"train_loss": -10.323866844177246, "global_step": 123320, "epoch": 734} {"train_loss": -10.419504165649414, "global_step": 123321, "epoch": 734} {"train_loss": -10.394264221191406, "global_step": 123322, "epoch": 734} {"train_loss": -10.500978469848633, "global_step": 123323, "epoch": 734} {"train_loss": -10.724082946777344, "global_step": 123324, "epoch": 734} {"train_loss": -10.672874450683594, "global_step": 123325, "epoch": 734} {"train_loss": -10.43227767944336, "global_step": 123326, "epoch": 734} {"train_loss": -10.26717758178711, "global_step": 123327, "epoch": 734} {"train_loss": -10.37426471710205, "global_step": 123328, "epoch": 734} {"train_loss": -10.450490951538086, "global_step": 123329, "epoch": 734} {"train_loss": -10.370772361755371, "global_step": 123330, "epoch": 734} {"train_loss": -10.37781047821045, "global_step": 123331, "epoch": 734} {"train_loss": -10.558965682983398, "global_step": 123332, "epoch": 734} {"train_loss": -10.237431526184082, "global_step": 123333, "epoch": 734} {"train_loss": -10.523904800415039, "global_step": 123334, "epoch": 734} {"train_loss": -10.657970428466797, "global_step": 123335, "epoch": 734} {"train_loss": -9.892614364624023, "global_step": 123336, "epoch": 734} {"train_loss": -10.51809024810791, "global_step": 123337, "epoch": 734} {"train_loss": -9.969043731689453, "global_step": 123338, "epoch": 734} {"train_loss": -10.38961410522461, "global_step": 123339, "epoch": 734} {"train_loss": -10.067937850952148, "global_step": 123340, "epoch": 734} {"train_loss": -10.312217712402344, "global_step": 123341, "epoch": 734} {"train_loss": -10.04395866394043, "global_step": 123342, "epoch": 734} {"train_loss": -10.185367584228516, "global_step": 123343, "epoch": 734} {"train_loss": -10.022405624389648, "global_step": 123344, "epoch": 734} {"train_loss": -9.420550346374512, "global_step": 123345, "epoch": 734} {"train_loss": -10.33864974975586, "global_step": 123346, "epoch": 734} {"train_loss": -9.16887092590332, "global_step": 123347, "epoch": 734} {"train_loss": -10.064092636108398, "global_step": 123348, "epoch": 734} {"train_loss": -9.87286376953125, "global_step": 123349, "epoch": 734} {"train_loss": -10.031332015991211, "global_step": 123350, "epoch": 734} {"train_loss": -10.07438850402832, "global_step": 123351, "epoch": 734} {"train_loss": -9.753732681274414, "global_step": 123352, "epoch": 734} {"train_loss": -10.089849472045898, "global_step": 123353, "epoch": 734} {"train_loss": -10.116233825683594, "global_step": 123354, "epoch": 734} {"train_loss": -10.192846298217773, "global_step": 123355, "epoch": 734} {"train_loss": -10.122598648071289, "global_step": 123356, "epoch": 734} {"train_loss": -10.242964744567871, "global_step": 123357, "epoch": 734} {"train_loss": -9.926223754882812, "global_step": 123358, "epoch": 734} {"train_loss": -10.264426231384277, "global_step": 123359, "epoch": 734} {"train_loss": -9.844597816467285, "global_step": 123360, "epoch": 734} {"train_loss": -10.225870132446289, "global_step": 123361, "epoch": 734} {"train_loss": -9.88284969329834, "global_step": 123362, "epoch": 734} {"train_loss": -10.002420425415039, "global_step": 123363, "epoch": 734} {"train_loss": -10.111628532409668, "global_step": 123364, "epoch": 734} {"train_loss": -10.131452560424805, "global_step": 123365, "epoch": 734} {"train_loss": -10.230676651000977, "global_step": 123366, "epoch": 734} {"train_loss": -10.37147331237793, "global_step": 123367, "epoch": 734} {"train_loss": -10.027059555053711, "global_step": 123368, "epoch": 734} {"train_loss": -9.906513214111328, "global_step": 123369, "epoch": 734} {"train_loss": -10.03813648223877, "global_step": 123370, "epoch": 734} {"train_loss": -10.053407669067383, "global_step": 123371, "epoch": 734} {"train_loss": -9.981256484985352, "global_step": 123372, "epoch": 734} {"train_loss": -10.266314506530762, "global_step": 123373, "epoch": 734} {"train_loss": -10.282970428466797, "global_step": 123374, "epoch": 734} {"train_loss": -10.13907241821289, "global_step": 123375, "epoch": 734} {"train_loss": -10.128284454345703, "global_step": 123376, "epoch": 734} {"train_loss": -9.99772834777832, "global_step": 123377, "epoch": 734} {"train_loss": -10.291725158691406, "global_step": 123378, "epoch": 734} {"train_loss": -10.34564208984375, "global_step": 123379, "epoch": 734} {"train_loss": -10.290733337402344, "global_step": 123380, "epoch": 734} {"train_loss": -10.351875305175781, "global_step": 123381, "epoch": 734} {"train_loss": -10.283122062683105, "global_step": 123382, "epoch": 734} {"train_loss": -10.515096664428711, "global_step": 123383, "epoch": 734} {"train_loss": -10.120536804199219, "global_step": 123384, "epoch": 734} {"train_loss": -10.389410972595215, "global_step": 123385, "epoch": 734} {"train_loss": -10.036243438720703, "global_step": 123386, "epoch": 734} {"train_loss": -10.449980735778809, "global_step": 123387, "epoch": 734} {"train_loss": -10.41185188293457, "global_step": 123388, "epoch": 734} {"train_loss": -10.304736137390137, "global_step": 123389, "epoch": 734} {"train_loss": -10.178165435791016, "global_step": 123390, "epoch": 734} {"train_loss": -10.267559051513672, "global_step": 123391, "epoch": 734} {"train_loss": -10.48615837097168, "global_step": 123392, "epoch": 734} {"train_loss": -10.514358520507812, "global_step": 123393, "epoch": 734} {"train_loss": -10.04342269897461, "global_step": 123394, "epoch": 734} {"train_loss": -10.203920364379883, "global_step": 123395, "epoch": 734} {"train_loss": -10.27785873413086, "global_step": 123396, "epoch": 734} {"train_loss": -9.923349380493164, "global_step": 123397, "epoch": 734} {"train_loss": -10.346824645996094, "global_step": 123398, "epoch": 734} {"train_loss": -10.080233573913574, "global_step": 123399, "epoch": 734} {"train_loss": -9.724102020263672, "global_step": 123400, "epoch": 734} {"train_loss": -10.594741821289062, "global_step": 123401, "epoch": 734} {"train_loss": -9.179014205932617, "global_step": 123402, "epoch": 734} {"train_loss": -10.19317626953125, "global_step": 123403, "epoch": 734} {"train_loss": -9.889945030212402, "global_step": 123404, "epoch": 734} {"train_loss": -9.935218811035156, "global_step": 123405, "epoch": 734} {"train_loss": -9.99550724029541, "global_step": 123406, "epoch": 734} {"train_loss": -9.761247634887695, "global_step": 123407, "epoch": 734} {"train_loss": -9.290162086486816, "global_step": 123408, "epoch": 734} {"train_loss": -9.485443115234375, "global_step": 123409, "epoch": 734} {"train_loss": -10.105945587158203, "global_step": 123410, "epoch": 734} {"train_loss": -9.446791648864746, "global_step": 123411, "epoch": 734} {"train_loss": -9.955292701721191, "global_step": 123412, "epoch": 734} {"train_loss": -9.19365119934082, "global_step": 123413, "epoch": 734} {"train_loss": -10.20690631866455, "global_step": 123414, "epoch": 734} {"train_loss": -9.312616348266602, "global_step": 123415, "epoch": 734} {"train_loss": -10.014945030212402, "global_step": 123416, "epoch": 734} {"train_loss": -9.670884132385254, "global_step": 123417, "epoch": 734} {"train_loss": -10.057968139648438, "global_step": 123418, "epoch": 734} {"train_loss": -9.737048149108887, "global_step": 123419, "epoch": 734} {"train_loss": -10.169652938842773, "global_step": 123420, "epoch": 734} {"train_loss": -9.667074203491211, "global_step": 123421, "epoch": 734} {"train_loss": -10.143564224243164, "global_step": 123422, "epoch": 734} {"train_loss": -10.022830963134766, "global_step": 123423, "epoch": 734} {"train_loss": -9.784355163574219, "global_step": 123424, "epoch": 734} {"train_loss": -9.989642143249512, "global_step": 123425, "epoch": 734} {"train_loss": -9.8954496383667, "global_step": 123426, "epoch": 734} {"train_loss": -9.80147647857666, "global_step": 123427, "epoch": 734} {"train_loss": -9.942756652832031, "global_step": 123428, "epoch": 734} {"train_loss": -9.875901222229004, "global_step": 123429, "epoch": 734} {"train_loss": -9.982357025146484, "global_step": 123430, "epoch": 734} {"train_loss": -10.130155563354492, "global_step": 123431, "epoch": 734} {"train_loss": -9.964216232299805, "global_step": 123432, "epoch": 734} {"train_loss": -9.964752197265625, "global_step": 123433, "epoch": 734} {"train_loss": -10.033647537231445, "global_step": 123434, "epoch": 734} {"train_loss": -9.904480934143066, "global_step": 123435, "epoch": 734} {"train_loss": -9.907292366027832, "global_step": 123436, "epoch": 734} {"train_loss": -10.272140502929688, "global_step": 123437, "epoch": 734} {"train_loss": -10.094747543334961, "global_step": 123438, "epoch": 734} {"train_loss": -10.046835899353027, "global_step": 123439, "epoch": 734} {"train_loss": -9.885480880737305, "global_step": 123440, "epoch": 734} {"train_loss": -10.231184005737305, "global_step": 123441, "epoch": 734} {"train_loss": -10.041996002197266, "global_step": 123442, "epoch": 734} {"train_loss": -9.956656455993652, "global_step": 123443, "epoch": 734} {"train_loss": -10.312629699707031, "global_step": 123444, "epoch": 734} {"train_loss": -9.911591529846191, "global_step": 123445, "epoch": 734} {"train_loss": -10.164283752441406, "global_step": 123446, "epoch": 734} {"train_loss": -10.342191696166992, "global_step": 123447, "epoch": 734} {"train_loss": -10.04391860961914, "global_step": 123448, "epoch": 734} {"train_loss": -10.066766738891602, "global_step": 123449, "epoch": 734} {"train_loss": -10.424421310424805, "global_step": 123450, "epoch": 734} {"train_loss": -10.244688034057617, "global_step": 123451, "epoch": 734} {"train_loss": -10.210566520690918, "global_step": 123452, "epoch": 734} {"train_loss": -10.338360786437988, "global_step": 123453, "epoch": 734} {"train_loss": -10.371541023254395, "global_step": 123454, "epoch": 734} {"train_loss": -10.330598831176758, "global_step": 123455, "epoch": 734} {"train_loss": -10.459510803222656, "global_step": 123456, "epoch": 734} {"train_loss": -10.493894577026367, "global_step": 123457, "epoch": 734} {"train_loss": -10.410400390625, "global_step": 123458, "epoch": 734} {"train_loss": -10.303277969360352, "global_step": 123459, "epoch": 734} {"train_loss": -10.73732852935791, "global_step": 123460, "epoch": 734} {"train_loss": -10.361898422241211, "global_step": 123461, "epoch": 734} {"train_loss": -10.278844833374023, "global_step": 123462, "epoch": 734} {"train_loss": -10.646066665649414, "global_step": 123463, "epoch": 734} {"train_loss": -10.192737579345703, "global_step": 123464, "epoch": 734} {"train_loss": -10.1156644821167, "global_step": 123465, "epoch": 734} {"train_loss": -10.265643119812012, "global_step": 123466, "epoch": 734} {"train_loss": -9.397183418273926, "global_step": 123467, "epoch": 734} {"train_loss": -10.235994338989258, "global_step": 123468, "epoch": 734} {"train_loss": -9.41711139678955, "global_step": 123469, "epoch": 734} {"train_loss": -9.428523063659668, "global_step": 123470, "epoch": 734} {"train_loss": -9.900994300842285, "global_step": 123471, "epoch": 734} {"train_loss": -9.272956848144531, "global_step": 123472, "epoch": 734} {"train_loss": -9.511877059936523, "global_step": 123473, "epoch": 734} {"train_loss": -8.856542587280273, "global_step": 123474, "epoch": 734} {"train_loss": -10.374065399169922, "global_step": 123475, "epoch": 734} {"train_loss": -9.624935150146484, "global_step": 123476, "epoch": 734} {"train_loss": -9.764355659484863, "global_step": 123477, "epoch": 734} {"train_loss": -9.597583770751953, "global_step": 123478, "epoch": 734} {"train_loss": -10.09538421744392, "global_step": 123479, "epoch": 734, "val_loss": 218067.1875} {"train_loss": -9.925247192382812, "global_step": 123480, "epoch": 735} {"train_loss": -9.163808822631836, "global_step": 123481, "epoch": 735} {"train_loss": -9.907114028930664, "global_step": 123482, "epoch": 735} {"train_loss": -9.507537841796875, "global_step": 123483, "epoch": 735} {"train_loss": -9.842018127441406, "global_step": 123484, "epoch": 735} {"train_loss": -9.682621955871582, "global_step": 123485, "epoch": 735} {"train_loss": -9.923723220825195, "global_step": 123486, "epoch": 735} {"train_loss": -10.03823184967041, "global_step": 123487, "epoch": 735} {"train_loss": -9.438961029052734, "global_step": 123488, "epoch": 735} {"train_loss": -10.070258140563965, "global_step": 123489, "epoch": 735} {"train_loss": -9.4622802734375, "global_step": 123490, "epoch": 735} {"train_loss": -9.875728607177734, "global_step": 123491, "epoch": 735} {"train_loss": -10.004115104675293, "global_step": 123492, "epoch": 735} {"train_loss": -9.908051490783691, "global_step": 123493, "epoch": 735} {"train_loss": -10.302337646484375, "global_step": 123494, "epoch": 735} {"train_loss": -9.866232872009277, "global_step": 123495, "epoch": 735} {"train_loss": -9.954111099243164, "global_step": 123496, "epoch": 735} {"train_loss": -9.882792472839355, "global_step": 123497, "epoch": 735} {"train_loss": -10.099222183227539, "global_step": 123498, "epoch": 735} {"train_loss": -10.206971168518066, "global_step": 123499, "epoch": 735} {"train_loss": -10.08373737335205, "global_step": 123500, "epoch": 735} {"train_loss": -10.052154541015625, "global_step": 123501, "epoch": 735} {"train_loss": -10.302640914916992, "global_step": 123502, "epoch": 735} {"train_loss": -10.122640609741211, "global_step": 123503, "epoch": 735} {"train_loss": -10.147043228149414, "global_step": 123504, "epoch": 735} {"train_loss": -10.109537124633789, "global_step": 123505, "epoch": 735} {"train_loss": -10.139638900756836, "global_step": 123506, "epoch": 735} {"train_loss": -10.3641357421875, "global_step": 123507, "epoch": 735} {"train_loss": -10.330527305603027, "global_step": 123508, "epoch": 735} {"train_loss": -10.422486305236816, "global_step": 123509, "epoch": 735} {"train_loss": -10.332040786743164, "global_step": 123510, "epoch": 735} {"train_loss": -10.250040054321289, "global_step": 123511, "epoch": 735} {"train_loss": -10.487419128417969, "global_step": 123512, "epoch": 735} {"train_loss": -10.460567474365234, "global_step": 123513, "epoch": 735} {"train_loss": -10.5845308303833, "global_step": 123514, "epoch": 735} {"train_loss": -10.39808464050293, "global_step": 123515, "epoch": 735} {"train_loss": -10.23723030090332, "global_step": 123516, "epoch": 735} {"train_loss": -10.502115249633789, "global_step": 123517, "epoch": 735} {"train_loss": -10.492426872253418, "global_step": 123518, "epoch": 735} {"train_loss": -10.565286636352539, "global_step": 123519, "epoch": 735} {"train_loss": -10.485157012939453, "global_step": 123520, "epoch": 735} {"train_loss": -10.239749908447266, "global_step": 123521, "epoch": 735} {"train_loss": -10.218152046203613, "global_step": 123522, "epoch": 735} {"train_loss": -10.554659843444824, "global_step": 123523, "epoch": 735} {"train_loss": -10.550237655639648, "global_step": 123524, "epoch": 735} {"train_loss": -10.36520767211914, "global_step": 123525, "epoch": 735} {"train_loss": -10.592107772827148, "global_step": 123526, "epoch": 735} {"train_loss": -10.572172164916992, "global_step": 123527, "epoch": 735} {"train_loss": -10.554542541503906, "global_step": 123528, "epoch": 735} {"train_loss": -10.845294952392578, "global_step": 123529, "epoch": 735} {"train_loss": -10.415742874145508, "global_step": 123530, "epoch": 735} {"train_loss": -10.494935989379883, "global_step": 123531, "epoch": 735} {"train_loss": -10.260838508605957, "global_step": 123532, "epoch": 735} {"train_loss": -10.358874320983887, "global_step": 123533, "epoch": 735} {"train_loss": -10.270696640014648, "global_step": 123534, "epoch": 735} {"train_loss": -10.272716522216797, "global_step": 123535, "epoch": 735} {"train_loss": -10.000429153442383, "global_step": 123536, "epoch": 735} {"train_loss": -10.17470645904541, "global_step": 123537, "epoch": 735} {"train_loss": -9.588029861450195, "global_step": 123538, "epoch": 735} {"train_loss": -9.83973217010498, "global_step": 123539, "epoch": 735} {"train_loss": -9.924490928649902, "global_step": 123540, "epoch": 735} {"train_loss": -9.977611541748047, "global_step": 123541, "epoch": 735} {"train_loss": -9.93113899230957, "global_step": 123542, "epoch": 735} {"train_loss": -10.057561874389648, "global_step": 123543, "epoch": 735} {"train_loss": -9.305241584777832, "global_step": 123544, "epoch": 735} {"train_loss": -10.29813003540039, "global_step": 123545, "epoch": 735} {"train_loss": -8.968101501464844, "global_step": 123546, "epoch": 735} {"train_loss": -10.11014461517334, "global_step": 123547, "epoch": 735} {"train_loss": -9.704090118408203, "global_step": 123548, "epoch": 735} {"train_loss": -10.013219833374023, "global_step": 123549, "epoch": 735} {"train_loss": -9.784248352050781, "global_step": 123550, "epoch": 735} {"train_loss": -10.073932647705078, "global_step": 123551, "epoch": 735} {"train_loss": -10.025354385375977, "global_step": 123552, "epoch": 735} {"train_loss": -9.971680641174316, "global_step": 123553, "epoch": 735} {"train_loss": -9.699136734008789, "global_step": 123554, "epoch": 735} {"train_loss": -9.730127334594727, "global_step": 123555, "epoch": 735} {"train_loss": -9.849544525146484, "global_step": 123556, "epoch": 735} {"train_loss": -10.085813522338867, "global_step": 123557, "epoch": 735} {"train_loss": -9.91147518157959, "global_step": 123558, "epoch": 735} {"train_loss": -9.934761047363281, "global_step": 123559, "epoch": 735} {"train_loss": -10.005112648010254, "global_step": 123560, "epoch": 735} {"train_loss": -9.91114616394043, "global_step": 123561, "epoch": 735} {"train_loss": -9.983017921447754, "global_step": 123562, "epoch": 735} {"train_loss": -10.113748550415039, "global_step": 123563, "epoch": 735} {"train_loss": -10.097801208496094, "global_step": 123564, "epoch": 735} {"train_loss": -10.218860626220703, "global_step": 123565, "epoch": 735} {"train_loss": -10.274285316467285, "global_step": 123566, "epoch": 735} {"train_loss": -9.94935131072998, "global_step": 123567, "epoch": 735} {"train_loss": -10.297707557678223, "global_step": 123568, "epoch": 735} {"train_loss": -10.21748161315918, "global_step": 123569, "epoch": 735} {"train_loss": -10.36319351196289, "global_step": 123570, "epoch": 735} {"train_loss": -9.911178588867188, "global_step": 123571, "epoch": 735} {"train_loss": -10.167618751525879, "global_step": 123572, "epoch": 735} {"train_loss": -10.198652267456055, "global_step": 123573, "epoch": 735} {"train_loss": -10.18643569946289, "global_step": 123574, "epoch": 735} {"train_loss": -10.3466215133667, "global_step": 123575, "epoch": 735} {"train_loss": -10.276012420654297, "global_step": 123576, "epoch": 735} {"train_loss": -10.39555549621582, "global_step": 123577, "epoch": 735} {"train_loss": -10.154903411865234, "global_step": 123578, "epoch": 735} {"train_loss": -10.36623764038086, "global_step": 123579, "epoch": 735} {"train_loss": -10.241254806518555, "global_step": 123580, "epoch": 735} {"train_loss": -10.24499225616455, "global_step": 123581, "epoch": 735} {"train_loss": -10.193401336669922, "global_step": 123582, "epoch": 735} {"train_loss": -10.174126625061035, "global_step": 123583, "epoch": 735} {"train_loss": -10.329081535339355, "global_step": 123584, "epoch": 735} {"train_loss": -9.923103332519531, "global_step": 123585, "epoch": 735} {"train_loss": -10.388822555541992, "global_step": 123586, "epoch": 735} {"train_loss": -9.855287551879883, "global_step": 123587, "epoch": 735} {"train_loss": -10.471920013427734, "global_step": 123588, "epoch": 735} {"train_loss": -9.983078002929688, "global_step": 123589, "epoch": 735} {"train_loss": -10.394678115844727, "global_step": 123590, "epoch": 735} {"train_loss": -10.048462867736816, "global_step": 123591, "epoch": 735} {"train_loss": -10.11172866821289, "global_step": 123592, "epoch": 735} {"train_loss": -10.715886116027832, "global_step": 123593, "epoch": 735} {"train_loss": -9.99332332611084, "global_step": 123594, "epoch": 735} {"train_loss": -10.230405807495117, "global_step": 123595, "epoch": 735} {"train_loss": -10.19093132019043, "global_step": 123596, "epoch": 735} {"train_loss": -9.97608757019043, "global_step": 123597, "epoch": 735} {"train_loss": -10.269793510437012, "global_step": 123598, "epoch": 735} {"train_loss": -10.141746520996094, "global_step": 123599, "epoch": 735} {"train_loss": -10.272825241088867, "global_step": 123600, "epoch": 735} {"train_loss": -10.497613906860352, "global_step": 123601, "epoch": 735} {"train_loss": -10.366405487060547, "global_step": 123602, "epoch": 735} {"train_loss": -10.109628677368164, "global_step": 123603, "epoch": 735} {"train_loss": -10.388218879699707, "global_step": 123604, "epoch": 735} {"train_loss": -10.23056411743164, "global_step": 123605, "epoch": 735} {"train_loss": -10.203715324401855, "global_step": 123606, "epoch": 735} {"train_loss": -10.45859146118164, "global_step": 123607, "epoch": 735} {"train_loss": -10.365453720092773, "global_step": 123608, "epoch": 735} {"train_loss": -10.347447395324707, "global_step": 123609, "epoch": 735} {"train_loss": -10.400903701782227, "global_step": 123610, "epoch": 735} {"train_loss": -9.896150588989258, "global_step": 123611, "epoch": 735} {"train_loss": -10.394938468933105, "global_step": 123612, "epoch": 735} {"train_loss": -10.350841522216797, "global_step": 123613, "epoch": 735} {"train_loss": -10.4605712890625, "global_step": 123614, "epoch": 735} {"train_loss": -10.486971855163574, "global_step": 123615, "epoch": 735} {"train_loss": -10.356929779052734, "global_step": 123616, "epoch": 735} {"train_loss": -10.524981498718262, "global_step": 123617, "epoch": 735} {"train_loss": -10.085060119628906, "global_step": 123618, "epoch": 735} {"train_loss": -10.672054290771484, "global_step": 123619, "epoch": 735} {"train_loss": -10.123241424560547, "global_step": 123620, "epoch": 735} {"train_loss": -10.339954376220703, "global_step": 123621, "epoch": 735} {"train_loss": -10.447488784790039, "global_step": 123622, "epoch": 735} {"train_loss": -10.183212280273438, "global_step": 123623, "epoch": 735} {"train_loss": -10.504684448242188, "global_step": 123624, "epoch": 735} {"train_loss": -10.089634895324707, "global_step": 123625, "epoch": 735} {"train_loss": -10.286487579345703, "global_step": 123626, "epoch": 735} {"train_loss": -10.311040878295898, "global_step": 123627, "epoch": 735} {"train_loss": -10.218918800354004, "global_step": 123628, "epoch": 735} {"train_loss": -10.311075210571289, "global_step": 123629, "epoch": 735} {"train_loss": -10.293717384338379, "global_step": 123630, "epoch": 735} {"train_loss": -10.549203872680664, "global_step": 123631, "epoch": 735} {"train_loss": -10.195001602172852, "global_step": 123632, "epoch": 735} {"train_loss": -10.163875579833984, "global_step": 123633, "epoch": 735} {"train_loss": -10.158918380737305, "global_step": 123634, "epoch": 735} {"train_loss": -10.496847152709961, "global_step": 123635, "epoch": 735} {"train_loss": -10.108867645263672, "global_step": 123636, "epoch": 735} {"train_loss": -10.301528930664062, "global_step": 123637, "epoch": 735} {"train_loss": -10.520818710327148, "global_step": 123638, "epoch": 735} {"train_loss": -10.442866325378418, "global_step": 123639, "epoch": 735} {"train_loss": -10.18058967590332, "global_step": 123640, "epoch": 735} {"train_loss": -10.272224426269531, "global_step": 123641, "epoch": 735} {"train_loss": -10.157292366027832, "global_step": 123642, "epoch": 735} {"train_loss": -10.230195999145508, "global_step": 123643, "epoch": 735} {"train_loss": -10.23491096496582, "global_step": 123644, "epoch": 735} {"train_loss": -10.069111824035645, "global_step": 123645, "epoch": 735} {"train_loss": -10.029369354248047, "global_step": 123646, "epoch": 735} {"train_loss": -10.173189600308737, "global_step": 123647, "epoch": 735, "val_loss": 215318.25, "train_action_mse_error": 1.294553518295288} {"train_loss": -10.24478530883789, "global_step": 123648, "epoch": 736} {"train_loss": -10.17399787902832, "global_step": 123649, "epoch": 736} {"train_loss": -9.979077339172363, "global_step": 123650, "epoch": 736} {"train_loss": -10.099987030029297, "global_step": 123651, "epoch": 736} {"train_loss": -10.182414054870605, "global_step": 123652, "epoch": 736} {"train_loss": -10.319075584411621, "global_step": 123653, "epoch": 736} {"train_loss": -9.82292366027832, "global_step": 123654, "epoch": 736} {"train_loss": -10.179008483886719, "global_step": 123655, "epoch": 736} {"train_loss": -10.111778259277344, "global_step": 123656, "epoch": 736} {"train_loss": -9.73154067993164, "global_step": 123657, "epoch": 736} {"train_loss": -10.27126693725586, "global_step": 123658, "epoch": 736} {"train_loss": -9.900604248046875, "global_step": 123659, "epoch": 736} {"train_loss": -10.069384574890137, "global_step": 123660, "epoch": 736} {"train_loss": -9.461296081542969, "global_step": 123661, "epoch": 736} {"train_loss": -10.093388557434082, "global_step": 123662, "epoch": 736} {"train_loss": -10.066356658935547, "global_step": 123663, "epoch": 736} {"train_loss": -9.850872039794922, "global_step": 123664, "epoch": 736} {"train_loss": -10.014081954956055, "global_step": 123665, "epoch": 736} {"train_loss": -10.424947738647461, "global_step": 123666, "epoch": 736} {"train_loss": -10.012324333190918, "global_step": 123667, "epoch": 736} {"train_loss": -10.097103118896484, "global_step": 123668, "epoch": 736} {"train_loss": -9.992305755615234, "global_step": 123669, "epoch": 736} {"train_loss": -10.424236297607422, "global_step": 123670, "epoch": 736} {"train_loss": -9.593669891357422, "global_step": 123671, "epoch": 736} {"train_loss": -10.309797286987305, "global_step": 123672, "epoch": 736} {"train_loss": -10.100934982299805, "global_step": 123673, "epoch": 736} {"train_loss": -9.906343460083008, "global_step": 123674, "epoch": 736} {"train_loss": -9.902575492858887, "global_step": 123675, "epoch": 736} {"train_loss": -10.303725242614746, "global_step": 123676, "epoch": 736} {"train_loss": -9.834680557250977, "global_step": 123677, "epoch": 736} {"train_loss": -10.400856018066406, "global_step": 123678, "epoch": 736} {"train_loss": -10.061605453491211, "global_step": 123679, "epoch": 736} {"train_loss": -10.233753204345703, "global_step": 123680, "epoch": 736} {"train_loss": -10.28194522857666, "global_step": 123681, "epoch": 736} {"train_loss": -9.973913192749023, "global_step": 123682, "epoch": 736} {"train_loss": -10.340288162231445, "global_step": 123683, "epoch": 736} {"train_loss": -10.259145736694336, "global_step": 123684, "epoch": 736} {"train_loss": -10.489604949951172, "global_step": 123685, "epoch": 736} {"train_loss": -9.972843170166016, "global_step": 123686, "epoch": 736} {"train_loss": -10.498920440673828, "global_step": 123687, "epoch": 736} {"train_loss": -10.067258834838867, "global_step": 123688, "epoch": 736} {"train_loss": -10.124342918395996, "global_step": 123689, "epoch": 736} {"train_loss": -9.816478729248047, "global_step": 123690, "epoch": 736} {"train_loss": -9.71877670288086, "global_step": 123691, "epoch": 736} {"train_loss": -10.192891120910645, "global_step": 123692, "epoch": 736} {"train_loss": -10.216362953186035, "global_step": 123693, "epoch": 736} {"train_loss": -9.841184616088867, "global_step": 123694, "epoch": 736} {"train_loss": -10.080766677856445, "global_step": 123695, "epoch": 736} {"train_loss": -10.228906631469727, "global_step": 123696, "epoch": 736} {"train_loss": -10.067842483520508, "global_step": 123697, "epoch": 736} {"train_loss": -10.436920166015625, "global_step": 123698, "epoch": 736} {"train_loss": -10.267663955688477, "global_step": 123699, "epoch": 736} {"train_loss": -10.184646606445312, "global_step": 123700, "epoch": 736} {"train_loss": -10.204492568969727, "global_step": 123701, "epoch": 736} {"train_loss": -10.388524055480957, "global_step": 123702, "epoch": 736} {"train_loss": -10.298423767089844, "global_step": 123703, "epoch": 736} {"train_loss": -10.356806755065918, "global_step": 123704, "epoch": 736} {"train_loss": -10.264335632324219, "global_step": 123705, "epoch": 736} {"train_loss": -10.171333312988281, "global_step": 123706, "epoch": 736} {"train_loss": -10.211691856384277, "global_step": 123707, "epoch": 736} {"train_loss": -9.99593448638916, "global_step": 123708, "epoch": 736} {"train_loss": -10.335641860961914, "global_step": 123709, "epoch": 736} {"train_loss": -10.257326126098633, "global_step": 123710, "epoch": 736} {"train_loss": -10.180561065673828, "global_step": 123711, "epoch": 736} {"train_loss": -9.989849090576172, "global_step": 123712, "epoch": 736} {"train_loss": -10.063138961791992, "global_step": 123713, "epoch": 736} {"train_loss": -10.359872817993164, "global_step": 123714, "epoch": 736} {"train_loss": -10.091812133789062, "global_step": 123715, "epoch": 736} {"train_loss": -10.486818313598633, "global_step": 123716, "epoch": 736} {"train_loss": -10.01054859161377, "global_step": 123717, "epoch": 736} {"train_loss": -10.324590682983398, "global_step": 123718, "epoch": 736} {"train_loss": -10.234981536865234, "global_step": 123719, "epoch": 736} {"train_loss": -10.297746658325195, "global_step": 123720, "epoch": 736} {"train_loss": -10.217360496520996, "global_step": 123721, "epoch": 736} {"train_loss": -10.475364685058594, "global_step": 123722, "epoch": 736} {"train_loss": -10.24866008758545, "global_step": 123723, "epoch": 736} {"train_loss": -10.303338050842285, "global_step": 123724, "epoch": 736} {"train_loss": -10.506486892700195, "global_step": 123725, "epoch": 736} {"train_loss": -10.605287551879883, "global_step": 123726, "epoch": 736} {"train_loss": -10.205509185791016, "global_step": 123727, "epoch": 736} {"train_loss": -10.185871124267578, "global_step": 123728, "epoch": 736} {"train_loss": -10.371927261352539, "global_step": 123729, "epoch": 736} {"train_loss": -10.277596473693848, "global_step": 123730, "epoch": 736} {"train_loss": -10.41392707824707, "global_step": 123731, "epoch": 736} {"train_loss": -10.45885944366455, "global_step": 123732, "epoch": 736} {"train_loss": -10.501811981201172, "global_step": 123733, "epoch": 736} {"train_loss": -10.501582145690918, "global_step": 123734, "epoch": 736} {"train_loss": -10.435876846313477, "global_step": 123735, "epoch": 736} {"train_loss": -10.387852668762207, "global_step": 123736, "epoch": 736} {"train_loss": -10.591652870178223, "global_step": 123737, "epoch": 736} {"train_loss": -10.33175277709961, "global_step": 123738, "epoch": 736} {"train_loss": -10.434185028076172, "global_step": 123739, "epoch": 736} {"train_loss": -10.460151672363281, "global_step": 123740, "epoch": 736} {"train_loss": -10.581583023071289, "global_step": 123741, "epoch": 736} {"train_loss": -10.067859649658203, "global_step": 123742, "epoch": 736} {"train_loss": -10.48360824584961, "global_step": 123743, "epoch": 736} {"train_loss": -10.222673416137695, "global_step": 123744, "epoch": 736} {"train_loss": -10.402074813842773, "global_step": 123745, "epoch": 736} {"train_loss": -10.643024444580078, "global_step": 123746, "epoch": 736} {"train_loss": -10.617196083068848, "global_step": 123747, "epoch": 736} {"train_loss": -10.529163360595703, "global_step": 123748, "epoch": 736} {"train_loss": -10.362822532653809, "global_step": 123749, "epoch": 736} {"train_loss": -10.561477661132812, "global_step": 123750, "epoch": 736} {"train_loss": -10.689142227172852, "global_step": 123751, "epoch": 736} {"train_loss": -10.663467407226562, "global_step": 123752, "epoch": 736} {"train_loss": -10.505626678466797, "global_step": 123753, "epoch": 736} {"train_loss": -10.335039138793945, "global_step": 123754, "epoch": 736} {"train_loss": -10.749711990356445, "global_step": 123755, "epoch": 736} {"train_loss": -10.65444278717041, "global_step": 123756, "epoch": 736} {"train_loss": -10.629886627197266, "global_step": 123757, "epoch": 736} {"train_loss": -10.54460620880127, "global_step": 123758, "epoch": 736} {"train_loss": -10.416067123413086, "global_step": 123759, "epoch": 736} {"train_loss": -10.668313980102539, "global_step": 123760, "epoch": 736} {"train_loss": -10.45693588256836, "global_step": 123761, "epoch": 736} {"train_loss": -10.614838600158691, "global_step": 123762, "epoch": 736} {"train_loss": -10.223487854003906, "global_step": 123763, "epoch": 736} {"train_loss": -10.366985321044922, "global_step": 123764, "epoch": 736} {"train_loss": -10.284137725830078, "global_step": 123765, "epoch": 736} {"train_loss": -10.452713012695312, "global_step": 123766, "epoch": 736} {"train_loss": -10.360363006591797, "global_step": 123767, "epoch": 736} {"train_loss": -10.544479370117188, "global_step": 123768, "epoch": 736} {"train_loss": -10.286108016967773, "global_step": 123769, "epoch": 736} {"train_loss": -9.910919189453125, "global_step": 123770, "epoch": 736} {"train_loss": -10.18130111694336, "global_step": 123771, "epoch": 736} {"train_loss": -10.020500183105469, "global_step": 123772, "epoch": 736} {"train_loss": -10.128096580505371, "global_step": 123773, "epoch": 736} {"train_loss": -10.152287483215332, "global_step": 123774, "epoch": 736} {"train_loss": -10.321178436279297, "global_step": 123775, "epoch": 736} {"train_loss": -10.137674331665039, "global_step": 123776, "epoch": 736} {"train_loss": -10.180231094360352, "global_step": 123777, "epoch": 736} {"train_loss": -10.106744766235352, "global_step": 123778, "epoch": 736} {"train_loss": -10.366050720214844, "global_step": 123779, "epoch": 736} {"train_loss": -9.956174850463867, "global_step": 123780, "epoch": 736} {"train_loss": -10.424509048461914, "global_step": 123781, "epoch": 736} {"train_loss": -10.073150634765625, "global_step": 123782, "epoch": 736} {"train_loss": -10.277887344360352, "global_step": 123783, "epoch": 736} {"train_loss": -10.110053062438965, "global_step": 123784, "epoch": 736} {"train_loss": -9.844649314880371, "global_step": 123785, "epoch": 736} {"train_loss": -10.11624813079834, "global_step": 123786, "epoch": 736} {"train_loss": -9.780061721801758, "global_step": 123787, "epoch": 736} {"train_loss": -10.171882629394531, "global_step": 123788, "epoch": 736} {"train_loss": -9.417572021484375, "global_step": 123789, "epoch": 736} {"train_loss": -9.245255470275879, "global_step": 123790, "epoch": 736} {"train_loss": -9.839733123779297, "global_step": 123791, "epoch": 736} {"train_loss": -8.720138549804688, "global_step": 123792, "epoch": 736} {"train_loss": -10.093720436096191, "global_step": 123793, "epoch": 736} {"train_loss": -9.342235565185547, "global_step": 123794, "epoch": 736} {"train_loss": -9.788257598876953, "global_step": 123795, "epoch": 736} {"train_loss": -9.577184677124023, "global_step": 123796, "epoch": 736} {"train_loss": -10.07665729522705, "global_step": 123797, "epoch": 736} {"train_loss": -9.542435646057129, "global_step": 123798, "epoch": 736} {"train_loss": -10.003803253173828, "global_step": 123799, "epoch": 736} {"train_loss": -9.266910552978516, "global_step": 123800, "epoch": 736} {"train_loss": -9.887017250061035, "global_step": 123801, "epoch": 736} {"train_loss": -10.007722854614258, "global_step": 123802, "epoch": 736} {"train_loss": -10.009387969970703, "global_step": 123803, "epoch": 736} {"train_loss": -9.91769790649414, "global_step": 123804, "epoch": 736} {"train_loss": -9.764237403869629, "global_step": 123805, "epoch": 736} {"train_loss": -9.802989959716797, "global_step": 123806, "epoch": 736} {"train_loss": -9.907625198364258, "global_step": 123807, "epoch": 736} {"train_loss": -9.328163146972656, "global_step": 123808, "epoch": 736} {"train_loss": -9.881235122680664, "global_step": 123809, "epoch": 736} {"train_loss": -9.531000137329102, "global_step": 123810, "epoch": 736} {"train_loss": -10.179597854614258, "global_step": 123811, "epoch": 736} {"train_loss": -9.411134719848633, "global_step": 123812, "epoch": 736} {"train_loss": -10.083141326904297, "global_step": 123813, "epoch": 736} {"train_loss": -9.913583755493164, "global_step": 123814, "epoch": 736} {"train_loss": -10.156773147128877, "global_step": 123815, "epoch": 736, "val_loss": 214247.265625} {"train_loss": -9.944406509399414, "global_step": 123816, "epoch": 737} {"train_loss": -10.293575286865234, "global_step": 123817, "epoch": 737} {"train_loss": -9.752950668334961, "global_step": 123818, "epoch": 737} {"train_loss": -10.3177490234375, "global_step": 123819, "epoch": 737} {"train_loss": -10.071008682250977, "global_step": 123820, "epoch": 737} {"train_loss": -10.10720443725586, "global_step": 123821, "epoch": 737} {"train_loss": -10.451881408691406, "global_step": 123822, "epoch": 737} {"train_loss": -10.021795272827148, "global_step": 123823, "epoch": 737} {"train_loss": -10.346769332885742, "global_step": 123824, "epoch": 737} {"train_loss": -10.13956069946289, "global_step": 123825, "epoch": 737} {"train_loss": -10.137327194213867, "global_step": 123826, "epoch": 737} {"train_loss": -10.1522855758667, "global_step": 123827, "epoch": 737} {"train_loss": -10.401933670043945, "global_step": 123828, "epoch": 737} {"train_loss": -10.12009048461914, "global_step": 123829, "epoch": 737} {"train_loss": -10.132148742675781, "global_step": 123830, "epoch": 737} {"train_loss": -10.538976669311523, "global_step": 123831, "epoch": 737} {"train_loss": -10.483646392822266, "global_step": 123832, "epoch": 737} {"train_loss": -10.455236434936523, "global_step": 123833, "epoch": 737} {"train_loss": -10.326436996459961, "global_step": 123834, "epoch": 737} {"train_loss": -10.334869384765625, "global_step": 123835, "epoch": 737} {"train_loss": -10.203475952148438, "global_step": 123836, "epoch": 737} {"train_loss": -10.38005542755127, "global_step": 123837, "epoch": 737} {"train_loss": -10.083395004272461, "global_step": 123838, "epoch": 737} {"train_loss": -10.643102645874023, "global_step": 123839, "epoch": 737} {"train_loss": -10.404006004333496, "global_step": 123840, "epoch": 737} {"train_loss": -10.369650840759277, "global_step": 123841, "epoch": 737} {"train_loss": -10.121615409851074, "global_step": 123842, "epoch": 737} {"train_loss": -10.451526641845703, "global_step": 123843, "epoch": 737} {"train_loss": -10.05295181274414, "global_step": 123844, "epoch": 737} {"train_loss": -10.313762664794922, "global_step": 123845, "epoch": 737} {"train_loss": -10.427967071533203, "global_step": 123846, "epoch": 737} {"train_loss": -10.275579452514648, "global_step": 123847, "epoch": 737} {"train_loss": -10.417272567749023, "global_step": 123848, "epoch": 737} {"train_loss": -10.310188293457031, "global_step": 123849, "epoch": 737} {"train_loss": -10.025203704833984, "global_step": 123850, "epoch": 737} {"train_loss": -10.581653594970703, "global_step": 123851, "epoch": 737} {"train_loss": -9.902938842773438, "global_step": 123852, "epoch": 737} {"train_loss": -9.959317207336426, "global_step": 123853, "epoch": 737} {"train_loss": -10.339971542358398, "global_step": 123854, "epoch": 737} {"train_loss": -9.568519592285156, "global_step": 123855, "epoch": 737} {"train_loss": -10.295465469360352, "global_step": 123856, "epoch": 737} {"train_loss": -9.852898597717285, "global_step": 123857, "epoch": 737} {"train_loss": -9.948726654052734, "global_step": 123858, "epoch": 737} {"train_loss": -10.146474838256836, "global_step": 123859, "epoch": 737} {"train_loss": -9.565011978149414, "global_step": 123860, "epoch": 737} {"train_loss": -10.130698204040527, "global_step": 123861, "epoch": 737} {"train_loss": -9.57786750793457, "global_step": 123862, "epoch": 737} {"train_loss": -9.743217468261719, "global_step": 123863, "epoch": 737} {"train_loss": -9.660847663879395, "global_step": 123864, "epoch": 737} {"train_loss": -9.237189292907715, "global_step": 123865, "epoch": 737} {"train_loss": -10.023077011108398, "global_step": 123866, "epoch": 737} {"train_loss": -9.671741485595703, "global_step": 123867, "epoch": 737} {"train_loss": -9.53875732421875, "global_step": 123868, "epoch": 737} {"train_loss": -9.231801986694336, "global_step": 123869, "epoch": 737} {"train_loss": -9.684072494506836, "global_step": 123870, "epoch": 737} {"train_loss": -9.880364418029785, "global_step": 123871, "epoch": 737} {"train_loss": -9.756169319152832, "global_step": 123872, "epoch": 737} {"train_loss": -9.29867172241211, "global_step": 123873, "epoch": 737} {"train_loss": -10.076984405517578, "global_step": 123874, "epoch": 737} {"train_loss": -9.170417785644531, "global_step": 123875, "epoch": 737} {"train_loss": -10.06842041015625, "global_step": 123876, "epoch": 737} {"train_loss": -10.010878562927246, "global_step": 123877, "epoch": 737} {"train_loss": -9.88425350189209, "global_step": 123878, "epoch": 737} {"train_loss": -9.832917213439941, "global_step": 123879, "epoch": 737} {"train_loss": -10.100006103515625, "global_step": 123880, "epoch": 737} {"train_loss": -10.066871643066406, "global_step": 123881, "epoch": 737} {"train_loss": -9.916955947875977, "global_step": 123882, "epoch": 737} {"train_loss": -9.981254577636719, "global_step": 123883, "epoch": 737} {"train_loss": -10.009810447692871, "global_step": 123884, "epoch": 737} {"train_loss": -10.103992462158203, "global_step": 123885, "epoch": 737} {"train_loss": -9.99382209777832, "global_step": 123886, "epoch": 737} {"train_loss": -10.175682067871094, "global_step": 123887, "epoch": 737} {"train_loss": -10.055943489074707, "global_step": 123888, "epoch": 737} {"train_loss": -10.04974365234375, "global_step": 123889, "epoch": 737} {"train_loss": -10.116695404052734, "global_step": 123890, "epoch": 737} {"train_loss": -10.161825180053711, "global_step": 123891, "epoch": 737} {"train_loss": -10.067176818847656, "global_step": 123892, "epoch": 737} {"train_loss": -10.443899154663086, "global_step": 123893, "epoch": 737} {"train_loss": -10.149389266967773, "global_step": 123894, "epoch": 737} {"train_loss": -10.282266616821289, "global_step": 123895, "epoch": 737} {"train_loss": -10.427048683166504, "global_step": 123896, "epoch": 737} {"train_loss": -10.489788055419922, "global_step": 123897, "epoch": 737} {"train_loss": -10.28628158569336, "global_step": 123898, "epoch": 737} {"train_loss": -10.369294166564941, "global_step": 123899, "epoch": 737} {"train_loss": -10.345399856567383, "global_step": 123900, "epoch": 737} {"train_loss": -10.563660621643066, "global_step": 123901, "epoch": 737} {"train_loss": -10.451264381408691, "global_step": 123902, "epoch": 737} {"train_loss": -10.535056114196777, "global_step": 123903, "epoch": 737} {"train_loss": -10.456232070922852, "global_step": 123904, "epoch": 737} {"train_loss": -10.332735061645508, "global_step": 123905, "epoch": 737} {"train_loss": -10.345203399658203, "global_step": 123906, "epoch": 737} {"train_loss": -10.358560562133789, "global_step": 123907, "epoch": 737} {"train_loss": -10.576020240783691, "global_step": 123908, "epoch": 737} {"train_loss": -10.253968238830566, "global_step": 123909, "epoch": 737} {"train_loss": -10.455921173095703, "global_step": 123910, "epoch": 737} {"train_loss": -10.37576961517334, "global_step": 123911, "epoch": 737} {"train_loss": -10.34918212890625, "global_step": 123912, "epoch": 737} {"train_loss": -10.315881729125977, "global_step": 123913, "epoch": 737} {"train_loss": -10.717035293579102, "global_step": 123914, "epoch": 737} {"train_loss": -10.246135711669922, "global_step": 123915, "epoch": 737} {"train_loss": -10.329578399658203, "global_step": 123916, "epoch": 737} {"train_loss": -10.274312973022461, "global_step": 123917, "epoch": 737} {"train_loss": -10.052749633789062, "global_step": 123918, "epoch": 737} {"train_loss": -10.50831127166748, "global_step": 123919, "epoch": 737} {"train_loss": -10.249364852905273, "global_step": 123920, "epoch": 737} {"train_loss": -10.565451622009277, "global_step": 123921, "epoch": 737} {"train_loss": -10.41152572631836, "global_step": 123922, "epoch": 737} {"train_loss": -10.519149780273438, "global_step": 123923, "epoch": 737} {"train_loss": -10.510133743286133, "global_step": 123924, "epoch": 737} {"train_loss": -10.531665802001953, "global_step": 123925, "epoch": 737} {"train_loss": -10.259532928466797, "global_step": 123926, "epoch": 737} {"train_loss": -10.225727081298828, "global_step": 123927, "epoch": 737} {"train_loss": -10.120441436767578, "global_step": 123928, "epoch": 737} {"train_loss": -9.63561725616455, "global_step": 123929, "epoch": 737} {"train_loss": -10.011886596679688, "global_step": 123930, "epoch": 737} {"train_loss": -9.558552742004395, "global_step": 123931, "epoch": 737} {"train_loss": -10.207683563232422, "global_step": 123932, "epoch": 737} {"train_loss": -9.848941802978516, "global_step": 123933, "epoch": 737} {"train_loss": -9.881306648254395, "global_step": 123934, "epoch": 737} {"train_loss": -9.630539894104004, "global_step": 123935, "epoch": 737} {"train_loss": -10.094200134277344, "global_step": 123936, "epoch": 737} {"train_loss": -9.898451805114746, "global_step": 123937, "epoch": 737} {"train_loss": -9.696046829223633, "global_step": 123938, "epoch": 737} {"train_loss": -9.899727821350098, "global_step": 123939, "epoch": 737} {"train_loss": -9.942925453186035, "global_step": 123940, "epoch": 737} {"train_loss": -9.748717308044434, "global_step": 123941, "epoch": 737} {"train_loss": -10.409162521362305, "global_step": 123942, "epoch": 737} {"train_loss": -9.951273918151855, "global_step": 123943, "epoch": 737} {"train_loss": -10.04165267944336, "global_step": 123944, "epoch": 737} {"train_loss": -9.895868301391602, "global_step": 123945, "epoch": 737} {"train_loss": -9.643157005310059, "global_step": 123946, "epoch": 737} {"train_loss": -10.413703918457031, "global_step": 123947, "epoch": 737} {"train_loss": -9.538822174072266, "global_step": 123948, "epoch": 737} {"train_loss": -10.2446870803833, "global_step": 123949, "epoch": 737} {"train_loss": -9.925285339355469, "global_step": 123950, "epoch": 737} {"train_loss": -9.91729736328125, "global_step": 123951, "epoch": 737} {"train_loss": -10.005245208740234, "global_step": 123952, "epoch": 737} {"train_loss": -10.018590927124023, "global_step": 123953, "epoch": 737} {"train_loss": -9.826776504516602, "global_step": 123954, "epoch": 737} {"train_loss": -9.847490310668945, "global_step": 123955, "epoch": 737} {"train_loss": -10.097654342651367, "global_step": 123956, "epoch": 737} {"train_loss": -10.153892517089844, "global_step": 123957, "epoch": 737} {"train_loss": -9.820505142211914, "global_step": 123958, "epoch": 737} {"train_loss": -10.13752555847168, "global_step": 123959, "epoch": 737} {"train_loss": -9.966497421264648, "global_step": 123960, "epoch": 737} {"train_loss": -10.06259822845459, "global_step": 123961, "epoch": 737} {"train_loss": -10.272217750549316, "global_step": 123962, "epoch": 737} {"train_loss": -10.020692825317383, "global_step": 123963, "epoch": 737} {"train_loss": -10.053468704223633, "global_step": 123964, "epoch": 737} {"train_loss": -10.217863082885742, "global_step": 123965, "epoch": 737} {"train_loss": -10.066588401794434, "global_step": 123966, "epoch": 737} {"train_loss": -9.911725044250488, "global_step": 123967, "epoch": 737} {"train_loss": -10.094367980957031, "global_step": 123968, "epoch": 737} {"train_loss": -9.915166854858398, "global_step": 123969, "epoch": 737} {"train_loss": -9.859506607055664, "global_step": 123970, "epoch": 737} {"train_loss": -10.009456634521484, "global_step": 123971, "epoch": 737} {"train_loss": -9.788250923156738, "global_step": 123972, "epoch": 737} {"train_loss": -9.799091339111328, "global_step": 123973, "epoch": 737} {"train_loss": -10.253910064697266, "global_step": 123974, "epoch": 737} {"train_loss": -9.757617950439453, "global_step": 123975, "epoch": 737} {"train_loss": -10.008315086364746, "global_step": 123976, "epoch": 737} {"train_loss": -9.95804500579834, "global_step": 123977, "epoch": 737} {"train_loss": -10.10372257232666, "global_step": 123978, "epoch": 737} {"train_loss": -9.960626602172852, "global_step": 123979, "epoch": 737} {"train_loss": -10.264182090759277, "global_step": 123980, "epoch": 737} {"train_loss": -10.205991744995117, "global_step": 123981, "epoch": 737} {"train_loss": -10.265325546264648, "global_step": 123982, "epoch": 737} {"train_loss": -10.100442460605077, "global_step": 123983, "epoch": 737, "val_loss": 216489.9375} {"train_loss": -10.41324520111084, "global_step": 123984, "epoch": 738} {"train_loss": -10.023069381713867, "global_step": 123985, "epoch": 738} {"train_loss": -10.298879623413086, "global_step": 123986, "epoch": 738} {"train_loss": -10.079776763916016, "global_step": 123987, "epoch": 738} {"train_loss": -10.293201446533203, "global_step": 123988, "epoch": 738} {"train_loss": -10.005573272705078, "global_step": 123989, "epoch": 738} {"train_loss": -10.244190216064453, "global_step": 123990, "epoch": 738} {"train_loss": -10.197677612304688, "global_step": 123991, "epoch": 738} {"train_loss": -10.245408058166504, "global_step": 123992, "epoch": 738} {"train_loss": -10.262741088867188, "global_step": 123993, "epoch": 738} {"train_loss": -10.409561157226562, "global_step": 123994, "epoch": 738} {"train_loss": -10.176807403564453, "global_step": 123995, "epoch": 738} {"train_loss": -10.503326416015625, "global_step": 123996, "epoch": 738} {"train_loss": -10.421072006225586, "global_step": 123997, "epoch": 738} {"train_loss": -10.551161766052246, "global_step": 123998, "epoch": 738} {"train_loss": -10.38984489440918, "global_step": 123999, "epoch": 738} {"train_loss": -10.227824211120605, "global_step": 124000, "epoch": 738} {"train_loss": -10.515302658081055, "global_step": 124001, "epoch": 738} {"train_loss": -10.253393173217773, "global_step": 124002, "epoch": 738} {"train_loss": -10.385919570922852, "global_step": 124003, "epoch": 738} {"train_loss": -10.34321403503418, "global_step": 124004, "epoch": 738} {"train_loss": -10.307470321655273, "global_step": 124005, "epoch": 738} {"train_loss": -10.439399719238281, "global_step": 124006, "epoch": 738} {"train_loss": -10.419898986816406, "global_step": 124007, "epoch": 738} {"train_loss": -10.538435935974121, "global_step": 124008, "epoch": 738} {"train_loss": -9.850133895874023, "global_step": 124009, "epoch": 738} {"train_loss": -10.460954666137695, "global_step": 124010, "epoch": 738} {"train_loss": -10.24106216430664, "global_step": 124011, "epoch": 738} {"train_loss": -9.881912231445312, "global_step": 124012, "epoch": 738} {"train_loss": -9.665027618408203, "global_step": 124013, "epoch": 738} {"train_loss": -9.986672401428223, "global_step": 124014, "epoch": 738} {"train_loss": -10.211463928222656, "global_step": 124015, "epoch": 738} {"train_loss": -9.682937622070312, "global_step": 124016, "epoch": 738} {"train_loss": -10.209676742553711, "global_step": 124017, "epoch": 738} {"train_loss": -9.856582641601562, "global_step": 124018, "epoch": 738} {"train_loss": -10.002664566040039, "global_step": 124019, "epoch": 738} {"train_loss": -9.87561321258545, "global_step": 124020, "epoch": 738} {"train_loss": -10.019495964050293, "global_step": 124021, "epoch": 738} {"train_loss": -9.632972717285156, "global_step": 124022, "epoch": 738} {"train_loss": -9.943347930908203, "global_step": 124023, "epoch": 738} {"train_loss": -10.289884567260742, "global_step": 124024, "epoch": 738} {"train_loss": -10.097087860107422, "global_step": 124025, "epoch": 738} {"train_loss": -9.937766075134277, "global_step": 124026, "epoch": 738} {"train_loss": -9.981706619262695, "global_step": 124027, "epoch": 738} {"train_loss": -9.683612823486328, "global_step": 124028, "epoch": 738} {"train_loss": -9.913095474243164, "global_step": 124029, "epoch": 738} {"train_loss": -9.25747299194336, "global_step": 124030, "epoch": 738} {"train_loss": -9.649513244628906, "global_step": 124031, "epoch": 738} {"train_loss": -9.526387214660645, "global_step": 124032, "epoch": 738} {"train_loss": -10.02249526977539, "global_step": 124033, "epoch": 738} {"train_loss": -9.38293743133545, "global_step": 124034, "epoch": 738} {"train_loss": -10.03062629699707, "global_step": 124035, "epoch": 738} {"train_loss": -9.948083877563477, "global_step": 124036, "epoch": 738} {"train_loss": -10.107156753540039, "global_step": 124037, "epoch": 738} {"train_loss": -10.130786895751953, "global_step": 124038, "epoch": 738} {"train_loss": -10.157379150390625, "global_step": 124039, "epoch": 738} {"train_loss": -10.155951499938965, "global_step": 124040, "epoch": 738} {"train_loss": -10.023645401000977, "global_step": 124041, "epoch": 738} {"train_loss": -10.016773223876953, "global_step": 124042, "epoch": 738} {"train_loss": -10.175844192504883, "global_step": 124043, "epoch": 738} {"train_loss": -10.225116729736328, "global_step": 124044, "epoch": 738} {"train_loss": -10.08855152130127, "global_step": 124045, "epoch": 738} {"train_loss": -10.15625, "global_step": 124046, "epoch": 738} {"train_loss": -10.0927152633667, "global_step": 124047, "epoch": 738} {"train_loss": -10.186201095581055, "global_step": 124048, "epoch": 738} {"train_loss": -9.944573402404785, "global_step": 124049, "epoch": 738} {"train_loss": -9.977029800415039, "global_step": 124050, "epoch": 738} {"train_loss": -10.10359001159668, "global_step": 124051, "epoch": 738} {"train_loss": -10.194937705993652, "global_step": 124052, "epoch": 738} {"train_loss": -10.415031433105469, "global_step": 124053, "epoch": 738} {"train_loss": -10.121051788330078, "global_step": 124054, "epoch": 738} {"train_loss": -10.450983047485352, "global_step": 124055, "epoch": 738} {"train_loss": -10.062284469604492, "global_step": 124056, "epoch": 738} {"train_loss": -10.167827606201172, "global_step": 124057, "epoch": 738} {"train_loss": -10.17016887664795, "global_step": 124058, "epoch": 738} {"train_loss": -10.412952423095703, "global_step": 124059, "epoch": 738} {"train_loss": -9.851068496704102, "global_step": 124060, "epoch": 738} {"train_loss": -9.909370422363281, "global_step": 124061, "epoch": 738} {"train_loss": -10.103611946105957, "global_step": 124062, "epoch": 738} {"train_loss": -10.046640396118164, "global_step": 124063, "epoch": 738} {"train_loss": -10.153974533081055, "global_step": 124064, "epoch": 738} {"train_loss": -10.159870147705078, "global_step": 124065, "epoch": 738} {"train_loss": -10.391458511352539, "global_step": 124066, "epoch": 738} {"train_loss": -10.169210433959961, "global_step": 124067, "epoch": 738} {"train_loss": -10.123174667358398, "global_step": 124068, "epoch": 738} {"train_loss": -9.76026725769043, "global_step": 124069, "epoch": 738} {"train_loss": -10.272932052612305, "global_step": 124070, "epoch": 738} {"train_loss": -10.116756439208984, "global_step": 124071, "epoch": 738} {"train_loss": -10.334444999694824, "global_step": 124072, "epoch": 738} {"train_loss": -10.304615020751953, "global_step": 124073, "epoch": 738} {"train_loss": -9.937501907348633, "global_step": 124074, "epoch": 738} {"train_loss": -10.356714248657227, "global_step": 124075, "epoch": 738} {"train_loss": -9.844436645507812, "global_step": 124076, "epoch": 738} {"train_loss": -10.0191650390625, "global_step": 124077, "epoch": 738} {"train_loss": -10.369762420654297, "global_step": 124078, "epoch": 738} {"train_loss": -9.114017486572266, "global_step": 124079, "epoch": 738} {"train_loss": -9.442957878112793, "global_step": 124080, "epoch": 738} {"train_loss": -8.623941421508789, "global_step": 124081, "epoch": 738} {"train_loss": -9.203714370727539, "global_step": 124082, "epoch": 738} {"train_loss": -9.436553001403809, "global_step": 124083, "epoch": 738} {"train_loss": -9.689715385437012, "global_step": 124084, "epoch": 738} {"train_loss": -9.150793075561523, "global_step": 124085, "epoch": 738} {"train_loss": -10.07845401763916, "global_step": 124086, "epoch": 738} {"train_loss": -9.056211471557617, "global_step": 124087, "epoch": 738} {"train_loss": -9.553557395935059, "global_step": 124088, "epoch": 738} {"train_loss": -9.92718505859375, "global_step": 124089, "epoch": 738} {"train_loss": -9.467551231384277, "global_step": 124090, "epoch": 738} {"train_loss": -9.13206672668457, "global_step": 124091, "epoch": 738} {"train_loss": -9.938121795654297, "global_step": 124092, "epoch": 738} {"train_loss": -10.028556823730469, "global_step": 124093, "epoch": 738} {"train_loss": -9.431620597839355, "global_step": 124094, "epoch": 738} {"train_loss": -9.842811584472656, "global_step": 124095, "epoch": 738} {"train_loss": -10.192708015441895, "global_step": 124096, "epoch": 738} {"train_loss": -10.012229919433594, "global_step": 124097, "epoch": 738} {"train_loss": -9.770833969116211, "global_step": 124098, "epoch": 738} {"train_loss": -10.017292976379395, "global_step": 124099, "epoch": 738} {"train_loss": -9.860550880432129, "global_step": 124100, "epoch": 738} {"train_loss": -9.911787033081055, "global_step": 124101, "epoch": 738} {"train_loss": -9.596941947937012, "global_step": 124102, "epoch": 738} {"train_loss": -10.041929244995117, "global_step": 124103, "epoch": 738} {"train_loss": -9.839624404907227, "global_step": 124104, "epoch": 738} {"train_loss": -10.00775146484375, "global_step": 124105, "epoch": 738} {"train_loss": -9.9168701171875, "global_step": 124106, "epoch": 738} {"train_loss": -10.102566719055176, "global_step": 124107, "epoch": 738} {"train_loss": -10.150657653808594, "global_step": 124108, "epoch": 738} {"train_loss": -10.152088165283203, "global_step": 124109, "epoch": 738} {"train_loss": -10.16064453125, "global_step": 124110, "epoch": 738} {"train_loss": -10.17485523223877, "global_step": 124111, "epoch": 738} {"train_loss": -10.246160507202148, "global_step": 124112, "epoch": 738} {"train_loss": -9.993355751037598, "global_step": 124113, "epoch": 738} {"train_loss": -10.312152862548828, "global_step": 124114, "epoch": 738} {"train_loss": -10.132987976074219, "global_step": 124115, "epoch": 738} {"train_loss": -10.349405288696289, "global_step": 124116, "epoch": 738} {"train_loss": -10.375748634338379, "global_step": 124117, "epoch": 738} {"train_loss": -10.270362854003906, "global_step": 124118, "epoch": 738} {"train_loss": -10.237603187561035, "global_step": 124119, "epoch": 738} {"train_loss": -10.441025733947754, "global_step": 124120, "epoch": 738} {"train_loss": -10.352985382080078, "global_step": 124121, "epoch": 738} {"train_loss": -10.156126022338867, "global_step": 124122, "epoch": 738} {"train_loss": -10.248431205749512, "global_step": 124123, "epoch": 738} {"train_loss": -10.158605575561523, "global_step": 124124, "epoch": 738} {"train_loss": -10.116754531860352, "global_step": 124125, "epoch": 738} {"train_loss": -10.343585968017578, "global_step": 124126, "epoch": 738} {"train_loss": -10.343231201171875, "global_step": 124127, "epoch": 738} {"train_loss": -10.50537395477295, "global_step": 124128, "epoch": 738} {"train_loss": -10.571191787719727, "global_step": 124129, "epoch": 738} {"train_loss": -10.605504035949707, "global_step": 124130, "epoch": 738} {"train_loss": -10.541440963745117, "global_step": 124131, "epoch": 738} {"train_loss": -10.650741577148438, "global_step": 124132, "epoch": 738} {"train_loss": -10.550151824951172, "global_step": 124133, "epoch": 738} {"train_loss": -10.76652717590332, "global_step": 124134, "epoch": 738} {"train_loss": -10.66642951965332, "global_step": 124135, "epoch": 738} {"train_loss": -10.34796142578125, "global_step": 124136, "epoch": 738} {"train_loss": -10.576313018798828, "global_step": 124137, "epoch": 738} {"train_loss": -10.459683418273926, "global_step": 124138, "epoch": 738} {"train_loss": -10.394933700561523, "global_step": 124139, "epoch": 738} {"train_loss": -10.466849327087402, "global_step": 124140, "epoch": 738} {"train_loss": -10.426581382751465, "global_step": 124141, "epoch": 738} {"train_loss": -10.290353775024414, "global_step": 124142, "epoch": 738} {"train_loss": -10.358261108398438, "global_step": 124143, "epoch": 738} {"train_loss": -10.42514419555664, "global_step": 124144, "epoch": 738} {"train_loss": -10.250809669494629, "global_step": 124145, "epoch": 738} {"train_loss": -10.555795669555664, "global_step": 124146, "epoch": 738} {"train_loss": -10.454521179199219, "global_step": 124147, "epoch": 738} {"train_loss": -10.157453536987305, "global_step": 124148, "epoch": 738} {"train_loss": -10.224873542785645, "global_step": 124149, "epoch": 738} {"train_loss": -9.798229217529297, "global_step": 124150, "epoch": 738} {"train_loss": -10.095639279910497, "global_step": 124151, "epoch": 738, "val_loss": 218470.921875} {"train_loss": -10.351062774658203, "global_step": 124152, "epoch": 739} {"train_loss": -9.6963472366333, "global_step": 124153, "epoch": 739} {"train_loss": -9.774353981018066, "global_step": 124154, "epoch": 739} {"train_loss": -10.329021453857422, "global_step": 124155, "epoch": 739} {"train_loss": -9.5911865234375, "global_step": 124156, "epoch": 739} {"train_loss": -10.34168815612793, "global_step": 124157, "epoch": 739} {"train_loss": -10.21445083618164, "global_step": 124158, "epoch": 739} {"train_loss": -9.828094482421875, "global_step": 124159, "epoch": 739} {"train_loss": -9.935094833374023, "global_step": 124160, "epoch": 739} {"train_loss": -10.2110595703125, "global_step": 124161, "epoch": 739} {"train_loss": -9.970582008361816, "global_step": 124162, "epoch": 739} {"train_loss": -10.50566291809082, "global_step": 124163, "epoch": 739} {"train_loss": -10.148611068725586, "global_step": 124164, "epoch": 739} {"train_loss": -10.275140762329102, "global_step": 124165, "epoch": 739} {"train_loss": -10.271965026855469, "global_step": 124166, "epoch": 739} {"train_loss": -10.472113609313965, "global_step": 124167, "epoch": 739} {"train_loss": -10.384173393249512, "global_step": 124168, "epoch": 739} {"train_loss": -10.15135669708252, "global_step": 124169, "epoch": 739} {"train_loss": -10.298089981079102, "global_step": 124170, "epoch": 739} {"train_loss": -10.285481452941895, "global_step": 124171, "epoch": 739} {"train_loss": -10.026246070861816, "global_step": 124172, "epoch": 739} {"train_loss": -10.32882308959961, "global_step": 124173, "epoch": 739} {"train_loss": -10.071352005004883, "global_step": 124174, "epoch": 739} {"train_loss": -9.936230659484863, "global_step": 124175, "epoch": 739} {"train_loss": -10.205679893493652, "global_step": 124176, "epoch": 739} {"train_loss": -9.768487930297852, "global_step": 124177, "epoch": 739} {"train_loss": -10.039480209350586, "global_step": 124178, "epoch": 739} {"train_loss": -9.175716400146484, "global_step": 124179, "epoch": 739} {"train_loss": -8.850479125976562, "global_step": 124180, "epoch": 739} {"train_loss": -9.53322696685791, "global_step": 124181, "epoch": 739} {"train_loss": -9.221433639526367, "global_step": 124182, "epoch": 739} {"train_loss": -8.793581008911133, "global_step": 124183, "epoch": 739} {"train_loss": -9.719583511352539, "global_step": 124184, "epoch": 739} {"train_loss": -9.257761001586914, "global_step": 124185, "epoch": 739} {"train_loss": -9.04887580871582, "global_step": 124186, "epoch": 739} {"train_loss": -9.620436668395996, "global_step": 124187, "epoch": 739} {"train_loss": -9.590873718261719, "global_step": 124188, "epoch": 739} {"train_loss": -9.796873092651367, "global_step": 124189, "epoch": 739} {"train_loss": -9.597240447998047, "global_step": 124190, "epoch": 739} {"train_loss": -9.632009506225586, "global_step": 124191, "epoch": 739} {"train_loss": -9.802406311035156, "global_step": 124192, "epoch": 739} {"train_loss": -9.73184585571289, "global_step": 124193, "epoch": 739} {"train_loss": -10.055468559265137, "global_step": 124194, "epoch": 739} {"train_loss": -9.475533485412598, "global_step": 124195, "epoch": 739} {"train_loss": -10.156394004821777, "global_step": 124196, "epoch": 739} {"train_loss": -9.693233489990234, "global_step": 124197, "epoch": 739} {"train_loss": -9.789656639099121, "global_step": 124198, "epoch": 739} {"train_loss": -9.961318016052246, "global_step": 124199, "epoch": 739} {"train_loss": -10.035593032836914, "global_step": 124200, "epoch": 739} {"train_loss": -10.067282676696777, "global_step": 124201, "epoch": 739} {"train_loss": -9.755718231201172, "global_step": 124202, "epoch": 739} {"train_loss": -10.059152603149414, "global_step": 124203, "epoch": 739} {"train_loss": -10.109909057617188, "global_step": 124204, "epoch": 739} {"train_loss": -9.847723007202148, "global_step": 124205, "epoch": 739} {"train_loss": -10.240621566772461, "global_step": 124206, "epoch": 739} {"train_loss": -10.09494400024414, "global_step": 124207, "epoch": 739} {"train_loss": -10.246840476989746, "global_step": 124208, "epoch": 739} {"train_loss": -10.246295928955078, "global_step": 124209, "epoch": 739} {"train_loss": -10.171904563903809, "global_step": 124210, "epoch": 739} {"train_loss": -10.06856918334961, "global_step": 124211, "epoch": 739} {"train_loss": -10.31985092163086, "global_step": 124212, "epoch": 739} {"train_loss": -10.056500434875488, "global_step": 124213, "epoch": 739} {"train_loss": -10.100850105285645, "global_step": 124214, "epoch": 739} {"train_loss": -10.461750030517578, "global_step": 124215, "epoch": 739} {"train_loss": -10.426366806030273, "global_step": 124216, "epoch": 739} {"train_loss": -10.248218536376953, "global_step": 124217, "epoch": 739} {"train_loss": -10.221165657043457, "global_step": 124218, "epoch": 739} {"train_loss": -10.307576179504395, "global_step": 124219, "epoch": 739} {"train_loss": -10.187973022460938, "global_step": 124220, "epoch": 739} {"train_loss": -10.346785545349121, "global_step": 124221, "epoch": 739} {"train_loss": -10.27447509765625, "global_step": 124222, "epoch": 739} {"train_loss": -10.534547805786133, "global_step": 124223, "epoch": 739} {"train_loss": -10.456304550170898, "global_step": 124224, "epoch": 739} {"train_loss": -10.458089828491211, "global_step": 124225, "epoch": 739} {"train_loss": -10.558440208435059, "global_step": 124226, "epoch": 739} {"train_loss": -10.597906112670898, "global_step": 124227, "epoch": 739} {"train_loss": -10.508516311645508, "global_step": 124228, "epoch": 739} {"train_loss": -10.57328987121582, "global_step": 124229, "epoch": 739} {"train_loss": -10.31820011138916, "global_step": 124230, "epoch": 739} {"train_loss": -10.78573226928711, "global_step": 124231, "epoch": 739} {"train_loss": -10.615974426269531, "global_step": 124232, "epoch": 739} {"train_loss": -10.631014823913574, "global_step": 124233, "epoch": 739} {"train_loss": -10.581327438354492, "global_step": 124234, "epoch": 739} {"train_loss": -10.69808578491211, "global_step": 124235, "epoch": 739} {"train_loss": -10.615877151489258, "global_step": 124236, "epoch": 739} {"train_loss": -10.655889511108398, "global_step": 124237, "epoch": 739} {"train_loss": -10.680399894714355, "global_step": 124238, "epoch": 739} {"train_loss": -10.48763656616211, "global_step": 124239, "epoch": 739} {"train_loss": -10.484987258911133, "global_step": 124240, "epoch": 739} {"train_loss": -10.404449462890625, "global_step": 124241, "epoch": 739} {"train_loss": -10.53674602508545, "global_step": 124242, "epoch": 739} {"train_loss": -10.35641860961914, "global_step": 124243, "epoch": 739} {"train_loss": -10.690507888793945, "global_step": 124244, "epoch": 739} {"train_loss": -10.330162048339844, "global_step": 124245, "epoch": 739} {"train_loss": -9.785139083862305, "global_step": 124246, "epoch": 739} {"train_loss": -9.392719268798828, "global_step": 124247, "epoch": 739} {"train_loss": -9.962652206420898, "global_step": 124248, "epoch": 739} {"train_loss": -10.616109848022461, "global_step": 124249, "epoch": 739} {"train_loss": -9.348772048950195, "global_step": 124250, "epoch": 739} {"train_loss": -9.905232429504395, "global_step": 124251, "epoch": 739} {"train_loss": -9.990310668945312, "global_step": 124252, "epoch": 739} {"train_loss": -9.707198143005371, "global_step": 124253, "epoch": 739} {"train_loss": -9.755498886108398, "global_step": 124254, "epoch": 739} {"train_loss": -10.299243927001953, "global_step": 124255, "epoch": 739} {"train_loss": -9.046337127685547, "global_step": 124256, "epoch": 739} {"train_loss": -10.163703918457031, "global_step": 124257, "epoch": 739} {"train_loss": -9.635232925415039, "global_step": 124258, "epoch": 739} {"train_loss": -9.94876766204834, "global_step": 124259, "epoch": 739} {"train_loss": -10.046506881713867, "global_step": 124260, "epoch": 739} {"train_loss": -9.129403114318848, "global_step": 124261, "epoch": 739} {"train_loss": -10.083584785461426, "global_step": 124262, "epoch": 739} {"train_loss": -9.49690055847168, "global_step": 124263, "epoch": 739} {"train_loss": -9.80728530883789, "global_step": 124264, "epoch": 739} {"train_loss": -9.498884201049805, "global_step": 124265, "epoch": 739} {"train_loss": -9.979103088378906, "global_step": 124266, "epoch": 739} {"train_loss": -9.953874588012695, "global_step": 124267, "epoch": 739} {"train_loss": -9.964567184448242, "global_step": 124268, "epoch": 739} {"train_loss": -10.043722152709961, "global_step": 124269, "epoch": 739} {"train_loss": -9.962457656860352, "global_step": 124270, "epoch": 739} {"train_loss": -9.993795394897461, "global_step": 124271, "epoch": 739} {"train_loss": -9.989652633666992, "global_step": 124272, "epoch": 739} {"train_loss": -10.013670921325684, "global_step": 124273, "epoch": 739} {"train_loss": -10.299365043640137, "global_step": 124274, "epoch": 739} {"train_loss": -10.107076644897461, "global_step": 124275, "epoch": 739} {"train_loss": -10.144940376281738, "global_step": 124276, "epoch": 739} {"train_loss": -10.31064510345459, "global_step": 124277, "epoch": 739} {"train_loss": -10.242833137512207, "global_step": 124278, "epoch": 739} {"train_loss": -10.284193992614746, "global_step": 124279, "epoch": 739} {"train_loss": -10.37129020690918, "global_step": 124280, "epoch": 739} {"train_loss": -10.226381301879883, "global_step": 124281, "epoch": 739} {"train_loss": -10.062906265258789, "global_step": 124282, "epoch": 739} {"train_loss": -10.178650856018066, "global_step": 124283, "epoch": 739} {"train_loss": -10.17732048034668, "global_step": 124284, "epoch": 739} {"train_loss": -10.186756134033203, "global_step": 124285, "epoch": 739} {"train_loss": -10.336116790771484, "global_step": 124286, "epoch": 739} {"train_loss": -10.092764854431152, "global_step": 124287, "epoch": 739} {"train_loss": -10.21246337890625, "global_step": 124288, "epoch": 739} {"train_loss": -10.225975036621094, "global_step": 124289, "epoch": 739} {"train_loss": -10.145915985107422, "global_step": 124290, "epoch": 739} {"train_loss": -10.335214614868164, "global_step": 124291, "epoch": 739} {"train_loss": -10.306835174560547, "global_step": 124292, "epoch": 739} {"train_loss": -10.209888458251953, "global_step": 124293, "epoch": 739} {"train_loss": -10.319849967956543, "global_step": 124294, "epoch": 739} {"train_loss": -10.356075286865234, "global_step": 124295, "epoch": 739} {"train_loss": -10.301298141479492, "global_step": 124296, "epoch": 739} {"train_loss": -10.203067779541016, "global_step": 124297, "epoch": 739} {"train_loss": -10.427359580993652, "global_step": 124298, "epoch": 739} {"train_loss": -10.2810697555542, "global_step": 124299, "epoch": 739} {"train_loss": -10.274658203125, "global_step": 124300, "epoch": 739} {"train_loss": -10.31878662109375, "global_step": 124301, "epoch": 739} {"train_loss": -10.338369369506836, "global_step": 124302, "epoch": 739} {"train_loss": -10.423332214355469, "global_step": 124303, "epoch": 739} {"train_loss": -10.255650520324707, "global_step": 124304, "epoch": 739} {"train_loss": -10.406099319458008, "global_step": 124305, "epoch": 739} {"train_loss": -10.324146270751953, "global_step": 124306, "epoch": 739} {"train_loss": -10.227697372436523, "global_step": 124307, "epoch": 739} {"train_loss": -10.279979705810547, "global_step": 124308, "epoch": 739} {"train_loss": -10.385025978088379, "global_step": 124309, "epoch": 739} {"train_loss": -10.260395050048828, "global_step": 124310, "epoch": 739} {"train_loss": -10.490468978881836, "global_step": 124311, "epoch": 739} {"train_loss": -10.271200180053711, "global_step": 124312, "epoch": 739} {"train_loss": -10.444244384765625, "global_step": 124313, "epoch": 739} {"train_loss": -10.291717529296875, "global_step": 124314, "epoch": 739} {"train_loss": -10.301163673400879, "global_step": 124315, "epoch": 739} {"train_loss": -10.3834810256958, "global_step": 124316, "epoch": 739} {"train_loss": -10.071548461914062, "global_step": 124317, "epoch": 739} {"train_loss": -10.342537879943848, "global_step": 124318, "epoch": 739} {"train_loss": -10.110573223658971, "global_step": 124319, "epoch": 739, "val_loss": 217259.9375} {"train_loss": -9.777896881103516, "global_step": 124320, "epoch": 740} {"train_loss": -10.402969360351562, "global_step": 124321, "epoch": 740} {"train_loss": -10.162884712219238, "global_step": 124322, "epoch": 740} {"train_loss": -9.61947250366211, "global_step": 124323, "epoch": 740} {"train_loss": -10.118326187133789, "global_step": 124324, "epoch": 740} {"train_loss": -10.100484848022461, "global_step": 124325, "epoch": 740} {"train_loss": -9.944931983947754, "global_step": 124326, "epoch": 740} {"train_loss": -10.367105484008789, "global_step": 124327, "epoch": 740} {"train_loss": -10.14045238494873, "global_step": 124328, "epoch": 740} {"train_loss": -9.953699111938477, "global_step": 124329, "epoch": 740} {"train_loss": -10.003633499145508, "global_step": 124330, "epoch": 740} {"train_loss": -9.968998908996582, "global_step": 124331, "epoch": 740} {"train_loss": -9.973529815673828, "global_step": 124332, "epoch": 740} {"train_loss": -10.021234512329102, "global_step": 124333, "epoch": 740} {"train_loss": -9.625442504882812, "global_step": 124334, "epoch": 740} {"train_loss": -10.04554557800293, "global_step": 124335, "epoch": 740} {"train_loss": -9.948700904846191, "global_step": 124336, "epoch": 740} {"train_loss": -10.18658447265625, "global_step": 124337, "epoch": 740} {"train_loss": -9.744306564331055, "global_step": 124338, "epoch": 740} {"train_loss": -10.075702667236328, "global_step": 124339, "epoch": 740} {"train_loss": -9.720636367797852, "global_step": 124340, "epoch": 740} {"train_loss": -10.255987167358398, "global_step": 124341, "epoch": 740} {"train_loss": -9.943546295166016, "global_step": 124342, "epoch": 740} {"train_loss": -10.113078117370605, "global_step": 124343, "epoch": 740} {"train_loss": -9.999034881591797, "global_step": 124344, "epoch": 740} {"train_loss": -10.282045364379883, "global_step": 124345, "epoch": 740} {"train_loss": -10.343314170837402, "global_step": 124346, "epoch": 740} {"train_loss": -10.034468650817871, "global_step": 124347, "epoch": 740} {"train_loss": -10.2310791015625, "global_step": 124348, "epoch": 740} {"train_loss": -9.896524429321289, "global_step": 124349, "epoch": 740} {"train_loss": -10.15411376953125, "global_step": 124350, "epoch": 740} {"train_loss": -10.261669158935547, "global_step": 124351, "epoch": 740} {"train_loss": -10.287959098815918, "global_step": 124352, "epoch": 740} {"train_loss": -10.052228927612305, "global_step": 124353, "epoch": 740} {"train_loss": -10.296239852905273, "global_step": 124354, "epoch": 740} {"train_loss": -10.05648136138916, "global_step": 124355, "epoch": 740} {"train_loss": -10.311513900756836, "global_step": 124356, "epoch": 740} {"train_loss": -10.23060417175293, "global_step": 124357, "epoch": 740} {"train_loss": -10.163738250732422, "global_step": 124358, "epoch": 740} {"train_loss": -10.320205688476562, "global_step": 124359, "epoch": 740} {"train_loss": -10.010498046875, "global_step": 124360, "epoch": 740} {"train_loss": -10.093101501464844, "global_step": 124361, "epoch": 740} {"train_loss": -10.212486267089844, "global_step": 124362, "epoch": 740} {"train_loss": -10.258925437927246, "global_step": 124363, "epoch": 740} {"train_loss": -10.271961212158203, "global_step": 124364, "epoch": 740} {"train_loss": -10.238264083862305, "global_step": 124365, "epoch": 740} {"train_loss": -10.179187774658203, "global_step": 124366, "epoch": 740} {"train_loss": -10.394437789916992, "global_step": 124367, "epoch": 740} {"train_loss": -10.2984619140625, "global_step": 124368, "epoch": 740} {"train_loss": -10.46744155883789, "global_step": 124369, "epoch": 740} {"train_loss": -10.102157592773438, "global_step": 124370, "epoch": 740} {"train_loss": -10.421001434326172, "global_step": 124371, "epoch": 740} {"train_loss": -10.155948638916016, "global_step": 124372, "epoch": 740} {"train_loss": -10.342214584350586, "global_step": 124373, "epoch": 740} {"train_loss": -10.429500579833984, "global_step": 124374, "epoch": 740} {"train_loss": -10.181127548217773, "global_step": 124375, "epoch": 740} {"train_loss": -10.41854476928711, "global_step": 124376, "epoch": 740} {"train_loss": -10.360563278198242, "global_step": 124377, "epoch": 740} {"train_loss": -10.219765663146973, "global_step": 124378, "epoch": 740} {"train_loss": -10.373143196105957, "global_step": 124379, "epoch": 740} {"train_loss": -10.325592994689941, "global_step": 124380, "epoch": 740} {"train_loss": -10.36174201965332, "global_step": 124381, "epoch": 740} {"train_loss": -10.11974048614502, "global_step": 124382, "epoch": 740} {"train_loss": -10.46268081665039, "global_step": 124383, "epoch": 740} {"train_loss": -10.403675079345703, "global_step": 124384, "epoch": 740} {"train_loss": -10.3209228515625, "global_step": 124385, "epoch": 740} {"train_loss": -10.680612564086914, "global_step": 124386, "epoch": 740} {"train_loss": -10.184822082519531, "global_step": 124387, "epoch": 740} {"train_loss": -10.39510726928711, "global_step": 124388, "epoch": 740} {"train_loss": -10.208333969116211, "global_step": 124389, "epoch": 740} {"train_loss": -10.119885444641113, "global_step": 124390, "epoch": 740} {"train_loss": -10.106863975524902, "global_step": 124391, "epoch": 740} {"train_loss": -10.249130249023438, "global_step": 124392, "epoch": 740} {"train_loss": -10.660096168518066, "global_step": 124393, "epoch": 740} {"train_loss": -10.382268905639648, "global_step": 124394, "epoch": 740} {"train_loss": -10.041150093078613, "global_step": 124395, "epoch": 740} {"train_loss": -10.355934143066406, "global_step": 124396, "epoch": 740} {"train_loss": -9.80868148803711, "global_step": 124397, "epoch": 740} {"train_loss": -10.183597564697266, "global_step": 124398, "epoch": 740} {"train_loss": -10.138025283813477, "global_step": 124399, "epoch": 740} {"train_loss": -9.825239181518555, "global_step": 124400, "epoch": 740} {"train_loss": -10.194929122924805, "global_step": 124401, "epoch": 740} {"train_loss": -10.307966232299805, "global_step": 124402, "epoch": 740} {"train_loss": -10.327249526977539, "global_step": 124403, "epoch": 740} {"train_loss": -10.544729232788086, "global_step": 124404, "epoch": 740} {"train_loss": -10.072525978088379, "global_step": 124405, "epoch": 740} {"train_loss": -10.438085556030273, "global_step": 124406, "epoch": 740} {"train_loss": -10.148770332336426, "global_step": 124407, "epoch": 740} {"train_loss": -10.120319366455078, "global_step": 124408, "epoch": 740} {"train_loss": -10.378789901733398, "global_step": 124409, "epoch": 740} {"train_loss": -10.086847305297852, "global_step": 124410, "epoch": 740} {"train_loss": -10.291573524475098, "global_step": 124411, "epoch": 740} {"train_loss": -10.456275939941406, "global_step": 124412, "epoch": 740} {"train_loss": -9.969178199768066, "global_step": 124413, "epoch": 740} {"train_loss": -10.431164741516113, "global_step": 124414, "epoch": 740} {"train_loss": -10.087636947631836, "global_step": 124415, "epoch": 740} {"train_loss": -10.124046325683594, "global_step": 124416, "epoch": 740} {"train_loss": -10.303112983703613, "global_step": 124417, "epoch": 740} {"train_loss": -10.10502815246582, "global_step": 124418, "epoch": 740} {"train_loss": -10.113083839416504, "global_step": 124419, "epoch": 740} {"train_loss": -10.103571891784668, "global_step": 124420, "epoch": 740} {"train_loss": -10.157414436340332, "global_step": 124421, "epoch": 740} {"train_loss": -10.267045021057129, "global_step": 124422, "epoch": 740} {"train_loss": -10.078330993652344, "global_step": 124423, "epoch": 740} {"train_loss": -10.05615234375, "global_step": 124424, "epoch": 740} {"train_loss": -10.137975692749023, "global_step": 124425, "epoch": 740} {"train_loss": -9.683006286621094, "global_step": 124426, "epoch": 740} {"train_loss": -10.273785591125488, "global_step": 124427, "epoch": 740} {"train_loss": -9.594770431518555, "global_step": 124428, "epoch": 740} {"train_loss": -10.021263122558594, "global_step": 124429, "epoch": 740} {"train_loss": -9.960857391357422, "global_step": 124430, "epoch": 740} {"train_loss": -9.830906867980957, "global_step": 124431, "epoch": 740} {"train_loss": -10.262052536010742, "global_step": 124432, "epoch": 740} {"train_loss": -9.832338333129883, "global_step": 124433, "epoch": 740} {"train_loss": -10.228516578674316, "global_step": 124434, "epoch": 740} {"train_loss": -9.905983924865723, "global_step": 124435, "epoch": 740} {"train_loss": -10.143267631530762, "global_step": 124436, "epoch": 740} {"train_loss": -10.07516098022461, "global_step": 124437, "epoch": 740} {"train_loss": -10.077122688293457, "global_step": 124438, "epoch": 740} {"train_loss": -9.978805541992188, "global_step": 124439, "epoch": 740} {"train_loss": -10.35616683959961, "global_step": 124440, "epoch": 740} {"train_loss": -9.942581176757812, "global_step": 124441, "epoch": 740} {"train_loss": -10.222222328186035, "global_step": 124442, "epoch": 740} {"train_loss": -10.104524612426758, "global_step": 124443, "epoch": 740} {"train_loss": -10.13609504699707, "global_step": 124444, "epoch": 740} {"train_loss": -10.019447326660156, "global_step": 124445, "epoch": 740} {"train_loss": -9.958425521850586, "global_step": 124446, "epoch": 740} {"train_loss": -10.275505065917969, "global_step": 124447, "epoch": 740} {"train_loss": -10.18547248840332, "global_step": 124448, "epoch": 740} {"train_loss": -10.11790943145752, "global_step": 124449, "epoch": 740} {"train_loss": -10.142740249633789, "global_step": 124450, "epoch": 740} {"train_loss": -10.012676239013672, "global_step": 124451, "epoch": 740} {"train_loss": -10.229310989379883, "global_step": 124452, "epoch": 740} {"train_loss": -10.129989624023438, "global_step": 124453, "epoch": 740} {"train_loss": -10.327293395996094, "global_step": 124454, "epoch": 740} {"train_loss": -10.361486434936523, "global_step": 124455, "epoch": 740} {"train_loss": -10.30009937286377, "global_step": 124456, "epoch": 740} {"train_loss": -10.355939865112305, "global_step": 124457, "epoch": 740} {"train_loss": -10.180368423461914, "global_step": 124458, "epoch": 740} {"train_loss": -10.177124977111816, "global_step": 124459, "epoch": 740} {"train_loss": -10.40955638885498, "global_step": 124460, "epoch": 740} {"train_loss": -10.311781883239746, "global_step": 124461, "epoch": 740} {"train_loss": -10.418203353881836, "global_step": 124462, "epoch": 740} {"train_loss": -10.112974166870117, "global_step": 124463, "epoch": 740} {"train_loss": -10.416866302490234, "global_step": 124464, "epoch": 740} {"train_loss": -10.415088653564453, "global_step": 124465, "epoch": 740} {"train_loss": -10.512320518493652, "global_step": 124466, "epoch": 740} {"train_loss": -10.481833457946777, "global_step": 124467, "epoch": 740} {"train_loss": -10.3702392578125, "global_step": 124468, "epoch": 740} {"train_loss": -10.54890251159668, "global_step": 124469, "epoch": 740} {"train_loss": -10.519964218139648, "global_step": 124470, "epoch": 740} {"train_loss": -10.494428634643555, "global_step": 124471, "epoch": 740} {"train_loss": -10.435680389404297, "global_step": 124472, "epoch": 740} {"train_loss": -10.33850383758545, "global_step": 124473, "epoch": 740} {"train_loss": -10.309015274047852, "global_step": 124474, "epoch": 740} {"train_loss": -10.426349639892578, "global_step": 124475, "epoch": 740} {"train_loss": -10.595626831054688, "global_step": 124476, "epoch": 740} {"train_loss": -10.276252746582031, "global_step": 124477, "epoch": 740} {"train_loss": -10.285228729248047, "global_step": 124478, "epoch": 740} {"train_loss": -10.648811340332031, "global_step": 124479, "epoch": 740} {"train_loss": -10.165822982788086, "global_step": 124480, "epoch": 740} {"train_loss": -10.476404190063477, "global_step": 124481, "epoch": 740} {"train_loss": -10.175464630126953, "global_step": 124482, "epoch": 740} {"train_loss": -10.417328834533691, "global_step": 124483, "epoch": 740} {"train_loss": -9.789888381958008, "global_step": 124484, "epoch": 740} {"train_loss": -9.814657211303711, "global_step": 124485, "epoch": 740} {"train_loss": -10.132275581359863, "global_step": 124486, "epoch": 740} {"train_loss": -10.192709582192558, "global_step": 124487, "epoch": 740, "val_loss": 218271.3125, "train_action_mse_error": 1.826215147972107} {"train_loss": -9.808847427368164, "global_step": 124488, "epoch": 741} {"train_loss": -10.240225791931152, "global_step": 124489, "epoch": 741} {"train_loss": -10.046102523803711, "global_step": 124490, "epoch": 741} {"train_loss": -10.003883361816406, "global_step": 124491, "epoch": 741} {"train_loss": -10.134611129760742, "global_step": 124492, "epoch": 741} {"train_loss": -9.920503616333008, "global_step": 124493, "epoch": 741} {"train_loss": -10.48898696899414, "global_step": 124494, "epoch": 741} {"train_loss": -10.001252174377441, "global_step": 124495, "epoch": 741} {"train_loss": -10.217090606689453, "global_step": 124496, "epoch": 741} {"train_loss": -10.00839900970459, "global_step": 124497, "epoch": 741} {"train_loss": -10.31258773803711, "global_step": 124498, "epoch": 741} {"train_loss": -10.288236618041992, "global_step": 124499, "epoch": 741} {"train_loss": -10.18548583984375, "global_step": 124500, "epoch": 741} {"train_loss": -10.193682670593262, "global_step": 124501, "epoch": 741} {"train_loss": -10.297601699829102, "global_step": 124502, "epoch": 741} {"train_loss": -10.190227508544922, "global_step": 124503, "epoch": 741} {"train_loss": -10.09968090057373, "global_step": 124504, "epoch": 741} {"train_loss": -10.388757705688477, "global_step": 124505, "epoch": 741} {"train_loss": -10.264801979064941, "global_step": 124506, "epoch": 741} {"train_loss": -10.13286018371582, "global_step": 124507, "epoch": 741} {"train_loss": -10.068645477294922, "global_step": 124508, "epoch": 741} {"train_loss": -9.703795433044434, "global_step": 124509, "epoch": 741} {"train_loss": -10.120304107666016, "global_step": 124510, "epoch": 741} {"train_loss": -9.814680099487305, "global_step": 124511, "epoch": 741} {"train_loss": -9.55392074584961, "global_step": 124512, "epoch": 741} {"train_loss": -9.779167175292969, "global_step": 124513, "epoch": 741} {"train_loss": -9.329103469848633, "global_step": 124514, "epoch": 741} {"train_loss": -10.004323959350586, "global_step": 124515, "epoch": 741} {"train_loss": -9.507488250732422, "global_step": 124516, "epoch": 741} {"train_loss": -10.401901245117188, "global_step": 124517, "epoch": 741} {"train_loss": -9.462788581848145, "global_step": 124518, "epoch": 741} {"train_loss": -10.315832138061523, "global_step": 124519, "epoch": 741} {"train_loss": -9.816450119018555, "global_step": 124520, "epoch": 741} {"train_loss": -10.231721878051758, "global_step": 124521, "epoch": 741} {"train_loss": -9.839704513549805, "global_step": 124522, "epoch": 741} {"train_loss": -9.994510650634766, "global_step": 124523, "epoch": 741} {"train_loss": -10.127723693847656, "global_step": 124524, "epoch": 741} {"train_loss": -10.024333953857422, "global_step": 124525, "epoch": 741} {"train_loss": -10.105645179748535, "global_step": 124526, "epoch": 741} {"train_loss": -10.325248718261719, "global_step": 124527, "epoch": 741} {"train_loss": -9.793380737304688, "global_step": 124528, "epoch": 741} {"train_loss": -9.642841339111328, "global_step": 124529, "epoch": 741} {"train_loss": -10.127429962158203, "global_step": 124530, "epoch": 741} {"train_loss": -9.803153991699219, "global_step": 124531, "epoch": 741} {"train_loss": -9.844478607177734, "global_step": 124532, "epoch": 741} {"train_loss": -9.70829963684082, "global_step": 124533, "epoch": 741} {"train_loss": -9.99155330657959, "global_step": 124534, "epoch": 741} {"train_loss": -9.894704818725586, "global_step": 124535, "epoch": 741} {"train_loss": -10.128759384155273, "global_step": 124536, "epoch": 741} {"train_loss": -9.854927062988281, "global_step": 124537, "epoch": 741} {"train_loss": -9.957568168640137, "global_step": 124538, "epoch": 741} {"train_loss": -10.196969032287598, "global_step": 124539, "epoch": 741} {"train_loss": -9.751394271850586, "global_step": 124540, "epoch": 741} {"train_loss": -10.320066452026367, "global_step": 124541, "epoch": 741} {"train_loss": -9.885986328125, "global_step": 124542, "epoch": 741} {"train_loss": -10.033182144165039, "global_step": 124543, "epoch": 741} {"train_loss": -10.052053451538086, "global_step": 124544, "epoch": 741} {"train_loss": -10.53272819519043, "global_step": 124545, "epoch": 741} {"train_loss": -10.067789077758789, "global_step": 124546, "epoch": 741} {"train_loss": -10.470704078674316, "global_step": 124547, "epoch": 741} {"train_loss": -10.381427764892578, "global_step": 124548, "epoch": 741} {"train_loss": -10.190792083740234, "global_step": 124549, "epoch": 741} {"train_loss": -10.08341121673584, "global_step": 124550, "epoch": 741} {"train_loss": -10.485618591308594, "global_step": 124551, "epoch": 741} {"train_loss": -10.145730972290039, "global_step": 124552, "epoch": 741} {"train_loss": -10.43545150756836, "global_step": 124553, "epoch": 741} {"train_loss": -10.217924118041992, "global_step": 124554, "epoch": 741} {"train_loss": -10.379378318786621, "global_step": 124555, "epoch": 741} {"train_loss": -10.531255722045898, "global_step": 124556, "epoch": 741} {"train_loss": -10.476242065429688, "global_step": 124557, "epoch": 741} {"train_loss": -10.08657169342041, "global_step": 124558, "epoch": 741} {"train_loss": -10.42684268951416, "global_step": 124559, "epoch": 741} {"train_loss": -10.570952415466309, "global_step": 124560, "epoch": 741} {"train_loss": -10.372674942016602, "global_step": 124561, "epoch": 741} {"train_loss": -10.382852554321289, "global_step": 124562, "epoch": 741} {"train_loss": -10.315961837768555, "global_step": 124563, "epoch": 741} {"train_loss": -10.311501502990723, "global_step": 124564, "epoch": 741} {"train_loss": -10.44589614868164, "global_step": 124565, "epoch": 741} {"train_loss": -10.018590927124023, "global_step": 124566, "epoch": 741} {"train_loss": -10.483701705932617, "global_step": 124567, "epoch": 741} {"train_loss": -10.329267501831055, "global_step": 124568, "epoch": 741} {"train_loss": -10.50515365600586, "global_step": 124569, "epoch": 741} {"train_loss": -10.496416091918945, "global_step": 124570, "epoch": 741} {"train_loss": -10.261931419372559, "global_step": 124571, "epoch": 741} {"train_loss": -10.470183372497559, "global_step": 124572, "epoch": 741} {"train_loss": -10.080402374267578, "global_step": 124573, "epoch": 741} {"train_loss": -10.631218910217285, "global_step": 124574, "epoch": 741} {"train_loss": -10.060712814331055, "global_step": 124575, "epoch": 741} {"train_loss": -9.703432083129883, "global_step": 124576, "epoch": 741} {"train_loss": -9.55748176574707, "global_step": 124577, "epoch": 741} {"train_loss": -9.968650817871094, "global_step": 124578, "epoch": 741} {"train_loss": -8.372201919555664, "global_step": 124579, "epoch": 741} {"train_loss": -10.284063339233398, "global_step": 124580, "epoch": 741} {"train_loss": -9.299554824829102, "global_step": 124581, "epoch": 741} {"train_loss": -10.23074722290039, "global_step": 124582, "epoch": 741} {"train_loss": -10.110906600952148, "global_step": 124583, "epoch": 741} {"train_loss": -9.508586883544922, "global_step": 124584, "epoch": 741} {"train_loss": -9.95528793334961, "global_step": 124585, "epoch": 741} {"train_loss": -9.751729965209961, "global_step": 124586, "epoch": 741} {"train_loss": -9.955370903015137, "global_step": 124587, "epoch": 741} {"train_loss": -9.872743606567383, "global_step": 124588, "epoch": 741} {"train_loss": -9.933744430541992, "global_step": 124589, "epoch": 741} {"train_loss": -10.038738250732422, "global_step": 124590, "epoch": 741} {"train_loss": -10.123054504394531, "global_step": 124591, "epoch": 741} {"train_loss": -10.115874290466309, "global_step": 124592, "epoch": 741} {"train_loss": -10.012712478637695, "global_step": 124593, "epoch": 741} {"train_loss": -10.132914543151855, "global_step": 124594, "epoch": 741} {"train_loss": -10.275328636169434, "global_step": 124595, "epoch": 741} {"train_loss": -10.092958450317383, "global_step": 124596, "epoch": 741} {"train_loss": -9.874683380126953, "global_step": 124597, "epoch": 741} {"train_loss": -10.209566116333008, "global_step": 124598, "epoch": 741} {"train_loss": -9.977603912353516, "global_step": 124599, "epoch": 741} {"train_loss": -10.176513671875, "global_step": 124600, "epoch": 741} {"train_loss": -10.148921966552734, "global_step": 124601, "epoch": 741} {"train_loss": -10.180192947387695, "global_step": 124602, "epoch": 741} {"train_loss": -10.090996742248535, "global_step": 124603, "epoch": 741} {"train_loss": -10.12216854095459, "global_step": 124604, "epoch": 741} {"train_loss": -9.9484224319458, "global_step": 124605, "epoch": 741} {"train_loss": -10.09130573272705, "global_step": 124606, "epoch": 741} {"train_loss": -10.138710975646973, "global_step": 124607, "epoch": 741} {"train_loss": -10.15156364440918, "global_step": 124608, "epoch": 741} {"train_loss": -10.181741714477539, "global_step": 124609, "epoch": 741} {"train_loss": -10.253768920898438, "global_step": 124610, "epoch": 741} {"train_loss": -10.230599403381348, "global_step": 124611, "epoch": 741} {"train_loss": -10.051162719726562, "global_step": 124612, "epoch": 741} {"train_loss": -10.30116081237793, "global_step": 124613, "epoch": 741} {"train_loss": -10.141484260559082, "global_step": 124614, "epoch": 741} {"train_loss": -10.213298797607422, "global_step": 124615, "epoch": 741} {"train_loss": -10.01895809173584, "global_step": 124616, "epoch": 741} {"train_loss": -10.066619873046875, "global_step": 124617, "epoch": 741} {"train_loss": -10.115617752075195, "global_step": 124618, "epoch": 741} {"train_loss": -9.794159889221191, "global_step": 124619, "epoch": 741} {"train_loss": -10.430974006652832, "global_step": 124620, "epoch": 741} {"train_loss": -10.384849548339844, "global_step": 124621, "epoch": 741} {"train_loss": -10.115375518798828, "global_step": 124622, "epoch": 741} {"train_loss": -10.34316635131836, "global_step": 124623, "epoch": 741} {"train_loss": -10.33883285522461, "global_step": 124624, "epoch": 741} {"train_loss": -10.106193542480469, "global_step": 124625, "epoch": 741} {"train_loss": -10.372871398925781, "global_step": 124626, "epoch": 741} {"train_loss": -10.187826156616211, "global_step": 124627, "epoch": 741} {"train_loss": -10.368667602539062, "global_step": 124628, "epoch": 741} {"train_loss": -10.282674789428711, "global_step": 124629, "epoch": 741} {"train_loss": -10.478950500488281, "global_step": 124630, "epoch": 741} {"train_loss": -10.414438247680664, "global_step": 124631, "epoch": 741} {"train_loss": -10.098882675170898, "global_step": 124632, "epoch": 741} {"train_loss": -10.361912727355957, "global_step": 124633, "epoch": 741} {"train_loss": -10.410526275634766, "global_step": 124634, "epoch": 741} {"train_loss": -10.486742973327637, "global_step": 124635, "epoch": 741} {"train_loss": -10.354025840759277, "global_step": 124636, "epoch": 741} {"train_loss": -10.63673210144043, "global_step": 124637, "epoch": 741} {"train_loss": -10.607559204101562, "global_step": 124638, "epoch": 741} {"train_loss": -10.346628189086914, "global_step": 124639, "epoch": 741} {"train_loss": -10.631531715393066, "global_step": 124640, "epoch": 741} {"train_loss": -10.21334457397461, "global_step": 124641, "epoch": 741} {"train_loss": -10.599384307861328, "global_step": 124642, "epoch": 741} {"train_loss": -10.027738571166992, "global_step": 124643, "epoch": 741} {"train_loss": -10.30062484741211, "global_step": 124644, "epoch": 741} {"train_loss": -10.125632286071777, "global_step": 124645, "epoch": 741} {"train_loss": -10.085328102111816, "global_step": 124646, "epoch": 741} {"train_loss": -10.110113143920898, "global_step": 124647, "epoch": 741} {"train_loss": -10.300178527832031, "global_step": 124648, "epoch": 741} {"train_loss": -9.948040008544922, "global_step": 124649, "epoch": 741} {"train_loss": -10.629528999328613, "global_step": 124650, "epoch": 741} {"train_loss": -9.848383903503418, "global_step": 124651, "epoch": 741} {"train_loss": -10.160369873046875, "global_step": 124652, "epoch": 741} {"train_loss": -9.87104320526123, "global_step": 124653, "epoch": 741} {"train_loss": -9.823492050170898, "global_step": 124654, "epoch": 741} {"train_loss": -10.12150656041645, "global_step": 124655, "epoch": 741, "val_loss": 215958.5625} {"train_loss": -9.339113235473633, "global_step": 124656, "epoch": 742} {"train_loss": -9.719324111938477, "global_step": 124657, "epoch": 742} {"train_loss": -9.664310455322266, "global_step": 124658, "epoch": 742} {"train_loss": -10.010345458984375, "global_step": 124659, "epoch": 742} {"train_loss": -9.934012413024902, "global_step": 124660, "epoch": 742} {"train_loss": -9.951844215393066, "global_step": 124661, "epoch": 742} {"train_loss": -9.763446807861328, "global_step": 124662, "epoch": 742} {"train_loss": -9.63363265991211, "global_step": 124663, "epoch": 742} {"train_loss": -10.065181732177734, "global_step": 124664, "epoch": 742} {"train_loss": -9.797807693481445, "global_step": 124665, "epoch": 742} {"train_loss": -10.036989212036133, "global_step": 124666, "epoch": 742} {"train_loss": -10.06784439086914, "global_step": 124667, "epoch": 742} {"train_loss": -10.017784118652344, "global_step": 124668, "epoch": 742} {"train_loss": -10.166332244873047, "global_step": 124669, "epoch": 742} {"train_loss": -10.085615158081055, "global_step": 124670, "epoch": 742} {"train_loss": -10.21479606628418, "global_step": 124671, "epoch": 742} {"train_loss": -10.165228843688965, "global_step": 124672, "epoch": 742} {"train_loss": -10.204452514648438, "global_step": 124673, "epoch": 742} {"train_loss": -10.081745147705078, "global_step": 124674, "epoch": 742} {"train_loss": -10.204475402832031, "global_step": 124675, "epoch": 742} {"train_loss": -9.982305526733398, "global_step": 124676, "epoch": 742} {"train_loss": -10.246749877929688, "global_step": 124677, "epoch": 742} {"train_loss": -10.237136840820312, "global_step": 124678, "epoch": 742} {"train_loss": -10.284780502319336, "global_step": 124679, "epoch": 742} {"train_loss": -10.565213203430176, "global_step": 124680, "epoch": 742} {"train_loss": -10.12769889831543, "global_step": 124681, "epoch": 742} {"train_loss": -10.051844596862793, "global_step": 124682, "epoch": 742} {"train_loss": -10.441858291625977, "global_step": 124683, "epoch": 742} {"train_loss": -10.097179412841797, "global_step": 124684, "epoch": 742} {"train_loss": -10.37938117980957, "global_step": 124685, "epoch": 742} {"train_loss": -10.09951114654541, "global_step": 124686, "epoch": 742} {"train_loss": -10.195487976074219, "global_step": 124687, "epoch": 742} {"train_loss": -10.262918472290039, "global_step": 124688, "epoch": 742} {"train_loss": -10.368427276611328, "global_step": 124689, "epoch": 742} {"train_loss": -10.254582405090332, "global_step": 124690, "epoch": 742} {"train_loss": -10.503586769104004, "global_step": 124691, "epoch": 742} {"train_loss": -10.617964744567871, "global_step": 124692, "epoch": 742} {"train_loss": -10.429248809814453, "global_step": 124693, "epoch": 742} {"train_loss": -10.368953704833984, "global_step": 124694, "epoch": 742} {"train_loss": -10.528705596923828, "global_step": 124695, "epoch": 742} {"train_loss": -10.326496124267578, "global_step": 124696, "epoch": 742} {"train_loss": -10.425081253051758, "global_step": 124697, "epoch": 742} {"train_loss": -10.653884887695312, "global_step": 124698, "epoch": 742} {"train_loss": -10.543184280395508, "global_step": 124699, "epoch": 742} {"train_loss": -10.596282958984375, "global_step": 124700, "epoch": 742} {"train_loss": -10.271027565002441, "global_step": 124701, "epoch": 742} {"train_loss": -10.479153633117676, "global_step": 124702, "epoch": 742} {"train_loss": -10.337642669677734, "global_step": 124703, "epoch": 742} {"train_loss": -10.414041519165039, "global_step": 124704, "epoch": 742} {"train_loss": -10.270148277282715, "global_step": 124705, "epoch": 742} {"train_loss": -10.584419250488281, "global_step": 124706, "epoch": 742} {"train_loss": -10.33453369140625, "global_step": 124707, "epoch": 742} {"train_loss": -10.293089866638184, "global_step": 124708, "epoch": 742} {"train_loss": -9.974601745605469, "global_step": 124709, "epoch": 742} {"train_loss": -10.335198402404785, "global_step": 124710, "epoch": 742} {"train_loss": -9.936758995056152, "global_step": 124711, "epoch": 742} {"train_loss": -10.317622184753418, "global_step": 124712, "epoch": 742} {"train_loss": -10.530107498168945, "global_step": 124713, "epoch": 742} {"train_loss": -10.448609352111816, "global_step": 124714, "epoch": 742} {"train_loss": -9.860796928405762, "global_step": 124715, "epoch": 742} {"train_loss": -10.317025184631348, "global_step": 124716, "epoch": 742} {"train_loss": -10.41320514678955, "global_step": 124717, "epoch": 742} {"train_loss": -9.74837875366211, "global_step": 124718, "epoch": 742} {"train_loss": -10.047859191894531, "global_step": 124719, "epoch": 742} {"train_loss": -10.202913284301758, "global_step": 124720, "epoch": 742} {"train_loss": -9.858255386352539, "global_step": 124721, "epoch": 742} {"train_loss": -10.128421783447266, "global_step": 124722, "epoch": 742} {"train_loss": -9.941034317016602, "global_step": 124723, "epoch": 742} {"train_loss": -10.102960586547852, "global_step": 124724, "epoch": 742} {"train_loss": -10.527497291564941, "global_step": 124725, "epoch": 742} {"train_loss": -10.10998249053955, "global_step": 124726, "epoch": 742} {"train_loss": -10.166460990905762, "global_step": 124727, "epoch": 742} {"train_loss": -9.993003845214844, "global_step": 124728, "epoch": 742} {"train_loss": -10.057577133178711, "global_step": 124729, "epoch": 742} {"train_loss": -10.167349815368652, "global_step": 124730, "epoch": 742} {"train_loss": -10.211691856384277, "global_step": 124731, "epoch": 742} {"train_loss": -10.271799087524414, "global_step": 124732, "epoch": 742} {"train_loss": -10.39278793334961, "global_step": 124733, "epoch": 742} {"train_loss": -10.377279281616211, "global_step": 124734, "epoch": 742} {"train_loss": -10.245361328125, "global_step": 124735, "epoch": 742} {"train_loss": -10.347606658935547, "global_step": 124736, "epoch": 742} {"train_loss": -10.26815414428711, "global_step": 124737, "epoch": 742} {"train_loss": -10.332842826843262, "global_step": 124738, "epoch": 742} {"train_loss": -10.376974105834961, "global_step": 124739, "epoch": 742} {"train_loss": -10.301559448242188, "global_step": 124740, "epoch": 742} {"train_loss": -9.908815383911133, "global_step": 124741, "epoch": 742} {"train_loss": -10.405609130859375, "global_step": 124742, "epoch": 742} {"train_loss": -10.180654525756836, "global_step": 124743, "epoch": 742} {"train_loss": -10.109859466552734, "global_step": 124744, "epoch": 742} {"train_loss": -10.329551696777344, "global_step": 124745, "epoch": 742} {"train_loss": -9.852209091186523, "global_step": 124746, "epoch": 742} {"train_loss": -10.373228073120117, "global_step": 124747, "epoch": 742} {"train_loss": -9.838443756103516, "global_step": 124748, "epoch": 742} {"train_loss": -9.83010196685791, "global_step": 124749, "epoch": 742} {"train_loss": -8.499666213989258, "global_step": 124750, "epoch": 742} {"train_loss": -10.429485321044922, "global_step": 124751, "epoch": 742} {"train_loss": -9.759513854980469, "global_step": 124752, "epoch": 742} {"train_loss": -10.100406646728516, "global_step": 124753, "epoch": 742} {"train_loss": -10.044363021850586, "global_step": 124754, "epoch": 742} {"train_loss": -10.334726333618164, "global_step": 124755, "epoch": 742} {"train_loss": -10.157411575317383, "global_step": 124756, "epoch": 742} {"train_loss": -10.38398551940918, "global_step": 124757, "epoch": 742} {"train_loss": -9.602457046508789, "global_step": 124758, "epoch": 742} {"train_loss": -10.232839584350586, "global_step": 124759, "epoch": 742} {"train_loss": -9.909637451171875, "global_step": 124760, "epoch": 742} {"train_loss": -10.139640808105469, "global_step": 124761, "epoch": 742} {"train_loss": -10.156692504882812, "global_step": 124762, "epoch": 742} {"train_loss": -9.89144515991211, "global_step": 124763, "epoch": 742} {"train_loss": -9.963473320007324, "global_step": 124764, "epoch": 742} {"train_loss": -10.125532150268555, "global_step": 124765, "epoch": 742} {"train_loss": -9.822668075561523, "global_step": 124766, "epoch": 742} {"train_loss": -10.145692825317383, "global_step": 124767, "epoch": 742} {"train_loss": -9.913445472717285, "global_step": 124768, "epoch": 742} {"train_loss": -10.113471984863281, "global_step": 124769, "epoch": 742} {"train_loss": -9.954373359680176, "global_step": 124770, "epoch": 742} {"train_loss": -9.991607666015625, "global_step": 124771, "epoch": 742} {"train_loss": -10.11955451965332, "global_step": 124772, "epoch": 742} {"train_loss": -10.138496398925781, "global_step": 124773, "epoch": 742} {"train_loss": -10.098970413208008, "global_step": 124774, "epoch": 742} {"train_loss": -10.364051818847656, "global_step": 124775, "epoch": 742} {"train_loss": -10.29616641998291, "global_step": 124776, "epoch": 742} {"train_loss": -10.244673728942871, "global_step": 124777, "epoch": 742} {"train_loss": -10.101173400878906, "global_step": 124778, "epoch": 742} {"train_loss": -10.241592407226562, "global_step": 124779, "epoch": 742} {"train_loss": -10.26317024230957, "global_step": 124780, "epoch": 742} {"train_loss": -10.272964477539062, "global_step": 124781, "epoch": 742} {"train_loss": -10.39847183227539, "global_step": 124782, "epoch": 742} {"train_loss": -10.31987190246582, "global_step": 124783, "epoch": 742} {"train_loss": -10.3711519241333, "global_step": 124784, "epoch": 742} {"train_loss": -10.512186050415039, "global_step": 124785, "epoch": 742} {"train_loss": -10.350921630859375, "global_step": 124786, "epoch": 742} {"train_loss": -10.555276870727539, "global_step": 124787, "epoch": 742} {"train_loss": -10.423770904541016, "global_step": 124788, "epoch": 742} {"train_loss": -10.339577674865723, "global_step": 124789, "epoch": 742} {"train_loss": -10.409653663635254, "global_step": 124790, "epoch": 742} {"train_loss": -10.35572338104248, "global_step": 124791, "epoch": 742} {"train_loss": -10.541626930236816, "global_step": 124792, "epoch": 742} {"train_loss": -10.605798721313477, "global_step": 124793, "epoch": 742} {"train_loss": -10.556375503540039, "global_step": 124794, "epoch": 742} {"train_loss": -10.507745742797852, "global_step": 124795, "epoch": 742} {"train_loss": -10.558832168579102, "global_step": 124796, "epoch": 742} {"train_loss": -10.550682067871094, "global_step": 124797, "epoch": 742} {"train_loss": -10.651180267333984, "global_step": 124798, "epoch": 742} {"train_loss": -10.502260208129883, "global_step": 124799, "epoch": 742} {"train_loss": -10.524234771728516, "global_step": 124800, "epoch": 742} {"train_loss": -10.390375137329102, "global_step": 124801, "epoch": 742} {"train_loss": -10.570369720458984, "global_step": 124802, "epoch": 742} {"train_loss": -10.676912307739258, "global_step": 124803, "epoch": 742} {"train_loss": -10.341606140136719, "global_step": 124804, "epoch": 742} {"train_loss": -10.588042259216309, "global_step": 124805, "epoch": 742} {"train_loss": -10.708578109741211, "global_step": 124806, "epoch": 742} {"train_loss": -10.404211044311523, "global_step": 124807, "epoch": 742} {"train_loss": -10.500036239624023, "global_step": 124808, "epoch": 742} {"train_loss": -10.495969772338867, "global_step": 124809, "epoch": 742} {"train_loss": -10.323022842407227, "global_step": 124810, "epoch": 742} {"train_loss": -10.261761665344238, "global_step": 124811, "epoch": 742} {"train_loss": -10.405462265014648, "global_step": 124812, "epoch": 742} {"train_loss": -10.473034858703613, "global_step": 124813, "epoch": 742} {"train_loss": -10.30724811553955, "global_step": 124814, "epoch": 742} {"train_loss": -10.129938125610352, "global_step": 124815, "epoch": 742} {"train_loss": -10.727470397949219, "global_step": 124816, "epoch": 742} {"train_loss": -10.57486629486084, "global_step": 124817, "epoch": 742} {"train_loss": -10.431377410888672, "global_step": 124818, "epoch": 742} {"train_loss": -10.404805183410645, "global_step": 124819, "epoch": 742} {"train_loss": -10.542648315429688, "global_step": 124820, "epoch": 742} {"train_loss": -10.210070610046387, "global_step": 124821, "epoch": 742} {"train_loss": -10.518341064453125, "global_step": 124822, "epoch": 742} {"train_loss": -10.23181084224156, "global_step": 124823, "epoch": 742, "val_loss": 215613.859375} {"train_loss": -9.94723892211914, "global_step": 124824, "epoch": 743} {"train_loss": -10.121264457702637, "global_step": 124825, "epoch": 743} {"train_loss": -10.084479331970215, "global_step": 124826, "epoch": 743} {"train_loss": -10.388896942138672, "global_step": 124827, "epoch": 743} {"train_loss": -9.706624984741211, "global_step": 124828, "epoch": 743} {"train_loss": -9.867619514465332, "global_step": 124829, "epoch": 743} {"train_loss": -10.28664779663086, "global_step": 124830, "epoch": 743} {"train_loss": -10.339696884155273, "global_step": 124831, "epoch": 743} {"train_loss": -10.179925918579102, "global_step": 124832, "epoch": 743} {"train_loss": -10.338890075683594, "global_step": 124833, "epoch": 743} {"train_loss": -10.154165267944336, "global_step": 124834, "epoch": 743} {"train_loss": -9.736989974975586, "global_step": 124835, "epoch": 743} {"train_loss": -10.337063789367676, "global_step": 124836, "epoch": 743} {"train_loss": -10.46030330657959, "global_step": 124837, "epoch": 743} {"train_loss": -10.059511184692383, "global_step": 124838, "epoch": 743} {"train_loss": -10.326105117797852, "global_step": 124839, "epoch": 743} {"train_loss": -10.195775985717773, "global_step": 124840, "epoch": 743} {"train_loss": -10.294404029846191, "global_step": 124841, "epoch": 743} {"train_loss": -10.320819854736328, "global_step": 124842, "epoch": 743} {"train_loss": -10.452224731445312, "global_step": 124843, "epoch": 743} {"train_loss": -10.525564193725586, "global_step": 124844, "epoch": 743} {"train_loss": -10.320587158203125, "global_step": 124845, "epoch": 743} {"train_loss": -10.306290626525879, "global_step": 124846, "epoch": 743} {"train_loss": -10.168615341186523, "global_step": 124847, "epoch": 743} {"train_loss": -10.205682754516602, "global_step": 124848, "epoch": 743} {"train_loss": -10.282979965209961, "global_step": 124849, "epoch": 743} {"train_loss": -10.325847625732422, "global_step": 124850, "epoch": 743} {"train_loss": -10.336196899414062, "global_step": 124851, "epoch": 743} {"train_loss": -10.185471534729004, "global_step": 124852, "epoch": 743} {"train_loss": -10.202913284301758, "global_step": 124853, "epoch": 743} {"train_loss": -10.263324737548828, "global_step": 124854, "epoch": 743} {"train_loss": -10.01987361907959, "global_step": 124855, "epoch": 743} {"train_loss": -10.062785148620605, "global_step": 124856, "epoch": 743} {"train_loss": -9.59682559967041, "global_step": 124857, "epoch": 743} {"train_loss": -9.570287704467773, "global_step": 124858, "epoch": 743} {"train_loss": -10.029239654541016, "global_step": 124859, "epoch": 743} {"train_loss": -9.907829284667969, "global_step": 124860, "epoch": 743} {"train_loss": -10.084781646728516, "global_step": 124861, "epoch": 743} {"train_loss": -10.162068367004395, "global_step": 124862, "epoch": 743} {"train_loss": -9.519155502319336, "global_step": 124863, "epoch": 743} {"train_loss": -10.235694885253906, "global_step": 124864, "epoch": 743} {"train_loss": -9.496335983276367, "global_step": 124865, "epoch": 743} {"train_loss": -9.633504867553711, "global_step": 124866, "epoch": 743} {"train_loss": -9.466493606567383, "global_step": 124867, "epoch": 743} {"train_loss": -9.775114059448242, "global_step": 124868, "epoch": 743} {"train_loss": -9.716896057128906, "global_step": 124869, "epoch": 743} {"train_loss": -10.057699203491211, "global_step": 124870, "epoch": 743} {"train_loss": -9.92269515991211, "global_step": 124871, "epoch": 743} {"train_loss": -10.106109619140625, "global_step": 124872, "epoch": 743} {"train_loss": -9.988381385803223, "global_step": 124873, "epoch": 743} {"train_loss": -9.46099853515625, "global_step": 124874, "epoch": 743} {"train_loss": -10.0813570022583, "global_step": 124875, "epoch": 743} {"train_loss": -9.881742477416992, "global_step": 124876, "epoch": 743} {"train_loss": -9.84752082824707, "global_step": 124877, "epoch": 743} {"train_loss": -10.072318077087402, "global_step": 124878, "epoch": 743} {"train_loss": -9.924973487854004, "global_step": 124879, "epoch": 743} {"train_loss": -9.861112594604492, "global_step": 124880, "epoch": 743} {"train_loss": -10.108463287353516, "global_step": 124881, "epoch": 743} {"train_loss": -9.565437316894531, "global_step": 124882, "epoch": 743} {"train_loss": -9.893223762512207, "global_step": 124883, "epoch": 743} {"train_loss": -10.131616592407227, "global_step": 124884, "epoch": 743} {"train_loss": -9.743673324584961, "global_step": 124885, "epoch": 743} {"train_loss": -10.160263061523438, "global_step": 124886, "epoch": 743} {"train_loss": -10.039155960083008, "global_step": 124887, "epoch": 743} {"train_loss": -9.964231491088867, "global_step": 124888, "epoch": 743} {"train_loss": -10.185909271240234, "global_step": 124889, "epoch": 743} {"train_loss": -10.297340393066406, "global_step": 124890, "epoch": 743} {"train_loss": -9.810198783874512, "global_step": 124891, "epoch": 743} {"train_loss": -10.12834358215332, "global_step": 124892, "epoch": 743} {"train_loss": -10.155867576599121, "global_step": 124893, "epoch": 743} {"train_loss": -10.167135238647461, "global_step": 124894, "epoch": 743} {"train_loss": -10.184858322143555, "global_step": 124895, "epoch": 743} {"train_loss": -10.342514038085938, "global_step": 124896, "epoch": 743} {"train_loss": -10.207284927368164, "global_step": 124897, "epoch": 743} {"train_loss": -10.450870513916016, "global_step": 124898, "epoch": 743} {"train_loss": -10.094144821166992, "global_step": 124899, "epoch": 743} {"train_loss": -10.246861457824707, "global_step": 124900, "epoch": 743} {"train_loss": -10.419203758239746, "global_step": 124901, "epoch": 743} {"train_loss": -10.00773811340332, "global_step": 124902, "epoch": 743} {"train_loss": -10.312873840332031, "global_step": 124903, "epoch": 743} {"train_loss": -10.227462768554688, "global_step": 124904, "epoch": 743} {"train_loss": -10.19368839263916, "global_step": 124905, "epoch": 743} {"train_loss": -10.408525466918945, "global_step": 124906, "epoch": 743} {"train_loss": -10.156227111816406, "global_step": 124907, "epoch": 743} {"train_loss": -10.26542854309082, "global_step": 124908, "epoch": 743} {"train_loss": -10.078594207763672, "global_step": 124909, "epoch": 743} {"train_loss": -10.221972465515137, "global_step": 124910, "epoch": 743} {"train_loss": -10.096946716308594, "global_step": 124911, "epoch": 743} {"train_loss": -10.517278671264648, "global_step": 124912, "epoch": 743} {"train_loss": -10.006668090820312, "global_step": 124913, "epoch": 743} {"train_loss": -10.2194185256958, "global_step": 124914, "epoch": 743} {"train_loss": -9.99148178100586, "global_step": 124915, "epoch": 743} {"train_loss": -10.2781400680542, "global_step": 124916, "epoch": 743} {"train_loss": -10.428088188171387, "global_step": 124917, "epoch": 743} {"train_loss": -10.209576606750488, "global_step": 124918, "epoch": 743} {"train_loss": -10.45510482788086, "global_step": 124919, "epoch": 743} {"train_loss": -10.310196876525879, "global_step": 124920, "epoch": 743} {"train_loss": -10.391051292419434, "global_step": 124921, "epoch": 743} {"train_loss": -10.573654174804688, "global_step": 124922, "epoch": 743} {"train_loss": -10.404129981994629, "global_step": 124923, "epoch": 743} {"train_loss": -10.572031021118164, "global_step": 124924, "epoch": 743} {"train_loss": -10.303886413574219, "global_step": 124925, "epoch": 743} {"train_loss": -10.429605484008789, "global_step": 124926, "epoch": 743} {"train_loss": -10.153558731079102, "global_step": 124927, "epoch": 743} {"train_loss": -10.185870170593262, "global_step": 124928, "epoch": 743} {"train_loss": -10.625564575195312, "global_step": 124929, "epoch": 743} {"train_loss": -10.419599533081055, "global_step": 124930, "epoch": 743} {"train_loss": -10.528791427612305, "global_step": 124931, "epoch": 743} {"train_loss": -10.455955505371094, "global_step": 124932, "epoch": 743} {"train_loss": -10.303887367248535, "global_step": 124933, "epoch": 743} {"train_loss": -10.335906982421875, "global_step": 124934, "epoch": 743} {"train_loss": -10.34819221496582, "global_step": 124935, "epoch": 743} {"train_loss": -10.5274658203125, "global_step": 124936, "epoch": 743} {"train_loss": -10.49027156829834, "global_step": 124937, "epoch": 743} {"train_loss": -9.915674209594727, "global_step": 124938, "epoch": 743} {"train_loss": -10.69525146484375, "global_step": 124939, "epoch": 743} {"train_loss": -10.497390747070312, "global_step": 124940, "epoch": 743} {"train_loss": -9.778400421142578, "global_step": 124941, "epoch": 743} {"train_loss": -10.421576499938965, "global_step": 124942, "epoch": 743} {"train_loss": -10.347386360168457, "global_step": 124943, "epoch": 743} {"train_loss": -10.435020446777344, "global_step": 124944, "epoch": 743} {"train_loss": -10.108213424682617, "global_step": 124945, "epoch": 743} {"train_loss": -10.637133598327637, "global_step": 124946, "epoch": 743} {"train_loss": -10.17352294921875, "global_step": 124947, "epoch": 743} {"train_loss": -9.820704460144043, "global_step": 124948, "epoch": 743} {"train_loss": -9.7307767868042, "global_step": 124949, "epoch": 743} {"train_loss": -10.461662292480469, "global_step": 124950, "epoch": 743} {"train_loss": -9.99303913116455, "global_step": 124951, "epoch": 743} {"train_loss": -10.008390426635742, "global_step": 124952, "epoch": 743} {"train_loss": -10.44345760345459, "global_step": 124953, "epoch": 743} {"train_loss": -9.769518852233887, "global_step": 124954, "epoch": 743} {"train_loss": -10.290435791015625, "global_step": 124955, "epoch": 743} {"train_loss": -9.943988800048828, "global_step": 124956, "epoch": 743} {"train_loss": -10.399413108825684, "global_step": 124957, "epoch": 743} {"train_loss": -10.360538482666016, "global_step": 124958, "epoch": 743} {"train_loss": -10.423847198486328, "global_step": 124959, "epoch": 743} {"train_loss": -10.202216148376465, "global_step": 124960, "epoch": 743} {"train_loss": -9.886823654174805, "global_step": 124961, "epoch": 743} {"train_loss": -10.286235809326172, "global_step": 124962, "epoch": 743} {"train_loss": -10.302384376525879, "global_step": 124963, "epoch": 743} {"train_loss": -10.198517799377441, "global_step": 124964, "epoch": 743} {"train_loss": -10.15155029296875, "global_step": 124965, "epoch": 743} {"train_loss": -9.98763370513916, "global_step": 124966, "epoch": 743} {"train_loss": -10.431219100952148, "global_step": 124967, "epoch": 743} {"train_loss": -10.331658363342285, "global_step": 124968, "epoch": 743} {"train_loss": -10.420940399169922, "global_step": 124969, "epoch": 743} {"train_loss": -10.322168350219727, "global_step": 124970, "epoch": 743} {"train_loss": -10.191265106201172, "global_step": 124971, "epoch": 743} {"train_loss": -10.354883193969727, "global_step": 124972, "epoch": 743} {"train_loss": -10.377843856811523, "global_step": 124973, "epoch": 743} {"train_loss": -9.944927215576172, "global_step": 124974, "epoch": 743} {"train_loss": -10.269731521606445, "global_step": 124975, "epoch": 743} {"train_loss": -10.06958293914795, "global_step": 124976, "epoch": 743} {"train_loss": -9.919641494750977, "global_step": 124977, "epoch": 743} {"train_loss": -10.073955535888672, "global_step": 124978, "epoch": 743} {"train_loss": -10.092512130737305, "global_step": 124979, "epoch": 743} {"train_loss": -10.287805557250977, "global_step": 124980, "epoch": 743} {"train_loss": -10.385885238647461, "global_step": 124981, "epoch": 743} {"train_loss": -9.78483772277832, "global_step": 124982, "epoch": 743} {"train_loss": -10.4130277633667, "global_step": 124983, "epoch": 743} {"train_loss": -10.180449485778809, "global_step": 124984, "epoch": 743} {"train_loss": -10.144514083862305, "global_step": 124985, "epoch": 743} {"train_loss": -10.20671272277832, "global_step": 124986, "epoch": 743} {"train_loss": -10.383607864379883, "global_step": 124987, "epoch": 743} {"train_loss": -10.238653182983398, "global_step": 124988, "epoch": 743} {"train_loss": -10.17343521118164, "global_step": 124989, "epoch": 743} {"train_loss": -10.275049209594727, "global_step": 124990, "epoch": 743} {"train_loss": -10.167809543155489, "global_step": 124991, "epoch": 743, "val_loss": 217590.546875} {"train_loss": -10.374799728393555, "global_step": 124992, "epoch": 744} {"train_loss": -10.027814865112305, "global_step": 124993, "epoch": 744} {"train_loss": -10.27668571472168, "global_step": 124994, "epoch": 744} {"train_loss": -10.121919631958008, "global_step": 124995, "epoch": 744} {"train_loss": -10.46464729309082, "global_step": 124996, "epoch": 744} {"train_loss": -9.870939254760742, "global_step": 124997, "epoch": 744} {"train_loss": -10.509674072265625, "global_step": 124998, "epoch": 744} {"train_loss": -9.704297065734863, "global_step": 124999, "epoch": 744} {"train_loss": -10.438240051269531, "global_step": 125000, "epoch": 744} {"train_loss": -9.739773750305176, "global_step": 125001, "epoch": 744} {"train_loss": -10.13270378112793, "global_step": 125002, "epoch": 744} {"train_loss": -10.170109748840332, "global_step": 125003, "epoch": 744} {"train_loss": -10.225997924804688, "global_step": 125004, "epoch": 744} {"train_loss": -10.416706085205078, "global_step": 125005, "epoch": 744} {"train_loss": -9.945302963256836, "global_step": 125006, "epoch": 744} {"train_loss": -10.489728927612305, "global_step": 125007, "epoch": 744} {"train_loss": -9.829446792602539, "global_step": 125008, "epoch": 744} {"train_loss": -10.11922836303711, "global_step": 125009, "epoch": 744} {"train_loss": -9.928606986999512, "global_step": 125010, "epoch": 744} {"train_loss": -10.412701606750488, "global_step": 125011, "epoch": 744} {"train_loss": -9.857014656066895, "global_step": 125012, "epoch": 744} {"train_loss": -9.902420043945312, "global_step": 125013, "epoch": 744} {"train_loss": -9.754915237426758, "global_step": 125014, "epoch": 744} {"train_loss": -10.180323600769043, "global_step": 125015, "epoch": 744} {"train_loss": -9.913162231445312, "global_step": 125016, "epoch": 744} {"train_loss": -10.325979232788086, "global_step": 125017, "epoch": 744} {"train_loss": -9.982625961303711, "global_step": 125018, "epoch": 744} {"train_loss": -10.221303939819336, "global_step": 125019, "epoch": 744} {"train_loss": -10.250008583068848, "global_step": 125020, "epoch": 744} {"train_loss": -9.976311683654785, "global_step": 125021, "epoch": 744} {"train_loss": -10.188579559326172, "global_step": 125022, "epoch": 744} {"train_loss": -10.187908172607422, "global_step": 125023, "epoch": 744} {"train_loss": -10.057273864746094, "global_step": 125024, "epoch": 744} {"train_loss": -10.311016082763672, "global_step": 125025, "epoch": 744} {"train_loss": -10.089694023132324, "global_step": 125026, "epoch": 744} {"train_loss": -10.557596206665039, "global_step": 125027, "epoch": 744} {"train_loss": -10.41171646118164, "global_step": 125028, "epoch": 744} {"train_loss": -10.408687591552734, "global_step": 125029, "epoch": 744} {"train_loss": -10.49673080444336, "global_step": 125030, "epoch": 744} {"train_loss": -10.43806266784668, "global_step": 125031, "epoch": 744} {"train_loss": -10.340563774108887, "global_step": 125032, "epoch": 744} {"train_loss": -10.44841194152832, "global_step": 125033, "epoch": 744} {"train_loss": -10.395423889160156, "global_step": 125034, "epoch": 744} {"train_loss": -10.426656723022461, "global_step": 125035, "epoch": 744} {"train_loss": -10.277475357055664, "global_step": 125036, "epoch": 744} {"train_loss": -10.426773071289062, "global_step": 125037, "epoch": 744} {"train_loss": -10.342164993286133, "global_step": 125038, "epoch": 744} {"train_loss": -10.419792175292969, "global_step": 125039, "epoch": 744} {"train_loss": -10.401556015014648, "global_step": 125040, "epoch": 744} {"train_loss": -10.659221649169922, "global_step": 125041, "epoch": 744} {"train_loss": -10.573492050170898, "global_step": 125042, "epoch": 744} {"train_loss": -10.390667915344238, "global_step": 125043, "epoch": 744} {"train_loss": -10.452309608459473, "global_step": 125044, "epoch": 744} {"train_loss": -10.590548515319824, "global_step": 125045, "epoch": 744} {"train_loss": -10.522489547729492, "global_step": 125046, "epoch": 744} {"train_loss": -10.370979309082031, "global_step": 125047, "epoch": 744} {"train_loss": -10.35812759399414, "global_step": 125048, "epoch": 744} {"train_loss": -10.370015144348145, "global_step": 125049, "epoch": 744} {"train_loss": -10.19883918762207, "global_step": 125050, "epoch": 744} {"train_loss": -10.295583724975586, "global_step": 125051, "epoch": 744} {"train_loss": -9.919962882995605, "global_step": 125052, "epoch": 744} {"train_loss": -10.485494613647461, "global_step": 125053, "epoch": 744} {"train_loss": -10.130544662475586, "global_step": 125054, "epoch": 744} {"train_loss": -10.430171966552734, "global_step": 125055, "epoch": 744} {"train_loss": -10.370954513549805, "global_step": 125056, "epoch": 744} {"train_loss": -10.3529052734375, "global_step": 125057, "epoch": 744} {"train_loss": -10.532175064086914, "global_step": 125058, "epoch": 744} {"train_loss": -10.117510795593262, "global_step": 125059, "epoch": 744} {"train_loss": -10.500801086425781, "global_step": 125060, "epoch": 744} {"train_loss": -10.343626022338867, "global_step": 125061, "epoch": 744} {"train_loss": -9.971346855163574, "global_step": 125062, "epoch": 744} {"train_loss": -10.372689247131348, "global_step": 125063, "epoch": 744} {"train_loss": -10.23531436920166, "global_step": 125064, "epoch": 744} {"train_loss": -10.598220825195312, "global_step": 125065, "epoch": 744} {"train_loss": -10.118449211120605, "global_step": 125066, "epoch": 744} {"train_loss": -10.314776420593262, "global_step": 125067, "epoch": 744} {"train_loss": -10.451879501342773, "global_step": 125068, "epoch": 744} {"train_loss": -10.231476783752441, "global_step": 125069, "epoch": 744} {"train_loss": -10.198373794555664, "global_step": 125070, "epoch": 744} {"train_loss": -10.098992347717285, "global_step": 125071, "epoch": 744} {"train_loss": -10.338933944702148, "global_step": 125072, "epoch": 744} {"train_loss": -10.2674560546875, "global_step": 125073, "epoch": 744} {"train_loss": -10.31873607635498, "global_step": 125074, "epoch": 744} {"train_loss": -10.04981517791748, "global_step": 125075, "epoch": 744} {"train_loss": -10.166954040527344, "global_step": 125076, "epoch": 744} {"train_loss": -10.518274307250977, "global_step": 125077, "epoch": 744} {"train_loss": -10.331585884094238, "global_step": 125078, "epoch": 744} {"train_loss": -10.169706344604492, "global_step": 125079, "epoch": 744} {"train_loss": -10.373922348022461, "global_step": 125080, "epoch": 744} {"train_loss": -9.952166557312012, "global_step": 125081, "epoch": 744} {"train_loss": -10.310665130615234, "global_step": 125082, "epoch": 744} {"train_loss": -10.287294387817383, "global_step": 125083, "epoch": 744} {"train_loss": -10.372611999511719, "global_step": 125084, "epoch": 744} {"train_loss": -10.314138412475586, "global_step": 125085, "epoch": 744} {"train_loss": -10.218071937561035, "global_step": 125086, "epoch": 744} {"train_loss": -10.474864959716797, "global_step": 125087, "epoch": 744} {"train_loss": -10.321884155273438, "global_step": 125088, "epoch": 744} {"train_loss": -10.490635871887207, "global_step": 125089, "epoch": 744} {"train_loss": -10.345863342285156, "global_step": 125090, "epoch": 744} {"train_loss": -10.330215454101562, "global_step": 125091, "epoch": 744} {"train_loss": -10.399621963500977, "global_step": 125092, "epoch": 744} {"train_loss": -10.390705108642578, "global_step": 125093, "epoch": 744} {"train_loss": -10.335710525512695, "global_step": 125094, "epoch": 744} {"train_loss": -10.451459884643555, "global_step": 125095, "epoch": 744} {"train_loss": -10.3764066696167, "global_step": 125096, "epoch": 744} {"train_loss": -10.315715789794922, "global_step": 125097, "epoch": 744} {"train_loss": -10.592131614685059, "global_step": 125098, "epoch": 744} {"train_loss": -10.535346031188965, "global_step": 125099, "epoch": 744} {"train_loss": -10.234784126281738, "global_step": 125100, "epoch": 744} {"train_loss": -10.441764831542969, "global_step": 125101, "epoch": 744} {"train_loss": -10.692025184631348, "global_step": 125102, "epoch": 744} {"train_loss": -10.369224548339844, "global_step": 125103, "epoch": 744} {"train_loss": -10.430801391601562, "global_step": 125104, "epoch": 744} {"train_loss": -10.27612590789795, "global_step": 125105, "epoch": 744} {"train_loss": -10.629608154296875, "global_step": 125106, "epoch": 744} {"train_loss": -10.483304023742676, "global_step": 125107, "epoch": 744} {"train_loss": -10.733025550842285, "global_step": 125108, "epoch": 744} {"train_loss": -10.41893196105957, "global_step": 125109, "epoch": 744} {"train_loss": -10.31784439086914, "global_step": 125110, "epoch": 744} {"train_loss": -10.154967308044434, "global_step": 125111, "epoch": 744} {"train_loss": -10.126201629638672, "global_step": 125112, "epoch": 744} {"train_loss": -10.310832977294922, "global_step": 125113, "epoch": 744} {"train_loss": -10.0484619140625, "global_step": 125114, "epoch": 744} {"train_loss": -9.852867126464844, "global_step": 125115, "epoch": 744} {"train_loss": -10.568157196044922, "global_step": 125116, "epoch": 744} {"train_loss": -9.29010009765625, "global_step": 125117, "epoch": 744} {"train_loss": -10.182376861572266, "global_step": 125118, "epoch": 744} {"train_loss": -9.57043170928955, "global_step": 125119, "epoch": 744} {"train_loss": -10.176496505737305, "global_step": 125120, "epoch": 744} {"train_loss": -9.92251205444336, "global_step": 125121, "epoch": 744} {"train_loss": -9.805509567260742, "global_step": 125122, "epoch": 744} {"train_loss": -9.730690002441406, "global_step": 125123, "epoch": 744} {"train_loss": -9.711112976074219, "global_step": 125124, "epoch": 744} {"train_loss": -10.143026351928711, "global_step": 125125, "epoch": 744} {"train_loss": -9.42831802368164, "global_step": 125126, "epoch": 744} {"train_loss": -9.818140029907227, "global_step": 125127, "epoch": 744} {"train_loss": -9.984368324279785, "global_step": 125128, "epoch": 744} {"train_loss": -9.849854469299316, "global_step": 125129, "epoch": 744} {"train_loss": -9.917104721069336, "global_step": 125130, "epoch": 744} {"train_loss": -10.461674690246582, "global_step": 125131, "epoch": 744} {"train_loss": -10.030017852783203, "global_step": 125132, "epoch": 744} {"train_loss": -10.123767852783203, "global_step": 125133, "epoch": 744} {"train_loss": -10.081682205200195, "global_step": 125134, "epoch": 744} {"train_loss": -10.089214324951172, "global_step": 125135, "epoch": 744} {"train_loss": -10.166728973388672, "global_step": 125136, "epoch": 744} {"train_loss": -10.136178970336914, "global_step": 125137, "epoch": 744} {"train_loss": -10.085679054260254, "global_step": 125138, "epoch": 744} {"train_loss": -10.142769813537598, "global_step": 125139, "epoch": 744} {"train_loss": -10.089397430419922, "global_step": 125140, "epoch": 744} {"train_loss": -10.052345275878906, "global_step": 125141, "epoch": 744} {"train_loss": -10.237641334533691, "global_step": 125142, "epoch": 744} {"train_loss": -10.296662330627441, "global_step": 125143, "epoch": 744} {"train_loss": -10.176248550415039, "global_step": 125144, "epoch": 744} {"train_loss": -10.253533363342285, "global_step": 125145, "epoch": 744} {"train_loss": -10.223919868469238, "global_step": 125146, "epoch": 744} {"train_loss": -10.315736770629883, "global_step": 125147, "epoch": 744} {"train_loss": -9.998558044433594, "global_step": 125148, "epoch": 744} {"train_loss": -10.353611946105957, "global_step": 125149, "epoch": 744} {"train_loss": -10.153974533081055, "global_step": 125150, "epoch": 744} {"train_loss": -10.376319885253906, "global_step": 125151, "epoch": 744} {"train_loss": -9.699013710021973, "global_step": 125152, "epoch": 744} {"train_loss": -10.473995208740234, "global_step": 125153, "epoch": 744} {"train_loss": -9.964988708496094, "global_step": 125154, "epoch": 744} {"train_loss": -10.137505531311035, "global_step": 125155, "epoch": 744} {"train_loss": -9.965436935424805, "global_step": 125156, "epoch": 744} {"train_loss": -10.410050392150879, "global_step": 125157, "epoch": 744} {"train_loss": -10.02375316619873, "global_step": 125158, "epoch": 744} {"train_loss": -10.229716215814863, "global_step": 125159, "epoch": 744, "val_loss": 218218.109375} {"train_loss": -9.942670822143555, "global_step": 125160, "epoch": 745} {"train_loss": -9.941133499145508, "global_step": 125161, "epoch": 745} {"train_loss": -10.036478042602539, "global_step": 125162, "epoch": 745} {"train_loss": -9.889241218566895, "global_step": 125163, "epoch": 745} {"train_loss": -9.93734073638916, "global_step": 125164, "epoch": 745} {"train_loss": -10.242677688598633, "global_step": 125165, "epoch": 745} {"train_loss": -9.674154281616211, "global_step": 125166, "epoch": 745} {"train_loss": -10.2719144821167, "global_step": 125167, "epoch": 745} {"train_loss": -9.549725532531738, "global_step": 125168, "epoch": 745} {"train_loss": -10.055776596069336, "global_step": 125169, "epoch": 745} {"train_loss": -9.759449005126953, "global_step": 125170, "epoch": 745} {"train_loss": -10.256929397583008, "global_step": 125171, "epoch": 745} {"train_loss": -9.828022956848145, "global_step": 125172, "epoch": 745} {"train_loss": -10.22810173034668, "global_step": 125173, "epoch": 745} {"train_loss": -10.08337116241455, "global_step": 125174, "epoch": 745} {"train_loss": -10.14149284362793, "global_step": 125175, "epoch": 745} {"train_loss": -9.986491203308105, "global_step": 125176, "epoch": 745} {"train_loss": -10.232955932617188, "global_step": 125177, "epoch": 745} {"train_loss": -10.330367088317871, "global_step": 125178, "epoch": 745} {"train_loss": -10.453226089477539, "global_step": 125179, "epoch": 745} {"train_loss": -10.176639556884766, "global_step": 125180, "epoch": 745} {"train_loss": -10.237056732177734, "global_step": 125181, "epoch": 745} {"train_loss": -10.07490348815918, "global_step": 125182, "epoch": 745} {"train_loss": -10.232110023498535, "global_step": 125183, "epoch": 745} {"train_loss": -10.344619750976562, "global_step": 125184, "epoch": 745} {"train_loss": -9.971698760986328, "global_step": 125185, "epoch": 745} {"train_loss": -10.393436431884766, "global_step": 125186, "epoch": 745} {"train_loss": -10.338441848754883, "global_step": 125187, "epoch": 745} {"train_loss": -10.299880981445312, "global_step": 125188, "epoch": 745} {"train_loss": -10.213102340698242, "global_step": 125189, "epoch": 745} {"train_loss": -10.46695327758789, "global_step": 125190, "epoch": 745} {"train_loss": -10.387428283691406, "global_step": 125191, "epoch": 745} {"train_loss": -10.346449851989746, "global_step": 125192, "epoch": 745} {"train_loss": -10.549749374389648, "global_step": 125193, "epoch": 745} {"train_loss": -10.227038383483887, "global_step": 125194, "epoch": 745} {"train_loss": -10.329345703125, "global_step": 125195, "epoch": 745} {"train_loss": -10.277006149291992, "global_step": 125196, "epoch": 745} {"train_loss": -10.228832244873047, "global_step": 125197, "epoch": 745} {"train_loss": -10.422086715698242, "global_step": 125198, "epoch": 745} {"train_loss": -10.330302238464355, "global_step": 125199, "epoch": 745} {"train_loss": -10.30810546875, "global_step": 125200, "epoch": 745} {"train_loss": -10.404172897338867, "global_step": 125201, "epoch": 745} {"train_loss": -10.044391632080078, "global_step": 125202, "epoch": 745} {"train_loss": -10.518675804138184, "global_step": 125203, "epoch": 745} {"train_loss": -10.315923690795898, "global_step": 125204, "epoch": 745} {"train_loss": -10.181249618530273, "global_step": 125205, "epoch": 745} {"train_loss": -10.17800521850586, "global_step": 125206, "epoch": 745} {"train_loss": -10.30258560180664, "global_step": 125207, "epoch": 745} {"train_loss": -10.133854866027832, "global_step": 125208, "epoch": 745} {"train_loss": -10.3132905960083, "global_step": 125209, "epoch": 745} {"train_loss": -10.029230117797852, "global_step": 125210, "epoch": 745} {"train_loss": -10.517133712768555, "global_step": 125211, "epoch": 745} {"train_loss": -10.012554168701172, "global_step": 125212, "epoch": 745} {"train_loss": -10.020740509033203, "global_step": 125213, "epoch": 745} {"train_loss": -10.005624771118164, "global_step": 125214, "epoch": 745} {"train_loss": -10.119661331176758, "global_step": 125215, "epoch": 745} {"train_loss": -9.985952377319336, "global_step": 125216, "epoch": 745} {"train_loss": -9.876134872436523, "global_step": 125217, "epoch": 745} {"train_loss": -10.101770401000977, "global_step": 125218, "epoch": 745} {"train_loss": -9.996696472167969, "global_step": 125219, "epoch": 745} {"train_loss": -9.731111526489258, "global_step": 125220, "epoch": 745} {"train_loss": -10.111274719238281, "global_step": 125221, "epoch": 745} {"train_loss": -10.035140991210938, "global_step": 125222, "epoch": 745} {"train_loss": -10.27253246307373, "global_step": 125223, "epoch": 745} {"train_loss": -9.675294876098633, "global_step": 125224, "epoch": 745} {"train_loss": -10.432549476623535, "global_step": 125225, "epoch": 745} {"train_loss": -9.825754165649414, "global_step": 125226, "epoch": 745} {"train_loss": -10.22500228881836, "global_step": 125227, "epoch": 745} {"train_loss": -10.152861595153809, "global_step": 125228, "epoch": 745} {"train_loss": -10.22477912902832, "global_step": 125229, "epoch": 745} {"train_loss": -10.165803909301758, "global_step": 125230, "epoch": 745} {"train_loss": -10.370781898498535, "global_step": 125231, "epoch": 745} {"train_loss": -10.119918823242188, "global_step": 125232, "epoch": 745} {"train_loss": -10.123412132263184, "global_step": 125233, "epoch": 745} {"train_loss": -10.30133056640625, "global_step": 125234, "epoch": 745} {"train_loss": -10.196725845336914, "global_step": 125235, "epoch": 745} {"train_loss": -10.291645050048828, "global_step": 125236, "epoch": 745} {"train_loss": -10.204977035522461, "global_step": 125237, "epoch": 745} {"train_loss": -10.501718521118164, "global_step": 125238, "epoch": 745} {"train_loss": -10.315926551818848, "global_step": 125239, "epoch": 745} {"train_loss": -10.201794624328613, "global_step": 125240, "epoch": 745} {"train_loss": -10.4144868850708, "global_step": 125241, "epoch": 745} {"train_loss": -10.426111221313477, "global_step": 125242, "epoch": 745} {"train_loss": -10.466913223266602, "global_step": 125243, "epoch": 745} {"train_loss": -10.508926391601562, "global_step": 125244, "epoch": 745} {"train_loss": -10.27874755859375, "global_step": 125245, "epoch": 745} {"train_loss": -10.443452835083008, "global_step": 125246, "epoch": 745} {"train_loss": -10.452278137207031, "global_step": 125247, "epoch": 745} {"train_loss": -10.255596160888672, "global_step": 125248, "epoch": 745} {"train_loss": -10.270978927612305, "global_step": 125249, "epoch": 745} {"train_loss": -10.385021209716797, "global_step": 125250, "epoch": 745} {"train_loss": -10.208721160888672, "global_step": 125251, "epoch": 745} {"train_loss": -10.566211700439453, "global_step": 125252, "epoch": 745} {"train_loss": -10.527593612670898, "global_step": 125253, "epoch": 745} {"train_loss": -10.283763885498047, "global_step": 125254, "epoch": 745} {"train_loss": -10.51196575164795, "global_step": 125255, "epoch": 745} {"train_loss": -10.56064510345459, "global_step": 125256, "epoch": 745} {"train_loss": -10.639341354370117, "global_step": 125257, "epoch": 745} {"train_loss": -10.520371437072754, "global_step": 125258, "epoch": 745} {"train_loss": -10.221945762634277, "global_step": 125259, "epoch": 745} {"train_loss": -10.717512130737305, "global_step": 125260, "epoch": 745} {"train_loss": -10.341755867004395, "global_step": 125261, "epoch": 745} {"train_loss": -10.478877067565918, "global_step": 125262, "epoch": 745} {"train_loss": -10.518693923950195, "global_step": 125263, "epoch": 745} {"train_loss": -10.461366653442383, "global_step": 125264, "epoch": 745} {"train_loss": -10.7978515625, "global_step": 125265, "epoch": 745} {"train_loss": -10.565624237060547, "global_step": 125266, "epoch": 745} {"train_loss": -10.593013763427734, "global_step": 125267, "epoch": 745} {"train_loss": -10.380492210388184, "global_step": 125268, "epoch": 745} {"train_loss": -10.59054946899414, "global_step": 125269, "epoch": 745} {"train_loss": -10.477060317993164, "global_step": 125270, "epoch": 745} {"train_loss": -10.182090759277344, "global_step": 125271, "epoch": 745} {"train_loss": -10.038392066955566, "global_step": 125272, "epoch": 745} {"train_loss": -10.442838668823242, "global_step": 125273, "epoch": 745} {"train_loss": -10.392303466796875, "global_step": 125274, "epoch": 745} {"train_loss": -9.706371307373047, "global_step": 125275, "epoch": 745} {"train_loss": -9.944574356079102, "global_step": 125276, "epoch": 745} {"train_loss": -10.127304077148438, "global_step": 125277, "epoch": 745} {"train_loss": -9.484768867492676, "global_step": 125278, "epoch": 745} {"train_loss": -10.199283599853516, "global_step": 125279, "epoch": 745} {"train_loss": -9.945703506469727, "global_step": 125280, "epoch": 745} {"train_loss": -10.122293472290039, "global_step": 125281, "epoch": 745} {"train_loss": -10.134540557861328, "global_step": 125282, "epoch": 745} {"train_loss": -10.561477661132812, "global_step": 125283, "epoch": 745} {"train_loss": -10.39869499206543, "global_step": 125284, "epoch": 745} {"train_loss": -10.61320972442627, "global_step": 125285, "epoch": 745} {"train_loss": -10.491312026977539, "global_step": 125286, "epoch": 745} {"train_loss": -10.126153945922852, "global_step": 125287, "epoch": 745} {"train_loss": -10.206953048706055, "global_step": 125288, "epoch": 745} {"train_loss": -10.106693267822266, "global_step": 125289, "epoch": 745} {"train_loss": -10.234159469604492, "global_step": 125290, "epoch": 745} {"train_loss": -10.043601989746094, "global_step": 125291, "epoch": 745} {"train_loss": -10.234245300292969, "global_step": 125292, "epoch": 745} {"train_loss": -10.208809852600098, "global_step": 125293, "epoch": 745} {"train_loss": -10.503132820129395, "global_step": 125294, "epoch": 745} {"train_loss": -10.341503143310547, "global_step": 125295, "epoch": 745} {"train_loss": -10.274673461914062, "global_step": 125296, "epoch": 745} {"train_loss": -10.232440948486328, "global_step": 125297, "epoch": 745} {"train_loss": -10.338489532470703, "global_step": 125298, "epoch": 745} {"train_loss": -10.125629425048828, "global_step": 125299, "epoch": 745} {"train_loss": -10.206903457641602, "global_step": 125300, "epoch": 745} {"train_loss": -10.364439010620117, "global_step": 125301, "epoch": 745} {"train_loss": -10.408781051635742, "global_step": 125302, "epoch": 745} {"train_loss": -10.305471420288086, "global_step": 125303, "epoch": 745} {"train_loss": -10.525616645812988, "global_step": 125304, "epoch": 745} {"train_loss": -10.288800239562988, "global_step": 125305, "epoch": 745} {"train_loss": -10.110898971557617, "global_step": 125306, "epoch": 745} {"train_loss": -10.180671691894531, "global_step": 125307, "epoch": 745} {"train_loss": -10.36700439453125, "global_step": 125308, "epoch": 745} {"train_loss": -10.099353790283203, "global_step": 125309, "epoch": 745} {"train_loss": -10.06149673461914, "global_step": 125310, "epoch": 745} {"train_loss": -10.057567596435547, "global_step": 125311, "epoch": 745} {"train_loss": -10.083540916442871, "global_step": 125312, "epoch": 745} {"train_loss": -10.125166893005371, "global_step": 125313, "epoch": 745} {"train_loss": -10.376975059509277, "global_step": 125314, "epoch": 745} {"train_loss": -10.42967414855957, "global_step": 125315, "epoch": 745} {"train_loss": -10.283397674560547, "global_step": 125316, "epoch": 745} {"train_loss": -10.3399658203125, "global_step": 125317, "epoch": 745} {"train_loss": -10.032236099243164, "global_step": 125318, "epoch": 745} {"train_loss": -10.493200302124023, "global_step": 125319, "epoch": 745} {"train_loss": -10.145964622497559, "global_step": 125320, "epoch": 745} {"train_loss": -10.63060474395752, "global_step": 125321, "epoch": 745} {"train_loss": -10.36021900177002, "global_step": 125322, "epoch": 745} {"train_loss": -10.231671333312988, "global_step": 125323, "epoch": 745} {"train_loss": -10.31432819366455, "global_step": 125324, "epoch": 745} {"train_loss": -9.970941543579102, "global_step": 125325, "epoch": 745} {"train_loss": -10.248847007751465, "global_step": 125326, "epoch": 745} {"train_loss": -10.24094577630361, "global_step": 125327, "epoch": 745, "val_loss": 218478.421875, "train_action_mse_error": 1.217966079711914} {"train_loss": -10.23185920715332, "global_step": 125328, "epoch": 746} {"train_loss": -10.628439903259277, "global_step": 125329, "epoch": 746} {"train_loss": -10.211013793945312, "global_step": 125330, "epoch": 746} {"train_loss": -10.163872718811035, "global_step": 125331, "epoch": 746} {"train_loss": -9.669344902038574, "global_step": 125332, "epoch": 746} {"train_loss": -10.164077758789062, "global_step": 125333, "epoch": 746} {"train_loss": -9.866104125976562, "global_step": 125334, "epoch": 746} {"train_loss": -10.511066436767578, "global_step": 125335, "epoch": 746} {"train_loss": -10.072712898254395, "global_step": 125336, "epoch": 746} {"train_loss": -10.338064193725586, "global_step": 125337, "epoch": 746} {"train_loss": -10.294163703918457, "global_step": 125338, "epoch": 746} {"train_loss": -10.220105171203613, "global_step": 125339, "epoch": 746} {"train_loss": -10.47845458984375, "global_step": 125340, "epoch": 746} {"train_loss": -10.183666229248047, "global_step": 125341, "epoch": 746} {"train_loss": -10.349055290222168, "global_step": 125342, "epoch": 746} {"train_loss": -10.279388427734375, "global_step": 125343, "epoch": 746} {"train_loss": -10.430902481079102, "global_step": 125344, "epoch": 746} {"train_loss": -10.372968673706055, "global_step": 125345, "epoch": 746} {"train_loss": -10.209512710571289, "global_step": 125346, "epoch": 746} {"train_loss": -10.258750915527344, "global_step": 125347, "epoch": 746} {"train_loss": -10.397464752197266, "global_step": 125348, "epoch": 746} {"train_loss": -10.096917152404785, "global_step": 125349, "epoch": 746} {"train_loss": -10.427511215209961, "global_step": 125350, "epoch": 746} {"train_loss": -10.31778621673584, "global_step": 125351, "epoch": 746} {"train_loss": -10.453438758850098, "global_step": 125352, "epoch": 746} {"train_loss": -10.29378890991211, "global_step": 125353, "epoch": 746} {"train_loss": -9.868101119995117, "global_step": 125354, "epoch": 746} {"train_loss": -9.773777961730957, "global_step": 125355, "epoch": 746} {"train_loss": -10.267772674560547, "global_step": 125356, "epoch": 746} {"train_loss": -9.739295959472656, "global_step": 125357, "epoch": 746} {"train_loss": -9.313928604125977, "global_step": 125358, "epoch": 746} {"train_loss": -10.261504173278809, "global_step": 125359, "epoch": 746} {"train_loss": -9.173120498657227, "global_step": 125360, "epoch": 746} {"train_loss": -9.471196174621582, "global_step": 125361, "epoch": 746} {"train_loss": -9.8594970703125, "global_step": 125362, "epoch": 746} {"train_loss": -9.742170333862305, "global_step": 125363, "epoch": 746} {"train_loss": -9.782501220703125, "global_step": 125364, "epoch": 746} {"train_loss": -9.795302391052246, "global_step": 125365, "epoch": 746} {"train_loss": -9.70195484161377, "global_step": 125366, "epoch": 746} {"train_loss": -9.825596809387207, "global_step": 125367, "epoch": 746} {"train_loss": -10.277433395385742, "global_step": 125368, "epoch": 746} {"train_loss": -9.563484191894531, "global_step": 125369, "epoch": 746} {"train_loss": -10.061966896057129, "global_step": 125370, "epoch": 746} {"train_loss": -10.072758674621582, "global_step": 125371, "epoch": 746} {"train_loss": -9.673004150390625, "global_step": 125372, "epoch": 746} {"train_loss": -10.034355163574219, "global_step": 125373, "epoch": 746} {"train_loss": -10.423008918762207, "global_step": 125374, "epoch": 746} {"train_loss": -9.708198547363281, "global_step": 125375, "epoch": 746} {"train_loss": -10.179487228393555, "global_step": 125376, "epoch": 746} {"train_loss": -10.10055160522461, "global_step": 125377, "epoch": 746} {"train_loss": -9.814997673034668, "global_step": 125378, "epoch": 746} {"train_loss": -10.05634880065918, "global_step": 125379, "epoch": 746} {"train_loss": -10.285049438476562, "global_step": 125380, "epoch": 746} {"train_loss": -9.992450714111328, "global_step": 125381, "epoch": 746} {"train_loss": -10.204011917114258, "global_step": 125382, "epoch": 746} {"train_loss": -10.097673416137695, "global_step": 125383, "epoch": 746} {"train_loss": -10.040678977966309, "global_step": 125384, "epoch": 746} {"train_loss": -9.901256561279297, "global_step": 125385, "epoch": 746} {"train_loss": -10.171716690063477, "global_step": 125386, "epoch": 746} {"train_loss": -10.1543550491333, "global_step": 125387, "epoch": 746} {"train_loss": -10.393365859985352, "global_step": 125388, "epoch": 746} {"train_loss": -10.245802879333496, "global_step": 125389, "epoch": 746} {"train_loss": -10.238130569458008, "global_step": 125390, "epoch": 746} {"train_loss": -10.280328750610352, "global_step": 125391, "epoch": 746} {"train_loss": -10.216007232666016, "global_step": 125392, "epoch": 746} {"train_loss": -10.425752639770508, "global_step": 125393, "epoch": 746} {"train_loss": -10.412317276000977, "global_step": 125394, "epoch": 746} {"train_loss": -10.015453338623047, "global_step": 125395, "epoch": 746} {"train_loss": -10.431159973144531, "global_step": 125396, "epoch": 746} {"train_loss": -10.220442771911621, "global_step": 125397, "epoch": 746} {"train_loss": -10.549726486206055, "global_step": 125398, "epoch": 746} {"train_loss": -10.325621604919434, "global_step": 125399, "epoch": 746} {"train_loss": -10.492687225341797, "global_step": 125400, "epoch": 746} {"train_loss": -10.464954376220703, "global_step": 125401, "epoch": 746} {"train_loss": -10.533265113830566, "global_step": 125402, "epoch": 746} {"train_loss": -10.422294616699219, "global_step": 125403, "epoch": 746} {"train_loss": -10.582173347473145, "global_step": 125404, "epoch": 746} {"train_loss": -10.52817440032959, "global_step": 125405, "epoch": 746} {"train_loss": -10.508588790893555, "global_step": 125406, "epoch": 746} {"train_loss": -10.607933044433594, "global_step": 125407, "epoch": 746} {"train_loss": -10.671964645385742, "global_step": 125408, "epoch": 746} {"train_loss": -10.753061294555664, "global_step": 125409, "epoch": 746} {"train_loss": -10.361656188964844, "global_step": 125410, "epoch": 746} {"train_loss": -10.53864574432373, "global_step": 125411, "epoch": 746} {"train_loss": -10.57274055480957, "global_step": 125412, "epoch": 746} {"train_loss": -10.338333129882812, "global_step": 125413, "epoch": 746} {"train_loss": -10.659607887268066, "global_step": 125414, "epoch": 746} {"train_loss": -10.438037872314453, "global_step": 125415, "epoch": 746} {"train_loss": -10.140153884887695, "global_step": 125416, "epoch": 746} {"train_loss": -10.294386863708496, "global_step": 125417, "epoch": 746} {"train_loss": -9.947345733642578, "global_step": 125418, "epoch": 746} {"train_loss": -10.388036727905273, "global_step": 125419, "epoch": 746} {"train_loss": -9.93725872039795, "global_step": 125420, "epoch": 746} {"train_loss": -9.906688690185547, "global_step": 125421, "epoch": 746} {"train_loss": -10.470194816589355, "global_step": 125422, "epoch": 746} {"train_loss": -10.133086204528809, "global_step": 125423, "epoch": 746} {"train_loss": -10.412802696228027, "global_step": 125424, "epoch": 746} {"train_loss": -10.126311302185059, "global_step": 125425, "epoch": 746} {"train_loss": -9.809606552124023, "global_step": 125426, "epoch": 746} {"train_loss": -10.043313980102539, "global_step": 125427, "epoch": 746} {"train_loss": -10.114950180053711, "global_step": 125428, "epoch": 746} {"train_loss": -9.904987335205078, "global_step": 125429, "epoch": 746} {"train_loss": -10.085897445678711, "global_step": 125430, "epoch": 746} {"train_loss": -10.096681594848633, "global_step": 125431, "epoch": 746} {"train_loss": -8.479284286499023, "global_step": 125432, "epoch": 746} {"train_loss": -10.384544372558594, "global_step": 125433, "epoch": 746} {"train_loss": -9.827640533447266, "global_step": 125434, "epoch": 746} {"train_loss": -9.567785263061523, "global_step": 125435, "epoch": 746} {"train_loss": -10.428149223327637, "global_step": 125436, "epoch": 746} {"train_loss": -9.34421157836914, "global_step": 125437, "epoch": 746} {"train_loss": -9.898859024047852, "global_step": 125438, "epoch": 746} {"train_loss": -9.707921981811523, "global_step": 125439, "epoch": 746} {"train_loss": -9.715274810791016, "global_step": 125440, "epoch": 746} {"train_loss": -9.935501098632812, "global_step": 125441, "epoch": 746} {"train_loss": -9.682077407836914, "global_step": 125442, "epoch": 746} {"train_loss": -9.690775871276855, "global_step": 125443, "epoch": 746} {"train_loss": -10.032585144042969, "global_step": 125444, "epoch": 746} {"train_loss": -9.568735122680664, "global_step": 125445, "epoch": 746} {"train_loss": -10.176361083984375, "global_step": 125446, "epoch": 746} {"train_loss": -9.770879745483398, "global_step": 125447, "epoch": 746} {"train_loss": -9.862555503845215, "global_step": 125448, "epoch": 746} {"train_loss": -10.068605422973633, "global_step": 125449, "epoch": 746} {"train_loss": -10.003013610839844, "global_step": 125450, "epoch": 746} {"train_loss": -10.031606674194336, "global_step": 125451, "epoch": 746} {"train_loss": -9.881047248840332, "global_step": 125452, "epoch": 746} {"train_loss": -10.051593780517578, "global_step": 125453, "epoch": 746} {"train_loss": -9.937576293945312, "global_step": 125454, "epoch": 746} {"train_loss": -10.186848640441895, "global_step": 125455, "epoch": 746} {"train_loss": -10.250974655151367, "global_step": 125456, "epoch": 746} {"train_loss": -10.193342208862305, "global_step": 125457, "epoch": 746} {"train_loss": -9.866460800170898, "global_step": 125458, "epoch": 746} {"train_loss": -10.210518836975098, "global_step": 125459, "epoch": 746} {"train_loss": -10.031466484069824, "global_step": 125460, "epoch": 746} {"train_loss": -10.432348251342773, "global_step": 125461, "epoch": 746} {"train_loss": -10.23067855834961, "global_step": 125462, "epoch": 746} {"train_loss": -10.036853790283203, "global_step": 125463, "epoch": 746} {"train_loss": -9.901695251464844, "global_step": 125464, "epoch": 746} {"train_loss": -10.200363159179688, "global_step": 125465, "epoch": 746} {"train_loss": -10.039514541625977, "global_step": 125466, "epoch": 746} {"train_loss": -10.082659721374512, "global_step": 125467, "epoch": 746} {"train_loss": -9.903068542480469, "global_step": 125468, "epoch": 746} {"train_loss": -9.976318359375, "global_step": 125469, "epoch": 746} {"train_loss": -10.398550033569336, "global_step": 125470, "epoch": 746} {"train_loss": -10.12834358215332, "global_step": 125471, "epoch": 746} {"train_loss": -10.339238166809082, "global_step": 125472, "epoch": 746} {"train_loss": -10.020992279052734, "global_step": 125473, "epoch": 746} {"train_loss": -10.342937469482422, "global_step": 125474, "epoch": 746} {"train_loss": -10.230874061584473, "global_step": 125475, "epoch": 746} {"train_loss": -10.379613876342773, "global_step": 125476, "epoch": 746} {"train_loss": -10.301344871520996, "global_step": 125477, "epoch": 746} {"train_loss": -10.390050888061523, "global_step": 125478, "epoch": 746} {"train_loss": -10.338085174560547, "global_step": 125479, "epoch": 746} {"train_loss": -10.16358757019043, "global_step": 125480, "epoch": 746} {"train_loss": -10.162515640258789, "global_step": 125481, "epoch": 746} {"train_loss": -10.545478820800781, "global_step": 125482, "epoch": 746} {"train_loss": -10.304994583129883, "global_step": 125483, "epoch": 746} {"train_loss": -10.525705337524414, "global_step": 125484, "epoch": 746} {"train_loss": -10.364801406860352, "global_step": 125485, "epoch": 746} {"train_loss": -10.39266586303711, "global_step": 125486, "epoch": 746} {"train_loss": -10.460197448730469, "global_step": 125487, "epoch": 746} {"train_loss": -10.279622077941895, "global_step": 125488, "epoch": 746} {"train_loss": -10.59834098815918, "global_step": 125489, "epoch": 746} {"train_loss": -10.308804512023926, "global_step": 125490, "epoch": 746} {"train_loss": -10.26132869720459, "global_step": 125491, "epoch": 746} {"train_loss": -10.274513244628906, "global_step": 125492, "epoch": 746} {"train_loss": -10.315650939941406, "global_step": 125493, "epoch": 746} {"train_loss": -10.506731986999512, "global_step": 125494, "epoch": 746} {"train_loss": -10.1470140956697, "global_step": 125495, "epoch": 746, "val_loss": 217804.890625} {"train_loss": -10.184025764465332, "global_step": 125496, "epoch": 747} {"train_loss": -10.17367172241211, "global_step": 125497, "epoch": 747} {"train_loss": -10.236711502075195, "global_step": 125498, "epoch": 747} {"train_loss": -10.317924499511719, "global_step": 125499, "epoch": 747} {"train_loss": -10.41770076751709, "global_step": 125500, "epoch": 747} {"train_loss": -10.237611770629883, "global_step": 125501, "epoch": 747} {"train_loss": -9.802579879760742, "global_step": 125502, "epoch": 747} {"train_loss": -9.930227279663086, "global_step": 125503, "epoch": 747} {"train_loss": -9.565974235534668, "global_step": 125504, "epoch": 747} {"train_loss": -10.299310684204102, "global_step": 125505, "epoch": 747} {"train_loss": -9.741706848144531, "global_step": 125506, "epoch": 747} {"train_loss": -10.054941177368164, "global_step": 125507, "epoch": 747} {"train_loss": -9.384732246398926, "global_step": 125508, "epoch": 747} {"train_loss": -9.961758613586426, "global_step": 125509, "epoch": 747} {"train_loss": -10.103048324584961, "global_step": 125510, "epoch": 747} {"train_loss": -9.616415977478027, "global_step": 125511, "epoch": 747} {"train_loss": -9.968368530273438, "global_step": 125512, "epoch": 747} {"train_loss": -9.630683898925781, "global_step": 125513, "epoch": 747} {"train_loss": -10.113668441772461, "global_step": 125514, "epoch": 747} {"train_loss": -10.296634674072266, "global_step": 125515, "epoch": 747} {"train_loss": -10.035774230957031, "global_step": 125516, "epoch": 747} {"train_loss": -10.305967330932617, "global_step": 125517, "epoch": 747} {"train_loss": -10.415666580200195, "global_step": 125518, "epoch": 747} {"train_loss": -10.33144760131836, "global_step": 125519, "epoch": 747} {"train_loss": -10.063650131225586, "global_step": 125520, "epoch": 747} {"train_loss": -10.120556831359863, "global_step": 125521, "epoch": 747} {"train_loss": -10.274856567382812, "global_step": 125522, "epoch": 747} {"train_loss": -10.288751602172852, "global_step": 125523, "epoch": 747} {"train_loss": -10.390588760375977, "global_step": 125524, "epoch": 747} {"train_loss": -10.311172485351562, "global_step": 125525, "epoch": 747} {"train_loss": -10.14301872253418, "global_step": 125526, "epoch": 747} {"train_loss": -10.2246675491333, "global_step": 125527, "epoch": 747} {"train_loss": -10.123489379882812, "global_step": 125528, "epoch": 747} {"train_loss": -10.237601280212402, "global_step": 125529, "epoch": 747} {"train_loss": -10.49667739868164, "global_step": 125530, "epoch": 747} {"train_loss": -10.152283668518066, "global_step": 125531, "epoch": 747} {"train_loss": -10.239762306213379, "global_step": 125532, "epoch": 747} {"train_loss": -10.178323745727539, "global_step": 125533, "epoch": 747} {"train_loss": -10.35315227508545, "global_step": 125534, "epoch": 747} {"train_loss": -10.355958938598633, "global_step": 125535, "epoch": 747} {"train_loss": -10.466647148132324, "global_step": 125536, "epoch": 747} {"train_loss": -10.343560218811035, "global_step": 125537, "epoch": 747} {"train_loss": -10.430045127868652, "global_step": 125538, "epoch": 747} {"train_loss": -10.237567901611328, "global_step": 125539, "epoch": 747} {"train_loss": -10.50732421875, "global_step": 125540, "epoch": 747} {"train_loss": -10.323714256286621, "global_step": 125541, "epoch": 747} {"train_loss": -10.155200958251953, "global_step": 125542, "epoch": 747} {"train_loss": -10.245923042297363, "global_step": 125543, "epoch": 747} {"train_loss": -10.308904647827148, "global_step": 125544, "epoch": 747} {"train_loss": -10.3145170211792, "global_step": 125545, "epoch": 747} {"train_loss": -10.121091842651367, "global_step": 125546, "epoch": 747} {"train_loss": -10.513574600219727, "global_step": 125547, "epoch": 747} {"train_loss": -10.279751777648926, "global_step": 125548, "epoch": 747} {"train_loss": -10.262868881225586, "global_step": 125549, "epoch": 747} {"train_loss": -10.371821403503418, "global_step": 125550, "epoch": 747} {"train_loss": -10.080926895141602, "global_step": 125551, "epoch": 747} {"train_loss": -9.612345695495605, "global_step": 125552, "epoch": 747} {"train_loss": -10.292183876037598, "global_step": 125553, "epoch": 747} {"train_loss": -10.102424621582031, "global_step": 125554, "epoch": 747} {"train_loss": -10.228076934814453, "global_step": 125555, "epoch": 747} {"train_loss": -10.297025680541992, "global_step": 125556, "epoch": 747} {"train_loss": -9.880897521972656, "global_step": 125557, "epoch": 747} {"train_loss": -10.411105155944824, "global_step": 125558, "epoch": 747} {"train_loss": -10.080455780029297, "global_step": 125559, "epoch": 747} {"train_loss": -10.23330020904541, "global_step": 125560, "epoch": 747} {"train_loss": -10.060272216796875, "global_step": 125561, "epoch": 747} {"train_loss": -10.320516586303711, "global_step": 125562, "epoch": 747} {"train_loss": -10.409432411193848, "global_step": 125563, "epoch": 747} {"train_loss": -10.476457595825195, "global_step": 125564, "epoch": 747} {"train_loss": -10.354381561279297, "global_step": 125565, "epoch": 747} {"train_loss": -10.125664710998535, "global_step": 125566, "epoch": 747} {"train_loss": -10.259963989257812, "global_step": 125567, "epoch": 747} {"train_loss": -10.274652481079102, "global_step": 125568, "epoch": 747} {"train_loss": -10.50745677947998, "global_step": 125569, "epoch": 747} {"train_loss": -10.3740234375, "global_step": 125570, "epoch": 747} {"train_loss": -10.487903594970703, "global_step": 125571, "epoch": 747} {"train_loss": -10.370580673217773, "global_step": 125572, "epoch": 747} {"train_loss": -10.318009376525879, "global_step": 125573, "epoch": 747} {"train_loss": -10.31234359741211, "global_step": 125574, "epoch": 747} {"train_loss": -10.560323715209961, "global_step": 125575, "epoch": 747} {"train_loss": -10.498125076293945, "global_step": 125576, "epoch": 747} {"train_loss": -10.176033973693848, "global_step": 125577, "epoch": 747} {"train_loss": -10.33432388305664, "global_step": 125578, "epoch": 747} {"train_loss": -10.244074821472168, "global_step": 125579, "epoch": 747} {"train_loss": -9.999885559082031, "global_step": 125580, "epoch": 747} {"train_loss": -10.486532211303711, "global_step": 125581, "epoch": 747} {"train_loss": -9.820734024047852, "global_step": 125582, "epoch": 747} {"train_loss": -10.334299087524414, "global_step": 125583, "epoch": 747} {"train_loss": -10.110539436340332, "global_step": 125584, "epoch": 747} {"train_loss": -9.986306190490723, "global_step": 125585, "epoch": 747} {"train_loss": -10.309950828552246, "global_step": 125586, "epoch": 747} {"train_loss": -9.93043327331543, "global_step": 125587, "epoch": 747} {"train_loss": -10.105743408203125, "global_step": 125588, "epoch": 747} {"train_loss": -9.788375854492188, "global_step": 125589, "epoch": 747} {"train_loss": -10.033748626708984, "global_step": 125590, "epoch": 747} {"train_loss": -9.896373748779297, "global_step": 125591, "epoch": 747} {"train_loss": -10.318052291870117, "global_step": 125592, "epoch": 747} {"train_loss": -9.535139083862305, "global_step": 125593, "epoch": 747} {"train_loss": -10.590616226196289, "global_step": 125594, "epoch": 747} {"train_loss": -9.752864837646484, "global_step": 125595, "epoch": 747} {"train_loss": -10.296826362609863, "global_step": 125596, "epoch": 747} {"train_loss": -9.947559356689453, "global_step": 125597, "epoch": 747} {"train_loss": -10.185188293457031, "global_step": 125598, "epoch": 747} {"train_loss": -10.241039276123047, "global_step": 125599, "epoch": 747} {"train_loss": -10.356719970703125, "global_step": 125600, "epoch": 747} {"train_loss": -10.224078178405762, "global_step": 125601, "epoch": 747} {"train_loss": -10.342167854309082, "global_step": 125602, "epoch": 747} {"train_loss": -9.936440467834473, "global_step": 125603, "epoch": 747} {"train_loss": -10.328022956848145, "global_step": 125604, "epoch": 747} {"train_loss": -10.263164520263672, "global_step": 125605, "epoch": 747} {"train_loss": -10.15070915222168, "global_step": 125606, "epoch": 747} {"train_loss": -10.183542251586914, "global_step": 125607, "epoch": 747} {"train_loss": -10.07537841796875, "global_step": 125608, "epoch": 747} {"train_loss": -10.611384391784668, "global_step": 125609, "epoch": 747} {"train_loss": -10.34184455871582, "global_step": 125610, "epoch": 747} {"train_loss": -10.280374526977539, "global_step": 125611, "epoch": 747} {"train_loss": -10.223492622375488, "global_step": 125612, "epoch": 747} {"train_loss": -10.144819259643555, "global_step": 125613, "epoch": 747} {"train_loss": -10.439726829528809, "global_step": 125614, "epoch": 747} {"train_loss": -10.11032772064209, "global_step": 125615, "epoch": 747} {"train_loss": -10.16525936126709, "global_step": 125616, "epoch": 747} {"train_loss": -10.097156524658203, "global_step": 125617, "epoch": 747} {"train_loss": -10.360087394714355, "global_step": 125618, "epoch": 747} {"train_loss": -10.29102897644043, "global_step": 125619, "epoch": 747} {"train_loss": -10.403005599975586, "global_step": 125620, "epoch": 747} {"train_loss": -10.224907875061035, "global_step": 125621, "epoch": 747} {"train_loss": -10.304475784301758, "global_step": 125622, "epoch": 747} {"train_loss": -10.272860527038574, "global_step": 125623, "epoch": 747} {"train_loss": -10.260676383972168, "global_step": 125624, "epoch": 747} {"train_loss": -10.48593521118164, "global_step": 125625, "epoch": 747} {"train_loss": -10.15542984008789, "global_step": 125626, "epoch": 747} {"train_loss": -10.393224716186523, "global_step": 125627, "epoch": 747} {"train_loss": -9.817253112792969, "global_step": 125628, "epoch": 747} {"train_loss": -10.578916549682617, "global_step": 125629, "epoch": 747} {"train_loss": -10.139742851257324, "global_step": 125630, "epoch": 747} {"train_loss": -10.279108047485352, "global_step": 125631, "epoch": 747} {"train_loss": -10.600936889648438, "global_step": 125632, "epoch": 747} {"train_loss": -10.148893356323242, "global_step": 125633, "epoch": 747} {"train_loss": -10.470105171203613, "global_step": 125634, "epoch": 747} {"train_loss": -10.239569664001465, "global_step": 125635, "epoch": 747} {"train_loss": -10.259964942932129, "global_step": 125636, "epoch": 747} {"train_loss": -10.27885913848877, "global_step": 125637, "epoch": 747} {"train_loss": -10.449932098388672, "global_step": 125638, "epoch": 747} {"train_loss": -10.215628623962402, "global_step": 125639, "epoch": 747} {"train_loss": -10.699373245239258, "global_step": 125640, "epoch": 747} {"train_loss": -10.222843170166016, "global_step": 125641, "epoch": 747} {"train_loss": -10.249387741088867, "global_step": 125642, "epoch": 747} {"train_loss": -10.452202796936035, "global_step": 125643, "epoch": 747} {"train_loss": -9.919275283813477, "global_step": 125644, "epoch": 747} {"train_loss": -10.343681335449219, "global_step": 125645, "epoch": 747} {"train_loss": -9.968486785888672, "global_step": 125646, "epoch": 747} {"train_loss": -10.367477416992188, "global_step": 125647, "epoch": 747} {"train_loss": -10.354694366455078, "global_step": 125648, "epoch": 747} {"train_loss": -9.88252067565918, "global_step": 125649, "epoch": 747} {"train_loss": -10.409490585327148, "global_step": 125650, "epoch": 747} {"train_loss": -10.026787757873535, "global_step": 125651, "epoch": 747} {"train_loss": -9.959207534790039, "global_step": 125652, "epoch": 747} {"train_loss": -10.361833572387695, "global_step": 125653, "epoch": 747} {"train_loss": -9.675443649291992, "global_step": 125654, "epoch": 747} {"train_loss": -10.252102851867676, "global_step": 125655, "epoch": 747} {"train_loss": -9.869184494018555, "global_step": 125656, "epoch": 747} {"train_loss": -10.130971908569336, "global_step": 125657, "epoch": 747} {"train_loss": -10.194469451904297, "global_step": 125658, "epoch": 747} {"train_loss": -9.684246063232422, "global_step": 125659, "epoch": 747} {"train_loss": -9.429372787475586, "global_step": 125660, "epoch": 747} {"train_loss": -10.228290557861328, "global_step": 125661, "epoch": 747} {"train_loss": -9.169622421264648, "global_step": 125662, "epoch": 747} {"train_loss": -10.193435260227748, "global_step": 125663, "epoch": 747, "val_loss": 218109.984375} {"train_loss": -9.790159225463867, "global_step": 125664, "epoch": 748} {"train_loss": -9.754579544067383, "global_step": 125665, "epoch": 748} {"train_loss": -10.107599258422852, "global_step": 125666, "epoch": 748} {"train_loss": -9.908130645751953, "global_step": 125667, "epoch": 748} {"train_loss": -10.348760604858398, "global_step": 125668, "epoch": 748} {"train_loss": -10.218717575073242, "global_step": 125669, "epoch": 748} {"train_loss": -10.05360221862793, "global_step": 125670, "epoch": 748} {"train_loss": -9.953657150268555, "global_step": 125671, "epoch": 748} {"train_loss": -10.424436569213867, "global_step": 125672, "epoch": 748} {"train_loss": -9.987969398498535, "global_step": 125673, "epoch": 748} {"train_loss": -10.472002029418945, "global_step": 125674, "epoch": 748} {"train_loss": -10.126424789428711, "global_step": 125675, "epoch": 748} {"train_loss": -10.037530899047852, "global_step": 125676, "epoch": 748} {"train_loss": -10.211163520812988, "global_step": 125677, "epoch": 748} {"train_loss": -10.287752151489258, "global_step": 125678, "epoch": 748} {"train_loss": -10.257343292236328, "global_step": 125679, "epoch": 748} {"train_loss": -10.346871376037598, "global_step": 125680, "epoch": 748} {"train_loss": -10.093372344970703, "global_step": 125681, "epoch": 748} {"train_loss": -10.262256622314453, "global_step": 125682, "epoch": 748} {"train_loss": -10.32297134399414, "global_step": 125683, "epoch": 748} {"train_loss": -10.437154769897461, "global_step": 125684, "epoch": 748} {"train_loss": -10.32205581665039, "global_step": 125685, "epoch": 748} {"train_loss": -10.422916412353516, "global_step": 125686, "epoch": 748} {"train_loss": -10.203132629394531, "global_step": 125687, "epoch": 748} {"train_loss": -10.502676010131836, "global_step": 125688, "epoch": 748} {"train_loss": -10.514486312866211, "global_step": 125689, "epoch": 748} {"train_loss": -10.290913581848145, "global_step": 125690, "epoch": 748} {"train_loss": -10.45635986328125, "global_step": 125691, "epoch": 748} {"train_loss": -10.379484176635742, "global_step": 125692, "epoch": 748} {"train_loss": -10.548577308654785, "global_step": 125693, "epoch": 748} {"train_loss": -10.531484603881836, "global_step": 125694, "epoch": 748} {"train_loss": -10.648287773132324, "global_step": 125695, "epoch": 748} {"train_loss": -10.384195327758789, "global_step": 125696, "epoch": 748} {"train_loss": -10.562313079833984, "global_step": 125697, "epoch": 748} {"train_loss": -10.579761505126953, "global_step": 125698, "epoch": 748} {"train_loss": -10.688970565795898, "global_step": 125699, "epoch": 748} {"train_loss": -10.376062393188477, "global_step": 125700, "epoch": 748} {"train_loss": -10.311470985412598, "global_step": 125701, "epoch": 748} {"train_loss": -10.172225952148438, "global_step": 125702, "epoch": 748} {"train_loss": -10.229667663574219, "global_step": 125703, "epoch": 748} {"train_loss": -10.307378768920898, "global_step": 125704, "epoch": 748} {"train_loss": -10.256919860839844, "global_step": 125705, "epoch": 748} {"train_loss": -10.215766906738281, "global_step": 125706, "epoch": 748} {"train_loss": -10.377557754516602, "global_step": 125707, "epoch": 748} {"train_loss": -9.792747497558594, "global_step": 125708, "epoch": 748} {"train_loss": -9.095186233520508, "global_step": 125709, "epoch": 748} {"train_loss": -9.739791870117188, "global_step": 125710, "epoch": 748} {"train_loss": -7.94774866104126, "global_step": 125711, "epoch": 748} {"train_loss": -9.778426170349121, "global_step": 125712, "epoch": 748} {"train_loss": -7.924037933349609, "global_step": 125713, "epoch": 748} {"train_loss": -10.102587699890137, "global_step": 125714, "epoch": 748} {"train_loss": -7.868862152099609, "global_step": 125715, "epoch": 748} {"train_loss": -8.388570785522461, "global_step": 125716, "epoch": 748} {"train_loss": -8.868577003479004, "global_step": 125717, "epoch": 748} {"train_loss": -9.233728408813477, "global_step": 125718, "epoch": 748} {"train_loss": -8.676911354064941, "global_step": 125719, "epoch": 748} {"train_loss": -8.431453704833984, "global_step": 125720, "epoch": 748} {"train_loss": -9.074871063232422, "global_step": 125721, "epoch": 748} {"train_loss": -9.620855331420898, "global_step": 125722, "epoch": 748} {"train_loss": -8.724000930786133, "global_step": 125723, "epoch": 748} {"train_loss": -9.643220901489258, "global_step": 125724, "epoch": 748} {"train_loss": -9.552977561950684, "global_step": 125725, "epoch": 748} {"train_loss": -9.729290962219238, "global_step": 125726, "epoch": 748} {"train_loss": -9.40826416015625, "global_step": 125727, "epoch": 748} {"train_loss": -9.75333023071289, "global_step": 125728, "epoch": 748} {"train_loss": -9.910421371459961, "global_step": 125729, "epoch": 748} {"train_loss": -9.697178840637207, "global_step": 125730, "epoch": 748} {"train_loss": -9.458422660827637, "global_step": 125731, "epoch": 748} {"train_loss": -9.9197359085083, "global_step": 125732, "epoch": 748} {"train_loss": -9.865285873413086, "global_step": 125733, "epoch": 748} {"train_loss": -9.929339408874512, "global_step": 125734, "epoch": 748} {"train_loss": -9.681304931640625, "global_step": 125735, "epoch": 748} {"train_loss": -9.974966049194336, "global_step": 125736, "epoch": 748} {"train_loss": -9.777920722961426, "global_step": 125737, "epoch": 748} {"train_loss": -9.862459182739258, "global_step": 125738, "epoch": 748} {"train_loss": -9.762943267822266, "global_step": 125739, "epoch": 748} {"train_loss": -9.874948501586914, "global_step": 125740, "epoch": 748} {"train_loss": -10.045305252075195, "global_step": 125741, "epoch": 748} {"train_loss": -10.09428882598877, "global_step": 125742, "epoch": 748} {"train_loss": -9.891233444213867, "global_step": 125743, "epoch": 748} {"train_loss": -10.077431678771973, "global_step": 125744, "epoch": 748} {"train_loss": -10.19433879852295, "global_step": 125745, "epoch": 748} {"train_loss": -9.68870735168457, "global_step": 125746, "epoch": 748} {"train_loss": -10.040811538696289, "global_step": 125747, "epoch": 748} {"train_loss": -10.244409561157227, "global_step": 125748, "epoch": 748} {"train_loss": -10.063901901245117, "global_step": 125749, "epoch": 748} {"train_loss": -10.284286499023438, "global_step": 125750, "epoch": 748} {"train_loss": -10.101705551147461, "global_step": 125751, "epoch": 748} {"train_loss": -10.210915565490723, "global_step": 125752, "epoch": 748} {"train_loss": -10.127633094787598, "global_step": 125753, "epoch": 748} {"train_loss": -10.3287353515625, "global_step": 125754, "epoch": 748} {"train_loss": -10.314794540405273, "global_step": 125755, "epoch": 748} {"train_loss": -10.335601806640625, "global_step": 125756, "epoch": 748} {"train_loss": -10.304924011230469, "global_step": 125757, "epoch": 748} {"train_loss": -10.432576179504395, "global_step": 125758, "epoch": 748} {"train_loss": -10.38626480102539, "global_step": 125759, "epoch": 748} {"train_loss": -10.632804870605469, "global_step": 125760, "epoch": 748} {"train_loss": -10.40477466583252, "global_step": 125761, "epoch": 748} {"train_loss": -10.474586486816406, "global_step": 125762, "epoch": 748} {"train_loss": -10.170469284057617, "global_step": 125763, "epoch": 748} {"train_loss": -10.385354995727539, "global_step": 125764, "epoch": 748} {"train_loss": -10.435462951660156, "global_step": 125765, "epoch": 748} {"train_loss": -10.557291984558105, "global_step": 125766, "epoch": 748} {"train_loss": -10.667840003967285, "global_step": 125767, "epoch": 748} {"train_loss": -10.609613418579102, "global_step": 125768, "epoch": 748} {"train_loss": -10.699808120727539, "global_step": 125769, "epoch": 748} {"train_loss": -10.252628326416016, "global_step": 125770, "epoch": 748} {"train_loss": -10.457090377807617, "global_step": 125771, "epoch": 748} {"train_loss": -10.396970748901367, "global_step": 125772, "epoch": 748} {"train_loss": -10.574824333190918, "global_step": 125773, "epoch": 748} {"train_loss": -10.38242244720459, "global_step": 125774, "epoch": 748} {"train_loss": -9.953218460083008, "global_step": 125775, "epoch": 748} {"train_loss": -10.215616226196289, "global_step": 125776, "epoch": 748} {"train_loss": -10.088167190551758, "global_step": 125777, "epoch": 748} {"train_loss": -10.390851974487305, "global_step": 125778, "epoch": 748} {"train_loss": -9.736568450927734, "global_step": 125779, "epoch": 748} {"train_loss": -10.171789169311523, "global_step": 125780, "epoch": 748} {"train_loss": -10.286005020141602, "global_step": 125781, "epoch": 748} {"train_loss": -10.101844787597656, "global_step": 125782, "epoch": 748} {"train_loss": -9.169445037841797, "global_step": 125783, "epoch": 748} {"train_loss": -8.64102554321289, "global_step": 125784, "epoch": 748} {"train_loss": -9.012311935424805, "global_step": 125785, "epoch": 748} {"train_loss": -10.34975814819336, "global_step": 125786, "epoch": 748} {"train_loss": -9.488531112670898, "global_step": 125787, "epoch": 748} {"train_loss": -9.451308250427246, "global_step": 125788, "epoch": 748} {"train_loss": -10.187070846557617, "global_step": 125789, "epoch": 748} {"train_loss": -9.325380325317383, "global_step": 125790, "epoch": 748} {"train_loss": -9.852239608764648, "global_step": 125791, "epoch": 748} {"train_loss": -9.760082244873047, "global_step": 125792, "epoch": 748} {"train_loss": -10.055471420288086, "global_step": 125793, "epoch": 748} {"train_loss": -10.020868301391602, "global_step": 125794, "epoch": 748} {"train_loss": -9.94260025024414, "global_step": 125795, "epoch": 748} {"train_loss": -10.26754379272461, "global_step": 125796, "epoch": 748} {"train_loss": -9.969999313354492, "global_step": 125797, "epoch": 748} {"train_loss": -9.742767333984375, "global_step": 125798, "epoch": 748} {"train_loss": -10.224400520324707, "global_step": 125799, "epoch": 748} {"train_loss": -10.203226089477539, "global_step": 125800, "epoch": 748} {"train_loss": -10.024007797241211, "global_step": 125801, "epoch": 748} {"train_loss": -10.397714614868164, "global_step": 125802, "epoch": 748} {"train_loss": -10.172943115234375, "global_step": 125803, "epoch": 748} {"train_loss": -10.221277236938477, "global_step": 125804, "epoch": 748} {"train_loss": -10.233485221862793, "global_step": 125805, "epoch": 748} {"train_loss": -10.381729125976562, "global_step": 125806, "epoch": 748} {"train_loss": -9.926958084106445, "global_step": 125807, "epoch": 748} {"train_loss": -10.42652702331543, "global_step": 125808, "epoch": 748} {"train_loss": -10.139512062072754, "global_step": 125809, "epoch": 748} {"train_loss": -10.051189422607422, "global_step": 125810, "epoch": 748} {"train_loss": -10.238283157348633, "global_step": 125811, "epoch": 748} {"train_loss": -10.18531608581543, "global_step": 125812, "epoch": 748} {"train_loss": -10.068626403808594, "global_step": 125813, "epoch": 748} {"train_loss": -9.817159652709961, "global_step": 125814, "epoch": 748} {"train_loss": -10.2478666305542, "global_step": 125815, "epoch": 748} {"train_loss": -10.062555313110352, "global_step": 125816, "epoch": 748} {"train_loss": -10.260123252868652, "global_step": 125817, "epoch": 748} {"train_loss": -9.880609512329102, "global_step": 125818, "epoch": 748} {"train_loss": -10.41732120513916, "global_step": 125819, "epoch": 748} {"train_loss": -9.858526229858398, "global_step": 125820, "epoch": 748} {"train_loss": -10.451000213623047, "global_step": 125821, "epoch": 748} {"train_loss": -9.973306655883789, "global_step": 125822, "epoch": 748} {"train_loss": -10.424890518188477, "global_step": 125823, "epoch": 748} {"train_loss": -9.989624977111816, "global_step": 125824, "epoch": 748} {"train_loss": -10.19613265991211, "global_step": 125825, "epoch": 748} {"train_loss": -9.831491470336914, "global_step": 125826, "epoch": 748} {"train_loss": -10.287656784057617, "global_step": 125827, "epoch": 748} {"train_loss": -10.18931770324707, "global_step": 125828, "epoch": 748} {"train_loss": -10.202098846435547, "global_step": 125829, "epoch": 748} {"train_loss": -10.170097351074219, "global_step": 125830, "epoch": 748} {"train_loss": -10.021076352823348, "global_step": 125831, "epoch": 748, "val_loss": 215247.34375} {"train_loss": -9.862493515014648, "global_step": 125832, "epoch": 749} {"train_loss": -10.313735961914062, "global_step": 125833, "epoch": 749} {"train_loss": -9.640807151794434, "global_step": 125834, "epoch": 749} {"train_loss": -10.406318664550781, "global_step": 125835, "epoch": 749} {"train_loss": -9.859352111816406, "global_step": 125836, "epoch": 749} {"train_loss": -9.904058456420898, "global_step": 125837, "epoch": 749} {"train_loss": -9.490964889526367, "global_step": 125838, "epoch": 749} {"train_loss": -10.040471076965332, "global_step": 125839, "epoch": 749} {"train_loss": -9.766746520996094, "global_step": 125840, "epoch": 749} {"train_loss": -10.092193603515625, "global_step": 125841, "epoch": 749} {"train_loss": -9.68386173248291, "global_step": 125842, "epoch": 749} {"train_loss": -10.024591445922852, "global_step": 125843, "epoch": 749} {"train_loss": -10.011167526245117, "global_step": 125844, "epoch": 749} {"train_loss": -9.582555770874023, "global_step": 125845, "epoch": 749} {"train_loss": -10.421043395996094, "global_step": 125846, "epoch": 749} {"train_loss": -9.112049102783203, "global_step": 125847, "epoch": 749} {"train_loss": -10.220754623413086, "global_step": 125848, "epoch": 749} {"train_loss": -9.59019660949707, "global_step": 125849, "epoch": 749} {"train_loss": -9.953765869140625, "global_step": 125850, "epoch": 749} {"train_loss": -9.931379318237305, "global_step": 125851, "epoch": 749} {"train_loss": -10.189655303955078, "global_step": 125852, "epoch": 749} {"train_loss": -10.279718399047852, "global_step": 125853, "epoch": 749} {"train_loss": -9.711462020874023, "global_step": 125854, "epoch": 749} {"train_loss": -10.381895065307617, "global_step": 125855, "epoch": 749} {"train_loss": -10.156621932983398, "global_step": 125856, "epoch": 749} {"train_loss": -9.829679489135742, "global_step": 125857, "epoch": 749} {"train_loss": -10.420377731323242, "global_step": 125858, "epoch": 749} {"train_loss": -10.034387588500977, "global_step": 125859, "epoch": 749} {"train_loss": -10.176546096801758, "global_step": 125860, "epoch": 749} {"train_loss": -10.19667911529541, "global_step": 125861, "epoch": 749} {"train_loss": -10.189449310302734, "global_step": 125862, "epoch": 749} {"train_loss": -9.85378646850586, "global_step": 125863, "epoch": 749} {"train_loss": -10.063617706298828, "global_step": 125864, "epoch": 749} {"train_loss": -10.336676597595215, "global_step": 125865, "epoch": 749} {"train_loss": -10.091075897216797, "global_step": 125866, "epoch": 749} {"train_loss": -10.164582252502441, "global_step": 125867, "epoch": 749} {"train_loss": -10.387253761291504, "global_step": 125868, "epoch": 749} {"train_loss": -10.416993141174316, "global_step": 125869, "epoch": 749} {"train_loss": -10.321819305419922, "global_step": 125870, "epoch": 749} {"train_loss": -10.432939529418945, "global_step": 125871, "epoch": 749} {"train_loss": -10.605260848999023, "global_step": 125872, "epoch": 749} {"train_loss": -10.421001434326172, "global_step": 125873, "epoch": 749} {"train_loss": -10.52065658569336, "global_step": 125874, "epoch": 749} {"train_loss": -10.566156387329102, "global_step": 125875, "epoch": 749} {"train_loss": -10.426212310791016, "global_step": 125876, "epoch": 749} {"train_loss": -10.54393482208252, "global_step": 125877, "epoch": 749} {"train_loss": -10.517176628112793, "global_step": 125878, "epoch": 749} {"train_loss": -10.64512825012207, "global_step": 125879, "epoch": 749} {"train_loss": -10.416756629943848, "global_step": 125880, "epoch": 749} {"train_loss": -10.535136222839355, "global_step": 125881, "epoch": 749} {"train_loss": -10.588469505310059, "global_step": 125882, "epoch": 749} {"train_loss": -10.557941436767578, "global_step": 125883, "epoch": 749} {"train_loss": -10.60074234008789, "global_step": 125884, "epoch": 749} {"train_loss": -10.686870574951172, "global_step": 125885, "epoch": 749} {"train_loss": -10.415243148803711, "global_step": 125886, "epoch": 749} {"train_loss": -10.399432182312012, "global_step": 125887, "epoch": 749} {"train_loss": -10.37372875213623, "global_step": 125888, "epoch": 749} {"train_loss": -10.413110733032227, "global_step": 125889, "epoch": 749} {"train_loss": -10.693582534790039, "global_step": 125890, "epoch": 749} {"train_loss": -10.255401611328125, "global_step": 125891, "epoch": 749} {"train_loss": -9.972238540649414, "global_step": 125892, "epoch": 749} {"train_loss": -10.091904640197754, "global_step": 125893, "epoch": 749} {"train_loss": -10.515527725219727, "global_step": 125894, "epoch": 749} {"train_loss": -10.066570281982422, "global_step": 125895, "epoch": 749} {"train_loss": -10.307124137878418, "global_step": 125896, "epoch": 749} {"train_loss": -10.332817077636719, "global_step": 125897, "epoch": 749} {"train_loss": -10.536788940429688, "global_step": 125898, "epoch": 749} {"train_loss": -10.169209480285645, "global_step": 125899, "epoch": 749} {"train_loss": -10.623880386352539, "global_step": 125900, "epoch": 749} {"train_loss": -10.572739601135254, "global_step": 125901, "epoch": 749} {"train_loss": -10.127765655517578, "global_step": 125902, "epoch": 749} {"train_loss": -10.247591018676758, "global_step": 125903, "epoch": 749} {"train_loss": -9.999460220336914, "global_step": 125904, "epoch": 749} {"train_loss": -10.615458488464355, "global_step": 125905, "epoch": 749} {"train_loss": -10.357686996459961, "global_step": 125906, "epoch": 749} {"train_loss": -9.638457298278809, "global_step": 125907, "epoch": 749} {"train_loss": -10.34212875366211, "global_step": 125908, "epoch": 749} {"train_loss": -9.945192337036133, "global_step": 125909, "epoch": 749} {"train_loss": -9.16301155090332, "global_step": 125910, "epoch": 749} {"train_loss": -10.01605224609375, "global_step": 125911, "epoch": 749} {"train_loss": -8.766600608825684, "global_step": 125912, "epoch": 749} {"train_loss": -10.191819190979004, "global_step": 125913, "epoch": 749} {"train_loss": -9.506078720092773, "global_step": 125914, "epoch": 749} {"train_loss": -9.813892364501953, "global_step": 125915, "epoch": 749} {"train_loss": -10.020750045776367, "global_step": 125916, "epoch": 749} {"train_loss": -10.284303665161133, "global_step": 125917, "epoch": 749} {"train_loss": -10.040373802185059, "global_step": 125918, "epoch": 749} {"train_loss": -10.191449165344238, "global_step": 125919, "epoch": 749} {"train_loss": -9.760919570922852, "global_step": 125920, "epoch": 749} {"train_loss": -9.80726146697998, "global_step": 125921, "epoch": 749} {"train_loss": -10.347414016723633, "global_step": 125922, "epoch": 749} {"train_loss": -10.016552925109863, "global_step": 125923, "epoch": 749} {"train_loss": -10.180182456970215, "global_step": 125924, "epoch": 749} {"train_loss": -10.088501930236816, "global_step": 125925, "epoch": 749} {"train_loss": -9.97743034362793, "global_step": 125926, "epoch": 749} {"train_loss": -10.457304000854492, "global_step": 125927, "epoch": 749} {"train_loss": -10.121628761291504, "global_step": 125928, "epoch": 749} {"train_loss": -10.068145751953125, "global_step": 125929, "epoch": 749} {"train_loss": -10.195001602172852, "global_step": 125930, "epoch": 749} {"train_loss": -10.233078956604004, "global_step": 125931, "epoch": 749} {"train_loss": -10.32199764251709, "global_step": 125932, "epoch": 749} {"train_loss": -10.064188003540039, "global_step": 125933, "epoch": 749} {"train_loss": -10.39228630065918, "global_step": 125934, "epoch": 749} {"train_loss": -10.3173246383667, "global_step": 125935, "epoch": 749} {"train_loss": -10.200502395629883, "global_step": 125936, "epoch": 749} {"train_loss": -10.243080139160156, "global_step": 125937, "epoch": 749} {"train_loss": -10.49453067779541, "global_step": 125938, "epoch": 749} {"train_loss": -10.323596000671387, "global_step": 125939, "epoch": 749} {"train_loss": -10.306138038635254, "global_step": 125940, "epoch": 749} {"train_loss": -10.100946426391602, "global_step": 125941, "epoch": 749} {"train_loss": -10.07998275756836, "global_step": 125942, "epoch": 749} {"train_loss": -10.53442096710205, "global_step": 125943, "epoch": 749} {"train_loss": -10.384982109069824, "global_step": 125944, "epoch": 749} {"train_loss": -10.110583305358887, "global_step": 125945, "epoch": 749} {"train_loss": -10.375195503234863, "global_step": 125946, "epoch": 749} {"train_loss": -10.173377990722656, "global_step": 125947, "epoch": 749} {"train_loss": -10.340845108032227, "global_step": 125948, "epoch": 749} {"train_loss": -10.447222709655762, "global_step": 125949, "epoch": 749} {"train_loss": -10.10555362701416, "global_step": 125950, "epoch": 749} {"train_loss": -10.47708797454834, "global_step": 125951, "epoch": 749} {"train_loss": -10.432114601135254, "global_step": 125952, "epoch": 749} {"train_loss": -10.22891616821289, "global_step": 125953, "epoch": 749} {"train_loss": -10.469244956970215, "global_step": 125954, "epoch": 749} {"train_loss": -10.531829833984375, "global_step": 125955, "epoch": 749} {"train_loss": -10.193746566772461, "global_step": 125956, "epoch": 749} {"train_loss": -10.357599258422852, "global_step": 125957, "epoch": 749} {"train_loss": -10.341111183166504, "global_step": 125958, "epoch": 749} {"train_loss": -10.472990036010742, "global_step": 125959, "epoch": 749} {"train_loss": -10.248856544494629, "global_step": 125960, "epoch": 749} {"train_loss": -10.197672843933105, "global_step": 125961, "epoch": 749} {"train_loss": -10.210189819335938, "global_step": 125962, "epoch": 749} {"train_loss": -10.249211311340332, "global_step": 125963, "epoch": 749} {"train_loss": -10.088235855102539, "global_step": 125964, "epoch": 749} {"train_loss": -10.41458511352539, "global_step": 125965, "epoch": 749} {"train_loss": -10.133261680603027, "global_step": 125966, "epoch": 749} {"train_loss": -10.041074752807617, "global_step": 125967, "epoch": 749} {"train_loss": -10.742815971374512, "global_step": 125968, "epoch": 749} {"train_loss": -9.871989250183105, "global_step": 125969, "epoch": 749} {"train_loss": -10.407039642333984, "global_step": 125970, "epoch": 749} {"train_loss": -10.142068862915039, "global_step": 125971, "epoch": 749} {"train_loss": -9.994741439819336, "global_step": 125972, "epoch": 749} {"train_loss": -10.515531539916992, "global_step": 125973, "epoch": 749} {"train_loss": -9.763116836547852, "global_step": 125974, "epoch": 749} {"train_loss": -9.936392784118652, "global_step": 125975, "epoch": 749} {"train_loss": -9.697835922241211, "global_step": 125976, "epoch": 749} {"train_loss": -9.760343551635742, "global_step": 125977, "epoch": 749} {"train_loss": -10.290115356445312, "global_step": 125978, "epoch": 749} {"train_loss": -9.987530708312988, "global_step": 125979, "epoch": 749} {"train_loss": -10.134668350219727, "global_step": 125980, "epoch": 749} {"train_loss": -10.075654983520508, "global_step": 125981, "epoch": 749} {"train_loss": -10.305022239685059, "global_step": 125982, "epoch": 749} {"train_loss": -9.948460578918457, "global_step": 125983, "epoch": 749} {"train_loss": -10.060144424438477, "global_step": 125984, "epoch": 749} {"train_loss": -10.14339828491211, "global_step": 125985, "epoch": 749} {"train_loss": -9.612835884094238, "global_step": 125986, "epoch": 749} {"train_loss": -10.140033721923828, "global_step": 125987, "epoch": 749} {"train_loss": -9.637907028198242, "global_step": 125988, "epoch": 749} {"train_loss": -10.306467056274414, "global_step": 125989, "epoch": 749} {"train_loss": -10.112838745117188, "global_step": 125990, "epoch": 749} {"train_loss": -10.0406494140625, "global_step": 125991, "epoch": 749} {"train_loss": -10.311659812927246, "global_step": 125992, "epoch": 749} {"train_loss": -9.99184799194336, "global_step": 125993, "epoch": 749} {"train_loss": -10.028585433959961, "global_step": 125994, "epoch": 749} {"train_loss": -10.227601051330566, "global_step": 125995, "epoch": 749} {"train_loss": -10.414314270019531, "global_step": 125996, "epoch": 749} {"train_loss": -10.187302589416504, "global_step": 125997, "epoch": 749} {"train_loss": -10.384654998779297, "global_step": 125998, "epoch": 749} {"train_loss": -10.173266853604998, "global_step": 125999, "epoch": 749, "val_loss": 217208.375} {"train_loss": -10.261591911315918, "global_step": 126000, "epoch": 750} {"train_loss": -9.768421173095703, "global_step": 126001, "epoch": 750} {"train_loss": -9.855386734008789, "global_step": 126002, "epoch": 750} {"train_loss": -9.815494537353516, "global_step": 126003, "epoch": 750} {"train_loss": -10.049029350280762, "global_step": 126004, "epoch": 750} {"train_loss": -9.724328994750977, "global_step": 126005, "epoch": 750} {"train_loss": -10.399188995361328, "global_step": 126006, "epoch": 750} {"train_loss": -9.653474807739258, "global_step": 126007, "epoch": 750} {"train_loss": -10.231741905212402, "global_step": 126008, "epoch": 750} {"train_loss": -10.087029457092285, "global_step": 126009, "epoch": 750} {"train_loss": -10.394874572753906, "global_step": 126010, "epoch": 750} {"train_loss": -10.169389724731445, "global_step": 126011, "epoch": 750} {"train_loss": -10.121402740478516, "global_step": 126012, "epoch": 750} {"train_loss": -10.258440017700195, "global_step": 126013, "epoch": 750} {"train_loss": -10.089723587036133, "global_step": 126014, "epoch": 750} {"train_loss": -9.81786823272705, "global_step": 126015, "epoch": 750} {"train_loss": -10.395751953125, "global_step": 126016, "epoch": 750} {"train_loss": -9.990795135498047, "global_step": 126017, "epoch": 750} {"train_loss": -10.28270149230957, "global_step": 126018, "epoch": 750} {"train_loss": -9.932315826416016, "global_step": 126019, "epoch": 750} {"train_loss": -10.240781784057617, "global_step": 126020, "epoch": 750} {"train_loss": -10.242242813110352, "global_step": 126021, "epoch": 750} {"train_loss": -10.236428260803223, "global_step": 126022, "epoch": 750} {"train_loss": -10.159011840820312, "global_step": 126023, "epoch": 750} {"train_loss": -10.35704231262207, "global_step": 126024, "epoch": 750} {"train_loss": -10.404434204101562, "global_step": 126025, "epoch": 750} {"train_loss": -10.183704376220703, "global_step": 126026, "epoch": 750} {"train_loss": -10.37476634979248, "global_step": 126027, "epoch": 750} {"train_loss": -10.032794952392578, "global_step": 126028, "epoch": 750} {"train_loss": -10.57597827911377, "global_step": 126029, "epoch": 750} {"train_loss": -10.153428077697754, "global_step": 126030, "epoch": 750} {"train_loss": -10.46290397644043, "global_step": 126031, "epoch": 750} {"train_loss": -10.311517715454102, "global_step": 126032, "epoch": 750} {"train_loss": -10.284550666809082, "global_step": 126033, "epoch": 750} {"train_loss": -10.478723526000977, "global_step": 126034, "epoch": 750} {"train_loss": -10.449718475341797, "global_step": 126035, "epoch": 750} {"train_loss": -10.569713592529297, "global_step": 126036, "epoch": 750} {"train_loss": -10.483075141906738, "global_step": 126037, "epoch": 750} {"train_loss": -10.348094940185547, "global_step": 126038, "epoch": 750} {"train_loss": -10.125057220458984, "global_step": 126039, "epoch": 750} {"train_loss": -10.232240676879883, "global_step": 126040, "epoch": 750} {"train_loss": -10.249183654785156, "global_step": 126041, "epoch": 750} {"train_loss": -10.36021614074707, "global_step": 126042, "epoch": 750} {"train_loss": -10.610252380371094, "global_step": 126043, "epoch": 750} {"train_loss": -10.443750381469727, "global_step": 126044, "epoch": 750} {"train_loss": -10.422408103942871, "global_step": 126045, "epoch": 750} {"train_loss": -10.603182792663574, "global_step": 126046, "epoch": 750} {"train_loss": -10.429315567016602, "global_step": 126047, "epoch": 750} {"train_loss": -10.4620943069458, "global_step": 126048, "epoch": 750} {"train_loss": -10.344649314880371, "global_step": 126049, "epoch": 750} {"train_loss": -10.478569030761719, "global_step": 126050, "epoch": 750} {"train_loss": -10.301627159118652, "global_step": 126051, "epoch": 750} {"train_loss": -10.50409984588623, "global_step": 126052, "epoch": 750} {"train_loss": -10.19668197631836, "global_step": 126053, "epoch": 750} {"train_loss": -10.41053581237793, "global_step": 126054, "epoch": 750} {"train_loss": -10.383260726928711, "global_step": 126055, "epoch": 750} {"train_loss": -10.093673706054688, "global_step": 126056, "epoch": 750} {"train_loss": -10.44922924041748, "global_step": 126057, "epoch": 750} {"train_loss": -10.014284133911133, "global_step": 126058, "epoch": 750} {"train_loss": -10.26496696472168, "global_step": 126059, "epoch": 750} {"train_loss": -9.658758163452148, "global_step": 126060, "epoch": 750} {"train_loss": -9.987061500549316, "global_step": 126061, "epoch": 750} {"train_loss": -10.038054466247559, "global_step": 126062, "epoch": 750} {"train_loss": -10.06395149230957, "global_step": 126063, "epoch": 750} {"train_loss": -10.094696998596191, "global_step": 126064, "epoch": 750} {"train_loss": -10.076394081115723, "global_step": 126065, "epoch": 750} {"train_loss": -10.169184684753418, "global_step": 126066, "epoch": 750} {"train_loss": -10.122791290283203, "global_step": 126067, "epoch": 750} {"train_loss": -10.279077529907227, "global_step": 126068, "epoch": 750} {"train_loss": -10.083818435668945, "global_step": 126069, "epoch": 750} {"train_loss": -10.141095161437988, "global_step": 126070, "epoch": 750} {"train_loss": -10.332529067993164, "global_step": 126071, "epoch": 750} {"train_loss": -10.025846481323242, "global_step": 126072, "epoch": 750} {"train_loss": -10.314308166503906, "global_step": 126073, "epoch": 750} {"train_loss": -10.245826721191406, "global_step": 126074, "epoch": 750} {"train_loss": -10.366459846496582, "global_step": 126075, "epoch": 750} {"train_loss": -10.249469757080078, "global_step": 126076, "epoch": 750} {"train_loss": -9.964012145996094, "global_step": 126077, "epoch": 750} {"train_loss": -10.418661117553711, "global_step": 126078, "epoch": 750} {"train_loss": -9.868535995483398, "global_step": 126079, "epoch": 750} {"train_loss": -10.097365379333496, "global_step": 126080, "epoch": 750} {"train_loss": -9.701711654663086, "global_step": 126081, "epoch": 750} {"train_loss": -9.71408462524414, "global_step": 126082, "epoch": 750} {"train_loss": -9.84202766418457, "global_step": 126083, "epoch": 750} {"train_loss": -9.989742279052734, "global_step": 126084, "epoch": 750} {"train_loss": -9.676202774047852, "global_step": 126085, "epoch": 750} {"train_loss": -9.78363037109375, "global_step": 126086, "epoch": 750} {"train_loss": -9.337554931640625, "global_step": 126087, "epoch": 750} {"train_loss": -10.155280113220215, "global_step": 126088, "epoch": 750} {"train_loss": -9.583184242248535, "global_step": 126089, "epoch": 750} {"train_loss": -10.04205322265625, "global_step": 126090, "epoch": 750} {"train_loss": -10.143031120300293, "global_step": 126091, "epoch": 750} {"train_loss": -9.873183250427246, "global_step": 126092, "epoch": 750} {"train_loss": -9.808677673339844, "global_step": 126093, "epoch": 750} {"train_loss": -10.206990242004395, "global_step": 126094, "epoch": 750} {"train_loss": -10.278951644897461, "global_step": 126095, "epoch": 750} {"train_loss": -10.067813873291016, "global_step": 126096, "epoch": 750} {"train_loss": -10.32509994506836, "global_step": 126097, "epoch": 750} {"train_loss": -10.264262199401855, "global_step": 126098, "epoch": 750} {"train_loss": -10.209835052490234, "global_step": 126099, "epoch": 750} {"train_loss": -10.453784942626953, "global_step": 126100, "epoch": 750} {"train_loss": -10.274410247802734, "global_step": 126101, "epoch": 750} {"train_loss": -10.440303802490234, "global_step": 126102, "epoch": 750} {"train_loss": -10.268914222717285, "global_step": 126103, "epoch": 750} {"train_loss": -10.362205505371094, "global_step": 126104, "epoch": 750} {"train_loss": -10.307502746582031, "global_step": 126105, "epoch": 750} {"train_loss": -10.178486824035645, "global_step": 126106, "epoch": 750} {"train_loss": -10.342205047607422, "global_step": 126107, "epoch": 750} {"train_loss": -10.051660537719727, "global_step": 126108, "epoch": 750} {"train_loss": -10.383712768554688, "global_step": 126109, "epoch": 750} {"train_loss": -10.2184476852417, "global_step": 126110, "epoch": 750} {"train_loss": -10.340778350830078, "global_step": 126111, "epoch": 750} {"train_loss": -10.460192680358887, "global_step": 126112, "epoch": 750} {"train_loss": -10.227296829223633, "global_step": 126113, "epoch": 750} {"train_loss": -10.191551208496094, "global_step": 126114, "epoch": 750} {"train_loss": -10.507704734802246, "global_step": 126115, "epoch": 750} {"train_loss": -10.342215538024902, "global_step": 126116, "epoch": 750} {"train_loss": -9.963146209716797, "global_step": 126117, "epoch": 750} {"train_loss": -10.325193405151367, "global_step": 126118, "epoch": 750} {"train_loss": -10.208614349365234, "global_step": 126119, "epoch": 750} {"train_loss": -10.672232627868652, "global_step": 126120, "epoch": 750} {"train_loss": -10.470686912536621, "global_step": 126121, "epoch": 750} {"train_loss": -10.369248390197754, "global_step": 126122, "epoch": 750} {"train_loss": -10.385347366333008, "global_step": 126123, "epoch": 750} {"train_loss": -10.42011833190918, "global_step": 126124, "epoch": 750} {"train_loss": -10.55205249786377, "global_step": 126125, "epoch": 750} {"train_loss": -10.107070922851562, "global_step": 126126, "epoch": 750} {"train_loss": -10.455326080322266, "global_step": 126127, "epoch": 750} {"train_loss": -10.48199462890625, "global_step": 126128, "epoch": 750} {"train_loss": -10.457544326782227, "global_step": 126129, "epoch": 750} {"train_loss": -10.057355880737305, "global_step": 126130, "epoch": 750} {"train_loss": -10.292302131652832, "global_step": 126131, "epoch": 750} {"train_loss": -10.40548038482666, "global_step": 126132, "epoch": 750} {"train_loss": -10.304189682006836, "global_step": 126133, "epoch": 750} {"train_loss": -10.543600082397461, "global_step": 126134, "epoch": 750} {"train_loss": -10.468236923217773, "global_step": 126135, "epoch": 750} {"train_loss": -10.464797019958496, "global_step": 126136, "epoch": 750} {"train_loss": -10.281505584716797, "global_step": 126137, "epoch": 750} {"train_loss": -10.198175430297852, "global_step": 126138, "epoch": 750} {"train_loss": -10.593818664550781, "global_step": 126139, "epoch": 750} {"train_loss": -10.234901428222656, "global_step": 126140, "epoch": 750} {"train_loss": -10.283939361572266, "global_step": 126141, "epoch": 750} {"train_loss": -9.955902099609375, "global_step": 126142, "epoch": 750} {"train_loss": -10.337789535522461, "global_step": 126143, "epoch": 750} {"train_loss": -10.536920547485352, "global_step": 126144, "epoch": 750} {"train_loss": -9.976043701171875, "global_step": 126145, "epoch": 750} {"train_loss": -10.587886810302734, "global_step": 126146, "epoch": 750} {"train_loss": -10.187529563903809, "global_step": 126147, "epoch": 750} {"train_loss": -10.195959091186523, "global_step": 126148, "epoch": 750} {"train_loss": -10.449638366699219, "global_step": 126149, "epoch": 750} {"train_loss": -9.936938285827637, "global_step": 126150, "epoch": 750} {"train_loss": -10.042067527770996, "global_step": 126151, "epoch": 750} {"train_loss": -10.300309181213379, "global_step": 126152, "epoch": 750} {"train_loss": -10.088818550109863, "global_step": 126153, "epoch": 750} {"train_loss": -10.378353118896484, "global_step": 126154, "epoch": 750} {"train_loss": -10.066712379455566, "global_step": 126155, "epoch": 750} {"train_loss": -10.319252967834473, "global_step": 126156, "epoch": 750} {"train_loss": -10.087882995605469, "global_step": 126157, "epoch": 750} {"train_loss": -10.471826553344727, "global_step": 126158, "epoch": 750} {"train_loss": -9.997413635253906, "global_step": 126159, "epoch": 750} {"train_loss": -10.437989234924316, "global_step": 126160, "epoch": 750} {"train_loss": -10.409443855285645, "global_step": 126161, "epoch": 750} {"train_loss": -10.057357788085938, "global_step": 126162, "epoch": 750} {"train_loss": -10.415430068969727, "global_step": 126163, "epoch": 750} {"train_loss": -10.201864242553711, "global_step": 126164, "epoch": 750} {"train_loss": -9.779655456542969, "global_step": 126165, "epoch": 750} {"train_loss": -10.416403770446777, "global_step": 126166, "epoch": 750} {"train_loss": -10.216620859645662, "global_step": 126167, "epoch": 750, "train/sim_max_reward_0": 0.966863179745691, "train/sim_max_reward_1": 0.9576775392783595, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.6230780267827738, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.6017065756777635, "test/sim_max_reward_4400000": 0.23802905927657173, "test/sim_max_reward_4400001": 0.3483977760558242, "test/sim_max_reward_4400002": 0.07942869954051437, "test/sim_max_reward_4400003": 0.11514900036676512, "test/sim_max_reward_4400004": 0.4131312855301149, "test/sim_max_reward_4400005": 0.9688188923205077, "test/sim_max_reward_4400006": 0.5842616497683053, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 0.6517114238520368, "test/sim_max_reward_4400009": 0.4000710573007868, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 0.26254566961175857, "test/sim_max_reward_4400012": 0.9895084257546949, "test/sim_max_reward_4400013": 0.9415810502549274, "test/sim_max_reward_4400014": 0.6205243612170919, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9462125284781812, "test/sim_max_reward_4400019": 0.20364394209875875, "test/sim_max_reward_4400020": 0.5054192976373144, "test/sim_max_reward_4400021": 0.6501466320136146, "test/sim_max_reward_4400022": 0.9561797822168536, "test/sim_max_reward_4400023": 1.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6101570899268165, "test/sim_max_reward_4400026": 0.04648250872906231, "test/sim_max_reward_4400027": 0.4220930862054356, "test/sim_max_reward_4400028": 0.706232278201285, "test/sim_max_reward_4400029": 0.4484843572112039, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.4841672421241771, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9938320774165719, "test/sim_max_reward_4400034": 0.8028141737322513, "test/sim_max_reward_4400035": 0.9783201784591407, "test/sim_max_reward_4400036": 0.3776987268004369, "test/sim_max_reward_4400037": 0.9922777686018012, "test/sim_max_reward_4400038": 0.9887383154183499, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 1.0, "test/sim_max_reward_4400042": 0.043098176384123874, "test/sim_max_reward_4400043": 0.9721598675988751, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.2898623409955096, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6915542202474313, "test/mean_score": 0.5825897073584261, "val_loss": 215665.96875, "train_action_mse_error": 0.8752051591873169} {"train_loss": -10.300944328308105, "global_step": 126168, "epoch": 751} {"train_loss": -10.305487632751465, "global_step": 126169, "epoch": 751} {"train_loss": -10.2987060546875, "global_step": 126170, "epoch": 751} {"train_loss": -10.54002857208252, "global_step": 126171, "epoch": 751} {"train_loss": -10.321399688720703, "global_step": 126172, "epoch": 751} {"train_loss": -10.329574584960938, "global_step": 126173, "epoch": 751} {"train_loss": -10.473487854003906, "global_step": 126174, "epoch": 751} {"train_loss": -10.4026517868042, "global_step": 126175, "epoch": 751} {"train_loss": -10.491004943847656, "global_step": 126176, "epoch": 751} {"train_loss": -10.396164894104004, "global_step": 126177, "epoch": 751} {"train_loss": -10.614181518554688, "global_step": 126178, "epoch": 751} {"train_loss": -10.50248908996582, "global_step": 126179, "epoch": 751} {"train_loss": -10.433021545410156, "global_step": 126180, "epoch": 751} {"train_loss": -10.504162788391113, "global_step": 126181, "epoch": 751} {"train_loss": -10.649528503417969, "global_step": 126182, "epoch": 751} {"train_loss": -10.599065780639648, "global_step": 126183, "epoch": 751} {"train_loss": -10.62861442565918, "global_step": 126184, "epoch": 751} {"train_loss": -10.23365306854248, "global_step": 126185, "epoch": 751} {"train_loss": -10.379154205322266, "global_step": 126186, "epoch": 751} {"train_loss": -10.537269592285156, "global_step": 126187, "epoch": 751} {"train_loss": -10.627801895141602, "global_step": 126188, "epoch": 751} {"train_loss": -10.463876724243164, "global_step": 126189, "epoch": 751} {"train_loss": -10.62069320678711, "global_step": 126190, "epoch": 751} {"train_loss": -10.559377670288086, "global_step": 126191, "epoch": 751} {"train_loss": -10.69495964050293, "global_step": 126192, "epoch": 751} {"train_loss": -10.404325485229492, "global_step": 126193, "epoch": 751} {"train_loss": -10.64029598236084, "global_step": 126194, "epoch": 751} {"train_loss": -10.473902702331543, "global_step": 126195, "epoch": 751} {"train_loss": -10.455867767333984, "global_step": 126196, "epoch": 751} {"train_loss": -10.41168212890625, "global_step": 126197, "epoch": 751} {"train_loss": -10.079395294189453, "global_step": 126198, "epoch": 751} {"train_loss": -9.875105857849121, "global_step": 126199, "epoch": 751} {"train_loss": -10.200019836425781, "global_step": 126200, "epoch": 751} {"train_loss": -10.572864532470703, "global_step": 126201, "epoch": 751} {"train_loss": -10.051542282104492, "global_step": 126202, "epoch": 751} {"train_loss": -10.446172714233398, "global_step": 126203, "epoch": 751} {"train_loss": -9.547348022460938, "global_step": 126204, "epoch": 751} {"train_loss": -10.243240356445312, "global_step": 126205, "epoch": 751} {"train_loss": -9.705522537231445, "global_step": 126206, "epoch": 751} {"train_loss": -9.572328567504883, "global_step": 126207, "epoch": 751} {"train_loss": -10.14710807800293, "global_step": 126208, "epoch": 751} {"train_loss": -9.553138732910156, "global_step": 126209, "epoch": 751} {"train_loss": -10.16633129119873, "global_step": 126210, "epoch": 751} {"train_loss": -10.373004913330078, "global_step": 126211, "epoch": 751} {"train_loss": -10.179746627807617, "global_step": 126212, "epoch": 751} {"train_loss": -10.282113075256348, "global_step": 126213, "epoch": 751} {"train_loss": -10.170621871948242, "global_step": 126214, "epoch": 751} {"train_loss": -10.232215881347656, "global_step": 126215, "epoch": 751} {"train_loss": -10.340160369873047, "global_step": 126216, "epoch": 751} {"train_loss": -10.079261779785156, "global_step": 126217, "epoch": 751} {"train_loss": -10.068010330200195, "global_step": 126218, "epoch": 751} {"train_loss": -9.799023628234863, "global_step": 126219, "epoch": 751} {"train_loss": -10.215985298156738, "global_step": 126220, "epoch": 751} {"train_loss": -10.10453987121582, "global_step": 126221, "epoch": 751} {"train_loss": -10.174541473388672, "global_step": 126222, "epoch": 751} {"train_loss": -9.639670372009277, "global_step": 126223, "epoch": 751} {"train_loss": -10.321929931640625, "global_step": 126224, "epoch": 751} {"train_loss": -10.257104873657227, "global_step": 126225, "epoch": 751} {"train_loss": -10.121021270751953, "global_step": 126226, "epoch": 751} {"train_loss": -10.27102279663086, "global_step": 126227, "epoch": 751} {"train_loss": -9.954826354980469, "global_step": 126228, "epoch": 751} {"train_loss": -10.227806091308594, "global_step": 126229, "epoch": 751} {"train_loss": -10.359280586242676, "global_step": 126230, "epoch": 751} {"train_loss": -9.81142807006836, "global_step": 126231, "epoch": 751} {"train_loss": -10.352807998657227, "global_step": 126232, "epoch": 751} {"train_loss": -10.133975982666016, "global_step": 126233, "epoch": 751} {"train_loss": -10.532470703125, "global_step": 126234, "epoch": 751} {"train_loss": -10.185057640075684, "global_step": 126235, "epoch": 751} {"train_loss": -10.35212230682373, "global_step": 126236, "epoch": 751} {"train_loss": -10.350278854370117, "global_step": 126237, "epoch": 751} {"train_loss": -10.334356307983398, "global_step": 126238, "epoch": 751} {"train_loss": -10.397830963134766, "global_step": 126239, "epoch": 751} {"train_loss": -10.053982734680176, "global_step": 126240, "epoch": 751} {"train_loss": -10.164265632629395, "global_step": 126241, "epoch": 751} {"train_loss": -10.179542541503906, "global_step": 126242, "epoch": 751} {"train_loss": -10.291964530944824, "global_step": 126243, "epoch": 751} {"train_loss": -10.247333526611328, "global_step": 126244, "epoch": 751} {"train_loss": -10.314860343933105, "global_step": 126245, "epoch": 751} {"train_loss": -10.401031494140625, "global_step": 126246, "epoch": 751} {"train_loss": -10.03531265258789, "global_step": 126247, "epoch": 751} {"train_loss": -10.417862892150879, "global_step": 126248, "epoch": 751} {"train_loss": -10.168861389160156, "global_step": 126249, "epoch": 751} {"train_loss": -9.866305351257324, "global_step": 126250, "epoch": 751} {"train_loss": -10.244758605957031, "global_step": 126251, "epoch": 751} {"train_loss": -10.095202445983887, "global_step": 126252, "epoch": 751} {"train_loss": -10.356311798095703, "global_step": 126253, "epoch": 751} {"train_loss": -9.875923156738281, "global_step": 126254, "epoch": 751} {"train_loss": -10.220252990722656, "global_step": 126255, "epoch": 751} {"train_loss": -10.288714408874512, "global_step": 126256, "epoch": 751} {"train_loss": -10.157136917114258, "global_step": 126257, "epoch": 751} {"train_loss": -10.249404907226562, "global_step": 126258, "epoch": 751} {"train_loss": -10.203709602355957, "global_step": 126259, "epoch": 751} {"train_loss": -10.446791648864746, "global_step": 126260, "epoch": 751} {"train_loss": -10.351387023925781, "global_step": 126261, "epoch": 751} {"train_loss": -10.262141227722168, "global_step": 126262, "epoch": 751} {"train_loss": -10.463375091552734, "global_step": 126263, "epoch": 751} {"train_loss": -10.500819206237793, "global_step": 126264, "epoch": 751} {"train_loss": -10.132058143615723, "global_step": 126265, "epoch": 751} {"train_loss": -10.208881378173828, "global_step": 126266, "epoch": 751} {"train_loss": -10.207197189331055, "global_step": 126267, "epoch": 751} {"train_loss": -10.187067031860352, "global_step": 126268, "epoch": 751} {"train_loss": -10.044198989868164, "global_step": 126269, "epoch": 751} {"train_loss": -10.010915756225586, "global_step": 126270, "epoch": 751} {"train_loss": -10.395965576171875, "global_step": 126271, "epoch": 751} {"train_loss": -10.044031143188477, "global_step": 126272, "epoch": 751} {"train_loss": -10.571200370788574, "global_step": 126273, "epoch": 751} {"train_loss": -9.725440979003906, "global_step": 126274, "epoch": 751} {"train_loss": -10.35086441040039, "global_step": 126275, "epoch": 751} {"train_loss": -9.914514541625977, "global_step": 126276, "epoch": 751} {"train_loss": -10.049936294555664, "global_step": 126277, "epoch": 751} {"train_loss": -10.140703201293945, "global_step": 126278, "epoch": 751} {"train_loss": -9.977592468261719, "global_step": 126279, "epoch": 751} {"train_loss": -10.045698165893555, "global_step": 126280, "epoch": 751} {"train_loss": -9.983234405517578, "global_step": 126281, "epoch": 751} {"train_loss": -10.160430908203125, "global_step": 126282, "epoch": 751} {"train_loss": -9.753847122192383, "global_step": 126283, "epoch": 751} {"train_loss": -10.431187629699707, "global_step": 126284, "epoch": 751} {"train_loss": -10.10642147064209, "global_step": 126285, "epoch": 751} {"train_loss": -9.948175430297852, "global_step": 126286, "epoch": 751} {"train_loss": -10.1080904006958, "global_step": 126287, "epoch": 751} {"train_loss": -10.152620315551758, "global_step": 126288, "epoch": 751} {"train_loss": -10.305269241333008, "global_step": 126289, "epoch": 751} {"train_loss": -10.29898738861084, "global_step": 126290, "epoch": 751} {"train_loss": -10.088920593261719, "global_step": 126291, "epoch": 751} {"train_loss": -10.37220573425293, "global_step": 126292, "epoch": 751} {"train_loss": -9.94484806060791, "global_step": 126293, "epoch": 751} {"train_loss": -10.202095031738281, "global_step": 126294, "epoch": 751} {"train_loss": -10.330881118774414, "global_step": 126295, "epoch": 751} {"train_loss": -9.970039367675781, "global_step": 126296, "epoch": 751} {"train_loss": -10.180145263671875, "global_step": 126297, "epoch": 751} {"train_loss": -10.17953872680664, "global_step": 126298, "epoch": 751} {"train_loss": -10.147953033447266, "global_step": 126299, "epoch": 751} {"train_loss": -10.362066268920898, "global_step": 126300, "epoch": 751} {"train_loss": -10.404727935791016, "global_step": 126301, "epoch": 751} {"train_loss": -10.125167846679688, "global_step": 126302, "epoch": 751} {"train_loss": -10.267372131347656, "global_step": 126303, "epoch": 751} {"train_loss": -9.792935371398926, "global_step": 126304, "epoch": 751} {"train_loss": -10.184921264648438, "global_step": 126305, "epoch": 751} {"train_loss": -9.813281059265137, "global_step": 126306, "epoch": 751} {"train_loss": -9.910775184631348, "global_step": 126307, "epoch": 751} {"train_loss": -9.934056282043457, "global_step": 126308, "epoch": 751} {"train_loss": -9.81371021270752, "global_step": 126309, "epoch": 751} {"train_loss": -10.080713272094727, "global_step": 126310, "epoch": 751} {"train_loss": -9.886030197143555, "global_step": 126311, "epoch": 751} {"train_loss": -10.250028610229492, "global_step": 126312, "epoch": 751} {"train_loss": -9.800310134887695, "global_step": 126313, "epoch": 751} {"train_loss": -10.195409774780273, "global_step": 126314, "epoch": 751} {"train_loss": -10.311544418334961, "global_step": 126315, "epoch": 751} {"train_loss": -9.91578483581543, "global_step": 126316, "epoch": 751} {"train_loss": -10.42152214050293, "global_step": 126317, "epoch": 751} {"train_loss": -9.765804290771484, "global_step": 126318, "epoch": 751} {"train_loss": -9.888519287109375, "global_step": 126319, "epoch": 751} {"train_loss": -10.475272178649902, "global_step": 126320, "epoch": 751} {"train_loss": -10.016353607177734, "global_step": 126321, "epoch": 751} {"train_loss": -10.304672241210938, "global_step": 126322, "epoch": 751} {"train_loss": -10.32918930053711, "global_step": 126323, "epoch": 751} {"train_loss": -10.293780326843262, "global_step": 126324, "epoch": 751} {"train_loss": -10.377063751220703, "global_step": 126325, "epoch": 751} {"train_loss": -10.264896392822266, "global_step": 126326, "epoch": 751} {"train_loss": -10.374065399169922, "global_step": 126327, "epoch": 751} {"train_loss": -10.193647384643555, "global_step": 126328, "epoch": 751} {"train_loss": -10.397621154785156, "global_step": 126329, "epoch": 751} {"train_loss": -10.27208137512207, "global_step": 126330, "epoch": 751} {"train_loss": -10.375839233398438, "global_step": 126331, "epoch": 751} {"train_loss": -10.07386589050293, "global_step": 126332, "epoch": 751} {"train_loss": -10.242523193359375, "global_step": 126333, "epoch": 751} {"train_loss": -10.060725212097168, "global_step": 126334, "epoch": 751} {"train_loss": -10.216289599736532, "global_step": 126335, "epoch": 751, "val_loss": 219198.8125} {"train_loss": -10.206613540649414, "global_step": 126336, "epoch": 752} {"train_loss": -9.746814727783203, "global_step": 126337, "epoch": 752} {"train_loss": -10.43528938293457, "global_step": 126338, "epoch": 752} {"train_loss": -9.347702026367188, "global_step": 126339, "epoch": 752} {"train_loss": -10.17874526977539, "global_step": 126340, "epoch": 752} {"train_loss": -9.67586612701416, "global_step": 126341, "epoch": 752} {"train_loss": -10.210777282714844, "global_step": 126342, "epoch": 752} {"train_loss": -9.960065841674805, "global_step": 126343, "epoch": 752} {"train_loss": -10.259883880615234, "global_step": 126344, "epoch": 752} {"train_loss": -10.102340698242188, "global_step": 126345, "epoch": 752} {"train_loss": -10.206639289855957, "global_step": 126346, "epoch": 752} {"train_loss": -10.137025833129883, "global_step": 126347, "epoch": 752} {"train_loss": -10.307405471801758, "global_step": 126348, "epoch": 752} {"train_loss": -10.394397735595703, "global_step": 126349, "epoch": 752} {"train_loss": -10.114217758178711, "global_step": 126350, "epoch": 752} {"train_loss": -10.336936950683594, "global_step": 126351, "epoch": 752} {"train_loss": -10.160547256469727, "global_step": 126352, "epoch": 752} {"train_loss": -10.442258834838867, "global_step": 126353, "epoch": 752} {"train_loss": -10.339619636535645, "global_step": 126354, "epoch": 752} {"train_loss": -10.33279800415039, "global_step": 126355, "epoch": 752} {"train_loss": -10.316356658935547, "global_step": 126356, "epoch": 752} {"train_loss": -10.46756362915039, "global_step": 126357, "epoch": 752} {"train_loss": -10.190139770507812, "global_step": 126358, "epoch": 752} {"train_loss": -10.513544082641602, "global_step": 126359, "epoch": 752} {"train_loss": -10.258451461791992, "global_step": 126360, "epoch": 752} {"train_loss": -10.224716186523438, "global_step": 126361, "epoch": 752} {"train_loss": -10.345643997192383, "global_step": 126362, "epoch": 752} {"train_loss": -10.484024047851562, "global_step": 126363, "epoch": 752} {"train_loss": -10.295404434204102, "global_step": 126364, "epoch": 752} {"train_loss": -10.205923080444336, "global_step": 126365, "epoch": 752} {"train_loss": -10.439453125, "global_step": 126366, "epoch": 752} {"train_loss": -10.273923873901367, "global_step": 126367, "epoch": 752} {"train_loss": -10.051583290100098, "global_step": 126368, "epoch": 752} {"train_loss": -10.141666412353516, "global_step": 126369, "epoch": 752} {"train_loss": -10.39007568359375, "global_step": 126370, "epoch": 752} {"train_loss": -9.59366226196289, "global_step": 126371, "epoch": 752} {"train_loss": -10.304224967956543, "global_step": 126372, "epoch": 752} {"train_loss": -9.845741271972656, "global_step": 126373, "epoch": 752} {"train_loss": -10.180779457092285, "global_step": 126374, "epoch": 752} {"train_loss": -10.339666366577148, "global_step": 126375, "epoch": 752} {"train_loss": -10.07762336730957, "global_step": 126376, "epoch": 752} {"train_loss": -10.459672927856445, "global_step": 126377, "epoch": 752} {"train_loss": -10.354719161987305, "global_step": 126378, "epoch": 752} {"train_loss": -10.449009895324707, "global_step": 126379, "epoch": 752} {"train_loss": -10.412744522094727, "global_step": 126380, "epoch": 752} {"train_loss": -10.310232162475586, "global_step": 126381, "epoch": 752} {"train_loss": -10.309076309204102, "global_step": 126382, "epoch": 752} {"train_loss": -10.160684585571289, "global_step": 126383, "epoch": 752} {"train_loss": -10.562780380249023, "global_step": 126384, "epoch": 752} {"train_loss": -10.023992538452148, "global_step": 126385, "epoch": 752} {"train_loss": -10.626596450805664, "global_step": 126386, "epoch": 752} {"train_loss": -10.409608840942383, "global_step": 126387, "epoch": 752} {"train_loss": -10.471413612365723, "global_step": 126388, "epoch": 752} {"train_loss": -10.553668975830078, "global_step": 126389, "epoch": 752} {"train_loss": -10.422882080078125, "global_step": 126390, "epoch": 752} {"train_loss": -10.667366027832031, "global_step": 126391, "epoch": 752} {"train_loss": -10.502795219421387, "global_step": 126392, "epoch": 752} {"train_loss": -10.712360382080078, "global_step": 126393, "epoch": 752} {"train_loss": -10.530107498168945, "global_step": 126394, "epoch": 752} {"train_loss": -10.409984588623047, "global_step": 126395, "epoch": 752} {"train_loss": -10.419927597045898, "global_step": 126396, "epoch": 752} {"train_loss": -10.473368644714355, "global_step": 126397, "epoch": 752} {"train_loss": -10.370199203491211, "global_step": 126398, "epoch": 752} {"train_loss": -10.484947204589844, "global_step": 126399, "epoch": 752} {"train_loss": -10.309350967407227, "global_step": 126400, "epoch": 752} {"train_loss": -10.649686813354492, "global_step": 126401, "epoch": 752} {"train_loss": -10.223095893859863, "global_step": 126402, "epoch": 752} {"train_loss": -10.688596725463867, "global_step": 126403, "epoch": 752} {"train_loss": -10.233926773071289, "global_step": 126404, "epoch": 752} {"train_loss": -10.35558795928955, "global_step": 126405, "epoch": 752} {"train_loss": -10.509256362915039, "global_step": 126406, "epoch": 752} {"train_loss": -10.666831970214844, "global_step": 126407, "epoch": 752} {"train_loss": -9.940105438232422, "global_step": 126408, "epoch": 752} {"train_loss": -9.659282684326172, "global_step": 126409, "epoch": 752} {"train_loss": -10.178630828857422, "global_step": 126410, "epoch": 752} {"train_loss": -9.282026290893555, "global_step": 126411, "epoch": 752} {"train_loss": -9.322286605834961, "global_step": 126412, "epoch": 752} {"train_loss": -9.732912063598633, "global_step": 126413, "epoch": 752} {"train_loss": -9.263885498046875, "global_step": 126414, "epoch": 752} {"train_loss": -9.270684242248535, "global_step": 126415, "epoch": 752} {"train_loss": -9.649898529052734, "global_step": 126416, "epoch": 752} {"train_loss": -9.759706497192383, "global_step": 126417, "epoch": 752} {"train_loss": -9.747374534606934, "global_step": 126418, "epoch": 752} {"train_loss": -10.102033615112305, "global_step": 126419, "epoch": 752} {"train_loss": -9.913224220275879, "global_step": 126420, "epoch": 752} {"train_loss": -9.804478645324707, "global_step": 126421, "epoch": 752} {"train_loss": -9.899744033813477, "global_step": 126422, "epoch": 752} {"train_loss": -9.830326080322266, "global_step": 126423, "epoch": 752} {"train_loss": -9.37372875213623, "global_step": 126424, "epoch": 752} {"train_loss": -10.016674041748047, "global_step": 126425, "epoch": 752} {"train_loss": -9.954164505004883, "global_step": 126426, "epoch": 752} {"train_loss": -9.8834228515625, "global_step": 126427, "epoch": 752} {"train_loss": -10.166633605957031, "global_step": 126428, "epoch": 752} {"train_loss": -10.05922794342041, "global_step": 126429, "epoch": 752} {"train_loss": -9.821517944335938, "global_step": 126430, "epoch": 752} {"train_loss": -10.167863845825195, "global_step": 126431, "epoch": 752} {"train_loss": -9.996633529663086, "global_step": 126432, "epoch": 752} {"train_loss": -10.149213790893555, "global_step": 126433, "epoch": 752} {"train_loss": -10.051061630249023, "global_step": 126434, "epoch": 752} {"train_loss": -10.230440139770508, "global_step": 126435, "epoch": 752} {"train_loss": -10.103029251098633, "global_step": 126436, "epoch": 752} {"train_loss": -10.2310152053833, "global_step": 126437, "epoch": 752} {"train_loss": -10.014534950256348, "global_step": 126438, "epoch": 752} {"train_loss": -10.17960262298584, "global_step": 126439, "epoch": 752} {"train_loss": -10.246856689453125, "global_step": 126440, "epoch": 752} {"train_loss": -10.022661209106445, "global_step": 126441, "epoch": 752} {"train_loss": -9.882997512817383, "global_step": 126442, "epoch": 752} {"train_loss": -10.235101699829102, "global_step": 126443, "epoch": 752} {"train_loss": -10.346673011779785, "global_step": 126444, "epoch": 752} {"train_loss": -9.888534545898438, "global_step": 126445, "epoch": 752} {"train_loss": -10.362371444702148, "global_step": 126446, "epoch": 752} {"train_loss": -10.279391288757324, "global_step": 126447, "epoch": 752} {"train_loss": -10.497152328491211, "global_step": 126448, "epoch": 752} {"train_loss": -9.943617820739746, "global_step": 126449, "epoch": 752} {"train_loss": -10.577479362487793, "global_step": 126450, "epoch": 752} {"train_loss": -10.092439651489258, "global_step": 126451, "epoch": 752} {"train_loss": -10.066815376281738, "global_step": 126452, "epoch": 752} {"train_loss": -10.395721435546875, "global_step": 126453, "epoch": 752} {"train_loss": -10.214859008789062, "global_step": 126454, "epoch": 752} {"train_loss": -10.423582077026367, "global_step": 126455, "epoch": 752} {"train_loss": -10.379915237426758, "global_step": 126456, "epoch": 752} {"train_loss": -10.368337631225586, "global_step": 126457, "epoch": 752} {"train_loss": -10.405265808105469, "global_step": 126458, "epoch": 752} {"train_loss": -10.371357917785645, "global_step": 126459, "epoch": 752} {"train_loss": -10.287725448608398, "global_step": 126460, "epoch": 752} {"train_loss": -10.130504608154297, "global_step": 126461, "epoch": 752} {"train_loss": -10.210712432861328, "global_step": 126462, "epoch": 752} {"train_loss": -10.594698905944824, "global_step": 126463, "epoch": 752} {"train_loss": -10.460391998291016, "global_step": 126464, "epoch": 752} {"train_loss": -10.484477043151855, "global_step": 126465, "epoch": 752} {"train_loss": -10.443843841552734, "global_step": 126466, "epoch": 752} {"train_loss": -10.41497802734375, "global_step": 126467, "epoch": 752} {"train_loss": -10.51137638092041, "global_step": 126468, "epoch": 752} {"train_loss": -10.662673950195312, "global_step": 126469, "epoch": 752} {"train_loss": -10.614100456237793, "global_step": 126470, "epoch": 752} {"train_loss": -10.57025146484375, "global_step": 126471, "epoch": 752} {"train_loss": -10.517641067504883, "global_step": 126472, "epoch": 752} {"train_loss": -10.632585525512695, "global_step": 126473, "epoch": 752} {"train_loss": -10.616527557373047, "global_step": 126474, "epoch": 752} {"train_loss": -10.549736022949219, "global_step": 126475, "epoch": 752} {"train_loss": -10.51279354095459, "global_step": 126476, "epoch": 752} {"train_loss": -10.434581756591797, "global_step": 126477, "epoch": 752} {"train_loss": -10.626277923583984, "global_step": 126478, "epoch": 752} {"train_loss": -10.516654968261719, "global_step": 126479, "epoch": 752} {"train_loss": -10.415434837341309, "global_step": 126480, "epoch": 752} {"train_loss": -10.568997383117676, "global_step": 126481, "epoch": 752} {"train_loss": -10.40739631652832, "global_step": 126482, "epoch": 752} {"train_loss": -10.629140853881836, "global_step": 126483, "epoch": 752} {"train_loss": -10.636571884155273, "global_step": 126484, "epoch": 752} {"train_loss": -10.355707168579102, "global_step": 126485, "epoch": 752} {"train_loss": -10.5309476852417, "global_step": 126486, "epoch": 752} {"train_loss": -10.574919700622559, "global_step": 126487, "epoch": 752} {"train_loss": -10.432168960571289, "global_step": 126488, "epoch": 752} {"train_loss": -10.131817817687988, "global_step": 126489, "epoch": 752} {"train_loss": -10.073951721191406, "global_step": 126490, "epoch": 752} {"train_loss": -10.449039459228516, "global_step": 126491, "epoch": 752} {"train_loss": -9.893144607543945, "global_step": 126492, "epoch": 752} {"train_loss": -9.429832458496094, "global_step": 126493, "epoch": 752} {"train_loss": -9.676925659179688, "global_step": 126494, "epoch": 752} {"train_loss": -9.31063461303711, "global_step": 126495, "epoch": 752} {"train_loss": -9.37403392791748, "global_step": 126496, "epoch": 752} {"train_loss": -9.226139068603516, "global_step": 126497, "epoch": 752} {"train_loss": -9.67098617553711, "global_step": 126498, "epoch": 752} {"train_loss": -8.969199180603027, "global_step": 126499, "epoch": 752} {"train_loss": -9.761846542358398, "global_step": 126500, "epoch": 752} {"train_loss": -8.859509468078613, "global_step": 126501, "epoch": 752} {"train_loss": -9.597780227661133, "global_step": 126502, "epoch": 752} {"train_loss": -10.178633423078628, "global_step": 126503, "epoch": 752, "val_loss": 217805.3125} {"train_loss": -10.335893630981445, "global_step": 126504, "epoch": 753} {"train_loss": -8.978796005249023, "global_step": 126505, "epoch": 753} {"train_loss": -9.62500286102295, "global_step": 126506, "epoch": 753} {"train_loss": -9.41082763671875, "global_step": 126507, "epoch": 753} {"train_loss": -9.520467758178711, "global_step": 126508, "epoch": 753} {"train_loss": -9.607629776000977, "global_step": 126509, "epoch": 753} {"train_loss": -9.432830810546875, "global_step": 126510, "epoch": 753} {"train_loss": -9.607196807861328, "global_step": 126511, "epoch": 753} {"train_loss": -9.49001693725586, "global_step": 126512, "epoch": 753} {"train_loss": -9.160926818847656, "global_step": 126513, "epoch": 753} {"train_loss": -10.002588272094727, "global_step": 126514, "epoch": 753} {"train_loss": -9.635770797729492, "global_step": 126515, "epoch": 753} {"train_loss": -9.467914581298828, "global_step": 126516, "epoch": 753} {"train_loss": -9.665069580078125, "global_step": 126517, "epoch": 753} {"train_loss": -9.761180877685547, "global_step": 126518, "epoch": 753} {"train_loss": -9.643357276916504, "global_step": 126519, "epoch": 753} {"train_loss": -9.737735748291016, "global_step": 126520, "epoch": 753} {"train_loss": -9.485925674438477, "global_step": 126521, "epoch": 753} {"train_loss": -9.738523483276367, "global_step": 126522, "epoch": 753} {"train_loss": -10.091450691223145, "global_step": 126523, "epoch": 753} {"train_loss": -9.919207572937012, "global_step": 126524, "epoch": 753} {"train_loss": -9.890604019165039, "global_step": 126525, "epoch": 753} {"train_loss": -9.935098648071289, "global_step": 126526, "epoch": 753} {"train_loss": -10.068866729736328, "global_step": 126527, "epoch": 753} {"train_loss": -10.175664901733398, "global_step": 126528, "epoch": 753} {"train_loss": -10.069854736328125, "global_step": 126529, "epoch": 753} {"train_loss": -9.932374954223633, "global_step": 126530, "epoch": 753} {"train_loss": -10.070293426513672, "global_step": 126531, "epoch": 753} {"train_loss": -10.232967376708984, "global_step": 126532, "epoch": 753} {"train_loss": -10.173382759094238, "global_step": 126533, "epoch": 753} {"train_loss": -10.204298973083496, "global_step": 126534, "epoch": 753} {"train_loss": -10.307699203491211, "global_step": 126535, "epoch": 753} {"train_loss": -10.260553359985352, "global_step": 126536, "epoch": 753} {"train_loss": -10.063409805297852, "global_step": 126537, "epoch": 753} {"train_loss": -10.383598327636719, "global_step": 126538, "epoch": 753} {"train_loss": -10.329601287841797, "global_step": 126539, "epoch": 753} {"train_loss": -10.123930931091309, "global_step": 126540, "epoch": 753} {"train_loss": -10.37891960144043, "global_step": 126541, "epoch": 753} {"train_loss": -10.221017837524414, "global_step": 126542, "epoch": 753} {"train_loss": -10.44594955444336, "global_step": 126543, "epoch": 753} {"train_loss": -10.22815227508545, "global_step": 126544, "epoch": 753} {"train_loss": -10.430946350097656, "global_step": 126545, "epoch": 753} {"train_loss": -10.417699813842773, "global_step": 126546, "epoch": 753} {"train_loss": -10.301916122436523, "global_step": 126547, "epoch": 753} {"train_loss": -10.589743614196777, "global_step": 126548, "epoch": 753} {"train_loss": -10.581877708435059, "global_step": 126549, "epoch": 753} {"train_loss": -10.586648941040039, "global_step": 126550, "epoch": 753} {"train_loss": -10.613343238830566, "global_step": 126551, "epoch": 753} {"train_loss": -10.593656539916992, "global_step": 126552, "epoch": 753} {"train_loss": -10.501335144042969, "global_step": 126553, "epoch": 753} {"train_loss": -10.555895805358887, "global_step": 126554, "epoch": 753} {"train_loss": -10.702795028686523, "global_step": 126555, "epoch": 753} {"train_loss": -10.701730728149414, "global_step": 126556, "epoch": 753} {"train_loss": -10.437054634094238, "global_step": 126557, "epoch": 753} {"train_loss": -10.728477478027344, "global_step": 126558, "epoch": 753} {"train_loss": -10.526986122131348, "global_step": 126559, "epoch": 753} {"train_loss": -10.640186309814453, "global_step": 126560, "epoch": 753} {"train_loss": -10.575769424438477, "global_step": 126561, "epoch": 753} {"train_loss": -10.62741470336914, "global_step": 126562, "epoch": 753} {"train_loss": -10.67186164855957, "global_step": 126563, "epoch": 753} {"train_loss": -10.800049781799316, "global_step": 126564, "epoch": 753} {"train_loss": -10.268630981445312, "global_step": 126565, "epoch": 753} {"train_loss": -10.034252166748047, "global_step": 126566, "epoch": 753} {"train_loss": -9.62371826171875, "global_step": 126567, "epoch": 753} {"train_loss": -10.623895645141602, "global_step": 126568, "epoch": 753} {"train_loss": -9.822586059570312, "global_step": 126569, "epoch": 753} {"train_loss": -9.711784362792969, "global_step": 126570, "epoch": 753} {"train_loss": -9.439531326293945, "global_step": 126571, "epoch": 753} {"train_loss": -9.47622299194336, "global_step": 126572, "epoch": 753} {"train_loss": -9.855080604553223, "global_step": 126573, "epoch": 753} {"train_loss": -9.820598602294922, "global_step": 126574, "epoch": 753} {"train_loss": -9.673575401306152, "global_step": 126575, "epoch": 753} {"train_loss": -10.220970153808594, "global_step": 126576, "epoch": 753} {"train_loss": -10.544584274291992, "global_step": 126577, "epoch": 753} {"train_loss": -10.233323097229004, "global_step": 126578, "epoch": 753} {"train_loss": -10.231058120727539, "global_step": 126579, "epoch": 753} {"train_loss": -10.03816032409668, "global_step": 126580, "epoch": 753} {"train_loss": -9.7672700881958, "global_step": 126581, "epoch": 753} {"train_loss": -10.307669639587402, "global_step": 126582, "epoch": 753} {"train_loss": -10.087620735168457, "global_step": 126583, "epoch": 753} {"train_loss": -9.508126258850098, "global_step": 126584, "epoch": 753} {"train_loss": -9.802804946899414, "global_step": 126585, "epoch": 753} {"train_loss": -9.344470977783203, "global_step": 126586, "epoch": 753} {"train_loss": -10.176206588745117, "global_step": 126587, "epoch": 753} {"train_loss": -9.871742248535156, "global_step": 126588, "epoch": 753} {"train_loss": -9.941795349121094, "global_step": 126589, "epoch": 753} {"train_loss": -9.729798316955566, "global_step": 126590, "epoch": 753} {"train_loss": -10.284730911254883, "global_step": 126591, "epoch": 753} {"train_loss": -9.74790096282959, "global_step": 126592, "epoch": 753} {"train_loss": -10.212350845336914, "global_step": 126593, "epoch": 753} {"train_loss": -9.905896186828613, "global_step": 126594, "epoch": 753} {"train_loss": -9.985551834106445, "global_step": 126595, "epoch": 753} {"train_loss": -9.578168869018555, "global_step": 126596, "epoch": 753} {"train_loss": -10.405508995056152, "global_step": 126597, "epoch": 753} {"train_loss": -9.634017944335938, "global_step": 126598, "epoch": 753} {"train_loss": -10.04487133026123, "global_step": 126599, "epoch": 753} {"train_loss": -9.927403450012207, "global_step": 126600, "epoch": 753} {"train_loss": -10.201411247253418, "global_step": 126601, "epoch": 753} {"train_loss": -9.784439086914062, "global_step": 126602, "epoch": 753} {"train_loss": -10.294092178344727, "global_step": 126603, "epoch": 753} {"train_loss": -9.909627914428711, "global_step": 126604, "epoch": 753} {"train_loss": -10.09533405303955, "global_step": 126605, "epoch": 753} {"train_loss": -9.960031509399414, "global_step": 126606, "epoch": 753} {"train_loss": -9.88720417022705, "global_step": 126607, "epoch": 753} {"train_loss": -10.148185729980469, "global_step": 126608, "epoch": 753} {"train_loss": -10.21019172668457, "global_step": 126609, "epoch": 753} {"train_loss": -10.171944618225098, "global_step": 126610, "epoch": 753} {"train_loss": -10.323348999023438, "global_step": 126611, "epoch": 753} {"train_loss": -10.219132423400879, "global_step": 126612, "epoch": 753} {"train_loss": -10.206409454345703, "global_step": 126613, "epoch": 753} {"train_loss": -10.277936935424805, "global_step": 126614, "epoch": 753} {"train_loss": -10.500718116760254, "global_step": 126615, "epoch": 753} {"train_loss": -10.463558197021484, "global_step": 126616, "epoch": 753} {"train_loss": -10.525784492492676, "global_step": 126617, "epoch": 753} {"train_loss": -10.436563491821289, "global_step": 126618, "epoch": 753} {"train_loss": -10.211570739746094, "global_step": 126619, "epoch": 753} {"train_loss": -10.448131561279297, "global_step": 126620, "epoch": 753} {"train_loss": -10.544530868530273, "global_step": 126621, "epoch": 753} {"train_loss": -10.483512878417969, "global_step": 126622, "epoch": 753} {"train_loss": -10.338854789733887, "global_step": 126623, "epoch": 753} {"train_loss": -10.431090354919434, "global_step": 126624, "epoch": 753} {"train_loss": -10.344228744506836, "global_step": 126625, "epoch": 753} {"train_loss": -10.33581829071045, "global_step": 126626, "epoch": 753} {"train_loss": -10.361896514892578, "global_step": 126627, "epoch": 753} {"train_loss": -10.51729965209961, "global_step": 126628, "epoch": 753} {"train_loss": -10.434708595275879, "global_step": 126629, "epoch": 753} {"train_loss": -10.63795280456543, "global_step": 126630, "epoch": 753} {"train_loss": -10.484430313110352, "global_step": 126631, "epoch": 753} {"train_loss": -10.534967422485352, "global_step": 126632, "epoch": 753} {"train_loss": -10.724592208862305, "global_step": 126633, "epoch": 753} {"train_loss": -10.451200485229492, "global_step": 126634, "epoch": 753} {"train_loss": -10.377466201782227, "global_step": 126635, "epoch": 753} {"train_loss": -10.300239562988281, "global_step": 126636, "epoch": 753} {"train_loss": -10.270216941833496, "global_step": 126637, "epoch": 753} {"train_loss": -10.403383255004883, "global_step": 126638, "epoch": 753} {"train_loss": -10.02084732055664, "global_step": 126639, "epoch": 753} {"train_loss": -10.402557373046875, "global_step": 126640, "epoch": 753} {"train_loss": -10.283331871032715, "global_step": 126641, "epoch": 753} {"train_loss": -10.083171844482422, "global_step": 126642, "epoch": 753} {"train_loss": -10.08358097076416, "global_step": 126643, "epoch": 753} {"train_loss": -9.974725723266602, "global_step": 126644, "epoch": 753} {"train_loss": -9.963857650756836, "global_step": 126645, "epoch": 753} {"train_loss": -9.419620513916016, "global_step": 126646, "epoch": 753} {"train_loss": -9.023246765136719, "global_step": 126647, "epoch": 753} {"train_loss": -10.234325408935547, "global_step": 126648, "epoch": 753} {"train_loss": -8.98735523223877, "global_step": 126649, "epoch": 753} {"train_loss": -10.241689682006836, "global_step": 126650, "epoch": 753} {"train_loss": -9.565933227539062, "global_step": 126651, "epoch": 753} {"train_loss": -9.836649894714355, "global_step": 126652, "epoch": 753} {"train_loss": -9.837000846862793, "global_step": 126653, "epoch": 753} {"train_loss": -10.13834285736084, "global_step": 126654, "epoch": 753} {"train_loss": -9.935922622680664, "global_step": 126655, "epoch": 753} {"train_loss": -10.097190856933594, "global_step": 126656, "epoch": 753} {"train_loss": -10.145101547241211, "global_step": 126657, "epoch": 753} {"train_loss": -10.248287200927734, "global_step": 126658, "epoch": 753} {"train_loss": -9.879164695739746, "global_step": 126659, "epoch": 753} {"train_loss": -10.093503952026367, "global_step": 126660, "epoch": 753} {"train_loss": -10.351078987121582, "global_step": 126661, "epoch": 753} {"train_loss": -9.995166778564453, "global_step": 126662, "epoch": 753} {"train_loss": -10.285848617553711, "global_step": 126663, "epoch": 753} {"train_loss": -9.875362396240234, "global_step": 126664, "epoch": 753} {"train_loss": -10.193509101867676, "global_step": 126665, "epoch": 753} {"train_loss": -10.111709594726562, "global_step": 126666, "epoch": 753} {"train_loss": -9.822534561157227, "global_step": 126667, "epoch": 753} {"train_loss": -10.060734748840332, "global_step": 126668, "epoch": 753} {"train_loss": -10.220793724060059, "global_step": 126669, "epoch": 753} {"train_loss": -9.810342788696289, "global_step": 126670, "epoch": 753} {"train_loss": -10.099745807193575, "global_step": 126671, "epoch": 753, "val_loss": 210015.359375} {"train_loss": -10.140961647033691, "global_step": 126672, "epoch": 754} {"train_loss": -10.003572463989258, "global_step": 126673, "epoch": 754} {"train_loss": -10.245146751403809, "global_step": 126674, "epoch": 754} {"train_loss": -10.002405166625977, "global_step": 126675, "epoch": 754} {"train_loss": -9.834352493286133, "global_step": 126676, "epoch": 754} {"train_loss": -10.445184707641602, "global_step": 126677, "epoch": 754} {"train_loss": -10.071976661682129, "global_step": 126678, "epoch": 754} {"train_loss": -10.337467193603516, "global_step": 126679, "epoch": 754} {"train_loss": -10.200295448303223, "global_step": 126680, "epoch": 754} {"train_loss": -10.25732707977295, "global_step": 126681, "epoch": 754} {"train_loss": -10.264933586120605, "global_step": 126682, "epoch": 754} {"train_loss": -10.188558578491211, "global_step": 126683, "epoch": 754} {"train_loss": -10.165361404418945, "global_step": 126684, "epoch": 754} {"train_loss": -10.160723686218262, "global_step": 126685, "epoch": 754} {"train_loss": -10.283662796020508, "global_step": 126686, "epoch": 754} {"train_loss": -10.136421203613281, "global_step": 126687, "epoch": 754} {"train_loss": -10.255611419677734, "global_step": 126688, "epoch": 754} {"train_loss": -10.284808158874512, "global_step": 126689, "epoch": 754} {"train_loss": -10.317422866821289, "global_step": 126690, "epoch": 754} {"train_loss": -10.354001998901367, "global_step": 126691, "epoch": 754} {"train_loss": -10.381149291992188, "global_step": 126692, "epoch": 754} {"train_loss": -10.489124298095703, "global_step": 126693, "epoch": 754} {"train_loss": -10.560115814208984, "global_step": 126694, "epoch": 754} {"train_loss": -10.481725692749023, "global_step": 126695, "epoch": 754} {"train_loss": -10.402908325195312, "global_step": 126696, "epoch": 754} {"train_loss": -10.461021423339844, "global_step": 126697, "epoch": 754} {"train_loss": -10.460500717163086, "global_step": 126698, "epoch": 754} {"train_loss": -10.337839126586914, "global_step": 126699, "epoch": 754} {"train_loss": -10.394779205322266, "global_step": 126700, "epoch": 754} {"train_loss": -10.463062286376953, "global_step": 126701, "epoch": 754} {"train_loss": -10.488334655761719, "global_step": 126702, "epoch": 754} {"train_loss": -10.31675910949707, "global_step": 126703, "epoch": 754} {"train_loss": -10.455038070678711, "global_step": 126704, "epoch": 754} {"train_loss": -10.392809867858887, "global_step": 126705, "epoch": 754} {"train_loss": -10.477914810180664, "global_step": 126706, "epoch": 754} {"train_loss": -10.40401840209961, "global_step": 126707, "epoch": 754} {"train_loss": -10.247823715209961, "global_step": 126708, "epoch": 754} {"train_loss": -10.058414459228516, "global_step": 126709, "epoch": 754} {"train_loss": -10.007822036743164, "global_step": 126710, "epoch": 754} {"train_loss": -10.094917297363281, "global_step": 126711, "epoch": 754} {"train_loss": -10.151300430297852, "global_step": 126712, "epoch": 754} {"train_loss": -10.404352188110352, "global_step": 126713, "epoch": 754} {"train_loss": -9.998115539550781, "global_step": 126714, "epoch": 754} {"train_loss": -10.291921615600586, "global_step": 126715, "epoch": 754} {"train_loss": -10.39830207824707, "global_step": 126716, "epoch": 754} {"train_loss": -10.466442108154297, "global_step": 126717, "epoch": 754} {"train_loss": -10.689477920532227, "global_step": 126718, "epoch": 754} {"train_loss": -10.240568161010742, "global_step": 126719, "epoch": 754} {"train_loss": -10.32071304321289, "global_step": 126720, "epoch": 754} {"train_loss": -10.345052719116211, "global_step": 126721, "epoch": 754} {"train_loss": -10.570066452026367, "global_step": 126722, "epoch": 754} {"train_loss": -10.084847450256348, "global_step": 126723, "epoch": 754} {"train_loss": -10.666533470153809, "global_step": 126724, "epoch": 754} {"train_loss": -10.52933120727539, "global_step": 126725, "epoch": 754} {"train_loss": -10.100846290588379, "global_step": 126726, "epoch": 754} {"train_loss": -10.407052993774414, "global_step": 126727, "epoch": 754} {"train_loss": -10.014437675476074, "global_step": 126728, "epoch": 754} {"train_loss": -10.04868221282959, "global_step": 126729, "epoch": 754} {"train_loss": -10.050561904907227, "global_step": 126730, "epoch": 754} {"train_loss": -10.537239074707031, "global_step": 126731, "epoch": 754} {"train_loss": -10.103656768798828, "global_step": 126732, "epoch": 754} {"train_loss": -10.183721542358398, "global_step": 126733, "epoch": 754} {"train_loss": -10.18331527709961, "global_step": 126734, "epoch": 754} {"train_loss": -10.084364891052246, "global_step": 126735, "epoch": 754} {"train_loss": -10.41087532043457, "global_step": 126736, "epoch": 754} {"train_loss": -10.10016918182373, "global_step": 126737, "epoch": 754} {"train_loss": -10.191032409667969, "global_step": 126738, "epoch": 754} {"train_loss": -10.150676727294922, "global_step": 126739, "epoch": 754} {"train_loss": -10.154020309448242, "global_step": 126740, "epoch": 754} {"train_loss": -10.034294128417969, "global_step": 126741, "epoch": 754} {"train_loss": -9.89964485168457, "global_step": 126742, "epoch": 754} {"train_loss": -10.20317554473877, "global_step": 126743, "epoch": 754} {"train_loss": -9.60799503326416, "global_step": 126744, "epoch": 754} {"train_loss": -9.823318481445312, "global_step": 126745, "epoch": 754} {"train_loss": -9.419984817504883, "global_step": 126746, "epoch": 754} {"train_loss": -9.66914176940918, "global_step": 126747, "epoch": 754} {"train_loss": -9.458463668823242, "global_step": 126748, "epoch": 754} {"train_loss": -9.803070068359375, "global_step": 126749, "epoch": 754} {"train_loss": -9.594160079956055, "global_step": 126750, "epoch": 754} {"train_loss": -9.874083518981934, "global_step": 126751, "epoch": 754} {"train_loss": -8.688192367553711, "global_step": 126752, "epoch": 754} {"train_loss": -10.167449951171875, "global_step": 126753, "epoch": 754} {"train_loss": -8.828086853027344, "global_step": 126754, "epoch": 754} {"train_loss": -9.672523498535156, "global_step": 126755, "epoch": 754} {"train_loss": -9.404695510864258, "global_step": 126756, "epoch": 754} {"train_loss": -8.612903594970703, "global_step": 126757, "epoch": 754} {"train_loss": -10.025022506713867, "global_step": 126758, "epoch": 754} {"train_loss": -9.439142227172852, "global_step": 126759, "epoch": 754} {"train_loss": -9.931325912475586, "global_step": 126760, "epoch": 754} {"train_loss": -9.67434024810791, "global_step": 126761, "epoch": 754} {"train_loss": -9.150075912475586, "global_step": 126762, "epoch": 754} {"train_loss": -10.147361755371094, "global_step": 126763, "epoch": 754} {"train_loss": -9.446399688720703, "global_step": 126764, "epoch": 754} {"train_loss": -9.873283386230469, "global_step": 126765, "epoch": 754} {"train_loss": -10.165566444396973, "global_step": 126766, "epoch": 754} {"train_loss": -9.774406433105469, "global_step": 126767, "epoch": 754} {"train_loss": -9.935844421386719, "global_step": 126768, "epoch": 754} {"train_loss": -10.086524963378906, "global_step": 126769, "epoch": 754} {"train_loss": -9.86536979675293, "global_step": 126770, "epoch": 754} {"train_loss": -10.192258834838867, "global_step": 126771, "epoch": 754} {"train_loss": -10.091379165649414, "global_step": 126772, "epoch": 754} {"train_loss": -10.063720703125, "global_step": 126773, "epoch": 754} {"train_loss": -10.251646995544434, "global_step": 126774, "epoch": 754} {"train_loss": -10.292466163635254, "global_step": 126775, "epoch": 754} {"train_loss": -10.132318496704102, "global_step": 126776, "epoch": 754} {"train_loss": -10.265313148498535, "global_step": 126777, "epoch": 754} {"train_loss": -10.2597074508667, "global_step": 126778, "epoch": 754} {"train_loss": -10.15742301940918, "global_step": 126779, "epoch": 754} {"train_loss": -10.148488998413086, "global_step": 126780, "epoch": 754} {"train_loss": -10.379213333129883, "global_step": 126781, "epoch": 754} {"train_loss": -10.129176139831543, "global_step": 126782, "epoch": 754} {"train_loss": -10.329930305480957, "global_step": 126783, "epoch": 754} {"train_loss": -10.364812850952148, "global_step": 126784, "epoch": 754} {"train_loss": -10.324085235595703, "global_step": 126785, "epoch": 754} {"train_loss": -10.605073928833008, "global_step": 126786, "epoch": 754} {"train_loss": -10.431053161621094, "global_step": 126787, "epoch": 754} {"train_loss": -10.52798843383789, "global_step": 126788, "epoch": 754} {"train_loss": -10.712736129760742, "global_step": 126789, "epoch": 754} {"train_loss": -10.086884498596191, "global_step": 126790, "epoch": 754} {"train_loss": -10.550527572631836, "global_step": 126791, "epoch": 754} {"train_loss": -10.521932601928711, "global_step": 126792, "epoch": 754} {"train_loss": -10.039889335632324, "global_step": 126793, "epoch": 754} {"train_loss": -10.426441192626953, "global_step": 126794, "epoch": 754} {"train_loss": -10.563620567321777, "global_step": 126795, "epoch": 754} {"train_loss": -10.364784240722656, "global_step": 126796, "epoch": 754} {"train_loss": -10.141210556030273, "global_step": 126797, "epoch": 754} {"train_loss": -10.5438232421875, "global_step": 126798, "epoch": 754} {"train_loss": -10.33922290802002, "global_step": 126799, "epoch": 754} {"train_loss": -10.574844360351562, "global_step": 126800, "epoch": 754} {"train_loss": -10.717950820922852, "global_step": 126801, "epoch": 754} {"train_loss": -10.575023651123047, "global_step": 126802, "epoch": 754} {"train_loss": -10.474157333374023, "global_step": 126803, "epoch": 754} {"train_loss": -10.703981399536133, "global_step": 126804, "epoch": 754} {"train_loss": -10.568535804748535, "global_step": 126805, "epoch": 754} {"train_loss": -10.641992568969727, "global_step": 126806, "epoch": 754} {"train_loss": -10.457077026367188, "global_step": 126807, "epoch": 754} {"train_loss": -10.57121467590332, "global_step": 126808, "epoch": 754} {"train_loss": -10.137604713439941, "global_step": 126809, "epoch": 754} {"train_loss": -10.00174331665039, "global_step": 126810, "epoch": 754} {"train_loss": -10.730827331542969, "global_step": 126811, "epoch": 754} {"train_loss": -9.940973281860352, "global_step": 126812, "epoch": 754} {"train_loss": -9.884467124938965, "global_step": 126813, "epoch": 754} {"train_loss": -10.0383939743042, "global_step": 126814, "epoch": 754} {"train_loss": -9.84347915649414, "global_step": 126815, "epoch": 754} {"train_loss": -10.339693069458008, "global_step": 126816, "epoch": 754} {"train_loss": -9.567412376403809, "global_step": 126817, "epoch": 754} {"train_loss": -9.763622283935547, "global_step": 126818, "epoch": 754} {"train_loss": -9.708733558654785, "global_step": 126819, "epoch": 754} {"train_loss": -9.123810768127441, "global_step": 126820, "epoch": 754} {"train_loss": -9.12858772277832, "global_step": 126821, "epoch": 754} {"train_loss": -10.438756942749023, "global_step": 126822, "epoch": 754} {"train_loss": -9.07972240447998, "global_step": 126823, "epoch": 754} {"train_loss": -9.8284912109375, "global_step": 126824, "epoch": 754} {"train_loss": -9.192737579345703, "global_step": 126825, "epoch": 754} {"train_loss": -9.792988777160645, "global_step": 126826, "epoch": 754} {"train_loss": -9.182050704956055, "global_step": 126827, "epoch": 754} {"train_loss": -9.105741500854492, "global_step": 126828, "epoch": 754} {"train_loss": -10.03558349609375, "global_step": 126829, "epoch": 754} {"train_loss": -9.65504264831543, "global_step": 126830, "epoch": 754} {"train_loss": -9.791094779968262, "global_step": 126831, "epoch": 754} {"train_loss": -9.877089500427246, "global_step": 126832, "epoch": 754} {"train_loss": -9.687917709350586, "global_step": 126833, "epoch": 754} {"train_loss": -9.747993469238281, "global_step": 126834, "epoch": 754} {"train_loss": -10.053497314453125, "global_step": 126835, "epoch": 754} {"train_loss": -10.200122833251953, "global_step": 126836, "epoch": 754} {"train_loss": -9.879976272583008, "global_step": 126837, "epoch": 754} {"train_loss": -10.13880729675293, "global_step": 126838, "epoch": 754} {"train_loss": -10.105576696850004, "global_step": 126839, "epoch": 754, "val_loss": 215774.828125} {"train_loss": -10.15391731262207, "global_step": 126840, "epoch": 755} {"train_loss": -10.03996467590332, "global_step": 126841, "epoch": 755} {"train_loss": -9.964786529541016, "global_step": 126842, "epoch": 755} {"train_loss": -9.914714813232422, "global_step": 126843, "epoch": 755} {"train_loss": -9.876461029052734, "global_step": 126844, "epoch": 755} {"train_loss": -10.174230575561523, "global_step": 126845, "epoch": 755} {"train_loss": -9.86408519744873, "global_step": 126846, "epoch": 755} {"train_loss": -10.059947967529297, "global_step": 126847, "epoch": 755} {"train_loss": -10.047161102294922, "global_step": 126848, "epoch": 755} {"train_loss": -10.128278732299805, "global_step": 126849, "epoch": 755} {"train_loss": -10.13929557800293, "global_step": 126850, "epoch": 755} {"train_loss": -10.269304275512695, "global_step": 126851, "epoch": 755} {"train_loss": -10.321969985961914, "global_step": 126852, "epoch": 755} {"train_loss": -10.045867919921875, "global_step": 126853, "epoch": 755} {"train_loss": -10.168998718261719, "global_step": 126854, "epoch": 755} {"train_loss": -10.49583625793457, "global_step": 126855, "epoch": 755} {"train_loss": -10.23390007019043, "global_step": 126856, "epoch": 755} {"train_loss": -10.242116928100586, "global_step": 126857, "epoch": 755} {"train_loss": -10.420971870422363, "global_step": 126858, "epoch": 755} {"train_loss": -10.250709533691406, "global_step": 126859, "epoch": 755} {"train_loss": -10.325179100036621, "global_step": 126860, "epoch": 755} {"train_loss": -10.307634353637695, "global_step": 126861, "epoch": 755} {"train_loss": -10.11164379119873, "global_step": 126862, "epoch": 755} {"train_loss": -10.38247299194336, "global_step": 126863, "epoch": 755} {"train_loss": -10.127973556518555, "global_step": 126864, "epoch": 755} {"train_loss": -10.38846206665039, "global_step": 126865, "epoch": 755} {"train_loss": -10.336536407470703, "global_step": 126866, "epoch": 755} {"train_loss": -10.365851402282715, "global_step": 126867, "epoch": 755} {"train_loss": -10.493906021118164, "global_step": 126868, "epoch": 755} {"train_loss": -9.79784107208252, "global_step": 126869, "epoch": 755} {"train_loss": -10.41861343383789, "global_step": 126870, "epoch": 755} {"train_loss": -10.076560974121094, "global_step": 126871, "epoch": 755} {"train_loss": -9.995865821838379, "global_step": 126872, "epoch": 755} {"train_loss": -10.277427673339844, "global_step": 126873, "epoch": 755} {"train_loss": -10.38931941986084, "global_step": 126874, "epoch": 755} {"train_loss": -10.271472930908203, "global_step": 126875, "epoch": 755} {"train_loss": -10.472333908081055, "global_step": 126876, "epoch": 755} {"train_loss": -10.021913528442383, "global_step": 126877, "epoch": 755} {"train_loss": -10.383389472961426, "global_step": 126878, "epoch": 755} {"train_loss": -10.055309295654297, "global_step": 126879, "epoch": 755} {"train_loss": -10.087493896484375, "global_step": 126880, "epoch": 755} {"train_loss": -10.506759643554688, "global_step": 126881, "epoch": 755} {"train_loss": -10.124162673950195, "global_step": 126882, "epoch": 755} {"train_loss": -10.321784019470215, "global_step": 126883, "epoch": 755} {"train_loss": -10.1693115234375, "global_step": 126884, "epoch": 755} {"train_loss": -10.384434700012207, "global_step": 126885, "epoch": 755} {"train_loss": -10.409113883972168, "global_step": 126886, "epoch": 755} {"train_loss": -10.292337417602539, "global_step": 126887, "epoch": 755} {"train_loss": -10.016438484191895, "global_step": 126888, "epoch": 755} {"train_loss": -9.781515121459961, "global_step": 126889, "epoch": 755} {"train_loss": -10.361477851867676, "global_step": 126890, "epoch": 755} {"train_loss": -10.082100868225098, "global_step": 126891, "epoch": 755} {"train_loss": -10.327836036682129, "global_step": 126892, "epoch": 755} {"train_loss": -9.87034797668457, "global_step": 126893, "epoch": 755} {"train_loss": -10.015872955322266, "global_step": 126894, "epoch": 755} {"train_loss": -10.390190124511719, "global_step": 126895, "epoch": 755} {"train_loss": -9.96624755859375, "global_step": 126896, "epoch": 755} {"train_loss": -10.284578323364258, "global_step": 126897, "epoch": 755} {"train_loss": -9.919149398803711, "global_step": 126898, "epoch": 755} {"train_loss": -10.251968383789062, "global_step": 126899, "epoch": 755} {"train_loss": -9.742059707641602, "global_step": 126900, "epoch": 755} {"train_loss": -10.362374305725098, "global_step": 126901, "epoch": 755} {"train_loss": -9.574502944946289, "global_step": 126902, "epoch": 755} {"train_loss": -10.046744346618652, "global_step": 126903, "epoch": 755} {"train_loss": -9.614765167236328, "global_step": 126904, "epoch": 755} {"train_loss": -9.963602066040039, "global_step": 126905, "epoch": 755} {"train_loss": -9.273399353027344, "global_step": 126906, "epoch": 755} {"train_loss": -9.899895668029785, "global_step": 126907, "epoch": 755} {"train_loss": -9.734094619750977, "global_step": 126908, "epoch": 755} {"train_loss": -10.371281623840332, "global_step": 126909, "epoch": 755} {"train_loss": -9.268365859985352, "global_step": 126910, "epoch": 755} {"train_loss": -10.197811126708984, "global_step": 126911, "epoch": 755} {"train_loss": -9.632865905761719, "global_step": 126912, "epoch": 755} {"train_loss": -10.25910758972168, "global_step": 126913, "epoch": 755} {"train_loss": -9.705146789550781, "global_step": 126914, "epoch": 755} {"train_loss": -10.01823902130127, "global_step": 126915, "epoch": 755} {"train_loss": -9.761371612548828, "global_step": 126916, "epoch": 755} {"train_loss": -10.380552291870117, "global_step": 126917, "epoch": 755} {"train_loss": -9.959285736083984, "global_step": 126918, "epoch": 755} {"train_loss": -10.292566299438477, "global_step": 126919, "epoch": 755} {"train_loss": -10.284488677978516, "global_step": 126920, "epoch": 755} {"train_loss": -10.084909439086914, "global_step": 126921, "epoch": 755} {"train_loss": -10.296842575073242, "global_step": 126922, "epoch": 755} {"train_loss": -10.12248420715332, "global_step": 126923, "epoch": 755} {"train_loss": -10.32390308380127, "global_step": 126924, "epoch": 755} {"train_loss": -9.972537994384766, "global_step": 126925, "epoch": 755} {"train_loss": -10.228842735290527, "global_step": 126926, "epoch": 755} {"train_loss": -10.10909366607666, "global_step": 126927, "epoch": 755} {"train_loss": -10.201730728149414, "global_step": 126928, "epoch": 755} {"train_loss": -10.235730171203613, "global_step": 126929, "epoch": 755} {"train_loss": -10.253618240356445, "global_step": 126930, "epoch": 755} {"train_loss": -10.218571662902832, "global_step": 126931, "epoch": 755} {"train_loss": -10.120702743530273, "global_step": 126932, "epoch": 755} {"train_loss": -10.246768951416016, "global_step": 126933, "epoch": 755} {"train_loss": -10.307058334350586, "global_step": 126934, "epoch": 755} {"train_loss": -10.4944486618042, "global_step": 126935, "epoch": 755} {"train_loss": -10.254899978637695, "global_step": 126936, "epoch": 755} {"train_loss": -10.580747604370117, "global_step": 126937, "epoch": 755} {"train_loss": -10.17156982421875, "global_step": 126938, "epoch": 755} {"train_loss": -10.493276596069336, "global_step": 126939, "epoch": 755} {"train_loss": -10.475238800048828, "global_step": 126940, "epoch": 755} {"train_loss": -10.446430206298828, "global_step": 126941, "epoch": 755} {"train_loss": -10.239938735961914, "global_step": 126942, "epoch": 755} {"train_loss": -10.561262130737305, "global_step": 126943, "epoch": 755} {"train_loss": -10.305061340332031, "global_step": 126944, "epoch": 755} {"train_loss": -10.63431167602539, "global_step": 126945, "epoch": 755} {"train_loss": -10.287094116210938, "global_step": 126946, "epoch": 755} {"train_loss": -10.33138656616211, "global_step": 126947, "epoch": 755} {"train_loss": -10.556864738464355, "global_step": 126948, "epoch": 755} {"train_loss": -9.838092803955078, "global_step": 126949, "epoch": 755} {"train_loss": -10.124138832092285, "global_step": 126950, "epoch": 755} {"train_loss": -9.850759506225586, "global_step": 126951, "epoch": 755} {"train_loss": -9.95225715637207, "global_step": 126952, "epoch": 755} {"train_loss": -10.178348541259766, "global_step": 126953, "epoch": 755} {"train_loss": -10.053096771240234, "global_step": 126954, "epoch": 755} {"train_loss": -10.527381896972656, "global_step": 126955, "epoch": 755} {"train_loss": -9.173713684082031, "global_step": 126956, "epoch": 755} {"train_loss": -10.594608306884766, "global_step": 126957, "epoch": 755} {"train_loss": -10.135168075561523, "global_step": 126958, "epoch": 755} {"train_loss": -9.790336608886719, "global_step": 126959, "epoch": 755} {"train_loss": -10.414397239685059, "global_step": 126960, "epoch": 755} {"train_loss": -10.073140144348145, "global_step": 126961, "epoch": 755} {"train_loss": -10.18224048614502, "global_step": 126962, "epoch": 755} {"train_loss": -10.319480895996094, "global_step": 126963, "epoch": 755} {"train_loss": -10.16422176361084, "global_step": 126964, "epoch": 755} {"train_loss": -10.290670394897461, "global_step": 126965, "epoch": 755} {"train_loss": -10.102269172668457, "global_step": 126966, "epoch": 755} {"train_loss": -10.194108963012695, "global_step": 126967, "epoch": 755} {"train_loss": -10.350951194763184, "global_step": 126968, "epoch": 755} {"train_loss": -10.422195434570312, "global_step": 126969, "epoch": 755} {"train_loss": -10.28546142578125, "global_step": 126970, "epoch": 755} {"train_loss": -10.132407188415527, "global_step": 126971, "epoch": 755} {"train_loss": -10.33935546875, "global_step": 126972, "epoch": 755} {"train_loss": -10.440735816955566, "global_step": 126973, "epoch": 755} {"train_loss": -10.334330558776855, "global_step": 126974, "epoch": 755} {"train_loss": -10.214214324951172, "global_step": 126975, "epoch": 755} {"train_loss": -10.298303604125977, "global_step": 126976, "epoch": 755} {"train_loss": -10.109687805175781, "global_step": 126977, "epoch": 755} {"train_loss": -10.334195137023926, "global_step": 126978, "epoch": 755} {"train_loss": -9.984481811523438, "global_step": 126979, "epoch": 755} {"train_loss": -10.520956039428711, "global_step": 126980, "epoch": 755} {"train_loss": -9.784235000610352, "global_step": 126981, "epoch": 755} {"train_loss": -10.455375671386719, "global_step": 126982, "epoch": 755} {"train_loss": -10.439958572387695, "global_step": 126983, "epoch": 755} {"train_loss": -10.247522354125977, "global_step": 126984, "epoch": 755} {"train_loss": -10.418892860412598, "global_step": 126985, "epoch": 755} {"train_loss": -10.262890815734863, "global_step": 126986, "epoch": 755} {"train_loss": -10.47339153289795, "global_step": 126987, "epoch": 755} {"train_loss": -10.518939018249512, "global_step": 126988, "epoch": 755} {"train_loss": -10.434322357177734, "global_step": 126989, "epoch": 755} {"train_loss": -10.080446243286133, "global_step": 126990, "epoch": 755} {"train_loss": -10.192002296447754, "global_step": 126991, "epoch": 755} {"train_loss": -10.436830520629883, "global_step": 126992, "epoch": 755} {"train_loss": -10.001838684082031, "global_step": 126993, "epoch": 755} {"train_loss": -10.218070983886719, "global_step": 126994, "epoch": 755} {"train_loss": -9.82996940612793, "global_step": 126995, "epoch": 755} {"train_loss": -10.36622428894043, "global_step": 126996, "epoch": 755} {"train_loss": -9.780557632446289, "global_step": 126997, "epoch": 755} {"train_loss": -10.51517105102539, "global_step": 126998, "epoch": 755} {"train_loss": -9.529821395874023, "global_step": 126999, "epoch": 755} {"train_loss": -10.437232971191406, "global_step": 127000, "epoch": 755} {"train_loss": -10.380565643310547, "global_step": 127001, "epoch": 755} {"train_loss": -10.243056297302246, "global_step": 127002, "epoch": 755} {"train_loss": -10.447100639343262, "global_step": 127003, "epoch": 755} {"train_loss": -10.49266529083252, "global_step": 127004, "epoch": 755} {"train_loss": -10.364059448242188, "global_step": 127005, "epoch": 755} {"train_loss": -10.381852149963379, "global_step": 127006, "epoch": 755} {"train_loss": -10.1858845608575, "global_step": 127007, "epoch": 755, "val_loss": 218329.59375, "train_action_mse_error": 2.189704418182373} {"train_loss": -10.337885856628418, "global_step": 127008, "epoch": 756} {"train_loss": -10.55337142944336, "global_step": 127009, "epoch": 756} {"train_loss": -10.462820053100586, "global_step": 127010, "epoch": 756} {"train_loss": -10.353915214538574, "global_step": 127011, "epoch": 756} {"train_loss": -10.306158065795898, "global_step": 127012, "epoch": 756} {"train_loss": -10.424802780151367, "global_step": 127013, "epoch": 756} {"train_loss": -10.393208503723145, "global_step": 127014, "epoch": 756} {"train_loss": -10.168275833129883, "global_step": 127015, "epoch": 756} {"train_loss": -10.187870025634766, "global_step": 127016, "epoch": 756} {"train_loss": -10.072318077087402, "global_step": 127017, "epoch": 756} {"train_loss": -10.009737014770508, "global_step": 127018, "epoch": 756} {"train_loss": -10.379819869995117, "global_step": 127019, "epoch": 756} {"train_loss": -10.201648712158203, "global_step": 127020, "epoch": 756} {"train_loss": -10.114492416381836, "global_step": 127021, "epoch": 756} {"train_loss": -10.265192031860352, "global_step": 127022, "epoch": 756} {"train_loss": -10.449235916137695, "global_step": 127023, "epoch": 756} {"train_loss": -9.877860069274902, "global_step": 127024, "epoch": 756} {"train_loss": -10.322912216186523, "global_step": 127025, "epoch": 756} {"train_loss": -9.958555221557617, "global_step": 127026, "epoch": 756} {"train_loss": -10.683558464050293, "global_step": 127027, "epoch": 756} {"train_loss": -10.400117874145508, "global_step": 127028, "epoch": 756} {"train_loss": -10.345800399780273, "global_step": 127029, "epoch": 756} {"train_loss": -10.409370422363281, "global_step": 127030, "epoch": 756} {"train_loss": -10.334948539733887, "global_step": 127031, "epoch": 756} {"train_loss": -10.475443840026855, "global_step": 127032, "epoch": 756} {"train_loss": -10.28676986694336, "global_step": 127033, "epoch": 756} {"train_loss": -10.583514213562012, "global_step": 127034, "epoch": 756} {"train_loss": -10.490777969360352, "global_step": 127035, "epoch": 756} {"train_loss": -10.41201400756836, "global_step": 127036, "epoch": 756} {"train_loss": -10.433414459228516, "global_step": 127037, "epoch": 756} {"train_loss": -9.959135055541992, "global_step": 127038, "epoch": 756} {"train_loss": -10.618866920471191, "global_step": 127039, "epoch": 756} {"train_loss": -10.175848960876465, "global_step": 127040, "epoch": 756} {"train_loss": -10.650969505310059, "global_step": 127041, "epoch": 756} {"train_loss": -10.318825721740723, "global_step": 127042, "epoch": 756} {"train_loss": -10.405553817749023, "global_step": 127043, "epoch": 756} {"train_loss": -10.425268173217773, "global_step": 127044, "epoch": 756} {"train_loss": -10.573005676269531, "global_step": 127045, "epoch": 756} {"train_loss": -10.27558708190918, "global_step": 127046, "epoch": 756} {"train_loss": -10.318924903869629, "global_step": 127047, "epoch": 756} {"train_loss": -10.281051635742188, "global_step": 127048, "epoch": 756} {"train_loss": -10.420363426208496, "global_step": 127049, "epoch": 756} {"train_loss": -10.157609939575195, "global_step": 127050, "epoch": 756} {"train_loss": -10.533197402954102, "global_step": 127051, "epoch": 756} {"train_loss": -10.29592227935791, "global_step": 127052, "epoch": 756} {"train_loss": -10.615111351013184, "global_step": 127053, "epoch": 756} {"train_loss": -10.34388542175293, "global_step": 127054, "epoch": 756} {"train_loss": -10.511787414550781, "global_step": 127055, "epoch": 756} {"train_loss": -10.466512680053711, "global_step": 127056, "epoch": 756} {"train_loss": -10.493330001831055, "global_step": 127057, "epoch": 756} {"train_loss": -10.772102355957031, "global_step": 127058, "epoch": 756} {"train_loss": -10.443540573120117, "global_step": 127059, "epoch": 756} {"train_loss": -10.333967208862305, "global_step": 127060, "epoch": 756} {"train_loss": -10.375986099243164, "global_step": 127061, "epoch": 756} {"train_loss": -10.053129196166992, "global_step": 127062, "epoch": 756} {"train_loss": -10.714326858520508, "global_step": 127063, "epoch": 756} {"train_loss": -9.298370361328125, "global_step": 127064, "epoch": 756} {"train_loss": -10.609047889709473, "global_step": 127065, "epoch": 756} {"train_loss": -9.753421783447266, "global_step": 127066, "epoch": 756} {"train_loss": -9.385871887207031, "global_step": 127067, "epoch": 756} {"train_loss": -10.516976356506348, "global_step": 127068, "epoch": 756} {"train_loss": -9.849417686462402, "global_step": 127069, "epoch": 756} {"train_loss": -9.853532791137695, "global_step": 127070, "epoch": 756} {"train_loss": -10.40699577331543, "global_step": 127071, "epoch": 756} {"train_loss": -9.900087356567383, "global_step": 127072, "epoch": 756} {"train_loss": -10.018401145935059, "global_step": 127073, "epoch": 756} {"train_loss": -10.25514030456543, "global_step": 127074, "epoch": 756} {"train_loss": -9.83062744140625, "global_step": 127075, "epoch": 756} {"train_loss": -10.617071151733398, "global_step": 127076, "epoch": 756} {"train_loss": -9.753189086914062, "global_step": 127077, "epoch": 756} {"train_loss": -10.401044845581055, "global_step": 127078, "epoch": 756} {"train_loss": -9.94153118133545, "global_step": 127079, "epoch": 756} {"train_loss": -10.245206832885742, "global_step": 127080, "epoch": 756} {"train_loss": -10.274757385253906, "global_step": 127081, "epoch": 756} {"train_loss": -10.146228790283203, "global_step": 127082, "epoch": 756} {"train_loss": -10.30453109741211, "global_step": 127083, "epoch": 756} {"train_loss": -9.886556625366211, "global_step": 127084, "epoch": 756} {"train_loss": -10.288286209106445, "global_step": 127085, "epoch": 756} {"train_loss": -10.020425796508789, "global_step": 127086, "epoch": 756} {"train_loss": -10.135482788085938, "global_step": 127087, "epoch": 756} {"train_loss": -10.204078674316406, "global_step": 127088, "epoch": 756} {"train_loss": -10.181862831115723, "global_step": 127089, "epoch": 756} {"train_loss": -10.123063087463379, "global_step": 127090, "epoch": 756} {"train_loss": -10.313959121704102, "global_step": 127091, "epoch": 756} {"train_loss": -10.106889724731445, "global_step": 127092, "epoch": 756} {"train_loss": -10.306436538696289, "global_step": 127093, "epoch": 756} {"train_loss": -10.176484107971191, "global_step": 127094, "epoch": 756} {"train_loss": -10.431096076965332, "global_step": 127095, "epoch": 756} {"train_loss": -9.830694198608398, "global_step": 127096, "epoch": 756} {"train_loss": -10.288925170898438, "global_step": 127097, "epoch": 756} {"train_loss": -9.889636039733887, "global_step": 127098, "epoch": 756} {"train_loss": -10.399410247802734, "global_step": 127099, "epoch": 756} {"train_loss": -9.936323165893555, "global_step": 127100, "epoch": 756} {"train_loss": -10.554362297058105, "global_step": 127101, "epoch": 756} {"train_loss": -9.966156005859375, "global_step": 127102, "epoch": 756} {"train_loss": -10.372503280639648, "global_step": 127103, "epoch": 756} {"train_loss": -10.406074523925781, "global_step": 127104, "epoch": 756} {"train_loss": -9.912521362304688, "global_step": 127105, "epoch": 756} {"train_loss": -10.303119659423828, "global_step": 127106, "epoch": 756} {"train_loss": -9.986116409301758, "global_step": 127107, "epoch": 756} {"train_loss": -10.302618026733398, "global_step": 127108, "epoch": 756} {"train_loss": -10.211200714111328, "global_step": 127109, "epoch": 756} {"train_loss": -9.938404083251953, "global_step": 127110, "epoch": 756} {"train_loss": -10.380817413330078, "global_step": 127111, "epoch": 756} {"train_loss": -10.152009963989258, "global_step": 127112, "epoch": 756} {"train_loss": -10.522845268249512, "global_step": 127113, "epoch": 756} {"train_loss": -10.198381423950195, "global_step": 127114, "epoch": 756} {"train_loss": -10.03127384185791, "global_step": 127115, "epoch": 756} {"train_loss": -10.211545944213867, "global_step": 127116, "epoch": 756} {"train_loss": -10.324919700622559, "global_step": 127117, "epoch": 756} {"train_loss": -10.240957260131836, "global_step": 127118, "epoch": 756} {"train_loss": -10.332347869873047, "global_step": 127119, "epoch": 756} {"train_loss": -9.93092155456543, "global_step": 127120, "epoch": 756} {"train_loss": -10.524026870727539, "global_step": 127121, "epoch": 756} {"train_loss": -10.487471580505371, "global_step": 127122, "epoch": 756} {"train_loss": -10.345657348632812, "global_step": 127123, "epoch": 756} {"train_loss": -10.417007446289062, "global_step": 127124, "epoch": 756} {"train_loss": -10.475807189941406, "global_step": 127125, "epoch": 756} {"train_loss": -10.452725410461426, "global_step": 127126, "epoch": 756} {"train_loss": -10.443414688110352, "global_step": 127127, "epoch": 756} {"train_loss": -10.39491081237793, "global_step": 127128, "epoch": 756} {"train_loss": -10.352571487426758, "global_step": 127129, "epoch": 756} {"train_loss": -10.475156784057617, "global_step": 127130, "epoch": 756} {"train_loss": -10.503493309020996, "global_step": 127131, "epoch": 756} {"train_loss": -10.2890625, "global_step": 127132, "epoch": 756} {"train_loss": -10.584392547607422, "global_step": 127133, "epoch": 756} {"train_loss": -10.41790771484375, "global_step": 127134, "epoch": 756} {"train_loss": -10.280789375305176, "global_step": 127135, "epoch": 756} {"train_loss": -10.539262771606445, "global_step": 127136, "epoch": 756} {"train_loss": -10.580558776855469, "global_step": 127137, "epoch": 756} {"train_loss": -10.60593032836914, "global_step": 127138, "epoch": 756} {"train_loss": -10.39799976348877, "global_step": 127139, "epoch": 756} {"train_loss": -10.418617248535156, "global_step": 127140, "epoch": 756} {"train_loss": -10.429170608520508, "global_step": 127141, "epoch": 756} {"train_loss": -10.331846237182617, "global_step": 127142, "epoch": 756} {"train_loss": -10.415876388549805, "global_step": 127143, "epoch": 756} {"train_loss": -9.513134002685547, "global_step": 127144, "epoch": 756} {"train_loss": -10.791807174682617, "global_step": 127145, "epoch": 756} {"train_loss": -10.612167358398438, "global_step": 127146, "epoch": 756} {"train_loss": -10.077022552490234, "global_step": 127147, "epoch": 756} {"train_loss": -10.555179595947266, "global_step": 127148, "epoch": 756} {"train_loss": -10.040487289428711, "global_step": 127149, "epoch": 756} {"train_loss": -10.361139297485352, "global_step": 127150, "epoch": 756} {"train_loss": -10.33418083190918, "global_step": 127151, "epoch": 756} {"train_loss": -10.358078002929688, "global_step": 127152, "epoch": 756} {"train_loss": -10.354692459106445, "global_step": 127153, "epoch": 756} {"train_loss": -10.53564167022705, "global_step": 127154, "epoch": 756} {"train_loss": -10.1314697265625, "global_step": 127155, "epoch": 756} {"train_loss": -10.18658447265625, "global_step": 127156, "epoch": 756} {"train_loss": -9.34125804901123, "global_step": 127157, "epoch": 756} {"train_loss": -10.167473793029785, "global_step": 127158, "epoch": 756} {"train_loss": -10.02676010131836, "global_step": 127159, "epoch": 756} {"train_loss": -9.64572525024414, "global_step": 127160, "epoch": 756} {"train_loss": -9.893289566040039, "global_step": 127161, "epoch": 756} {"train_loss": -9.729564666748047, "global_step": 127162, "epoch": 756} {"train_loss": -9.470366477966309, "global_step": 127163, "epoch": 756} {"train_loss": -9.398441314697266, "global_step": 127164, "epoch": 756} {"train_loss": -10.070585250854492, "global_step": 127165, "epoch": 756} {"train_loss": -9.495389938354492, "global_step": 127166, "epoch": 756} {"train_loss": -9.88477897644043, "global_step": 127167, "epoch": 756} {"train_loss": -9.265151977539062, "global_step": 127168, "epoch": 756} {"train_loss": -9.361906051635742, "global_step": 127169, "epoch": 756} {"train_loss": -8.950559616088867, "global_step": 127170, "epoch": 756} {"train_loss": -9.385383605957031, "global_step": 127171, "epoch": 756} {"train_loss": -9.873290061950684, "global_step": 127172, "epoch": 756} {"train_loss": -9.226292610168457, "global_step": 127173, "epoch": 756} {"train_loss": -10.04679012298584, "global_step": 127174, "epoch": 756} {"train_loss": -10.207813841956002, "global_step": 127175, "epoch": 756, "val_loss": 216655.8125} {"train_loss": -9.817765235900879, "global_step": 127176, "epoch": 757} {"train_loss": -9.392379760742188, "global_step": 127177, "epoch": 757} {"train_loss": -10.090032577514648, "global_step": 127178, "epoch": 757} {"train_loss": -9.342824935913086, "global_step": 127179, "epoch": 757} {"train_loss": -9.915878295898438, "global_step": 127180, "epoch": 757} {"train_loss": -9.916618347167969, "global_step": 127181, "epoch": 757} {"train_loss": -9.457258224487305, "global_step": 127182, "epoch": 757} {"train_loss": -10.12537956237793, "global_step": 127183, "epoch": 757} {"train_loss": -9.936508178710938, "global_step": 127184, "epoch": 757} {"train_loss": -9.86286449432373, "global_step": 127185, "epoch": 757} {"train_loss": -9.930257797241211, "global_step": 127186, "epoch": 757} {"train_loss": -9.543289184570312, "global_step": 127187, "epoch": 757} {"train_loss": -10.088729858398438, "global_step": 127188, "epoch": 757} {"train_loss": -9.899970054626465, "global_step": 127189, "epoch": 757} {"train_loss": -9.991211891174316, "global_step": 127190, "epoch": 757} {"train_loss": -10.107620239257812, "global_step": 127191, "epoch": 757} {"train_loss": -9.803842544555664, "global_step": 127192, "epoch": 757} {"train_loss": -10.252113342285156, "global_step": 127193, "epoch": 757} {"train_loss": -9.930885314941406, "global_step": 127194, "epoch": 757} {"train_loss": -10.144222259521484, "global_step": 127195, "epoch": 757} {"train_loss": -10.299764633178711, "global_step": 127196, "epoch": 757} {"train_loss": -9.919408798217773, "global_step": 127197, "epoch": 757} {"train_loss": -10.213834762573242, "global_step": 127198, "epoch": 757} {"train_loss": -10.283592224121094, "global_step": 127199, "epoch": 757} {"train_loss": -10.103561401367188, "global_step": 127200, "epoch": 757} {"train_loss": -10.314205169677734, "global_step": 127201, "epoch": 757} {"train_loss": -9.973943710327148, "global_step": 127202, "epoch": 757} {"train_loss": -10.242947578430176, "global_step": 127203, "epoch": 757} {"train_loss": -10.09897232055664, "global_step": 127204, "epoch": 757} {"train_loss": -10.340353965759277, "global_step": 127205, "epoch": 757} {"train_loss": -10.315092086791992, "global_step": 127206, "epoch": 757} {"train_loss": -10.286687850952148, "global_step": 127207, "epoch": 757} {"train_loss": -10.332006454467773, "global_step": 127208, "epoch": 757} {"train_loss": -10.415879249572754, "global_step": 127209, "epoch": 757} {"train_loss": -10.443181991577148, "global_step": 127210, "epoch": 757} {"train_loss": -10.450094223022461, "global_step": 127211, "epoch": 757} {"train_loss": -10.481060028076172, "global_step": 127212, "epoch": 757} {"train_loss": -10.664520263671875, "global_step": 127213, "epoch": 757} {"train_loss": -10.469285011291504, "global_step": 127214, "epoch": 757} {"train_loss": -10.547967910766602, "global_step": 127215, "epoch": 757} {"train_loss": -10.749424934387207, "global_step": 127216, "epoch": 757} {"train_loss": -10.442889213562012, "global_step": 127217, "epoch": 757} {"train_loss": -10.695331573486328, "global_step": 127218, "epoch": 757} {"train_loss": -10.2535400390625, "global_step": 127219, "epoch": 757} {"train_loss": -10.436237335205078, "global_step": 127220, "epoch": 757} {"train_loss": -10.532986640930176, "global_step": 127221, "epoch": 757} {"train_loss": -10.500962257385254, "global_step": 127222, "epoch": 757} {"train_loss": -10.596009254455566, "global_step": 127223, "epoch": 757} {"train_loss": -10.486047744750977, "global_step": 127224, "epoch": 757} {"train_loss": -10.614500999450684, "global_step": 127225, "epoch": 757} {"train_loss": -10.521379470825195, "global_step": 127226, "epoch": 757} {"train_loss": -10.139410018920898, "global_step": 127227, "epoch": 757} {"train_loss": -10.266523361206055, "global_step": 127228, "epoch": 757} {"train_loss": -10.441978454589844, "global_step": 127229, "epoch": 757} {"train_loss": -10.025599479675293, "global_step": 127230, "epoch": 757} {"train_loss": -10.426143646240234, "global_step": 127231, "epoch": 757} {"train_loss": -10.431148529052734, "global_step": 127232, "epoch": 757} {"train_loss": -10.460041999816895, "global_step": 127233, "epoch": 757} {"train_loss": -10.47032642364502, "global_step": 127234, "epoch": 757} {"train_loss": -10.104360580444336, "global_step": 127235, "epoch": 757} {"train_loss": -10.277213096618652, "global_step": 127236, "epoch": 757} {"train_loss": -10.59463882446289, "global_step": 127237, "epoch": 757} {"train_loss": -10.192024230957031, "global_step": 127238, "epoch": 757} {"train_loss": -10.6168851852417, "global_step": 127239, "epoch": 757} {"train_loss": -10.744047164916992, "global_step": 127240, "epoch": 757} {"train_loss": -10.594856262207031, "global_step": 127241, "epoch": 757} {"train_loss": -10.391369819641113, "global_step": 127242, "epoch": 757} {"train_loss": -10.66401481628418, "global_step": 127243, "epoch": 757} {"train_loss": -10.383865356445312, "global_step": 127244, "epoch": 757} {"train_loss": -10.483965873718262, "global_step": 127245, "epoch": 757} {"train_loss": -10.356289863586426, "global_step": 127246, "epoch": 757} {"train_loss": -10.20097541809082, "global_step": 127247, "epoch": 757} {"train_loss": -10.335031509399414, "global_step": 127248, "epoch": 757} {"train_loss": -10.37291145324707, "global_step": 127249, "epoch": 757} {"train_loss": -10.508737564086914, "global_step": 127250, "epoch": 757} {"train_loss": -10.339369773864746, "global_step": 127251, "epoch": 757} {"train_loss": -10.419214248657227, "global_step": 127252, "epoch": 757} {"train_loss": -10.321639060974121, "global_step": 127253, "epoch": 757} {"train_loss": -10.596356391906738, "global_step": 127254, "epoch": 757} {"train_loss": -10.17308235168457, "global_step": 127255, "epoch": 757} {"train_loss": -10.399433135986328, "global_step": 127256, "epoch": 757} {"train_loss": -10.451533317565918, "global_step": 127257, "epoch": 757} {"train_loss": -10.355241775512695, "global_step": 127258, "epoch": 757} {"train_loss": -9.907320022583008, "global_step": 127259, "epoch": 757} {"train_loss": -9.880693435668945, "global_step": 127260, "epoch": 757} {"train_loss": -10.009387016296387, "global_step": 127261, "epoch": 757} {"train_loss": -9.927999496459961, "global_step": 127262, "epoch": 757} {"train_loss": -9.930305480957031, "global_step": 127263, "epoch": 757} {"train_loss": -10.129646301269531, "global_step": 127264, "epoch": 757} {"train_loss": -10.152063369750977, "global_step": 127265, "epoch": 757} {"train_loss": -9.992780685424805, "global_step": 127266, "epoch": 757} {"train_loss": -10.158340454101562, "global_step": 127267, "epoch": 757} {"train_loss": -10.171566009521484, "global_step": 127268, "epoch": 757} {"train_loss": -9.877912521362305, "global_step": 127269, "epoch": 757} {"train_loss": -10.16867446899414, "global_step": 127270, "epoch": 757} {"train_loss": -9.741903305053711, "global_step": 127271, "epoch": 757} {"train_loss": -9.777074813842773, "global_step": 127272, "epoch": 757} {"train_loss": -10.149352073669434, "global_step": 127273, "epoch": 757} {"train_loss": -10.001127243041992, "global_step": 127274, "epoch": 757} {"train_loss": -10.142864227294922, "global_step": 127275, "epoch": 757} {"train_loss": -10.132469177246094, "global_step": 127276, "epoch": 757} {"train_loss": -10.13154411315918, "global_step": 127277, "epoch": 757} {"train_loss": -9.747233390808105, "global_step": 127278, "epoch": 757} {"train_loss": -10.166601181030273, "global_step": 127279, "epoch": 757} {"train_loss": -9.512749671936035, "global_step": 127280, "epoch": 757} {"train_loss": -10.000541687011719, "global_step": 127281, "epoch": 757} {"train_loss": -9.818382263183594, "global_step": 127282, "epoch": 757} {"train_loss": -9.988551139831543, "global_step": 127283, "epoch": 757} {"train_loss": -9.917488098144531, "global_step": 127284, "epoch": 757} {"train_loss": -10.149093627929688, "global_step": 127285, "epoch": 757} {"train_loss": -9.888927459716797, "global_step": 127286, "epoch": 757} {"train_loss": -10.059659957885742, "global_step": 127287, "epoch": 757} {"train_loss": -9.6361722946167, "global_step": 127288, "epoch": 757} {"train_loss": -10.209710121154785, "global_step": 127289, "epoch": 757} {"train_loss": -9.981740951538086, "global_step": 127290, "epoch": 757} {"train_loss": -10.116860389709473, "global_step": 127291, "epoch": 757} {"train_loss": -9.912822723388672, "global_step": 127292, "epoch": 757} {"train_loss": -10.25922966003418, "global_step": 127293, "epoch": 757} {"train_loss": -9.928529739379883, "global_step": 127294, "epoch": 757} {"train_loss": -10.196130752563477, "global_step": 127295, "epoch": 757} {"train_loss": -10.101064682006836, "global_step": 127296, "epoch": 757} {"train_loss": -10.127906799316406, "global_step": 127297, "epoch": 757} {"train_loss": -10.40488052368164, "global_step": 127298, "epoch": 757} {"train_loss": -10.092111587524414, "global_step": 127299, "epoch": 757} {"train_loss": -10.238311767578125, "global_step": 127300, "epoch": 757} {"train_loss": -10.330398559570312, "global_step": 127301, "epoch": 757} {"train_loss": -10.315008163452148, "global_step": 127302, "epoch": 757} {"train_loss": -10.264558792114258, "global_step": 127303, "epoch": 757} {"train_loss": -10.39401912689209, "global_step": 127304, "epoch": 757} {"train_loss": -10.178970336914062, "global_step": 127305, "epoch": 757} {"train_loss": -10.29322624206543, "global_step": 127306, "epoch": 757} {"train_loss": -10.040705680847168, "global_step": 127307, "epoch": 757} {"train_loss": -10.198723793029785, "global_step": 127308, "epoch": 757} {"train_loss": -10.372066497802734, "global_step": 127309, "epoch": 757} {"train_loss": -10.242578506469727, "global_step": 127310, "epoch": 757} {"train_loss": -10.35489273071289, "global_step": 127311, "epoch": 757} {"train_loss": -10.574915885925293, "global_step": 127312, "epoch": 757} {"train_loss": -10.64242935180664, "global_step": 127313, "epoch": 757} {"train_loss": -10.72437858581543, "global_step": 127314, "epoch": 757} {"train_loss": -10.366246223449707, "global_step": 127315, "epoch": 757} {"train_loss": -10.355382919311523, "global_step": 127316, "epoch": 757} {"train_loss": -10.489396095275879, "global_step": 127317, "epoch": 757} {"train_loss": -10.279759407043457, "global_step": 127318, "epoch": 757} {"train_loss": -10.432830810546875, "global_step": 127319, "epoch": 757} {"train_loss": -10.385936737060547, "global_step": 127320, "epoch": 757} {"train_loss": -10.56146240234375, "global_step": 127321, "epoch": 757} {"train_loss": -10.295031547546387, "global_step": 127322, "epoch": 757} {"train_loss": -10.511945724487305, "global_step": 127323, "epoch": 757} {"train_loss": -10.017751693725586, "global_step": 127324, "epoch": 757} {"train_loss": -10.15926456451416, "global_step": 127325, "epoch": 757} {"train_loss": -10.49138069152832, "global_step": 127326, "epoch": 757} {"train_loss": -10.330933570861816, "global_step": 127327, "epoch": 757} {"train_loss": -10.456232070922852, "global_step": 127328, "epoch": 757} {"train_loss": -10.345430374145508, "global_step": 127329, "epoch": 757} {"train_loss": -10.360048294067383, "global_step": 127330, "epoch": 757} {"train_loss": -10.553327560424805, "global_step": 127331, "epoch": 757} {"train_loss": -10.445974349975586, "global_step": 127332, "epoch": 757} {"train_loss": -10.567342758178711, "global_step": 127333, "epoch": 757} {"train_loss": -10.536439895629883, "global_step": 127334, "epoch": 757} {"train_loss": -10.691813468933105, "global_step": 127335, "epoch": 757} {"train_loss": -10.351764678955078, "global_step": 127336, "epoch": 757} {"train_loss": -10.731277465820312, "global_step": 127337, "epoch": 757} {"train_loss": -10.637810707092285, "global_step": 127338, "epoch": 757} {"train_loss": -10.740303993225098, "global_step": 127339, "epoch": 757} {"train_loss": -10.466440200805664, "global_step": 127340, "epoch": 757} {"train_loss": -10.64366340637207, "global_step": 127341, "epoch": 757} {"train_loss": -10.594959259033203, "global_step": 127342, "epoch": 757} {"train_loss": -10.246017149516515, "global_step": 127343, "epoch": 757, "val_loss": 217580.734375} {"train_loss": -10.493867874145508, "global_step": 127344, "epoch": 758} {"train_loss": -10.58694076538086, "global_step": 127345, "epoch": 758} {"train_loss": -10.432060241699219, "global_step": 127346, "epoch": 758} {"train_loss": -10.678086280822754, "global_step": 127347, "epoch": 758} {"train_loss": -10.348445892333984, "global_step": 127348, "epoch": 758} {"train_loss": -10.801782608032227, "global_step": 127349, "epoch": 758} {"train_loss": -10.388697624206543, "global_step": 127350, "epoch": 758} {"train_loss": -10.332876205444336, "global_step": 127351, "epoch": 758} {"train_loss": -10.426532745361328, "global_step": 127352, "epoch": 758} {"train_loss": -9.944615364074707, "global_step": 127353, "epoch": 758} {"train_loss": -10.25893497467041, "global_step": 127354, "epoch": 758} {"train_loss": -10.227448463439941, "global_step": 127355, "epoch": 758} {"train_loss": -9.734949111938477, "global_step": 127356, "epoch": 758} {"train_loss": -9.77393627166748, "global_step": 127357, "epoch": 758} {"train_loss": -9.740489959716797, "global_step": 127358, "epoch": 758} {"train_loss": -10.40306282043457, "global_step": 127359, "epoch": 758} {"train_loss": -9.78325080871582, "global_step": 127360, "epoch": 758} {"train_loss": -8.939870834350586, "global_step": 127361, "epoch": 758} {"train_loss": -9.342239379882812, "global_step": 127362, "epoch": 758} {"train_loss": -9.59683609008789, "global_step": 127363, "epoch": 758} {"train_loss": -8.884241104125977, "global_step": 127364, "epoch": 758} {"train_loss": -9.497394561767578, "global_step": 127365, "epoch": 758} {"train_loss": -9.691471099853516, "global_step": 127366, "epoch": 758} {"train_loss": -9.12936019897461, "global_step": 127367, "epoch": 758} {"train_loss": -10.210123062133789, "global_step": 127368, "epoch": 758} {"train_loss": -9.365937232971191, "global_step": 127369, "epoch": 758} {"train_loss": -9.783418655395508, "global_step": 127370, "epoch": 758} {"train_loss": -9.808420181274414, "global_step": 127371, "epoch": 758} {"train_loss": -9.711603164672852, "global_step": 127372, "epoch": 758} {"train_loss": -10.073755264282227, "global_step": 127373, "epoch": 758} {"train_loss": -10.038942337036133, "global_step": 127374, "epoch": 758} {"train_loss": -10.157011985778809, "global_step": 127375, "epoch": 758} {"train_loss": -9.970538139343262, "global_step": 127376, "epoch": 758} {"train_loss": -9.90487289428711, "global_step": 127377, "epoch": 758} {"train_loss": -10.264808654785156, "global_step": 127378, "epoch": 758} {"train_loss": -9.956208229064941, "global_step": 127379, "epoch": 758} {"train_loss": -9.941506385803223, "global_step": 127380, "epoch": 758} {"train_loss": -10.268689155578613, "global_step": 127381, "epoch": 758} {"train_loss": -10.017294883728027, "global_step": 127382, "epoch": 758} {"train_loss": -9.98635196685791, "global_step": 127383, "epoch": 758} {"train_loss": -10.176860809326172, "global_step": 127384, "epoch": 758} {"train_loss": -10.110431671142578, "global_step": 127385, "epoch": 758} {"train_loss": -10.162981033325195, "global_step": 127386, "epoch": 758} {"train_loss": -10.148582458496094, "global_step": 127387, "epoch": 758} {"train_loss": -9.971969604492188, "global_step": 127388, "epoch": 758} {"train_loss": -10.205052375793457, "global_step": 127389, "epoch": 758} {"train_loss": -10.173898696899414, "global_step": 127390, "epoch": 758} {"train_loss": -10.209507942199707, "global_step": 127391, "epoch": 758} {"train_loss": -10.210264205932617, "global_step": 127392, "epoch": 758} {"train_loss": -10.144390106201172, "global_step": 127393, "epoch": 758} {"train_loss": -10.251214027404785, "global_step": 127394, "epoch": 758} {"train_loss": -10.23062515258789, "global_step": 127395, "epoch": 758} {"train_loss": -10.175461769104004, "global_step": 127396, "epoch": 758} {"train_loss": -10.314064025878906, "global_step": 127397, "epoch": 758} {"train_loss": -10.305913925170898, "global_step": 127398, "epoch": 758} {"train_loss": -10.306334495544434, "global_step": 127399, "epoch": 758} {"train_loss": -10.31755256652832, "global_step": 127400, "epoch": 758} {"train_loss": -10.530599594116211, "global_step": 127401, "epoch": 758} {"train_loss": -10.463186264038086, "global_step": 127402, "epoch": 758} {"train_loss": -10.318330764770508, "global_step": 127403, "epoch": 758} {"train_loss": -10.599468231201172, "global_step": 127404, "epoch": 758} {"train_loss": -10.212159156799316, "global_step": 127405, "epoch": 758} {"train_loss": -10.215045928955078, "global_step": 127406, "epoch": 758} {"train_loss": -10.485417366027832, "global_step": 127407, "epoch": 758} {"train_loss": -10.531285285949707, "global_step": 127408, "epoch": 758} {"train_loss": -10.272499084472656, "global_step": 127409, "epoch": 758} {"train_loss": -10.481263160705566, "global_step": 127410, "epoch": 758} {"train_loss": -10.026597023010254, "global_step": 127411, "epoch": 758} {"train_loss": -10.517971992492676, "global_step": 127412, "epoch": 758} {"train_loss": -10.220766067504883, "global_step": 127413, "epoch": 758} {"train_loss": -10.182348251342773, "global_step": 127414, "epoch": 758} {"train_loss": -10.595418930053711, "global_step": 127415, "epoch": 758} {"train_loss": -10.515358924865723, "global_step": 127416, "epoch": 758} {"train_loss": -10.375261306762695, "global_step": 127417, "epoch": 758} {"train_loss": -10.447957992553711, "global_step": 127418, "epoch": 758} {"train_loss": -9.91683292388916, "global_step": 127419, "epoch": 758} {"train_loss": -10.375539779663086, "global_step": 127420, "epoch": 758} {"train_loss": -10.41649341583252, "global_step": 127421, "epoch": 758} {"train_loss": -10.58144760131836, "global_step": 127422, "epoch": 758} {"train_loss": -9.937555313110352, "global_step": 127423, "epoch": 758} {"train_loss": -10.21509075164795, "global_step": 127424, "epoch": 758} {"train_loss": -10.194598197937012, "global_step": 127425, "epoch": 758} {"train_loss": -10.300046920776367, "global_step": 127426, "epoch": 758} {"train_loss": -10.118746757507324, "global_step": 127427, "epoch": 758} {"train_loss": -10.472859382629395, "global_step": 127428, "epoch": 758} {"train_loss": -10.158981323242188, "global_step": 127429, "epoch": 758} {"train_loss": -10.589508056640625, "global_step": 127430, "epoch": 758} {"train_loss": -9.821599960327148, "global_step": 127431, "epoch": 758} {"train_loss": -10.494123458862305, "global_step": 127432, "epoch": 758} {"train_loss": -10.431377410888672, "global_step": 127433, "epoch": 758} {"train_loss": -9.982065200805664, "global_step": 127434, "epoch": 758} {"train_loss": -10.403802871704102, "global_step": 127435, "epoch": 758} {"train_loss": -10.128938674926758, "global_step": 127436, "epoch": 758} {"train_loss": -10.40959358215332, "global_step": 127437, "epoch": 758} {"train_loss": -10.096874237060547, "global_step": 127438, "epoch": 758} {"train_loss": -10.22624683380127, "global_step": 127439, "epoch": 758} {"train_loss": -9.987793922424316, "global_step": 127440, "epoch": 758} {"train_loss": -10.266409873962402, "global_step": 127441, "epoch": 758} {"train_loss": -10.295539855957031, "global_step": 127442, "epoch": 758} {"train_loss": -10.37728214263916, "global_step": 127443, "epoch": 758} {"train_loss": -10.085672378540039, "global_step": 127444, "epoch": 758} {"train_loss": -10.610723495483398, "global_step": 127445, "epoch": 758} {"train_loss": -10.267110824584961, "global_step": 127446, "epoch": 758} {"train_loss": -10.419947624206543, "global_step": 127447, "epoch": 758} {"train_loss": -10.273947715759277, "global_step": 127448, "epoch": 758} {"train_loss": -10.524513244628906, "global_step": 127449, "epoch": 758} {"train_loss": -10.502065658569336, "global_step": 127450, "epoch": 758} {"train_loss": -10.72140884399414, "global_step": 127451, "epoch": 758} {"train_loss": -10.71186637878418, "global_step": 127452, "epoch": 758} {"train_loss": -10.502299308776855, "global_step": 127453, "epoch": 758} {"train_loss": -10.656143188476562, "global_step": 127454, "epoch": 758} {"train_loss": -10.603012084960938, "global_step": 127455, "epoch": 758} {"train_loss": -10.685647964477539, "global_step": 127456, "epoch": 758} {"train_loss": -9.865612030029297, "global_step": 127457, "epoch": 758} {"train_loss": -10.60952377319336, "global_step": 127458, "epoch": 758} {"train_loss": -10.320680618286133, "global_step": 127459, "epoch": 758} {"train_loss": -10.550460815429688, "global_step": 127460, "epoch": 758} {"train_loss": -9.9440279006958, "global_step": 127461, "epoch": 758} {"train_loss": -10.406856536865234, "global_step": 127462, "epoch": 758} {"train_loss": -10.005314826965332, "global_step": 127463, "epoch": 758} {"train_loss": -10.420336723327637, "global_step": 127464, "epoch": 758} {"train_loss": -10.148382186889648, "global_step": 127465, "epoch": 758} {"train_loss": -10.254690170288086, "global_step": 127466, "epoch": 758} {"train_loss": -10.489609718322754, "global_step": 127467, "epoch": 758} {"train_loss": -10.127321243286133, "global_step": 127468, "epoch": 758} {"train_loss": -10.103635787963867, "global_step": 127469, "epoch": 758} {"train_loss": -10.529420852661133, "global_step": 127470, "epoch": 758} {"train_loss": -10.32054328918457, "global_step": 127471, "epoch": 758} {"train_loss": -10.423356056213379, "global_step": 127472, "epoch": 758} {"train_loss": -10.40678596496582, "global_step": 127473, "epoch": 758} {"train_loss": -10.192251205444336, "global_step": 127474, "epoch": 758} {"train_loss": -10.540807723999023, "global_step": 127475, "epoch": 758} {"train_loss": -10.150718688964844, "global_step": 127476, "epoch": 758} {"train_loss": -10.137210845947266, "global_step": 127477, "epoch": 758} {"train_loss": -10.184247970581055, "global_step": 127478, "epoch": 758} {"train_loss": -10.038604736328125, "global_step": 127479, "epoch": 758} {"train_loss": -10.565692901611328, "global_step": 127480, "epoch": 758} {"train_loss": -10.299057960510254, "global_step": 127481, "epoch": 758} {"train_loss": -10.263422966003418, "global_step": 127482, "epoch": 758} {"train_loss": -10.417375564575195, "global_step": 127483, "epoch": 758} {"train_loss": -10.014200210571289, "global_step": 127484, "epoch": 758} {"train_loss": -10.382257461547852, "global_step": 127485, "epoch": 758} {"train_loss": -9.857040405273438, "global_step": 127486, "epoch": 758} {"train_loss": -10.393701553344727, "global_step": 127487, "epoch": 758} {"train_loss": -10.159317970275879, "global_step": 127488, "epoch": 758} {"train_loss": -9.740028381347656, "global_step": 127489, "epoch": 758} {"train_loss": -10.6025390625, "global_step": 127490, "epoch": 758} {"train_loss": -10.408069610595703, "global_step": 127491, "epoch": 758} {"train_loss": -10.091434478759766, "global_step": 127492, "epoch": 758} {"train_loss": -10.455161094665527, "global_step": 127493, "epoch": 758} {"train_loss": -9.99424934387207, "global_step": 127494, "epoch": 758} {"train_loss": -10.006983757019043, "global_step": 127495, "epoch": 758} {"train_loss": -10.183704376220703, "global_step": 127496, "epoch": 758} {"train_loss": -9.944076538085938, "global_step": 127497, "epoch": 758} {"train_loss": -10.323856353759766, "global_step": 127498, "epoch": 758} {"train_loss": -10.042135238647461, "global_step": 127499, "epoch": 758} {"train_loss": -10.060033798217773, "global_step": 127500, "epoch": 758} {"train_loss": -10.265542984008789, "global_step": 127501, "epoch": 758} {"train_loss": -10.080405235290527, "global_step": 127502, "epoch": 758} {"train_loss": -10.444011688232422, "global_step": 127503, "epoch": 758} {"train_loss": -10.139628410339355, "global_step": 127504, "epoch": 758} {"train_loss": -10.256446838378906, "global_step": 127505, "epoch": 758} {"train_loss": -10.026198387145996, "global_step": 127506, "epoch": 758} {"train_loss": -10.128665924072266, "global_step": 127507, "epoch": 758} {"train_loss": -9.913847923278809, "global_step": 127508, "epoch": 758} {"train_loss": -10.2584228515625, "global_step": 127509, "epoch": 758} {"train_loss": -10.413609504699707, "global_step": 127510, "epoch": 758} {"train_loss": -10.20687434786842, "global_step": 127511, "epoch": 758, "val_loss": 219924.078125} {"train_loss": -10.174015998840332, "global_step": 127512, "epoch": 759} {"train_loss": -10.328458786010742, "global_step": 127513, "epoch": 759} {"train_loss": -9.720279693603516, "global_step": 127514, "epoch": 759} {"train_loss": -10.301275253295898, "global_step": 127515, "epoch": 759} {"train_loss": -10.297624588012695, "global_step": 127516, "epoch": 759} {"train_loss": -10.186790466308594, "global_step": 127517, "epoch": 759} {"train_loss": -10.191497802734375, "global_step": 127518, "epoch": 759} {"train_loss": -9.900652885437012, "global_step": 127519, "epoch": 759} {"train_loss": -10.382668495178223, "global_step": 127520, "epoch": 759} {"train_loss": -10.073058128356934, "global_step": 127521, "epoch": 759} {"train_loss": -10.351667404174805, "global_step": 127522, "epoch": 759} {"train_loss": -10.05398941040039, "global_step": 127523, "epoch": 759} {"train_loss": -10.093191146850586, "global_step": 127524, "epoch": 759} {"train_loss": -9.772855758666992, "global_step": 127525, "epoch": 759} {"train_loss": -10.319164276123047, "global_step": 127526, "epoch": 759} {"train_loss": -9.899673461914062, "global_step": 127527, "epoch": 759} {"train_loss": -10.366031646728516, "global_step": 127528, "epoch": 759} {"train_loss": -10.089463233947754, "global_step": 127529, "epoch": 759} {"train_loss": -9.557062149047852, "global_step": 127530, "epoch": 759} {"train_loss": -10.033004760742188, "global_step": 127531, "epoch": 759} {"train_loss": -9.972274780273438, "global_step": 127532, "epoch": 759} {"train_loss": -9.458581924438477, "global_step": 127533, "epoch": 759} {"train_loss": -10.23492431640625, "global_step": 127534, "epoch": 759} {"train_loss": -9.924031257629395, "global_step": 127535, "epoch": 759} {"train_loss": -9.619888305664062, "global_step": 127536, "epoch": 759} {"train_loss": -10.063047409057617, "global_step": 127537, "epoch": 759} {"train_loss": -10.204826354980469, "global_step": 127538, "epoch": 759} {"train_loss": -9.94625186920166, "global_step": 127539, "epoch": 759} {"train_loss": -10.131004333496094, "global_step": 127540, "epoch": 759} {"train_loss": -10.122491836547852, "global_step": 127541, "epoch": 759} {"train_loss": -10.093347549438477, "global_step": 127542, "epoch": 759} {"train_loss": -9.86125373840332, "global_step": 127543, "epoch": 759} {"train_loss": -10.334197998046875, "global_step": 127544, "epoch": 759} {"train_loss": -10.204996109008789, "global_step": 127545, "epoch": 759} {"train_loss": -10.265530586242676, "global_step": 127546, "epoch": 759} {"train_loss": -10.179292678833008, "global_step": 127547, "epoch": 759} {"train_loss": -10.23953914642334, "global_step": 127548, "epoch": 759} {"train_loss": -10.31309700012207, "global_step": 127549, "epoch": 759} {"train_loss": -10.296022415161133, "global_step": 127550, "epoch": 759} {"train_loss": -10.223736763000488, "global_step": 127551, "epoch": 759} {"train_loss": -10.301070213317871, "global_step": 127552, "epoch": 759} {"train_loss": -10.126412391662598, "global_step": 127553, "epoch": 759} {"train_loss": -10.120210647583008, "global_step": 127554, "epoch": 759} {"train_loss": -10.073387145996094, "global_step": 127555, "epoch": 759} {"train_loss": -10.247617721557617, "global_step": 127556, "epoch": 759} {"train_loss": -10.262136459350586, "global_step": 127557, "epoch": 759} {"train_loss": -9.8199462890625, "global_step": 127558, "epoch": 759} {"train_loss": -10.461372375488281, "global_step": 127559, "epoch": 759} {"train_loss": -10.197428703308105, "global_step": 127560, "epoch": 759} {"train_loss": -10.153053283691406, "global_step": 127561, "epoch": 759} {"train_loss": -10.087959289550781, "global_step": 127562, "epoch": 759} {"train_loss": -10.255678176879883, "global_step": 127563, "epoch": 759} {"train_loss": -10.327396392822266, "global_step": 127564, "epoch": 759} {"train_loss": -10.121997833251953, "global_step": 127565, "epoch": 759} {"train_loss": -10.424659729003906, "global_step": 127566, "epoch": 759} {"train_loss": -10.254964828491211, "global_step": 127567, "epoch": 759} {"train_loss": -10.319328308105469, "global_step": 127568, "epoch": 759} {"train_loss": -10.307363510131836, "global_step": 127569, "epoch": 759} {"train_loss": -10.327142715454102, "global_step": 127570, "epoch": 759} {"train_loss": -10.131531715393066, "global_step": 127571, "epoch": 759} {"train_loss": -10.135648727416992, "global_step": 127572, "epoch": 759} {"train_loss": -10.317269325256348, "global_step": 127573, "epoch": 759} {"train_loss": -10.391260147094727, "global_step": 127574, "epoch": 759} {"train_loss": -10.115476608276367, "global_step": 127575, "epoch": 759} {"train_loss": -10.195381164550781, "global_step": 127576, "epoch": 759} {"train_loss": -10.583221435546875, "global_step": 127577, "epoch": 759} {"train_loss": -10.27373218536377, "global_step": 127578, "epoch": 759} {"train_loss": -10.29912281036377, "global_step": 127579, "epoch": 759} {"train_loss": -9.48969841003418, "global_step": 127580, "epoch": 759} {"train_loss": -10.132457733154297, "global_step": 127581, "epoch": 759} {"train_loss": -9.618463516235352, "global_step": 127582, "epoch": 759} {"train_loss": -10.219382286071777, "global_step": 127583, "epoch": 759} {"train_loss": -9.643628120422363, "global_step": 127584, "epoch": 759} {"train_loss": -9.543907165527344, "global_step": 127585, "epoch": 759} {"train_loss": -9.733152389526367, "global_step": 127586, "epoch": 759} {"train_loss": -9.339008331298828, "global_step": 127587, "epoch": 759} {"train_loss": -9.983755111694336, "global_step": 127588, "epoch": 759} {"train_loss": -9.845222473144531, "global_step": 127589, "epoch": 759} {"train_loss": -9.684000015258789, "global_step": 127590, "epoch": 759} {"train_loss": -10.03250503540039, "global_step": 127591, "epoch": 759} {"train_loss": -10.087297439575195, "global_step": 127592, "epoch": 759} {"train_loss": -10.122333526611328, "global_step": 127593, "epoch": 759} {"train_loss": -10.439186096191406, "global_step": 127594, "epoch": 759} {"train_loss": -10.195793151855469, "global_step": 127595, "epoch": 759} {"train_loss": -10.020217895507812, "global_step": 127596, "epoch": 759} {"train_loss": -10.444826126098633, "global_step": 127597, "epoch": 759} {"train_loss": -10.416862487792969, "global_step": 127598, "epoch": 759} {"train_loss": -10.247941970825195, "global_step": 127599, "epoch": 759} {"train_loss": -9.97758674621582, "global_step": 127600, "epoch": 759} {"train_loss": -10.105177879333496, "global_step": 127601, "epoch": 759} {"train_loss": -10.35540771484375, "global_step": 127602, "epoch": 759} {"train_loss": -10.113327026367188, "global_step": 127603, "epoch": 759} {"train_loss": -10.16349983215332, "global_step": 127604, "epoch": 759} {"train_loss": -10.532890319824219, "global_step": 127605, "epoch": 759} {"train_loss": -10.175863265991211, "global_step": 127606, "epoch": 759} {"train_loss": -10.312911987304688, "global_step": 127607, "epoch": 759} {"train_loss": -10.372673034667969, "global_step": 127608, "epoch": 759} {"train_loss": -10.254815101623535, "global_step": 127609, "epoch": 759} {"train_loss": -9.99994945526123, "global_step": 127610, "epoch": 759} {"train_loss": -10.406737327575684, "global_step": 127611, "epoch": 759} {"train_loss": -10.066235542297363, "global_step": 127612, "epoch": 759} {"train_loss": -10.247223854064941, "global_step": 127613, "epoch": 759} {"train_loss": -10.401283264160156, "global_step": 127614, "epoch": 759} {"train_loss": -10.444262504577637, "global_step": 127615, "epoch": 759} {"train_loss": -10.661402702331543, "global_step": 127616, "epoch": 759} {"train_loss": -10.510512351989746, "global_step": 127617, "epoch": 759} {"train_loss": -10.505186080932617, "global_step": 127618, "epoch": 759} {"train_loss": -10.498682022094727, "global_step": 127619, "epoch": 759} {"train_loss": -10.574790954589844, "global_step": 127620, "epoch": 759} {"train_loss": -10.517546653747559, "global_step": 127621, "epoch": 759} {"train_loss": -10.494043350219727, "global_step": 127622, "epoch": 759} {"train_loss": -10.601537704467773, "global_step": 127623, "epoch": 759} {"train_loss": -10.16535758972168, "global_step": 127624, "epoch": 759} {"train_loss": -10.754667282104492, "global_step": 127625, "epoch": 759} {"train_loss": -10.593334197998047, "global_step": 127626, "epoch": 759} {"train_loss": -10.529962539672852, "global_step": 127627, "epoch": 759} {"train_loss": -10.583131790161133, "global_step": 127628, "epoch": 759} {"train_loss": -10.585772514343262, "global_step": 127629, "epoch": 759} {"train_loss": -10.420336723327637, "global_step": 127630, "epoch": 759} {"train_loss": -10.821410179138184, "global_step": 127631, "epoch": 759} {"train_loss": -10.547784805297852, "global_step": 127632, "epoch": 759} {"train_loss": -10.496435165405273, "global_step": 127633, "epoch": 759} {"train_loss": -10.548673629760742, "global_step": 127634, "epoch": 759} {"train_loss": -10.518074035644531, "global_step": 127635, "epoch": 759} {"train_loss": -10.492913246154785, "global_step": 127636, "epoch": 759} {"train_loss": -10.79684829711914, "global_step": 127637, "epoch": 759} {"train_loss": -10.250286102294922, "global_step": 127638, "epoch": 759} {"train_loss": -9.72609806060791, "global_step": 127639, "epoch": 759} {"train_loss": -10.539400100708008, "global_step": 127640, "epoch": 759} {"train_loss": -10.431297302246094, "global_step": 127641, "epoch": 759} {"train_loss": -9.536352157592773, "global_step": 127642, "epoch": 759} {"train_loss": -10.270793914794922, "global_step": 127643, "epoch": 759} {"train_loss": -9.972249984741211, "global_step": 127644, "epoch": 759} {"train_loss": -9.405963897705078, "global_step": 127645, "epoch": 759} {"train_loss": -10.231918334960938, "global_step": 127646, "epoch": 759} {"train_loss": -10.305828094482422, "global_step": 127647, "epoch": 759} {"train_loss": -9.383291244506836, "global_step": 127648, "epoch": 759} {"train_loss": -10.281115531921387, "global_step": 127649, "epoch": 759} {"train_loss": -9.246475219726562, "global_step": 127650, "epoch": 759} {"train_loss": -9.116323471069336, "global_step": 127651, "epoch": 759} {"train_loss": -10.04006576538086, "global_step": 127652, "epoch": 759} {"train_loss": -9.456645965576172, "global_step": 127653, "epoch": 759} {"train_loss": -10.387002944946289, "global_step": 127654, "epoch": 759} {"train_loss": -10.109829902648926, "global_step": 127655, "epoch": 759} {"train_loss": -10.244287490844727, "global_step": 127656, "epoch": 759} {"train_loss": -9.855915069580078, "global_step": 127657, "epoch": 759} {"train_loss": -10.01637077331543, "global_step": 127658, "epoch": 759} {"train_loss": -10.089405059814453, "global_step": 127659, "epoch": 759} {"train_loss": -10.334495544433594, "global_step": 127660, "epoch": 759} {"train_loss": -10.01449966430664, "global_step": 127661, "epoch": 759} {"train_loss": -10.272542953491211, "global_step": 127662, "epoch": 759} {"train_loss": -10.004010200500488, "global_step": 127663, "epoch": 759} {"train_loss": -10.014191627502441, "global_step": 127664, "epoch": 759} {"train_loss": -10.229687690734863, "global_step": 127665, "epoch": 759} {"train_loss": -10.257570266723633, "global_step": 127666, "epoch": 759} {"train_loss": -10.400287628173828, "global_step": 127667, "epoch": 759} {"train_loss": -10.284570693969727, "global_step": 127668, "epoch": 759} {"train_loss": -10.382495880126953, "global_step": 127669, "epoch": 759} {"train_loss": -10.269203186035156, "global_step": 127670, "epoch": 759} {"train_loss": -10.305290222167969, "global_step": 127671, "epoch": 759} {"train_loss": -10.258100509643555, "global_step": 127672, "epoch": 759} {"train_loss": -10.357989311218262, "global_step": 127673, "epoch": 759} {"train_loss": -10.456244468688965, "global_step": 127674, "epoch": 759} {"train_loss": -10.524242401123047, "global_step": 127675, "epoch": 759} {"train_loss": -10.479373931884766, "global_step": 127676, "epoch": 759} {"train_loss": -10.290121078491211, "global_step": 127677, "epoch": 759} {"train_loss": -10.447932243347168, "global_step": 127678, "epoch": 759} {"train_loss": -10.18266643228985, "global_step": 127679, "epoch": 759, "val_loss": 218011.640625} {"train_loss": -10.489070892333984, "global_step": 127680, "epoch": 760} {"train_loss": -10.316527366638184, "global_step": 127681, "epoch": 760} {"train_loss": -10.388162612915039, "global_step": 127682, "epoch": 760} {"train_loss": -10.388171195983887, "global_step": 127683, "epoch": 760} {"train_loss": -10.437003135681152, "global_step": 127684, "epoch": 760} {"train_loss": -10.506013870239258, "global_step": 127685, "epoch": 760} {"train_loss": -10.632264137268066, "global_step": 127686, "epoch": 760} {"train_loss": -10.360859870910645, "global_step": 127687, "epoch": 760} {"train_loss": -10.242755889892578, "global_step": 127688, "epoch": 760} {"train_loss": -10.436870574951172, "global_step": 127689, "epoch": 760} {"train_loss": -10.341619491577148, "global_step": 127690, "epoch": 760} {"train_loss": -10.515439987182617, "global_step": 127691, "epoch": 760} {"train_loss": -10.4480619430542, "global_step": 127692, "epoch": 760} {"train_loss": -10.401742935180664, "global_step": 127693, "epoch": 760} {"train_loss": -10.387107849121094, "global_step": 127694, "epoch": 760} {"train_loss": -10.281339645385742, "global_step": 127695, "epoch": 760} {"train_loss": -10.493368148803711, "global_step": 127696, "epoch": 760} {"train_loss": -10.472051620483398, "global_step": 127697, "epoch": 760} {"train_loss": -10.726356506347656, "global_step": 127698, "epoch": 760} {"train_loss": -10.549345016479492, "global_step": 127699, "epoch": 760} {"train_loss": -10.681386947631836, "global_step": 127700, "epoch": 760} {"train_loss": -10.51014518737793, "global_step": 127701, "epoch": 760} {"train_loss": -10.502849578857422, "global_step": 127702, "epoch": 760} {"train_loss": -10.655679702758789, "global_step": 127703, "epoch": 760} {"train_loss": -10.401394844055176, "global_step": 127704, "epoch": 760} {"train_loss": -10.582840919494629, "global_step": 127705, "epoch": 760} {"train_loss": -10.694137573242188, "global_step": 127706, "epoch": 760} {"train_loss": -10.390026092529297, "global_step": 127707, "epoch": 760} {"train_loss": -10.69747543334961, "global_step": 127708, "epoch": 760} {"train_loss": -10.608928680419922, "global_step": 127709, "epoch": 760} {"train_loss": -10.200334548950195, "global_step": 127710, "epoch": 760} {"train_loss": -10.446529388427734, "global_step": 127711, "epoch": 760} {"train_loss": -10.573402404785156, "global_step": 127712, "epoch": 760} {"train_loss": -10.398818969726562, "global_step": 127713, "epoch": 760} {"train_loss": -10.518030166625977, "global_step": 127714, "epoch": 760} {"train_loss": -10.356170654296875, "global_step": 127715, "epoch": 760} {"train_loss": -10.21529769897461, "global_step": 127716, "epoch": 760} {"train_loss": -10.196920394897461, "global_step": 127717, "epoch": 760} {"train_loss": -9.928993225097656, "global_step": 127718, "epoch": 760} {"train_loss": -10.483717918395996, "global_step": 127719, "epoch": 760} {"train_loss": -10.17523193359375, "global_step": 127720, "epoch": 760} {"train_loss": -9.851784706115723, "global_step": 127721, "epoch": 760} {"train_loss": -9.57758617401123, "global_step": 127722, "epoch": 760} {"train_loss": -9.58568000793457, "global_step": 127723, "epoch": 760} {"train_loss": -9.981586456298828, "global_step": 127724, "epoch": 760} {"train_loss": -10.421998977661133, "global_step": 127725, "epoch": 760} {"train_loss": -9.923951148986816, "global_step": 127726, "epoch": 760} {"train_loss": -10.334287643432617, "global_step": 127727, "epoch": 760} {"train_loss": -10.476024627685547, "global_step": 127728, "epoch": 760} {"train_loss": -10.421228408813477, "global_step": 127729, "epoch": 760} {"train_loss": -10.304943084716797, "global_step": 127730, "epoch": 760} {"train_loss": -10.288667678833008, "global_step": 127731, "epoch": 760} {"train_loss": -9.965803146362305, "global_step": 127732, "epoch": 760} {"train_loss": -10.36935043334961, "global_step": 127733, "epoch": 760} {"train_loss": -10.283018112182617, "global_step": 127734, "epoch": 760} {"train_loss": -10.341642379760742, "global_step": 127735, "epoch": 760} {"train_loss": -10.382613182067871, "global_step": 127736, "epoch": 760} {"train_loss": -10.34907341003418, "global_step": 127737, "epoch": 760} {"train_loss": -10.139142990112305, "global_step": 127738, "epoch": 760} {"train_loss": -10.228567123413086, "global_step": 127739, "epoch": 760} {"train_loss": -10.293725967407227, "global_step": 127740, "epoch": 760} {"train_loss": -10.180456161499023, "global_step": 127741, "epoch": 760} {"train_loss": -10.543068885803223, "global_step": 127742, "epoch": 760} {"train_loss": -10.261958122253418, "global_step": 127743, "epoch": 760} {"train_loss": -10.494725227355957, "global_step": 127744, "epoch": 760} {"train_loss": -10.414901733398438, "global_step": 127745, "epoch": 760} {"train_loss": -10.092035293579102, "global_step": 127746, "epoch": 760} {"train_loss": -10.362325668334961, "global_step": 127747, "epoch": 760} {"train_loss": -9.901959419250488, "global_step": 127748, "epoch": 760} {"train_loss": -10.540112495422363, "global_step": 127749, "epoch": 760} {"train_loss": -10.235502243041992, "global_step": 127750, "epoch": 760} {"train_loss": -10.277921676635742, "global_step": 127751, "epoch": 760} {"train_loss": -10.355928421020508, "global_step": 127752, "epoch": 760} {"train_loss": -10.325292587280273, "global_step": 127753, "epoch": 760} {"train_loss": -10.225152969360352, "global_step": 127754, "epoch": 760} {"train_loss": -10.245473861694336, "global_step": 127755, "epoch": 760} {"train_loss": -10.182186126708984, "global_step": 127756, "epoch": 760} {"train_loss": -10.478224754333496, "global_step": 127757, "epoch": 760} {"train_loss": -10.161531448364258, "global_step": 127758, "epoch": 760} {"train_loss": -10.33498764038086, "global_step": 127759, "epoch": 760} {"train_loss": -10.568204879760742, "global_step": 127760, "epoch": 760} {"train_loss": -9.88497543334961, "global_step": 127761, "epoch": 760} {"train_loss": -10.378934860229492, "global_step": 127762, "epoch": 760} {"train_loss": -10.296269416809082, "global_step": 127763, "epoch": 760} {"train_loss": -10.284334182739258, "global_step": 127764, "epoch": 760} {"train_loss": -10.258456230163574, "global_step": 127765, "epoch": 760} {"train_loss": -10.059089660644531, "global_step": 127766, "epoch": 760} {"train_loss": -10.527568817138672, "global_step": 127767, "epoch": 760} {"train_loss": -10.040172576904297, "global_step": 127768, "epoch": 760} {"train_loss": -10.432479858398438, "global_step": 127769, "epoch": 760} {"train_loss": -10.369522094726562, "global_step": 127770, "epoch": 760} {"train_loss": -10.351353645324707, "global_step": 127771, "epoch": 760} {"train_loss": -10.399688720703125, "global_step": 127772, "epoch": 760} {"train_loss": -10.095148086547852, "global_step": 127773, "epoch": 760} {"train_loss": -10.356827735900879, "global_step": 127774, "epoch": 760} {"train_loss": -10.07774543762207, "global_step": 127775, "epoch": 760} {"train_loss": -10.264025688171387, "global_step": 127776, "epoch": 760} {"train_loss": -10.515644073486328, "global_step": 127777, "epoch": 760} {"train_loss": -10.140610694885254, "global_step": 127778, "epoch": 760} {"train_loss": -10.085203170776367, "global_step": 127779, "epoch": 760} {"train_loss": -10.262054443359375, "global_step": 127780, "epoch": 760} {"train_loss": -10.129217147827148, "global_step": 127781, "epoch": 760} {"train_loss": -10.395602226257324, "global_step": 127782, "epoch": 760} {"train_loss": -10.146867752075195, "global_step": 127783, "epoch": 760} {"train_loss": -10.399353981018066, "global_step": 127784, "epoch": 760} {"train_loss": -10.205305099487305, "global_step": 127785, "epoch": 760} {"train_loss": -10.457931518554688, "global_step": 127786, "epoch": 760} {"train_loss": -10.327350616455078, "global_step": 127787, "epoch": 760} {"train_loss": -10.352235794067383, "global_step": 127788, "epoch": 760} {"train_loss": -10.403329849243164, "global_step": 127789, "epoch": 760} {"train_loss": -10.267496109008789, "global_step": 127790, "epoch": 760} {"train_loss": -10.311094284057617, "global_step": 127791, "epoch": 760} {"train_loss": -10.531063079833984, "global_step": 127792, "epoch": 760} {"train_loss": -10.011507034301758, "global_step": 127793, "epoch": 760} {"train_loss": -10.5470552444458, "global_step": 127794, "epoch": 760} {"train_loss": -10.197839736938477, "global_step": 127795, "epoch": 760} {"train_loss": -10.252758026123047, "global_step": 127796, "epoch": 760} {"train_loss": -10.331111907958984, "global_step": 127797, "epoch": 760} {"train_loss": -9.711847305297852, "global_step": 127798, "epoch": 760} {"train_loss": -10.423650741577148, "global_step": 127799, "epoch": 760} {"train_loss": -10.064031600952148, "global_step": 127800, "epoch": 760} {"train_loss": -10.427750587463379, "global_step": 127801, "epoch": 760} {"train_loss": -10.227333068847656, "global_step": 127802, "epoch": 760} {"train_loss": -9.985679626464844, "global_step": 127803, "epoch": 760} {"train_loss": -10.449684143066406, "global_step": 127804, "epoch": 760} {"train_loss": -10.247295379638672, "global_step": 127805, "epoch": 760} {"train_loss": -10.05003547668457, "global_step": 127806, "epoch": 760} {"train_loss": -10.086618423461914, "global_step": 127807, "epoch": 760} {"train_loss": -9.989477157592773, "global_step": 127808, "epoch": 760} {"train_loss": -10.097261428833008, "global_step": 127809, "epoch": 760} {"train_loss": -9.82291030883789, "global_step": 127810, "epoch": 760} {"train_loss": -10.100301742553711, "global_step": 127811, "epoch": 760} {"train_loss": -10.289165496826172, "global_step": 127812, "epoch": 760} {"train_loss": -10.20937728881836, "global_step": 127813, "epoch": 760} {"train_loss": -10.03841495513916, "global_step": 127814, "epoch": 760} {"train_loss": -10.029213905334473, "global_step": 127815, "epoch": 760} {"train_loss": -10.465789794921875, "global_step": 127816, "epoch": 760} {"train_loss": -10.112594604492188, "global_step": 127817, "epoch": 760} {"train_loss": -10.272848129272461, "global_step": 127818, "epoch": 760} {"train_loss": -10.400430679321289, "global_step": 127819, "epoch": 760} {"train_loss": -10.371322631835938, "global_step": 127820, "epoch": 760} {"train_loss": -10.386417388916016, "global_step": 127821, "epoch": 760} {"train_loss": -10.260494232177734, "global_step": 127822, "epoch": 760} {"train_loss": -10.437708854675293, "global_step": 127823, "epoch": 760} {"train_loss": -10.426541328430176, "global_step": 127824, "epoch": 760} {"train_loss": -10.014490127563477, "global_step": 127825, "epoch": 760} {"train_loss": -10.384389877319336, "global_step": 127826, "epoch": 760} {"train_loss": -10.057164192199707, "global_step": 127827, "epoch": 760} {"train_loss": -10.002241134643555, "global_step": 127828, "epoch": 760} {"train_loss": -10.190173149108887, "global_step": 127829, "epoch": 760} {"train_loss": -10.295968055725098, "global_step": 127830, "epoch": 760} {"train_loss": -10.118467330932617, "global_step": 127831, "epoch": 760} {"train_loss": -10.481866836547852, "global_step": 127832, "epoch": 760} {"train_loss": -9.808151245117188, "global_step": 127833, "epoch": 760} {"train_loss": -9.97424030303955, "global_step": 127834, "epoch": 760} {"train_loss": -10.378040313720703, "global_step": 127835, "epoch": 760} {"train_loss": -9.845340728759766, "global_step": 127836, "epoch": 760} {"train_loss": -10.26486873626709, "global_step": 127837, "epoch": 760} {"train_loss": -9.852653503417969, "global_step": 127838, "epoch": 760} {"train_loss": -10.243053436279297, "global_step": 127839, "epoch": 760} {"train_loss": -9.908506393432617, "global_step": 127840, "epoch": 760} {"train_loss": -10.005210876464844, "global_step": 127841, "epoch": 760} {"train_loss": -10.19715690612793, "global_step": 127842, "epoch": 760} {"train_loss": -10.022806167602539, "global_step": 127843, "epoch": 760} {"train_loss": -10.332377433776855, "global_step": 127844, "epoch": 760} {"train_loss": -10.113767623901367, "global_step": 127845, "epoch": 760} {"train_loss": -9.771366119384766, "global_step": 127846, "epoch": 760} {"train_loss": -10.275466022037325, "global_step": 127847, "epoch": 760, "val_loss": 219567.640625, "train_action_mse_error": 1.7862236499786377} {"train_loss": -10.159160614013672, "global_step": 127848, "epoch": 761} {"train_loss": -10.411334991455078, "global_step": 127849, "epoch": 761} {"train_loss": -10.425846099853516, "global_step": 127850, "epoch": 761} {"train_loss": -10.322826385498047, "global_step": 127851, "epoch": 761} {"train_loss": -10.090228080749512, "global_step": 127852, "epoch": 761} {"train_loss": -10.395035743713379, "global_step": 127853, "epoch": 761} {"train_loss": -10.082867622375488, "global_step": 127854, "epoch": 761} {"train_loss": -10.432878494262695, "global_step": 127855, "epoch": 761} {"train_loss": -10.252833366394043, "global_step": 127856, "epoch": 761} {"train_loss": -10.283707618713379, "global_step": 127857, "epoch": 761} {"train_loss": -10.25547981262207, "global_step": 127858, "epoch": 761} {"train_loss": -10.493345260620117, "global_step": 127859, "epoch": 761} {"train_loss": -10.33583927154541, "global_step": 127860, "epoch": 761} {"train_loss": -10.346807479858398, "global_step": 127861, "epoch": 761} {"train_loss": -10.207761764526367, "global_step": 127862, "epoch": 761} {"train_loss": -10.26085376739502, "global_step": 127863, "epoch": 761} {"train_loss": -10.463350296020508, "global_step": 127864, "epoch": 761} {"train_loss": -10.425878524780273, "global_step": 127865, "epoch": 761} {"train_loss": -10.505440711975098, "global_step": 127866, "epoch": 761} {"train_loss": -10.284635543823242, "global_step": 127867, "epoch": 761} {"train_loss": -10.2676362991333, "global_step": 127868, "epoch": 761} {"train_loss": -10.707149505615234, "global_step": 127869, "epoch": 761} {"train_loss": -10.757015228271484, "global_step": 127870, "epoch": 761} {"train_loss": -10.727155685424805, "global_step": 127871, "epoch": 761} {"train_loss": -10.547109603881836, "global_step": 127872, "epoch": 761} {"train_loss": -10.521951675415039, "global_step": 127873, "epoch": 761} {"train_loss": -10.349136352539062, "global_step": 127874, "epoch": 761} {"train_loss": -10.465840339660645, "global_step": 127875, "epoch": 761} {"train_loss": -10.080259323120117, "global_step": 127876, "epoch": 761} {"train_loss": -10.530784606933594, "global_step": 127877, "epoch": 761} {"train_loss": -10.527729034423828, "global_step": 127878, "epoch": 761} {"train_loss": -10.567514419555664, "global_step": 127879, "epoch": 761} {"train_loss": -10.601572036743164, "global_step": 127880, "epoch": 761} {"train_loss": -10.401710510253906, "global_step": 127881, "epoch": 761} {"train_loss": -10.060888290405273, "global_step": 127882, "epoch": 761} {"train_loss": -10.403553009033203, "global_step": 127883, "epoch": 761} {"train_loss": -10.401729583740234, "global_step": 127884, "epoch": 761} {"train_loss": -9.861515045166016, "global_step": 127885, "epoch": 761} {"train_loss": -10.195247650146484, "global_step": 127886, "epoch": 761} {"train_loss": -10.439083099365234, "global_step": 127887, "epoch": 761} {"train_loss": -10.029598236083984, "global_step": 127888, "epoch": 761} {"train_loss": -10.568857192993164, "global_step": 127889, "epoch": 761} {"train_loss": -10.486469268798828, "global_step": 127890, "epoch": 761} {"train_loss": -10.37315559387207, "global_step": 127891, "epoch": 761} {"train_loss": -10.668001174926758, "global_step": 127892, "epoch": 761} {"train_loss": -10.481941223144531, "global_step": 127893, "epoch": 761} {"train_loss": -10.39095687866211, "global_step": 127894, "epoch": 761} {"train_loss": -10.349746704101562, "global_step": 127895, "epoch": 761} {"train_loss": -10.480484962463379, "global_step": 127896, "epoch": 761} {"train_loss": -10.181451797485352, "global_step": 127897, "epoch": 761} {"train_loss": -10.009269714355469, "global_step": 127898, "epoch": 761} {"train_loss": -10.734930992126465, "global_step": 127899, "epoch": 761} {"train_loss": -9.985260009765625, "global_step": 127900, "epoch": 761} {"train_loss": -10.142243385314941, "global_step": 127901, "epoch": 761} {"train_loss": -10.474976539611816, "global_step": 127902, "epoch": 761} {"train_loss": -10.1300630569458, "global_step": 127903, "epoch": 761} {"train_loss": -10.363014221191406, "global_step": 127904, "epoch": 761} {"train_loss": -9.942642211914062, "global_step": 127905, "epoch": 761} {"train_loss": -10.254802703857422, "global_step": 127906, "epoch": 761} {"train_loss": -10.678442001342773, "global_step": 127907, "epoch": 761} {"train_loss": -9.883272171020508, "global_step": 127908, "epoch": 761} {"train_loss": -10.316104888916016, "global_step": 127909, "epoch": 761} {"train_loss": -10.236745834350586, "global_step": 127910, "epoch": 761} {"train_loss": -10.432716369628906, "global_step": 127911, "epoch": 761} {"train_loss": -10.31563949584961, "global_step": 127912, "epoch": 761} {"train_loss": -10.448493957519531, "global_step": 127913, "epoch": 761} {"train_loss": -10.387943267822266, "global_step": 127914, "epoch": 761} {"train_loss": -10.261200904846191, "global_step": 127915, "epoch": 761} {"train_loss": -10.587194442749023, "global_step": 127916, "epoch": 761} {"train_loss": -10.153365135192871, "global_step": 127917, "epoch": 761} {"train_loss": -10.426645278930664, "global_step": 127918, "epoch": 761} {"train_loss": -10.217541694641113, "global_step": 127919, "epoch": 761} {"train_loss": -10.11676025390625, "global_step": 127920, "epoch": 761} {"train_loss": -10.157920837402344, "global_step": 127921, "epoch": 761} {"train_loss": -10.237314224243164, "global_step": 127922, "epoch": 761} {"train_loss": -10.291360855102539, "global_step": 127923, "epoch": 761} {"train_loss": -10.414274215698242, "global_step": 127924, "epoch": 761} {"train_loss": -10.419143676757812, "global_step": 127925, "epoch": 761} {"train_loss": -10.192556381225586, "global_step": 127926, "epoch": 761} {"train_loss": -10.203030586242676, "global_step": 127927, "epoch": 761} {"train_loss": -10.442710876464844, "global_step": 127928, "epoch": 761} {"train_loss": -10.05013370513916, "global_step": 127929, "epoch": 761} {"train_loss": -10.649401664733887, "global_step": 127930, "epoch": 761} {"train_loss": -10.302385330200195, "global_step": 127931, "epoch": 761} {"train_loss": -10.204171180725098, "global_step": 127932, "epoch": 761} {"train_loss": -10.38527774810791, "global_step": 127933, "epoch": 761} {"train_loss": -10.1416015625, "global_step": 127934, "epoch": 761} {"train_loss": -10.444234848022461, "global_step": 127935, "epoch": 761} {"train_loss": -9.926998138427734, "global_step": 127936, "epoch": 761} {"train_loss": -10.361223220825195, "global_step": 127937, "epoch": 761} {"train_loss": -10.052305221557617, "global_step": 127938, "epoch": 761} {"train_loss": -9.821362495422363, "global_step": 127939, "epoch": 761} {"train_loss": -10.492841720581055, "global_step": 127940, "epoch": 761} {"train_loss": -9.575719833374023, "global_step": 127941, "epoch": 761} {"train_loss": -10.171714782714844, "global_step": 127942, "epoch": 761} {"train_loss": -9.98333740234375, "global_step": 127943, "epoch": 761} {"train_loss": -9.82111930847168, "global_step": 127944, "epoch": 761} {"train_loss": -10.278507232666016, "global_step": 127945, "epoch": 761} {"train_loss": -9.790727615356445, "global_step": 127946, "epoch": 761} {"train_loss": -10.044172286987305, "global_step": 127947, "epoch": 761} {"train_loss": -10.377525329589844, "global_step": 127948, "epoch": 761} {"train_loss": -10.414401054382324, "global_step": 127949, "epoch": 761} {"train_loss": -10.14902400970459, "global_step": 127950, "epoch": 761} {"train_loss": -10.283793449401855, "global_step": 127951, "epoch": 761} {"train_loss": -10.161721229553223, "global_step": 127952, "epoch": 761} {"train_loss": -10.264876365661621, "global_step": 127953, "epoch": 761} {"train_loss": -10.23525619506836, "global_step": 127954, "epoch": 761} {"train_loss": -10.38045883178711, "global_step": 127955, "epoch": 761} {"train_loss": -10.592138290405273, "global_step": 127956, "epoch": 761} {"train_loss": -10.278718948364258, "global_step": 127957, "epoch": 761} {"train_loss": -10.607598304748535, "global_step": 127958, "epoch": 761} {"train_loss": -10.55774211883545, "global_step": 127959, "epoch": 761} {"train_loss": -10.323610305786133, "global_step": 127960, "epoch": 761} {"train_loss": -10.573232650756836, "global_step": 127961, "epoch": 761} {"train_loss": -10.369134902954102, "global_step": 127962, "epoch": 761} {"train_loss": -10.425451278686523, "global_step": 127963, "epoch": 761} {"train_loss": -10.455374717712402, "global_step": 127964, "epoch": 761} {"train_loss": -10.537837028503418, "global_step": 127965, "epoch": 761} {"train_loss": -10.603139877319336, "global_step": 127966, "epoch": 761} {"train_loss": -10.642232894897461, "global_step": 127967, "epoch": 761} {"train_loss": -10.319820404052734, "global_step": 127968, "epoch": 761} {"train_loss": -10.515559196472168, "global_step": 127969, "epoch": 761} {"train_loss": -10.487363815307617, "global_step": 127970, "epoch": 761} {"train_loss": -10.653642654418945, "global_step": 127971, "epoch": 761} {"train_loss": -10.545524597167969, "global_step": 127972, "epoch": 761} {"train_loss": -10.511563301086426, "global_step": 127973, "epoch": 761} {"train_loss": -10.655118942260742, "global_step": 127974, "epoch": 761} {"train_loss": -10.684885025024414, "global_step": 127975, "epoch": 761} {"train_loss": -10.623697280883789, "global_step": 127976, "epoch": 761} {"train_loss": -10.63789176940918, "global_step": 127977, "epoch": 761} {"train_loss": -10.422181129455566, "global_step": 127978, "epoch": 761} {"train_loss": -10.61958122253418, "global_step": 127979, "epoch": 761} {"train_loss": -10.694513320922852, "global_step": 127980, "epoch": 761} {"train_loss": -10.320286750793457, "global_step": 127981, "epoch": 761} {"train_loss": -10.565338134765625, "global_step": 127982, "epoch": 761} {"train_loss": -10.22468376159668, "global_step": 127983, "epoch": 761} {"train_loss": -10.553864479064941, "global_step": 127984, "epoch": 761} {"train_loss": -10.26623249053955, "global_step": 127985, "epoch": 761} {"train_loss": -9.888691902160645, "global_step": 127986, "epoch": 761} {"train_loss": -10.027090072631836, "global_step": 127987, "epoch": 761} {"train_loss": -10.185067176818848, "global_step": 127988, "epoch": 761} {"train_loss": -9.707611083984375, "global_step": 127989, "epoch": 761} {"train_loss": -10.297704696655273, "global_step": 127990, "epoch": 761} {"train_loss": -10.187605857849121, "global_step": 127991, "epoch": 761} {"train_loss": -9.670970916748047, "global_step": 127992, "epoch": 761} {"train_loss": -9.864213943481445, "global_step": 127993, "epoch": 761} {"train_loss": -9.280889511108398, "global_step": 127994, "epoch": 761} {"train_loss": -8.882511138916016, "global_step": 127995, "epoch": 761} {"train_loss": -9.529081344604492, "global_step": 127996, "epoch": 761} {"train_loss": -8.982343673706055, "global_step": 127997, "epoch": 761} {"train_loss": -9.524454116821289, "global_step": 127998, "epoch": 761} {"train_loss": -9.640642166137695, "global_step": 127999, "epoch": 761} {"train_loss": -9.266944885253906, "global_step": 128000, "epoch": 761} {"train_loss": -9.954765319824219, "global_step": 128001, "epoch": 761} {"train_loss": -9.504953384399414, "global_step": 128002, "epoch": 761} {"train_loss": -10.087592124938965, "global_step": 128003, "epoch": 761} {"train_loss": -10.128323554992676, "global_step": 128004, "epoch": 761} {"train_loss": -9.999957084655762, "global_step": 128005, "epoch": 761} {"train_loss": -10.155829429626465, "global_step": 128006, "epoch": 761} {"train_loss": -10.393240928649902, "global_step": 128007, "epoch": 761} {"train_loss": -9.91352367401123, "global_step": 128008, "epoch": 761} {"train_loss": -9.913352966308594, "global_step": 128009, "epoch": 761} {"train_loss": -10.17831802368164, "global_step": 128010, "epoch": 761} {"train_loss": -10.005847930908203, "global_step": 128011, "epoch": 761} {"train_loss": -10.110549926757812, "global_step": 128012, "epoch": 761} {"train_loss": -10.122116088867188, "global_step": 128013, "epoch": 761} {"train_loss": -9.94025993347168, "global_step": 128014, "epoch": 761} {"train_loss": -10.256770917347499, "global_step": 128015, "epoch": 761, "val_loss": 217612.359375} {"train_loss": -9.933558464050293, "global_step": 128016, "epoch": 762} {"train_loss": -9.699556350708008, "global_step": 128017, "epoch": 762} {"train_loss": -10.103442192077637, "global_step": 128018, "epoch": 762} {"train_loss": -9.75666618347168, "global_step": 128019, "epoch": 762} {"train_loss": -10.255725860595703, "global_step": 128020, "epoch": 762} {"train_loss": -10.137910842895508, "global_step": 128021, "epoch": 762} {"train_loss": -10.151219367980957, "global_step": 128022, "epoch": 762} {"train_loss": -10.122013092041016, "global_step": 128023, "epoch": 762} {"train_loss": -10.199089050292969, "global_step": 128024, "epoch": 762} {"train_loss": -10.21884536743164, "global_step": 128025, "epoch": 762} {"train_loss": -10.246227264404297, "global_step": 128026, "epoch": 762} {"train_loss": -10.60958480834961, "global_step": 128027, "epoch": 762} {"train_loss": -10.249679565429688, "global_step": 128028, "epoch": 762} {"train_loss": -10.236178398132324, "global_step": 128029, "epoch": 762} {"train_loss": -10.306221008300781, "global_step": 128030, "epoch": 762} {"train_loss": -10.259757995605469, "global_step": 128031, "epoch": 762} {"train_loss": -10.408551216125488, "global_step": 128032, "epoch": 762} {"train_loss": -10.327646255493164, "global_step": 128033, "epoch": 762} {"train_loss": -10.516688346862793, "global_step": 128034, "epoch": 762} {"train_loss": -10.504083633422852, "global_step": 128035, "epoch": 762} {"train_loss": -10.428848266601562, "global_step": 128036, "epoch": 762} {"train_loss": -10.243040084838867, "global_step": 128037, "epoch": 762} {"train_loss": -10.415838241577148, "global_step": 128038, "epoch": 762} {"train_loss": -10.334651947021484, "global_step": 128039, "epoch": 762} {"train_loss": -10.47384262084961, "global_step": 128040, "epoch": 762} {"train_loss": -10.32623291015625, "global_step": 128041, "epoch": 762} {"train_loss": -10.45291519165039, "global_step": 128042, "epoch": 762} {"train_loss": -10.45702075958252, "global_step": 128043, "epoch": 762} {"train_loss": -10.476327896118164, "global_step": 128044, "epoch": 762} {"train_loss": -10.408733367919922, "global_step": 128045, "epoch": 762} {"train_loss": -10.368504524230957, "global_step": 128046, "epoch": 762} {"train_loss": -10.569128036499023, "global_step": 128047, "epoch": 762} {"train_loss": -10.49640941619873, "global_step": 128048, "epoch": 762} {"train_loss": -10.618224143981934, "global_step": 128049, "epoch": 762} {"train_loss": -10.427942276000977, "global_step": 128050, "epoch": 762} {"train_loss": -10.769783020019531, "global_step": 128051, "epoch": 762} {"train_loss": -10.704154968261719, "global_step": 128052, "epoch": 762} {"train_loss": -10.547786712646484, "global_step": 128053, "epoch": 762} {"train_loss": -10.429264068603516, "global_step": 128054, "epoch": 762} {"train_loss": -10.512948036193848, "global_step": 128055, "epoch": 762} {"train_loss": -10.451238632202148, "global_step": 128056, "epoch": 762} {"train_loss": -10.499245643615723, "global_step": 128057, "epoch": 762} {"train_loss": -10.320295333862305, "global_step": 128058, "epoch": 762} {"train_loss": -10.543421745300293, "global_step": 128059, "epoch": 762} {"train_loss": -10.565930366516113, "global_step": 128060, "epoch": 762} {"train_loss": -10.63776969909668, "global_step": 128061, "epoch": 762} {"train_loss": -10.58139419555664, "global_step": 128062, "epoch": 762} {"train_loss": -10.685165405273438, "global_step": 128063, "epoch": 762} {"train_loss": -10.45710277557373, "global_step": 128064, "epoch": 762} {"train_loss": -10.765748977661133, "global_step": 128065, "epoch": 762} {"train_loss": -10.969754219055176, "global_step": 128066, "epoch": 762} {"train_loss": -10.633020401000977, "global_step": 128067, "epoch": 762} {"train_loss": -10.113163948059082, "global_step": 128068, "epoch": 762} {"train_loss": -10.084260940551758, "global_step": 128069, "epoch": 762} {"train_loss": -10.267000198364258, "global_step": 128070, "epoch": 762} {"train_loss": -9.830185890197754, "global_step": 128071, "epoch": 762} {"train_loss": -9.822216987609863, "global_step": 128072, "epoch": 762} {"train_loss": -10.116199493408203, "global_step": 128073, "epoch": 762} {"train_loss": -10.479177474975586, "global_step": 128074, "epoch": 762} {"train_loss": -9.933645248413086, "global_step": 128075, "epoch": 762} {"train_loss": -10.432140350341797, "global_step": 128076, "epoch": 762} {"train_loss": -10.254278182983398, "global_step": 128077, "epoch": 762} {"train_loss": -9.621317863464355, "global_step": 128078, "epoch": 762} {"train_loss": -10.175063133239746, "global_step": 128079, "epoch": 762} {"train_loss": -9.959135055541992, "global_step": 128080, "epoch": 762} {"train_loss": -9.872152328491211, "global_step": 128081, "epoch": 762} {"train_loss": -9.791208267211914, "global_step": 128082, "epoch": 762} {"train_loss": -9.813512802124023, "global_step": 128083, "epoch": 762} {"train_loss": -10.240013122558594, "global_step": 128084, "epoch": 762} {"train_loss": -9.601167678833008, "global_step": 128085, "epoch": 762} {"train_loss": -10.294042587280273, "global_step": 128086, "epoch": 762} {"train_loss": -10.108426094055176, "global_step": 128087, "epoch": 762} {"train_loss": -10.127080917358398, "global_step": 128088, "epoch": 762} {"train_loss": -10.155017852783203, "global_step": 128089, "epoch": 762} {"train_loss": -9.74323558807373, "global_step": 128090, "epoch": 762} {"train_loss": -10.048089981079102, "global_step": 128091, "epoch": 762} {"train_loss": -9.761642456054688, "global_step": 128092, "epoch": 762} {"train_loss": -10.27238941192627, "global_step": 128093, "epoch": 762} {"train_loss": -10.009740829467773, "global_step": 128094, "epoch": 762} {"train_loss": -10.268072128295898, "global_step": 128095, "epoch": 762} {"train_loss": -10.06806755065918, "global_step": 128096, "epoch": 762} {"train_loss": -10.079874992370605, "global_step": 128097, "epoch": 762} {"train_loss": -9.902482986450195, "global_step": 128098, "epoch": 762} {"train_loss": -10.374472618103027, "global_step": 128099, "epoch": 762} {"train_loss": -10.309940338134766, "global_step": 128100, "epoch": 762} {"train_loss": -10.079755783081055, "global_step": 128101, "epoch": 762} {"train_loss": -10.354854583740234, "global_step": 128102, "epoch": 762} {"train_loss": -10.224550247192383, "global_step": 128103, "epoch": 762} {"train_loss": -10.372371673583984, "global_step": 128104, "epoch": 762} {"train_loss": -10.370302200317383, "global_step": 128105, "epoch": 762} {"train_loss": -10.309326171875, "global_step": 128106, "epoch": 762} {"train_loss": -10.271180152893066, "global_step": 128107, "epoch": 762} {"train_loss": -10.547626495361328, "global_step": 128108, "epoch": 762} {"train_loss": -10.431112289428711, "global_step": 128109, "epoch": 762} {"train_loss": -10.32912826538086, "global_step": 128110, "epoch": 762} {"train_loss": -10.20232105255127, "global_step": 128111, "epoch": 762} {"train_loss": -10.294416427612305, "global_step": 128112, "epoch": 762} {"train_loss": -10.464825630187988, "global_step": 128113, "epoch": 762} {"train_loss": -10.388277053833008, "global_step": 128114, "epoch": 762} {"train_loss": -10.311506271362305, "global_step": 128115, "epoch": 762} {"train_loss": -10.328824996948242, "global_step": 128116, "epoch": 762} {"train_loss": -10.426521301269531, "global_step": 128117, "epoch": 762} {"train_loss": -10.41246223449707, "global_step": 128118, "epoch": 762} {"train_loss": -10.453927993774414, "global_step": 128119, "epoch": 762} {"train_loss": -10.220507621765137, "global_step": 128120, "epoch": 762} {"train_loss": -10.465275764465332, "global_step": 128121, "epoch": 762} {"train_loss": -10.037201881408691, "global_step": 128122, "epoch": 762} {"train_loss": -10.162186622619629, "global_step": 128123, "epoch": 762} {"train_loss": -10.234904289245605, "global_step": 128124, "epoch": 762} {"train_loss": -10.120867729187012, "global_step": 128125, "epoch": 762} {"train_loss": -10.438806533813477, "global_step": 128126, "epoch": 762} {"train_loss": -10.342026710510254, "global_step": 128127, "epoch": 762} {"train_loss": -10.546781539916992, "global_step": 128128, "epoch": 762} {"train_loss": -10.463768005371094, "global_step": 128129, "epoch": 762} {"train_loss": -10.567939758300781, "global_step": 128130, "epoch": 762} {"train_loss": -10.301663398742676, "global_step": 128131, "epoch": 762} {"train_loss": -10.324701309204102, "global_step": 128132, "epoch": 762} {"train_loss": -10.444417953491211, "global_step": 128133, "epoch": 762} {"train_loss": -10.417494773864746, "global_step": 128134, "epoch": 762} {"train_loss": -10.693976402282715, "global_step": 128135, "epoch": 762} {"train_loss": -10.359579086303711, "global_step": 128136, "epoch": 762} {"train_loss": -10.14348030090332, "global_step": 128137, "epoch": 762} {"train_loss": -10.604909896850586, "global_step": 128138, "epoch": 762} {"train_loss": -9.948123931884766, "global_step": 128139, "epoch": 762} {"train_loss": -10.120298385620117, "global_step": 128140, "epoch": 762} {"train_loss": -10.587514877319336, "global_step": 128141, "epoch": 762} {"train_loss": -10.20224380493164, "global_step": 128142, "epoch": 762} {"train_loss": -9.938591003417969, "global_step": 128143, "epoch": 762} {"train_loss": -10.346277236938477, "global_step": 128144, "epoch": 762} {"train_loss": -9.969295501708984, "global_step": 128145, "epoch": 762} {"train_loss": -9.969461441040039, "global_step": 128146, "epoch": 762} {"train_loss": -10.17137622833252, "global_step": 128147, "epoch": 762} {"train_loss": -10.005051612854004, "global_step": 128148, "epoch": 762} {"train_loss": -10.00910758972168, "global_step": 128149, "epoch": 762} {"train_loss": -9.63975715637207, "global_step": 128150, "epoch": 762} {"train_loss": -10.437969207763672, "global_step": 128151, "epoch": 762} {"train_loss": -9.847908020019531, "global_step": 128152, "epoch": 762} {"train_loss": -10.314294815063477, "global_step": 128153, "epoch": 762} {"train_loss": -10.049322128295898, "global_step": 128154, "epoch": 762} {"train_loss": -9.78608512878418, "global_step": 128155, "epoch": 762} {"train_loss": -10.402225494384766, "global_step": 128156, "epoch": 762} {"train_loss": -10.000053405761719, "global_step": 128157, "epoch": 762} {"train_loss": -10.518627166748047, "global_step": 128158, "epoch": 762} {"train_loss": -10.229915618896484, "global_step": 128159, "epoch": 762} {"train_loss": -10.247418403625488, "global_step": 128160, "epoch": 762} {"train_loss": -10.514148712158203, "global_step": 128161, "epoch": 762} {"train_loss": -10.303854942321777, "global_step": 128162, "epoch": 762} {"train_loss": -10.447010040283203, "global_step": 128163, "epoch": 762} {"train_loss": -10.35738754272461, "global_step": 128164, "epoch": 762} {"train_loss": -10.412348747253418, "global_step": 128165, "epoch": 762} {"train_loss": -10.50792407989502, "global_step": 128166, "epoch": 762} {"train_loss": -10.407846450805664, "global_step": 128167, "epoch": 762} {"train_loss": -10.629998207092285, "global_step": 128168, "epoch": 762} {"train_loss": -10.565971374511719, "global_step": 128169, "epoch": 762} {"train_loss": -10.435717582702637, "global_step": 128170, "epoch": 762} {"train_loss": -10.436807632446289, "global_step": 128171, "epoch": 762} {"train_loss": -10.427227973937988, "global_step": 128172, "epoch": 762} {"train_loss": -10.493241310119629, "global_step": 128173, "epoch": 762} {"train_loss": -10.486516952514648, "global_step": 128174, "epoch": 762} {"train_loss": -10.522631645202637, "global_step": 128175, "epoch": 762} {"train_loss": -10.542644500732422, "global_step": 128176, "epoch": 762} {"train_loss": -10.693140983581543, "global_step": 128177, "epoch": 762} {"train_loss": -10.631786346435547, "global_step": 128178, "epoch": 762} {"train_loss": -10.331106185913086, "global_step": 128179, "epoch": 762} {"train_loss": -10.483951568603516, "global_step": 128180, "epoch": 762} {"train_loss": -10.506011009216309, "global_step": 128181, "epoch": 762} {"train_loss": -10.547719955444336, "global_step": 128182, "epoch": 762} {"train_loss": -10.297792077064514, "global_step": 128183, "epoch": 762, "val_loss": 219774.046875} {"train_loss": -10.375523567199707, "global_step": 128184, "epoch": 763} {"train_loss": -9.807584762573242, "global_step": 128185, "epoch": 763} {"train_loss": -10.121685028076172, "global_step": 128186, "epoch": 763} {"train_loss": -10.46566104888916, "global_step": 128187, "epoch": 763} {"train_loss": -9.923648834228516, "global_step": 128188, "epoch": 763} {"train_loss": -10.52403736114502, "global_step": 128189, "epoch": 763} {"train_loss": -10.156098365783691, "global_step": 128190, "epoch": 763} {"train_loss": -10.436779022216797, "global_step": 128191, "epoch": 763} {"train_loss": -10.113544464111328, "global_step": 128192, "epoch": 763} {"train_loss": -10.337664604187012, "global_step": 128193, "epoch": 763} {"train_loss": -10.417792320251465, "global_step": 128194, "epoch": 763} {"train_loss": -10.248147010803223, "global_step": 128195, "epoch": 763} {"train_loss": -10.439821243286133, "global_step": 128196, "epoch": 763} {"train_loss": -10.162492752075195, "global_step": 128197, "epoch": 763} {"train_loss": -10.560365676879883, "global_step": 128198, "epoch": 763} {"train_loss": -10.35892105102539, "global_step": 128199, "epoch": 763} {"train_loss": -10.801664352416992, "global_step": 128200, "epoch": 763} {"train_loss": -10.384336471557617, "global_step": 128201, "epoch": 763} {"train_loss": -10.48973274230957, "global_step": 128202, "epoch": 763} {"train_loss": -10.434907913208008, "global_step": 128203, "epoch": 763} {"train_loss": -10.499166488647461, "global_step": 128204, "epoch": 763} {"train_loss": -10.45622444152832, "global_step": 128205, "epoch": 763} {"train_loss": -10.552401542663574, "global_step": 128206, "epoch": 763} {"train_loss": -10.690662384033203, "global_step": 128207, "epoch": 763} {"train_loss": -10.281627655029297, "global_step": 128208, "epoch": 763} {"train_loss": -10.29472827911377, "global_step": 128209, "epoch": 763} {"train_loss": -10.255166053771973, "global_step": 128210, "epoch": 763} {"train_loss": -10.53976821899414, "global_step": 128211, "epoch": 763} {"train_loss": -10.278165817260742, "global_step": 128212, "epoch": 763} {"train_loss": -10.465383529663086, "global_step": 128213, "epoch": 763} {"train_loss": -10.370301246643066, "global_step": 128214, "epoch": 763} {"train_loss": -10.133795738220215, "global_step": 128215, "epoch": 763} {"train_loss": -10.565000534057617, "global_step": 128216, "epoch": 763} {"train_loss": -10.386404037475586, "global_step": 128217, "epoch": 763} {"train_loss": -10.533608436584473, "global_step": 128218, "epoch": 763} {"train_loss": -10.279047012329102, "global_step": 128219, "epoch": 763} {"train_loss": -10.41952133178711, "global_step": 128220, "epoch": 763} {"train_loss": -10.468310356140137, "global_step": 128221, "epoch": 763} {"train_loss": -10.548052787780762, "global_step": 128222, "epoch": 763} {"train_loss": -10.481681823730469, "global_step": 128223, "epoch": 763} {"train_loss": -10.535680770874023, "global_step": 128224, "epoch": 763} {"train_loss": -10.490845680236816, "global_step": 128225, "epoch": 763} {"train_loss": -10.378271102905273, "global_step": 128226, "epoch": 763} {"train_loss": -10.717449188232422, "global_step": 128227, "epoch": 763} {"train_loss": -10.641718864440918, "global_step": 128228, "epoch": 763} {"train_loss": -10.39754867553711, "global_step": 128229, "epoch": 763} {"train_loss": -10.572946548461914, "global_step": 128230, "epoch": 763} {"train_loss": -10.473468780517578, "global_step": 128231, "epoch": 763} {"train_loss": -10.47217845916748, "global_step": 128232, "epoch": 763} {"train_loss": -9.916727066040039, "global_step": 128233, "epoch": 763} {"train_loss": -10.5621337890625, "global_step": 128234, "epoch": 763} {"train_loss": -10.345468521118164, "global_step": 128235, "epoch": 763} {"train_loss": -10.327922821044922, "global_step": 128236, "epoch": 763} {"train_loss": -10.266111373901367, "global_step": 128237, "epoch": 763} {"train_loss": -10.297016143798828, "global_step": 128238, "epoch": 763} {"train_loss": -10.297527313232422, "global_step": 128239, "epoch": 763} {"train_loss": -10.654983520507812, "global_step": 128240, "epoch": 763} {"train_loss": -10.32503890991211, "global_step": 128241, "epoch": 763} {"train_loss": -10.512836456298828, "global_step": 128242, "epoch": 763} {"train_loss": -10.490482330322266, "global_step": 128243, "epoch": 763} {"train_loss": -10.498493194580078, "global_step": 128244, "epoch": 763} {"train_loss": -10.632062911987305, "global_step": 128245, "epoch": 763} {"train_loss": -10.419336318969727, "global_step": 128246, "epoch": 763} {"train_loss": -10.051904678344727, "global_step": 128247, "epoch": 763} {"train_loss": -10.362747192382812, "global_step": 128248, "epoch": 763} {"train_loss": -9.950660705566406, "global_step": 128249, "epoch": 763} {"train_loss": -8.63911247253418, "global_step": 128250, "epoch": 763} {"train_loss": -10.543166160583496, "global_step": 128251, "epoch": 763} {"train_loss": -8.825611114501953, "global_step": 128252, "epoch": 763} {"train_loss": -9.625633239746094, "global_step": 128253, "epoch": 763} {"train_loss": -10.134048461914062, "global_step": 128254, "epoch": 763} {"train_loss": -9.397725105285645, "global_step": 128255, "epoch": 763} {"train_loss": -9.868805885314941, "global_step": 128256, "epoch": 763} {"train_loss": -9.196846961975098, "global_step": 128257, "epoch": 763} {"train_loss": -10.326505661010742, "global_step": 128258, "epoch": 763} {"train_loss": -8.95361328125, "global_step": 128259, "epoch": 763} {"train_loss": -10.160177230834961, "global_step": 128260, "epoch": 763} {"train_loss": -9.845233917236328, "global_step": 128261, "epoch": 763} {"train_loss": -9.858123779296875, "global_step": 128262, "epoch": 763} {"train_loss": -10.341896057128906, "global_step": 128263, "epoch": 763} {"train_loss": -10.082450866699219, "global_step": 128264, "epoch": 763} {"train_loss": -10.259749412536621, "global_step": 128265, "epoch": 763} {"train_loss": -10.21197509765625, "global_step": 128266, "epoch": 763} {"train_loss": -10.034887313842773, "global_step": 128267, "epoch": 763} {"train_loss": -10.115194320678711, "global_step": 128268, "epoch": 763} {"train_loss": -10.241610527038574, "global_step": 128269, "epoch": 763} {"train_loss": -10.163124084472656, "global_step": 128270, "epoch": 763} {"train_loss": -10.32044792175293, "global_step": 128271, "epoch": 763} {"train_loss": -10.110307693481445, "global_step": 128272, "epoch": 763} {"train_loss": -10.252298355102539, "global_step": 128273, "epoch": 763} {"train_loss": -10.40466594696045, "global_step": 128274, "epoch": 763} {"train_loss": -10.203155517578125, "global_step": 128275, "epoch": 763} {"train_loss": -10.303930282592773, "global_step": 128276, "epoch": 763} {"train_loss": -10.290481567382812, "global_step": 128277, "epoch": 763} {"train_loss": -10.615455627441406, "global_step": 128278, "epoch": 763} {"train_loss": -10.276811599731445, "global_step": 128279, "epoch": 763} {"train_loss": -10.144658088684082, "global_step": 128280, "epoch": 763} {"train_loss": -10.423506736755371, "global_step": 128281, "epoch": 763} {"train_loss": -10.253503799438477, "global_step": 128282, "epoch": 763} {"train_loss": -10.39224624633789, "global_step": 128283, "epoch": 763} {"train_loss": -10.321240425109863, "global_step": 128284, "epoch": 763} {"train_loss": -10.444446563720703, "global_step": 128285, "epoch": 763} {"train_loss": -10.47882080078125, "global_step": 128286, "epoch": 763} {"train_loss": -10.634315490722656, "global_step": 128287, "epoch": 763} {"train_loss": -10.768468856811523, "global_step": 128288, "epoch": 763} {"train_loss": -10.545799255371094, "global_step": 128289, "epoch": 763} {"train_loss": -10.681254386901855, "global_step": 128290, "epoch": 763} {"train_loss": -10.653755187988281, "global_step": 128291, "epoch": 763} {"train_loss": -10.47231674194336, "global_step": 128292, "epoch": 763} {"train_loss": -10.6639404296875, "global_step": 128293, "epoch": 763} {"train_loss": -10.616628646850586, "global_step": 128294, "epoch": 763} {"train_loss": -10.529945373535156, "global_step": 128295, "epoch": 763} {"train_loss": -10.681303024291992, "global_step": 128296, "epoch": 763} {"train_loss": -10.562507629394531, "global_step": 128297, "epoch": 763} {"train_loss": -10.655450820922852, "global_step": 128298, "epoch": 763} {"train_loss": -10.651172637939453, "global_step": 128299, "epoch": 763} {"train_loss": -10.525903701782227, "global_step": 128300, "epoch": 763} {"train_loss": -10.496599197387695, "global_step": 128301, "epoch": 763} {"train_loss": -10.41889762878418, "global_step": 128302, "epoch": 763} {"train_loss": -10.442112922668457, "global_step": 128303, "epoch": 763} {"train_loss": -9.573736190795898, "global_step": 128304, "epoch": 763} {"train_loss": -10.057960510253906, "global_step": 128305, "epoch": 763} {"train_loss": -10.124065399169922, "global_step": 128306, "epoch": 763} {"train_loss": -10.5628023147583, "global_step": 128307, "epoch": 763} {"train_loss": -10.542308807373047, "global_step": 128308, "epoch": 763} {"train_loss": -9.967092514038086, "global_step": 128309, "epoch": 763} {"train_loss": -10.200474739074707, "global_step": 128310, "epoch": 763} {"train_loss": -10.38802719116211, "global_step": 128311, "epoch": 763} {"train_loss": -10.195089340209961, "global_step": 128312, "epoch": 763} {"train_loss": -10.219598770141602, "global_step": 128313, "epoch": 763} {"train_loss": -10.19696044921875, "global_step": 128314, "epoch": 763} {"train_loss": -9.97119140625, "global_step": 128315, "epoch": 763} {"train_loss": -10.017669677734375, "global_step": 128316, "epoch": 763} {"train_loss": -10.42031478881836, "global_step": 128317, "epoch": 763} {"train_loss": -10.203069686889648, "global_step": 128318, "epoch": 763} {"train_loss": -10.423301696777344, "global_step": 128319, "epoch": 763} {"train_loss": -10.276451110839844, "global_step": 128320, "epoch": 763} {"train_loss": -10.071908950805664, "global_step": 128321, "epoch": 763} {"train_loss": -9.932493209838867, "global_step": 128322, "epoch": 763} {"train_loss": -10.037447929382324, "global_step": 128323, "epoch": 763} {"train_loss": -10.072986602783203, "global_step": 128324, "epoch": 763} {"train_loss": -10.055301666259766, "global_step": 128325, "epoch": 763} {"train_loss": -10.401117324829102, "global_step": 128326, "epoch": 763} {"train_loss": -10.061820983886719, "global_step": 128327, "epoch": 763} {"train_loss": -10.4381103515625, "global_step": 128328, "epoch": 763} {"train_loss": -10.220927238464355, "global_step": 128329, "epoch": 763} {"train_loss": -10.308975219726562, "global_step": 128330, "epoch": 763} {"train_loss": -10.360063552856445, "global_step": 128331, "epoch": 763} {"train_loss": -10.326486587524414, "global_step": 128332, "epoch": 763} {"train_loss": -10.378827095031738, "global_step": 128333, "epoch": 763} {"train_loss": -10.26582145690918, "global_step": 128334, "epoch": 763} {"train_loss": -10.383893966674805, "global_step": 128335, "epoch": 763} {"train_loss": -10.12218952178955, "global_step": 128336, "epoch": 763} {"train_loss": -10.441911697387695, "global_step": 128337, "epoch": 763} {"train_loss": -10.439397811889648, "global_step": 128338, "epoch": 763} {"train_loss": -10.268900871276855, "global_step": 128339, "epoch": 763} {"train_loss": -10.257698059082031, "global_step": 128340, "epoch": 763} {"train_loss": -10.24058723449707, "global_step": 128341, "epoch": 763} {"train_loss": -10.399921417236328, "global_step": 128342, "epoch": 763} {"train_loss": -10.203072547912598, "global_step": 128343, "epoch": 763} {"train_loss": -10.34593391418457, "global_step": 128344, "epoch": 763} {"train_loss": -10.11721420288086, "global_step": 128345, "epoch": 763} {"train_loss": -10.353034973144531, "global_step": 128346, "epoch": 763} {"train_loss": -10.054633140563965, "global_step": 128347, "epoch": 763} {"train_loss": -9.90264892578125, "global_step": 128348, "epoch": 763} {"train_loss": -10.289957046508789, "global_step": 128349, "epoch": 763} {"train_loss": -10.386006355285645, "global_step": 128350, "epoch": 763} {"train_loss": -10.288658079646883, "global_step": 128351, "epoch": 763, "val_loss": 212946.546875} {"train_loss": -10.230384826660156, "global_step": 128352, "epoch": 764} {"train_loss": -10.30599308013916, "global_step": 128353, "epoch": 764} {"train_loss": -10.351104736328125, "global_step": 128354, "epoch": 764} {"train_loss": -10.383373260498047, "global_step": 128355, "epoch": 764} {"train_loss": -10.191190719604492, "global_step": 128356, "epoch": 764} {"train_loss": -10.441904067993164, "global_step": 128357, "epoch": 764} {"train_loss": -9.98633098602295, "global_step": 128358, "epoch": 764} {"train_loss": -10.466398239135742, "global_step": 128359, "epoch": 764} {"train_loss": -10.078697204589844, "global_step": 128360, "epoch": 764} {"train_loss": -10.520471572875977, "global_step": 128361, "epoch": 764} {"train_loss": -9.788055419921875, "global_step": 128362, "epoch": 764} {"train_loss": -10.354759216308594, "global_step": 128363, "epoch": 764} {"train_loss": -9.874896049499512, "global_step": 128364, "epoch": 764} {"train_loss": -10.552453994750977, "global_step": 128365, "epoch": 764} {"train_loss": -9.863136291503906, "global_step": 128366, "epoch": 764} {"train_loss": -10.241682052612305, "global_step": 128367, "epoch": 764} {"train_loss": -10.020176887512207, "global_step": 128368, "epoch": 764} {"train_loss": -10.212692260742188, "global_step": 128369, "epoch": 764} {"train_loss": -10.03915023803711, "global_step": 128370, "epoch": 764} {"train_loss": -9.859903335571289, "global_step": 128371, "epoch": 764} {"train_loss": -10.042482376098633, "global_step": 128372, "epoch": 764} {"train_loss": -10.057926177978516, "global_step": 128373, "epoch": 764} {"train_loss": -10.01134204864502, "global_step": 128374, "epoch": 764} {"train_loss": -9.845707893371582, "global_step": 128375, "epoch": 764} {"train_loss": -9.519401550292969, "global_step": 128376, "epoch": 764} {"train_loss": -9.271465301513672, "global_step": 128377, "epoch": 764} {"train_loss": -9.742712020874023, "global_step": 128378, "epoch": 764} {"train_loss": -9.594294548034668, "global_step": 128379, "epoch": 764} {"train_loss": -9.717158317565918, "global_step": 128380, "epoch": 764} {"train_loss": -10.204900741577148, "global_step": 128381, "epoch": 764} {"train_loss": -9.445587158203125, "global_step": 128382, "epoch": 764} {"train_loss": -10.609919548034668, "global_step": 128383, "epoch": 764} {"train_loss": -9.34693431854248, "global_step": 128384, "epoch": 764} {"train_loss": -10.06761360168457, "global_step": 128385, "epoch": 764} {"train_loss": -10.031540870666504, "global_step": 128386, "epoch": 764} {"train_loss": -10.215346336364746, "global_step": 128387, "epoch": 764} {"train_loss": -10.527694702148438, "global_step": 128388, "epoch": 764} {"train_loss": -10.15703010559082, "global_step": 128389, "epoch": 764} {"train_loss": -10.132318496704102, "global_step": 128390, "epoch": 764} {"train_loss": -10.113411903381348, "global_step": 128391, "epoch": 764} {"train_loss": -10.082487106323242, "global_step": 128392, "epoch": 764} {"train_loss": -10.244050979614258, "global_step": 128393, "epoch": 764} {"train_loss": -10.148775100708008, "global_step": 128394, "epoch": 764} {"train_loss": -10.296092987060547, "global_step": 128395, "epoch": 764} {"train_loss": -10.175797462463379, "global_step": 128396, "epoch": 764} {"train_loss": -10.2800931930542, "global_step": 128397, "epoch": 764} {"train_loss": -10.387064933776855, "global_step": 128398, "epoch": 764} {"train_loss": -10.135042190551758, "global_step": 128399, "epoch": 764} {"train_loss": -10.296921730041504, "global_step": 128400, "epoch": 764} {"train_loss": -10.247626304626465, "global_step": 128401, "epoch": 764} {"train_loss": -10.32095718383789, "global_step": 128402, "epoch": 764} {"train_loss": -10.232377052307129, "global_step": 128403, "epoch": 764} {"train_loss": -10.163362503051758, "global_step": 128404, "epoch": 764} {"train_loss": -10.207916259765625, "global_step": 128405, "epoch": 764} {"train_loss": -10.225178718566895, "global_step": 128406, "epoch": 764} {"train_loss": -10.390840530395508, "global_step": 128407, "epoch": 764} {"train_loss": -10.40730094909668, "global_step": 128408, "epoch": 764} {"train_loss": -10.280839920043945, "global_step": 128409, "epoch": 764} {"train_loss": -10.27212905883789, "global_step": 128410, "epoch": 764} {"train_loss": -10.471748352050781, "global_step": 128411, "epoch": 764} {"train_loss": -10.532037734985352, "global_step": 128412, "epoch": 764} {"train_loss": -10.583304405212402, "global_step": 128413, "epoch": 764} {"train_loss": -10.515975952148438, "global_step": 128414, "epoch": 764} {"train_loss": -10.584798812866211, "global_step": 128415, "epoch": 764} {"train_loss": -10.191694259643555, "global_step": 128416, "epoch": 764} {"train_loss": -10.441856384277344, "global_step": 128417, "epoch": 764} {"train_loss": -10.440869331359863, "global_step": 128418, "epoch": 764} {"train_loss": -10.663174629211426, "global_step": 128419, "epoch": 764} {"train_loss": -10.612438201904297, "global_step": 128420, "epoch": 764} {"train_loss": -10.143634796142578, "global_step": 128421, "epoch": 764} {"train_loss": -10.57829475402832, "global_step": 128422, "epoch": 764} {"train_loss": -10.24533462524414, "global_step": 128423, "epoch": 764} {"train_loss": -10.364811897277832, "global_step": 128424, "epoch": 764} {"train_loss": -10.61693286895752, "global_step": 128425, "epoch": 764} {"train_loss": -10.484183311462402, "global_step": 128426, "epoch": 764} {"train_loss": -10.450614929199219, "global_step": 128427, "epoch": 764} {"train_loss": -10.628791809082031, "global_step": 128428, "epoch": 764} {"train_loss": -10.529744148254395, "global_step": 128429, "epoch": 764} {"train_loss": -10.413660049438477, "global_step": 128430, "epoch": 764} {"train_loss": -10.551603317260742, "global_step": 128431, "epoch": 764} {"train_loss": -10.637487411499023, "global_step": 128432, "epoch": 764} {"train_loss": -10.804815292358398, "global_step": 128433, "epoch": 764} {"train_loss": -10.389430046081543, "global_step": 128434, "epoch": 764} {"train_loss": -10.534246444702148, "global_step": 128435, "epoch": 764} {"train_loss": -10.401382446289062, "global_step": 128436, "epoch": 764} {"train_loss": -10.474579811096191, "global_step": 128437, "epoch": 764} {"train_loss": -10.432599067687988, "global_step": 128438, "epoch": 764} {"train_loss": -10.509918212890625, "global_step": 128439, "epoch": 764} {"train_loss": -10.62533950805664, "global_step": 128440, "epoch": 764} {"train_loss": -10.42851448059082, "global_step": 128441, "epoch": 764} {"train_loss": -10.374442100524902, "global_step": 128442, "epoch": 764} {"train_loss": -10.154096603393555, "global_step": 128443, "epoch": 764} {"train_loss": -10.119860649108887, "global_step": 128444, "epoch": 764} {"train_loss": -10.362592697143555, "global_step": 128445, "epoch": 764} {"train_loss": -8.81002426147461, "global_step": 128446, "epoch": 764} {"train_loss": -10.402914047241211, "global_step": 128447, "epoch": 764} {"train_loss": -10.188331604003906, "global_step": 128448, "epoch": 764} {"train_loss": -10.137325286865234, "global_step": 128449, "epoch": 764} {"train_loss": -10.328607559204102, "global_step": 128450, "epoch": 764} {"train_loss": -10.094825744628906, "global_step": 128451, "epoch": 764} {"train_loss": -10.00918197631836, "global_step": 128452, "epoch": 764} {"train_loss": -10.347554206848145, "global_step": 128453, "epoch": 764} {"train_loss": -9.826520919799805, "global_step": 128454, "epoch": 764} {"train_loss": -9.655729293823242, "global_step": 128455, "epoch": 764} {"train_loss": -10.309870719909668, "global_step": 128456, "epoch": 764} {"train_loss": -10.009805679321289, "global_step": 128457, "epoch": 764} {"train_loss": -10.306349754333496, "global_step": 128458, "epoch": 764} {"train_loss": -10.085233688354492, "global_step": 128459, "epoch": 764} {"train_loss": -10.351794242858887, "global_step": 128460, "epoch": 764} {"train_loss": -9.65020751953125, "global_step": 128461, "epoch": 764} {"train_loss": -10.329601287841797, "global_step": 128462, "epoch": 764} {"train_loss": -9.774776458740234, "global_step": 128463, "epoch": 764} {"train_loss": -10.31987190246582, "global_step": 128464, "epoch": 764} {"train_loss": -9.891387939453125, "global_step": 128465, "epoch": 764} {"train_loss": -10.028515815734863, "global_step": 128466, "epoch": 764} {"train_loss": -9.87842082977295, "global_step": 128467, "epoch": 764} {"train_loss": -9.673421859741211, "global_step": 128468, "epoch": 764} {"train_loss": -9.949111938476562, "global_step": 128469, "epoch": 764} {"train_loss": -9.652761459350586, "global_step": 128470, "epoch": 764} {"train_loss": -10.246919631958008, "global_step": 128471, "epoch": 764} {"train_loss": -9.697897911071777, "global_step": 128472, "epoch": 764} {"train_loss": -9.588339805603027, "global_step": 128473, "epoch": 764} {"train_loss": -10.191993713378906, "global_step": 128474, "epoch": 764} {"train_loss": -10.038232803344727, "global_step": 128475, "epoch": 764} {"train_loss": -9.755972862243652, "global_step": 128476, "epoch": 764} {"train_loss": -9.90977954864502, "global_step": 128477, "epoch": 764} {"train_loss": -10.111557006835938, "global_step": 128478, "epoch": 764} {"train_loss": -9.836904525756836, "global_step": 128479, "epoch": 764} {"train_loss": -9.738994598388672, "global_step": 128480, "epoch": 764} {"train_loss": -10.311182975769043, "global_step": 128481, "epoch": 764} {"train_loss": -9.758890151977539, "global_step": 128482, "epoch": 764} {"train_loss": -9.633771896362305, "global_step": 128483, "epoch": 764} {"train_loss": -10.260679244995117, "global_step": 128484, "epoch": 764} {"train_loss": -9.736284255981445, "global_step": 128485, "epoch": 764} {"train_loss": -10.17040729522705, "global_step": 128486, "epoch": 764} {"train_loss": -10.148478507995605, "global_step": 128487, "epoch": 764} {"train_loss": -10.175511360168457, "global_step": 128488, "epoch": 764} {"train_loss": -9.956947326660156, "global_step": 128489, "epoch": 764} {"train_loss": -10.094568252563477, "global_step": 128490, "epoch": 764} {"train_loss": -10.032424926757812, "global_step": 128491, "epoch": 764} {"train_loss": -10.10362720489502, "global_step": 128492, "epoch": 764} {"train_loss": -10.395881652832031, "global_step": 128493, "epoch": 764} {"train_loss": -9.946832656860352, "global_step": 128494, "epoch": 764} {"train_loss": -10.309123039245605, "global_step": 128495, "epoch": 764} {"train_loss": -10.248783111572266, "global_step": 128496, "epoch": 764} {"train_loss": -10.247660636901855, "global_step": 128497, "epoch": 764} {"train_loss": -10.067909240722656, "global_step": 128498, "epoch": 764} {"train_loss": -10.224628448486328, "global_step": 128499, "epoch": 764} {"train_loss": -10.325023651123047, "global_step": 128500, "epoch": 764} {"train_loss": -10.360340118408203, "global_step": 128501, "epoch": 764} {"train_loss": -10.120850563049316, "global_step": 128502, "epoch": 764} {"train_loss": -10.363892555236816, "global_step": 128503, "epoch": 764} {"train_loss": -10.438183784484863, "global_step": 128504, "epoch": 764} {"train_loss": -10.314254760742188, "global_step": 128505, "epoch": 764} {"train_loss": -10.379789352416992, "global_step": 128506, "epoch": 764} {"train_loss": -10.392627716064453, "global_step": 128507, "epoch": 764} {"train_loss": -10.188440322875977, "global_step": 128508, "epoch": 764} {"train_loss": -10.287165641784668, "global_step": 128509, "epoch": 764} {"train_loss": -10.445781707763672, "global_step": 128510, "epoch": 764} {"train_loss": -10.208399772644043, "global_step": 128511, "epoch": 764} {"train_loss": -10.39360237121582, "global_step": 128512, "epoch": 764} {"train_loss": -10.52434253692627, "global_step": 128513, "epoch": 764} {"train_loss": -10.399054527282715, "global_step": 128514, "epoch": 764} {"train_loss": -10.56713581085205, "global_step": 128515, "epoch": 764} {"train_loss": -10.565825462341309, "global_step": 128516, "epoch": 764} {"train_loss": -10.314216613769531, "global_step": 128517, "epoch": 764} {"train_loss": -10.567190170288086, "global_step": 128518, "epoch": 764} {"train_loss": -10.19184694971357, "global_step": 128519, "epoch": 764, "val_loss": 220650.234375} {"train_loss": -10.48320198059082, "global_step": 128520, "epoch": 765} {"train_loss": -10.271295547485352, "global_step": 128521, "epoch": 765} {"train_loss": -10.396965026855469, "global_step": 128522, "epoch": 765} {"train_loss": -10.600486755371094, "global_step": 128523, "epoch": 765} {"train_loss": -10.4305419921875, "global_step": 128524, "epoch": 765} {"train_loss": -10.674692153930664, "global_step": 128525, "epoch": 765} {"train_loss": -10.488739967346191, "global_step": 128526, "epoch": 765} {"train_loss": -10.315665245056152, "global_step": 128527, "epoch": 765} {"train_loss": -10.451705932617188, "global_step": 128528, "epoch": 765} {"train_loss": -10.63322925567627, "global_step": 128529, "epoch": 765} {"train_loss": -10.497230529785156, "global_step": 128530, "epoch": 765} {"train_loss": -10.597522735595703, "global_step": 128531, "epoch": 765} {"train_loss": -10.79818058013916, "global_step": 128532, "epoch": 765} {"train_loss": -10.548149108886719, "global_step": 128533, "epoch": 765} {"train_loss": -10.469905853271484, "global_step": 128534, "epoch": 765} {"train_loss": -10.037184715270996, "global_step": 128535, "epoch": 765} {"train_loss": -10.565875053405762, "global_step": 128536, "epoch": 765} {"train_loss": -10.536022186279297, "global_step": 128537, "epoch": 765} {"train_loss": -10.35165786743164, "global_step": 128538, "epoch": 765} {"train_loss": -10.26991081237793, "global_step": 128539, "epoch": 765} {"train_loss": -10.545485496520996, "global_step": 128540, "epoch": 765} {"train_loss": -10.322517395019531, "global_step": 128541, "epoch": 765} {"train_loss": -10.382436752319336, "global_step": 128542, "epoch": 765} {"train_loss": -10.420334815979004, "global_step": 128543, "epoch": 765} {"train_loss": -10.165319442749023, "global_step": 128544, "epoch": 765} {"train_loss": -9.936555862426758, "global_step": 128545, "epoch": 765} {"train_loss": -10.448701858520508, "global_step": 128546, "epoch": 765} {"train_loss": -10.100225448608398, "global_step": 128547, "epoch": 765} {"train_loss": -10.239984512329102, "global_step": 128548, "epoch": 765} {"train_loss": -10.11164665222168, "global_step": 128549, "epoch": 765} {"train_loss": -10.399171829223633, "global_step": 128550, "epoch": 765} {"train_loss": -10.185622215270996, "global_step": 128551, "epoch": 765} {"train_loss": -9.487646102905273, "global_step": 128552, "epoch": 765} {"train_loss": -10.303732872009277, "global_step": 128553, "epoch": 765} {"train_loss": -9.65870475769043, "global_step": 128554, "epoch": 765} {"train_loss": -9.807256698608398, "global_step": 128555, "epoch": 765} {"train_loss": -9.741512298583984, "global_step": 128556, "epoch": 765} {"train_loss": -9.264504432678223, "global_step": 128557, "epoch": 765} {"train_loss": -8.500733375549316, "global_step": 128558, "epoch": 765} {"train_loss": -10.087868690490723, "global_step": 128559, "epoch": 765} {"train_loss": -10.08629035949707, "global_step": 128560, "epoch": 765} {"train_loss": -9.701946258544922, "global_step": 128561, "epoch": 765} {"train_loss": -10.098450660705566, "global_step": 128562, "epoch": 765} {"train_loss": -10.223814010620117, "global_step": 128563, "epoch": 765} {"train_loss": -9.570079803466797, "global_step": 128564, "epoch": 765} {"train_loss": -10.344704627990723, "global_step": 128565, "epoch": 765} {"train_loss": -9.66329574584961, "global_step": 128566, "epoch": 765} {"train_loss": -10.197113037109375, "global_step": 128567, "epoch": 765} {"train_loss": -9.96456527709961, "global_step": 128568, "epoch": 765} {"train_loss": -9.8546724319458, "global_step": 128569, "epoch": 765} {"train_loss": -10.34017562866211, "global_step": 128570, "epoch": 765} {"train_loss": -10.179022789001465, "global_step": 128571, "epoch": 765} {"train_loss": -10.166807174682617, "global_step": 128572, "epoch": 765} {"train_loss": -10.177940368652344, "global_step": 128573, "epoch": 765} {"train_loss": -9.997518539428711, "global_step": 128574, "epoch": 765} {"train_loss": -10.062119483947754, "global_step": 128575, "epoch": 765} {"train_loss": -9.73377799987793, "global_step": 128576, "epoch": 765} {"train_loss": -10.183740615844727, "global_step": 128577, "epoch": 765} {"train_loss": -10.209420204162598, "global_step": 128578, "epoch": 765} {"train_loss": -10.35873794555664, "global_step": 128579, "epoch": 765} {"train_loss": -10.11658763885498, "global_step": 128580, "epoch": 765} {"train_loss": -10.417724609375, "global_step": 128581, "epoch": 765} {"train_loss": -10.082921981811523, "global_step": 128582, "epoch": 765} {"train_loss": -10.354166030883789, "global_step": 128583, "epoch": 765} {"train_loss": -10.311535835266113, "global_step": 128584, "epoch": 765} {"train_loss": -10.229334831237793, "global_step": 128585, "epoch": 765} {"train_loss": -10.12285041809082, "global_step": 128586, "epoch": 765} {"train_loss": -10.575737953186035, "global_step": 128587, "epoch": 765} {"train_loss": -10.397531509399414, "global_step": 128588, "epoch": 765} {"train_loss": -10.382584571838379, "global_step": 128589, "epoch": 765} {"train_loss": -10.278360366821289, "global_step": 128590, "epoch": 765} {"train_loss": -10.570476531982422, "global_step": 128591, "epoch": 765} {"train_loss": -10.166990280151367, "global_step": 128592, "epoch": 765} {"train_loss": -10.471413612365723, "global_step": 128593, "epoch": 765} {"train_loss": -10.404007911682129, "global_step": 128594, "epoch": 765} {"train_loss": -10.581780433654785, "global_step": 128595, "epoch": 765} {"train_loss": -10.432156562805176, "global_step": 128596, "epoch": 765} {"train_loss": -10.683422088623047, "global_step": 128597, "epoch": 765} {"train_loss": -10.273313522338867, "global_step": 128598, "epoch": 765} {"train_loss": -10.572091102600098, "global_step": 128599, "epoch": 765} {"train_loss": -10.410649299621582, "global_step": 128600, "epoch": 765} {"train_loss": -10.473953247070312, "global_step": 128601, "epoch": 765} {"train_loss": -10.452558517456055, "global_step": 128602, "epoch": 765} {"train_loss": -10.724851608276367, "global_step": 128603, "epoch": 765} {"train_loss": -10.647588729858398, "global_step": 128604, "epoch": 765} {"train_loss": -10.512475967407227, "global_step": 128605, "epoch": 765} {"train_loss": -10.575241088867188, "global_step": 128606, "epoch": 765} {"train_loss": -10.676682472229004, "global_step": 128607, "epoch": 765} {"train_loss": -10.416193008422852, "global_step": 128608, "epoch": 765} {"train_loss": -10.606072425842285, "global_step": 128609, "epoch": 765} {"train_loss": -10.6005220413208, "global_step": 128610, "epoch": 765} {"train_loss": -10.29155158996582, "global_step": 128611, "epoch": 765} {"train_loss": -10.500219345092773, "global_step": 128612, "epoch": 765} {"train_loss": -10.28624153137207, "global_step": 128613, "epoch": 765} {"train_loss": -9.98095417022705, "global_step": 128614, "epoch": 765} {"train_loss": -10.380645751953125, "global_step": 128615, "epoch": 765} {"train_loss": -9.578332901000977, "global_step": 128616, "epoch": 765} {"train_loss": -9.918804168701172, "global_step": 128617, "epoch": 765} {"train_loss": -9.674033164978027, "global_step": 128618, "epoch": 765} {"train_loss": -9.776678085327148, "global_step": 128619, "epoch": 765} {"train_loss": -9.782512664794922, "global_step": 128620, "epoch": 765} {"train_loss": -9.285408020019531, "global_step": 128621, "epoch": 765} {"train_loss": -9.986711502075195, "global_step": 128622, "epoch": 765} {"train_loss": -9.552356719970703, "global_step": 128623, "epoch": 765} {"train_loss": -9.88400650024414, "global_step": 128624, "epoch": 765} {"train_loss": -9.831656455993652, "global_step": 128625, "epoch": 765} {"train_loss": -10.264476776123047, "global_step": 128626, "epoch": 765} {"train_loss": -9.713157653808594, "global_step": 128627, "epoch": 765} {"train_loss": -10.09555435180664, "global_step": 128628, "epoch": 765} {"train_loss": -9.645965576171875, "global_step": 128629, "epoch": 765} {"train_loss": -9.784622192382812, "global_step": 128630, "epoch": 765} {"train_loss": -9.760591506958008, "global_step": 128631, "epoch": 765} {"train_loss": -10.205218315124512, "global_step": 128632, "epoch": 765} {"train_loss": -9.884140014648438, "global_step": 128633, "epoch": 765} {"train_loss": -10.093889236450195, "global_step": 128634, "epoch": 765} {"train_loss": -10.024492263793945, "global_step": 128635, "epoch": 765} {"train_loss": -10.176136016845703, "global_step": 128636, "epoch": 765} {"train_loss": -9.82691764831543, "global_step": 128637, "epoch": 765} {"train_loss": -10.265438079833984, "global_step": 128638, "epoch": 765} {"train_loss": -10.061938285827637, "global_step": 128639, "epoch": 765} {"train_loss": -10.0071382522583, "global_step": 128640, "epoch": 765} {"train_loss": -9.956786155700684, "global_step": 128641, "epoch": 765} {"train_loss": -10.478734970092773, "global_step": 128642, "epoch": 765} {"train_loss": -10.041165351867676, "global_step": 128643, "epoch": 765} {"train_loss": -10.192289352416992, "global_step": 128644, "epoch": 765} {"train_loss": -10.100456237792969, "global_step": 128645, "epoch": 765} {"train_loss": -9.999306678771973, "global_step": 128646, "epoch": 765} {"train_loss": -10.227947235107422, "global_step": 128647, "epoch": 765} {"train_loss": -10.263581275939941, "global_step": 128648, "epoch": 765} {"train_loss": -10.365001678466797, "global_step": 128649, "epoch": 765} {"train_loss": -10.148262023925781, "global_step": 128650, "epoch": 765} {"train_loss": -10.42487907409668, "global_step": 128651, "epoch": 765} {"train_loss": -10.225330352783203, "global_step": 128652, "epoch": 765} {"train_loss": -10.324396133422852, "global_step": 128653, "epoch": 765} {"train_loss": -10.3263521194458, "global_step": 128654, "epoch": 765} {"train_loss": -10.401174545288086, "global_step": 128655, "epoch": 765} {"train_loss": -10.52488899230957, "global_step": 128656, "epoch": 765} {"train_loss": -10.335714340209961, "global_step": 128657, "epoch": 765} {"train_loss": -10.432720184326172, "global_step": 128658, "epoch": 765} {"train_loss": -10.488285064697266, "global_step": 128659, "epoch": 765} {"train_loss": -10.642038345336914, "global_step": 128660, "epoch": 765} {"train_loss": -10.500406265258789, "global_step": 128661, "epoch": 765} {"train_loss": -10.564957618713379, "global_step": 128662, "epoch": 765} {"train_loss": -10.468679428100586, "global_step": 128663, "epoch": 765} {"train_loss": -10.562784194946289, "global_step": 128664, "epoch": 765} {"train_loss": -10.408792495727539, "global_step": 128665, "epoch": 765} {"train_loss": -10.69650650024414, "global_step": 128666, "epoch": 765} {"train_loss": -10.181282043457031, "global_step": 128667, "epoch": 765} {"train_loss": -10.755672454833984, "global_step": 128668, "epoch": 765} {"train_loss": -10.435436248779297, "global_step": 128669, "epoch": 765} {"train_loss": -10.521652221679688, "global_step": 128670, "epoch": 765} {"train_loss": -10.477216720581055, "global_step": 128671, "epoch": 765} {"train_loss": -10.542442321777344, "global_step": 128672, "epoch": 765} {"train_loss": -10.257918357849121, "global_step": 128673, "epoch": 765} {"train_loss": -10.570199012756348, "global_step": 128674, "epoch": 765} {"train_loss": -10.361632347106934, "global_step": 128675, "epoch": 765} {"train_loss": -10.203646659851074, "global_step": 128676, "epoch": 765} {"train_loss": -10.618908882141113, "global_step": 128677, "epoch": 765} {"train_loss": -9.507307052612305, "global_step": 128678, "epoch": 765} {"train_loss": -10.333874702453613, "global_step": 128679, "epoch": 765} {"train_loss": -9.843573570251465, "global_step": 128680, "epoch": 765} {"train_loss": -10.072830200195312, "global_step": 128681, "epoch": 765} {"train_loss": -9.831025123596191, "global_step": 128682, "epoch": 765} {"train_loss": -10.054832458496094, "global_step": 128683, "epoch": 765} {"train_loss": -10.145670890808105, "global_step": 128684, "epoch": 765} {"train_loss": -9.520490646362305, "global_step": 128685, "epoch": 765} {"train_loss": -10.19489860534668, "global_step": 128686, "epoch": 765} {"train_loss": -10.211434500558036, "global_step": 128687, "epoch": 765, "val_loss": 216223.015625, "train_action_mse_error": 0.41402366757392883} {"train_loss": -10.399478912353516, "global_step": 128688, "epoch": 766} {"train_loss": -10.018392562866211, "global_step": 128689, "epoch": 766} {"train_loss": -10.198650360107422, "global_step": 128690, "epoch": 766} {"train_loss": -10.096443176269531, "global_step": 128691, "epoch": 766} {"train_loss": -9.987076759338379, "global_step": 128692, "epoch": 766} {"train_loss": -9.976036071777344, "global_step": 128693, "epoch": 766} {"train_loss": -9.424358367919922, "global_step": 128694, "epoch": 766} {"train_loss": -9.64546012878418, "global_step": 128695, "epoch": 766} {"train_loss": -9.902705192565918, "global_step": 128696, "epoch": 766} {"train_loss": -9.871822357177734, "global_step": 128697, "epoch": 766} {"train_loss": -10.258697509765625, "global_step": 128698, "epoch": 766} {"train_loss": -10.025618553161621, "global_step": 128699, "epoch": 766} {"train_loss": -10.26251220703125, "global_step": 128700, "epoch": 766} {"train_loss": -10.044733047485352, "global_step": 128701, "epoch": 766} {"train_loss": -10.149974822998047, "global_step": 128702, "epoch": 766} {"train_loss": -10.317805290222168, "global_step": 128703, "epoch": 766} {"train_loss": -10.133551597595215, "global_step": 128704, "epoch": 766} {"train_loss": -10.024066925048828, "global_step": 128705, "epoch": 766} {"train_loss": -9.875375747680664, "global_step": 128706, "epoch": 766} {"train_loss": -10.172794342041016, "global_step": 128707, "epoch": 766} {"train_loss": -10.281805038452148, "global_step": 128708, "epoch": 766} {"train_loss": -9.846001625061035, "global_step": 128709, "epoch": 766} {"train_loss": -10.186097145080566, "global_step": 128710, "epoch": 766} {"train_loss": -10.302726745605469, "global_step": 128711, "epoch": 766} {"train_loss": -10.312336921691895, "global_step": 128712, "epoch": 766} {"train_loss": -10.32153034210205, "global_step": 128713, "epoch": 766} {"train_loss": -10.371842384338379, "global_step": 128714, "epoch": 766} {"train_loss": -10.259881973266602, "global_step": 128715, "epoch": 766} {"train_loss": -10.478816986083984, "global_step": 128716, "epoch": 766} {"train_loss": -10.374544143676758, "global_step": 128717, "epoch": 766} {"train_loss": -10.546019554138184, "global_step": 128718, "epoch": 766} {"train_loss": -10.454534530639648, "global_step": 128719, "epoch": 766} {"train_loss": -10.343709945678711, "global_step": 128720, "epoch": 766} {"train_loss": -10.153595924377441, "global_step": 128721, "epoch": 766} {"train_loss": -10.347620964050293, "global_step": 128722, "epoch": 766} {"train_loss": -10.528031349182129, "global_step": 128723, "epoch": 766} {"train_loss": -10.558595657348633, "global_step": 128724, "epoch": 766} {"train_loss": -10.505775451660156, "global_step": 128725, "epoch": 766} {"train_loss": -10.650293350219727, "global_step": 128726, "epoch": 766} {"train_loss": -10.602798461914062, "global_step": 128727, "epoch": 766} {"train_loss": -10.490398406982422, "global_step": 128728, "epoch": 766} {"train_loss": -10.269796371459961, "global_step": 128729, "epoch": 766} {"train_loss": -10.248204231262207, "global_step": 128730, "epoch": 766} {"train_loss": -10.429937362670898, "global_step": 128731, "epoch": 766} {"train_loss": -10.1652193069458, "global_step": 128732, "epoch": 766} {"train_loss": -9.990547180175781, "global_step": 128733, "epoch": 766} {"train_loss": -10.300661087036133, "global_step": 128734, "epoch": 766} {"train_loss": -9.82827377319336, "global_step": 128735, "epoch": 766} {"train_loss": -10.243626594543457, "global_step": 128736, "epoch": 766} {"train_loss": -10.314170837402344, "global_step": 128737, "epoch": 766} {"train_loss": -10.321128845214844, "global_step": 128738, "epoch": 766} {"train_loss": -10.178731918334961, "global_step": 128739, "epoch": 766} {"train_loss": -10.04257583618164, "global_step": 128740, "epoch": 766} {"train_loss": -9.887056350708008, "global_step": 128741, "epoch": 766} {"train_loss": -10.60314655303955, "global_step": 128742, "epoch": 766} {"train_loss": -9.808025360107422, "global_step": 128743, "epoch": 766} {"train_loss": -9.950319290161133, "global_step": 128744, "epoch": 766} {"train_loss": -9.896744728088379, "global_step": 128745, "epoch": 766} {"train_loss": -10.068016052246094, "global_step": 128746, "epoch": 766} {"train_loss": -9.735703468322754, "global_step": 128747, "epoch": 766} {"train_loss": -10.051063537597656, "global_step": 128748, "epoch": 766} {"train_loss": -9.985978126525879, "global_step": 128749, "epoch": 766} {"train_loss": -10.117399215698242, "global_step": 128750, "epoch": 766} {"train_loss": -9.88994312286377, "global_step": 128751, "epoch": 766} {"train_loss": -9.984253883361816, "global_step": 128752, "epoch": 766} {"train_loss": -10.428070068359375, "global_step": 128753, "epoch": 766} {"train_loss": -9.354938507080078, "global_step": 128754, "epoch": 766} {"train_loss": -10.145474433898926, "global_step": 128755, "epoch": 766} {"train_loss": -9.914440155029297, "global_step": 128756, "epoch": 766} {"train_loss": -9.978689193725586, "global_step": 128757, "epoch": 766} {"train_loss": -9.629376411437988, "global_step": 128758, "epoch": 766} {"train_loss": -10.276323318481445, "global_step": 128759, "epoch": 766} {"train_loss": -9.580875396728516, "global_step": 128760, "epoch": 766} {"train_loss": -10.073240280151367, "global_step": 128761, "epoch": 766} {"train_loss": -10.056695938110352, "global_step": 128762, "epoch": 766} {"train_loss": -9.7549409866333, "global_step": 128763, "epoch": 766} {"train_loss": -9.95659351348877, "global_step": 128764, "epoch": 766} {"train_loss": -10.075135231018066, "global_step": 128765, "epoch": 766} {"train_loss": -9.976936340332031, "global_step": 128766, "epoch": 766} {"train_loss": -9.869595527648926, "global_step": 128767, "epoch": 766} {"train_loss": -9.906091690063477, "global_step": 128768, "epoch": 766} {"train_loss": -10.422248840332031, "global_step": 128769, "epoch": 766} {"train_loss": -9.707181930541992, "global_step": 128770, "epoch": 766} {"train_loss": -10.132010459899902, "global_step": 128771, "epoch": 766} {"train_loss": -10.350057601928711, "global_step": 128772, "epoch": 766} {"train_loss": -10.003969192504883, "global_step": 128773, "epoch": 766} {"train_loss": -10.321572303771973, "global_step": 128774, "epoch": 766} {"train_loss": -10.160922050476074, "global_step": 128775, "epoch": 766} {"train_loss": -10.171402931213379, "global_step": 128776, "epoch": 766} {"train_loss": -10.273626327514648, "global_step": 128777, "epoch": 766} {"train_loss": -10.456339836120605, "global_step": 128778, "epoch": 766} {"train_loss": -10.166702270507812, "global_step": 128779, "epoch": 766} {"train_loss": -10.431825637817383, "global_step": 128780, "epoch": 766} {"train_loss": -10.298423767089844, "global_step": 128781, "epoch": 766} {"train_loss": -10.149190902709961, "global_step": 128782, "epoch": 766} {"train_loss": -10.184640884399414, "global_step": 128783, "epoch": 766} {"train_loss": -10.424714088439941, "global_step": 128784, "epoch": 766} {"train_loss": -10.239370346069336, "global_step": 128785, "epoch": 766} {"train_loss": -10.526018142700195, "global_step": 128786, "epoch": 766} {"train_loss": -10.276444435119629, "global_step": 128787, "epoch": 766} {"train_loss": -10.331539154052734, "global_step": 128788, "epoch": 766} {"train_loss": -10.242829322814941, "global_step": 128789, "epoch": 766} {"train_loss": -10.159786224365234, "global_step": 128790, "epoch": 766} {"train_loss": -10.306802749633789, "global_step": 128791, "epoch": 766} {"train_loss": -10.317832946777344, "global_step": 128792, "epoch": 766} {"train_loss": -10.236285209655762, "global_step": 128793, "epoch": 766} {"train_loss": -10.428750038146973, "global_step": 128794, "epoch": 766} {"train_loss": -10.146903991699219, "global_step": 128795, "epoch": 766} {"train_loss": -10.133689880371094, "global_step": 128796, "epoch": 766} {"train_loss": -10.230744361877441, "global_step": 128797, "epoch": 766} {"train_loss": -10.327375411987305, "global_step": 128798, "epoch": 766} {"train_loss": -10.324243545532227, "global_step": 128799, "epoch": 766} {"train_loss": -10.318010330200195, "global_step": 128800, "epoch": 766} {"train_loss": -10.49839973449707, "global_step": 128801, "epoch": 766} {"train_loss": -10.270462036132812, "global_step": 128802, "epoch": 766} {"train_loss": -10.526247024536133, "global_step": 128803, "epoch": 766} {"train_loss": -10.384517669677734, "global_step": 128804, "epoch": 766} {"train_loss": -10.242694854736328, "global_step": 128805, "epoch": 766} {"train_loss": -10.667418479919434, "global_step": 128806, "epoch": 766} {"train_loss": -9.748647689819336, "global_step": 128807, "epoch": 766} {"train_loss": -10.446588516235352, "global_step": 128808, "epoch": 766} {"train_loss": -10.353768348693848, "global_step": 128809, "epoch": 766} {"train_loss": -10.31212329864502, "global_step": 128810, "epoch": 766} {"train_loss": -10.45785140991211, "global_step": 128811, "epoch": 766} {"train_loss": -10.286664962768555, "global_step": 128812, "epoch": 766} {"train_loss": -10.555203437805176, "global_step": 128813, "epoch": 766} {"train_loss": -10.1375093460083, "global_step": 128814, "epoch": 766} {"train_loss": -10.244217872619629, "global_step": 128815, "epoch": 766} {"train_loss": -10.644476890563965, "global_step": 128816, "epoch": 766} {"train_loss": -10.402320861816406, "global_step": 128817, "epoch": 766} {"train_loss": -10.589591979980469, "global_step": 128818, "epoch": 766} {"train_loss": -10.426756858825684, "global_step": 128819, "epoch": 766} {"train_loss": -10.594205856323242, "global_step": 128820, "epoch": 766} {"train_loss": -10.361542701721191, "global_step": 128821, "epoch": 766} {"train_loss": -10.651378631591797, "global_step": 128822, "epoch": 766} {"train_loss": -10.437028884887695, "global_step": 128823, "epoch": 766} {"train_loss": -10.436406135559082, "global_step": 128824, "epoch": 766} {"train_loss": -10.290107727050781, "global_step": 128825, "epoch": 766} {"train_loss": -10.262552261352539, "global_step": 128826, "epoch": 766} {"train_loss": -9.82175064086914, "global_step": 128827, "epoch": 766} {"train_loss": -10.064489364624023, "global_step": 128828, "epoch": 766} {"train_loss": -10.455106735229492, "global_step": 128829, "epoch": 766} {"train_loss": -10.328712463378906, "global_step": 128830, "epoch": 766} {"train_loss": -10.460149765014648, "global_step": 128831, "epoch": 766} {"train_loss": -10.342207908630371, "global_step": 128832, "epoch": 766} {"train_loss": -10.389495849609375, "global_step": 128833, "epoch": 766} {"train_loss": -10.106067657470703, "global_step": 128834, "epoch": 766} {"train_loss": -9.932591438293457, "global_step": 128835, "epoch": 766} {"train_loss": -10.404006958007812, "global_step": 128836, "epoch": 766} {"train_loss": -10.166590690612793, "global_step": 128837, "epoch": 766} {"train_loss": -10.334248542785645, "global_step": 128838, "epoch": 766} {"train_loss": -10.200998306274414, "global_step": 128839, "epoch": 766} {"train_loss": -9.719890594482422, "global_step": 128840, "epoch": 766} {"train_loss": -10.407020568847656, "global_step": 128841, "epoch": 766} {"train_loss": -9.83147144317627, "global_step": 128842, "epoch": 766} {"train_loss": -10.178356170654297, "global_step": 128843, "epoch": 766} {"train_loss": -9.946904182434082, "global_step": 128844, "epoch": 766} {"train_loss": -9.530378341674805, "global_step": 128845, "epoch": 766} {"train_loss": -10.161392211914062, "global_step": 128846, "epoch": 766} {"train_loss": -9.750367164611816, "global_step": 128847, "epoch": 766} {"train_loss": -10.071300506591797, "global_step": 128848, "epoch": 766} {"train_loss": -9.891145706176758, "global_step": 128849, "epoch": 766} {"train_loss": -9.990294456481934, "global_step": 128850, "epoch": 766} {"train_loss": -10.060805320739746, "global_step": 128851, "epoch": 766} {"train_loss": -9.912795066833496, "global_step": 128852, "epoch": 766} {"train_loss": -10.185100555419922, "global_step": 128853, "epoch": 766} {"train_loss": -9.893463134765625, "global_step": 128854, "epoch": 766} {"train_loss": -10.185564285232907, "global_step": 128855, "epoch": 766, "val_loss": 218773.53125} {"train_loss": -9.967789649963379, "global_step": 128856, "epoch": 767} {"train_loss": -10.17741870880127, "global_step": 128857, "epoch": 767} {"train_loss": -10.123649597167969, "global_step": 128858, "epoch": 767} {"train_loss": -10.116803169250488, "global_step": 128859, "epoch": 767} {"train_loss": -10.036108016967773, "global_step": 128860, "epoch": 767} {"train_loss": -10.189112663269043, "global_step": 128861, "epoch": 767} {"train_loss": -10.044288635253906, "global_step": 128862, "epoch": 767} {"train_loss": -10.316009521484375, "global_step": 128863, "epoch": 767} {"train_loss": -10.388205528259277, "global_step": 128864, "epoch": 767} {"train_loss": -10.114189147949219, "global_step": 128865, "epoch": 767} {"train_loss": -10.097445487976074, "global_step": 128866, "epoch": 767} {"train_loss": -10.018030166625977, "global_step": 128867, "epoch": 767} {"train_loss": -10.064129829406738, "global_step": 128868, "epoch": 767} {"train_loss": -10.273177146911621, "global_step": 128869, "epoch": 767} {"train_loss": -10.209657669067383, "global_step": 128870, "epoch": 767} {"train_loss": -10.467947006225586, "global_step": 128871, "epoch": 767} {"train_loss": -10.151816368103027, "global_step": 128872, "epoch": 767} {"train_loss": -10.0983304977417, "global_step": 128873, "epoch": 767} {"train_loss": -10.018181800842285, "global_step": 128874, "epoch": 767} {"train_loss": -10.29781436920166, "global_step": 128875, "epoch": 767} {"train_loss": -10.1146821975708, "global_step": 128876, "epoch": 767} {"train_loss": -10.106698989868164, "global_step": 128877, "epoch": 767} {"train_loss": -9.99761962890625, "global_step": 128878, "epoch": 767} {"train_loss": -10.077958106994629, "global_step": 128879, "epoch": 767} {"train_loss": -10.013167381286621, "global_step": 128880, "epoch": 767} {"train_loss": -10.225822448730469, "global_step": 128881, "epoch": 767} {"train_loss": -9.840526580810547, "global_step": 128882, "epoch": 767} {"train_loss": -10.249685287475586, "global_step": 128883, "epoch": 767} {"train_loss": -10.14050006866455, "global_step": 128884, "epoch": 767} {"train_loss": -10.312494277954102, "global_step": 128885, "epoch": 767} {"train_loss": -10.42130184173584, "global_step": 128886, "epoch": 767} {"train_loss": -10.389571189880371, "global_step": 128887, "epoch": 767} {"train_loss": -10.538612365722656, "global_step": 128888, "epoch": 767} {"train_loss": -10.323357582092285, "global_step": 128889, "epoch": 767} {"train_loss": -10.326446533203125, "global_step": 128890, "epoch": 767} {"train_loss": -10.412355422973633, "global_step": 128891, "epoch": 767} {"train_loss": -10.287771224975586, "global_step": 128892, "epoch": 767} {"train_loss": -10.25085163116455, "global_step": 128893, "epoch": 767} {"train_loss": -10.476511001586914, "global_step": 128894, "epoch": 767} {"train_loss": -10.46855354309082, "global_step": 128895, "epoch": 767} {"train_loss": -10.503244400024414, "global_step": 128896, "epoch": 767} {"train_loss": -10.364837646484375, "global_step": 128897, "epoch": 767} {"train_loss": -10.434761047363281, "global_step": 128898, "epoch": 767} {"train_loss": -10.381058692932129, "global_step": 128899, "epoch": 767} {"train_loss": -10.177896499633789, "global_step": 128900, "epoch": 767} {"train_loss": -10.538211822509766, "global_step": 128901, "epoch": 767} {"train_loss": -10.466355323791504, "global_step": 128902, "epoch": 767} {"train_loss": -10.674400329589844, "global_step": 128903, "epoch": 767} {"train_loss": -10.2470121383667, "global_step": 128904, "epoch": 767} {"train_loss": -10.680683135986328, "global_step": 128905, "epoch": 767} {"train_loss": -10.25466251373291, "global_step": 128906, "epoch": 767} {"train_loss": -10.498296737670898, "global_step": 128907, "epoch": 767} {"train_loss": -10.431032180786133, "global_step": 128908, "epoch": 767} {"train_loss": -10.589035987854004, "global_step": 128909, "epoch": 767} {"train_loss": -10.474523544311523, "global_step": 128910, "epoch": 767} {"train_loss": -10.753244400024414, "global_step": 128911, "epoch": 767} {"train_loss": -10.682483673095703, "global_step": 128912, "epoch": 767} {"train_loss": -10.39962387084961, "global_step": 128913, "epoch": 767} {"train_loss": -10.771831512451172, "global_step": 128914, "epoch": 767} {"train_loss": -10.636354446411133, "global_step": 128915, "epoch": 767} {"train_loss": -10.293478012084961, "global_step": 128916, "epoch": 767} {"train_loss": -10.689675331115723, "global_step": 128917, "epoch": 767} {"train_loss": -10.424032211303711, "global_step": 128918, "epoch": 767} {"train_loss": -10.8189115524292, "global_step": 128919, "epoch": 767} {"train_loss": -10.56931209564209, "global_step": 128920, "epoch": 767} {"train_loss": -10.690810203552246, "global_step": 128921, "epoch": 767} {"train_loss": -10.432781219482422, "global_step": 128922, "epoch": 767} {"train_loss": -10.75963020324707, "global_step": 128923, "epoch": 767} {"train_loss": -10.737113952636719, "global_step": 128924, "epoch": 767} {"train_loss": -10.773561477661133, "global_step": 128925, "epoch": 767} {"train_loss": -10.572397232055664, "global_step": 128926, "epoch": 767} {"train_loss": -10.439861297607422, "global_step": 128927, "epoch": 767} {"train_loss": -10.183544158935547, "global_step": 128928, "epoch": 767} {"train_loss": -10.524849891662598, "global_step": 128929, "epoch": 767} {"train_loss": -10.458057403564453, "global_step": 128930, "epoch": 767} {"train_loss": -10.486129760742188, "global_step": 128931, "epoch": 767} {"train_loss": -10.421762466430664, "global_step": 128932, "epoch": 767} {"train_loss": -10.500066757202148, "global_step": 128933, "epoch": 767} {"train_loss": -10.608945846557617, "global_step": 128934, "epoch": 767} {"train_loss": -10.135201454162598, "global_step": 128935, "epoch": 767} {"train_loss": -10.232011795043945, "global_step": 128936, "epoch": 767} {"train_loss": -10.408305168151855, "global_step": 128937, "epoch": 767} {"train_loss": -10.57818603515625, "global_step": 128938, "epoch": 767} {"train_loss": -9.955153465270996, "global_step": 128939, "epoch": 767} {"train_loss": -10.235330581665039, "global_step": 128940, "epoch": 767} {"train_loss": -10.183126449584961, "global_step": 128941, "epoch": 767} {"train_loss": -10.025700569152832, "global_step": 128942, "epoch": 767} {"train_loss": -9.680801391601562, "global_step": 128943, "epoch": 767} {"train_loss": -10.192888259887695, "global_step": 128944, "epoch": 767} {"train_loss": -9.029471397399902, "global_step": 128945, "epoch": 767} {"train_loss": -10.041692733764648, "global_step": 128946, "epoch": 767} {"train_loss": -9.08992862701416, "global_step": 128947, "epoch": 767} {"train_loss": -10.24498176574707, "global_step": 128948, "epoch": 767} {"train_loss": -9.923225402832031, "global_step": 128949, "epoch": 767} {"train_loss": -10.135284423828125, "global_step": 128950, "epoch": 767} {"train_loss": -10.360605239868164, "global_step": 128951, "epoch": 767} {"train_loss": -9.85072135925293, "global_step": 128952, "epoch": 767} {"train_loss": -10.240612030029297, "global_step": 128953, "epoch": 767} {"train_loss": -10.068513870239258, "global_step": 128954, "epoch": 767} {"train_loss": -10.329216957092285, "global_step": 128955, "epoch": 767} {"train_loss": -10.048076629638672, "global_step": 128956, "epoch": 767} {"train_loss": -10.237253189086914, "global_step": 128957, "epoch": 767} {"train_loss": -10.131368637084961, "global_step": 128958, "epoch": 767} {"train_loss": -10.135994911193848, "global_step": 128959, "epoch": 767} {"train_loss": -10.586782455444336, "global_step": 128960, "epoch": 767} {"train_loss": -10.321832656860352, "global_step": 128961, "epoch": 767} {"train_loss": -10.23353385925293, "global_step": 128962, "epoch": 767} {"train_loss": -10.560564041137695, "global_step": 128963, "epoch": 767} {"train_loss": -10.242877960205078, "global_step": 128964, "epoch": 767} {"train_loss": -10.27423095703125, "global_step": 128965, "epoch": 767} {"train_loss": -10.181863784790039, "global_step": 128966, "epoch": 767} {"train_loss": -10.12881088256836, "global_step": 128967, "epoch": 767} {"train_loss": -10.131097793579102, "global_step": 128968, "epoch": 767} {"train_loss": -10.202810287475586, "global_step": 128969, "epoch": 767} {"train_loss": -10.158798217773438, "global_step": 128970, "epoch": 767} {"train_loss": -10.196735382080078, "global_step": 128971, "epoch": 767} {"train_loss": -10.21894645690918, "global_step": 128972, "epoch": 767} {"train_loss": -10.268619537353516, "global_step": 128973, "epoch": 767} {"train_loss": -10.19306468963623, "global_step": 128974, "epoch": 767} {"train_loss": -10.240240097045898, "global_step": 128975, "epoch": 767} {"train_loss": -10.38198471069336, "global_step": 128976, "epoch": 767} {"train_loss": -9.91378402709961, "global_step": 128977, "epoch": 767} {"train_loss": -10.18856430053711, "global_step": 128978, "epoch": 767} {"train_loss": -10.49085807800293, "global_step": 128979, "epoch": 767} {"train_loss": -10.170682907104492, "global_step": 128980, "epoch": 767} {"train_loss": -10.452457427978516, "global_step": 128981, "epoch": 767} {"train_loss": -10.098020553588867, "global_step": 128982, "epoch": 767} {"train_loss": -10.460716247558594, "global_step": 128983, "epoch": 767} {"train_loss": -10.144477844238281, "global_step": 128984, "epoch": 767} {"train_loss": -10.331818580627441, "global_step": 128985, "epoch": 767} {"train_loss": -10.13591480255127, "global_step": 128986, "epoch": 767} {"train_loss": -10.341468811035156, "global_step": 128987, "epoch": 767} {"train_loss": -10.41356086730957, "global_step": 128988, "epoch": 767} {"train_loss": -10.278263092041016, "global_step": 128989, "epoch": 767} {"train_loss": -10.486745834350586, "global_step": 128990, "epoch": 767} {"train_loss": -10.339224815368652, "global_step": 128991, "epoch": 767} {"train_loss": -10.561178207397461, "global_step": 128992, "epoch": 767} {"train_loss": -10.19090461730957, "global_step": 128993, "epoch": 767} {"train_loss": -10.539446830749512, "global_step": 128994, "epoch": 767} {"train_loss": -10.503019332885742, "global_step": 128995, "epoch": 767} {"train_loss": -10.575531959533691, "global_step": 128996, "epoch": 767} {"train_loss": -10.401456832885742, "global_step": 128997, "epoch": 767} {"train_loss": -10.64005184173584, "global_step": 128998, "epoch": 767} {"train_loss": -10.594654083251953, "global_step": 128999, "epoch": 767} {"train_loss": -10.321542739868164, "global_step": 129000, "epoch": 767} {"train_loss": -10.625417709350586, "global_step": 129001, "epoch": 767} {"train_loss": -10.455682754516602, "global_step": 129002, "epoch": 767} {"train_loss": -10.69369125366211, "global_step": 129003, "epoch": 767} {"train_loss": -10.625298500061035, "global_step": 129004, "epoch": 767} {"train_loss": -10.526395797729492, "global_step": 129005, "epoch": 767} {"train_loss": -10.777379989624023, "global_step": 129006, "epoch": 767} {"train_loss": -10.567314147949219, "global_step": 129007, "epoch": 767} {"train_loss": -10.792535781860352, "global_step": 129008, "epoch": 767} {"train_loss": -10.426765441894531, "global_step": 129009, "epoch": 767} {"train_loss": -10.767436981201172, "global_step": 129010, "epoch": 767} {"train_loss": -10.58931827545166, "global_step": 129011, "epoch": 767} {"train_loss": -10.501199722290039, "global_step": 129012, "epoch": 767} {"train_loss": -10.842859268188477, "global_step": 129013, "epoch": 767} {"train_loss": -10.576862335205078, "global_step": 129014, "epoch": 767} {"train_loss": -10.466672897338867, "global_step": 129015, "epoch": 767} {"train_loss": -10.435518264770508, "global_step": 129016, "epoch": 767} {"train_loss": -10.07981014251709, "global_step": 129017, "epoch": 767} {"train_loss": -9.973888397216797, "global_step": 129018, "epoch": 767} {"train_loss": -10.411983489990234, "global_step": 129019, "epoch": 767} {"train_loss": -9.921936988830566, "global_step": 129020, "epoch": 767} {"train_loss": -9.755777359008789, "global_step": 129021, "epoch": 767} {"train_loss": -9.834593772888184, "global_step": 129022, "epoch": 767} {"train_loss": -10.313087520145235, "global_step": 129023, "epoch": 767, "val_loss": 217842.953125} {"train_loss": -10.018755912780762, "global_step": 129024, "epoch": 768} {"train_loss": -9.672872543334961, "global_step": 129025, "epoch": 768} {"train_loss": -10.287428855895996, "global_step": 129026, "epoch": 768} {"train_loss": -10.035669326782227, "global_step": 129027, "epoch": 768} {"train_loss": -10.522405624389648, "global_step": 129028, "epoch": 768} {"train_loss": -10.04874038696289, "global_step": 129029, "epoch": 768} {"train_loss": -9.343249320983887, "global_step": 129030, "epoch": 768} {"train_loss": -10.235937118530273, "global_step": 129031, "epoch": 768} {"train_loss": -9.724181175231934, "global_step": 129032, "epoch": 768} {"train_loss": -9.352790832519531, "global_step": 129033, "epoch": 768} {"train_loss": -9.526289939880371, "global_step": 129034, "epoch": 768} {"train_loss": -9.754505157470703, "global_step": 129035, "epoch": 768} {"train_loss": -9.47525405883789, "global_step": 129036, "epoch": 768} {"train_loss": -10.296759605407715, "global_step": 129037, "epoch": 768} {"train_loss": -9.398965835571289, "global_step": 129038, "epoch": 768} {"train_loss": -9.85809326171875, "global_step": 129039, "epoch": 768} {"train_loss": -9.713898658752441, "global_step": 129040, "epoch": 768} {"train_loss": -9.596824645996094, "global_step": 129041, "epoch": 768} {"train_loss": -9.79265022277832, "global_step": 129042, "epoch": 768} {"train_loss": -9.831808090209961, "global_step": 129043, "epoch": 768} {"train_loss": -9.516592025756836, "global_step": 129044, "epoch": 768} {"train_loss": -9.82547378540039, "global_step": 129045, "epoch": 768} {"train_loss": -10.051366806030273, "global_step": 129046, "epoch": 768} {"train_loss": -9.749134063720703, "global_step": 129047, "epoch": 768} {"train_loss": -9.615007400512695, "global_step": 129048, "epoch": 768} {"train_loss": -10.030498504638672, "global_step": 129049, "epoch": 768} {"train_loss": -10.013544082641602, "global_step": 129050, "epoch": 768} {"train_loss": -9.837374687194824, "global_step": 129051, "epoch": 768} {"train_loss": -9.865678787231445, "global_step": 129052, "epoch": 768} {"train_loss": -10.17603874206543, "global_step": 129053, "epoch": 768} {"train_loss": -9.8641357421875, "global_step": 129054, "epoch": 768} {"train_loss": -10.250984191894531, "global_step": 129055, "epoch": 768} {"train_loss": -10.210960388183594, "global_step": 129056, "epoch": 768} {"train_loss": -9.944089889526367, "global_step": 129057, "epoch": 768} {"train_loss": -10.211813926696777, "global_step": 129058, "epoch": 768} {"train_loss": -10.394309043884277, "global_step": 129059, "epoch": 768} {"train_loss": -10.114982604980469, "global_step": 129060, "epoch": 768} {"train_loss": -10.169702529907227, "global_step": 129061, "epoch": 768} {"train_loss": -10.195345878601074, "global_step": 129062, "epoch": 768} {"train_loss": -10.410880088806152, "global_step": 129063, "epoch": 768} {"train_loss": -9.968793869018555, "global_step": 129064, "epoch": 768} {"train_loss": -10.241764068603516, "global_step": 129065, "epoch": 768} {"train_loss": -10.435133934020996, "global_step": 129066, "epoch": 768} {"train_loss": -10.237327575683594, "global_step": 129067, "epoch": 768} {"train_loss": -10.467081069946289, "global_step": 129068, "epoch": 768} {"train_loss": -10.248533248901367, "global_step": 129069, "epoch": 768} {"train_loss": -10.378591537475586, "global_step": 129070, "epoch": 768} {"train_loss": -10.301494598388672, "global_step": 129071, "epoch": 768} {"train_loss": -10.278197288513184, "global_step": 129072, "epoch": 768} {"train_loss": -10.571646690368652, "global_step": 129073, "epoch": 768} {"train_loss": -10.32368278503418, "global_step": 129074, "epoch": 768} {"train_loss": -10.488210678100586, "global_step": 129075, "epoch": 768} {"train_loss": -10.509941101074219, "global_step": 129076, "epoch": 768} {"train_loss": -10.264982223510742, "global_step": 129077, "epoch": 768} {"train_loss": -10.510931015014648, "global_step": 129078, "epoch": 768} {"train_loss": -10.539850234985352, "global_step": 129079, "epoch": 768} {"train_loss": -10.529582977294922, "global_step": 129080, "epoch": 768} {"train_loss": -10.599327087402344, "global_step": 129081, "epoch": 768} {"train_loss": -10.635259628295898, "global_step": 129082, "epoch": 768} {"train_loss": -10.641225814819336, "global_step": 129083, "epoch": 768} {"train_loss": -10.737327575683594, "global_step": 129084, "epoch": 768} {"train_loss": -10.379753112792969, "global_step": 129085, "epoch": 768} {"train_loss": -10.635122299194336, "global_step": 129086, "epoch": 768} {"train_loss": -10.469703674316406, "global_step": 129087, "epoch": 768} {"train_loss": -10.566629409790039, "global_step": 129088, "epoch": 768} {"train_loss": -10.34140396118164, "global_step": 129089, "epoch": 768} {"train_loss": -10.811674118041992, "global_step": 129090, "epoch": 768} {"train_loss": -10.445382118225098, "global_step": 129091, "epoch": 768} {"train_loss": -9.983123779296875, "global_step": 129092, "epoch": 768} {"train_loss": -10.567654609680176, "global_step": 129093, "epoch": 768} {"train_loss": -10.017792701721191, "global_step": 129094, "epoch": 768} {"train_loss": -10.197717666625977, "global_step": 129095, "epoch": 768} {"train_loss": -10.348849296569824, "global_step": 129096, "epoch": 768} {"train_loss": -10.12755012512207, "global_step": 129097, "epoch": 768} {"train_loss": -9.954444885253906, "global_step": 129098, "epoch": 768} {"train_loss": -9.87918472290039, "global_step": 129099, "epoch": 768} {"train_loss": -10.26537799835205, "global_step": 129100, "epoch": 768} {"train_loss": -9.82876205444336, "global_step": 129101, "epoch": 768} {"train_loss": -10.251935958862305, "global_step": 129102, "epoch": 768} {"train_loss": -10.178418159484863, "global_step": 129103, "epoch": 768} {"train_loss": -10.02164077758789, "global_step": 129104, "epoch": 768} {"train_loss": -10.209376335144043, "global_step": 129105, "epoch": 768} {"train_loss": -9.880074501037598, "global_step": 129106, "epoch": 768} {"train_loss": -10.28366470336914, "global_step": 129107, "epoch": 768} {"train_loss": -9.877654075622559, "global_step": 129108, "epoch": 768} {"train_loss": -10.355463981628418, "global_step": 129109, "epoch": 768} {"train_loss": -10.145818710327148, "global_step": 129110, "epoch": 768} {"train_loss": -10.288701057434082, "global_step": 129111, "epoch": 768} {"train_loss": -9.874484062194824, "global_step": 129112, "epoch": 768} {"train_loss": -10.36393928527832, "global_step": 129113, "epoch": 768} {"train_loss": -10.057559967041016, "global_step": 129114, "epoch": 768} {"train_loss": -10.469522476196289, "global_step": 129115, "epoch": 768} {"train_loss": -9.773857116699219, "global_step": 129116, "epoch": 768} {"train_loss": -10.153688430786133, "global_step": 129117, "epoch": 768} {"train_loss": -9.761824607849121, "global_step": 129118, "epoch": 768} {"train_loss": -10.435064315795898, "global_step": 129119, "epoch": 768} {"train_loss": -9.831872940063477, "global_step": 129120, "epoch": 768} {"train_loss": -10.446847915649414, "global_step": 129121, "epoch": 768} {"train_loss": -10.284290313720703, "global_step": 129122, "epoch": 768} {"train_loss": -10.411371231079102, "global_step": 129123, "epoch": 768} {"train_loss": -10.417014122009277, "global_step": 129124, "epoch": 768} {"train_loss": -10.476694107055664, "global_step": 129125, "epoch": 768} {"train_loss": -10.206914901733398, "global_step": 129126, "epoch": 768} {"train_loss": -10.468005180358887, "global_step": 129127, "epoch": 768} {"train_loss": -10.201338768005371, "global_step": 129128, "epoch": 768} {"train_loss": -10.397431373596191, "global_step": 129129, "epoch": 768} {"train_loss": -10.49881649017334, "global_step": 129130, "epoch": 768} {"train_loss": -10.39773178100586, "global_step": 129131, "epoch": 768} {"train_loss": -10.491469383239746, "global_step": 129132, "epoch": 768} {"train_loss": -10.426711082458496, "global_step": 129133, "epoch": 768} {"train_loss": -10.618167877197266, "global_step": 129134, "epoch": 768} {"train_loss": -10.58932113647461, "global_step": 129135, "epoch": 768} {"train_loss": -10.42849349975586, "global_step": 129136, "epoch": 768} {"train_loss": -10.644851684570312, "global_step": 129137, "epoch": 768} {"train_loss": -10.51040267944336, "global_step": 129138, "epoch": 768} {"train_loss": -10.628494262695312, "global_step": 129139, "epoch": 768} {"train_loss": -10.531649589538574, "global_step": 129140, "epoch": 768} {"train_loss": -10.49539852142334, "global_step": 129141, "epoch": 768} {"train_loss": -10.32525634765625, "global_step": 129142, "epoch": 768} {"train_loss": -10.548088073730469, "global_step": 129143, "epoch": 768} {"train_loss": -10.366785049438477, "global_step": 129144, "epoch": 768} {"train_loss": -10.636812210083008, "global_step": 129145, "epoch": 768} {"train_loss": -10.46900749206543, "global_step": 129146, "epoch": 768} {"train_loss": -10.285896301269531, "global_step": 129147, "epoch": 768} {"train_loss": -10.369550704956055, "global_step": 129148, "epoch": 768} {"train_loss": -10.574654579162598, "global_step": 129149, "epoch": 768} {"train_loss": -10.559600830078125, "global_step": 129150, "epoch": 768} {"train_loss": -10.442150115966797, "global_step": 129151, "epoch": 768} {"train_loss": -10.293583869934082, "global_step": 129152, "epoch": 768} {"train_loss": -10.607349395751953, "global_step": 129153, "epoch": 768} {"train_loss": -10.529647827148438, "global_step": 129154, "epoch": 768} {"train_loss": -10.264833450317383, "global_step": 129155, "epoch": 768} {"train_loss": -10.216789245605469, "global_step": 129156, "epoch": 768} {"train_loss": -10.333596229553223, "global_step": 129157, "epoch": 768} {"train_loss": -10.146402359008789, "global_step": 129158, "epoch": 768} {"train_loss": -10.095117568969727, "global_step": 129159, "epoch": 768} {"train_loss": -10.273058891296387, "global_step": 129160, "epoch": 768} {"train_loss": -9.52298355102539, "global_step": 129161, "epoch": 768} {"train_loss": -10.079300880432129, "global_step": 129162, "epoch": 768} {"train_loss": -10.55182933807373, "global_step": 129163, "epoch": 768} {"train_loss": -10.31067943572998, "global_step": 129164, "epoch": 768} {"train_loss": -10.53427505493164, "global_step": 129165, "epoch": 768} {"train_loss": -10.279691696166992, "global_step": 129166, "epoch": 768} {"train_loss": -10.518021583557129, "global_step": 129167, "epoch": 768} {"train_loss": -10.505678176879883, "global_step": 129168, "epoch": 768} {"train_loss": -10.513504028320312, "global_step": 129169, "epoch": 768} {"train_loss": -10.493422508239746, "global_step": 129170, "epoch": 768} {"train_loss": -10.537540435791016, "global_step": 129171, "epoch": 768} {"train_loss": -10.368274688720703, "global_step": 129172, "epoch": 768} {"train_loss": -10.706893920898438, "global_step": 129173, "epoch": 768} {"train_loss": -10.580578804016113, "global_step": 129174, "epoch": 768} {"train_loss": -10.432384490966797, "global_step": 129175, "epoch": 768} {"train_loss": -10.64352798461914, "global_step": 129176, "epoch": 768} {"train_loss": -10.577178001403809, "global_step": 129177, "epoch": 768} {"train_loss": -10.494950294494629, "global_step": 129178, "epoch": 768} {"train_loss": -10.435894012451172, "global_step": 129179, "epoch": 768} {"train_loss": -10.744318008422852, "global_step": 129180, "epoch": 768} {"train_loss": -10.593450546264648, "global_step": 129181, "epoch": 768} {"train_loss": -10.598915100097656, "global_step": 129182, "epoch": 768} {"train_loss": -10.614448547363281, "global_step": 129183, "epoch": 768} {"train_loss": -10.34868335723877, "global_step": 129184, "epoch": 768} {"train_loss": -10.522624969482422, "global_step": 129185, "epoch": 768} {"train_loss": -10.570945739746094, "global_step": 129186, "epoch": 768} {"train_loss": -10.462636947631836, "global_step": 129187, "epoch": 768} {"train_loss": -10.505258560180664, "global_step": 129188, "epoch": 768} {"train_loss": -10.890201568603516, "global_step": 129189, "epoch": 768} {"train_loss": -10.495386123657227, "global_step": 129190, "epoch": 768} {"train_loss": -10.265598206293015, "global_step": 129191, "epoch": 768, "val_loss": 219438.703125} {"train_loss": -10.591726303100586, "global_step": 129192, "epoch": 769} {"train_loss": -10.421220779418945, "global_step": 129193, "epoch": 769} {"train_loss": -10.499368667602539, "global_step": 129194, "epoch": 769} {"train_loss": -10.631864547729492, "global_step": 129195, "epoch": 769} {"train_loss": -10.285844802856445, "global_step": 129196, "epoch": 769} {"train_loss": -10.426361083984375, "global_step": 129197, "epoch": 769} {"train_loss": -10.740534782409668, "global_step": 129198, "epoch": 769} {"train_loss": -10.365670204162598, "global_step": 129199, "epoch": 769} {"train_loss": -10.207054138183594, "global_step": 129200, "epoch": 769} {"train_loss": -10.663165092468262, "global_step": 129201, "epoch": 769} {"train_loss": -10.145132064819336, "global_step": 129202, "epoch": 769} {"train_loss": -10.352470397949219, "global_step": 129203, "epoch": 769} {"train_loss": -10.391570091247559, "global_step": 129204, "epoch": 769} {"train_loss": -10.014668464660645, "global_step": 129205, "epoch": 769} {"train_loss": -10.201388359069824, "global_step": 129206, "epoch": 769} {"train_loss": -10.542045593261719, "global_step": 129207, "epoch": 769} {"train_loss": -10.277145385742188, "global_step": 129208, "epoch": 769} {"train_loss": -10.285900115966797, "global_step": 129209, "epoch": 769} {"train_loss": -10.292503356933594, "global_step": 129210, "epoch": 769} {"train_loss": -10.623983383178711, "global_step": 129211, "epoch": 769} {"train_loss": -10.307851791381836, "global_step": 129212, "epoch": 769} {"train_loss": -10.364723205566406, "global_step": 129213, "epoch": 769} {"train_loss": -10.463053703308105, "global_step": 129214, "epoch": 769} {"train_loss": -10.101268768310547, "global_step": 129215, "epoch": 769} {"train_loss": -9.928953170776367, "global_step": 129216, "epoch": 769} {"train_loss": -9.961837768554688, "global_step": 129217, "epoch": 769} {"train_loss": -9.579597473144531, "global_step": 129218, "epoch": 769} {"train_loss": -9.295469284057617, "global_step": 129219, "epoch": 769} {"train_loss": -10.250864028930664, "global_step": 129220, "epoch": 769} {"train_loss": -10.149106979370117, "global_step": 129221, "epoch": 769} {"train_loss": -9.922865867614746, "global_step": 129222, "epoch": 769} {"train_loss": -10.419200897216797, "global_step": 129223, "epoch": 769} {"train_loss": -9.745967864990234, "global_step": 129224, "epoch": 769} {"train_loss": -10.169303894042969, "global_step": 129225, "epoch": 769} {"train_loss": -10.227302551269531, "global_step": 129226, "epoch": 769} {"train_loss": -10.298669815063477, "global_step": 129227, "epoch": 769} {"train_loss": -9.9833402633667, "global_step": 129228, "epoch": 769} {"train_loss": -10.037416458129883, "global_step": 129229, "epoch": 769} {"train_loss": -10.069825172424316, "global_step": 129230, "epoch": 769} {"train_loss": -10.196733474731445, "global_step": 129231, "epoch": 769} {"train_loss": -9.616662979125977, "global_step": 129232, "epoch": 769} {"train_loss": -10.162656784057617, "global_step": 129233, "epoch": 769} {"train_loss": -10.274679183959961, "global_step": 129234, "epoch": 769} {"train_loss": -9.773781776428223, "global_step": 129235, "epoch": 769} {"train_loss": -10.128500938415527, "global_step": 129236, "epoch": 769} {"train_loss": -10.203763961791992, "global_step": 129237, "epoch": 769} {"train_loss": -10.103350639343262, "global_step": 129238, "epoch": 769} {"train_loss": -10.045333862304688, "global_step": 129239, "epoch": 769} {"train_loss": -10.311979293823242, "global_step": 129240, "epoch": 769} {"train_loss": -9.987060546875, "global_step": 129241, "epoch": 769} {"train_loss": -10.232102394104004, "global_step": 129242, "epoch": 769} {"train_loss": -9.947319030761719, "global_step": 129243, "epoch": 769} {"train_loss": -9.96865463256836, "global_step": 129244, "epoch": 769} {"train_loss": -10.312076568603516, "global_step": 129245, "epoch": 769} {"train_loss": -10.191347122192383, "global_step": 129246, "epoch": 769} {"train_loss": -10.134123802185059, "global_step": 129247, "epoch": 769} {"train_loss": -10.081348419189453, "global_step": 129248, "epoch": 769} {"train_loss": -9.60154914855957, "global_step": 129249, "epoch": 769} {"train_loss": -10.17961311340332, "global_step": 129250, "epoch": 769} {"train_loss": -10.109071731567383, "global_step": 129251, "epoch": 769} {"train_loss": -10.139399528503418, "global_step": 129252, "epoch": 769} {"train_loss": -10.610251426696777, "global_step": 129253, "epoch": 769} {"train_loss": -10.082252502441406, "global_step": 129254, "epoch": 769} {"train_loss": -10.175069808959961, "global_step": 129255, "epoch": 769} {"train_loss": -10.399919509887695, "global_step": 129256, "epoch": 769} {"train_loss": -10.31208610534668, "global_step": 129257, "epoch": 769} {"train_loss": -10.209808349609375, "global_step": 129258, "epoch": 769} {"train_loss": -10.380731582641602, "global_step": 129259, "epoch": 769} {"train_loss": -10.678924560546875, "global_step": 129260, "epoch": 769} {"train_loss": -10.40563678741455, "global_step": 129261, "epoch": 769} {"train_loss": -10.365161895751953, "global_step": 129262, "epoch": 769} {"train_loss": -10.486050605773926, "global_step": 129263, "epoch": 769} {"train_loss": -10.285255432128906, "global_step": 129264, "epoch": 769} {"train_loss": -10.515328407287598, "global_step": 129265, "epoch": 769} {"train_loss": -10.220766067504883, "global_step": 129266, "epoch": 769} {"train_loss": -10.465112686157227, "global_step": 129267, "epoch": 769} {"train_loss": -10.443099975585938, "global_step": 129268, "epoch": 769} {"train_loss": -10.479639053344727, "global_step": 129269, "epoch": 769} {"train_loss": -10.660577774047852, "global_step": 129270, "epoch": 769} {"train_loss": -10.576053619384766, "global_step": 129271, "epoch": 769} {"train_loss": -10.669776916503906, "global_step": 129272, "epoch": 769} {"train_loss": -10.640046119689941, "global_step": 129273, "epoch": 769} {"train_loss": -10.440776824951172, "global_step": 129274, "epoch": 769} {"train_loss": -10.685037612915039, "global_step": 129275, "epoch": 769} {"train_loss": -10.631624221801758, "global_step": 129276, "epoch": 769} {"train_loss": -10.633926391601562, "global_step": 129277, "epoch": 769} {"train_loss": -10.688802719116211, "global_step": 129278, "epoch": 769} {"train_loss": -10.50406265258789, "global_step": 129279, "epoch": 769} {"train_loss": -10.638391494750977, "global_step": 129280, "epoch": 769} {"train_loss": -10.702299118041992, "global_step": 129281, "epoch": 769} {"train_loss": -10.800765037536621, "global_step": 129282, "epoch": 769} {"train_loss": -10.501017570495605, "global_step": 129283, "epoch": 769} {"train_loss": -10.550097465515137, "global_step": 129284, "epoch": 769} {"train_loss": -10.593465805053711, "global_step": 129285, "epoch": 769} {"train_loss": -10.678491592407227, "global_step": 129286, "epoch": 769} {"train_loss": -10.73982048034668, "global_step": 129287, "epoch": 769} {"train_loss": -10.592278480529785, "global_step": 129288, "epoch": 769} {"train_loss": -10.796361923217773, "global_step": 129289, "epoch": 769} {"train_loss": -10.584436416625977, "global_step": 129290, "epoch": 769} {"train_loss": -10.563929557800293, "global_step": 129291, "epoch": 769} {"train_loss": -10.283974647521973, "global_step": 129292, "epoch": 769} {"train_loss": -10.655828475952148, "global_step": 129293, "epoch": 769} {"train_loss": -10.524436950683594, "global_step": 129294, "epoch": 769} {"train_loss": -10.087059020996094, "global_step": 129295, "epoch": 769} {"train_loss": -10.044221878051758, "global_step": 129296, "epoch": 769} {"train_loss": -10.56589126586914, "global_step": 129297, "epoch": 769} {"train_loss": -10.31095027923584, "global_step": 129298, "epoch": 769} {"train_loss": -10.116320610046387, "global_step": 129299, "epoch": 769} {"train_loss": -9.987970352172852, "global_step": 129300, "epoch": 769} {"train_loss": -10.40085506439209, "global_step": 129301, "epoch": 769} {"train_loss": -10.5609769821167, "global_step": 129302, "epoch": 769} {"train_loss": -10.576903343200684, "global_step": 129303, "epoch": 769} {"train_loss": -10.296968460083008, "global_step": 129304, "epoch": 769} {"train_loss": -10.436822891235352, "global_step": 129305, "epoch": 769} {"train_loss": -9.698400497436523, "global_step": 129306, "epoch": 769} {"train_loss": -10.17121696472168, "global_step": 129307, "epoch": 769} {"train_loss": -10.054861068725586, "global_step": 129308, "epoch": 769} {"train_loss": -10.163262367248535, "global_step": 129309, "epoch": 769} {"train_loss": -9.930992126464844, "global_step": 129310, "epoch": 769} {"train_loss": -9.536166191101074, "global_step": 129311, "epoch": 769} {"train_loss": -10.170562744140625, "global_step": 129312, "epoch": 769} {"train_loss": -9.045745849609375, "global_step": 129313, "epoch": 769} {"train_loss": -9.765212059020996, "global_step": 129314, "epoch": 769} {"train_loss": -10.002941131591797, "global_step": 129315, "epoch": 769} {"train_loss": -9.576601028442383, "global_step": 129316, "epoch": 769} {"train_loss": -10.071033477783203, "global_step": 129317, "epoch": 769} {"train_loss": -9.967082977294922, "global_step": 129318, "epoch": 769} {"train_loss": -9.44888687133789, "global_step": 129319, "epoch": 769} {"train_loss": -9.848673820495605, "global_step": 129320, "epoch": 769} {"train_loss": -9.815397262573242, "global_step": 129321, "epoch": 769} {"train_loss": -10.131301879882812, "global_step": 129322, "epoch": 769} {"train_loss": -9.874377250671387, "global_step": 129323, "epoch": 769} {"train_loss": -10.195159912109375, "global_step": 129324, "epoch": 769} {"train_loss": -10.008783340454102, "global_step": 129325, "epoch": 769} {"train_loss": -10.2022705078125, "global_step": 129326, "epoch": 769} {"train_loss": -10.162309646606445, "global_step": 129327, "epoch": 769} {"train_loss": -10.146023750305176, "global_step": 129328, "epoch": 769} {"train_loss": -10.103042602539062, "global_step": 129329, "epoch": 769} {"train_loss": -10.338703155517578, "global_step": 129330, "epoch": 769} {"train_loss": -10.112698554992676, "global_step": 129331, "epoch": 769} {"train_loss": -10.191522598266602, "global_step": 129332, "epoch": 769} {"train_loss": -10.316247940063477, "global_step": 129333, "epoch": 769} {"train_loss": -10.202679634094238, "global_step": 129334, "epoch": 769} {"train_loss": -10.353580474853516, "global_step": 129335, "epoch": 769} {"train_loss": -10.085205078125, "global_step": 129336, "epoch": 769} {"train_loss": -10.29475212097168, "global_step": 129337, "epoch": 769} {"train_loss": -10.544736862182617, "global_step": 129338, "epoch": 769} {"train_loss": -10.289772033691406, "global_step": 129339, "epoch": 769} {"train_loss": -10.502580642700195, "global_step": 129340, "epoch": 769} {"train_loss": -10.355833053588867, "global_step": 129341, "epoch": 769} {"train_loss": -10.622941970825195, "global_step": 129342, "epoch": 769} {"train_loss": -10.387398719787598, "global_step": 129343, "epoch": 769} {"train_loss": -10.424995422363281, "global_step": 129344, "epoch": 769} {"train_loss": -10.129647254943848, "global_step": 129345, "epoch": 769} {"train_loss": -10.536216735839844, "global_step": 129346, "epoch": 769} {"train_loss": -10.199304580688477, "global_step": 129347, "epoch": 769} {"train_loss": -10.469175338745117, "global_step": 129348, "epoch": 769} {"train_loss": -10.443822860717773, "global_step": 129349, "epoch": 769} {"train_loss": -10.695394515991211, "global_step": 129350, "epoch": 769} {"train_loss": -10.603078842163086, "global_step": 129351, "epoch": 769} {"train_loss": -10.460412979125977, "global_step": 129352, "epoch": 769} {"train_loss": -10.547802925109863, "global_step": 129353, "epoch": 769} {"train_loss": -10.438129425048828, "global_step": 129354, "epoch": 769} {"train_loss": -10.606827735900879, "global_step": 129355, "epoch": 769} {"train_loss": -10.739665031433105, "global_step": 129356, "epoch": 769} {"train_loss": -10.629487991333008, "global_step": 129357, "epoch": 769} {"train_loss": -10.386816024780273, "global_step": 129358, "epoch": 769} {"train_loss": -10.276783948852902, "global_step": 129359, "epoch": 769, "val_loss": 219408.234375} {"train_loss": -10.692249298095703, "global_step": 129360, "epoch": 770} {"train_loss": -10.710134506225586, "global_step": 129361, "epoch": 770} {"train_loss": -10.681194305419922, "global_step": 129362, "epoch": 770} {"train_loss": -10.548261642456055, "global_step": 129363, "epoch": 770} {"train_loss": -10.479127883911133, "global_step": 129364, "epoch": 770} {"train_loss": -10.68960189819336, "global_step": 129365, "epoch": 770} {"train_loss": -10.646598815917969, "global_step": 129366, "epoch": 770} {"train_loss": -10.528993606567383, "global_step": 129367, "epoch": 770} {"train_loss": -10.724575996398926, "global_step": 129368, "epoch": 770} {"train_loss": -10.666070938110352, "global_step": 129369, "epoch": 770} {"train_loss": -10.337520599365234, "global_step": 129370, "epoch": 770} {"train_loss": -10.729127883911133, "global_step": 129371, "epoch": 770} {"train_loss": -10.399835586547852, "global_step": 129372, "epoch": 770} {"train_loss": -10.604278564453125, "global_step": 129373, "epoch": 770} {"train_loss": -10.27114486694336, "global_step": 129374, "epoch": 770} {"train_loss": -10.419517517089844, "global_step": 129375, "epoch": 770} {"train_loss": -10.202670097351074, "global_step": 129376, "epoch": 770} {"train_loss": -10.492609024047852, "global_step": 129377, "epoch": 770} {"train_loss": -9.9886474609375, "global_step": 129378, "epoch": 770} {"train_loss": -10.385356903076172, "global_step": 129379, "epoch": 770} {"train_loss": -10.009862899780273, "global_step": 129380, "epoch": 770} {"train_loss": -9.786556243896484, "global_step": 129381, "epoch": 770} {"train_loss": -10.438493728637695, "global_step": 129382, "epoch": 770} {"train_loss": -9.476606369018555, "global_step": 129383, "epoch": 770} {"train_loss": -10.027654647827148, "global_step": 129384, "epoch": 770} {"train_loss": -10.266633987426758, "global_step": 129385, "epoch": 770} {"train_loss": -9.058683395385742, "global_step": 129386, "epoch": 770} {"train_loss": -9.687813758850098, "global_step": 129387, "epoch": 770} {"train_loss": -8.982206344604492, "global_step": 129388, "epoch": 770} {"train_loss": -8.2025785446167, "global_step": 129389, "epoch": 770} {"train_loss": -8.527456283569336, "global_step": 129390, "epoch": 770} {"train_loss": -8.917707443237305, "global_step": 129391, "epoch": 770} {"train_loss": -7.979543209075928, "global_step": 129392, "epoch": 770} {"train_loss": -9.212759971618652, "global_step": 129393, "epoch": 770} {"train_loss": -8.9760160446167, "global_step": 129394, "epoch": 770} {"train_loss": -8.79200553894043, "global_step": 129395, "epoch": 770} {"train_loss": -9.17870044708252, "global_step": 129396, "epoch": 770} {"train_loss": -9.587217330932617, "global_step": 129397, "epoch": 770} {"train_loss": -9.138266563415527, "global_step": 129398, "epoch": 770} {"train_loss": -9.541316986083984, "global_step": 129399, "epoch": 770} {"train_loss": -9.09619140625, "global_step": 129400, "epoch": 770} {"train_loss": -9.365167617797852, "global_step": 129401, "epoch": 770} {"train_loss": -9.435216903686523, "global_step": 129402, "epoch": 770} {"train_loss": -9.28050422668457, "global_step": 129403, "epoch": 770} {"train_loss": -9.687045097351074, "global_step": 129404, "epoch": 770} {"train_loss": -9.450035095214844, "global_step": 129405, "epoch": 770} {"train_loss": -9.553095817565918, "global_step": 129406, "epoch": 770} {"train_loss": -9.766456604003906, "global_step": 129407, "epoch": 770} {"train_loss": -9.330028533935547, "global_step": 129408, "epoch": 770} {"train_loss": -9.618623733520508, "global_step": 129409, "epoch": 770} {"train_loss": -9.795970916748047, "global_step": 129410, "epoch": 770} {"train_loss": -9.952792167663574, "global_step": 129411, "epoch": 770} {"train_loss": -9.901646614074707, "global_step": 129412, "epoch": 770} {"train_loss": -9.935749053955078, "global_step": 129413, "epoch": 770} {"train_loss": -9.892562866210938, "global_step": 129414, "epoch": 770} {"train_loss": -9.87356948852539, "global_step": 129415, "epoch": 770} {"train_loss": -9.952930450439453, "global_step": 129416, "epoch": 770} {"train_loss": -9.743490219116211, "global_step": 129417, "epoch": 770} {"train_loss": -9.888921737670898, "global_step": 129418, "epoch": 770} {"train_loss": -10.071064949035645, "global_step": 129419, "epoch": 770} {"train_loss": -10.004096984863281, "global_step": 129420, "epoch": 770} {"train_loss": -9.953458786010742, "global_step": 129421, "epoch": 770} {"train_loss": -10.050752639770508, "global_step": 129422, "epoch": 770} {"train_loss": -9.958223342895508, "global_step": 129423, "epoch": 770} {"train_loss": -10.132999420166016, "global_step": 129424, "epoch": 770} {"train_loss": -10.131941795349121, "global_step": 129425, "epoch": 770} {"train_loss": -10.155177116394043, "global_step": 129426, "epoch": 770} {"train_loss": -10.262310028076172, "global_step": 129427, "epoch": 770} {"train_loss": -10.237844467163086, "global_step": 129428, "epoch": 770} {"train_loss": -10.306118965148926, "global_step": 129429, "epoch": 770} {"train_loss": -10.187417984008789, "global_step": 129430, "epoch": 770} {"train_loss": -10.443603515625, "global_step": 129431, "epoch": 770} {"train_loss": -10.226520538330078, "global_step": 129432, "epoch": 770} {"train_loss": -10.336368560791016, "global_step": 129433, "epoch": 770} {"train_loss": -10.209844589233398, "global_step": 129434, "epoch": 770} {"train_loss": -10.398956298828125, "global_step": 129435, "epoch": 770} {"train_loss": -10.39298152923584, "global_step": 129436, "epoch": 770} {"train_loss": -10.551177978515625, "global_step": 129437, "epoch": 770} {"train_loss": -10.505569458007812, "global_step": 129438, "epoch": 770} {"train_loss": -10.520269393920898, "global_step": 129439, "epoch": 770} {"train_loss": -10.537393569946289, "global_step": 129440, "epoch": 770} {"train_loss": -10.493477821350098, "global_step": 129441, "epoch": 770} {"train_loss": -10.586236000061035, "global_step": 129442, "epoch": 770} {"train_loss": -10.613874435424805, "global_step": 129443, "epoch": 770} {"train_loss": -10.489177703857422, "global_step": 129444, "epoch": 770} {"train_loss": -10.640636444091797, "global_step": 129445, "epoch": 770} {"train_loss": -10.676864624023438, "global_step": 129446, "epoch": 770} {"train_loss": -10.420659065246582, "global_step": 129447, "epoch": 770} {"train_loss": -10.324710845947266, "global_step": 129448, "epoch": 770} {"train_loss": -10.512958526611328, "global_step": 129449, "epoch": 770} {"train_loss": -10.725147247314453, "global_step": 129450, "epoch": 770} {"train_loss": -10.713590621948242, "global_step": 129451, "epoch": 770} {"train_loss": -10.546927452087402, "global_step": 129452, "epoch": 770} {"train_loss": -10.589875221252441, "global_step": 129453, "epoch": 770} {"train_loss": -10.671487808227539, "global_step": 129454, "epoch": 770} {"train_loss": -10.6202974319458, "global_step": 129455, "epoch": 770} {"train_loss": -10.657709121704102, "global_step": 129456, "epoch": 770} {"train_loss": -10.729415893554688, "global_step": 129457, "epoch": 770} {"train_loss": -10.73805046081543, "global_step": 129458, "epoch": 770} {"train_loss": -10.65767765045166, "global_step": 129459, "epoch": 770} {"train_loss": -10.68675708770752, "global_step": 129460, "epoch": 770} {"train_loss": -10.314075469970703, "global_step": 129461, "epoch": 770} {"train_loss": -10.710702896118164, "global_step": 129462, "epoch": 770} {"train_loss": -10.262928009033203, "global_step": 129463, "epoch": 770} {"train_loss": -10.416667938232422, "global_step": 129464, "epoch": 770} {"train_loss": -10.159832000732422, "global_step": 129465, "epoch": 770} {"train_loss": -10.748580932617188, "global_step": 129466, "epoch": 770} {"train_loss": -9.795104026794434, "global_step": 129467, "epoch": 770} {"train_loss": -10.30009651184082, "global_step": 129468, "epoch": 770} {"train_loss": -10.243436813354492, "global_step": 129469, "epoch": 770} {"train_loss": -9.53518295288086, "global_step": 129470, "epoch": 770} {"train_loss": -10.640485763549805, "global_step": 129471, "epoch": 770} {"train_loss": -9.292376518249512, "global_step": 129472, "epoch": 770} {"train_loss": -9.964759826660156, "global_step": 129473, "epoch": 770} {"train_loss": -9.396892547607422, "global_step": 129474, "epoch": 770} {"train_loss": -9.25416374206543, "global_step": 129475, "epoch": 770} {"train_loss": -9.230844497680664, "global_step": 129476, "epoch": 770} {"train_loss": -9.702880859375, "global_step": 129477, "epoch": 770} {"train_loss": -9.707359313964844, "global_step": 129478, "epoch": 770} {"train_loss": -9.524954795837402, "global_step": 129479, "epoch": 770} {"train_loss": -9.623498916625977, "global_step": 129480, "epoch": 770} {"train_loss": -9.373929023742676, "global_step": 129481, "epoch": 770} {"train_loss": -10.154317855834961, "global_step": 129482, "epoch": 770} {"train_loss": -9.165566444396973, "global_step": 129483, "epoch": 770} {"train_loss": -9.56584358215332, "global_step": 129484, "epoch": 770} {"train_loss": -9.904452323913574, "global_step": 129485, "epoch": 770} {"train_loss": -9.4779052734375, "global_step": 129486, "epoch": 770} {"train_loss": -9.591548919677734, "global_step": 129487, "epoch": 770} {"train_loss": -9.757261276245117, "global_step": 129488, "epoch": 770} {"train_loss": -9.620168685913086, "global_step": 129489, "epoch": 770} {"train_loss": -9.731988906860352, "global_step": 129490, "epoch": 770} {"train_loss": -9.781085968017578, "global_step": 129491, "epoch": 770} {"train_loss": -10.039092063903809, "global_step": 129492, "epoch": 770} {"train_loss": -9.798637390136719, "global_step": 129493, "epoch": 770} {"train_loss": -10.146992683410645, "global_step": 129494, "epoch": 770} {"train_loss": -10.0930757522583, "global_step": 129495, "epoch": 770} {"train_loss": -9.982561111450195, "global_step": 129496, "epoch": 770} {"train_loss": -10.035324096679688, "global_step": 129497, "epoch": 770} {"train_loss": -9.939770698547363, "global_step": 129498, "epoch": 770} {"train_loss": -10.264431953430176, "global_step": 129499, "epoch": 770} {"train_loss": -10.143003463745117, "global_step": 129500, "epoch": 770} {"train_loss": -10.116167068481445, "global_step": 129501, "epoch": 770} {"train_loss": -10.089787483215332, "global_step": 129502, "epoch": 770} {"train_loss": -10.016494750976562, "global_step": 129503, "epoch": 770} {"train_loss": -9.965670585632324, "global_step": 129504, "epoch": 770} {"train_loss": -10.25049877166748, "global_step": 129505, "epoch": 770} {"train_loss": -10.410812377929688, "global_step": 129506, "epoch": 770} {"train_loss": -10.041793823242188, "global_step": 129507, "epoch": 770} {"train_loss": -10.416725158691406, "global_step": 129508, "epoch": 770} {"train_loss": -10.315038681030273, "global_step": 129509, "epoch": 770} {"train_loss": -10.024835586547852, "global_step": 129510, "epoch": 770} {"train_loss": -10.351617813110352, "global_step": 129511, "epoch": 770} {"train_loss": -10.270134925842285, "global_step": 129512, "epoch": 770} {"train_loss": -10.352535247802734, "global_step": 129513, "epoch": 770} {"train_loss": -10.377459526062012, "global_step": 129514, "epoch": 770} {"train_loss": -10.541768074035645, "global_step": 129515, "epoch": 770} {"train_loss": -10.470766067504883, "global_step": 129516, "epoch": 770} {"train_loss": -10.475688934326172, "global_step": 129517, "epoch": 770} {"train_loss": -10.522749900817871, "global_step": 129518, "epoch": 770} {"train_loss": -10.718901634216309, "global_step": 129519, "epoch": 770} {"train_loss": -10.580070495605469, "global_step": 129520, "epoch": 770} {"train_loss": -10.345134735107422, "global_step": 129521, "epoch": 770} {"train_loss": -10.485774993896484, "global_step": 129522, "epoch": 770} {"train_loss": -10.6673583984375, "global_step": 129523, "epoch": 770} {"train_loss": -10.441248893737793, "global_step": 129524, "epoch": 770} {"train_loss": -10.616734504699707, "global_step": 129525, "epoch": 770} {"train_loss": -10.71424674987793, "global_step": 129526, "epoch": 770} {"train_loss": -10.076056148324694, "global_step": 129527, "epoch": 770, "val_loss": 220011.265625, "train_action_mse_error": 1.8352549076080322} {"train_loss": -10.616067886352539, "global_step": 129528, "epoch": 771} {"train_loss": -10.622782707214355, "global_step": 129529, "epoch": 771} {"train_loss": -10.432600021362305, "global_step": 129530, "epoch": 771} {"train_loss": -10.656692504882812, "global_step": 129531, "epoch": 771} {"train_loss": -10.458630561828613, "global_step": 129532, "epoch": 771} {"train_loss": -10.701297760009766, "global_step": 129533, "epoch": 771} {"train_loss": -10.664192199707031, "global_step": 129534, "epoch": 771} {"train_loss": -10.765059471130371, "global_step": 129535, "epoch": 771} {"train_loss": -10.538763046264648, "global_step": 129536, "epoch": 771} {"train_loss": -10.907890319824219, "global_step": 129537, "epoch": 771} {"train_loss": -10.451157569885254, "global_step": 129538, "epoch": 771} {"train_loss": -10.451671600341797, "global_step": 129539, "epoch": 771} {"train_loss": -10.60171890258789, "global_step": 129540, "epoch": 771} {"train_loss": -10.580020904541016, "global_step": 129541, "epoch": 771} {"train_loss": -10.816949844360352, "global_step": 129542, "epoch": 771} {"train_loss": -10.736927032470703, "global_step": 129543, "epoch": 771} {"train_loss": -10.685689926147461, "global_step": 129544, "epoch": 771} {"train_loss": -10.734203338623047, "global_step": 129545, "epoch": 771} {"train_loss": -10.616779327392578, "global_step": 129546, "epoch": 771} {"train_loss": -10.274882316589355, "global_step": 129547, "epoch": 771} {"train_loss": -10.416238784790039, "global_step": 129548, "epoch": 771} {"train_loss": -10.839886665344238, "global_step": 129549, "epoch": 771} {"train_loss": -10.35781478881836, "global_step": 129550, "epoch": 771} {"train_loss": -10.385379791259766, "global_step": 129551, "epoch": 771} {"train_loss": -10.56545639038086, "global_step": 129552, "epoch": 771} {"train_loss": -10.34128189086914, "global_step": 129553, "epoch": 771} {"train_loss": -10.506410598754883, "global_step": 129554, "epoch": 771} {"train_loss": -10.619613647460938, "global_step": 129555, "epoch": 771} {"train_loss": -10.574295997619629, "global_step": 129556, "epoch": 771} {"train_loss": -10.442794799804688, "global_step": 129557, "epoch": 771} {"train_loss": -10.057798385620117, "global_step": 129558, "epoch": 771} {"train_loss": -9.873588562011719, "global_step": 129559, "epoch": 771} {"train_loss": -10.196471214294434, "global_step": 129560, "epoch": 771} {"train_loss": -10.035257339477539, "global_step": 129561, "epoch": 771} {"train_loss": -9.381869316101074, "global_step": 129562, "epoch": 771} {"train_loss": -10.252279281616211, "global_step": 129563, "epoch": 771} {"train_loss": -9.780311584472656, "global_step": 129564, "epoch": 771} {"train_loss": -10.101237297058105, "global_step": 129565, "epoch": 771} {"train_loss": -10.094494819641113, "global_step": 129566, "epoch": 771} {"train_loss": -9.947895050048828, "global_step": 129567, "epoch": 771} {"train_loss": -10.224587440490723, "global_step": 129568, "epoch": 771} {"train_loss": -10.392916679382324, "global_step": 129569, "epoch": 771} {"train_loss": -9.860240936279297, "global_step": 129570, "epoch": 771} {"train_loss": -10.293075561523438, "global_step": 129571, "epoch": 771} {"train_loss": -9.599393844604492, "global_step": 129572, "epoch": 771} {"train_loss": -10.48558521270752, "global_step": 129573, "epoch": 771} {"train_loss": -9.851275444030762, "global_step": 129574, "epoch": 771} {"train_loss": -10.026912689208984, "global_step": 129575, "epoch": 771} {"train_loss": -10.271751403808594, "global_step": 129576, "epoch": 771} {"train_loss": -9.963310241699219, "global_step": 129577, "epoch": 771} {"train_loss": -10.193479537963867, "global_step": 129578, "epoch": 771} {"train_loss": -9.775737762451172, "global_step": 129579, "epoch": 771} {"train_loss": -10.434184074401855, "global_step": 129580, "epoch": 771} {"train_loss": -9.962560653686523, "global_step": 129581, "epoch": 771} {"train_loss": -10.426400184631348, "global_step": 129582, "epoch": 771} {"train_loss": -10.355146408081055, "global_step": 129583, "epoch": 771} {"train_loss": -10.442794799804688, "global_step": 129584, "epoch": 771} {"train_loss": -10.331426620483398, "global_step": 129585, "epoch": 771} {"train_loss": -10.239139556884766, "global_step": 129586, "epoch": 771} {"train_loss": -10.286232948303223, "global_step": 129587, "epoch": 771} {"train_loss": -10.598007202148438, "global_step": 129588, "epoch": 771} {"train_loss": -10.29621696472168, "global_step": 129589, "epoch": 771} {"train_loss": -10.311413764953613, "global_step": 129590, "epoch": 771} {"train_loss": -10.2510986328125, "global_step": 129591, "epoch": 771} {"train_loss": -10.307634353637695, "global_step": 129592, "epoch": 771} {"train_loss": -10.656193733215332, "global_step": 129593, "epoch": 771} {"train_loss": -10.313993453979492, "global_step": 129594, "epoch": 771} {"train_loss": -10.240790367126465, "global_step": 129595, "epoch": 771} {"train_loss": -10.125274658203125, "global_step": 129596, "epoch": 771} {"train_loss": -10.391969680786133, "global_step": 129597, "epoch": 771} {"train_loss": -10.488761901855469, "global_step": 129598, "epoch": 771} {"train_loss": -10.129128456115723, "global_step": 129599, "epoch": 771} {"train_loss": -10.678739547729492, "global_step": 129600, "epoch": 771} {"train_loss": -10.459501266479492, "global_step": 129601, "epoch": 771} {"train_loss": -10.437917709350586, "global_step": 129602, "epoch": 771} {"train_loss": -10.48820686340332, "global_step": 129603, "epoch": 771} {"train_loss": -10.541177749633789, "global_step": 129604, "epoch": 771} {"train_loss": -10.663990020751953, "global_step": 129605, "epoch": 771} {"train_loss": -10.583489418029785, "global_step": 129606, "epoch": 771} {"train_loss": -10.577549934387207, "global_step": 129607, "epoch": 771} {"train_loss": -10.524438858032227, "global_step": 129608, "epoch": 771} {"train_loss": -10.553023338317871, "global_step": 129609, "epoch": 771} {"train_loss": -10.333930015563965, "global_step": 129610, "epoch": 771} {"train_loss": -10.372550964355469, "global_step": 129611, "epoch": 771} {"train_loss": -10.519708633422852, "global_step": 129612, "epoch": 771} {"train_loss": -10.483657836914062, "global_step": 129613, "epoch": 771} {"train_loss": -10.23660659790039, "global_step": 129614, "epoch": 771} {"train_loss": -10.619294166564941, "global_step": 129615, "epoch": 771} {"train_loss": -10.323554992675781, "global_step": 129616, "epoch": 771} {"train_loss": -10.346891403198242, "global_step": 129617, "epoch": 771} {"train_loss": -10.417763710021973, "global_step": 129618, "epoch": 771} {"train_loss": -10.314733505249023, "global_step": 129619, "epoch": 771} {"train_loss": -10.478930473327637, "global_step": 129620, "epoch": 771} {"train_loss": -10.242202758789062, "global_step": 129621, "epoch": 771} {"train_loss": -10.276063919067383, "global_step": 129622, "epoch": 771} {"train_loss": -10.430203437805176, "global_step": 129623, "epoch": 771} {"train_loss": -10.194856643676758, "global_step": 129624, "epoch": 771} {"train_loss": -10.126360893249512, "global_step": 129625, "epoch": 771} {"train_loss": -10.560653686523438, "global_step": 129626, "epoch": 771} {"train_loss": -10.176671981811523, "global_step": 129627, "epoch": 771} {"train_loss": -10.513568878173828, "global_step": 129628, "epoch": 771} {"train_loss": -10.248419761657715, "global_step": 129629, "epoch": 771} {"train_loss": -10.273950576782227, "global_step": 129630, "epoch": 771} {"train_loss": -10.375286102294922, "global_step": 129631, "epoch": 771} {"train_loss": -10.247050285339355, "global_step": 129632, "epoch": 771} {"train_loss": -10.210492134094238, "global_step": 129633, "epoch": 771} {"train_loss": -10.480668067932129, "global_step": 129634, "epoch": 771} {"train_loss": -10.242748260498047, "global_step": 129635, "epoch": 771} {"train_loss": -10.186548233032227, "global_step": 129636, "epoch": 771} {"train_loss": -10.380767822265625, "global_step": 129637, "epoch": 771} {"train_loss": -10.184988021850586, "global_step": 129638, "epoch": 771} {"train_loss": -10.14553165435791, "global_step": 129639, "epoch": 771} {"train_loss": -9.841599464416504, "global_step": 129640, "epoch": 771} {"train_loss": -9.99343490600586, "global_step": 129641, "epoch": 771} {"train_loss": -10.347183227539062, "global_step": 129642, "epoch": 771} {"train_loss": -10.133539199829102, "global_step": 129643, "epoch": 771} {"train_loss": -10.186342239379883, "global_step": 129644, "epoch": 771} {"train_loss": -10.233028411865234, "global_step": 129645, "epoch": 771} {"train_loss": -10.063056945800781, "global_step": 129646, "epoch": 771} {"train_loss": -9.497697830200195, "global_step": 129647, "epoch": 771} {"train_loss": -10.219307899475098, "global_step": 129648, "epoch": 771} {"train_loss": -10.071060180664062, "global_step": 129649, "epoch": 771} {"train_loss": -9.581881523132324, "global_step": 129650, "epoch": 771} {"train_loss": -9.599263191223145, "global_step": 129651, "epoch": 771} {"train_loss": -10.16430950164795, "global_step": 129652, "epoch": 771} {"train_loss": -9.711576461791992, "global_step": 129653, "epoch": 771} {"train_loss": -10.230608940124512, "global_step": 129654, "epoch": 771} {"train_loss": -9.999364852905273, "global_step": 129655, "epoch": 771} {"train_loss": -10.215003967285156, "global_step": 129656, "epoch": 771} {"train_loss": -10.231538772583008, "global_step": 129657, "epoch": 771} {"train_loss": -10.330162048339844, "global_step": 129658, "epoch": 771} {"train_loss": -10.202422142028809, "global_step": 129659, "epoch": 771} {"train_loss": -10.079818725585938, "global_step": 129660, "epoch": 771} {"train_loss": -10.092801094055176, "global_step": 129661, "epoch": 771} {"train_loss": -10.21252155303955, "global_step": 129662, "epoch": 771} {"train_loss": -10.241676330566406, "global_step": 129663, "epoch": 771} {"train_loss": -10.087409973144531, "global_step": 129664, "epoch": 771} {"train_loss": -10.242834091186523, "global_step": 129665, "epoch": 771} {"train_loss": -10.472002983093262, "global_step": 129666, "epoch": 771} {"train_loss": -10.025760650634766, "global_step": 129667, "epoch": 771} {"train_loss": -10.308777809143066, "global_step": 129668, "epoch": 771} {"train_loss": -10.405610084533691, "global_step": 129669, "epoch": 771} {"train_loss": -10.214071273803711, "global_step": 129670, "epoch": 771} {"train_loss": -10.438909530639648, "global_step": 129671, "epoch": 771} {"train_loss": -10.424137115478516, "global_step": 129672, "epoch": 771} {"train_loss": -10.287540435791016, "global_step": 129673, "epoch": 771} {"train_loss": -10.514436721801758, "global_step": 129674, "epoch": 771} {"train_loss": -10.321642875671387, "global_step": 129675, "epoch": 771} {"train_loss": -10.487489700317383, "global_step": 129676, "epoch": 771} {"train_loss": -10.418191909790039, "global_step": 129677, "epoch": 771} {"train_loss": -10.528900146484375, "global_step": 129678, "epoch": 771} {"train_loss": -10.687541961669922, "global_step": 129679, "epoch": 771} {"train_loss": -10.564857482910156, "global_step": 129680, "epoch": 771} {"train_loss": -10.37387752532959, "global_step": 129681, "epoch": 771} {"train_loss": -10.622694969177246, "global_step": 129682, "epoch": 771} {"train_loss": -10.598926544189453, "global_step": 129683, "epoch": 771} {"train_loss": -10.274919509887695, "global_step": 129684, "epoch": 771} {"train_loss": -10.38231086730957, "global_step": 129685, "epoch": 771} {"train_loss": -10.405014038085938, "global_step": 129686, "epoch": 771} {"train_loss": -10.435932159423828, "global_step": 129687, "epoch": 771} {"train_loss": -10.695276260375977, "global_step": 129688, "epoch": 771} {"train_loss": -10.539276123046875, "global_step": 129689, "epoch": 771} {"train_loss": -10.68511962890625, "global_step": 129690, "epoch": 771} {"train_loss": -10.842004776000977, "global_step": 129691, "epoch": 771} {"train_loss": -10.85645866394043, "global_step": 129692, "epoch": 771} {"train_loss": -10.442705154418945, "global_step": 129693, "epoch": 771} {"train_loss": -10.243270874023438, "global_step": 129694, "epoch": 771} {"train_loss": -10.333046731494722, "global_step": 129695, "epoch": 771, "val_loss": 220019.84375} {"train_loss": -10.573006629943848, "global_step": 129696, "epoch": 772} {"train_loss": -10.237775802612305, "global_step": 129697, "epoch": 772} {"train_loss": -10.509417533874512, "global_step": 129698, "epoch": 772} {"train_loss": -10.717344284057617, "global_step": 129699, "epoch": 772} {"train_loss": -10.398943901062012, "global_step": 129700, "epoch": 772} {"train_loss": -10.474176406860352, "global_step": 129701, "epoch": 772} {"train_loss": -10.268960952758789, "global_step": 129702, "epoch": 772} {"train_loss": -10.571371078491211, "global_step": 129703, "epoch": 772} {"train_loss": -10.455193519592285, "global_step": 129704, "epoch": 772} {"train_loss": -10.06264591217041, "global_step": 129705, "epoch": 772} {"train_loss": -10.32148551940918, "global_step": 129706, "epoch": 772} {"train_loss": -10.202554702758789, "global_step": 129707, "epoch": 772} {"train_loss": -10.324087142944336, "global_step": 129708, "epoch": 772} {"train_loss": -10.334501266479492, "global_step": 129709, "epoch": 772} {"train_loss": -10.482852935791016, "global_step": 129710, "epoch": 772} {"train_loss": -10.411519050598145, "global_step": 129711, "epoch": 772} {"train_loss": -10.348397254943848, "global_step": 129712, "epoch": 772} {"train_loss": -10.277528762817383, "global_step": 129713, "epoch": 772} {"train_loss": -10.298799514770508, "global_step": 129714, "epoch": 772} {"train_loss": -10.35871696472168, "global_step": 129715, "epoch": 772} {"train_loss": -10.741907119750977, "global_step": 129716, "epoch": 772} {"train_loss": -10.429773330688477, "global_step": 129717, "epoch": 772} {"train_loss": -10.870636940002441, "global_step": 129718, "epoch": 772} {"train_loss": -10.577681541442871, "global_step": 129719, "epoch": 772} {"train_loss": -10.27851390838623, "global_step": 129720, "epoch": 772} {"train_loss": -10.500974655151367, "global_step": 129721, "epoch": 772} {"train_loss": -10.329164505004883, "global_step": 129722, "epoch": 772} {"train_loss": -10.324196815490723, "global_step": 129723, "epoch": 772} {"train_loss": -10.463125228881836, "global_step": 129724, "epoch": 772} {"train_loss": -10.007928848266602, "global_step": 129725, "epoch": 772} {"train_loss": -10.49390983581543, "global_step": 129726, "epoch": 772} {"train_loss": -10.331501007080078, "global_step": 129727, "epoch": 772} {"train_loss": -10.26300048828125, "global_step": 129728, "epoch": 772} {"train_loss": -10.382104873657227, "global_step": 129729, "epoch": 772} {"train_loss": -10.21431827545166, "global_step": 129730, "epoch": 772} {"train_loss": -10.4686279296875, "global_step": 129731, "epoch": 772} {"train_loss": -10.305294036865234, "global_step": 129732, "epoch": 772} {"train_loss": -10.484455108642578, "global_step": 129733, "epoch": 772} {"train_loss": -10.454475402832031, "global_step": 129734, "epoch": 772} {"train_loss": -10.407783508300781, "global_step": 129735, "epoch": 772} {"train_loss": -10.675519943237305, "global_step": 129736, "epoch": 772} {"train_loss": -10.509830474853516, "global_step": 129737, "epoch": 772} {"train_loss": -10.451879501342773, "global_step": 129738, "epoch": 772} {"train_loss": -10.296113967895508, "global_step": 129739, "epoch": 772} {"train_loss": -10.649958610534668, "global_step": 129740, "epoch": 772} {"train_loss": -10.18861198425293, "global_step": 129741, "epoch": 772} {"train_loss": -10.262487411499023, "global_step": 129742, "epoch": 772} {"train_loss": -10.216939926147461, "global_step": 129743, "epoch": 772} {"train_loss": -10.327768325805664, "global_step": 129744, "epoch": 772} {"train_loss": -10.412355422973633, "global_step": 129745, "epoch": 772} {"train_loss": -10.240859985351562, "global_step": 129746, "epoch": 772} {"train_loss": -10.144001007080078, "global_step": 129747, "epoch": 772} {"train_loss": -9.986741065979004, "global_step": 129748, "epoch": 772} {"train_loss": -10.082416534423828, "global_step": 129749, "epoch": 772} {"train_loss": -10.458549499511719, "global_step": 129750, "epoch": 772} {"train_loss": -10.3866605758667, "global_step": 129751, "epoch": 772} {"train_loss": -10.395756721496582, "global_step": 129752, "epoch": 772} {"train_loss": -10.399585723876953, "global_step": 129753, "epoch": 772} {"train_loss": -10.5278902053833, "global_step": 129754, "epoch": 772} {"train_loss": -10.348260879516602, "global_step": 129755, "epoch": 772} {"train_loss": -10.575294494628906, "global_step": 129756, "epoch": 772} {"train_loss": -10.535429000854492, "global_step": 129757, "epoch": 772} {"train_loss": -10.376993179321289, "global_step": 129758, "epoch": 772} {"train_loss": -10.494287490844727, "global_step": 129759, "epoch": 772} {"train_loss": -10.558914184570312, "global_step": 129760, "epoch": 772} {"train_loss": -10.410017967224121, "global_step": 129761, "epoch": 772} {"train_loss": -10.425444602966309, "global_step": 129762, "epoch": 772} {"train_loss": -10.219781875610352, "global_step": 129763, "epoch": 772} {"train_loss": -10.486940383911133, "global_step": 129764, "epoch": 772} {"train_loss": -10.068077087402344, "global_step": 129765, "epoch": 772} {"train_loss": -10.513071060180664, "global_step": 129766, "epoch": 772} {"train_loss": -9.620792388916016, "global_step": 129767, "epoch": 772} {"train_loss": -9.516013145446777, "global_step": 129768, "epoch": 772} {"train_loss": -10.001462936401367, "global_step": 129769, "epoch": 772} {"train_loss": -9.291794776916504, "global_step": 129770, "epoch": 772} {"train_loss": -9.983575820922852, "global_step": 129771, "epoch": 772} {"train_loss": -9.725831985473633, "global_step": 129772, "epoch": 772} {"train_loss": -9.779081344604492, "global_step": 129773, "epoch": 772} {"train_loss": -10.073488235473633, "global_step": 129774, "epoch": 772} {"train_loss": -9.957549095153809, "global_step": 129775, "epoch": 772} {"train_loss": -10.039755821228027, "global_step": 129776, "epoch": 772} {"train_loss": -9.866453170776367, "global_step": 129777, "epoch": 772} {"train_loss": -9.700443267822266, "global_step": 129778, "epoch": 772} {"train_loss": -9.664594650268555, "global_step": 129779, "epoch": 772} {"train_loss": -9.82745361328125, "global_step": 129780, "epoch": 772} {"train_loss": -9.641082763671875, "global_step": 129781, "epoch": 772} {"train_loss": -9.96415901184082, "global_step": 129782, "epoch": 772} {"train_loss": -9.646892547607422, "global_step": 129783, "epoch": 772} {"train_loss": -9.552976608276367, "global_step": 129784, "epoch": 772} {"train_loss": -10.026025772094727, "global_step": 129785, "epoch": 772} {"train_loss": -9.857170104980469, "global_step": 129786, "epoch": 772} {"train_loss": -10.154695510864258, "global_step": 129787, "epoch": 772} {"train_loss": -10.143339157104492, "global_step": 129788, "epoch": 772} {"train_loss": -9.965208053588867, "global_step": 129789, "epoch": 772} {"train_loss": -9.843179702758789, "global_step": 129790, "epoch": 772} {"train_loss": -10.51021957397461, "global_step": 129791, "epoch": 772} {"train_loss": -9.900575637817383, "global_step": 129792, "epoch": 772} {"train_loss": -10.148519515991211, "global_step": 129793, "epoch": 772} {"train_loss": -10.125029563903809, "global_step": 129794, "epoch": 772} {"train_loss": -10.039215087890625, "global_step": 129795, "epoch": 772} {"train_loss": -10.253570556640625, "global_step": 129796, "epoch": 772} {"train_loss": -9.920350074768066, "global_step": 129797, "epoch": 772} {"train_loss": -10.033405303955078, "global_step": 129798, "epoch": 772} {"train_loss": -10.292403221130371, "global_step": 129799, "epoch": 772} {"train_loss": -10.263426780700684, "global_step": 129800, "epoch": 772} {"train_loss": -10.021520614624023, "global_step": 129801, "epoch": 772} {"train_loss": -10.38481616973877, "global_step": 129802, "epoch": 772} {"train_loss": -10.167137145996094, "global_step": 129803, "epoch": 772} {"train_loss": -10.132569313049316, "global_step": 129804, "epoch": 772} {"train_loss": -10.416006088256836, "global_step": 129805, "epoch": 772} {"train_loss": -10.301151275634766, "global_step": 129806, "epoch": 772} {"train_loss": -10.260456085205078, "global_step": 129807, "epoch": 772} {"train_loss": -10.405949592590332, "global_step": 129808, "epoch": 772} {"train_loss": -10.143013000488281, "global_step": 129809, "epoch": 772} {"train_loss": -10.275253295898438, "global_step": 129810, "epoch": 772} {"train_loss": -10.473795890808105, "global_step": 129811, "epoch": 772} {"train_loss": -10.176369667053223, "global_step": 129812, "epoch": 772} {"train_loss": -10.480131149291992, "global_step": 129813, "epoch": 772} {"train_loss": -10.516368865966797, "global_step": 129814, "epoch": 772} {"train_loss": -10.151074409484863, "global_step": 129815, "epoch": 772} {"train_loss": -10.406578063964844, "global_step": 129816, "epoch": 772} {"train_loss": -9.814291954040527, "global_step": 129817, "epoch": 772} {"train_loss": -10.275164604187012, "global_step": 129818, "epoch": 772} {"train_loss": -10.318653106689453, "global_step": 129819, "epoch": 772} {"train_loss": -10.54376220703125, "global_step": 129820, "epoch": 772} {"train_loss": -10.488396644592285, "global_step": 129821, "epoch": 772} {"train_loss": -10.370363235473633, "global_step": 129822, "epoch": 772} {"train_loss": -10.585386276245117, "global_step": 129823, "epoch": 772} {"train_loss": -10.536127090454102, "global_step": 129824, "epoch": 772} {"train_loss": -10.756909370422363, "global_step": 129825, "epoch": 772} {"train_loss": -10.52243423461914, "global_step": 129826, "epoch": 772} {"train_loss": -10.364513397216797, "global_step": 129827, "epoch": 772} {"train_loss": -10.404401779174805, "global_step": 129828, "epoch": 772} {"train_loss": -10.513973236083984, "global_step": 129829, "epoch": 772} {"train_loss": -10.513830184936523, "global_step": 129830, "epoch": 772} {"train_loss": -10.403861999511719, "global_step": 129831, "epoch": 772} {"train_loss": -10.477707862854004, "global_step": 129832, "epoch": 772} {"train_loss": -10.43606185913086, "global_step": 129833, "epoch": 772} {"train_loss": -10.589696884155273, "global_step": 129834, "epoch": 772} {"train_loss": -10.212564468383789, "global_step": 129835, "epoch": 772} {"train_loss": -10.472618103027344, "global_step": 129836, "epoch": 772} {"train_loss": -10.132352828979492, "global_step": 129837, "epoch": 772} {"train_loss": -9.96159553527832, "global_step": 129838, "epoch": 772} {"train_loss": -10.575895309448242, "global_step": 129839, "epoch": 772} {"train_loss": -10.048748016357422, "global_step": 129840, "epoch": 772} {"train_loss": -10.213178634643555, "global_step": 129841, "epoch": 772} {"train_loss": -10.018199920654297, "global_step": 129842, "epoch": 772} {"train_loss": -10.206300735473633, "global_step": 129843, "epoch": 772} {"train_loss": -10.133626937866211, "global_step": 129844, "epoch": 772} {"train_loss": -9.484809875488281, "global_step": 129845, "epoch": 772} {"train_loss": -10.512748718261719, "global_step": 129846, "epoch": 772} {"train_loss": -9.478612899780273, "global_step": 129847, "epoch": 772} {"train_loss": -9.958585739135742, "global_step": 129848, "epoch": 772} {"train_loss": -9.933318138122559, "global_step": 129849, "epoch": 772} {"train_loss": -9.82235050201416, "global_step": 129850, "epoch": 772} {"train_loss": -10.101479530334473, "global_step": 129851, "epoch": 772} {"train_loss": -10.158323287963867, "global_step": 129852, "epoch": 772} {"train_loss": -9.774561882019043, "global_step": 129853, "epoch": 772} {"train_loss": -10.104175567626953, "global_step": 129854, "epoch": 772} {"train_loss": -9.330954551696777, "global_step": 129855, "epoch": 772} {"train_loss": -10.382068634033203, "global_step": 129856, "epoch": 772} {"train_loss": -9.574132919311523, "global_step": 129857, "epoch": 772} {"train_loss": -9.958484649658203, "global_step": 129858, "epoch": 772} {"train_loss": -9.979385375976562, "global_step": 129859, "epoch": 772} {"train_loss": -9.798140525817871, "global_step": 129860, "epoch": 772} {"train_loss": -10.30067253112793, "global_step": 129861, "epoch": 772} {"train_loss": -9.96867561340332, "global_step": 129862, "epoch": 772} {"train_loss": -10.226194489569892, "global_step": 129863, "epoch": 772, "val_loss": 221435.53125} {"train_loss": -10.232797622680664, "global_step": 129864, "epoch": 773} {"train_loss": -10.109643936157227, "global_step": 129865, "epoch": 773} {"train_loss": -10.34716796875, "global_step": 129866, "epoch": 773} {"train_loss": -10.05170726776123, "global_step": 129867, "epoch": 773} {"train_loss": -9.910603523254395, "global_step": 129868, "epoch": 773} {"train_loss": -9.899660110473633, "global_step": 129869, "epoch": 773} {"train_loss": -10.222709655761719, "global_step": 129870, "epoch": 773} {"train_loss": -10.462701797485352, "global_step": 129871, "epoch": 773} {"train_loss": -10.062251091003418, "global_step": 129872, "epoch": 773} {"train_loss": -10.45957088470459, "global_step": 129873, "epoch": 773} {"train_loss": -10.284804344177246, "global_step": 129874, "epoch": 773} {"train_loss": -10.556069374084473, "global_step": 129875, "epoch": 773} {"train_loss": -10.5177001953125, "global_step": 129876, "epoch": 773} {"train_loss": -10.376338005065918, "global_step": 129877, "epoch": 773} {"train_loss": -10.397329330444336, "global_step": 129878, "epoch": 773} {"train_loss": -10.716594696044922, "global_step": 129879, "epoch": 773} {"train_loss": -10.551741600036621, "global_step": 129880, "epoch": 773} {"train_loss": -10.691062927246094, "global_step": 129881, "epoch": 773} {"train_loss": -10.1519136428833, "global_step": 129882, "epoch": 773} {"train_loss": -10.528072357177734, "global_step": 129883, "epoch": 773} {"train_loss": -10.455862045288086, "global_step": 129884, "epoch": 773} {"train_loss": -10.641836166381836, "global_step": 129885, "epoch": 773} {"train_loss": -10.626794815063477, "global_step": 129886, "epoch": 773} {"train_loss": -10.4525146484375, "global_step": 129887, "epoch": 773} {"train_loss": -10.549440383911133, "global_step": 129888, "epoch": 773} {"train_loss": -10.767740249633789, "global_step": 129889, "epoch": 773} {"train_loss": -10.482288360595703, "global_step": 129890, "epoch": 773} {"train_loss": -10.490156173706055, "global_step": 129891, "epoch": 773} {"train_loss": -10.311729431152344, "global_step": 129892, "epoch": 773} {"train_loss": -10.67674732208252, "global_step": 129893, "epoch": 773} {"train_loss": -10.614009857177734, "global_step": 129894, "epoch": 773} {"train_loss": -10.60738754272461, "global_step": 129895, "epoch": 773} {"train_loss": -10.714143753051758, "global_step": 129896, "epoch": 773} {"train_loss": -10.618484497070312, "global_step": 129897, "epoch": 773} {"train_loss": -10.343013763427734, "global_step": 129898, "epoch": 773} {"train_loss": -10.509123802185059, "global_step": 129899, "epoch": 773} {"train_loss": -10.382640838623047, "global_step": 129900, "epoch": 773} {"train_loss": -10.414807319641113, "global_step": 129901, "epoch": 773} {"train_loss": -10.471624374389648, "global_step": 129902, "epoch": 773} {"train_loss": -9.453022003173828, "global_step": 129903, "epoch": 773} {"train_loss": -10.59334659576416, "global_step": 129904, "epoch": 773} {"train_loss": -9.873880386352539, "global_step": 129905, "epoch": 773} {"train_loss": -10.442302703857422, "global_step": 129906, "epoch": 773} {"train_loss": -10.27940559387207, "global_step": 129907, "epoch": 773} {"train_loss": -9.64997386932373, "global_step": 129908, "epoch": 773} {"train_loss": -10.688716888427734, "global_step": 129909, "epoch": 773} {"train_loss": -10.376840591430664, "global_step": 129910, "epoch": 773} {"train_loss": -10.304244995117188, "global_step": 129911, "epoch": 773} {"train_loss": -10.411190032958984, "global_step": 129912, "epoch": 773} {"train_loss": -10.47508430480957, "global_step": 129913, "epoch": 773} {"train_loss": -10.550922393798828, "global_step": 129914, "epoch": 773} {"train_loss": -10.13401985168457, "global_step": 129915, "epoch": 773} {"train_loss": -10.397893905639648, "global_step": 129916, "epoch": 773} {"train_loss": -9.963155746459961, "global_step": 129917, "epoch": 773} {"train_loss": -10.564870834350586, "global_step": 129918, "epoch": 773} {"train_loss": -10.526500701904297, "global_step": 129919, "epoch": 773} {"train_loss": -10.202696800231934, "global_step": 129920, "epoch": 773} {"train_loss": -10.749094009399414, "global_step": 129921, "epoch": 773} {"train_loss": -10.228429794311523, "global_step": 129922, "epoch": 773} {"train_loss": -10.412038803100586, "global_step": 129923, "epoch": 773} {"train_loss": -10.481334686279297, "global_step": 129924, "epoch": 773} {"train_loss": -10.3474702835083, "global_step": 129925, "epoch": 773} {"train_loss": -10.78799057006836, "global_step": 129926, "epoch": 773} {"train_loss": -10.472418785095215, "global_step": 129927, "epoch": 773} {"train_loss": -10.519758224487305, "global_step": 129928, "epoch": 773} {"train_loss": -10.582618713378906, "global_step": 129929, "epoch": 773} {"train_loss": -10.457693099975586, "global_step": 129930, "epoch": 773} {"train_loss": -10.302940368652344, "global_step": 129931, "epoch": 773} {"train_loss": -10.671051025390625, "global_step": 129932, "epoch": 773} {"train_loss": -10.560906410217285, "global_step": 129933, "epoch": 773} {"train_loss": -10.24404525756836, "global_step": 129934, "epoch": 773} {"train_loss": -10.511996269226074, "global_step": 129935, "epoch": 773} {"train_loss": -10.36965274810791, "global_step": 129936, "epoch": 773} {"train_loss": -9.826421737670898, "global_step": 129937, "epoch": 773} {"train_loss": -10.535835266113281, "global_step": 129938, "epoch": 773} {"train_loss": -10.55538558959961, "global_step": 129939, "epoch": 773} {"train_loss": -10.147454261779785, "global_step": 129940, "epoch": 773} {"train_loss": -10.149885177612305, "global_step": 129941, "epoch": 773} {"train_loss": -9.720376968383789, "global_step": 129942, "epoch": 773} {"train_loss": -10.341472625732422, "global_step": 129943, "epoch": 773} {"train_loss": -10.099292755126953, "global_step": 129944, "epoch": 773} {"train_loss": -10.399120330810547, "global_step": 129945, "epoch": 773} {"train_loss": -9.956941604614258, "global_step": 129946, "epoch": 773} {"train_loss": -10.049586296081543, "global_step": 129947, "epoch": 773} {"train_loss": -10.369714736938477, "global_step": 129948, "epoch": 773} {"train_loss": -10.131643295288086, "global_step": 129949, "epoch": 773} {"train_loss": -10.029886245727539, "global_step": 129950, "epoch": 773} {"train_loss": -10.180328369140625, "global_step": 129951, "epoch": 773} {"train_loss": -10.297680854797363, "global_step": 129952, "epoch": 773} {"train_loss": -9.930292129516602, "global_step": 129953, "epoch": 773} {"train_loss": -9.852252960205078, "global_step": 129954, "epoch": 773} {"train_loss": -9.703123092651367, "global_step": 129955, "epoch": 773} {"train_loss": -10.251020431518555, "global_step": 129956, "epoch": 773} {"train_loss": -9.674192428588867, "global_step": 129957, "epoch": 773} {"train_loss": -9.979936599731445, "global_step": 129958, "epoch": 773} {"train_loss": -10.267061233520508, "global_step": 129959, "epoch": 773} {"train_loss": -10.145240783691406, "global_step": 129960, "epoch": 773} {"train_loss": -10.176553726196289, "global_step": 129961, "epoch": 773} {"train_loss": -10.459890365600586, "global_step": 129962, "epoch": 773} {"train_loss": -10.27231216430664, "global_step": 129963, "epoch": 773} {"train_loss": -10.529726028442383, "global_step": 129964, "epoch": 773} {"train_loss": -10.047701835632324, "global_step": 129965, "epoch": 773} {"train_loss": -10.443268775939941, "global_step": 129966, "epoch": 773} {"train_loss": -10.084684371948242, "global_step": 129967, "epoch": 773} {"train_loss": -9.994171142578125, "global_step": 129968, "epoch": 773} {"train_loss": -10.198183059692383, "global_step": 129969, "epoch": 773} {"train_loss": -10.266742706298828, "global_step": 129970, "epoch": 773} {"train_loss": -10.135629653930664, "global_step": 129971, "epoch": 773} {"train_loss": -10.219616889953613, "global_step": 129972, "epoch": 773} {"train_loss": -10.2586088180542, "global_step": 129973, "epoch": 773} {"train_loss": -10.206963539123535, "global_step": 129974, "epoch": 773} {"train_loss": -10.071707725524902, "global_step": 129975, "epoch": 773} {"train_loss": -10.006399154663086, "global_step": 129976, "epoch": 773} {"train_loss": -10.207928657531738, "global_step": 129977, "epoch": 773} {"train_loss": -9.984404563903809, "global_step": 129978, "epoch": 773} {"train_loss": -9.855878829956055, "global_step": 129979, "epoch": 773} {"train_loss": -10.614644050598145, "global_step": 129980, "epoch": 773} {"train_loss": -10.235244750976562, "global_step": 129981, "epoch": 773} {"train_loss": -10.276690483093262, "global_step": 129982, "epoch": 773} {"train_loss": -9.985143661499023, "global_step": 129983, "epoch": 773} {"train_loss": -10.395936012268066, "global_step": 129984, "epoch": 773} {"train_loss": -10.28570556640625, "global_step": 129985, "epoch": 773} {"train_loss": -10.483471870422363, "global_step": 129986, "epoch": 773} {"train_loss": -10.430730819702148, "global_step": 129987, "epoch": 773} {"train_loss": -10.406808853149414, "global_step": 129988, "epoch": 773} {"train_loss": -10.190051078796387, "global_step": 129989, "epoch": 773} {"train_loss": -10.43644905090332, "global_step": 129990, "epoch": 773} {"train_loss": -10.439046859741211, "global_step": 129991, "epoch": 773} {"train_loss": -10.361428260803223, "global_step": 129992, "epoch": 773} {"train_loss": -10.480252265930176, "global_step": 129993, "epoch": 773} {"train_loss": -10.548379898071289, "global_step": 129994, "epoch": 773} {"train_loss": -10.656933784484863, "global_step": 129995, "epoch": 773} {"train_loss": -10.694406509399414, "global_step": 129996, "epoch": 773} {"train_loss": -10.54570198059082, "global_step": 129997, "epoch": 773} {"train_loss": -10.733278274536133, "global_step": 129998, "epoch": 773} {"train_loss": -10.758659362792969, "global_step": 129999, "epoch": 773} {"train_loss": -10.731937408447266, "global_step": 130000, "epoch": 773} {"train_loss": -10.54680347442627, "global_step": 130001, "epoch": 773} {"train_loss": -10.317989349365234, "global_step": 130002, "epoch": 773} {"train_loss": -10.531591415405273, "global_step": 130003, "epoch": 773} {"train_loss": -10.697813987731934, "global_step": 130004, "epoch": 773} {"train_loss": -10.36933708190918, "global_step": 130005, "epoch": 773} {"train_loss": -10.241338729858398, "global_step": 130006, "epoch": 773} {"train_loss": -10.444608688354492, "global_step": 130007, "epoch": 773} {"train_loss": -10.614341735839844, "global_step": 130008, "epoch": 773} {"train_loss": -10.501909255981445, "global_step": 130009, "epoch": 773} {"train_loss": -10.54238510131836, "global_step": 130010, "epoch": 773} {"train_loss": -10.51806926727295, "global_step": 130011, "epoch": 773} {"train_loss": -10.437780380249023, "global_step": 130012, "epoch": 773} {"train_loss": -10.45740032196045, "global_step": 130013, "epoch": 773} {"train_loss": -10.717668533325195, "global_step": 130014, "epoch": 773} {"train_loss": -10.595497131347656, "global_step": 130015, "epoch": 773} {"train_loss": -10.508543014526367, "global_step": 130016, "epoch": 773} {"train_loss": -10.193334579467773, "global_step": 130017, "epoch": 773} {"train_loss": -10.676077842712402, "global_step": 130018, "epoch": 773} {"train_loss": -10.426980972290039, "global_step": 130019, "epoch": 773} {"train_loss": -10.175233840942383, "global_step": 130020, "epoch": 773} {"train_loss": -10.323905944824219, "global_step": 130021, "epoch": 773} {"train_loss": -10.393400192260742, "global_step": 130022, "epoch": 773} {"train_loss": -10.187814712524414, "global_step": 130023, "epoch": 773} {"train_loss": -10.400236129760742, "global_step": 130024, "epoch": 773} {"train_loss": -10.397528648376465, "global_step": 130025, "epoch": 773} {"train_loss": -9.933408737182617, "global_step": 130026, "epoch": 773} {"train_loss": -10.404272079467773, "global_step": 130027, "epoch": 773} {"train_loss": -9.781980514526367, "global_step": 130028, "epoch": 773} {"train_loss": -10.150687217712402, "global_step": 130029, "epoch": 773} {"train_loss": -9.563814163208008, "global_step": 130030, "epoch": 773} {"train_loss": -10.332789284842354, "global_step": 130031, "epoch": 773, "val_loss": 220824.5} {"train_loss": -10.441705703735352, "global_step": 130032, "epoch": 774} {"train_loss": -9.829439163208008, "global_step": 130033, "epoch": 774} {"train_loss": -10.518550872802734, "global_step": 130034, "epoch": 774} {"train_loss": -10.068903923034668, "global_step": 130035, "epoch": 774} {"train_loss": -10.461097717285156, "global_step": 130036, "epoch": 774} {"train_loss": -9.970871925354004, "global_step": 130037, "epoch": 774} {"train_loss": -10.284811973571777, "global_step": 130038, "epoch": 774} {"train_loss": -10.609569549560547, "global_step": 130039, "epoch": 774} {"train_loss": -10.46297836303711, "global_step": 130040, "epoch": 774} {"train_loss": -10.567416191101074, "global_step": 130041, "epoch": 774} {"train_loss": -10.380607604980469, "global_step": 130042, "epoch": 774} {"train_loss": -10.526047706604004, "global_step": 130043, "epoch": 774} {"train_loss": -10.049737930297852, "global_step": 130044, "epoch": 774} {"train_loss": -10.294366836547852, "global_step": 130045, "epoch": 774} {"train_loss": -10.14462661743164, "global_step": 130046, "epoch": 774} {"train_loss": -10.424324035644531, "global_step": 130047, "epoch": 774} {"train_loss": -10.260514259338379, "global_step": 130048, "epoch": 774} {"train_loss": -10.26176929473877, "global_step": 130049, "epoch": 774} {"train_loss": -10.149065017700195, "global_step": 130050, "epoch": 774} {"train_loss": -10.318069458007812, "global_step": 130051, "epoch": 774} {"train_loss": -10.334871292114258, "global_step": 130052, "epoch": 774} {"train_loss": -10.120025634765625, "global_step": 130053, "epoch": 774} {"train_loss": -10.344446182250977, "global_step": 130054, "epoch": 774} {"train_loss": -10.410831451416016, "global_step": 130055, "epoch": 774} {"train_loss": -10.409454345703125, "global_step": 130056, "epoch": 774} {"train_loss": -10.563191413879395, "global_step": 130057, "epoch": 774} {"train_loss": -10.564854621887207, "global_step": 130058, "epoch": 774} {"train_loss": -10.420063018798828, "global_step": 130059, "epoch": 774} {"train_loss": -10.33584976196289, "global_step": 130060, "epoch": 774} {"train_loss": -10.494335174560547, "global_step": 130061, "epoch": 774} {"train_loss": -9.623228073120117, "global_step": 130062, "epoch": 774} {"train_loss": -10.559356689453125, "global_step": 130063, "epoch": 774} {"train_loss": -9.88525390625, "global_step": 130064, "epoch": 774} {"train_loss": -10.466154098510742, "global_step": 130065, "epoch": 774} {"train_loss": -10.399066925048828, "global_step": 130066, "epoch": 774} {"train_loss": -10.231897354125977, "global_step": 130067, "epoch": 774} {"train_loss": -10.443446159362793, "global_step": 130068, "epoch": 774} {"train_loss": -10.45621109008789, "global_step": 130069, "epoch": 774} {"train_loss": -10.468658447265625, "global_step": 130070, "epoch": 774} {"train_loss": -10.076231956481934, "global_step": 130071, "epoch": 774} {"train_loss": -10.520280838012695, "global_step": 130072, "epoch": 774} {"train_loss": -10.36034107208252, "global_step": 130073, "epoch": 774} {"train_loss": -10.594982147216797, "global_step": 130074, "epoch": 774} {"train_loss": -10.402935028076172, "global_step": 130075, "epoch": 774} {"train_loss": -10.592530250549316, "global_step": 130076, "epoch": 774} {"train_loss": -10.706722259521484, "global_step": 130077, "epoch": 774} {"train_loss": -10.2347412109375, "global_step": 130078, "epoch": 774} {"train_loss": -10.456260681152344, "global_step": 130079, "epoch": 774} {"train_loss": -10.209587097167969, "global_step": 130080, "epoch": 774} {"train_loss": -10.013936996459961, "global_step": 130081, "epoch": 774} {"train_loss": -10.335445404052734, "global_step": 130082, "epoch": 774} {"train_loss": -10.408967971801758, "global_step": 130083, "epoch": 774} {"train_loss": -10.058551788330078, "global_step": 130084, "epoch": 774} {"train_loss": -10.344457626342773, "global_step": 130085, "epoch": 774} {"train_loss": -10.261161804199219, "global_step": 130086, "epoch": 774} {"train_loss": -10.220399856567383, "global_step": 130087, "epoch": 774} {"train_loss": -10.404203414916992, "global_step": 130088, "epoch": 774} {"train_loss": -9.360546112060547, "global_step": 130089, "epoch": 774} {"train_loss": -10.458263397216797, "global_step": 130090, "epoch": 774} {"train_loss": -9.958988189697266, "global_step": 130091, "epoch": 774} {"train_loss": -10.350364685058594, "global_step": 130092, "epoch": 774} {"train_loss": -10.18509292602539, "global_step": 130093, "epoch": 774} {"train_loss": -9.42939567565918, "global_step": 130094, "epoch": 774} {"train_loss": -10.589431762695312, "global_step": 130095, "epoch": 774} {"train_loss": -9.689460754394531, "global_step": 130096, "epoch": 774} {"train_loss": -10.571099281311035, "global_step": 130097, "epoch": 774} {"train_loss": -10.161209106445312, "global_step": 130098, "epoch": 774} {"train_loss": -10.274093627929688, "global_step": 130099, "epoch": 774} {"train_loss": -9.777959823608398, "global_step": 130100, "epoch": 774} {"train_loss": -10.332534790039062, "global_step": 130101, "epoch": 774} {"train_loss": -10.226280212402344, "global_step": 130102, "epoch": 774} {"train_loss": -10.386815071105957, "global_step": 130103, "epoch": 774} {"train_loss": -10.416449546813965, "global_step": 130104, "epoch": 774} {"train_loss": -10.214048385620117, "global_step": 130105, "epoch": 774} {"train_loss": -10.095643997192383, "global_step": 130106, "epoch": 774} {"train_loss": -10.478925704956055, "global_step": 130107, "epoch": 774} {"train_loss": -9.979713439941406, "global_step": 130108, "epoch": 774} {"train_loss": -10.489175796508789, "global_step": 130109, "epoch": 774} {"train_loss": -10.405537605285645, "global_step": 130110, "epoch": 774} {"train_loss": -10.152162551879883, "global_step": 130111, "epoch": 774} {"train_loss": -10.414749145507812, "global_step": 130112, "epoch": 774} {"train_loss": -10.26585865020752, "global_step": 130113, "epoch": 774} {"train_loss": -10.728822708129883, "global_step": 130114, "epoch": 774} {"train_loss": -10.531253814697266, "global_step": 130115, "epoch": 774} {"train_loss": -10.484496116638184, "global_step": 130116, "epoch": 774} {"train_loss": -10.396890640258789, "global_step": 130117, "epoch": 774} {"train_loss": -10.467696189880371, "global_step": 130118, "epoch": 774} {"train_loss": -10.110128402709961, "global_step": 130119, "epoch": 774} {"train_loss": -10.39582633972168, "global_step": 130120, "epoch": 774} {"train_loss": -10.324334144592285, "global_step": 130121, "epoch": 774} {"train_loss": -10.372777938842773, "global_step": 130122, "epoch": 774} {"train_loss": -10.403121948242188, "global_step": 130123, "epoch": 774} {"train_loss": -10.398309707641602, "global_step": 130124, "epoch": 774} {"train_loss": -10.288187026977539, "global_step": 130125, "epoch": 774} {"train_loss": -10.320068359375, "global_step": 130126, "epoch": 774} {"train_loss": -10.427054405212402, "global_step": 130127, "epoch": 774} {"train_loss": -10.502758026123047, "global_step": 130128, "epoch": 774} {"train_loss": -10.516115188598633, "global_step": 130129, "epoch": 774} {"train_loss": -10.396588325500488, "global_step": 130130, "epoch": 774} {"train_loss": -10.675023078918457, "global_step": 130131, "epoch": 774} {"train_loss": -10.543619155883789, "global_step": 130132, "epoch": 774} {"train_loss": -10.582290649414062, "global_step": 130133, "epoch": 774} {"train_loss": -10.595133781433105, "global_step": 130134, "epoch": 774} {"train_loss": -10.24665641784668, "global_step": 130135, "epoch": 774} {"train_loss": -10.200284004211426, "global_step": 130136, "epoch": 774} {"train_loss": -10.492524147033691, "global_step": 130137, "epoch": 774} {"train_loss": -10.629000663757324, "global_step": 130138, "epoch": 774} {"train_loss": -10.232752799987793, "global_step": 130139, "epoch": 774} {"train_loss": -10.295116424560547, "global_step": 130140, "epoch": 774} {"train_loss": -9.917430877685547, "global_step": 130141, "epoch": 774} {"train_loss": -10.331140518188477, "global_step": 130142, "epoch": 774} {"train_loss": -10.231695175170898, "global_step": 130143, "epoch": 774} {"train_loss": -10.29127311706543, "global_step": 130144, "epoch": 774} {"train_loss": -10.522930145263672, "global_step": 130145, "epoch": 774} {"train_loss": -10.366525650024414, "global_step": 130146, "epoch": 774} {"train_loss": -10.339241981506348, "global_step": 130147, "epoch": 774} {"train_loss": -10.186896324157715, "global_step": 130148, "epoch": 774} {"train_loss": -9.743758201599121, "global_step": 130149, "epoch": 774} {"train_loss": -10.125033378601074, "global_step": 130150, "epoch": 774} {"train_loss": -10.286792755126953, "global_step": 130151, "epoch": 774} {"train_loss": -10.052555084228516, "global_step": 130152, "epoch": 774} {"train_loss": -10.440408706665039, "global_step": 130153, "epoch": 774} {"train_loss": -10.149873733520508, "global_step": 130154, "epoch": 774} {"train_loss": -10.216999053955078, "global_step": 130155, "epoch": 774} {"train_loss": -10.306434631347656, "global_step": 130156, "epoch": 774} {"train_loss": -10.5081205368042, "global_step": 130157, "epoch": 774} {"train_loss": -10.35766887664795, "global_step": 130158, "epoch": 774} {"train_loss": -10.530664443969727, "global_step": 130159, "epoch": 774} {"train_loss": -10.094480514526367, "global_step": 130160, "epoch": 774} {"train_loss": -10.535658836364746, "global_step": 130161, "epoch": 774} {"train_loss": -10.408597946166992, "global_step": 130162, "epoch": 774} {"train_loss": -10.403486251831055, "global_step": 130163, "epoch": 774} {"train_loss": -10.502429962158203, "global_step": 130164, "epoch": 774} {"train_loss": -10.654313087463379, "global_step": 130165, "epoch": 774} {"train_loss": -10.329136848449707, "global_step": 130166, "epoch": 774} {"train_loss": -10.115039825439453, "global_step": 130167, "epoch": 774} {"train_loss": -10.283857345581055, "global_step": 130168, "epoch": 774} {"train_loss": -9.998592376708984, "global_step": 130169, "epoch": 774} {"train_loss": -10.335811614990234, "global_step": 130170, "epoch": 774} {"train_loss": -9.819255828857422, "global_step": 130171, "epoch": 774} {"train_loss": -10.593643188476562, "global_step": 130172, "epoch": 774} {"train_loss": -9.972769737243652, "global_step": 130173, "epoch": 774} {"train_loss": -10.29372501373291, "global_step": 130174, "epoch": 774} {"train_loss": -10.184955596923828, "global_step": 130175, "epoch": 774} {"train_loss": -9.99821662902832, "global_step": 130176, "epoch": 774} {"train_loss": -10.196016311645508, "global_step": 130177, "epoch": 774} {"train_loss": -10.317708969116211, "global_step": 130178, "epoch": 774} {"train_loss": -10.01945686340332, "global_step": 130179, "epoch": 774} {"train_loss": -10.325898170471191, "global_step": 130180, "epoch": 774} {"train_loss": -9.875468254089355, "global_step": 130181, "epoch": 774} {"train_loss": -9.9700288772583, "global_step": 130182, "epoch": 774} {"train_loss": -9.81986141204834, "global_step": 130183, "epoch": 774} {"train_loss": -10.204200744628906, "global_step": 130184, "epoch": 774} {"train_loss": -10.169910430908203, "global_step": 130185, "epoch": 774} {"train_loss": -10.284866333007812, "global_step": 130186, "epoch": 774} {"train_loss": -10.294748306274414, "global_step": 130187, "epoch": 774} {"train_loss": -10.280120849609375, "global_step": 130188, "epoch": 774} {"train_loss": -10.202356338500977, "global_step": 130189, "epoch": 774} {"train_loss": -10.16462516784668, "global_step": 130190, "epoch": 774} {"train_loss": -10.338946342468262, "global_step": 130191, "epoch": 774} {"train_loss": -10.20686149597168, "global_step": 130192, "epoch": 774} {"train_loss": -10.047584533691406, "global_step": 130193, "epoch": 774} {"train_loss": -10.172295570373535, "global_step": 130194, "epoch": 774} {"train_loss": -9.997687339782715, "global_step": 130195, "epoch": 774} {"train_loss": -10.152854919433594, "global_step": 130196, "epoch": 774} {"train_loss": -10.050973892211914, "global_step": 130197, "epoch": 774} {"train_loss": -10.339282989501953, "global_step": 130198, "epoch": 774} {"train_loss": -10.285656418119158, "global_step": 130199, "epoch": 774, "val_loss": 218523.484375} {"train_loss": -10.388284683227539, "global_step": 130200, "epoch": 775} {"train_loss": -10.5001859664917, "global_step": 130201, "epoch": 775} {"train_loss": -10.47336196899414, "global_step": 130202, "epoch": 775} {"train_loss": -10.377691268920898, "global_step": 130203, "epoch": 775} {"train_loss": -10.571403503417969, "global_step": 130204, "epoch": 775} {"train_loss": -10.269272804260254, "global_step": 130205, "epoch": 775} {"train_loss": -10.49341869354248, "global_step": 130206, "epoch": 775} {"train_loss": -10.474494934082031, "global_step": 130207, "epoch": 775} {"train_loss": -10.439817428588867, "global_step": 130208, "epoch": 775} {"train_loss": -10.535921096801758, "global_step": 130209, "epoch": 775} {"train_loss": -10.524740219116211, "global_step": 130210, "epoch": 775} {"train_loss": -10.29931354522705, "global_step": 130211, "epoch": 775} {"train_loss": -10.537010192871094, "global_step": 130212, "epoch": 775} {"train_loss": -10.681386947631836, "global_step": 130213, "epoch": 775} {"train_loss": -10.59377670288086, "global_step": 130214, "epoch": 775} {"train_loss": -10.42886734008789, "global_step": 130215, "epoch": 775} {"train_loss": -10.563711166381836, "global_step": 130216, "epoch": 775} {"train_loss": -10.453720092773438, "global_step": 130217, "epoch": 775} {"train_loss": -10.518379211425781, "global_step": 130218, "epoch": 775} {"train_loss": -10.714717864990234, "global_step": 130219, "epoch": 775} {"train_loss": -10.37411880493164, "global_step": 130220, "epoch": 775} {"train_loss": -10.7589111328125, "global_step": 130221, "epoch": 775} {"train_loss": -10.600909233093262, "global_step": 130222, "epoch": 775} {"train_loss": -10.482162475585938, "global_step": 130223, "epoch": 775} {"train_loss": -10.584003448486328, "global_step": 130224, "epoch": 775} {"train_loss": -10.409501075744629, "global_step": 130225, "epoch": 775} {"train_loss": -10.61509895324707, "global_step": 130226, "epoch": 775} {"train_loss": -10.616912841796875, "global_step": 130227, "epoch": 775} {"train_loss": -10.158321380615234, "global_step": 130228, "epoch": 775} {"train_loss": -10.55093002319336, "global_step": 130229, "epoch": 775} {"train_loss": -10.000133514404297, "global_step": 130230, "epoch": 775} {"train_loss": -10.322834014892578, "global_step": 130231, "epoch": 775} {"train_loss": -10.072772026062012, "global_step": 130232, "epoch": 775} {"train_loss": -9.613069534301758, "global_step": 130233, "epoch": 775} {"train_loss": -10.472562789916992, "global_step": 130234, "epoch": 775} {"train_loss": -9.703514099121094, "global_step": 130235, "epoch": 775} {"train_loss": -10.1639404296875, "global_step": 130236, "epoch": 775} {"train_loss": -10.093387603759766, "global_step": 130237, "epoch": 775} {"train_loss": -10.300039291381836, "global_step": 130238, "epoch": 775} {"train_loss": -10.490501403808594, "global_step": 130239, "epoch": 775} {"train_loss": -9.583427429199219, "global_step": 130240, "epoch": 775} {"train_loss": -10.291654586791992, "global_step": 130241, "epoch": 775} {"train_loss": -10.131584167480469, "global_step": 130242, "epoch": 775} {"train_loss": -10.425926208496094, "global_step": 130243, "epoch": 775} {"train_loss": -9.963315963745117, "global_step": 130244, "epoch": 775} {"train_loss": -10.230292320251465, "global_step": 130245, "epoch": 775} {"train_loss": -10.25698471069336, "global_step": 130246, "epoch": 775} {"train_loss": -10.097257614135742, "global_step": 130247, "epoch": 775} {"train_loss": -10.119850158691406, "global_step": 130248, "epoch": 775} {"train_loss": -10.254663467407227, "global_step": 130249, "epoch": 775} {"train_loss": -10.27639389038086, "global_step": 130250, "epoch": 775} {"train_loss": -10.559161186218262, "global_step": 130251, "epoch": 775} {"train_loss": -10.397449493408203, "global_step": 130252, "epoch": 775} {"train_loss": -10.126928329467773, "global_step": 130253, "epoch": 775} {"train_loss": -10.407812118530273, "global_step": 130254, "epoch": 775} {"train_loss": -9.914169311523438, "global_step": 130255, "epoch": 775} {"train_loss": -10.062662124633789, "global_step": 130256, "epoch": 775} {"train_loss": -10.179109573364258, "global_step": 130257, "epoch": 775} {"train_loss": -9.98530101776123, "global_step": 130258, "epoch": 775} {"train_loss": -10.151275634765625, "global_step": 130259, "epoch": 775} {"train_loss": -10.509954452514648, "global_step": 130260, "epoch": 775} {"train_loss": -9.782570838928223, "global_step": 130261, "epoch": 775} {"train_loss": -10.490900993347168, "global_step": 130262, "epoch": 775} {"train_loss": -10.217641830444336, "global_step": 130263, "epoch": 775} {"train_loss": -10.46275520324707, "global_step": 130264, "epoch": 775} {"train_loss": -10.18884563446045, "global_step": 130265, "epoch": 775} {"train_loss": -10.281810760498047, "global_step": 130266, "epoch": 775} {"train_loss": -9.778828620910645, "global_step": 130267, "epoch": 775} {"train_loss": -10.297294616699219, "global_step": 130268, "epoch": 775} {"train_loss": -10.031818389892578, "global_step": 130269, "epoch": 775} {"train_loss": -10.240184783935547, "global_step": 130270, "epoch": 775} {"train_loss": -10.160905838012695, "global_step": 130271, "epoch": 775} {"train_loss": -9.99445915222168, "global_step": 130272, "epoch": 775} {"train_loss": -10.285721778869629, "global_step": 130273, "epoch": 775} {"train_loss": -10.459829330444336, "global_step": 130274, "epoch": 775} {"train_loss": -10.61166763305664, "global_step": 130275, "epoch": 775} {"train_loss": -10.15300178527832, "global_step": 130276, "epoch": 775} {"train_loss": -10.508722305297852, "global_step": 130277, "epoch": 775} {"train_loss": -10.500810623168945, "global_step": 130278, "epoch": 775} {"train_loss": -10.478887557983398, "global_step": 130279, "epoch": 775} {"train_loss": -10.537691116333008, "global_step": 130280, "epoch": 775} {"train_loss": -10.567131996154785, "global_step": 130281, "epoch": 775} {"train_loss": -10.535608291625977, "global_step": 130282, "epoch": 775} {"train_loss": -10.6052885055542, "global_step": 130283, "epoch": 775} {"train_loss": -10.542753219604492, "global_step": 130284, "epoch": 775} {"train_loss": -10.515093803405762, "global_step": 130285, "epoch": 775} {"train_loss": -10.37575912475586, "global_step": 130286, "epoch": 775} {"train_loss": -10.460884094238281, "global_step": 130287, "epoch": 775} {"train_loss": -10.420082092285156, "global_step": 130288, "epoch": 775} {"train_loss": -10.535459518432617, "global_step": 130289, "epoch": 775} {"train_loss": -10.620667457580566, "global_step": 130290, "epoch": 775} {"train_loss": -10.713951110839844, "global_step": 130291, "epoch": 775} {"train_loss": -10.619585990905762, "global_step": 130292, "epoch": 775} {"train_loss": -10.74969482421875, "global_step": 130293, "epoch": 775} {"train_loss": -10.402329444885254, "global_step": 130294, "epoch": 775} {"train_loss": -10.272339820861816, "global_step": 130295, "epoch": 775} {"train_loss": -10.170309066772461, "global_step": 130296, "epoch": 775} {"train_loss": -9.838815689086914, "global_step": 130297, "epoch": 775} {"train_loss": -10.479323387145996, "global_step": 130298, "epoch": 775} {"train_loss": -10.152053833007812, "global_step": 130299, "epoch": 775} {"train_loss": -10.681183815002441, "global_step": 130300, "epoch": 775} {"train_loss": -10.303878784179688, "global_step": 130301, "epoch": 775} {"train_loss": -10.488389015197754, "global_step": 130302, "epoch": 775} {"train_loss": -10.376446723937988, "global_step": 130303, "epoch": 775} {"train_loss": -10.487879753112793, "global_step": 130304, "epoch": 775} {"train_loss": -10.025296211242676, "global_step": 130305, "epoch": 775} {"train_loss": -10.389532089233398, "global_step": 130306, "epoch": 775} {"train_loss": -9.903178215026855, "global_step": 130307, "epoch": 775} {"train_loss": -10.181482315063477, "global_step": 130308, "epoch": 775} {"train_loss": -10.43489933013916, "global_step": 130309, "epoch": 775} {"train_loss": -10.270354270935059, "global_step": 130310, "epoch": 775} {"train_loss": -10.32640266418457, "global_step": 130311, "epoch": 775} {"train_loss": -10.339786529541016, "global_step": 130312, "epoch": 775} {"train_loss": -9.890026092529297, "global_step": 130313, "epoch": 775} {"train_loss": -10.425713539123535, "global_step": 130314, "epoch": 775} {"train_loss": -10.195917129516602, "global_step": 130315, "epoch": 775} {"train_loss": -9.806167602539062, "global_step": 130316, "epoch": 775} {"train_loss": -10.374835968017578, "global_step": 130317, "epoch": 775} {"train_loss": -9.747557640075684, "global_step": 130318, "epoch": 775} {"train_loss": -10.065263748168945, "global_step": 130319, "epoch": 775} {"train_loss": -9.70199203491211, "global_step": 130320, "epoch": 775} {"train_loss": -10.314094543457031, "global_step": 130321, "epoch": 775} {"train_loss": -10.153145790100098, "global_step": 130322, "epoch": 775} {"train_loss": -10.194862365722656, "global_step": 130323, "epoch": 775} {"train_loss": -10.703632354736328, "global_step": 130324, "epoch": 775} {"train_loss": -10.132922172546387, "global_step": 130325, "epoch": 775} {"train_loss": -10.232464790344238, "global_step": 130326, "epoch": 775} {"train_loss": -10.350774765014648, "global_step": 130327, "epoch": 775} {"train_loss": -10.380952835083008, "global_step": 130328, "epoch": 775} {"train_loss": -10.654143333435059, "global_step": 130329, "epoch": 775} {"train_loss": -10.11836051940918, "global_step": 130330, "epoch": 775} {"train_loss": -10.373157501220703, "global_step": 130331, "epoch": 775} {"train_loss": -10.687755584716797, "global_step": 130332, "epoch": 775} {"train_loss": -10.542880058288574, "global_step": 130333, "epoch": 775} {"train_loss": -10.347156524658203, "global_step": 130334, "epoch": 775} {"train_loss": -10.335342407226562, "global_step": 130335, "epoch": 775} {"train_loss": -10.412071228027344, "global_step": 130336, "epoch": 775} {"train_loss": -10.51338005065918, "global_step": 130337, "epoch": 775} {"train_loss": -10.275842666625977, "global_step": 130338, "epoch": 775} {"train_loss": -10.472326278686523, "global_step": 130339, "epoch": 775} {"train_loss": -10.28562068939209, "global_step": 130340, "epoch": 775} {"train_loss": -10.46622085571289, "global_step": 130341, "epoch": 775} {"train_loss": -10.520807266235352, "global_step": 130342, "epoch": 775} {"train_loss": -10.222932815551758, "global_step": 130343, "epoch": 775} {"train_loss": -10.405604362487793, "global_step": 130344, "epoch": 775} {"train_loss": -10.04838752746582, "global_step": 130345, "epoch": 775} {"train_loss": -10.334296226501465, "global_step": 130346, "epoch": 775} {"train_loss": -10.499332427978516, "global_step": 130347, "epoch": 775} {"train_loss": -10.540943145751953, "global_step": 130348, "epoch": 775} {"train_loss": -10.62604808807373, "global_step": 130349, "epoch": 775} {"train_loss": -10.430834770202637, "global_step": 130350, "epoch": 775} {"train_loss": -10.621334075927734, "global_step": 130351, "epoch": 775} {"train_loss": -10.486600875854492, "global_step": 130352, "epoch": 775} {"train_loss": -10.50721549987793, "global_step": 130353, "epoch": 775} {"train_loss": -10.583036422729492, "global_step": 130354, "epoch": 775} {"train_loss": -10.622252464294434, "global_step": 130355, "epoch": 775} {"train_loss": -10.419218063354492, "global_step": 130356, "epoch": 775} {"train_loss": -10.61317253112793, "global_step": 130357, "epoch": 775} {"train_loss": -10.824146270751953, "global_step": 130358, "epoch": 775} {"train_loss": -10.445362091064453, "global_step": 130359, "epoch": 775} {"train_loss": -10.566573143005371, "global_step": 130360, "epoch": 775} {"train_loss": -10.753583908081055, "global_step": 130361, "epoch": 775} {"train_loss": -10.252462387084961, "global_step": 130362, "epoch": 775} {"train_loss": -10.648487091064453, "global_step": 130363, "epoch": 775} {"train_loss": -10.588934898376465, "global_step": 130364, "epoch": 775} {"train_loss": -10.520705223083496, "global_step": 130365, "epoch": 775} {"train_loss": -10.595144271850586, "global_step": 130366, "epoch": 775} {"train_loss": -10.354793968654814, "global_step": 130367, "epoch": 775, "val_loss": 221274.6875, "train_action_mse_error": 1.416914463043213} {"train_loss": -10.536982536315918, "global_step": 130368, "epoch": 776} {"train_loss": -9.830482482910156, "global_step": 130369, "epoch": 776} {"train_loss": -9.655660629272461, "global_step": 130370, "epoch": 776} {"train_loss": -10.169960021972656, "global_step": 130371, "epoch": 776} {"train_loss": -10.410503387451172, "global_step": 130372, "epoch": 776} {"train_loss": -10.020681381225586, "global_step": 130373, "epoch": 776} {"train_loss": -10.188611030578613, "global_step": 130374, "epoch": 776} {"train_loss": -10.100557327270508, "global_step": 130375, "epoch": 776} {"train_loss": -8.423116683959961, "global_step": 130376, "epoch": 776} {"train_loss": -10.035261154174805, "global_step": 130377, "epoch": 776} {"train_loss": -8.787348747253418, "global_step": 130378, "epoch": 776} {"train_loss": -10.388930320739746, "global_step": 130379, "epoch": 776} {"train_loss": -8.10693359375, "global_step": 130380, "epoch": 776} {"train_loss": -9.335118293762207, "global_step": 130381, "epoch": 776} {"train_loss": -9.176513671875, "global_step": 130382, "epoch": 776} {"train_loss": -9.967580795288086, "global_step": 130383, "epoch": 776} {"train_loss": -9.198042869567871, "global_step": 130384, "epoch": 776} {"train_loss": -10.202865600585938, "global_step": 130385, "epoch": 776} {"train_loss": -9.241479873657227, "global_step": 130386, "epoch": 776} {"train_loss": -9.771007537841797, "global_step": 130387, "epoch": 776} {"train_loss": -9.13015365600586, "global_step": 130388, "epoch": 776} {"train_loss": -10.14532470703125, "global_step": 130389, "epoch": 776} {"train_loss": -9.190231323242188, "global_step": 130390, "epoch": 776} {"train_loss": -10.070341110229492, "global_step": 130391, "epoch": 776} {"train_loss": -9.826240539550781, "global_step": 130392, "epoch": 776} {"train_loss": -9.621906280517578, "global_step": 130393, "epoch": 776} {"train_loss": -10.07685661315918, "global_step": 130394, "epoch": 776} {"train_loss": -9.70772933959961, "global_step": 130395, "epoch": 776} {"train_loss": -9.809093475341797, "global_step": 130396, "epoch": 776} {"train_loss": -9.986908912658691, "global_step": 130397, "epoch": 776} {"train_loss": -9.879100799560547, "global_step": 130398, "epoch": 776} {"train_loss": -10.119544982910156, "global_step": 130399, "epoch": 776} {"train_loss": -9.930810928344727, "global_step": 130400, "epoch": 776} {"train_loss": -9.954582214355469, "global_step": 130401, "epoch": 776} {"train_loss": -10.199493408203125, "global_step": 130402, "epoch": 776} {"train_loss": -10.049201965332031, "global_step": 130403, "epoch": 776} {"train_loss": -9.897507667541504, "global_step": 130404, "epoch": 776} {"train_loss": -10.354175567626953, "global_step": 130405, "epoch": 776} {"train_loss": -9.914261817932129, "global_step": 130406, "epoch": 776} {"train_loss": -10.166584014892578, "global_step": 130407, "epoch": 776} {"train_loss": -10.159751892089844, "global_step": 130408, "epoch": 776} {"train_loss": -10.128092765808105, "global_step": 130409, "epoch": 776} {"train_loss": -10.382270812988281, "global_step": 130410, "epoch": 776} {"train_loss": -10.200512886047363, "global_step": 130411, "epoch": 776} {"train_loss": -10.096805572509766, "global_step": 130412, "epoch": 776} {"train_loss": -10.236320495605469, "global_step": 130413, "epoch": 776} {"train_loss": -10.356956481933594, "global_step": 130414, "epoch": 776} {"train_loss": -10.30390739440918, "global_step": 130415, "epoch": 776} {"train_loss": -10.28524398803711, "global_step": 130416, "epoch": 776} {"train_loss": -10.361169815063477, "global_step": 130417, "epoch": 776} {"train_loss": -10.512133598327637, "global_step": 130418, "epoch": 776} {"train_loss": -10.230052947998047, "global_step": 130419, "epoch": 776} {"train_loss": -10.567657470703125, "global_step": 130420, "epoch": 776} {"train_loss": -10.340847969055176, "global_step": 130421, "epoch": 776} {"train_loss": -10.536527633666992, "global_step": 130422, "epoch": 776} {"train_loss": -10.38638687133789, "global_step": 130423, "epoch": 776} {"train_loss": -10.409845352172852, "global_step": 130424, "epoch": 776} {"train_loss": -10.33711051940918, "global_step": 130425, "epoch": 776} {"train_loss": -10.50341796875, "global_step": 130426, "epoch": 776} {"train_loss": -10.47343635559082, "global_step": 130427, "epoch": 776} {"train_loss": -10.44625186920166, "global_step": 130428, "epoch": 776} {"train_loss": -10.487974166870117, "global_step": 130429, "epoch": 776} {"train_loss": -10.474517822265625, "global_step": 130430, "epoch": 776} {"train_loss": -10.293943405151367, "global_step": 130431, "epoch": 776} {"train_loss": -10.646142959594727, "global_step": 130432, "epoch": 776} {"train_loss": -10.601691246032715, "global_step": 130433, "epoch": 776} {"train_loss": -10.624794960021973, "global_step": 130434, "epoch": 776} {"train_loss": -10.581987380981445, "global_step": 130435, "epoch": 776} {"train_loss": -10.318170547485352, "global_step": 130436, "epoch": 776} {"train_loss": -10.450918197631836, "global_step": 130437, "epoch": 776} {"train_loss": -10.439617156982422, "global_step": 130438, "epoch": 776} {"train_loss": -10.21896743774414, "global_step": 130439, "epoch": 776} {"train_loss": -10.437637329101562, "global_step": 130440, "epoch": 776} {"train_loss": -10.696755409240723, "global_step": 130441, "epoch": 776} {"train_loss": -10.237456321716309, "global_step": 130442, "epoch": 776} {"train_loss": -10.43509292602539, "global_step": 130443, "epoch": 776} {"train_loss": -10.485555648803711, "global_step": 130444, "epoch": 776} {"train_loss": -10.512210845947266, "global_step": 130445, "epoch": 776} {"train_loss": -10.47067928314209, "global_step": 130446, "epoch": 776} {"train_loss": -10.521844863891602, "global_step": 130447, "epoch": 776} {"train_loss": -10.412182807922363, "global_step": 130448, "epoch": 776} {"train_loss": -10.593452453613281, "global_step": 130449, "epoch": 776} {"train_loss": -10.557538986206055, "global_step": 130450, "epoch": 776} {"train_loss": -10.55116081237793, "global_step": 130451, "epoch": 776} {"train_loss": -10.750589370727539, "global_step": 130452, "epoch": 776} {"train_loss": -10.2989501953125, "global_step": 130453, "epoch": 776} {"train_loss": -10.513425827026367, "global_step": 130454, "epoch": 776} {"train_loss": -9.987943649291992, "global_step": 130455, "epoch": 776} {"train_loss": -10.562328338623047, "global_step": 130456, "epoch": 776} {"train_loss": -10.317195892333984, "global_step": 130457, "epoch": 776} {"train_loss": -10.45150375366211, "global_step": 130458, "epoch": 776} {"train_loss": -10.400522232055664, "global_step": 130459, "epoch": 776} {"train_loss": -10.444368362426758, "global_step": 130460, "epoch": 776} {"train_loss": -9.813709259033203, "global_step": 130461, "epoch": 776} {"train_loss": -10.38029670715332, "global_step": 130462, "epoch": 776} {"train_loss": -10.226017951965332, "global_step": 130463, "epoch": 776} {"train_loss": -9.892616271972656, "global_step": 130464, "epoch": 776} {"train_loss": -10.569765090942383, "global_step": 130465, "epoch": 776} {"train_loss": -10.208733558654785, "global_step": 130466, "epoch": 776} {"train_loss": -10.208017349243164, "global_step": 130467, "epoch": 776} {"train_loss": -10.154298782348633, "global_step": 130468, "epoch": 776} {"train_loss": -9.76820182800293, "global_step": 130469, "epoch": 776} {"train_loss": -10.38626480102539, "global_step": 130470, "epoch": 776} {"train_loss": -9.962263107299805, "global_step": 130471, "epoch": 776} {"train_loss": -10.561887741088867, "global_step": 130472, "epoch": 776} {"train_loss": -10.202096939086914, "global_step": 130473, "epoch": 776} {"train_loss": -9.675653457641602, "global_step": 130474, "epoch": 776} {"train_loss": -10.41740608215332, "global_step": 130475, "epoch": 776} {"train_loss": -10.280854225158691, "global_step": 130476, "epoch": 776} {"train_loss": -10.34988784790039, "global_step": 130477, "epoch": 776} {"train_loss": -10.54193115234375, "global_step": 130478, "epoch": 776} {"train_loss": -10.137526512145996, "global_step": 130479, "epoch": 776} {"train_loss": -10.442445755004883, "global_step": 130480, "epoch": 776} {"train_loss": -10.425261497497559, "global_step": 130481, "epoch": 776} {"train_loss": -10.081304550170898, "global_step": 130482, "epoch": 776} {"train_loss": -10.3524169921875, "global_step": 130483, "epoch": 776} {"train_loss": -9.737112045288086, "global_step": 130484, "epoch": 776} {"train_loss": -10.465932846069336, "global_step": 130485, "epoch": 776} {"train_loss": -10.146150588989258, "global_step": 130486, "epoch": 776} {"train_loss": -10.294537544250488, "global_step": 130487, "epoch": 776} {"train_loss": -9.93386173248291, "global_step": 130488, "epoch": 776} {"train_loss": -10.0562744140625, "global_step": 130489, "epoch": 776} {"train_loss": -9.89365005493164, "global_step": 130490, "epoch": 776} {"train_loss": -10.238212585449219, "global_step": 130491, "epoch": 776} {"train_loss": -10.111369132995605, "global_step": 130492, "epoch": 776} {"train_loss": -10.106880187988281, "global_step": 130493, "epoch": 776} {"train_loss": -10.188014030456543, "global_step": 130494, "epoch": 776} {"train_loss": -10.427907943725586, "global_step": 130495, "epoch": 776} {"train_loss": -9.938225746154785, "global_step": 130496, "epoch": 776} {"train_loss": -10.288383483886719, "global_step": 130497, "epoch": 776} {"train_loss": -9.920308113098145, "global_step": 130498, "epoch": 776} {"train_loss": -9.67466926574707, "global_step": 130499, "epoch": 776} {"train_loss": -9.679594039916992, "global_step": 130500, "epoch": 776} {"train_loss": -9.633223533630371, "global_step": 130501, "epoch": 776} {"train_loss": -9.580907821655273, "global_step": 130502, "epoch": 776} {"train_loss": -9.813255310058594, "global_step": 130503, "epoch": 776} {"train_loss": -9.421197891235352, "global_step": 130504, "epoch": 776} {"train_loss": -10.260063171386719, "global_step": 130505, "epoch": 776} {"train_loss": -9.733248710632324, "global_step": 130506, "epoch": 776} {"train_loss": -9.747093200683594, "global_step": 130507, "epoch": 776} {"train_loss": -10.104135513305664, "global_step": 130508, "epoch": 776} {"train_loss": -9.92112922668457, "global_step": 130509, "epoch": 776} {"train_loss": -9.865771293640137, "global_step": 130510, "epoch": 776} {"train_loss": -10.334139823913574, "global_step": 130511, "epoch": 776} {"train_loss": -9.856807708740234, "global_step": 130512, "epoch": 776} {"train_loss": -10.277800559997559, "global_step": 130513, "epoch": 776} {"train_loss": -10.153488159179688, "global_step": 130514, "epoch": 776} {"train_loss": -9.993030548095703, "global_step": 130515, "epoch": 776} {"train_loss": -10.192577362060547, "global_step": 130516, "epoch": 776} {"train_loss": -10.366430282592773, "global_step": 130517, "epoch": 776} {"train_loss": -10.076532363891602, "global_step": 130518, "epoch": 776} {"train_loss": -10.324965476989746, "global_step": 130519, "epoch": 776} {"train_loss": -10.292261123657227, "global_step": 130520, "epoch": 776} {"train_loss": -10.218515396118164, "global_step": 130521, "epoch": 776} {"train_loss": -10.376486778259277, "global_step": 130522, "epoch": 776} {"train_loss": -10.380066871643066, "global_step": 130523, "epoch": 776} {"train_loss": -10.370223999023438, "global_step": 130524, "epoch": 776} {"train_loss": -10.642878532409668, "global_step": 130525, "epoch": 776} {"train_loss": -10.200773239135742, "global_step": 130526, "epoch": 776} {"train_loss": -10.476106643676758, "global_step": 130527, "epoch": 776} {"train_loss": -10.425785064697266, "global_step": 130528, "epoch": 776} {"train_loss": -10.231115341186523, "global_step": 130529, "epoch": 776} {"train_loss": -10.30758285522461, "global_step": 130530, "epoch": 776} {"train_loss": -10.389488220214844, "global_step": 130531, "epoch": 776} {"train_loss": -10.423737525939941, "global_step": 130532, "epoch": 776} {"train_loss": -10.466753005981445, "global_step": 130533, "epoch": 776} {"train_loss": -10.4691162109375, "global_step": 130534, "epoch": 776} {"train_loss": -10.15270629950932, "global_step": 130535, "epoch": 776, "val_loss": 221769.1875} {"train_loss": -10.314403533935547, "global_step": 130536, "epoch": 777} {"train_loss": -10.432937622070312, "global_step": 130537, "epoch": 777} {"train_loss": -10.392976760864258, "global_step": 130538, "epoch": 777} {"train_loss": -10.657059669494629, "global_step": 130539, "epoch": 777} {"train_loss": -10.598872184753418, "global_step": 130540, "epoch": 777} {"train_loss": -10.621267318725586, "global_step": 130541, "epoch": 777} {"train_loss": -10.594549179077148, "global_step": 130542, "epoch": 777} {"train_loss": -10.63919448852539, "global_step": 130543, "epoch": 777} {"train_loss": -10.589410781860352, "global_step": 130544, "epoch": 777} {"train_loss": -10.625240325927734, "global_step": 130545, "epoch": 777} {"train_loss": -10.429025650024414, "global_step": 130546, "epoch": 777} {"train_loss": -10.582161903381348, "global_step": 130547, "epoch": 777} {"train_loss": -10.71297836303711, "global_step": 130548, "epoch": 777} {"train_loss": -10.612273216247559, "global_step": 130549, "epoch": 777} {"train_loss": -10.609185218811035, "global_step": 130550, "epoch": 777} {"train_loss": -10.4810152053833, "global_step": 130551, "epoch": 777} {"train_loss": -10.78342342376709, "global_step": 130552, "epoch": 777} {"train_loss": -10.608962059020996, "global_step": 130553, "epoch": 777} {"train_loss": -10.366240501403809, "global_step": 130554, "epoch": 777} {"train_loss": -10.557952880859375, "global_step": 130555, "epoch": 777} {"train_loss": -10.728189468383789, "global_step": 130556, "epoch": 777} {"train_loss": -10.262983322143555, "global_step": 130557, "epoch": 777} {"train_loss": -10.71428108215332, "global_step": 130558, "epoch": 777} {"train_loss": -10.629721641540527, "global_step": 130559, "epoch": 777} {"train_loss": -10.265619277954102, "global_step": 130560, "epoch": 777} {"train_loss": -10.307941436767578, "global_step": 130561, "epoch": 777} {"train_loss": -10.650768280029297, "global_step": 130562, "epoch": 777} {"train_loss": -9.999284744262695, "global_step": 130563, "epoch": 777} {"train_loss": -10.430742263793945, "global_step": 130564, "epoch": 777} {"train_loss": -9.910379409790039, "global_step": 130565, "epoch": 777} {"train_loss": -10.44135856628418, "global_step": 130566, "epoch": 777} {"train_loss": -10.312023162841797, "global_step": 130567, "epoch": 777} {"train_loss": -10.225970268249512, "global_step": 130568, "epoch": 777} {"train_loss": -10.253552436828613, "global_step": 130569, "epoch": 777} {"train_loss": -10.25016975402832, "global_step": 130570, "epoch": 777} {"train_loss": -10.284839630126953, "global_step": 130571, "epoch": 777} {"train_loss": -9.90746784210205, "global_step": 130572, "epoch": 777} {"train_loss": -9.569185256958008, "global_step": 130573, "epoch": 777} {"train_loss": -10.529062271118164, "global_step": 130574, "epoch": 777} {"train_loss": -9.96844482421875, "global_step": 130575, "epoch": 777} {"train_loss": -10.238946914672852, "global_step": 130576, "epoch": 777} {"train_loss": -9.591705322265625, "global_step": 130577, "epoch": 777} {"train_loss": -10.085343360900879, "global_step": 130578, "epoch": 777} {"train_loss": -10.052263259887695, "global_step": 130579, "epoch": 777} {"train_loss": -9.482906341552734, "global_step": 130580, "epoch": 777} {"train_loss": -10.011849403381348, "global_step": 130581, "epoch": 777} {"train_loss": -9.754927635192871, "global_step": 130582, "epoch": 777} {"train_loss": -10.228446960449219, "global_step": 130583, "epoch": 777} {"train_loss": -10.314216613769531, "global_step": 130584, "epoch": 777} {"train_loss": -9.903974533081055, "global_step": 130585, "epoch": 777} {"train_loss": -10.026021957397461, "global_step": 130586, "epoch": 777} {"train_loss": -10.349114418029785, "global_step": 130587, "epoch": 777} {"train_loss": -10.175094604492188, "global_step": 130588, "epoch": 777} {"train_loss": -10.346579551696777, "global_step": 130589, "epoch": 777} {"train_loss": -10.217840194702148, "global_step": 130590, "epoch": 777} {"train_loss": -10.058586120605469, "global_step": 130591, "epoch": 777} {"train_loss": -10.499720573425293, "global_step": 130592, "epoch": 777} {"train_loss": -10.213338851928711, "global_step": 130593, "epoch": 777} {"train_loss": -10.12005615234375, "global_step": 130594, "epoch": 777} {"train_loss": -10.31167984008789, "global_step": 130595, "epoch": 777} {"train_loss": -10.203091621398926, "global_step": 130596, "epoch": 777} {"train_loss": -10.205162048339844, "global_step": 130597, "epoch": 777} {"train_loss": -10.341573715209961, "global_step": 130598, "epoch": 777} {"train_loss": -10.417070388793945, "global_step": 130599, "epoch": 777} {"train_loss": -10.085441589355469, "global_step": 130600, "epoch": 777} {"train_loss": -10.183774948120117, "global_step": 130601, "epoch": 777} {"train_loss": -10.372602462768555, "global_step": 130602, "epoch": 777} {"train_loss": -10.577655792236328, "global_step": 130603, "epoch": 777} {"train_loss": -10.334565162658691, "global_step": 130604, "epoch": 777} {"train_loss": -10.444709777832031, "global_step": 130605, "epoch": 777} {"train_loss": -10.154988288879395, "global_step": 130606, "epoch": 777} {"train_loss": -10.454923629760742, "global_step": 130607, "epoch": 777} {"train_loss": -10.274456977844238, "global_step": 130608, "epoch": 777} {"train_loss": -10.307432174682617, "global_step": 130609, "epoch": 777} {"train_loss": -10.36379337310791, "global_step": 130610, "epoch": 777} {"train_loss": -10.412534713745117, "global_step": 130611, "epoch": 777} {"train_loss": -10.22199821472168, "global_step": 130612, "epoch": 777} {"train_loss": -10.60627269744873, "global_step": 130613, "epoch": 777} {"train_loss": -10.192768096923828, "global_step": 130614, "epoch": 777} {"train_loss": -10.367727279663086, "global_step": 130615, "epoch": 777} {"train_loss": -10.426228523254395, "global_step": 130616, "epoch": 777} {"train_loss": -10.339794158935547, "global_step": 130617, "epoch": 777} {"train_loss": -10.37525749206543, "global_step": 130618, "epoch": 777} {"train_loss": -10.190387725830078, "global_step": 130619, "epoch": 777} {"train_loss": -10.405808448791504, "global_step": 130620, "epoch": 777} {"train_loss": -10.477436065673828, "global_step": 130621, "epoch": 777} {"train_loss": -10.192964553833008, "global_step": 130622, "epoch": 777} {"train_loss": -10.494667053222656, "global_step": 130623, "epoch": 777} {"train_loss": -10.482839584350586, "global_step": 130624, "epoch": 777} {"train_loss": -10.517269134521484, "global_step": 130625, "epoch": 777} {"train_loss": -10.364725112915039, "global_step": 130626, "epoch": 777} {"train_loss": -10.474629402160645, "global_step": 130627, "epoch": 777} {"train_loss": -10.156397819519043, "global_step": 130628, "epoch": 777} {"train_loss": -10.0552339553833, "global_step": 130629, "epoch": 777} {"train_loss": -10.438390731811523, "global_step": 130630, "epoch": 777} {"train_loss": -10.32099437713623, "global_step": 130631, "epoch": 777} {"train_loss": -10.327159881591797, "global_step": 130632, "epoch": 777} {"train_loss": -10.458806991577148, "global_step": 130633, "epoch": 777} {"train_loss": -10.425932884216309, "global_step": 130634, "epoch": 777} {"train_loss": -10.350138664245605, "global_step": 130635, "epoch": 777} {"train_loss": -10.494256973266602, "global_step": 130636, "epoch": 777} {"train_loss": -10.422037124633789, "global_step": 130637, "epoch": 777} {"train_loss": -10.36564826965332, "global_step": 130638, "epoch": 777} {"train_loss": -10.360755920410156, "global_step": 130639, "epoch": 777} {"train_loss": -10.201236724853516, "global_step": 130640, "epoch": 777} {"train_loss": -10.109233856201172, "global_step": 130641, "epoch": 777} {"train_loss": -10.086739540100098, "global_step": 130642, "epoch": 777} {"train_loss": -10.5142240524292, "global_step": 130643, "epoch": 777} {"train_loss": -9.93319320678711, "global_step": 130644, "epoch": 777} {"train_loss": -10.130815505981445, "global_step": 130645, "epoch": 777} {"train_loss": -10.444181442260742, "global_step": 130646, "epoch": 777} {"train_loss": -10.62208366394043, "global_step": 130647, "epoch": 777} {"train_loss": -10.266764640808105, "global_step": 130648, "epoch": 777} {"train_loss": -10.507476806640625, "global_step": 130649, "epoch": 777} {"train_loss": -10.377305030822754, "global_step": 130650, "epoch": 777} {"train_loss": -10.243478775024414, "global_step": 130651, "epoch": 777} {"train_loss": -10.613531112670898, "global_step": 130652, "epoch": 777} {"train_loss": -10.520891189575195, "global_step": 130653, "epoch": 777} {"train_loss": -10.625896453857422, "global_step": 130654, "epoch": 777} {"train_loss": -10.622953414916992, "global_step": 130655, "epoch": 777} {"train_loss": -10.527167320251465, "global_step": 130656, "epoch": 777} {"train_loss": -10.419429779052734, "global_step": 130657, "epoch": 777} {"train_loss": -10.390218734741211, "global_step": 130658, "epoch": 777} {"train_loss": -10.318168640136719, "global_step": 130659, "epoch": 777} {"train_loss": -10.210439682006836, "global_step": 130660, "epoch": 777} {"train_loss": -10.30526351928711, "global_step": 130661, "epoch": 777} {"train_loss": -10.615800857543945, "global_step": 130662, "epoch": 777} {"train_loss": -10.299484252929688, "global_step": 130663, "epoch": 777} {"train_loss": -10.512203216552734, "global_step": 130664, "epoch": 777} {"train_loss": -10.454130172729492, "global_step": 130665, "epoch": 777} {"train_loss": -10.20004653930664, "global_step": 130666, "epoch": 777} {"train_loss": -10.338884353637695, "global_step": 130667, "epoch": 777} {"train_loss": -10.168633460998535, "global_step": 130668, "epoch": 777} {"train_loss": -10.230528831481934, "global_step": 130669, "epoch": 777} {"train_loss": -10.253551483154297, "global_step": 130670, "epoch": 777} {"train_loss": -9.778231620788574, "global_step": 130671, "epoch": 777} {"train_loss": -9.95650863647461, "global_step": 130672, "epoch": 777} {"train_loss": -9.993575096130371, "global_step": 130673, "epoch": 777} {"train_loss": -10.138154983520508, "global_step": 130674, "epoch": 777} {"train_loss": -10.39596939086914, "global_step": 130675, "epoch": 777} {"train_loss": -10.14316463470459, "global_step": 130676, "epoch": 777} {"train_loss": -10.584659576416016, "global_step": 130677, "epoch": 777} {"train_loss": -10.044296264648438, "global_step": 130678, "epoch": 777} {"train_loss": -10.109232902526855, "global_step": 130679, "epoch": 777} {"train_loss": -10.207358360290527, "global_step": 130680, "epoch": 777} {"train_loss": -10.038108825683594, "global_step": 130681, "epoch": 777} {"train_loss": -10.347593307495117, "global_step": 130682, "epoch": 777} {"train_loss": -9.804038047790527, "global_step": 130683, "epoch": 777} {"train_loss": -10.527290344238281, "global_step": 130684, "epoch": 777} {"train_loss": -10.141254425048828, "global_step": 130685, "epoch": 777} {"train_loss": -10.331340789794922, "global_step": 130686, "epoch": 777} {"train_loss": -10.01079273223877, "global_step": 130687, "epoch": 777} {"train_loss": -10.140911102294922, "global_step": 130688, "epoch": 777} {"train_loss": -10.344690322875977, "global_step": 130689, "epoch": 777} {"train_loss": -10.302251815795898, "global_step": 130690, "epoch": 777} {"train_loss": -10.051366806030273, "global_step": 130691, "epoch": 777} {"train_loss": -10.101831436157227, "global_step": 130692, "epoch": 777} {"train_loss": -9.92264175415039, "global_step": 130693, "epoch": 777} {"train_loss": -10.367406845092773, "global_step": 130694, "epoch": 777} {"train_loss": -10.146327018737793, "global_step": 130695, "epoch": 777} {"train_loss": -10.373961448669434, "global_step": 130696, "epoch": 777} {"train_loss": -10.459866523742676, "global_step": 130697, "epoch": 777} {"train_loss": -10.677175521850586, "global_step": 130698, "epoch": 777} {"train_loss": -10.331249237060547, "global_step": 130699, "epoch": 777} {"train_loss": -10.437495231628418, "global_step": 130700, "epoch": 777} {"train_loss": -10.354459762573242, "global_step": 130701, "epoch": 777} {"train_loss": -10.44639778137207, "global_step": 130702, "epoch": 777} {"train_loss": -10.31399538971129, "global_step": 130703, "epoch": 777, "val_loss": 221972.921875} {"train_loss": -10.57633113861084, "global_step": 130704, "epoch": 778} {"train_loss": -10.47384262084961, "global_step": 130705, "epoch": 778} {"train_loss": -10.569195747375488, "global_step": 130706, "epoch": 778} {"train_loss": -10.024457931518555, "global_step": 130707, "epoch": 778} {"train_loss": -10.374296188354492, "global_step": 130708, "epoch": 778} {"train_loss": -10.482051849365234, "global_step": 130709, "epoch": 778} {"train_loss": -10.624553680419922, "global_step": 130710, "epoch": 778} {"train_loss": -10.535480499267578, "global_step": 130711, "epoch": 778} {"train_loss": -10.241682052612305, "global_step": 130712, "epoch": 778} {"train_loss": -10.710068702697754, "global_step": 130713, "epoch": 778} {"train_loss": -10.276132583618164, "global_step": 130714, "epoch": 778} {"train_loss": -10.395517349243164, "global_step": 130715, "epoch": 778} {"train_loss": -10.53194808959961, "global_step": 130716, "epoch": 778} {"train_loss": -10.525063514709473, "global_step": 130717, "epoch": 778} {"train_loss": -10.700628280639648, "global_step": 130718, "epoch": 778} {"train_loss": -10.404476165771484, "global_step": 130719, "epoch": 778} {"train_loss": -10.524277687072754, "global_step": 130720, "epoch": 778} {"train_loss": -10.469669342041016, "global_step": 130721, "epoch": 778} {"train_loss": -10.583986282348633, "global_step": 130722, "epoch": 778} {"train_loss": -10.205584526062012, "global_step": 130723, "epoch": 778} {"train_loss": -10.282801628112793, "global_step": 130724, "epoch": 778} {"train_loss": -10.403608322143555, "global_step": 130725, "epoch": 778} {"train_loss": -9.963518142700195, "global_step": 130726, "epoch": 778} {"train_loss": -10.721271514892578, "global_step": 130727, "epoch": 778} {"train_loss": -10.146017074584961, "global_step": 130728, "epoch": 778} {"train_loss": -10.437653541564941, "global_step": 130729, "epoch": 778} {"train_loss": -10.62846565246582, "global_step": 130730, "epoch": 778} {"train_loss": -10.149657249450684, "global_step": 130731, "epoch": 778} {"train_loss": -10.307307243347168, "global_step": 130732, "epoch": 778} {"train_loss": -10.35226821899414, "global_step": 130733, "epoch": 778} {"train_loss": -10.453816413879395, "global_step": 130734, "epoch": 778} {"train_loss": -10.189157485961914, "global_step": 130735, "epoch": 778} {"train_loss": -10.424915313720703, "global_step": 130736, "epoch": 778} {"train_loss": -10.185138702392578, "global_step": 130737, "epoch": 778} {"train_loss": -10.10283088684082, "global_step": 130738, "epoch": 778} {"train_loss": -10.769475936889648, "global_step": 130739, "epoch": 778} {"train_loss": -10.33749008178711, "global_step": 130740, "epoch": 778} {"train_loss": -10.509603500366211, "global_step": 130741, "epoch": 778} {"train_loss": -10.505123138427734, "global_step": 130742, "epoch": 778} {"train_loss": -10.324590682983398, "global_step": 130743, "epoch": 778} {"train_loss": -10.550291061401367, "global_step": 130744, "epoch": 778} {"train_loss": -10.322321891784668, "global_step": 130745, "epoch": 778} {"train_loss": -10.60061264038086, "global_step": 130746, "epoch": 778} {"train_loss": -10.416749000549316, "global_step": 130747, "epoch": 778} {"train_loss": -10.419376373291016, "global_step": 130748, "epoch": 778} {"train_loss": -10.392902374267578, "global_step": 130749, "epoch": 778} {"train_loss": -10.632223129272461, "global_step": 130750, "epoch": 778} {"train_loss": -10.652876853942871, "global_step": 130751, "epoch": 778} {"train_loss": -10.605559349060059, "global_step": 130752, "epoch": 778} {"train_loss": -10.480867385864258, "global_step": 130753, "epoch": 778} {"train_loss": -10.760592460632324, "global_step": 130754, "epoch": 778} {"train_loss": -10.729808807373047, "global_step": 130755, "epoch": 778} {"train_loss": -10.722715377807617, "global_step": 130756, "epoch": 778} {"train_loss": -10.706766128540039, "global_step": 130757, "epoch": 778} {"train_loss": -10.404691696166992, "global_step": 130758, "epoch": 778} {"train_loss": -10.565479278564453, "global_step": 130759, "epoch": 778} {"train_loss": -10.724054336547852, "global_step": 130760, "epoch": 778} {"train_loss": -10.341014862060547, "global_step": 130761, "epoch": 778} {"train_loss": -10.45490550994873, "global_step": 130762, "epoch": 778} {"train_loss": -10.360269546508789, "global_step": 130763, "epoch": 778} {"train_loss": -10.033201217651367, "global_step": 130764, "epoch": 778} {"train_loss": -9.917838096618652, "global_step": 130765, "epoch": 778} {"train_loss": -10.448261260986328, "global_step": 130766, "epoch": 778} {"train_loss": -9.610852241516113, "global_step": 130767, "epoch": 778} {"train_loss": -9.941793441772461, "global_step": 130768, "epoch": 778} {"train_loss": -9.879297256469727, "global_step": 130769, "epoch": 778} {"train_loss": -10.010259628295898, "global_step": 130770, "epoch": 778} {"train_loss": -10.153654098510742, "global_step": 130771, "epoch": 778} {"train_loss": -9.632965087890625, "global_step": 130772, "epoch": 778} {"train_loss": -10.455706596374512, "global_step": 130773, "epoch": 778} {"train_loss": -10.11353874206543, "global_step": 130774, "epoch": 778} {"train_loss": -9.902816772460938, "global_step": 130775, "epoch": 778} {"train_loss": -10.351272583007812, "global_step": 130776, "epoch": 778} {"train_loss": -10.18738842010498, "global_step": 130777, "epoch": 778} {"train_loss": -10.315817832946777, "global_step": 130778, "epoch": 778} {"train_loss": -9.819076538085938, "global_step": 130779, "epoch": 778} {"train_loss": -10.18984317779541, "global_step": 130780, "epoch": 778} {"train_loss": -9.938215255737305, "global_step": 130781, "epoch": 778} {"train_loss": -9.912137985229492, "global_step": 130782, "epoch": 778} {"train_loss": -9.984865188598633, "global_step": 130783, "epoch": 778} {"train_loss": -9.777151107788086, "global_step": 130784, "epoch": 778} {"train_loss": -10.474079132080078, "global_step": 130785, "epoch": 778} {"train_loss": -9.786747932434082, "global_step": 130786, "epoch": 778} {"train_loss": -9.915079116821289, "global_step": 130787, "epoch": 778} {"train_loss": -10.106550216674805, "global_step": 130788, "epoch": 778} {"train_loss": -9.709123611450195, "global_step": 130789, "epoch": 778} {"train_loss": -10.15694522857666, "global_step": 130790, "epoch": 778} {"train_loss": -10.442956924438477, "global_step": 130791, "epoch": 778} {"train_loss": -9.92918586730957, "global_step": 130792, "epoch": 778} {"train_loss": -10.102054595947266, "global_step": 130793, "epoch": 778} {"train_loss": -10.221139907836914, "global_step": 130794, "epoch": 778} {"train_loss": -10.030195236206055, "global_step": 130795, "epoch": 778} {"train_loss": -9.989156723022461, "global_step": 130796, "epoch": 778} {"train_loss": -10.010381698608398, "global_step": 130797, "epoch": 778} {"train_loss": -9.89171314239502, "global_step": 130798, "epoch": 778} {"train_loss": -10.432083129882812, "global_step": 130799, "epoch": 778} {"train_loss": -9.840859413146973, "global_step": 130800, "epoch": 778} {"train_loss": -9.864137649536133, "global_step": 130801, "epoch": 778} {"train_loss": -10.11654281616211, "global_step": 130802, "epoch": 778} {"train_loss": -10.051803588867188, "global_step": 130803, "epoch": 778} {"train_loss": -10.227788925170898, "global_step": 130804, "epoch": 778} {"train_loss": -10.193746566772461, "global_step": 130805, "epoch": 778} {"train_loss": -10.135194778442383, "global_step": 130806, "epoch": 778} {"train_loss": -10.077308654785156, "global_step": 130807, "epoch": 778} {"train_loss": -10.101024627685547, "global_step": 130808, "epoch": 778} {"train_loss": -10.117765426635742, "global_step": 130809, "epoch": 778} {"train_loss": -10.2711181640625, "global_step": 130810, "epoch": 778} {"train_loss": -10.406148910522461, "global_step": 130811, "epoch": 778} {"train_loss": -10.235803604125977, "global_step": 130812, "epoch": 778} {"train_loss": -10.308903694152832, "global_step": 130813, "epoch": 778} {"train_loss": -10.1905517578125, "global_step": 130814, "epoch": 778} {"train_loss": -10.353123664855957, "global_step": 130815, "epoch": 778} {"train_loss": -9.989303588867188, "global_step": 130816, "epoch": 778} {"train_loss": -10.39162540435791, "global_step": 130817, "epoch": 778} {"train_loss": -10.284893035888672, "global_step": 130818, "epoch": 778} {"train_loss": -10.191701889038086, "global_step": 130819, "epoch": 778} {"train_loss": -10.399328231811523, "global_step": 130820, "epoch": 778} {"train_loss": -10.389605522155762, "global_step": 130821, "epoch": 778} {"train_loss": -10.528129577636719, "global_step": 130822, "epoch": 778} {"train_loss": -10.351813316345215, "global_step": 130823, "epoch": 778} {"train_loss": -10.328132629394531, "global_step": 130824, "epoch": 778} {"train_loss": -10.484533309936523, "global_step": 130825, "epoch": 778} {"train_loss": -10.37861442565918, "global_step": 130826, "epoch": 778} {"train_loss": -10.36329174041748, "global_step": 130827, "epoch": 778} {"train_loss": -10.422894477844238, "global_step": 130828, "epoch": 778} {"train_loss": -10.332873344421387, "global_step": 130829, "epoch": 778} {"train_loss": -10.392439842224121, "global_step": 130830, "epoch": 778} {"train_loss": -10.486676216125488, "global_step": 130831, "epoch": 778} {"train_loss": -10.448705673217773, "global_step": 130832, "epoch": 778} {"train_loss": -10.63951587677002, "global_step": 130833, "epoch": 778} {"train_loss": -10.45730209350586, "global_step": 130834, "epoch": 778} {"train_loss": -10.644662857055664, "global_step": 130835, "epoch": 778} {"train_loss": -10.651166915893555, "global_step": 130836, "epoch": 778} {"train_loss": -10.558494567871094, "global_step": 130837, "epoch": 778} {"train_loss": -10.548215866088867, "global_step": 130838, "epoch": 778} {"train_loss": -10.401683807373047, "global_step": 130839, "epoch": 778} {"train_loss": -10.387797355651855, "global_step": 130840, "epoch": 778} {"train_loss": -10.323338508605957, "global_step": 130841, "epoch": 778} {"train_loss": -10.07147216796875, "global_step": 130842, "epoch": 778} {"train_loss": -10.50240421295166, "global_step": 130843, "epoch": 778} {"train_loss": -10.637453079223633, "global_step": 130844, "epoch": 778} {"train_loss": -10.304191589355469, "global_step": 130845, "epoch": 778} {"train_loss": -10.592592239379883, "global_step": 130846, "epoch": 778} {"train_loss": -10.237665176391602, "global_step": 130847, "epoch": 778} {"train_loss": -10.116429328918457, "global_step": 130848, "epoch": 778} {"train_loss": -10.367591857910156, "global_step": 130849, "epoch": 778} {"train_loss": -10.565675735473633, "global_step": 130850, "epoch": 778} {"train_loss": -10.511462211608887, "global_step": 130851, "epoch": 778} {"train_loss": -10.348443984985352, "global_step": 130852, "epoch": 778} {"train_loss": -10.447744369506836, "global_step": 130853, "epoch": 778} {"train_loss": -10.328313827514648, "global_step": 130854, "epoch": 778} {"train_loss": -10.620783805847168, "global_step": 130855, "epoch": 778} {"train_loss": -10.815824508666992, "global_step": 130856, "epoch": 778} {"train_loss": -10.680315971374512, "global_step": 130857, "epoch": 778} {"train_loss": -10.244051933288574, "global_step": 130858, "epoch": 778} {"train_loss": -10.59286117553711, "global_step": 130859, "epoch": 778} {"train_loss": -10.45184326171875, "global_step": 130860, "epoch": 778} {"train_loss": -10.407288551330566, "global_step": 130861, "epoch": 778} {"train_loss": -10.732545852661133, "global_step": 130862, "epoch": 778} {"train_loss": -10.506492614746094, "global_step": 130863, "epoch": 778} {"train_loss": -10.687614440917969, "global_step": 130864, "epoch": 778} {"train_loss": -10.633041381835938, "global_step": 130865, "epoch": 778} {"train_loss": -10.493014335632324, "global_step": 130866, "epoch": 778} {"train_loss": -10.595245361328125, "global_step": 130867, "epoch": 778} {"train_loss": -10.368770599365234, "global_step": 130868, "epoch": 778} {"train_loss": -10.243453025817871, "global_step": 130869, "epoch": 778} {"train_loss": -10.648746490478516, "global_step": 130870, "epoch": 778} {"train_loss": -10.336541232608614, "global_step": 130871, "epoch": 778, "val_loss": 220082.703125} {"train_loss": -10.45615291595459, "global_step": 130872, "epoch": 779} {"train_loss": -10.705890655517578, "global_step": 130873, "epoch": 779} {"train_loss": -10.67001724243164, "global_step": 130874, "epoch": 779} {"train_loss": -10.58298397064209, "global_step": 130875, "epoch": 779} {"train_loss": -10.650705337524414, "global_step": 130876, "epoch": 779} {"train_loss": -10.61916446685791, "global_step": 130877, "epoch": 779} {"train_loss": -10.572718620300293, "global_step": 130878, "epoch": 779} {"train_loss": -10.535840034484863, "global_step": 130879, "epoch": 779} {"train_loss": -10.468864440917969, "global_step": 130880, "epoch": 779} {"train_loss": -10.335695266723633, "global_step": 130881, "epoch": 779} {"train_loss": -10.421615600585938, "global_step": 130882, "epoch": 779} {"train_loss": -10.592329025268555, "global_step": 130883, "epoch": 779} {"train_loss": -9.942981719970703, "global_step": 130884, "epoch": 779} {"train_loss": -10.378857612609863, "global_step": 130885, "epoch": 779} {"train_loss": -9.636117935180664, "global_step": 130886, "epoch": 779} {"train_loss": -9.660744667053223, "global_step": 130887, "epoch": 779} {"train_loss": -10.325705528259277, "global_step": 130888, "epoch": 779} {"train_loss": -9.903448104858398, "global_step": 130889, "epoch": 779} {"train_loss": -10.276124954223633, "global_step": 130890, "epoch": 779} {"train_loss": -9.762003898620605, "global_step": 130891, "epoch": 779} {"train_loss": -9.811988830566406, "global_step": 130892, "epoch": 779} {"train_loss": -10.300191879272461, "global_step": 130893, "epoch": 779} {"train_loss": -9.93398666381836, "global_step": 130894, "epoch": 779} {"train_loss": -10.460012435913086, "global_step": 130895, "epoch": 779} {"train_loss": -10.07579231262207, "global_step": 130896, "epoch": 779} {"train_loss": -10.061507225036621, "global_step": 130897, "epoch": 779} {"train_loss": -10.311559677124023, "global_step": 130898, "epoch": 779} {"train_loss": -10.09225845336914, "global_step": 130899, "epoch": 779} {"train_loss": -10.196064949035645, "global_step": 130900, "epoch": 779} {"train_loss": -10.38509750366211, "global_step": 130901, "epoch": 779} {"train_loss": -10.235696792602539, "global_step": 130902, "epoch": 779} {"train_loss": -10.589967727661133, "global_step": 130903, "epoch": 779} {"train_loss": -10.513206481933594, "global_step": 130904, "epoch": 779} {"train_loss": -10.199089050292969, "global_step": 130905, "epoch": 779} {"train_loss": -10.497845649719238, "global_step": 130906, "epoch": 779} {"train_loss": -10.366819381713867, "global_step": 130907, "epoch": 779} {"train_loss": -10.162599563598633, "global_step": 130908, "epoch": 779} {"train_loss": -10.370914459228516, "global_step": 130909, "epoch": 779} {"train_loss": -10.318144798278809, "global_step": 130910, "epoch": 779} {"train_loss": -10.200592994689941, "global_step": 130911, "epoch": 779} {"train_loss": -10.53972053527832, "global_step": 130912, "epoch": 779} {"train_loss": -10.315515518188477, "global_step": 130913, "epoch": 779} {"train_loss": -10.34151840209961, "global_step": 130914, "epoch": 779} {"train_loss": -10.601058959960938, "global_step": 130915, "epoch": 779} {"train_loss": -10.486862182617188, "global_step": 130916, "epoch": 779} {"train_loss": -10.392998695373535, "global_step": 130917, "epoch": 779} {"train_loss": -10.3046875, "global_step": 130918, "epoch": 779} {"train_loss": -10.382225036621094, "global_step": 130919, "epoch": 779} {"train_loss": -10.345767974853516, "global_step": 130920, "epoch": 779} {"train_loss": -10.646284103393555, "global_step": 130921, "epoch": 779} {"train_loss": -10.196362495422363, "global_step": 130922, "epoch": 779} {"train_loss": -10.420040130615234, "global_step": 130923, "epoch": 779} {"train_loss": -10.406732559204102, "global_step": 130924, "epoch": 779} {"train_loss": -9.9996976852417, "global_step": 130925, "epoch": 779} {"train_loss": -10.529402732849121, "global_step": 130926, "epoch": 779} {"train_loss": -10.399592399597168, "global_step": 130927, "epoch": 779} {"train_loss": -10.279996871948242, "global_step": 130928, "epoch": 779} {"train_loss": -10.405425071716309, "global_step": 130929, "epoch": 779} {"train_loss": -10.447887420654297, "global_step": 130930, "epoch": 779} {"train_loss": -9.99364185333252, "global_step": 130931, "epoch": 779} {"train_loss": -10.226064682006836, "global_step": 130932, "epoch": 779} {"train_loss": -10.3202486038208, "global_step": 130933, "epoch": 779} {"train_loss": -10.14916706085205, "global_step": 130934, "epoch": 779} {"train_loss": -10.245278358459473, "global_step": 130935, "epoch": 779} {"train_loss": -10.375429153442383, "global_step": 130936, "epoch": 779} {"train_loss": -10.240612030029297, "global_step": 130937, "epoch": 779} {"train_loss": -10.272907257080078, "global_step": 130938, "epoch": 779} {"train_loss": -10.124859809875488, "global_step": 130939, "epoch": 779} {"train_loss": -10.364959716796875, "global_step": 130940, "epoch": 779} {"train_loss": -9.880656242370605, "global_step": 130941, "epoch": 779} {"train_loss": -10.181236267089844, "global_step": 130942, "epoch": 779} {"train_loss": -10.51921272277832, "global_step": 130943, "epoch": 779} {"train_loss": -10.038310050964355, "global_step": 130944, "epoch": 779} {"train_loss": -10.13232707977295, "global_step": 130945, "epoch": 779} {"train_loss": -9.766092300415039, "global_step": 130946, "epoch": 779} {"train_loss": -10.455448150634766, "global_step": 130947, "epoch": 779} {"train_loss": -9.891902923583984, "global_step": 130948, "epoch": 779} {"train_loss": -10.325424194335938, "global_step": 130949, "epoch": 779} {"train_loss": -9.86934757232666, "global_step": 130950, "epoch": 779} {"train_loss": -10.262613296508789, "global_step": 130951, "epoch": 779} {"train_loss": -10.111456871032715, "global_step": 130952, "epoch": 779} {"train_loss": -10.518930435180664, "global_step": 130953, "epoch": 779} {"train_loss": -10.090690612792969, "global_step": 130954, "epoch": 779} {"train_loss": -10.23481273651123, "global_step": 130955, "epoch": 779} {"train_loss": -10.315496444702148, "global_step": 130956, "epoch": 779} {"train_loss": -10.048405647277832, "global_step": 130957, "epoch": 779} {"train_loss": -10.403807640075684, "global_step": 130958, "epoch": 779} {"train_loss": -10.467748641967773, "global_step": 130959, "epoch": 779} {"train_loss": -10.534378051757812, "global_step": 130960, "epoch": 779} {"train_loss": -10.250420570373535, "global_step": 130961, "epoch": 779} {"train_loss": -10.530864715576172, "global_step": 130962, "epoch": 779} {"train_loss": -10.209151268005371, "global_step": 130963, "epoch": 779} {"train_loss": -10.29737663269043, "global_step": 130964, "epoch": 779} {"train_loss": -10.326905250549316, "global_step": 130965, "epoch": 779} {"train_loss": -10.39957046508789, "global_step": 130966, "epoch": 779} {"train_loss": -10.626311302185059, "global_step": 130967, "epoch": 779} {"train_loss": -10.438518524169922, "global_step": 130968, "epoch": 779} {"train_loss": -10.420438766479492, "global_step": 130969, "epoch": 779} {"train_loss": -10.36149787902832, "global_step": 130970, "epoch": 779} {"train_loss": -10.568521499633789, "global_step": 130971, "epoch": 779} {"train_loss": -10.577808380126953, "global_step": 130972, "epoch": 779} {"train_loss": -10.424100875854492, "global_step": 130973, "epoch": 779} {"train_loss": -10.421669960021973, "global_step": 130974, "epoch": 779} {"train_loss": -10.39944839477539, "global_step": 130975, "epoch": 779} {"train_loss": -10.533342361450195, "global_step": 130976, "epoch": 779} {"train_loss": -10.664037704467773, "global_step": 130977, "epoch": 779} {"train_loss": -10.544194221496582, "global_step": 130978, "epoch": 779} {"train_loss": -10.317928314208984, "global_step": 130979, "epoch": 779} {"train_loss": -10.742578506469727, "global_step": 130980, "epoch": 779} {"train_loss": -10.491179466247559, "global_step": 130981, "epoch": 779} {"train_loss": -10.807968139648438, "global_step": 130982, "epoch": 779} {"train_loss": -10.530529022216797, "global_step": 130983, "epoch": 779} {"train_loss": -10.309365272521973, "global_step": 130984, "epoch": 779} {"train_loss": -10.601245880126953, "global_step": 130985, "epoch": 779} {"train_loss": -10.634176254272461, "global_step": 130986, "epoch": 779} {"train_loss": -10.437030792236328, "global_step": 130987, "epoch": 779} {"train_loss": -10.481918334960938, "global_step": 130988, "epoch": 779} {"train_loss": -10.587669372558594, "global_step": 130989, "epoch": 779} {"train_loss": -10.235520362854004, "global_step": 130990, "epoch": 779} {"train_loss": -10.51198959350586, "global_step": 130991, "epoch": 779} {"train_loss": -10.63479995727539, "global_step": 130992, "epoch": 779} {"train_loss": -10.186100006103516, "global_step": 130993, "epoch": 779} {"train_loss": -10.551904678344727, "global_step": 130994, "epoch": 779} {"train_loss": -10.622030258178711, "global_step": 130995, "epoch": 779} {"train_loss": -10.297943115234375, "global_step": 130996, "epoch": 779} {"train_loss": -9.754463195800781, "global_step": 130997, "epoch": 779} {"train_loss": -10.397605895996094, "global_step": 130998, "epoch": 779} {"train_loss": -9.529104232788086, "global_step": 130999, "epoch": 779} {"train_loss": -9.610766410827637, "global_step": 131000, "epoch": 779} {"train_loss": -10.348836898803711, "global_step": 131001, "epoch": 779} {"train_loss": -9.776402473449707, "global_step": 131002, "epoch": 779} {"train_loss": -9.64363956451416, "global_step": 131003, "epoch": 779} {"train_loss": -10.200480461120605, "global_step": 131004, "epoch": 779} {"train_loss": -10.242891311645508, "global_step": 131005, "epoch": 779} {"train_loss": -10.102739334106445, "global_step": 131006, "epoch": 779} {"train_loss": -10.503406524658203, "global_step": 131007, "epoch": 779} {"train_loss": -10.079694747924805, "global_step": 131008, "epoch": 779} {"train_loss": -10.01819896697998, "global_step": 131009, "epoch": 779} {"train_loss": -10.158843994140625, "global_step": 131010, "epoch": 779} {"train_loss": -10.417401313781738, "global_step": 131011, "epoch": 779} {"train_loss": -10.211426734924316, "global_step": 131012, "epoch": 779} {"train_loss": -10.060356140136719, "global_step": 131013, "epoch": 779} {"train_loss": -10.34585189819336, "global_step": 131014, "epoch": 779} {"train_loss": -10.428779602050781, "global_step": 131015, "epoch": 779} {"train_loss": -10.215566635131836, "global_step": 131016, "epoch": 779} {"train_loss": -10.18472957611084, "global_step": 131017, "epoch": 779} {"train_loss": -10.395940780639648, "global_step": 131018, "epoch": 779} {"train_loss": -10.33825969696045, "global_step": 131019, "epoch": 779} {"train_loss": -10.475383758544922, "global_step": 131020, "epoch": 779} {"train_loss": -10.44471549987793, "global_step": 131021, "epoch": 779} {"train_loss": -10.39654541015625, "global_step": 131022, "epoch": 779} {"train_loss": -10.535905838012695, "global_step": 131023, "epoch": 779} {"train_loss": -10.381089210510254, "global_step": 131024, "epoch": 779} {"train_loss": -10.324097633361816, "global_step": 131025, "epoch": 779} {"train_loss": -10.516898155212402, "global_step": 131026, "epoch": 779} {"train_loss": -10.335838317871094, "global_step": 131027, "epoch": 779} {"train_loss": -10.527116775512695, "global_step": 131028, "epoch": 779} {"train_loss": -10.49239444732666, "global_step": 131029, "epoch": 779} {"train_loss": -10.496089935302734, "global_step": 131030, "epoch": 779} {"train_loss": -10.474181175231934, "global_step": 131031, "epoch": 779} {"train_loss": -10.582655906677246, "global_step": 131032, "epoch": 779} {"train_loss": -10.373421669006348, "global_step": 131033, "epoch": 779} {"train_loss": -10.285642623901367, "global_step": 131034, "epoch": 779} {"train_loss": -10.605489730834961, "global_step": 131035, "epoch": 779} {"train_loss": -10.56387710571289, "global_step": 131036, "epoch": 779} {"train_loss": -10.530275344848633, "global_step": 131037, "epoch": 779} {"train_loss": -10.71257495880127, "global_step": 131038, "epoch": 779} {"train_loss": -10.327230697586423, "global_step": 131039, "epoch": 779, "val_loss": 220895.34375} {"train_loss": -10.809814453125, "global_step": 131040, "epoch": 780} {"train_loss": -10.644559860229492, "global_step": 131041, "epoch": 780} {"train_loss": -10.83839225769043, "global_step": 131042, "epoch": 780} {"train_loss": -10.493081092834473, "global_step": 131043, "epoch": 780} {"train_loss": -10.615852355957031, "global_step": 131044, "epoch": 780} {"train_loss": -10.336015701293945, "global_step": 131045, "epoch": 780} {"train_loss": -10.467348098754883, "global_step": 131046, "epoch": 780} {"train_loss": -10.523836135864258, "global_step": 131047, "epoch": 780} {"train_loss": -10.65279483795166, "global_step": 131048, "epoch": 780} {"train_loss": -10.383996963500977, "global_step": 131049, "epoch": 780} {"train_loss": -10.227119445800781, "global_step": 131050, "epoch": 780} {"train_loss": -10.334491729736328, "global_step": 131051, "epoch": 780} {"train_loss": -10.258390426635742, "global_step": 131052, "epoch": 780} {"train_loss": -10.148569107055664, "global_step": 131053, "epoch": 780} {"train_loss": -10.284529685974121, "global_step": 131054, "epoch": 780} {"train_loss": -9.934579849243164, "global_step": 131055, "epoch": 780} {"train_loss": -10.6719970703125, "global_step": 131056, "epoch": 780} {"train_loss": -9.891554832458496, "global_step": 131057, "epoch": 780} {"train_loss": -10.538972854614258, "global_step": 131058, "epoch": 780} {"train_loss": -10.248030662536621, "global_step": 131059, "epoch": 780} {"train_loss": -10.352765083312988, "global_step": 131060, "epoch": 780} {"train_loss": -10.428473472595215, "global_step": 131061, "epoch": 780} {"train_loss": -10.19925594329834, "global_step": 131062, "epoch": 780} {"train_loss": -10.195087432861328, "global_step": 131063, "epoch": 780} {"train_loss": -10.526429176330566, "global_step": 131064, "epoch": 780} {"train_loss": -10.282512664794922, "global_step": 131065, "epoch": 780} {"train_loss": -10.107677459716797, "global_step": 131066, "epoch": 780} {"train_loss": -10.416086196899414, "global_step": 131067, "epoch": 780} {"train_loss": -10.431424140930176, "global_step": 131068, "epoch": 780} {"train_loss": -10.475915908813477, "global_step": 131069, "epoch": 780} {"train_loss": -10.811946868896484, "global_step": 131070, "epoch": 780} {"train_loss": -10.733516693115234, "global_step": 131071, "epoch": 780} {"train_loss": -10.461804389953613, "global_step": 131072, "epoch": 780} {"train_loss": -10.473085403442383, "global_step": 131073, "epoch": 780} {"train_loss": -10.592509269714355, "global_step": 131074, "epoch": 780} {"train_loss": -10.488086700439453, "global_step": 131075, "epoch": 780} {"train_loss": -10.642728805541992, "global_step": 131076, "epoch": 780} {"train_loss": -10.568999290466309, "global_step": 131077, "epoch": 780} {"train_loss": -10.56148624420166, "global_step": 131078, "epoch": 780} {"train_loss": -10.535734176635742, "global_step": 131079, "epoch": 780} {"train_loss": -10.641005516052246, "global_step": 131080, "epoch": 780} {"train_loss": -10.616125106811523, "global_step": 131081, "epoch": 780} {"train_loss": -10.508312225341797, "global_step": 131082, "epoch": 780} {"train_loss": -10.282350540161133, "global_step": 131083, "epoch": 780} {"train_loss": -10.535752296447754, "global_step": 131084, "epoch": 780} {"train_loss": -10.415582656860352, "global_step": 131085, "epoch": 780} {"train_loss": -10.45840835571289, "global_step": 131086, "epoch": 780} {"train_loss": -10.551702499389648, "global_step": 131087, "epoch": 780} {"train_loss": -10.425933837890625, "global_step": 131088, "epoch": 780} {"train_loss": -10.330657958984375, "global_step": 131089, "epoch": 780} {"train_loss": -10.151899337768555, "global_step": 131090, "epoch": 780} {"train_loss": -10.490588188171387, "global_step": 131091, "epoch": 780} {"train_loss": -10.249809265136719, "global_step": 131092, "epoch": 780} {"train_loss": -10.552396774291992, "global_step": 131093, "epoch": 780} {"train_loss": -10.054893493652344, "global_step": 131094, "epoch": 780} {"train_loss": -10.486963272094727, "global_step": 131095, "epoch": 780} {"train_loss": -10.49919319152832, "global_step": 131096, "epoch": 780} {"train_loss": -10.28739070892334, "global_step": 131097, "epoch": 780} {"train_loss": -9.836833953857422, "global_step": 131098, "epoch": 780} {"train_loss": -10.34347915649414, "global_step": 131099, "epoch": 780} {"train_loss": -10.46583366394043, "global_step": 131100, "epoch": 780} {"train_loss": -10.189016342163086, "global_step": 131101, "epoch": 780} {"train_loss": -10.353500366210938, "global_step": 131102, "epoch": 780} {"train_loss": -10.729722023010254, "global_step": 131103, "epoch": 780} {"train_loss": -10.481664657592773, "global_step": 131104, "epoch": 780} {"train_loss": -9.741569519042969, "global_step": 131105, "epoch": 780} {"train_loss": -10.428569793701172, "global_step": 131106, "epoch": 780} {"train_loss": -9.739423751831055, "global_step": 131107, "epoch": 780} {"train_loss": -10.507743835449219, "global_step": 131108, "epoch": 780} {"train_loss": -10.104520797729492, "global_step": 131109, "epoch": 780} {"train_loss": -10.411340713500977, "global_step": 131110, "epoch": 780} {"train_loss": -10.076057434082031, "global_step": 131111, "epoch": 780} {"train_loss": -10.40074348449707, "global_step": 131112, "epoch": 780} {"train_loss": -10.333250999450684, "global_step": 131113, "epoch": 780} {"train_loss": -10.017938613891602, "global_step": 131114, "epoch": 780} {"train_loss": -10.389768600463867, "global_step": 131115, "epoch": 780} {"train_loss": -9.860361099243164, "global_step": 131116, "epoch": 780} {"train_loss": -10.318653106689453, "global_step": 131117, "epoch": 780} {"train_loss": -10.337392807006836, "global_step": 131118, "epoch": 780} {"train_loss": -9.403989791870117, "global_step": 131119, "epoch": 780} {"train_loss": -10.32510757446289, "global_step": 131120, "epoch": 780} {"train_loss": -9.44194221496582, "global_step": 131121, "epoch": 780} {"train_loss": -10.10739517211914, "global_step": 131122, "epoch": 780} {"train_loss": -10.325348854064941, "global_step": 131123, "epoch": 780} {"train_loss": -9.842133522033691, "global_step": 131124, "epoch": 780} {"train_loss": -10.29301929473877, "global_step": 131125, "epoch": 780} {"train_loss": -10.1744384765625, "global_step": 131126, "epoch": 780} {"train_loss": -9.858304977416992, "global_step": 131127, "epoch": 780} {"train_loss": -10.485865592956543, "global_step": 131128, "epoch": 780} {"train_loss": -10.475564002990723, "global_step": 131129, "epoch": 780} {"train_loss": -9.96276569366455, "global_step": 131130, "epoch": 780} {"train_loss": -10.347118377685547, "global_step": 131131, "epoch": 780} {"train_loss": -10.038187026977539, "global_step": 131132, "epoch": 780} {"train_loss": -10.158027648925781, "global_step": 131133, "epoch": 780} {"train_loss": -10.483488082885742, "global_step": 131134, "epoch": 780} {"train_loss": -9.83899211883545, "global_step": 131135, "epoch": 780} {"train_loss": -10.261541366577148, "global_step": 131136, "epoch": 780} {"train_loss": -9.999397277832031, "global_step": 131137, "epoch": 780} {"train_loss": -10.222136497497559, "global_step": 131138, "epoch": 780} {"train_loss": -9.92245864868164, "global_step": 131139, "epoch": 780} {"train_loss": -10.398908615112305, "global_step": 131140, "epoch": 780} {"train_loss": -10.196906089782715, "global_step": 131141, "epoch": 780} {"train_loss": -10.254343032836914, "global_step": 131142, "epoch": 780} {"train_loss": -10.179157257080078, "global_step": 131143, "epoch": 780} {"train_loss": -10.120098114013672, "global_step": 131144, "epoch": 780} {"train_loss": -10.359582901000977, "global_step": 131145, "epoch": 780} {"train_loss": -10.301813125610352, "global_step": 131146, "epoch": 780} {"train_loss": -10.378081321716309, "global_step": 131147, "epoch": 780} {"train_loss": -10.041223526000977, "global_step": 131148, "epoch": 780} {"train_loss": -10.372363090515137, "global_step": 131149, "epoch": 780} {"train_loss": -10.437911987304688, "global_step": 131150, "epoch": 780} {"train_loss": -10.302186012268066, "global_step": 131151, "epoch": 780} {"train_loss": -10.574203491210938, "global_step": 131152, "epoch": 780} {"train_loss": -10.21498966217041, "global_step": 131153, "epoch": 780} {"train_loss": -10.51576042175293, "global_step": 131154, "epoch": 780} {"train_loss": -10.298954010009766, "global_step": 131155, "epoch": 780} {"train_loss": -10.587815284729004, "global_step": 131156, "epoch": 780} {"train_loss": -10.508077621459961, "global_step": 131157, "epoch": 780} {"train_loss": -10.578512191772461, "global_step": 131158, "epoch": 780} {"train_loss": -10.459064483642578, "global_step": 131159, "epoch": 780} {"train_loss": -10.52242660522461, "global_step": 131160, "epoch": 780} {"train_loss": -10.612520217895508, "global_step": 131161, "epoch": 780} {"train_loss": -10.604296684265137, "global_step": 131162, "epoch": 780} {"train_loss": -10.566211700439453, "global_step": 131163, "epoch": 780} {"train_loss": -10.445924758911133, "global_step": 131164, "epoch": 780} {"train_loss": -10.45155143737793, "global_step": 131165, "epoch": 780} {"train_loss": -10.216119766235352, "global_step": 131166, "epoch": 780} {"train_loss": -10.603352546691895, "global_step": 131167, "epoch": 780} {"train_loss": -10.47126293182373, "global_step": 131168, "epoch": 780} {"train_loss": -10.616543769836426, "global_step": 131169, "epoch": 780} {"train_loss": -10.639896392822266, "global_step": 131170, "epoch": 780} {"train_loss": -10.581279754638672, "global_step": 131171, "epoch": 780} {"train_loss": -10.707305908203125, "global_step": 131172, "epoch": 780} {"train_loss": -10.604578018188477, "global_step": 131173, "epoch": 780} {"train_loss": -10.527563095092773, "global_step": 131174, "epoch": 780} {"train_loss": -10.59393310546875, "global_step": 131175, "epoch": 780} {"train_loss": -10.481644630432129, "global_step": 131176, "epoch": 780} {"train_loss": -10.822494506835938, "global_step": 131177, "epoch": 780} {"train_loss": -10.451687812805176, "global_step": 131178, "epoch": 780} {"train_loss": -10.307479858398438, "global_step": 131179, "epoch": 780} {"train_loss": -10.722786903381348, "global_step": 131180, "epoch": 780} {"train_loss": -10.482603073120117, "global_step": 131181, "epoch": 780} {"train_loss": -10.725191116333008, "global_step": 131182, "epoch": 780} {"train_loss": -10.323939323425293, "global_step": 131183, "epoch": 780} {"train_loss": -10.23497486114502, "global_step": 131184, "epoch": 780} {"train_loss": -10.291563987731934, "global_step": 131185, "epoch": 780} {"train_loss": -10.311593055725098, "global_step": 131186, "epoch": 780} {"train_loss": -10.497591018676758, "global_step": 131187, "epoch": 780} {"train_loss": -10.270158767700195, "global_step": 131188, "epoch": 780} {"train_loss": -10.258939743041992, "global_step": 131189, "epoch": 780} {"train_loss": -10.425567626953125, "global_step": 131190, "epoch": 780} {"train_loss": -10.340097427368164, "global_step": 131191, "epoch": 780} {"train_loss": -10.194751739501953, "global_step": 131192, "epoch": 780} {"train_loss": -9.635924339294434, "global_step": 131193, "epoch": 780} {"train_loss": -10.374629020690918, "global_step": 131194, "epoch": 780} {"train_loss": -9.684553146362305, "global_step": 131195, "epoch": 780} {"train_loss": -9.997669219970703, "global_step": 131196, "epoch": 780} {"train_loss": -10.33798885345459, "global_step": 131197, "epoch": 780} {"train_loss": -9.93234634399414, "global_step": 131198, "epoch": 780} {"train_loss": -10.024063110351562, "global_step": 131199, "epoch": 780} {"train_loss": -10.233732223510742, "global_step": 131200, "epoch": 780} {"train_loss": -10.044096946716309, "global_step": 131201, "epoch": 780} {"train_loss": -10.023127555847168, "global_step": 131202, "epoch": 780} {"train_loss": -10.430923461914062, "global_step": 131203, "epoch": 780} {"train_loss": -10.19235610961914, "global_step": 131204, "epoch": 780} {"train_loss": -10.256126403808594, "global_step": 131205, "epoch": 780} {"train_loss": -9.910093307495117, "global_step": 131206, "epoch": 780} {"train_loss": -10.339230622564044, "global_step": 131207, "epoch": 780, "val_loss": 219470.21875, "train_action_mse_error": 0.9820040464401245} {"train_loss": -9.276573181152344, "global_step": 131208, "epoch": 781} {"train_loss": -10.37654972076416, "global_step": 131209, "epoch": 781} {"train_loss": -10.040560722351074, "global_step": 131210, "epoch": 781} {"train_loss": -10.055159568786621, "global_step": 131211, "epoch": 781} {"train_loss": -9.677423477172852, "global_step": 131212, "epoch": 781} {"train_loss": -9.925056457519531, "global_step": 131213, "epoch": 781} {"train_loss": -9.230472564697266, "global_step": 131214, "epoch": 781} {"train_loss": -10.115228652954102, "global_step": 131215, "epoch": 781} {"train_loss": -9.714887619018555, "global_step": 131216, "epoch": 781} {"train_loss": -10.322712898254395, "global_step": 131217, "epoch": 781} {"train_loss": -9.79200553894043, "global_step": 131218, "epoch": 781} {"train_loss": -10.025586128234863, "global_step": 131219, "epoch": 781} {"train_loss": -9.995975494384766, "global_step": 131220, "epoch": 781} {"train_loss": -10.158841133117676, "global_step": 131221, "epoch": 781} {"train_loss": -10.304376602172852, "global_step": 131222, "epoch": 781} {"train_loss": -9.806702613830566, "global_step": 131223, "epoch": 781} {"train_loss": -10.359648704528809, "global_step": 131224, "epoch": 781} {"train_loss": -9.995660781860352, "global_step": 131225, "epoch": 781} {"train_loss": -10.02283000946045, "global_step": 131226, "epoch": 781} {"train_loss": -10.199974060058594, "global_step": 131227, "epoch": 781} {"train_loss": -10.23342514038086, "global_step": 131228, "epoch": 781} {"train_loss": -10.222855567932129, "global_step": 131229, "epoch": 781} {"train_loss": -10.118307113647461, "global_step": 131230, "epoch": 781} {"train_loss": -10.565732955932617, "global_step": 131231, "epoch": 781} {"train_loss": -10.226709365844727, "global_step": 131232, "epoch": 781} {"train_loss": -10.23214054107666, "global_step": 131233, "epoch": 781} {"train_loss": -10.294087409973145, "global_step": 131234, "epoch": 781} {"train_loss": -10.408936500549316, "global_step": 131235, "epoch": 781} {"train_loss": -10.214022636413574, "global_step": 131236, "epoch": 781} {"train_loss": -10.400787353515625, "global_step": 131237, "epoch": 781} {"train_loss": -10.276405334472656, "global_step": 131238, "epoch": 781} {"train_loss": -10.391542434692383, "global_step": 131239, "epoch": 781} {"train_loss": -10.37787914276123, "global_step": 131240, "epoch": 781} {"train_loss": -10.521539688110352, "global_step": 131241, "epoch": 781} {"train_loss": -10.292901039123535, "global_step": 131242, "epoch": 781} {"train_loss": -10.483985900878906, "global_step": 131243, "epoch": 781} {"train_loss": -10.618005752563477, "global_step": 131244, "epoch": 781} {"train_loss": -10.382379531860352, "global_step": 131245, "epoch": 781} {"train_loss": -10.40295696258545, "global_step": 131246, "epoch": 781} {"train_loss": -10.5184326171875, "global_step": 131247, "epoch": 781} {"train_loss": -10.74673080444336, "global_step": 131248, "epoch": 781} {"train_loss": -10.579482078552246, "global_step": 131249, "epoch": 781} {"train_loss": -10.615489959716797, "global_step": 131250, "epoch": 781} {"train_loss": -10.67810344696045, "global_step": 131251, "epoch": 781} {"train_loss": -10.648416519165039, "global_step": 131252, "epoch": 781} {"train_loss": -10.575433731079102, "global_step": 131253, "epoch": 781} {"train_loss": -10.607428550720215, "global_step": 131254, "epoch": 781} {"train_loss": -10.727560043334961, "global_step": 131255, "epoch": 781} {"train_loss": -10.707693099975586, "global_step": 131256, "epoch": 781} {"train_loss": -10.625324249267578, "global_step": 131257, "epoch": 781} {"train_loss": -10.64764404296875, "global_step": 131258, "epoch": 781} {"train_loss": -10.716180801391602, "global_step": 131259, "epoch": 781} {"train_loss": -10.47940444946289, "global_step": 131260, "epoch": 781} {"train_loss": -10.554198265075684, "global_step": 131261, "epoch": 781} {"train_loss": -10.592550277709961, "global_step": 131262, "epoch": 781} {"train_loss": -10.573965072631836, "global_step": 131263, "epoch": 781} {"train_loss": -10.83577823638916, "global_step": 131264, "epoch": 781} {"train_loss": -10.878746032714844, "global_step": 131265, "epoch": 781} {"train_loss": -10.774758338928223, "global_step": 131266, "epoch": 781} {"train_loss": -10.633829116821289, "global_step": 131267, "epoch": 781} {"train_loss": -10.843334197998047, "global_step": 131268, "epoch": 781} {"train_loss": -10.310196876525879, "global_step": 131269, "epoch": 781} {"train_loss": -10.038213729858398, "global_step": 131270, "epoch": 781} {"train_loss": -10.30718994140625, "global_step": 131271, "epoch": 781} {"train_loss": -9.755026817321777, "global_step": 131272, "epoch": 781} {"train_loss": -7.675478935241699, "global_step": 131273, "epoch": 781} {"train_loss": -9.824106216430664, "global_step": 131274, "epoch": 781} {"train_loss": -6.558498859405518, "global_step": 131275, "epoch": 781} {"train_loss": -6.253180027008057, "global_step": 131276, "epoch": 781} {"train_loss": -7.001241683959961, "global_step": 131277, "epoch": 781} {"train_loss": -7.837652206420898, "global_step": 131278, "epoch": 781} {"train_loss": -7.73905086517334, "global_step": 131279, "epoch": 781} {"train_loss": -9.106515884399414, "global_step": 131280, "epoch": 781} {"train_loss": -8.576484680175781, "global_step": 131281, "epoch": 781} {"train_loss": -8.126449584960938, "global_step": 131282, "epoch": 781} {"train_loss": -8.291410446166992, "global_step": 131283, "epoch": 781} {"train_loss": -9.032233238220215, "global_step": 131284, "epoch": 781} {"train_loss": -8.481904029846191, "global_step": 131285, "epoch": 781} {"train_loss": -8.160127639770508, "global_step": 131286, "epoch": 781} {"train_loss": -9.172706604003906, "global_step": 131287, "epoch": 781} {"train_loss": -9.617698669433594, "global_step": 131288, "epoch": 781} {"train_loss": -9.091379165649414, "global_step": 131289, "epoch": 781} {"train_loss": -9.026815414428711, "global_step": 131290, "epoch": 781} {"train_loss": -9.111917495727539, "global_step": 131291, "epoch": 781} {"train_loss": -9.42304801940918, "global_step": 131292, "epoch": 781} {"train_loss": -9.234021186828613, "global_step": 131293, "epoch": 781} {"train_loss": -9.138519287109375, "global_step": 131294, "epoch": 781} {"train_loss": -9.14069652557373, "global_step": 131295, "epoch": 781} {"train_loss": -9.452699661254883, "global_step": 131296, "epoch": 781} {"train_loss": -9.706491470336914, "global_step": 131297, "epoch": 781} {"train_loss": -9.363290786743164, "global_step": 131298, "epoch": 781} {"train_loss": -9.361639976501465, "global_step": 131299, "epoch": 781} {"train_loss": -9.523534774780273, "global_step": 131300, "epoch": 781} {"train_loss": -9.719535827636719, "global_step": 131301, "epoch": 781} {"train_loss": -9.793285369873047, "global_step": 131302, "epoch": 781} {"train_loss": -9.671162605285645, "global_step": 131303, "epoch": 781} {"train_loss": -9.632238388061523, "global_step": 131304, "epoch": 781} {"train_loss": -9.655248641967773, "global_step": 131305, "epoch": 781} {"train_loss": -9.74761962890625, "global_step": 131306, "epoch": 781} {"train_loss": -9.935559272766113, "global_step": 131307, "epoch": 781} {"train_loss": -9.72819995880127, "global_step": 131308, "epoch": 781} {"train_loss": -9.706498146057129, "global_step": 131309, "epoch": 781} {"train_loss": -9.956127166748047, "global_step": 131310, "epoch": 781} {"train_loss": -9.717350006103516, "global_step": 131311, "epoch": 781} {"train_loss": -9.92415714263916, "global_step": 131312, "epoch": 781} {"train_loss": -9.95322036743164, "global_step": 131313, "epoch": 781} {"train_loss": -10.026582717895508, "global_step": 131314, "epoch": 781} {"train_loss": -10.064519882202148, "global_step": 131315, "epoch": 781} {"train_loss": -10.058505058288574, "global_step": 131316, "epoch": 781} {"train_loss": -10.034111976623535, "global_step": 131317, "epoch": 781} {"train_loss": -10.167888641357422, "global_step": 131318, "epoch": 781} {"train_loss": -10.193025588989258, "global_step": 131319, "epoch": 781} {"train_loss": -10.173075675964355, "global_step": 131320, "epoch": 781} {"train_loss": -9.942930221557617, "global_step": 131321, "epoch": 781} {"train_loss": -10.258092880249023, "global_step": 131322, "epoch": 781} {"train_loss": -10.211507797241211, "global_step": 131323, "epoch": 781} {"train_loss": -10.285383224487305, "global_step": 131324, "epoch": 781} {"train_loss": -9.946627616882324, "global_step": 131325, "epoch": 781} {"train_loss": -10.048391342163086, "global_step": 131326, "epoch": 781} {"train_loss": -10.295343399047852, "global_step": 131327, "epoch": 781} {"train_loss": -10.501008033752441, "global_step": 131328, "epoch": 781} {"train_loss": -10.38710880279541, "global_step": 131329, "epoch": 781} {"train_loss": -10.296028137207031, "global_step": 131330, "epoch": 781} {"train_loss": -10.278562545776367, "global_step": 131331, "epoch": 781} {"train_loss": -10.431488037109375, "global_step": 131332, "epoch": 781} {"train_loss": -10.375694274902344, "global_step": 131333, "epoch": 781} {"train_loss": -10.540188789367676, "global_step": 131334, "epoch": 781} {"train_loss": -10.586532592773438, "global_step": 131335, "epoch": 781} {"train_loss": -10.170166969299316, "global_step": 131336, "epoch": 781} {"train_loss": -10.517396926879883, "global_step": 131337, "epoch": 781} {"train_loss": -10.367096900939941, "global_step": 131338, "epoch": 781} {"train_loss": -10.350603103637695, "global_step": 131339, "epoch": 781} {"train_loss": -10.536787033081055, "global_step": 131340, "epoch": 781} {"train_loss": -10.509093284606934, "global_step": 131341, "epoch": 781} {"train_loss": -10.494197845458984, "global_step": 131342, "epoch": 781} {"train_loss": -10.559917449951172, "global_step": 131343, "epoch": 781} {"train_loss": -10.39798641204834, "global_step": 131344, "epoch": 781} {"train_loss": -10.537862777709961, "global_step": 131345, "epoch": 781} {"train_loss": -10.619288444519043, "global_step": 131346, "epoch": 781} {"train_loss": -10.579782485961914, "global_step": 131347, "epoch": 781} {"train_loss": -10.500240325927734, "global_step": 131348, "epoch": 781} {"train_loss": -10.638261795043945, "global_step": 131349, "epoch": 781} {"train_loss": -10.58690357208252, "global_step": 131350, "epoch": 781} {"train_loss": -10.24155044555664, "global_step": 131351, "epoch": 781} {"train_loss": -10.501758575439453, "global_step": 131352, "epoch": 781} {"train_loss": -10.507123947143555, "global_step": 131353, "epoch": 781} {"train_loss": -10.639983177185059, "global_step": 131354, "epoch": 781} {"train_loss": -10.70773696899414, "global_step": 131355, "epoch": 781} {"train_loss": -10.693939208984375, "global_step": 131356, "epoch": 781} {"train_loss": -10.51275634765625, "global_step": 131357, "epoch": 781} {"train_loss": -10.606935501098633, "global_step": 131358, "epoch": 781} {"train_loss": -10.240083694458008, "global_step": 131359, "epoch": 781} {"train_loss": -10.660948753356934, "global_step": 131360, "epoch": 781} {"train_loss": -10.54796314239502, "global_step": 131361, "epoch": 781} {"train_loss": -10.709209442138672, "global_step": 131362, "epoch": 781} {"train_loss": -10.385218620300293, "global_step": 131363, "epoch": 781} {"train_loss": -10.487916946411133, "global_step": 131364, "epoch": 781} {"train_loss": -10.394489288330078, "global_step": 131365, "epoch": 781} {"train_loss": -10.167991638183594, "global_step": 131366, "epoch": 781} {"train_loss": -10.325401306152344, "global_step": 131367, "epoch": 781} {"train_loss": -10.476043701171875, "global_step": 131368, "epoch": 781} {"train_loss": -10.293296813964844, "global_step": 131369, "epoch": 781} {"train_loss": -10.51846694946289, "global_step": 131370, "epoch": 781} {"train_loss": -10.338827133178711, "global_step": 131371, "epoch": 781} {"train_loss": -10.265300750732422, "global_step": 131372, "epoch": 781} {"train_loss": -9.866434097290039, "global_step": 131373, "epoch": 781} {"train_loss": -9.677831649780273, "global_step": 131374, "epoch": 781} {"train_loss": -10.022513520149957, "global_step": 131375, "epoch": 781, "val_loss": 217238.609375} {"train_loss": -9.179356575012207, "global_step": 131376, "epoch": 782} {"train_loss": -10.091887474060059, "global_step": 131377, "epoch": 782} {"train_loss": -9.317556381225586, "global_step": 131378, "epoch": 782} {"train_loss": -10.242399215698242, "global_step": 131379, "epoch": 782} {"train_loss": -9.002405166625977, "global_step": 131380, "epoch": 782} {"train_loss": -10.214913368225098, "global_step": 131381, "epoch": 782} {"train_loss": -9.622428894042969, "global_step": 131382, "epoch": 782} {"train_loss": -9.305853843688965, "global_step": 131383, "epoch": 782} {"train_loss": -9.05105972290039, "global_step": 131384, "epoch": 782} {"train_loss": -9.831708908081055, "global_step": 131385, "epoch": 782} {"train_loss": -9.348922729492188, "global_step": 131386, "epoch": 782} {"train_loss": -9.635974884033203, "global_step": 131387, "epoch": 782} {"train_loss": -9.602188110351562, "global_step": 131388, "epoch": 782} {"train_loss": -9.566941261291504, "global_step": 131389, "epoch": 782} {"train_loss": -10.32017993927002, "global_step": 131390, "epoch": 782} {"train_loss": -9.663885116577148, "global_step": 131391, "epoch": 782} {"train_loss": -10.075733184814453, "global_step": 131392, "epoch": 782} {"train_loss": -9.88146686553955, "global_step": 131393, "epoch": 782} {"train_loss": -10.155502319335938, "global_step": 131394, "epoch": 782} {"train_loss": -10.213226318359375, "global_step": 131395, "epoch": 782} {"train_loss": -9.589666366577148, "global_step": 131396, "epoch": 782} {"train_loss": -10.071796417236328, "global_step": 131397, "epoch": 782} {"train_loss": -9.792973518371582, "global_step": 131398, "epoch": 782} {"train_loss": -9.855195045471191, "global_step": 131399, "epoch": 782} {"train_loss": -10.257780075073242, "global_step": 131400, "epoch": 782} {"train_loss": -10.030769348144531, "global_step": 131401, "epoch": 782} {"train_loss": -9.946772575378418, "global_step": 131402, "epoch": 782} {"train_loss": -10.341822624206543, "global_step": 131403, "epoch": 782} {"train_loss": -9.819875717163086, "global_step": 131404, "epoch": 782} {"train_loss": -9.896017074584961, "global_step": 131405, "epoch": 782} {"train_loss": -10.112373352050781, "global_step": 131406, "epoch": 782} {"train_loss": -10.104991912841797, "global_step": 131407, "epoch": 782} {"train_loss": -9.918193817138672, "global_step": 131408, "epoch": 782} {"train_loss": -9.93554973602295, "global_step": 131409, "epoch": 782} {"train_loss": -10.145462036132812, "global_step": 131410, "epoch": 782} {"train_loss": -9.77328872680664, "global_step": 131411, "epoch": 782} {"train_loss": -10.248852729797363, "global_step": 131412, "epoch": 782} {"train_loss": -10.113336563110352, "global_step": 131413, "epoch": 782} {"train_loss": -9.984668731689453, "global_step": 131414, "epoch": 782} {"train_loss": -10.135553359985352, "global_step": 131415, "epoch": 782} {"train_loss": -10.134124755859375, "global_step": 131416, "epoch": 782} {"train_loss": -10.155765533447266, "global_step": 131417, "epoch": 782} {"train_loss": -10.252737045288086, "global_step": 131418, "epoch": 782} {"train_loss": -9.939496994018555, "global_step": 131419, "epoch": 782} {"train_loss": -10.061721801757812, "global_step": 131420, "epoch": 782} {"train_loss": -10.225364685058594, "global_step": 131421, "epoch": 782} {"train_loss": -9.979524612426758, "global_step": 131422, "epoch": 782} {"train_loss": -10.247138023376465, "global_step": 131423, "epoch": 782} {"train_loss": -10.17941665649414, "global_step": 131424, "epoch": 782} {"train_loss": -10.480522155761719, "global_step": 131425, "epoch": 782} {"train_loss": -10.025968551635742, "global_step": 131426, "epoch": 782} {"train_loss": -10.499786376953125, "global_step": 131427, "epoch": 782} {"train_loss": -10.376029968261719, "global_step": 131428, "epoch": 782} {"train_loss": -10.223285675048828, "global_step": 131429, "epoch": 782} {"train_loss": -10.356075286865234, "global_step": 131430, "epoch": 782} {"train_loss": -10.400093078613281, "global_step": 131431, "epoch": 782} {"train_loss": -10.535722732543945, "global_step": 131432, "epoch": 782} {"train_loss": -10.517353057861328, "global_step": 131433, "epoch": 782} {"train_loss": -10.577812194824219, "global_step": 131434, "epoch": 782} {"train_loss": -10.419979095458984, "global_step": 131435, "epoch": 782} {"train_loss": -10.665665626525879, "global_step": 131436, "epoch": 782} {"train_loss": -10.280951499938965, "global_step": 131437, "epoch": 782} {"train_loss": -10.40545654296875, "global_step": 131438, "epoch": 782} {"train_loss": -10.186527252197266, "global_step": 131439, "epoch": 782} {"train_loss": -10.48459529876709, "global_step": 131440, "epoch": 782} {"train_loss": -10.581181526184082, "global_step": 131441, "epoch": 782} {"train_loss": -10.241896629333496, "global_step": 131442, "epoch": 782} {"train_loss": -10.604251861572266, "global_step": 131443, "epoch": 782} {"train_loss": -10.175554275512695, "global_step": 131444, "epoch": 782} {"train_loss": -10.754789352416992, "global_step": 131445, "epoch": 782} {"train_loss": -10.36839485168457, "global_step": 131446, "epoch": 782} {"train_loss": -10.196914672851562, "global_step": 131447, "epoch": 782} {"train_loss": -10.69542407989502, "global_step": 131448, "epoch": 782} {"train_loss": -10.374059677124023, "global_step": 131449, "epoch": 782} {"train_loss": -10.636846542358398, "global_step": 131450, "epoch": 782} {"train_loss": -10.476163864135742, "global_step": 131451, "epoch": 782} {"train_loss": -10.738332748413086, "global_step": 131452, "epoch": 782} {"train_loss": -10.394510269165039, "global_step": 131453, "epoch": 782} {"train_loss": -10.43165397644043, "global_step": 131454, "epoch": 782} {"train_loss": -10.457260131835938, "global_step": 131455, "epoch": 782} {"train_loss": -10.445106506347656, "global_step": 131456, "epoch": 782} {"train_loss": -10.680513381958008, "global_step": 131457, "epoch": 782} {"train_loss": -10.641560554504395, "global_step": 131458, "epoch": 782} {"train_loss": -10.574075698852539, "global_step": 131459, "epoch": 782} {"train_loss": -10.782102584838867, "global_step": 131460, "epoch": 782} {"train_loss": -10.822721481323242, "global_step": 131461, "epoch": 782} {"train_loss": -10.424110412597656, "global_step": 131462, "epoch": 782} {"train_loss": -10.767763137817383, "global_step": 131463, "epoch": 782} {"train_loss": -10.129863739013672, "global_step": 131464, "epoch": 782} {"train_loss": -10.72508430480957, "global_step": 131465, "epoch": 782} {"train_loss": -10.304142951965332, "global_step": 131466, "epoch": 782} {"train_loss": -10.561407089233398, "global_step": 131467, "epoch": 782} {"train_loss": -10.64958381652832, "global_step": 131468, "epoch": 782} {"train_loss": -10.48602294921875, "global_step": 131469, "epoch": 782} {"train_loss": -10.463566780090332, "global_step": 131470, "epoch": 782} {"train_loss": -10.54515266418457, "global_step": 131471, "epoch": 782} {"train_loss": -9.863842010498047, "global_step": 131472, "epoch": 782} {"train_loss": -9.512333869934082, "global_step": 131473, "epoch": 782} {"train_loss": -10.195392608642578, "global_step": 131474, "epoch": 782} {"train_loss": -9.069705963134766, "global_step": 131475, "epoch": 782} {"train_loss": -10.18575668334961, "global_step": 131476, "epoch": 782} {"train_loss": -9.224878311157227, "global_step": 131477, "epoch": 782} {"train_loss": -9.46296215057373, "global_step": 131478, "epoch": 782} {"train_loss": -10.080133438110352, "global_step": 131479, "epoch": 782} {"train_loss": -9.739917755126953, "global_step": 131480, "epoch": 782} {"train_loss": -8.757890701293945, "global_step": 131481, "epoch": 782} {"train_loss": -9.975752830505371, "global_step": 131482, "epoch": 782} {"train_loss": -9.39704704284668, "global_step": 131483, "epoch": 782} {"train_loss": -9.89402961730957, "global_step": 131484, "epoch": 782} {"train_loss": -9.687590599060059, "global_step": 131485, "epoch": 782} {"train_loss": -9.863435745239258, "global_step": 131486, "epoch": 782} {"train_loss": -9.631429672241211, "global_step": 131487, "epoch": 782} {"train_loss": -10.409849166870117, "global_step": 131488, "epoch": 782} {"train_loss": -9.740087509155273, "global_step": 131489, "epoch": 782} {"train_loss": -10.061321258544922, "global_step": 131490, "epoch": 782} {"train_loss": -10.193997383117676, "global_step": 131491, "epoch": 782} {"train_loss": -9.880166053771973, "global_step": 131492, "epoch": 782} {"train_loss": -9.905426979064941, "global_step": 131493, "epoch": 782} {"train_loss": -10.07630729675293, "global_step": 131494, "epoch": 782} {"train_loss": -9.876176834106445, "global_step": 131495, "epoch": 782} {"train_loss": -10.066560745239258, "global_step": 131496, "epoch": 782} {"train_loss": -10.021622657775879, "global_step": 131497, "epoch": 782} {"train_loss": -10.088221549987793, "global_step": 131498, "epoch": 782} {"train_loss": -10.16550350189209, "global_step": 131499, "epoch": 782} {"train_loss": -9.946727752685547, "global_step": 131500, "epoch": 782} {"train_loss": -10.192083358764648, "global_step": 131501, "epoch": 782} {"train_loss": -10.511329650878906, "global_step": 131502, "epoch": 782} {"train_loss": -10.214498519897461, "global_step": 131503, "epoch": 782} {"train_loss": -10.287385940551758, "global_step": 131504, "epoch": 782} {"train_loss": -10.12243366241455, "global_step": 131505, "epoch": 782} {"train_loss": -10.34382438659668, "global_step": 131506, "epoch": 782} {"train_loss": -10.159717559814453, "global_step": 131507, "epoch": 782} {"train_loss": -10.2024507522583, "global_step": 131508, "epoch": 782} {"train_loss": -10.337648391723633, "global_step": 131509, "epoch": 782} {"train_loss": -10.241823196411133, "global_step": 131510, "epoch": 782} {"train_loss": -10.20400619506836, "global_step": 131511, "epoch": 782} {"train_loss": -10.438385009765625, "global_step": 131512, "epoch": 782} {"train_loss": -9.995061874389648, "global_step": 131513, "epoch": 782} {"train_loss": -10.38353157043457, "global_step": 131514, "epoch": 782} {"train_loss": -10.304765701293945, "global_step": 131515, "epoch": 782} {"train_loss": -10.345473289489746, "global_step": 131516, "epoch": 782} {"train_loss": -10.350841522216797, "global_step": 131517, "epoch": 782} {"train_loss": -10.408096313476562, "global_step": 131518, "epoch": 782} {"train_loss": -10.25838851928711, "global_step": 131519, "epoch": 782} {"train_loss": -10.106252670288086, "global_step": 131520, "epoch": 782} {"train_loss": -10.247122764587402, "global_step": 131521, "epoch": 782} {"train_loss": -10.361268043518066, "global_step": 131522, "epoch": 782} {"train_loss": -10.225739479064941, "global_step": 131523, "epoch": 782} {"train_loss": -10.31831169128418, "global_step": 131524, "epoch": 782} {"train_loss": -10.430274963378906, "global_step": 131525, "epoch": 782} {"train_loss": -10.572455406188965, "global_step": 131526, "epoch": 782} {"train_loss": -10.128686904907227, "global_step": 131527, "epoch": 782} {"train_loss": -10.452205657958984, "global_step": 131528, "epoch": 782} {"train_loss": -10.13150405883789, "global_step": 131529, "epoch": 782} {"train_loss": -10.432394027709961, "global_step": 131530, "epoch": 782} {"train_loss": -10.229860305786133, "global_step": 131531, "epoch": 782} {"train_loss": -10.210899353027344, "global_step": 131532, "epoch": 782} {"train_loss": -10.345366477966309, "global_step": 131533, "epoch": 782} {"train_loss": -10.139822006225586, "global_step": 131534, "epoch": 782} {"train_loss": -10.637170791625977, "global_step": 131535, "epoch": 782} {"train_loss": -9.971778869628906, "global_step": 131536, "epoch": 782} {"train_loss": -9.94994068145752, "global_step": 131537, "epoch": 782} {"train_loss": -10.365375518798828, "global_step": 131538, "epoch": 782} {"train_loss": -10.065999984741211, "global_step": 131539, "epoch": 782} {"train_loss": -10.36103343963623, "global_step": 131540, "epoch": 782} {"train_loss": -10.220918655395508, "global_step": 131541, "epoch": 782} {"train_loss": -10.393658638000488, "global_step": 131542, "epoch": 782} {"train_loss": -10.147500475247702, "global_step": 131543, "epoch": 782, "val_loss": 219237.0} {"train_loss": -10.054757118225098, "global_step": 131544, "epoch": 783} {"train_loss": -10.547088623046875, "global_step": 131545, "epoch": 783} {"train_loss": -10.157402992248535, "global_step": 131546, "epoch": 783} {"train_loss": -10.526727676391602, "global_step": 131547, "epoch": 783} {"train_loss": -10.077343940734863, "global_step": 131548, "epoch": 783} {"train_loss": -10.21696949005127, "global_step": 131549, "epoch": 783} {"train_loss": -10.3897066116333, "global_step": 131550, "epoch": 783} {"train_loss": -9.886116027832031, "global_step": 131551, "epoch": 783} {"train_loss": -10.11184024810791, "global_step": 131552, "epoch": 783} {"train_loss": -9.64802074432373, "global_step": 131553, "epoch": 783} {"train_loss": -10.345428466796875, "global_step": 131554, "epoch": 783} {"train_loss": -9.94326400756836, "global_step": 131555, "epoch": 783} {"train_loss": -10.368124961853027, "global_step": 131556, "epoch": 783} {"train_loss": -10.406319618225098, "global_step": 131557, "epoch": 783} {"train_loss": -10.157645225524902, "global_step": 131558, "epoch": 783} {"train_loss": -10.505348205566406, "global_step": 131559, "epoch": 783} {"train_loss": -10.512455940246582, "global_step": 131560, "epoch": 783} {"train_loss": -9.87367057800293, "global_step": 131561, "epoch": 783} {"train_loss": -10.534429550170898, "global_step": 131562, "epoch": 783} {"train_loss": -9.836841583251953, "global_step": 131563, "epoch": 783} {"train_loss": -10.52790641784668, "global_step": 131564, "epoch": 783} {"train_loss": -10.236783981323242, "global_step": 131565, "epoch": 783} {"train_loss": -10.622998237609863, "global_step": 131566, "epoch": 783} {"train_loss": -10.406393051147461, "global_step": 131567, "epoch": 783} {"train_loss": -10.75075912475586, "global_step": 131568, "epoch": 783} {"train_loss": -10.178813934326172, "global_step": 131569, "epoch": 783} {"train_loss": -10.348562240600586, "global_step": 131570, "epoch": 783} {"train_loss": -10.113269805908203, "global_step": 131571, "epoch": 783} {"train_loss": -10.522768020629883, "global_step": 131572, "epoch": 783} {"train_loss": -10.44145393371582, "global_step": 131573, "epoch": 783} {"train_loss": -10.173389434814453, "global_step": 131574, "epoch": 783} {"train_loss": -10.586372375488281, "global_step": 131575, "epoch": 783} {"train_loss": -10.174739837646484, "global_step": 131576, "epoch": 783} {"train_loss": -10.548355102539062, "global_step": 131577, "epoch": 783} {"train_loss": -10.489293098449707, "global_step": 131578, "epoch": 783} {"train_loss": -10.44229507446289, "global_step": 131579, "epoch": 783} {"train_loss": -10.60645580291748, "global_step": 131580, "epoch": 783} {"train_loss": -10.346748352050781, "global_step": 131581, "epoch": 783} {"train_loss": -10.570149421691895, "global_step": 131582, "epoch": 783} {"train_loss": -10.633634567260742, "global_step": 131583, "epoch": 783} {"train_loss": -10.561767578125, "global_step": 131584, "epoch": 783} {"train_loss": -10.626520156860352, "global_step": 131585, "epoch": 783} {"train_loss": -10.537363052368164, "global_step": 131586, "epoch": 783} {"train_loss": -10.735764503479004, "global_step": 131587, "epoch": 783} {"train_loss": -10.672073364257812, "global_step": 131588, "epoch": 783} {"train_loss": -10.49464225769043, "global_step": 131589, "epoch": 783} {"train_loss": -10.573386192321777, "global_step": 131590, "epoch": 783} {"train_loss": -10.474949836730957, "global_step": 131591, "epoch": 783} {"train_loss": -10.58526611328125, "global_step": 131592, "epoch": 783} {"train_loss": -10.812993049621582, "global_step": 131593, "epoch": 783} {"train_loss": -10.758513450622559, "global_step": 131594, "epoch": 783} {"train_loss": -10.459388732910156, "global_step": 131595, "epoch": 783} {"train_loss": -10.511807441711426, "global_step": 131596, "epoch": 783} {"train_loss": -10.618133544921875, "global_step": 131597, "epoch": 783} {"train_loss": -10.551406860351562, "global_step": 131598, "epoch": 783} {"train_loss": -10.516359329223633, "global_step": 131599, "epoch": 783} {"train_loss": -10.572602272033691, "global_step": 131600, "epoch": 783} {"train_loss": -10.450349807739258, "global_step": 131601, "epoch": 783} {"train_loss": -10.521505355834961, "global_step": 131602, "epoch": 783} {"train_loss": -10.352806091308594, "global_step": 131603, "epoch": 783} {"train_loss": -10.710895538330078, "global_step": 131604, "epoch": 783} {"train_loss": -10.035223007202148, "global_step": 131605, "epoch": 783} {"train_loss": -10.444038391113281, "global_step": 131606, "epoch": 783} {"train_loss": -10.869491577148438, "global_step": 131607, "epoch": 783} {"train_loss": -10.006534576416016, "global_step": 131608, "epoch": 783} {"train_loss": -10.64556884765625, "global_step": 131609, "epoch": 783} {"train_loss": -10.340185165405273, "global_step": 131610, "epoch": 783} {"train_loss": -10.667363166809082, "global_step": 131611, "epoch": 783} {"train_loss": -10.545610427856445, "global_step": 131612, "epoch": 783} {"train_loss": -9.886159896850586, "global_step": 131613, "epoch": 783} {"train_loss": -10.674068450927734, "global_step": 131614, "epoch": 783} {"train_loss": -10.378141403198242, "global_step": 131615, "epoch": 783} {"train_loss": -10.177252769470215, "global_step": 131616, "epoch": 783} {"train_loss": -10.435196876525879, "global_step": 131617, "epoch": 783} {"train_loss": -10.547882080078125, "global_step": 131618, "epoch": 783} {"train_loss": -9.909687042236328, "global_step": 131619, "epoch": 783} {"train_loss": -10.73621940612793, "global_step": 131620, "epoch": 783} {"train_loss": -10.13430404663086, "global_step": 131621, "epoch": 783} {"train_loss": -10.174920082092285, "global_step": 131622, "epoch": 783} {"train_loss": -10.577354431152344, "global_step": 131623, "epoch": 783} {"train_loss": -10.096200942993164, "global_step": 131624, "epoch": 783} {"train_loss": -10.519264221191406, "global_step": 131625, "epoch": 783} {"train_loss": -10.723287582397461, "global_step": 131626, "epoch": 783} {"train_loss": -10.516469955444336, "global_step": 131627, "epoch": 783} {"train_loss": -10.360750198364258, "global_step": 131628, "epoch": 783} {"train_loss": -10.182509422302246, "global_step": 131629, "epoch": 783} {"train_loss": -10.190067291259766, "global_step": 131630, "epoch": 783} {"train_loss": -10.456958770751953, "global_step": 131631, "epoch": 783} {"train_loss": -9.742513656616211, "global_step": 131632, "epoch": 783} {"train_loss": -10.389471054077148, "global_step": 131633, "epoch": 783} {"train_loss": -9.976177215576172, "global_step": 131634, "epoch": 783} {"train_loss": -10.10588264465332, "global_step": 131635, "epoch": 783} {"train_loss": -10.201955795288086, "global_step": 131636, "epoch": 783} {"train_loss": -10.010089874267578, "global_step": 131637, "epoch": 783} {"train_loss": -10.566462516784668, "global_step": 131638, "epoch": 783} {"train_loss": -10.117626190185547, "global_step": 131639, "epoch": 783} {"train_loss": -10.18517017364502, "global_step": 131640, "epoch": 783} {"train_loss": -10.308277130126953, "global_step": 131641, "epoch": 783} {"train_loss": -9.878242492675781, "global_step": 131642, "epoch": 783} {"train_loss": -10.499666213989258, "global_step": 131643, "epoch": 783} {"train_loss": -10.124608993530273, "global_step": 131644, "epoch": 783} {"train_loss": -9.98984146118164, "global_step": 131645, "epoch": 783} {"train_loss": -10.237213134765625, "global_step": 131646, "epoch": 783} {"train_loss": -10.058467864990234, "global_step": 131647, "epoch": 783} {"train_loss": -10.263742446899414, "global_step": 131648, "epoch": 783} {"train_loss": -10.170656204223633, "global_step": 131649, "epoch": 783} {"train_loss": -9.986695289611816, "global_step": 131650, "epoch": 783} {"train_loss": -10.134459495544434, "global_step": 131651, "epoch": 783} {"train_loss": -10.485820770263672, "global_step": 131652, "epoch": 783} {"train_loss": -10.068845748901367, "global_step": 131653, "epoch": 783} {"train_loss": -10.226147651672363, "global_step": 131654, "epoch": 783} {"train_loss": -10.555596351623535, "global_step": 131655, "epoch": 783} {"train_loss": -10.184247970581055, "global_step": 131656, "epoch": 783} {"train_loss": -10.417649269104004, "global_step": 131657, "epoch": 783} {"train_loss": -10.390975952148438, "global_step": 131658, "epoch": 783} {"train_loss": -10.176626205444336, "global_step": 131659, "epoch": 783} {"train_loss": -10.366310119628906, "global_step": 131660, "epoch": 783} {"train_loss": -9.859136581420898, "global_step": 131661, "epoch": 783} {"train_loss": -10.051148414611816, "global_step": 131662, "epoch": 783} {"train_loss": -10.430400848388672, "global_step": 131663, "epoch": 783} {"train_loss": -10.232156753540039, "global_step": 131664, "epoch": 783} {"train_loss": -10.235956192016602, "global_step": 131665, "epoch": 783} {"train_loss": -10.081438064575195, "global_step": 131666, "epoch": 783} {"train_loss": -10.49191665649414, "global_step": 131667, "epoch": 783} {"train_loss": -10.342525482177734, "global_step": 131668, "epoch": 783} {"train_loss": -10.513801574707031, "global_step": 131669, "epoch": 783} {"train_loss": -10.118026733398438, "global_step": 131670, "epoch": 783} {"train_loss": -10.483055114746094, "global_step": 131671, "epoch": 783} {"train_loss": -10.427314758300781, "global_step": 131672, "epoch": 783} {"train_loss": -10.509490013122559, "global_step": 131673, "epoch": 783} {"train_loss": -10.567344665527344, "global_step": 131674, "epoch": 783} {"train_loss": -10.549873352050781, "global_step": 131675, "epoch": 783} {"train_loss": -10.494583129882812, "global_step": 131676, "epoch": 783} {"train_loss": -10.488935470581055, "global_step": 131677, "epoch": 783} {"train_loss": -10.718193054199219, "global_step": 131678, "epoch": 783} {"train_loss": -10.442270278930664, "global_step": 131679, "epoch": 783} {"train_loss": -10.618749618530273, "global_step": 131680, "epoch": 783} {"train_loss": -10.487386703491211, "global_step": 131681, "epoch": 783} {"train_loss": -10.450632095336914, "global_step": 131682, "epoch": 783} {"train_loss": -10.63349723815918, "global_step": 131683, "epoch": 783} {"train_loss": -10.527490615844727, "global_step": 131684, "epoch": 783} {"train_loss": -10.623785018920898, "global_step": 131685, "epoch": 783} {"train_loss": -10.548038482666016, "global_step": 131686, "epoch": 783} {"train_loss": -10.592694282531738, "global_step": 131687, "epoch": 783} {"train_loss": -10.143400192260742, "global_step": 131688, "epoch": 783} {"train_loss": -10.09683609008789, "global_step": 131689, "epoch": 783} {"train_loss": -9.826672554016113, "global_step": 131690, "epoch": 783} {"train_loss": -10.441547393798828, "global_step": 131691, "epoch": 783} {"train_loss": -9.654281616210938, "global_step": 131692, "epoch": 783} {"train_loss": -10.220924377441406, "global_step": 131693, "epoch": 783} {"train_loss": -10.110121726989746, "global_step": 131694, "epoch": 783} {"train_loss": -10.153829574584961, "global_step": 131695, "epoch": 783} {"train_loss": -9.881967544555664, "global_step": 131696, "epoch": 783} {"train_loss": -10.252986907958984, "global_step": 131697, "epoch": 783} {"train_loss": -10.174203872680664, "global_step": 131698, "epoch": 783} {"train_loss": -10.2745943069458, "global_step": 131699, "epoch": 783} {"train_loss": -9.998481750488281, "global_step": 131700, "epoch": 783} {"train_loss": -10.057863235473633, "global_step": 131701, "epoch": 783} {"train_loss": -10.094022750854492, "global_step": 131702, "epoch": 783} {"train_loss": -10.114389419555664, "global_step": 131703, "epoch": 783} {"train_loss": -10.149532318115234, "global_step": 131704, "epoch": 783} {"train_loss": -10.40002727508545, "global_step": 131705, "epoch": 783} {"train_loss": -10.073854446411133, "global_step": 131706, "epoch": 783} {"train_loss": -10.595829010009766, "global_step": 131707, "epoch": 783} {"train_loss": -10.087722778320312, "global_step": 131708, "epoch": 783} {"train_loss": -10.271195411682129, "global_step": 131709, "epoch": 783} {"train_loss": -10.414007186889648, "global_step": 131710, "epoch": 783} {"train_loss": -10.335258920987448, "global_step": 131711, "epoch": 783, "val_loss": 222531.625} {"train_loss": -10.411956787109375, "global_step": 131712, "epoch": 784} {"train_loss": -9.834299087524414, "global_step": 131713, "epoch": 784} {"train_loss": -10.567934036254883, "global_step": 131714, "epoch": 784} {"train_loss": -9.940628051757812, "global_step": 131715, "epoch": 784} {"train_loss": -10.272159576416016, "global_step": 131716, "epoch": 784} {"train_loss": -10.353689193725586, "global_step": 131717, "epoch": 784} {"train_loss": -10.359594345092773, "global_step": 131718, "epoch": 784} {"train_loss": -10.344282150268555, "global_step": 131719, "epoch": 784} {"train_loss": -10.325922012329102, "global_step": 131720, "epoch": 784} {"train_loss": -10.4161958694458, "global_step": 131721, "epoch": 784} {"train_loss": -10.298524856567383, "global_step": 131722, "epoch": 784} {"train_loss": -10.390874862670898, "global_step": 131723, "epoch": 784} {"train_loss": -10.531766891479492, "global_step": 131724, "epoch": 784} {"train_loss": -10.303401947021484, "global_step": 131725, "epoch": 784} {"train_loss": -10.433807373046875, "global_step": 131726, "epoch": 784} {"train_loss": -10.543078422546387, "global_step": 131727, "epoch": 784} {"train_loss": -10.532405853271484, "global_step": 131728, "epoch": 784} {"train_loss": -10.671609878540039, "global_step": 131729, "epoch": 784} {"train_loss": -10.501289367675781, "global_step": 131730, "epoch": 784} {"train_loss": -10.68948745727539, "global_step": 131731, "epoch": 784} {"train_loss": -10.51684856414795, "global_step": 131732, "epoch": 784} {"train_loss": -10.246305465698242, "global_step": 131733, "epoch": 784} {"train_loss": -10.448066711425781, "global_step": 131734, "epoch": 784} {"train_loss": -10.556583404541016, "global_step": 131735, "epoch": 784} {"train_loss": -10.536092758178711, "global_step": 131736, "epoch": 784} {"train_loss": -10.531076431274414, "global_step": 131737, "epoch": 784} {"train_loss": -10.612473487854004, "global_step": 131738, "epoch": 784} {"train_loss": -10.154977798461914, "global_step": 131739, "epoch": 784} {"train_loss": -10.69376277923584, "global_step": 131740, "epoch": 784} {"train_loss": -10.160013198852539, "global_step": 131741, "epoch": 784} {"train_loss": -10.493783950805664, "global_step": 131742, "epoch": 784} {"train_loss": -10.22365951538086, "global_step": 131743, "epoch": 784} {"train_loss": -10.117234230041504, "global_step": 131744, "epoch": 784} {"train_loss": -9.587019920349121, "global_step": 131745, "epoch": 784} {"train_loss": -9.693560600280762, "global_step": 131746, "epoch": 784} {"train_loss": -9.820016860961914, "global_step": 131747, "epoch": 784} {"train_loss": -9.994144439697266, "global_step": 131748, "epoch": 784} {"train_loss": -9.809515953063965, "global_step": 131749, "epoch": 784} {"train_loss": -10.288782119750977, "global_step": 131750, "epoch": 784} {"train_loss": -9.071142196655273, "global_step": 131751, "epoch": 784} {"train_loss": -10.55801010131836, "global_step": 131752, "epoch": 784} {"train_loss": -9.33641242980957, "global_step": 131753, "epoch": 784} {"train_loss": -9.362688064575195, "global_step": 131754, "epoch": 784} {"train_loss": -10.01341724395752, "global_step": 131755, "epoch": 784} {"train_loss": -9.590160369873047, "global_step": 131756, "epoch": 784} {"train_loss": -9.52022933959961, "global_step": 131757, "epoch": 784} {"train_loss": -9.980964660644531, "global_step": 131758, "epoch": 784} {"train_loss": -9.164138793945312, "global_step": 131759, "epoch": 784} {"train_loss": -10.135002136230469, "global_step": 131760, "epoch": 784} {"train_loss": -9.67133617401123, "global_step": 131761, "epoch": 784} {"train_loss": -9.945100784301758, "global_step": 131762, "epoch": 784} {"train_loss": -10.308889389038086, "global_step": 131763, "epoch": 784} {"train_loss": -9.818756103515625, "global_step": 131764, "epoch": 784} {"train_loss": -10.283709526062012, "global_step": 131765, "epoch": 784} {"train_loss": -10.302327156066895, "global_step": 131766, "epoch": 784} {"train_loss": -9.972562789916992, "global_step": 131767, "epoch": 784} {"train_loss": -10.228609085083008, "global_step": 131768, "epoch": 784} {"train_loss": -10.510807037353516, "global_step": 131769, "epoch": 784} {"train_loss": -10.260139465332031, "global_step": 131770, "epoch": 784} {"train_loss": -10.111156463623047, "global_step": 131771, "epoch": 784} {"train_loss": -10.369958877563477, "global_step": 131772, "epoch": 784} {"train_loss": -9.869905471801758, "global_step": 131773, "epoch": 784} {"train_loss": -10.124106407165527, "global_step": 131774, "epoch": 784} {"train_loss": -10.490257263183594, "global_step": 131775, "epoch": 784} {"train_loss": -10.384899139404297, "global_step": 131776, "epoch": 784} {"train_loss": -10.247943878173828, "global_step": 131777, "epoch": 784} {"train_loss": -10.432558059692383, "global_step": 131778, "epoch": 784} {"train_loss": -10.244444847106934, "global_step": 131779, "epoch": 784} {"train_loss": -10.37706184387207, "global_step": 131780, "epoch": 784} {"train_loss": -10.579954147338867, "global_step": 131781, "epoch": 784} {"train_loss": -10.284334182739258, "global_step": 131782, "epoch": 784} {"train_loss": -10.465394020080566, "global_step": 131783, "epoch": 784} {"train_loss": -10.451362609863281, "global_step": 131784, "epoch": 784} {"train_loss": -10.46096420288086, "global_step": 131785, "epoch": 784} {"train_loss": -10.583712577819824, "global_step": 131786, "epoch": 784} {"train_loss": -10.432497024536133, "global_step": 131787, "epoch": 784} {"train_loss": -10.66393756866455, "global_step": 131788, "epoch": 784} {"train_loss": -10.502361297607422, "global_step": 131789, "epoch": 784} {"train_loss": -10.676397323608398, "global_step": 131790, "epoch": 784} {"train_loss": -10.289802551269531, "global_step": 131791, "epoch": 784} {"train_loss": -10.29005241394043, "global_step": 131792, "epoch": 784} {"train_loss": -9.942337989807129, "global_step": 131793, "epoch": 784} {"train_loss": -9.785409927368164, "global_step": 131794, "epoch": 784} {"train_loss": -10.188825607299805, "global_step": 131795, "epoch": 784} {"train_loss": -10.112661361694336, "global_step": 131796, "epoch": 784} {"train_loss": -10.314693450927734, "global_step": 131797, "epoch": 784} {"train_loss": -9.833478927612305, "global_step": 131798, "epoch": 784} {"train_loss": -9.780649185180664, "global_step": 131799, "epoch": 784} {"train_loss": -10.232420921325684, "global_step": 131800, "epoch": 784} {"train_loss": -9.141804695129395, "global_step": 131801, "epoch": 784} {"train_loss": -9.956514358520508, "global_step": 131802, "epoch": 784} {"train_loss": -9.980962753295898, "global_step": 131803, "epoch": 784} {"train_loss": -10.086508750915527, "global_step": 131804, "epoch": 784} {"train_loss": -9.375709533691406, "global_step": 131805, "epoch": 784} {"train_loss": -10.510698318481445, "global_step": 131806, "epoch": 784} {"train_loss": -9.22808837890625, "global_step": 131807, "epoch": 784} {"train_loss": -10.618642807006836, "global_step": 131808, "epoch": 784} {"train_loss": -10.099434852600098, "global_step": 131809, "epoch": 784} {"train_loss": -10.1431884765625, "global_step": 131810, "epoch": 784} {"train_loss": -10.194663047790527, "global_step": 131811, "epoch": 784} {"train_loss": -10.374104499816895, "global_step": 131812, "epoch": 784} {"train_loss": -10.140106201171875, "global_step": 131813, "epoch": 784} {"train_loss": -10.464755058288574, "global_step": 131814, "epoch": 784} {"train_loss": -10.295687675476074, "global_step": 131815, "epoch": 784} {"train_loss": -10.438222885131836, "global_step": 131816, "epoch": 784} {"train_loss": -10.211591720581055, "global_step": 131817, "epoch": 784} {"train_loss": -10.436493873596191, "global_step": 131818, "epoch": 784} {"train_loss": -10.264281272888184, "global_step": 131819, "epoch": 784} {"train_loss": -10.428617477416992, "global_step": 131820, "epoch": 784} {"train_loss": -10.304559707641602, "global_step": 131821, "epoch": 784} {"train_loss": -10.31747055053711, "global_step": 131822, "epoch": 784} {"train_loss": -10.039066314697266, "global_step": 131823, "epoch": 784} {"train_loss": -10.548309326171875, "global_step": 131824, "epoch": 784} {"train_loss": -10.406492233276367, "global_step": 131825, "epoch": 784} {"train_loss": -10.468326568603516, "global_step": 131826, "epoch": 784} {"train_loss": -10.593101501464844, "global_step": 131827, "epoch": 784} {"train_loss": -10.57708740234375, "global_step": 131828, "epoch": 784} {"train_loss": -10.505112648010254, "global_step": 131829, "epoch": 784} {"train_loss": -10.626547813415527, "global_step": 131830, "epoch": 784} {"train_loss": -10.43110466003418, "global_step": 131831, "epoch": 784} {"train_loss": -10.814931869506836, "global_step": 131832, "epoch": 784} {"train_loss": -10.460044860839844, "global_step": 131833, "epoch": 784} {"train_loss": -10.586402893066406, "global_step": 131834, "epoch": 784} {"train_loss": -10.644880294799805, "global_step": 131835, "epoch": 784} {"train_loss": -10.537267684936523, "global_step": 131836, "epoch": 784} {"train_loss": -10.713911056518555, "global_step": 131837, "epoch": 784} {"train_loss": -10.725221633911133, "global_step": 131838, "epoch": 784} {"train_loss": -10.485076904296875, "global_step": 131839, "epoch": 784} {"train_loss": -10.452152252197266, "global_step": 131840, "epoch": 784} {"train_loss": -10.464049339294434, "global_step": 131841, "epoch": 784} {"train_loss": -10.601361274719238, "global_step": 131842, "epoch": 784} {"train_loss": -10.819112777709961, "global_step": 131843, "epoch": 784} {"train_loss": -10.475974082946777, "global_step": 131844, "epoch": 784} {"train_loss": -10.84850025177002, "global_step": 131845, "epoch": 784} {"train_loss": -10.541335105895996, "global_step": 131846, "epoch": 784} {"train_loss": -10.494237899780273, "global_step": 131847, "epoch": 784} {"train_loss": -10.727943420410156, "global_step": 131848, "epoch": 784} {"train_loss": -10.596782684326172, "global_step": 131849, "epoch": 784} {"train_loss": -10.238275527954102, "global_step": 131850, "epoch": 784} {"train_loss": -10.661230087280273, "global_step": 131851, "epoch": 784} {"train_loss": -10.269632339477539, "global_step": 131852, "epoch": 784} {"train_loss": -10.341983795166016, "global_step": 131853, "epoch": 784} {"train_loss": -10.269290924072266, "global_step": 131854, "epoch": 784} {"train_loss": -10.186808586120605, "global_step": 131855, "epoch": 784} {"train_loss": -10.558282852172852, "global_step": 131856, "epoch": 784} {"train_loss": -10.415324211120605, "global_step": 131857, "epoch": 784} {"train_loss": -10.480628967285156, "global_step": 131858, "epoch": 784} {"train_loss": -10.194378852844238, "global_step": 131859, "epoch": 784} {"train_loss": -10.238286018371582, "global_step": 131860, "epoch": 784} {"train_loss": -10.749198913574219, "global_step": 131861, "epoch": 784} {"train_loss": -10.290748596191406, "global_step": 131862, "epoch": 784} {"train_loss": -10.246828079223633, "global_step": 131863, "epoch": 784} {"train_loss": -10.490091323852539, "global_step": 131864, "epoch": 784} {"train_loss": -10.215014457702637, "global_step": 131865, "epoch": 784} {"train_loss": -10.269529342651367, "global_step": 131866, "epoch": 784} {"train_loss": -10.515204429626465, "global_step": 131867, "epoch": 784} {"train_loss": -10.349787712097168, "global_step": 131868, "epoch": 784} {"train_loss": -10.02462387084961, "global_step": 131869, "epoch": 784} {"train_loss": -10.390005111694336, "global_step": 131870, "epoch": 784} {"train_loss": -10.256307601928711, "global_step": 131871, "epoch": 784} {"train_loss": -10.549690246582031, "global_step": 131872, "epoch": 784} {"train_loss": -10.246381759643555, "global_step": 131873, "epoch": 784} {"train_loss": -10.371892929077148, "global_step": 131874, "epoch": 784} {"train_loss": -10.415079116821289, "global_step": 131875, "epoch": 784} {"train_loss": -10.354225158691406, "global_step": 131876, "epoch": 784} {"train_loss": -10.131184577941895, "global_step": 131877, "epoch": 784} {"train_loss": -10.06507396697998, "global_step": 131878, "epoch": 784} {"train_loss": -10.279028585978917, "global_step": 131879, "epoch": 784, "val_loss": 218978.96875} {"train_loss": -10.006521224975586, "global_step": 131880, "epoch": 785} {"train_loss": -9.9924898147583, "global_step": 131881, "epoch": 785} {"train_loss": -10.344741821289062, "global_step": 131882, "epoch": 785} {"train_loss": -9.986698150634766, "global_step": 131883, "epoch": 785} {"train_loss": -10.379493713378906, "global_step": 131884, "epoch": 785} {"train_loss": -10.332168579101562, "global_step": 131885, "epoch": 785} {"train_loss": -9.990375518798828, "global_step": 131886, "epoch": 785} {"train_loss": -10.20828628540039, "global_step": 131887, "epoch": 785} {"train_loss": -9.960580825805664, "global_step": 131888, "epoch": 785} {"train_loss": -10.384468078613281, "global_step": 131889, "epoch": 785} {"train_loss": -9.984289169311523, "global_step": 131890, "epoch": 785} {"train_loss": -9.865442276000977, "global_step": 131891, "epoch": 785} {"train_loss": -10.330193519592285, "global_step": 131892, "epoch": 785} {"train_loss": -10.041610717773438, "global_step": 131893, "epoch": 785} {"train_loss": -10.345947265625, "global_step": 131894, "epoch": 785} {"train_loss": -9.51192855834961, "global_step": 131895, "epoch": 785} {"train_loss": -10.321630477905273, "global_step": 131896, "epoch": 785} {"train_loss": -9.017809867858887, "global_step": 131897, "epoch": 785} {"train_loss": -10.432250022888184, "global_step": 131898, "epoch": 785} {"train_loss": -9.256141662597656, "global_step": 131899, "epoch": 785} {"train_loss": -10.475292205810547, "global_step": 131900, "epoch": 785} {"train_loss": -9.203672409057617, "global_step": 131901, "epoch": 785} {"train_loss": -10.179482460021973, "global_step": 131902, "epoch": 785} {"train_loss": -9.455012321472168, "global_step": 131903, "epoch": 785} {"train_loss": -10.234304428100586, "global_step": 131904, "epoch": 785} {"train_loss": -9.883207321166992, "global_step": 131905, "epoch": 785} {"train_loss": -10.027519226074219, "global_step": 131906, "epoch": 785} {"train_loss": -10.100492477416992, "global_step": 131907, "epoch": 785} {"train_loss": -10.304094314575195, "global_step": 131908, "epoch": 785} {"train_loss": -10.267107963562012, "global_step": 131909, "epoch": 785} {"train_loss": -10.242137908935547, "global_step": 131910, "epoch": 785} {"train_loss": -10.417085647583008, "global_step": 131911, "epoch": 785} {"train_loss": -10.203908920288086, "global_step": 131912, "epoch": 785} {"train_loss": -10.431611061096191, "global_step": 131913, "epoch": 785} {"train_loss": -10.209465980529785, "global_step": 131914, "epoch": 785} {"train_loss": -10.37887191772461, "global_step": 131915, "epoch": 785} {"train_loss": -10.361324310302734, "global_step": 131916, "epoch": 785} {"train_loss": -10.456846237182617, "global_step": 131917, "epoch": 785} {"train_loss": -10.297835350036621, "global_step": 131918, "epoch": 785} {"train_loss": -10.393857955932617, "global_step": 131919, "epoch": 785} {"train_loss": -10.652477264404297, "global_step": 131920, "epoch": 785} {"train_loss": -10.22591781616211, "global_step": 131921, "epoch": 785} {"train_loss": -10.500865936279297, "global_step": 131922, "epoch": 785} {"train_loss": -10.32050895690918, "global_step": 131923, "epoch": 785} {"train_loss": -10.638336181640625, "global_step": 131924, "epoch": 785} {"train_loss": -10.500298500061035, "global_step": 131925, "epoch": 785} {"train_loss": -10.519657135009766, "global_step": 131926, "epoch": 785} {"train_loss": -10.35716438293457, "global_step": 131927, "epoch": 785} {"train_loss": -10.718782424926758, "global_step": 131928, "epoch": 785} {"train_loss": -10.321245193481445, "global_step": 131929, "epoch": 785} {"train_loss": -10.620762825012207, "global_step": 131930, "epoch": 785} {"train_loss": -10.367225646972656, "global_step": 131931, "epoch": 785} {"train_loss": -10.452022552490234, "global_step": 131932, "epoch": 785} {"train_loss": -10.73116397857666, "global_step": 131933, "epoch": 785} {"train_loss": -10.653594970703125, "global_step": 131934, "epoch": 785} {"train_loss": -10.608053207397461, "global_step": 131935, "epoch": 785} {"train_loss": -10.431451797485352, "global_step": 131936, "epoch": 785} {"train_loss": -10.778463363647461, "global_step": 131937, "epoch": 785} {"train_loss": -10.54340934753418, "global_step": 131938, "epoch": 785} {"train_loss": -10.577014923095703, "global_step": 131939, "epoch": 785} {"train_loss": -10.839357376098633, "global_step": 131940, "epoch": 785} {"train_loss": -10.360498428344727, "global_step": 131941, "epoch": 785} {"train_loss": -10.359861373901367, "global_step": 131942, "epoch": 785} {"train_loss": -10.891626358032227, "global_step": 131943, "epoch": 785} {"train_loss": -10.618284225463867, "global_step": 131944, "epoch": 785} {"train_loss": -9.848485946655273, "global_step": 131945, "epoch": 785} {"train_loss": -10.591775894165039, "global_step": 131946, "epoch": 785} {"train_loss": -10.287772178649902, "global_step": 131947, "epoch": 785} {"train_loss": -10.570793151855469, "global_step": 131948, "epoch": 785} {"train_loss": -10.585441589355469, "global_step": 131949, "epoch": 785} {"train_loss": -10.448230743408203, "global_step": 131950, "epoch": 785} {"train_loss": -10.619046211242676, "global_step": 131951, "epoch": 785} {"train_loss": -10.57063102722168, "global_step": 131952, "epoch": 785} {"train_loss": -10.336575508117676, "global_step": 131953, "epoch": 785} {"train_loss": -10.378604888916016, "global_step": 131954, "epoch": 785} {"train_loss": -10.07578182220459, "global_step": 131955, "epoch": 785} {"train_loss": -10.36276912689209, "global_step": 131956, "epoch": 785} {"train_loss": -10.223188400268555, "global_step": 131957, "epoch": 785} {"train_loss": -10.03774642944336, "global_step": 131958, "epoch": 785} {"train_loss": -10.59739875793457, "global_step": 131959, "epoch": 785} {"train_loss": -9.663198471069336, "global_step": 131960, "epoch": 785} {"train_loss": -10.178943634033203, "global_step": 131961, "epoch": 785} {"train_loss": -10.347267150878906, "global_step": 131962, "epoch": 785} {"train_loss": -9.942794799804688, "global_step": 131963, "epoch": 785} {"train_loss": -10.531444549560547, "global_step": 131964, "epoch": 785} {"train_loss": -9.86225700378418, "global_step": 131965, "epoch": 785} {"train_loss": -10.610657691955566, "global_step": 131966, "epoch": 785} {"train_loss": -10.112020492553711, "global_step": 131967, "epoch": 785} {"train_loss": -10.270349502563477, "global_step": 131968, "epoch": 785} {"train_loss": -10.114863395690918, "global_step": 131969, "epoch": 785} {"train_loss": -10.132987976074219, "global_step": 131970, "epoch": 785} {"train_loss": -10.741886138916016, "global_step": 131971, "epoch": 785} {"train_loss": -10.323701858520508, "global_step": 131972, "epoch": 785} {"train_loss": -10.42410659790039, "global_step": 131973, "epoch": 785} {"train_loss": -10.507242202758789, "global_step": 131974, "epoch": 785} {"train_loss": -10.594914436340332, "global_step": 131975, "epoch": 785} {"train_loss": -10.320268630981445, "global_step": 131976, "epoch": 785} {"train_loss": -10.561103820800781, "global_step": 131977, "epoch": 785} {"train_loss": -10.262887954711914, "global_step": 131978, "epoch": 785} {"train_loss": -10.54578971862793, "global_step": 131979, "epoch": 785} {"train_loss": -10.42917537689209, "global_step": 131980, "epoch": 785} {"train_loss": -10.179941177368164, "global_step": 131981, "epoch": 785} {"train_loss": -10.55949592590332, "global_step": 131982, "epoch": 785} {"train_loss": -10.501398086547852, "global_step": 131983, "epoch": 785} {"train_loss": -10.37905216217041, "global_step": 131984, "epoch": 785} {"train_loss": -10.56928539276123, "global_step": 131985, "epoch": 785} {"train_loss": -10.43753719329834, "global_step": 131986, "epoch": 785} {"train_loss": -10.680900573730469, "global_step": 131987, "epoch": 785} {"train_loss": -10.037860870361328, "global_step": 131988, "epoch": 785} {"train_loss": -10.404703140258789, "global_step": 131989, "epoch": 785} {"train_loss": -10.528909683227539, "global_step": 131990, "epoch": 785} {"train_loss": -10.421337127685547, "global_step": 131991, "epoch": 785} {"train_loss": -10.751768112182617, "global_step": 131992, "epoch": 785} {"train_loss": -10.483662605285645, "global_step": 131993, "epoch": 785} {"train_loss": -10.643922805786133, "global_step": 131994, "epoch": 785} {"train_loss": -10.267902374267578, "global_step": 131995, "epoch": 785} {"train_loss": -10.493551254272461, "global_step": 131996, "epoch": 785} {"train_loss": -10.399984359741211, "global_step": 131997, "epoch": 785} {"train_loss": -10.562424659729004, "global_step": 131998, "epoch": 785} {"train_loss": -10.601703643798828, "global_step": 131999, "epoch": 785} {"train_loss": -10.417285919189453, "global_step": 132000, "epoch": 785} {"train_loss": -10.459821701049805, "global_step": 132001, "epoch": 785} {"train_loss": -10.303983688354492, "global_step": 132002, "epoch": 785} {"train_loss": -10.561843872070312, "global_step": 132003, "epoch": 785} {"train_loss": -10.314494132995605, "global_step": 132004, "epoch": 785} {"train_loss": -10.243907928466797, "global_step": 132005, "epoch": 785} {"train_loss": -10.524642944335938, "global_step": 132006, "epoch": 785} {"train_loss": -10.23359489440918, "global_step": 132007, "epoch": 785} {"train_loss": -10.721978187561035, "global_step": 132008, "epoch": 785} {"train_loss": -10.320068359375, "global_step": 132009, "epoch": 785} {"train_loss": -10.651302337646484, "global_step": 132010, "epoch": 785} {"train_loss": -10.268787384033203, "global_step": 132011, "epoch": 785} {"train_loss": -10.39223861694336, "global_step": 132012, "epoch": 785} {"train_loss": -10.435583114624023, "global_step": 132013, "epoch": 785} {"train_loss": -10.460559844970703, "global_step": 132014, "epoch": 785} {"train_loss": -10.727460861206055, "global_step": 132015, "epoch": 785} {"train_loss": -10.603506088256836, "global_step": 132016, "epoch": 785} {"train_loss": -10.689785957336426, "global_step": 132017, "epoch": 785} {"train_loss": -10.652225494384766, "global_step": 132018, "epoch": 785} {"train_loss": -10.487030029296875, "global_step": 132019, "epoch": 785} {"train_loss": -10.59119987487793, "global_step": 132020, "epoch": 785} {"train_loss": -10.482263565063477, "global_step": 132021, "epoch": 785} {"train_loss": -10.52486801147461, "global_step": 132022, "epoch": 785} {"train_loss": -10.516717910766602, "global_step": 132023, "epoch": 785} {"train_loss": -10.73179817199707, "global_step": 132024, "epoch": 785} {"train_loss": -10.738758087158203, "global_step": 132025, "epoch": 785} {"train_loss": -10.517816543579102, "global_step": 132026, "epoch": 785} {"train_loss": -10.121071815490723, "global_step": 132027, "epoch": 785} {"train_loss": -9.872468948364258, "global_step": 132028, "epoch": 785} {"train_loss": -10.309898376464844, "global_step": 132029, "epoch": 785} {"train_loss": -9.225194931030273, "global_step": 132030, "epoch": 785} {"train_loss": -10.316401481628418, "global_step": 132031, "epoch": 785} {"train_loss": -9.908288955688477, "global_step": 132032, "epoch": 785} {"train_loss": -10.160648345947266, "global_step": 132033, "epoch": 785} {"train_loss": -10.162909507751465, "global_step": 132034, "epoch": 785} {"train_loss": -10.36846923828125, "global_step": 132035, "epoch": 785} {"train_loss": -9.916505813598633, "global_step": 132036, "epoch": 785} {"train_loss": -9.904509544372559, "global_step": 132037, "epoch": 785} {"train_loss": -10.411123275756836, "global_step": 132038, "epoch": 785} {"train_loss": -9.886998176574707, "global_step": 132039, "epoch": 785} {"train_loss": -9.966961860656738, "global_step": 132040, "epoch": 785} {"train_loss": -10.250614166259766, "global_step": 132041, "epoch": 785} {"train_loss": -10.0562162399292, "global_step": 132042, "epoch": 785} {"train_loss": -9.787264823913574, "global_step": 132043, "epoch": 785} {"train_loss": -9.910775184631348, "global_step": 132044, "epoch": 785} {"train_loss": -9.912052154541016, "global_step": 132045, "epoch": 785} {"train_loss": -10.28089714050293, "global_step": 132046, "epoch": 785} {"train_loss": -10.312214062327431, "global_step": 132047, "epoch": 785, "val_loss": 218788.46875, "train_action_mse_error": 6.291531085968018} {"train_loss": -9.601078987121582, "global_step": 132048, "epoch": 786} {"train_loss": -9.83392333984375, "global_step": 132049, "epoch": 786} {"train_loss": -9.899015426635742, "global_step": 132050, "epoch": 786} {"train_loss": -9.785518646240234, "global_step": 132051, "epoch": 786} {"train_loss": -9.998688697814941, "global_step": 132052, "epoch": 786} {"train_loss": -9.794361114501953, "global_step": 132053, "epoch": 786} {"train_loss": -9.857218742370605, "global_step": 132054, "epoch": 786} {"train_loss": -10.339078903198242, "global_step": 132055, "epoch": 786} {"train_loss": -10.026270866394043, "global_step": 132056, "epoch": 786} {"train_loss": -10.412373542785645, "global_step": 132057, "epoch": 786} {"train_loss": -10.27944564819336, "global_step": 132058, "epoch": 786} {"train_loss": -10.186800956726074, "global_step": 132059, "epoch": 786} {"train_loss": -10.243940353393555, "global_step": 132060, "epoch": 786} {"train_loss": -10.099562644958496, "global_step": 132061, "epoch": 786} {"train_loss": -10.150890350341797, "global_step": 132062, "epoch": 786} {"train_loss": -10.351093292236328, "global_step": 132063, "epoch": 786} {"train_loss": -10.405206680297852, "global_step": 132064, "epoch": 786} {"train_loss": -10.436466217041016, "global_step": 132065, "epoch": 786} {"train_loss": -10.365997314453125, "global_step": 132066, "epoch": 786} {"train_loss": -10.344156265258789, "global_step": 132067, "epoch": 786} {"train_loss": -10.320908546447754, "global_step": 132068, "epoch": 786} {"train_loss": -10.575521469116211, "global_step": 132069, "epoch": 786} {"train_loss": -10.508153915405273, "global_step": 132070, "epoch": 786} {"train_loss": -10.598177909851074, "global_step": 132071, "epoch": 786} {"train_loss": -10.76795768737793, "global_step": 132072, "epoch": 786} {"train_loss": -10.483305931091309, "global_step": 132073, "epoch": 786} {"train_loss": -10.494365692138672, "global_step": 132074, "epoch": 786} {"train_loss": -10.735442161560059, "global_step": 132075, "epoch": 786} {"train_loss": -10.486732482910156, "global_step": 132076, "epoch": 786} {"train_loss": -10.531129837036133, "global_step": 132077, "epoch": 786} {"train_loss": -10.526823043823242, "global_step": 132078, "epoch": 786} {"train_loss": -10.552845001220703, "global_step": 132079, "epoch": 786} {"train_loss": -10.59710693359375, "global_step": 132080, "epoch": 786} {"train_loss": -10.484258651733398, "global_step": 132081, "epoch": 786} {"train_loss": -10.549038887023926, "global_step": 132082, "epoch": 786} {"train_loss": -10.658699035644531, "global_step": 132083, "epoch": 786} {"train_loss": -10.294793128967285, "global_step": 132084, "epoch": 786} {"train_loss": -10.542097091674805, "global_step": 132085, "epoch": 786} {"train_loss": -10.692867279052734, "global_step": 132086, "epoch": 786} {"train_loss": -10.416875839233398, "global_step": 132087, "epoch": 786} {"train_loss": -10.734786987304688, "global_step": 132088, "epoch": 786} {"train_loss": -10.382518768310547, "global_step": 132089, "epoch": 786} {"train_loss": -10.781850814819336, "global_step": 132090, "epoch": 786} {"train_loss": -10.455926895141602, "global_step": 132091, "epoch": 786} {"train_loss": -10.285587310791016, "global_step": 132092, "epoch": 786} {"train_loss": -10.54647159576416, "global_step": 132093, "epoch": 786} {"train_loss": -10.162494659423828, "global_step": 132094, "epoch": 786} {"train_loss": -10.433782577514648, "global_step": 132095, "epoch": 786} {"train_loss": -10.371681213378906, "global_step": 132096, "epoch": 786} {"train_loss": -10.080936431884766, "global_step": 132097, "epoch": 786} {"train_loss": -10.23246955871582, "global_step": 132098, "epoch": 786} {"train_loss": -10.66807746887207, "global_step": 132099, "epoch": 786} {"train_loss": -10.335823059082031, "global_step": 132100, "epoch": 786} {"train_loss": -10.704916954040527, "global_step": 132101, "epoch": 786} {"train_loss": -10.541997909545898, "global_step": 132102, "epoch": 786} {"train_loss": -10.409423828125, "global_step": 132103, "epoch": 786} {"train_loss": -10.363931655883789, "global_step": 132104, "epoch": 786} {"train_loss": -9.987222671508789, "global_step": 132105, "epoch": 786} {"train_loss": -10.662708282470703, "global_step": 132106, "epoch": 786} {"train_loss": -10.233556747436523, "global_step": 132107, "epoch": 786} {"train_loss": -10.36605453491211, "global_step": 132108, "epoch": 786} {"train_loss": -10.43001937866211, "global_step": 132109, "epoch": 786} {"train_loss": -9.990152359008789, "global_step": 132110, "epoch": 786} {"train_loss": -10.254985809326172, "global_step": 132111, "epoch": 786} {"train_loss": -10.25658893585205, "global_step": 132112, "epoch": 786} {"train_loss": -10.347894668579102, "global_step": 132113, "epoch": 786} {"train_loss": -10.270803451538086, "global_step": 132114, "epoch": 786} {"train_loss": -10.422499656677246, "global_step": 132115, "epoch": 786} {"train_loss": -10.606258392333984, "global_step": 132116, "epoch": 786} {"train_loss": -10.489446640014648, "global_step": 132117, "epoch": 786} {"train_loss": -10.383031845092773, "global_step": 132118, "epoch": 786} {"train_loss": -10.4494047164917, "global_step": 132119, "epoch": 786} {"train_loss": -10.39906120300293, "global_step": 132120, "epoch": 786} {"train_loss": -10.62910270690918, "global_step": 132121, "epoch": 786} {"train_loss": -10.592637062072754, "global_step": 132122, "epoch": 786} {"train_loss": -10.474239349365234, "global_step": 132123, "epoch": 786} {"train_loss": -10.173322677612305, "global_step": 132124, "epoch": 786} {"train_loss": -10.260494232177734, "global_step": 132125, "epoch": 786} {"train_loss": -10.426533699035645, "global_step": 132126, "epoch": 786} {"train_loss": -10.426777839660645, "global_step": 132127, "epoch": 786} {"train_loss": -10.57087230682373, "global_step": 132128, "epoch": 786} {"train_loss": -9.921306610107422, "global_step": 132129, "epoch": 786} {"train_loss": -10.633216857910156, "global_step": 132130, "epoch": 786} {"train_loss": -10.10800552368164, "global_step": 132131, "epoch": 786} {"train_loss": -10.41404914855957, "global_step": 132132, "epoch": 786} {"train_loss": -10.06119441986084, "global_step": 132133, "epoch": 786} {"train_loss": -10.336742401123047, "global_step": 132134, "epoch": 786} {"train_loss": -10.439398765563965, "global_step": 132135, "epoch": 786} {"train_loss": -10.023648262023926, "global_step": 132136, "epoch": 786} {"train_loss": -10.566842079162598, "global_step": 132137, "epoch": 786} {"train_loss": -10.348726272583008, "global_step": 132138, "epoch": 786} {"train_loss": -10.224674224853516, "global_step": 132139, "epoch": 786} {"train_loss": -10.142126083374023, "global_step": 132140, "epoch": 786} {"train_loss": -10.33750057220459, "global_step": 132141, "epoch": 786} {"train_loss": -10.537972450256348, "global_step": 132142, "epoch": 786} {"train_loss": -10.121725082397461, "global_step": 132143, "epoch": 786} {"train_loss": -10.415715217590332, "global_step": 132144, "epoch": 786} {"train_loss": -10.59956169128418, "global_step": 132145, "epoch": 786} {"train_loss": -10.119366645812988, "global_step": 132146, "epoch": 786} {"train_loss": -10.524614334106445, "global_step": 132147, "epoch": 786} {"train_loss": -10.182356834411621, "global_step": 132148, "epoch": 786} {"train_loss": -10.330941200256348, "global_step": 132149, "epoch": 786} {"train_loss": -10.402182579040527, "global_step": 132150, "epoch": 786} {"train_loss": -9.90609359741211, "global_step": 132151, "epoch": 786} {"train_loss": -10.489616394042969, "global_step": 132152, "epoch": 786} {"train_loss": -9.818638801574707, "global_step": 132153, "epoch": 786} {"train_loss": -10.02003002166748, "global_step": 132154, "epoch": 786} {"train_loss": -9.441915512084961, "global_step": 132155, "epoch": 786} {"train_loss": -10.52311897277832, "global_step": 132156, "epoch": 786} {"train_loss": -10.146751403808594, "global_step": 132157, "epoch": 786} {"train_loss": -9.553308486938477, "global_step": 132158, "epoch": 786} {"train_loss": -10.327126502990723, "global_step": 132159, "epoch": 786} {"train_loss": -9.76399040222168, "global_step": 132160, "epoch": 786} {"train_loss": -9.99631118774414, "global_step": 132161, "epoch": 786} {"train_loss": -10.56972885131836, "global_step": 132162, "epoch": 786} {"train_loss": -10.24010944366455, "global_step": 132163, "epoch": 786} {"train_loss": -10.327126502990723, "global_step": 132164, "epoch": 786} {"train_loss": -10.11145305633545, "global_step": 132165, "epoch": 786} {"train_loss": -10.162012100219727, "global_step": 132166, "epoch": 786} {"train_loss": -10.228419303894043, "global_step": 132167, "epoch": 786} {"train_loss": -10.267139434814453, "global_step": 132168, "epoch": 786} {"train_loss": -10.152621269226074, "global_step": 132169, "epoch": 786} {"train_loss": -10.370397567749023, "global_step": 132170, "epoch": 786} {"train_loss": -9.927042007446289, "global_step": 132171, "epoch": 786} {"train_loss": -10.301835060119629, "global_step": 132172, "epoch": 786} {"train_loss": -10.23588752746582, "global_step": 132173, "epoch": 786} {"train_loss": -10.120970726013184, "global_step": 132174, "epoch": 786} {"train_loss": -10.44810676574707, "global_step": 132175, "epoch": 786} {"train_loss": -10.110450744628906, "global_step": 132176, "epoch": 786} {"train_loss": -10.139249801635742, "global_step": 132177, "epoch": 786} {"train_loss": -10.49389362335205, "global_step": 132178, "epoch": 786} {"train_loss": -10.431344985961914, "global_step": 132179, "epoch": 786} {"train_loss": -10.232053756713867, "global_step": 132180, "epoch": 786} {"train_loss": -10.498893737792969, "global_step": 132181, "epoch": 786} {"train_loss": -10.068107604980469, "global_step": 132182, "epoch": 786} {"train_loss": -10.282422065734863, "global_step": 132183, "epoch": 786} {"train_loss": -10.386358261108398, "global_step": 132184, "epoch": 786} {"train_loss": -10.17872428894043, "global_step": 132185, "epoch": 786} {"train_loss": -10.140828132629395, "global_step": 132186, "epoch": 786} {"train_loss": -10.427446365356445, "global_step": 132187, "epoch": 786} {"train_loss": -10.258735656738281, "global_step": 132188, "epoch": 786} {"train_loss": -10.224851608276367, "global_step": 132189, "epoch": 786} {"train_loss": -10.249961853027344, "global_step": 132190, "epoch": 786} {"train_loss": -10.074396133422852, "global_step": 132191, "epoch": 786} {"train_loss": -10.131707191467285, "global_step": 132192, "epoch": 786} {"train_loss": -10.217445373535156, "global_step": 132193, "epoch": 786} {"train_loss": -10.181350708007812, "global_step": 132194, "epoch": 786} {"train_loss": -10.3086519241333, "global_step": 132195, "epoch": 786} {"train_loss": -10.322021484375, "global_step": 132196, "epoch": 786} {"train_loss": -10.40385627746582, "global_step": 132197, "epoch": 786} {"train_loss": -10.469579696655273, "global_step": 132198, "epoch": 786} {"train_loss": -10.478741645812988, "global_step": 132199, "epoch": 786} {"train_loss": -10.311891555786133, "global_step": 132200, "epoch": 786} {"train_loss": -10.586435317993164, "global_step": 132201, "epoch": 786} {"train_loss": -10.458170890808105, "global_step": 132202, "epoch": 786} {"train_loss": -10.518078804016113, "global_step": 132203, "epoch": 786} {"train_loss": -10.66224479675293, "global_step": 132204, "epoch": 786} {"train_loss": -10.612143516540527, "global_step": 132205, "epoch": 786} {"train_loss": -10.526247024536133, "global_step": 132206, "epoch": 786} {"train_loss": -10.54229736328125, "global_step": 132207, "epoch": 786} {"train_loss": -10.34167766571045, "global_step": 132208, "epoch": 786} {"train_loss": -10.32768440246582, "global_step": 132209, "epoch": 786} {"train_loss": -10.413946151733398, "global_step": 132210, "epoch": 786} {"train_loss": -10.500239372253418, "global_step": 132211, "epoch": 786} {"train_loss": -10.440908432006836, "global_step": 132212, "epoch": 786} {"train_loss": -10.434083938598633, "global_step": 132213, "epoch": 786} {"train_loss": -10.664188385009766, "global_step": 132214, "epoch": 786} {"train_loss": -10.324526610828581, "global_step": 132215, "epoch": 786, "val_loss": 222488.28125} {"train_loss": -10.578222274780273, "global_step": 132216, "epoch": 787} {"train_loss": -10.337835311889648, "global_step": 132217, "epoch": 787} {"train_loss": -10.535189628601074, "global_step": 132218, "epoch": 787} {"train_loss": -10.411171913146973, "global_step": 132219, "epoch": 787} {"train_loss": -10.160665512084961, "global_step": 132220, "epoch": 787} {"train_loss": -10.685646057128906, "global_step": 132221, "epoch": 787} {"train_loss": -10.230398178100586, "global_step": 132222, "epoch": 787} {"train_loss": -9.959550857543945, "global_step": 132223, "epoch": 787} {"train_loss": -10.497391700744629, "global_step": 132224, "epoch": 787} {"train_loss": -10.138371467590332, "global_step": 132225, "epoch": 787} {"train_loss": -10.110904693603516, "global_step": 132226, "epoch": 787} {"train_loss": -10.387173652648926, "global_step": 132227, "epoch": 787} {"train_loss": -9.568086624145508, "global_step": 132228, "epoch": 787} {"train_loss": -10.52173900604248, "global_step": 132229, "epoch": 787} {"train_loss": -8.819154739379883, "global_step": 132230, "epoch": 787} {"train_loss": -10.222400665283203, "global_step": 132231, "epoch": 787} {"train_loss": -10.174158096313477, "global_step": 132232, "epoch": 787} {"train_loss": -9.90527057647705, "global_step": 132233, "epoch": 787} {"train_loss": -10.39074993133545, "global_step": 132234, "epoch": 787} {"train_loss": -9.201635360717773, "global_step": 132235, "epoch": 787} {"train_loss": -10.200432777404785, "global_step": 132236, "epoch": 787} {"train_loss": -9.598071098327637, "global_step": 132237, "epoch": 787} {"train_loss": -10.211616516113281, "global_step": 132238, "epoch": 787} {"train_loss": -9.936616897583008, "global_step": 132239, "epoch": 787} {"train_loss": -10.237896919250488, "global_step": 132240, "epoch": 787} {"train_loss": -9.782278060913086, "global_step": 132241, "epoch": 787} {"train_loss": -10.289742469787598, "global_step": 132242, "epoch": 787} {"train_loss": -10.237743377685547, "global_step": 132243, "epoch": 787} {"train_loss": -10.215326309204102, "global_step": 132244, "epoch": 787} {"train_loss": -10.527021408081055, "global_step": 132245, "epoch": 787} {"train_loss": -10.218558311462402, "global_step": 132246, "epoch": 787} {"train_loss": -10.471723556518555, "global_step": 132247, "epoch": 787} {"train_loss": -10.275127410888672, "global_step": 132248, "epoch": 787} {"train_loss": -10.189779281616211, "global_step": 132249, "epoch": 787} {"train_loss": -10.451486587524414, "global_step": 132250, "epoch": 787} {"train_loss": -10.388687133789062, "global_step": 132251, "epoch": 787} {"train_loss": -10.395309448242188, "global_step": 132252, "epoch": 787} {"train_loss": -10.464546203613281, "global_step": 132253, "epoch": 787} {"train_loss": -10.167095184326172, "global_step": 132254, "epoch": 787} {"train_loss": -10.551546096801758, "global_step": 132255, "epoch": 787} {"train_loss": -10.337458610534668, "global_step": 132256, "epoch": 787} {"train_loss": -10.705131530761719, "global_step": 132257, "epoch": 787} {"train_loss": -10.27745532989502, "global_step": 132258, "epoch": 787} {"train_loss": -10.440649032592773, "global_step": 132259, "epoch": 787} {"train_loss": -10.359786987304688, "global_step": 132260, "epoch": 787} {"train_loss": -10.511978149414062, "global_step": 132261, "epoch": 787} {"train_loss": -10.451101303100586, "global_step": 132262, "epoch": 787} {"train_loss": -10.376388549804688, "global_step": 132263, "epoch": 787} {"train_loss": -10.559930801391602, "global_step": 132264, "epoch": 787} {"train_loss": -10.450044631958008, "global_step": 132265, "epoch": 787} {"train_loss": -10.473062515258789, "global_step": 132266, "epoch": 787} {"train_loss": -10.633722305297852, "global_step": 132267, "epoch": 787} {"train_loss": -10.793477058410645, "global_step": 132268, "epoch": 787} {"train_loss": -10.557825088500977, "global_step": 132269, "epoch": 787} {"train_loss": -10.478120803833008, "global_step": 132270, "epoch": 787} {"train_loss": -10.514789581298828, "global_step": 132271, "epoch": 787} {"train_loss": -10.619539260864258, "global_step": 132272, "epoch": 787} {"train_loss": -10.667337417602539, "global_step": 132273, "epoch": 787} {"train_loss": -10.30293083190918, "global_step": 132274, "epoch": 787} {"train_loss": -10.726909637451172, "global_step": 132275, "epoch": 787} {"train_loss": -10.467204093933105, "global_step": 132276, "epoch": 787} {"train_loss": -10.232934951782227, "global_step": 132277, "epoch": 787} {"train_loss": -10.471385955810547, "global_step": 132278, "epoch": 787} {"train_loss": -10.66425895690918, "global_step": 132279, "epoch": 787} {"train_loss": -10.484914779663086, "global_step": 132280, "epoch": 787} {"train_loss": -10.697373390197754, "global_step": 132281, "epoch": 787} {"train_loss": -10.743149757385254, "global_step": 132282, "epoch": 787} {"train_loss": -10.541043281555176, "global_step": 132283, "epoch": 787} {"train_loss": -10.71037483215332, "global_step": 132284, "epoch": 787} {"train_loss": -10.84185791015625, "global_step": 132285, "epoch": 787} {"train_loss": -10.57744312286377, "global_step": 132286, "epoch": 787} {"train_loss": -10.510069847106934, "global_step": 132287, "epoch": 787} {"train_loss": -10.511198997497559, "global_step": 132288, "epoch": 787} {"train_loss": -10.622705459594727, "global_step": 132289, "epoch": 787} {"train_loss": -10.349319458007812, "global_step": 132290, "epoch": 787} {"train_loss": -10.248008728027344, "global_step": 132291, "epoch": 787} {"train_loss": -10.561717987060547, "global_step": 132292, "epoch": 787} {"train_loss": -10.159772872924805, "global_step": 132293, "epoch": 787} {"train_loss": -10.553972244262695, "global_step": 132294, "epoch": 787} {"train_loss": -10.466389656066895, "global_step": 132295, "epoch": 787} {"train_loss": -10.608439445495605, "global_step": 132296, "epoch": 787} {"train_loss": -10.428342819213867, "global_step": 132297, "epoch": 787} {"train_loss": -10.44161605834961, "global_step": 132298, "epoch": 787} {"train_loss": -10.429697036743164, "global_step": 132299, "epoch": 787} {"train_loss": -10.541327476501465, "global_step": 132300, "epoch": 787} {"train_loss": -10.239396095275879, "global_step": 132301, "epoch": 787} {"train_loss": -10.718755722045898, "global_step": 132302, "epoch": 787} {"train_loss": -10.443275451660156, "global_step": 132303, "epoch": 787} {"train_loss": -10.416149139404297, "global_step": 132304, "epoch": 787} {"train_loss": -10.220900535583496, "global_step": 132305, "epoch": 787} {"train_loss": -10.57742691040039, "global_step": 132306, "epoch": 787} {"train_loss": -10.352455139160156, "global_step": 132307, "epoch": 787} {"train_loss": -10.609838485717773, "global_step": 132308, "epoch": 787} {"train_loss": -10.554000854492188, "global_step": 132309, "epoch": 787} {"train_loss": -10.673789978027344, "global_step": 132310, "epoch": 787} {"train_loss": -10.606742858886719, "global_step": 132311, "epoch": 787} {"train_loss": -10.610260963439941, "global_step": 132312, "epoch": 787} {"train_loss": -10.57562255859375, "global_step": 132313, "epoch": 787} {"train_loss": -10.74217700958252, "global_step": 132314, "epoch": 787} {"train_loss": -10.421833992004395, "global_step": 132315, "epoch": 787} {"train_loss": -10.832717895507812, "global_step": 132316, "epoch": 787} {"train_loss": -10.74820613861084, "global_step": 132317, "epoch": 787} {"train_loss": -10.791955947875977, "global_step": 132318, "epoch": 787} {"train_loss": -10.652639389038086, "global_step": 132319, "epoch": 787} {"train_loss": -10.536809921264648, "global_step": 132320, "epoch": 787} {"train_loss": -10.549028396606445, "global_step": 132321, "epoch": 787} {"train_loss": -10.483626365661621, "global_step": 132322, "epoch": 787} {"train_loss": -10.447198867797852, "global_step": 132323, "epoch": 787} {"train_loss": -10.473971366882324, "global_step": 132324, "epoch": 787} {"train_loss": -10.395227432250977, "global_step": 132325, "epoch": 787} {"train_loss": -10.839058876037598, "global_step": 132326, "epoch": 787} {"train_loss": -10.47326946258545, "global_step": 132327, "epoch": 787} {"train_loss": -10.280888557434082, "global_step": 132328, "epoch": 787} {"train_loss": -10.221317291259766, "global_step": 132329, "epoch": 787} {"train_loss": -9.83285140991211, "global_step": 132330, "epoch": 787} {"train_loss": -10.116159439086914, "global_step": 132331, "epoch": 787} {"train_loss": -10.094407081604004, "global_step": 132332, "epoch": 787} {"train_loss": -9.691556930541992, "global_step": 132333, "epoch": 787} {"train_loss": -9.863036155700684, "global_step": 132334, "epoch": 787} {"train_loss": -9.454742431640625, "global_step": 132335, "epoch": 787} {"train_loss": -9.260125160217285, "global_step": 132336, "epoch": 787} {"train_loss": -9.484430313110352, "global_step": 132337, "epoch": 787} {"train_loss": -8.937887191772461, "global_step": 132338, "epoch": 787} {"train_loss": -9.678559303283691, "global_step": 132339, "epoch": 787} {"train_loss": -9.474581718444824, "global_step": 132340, "epoch": 787} {"train_loss": -9.205777168273926, "global_step": 132341, "epoch": 787} {"train_loss": -9.676288604736328, "global_step": 132342, "epoch": 787} {"train_loss": -9.792842864990234, "global_step": 132343, "epoch": 787} {"train_loss": -9.204511642456055, "global_step": 132344, "epoch": 787} {"train_loss": -9.527796745300293, "global_step": 132345, "epoch": 787} {"train_loss": -9.976911544799805, "global_step": 132346, "epoch": 787} {"train_loss": -9.782498359680176, "global_step": 132347, "epoch": 787} {"train_loss": -9.966059684753418, "global_step": 132348, "epoch": 787} {"train_loss": -9.860774993896484, "global_step": 132349, "epoch": 787} {"train_loss": -9.801290512084961, "global_step": 132350, "epoch": 787} {"train_loss": -9.82642936706543, "global_step": 132351, "epoch": 787} {"train_loss": -9.901346206665039, "global_step": 132352, "epoch": 787} {"train_loss": -10.176057815551758, "global_step": 132353, "epoch": 787} {"train_loss": -10.108440399169922, "global_step": 132354, "epoch": 787} {"train_loss": -10.267984390258789, "global_step": 132355, "epoch": 787} {"train_loss": -10.251001358032227, "global_step": 132356, "epoch": 787} {"train_loss": -9.949884414672852, "global_step": 132357, "epoch": 787} {"train_loss": -10.375694274902344, "global_step": 132358, "epoch": 787} {"train_loss": -10.057764053344727, "global_step": 132359, "epoch": 787} {"train_loss": -10.245321273803711, "global_step": 132360, "epoch": 787} {"train_loss": -10.08237075805664, "global_step": 132361, "epoch": 787} {"train_loss": -10.18336296081543, "global_step": 132362, "epoch": 787} {"train_loss": -10.35848617553711, "global_step": 132363, "epoch": 787} {"train_loss": -10.484270095825195, "global_step": 132364, "epoch": 787} {"train_loss": -10.373016357421875, "global_step": 132365, "epoch": 787} {"train_loss": -10.222046852111816, "global_step": 132366, "epoch": 787} {"train_loss": -10.304883003234863, "global_step": 132367, "epoch": 787} {"train_loss": -10.361322402954102, "global_step": 132368, "epoch": 787} {"train_loss": -10.443115234375, "global_step": 132369, "epoch": 787} {"train_loss": -10.319565773010254, "global_step": 132370, "epoch": 787} {"train_loss": -10.436463356018066, "global_step": 132371, "epoch": 787} {"train_loss": -10.425593376159668, "global_step": 132372, "epoch": 787} {"train_loss": -10.40034294128418, "global_step": 132373, "epoch": 787} {"train_loss": -10.402504920959473, "global_step": 132374, "epoch": 787} {"train_loss": -10.41836929321289, "global_step": 132375, "epoch": 787} {"train_loss": -10.507428169250488, "global_step": 132376, "epoch": 787} {"train_loss": -10.539203643798828, "global_step": 132377, "epoch": 787} {"train_loss": -10.42480754852295, "global_step": 132378, "epoch": 787} {"train_loss": -10.455875396728516, "global_step": 132379, "epoch": 787} {"train_loss": -10.567837715148926, "global_step": 132380, "epoch": 787} {"train_loss": -10.469259262084961, "global_step": 132381, "epoch": 787} {"train_loss": -10.476089477539062, "global_step": 132382, "epoch": 787} {"train_loss": -10.293590369678679, "global_step": 132383, "epoch": 787, "val_loss": 221866.34375} {"train_loss": -10.567024230957031, "global_step": 132384, "epoch": 788} {"train_loss": -10.638565063476562, "global_step": 132385, "epoch": 788} {"train_loss": -10.460925102233887, "global_step": 132386, "epoch": 788} {"train_loss": -10.573182106018066, "global_step": 132387, "epoch": 788} {"train_loss": -10.309926986694336, "global_step": 132388, "epoch": 788} {"train_loss": -10.784067153930664, "global_step": 132389, "epoch": 788} {"train_loss": -10.70242977142334, "global_step": 132390, "epoch": 788} {"train_loss": -10.42202091217041, "global_step": 132391, "epoch": 788} {"train_loss": -10.864086151123047, "global_step": 132392, "epoch": 788} {"train_loss": -10.405731201171875, "global_step": 132393, "epoch": 788} {"train_loss": -10.362552642822266, "global_step": 132394, "epoch": 788} {"train_loss": -10.641951560974121, "global_step": 132395, "epoch": 788} {"train_loss": -10.316460609436035, "global_step": 132396, "epoch": 788} {"train_loss": -10.463146209716797, "global_step": 132397, "epoch": 788} {"train_loss": -10.297277450561523, "global_step": 132398, "epoch": 788} {"train_loss": -10.536069869995117, "global_step": 132399, "epoch": 788} {"train_loss": -10.443374633789062, "global_step": 132400, "epoch": 788} {"train_loss": -10.36363410949707, "global_step": 132401, "epoch": 788} {"train_loss": -10.770243644714355, "global_step": 132402, "epoch": 788} {"train_loss": -10.503772735595703, "global_step": 132403, "epoch": 788} {"train_loss": -10.492725372314453, "global_step": 132404, "epoch": 788} {"train_loss": -10.404220581054688, "global_step": 132405, "epoch": 788} {"train_loss": -9.919332504272461, "global_step": 132406, "epoch": 788} {"train_loss": -10.590734481811523, "global_step": 132407, "epoch": 788} {"train_loss": -9.973990440368652, "global_step": 132408, "epoch": 788} {"train_loss": -9.70307731628418, "global_step": 132409, "epoch": 788} {"train_loss": -10.353347778320312, "global_step": 132410, "epoch": 788} {"train_loss": -9.966604232788086, "global_step": 132411, "epoch": 788} {"train_loss": -9.245540618896484, "global_step": 132412, "epoch": 788} {"train_loss": -10.28990650177002, "global_step": 132413, "epoch": 788} {"train_loss": -9.813918113708496, "global_step": 132414, "epoch": 788} {"train_loss": -10.334846496582031, "global_step": 132415, "epoch": 788} {"train_loss": -9.98985481262207, "global_step": 132416, "epoch": 788} {"train_loss": -9.852794647216797, "global_step": 132417, "epoch": 788} {"train_loss": -10.23782730102539, "global_step": 132418, "epoch": 788} {"train_loss": -9.998897552490234, "global_step": 132419, "epoch": 788} {"train_loss": -10.308231353759766, "global_step": 132420, "epoch": 788} {"train_loss": -9.833524703979492, "global_step": 132421, "epoch": 788} {"train_loss": -10.201706886291504, "global_step": 132422, "epoch": 788} {"train_loss": -9.81466293334961, "global_step": 132423, "epoch": 788} {"train_loss": -9.88076400756836, "global_step": 132424, "epoch": 788} {"train_loss": -9.980754852294922, "global_step": 132425, "epoch": 788} {"train_loss": -10.395367622375488, "global_step": 132426, "epoch": 788} {"train_loss": -9.917831420898438, "global_step": 132427, "epoch": 788} {"train_loss": -10.202375411987305, "global_step": 132428, "epoch": 788} {"train_loss": -10.126628875732422, "global_step": 132429, "epoch": 788} {"train_loss": -10.033573150634766, "global_step": 132430, "epoch": 788} {"train_loss": -10.221612930297852, "global_step": 132431, "epoch": 788} {"train_loss": -10.35818862915039, "global_step": 132432, "epoch": 788} {"train_loss": -10.026596069335938, "global_step": 132433, "epoch": 788} {"train_loss": -10.599834442138672, "global_step": 132434, "epoch": 788} {"train_loss": -10.367780685424805, "global_step": 132435, "epoch": 788} {"train_loss": -10.381970405578613, "global_step": 132436, "epoch": 788} {"train_loss": -10.564414978027344, "global_step": 132437, "epoch": 788} {"train_loss": -10.570915222167969, "global_step": 132438, "epoch": 788} {"train_loss": -10.486736297607422, "global_step": 132439, "epoch": 788} {"train_loss": -10.35673713684082, "global_step": 132440, "epoch": 788} {"train_loss": -10.295736312866211, "global_step": 132441, "epoch": 788} {"train_loss": -10.50167179107666, "global_step": 132442, "epoch": 788} {"train_loss": -10.469050407409668, "global_step": 132443, "epoch": 788} {"train_loss": -10.701738357543945, "global_step": 132444, "epoch": 788} {"train_loss": -10.41678237915039, "global_step": 132445, "epoch": 788} {"train_loss": -10.45437240600586, "global_step": 132446, "epoch": 788} {"train_loss": -10.447959899902344, "global_step": 132447, "epoch": 788} {"train_loss": -10.479958534240723, "global_step": 132448, "epoch": 788} {"train_loss": -10.276702880859375, "global_step": 132449, "epoch": 788} {"train_loss": -10.429625511169434, "global_step": 132450, "epoch": 788} {"train_loss": -10.329793930053711, "global_step": 132451, "epoch": 788} {"train_loss": -10.680763244628906, "global_step": 132452, "epoch": 788} {"train_loss": -10.275306701660156, "global_step": 132453, "epoch": 788} {"train_loss": -10.412080764770508, "global_step": 132454, "epoch": 788} {"train_loss": -10.42020034790039, "global_step": 132455, "epoch": 788} {"train_loss": -10.623540878295898, "global_step": 132456, "epoch": 788} {"train_loss": -10.512877464294434, "global_step": 132457, "epoch": 788} {"train_loss": -10.247005462646484, "global_step": 132458, "epoch": 788} {"train_loss": -10.55681037902832, "global_step": 132459, "epoch": 788} {"train_loss": -10.554595947265625, "global_step": 132460, "epoch": 788} {"train_loss": -10.226625442504883, "global_step": 132461, "epoch": 788} {"train_loss": -10.586164474487305, "global_step": 132462, "epoch": 788} {"train_loss": -10.40697956085205, "global_step": 132463, "epoch": 788} {"train_loss": -10.140691757202148, "global_step": 132464, "epoch": 788} {"train_loss": -10.134286880493164, "global_step": 132465, "epoch": 788} {"train_loss": -10.052448272705078, "global_step": 132466, "epoch": 788} {"train_loss": -10.257923126220703, "global_step": 132467, "epoch": 788} {"train_loss": -10.221307754516602, "global_step": 132468, "epoch": 788} {"train_loss": -10.281609535217285, "global_step": 132469, "epoch": 788} {"train_loss": -10.025155067443848, "global_step": 132470, "epoch": 788} {"train_loss": -10.194881439208984, "global_step": 132471, "epoch": 788} {"train_loss": -9.99826431274414, "global_step": 132472, "epoch": 788} {"train_loss": -10.614689826965332, "global_step": 132473, "epoch": 788} {"train_loss": -10.21374225616455, "global_step": 132474, "epoch": 788} {"train_loss": -10.37621021270752, "global_step": 132475, "epoch": 788} {"train_loss": -10.385761260986328, "global_step": 132476, "epoch": 788} {"train_loss": -9.953373908996582, "global_step": 132477, "epoch": 788} {"train_loss": -10.374550819396973, "global_step": 132478, "epoch": 788} {"train_loss": -9.992416381835938, "global_step": 132479, "epoch": 788} {"train_loss": -9.853710174560547, "global_step": 132480, "epoch": 788} {"train_loss": -10.394203186035156, "global_step": 132481, "epoch": 788} {"train_loss": -10.123754501342773, "global_step": 132482, "epoch": 788} {"train_loss": -10.068047523498535, "global_step": 132483, "epoch": 788} {"train_loss": -10.355255126953125, "global_step": 132484, "epoch": 788} {"train_loss": -9.710405349731445, "global_step": 132485, "epoch": 788} {"train_loss": -10.660520553588867, "global_step": 132486, "epoch": 788} {"train_loss": -9.929861068725586, "global_step": 132487, "epoch": 788} {"train_loss": -10.413623809814453, "global_step": 132488, "epoch": 788} {"train_loss": -10.215316772460938, "global_step": 132489, "epoch": 788} {"train_loss": -10.16396713256836, "global_step": 132490, "epoch": 788} {"train_loss": -10.290914535522461, "global_step": 132491, "epoch": 788} {"train_loss": -10.322333335876465, "global_step": 132492, "epoch": 788} {"train_loss": -10.359297752380371, "global_step": 132493, "epoch": 788} {"train_loss": -10.063343048095703, "global_step": 132494, "epoch": 788} {"train_loss": -10.330971717834473, "global_step": 132495, "epoch": 788} {"train_loss": -10.36351203918457, "global_step": 132496, "epoch": 788} {"train_loss": -10.307615280151367, "global_step": 132497, "epoch": 788} {"train_loss": -10.38064193725586, "global_step": 132498, "epoch": 788} {"train_loss": -10.235006332397461, "global_step": 132499, "epoch": 788} {"train_loss": -10.382970809936523, "global_step": 132500, "epoch": 788} {"train_loss": -10.387449264526367, "global_step": 132501, "epoch": 788} {"train_loss": -10.137720108032227, "global_step": 132502, "epoch": 788} {"train_loss": -10.238351821899414, "global_step": 132503, "epoch": 788} {"train_loss": -10.456598281860352, "global_step": 132504, "epoch": 788} {"train_loss": -10.503374099731445, "global_step": 132505, "epoch": 788} {"train_loss": -10.53056526184082, "global_step": 132506, "epoch": 788} {"train_loss": -10.637140274047852, "global_step": 132507, "epoch": 788} {"train_loss": -10.479413986206055, "global_step": 132508, "epoch": 788} {"train_loss": -10.488624572753906, "global_step": 132509, "epoch": 788} {"train_loss": -10.480378150939941, "global_step": 132510, "epoch": 788} {"train_loss": -10.523614883422852, "global_step": 132511, "epoch": 788} {"train_loss": -10.39938735961914, "global_step": 132512, "epoch": 788} {"train_loss": -10.332035064697266, "global_step": 132513, "epoch": 788} {"train_loss": -10.4269437789917, "global_step": 132514, "epoch": 788} {"train_loss": -10.469985961914062, "global_step": 132515, "epoch": 788} {"train_loss": -10.388203620910645, "global_step": 132516, "epoch": 788} {"train_loss": -10.254302978515625, "global_step": 132517, "epoch": 788} {"train_loss": -10.306879043579102, "global_step": 132518, "epoch": 788} {"train_loss": -10.65160846710205, "global_step": 132519, "epoch": 788} {"train_loss": -10.155086517333984, "global_step": 132520, "epoch": 788} {"train_loss": -10.336990356445312, "global_step": 132521, "epoch": 788} {"train_loss": -10.283775329589844, "global_step": 132522, "epoch": 788} {"train_loss": -10.31281852722168, "global_step": 132523, "epoch": 788} {"train_loss": -10.561857223510742, "global_step": 132524, "epoch": 788} {"train_loss": -10.531990051269531, "global_step": 132525, "epoch": 788} {"train_loss": -10.046758651733398, "global_step": 132526, "epoch": 788} {"train_loss": -10.71009635925293, "global_step": 132527, "epoch": 788} {"train_loss": -10.381593704223633, "global_step": 132528, "epoch": 788} {"train_loss": -10.455337524414062, "global_step": 132529, "epoch": 788} {"train_loss": -10.609859466552734, "global_step": 132530, "epoch": 788} {"train_loss": -10.134298324584961, "global_step": 132531, "epoch": 788} {"train_loss": -10.32392692565918, "global_step": 132532, "epoch": 788} {"train_loss": -10.208466529846191, "global_step": 132533, "epoch": 788} {"train_loss": -10.487382888793945, "global_step": 132534, "epoch": 788} {"train_loss": -10.330955505371094, "global_step": 132535, "epoch": 788} {"train_loss": -10.257680892944336, "global_step": 132536, "epoch": 788} {"train_loss": -10.385578155517578, "global_step": 132537, "epoch": 788} {"train_loss": -10.133600234985352, "global_step": 132538, "epoch": 788} {"train_loss": -10.172826766967773, "global_step": 132539, "epoch": 788} {"train_loss": -10.332220077514648, "global_step": 132540, "epoch": 788} {"train_loss": -10.346264839172363, "global_step": 132541, "epoch": 788} {"train_loss": -10.409191131591797, "global_step": 132542, "epoch": 788} {"train_loss": -10.657772064208984, "global_step": 132543, "epoch": 788} {"train_loss": -10.468141555786133, "global_step": 132544, "epoch": 788} {"train_loss": -10.338357925415039, "global_step": 132545, "epoch": 788} {"train_loss": -10.491296768188477, "global_step": 132546, "epoch": 788} {"train_loss": -10.412330627441406, "global_step": 132547, "epoch": 788} {"train_loss": -10.111873626708984, "global_step": 132548, "epoch": 788} {"train_loss": -10.662368774414062, "global_step": 132549, "epoch": 788} {"train_loss": -10.223265647888184, "global_step": 132550, "epoch": 788} {"train_loss": -10.324073371433077, "global_step": 132551, "epoch": 788, "val_loss": 221751.484375} {"train_loss": -9.69699478149414, "global_step": 132552, "epoch": 789} {"train_loss": -10.340907096862793, "global_step": 132553, "epoch": 789} {"train_loss": -9.485973358154297, "global_step": 132554, "epoch": 789} {"train_loss": -10.22221851348877, "global_step": 132555, "epoch": 789} {"train_loss": -9.821784973144531, "global_step": 132556, "epoch": 789} {"train_loss": -10.320829391479492, "global_step": 132557, "epoch": 789} {"train_loss": -10.096202850341797, "global_step": 132558, "epoch": 789} {"train_loss": -10.088205337524414, "global_step": 132559, "epoch": 789} {"train_loss": -9.961660385131836, "global_step": 132560, "epoch": 789} {"train_loss": -10.463388442993164, "global_step": 132561, "epoch": 789} {"train_loss": -10.430227279663086, "global_step": 132562, "epoch": 789} {"train_loss": -10.31302547454834, "global_step": 132563, "epoch": 789} {"train_loss": -10.242358207702637, "global_step": 132564, "epoch": 789} {"train_loss": -10.5189847946167, "global_step": 132565, "epoch": 789} {"train_loss": -10.429645538330078, "global_step": 132566, "epoch": 789} {"train_loss": -10.639491081237793, "global_step": 132567, "epoch": 789} {"train_loss": -10.306394577026367, "global_step": 132568, "epoch": 789} {"train_loss": -10.486316680908203, "global_step": 132569, "epoch": 789} {"train_loss": -10.190238952636719, "global_step": 132570, "epoch": 789} {"train_loss": -10.389360427856445, "global_step": 132571, "epoch": 789} {"train_loss": -10.444128036499023, "global_step": 132572, "epoch": 789} {"train_loss": -10.523055076599121, "global_step": 132573, "epoch": 789} {"train_loss": -10.525001525878906, "global_step": 132574, "epoch": 789} {"train_loss": -10.690553665161133, "global_step": 132575, "epoch": 789} {"train_loss": -10.552396774291992, "global_step": 132576, "epoch": 789} {"train_loss": -10.617733001708984, "global_step": 132577, "epoch": 789} {"train_loss": -10.486095428466797, "global_step": 132578, "epoch": 789} {"train_loss": -10.502653121948242, "global_step": 132579, "epoch": 789} {"train_loss": -10.394233703613281, "global_step": 132580, "epoch": 789} {"train_loss": -10.475461959838867, "global_step": 132581, "epoch": 789} {"train_loss": -10.639385223388672, "global_step": 132582, "epoch": 789} {"train_loss": -10.539129257202148, "global_step": 132583, "epoch": 789} {"train_loss": -10.562175750732422, "global_step": 132584, "epoch": 789} {"train_loss": -10.643310546875, "global_step": 132585, "epoch": 789} {"train_loss": -10.588786125183105, "global_step": 132586, "epoch": 789} {"train_loss": -10.193626403808594, "global_step": 132587, "epoch": 789} {"train_loss": -10.455453872680664, "global_step": 132588, "epoch": 789} {"train_loss": -10.504413604736328, "global_step": 132589, "epoch": 789} {"train_loss": -10.602216720581055, "global_step": 132590, "epoch": 789} {"train_loss": -10.476263046264648, "global_step": 132591, "epoch": 789} {"train_loss": -10.50449275970459, "global_step": 132592, "epoch": 789} {"train_loss": -10.085979461669922, "global_step": 132593, "epoch": 789} {"train_loss": -10.258783340454102, "global_step": 132594, "epoch": 789} {"train_loss": -10.052169799804688, "global_step": 132595, "epoch": 789} {"train_loss": -10.022395133972168, "global_step": 132596, "epoch": 789} {"train_loss": -10.227694511413574, "global_step": 132597, "epoch": 789} {"train_loss": -9.410623550415039, "global_step": 132598, "epoch": 789} {"train_loss": -9.966946601867676, "global_step": 132599, "epoch": 789} {"train_loss": -9.901576042175293, "global_step": 132600, "epoch": 789} {"train_loss": -9.187161445617676, "global_step": 132601, "epoch": 789} {"train_loss": -9.628440856933594, "global_step": 132602, "epoch": 789} {"train_loss": -9.281526565551758, "global_step": 132603, "epoch": 789} {"train_loss": -10.063132286071777, "global_step": 132604, "epoch": 789} {"train_loss": -9.225570678710938, "global_step": 132605, "epoch": 789} {"train_loss": -10.296740531921387, "global_step": 132606, "epoch": 789} {"train_loss": -9.205673217773438, "global_step": 132607, "epoch": 789} {"train_loss": -10.163201332092285, "global_step": 132608, "epoch": 789} {"train_loss": -9.71245288848877, "global_step": 132609, "epoch": 789} {"train_loss": -9.891836166381836, "global_step": 132610, "epoch": 789} {"train_loss": -10.23340892791748, "global_step": 132611, "epoch": 789} {"train_loss": -10.11754322052002, "global_step": 132612, "epoch": 789} {"train_loss": -9.560657501220703, "global_step": 132613, "epoch": 789} {"train_loss": -10.196916580200195, "global_step": 132614, "epoch": 789} {"train_loss": -9.774744987487793, "global_step": 132615, "epoch": 789} {"train_loss": -10.003564834594727, "global_step": 132616, "epoch": 789} {"train_loss": -9.609073638916016, "global_step": 132617, "epoch": 789} {"train_loss": -10.146673202514648, "global_step": 132618, "epoch": 789} {"train_loss": -10.20242691040039, "global_step": 132619, "epoch": 789} {"train_loss": -10.101198196411133, "global_step": 132620, "epoch": 789} {"train_loss": -10.219795227050781, "global_step": 132621, "epoch": 789} {"train_loss": -10.320569038391113, "global_step": 132622, "epoch": 789} {"train_loss": -10.560277938842773, "global_step": 132623, "epoch": 789} {"train_loss": -10.242118835449219, "global_step": 132624, "epoch": 789} {"train_loss": -10.239372253417969, "global_step": 132625, "epoch": 789} {"train_loss": -10.473926544189453, "global_step": 132626, "epoch": 789} {"train_loss": -10.479391098022461, "global_step": 132627, "epoch": 789} {"train_loss": -10.348217010498047, "global_step": 132628, "epoch": 789} {"train_loss": -10.292556762695312, "global_step": 132629, "epoch": 789} {"train_loss": -10.457935333251953, "global_step": 132630, "epoch": 789} {"train_loss": -10.421466827392578, "global_step": 132631, "epoch": 789} {"train_loss": -10.276823043823242, "global_step": 132632, "epoch": 789} {"train_loss": -10.487262725830078, "global_step": 132633, "epoch": 789} {"train_loss": -10.482525825500488, "global_step": 132634, "epoch": 789} {"train_loss": -10.376920700073242, "global_step": 132635, "epoch": 789} {"train_loss": -10.451228141784668, "global_step": 132636, "epoch": 789} {"train_loss": -10.254810333251953, "global_step": 132637, "epoch": 789} {"train_loss": -10.416065216064453, "global_step": 132638, "epoch": 789} {"train_loss": -10.500408172607422, "global_step": 132639, "epoch": 789} {"train_loss": -10.50374698638916, "global_step": 132640, "epoch": 789} {"train_loss": -10.401168823242188, "global_step": 132641, "epoch": 789} {"train_loss": -10.396394729614258, "global_step": 132642, "epoch": 789} {"train_loss": -10.512153625488281, "global_step": 132643, "epoch": 789} {"train_loss": -10.45644760131836, "global_step": 132644, "epoch": 789} {"train_loss": -10.404693603515625, "global_step": 132645, "epoch": 789} {"train_loss": -10.535533905029297, "global_step": 132646, "epoch": 789} {"train_loss": -10.45462703704834, "global_step": 132647, "epoch": 789} {"train_loss": -10.497556686401367, "global_step": 132648, "epoch": 789} {"train_loss": -10.696948051452637, "global_step": 132649, "epoch": 789} {"train_loss": -10.614032745361328, "global_step": 132650, "epoch": 789} {"train_loss": -10.614725112915039, "global_step": 132651, "epoch": 789} {"train_loss": -10.594552993774414, "global_step": 132652, "epoch": 789} {"train_loss": -10.388162612915039, "global_step": 132653, "epoch": 789} {"train_loss": -10.256938934326172, "global_step": 132654, "epoch": 789} {"train_loss": -10.600814819335938, "global_step": 132655, "epoch": 789} {"train_loss": -10.234542846679688, "global_step": 132656, "epoch": 789} {"train_loss": -10.437321662902832, "global_step": 132657, "epoch": 789} {"train_loss": -10.365436553955078, "global_step": 132658, "epoch": 789} {"train_loss": -9.998470306396484, "global_step": 132659, "epoch": 789} {"train_loss": -10.403558731079102, "global_step": 132660, "epoch": 789} {"train_loss": -10.398677825927734, "global_step": 132661, "epoch": 789} {"train_loss": -10.10492992401123, "global_step": 132662, "epoch": 789} {"train_loss": -10.51276969909668, "global_step": 132663, "epoch": 789} {"train_loss": -10.145132064819336, "global_step": 132664, "epoch": 789} {"train_loss": -10.308585166931152, "global_step": 132665, "epoch": 789} {"train_loss": -9.859518051147461, "global_step": 132666, "epoch": 789} {"train_loss": -9.698114395141602, "global_step": 132667, "epoch": 789} {"train_loss": -10.336527824401855, "global_step": 132668, "epoch": 789} {"train_loss": -9.93054485321045, "global_step": 132669, "epoch": 789} {"train_loss": -10.3407564163208, "global_step": 132670, "epoch": 789} {"train_loss": -10.36019515991211, "global_step": 132671, "epoch": 789} {"train_loss": -9.884634971618652, "global_step": 132672, "epoch": 789} {"train_loss": -10.325571060180664, "global_step": 132673, "epoch": 789} {"train_loss": -10.181282043457031, "global_step": 132674, "epoch": 789} {"train_loss": -10.576194763183594, "global_step": 132675, "epoch": 789} {"train_loss": -10.554156303405762, "global_step": 132676, "epoch": 789} {"train_loss": -10.441913604736328, "global_step": 132677, "epoch": 789} {"train_loss": -10.628314971923828, "global_step": 132678, "epoch": 789} {"train_loss": -10.434584617614746, "global_step": 132679, "epoch": 789} {"train_loss": -10.650238037109375, "global_step": 132680, "epoch": 789} {"train_loss": -10.33360481262207, "global_step": 132681, "epoch": 789} {"train_loss": -10.530767440795898, "global_step": 132682, "epoch": 789} {"train_loss": -10.476101875305176, "global_step": 132683, "epoch": 789} {"train_loss": -10.66801643371582, "global_step": 132684, "epoch": 789} {"train_loss": -10.631710052490234, "global_step": 132685, "epoch": 789} {"train_loss": -10.63271713256836, "global_step": 132686, "epoch": 789} {"train_loss": -10.661581993103027, "global_step": 132687, "epoch": 789} {"train_loss": -10.496225357055664, "global_step": 132688, "epoch": 789} {"train_loss": -10.686166763305664, "global_step": 132689, "epoch": 789} {"train_loss": -10.416735649108887, "global_step": 132690, "epoch": 789} {"train_loss": -10.408469200134277, "global_step": 132691, "epoch": 789} {"train_loss": -10.411552429199219, "global_step": 132692, "epoch": 789} {"train_loss": -10.681329727172852, "global_step": 132693, "epoch": 789} {"train_loss": -10.49698257446289, "global_step": 132694, "epoch": 789} {"train_loss": -10.694242477416992, "global_step": 132695, "epoch": 789} {"train_loss": -10.728750228881836, "global_step": 132696, "epoch": 789} {"train_loss": -10.864494323730469, "global_step": 132697, "epoch": 789} {"train_loss": -10.752180099487305, "global_step": 132698, "epoch": 789} {"train_loss": -10.754368782043457, "global_step": 132699, "epoch": 789} {"train_loss": -10.45187759399414, "global_step": 132700, "epoch": 789} {"train_loss": -10.751035690307617, "global_step": 132701, "epoch": 789} {"train_loss": -10.657785415649414, "global_step": 132702, "epoch": 789} {"train_loss": -10.700371742248535, "global_step": 132703, "epoch": 789} {"train_loss": -10.546335220336914, "global_step": 132704, "epoch": 789} {"train_loss": -10.985574722290039, "global_step": 132705, "epoch": 789} {"train_loss": -10.644775390625, "global_step": 132706, "epoch": 789} {"train_loss": -10.70654296875, "global_step": 132707, "epoch": 789} {"train_loss": -10.622173309326172, "global_step": 132708, "epoch": 789} {"train_loss": -10.719030380249023, "global_step": 132709, "epoch": 789} {"train_loss": -10.52435302734375, "global_step": 132710, "epoch": 789} {"train_loss": -10.374382019042969, "global_step": 132711, "epoch": 789} {"train_loss": -10.52370548248291, "global_step": 132712, "epoch": 789} {"train_loss": -10.50285530090332, "global_step": 132713, "epoch": 789} {"train_loss": -10.300819396972656, "global_step": 132714, "epoch": 789} {"train_loss": -10.608640670776367, "global_step": 132715, "epoch": 789} {"train_loss": -10.849008560180664, "global_step": 132716, "epoch": 789} {"train_loss": -10.427251815795898, "global_step": 132717, "epoch": 789} {"train_loss": -10.664685249328613, "global_step": 132718, "epoch": 789} {"train_loss": -10.343007910819281, "global_step": 132719, "epoch": 789, "val_loss": 220388.5625} {"train_loss": -10.499675750732422, "global_step": 132720, "epoch": 790} {"train_loss": -10.423194885253906, "global_step": 132721, "epoch": 790} {"train_loss": -10.401789665222168, "global_step": 132722, "epoch": 790} {"train_loss": -10.396822929382324, "global_step": 132723, "epoch": 790} {"train_loss": -10.37806510925293, "global_step": 132724, "epoch": 790} {"train_loss": -10.589668273925781, "global_step": 132725, "epoch": 790} {"train_loss": -10.002967834472656, "global_step": 132726, "epoch": 790} {"train_loss": -9.835687637329102, "global_step": 132727, "epoch": 790} {"train_loss": -9.330705642700195, "global_step": 132728, "epoch": 790} {"train_loss": -9.277626037597656, "global_step": 132729, "epoch": 790} {"train_loss": -9.063379287719727, "global_step": 132730, "epoch": 790} {"train_loss": -8.823461532592773, "global_step": 132731, "epoch": 790} {"train_loss": -9.3785400390625, "global_step": 132732, "epoch": 790} {"train_loss": -10.069839477539062, "global_step": 132733, "epoch": 790} {"train_loss": -9.460498809814453, "global_step": 132734, "epoch": 790} {"train_loss": -9.440303802490234, "global_step": 132735, "epoch": 790} {"train_loss": -9.242202758789062, "global_step": 132736, "epoch": 790} {"train_loss": -9.471012115478516, "global_step": 132737, "epoch": 790} {"train_loss": -9.906900405883789, "global_step": 132738, "epoch": 790} {"train_loss": -9.755575180053711, "global_step": 132739, "epoch": 790} {"train_loss": -9.90884017944336, "global_step": 132740, "epoch": 790} {"train_loss": -9.868413925170898, "global_step": 132741, "epoch": 790} {"train_loss": -9.118276596069336, "global_step": 132742, "epoch": 790} {"train_loss": -9.968361854553223, "global_step": 132743, "epoch": 790} {"train_loss": -9.818105697631836, "global_step": 132744, "epoch": 790} {"train_loss": -9.766326904296875, "global_step": 132745, "epoch": 790} {"train_loss": -9.983377456665039, "global_step": 132746, "epoch": 790} {"train_loss": -9.595930099487305, "global_step": 132747, "epoch": 790} {"train_loss": -10.054616928100586, "global_step": 132748, "epoch": 790} {"train_loss": -9.814094543457031, "global_step": 132749, "epoch": 790} {"train_loss": -9.911532402038574, "global_step": 132750, "epoch": 790} {"train_loss": -10.21143627166748, "global_step": 132751, "epoch": 790} {"train_loss": -9.900026321411133, "global_step": 132752, "epoch": 790} {"train_loss": -10.312057495117188, "global_step": 132753, "epoch": 790} {"train_loss": -10.319934844970703, "global_step": 132754, "epoch": 790} {"train_loss": -10.070954322814941, "global_step": 132755, "epoch": 790} {"train_loss": -10.031824111938477, "global_step": 132756, "epoch": 790} {"train_loss": -10.17149543762207, "global_step": 132757, "epoch": 790} {"train_loss": -10.196613311767578, "global_step": 132758, "epoch": 790} {"train_loss": -10.296518325805664, "global_step": 132759, "epoch": 790} {"train_loss": -10.20511245727539, "global_step": 132760, "epoch": 790} {"train_loss": -10.407903671264648, "global_step": 132761, "epoch": 790} {"train_loss": -10.576053619384766, "global_step": 132762, "epoch": 790} {"train_loss": -10.321606636047363, "global_step": 132763, "epoch": 790} {"train_loss": -10.300664901733398, "global_step": 132764, "epoch": 790} {"train_loss": -10.294109344482422, "global_step": 132765, "epoch": 790} {"train_loss": -10.414255142211914, "global_step": 132766, "epoch": 790} {"train_loss": -10.365302085876465, "global_step": 132767, "epoch": 790} {"train_loss": -10.310245513916016, "global_step": 132768, "epoch": 790} {"train_loss": -10.490623474121094, "global_step": 132769, "epoch": 790} {"train_loss": -10.293956756591797, "global_step": 132770, "epoch": 790} {"train_loss": -10.339728355407715, "global_step": 132771, "epoch": 790} {"train_loss": -10.451859474182129, "global_step": 132772, "epoch": 790} {"train_loss": -10.564654350280762, "global_step": 132773, "epoch": 790} {"train_loss": -10.454729080200195, "global_step": 132774, "epoch": 790} {"train_loss": -10.572444915771484, "global_step": 132775, "epoch": 790} {"train_loss": -10.562646865844727, "global_step": 132776, "epoch": 790} {"train_loss": -10.387617111206055, "global_step": 132777, "epoch": 790} {"train_loss": -10.488911628723145, "global_step": 132778, "epoch": 790} {"train_loss": -10.612834930419922, "global_step": 132779, "epoch": 790} {"train_loss": -10.23924446105957, "global_step": 132780, "epoch": 790} {"train_loss": -10.584104537963867, "global_step": 132781, "epoch": 790} {"train_loss": -10.482542991638184, "global_step": 132782, "epoch": 790} {"train_loss": -10.668159484863281, "global_step": 132783, "epoch": 790} {"train_loss": -10.582695007324219, "global_step": 132784, "epoch": 790} {"train_loss": -10.575133323669434, "global_step": 132785, "epoch": 790} {"train_loss": -10.393311500549316, "global_step": 132786, "epoch": 790} {"train_loss": -10.47426700592041, "global_step": 132787, "epoch": 790} {"train_loss": -10.655746459960938, "global_step": 132788, "epoch": 790} {"train_loss": -10.716999053955078, "global_step": 132789, "epoch": 790} {"train_loss": -10.666061401367188, "global_step": 132790, "epoch": 790} {"train_loss": -10.564281463623047, "global_step": 132791, "epoch": 790} {"train_loss": -10.577381134033203, "global_step": 132792, "epoch": 790} {"train_loss": -10.62619400024414, "global_step": 132793, "epoch": 790} {"train_loss": -10.427210807800293, "global_step": 132794, "epoch": 790} {"train_loss": -10.74348258972168, "global_step": 132795, "epoch": 790} {"train_loss": -10.380834579467773, "global_step": 132796, "epoch": 790} {"train_loss": -10.28760814666748, "global_step": 132797, "epoch": 790} {"train_loss": -10.330848693847656, "global_step": 132798, "epoch": 790} {"train_loss": -10.383028030395508, "global_step": 132799, "epoch": 790} {"train_loss": -10.34697437286377, "global_step": 132800, "epoch": 790} {"train_loss": -9.859585762023926, "global_step": 132801, "epoch": 790} {"train_loss": -10.3163480758667, "global_step": 132802, "epoch": 790} {"train_loss": -10.474231719970703, "global_step": 132803, "epoch": 790} {"train_loss": -10.072242736816406, "global_step": 132804, "epoch": 790} {"train_loss": -10.552210807800293, "global_step": 132805, "epoch": 790} {"train_loss": -10.323110580444336, "global_step": 132806, "epoch": 790} {"train_loss": -10.124500274658203, "global_step": 132807, "epoch": 790} {"train_loss": -10.097738265991211, "global_step": 132808, "epoch": 790} {"train_loss": -10.447286605834961, "global_step": 132809, "epoch": 790} {"train_loss": -9.757413864135742, "global_step": 132810, "epoch": 790} {"train_loss": -10.481761932373047, "global_step": 132811, "epoch": 790} {"train_loss": -9.764543533325195, "global_step": 132812, "epoch": 790} {"train_loss": -10.45920181274414, "global_step": 132813, "epoch": 790} {"train_loss": -10.1582612991333, "global_step": 132814, "epoch": 790} {"train_loss": -10.402140617370605, "global_step": 132815, "epoch": 790} {"train_loss": -10.087137222290039, "global_step": 132816, "epoch": 790} {"train_loss": -10.51736831665039, "global_step": 132817, "epoch": 790} {"train_loss": -9.978586196899414, "global_step": 132818, "epoch": 790} {"train_loss": -10.259320259094238, "global_step": 132819, "epoch": 790} {"train_loss": -10.536599159240723, "global_step": 132820, "epoch": 790} {"train_loss": -10.369911193847656, "global_step": 132821, "epoch": 790} {"train_loss": -10.494482040405273, "global_step": 132822, "epoch": 790} {"train_loss": -10.119789123535156, "global_step": 132823, "epoch": 790} {"train_loss": -10.49631404876709, "global_step": 132824, "epoch": 790} {"train_loss": -9.61003303527832, "global_step": 132825, "epoch": 790} {"train_loss": -10.58413314819336, "global_step": 132826, "epoch": 790} {"train_loss": -9.86496353149414, "global_step": 132827, "epoch": 790} {"train_loss": -10.360466957092285, "global_step": 132828, "epoch": 790} {"train_loss": -10.204428672790527, "global_step": 132829, "epoch": 790} {"train_loss": -10.188661575317383, "global_step": 132830, "epoch": 790} {"train_loss": -10.147830963134766, "global_step": 132831, "epoch": 790} {"train_loss": -10.300424575805664, "global_step": 132832, "epoch": 790} {"train_loss": -9.809226989746094, "global_step": 132833, "epoch": 790} {"train_loss": -10.359487533569336, "global_step": 132834, "epoch": 790} {"train_loss": -10.172877311706543, "global_step": 132835, "epoch": 790} {"train_loss": -10.462377548217773, "global_step": 132836, "epoch": 790} {"train_loss": -10.295893669128418, "global_step": 132837, "epoch": 790} {"train_loss": -10.002527236938477, "global_step": 132838, "epoch": 790} {"train_loss": -10.498542785644531, "global_step": 132839, "epoch": 790} {"train_loss": -10.229693412780762, "global_step": 132840, "epoch": 790} {"train_loss": -10.445517539978027, "global_step": 132841, "epoch": 790} {"train_loss": -10.322391510009766, "global_step": 132842, "epoch": 790} {"train_loss": -10.341724395751953, "global_step": 132843, "epoch": 790} {"train_loss": -10.414419174194336, "global_step": 132844, "epoch": 790} {"train_loss": -10.437272071838379, "global_step": 132845, "epoch": 790} {"train_loss": -10.648359298706055, "global_step": 132846, "epoch": 790} {"train_loss": -10.480183601379395, "global_step": 132847, "epoch": 790} {"train_loss": -10.403414726257324, "global_step": 132848, "epoch": 790} {"train_loss": -10.6242036819458, "global_step": 132849, "epoch": 790} {"train_loss": -10.542264938354492, "global_step": 132850, "epoch": 790} {"train_loss": -10.656848907470703, "global_step": 132851, "epoch": 790} {"train_loss": -10.529670715332031, "global_step": 132852, "epoch": 790} {"train_loss": -10.736969947814941, "global_step": 132853, "epoch": 790} {"train_loss": -10.532081604003906, "global_step": 132854, "epoch": 790} {"train_loss": -10.393471717834473, "global_step": 132855, "epoch": 790} {"train_loss": -10.807882308959961, "global_step": 132856, "epoch": 790} {"train_loss": -10.572205543518066, "global_step": 132857, "epoch": 790} {"train_loss": -10.694272994995117, "global_step": 132858, "epoch": 790} {"train_loss": -10.365809440612793, "global_step": 132859, "epoch": 790} {"train_loss": -10.787347793579102, "global_step": 132860, "epoch": 790} {"train_loss": -10.397554397583008, "global_step": 132861, "epoch": 790} {"train_loss": -10.706033706665039, "global_step": 132862, "epoch": 790} {"train_loss": -10.453968048095703, "global_step": 132863, "epoch": 790} {"train_loss": -10.593534469604492, "global_step": 132864, "epoch": 790} {"train_loss": -10.599617004394531, "global_step": 132865, "epoch": 790} {"train_loss": -10.547738075256348, "global_step": 132866, "epoch": 790} {"train_loss": -10.475147247314453, "global_step": 132867, "epoch": 790} {"train_loss": -9.27039909362793, "global_step": 132868, "epoch": 790} {"train_loss": -10.498858451843262, "global_step": 132869, "epoch": 790} {"train_loss": -10.147379875183105, "global_step": 132870, "epoch": 790} {"train_loss": -10.539337158203125, "global_step": 132871, "epoch": 790} {"train_loss": -10.329833030700684, "global_step": 132872, "epoch": 790} {"train_loss": -10.002951622009277, "global_step": 132873, "epoch": 790} {"train_loss": -10.237173080444336, "global_step": 132874, "epoch": 790} {"train_loss": -10.435613632202148, "global_step": 132875, "epoch": 790} {"train_loss": -10.282997131347656, "global_step": 132876, "epoch": 790} {"train_loss": -10.56887149810791, "global_step": 132877, "epoch": 790} {"train_loss": -10.231327056884766, "global_step": 132878, "epoch": 790} {"train_loss": -10.556105613708496, "global_step": 132879, "epoch": 790} {"train_loss": -10.170726776123047, "global_step": 132880, "epoch": 790} {"train_loss": -10.516277313232422, "global_step": 132881, "epoch": 790} {"train_loss": -10.251382827758789, "global_step": 132882, "epoch": 790} {"train_loss": -10.325821876525879, "global_step": 132883, "epoch": 790} {"train_loss": -10.619977951049805, "global_step": 132884, "epoch": 790} {"train_loss": -10.467093467712402, "global_step": 132885, "epoch": 790} {"train_loss": -10.224475860595703, "global_step": 132886, "epoch": 790} {"train_loss": -10.262616412980217, "global_step": 132887, "epoch": 790, "val_loss": 217651.1875, "train_action_mse_error": 2.9220566749572754} {"train_loss": -10.2275390625, "global_step": 132888, "epoch": 791} {"train_loss": -10.558527946472168, "global_step": 132889, "epoch": 791} {"train_loss": -10.03908920288086, "global_step": 132890, "epoch": 791} {"train_loss": -10.040138244628906, "global_step": 132891, "epoch": 791} {"train_loss": -10.34653377532959, "global_step": 132892, "epoch": 791} {"train_loss": -9.794050216674805, "global_step": 132893, "epoch": 791} {"train_loss": -10.480335235595703, "global_step": 132894, "epoch": 791} {"train_loss": -10.158699989318848, "global_step": 132895, "epoch": 791} {"train_loss": -10.090995788574219, "global_step": 132896, "epoch": 791} {"train_loss": -10.533872604370117, "global_step": 132897, "epoch": 791} {"train_loss": -9.709952354431152, "global_step": 132898, "epoch": 791} {"train_loss": -10.383054733276367, "global_step": 132899, "epoch": 791} {"train_loss": -9.93974494934082, "global_step": 132900, "epoch": 791} {"train_loss": -10.06124210357666, "global_step": 132901, "epoch": 791} {"train_loss": -10.385017395019531, "global_step": 132902, "epoch": 791} {"train_loss": -9.963004112243652, "global_step": 132903, "epoch": 791} {"train_loss": -10.057635307312012, "global_step": 132904, "epoch": 791} {"train_loss": -10.304117202758789, "global_step": 132905, "epoch": 791} {"train_loss": -10.260101318359375, "global_step": 132906, "epoch": 791} {"train_loss": -10.4769868850708, "global_step": 132907, "epoch": 791} {"train_loss": -10.315624237060547, "global_step": 132908, "epoch": 791} {"train_loss": -10.478401184082031, "global_step": 132909, "epoch": 791} {"train_loss": -10.677007675170898, "global_step": 132910, "epoch": 791} {"train_loss": -10.34899616241455, "global_step": 132911, "epoch": 791} {"train_loss": -10.271906852722168, "global_step": 132912, "epoch": 791} {"train_loss": -10.123712539672852, "global_step": 132913, "epoch": 791} {"train_loss": -9.94419002532959, "global_step": 132914, "epoch": 791} {"train_loss": -10.546757698059082, "global_step": 132915, "epoch": 791} {"train_loss": -10.103012084960938, "global_step": 132916, "epoch": 791} {"train_loss": -10.540081977844238, "global_step": 132917, "epoch": 791} {"train_loss": -10.382883071899414, "global_step": 132918, "epoch": 791} {"train_loss": -10.292337417602539, "global_step": 132919, "epoch": 791} {"train_loss": -10.46250057220459, "global_step": 132920, "epoch": 791} {"train_loss": -10.538284301757812, "global_step": 132921, "epoch": 791} {"train_loss": -10.489147186279297, "global_step": 132922, "epoch": 791} {"train_loss": -10.34820556640625, "global_step": 132923, "epoch": 791} {"train_loss": -10.490314483642578, "global_step": 132924, "epoch": 791} {"train_loss": -10.57678508758545, "global_step": 132925, "epoch": 791} {"train_loss": -10.55105209350586, "global_step": 132926, "epoch": 791} {"train_loss": -10.604920387268066, "global_step": 132927, "epoch": 791} {"train_loss": -10.503325462341309, "global_step": 132928, "epoch": 791} {"train_loss": -10.491050720214844, "global_step": 132929, "epoch": 791} {"train_loss": -10.426061630249023, "global_step": 132930, "epoch": 791} {"train_loss": -10.653346061706543, "global_step": 132931, "epoch": 791} {"train_loss": -10.481962203979492, "global_step": 132932, "epoch": 791} {"train_loss": -10.436234474182129, "global_step": 132933, "epoch": 791} {"train_loss": -10.630571365356445, "global_step": 132934, "epoch": 791} {"train_loss": -10.621973037719727, "global_step": 132935, "epoch": 791} {"train_loss": -10.51970100402832, "global_step": 132936, "epoch": 791} {"train_loss": -10.688192367553711, "global_step": 132937, "epoch": 791} {"train_loss": -10.238869667053223, "global_step": 132938, "epoch": 791} {"train_loss": -10.692091941833496, "global_step": 132939, "epoch": 791} {"train_loss": -10.207780838012695, "global_step": 132940, "epoch": 791} {"train_loss": -10.901799201965332, "global_step": 132941, "epoch": 791} {"train_loss": -10.091154098510742, "global_step": 132942, "epoch": 791} {"train_loss": -10.78078556060791, "global_step": 132943, "epoch": 791} {"train_loss": -10.357709884643555, "global_step": 132944, "epoch": 791} {"train_loss": -10.573596954345703, "global_step": 132945, "epoch": 791} {"train_loss": -10.22488021850586, "global_step": 132946, "epoch": 791} {"train_loss": -10.496076583862305, "global_step": 132947, "epoch": 791} {"train_loss": -10.373268127441406, "global_step": 132948, "epoch": 791} {"train_loss": -10.685812950134277, "global_step": 132949, "epoch": 791} {"train_loss": -10.157064437866211, "global_step": 132950, "epoch": 791} {"train_loss": -10.59650993347168, "global_step": 132951, "epoch": 791} {"train_loss": -10.897433280944824, "global_step": 132952, "epoch": 791} {"train_loss": -10.488104820251465, "global_step": 132953, "epoch": 791} {"train_loss": -10.679290771484375, "global_step": 132954, "epoch": 791} {"train_loss": -10.806726455688477, "global_step": 132955, "epoch": 791} {"train_loss": -10.119397163391113, "global_step": 132956, "epoch": 791} {"train_loss": -9.994855880737305, "global_step": 132957, "epoch": 791} {"train_loss": -10.58254623413086, "global_step": 132958, "epoch": 791} {"train_loss": -9.94968318939209, "global_step": 132959, "epoch": 791} {"train_loss": -10.290979385375977, "global_step": 132960, "epoch": 791} {"train_loss": -10.03225040435791, "global_step": 132961, "epoch": 791} {"train_loss": -9.890630722045898, "global_step": 132962, "epoch": 791} {"train_loss": -10.15013313293457, "global_step": 132963, "epoch": 791} {"train_loss": -10.236875534057617, "global_step": 132964, "epoch": 791} {"train_loss": -10.725658416748047, "global_step": 132965, "epoch": 791} {"train_loss": -10.22320556640625, "global_step": 132966, "epoch": 791} {"train_loss": -10.449535369873047, "global_step": 132967, "epoch": 791} {"train_loss": -10.156742095947266, "global_step": 132968, "epoch": 791} {"train_loss": -10.10086441040039, "global_step": 132969, "epoch": 791} {"train_loss": -10.27676773071289, "global_step": 132970, "epoch": 791} {"train_loss": -9.933931350708008, "global_step": 132971, "epoch": 791} {"train_loss": -10.273004531860352, "global_step": 132972, "epoch": 791} {"train_loss": -9.99577522277832, "global_step": 132973, "epoch": 791} {"train_loss": -10.137694358825684, "global_step": 132974, "epoch": 791} {"train_loss": -9.926665306091309, "global_step": 132975, "epoch": 791} {"train_loss": -10.086118698120117, "global_step": 132976, "epoch": 791} {"train_loss": -10.084124565124512, "global_step": 132977, "epoch": 791} {"train_loss": -10.232525825500488, "global_step": 132978, "epoch": 791} {"train_loss": -10.3892822265625, "global_step": 132979, "epoch": 791} {"train_loss": -10.093764305114746, "global_step": 132980, "epoch": 791} {"train_loss": -10.043622970581055, "global_step": 132981, "epoch": 791} {"train_loss": -10.31102180480957, "global_step": 132982, "epoch": 791} {"train_loss": -10.300033569335938, "global_step": 132983, "epoch": 791} {"train_loss": -10.43095874786377, "global_step": 132984, "epoch": 791} {"train_loss": -10.253865242004395, "global_step": 132985, "epoch": 791} {"train_loss": -10.288846015930176, "global_step": 132986, "epoch": 791} {"train_loss": -10.096705436706543, "global_step": 132987, "epoch": 791} {"train_loss": -10.427827835083008, "global_step": 132988, "epoch": 791} {"train_loss": -10.074390411376953, "global_step": 132989, "epoch": 791} {"train_loss": -10.465327262878418, "global_step": 132990, "epoch": 791} {"train_loss": -10.07110595703125, "global_step": 132991, "epoch": 791} {"train_loss": -10.392704963684082, "global_step": 132992, "epoch": 791} {"train_loss": -10.373495101928711, "global_step": 132993, "epoch": 791} {"train_loss": -10.317148208618164, "global_step": 132994, "epoch": 791} {"train_loss": -10.565492630004883, "global_step": 132995, "epoch": 791} {"train_loss": -10.458929061889648, "global_step": 132996, "epoch": 791} {"train_loss": -10.475750923156738, "global_step": 132997, "epoch": 791} {"train_loss": -10.653621673583984, "global_step": 132998, "epoch": 791} {"train_loss": -10.60704231262207, "global_step": 132999, "epoch": 791} {"train_loss": -10.334532737731934, "global_step": 133000, "epoch": 791} {"train_loss": -10.665369987487793, "global_step": 133001, "epoch": 791} {"train_loss": -10.466325759887695, "global_step": 133002, "epoch": 791} {"train_loss": -10.546493530273438, "global_step": 133003, "epoch": 791} {"train_loss": -10.60986328125, "global_step": 133004, "epoch": 791} {"train_loss": -10.623939514160156, "global_step": 133005, "epoch": 791} {"train_loss": -10.586454391479492, "global_step": 133006, "epoch": 791} {"train_loss": -10.478062629699707, "global_step": 133007, "epoch": 791} {"train_loss": -10.856744766235352, "global_step": 133008, "epoch": 791} {"train_loss": -10.658256530761719, "global_step": 133009, "epoch": 791} {"train_loss": -10.509480476379395, "global_step": 133010, "epoch": 791} {"train_loss": -10.564790725708008, "global_step": 133011, "epoch": 791} {"train_loss": -10.605411529541016, "global_step": 133012, "epoch": 791} {"train_loss": -10.499868392944336, "global_step": 133013, "epoch": 791} {"train_loss": -10.674962997436523, "global_step": 133014, "epoch": 791} {"train_loss": -10.717047691345215, "global_step": 133015, "epoch": 791} {"train_loss": -10.232526779174805, "global_step": 133016, "epoch": 791} {"train_loss": -10.591730117797852, "global_step": 133017, "epoch": 791} {"train_loss": -10.814689636230469, "global_step": 133018, "epoch": 791} {"train_loss": -10.2310209274292, "global_step": 133019, "epoch": 791} {"train_loss": -10.42895793914795, "global_step": 133020, "epoch": 791} {"train_loss": -10.43404769897461, "global_step": 133021, "epoch": 791} {"train_loss": -10.425065994262695, "global_step": 133022, "epoch": 791} {"train_loss": -10.421724319458008, "global_step": 133023, "epoch": 791} {"train_loss": -10.493328094482422, "global_step": 133024, "epoch": 791} {"train_loss": -9.896476745605469, "global_step": 133025, "epoch": 791} {"train_loss": -10.513986587524414, "global_step": 133026, "epoch": 791} {"train_loss": -10.27843189239502, "global_step": 133027, "epoch": 791} {"train_loss": -10.303596496582031, "global_step": 133028, "epoch": 791} {"train_loss": -10.327627182006836, "global_step": 133029, "epoch": 791} {"train_loss": -10.681154251098633, "global_step": 133030, "epoch": 791} {"train_loss": -10.516284942626953, "global_step": 133031, "epoch": 791} {"train_loss": -10.335683822631836, "global_step": 133032, "epoch": 791} {"train_loss": -10.573783874511719, "global_step": 133033, "epoch": 791} {"train_loss": -10.435468673706055, "global_step": 133034, "epoch": 791} {"train_loss": -10.132059097290039, "global_step": 133035, "epoch": 791} {"train_loss": -10.667937278747559, "global_step": 133036, "epoch": 791} {"train_loss": -10.09353256225586, "global_step": 133037, "epoch": 791} {"train_loss": -10.46606731414795, "global_step": 133038, "epoch": 791} {"train_loss": -10.391168594360352, "global_step": 133039, "epoch": 791} {"train_loss": -10.475322723388672, "global_step": 133040, "epoch": 791} {"train_loss": -10.243017196655273, "global_step": 133041, "epoch": 791} {"train_loss": -10.536808967590332, "global_step": 133042, "epoch": 791} {"train_loss": -10.173297882080078, "global_step": 133043, "epoch": 791} {"train_loss": -10.478165626525879, "global_step": 133044, "epoch": 791} {"train_loss": -10.463109016418457, "global_step": 133045, "epoch": 791} {"train_loss": -9.54207706451416, "global_step": 133046, "epoch": 791} {"train_loss": -10.29448127746582, "global_step": 133047, "epoch": 791} {"train_loss": -9.842086791992188, "global_step": 133048, "epoch": 791} {"train_loss": -10.257965087890625, "global_step": 133049, "epoch": 791} {"train_loss": -9.919848442077637, "global_step": 133050, "epoch": 791} {"train_loss": -10.230010032653809, "global_step": 133051, "epoch": 791} {"train_loss": -9.812204360961914, "global_step": 133052, "epoch": 791} {"train_loss": -10.132574081420898, "global_step": 133053, "epoch": 791} {"train_loss": -10.291017532348633, "global_step": 133054, "epoch": 791} {"train_loss": -10.353987654050192, "global_step": 133055, "epoch": 791, "val_loss": 221640.625} {"train_loss": -10.19119930267334, "global_step": 133056, "epoch": 792} {"train_loss": -10.147760391235352, "global_step": 133057, "epoch": 792} {"train_loss": -10.588312149047852, "global_step": 133058, "epoch": 792} {"train_loss": -10.492677688598633, "global_step": 133059, "epoch": 792} {"train_loss": -10.530716896057129, "global_step": 133060, "epoch": 792} {"train_loss": -10.231232643127441, "global_step": 133061, "epoch": 792} {"train_loss": -10.59189224243164, "global_step": 133062, "epoch": 792} {"train_loss": -10.536600112915039, "global_step": 133063, "epoch": 792} {"train_loss": -10.529458999633789, "global_step": 133064, "epoch": 792} {"train_loss": -10.375499725341797, "global_step": 133065, "epoch": 792} {"train_loss": -10.57827377319336, "global_step": 133066, "epoch": 792} {"train_loss": -10.15868091583252, "global_step": 133067, "epoch": 792} {"train_loss": -10.192206382751465, "global_step": 133068, "epoch": 792} {"train_loss": -10.441417694091797, "global_step": 133069, "epoch": 792} {"train_loss": -10.410709381103516, "global_step": 133070, "epoch": 792} {"train_loss": -10.439610481262207, "global_step": 133071, "epoch": 792} {"train_loss": -10.681781768798828, "global_step": 133072, "epoch": 792} {"train_loss": -10.61895751953125, "global_step": 133073, "epoch": 792} {"train_loss": -10.631997108459473, "global_step": 133074, "epoch": 792} {"train_loss": -10.610430717468262, "global_step": 133075, "epoch": 792} {"train_loss": -10.427929878234863, "global_step": 133076, "epoch": 792} {"train_loss": -10.566988945007324, "global_step": 133077, "epoch": 792} {"train_loss": -10.600842475891113, "global_step": 133078, "epoch": 792} {"train_loss": -10.697502136230469, "global_step": 133079, "epoch": 792} {"train_loss": -10.478472709655762, "global_step": 133080, "epoch": 792} {"train_loss": -10.582880020141602, "global_step": 133081, "epoch": 792} {"train_loss": -10.39335823059082, "global_step": 133082, "epoch": 792} {"train_loss": -10.408589363098145, "global_step": 133083, "epoch": 792} {"train_loss": -10.410114288330078, "global_step": 133084, "epoch": 792} {"train_loss": -10.308874130249023, "global_step": 133085, "epoch": 792} {"train_loss": -10.483404159545898, "global_step": 133086, "epoch": 792} {"train_loss": -10.48127555847168, "global_step": 133087, "epoch": 792} {"train_loss": -10.278515815734863, "global_step": 133088, "epoch": 792} {"train_loss": -10.679508209228516, "global_step": 133089, "epoch": 792} {"train_loss": -10.478617668151855, "global_step": 133090, "epoch": 792} {"train_loss": -10.479546546936035, "global_step": 133091, "epoch": 792} {"train_loss": -10.514850616455078, "global_step": 133092, "epoch": 792} {"train_loss": -10.46920108795166, "global_step": 133093, "epoch": 792} {"train_loss": -10.748199462890625, "global_step": 133094, "epoch": 792} {"train_loss": -10.443065643310547, "global_step": 133095, "epoch": 792} {"train_loss": -10.442837715148926, "global_step": 133096, "epoch": 792} {"train_loss": -10.599479675292969, "global_step": 133097, "epoch": 792} {"train_loss": -10.517746925354004, "global_step": 133098, "epoch": 792} {"train_loss": -10.37666130065918, "global_step": 133099, "epoch": 792} {"train_loss": -10.466363906860352, "global_step": 133100, "epoch": 792} {"train_loss": -10.355710983276367, "global_step": 133101, "epoch": 792} {"train_loss": -10.59238338470459, "global_step": 133102, "epoch": 792} {"train_loss": -10.173388481140137, "global_step": 133103, "epoch": 792} {"train_loss": -10.19857120513916, "global_step": 133104, "epoch": 792} {"train_loss": -10.646549224853516, "global_step": 133105, "epoch": 792} {"train_loss": -9.920352935791016, "global_step": 133106, "epoch": 792} {"train_loss": -10.671358108520508, "global_step": 133107, "epoch": 792} {"train_loss": -10.126827239990234, "global_step": 133108, "epoch": 792} {"train_loss": -10.50289535522461, "global_step": 133109, "epoch": 792} {"train_loss": -10.34669017791748, "global_step": 133110, "epoch": 792} {"train_loss": -10.294626235961914, "global_step": 133111, "epoch": 792} {"train_loss": -10.495481491088867, "global_step": 133112, "epoch": 792} {"train_loss": -10.181863784790039, "global_step": 133113, "epoch": 792} {"train_loss": -10.418731689453125, "global_step": 133114, "epoch": 792} {"train_loss": -10.222307205200195, "global_step": 133115, "epoch": 792} {"train_loss": -10.572179794311523, "global_step": 133116, "epoch": 792} {"train_loss": -10.306654930114746, "global_step": 133117, "epoch": 792} {"train_loss": -10.497331619262695, "global_step": 133118, "epoch": 792} {"train_loss": -10.568056106567383, "global_step": 133119, "epoch": 792} {"train_loss": -10.819931030273438, "global_step": 133120, "epoch": 792} {"train_loss": -10.680692672729492, "global_step": 133121, "epoch": 792} {"train_loss": -10.711206436157227, "global_step": 133122, "epoch": 792} {"train_loss": -10.649873733520508, "global_step": 133123, "epoch": 792} {"train_loss": -10.567890167236328, "global_step": 133124, "epoch": 792} {"train_loss": -10.535463333129883, "global_step": 133125, "epoch": 792} {"train_loss": -10.583112716674805, "global_step": 133126, "epoch": 792} {"train_loss": -10.545345306396484, "global_step": 133127, "epoch": 792} {"train_loss": -10.703622817993164, "global_step": 133128, "epoch": 792} {"train_loss": -10.764775276184082, "global_step": 133129, "epoch": 792} {"train_loss": -10.61168098449707, "global_step": 133130, "epoch": 792} {"train_loss": -10.538680076599121, "global_step": 133131, "epoch": 792} {"train_loss": -10.257652282714844, "global_step": 133132, "epoch": 792} {"train_loss": -10.54928207397461, "global_step": 133133, "epoch": 792} {"train_loss": -10.434678077697754, "global_step": 133134, "epoch": 792} {"train_loss": -10.190754890441895, "global_step": 133135, "epoch": 792} {"train_loss": -10.310229301452637, "global_step": 133136, "epoch": 792} {"train_loss": -10.751365661621094, "global_step": 133137, "epoch": 792} {"train_loss": -10.147467613220215, "global_step": 133138, "epoch": 792} {"train_loss": -10.506451606750488, "global_step": 133139, "epoch": 792} {"train_loss": -10.555999755859375, "global_step": 133140, "epoch": 792} {"train_loss": -10.591981887817383, "global_step": 133141, "epoch": 792} {"train_loss": -10.234268188476562, "global_step": 133142, "epoch": 792} {"train_loss": -10.52553653717041, "global_step": 133143, "epoch": 792} {"train_loss": -10.304961204528809, "global_step": 133144, "epoch": 792} {"train_loss": -10.533851623535156, "global_step": 133145, "epoch": 792} {"train_loss": -10.658207893371582, "global_step": 133146, "epoch": 792} {"train_loss": -10.400754928588867, "global_step": 133147, "epoch": 792} {"train_loss": -10.42153549194336, "global_step": 133148, "epoch": 792} {"train_loss": -10.554178237915039, "global_step": 133149, "epoch": 792} {"train_loss": -10.272665023803711, "global_step": 133150, "epoch": 792} {"train_loss": -10.599688529968262, "global_step": 133151, "epoch": 792} {"train_loss": -10.147054672241211, "global_step": 133152, "epoch": 792} {"train_loss": -10.52963638305664, "global_step": 133153, "epoch": 792} {"train_loss": -10.285196304321289, "global_step": 133154, "epoch": 792} {"train_loss": -10.268312454223633, "global_step": 133155, "epoch": 792} {"train_loss": -10.235321044921875, "global_step": 133156, "epoch": 792} {"train_loss": -10.159395217895508, "global_step": 133157, "epoch": 792} {"train_loss": -10.405112266540527, "global_step": 133158, "epoch": 792} {"train_loss": -9.930871963500977, "global_step": 133159, "epoch": 792} {"train_loss": -10.417113304138184, "global_step": 133160, "epoch": 792} {"train_loss": -10.230524063110352, "global_step": 133161, "epoch": 792} {"train_loss": -10.089908599853516, "global_step": 133162, "epoch": 792} {"train_loss": -10.237686157226562, "global_step": 133163, "epoch": 792} {"train_loss": -10.141112327575684, "global_step": 133164, "epoch": 792} {"train_loss": -10.180450439453125, "global_step": 133165, "epoch": 792} {"train_loss": -10.206785202026367, "global_step": 133166, "epoch": 792} {"train_loss": -10.303342819213867, "global_step": 133167, "epoch": 792} {"train_loss": -10.33549976348877, "global_step": 133168, "epoch": 792} {"train_loss": -9.838011741638184, "global_step": 133169, "epoch": 792} {"train_loss": -10.331258773803711, "global_step": 133170, "epoch": 792} {"train_loss": -10.173149108886719, "global_step": 133171, "epoch": 792} {"train_loss": -10.173582077026367, "global_step": 133172, "epoch": 792} {"train_loss": -10.04925537109375, "global_step": 133173, "epoch": 792} {"train_loss": -10.165789604187012, "global_step": 133174, "epoch": 792} {"train_loss": -10.264411926269531, "global_step": 133175, "epoch": 792} {"train_loss": -10.02454948425293, "global_step": 133176, "epoch": 792} {"train_loss": -10.441713333129883, "global_step": 133177, "epoch": 792} {"train_loss": -10.182507514953613, "global_step": 133178, "epoch": 792} {"train_loss": -10.369224548339844, "global_step": 133179, "epoch": 792} {"train_loss": -10.325799942016602, "global_step": 133180, "epoch": 792} {"train_loss": -10.160669326782227, "global_step": 133181, "epoch": 792} {"train_loss": -10.394092559814453, "global_step": 133182, "epoch": 792} {"train_loss": -10.284193992614746, "global_step": 133183, "epoch": 792} {"train_loss": -10.162922859191895, "global_step": 133184, "epoch": 792} {"train_loss": -10.2568941116333, "global_step": 133185, "epoch": 792} {"train_loss": -10.214263916015625, "global_step": 133186, "epoch": 792} {"train_loss": -10.172262191772461, "global_step": 133187, "epoch": 792} {"train_loss": -10.285224914550781, "global_step": 133188, "epoch": 792} {"train_loss": -10.331003189086914, "global_step": 133189, "epoch": 792} {"train_loss": -10.156839370727539, "global_step": 133190, "epoch": 792} {"train_loss": -10.725887298583984, "global_step": 133191, "epoch": 792} {"train_loss": -10.234089851379395, "global_step": 133192, "epoch": 792} {"train_loss": -10.596847534179688, "global_step": 133193, "epoch": 792} {"train_loss": -10.635611534118652, "global_step": 133194, "epoch": 792} {"train_loss": -10.402593612670898, "global_step": 133195, "epoch": 792} {"train_loss": -10.49399185180664, "global_step": 133196, "epoch": 792} {"train_loss": -10.724397659301758, "global_step": 133197, "epoch": 792} {"train_loss": -10.601134300231934, "global_step": 133198, "epoch": 792} {"train_loss": -10.68765640258789, "global_step": 133199, "epoch": 792} {"train_loss": -10.601898193359375, "global_step": 133200, "epoch": 792} {"train_loss": -10.702041625976562, "global_step": 133201, "epoch": 792} {"train_loss": -10.56416130065918, "global_step": 133202, "epoch": 792} {"train_loss": -10.332618713378906, "global_step": 133203, "epoch": 792} {"train_loss": -10.526351928710938, "global_step": 133204, "epoch": 792} {"train_loss": -10.680696487426758, "global_step": 133205, "epoch": 792} {"train_loss": -10.518413543701172, "global_step": 133206, "epoch": 792} {"train_loss": -10.6017484664917, "global_step": 133207, "epoch": 792} {"train_loss": -10.44774055480957, "global_step": 133208, "epoch": 792} {"train_loss": -10.43172836303711, "global_step": 133209, "epoch": 792} {"train_loss": -10.020505905151367, "global_step": 133210, "epoch": 792} {"train_loss": -10.556011199951172, "global_step": 133211, "epoch": 792} {"train_loss": -10.165586471557617, "global_step": 133212, "epoch": 792} {"train_loss": -10.295916557312012, "global_step": 133213, "epoch": 792} {"train_loss": -10.559812545776367, "global_step": 133214, "epoch": 792} {"train_loss": -10.473023414611816, "global_step": 133215, "epoch": 792} {"train_loss": -10.363086700439453, "global_step": 133216, "epoch": 792} {"train_loss": -10.252833366394043, "global_step": 133217, "epoch": 792} {"train_loss": -10.617379188537598, "global_step": 133218, "epoch": 792} {"train_loss": -10.47563362121582, "global_step": 133219, "epoch": 792} {"train_loss": -10.464333534240723, "global_step": 133220, "epoch": 792} {"train_loss": -10.69459342956543, "global_step": 133221, "epoch": 792} {"train_loss": -10.299386024475098, "global_step": 133222, "epoch": 792} {"train_loss": -10.415821506863548, "global_step": 133223, "epoch": 792, "val_loss": 218794.375} {"train_loss": -10.652301788330078, "global_step": 133224, "epoch": 793} {"train_loss": -10.467853546142578, "global_step": 133225, "epoch": 793} {"train_loss": -10.494735717773438, "global_step": 133226, "epoch": 793} {"train_loss": -10.221009254455566, "global_step": 133227, "epoch": 793} {"train_loss": -10.48026180267334, "global_step": 133228, "epoch": 793} {"train_loss": -10.5830078125, "global_step": 133229, "epoch": 793} {"train_loss": -10.614068984985352, "global_step": 133230, "epoch": 793} {"train_loss": -10.343332290649414, "global_step": 133231, "epoch": 793} {"train_loss": -10.415728569030762, "global_step": 133232, "epoch": 793} {"train_loss": -10.48106861114502, "global_step": 133233, "epoch": 793} {"train_loss": -10.493917465209961, "global_step": 133234, "epoch": 793} {"train_loss": -10.549070358276367, "global_step": 133235, "epoch": 793} {"train_loss": -10.239713668823242, "global_step": 133236, "epoch": 793} {"train_loss": -10.730030059814453, "global_step": 133237, "epoch": 793} {"train_loss": -10.032135009765625, "global_step": 133238, "epoch": 793} {"train_loss": -10.42618179321289, "global_step": 133239, "epoch": 793} {"train_loss": -10.588504791259766, "global_step": 133240, "epoch": 793} {"train_loss": -10.668966293334961, "global_step": 133241, "epoch": 793} {"train_loss": -10.610271453857422, "global_step": 133242, "epoch": 793} {"train_loss": -10.780643463134766, "global_step": 133243, "epoch": 793} {"train_loss": -9.997600555419922, "global_step": 133244, "epoch": 793} {"train_loss": -10.50261116027832, "global_step": 133245, "epoch": 793} {"train_loss": -10.481005668640137, "global_step": 133246, "epoch": 793} {"train_loss": -10.639274597167969, "global_step": 133247, "epoch": 793} {"train_loss": -10.565732955932617, "global_step": 133248, "epoch": 793} {"train_loss": -10.287357330322266, "global_step": 133249, "epoch": 793} {"train_loss": -10.448163032531738, "global_step": 133250, "epoch": 793} {"train_loss": -10.317581176757812, "global_step": 133251, "epoch": 793} {"train_loss": -10.579710960388184, "global_step": 133252, "epoch": 793} {"train_loss": -10.6017427444458, "global_step": 133253, "epoch": 793} {"train_loss": -10.064854621887207, "global_step": 133254, "epoch": 793} {"train_loss": -10.369452476501465, "global_step": 133255, "epoch": 793} {"train_loss": -10.481832504272461, "global_step": 133256, "epoch": 793} {"train_loss": -9.564090728759766, "global_step": 133257, "epoch": 793} {"train_loss": -10.380699157714844, "global_step": 133258, "epoch": 793} {"train_loss": -9.679891586303711, "global_step": 133259, "epoch": 793} {"train_loss": -9.709208488464355, "global_step": 133260, "epoch": 793} {"train_loss": -10.30390739440918, "global_step": 133261, "epoch": 793} {"train_loss": -9.524898529052734, "global_step": 133262, "epoch": 793} {"train_loss": -10.113325119018555, "global_step": 133263, "epoch": 793} {"train_loss": -9.747039794921875, "global_step": 133264, "epoch": 793} {"train_loss": -9.797161102294922, "global_step": 133265, "epoch": 793} {"train_loss": -9.14671516418457, "global_step": 133266, "epoch": 793} {"train_loss": -9.52817153930664, "global_step": 133267, "epoch": 793} {"train_loss": -9.43227481842041, "global_step": 133268, "epoch": 793} {"train_loss": -8.902620315551758, "global_step": 133269, "epoch": 793} {"train_loss": -10.047850608825684, "global_step": 133270, "epoch": 793} {"train_loss": -9.255224227905273, "global_step": 133271, "epoch": 793} {"train_loss": -9.929900169372559, "global_step": 133272, "epoch": 793} {"train_loss": -9.784512519836426, "global_step": 133273, "epoch": 793} {"train_loss": -9.639318466186523, "global_step": 133274, "epoch": 793} {"train_loss": -9.412729263305664, "global_step": 133275, "epoch": 793} {"train_loss": -10.074394226074219, "global_step": 133276, "epoch": 793} {"train_loss": -9.51607894897461, "global_step": 133277, "epoch": 793} {"train_loss": -9.885927200317383, "global_step": 133278, "epoch": 793} {"train_loss": -10.005071640014648, "global_step": 133279, "epoch": 793} {"train_loss": -9.900861740112305, "global_step": 133280, "epoch": 793} {"train_loss": -10.089179992675781, "global_step": 133281, "epoch": 793} {"train_loss": -10.22850513458252, "global_step": 133282, "epoch": 793} {"train_loss": -10.194845199584961, "global_step": 133283, "epoch": 793} {"train_loss": -10.161259651184082, "global_step": 133284, "epoch": 793} {"train_loss": -10.150247573852539, "global_step": 133285, "epoch": 793} {"train_loss": -10.354667663574219, "global_step": 133286, "epoch": 793} {"train_loss": -10.28094482421875, "global_step": 133287, "epoch": 793} {"train_loss": -10.383434295654297, "global_step": 133288, "epoch": 793} {"train_loss": -10.304415702819824, "global_step": 133289, "epoch": 793} {"train_loss": -10.526525497436523, "global_step": 133290, "epoch": 793} {"train_loss": -10.439376831054688, "global_step": 133291, "epoch": 793} {"train_loss": -10.367863655090332, "global_step": 133292, "epoch": 793} {"train_loss": -10.485429763793945, "global_step": 133293, "epoch": 793} {"train_loss": -10.053804397583008, "global_step": 133294, "epoch": 793} {"train_loss": -10.36815071105957, "global_step": 133295, "epoch": 793} {"train_loss": -10.287263870239258, "global_step": 133296, "epoch": 793} {"train_loss": -10.52385425567627, "global_step": 133297, "epoch": 793} {"train_loss": -10.235294342041016, "global_step": 133298, "epoch": 793} {"train_loss": -10.58743953704834, "global_step": 133299, "epoch": 793} {"train_loss": -10.495039939880371, "global_step": 133300, "epoch": 793} {"train_loss": -10.463486671447754, "global_step": 133301, "epoch": 793} {"train_loss": -10.503942489624023, "global_step": 133302, "epoch": 793} {"train_loss": -10.738615989685059, "global_step": 133303, "epoch": 793} {"train_loss": -10.694632530212402, "global_step": 133304, "epoch": 793} {"train_loss": -10.467619895935059, "global_step": 133305, "epoch": 793} {"train_loss": -10.671581268310547, "global_step": 133306, "epoch": 793} {"train_loss": -10.419668197631836, "global_step": 133307, "epoch": 793} {"train_loss": -10.648597717285156, "global_step": 133308, "epoch": 793} {"train_loss": -10.503519058227539, "global_step": 133309, "epoch": 793} {"train_loss": -10.718935012817383, "global_step": 133310, "epoch": 793} {"train_loss": -10.408045768737793, "global_step": 133311, "epoch": 793} {"train_loss": -10.436948776245117, "global_step": 133312, "epoch": 793} {"train_loss": -10.733402252197266, "global_step": 133313, "epoch": 793} {"train_loss": -10.514216423034668, "global_step": 133314, "epoch": 793} {"train_loss": -10.639893531799316, "global_step": 133315, "epoch": 793} {"train_loss": -10.666435241699219, "global_step": 133316, "epoch": 793} {"train_loss": -10.681803703308105, "global_step": 133317, "epoch": 793} {"train_loss": -10.478996276855469, "global_step": 133318, "epoch": 793} {"train_loss": -10.27208137512207, "global_step": 133319, "epoch": 793} {"train_loss": -10.680355072021484, "global_step": 133320, "epoch": 793} {"train_loss": -10.536739349365234, "global_step": 133321, "epoch": 793} {"train_loss": -10.210660934448242, "global_step": 133322, "epoch": 793} {"train_loss": -10.683095932006836, "global_step": 133323, "epoch": 793} {"train_loss": -9.811075210571289, "global_step": 133324, "epoch": 793} {"train_loss": -10.129212379455566, "global_step": 133325, "epoch": 793} {"train_loss": -10.195273399353027, "global_step": 133326, "epoch": 793} {"train_loss": -10.254425048828125, "global_step": 133327, "epoch": 793} {"train_loss": -10.172016143798828, "global_step": 133328, "epoch": 793} {"train_loss": -10.517354011535645, "global_step": 133329, "epoch": 793} {"train_loss": -10.201120376586914, "global_step": 133330, "epoch": 793} {"train_loss": -10.494399070739746, "global_step": 133331, "epoch": 793} {"train_loss": -10.428068161010742, "global_step": 133332, "epoch": 793} {"train_loss": -10.349691390991211, "global_step": 133333, "epoch": 793} {"train_loss": -10.268991470336914, "global_step": 133334, "epoch": 793} {"train_loss": -10.34709644317627, "global_step": 133335, "epoch": 793} {"train_loss": -10.509744644165039, "global_step": 133336, "epoch": 793} {"train_loss": -10.515629768371582, "global_step": 133337, "epoch": 793} {"train_loss": -10.522100448608398, "global_step": 133338, "epoch": 793} {"train_loss": -10.715597152709961, "global_step": 133339, "epoch": 793} {"train_loss": -10.720548629760742, "global_step": 133340, "epoch": 793} {"train_loss": -10.490102767944336, "global_step": 133341, "epoch": 793} {"train_loss": -10.33537483215332, "global_step": 133342, "epoch": 793} {"train_loss": -10.548503875732422, "global_step": 133343, "epoch": 793} {"train_loss": -10.354543685913086, "global_step": 133344, "epoch": 793} {"train_loss": -10.389452934265137, "global_step": 133345, "epoch": 793} {"train_loss": -10.716290473937988, "global_step": 133346, "epoch": 793} {"train_loss": -10.472054481506348, "global_step": 133347, "epoch": 793} {"train_loss": -10.540328979492188, "global_step": 133348, "epoch": 793} {"train_loss": -10.490495681762695, "global_step": 133349, "epoch": 793} {"train_loss": -10.360462188720703, "global_step": 133350, "epoch": 793} {"train_loss": -10.541643142700195, "global_step": 133351, "epoch": 793} {"train_loss": -10.48396110534668, "global_step": 133352, "epoch": 793} {"train_loss": -9.9061918258667, "global_step": 133353, "epoch": 793} {"train_loss": -10.497151374816895, "global_step": 133354, "epoch": 793} {"train_loss": -10.544319152832031, "global_step": 133355, "epoch": 793} {"train_loss": -10.47756576538086, "global_step": 133356, "epoch": 793} {"train_loss": -10.486039161682129, "global_step": 133357, "epoch": 793} {"train_loss": -10.609314918518066, "global_step": 133358, "epoch": 793} {"train_loss": -10.449832916259766, "global_step": 133359, "epoch": 793} {"train_loss": -10.216808319091797, "global_step": 133360, "epoch": 793} {"train_loss": -10.505746841430664, "global_step": 133361, "epoch": 793} {"train_loss": -10.151261329650879, "global_step": 133362, "epoch": 793} {"train_loss": -10.418466567993164, "global_step": 133363, "epoch": 793} {"train_loss": -10.412217140197754, "global_step": 133364, "epoch": 793} {"train_loss": -10.493541717529297, "global_step": 133365, "epoch": 793} {"train_loss": -10.712438583374023, "global_step": 133366, "epoch": 793} {"train_loss": -10.450887680053711, "global_step": 133367, "epoch": 793} {"train_loss": -10.357074737548828, "global_step": 133368, "epoch": 793} {"train_loss": -10.609048843383789, "global_step": 133369, "epoch": 793} {"train_loss": -10.515291213989258, "global_step": 133370, "epoch": 793} {"train_loss": -10.570281028747559, "global_step": 133371, "epoch": 793} {"train_loss": -10.584418296813965, "global_step": 133372, "epoch": 793} {"train_loss": -10.602676391601562, "global_step": 133373, "epoch": 793} {"train_loss": -10.549100875854492, "global_step": 133374, "epoch": 793} {"train_loss": -10.713549613952637, "global_step": 133375, "epoch": 793} {"train_loss": -10.536046981811523, "global_step": 133376, "epoch": 793} {"train_loss": -10.464801788330078, "global_step": 133377, "epoch": 793} {"train_loss": -10.334859848022461, "global_step": 133378, "epoch": 793} {"train_loss": -10.364206314086914, "global_step": 133379, "epoch": 793} {"train_loss": -10.329163551330566, "global_step": 133380, "epoch": 793} {"train_loss": -9.820878028869629, "global_step": 133381, "epoch": 793} {"train_loss": -10.479591369628906, "global_step": 133382, "epoch": 793} {"train_loss": -9.869205474853516, "global_step": 133383, "epoch": 793} {"train_loss": -10.385697364807129, "global_step": 133384, "epoch": 793} {"train_loss": -10.154170989990234, "global_step": 133385, "epoch": 793} {"train_loss": -10.208236694335938, "global_step": 133386, "epoch": 793} {"train_loss": -10.590838432312012, "global_step": 133387, "epoch": 793} {"train_loss": -10.043548583984375, "global_step": 133388, "epoch": 793} {"train_loss": -10.568599700927734, "global_step": 133389, "epoch": 793} {"train_loss": -9.827495574951172, "global_step": 133390, "epoch": 793} {"train_loss": -10.326236963272095, "global_step": 133391, "epoch": 793, "val_loss": 221637.75} {"train_loss": -10.320964813232422, "global_step": 133392, "epoch": 794} {"train_loss": -10.238313674926758, "global_step": 133393, "epoch": 794} {"train_loss": -10.130583763122559, "global_step": 133394, "epoch": 794} {"train_loss": -9.943751335144043, "global_step": 133395, "epoch": 794} {"train_loss": -10.240694046020508, "global_step": 133396, "epoch": 794} {"train_loss": -9.924659729003906, "global_step": 133397, "epoch": 794} {"train_loss": -10.408775329589844, "global_step": 133398, "epoch": 794} {"train_loss": -10.001684188842773, "global_step": 133399, "epoch": 794} {"train_loss": -10.028467178344727, "global_step": 133400, "epoch": 794} {"train_loss": -9.753063201904297, "global_step": 133401, "epoch": 794} {"train_loss": -10.221992492675781, "global_step": 133402, "epoch": 794} {"train_loss": -9.812150955200195, "global_step": 133403, "epoch": 794} {"train_loss": -10.344854354858398, "global_step": 133404, "epoch": 794} {"train_loss": -9.992207527160645, "global_step": 133405, "epoch": 794} {"train_loss": -10.356378555297852, "global_step": 133406, "epoch": 794} {"train_loss": -9.865955352783203, "global_step": 133407, "epoch": 794} {"train_loss": -10.427660942077637, "global_step": 133408, "epoch": 794} {"train_loss": -9.908360481262207, "global_step": 133409, "epoch": 794} {"train_loss": -10.040597915649414, "global_step": 133410, "epoch": 794} {"train_loss": -9.772371292114258, "global_step": 133411, "epoch": 794} {"train_loss": -9.736289978027344, "global_step": 133412, "epoch": 794} {"train_loss": -9.827713012695312, "global_step": 133413, "epoch": 794} {"train_loss": -9.687902450561523, "global_step": 133414, "epoch": 794} {"train_loss": -10.14150619506836, "global_step": 133415, "epoch": 794} {"train_loss": -9.08381462097168, "global_step": 133416, "epoch": 794} {"train_loss": -10.467168807983398, "global_step": 133417, "epoch": 794} {"train_loss": -9.383161544799805, "global_step": 133418, "epoch": 794} {"train_loss": -10.309846878051758, "global_step": 133419, "epoch": 794} {"train_loss": -9.78984260559082, "global_step": 133420, "epoch": 794} {"train_loss": -9.763710021972656, "global_step": 133421, "epoch": 794} {"train_loss": -9.858247756958008, "global_step": 133422, "epoch": 794} {"train_loss": -10.174396514892578, "global_step": 133423, "epoch": 794} {"train_loss": -10.067276954650879, "global_step": 133424, "epoch": 794} {"train_loss": -9.780317306518555, "global_step": 133425, "epoch": 794} {"train_loss": -10.109726905822754, "global_step": 133426, "epoch": 794} {"train_loss": -9.711763381958008, "global_step": 133427, "epoch": 794} {"train_loss": -9.950478553771973, "global_step": 133428, "epoch": 794} {"train_loss": -10.115962982177734, "global_step": 133429, "epoch": 794} {"train_loss": -10.204790115356445, "global_step": 133430, "epoch": 794} {"train_loss": -9.947851181030273, "global_step": 133431, "epoch": 794} {"train_loss": -10.34500503540039, "global_step": 133432, "epoch": 794} {"train_loss": -10.029476165771484, "global_step": 133433, "epoch": 794} {"train_loss": -10.425936698913574, "global_step": 133434, "epoch": 794} {"train_loss": -9.987089157104492, "global_step": 133435, "epoch": 794} {"train_loss": -10.345311164855957, "global_step": 133436, "epoch": 794} {"train_loss": -10.360757827758789, "global_step": 133437, "epoch": 794} {"train_loss": -10.152111053466797, "global_step": 133438, "epoch": 794} {"train_loss": -10.247604370117188, "global_step": 133439, "epoch": 794} {"train_loss": -10.275362014770508, "global_step": 133440, "epoch": 794} {"train_loss": -10.3021879196167, "global_step": 133441, "epoch": 794} {"train_loss": -10.256219863891602, "global_step": 133442, "epoch": 794} {"train_loss": -10.252971649169922, "global_step": 133443, "epoch": 794} {"train_loss": -10.35633659362793, "global_step": 133444, "epoch": 794} {"train_loss": -10.21141242980957, "global_step": 133445, "epoch": 794} {"train_loss": -10.299208641052246, "global_step": 133446, "epoch": 794} {"train_loss": -10.551474571228027, "global_step": 133447, "epoch": 794} {"train_loss": -10.15673828125, "global_step": 133448, "epoch": 794} {"train_loss": -10.378485679626465, "global_step": 133449, "epoch": 794} {"train_loss": -10.476522445678711, "global_step": 133450, "epoch": 794} {"train_loss": -10.360702514648438, "global_step": 133451, "epoch": 794} {"train_loss": -10.403068542480469, "global_step": 133452, "epoch": 794} {"train_loss": -10.458322525024414, "global_step": 133453, "epoch": 794} {"train_loss": -10.29925537109375, "global_step": 133454, "epoch": 794} {"train_loss": -10.409832000732422, "global_step": 133455, "epoch": 794} {"train_loss": -10.470134735107422, "global_step": 133456, "epoch": 794} {"train_loss": -10.11440372467041, "global_step": 133457, "epoch": 794} {"train_loss": -10.456792831420898, "global_step": 133458, "epoch": 794} {"train_loss": -10.59765625, "global_step": 133459, "epoch": 794} {"train_loss": -10.418848037719727, "global_step": 133460, "epoch": 794} {"train_loss": -10.439175605773926, "global_step": 133461, "epoch": 794} {"train_loss": -10.450296401977539, "global_step": 133462, "epoch": 794} {"train_loss": -10.755184173583984, "global_step": 133463, "epoch": 794} {"train_loss": -10.646764755249023, "global_step": 133464, "epoch": 794} {"train_loss": -10.834471702575684, "global_step": 133465, "epoch": 794} {"train_loss": -10.538908004760742, "global_step": 133466, "epoch": 794} {"train_loss": -10.51486587524414, "global_step": 133467, "epoch": 794} {"train_loss": -10.594679832458496, "global_step": 133468, "epoch": 794} {"train_loss": -10.644242286682129, "global_step": 133469, "epoch": 794} {"train_loss": -10.896932601928711, "global_step": 133470, "epoch": 794} {"train_loss": -10.353328704833984, "global_step": 133471, "epoch": 794} {"train_loss": -10.298449516296387, "global_step": 133472, "epoch": 794} {"train_loss": -10.831748962402344, "global_step": 133473, "epoch": 794} {"train_loss": -10.554742813110352, "global_step": 133474, "epoch": 794} {"train_loss": -10.707133293151855, "global_step": 133475, "epoch": 794} {"train_loss": -10.498278617858887, "global_step": 133476, "epoch": 794} {"train_loss": -10.777704238891602, "global_step": 133477, "epoch": 794} {"train_loss": -10.8284912109375, "global_step": 133478, "epoch": 794} {"train_loss": -10.469034194946289, "global_step": 133479, "epoch": 794} {"train_loss": -10.810091018676758, "global_step": 133480, "epoch": 794} {"train_loss": -10.39378547668457, "global_step": 133481, "epoch": 794} {"train_loss": -10.281837463378906, "global_step": 133482, "epoch": 794} {"train_loss": -10.665227890014648, "global_step": 133483, "epoch": 794} {"train_loss": -9.933929443359375, "global_step": 133484, "epoch": 794} {"train_loss": -10.327310562133789, "global_step": 133485, "epoch": 794} {"train_loss": -10.0776948928833, "global_step": 133486, "epoch": 794} {"train_loss": -10.416692733764648, "global_step": 133487, "epoch": 794} {"train_loss": -10.354896545410156, "global_step": 133488, "epoch": 794} {"train_loss": -10.006088256835938, "global_step": 133489, "epoch": 794} {"train_loss": -10.116868019104004, "global_step": 133490, "epoch": 794} {"train_loss": -10.266273498535156, "global_step": 133491, "epoch": 794} {"train_loss": -10.22584056854248, "global_step": 133492, "epoch": 794} {"train_loss": -10.671771049499512, "global_step": 133493, "epoch": 794} {"train_loss": -10.294776916503906, "global_step": 133494, "epoch": 794} {"train_loss": -10.873453140258789, "global_step": 133495, "epoch": 794} {"train_loss": -10.04006290435791, "global_step": 133496, "epoch": 794} {"train_loss": -10.41767692565918, "global_step": 133497, "epoch": 794} {"train_loss": -10.350979804992676, "global_step": 133498, "epoch": 794} {"train_loss": -10.313602447509766, "global_step": 133499, "epoch": 794} {"train_loss": -10.513797760009766, "global_step": 133500, "epoch": 794} {"train_loss": -10.575608253479004, "global_step": 133501, "epoch": 794} {"train_loss": -10.277189254760742, "global_step": 133502, "epoch": 794} {"train_loss": -10.707929611206055, "global_step": 133503, "epoch": 794} {"train_loss": -10.282637596130371, "global_step": 133504, "epoch": 794} {"train_loss": -10.643782615661621, "global_step": 133505, "epoch": 794} {"train_loss": -10.481671333312988, "global_step": 133506, "epoch": 794} {"train_loss": -10.433375358581543, "global_step": 133507, "epoch": 794} {"train_loss": -10.693653106689453, "global_step": 133508, "epoch": 794} {"train_loss": -10.591621398925781, "global_step": 133509, "epoch": 794} {"train_loss": -10.732032775878906, "global_step": 133510, "epoch": 794} {"train_loss": -10.648200988769531, "global_step": 133511, "epoch": 794} {"train_loss": -10.56964111328125, "global_step": 133512, "epoch": 794} {"train_loss": -10.698410034179688, "global_step": 133513, "epoch": 794} {"train_loss": -10.80742073059082, "global_step": 133514, "epoch": 794} {"train_loss": -10.229984283447266, "global_step": 133515, "epoch": 794} {"train_loss": -10.560587882995605, "global_step": 133516, "epoch": 794} {"train_loss": -10.279632568359375, "global_step": 133517, "epoch": 794} {"train_loss": -10.693306922912598, "global_step": 133518, "epoch": 794} {"train_loss": -10.189776420593262, "global_step": 133519, "epoch": 794} {"train_loss": -10.678567886352539, "global_step": 133520, "epoch": 794} {"train_loss": -10.611261367797852, "global_step": 133521, "epoch": 794} {"train_loss": -10.589576721191406, "global_step": 133522, "epoch": 794} {"train_loss": -10.705208778381348, "global_step": 133523, "epoch": 794} {"train_loss": -10.619600296020508, "global_step": 133524, "epoch": 794} {"train_loss": -10.754512786865234, "global_step": 133525, "epoch": 794} {"train_loss": -10.512529373168945, "global_step": 133526, "epoch": 794} {"train_loss": -10.448963165283203, "global_step": 133527, "epoch": 794} {"train_loss": -10.394070625305176, "global_step": 133528, "epoch": 794} {"train_loss": -10.44654655456543, "global_step": 133529, "epoch": 794} {"train_loss": -10.474221229553223, "global_step": 133530, "epoch": 794} {"train_loss": -10.64479923248291, "global_step": 133531, "epoch": 794} {"train_loss": -10.418386459350586, "global_step": 133532, "epoch": 794} {"train_loss": -10.411677360534668, "global_step": 133533, "epoch": 794} {"train_loss": -10.159181594848633, "global_step": 133534, "epoch": 794} {"train_loss": -10.520198822021484, "global_step": 133535, "epoch": 794} {"train_loss": -10.742148399353027, "global_step": 133536, "epoch": 794} {"train_loss": -10.389663696289062, "global_step": 133537, "epoch": 794} {"train_loss": -10.647014617919922, "global_step": 133538, "epoch": 794} {"train_loss": -10.51015567779541, "global_step": 133539, "epoch": 794} {"train_loss": -10.30864429473877, "global_step": 133540, "epoch": 794} {"train_loss": -9.789981842041016, "global_step": 133541, "epoch": 794} {"train_loss": -9.936904907226562, "global_step": 133542, "epoch": 794} {"train_loss": -10.49882698059082, "global_step": 133543, "epoch": 794} {"train_loss": -9.84917163848877, "global_step": 133544, "epoch": 794} {"train_loss": -10.336180686950684, "global_step": 133545, "epoch": 794} {"train_loss": -10.10801887512207, "global_step": 133546, "epoch": 794} {"train_loss": -10.381645202636719, "global_step": 133547, "epoch": 794} {"train_loss": -10.362200736999512, "global_step": 133548, "epoch": 794} {"train_loss": -10.139287948608398, "global_step": 133549, "epoch": 794} {"train_loss": -10.116426467895508, "global_step": 133550, "epoch": 794} {"train_loss": -10.301658630371094, "global_step": 133551, "epoch": 794} {"train_loss": -10.137251853942871, "global_step": 133552, "epoch": 794} {"train_loss": -10.58497428894043, "global_step": 133553, "epoch": 794} {"train_loss": -9.823766708374023, "global_step": 133554, "epoch": 794} {"train_loss": -10.15330982208252, "global_step": 133555, "epoch": 794} {"train_loss": -10.300225257873535, "global_step": 133556, "epoch": 794} {"train_loss": -10.062997817993164, "global_step": 133557, "epoch": 794} {"train_loss": -10.249500274658203, "global_step": 133558, "epoch": 794} {"train_loss": -10.313109403564816, "global_step": 133559, "epoch": 794, "val_loss": 220311.171875} {"train_loss": -10.078091621398926, "global_step": 133560, "epoch": 795} {"train_loss": -9.82210922241211, "global_step": 133561, "epoch": 795} {"train_loss": -10.359991073608398, "global_step": 133562, "epoch": 795} {"train_loss": -10.477811813354492, "global_step": 133563, "epoch": 795} {"train_loss": -10.332246780395508, "global_step": 133564, "epoch": 795} {"train_loss": -10.232643127441406, "global_step": 133565, "epoch": 795} {"train_loss": -10.536048889160156, "global_step": 133566, "epoch": 795} {"train_loss": -10.075100898742676, "global_step": 133567, "epoch": 795} {"train_loss": -10.306314468383789, "global_step": 133568, "epoch": 795} {"train_loss": -10.280916213989258, "global_step": 133569, "epoch": 795} {"train_loss": -10.092399597167969, "global_step": 133570, "epoch": 795} {"train_loss": -10.292301177978516, "global_step": 133571, "epoch": 795} {"train_loss": -10.286190032958984, "global_step": 133572, "epoch": 795} {"train_loss": -10.188136100769043, "global_step": 133573, "epoch": 795} {"train_loss": -10.017448425292969, "global_step": 133574, "epoch": 795} {"train_loss": -10.247167587280273, "global_step": 133575, "epoch": 795} {"train_loss": -9.978702545166016, "global_step": 133576, "epoch": 795} {"train_loss": -10.353774070739746, "global_step": 133577, "epoch": 795} {"train_loss": -10.29420280456543, "global_step": 133578, "epoch": 795} {"train_loss": -10.1642484664917, "global_step": 133579, "epoch": 795} {"train_loss": -10.24085807800293, "global_step": 133580, "epoch": 795} {"train_loss": -10.444292068481445, "global_step": 133581, "epoch": 795} {"train_loss": -10.285194396972656, "global_step": 133582, "epoch": 795} {"train_loss": -10.413105964660645, "global_step": 133583, "epoch": 795} {"train_loss": -10.36282730102539, "global_step": 133584, "epoch": 795} {"train_loss": -10.48383903503418, "global_step": 133585, "epoch": 795} {"train_loss": -10.337730407714844, "global_step": 133586, "epoch": 795} {"train_loss": -10.237489700317383, "global_step": 133587, "epoch": 795} {"train_loss": -10.633646011352539, "global_step": 133588, "epoch": 795} {"train_loss": -10.283288955688477, "global_step": 133589, "epoch": 795} {"train_loss": -10.414650917053223, "global_step": 133590, "epoch": 795} {"train_loss": -10.347269058227539, "global_step": 133591, "epoch": 795} {"train_loss": -10.402420043945312, "global_step": 133592, "epoch": 795} {"train_loss": -10.502281188964844, "global_step": 133593, "epoch": 795} {"train_loss": -10.720964431762695, "global_step": 133594, "epoch": 795} {"train_loss": -10.648012161254883, "global_step": 133595, "epoch": 795} {"train_loss": -10.415369033813477, "global_step": 133596, "epoch": 795} {"train_loss": -10.537485122680664, "global_step": 133597, "epoch": 795} {"train_loss": -10.5829496383667, "global_step": 133598, "epoch": 795} {"train_loss": -10.615490913391113, "global_step": 133599, "epoch": 795} {"train_loss": -10.706199645996094, "global_step": 133600, "epoch": 795} {"train_loss": -10.399210929870605, "global_step": 133601, "epoch": 795} {"train_loss": -10.521953582763672, "global_step": 133602, "epoch": 795} {"train_loss": -10.533475875854492, "global_step": 133603, "epoch": 795} {"train_loss": -10.659502983093262, "global_step": 133604, "epoch": 795} {"train_loss": -10.67769718170166, "global_step": 133605, "epoch": 795} {"train_loss": -10.37596321105957, "global_step": 133606, "epoch": 795} {"train_loss": -10.75123119354248, "global_step": 133607, "epoch": 795} {"train_loss": -10.662372589111328, "global_step": 133608, "epoch": 795} {"train_loss": -10.896230697631836, "global_step": 133609, "epoch": 795} {"train_loss": -10.704804420471191, "global_step": 133610, "epoch": 795} {"train_loss": -10.875683784484863, "global_step": 133611, "epoch": 795} {"train_loss": -10.823406219482422, "global_step": 133612, "epoch": 795} {"train_loss": -10.75970458984375, "global_step": 133613, "epoch": 795} {"train_loss": -10.575191497802734, "global_step": 133614, "epoch": 795} {"train_loss": -10.99986457824707, "global_step": 133615, "epoch": 795} {"train_loss": -10.686949729919434, "global_step": 133616, "epoch": 795} {"train_loss": -10.83239459991455, "global_step": 133617, "epoch": 795} {"train_loss": -10.910923957824707, "global_step": 133618, "epoch": 795} {"train_loss": -10.543866157531738, "global_step": 133619, "epoch": 795} {"train_loss": -10.789230346679688, "global_step": 133620, "epoch": 795} {"train_loss": -10.399833679199219, "global_step": 133621, "epoch": 795} {"train_loss": -10.444594383239746, "global_step": 133622, "epoch": 795} {"train_loss": -10.39423942565918, "global_step": 133623, "epoch": 795} {"train_loss": -10.623705863952637, "global_step": 133624, "epoch": 795} {"train_loss": -9.927223205566406, "global_step": 133625, "epoch": 795} {"train_loss": -10.76165771484375, "global_step": 133626, "epoch": 795} {"train_loss": -10.28714656829834, "global_step": 133627, "epoch": 795} {"train_loss": -10.006903648376465, "global_step": 133628, "epoch": 795} {"train_loss": -10.573704719543457, "global_step": 133629, "epoch": 795} {"train_loss": -10.545985221862793, "global_step": 133630, "epoch": 795} {"train_loss": -10.48562240600586, "global_step": 133631, "epoch": 795} {"train_loss": -10.697298049926758, "global_step": 133632, "epoch": 795} {"train_loss": -10.21527099609375, "global_step": 133633, "epoch": 795} {"train_loss": -10.190377235412598, "global_step": 133634, "epoch": 795} {"train_loss": -10.459251403808594, "global_step": 133635, "epoch": 795} {"train_loss": -10.535280227661133, "global_step": 133636, "epoch": 795} {"train_loss": -10.117776870727539, "global_step": 133637, "epoch": 795} {"train_loss": -10.368916511535645, "global_step": 133638, "epoch": 795} {"train_loss": -10.543795585632324, "global_step": 133639, "epoch": 795} {"train_loss": -10.033662796020508, "global_step": 133640, "epoch": 795} {"train_loss": -10.240859985351562, "global_step": 133641, "epoch": 795} {"train_loss": -10.266425132751465, "global_step": 133642, "epoch": 795} {"train_loss": -10.09779167175293, "global_step": 133643, "epoch": 795} {"train_loss": -10.318327903747559, "global_step": 133644, "epoch": 795} {"train_loss": -10.196678161621094, "global_step": 133645, "epoch": 795} {"train_loss": -10.417402267456055, "global_step": 133646, "epoch": 795} {"train_loss": -9.81808090209961, "global_step": 133647, "epoch": 795} {"train_loss": -10.243429183959961, "global_step": 133648, "epoch": 795} {"train_loss": -9.903417587280273, "global_step": 133649, "epoch": 795} {"train_loss": -10.187714576721191, "global_step": 133650, "epoch": 795} {"train_loss": -10.439781188964844, "global_step": 133651, "epoch": 795} {"train_loss": -9.981661796569824, "global_step": 133652, "epoch": 795} {"train_loss": -10.449953079223633, "global_step": 133653, "epoch": 795} {"train_loss": -9.989814758300781, "global_step": 133654, "epoch": 795} {"train_loss": -10.251616477966309, "global_step": 133655, "epoch": 795} {"train_loss": -10.078874588012695, "global_step": 133656, "epoch": 795} {"train_loss": -9.722658157348633, "global_step": 133657, "epoch": 795} {"train_loss": -9.85450553894043, "global_step": 133658, "epoch": 795} {"train_loss": -9.692527770996094, "global_step": 133659, "epoch": 795} {"train_loss": -10.339037895202637, "global_step": 133660, "epoch": 795} {"train_loss": -10.040059089660645, "global_step": 133661, "epoch": 795} {"train_loss": -9.648933410644531, "global_step": 133662, "epoch": 795} {"train_loss": -9.649433135986328, "global_step": 133663, "epoch": 795} {"train_loss": -9.743287086486816, "global_step": 133664, "epoch": 795} {"train_loss": -9.596658706665039, "global_step": 133665, "epoch": 795} {"train_loss": -9.360589981079102, "global_step": 133666, "epoch": 795} {"train_loss": -9.598443984985352, "global_step": 133667, "epoch": 795} {"train_loss": -9.797565460205078, "global_step": 133668, "epoch": 795} {"train_loss": -10.272335052490234, "global_step": 133669, "epoch": 795} {"train_loss": -9.96650505065918, "global_step": 133670, "epoch": 795} {"train_loss": -10.00328254699707, "global_step": 133671, "epoch": 795} {"train_loss": -10.131402969360352, "global_step": 133672, "epoch": 795} {"train_loss": -9.939449310302734, "global_step": 133673, "epoch": 795} {"train_loss": -10.124324798583984, "global_step": 133674, "epoch": 795} {"train_loss": -10.096595764160156, "global_step": 133675, "epoch": 795} {"train_loss": -10.049105644226074, "global_step": 133676, "epoch": 795} {"train_loss": -10.089851379394531, "global_step": 133677, "epoch": 795} {"train_loss": -10.234294891357422, "global_step": 133678, "epoch": 795} {"train_loss": -10.227215766906738, "global_step": 133679, "epoch": 795} {"train_loss": -10.266489028930664, "global_step": 133680, "epoch": 795} {"train_loss": -10.360603332519531, "global_step": 133681, "epoch": 795} {"train_loss": -10.14493179321289, "global_step": 133682, "epoch": 795} {"train_loss": -10.111852645874023, "global_step": 133683, "epoch": 795} {"train_loss": -10.0686616897583, "global_step": 133684, "epoch": 795} {"train_loss": -10.057114601135254, "global_step": 133685, "epoch": 795} {"train_loss": -10.186367988586426, "global_step": 133686, "epoch": 795} {"train_loss": -10.3709716796875, "global_step": 133687, "epoch": 795} {"train_loss": -9.839757919311523, "global_step": 133688, "epoch": 795} {"train_loss": -10.33612060546875, "global_step": 133689, "epoch": 795} {"train_loss": -10.188232421875, "global_step": 133690, "epoch": 795} {"train_loss": -10.317049026489258, "global_step": 133691, "epoch": 795} {"train_loss": -10.342622756958008, "global_step": 133692, "epoch": 795} {"train_loss": -10.222068786621094, "global_step": 133693, "epoch": 795} {"train_loss": -10.2994384765625, "global_step": 133694, "epoch": 795} {"train_loss": -10.55445671081543, "global_step": 133695, "epoch": 795} {"train_loss": -10.379322052001953, "global_step": 133696, "epoch": 795} {"train_loss": -10.478684425354004, "global_step": 133697, "epoch": 795} {"train_loss": -10.067220687866211, "global_step": 133698, "epoch": 795} {"train_loss": -10.559638977050781, "global_step": 133699, "epoch": 795} {"train_loss": -10.12000560760498, "global_step": 133700, "epoch": 795} {"train_loss": -10.607149124145508, "global_step": 133701, "epoch": 795} {"train_loss": -10.641702651977539, "global_step": 133702, "epoch": 795} {"train_loss": -10.601335525512695, "global_step": 133703, "epoch": 795} {"train_loss": -10.202351570129395, "global_step": 133704, "epoch": 795} {"train_loss": -10.53812026977539, "global_step": 133705, "epoch": 795} {"train_loss": -10.270444869995117, "global_step": 133706, "epoch": 795} {"train_loss": -10.499340057373047, "global_step": 133707, "epoch": 795} {"train_loss": -10.563910484313965, "global_step": 133708, "epoch": 795} {"train_loss": -10.240782737731934, "global_step": 133709, "epoch": 795} {"train_loss": -10.45366096496582, "global_step": 133710, "epoch": 795} {"train_loss": -10.477409362792969, "global_step": 133711, "epoch": 795} {"train_loss": -10.540541648864746, "global_step": 133712, "epoch": 795} {"train_loss": -10.601261138916016, "global_step": 133713, "epoch": 795} {"train_loss": -10.703226089477539, "global_step": 133714, "epoch": 795} {"train_loss": -10.340723037719727, "global_step": 133715, "epoch": 795} {"train_loss": -10.592336654663086, "global_step": 133716, "epoch": 795} {"train_loss": -10.58492374420166, "global_step": 133717, "epoch": 795} {"train_loss": -10.628026008605957, "global_step": 133718, "epoch": 795} {"train_loss": -10.174044609069824, "global_step": 133719, "epoch": 795} {"train_loss": -10.233443260192871, "global_step": 133720, "epoch": 795} {"train_loss": -10.795492172241211, "global_step": 133721, "epoch": 795} {"train_loss": -10.457316398620605, "global_step": 133722, "epoch": 795} {"train_loss": -10.717405319213867, "global_step": 133723, "epoch": 795} {"train_loss": -10.490873336791992, "global_step": 133724, "epoch": 795} {"train_loss": -10.32391357421875, "global_step": 133725, "epoch": 795} {"train_loss": -10.315404891967773, "global_step": 133726, "epoch": 795} {"train_loss": -10.32462469736735, "global_step": 133727, "epoch": 795, "val_loss": 224594.46875, "train_action_mse_error": 0.6664002537727356} {"train_loss": -10.124261856079102, "global_step": 133728, "epoch": 796} {"train_loss": -10.287261009216309, "global_step": 133729, "epoch": 796} {"train_loss": -9.796454429626465, "global_step": 133730, "epoch": 796} {"train_loss": -10.543342590332031, "global_step": 133731, "epoch": 796} {"train_loss": -9.658031463623047, "global_step": 133732, "epoch": 796} {"train_loss": -9.767257690429688, "global_step": 133733, "epoch": 796} {"train_loss": -10.383581161499023, "global_step": 133734, "epoch": 796} {"train_loss": -9.868045806884766, "global_step": 133735, "epoch": 796} {"train_loss": -10.317753791809082, "global_step": 133736, "epoch": 796} {"train_loss": -10.329629898071289, "global_step": 133737, "epoch": 796} {"train_loss": -10.241293907165527, "global_step": 133738, "epoch": 796} {"train_loss": -10.058473587036133, "global_step": 133739, "epoch": 796} {"train_loss": -10.247880935668945, "global_step": 133740, "epoch": 796} {"train_loss": -10.658245086669922, "global_step": 133741, "epoch": 796} {"train_loss": -9.908151626586914, "global_step": 133742, "epoch": 796} {"train_loss": -10.528037071228027, "global_step": 133743, "epoch": 796} {"train_loss": -10.65294075012207, "global_step": 133744, "epoch": 796} {"train_loss": -10.283040046691895, "global_step": 133745, "epoch": 796} {"train_loss": -10.671745300292969, "global_step": 133746, "epoch": 796} {"train_loss": -10.130000114440918, "global_step": 133747, "epoch": 796} {"train_loss": -10.516435623168945, "global_step": 133748, "epoch": 796} {"train_loss": -10.372235298156738, "global_step": 133749, "epoch": 796} {"train_loss": -10.271785736083984, "global_step": 133750, "epoch": 796} {"train_loss": -10.553760528564453, "global_step": 133751, "epoch": 796} {"train_loss": -10.269732475280762, "global_step": 133752, "epoch": 796} {"train_loss": -10.637099266052246, "global_step": 133753, "epoch": 796} {"train_loss": -10.52752685546875, "global_step": 133754, "epoch": 796} {"train_loss": -10.308669090270996, "global_step": 133755, "epoch": 796} {"train_loss": -10.492555618286133, "global_step": 133756, "epoch": 796} {"train_loss": -10.415346145629883, "global_step": 133757, "epoch": 796} {"train_loss": -10.41749382019043, "global_step": 133758, "epoch": 796} {"train_loss": -10.499308586120605, "global_step": 133759, "epoch": 796} {"train_loss": -10.556346893310547, "global_step": 133760, "epoch": 796} {"train_loss": -10.821500778198242, "global_step": 133761, "epoch": 796} {"train_loss": -10.438594818115234, "global_step": 133762, "epoch": 796} {"train_loss": -10.37279987335205, "global_step": 133763, "epoch": 796} {"train_loss": -10.644822120666504, "global_step": 133764, "epoch": 796} {"train_loss": -10.543294906616211, "global_step": 133765, "epoch": 796} {"train_loss": -10.68790340423584, "global_step": 133766, "epoch": 796} {"train_loss": -10.629520416259766, "global_step": 133767, "epoch": 796} {"train_loss": -10.665987014770508, "global_step": 133768, "epoch": 796} {"train_loss": -10.275843620300293, "global_step": 133769, "epoch": 796} {"train_loss": -10.446417808532715, "global_step": 133770, "epoch": 796} {"train_loss": -10.463483810424805, "global_step": 133771, "epoch": 796} {"train_loss": -10.387760162353516, "global_step": 133772, "epoch": 796} {"train_loss": -10.478254318237305, "global_step": 133773, "epoch": 796} {"train_loss": -10.525994300842285, "global_step": 133774, "epoch": 796} {"train_loss": -10.159570693969727, "global_step": 133775, "epoch": 796} {"train_loss": -10.063179016113281, "global_step": 133776, "epoch": 796} {"train_loss": -10.312920570373535, "global_step": 133777, "epoch": 796} {"train_loss": -10.461885452270508, "global_step": 133778, "epoch": 796} {"train_loss": -9.88540267944336, "global_step": 133779, "epoch": 796} {"train_loss": -10.525432586669922, "global_step": 133780, "epoch": 796} {"train_loss": -10.465150833129883, "global_step": 133781, "epoch": 796} {"train_loss": -9.413949012756348, "global_step": 133782, "epoch": 796} {"train_loss": -10.381331443786621, "global_step": 133783, "epoch": 796} {"train_loss": -10.2335205078125, "global_step": 133784, "epoch": 796} {"train_loss": -9.845192909240723, "global_step": 133785, "epoch": 796} {"train_loss": -10.397150039672852, "global_step": 133786, "epoch": 796} {"train_loss": -9.537886619567871, "global_step": 133787, "epoch": 796} {"train_loss": -10.406054496765137, "global_step": 133788, "epoch": 796} {"train_loss": -9.73375415802002, "global_step": 133789, "epoch": 796} {"train_loss": -10.705326080322266, "global_step": 133790, "epoch": 796} {"train_loss": -9.735897064208984, "global_step": 133791, "epoch": 796} {"train_loss": -10.668170928955078, "global_step": 133792, "epoch": 796} {"train_loss": -10.020135879516602, "global_step": 133793, "epoch": 796} {"train_loss": -10.121662139892578, "global_step": 133794, "epoch": 796} {"train_loss": -10.266128540039062, "global_step": 133795, "epoch": 796} {"train_loss": -10.374320983886719, "global_step": 133796, "epoch": 796} {"train_loss": -10.624100685119629, "global_step": 133797, "epoch": 796} {"train_loss": -10.215558052062988, "global_step": 133798, "epoch": 796} {"train_loss": -10.175934791564941, "global_step": 133799, "epoch": 796} {"train_loss": -10.02576732635498, "global_step": 133800, "epoch": 796} {"train_loss": -10.333785057067871, "global_step": 133801, "epoch": 796} {"train_loss": -10.549489974975586, "global_step": 133802, "epoch": 796} {"train_loss": -10.07909107208252, "global_step": 133803, "epoch": 796} {"train_loss": -10.353158950805664, "global_step": 133804, "epoch": 796} {"train_loss": -9.989886283874512, "global_step": 133805, "epoch": 796} {"train_loss": -10.26461124420166, "global_step": 133806, "epoch": 796} {"train_loss": -10.043747901916504, "global_step": 133807, "epoch": 796} {"train_loss": -10.26732063293457, "global_step": 133808, "epoch": 796} {"train_loss": -10.381553649902344, "global_step": 133809, "epoch": 796} {"train_loss": -10.411935806274414, "global_step": 133810, "epoch": 796} {"train_loss": -10.540199279785156, "global_step": 133811, "epoch": 796} {"train_loss": -10.327192306518555, "global_step": 133812, "epoch": 796} {"train_loss": -10.52037239074707, "global_step": 133813, "epoch": 796} {"train_loss": -10.354350090026855, "global_step": 133814, "epoch": 796} {"train_loss": -10.549148559570312, "global_step": 133815, "epoch": 796} {"train_loss": -10.371238708496094, "global_step": 133816, "epoch": 796} {"train_loss": -10.444482803344727, "global_step": 133817, "epoch": 796} {"train_loss": -10.427922248840332, "global_step": 133818, "epoch": 796} {"train_loss": -10.445516586303711, "global_step": 133819, "epoch": 796} {"train_loss": -10.260943412780762, "global_step": 133820, "epoch": 796} {"train_loss": -10.679169654846191, "global_step": 133821, "epoch": 796} {"train_loss": -10.179699897766113, "global_step": 133822, "epoch": 796} {"train_loss": -10.5482816696167, "global_step": 133823, "epoch": 796} {"train_loss": -10.281543731689453, "global_step": 133824, "epoch": 796} {"train_loss": -10.459397315979004, "global_step": 133825, "epoch": 796} {"train_loss": -10.442888259887695, "global_step": 133826, "epoch": 796} {"train_loss": -10.316633224487305, "global_step": 133827, "epoch": 796} {"train_loss": -10.51103401184082, "global_step": 133828, "epoch": 796} {"train_loss": -10.198392868041992, "global_step": 133829, "epoch": 796} {"train_loss": -10.570150375366211, "global_step": 133830, "epoch": 796} {"train_loss": -10.232929229736328, "global_step": 133831, "epoch": 796} {"train_loss": -10.636486053466797, "global_step": 133832, "epoch": 796} {"train_loss": -10.255501747131348, "global_step": 133833, "epoch": 796} {"train_loss": -10.347126960754395, "global_step": 133834, "epoch": 796} {"train_loss": -10.42497444152832, "global_step": 133835, "epoch": 796} {"train_loss": -10.099283218383789, "global_step": 133836, "epoch": 796} {"train_loss": -10.495174407958984, "global_step": 133837, "epoch": 796} {"train_loss": -10.560335159301758, "global_step": 133838, "epoch": 796} {"train_loss": -10.36515998840332, "global_step": 133839, "epoch": 796} {"train_loss": -10.393775939941406, "global_step": 133840, "epoch": 796} {"train_loss": -10.097722053527832, "global_step": 133841, "epoch": 796} {"train_loss": -10.501338005065918, "global_step": 133842, "epoch": 796} {"train_loss": -10.043807983398438, "global_step": 133843, "epoch": 796} {"train_loss": -10.403050422668457, "global_step": 133844, "epoch": 796} {"train_loss": -10.325434684753418, "global_step": 133845, "epoch": 796} {"train_loss": -10.733022689819336, "global_step": 133846, "epoch": 796} {"train_loss": -10.115959167480469, "global_step": 133847, "epoch": 796} {"train_loss": -10.625890731811523, "global_step": 133848, "epoch": 796} {"train_loss": -10.29421615600586, "global_step": 133849, "epoch": 796} {"train_loss": -10.671066284179688, "global_step": 133850, "epoch": 796} {"train_loss": -10.502666473388672, "global_step": 133851, "epoch": 796} {"train_loss": -10.406845092773438, "global_step": 133852, "epoch": 796} {"train_loss": -10.493796348571777, "global_step": 133853, "epoch": 796} {"train_loss": -10.50213623046875, "global_step": 133854, "epoch": 796} {"train_loss": -10.35624885559082, "global_step": 133855, "epoch": 796} {"train_loss": -10.400593757629395, "global_step": 133856, "epoch": 796} {"train_loss": -10.652990341186523, "global_step": 133857, "epoch": 796} {"train_loss": -10.628087043762207, "global_step": 133858, "epoch": 796} {"train_loss": -10.6934814453125, "global_step": 133859, "epoch": 796} {"train_loss": -10.52424430847168, "global_step": 133860, "epoch": 796} {"train_loss": -10.522117614746094, "global_step": 133861, "epoch": 796} {"train_loss": -10.288432121276855, "global_step": 133862, "epoch": 796} {"train_loss": -10.413497924804688, "global_step": 133863, "epoch": 796} {"train_loss": -10.135372161865234, "global_step": 133864, "epoch": 796} {"train_loss": -10.402143478393555, "global_step": 133865, "epoch": 796} {"train_loss": -10.053321838378906, "global_step": 133866, "epoch": 796} {"train_loss": -9.968232154846191, "global_step": 133867, "epoch": 796} {"train_loss": -10.598974227905273, "global_step": 133868, "epoch": 796} {"train_loss": -9.8366060256958, "global_step": 133869, "epoch": 796} {"train_loss": -10.600475311279297, "global_step": 133870, "epoch": 796} {"train_loss": -10.14413070678711, "global_step": 133871, "epoch": 796} {"train_loss": -10.044719696044922, "global_step": 133872, "epoch": 796} {"train_loss": -10.135400772094727, "global_step": 133873, "epoch": 796} {"train_loss": -10.406583786010742, "global_step": 133874, "epoch": 796} {"train_loss": -10.10751724243164, "global_step": 133875, "epoch": 796} {"train_loss": -10.048660278320312, "global_step": 133876, "epoch": 796} {"train_loss": -9.61768627166748, "global_step": 133877, "epoch": 796} {"train_loss": -9.822553634643555, "global_step": 133878, "epoch": 796} {"train_loss": -9.941936492919922, "global_step": 133879, "epoch": 796} {"train_loss": -10.26770305633545, "global_step": 133880, "epoch": 796} {"train_loss": -10.161352157592773, "global_step": 133881, "epoch": 796} {"train_loss": -9.906770706176758, "global_step": 133882, "epoch": 796} {"train_loss": -10.027497291564941, "global_step": 133883, "epoch": 796} {"train_loss": -10.106517791748047, "global_step": 133884, "epoch": 796} {"train_loss": -9.802520751953125, "global_step": 133885, "epoch": 796} {"train_loss": -10.266624450683594, "global_step": 133886, "epoch": 796} {"train_loss": -10.282240867614746, "global_step": 133887, "epoch": 796} {"train_loss": -10.049983978271484, "global_step": 133888, "epoch": 796} {"train_loss": -10.551545143127441, "global_step": 133889, "epoch": 796} {"train_loss": -10.257116317749023, "global_step": 133890, "epoch": 796} {"train_loss": -10.399681091308594, "global_step": 133891, "epoch": 796} {"train_loss": -10.234281539916992, "global_step": 133892, "epoch": 796} {"train_loss": -10.441465377807617, "global_step": 133893, "epoch": 796} {"train_loss": -10.328874588012695, "global_step": 133894, "epoch": 796} {"train_loss": -10.315448352268763, "global_step": 133895, "epoch": 796, "val_loss": 225185.21875} {"train_loss": -10.204442977905273, "global_step": 133896, "epoch": 797} {"train_loss": -10.721660614013672, "global_step": 133897, "epoch": 797} {"train_loss": -10.768404006958008, "global_step": 133898, "epoch": 797} {"train_loss": -10.324283599853516, "global_step": 133899, "epoch": 797} {"train_loss": -10.666817665100098, "global_step": 133900, "epoch": 797} {"train_loss": -10.51160717010498, "global_step": 133901, "epoch": 797} {"train_loss": -10.310014724731445, "global_step": 133902, "epoch": 797} {"train_loss": -10.845768928527832, "global_step": 133903, "epoch": 797} {"train_loss": -10.454360961914062, "global_step": 133904, "epoch": 797} {"train_loss": -10.609195709228516, "global_step": 133905, "epoch": 797} {"train_loss": -10.51016902923584, "global_step": 133906, "epoch": 797} {"train_loss": -10.524139404296875, "global_step": 133907, "epoch": 797} {"train_loss": -10.750118255615234, "global_step": 133908, "epoch": 797} {"train_loss": -10.570115089416504, "global_step": 133909, "epoch": 797} {"train_loss": -10.576087951660156, "global_step": 133910, "epoch": 797} {"train_loss": -10.93768310546875, "global_step": 133911, "epoch": 797} {"train_loss": -10.259580612182617, "global_step": 133912, "epoch": 797} {"train_loss": -10.600253105163574, "global_step": 133913, "epoch": 797} {"train_loss": -10.57136058807373, "global_step": 133914, "epoch": 797} {"train_loss": -9.946141242980957, "global_step": 133915, "epoch": 797} {"train_loss": -10.38851547241211, "global_step": 133916, "epoch": 797} {"train_loss": -10.727912902832031, "global_step": 133917, "epoch": 797} {"train_loss": -10.214581489562988, "global_step": 133918, "epoch": 797} {"train_loss": -10.747184753417969, "global_step": 133919, "epoch": 797} {"train_loss": -10.462132453918457, "global_step": 133920, "epoch": 797} {"train_loss": -9.93844985961914, "global_step": 133921, "epoch": 797} {"train_loss": -10.508224487304688, "global_step": 133922, "epoch": 797} {"train_loss": -10.026922225952148, "global_step": 133923, "epoch": 797} {"train_loss": -9.785004615783691, "global_step": 133924, "epoch": 797} {"train_loss": -10.515478134155273, "global_step": 133925, "epoch": 797} {"train_loss": -10.15728759765625, "global_step": 133926, "epoch": 797} {"train_loss": -10.396295547485352, "global_step": 133927, "epoch": 797} {"train_loss": -10.373335838317871, "global_step": 133928, "epoch": 797} {"train_loss": -10.223073959350586, "global_step": 133929, "epoch": 797} {"train_loss": -10.192146301269531, "global_step": 133930, "epoch": 797} {"train_loss": -9.952329635620117, "global_step": 133931, "epoch": 797} {"train_loss": -10.01823616027832, "global_step": 133932, "epoch": 797} {"train_loss": -10.20964241027832, "global_step": 133933, "epoch": 797} {"train_loss": -9.78707504272461, "global_step": 133934, "epoch": 797} {"train_loss": -10.332540512084961, "global_step": 133935, "epoch": 797} {"train_loss": -10.119232177734375, "global_step": 133936, "epoch": 797} {"train_loss": -9.554706573486328, "global_step": 133937, "epoch": 797} {"train_loss": -10.173661231994629, "global_step": 133938, "epoch": 797} {"train_loss": -9.300146102905273, "global_step": 133939, "epoch": 797} {"train_loss": -10.509553909301758, "global_step": 133940, "epoch": 797} {"train_loss": -9.410321235656738, "global_step": 133941, "epoch": 797} {"train_loss": -9.816986083984375, "global_step": 133942, "epoch": 797} {"train_loss": -9.384227752685547, "global_step": 133943, "epoch": 797} {"train_loss": -10.021482467651367, "global_step": 133944, "epoch": 797} {"train_loss": -8.79321002960205, "global_step": 133945, "epoch": 797} {"train_loss": -10.335769653320312, "global_step": 133946, "epoch": 797} {"train_loss": -9.347615242004395, "global_step": 133947, "epoch": 797} {"train_loss": -9.8555908203125, "global_step": 133948, "epoch": 797} {"train_loss": -10.338815689086914, "global_step": 133949, "epoch": 797} {"train_loss": -9.421199798583984, "global_step": 133950, "epoch": 797} {"train_loss": -10.074893951416016, "global_step": 133951, "epoch": 797} {"train_loss": -9.65325927734375, "global_step": 133952, "epoch": 797} {"train_loss": -9.826736450195312, "global_step": 133953, "epoch": 797} {"train_loss": -9.942703247070312, "global_step": 133954, "epoch": 797} {"train_loss": -9.672405242919922, "global_step": 133955, "epoch": 797} {"train_loss": -10.119544982910156, "global_step": 133956, "epoch": 797} {"train_loss": -9.796881675720215, "global_step": 133957, "epoch": 797} {"train_loss": -10.368369102478027, "global_step": 133958, "epoch": 797} {"train_loss": -10.137321472167969, "global_step": 133959, "epoch": 797} {"train_loss": -10.229321479797363, "global_step": 133960, "epoch": 797} {"train_loss": -10.32118034362793, "global_step": 133961, "epoch": 797} {"train_loss": -10.21371078491211, "global_step": 133962, "epoch": 797} {"train_loss": -10.36670970916748, "global_step": 133963, "epoch": 797} {"train_loss": -10.026905059814453, "global_step": 133964, "epoch": 797} {"train_loss": -10.2308931350708, "global_step": 133965, "epoch": 797} {"train_loss": -10.191764831542969, "global_step": 133966, "epoch": 797} {"train_loss": -10.101329803466797, "global_step": 133967, "epoch": 797} {"train_loss": -10.35523796081543, "global_step": 133968, "epoch": 797} {"train_loss": -10.343391418457031, "global_step": 133969, "epoch": 797} {"train_loss": -10.269720077514648, "global_step": 133970, "epoch": 797} {"train_loss": -10.382919311523438, "global_step": 133971, "epoch": 797} {"train_loss": -10.263469696044922, "global_step": 133972, "epoch": 797} {"train_loss": -10.355670928955078, "global_step": 133973, "epoch": 797} {"train_loss": -10.531652450561523, "global_step": 133974, "epoch": 797} {"train_loss": -10.18783187866211, "global_step": 133975, "epoch": 797} {"train_loss": -10.513221740722656, "global_step": 133976, "epoch": 797} {"train_loss": -10.278223037719727, "global_step": 133977, "epoch": 797} {"train_loss": -10.583351135253906, "global_step": 133978, "epoch": 797} {"train_loss": -10.529611587524414, "global_step": 133979, "epoch": 797} {"train_loss": -10.293981552124023, "global_step": 133980, "epoch": 797} {"train_loss": -10.722116470336914, "global_step": 133981, "epoch": 797} {"train_loss": -10.368054389953613, "global_step": 133982, "epoch": 797} {"train_loss": -10.464366912841797, "global_step": 133983, "epoch": 797} {"train_loss": -10.55423355102539, "global_step": 133984, "epoch": 797} {"train_loss": -10.443845748901367, "global_step": 133985, "epoch": 797} {"train_loss": -10.729373931884766, "global_step": 133986, "epoch": 797} {"train_loss": -10.290567398071289, "global_step": 133987, "epoch": 797} {"train_loss": -10.55167007446289, "global_step": 133988, "epoch": 797} {"train_loss": -10.34305191040039, "global_step": 133989, "epoch": 797} {"train_loss": -10.691043853759766, "global_step": 133990, "epoch": 797} {"train_loss": -10.642078399658203, "global_step": 133991, "epoch": 797} {"train_loss": -10.431148529052734, "global_step": 133992, "epoch": 797} {"train_loss": -10.377787590026855, "global_step": 133993, "epoch": 797} {"train_loss": -10.347526550292969, "global_step": 133994, "epoch": 797} {"train_loss": -10.60317325592041, "global_step": 133995, "epoch": 797} {"train_loss": -10.646074295043945, "global_step": 133996, "epoch": 797} {"train_loss": -10.624006271362305, "global_step": 133997, "epoch": 797} {"train_loss": -10.607728958129883, "global_step": 133998, "epoch": 797} {"train_loss": -10.480325698852539, "global_step": 133999, "epoch": 797} {"train_loss": -10.510162353515625, "global_step": 134000, "epoch": 797} {"train_loss": -10.382400512695312, "global_step": 134001, "epoch": 797} {"train_loss": -10.422136306762695, "global_step": 134002, "epoch": 797} {"train_loss": -10.688224792480469, "global_step": 134003, "epoch": 797} {"train_loss": -10.614373207092285, "global_step": 134004, "epoch": 797} {"train_loss": -10.685527801513672, "global_step": 134005, "epoch": 797} {"train_loss": -10.499094009399414, "global_step": 134006, "epoch": 797} {"train_loss": -10.581576347351074, "global_step": 134007, "epoch": 797} {"train_loss": -10.374696731567383, "global_step": 134008, "epoch": 797} {"train_loss": -10.63169002532959, "global_step": 134009, "epoch": 797} {"train_loss": -10.478225708007812, "global_step": 134010, "epoch": 797} {"train_loss": -10.307361602783203, "global_step": 134011, "epoch": 797} {"train_loss": -10.583588600158691, "global_step": 134012, "epoch": 797} {"train_loss": -10.565593719482422, "global_step": 134013, "epoch": 797} {"train_loss": -10.589731216430664, "global_step": 134014, "epoch": 797} {"train_loss": -10.406187057495117, "global_step": 134015, "epoch": 797} {"train_loss": -10.280521392822266, "global_step": 134016, "epoch": 797} {"train_loss": -10.244503021240234, "global_step": 134017, "epoch": 797} {"train_loss": -9.690032005310059, "global_step": 134018, "epoch": 797} {"train_loss": -9.718557357788086, "global_step": 134019, "epoch": 797} {"train_loss": -9.233607292175293, "global_step": 134020, "epoch": 797} {"train_loss": -10.28304672241211, "global_step": 134021, "epoch": 797} {"train_loss": -9.925854682922363, "global_step": 134022, "epoch": 797} {"train_loss": -9.902423858642578, "global_step": 134023, "epoch": 797} {"train_loss": -9.979536056518555, "global_step": 134024, "epoch": 797} {"train_loss": -9.934103965759277, "global_step": 134025, "epoch": 797} {"train_loss": -9.779212951660156, "global_step": 134026, "epoch": 797} {"train_loss": -10.058704376220703, "global_step": 134027, "epoch": 797} {"train_loss": -9.93994426727295, "global_step": 134028, "epoch": 797} {"train_loss": -9.254154205322266, "global_step": 134029, "epoch": 797} {"train_loss": -10.13902473449707, "global_step": 134030, "epoch": 797} {"train_loss": -9.786579132080078, "global_step": 134031, "epoch": 797} {"train_loss": -10.111164093017578, "global_step": 134032, "epoch": 797} {"train_loss": -9.574827194213867, "global_step": 134033, "epoch": 797} {"train_loss": -9.617030143737793, "global_step": 134034, "epoch": 797} {"train_loss": -9.817185401916504, "global_step": 134035, "epoch": 797} {"train_loss": -9.786479949951172, "global_step": 134036, "epoch": 797} {"train_loss": -9.744678497314453, "global_step": 134037, "epoch": 797} {"train_loss": -10.083779335021973, "global_step": 134038, "epoch": 797} {"train_loss": -9.744338989257812, "global_step": 134039, "epoch": 797} {"train_loss": -10.235234260559082, "global_step": 134040, "epoch": 797} {"train_loss": -10.291060447692871, "global_step": 134041, "epoch": 797} {"train_loss": -10.125005722045898, "global_step": 134042, "epoch": 797} {"train_loss": -10.474472045898438, "global_step": 134043, "epoch": 797} {"train_loss": -10.175834655761719, "global_step": 134044, "epoch": 797} {"train_loss": -10.14167594909668, "global_step": 134045, "epoch": 797} {"train_loss": -10.1056547164917, "global_step": 134046, "epoch": 797} {"train_loss": -10.467161178588867, "global_step": 134047, "epoch": 797} {"train_loss": -10.233409881591797, "global_step": 134048, "epoch": 797} {"train_loss": -10.259103775024414, "global_step": 134049, "epoch": 797} {"train_loss": -10.406471252441406, "global_step": 134050, "epoch": 797} {"train_loss": -10.305099487304688, "global_step": 134051, "epoch": 797} {"train_loss": -10.30421257019043, "global_step": 134052, "epoch": 797} {"train_loss": -10.23287296295166, "global_step": 134053, "epoch": 797} {"train_loss": -10.444443702697754, "global_step": 134054, "epoch": 797} {"train_loss": -10.550640106201172, "global_step": 134055, "epoch": 797} {"train_loss": -10.623069763183594, "global_step": 134056, "epoch": 797} {"train_loss": -10.425195693969727, "global_step": 134057, "epoch": 797} {"train_loss": -10.526121139526367, "global_step": 134058, "epoch": 797} {"train_loss": -10.333717346191406, "global_step": 134059, "epoch": 797} {"train_loss": -10.563735961914062, "global_step": 134060, "epoch": 797} {"train_loss": -10.465709686279297, "global_step": 134061, "epoch": 797} {"train_loss": -10.599088668823242, "global_step": 134062, "epoch": 797} {"train_loss": -10.249410771188282, "global_step": 134063, "epoch": 797, "val_loss": 222872.328125} {"train_loss": -10.465333938598633, "global_step": 134064, "epoch": 798} {"train_loss": -10.811742782592773, "global_step": 134065, "epoch": 798} {"train_loss": -10.608182907104492, "global_step": 134066, "epoch": 798} {"train_loss": -10.520999908447266, "global_step": 134067, "epoch": 798} {"train_loss": -10.657949447631836, "global_step": 134068, "epoch": 798} {"train_loss": -10.752494812011719, "global_step": 134069, "epoch": 798} {"train_loss": -10.402286529541016, "global_step": 134070, "epoch": 798} {"train_loss": -10.593358993530273, "global_step": 134071, "epoch": 798} {"train_loss": -10.623682975769043, "global_step": 134072, "epoch": 798} {"train_loss": -10.576841354370117, "global_step": 134073, "epoch": 798} {"train_loss": -10.702766418457031, "global_step": 134074, "epoch": 798} {"train_loss": -10.572282791137695, "global_step": 134075, "epoch": 798} {"train_loss": -10.83544921875, "global_step": 134076, "epoch": 798} {"train_loss": -10.48556900024414, "global_step": 134077, "epoch": 798} {"train_loss": -10.760095596313477, "global_step": 134078, "epoch": 798} {"train_loss": -10.832240104675293, "global_step": 134079, "epoch": 798} {"train_loss": -10.20065689086914, "global_step": 134080, "epoch": 798} {"train_loss": -10.701776504516602, "global_step": 134081, "epoch": 798} {"train_loss": -10.667032241821289, "global_step": 134082, "epoch": 798} {"train_loss": -10.748381614685059, "global_step": 134083, "epoch": 798} {"train_loss": -10.845510482788086, "global_step": 134084, "epoch": 798} {"train_loss": -10.505500793457031, "global_step": 134085, "epoch": 798} {"train_loss": -10.42640209197998, "global_step": 134086, "epoch": 798} {"train_loss": -10.38075065612793, "global_step": 134087, "epoch": 798} {"train_loss": -10.386098861694336, "global_step": 134088, "epoch": 798} {"train_loss": -10.261216163635254, "global_step": 134089, "epoch": 798} {"train_loss": -10.750275611877441, "global_step": 134090, "epoch": 798} {"train_loss": -9.755193710327148, "global_step": 134091, "epoch": 798} {"train_loss": -10.701424598693848, "global_step": 134092, "epoch": 798} {"train_loss": -10.403902053833008, "global_step": 134093, "epoch": 798} {"train_loss": -10.693841934204102, "global_step": 134094, "epoch": 798} {"train_loss": -10.677441596984863, "global_step": 134095, "epoch": 798} {"train_loss": -9.852770805358887, "global_step": 134096, "epoch": 798} {"train_loss": -10.39376449584961, "global_step": 134097, "epoch": 798} {"train_loss": -10.257652282714844, "global_step": 134098, "epoch": 798} {"train_loss": -9.951955795288086, "global_step": 134099, "epoch": 798} {"train_loss": -10.621723175048828, "global_step": 134100, "epoch": 798} {"train_loss": -9.846187591552734, "global_step": 134101, "epoch": 798} {"train_loss": -10.327186584472656, "global_step": 134102, "epoch": 798} {"train_loss": -10.13929557800293, "global_step": 134103, "epoch": 798} {"train_loss": -10.361825942993164, "global_step": 134104, "epoch": 798} {"train_loss": -10.250717163085938, "global_step": 134105, "epoch": 798} {"train_loss": -10.161746978759766, "global_step": 134106, "epoch": 798} {"train_loss": -9.93509292602539, "global_step": 134107, "epoch": 798} {"train_loss": -10.29710865020752, "global_step": 134108, "epoch": 798} {"train_loss": -9.80569076538086, "global_step": 134109, "epoch": 798} {"train_loss": -10.412981033325195, "global_step": 134110, "epoch": 798} {"train_loss": -10.101058959960938, "global_step": 134111, "epoch": 798} {"train_loss": -10.282764434814453, "global_step": 134112, "epoch": 798} {"train_loss": -9.932126998901367, "global_step": 134113, "epoch": 798} {"train_loss": -10.151321411132812, "global_step": 134114, "epoch": 798} {"train_loss": -10.094450950622559, "global_step": 134115, "epoch": 798} {"train_loss": -10.13603687286377, "global_step": 134116, "epoch": 798} {"train_loss": -10.027653694152832, "global_step": 134117, "epoch": 798} {"train_loss": -10.248393058776855, "global_step": 134118, "epoch": 798} {"train_loss": -10.30756950378418, "global_step": 134119, "epoch": 798} {"train_loss": -10.164512634277344, "global_step": 134120, "epoch": 798} {"train_loss": -10.345823287963867, "global_step": 134121, "epoch": 798} {"train_loss": -10.122465133666992, "global_step": 134122, "epoch": 798} {"train_loss": -10.015825271606445, "global_step": 134123, "epoch": 798} {"train_loss": -10.39050579071045, "global_step": 134124, "epoch": 798} {"train_loss": -10.176362991333008, "global_step": 134125, "epoch": 798} {"train_loss": -10.136102676391602, "global_step": 134126, "epoch": 798} {"train_loss": -10.605752944946289, "global_step": 134127, "epoch": 798} {"train_loss": -10.332786560058594, "global_step": 134128, "epoch": 798} {"train_loss": -10.340387344360352, "global_step": 134129, "epoch": 798} {"train_loss": -10.499265670776367, "global_step": 134130, "epoch": 798} {"train_loss": -10.079329490661621, "global_step": 134131, "epoch": 798} {"train_loss": -10.24228572845459, "global_step": 134132, "epoch": 798} {"train_loss": -10.608694076538086, "global_step": 134133, "epoch": 798} {"train_loss": -10.493856430053711, "global_step": 134134, "epoch": 798} {"train_loss": -10.371206283569336, "global_step": 134135, "epoch": 798} {"train_loss": -10.522927284240723, "global_step": 134136, "epoch": 798} {"train_loss": -10.568611145019531, "global_step": 134137, "epoch": 798} {"train_loss": -10.437265396118164, "global_step": 134138, "epoch": 798} {"train_loss": -10.491239547729492, "global_step": 134139, "epoch": 798} {"train_loss": -10.382135391235352, "global_step": 134140, "epoch": 798} {"train_loss": -10.650749206542969, "global_step": 134141, "epoch": 798} {"train_loss": -10.53203010559082, "global_step": 134142, "epoch": 798} {"train_loss": -10.468018531799316, "global_step": 134143, "epoch": 798} {"train_loss": -10.64439582824707, "global_step": 134144, "epoch": 798} {"train_loss": -10.18560791015625, "global_step": 134145, "epoch": 798} {"train_loss": -10.798430442810059, "global_step": 134146, "epoch": 798} {"train_loss": -10.315725326538086, "global_step": 134147, "epoch": 798} {"train_loss": -10.412357330322266, "global_step": 134148, "epoch": 798} {"train_loss": -10.631391525268555, "global_step": 134149, "epoch": 798} {"train_loss": -10.626052856445312, "global_step": 134150, "epoch": 798} {"train_loss": -10.718196868896484, "global_step": 134151, "epoch": 798} {"train_loss": -10.600301742553711, "global_step": 134152, "epoch": 798} {"train_loss": -10.552775382995605, "global_step": 134153, "epoch": 798} {"train_loss": -10.627691268920898, "global_step": 134154, "epoch": 798} {"train_loss": -10.616846084594727, "global_step": 134155, "epoch": 798} {"train_loss": -10.653358459472656, "global_step": 134156, "epoch": 798} {"train_loss": -10.64673137664795, "global_step": 134157, "epoch": 798} {"train_loss": -10.838729858398438, "global_step": 134158, "epoch": 798} {"train_loss": -10.777896881103516, "global_step": 134159, "epoch": 798} {"train_loss": -10.894608497619629, "global_step": 134160, "epoch": 798} {"train_loss": -10.74040412902832, "global_step": 134161, "epoch": 798} {"train_loss": -10.797134399414062, "global_step": 134162, "epoch": 798} {"train_loss": -10.7598237991333, "global_step": 134163, "epoch": 798} {"train_loss": -10.800068855285645, "global_step": 134164, "epoch": 798} {"train_loss": -10.738252639770508, "global_step": 134165, "epoch": 798} {"train_loss": -10.714566230773926, "global_step": 134166, "epoch": 798} {"train_loss": -10.62370491027832, "global_step": 134167, "epoch": 798} {"train_loss": -10.433103561401367, "global_step": 134168, "epoch": 798} {"train_loss": -10.5101318359375, "global_step": 134169, "epoch": 798} {"train_loss": -10.430623054504395, "global_step": 134170, "epoch": 798} {"train_loss": -10.058168411254883, "global_step": 134171, "epoch": 798} {"train_loss": -9.611162185668945, "global_step": 134172, "epoch": 798} {"train_loss": -10.252725601196289, "global_step": 134173, "epoch": 798} {"train_loss": -9.554620742797852, "global_step": 134174, "epoch": 798} {"train_loss": -9.597644805908203, "global_step": 134175, "epoch": 798} {"train_loss": -10.405166625976562, "global_step": 134176, "epoch": 798} {"train_loss": -9.96773624420166, "global_step": 134177, "epoch": 798} {"train_loss": -10.293381690979004, "global_step": 134178, "epoch": 798} {"train_loss": -9.785026550292969, "global_step": 134179, "epoch": 798} {"train_loss": -10.260815620422363, "global_step": 134180, "epoch": 798} {"train_loss": -9.811538696289062, "global_step": 134181, "epoch": 798} {"train_loss": -10.159392356872559, "global_step": 134182, "epoch": 798} {"train_loss": -10.601516723632812, "global_step": 134183, "epoch": 798} {"train_loss": -10.36048412322998, "global_step": 134184, "epoch": 798} {"train_loss": -10.099380493164062, "global_step": 134185, "epoch": 798} {"train_loss": -9.673803329467773, "global_step": 134186, "epoch": 798} {"train_loss": -10.067007064819336, "global_step": 134187, "epoch": 798} {"train_loss": -9.681229591369629, "global_step": 134188, "epoch": 798} {"train_loss": -9.551239013671875, "global_step": 134189, "epoch": 798} {"train_loss": -9.26402759552002, "global_step": 134190, "epoch": 798} {"train_loss": -9.709264755249023, "global_step": 134191, "epoch": 798} {"train_loss": -9.380697250366211, "global_step": 134192, "epoch": 798} {"train_loss": -10.174674034118652, "global_step": 134193, "epoch": 798} {"train_loss": -9.876969337463379, "global_step": 134194, "epoch": 798} {"train_loss": -10.20120906829834, "global_step": 134195, "epoch": 798} {"train_loss": -9.909587860107422, "global_step": 134196, "epoch": 798} {"train_loss": -10.410056114196777, "global_step": 134197, "epoch": 798} {"train_loss": -10.03978157043457, "global_step": 134198, "epoch": 798} {"train_loss": -10.010498046875, "global_step": 134199, "epoch": 798} {"train_loss": -10.368473052978516, "global_step": 134200, "epoch": 798} {"train_loss": -10.062150955200195, "global_step": 134201, "epoch": 798} {"train_loss": -10.20810604095459, "global_step": 134202, "epoch": 798} {"train_loss": -10.059499740600586, "global_step": 134203, "epoch": 798} {"train_loss": -9.984298706054688, "global_step": 134204, "epoch": 798} {"train_loss": -10.378661155700684, "global_step": 134205, "epoch": 798} {"train_loss": -10.227519989013672, "global_step": 134206, "epoch": 798} {"train_loss": -10.281961441040039, "global_step": 134207, "epoch": 798} {"train_loss": -10.285797119140625, "global_step": 134208, "epoch": 798} {"train_loss": -10.297231674194336, "global_step": 134209, "epoch": 798} {"train_loss": -10.29255199432373, "global_step": 134210, "epoch": 798} {"train_loss": -10.271838188171387, "global_step": 134211, "epoch": 798} {"train_loss": -10.170269012451172, "global_step": 134212, "epoch": 798} {"train_loss": -10.199440002441406, "global_step": 134213, "epoch": 798} {"train_loss": -10.479707717895508, "global_step": 134214, "epoch": 798} {"train_loss": -10.499211311340332, "global_step": 134215, "epoch": 798} {"train_loss": -10.443180084228516, "global_step": 134216, "epoch": 798} {"train_loss": -10.740062713623047, "global_step": 134217, "epoch": 798} {"train_loss": -10.52983283996582, "global_step": 134218, "epoch": 798} {"train_loss": -10.476058959960938, "global_step": 134219, "epoch": 798} {"train_loss": -10.558107376098633, "global_step": 134220, "epoch": 798} {"train_loss": -10.457171440124512, "global_step": 134221, "epoch": 798} {"train_loss": -10.575340270996094, "global_step": 134222, "epoch": 798} {"train_loss": -10.700091361999512, "global_step": 134223, "epoch": 798} {"train_loss": -10.560562133789062, "global_step": 134224, "epoch": 798} {"train_loss": -10.550691604614258, "global_step": 134225, "epoch": 798} {"train_loss": -10.434101104736328, "global_step": 134226, "epoch": 798} {"train_loss": -10.605754852294922, "global_step": 134227, "epoch": 798} {"train_loss": -10.366857528686523, "global_step": 134228, "epoch": 798} {"train_loss": -10.766390800476074, "global_step": 134229, "epoch": 798} {"train_loss": -10.662120819091797, "global_step": 134230, "epoch": 798} {"train_loss": -10.357626574380058, "global_step": 134231, "epoch": 798, "val_loss": 222549.609375} {"train_loss": -10.635623931884766, "global_step": 134232, "epoch": 799} {"train_loss": -10.575242042541504, "global_step": 134233, "epoch": 799} {"train_loss": -10.81240177154541, "global_step": 134234, "epoch": 799} {"train_loss": -10.585830688476562, "global_step": 134235, "epoch": 799} {"train_loss": -10.341354370117188, "global_step": 134236, "epoch": 799} {"train_loss": -10.689538955688477, "global_step": 134237, "epoch": 799} {"train_loss": -10.815546989440918, "global_step": 134238, "epoch": 799} {"train_loss": -10.222389221191406, "global_step": 134239, "epoch": 799} {"train_loss": -10.443023681640625, "global_step": 134240, "epoch": 799} {"train_loss": -10.544174194335938, "global_step": 134241, "epoch": 799} {"train_loss": -10.541461944580078, "global_step": 134242, "epoch": 799} {"train_loss": -10.284003257751465, "global_step": 134243, "epoch": 799} {"train_loss": -9.455780029296875, "global_step": 134244, "epoch": 799} {"train_loss": -10.08955192565918, "global_step": 134245, "epoch": 799} {"train_loss": -9.839000701904297, "global_step": 134246, "epoch": 799} {"train_loss": -9.703605651855469, "global_step": 134247, "epoch": 799} {"train_loss": -9.996931076049805, "global_step": 134248, "epoch": 799} {"train_loss": -9.723709106445312, "global_step": 134249, "epoch": 799} {"train_loss": -9.81266975402832, "global_step": 134250, "epoch": 799} {"train_loss": -10.433510780334473, "global_step": 134251, "epoch": 799} {"train_loss": -9.787576675415039, "global_step": 134252, "epoch": 799} {"train_loss": -10.347740173339844, "global_step": 134253, "epoch": 799} {"train_loss": -9.500467300415039, "global_step": 134254, "epoch": 799} {"train_loss": -9.84288215637207, "global_step": 134255, "epoch": 799} {"train_loss": -9.459831237792969, "global_step": 134256, "epoch": 799} {"train_loss": -9.417482376098633, "global_step": 134257, "epoch": 799} {"train_loss": -9.984335899353027, "global_step": 134258, "epoch": 799} {"train_loss": -9.835902214050293, "global_step": 134259, "epoch": 799} {"train_loss": -9.973747253417969, "global_step": 134260, "epoch": 799} {"train_loss": -10.006080627441406, "global_step": 134261, "epoch": 799} {"train_loss": -9.866495132446289, "global_step": 134262, "epoch": 799} {"train_loss": -10.045387268066406, "global_step": 134263, "epoch": 799} {"train_loss": -10.211501121520996, "global_step": 134264, "epoch": 799} {"train_loss": -9.507574081420898, "global_step": 134265, "epoch": 799} {"train_loss": -10.419353485107422, "global_step": 134266, "epoch": 799} {"train_loss": -9.990274429321289, "global_step": 134267, "epoch": 799} {"train_loss": -10.144058227539062, "global_step": 134268, "epoch": 799} {"train_loss": -10.114582061767578, "global_step": 134269, "epoch": 799} {"train_loss": -10.284488677978516, "global_step": 134270, "epoch": 799} {"train_loss": -10.139378547668457, "global_step": 134271, "epoch": 799} {"train_loss": -10.283429145812988, "global_step": 134272, "epoch": 799} {"train_loss": -10.203733444213867, "global_step": 134273, "epoch": 799} {"train_loss": -9.987039566040039, "global_step": 134274, "epoch": 799} {"train_loss": -10.350125312805176, "global_step": 134275, "epoch": 799} {"train_loss": -10.311101913452148, "global_step": 134276, "epoch": 799} {"train_loss": -10.43077278137207, "global_step": 134277, "epoch": 799} {"train_loss": -10.386566162109375, "global_step": 134278, "epoch": 799} {"train_loss": -10.423650741577148, "global_step": 134279, "epoch": 799} {"train_loss": -10.363062858581543, "global_step": 134280, "epoch": 799} {"train_loss": -10.432080268859863, "global_step": 134281, "epoch": 799} {"train_loss": -10.570075035095215, "global_step": 134282, "epoch": 799} {"train_loss": -10.622827529907227, "global_step": 134283, "epoch": 799} {"train_loss": -10.678434371948242, "global_step": 134284, "epoch": 799} {"train_loss": -10.410457611083984, "global_step": 134285, "epoch": 799} {"train_loss": -10.473328590393066, "global_step": 134286, "epoch": 799} {"train_loss": -10.539312362670898, "global_step": 134287, "epoch": 799} {"train_loss": -10.559517860412598, "global_step": 134288, "epoch": 799} {"train_loss": -10.590365409851074, "global_step": 134289, "epoch": 799} {"train_loss": -10.822521209716797, "global_step": 134290, "epoch": 799} {"train_loss": -10.444448471069336, "global_step": 134291, "epoch": 799} {"train_loss": -10.571680068969727, "global_step": 134292, "epoch": 799} {"train_loss": -10.677328109741211, "global_step": 134293, "epoch": 799} {"train_loss": -10.657346725463867, "global_step": 134294, "epoch": 799} {"train_loss": -10.802260398864746, "global_step": 134295, "epoch": 799} {"train_loss": -10.495959281921387, "global_step": 134296, "epoch": 799} {"train_loss": -10.647320747375488, "global_step": 134297, "epoch": 799} {"train_loss": -10.532417297363281, "global_step": 134298, "epoch": 799} {"train_loss": -10.611305236816406, "global_step": 134299, "epoch": 799} {"train_loss": -10.782508850097656, "global_step": 134300, "epoch": 799} {"train_loss": -10.616676330566406, "global_step": 134301, "epoch": 799} {"train_loss": -10.78659439086914, "global_step": 134302, "epoch": 799} {"train_loss": -10.983039855957031, "global_step": 134303, "epoch": 799} {"train_loss": -10.937284469604492, "global_step": 134304, "epoch": 799} {"train_loss": -10.598281860351562, "global_step": 134305, "epoch": 799} {"train_loss": -10.97384262084961, "global_step": 134306, "epoch": 799} {"train_loss": -10.728719711303711, "global_step": 134307, "epoch": 799} {"train_loss": -10.407817840576172, "global_step": 134308, "epoch": 799} {"train_loss": -10.587648391723633, "global_step": 134309, "epoch": 799} {"train_loss": -10.641582489013672, "global_step": 134310, "epoch": 799} {"train_loss": -10.684316635131836, "global_step": 134311, "epoch": 799} {"train_loss": -10.1580810546875, "global_step": 134312, "epoch": 799} {"train_loss": -10.60995101928711, "global_step": 134313, "epoch": 799} {"train_loss": -10.257247924804688, "global_step": 134314, "epoch": 799} {"train_loss": -10.532285690307617, "global_step": 134315, "epoch": 799} {"train_loss": -10.649253845214844, "global_step": 134316, "epoch": 799} {"train_loss": -10.287546157836914, "global_step": 134317, "epoch": 799} {"train_loss": -10.70135498046875, "global_step": 134318, "epoch": 799} {"train_loss": -10.415603637695312, "global_step": 134319, "epoch": 799} {"train_loss": -10.10137939453125, "global_step": 134320, "epoch": 799} {"train_loss": -10.256264686584473, "global_step": 134321, "epoch": 799} {"train_loss": -10.766144752502441, "global_step": 134322, "epoch": 799} {"train_loss": -10.222085952758789, "global_step": 134323, "epoch": 799} {"train_loss": -10.589208602905273, "global_step": 134324, "epoch": 799} {"train_loss": -10.409379005432129, "global_step": 134325, "epoch": 799} {"train_loss": -10.673168182373047, "global_step": 134326, "epoch": 799} {"train_loss": -10.22132682800293, "global_step": 134327, "epoch": 799} {"train_loss": -10.600955963134766, "global_step": 134328, "epoch": 799} {"train_loss": -10.652688026428223, "global_step": 134329, "epoch": 799} {"train_loss": -10.356441497802734, "global_step": 134330, "epoch": 799} {"train_loss": -10.209897994995117, "global_step": 134331, "epoch": 799} {"train_loss": -10.454602241516113, "global_step": 134332, "epoch": 799} {"train_loss": -10.202804565429688, "global_step": 134333, "epoch": 799} {"train_loss": -10.116843223571777, "global_step": 134334, "epoch": 799} {"train_loss": -10.0449857711792, "global_step": 134335, "epoch": 799} {"train_loss": -10.504514694213867, "global_step": 134336, "epoch": 799} {"train_loss": -10.266975402832031, "global_step": 134337, "epoch": 799} {"train_loss": -10.56534194946289, "global_step": 134338, "epoch": 799} {"train_loss": -10.576634407043457, "global_step": 134339, "epoch": 799} {"train_loss": -10.2618408203125, "global_step": 134340, "epoch": 799} {"train_loss": -10.404966354370117, "global_step": 134341, "epoch": 799} {"train_loss": -10.717284202575684, "global_step": 134342, "epoch": 799} {"train_loss": -10.617015838623047, "global_step": 134343, "epoch": 799} {"train_loss": -10.327865600585938, "global_step": 134344, "epoch": 799} {"train_loss": -10.499259948730469, "global_step": 134345, "epoch": 799} {"train_loss": -10.530229568481445, "global_step": 134346, "epoch": 799} {"train_loss": -10.67451286315918, "global_step": 134347, "epoch": 799} {"train_loss": -10.728594779968262, "global_step": 134348, "epoch": 799} {"train_loss": -10.71538257598877, "global_step": 134349, "epoch": 799} {"train_loss": -10.729726791381836, "global_step": 134350, "epoch": 799} {"train_loss": -10.424027442932129, "global_step": 134351, "epoch": 799} {"train_loss": -10.490434646606445, "global_step": 134352, "epoch": 799} {"train_loss": -10.759444236755371, "global_step": 134353, "epoch": 799} {"train_loss": -10.535964965820312, "global_step": 134354, "epoch": 799} {"train_loss": -10.646865844726562, "global_step": 134355, "epoch": 799} {"train_loss": -10.485572814941406, "global_step": 134356, "epoch": 799} {"train_loss": -10.645556449890137, "global_step": 134357, "epoch": 799} {"train_loss": -10.50253963470459, "global_step": 134358, "epoch": 799} {"train_loss": -10.294866561889648, "global_step": 134359, "epoch": 799} {"train_loss": -10.238093376159668, "global_step": 134360, "epoch": 799} {"train_loss": -10.491345405578613, "global_step": 134361, "epoch": 799} {"train_loss": -10.300060272216797, "global_step": 134362, "epoch": 799} {"train_loss": -10.333362579345703, "global_step": 134363, "epoch": 799} {"train_loss": -10.606269836425781, "global_step": 134364, "epoch": 799} {"train_loss": -10.418710708618164, "global_step": 134365, "epoch": 799} {"train_loss": -10.354798316955566, "global_step": 134366, "epoch": 799} {"train_loss": -10.462915420532227, "global_step": 134367, "epoch": 799} {"train_loss": -10.411764144897461, "global_step": 134368, "epoch": 799} {"train_loss": -10.480998992919922, "global_step": 134369, "epoch": 799} {"train_loss": -10.236688613891602, "global_step": 134370, "epoch": 799} {"train_loss": -10.658819198608398, "global_step": 134371, "epoch": 799} {"train_loss": -10.675848007202148, "global_step": 134372, "epoch": 799} {"train_loss": -10.578645706176758, "global_step": 134373, "epoch": 799} {"train_loss": -10.581703186035156, "global_step": 134374, "epoch": 799} {"train_loss": -10.522851943969727, "global_step": 134375, "epoch": 799} {"train_loss": -10.692404747009277, "global_step": 134376, "epoch": 799} {"train_loss": -10.306791305541992, "global_step": 134377, "epoch": 799} {"train_loss": -10.516962051391602, "global_step": 134378, "epoch": 799} {"train_loss": -10.424646377563477, "global_step": 134379, "epoch": 799} {"train_loss": -10.493847846984863, "global_step": 134380, "epoch": 799} {"train_loss": -10.652114868164062, "global_step": 134381, "epoch": 799} {"train_loss": -10.77534008026123, "global_step": 134382, "epoch": 799} {"train_loss": -10.477235794067383, "global_step": 134383, "epoch": 799} {"train_loss": -10.554664611816406, "global_step": 134384, "epoch": 799} {"train_loss": -10.798505783081055, "global_step": 134385, "epoch": 799} {"train_loss": -10.542853355407715, "global_step": 134386, "epoch": 799} {"train_loss": -10.660507202148438, "global_step": 134387, "epoch": 799} {"train_loss": -10.401177406311035, "global_step": 134388, "epoch": 799} {"train_loss": -10.577223777770996, "global_step": 134389, "epoch": 799} {"train_loss": -10.392556190490723, "global_step": 134390, "epoch": 799} {"train_loss": -10.262897491455078, "global_step": 134391, "epoch": 799} {"train_loss": -10.496192932128906, "global_step": 134392, "epoch": 799} {"train_loss": -10.027695655822754, "global_step": 134393, "epoch": 799} {"train_loss": -10.718315124511719, "global_step": 134394, "epoch": 799} {"train_loss": -10.499135971069336, "global_step": 134395, "epoch": 799} {"train_loss": -10.511688232421875, "global_step": 134396, "epoch": 799} {"train_loss": -10.505645751953125, "global_step": 134397, "epoch": 799} {"train_loss": -10.627811431884766, "global_step": 134398, "epoch": 799} {"train_loss": -10.411766137395587, "global_step": 134399, "epoch": 799, "val_loss": 220638.828125} {"train_loss": -10.374734878540039, "global_step": 134400, "epoch": 800} {"train_loss": -10.443052291870117, "global_step": 134401, "epoch": 800} {"train_loss": -10.405292510986328, "global_step": 134402, "epoch": 800} {"train_loss": -10.143003463745117, "global_step": 134403, "epoch": 800} {"train_loss": -10.310253143310547, "global_step": 134404, "epoch": 800} {"train_loss": -10.583078384399414, "global_step": 134405, "epoch": 800} {"train_loss": -10.172218322753906, "global_step": 134406, "epoch": 800} {"train_loss": -10.316497802734375, "global_step": 134407, "epoch": 800} {"train_loss": -10.26722526550293, "global_step": 134408, "epoch": 800} {"train_loss": -10.448766708374023, "global_step": 134409, "epoch": 800} {"train_loss": -10.264087677001953, "global_step": 134410, "epoch": 800} {"train_loss": -10.573341369628906, "global_step": 134411, "epoch": 800} {"train_loss": -10.099181175231934, "global_step": 134412, "epoch": 800} {"train_loss": -10.464889526367188, "global_step": 134413, "epoch": 800} {"train_loss": -10.301650047302246, "global_step": 134414, "epoch": 800} {"train_loss": -10.292388916015625, "global_step": 134415, "epoch": 800} {"train_loss": -10.475732803344727, "global_step": 134416, "epoch": 800} {"train_loss": -9.964338302612305, "global_step": 134417, "epoch": 800} {"train_loss": -10.643829345703125, "global_step": 134418, "epoch": 800} {"train_loss": -10.294073104858398, "global_step": 134419, "epoch": 800} {"train_loss": -10.389740943908691, "global_step": 134420, "epoch": 800} {"train_loss": -10.437543869018555, "global_step": 134421, "epoch": 800} {"train_loss": -9.84249496459961, "global_step": 134422, "epoch": 800} {"train_loss": -10.680000305175781, "global_step": 134423, "epoch": 800} {"train_loss": -10.017885208129883, "global_step": 134424, "epoch": 800} {"train_loss": -10.243719100952148, "global_step": 134425, "epoch": 800} {"train_loss": -10.528727531433105, "global_step": 134426, "epoch": 800} {"train_loss": -10.219522476196289, "global_step": 134427, "epoch": 800} {"train_loss": -10.521909713745117, "global_step": 134428, "epoch": 800} {"train_loss": -10.254655838012695, "global_step": 134429, "epoch": 800} {"train_loss": -10.457040786743164, "global_step": 134430, "epoch": 800} {"train_loss": -9.961196899414062, "global_step": 134431, "epoch": 800} {"train_loss": -9.913366317749023, "global_step": 134432, "epoch": 800} {"train_loss": -10.53304386138916, "global_step": 134433, "epoch": 800} {"train_loss": -10.137840270996094, "global_step": 134434, "epoch": 800} {"train_loss": -10.301668167114258, "global_step": 134435, "epoch": 800} {"train_loss": -10.477828979492188, "global_step": 134436, "epoch": 800} {"train_loss": -10.504806518554688, "global_step": 134437, "epoch": 800} {"train_loss": -10.433967590332031, "global_step": 134438, "epoch": 800} {"train_loss": -10.382431983947754, "global_step": 134439, "epoch": 800} {"train_loss": -10.604486465454102, "global_step": 134440, "epoch": 800} {"train_loss": -10.27602767944336, "global_step": 134441, "epoch": 800} {"train_loss": -10.410348892211914, "global_step": 134442, "epoch": 800} {"train_loss": -10.343406677246094, "global_step": 134443, "epoch": 800} {"train_loss": -10.483964920043945, "global_step": 134444, "epoch": 800} {"train_loss": -10.449200630187988, "global_step": 134445, "epoch": 800} {"train_loss": -10.565780639648438, "global_step": 134446, "epoch": 800} {"train_loss": -10.399526596069336, "global_step": 134447, "epoch": 800} {"train_loss": -10.624082565307617, "global_step": 134448, "epoch": 800} {"train_loss": -10.409209251403809, "global_step": 134449, "epoch": 800} {"train_loss": -10.667101860046387, "global_step": 134450, "epoch": 800} {"train_loss": -10.499282836914062, "global_step": 134451, "epoch": 800} {"train_loss": -10.428421020507812, "global_step": 134452, "epoch": 800} {"train_loss": -10.508288383483887, "global_step": 134453, "epoch": 800} {"train_loss": -10.604634284973145, "global_step": 134454, "epoch": 800} {"train_loss": -10.400259017944336, "global_step": 134455, "epoch": 800} {"train_loss": -10.615830421447754, "global_step": 134456, "epoch": 800} {"train_loss": -10.738025665283203, "global_step": 134457, "epoch": 800} {"train_loss": -10.521692276000977, "global_step": 134458, "epoch": 800} {"train_loss": -10.555618286132812, "global_step": 134459, "epoch": 800} {"train_loss": -10.552570343017578, "global_step": 134460, "epoch": 800} {"train_loss": -10.443968772888184, "global_step": 134461, "epoch": 800} {"train_loss": -10.514232635498047, "global_step": 134462, "epoch": 800} {"train_loss": -10.242646217346191, "global_step": 134463, "epoch": 800} {"train_loss": -10.519881248474121, "global_step": 134464, "epoch": 800} {"train_loss": -10.326616287231445, "global_step": 134465, "epoch": 800} {"train_loss": -10.641106605529785, "global_step": 134466, "epoch": 800} {"train_loss": -10.402647018432617, "global_step": 134467, "epoch": 800} {"train_loss": -10.441993713378906, "global_step": 134468, "epoch": 800} {"train_loss": -10.575878143310547, "global_step": 134469, "epoch": 800} {"train_loss": -10.377721786499023, "global_step": 134470, "epoch": 800} {"train_loss": -10.727285385131836, "global_step": 134471, "epoch": 800} {"train_loss": -10.001422882080078, "global_step": 134472, "epoch": 800} {"train_loss": -10.627678871154785, "global_step": 134473, "epoch": 800} {"train_loss": -10.409215927124023, "global_step": 134474, "epoch": 800} {"train_loss": -10.485198974609375, "global_step": 134475, "epoch": 800} {"train_loss": -10.489031791687012, "global_step": 134476, "epoch": 800} {"train_loss": -10.323262214660645, "global_step": 134477, "epoch": 800} {"train_loss": -10.4407320022583, "global_step": 134478, "epoch": 800} {"train_loss": -10.496994018554688, "global_step": 134479, "epoch": 800} {"train_loss": -10.642682075500488, "global_step": 134480, "epoch": 800} {"train_loss": -10.558941841125488, "global_step": 134481, "epoch": 800} {"train_loss": -10.175809860229492, "global_step": 134482, "epoch": 800} {"train_loss": -10.392370223999023, "global_step": 134483, "epoch": 800} {"train_loss": -10.404218673706055, "global_step": 134484, "epoch": 800} {"train_loss": -10.058650970458984, "global_step": 134485, "epoch": 800} {"train_loss": -10.390262603759766, "global_step": 134486, "epoch": 800} {"train_loss": -9.845706939697266, "global_step": 134487, "epoch": 800} {"train_loss": -9.546541213989258, "global_step": 134488, "epoch": 800} {"train_loss": -8.7912015914917, "global_step": 134489, "epoch": 800} {"train_loss": -9.082354545593262, "global_step": 134490, "epoch": 800} {"train_loss": -9.773279190063477, "global_step": 134491, "epoch": 800} {"train_loss": -9.350555419921875, "global_step": 134492, "epoch": 800} {"train_loss": -10.045805931091309, "global_step": 134493, "epoch": 800} {"train_loss": -9.10133171081543, "global_step": 134494, "epoch": 800} {"train_loss": -10.057731628417969, "global_step": 134495, "epoch": 800} {"train_loss": -9.601391792297363, "global_step": 134496, "epoch": 800} {"train_loss": -9.956003189086914, "global_step": 134497, "epoch": 800} {"train_loss": -9.536579132080078, "global_step": 134498, "epoch": 800} {"train_loss": -10.06977653503418, "global_step": 134499, "epoch": 800} {"train_loss": -9.737926483154297, "global_step": 134500, "epoch": 800} {"train_loss": -10.227805137634277, "global_step": 134501, "epoch": 800} {"train_loss": -9.88388442993164, "global_step": 134502, "epoch": 800} {"train_loss": -10.333911895751953, "global_step": 134503, "epoch": 800} {"train_loss": -10.233283996582031, "global_step": 134504, "epoch": 800} {"train_loss": -9.995320320129395, "global_step": 134505, "epoch": 800} {"train_loss": -10.242998123168945, "global_step": 134506, "epoch": 800} {"train_loss": -10.240177154541016, "global_step": 134507, "epoch": 800} {"train_loss": -10.11123275756836, "global_step": 134508, "epoch": 800} {"train_loss": -10.215486526489258, "global_step": 134509, "epoch": 800} {"train_loss": -10.359691619873047, "global_step": 134510, "epoch": 800} {"train_loss": -10.120403289794922, "global_step": 134511, "epoch": 800} {"train_loss": -10.378138542175293, "global_step": 134512, "epoch": 800} {"train_loss": -10.10202407836914, "global_step": 134513, "epoch": 800} {"train_loss": -10.404869079589844, "global_step": 134514, "epoch": 800} {"train_loss": -10.230391502380371, "global_step": 134515, "epoch": 800} {"train_loss": -10.243659973144531, "global_step": 134516, "epoch": 800} {"train_loss": -10.146608352661133, "global_step": 134517, "epoch": 800} {"train_loss": -10.44381332397461, "global_step": 134518, "epoch": 800} {"train_loss": -10.320627212524414, "global_step": 134519, "epoch": 800} {"train_loss": -10.377754211425781, "global_step": 134520, "epoch": 800} {"train_loss": -10.341832160949707, "global_step": 134521, "epoch": 800} {"train_loss": -10.428814888000488, "global_step": 134522, "epoch": 800} {"train_loss": -10.374006271362305, "global_step": 134523, "epoch": 800} {"train_loss": -10.442407608032227, "global_step": 134524, "epoch": 800} {"train_loss": -10.457939147949219, "global_step": 134525, "epoch": 800} {"train_loss": -10.395964622497559, "global_step": 134526, "epoch": 800} {"train_loss": -10.458093643188477, "global_step": 134527, "epoch": 800} {"train_loss": -10.412338256835938, "global_step": 134528, "epoch": 800} {"train_loss": -10.557295799255371, "global_step": 134529, "epoch": 800} {"train_loss": -10.44011116027832, "global_step": 134530, "epoch": 800} {"train_loss": -10.645791053771973, "global_step": 134531, "epoch": 800} {"train_loss": -10.39797592163086, "global_step": 134532, "epoch": 800} {"train_loss": -10.656171798706055, "global_step": 134533, "epoch": 800} {"train_loss": -10.662660598754883, "global_step": 134534, "epoch": 800} {"train_loss": -10.478443145751953, "global_step": 134535, "epoch": 800} {"train_loss": -10.524140357971191, "global_step": 134536, "epoch": 800} {"train_loss": -10.6520357131958, "global_step": 134537, "epoch": 800} {"train_loss": -10.69782543182373, "global_step": 134538, "epoch": 800} {"train_loss": -10.487826347351074, "global_step": 134539, "epoch": 800} {"train_loss": -10.88334846496582, "global_step": 134540, "epoch": 800} {"train_loss": -10.629011154174805, "global_step": 134541, "epoch": 800} {"train_loss": -10.795405387878418, "global_step": 134542, "epoch": 800} {"train_loss": -10.818094253540039, "global_step": 134543, "epoch": 800} {"train_loss": -10.710959434509277, "global_step": 134544, "epoch": 800} {"train_loss": -10.589861869812012, "global_step": 134545, "epoch": 800} {"train_loss": -10.74536418914795, "global_step": 134546, "epoch": 800} {"train_loss": -10.61465835571289, "global_step": 134547, "epoch": 800} {"train_loss": -10.585783004760742, "global_step": 134548, "epoch": 800} {"train_loss": -10.763004302978516, "global_step": 134549, "epoch": 800} {"train_loss": -10.727030754089355, "global_step": 134550, "epoch": 800} {"train_loss": -10.587600708007812, "global_step": 134551, "epoch": 800} {"train_loss": -10.716935157775879, "global_step": 134552, "epoch": 800} {"train_loss": -10.654200553894043, "global_step": 134553, "epoch": 800} {"train_loss": -10.710826873779297, "global_step": 134554, "epoch": 800} {"train_loss": -10.321252822875977, "global_step": 134555, "epoch": 800} {"train_loss": -10.540521621704102, "global_step": 134556, "epoch": 800} {"train_loss": -10.290660858154297, "global_step": 134557, "epoch": 800} {"train_loss": -10.705793380737305, "global_step": 134558, "epoch": 800} {"train_loss": -10.238404273986816, "global_step": 134559, "epoch": 800} {"train_loss": -10.580150604248047, "global_step": 134560, "epoch": 800} {"train_loss": -10.403039932250977, "global_step": 134561, "epoch": 800} {"train_loss": -10.45970630645752, "global_step": 134562, "epoch": 800} {"train_loss": -10.437851905822754, "global_step": 134563, "epoch": 800} {"train_loss": -10.166260719299316, "global_step": 134564, "epoch": 800} {"train_loss": -10.659740447998047, "global_step": 134565, "epoch": 800} {"train_loss": -10.168951034545898, "global_step": 134566, "epoch": 800} {"train_loss": -10.352953893797737, "global_step": 134567, "epoch": 800, "train/sim_max_reward_0": 0.5045899027254207, "train/sim_max_reward_1": 0.9548133290129632, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.4422303463964311, "train/sim_max_reward_4": 0.9839287113597895, "train/sim_max_reward_5": 0.5744421308112188, "test/sim_max_reward_4400000": 0.269005906768891, "test/sim_max_reward_4400001": 0.32568860448189585, "test/sim_max_reward_4400002": 0.07695188868648646, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.4066770640147294, "test/sim_max_reward_4400005": 0.4957740072141094, "test/sim_max_reward_4400006": 0.30878731791391884, "test/sim_max_reward_4400007": 0.24840296570797604, "test/sim_max_reward_4400008": 0.6192886056368927, "test/sim_max_reward_4400009": 0.414208118329179, "test/sim_max_reward_4400010": 0.9750306850886409, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 0.4199673281840554, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9930167069511697, "test/sim_max_reward_4400019": 0.25458220676831783, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9420678791167472, "test/sim_max_reward_4400023": 0.15965738496500043, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6582200727341948, "test/sim_max_reward_4400026": 0.07280296357824649, "test/sim_max_reward_4400027": 0.18790936256007593, "test/sim_max_reward_4400028": 0.010363480295857097, "test/sim_max_reward_4400029": 0.49283504400464856, "test/sim_max_reward_4400030": 0.9241089320077363, "test/sim_max_reward_4400031": 0.9870762740415454, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.15598148320856023, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.965465103971642, "test/sim_max_reward_4400036": 0.3780723792677014, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9317319808712395, "test/sim_max_reward_4400042": 0.9599249997596248, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.17644143030932644, "test/sim_max_reward_4400045": 0.9774471464729981, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.5766674033843039, "test/mean_score": 0.5119884076626897, "val_loss": 222316.65625, "train_action_mse_error": 7.250169277191162} {"train_loss": -10.225194931030273, "global_step": 134568, "epoch": 801} {"train_loss": -10.508833885192871, "global_step": 134569, "epoch": 801} {"train_loss": -9.885904312133789, "global_step": 134570, "epoch": 801} {"train_loss": -10.098724365234375, "global_step": 134571, "epoch": 801} {"train_loss": -10.119760513305664, "global_step": 134572, "epoch": 801} {"train_loss": -9.85230827331543, "global_step": 134573, "epoch": 801} {"train_loss": -10.451705932617188, "global_step": 134574, "epoch": 801} {"train_loss": -9.49226188659668, "global_step": 134575, "epoch": 801} {"train_loss": -10.382646560668945, "global_step": 134576, "epoch": 801} {"train_loss": -10.310341835021973, "global_step": 134577, "epoch": 801} {"train_loss": -9.957683563232422, "global_step": 134578, "epoch": 801} {"train_loss": -10.180965423583984, "global_step": 134579, "epoch": 801} {"train_loss": -10.136850357055664, "global_step": 134580, "epoch": 801} {"train_loss": -10.496760368347168, "global_step": 134581, "epoch": 801} {"train_loss": -10.17490005493164, "global_step": 134582, "epoch": 801} {"train_loss": -10.529630661010742, "global_step": 134583, "epoch": 801} {"train_loss": -10.032621383666992, "global_step": 134584, "epoch": 801} {"train_loss": -10.591930389404297, "global_step": 134585, "epoch": 801} {"train_loss": -10.516094207763672, "global_step": 134586, "epoch": 801} {"train_loss": -10.484647750854492, "global_step": 134587, "epoch": 801} {"train_loss": -9.973894119262695, "global_step": 134588, "epoch": 801} {"train_loss": -10.290717124938965, "global_step": 134589, "epoch": 801} {"train_loss": -10.261526107788086, "global_step": 134590, "epoch": 801} {"train_loss": -10.208671569824219, "global_step": 134591, "epoch": 801} {"train_loss": -10.192655563354492, "global_step": 134592, "epoch": 801} {"train_loss": -10.479961395263672, "global_step": 134593, "epoch": 801} {"train_loss": -10.241108894348145, "global_step": 134594, "epoch": 801} {"train_loss": -10.459870338439941, "global_step": 134595, "epoch": 801} {"train_loss": -10.36658000946045, "global_step": 134596, "epoch": 801} {"train_loss": -10.344470024108887, "global_step": 134597, "epoch": 801} {"train_loss": -10.68124008178711, "global_step": 134598, "epoch": 801} {"train_loss": -10.397560119628906, "global_step": 134599, "epoch": 801} {"train_loss": -10.402261734008789, "global_step": 134600, "epoch": 801} {"train_loss": -10.421381950378418, "global_step": 134601, "epoch": 801} {"train_loss": -10.320512771606445, "global_step": 134602, "epoch": 801} {"train_loss": -10.50277042388916, "global_step": 134603, "epoch": 801} {"train_loss": -10.450544357299805, "global_step": 134604, "epoch": 801} {"train_loss": -10.369712829589844, "global_step": 134605, "epoch": 801} {"train_loss": -10.589839935302734, "global_step": 134606, "epoch": 801} {"train_loss": -10.58998966217041, "global_step": 134607, "epoch": 801} {"train_loss": -10.48693561553955, "global_step": 134608, "epoch": 801} {"train_loss": -10.564035415649414, "global_step": 134609, "epoch": 801} {"train_loss": -10.612807273864746, "global_step": 134610, "epoch": 801} {"train_loss": -10.406304359436035, "global_step": 134611, "epoch": 801} {"train_loss": -10.53877067565918, "global_step": 134612, "epoch": 801} {"train_loss": -10.539020538330078, "global_step": 134613, "epoch": 801} {"train_loss": -10.475288391113281, "global_step": 134614, "epoch": 801} {"train_loss": -10.607394218444824, "global_step": 134615, "epoch": 801} {"train_loss": -10.723215103149414, "global_step": 134616, "epoch": 801} {"train_loss": -10.613462448120117, "global_step": 134617, "epoch": 801} {"train_loss": -10.544889450073242, "global_step": 134618, "epoch": 801} {"train_loss": -10.509157180786133, "global_step": 134619, "epoch": 801} {"train_loss": -10.64461612701416, "global_step": 134620, "epoch": 801} {"train_loss": -10.577438354492188, "global_step": 134621, "epoch": 801} {"train_loss": -10.758401870727539, "global_step": 134622, "epoch": 801} {"train_loss": -10.459603309631348, "global_step": 134623, "epoch": 801} {"train_loss": -10.586553573608398, "global_step": 134624, "epoch": 801} {"train_loss": -10.694530487060547, "global_step": 134625, "epoch": 801} {"train_loss": -10.617927551269531, "global_step": 134626, "epoch": 801} {"train_loss": -10.539060592651367, "global_step": 134627, "epoch": 801} {"train_loss": -10.571782112121582, "global_step": 134628, "epoch": 801} {"train_loss": -10.51750373840332, "global_step": 134629, "epoch": 801} {"train_loss": -10.19278621673584, "global_step": 134630, "epoch": 801} {"train_loss": -10.644491195678711, "global_step": 134631, "epoch": 801} {"train_loss": -10.463973045349121, "global_step": 134632, "epoch": 801} {"train_loss": -10.55023193359375, "global_step": 134633, "epoch": 801} {"train_loss": -10.299598693847656, "global_step": 134634, "epoch": 801} {"train_loss": -10.661598205566406, "global_step": 134635, "epoch": 801} {"train_loss": -10.471449851989746, "global_step": 134636, "epoch": 801} {"train_loss": -10.325632095336914, "global_step": 134637, "epoch": 801} {"train_loss": -10.808391571044922, "global_step": 134638, "epoch": 801} {"train_loss": -10.304149627685547, "global_step": 134639, "epoch": 801} {"train_loss": -10.29780387878418, "global_step": 134640, "epoch": 801} {"train_loss": -10.23581314086914, "global_step": 134641, "epoch": 801} {"train_loss": -10.088973045349121, "global_step": 134642, "epoch": 801} {"train_loss": -10.49741268157959, "global_step": 134643, "epoch": 801} {"train_loss": -10.279863357543945, "global_step": 134644, "epoch": 801} {"train_loss": -10.337562561035156, "global_step": 134645, "epoch": 801} {"train_loss": -10.34566879272461, "global_step": 134646, "epoch": 801} {"train_loss": -10.572542190551758, "global_step": 134647, "epoch": 801} {"train_loss": -10.521926879882812, "global_step": 134648, "epoch": 801} {"train_loss": -10.438911437988281, "global_step": 134649, "epoch": 801} {"train_loss": -10.683100700378418, "global_step": 134650, "epoch": 801} {"train_loss": -10.66961669921875, "global_step": 134651, "epoch": 801} {"train_loss": -10.529415130615234, "global_step": 134652, "epoch": 801} {"train_loss": -10.414243698120117, "global_step": 134653, "epoch": 801} {"train_loss": -10.442026138305664, "global_step": 134654, "epoch": 801} {"train_loss": -10.403881072998047, "global_step": 134655, "epoch": 801} {"train_loss": -10.349831581115723, "global_step": 134656, "epoch": 801} {"train_loss": -10.065595626831055, "global_step": 134657, "epoch": 801} {"train_loss": -10.214672088623047, "global_step": 134658, "epoch": 801} {"train_loss": -10.47771167755127, "global_step": 134659, "epoch": 801} {"train_loss": -10.080131530761719, "global_step": 134660, "epoch": 801} {"train_loss": -9.777515411376953, "global_step": 134661, "epoch": 801} {"train_loss": -9.75987720489502, "global_step": 134662, "epoch": 801} {"train_loss": -8.984835624694824, "global_step": 134663, "epoch": 801} {"train_loss": -10.138399124145508, "global_step": 134664, "epoch": 801} {"train_loss": -9.364429473876953, "global_step": 134665, "epoch": 801} {"train_loss": -10.355268478393555, "global_step": 134666, "epoch": 801} {"train_loss": -9.272665023803711, "global_step": 134667, "epoch": 801} {"train_loss": -10.031312942504883, "global_step": 134668, "epoch": 801} {"train_loss": -9.446345329284668, "global_step": 134669, "epoch": 801} {"train_loss": -9.935506820678711, "global_step": 134670, "epoch": 801} {"train_loss": -9.736040115356445, "global_step": 134671, "epoch": 801} {"train_loss": -10.220710754394531, "global_step": 134672, "epoch": 801} {"train_loss": -10.009797096252441, "global_step": 134673, "epoch": 801} {"train_loss": -10.428750991821289, "global_step": 134674, "epoch": 801} {"train_loss": -10.229043006896973, "global_step": 134675, "epoch": 801} {"train_loss": -10.24717903137207, "global_step": 134676, "epoch": 801} {"train_loss": -9.923802375793457, "global_step": 134677, "epoch": 801} {"train_loss": -10.313472747802734, "global_step": 134678, "epoch": 801} {"train_loss": -9.942161560058594, "global_step": 134679, "epoch": 801} {"train_loss": -10.331754684448242, "global_step": 134680, "epoch": 801} {"train_loss": -10.026302337646484, "global_step": 134681, "epoch": 801} {"train_loss": -10.263969421386719, "global_step": 134682, "epoch": 801} {"train_loss": -10.461938858032227, "global_step": 134683, "epoch": 801} {"train_loss": -10.271055221557617, "global_step": 134684, "epoch": 801} {"train_loss": -10.20286750793457, "global_step": 134685, "epoch": 801} {"train_loss": -10.356562614440918, "global_step": 134686, "epoch": 801} {"train_loss": -10.25932788848877, "global_step": 134687, "epoch": 801} {"train_loss": -10.52581787109375, "global_step": 134688, "epoch": 801} {"train_loss": -10.523513793945312, "global_step": 134689, "epoch": 801} {"train_loss": -10.598677635192871, "global_step": 134690, "epoch": 801} {"train_loss": -10.441629409790039, "global_step": 134691, "epoch": 801} {"train_loss": -10.537425994873047, "global_step": 134692, "epoch": 801} {"train_loss": -10.621805191040039, "global_step": 134693, "epoch": 801} {"train_loss": -10.714550018310547, "global_step": 134694, "epoch": 801} {"train_loss": -10.471988677978516, "global_step": 134695, "epoch": 801} {"train_loss": -10.615034103393555, "global_step": 134696, "epoch": 801} {"train_loss": -10.50943374633789, "global_step": 134697, "epoch": 801} {"train_loss": -10.489828109741211, "global_step": 134698, "epoch": 801} {"train_loss": -10.567155838012695, "global_step": 134699, "epoch": 801} {"train_loss": -10.667937278747559, "global_step": 134700, "epoch": 801} {"train_loss": -10.61286735534668, "global_step": 134701, "epoch": 801} {"train_loss": -10.697084426879883, "global_step": 134702, "epoch": 801} {"train_loss": -10.63284969329834, "global_step": 134703, "epoch": 801} {"train_loss": -10.541742324829102, "global_step": 134704, "epoch": 801} {"train_loss": -10.654016494750977, "global_step": 134705, "epoch": 801} {"train_loss": -10.553695678710938, "global_step": 134706, "epoch": 801} {"train_loss": -10.546541213989258, "global_step": 134707, "epoch": 801} {"train_loss": -10.69466781616211, "global_step": 134708, "epoch": 801} {"train_loss": -10.90207290649414, "global_step": 134709, "epoch": 801} {"train_loss": -10.561485290527344, "global_step": 134710, "epoch": 801} {"train_loss": -10.723736763000488, "global_step": 134711, "epoch": 801} {"train_loss": -10.639301300048828, "global_step": 134712, "epoch": 801} {"train_loss": -10.995674133300781, "global_step": 134713, "epoch": 801} {"train_loss": -10.534892082214355, "global_step": 134714, "epoch": 801} {"train_loss": -10.783452987670898, "global_step": 134715, "epoch": 801} {"train_loss": -10.591867446899414, "global_step": 134716, "epoch": 801} {"train_loss": -10.27604866027832, "global_step": 134717, "epoch": 801} {"train_loss": -10.213172912597656, "global_step": 134718, "epoch": 801} {"train_loss": -10.171808242797852, "global_step": 134719, "epoch": 801} {"train_loss": -10.434194564819336, "global_step": 134720, "epoch": 801} {"train_loss": -10.382868766784668, "global_step": 134721, "epoch": 801} {"train_loss": -10.594050407409668, "global_step": 134722, "epoch": 801} {"train_loss": -10.640968322753906, "global_step": 134723, "epoch": 801} {"train_loss": -10.824066162109375, "global_step": 134724, "epoch": 801} {"train_loss": -10.648475646972656, "global_step": 134725, "epoch": 801} {"train_loss": -10.663705825805664, "global_step": 134726, "epoch": 801} {"train_loss": -9.924001693725586, "global_step": 134727, "epoch": 801} {"train_loss": -10.451139450073242, "global_step": 134728, "epoch": 801} {"train_loss": -10.56688117980957, "global_step": 134729, "epoch": 801} {"train_loss": -10.499399185180664, "global_step": 134730, "epoch": 801} {"train_loss": -10.41858959197998, "global_step": 134731, "epoch": 801} {"train_loss": -10.309759140014648, "global_step": 134732, "epoch": 801} {"train_loss": -9.981159210205078, "global_step": 134733, "epoch": 801} {"train_loss": -10.63206958770752, "global_step": 134734, "epoch": 801} {"train_loss": -10.374016057877313, "global_step": 134735, "epoch": 801, "val_loss": 222101.578125} {"train_loss": -10.362939834594727, "global_step": 134736, "epoch": 802} {"train_loss": -10.173978805541992, "global_step": 134737, "epoch": 802} {"train_loss": -10.132126808166504, "global_step": 134738, "epoch": 802} {"train_loss": -10.539861679077148, "global_step": 134739, "epoch": 802} {"train_loss": -10.183948516845703, "global_step": 134740, "epoch": 802} {"train_loss": -10.224355697631836, "global_step": 134741, "epoch": 802} {"train_loss": -10.183387756347656, "global_step": 134742, "epoch": 802} {"train_loss": -10.092811584472656, "global_step": 134743, "epoch": 802} {"train_loss": -10.2481107711792, "global_step": 134744, "epoch": 802} {"train_loss": -10.132887840270996, "global_step": 134745, "epoch": 802} {"train_loss": -9.987712860107422, "global_step": 134746, "epoch": 802} {"train_loss": -10.078780174255371, "global_step": 134747, "epoch": 802} {"train_loss": -9.452613830566406, "global_step": 134748, "epoch": 802} {"train_loss": -9.743590354919434, "global_step": 134749, "epoch": 802} {"train_loss": -10.271738052368164, "global_step": 134750, "epoch": 802} {"train_loss": -9.82155990600586, "global_step": 134751, "epoch": 802} {"train_loss": -10.547276496887207, "global_step": 134752, "epoch": 802} {"train_loss": -10.05385684967041, "global_step": 134753, "epoch": 802} {"train_loss": -10.330270767211914, "global_step": 134754, "epoch": 802} {"train_loss": -10.229144096374512, "global_step": 134755, "epoch": 802} {"train_loss": -10.078965187072754, "global_step": 134756, "epoch": 802} {"train_loss": -10.289644241333008, "global_step": 134757, "epoch": 802} {"train_loss": -10.310019493103027, "global_step": 134758, "epoch": 802} {"train_loss": -10.06716537475586, "global_step": 134759, "epoch": 802} {"train_loss": -10.58403205871582, "global_step": 134760, "epoch": 802} {"train_loss": -10.258514404296875, "global_step": 134761, "epoch": 802} {"train_loss": -10.490758895874023, "global_step": 134762, "epoch": 802} {"train_loss": -10.335596084594727, "global_step": 134763, "epoch": 802} {"train_loss": -10.445980072021484, "global_step": 134764, "epoch": 802} {"train_loss": -10.548103332519531, "global_step": 134765, "epoch": 802} {"train_loss": -10.40325927734375, "global_step": 134766, "epoch": 802} {"train_loss": -10.50483512878418, "global_step": 134767, "epoch": 802} {"train_loss": -10.352672576904297, "global_step": 134768, "epoch": 802} {"train_loss": -10.442315101623535, "global_step": 134769, "epoch": 802} {"train_loss": -10.631951332092285, "global_step": 134770, "epoch": 802} {"train_loss": -10.41183853149414, "global_step": 134771, "epoch": 802} {"train_loss": -10.538116455078125, "global_step": 134772, "epoch": 802} {"train_loss": -10.638137817382812, "global_step": 134773, "epoch": 802} {"train_loss": -10.550342559814453, "global_step": 134774, "epoch": 802} {"train_loss": -10.588383674621582, "global_step": 134775, "epoch": 802} {"train_loss": -10.55729866027832, "global_step": 134776, "epoch": 802} {"train_loss": -10.687687873840332, "global_step": 134777, "epoch": 802} {"train_loss": -10.585636138916016, "global_step": 134778, "epoch": 802} {"train_loss": -10.783687591552734, "global_step": 134779, "epoch": 802} {"train_loss": -10.685528755187988, "global_step": 134780, "epoch": 802} {"train_loss": -10.875696182250977, "global_step": 134781, "epoch": 802} {"train_loss": -10.550867080688477, "global_step": 134782, "epoch": 802} {"train_loss": -10.545320510864258, "global_step": 134783, "epoch": 802} {"train_loss": -10.574664115905762, "global_step": 134784, "epoch": 802} {"train_loss": -10.487215995788574, "global_step": 134785, "epoch": 802} {"train_loss": -10.364190101623535, "global_step": 134786, "epoch": 802} {"train_loss": -10.319791793823242, "global_step": 134787, "epoch": 802} {"train_loss": -10.537771224975586, "global_step": 134788, "epoch": 802} {"train_loss": -10.672199249267578, "global_step": 134789, "epoch": 802} {"train_loss": -10.462686538696289, "global_step": 134790, "epoch": 802} {"train_loss": -10.665473937988281, "global_step": 134791, "epoch": 802} {"train_loss": -10.484813690185547, "global_step": 134792, "epoch": 802} {"train_loss": -10.490289688110352, "global_step": 134793, "epoch": 802} {"train_loss": -10.585813522338867, "global_step": 134794, "epoch": 802} {"train_loss": -10.585569381713867, "global_step": 134795, "epoch": 802} {"train_loss": -10.401664733886719, "global_step": 134796, "epoch": 802} {"train_loss": -10.258408546447754, "global_step": 134797, "epoch": 802} {"train_loss": -10.703192710876465, "global_step": 134798, "epoch": 802} {"train_loss": -10.541243553161621, "global_step": 134799, "epoch": 802} {"train_loss": -10.631389617919922, "global_step": 134800, "epoch": 802} {"train_loss": -10.481819152832031, "global_step": 134801, "epoch": 802} {"train_loss": -10.624677658081055, "global_step": 134802, "epoch": 802} {"train_loss": -10.493861198425293, "global_step": 134803, "epoch": 802} {"train_loss": -10.255294799804688, "global_step": 134804, "epoch": 802} {"train_loss": -10.641744613647461, "global_step": 134805, "epoch": 802} {"train_loss": -9.997518539428711, "global_step": 134806, "epoch": 802} {"train_loss": -10.489190101623535, "global_step": 134807, "epoch": 802} {"train_loss": -10.551189422607422, "global_step": 134808, "epoch": 802} {"train_loss": -10.316459655761719, "global_step": 134809, "epoch": 802} {"train_loss": -9.638605117797852, "global_step": 134810, "epoch": 802} {"train_loss": -10.553062438964844, "global_step": 134811, "epoch": 802} {"train_loss": -9.926692962646484, "global_step": 134812, "epoch": 802} {"train_loss": -10.619885444641113, "global_step": 134813, "epoch": 802} {"train_loss": -10.168996810913086, "global_step": 134814, "epoch": 802} {"train_loss": -10.265734672546387, "global_step": 134815, "epoch": 802} {"train_loss": -10.617484092712402, "global_step": 134816, "epoch": 802} {"train_loss": -10.527570724487305, "global_step": 134817, "epoch": 802} {"train_loss": -10.534381866455078, "global_step": 134818, "epoch": 802} {"train_loss": -10.123207092285156, "global_step": 134819, "epoch": 802} {"train_loss": -10.635669708251953, "global_step": 134820, "epoch": 802} {"train_loss": -10.406394958496094, "global_step": 134821, "epoch": 802} {"train_loss": -10.677327156066895, "global_step": 134822, "epoch": 802} {"train_loss": -10.595184326171875, "global_step": 134823, "epoch": 802} {"train_loss": -10.341346740722656, "global_step": 134824, "epoch": 802} {"train_loss": -10.400442123413086, "global_step": 134825, "epoch": 802} {"train_loss": -10.03730297088623, "global_step": 134826, "epoch": 802} {"train_loss": -10.45350456237793, "global_step": 134827, "epoch": 802} {"train_loss": -10.083333015441895, "global_step": 134828, "epoch": 802} {"train_loss": -10.565994262695312, "global_step": 134829, "epoch": 802} {"train_loss": -10.204248428344727, "global_step": 134830, "epoch": 802} {"train_loss": -10.45549201965332, "global_step": 134831, "epoch": 802} {"train_loss": -10.317391395568848, "global_step": 134832, "epoch": 802} {"train_loss": -9.946687698364258, "global_step": 134833, "epoch": 802} {"train_loss": -10.86741828918457, "global_step": 134834, "epoch": 802} {"train_loss": -10.187176704406738, "global_step": 134835, "epoch": 802} {"train_loss": -10.482912063598633, "global_step": 134836, "epoch": 802} {"train_loss": -10.531421661376953, "global_step": 134837, "epoch": 802} {"train_loss": -10.56860637664795, "global_step": 134838, "epoch": 802} {"train_loss": -10.650579452514648, "global_step": 134839, "epoch": 802} {"train_loss": -10.455102920532227, "global_step": 134840, "epoch": 802} {"train_loss": -10.563399314880371, "global_step": 134841, "epoch": 802} {"train_loss": -10.40274715423584, "global_step": 134842, "epoch": 802} {"train_loss": -10.668512344360352, "global_step": 134843, "epoch": 802} {"train_loss": -10.754786491394043, "global_step": 134844, "epoch": 802} {"train_loss": -10.587494850158691, "global_step": 134845, "epoch": 802} {"train_loss": -10.835641860961914, "global_step": 134846, "epoch": 802} {"train_loss": -10.285757064819336, "global_step": 134847, "epoch": 802} {"train_loss": -10.539900779724121, "global_step": 134848, "epoch": 802} {"train_loss": -10.6985502243042, "global_step": 134849, "epoch": 802} {"train_loss": -10.5106201171875, "global_step": 134850, "epoch": 802} {"train_loss": -10.60405445098877, "global_step": 134851, "epoch": 802} {"train_loss": -10.551830291748047, "global_step": 134852, "epoch": 802} {"train_loss": -10.573308944702148, "global_step": 134853, "epoch": 802} {"train_loss": -10.757857322692871, "global_step": 134854, "epoch": 802} {"train_loss": -10.37765884399414, "global_step": 134855, "epoch": 802} {"train_loss": -10.719963073730469, "global_step": 134856, "epoch": 802} {"train_loss": -10.543462753295898, "global_step": 134857, "epoch": 802} {"train_loss": -10.777116775512695, "global_step": 134858, "epoch": 802} {"train_loss": -10.615839958190918, "global_step": 134859, "epoch": 802} {"train_loss": -10.701183319091797, "global_step": 134860, "epoch": 802} {"train_loss": -10.484930038452148, "global_step": 134861, "epoch": 802} {"train_loss": -10.621588706970215, "global_step": 134862, "epoch": 802} {"train_loss": -10.6551513671875, "global_step": 134863, "epoch": 802} {"train_loss": -10.396156311035156, "global_step": 134864, "epoch": 802} {"train_loss": -10.546070098876953, "global_step": 134865, "epoch": 802} {"train_loss": -10.51334285736084, "global_step": 134866, "epoch": 802} {"train_loss": -9.927266120910645, "global_step": 134867, "epoch": 802} {"train_loss": -10.363397598266602, "global_step": 134868, "epoch": 802} {"train_loss": -10.66865062713623, "global_step": 134869, "epoch": 802} {"train_loss": -10.137422561645508, "global_step": 134870, "epoch": 802} {"train_loss": -9.956571578979492, "global_step": 134871, "epoch": 802} {"train_loss": -10.642688751220703, "global_step": 134872, "epoch": 802} {"train_loss": -9.93464469909668, "global_step": 134873, "epoch": 802} {"train_loss": -10.54025936126709, "global_step": 134874, "epoch": 802} {"train_loss": -10.407696723937988, "global_step": 134875, "epoch": 802} {"train_loss": -9.799863815307617, "global_step": 134876, "epoch": 802} {"train_loss": -10.355293273925781, "global_step": 134877, "epoch": 802} {"train_loss": -10.33931827545166, "global_step": 134878, "epoch": 802} {"train_loss": -10.300752639770508, "global_step": 134879, "epoch": 802} {"train_loss": -10.658212661743164, "global_step": 134880, "epoch": 802} {"train_loss": -10.20067024230957, "global_step": 134881, "epoch": 802} {"train_loss": -10.563236236572266, "global_step": 134882, "epoch": 802} {"train_loss": -10.083927154541016, "global_step": 134883, "epoch": 802} {"train_loss": -10.521749496459961, "global_step": 134884, "epoch": 802} {"train_loss": -10.222524642944336, "global_step": 134885, "epoch": 802} {"train_loss": -10.50984001159668, "global_step": 134886, "epoch": 802} {"train_loss": -10.292413711547852, "global_step": 134887, "epoch": 802} {"train_loss": -10.371658325195312, "global_step": 134888, "epoch": 802} {"train_loss": -10.141006469726562, "global_step": 134889, "epoch": 802} {"train_loss": -10.030424118041992, "global_step": 134890, "epoch": 802} {"train_loss": -10.280023574829102, "global_step": 134891, "epoch": 802} {"train_loss": -10.351617813110352, "global_step": 134892, "epoch": 802} {"train_loss": -10.473626136779785, "global_step": 134893, "epoch": 802} {"train_loss": -10.301684379577637, "global_step": 134894, "epoch": 802} {"train_loss": -10.135391235351562, "global_step": 134895, "epoch": 802} {"train_loss": -10.439591407775879, "global_step": 134896, "epoch": 802} {"train_loss": -10.485925674438477, "global_step": 134897, "epoch": 802} {"train_loss": -10.279813766479492, "global_step": 134898, "epoch": 802} {"train_loss": -10.305885314941406, "global_step": 134899, "epoch": 802} {"train_loss": -10.367768287658691, "global_step": 134900, "epoch": 802} {"train_loss": -10.527965545654297, "global_step": 134901, "epoch": 802} {"train_loss": -10.511577606201172, "global_step": 134902, "epoch": 802} {"train_loss": -10.404818341845559, "global_step": 134903, "epoch": 802, "val_loss": 223444.015625} {"train_loss": -10.598114013671875, "global_step": 134904, "epoch": 803} {"train_loss": -10.060585021972656, "global_step": 134905, "epoch": 803} {"train_loss": -10.327860832214355, "global_step": 134906, "epoch": 803} {"train_loss": -10.351959228515625, "global_step": 134907, "epoch": 803} {"train_loss": -10.553832054138184, "global_step": 134908, "epoch": 803} {"train_loss": -10.288053512573242, "global_step": 134909, "epoch": 803} {"train_loss": -10.518143653869629, "global_step": 134910, "epoch": 803} {"train_loss": -10.234929084777832, "global_step": 134911, "epoch": 803} {"train_loss": -10.602239608764648, "global_step": 134912, "epoch": 803} {"train_loss": -10.180819511413574, "global_step": 134913, "epoch": 803} {"train_loss": -10.334875106811523, "global_step": 134914, "epoch": 803} {"train_loss": -10.687277793884277, "global_step": 134915, "epoch": 803} {"train_loss": -10.4514799118042, "global_step": 134916, "epoch": 803} {"train_loss": -10.311763763427734, "global_step": 134917, "epoch": 803} {"train_loss": -10.566266059875488, "global_step": 134918, "epoch": 803} {"train_loss": -10.537038803100586, "global_step": 134919, "epoch": 803} {"train_loss": -9.838939666748047, "global_step": 134920, "epoch": 803} {"train_loss": -10.433350563049316, "global_step": 134921, "epoch": 803} {"train_loss": -10.179390907287598, "global_step": 134922, "epoch": 803} {"train_loss": -10.614595413208008, "global_step": 134923, "epoch": 803} {"train_loss": -10.615660667419434, "global_step": 134924, "epoch": 803} {"train_loss": -10.373571395874023, "global_step": 134925, "epoch": 803} {"train_loss": -10.463393211364746, "global_step": 134926, "epoch": 803} {"train_loss": -10.091049194335938, "global_step": 134927, "epoch": 803} {"train_loss": -10.59804916381836, "global_step": 134928, "epoch": 803} {"train_loss": -10.552431106567383, "global_step": 134929, "epoch": 803} {"train_loss": -10.489253997802734, "global_step": 134930, "epoch": 803} {"train_loss": -10.447164535522461, "global_step": 134931, "epoch": 803} {"train_loss": -10.355531692504883, "global_step": 134932, "epoch": 803} {"train_loss": -10.67879581451416, "global_step": 134933, "epoch": 803} {"train_loss": -9.841583251953125, "global_step": 134934, "epoch": 803} {"train_loss": -10.778956413269043, "global_step": 134935, "epoch": 803} {"train_loss": -9.794087409973145, "global_step": 134936, "epoch": 803} {"train_loss": -10.296794891357422, "global_step": 134937, "epoch": 803} {"train_loss": -10.257380485534668, "global_step": 134938, "epoch": 803} {"train_loss": -10.020898818969727, "global_step": 134939, "epoch": 803} {"train_loss": -10.278457641601562, "global_step": 134940, "epoch": 803} {"train_loss": -9.963903427124023, "global_step": 134941, "epoch": 803} {"train_loss": -10.526594161987305, "global_step": 134942, "epoch": 803} {"train_loss": -9.970420837402344, "global_step": 134943, "epoch": 803} {"train_loss": -10.490504264831543, "global_step": 134944, "epoch": 803} {"train_loss": -10.276658058166504, "global_step": 134945, "epoch": 803} {"train_loss": -10.390803337097168, "global_step": 134946, "epoch": 803} {"train_loss": -10.091715812683105, "global_step": 134947, "epoch": 803} {"train_loss": -10.475650787353516, "global_step": 134948, "epoch": 803} {"train_loss": -10.675399780273438, "global_step": 134949, "epoch": 803} {"train_loss": -10.679524421691895, "global_step": 134950, "epoch": 803} {"train_loss": -10.210712432861328, "global_step": 134951, "epoch": 803} {"train_loss": -10.01821517944336, "global_step": 134952, "epoch": 803} {"train_loss": -10.163686752319336, "global_step": 134953, "epoch": 803} {"train_loss": -10.13548755645752, "global_step": 134954, "epoch": 803} {"train_loss": -10.58824348449707, "global_step": 134955, "epoch": 803} {"train_loss": -10.480093955993652, "global_step": 134956, "epoch": 803} {"train_loss": -10.12690544128418, "global_step": 134957, "epoch": 803} {"train_loss": -10.023514747619629, "global_step": 134958, "epoch": 803} {"train_loss": -10.497822761535645, "global_step": 134959, "epoch": 803} {"train_loss": -10.03300666809082, "global_step": 134960, "epoch": 803} {"train_loss": -10.583503723144531, "global_step": 134961, "epoch": 803} {"train_loss": -9.795177459716797, "global_step": 134962, "epoch": 803} {"train_loss": -10.085372924804688, "global_step": 134963, "epoch": 803} {"train_loss": -10.241905212402344, "global_step": 134964, "epoch": 803} {"train_loss": -10.471689224243164, "global_step": 134965, "epoch": 803} {"train_loss": -10.596555709838867, "global_step": 134966, "epoch": 803} {"train_loss": -10.074312210083008, "global_step": 134967, "epoch": 803} {"train_loss": -10.680990219116211, "global_step": 134968, "epoch": 803} {"train_loss": -10.190189361572266, "global_step": 134969, "epoch": 803} {"train_loss": -10.32358169555664, "global_step": 134970, "epoch": 803} {"train_loss": -10.377180099487305, "global_step": 134971, "epoch": 803} {"train_loss": -10.6083402633667, "global_step": 134972, "epoch": 803} {"train_loss": -10.439020156860352, "global_step": 134973, "epoch": 803} {"train_loss": -10.577516555786133, "global_step": 134974, "epoch": 803} {"train_loss": -10.620553970336914, "global_step": 134975, "epoch": 803} {"train_loss": -10.550607681274414, "global_step": 134976, "epoch": 803} {"train_loss": -10.805253982543945, "global_step": 134977, "epoch": 803} {"train_loss": -10.493844032287598, "global_step": 134978, "epoch": 803} {"train_loss": -10.714258193969727, "global_step": 134979, "epoch": 803} {"train_loss": -10.609046936035156, "global_step": 134980, "epoch": 803} {"train_loss": -10.406667709350586, "global_step": 134981, "epoch": 803} {"train_loss": -10.747747421264648, "global_step": 134982, "epoch": 803} {"train_loss": -10.454743385314941, "global_step": 134983, "epoch": 803} {"train_loss": -10.625566482543945, "global_step": 134984, "epoch": 803} {"train_loss": -10.456989288330078, "global_step": 134985, "epoch": 803} {"train_loss": -10.409402847290039, "global_step": 134986, "epoch": 803} {"train_loss": -10.721574783325195, "global_step": 134987, "epoch": 803} {"train_loss": -10.519347190856934, "global_step": 134988, "epoch": 803} {"train_loss": -10.644405364990234, "global_step": 134989, "epoch": 803} {"train_loss": -10.495906829833984, "global_step": 134990, "epoch": 803} {"train_loss": -10.460755348205566, "global_step": 134991, "epoch": 803} {"train_loss": -10.900503158569336, "global_step": 134992, "epoch": 803} {"train_loss": -10.417600631713867, "global_step": 134993, "epoch": 803} {"train_loss": -10.379667282104492, "global_step": 134994, "epoch": 803} {"train_loss": -10.585041046142578, "global_step": 134995, "epoch": 803} {"train_loss": -9.946842193603516, "global_step": 134996, "epoch": 803} {"train_loss": -10.477785110473633, "global_step": 134997, "epoch": 803} {"train_loss": -9.726455688476562, "global_step": 134998, "epoch": 803} {"train_loss": -10.091842651367188, "global_step": 134999, "epoch": 803} {"train_loss": -10.381622314453125, "global_step": 135000, "epoch": 803} {"train_loss": -10.056947708129883, "global_step": 135001, "epoch": 803} {"train_loss": -10.356987953186035, "global_step": 135002, "epoch": 803} {"train_loss": -9.838924407958984, "global_step": 135003, "epoch": 803} {"train_loss": -9.771465301513672, "global_step": 135004, "epoch": 803} {"train_loss": -9.52043342590332, "global_step": 135005, "epoch": 803} {"train_loss": -9.847576141357422, "global_step": 135006, "epoch": 803} {"train_loss": -10.175141334533691, "global_step": 135007, "epoch": 803} {"train_loss": -9.65739631652832, "global_step": 135008, "epoch": 803} {"train_loss": -10.400145530700684, "global_step": 135009, "epoch": 803} {"train_loss": -9.37317180633545, "global_step": 135010, "epoch": 803} {"train_loss": -9.994795799255371, "global_step": 135011, "epoch": 803} {"train_loss": -9.544944763183594, "global_step": 135012, "epoch": 803} {"train_loss": -10.21509075164795, "global_step": 135013, "epoch": 803} {"train_loss": -9.693138122558594, "global_step": 135014, "epoch": 803} {"train_loss": -10.336231231689453, "global_step": 135015, "epoch": 803} {"train_loss": -9.76538372039795, "global_step": 135016, "epoch": 803} {"train_loss": -10.375616073608398, "global_step": 135017, "epoch": 803} {"train_loss": -10.151466369628906, "global_step": 135018, "epoch": 803} {"train_loss": -10.340593338012695, "global_step": 135019, "epoch": 803} {"train_loss": -10.286040306091309, "global_step": 135020, "epoch": 803} {"train_loss": -10.4865140914917, "global_step": 135021, "epoch": 803} {"train_loss": -10.174190521240234, "global_step": 135022, "epoch": 803} {"train_loss": -10.335289001464844, "global_step": 135023, "epoch": 803} {"train_loss": -10.217679023742676, "global_step": 135024, "epoch": 803} {"train_loss": -10.303666114807129, "global_step": 135025, "epoch": 803} {"train_loss": -10.255697250366211, "global_step": 135026, "epoch": 803} {"train_loss": -10.441341400146484, "global_step": 135027, "epoch": 803} {"train_loss": -10.079817771911621, "global_step": 135028, "epoch": 803} {"train_loss": -10.493673324584961, "global_step": 135029, "epoch": 803} {"train_loss": -10.235066413879395, "global_step": 135030, "epoch": 803} {"train_loss": -10.450298309326172, "global_step": 135031, "epoch": 803} {"train_loss": -10.507433891296387, "global_step": 135032, "epoch": 803} {"train_loss": -10.58072280883789, "global_step": 135033, "epoch": 803} {"train_loss": -10.26036262512207, "global_step": 135034, "epoch": 803} {"train_loss": -10.396644592285156, "global_step": 135035, "epoch": 803} {"train_loss": -10.379619598388672, "global_step": 135036, "epoch": 803} {"train_loss": -10.294673919677734, "global_step": 135037, "epoch": 803} {"train_loss": -10.50168514251709, "global_step": 135038, "epoch": 803} {"train_loss": -10.198370933532715, "global_step": 135039, "epoch": 803} {"train_loss": -10.687601089477539, "global_step": 135040, "epoch": 803} {"train_loss": -10.388021469116211, "global_step": 135041, "epoch": 803} {"train_loss": -10.464544296264648, "global_step": 135042, "epoch": 803} {"train_loss": -10.117378234863281, "global_step": 135043, "epoch": 803} {"train_loss": -10.743963241577148, "global_step": 135044, "epoch": 803} {"train_loss": -10.233948707580566, "global_step": 135045, "epoch": 803} {"train_loss": -10.585566520690918, "global_step": 135046, "epoch": 803} {"train_loss": -10.072412490844727, "global_step": 135047, "epoch": 803} {"train_loss": -10.665271759033203, "global_step": 135048, "epoch": 803} {"train_loss": -10.411529541015625, "global_step": 135049, "epoch": 803} {"train_loss": -10.674324035644531, "global_step": 135050, "epoch": 803} {"train_loss": -10.452466011047363, "global_step": 135051, "epoch": 803} {"train_loss": -10.492547035217285, "global_step": 135052, "epoch": 803} {"train_loss": -10.60670280456543, "global_step": 135053, "epoch": 803} {"train_loss": -10.769388198852539, "global_step": 135054, "epoch": 803} {"train_loss": -10.743274688720703, "global_step": 135055, "epoch": 803} {"train_loss": -10.689414978027344, "global_step": 135056, "epoch": 803} {"train_loss": -10.641897201538086, "global_step": 135057, "epoch": 803} {"train_loss": -10.731945037841797, "global_step": 135058, "epoch": 803} {"train_loss": -10.497825622558594, "global_step": 135059, "epoch": 803} {"train_loss": -10.67412281036377, "global_step": 135060, "epoch": 803} {"train_loss": -10.238591194152832, "global_step": 135061, "epoch": 803} {"train_loss": -10.60639762878418, "global_step": 135062, "epoch": 803} {"train_loss": -10.305227279663086, "global_step": 135063, "epoch": 803} {"train_loss": -10.639541625976562, "global_step": 135064, "epoch": 803} {"train_loss": -10.529520034790039, "global_step": 135065, "epoch": 803} {"train_loss": -10.102361679077148, "global_step": 135066, "epoch": 803} {"train_loss": -10.207162857055664, "global_step": 135067, "epoch": 803} {"train_loss": -10.069229125976562, "global_step": 135068, "epoch": 803} {"train_loss": -10.399528503417969, "global_step": 135069, "epoch": 803} {"train_loss": -9.989141464233398, "global_step": 135070, "epoch": 803} {"train_loss": -10.346990335555304, "global_step": 135071, "epoch": 803, "val_loss": 222946.328125} {"train_loss": -9.404468536376953, "global_step": 135072, "epoch": 804} {"train_loss": -10.348106384277344, "global_step": 135073, "epoch": 804} {"train_loss": -10.362478256225586, "global_step": 135074, "epoch": 804} {"train_loss": -10.070623397827148, "global_step": 135075, "epoch": 804} {"train_loss": -10.32132339477539, "global_step": 135076, "epoch": 804} {"train_loss": -10.162530899047852, "global_step": 135077, "epoch": 804} {"train_loss": -10.351540565490723, "global_step": 135078, "epoch": 804} {"train_loss": -10.275127410888672, "global_step": 135079, "epoch": 804} {"train_loss": -10.291799545288086, "global_step": 135080, "epoch": 804} {"train_loss": -10.389373779296875, "global_step": 135081, "epoch": 804} {"train_loss": -10.447921752929688, "global_step": 135082, "epoch": 804} {"train_loss": -10.584798812866211, "global_step": 135083, "epoch": 804} {"train_loss": -10.377920150756836, "global_step": 135084, "epoch": 804} {"train_loss": -10.34836196899414, "global_step": 135085, "epoch": 804} {"train_loss": -10.378168106079102, "global_step": 135086, "epoch": 804} {"train_loss": -10.137343406677246, "global_step": 135087, "epoch": 804} {"train_loss": -10.26555061340332, "global_step": 135088, "epoch": 804} {"train_loss": -10.194197654724121, "global_step": 135089, "epoch": 804} {"train_loss": -10.207830429077148, "global_step": 135090, "epoch": 804} {"train_loss": -10.177231788635254, "global_step": 135091, "epoch": 804} {"train_loss": -9.570785522460938, "global_step": 135092, "epoch": 804} {"train_loss": -10.042768478393555, "global_step": 135093, "epoch": 804} {"train_loss": -9.681873321533203, "global_step": 135094, "epoch": 804} {"train_loss": -10.579126358032227, "global_step": 135095, "epoch": 804} {"train_loss": -10.052230834960938, "global_step": 135096, "epoch": 804} {"train_loss": -10.32040786743164, "global_step": 135097, "epoch": 804} {"train_loss": -10.364269256591797, "global_step": 135098, "epoch": 804} {"train_loss": -10.07229995727539, "global_step": 135099, "epoch": 804} {"train_loss": -10.338833808898926, "global_step": 135100, "epoch": 804} {"train_loss": -10.37470817565918, "global_step": 135101, "epoch": 804} {"train_loss": -10.222637176513672, "global_step": 135102, "epoch": 804} {"train_loss": -10.450540542602539, "global_step": 135103, "epoch": 804} {"train_loss": -10.156350135803223, "global_step": 135104, "epoch": 804} {"train_loss": -10.290929794311523, "global_step": 135105, "epoch": 804} {"train_loss": -10.549667358398438, "global_step": 135106, "epoch": 804} {"train_loss": -10.409422874450684, "global_step": 135107, "epoch": 804} {"train_loss": -10.053529739379883, "global_step": 135108, "epoch": 804} {"train_loss": -10.34305191040039, "global_step": 135109, "epoch": 804} {"train_loss": -9.991904258728027, "global_step": 135110, "epoch": 804} {"train_loss": -10.332258224487305, "global_step": 135111, "epoch": 804} {"train_loss": -10.04051399230957, "global_step": 135112, "epoch": 804} {"train_loss": -10.313188552856445, "global_step": 135113, "epoch": 804} {"train_loss": -10.05311393737793, "global_step": 135114, "epoch": 804} {"train_loss": -10.365028381347656, "global_step": 135115, "epoch": 804} {"train_loss": -9.949052810668945, "global_step": 135116, "epoch": 804} {"train_loss": -10.34424877166748, "global_step": 135117, "epoch": 804} {"train_loss": -10.395637512207031, "global_step": 135118, "epoch": 804} {"train_loss": -10.254150390625, "global_step": 135119, "epoch": 804} {"train_loss": -10.620511054992676, "global_step": 135120, "epoch": 804} {"train_loss": -10.079556465148926, "global_step": 135121, "epoch": 804} {"train_loss": -10.286877632141113, "global_step": 135122, "epoch": 804} {"train_loss": -10.524169921875, "global_step": 135123, "epoch": 804} {"train_loss": -10.529139518737793, "global_step": 135124, "epoch": 804} {"train_loss": -10.710077285766602, "global_step": 135125, "epoch": 804} {"train_loss": -10.679789543151855, "global_step": 135126, "epoch": 804} {"train_loss": -10.30534839630127, "global_step": 135127, "epoch": 804} {"train_loss": -10.604795455932617, "global_step": 135128, "epoch": 804} {"train_loss": -10.686920166015625, "global_step": 135129, "epoch": 804} {"train_loss": -10.544376373291016, "global_step": 135130, "epoch": 804} {"train_loss": -10.639347076416016, "global_step": 135131, "epoch": 804} {"train_loss": -10.686117172241211, "global_step": 135132, "epoch": 804} {"train_loss": -10.774629592895508, "global_step": 135133, "epoch": 804} {"train_loss": -10.670391082763672, "global_step": 135134, "epoch": 804} {"train_loss": -10.76467227935791, "global_step": 135135, "epoch": 804} {"train_loss": -10.80946159362793, "global_step": 135136, "epoch": 804} {"train_loss": -10.698047637939453, "global_step": 135137, "epoch": 804} {"train_loss": -10.755428314208984, "global_step": 135138, "epoch": 804} {"train_loss": -10.87153434753418, "global_step": 135139, "epoch": 804} {"train_loss": -10.626758575439453, "global_step": 135140, "epoch": 804} {"train_loss": -10.6987886428833, "global_step": 135141, "epoch": 804} {"train_loss": -10.667579650878906, "global_step": 135142, "epoch": 804} {"train_loss": -10.569622039794922, "global_step": 135143, "epoch": 804} {"train_loss": -10.578550338745117, "global_step": 135144, "epoch": 804} {"train_loss": -10.704000473022461, "global_step": 135145, "epoch": 804} {"train_loss": -10.642667770385742, "global_step": 135146, "epoch": 804} {"train_loss": -10.292007446289062, "global_step": 135147, "epoch": 804} {"train_loss": -10.446687698364258, "global_step": 135148, "epoch": 804} {"train_loss": -9.962127685546875, "global_step": 135149, "epoch": 804} {"train_loss": -9.779943466186523, "global_step": 135150, "epoch": 804} {"train_loss": -9.974493980407715, "global_step": 135151, "epoch": 804} {"train_loss": -10.380996704101562, "global_step": 135152, "epoch": 804} {"train_loss": -9.938179969787598, "global_step": 135153, "epoch": 804} {"train_loss": -9.977703094482422, "global_step": 135154, "epoch": 804} {"train_loss": -10.405900955200195, "global_step": 135155, "epoch": 804} {"train_loss": -9.887941360473633, "global_step": 135156, "epoch": 804} {"train_loss": -9.962852478027344, "global_step": 135157, "epoch": 804} {"train_loss": -9.909284591674805, "global_step": 135158, "epoch": 804} {"train_loss": -9.563779830932617, "global_step": 135159, "epoch": 804} {"train_loss": -9.868427276611328, "global_step": 135160, "epoch": 804} {"train_loss": -9.889607429504395, "global_step": 135161, "epoch": 804} {"train_loss": -10.2598876953125, "global_step": 135162, "epoch": 804} {"train_loss": -10.069681167602539, "global_step": 135163, "epoch": 804} {"train_loss": -10.412920951843262, "global_step": 135164, "epoch": 804} {"train_loss": -10.000986099243164, "global_step": 135165, "epoch": 804} {"train_loss": -10.342059135437012, "global_step": 135166, "epoch": 804} {"train_loss": -10.151942253112793, "global_step": 135167, "epoch": 804} {"train_loss": -10.439010620117188, "global_step": 135168, "epoch": 804} {"train_loss": -10.043752670288086, "global_step": 135169, "epoch": 804} {"train_loss": -10.592695236206055, "global_step": 135170, "epoch": 804} {"train_loss": -10.00132942199707, "global_step": 135171, "epoch": 804} {"train_loss": -10.594219207763672, "global_step": 135172, "epoch": 804} {"train_loss": -10.305130004882812, "global_step": 135173, "epoch": 804} {"train_loss": -10.602025985717773, "global_step": 135174, "epoch": 804} {"train_loss": -10.286173820495605, "global_step": 135175, "epoch": 804} {"train_loss": -10.487374305725098, "global_step": 135176, "epoch": 804} {"train_loss": -10.268045425415039, "global_step": 135177, "epoch": 804} {"train_loss": -10.703901290893555, "global_step": 135178, "epoch": 804} {"train_loss": -10.024139404296875, "global_step": 135179, "epoch": 804} {"train_loss": -10.662481307983398, "global_step": 135180, "epoch": 804} {"train_loss": -10.323049545288086, "global_step": 135181, "epoch": 804} {"train_loss": -10.532022476196289, "global_step": 135182, "epoch": 804} {"train_loss": -10.414997100830078, "global_step": 135183, "epoch": 804} {"train_loss": -10.362576484680176, "global_step": 135184, "epoch": 804} {"train_loss": -10.010555267333984, "global_step": 135185, "epoch": 804} {"train_loss": -10.40261173248291, "global_step": 135186, "epoch": 804} {"train_loss": -10.202351570129395, "global_step": 135187, "epoch": 804} {"train_loss": -10.384474754333496, "global_step": 135188, "epoch": 804} {"train_loss": -10.500165939331055, "global_step": 135189, "epoch": 804} {"train_loss": -10.275751113891602, "global_step": 135190, "epoch": 804} {"train_loss": -10.636905670166016, "global_step": 135191, "epoch": 804} {"train_loss": -10.604907989501953, "global_step": 135192, "epoch": 804} {"train_loss": -10.333717346191406, "global_step": 135193, "epoch": 804} {"train_loss": -10.848970413208008, "global_step": 135194, "epoch": 804} {"train_loss": -10.608630180358887, "global_step": 135195, "epoch": 804} {"train_loss": -10.7034912109375, "global_step": 135196, "epoch": 804} {"train_loss": -10.549737930297852, "global_step": 135197, "epoch": 804} {"train_loss": -10.320322036743164, "global_step": 135198, "epoch": 804} {"train_loss": -10.577417373657227, "global_step": 135199, "epoch": 804} {"train_loss": -10.754785537719727, "global_step": 135200, "epoch": 804} {"train_loss": -10.433219909667969, "global_step": 135201, "epoch": 804} {"train_loss": -10.573174476623535, "global_step": 135202, "epoch": 804} {"train_loss": -10.82830810546875, "global_step": 135203, "epoch": 804} {"train_loss": -10.771808624267578, "global_step": 135204, "epoch": 804} {"train_loss": -10.399539947509766, "global_step": 135205, "epoch": 804} {"train_loss": -10.398146629333496, "global_step": 135206, "epoch": 804} {"train_loss": -10.530502319335938, "global_step": 135207, "epoch": 804} {"train_loss": -10.629859924316406, "global_step": 135208, "epoch": 804} {"train_loss": -10.520650863647461, "global_step": 135209, "epoch": 804} {"train_loss": -10.16476058959961, "global_step": 135210, "epoch": 804} {"train_loss": -10.607017517089844, "global_step": 135211, "epoch": 804} {"train_loss": -10.337532997131348, "global_step": 135212, "epoch": 804} {"train_loss": -10.579618453979492, "global_step": 135213, "epoch": 804} {"train_loss": -10.4166841506958, "global_step": 135214, "epoch": 804} {"train_loss": -10.28797721862793, "global_step": 135215, "epoch": 804} {"train_loss": -10.660415649414062, "global_step": 135216, "epoch": 804} {"train_loss": -10.12797737121582, "global_step": 135217, "epoch": 804} {"train_loss": -10.282142639160156, "global_step": 135218, "epoch": 804} {"train_loss": -10.532536506652832, "global_step": 135219, "epoch": 804} {"train_loss": -10.056145668029785, "global_step": 135220, "epoch": 804} {"train_loss": -10.648648262023926, "global_step": 135221, "epoch": 804} {"train_loss": -10.472297668457031, "global_step": 135222, "epoch": 804} {"train_loss": -9.894487380981445, "global_step": 135223, "epoch": 804} {"train_loss": -9.961360931396484, "global_step": 135224, "epoch": 804} {"train_loss": -10.426847457885742, "global_step": 135225, "epoch": 804} {"train_loss": -9.705577850341797, "global_step": 135226, "epoch": 804} {"train_loss": -10.372872352600098, "global_step": 135227, "epoch": 804} {"train_loss": -9.30645751953125, "global_step": 135228, "epoch": 804} {"train_loss": -10.294690132141113, "global_step": 135229, "epoch": 804} {"train_loss": -9.771854400634766, "global_step": 135230, "epoch": 804} {"train_loss": -10.39486312866211, "global_step": 135231, "epoch": 804} {"train_loss": -10.01832389831543, "global_step": 135232, "epoch": 804} {"train_loss": -10.28110122680664, "global_step": 135233, "epoch": 804} {"train_loss": -10.056922912597656, "global_step": 135234, "epoch": 804} {"train_loss": -10.0178861618042, "global_step": 135235, "epoch": 804} {"train_loss": -10.0930757522583, "global_step": 135236, "epoch": 804} {"train_loss": -10.096402168273926, "global_step": 135237, "epoch": 804} {"train_loss": -10.367413520812988, "global_step": 135238, "epoch": 804} {"train_loss": -10.325786817641486, "global_step": 135239, "epoch": 804, "val_loss": 222144.171875} {"train_loss": -10.19029426574707, "global_step": 135240, "epoch": 805} {"train_loss": -10.200958251953125, "global_step": 135241, "epoch": 805} {"train_loss": -10.04083251953125, "global_step": 135242, "epoch": 805} {"train_loss": -10.050749778747559, "global_step": 135243, "epoch": 805} {"train_loss": -10.241546630859375, "global_step": 135244, "epoch": 805} {"train_loss": -10.152352333068848, "global_step": 135245, "epoch": 805} {"train_loss": -10.690576553344727, "global_step": 135246, "epoch": 805} {"train_loss": -10.377819061279297, "global_step": 135247, "epoch": 805} {"train_loss": -10.303083419799805, "global_step": 135248, "epoch": 805} {"train_loss": -10.521892547607422, "global_step": 135249, "epoch": 805} {"train_loss": -10.365066528320312, "global_step": 135250, "epoch": 805} {"train_loss": -10.385254859924316, "global_step": 135251, "epoch": 805} {"train_loss": -10.36929988861084, "global_step": 135252, "epoch": 805} {"train_loss": -10.593841552734375, "global_step": 135253, "epoch": 805} {"train_loss": -10.152849197387695, "global_step": 135254, "epoch": 805} {"train_loss": -10.414422988891602, "global_step": 135255, "epoch": 805} {"train_loss": -10.674034118652344, "global_step": 135256, "epoch": 805} {"train_loss": -10.118175506591797, "global_step": 135257, "epoch": 805} {"train_loss": -10.592552185058594, "global_step": 135258, "epoch": 805} {"train_loss": -10.359365463256836, "global_step": 135259, "epoch": 805} {"train_loss": -10.317841529846191, "global_step": 135260, "epoch": 805} {"train_loss": -10.767098426818848, "global_step": 135261, "epoch": 805} {"train_loss": -10.432735443115234, "global_step": 135262, "epoch": 805} {"train_loss": -10.515007972717285, "global_step": 135263, "epoch": 805} {"train_loss": -10.627674102783203, "global_step": 135264, "epoch": 805} {"train_loss": -10.677591323852539, "global_step": 135265, "epoch": 805} {"train_loss": -10.083635330200195, "global_step": 135266, "epoch": 805} {"train_loss": -10.488037109375, "global_step": 135267, "epoch": 805} {"train_loss": -10.41443920135498, "global_step": 135268, "epoch": 805} {"train_loss": -10.564961433410645, "global_step": 135269, "epoch": 805} {"train_loss": -10.66590690612793, "global_step": 135270, "epoch": 805} {"train_loss": -10.552566528320312, "global_step": 135271, "epoch": 805} {"train_loss": -10.692720413208008, "global_step": 135272, "epoch": 805} {"train_loss": -10.854766845703125, "global_step": 135273, "epoch": 805} {"train_loss": -10.805212020874023, "global_step": 135274, "epoch": 805} {"train_loss": -10.59447956085205, "global_step": 135275, "epoch": 805} {"train_loss": -10.829402923583984, "global_step": 135276, "epoch": 805} {"train_loss": -10.783127784729004, "global_step": 135277, "epoch": 805} {"train_loss": -10.838876724243164, "global_step": 135278, "epoch": 805} {"train_loss": -10.584415435791016, "global_step": 135279, "epoch": 805} {"train_loss": -10.786641120910645, "global_step": 135280, "epoch": 805} {"train_loss": -10.672332763671875, "global_step": 135281, "epoch": 805} {"train_loss": -10.58940601348877, "global_step": 135282, "epoch": 805} {"train_loss": -10.697944641113281, "global_step": 135283, "epoch": 805} {"train_loss": -10.883901596069336, "global_step": 135284, "epoch": 805} {"train_loss": -10.670801162719727, "global_step": 135285, "epoch": 805} {"train_loss": -10.877239227294922, "global_step": 135286, "epoch": 805} {"train_loss": -10.717070579528809, "global_step": 135287, "epoch": 805} {"train_loss": -10.785950660705566, "global_step": 135288, "epoch": 805} {"train_loss": -10.657188415527344, "global_step": 135289, "epoch": 805} {"train_loss": -10.63662338256836, "global_step": 135290, "epoch": 805} {"train_loss": -10.423395156860352, "global_step": 135291, "epoch": 805} {"train_loss": -10.132389068603516, "global_step": 135292, "epoch": 805} {"train_loss": -10.865421295166016, "global_step": 135293, "epoch": 805} {"train_loss": -10.344769477844238, "global_step": 135294, "epoch": 805} {"train_loss": -10.18135929107666, "global_step": 135295, "epoch": 805} {"train_loss": -10.278095245361328, "global_step": 135296, "epoch": 805} {"train_loss": -10.698663711547852, "global_step": 135297, "epoch": 805} {"train_loss": -10.567035675048828, "global_step": 135298, "epoch": 805} {"train_loss": -10.359292030334473, "global_step": 135299, "epoch": 805} {"train_loss": -10.46760368347168, "global_step": 135300, "epoch": 805} {"train_loss": -10.522192001342773, "global_step": 135301, "epoch": 805} {"train_loss": -9.988626480102539, "global_step": 135302, "epoch": 805} {"train_loss": -9.661101341247559, "global_step": 135303, "epoch": 805} {"train_loss": -10.482595443725586, "global_step": 135304, "epoch": 805} {"train_loss": -9.364439010620117, "global_step": 135305, "epoch": 805} {"train_loss": -10.13786792755127, "global_step": 135306, "epoch": 805} {"train_loss": -10.396852493286133, "global_step": 135307, "epoch": 805} {"train_loss": -9.73967170715332, "global_step": 135308, "epoch": 805} {"train_loss": -10.63176441192627, "global_step": 135309, "epoch": 805} {"train_loss": -9.968229293823242, "global_step": 135310, "epoch": 805} {"train_loss": -10.513045310974121, "global_step": 135311, "epoch": 805} {"train_loss": -10.100234985351562, "global_step": 135312, "epoch": 805} {"train_loss": -9.726085662841797, "global_step": 135313, "epoch": 805} {"train_loss": -10.169656753540039, "global_step": 135314, "epoch": 805} {"train_loss": -9.794393539428711, "global_step": 135315, "epoch": 805} {"train_loss": -10.315162658691406, "global_step": 135316, "epoch": 805} {"train_loss": -10.401473045349121, "global_step": 135317, "epoch": 805} {"train_loss": -10.325248718261719, "global_step": 135318, "epoch": 805} {"train_loss": -10.06026840209961, "global_step": 135319, "epoch": 805} {"train_loss": -10.451065063476562, "global_step": 135320, "epoch": 805} {"train_loss": -10.050128936767578, "global_step": 135321, "epoch": 805} {"train_loss": -10.299833297729492, "global_step": 135322, "epoch": 805} {"train_loss": -10.329358100891113, "global_step": 135323, "epoch": 805} {"train_loss": -9.973345756530762, "global_step": 135324, "epoch": 805} {"train_loss": -10.506027221679688, "global_step": 135325, "epoch": 805} {"train_loss": -10.32214641571045, "global_step": 135326, "epoch": 805} {"train_loss": -10.25770378112793, "global_step": 135327, "epoch": 805} {"train_loss": -10.522335052490234, "global_step": 135328, "epoch": 805} {"train_loss": -10.29373550415039, "global_step": 135329, "epoch": 805} {"train_loss": -10.172120094299316, "global_step": 135330, "epoch": 805} {"train_loss": -10.252325057983398, "global_step": 135331, "epoch": 805} {"train_loss": -10.315114974975586, "global_step": 135332, "epoch": 805} {"train_loss": -10.322015762329102, "global_step": 135333, "epoch": 805} {"train_loss": -10.574369430541992, "global_step": 135334, "epoch": 805} {"train_loss": -10.1463041305542, "global_step": 135335, "epoch": 805} {"train_loss": -10.446529388427734, "global_step": 135336, "epoch": 805} {"train_loss": -10.715241432189941, "global_step": 135337, "epoch": 805} {"train_loss": -10.31319808959961, "global_step": 135338, "epoch": 805} {"train_loss": -10.464920043945312, "global_step": 135339, "epoch": 805} {"train_loss": -10.144084930419922, "global_step": 135340, "epoch": 805} {"train_loss": -10.417877197265625, "global_step": 135341, "epoch": 805} {"train_loss": -10.384448051452637, "global_step": 135342, "epoch": 805} {"train_loss": -10.541550636291504, "global_step": 135343, "epoch": 805} {"train_loss": -10.523073196411133, "global_step": 135344, "epoch": 805} {"train_loss": -10.551336288452148, "global_step": 135345, "epoch": 805} {"train_loss": -10.442554473876953, "global_step": 135346, "epoch": 805} {"train_loss": -10.446035385131836, "global_step": 135347, "epoch": 805} {"train_loss": -10.345913887023926, "global_step": 135348, "epoch": 805} {"train_loss": -10.569661140441895, "global_step": 135349, "epoch": 805} {"train_loss": -10.797347068786621, "global_step": 135350, "epoch": 805} {"train_loss": -10.505870819091797, "global_step": 135351, "epoch": 805} {"train_loss": -10.78060531616211, "global_step": 135352, "epoch": 805} {"train_loss": -10.584630966186523, "global_step": 135353, "epoch": 805} {"train_loss": -10.551605224609375, "global_step": 135354, "epoch": 805} {"train_loss": -10.444908142089844, "global_step": 135355, "epoch": 805} {"train_loss": -10.71818733215332, "global_step": 135356, "epoch": 805} {"train_loss": -10.58356761932373, "global_step": 135357, "epoch": 805} {"train_loss": -10.59623908996582, "global_step": 135358, "epoch": 805} {"train_loss": -10.606433868408203, "global_step": 135359, "epoch": 805} {"train_loss": -10.487348556518555, "global_step": 135360, "epoch": 805} {"train_loss": -10.77825927734375, "global_step": 135361, "epoch": 805} {"train_loss": -10.51470947265625, "global_step": 135362, "epoch": 805} {"train_loss": -10.384151458740234, "global_step": 135363, "epoch": 805} {"train_loss": -10.451881408691406, "global_step": 135364, "epoch": 805} {"train_loss": -10.554078102111816, "global_step": 135365, "epoch": 805} {"train_loss": -10.804166793823242, "global_step": 135366, "epoch": 805} {"train_loss": -10.64400863647461, "global_step": 135367, "epoch": 805} {"train_loss": -10.504610061645508, "global_step": 135368, "epoch": 805} {"train_loss": -10.551766395568848, "global_step": 135369, "epoch": 805} {"train_loss": -10.100510597229004, "global_step": 135370, "epoch": 805} {"train_loss": -10.812904357910156, "global_step": 135371, "epoch": 805} {"train_loss": -10.342547416687012, "global_step": 135372, "epoch": 805} {"train_loss": -10.640151977539062, "global_step": 135373, "epoch": 805} {"train_loss": -10.304981231689453, "global_step": 135374, "epoch": 805} {"train_loss": -10.687731742858887, "global_step": 135375, "epoch": 805} {"train_loss": -10.678695678710938, "global_step": 135376, "epoch": 805} {"train_loss": -10.682750701904297, "global_step": 135377, "epoch": 805} {"train_loss": -10.566718101501465, "global_step": 135378, "epoch": 805} {"train_loss": -10.6593017578125, "global_step": 135379, "epoch": 805} {"train_loss": -10.591063499450684, "global_step": 135380, "epoch": 805} {"train_loss": -10.6973876953125, "global_step": 135381, "epoch": 805} {"train_loss": -10.757089614868164, "global_step": 135382, "epoch": 805} {"train_loss": -10.268954277038574, "global_step": 135383, "epoch": 805} {"train_loss": -10.760903358459473, "global_step": 135384, "epoch": 805} {"train_loss": -10.402799606323242, "global_step": 135385, "epoch": 805} {"train_loss": -10.379182815551758, "global_step": 135386, "epoch": 805} {"train_loss": -10.639032363891602, "global_step": 135387, "epoch": 805} {"train_loss": -10.802114486694336, "global_step": 135388, "epoch": 805} {"train_loss": -10.553112983703613, "global_step": 135389, "epoch": 805} {"train_loss": -10.475013732910156, "global_step": 135390, "epoch": 805} {"train_loss": -10.75397777557373, "global_step": 135391, "epoch": 805} {"train_loss": -10.575100898742676, "global_step": 135392, "epoch": 805} {"train_loss": -10.571075439453125, "global_step": 135393, "epoch": 805} {"train_loss": -10.543096542358398, "global_step": 135394, "epoch": 805} {"train_loss": -10.622221946716309, "global_step": 135395, "epoch": 805} {"train_loss": -10.429193496704102, "global_step": 135396, "epoch": 805} {"train_loss": -10.433868408203125, "global_step": 135397, "epoch": 805} {"train_loss": -10.482776641845703, "global_step": 135398, "epoch": 805} {"train_loss": -10.190361022949219, "global_step": 135399, "epoch": 805} {"train_loss": -10.45793342590332, "global_step": 135400, "epoch": 805} {"train_loss": -10.44485855102539, "global_step": 135401, "epoch": 805} {"train_loss": -10.288251876831055, "global_step": 135402, "epoch": 805} {"train_loss": -10.226566314697266, "global_step": 135403, "epoch": 805} {"train_loss": -10.27802848815918, "global_step": 135404, "epoch": 805} {"train_loss": -10.249292373657227, "global_step": 135405, "epoch": 805} {"train_loss": -10.43355941772461, "global_step": 135406, "epoch": 805} {"train_loss": -10.4460608959198, "global_step": 135407, "epoch": 805, "val_loss": 223430.5625, "train_action_mse_error": 5.929654598236084} {"train_loss": -10.175045013427734, "global_step": 135408, "epoch": 806} {"train_loss": -9.981500625610352, "global_step": 135409, "epoch": 806} {"train_loss": -10.173338890075684, "global_step": 135410, "epoch": 806} {"train_loss": -9.810587882995605, "global_step": 135411, "epoch": 806} {"train_loss": -10.085321426391602, "global_step": 135412, "epoch": 806} {"train_loss": -9.835854530334473, "global_step": 135413, "epoch": 806} {"train_loss": -10.037841796875, "global_step": 135414, "epoch": 806} {"train_loss": -10.160512924194336, "global_step": 135415, "epoch": 806} {"train_loss": -9.717620849609375, "global_step": 135416, "epoch": 806} {"train_loss": -10.43710708618164, "global_step": 135417, "epoch": 806} {"train_loss": -9.741018295288086, "global_step": 135418, "epoch": 806} {"train_loss": -9.543220520019531, "global_step": 135419, "epoch": 806} {"train_loss": -9.838252067565918, "global_step": 135420, "epoch": 806} {"train_loss": -9.58299732208252, "global_step": 135421, "epoch": 806} {"train_loss": -9.622825622558594, "global_step": 135422, "epoch": 806} {"train_loss": -9.848894119262695, "global_step": 135423, "epoch": 806} {"train_loss": -9.939355850219727, "global_step": 135424, "epoch": 806} {"train_loss": -9.4775972366333, "global_step": 135425, "epoch": 806} {"train_loss": -9.821271896362305, "global_step": 135426, "epoch": 806} {"train_loss": -9.491411209106445, "global_step": 135427, "epoch": 806} {"train_loss": -9.873157501220703, "global_step": 135428, "epoch": 806} {"train_loss": -9.946395874023438, "global_step": 135429, "epoch": 806} {"train_loss": -9.969341278076172, "global_step": 135430, "epoch": 806} {"train_loss": -10.096956253051758, "global_step": 135431, "epoch": 806} {"train_loss": -10.196941375732422, "global_step": 135432, "epoch": 806} {"train_loss": -9.946008682250977, "global_step": 135433, "epoch": 806} {"train_loss": -10.006240844726562, "global_step": 135434, "epoch": 806} {"train_loss": -10.207892417907715, "global_step": 135435, "epoch": 806} {"train_loss": -10.366052627563477, "global_step": 135436, "epoch": 806} {"train_loss": -10.198688507080078, "global_step": 135437, "epoch": 806} {"train_loss": -10.313129425048828, "global_step": 135438, "epoch": 806} {"train_loss": -10.226675033569336, "global_step": 135439, "epoch": 806} {"train_loss": -10.436172485351562, "global_step": 135440, "epoch": 806} {"train_loss": -10.193862915039062, "global_step": 135441, "epoch": 806} {"train_loss": -10.219772338867188, "global_step": 135442, "epoch": 806} {"train_loss": -10.409106254577637, "global_step": 135443, "epoch": 806} {"train_loss": -10.442959785461426, "global_step": 135444, "epoch": 806} {"train_loss": -10.36709976196289, "global_step": 135445, "epoch": 806} {"train_loss": -10.666223526000977, "global_step": 135446, "epoch": 806} {"train_loss": -10.474441528320312, "global_step": 135447, "epoch": 806} {"train_loss": -10.295681953430176, "global_step": 135448, "epoch": 806} {"train_loss": -10.495048522949219, "global_step": 135449, "epoch": 806} {"train_loss": -10.227222442626953, "global_step": 135450, "epoch": 806} {"train_loss": -10.721526145935059, "global_step": 135451, "epoch": 806} {"train_loss": -10.65719985961914, "global_step": 135452, "epoch": 806} {"train_loss": -10.627008438110352, "global_step": 135453, "epoch": 806} {"train_loss": -10.716272354125977, "global_step": 135454, "epoch": 806} {"train_loss": -10.592611312866211, "global_step": 135455, "epoch": 806} {"train_loss": -10.588348388671875, "global_step": 135456, "epoch": 806} {"train_loss": -10.514291763305664, "global_step": 135457, "epoch": 806} {"train_loss": -10.511383056640625, "global_step": 135458, "epoch": 806} {"train_loss": -10.773308753967285, "global_step": 135459, "epoch": 806} {"train_loss": -10.603370666503906, "global_step": 135460, "epoch": 806} {"train_loss": -10.517229080200195, "global_step": 135461, "epoch": 806} {"train_loss": -10.633890151977539, "global_step": 135462, "epoch": 806} {"train_loss": -10.625577926635742, "global_step": 135463, "epoch": 806} {"train_loss": -10.794517517089844, "global_step": 135464, "epoch": 806} {"train_loss": -10.709442138671875, "global_step": 135465, "epoch": 806} {"train_loss": -10.853129386901855, "global_step": 135466, "epoch": 806} {"train_loss": -10.368648529052734, "global_step": 135467, "epoch": 806} {"train_loss": -10.657828330993652, "global_step": 135468, "epoch": 806} {"train_loss": -10.886560440063477, "global_step": 135469, "epoch": 806} {"train_loss": -10.72494125366211, "global_step": 135470, "epoch": 806} {"train_loss": -10.806974411010742, "global_step": 135471, "epoch": 806} {"train_loss": -10.768338203430176, "global_step": 135472, "epoch": 806} {"train_loss": -10.838133811950684, "global_step": 135473, "epoch": 806} {"train_loss": -10.98681354522705, "global_step": 135474, "epoch": 806} {"train_loss": -10.751043319702148, "global_step": 135475, "epoch": 806} {"train_loss": -10.816125869750977, "global_step": 135476, "epoch": 806} {"train_loss": -10.319494247436523, "global_step": 135477, "epoch": 806} {"train_loss": -10.824362754821777, "global_step": 135478, "epoch": 806} {"train_loss": -10.583187103271484, "global_step": 135479, "epoch": 806} {"train_loss": -10.515837669372559, "global_step": 135480, "epoch": 806} {"train_loss": -10.661548614501953, "global_step": 135481, "epoch": 806} {"train_loss": -10.671188354492188, "global_step": 135482, "epoch": 806} {"train_loss": -10.624956130981445, "global_step": 135483, "epoch": 806} {"train_loss": -10.672381401062012, "global_step": 135484, "epoch": 806} {"train_loss": -10.647603988647461, "global_step": 135485, "epoch": 806} {"train_loss": -10.361862182617188, "global_step": 135486, "epoch": 806} {"train_loss": -10.468914031982422, "global_step": 135487, "epoch": 806} {"train_loss": -10.523359298706055, "global_step": 135488, "epoch": 806} {"train_loss": -10.69283676147461, "global_step": 135489, "epoch": 806} {"train_loss": -10.515569686889648, "global_step": 135490, "epoch": 806} {"train_loss": -10.473010063171387, "global_step": 135491, "epoch": 806} {"train_loss": -10.557018280029297, "global_step": 135492, "epoch": 806} {"train_loss": -10.953533172607422, "global_step": 135493, "epoch": 806} {"train_loss": -10.318201065063477, "global_step": 135494, "epoch": 806} {"train_loss": -10.637929916381836, "global_step": 135495, "epoch": 806} {"train_loss": -10.442605018615723, "global_step": 135496, "epoch": 806} {"train_loss": -10.791114807128906, "global_step": 135497, "epoch": 806} {"train_loss": -10.69906997680664, "global_step": 135498, "epoch": 806} {"train_loss": -10.554788589477539, "global_step": 135499, "epoch": 806} {"train_loss": -10.135782241821289, "global_step": 135500, "epoch": 806} {"train_loss": -10.187183380126953, "global_step": 135501, "epoch": 806} {"train_loss": -10.40689468383789, "global_step": 135502, "epoch": 806} {"train_loss": -10.030230522155762, "global_step": 135503, "epoch": 806} {"train_loss": -9.802595138549805, "global_step": 135504, "epoch": 806} {"train_loss": -10.037126541137695, "global_step": 135505, "epoch": 806} {"train_loss": -10.28454303741455, "global_step": 135506, "epoch": 806} {"train_loss": -10.33219051361084, "global_step": 135507, "epoch": 806} {"train_loss": -10.247995376586914, "global_step": 135508, "epoch": 806} {"train_loss": -10.170242309570312, "global_step": 135509, "epoch": 806} {"train_loss": -10.472074508666992, "global_step": 135510, "epoch": 806} {"train_loss": -10.332930564880371, "global_step": 135511, "epoch": 806} {"train_loss": -10.274574279785156, "global_step": 135512, "epoch": 806} {"train_loss": -10.320544242858887, "global_step": 135513, "epoch": 806} {"train_loss": -10.388656616210938, "global_step": 135514, "epoch": 806} {"train_loss": -10.387449264526367, "global_step": 135515, "epoch": 806} {"train_loss": -10.426198959350586, "global_step": 135516, "epoch": 806} {"train_loss": -10.68875789642334, "global_step": 135517, "epoch": 806} {"train_loss": -10.536958694458008, "global_step": 135518, "epoch": 806} {"train_loss": -10.397211074829102, "global_step": 135519, "epoch": 806} {"train_loss": -10.460592269897461, "global_step": 135520, "epoch": 806} {"train_loss": -10.627852439880371, "global_step": 135521, "epoch": 806} {"train_loss": -10.384617805480957, "global_step": 135522, "epoch": 806} {"train_loss": -10.711841583251953, "global_step": 135523, "epoch": 806} {"train_loss": -10.485818862915039, "global_step": 135524, "epoch": 806} {"train_loss": -10.675193786621094, "global_step": 135525, "epoch": 806} {"train_loss": -10.690326690673828, "global_step": 135526, "epoch": 806} {"train_loss": -10.650224685668945, "global_step": 135527, "epoch": 806} {"train_loss": -10.677289009094238, "global_step": 135528, "epoch": 806} {"train_loss": -10.445805549621582, "global_step": 135529, "epoch": 806} {"train_loss": -10.512092590332031, "global_step": 135530, "epoch": 806} {"train_loss": -10.264501571655273, "global_step": 135531, "epoch": 806} {"train_loss": -10.55801010131836, "global_step": 135532, "epoch": 806} {"train_loss": -10.712547302246094, "global_step": 135533, "epoch": 806} {"train_loss": -10.299933433532715, "global_step": 135534, "epoch": 806} {"train_loss": -10.63497543334961, "global_step": 135535, "epoch": 806} {"train_loss": -10.50446891784668, "global_step": 135536, "epoch": 806} {"train_loss": -10.661422729492188, "global_step": 135537, "epoch": 806} {"train_loss": -10.490405082702637, "global_step": 135538, "epoch": 806} {"train_loss": -10.536109924316406, "global_step": 135539, "epoch": 806} {"train_loss": -10.477378845214844, "global_step": 135540, "epoch": 806} {"train_loss": -10.4328031539917, "global_step": 135541, "epoch": 806} {"train_loss": -10.682788848876953, "global_step": 135542, "epoch": 806} {"train_loss": -10.626484870910645, "global_step": 135543, "epoch": 806} {"train_loss": -10.79341983795166, "global_step": 135544, "epoch": 806} {"train_loss": -10.69342041015625, "global_step": 135545, "epoch": 806} {"train_loss": -10.667724609375, "global_step": 135546, "epoch": 806} {"train_loss": -10.29928970336914, "global_step": 135547, "epoch": 806} {"train_loss": -10.551606178283691, "global_step": 135548, "epoch": 806} {"train_loss": -10.345892906188965, "global_step": 135549, "epoch": 806} {"train_loss": -10.557774543762207, "global_step": 135550, "epoch": 806} {"train_loss": -10.669782638549805, "global_step": 135551, "epoch": 806} {"train_loss": -10.978862762451172, "global_step": 135552, "epoch": 806} {"train_loss": -10.997434616088867, "global_step": 135553, "epoch": 806} {"train_loss": -10.578189849853516, "global_step": 135554, "epoch": 806} {"train_loss": -10.509682655334473, "global_step": 135555, "epoch": 806} {"train_loss": -10.796886444091797, "global_step": 135556, "epoch": 806} {"train_loss": -10.808721542358398, "global_step": 135557, "epoch": 806} {"train_loss": -10.83319091796875, "global_step": 135558, "epoch": 806} {"train_loss": -10.755077362060547, "global_step": 135559, "epoch": 806} {"train_loss": -10.594137191772461, "global_step": 135560, "epoch": 806} {"train_loss": -10.796041488647461, "global_step": 135561, "epoch": 806} {"train_loss": -9.963300704956055, "global_step": 135562, "epoch": 806} {"train_loss": -9.657357215881348, "global_step": 135563, "epoch": 806} {"train_loss": -10.538999557495117, "global_step": 135564, "epoch": 806} {"train_loss": -10.094173431396484, "global_step": 135565, "epoch": 806} {"train_loss": -10.21683120727539, "global_step": 135566, "epoch": 806} {"train_loss": -10.836544036865234, "global_step": 135567, "epoch": 806} {"train_loss": -10.411999702453613, "global_step": 135568, "epoch": 806} {"train_loss": -10.823627471923828, "global_step": 135569, "epoch": 806} {"train_loss": -10.155217170715332, "global_step": 135570, "epoch": 806} {"train_loss": -10.246163368225098, "global_step": 135571, "epoch": 806} {"train_loss": -10.571741104125977, "global_step": 135572, "epoch": 806} {"train_loss": -10.455636978149414, "global_step": 135573, "epoch": 806} {"train_loss": -10.536458969116211, "global_step": 135574, "epoch": 806} {"train_loss": -10.417414131618681, "global_step": 135575, "epoch": 806, "val_loss": 219539.65625} {"train_loss": -10.144648551940918, "global_step": 135576, "epoch": 807} {"train_loss": -10.005508422851562, "global_step": 135577, "epoch": 807} {"train_loss": -10.271964073181152, "global_step": 135578, "epoch": 807} {"train_loss": -10.393682479858398, "global_step": 135579, "epoch": 807} {"train_loss": -10.323962211608887, "global_step": 135580, "epoch": 807} {"train_loss": -10.634252548217773, "global_step": 135581, "epoch": 807} {"train_loss": -10.275873184204102, "global_step": 135582, "epoch": 807} {"train_loss": -10.501601219177246, "global_step": 135583, "epoch": 807} {"train_loss": -10.58246898651123, "global_step": 135584, "epoch": 807} {"train_loss": -10.368597984313965, "global_step": 135585, "epoch": 807} {"train_loss": -10.758026123046875, "global_step": 135586, "epoch": 807} {"train_loss": -10.448160171508789, "global_step": 135587, "epoch": 807} {"train_loss": -10.850788116455078, "global_step": 135588, "epoch": 807} {"train_loss": -10.831972122192383, "global_step": 135589, "epoch": 807} {"train_loss": -10.650209426879883, "global_step": 135590, "epoch": 807} {"train_loss": -10.57296085357666, "global_step": 135591, "epoch": 807} {"train_loss": -10.639198303222656, "global_step": 135592, "epoch": 807} {"train_loss": -10.60677719116211, "global_step": 135593, "epoch": 807} {"train_loss": -10.7935209274292, "global_step": 135594, "epoch": 807} {"train_loss": -10.67535400390625, "global_step": 135595, "epoch": 807} {"train_loss": -10.484885215759277, "global_step": 135596, "epoch": 807} {"train_loss": -10.456243515014648, "global_step": 135597, "epoch": 807} {"train_loss": -10.436145782470703, "global_step": 135598, "epoch": 807} {"train_loss": -10.595870971679688, "global_step": 135599, "epoch": 807} {"train_loss": -10.746213912963867, "global_step": 135600, "epoch": 807} {"train_loss": -10.5574369430542, "global_step": 135601, "epoch": 807} {"train_loss": -10.488349914550781, "global_step": 135602, "epoch": 807} {"train_loss": -10.762470245361328, "global_step": 135603, "epoch": 807} {"train_loss": -10.646958351135254, "global_step": 135604, "epoch": 807} {"train_loss": -10.262678146362305, "global_step": 135605, "epoch": 807} {"train_loss": -10.475321769714355, "global_step": 135606, "epoch": 807} {"train_loss": -10.680835723876953, "global_step": 135607, "epoch": 807} {"train_loss": -10.277295112609863, "global_step": 135608, "epoch": 807} {"train_loss": -10.530228614807129, "global_step": 135609, "epoch": 807} {"train_loss": -10.695571899414062, "global_step": 135610, "epoch": 807} {"train_loss": -10.4053955078125, "global_step": 135611, "epoch": 807} {"train_loss": -10.585190773010254, "global_step": 135612, "epoch": 807} {"train_loss": -10.35540771484375, "global_step": 135613, "epoch": 807} {"train_loss": -10.745123863220215, "global_step": 135614, "epoch": 807} {"train_loss": -10.499922752380371, "global_step": 135615, "epoch": 807} {"train_loss": -10.57723331451416, "global_step": 135616, "epoch": 807} {"train_loss": -10.642980575561523, "global_step": 135617, "epoch": 807} {"train_loss": -10.238526344299316, "global_step": 135618, "epoch": 807} {"train_loss": -10.271392822265625, "global_step": 135619, "epoch": 807} {"train_loss": -10.76414680480957, "global_step": 135620, "epoch": 807} {"train_loss": -10.567736625671387, "global_step": 135621, "epoch": 807} {"train_loss": -10.670585632324219, "global_step": 135622, "epoch": 807} {"train_loss": -10.773062705993652, "global_step": 135623, "epoch": 807} {"train_loss": -10.769632339477539, "global_step": 135624, "epoch": 807} {"train_loss": -10.671510696411133, "global_step": 135625, "epoch": 807} {"train_loss": -10.899706840515137, "global_step": 135626, "epoch": 807} {"train_loss": -10.869966506958008, "global_step": 135627, "epoch": 807} {"train_loss": -10.695497512817383, "global_step": 135628, "epoch": 807} {"train_loss": -10.523530960083008, "global_step": 135629, "epoch": 807} {"train_loss": -10.523719787597656, "global_step": 135630, "epoch": 807} {"train_loss": -10.71023941040039, "global_step": 135631, "epoch": 807} {"train_loss": -10.649452209472656, "global_step": 135632, "epoch": 807} {"train_loss": -10.835084915161133, "global_step": 135633, "epoch": 807} {"train_loss": -10.672380447387695, "global_step": 135634, "epoch": 807} {"train_loss": -10.268388748168945, "global_step": 135635, "epoch": 807} {"train_loss": -10.383068084716797, "global_step": 135636, "epoch": 807} {"train_loss": -10.666573524475098, "global_step": 135637, "epoch": 807} {"train_loss": -10.293594360351562, "global_step": 135638, "epoch": 807} {"train_loss": -10.444758415222168, "global_step": 135639, "epoch": 807} {"train_loss": -10.830039978027344, "global_step": 135640, "epoch": 807} {"train_loss": -10.585434913635254, "global_step": 135641, "epoch": 807} {"train_loss": -10.395376205444336, "global_step": 135642, "epoch": 807} {"train_loss": -10.711217880249023, "global_step": 135643, "epoch": 807} {"train_loss": -10.481550216674805, "global_step": 135644, "epoch": 807} {"train_loss": -10.552724838256836, "global_step": 135645, "epoch": 807} {"train_loss": -10.47227668762207, "global_step": 135646, "epoch": 807} {"train_loss": -9.92931842803955, "global_step": 135647, "epoch": 807} {"train_loss": -10.012481689453125, "global_step": 135648, "epoch": 807} {"train_loss": -10.452925682067871, "global_step": 135649, "epoch": 807} {"train_loss": -10.582372665405273, "global_step": 135650, "epoch": 807} {"train_loss": -10.527020454406738, "global_step": 135651, "epoch": 807} {"train_loss": -10.222097396850586, "global_step": 135652, "epoch": 807} {"train_loss": -10.5313081741333, "global_step": 135653, "epoch": 807} {"train_loss": -10.049732208251953, "global_step": 135654, "epoch": 807} {"train_loss": -10.491567611694336, "global_step": 135655, "epoch": 807} {"train_loss": -10.721138954162598, "global_step": 135656, "epoch": 807} {"train_loss": -10.550012588500977, "global_step": 135657, "epoch": 807} {"train_loss": -10.49559211730957, "global_step": 135658, "epoch": 807} {"train_loss": -9.501758575439453, "global_step": 135659, "epoch": 807} {"train_loss": -10.589715957641602, "global_step": 135660, "epoch": 807} {"train_loss": -9.265253067016602, "global_step": 135661, "epoch": 807} {"train_loss": -10.002931594848633, "global_step": 135662, "epoch": 807} {"train_loss": -9.848419189453125, "global_step": 135663, "epoch": 807} {"train_loss": -9.870220184326172, "global_step": 135664, "epoch": 807} {"train_loss": -9.817694664001465, "global_step": 135665, "epoch": 807} {"train_loss": -9.731935501098633, "global_step": 135666, "epoch": 807} {"train_loss": -9.918027877807617, "global_step": 135667, "epoch": 807} {"train_loss": -9.431280136108398, "global_step": 135668, "epoch": 807} {"train_loss": -9.207152366638184, "global_step": 135669, "epoch": 807} {"train_loss": -8.652093887329102, "global_step": 135670, "epoch": 807} {"train_loss": -9.544197082519531, "global_step": 135671, "epoch": 807} {"train_loss": -9.754964828491211, "global_step": 135672, "epoch": 807} {"train_loss": -9.489028930664062, "global_step": 135673, "epoch": 807} {"train_loss": -9.26451301574707, "global_step": 135674, "epoch": 807} {"train_loss": -10.000604629516602, "global_step": 135675, "epoch": 807} {"train_loss": -9.576386451721191, "global_step": 135676, "epoch": 807} {"train_loss": -9.78432846069336, "global_step": 135677, "epoch": 807} {"train_loss": -10.11618709564209, "global_step": 135678, "epoch": 807} {"train_loss": -10.026598930358887, "global_step": 135679, "epoch": 807} {"train_loss": -9.94446849822998, "global_step": 135680, "epoch": 807} {"train_loss": -10.046892166137695, "global_step": 135681, "epoch": 807} {"train_loss": -10.187192916870117, "global_step": 135682, "epoch": 807} {"train_loss": -10.128676414489746, "global_step": 135683, "epoch": 807} {"train_loss": -10.0374116897583, "global_step": 135684, "epoch": 807} {"train_loss": -10.325701713562012, "global_step": 135685, "epoch": 807} {"train_loss": -10.065047264099121, "global_step": 135686, "epoch": 807} {"train_loss": -10.16871452331543, "global_step": 135687, "epoch": 807} {"train_loss": -10.15853214263916, "global_step": 135688, "epoch": 807} {"train_loss": -10.2960844039917, "global_step": 135689, "epoch": 807} {"train_loss": -10.11924934387207, "global_step": 135690, "epoch": 807} {"train_loss": -10.325896263122559, "global_step": 135691, "epoch": 807} {"train_loss": -9.88772964477539, "global_step": 135692, "epoch": 807} {"train_loss": -10.42697525024414, "global_step": 135693, "epoch": 807} {"train_loss": -10.29376220703125, "global_step": 135694, "epoch": 807} {"train_loss": -10.288534164428711, "global_step": 135695, "epoch": 807} {"train_loss": -10.20535945892334, "global_step": 135696, "epoch": 807} {"train_loss": -10.154961585998535, "global_step": 135697, "epoch": 807} {"train_loss": -10.088869094848633, "global_step": 135698, "epoch": 807} {"train_loss": -10.458436965942383, "global_step": 135699, "epoch": 807} {"train_loss": -9.940423965454102, "global_step": 135700, "epoch": 807} {"train_loss": -10.393637657165527, "global_step": 135701, "epoch": 807} {"train_loss": -10.119300842285156, "global_step": 135702, "epoch": 807} {"train_loss": -10.354803085327148, "global_step": 135703, "epoch": 807} {"train_loss": -10.280728340148926, "global_step": 135704, "epoch": 807} {"train_loss": -10.33755111694336, "global_step": 135705, "epoch": 807} {"train_loss": -10.52425765991211, "global_step": 135706, "epoch": 807} {"train_loss": -10.604116439819336, "global_step": 135707, "epoch": 807} {"train_loss": -10.334051132202148, "global_step": 135708, "epoch": 807} {"train_loss": -10.585805892944336, "global_step": 135709, "epoch": 807} {"train_loss": -10.681451797485352, "global_step": 135710, "epoch": 807} {"train_loss": -10.541479110717773, "global_step": 135711, "epoch": 807} {"train_loss": -10.75154972076416, "global_step": 135712, "epoch": 807} {"train_loss": -10.625859260559082, "global_step": 135713, "epoch": 807} {"train_loss": -10.58646011352539, "global_step": 135714, "epoch": 807} {"train_loss": -10.631307601928711, "global_step": 135715, "epoch": 807} {"train_loss": -10.405662536621094, "global_step": 135716, "epoch": 807} {"train_loss": -10.565652847290039, "global_step": 135717, "epoch": 807} {"train_loss": -10.68232536315918, "global_step": 135718, "epoch": 807} {"train_loss": -10.772106170654297, "global_step": 135719, "epoch": 807} {"train_loss": -10.683222770690918, "global_step": 135720, "epoch": 807} {"train_loss": -10.722057342529297, "global_step": 135721, "epoch": 807} {"train_loss": -10.680562973022461, "global_step": 135722, "epoch": 807} {"train_loss": -10.797775268554688, "global_step": 135723, "epoch": 807} {"train_loss": -10.90040397644043, "global_step": 135724, "epoch": 807} {"train_loss": -10.8251953125, "global_step": 135725, "epoch": 807} {"train_loss": -10.594717025756836, "global_step": 135726, "epoch": 807} {"train_loss": -10.66415023803711, "global_step": 135727, "epoch": 807} {"train_loss": -10.621456146240234, "global_step": 135728, "epoch": 807} {"train_loss": -10.80270004272461, "global_step": 135729, "epoch": 807} {"train_loss": -10.731877326965332, "global_step": 135730, "epoch": 807} {"train_loss": -10.784509658813477, "global_step": 135731, "epoch": 807} {"train_loss": -10.825974464416504, "global_step": 135732, "epoch": 807} {"train_loss": -10.606968879699707, "global_step": 135733, "epoch": 807} {"train_loss": -10.397319793701172, "global_step": 135734, "epoch": 807} {"train_loss": -10.430416107177734, "global_step": 135735, "epoch": 807} {"train_loss": -10.802961349487305, "global_step": 135736, "epoch": 807} {"train_loss": -10.486505508422852, "global_step": 135737, "epoch": 807} {"train_loss": -10.102872848510742, "global_step": 135738, "epoch": 807} {"train_loss": -10.414764404296875, "global_step": 135739, "epoch": 807} {"train_loss": -10.408468246459961, "global_step": 135740, "epoch": 807} {"train_loss": -10.659866333007812, "global_step": 135741, "epoch": 807} {"train_loss": -9.830062866210938, "global_step": 135742, "epoch": 807} {"train_loss": -10.38580140045711, "global_step": 135743, "epoch": 807, "val_loss": 222959.46875} {"train_loss": -10.123101234436035, "global_step": 135744, "epoch": 808} {"train_loss": -9.55771541595459, "global_step": 135745, "epoch": 808} {"train_loss": -10.630101203918457, "global_step": 135746, "epoch": 808} {"train_loss": -9.99262523651123, "global_step": 135747, "epoch": 808} {"train_loss": -10.215314865112305, "global_step": 135748, "epoch": 808} {"train_loss": -9.874105453491211, "global_step": 135749, "epoch": 808} {"train_loss": -9.97300910949707, "global_step": 135750, "epoch": 808} {"train_loss": -10.329364776611328, "global_step": 135751, "epoch": 808} {"train_loss": -9.484880447387695, "global_step": 135752, "epoch": 808} {"train_loss": -10.412446975708008, "global_step": 135753, "epoch": 808} {"train_loss": -9.921252250671387, "global_step": 135754, "epoch": 808} {"train_loss": -9.872503280639648, "global_step": 135755, "epoch": 808} {"train_loss": -10.304792404174805, "global_step": 135756, "epoch": 808} {"train_loss": -10.147534370422363, "global_step": 135757, "epoch": 808} {"train_loss": -10.031545639038086, "global_step": 135758, "epoch": 808} {"train_loss": -10.2925386428833, "global_step": 135759, "epoch": 808} {"train_loss": -9.684976577758789, "global_step": 135760, "epoch": 808} {"train_loss": -10.122183799743652, "global_step": 135761, "epoch": 808} {"train_loss": -10.346685409545898, "global_step": 135762, "epoch": 808} {"train_loss": -10.24833869934082, "global_step": 135763, "epoch": 808} {"train_loss": -10.177990913391113, "global_step": 135764, "epoch": 808} {"train_loss": -10.081972122192383, "global_step": 135765, "epoch": 808} {"train_loss": -9.799622535705566, "global_step": 135766, "epoch": 808} {"train_loss": -9.795385360717773, "global_step": 135767, "epoch": 808} {"train_loss": -10.280715942382812, "global_step": 135768, "epoch": 808} {"train_loss": -9.678651809692383, "global_step": 135769, "epoch": 808} {"train_loss": -10.411157608032227, "global_step": 135770, "epoch": 808} {"train_loss": -10.231494903564453, "global_step": 135771, "epoch": 808} {"train_loss": -10.002187728881836, "global_step": 135772, "epoch": 808} {"train_loss": -10.230155944824219, "global_step": 135773, "epoch": 808} {"train_loss": -10.081113815307617, "global_step": 135774, "epoch": 808} {"train_loss": -10.016844749450684, "global_step": 135775, "epoch": 808} {"train_loss": -10.312983512878418, "global_step": 135776, "epoch": 808} {"train_loss": -9.995406150817871, "global_step": 135777, "epoch": 808} {"train_loss": -10.123027801513672, "global_step": 135778, "epoch": 808} {"train_loss": -10.457154273986816, "global_step": 135779, "epoch": 808} {"train_loss": -10.374573707580566, "global_step": 135780, "epoch": 808} {"train_loss": -10.296724319458008, "global_step": 135781, "epoch": 808} {"train_loss": -10.576276779174805, "global_step": 135782, "epoch": 808} {"train_loss": -10.355311393737793, "global_step": 135783, "epoch": 808} {"train_loss": -10.53354549407959, "global_step": 135784, "epoch": 808} {"train_loss": -10.242513656616211, "global_step": 135785, "epoch": 808} {"train_loss": -10.39515495300293, "global_step": 135786, "epoch": 808} {"train_loss": -10.503202438354492, "global_step": 135787, "epoch": 808} {"train_loss": -10.48885726928711, "global_step": 135788, "epoch": 808} {"train_loss": -10.407198905944824, "global_step": 135789, "epoch": 808} {"train_loss": -10.448641777038574, "global_step": 135790, "epoch": 808} {"train_loss": -10.668684005737305, "global_step": 135791, "epoch": 808} {"train_loss": -10.248762130737305, "global_step": 135792, "epoch": 808} {"train_loss": -10.541156768798828, "global_step": 135793, "epoch": 808} {"train_loss": -10.477792739868164, "global_step": 135794, "epoch": 808} {"train_loss": -10.342466354370117, "global_step": 135795, "epoch": 808} {"train_loss": -10.345805168151855, "global_step": 135796, "epoch": 808} {"train_loss": -10.171897888183594, "global_step": 135797, "epoch": 808} {"train_loss": -10.711265563964844, "global_step": 135798, "epoch": 808} {"train_loss": -10.056665420532227, "global_step": 135799, "epoch": 808} {"train_loss": -10.622275352478027, "global_step": 135800, "epoch": 808} {"train_loss": -10.559103965759277, "global_step": 135801, "epoch": 808} {"train_loss": -10.12015438079834, "global_step": 135802, "epoch": 808} {"train_loss": -10.681103706359863, "global_step": 135803, "epoch": 808} {"train_loss": -10.36764144897461, "global_step": 135804, "epoch": 808} {"train_loss": -10.4618558883667, "global_step": 135805, "epoch": 808} {"train_loss": -10.50577163696289, "global_step": 135806, "epoch": 808} {"train_loss": -10.342571258544922, "global_step": 135807, "epoch": 808} {"train_loss": -10.360777854919434, "global_step": 135808, "epoch": 808} {"train_loss": -10.321630477905273, "global_step": 135809, "epoch": 808} {"train_loss": -9.95187759399414, "global_step": 135810, "epoch": 808} {"train_loss": -10.3091402053833, "global_step": 135811, "epoch": 808} {"train_loss": -10.207695007324219, "global_step": 135812, "epoch": 808} {"train_loss": -10.478281021118164, "global_step": 135813, "epoch": 808} {"train_loss": -10.170859336853027, "global_step": 135814, "epoch": 808} {"train_loss": -10.311727523803711, "global_step": 135815, "epoch": 808} {"train_loss": -10.311788558959961, "global_step": 135816, "epoch": 808} {"train_loss": -10.111541748046875, "global_step": 135817, "epoch": 808} {"train_loss": -10.206914901733398, "global_step": 135818, "epoch": 808} {"train_loss": -9.813465118408203, "global_step": 135819, "epoch": 808} {"train_loss": -10.696300506591797, "global_step": 135820, "epoch": 808} {"train_loss": -9.996402740478516, "global_step": 135821, "epoch": 808} {"train_loss": -10.521522521972656, "global_step": 135822, "epoch": 808} {"train_loss": -10.376529693603516, "global_step": 135823, "epoch": 808} {"train_loss": -10.274145126342773, "global_step": 135824, "epoch": 808} {"train_loss": -10.709065437316895, "global_step": 135825, "epoch": 808} {"train_loss": -10.46376895904541, "global_step": 135826, "epoch": 808} {"train_loss": -10.58677864074707, "global_step": 135827, "epoch": 808} {"train_loss": -10.590770721435547, "global_step": 135828, "epoch": 808} {"train_loss": -10.526793479919434, "global_step": 135829, "epoch": 808} {"train_loss": -10.603372573852539, "global_step": 135830, "epoch": 808} {"train_loss": -10.572866439819336, "global_step": 135831, "epoch": 808} {"train_loss": -10.41004753112793, "global_step": 135832, "epoch": 808} {"train_loss": -10.75454330444336, "global_step": 135833, "epoch": 808} {"train_loss": -10.826946258544922, "global_step": 135834, "epoch": 808} {"train_loss": -10.748235702514648, "global_step": 135835, "epoch": 808} {"train_loss": -10.713111877441406, "global_step": 135836, "epoch": 808} {"train_loss": -10.758037567138672, "global_step": 135837, "epoch": 808} {"train_loss": -10.812189102172852, "global_step": 135838, "epoch": 808} {"train_loss": -10.630162239074707, "global_step": 135839, "epoch": 808} {"train_loss": -10.781839370727539, "global_step": 135840, "epoch": 808} {"train_loss": -10.756902694702148, "global_step": 135841, "epoch": 808} {"train_loss": -10.844683647155762, "global_step": 135842, "epoch": 808} {"train_loss": -10.4893798828125, "global_step": 135843, "epoch": 808} {"train_loss": -10.855852127075195, "global_step": 135844, "epoch": 808} {"train_loss": -10.605968475341797, "global_step": 135845, "epoch": 808} {"train_loss": -10.591781616210938, "global_step": 135846, "epoch": 808} {"train_loss": -10.841103553771973, "global_step": 135847, "epoch": 808} {"train_loss": -10.949575424194336, "global_step": 135848, "epoch": 808} {"train_loss": -10.743237495422363, "global_step": 135849, "epoch": 808} {"train_loss": -10.837505340576172, "global_step": 135850, "epoch": 808} {"train_loss": -10.51435661315918, "global_step": 135851, "epoch": 808} {"train_loss": -10.567245483398438, "global_step": 135852, "epoch": 808} {"train_loss": -10.734578132629395, "global_step": 135853, "epoch": 808} {"train_loss": -10.677474975585938, "global_step": 135854, "epoch": 808} {"train_loss": -10.645105361938477, "global_step": 135855, "epoch": 808} {"train_loss": -10.766554832458496, "global_step": 135856, "epoch": 808} {"train_loss": -10.72793960571289, "global_step": 135857, "epoch": 808} {"train_loss": -10.57120132446289, "global_step": 135858, "epoch": 808} {"train_loss": -10.82792854309082, "global_step": 135859, "epoch": 808} {"train_loss": -10.829034805297852, "global_step": 135860, "epoch": 808} {"train_loss": -10.313462257385254, "global_step": 135861, "epoch": 808} {"train_loss": -10.846116065979004, "global_step": 135862, "epoch": 808} {"train_loss": -10.464325904846191, "global_step": 135863, "epoch": 808} {"train_loss": -10.571815490722656, "global_step": 135864, "epoch": 808} {"train_loss": -10.162612915039062, "global_step": 135865, "epoch": 808} {"train_loss": -9.896295547485352, "global_step": 135866, "epoch": 808} {"train_loss": -9.664935111999512, "global_step": 135867, "epoch": 808} {"train_loss": -10.269306182861328, "global_step": 135868, "epoch": 808} {"train_loss": -9.0680570602417, "global_step": 135869, "epoch": 808} {"train_loss": -9.907632827758789, "global_step": 135870, "epoch": 808} {"train_loss": -9.421651840209961, "global_step": 135871, "epoch": 808} {"train_loss": -10.029424667358398, "global_step": 135872, "epoch": 808} {"train_loss": -9.615900039672852, "global_step": 135873, "epoch": 808} {"train_loss": -10.137923240661621, "global_step": 135874, "epoch": 808} {"train_loss": -9.530904769897461, "global_step": 135875, "epoch": 808} {"train_loss": -10.20846939086914, "global_step": 135876, "epoch": 808} {"train_loss": -9.689626693725586, "global_step": 135877, "epoch": 808} {"train_loss": -10.395545959472656, "global_step": 135878, "epoch": 808} {"train_loss": -10.293366432189941, "global_step": 135879, "epoch": 808} {"train_loss": -10.251386642456055, "global_step": 135880, "epoch": 808} {"train_loss": -10.335070610046387, "global_step": 135881, "epoch": 808} {"train_loss": -10.048330307006836, "global_step": 135882, "epoch": 808} {"train_loss": -10.201872825622559, "global_step": 135883, "epoch": 808} {"train_loss": -9.993887901306152, "global_step": 135884, "epoch": 808} {"train_loss": -10.186422348022461, "global_step": 135885, "epoch": 808} {"train_loss": -10.197925567626953, "global_step": 135886, "epoch": 808} {"train_loss": -10.422243118286133, "global_step": 135887, "epoch": 808} {"train_loss": -10.46121597290039, "global_step": 135888, "epoch": 808} {"train_loss": -10.337699890136719, "global_step": 135889, "epoch": 808} {"train_loss": -10.327896118164062, "global_step": 135890, "epoch": 808} {"train_loss": -10.38662338256836, "global_step": 135891, "epoch": 808} {"train_loss": -10.166757583618164, "global_step": 135892, "epoch": 808} {"train_loss": -10.654741287231445, "global_step": 135893, "epoch": 808} {"train_loss": -10.509366035461426, "global_step": 135894, "epoch": 808} {"train_loss": -10.322347640991211, "global_step": 135895, "epoch": 808} {"train_loss": -10.643949508666992, "global_step": 135896, "epoch": 808} {"train_loss": -10.59533977508545, "global_step": 135897, "epoch": 808} {"train_loss": -10.34482192993164, "global_step": 135898, "epoch": 808} {"train_loss": -10.546178817749023, "global_step": 135899, "epoch": 808} {"train_loss": -10.491962432861328, "global_step": 135900, "epoch": 808} {"train_loss": -10.704286575317383, "global_step": 135901, "epoch": 808} {"train_loss": -10.668453216552734, "global_step": 135902, "epoch": 808} {"train_loss": -10.565743446350098, "global_step": 135903, "epoch": 808} {"train_loss": -10.597108840942383, "global_step": 135904, "epoch": 808} {"train_loss": -10.549932479858398, "global_step": 135905, "epoch": 808} {"train_loss": -10.470431327819824, "global_step": 135906, "epoch": 808} {"train_loss": -10.663869857788086, "global_step": 135907, "epoch": 808} {"train_loss": -10.5634183883667, "global_step": 135908, "epoch": 808} {"train_loss": -10.657835006713867, "global_step": 135909, "epoch": 808} {"train_loss": -10.573747634887695, "global_step": 135910, "epoch": 808} {"train_loss": -10.35037436371758, "global_step": 135911, "epoch": 808, "val_loss": 223657.046875} {"train_loss": -10.585973739624023, "global_step": 135912, "epoch": 809} {"train_loss": -10.482995986938477, "global_step": 135913, "epoch": 809} {"train_loss": -10.619682312011719, "global_step": 135914, "epoch": 809} {"train_loss": -10.688058853149414, "global_step": 135915, "epoch": 809} {"train_loss": -10.604719161987305, "global_step": 135916, "epoch": 809} {"train_loss": -10.759511947631836, "global_step": 135917, "epoch": 809} {"train_loss": -10.596900939941406, "global_step": 135918, "epoch": 809} {"train_loss": -10.744678497314453, "global_step": 135919, "epoch": 809} {"train_loss": -10.41183853149414, "global_step": 135920, "epoch": 809} {"train_loss": -10.7354736328125, "global_step": 135921, "epoch": 809} {"train_loss": -10.582738876342773, "global_step": 135922, "epoch": 809} {"train_loss": -10.63381576538086, "global_step": 135923, "epoch": 809} {"train_loss": -10.622821807861328, "global_step": 135924, "epoch": 809} {"train_loss": -10.767019271850586, "global_step": 135925, "epoch": 809} {"train_loss": -10.810476303100586, "global_step": 135926, "epoch": 809} {"train_loss": -10.518441200256348, "global_step": 135927, "epoch": 809} {"train_loss": -10.47446060180664, "global_step": 135928, "epoch": 809} {"train_loss": -10.543342590332031, "global_step": 135929, "epoch": 809} {"train_loss": -10.818679809570312, "global_step": 135930, "epoch": 809} {"train_loss": -10.587782859802246, "global_step": 135931, "epoch": 809} {"train_loss": -10.252870559692383, "global_step": 135932, "epoch": 809} {"train_loss": -10.50403881072998, "global_step": 135933, "epoch": 809} {"train_loss": -10.336828231811523, "global_step": 135934, "epoch": 809} {"train_loss": -10.45874309539795, "global_step": 135935, "epoch": 809} {"train_loss": -10.376376152038574, "global_step": 135936, "epoch": 809} {"train_loss": -9.957155227661133, "global_step": 135937, "epoch": 809} {"train_loss": -10.619260787963867, "global_step": 135938, "epoch": 809} {"train_loss": -10.122417449951172, "global_step": 135939, "epoch": 809} {"train_loss": -9.576167106628418, "global_step": 135940, "epoch": 809} {"train_loss": -10.649535179138184, "global_step": 135941, "epoch": 809} {"train_loss": -9.469178199768066, "global_step": 135942, "epoch": 809} {"train_loss": -10.096298217773438, "global_step": 135943, "epoch": 809} {"train_loss": -10.321892738342285, "global_step": 135944, "epoch": 809} {"train_loss": -10.10081672668457, "global_step": 135945, "epoch": 809} {"train_loss": -10.548508644104004, "global_step": 135946, "epoch": 809} {"train_loss": -9.808485984802246, "global_step": 135947, "epoch": 809} {"train_loss": -10.13473892211914, "global_step": 135948, "epoch": 809} {"train_loss": -9.848213195800781, "global_step": 135949, "epoch": 809} {"train_loss": -9.642599105834961, "global_step": 135950, "epoch": 809} {"train_loss": -9.8006010055542, "global_step": 135951, "epoch": 809} {"train_loss": -9.737552642822266, "global_step": 135952, "epoch": 809} {"train_loss": -10.123859405517578, "global_step": 135953, "epoch": 809} {"train_loss": -10.059081077575684, "global_step": 135954, "epoch": 809} {"train_loss": -9.781450271606445, "global_step": 135955, "epoch": 809} {"train_loss": -10.23837661743164, "global_step": 135956, "epoch": 809} {"train_loss": -9.925686836242676, "global_step": 135957, "epoch": 809} {"train_loss": -9.999300003051758, "global_step": 135958, "epoch": 809} {"train_loss": -10.310861587524414, "global_step": 135959, "epoch": 809} {"train_loss": -10.281778335571289, "global_step": 135960, "epoch": 809} {"train_loss": -9.971640586853027, "global_step": 135961, "epoch": 809} {"train_loss": -10.193611145019531, "global_step": 135962, "epoch": 809} {"train_loss": -10.183364868164062, "global_step": 135963, "epoch": 809} {"train_loss": -10.222493171691895, "global_step": 135964, "epoch": 809} {"train_loss": -10.222932815551758, "global_step": 135965, "epoch": 809} {"train_loss": -10.341702461242676, "global_step": 135966, "epoch": 809} {"train_loss": -10.225050926208496, "global_step": 135967, "epoch": 809} {"train_loss": -10.352274894714355, "global_step": 135968, "epoch": 809} {"train_loss": -10.243877410888672, "global_step": 135969, "epoch": 809} {"train_loss": -10.239234924316406, "global_step": 135970, "epoch": 809} {"train_loss": -10.202320098876953, "global_step": 135971, "epoch": 809} {"train_loss": -10.514759063720703, "global_step": 135972, "epoch": 809} {"train_loss": -10.038663864135742, "global_step": 135973, "epoch": 809} {"train_loss": -10.302959442138672, "global_step": 135974, "epoch": 809} {"train_loss": -10.420998573303223, "global_step": 135975, "epoch": 809} {"train_loss": -10.477714538574219, "global_step": 135976, "epoch": 809} {"train_loss": -10.471494674682617, "global_step": 135977, "epoch": 809} {"train_loss": -10.2755126953125, "global_step": 135978, "epoch": 809} {"train_loss": -10.627347946166992, "global_step": 135979, "epoch": 809} {"train_loss": -10.337843894958496, "global_step": 135980, "epoch": 809} {"train_loss": -10.426372528076172, "global_step": 135981, "epoch": 809} {"train_loss": -10.429323196411133, "global_step": 135982, "epoch": 809} {"train_loss": -10.67538833618164, "global_step": 135983, "epoch": 809} {"train_loss": -10.3531494140625, "global_step": 135984, "epoch": 809} {"train_loss": -10.735002517700195, "global_step": 135985, "epoch": 809} {"train_loss": -10.175870895385742, "global_step": 135986, "epoch": 809} {"train_loss": -10.33229923248291, "global_step": 135987, "epoch": 809} {"train_loss": -10.528549194335938, "global_step": 135988, "epoch": 809} {"train_loss": -10.64273452758789, "global_step": 135989, "epoch": 809} {"train_loss": -10.632909774780273, "global_step": 135990, "epoch": 809} {"train_loss": -10.577150344848633, "global_step": 135991, "epoch": 809} {"train_loss": -10.739080429077148, "global_step": 135992, "epoch": 809} {"train_loss": -10.61180591583252, "global_step": 135993, "epoch": 809} {"train_loss": -10.632533073425293, "global_step": 135994, "epoch": 809} {"train_loss": -10.347243309020996, "global_step": 135995, "epoch": 809} {"train_loss": -10.57988166809082, "global_step": 135996, "epoch": 809} {"train_loss": -10.621169090270996, "global_step": 135997, "epoch": 809} {"train_loss": -10.5563325881958, "global_step": 135998, "epoch": 809} {"train_loss": -10.788200378417969, "global_step": 135999, "epoch": 809} {"train_loss": -10.693827629089355, "global_step": 136000, "epoch": 809} {"train_loss": -10.679466247558594, "global_step": 136001, "epoch": 809} {"train_loss": -10.581151962280273, "global_step": 136002, "epoch": 809} {"train_loss": -10.855733871459961, "global_step": 136003, "epoch": 809} {"train_loss": -10.507518768310547, "global_step": 136004, "epoch": 809} {"train_loss": -10.77365493774414, "global_step": 136005, "epoch": 809} {"train_loss": -10.605985641479492, "global_step": 136006, "epoch": 809} {"train_loss": -10.461254119873047, "global_step": 136007, "epoch": 809} {"train_loss": -10.482025146484375, "global_step": 136008, "epoch": 809} {"train_loss": -10.656368255615234, "global_step": 136009, "epoch": 809} {"train_loss": -10.618047714233398, "global_step": 136010, "epoch": 809} {"train_loss": -10.450587272644043, "global_step": 136011, "epoch": 809} {"train_loss": -10.639470100402832, "global_step": 136012, "epoch": 809} {"train_loss": -10.348142623901367, "global_step": 136013, "epoch": 809} {"train_loss": -10.698293685913086, "global_step": 136014, "epoch": 809} {"train_loss": -10.481006622314453, "global_step": 136015, "epoch": 809} {"train_loss": -10.713176727294922, "global_step": 136016, "epoch": 809} {"train_loss": -10.324485778808594, "global_step": 136017, "epoch": 809} {"train_loss": -10.474851608276367, "global_step": 136018, "epoch": 809} {"train_loss": -10.089991569519043, "global_step": 136019, "epoch": 809} {"train_loss": -10.422294616699219, "global_step": 136020, "epoch": 809} {"train_loss": -10.47680950164795, "global_step": 136021, "epoch": 809} {"train_loss": -10.371994018554688, "global_step": 136022, "epoch": 809} {"train_loss": -10.42214584350586, "global_step": 136023, "epoch": 809} {"train_loss": -10.359743118286133, "global_step": 136024, "epoch": 809} {"train_loss": -10.285089492797852, "global_step": 136025, "epoch": 809} {"train_loss": -10.02272891998291, "global_step": 136026, "epoch": 809} {"train_loss": -10.49483871459961, "global_step": 136027, "epoch": 809} {"train_loss": -10.600381851196289, "global_step": 136028, "epoch": 809} {"train_loss": -10.328288078308105, "global_step": 136029, "epoch": 809} {"train_loss": -10.642085075378418, "global_step": 136030, "epoch": 809} {"train_loss": -10.285948753356934, "global_step": 136031, "epoch": 809} {"train_loss": -10.647150039672852, "global_step": 136032, "epoch": 809} {"train_loss": -10.431303024291992, "global_step": 136033, "epoch": 809} {"train_loss": -10.407722473144531, "global_step": 136034, "epoch": 809} {"train_loss": -10.58033561706543, "global_step": 136035, "epoch": 809} {"train_loss": -10.58793830871582, "global_step": 136036, "epoch": 809} {"train_loss": -10.628931999206543, "global_step": 136037, "epoch": 809} {"train_loss": -10.565301895141602, "global_step": 136038, "epoch": 809} {"train_loss": -10.56872272491455, "global_step": 136039, "epoch": 809} {"train_loss": -10.733404159545898, "global_step": 136040, "epoch": 809} {"train_loss": -10.625957489013672, "global_step": 136041, "epoch": 809} {"train_loss": -10.799080848693848, "global_step": 136042, "epoch": 809} {"train_loss": -10.726529121398926, "global_step": 136043, "epoch": 809} {"train_loss": -10.334449768066406, "global_step": 136044, "epoch": 809} {"train_loss": -10.442988395690918, "global_step": 136045, "epoch": 809} {"train_loss": -10.283080101013184, "global_step": 136046, "epoch": 809} {"train_loss": -10.58271598815918, "global_step": 136047, "epoch": 809} {"train_loss": -10.270284652709961, "global_step": 136048, "epoch": 809} {"train_loss": -10.419717788696289, "global_step": 136049, "epoch": 809} {"train_loss": -10.77382755279541, "global_step": 136050, "epoch": 809} {"train_loss": -10.32119369506836, "global_step": 136051, "epoch": 809} {"train_loss": -10.325199127197266, "global_step": 136052, "epoch": 809} {"train_loss": -10.307928085327148, "global_step": 136053, "epoch": 809} {"train_loss": -10.028307914733887, "global_step": 136054, "epoch": 809} {"train_loss": -10.480327606201172, "global_step": 136055, "epoch": 809} {"train_loss": -10.089768409729004, "global_step": 136056, "epoch": 809} {"train_loss": -10.421714782714844, "global_step": 136057, "epoch": 809} {"train_loss": -10.443304061889648, "global_step": 136058, "epoch": 809} {"train_loss": -10.468949317932129, "global_step": 136059, "epoch": 809} {"train_loss": -10.723670959472656, "global_step": 136060, "epoch": 809} {"train_loss": -10.54745864868164, "global_step": 136061, "epoch": 809} {"train_loss": -10.282505989074707, "global_step": 136062, "epoch": 809} {"train_loss": -10.524324417114258, "global_step": 136063, "epoch": 809} {"train_loss": -10.351588249206543, "global_step": 136064, "epoch": 809} {"train_loss": -10.520021438598633, "global_step": 136065, "epoch": 809} {"train_loss": -10.627067565917969, "global_step": 136066, "epoch": 809} {"train_loss": -10.740137100219727, "global_step": 136067, "epoch": 809} {"train_loss": -10.49072551727295, "global_step": 136068, "epoch": 809} {"train_loss": -10.62983226776123, "global_step": 136069, "epoch": 809} {"train_loss": -10.44893741607666, "global_step": 136070, "epoch": 809} {"train_loss": -10.435371398925781, "global_step": 136071, "epoch": 809} {"train_loss": -10.636845588684082, "global_step": 136072, "epoch": 809} {"train_loss": -10.295795440673828, "global_step": 136073, "epoch": 809} {"train_loss": -10.515336990356445, "global_step": 136074, "epoch": 809} {"train_loss": -10.522289276123047, "global_step": 136075, "epoch": 809} {"train_loss": -10.519161224365234, "global_step": 136076, "epoch": 809} {"train_loss": -10.419229507446289, "global_step": 136077, "epoch": 809} {"train_loss": -10.57918930053711, "global_step": 136078, "epoch": 809} {"train_loss": -10.424748789696466, "global_step": 136079, "epoch": 809, "val_loss": 223954.484375} {"train_loss": -10.416312217712402, "global_step": 136080, "epoch": 810} {"train_loss": -10.618656158447266, "global_step": 136081, "epoch": 810} {"train_loss": -10.005728721618652, "global_step": 136082, "epoch": 810} {"train_loss": -10.46432113647461, "global_step": 136083, "epoch": 810} {"train_loss": -10.559720993041992, "global_step": 136084, "epoch": 810} {"train_loss": -10.085649490356445, "global_step": 136085, "epoch": 810} {"train_loss": -10.582014083862305, "global_step": 136086, "epoch": 810} {"train_loss": -10.195399284362793, "global_step": 136087, "epoch": 810} {"train_loss": -10.555902481079102, "global_step": 136088, "epoch": 810} {"train_loss": -10.113081932067871, "global_step": 136089, "epoch": 810} {"train_loss": -10.36928653717041, "global_step": 136090, "epoch": 810} {"train_loss": -10.550853729248047, "global_step": 136091, "epoch": 810} {"train_loss": -10.137334823608398, "global_step": 136092, "epoch": 810} {"train_loss": -10.705658912658691, "global_step": 136093, "epoch": 810} {"train_loss": -10.052873611450195, "global_step": 136094, "epoch": 810} {"train_loss": -10.316184997558594, "global_step": 136095, "epoch": 810} {"train_loss": -10.21352767944336, "global_step": 136096, "epoch": 810} {"train_loss": -9.677214622497559, "global_step": 136097, "epoch": 810} {"train_loss": -10.47146987915039, "global_step": 136098, "epoch": 810} {"train_loss": -10.158348083496094, "global_step": 136099, "epoch": 810} {"train_loss": -10.25379753112793, "global_step": 136100, "epoch": 810} {"train_loss": -10.103215217590332, "global_step": 136101, "epoch": 810} {"train_loss": -10.142793655395508, "global_step": 136102, "epoch": 810} {"train_loss": -10.224893569946289, "global_step": 136103, "epoch": 810} {"train_loss": -10.393950462341309, "global_step": 136104, "epoch": 810} {"train_loss": -10.131002426147461, "global_step": 136105, "epoch": 810} {"train_loss": -10.487218856811523, "global_step": 136106, "epoch": 810} {"train_loss": -10.44599437713623, "global_step": 136107, "epoch": 810} {"train_loss": -10.34882640838623, "global_step": 136108, "epoch": 810} {"train_loss": -10.462584495544434, "global_step": 136109, "epoch": 810} {"train_loss": -10.131448745727539, "global_step": 136110, "epoch": 810} {"train_loss": -10.497014045715332, "global_step": 136111, "epoch": 810} {"train_loss": -10.274856567382812, "global_step": 136112, "epoch": 810} {"train_loss": -10.268745422363281, "global_step": 136113, "epoch": 810} {"train_loss": -10.28717041015625, "global_step": 136114, "epoch": 810} {"train_loss": -10.37215805053711, "global_step": 136115, "epoch": 810} {"train_loss": -10.420978546142578, "global_step": 136116, "epoch": 810} {"train_loss": -10.709480285644531, "global_step": 136117, "epoch": 810} {"train_loss": -10.292585372924805, "global_step": 136118, "epoch": 810} {"train_loss": -10.535879135131836, "global_step": 136119, "epoch": 810} {"train_loss": -10.578630447387695, "global_step": 136120, "epoch": 810} {"train_loss": -10.117565155029297, "global_step": 136121, "epoch": 810} {"train_loss": -10.476508140563965, "global_step": 136122, "epoch": 810} {"train_loss": -10.484204292297363, "global_step": 136123, "epoch": 810} {"train_loss": -10.445955276489258, "global_step": 136124, "epoch": 810} {"train_loss": -10.018074035644531, "global_step": 136125, "epoch": 810} {"train_loss": -10.010541915893555, "global_step": 136126, "epoch": 810} {"train_loss": -10.028997421264648, "global_step": 136127, "epoch": 810} {"train_loss": -10.387594223022461, "global_step": 136128, "epoch": 810} {"train_loss": -9.802879333496094, "global_step": 136129, "epoch": 810} {"train_loss": -10.150003433227539, "global_step": 136130, "epoch": 810} {"train_loss": -10.318941116333008, "global_step": 136131, "epoch": 810} {"train_loss": -9.9542236328125, "global_step": 136132, "epoch": 810} {"train_loss": -10.257207870483398, "global_step": 136133, "epoch": 810} {"train_loss": -10.22031021118164, "global_step": 136134, "epoch": 810} {"train_loss": -9.705281257629395, "global_step": 136135, "epoch": 810} {"train_loss": -10.298843383789062, "global_step": 136136, "epoch": 810} {"train_loss": -10.189682006835938, "global_step": 136137, "epoch": 810} {"train_loss": -10.209388732910156, "global_step": 136138, "epoch": 810} {"train_loss": -10.201809883117676, "global_step": 136139, "epoch": 810} {"train_loss": -10.3260498046875, "global_step": 136140, "epoch": 810} {"train_loss": -10.195365905761719, "global_step": 136141, "epoch": 810} {"train_loss": -10.338726997375488, "global_step": 136142, "epoch": 810} {"train_loss": -10.459226608276367, "global_step": 136143, "epoch": 810} {"train_loss": -10.540637969970703, "global_step": 136144, "epoch": 810} {"train_loss": -10.441143989562988, "global_step": 136145, "epoch": 810} {"train_loss": -10.307119369506836, "global_step": 136146, "epoch": 810} {"train_loss": -10.350264549255371, "global_step": 136147, "epoch": 810} {"train_loss": -10.546516418457031, "global_step": 136148, "epoch": 810} {"train_loss": -10.44245433807373, "global_step": 136149, "epoch": 810} {"train_loss": -10.515741348266602, "global_step": 136150, "epoch": 810} {"train_loss": -10.262036323547363, "global_step": 136151, "epoch": 810} {"train_loss": -10.646514892578125, "global_step": 136152, "epoch": 810} {"train_loss": -10.596515655517578, "global_step": 136153, "epoch": 810} {"train_loss": -10.623756408691406, "global_step": 136154, "epoch": 810} {"train_loss": -10.233902931213379, "global_step": 136155, "epoch": 810} {"train_loss": -10.732271194458008, "global_step": 136156, "epoch": 810} {"train_loss": -10.514288902282715, "global_step": 136157, "epoch": 810} {"train_loss": -10.559059143066406, "global_step": 136158, "epoch": 810} {"train_loss": -10.507144927978516, "global_step": 136159, "epoch": 810} {"train_loss": -10.776424407958984, "global_step": 136160, "epoch": 810} {"train_loss": -10.703720092773438, "global_step": 136161, "epoch": 810} {"train_loss": -10.56674575805664, "global_step": 136162, "epoch": 810} {"train_loss": -10.760366439819336, "global_step": 136163, "epoch": 810} {"train_loss": -10.43008041381836, "global_step": 136164, "epoch": 810} {"train_loss": -10.719341278076172, "global_step": 136165, "epoch": 810} {"train_loss": -10.654595375061035, "global_step": 136166, "epoch": 810} {"train_loss": -10.38951301574707, "global_step": 136167, "epoch": 810} {"train_loss": -10.606426239013672, "global_step": 136168, "epoch": 810} {"train_loss": -10.545942306518555, "global_step": 136169, "epoch": 810} {"train_loss": -10.407815933227539, "global_step": 136170, "epoch": 810} {"train_loss": -10.636043548583984, "global_step": 136171, "epoch": 810} {"train_loss": -10.583678245544434, "global_step": 136172, "epoch": 810} {"train_loss": -10.706933975219727, "global_step": 136173, "epoch": 810} {"train_loss": -10.671133041381836, "global_step": 136174, "epoch": 810} {"train_loss": -10.631155967712402, "global_step": 136175, "epoch": 810} {"train_loss": -10.566884994506836, "global_step": 136176, "epoch": 810} {"train_loss": -10.584797859191895, "global_step": 136177, "epoch": 810} {"train_loss": -10.698709487915039, "global_step": 136178, "epoch": 810} {"train_loss": -10.335617065429688, "global_step": 136179, "epoch": 810} {"train_loss": -10.892843246459961, "global_step": 136180, "epoch": 810} {"train_loss": -10.364358901977539, "global_step": 136181, "epoch": 810} {"train_loss": -10.530171394348145, "global_step": 136182, "epoch": 810} {"train_loss": -10.590433120727539, "global_step": 136183, "epoch": 810} {"train_loss": -10.116662979125977, "global_step": 136184, "epoch": 810} {"train_loss": -10.15553092956543, "global_step": 136185, "epoch": 810} {"train_loss": -10.407328605651855, "global_step": 136186, "epoch": 810} {"train_loss": -10.330099105834961, "global_step": 136187, "epoch": 810} {"train_loss": -10.400857925415039, "global_step": 136188, "epoch": 810} {"train_loss": -10.12348747253418, "global_step": 136189, "epoch": 810} {"train_loss": -9.991928100585938, "global_step": 136190, "epoch": 810} {"train_loss": -10.591585159301758, "global_step": 136191, "epoch": 810} {"train_loss": -10.407693862915039, "global_step": 136192, "epoch": 810} {"train_loss": -10.543638229370117, "global_step": 136193, "epoch": 810} {"train_loss": -10.261072158813477, "global_step": 136194, "epoch": 810} {"train_loss": -10.52743911743164, "global_step": 136195, "epoch": 810} {"train_loss": -10.622444152832031, "global_step": 136196, "epoch": 810} {"train_loss": -10.611721992492676, "global_step": 136197, "epoch": 810} {"train_loss": -10.619699478149414, "global_step": 136198, "epoch": 810} {"train_loss": -10.38054084777832, "global_step": 136199, "epoch": 810} {"train_loss": -10.484870910644531, "global_step": 136200, "epoch": 810} {"train_loss": -10.771098136901855, "global_step": 136201, "epoch": 810} {"train_loss": -10.60289478302002, "global_step": 136202, "epoch": 810} {"train_loss": -10.656047821044922, "global_step": 136203, "epoch": 810} {"train_loss": -10.587526321411133, "global_step": 136204, "epoch": 810} {"train_loss": -10.600152015686035, "global_step": 136205, "epoch": 810} {"train_loss": -10.146524429321289, "global_step": 136206, "epoch": 810} {"train_loss": -10.718080520629883, "global_step": 136207, "epoch": 810} {"train_loss": -10.500404357910156, "global_step": 136208, "epoch": 810} {"train_loss": -10.492443084716797, "global_step": 136209, "epoch": 810} {"train_loss": -10.701125144958496, "global_step": 136210, "epoch": 810} {"train_loss": -10.568307876586914, "global_step": 136211, "epoch": 810} {"train_loss": -10.566838264465332, "global_step": 136212, "epoch": 810} {"train_loss": -10.70055866241455, "global_step": 136213, "epoch": 810} {"train_loss": -10.55447769165039, "global_step": 136214, "epoch": 810} {"train_loss": -10.495168685913086, "global_step": 136215, "epoch": 810} {"train_loss": -10.722963333129883, "global_step": 136216, "epoch": 810} {"train_loss": -10.43203353881836, "global_step": 136217, "epoch": 810} {"train_loss": -10.142839431762695, "global_step": 136218, "epoch": 810} {"train_loss": -10.643878936767578, "global_step": 136219, "epoch": 810} {"train_loss": -10.231254577636719, "global_step": 136220, "epoch": 810} {"train_loss": -10.472818374633789, "global_step": 136221, "epoch": 810} {"train_loss": -10.445518493652344, "global_step": 136222, "epoch": 810} {"train_loss": -10.826566696166992, "global_step": 136223, "epoch": 810} {"train_loss": -10.33789348602295, "global_step": 136224, "epoch": 810} {"train_loss": -10.53270149230957, "global_step": 136225, "epoch": 810} {"train_loss": -10.696084976196289, "global_step": 136226, "epoch": 810} {"train_loss": -10.79664421081543, "global_step": 136227, "epoch": 810} {"train_loss": -10.522515296936035, "global_step": 136228, "epoch": 810} {"train_loss": -10.760692596435547, "global_step": 136229, "epoch": 810} {"train_loss": -10.627103805541992, "global_step": 136230, "epoch": 810} {"train_loss": -10.694379806518555, "global_step": 136231, "epoch": 810} {"train_loss": -10.711494445800781, "global_step": 136232, "epoch": 810} {"train_loss": -10.839996337890625, "global_step": 136233, "epoch": 810} {"train_loss": -10.529708862304688, "global_step": 136234, "epoch": 810} {"train_loss": -11.013458251953125, "global_step": 136235, "epoch": 810} {"train_loss": -10.690864562988281, "global_step": 136236, "epoch": 810} {"train_loss": -10.583794593811035, "global_step": 136237, "epoch": 810} {"train_loss": -10.826062202453613, "global_step": 136238, "epoch": 810} {"train_loss": -10.68282699584961, "global_step": 136239, "epoch": 810} {"train_loss": -10.412395477294922, "global_step": 136240, "epoch": 810} {"train_loss": -10.252914428710938, "global_step": 136241, "epoch": 810} {"train_loss": -10.45384407043457, "global_step": 136242, "epoch": 810} {"train_loss": -9.861597061157227, "global_step": 136243, "epoch": 810} {"train_loss": -10.262192726135254, "global_step": 136244, "epoch": 810} {"train_loss": -10.481815338134766, "global_step": 136245, "epoch": 810} {"train_loss": -9.860197067260742, "global_step": 136246, "epoch": 810} {"train_loss": -10.427961008889335, "global_step": 136247, "epoch": 810, "val_loss": 221551.203125, "train_action_mse_error": 1.518221139907837} {"train_loss": -10.585920333862305, "global_step": 136248, "epoch": 811} {"train_loss": -10.086202621459961, "global_step": 136249, "epoch": 811} {"train_loss": -9.715105056762695, "global_step": 136250, "epoch": 811} {"train_loss": -10.516866683959961, "global_step": 136251, "epoch": 811} {"train_loss": -10.288771629333496, "global_step": 136252, "epoch": 811} {"train_loss": -10.234333038330078, "global_step": 136253, "epoch": 811} {"train_loss": -10.119868278503418, "global_step": 136254, "epoch": 811} {"train_loss": -10.25752067565918, "global_step": 136255, "epoch": 811} {"train_loss": -9.734953880310059, "global_step": 136256, "epoch": 811} {"train_loss": -10.33618450164795, "global_step": 136257, "epoch": 811} {"train_loss": -10.357847213745117, "global_step": 136258, "epoch": 811} {"train_loss": -9.954177856445312, "global_step": 136259, "epoch": 811} {"train_loss": -10.418525695800781, "global_step": 136260, "epoch": 811} {"train_loss": -9.96386432647705, "global_step": 136261, "epoch": 811} {"train_loss": -10.239153861999512, "global_step": 136262, "epoch": 811} {"train_loss": -10.115241050720215, "global_step": 136263, "epoch": 811} {"train_loss": -10.358741760253906, "global_step": 136264, "epoch": 811} {"train_loss": -10.193845748901367, "global_step": 136265, "epoch": 811} {"train_loss": -10.31831169128418, "global_step": 136266, "epoch": 811} {"train_loss": -10.12618350982666, "global_step": 136267, "epoch": 811} {"train_loss": -10.622221946716309, "global_step": 136268, "epoch": 811} {"train_loss": -10.380887985229492, "global_step": 136269, "epoch": 811} {"train_loss": -10.456947326660156, "global_step": 136270, "epoch": 811} {"train_loss": -10.367997169494629, "global_step": 136271, "epoch": 811} {"train_loss": -10.281023025512695, "global_step": 136272, "epoch": 811} {"train_loss": -9.954950332641602, "global_step": 136273, "epoch": 811} {"train_loss": -10.386265754699707, "global_step": 136274, "epoch": 811} {"train_loss": -10.388044357299805, "global_step": 136275, "epoch": 811} {"train_loss": -10.236900329589844, "global_step": 136276, "epoch": 811} {"train_loss": -10.016866683959961, "global_step": 136277, "epoch": 811} {"train_loss": -10.174192428588867, "global_step": 136278, "epoch": 811} {"train_loss": -10.096037864685059, "global_step": 136279, "epoch": 811} {"train_loss": -10.104911804199219, "global_step": 136280, "epoch": 811} {"train_loss": -10.160085678100586, "global_step": 136281, "epoch": 811} {"train_loss": -10.292213439941406, "global_step": 136282, "epoch": 811} {"train_loss": -10.269952774047852, "global_step": 136283, "epoch": 811} {"train_loss": -10.698622703552246, "global_step": 136284, "epoch": 811} {"train_loss": -10.446552276611328, "global_step": 136285, "epoch": 811} {"train_loss": -10.538512229919434, "global_step": 136286, "epoch": 811} {"train_loss": -10.378064155578613, "global_step": 136287, "epoch": 811} {"train_loss": -10.276912689208984, "global_step": 136288, "epoch": 811} {"train_loss": -10.766463279724121, "global_step": 136289, "epoch": 811} {"train_loss": -10.711122512817383, "global_step": 136290, "epoch": 811} {"train_loss": -10.609024047851562, "global_step": 136291, "epoch": 811} {"train_loss": -10.668790817260742, "global_step": 136292, "epoch": 811} {"train_loss": -10.61299991607666, "global_step": 136293, "epoch": 811} {"train_loss": -10.347702026367188, "global_step": 136294, "epoch": 811} {"train_loss": -10.49909782409668, "global_step": 136295, "epoch": 811} {"train_loss": -10.385671615600586, "global_step": 136296, "epoch": 811} {"train_loss": -10.542728424072266, "global_step": 136297, "epoch": 811} {"train_loss": -10.674238204956055, "global_step": 136298, "epoch": 811} {"train_loss": -10.5680513381958, "global_step": 136299, "epoch": 811} {"train_loss": -10.715600967407227, "global_step": 136300, "epoch": 811} {"train_loss": -10.501518249511719, "global_step": 136301, "epoch": 811} {"train_loss": -10.912421226501465, "global_step": 136302, "epoch": 811} {"train_loss": -10.697071075439453, "global_step": 136303, "epoch": 811} {"train_loss": -10.862640380859375, "global_step": 136304, "epoch": 811} {"train_loss": -10.778680801391602, "global_step": 136305, "epoch": 811} {"train_loss": -10.453813552856445, "global_step": 136306, "epoch": 811} {"train_loss": -10.751792907714844, "global_step": 136307, "epoch": 811} {"train_loss": -10.784634590148926, "global_step": 136308, "epoch": 811} {"train_loss": -10.677558898925781, "global_step": 136309, "epoch": 811} {"train_loss": -10.890470504760742, "global_step": 136310, "epoch": 811} {"train_loss": -10.6984281539917, "global_step": 136311, "epoch": 811} {"train_loss": -10.94603157043457, "global_step": 136312, "epoch": 811} {"train_loss": -10.643043518066406, "global_step": 136313, "epoch": 811} {"train_loss": -10.655437469482422, "global_step": 136314, "epoch": 811} {"train_loss": -10.908777236938477, "global_step": 136315, "epoch": 811} {"train_loss": -10.457502365112305, "global_step": 136316, "epoch": 811} {"train_loss": -10.642631530761719, "global_step": 136317, "epoch": 811} {"train_loss": -10.457239151000977, "global_step": 136318, "epoch": 811} {"train_loss": -10.353670120239258, "global_step": 136319, "epoch": 811} {"train_loss": -10.29418659210205, "global_step": 136320, "epoch": 811} {"train_loss": -10.540443420410156, "global_step": 136321, "epoch": 811} {"train_loss": -10.390300750732422, "global_step": 136322, "epoch": 811} {"train_loss": -10.659830093383789, "global_step": 136323, "epoch": 811} {"train_loss": -10.670431137084961, "global_step": 136324, "epoch": 811} {"train_loss": -10.30594539642334, "global_step": 136325, "epoch": 811} {"train_loss": -10.229856491088867, "global_step": 136326, "epoch": 811} {"train_loss": -10.565845489501953, "global_step": 136327, "epoch": 811} {"train_loss": -10.103049278259277, "global_step": 136328, "epoch": 811} {"train_loss": -10.555596351623535, "global_step": 136329, "epoch": 811} {"train_loss": -10.614908218383789, "global_step": 136330, "epoch": 811} {"train_loss": -10.31853199005127, "global_step": 136331, "epoch": 811} {"train_loss": -10.303431510925293, "global_step": 136332, "epoch": 811} {"train_loss": -10.433586120605469, "global_step": 136333, "epoch": 811} {"train_loss": -9.858428955078125, "global_step": 136334, "epoch": 811} {"train_loss": -10.570268630981445, "global_step": 136335, "epoch": 811} {"train_loss": -10.519662857055664, "global_step": 136336, "epoch": 811} {"train_loss": -10.335424423217773, "global_step": 136337, "epoch": 811} {"train_loss": -10.520895004272461, "global_step": 136338, "epoch": 811} {"train_loss": -10.591078758239746, "global_step": 136339, "epoch": 811} {"train_loss": -10.401362419128418, "global_step": 136340, "epoch": 811} {"train_loss": -10.104917526245117, "global_step": 136341, "epoch": 811} {"train_loss": -10.757619857788086, "global_step": 136342, "epoch": 811} {"train_loss": -10.425384521484375, "global_step": 136343, "epoch": 811} {"train_loss": -10.410994529724121, "global_step": 136344, "epoch": 811} {"train_loss": -10.582169532775879, "global_step": 136345, "epoch": 811} {"train_loss": -10.448555946350098, "global_step": 136346, "epoch": 811} {"train_loss": -10.634209632873535, "global_step": 136347, "epoch": 811} {"train_loss": -10.56364631652832, "global_step": 136348, "epoch": 811} {"train_loss": -10.611227035522461, "global_step": 136349, "epoch": 811} {"train_loss": -10.505340576171875, "global_step": 136350, "epoch": 811} {"train_loss": -10.490039825439453, "global_step": 136351, "epoch": 811} {"train_loss": -10.603462219238281, "global_step": 136352, "epoch": 811} {"train_loss": -10.67007064819336, "global_step": 136353, "epoch": 811} {"train_loss": -10.529524803161621, "global_step": 136354, "epoch": 811} {"train_loss": -10.659673690795898, "global_step": 136355, "epoch": 811} {"train_loss": -10.424280166625977, "global_step": 136356, "epoch": 811} {"train_loss": -10.691143035888672, "global_step": 136357, "epoch": 811} {"train_loss": -10.55184555053711, "global_step": 136358, "epoch": 811} {"train_loss": -10.421030044555664, "global_step": 136359, "epoch": 811} {"train_loss": -10.498652458190918, "global_step": 136360, "epoch": 811} {"train_loss": -10.85865306854248, "global_step": 136361, "epoch": 811} {"train_loss": -9.936147689819336, "global_step": 136362, "epoch": 811} {"train_loss": -10.57203197479248, "global_step": 136363, "epoch": 811} {"train_loss": -10.453210830688477, "global_step": 136364, "epoch": 811} {"train_loss": -10.276538848876953, "global_step": 136365, "epoch": 811} {"train_loss": -10.676055908203125, "global_step": 136366, "epoch": 811} {"train_loss": -10.071943283081055, "global_step": 136367, "epoch": 811} {"train_loss": -10.50965690612793, "global_step": 136368, "epoch": 811} {"train_loss": -10.630382537841797, "global_step": 136369, "epoch": 811} {"train_loss": -10.25788402557373, "global_step": 136370, "epoch": 811} {"train_loss": -10.501514434814453, "global_step": 136371, "epoch": 811} {"train_loss": -10.464594841003418, "global_step": 136372, "epoch": 811} {"train_loss": -10.209760665893555, "global_step": 136373, "epoch": 811} {"train_loss": -10.512280464172363, "global_step": 136374, "epoch": 811} {"train_loss": -9.751301765441895, "global_step": 136375, "epoch": 811} {"train_loss": -10.21809196472168, "global_step": 136376, "epoch": 811} {"train_loss": -10.062480926513672, "global_step": 136377, "epoch": 811} {"train_loss": -10.405954360961914, "global_step": 136378, "epoch": 811} {"train_loss": -10.021200180053711, "global_step": 136379, "epoch": 811} {"train_loss": -10.773021697998047, "global_step": 136380, "epoch": 811} {"train_loss": -9.856406211853027, "global_step": 136381, "epoch": 811} {"train_loss": -10.54254150390625, "global_step": 136382, "epoch": 811} {"train_loss": -10.462129592895508, "global_step": 136383, "epoch": 811} {"train_loss": -10.355001449584961, "global_step": 136384, "epoch": 811} {"train_loss": -10.247550964355469, "global_step": 136385, "epoch": 811} {"train_loss": -10.60982894897461, "global_step": 136386, "epoch": 811} {"train_loss": -10.353243827819824, "global_step": 136387, "epoch": 811} {"train_loss": -10.358505249023438, "global_step": 136388, "epoch": 811} {"train_loss": -10.30253791809082, "global_step": 136389, "epoch": 811} {"train_loss": -10.38296127319336, "global_step": 136390, "epoch": 811} {"train_loss": -10.323456764221191, "global_step": 136391, "epoch": 811} {"train_loss": -10.394783973693848, "global_step": 136392, "epoch": 811} {"train_loss": -10.068487167358398, "global_step": 136393, "epoch": 811} {"train_loss": -10.445350646972656, "global_step": 136394, "epoch": 811} {"train_loss": -10.214639663696289, "global_step": 136395, "epoch": 811} {"train_loss": -10.46615982055664, "global_step": 136396, "epoch": 811} {"train_loss": -10.451598167419434, "global_step": 136397, "epoch": 811} {"train_loss": -10.120152473449707, "global_step": 136398, "epoch": 811} {"train_loss": -10.442381858825684, "global_step": 136399, "epoch": 811} {"train_loss": -10.333367347717285, "global_step": 136400, "epoch": 811} {"train_loss": -10.324277877807617, "global_step": 136401, "epoch": 811} {"train_loss": -10.662277221679688, "global_step": 136402, "epoch": 811} {"train_loss": -10.11509895324707, "global_step": 136403, "epoch": 811} {"train_loss": -10.613842010498047, "global_step": 136404, "epoch": 811} {"train_loss": -10.61288833618164, "global_step": 136405, "epoch": 811} {"train_loss": -10.40478801727295, "global_step": 136406, "epoch": 811} {"train_loss": -10.627965927124023, "global_step": 136407, "epoch": 811} {"train_loss": -10.683855056762695, "global_step": 136408, "epoch": 811} {"train_loss": -10.67210865020752, "global_step": 136409, "epoch": 811} {"train_loss": -10.46639347076416, "global_step": 136410, "epoch": 811} {"train_loss": -10.689555168151855, "global_step": 136411, "epoch": 811} {"train_loss": -10.541095733642578, "global_step": 136412, "epoch": 811} {"train_loss": -10.61387825012207, "global_step": 136413, "epoch": 811} {"train_loss": -10.739583969116211, "global_step": 136414, "epoch": 811} {"train_loss": -10.429424757049198, "global_step": 136415, "epoch": 811, "val_loss": 221916.609375} {"train_loss": -10.761494636535645, "global_step": 136416, "epoch": 812} {"train_loss": -10.443864822387695, "global_step": 136417, "epoch": 812} {"train_loss": -10.681388854980469, "global_step": 136418, "epoch": 812} {"train_loss": -10.899248123168945, "global_step": 136419, "epoch": 812} {"train_loss": -10.490154266357422, "global_step": 136420, "epoch": 812} {"train_loss": -10.580394744873047, "global_step": 136421, "epoch": 812} {"train_loss": -10.827902793884277, "global_step": 136422, "epoch": 812} {"train_loss": -10.632696151733398, "global_step": 136423, "epoch": 812} {"train_loss": -10.634842872619629, "global_step": 136424, "epoch": 812} {"train_loss": -10.680967330932617, "global_step": 136425, "epoch": 812} {"train_loss": -10.670838356018066, "global_step": 136426, "epoch": 812} {"train_loss": -10.225738525390625, "global_step": 136427, "epoch": 812} {"train_loss": -10.787043571472168, "global_step": 136428, "epoch": 812} {"train_loss": -10.483321189880371, "global_step": 136429, "epoch": 812} {"train_loss": -10.515643119812012, "global_step": 136430, "epoch": 812} {"train_loss": -10.696414947509766, "global_step": 136431, "epoch": 812} {"train_loss": -10.526679039001465, "global_step": 136432, "epoch": 812} {"train_loss": -10.782854080200195, "global_step": 136433, "epoch": 812} {"train_loss": -10.630533218383789, "global_step": 136434, "epoch": 812} {"train_loss": -10.711301803588867, "global_step": 136435, "epoch": 812} {"train_loss": -10.833839416503906, "global_step": 136436, "epoch": 812} {"train_loss": -10.839652061462402, "global_step": 136437, "epoch": 812} {"train_loss": -10.510810852050781, "global_step": 136438, "epoch": 812} {"train_loss": -10.625740051269531, "global_step": 136439, "epoch": 812} {"train_loss": -10.640096664428711, "global_step": 136440, "epoch": 812} {"train_loss": -10.459447860717773, "global_step": 136441, "epoch": 812} {"train_loss": -10.683959007263184, "global_step": 136442, "epoch": 812} {"train_loss": -10.74275016784668, "global_step": 136443, "epoch": 812} {"train_loss": -11.052711486816406, "global_step": 136444, "epoch": 812} {"train_loss": -10.712606430053711, "global_step": 136445, "epoch": 812} {"train_loss": -10.708189010620117, "global_step": 136446, "epoch": 812} {"train_loss": -10.611862182617188, "global_step": 136447, "epoch": 812} {"train_loss": -10.705340385437012, "global_step": 136448, "epoch": 812} {"train_loss": -10.980846405029297, "global_step": 136449, "epoch": 812} {"train_loss": -10.409515380859375, "global_step": 136450, "epoch": 812} {"train_loss": -10.772746086120605, "global_step": 136451, "epoch": 812} {"train_loss": -10.309344291687012, "global_step": 136452, "epoch": 812} {"train_loss": -10.756677627563477, "global_step": 136453, "epoch": 812} {"train_loss": -10.575597763061523, "global_step": 136454, "epoch": 812} {"train_loss": -10.753104209899902, "global_step": 136455, "epoch": 812} {"train_loss": -10.448883056640625, "global_step": 136456, "epoch": 812} {"train_loss": -10.775382995605469, "global_step": 136457, "epoch": 812} {"train_loss": -10.595287322998047, "global_step": 136458, "epoch": 812} {"train_loss": -10.797090530395508, "global_step": 136459, "epoch": 812} {"train_loss": -10.528176307678223, "global_step": 136460, "epoch": 812} {"train_loss": -10.509086608886719, "global_step": 136461, "epoch": 812} {"train_loss": -10.762224197387695, "global_step": 136462, "epoch": 812} {"train_loss": -10.665287017822266, "global_step": 136463, "epoch": 812} {"train_loss": -10.323660850524902, "global_step": 136464, "epoch": 812} {"train_loss": -10.54100227355957, "global_step": 136465, "epoch": 812} {"train_loss": -10.662885665893555, "global_step": 136466, "epoch": 812} {"train_loss": -10.866462707519531, "global_step": 136467, "epoch": 812} {"train_loss": -10.389856338500977, "global_step": 136468, "epoch": 812} {"train_loss": -10.774129867553711, "global_step": 136469, "epoch": 812} {"train_loss": -10.55917739868164, "global_step": 136470, "epoch": 812} {"train_loss": -10.351583480834961, "global_step": 136471, "epoch": 812} {"train_loss": -10.13282585144043, "global_step": 136472, "epoch": 812} {"train_loss": -10.829940795898438, "global_step": 136473, "epoch": 812} {"train_loss": -10.522883415222168, "global_step": 136474, "epoch": 812} {"train_loss": -10.383432388305664, "global_step": 136475, "epoch": 812} {"train_loss": -10.839094161987305, "global_step": 136476, "epoch": 812} {"train_loss": -10.642265319824219, "global_step": 136477, "epoch": 812} {"train_loss": -10.398502349853516, "global_step": 136478, "epoch": 812} {"train_loss": -10.756978034973145, "global_step": 136479, "epoch": 812} {"train_loss": -10.467421531677246, "global_step": 136480, "epoch": 812} {"train_loss": -10.668323516845703, "global_step": 136481, "epoch": 812} {"train_loss": -10.55697250366211, "global_step": 136482, "epoch": 812} {"train_loss": -10.589879989624023, "global_step": 136483, "epoch": 812} {"train_loss": -10.48119068145752, "global_step": 136484, "epoch": 812} {"train_loss": -10.6280517578125, "global_step": 136485, "epoch": 812} {"train_loss": -10.6507568359375, "global_step": 136486, "epoch": 812} {"train_loss": -10.454345703125, "global_step": 136487, "epoch": 812} {"train_loss": -10.627579689025879, "global_step": 136488, "epoch": 812} {"train_loss": -10.57436466217041, "global_step": 136489, "epoch": 812} {"train_loss": -10.753833770751953, "global_step": 136490, "epoch": 812} {"train_loss": -10.673885345458984, "global_step": 136491, "epoch": 812} {"train_loss": -10.487768173217773, "global_step": 136492, "epoch": 812} {"train_loss": -10.633281707763672, "global_step": 136493, "epoch": 812} {"train_loss": -10.744061470031738, "global_step": 136494, "epoch": 812} {"train_loss": -10.905614852905273, "global_step": 136495, "epoch": 812} {"train_loss": -10.518353462219238, "global_step": 136496, "epoch": 812} {"train_loss": -10.436290740966797, "global_step": 136497, "epoch": 812} {"train_loss": -10.58521842956543, "global_step": 136498, "epoch": 812} {"train_loss": -10.783173561096191, "global_step": 136499, "epoch": 812} {"train_loss": -10.67595100402832, "global_step": 136500, "epoch": 812} {"train_loss": -10.486515045166016, "global_step": 136501, "epoch": 812} {"train_loss": -10.44793701171875, "global_step": 136502, "epoch": 812} {"train_loss": -10.131230354309082, "global_step": 136503, "epoch": 812} {"train_loss": -10.466554641723633, "global_step": 136504, "epoch": 812} {"train_loss": -9.664114952087402, "global_step": 136505, "epoch": 812} {"train_loss": -9.670191764831543, "global_step": 136506, "epoch": 812} {"train_loss": -10.361408233642578, "global_step": 136507, "epoch": 812} {"train_loss": -10.386407852172852, "global_step": 136508, "epoch": 812} {"train_loss": -10.073144912719727, "global_step": 136509, "epoch": 812} {"train_loss": -10.572500228881836, "global_step": 136510, "epoch": 812} {"train_loss": -9.873014450073242, "global_step": 136511, "epoch": 812} {"train_loss": -10.107022285461426, "global_step": 136512, "epoch": 812} {"train_loss": -9.913251876831055, "global_step": 136513, "epoch": 812} {"train_loss": -9.829723358154297, "global_step": 136514, "epoch": 812} {"train_loss": -10.310934066772461, "global_step": 136515, "epoch": 812} {"train_loss": -9.772680282592773, "global_step": 136516, "epoch": 812} {"train_loss": -10.024925231933594, "global_step": 136517, "epoch": 812} {"train_loss": -10.136476516723633, "global_step": 136518, "epoch": 812} {"train_loss": -10.143606185913086, "global_step": 136519, "epoch": 812} {"train_loss": -10.358742713928223, "global_step": 136520, "epoch": 812} {"train_loss": -10.408976554870605, "global_step": 136521, "epoch": 812} {"train_loss": -10.360452651977539, "global_step": 136522, "epoch": 812} {"train_loss": -10.243553161621094, "global_step": 136523, "epoch": 812} {"train_loss": -10.210973739624023, "global_step": 136524, "epoch": 812} {"train_loss": -10.204299926757812, "global_step": 136525, "epoch": 812} {"train_loss": -10.446694374084473, "global_step": 136526, "epoch": 812} {"train_loss": -10.559791564941406, "global_step": 136527, "epoch": 812} {"train_loss": -10.424723625183105, "global_step": 136528, "epoch": 812} {"train_loss": -10.634897232055664, "global_step": 136529, "epoch": 812} {"train_loss": -10.437247276306152, "global_step": 136530, "epoch": 812} {"train_loss": -10.669952392578125, "global_step": 136531, "epoch": 812} {"train_loss": -10.544465065002441, "global_step": 136532, "epoch": 812} {"train_loss": -10.564455032348633, "global_step": 136533, "epoch": 812} {"train_loss": -10.533416748046875, "global_step": 136534, "epoch": 812} {"train_loss": -10.677192687988281, "global_step": 136535, "epoch": 812} {"train_loss": -10.38058853149414, "global_step": 136536, "epoch": 812} {"train_loss": -10.254127502441406, "global_step": 136537, "epoch": 812} {"train_loss": -10.611492156982422, "global_step": 136538, "epoch": 812} {"train_loss": -10.4838228225708, "global_step": 136539, "epoch": 812} {"train_loss": -10.41183090209961, "global_step": 136540, "epoch": 812} {"train_loss": -10.375368118286133, "global_step": 136541, "epoch": 812} {"train_loss": -10.787721633911133, "global_step": 136542, "epoch": 812} {"train_loss": -10.570793151855469, "global_step": 136543, "epoch": 812} {"train_loss": -10.431329727172852, "global_step": 136544, "epoch": 812} {"train_loss": -10.321934700012207, "global_step": 136545, "epoch": 812} {"train_loss": -10.53532600402832, "global_step": 136546, "epoch": 812} {"train_loss": -10.458067893981934, "global_step": 136547, "epoch": 812} {"train_loss": -10.561111450195312, "global_step": 136548, "epoch": 812} {"train_loss": -10.57703685760498, "global_step": 136549, "epoch": 812} {"train_loss": -10.448777198791504, "global_step": 136550, "epoch": 812} {"train_loss": -10.815932273864746, "global_step": 136551, "epoch": 812} {"train_loss": -10.46060562133789, "global_step": 136552, "epoch": 812} {"train_loss": -10.913814544677734, "global_step": 136553, "epoch": 812} {"train_loss": -10.591228485107422, "global_step": 136554, "epoch": 812} {"train_loss": -10.602095603942871, "global_step": 136555, "epoch": 812} {"train_loss": -10.704690933227539, "global_step": 136556, "epoch": 812} {"train_loss": -10.201274871826172, "global_step": 136557, "epoch": 812} {"train_loss": -10.597894668579102, "global_step": 136558, "epoch": 812} {"train_loss": -10.7154541015625, "global_step": 136559, "epoch": 812} {"train_loss": -10.514809608459473, "global_step": 136560, "epoch": 812} {"train_loss": -10.495487213134766, "global_step": 136561, "epoch": 812} {"train_loss": -10.54601001739502, "global_step": 136562, "epoch": 812} {"train_loss": -10.536837577819824, "global_step": 136563, "epoch": 812} {"train_loss": -10.19200611114502, "global_step": 136564, "epoch": 812} {"train_loss": -10.88762092590332, "global_step": 136565, "epoch": 812} {"train_loss": -10.173347473144531, "global_step": 136566, "epoch": 812} {"train_loss": -10.73291301727295, "global_step": 136567, "epoch": 812} {"train_loss": -10.5933256149292, "global_step": 136568, "epoch": 812} {"train_loss": -10.403423309326172, "global_step": 136569, "epoch": 812} {"train_loss": -10.584895133972168, "global_step": 136570, "epoch": 812} {"train_loss": -10.550070762634277, "global_step": 136571, "epoch": 812} {"train_loss": -10.839595794677734, "global_step": 136572, "epoch": 812} {"train_loss": -10.571830749511719, "global_step": 136573, "epoch": 812} {"train_loss": -10.67829704284668, "global_step": 136574, "epoch": 812} {"train_loss": -10.611112594604492, "global_step": 136575, "epoch": 812} {"train_loss": -10.61367416381836, "global_step": 136576, "epoch": 812} {"train_loss": -10.608712196350098, "global_step": 136577, "epoch": 812} {"train_loss": -10.574441909790039, "global_step": 136578, "epoch": 812} {"train_loss": -10.718011856079102, "global_step": 136579, "epoch": 812} {"train_loss": -10.784811019897461, "global_step": 136580, "epoch": 812} {"train_loss": -10.66746711730957, "global_step": 136581, "epoch": 812} {"train_loss": -10.706239700317383, "global_step": 136582, "epoch": 812} {"train_loss": -10.536896132287525, "global_step": 136583, "epoch": 812, "val_loss": 222093.84375} {"train_loss": -10.263924598693848, "global_step": 136584, "epoch": 813} {"train_loss": -10.761183738708496, "global_step": 136585, "epoch": 813} {"train_loss": -10.38606071472168, "global_step": 136586, "epoch": 813} {"train_loss": -10.390497207641602, "global_step": 136587, "epoch": 813} {"train_loss": -10.596683502197266, "global_step": 136588, "epoch": 813} {"train_loss": -10.64328384399414, "global_step": 136589, "epoch": 813} {"train_loss": -10.345330238342285, "global_step": 136590, "epoch": 813} {"train_loss": -10.434364318847656, "global_step": 136591, "epoch": 813} {"train_loss": -10.669393539428711, "global_step": 136592, "epoch": 813} {"train_loss": -10.593809127807617, "global_step": 136593, "epoch": 813} {"train_loss": -10.443570137023926, "global_step": 136594, "epoch": 813} {"train_loss": -10.441995620727539, "global_step": 136595, "epoch": 813} {"train_loss": -10.811543464660645, "global_step": 136596, "epoch": 813} {"train_loss": -10.215802192687988, "global_step": 136597, "epoch": 813} {"train_loss": -10.4354248046875, "global_step": 136598, "epoch": 813} {"train_loss": -10.380376815795898, "global_step": 136599, "epoch": 813} {"train_loss": -10.540693283081055, "global_step": 136600, "epoch": 813} {"train_loss": -10.400726318359375, "global_step": 136601, "epoch": 813} {"train_loss": -10.401311874389648, "global_step": 136602, "epoch": 813} {"train_loss": -10.604264259338379, "global_step": 136603, "epoch": 813} {"train_loss": -10.344508171081543, "global_step": 136604, "epoch": 813} {"train_loss": -10.45865249633789, "global_step": 136605, "epoch": 813} {"train_loss": -10.675019264221191, "global_step": 136606, "epoch": 813} {"train_loss": -10.126707077026367, "global_step": 136607, "epoch": 813} {"train_loss": -10.612028121948242, "global_step": 136608, "epoch": 813} {"train_loss": -10.476844787597656, "global_step": 136609, "epoch": 813} {"train_loss": -9.240818977355957, "global_step": 136610, "epoch": 813} {"train_loss": -10.416011810302734, "global_step": 136611, "epoch": 813} {"train_loss": -9.834563255310059, "global_step": 136612, "epoch": 813} {"train_loss": -10.265352249145508, "global_step": 136613, "epoch": 813} {"train_loss": -10.516158103942871, "global_step": 136614, "epoch": 813} {"train_loss": -9.881908416748047, "global_step": 136615, "epoch": 813} {"train_loss": -9.676794052124023, "global_step": 136616, "epoch": 813} {"train_loss": -10.408945083618164, "global_step": 136617, "epoch": 813} {"train_loss": -10.05654525756836, "global_step": 136618, "epoch": 813} {"train_loss": -9.892908096313477, "global_step": 136619, "epoch": 813} {"train_loss": -10.408517837524414, "global_step": 136620, "epoch": 813} {"train_loss": -9.091167449951172, "global_step": 136621, "epoch": 813} {"train_loss": -10.504672050476074, "global_step": 136622, "epoch": 813} {"train_loss": -9.446236610412598, "global_step": 136623, "epoch": 813} {"train_loss": -10.377952575683594, "global_step": 136624, "epoch": 813} {"train_loss": -9.815105438232422, "global_step": 136625, "epoch": 813} {"train_loss": -10.285465240478516, "global_step": 136626, "epoch": 813} {"train_loss": -9.791973114013672, "global_step": 136627, "epoch": 813} {"train_loss": -10.388907432556152, "global_step": 136628, "epoch": 813} {"train_loss": -9.740703582763672, "global_step": 136629, "epoch": 813} {"train_loss": -10.35232162475586, "global_step": 136630, "epoch": 813} {"train_loss": -10.143168449401855, "global_step": 136631, "epoch": 813} {"train_loss": -10.294149398803711, "global_step": 136632, "epoch": 813} {"train_loss": -10.067912101745605, "global_step": 136633, "epoch": 813} {"train_loss": -10.44843578338623, "global_step": 136634, "epoch": 813} {"train_loss": -10.005640029907227, "global_step": 136635, "epoch": 813} {"train_loss": -10.303421020507812, "global_step": 136636, "epoch": 813} {"train_loss": -9.784357070922852, "global_step": 136637, "epoch": 813} {"train_loss": -10.36337661743164, "global_step": 136638, "epoch": 813} {"train_loss": -10.140599250793457, "global_step": 136639, "epoch": 813} {"train_loss": -9.57051944732666, "global_step": 136640, "epoch": 813} {"train_loss": -10.323740005493164, "global_step": 136641, "epoch": 813} {"train_loss": -9.780038833618164, "global_step": 136642, "epoch": 813} {"train_loss": -10.430994033813477, "global_step": 136643, "epoch": 813} {"train_loss": -9.721632957458496, "global_step": 136644, "epoch": 813} {"train_loss": -10.166473388671875, "global_step": 136645, "epoch": 813} {"train_loss": -9.794755935668945, "global_step": 136646, "epoch": 813} {"train_loss": -10.481689453125, "global_step": 136647, "epoch": 813} {"train_loss": -9.662091255187988, "global_step": 136648, "epoch": 813} {"train_loss": -10.117781639099121, "global_step": 136649, "epoch": 813} {"train_loss": -10.180513381958008, "global_step": 136650, "epoch": 813} {"train_loss": -10.183980941772461, "global_step": 136651, "epoch": 813} {"train_loss": -10.159164428710938, "global_step": 136652, "epoch": 813} {"train_loss": -9.948305130004883, "global_step": 136653, "epoch": 813} {"train_loss": -10.308832168579102, "global_step": 136654, "epoch": 813} {"train_loss": -10.057001113891602, "global_step": 136655, "epoch": 813} {"train_loss": -10.380340576171875, "global_step": 136656, "epoch": 813} {"train_loss": -10.404838562011719, "global_step": 136657, "epoch": 813} {"train_loss": -10.260183334350586, "global_step": 136658, "epoch": 813} {"train_loss": -10.20315933227539, "global_step": 136659, "epoch": 813} {"train_loss": -10.48350715637207, "global_step": 136660, "epoch": 813} {"train_loss": -10.293327331542969, "global_step": 136661, "epoch": 813} {"train_loss": -10.450532913208008, "global_step": 136662, "epoch": 813} {"train_loss": -10.502416610717773, "global_step": 136663, "epoch": 813} {"train_loss": -10.247394561767578, "global_step": 136664, "epoch": 813} {"train_loss": -10.515129089355469, "global_step": 136665, "epoch": 813} {"train_loss": -10.545276641845703, "global_step": 136666, "epoch": 813} {"train_loss": -10.420732498168945, "global_step": 136667, "epoch": 813} {"train_loss": -10.531438827514648, "global_step": 136668, "epoch": 813} {"train_loss": -10.491053581237793, "global_step": 136669, "epoch": 813} {"train_loss": -10.549842834472656, "global_step": 136670, "epoch": 813} {"train_loss": -10.674210548400879, "global_step": 136671, "epoch": 813} {"train_loss": -10.376218795776367, "global_step": 136672, "epoch": 813} {"train_loss": -10.681502342224121, "global_step": 136673, "epoch": 813} {"train_loss": -10.689416885375977, "global_step": 136674, "epoch": 813} {"train_loss": -10.901435852050781, "global_step": 136675, "epoch": 813} {"train_loss": -10.486852645874023, "global_step": 136676, "epoch": 813} {"train_loss": -10.720076560974121, "global_step": 136677, "epoch": 813} {"train_loss": -10.591991424560547, "global_step": 136678, "epoch": 813} {"train_loss": -10.736616134643555, "global_step": 136679, "epoch": 813} {"train_loss": -10.378753662109375, "global_step": 136680, "epoch": 813} {"train_loss": -10.667597770690918, "global_step": 136681, "epoch": 813} {"train_loss": -10.710443496704102, "global_step": 136682, "epoch": 813} {"train_loss": -10.39990234375, "global_step": 136683, "epoch": 813} {"train_loss": -10.474030494689941, "global_step": 136684, "epoch": 813} {"train_loss": -10.40678882598877, "global_step": 136685, "epoch": 813} {"train_loss": -10.6405611038208, "global_step": 136686, "epoch": 813} {"train_loss": -10.738298416137695, "global_step": 136687, "epoch": 813} {"train_loss": -10.487022399902344, "global_step": 136688, "epoch": 813} {"train_loss": -10.574535369873047, "global_step": 136689, "epoch": 813} {"train_loss": -10.682369232177734, "global_step": 136690, "epoch": 813} {"train_loss": -10.376566886901855, "global_step": 136691, "epoch": 813} {"train_loss": -10.352499008178711, "global_step": 136692, "epoch": 813} {"train_loss": -10.407353401184082, "global_step": 136693, "epoch": 813} {"train_loss": -10.649115562438965, "global_step": 136694, "epoch": 813} {"train_loss": -10.72039794921875, "global_step": 136695, "epoch": 813} {"train_loss": -10.801019668579102, "global_step": 136696, "epoch": 813} {"train_loss": -10.669560432434082, "global_step": 136697, "epoch": 813} {"train_loss": -10.865443229675293, "global_step": 136698, "epoch": 813} {"train_loss": -10.68829345703125, "global_step": 136699, "epoch": 813} {"train_loss": -10.699296951293945, "global_step": 136700, "epoch": 813} {"train_loss": -10.715215682983398, "global_step": 136701, "epoch": 813} {"train_loss": -10.524822235107422, "global_step": 136702, "epoch": 813} {"train_loss": -10.717310905456543, "global_step": 136703, "epoch": 813} {"train_loss": -10.602619171142578, "global_step": 136704, "epoch": 813} {"train_loss": -10.71346664428711, "global_step": 136705, "epoch": 813} {"train_loss": -10.627971649169922, "global_step": 136706, "epoch": 813} {"train_loss": -10.959879875183105, "global_step": 136707, "epoch": 813} {"train_loss": -10.493566513061523, "global_step": 136708, "epoch": 813} {"train_loss": -10.654474258422852, "global_step": 136709, "epoch": 813} {"train_loss": -10.720436096191406, "global_step": 136710, "epoch": 813} {"train_loss": -10.837787628173828, "global_step": 136711, "epoch": 813} {"train_loss": -10.667807579040527, "global_step": 136712, "epoch": 813} {"train_loss": -10.760381698608398, "global_step": 136713, "epoch": 813} {"train_loss": -10.816749572753906, "global_step": 136714, "epoch": 813} {"train_loss": -10.709115982055664, "global_step": 136715, "epoch": 813} {"train_loss": -10.529753684997559, "global_step": 136716, "epoch": 813} {"train_loss": -10.058307647705078, "global_step": 136717, "epoch": 813} {"train_loss": -10.712425231933594, "global_step": 136718, "epoch": 813} {"train_loss": -10.371549606323242, "global_step": 136719, "epoch": 813} {"train_loss": -10.391580581665039, "global_step": 136720, "epoch": 813} {"train_loss": -10.158549308776855, "global_step": 136721, "epoch": 813} {"train_loss": -10.360032081604004, "global_step": 136722, "epoch": 813} {"train_loss": -10.164134979248047, "global_step": 136723, "epoch": 813} {"train_loss": -10.402833938598633, "global_step": 136724, "epoch": 813} {"train_loss": -10.62533187866211, "global_step": 136725, "epoch": 813} {"train_loss": -10.878484725952148, "global_step": 136726, "epoch": 813} {"train_loss": -10.654535293579102, "global_step": 136727, "epoch": 813} {"train_loss": -10.575794219970703, "global_step": 136728, "epoch": 813} {"train_loss": -10.577731132507324, "global_step": 136729, "epoch": 813} {"train_loss": -10.708404541015625, "global_step": 136730, "epoch": 813} {"train_loss": -10.518569946289062, "global_step": 136731, "epoch": 813} {"train_loss": -10.416247367858887, "global_step": 136732, "epoch": 813} {"train_loss": -10.666420936584473, "global_step": 136733, "epoch": 813} {"train_loss": -10.615528106689453, "global_step": 136734, "epoch": 813} {"train_loss": -10.465137481689453, "global_step": 136735, "epoch": 813} {"train_loss": -10.569049835205078, "global_step": 136736, "epoch": 813} {"train_loss": -10.82598876953125, "global_step": 136737, "epoch": 813} {"train_loss": -10.585189819335938, "global_step": 136738, "epoch": 813} {"train_loss": -10.723739624023438, "global_step": 136739, "epoch": 813} {"train_loss": -10.545385360717773, "global_step": 136740, "epoch": 813} {"train_loss": -10.414824485778809, "global_step": 136741, "epoch": 813} {"train_loss": -10.161775588989258, "global_step": 136742, "epoch": 813} {"train_loss": -10.332534790039062, "global_step": 136743, "epoch": 813} {"train_loss": -10.14315128326416, "global_step": 136744, "epoch": 813} {"train_loss": -10.52070426940918, "global_step": 136745, "epoch": 813} {"train_loss": -10.305347442626953, "global_step": 136746, "epoch": 813} {"train_loss": -10.193689346313477, "global_step": 136747, "epoch": 813} {"train_loss": -9.581579208374023, "global_step": 136748, "epoch": 813} {"train_loss": -10.03495979309082, "global_step": 136749, "epoch": 813} {"train_loss": -9.718693733215332, "global_step": 136750, "epoch": 813} {"train_loss": -10.383786536398388, "global_step": 136751, "epoch": 813, "val_loss": 224146.375} {"train_loss": -9.59404182434082, "global_step": 136752, "epoch": 814} {"train_loss": -9.665504455566406, "global_step": 136753, "epoch": 814} {"train_loss": -9.973428726196289, "global_step": 136754, "epoch": 814} {"train_loss": -9.580469131469727, "global_step": 136755, "epoch": 814} {"train_loss": -9.460671424865723, "global_step": 136756, "epoch": 814} {"train_loss": -10.083030700683594, "global_step": 136757, "epoch": 814} {"train_loss": -8.973240852355957, "global_step": 136758, "epoch": 814} {"train_loss": -10.067171096801758, "global_step": 136759, "epoch": 814} {"train_loss": -10.114145278930664, "global_step": 136760, "epoch": 814} {"train_loss": -10.090396881103516, "global_step": 136761, "epoch": 814} {"train_loss": -9.553291320800781, "global_step": 136762, "epoch": 814} {"train_loss": -10.076492309570312, "global_step": 136763, "epoch": 814} {"train_loss": -10.155740737915039, "global_step": 136764, "epoch": 814} {"train_loss": -10.026037216186523, "global_step": 136765, "epoch": 814} {"train_loss": -10.273934364318848, "global_step": 136766, "epoch": 814} {"train_loss": -10.11410140991211, "global_step": 136767, "epoch": 814} {"train_loss": -10.110628128051758, "global_step": 136768, "epoch": 814} {"train_loss": -10.132511138916016, "global_step": 136769, "epoch": 814} {"train_loss": -10.047439575195312, "global_step": 136770, "epoch": 814} {"train_loss": -9.790141105651855, "global_step": 136771, "epoch": 814} {"train_loss": -9.892183303833008, "global_step": 136772, "epoch": 814} {"train_loss": -10.148519515991211, "global_step": 136773, "epoch": 814} {"train_loss": -9.96934700012207, "global_step": 136774, "epoch": 814} {"train_loss": -10.374940872192383, "global_step": 136775, "epoch": 814} {"train_loss": -9.908565521240234, "global_step": 136776, "epoch": 814} {"train_loss": -10.280061721801758, "global_step": 136777, "epoch": 814} {"train_loss": -10.095041275024414, "global_step": 136778, "epoch": 814} {"train_loss": -10.102592468261719, "global_step": 136779, "epoch": 814} {"train_loss": -10.274620056152344, "global_step": 136780, "epoch": 814} {"train_loss": -10.039788246154785, "global_step": 136781, "epoch": 814} {"train_loss": -10.350828170776367, "global_step": 136782, "epoch": 814} {"train_loss": -10.319074630737305, "global_step": 136783, "epoch": 814} {"train_loss": -10.408889770507812, "global_step": 136784, "epoch": 814} {"train_loss": -10.167640686035156, "global_step": 136785, "epoch": 814} {"train_loss": -10.630361557006836, "global_step": 136786, "epoch": 814} {"train_loss": -10.397869110107422, "global_step": 136787, "epoch": 814} {"train_loss": -10.295801162719727, "global_step": 136788, "epoch": 814} {"train_loss": -10.306585311889648, "global_step": 136789, "epoch": 814} {"train_loss": -10.656364440917969, "global_step": 136790, "epoch": 814} {"train_loss": -10.393956184387207, "global_step": 136791, "epoch": 814} {"train_loss": -10.66722297668457, "global_step": 136792, "epoch": 814} {"train_loss": -10.553390502929688, "global_step": 136793, "epoch": 814} {"train_loss": -10.689094543457031, "global_step": 136794, "epoch": 814} {"train_loss": -10.62883186340332, "global_step": 136795, "epoch": 814} {"train_loss": -10.59815788269043, "global_step": 136796, "epoch": 814} {"train_loss": -10.623438835144043, "global_step": 136797, "epoch": 814} {"train_loss": -10.732216835021973, "global_step": 136798, "epoch": 814} {"train_loss": -10.802826881408691, "global_step": 136799, "epoch": 814} {"train_loss": -10.710020065307617, "global_step": 136800, "epoch": 814} {"train_loss": -10.831099510192871, "global_step": 136801, "epoch": 814} {"train_loss": -10.712308883666992, "global_step": 136802, "epoch": 814} {"train_loss": -10.68369197845459, "global_step": 136803, "epoch": 814} {"train_loss": -10.753861427307129, "global_step": 136804, "epoch": 814} {"train_loss": -10.923639297485352, "global_step": 136805, "epoch": 814} {"train_loss": -10.814933776855469, "global_step": 136806, "epoch": 814} {"train_loss": -10.964491844177246, "global_step": 136807, "epoch": 814} {"train_loss": -11.044689178466797, "global_step": 136808, "epoch": 814} {"train_loss": -10.902753829956055, "global_step": 136809, "epoch": 814} {"train_loss": -10.77022647857666, "global_step": 136810, "epoch": 814} {"train_loss": -10.889735221862793, "global_step": 136811, "epoch": 814} {"train_loss": -10.753337860107422, "global_step": 136812, "epoch": 814} {"train_loss": -10.610668182373047, "global_step": 136813, "epoch": 814} {"train_loss": -11.18046760559082, "global_step": 136814, "epoch": 814} {"train_loss": -10.705492973327637, "global_step": 136815, "epoch": 814} {"train_loss": -10.700743675231934, "global_step": 136816, "epoch": 814} {"train_loss": -10.571518898010254, "global_step": 136817, "epoch": 814} {"train_loss": -10.861639022827148, "global_step": 136818, "epoch": 814} {"train_loss": -10.753826141357422, "global_step": 136819, "epoch": 814} {"train_loss": -11.016756057739258, "global_step": 136820, "epoch": 814} {"train_loss": -10.559016227722168, "global_step": 136821, "epoch": 814} {"train_loss": -10.679814338684082, "global_step": 136822, "epoch": 814} {"train_loss": -10.474044799804688, "global_step": 136823, "epoch": 814} {"train_loss": -9.384987831115723, "global_step": 136824, "epoch": 814} {"train_loss": -10.073653221130371, "global_step": 136825, "epoch": 814} {"train_loss": -10.717327117919922, "global_step": 136826, "epoch": 814} {"train_loss": -10.324811935424805, "global_step": 136827, "epoch": 814} {"train_loss": -10.087690353393555, "global_step": 136828, "epoch": 814} {"train_loss": -10.801398277282715, "global_step": 136829, "epoch": 814} {"train_loss": -10.760851860046387, "global_step": 136830, "epoch": 814} {"train_loss": -10.066959381103516, "global_step": 136831, "epoch": 814} {"train_loss": -10.732941627502441, "global_step": 136832, "epoch": 814} {"train_loss": -10.652353286743164, "global_step": 136833, "epoch": 814} {"train_loss": -10.552270889282227, "global_step": 136834, "epoch": 814} {"train_loss": -9.847562789916992, "global_step": 136835, "epoch": 814} {"train_loss": -10.882232666015625, "global_step": 136836, "epoch": 814} {"train_loss": -10.638083457946777, "global_step": 136837, "epoch": 814} {"train_loss": -10.695716857910156, "global_step": 136838, "epoch": 814} {"train_loss": -10.599309921264648, "global_step": 136839, "epoch": 814} {"train_loss": -10.261614799499512, "global_step": 136840, "epoch": 814} {"train_loss": -10.389750480651855, "global_step": 136841, "epoch": 814} {"train_loss": -10.414545059204102, "global_step": 136842, "epoch": 814} {"train_loss": -10.034941673278809, "global_step": 136843, "epoch": 814} {"train_loss": -10.131497383117676, "global_step": 136844, "epoch": 814} {"train_loss": -10.536937713623047, "global_step": 136845, "epoch": 814} {"train_loss": -9.877864837646484, "global_step": 136846, "epoch": 814} {"train_loss": -9.728456497192383, "global_step": 136847, "epoch": 814} {"train_loss": -9.674046516418457, "global_step": 136848, "epoch": 814} {"train_loss": -9.51085376739502, "global_step": 136849, "epoch": 814} {"train_loss": -9.477470397949219, "global_step": 136850, "epoch": 814} {"train_loss": -10.123407363891602, "global_step": 136851, "epoch": 814} {"train_loss": -9.801911354064941, "global_step": 136852, "epoch": 814} {"train_loss": -9.908061981201172, "global_step": 136853, "epoch": 814} {"train_loss": -9.988417625427246, "global_step": 136854, "epoch": 814} {"train_loss": -10.047005653381348, "global_step": 136855, "epoch": 814} {"train_loss": -9.908258438110352, "global_step": 136856, "epoch": 814} {"train_loss": -9.995293617248535, "global_step": 136857, "epoch": 814} {"train_loss": -9.665861129760742, "global_step": 136858, "epoch": 814} {"train_loss": -10.475523948669434, "global_step": 136859, "epoch": 814} {"train_loss": -9.759041786193848, "global_step": 136860, "epoch": 814} {"train_loss": -10.327455520629883, "global_step": 136861, "epoch": 814} {"train_loss": -9.828840255737305, "global_step": 136862, "epoch": 814} {"train_loss": -10.041597366333008, "global_step": 136863, "epoch": 814} {"train_loss": -10.217938423156738, "global_step": 136864, "epoch": 814} {"train_loss": -10.102333068847656, "global_step": 136865, "epoch": 814} {"train_loss": -10.27570915222168, "global_step": 136866, "epoch": 814} {"train_loss": -10.232733726501465, "global_step": 136867, "epoch": 814} {"train_loss": -10.51817512512207, "global_step": 136868, "epoch": 814} {"train_loss": -10.036360740661621, "global_step": 136869, "epoch": 814} {"train_loss": -10.408010482788086, "global_step": 136870, "epoch": 814} {"train_loss": -10.381080627441406, "global_step": 136871, "epoch": 814} {"train_loss": -10.376745223999023, "global_step": 136872, "epoch": 814} {"train_loss": -10.40639877319336, "global_step": 136873, "epoch": 814} {"train_loss": -10.442337989807129, "global_step": 136874, "epoch": 814} {"train_loss": -10.565532684326172, "global_step": 136875, "epoch": 814} {"train_loss": -10.525619506835938, "global_step": 136876, "epoch": 814} {"train_loss": -10.397310256958008, "global_step": 136877, "epoch": 814} {"train_loss": -10.631511688232422, "global_step": 136878, "epoch": 814} {"train_loss": -10.484085083007812, "global_step": 136879, "epoch": 814} {"train_loss": -10.595532417297363, "global_step": 136880, "epoch": 814} {"train_loss": -10.53345012664795, "global_step": 136881, "epoch": 814} {"train_loss": -10.681219100952148, "global_step": 136882, "epoch": 814} {"train_loss": -10.768985748291016, "global_step": 136883, "epoch": 814} {"train_loss": -10.852940559387207, "global_step": 136884, "epoch": 814} {"train_loss": -10.596107482910156, "global_step": 136885, "epoch": 814} {"train_loss": -10.704383850097656, "global_step": 136886, "epoch": 814} {"train_loss": -10.61729621887207, "global_step": 136887, "epoch": 814} {"train_loss": -10.723968505859375, "global_step": 136888, "epoch": 814} {"train_loss": -10.622323036193848, "global_step": 136889, "epoch": 814} {"train_loss": -10.668780326843262, "global_step": 136890, "epoch": 814} {"train_loss": -10.657156944274902, "global_step": 136891, "epoch": 814} {"train_loss": -10.81674575805664, "global_step": 136892, "epoch": 814} {"train_loss": -10.872751235961914, "global_step": 136893, "epoch": 814} {"train_loss": -10.840824127197266, "global_step": 136894, "epoch": 814} {"train_loss": -10.63785171508789, "global_step": 136895, "epoch": 814} {"train_loss": -10.88205337524414, "global_step": 136896, "epoch": 814} {"train_loss": -10.711091041564941, "global_step": 136897, "epoch": 814} {"train_loss": -10.731470108032227, "global_step": 136898, "epoch": 814} {"train_loss": -10.897310256958008, "global_step": 136899, "epoch": 814} {"train_loss": -10.937485694885254, "global_step": 136900, "epoch": 814} {"train_loss": -10.954839706420898, "global_step": 136901, "epoch": 814} {"train_loss": -10.774225234985352, "global_step": 136902, "epoch": 814} {"train_loss": -10.665952682495117, "global_step": 136903, "epoch": 814} {"train_loss": -10.487266540527344, "global_step": 136904, "epoch": 814} {"train_loss": -10.788053512573242, "global_step": 136905, "epoch": 814} {"train_loss": -10.838720321655273, "global_step": 136906, "epoch": 814} {"train_loss": -10.770870208740234, "global_step": 136907, "epoch": 814} {"train_loss": -10.393957138061523, "global_step": 136908, "epoch": 814} {"train_loss": -10.021955490112305, "global_step": 136909, "epoch": 814} {"train_loss": -9.800811767578125, "global_step": 136910, "epoch": 814} {"train_loss": -10.765357971191406, "global_step": 136911, "epoch": 814} {"train_loss": -10.354005813598633, "global_step": 136912, "epoch": 814} {"train_loss": -9.556618690490723, "global_step": 136913, "epoch": 814} {"train_loss": -9.394798278808594, "global_step": 136914, "epoch": 814} {"train_loss": -10.580327987670898, "global_step": 136915, "epoch": 814} {"train_loss": -9.625621795654297, "global_step": 136916, "epoch": 814} {"train_loss": -8.473775863647461, "global_step": 136917, "epoch": 814} {"train_loss": -10.632486343383789, "global_step": 136918, "epoch": 814} {"train_loss": -10.35618573711032, "global_step": 136919, "epoch": 814, "val_loss": 214766.140625} {"train_loss": -10.073837280273438, "global_step": 136920, "epoch": 815} {"train_loss": -9.536029815673828, "global_step": 136921, "epoch": 815} {"train_loss": -9.975075721740723, "global_step": 136922, "epoch": 815} {"train_loss": -9.219014167785645, "global_step": 136923, "epoch": 815} {"train_loss": -10.273283004760742, "global_step": 136924, "epoch": 815} {"train_loss": -9.763631820678711, "global_step": 136925, "epoch": 815} {"train_loss": -9.948164939880371, "global_step": 136926, "epoch": 815} {"train_loss": -9.938261985778809, "global_step": 136927, "epoch": 815} {"train_loss": -10.241007804870605, "global_step": 136928, "epoch": 815} {"train_loss": -10.072094917297363, "global_step": 136929, "epoch": 815} {"train_loss": -10.040956497192383, "global_step": 136930, "epoch": 815} {"train_loss": -10.174592971801758, "global_step": 136931, "epoch": 815} {"train_loss": -10.192164421081543, "global_step": 136932, "epoch": 815} {"train_loss": -10.349620819091797, "global_step": 136933, "epoch": 815} {"train_loss": -10.423720359802246, "global_step": 136934, "epoch": 815} {"train_loss": -10.300711631774902, "global_step": 136935, "epoch": 815} {"train_loss": -10.390164375305176, "global_step": 136936, "epoch": 815} {"train_loss": -10.350715637207031, "global_step": 136937, "epoch": 815} {"train_loss": -10.197689056396484, "global_step": 136938, "epoch": 815} {"train_loss": -10.291157722473145, "global_step": 136939, "epoch": 815} {"train_loss": -10.311899185180664, "global_step": 136940, "epoch": 815} {"train_loss": -10.102449417114258, "global_step": 136941, "epoch": 815} {"train_loss": -10.527776718139648, "global_step": 136942, "epoch": 815} {"train_loss": -10.475746154785156, "global_step": 136943, "epoch": 815} {"train_loss": -10.332423210144043, "global_step": 136944, "epoch": 815} {"train_loss": -10.552725791931152, "global_step": 136945, "epoch": 815} {"train_loss": -10.481136322021484, "global_step": 136946, "epoch": 815} {"train_loss": -10.357502937316895, "global_step": 136947, "epoch": 815} {"train_loss": -10.488729476928711, "global_step": 136948, "epoch": 815} {"train_loss": -10.416947364807129, "global_step": 136949, "epoch": 815} {"train_loss": -10.473848342895508, "global_step": 136950, "epoch": 815} {"train_loss": -10.483292579650879, "global_step": 136951, "epoch": 815} {"train_loss": -10.485713005065918, "global_step": 136952, "epoch": 815} {"train_loss": -10.318960189819336, "global_step": 136953, "epoch": 815} {"train_loss": -10.103530883789062, "global_step": 136954, "epoch": 815} {"train_loss": -10.50376033782959, "global_step": 136955, "epoch": 815} {"train_loss": -10.618138313293457, "global_step": 136956, "epoch": 815} {"train_loss": -10.742860794067383, "global_step": 136957, "epoch": 815} {"train_loss": -10.396932601928711, "global_step": 136958, "epoch": 815} {"train_loss": -10.797369003295898, "global_step": 136959, "epoch": 815} {"train_loss": -10.408546447753906, "global_step": 136960, "epoch": 815} {"train_loss": -10.640654563903809, "global_step": 136961, "epoch": 815} {"train_loss": -10.637086868286133, "global_step": 136962, "epoch": 815} {"train_loss": -10.742488861083984, "global_step": 136963, "epoch": 815} {"train_loss": -10.808507919311523, "global_step": 136964, "epoch": 815} {"train_loss": -10.80118179321289, "global_step": 136965, "epoch": 815} {"train_loss": -10.716619491577148, "global_step": 136966, "epoch": 815} {"train_loss": -10.645408630371094, "global_step": 136967, "epoch": 815} {"train_loss": -10.74360466003418, "global_step": 136968, "epoch": 815} {"train_loss": -10.859550476074219, "global_step": 136969, "epoch": 815} {"train_loss": -10.394844055175781, "global_step": 136970, "epoch": 815} {"train_loss": -10.892885208129883, "global_step": 136971, "epoch": 815} {"train_loss": -10.565845489501953, "global_step": 136972, "epoch": 815} {"train_loss": -10.669212341308594, "global_step": 136973, "epoch": 815} {"train_loss": -10.531379699707031, "global_step": 136974, "epoch": 815} {"train_loss": -10.379648208618164, "global_step": 136975, "epoch": 815} {"train_loss": -10.517223358154297, "global_step": 136976, "epoch": 815} {"train_loss": -10.74399185180664, "global_step": 136977, "epoch": 815} {"train_loss": -10.25160026550293, "global_step": 136978, "epoch": 815} {"train_loss": -10.457256317138672, "global_step": 136979, "epoch": 815} {"train_loss": -10.321008682250977, "global_step": 136980, "epoch": 815} {"train_loss": -10.496377944946289, "global_step": 136981, "epoch": 815} {"train_loss": -10.454896926879883, "global_step": 136982, "epoch": 815} {"train_loss": -10.371355056762695, "global_step": 136983, "epoch": 815} {"train_loss": -10.501317977905273, "global_step": 136984, "epoch": 815} {"train_loss": -10.447061538696289, "global_step": 136985, "epoch": 815} {"train_loss": -10.51407241821289, "global_step": 136986, "epoch": 815} {"train_loss": -10.493623733520508, "global_step": 136987, "epoch": 815} {"train_loss": -10.347688674926758, "global_step": 136988, "epoch": 815} {"train_loss": -10.276918411254883, "global_step": 136989, "epoch": 815} {"train_loss": -10.583211898803711, "global_step": 136990, "epoch": 815} {"train_loss": -10.186327934265137, "global_step": 136991, "epoch": 815} {"train_loss": -10.210533142089844, "global_step": 136992, "epoch": 815} {"train_loss": -10.159381866455078, "global_step": 136993, "epoch": 815} {"train_loss": -10.779129028320312, "global_step": 136994, "epoch": 815} {"train_loss": -10.135326385498047, "global_step": 136995, "epoch": 815} {"train_loss": -10.565898895263672, "global_step": 136996, "epoch": 815} {"train_loss": -9.81674861907959, "global_step": 136997, "epoch": 815} {"train_loss": -10.647428512573242, "global_step": 136998, "epoch": 815} {"train_loss": -10.037944793701172, "global_step": 136999, "epoch": 815} {"train_loss": -10.662726402282715, "global_step": 137000, "epoch": 815} {"train_loss": -10.187437057495117, "global_step": 137001, "epoch": 815} {"train_loss": -10.201499938964844, "global_step": 137002, "epoch": 815} {"train_loss": -10.488927841186523, "global_step": 137003, "epoch": 815} {"train_loss": -10.136945724487305, "global_step": 137004, "epoch": 815} {"train_loss": -10.527204513549805, "global_step": 137005, "epoch": 815} {"train_loss": -10.409454345703125, "global_step": 137006, "epoch": 815} {"train_loss": -10.406778335571289, "global_step": 137007, "epoch": 815} {"train_loss": -10.655248641967773, "global_step": 137008, "epoch": 815} {"train_loss": -9.951290130615234, "global_step": 137009, "epoch": 815} {"train_loss": -10.325490951538086, "global_step": 137010, "epoch": 815} {"train_loss": -10.527998924255371, "global_step": 137011, "epoch": 815} {"train_loss": -10.412598609924316, "global_step": 137012, "epoch": 815} {"train_loss": -10.385733604431152, "global_step": 137013, "epoch": 815} {"train_loss": -10.48326301574707, "global_step": 137014, "epoch": 815} {"train_loss": -10.29155158996582, "global_step": 137015, "epoch": 815} {"train_loss": -10.398614883422852, "global_step": 137016, "epoch": 815} {"train_loss": -10.621870994567871, "global_step": 137017, "epoch": 815} {"train_loss": -10.444915771484375, "global_step": 137018, "epoch": 815} {"train_loss": -10.67959213256836, "global_step": 137019, "epoch": 815} {"train_loss": -10.438989639282227, "global_step": 137020, "epoch": 815} {"train_loss": -10.728814125061035, "global_step": 137021, "epoch": 815} {"train_loss": -10.758556365966797, "global_step": 137022, "epoch": 815} {"train_loss": -10.653168678283691, "global_step": 137023, "epoch": 815} {"train_loss": -10.688814163208008, "global_step": 137024, "epoch": 815} {"train_loss": -10.609176635742188, "global_step": 137025, "epoch": 815} {"train_loss": -10.717267990112305, "global_step": 137026, "epoch": 815} {"train_loss": -10.858329772949219, "global_step": 137027, "epoch": 815} {"train_loss": -10.705551147460938, "global_step": 137028, "epoch": 815} {"train_loss": -10.669031143188477, "global_step": 137029, "epoch": 815} {"train_loss": -10.704545974731445, "global_step": 137030, "epoch": 815} {"train_loss": -10.566007614135742, "global_step": 137031, "epoch": 815} {"train_loss": -10.863142967224121, "global_step": 137032, "epoch": 815} {"train_loss": -10.625984191894531, "global_step": 137033, "epoch": 815} {"train_loss": -10.635992050170898, "global_step": 137034, "epoch": 815} {"train_loss": -10.705184936523438, "global_step": 137035, "epoch": 815} {"train_loss": -10.591464042663574, "global_step": 137036, "epoch": 815} {"train_loss": -10.713089942932129, "global_step": 137037, "epoch": 815} {"train_loss": -10.33608627319336, "global_step": 137038, "epoch": 815} {"train_loss": -10.728511810302734, "global_step": 137039, "epoch": 815} {"train_loss": -10.146295547485352, "global_step": 137040, "epoch": 815} {"train_loss": -10.622566223144531, "global_step": 137041, "epoch": 815} {"train_loss": -10.515329360961914, "global_step": 137042, "epoch": 815} {"train_loss": -10.74086856842041, "global_step": 137043, "epoch": 815} {"train_loss": -10.3595609664917, "global_step": 137044, "epoch": 815} {"train_loss": -10.290609359741211, "global_step": 137045, "epoch": 815} {"train_loss": -10.42596435546875, "global_step": 137046, "epoch": 815} {"train_loss": -9.791220664978027, "global_step": 137047, "epoch": 815} {"train_loss": -10.689521789550781, "global_step": 137048, "epoch": 815} {"train_loss": -10.61927318572998, "global_step": 137049, "epoch": 815} {"train_loss": -10.205341339111328, "global_step": 137050, "epoch": 815} {"train_loss": -10.680913925170898, "global_step": 137051, "epoch": 815} {"train_loss": -10.267326354980469, "global_step": 137052, "epoch": 815} {"train_loss": -10.438297271728516, "global_step": 137053, "epoch": 815} {"train_loss": -10.411468505859375, "global_step": 137054, "epoch": 815} {"train_loss": -10.792133331298828, "global_step": 137055, "epoch": 815} {"train_loss": -10.638382911682129, "global_step": 137056, "epoch": 815} {"train_loss": -10.265344619750977, "global_step": 137057, "epoch": 815} {"train_loss": -10.606396675109863, "global_step": 137058, "epoch": 815} {"train_loss": -10.433218002319336, "global_step": 137059, "epoch": 815} {"train_loss": -10.22887134552002, "global_step": 137060, "epoch": 815} {"train_loss": -10.803747177124023, "global_step": 137061, "epoch": 815} {"train_loss": -10.655864715576172, "global_step": 137062, "epoch": 815} {"train_loss": -10.744821548461914, "global_step": 137063, "epoch": 815} {"train_loss": -10.396408081054688, "global_step": 137064, "epoch": 815} {"train_loss": -10.455810546875, "global_step": 137065, "epoch": 815} {"train_loss": -10.582690238952637, "global_step": 137066, "epoch": 815} {"train_loss": -10.57667064666748, "global_step": 137067, "epoch": 815} {"train_loss": -10.509247779846191, "global_step": 137068, "epoch": 815} {"train_loss": -10.5314302444458, "global_step": 137069, "epoch": 815} {"train_loss": -10.640581130981445, "global_step": 137070, "epoch": 815} {"train_loss": -10.735940933227539, "global_step": 137071, "epoch": 815} {"train_loss": -10.654947280883789, "global_step": 137072, "epoch": 815} {"train_loss": -10.448981285095215, "global_step": 137073, "epoch": 815} {"train_loss": -10.82277774810791, "global_step": 137074, "epoch": 815} {"train_loss": -10.470465660095215, "global_step": 137075, "epoch": 815} {"train_loss": -10.385766983032227, "global_step": 137076, "epoch": 815} {"train_loss": -10.164929389953613, "global_step": 137077, "epoch": 815} {"train_loss": -9.90602970123291, "global_step": 137078, "epoch": 815} {"train_loss": -10.477849960327148, "global_step": 137079, "epoch": 815} {"train_loss": -10.330432891845703, "global_step": 137080, "epoch": 815} {"train_loss": -10.394330024719238, "global_step": 137081, "epoch": 815} {"train_loss": -10.24496078491211, "global_step": 137082, "epoch": 815} {"train_loss": -10.01995849609375, "global_step": 137083, "epoch": 815} {"train_loss": -10.531723022460938, "global_step": 137084, "epoch": 815} {"train_loss": -10.211799621582031, "global_step": 137085, "epoch": 815} {"train_loss": -10.243621826171875, "global_step": 137086, "epoch": 815} {"train_loss": -10.434498179526557, "global_step": 137087, "epoch": 815, "val_loss": 223898.515625, "train_action_mse_error": 2.2980849742889404} {"train_loss": -10.567873001098633, "global_step": 137088, "epoch": 816} {"train_loss": -9.751686096191406, "global_step": 137089, "epoch": 816} {"train_loss": -10.348307609558105, "global_step": 137090, "epoch": 816} {"train_loss": -10.257587432861328, "global_step": 137091, "epoch": 816} {"train_loss": -10.285797119140625, "global_step": 137092, "epoch": 816} {"train_loss": -10.161609649658203, "global_step": 137093, "epoch": 816} {"train_loss": -10.032257080078125, "global_step": 137094, "epoch": 816} {"train_loss": -10.303050994873047, "global_step": 137095, "epoch": 816} {"train_loss": -9.938619613647461, "global_step": 137096, "epoch": 816} {"train_loss": -9.926939010620117, "global_step": 137097, "epoch": 816} {"train_loss": -9.964481353759766, "global_step": 137098, "epoch": 816} {"train_loss": -10.005867004394531, "global_step": 137099, "epoch": 816} {"train_loss": -9.898435592651367, "global_step": 137100, "epoch": 816} {"train_loss": -9.809592247009277, "global_step": 137101, "epoch": 816} {"train_loss": -10.346900939941406, "global_step": 137102, "epoch": 816} {"train_loss": -10.1827392578125, "global_step": 137103, "epoch": 816} {"train_loss": -9.774833679199219, "global_step": 137104, "epoch": 816} {"train_loss": -10.12621784210205, "global_step": 137105, "epoch": 816} {"train_loss": -9.977242469787598, "global_step": 137106, "epoch": 816} {"train_loss": -10.072713851928711, "global_step": 137107, "epoch": 816} {"train_loss": -10.079469680786133, "global_step": 137108, "epoch": 816} {"train_loss": -10.314814567565918, "global_step": 137109, "epoch": 816} {"train_loss": -10.117043495178223, "global_step": 137110, "epoch": 816} {"train_loss": -10.499120712280273, "global_step": 137111, "epoch": 816} {"train_loss": -10.2211275100708, "global_step": 137112, "epoch": 816} {"train_loss": -10.537046432495117, "global_step": 137113, "epoch": 816} {"train_loss": -10.167288780212402, "global_step": 137114, "epoch": 816} {"train_loss": -10.21799373626709, "global_step": 137115, "epoch": 816} {"train_loss": -10.324098587036133, "global_step": 137116, "epoch": 816} {"train_loss": -10.452319145202637, "global_step": 137117, "epoch": 816} {"train_loss": -10.346870422363281, "global_step": 137118, "epoch": 816} {"train_loss": -10.696287155151367, "global_step": 137119, "epoch": 816} {"train_loss": -10.262223243713379, "global_step": 137120, "epoch": 816} {"train_loss": -10.47378921508789, "global_step": 137121, "epoch": 816} {"train_loss": -10.85214614868164, "global_step": 137122, "epoch": 816} {"train_loss": -10.437128067016602, "global_step": 137123, "epoch": 816} {"train_loss": -10.155068397521973, "global_step": 137124, "epoch": 816} {"train_loss": -10.588661193847656, "global_step": 137125, "epoch": 816} {"train_loss": -10.404027938842773, "global_step": 137126, "epoch": 816} {"train_loss": -10.490779876708984, "global_step": 137127, "epoch": 816} {"train_loss": -10.354732513427734, "global_step": 137128, "epoch": 816} {"train_loss": -10.435267448425293, "global_step": 137129, "epoch": 816} {"train_loss": -10.371728897094727, "global_step": 137130, "epoch": 816} {"train_loss": -10.40380573272705, "global_step": 137131, "epoch": 816} {"train_loss": -10.724115371704102, "global_step": 137132, "epoch": 816} {"train_loss": -10.199615478515625, "global_step": 137133, "epoch": 816} {"train_loss": -10.81899356842041, "global_step": 137134, "epoch": 816} {"train_loss": -10.426467895507812, "global_step": 137135, "epoch": 816} {"train_loss": -10.56500244140625, "global_step": 137136, "epoch": 816} {"train_loss": -10.617890357971191, "global_step": 137137, "epoch": 816} {"train_loss": -10.626264572143555, "global_step": 137138, "epoch": 816} {"train_loss": -10.64105224609375, "global_step": 137139, "epoch": 816} {"train_loss": -10.584802627563477, "global_step": 137140, "epoch": 816} {"train_loss": -10.820793151855469, "global_step": 137141, "epoch": 816} {"train_loss": -10.780057907104492, "global_step": 137142, "epoch": 816} {"train_loss": -10.778852462768555, "global_step": 137143, "epoch": 816} {"train_loss": -10.60909652709961, "global_step": 137144, "epoch": 816} {"train_loss": -10.605030059814453, "global_step": 137145, "epoch": 816} {"train_loss": -10.882926940917969, "global_step": 137146, "epoch": 816} {"train_loss": -10.835993766784668, "global_step": 137147, "epoch": 816} {"train_loss": -10.893182754516602, "global_step": 137148, "epoch": 816} {"train_loss": -10.96688461303711, "global_step": 137149, "epoch": 816} {"train_loss": -10.777302742004395, "global_step": 137150, "epoch": 816} {"train_loss": -10.775358200073242, "global_step": 137151, "epoch": 816} {"train_loss": -10.799820899963379, "global_step": 137152, "epoch": 816} {"train_loss": -11.017888069152832, "global_step": 137153, "epoch": 816} {"train_loss": -10.927228927612305, "global_step": 137154, "epoch": 816} {"train_loss": -10.610634803771973, "global_step": 137155, "epoch": 816} {"train_loss": -10.794229507446289, "global_step": 137156, "epoch": 816} {"train_loss": -10.34469223022461, "global_step": 137157, "epoch": 816} {"train_loss": -10.306344032287598, "global_step": 137158, "epoch": 816} {"train_loss": -10.31003189086914, "global_step": 137159, "epoch": 816} {"train_loss": -10.717519760131836, "global_step": 137160, "epoch": 816} {"train_loss": -10.512497901916504, "global_step": 137161, "epoch": 816} {"train_loss": -10.186738967895508, "global_step": 137162, "epoch": 816} {"train_loss": -10.470315933227539, "global_step": 137163, "epoch": 816} {"train_loss": -10.273395538330078, "global_step": 137164, "epoch": 816} {"train_loss": -10.263969421386719, "global_step": 137165, "epoch": 816} {"train_loss": -10.66353988647461, "global_step": 137166, "epoch": 816} {"train_loss": -10.432361602783203, "global_step": 137167, "epoch": 816} {"train_loss": -10.521784782409668, "global_step": 137168, "epoch": 816} {"train_loss": -10.613709449768066, "global_step": 137169, "epoch": 816} {"train_loss": -10.305900573730469, "global_step": 137170, "epoch": 816} {"train_loss": -10.123394012451172, "global_step": 137171, "epoch": 816} {"train_loss": -10.288079261779785, "global_step": 137172, "epoch": 816} {"train_loss": -10.413186073303223, "global_step": 137173, "epoch": 816} {"train_loss": -9.867473602294922, "global_step": 137174, "epoch": 816} {"train_loss": -9.895063400268555, "global_step": 137175, "epoch": 816} {"train_loss": -9.87611198425293, "global_step": 137176, "epoch": 816} {"train_loss": -10.137020111083984, "global_step": 137177, "epoch": 816} {"train_loss": -9.739625930786133, "global_step": 137178, "epoch": 816} {"train_loss": -9.609935760498047, "global_step": 137179, "epoch": 816} {"train_loss": -9.252683639526367, "global_step": 137180, "epoch": 816} {"train_loss": -10.135139465332031, "global_step": 137181, "epoch": 816} {"train_loss": -9.205851554870605, "global_step": 137182, "epoch": 816} {"train_loss": -9.804278373718262, "global_step": 137183, "epoch": 816} {"train_loss": -9.238950729370117, "global_step": 137184, "epoch": 816} {"train_loss": -10.375125885009766, "global_step": 137185, "epoch": 816} {"train_loss": -9.31576156616211, "global_step": 137186, "epoch": 816} {"train_loss": -10.210418701171875, "global_step": 137187, "epoch": 816} {"train_loss": -9.837564468383789, "global_step": 137188, "epoch": 816} {"train_loss": -9.907207489013672, "global_step": 137189, "epoch": 816} {"train_loss": -10.153003692626953, "global_step": 137190, "epoch": 816} {"train_loss": -9.740974426269531, "global_step": 137191, "epoch": 816} {"train_loss": -9.894720077514648, "global_step": 137192, "epoch": 816} {"train_loss": -9.939896583557129, "global_step": 137193, "epoch": 816} {"train_loss": -10.088834762573242, "global_step": 137194, "epoch": 816} {"train_loss": -10.078757286071777, "global_step": 137195, "epoch": 816} {"train_loss": -10.21340560913086, "global_step": 137196, "epoch": 816} {"train_loss": -10.304749488830566, "global_step": 137197, "epoch": 816} {"train_loss": -10.257429122924805, "global_step": 137198, "epoch": 816} {"train_loss": -10.333192825317383, "global_step": 137199, "epoch": 816} {"train_loss": -10.304716110229492, "global_step": 137200, "epoch": 816} {"train_loss": -10.51159381866455, "global_step": 137201, "epoch": 816} {"train_loss": -10.224054336547852, "global_step": 137202, "epoch": 816} {"train_loss": -10.38348388671875, "global_step": 137203, "epoch": 816} {"train_loss": -10.415567398071289, "global_step": 137204, "epoch": 816} {"train_loss": -10.479354858398438, "global_step": 137205, "epoch": 816} {"train_loss": -10.448620796203613, "global_step": 137206, "epoch": 816} {"train_loss": -10.344636917114258, "global_step": 137207, "epoch": 816} {"train_loss": -10.439750671386719, "global_step": 137208, "epoch": 816} {"train_loss": -10.451152801513672, "global_step": 137209, "epoch": 816} {"train_loss": -10.620000839233398, "global_step": 137210, "epoch": 816} {"train_loss": -10.568442344665527, "global_step": 137211, "epoch": 816} {"train_loss": -10.589265823364258, "global_step": 137212, "epoch": 816} {"train_loss": -10.378046035766602, "global_step": 137213, "epoch": 816} {"train_loss": -10.756226539611816, "global_step": 137214, "epoch": 816} {"train_loss": -10.418472290039062, "global_step": 137215, "epoch": 816} {"train_loss": -10.697317123413086, "global_step": 137216, "epoch": 816} {"train_loss": -10.546175003051758, "global_step": 137217, "epoch": 816} {"train_loss": -10.666970252990723, "global_step": 137218, "epoch": 816} {"train_loss": -10.765210151672363, "global_step": 137219, "epoch": 816} {"train_loss": -10.501972198486328, "global_step": 137220, "epoch": 816} {"train_loss": -10.499673843383789, "global_step": 137221, "epoch": 816} {"train_loss": -10.680398941040039, "global_step": 137222, "epoch": 816} {"train_loss": -10.562865257263184, "global_step": 137223, "epoch": 816} {"train_loss": -10.817882537841797, "global_step": 137224, "epoch": 816} {"train_loss": -10.721014022827148, "global_step": 137225, "epoch": 816} {"train_loss": -10.580141067504883, "global_step": 137226, "epoch": 816} {"train_loss": -10.915119171142578, "global_step": 137227, "epoch": 816} {"train_loss": -10.876786231994629, "global_step": 137228, "epoch": 816} {"train_loss": -10.697315216064453, "global_step": 137229, "epoch": 816} {"train_loss": -10.627293586730957, "global_step": 137230, "epoch": 816} {"train_loss": -10.689284324645996, "global_step": 137231, "epoch": 816} {"train_loss": -10.83144760131836, "global_step": 137232, "epoch": 816} {"train_loss": -10.783303260803223, "global_step": 137233, "epoch": 816} {"train_loss": -10.935993194580078, "global_step": 137234, "epoch": 816} {"train_loss": -10.726829528808594, "global_step": 137235, "epoch": 816} {"train_loss": -10.792497634887695, "global_step": 137236, "epoch": 816} {"train_loss": -10.752706527709961, "global_step": 137237, "epoch": 816} {"train_loss": -10.629287719726562, "global_step": 137238, "epoch": 816} {"train_loss": -10.783085823059082, "global_step": 137239, "epoch": 816} {"train_loss": -10.640085220336914, "global_step": 137240, "epoch": 816} {"train_loss": -10.837965965270996, "global_step": 137241, "epoch": 816} {"train_loss": -10.609926223754883, "global_step": 137242, "epoch": 816} {"train_loss": -10.91891860961914, "global_step": 137243, "epoch": 816} {"train_loss": -10.698280334472656, "global_step": 137244, "epoch": 816} {"train_loss": -10.603612899780273, "global_step": 137245, "epoch": 816} {"train_loss": -10.837072372436523, "global_step": 137246, "epoch": 816} {"train_loss": -10.834321975708008, "global_step": 137247, "epoch": 816} {"train_loss": -10.866573333740234, "global_step": 137248, "epoch": 816} {"train_loss": -10.77660083770752, "global_step": 137249, "epoch": 816} {"train_loss": -10.557289123535156, "global_step": 137250, "epoch": 816} {"train_loss": -9.993083953857422, "global_step": 137251, "epoch": 816} {"train_loss": -10.136445999145508, "global_step": 137252, "epoch": 816} {"train_loss": -10.147111892700195, "global_step": 137253, "epoch": 816} {"train_loss": -10.1006498336792, "global_step": 137254, "epoch": 816} {"train_loss": -10.389969581649417, "global_step": 137255, "epoch": 816, "val_loss": 224395.703125} {"train_loss": -10.049434661865234, "global_step": 137256, "epoch": 817} {"train_loss": -9.263617515563965, "global_step": 137257, "epoch": 817} {"train_loss": -9.22219181060791, "global_step": 137258, "epoch": 817} {"train_loss": -9.684183120727539, "global_step": 137259, "epoch": 817} {"train_loss": -8.78757381439209, "global_step": 137260, "epoch": 817} {"train_loss": -9.8262357711792, "global_step": 137261, "epoch": 817} {"train_loss": -8.245084762573242, "global_step": 137262, "epoch": 817} {"train_loss": -9.959562301635742, "global_step": 137263, "epoch": 817} {"train_loss": -9.332535743713379, "global_step": 137264, "epoch": 817} {"train_loss": -9.594715118408203, "global_step": 137265, "epoch": 817} {"train_loss": -9.193801879882812, "global_step": 137266, "epoch": 817} {"train_loss": -9.588748931884766, "global_step": 137267, "epoch": 817} {"train_loss": -9.537485122680664, "global_step": 137268, "epoch": 817} {"train_loss": -9.303811073303223, "global_step": 137269, "epoch": 817} {"train_loss": -9.885297775268555, "global_step": 137270, "epoch": 817} {"train_loss": -10.068609237670898, "global_step": 137271, "epoch": 817} {"train_loss": -9.63193130493164, "global_step": 137272, "epoch": 817} {"train_loss": -9.829355239868164, "global_step": 137273, "epoch": 817} {"train_loss": -9.937206268310547, "global_step": 137274, "epoch": 817} {"train_loss": -10.100651741027832, "global_step": 137275, "epoch": 817} {"train_loss": -9.940374374389648, "global_step": 137276, "epoch": 817} {"train_loss": -10.165931701660156, "global_step": 137277, "epoch": 817} {"train_loss": -9.915661811828613, "global_step": 137278, "epoch": 817} {"train_loss": -10.023242950439453, "global_step": 137279, "epoch": 817} {"train_loss": -10.029953002929688, "global_step": 137280, "epoch": 817} {"train_loss": -10.03282356262207, "global_step": 137281, "epoch": 817} {"train_loss": -10.21436882019043, "global_step": 137282, "epoch": 817} {"train_loss": -10.097430229187012, "global_step": 137283, "epoch": 817} {"train_loss": -10.129911422729492, "global_step": 137284, "epoch": 817} {"train_loss": -10.169337272644043, "global_step": 137285, "epoch": 817} {"train_loss": -10.122782707214355, "global_step": 137286, "epoch": 817} {"train_loss": -10.224312782287598, "global_step": 137287, "epoch": 817} {"train_loss": -10.046867370605469, "global_step": 137288, "epoch": 817} {"train_loss": -10.202727317810059, "global_step": 137289, "epoch": 817} {"train_loss": -10.036165237426758, "global_step": 137290, "epoch": 817} {"train_loss": -10.237700462341309, "global_step": 137291, "epoch": 817} {"train_loss": -10.400775909423828, "global_step": 137292, "epoch": 817} {"train_loss": -10.203526496887207, "global_step": 137293, "epoch": 817} {"train_loss": -10.304020881652832, "global_step": 137294, "epoch": 817} {"train_loss": -10.386526107788086, "global_step": 137295, "epoch": 817} {"train_loss": -10.338869094848633, "global_step": 137296, "epoch": 817} {"train_loss": -10.58285140991211, "global_step": 137297, "epoch": 817} {"train_loss": -10.516606330871582, "global_step": 137298, "epoch": 817} {"train_loss": -10.610624313354492, "global_step": 137299, "epoch": 817} {"train_loss": -10.54854965209961, "global_step": 137300, "epoch": 817} {"train_loss": -10.40528392791748, "global_step": 137301, "epoch": 817} {"train_loss": -10.328893661499023, "global_step": 137302, "epoch": 817} {"train_loss": -10.802408218383789, "global_step": 137303, "epoch": 817} {"train_loss": -10.617563247680664, "global_step": 137304, "epoch": 817} {"train_loss": -10.550125122070312, "global_step": 137305, "epoch": 817} {"train_loss": -10.516965866088867, "global_step": 137306, "epoch": 817} {"train_loss": -10.543230056762695, "global_step": 137307, "epoch": 817} {"train_loss": -10.799065589904785, "global_step": 137308, "epoch": 817} {"train_loss": -10.445085525512695, "global_step": 137309, "epoch": 817} {"train_loss": -10.614072799682617, "global_step": 137310, "epoch": 817} {"train_loss": -10.644346237182617, "global_step": 137311, "epoch": 817} {"train_loss": -10.873361587524414, "global_step": 137312, "epoch": 817} {"train_loss": -10.759103775024414, "global_step": 137313, "epoch": 817} {"train_loss": -10.695486068725586, "global_step": 137314, "epoch": 817} {"train_loss": -10.760112762451172, "global_step": 137315, "epoch": 817} {"train_loss": -10.516504287719727, "global_step": 137316, "epoch": 817} {"train_loss": -10.642934799194336, "global_step": 137317, "epoch": 817} {"train_loss": -10.852943420410156, "global_step": 137318, "epoch": 817} {"train_loss": -10.731840133666992, "global_step": 137319, "epoch": 817} {"train_loss": -11.016951560974121, "global_step": 137320, "epoch": 817} {"train_loss": -10.81180477142334, "global_step": 137321, "epoch": 817} {"train_loss": -10.849828720092773, "global_step": 137322, "epoch": 817} {"train_loss": -10.727195739746094, "global_step": 137323, "epoch": 817} {"train_loss": -10.817981719970703, "global_step": 137324, "epoch": 817} {"train_loss": -10.625688552856445, "global_step": 137325, "epoch": 817} {"train_loss": -10.611101150512695, "global_step": 137326, "epoch": 817} {"train_loss": -10.848889350891113, "global_step": 137327, "epoch": 817} {"train_loss": -10.68139362335205, "global_step": 137328, "epoch": 817} {"train_loss": -10.987747192382812, "global_step": 137329, "epoch": 817} {"train_loss": -10.865568161010742, "global_step": 137330, "epoch": 817} {"train_loss": -10.718351364135742, "global_step": 137331, "epoch": 817} {"train_loss": -10.775384902954102, "global_step": 137332, "epoch": 817} {"train_loss": -10.757898330688477, "global_step": 137333, "epoch": 817} {"train_loss": -10.742022514343262, "global_step": 137334, "epoch": 817} {"train_loss": -10.929779052734375, "global_step": 137335, "epoch": 817} {"train_loss": -10.583751678466797, "global_step": 137336, "epoch": 817} {"train_loss": -10.598666191101074, "global_step": 137337, "epoch": 817} {"train_loss": -10.764775276184082, "global_step": 137338, "epoch": 817} {"train_loss": -11.013132095336914, "global_step": 137339, "epoch": 817} {"train_loss": -10.796947479248047, "global_step": 137340, "epoch": 817} {"train_loss": -10.825489044189453, "global_step": 137341, "epoch": 817} {"train_loss": -10.418956756591797, "global_step": 137342, "epoch": 817} {"train_loss": -10.744379043579102, "global_step": 137343, "epoch": 817} {"train_loss": -10.266533851623535, "global_step": 137344, "epoch": 817} {"train_loss": -10.540641784667969, "global_step": 137345, "epoch": 817} {"train_loss": -10.305273056030273, "global_step": 137346, "epoch": 817} {"train_loss": -10.445741653442383, "global_step": 137347, "epoch": 817} {"train_loss": -10.423561096191406, "global_step": 137348, "epoch": 817} {"train_loss": -10.938326835632324, "global_step": 137349, "epoch": 817} {"train_loss": -10.463516235351562, "global_step": 137350, "epoch": 817} {"train_loss": -10.382177352905273, "global_step": 137351, "epoch": 817} {"train_loss": -9.787643432617188, "global_step": 137352, "epoch": 817} {"train_loss": -10.532363891601562, "global_step": 137353, "epoch": 817} {"train_loss": -10.316704750061035, "global_step": 137354, "epoch": 817} {"train_loss": -10.118775367736816, "global_step": 137355, "epoch": 817} {"train_loss": -10.304859161376953, "global_step": 137356, "epoch": 817} {"train_loss": -10.113142013549805, "global_step": 137357, "epoch": 817} {"train_loss": -10.438522338867188, "global_step": 137358, "epoch": 817} {"train_loss": -10.393373489379883, "global_step": 137359, "epoch": 817} {"train_loss": -10.327858924865723, "global_step": 137360, "epoch": 817} {"train_loss": -10.316512107849121, "global_step": 137361, "epoch": 817} {"train_loss": -10.46780014038086, "global_step": 137362, "epoch": 817} {"train_loss": -9.9803466796875, "global_step": 137363, "epoch": 817} {"train_loss": -10.400083541870117, "global_step": 137364, "epoch": 817} {"train_loss": -10.494543075561523, "global_step": 137365, "epoch": 817} {"train_loss": -10.18474292755127, "global_step": 137366, "epoch": 817} {"train_loss": -10.29824161529541, "global_step": 137367, "epoch": 817} {"train_loss": -10.424715042114258, "global_step": 137368, "epoch": 817} {"train_loss": -10.497903823852539, "global_step": 137369, "epoch": 817} {"train_loss": -10.35663890838623, "global_step": 137370, "epoch": 817} {"train_loss": -10.236148834228516, "global_step": 137371, "epoch": 817} {"train_loss": -10.252001762390137, "global_step": 137372, "epoch": 817} {"train_loss": -9.90219497680664, "global_step": 137373, "epoch": 817} {"train_loss": -9.896242141723633, "global_step": 137374, "epoch": 817} {"train_loss": -10.719593048095703, "global_step": 137375, "epoch": 817} {"train_loss": -10.33027458190918, "global_step": 137376, "epoch": 817} {"train_loss": -10.28795051574707, "global_step": 137377, "epoch": 817} {"train_loss": -10.42358684539795, "global_step": 137378, "epoch": 817} {"train_loss": -10.440476417541504, "global_step": 137379, "epoch": 817} {"train_loss": -10.42609691619873, "global_step": 137380, "epoch": 817} {"train_loss": -10.226974487304688, "global_step": 137381, "epoch": 817} {"train_loss": -10.723014831542969, "global_step": 137382, "epoch": 817} {"train_loss": -10.235136032104492, "global_step": 137383, "epoch": 817} {"train_loss": -10.496463775634766, "global_step": 137384, "epoch": 817} {"train_loss": -10.284265518188477, "global_step": 137385, "epoch": 817} {"train_loss": -10.511970520019531, "global_step": 137386, "epoch": 817} {"train_loss": -10.670702934265137, "global_step": 137387, "epoch": 817} {"train_loss": -10.300506591796875, "global_step": 137388, "epoch": 817} {"train_loss": -9.955831527709961, "global_step": 137389, "epoch": 817} {"train_loss": -9.987797737121582, "global_step": 137390, "epoch": 817} {"train_loss": -10.45038890838623, "global_step": 137391, "epoch": 817} {"train_loss": -10.072653770446777, "global_step": 137392, "epoch": 817} {"train_loss": -10.272967338562012, "global_step": 137393, "epoch": 817} {"train_loss": -10.089569091796875, "global_step": 137394, "epoch": 817} {"train_loss": -10.201005935668945, "global_step": 137395, "epoch": 817} {"train_loss": -9.841599464416504, "global_step": 137396, "epoch": 817} {"train_loss": -10.007444381713867, "global_step": 137397, "epoch": 817} {"train_loss": -10.288829803466797, "global_step": 137398, "epoch": 817} {"train_loss": -10.481582641601562, "global_step": 137399, "epoch": 817} {"train_loss": -9.613468170166016, "global_step": 137400, "epoch": 817} {"train_loss": -9.666516304016113, "global_step": 137401, "epoch": 817} {"train_loss": -9.876497268676758, "global_step": 137402, "epoch": 817} {"train_loss": -9.778308868408203, "global_step": 137403, "epoch": 817} {"train_loss": -10.355297088623047, "global_step": 137404, "epoch": 817} {"train_loss": -9.809534072875977, "global_step": 137405, "epoch": 817} {"train_loss": -9.92216968536377, "global_step": 137406, "epoch": 817} {"train_loss": -10.330288887023926, "global_step": 137407, "epoch": 817} {"train_loss": -9.881929397583008, "global_step": 137408, "epoch": 817} {"train_loss": -10.2193603515625, "global_step": 137409, "epoch": 817} {"train_loss": -10.196142196655273, "global_step": 137410, "epoch": 817} {"train_loss": -10.333843231201172, "global_step": 137411, "epoch": 817} {"train_loss": -10.207411766052246, "global_step": 137412, "epoch": 817} {"train_loss": -10.036429405212402, "global_step": 137413, "epoch": 817} {"train_loss": -10.42811393737793, "global_step": 137414, "epoch": 817} {"train_loss": -10.449125289916992, "global_step": 137415, "epoch": 817} {"train_loss": -9.826729774475098, "global_step": 137416, "epoch": 817} {"train_loss": -10.714319229125977, "global_step": 137417, "epoch": 817} {"train_loss": -10.212904930114746, "global_step": 137418, "epoch": 817} {"train_loss": -10.03303337097168, "global_step": 137419, "epoch": 817} {"train_loss": -10.518533706665039, "global_step": 137420, "epoch": 817} {"train_loss": -9.737119674682617, "global_step": 137421, "epoch": 817} {"train_loss": -10.261469841003418, "global_step": 137422, "epoch": 817} {"train_loss": -10.283416373389107, "global_step": 137423, "epoch": 817, "val_loss": 224588.53125} {"train_loss": -10.204334259033203, "global_step": 137424, "epoch": 818} {"train_loss": -10.150392532348633, "global_step": 137425, "epoch": 818} {"train_loss": -10.373306274414062, "global_step": 137426, "epoch": 818} {"train_loss": -9.902780532836914, "global_step": 137427, "epoch": 818} {"train_loss": -10.243188858032227, "global_step": 137428, "epoch": 818} {"train_loss": -10.113571166992188, "global_step": 137429, "epoch": 818} {"train_loss": -10.310543060302734, "global_step": 137430, "epoch": 818} {"train_loss": -10.140499114990234, "global_step": 137431, "epoch": 818} {"train_loss": -10.13227367401123, "global_step": 137432, "epoch": 818} {"train_loss": -10.205365180969238, "global_step": 137433, "epoch": 818} {"train_loss": -9.720870971679688, "global_step": 137434, "epoch": 818} {"train_loss": -10.523628234863281, "global_step": 137435, "epoch": 818} {"train_loss": -9.989473342895508, "global_step": 137436, "epoch": 818} {"train_loss": -10.195943832397461, "global_step": 137437, "epoch": 818} {"train_loss": -9.876481056213379, "global_step": 137438, "epoch": 818} {"train_loss": -10.417378425598145, "global_step": 137439, "epoch": 818} {"train_loss": -10.145095825195312, "global_step": 137440, "epoch": 818} {"train_loss": -10.105875015258789, "global_step": 137441, "epoch": 818} {"train_loss": -10.353153228759766, "global_step": 137442, "epoch": 818} {"train_loss": -9.996984481811523, "global_step": 137443, "epoch": 818} {"train_loss": -10.010621070861816, "global_step": 137444, "epoch": 818} {"train_loss": -10.4205322265625, "global_step": 137445, "epoch": 818} {"train_loss": -9.975912094116211, "global_step": 137446, "epoch": 818} {"train_loss": -10.377275466918945, "global_step": 137447, "epoch": 818} {"train_loss": -10.610767364501953, "global_step": 137448, "epoch": 818} {"train_loss": -10.180509567260742, "global_step": 137449, "epoch": 818} {"train_loss": -10.283077239990234, "global_step": 137450, "epoch": 818} {"train_loss": -10.711930274963379, "global_step": 137451, "epoch": 818} {"train_loss": -10.205179214477539, "global_step": 137452, "epoch": 818} {"train_loss": -10.480602264404297, "global_step": 137453, "epoch": 818} {"train_loss": -10.68828010559082, "global_step": 137454, "epoch": 818} {"train_loss": -10.367570877075195, "global_step": 137455, "epoch": 818} {"train_loss": -10.604379653930664, "global_step": 137456, "epoch": 818} {"train_loss": -10.666206359863281, "global_step": 137457, "epoch": 818} {"train_loss": -10.25344467163086, "global_step": 137458, "epoch": 818} {"train_loss": -10.623857498168945, "global_step": 137459, "epoch": 818} {"train_loss": -10.427756309509277, "global_step": 137460, "epoch": 818} {"train_loss": -10.72614860534668, "global_step": 137461, "epoch": 818} {"train_loss": -10.62607192993164, "global_step": 137462, "epoch": 818} {"train_loss": -10.66722297668457, "global_step": 137463, "epoch": 818} {"train_loss": -10.529868125915527, "global_step": 137464, "epoch": 818} {"train_loss": -10.77001953125, "global_step": 137465, "epoch": 818} {"train_loss": -10.68006706237793, "global_step": 137466, "epoch": 818} {"train_loss": -10.783153533935547, "global_step": 137467, "epoch": 818} {"train_loss": -10.684622764587402, "global_step": 137468, "epoch": 818} {"train_loss": -10.738374710083008, "global_step": 137469, "epoch": 818} {"train_loss": -10.682037353515625, "global_step": 137470, "epoch": 818} {"train_loss": -10.708885192871094, "global_step": 137471, "epoch": 818} {"train_loss": -10.645051956176758, "global_step": 137472, "epoch": 818} {"train_loss": -10.51883316040039, "global_step": 137473, "epoch": 818} {"train_loss": -10.861783027648926, "global_step": 137474, "epoch": 818} {"train_loss": -10.936992645263672, "global_step": 137475, "epoch": 818} {"train_loss": -10.61746597290039, "global_step": 137476, "epoch": 818} {"train_loss": -10.842391967773438, "global_step": 137477, "epoch": 818} {"train_loss": -10.529557228088379, "global_step": 137478, "epoch": 818} {"train_loss": -10.343277931213379, "global_step": 137479, "epoch": 818} {"train_loss": -10.096853256225586, "global_step": 137480, "epoch": 818} {"train_loss": -9.841575622558594, "global_step": 137481, "epoch": 818} {"train_loss": -10.165246963500977, "global_step": 137482, "epoch": 818} {"train_loss": -10.011831283569336, "global_step": 137483, "epoch": 818} {"train_loss": -10.41685676574707, "global_step": 137484, "epoch": 818} {"train_loss": -10.374125480651855, "global_step": 137485, "epoch": 818} {"train_loss": -10.428823471069336, "global_step": 137486, "epoch": 818} {"train_loss": -10.450754165649414, "global_step": 137487, "epoch": 818} {"train_loss": -10.572863578796387, "global_step": 137488, "epoch": 818} {"train_loss": -10.417844772338867, "global_step": 137489, "epoch": 818} {"train_loss": -10.842012405395508, "global_step": 137490, "epoch": 818} {"train_loss": -10.32177734375, "global_step": 137491, "epoch": 818} {"train_loss": -10.524953842163086, "global_step": 137492, "epoch": 818} {"train_loss": -10.537114143371582, "global_step": 137493, "epoch": 818} {"train_loss": -10.256599426269531, "global_step": 137494, "epoch": 818} {"train_loss": -10.510151863098145, "global_step": 137495, "epoch": 818} {"train_loss": -10.49610710144043, "global_step": 137496, "epoch": 818} {"train_loss": -10.254425048828125, "global_step": 137497, "epoch": 818} {"train_loss": -10.510412216186523, "global_step": 137498, "epoch": 818} {"train_loss": -10.299905776977539, "global_step": 137499, "epoch": 818} {"train_loss": -10.162418365478516, "global_step": 137500, "epoch": 818} {"train_loss": -10.22941780090332, "global_step": 137501, "epoch": 818} {"train_loss": -10.680500030517578, "global_step": 137502, "epoch": 818} {"train_loss": -10.098628997802734, "global_step": 137503, "epoch": 818} {"train_loss": -10.356107711791992, "global_step": 137504, "epoch": 818} {"train_loss": -10.47201156616211, "global_step": 137505, "epoch": 818} {"train_loss": -9.935476303100586, "global_step": 137506, "epoch": 818} {"train_loss": -10.370882034301758, "global_step": 137507, "epoch": 818} {"train_loss": -9.815285682678223, "global_step": 137508, "epoch": 818} {"train_loss": -10.171865463256836, "global_step": 137509, "epoch": 818} {"train_loss": -10.222870826721191, "global_step": 137510, "epoch": 818} {"train_loss": -10.19729232788086, "global_step": 137511, "epoch": 818} {"train_loss": -10.46243667602539, "global_step": 137512, "epoch": 818} {"train_loss": -10.029354095458984, "global_step": 137513, "epoch": 818} {"train_loss": -10.542539596557617, "global_step": 137514, "epoch": 818} {"train_loss": -10.146615982055664, "global_step": 137515, "epoch": 818} {"train_loss": -10.580248832702637, "global_step": 137516, "epoch": 818} {"train_loss": -10.645665168762207, "global_step": 137517, "epoch": 818} {"train_loss": -10.515035629272461, "global_step": 137518, "epoch": 818} {"train_loss": -10.635501861572266, "global_step": 137519, "epoch": 818} {"train_loss": -10.361396789550781, "global_step": 137520, "epoch": 818} {"train_loss": -10.343942642211914, "global_step": 137521, "epoch": 818} {"train_loss": -10.559850692749023, "global_step": 137522, "epoch": 818} {"train_loss": -10.65380859375, "global_step": 137523, "epoch": 818} {"train_loss": -10.529258728027344, "global_step": 137524, "epoch": 818} {"train_loss": -10.73874568939209, "global_step": 137525, "epoch": 818} {"train_loss": -10.40194320678711, "global_step": 137526, "epoch": 818} {"train_loss": -10.398181915283203, "global_step": 137527, "epoch": 818} {"train_loss": -10.821554183959961, "global_step": 137528, "epoch": 818} {"train_loss": -10.570988655090332, "global_step": 137529, "epoch": 818} {"train_loss": -10.529104232788086, "global_step": 137530, "epoch": 818} {"train_loss": -10.43133544921875, "global_step": 137531, "epoch": 818} {"train_loss": -10.738967895507812, "global_step": 137532, "epoch": 818} {"train_loss": -10.5025634765625, "global_step": 137533, "epoch": 818} {"train_loss": -10.5291748046875, "global_step": 137534, "epoch": 818} {"train_loss": -10.62034797668457, "global_step": 137535, "epoch": 818} {"train_loss": -10.832880020141602, "global_step": 137536, "epoch": 818} {"train_loss": -10.411677360534668, "global_step": 137537, "epoch": 818} {"train_loss": -10.692437171936035, "global_step": 137538, "epoch": 818} {"train_loss": -10.853076934814453, "global_step": 137539, "epoch": 818} {"train_loss": -10.748957633972168, "global_step": 137540, "epoch": 818} {"train_loss": -10.648502349853516, "global_step": 137541, "epoch": 818} {"train_loss": -10.398272514343262, "global_step": 137542, "epoch": 818} {"train_loss": -10.816173553466797, "global_step": 137543, "epoch": 818} {"train_loss": -10.850777626037598, "global_step": 137544, "epoch": 818} {"train_loss": -10.643203735351562, "global_step": 137545, "epoch": 818} {"train_loss": -10.50297737121582, "global_step": 137546, "epoch": 818} {"train_loss": -10.575611114501953, "global_step": 137547, "epoch": 818} {"train_loss": -10.754203796386719, "global_step": 137548, "epoch": 818} {"train_loss": -10.353890419006348, "global_step": 137549, "epoch": 818} {"train_loss": -10.574649810791016, "global_step": 137550, "epoch": 818} {"train_loss": -10.448598861694336, "global_step": 137551, "epoch": 818} {"train_loss": -10.675268173217773, "global_step": 137552, "epoch": 818} {"train_loss": -10.199817657470703, "global_step": 137553, "epoch": 818} {"train_loss": -10.56663990020752, "global_step": 137554, "epoch": 818} {"train_loss": -10.377288818359375, "global_step": 137555, "epoch": 818} {"train_loss": -10.581910133361816, "global_step": 137556, "epoch": 818} {"train_loss": -10.541248321533203, "global_step": 137557, "epoch": 818} {"train_loss": -10.01972484588623, "global_step": 137558, "epoch": 818} {"train_loss": -10.528844833374023, "global_step": 137559, "epoch": 818} {"train_loss": -10.358829498291016, "global_step": 137560, "epoch": 818} {"train_loss": -10.46027660369873, "global_step": 137561, "epoch": 818} {"train_loss": -10.668901443481445, "global_step": 137562, "epoch": 818} {"train_loss": -10.101659774780273, "global_step": 137563, "epoch": 818} {"train_loss": -10.701231002807617, "global_step": 137564, "epoch": 818} {"train_loss": -10.571858406066895, "global_step": 137565, "epoch": 818} {"train_loss": -10.398908615112305, "global_step": 137566, "epoch": 818} {"train_loss": -10.435444831848145, "global_step": 137567, "epoch": 818} {"train_loss": -10.424203872680664, "global_step": 137568, "epoch": 818} {"train_loss": -10.641385078430176, "global_step": 137569, "epoch": 818} {"train_loss": -10.539897918701172, "global_step": 137570, "epoch": 818} {"train_loss": -10.719477653503418, "global_step": 137571, "epoch": 818} {"train_loss": -10.284637451171875, "global_step": 137572, "epoch": 818} {"train_loss": -10.568140983581543, "global_step": 137573, "epoch": 818} {"train_loss": -10.5908784866333, "global_step": 137574, "epoch": 818} {"train_loss": -10.237649917602539, "global_step": 137575, "epoch": 818} {"train_loss": -10.474067687988281, "global_step": 137576, "epoch": 818} {"train_loss": -10.58758544921875, "global_step": 137577, "epoch": 818} {"train_loss": -10.336009979248047, "global_step": 137578, "epoch": 818} {"train_loss": -10.587492942810059, "global_step": 137579, "epoch": 818} {"train_loss": -10.185981750488281, "global_step": 137580, "epoch": 818} {"train_loss": -10.404108047485352, "global_step": 137581, "epoch": 818} {"train_loss": -10.604789733886719, "global_step": 137582, "epoch": 818} {"train_loss": -9.968240737915039, "global_step": 137583, "epoch": 818} {"train_loss": -10.413066864013672, "global_step": 137584, "epoch": 818} {"train_loss": -9.861126899719238, "global_step": 137585, "epoch": 818} {"train_loss": -10.225536346435547, "global_step": 137586, "epoch": 818} {"train_loss": -10.082307815551758, "global_step": 137587, "epoch": 818} {"train_loss": -10.119487762451172, "global_step": 137588, "epoch": 818} {"train_loss": -10.243062973022461, "global_step": 137589, "epoch": 818} {"train_loss": -10.04531478881836, "global_step": 137590, "epoch": 818} {"train_loss": -10.424523921239944, "global_step": 137591, "epoch": 818, "val_loss": 225759.578125} {"train_loss": -9.18912124633789, "global_step": 137592, "epoch": 819} {"train_loss": -10.368085861206055, "global_step": 137593, "epoch": 819} {"train_loss": -9.591849327087402, "global_step": 137594, "epoch": 819} {"train_loss": -10.013045310974121, "global_step": 137595, "epoch": 819} {"train_loss": -9.972225189208984, "global_step": 137596, "epoch": 819} {"train_loss": -9.876163482666016, "global_step": 137597, "epoch": 819} {"train_loss": -10.16168212890625, "global_step": 137598, "epoch": 819} {"train_loss": -10.015928268432617, "global_step": 137599, "epoch": 819} {"train_loss": -10.36068058013916, "global_step": 137600, "epoch": 819} {"train_loss": -10.081514358520508, "global_step": 137601, "epoch": 819} {"train_loss": -10.408731460571289, "global_step": 137602, "epoch": 819} {"train_loss": -10.349457740783691, "global_step": 137603, "epoch": 819} {"train_loss": -10.259636878967285, "global_step": 137604, "epoch": 819} {"train_loss": -10.093961715698242, "global_step": 137605, "epoch": 819} {"train_loss": -10.494556427001953, "global_step": 137606, "epoch": 819} {"train_loss": -10.158935546875, "global_step": 137607, "epoch": 819} {"train_loss": -10.489086151123047, "global_step": 137608, "epoch": 819} {"train_loss": -10.296585083007812, "global_step": 137609, "epoch": 819} {"train_loss": -10.403217315673828, "global_step": 137610, "epoch": 819} {"train_loss": -10.320413589477539, "global_step": 137611, "epoch": 819} {"train_loss": -10.630876541137695, "global_step": 137612, "epoch": 819} {"train_loss": -10.324395179748535, "global_step": 137613, "epoch": 819} {"train_loss": -10.112147331237793, "global_step": 137614, "epoch": 819} {"train_loss": -10.25174331665039, "global_step": 137615, "epoch": 819} {"train_loss": -10.14499282836914, "global_step": 137616, "epoch": 819} {"train_loss": -10.379953384399414, "global_step": 137617, "epoch": 819} {"train_loss": -10.250143051147461, "global_step": 137618, "epoch": 819} {"train_loss": -10.276291847229004, "global_step": 137619, "epoch": 819} {"train_loss": -10.477993965148926, "global_step": 137620, "epoch": 819} {"train_loss": -10.532747268676758, "global_step": 137621, "epoch": 819} {"train_loss": -10.476919174194336, "global_step": 137622, "epoch": 819} {"train_loss": -10.288145065307617, "global_step": 137623, "epoch": 819} {"train_loss": -10.547151565551758, "global_step": 137624, "epoch": 819} {"train_loss": -10.585809707641602, "global_step": 137625, "epoch": 819} {"train_loss": -10.554641723632812, "global_step": 137626, "epoch": 819} {"train_loss": -10.238319396972656, "global_step": 137627, "epoch": 819} {"train_loss": -10.34927749633789, "global_step": 137628, "epoch": 819} {"train_loss": -10.661643981933594, "global_step": 137629, "epoch": 819} {"train_loss": -10.50979232788086, "global_step": 137630, "epoch": 819} {"train_loss": -10.557016372680664, "global_step": 137631, "epoch": 819} {"train_loss": -10.545591354370117, "global_step": 137632, "epoch": 819} {"train_loss": -10.69925308227539, "global_step": 137633, "epoch": 819} {"train_loss": -10.642789840698242, "global_step": 137634, "epoch": 819} {"train_loss": -10.722959518432617, "global_step": 137635, "epoch": 819} {"train_loss": -10.605958938598633, "global_step": 137636, "epoch": 819} {"train_loss": -10.555665016174316, "global_step": 137637, "epoch": 819} {"train_loss": -10.856740951538086, "global_step": 137638, "epoch": 819} {"train_loss": -10.720561027526855, "global_step": 137639, "epoch": 819} {"train_loss": -10.700448036193848, "global_step": 137640, "epoch": 819} {"train_loss": -10.704366683959961, "global_step": 137641, "epoch": 819} {"train_loss": -10.792247772216797, "global_step": 137642, "epoch": 819} {"train_loss": -10.91988468170166, "global_step": 137643, "epoch": 819} {"train_loss": -10.854223251342773, "global_step": 137644, "epoch": 819} {"train_loss": -10.76462173461914, "global_step": 137645, "epoch": 819} {"train_loss": -10.967069625854492, "global_step": 137646, "epoch": 819} {"train_loss": -10.737911224365234, "global_step": 137647, "epoch": 819} {"train_loss": -10.74337387084961, "global_step": 137648, "epoch": 819} {"train_loss": -10.724609375, "global_step": 137649, "epoch": 819} {"train_loss": -10.501102447509766, "global_step": 137650, "epoch": 819} {"train_loss": -10.627653121948242, "global_step": 137651, "epoch": 819} {"train_loss": -10.793254852294922, "global_step": 137652, "epoch": 819} {"train_loss": -10.609598159790039, "global_step": 137653, "epoch": 819} {"train_loss": -10.66756820678711, "global_step": 137654, "epoch": 819} {"train_loss": -10.839798927307129, "global_step": 137655, "epoch": 819} {"train_loss": -10.50097370147705, "global_step": 137656, "epoch": 819} {"train_loss": -10.84528923034668, "global_step": 137657, "epoch": 819} {"train_loss": -10.442188262939453, "global_step": 137658, "epoch": 819} {"train_loss": -10.967988014221191, "global_step": 137659, "epoch": 819} {"train_loss": -10.545878410339355, "global_step": 137660, "epoch": 819} {"train_loss": -10.425228118896484, "global_step": 137661, "epoch": 819} {"train_loss": -11.024798393249512, "global_step": 137662, "epoch": 819} {"train_loss": -10.861810684204102, "global_step": 137663, "epoch": 819} {"train_loss": -10.737483978271484, "global_step": 137664, "epoch": 819} {"train_loss": -10.527727127075195, "global_step": 137665, "epoch": 819} {"train_loss": -10.66123104095459, "global_step": 137666, "epoch": 819} {"train_loss": -10.402174949645996, "global_step": 137667, "epoch": 819} {"train_loss": -10.652473449707031, "global_step": 137668, "epoch": 819} {"train_loss": -10.535161018371582, "global_step": 137669, "epoch": 819} {"train_loss": -10.368457794189453, "global_step": 137670, "epoch": 819} {"train_loss": -10.17774772644043, "global_step": 137671, "epoch": 819} {"train_loss": -10.255399703979492, "global_step": 137672, "epoch": 819} {"train_loss": -10.527901649475098, "global_step": 137673, "epoch": 819} {"train_loss": -10.306316375732422, "global_step": 137674, "epoch": 819} {"train_loss": -10.137123107910156, "global_step": 137675, "epoch": 819} {"train_loss": -10.322663307189941, "global_step": 137676, "epoch": 819} {"train_loss": -9.526208877563477, "global_step": 137677, "epoch": 819} {"train_loss": -10.703237533569336, "global_step": 137678, "epoch": 819} {"train_loss": -9.280940055847168, "global_step": 137679, "epoch": 819} {"train_loss": -9.83151626586914, "global_step": 137680, "epoch": 819} {"train_loss": -10.327994346618652, "global_step": 137681, "epoch": 819} {"train_loss": -8.684183120727539, "global_step": 137682, "epoch": 819} {"train_loss": -10.802489280700684, "global_step": 137683, "epoch": 819} {"train_loss": -9.072064399719238, "global_step": 137684, "epoch": 819} {"train_loss": -10.356522560119629, "global_step": 137685, "epoch": 819} {"train_loss": -10.113327980041504, "global_step": 137686, "epoch": 819} {"train_loss": -10.043144226074219, "global_step": 137687, "epoch": 819} {"train_loss": -10.422409057617188, "global_step": 137688, "epoch": 819} {"train_loss": -10.195646286010742, "global_step": 137689, "epoch": 819} {"train_loss": -10.431070327758789, "global_step": 137690, "epoch": 819} {"train_loss": -10.373100280761719, "global_step": 137691, "epoch": 819} {"train_loss": -10.423971176147461, "global_step": 137692, "epoch": 819} {"train_loss": -10.4573974609375, "global_step": 137693, "epoch": 819} {"train_loss": -10.48318862915039, "global_step": 137694, "epoch": 819} {"train_loss": -10.531405448913574, "global_step": 137695, "epoch": 819} {"train_loss": -10.420501708984375, "global_step": 137696, "epoch": 819} {"train_loss": -10.353428840637207, "global_step": 137697, "epoch": 819} {"train_loss": -10.632650375366211, "global_step": 137698, "epoch": 819} {"train_loss": -10.733699798583984, "global_step": 137699, "epoch": 819} {"train_loss": -10.603605270385742, "global_step": 137700, "epoch": 819} {"train_loss": -10.644170761108398, "global_step": 137701, "epoch": 819} {"train_loss": -10.487495422363281, "global_step": 137702, "epoch": 819} {"train_loss": -10.339599609375, "global_step": 137703, "epoch": 819} {"train_loss": -10.402913093566895, "global_step": 137704, "epoch": 819} {"train_loss": -10.387079238891602, "global_step": 137705, "epoch": 819} {"train_loss": -10.703485488891602, "global_step": 137706, "epoch": 819} {"train_loss": -10.519208908081055, "global_step": 137707, "epoch": 819} {"train_loss": -10.393865585327148, "global_step": 137708, "epoch": 819} {"train_loss": -10.68441390991211, "global_step": 137709, "epoch": 819} {"train_loss": -10.536876678466797, "global_step": 137710, "epoch": 819} {"train_loss": -10.522171974182129, "global_step": 137711, "epoch": 819} {"train_loss": -10.637243270874023, "global_step": 137712, "epoch": 819} {"train_loss": -10.539546012878418, "global_step": 137713, "epoch": 819} {"train_loss": -10.594437599182129, "global_step": 137714, "epoch": 819} {"train_loss": -10.416177749633789, "global_step": 137715, "epoch": 819} {"train_loss": -10.77212142944336, "global_step": 137716, "epoch": 819} {"train_loss": -10.4905366897583, "global_step": 137717, "epoch": 819} {"train_loss": -10.818134307861328, "global_step": 137718, "epoch": 819} {"train_loss": -10.684142112731934, "global_step": 137719, "epoch": 819} {"train_loss": -10.709514617919922, "global_step": 137720, "epoch": 819} {"train_loss": -10.543657302856445, "global_step": 137721, "epoch": 819} {"train_loss": -10.463659286499023, "global_step": 137722, "epoch": 819} {"train_loss": -10.385357856750488, "global_step": 137723, "epoch": 819} {"train_loss": -10.648151397705078, "global_step": 137724, "epoch": 819} {"train_loss": -10.520586013793945, "global_step": 137725, "epoch": 819} {"train_loss": -9.996384620666504, "global_step": 137726, "epoch": 819} {"train_loss": -10.548309326171875, "global_step": 137727, "epoch": 819} {"train_loss": -10.151936531066895, "global_step": 137728, "epoch": 819} {"train_loss": -9.917428016662598, "global_step": 137729, "epoch": 819} {"train_loss": -10.678423881530762, "global_step": 137730, "epoch": 819} {"train_loss": -10.161720275878906, "global_step": 137731, "epoch": 819} {"train_loss": -10.537607192993164, "global_step": 137732, "epoch": 819} {"train_loss": -10.160205841064453, "global_step": 137733, "epoch": 819} {"train_loss": -10.568796157836914, "global_step": 137734, "epoch": 819} {"train_loss": -10.283464431762695, "global_step": 137735, "epoch": 819} {"train_loss": -10.609561920166016, "global_step": 137736, "epoch": 819} {"train_loss": -10.245370864868164, "global_step": 137737, "epoch": 819} {"train_loss": -10.440925598144531, "global_step": 137738, "epoch": 819} {"train_loss": -10.38043212890625, "global_step": 137739, "epoch": 819} {"train_loss": -10.3916597366333, "global_step": 137740, "epoch": 819} {"train_loss": -10.739280700683594, "global_step": 137741, "epoch": 819} {"train_loss": -10.617825508117676, "global_step": 137742, "epoch": 819} {"train_loss": -10.600781440734863, "global_step": 137743, "epoch": 819} {"train_loss": -10.467872619628906, "global_step": 137744, "epoch": 819} {"train_loss": -10.7045316696167, "global_step": 137745, "epoch": 819} {"train_loss": -10.729145050048828, "global_step": 137746, "epoch": 819} {"train_loss": -10.739822387695312, "global_step": 137747, "epoch": 819} {"train_loss": -10.7791748046875, "global_step": 137748, "epoch": 819} {"train_loss": -10.71180534362793, "global_step": 137749, "epoch": 819} {"train_loss": -10.822245597839355, "global_step": 137750, "epoch": 819} {"train_loss": -10.585309982299805, "global_step": 137751, "epoch": 819} {"train_loss": -10.32196044921875, "global_step": 137752, "epoch": 819} {"train_loss": -10.459890365600586, "global_step": 137753, "epoch": 819} {"train_loss": -10.069950103759766, "global_step": 137754, "epoch": 819} {"train_loss": -10.7265625, "global_step": 137755, "epoch": 819} {"train_loss": -9.952417373657227, "global_step": 137756, "epoch": 819} {"train_loss": -10.254858016967773, "global_step": 137757, "epoch": 819} {"train_loss": -10.564558029174805, "global_step": 137758, "epoch": 819} {"train_loss": -10.435275560333615, "global_step": 137759, "epoch": 819, "val_loss": 216956.5625} {"train_loss": -9.903350830078125, "global_step": 137760, "epoch": 820} {"train_loss": -9.722326278686523, "global_step": 137761, "epoch": 820} {"train_loss": -9.200395584106445, "global_step": 137762, "epoch": 820} {"train_loss": -9.878198623657227, "global_step": 137763, "epoch": 820} {"train_loss": -9.147930145263672, "global_step": 137764, "epoch": 820} {"train_loss": -9.470916748046875, "global_step": 137765, "epoch": 820} {"train_loss": -9.450623512268066, "global_step": 137766, "epoch": 820} {"train_loss": -10.350563049316406, "global_step": 137767, "epoch": 820} {"train_loss": -9.647405624389648, "global_step": 137768, "epoch": 820} {"train_loss": -10.406314849853516, "global_step": 137769, "epoch": 820} {"train_loss": -9.740901947021484, "global_step": 137770, "epoch": 820} {"train_loss": -10.18045425415039, "global_step": 137771, "epoch": 820} {"train_loss": -9.73695182800293, "global_step": 137772, "epoch": 820} {"train_loss": -10.25294303894043, "global_step": 137773, "epoch": 820} {"train_loss": -9.739667892456055, "global_step": 137774, "epoch": 820} {"train_loss": -10.263912200927734, "global_step": 137775, "epoch": 820} {"train_loss": -10.073578834533691, "global_step": 137776, "epoch": 820} {"train_loss": -10.222415924072266, "global_step": 137777, "epoch": 820} {"train_loss": -10.269147872924805, "global_step": 137778, "epoch": 820} {"train_loss": -10.001749992370605, "global_step": 137779, "epoch": 820} {"train_loss": -10.405862808227539, "global_step": 137780, "epoch": 820} {"train_loss": -10.162712097167969, "global_step": 137781, "epoch": 820} {"train_loss": -10.335135459899902, "global_step": 137782, "epoch": 820} {"train_loss": -10.550323486328125, "global_step": 137783, "epoch": 820} {"train_loss": -10.32786750793457, "global_step": 137784, "epoch": 820} {"train_loss": -10.24249267578125, "global_step": 137785, "epoch": 820} {"train_loss": -10.464588165283203, "global_step": 137786, "epoch": 820} {"train_loss": -10.193398475646973, "global_step": 137787, "epoch": 820} {"train_loss": -10.652095794677734, "global_step": 137788, "epoch": 820} {"train_loss": -10.328447341918945, "global_step": 137789, "epoch": 820} {"train_loss": -10.571239471435547, "global_step": 137790, "epoch": 820} {"train_loss": -10.483930587768555, "global_step": 137791, "epoch": 820} {"train_loss": -10.579707145690918, "global_step": 137792, "epoch": 820} {"train_loss": -10.656257629394531, "global_step": 137793, "epoch": 820} {"train_loss": -10.564160346984863, "global_step": 137794, "epoch": 820} {"train_loss": -10.567110061645508, "global_step": 137795, "epoch": 820} {"train_loss": -10.627065658569336, "global_step": 137796, "epoch": 820} {"train_loss": -10.306509017944336, "global_step": 137797, "epoch": 820} {"train_loss": -10.471549987792969, "global_step": 137798, "epoch": 820} {"train_loss": -10.637165069580078, "global_step": 137799, "epoch": 820} {"train_loss": -10.77954387664795, "global_step": 137800, "epoch": 820} {"train_loss": -10.49677848815918, "global_step": 137801, "epoch": 820} {"train_loss": -10.836021423339844, "global_step": 137802, "epoch": 820} {"train_loss": -10.557493209838867, "global_step": 137803, "epoch": 820} {"train_loss": -10.490619659423828, "global_step": 137804, "epoch": 820} {"train_loss": -10.716536521911621, "global_step": 137805, "epoch": 820} {"train_loss": -10.69428825378418, "global_step": 137806, "epoch": 820} {"train_loss": -10.573894500732422, "global_step": 137807, "epoch": 820} {"train_loss": -10.793848037719727, "global_step": 137808, "epoch": 820} {"train_loss": -10.665908813476562, "global_step": 137809, "epoch": 820} {"train_loss": -10.732646942138672, "global_step": 137810, "epoch": 820} {"train_loss": -10.773988723754883, "global_step": 137811, "epoch": 820} {"train_loss": -10.722099304199219, "global_step": 137812, "epoch": 820} {"train_loss": -10.70113754272461, "global_step": 137813, "epoch": 820} {"train_loss": -10.688423156738281, "global_step": 137814, "epoch": 820} {"train_loss": -10.723865509033203, "global_step": 137815, "epoch": 820} {"train_loss": -10.816132545471191, "global_step": 137816, "epoch": 820} {"train_loss": -10.739070892333984, "global_step": 137817, "epoch": 820} {"train_loss": -10.459955215454102, "global_step": 137818, "epoch": 820} {"train_loss": -10.401618003845215, "global_step": 137819, "epoch": 820} {"train_loss": -10.728216171264648, "global_step": 137820, "epoch": 820} {"train_loss": -10.551478385925293, "global_step": 137821, "epoch": 820} {"train_loss": -10.231749534606934, "global_step": 137822, "epoch": 820} {"train_loss": -9.774848937988281, "global_step": 137823, "epoch": 820} {"train_loss": -10.114877700805664, "global_step": 137824, "epoch": 820} {"train_loss": -8.097829818725586, "global_step": 137825, "epoch": 820} {"train_loss": -9.537275314331055, "global_step": 137826, "epoch": 820} {"train_loss": -9.751510620117188, "global_step": 137827, "epoch": 820} {"train_loss": -9.665149688720703, "global_step": 137828, "epoch": 820} {"train_loss": -10.194201469421387, "global_step": 137829, "epoch": 820} {"train_loss": -9.458318710327148, "global_step": 137830, "epoch": 820} {"train_loss": -10.15859603881836, "global_step": 137831, "epoch": 820} {"train_loss": -10.124282836914062, "global_step": 137832, "epoch": 820} {"train_loss": -10.198502540588379, "global_step": 137833, "epoch": 820} {"train_loss": -10.216085433959961, "global_step": 137834, "epoch": 820} {"train_loss": -9.833595275878906, "global_step": 137835, "epoch": 820} {"train_loss": -10.260008811950684, "global_step": 137836, "epoch": 820} {"train_loss": -10.115180969238281, "global_step": 137837, "epoch": 820} {"train_loss": -10.114578247070312, "global_step": 137838, "epoch": 820} {"train_loss": -10.127552032470703, "global_step": 137839, "epoch": 820} {"train_loss": -9.988836288452148, "global_step": 137840, "epoch": 820} {"train_loss": -10.18853759765625, "global_step": 137841, "epoch": 820} {"train_loss": -10.14950942993164, "global_step": 137842, "epoch": 820} {"train_loss": -10.075214385986328, "global_step": 137843, "epoch": 820} {"train_loss": -10.506980895996094, "global_step": 137844, "epoch": 820} {"train_loss": -10.315345764160156, "global_step": 137845, "epoch": 820} {"train_loss": -10.309979438781738, "global_step": 137846, "epoch": 820} {"train_loss": -10.273691177368164, "global_step": 137847, "epoch": 820} {"train_loss": -10.319807052612305, "global_step": 137848, "epoch": 820} {"train_loss": -10.762093544006348, "global_step": 137849, "epoch": 820} {"train_loss": -10.700345993041992, "global_step": 137850, "epoch": 820} {"train_loss": -10.55614948272705, "global_step": 137851, "epoch": 820} {"train_loss": -10.425737380981445, "global_step": 137852, "epoch": 820} {"train_loss": -10.45236587524414, "global_step": 137853, "epoch": 820} {"train_loss": -10.695661544799805, "global_step": 137854, "epoch": 820} {"train_loss": -10.670385360717773, "global_step": 137855, "epoch": 820} {"train_loss": -10.723109245300293, "global_step": 137856, "epoch": 820} {"train_loss": -10.721826553344727, "global_step": 137857, "epoch": 820} {"train_loss": -10.655935287475586, "global_step": 137858, "epoch": 820} {"train_loss": -10.783968925476074, "global_step": 137859, "epoch": 820} {"train_loss": -10.654777526855469, "global_step": 137860, "epoch": 820} {"train_loss": -10.8040132522583, "global_step": 137861, "epoch": 820} {"train_loss": -10.59805679321289, "global_step": 137862, "epoch": 820} {"train_loss": -10.668599128723145, "global_step": 137863, "epoch": 820} {"train_loss": -10.661092758178711, "global_step": 137864, "epoch": 820} {"train_loss": -10.891752243041992, "global_step": 137865, "epoch": 820} {"train_loss": -10.456838607788086, "global_step": 137866, "epoch": 820} {"train_loss": -10.58256721496582, "global_step": 137867, "epoch": 820} {"train_loss": -10.687021255493164, "global_step": 137868, "epoch": 820} {"train_loss": -10.69994068145752, "global_step": 137869, "epoch": 820} {"train_loss": -10.673585891723633, "global_step": 137870, "epoch": 820} {"train_loss": -10.88969898223877, "global_step": 137871, "epoch": 820} {"train_loss": -10.866859436035156, "global_step": 137872, "epoch": 820} {"train_loss": -10.685311317443848, "global_step": 137873, "epoch": 820} {"train_loss": -10.800999641418457, "global_step": 137874, "epoch": 820} {"train_loss": -10.90151309967041, "global_step": 137875, "epoch": 820} {"train_loss": -10.948925018310547, "global_step": 137876, "epoch": 820} {"train_loss": -10.904003143310547, "global_step": 137877, "epoch": 820} {"train_loss": -10.941693305969238, "global_step": 137878, "epoch": 820} {"train_loss": -10.795284271240234, "global_step": 137879, "epoch": 820} {"train_loss": -10.900760650634766, "global_step": 137880, "epoch": 820} {"train_loss": -10.651331901550293, "global_step": 137881, "epoch": 820} {"train_loss": -10.656375885009766, "global_step": 137882, "epoch": 820} {"train_loss": -10.497016906738281, "global_step": 137883, "epoch": 820} {"train_loss": -10.601022720336914, "global_step": 137884, "epoch": 820} {"train_loss": -10.261445999145508, "global_step": 137885, "epoch": 820} {"train_loss": -10.272058486938477, "global_step": 137886, "epoch": 820} {"train_loss": -10.091421127319336, "global_step": 137887, "epoch": 820} {"train_loss": -10.385379791259766, "global_step": 137888, "epoch": 820} {"train_loss": -9.816051483154297, "global_step": 137889, "epoch": 820} {"train_loss": -10.674467086791992, "global_step": 137890, "epoch": 820} {"train_loss": -9.429193496704102, "global_step": 137891, "epoch": 820} {"train_loss": -7.683589458465576, "global_step": 137892, "epoch": 820} {"train_loss": -9.170690536499023, "global_step": 137893, "epoch": 820} {"train_loss": -9.698648452758789, "global_step": 137894, "epoch": 820} {"train_loss": -9.751218795776367, "global_step": 137895, "epoch": 820} {"train_loss": -10.32197093963623, "global_step": 137896, "epoch": 820} {"train_loss": -9.369955062866211, "global_step": 137897, "epoch": 820} {"train_loss": -10.190275192260742, "global_step": 137898, "epoch": 820} {"train_loss": -9.949503898620605, "global_step": 137899, "epoch": 820} {"train_loss": -10.132928848266602, "global_step": 137900, "epoch": 820} {"train_loss": -10.34883975982666, "global_step": 137901, "epoch": 820} {"train_loss": -10.015666961669922, "global_step": 137902, "epoch": 820} {"train_loss": -10.014827728271484, "global_step": 137903, "epoch": 820} {"train_loss": -9.92905330657959, "global_step": 137904, "epoch": 820} {"train_loss": -10.151506423950195, "global_step": 137905, "epoch": 820} {"train_loss": -10.089347839355469, "global_step": 137906, "epoch": 820} {"train_loss": -10.215213775634766, "global_step": 137907, "epoch": 820} {"train_loss": -9.85426139831543, "global_step": 137908, "epoch": 820} {"train_loss": -10.624982833862305, "global_step": 137909, "epoch": 820} {"train_loss": -10.284516334533691, "global_step": 137910, "epoch": 820} {"train_loss": -10.34498405456543, "global_step": 137911, "epoch": 820} {"train_loss": -10.284070014953613, "global_step": 137912, "epoch": 820} {"train_loss": -10.102659225463867, "global_step": 137913, "epoch": 820} {"train_loss": -10.325757026672363, "global_step": 137914, "epoch": 820} {"train_loss": -10.463735580444336, "global_step": 137915, "epoch": 820} {"train_loss": -10.507587432861328, "global_step": 137916, "epoch": 820} {"train_loss": -10.70965576171875, "global_step": 137917, "epoch": 820} {"train_loss": -10.56274700164795, "global_step": 137918, "epoch": 820} {"train_loss": -10.545597076416016, "global_step": 137919, "epoch": 820} {"train_loss": -10.688211441040039, "global_step": 137920, "epoch": 820} {"train_loss": -10.544282913208008, "global_step": 137921, "epoch": 820} {"train_loss": -10.510028839111328, "global_step": 137922, "epoch": 820} {"train_loss": -10.696720123291016, "global_step": 137923, "epoch": 820} {"train_loss": -10.337312698364258, "global_step": 137924, "epoch": 820} {"train_loss": -10.711492538452148, "global_step": 137925, "epoch": 820} {"train_loss": -10.559263229370117, "global_step": 137926, "epoch": 820} {"train_loss": -10.321537230695997, "global_step": 137927, "epoch": 820, "val_loss": 216493.71875, "train_action_mse_error": 2.2368903160095215} {"train_loss": -10.58924388885498, "global_step": 137928, "epoch": 821} {"train_loss": -10.707110404968262, "global_step": 137929, "epoch": 821} {"train_loss": -10.628189086914062, "global_step": 137930, "epoch": 821} {"train_loss": -10.51679801940918, "global_step": 137931, "epoch": 821} {"train_loss": -10.456478118896484, "global_step": 137932, "epoch": 821} {"train_loss": -10.642555236816406, "global_step": 137933, "epoch": 821} {"train_loss": -10.570243835449219, "global_step": 137934, "epoch": 821} {"train_loss": -10.680315017700195, "global_step": 137935, "epoch": 821} {"train_loss": -10.506917953491211, "global_step": 137936, "epoch": 821} {"train_loss": -10.809160232543945, "global_step": 137937, "epoch": 821} {"train_loss": -10.801566123962402, "global_step": 137938, "epoch": 821} {"train_loss": -10.754724502563477, "global_step": 137939, "epoch": 821} {"train_loss": -10.70356559753418, "global_step": 137940, "epoch": 821} {"train_loss": -10.797574996948242, "global_step": 137941, "epoch": 821} {"train_loss": -10.751325607299805, "global_step": 137942, "epoch": 821} {"train_loss": -10.903509140014648, "global_step": 137943, "epoch": 821} {"train_loss": -10.747214317321777, "global_step": 137944, "epoch": 821} {"train_loss": -10.549030303955078, "global_step": 137945, "epoch": 821} {"train_loss": -10.850420951843262, "global_step": 137946, "epoch": 821} {"train_loss": -10.687952041625977, "global_step": 137947, "epoch": 821} {"train_loss": -10.773086547851562, "global_step": 137948, "epoch": 821} {"train_loss": -10.399770736694336, "global_step": 137949, "epoch": 821} {"train_loss": -10.636022567749023, "global_step": 137950, "epoch": 821} {"train_loss": -10.727158546447754, "global_step": 137951, "epoch": 821} {"train_loss": -10.51850414276123, "global_step": 137952, "epoch": 821} {"train_loss": -10.803427696228027, "global_step": 137953, "epoch": 821} {"train_loss": -10.520397186279297, "global_step": 137954, "epoch": 821} {"train_loss": -9.667594909667969, "global_step": 137955, "epoch": 821} {"train_loss": -10.129020690917969, "global_step": 137956, "epoch": 821} {"train_loss": -10.513792037963867, "global_step": 137957, "epoch": 821} {"train_loss": -10.601295471191406, "global_step": 137958, "epoch": 821} {"train_loss": -10.208658218383789, "global_step": 137959, "epoch": 821} {"train_loss": -10.818500518798828, "global_step": 137960, "epoch": 821} {"train_loss": -10.543630599975586, "global_step": 137961, "epoch": 821} {"train_loss": -10.347196578979492, "global_step": 137962, "epoch": 821} {"train_loss": -10.639968872070312, "global_step": 137963, "epoch": 821} {"train_loss": -10.158991813659668, "global_step": 137964, "epoch": 821} {"train_loss": -10.423186302185059, "global_step": 137965, "epoch": 821} {"train_loss": -9.92532730102539, "global_step": 137966, "epoch": 821} {"train_loss": -9.587963104248047, "global_step": 137967, "epoch": 821} {"train_loss": -10.223848342895508, "global_step": 137968, "epoch": 821} {"train_loss": -10.101192474365234, "global_step": 137969, "epoch": 821} {"train_loss": -10.37067699432373, "global_step": 137970, "epoch": 821} {"train_loss": -9.855904579162598, "global_step": 137971, "epoch": 821} {"train_loss": -10.215005874633789, "global_step": 137972, "epoch": 821} {"train_loss": -10.00044059753418, "global_step": 137973, "epoch": 821} {"train_loss": -10.179915428161621, "global_step": 137974, "epoch": 821} {"train_loss": -10.577038764953613, "global_step": 137975, "epoch": 821} {"train_loss": -10.237208366394043, "global_step": 137976, "epoch": 821} {"train_loss": -10.354019165039062, "global_step": 137977, "epoch": 821} {"train_loss": -10.291385650634766, "global_step": 137978, "epoch": 821} {"train_loss": -9.72188663482666, "global_step": 137979, "epoch": 821} {"train_loss": -10.168724060058594, "global_step": 137980, "epoch": 821} {"train_loss": -9.960394859313965, "global_step": 137981, "epoch": 821} {"train_loss": -10.612688064575195, "global_step": 137982, "epoch": 821} {"train_loss": -10.546954154968262, "global_step": 137983, "epoch": 821} {"train_loss": -10.318359375, "global_step": 137984, "epoch": 821} {"train_loss": -10.319771766662598, "global_step": 137985, "epoch": 821} {"train_loss": -10.377357482910156, "global_step": 137986, "epoch": 821} {"train_loss": -10.442468643188477, "global_step": 137987, "epoch": 821} {"train_loss": -10.291046142578125, "global_step": 137988, "epoch": 821} {"train_loss": -10.481727600097656, "global_step": 137989, "epoch": 821} {"train_loss": -10.468317985534668, "global_step": 137990, "epoch": 821} {"train_loss": -10.612178802490234, "global_step": 137991, "epoch": 821} {"train_loss": -10.372490882873535, "global_step": 137992, "epoch": 821} {"train_loss": -10.56236743927002, "global_step": 137993, "epoch": 821} {"train_loss": -10.534388542175293, "global_step": 137994, "epoch": 821} {"train_loss": -10.531907081604004, "global_step": 137995, "epoch": 821} {"train_loss": -10.369441986083984, "global_step": 137996, "epoch": 821} {"train_loss": -10.649360656738281, "global_step": 137997, "epoch": 821} {"train_loss": -10.47728157043457, "global_step": 137998, "epoch": 821} {"train_loss": -10.828685760498047, "global_step": 137999, "epoch": 821} {"train_loss": -10.372875213623047, "global_step": 138000, "epoch": 821} {"train_loss": -10.700835227966309, "global_step": 138001, "epoch": 821} {"train_loss": -10.532501220703125, "global_step": 138002, "epoch": 821} {"train_loss": -10.485462188720703, "global_step": 138003, "epoch": 821} {"train_loss": -10.757577896118164, "global_step": 138004, "epoch": 821} {"train_loss": -10.654768943786621, "global_step": 138005, "epoch": 821} {"train_loss": -10.559814453125, "global_step": 138006, "epoch": 821} {"train_loss": -10.510286331176758, "global_step": 138007, "epoch": 821} {"train_loss": -10.657052993774414, "global_step": 138008, "epoch": 821} {"train_loss": -10.143824577331543, "global_step": 138009, "epoch": 821} {"train_loss": -10.487156867980957, "global_step": 138010, "epoch": 821} {"train_loss": -10.369841575622559, "global_step": 138011, "epoch": 821} {"train_loss": -10.291508674621582, "global_step": 138012, "epoch": 821} {"train_loss": -10.656411170959473, "global_step": 138013, "epoch": 821} {"train_loss": -10.400503158569336, "global_step": 138014, "epoch": 821} {"train_loss": -10.60710334777832, "global_step": 138015, "epoch": 821} {"train_loss": -10.433988571166992, "global_step": 138016, "epoch": 821} {"train_loss": -10.702495574951172, "global_step": 138017, "epoch": 821} {"train_loss": -10.151952743530273, "global_step": 138018, "epoch": 821} {"train_loss": -10.733556747436523, "global_step": 138019, "epoch": 821} {"train_loss": -10.40107250213623, "global_step": 138020, "epoch": 821} {"train_loss": -10.116401672363281, "global_step": 138021, "epoch": 821} {"train_loss": -10.617807388305664, "global_step": 138022, "epoch": 821} {"train_loss": -10.433938980102539, "global_step": 138023, "epoch": 821} {"train_loss": -10.291501998901367, "global_step": 138024, "epoch": 821} {"train_loss": -10.420482635498047, "global_step": 138025, "epoch": 821} {"train_loss": -10.217384338378906, "global_step": 138026, "epoch": 821} {"train_loss": -9.975038528442383, "global_step": 138027, "epoch": 821} {"train_loss": -9.552526473999023, "global_step": 138028, "epoch": 821} {"train_loss": -10.22544002532959, "global_step": 138029, "epoch": 821} {"train_loss": -9.280935287475586, "global_step": 138030, "epoch": 821} {"train_loss": -10.604469299316406, "global_step": 138031, "epoch": 821} {"train_loss": -9.543035507202148, "global_step": 138032, "epoch": 821} {"train_loss": -10.095771789550781, "global_step": 138033, "epoch": 821} {"train_loss": -9.3849515914917, "global_step": 138034, "epoch": 821} {"train_loss": -10.275396347045898, "global_step": 138035, "epoch": 821} {"train_loss": -9.408869743347168, "global_step": 138036, "epoch": 821} {"train_loss": -10.3630952835083, "global_step": 138037, "epoch": 821} {"train_loss": -9.716645240783691, "global_step": 138038, "epoch": 821} {"train_loss": -9.75058650970459, "global_step": 138039, "epoch": 821} {"train_loss": -9.769460678100586, "global_step": 138040, "epoch": 821} {"train_loss": -9.842595100402832, "global_step": 138041, "epoch": 821} {"train_loss": -9.507074356079102, "global_step": 138042, "epoch": 821} {"train_loss": -10.10731029510498, "global_step": 138043, "epoch": 821} {"train_loss": -10.150482177734375, "global_step": 138044, "epoch": 821} {"train_loss": -10.22495174407959, "global_step": 138045, "epoch": 821} {"train_loss": -10.111963272094727, "global_step": 138046, "epoch": 821} {"train_loss": -9.934226989746094, "global_step": 138047, "epoch": 821} {"train_loss": -9.938140869140625, "global_step": 138048, "epoch": 821} {"train_loss": -9.722433090209961, "global_step": 138049, "epoch": 821} {"train_loss": -10.106256484985352, "global_step": 138050, "epoch": 821} {"train_loss": -9.806404113769531, "global_step": 138051, "epoch": 821} {"train_loss": -9.96088695526123, "global_step": 138052, "epoch": 821} {"train_loss": -10.221879959106445, "global_step": 138053, "epoch": 821} {"train_loss": -9.907833099365234, "global_step": 138054, "epoch": 821} {"train_loss": -9.967914581298828, "global_step": 138055, "epoch": 821} {"train_loss": -9.750619888305664, "global_step": 138056, "epoch": 821} {"train_loss": -10.241877555847168, "global_step": 138057, "epoch": 821} {"train_loss": -10.390074729919434, "global_step": 138058, "epoch": 821} {"train_loss": -9.884723663330078, "global_step": 138059, "epoch": 821} {"train_loss": -10.243322372436523, "global_step": 138060, "epoch": 821} {"train_loss": -10.338726997375488, "global_step": 138061, "epoch": 821} {"train_loss": -10.201708793640137, "global_step": 138062, "epoch": 821} {"train_loss": -10.194496154785156, "global_step": 138063, "epoch": 821} {"train_loss": -10.339229583740234, "global_step": 138064, "epoch": 821} {"train_loss": -10.401548385620117, "global_step": 138065, "epoch": 821} {"train_loss": -10.282602310180664, "global_step": 138066, "epoch": 821} {"train_loss": -10.182764053344727, "global_step": 138067, "epoch": 821} {"train_loss": -10.509684562683105, "global_step": 138068, "epoch": 821} {"train_loss": -10.515996932983398, "global_step": 138069, "epoch": 821} {"train_loss": -10.340950012207031, "global_step": 138070, "epoch": 821} {"train_loss": -10.548422813415527, "global_step": 138071, "epoch": 821} {"train_loss": -10.303260803222656, "global_step": 138072, "epoch": 821} {"train_loss": -10.733597755432129, "global_step": 138073, "epoch": 821} {"train_loss": -10.481197357177734, "global_step": 138074, "epoch": 821} {"train_loss": -10.52035140991211, "global_step": 138075, "epoch": 821} {"train_loss": -10.459716796875, "global_step": 138076, "epoch": 821} {"train_loss": -10.516890525817871, "global_step": 138077, "epoch": 821} {"train_loss": -10.557981491088867, "global_step": 138078, "epoch": 821} {"train_loss": -10.683380126953125, "global_step": 138079, "epoch": 821} {"train_loss": -10.684627532958984, "global_step": 138080, "epoch": 821} {"train_loss": -10.686519622802734, "global_step": 138081, "epoch": 821} {"train_loss": -10.5267915725708, "global_step": 138082, "epoch": 821} {"train_loss": -10.59483528137207, "global_step": 138083, "epoch": 821} {"train_loss": -10.36018180847168, "global_step": 138084, "epoch": 821} {"train_loss": -10.805096626281738, "global_step": 138085, "epoch": 821} {"train_loss": -10.630220413208008, "global_step": 138086, "epoch": 821} {"train_loss": -10.525849342346191, "global_step": 138087, "epoch": 821} {"train_loss": -10.721933364868164, "global_step": 138088, "epoch": 821} {"train_loss": -10.285524368286133, "global_step": 138089, "epoch": 821} {"train_loss": -10.42871379852295, "global_step": 138090, "epoch": 821} {"train_loss": -10.528074264526367, "global_step": 138091, "epoch": 821} {"train_loss": -10.350106239318848, "global_step": 138092, "epoch": 821} {"train_loss": -10.549619674682617, "global_step": 138093, "epoch": 821} {"train_loss": -10.17654037475586, "global_step": 138094, "epoch": 821} {"train_loss": -10.356598973274231, "global_step": 138095, "epoch": 821, "val_loss": 218921.75} {"train_loss": -10.504650115966797, "global_step": 138096, "epoch": 822} {"train_loss": -10.315792083740234, "global_step": 138097, "epoch": 822} {"train_loss": -10.507147789001465, "global_step": 138098, "epoch": 822} {"train_loss": -9.96338176727295, "global_step": 138099, "epoch": 822} {"train_loss": -10.7730073928833, "global_step": 138100, "epoch": 822} {"train_loss": -10.399467468261719, "global_step": 138101, "epoch": 822} {"train_loss": -10.393354415893555, "global_step": 138102, "epoch": 822} {"train_loss": -10.444401741027832, "global_step": 138103, "epoch": 822} {"train_loss": -10.519487380981445, "global_step": 138104, "epoch": 822} {"train_loss": -10.747446060180664, "global_step": 138105, "epoch": 822} {"train_loss": -10.398336410522461, "global_step": 138106, "epoch": 822} {"train_loss": -10.420797348022461, "global_step": 138107, "epoch": 822} {"train_loss": -10.698295593261719, "global_step": 138108, "epoch": 822} {"train_loss": -10.66836929321289, "global_step": 138109, "epoch": 822} {"train_loss": -10.400727272033691, "global_step": 138110, "epoch": 822} {"train_loss": -10.444547653198242, "global_step": 138111, "epoch": 822} {"train_loss": -10.565652847290039, "global_step": 138112, "epoch": 822} {"train_loss": -10.64771842956543, "global_step": 138113, "epoch": 822} {"train_loss": -10.698305130004883, "global_step": 138114, "epoch": 822} {"train_loss": -10.688804626464844, "global_step": 138115, "epoch": 822} {"train_loss": -10.448587417602539, "global_step": 138116, "epoch": 822} {"train_loss": -10.386255264282227, "global_step": 138117, "epoch": 822} {"train_loss": -10.643766403198242, "global_step": 138118, "epoch": 822} {"train_loss": -10.910754203796387, "global_step": 138119, "epoch": 822} {"train_loss": -10.750368118286133, "global_step": 138120, "epoch": 822} {"train_loss": -10.71468734741211, "global_step": 138121, "epoch": 822} {"train_loss": -10.707164764404297, "global_step": 138122, "epoch": 822} {"train_loss": -10.585968971252441, "global_step": 138123, "epoch": 822} {"train_loss": -10.597933769226074, "global_step": 138124, "epoch": 822} {"train_loss": -10.812469482421875, "global_step": 138125, "epoch": 822} {"train_loss": -10.521120071411133, "global_step": 138126, "epoch": 822} {"train_loss": -10.812320709228516, "global_step": 138127, "epoch": 822} {"train_loss": -10.505053520202637, "global_step": 138128, "epoch": 822} {"train_loss": -10.484445571899414, "global_step": 138129, "epoch": 822} {"train_loss": -10.889700889587402, "global_step": 138130, "epoch": 822} {"train_loss": -10.916912078857422, "global_step": 138131, "epoch": 822} {"train_loss": -10.834238052368164, "global_step": 138132, "epoch": 822} {"train_loss": -10.902898788452148, "global_step": 138133, "epoch": 822} {"train_loss": -10.690422058105469, "global_step": 138134, "epoch": 822} {"train_loss": -10.827292442321777, "global_step": 138135, "epoch": 822} {"train_loss": -10.804193496704102, "global_step": 138136, "epoch": 822} {"train_loss": -10.75152587890625, "global_step": 138137, "epoch": 822} {"train_loss": -11.01792049407959, "global_step": 138138, "epoch": 822} {"train_loss": -10.582756042480469, "global_step": 138139, "epoch": 822} {"train_loss": -10.457610130310059, "global_step": 138140, "epoch": 822} {"train_loss": -10.582802772521973, "global_step": 138141, "epoch": 822} {"train_loss": -10.548540115356445, "global_step": 138142, "epoch": 822} {"train_loss": -9.825981140136719, "global_step": 138143, "epoch": 822} {"train_loss": -10.746490478515625, "global_step": 138144, "epoch": 822} {"train_loss": -10.82400894165039, "global_step": 138145, "epoch": 822} {"train_loss": -10.449594497680664, "global_step": 138146, "epoch": 822} {"train_loss": -10.22755241394043, "global_step": 138147, "epoch": 822} {"train_loss": -10.745475769042969, "global_step": 138148, "epoch": 822} {"train_loss": -10.534340858459473, "global_step": 138149, "epoch": 822} {"train_loss": -10.459582328796387, "global_step": 138150, "epoch": 822} {"train_loss": -10.448575973510742, "global_step": 138151, "epoch": 822} {"train_loss": -10.615434646606445, "global_step": 138152, "epoch": 822} {"train_loss": -10.604799270629883, "global_step": 138153, "epoch": 822} {"train_loss": -10.395038604736328, "global_step": 138154, "epoch": 822} {"train_loss": -10.674234390258789, "global_step": 138155, "epoch": 822} {"train_loss": -10.714522361755371, "global_step": 138156, "epoch": 822} {"train_loss": -10.63711929321289, "global_step": 138157, "epoch": 822} {"train_loss": -10.530099868774414, "global_step": 138158, "epoch": 822} {"train_loss": -10.503913879394531, "global_step": 138159, "epoch": 822} {"train_loss": -10.646015167236328, "global_step": 138160, "epoch": 822} {"train_loss": -10.55923080444336, "global_step": 138161, "epoch": 822} {"train_loss": -10.686666488647461, "global_step": 138162, "epoch": 822} {"train_loss": -10.649709701538086, "global_step": 138163, "epoch": 822} {"train_loss": -10.727925300598145, "global_step": 138164, "epoch": 822} {"train_loss": -10.622432708740234, "global_step": 138165, "epoch": 822} {"train_loss": -10.731423377990723, "global_step": 138166, "epoch": 822} {"train_loss": -10.833829879760742, "global_step": 138167, "epoch": 822} {"train_loss": -10.668607711791992, "global_step": 138168, "epoch": 822} {"train_loss": -10.876875877380371, "global_step": 138169, "epoch": 822} {"train_loss": -10.767531394958496, "global_step": 138170, "epoch": 822} {"train_loss": -10.847089767456055, "global_step": 138171, "epoch": 822} {"train_loss": -10.739786148071289, "global_step": 138172, "epoch": 822} {"train_loss": -10.698226928710938, "global_step": 138173, "epoch": 822} {"train_loss": -10.576193809509277, "global_step": 138174, "epoch": 822} {"train_loss": -10.566204071044922, "global_step": 138175, "epoch": 822} {"train_loss": -10.639488220214844, "global_step": 138176, "epoch": 822} {"train_loss": -10.772968292236328, "global_step": 138177, "epoch": 822} {"train_loss": -10.600265502929688, "global_step": 138178, "epoch": 822} {"train_loss": -10.588099479675293, "global_step": 138179, "epoch": 822} {"train_loss": -10.458041191101074, "global_step": 138180, "epoch": 822} {"train_loss": -10.554296493530273, "global_step": 138181, "epoch": 822} {"train_loss": -10.462432861328125, "global_step": 138182, "epoch": 822} {"train_loss": -10.28287124633789, "global_step": 138183, "epoch": 822} {"train_loss": -9.466217041015625, "global_step": 138184, "epoch": 822} {"train_loss": -10.10335636138916, "global_step": 138185, "epoch": 822} {"train_loss": -9.738862991333008, "global_step": 138186, "epoch": 822} {"train_loss": -10.178353309631348, "global_step": 138187, "epoch": 822} {"train_loss": -9.897489547729492, "global_step": 138188, "epoch": 822} {"train_loss": -10.668697357177734, "global_step": 138189, "epoch": 822} {"train_loss": -10.530795097351074, "global_step": 138190, "epoch": 822} {"train_loss": -9.855924606323242, "global_step": 138191, "epoch": 822} {"train_loss": -10.529388427734375, "global_step": 138192, "epoch": 822} {"train_loss": -10.322274208068848, "global_step": 138193, "epoch": 822} {"train_loss": -10.763833999633789, "global_step": 138194, "epoch": 822} {"train_loss": -10.29834270477295, "global_step": 138195, "epoch": 822} {"train_loss": -10.460305213928223, "global_step": 138196, "epoch": 822} {"train_loss": -10.59521770477295, "global_step": 138197, "epoch": 822} {"train_loss": -10.52785873413086, "global_step": 138198, "epoch": 822} {"train_loss": -10.775814056396484, "global_step": 138199, "epoch": 822} {"train_loss": -10.028931617736816, "global_step": 138200, "epoch": 822} {"train_loss": -10.65359115600586, "global_step": 138201, "epoch": 822} {"train_loss": -10.48803997039795, "global_step": 138202, "epoch": 822} {"train_loss": -10.356582641601562, "global_step": 138203, "epoch": 822} {"train_loss": -10.528454780578613, "global_step": 138204, "epoch": 822} {"train_loss": -10.514730453491211, "global_step": 138205, "epoch": 822} {"train_loss": -10.209121704101562, "global_step": 138206, "epoch": 822} {"train_loss": -10.759378433227539, "global_step": 138207, "epoch": 822} {"train_loss": -10.420171737670898, "global_step": 138208, "epoch": 822} {"train_loss": -10.44599723815918, "global_step": 138209, "epoch": 822} {"train_loss": -10.155567169189453, "global_step": 138210, "epoch": 822} {"train_loss": -10.604515075683594, "global_step": 138211, "epoch": 822} {"train_loss": -10.59620189666748, "global_step": 138212, "epoch": 822} {"train_loss": -10.126190185546875, "global_step": 138213, "epoch": 822} {"train_loss": -10.52395248413086, "global_step": 138214, "epoch": 822} {"train_loss": -10.526629447937012, "global_step": 138215, "epoch": 822} {"train_loss": -10.614409446716309, "global_step": 138216, "epoch": 822} {"train_loss": -10.502820014953613, "global_step": 138217, "epoch": 822} {"train_loss": -10.236188888549805, "global_step": 138218, "epoch": 822} {"train_loss": -10.802906036376953, "global_step": 138219, "epoch": 822} {"train_loss": -10.456216812133789, "global_step": 138220, "epoch": 822} {"train_loss": -10.663839340209961, "global_step": 138221, "epoch": 822} {"train_loss": -10.491185188293457, "global_step": 138222, "epoch": 822} {"train_loss": -10.839071273803711, "global_step": 138223, "epoch": 822} {"train_loss": -10.53226089477539, "global_step": 138224, "epoch": 822} {"train_loss": -10.768203735351562, "global_step": 138225, "epoch": 822} {"train_loss": -10.454298973083496, "global_step": 138226, "epoch": 822} {"train_loss": -10.65213680267334, "global_step": 138227, "epoch": 822} {"train_loss": -10.633031845092773, "global_step": 138228, "epoch": 822} {"train_loss": -10.79207706451416, "global_step": 138229, "epoch": 822} {"train_loss": -10.665933609008789, "global_step": 138230, "epoch": 822} {"train_loss": -10.691132545471191, "global_step": 138231, "epoch": 822} {"train_loss": -10.696893692016602, "global_step": 138232, "epoch": 822} {"train_loss": -10.850763320922852, "global_step": 138233, "epoch": 822} {"train_loss": -10.75230884552002, "global_step": 138234, "epoch": 822} {"train_loss": -10.532999038696289, "global_step": 138235, "epoch": 822} {"train_loss": -10.71464729309082, "global_step": 138236, "epoch": 822} {"train_loss": -10.485018730163574, "global_step": 138237, "epoch": 822} {"train_loss": -10.462825775146484, "global_step": 138238, "epoch": 822} {"train_loss": -10.195411682128906, "global_step": 138239, "epoch": 822} {"train_loss": -10.629131317138672, "global_step": 138240, "epoch": 822} {"train_loss": -10.696261405944824, "global_step": 138241, "epoch": 822} {"train_loss": -10.683452606201172, "global_step": 138242, "epoch": 822} {"train_loss": -10.816361427307129, "global_step": 138243, "epoch": 822} {"train_loss": -10.5690336227417, "global_step": 138244, "epoch": 822} {"train_loss": -10.53155517578125, "global_step": 138245, "epoch": 822} {"train_loss": -10.906051635742188, "global_step": 138246, "epoch": 822} {"train_loss": -10.575675010681152, "global_step": 138247, "epoch": 822} {"train_loss": -10.766144752502441, "global_step": 138248, "epoch": 822} {"train_loss": -10.483205795288086, "global_step": 138249, "epoch": 822} {"train_loss": -10.769916534423828, "global_step": 138250, "epoch": 822} {"train_loss": -10.587719917297363, "global_step": 138251, "epoch": 822} {"train_loss": -10.601829528808594, "global_step": 138252, "epoch": 822} {"train_loss": -10.43155574798584, "global_step": 138253, "epoch": 822} {"train_loss": -10.62273120880127, "global_step": 138254, "epoch": 822} {"train_loss": -10.477798461914062, "global_step": 138255, "epoch": 822} {"train_loss": -10.587575912475586, "global_step": 138256, "epoch": 822} {"train_loss": -10.692548751831055, "global_step": 138257, "epoch": 822} {"train_loss": -10.779937744140625, "global_step": 138258, "epoch": 822} {"train_loss": -10.636861801147461, "global_step": 138259, "epoch": 822} {"train_loss": -10.566167831420898, "global_step": 138260, "epoch": 822} {"train_loss": -10.587031364440918, "global_step": 138261, "epoch": 822} {"train_loss": -10.461607933044434, "global_step": 138262, "epoch": 822} {"train_loss": -10.561735862777347, "global_step": 138263, "epoch": 822, "val_loss": 223374.21875} {"train_loss": -10.195634841918945, "global_step": 138264, "epoch": 823} {"train_loss": -10.92056655883789, "global_step": 138265, "epoch": 823} {"train_loss": -10.350288391113281, "global_step": 138266, "epoch": 823} {"train_loss": -10.88811206817627, "global_step": 138267, "epoch": 823} {"train_loss": -10.636918067932129, "global_step": 138268, "epoch": 823} {"train_loss": -10.490158081054688, "global_step": 138269, "epoch": 823} {"train_loss": -10.421693801879883, "global_step": 138270, "epoch": 823} {"train_loss": -10.554891586303711, "global_step": 138271, "epoch": 823} {"train_loss": -10.398386001586914, "global_step": 138272, "epoch": 823} {"train_loss": -10.68199634552002, "global_step": 138273, "epoch": 823} {"train_loss": -10.463781356811523, "global_step": 138274, "epoch": 823} {"train_loss": -10.293123245239258, "global_step": 138275, "epoch": 823} {"train_loss": -10.46561050415039, "global_step": 138276, "epoch": 823} {"train_loss": -9.482147216796875, "global_step": 138277, "epoch": 823} {"train_loss": -10.087116241455078, "global_step": 138278, "epoch": 823} {"train_loss": -10.28495979309082, "global_step": 138279, "epoch": 823} {"train_loss": -10.296499252319336, "global_step": 138280, "epoch": 823} {"train_loss": -10.568370819091797, "global_step": 138281, "epoch": 823} {"train_loss": -10.371868133544922, "global_step": 138282, "epoch": 823} {"train_loss": -10.610407829284668, "global_step": 138283, "epoch": 823} {"train_loss": -10.593452453613281, "global_step": 138284, "epoch": 823} {"train_loss": -10.514020919799805, "global_step": 138285, "epoch": 823} {"train_loss": -10.558454513549805, "global_step": 138286, "epoch": 823} {"train_loss": -10.561168670654297, "global_step": 138287, "epoch": 823} {"train_loss": -10.625834465026855, "global_step": 138288, "epoch": 823} {"train_loss": -10.860652923583984, "global_step": 138289, "epoch": 823} {"train_loss": -10.697977066040039, "global_step": 138290, "epoch": 823} {"train_loss": -10.585278511047363, "global_step": 138291, "epoch": 823} {"train_loss": -10.463125228881836, "global_step": 138292, "epoch": 823} {"train_loss": -10.528299331665039, "global_step": 138293, "epoch": 823} {"train_loss": -10.542572021484375, "global_step": 138294, "epoch": 823} {"train_loss": -10.46555233001709, "global_step": 138295, "epoch": 823} {"train_loss": -10.656705856323242, "global_step": 138296, "epoch": 823} {"train_loss": -10.492362976074219, "global_step": 138297, "epoch": 823} {"train_loss": -10.99483871459961, "global_step": 138298, "epoch": 823} {"train_loss": -10.894414901733398, "global_step": 138299, "epoch": 823} {"train_loss": -10.42585563659668, "global_step": 138300, "epoch": 823} {"train_loss": -10.738791465759277, "global_step": 138301, "epoch": 823} {"train_loss": -10.730988502502441, "global_step": 138302, "epoch": 823} {"train_loss": -10.677507400512695, "global_step": 138303, "epoch": 823} {"train_loss": -10.717362403869629, "global_step": 138304, "epoch": 823} {"train_loss": -10.5426664352417, "global_step": 138305, "epoch": 823} {"train_loss": -10.433379173278809, "global_step": 138306, "epoch": 823} {"train_loss": -10.757036209106445, "global_step": 138307, "epoch": 823} {"train_loss": -10.951299667358398, "global_step": 138308, "epoch": 823} {"train_loss": -10.653676986694336, "global_step": 138309, "epoch": 823} {"train_loss": -10.568737983703613, "global_step": 138310, "epoch": 823} {"train_loss": -10.948817253112793, "global_step": 138311, "epoch": 823} {"train_loss": -10.595333099365234, "global_step": 138312, "epoch": 823} {"train_loss": -10.929193496704102, "global_step": 138313, "epoch": 823} {"train_loss": -10.533990859985352, "global_step": 138314, "epoch": 823} {"train_loss": -10.500898361206055, "global_step": 138315, "epoch": 823} {"train_loss": -10.73468017578125, "global_step": 138316, "epoch": 823} {"train_loss": -10.585824012756348, "global_step": 138317, "epoch": 823} {"train_loss": -10.634193420410156, "global_step": 138318, "epoch": 823} {"train_loss": -10.800333023071289, "global_step": 138319, "epoch": 823} {"train_loss": -10.565332412719727, "global_step": 138320, "epoch": 823} {"train_loss": -10.679163932800293, "global_step": 138321, "epoch": 823} {"train_loss": -10.228240966796875, "global_step": 138322, "epoch": 823} {"train_loss": -10.605890274047852, "global_step": 138323, "epoch": 823} {"train_loss": -10.275275230407715, "global_step": 138324, "epoch": 823} {"train_loss": -10.721273422241211, "global_step": 138325, "epoch": 823} {"train_loss": -10.428149223327637, "global_step": 138326, "epoch": 823} {"train_loss": -10.53687858581543, "global_step": 138327, "epoch": 823} {"train_loss": -10.601470947265625, "global_step": 138328, "epoch": 823} {"train_loss": -10.591530799865723, "global_step": 138329, "epoch": 823} {"train_loss": -10.914125442504883, "global_step": 138330, "epoch": 823} {"train_loss": -10.781789779663086, "global_step": 138331, "epoch": 823} {"train_loss": -10.567533493041992, "global_step": 138332, "epoch": 823} {"train_loss": -10.474254608154297, "global_step": 138333, "epoch": 823} {"train_loss": -10.53023624420166, "global_step": 138334, "epoch": 823} {"train_loss": -10.580734252929688, "global_step": 138335, "epoch": 823} {"train_loss": -10.585603713989258, "global_step": 138336, "epoch": 823} {"train_loss": -10.074514389038086, "global_step": 138337, "epoch": 823} {"train_loss": -9.972396850585938, "global_step": 138338, "epoch": 823} {"train_loss": -10.676650047302246, "global_step": 138339, "epoch": 823} {"train_loss": -9.956022262573242, "global_step": 138340, "epoch": 823} {"train_loss": -10.44686508178711, "global_step": 138341, "epoch": 823} {"train_loss": -10.423891067504883, "global_step": 138342, "epoch": 823} {"train_loss": -10.210393905639648, "global_step": 138343, "epoch": 823} {"train_loss": -10.312705993652344, "global_step": 138344, "epoch": 823} {"train_loss": -10.132087707519531, "global_step": 138345, "epoch": 823} {"train_loss": -10.487055778503418, "global_step": 138346, "epoch": 823} {"train_loss": -10.130412101745605, "global_step": 138347, "epoch": 823} {"train_loss": -10.437114715576172, "global_step": 138348, "epoch": 823} {"train_loss": -9.816793441772461, "global_step": 138349, "epoch": 823} {"train_loss": -9.914265632629395, "global_step": 138350, "epoch": 823} {"train_loss": -9.693487167358398, "global_step": 138351, "epoch": 823} {"train_loss": -9.868865966796875, "global_step": 138352, "epoch": 823} {"train_loss": -9.991800308227539, "global_step": 138353, "epoch": 823} {"train_loss": -9.71743106842041, "global_step": 138354, "epoch": 823} {"train_loss": -10.41540813446045, "global_step": 138355, "epoch": 823} {"train_loss": -9.443428039550781, "global_step": 138356, "epoch": 823} {"train_loss": -10.194378852844238, "global_step": 138357, "epoch": 823} {"train_loss": -9.772760391235352, "global_step": 138358, "epoch": 823} {"train_loss": -10.2783203125, "global_step": 138359, "epoch": 823} {"train_loss": -10.00886344909668, "global_step": 138360, "epoch": 823} {"train_loss": -10.196866035461426, "global_step": 138361, "epoch": 823} {"train_loss": -10.236278533935547, "global_step": 138362, "epoch": 823} {"train_loss": -10.269166946411133, "global_step": 138363, "epoch": 823} {"train_loss": -10.157112121582031, "global_step": 138364, "epoch": 823} {"train_loss": -10.488483428955078, "global_step": 138365, "epoch": 823} {"train_loss": -10.447946548461914, "global_step": 138366, "epoch": 823} {"train_loss": -10.174519538879395, "global_step": 138367, "epoch": 823} {"train_loss": -10.2139253616333, "global_step": 138368, "epoch": 823} {"train_loss": -10.354854583740234, "global_step": 138369, "epoch": 823} {"train_loss": -10.58755111694336, "global_step": 138370, "epoch": 823} {"train_loss": -10.479503631591797, "global_step": 138371, "epoch": 823} {"train_loss": -10.156957626342773, "global_step": 138372, "epoch": 823} {"train_loss": -10.602222442626953, "global_step": 138373, "epoch": 823} {"train_loss": -10.556674003601074, "global_step": 138374, "epoch": 823} {"train_loss": -10.291526794433594, "global_step": 138375, "epoch": 823} {"train_loss": -10.681909561157227, "global_step": 138376, "epoch": 823} {"train_loss": -10.228483200073242, "global_step": 138377, "epoch": 823} {"train_loss": -10.537546157836914, "global_step": 138378, "epoch": 823} {"train_loss": -10.647295951843262, "global_step": 138379, "epoch": 823} {"train_loss": -10.332721710205078, "global_step": 138380, "epoch": 823} {"train_loss": -10.684778213500977, "global_step": 138381, "epoch": 823} {"train_loss": -10.466873168945312, "global_step": 138382, "epoch": 823} {"train_loss": -10.554149627685547, "global_step": 138383, "epoch": 823} {"train_loss": -10.604724884033203, "global_step": 138384, "epoch": 823} {"train_loss": -10.669405937194824, "global_step": 138385, "epoch": 823} {"train_loss": -10.757034301757812, "global_step": 138386, "epoch": 823} {"train_loss": -10.530420303344727, "global_step": 138387, "epoch": 823} {"train_loss": -10.718629837036133, "global_step": 138388, "epoch": 823} {"train_loss": -10.801227569580078, "global_step": 138389, "epoch": 823} {"train_loss": -10.736096382141113, "global_step": 138390, "epoch": 823} {"train_loss": -10.899027824401855, "global_step": 138391, "epoch": 823} {"train_loss": -10.818233489990234, "global_step": 138392, "epoch": 823} {"train_loss": -10.56037712097168, "global_step": 138393, "epoch": 823} {"train_loss": -10.386804580688477, "global_step": 138394, "epoch": 823} {"train_loss": -10.67304515838623, "global_step": 138395, "epoch": 823} {"train_loss": -9.831382751464844, "global_step": 138396, "epoch": 823} {"train_loss": -10.668007850646973, "global_step": 138397, "epoch": 823} {"train_loss": -10.44670295715332, "global_step": 138398, "epoch": 823} {"train_loss": -10.786032676696777, "global_step": 138399, "epoch": 823} {"train_loss": -10.307570457458496, "global_step": 138400, "epoch": 823} {"train_loss": -10.504526138305664, "global_step": 138401, "epoch": 823} {"train_loss": -10.482063293457031, "global_step": 138402, "epoch": 823} {"train_loss": -9.295350074768066, "global_step": 138403, "epoch": 823} {"train_loss": -10.650904655456543, "global_step": 138404, "epoch": 823} {"train_loss": -8.655704498291016, "global_step": 138405, "epoch": 823} {"train_loss": -10.249177932739258, "global_step": 138406, "epoch": 823} {"train_loss": -9.531440734863281, "global_step": 138407, "epoch": 823} {"train_loss": -9.335205078125, "global_step": 138408, "epoch": 823} {"train_loss": -9.52345085144043, "global_step": 138409, "epoch": 823} {"train_loss": -9.892589569091797, "global_step": 138410, "epoch": 823} {"train_loss": -9.468048095703125, "global_step": 138411, "epoch": 823} {"train_loss": -10.329364776611328, "global_step": 138412, "epoch": 823} {"train_loss": -9.984176635742188, "global_step": 138413, "epoch": 823} {"train_loss": -10.315999984741211, "global_step": 138414, "epoch": 823} {"train_loss": -10.315868377685547, "global_step": 138415, "epoch": 823} {"train_loss": -10.394817352294922, "global_step": 138416, "epoch": 823} {"train_loss": -10.119364738464355, "global_step": 138417, "epoch": 823} {"train_loss": -10.386358261108398, "global_step": 138418, "epoch": 823} {"train_loss": -10.305855751037598, "global_step": 138419, "epoch": 823} {"train_loss": -10.189638137817383, "global_step": 138420, "epoch": 823} {"train_loss": -10.242907524108887, "global_step": 138421, "epoch": 823} {"train_loss": -10.43448257446289, "global_step": 138422, "epoch": 823} {"train_loss": -10.343443870544434, "global_step": 138423, "epoch": 823} {"train_loss": -10.223920822143555, "global_step": 138424, "epoch": 823} {"train_loss": -10.54125690460205, "global_step": 138425, "epoch": 823} {"train_loss": -10.360239028930664, "global_step": 138426, "epoch": 823} {"train_loss": -10.608572006225586, "global_step": 138427, "epoch": 823} {"train_loss": -10.40548038482666, "global_step": 138428, "epoch": 823} {"train_loss": -10.457040786743164, "global_step": 138429, "epoch": 823} {"train_loss": -10.142145156860352, "global_step": 138430, "epoch": 823} {"train_loss": -10.403879551660447, "global_step": 138431, "epoch": 823, "val_loss": 225656.296875} {"train_loss": -10.289019584655762, "global_step": 138432, "epoch": 824} {"train_loss": -10.402212142944336, "global_step": 138433, "epoch": 824} {"train_loss": -10.308021545410156, "global_step": 138434, "epoch": 824} {"train_loss": -10.353699684143066, "global_step": 138435, "epoch": 824} {"train_loss": -10.510841369628906, "global_step": 138436, "epoch": 824} {"train_loss": -10.58041763305664, "global_step": 138437, "epoch": 824} {"train_loss": -10.51032543182373, "global_step": 138438, "epoch": 824} {"train_loss": -10.409870147705078, "global_step": 138439, "epoch": 824} {"train_loss": -10.571495056152344, "global_step": 138440, "epoch": 824} {"train_loss": -10.454741477966309, "global_step": 138441, "epoch": 824} {"train_loss": -10.586445808410645, "global_step": 138442, "epoch": 824} {"train_loss": -10.631174087524414, "global_step": 138443, "epoch": 824} {"train_loss": -10.913777351379395, "global_step": 138444, "epoch": 824} {"train_loss": -10.597579002380371, "global_step": 138445, "epoch": 824} {"train_loss": -10.5751953125, "global_step": 138446, "epoch": 824} {"train_loss": -10.830107688903809, "global_step": 138447, "epoch": 824} {"train_loss": -10.697084426879883, "global_step": 138448, "epoch": 824} {"train_loss": -10.70843505859375, "global_step": 138449, "epoch": 824} {"train_loss": -10.40256118774414, "global_step": 138450, "epoch": 824} {"train_loss": -10.634148597717285, "global_step": 138451, "epoch": 824} {"train_loss": -10.765365600585938, "global_step": 138452, "epoch": 824} {"train_loss": -10.78142261505127, "global_step": 138453, "epoch": 824} {"train_loss": -10.455684661865234, "global_step": 138454, "epoch": 824} {"train_loss": -10.789793014526367, "global_step": 138455, "epoch": 824} {"train_loss": -10.678823471069336, "global_step": 138456, "epoch": 824} {"train_loss": -10.567296981811523, "global_step": 138457, "epoch": 824} {"train_loss": -10.840812683105469, "global_step": 138458, "epoch": 824} {"train_loss": -10.621118545532227, "global_step": 138459, "epoch": 824} {"train_loss": -10.754348754882812, "global_step": 138460, "epoch": 824} {"train_loss": -10.68207836151123, "global_step": 138461, "epoch": 824} {"train_loss": -10.612615585327148, "global_step": 138462, "epoch": 824} {"train_loss": -10.549558639526367, "global_step": 138463, "epoch": 824} {"train_loss": -10.53349494934082, "global_step": 138464, "epoch": 824} {"train_loss": -10.882196426391602, "global_step": 138465, "epoch": 824} {"train_loss": -10.863066673278809, "global_step": 138466, "epoch": 824} {"train_loss": -10.533425331115723, "global_step": 138467, "epoch": 824} {"train_loss": -10.75182819366455, "global_step": 138468, "epoch": 824} {"train_loss": -10.765266418457031, "global_step": 138469, "epoch": 824} {"train_loss": -10.50387954711914, "global_step": 138470, "epoch": 824} {"train_loss": -10.926534652709961, "global_step": 138471, "epoch": 824} {"train_loss": -10.611173629760742, "global_step": 138472, "epoch": 824} {"train_loss": -10.734637260437012, "global_step": 138473, "epoch": 824} {"train_loss": -10.94684886932373, "global_step": 138474, "epoch": 824} {"train_loss": -10.556235313415527, "global_step": 138475, "epoch": 824} {"train_loss": -10.34794807434082, "global_step": 138476, "epoch": 824} {"train_loss": -10.986117362976074, "global_step": 138477, "epoch": 824} {"train_loss": -10.502981185913086, "global_step": 138478, "epoch": 824} {"train_loss": -10.483236312866211, "global_step": 138479, "epoch": 824} {"train_loss": -10.846665382385254, "global_step": 138480, "epoch": 824} {"train_loss": -10.262823104858398, "global_step": 138481, "epoch": 824} {"train_loss": -10.486940383911133, "global_step": 138482, "epoch": 824} {"train_loss": -10.41069221496582, "global_step": 138483, "epoch": 824} {"train_loss": -10.515777587890625, "global_step": 138484, "epoch": 824} {"train_loss": -10.56951904296875, "global_step": 138485, "epoch": 824} {"train_loss": -10.408246994018555, "global_step": 138486, "epoch": 824} {"train_loss": -10.441377639770508, "global_step": 138487, "epoch": 824} {"train_loss": -10.75316047668457, "global_step": 138488, "epoch": 824} {"train_loss": -10.5755033493042, "global_step": 138489, "epoch": 824} {"train_loss": -10.665912628173828, "global_step": 138490, "epoch": 824} {"train_loss": -10.675050735473633, "global_step": 138491, "epoch": 824} {"train_loss": -10.334403038024902, "global_step": 138492, "epoch": 824} {"train_loss": -10.849525451660156, "global_step": 138493, "epoch": 824} {"train_loss": -10.598365783691406, "global_step": 138494, "epoch": 824} {"train_loss": -10.196413040161133, "global_step": 138495, "epoch": 824} {"train_loss": -10.381210327148438, "global_step": 138496, "epoch": 824} {"train_loss": -10.481492042541504, "global_step": 138497, "epoch": 824} {"train_loss": -10.822312355041504, "global_step": 138498, "epoch": 824} {"train_loss": -10.577770233154297, "global_step": 138499, "epoch": 824} {"train_loss": -10.79508113861084, "global_step": 138500, "epoch": 824} {"train_loss": -10.693471908569336, "global_step": 138501, "epoch": 824} {"train_loss": -10.616228103637695, "global_step": 138502, "epoch": 824} {"train_loss": -10.814042091369629, "global_step": 138503, "epoch": 824} {"train_loss": -10.424257278442383, "global_step": 138504, "epoch": 824} {"train_loss": -10.35450553894043, "global_step": 138505, "epoch": 824} {"train_loss": -10.797233581542969, "global_step": 138506, "epoch": 824} {"train_loss": -10.365169525146484, "global_step": 138507, "epoch": 824} {"train_loss": -10.634838104248047, "global_step": 138508, "epoch": 824} {"train_loss": -10.499967575073242, "global_step": 138509, "epoch": 824} {"train_loss": -10.220863342285156, "global_step": 138510, "epoch": 824} {"train_loss": -10.569379806518555, "global_step": 138511, "epoch": 824} {"train_loss": -10.543493270874023, "global_step": 138512, "epoch": 824} {"train_loss": -10.497478485107422, "global_step": 138513, "epoch": 824} {"train_loss": -10.233366012573242, "global_step": 138514, "epoch": 824} {"train_loss": -10.473026275634766, "global_step": 138515, "epoch": 824} {"train_loss": -10.360901832580566, "global_step": 138516, "epoch": 824} {"train_loss": -10.511517524719238, "global_step": 138517, "epoch": 824} {"train_loss": -10.346671104431152, "global_step": 138518, "epoch": 824} {"train_loss": -10.544148445129395, "global_step": 138519, "epoch": 824} {"train_loss": -10.288995742797852, "global_step": 138520, "epoch": 824} {"train_loss": -10.757124900817871, "global_step": 138521, "epoch": 824} {"train_loss": -10.299247741699219, "global_step": 138522, "epoch": 824} {"train_loss": -10.611186981201172, "global_step": 138523, "epoch": 824} {"train_loss": -9.68146800994873, "global_step": 138524, "epoch": 824} {"train_loss": -10.290367126464844, "global_step": 138525, "epoch": 824} {"train_loss": -9.461462020874023, "global_step": 138526, "epoch": 824} {"train_loss": -10.20747184753418, "global_step": 138527, "epoch": 824} {"train_loss": -9.85438346862793, "global_step": 138528, "epoch": 824} {"train_loss": -10.308874130249023, "global_step": 138529, "epoch": 824} {"train_loss": -10.067438125610352, "global_step": 138530, "epoch": 824} {"train_loss": -10.392450332641602, "global_step": 138531, "epoch": 824} {"train_loss": -10.393095970153809, "global_step": 138532, "epoch": 824} {"train_loss": -10.350996017456055, "global_step": 138533, "epoch": 824} {"train_loss": -10.515849113464355, "global_step": 138534, "epoch": 824} {"train_loss": -10.40102481842041, "global_step": 138535, "epoch": 824} {"train_loss": -10.516088485717773, "global_step": 138536, "epoch": 824} {"train_loss": -10.470962524414062, "global_step": 138537, "epoch": 824} {"train_loss": -10.39246940612793, "global_step": 138538, "epoch": 824} {"train_loss": -10.535035133361816, "global_step": 138539, "epoch": 824} {"train_loss": -10.384014129638672, "global_step": 138540, "epoch": 824} {"train_loss": -10.529075622558594, "global_step": 138541, "epoch": 824} {"train_loss": -10.573054313659668, "global_step": 138542, "epoch": 824} {"train_loss": -10.721315383911133, "global_step": 138543, "epoch": 824} {"train_loss": -10.495370864868164, "global_step": 138544, "epoch": 824} {"train_loss": -10.335845947265625, "global_step": 138545, "epoch": 824} {"train_loss": -10.782369613647461, "global_step": 138546, "epoch": 824} {"train_loss": -10.378021240234375, "global_step": 138547, "epoch": 824} {"train_loss": -10.814689636230469, "global_step": 138548, "epoch": 824} {"train_loss": -10.547178268432617, "global_step": 138549, "epoch": 824} {"train_loss": -10.531352996826172, "global_step": 138550, "epoch": 824} {"train_loss": -10.682994842529297, "global_step": 138551, "epoch": 824} {"train_loss": -10.160325050354004, "global_step": 138552, "epoch": 824} {"train_loss": -10.718331336975098, "global_step": 138553, "epoch": 824} {"train_loss": -10.362262725830078, "global_step": 138554, "epoch": 824} {"train_loss": -10.530206680297852, "global_step": 138555, "epoch": 824} {"train_loss": -10.485772132873535, "global_step": 138556, "epoch": 824} {"train_loss": -10.434277534484863, "global_step": 138557, "epoch": 824} {"train_loss": -10.676002502441406, "global_step": 138558, "epoch": 824} {"train_loss": -10.62993049621582, "global_step": 138559, "epoch": 824} {"train_loss": -10.609262466430664, "global_step": 138560, "epoch": 824} {"train_loss": -10.801895141601562, "global_step": 138561, "epoch": 824} {"train_loss": -10.601775169372559, "global_step": 138562, "epoch": 824} {"train_loss": -10.568437576293945, "global_step": 138563, "epoch": 824} {"train_loss": -10.440160751342773, "global_step": 138564, "epoch": 824} {"train_loss": -10.474079132080078, "global_step": 138565, "epoch": 824} {"train_loss": -10.776567459106445, "global_step": 138566, "epoch": 824} {"train_loss": -10.688852310180664, "global_step": 138567, "epoch": 824} {"train_loss": -10.638627052307129, "global_step": 138568, "epoch": 824} {"train_loss": -10.739105224609375, "global_step": 138569, "epoch": 824} {"train_loss": -10.471517562866211, "global_step": 138570, "epoch": 824} {"train_loss": -10.389359474182129, "global_step": 138571, "epoch": 824} {"train_loss": -10.40123176574707, "global_step": 138572, "epoch": 824} {"train_loss": -10.378223419189453, "global_step": 138573, "epoch": 824} {"train_loss": -10.176971435546875, "global_step": 138574, "epoch": 824} {"train_loss": -10.058577537536621, "global_step": 138575, "epoch": 824} {"train_loss": -9.89655876159668, "global_step": 138576, "epoch": 824} {"train_loss": -10.534561157226562, "global_step": 138577, "epoch": 824} {"train_loss": -10.237010955810547, "global_step": 138578, "epoch": 824} {"train_loss": -10.148712158203125, "global_step": 138579, "epoch": 824} {"train_loss": -10.09908390045166, "global_step": 138580, "epoch": 824} {"train_loss": -10.296936988830566, "global_step": 138581, "epoch": 824} {"train_loss": -10.400247573852539, "global_step": 138582, "epoch": 824} {"train_loss": -9.507160186767578, "global_step": 138583, "epoch": 824} {"train_loss": -10.65259075164795, "global_step": 138584, "epoch": 824} {"train_loss": -10.063936233520508, "global_step": 138585, "epoch": 824} {"train_loss": -10.65400505065918, "global_step": 138586, "epoch": 824} {"train_loss": -10.089635848999023, "global_step": 138587, "epoch": 824} {"train_loss": -10.718592643737793, "global_step": 138588, "epoch": 824} {"train_loss": -10.168163299560547, "global_step": 138589, "epoch": 824} {"train_loss": -10.20206356048584, "global_step": 138590, "epoch": 824} {"train_loss": -10.25182056427002, "global_step": 138591, "epoch": 824} {"train_loss": -10.400941848754883, "global_step": 138592, "epoch": 824} {"train_loss": -10.362310409545898, "global_step": 138593, "epoch": 824} {"train_loss": -10.159065246582031, "global_step": 138594, "epoch": 824} {"train_loss": -10.390302658081055, "global_step": 138595, "epoch": 824} {"train_loss": -10.28630542755127, "global_step": 138596, "epoch": 824} {"train_loss": -10.586912155151367, "global_step": 138597, "epoch": 824} {"train_loss": -10.329130172729492, "global_step": 138598, "epoch": 824} {"train_loss": -10.49331797872271, "global_step": 138599, "epoch": 824, "val_loss": 226022.75} {"train_loss": -10.417587280273438, "global_step": 138600, "epoch": 825} {"train_loss": -10.485559463500977, "global_step": 138601, "epoch": 825} {"train_loss": -10.350695610046387, "global_step": 138602, "epoch": 825} {"train_loss": -10.752799034118652, "global_step": 138603, "epoch": 825} {"train_loss": -10.58704948425293, "global_step": 138604, "epoch": 825} {"train_loss": -10.72800064086914, "global_step": 138605, "epoch": 825} {"train_loss": -10.614405632019043, "global_step": 138606, "epoch": 825} {"train_loss": -10.729111671447754, "global_step": 138607, "epoch": 825} {"train_loss": -10.534648895263672, "global_step": 138608, "epoch": 825} {"train_loss": -10.481222152709961, "global_step": 138609, "epoch": 825} {"train_loss": -10.5909423828125, "global_step": 138610, "epoch": 825} {"train_loss": -10.474390029907227, "global_step": 138611, "epoch": 825} {"train_loss": -10.574860572814941, "global_step": 138612, "epoch": 825} {"train_loss": -10.739388465881348, "global_step": 138613, "epoch": 825} {"train_loss": -10.840517044067383, "global_step": 138614, "epoch": 825} {"train_loss": -10.594409942626953, "global_step": 138615, "epoch": 825} {"train_loss": -10.928211212158203, "global_step": 138616, "epoch": 825} {"train_loss": -10.725052833557129, "global_step": 138617, "epoch": 825} {"train_loss": -10.678573608398438, "global_step": 138618, "epoch": 825} {"train_loss": -10.881560325622559, "global_step": 138619, "epoch": 825} {"train_loss": -10.771677017211914, "global_step": 138620, "epoch": 825} {"train_loss": -10.757811546325684, "global_step": 138621, "epoch": 825} {"train_loss": -10.597199440002441, "global_step": 138622, "epoch": 825} {"train_loss": -10.453445434570312, "global_step": 138623, "epoch": 825} {"train_loss": -10.680665969848633, "global_step": 138624, "epoch": 825} {"train_loss": -10.894872665405273, "global_step": 138625, "epoch": 825} {"train_loss": -10.947711944580078, "global_step": 138626, "epoch": 825} {"train_loss": -10.872674942016602, "global_step": 138627, "epoch": 825} {"train_loss": -10.864358901977539, "global_step": 138628, "epoch": 825} {"train_loss": -11.071487426757812, "global_step": 138629, "epoch": 825} {"train_loss": -10.627750396728516, "global_step": 138630, "epoch": 825} {"train_loss": -10.848052978515625, "global_step": 138631, "epoch": 825} {"train_loss": -10.782623291015625, "global_step": 138632, "epoch": 825} {"train_loss": -10.903121948242188, "global_step": 138633, "epoch": 825} {"train_loss": -11.002120971679688, "global_step": 138634, "epoch": 825} {"train_loss": -10.990574836730957, "global_step": 138635, "epoch": 825} {"train_loss": -10.51909065246582, "global_step": 138636, "epoch": 825} {"train_loss": -10.644360542297363, "global_step": 138637, "epoch": 825} {"train_loss": -10.829204559326172, "global_step": 138638, "epoch": 825} {"train_loss": -10.341849327087402, "global_step": 138639, "epoch": 825} {"train_loss": -9.878421783447266, "global_step": 138640, "epoch": 825} {"train_loss": -10.796045303344727, "global_step": 138641, "epoch": 825} {"train_loss": -10.426791191101074, "global_step": 138642, "epoch": 825} {"train_loss": -10.558358192443848, "global_step": 138643, "epoch": 825} {"train_loss": -10.412252426147461, "global_step": 138644, "epoch": 825} {"train_loss": -10.328692436218262, "global_step": 138645, "epoch": 825} {"train_loss": -10.075663566589355, "global_step": 138646, "epoch": 825} {"train_loss": -10.330155372619629, "global_step": 138647, "epoch": 825} {"train_loss": -9.523340225219727, "global_step": 138648, "epoch": 825} {"train_loss": -9.336396217346191, "global_step": 138649, "epoch": 825} {"train_loss": -10.51327133178711, "global_step": 138650, "epoch": 825} {"train_loss": -9.34195613861084, "global_step": 138651, "epoch": 825} {"train_loss": -9.59109878540039, "global_step": 138652, "epoch": 825} {"train_loss": -10.077287673950195, "global_step": 138653, "epoch": 825} {"train_loss": -9.925607681274414, "global_step": 138654, "epoch": 825} {"train_loss": -9.76051139831543, "global_step": 138655, "epoch": 825} {"train_loss": -10.11937141418457, "global_step": 138656, "epoch": 825} {"train_loss": -9.605960845947266, "global_step": 138657, "epoch": 825} {"train_loss": -10.345909118652344, "global_step": 138658, "epoch": 825} {"train_loss": -9.789011001586914, "global_step": 138659, "epoch": 825} {"train_loss": -9.92251205444336, "global_step": 138660, "epoch": 825} {"train_loss": -10.278139114379883, "global_step": 138661, "epoch": 825} {"train_loss": -10.170703887939453, "global_step": 138662, "epoch": 825} {"train_loss": -10.109830856323242, "global_step": 138663, "epoch": 825} {"train_loss": -10.168848991394043, "global_step": 138664, "epoch": 825} {"train_loss": -9.832168579101562, "global_step": 138665, "epoch": 825} {"train_loss": -10.409293174743652, "global_step": 138666, "epoch": 825} {"train_loss": -10.172283172607422, "global_step": 138667, "epoch": 825} {"train_loss": -10.210625648498535, "global_step": 138668, "epoch": 825} {"train_loss": -9.900527954101562, "global_step": 138669, "epoch": 825} {"train_loss": -10.2078218460083, "global_step": 138670, "epoch": 825} {"train_loss": -10.017354965209961, "global_step": 138671, "epoch": 825} {"train_loss": -10.539809226989746, "global_step": 138672, "epoch": 825} {"train_loss": -10.20029067993164, "global_step": 138673, "epoch": 825} {"train_loss": -10.342266082763672, "global_step": 138674, "epoch": 825} {"train_loss": -10.521535873413086, "global_step": 138675, "epoch": 825} {"train_loss": -10.30757999420166, "global_step": 138676, "epoch": 825} {"train_loss": -10.465470314025879, "global_step": 138677, "epoch": 825} {"train_loss": -10.510709762573242, "global_step": 138678, "epoch": 825} {"train_loss": -10.48013973236084, "global_step": 138679, "epoch": 825} {"train_loss": -10.423253059387207, "global_step": 138680, "epoch": 825} {"train_loss": -10.737298965454102, "global_step": 138681, "epoch": 825} {"train_loss": -10.499486923217773, "global_step": 138682, "epoch": 825} {"train_loss": -10.566051483154297, "global_step": 138683, "epoch": 825} {"train_loss": -10.396114349365234, "global_step": 138684, "epoch": 825} {"train_loss": -10.728839874267578, "global_step": 138685, "epoch": 825} {"train_loss": -10.418039321899414, "global_step": 138686, "epoch": 825} {"train_loss": -10.60914421081543, "global_step": 138687, "epoch": 825} {"train_loss": -10.356440544128418, "global_step": 138688, "epoch": 825} {"train_loss": -10.778389930725098, "global_step": 138689, "epoch": 825} {"train_loss": -10.633173942565918, "global_step": 138690, "epoch": 825} {"train_loss": -10.583121299743652, "global_step": 138691, "epoch": 825} {"train_loss": -10.796095848083496, "global_step": 138692, "epoch": 825} {"train_loss": -10.752850532531738, "global_step": 138693, "epoch": 825} {"train_loss": -10.626903533935547, "global_step": 138694, "epoch": 825} {"train_loss": -10.777231216430664, "global_step": 138695, "epoch": 825} {"train_loss": -10.814482688903809, "global_step": 138696, "epoch": 825} {"train_loss": -10.6673583984375, "global_step": 138697, "epoch": 825} {"train_loss": -10.696145057678223, "global_step": 138698, "epoch": 825} {"train_loss": -10.73016357421875, "global_step": 138699, "epoch": 825} {"train_loss": -10.649267196655273, "global_step": 138700, "epoch": 825} {"train_loss": -10.943227767944336, "global_step": 138701, "epoch": 825} {"train_loss": -10.76927375793457, "global_step": 138702, "epoch": 825} {"train_loss": -10.939749717712402, "global_step": 138703, "epoch": 825} {"train_loss": -10.807116508483887, "global_step": 138704, "epoch": 825} {"train_loss": -10.874897003173828, "global_step": 138705, "epoch": 825} {"train_loss": -10.884706497192383, "global_step": 138706, "epoch": 825} {"train_loss": -10.839353561401367, "global_step": 138707, "epoch": 825} {"train_loss": -10.740323066711426, "global_step": 138708, "epoch": 825} {"train_loss": -10.670639038085938, "global_step": 138709, "epoch": 825} {"train_loss": -10.851495742797852, "global_step": 138710, "epoch": 825} {"train_loss": -10.631366729736328, "global_step": 138711, "epoch": 825} {"train_loss": -10.643545150756836, "global_step": 138712, "epoch": 825} {"train_loss": -10.65748119354248, "global_step": 138713, "epoch": 825} {"train_loss": -10.756117820739746, "global_step": 138714, "epoch": 825} {"train_loss": -10.494976043701172, "global_step": 138715, "epoch": 825} {"train_loss": -10.291786193847656, "global_step": 138716, "epoch": 825} {"train_loss": -10.037154197692871, "global_step": 138717, "epoch": 825} {"train_loss": -10.183271408081055, "global_step": 138718, "epoch": 825} {"train_loss": -10.704540252685547, "global_step": 138719, "epoch": 825} {"train_loss": -10.409828186035156, "global_step": 138720, "epoch": 825} {"train_loss": -10.633272171020508, "global_step": 138721, "epoch": 825} {"train_loss": -10.178232192993164, "global_step": 138722, "epoch": 825} {"train_loss": -10.417760848999023, "global_step": 138723, "epoch": 825} {"train_loss": -10.195158004760742, "global_step": 138724, "epoch": 825} {"train_loss": -9.769246101379395, "global_step": 138725, "epoch": 825} {"train_loss": -9.92929458618164, "global_step": 138726, "epoch": 825} {"train_loss": -9.996235847473145, "global_step": 138727, "epoch": 825} {"train_loss": -10.400947570800781, "global_step": 138728, "epoch": 825} {"train_loss": -9.923151969909668, "global_step": 138729, "epoch": 825} {"train_loss": -10.004413604736328, "global_step": 138730, "epoch": 825} {"train_loss": -10.073484420776367, "global_step": 138731, "epoch": 825} {"train_loss": -9.833063125610352, "global_step": 138732, "epoch": 825} {"train_loss": -10.537309646606445, "global_step": 138733, "epoch": 825} {"train_loss": -10.031081199645996, "global_step": 138734, "epoch": 825} {"train_loss": -10.553800582885742, "global_step": 138735, "epoch": 825} {"train_loss": -10.103710174560547, "global_step": 138736, "epoch": 825} {"train_loss": -10.520017623901367, "global_step": 138737, "epoch": 825} {"train_loss": -10.241857528686523, "global_step": 138738, "epoch": 825} {"train_loss": -10.481319427490234, "global_step": 138739, "epoch": 825} {"train_loss": -10.387635231018066, "global_step": 138740, "epoch": 825} {"train_loss": -10.446659088134766, "global_step": 138741, "epoch": 825} {"train_loss": -10.240535736083984, "global_step": 138742, "epoch": 825} {"train_loss": -10.1051025390625, "global_step": 138743, "epoch": 825} {"train_loss": -10.40302562713623, "global_step": 138744, "epoch": 825} {"train_loss": -9.762592315673828, "global_step": 138745, "epoch": 825} {"train_loss": -10.499935150146484, "global_step": 138746, "epoch": 825} {"train_loss": -10.441978454589844, "global_step": 138747, "epoch": 825} {"train_loss": -10.097526550292969, "global_step": 138748, "epoch": 825} {"train_loss": -10.588483810424805, "global_step": 138749, "epoch": 825} {"train_loss": -9.910049438476562, "global_step": 138750, "epoch": 825} {"train_loss": -10.516855239868164, "global_step": 138751, "epoch": 825} {"train_loss": -10.37594223022461, "global_step": 138752, "epoch": 825} {"train_loss": -10.173563003540039, "global_step": 138753, "epoch": 825} {"train_loss": -10.564752578735352, "global_step": 138754, "epoch": 825} {"train_loss": -9.842782020568848, "global_step": 138755, "epoch": 825} {"train_loss": -10.46221923828125, "global_step": 138756, "epoch": 825} {"train_loss": -10.249441146850586, "global_step": 138757, "epoch": 825} {"train_loss": -10.285355567932129, "global_step": 138758, "epoch": 825} {"train_loss": -10.167449951171875, "global_step": 138759, "epoch": 825} {"train_loss": -10.589883804321289, "global_step": 138760, "epoch": 825} {"train_loss": -10.179001808166504, "global_step": 138761, "epoch": 825} {"train_loss": -10.428667068481445, "global_step": 138762, "epoch": 825} {"train_loss": -10.322412490844727, "global_step": 138763, "epoch": 825} {"train_loss": -10.543882369995117, "global_step": 138764, "epoch": 825} {"train_loss": -10.322010040283203, "global_step": 138765, "epoch": 825} {"train_loss": -10.468868255615234, "global_step": 138766, "epoch": 825} {"train_loss": -10.431604760033744, "global_step": 138767, "epoch": 825, "val_loss": 226662.75, "train_action_mse_error": 1.8945144414901733} {"train_loss": -10.547353744506836, "global_step": 138768, "epoch": 826} {"train_loss": -10.565241813659668, "global_step": 138769, "epoch": 826} {"train_loss": -10.552120208740234, "global_step": 138770, "epoch": 826} {"train_loss": -10.425823211669922, "global_step": 138771, "epoch": 826} {"train_loss": -10.567402839660645, "global_step": 138772, "epoch": 826} {"train_loss": -10.450806617736816, "global_step": 138773, "epoch": 826} {"train_loss": -10.230798721313477, "global_step": 138774, "epoch": 826} {"train_loss": -10.4288911819458, "global_step": 138775, "epoch": 826} {"train_loss": -10.405986785888672, "global_step": 138776, "epoch": 826} {"train_loss": -10.46370792388916, "global_step": 138777, "epoch": 826} {"train_loss": -10.699131965637207, "global_step": 138778, "epoch": 826} {"train_loss": -10.622218132019043, "global_step": 138779, "epoch": 826} {"train_loss": -10.484249114990234, "global_step": 138780, "epoch": 826} {"train_loss": -10.761765480041504, "global_step": 138781, "epoch": 826} {"train_loss": -10.515082359313965, "global_step": 138782, "epoch": 826} {"train_loss": -10.295858383178711, "global_step": 138783, "epoch": 826} {"train_loss": -10.546211242675781, "global_step": 138784, "epoch": 826} {"train_loss": -10.302194595336914, "global_step": 138785, "epoch": 826} {"train_loss": -10.355130195617676, "global_step": 138786, "epoch": 826} {"train_loss": -10.130849838256836, "global_step": 138787, "epoch": 826} {"train_loss": -10.502105712890625, "global_step": 138788, "epoch": 826} {"train_loss": -10.19771957397461, "global_step": 138789, "epoch": 826} {"train_loss": -10.546544075012207, "global_step": 138790, "epoch": 826} {"train_loss": -10.476152420043945, "global_step": 138791, "epoch": 826} {"train_loss": -10.637262344360352, "global_step": 138792, "epoch": 826} {"train_loss": -10.448380470275879, "global_step": 138793, "epoch": 826} {"train_loss": -10.407681465148926, "global_step": 138794, "epoch": 826} {"train_loss": -10.706474304199219, "global_step": 138795, "epoch": 826} {"train_loss": -10.75073528289795, "global_step": 138796, "epoch": 826} {"train_loss": -10.669251441955566, "global_step": 138797, "epoch": 826} {"train_loss": -10.58698558807373, "global_step": 138798, "epoch": 826} {"train_loss": -10.645254135131836, "global_step": 138799, "epoch": 826} {"train_loss": -10.57901382446289, "global_step": 138800, "epoch": 826} {"train_loss": -10.521703720092773, "global_step": 138801, "epoch": 826} {"train_loss": -10.605876922607422, "global_step": 138802, "epoch": 826} {"train_loss": -10.527494430541992, "global_step": 138803, "epoch": 826} {"train_loss": -10.137004852294922, "global_step": 138804, "epoch": 826} {"train_loss": -10.338456153869629, "global_step": 138805, "epoch": 826} {"train_loss": -10.623472213745117, "global_step": 138806, "epoch": 826} {"train_loss": -10.263731002807617, "global_step": 138807, "epoch": 826} {"train_loss": -10.712167739868164, "global_step": 138808, "epoch": 826} {"train_loss": -10.455612182617188, "global_step": 138809, "epoch": 826} {"train_loss": -10.760068893432617, "global_step": 138810, "epoch": 826} {"train_loss": -10.819738388061523, "global_step": 138811, "epoch": 826} {"train_loss": -10.665478706359863, "global_step": 138812, "epoch": 826} {"train_loss": -10.734838485717773, "global_step": 138813, "epoch": 826} {"train_loss": -10.755720138549805, "global_step": 138814, "epoch": 826} {"train_loss": -10.571128845214844, "global_step": 138815, "epoch": 826} {"train_loss": -10.687501907348633, "global_step": 138816, "epoch": 826} {"train_loss": -10.596698760986328, "global_step": 138817, "epoch": 826} {"train_loss": -10.661197662353516, "global_step": 138818, "epoch": 826} {"train_loss": -10.59540843963623, "global_step": 138819, "epoch": 826} {"train_loss": -10.746572494506836, "global_step": 138820, "epoch": 826} {"train_loss": -10.491442680358887, "global_step": 138821, "epoch": 826} {"train_loss": -10.846101760864258, "global_step": 138822, "epoch": 826} {"train_loss": -10.739596366882324, "global_step": 138823, "epoch": 826} {"train_loss": -10.704216003417969, "global_step": 138824, "epoch": 826} {"train_loss": -10.518171310424805, "global_step": 138825, "epoch": 826} {"train_loss": -10.282950401306152, "global_step": 138826, "epoch": 826} {"train_loss": -10.80266284942627, "global_step": 138827, "epoch": 826} {"train_loss": -10.503877639770508, "global_step": 138828, "epoch": 826} {"train_loss": -10.20379638671875, "global_step": 138829, "epoch": 826} {"train_loss": -10.40400505065918, "global_step": 138830, "epoch": 826} {"train_loss": -10.890018463134766, "global_step": 138831, "epoch": 826} {"train_loss": -10.222024917602539, "global_step": 138832, "epoch": 826} {"train_loss": -10.610651016235352, "global_step": 138833, "epoch": 826} {"train_loss": -10.458191871643066, "global_step": 138834, "epoch": 826} {"train_loss": -10.679762840270996, "global_step": 138835, "epoch": 826} {"train_loss": -10.609821319580078, "global_step": 138836, "epoch": 826} {"train_loss": -10.480148315429688, "global_step": 138837, "epoch": 826} {"train_loss": -10.701608657836914, "global_step": 138838, "epoch": 826} {"train_loss": -10.187350273132324, "global_step": 138839, "epoch": 826} {"train_loss": -10.309211730957031, "global_step": 138840, "epoch": 826} {"train_loss": -10.288848876953125, "global_step": 138841, "epoch": 826} {"train_loss": -10.603194236755371, "global_step": 138842, "epoch": 826} {"train_loss": -10.161704063415527, "global_step": 138843, "epoch": 826} {"train_loss": -10.321121215820312, "global_step": 138844, "epoch": 826} {"train_loss": -10.012788772583008, "global_step": 138845, "epoch": 826} {"train_loss": -10.119129180908203, "global_step": 138846, "epoch": 826} {"train_loss": -9.729372024536133, "global_step": 138847, "epoch": 826} {"train_loss": -9.975415229797363, "global_step": 138848, "epoch": 826} {"train_loss": -10.664276123046875, "global_step": 138849, "epoch": 826} {"train_loss": -10.333176612854004, "global_step": 138850, "epoch": 826} {"train_loss": -10.120285034179688, "global_step": 138851, "epoch": 826} {"train_loss": -10.518776893615723, "global_step": 138852, "epoch": 826} {"train_loss": -10.322260856628418, "global_step": 138853, "epoch": 826} {"train_loss": -10.26466178894043, "global_step": 138854, "epoch": 826} {"train_loss": -10.718513488769531, "global_step": 138855, "epoch": 826} {"train_loss": -10.372613906860352, "global_step": 138856, "epoch": 826} {"train_loss": -10.282122611999512, "global_step": 138857, "epoch": 826} {"train_loss": -10.671157836914062, "global_step": 138858, "epoch": 826} {"train_loss": -10.63507080078125, "global_step": 138859, "epoch": 826} {"train_loss": -10.268033981323242, "global_step": 138860, "epoch": 826} {"train_loss": -10.546634674072266, "global_step": 138861, "epoch": 826} {"train_loss": -10.344200134277344, "global_step": 138862, "epoch": 826} {"train_loss": -10.35437297821045, "global_step": 138863, "epoch": 826} {"train_loss": -10.317123413085938, "global_step": 138864, "epoch": 826} {"train_loss": -9.933709144592285, "global_step": 138865, "epoch": 826} {"train_loss": -10.215867042541504, "global_step": 138866, "epoch": 826} {"train_loss": -10.280424118041992, "global_step": 138867, "epoch": 826} {"train_loss": -9.88382339477539, "global_step": 138868, "epoch": 826} {"train_loss": -10.517423629760742, "global_step": 138869, "epoch": 826} {"train_loss": -10.261941909790039, "global_step": 138870, "epoch": 826} {"train_loss": -10.461153030395508, "global_step": 138871, "epoch": 826} {"train_loss": -10.004816055297852, "global_step": 138872, "epoch": 826} {"train_loss": -10.230112075805664, "global_step": 138873, "epoch": 826} {"train_loss": -10.148737907409668, "global_step": 138874, "epoch": 826} {"train_loss": -10.635356903076172, "global_step": 138875, "epoch": 826} {"train_loss": -10.432939529418945, "global_step": 138876, "epoch": 826} {"train_loss": -10.077005386352539, "global_step": 138877, "epoch": 826} {"train_loss": -10.516865730285645, "global_step": 138878, "epoch": 826} {"train_loss": -10.193951606750488, "global_step": 138879, "epoch": 826} {"train_loss": -10.533349990844727, "global_step": 138880, "epoch": 826} {"train_loss": -10.224881172180176, "global_step": 138881, "epoch": 826} {"train_loss": -10.564924240112305, "global_step": 138882, "epoch": 826} {"train_loss": -10.288065910339355, "global_step": 138883, "epoch": 826} {"train_loss": -10.677720069885254, "global_step": 138884, "epoch": 826} {"train_loss": -10.435871124267578, "global_step": 138885, "epoch": 826} {"train_loss": -10.418020248413086, "global_step": 138886, "epoch": 826} {"train_loss": -10.641861915588379, "global_step": 138887, "epoch": 826} {"train_loss": -10.386321067810059, "global_step": 138888, "epoch": 826} {"train_loss": -10.408040046691895, "global_step": 138889, "epoch": 826} {"train_loss": -10.475813865661621, "global_step": 138890, "epoch": 826} {"train_loss": -10.548189163208008, "global_step": 138891, "epoch": 826} {"train_loss": -10.640623092651367, "global_step": 138892, "epoch": 826} {"train_loss": -10.66727066040039, "global_step": 138893, "epoch": 826} {"train_loss": -10.738903045654297, "global_step": 138894, "epoch": 826} {"train_loss": -10.611246109008789, "global_step": 138895, "epoch": 826} {"train_loss": -10.783689498901367, "global_step": 138896, "epoch": 826} {"train_loss": -10.686843872070312, "global_step": 138897, "epoch": 826} {"train_loss": -10.45055866241455, "global_step": 138898, "epoch": 826} {"train_loss": -10.764959335327148, "global_step": 138899, "epoch": 826} {"train_loss": -10.656991958618164, "global_step": 138900, "epoch": 826} {"train_loss": -10.781530380249023, "global_step": 138901, "epoch": 826} {"train_loss": -10.64516544342041, "global_step": 138902, "epoch": 826} {"train_loss": -10.540821075439453, "global_step": 138903, "epoch": 826} {"train_loss": -10.472542762756348, "global_step": 138904, "epoch": 826} {"train_loss": -10.664331436157227, "global_step": 138905, "epoch": 826} {"train_loss": -10.508872985839844, "global_step": 138906, "epoch": 826} {"train_loss": -10.574667930603027, "global_step": 138907, "epoch": 826} {"train_loss": -10.401586532592773, "global_step": 138908, "epoch": 826} {"train_loss": -10.406269073486328, "global_step": 138909, "epoch": 826} {"train_loss": -10.330732345581055, "global_step": 138910, "epoch": 826} {"train_loss": -10.617949485778809, "global_step": 138911, "epoch": 826} {"train_loss": -10.600400924682617, "global_step": 138912, "epoch": 826} {"train_loss": -10.698661804199219, "global_step": 138913, "epoch": 826} {"train_loss": -10.1460599899292, "global_step": 138914, "epoch": 826} {"train_loss": -10.809917449951172, "global_step": 138915, "epoch": 826} {"train_loss": -10.416267395019531, "global_step": 138916, "epoch": 826} {"train_loss": -10.407398223876953, "global_step": 138917, "epoch": 826} {"train_loss": -10.204474449157715, "global_step": 138918, "epoch": 826} {"train_loss": -10.264461517333984, "global_step": 138919, "epoch": 826} {"train_loss": -9.92501449584961, "global_step": 138920, "epoch": 826} {"train_loss": -9.510993957519531, "global_step": 138921, "epoch": 826} {"train_loss": -10.704882621765137, "global_step": 138922, "epoch": 826} {"train_loss": -9.697500228881836, "global_step": 138923, "epoch": 826} {"train_loss": -10.267288208007812, "global_step": 138924, "epoch": 826} {"train_loss": -9.574909210205078, "global_step": 138925, "epoch": 826} {"train_loss": -9.450039863586426, "global_step": 138926, "epoch": 826} {"train_loss": -9.715766906738281, "global_step": 138927, "epoch": 826} {"train_loss": -8.986764907836914, "global_step": 138928, "epoch": 826} {"train_loss": -8.690081596374512, "global_step": 138929, "epoch": 826} {"train_loss": -9.837696075439453, "global_step": 138930, "epoch": 826} {"train_loss": -8.815662384033203, "global_step": 138931, "epoch": 826} {"train_loss": -9.633199691772461, "global_step": 138932, "epoch": 826} {"train_loss": -8.655712127685547, "global_step": 138933, "epoch": 826} {"train_loss": -9.849255561828613, "global_step": 138934, "epoch": 826} {"train_loss": -10.374565442403158, "global_step": 138935, "epoch": 826, "val_loss": 219899.640625} {"train_loss": -9.474466323852539, "global_step": 138936, "epoch": 827} {"train_loss": -9.007757186889648, "global_step": 138937, "epoch": 827} {"train_loss": -9.401540756225586, "global_step": 138938, "epoch": 827} {"train_loss": -9.460217475891113, "global_step": 138939, "epoch": 827} {"train_loss": -8.814966201782227, "global_step": 138940, "epoch": 827} {"train_loss": -9.957594871520996, "global_step": 138941, "epoch": 827} {"train_loss": -9.157098770141602, "global_step": 138942, "epoch": 827} {"train_loss": -9.18875503540039, "global_step": 138943, "epoch": 827} {"train_loss": -10.007194519042969, "global_step": 138944, "epoch": 827} {"train_loss": -9.687934875488281, "global_step": 138945, "epoch": 827} {"train_loss": -9.625139236450195, "global_step": 138946, "epoch": 827} {"train_loss": -9.881115913391113, "global_step": 138947, "epoch": 827} {"train_loss": -9.571808815002441, "global_step": 138948, "epoch": 827} {"train_loss": -9.579489707946777, "global_step": 138949, "epoch": 827} {"train_loss": -9.977850914001465, "global_step": 138950, "epoch": 827} {"train_loss": -9.5934419631958, "global_step": 138951, "epoch": 827} {"train_loss": -9.503664016723633, "global_step": 138952, "epoch": 827} {"train_loss": -9.873489379882812, "global_step": 138953, "epoch": 827} {"train_loss": -9.904526710510254, "global_step": 138954, "epoch": 827} {"train_loss": -9.489874839782715, "global_step": 138955, "epoch": 827} {"train_loss": -10.126771926879883, "global_step": 138956, "epoch": 827} {"train_loss": -10.246021270751953, "global_step": 138957, "epoch": 827} {"train_loss": -9.67408275604248, "global_step": 138958, "epoch": 827} {"train_loss": -9.820049285888672, "global_step": 138959, "epoch": 827} {"train_loss": -10.163938522338867, "global_step": 138960, "epoch": 827} {"train_loss": -10.045394897460938, "global_step": 138961, "epoch": 827} {"train_loss": -10.062287330627441, "global_step": 138962, "epoch": 827} {"train_loss": -10.25391960144043, "global_step": 138963, "epoch": 827} {"train_loss": -9.913976669311523, "global_step": 138964, "epoch": 827} {"train_loss": -10.158446311950684, "global_step": 138965, "epoch": 827} {"train_loss": -10.305493354797363, "global_step": 138966, "epoch": 827} {"train_loss": -10.110107421875, "global_step": 138967, "epoch": 827} {"train_loss": -10.192584991455078, "global_step": 138968, "epoch": 827} {"train_loss": -10.258214950561523, "global_step": 138969, "epoch": 827} {"train_loss": -10.251935005187988, "global_step": 138970, "epoch": 827} {"train_loss": -10.338960647583008, "global_step": 138971, "epoch": 827} {"train_loss": -10.206510543823242, "global_step": 138972, "epoch": 827} {"train_loss": -10.557395935058594, "global_step": 138973, "epoch": 827} {"train_loss": -10.474685668945312, "global_step": 138974, "epoch": 827} {"train_loss": -10.49864673614502, "global_step": 138975, "epoch": 827} {"train_loss": -10.569818496704102, "global_step": 138976, "epoch": 827} {"train_loss": -10.43140983581543, "global_step": 138977, "epoch": 827} {"train_loss": -10.606660842895508, "global_step": 138978, "epoch": 827} {"train_loss": -10.632509231567383, "global_step": 138979, "epoch": 827} {"train_loss": -10.494028091430664, "global_step": 138980, "epoch": 827} {"train_loss": -10.510123252868652, "global_step": 138981, "epoch": 827} {"train_loss": -10.47451400756836, "global_step": 138982, "epoch": 827} {"train_loss": -10.514580726623535, "global_step": 138983, "epoch": 827} {"train_loss": -10.657812118530273, "global_step": 138984, "epoch": 827} {"train_loss": -10.93433952331543, "global_step": 138985, "epoch": 827} {"train_loss": -10.786398887634277, "global_step": 138986, "epoch": 827} {"train_loss": -10.680814743041992, "global_step": 138987, "epoch": 827} {"train_loss": -10.725517272949219, "global_step": 138988, "epoch": 827} {"train_loss": -10.682470321655273, "global_step": 138989, "epoch": 827} {"train_loss": -10.691085815429688, "global_step": 138990, "epoch": 827} {"train_loss": -10.868010520935059, "global_step": 138991, "epoch": 827} {"train_loss": -10.88591480255127, "global_step": 138992, "epoch": 827} {"train_loss": -10.798463821411133, "global_step": 138993, "epoch": 827} {"train_loss": -10.586164474487305, "global_step": 138994, "epoch": 827} {"train_loss": -10.463664054870605, "global_step": 138995, "epoch": 827} {"train_loss": -10.562976837158203, "global_step": 138996, "epoch": 827} {"train_loss": -10.506932258605957, "global_step": 138997, "epoch": 827} {"train_loss": -10.640997886657715, "global_step": 138998, "epoch": 827} {"train_loss": -10.521139144897461, "global_step": 138999, "epoch": 827} {"train_loss": -10.808627128601074, "global_step": 139000, "epoch": 827} {"train_loss": -10.674270629882812, "global_step": 139001, "epoch": 827} {"train_loss": -10.763741493225098, "global_step": 139002, "epoch": 827} {"train_loss": -10.615523338317871, "global_step": 139003, "epoch": 827} {"train_loss": -10.850557327270508, "global_step": 139004, "epoch": 827} {"train_loss": -10.556553840637207, "global_step": 139005, "epoch": 827} {"train_loss": -10.69810676574707, "global_step": 139006, "epoch": 827} {"train_loss": -10.832202911376953, "global_step": 139007, "epoch": 827} {"train_loss": -10.778356552124023, "global_step": 139008, "epoch": 827} {"train_loss": -10.64909839630127, "global_step": 139009, "epoch": 827} {"train_loss": -10.17924690246582, "global_step": 139010, "epoch": 827} {"train_loss": -10.204500198364258, "global_step": 139011, "epoch": 827} {"train_loss": -10.294219970703125, "global_step": 139012, "epoch": 827} {"train_loss": -10.633895874023438, "global_step": 139013, "epoch": 827} {"train_loss": -10.565397262573242, "global_step": 139014, "epoch": 827} {"train_loss": -10.58285140991211, "global_step": 139015, "epoch": 827} {"train_loss": -10.67845344543457, "global_step": 139016, "epoch": 827} {"train_loss": -10.658248901367188, "global_step": 139017, "epoch": 827} {"train_loss": -10.69503402709961, "global_step": 139018, "epoch": 827} {"train_loss": -10.815576553344727, "global_step": 139019, "epoch": 827} {"train_loss": -10.785308837890625, "global_step": 139020, "epoch": 827} {"train_loss": -10.759095191955566, "global_step": 139021, "epoch": 827} {"train_loss": -10.654104232788086, "global_step": 139022, "epoch": 827} {"train_loss": -10.42854118347168, "global_step": 139023, "epoch": 827} {"train_loss": -10.658533096313477, "global_step": 139024, "epoch": 827} {"train_loss": -10.249761581420898, "global_step": 139025, "epoch": 827} {"train_loss": -10.393712997436523, "global_step": 139026, "epoch": 827} {"train_loss": -10.628852844238281, "global_step": 139027, "epoch": 827} {"train_loss": -9.440771102905273, "global_step": 139028, "epoch": 827} {"train_loss": -9.78477668762207, "global_step": 139029, "epoch": 827} {"train_loss": -10.457529067993164, "global_step": 139030, "epoch": 827} {"train_loss": -10.029247283935547, "global_step": 139031, "epoch": 827} {"train_loss": -10.497995376586914, "global_step": 139032, "epoch": 827} {"train_loss": -9.854314804077148, "global_step": 139033, "epoch": 827} {"train_loss": -10.585249900817871, "global_step": 139034, "epoch": 827} {"train_loss": -10.078834533691406, "global_step": 139035, "epoch": 827} {"train_loss": -10.496025085449219, "global_step": 139036, "epoch": 827} {"train_loss": -10.451488494873047, "global_step": 139037, "epoch": 827} {"train_loss": -10.54511833190918, "global_step": 139038, "epoch": 827} {"train_loss": -10.689027786254883, "global_step": 139039, "epoch": 827} {"train_loss": -10.394370079040527, "global_step": 139040, "epoch": 827} {"train_loss": -10.661706924438477, "global_step": 139041, "epoch": 827} {"train_loss": -10.453987121582031, "global_step": 139042, "epoch": 827} {"train_loss": -10.824442863464355, "global_step": 139043, "epoch": 827} {"train_loss": -10.577818870544434, "global_step": 139044, "epoch": 827} {"train_loss": -10.384746551513672, "global_step": 139045, "epoch": 827} {"train_loss": -10.656696319580078, "global_step": 139046, "epoch": 827} {"train_loss": -10.57275390625, "global_step": 139047, "epoch": 827} {"train_loss": -10.735613822937012, "global_step": 139048, "epoch": 827} {"train_loss": -10.75784683227539, "global_step": 139049, "epoch": 827} {"train_loss": -10.885714530944824, "global_step": 139050, "epoch": 827} {"train_loss": -10.53748607635498, "global_step": 139051, "epoch": 827} {"train_loss": -10.48958683013916, "global_step": 139052, "epoch": 827} {"train_loss": -10.727492332458496, "global_step": 139053, "epoch": 827} {"train_loss": -10.738570213317871, "global_step": 139054, "epoch": 827} {"train_loss": -10.728029251098633, "global_step": 139055, "epoch": 827} {"train_loss": -10.771866798400879, "global_step": 139056, "epoch": 827} {"train_loss": -10.822242736816406, "global_step": 139057, "epoch": 827} {"train_loss": -10.675094604492188, "global_step": 139058, "epoch": 827} {"train_loss": -10.718698501586914, "global_step": 139059, "epoch": 827} {"train_loss": -10.636027336120605, "global_step": 139060, "epoch": 827} {"train_loss": -10.700926780700684, "global_step": 139061, "epoch": 827} {"train_loss": -10.628267288208008, "global_step": 139062, "epoch": 827} {"train_loss": -10.485383987426758, "global_step": 139063, "epoch": 827} {"train_loss": -10.897751808166504, "global_step": 139064, "epoch": 827} {"train_loss": -10.755744934082031, "global_step": 139065, "epoch": 827} {"train_loss": -10.570611000061035, "global_step": 139066, "epoch": 827} {"train_loss": -10.949344635009766, "global_step": 139067, "epoch": 827} {"train_loss": -10.772343635559082, "global_step": 139068, "epoch": 827} {"train_loss": -10.884016036987305, "global_step": 139069, "epoch": 827} {"train_loss": -10.714410781860352, "global_step": 139070, "epoch": 827} {"train_loss": -10.71435832977295, "global_step": 139071, "epoch": 827} {"train_loss": -10.5486421585083, "global_step": 139072, "epoch": 827} {"train_loss": -10.855231285095215, "global_step": 139073, "epoch": 827} {"train_loss": -10.407344818115234, "global_step": 139074, "epoch": 827} {"train_loss": -10.228494644165039, "global_step": 139075, "epoch": 827} {"train_loss": -10.79963207244873, "global_step": 139076, "epoch": 827} {"train_loss": -10.16148567199707, "global_step": 139077, "epoch": 827} {"train_loss": -10.386825561523438, "global_step": 139078, "epoch": 827} {"train_loss": -10.261710166931152, "global_step": 139079, "epoch": 827} {"train_loss": -10.529815673828125, "global_step": 139080, "epoch": 827} {"train_loss": -9.447754859924316, "global_step": 139081, "epoch": 827} {"train_loss": -10.577823638916016, "global_step": 139082, "epoch": 827} {"train_loss": -9.112497329711914, "global_step": 139083, "epoch": 827} {"train_loss": -8.188419342041016, "global_step": 139084, "epoch": 827} {"train_loss": -10.521736145019531, "global_step": 139085, "epoch": 827} {"train_loss": -8.432172775268555, "global_step": 139086, "epoch": 827} {"train_loss": -10.427506446838379, "global_step": 139087, "epoch": 827} {"train_loss": -9.569067001342773, "global_step": 139088, "epoch": 827} {"train_loss": -10.150238037109375, "global_step": 139089, "epoch": 827} {"train_loss": -10.030556678771973, "global_step": 139090, "epoch": 827} {"train_loss": -9.694573402404785, "global_step": 139091, "epoch": 827} {"train_loss": -9.917823791503906, "global_step": 139092, "epoch": 827} {"train_loss": -9.684942245483398, "global_step": 139093, "epoch": 827} {"train_loss": -10.267208099365234, "global_step": 139094, "epoch": 827} {"train_loss": -9.583260536193848, "global_step": 139095, "epoch": 827} {"train_loss": -10.247201919555664, "global_step": 139096, "epoch": 827} {"train_loss": -10.05135726928711, "global_step": 139097, "epoch": 827} {"train_loss": -9.80054759979248, "global_step": 139098, "epoch": 827} {"train_loss": -10.275300979614258, "global_step": 139099, "epoch": 827} {"train_loss": -9.501649856567383, "global_step": 139100, "epoch": 827} {"train_loss": -10.38851547241211, "global_step": 139101, "epoch": 827} {"train_loss": -9.868143081665039, "global_step": 139102, "epoch": 827} {"train_loss": -10.310485964729672, "global_step": 139103, "epoch": 827, "val_loss": 216570.296875} {"train_loss": -9.06460952758789, "global_step": 139104, "epoch": 828} {"train_loss": -10.450153350830078, "global_step": 139105, "epoch": 828} {"train_loss": -9.717203140258789, "global_step": 139106, "epoch": 828} {"train_loss": -9.89880657196045, "global_step": 139107, "epoch": 828} {"train_loss": -10.086687088012695, "global_step": 139108, "epoch": 828} {"train_loss": -10.153456687927246, "global_step": 139109, "epoch": 828} {"train_loss": -10.21424674987793, "global_step": 139110, "epoch": 828} {"train_loss": -10.20962142944336, "global_step": 139111, "epoch": 828} {"train_loss": -10.45750904083252, "global_step": 139112, "epoch": 828} {"train_loss": -10.133965492248535, "global_step": 139113, "epoch": 828} {"train_loss": -10.302751541137695, "global_step": 139114, "epoch": 828} {"train_loss": -10.428374290466309, "global_step": 139115, "epoch": 828} {"train_loss": -10.431695938110352, "global_step": 139116, "epoch": 828} {"train_loss": -10.328784942626953, "global_step": 139117, "epoch": 828} {"train_loss": -10.392965316772461, "global_step": 139118, "epoch": 828} {"train_loss": -10.283697128295898, "global_step": 139119, "epoch": 828} {"train_loss": -10.34056282043457, "global_step": 139120, "epoch": 828} {"train_loss": -10.43498420715332, "global_step": 139121, "epoch": 828} {"train_loss": -10.507527351379395, "global_step": 139122, "epoch": 828} {"train_loss": -10.319075584411621, "global_step": 139123, "epoch": 828} {"train_loss": -10.43791389465332, "global_step": 139124, "epoch": 828} {"train_loss": -10.472984313964844, "global_step": 139125, "epoch": 828} {"train_loss": -10.583059310913086, "global_step": 139126, "epoch": 828} {"train_loss": -10.473697662353516, "global_step": 139127, "epoch": 828} {"train_loss": -10.467467308044434, "global_step": 139128, "epoch": 828} {"train_loss": -10.448427200317383, "global_step": 139129, "epoch": 828} {"train_loss": -10.679924964904785, "global_step": 139130, "epoch": 828} {"train_loss": -10.335419654846191, "global_step": 139131, "epoch": 828} {"train_loss": -10.466049194335938, "global_step": 139132, "epoch": 828} {"train_loss": -10.52334213256836, "global_step": 139133, "epoch": 828} {"train_loss": -10.443388938903809, "global_step": 139134, "epoch": 828} {"train_loss": -10.298316955566406, "global_step": 139135, "epoch": 828} {"train_loss": -10.46810531616211, "global_step": 139136, "epoch": 828} {"train_loss": -10.545443534851074, "global_step": 139137, "epoch": 828} {"train_loss": -10.581233978271484, "global_step": 139138, "epoch": 828} {"train_loss": -10.736291885375977, "global_step": 139139, "epoch": 828} {"train_loss": -10.3009614944458, "global_step": 139140, "epoch": 828} {"train_loss": -10.663321495056152, "global_step": 139141, "epoch": 828} {"train_loss": -10.830617904663086, "global_step": 139142, "epoch": 828} {"train_loss": -10.704391479492188, "global_step": 139143, "epoch": 828} {"train_loss": -10.513276100158691, "global_step": 139144, "epoch": 828} {"train_loss": -10.568218231201172, "global_step": 139145, "epoch": 828} {"train_loss": -10.583256721496582, "global_step": 139146, "epoch": 828} {"train_loss": -10.703592300415039, "global_step": 139147, "epoch": 828} {"train_loss": -10.54786491394043, "global_step": 139148, "epoch": 828} {"train_loss": -10.572830200195312, "global_step": 139149, "epoch": 828} {"train_loss": -10.780153274536133, "global_step": 139150, "epoch": 828} {"train_loss": -10.674668312072754, "global_step": 139151, "epoch": 828} {"train_loss": -10.679788589477539, "global_step": 139152, "epoch": 828} {"train_loss": -10.278922080993652, "global_step": 139153, "epoch": 828} {"train_loss": -10.503076553344727, "global_step": 139154, "epoch": 828} {"train_loss": -10.648885726928711, "global_step": 139155, "epoch": 828} {"train_loss": -10.397565841674805, "global_step": 139156, "epoch": 828} {"train_loss": -10.10055923461914, "global_step": 139157, "epoch": 828} {"train_loss": -10.84113883972168, "global_step": 139158, "epoch": 828} {"train_loss": -10.042060852050781, "global_step": 139159, "epoch": 828} {"train_loss": -10.578428268432617, "global_step": 139160, "epoch": 828} {"train_loss": -10.284423828125, "global_step": 139161, "epoch": 828} {"train_loss": -10.397751808166504, "global_step": 139162, "epoch": 828} {"train_loss": -10.481687545776367, "global_step": 139163, "epoch": 828} {"train_loss": -10.284292221069336, "global_step": 139164, "epoch": 828} {"train_loss": -10.519054412841797, "global_step": 139165, "epoch": 828} {"train_loss": -10.077725410461426, "global_step": 139166, "epoch": 828} {"train_loss": -10.378804206848145, "global_step": 139167, "epoch": 828} {"train_loss": -10.308030128479004, "global_step": 139168, "epoch": 828} {"train_loss": -10.502318382263184, "global_step": 139169, "epoch": 828} {"train_loss": -10.637123107910156, "global_step": 139170, "epoch": 828} {"train_loss": -10.493061065673828, "global_step": 139171, "epoch": 828} {"train_loss": -10.435444831848145, "global_step": 139172, "epoch": 828} {"train_loss": -10.051628112792969, "global_step": 139173, "epoch": 828} {"train_loss": -10.609403610229492, "global_step": 139174, "epoch": 828} {"train_loss": -10.203840255737305, "global_step": 139175, "epoch": 828} {"train_loss": -10.425585746765137, "global_step": 139176, "epoch": 828} {"train_loss": -10.231438636779785, "global_step": 139177, "epoch": 828} {"train_loss": -10.45997142791748, "global_step": 139178, "epoch": 828} {"train_loss": -10.430228233337402, "global_step": 139179, "epoch": 828} {"train_loss": -10.637718200683594, "global_step": 139180, "epoch": 828} {"train_loss": -10.590272903442383, "global_step": 139181, "epoch": 828} {"train_loss": -10.671412467956543, "global_step": 139182, "epoch": 828} {"train_loss": -10.69294548034668, "global_step": 139183, "epoch": 828} {"train_loss": -10.404901504516602, "global_step": 139184, "epoch": 828} {"train_loss": -10.709592819213867, "global_step": 139185, "epoch": 828} {"train_loss": -10.42873764038086, "global_step": 139186, "epoch": 828} {"train_loss": -10.572912216186523, "global_step": 139187, "epoch": 828} {"train_loss": -10.651268005371094, "global_step": 139188, "epoch": 828} {"train_loss": -10.576169967651367, "global_step": 139189, "epoch": 828} {"train_loss": -10.750739097595215, "global_step": 139190, "epoch": 828} {"train_loss": -10.762166023254395, "global_step": 139191, "epoch": 828} {"train_loss": -10.600043296813965, "global_step": 139192, "epoch": 828} {"train_loss": -10.775288581848145, "global_step": 139193, "epoch": 828} {"train_loss": -10.53433609008789, "global_step": 139194, "epoch": 828} {"train_loss": -10.67857551574707, "global_step": 139195, "epoch": 828} {"train_loss": -10.645515441894531, "global_step": 139196, "epoch": 828} {"train_loss": -10.574313163757324, "global_step": 139197, "epoch": 828} {"train_loss": -10.411229133605957, "global_step": 139198, "epoch": 828} {"train_loss": -10.767494201660156, "global_step": 139199, "epoch": 828} {"train_loss": -10.784109115600586, "global_step": 139200, "epoch": 828} {"train_loss": -10.43358039855957, "global_step": 139201, "epoch": 828} {"train_loss": -10.657958030700684, "global_step": 139202, "epoch": 828} {"train_loss": -10.493280410766602, "global_step": 139203, "epoch": 828} {"train_loss": -10.73524284362793, "global_step": 139204, "epoch": 828} {"train_loss": -10.51812744140625, "global_step": 139205, "epoch": 828} {"train_loss": -10.752948760986328, "global_step": 139206, "epoch": 828} {"train_loss": -10.37252140045166, "global_step": 139207, "epoch": 828} {"train_loss": -10.5665283203125, "global_step": 139208, "epoch": 828} {"train_loss": -10.57080364227295, "global_step": 139209, "epoch": 828} {"train_loss": -10.321797370910645, "global_step": 139210, "epoch": 828} {"train_loss": -10.707016944885254, "global_step": 139211, "epoch": 828} {"train_loss": -10.526365280151367, "global_step": 139212, "epoch": 828} {"train_loss": -10.91112232208252, "global_step": 139213, "epoch": 828} {"train_loss": -10.493265151977539, "global_step": 139214, "epoch": 828} {"train_loss": -10.646110534667969, "global_step": 139215, "epoch": 828} {"train_loss": -10.658758163452148, "global_step": 139216, "epoch": 828} {"train_loss": -10.684732437133789, "global_step": 139217, "epoch": 828} {"train_loss": -10.409645080566406, "global_step": 139218, "epoch": 828} {"train_loss": -10.764410018920898, "global_step": 139219, "epoch": 828} {"train_loss": -10.82297420501709, "global_step": 139220, "epoch": 828} {"train_loss": -10.654190063476562, "global_step": 139221, "epoch": 828} {"train_loss": -10.965253829956055, "global_step": 139222, "epoch": 828} {"train_loss": -10.753097534179688, "global_step": 139223, "epoch": 828} {"train_loss": -10.705615997314453, "global_step": 139224, "epoch": 828} {"train_loss": -10.726317405700684, "global_step": 139225, "epoch": 828} {"train_loss": -10.649336814880371, "global_step": 139226, "epoch": 828} {"train_loss": -10.523456573486328, "global_step": 139227, "epoch": 828} {"train_loss": -10.677398681640625, "global_step": 139228, "epoch": 828} {"train_loss": -10.72877311706543, "global_step": 139229, "epoch": 828} {"train_loss": -10.436802864074707, "global_step": 139230, "epoch": 828} {"train_loss": -10.379913330078125, "global_step": 139231, "epoch": 828} {"train_loss": -10.952341079711914, "global_step": 139232, "epoch": 828} {"train_loss": -10.702546119689941, "global_step": 139233, "epoch": 828} {"train_loss": -10.494867324829102, "global_step": 139234, "epoch": 828} {"train_loss": -10.802571296691895, "global_step": 139235, "epoch": 828} {"train_loss": -10.348772048950195, "global_step": 139236, "epoch": 828} {"train_loss": -10.48255729675293, "global_step": 139237, "epoch": 828} {"train_loss": -10.709831237792969, "global_step": 139238, "epoch": 828} {"train_loss": -10.677021026611328, "global_step": 139239, "epoch": 828} {"train_loss": -10.572283744812012, "global_step": 139240, "epoch": 828} {"train_loss": -10.439187049865723, "global_step": 139241, "epoch": 828} {"train_loss": -10.476030349731445, "global_step": 139242, "epoch": 828} {"train_loss": -10.759981155395508, "global_step": 139243, "epoch": 828} {"train_loss": -10.668022155761719, "global_step": 139244, "epoch": 828} {"train_loss": -10.386991500854492, "global_step": 139245, "epoch": 828} {"train_loss": -10.748019218444824, "global_step": 139246, "epoch": 828} {"train_loss": -10.382790565490723, "global_step": 139247, "epoch": 828} {"train_loss": -10.491844177246094, "global_step": 139248, "epoch": 828} {"train_loss": -10.568809509277344, "global_step": 139249, "epoch": 828} {"train_loss": -10.494373321533203, "global_step": 139250, "epoch": 828} {"train_loss": -10.676299095153809, "global_step": 139251, "epoch": 828} {"train_loss": -10.16746711730957, "global_step": 139252, "epoch": 828} {"train_loss": -10.292936325073242, "global_step": 139253, "epoch": 828} {"train_loss": -10.438987731933594, "global_step": 139254, "epoch": 828} {"train_loss": -10.236989974975586, "global_step": 139255, "epoch": 828} {"train_loss": -10.511445999145508, "global_step": 139256, "epoch": 828} {"train_loss": -10.234972953796387, "global_step": 139257, "epoch": 828} {"train_loss": -10.695782661437988, "global_step": 139258, "epoch": 828} {"train_loss": -10.416476249694824, "global_step": 139259, "epoch": 828} {"train_loss": -10.541518211364746, "global_step": 139260, "epoch": 828} {"train_loss": -10.7247953414917, "global_step": 139261, "epoch": 828} {"train_loss": -10.343544006347656, "global_step": 139262, "epoch": 828} {"train_loss": -10.593937873840332, "global_step": 139263, "epoch": 828} {"train_loss": -10.398961067199707, "global_step": 139264, "epoch": 828} {"train_loss": -10.66175651550293, "global_step": 139265, "epoch": 828} {"train_loss": -10.548711776733398, "global_step": 139266, "epoch": 828} {"train_loss": -10.665699005126953, "global_step": 139267, "epoch": 828} {"train_loss": -10.46297836303711, "global_step": 139268, "epoch": 828} {"train_loss": -10.360479354858398, "global_step": 139269, "epoch": 828} {"train_loss": -10.352029800415039, "global_step": 139270, "epoch": 828} {"train_loss": -10.499750006766547, "global_step": 139271, "epoch": 828, "val_loss": 224237.53125} {"train_loss": -9.800708770751953, "global_step": 139272, "epoch": 829} {"train_loss": -10.448509216308594, "global_step": 139273, "epoch": 829} {"train_loss": -10.095332145690918, "global_step": 139274, "epoch": 829} {"train_loss": -10.309799194335938, "global_step": 139275, "epoch": 829} {"train_loss": -10.039741516113281, "global_step": 139276, "epoch": 829} {"train_loss": -10.15030288696289, "global_step": 139277, "epoch": 829} {"train_loss": -10.59139633178711, "global_step": 139278, "epoch": 829} {"train_loss": -10.197932243347168, "global_step": 139279, "epoch": 829} {"train_loss": -10.25693130493164, "global_step": 139280, "epoch": 829} {"train_loss": -10.482292175292969, "global_step": 139281, "epoch": 829} {"train_loss": -9.833009719848633, "global_step": 139282, "epoch": 829} {"train_loss": -10.295328140258789, "global_step": 139283, "epoch": 829} {"train_loss": -9.86589527130127, "global_step": 139284, "epoch": 829} {"train_loss": -9.997233390808105, "global_step": 139285, "epoch": 829} {"train_loss": -10.45213508605957, "global_step": 139286, "epoch": 829} {"train_loss": -9.823626518249512, "global_step": 139287, "epoch": 829} {"train_loss": -10.59937572479248, "global_step": 139288, "epoch": 829} {"train_loss": -10.221822738647461, "global_step": 139289, "epoch": 829} {"train_loss": -10.366265296936035, "global_step": 139290, "epoch": 829} {"train_loss": -10.213871002197266, "global_step": 139291, "epoch": 829} {"train_loss": -10.328311920166016, "global_step": 139292, "epoch": 829} {"train_loss": -10.065351486206055, "global_step": 139293, "epoch": 829} {"train_loss": -10.374761581420898, "global_step": 139294, "epoch": 829} {"train_loss": -10.188746452331543, "global_step": 139295, "epoch": 829} {"train_loss": -10.55367660522461, "global_step": 139296, "epoch": 829} {"train_loss": -10.709576606750488, "global_step": 139297, "epoch": 829} {"train_loss": -10.115825653076172, "global_step": 139298, "epoch": 829} {"train_loss": -10.414626121520996, "global_step": 139299, "epoch": 829} {"train_loss": -10.197381973266602, "global_step": 139300, "epoch": 829} {"train_loss": -10.45063591003418, "global_step": 139301, "epoch": 829} {"train_loss": -10.55821418762207, "global_step": 139302, "epoch": 829} {"train_loss": -10.530633926391602, "global_step": 139303, "epoch": 829} {"train_loss": -10.096927642822266, "global_step": 139304, "epoch": 829} {"train_loss": -10.652665138244629, "global_step": 139305, "epoch": 829} {"train_loss": -10.253080368041992, "global_step": 139306, "epoch": 829} {"train_loss": -10.602262496948242, "global_step": 139307, "epoch": 829} {"train_loss": -10.23710823059082, "global_step": 139308, "epoch": 829} {"train_loss": -10.506524085998535, "global_step": 139309, "epoch": 829} {"train_loss": -10.65500259399414, "global_step": 139310, "epoch": 829} {"train_loss": -10.536599159240723, "global_step": 139311, "epoch": 829} {"train_loss": -10.61384391784668, "global_step": 139312, "epoch": 829} {"train_loss": -10.469780921936035, "global_step": 139313, "epoch": 829} {"train_loss": -10.649588584899902, "global_step": 139314, "epoch": 829} {"train_loss": -10.705892562866211, "global_step": 139315, "epoch": 829} {"train_loss": -10.730582237243652, "global_step": 139316, "epoch": 829} {"train_loss": -10.593297958374023, "global_step": 139317, "epoch": 829} {"train_loss": -10.664369583129883, "global_step": 139318, "epoch": 829} {"train_loss": -10.420980453491211, "global_step": 139319, "epoch": 829} {"train_loss": -10.590879440307617, "global_step": 139320, "epoch": 829} {"train_loss": -10.42735481262207, "global_step": 139321, "epoch": 829} {"train_loss": -10.89054012298584, "global_step": 139322, "epoch": 829} {"train_loss": -10.495183944702148, "global_step": 139323, "epoch": 829} {"train_loss": -10.742973327636719, "global_step": 139324, "epoch": 829} {"train_loss": -10.535030364990234, "global_step": 139325, "epoch": 829} {"train_loss": -10.723888397216797, "global_step": 139326, "epoch": 829} {"train_loss": -10.575541496276855, "global_step": 139327, "epoch": 829} {"train_loss": -10.705791473388672, "global_step": 139328, "epoch": 829} {"train_loss": -10.379193305969238, "global_step": 139329, "epoch": 829} {"train_loss": -10.812585830688477, "global_step": 139330, "epoch": 829} {"train_loss": -10.58718490600586, "global_step": 139331, "epoch": 829} {"train_loss": -10.822001457214355, "global_step": 139332, "epoch": 829} {"train_loss": -10.657079696655273, "global_step": 139333, "epoch": 829} {"train_loss": -10.522401809692383, "global_step": 139334, "epoch": 829} {"train_loss": -10.629701614379883, "global_step": 139335, "epoch": 829} {"train_loss": -10.571715354919434, "global_step": 139336, "epoch": 829} {"train_loss": -10.661561965942383, "global_step": 139337, "epoch": 829} {"train_loss": -10.448898315429688, "global_step": 139338, "epoch": 829} {"train_loss": -10.424295425415039, "global_step": 139339, "epoch": 829} {"train_loss": -10.387181282043457, "global_step": 139340, "epoch": 829} {"train_loss": -10.294302940368652, "global_step": 139341, "epoch": 829} {"train_loss": -10.492703437805176, "global_step": 139342, "epoch": 829} {"train_loss": -10.417192459106445, "global_step": 139343, "epoch": 829} {"train_loss": -10.179362297058105, "global_step": 139344, "epoch": 829} {"train_loss": -10.46899127960205, "global_step": 139345, "epoch": 829} {"train_loss": -10.047422409057617, "global_step": 139346, "epoch": 829} {"train_loss": -10.16429328918457, "global_step": 139347, "epoch": 829} {"train_loss": -10.10322380065918, "global_step": 139348, "epoch": 829} {"train_loss": -9.532867431640625, "global_step": 139349, "epoch": 829} {"train_loss": -10.663984298706055, "global_step": 139350, "epoch": 829} {"train_loss": -9.353004455566406, "global_step": 139351, "epoch": 829} {"train_loss": -9.922750473022461, "global_step": 139352, "epoch": 829} {"train_loss": -10.473235130310059, "global_step": 139353, "epoch": 829} {"train_loss": -9.791345596313477, "global_step": 139354, "epoch": 829} {"train_loss": -10.756816864013672, "global_step": 139355, "epoch": 829} {"train_loss": -10.321945190429688, "global_step": 139356, "epoch": 829} {"train_loss": -10.430438041687012, "global_step": 139357, "epoch": 829} {"train_loss": -10.522597312927246, "global_step": 139358, "epoch": 829} {"train_loss": -10.555166244506836, "global_step": 139359, "epoch": 829} {"train_loss": -10.149202346801758, "global_step": 139360, "epoch": 829} {"train_loss": -10.47145938873291, "global_step": 139361, "epoch": 829} {"train_loss": -10.56266975402832, "global_step": 139362, "epoch": 829} {"train_loss": -10.303060531616211, "global_step": 139363, "epoch": 829} {"train_loss": -10.671889305114746, "global_step": 139364, "epoch": 829} {"train_loss": -10.650785446166992, "global_step": 139365, "epoch": 829} {"train_loss": -10.69109058380127, "global_step": 139366, "epoch": 829} {"train_loss": -10.593213081359863, "global_step": 139367, "epoch": 829} {"train_loss": -10.724185943603516, "global_step": 139368, "epoch": 829} {"train_loss": -10.690971374511719, "global_step": 139369, "epoch": 829} {"train_loss": -10.539572715759277, "global_step": 139370, "epoch": 829} {"train_loss": -10.098584175109863, "global_step": 139371, "epoch": 829} {"train_loss": -10.53693675994873, "global_step": 139372, "epoch": 829} {"train_loss": -10.479085922241211, "global_step": 139373, "epoch": 829} {"train_loss": -10.38092041015625, "global_step": 139374, "epoch": 829} {"train_loss": -10.656028747558594, "global_step": 139375, "epoch": 829} {"train_loss": -10.22364616394043, "global_step": 139376, "epoch": 829} {"train_loss": -10.531890869140625, "global_step": 139377, "epoch": 829} {"train_loss": -10.317358016967773, "global_step": 139378, "epoch": 829} {"train_loss": -10.694232940673828, "global_step": 139379, "epoch": 829} {"train_loss": -10.373912811279297, "global_step": 139380, "epoch": 829} {"train_loss": -10.607597351074219, "global_step": 139381, "epoch": 829} {"train_loss": -10.3922119140625, "global_step": 139382, "epoch": 829} {"train_loss": -10.346446990966797, "global_step": 139383, "epoch": 829} {"train_loss": -10.608352661132812, "global_step": 139384, "epoch": 829} {"train_loss": -10.44610595703125, "global_step": 139385, "epoch": 829} {"train_loss": -10.735579490661621, "global_step": 139386, "epoch": 829} {"train_loss": -10.678050994873047, "global_step": 139387, "epoch": 829} {"train_loss": -10.408634185791016, "global_step": 139388, "epoch": 829} {"train_loss": -10.641132354736328, "global_step": 139389, "epoch": 829} {"train_loss": -10.490090370178223, "global_step": 139390, "epoch": 829} {"train_loss": -10.762248992919922, "global_step": 139391, "epoch": 829} {"train_loss": -10.655346870422363, "global_step": 139392, "epoch": 829} {"train_loss": -10.78941822052002, "global_step": 139393, "epoch": 829} {"train_loss": -10.761789321899414, "global_step": 139394, "epoch": 829} {"train_loss": -10.852693557739258, "global_step": 139395, "epoch": 829} {"train_loss": -10.48495864868164, "global_step": 139396, "epoch": 829} {"train_loss": -10.906471252441406, "global_step": 139397, "epoch": 829} {"train_loss": -10.5587797164917, "global_step": 139398, "epoch": 829} {"train_loss": -10.801460266113281, "global_step": 139399, "epoch": 829} {"train_loss": -10.848564147949219, "global_step": 139400, "epoch": 829} {"train_loss": -10.811677932739258, "global_step": 139401, "epoch": 829} {"train_loss": -10.639537811279297, "global_step": 139402, "epoch": 829} {"train_loss": -10.513583183288574, "global_step": 139403, "epoch": 829} {"train_loss": -10.053838729858398, "global_step": 139404, "epoch": 829} {"train_loss": -10.911916732788086, "global_step": 139405, "epoch": 829} {"train_loss": -10.208734512329102, "global_step": 139406, "epoch": 829} {"train_loss": -10.75542163848877, "global_step": 139407, "epoch": 829} {"train_loss": -10.662564277648926, "global_step": 139408, "epoch": 829} {"train_loss": -10.981260299682617, "global_step": 139409, "epoch": 829} {"train_loss": -10.67863941192627, "global_step": 139410, "epoch": 829} {"train_loss": -10.700658798217773, "global_step": 139411, "epoch": 829} {"train_loss": -10.807236671447754, "global_step": 139412, "epoch": 829} {"train_loss": -10.708416938781738, "global_step": 139413, "epoch": 829} {"train_loss": -10.291462898254395, "global_step": 139414, "epoch": 829} {"train_loss": -10.739418029785156, "global_step": 139415, "epoch": 829} {"train_loss": -10.756546020507812, "global_step": 139416, "epoch": 829} {"train_loss": -10.546623229980469, "global_step": 139417, "epoch": 829} {"train_loss": -10.26550579071045, "global_step": 139418, "epoch": 829} {"train_loss": -10.466924667358398, "global_step": 139419, "epoch": 829} {"train_loss": -10.678210258483887, "global_step": 139420, "epoch": 829} {"train_loss": -10.346009254455566, "global_step": 139421, "epoch": 829} {"train_loss": -10.459188461303711, "global_step": 139422, "epoch": 829} {"train_loss": -10.638328552246094, "global_step": 139423, "epoch": 829} {"train_loss": -10.509008407592773, "global_step": 139424, "epoch": 829} {"train_loss": -10.65328598022461, "global_step": 139425, "epoch": 829} {"train_loss": -10.700212478637695, "global_step": 139426, "epoch": 829} {"train_loss": -10.643028259277344, "global_step": 139427, "epoch": 829} {"train_loss": -10.759214401245117, "global_step": 139428, "epoch": 829} {"train_loss": -10.739068031311035, "global_step": 139429, "epoch": 829} {"train_loss": -10.399969100952148, "global_step": 139430, "epoch": 829} {"train_loss": -10.44904613494873, "global_step": 139431, "epoch": 829} {"train_loss": -10.639689445495605, "global_step": 139432, "epoch": 829} {"train_loss": -10.736153602600098, "global_step": 139433, "epoch": 829} {"train_loss": -10.709772109985352, "global_step": 139434, "epoch": 829} {"train_loss": -10.651268005371094, "global_step": 139435, "epoch": 829} {"train_loss": -10.843029022216797, "global_step": 139436, "epoch": 829} {"train_loss": -10.466781616210938, "global_step": 139437, "epoch": 829} {"train_loss": -10.470968246459961, "global_step": 139438, "epoch": 829} {"train_loss": -10.480683758145286, "global_step": 139439, "epoch": 829, "val_loss": 222739.046875} {"train_loss": -10.558603286743164, "global_step": 139440, "epoch": 830} {"train_loss": -10.68521499633789, "global_step": 139441, "epoch": 830} {"train_loss": -10.224672317504883, "global_step": 139442, "epoch": 830} {"train_loss": -10.632011413574219, "global_step": 139443, "epoch": 830} {"train_loss": -10.681437492370605, "global_step": 139444, "epoch": 830} {"train_loss": -10.732187271118164, "global_step": 139445, "epoch": 830} {"train_loss": -10.49050521850586, "global_step": 139446, "epoch": 830} {"train_loss": -10.713823318481445, "global_step": 139447, "epoch": 830} {"train_loss": -10.57040023803711, "global_step": 139448, "epoch": 830} {"train_loss": -10.684770584106445, "global_step": 139449, "epoch": 830} {"train_loss": -10.573802947998047, "global_step": 139450, "epoch": 830} {"train_loss": -10.329615592956543, "global_step": 139451, "epoch": 830} {"train_loss": -10.658297538757324, "global_step": 139452, "epoch": 830} {"train_loss": -10.298227310180664, "global_step": 139453, "epoch": 830} {"train_loss": -10.610564231872559, "global_step": 139454, "epoch": 830} {"train_loss": -10.74380874633789, "global_step": 139455, "epoch": 830} {"train_loss": -10.627248764038086, "global_step": 139456, "epoch": 830} {"train_loss": -10.6883544921875, "global_step": 139457, "epoch": 830} {"train_loss": -10.525370597839355, "global_step": 139458, "epoch": 830} {"train_loss": -10.615547180175781, "global_step": 139459, "epoch": 830} {"train_loss": -10.504966735839844, "global_step": 139460, "epoch": 830} {"train_loss": -10.476943969726562, "global_step": 139461, "epoch": 830} {"train_loss": -10.595746994018555, "global_step": 139462, "epoch": 830} {"train_loss": -10.423181533813477, "global_step": 139463, "epoch": 830} {"train_loss": -10.589558601379395, "global_step": 139464, "epoch": 830} {"train_loss": -10.186594009399414, "global_step": 139465, "epoch": 830} {"train_loss": -10.508338928222656, "global_step": 139466, "epoch": 830} {"train_loss": -10.337423324584961, "global_step": 139467, "epoch": 830} {"train_loss": -10.556879043579102, "global_step": 139468, "epoch": 830} {"train_loss": -9.945695877075195, "global_step": 139469, "epoch": 830} {"train_loss": -9.982454299926758, "global_step": 139470, "epoch": 830} {"train_loss": -9.577359199523926, "global_step": 139471, "epoch": 830} {"train_loss": -9.812445640563965, "global_step": 139472, "epoch": 830} {"train_loss": -10.067598342895508, "global_step": 139473, "epoch": 830} {"train_loss": -9.098653793334961, "global_step": 139474, "epoch": 830} {"train_loss": -10.205482482910156, "global_step": 139475, "epoch": 830} {"train_loss": -10.355630874633789, "global_step": 139476, "epoch": 830} {"train_loss": -9.763397216796875, "global_step": 139477, "epoch": 830} {"train_loss": -10.271025657653809, "global_step": 139478, "epoch": 830} {"train_loss": -10.166358947753906, "global_step": 139479, "epoch": 830} {"train_loss": -10.419476509094238, "global_step": 139480, "epoch": 830} {"train_loss": -10.475686073303223, "global_step": 139481, "epoch": 830} {"train_loss": -10.497879028320312, "global_step": 139482, "epoch": 830} {"train_loss": -10.230518341064453, "global_step": 139483, "epoch": 830} {"train_loss": -10.665199279785156, "global_step": 139484, "epoch": 830} {"train_loss": -10.345491409301758, "global_step": 139485, "epoch": 830} {"train_loss": -10.045206069946289, "global_step": 139486, "epoch": 830} {"train_loss": -10.293567657470703, "global_step": 139487, "epoch": 830} {"train_loss": -10.341716766357422, "global_step": 139488, "epoch": 830} {"train_loss": -10.367555618286133, "global_step": 139489, "epoch": 830} {"train_loss": -10.427555084228516, "global_step": 139490, "epoch": 830} {"train_loss": -10.44544792175293, "global_step": 139491, "epoch": 830} {"train_loss": -9.978128433227539, "global_step": 139492, "epoch": 830} {"train_loss": -10.517871856689453, "global_step": 139493, "epoch": 830} {"train_loss": -10.630908966064453, "global_step": 139494, "epoch": 830} {"train_loss": -10.457914352416992, "global_step": 139495, "epoch": 830} {"train_loss": -10.639616012573242, "global_step": 139496, "epoch": 830} {"train_loss": -10.630329132080078, "global_step": 139497, "epoch": 830} {"train_loss": -10.527036666870117, "global_step": 139498, "epoch": 830} {"train_loss": -10.441902160644531, "global_step": 139499, "epoch": 830} {"train_loss": -10.53010082244873, "global_step": 139500, "epoch": 830} {"train_loss": -10.422563552856445, "global_step": 139501, "epoch": 830} {"train_loss": -10.852320671081543, "global_step": 139502, "epoch": 830} {"train_loss": -10.301170349121094, "global_step": 139503, "epoch": 830} {"train_loss": -10.764485359191895, "global_step": 139504, "epoch": 830} {"train_loss": -9.944549560546875, "global_step": 139505, "epoch": 830} {"train_loss": -10.27294921875, "global_step": 139506, "epoch": 830} {"train_loss": -10.47093391418457, "global_step": 139507, "epoch": 830} {"train_loss": -10.320585250854492, "global_step": 139508, "epoch": 830} {"train_loss": -10.421133041381836, "global_step": 139509, "epoch": 830} {"train_loss": -10.580944061279297, "global_step": 139510, "epoch": 830} {"train_loss": -10.369612693786621, "global_step": 139511, "epoch": 830} {"train_loss": -10.678407669067383, "global_step": 139512, "epoch": 830} {"train_loss": -10.30202865600586, "global_step": 139513, "epoch": 830} {"train_loss": -10.569049835205078, "global_step": 139514, "epoch": 830} {"train_loss": -10.276145935058594, "global_step": 139515, "epoch": 830} {"train_loss": -10.450773239135742, "global_step": 139516, "epoch": 830} {"train_loss": -10.463541030883789, "global_step": 139517, "epoch": 830} {"train_loss": -10.333765029907227, "global_step": 139518, "epoch": 830} {"train_loss": -10.879780769348145, "global_step": 139519, "epoch": 830} {"train_loss": -10.525636672973633, "global_step": 139520, "epoch": 830} {"train_loss": -10.505142211914062, "global_step": 139521, "epoch": 830} {"train_loss": -10.684431076049805, "global_step": 139522, "epoch": 830} {"train_loss": -9.876399993896484, "global_step": 139523, "epoch": 830} {"train_loss": -10.321016311645508, "global_step": 139524, "epoch": 830} {"train_loss": -9.690014839172363, "global_step": 139525, "epoch": 830} {"train_loss": -10.402148246765137, "global_step": 139526, "epoch": 830} {"train_loss": -10.148979187011719, "global_step": 139527, "epoch": 830} {"train_loss": -10.506726264953613, "global_step": 139528, "epoch": 830} {"train_loss": -10.332220077514648, "global_step": 139529, "epoch": 830} {"train_loss": -10.40280532836914, "global_step": 139530, "epoch": 830} {"train_loss": -10.214722633361816, "global_step": 139531, "epoch": 830} {"train_loss": -10.094501495361328, "global_step": 139532, "epoch": 830} {"train_loss": -10.659082412719727, "global_step": 139533, "epoch": 830} {"train_loss": -10.460516929626465, "global_step": 139534, "epoch": 830} {"train_loss": -10.633838653564453, "global_step": 139535, "epoch": 830} {"train_loss": -10.290159225463867, "global_step": 139536, "epoch": 830} {"train_loss": -10.485668182373047, "global_step": 139537, "epoch": 830} {"train_loss": -10.391678810119629, "global_step": 139538, "epoch": 830} {"train_loss": -10.390154838562012, "global_step": 139539, "epoch": 830} {"train_loss": -10.092323303222656, "global_step": 139540, "epoch": 830} {"train_loss": -10.51297378540039, "global_step": 139541, "epoch": 830} {"train_loss": -10.083696365356445, "global_step": 139542, "epoch": 830} {"train_loss": -10.434337615966797, "global_step": 139543, "epoch": 830} {"train_loss": -10.533262252807617, "global_step": 139544, "epoch": 830} {"train_loss": -10.304313659667969, "global_step": 139545, "epoch": 830} {"train_loss": -10.699287414550781, "global_step": 139546, "epoch": 830} {"train_loss": -10.324005126953125, "global_step": 139547, "epoch": 830} {"train_loss": -10.489295959472656, "global_step": 139548, "epoch": 830} {"train_loss": -10.505388259887695, "global_step": 139549, "epoch": 830} {"train_loss": -10.754242897033691, "global_step": 139550, "epoch": 830} {"train_loss": -10.373025894165039, "global_step": 139551, "epoch": 830} {"train_loss": -10.771169662475586, "global_step": 139552, "epoch": 830} {"train_loss": -10.580758094787598, "global_step": 139553, "epoch": 830} {"train_loss": -10.466386795043945, "global_step": 139554, "epoch": 830} {"train_loss": -10.260050773620605, "global_step": 139555, "epoch": 830} {"train_loss": -10.609136581420898, "global_step": 139556, "epoch": 830} {"train_loss": -10.31106948852539, "global_step": 139557, "epoch": 830} {"train_loss": -10.40209674835205, "global_step": 139558, "epoch": 830} {"train_loss": -10.34815788269043, "global_step": 139559, "epoch": 830} {"train_loss": -10.314717292785645, "global_step": 139560, "epoch": 830} {"train_loss": -10.4759521484375, "global_step": 139561, "epoch": 830} {"train_loss": -10.16321086883545, "global_step": 139562, "epoch": 830} {"train_loss": -10.658723831176758, "global_step": 139563, "epoch": 830} {"train_loss": -10.416498184204102, "global_step": 139564, "epoch": 830} {"train_loss": -10.524028778076172, "global_step": 139565, "epoch": 830} {"train_loss": -10.497903823852539, "global_step": 139566, "epoch": 830} {"train_loss": -10.385823249816895, "global_step": 139567, "epoch": 830} {"train_loss": -10.616748809814453, "global_step": 139568, "epoch": 830} {"train_loss": -10.347505569458008, "global_step": 139569, "epoch": 830} {"train_loss": -10.282064437866211, "global_step": 139570, "epoch": 830} {"train_loss": -9.638167381286621, "global_step": 139571, "epoch": 830} {"train_loss": -10.180719375610352, "global_step": 139572, "epoch": 830} {"train_loss": -9.828771591186523, "global_step": 139573, "epoch": 830} {"train_loss": -9.827098846435547, "global_step": 139574, "epoch": 830} {"train_loss": -10.803942680358887, "global_step": 139575, "epoch": 830} {"train_loss": -10.104585647583008, "global_step": 139576, "epoch": 830} {"train_loss": -10.597818374633789, "global_step": 139577, "epoch": 830} {"train_loss": -10.066696166992188, "global_step": 139578, "epoch": 830} {"train_loss": -10.711257934570312, "global_step": 139579, "epoch": 830} {"train_loss": -10.334588050842285, "global_step": 139580, "epoch": 830} {"train_loss": -10.611940383911133, "global_step": 139581, "epoch": 830} {"train_loss": -10.627238273620605, "global_step": 139582, "epoch": 830} {"train_loss": -10.468588829040527, "global_step": 139583, "epoch": 830} {"train_loss": -10.609912872314453, "global_step": 139584, "epoch": 830} {"train_loss": -10.744181632995605, "global_step": 139585, "epoch": 830} {"train_loss": -10.473559379577637, "global_step": 139586, "epoch": 830} {"train_loss": -10.66372299194336, "global_step": 139587, "epoch": 830} {"train_loss": -10.304357528686523, "global_step": 139588, "epoch": 830} {"train_loss": -10.72433090209961, "global_step": 139589, "epoch": 830} {"train_loss": -10.38978385925293, "global_step": 139590, "epoch": 830} {"train_loss": -10.712182998657227, "global_step": 139591, "epoch": 830} {"train_loss": -10.606821060180664, "global_step": 139592, "epoch": 830} {"train_loss": -10.186978340148926, "global_step": 139593, "epoch": 830} {"train_loss": -10.621326446533203, "global_step": 139594, "epoch": 830} {"train_loss": -10.24747371673584, "global_step": 139595, "epoch": 830} {"train_loss": -10.748245239257812, "global_step": 139596, "epoch": 830} {"train_loss": -10.494966506958008, "global_step": 139597, "epoch": 830} {"train_loss": -10.853796005249023, "global_step": 139598, "epoch": 830} {"train_loss": -10.686019897460938, "global_step": 139599, "epoch": 830} {"train_loss": -10.64775276184082, "global_step": 139600, "epoch": 830} {"train_loss": -10.401909828186035, "global_step": 139601, "epoch": 830} {"train_loss": -10.724874496459961, "global_step": 139602, "epoch": 830} {"train_loss": -10.65727710723877, "global_step": 139603, "epoch": 830} {"train_loss": -10.122998237609863, "global_step": 139604, "epoch": 830} {"train_loss": -10.644729614257812, "global_step": 139605, "epoch": 830} {"train_loss": -10.438833236694336, "global_step": 139606, "epoch": 830} {"train_loss": -10.416687573705401, "global_step": 139607, "epoch": 830, "val_loss": 226137.0, "train_action_mse_error": 1.64597487449646} {"train_loss": -10.515100479125977, "global_step": 139608, "epoch": 831} {"train_loss": -10.465948104858398, "global_step": 139609, "epoch": 831} {"train_loss": -10.620311737060547, "global_step": 139610, "epoch": 831} {"train_loss": -10.566542625427246, "global_step": 139611, "epoch": 831} {"train_loss": -10.492098808288574, "global_step": 139612, "epoch": 831} {"train_loss": -10.65062427520752, "global_step": 139613, "epoch": 831} {"train_loss": -10.403696060180664, "global_step": 139614, "epoch": 831} {"train_loss": -10.418705940246582, "global_step": 139615, "epoch": 831} {"train_loss": -10.466476440429688, "global_step": 139616, "epoch": 831} {"train_loss": -10.147655487060547, "global_step": 139617, "epoch": 831} {"train_loss": -10.408674240112305, "global_step": 139618, "epoch": 831} {"train_loss": -10.480697631835938, "global_step": 139619, "epoch": 831} {"train_loss": -10.441309928894043, "global_step": 139620, "epoch": 831} {"train_loss": -10.427274703979492, "global_step": 139621, "epoch": 831} {"train_loss": -10.265787124633789, "global_step": 139622, "epoch": 831} {"train_loss": -10.468262672424316, "global_step": 139623, "epoch": 831} {"train_loss": -10.394624710083008, "global_step": 139624, "epoch": 831} {"train_loss": -10.713756561279297, "global_step": 139625, "epoch": 831} {"train_loss": -10.4381685256958, "global_step": 139626, "epoch": 831} {"train_loss": -10.835362434387207, "global_step": 139627, "epoch": 831} {"train_loss": -10.601524353027344, "global_step": 139628, "epoch": 831} {"train_loss": -10.937877655029297, "global_step": 139629, "epoch": 831} {"train_loss": -10.524494171142578, "global_step": 139630, "epoch": 831} {"train_loss": -10.687421798706055, "global_step": 139631, "epoch": 831} {"train_loss": -10.537967681884766, "global_step": 139632, "epoch": 831} {"train_loss": -10.4129638671875, "global_step": 139633, "epoch": 831} {"train_loss": -10.80544376373291, "global_step": 139634, "epoch": 831} {"train_loss": -10.393548011779785, "global_step": 139635, "epoch": 831} {"train_loss": -10.728422164916992, "global_step": 139636, "epoch": 831} {"train_loss": -10.514429092407227, "global_step": 139637, "epoch": 831} {"train_loss": -10.433387756347656, "global_step": 139638, "epoch": 831} {"train_loss": -10.78977108001709, "global_step": 139639, "epoch": 831} {"train_loss": -10.588991165161133, "global_step": 139640, "epoch": 831} {"train_loss": -10.67452335357666, "global_step": 139641, "epoch": 831} {"train_loss": -10.837745666503906, "global_step": 139642, "epoch": 831} {"train_loss": -10.747505187988281, "global_step": 139643, "epoch": 831} {"train_loss": -10.803254127502441, "global_step": 139644, "epoch": 831} {"train_loss": -10.871500015258789, "global_step": 139645, "epoch": 831} {"train_loss": -10.745672225952148, "global_step": 139646, "epoch": 831} {"train_loss": -10.80814266204834, "global_step": 139647, "epoch": 831} {"train_loss": -10.591707229614258, "global_step": 139648, "epoch": 831} {"train_loss": -10.669525146484375, "global_step": 139649, "epoch": 831} {"train_loss": -11.04133129119873, "global_step": 139650, "epoch": 831} {"train_loss": -10.824249267578125, "global_step": 139651, "epoch": 831} {"train_loss": -10.910816192626953, "global_step": 139652, "epoch": 831} {"train_loss": -10.836406707763672, "global_step": 139653, "epoch": 831} {"train_loss": -10.660099029541016, "global_step": 139654, "epoch": 831} {"train_loss": -10.560748100280762, "global_step": 139655, "epoch": 831} {"train_loss": -10.461326599121094, "global_step": 139656, "epoch": 831} {"train_loss": -10.49496841430664, "global_step": 139657, "epoch": 831} {"train_loss": -10.292868614196777, "global_step": 139658, "epoch": 831} {"train_loss": -10.796926498413086, "global_step": 139659, "epoch": 831} {"train_loss": -10.44303035736084, "global_step": 139660, "epoch": 831} {"train_loss": -10.388069152832031, "global_step": 139661, "epoch": 831} {"train_loss": -10.789714813232422, "global_step": 139662, "epoch": 831} {"train_loss": -10.708982467651367, "global_step": 139663, "epoch": 831} {"train_loss": -10.584539413452148, "global_step": 139664, "epoch": 831} {"train_loss": -10.58566951751709, "global_step": 139665, "epoch": 831} {"train_loss": -10.729060173034668, "global_step": 139666, "epoch": 831} {"train_loss": -10.339605331420898, "global_step": 139667, "epoch": 831} {"train_loss": -10.372885704040527, "global_step": 139668, "epoch": 831} {"train_loss": -10.531137466430664, "global_step": 139669, "epoch": 831} {"train_loss": -10.31732177734375, "global_step": 139670, "epoch": 831} {"train_loss": -10.679620742797852, "global_step": 139671, "epoch": 831} {"train_loss": -10.560979843139648, "global_step": 139672, "epoch": 831} {"train_loss": -10.794672966003418, "global_step": 139673, "epoch": 831} {"train_loss": -10.520212173461914, "global_step": 139674, "epoch": 831} {"train_loss": -10.401008605957031, "global_step": 139675, "epoch": 831} {"train_loss": -10.379032135009766, "global_step": 139676, "epoch": 831} {"train_loss": -10.369701385498047, "global_step": 139677, "epoch": 831} {"train_loss": -9.96622371673584, "global_step": 139678, "epoch": 831} {"train_loss": -10.327759742736816, "global_step": 139679, "epoch": 831} {"train_loss": -10.65030288696289, "global_step": 139680, "epoch": 831} {"train_loss": -10.70536994934082, "global_step": 139681, "epoch": 831} {"train_loss": -10.485008239746094, "global_step": 139682, "epoch": 831} {"train_loss": -10.671754837036133, "global_step": 139683, "epoch": 831} {"train_loss": -10.687390327453613, "global_step": 139684, "epoch": 831} {"train_loss": -10.34167194366455, "global_step": 139685, "epoch": 831} {"train_loss": -10.35374641418457, "global_step": 139686, "epoch": 831} {"train_loss": -10.481758117675781, "global_step": 139687, "epoch": 831} {"train_loss": -10.625995635986328, "global_step": 139688, "epoch": 831} {"train_loss": -10.547372817993164, "global_step": 139689, "epoch": 831} {"train_loss": -10.386838912963867, "global_step": 139690, "epoch": 831} {"train_loss": -10.590489387512207, "global_step": 139691, "epoch": 831} {"train_loss": -10.34160327911377, "global_step": 139692, "epoch": 831} {"train_loss": -10.451339721679688, "global_step": 139693, "epoch": 831} {"train_loss": -10.26971435546875, "global_step": 139694, "epoch": 831} {"train_loss": -10.35946273803711, "global_step": 139695, "epoch": 831} {"train_loss": -10.548810958862305, "global_step": 139696, "epoch": 831} {"train_loss": -10.357644081115723, "global_step": 139697, "epoch": 831} {"train_loss": -10.319242477416992, "global_step": 139698, "epoch": 831} {"train_loss": -10.277791023254395, "global_step": 139699, "epoch": 831} {"train_loss": -10.299933433532715, "global_step": 139700, "epoch": 831} {"train_loss": -10.479552268981934, "global_step": 139701, "epoch": 831} {"train_loss": -10.289176940917969, "global_step": 139702, "epoch": 831} {"train_loss": -10.683609008789062, "global_step": 139703, "epoch": 831} {"train_loss": -10.489568710327148, "global_step": 139704, "epoch": 831} {"train_loss": -10.577346801757812, "global_step": 139705, "epoch": 831} {"train_loss": -10.519800186157227, "global_step": 139706, "epoch": 831} {"train_loss": -10.489110946655273, "global_step": 139707, "epoch": 831} {"train_loss": -10.763293266296387, "global_step": 139708, "epoch": 831} {"train_loss": -10.516977310180664, "global_step": 139709, "epoch": 831} {"train_loss": -10.475639343261719, "global_step": 139710, "epoch": 831} {"train_loss": -10.536214828491211, "global_step": 139711, "epoch": 831} {"train_loss": -10.746843338012695, "global_step": 139712, "epoch": 831} {"train_loss": -10.861313819885254, "global_step": 139713, "epoch": 831} {"train_loss": -10.705825805664062, "global_step": 139714, "epoch": 831} {"train_loss": -10.616146087646484, "global_step": 139715, "epoch": 831} {"train_loss": -10.900132179260254, "global_step": 139716, "epoch": 831} {"train_loss": -10.666515350341797, "global_step": 139717, "epoch": 831} {"train_loss": -10.569474220275879, "global_step": 139718, "epoch": 831} {"train_loss": -10.699724197387695, "global_step": 139719, "epoch": 831} {"train_loss": -10.3631591796875, "global_step": 139720, "epoch": 831} {"train_loss": -10.656251907348633, "global_step": 139721, "epoch": 831} {"train_loss": -10.704490661621094, "global_step": 139722, "epoch": 831} {"train_loss": -10.727540016174316, "global_step": 139723, "epoch": 831} {"train_loss": -10.928214073181152, "global_step": 139724, "epoch": 831} {"train_loss": -10.590873718261719, "global_step": 139725, "epoch": 831} {"train_loss": -10.779300689697266, "global_step": 139726, "epoch": 831} {"train_loss": -10.787763595581055, "global_step": 139727, "epoch": 831} {"train_loss": -10.76692008972168, "global_step": 139728, "epoch": 831} {"train_loss": -10.739694595336914, "global_step": 139729, "epoch": 831} {"train_loss": -10.576879501342773, "global_step": 139730, "epoch": 831} {"train_loss": -10.747127532958984, "global_step": 139731, "epoch": 831} {"train_loss": -10.228143692016602, "global_step": 139732, "epoch": 831} {"train_loss": -10.587873458862305, "global_step": 139733, "epoch": 831} {"train_loss": -10.709261894226074, "global_step": 139734, "epoch": 831} {"train_loss": -10.703424453735352, "global_step": 139735, "epoch": 831} {"train_loss": -10.668937683105469, "global_step": 139736, "epoch": 831} {"train_loss": -10.53300666809082, "global_step": 139737, "epoch": 831} {"train_loss": -10.684542655944824, "global_step": 139738, "epoch": 831} {"train_loss": -10.854997634887695, "global_step": 139739, "epoch": 831} {"train_loss": -10.69149398803711, "global_step": 139740, "epoch": 831} {"train_loss": -10.706661224365234, "global_step": 139741, "epoch": 831} {"train_loss": -10.778951644897461, "global_step": 139742, "epoch": 831} {"train_loss": -10.487550735473633, "global_step": 139743, "epoch": 831} {"train_loss": -10.428985595703125, "global_step": 139744, "epoch": 831} {"train_loss": -10.56979751586914, "global_step": 139745, "epoch": 831} {"train_loss": -10.159578323364258, "global_step": 139746, "epoch": 831} {"train_loss": -9.603561401367188, "global_step": 139747, "epoch": 831} {"train_loss": -10.121570587158203, "global_step": 139748, "epoch": 831} {"train_loss": -10.27099609375, "global_step": 139749, "epoch": 831} {"train_loss": -10.084388732910156, "global_step": 139750, "epoch": 831} {"train_loss": -10.546506881713867, "global_step": 139751, "epoch": 831} {"train_loss": -10.436241149902344, "global_step": 139752, "epoch": 831} {"train_loss": -10.313697814941406, "global_step": 139753, "epoch": 831} {"train_loss": -10.589889526367188, "global_step": 139754, "epoch": 831} {"train_loss": -10.255218505859375, "global_step": 139755, "epoch": 831} {"train_loss": -10.557343482971191, "global_step": 139756, "epoch": 831} {"train_loss": -10.407613754272461, "global_step": 139757, "epoch": 831} {"train_loss": -9.613582611083984, "global_step": 139758, "epoch": 831} {"train_loss": -10.498395919799805, "global_step": 139759, "epoch": 831} {"train_loss": -10.005792617797852, "global_step": 139760, "epoch": 831} {"train_loss": -10.083786964416504, "global_step": 139761, "epoch": 831} {"train_loss": -10.585371971130371, "global_step": 139762, "epoch": 831} {"train_loss": -10.406213760375977, "global_step": 139763, "epoch": 831} {"train_loss": -10.635478019714355, "global_step": 139764, "epoch": 831} {"train_loss": -10.359063148498535, "global_step": 139765, "epoch": 831} {"train_loss": -10.348067283630371, "global_step": 139766, "epoch": 831} {"train_loss": -10.526958465576172, "global_step": 139767, "epoch": 831} {"train_loss": -10.391902923583984, "global_step": 139768, "epoch": 831} {"train_loss": -10.63129711151123, "global_step": 139769, "epoch": 831} {"train_loss": -10.45112419128418, "global_step": 139770, "epoch": 831} {"train_loss": -10.438985824584961, "global_step": 139771, "epoch": 831} {"train_loss": -10.431402206420898, "global_step": 139772, "epoch": 831} {"train_loss": -10.65988826751709, "global_step": 139773, "epoch": 831} {"train_loss": -10.722271919250488, "global_step": 139774, "epoch": 831} {"train_loss": -10.53592262381599, "global_step": 139775, "epoch": 831, "val_loss": 224660.921875} {"train_loss": -10.694540977478027, "global_step": 139776, "epoch": 832} {"train_loss": -10.874551773071289, "global_step": 139777, "epoch": 832} {"train_loss": -10.60902214050293, "global_step": 139778, "epoch": 832} {"train_loss": -10.52015495300293, "global_step": 139779, "epoch": 832} {"train_loss": -10.72782039642334, "global_step": 139780, "epoch": 832} {"train_loss": -10.499798774719238, "global_step": 139781, "epoch": 832} {"train_loss": -10.238967895507812, "global_step": 139782, "epoch": 832} {"train_loss": -10.56031608581543, "global_step": 139783, "epoch": 832} {"train_loss": -10.71666431427002, "global_step": 139784, "epoch": 832} {"train_loss": -10.63857650756836, "global_step": 139785, "epoch": 832} {"train_loss": -10.656896591186523, "global_step": 139786, "epoch": 832} {"train_loss": -10.39533519744873, "global_step": 139787, "epoch": 832} {"train_loss": -10.732074737548828, "global_step": 139788, "epoch": 832} {"train_loss": -10.501104354858398, "global_step": 139789, "epoch": 832} {"train_loss": -10.411463737487793, "global_step": 139790, "epoch": 832} {"train_loss": -10.74714469909668, "global_step": 139791, "epoch": 832} {"train_loss": -10.562593460083008, "global_step": 139792, "epoch": 832} {"train_loss": -10.869524002075195, "global_step": 139793, "epoch": 832} {"train_loss": -10.086782455444336, "global_step": 139794, "epoch": 832} {"train_loss": -10.245132446289062, "global_step": 139795, "epoch": 832} {"train_loss": -10.457239151000977, "global_step": 139796, "epoch": 832} {"train_loss": -10.116401672363281, "global_step": 139797, "epoch": 832} {"train_loss": -10.3098783493042, "global_step": 139798, "epoch": 832} {"train_loss": -10.62122631072998, "global_step": 139799, "epoch": 832} {"train_loss": -10.2883882522583, "global_step": 139800, "epoch": 832} {"train_loss": -10.733238220214844, "global_step": 139801, "epoch": 832} {"train_loss": -9.726629257202148, "global_step": 139802, "epoch": 832} {"train_loss": -10.627347946166992, "global_step": 139803, "epoch": 832} {"train_loss": -9.893157958984375, "global_step": 139804, "epoch": 832} {"train_loss": -10.033744812011719, "global_step": 139805, "epoch": 832} {"train_loss": -10.28994369506836, "global_step": 139806, "epoch": 832} {"train_loss": -9.730669975280762, "global_step": 139807, "epoch": 832} {"train_loss": -10.465011596679688, "global_step": 139808, "epoch": 832} {"train_loss": -9.65671157836914, "global_step": 139809, "epoch": 832} {"train_loss": -9.9967041015625, "global_step": 139810, "epoch": 832} {"train_loss": -9.470585823059082, "global_step": 139811, "epoch": 832} {"train_loss": -9.937089920043945, "global_step": 139812, "epoch": 832} {"train_loss": -8.861302375793457, "global_step": 139813, "epoch": 832} {"train_loss": -9.993918418884277, "global_step": 139814, "epoch": 832} {"train_loss": -9.54037857055664, "global_step": 139815, "epoch": 832} {"train_loss": -10.208430290222168, "global_step": 139816, "epoch": 832} {"train_loss": -9.872627258300781, "global_step": 139817, "epoch": 832} {"train_loss": -10.083444595336914, "global_step": 139818, "epoch": 832} {"train_loss": -10.127567291259766, "global_step": 139819, "epoch": 832} {"train_loss": -9.674376487731934, "global_step": 139820, "epoch": 832} {"train_loss": -10.345136642456055, "global_step": 139821, "epoch": 832} {"train_loss": -10.259819030761719, "global_step": 139822, "epoch": 832} {"train_loss": -10.188825607299805, "global_step": 139823, "epoch": 832} {"train_loss": -10.292216300964355, "global_step": 139824, "epoch": 832} {"train_loss": -10.400806427001953, "global_step": 139825, "epoch": 832} {"train_loss": -10.215087890625, "global_step": 139826, "epoch": 832} {"train_loss": -10.379364013671875, "global_step": 139827, "epoch": 832} {"train_loss": -10.495981216430664, "global_step": 139828, "epoch": 832} {"train_loss": -10.304154396057129, "global_step": 139829, "epoch": 832} {"train_loss": -10.547619819641113, "global_step": 139830, "epoch": 832} {"train_loss": -10.499181747436523, "global_step": 139831, "epoch": 832} {"train_loss": -10.526861190795898, "global_step": 139832, "epoch": 832} {"train_loss": -10.38105583190918, "global_step": 139833, "epoch": 832} {"train_loss": -10.480049133300781, "global_step": 139834, "epoch": 832} {"train_loss": -10.42199993133545, "global_step": 139835, "epoch": 832} {"train_loss": -10.637151718139648, "global_step": 139836, "epoch": 832} {"train_loss": -10.62533187866211, "global_step": 139837, "epoch": 832} {"train_loss": -10.406620025634766, "global_step": 139838, "epoch": 832} {"train_loss": -10.40636920928955, "global_step": 139839, "epoch": 832} {"train_loss": -10.43671703338623, "global_step": 139840, "epoch": 832} {"train_loss": -10.529534339904785, "global_step": 139841, "epoch": 832} {"train_loss": -10.502948760986328, "global_step": 139842, "epoch": 832} {"train_loss": -10.543628692626953, "global_step": 139843, "epoch": 832} {"train_loss": -10.42178726196289, "global_step": 139844, "epoch": 832} {"train_loss": -10.700053215026855, "global_step": 139845, "epoch": 832} {"train_loss": -10.778755187988281, "global_step": 139846, "epoch": 832} {"train_loss": -10.200700759887695, "global_step": 139847, "epoch": 832} {"train_loss": -10.63166618347168, "global_step": 139848, "epoch": 832} {"train_loss": -10.469667434692383, "global_step": 139849, "epoch": 832} {"train_loss": -10.596857070922852, "global_step": 139850, "epoch": 832} {"train_loss": -10.270593643188477, "global_step": 139851, "epoch": 832} {"train_loss": -10.84799861907959, "global_step": 139852, "epoch": 832} {"train_loss": -10.283388137817383, "global_step": 139853, "epoch": 832} {"train_loss": -10.717585563659668, "global_step": 139854, "epoch": 832} {"train_loss": -10.577564239501953, "global_step": 139855, "epoch": 832} {"train_loss": -10.746092796325684, "global_step": 139856, "epoch": 832} {"train_loss": -10.584595680236816, "global_step": 139857, "epoch": 832} {"train_loss": -10.116744995117188, "global_step": 139858, "epoch": 832} {"train_loss": -10.425509452819824, "global_step": 139859, "epoch": 832} {"train_loss": -10.471538543701172, "global_step": 139860, "epoch": 832} {"train_loss": -10.255699157714844, "global_step": 139861, "epoch": 832} {"train_loss": -10.247190475463867, "global_step": 139862, "epoch": 832} {"train_loss": -10.030624389648438, "global_step": 139863, "epoch": 832} {"train_loss": -10.735787391662598, "global_step": 139864, "epoch": 832} {"train_loss": -9.91372299194336, "global_step": 139865, "epoch": 832} {"train_loss": -9.976310729980469, "global_step": 139866, "epoch": 832} {"train_loss": -10.57680892944336, "global_step": 139867, "epoch": 832} {"train_loss": -9.796892166137695, "global_step": 139868, "epoch": 832} {"train_loss": -10.44739055633545, "global_step": 139869, "epoch": 832} {"train_loss": -10.252557754516602, "global_step": 139870, "epoch": 832} {"train_loss": -10.530153274536133, "global_step": 139871, "epoch": 832} {"train_loss": -10.360033988952637, "global_step": 139872, "epoch": 832} {"train_loss": -10.545785903930664, "global_step": 139873, "epoch": 832} {"train_loss": -10.482583045959473, "global_step": 139874, "epoch": 832} {"train_loss": -10.169707298278809, "global_step": 139875, "epoch": 832} {"train_loss": -10.785395622253418, "global_step": 139876, "epoch": 832} {"train_loss": -10.239547729492188, "global_step": 139877, "epoch": 832} {"train_loss": -10.74526596069336, "global_step": 139878, "epoch": 832} {"train_loss": -10.369461059570312, "global_step": 139879, "epoch": 832} {"train_loss": -10.661591529846191, "global_step": 139880, "epoch": 832} {"train_loss": -10.429208755493164, "global_step": 139881, "epoch": 832} {"train_loss": -10.768475532531738, "global_step": 139882, "epoch": 832} {"train_loss": -10.566394805908203, "global_step": 139883, "epoch": 832} {"train_loss": -10.498934745788574, "global_step": 139884, "epoch": 832} {"train_loss": -10.54127311706543, "global_step": 139885, "epoch": 832} {"train_loss": -10.856161117553711, "global_step": 139886, "epoch": 832} {"train_loss": -10.246919631958008, "global_step": 139887, "epoch": 832} {"train_loss": -10.583505630493164, "global_step": 139888, "epoch": 832} {"train_loss": -10.736272811889648, "global_step": 139889, "epoch": 832} {"train_loss": -10.730188369750977, "global_step": 139890, "epoch": 832} {"train_loss": -10.81924057006836, "global_step": 139891, "epoch": 832} {"train_loss": -10.557247161865234, "global_step": 139892, "epoch": 832} {"train_loss": -10.783856391906738, "global_step": 139893, "epoch": 832} {"train_loss": -10.752079010009766, "global_step": 139894, "epoch": 832} {"train_loss": -10.976972579956055, "global_step": 139895, "epoch": 832} {"train_loss": -10.624658584594727, "global_step": 139896, "epoch": 832} {"train_loss": -10.703168869018555, "global_step": 139897, "epoch": 832} {"train_loss": -10.705852508544922, "global_step": 139898, "epoch": 832} {"train_loss": -10.673535346984863, "global_step": 139899, "epoch": 832} {"train_loss": -10.522451400756836, "global_step": 139900, "epoch": 832} {"train_loss": -10.351095199584961, "global_step": 139901, "epoch": 832} {"train_loss": -10.379043579101562, "global_step": 139902, "epoch": 832} {"train_loss": -10.46709156036377, "global_step": 139903, "epoch": 832} {"train_loss": -10.82850170135498, "global_step": 139904, "epoch": 832} {"train_loss": -10.941231727600098, "global_step": 139905, "epoch": 832} {"train_loss": -10.774067878723145, "global_step": 139906, "epoch": 832} {"train_loss": -10.830066680908203, "global_step": 139907, "epoch": 832} {"train_loss": -10.561487197875977, "global_step": 139908, "epoch": 832} {"train_loss": -10.70539665222168, "global_step": 139909, "epoch": 832} {"train_loss": -10.639476776123047, "global_step": 139910, "epoch": 832} {"train_loss": -10.494791984558105, "global_step": 139911, "epoch": 832} {"train_loss": -10.6088285446167, "global_step": 139912, "epoch": 832} {"train_loss": -10.343074798583984, "global_step": 139913, "epoch": 832} {"train_loss": -10.512472152709961, "global_step": 139914, "epoch": 832} {"train_loss": -10.377819061279297, "global_step": 139915, "epoch": 832} {"train_loss": -10.299554824829102, "global_step": 139916, "epoch": 832} {"train_loss": -10.22525691986084, "global_step": 139917, "epoch": 832} {"train_loss": -10.632840156555176, "global_step": 139918, "epoch": 832} {"train_loss": -10.425875663757324, "global_step": 139919, "epoch": 832} {"train_loss": -10.788569450378418, "global_step": 139920, "epoch": 832} {"train_loss": -10.655014038085938, "global_step": 139921, "epoch": 832} {"train_loss": -10.644367218017578, "global_step": 139922, "epoch": 832} {"train_loss": -10.417369842529297, "global_step": 139923, "epoch": 832} {"train_loss": -10.697135925292969, "global_step": 139924, "epoch": 832} {"train_loss": -10.88255500793457, "global_step": 139925, "epoch": 832} {"train_loss": -10.990302085876465, "global_step": 139926, "epoch": 832} {"train_loss": -10.53127670288086, "global_step": 139927, "epoch": 832} {"train_loss": -10.400177001953125, "global_step": 139928, "epoch": 832} {"train_loss": -10.730533599853516, "global_step": 139929, "epoch": 832} {"train_loss": -10.075490951538086, "global_step": 139930, "epoch": 832} {"train_loss": -10.581774711608887, "global_step": 139931, "epoch": 832} {"train_loss": -10.533287048339844, "global_step": 139932, "epoch": 832} {"train_loss": -9.851423263549805, "global_step": 139933, "epoch": 832} {"train_loss": -10.763710975646973, "global_step": 139934, "epoch": 832} {"train_loss": -10.346521377563477, "global_step": 139935, "epoch": 832} {"train_loss": -10.549812316894531, "global_step": 139936, "epoch": 832} {"train_loss": -10.481683731079102, "global_step": 139937, "epoch": 832} {"train_loss": -10.449065208435059, "global_step": 139938, "epoch": 832} {"train_loss": -10.43341064453125, "global_step": 139939, "epoch": 832} {"train_loss": -10.37431526184082, "global_step": 139940, "epoch": 832} {"train_loss": -10.171263694763184, "global_step": 139941, "epoch": 832} {"train_loss": -10.850858688354492, "global_step": 139942, "epoch": 832} {"train_loss": -10.439149220784506, "global_step": 139943, "epoch": 832, "val_loss": 225662.859375} {"train_loss": -10.183723449707031, "global_step": 139944, "epoch": 833} {"train_loss": -10.288551330566406, "global_step": 139945, "epoch": 833} {"train_loss": -9.880803108215332, "global_step": 139946, "epoch": 833} {"train_loss": -10.080263137817383, "global_step": 139947, "epoch": 833} {"train_loss": -10.425458908081055, "global_step": 139948, "epoch": 833} {"train_loss": -10.147476196289062, "global_step": 139949, "epoch": 833} {"train_loss": -10.484724044799805, "global_step": 139950, "epoch": 833} {"train_loss": -9.863504409790039, "global_step": 139951, "epoch": 833} {"train_loss": -10.460831642150879, "global_step": 139952, "epoch": 833} {"train_loss": -10.114757537841797, "global_step": 139953, "epoch": 833} {"train_loss": -10.412240028381348, "global_step": 139954, "epoch": 833} {"train_loss": -10.396896362304688, "global_step": 139955, "epoch": 833} {"train_loss": -10.556009292602539, "global_step": 139956, "epoch": 833} {"train_loss": -10.313982009887695, "global_step": 139957, "epoch": 833} {"train_loss": -10.45218276977539, "global_step": 139958, "epoch": 833} {"train_loss": -9.901044845581055, "global_step": 139959, "epoch": 833} {"train_loss": -10.630041122436523, "global_step": 139960, "epoch": 833} {"train_loss": -9.982237815856934, "global_step": 139961, "epoch": 833} {"train_loss": -10.349204063415527, "global_step": 139962, "epoch": 833} {"train_loss": -10.159297943115234, "global_step": 139963, "epoch": 833} {"train_loss": -10.026043891906738, "global_step": 139964, "epoch": 833} {"train_loss": -10.297737121582031, "global_step": 139965, "epoch": 833} {"train_loss": -10.635549545288086, "global_step": 139966, "epoch": 833} {"train_loss": -10.178400039672852, "global_step": 139967, "epoch": 833} {"train_loss": -10.479447364807129, "global_step": 139968, "epoch": 833} {"train_loss": -10.356104850769043, "global_step": 139969, "epoch": 833} {"train_loss": -10.143985748291016, "global_step": 139970, "epoch": 833} {"train_loss": -10.656826972961426, "global_step": 139971, "epoch": 833} {"train_loss": -10.32417106628418, "global_step": 139972, "epoch": 833} {"train_loss": -10.699633598327637, "global_step": 139973, "epoch": 833} {"train_loss": -10.371126174926758, "global_step": 139974, "epoch": 833} {"train_loss": -10.754657745361328, "global_step": 139975, "epoch": 833} {"train_loss": -10.606335639953613, "global_step": 139976, "epoch": 833} {"train_loss": -10.59127426147461, "global_step": 139977, "epoch": 833} {"train_loss": -10.686426162719727, "global_step": 139978, "epoch": 833} {"train_loss": -10.606193542480469, "global_step": 139979, "epoch": 833} {"train_loss": -10.547708511352539, "global_step": 139980, "epoch": 833} {"train_loss": -10.835090637207031, "global_step": 139981, "epoch": 833} {"train_loss": -10.66527271270752, "global_step": 139982, "epoch": 833} {"train_loss": -10.805142402648926, "global_step": 139983, "epoch": 833} {"train_loss": -10.854287147521973, "global_step": 139984, "epoch": 833} {"train_loss": -10.692718505859375, "global_step": 139985, "epoch": 833} {"train_loss": -10.81268310546875, "global_step": 139986, "epoch": 833} {"train_loss": -10.547886848449707, "global_step": 139987, "epoch": 833} {"train_loss": -10.939526557922363, "global_step": 139988, "epoch": 833} {"train_loss": -10.923982620239258, "global_step": 139989, "epoch": 833} {"train_loss": -10.619558334350586, "global_step": 139990, "epoch": 833} {"train_loss": -10.891670227050781, "global_step": 139991, "epoch": 833} {"train_loss": -10.59286880493164, "global_step": 139992, "epoch": 833} {"train_loss": -10.606109619140625, "global_step": 139993, "epoch": 833} {"train_loss": -10.277039527893066, "global_step": 139994, "epoch": 833} {"train_loss": -10.821069717407227, "global_step": 139995, "epoch": 833} {"train_loss": -10.214065551757812, "global_step": 139996, "epoch": 833} {"train_loss": -10.009405136108398, "global_step": 139997, "epoch": 833} {"train_loss": -10.57468032836914, "global_step": 139998, "epoch": 833} {"train_loss": -10.585792541503906, "global_step": 139999, "epoch": 833} {"train_loss": -10.476682662963867, "global_step": 140000, "epoch": 833} {"train_loss": -10.534599304199219, "global_step": 140001, "epoch": 833} {"train_loss": -10.35675048828125, "global_step": 140002, "epoch": 833} {"train_loss": -10.350890159606934, "global_step": 140003, "epoch": 833} {"train_loss": -10.252565383911133, "global_step": 140004, "epoch": 833} {"train_loss": -10.847230911254883, "global_step": 140005, "epoch": 833} {"train_loss": -10.080927848815918, "global_step": 140006, "epoch": 833} {"train_loss": -10.926815032958984, "global_step": 140007, "epoch": 833} {"train_loss": -10.418938636779785, "global_step": 140008, "epoch": 833} {"train_loss": -10.821637153625488, "global_step": 140009, "epoch": 833} {"train_loss": -10.624542236328125, "global_step": 140010, "epoch": 833} {"train_loss": -10.363826751708984, "global_step": 140011, "epoch": 833} {"train_loss": -11.135370254516602, "global_step": 140012, "epoch": 833} {"train_loss": -10.70718765258789, "global_step": 140013, "epoch": 833} {"train_loss": -10.506707191467285, "global_step": 140014, "epoch": 833} {"train_loss": -10.871843338012695, "global_step": 140015, "epoch": 833} {"train_loss": -10.772096633911133, "global_step": 140016, "epoch": 833} {"train_loss": -10.502433776855469, "global_step": 140017, "epoch": 833} {"train_loss": -10.648992538452148, "global_step": 140018, "epoch": 833} {"train_loss": -10.759957313537598, "global_step": 140019, "epoch": 833} {"train_loss": -10.778489112854004, "global_step": 140020, "epoch": 833} {"train_loss": -10.672355651855469, "global_step": 140021, "epoch": 833} {"train_loss": -10.83882999420166, "global_step": 140022, "epoch": 833} {"train_loss": -10.628997802734375, "global_step": 140023, "epoch": 833} {"train_loss": -10.579626083374023, "global_step": 140024, "epoch": 833} {"train_loss": -10.902664184570312, "global_step": 140025, "epoch": 833} {"train_loss": -10.460634231567383, "global_step": 140026, "epoch": 833} {"train_loss": -10.748773574829102, "global_step": 140027, "epoch": 833} {"train_loss": -10.425695419311523, "global_step": 140028, "epoch": 833} {"train_loss": -10.588388442993164, "global_step": 140029, "epoch": 833} {"train_loss": -10.50060749053955, "global_step": 140030, "epoch": 833} {"train_loss": -10.495086669921875, "global_step": 140031, "epoch": 833} {"train_loss": -10.368476867675781, "global_step": 140032, "epoch": 833} {"train_loss": -10.554922103881836, "global_step": 140033, "epoch": 833} {"train_loss": -10.287275314331055, "global_step": 140034, "epoch": 833} {"train_loss": -10.739202499389648, "global_step": 140035, "epoch": 833} {"train_loss": -10.465140342712402, "global_step": 140036, "epoch": 833} {"train_loss": -10.534660339355469, "global_step": 140037, "epoch": 833} {"train_loss": -10.930044174194336, "global_step": 140038, "epoch": 833} {"train_loss": -10.140042304992676, "global_step": 140039, "epoch": 833} {"train_loss": -9.932656288146973, "global_step": 140040, "epoch": 833} {"train_loss": -9.390739440917969, "global_step": 140041, "epoch": 833} {"train_loss": -9.706437110900879, "global_step": 140042, "epoch": 833} {"train_loss": -9.835562705993652, "global_step": 140043, "epoch": 833} {"train_loss": -9.733467102050781, "global_step": 140044, "epoch": 833} {"train_loss": -10.522038459777832, "global_step": 140045, "epoch": 833} {"train_loss": -9.819655418395996, "global_step": 140046, "epoch": 833} {"train_loss": -10.071918487548828, "global_step": 140047, "epoch": 833} {"train_loss": -10.589763641357422, "global_step": 140048, "epoch": 833} {"train_loss": -10.05173110961914, "global_step": 140049, "epoch": 833} {"train_loss": -10.068126678466797, "global_step": 140050, "epoch": 833} {"train_loss": -10.278749465942383, "global_step": 140051, "epoch": 833} {"train_loss": -10.177709579467773, "global_step": 140052, "epoch": 833} {"train_loss": -10.211769104003906, "global_step": 140053, "epoch": 833} {"train_loss": -10.111248970031738, "global_step": 140054, "epoch": 833} {"train_loss": -10.101850509643555, "global_step": 140055, "epoch": 833} {"train_loss": -10.343271255493164, "global_step": 140056, "epoch": 833} {"train_loss": -10.055473327636719, "global_step": 140057, "epoch": 833} {"train_loss": -10.040146827697754, "global_step": 140058, "epoch": 833} {"train_loss": -9.968942642211914, "global_step": 140059, "epoch": 833} {"train_loss": -10.249208450317383, "global_step": 140060, "epoch": 833} {"train_loss": -10.532669067382812, "global_step": 140061, "epoch": 833} {"train_loss": -10.079957008361816, "global_step": 140062, "epoch": 833} {"train_loss": -10.671099662780762, "global_step": 140063, "epoch": 833} {"train_loss": -9.909704208374023, "global_step": 140064, "epoch": 833} {"train_loss": -10.441932678222656, "global_step": 140065, "epoch": 833} {"train_loss": -10.35755443572998, "global_step": 140066, "epoch": 833} {"train_loss": -10.2500638961792, "global_step": 140067, "epoch": 833} {"train_loss": -10.267053604125977, "global_step": 140068, "epoch": 833} {"train_loss": -10.36020278930664, "global_step": 140069, "epoch": 833} {"train_loss": -10.181665420532227, "global_step": 140070, "epoch": 833} {"train_loss": -10.373050689697266, "global_step": 140071, "epoch": 833} {"train_loss": -10.251472473144531, "global_step": 140072, "epoch": 833} {"train_loss": -9.62732982635498, "global_step": 140073, "epoch": 833} {"train_loss": -9.930551528930664, "global_step": 140074, "epoch": 833} {"train_loss": -9.126531600952148, "global_step": 140075, "epoch": 833} {"train_loss": -10.386792182922363, "global_step": 140076, "epoch": 833} {"train_loss": -9.572930335998535, "global_step": 140077, "epoch": 833} {"train_loss": -10.300325393676758, "global_step": 140078, "epoch": 833} {"train_loss": -10.094560623168945, "global_step": 140079, "epoch": 833} {"train_loss": -10.388242721557617, "global_step": 140080, "epoch": 833} {"train_loss": -9.999189376831055, "global_step": 140081, "epoch": 833} {"train_loss": -10.620271682739258, "global_step": 140082, "epoch": 833} {"train_loss": -9.931000709533691, "global_step": 140083, "epoch": 833} {"train_loss": -10.342487335205078, "global_step": 140084, "epoch": 833} {"train_loss": -9.878273010253906, "global_step": 140085, "epoch": 833} {"train_loss": -10.348355293273926, "global_step": 140086, "epoch": 833} {"train_loss": -10.177006721496582, "global_step": 140087, "epoch": 833} {"train_loss": -10.477204322814941, "global_step": 140088, "epoch": 833} {"train_loss": -10.367424011230469, "global_step": 140089, "epoch": 833} {"train_loss": -9.957778930664062, "global_step": 140090, "epoch": 833} {"train_loss": -10.459430694580078, "global_step": 140091, "epoch": 833} {"train_loss": -10.226829528808594, "global_step": 140092, "epoch": 833} {"train_loss": -10.707391738891602, "global_step": 140093, "epoch": 833} {"train_loss": -10.507080078125, "global_step": 140094, "epoch": 833} {"train_loss": -10.534025192260742, "global_step": 140095, "epoch": 833} {"train_loss": -10.485024452209473, "global_step": 140096, "epoch": 833} {"train_loss": -10.670350074768066, "global_step": 140097, "epoch": 833} {"train_loss": -10.594470977783203, "global_step": 140098, "epoch": 833} {"train_loss": -10.494958877563477, "global_step": 140099, "epoch": 833} {"train_loss": -10.704093933105469, "global_step": 140100, "epoch": 833} {"train_loss": -10.417470932006836, "global_step": 140101, "epoch": 833} {"train_loss": -10.590076446533203, "global_step": 140102, "epoch": 833} {"train_loss": -10.727714538574219, "global_step": 140103, "epoch": 833} {"train_loss": -10.692963600158691, "global_step": 140104, "epoch": 833} {"train_loss": -10.702713012695312, "global_step": 140105, "epoch": 833} {"train_loss": -10.674134254455566, "global_step": 140106, "epoch": 833} {"train_loss": -10.599584579467773, "global_step": 140107, "epoch": 833} {"train_loss": -10.60781478881836, "global_step": 140108, "epoch": 833} {"train_loss": -10.661325454711914, "global_step": 140109, "epoch": 833} {"train_loss": -10.4827299118042, "global_step": 140110, "epoch": 833} {"train_loss": -10.403836925824484, "global_step": 140111, "epoch": 833, "val_loss": 226688.5625} {"train_loss": -10.973546028137207, "global_step": 140112, "epoch": 834} {"train_loss": -10.888599395751953, "global_step": 140113, "epoch": 834} {"train_loss": -10.955888748168945, "global_step": 140114, "epoch": 834} {"train_loss": -10.459796905517578, "global_step": 140115, "epoch": 834} {"train_loss": -10.5430908203125, "global_step": 140116, "epoch": 834} {"train_loss": -10.495071411132812, "global_step": 140117, "epoch": 834} {"train_loss": -10.768033027648926, "global_step": 140118, "epoch": 834} {"train_loss": -10.460611343383789, "global_step": 140119, "epoch": 834} {"train_loss": -10.645269393920898, "global_step": 140120, "epoch": 834} {"train_loss": -10.55578327178955, "global_step": 140121, "epoch": 834} {"train_loss": -10.731461524963379, "global_step": 140122, "epoch": 834} {"train_loss": -10.513130187988281, "global_step": 140123, "epoch": 834} {"train_loss": -10.49868392944336, "global_step": 140124, "epoch": 834} {"train_loss": -10.737226486206055, "global_step": 140125, "epoch": 834} {"train_loss": -10.939241409301758, "global_step": 140126, "epoch": 834} {"train_loss": -10.726445198059082, "global_step": 140127, "epoch": 834} {"train_loss": -10.248231887817383, "global_step": 140128, "epoch": 834} {"train_loss": -10.441787719726562, "global_step": 140129, "epoch": 834} {"train_loss": -10.563793182373047, "global_step": 140130, "epoch": 834} {"train_loss": -10.04025936126709, "global_step": 140131, "epoch": 834} {"train_loss": -10.74695873260498, "global_step": 140132, "epoch": 834} {"train_loss": -10.221253395080566, "global_step": 140133, "epoch": 834} {"train_loss": -10.243461608886719, "global_step": 140134, "epoch": 834} {"train_loss": -9.931591033935547, "global_step": 140135, "epoch": 834} {"train_loss": -9.635448455810547, "global_step": 140136, "epoch": 834} {"train_loss": -9.505888938903809, "global_step": 140137, "epoch": 834} {"train_loss": -9.916752815246582, "global_step": 140138, "epoch": 834} {"train_loss": -9.643319129943848, "global_step": 140139, "epoch": 834} {"train_loss": -10.382426261901855, "global_step": 140140, "epoch": 834} {"train_loss": -9.87780475616455, "global_step": 140141, "epoch": 834} {"train_loss": -10.68881607055664, "global_step": 140142, "epoch": 834} {"train_loss": -10.154977798461914, "global_step": 140143, "epoch": 834} {"train_loss": -10.224066734313965, "global_step": 140144, "epoch": 834} {"train_loss": -10.090011596679688, "global_step": 140145, "epoch": 834} {"train_loss": -10.301591873168945, "global_step": 140146, "epoch": 834} {"train_loss": -9.862802505493164, "global_step": 140147, "epoch": 834} {"train_loss": -10.443658828735352, "global_step": 140148, "epoch": 834} {"train_loss": -9.69742202758789, "global_step": 140149, "epoch": 834} {"train_loss": -10.368278503417969, "global_step": 140150, "epoch": 834} {"train_loss": -9.905783653259277, "global_step": 140151, "epoch": 834} {"train_loss": -9.908971786499023, "global_step": 140152, "epoch": 834} {"train_loss": -9.813194274902344, "global_step": 140153, "epoch": 834} {"train_loss": -10.090306282043457, "global_step": 140154, "epoch": 834} {"train_loss": -10.410897254943848, "global_step": 140155, "epoch": 834} {"train_loss": -10.625454902648926, "global_step": 140156, "epoch": 834} {"train_loss": -9.901912689208984, "global_step": 140157, "epoch": 834} {"train_loss": -10.507911682128906, "global_step": 140158, "epoch": 834} {"train_loss": -10.429376602172852, "global_step": 140159, "epoch": 834} {"train_loss": -10.28691291809082, "global_step": 140160, "epoch": 834} {"train_loss": -10.582752227783203, "global_step": 140161, "epoch": 834} {"train_loss": -10.418527603149414, "global_step": 140162, "epoch": 834} {"train_loss": -10.462398529052734, "global_step": 140163, "epoch": 834} {"train_loss": -10.397868156433105, "global_step": 140164, "epoch": 834} {"train_loss": -10.489128112792969, "global_step": 140165, "epoch": 834} {"train_loss": -10.430501937866211, "global_step": 140166, "epoch": 834} {"train_loss": -10.509764671325684, "global_step": 140167, "epoch": 834} {"train_loss": -10.197144508361816, "global_step": 140168, "epoch": 834} {"train_loss": -10.400485038757324, "global_step": 140169, "epoch": 834} {"train_loss": -10.761768341064453, "global_step": 140170, "epoch": 834} {"train_loss": -10.568400382995605, "global_step": 140171, "epoch": 834} {"train_loss": -10.820281982421875, "global_step": 140172, "epoch": 834} {"train_loss": -10.616724967956543, "global_step": 140173, "epoch": 834} {"train_loss": -10.540513038635254, "global_step": 140174, "epoch": 834} {"train_loss": -10.385343551635742, "global_step": 140175, "epoch": 834} {"train_loss": -10.51862621307373, "global_step": 140176, "epoch": 834} {"train_loss": -10.700322151184082, "global_step": 140177, "epoch": 834} {"train_loss": -10.578170776367188, "global_step": 140178, "epoch": 834} {"train_loss": -10.774271011352539, "global_step": 140179, "epoch": 834} {"train_loss": -10.606842041015625, "global_step": 140180, "epoch": 834} {"train_loss": -10.579891204833984, "global_step": 140181, "epoch": 834} {"train_loss": -10.669364929199219, "global_step": 140182, "epoch": 834} {"train_loss": -10.646190643310547, "global_step": 140183, "epoch": 834} {"train_loss": -10.75110912322998, "global_step": 140184, "epoch": 834} {"train_loss": -10.736513137817383, "global_step": 140185, "epoch": 834} {"train_loss": -10.911914825439453, "global_step": 140186, "epoch": 834} {"train_loss": -10.778722763061523, "global_step": 140187, "epoch": 834} {"train_loss": -10.60107135772705, "global_step": 140188, "epoch": 834} {"train_loss": -10.744392395019531, "global_step": 140189, "epoch": 834} {"train_loss": -10.848326683044434, "global_step": 140190, "epoch": 834} {"train_loss": -10.77108383178711, "global_step": 140191, "epoch": 834} {"train_loss": -10.679763793945312, "global_step": 140192, "epoch": 834} {"train_loss": -10.70727825164795, "global_step": 140193, "epoch": 834} {"train_loss": -10.782602310180664, "global_step": 140194, "epoch": 834} {"train_loss": -10.976314544677734, "global_step": 140195, "epoch": 834} {"train_loss": -10.44264030456543, "global_step": 140196, "epoch": 834} {"train_loss": -10.772523880004883, "global_step": 140197, "epoch": 834} {"train_loss": -10.735126495361328, "global_step": 140198, "epoch": 834} {"train_loss": -10.908041000366211, "global_step": 140199, "epoch": 834} {"train_loss": -10.886305809020996, "global_step": 140200, "epoch": 834} {"train_loss": -10.79044246673584, "global_step": 140201, "epoch": 834} {"train_loss": -10.69433879852295, "global_step": 140202, "epoch": 834} {"train_loss": -10.8849458694458, "global_step": 140203, "epoch": 834} {"train_loss": -10.618709564208984, "global_step": 140204, "epoch": 834} {"train_loss": -10.691112518310547, "global_step": 140205, "epoch": 834} {"train_loss": -10.809040069580078, "global_step": 140206, "epoch": 834} {"train_loss": -10.775208473205566, "global_step": 140207, "epoch": 834} {"train_loss": -10.934743881225586, "global_step": 140208, "epoch": 834} {"train_loss": -10.930448532104492, "global_step": 140209, "epoch": 834} {"train_loss": -10.982528686523438, "global_step": 140210, "epoch": 834} {"train_loss": -10.690261840820312, "global_step": 140211, "epoch": 834} {"train_loss": -10.797439575195312, "global_step": 140212, "epoch": 834} {"train_loss": -10.854646682739258, "global_step": 140213, "epoch": 834} {"train_loss": -10.704133987426758, "global_step": 140214, "epoch": 834} {"train_loss": -10.611612319946289, "global_step": 140215, "epoch": 834} {"train_loss": -10.748754501342773, "global_step": 140216, "epoch": 834} {"train_loss": -10.802438735961914, "global_step": 140217, "epoch": 834} {"train_loss": -10.78713321685791, "global_step": 140218, "epoch": 834} {"train_loss": -10.398147583007812, "global_step": 140219, "epoch": 834} {"train_loss": -9.809067726135254, "global_step": 140220, "epoch": 834} {"train_loss": -10.156338691711426, "global_step": 140221, "epoch": 834} {"train_loss": -10.625606536865234, "global_step": 140222, "epoch": 834} {"train_loss": -10.418188095092773, "global_step": 140223, "epoch": 834} {"train_loss": -10.316600799560547, "global_step": 140224, "epoch": 834} {"train_loss": -10.539983749389648, "global_step": 140225, "epoch": 834} {"train_loss": -10.490574836730957, "global_step": 140226, "epoch": 834} {"train_loss": -10.52310848236084, "global_step": 140227, "epoch": 834} {"train_loss": -10.746273040771484, "global_step": 140228, "epoch": 834} {"train_loss": -10.21999740600586, "global_step": 140229, "epoch": 834} {"train_loss": -10.455772399902344, "global_step": 140230, "epoch": 834} {"train_loss": -10.42319393157959, "global_step": 140231, "epoch": 834} {"train_loss": -10.085336685180664, "global_step": 140232, "epoch": 834} {"train_loss": -10.225624084472656, "global_step": 140233, "epoch": 834} {"train_loss": -10.215746879577637, "global_step": 140234, "epoch": 834} {"train_loss": -10.426299095153809, "global_step": 140235, "epoch": 834} {"train_loss": -10.226163864135742, "global_step": 140236, "epoch": 834} {"train_loss": -10.233962059020996, "global_step": 140237, "epoch": 834} {"train_loss": -10.036161422729492, "global_step": 140238, "epoch": 834} {"train_loss": -8.769775390625, "global_step": 140239, "epoch": 834} {"train_loss": -9.516891479492188, "global_step": 140240, "epoch": 834} {"train_loss": -9.113912582397461, "global_step": 140241, "epoch": 834} {"train_loss": -10.450643539428711, "global_step": 140242, "epoch": 834} {"train_loss": -9.20740795135498, "global_step": 140243, "epoch": 834} {"train_loss": -9.513612747192383, "global_step": 140244, "epoch": 834} {"train_loss": -10.146328926086426, "global_step": 140245, "epoch": 834} {"train_loss": -9.913009643554688, "global_step": 140246, "epoch": 834} {"train_loss": -10.241113662719727, "global_step": 140247, "epoch": 834} {"train_loss": -9.933876037597656, "global_step": 140248, "epoch": 834} {"train_loss": -10.180830001831055, "global_step": 140249, "epoch": 834} {"train_loss": -9.499619483947754, "global_step": 140250, "epoch": 834} {"train_loss": -10.324167251586914, "global_step": 140251, "epoch": 834} {"train_loss": -9.99464225769043, "global_step": 140252, "epoch": 834} {"train_loss": -10.044326782226562, "global_step": 140253, "epoch": 834} {"train_loss": -10.526172637939453, "global_step": 140254, "epoch": 834} {"train_loss": -9.70230770111084, "global_step": 140255, "epoch": 834} {"train_loss": -10.39653205871582, "global_step": 140256, "epoch": 834} {"train_loss": -10.401936531066895, "global_step": 140257, "epoch": 834} {"train_loss": -10.006511688232422, "global_step": 140258, "epoch": 834} {"train_loss": -10.520901679992676, "global_step": 140259, "epoch": 834} {"train_loss": -10.485359191894531, "global_step": 140260, "epoch": 834} {"train_loss": -10.360029220581055, "global_step": 140261, "epoch": 834} {"train_loss": -10.290445327758789, "global_step": 140262, "epoch": 834} {"train_loss": -10.463233947753906, "global_step": 140263, "epoch": 834} {"train_loss": -10.379000663757324, "global_step": 140264, "epoch": 834} {"train_loss": -10.495893478393555, "global_step": 140265, "epoch": 834} {"train_loss": -10.41842269897461, "global_step": 140266, "epoch": 834} {"train_loss": -10.288662910461426, "global_step": 140267, "epoch": 834} {"train_loss": -10.659440040588379, "global_step": 140268, "epoch": 834} {"train_loss": -10.54658317565918, "global_step": 140269, "epoch": 834} {"train_loss": -10.617465019226074, "global_step": 140270, "epoch": 834} {"train_loss": -10.228470802307129, "global_step": 140271, "epoch": 834} {"train_loss": -10.488951683044434, "global_step": 140272, "epoch": 834} {"train_loss": -10.698810577392578, "global_step": 140273, "epoch": 834} {"train_loss": -10.561254501342773, "global_step": 140274, "epoch": 834} {"train_loss": -10.413196563720703, "global_step": 140275, "epoch": 834} {"train_loss": -10.646034240722656, "global_step": 140276, "epoch": 834} {"train_loss": -10.731269836425781, "global_step": 140277, "epoch": 834} {"train_loss": -10.536443710327148, "global_step": 140278, "epoch": 834} {"train_loss": -10.421028250739688, "global_step": 140279, "epoch": 834, "val_loss": 224833.9375} {"train_loss": -10.697221755981445, "global_step": 140280, "epoch": 835} {"train_loss": -10.810018539428711, "global_step": 140281, "epoch": 835} {"train_loss": -10.892723083496094, "global_step": 140282, "epoch": 835} {"train_loss": -10.839851379394531, "global_step": 140283, "epoch": 835} {"train_loss": -10.838427543640137, "global_step": 140284, "epoch": 835} {"train_loss": -10.767913818359375, "global_step": 140285, "epoch": 835} {"train_loss": -10.607587814331055, "global_step": 140286, "epoch": 835} {"train_loss": -10.756118774414062, "global_step": 140287, "epoch": 835} {"train_loss": -10.880830764770508, "global_step": 140288, "epoch": 835} {"train_loss": -11.065792083740234, "global_step": 140289, "epoch": 835} {"train_loss": -10.842130661010742, "global_step": 140290, "epoch": 835} {"train_loss": -10.778863906860352, "global_step": 140291, "epoch": 835} {"train_loss": -10.663000106811523, "global_step": 140292, "epoch": 835} {"train_loss": -10.616796493530273, "global_step": 140293, "epoch": 835} {"train_loss": -10.632588386535645, "global_step": 140294, "epoch": 835} {"train_loss": -10.970124244689941, "global_step": 140295, "epoch": 835} {"train_loss": -10.867868423461914, "global_step": 140296, "epoch": 835} {"train_loss": -10.975576400756836, "global_step": 140297, "epoch": 835} {"train_loss": -10.918447494506836, "global_step": 140298, "epoch": 835} {"train_loss": -11.144575119018555, "global_step": 140299, "epoch": 835} {"train_loss": -10.956398963928223, "global_step": 140300, "epoch": 835} {"train_loss": -10.93327522277832, "global_step": 140301, "epoch": 835} {"train_loss": -10.564738273620605, "global_step": 140302, "epoch": 835} {"train_loss": -10.379006385803223, "global_step": 140303, "epoch": 835} {"train_loss": -10.502376556396484, "global_step": 140304, "epoch": 835} {"train_loss": -11.03404426574707, "global_step": 140305, "epoch": 835} {"train_loss": -10.15101432800293, "global_step": 140306, "epoch": 835} {"train_loss": -8.54456615447998, "global_step": 140307, "epoch": 835} {"train_loss": -9.63613510131836, "global_step": 140308, "epoch": 835} {"train_loss": -10.402442932128906, "global_step": 140309, "epoch": 835} {"train_loss": -9.923973083496094, "global_step": 140310, "epoch": 835} {"train_loss": -9.394189834594727, "global_step": 140311, "epoch": 835} {"train_loss": -8.418571472167969, "global_step": 140312, "epoch": 835} {"train_loss": -10.181924819946289, "global_step": 140313, "epoch": 835} {"train_loss": -9.023908615112305, "global_step": 140314, "epoch": 835} {"train_loss": -9.100837707519531, "global_step": 140315, "epoch": 835} {"train_loss": -9.938169479370117, "global_step": 140316, "epoch": 835} {"train_loss": -8.236360549926758, "global_step": 140317, "epoch": 835} {"train_loss": -9.585488319396973, "global_step": 140318, "epoch": 835} {"train_loss": -9.168161392211914, "global_step": 140319, "epoch": 835} {"train_loss": -9.408540725708008, "global_step": 140320, "epoch": 835} {"train_loss": -9.282696723937988, "global_step": 140321, "epoch": 835} {"train_loss": -9.724315643310547, "global_step": 140322, "epoch": 835} {"train_loss": -9.646918296813965, "global_step": 140323, "epoch": 835} {"train_loss": -9.902796745300293, "global_step": 140324, "epoch": 835} {"train_loss": -9.898509979248047, "global_step": 140325, "epoch": 835} {"train_loss": -9.250795364379883, "global_step": 140326, "epoch": 835} {"train_loss": -9.978689193725586, "global_step": 140327, "epoch": 835} {"train_loss": -10.305366516113281, "global_step": 140328, "epoch": 835} {"train_loss": -9.871031761169434, "global_step": 140329, "epoch": 835} {"train_loss": -10.093274116516113, "global_step": 140330, "epoch": 835} {"train_loss": -10.05689811706543, "global_step": 140331, "epoch": 835} {"train_loss": -9.888321876525879, "global_step": 140332, "epoch": 835} {"train_loss": -10.16464614868164, "global_step": 140333, "epoch": 835} {"train_loss": -10.255996704101562, "global_step": 140334, "epoch": 835} {"train_loss": -10.107487678527832, "global_step": 140335, "epoch": 835} {"train_loss": -10.013324737548828, "global_step": 140336, "epoch": 835} {"train_loss": -10.100231170654297, "global_step": 140337, "epoch": 835} {"train_loss": -10.042734146118164, "global_step": 140338, "epoch": 835} {"train_loss": -10.217028617858887, "global_step": 140339, "epoch": 835} {"train_loss": -10.251606941223145, "global_step": 140340, "epoch": 835} {"train_loss": -10.254636764526367, "global_step": 140341, "epoch": 835} {"train_loss": -10.235671997070312, "global_step": 140342, "epoch": 835} {"train_loss": -10.470193862915039, "global_step": 140343, "epoch": 835} {"train_loss": -10.372214317321777, "global_step": 140344, "epoch": 835} {"train_loss": -10.25935173034668, "global_step": 140345, "epoch": 835} {"train_loss": -10.388071060180664, "global_step": 140346, "epoch": 835} {"train_loss": -10.419105529785156, "global_step": 140347, "epoch": 835} {"train_loss": -10.49770736694336, "global_step": 140348, "epoch": 835} {"train_loss": -10.455388069152832, "global_step": 140349, "epoch": 835} {"train_loss": -10.431108474731445, "global_step": 140350, "epoch": 835} {"train_loss": -10.285568237304688, "global_step": 140351, "epoch": 835} {"train_loss": -10.3779296875, "global_step": 140352, "epoch": 835} {"train_loss": -10.421869277954102, "global_step": 140353, "epoch": 835} {"train_loss": -10.505843162536621, "global_step": 140354, "epoch": 835} {"train_loss": -10.651754379272461, "global_step": 140355, "epoch": 835} {"train_loss": -10.382867813110352, "global_step": 140356, "epoch": 835} {"train_loss": -10.417219161987305, "global_step": 140357, "epoch": 835} {"train_loss": -10.722643852233887, "global_step": 140358, "epoch": 835} {"train_loss": -10.804426193237305, "global_step": 140359, "epoch": 835} {"train_loss": -10.759178161621094, "global_step": 140360, "epoch": 835} {"train_loss": -10.709074020385742, "global_step": 140361, "epoch": 835} {"train_loss": -10.701845169067383, "global_step": 140362, "epoch": 835} {"train_loss": -10.780744552612305, "global_step": 140363, "epoch": 835} {"train_loss": -10.789728164672852, "global_step": 140364, "epoch": 835} {"train_loss": -10.763050079345703, "global_step": 140365, "epoch": 835} {"train_loss": -10.77847671508789, "global_step": 140366, "epoch": 835} {"train_loss": -10.753789901733398, "global_step": 140367, "epoch": 835} {"train_loss": -10.714780807495117, "global_step": 140368, "epoch": 835} {"train_loss": -10.712453842163086, "global_step": 140369, "epoch": 835} {"train_loss": -10.79098892211914, "global_step": 140370, "epoch": 835} {"train_loss": -10.383070945739746, "global_step": 140371, "epoch": 835} {"train_loss": -10.916156768798828, "global_step": 140372, "epoch": 835} {"train_loss": -10.769294738769531, "global_step": 140373, "epoch": 835} {"train_loss": -10.755496978759766, "global_step": 140374, "epoch": 835} {"train_loss": -10.915046691894531, "global_step": 140375, "epoch": 835} {"train_loss": -10.765862464904785, "global_step": 140376, "epoch": 835} {"train_loss": -10.908634185791016, "global_step": 140377, "epoch": 835} {"train_loss": -10.434913635253906, "global_step": 140378, "epoch": 835} {"train_loss": -10.469400405883789, "global_step": 140379, "epoch": 835} {"train_loss": -10.60010814666748, "global_step": 140380, "epoch": 835} {"train_loss": -10.689229965209961, "global_step": 140381, "epoch": 835} {"train_loss": -10.845231056213379, "global_step": 140382, "epoch": 835} {"train_loss": -10.687602043151855, "global_step": 140383, "epoch": 835} {"train_loss": -10.658401489257812, "global_step": 140384, "epoch": 835} {"train_loss": -10.515946388244629, "global_step": 140385, "epoch": 835} {"train_loss": -10.97326374053955, "global_step": 140386, "epoch": 835} {"train_loss": -10.405966758728027, "global_step": 140387, "epoch": 835} {"train_loss": -10.88119888305664, "global_step": 140388, "epoch": 835} {"train_loss": -10.411623001098633, "global_step": 140389, "epoch": 835} {"train_loss": -10.657434463500977, "global_step": 140390, "epoch": 835} {"train_loss": -10.716419219970703, "global_step": 140391, "epoch": 835} {"train_loss": -10.696609497070312, "global_step": 140392, "epoch": 835} {"train_loss": -10.683540344238281, "global_step": 140393, "epoch": 835} {"train_loss": -10.507402420043945, "global_step": 140394, "epoch": 835} {"train_loss": -10.718664169311523, "global_step": 140395, "epoch": 835} {"train_loss": -10.467378616333008, "global_step": 140396, "epoch": 835} {"train_loss": -10.124876976013184, "global_step": 140397, "epoch": 835} {"train_loss": -10.909161567687988, "global_step": 140398, "epoch": 835} {"train_loss": -10.068419456481934, "global_step": 140399, "epoch": 835} {"train_loss": -10.132064819335938, "global_step": 140400, "epoch": 835} {"train_loss": -9.91142463684082, "global_step": 140401, "epoch": 835} {"train_loss": -10.893391609191895, "global_step": 140402, "epoch": 835} {"train_loss": -10.329696655273438, "global_step": 140403, "epoch": 835} {"train_loss": -10.313365936279297, "global_step": 140404, "epoch": 835} {"train_loss": -10.51838493347168, "global_step": 140405, "epoch": 835} {"train_loss": -10.096885681152344, "global_step": 140406, "epoch": 835} {"train_loss": -10.662947654724121, "global_step": 140407, "epoch": 835} {"train_loss": -10.61478328704834, "global_step": 140408, "epoch": 835} {"train_loss": -10.426321029663086, "global_step": 140409, "epoch": 835} {"train_loss": -10.470361709594727, "global_step": 140410, "epoch": 835} {"train_loss": -10.426936149597168, "global_step": 140411, "epoch": 835} {"train_loss": -10.573654174804688, "global_step": 140412, "epoch": 835} {"train_loss": -10.149314880371094, "global_step": 140413, "epoch": 835} {"train_loss": -10.343811988830566, "global_step": 140414, "epoch": 835} {"train_loss": -10.773994445800781, "global_step": 140415, "epoch": 835} {"train_loss": -10.485601425170898, "global_step": 140416, "epoch": 835} {"train_loss": -10.789302825927734, "global_step": 140417, "epoch": 835} {"train_loss": -10.653993606567383, "global_step": 140418, "epoch": 835} {"train_loss": -10.461137771606445, "global_step": 140419, "epoch": 835} {"train_loss": -10.365375518798828, "global_step": 140420, "epoch": 835} {"train_loss": -10.55877685546875, "global_step": 140421, "epoch": 835} {"train_loss": -10.561391830444336, "global_step": 140422, "epoch": 835} {"train_loss": -10.086347579956055, "global_step": 140423, "epoch": 835} {"train_loss": -10.283227920532227, "global_step": 140424, "epoch": 835} {"train_loss": -10.608525276184082, "global_step": 140425, "epoch": 835} {"train_loss": -10.39013671875, "global_step": 140426, "epoch": 835} {"train_loss": -10.288041114807129, "global_step": 140427, "epoch": 835} {"train_loss": -10.357120513916016, "global_step": 140428, "epoch": 835} {"train_loss": -10.261013984680176, "global_step": 140429, "epoch": 835} {"train_loss": -9.868181228637695, "global_step": 140430, "epoch": 835} {"train_loss": -10.70752239227295, "global_step": 140431, "epoch": 835} {"train_loss": -9.713037490844727, "global_step": 140432, "epoch": 835} {"train_loss": -10.386098861694336, "global_step": 140433, "epoch": 835} {"train_loss": -10.171850204467773, "global_step": 140434, "epoch": 835} {"train_loss": -10.320646286010742, "global_step": 140435, "epoch": 835} {"train_loss": -10.133499145507812, "global_step": 140436, "epoch": 835} {"train_loss": -10.537269592285156, "global_step": 140437, "epoch": 835} {"train_loss": -10.200472831726074, "global_step": 140438, "epoch": 835} {"train_loss": -10.531269073486328, "global_step": 140439, "epoch": 835} {"train_loss": -10.153495788574219, "global_step": 140440, "epoch": 835} {"train_loss": -10.582756996154785, "global_step": 140441, "epoch": 835} {"train_loss": -10.524709701538086, "global_step": 140442, "epoch": 835} {"train_loss": -10.346707344055176, "global_step": 140443, "epoch": 835} {"train_loss": -10.58602523803711, "global_step": 140444, "epoch": 835} {"train_loss": -10.439230918884277, "global_step": 140445, "epoch": 835} {"train_loss": -10.582317352294922, "global_step": 140446, "epoch": 835} {"train_loss": -10.390546225366139, "global_step": 140447, "epoch": 835, "val_loss": 224439.0, "train_action_mse_error": 5.9077911376953125} {"train_loss": -10.593302726745605, "global_step": 140448, "epoch": 836} {"train_loss": -10.477930068969727, "global_step": 140449, "epoch": 836} {"train_loss": -10.293569564819336, "global_step": 140450, "epoch": 836} {"train_loss": -10.318882942199707, "global_step": 140451, "epoch": 836} {"train_loss": -10.29892349243164, "global_step": 140452, "epoch": 836} {"train_loss": -10.261018753051758, "global_step": 140453, "epoch": 836} {"train_loss": -10.681167602539062, "global_step": 140454, "epoch": 836} {"train_loss": -10.222827911376953, "global_step": 140455, "epoch": 836} {"train_loss": -10.50782585144043, "global_step": 140456, "epoch": 836} {"train_loss": -10.356733322143555, "global_step": 140457, "epoch": 836} {"train_loss": -10.403894424438477, "global_step": 140458, "epoch": 836} {"train_loss": -10.797551155090332, "global_step": 140459, "epoch": 836} {"train_loss": -10.50186538696289, "global_step": 140460, "epoch": 836} {"train_loss": -10.512258529663086, "global_step": 140461, "epoch": 836} {"train_loss": -10.758279800415039, "global_step": 140462, "epoch": 836} {"train_loss": -10.560640335083008, "global_step": 140463, "epoch": 836} {"train_loss": -10.629240989685059, "global_step": 140464, "epoch": 836} {"train_loss": -10.410855293273926, "global_step": 140465, "epoch": 836} {"train_loss": -10.596738815307617, "global_step": 140466, "epoch": 836} {"train_loss": -10.30630874633789, "global_step": 140467, "epoch": 836} {"train_loss": -10.550954818725586, "global_step": 140468, "epoch": 836} {"train_loss": -10.345088005065918, "global_step": 140469, "epoch": 836} {"train_loss": -10.497221946716309, "global_step": 140470, "epoch": 836} {"train_loss": -10.571626663208008, "global_step": 140471, "epoch": 836} {"train_loss": -10.403265953063965, "global_step": 140472, "epoch": 836} {"train_loss": -10.396987915039062, "global_step": 140473, "epoch": 836} {"train_loss": -10.732295989990234, "global_step": 140474, "epoch": 836} {"train_loss": -10.503225326538086, "global_step": 140475, "epoch": 836} {"train_loss": -10.295135498046875, "global_step": 140476, "epoch": 836} {"train_loss": -10.393970489501953, "global_step": 140477, "epoch": 836} {"train_loss": -10.589118957519531, "global_step": 140478, "epoch": 836} {"train_loss": -10.511327743530273, "global_step": 140479, "epoch": 836} {"train_loss": -10.606666564941406, "global_step": 140480, "epoch": 836} {"train_loss": -10.439311027526855, "global_step": 140481, "epoch": 836} {"train_loss": -10.602136611938477, "global_step": 140482, "epoch": 836} {"train_loss": -9.981367111206055, "global_step": 140483, "epoch": 836} {"train_loss": -10.427846908569336, "global_step": 140484, "epoch": 836} {"train_loss": -10.490646362304688, "global_step": 140485, "epoch": 836} {"train_loss": -10.290143013000488, "global_step": 140486, "epoch": 836} {"train_loss": -10.554092407226562, "global_step": 140487, "epoch": 836} {"train_loss": -10.620962142944336, "global_step": 140488, "epoch": 836} {"train_loss": -10.54063606262207, "global_step": 140489, "epoch": 836} {"train_loss": -10.559925079345703, "global_step": 140490, "epoch": 836} {"train_loss": -10.594149589538574, "global_step": 140491, "epoch": 836} {"train_loss": -10.420528411865234, "global_step": 140492, "epoch": 836} {"train_loss": -10.790695190429688, "global_step": 140493, "epoch": 836} {"train_loss": -10.581674575805664, "global_step": 140494, "epoch": 836} {"train_loss": -10.47774887084961, "global_step": 140495, "epoch": 836} {"train_loss": -10.610572814941406, "global_step": 140496, "epoch": 836} {"train_loss": -10.381328582763672, "global_step": 140497, "epoch": 836} {"train_loss": -10.314300537109375, "global_step": 140498, "epoch": 836} {"train_loss": -10.576553344726562, "global_step": 140499, "epoch": 836} {"train_loss": -10.510414123535156, "global_step": 140500, "epoch": 836} {"train_loss": -10.474031448364258, "global_step": 140501, "epoch": 836} {"train_loss": -10.09604549407959, "global_step": 140502, "epoch": 836} {"train_loss": -10.550973892211914, "global_step": 140503, "epoch": 836} {"train_loss": -9.787636756896973, "global_step": 140504, "epoch": 836} {"train_loss": -10.531402587890625, "global_step": 140505, "epoch": 836} {"train_loss": -10.640190124511719, "global_step": 140506, "epoch": 836} {"train_loss": -10.597084999084473, "global_step": 140507, "epoch": 836} {"train_loss": -10.379637718200684, "global_step": 140508, "epoch": 836} {"train_loss": -10.151442527770996, "global_step": 140509, "epoch": 836} {"train_loss": -10.571386337280273, "global_step": 140510, "epoch": 836} {"train_loss": -9.912333488464355, "global_step": 140511, "epoch": 836} {"train_loss": -10.535955429077148, "global_step": 140512, "epoch": 836} {"train_loss": -10.355497360229492, "global_step": 140513, "epoch": 836} {"train_loss": -9.754913330078125, "global_step": 140514, "epoch": 836} {"train_loss": -10.333324432373047, "global_step": 140515, "epoch": 836} {"train_loss": -9.963111877441406, "global_step": 140516, "epoch": 836} {"train_loss": -10.373756408691406, "global_step": 140517, "epoch": 836} {"train_loss": -10.486645698547363, "global_step": 140518, "epoch": 836} {"train_loss": -10.315924644470215, "global_step": 140519, "epoch": 836} {"train_loss": -10.647480964660645, "global_step": 140520, "epoch": 836} {"train_loss": -10.22665786743164, "global_step": 140521, "epoch": 836} {"train_loss": -10.721104621887207, "global_step": 140522, "epoch": 836} {"train_loss": -10.07641887664795, "global_step": 140523, "epoch": 836} {"train_loss": -10.508271217346191, "global_step": 140524, "epoch": 836} {"train_loss": -10.530126571655273, "global_step": 140525, "epoch": 836} {"train_loss": -10.29068374633789, "global_step": 140526, "epoch": 836} {"train_loss": -10.570738792419434, "global_step": 140527, "epoch": 836} {"train_loss": -10.5798978805542, "global_step": 140528, "epoch": 836} {"train_loss": -10.353995323181152, "global_step": 140529, "epoch": 836} {"train_loss": -10.380973815917969, "global_step": 140530, "epoch": 836} {"train_loss": -10.185907363891602, "global_step": 140531, "epoch": 836} {"train_loss": -10.635601043701172, "global_step": 140532, "epoch": 836} {"train_loss": -10.651805877685547, "global_step": 140533, "epoch": 836} {"train_loss": -10.469034194946289, "global_step": 140534, "epoch": 836} {"train_loss": -10.27621841430664, "global_step": 140535, "epoch": 836} {"train_loss": -10.750020980834961, "global_step": 140536, "epoch": 836} {"train_loss": -10.2400541305542, "global_step": 140537, "epoch": 836} {"train_loss": -10.74196720123291, "global_step": 140538, "epoch": 836} {"train_loss": -10.168828010559082, "global_step": 140539, "epoch": 836} {"train_loss": -10.235452651977539, "global_step": 140540, "epoch": 836} {"train_loss": -10.42759895324707, "global_step": 140541, "epoch": 836} {"train_loss": -10.238953590393066, "global_step": 140542, "epoch": 836} {"train_loss": -10.260930061340332, "global_step": 140543, "epoch": 836} {"train_loss": -10.230966567993164, "global_step": 140544, "epoch": 836} {"train_loss": -10.483821868896484, "global_step": 140545, "epoch": 836} {"train_loss": -10.429600715637207, "global_step": 140546, "epoch": 836} {"train_loss": -10.486632347106934, "global_step": 140547, "epoch": 836} {"train_loss": -10.571599960327148, "global_step": 140548, "epoch": 836} {"train_loss": -10.717307090759277, "global_step": 140549, "epoch": 836} {"train_loss": -9.997356414794922, "global_step": 140550, "epoch": 836} {"train_loss": -10.461792945861816, "global_step": 140551, "epoch": 836} {"train_loss": -10.097494125366211, "global_step": 140552, "epoch": 836} {"train_loss": -10.748957633972168, "global_step": 140553, "epoch": 836} {"train_loss": -10.602018356323242, "global_step": 140554, "epoch": 836} {"train_loss": -10.524251937866211, "global_step": 140555, "epoch": 836} {"train_loss": -10.575658798217773, "global_step": 140556, "epoch": 836} {"train_loss": -10.494370460510254, "global_step": 140557, "epoch": 836} {"train_loss": -10.549301147460938, "global_step": 140558, "epoch": 836} {"train_loss": -10.45445442199707, "global_step": 140559, "epoch": 836} {"train_loss": -10.522344589233398, "global_step": 140560, "epoch": 836} {"train_loss": -10.652045249938965, "global_step": 140561, "epoch": 836} {"train_loss": -10.240234375, "global_step": 140562, "epoch": 836} {"train_loss": -10.612854957580566, "global_step": 140563, "epoch": 836} {"train_loss": -10.561291694641113, "global_step": 140564, "epoch": 836} {"train_loss": -10.509932518005371, "global_step": 140565, "epoch": 836} {"train_loss": -10.545483589172363, "global_step": 140566, "epoch": 836} {"train_loss": -10.402654647827148, "global_step": 140567, "epoch": 836} {"train_loss": -10.437013626098633, "global_step": 140568, "epoch": 836} {"train_loss": -10.777835845947266, "global_step": 140569, "epoch": 836} {"train_loss": -10.497340202331543, "global_step": 140570, "epoch": 836} {"train_loss": -10.763204574584961, "global_step": 140571, "epoch": 836} {"train_loss": -10.74888801574707, "global_step": 140572, "epoch": 836} {"train_loss": -10.645734786987305, "global_step": 140573, "epoch": 836} {"train_loss": -10.530746459960938, "global_step": 140574, "epoch": 836} {"train_loss": -10.655593872070312, "global_step": 140575, "epoch": 836} {"train_loss": -10.59501838684082, "global_step": 140576, "epoch": 836} {"train_loss": -10.594650268554688, "global_step": 140577, "epoch": 836} {"train_loss": -10.647384643554688, "global_step": 140578, "epoch": 836} {"train_loss": -10.857784271240234, "global_step": 140579, "epoch": 836} {"train_loss": -10.44314193725586, "global_step": 140580, "epoch": 836} {"train_loss": -10.800718307495117, "global_step": 140581, "epoch": 836} {"train_loss": -10.835737228393555, "global_step": 140582, "epoch": 836} {"train_loss": -10.70922565460205, "global_step": 140583, "epoch": 836} {"train_loss": -11.116849899291992, "global_step": 140584, "epoch": 836} {"train_loss": -10.823756217956543, "global_step": 140585, "epoch": 836} {"train_loss": -10.928939819335938, "global_step": 140586, "epoch": 836} {"train_loss": -10.710412979125977, "global_step": 140587, "epoch": 836} {"train_loss": -10.70016098022461, "global_step": 140588, "epoch": 836} {"train_loss": -10.476922988891602, "global_step": 140589, "epoch": 836} {"train_loss": -10.75194263458252, "global_step": 140590, "epoch": 836} {"train_loss": -10.565851211547852, "global_step": 140591, "epoch": 836} {"train_loss": -11.001243591308594, "global_step": 140592, "epoch": 836} {"train_loss": -10.674480438232422, "global_step": 140593, "epoch": 836} {"train_loss": -10.467597961425781, "global_step": 140594, "epoch": 836} {"train_loss": -10.84527587890625, "global_step": 140595, "epoch": 836} {"train_loss": -10.003597259521484, "global_step": 140596, "epoch": 836} {"train_loss": -10.315006256103516, "global_step": 140597, "epoch": 836} {"train_loss": -10.848165512084961, "global_step": 140598, "epoch": 836} {"train_loss": -10.733709335327148, "global_step": 140599, "epoch": 836} {"train_loss": -10.318136215209961, "global_step": 140600, "epoch": 836} {"train_loss": -10.850385665893555, "global_step": 140601, "epoch": 836} {"train_loss": -10.111978530883789, "global_step": 140602, "epoch": 836} {"train_loss": -9.635429382324219, "global_step": 140603, "epoch": 836} {"train_loss": -10.288106918334961, "global_step": 140604, "epoch": 836} {"train_loss": -8.841682434082031, "global_step": 140605, "epoch": 836} {"train_loss": -10.204211235046387, "global_step": 140606, "epoch": 836} {"train_loss": -9.216103553771973, "global_step": 140607, "epoch": 836} {"train_loss": -9.622905731201172, "global_step": 140608, "epoch": 836} {"train_loss": -10.243436813354492, "global_step": 140609, "epoch": 836} {"train_loss": -9.970148086547852, "global_step": 140610, "epoch": 836} {"train_loss": -10.244951248168945, "global_step": 140611, "epoch": 836} {"train_loss": -10.071221351623535, "global_step": 140612, "epoch": 836} {"train_loss": -9.681742668151855, "global_step": 140613, "epoch": 836} {"train_loss": -10.46800422668457, "global_step": 140614, "epoch": 836} {"train_loss": -10.440605191957383, "global_step": 140615, "epoch": 836, "val_loss": 222500.46875} {"train_loss": -10.338202476501465, "global_step": 140616, "epoch": 837} {"train_loss": -10.288887023925781, "global_step": 140617, "epoch": 837} {"train_loss": -10.26995849609375, "global_step": 140618, "epoch": 837} {"train_loss": -10.020931243896484, "global_step": 140619, "epoch": 837} {"train_loss": -10.242148399353027, "global_step": 140620, "epoch": 837} {"train_loss": -10.226607322692871, "global_step": 140621, "epoch": 837} {"train_loss": -10.344619750976562, "global_step": 140622, "epoch": 837} {"train_loss": -10.419626235961914, "global_step": 140623, "epoch": 837} {"train_loss": -10.436285972595215, "global_step": 140624, "epoch": 837} {"train_loss": -10.334030151367188, "global_step": 140625, "epoch": 837} {"train_loss": -10.453459739685059, "global_step": 140626, "epoch": 837} {"train_loss": -10.399385452270508, "global_step": 140627, "epoch": 837} {"train_loss": -10.493160247802734, "global_step": 140628, "epoch": 837} {"train_loss": -10.54439640045166, "global_step": 140629, "epoch": 837} {"train_loss": -10.700789451599121, "global_step": 140630, "epoch": 837} {"train_loss": -10.46863842010498, "global_step": 140631, "epoch": 837} {"train_loss": -10.62424087524414, "global_step": 140632, "epoch": 837} {"train_loss": -10.667267799377441, "global_step": 140633, "epoch": 837} {"train_loss": -10.498858451843262, "global_step": 140634, "epoch": 837} {"train_loss": -10.674162864685059, "global_step": 140635, "epoch": 837} {"train_loss": -10.4157075881958, "global_step": 140636, "epoch": 837} {"train_loss": -10.555412292480469, "global_step": 140637, "epoch": 837} {"train_loss": -10.674560546875, "global_step": 140638, "epoch": 837} {"train_loss": -10.362632751464844, "global_step": 140639, "epoch": 837} {"train_loss": -10.950797080993652, "global_step": 140640, "epoch": 837} {"train_loss": -10.713512420654297, "global_step": 140641, "epoch": 837} {"train_loss": -10.511488914489746, "global_step": 140642, "epoch": 837} {"train_loss": -10.752758026123047, "global_step": 140643, "epoch": 837} {"train_loss": -10.69438362121582, "global_step": 140644, "epoch": 837} {"train_loss": -10.716452598571777, "global_step": 140645, "epoch": 837} {"train_loss": -10.759794235229492, "global_step": 140646, "epoch": 837} {"train_loss": -10.609064102172852, "global_step": 140647, "epoch": 837} {"train_loss": -10.75399398803711, "global_step": 140648, "epoch": 837} {"train_loss": -10.271034240722656, "global_step": 140649, "epoch": 837} {"train_loss": -10.589574813842773, "global_step": 140650, "epoch": 837} {"train_loss": -10.144706726074219, "global_step": 140651, "epoch": 837} {"train_loss": -10.388700485229492, "global_step": 140652, "epoch": 837} {"train_loss": -10.191922187805176, "global_step": 140653, "epoch": 837} {"train_loss": -10.352848052978516, "global_step": 140654, "epoch": 837} {"train_loss": -9.949625015258789, "global_step": 140655, "epoch": 837} {"train_loss": -10.187552452087402, "global_step": 140656, "epoch": 837} {"train_loss": -10.335542678833008, "global_step": 140657, "epoch": 837} {"train_loss": -10.200922012329102, "global_step": 140658, "epoch": 837} {"train_loss": -10.262249946594238, "global_step": 140659, "epoch": 837} {"train_loss": -9.698952674865723, "global_step": 140660, "epoch": 837} {"train_loss": -10.185192108154297, "global_step": 140661, "epoch": 837} {"train_loss": -9.776494979858398, "global_step": 140662, "epoch": 837} {"train_loss": -9.885534286499023, "global_step": 140663, "epoch": 837} {"train_loss": -10.153277397155762, "global_step": 140664, "epoch": 837} {"train_loss": -10.275087356567383, "global_step": 140665, "epoch": 837} {"train_loss": -10.720429420471191, "global_step": 140666, "epoch": 837} {"train_loss": -10.15231704711914, "global_step": 140667, "epoch": 837} {"train_loss": -10.64406681060791, "global_step": 140668, "epoch": 837} {"train_loss": -10.410765647888184, "global_step": 140669, "epoch": 837} {"train_loss": -10.476175308227539, "global_step": 140670, "epoch": 837} {"train_loss": -10.308290481567383, "global_step": 140671, "epoch": 837} {"train_loss": -10.773221969604492, "global_step": 140672, "epoch": 837} {"train_loss": -10.049179077148438, "global_step": 140673, "epoch": 837} {"train_loss": -10.400453567504883, "global_step": 140674, "epoch": 837} {"train_loss": -10.043346405029297, "global_step": 140675, "epoch": 837} {"train_loss": -10.663182258605957, "global_step": 140676, "epoch": 837} {"train_loss": -10.371614456176758, "global_step": 140677, "epoch": 837} {"train_loss": -10.587934494018555, "global_step": 140678, "epoch": 837} {"train_loss": -10.53585147857666, "global_step": 140679, "epoch": 837} {"train_loss": -10.308679580688477, "global_step": 140680, "epoch": 837} {"train_loss": -10.38461685180664, "global_step": 140681, "epoch": 837} {"train_loss": -10.50859260559082, "global_step": 140682, "epoch": 837} {"train_loss": -10.548187255859375, "global_step": 140683, "epoch": 837} {"train_loss": -10.547709465026855, "global_step": 140684, "epoch": 837} {"train_loss": -10.727848052978516, "global_step": 140685, "epoch": 837} {"train_loss": -10.3829927444458, "global_step": 140686, "epoch": 837} {"train_loss": -10.48287582397461, "global_step": 140687, "epoch": 837} {"train_loss": -10.6087646484375, "global_step": 140688, "epoch": 837} {"train_loss": -10.609960556030273, "global_step": 140689, "epoch": 837} {"train_loss": -10.616759300231934, "global_step": 140690, "epoch": 837} {"train_loss": -10.411069869995117, "global_step": 140691, "epoch": 837} {"train_loss": -10.282965660095215, "global_step": 140692, "epoch": 837} {"train_loss": -10.725730895996094, "global_step": 140693, "epoch": 837} {"train_loss": -10.512601852416992, "global_step": 140694, "epoch": 837} {"train_loss": -10.712505340576172, "global_step": 140695, "epoch": 837} {"train_loss": -10.506900787353516, "global_step": 140696, "epoch": 837} {"train_loss": -10.53554630279541, "global_step": 140697, "epoch": 837} {"train_loss": -10.585503578186035, "global_step": 140698, "epoch": 837} {"train_loss": -10.48275375366211, "global_step": 140699, "epoch": 837} {"train_loss": -10.474390029907227, "global_step": 140700, "epoch": 837} {"train_loss": -10.821277618408203, "global_step": 140701, "epoch": 837} {"train_loss": -10.388883590698242, "global_step": 140702, "epoch": 837} {"train_loss": -10.608672142028809, "global_step": 140703, "epoch": 837} {"train_loss": -10.524738311767578, "global_step": 140704, "epoch": 837} {"train_loss": -10.646224975585938, "global_step": 140705, "epoch": 837} {"train_loss": -10.603100776672363, "global_step": 140706, "epoch": 837} {"train_loss": -10.67949104309082, "global_step": 140707, "epoch": 837} {"train_loss": -10.781166076660156, "global_step": 140708, "epoch": 837} {"train_loss": -10.384669303894043, "global_step": 140709, "epoch": 837} {"train_loss": -10.947603225708008, "global_step": 140710, "epoch": 837} {"train_loss": -10.388582229614258, "global_step": 140711, "epoch": 837} {"train_loss": -10.606847763061523, "global_step": 140712, "epoch": 837} {"train_loss": -10.644661903381348, "global_step": 140713, "epoch": 837} {"train_loss": -10.421409606933594, "global_step": 140714, "epoch": 837} {"train_loss": -10.860021591186523, "global_step": 140715, "epoch": 837} {"train_loss": -10.431356430053711, "global_step": 140716, "epoch": 837} {"train_loss": -10.831811904907227, "global_step": 140717, "epoch": 837} {"train_loss": -10.589675903320312, "global_step": 140718, "epoch": 837} {"train_loss": -10.580293655395508, "global_step": 140719, "epoch": 837} {"train_loss": -10.73123836517334, "global_step": 140720, "epoch": 837} {"train_loss": -10.579952239990234, "global_step": 140721, "epoch": 837} {"train_loss": -10.447488784790039, "global_step": 140722, "epoch": 837} {"train_loss": -10.6617431640625, "global_step": 140723, "epoch": 837} {"train_loss": -10.629951477050781, "global_step": 140724, "epoch": 837} {"train_loss": -10.559770584106445, "global_step": 140725, "epoch": 837} {"train_loss": -10.177680969238281, "global_step": 140726, "epoch": 837} {"train_loss": -10.84716796875, "global_step": 140727, "epoch": 837} {"train_loss": -10.568880081176758, "global_step": 140728, "epoch": 837} {"train_loss": -10.761343955993652, "global_step": 140729, "epoch": 837} {"train_loss": -10.445600509643555, "global_step": 140730, "epoch": 837} {"train_loss": -10.53095817565918, "global_step": 140731, "epoch": 837} {"train_loss": -10.51412582397461, "global_step": 140732, "epoch": 837} {"train_loss": -10.519966125488281, "global_step": 140733, "epoch": 837} {"train_loss": -10.080081939697266, "global_step": 140734, "epoch": 837} {"train_loss": -10.432055473327637, "global_step": 140735, "epoch": 837} {"train_loss": -10.559596061706543, "global_step": 140736, "epoch": 837} {"train_loss": -10.364795684814453, "global_step": 140737, "epoch": 837} {"train_loss": -10.619001388549805, "global_step": 140738, "epoch": 837} {"train_loss": -10.497007369995117, "global_step": 140739, "epoch": 837} {"train_loss": -10.151615142822266, "global_step": 140740, "epoch": 837} {"train_loss": -10.374578475952148, "global_step": 140741, "epoch": 837} {"train_loss": -10.426875114440918, "global_step": 140742, "epoch": 837} {"train_loss": -10.401512145996094, "global_step": 140743, "epoch": 837} {"train_loss": -10.533060073852539, "global_step": 140744, "epoch": 837} {"train_loss": -10.385429382324219, "global_step": 140745, "epoch": 837} {"train_loss": -10.104389190673828, "global_step": 140746, "epoch": 837} {"train_loss": -10.415891647338867, "global_step": 140747, "epoch": 837} {"train_loss": -10.200475692749023, "global_step": 140748, "epoch": 837} {"train_loss": -10.810921669006348, "global_step": 140749, "epoch": 837} {"train_loss": -10.549233436584473, "global_step": 140750, "epoch": 837} {"train_loss": -10.238919258117676, "global_step": 140751, "epoch": 837} {"train_loss": -10.451560020446777, "global_step": 140752, "epoch": 837} {"train_loss": -10.43924331665039, "global_step": 140753, "epoch": 837} {"train_loss": -10.440765380859375, "global_step": 140754, "epoch": 837} {"train_loss": -10.309414863586426, "global_step": 140755, "epoch": 837} {"train_loss": -10.711252212524414, "global_step": 140756, "epoch": 837} {"train_loss": -10.511341094970703, "global_step": 140757, "epoch": 837} {"train_loss": -10.604032516479492, "global_step": 140758, "epoch": 837} {"train_loss": -10.654586791992188, "global_step": 140759, "epoch": 837} {"train_loss": -10.549714088439941, "global_step": 140760, "epoch": 837} {"train_loss": -10.768510818481445, "global_step": 140761, "epoch": 837} {"train_loss": -10.652849197387695, "global_step": 140762, "epoch": 837} {"train_loss": -10.650867462158203, "global_step": 140763, "epoch": 837} {"train_loss": -10.745620727539062, "global_step": 140764, "epoch": 837} {"train_loss": -10.573488235473633, "global_step": 140765, "epoch": 837} {"train_loss": -10.464456558227539, "global_step": 140766, "epoch": 837} {"train_loss": -10.860827445983887, "global_step": 140767, "epoch": 837} {"train_loss": -10.68886947631836, "global_step": 140768, "epoch": 837} {"train_loss": -10.918685913085938, "global_step": 140769, "epoch": 837} {"train_loss": -10.628561973571777, "global_step": 140770, "epoch": 837} {"train_loss": -10.868202209472656, "global_step": 140771, "epoch": 837} {"train_loss": -10.759922981262207, "global_step": 140772, "epoch": 837} {"train_loss": -10.73585033416748, "global_step": 140773, "epoch": 837} {"train_loss": -10.645843505859375, "global_step": 140774, "epoch": 837} {"train_loss": -10.719639778137207, "global_step": 140775, "epoch": 837} {"train_loss": -10.600570678710938, "global_step": 140776, "epoch": 837} {"train_loss": -10.788358688354492, "global_step": 140777, "epoch": 837} {"train_loss": -10.760841369628906, "global_step": 140778, "epoch": 837} {"train_loss": -11.032407760620117, "global_step": 140779, "epoch": 837} {"train_loss": -10.992684364318848, "global_step": 140780, "epoch": 837} {"train_loss": -10.49726676940918, "global_step": 140781, "epoch": 837} {"train_loss": -10.886768341064453, "global_step": 140782, "epoch": 837} {"train_loss": -10.508439779281616, "global_step": 140783, "epoch": 837, "val_loss": 225159.890625} {"train_loss": -10.599905014038086, "global_step": 140784, "epoch": 838} {"train_loss": -10.489734649658203, "global_step": 140785, "epoch": 838} {"train_loss": -10.751623153686523, "global_step": 140786, "epoch": 838} {"train_loss": -10.471502304077148, "global_step": 140787, "epoch": 838} {"train_loss": -10.858808517456055, "global_step": 140788, "epoch": 838} {"train_loss": -10.541176795959473, "global_step": 140789, "epoch": 838} {"train_loss": -10.527350425720215, "global_step": 140790, "epoch": 838} {"train_loss": -10.635866165161133, "global_step": 140791, "epoch": 838} {"train_loss": -10.7257080078125, "global_step": 140792, "epoch": 838} {"train_loss": -10.598711013793945, "global_step": 140793, "epoch": 838} {"train_loss": -10.829209327697754, "global_step": 140794, "epoch": 838} {"train_loss": -10.616912841796875, "global_step": 140795, "epoch": 838} {"train_loss": -10.371854782104492, "global_step": 140796, "epoch": 838} {"train_loss": -10.853090286254883, "global_step": 140797, "epoch": 838} {"train_loss": -10.646793365478516, "global_step": 140798, "epoch": 838} {"train_loss": -10.145121574401855, "global_step": 140799, "epoch": 838} {"train_loss": -10.805353164672852, "global_step": 140800, "epoch": 838} {"train_loss": -10.296979904174805, "global_step": 140801, "epoch": 838} {"train_loss": -10.162227630615234, "global_step": 140802, "epoch": 838} {"train_loss": -10.44332504272461, "global_step": 140803, "epoch": 838} {"train_loss": -10.598217964172363, "global_step": 140804, "epoch": 838} {"train_loss": -10.349990844726562, "global_step": 140805, "epoch": 838} {"train_loss": -10.694564819335938, "global_step": 140806, "epoch": 838} {"train_loss": -10.735088348388672, "global_step": 140807, "epoch": 838} {"train_loss": -10.666486740112305, "global_step": 140808, "epoch": 838} {"train_loss": -10.475898742675781, "global_step": 140809, "epoch": 838} {"train_loss": -10.543266296386719, "global_step": 140810, "epoch": 838} {"train_loss": -10.510997772216797, "global_step": 140811, "epoch": 838} {"train_loss": -10.34800910949707, "global_step": 140812, "epoch": 838} {"train_loss": -10.742740631103516, "global_step": 140813, "epoch": 838} {"train_loss": -10.2752685546875, "global_step": 140814, "epoch": 838} {"train_loss": -10.71158218383789, "global_step": 140815, "epoch": 838} {"train_loss": -10.472610473632812, "global_step": 140816, "epoch": 838} {"train_loss": -10.335067749023438, "global_step": 140817, "epoch": 838} {"train_loss": -10.665307998657227, "global_step": 140818, "epoch": 838} {"train_loss": -10.501171112060547, "global_step": 140819, "epoch": 838} {"train_loss": -10.627029418945312, "global_step": 140820, "epoch": 838} {"train_loss": -10.62147331237793, "global_step": 140821, "epoch": 838} {"train_loss": -10.632303237915039, "global_step": 140822, "epoch": 838} {"train_loss": -10.759246826171875, "global_step": 140823, "epoch": 838} {"train_loss": -10.445958137512207, "global_step": 140824, "epoch": 838} {"train_loss": -10.711309432983398, "global_step": 140825, "epoch": 838} {"train_loss": -10.616340637207031, "global_step": 140826, "epoch": 838} {"train_loss": -10.928550720214844, "global_step": 140827, "epoch": 838} {"train_loss": -10.67750358581543, "global_step": 140828, "epoch": 838} {"train_loss": -10.86461353302002, "global_step": 140829, "epoch": 838} {"train_loss": -10.770661354064941, "global_step": 140830, "epoch": 838} {"train_loss": -10.883133888244629, "global_step": 140831, "epoch": 838} {"train_loss": -10.781797409057617, "global_step": 140832, "epoch": 838} {"train_loss": -10.764728546142578, "global_step": 140833, "epoch": 838} {"train_loss": -10.735942840576172, "global_step": 140834, "epoch": 838} {"train_loss": -10.692874908447266, "global_step": 140835, "epoch": 838} {"train_loss": -10.698280334472656, "global_step": 140836, "epoch": 838} {"train_loss": -10.657615661621094, "global_step": 140837, "epoch": 838} {"train_loss": -10.695201873779297, "global_step": 140838, "epoch": 838} {"train_loss": -10.566055297851562, "global_step": 140839, "epoch": 838} {"train_loss": -10.882088661193848, "global_step": 140840, "epoch": 838} {"train_loss": -10.526910781860352, "global_step": 140841, "epoch": 838} {"train_loss": -10.565139770507812, "global_step": 140842, "epoch": 838} {"train_loss": -10.857948303222656, "global_step": 140843, "epoch": 838} {"train_loss": -10.48484992980957, "global_step": 140844, "epoch": 838} {"train_loss": -9.99543571472168, "global_step": 140845, "epoch": 838} {"train_loss": -10.760480880737305, "global_step": 140846, "epoch": 838} {"train_loss": -10.536693572998047, "global_step": 140847, "epoch": 838} {"train_loss": -10.761841773986816, "global_step": 140848, "epoch": 838} {"train_loss": -10.21252155303955, "global_step": 140849, "epoch": 838} {"train_loss": -10.409745216369629, "global_step": 140850, "epoch": 838} {"train_loss": -10.410887718200684, "global_step": 140851, "epoch": 838} {"train_loss": -10.24398422241211, "global_step": 140852, "epoch": 838} {"train_loss": -10.651408195495605, "global_step": 140853, "epoch": 838} {"train_loss": -10.010597229003906, "global_step": 140854, "epoch": 838} {"train_loss": -10.145195007324219, "global_step": 140855, "epoch": 838} {"train_loss": -10.186485290527344, "global_step": 140856, "epoch": 838} {"train_loss": -8.888069152832031, "global_step": 140857, "epoch": 838} {"train_loss": -10.323606491088867, "global_step": 140858, "epoch": 838} {"train_loss": -9.927189826965332, "global_step": 140859, "epoch": 838} {"train_loss": -9.974462509155273, "global_step": 140860, "epoch": 838} {"train_loss": -9.647764205932617, "global_step": 140861, "epoch": 838} {"train_loss": -10.102457046508789, "global_step": 140862, "epoch": 838} {"train_loss": -10.195609092712402, "global_step": 140863, "epoch": 838} {"train_loss": -9.9998140335083, "global_step": 140864, "epoch": 838} {"train_loss": -10.395907402038574, "global_step": 140865, "epoch": 838} {"train_loss": -10.091442108154297, "global_step": 140866, "epoch": 838} {"train_loss": -10.323801040649414, "global_step": 140867, "epoch": 838} {"train_loss": -10.233062744140625, "global_step": 140868, "epoch": 838} {"train_loss": -10.589033126831055, "global_step": 140869, "epoch": 838} {"train_loss": -10.460771560668945, "global_step": 140870, "epoch": 838} {"train_loss": -10.54831600189209, "global_step": 140871, "epoch": 838} {"train_loss": -10.366548538208008, "global_step": 140872, "epoch": 838} {"train_loss": -9.675214767456055, "global_step": 140873, "epoch": 838} {"train_loss": -10.634848594665527, "global_step": 140874, "epoch": 838} {"train_loss": -9.822991371154785, "global_step": 140875, "epoch": 838} {"train_loss": -10.099234580993652, "global_step": 140876, "epoch": 838} {"train_loss": -10.384604454040527, "global_step": 140877, "epoch": 838} {"train_loss": -10.197470664978027, "global_step": 140878, "epoch": 838} {"train_loss": -10.365108489990234, "global_step": 140879, "epoch": 838} {"train_loss": -10.557022094726562, "global_step": 140880, "epoch": 838} {"train_loss": -10.327120780944824, "global_step": 140881, "epoch": 838} {"train_loss": -10.569398880004883, "global_step": 140882, "epoch": 838} {"train_loss": -10.342620849609375, "global_step": 140883, "epoch": 838} {"train_loss": -10.557260513305664, "global_step": 140884, "epoch": 838} {"train_loss": -10.768059730529785, "global_step": 140885, "epoch": 838} {"train_loss": -10.23532485961914, "global_step": 140886, "epoch": 838} {"train_loss": -10.514519691467285, "global_step": 140887, "epoch": 838} {"train_loss": -10.374971389770508, "global_step": 140888, "epoch": 838} {"train_loss": -10.65915298461914, "global_step": 140889, "epoch": 838} {"train_loss": -10.774524688720703, "global_step": 140890, "epoch": 838} {"train_loss": -10.767019271850586, "global_step": 140891, "epoch": 838} {"train_loss": -10.776275634765625, "global_step": 140892, "epoch": 838} {"train_loss": -10.62276554107666, "global_step": 140893, "epoch": 838} {"train_loss": -10.509026527404785, "global_step": 140894, "epoch": 838} {"train_loss": -10.501258850097656, "global_step": 140895, "epoch": 838} {"train_loss": -10.852676391601562, "global_step": 140896, "epoch": 838} {"train_loss": -10.328720092773438, "global_step": 140897, "epoch": 838} {"train_loss": -10.979887008666992, "global_step": 140898, "epoch": 838} {"train_loss": -10.509231567382812, "global_step": 140899, "epoch": 838} {"train_loss": -10.711587905883789, "global_step": 140900, "epoch": 838} {"train_loss": -10.250364303588867, "global_step": 140901, "epoch": 838} {"train_loss": -10.728221893310547, "global_step": 140902, "epoch": 838} {"train_loss": -10.426898956298828, "global_step": 140903, "epoch": 838} {"train_loss": -10.580574035644531, "global_step": 140904, "epoch": 838} {"train_loss": -10.756778717041016, "global_step": 140905, "epoch": 838} {"train_loss": -10.405853271484375, "global_step": 140906, "epoch": 838} {"train_loss": -10.800371170043945, "global_step": 140907, "epoch": 838} {"train_loss": -10.589107513427734, "global_step": 140908, "epoch": 838} {"train_loss": -10.56903076171875, "global_step": 140909, "epoch": 838} {"train_loss": -10.593780517578125, "global_step": 140910, "epoch": 838} {"train_loss": -10.732004165649414, "global_step": 140911, "epoch": 838} {"train_loss": -10.774484634399414, "global_step": 140912, "epoch": 838} {"train_loss": -10.50898551940918, "global_step": 140913, "epoch": 838} {"train_loss": -10.74644660949707, "global_step": 140914, "epoch": 838} {"train_loss": -10.794748306274414, "global_step": 140915, "epoch": 838} {"train_loss": -10.694860458374023, "global_step": 140916, "epoch": 838} {"train_loss": -10.87993049621582, "global_step": 140917, "epoch": 838} {"train_loss": -10.949655532836914, "global_step": 140918, "epoch": 838} {"train_loss": -10.76054573059082, "global_step": 140919, "epoch": 838} {"train_loss": -10.851259231567383, "global_step": 140920, "epoch": 838} {"train_loss": -10.79588508605957, "global_step": 140921, "epoch": 838} {"train_loss": -10.610513687133789, "global_step": 140922, "epoch": 838} {"train_loss": -10.687511444091797, "global_step": 140923, "epoch": 838} {"train_loss": -10.776365280151367, "global_step": 140924, "epoch": 838} {"train_loss": -10.948909759521484, "global_step": 140925, "epoch": 838} {"train_loss": -10.73241901397705, "global_step": 140926, "epoch": 838} {"train_loss": -10.76171875, "global_step": 140927, "epoch": 838} {"train_loss": -10.578802108764648, "global_step": 140928, "epoch": 838} {"train_loss": -10.752904891967773, "global_step": 140929, "epoch": 838} {"train_loss": -10.251199722290039, "global_step": 140930, "epoch": 838} {"train_loss": -10.838163375854492, "global_step": 140931, "epoch": 838} {"train_loss": -10.484003067016602, "global_step": 140932, "epoch": 838} {"train_loss": -10.605207443237305, "global_step": 140933, "epoch": 838} {"train_loss": -10.790522575378418, "global_step": 140934, "epoch": 838} {"train_loss": -10.685786247253418, "global_step": 140935, "epoch": 838} {"train_loss": -10.644746780395508, "global_step": 140936, "epoch": 838} {"train_loss": -10.609244346618652, "global_step": 140937, "epoch": 838} {"train_loss": -10.610379219055176, "global_step": 140938, "epoch": 838} {"train_loss": -10.617757797241211, "global_step": 140939, "epoch": 838} {"train_loss": -10.985885620117188, "global_step": 140940, "epoch": 838} {"train_loss": -10.950559616088867, "global_step": 140941, "epoch": 838} {"train_loss": -10.505029678344727, "global_step": 140942, "epoch": 838} {"train_loss": -10.858903884887695, "global_step": 140943, "epoch": 838} {"train_loss": -10.878249168395996, "global_step": 140944, "epoch": 838} {"train_loss": -10.860671043395996, "global_step": 140945, "epoch": 838} {"train_loss": -10.451642990112305, "global_step": 140946, "epoch": 838} {"train_loss": -10.789379119873047, "global_step": 140947, "epoch": 838} {"train_loss": -10.598819732666016, "global_step": 140948, "epoch": 838} {"train_loss": -10.431331634521484, "global_step": 140949, "epoch": 838} {"train_loss": -10.501117706298828, "global_step": 140950, "epoch": 838} {"train_loss": -10.54663824467432, "global_step": 140951, "epoch": 838, "val_loss": 224207.359375} {"train_loss": -10.067492485046387, "global_step": 140952, "epoch": 839} {"train_loss": -10.149521827697754, "global_step": 140953, "epoch": 839} {"train_loss": -10.388769149780273, "global_step": 140954, "epoch": 839} {"train_loss": -9.708456993103027, "global_step": 140955, "epoch": 839} {"train_loss": -10.669755935668945, "global_step": 140956, "epoch": 839} {"train_loss": -10.276926040649414, "global_step": 140957, "epoch": 839} {"train_loss": -9.91865062713623, "global_step": 140958, "epoch": 839} {"train_loss": -10.693235397338867, "global_step": 140959, "epoch": 839} {"train_loss": -10.256783485412598, "global_step": 140960, "epoch": 839} {"train_loss": -10.469196319580078, "global_step": 140961, "epoch": 839} {"train_loss": -10.22485065460205, "global_step": 140962, "epoch": 839} {"train_loss": -9.932806015014648, "global_step": 140963, "epoch": 839} {"train_loss": -10.684124946594238, "global_step": 140964, "epoch": 839} {"train_loss": -9.418119430541992, "global_step": 140965, "epoch": 839} {"train_loss": -10.217836380004883, "global_step": 140966, "epoch": 839} {"train_loss": -10.034263610839844, "global_step": 140967, "epoch": 839} {"train_loss": -10.236330032348633, "global_step": 140968, "epoch": 839} {"train_loss": -10.415200233459473, "global_step": 140969, "epoch": 839} {"train_loss": -10.097343444824219, "global_step": 140970, "epoch": 839} {"train_loss": -9.820039749145508, "global_step": 140971, "epoch": 839} {"train_loss": -10.321513175964355, "global_step": 140972, "epoch": 839} {"train_loss": -9.558418273925781, "global_step": 140973, "epoch": 839} {"train_loss": -9.871330261230469, "global_step": 140974, "epoch": 839} {"train_loss": -9.9976167678833, "global_step": 140975, "epoch": 839} {"train_loss": -9.875616073608398, "global_step": 140976, "epoch": 839} {"train_loss": -10.139842987060547, "global_step": 140977, "epoch": 839} {"train_loss": -9.841386795043945, "global_step": 140978, "epoch": 839} {"train_loss": -9.78466796875, "global_step": 140979, "epoch": 839} {"train_loss": -10.275368690490723, "global_step": 140980, "epoch": 839} {"train_loss": -9.85793685913086, "global_step": 140981, "epoch": 839} {"train_loss": -10.103446960449219, "global_step": 140982, "epoch": 839} {"train_loss": -10.190460205078125, "global_step": 140983, "epoch": 839} {"train_loss": -10.104942321777344, "global_step": 140984, "epoch": 839} {"train_loss": -9.32077407836914, "global_step": 140985, "epoch": 839} {"train_loss": -10.364290237426758, "global_step": 140986, "epoch": 839} {"train_loss": -10.238883972167969, "global_step": 140987, "epoch": 839} {"train_loss": -9.62110424041748, "global_step": 140988, "epoch": 839} {"train_loss": -10.142644882202148, "global_step": 140989, "epoch": 839} {"train_loss": -10.34738826751709, "global_step": 140990, "epoch": 839} {"train_loss": -9.935796737670898, "global_step": 140991, "epoch": 839} {"train_loss": -10.291302680969238, "global_step": 140992, "epoch": 839} {"train_loss": -10.220569610595703, "global_step": 140993, "epoch": 839} {"train_loss": -10.39651107788086, "global_step": 140994, "epoch": 839} {"train_loss": -10.624460220336914, "global_step": 140995, "epoch": 839} {"train_loss": -10.268258094787598, "global_step": 140996, "epoch": 839} {"train_loss": -10.285001754760742, "global_step": 140997, "epoch": 839} {"train_loss": -10.445758819580078, "global_step": 140998, "epoch": 839} {"train_loss": -10.457648277282715, "global_step": 140999, "epoch": 839} {"train_loss": -10.54427719116211, "global_step": 141000, "epoch": 839} {"train_loss": -10.45868968963623, "global_step": 141001, "epoch": 839} {"train_loss": -10.36100959777832, "global_step": 141002, "epoch": 839} {"train_loss": -10.444077491760254, "global_step": 141003, "epoch": 839} {"train_loss": -10.572433471679688, "global_step": 141004, "epoch": 839} {"train_loss": -10.438358306884766, "global_step": 141005, "epoch": 839} {"train_loss": -10.520334243774414, "global_step": 141006, "epoch": 839} {"train_loss": -10.561744689941406, "global_step": 141007, "epoch": 839} {"train_loss": -10.531417846679688, "global_step": 141008, "epoch": 839} {"train_loss": -10.313547134399414, "global_step": 141009, "epoch": 839} {"train_loss": -10.52071762084961, "global_step": 141010, "epoch": 839} {"train_loss": -10.525486946105957, "global_step": 141011, "epoch": 839} {"train_loss": -10.500954627990723, "global_step": 141012, "epoch": 839} {"train_loss": -9.787755966186523, "global_step": 141013, "epoch": 839} {"train_loss": -9.982210159301758, "global_step": 141014, "epoch": 839} {"train_loss": -10.616108894348145, "global_step": 141015, "epoch": 839} {"train_loss": -10.185949325561523, "global_step": 141016, "epoch": 839} {"train_loss": -10.251832008361816, "global_step": 141017, "epoch": 839} {"train_loss": -10.223995208740234, "global_step": 141018, "epoch": 839} {"train_loss": -10.469399452209473, "global_step": 141019, "epoch": 839} {"train_loss": -10.512781143188477, "global_step": 141020, "epoch": 839} {"train_loss": -10.340530395507812, "global_step": 141021, "epoch": 839} {"train_loss": -10.536738395690918, "global_step": 141022, "epoch": 839} {"train_loss": -10.198559761047363, "global_step": 141023, "epoch": 839} {"train_loss": -10.525860786437988, "global_step": 141024, "epoch": 839} {"train_loss": -10.259809494018555, "global_step": 141025, "epoch": 839} {"train_loss": -10.41804313659668, "global_step": 141026, "epoch": 839} {"train_loss": -10.60062026977539, "global_step": 141027, "epoch": 839} {"train_loss": -10.382589340209961, "global_step": 141028, "epoch": 839} {"train_loss": -10.516180038452148, "global_step": 141029, "epoch": 839} {"train_loss": -10.488560676574707, "global_step": 141030, "epoch": 839} {"train_loss": -10.451028823852539, "global_step": 141031, "epoch": 839} {"train_loss": -10.629914283752441, "global_step": 141032, "epoch": 839} {"train_loss": -10.582621574401855, "global_step": 141033, "epoch": 839} {"train_loss": -10.53136920928955, "global_step": 141034, "epoch": 839} {"train_loss": -10.637303352355957, "global_step": 141035, "epoch": 839} {"train_loss": -10.685249328613281, "global_step": 141036, "epoch": 839} {"train_loss": -10.450538635253906, "global_step": 141037, "epoch": 839} {"train_loss": -10.696958541870117, "global_step": 141038, "epoch": 839} {"train_loss": -10.230493545532227, "global_step": 141039, "epoch": 839} {"train_loss": -10.525402069091797, "global_step": 141040, "epoch": 839} {"train_loss": -10.33503246307373, "global_step": 141041, "epoch": 839} {"train_loss": -10.457387924194336, "global_step": 141042, "epoch": 839} {"train_loss": -10.530309677124023, "global_step": 141043, "epoch": 839} {"train_loss": -10.561616897583008, "global_step": 141044, "epoch": 839} {"train_loss": -10.755398750305176, "global_step": 141045, "epoch": 839} {"train_loss": -10.416322708129883, "global_step": 141046, "epoch": 839} {"train_loss": -10.537801742553711, "global_step": 141047, "epoch": 839} {"train_loss": -10.715087890625, "global_step": 141048, "epoch": 839} {"train_loss": -10.429121017456055, "global_step": 141049, "epoch": 839} {"train_loss": -10.559284210205078, "global_step": 141050, "epoch": 839} {"train_loss": -10.541638374328613, "global_step": 141051, "epoch": 839} {"train_loss": -10.491233825683594, "global_step": 141052, "epoch": 839} {"train_loss": -10.553915023803711, "global_step": 141053, "epoch": 839} {"train_loss": -10.501724243164062, "global_step": 141054, "epoch": 839} {"train_loss": -10.68160629272461, "global_step": 141055, "epoch": 839} {"train_loss": -10.59847640991211, "global_step": 141056, "epoch": 839} {"train_loss": -10.446022987365723, "global_step": 141057, "epoch": 839} {"train_loss": -10.287389755249023, "global_step": 141058, "epoch": 839} {"train_loss": -9.984562873840332, "global_step": 141059, "epoch": 839} {"train_loss": -10.933144569396973, "global_step": 141060, "epoch": 839} {"train_loss": -9.511494636535645, "global_step": 141061, "epoch": 839} {"train_loss": -10.247084617614746, "global_step": 141062, "epoch": 839} {"train_loss": -10.175899505615234, "global_step": 141063, "epoch": 839} {"train_loss": -9.897979736328125, "global_step": 141064, "epoch": 839} {"train_loss": -10.844686508178711, "global_step": 141065, "epoch": 839} {"train_loss": -10.37769889831543, "global_step": 141066, "epoch": 839} {"train_loss": -10.61702823638916, "global_step": 141067, "epoch": 839} {"train_loss": -10.456193923950195, "global_step": 141068, "epoch": 839} {"train_loss": -10.147466659545898, "global_step": 141069, "epoch": 839} {"train_loss": -10.735448837280273, "global_step": 141070, "epoch": 839} {"train_loss": -10.07591724395752, "global_step": 141071, "epoch": 839} {"train_loss": -10.275359153747559, "global_step": 141072, "epoch": 839} {"train_loss": -9.375763893127441, "global_step": 141073, "epoch": 839} {"train_loss": -9.961657524108887, "global_step": 141074, "epoch": 839} {"train_loss": -10.002867698669434, "global_step": 141075, "epoch": 839} {"train_loss": -10.297760009765625, "global_step": 141076, "epoch": 839} {"train_loss": -9.768848419189453, "global_step": 141077, "epoch": 839} {"train_loss": -10.3878173828125, "global_step": 141078, "epoch": 839} {"train_loss": -9.559821128845215, "global_step": 141079, "epoch": 839} {"train_loss": -9.688142776489258, "global_step": 141080, "epoch": 839} {"train_loss": -9.723268508911133, "global_step": 141081, "epoch": 839} {"train_loss": -9.585150718688965, "global_step": 141082, "epoch": 839} {"train_loss": -9.597026824951172, "global_step": 141083, "epoch": 839} {"train_loss": -8.85348892211914, "global_step": 141084, "epoch": 839} {"train_loss": -10.206568717956543, "global_step": 141085, "epoch": 839} {"train_loss": -8.720434188842773, "global_step": 141086, "epoch": 839} {"train_loss": -9.743050575256348, "global_step": 141087, "epoch": 839} {"train_loss": -10.341878890991211, "global_step": 141088, "epoch": 839} {"train_loss": -9.744043350219727, "global_step": 141089, "epoch": 839} {"train_loss": -9.827865600585938, "global_step": 141090, "epoch": 839} {"train_loss": -9.416463851928711, "global_step": 141091, "epoch": 839} {"train_loss": -10.038801193237305, "global_step": 141092, "epoch": 839} {"train_loss": -9.560538291931152, "global_step": 141093, "epoch": 839} {"train_loss": -9.771864891052246, "global_step": 141094, "epoch": 839} {"train_loss": -10.052713394165039, "global_step": 141095, "epoch": 839} {"train_loss": -9.902271270751953, "global_step": 141096, "epoch": 839} {"train_loss": -10.353995323181152, "global_step": 141097, "epoch": 839} {"train_loss": -9.853214263916016, "global_step": 141098, "epoch": 839} {"train_loss": -10.175182342529297, "global_step": 141099, "epoch": 839} {"train_loss": -9.973994255065918, "global_step": 141100, "epoch": 839} {"train_loss": -9.962946891784668, "global_step": 141101, "epoch": 839} {"train_loss": -10.278945922851562, "global_step": 141102, "epoch": 839} {"train_loss": -10.138509750366211, "global_step": 141103, "epoch": 839} {"train_loss": -10.168792724609375, "global_step": 141104, "epoch": 839} {"train_loss": -10.180130004882812, "global_step": 141105, "epoch": 839} {"train_loss": -10.205639839172363, "global_step": 141106, "epoch": 839} {"train_loss": -10.145462989807129, "global_step": 141107, "epoch": 839} {"train_loss": -10.131325721740723, "global_step": 141108, "epoch": 839} {"train_loss": -10.34733772277832, "global_step": 141109, "epoch": 839} {"train_loss": -10.428104400634766, "global_step": 141110, "epoch": 839} {"train_loss": -10.403861045837402, "global_step": 141111, "epoch": 839} {"train_loss": -10.225292205810547, "global_step": 141112, "epoch": 839} {"train_loss": -10.200756072998047, "global_step": 141113, "epoch": 839} {"train_loss": -10.339125633239746, "global_step": 141114, "epoch": 839} {"train_loss": -10.362525939941406, "global_step": 141115, "epoch": 839} {"train_loss": -10.365789413452148, "global_step": 141116, "epoch": 839} {"train_loss": -10.544690132141113, "global_step": 141117, "epoch": 839} {"train_loss": -10.503345489501953, "global_step": 141118, "epoch": 839} {"train_loss": -10.227837585267567, "global_step": 141119, "epoch": 839, "val_loss": 226149.96875} {"train_loss": -10.641963005065918, "global_step": 141120, "epoch": 840} {"train_loss": -10.558445930480957, "global_step": 141121, "epoch": 840} {"train_loss": -10.781072616577148, "global_step": 141122, "epoch": 840} {"train_loss": -10.584423065185547, "global_step": 141123, "epoch": 840} {"train_loss": -10.726078033447266, "global_step": 141124, "epoch": 840} {"train_loss": -10.621325492858887, "global_step": 141125, "epoch": 840} {"train_loss": -10.475625991821289, "global_step": 141126, "epoch": 840} {"train_loss": -10.554563522338867, "global_step": 141127, "epoch": 840} {"train_loss": -10.563791275024414, "global_step": 141128, "epoch": 840} {"train_loss": -10.72884464263916, "global_step": 141129, "epoch": 840} {"train_loss": -10.876812934875488, "global_step": 141130, "epoch": 840} {"train_loss": -10.601959228515625, "global_step": 141131, "epoch": 840} {"train_loss": -10.802276611328125, "global_step": 141132, "epoch": 840} {"train_loss": -10.495344161987305, "global_step": 141133, "epoch": 840} {"train_loss": -10.784780502319336, "global_step": 141134, "epoch": 840} {"train_loss": -10.697897911071777, "global_step": 141135, "epoch": 840} {"train_loss": -10.791345596313477, "global_step": 141136, "epoch": 840} {"train_loss": -10.595060348510742, "global_step": 141137, "epoch": 840} {"train_loss": -10.860233306884766, "global_step": 141138, "epoch": 840} {"train_loss": -11.068084716796875, "global_step": 141139, "epoch": 840} {"train_loss": -10.911375045776367, "global_step": 141140, "epoch": 840} {"train_loss": -10.800747871398926, "global_step": 141141, "epoch": 840} {"train_loss": -10.874086380004883, "global_step": 141142, "epoch": 840} {"train_loss": -10.510943412780762, "global_step": 141143, "epoch": 840} {"train_loss": -10.775874137878418, "global_step": 141144, "epoch": 840} {"train_loss": -10.905289649963379, "global_step": 141145, "epoch": 840} {"train_loss": -10.950784683227539, "global_step": 141146, "epoch": 840} {"train_loss": -10.719938278198242, "global_step": 141147, "epoch": 840} {"train_loss": -11.113195419311523, "global_step": 141148, "epoch": 840} {"train_loss": -10.728885650634766, "global_step": 141149, "epoch": 840} {"train_loss": -10.83327865600586, "global_step": 141150, "epoch": 840} {"train_loss": -10.791839599609375, "global_step": 141151, "epoch": 840} {"train_loss": -10.947284698486328, "global_step": 141152, "epoch": 840} {"train_loss": -10.777932167053223, "global_step": 141153, "epoch": 840} {"train_loss": -10.612794876098633, "global_step": 141154, "epoch": 840} {"train_loss": -11.09323501586914, "global_step": 141155, "epoch": 840} {"train_loss": -10.500640869140625, "global_step": 141156, "epoch": 840} {"train_loss": -10.541566848754883, "global_step": 141157, "epoch": 840} {"train_loss": -11.083045959472656, "global_step": 141158, "epoch": 840} {"train_loss": -10.023476600646973, "global_step": 141159, "epoch": 840} {"train_loss": -9.400580406188965, "global_step": 141160, "epoch": 840} {"train_loss": -10.658710479736328, "global_step": 141161, "epoch": 840} {"train_loss": -8.888900756835938, "global_step": 141162, "epoch": 840} {"train_loss": -9.626039505004883, "global_step": 141163, "epoch": 840} {"train_loss": -10.852941513061523, "global_step": 141164, "epoch": 840} {"train_loss": -8.51955795288086, "global_step": 141165, "epoch": 840} {"train_loss": -10.73137378692627, "global_step": 141166, "epoch": 840} {"train_loss": -8.360143661499023, "global_step": 141167, "epoch": 840} {"train_loss": -9.587288856506348, "global_step": 141168, "epoch": 840} {"train_loss": -8.93778133392334, "global_step": 141169, "epoch": 840} {"train_loss": -9.675397872924805, "global_step": 141170, "epoch": 840} {"train_loss": -9.468175888061523, "global_step": 141171, "epoch": 840} {"train_loss": -9.443937301635742, "global_step": 141172, "epoch": 840} {"train_loss": -9.663772583007812, "global_step": 141173, "epoch": 840} {"train_loss": -9.528055191040039, "global_step": 141174, "epoch": 840} {"train_loss": -9.528282165527344, "global_step": 141175, "epoch": 840} {"train_loss": -9.171680450439453, "global_step": 141176, "epoch": 840} {"train_loss": -10.061656951904297, "global_step": 141177, "epoch": 840} {"train_loss": -10.074369430541992, "global_step": 141178, "epoch": 840} {"train_loss": -9.987438201904297, "global_step": 141179, "epoch": 840} {"train_loss": -9.869410514831543, "global_step": 141180, "epoch": 840} {"train_loss": -9.893048286437988, "global_step": 141181, "epoch": 840} {"train_loss": -10.147819519042969, "global_step": 141182, "epoch": 840} {"train_loss": -10.289536476135254, "global_step": 141183, "epoch": 840} {"train_loss": -10.119218826293945, "global_step": 141184, "epoch": 840} {"train_loss": -10.298959732055664, "global_step": 141185, "epoch": 840} {"train_loss": -10.016487121582031, "global_step": 141186, "epoch": 840} {"train_loss": -10.206600189208984, "global_step": 141187, "epoch": 840} {"train_loss": -10.242477416992188, "global_step": 141188, "epoch": 840} {"train_loss": -10.199361801147461, "global_step": 141189, "epoch": 840} {"train_loss": -10.209149360656738, "global_step": 141190, "epoch": 840} {"train_loss": -10.444377899169922, "global_step": 141191, "epoch": 840} {"train_loss": -10.294769287109375, "global_step": 141192, "epoch": 840} {"train_loss": -10.312044143676758, "global_step": 141193, "epoch": 840} {"train_loss": -10.104348182678223, "global_step": 141194, "epoch": 840} {"train_loss": -10.452664375305176, "global_step": 141195, "epoch": 840} {"train_loss": -10.307239532470703, "global_step": 141196, "epoch": 840} {"train_loss": -10.50300407409668, "global_step": 141197, "epoch": 840} {"train_loss": -10.465248107910156, "global_step": 141198, "epoch": 840} {"train_loss": -10.447274208068848, "global_step": 141199, "epoch": 840} {"train_loss": -10.425029754638672, "global_step": 141200, "epoch": 840} {"train_loss": -10.421859741210938, "global_step": 141201, "epoch": 840} {"train_loss": -10.51575756072998, "global_step": 141202, "epoch": 840} {"train_loss": -10.258224487304688, "global_step": 141203, "epoch": 840} {"train_loss": -10.58182144165039, "global_step": 141204, "epoch": 840} {"train_loss": -10.667777061462402, "global_step": 141205, "epoch": 840} {"train_loss": -10.560628890991211, "global_step": 141206, "epoch": 840} {"train_loss": -10.70872688293457, "global_step": 141207, "epoch": 840} {"train_loss": -10.643519401550293, "global_step": 141208, "epoch": 840} {"train_loss": -10.38876724243164, "global_step": 141209, "epoch": 840} {"train_loss": -10.530059814453125, "global_step": 141210, "epoch": 840} {"train_loss": -10.702350616455078, "global_step": 141211, "epoch": 840} {"train_loss": -10.653409957885742, "global_step": 141212, "epoch": 840} {"train_loss": -10.851112365722656, "global_step": 141213, "epoch": 840} {"train_loss": -10.533998489379883, "global_step": 141214, "epoch": 840} {"train_loss": -10.847676277160645, "global_step": 141215, "epoch": 840} {"train_loss": -10.766980171203613, "global_step": 141216, "epoch": 840} {"train_loss": -10.968782424926758, "global_step": 141217, "epoch": 840} {"train_loss": -10.799978256225586, "global_step": 141218, "epoch": 840} {"train_loss": -10.712303161621094, "global_step": 141219, "epoch": 840} {"train_loss": -10.76713752746582, "global_step": 141220, "epoch": 840} {"train_loss": -10.964171409606934, "global_step": 141221, "epoch": 840} {"train_loss": -10.76900863647461, "global_step": 141222, "epoch": 840} {"train_loss": -10.699929237365723, "global_step": 141223, "epoch": 840} {"train_loss": -10.719986915588379, "global_step": 141224, "epoch": 840} {"train_loss": -10.519596099853516, "global_step": 141225, "epoch": 840} {"train_loss": -10.7265625, "global_step": 141226, "epoch": 840} {"train_loss": -10.981783866882324, "global_step": 141227, "epoch": 840} {"train_loss": -11.046550750732422, "global_step": 141228, "epoch": 840} {"train_loss": -10.662986755371094, "global_step": 141229, "epoch": 840} {"train_loss": -10.748391151428223, "global_step": 141230, "epoch": 840} {"train_loss": -10.64858627319336, "global_step": 141231, "epoch": 840} {"train_loss": -10.424077987670898, "global_step": 141232, "epoch": 840} {"train_loss": -10.683655738830566, "global_step": 141233, "epoch": 840} {"train_loss": -10.46205997467041, "global_step": 141234, "epoch": 840} {"train_loss": -10.993551254272461, "global_step": 141235, "epoch": 840} {"train_loss": -10.80721664428711, "global_step": 141236, "epoch": 840} {"train_loss": -10.834587097167969, "global_step": 141237, "epoch": 840} {"train_loss": -10.60720443725586, "global_step": 141238, "epoch": 840} {"train_loss": -10.35949993133545, "global_step": 141239, "epoch": 840} {"train_loss": -10.917909622192383, "global_step": 141240, "epoch": 840} {"train_loss": -10.709961891174316, "global_step": 141241, "epoch": 840} {"train_loss": -10.99432373046875, "global_step": 141242, "epoch": 840} {"train_loss": -10.712732315063477, "global_step": 141243, "epoch": 840} {"train_loss": -10.930858612060547, "global_step": 141244, "epoch": 840} {"train_loss": -10.893896102905273, "global_step": 141245, "epoch": 840} {"train_loss": -10.869039535522461, "global_step": 141246, "epoch": 840} {"train_loss": -10.798395156860352, "global_step": 141247, "epoch": 840} {"train_loss": -10.996288299560547, "global_step": 141248, "epoch": 840} {"train_loss": -10.768192291259766, "global_step": 141249, "epoch": 840} {"train_loss": -10.919975280761719, "global_step": 141250, "epoch": 840} {"train_loss": -10.91679859161377, "global_step": 141251, "epoch": 840} {"train_loss": -10.66772747039795, "global_step": 141252, "epoch": 840} {"train_loss": -10.861663818359375, "global_step": 141253, "epoch": 840} {"train_loss": -10.832868576049805, "global_step": 141254, "epoch": 840} {"train_loss": -10.558999061584473, "global_step": 141255, "epoch": 840} {"train_loss": -10.817269325256348, "global_step": 141256, "epoch": 840} {"train_loss": -10.623027801513672, "global_step": 141257, "epoch": 840} {"train_loss": -10.858194351196289, "global_step": 141258, "epoch": 840} {"train_loss": -10.90369701385498, "global_step": 141259, "epoch": 840} {"train_loss": -10.423955917358398, "global_step": 141260, "epoch": 840} {"train_loss": -10.400979995727539, "global_step": 141261, "epoch": 840} {"train_loss": -10.56751537322998, "global_step": 141262, "epoch": 840} {"train_loss": -9.990232467651367, "global_step": 141263, "epoch": 840} {"train_loss": -10.44076919555664, "global_step": 141264, "epoch": 840} {"train_loss": -9.824871063232422, "global_step": 141265, "epoch": 840} {"train_loss": -10.352188110351562, "global_step": 141266, "epoch": 840} {"train_loss": -9.603004455566406, "global_step": 141267, "epoch": 840} {"train_loss": -10.353246688842773, "global_step": 141268, "epoch": 840} {"train_loss": -10.304503440856934, "global_step": 141269, "epoch": 840} {"train_loss": -9.593709945678711, "global_step": 141270, "epoch": 840} {"train_loss": -10.557796478271484, "global_step": 141271, "epoch": 840} {"train_loss": -9.14581298828125, "global_step": 141272, "epoch": 840} {"train_loss": -10.093790054321289, "global_step": 141273, "epoch": 840} {"train_loss": -10.564460754394531, "global_step": 141274, "epoch": 840} {"train_loss": -10.229324340820312, "global_step": 141275, "epoch": 840} {"train_loss": -10.527813911437988, "global_step": 141276, "epoch": 840} {"train_loss": -10.041058540344238, "global_step": 141277, "epoch": 840} {"train_loss": -10.197439193725586, "global_step": 141278, "epoch": 840} {"train_loss": -10.14777946472168, "global_step": 141279, "epoch": 840} {"train_loss": -10.621458053588867, "global_step": 141280, "epoch": 840} {"train_loss": -9.95124340057373, "global_step": 141281, "epoch": 840} {"train_loss": -9.75649356842041, "global_step": 141282, "epoch": 840} {"train_loss": -10.603784561157227, "global_step": 141283, "epoch": 840} {"train_loss": -10.033935546875, "global_step": 141284, "epoch": 840} {"train_loss": -10.259415626525879, "global_step": 141285, "epoch": 840} {"train_loss": -10.077081680297852, "global_step": 141286, "epoch": 840} {"train_loss": -10.444033231054034, "global_step": 141287, "epoch": 840, "val_loss": 219895.609375, "train_action_mse_error": 3.1567225456237793} {"train_loss": -10.044998168945312, "global_step": 141288, "epoch": 841} {"train_loss": -10.094432830810547, "global_step": 141289, "epoch": 841} {"train_loss": -10.276450157165527, "global_step": 141290, "epoch": 841} {"train_loss": -10.216133117675781, "global_step": 141291, "epoch": 841} {"train_loss": -9.944878578186035, "global_step": 141292, "epoch": 841} {"train_loss": -10.614036560058594, "global_step": 141293, "epoch": 841} {"train_loss": -10.116392135620117, "global_step": 141294, "epoch": 841} {"train_loss": -10.13998794555664, "global_step": 141295, "epoch": 841} {"train_loss": -10.361027717590332, "global_step": 141296, "epoch": 841} {"train_loss": -9.966145515441895, "global_step": 141297, "epoch": 841} {"train_loss": -10.175276756286621, "global_step": 141298, "epoch": 841} {"train_loss": -10.389362335205078, "global_step": 141299, "epoch": 841} {"train_loss": -9.94430160522461, "global_step": 141300, "epoch": 841} {"train_loss": -10.413848876953125, "global_step": 141301, "epoch": 841} {"train_loss": -10.315422058105469, "global_step": 141302, "epoch": 841} {"train_loss": -10.359129905700684, "global_step": 141303, "epoch": 841} {"train_loss": -10.573017120361328, "global_step": 141304, "epoch": 841} {"train_loss": -10.205511093139648, "global_step": 141305, "epoch": 841} {"train_loss": -10.28091812133789, "global_step": 141306, "epoch": 841} {"train_loss": -10.249643325805664, "global_step": 141307, "epoch": 841} {"train_loss": -10.158905982971191, "global_step": 141308, "epoch": 841} {"train_loss": -10.25938606262207, "global_step": 141309, "epoch": 841} {"train_loss": -10.4937162399292, "global_step": 141310, "epoch": 841} {"train_loss": -10.537485122680664, "global_step": 141311, "epoch": 841} {"train_loss": -10.46693229675293, "global_step": 141312, "epoch": 841} {"train_loss": -10.472616195678711, "global_step": 141313, "epoch": 841} {"train_loss": -10.236682891845703, "global_step": 141314, "epoch": 841} {"train_loss": -10.626443862915039, "global_step": 141315, "epoch": 841} {"train_loss": -9.965644836425781, "global_step": 141316, "epoch": 841} {"train_loss": -10.724874496459961, "global_step": 141317, "epoch": 841} {"train_loss": -10.181929588317871, "global_step": 141318, "epoch": 841} {"train_loss": -10.392306327819824, "global_step": 141319, "epoch": 841} {"train_loss": -10.597738265991211, "global_step": 141320, "epoch": 841} {"train_loss": -10.602964401245117, "global_step": 141321, "epoch": 841} {"train_loss": -10.427104949951172, "global_step": 141322, "epoch": 841} {"train_loss": -10.646451950073242, "global_step": 141323, "epoch": 841} {"train_loss": -10.476607322692871, "global_step": 141324, "epoch": 841} {"train_loss": -10.223959922790527, "global_step": 141325, "epoch": 841} {"train_loss": -10.678044319152832, "global_step": 141326, "epoch": 841} {"train_loss": -10.41930866241455, "global_step": 141327, "epoch": 841} {"train_loss": -10.779252052307129, "global_step": 141328, "epoch": 841} {"train_loss": -10.16879653930664, "global_step": 141329, "epoch": 841} {"train_loss": -10.802303314208984, "global_step": 141330, "epoch": 841} {"train_loss": -10.608495712280273, "global_step": 141331, "epoch": 841} {"train_loss": -10.446298599243164, "global_step": 141332, "epoch": 841} {"train_loss": -10.784892082214355, "global_step": 141333, "epoch": 841} {"train_loss": -10.654400825500488, "global_step": 141334, "epoch": 841} {"train_loss": -10.953571319580078, "global_step": 141335, "epoch": 841} {"train_loss": -10.860157012939453, "global_step": 141336, "epoch": 841} {"train_loss": -10.762129783630371, "global_step": 141337, "epoch": 841} {"train_loss": -10.691883087158203, "global_step": 141338, "epoch": 841} {"train_loss": -10.854284286499023, "global_step": 141339, "epoch": 841} {"train_loss": -10.816306114196777, "global_step": 141340, "epoch": 841} {"train_loss": -10.87373161315918, "global_step": 141341, "epoch": 841} {"train_loss": -10.844938278198242, "global_step": 141342, "epoch": 841} {"train_loss": -10.969133377075195, "global_step": 141343, "epoch": 841} {"train_loss": -10.957752227783203, "global_step": 141344, "epoch": 841} {"train_loss": -11.15641975402832, "global_step": 141345, "epoch": 841} {"train_loss": -10.821898460388184, "global_step": 141346, "epoch": 841} {"train_loss": -11.032564163208008, "global_step": 141347, "epoch": 841} {"train_loss": -10.993997573852539, "global_step": 141348, "epoch": 841} {"train_loss": -10.988256454467773, "global_step": 141349, "epoch": 841} {"train_loss": -10.665712356567383, "global_step": 141350, "epoch": 841} {"train_loss": -11.033796310424805, "global_step": 141351, "epoch": 841} {"train_loss": -11.071052551269531, "global_step": 141352, "epoch": 841} {"train_loss": -10.733915328979492, "global_step": 141353, "epoch": 841} {"train_loss": -10.574387550354004, "global_step": 141354, "epoch": 841} {"train_loss": -10.810962677001953, "global_step": 141355, "epoch": 841} {"train_loss": -10.623348236083984, "global_step": 141356, "epoch": 841} {"train_loss": -10.2127685546875, "global_step": 141357, "epoch": 841} {"train_loss": -10.738134384155273, "global_step": 141358, "epoch": 841} {"train_loss": -10.591875076293945, "global_step": 141359, "epoch": 841} {"train_loss": -10.647846221923828, "global_step": 141360, "epoch": 841} {"train_loss": -10.883665084838867, "global_step": 141361, "epoch": 841} {"train_loss": -10.977245330810547, "global_step": 141362, "epoch": 841} {"train_loss": -10.586606979370117, "global_step": 141363, "epoch": 841} {"train_loss": -10.141697883605957, "global_step": 141364, "epoch": 841} {"train_loss": -10.963920593261719, "global_step": 141365, "epoch": 841} {"train_loss": -10.729211807250977, "global_step": 141366, "epoch": 841} {"train_loss": -10.260930061340332, "global_step": 141367, "epoch": 841} {"train_loss": -10.484842300415039, "global_step": 141368, "epoch": 841} {"train_loss": -10.027154922485352, "global_step": 141369, "epoch": 841} {"train_loss": -10.462093353271484, "global_step": 141370, "epoch": 841} {"train_loss": -9.281695365905762, "global_step": 141371, "epoch": 841} {"train_loss": -9.960535049438477, "global_step": 141372, "epoch": 841} {"train_loss": -10.699899673461914, "global_step": 141373, "epoch": 841} {"train_loss": -10.258750915527344, "global_step": 141374, "epoch": 841} {"train_loss": -10.441128730773926, "global_step": 141375, "epoch": 841} {"train_loss": -10.517865180969238, "global_step": 141376, "epoch": 841} {"train_loss": -10.16650390625, "global_step": 141377, "epoch": 841} {"train_loss": -10.482233047485352, "global_step": 141378, "epoch": 841} {"train_loss": -10.279536247253418, "global_step": 141379, "epoch": 841} {"train_loss": -10.234691619873047, "global_step": 141380, "epoch": 841} {"train_loss": -10.488438606262207, "global_step": 141381, "epoch": 841} {"train_loss": -10.611926078796387, "global_step": 141382, "epoch": 841} {"train_loss": -10.704536437988281, "global_step": 141383, "epoch": 841} {"train_loss": -10.852376937866211, "global_step": 141384, "epoch": 841} {"train_loss": -10.503255844116211, "global_step": 141385, "epoch": 841} {"train_loss": -10.527511596679688, "global_step": 141386, "epoch": 841} {"train_loss": -10.79662036895752, "global_step": 141387, "epoch": 841} {"train_loss": -10.65428352355957, "global_step": 141388, "epoch": 841} {"train_loss": -10.651250839233398, "global_step": 141389, "epoch": 841} {"train_loss": -10.541303634643555, "global_step": 141390, "epoch": 841} {"train_loss": -10.420540809631348, "global_step": 141391, "epoch": 841} {"train_loss": -10.40776252746582, "global_step": 141392, "epoch": 841} {"train_loss": -10.408733367919922, "global_step": 141393, "epoch": 841} {"train_loss": -10.61641788482666, "global_step": 141394, "epoch": 841} {"train_loss": -10.483390808105469, "global_step": 141395, "epoch": 841} {"train_loss": -10.668498992919922, "global_step": 141396, "epoch": 841} {"train_loss": -10.67176342010498, "global_step": 141397, "epoch": 841} {"train_loss": -10.573310852050781, "global_step": 141398, "epoch": 841} {"train_loss": -10.43392276763916, "global_step": 141399, "epoch": 841} {"train_loss": -10.176678657531738, "global_step": 141400, "epoch": 841} {"train_loss": -10.569334030151367, "global_step": 141401, "epoch": 841} {"train_loss": -10.42827033996582, "global_step": 141402, "epoch": 841} {"train_loss": -10.56784439086914, "global_step": 141403, "epoch": 841} {"train_loss": -10.372557640075684, "global_step": 141404, "epoch": 841} {"train_loss": -10.682844161987305, "global_step": 141405, "epoch": 841} {"train_loss": -10.664422988891602, "global_step": 141406, "epoch": 841} {"train_loss": -10.77859115600586, "global_step": 141407, "epoch": 841} {"train_loss": -10.702056884765625, "global_step": 141408, "epoch": 841} {"train_loss": -10.76845645904541, "global_step": 141409, "epoch": 841} {"train_loss": -10.74875259399414, "global_step": 141410, "epoch": 841} {"train_loss": -10.69015884399414, "global_step": 141411, "epoch": 841} {"train_loss": -10.778595924377441, "global_step": 141412, "epoch": 841} {"train_loss": -10.436763763427734, "global_step": 141413, "epoch": 841} {"train_loss": -10.309782028198242, "global_step": 141414, "epoch": 841} {"train_loss": -10.77674388885498, "global_step": 141415, "epoch": 841} {"train_loss": -10.689151763916016, "global_step": 141416, "epoch": 841} {"train_loss": -10.794302940368652, "global_step": 141417, "epoch": 841} {"train_loss": -10.575824737548828, "global_step": 141418, "epoch": 841} {"train_loss": -10.635544776916504, "global_step": 141419, "epoch": 841} {"train_loss": -10.96435832977295, "global_step": 141420, "epoch": 841} {"train_loss": -10.636323928833008, "global_step": 141421, "epoch": 841} {"train_loss": -11.02073860168457, "global_step": 141422, "epoch": 841} {"train_loss": -10.57839584350586, "global_step": 141423, "epoch": 841} {"train_loss": -10.756155967712402, "global_step": 141424, "epoch": 841} {"train_loss": -10.903246879577637, "global_step": 141425, "epoch": 841} {"train_loss": -10.838571548461914, "global_step": 141426, "epoch": 841} {"train_loss": -11.070639610290527, "global_step": 141427, "epoch": 841} {"train_loss": -10.670235633850098, "global_step": 141428, "epoch": 841} {"train_loss": -10.883769989013672, "global_step": 141429, "epoch": 841} {"train_loss": -10.630010604858398, "global_step": 141430, "epoch": 841} {"train_loss": -10.592157363891602, "global_step": 141431, "epoch": 841} {"train_loss": -10.559026718139648, "global_step": 141432, "epoch": 841} {"train_loss": -10.8438720703125, "global_step": 141433, "epoch": 841} {"train_loss": -10.300945281982422, "global_step": 141434, "epoch": 841} {"train_loss": -10.69371509552002, "global_step": 141435, "epoch": 841} {"train_loss": -10.590662956237793, "global_step": 141436, "epoch": 841} {"train_loss": -10.516901016235352, "global_step": 141437, "epoch": 841} {"train_loss": -10.556928634643555, "global_step": 141438, "epoch": 841} {"train_loss": -10.459890365600586, "global_step": 141439, "epoch": 841} {"train_loss": -10.643733978271484, "global_step": 141440, "epoch": 841} {"train_loss": -10.592985153198242, "global_step": 141441, "epoch": 841} {"train_loss": -10.493717193603516, "global_step": 141442, "epoch": 841} {"train_loss": -10.39930534362793, "global_step": 141443, "epoch": 841} {"train_loss": -9.910079002380371, "global_step": 141444, "epoch": 841} {"train_loss": -10.671165466308594, "global_step": 141445, "epoch": 841} {"train_loss": -10.33588981628418, "global_step": 141446, "epoch": 841} {"train_loss": -10.165536880493164, "global_step": 141447, "epoch": 841} {"train_loss": -10.78516960144043, "global_step": 141448, "epoch": 841} {"train_loss": -10.269851684570312, "global_step": 141449, "epoch": 841} {"train_loss": -10.599139213562012, "global_step": 141450, "epoch": 841} {"train_loss": -10.23968505859375, "global_step": 141451, "epoch": 841} {"train_loss": -10.601761817932129, "global_step": 141452, "epoch": 841} {"train_loss": -10.505049705505371, "global_step": 141453, "epoch": 841} {"train_loss": -10.471297264099121, "global_step": 141454, "epoch": 841} {"train_loss": -10.542205197470528, "global_step": 141455, "epoch": 841, "val_loss": 228027.046875} {"train_loss": -10.400876998901367, "global_step": 141456, "epoch": 842} {"train_loss": -10.311220169067383, "global_step": 141457, "epoch": 842} {"train_loss": -10.59640121459961, "global_step": 141458, "epoch": 842} {"train_loss": -10.118279457092285, "global_step": 141459, "epoch": 842} {"train_loss": -10.570486068725586, "global_step": 141460, "epoch": 842} {"train_loss": -10.230326652526855, "global_step": 141461, "epoch": 842} {"train_loss": -10.575724601745605, "global_step": 141462, "epoch": 842} {"train_loss": -10.392115592956543, "global_step": 141463, "epoch": 842} {"train_loss": -10.605415344238281, "global_step": 141464, "epoch": 842} {"train_loss": -10.191352844238281, "global_step": 141465, "epoch": 842} {"train_loss": -10.293228149414062, "global_step": 141466, "epoch": 842} {"train_loss": -10.334510803222656, "global_step": 141467, "epoch": 842} {"train_loss": -10.34913158416748, "global_step": 141468, "epoch": 842} {"train_loss": -10.435240745544434, "global_step": 141469, "epoch": 842} {"train_loss": -10.169157028198242, "global_step": 141470, "epoch": 842} {"train_loss": -10.481091499328613, "global_step": 141471, "epoch": 842} {"train_loss": -10.06900405883789, "global_step": 141472, "epoch": 842} {"train_loss": -10.625463485717773, "global_step": 141473, "epoch": 842} {"train_loss": -10.001585006713867, "global_step": 141474, "epoch": 842} {"train_loss": -10.732373237609863, "global_step": 141475, "epoch": 842} {"train_loss": -10.273853302001953, "global_step": 141476, "epoch": 842} {"train_loss": -10.589326858520508, "global_step": 141477, "epoch": 842} {"train_loss": -10.486665725708008, "global_step": 141478, "epoch": 842} {"train_loss": -10.645980834960938, "global_step": 141479, "epoch": 842} {"train_loss": -10.633442878723145, "global_step": 141480, "epoch": 842} {"train_loss": -10.718711853027344, "global_step": 141481, "epoch": 842} {"train_loss": -10.628227233886719, "global_step": 141482, "epoch": 842} {"train_loss": -10.744651794433594, "global_step": 141483, "epoch": 842} {"train_loss": -10.742298126220703, "global_step": 141484, "epoch": 842} {"train_loss": -10.88252067565918, "global_step": 141485, "epoch": 842} {"train_loss": -10.733928680419922, "global_step": 141486, "epoch": 842} {"train_loss": -10.939231872558594, "global_step": 141487, "epoch": 842} {"train_loss": -10.859711647033691, "global_step": 141488, "epoch": 842} {"train_loss": -10.756071090698242, "global_step": 141489, "epoch": 842} {"train_loss": -10.962924003601074, "global_step": 141490, "epoch": 842} {"train_loss": -10.836546897888184, "global_step": 141491, "epoch": 842} {"train_loss": -10.776782989501953, "global_step": 141492, "epoch": 842} {"train_loss": -10.884100914001465, "global_step": 141493, "epoch": 842} {"train_loss": -11.13682746887207, "global_step": 141494, "epoch": 842} {"train_loss": -11.043990135192871, "global_step": 141495, "epoch": 842} {"train_loss": -10.97700309753418, "global_step": 141496, "epoch": 842} {"train_loss": -11.038824081420898, "global_step": 141497, "epoch": 842} {"train_loss": -10.996152877807617, "global_step": 141498, "epoch": 842} {"train_loss": -10.879556655883789, "global_step": 141499, "epoch": 842} {"train_loss": -10.796487808227539, "global_step": 141500, "epoch": 842} {"train_loss": -10.748647689819336, "global_step": 141501, "epoch": 842} {"train_loss": -10.71718692779541, "global_step": 141502, "epoch": 842} {"train_loss": -10.698227882385254, "global_step": 141503, "epoch": 842} {"train_loss": -11.079828262329102, "global_step": 141504, "epoch": 842} {"train_loss": -10.848082542419434, "global_step": 141505, "epoch": 842} {"train_loss": -10.9922513961792, "global_step": 141506, "epoch": 842} {"train_loss": -11.211978912353516, "global_step": 141507, "epoch": 842} {"train_loss": -10.99892807006836, "global_step": 141508, "epoch": 842} {"train_loss": -10.815383911132812, "global_step": 141509, "epoch": 842} {"train_loss": -10.917083740234375, "global_step": 141510, "epoch": 842} {"train_loss": -10.727664947509766, "global_step": 141511, "epoch": 842} {"train_loss": -10.453466415405273, "global_step": 141512, "epoch": 842} {"train_loss": -10.865205764770508, "global_step": 141513, "epoch": 842} {"train_loss": -10.80263900756836, "global_step": 141514, "epoch": 842} {"train_loss": -9.477272033691406, "global_step": 141515, "epoch": 842} {"train_loss": -9.091484069824219, "global_step": 141516, "epoch": 842} {"train_loss": -10.682926177978516, "global_step": 141517, "epoch": 842} {"train_loss": -9.89494514465332, "global_step": 141518, "epoch": 842} {"train_loss": -10.415505409240723, "global_step": 141519, "epoch": 842} {"train_loss": -10.041655540466309, "global_step": 141520, "epoch": 842} {"train_loss": -9.242681503295898, "global_step": 141521, "epoch": 842} {"train_loss": -10.114500999450684, "global_step": 141522, "epoch": 842} {"train_loss": -9.583704948425293, "global_step": 141523, "epoch": 842} {"train_loss": -9.973297119140625, "global_step": 141524, "epoch": 842} {"train_loss": -10.008520126342773, "global_step": 141525, "epoch": 842} {"train_loss": -10.41904067993164, "global_step": 141526, "epoch": 842} {"train_loss": -10.408600807189941, "global_step": 141527, "epoch": 842} {"train_loss": -10.355399131774902, "global_step": 141528, "epoch": 842} {"train_loss": -9.932400703430176, "global_step": 141529, "epoch": 842} {"train_loss": -10.242204666137695, "global_step": 141530, "epoch": 842} {"train_loss": -10.131328582763672, "global_step": 141531, "epoch": 842} {"train_loss": -10.234006881713867, "global_step": 141532, "epoch": 842} {"train_loss": -10.328189849853516, "global_step": 141533, "epoch": 842} {"train_loss": -10.152443885803223, "global_step": 141534, "epoch": 842} {"train_loss": -10.035611152648926, "global_step": 141535, "epoch": 842} {"train_loss": -10.036163330078125, "global_step": 141536, "epoch": 842} {"train_loss": -10.055971145629883, "global_step": 141537, "epoch": 842} {"train_loss": -10.42526626586914, "global_step": 141538, "epoch": 842} {"train_loss": -10.588220596313477, "global_step": 141539, "epoch": 842} {"train_loss": -10.150604248046875, "global_step": 141540, "epoch": 842} {"train_loss": -10.307394027709961, "global_step": 141541, "epoch": 842} {"train_loss": -10.48255443572998, "global_step": 141542, "epoch": 842} {"train_loss": -10.645233154296875, "global_step": 141543, "epoch": 842} {"train_loss": -10.230610847473145, "global_step": 141544, "epoch": 842} {"train_loss": -10.450416564941406, "global_step": 141545, "epoch": 842} {"train_loss": -10.463935852050781, "global_step": 141546, "epoch": 842} {"train_loss": -10.213272094726562, "global_step": 141547, "epoch": 842} {"train_loss": -10.515169143676758, "global_step": 141548, "epoch": 842} {"train_loss": -10.58739948272705, "global_step": 141549, "epoch": 842} {"train_loss": -10.550519943237305, "global_step": 141550, "epoch": 842} {"train_loss": -10.439284324645996, "global_step": 141551, "epoch": 842} {"train_loss": -10.442487716674805, "global_step": 141552, "epoch": 842} {"train_loss": -10.59634780883789, "global_step": 141553, "epoch": 842} {"train_loss": -10.20266056060791, "global_step": 141554, "epoch": 842} {"train_loss": -10.531505584716797, "global_step": 141555, "epoch": 842} {"train_loss": -10.625955581665039, "global_step": 141556, "epoch": 842} {"train_loss": -10.74002456665039, "global_step": 141557, "epoch": 842} {"train_loss": -10.650190353393555, "global_step": 141558, "epoch": 842} {"train_loss": -10.30752944946289, "global_step": 141559, "epoch": 842} {"train_loss": -10.488199234008789, "global_step": 141560, "epoch": 842} {"train_loss": -10.45093822479248, "global_step": 141561, "epoch": 842} {"train_loss": -10.557243347167969, "global_step": 141562, "epoch": 842} {"train_loss": -10.613450050354004, "global_step": 141563, "epoch": 842} {"train_loss": -10.604988098144531, "global_step": 141564, "epoch": 842} {"train_loss": -10.7305326461792, "global_step": 141565, "epoch": 842} {"train_loss": -10.4631929397583, "global_step": 141566, "epoch": 842} {"train_loss": -10.57574462890625, "global_step": 141567, "epoch": 842} {"train_loss": -10.453119277954102, "global_step": 141568, "epoch": 842} {"train_loss": -10.745279312133789, "global_step": 141569, "epoch": 842} {"train_loss": -10.421866416931152, "global_step": 141570, "epoch": 842} {"train_loss": -10.474496841430664, "global_step": 141571, "epoch": 842} {"train_loss": -10.479650497436523, "global_step": 141572, "epoch": 842} {"train_loss": -10.561995506286621, "global_step": 141573, "epoch": 842} {"train_loss": -10.569007873535156, "global_step": 141574, "epoch": 842} {"train_loss": -10.931795120239258, "global_step": 141575, "epoch": 842} {"train_loss": -10.283809661865234, "global_step": 141576, "epoch": 842} {"train_loss": -10.378219604492188, "global_step": 141577, "epoch": 842} {"train_loss": -10.546370506286621, "global_step": 141578, "epoch": 842} {"train_loss": -10.512592315673828, "global_step": 141579, "epoch": 842} {"train_loss": -10.533885955810547, "global_step": 141580, "epoch": 842} {"train_loss": -10.627641677856445, "global_step": 141581, "epoch": 842} {"train_loss": -10.69711685180664, "global_step": 141582, "epoch": 842} {"train_loss": -10.64085578918457, "global_step": 141583, "epoch": 842} {"train_loss": -10.709922790527344, "global_step": 141584, "epoch": 842} {"train_loss": -10.642792701721191, "global_step": 141585, "epoch": 842} {"train_loss": -10.88227367401123, "global_step": 141586, "epoch": 842} {"train_loss": -10.409671783447266, "global_step": 141587, "epoch": 842} {"train_loss": -10.571847915649414, "global_step": 141588, "epoch": 842} {"train_loss": -10.616981506347656, "global_step": 141589, "epoch": 842} {"train_loss": -10.615875244140625, "global_step": 141590, "epoch": 842} {"train_loss": -10.340936660766602, "global_step": 141591, "epoch": 842} {"train_loss": -10.823781967163086, "global_step": 141592, "epoch": 842} {"train_loss": -10.600719451904297, "global_step": 141593, "epoch": 842} {"train_loss": -10.462159156799316, "global_step": 141594, "epoch": 842} {"train_loss": -10.683547973632812, "global_step": 141595, "epoch": 842} {"train_loss": -10.266947746276855, "global_step": 141596, "epoch": 842} {"train_loss": -10.848126411437988, "global_step": 141597, "epoch": 842} {"train_loss": -10.424331665039062, "global_step": 141598, "epoch": 842} {"train_loss": -10.674972534179688, "global_step": 141599, "epoch": 842} {"train_loss": -10.764713287353516, "global_step": 141600, "epoch": 842} {"train_loss": -10.595178604125977, "global_step": 141601, "epoch": 842} {"train_loss": -10.89011001586914, "global_step": 141602, "epoch": 842} {"train_loss": -10.676408767700195, "global_step": 141603, "epoch": 842} {"train_loss": -10.795430183410645, "global_step": 141604, "epoch": 842} {"train_loss": -10.80943775177002, "global_step": 141605, "epoch": 842} {"train_loss": -10.908393859863281, "global_step": 141606, "epoch": 842} {"train_loss": -10.76136589050293, "global_step": 141607, "epoch": 842} {"train_loss": -10.890836715698242, "global_step": 141608, "epoch": 842} {"train_loss": -10.812749862670898, "global_step": 141609, "epoch": 842} {"train_loss": -11.047597885131836, "global_step": 141610, "epoch": 842} {"train_loss": -10.748098373413086, "global_step": 141611, "epoch": 842} {"train_loss": -10.808643341064453, "global_step": 141612, "epoch": 842} {"train_loss": -10.590402603149414, "global_step": 141613, "epoch": 842} {"train_loss": -10.643966674804688, "global_step": 141614, "epoch": 842} {"train_loss": -10.791067123413086, "global_step": 141615, "epoch": 842} {"train_loss": -10.708450317382812, "global_step": 141616, "epoch": 842} {"train_loss": -10.881709098815918, "global_step": 141617, "epoch": 842} {"train_loss": -10.75178337097168, "global_step": 141618, "epoch": 842} {"train_loss": -10.780256271362305, "global_step": 141619, "epoch": 842} {"train_loss": -10.866188049316406, "global_step": 141620, "epoch": 842} {"train_loss": -10.835944175720215, "global_step": 141621, "epoch": 842} {"train_loss": -10.678451538085938, "global_step": 141622, "epoch": 842} {"train_loss": -10.54798326038179, "global_step": 141623, "epoch": 842, "val_loss": 227665.453125} {"train_loss": -10.106386184692383, "global_step": 141624, "epoch": 843} {"train_loss": -10.071138381958008, "global_step": 141625, "epoch": 843} {"train_loss": -10.30885124206543, "global_step": 141626, "epoch": 843} {"train_loss": -10.547465324401855, "global_step": 141627, "epoch": 843} {"train_loss": -10.197107315063477, "global_step": 141628, "epoch": 843} {"train_loss": -9.929399490356445, "global_step": 141629, "epoch": 843} {"train_loss": -10.238222122192383, "global_step": 141630, "epoch": 843} {"train_loss": -9.765088081359863, "global_step": 141631, "epoch": 843} {"train_loss": -9.956277847290039, "global_step": 141632, "epoch": 843} {"train_loss": -10.168020248413086, "global_step": 141633, "epoch": 843} {"train_loss": -9.806032180786133, "global_step": 141634, "epoch": 843} {"train_loss": -10.484274864196777, "global_step": 141635, "epoch": 843} {"train_loss": -9.934439659118652, "global_step": 141636, "epoch": 843} {"train_loss": -10.466829299926758, "global_step": 141637, "epoch": 843} {"train_loss": -10.243524551391602, "global_step": 141638, "epoch": 843} {"train_loss": -10.257235527038574, "global_step": 141639, "epoch": 843} {"train_loss": -10.296564102172852, "global_step": 141640, "epoch": 843} {"train_loss": -10.3108491897583, "global_step": 141641, "epoch": 843} {"train_loss": -10.467254638671875, "global_step": 141642, "epoch": 843} {"train_loss": -10.364981651306152, "global_step": 141643, "epoch": 843} {"train_loss": -10.54444694519043, "global_step": 141644, "epoch": 843} {"train_loss": -10.243755340576172, "global_step": 141645, "epoch": 843} {"train_loss": -10.424399375915527, "global_step": 141646, "epoch": 843} {"train_loss": -10.590702056884766, "global_step": 141647, "epoch": 843} {"train_loss": -10.715256690979004, "global_step": 141648, "epoch": 843} {"train_loss": -10.676409721374512, "global_step": 141649, "epoch": 843} {"train_loss": -10.920469284057617, "global_step": 141650, "epoch": 843} {"train_loss": -10.686336517333984, "global_step": 141651, "epoch": 843} {"train_loss": -10.797283172607422, "global_step": 141652, "epoch": 843} {"train_loss": -10.787569046020508, "global_step": 141653, "epoch": 843} {"train_loss": -10.834272384643555, "global_step": 141654, "epoch": 843} {"train_loss": -10.755806922912598, "global_step": 141655, "epoch": 843} {"train_loss": -10.658977508544922, "global_step": 141656, "epoch": 843} {"train_loss": -10.712621688842773, "global_step": 141657, "epoch": 843} {"train_loss": -10.739383697509766, "global_step": 141658, "epoch": 843} {"train_loss": -10.764762878417969, "global_step": 141659, "epoch": 843} {"train_loss": -10.870780944824219, "global_step": 141660, "epoch": 843} {"train_loss": -10.636833190917969, "global_step": 141661, "epoch": 843} {"train_loss": -10.822467803955078, "global_step": 141662, "epoch": 843} {"train_loss": -10.610466003417969, "global_step": 141663, "epoch": 843} {"train_loss": -10.779382705688477, "global_step": 141664, "epoch": 843} {"train_loss": -10.640095710754395, "global_step": 141665, "epoch": 843} {"train_loss": -10.824396133422852, "global_step": 141666, "epoch": 843} {"train_loss": -10.815533638000488, "global_step": 141667, "epoch": 843} {"train_loss": -10.905561447143555, "global_step": 141668, "epoch": 843} {"train_loss": -10.685473442077637, "global_step": 141669, "epoch": 843} {"train_loss": -11.019551277160645, "global_step": 141670, "epoch": 843} {"train_loss": -10.657373428344727, "global_step": 141671, "epoch": 843} {"train_loss": -10.65572738647461, "global_step": 141672, "epoch": 843} {"train_loss": -10.885255813598633, "global_step": 141673, "epoch": 843} {"train_loss": -10.496805191040039, "global_step": 141674, "epoch": 843} {"train_loss": -10.676441192626953, "global_step": 141675, "epoch": 843} {"train_loss": -10.147809982299805, "global_step": 141676, "epoch": 843} {"train_loss": -10.856746673583984, "global_step": 141677, "epoch": 843} {"train_loss": -11.07053279876709, "global_step": 141678, "epoch": 843} {"train_loss": -10.625112533569336, "global_step": 141679, "epoch": 843} {"train_loss": -10.09927749633789, "global_step": 141680, "epoch": 843} {"train_loss": -10.9469575881958, "global_step": 141681, "epoch": 843} {"train_loss": -10.135942459106445, "global_step": 141682, "epoch": 843} {"train_loss": -10.725038528442383, "global_step": 141683, "epoch": 843} {"train_loss": -10.480846405029297, "global_step": 141684, "epoch": 843} {"train_loss": -10.6337890625, "global_step": 141685, "epoch": 843} {"train_loss": -10.721502304077148, "global_step": 141686, "epoch": 843} {"train_loss": -10.068744659423828, "global_step": 141687, "epoch": 843} {"train_loss": -10.84115219116211, "global_step": 141688, "epoch": 843} {"train_loss": -9.932605743408203, "global_step": 141689, "epoch": 843} {"train_loss": -10.110925674438477, "global_step": 141690, "epoch": 843} {"train_loss": -10.679217338562012, "global_step": 141691, "epoch": 843} {"train_loss": -10.060428619384766, "global_step": 141692, "epoch": 843} {"train_loss": -9.920156478881836, "global_step": 141693, "epoch": 843} {"train_loss": -10.312729835510254, "global_step": 141694, "epoch": 843} {"train_loss": -9.916206359863281, "global_step": 141695, "epoch": 843} {"train_loss": -9.86560344696045, "global_step": 141696, "epoch": 843} {"train_loss": -10.02790641784668, "global_step": 141697, "epoch": 843} {"train_loss": -9.759057998657227, "global_step": 141698, "epoch": 843} {"train_loss": -10.193163871765137, "global_step": 141699, "epoch": 843} {"train_loss": -9.880393028259277, "global_step": 141700, "epoch": 843} {"train_loss": -10.30062484741211, "global_step": 141701, "epoch": 843} {"train_loss": -9.743003845214844, "global_step": 141702, "epoch": 843} {"train_loss": -10.292463302612305, "global_step": 141703, "epoch": 843} {"train_loss": -9.77692985534668, "global_step": 141704, "epoch": 843} {"train_loss": -9.93331527709961, "global_step": 141705, "epoch": 843} {"train_loss": -9.368310928344727, "global_step": 141706, "epoch": 843} {"train_loss": -10.033956527709961, "global_step": 141707, "epoch": 843} {"train_loss": -10.086559295654297, "global_step": 141708, "epoch": 843} {"train_loss": -9.74293327331543, "global_step": 141709, "epoch": 843} {"train_loss": -9.950459480285645, "global_step": 141710, "epoch": 843} {"train_loss": -9.685787200927734, "global_step": 141711, "epoch": 843} {"train_loss": -9.951818466186523, "global_step": 141712, "epoch": 843} {"train_loss": -10.013853073120117, "global_step": 141713, "epoch": 843} {"train_loss": -9.678834915161133, "global_step": 141714, "epoch": 843} {"train_loss": -10.408254623413086, "global_step": 141715, "epoch": 843} {"train_loss": -9.662298202514648, "global_step": 141716, "epoch": 843} {"train_loss": -9.914886474609375, "global_step": 141717, "epoch": 843} {"train_loss": -9.962377548217773, "global_step": 141718, "epoch": 843} {"train_loss": -10.00870132446289, "global_step": 141719, "epoch": 843} {"train_loss": -10.101320266723633, "global_step": 141720, "epoch": 843} {"train_loss": -10.22317123413086, "global_step": 141721, "epoch": 843} {"train_loss": -10.33403205871582, "global_step": 141722, "epoch": 843} {"train_loss": -10.493234634399414, "global_step": 141723, "epoch": 843} {"train_loss": -10.215606689453125, "global_step": 141724, "epoch": 843} {"train_loss": -10.266837120056152, "global_step": 141725, "epoch": 843} {"train_loss": -10.583301544189453, "global_step": 141726, "epoch": 843} {"train_loss": -10.210750579833984, "global_step": 141727, "epoch": 843} {"train_loss": -10.364904403686523, "global_step": 141728, "epoch": 843} {"train_loss": -10.508087158203125, "global_step": 141729, "epoch": 843} {"train_loss": -10.365931510925293, "global_step": 141730, "epoch": 843} {"train_loss": -10.451043128967285, "global_step": 141731, "epoch": 843} {"train_loss": -10.50515365600586, "global_step": 141732, "epoch": 843} {"train_loss": -10.661195755004883, "global_step": 141733, "epoch": 843} {"train_loss": -10.455204963684082, "global_step": 141734, "epoch": 843} {"train_loss": -10.648075103759766, "global_step": 141735, "epoch": 843} {"train_loss": -10.721475601196289, "global_step": 141736, "epoch": 843} {"train_loss": -10.6428861618042, "global_step": 141737, "epoch": 843} {"train_loss": -10.650720596313477, "global_step": 141738, "epoch": 843} {"train_loss": -10.603971481323242, "global_step": 141739, "epoch": 843} {"train_loss": -10.595878601074219, "global_step": 141740, "epoch": 843} {"train_loss": -10.701688766479492, "global_step": 141741, "epoch": 843} {"train_loss": -10.77900505065918, "global_step": 141742, "epoch": 843} {"train_loss": -10.556286811828613, "global_step": 141743, "epoch": 843} {"train_loss": -10.696107864379883, "global_step": 141744, "epoch": 843} {"train_loss": -10.799529075622559, "global_step": 141745, "epoch": 843} {"train_loss": -10.907632827758789, "global_step": 141746, "epoch": 843} {"train_loss": -10.676323890686035, "global_step": 141747, "epoch": 843} {"train_loss": -10.74142074584961, "global_step": 141748, "epoch": 843} {"train_loss": -10.828310012817383, "global_step": 141749, "epoch": 843} {"train_loss": -10.72979736328125, "global_step": 141750, "epoch": 843} {"train_loss": -10.925519943237305, "global_step": 141751, "epoch": 843} {"train_loss": -10.666048049926758, "global_step": 141752, "epoch": 843} {"train_loss": -10.733232498168945, "global_step": 141753, "epoch": 843} {"train_loss": -10.629776954650879, "global_step": 141754, "epoch": 843} {"train_loss": -10.889261245727539, "global_step": 141755, "epoch": 843} {"train_loss": -10.669248580932617, "global_step": 141756, "epoch": 843} {"train_loss": -10.844625473022461, "global_step": 141757, "epoch": 843} {"train_loss": -10.834447860717773, "global_step": 141758, "epoch": 843} {"train_loss": -10.60290813446045, "global_step": 141759, "epoch": 843} {"train_loss": -10.429503440856934, "global_step": 141760, "epoch": 843} {"train_loss": -10.838011741638184, "global_step": 141761, "epoch": 843} {"train_loss": -10.430130004882812, "global_step": 141762, "epoch": 843} {"train_loss": -10.618343353271484, "global_step": 141763, "epoch": 843} {"train_loss": -9.509258270263672, "global_step": 141764, "epoch": 843} {"train_loss": -10.615633010864258, "global_step": 141765, "epoch": 843} {"train_loss": -9.00956916809082, "global_step": 141766, "epoch": 843} {"train_loss": -10.024615287780762, "global_step": 141767, "epoch": 843} {"train_loss": -10.089674949645996, "global_step": 141768, "epoch": 843} {"train_loss": -9.671881675720215, "global_step": 141769, "epoch": 843} {"train_loss": -9.631635665893555, "global_step": 141770, "epoch": 843} {"train_loss": -10.682110786437988, "global_step": 141771, "epoch": 843} {"train_loss": -9.259754180908203, "global_step": 141772, "epoch": 843} {"train_loss": -10.201726913452148, "global_step": 141773, "epoch": 843} {"train_loss": -9.515641212463379, "global_step": 141774, "epoch": 843} {"train_loss": -10.604028701782227, "global_step": 141775, "epoch": 843} {"train_loss": -9.578302383422852, "global_step": 141776, "epoch": 843} {"train_loss": -10.435646057128906, "global_step": 141777, "epoch": 843} {"train_loss": -9.855215072631836, "global_step": 141778, "epoch": 843} {"train_loss": -10.153499603271484, "global_step": 141779, "epoch": 843} {"train_loss": -10.343023300170898, "global_step": 141780, "epoch": 843} {"train_loss": -9.955336570739746, "global_step": 141781, "epoch": 843} {"train_loss": -10.251718521118164, "global_step": 141782, "epoch": 843} {"train_loss": -10.599157333374023, "global_step": 141783, "epoch": 843} {"train_loss": -10.540813446044922, "global_step": 141784, "epoch": 843} {"train_loss": -10.281299591064453, "global_step": 141785, "epoch": 843} {"train_loss": -10.099180221557617, "global_step": 141786, "epoch": 843} {"train_loss": -10.296956062316895, "global_step": 141787, "epoch": 843} {"train_loss": -10.294719696044922, "global_step": 141788, "epoch": 843} {"train_loss": -10.406428337097168, "global_step": 141789, "epoch": 843} {"train_loss": -10.441356658935547, "global_step": 141790, "epoch": 843} {"train_loss": -10.369726044791085, "global_step": 141791, "epoch": 843, "val_loss": 223439.109375} {"train_loss": -10.412225723266602, "global_step": 141792, "epoch": 844} {"train_loss": -10.442989349365234, "global_step": 141793, "epoch": 844} {"train_loss": -10.33283805847168, "global_step": 141794, "epoch": 844} {"train_loss": -10.684879302978516, "global_step": 141795, "epoch": 844} {"train_loss": -10.299866676330566, "global_step": 141796, "epoch": 844} {"train_loss": -10.750814437866211, "global_step": 141797, "epoch": 844} {"train_loss": -10.555756568908691, "global_step": 141798, "epoch": 844} {"train_loss": -10.61984634399414, "global_step": 141799, "epoch": 844} {"train_loss": -10.368961334228516, "global_step": 141800, "epoch": 844} {"train_loss": -10.506431579589844, "global_step": 141801, "epoch": 844} {"train_loss": -10.280783653259277, "global_step": 141802, "epoch": 844} {"train_loss": -10.402327537536621, "global_step": 141803, "epoch": 844} {"train_loss": -10.629179954528809, "global_step": 141804, "epoch": 844} {"train_loss": -10.330890655517578, "global_step": 141805, "epoch": 844} {"train_loss": -10.735767364501953, "global_step": 141806, "epoch": 844} {"train_loss": -10.660003662109375, "global_step": 141807, "epoch": 844} {"train_loss": -10.751608848571777, "global_step": 141808, "epoch": 844} {"train_loss": -10.799860000610352, "global_step": 141809, "epoch": 844} {"train_loss": -10.760455131530762, "global_step": 141810, "epoch": 844} {"train_loss": -10.741177558898926, "global_step": 141811, "epoch": 844} {"train_loss": -10.786998748779297, "global_step": 141812, "epoch": 844} {"train_loss": -10.844717025756836, "global_step": 141813, "epoch": 844} {"train_loss": -10.764195442199707, "global_step": 141814, "epoch": 844} {"train_loss": -10.793089866638184, "global_step": 141815, "epoch": 844} {"train_loss": -10.952363967895508, "global_step": 141816, "epoch": 844} {"train_loss": -10.723273277282715, "global_step": 141817, "epoch": 844} {"train_loss": -10.87509536743164, "global_step": 141818, "epoch": 844} {"train_loss": -10.613794326782227, "global_step": 141819, "epoch": 844} {"train_loss": -10.705690383911133, "global_step": 141820, "epoch": 844} {"train_loss": -10.747982025146484, "global_step": 141821, "epoch": 844} {"train_loss": -10.844893455505371, "global_step": 141822, "epoch": 844} {"train_loss": -10.562307357788086, "global_step": 141823, "epoch": 844} {"train_loss": -10.92025089263916, "global_step": 141824, "epoch": 844} {"train_loss": -10.575376510620117, "global_step": 141825, "epoch": 844} {"train_loss": -10.698222160339355, "global_step": 141826, "epoch": 844} {"train_loss": -11.153722763061523, "global_step": 141827, "epoch": 844} {"train_loss": -10.596370697021484, "global_step": 141828, "epoch": 844} {"train_loss": -11.046884536743164, "global_step": 141829, "epoch": 844} {"train_loss": -10.984496116638184, "global_step": 141830, "epoch": 844} {"train_loss": -10.880376815795898, "global_step": 141831, "epoch": 844} {"train_loss": -10.77783203125, "global_step": 141832, "epoch": 844} {"train_loss": -10.959051132202148, "global_step": 141833, "epoch": 844} {"train_loss": -10.885986328125, "global_step": 141834, "epoch": 844} {"train_loss": -10.914979934692383, "global_step": 141835, "epoch": 844} {"train_loss": -10.867584228515625, "global_step": 141836, "epoch": 844} {"train_loss": -10.710373878479004, "global_step": 141837, "epoch": 844} {"train_loss": -10.733710289001465, "global_step": 141838, "epoch": 844} {"train_loss": -10.303179740905762, "global_step": 141839, "epoch": 844} {"train_loss": -10.92557144165039, "global_step": 141840, "epoch": 844} {"train_loss": -10.246037483215332, "global_step": 141841, "epoch": 844} {"train_loss": -9.938833236694336, "global_step": 141842, "epoch": 844} {"train_loss": -10.596705436706543, "global_step": 141843, "epoch": 844} {"train_loss": -10.732736587524414, "global_step": 141844, "epoch": 844} {"train_loss": -9.925085067749023, "global_step": 141845, "epoch": 844} {"train_loss": -9.81870174407959, "global_step": 141846, "epoch": 844} {"train_loss": -10.49612045288086, "global_step": 141847, "epoch": 844} {"train_loss": -10.491504669189453, "global_step": 141848, "epoch": 844} {"train_loss": -10.255736351013184, "global_step": 141849, "epoch": 844} {"train_loss": -10.681028366088867, "global_step": 141850, "epoch": 844} {"train_loss": -10.412997245788574, "global_step": 141851, "epoch": 844} {"train_loss": -10.225446701049805, "global_step": 141852, "epoch": 844} {"train_loss": -10.485143661499023, "global_step": 141853, "epoch": 844} {"train_loss": -10.575977325439453, "global_step": 141854, "epoch": 844} {"train_loss": -10.617504119873047, "global_step": 141855, "epoch": 844} {"train_loss": -10.393933296203613, "global_step": 141856, "epoch": 844} {"train_loss": -10.509485244750977, "global_step": 141857, "epoch": 844} {"train_loss": -10.490114212036133, "global_step": 141858, "epoch": 844} {"train_loss": -10.407419204711914, "global_step": 141859, "epoch": 844} {"train_loss": -10.580743789672852, "global_step": 141860, "epoch": 844} {"train_loss": -10.775290489196777, "global_step": 141861, "epoch": 844} {"train_loss": -10.263157844543457, "global_step": 141862, "epoch": 844} {"train_loss": -11.012916564941406, "global_step": 141863, "epoch": 844} {"train_loss": -10.203689575195312, "global_step": 141864, "epoch": 844} {"train_loss": -10.619770050048828, "global_step": 141865, "epoch": 844} {"train_loss": -10.63818073272705, "global_step": 141866, "epoch": 844} {"train_loss": -10.501567840576172, "global_step": 141867, "epoch": 844} {"train_loss": -10.553288459777832, "global_step": 141868, "epoch": 844} {"train_loss": -10.744857788085938, "global_step": 141869, "epoch": 844} {"train_loss": -10.793441772460938, "global_step": 141870, "epoch": 844} {"train_loss": -10.456230163574219, "global_step": 141871, "epoch": 844} {"train_loss": -10.602380752563477, "global_step": 141872, "epoch": 844} {"train_loss": -10.950468063354492, "global_step": 141873, "epoch": 844} {"train_loss": -10.753280639648438, "global_step": 141874, "epoch": 844} {"train_loss": -10.843241691589355, "global_step": 141875, "epoch": 844} {"train_loss": -10.356815338134766, "global_step": 141876, "epoch": 844} {"train_loss": -10.695943832397461, "global_step": 141877, "epoch": 844} {"train_loss": -10.646636009216309, "global_step": 141878, "epoch": 844} {"train_loss": -10.853280067443848, "global_step": 141879, "epoch": 844} {"train_loss": -10.630329132080078, "global_step": 141880, "epoch": 844} {"train_loss": -10.580879211425781, "global_step": 141881, "epoch": 844} {"train_loss": -10.764765739440918, "global_step": 141882, "epoch": 844} {"train_loss": -10.510477066040039, "global_step": 141883, "epoch": 844} {"train_loss": -10.903253555297852, "global_step": 141884, "epoch": 844} {"train_loss": -10.244093894958496, "global_step": 141885, "epoch": 844} {"train_loss": -10.655223846435547, "global_step": 141886, "epoch": 844} {"train_loss": -10.656391143798828, "global_step": 141887, "epoch": 844} {"train_loss": -10.755878448486328, "global_step": 141888, "epoch": 844} {"train_loss": -10.52889347076416, "global_step": 141889, "epoch": 844} {"train_loss": -10.657812118530273, "global_step": 141890, "epoch": 844} {"train_loss": -10.855772018432617, "global_step": 141891, "epoch": 844} {"train_loss": -10.582870483398438, "global_step": 141892, "epoch": 844} {"train_loss": -10.443061828613281, "global_step": 141893, "epoch": 844} {"train_loss": -10.512224197387695, "global_step": 141894, "epoch": 844} {"train_loss": -10.521184921264648, "global_step": 141895, "epoch": 844} {"train_loss": -10.206357955932617, "global_step": 141896, "epoch": 844} {"train_loss": -10.668880462646484, "global_step": 141897, "epoch": 844} {"train_loss": -10.466292381286621, "global_step": 141898, "epoch": 844} {"train_loss": -10.735118865966797, "global_step": 141899, "epoch": 844} {"train_loss": -10.364830017089844, "global_step": 141900, "epoch": 844} {"train_loss": -10.643560409545898, "global_step": 141901, "epoch": 844} {"train_loss": -10.592369079589844, "global_step": 141902, "epoch": 844} {"train_loss": -10.529367446899414, "global_step": 141903, "epoch": 844} {"train_loss": -10.752908706665039, "global_step": 141904, "epoch": 844} {"train_loss": -10.559927940368652, "global_step": 141905, "epoch": 844} {"train_loss": -10.429469108581543, "global_step": 141906, "epoch": 844} {"train_loss": -10.138748168945312, "global_step": 141907, "epoch": 844} {"train_loss": -10.402839660644531, "global_step": 141908, "epoch": 844} {"train_loss": -10.524245262145996, "global_step": 141909, "epoch": 844} {"train_loss": -10.46383285522461, "global_step": 141910, "epoch": 844} {"train_loss": -10.5052490234375, "global_step": 141911, "epoch": 844} {"train_loss": -10.4645414352417, "global_step": 141912, "epoch": 844} {"train_loss": -10.495285987854004, "global_step": 141913, "epoch": 844} {"train_loss": -10.225709915161133, "global_step": 141914, "epoch": 844} {"train_loss": -10.770193099975586, "global_step": 141915, "epoch": 844} {"train_loss": -10.489103317260742, "global_step": 141916, "epoch": 844} {"train_loss": -10.608589172363281, "global_step": 141917, "epoch": 844} {"train_loss": -10.565068244934082, "global_step": 141918, "epoch": 844} {"train_loss": -10.716452598571777, "global_step": 141919, "epoch": 844} {"train_loss": -10.537318229675293, "global_step": 141920, "epoch": 844} {"train_loss": -10.21028995513916, "global_step": 141921, "epoch": 844} {"train_loss": -10.861438751220703, "global_step": 141922, "epoch": 844} {"train_loss": -10.212234497070312, "global_step": 141923, "epoch": 844} {"train_loss": -10.495059967041016, "global_step": 141924, "epoch": 844} {"train_loss": -10.186872482299805, "global_step": 141925, "epoch": 844} {"train_loss": -10.653514862060547, "global_step": 141926, "epoch": 844} {"train_loss": -10.554032325744629, "global_step": 141927, "epoch": 844} {"train_loss": -10.393817901611328, "global_step": 141928, "epoch": 844} {"train_loss": -10.628263473510742, "global_step": 141929, "epoch": 844} {"train_loss": -10.505813598632812, "global_step": 141930, "epoch": 844} {"train_loss": -10.37751293182373, "global_step": 141931, "epoch": 844} {"train_loss": -10.539381980895996, "global_step": 141932, "epoch": 844} {"train_loss": -10.417691230773926, "global_step": 141933, "epoch": 844} {"train_loss": -10.647293090820312, "global_step": 141934, "epoch": 844} {"train_loss": -10.442621231079102, "global_step": 141935, "epoch": 844} {"train_loss": -10.433204650878906, "global_step": 141936, "epoch": 844} {"train_loss": -10.842506408691406, "global_step": 141937, "epoch": 844} {"train_loss": -10.504460334777832, "global_step": 141938, "epoch": 844} {"train_loss": -10.62349796295166, "global_step": 141939, "epoch": 844} {"train_loss": -10.567340850830078, "global_step": 141940, "epoch": 844} {"train_loss": -10.834285736083984, "global_step": 141941, "epoch": 844} {"train_loss": -10.337113380432129, "global_step": 141942, "epoch": 844} {"train_loss": -10.61370849609375, "global_step": 141943, "epoch": 844} {"train_loss": -10.595294952392578, "global_step": 141944, "epoch": 844} {"train_loss": -10.542040824890137, "global_step": 141945, "epoch": 844} {"train_loss": -10.249724388122559, "global_step": 141946, "epoch": 844} {"train_loss": -10.647211074829102, "global_step": 141947, "epoch": 844} {"train_loss": -10.440863609313965, "global_step": 141948, "epoch": 844} {"train_loss": -10.529874801635742, "global_step": 141949, "epoch": 844} {"train_loss": -10.610243797302246, "global_step": 141950, "epoch": 844} {"train_loss": -10.458250045776367, "global_step": 141951, "epoch": 844} {"train_loss": -10.552764892578125, "global_step": 141952, "epoch": 844} {"train_loss": -10.397750854492188, "global_step": 141953, "epoch": 844} {"train_loss": -10.649301528930664, "global_step": 141954, "epoch": 844} {"train_loss": -10.416587829589844, "global_step": 141955, "epoch": 844} {"train_loss": -10.53867244720459, "global_step": 141956, "epoch": 844} {"train_loss": -10.590360641479492, "global_step": 141957, "epoch": 844} {"train_loss": -10.723021507263184, "global_step": 141958, "epoch": 844} {"train_loss": -10.580254838580178, "global_step": 141959, "epoch": 844, "val_loss": 225453.859375} {"train_loss": -10.33757209777832, "global_step": 141960, "epoch": 845} {"train_loss": -10.686720848083496, "global_step": 141961, "epoch": 845} {"train_loss": -10.158346176147461, "global_step": 141962, "epoch": 845} {"train_loss": -10.10688591003418, "global_step": 141963, "epoch": 845} {"train_loss": -10.37333869934082, "global_step": 141964, "epoch": 845} {"train_loss": -10.173650741577148, "global_step": 141965, "epoch": 845} {"train_loss": -10.186230659484863, "global_step": 141966, "epoch": 845} {"train_loss": -9.998678207397461, "global_step": 141967, "epoch": 845} {"train_loss": -10.384395599365234, "global_step": 141968, "epoch": 845} {"train_loss": -10.129364967346191, "global_step": 141969, "epoch": 845} {"train_loss": -10.14866828918457, "global_step": 141970, "epoch": 845} {"train_loss": -10.253168106079102, "global_step": 141971, "epoch": 845} {"train_loss": -10.472875595092773, "global_step": 141972, "epoch": 845} {"train_loss": -9.4526948928833, "global_step": 141973, "epoch": 845} {"train_loss": -10.283624649047852, "global_step": 141974, "epoch": 845} {"train_loss": -10.305750846862793, "global_step": 141975, "epoch": 845} {"train_loss": -10.29623794555664, "global_step": 141976, "epoch": 845} {"train_loss": -10.198291778564453, "global_step": 141977, "epoch": 845} {"train_loss": -10.270721435546875, "global_step": 141978, "epoch": 845} {"train_loss": -10.603752136230469, "global_step": 141979, "epoch": 845} {"train_loss": -10.34251594543457, "global_step": 141980, "epoch": 845} {"train_loss": -10.504130363464355, "global_step": 141981, "epoch": 845} {"train_loss": -10.588350296020508, "global_step": 141982, "epoch": 845} {"train_loss": -10.201798439025879, "global_step": 141983, "epoch": 845} {"train_loss": -10.535966873168945, "global_step": 141984, "epoch": 845} {"train_loss": -10.473803520202637, "global_step": 141985, "epoch": 845} {"train_loss": -10.462117195129395, "global_step": 141986, "epoch": 845} {"train_loss": -10.517579078674316, "global_step": 141987, "epoch": 845} {"train_loss": -10.667627334594727, "global_step": 141988, "epoch": 845} {"train_loss": -10.46861743927002, "global_step": 141989, "epoch": 845} {"train_loss": -10.598958969116211, "global_step": 141990, "epoch": 845} {"train_loss": -10.768407821655273, "global_step": 141991, "epoch": 845} {"train_loss": -10.753040313720703, "global_step": 141992, "epoch": 845} {"train_loss": -10.532012939453125, "global_step": 141993, "epoch": 845} {"train_loss": -10.495917320251465, "global_step": 141994, "epoch": 845} {"train_loss": -10.693868637084961, "global_step": 141995, "epoch": 845} {"train_loss": -10.690999984741211, "global_step": 141996, "epoch": 845} {"train_loss": -10.287690162658691, "global_step": 141997, "epoch": 845} {"train_loss": -10.473260879516602, "global_step": 141998, "epoch": 845} {"train_loss": -10.567230224609375, "global_step": 141999, "epoch": 845} {"train_loss": -10.773797988891602, "global_step": 142000, "epoch": 845} {"train_loss": -10.673851013183594, "global_step": 142001, "epoch": 845} {"train_loss": -10.84756088256836, "global_step": 142002, "epoch": 845} {"train_loss": -10.797316551208496, "global_step": 142003, "epoch": 845} {"train_loss": -10.789939880371094, "global_step": 142004, "epoch": 845} {"train_loss": -10.85201644897461, "global_step": 142005, "epoch": 845} {"train_loss": -10.748023986816406, "global_step": 142006, "epoch": 845} {"train_loss": -10.822702407836914, "global_step": 142007, "epoch": 845} {"train_loss": -10.893537521362305, "global_step": 142008, "epoch": 845} {"train_loss": -10.687284469604492, "global_step": 142009, "epoch": 845} {"train_loss": -10.586442947387695, "global_step": 142010, "epoch": 845} {"train_loss": -10.891792297363281, "global_step": 142011, "epoch": 845} {"train_loss": -10.690528869628906, "global_step": 142012, "epoch": 845} {"train_loss": -10.659807205200195, "global_step": 142013, "epoch": 845} {"train_loss": -11.036336898803711, "global_step": 142014, "epoch": 845} {"train_loss": -10.570302963256836, "global_step": 142015, "epoch": 845} {"train_loss": -10.883033752441406, "global_step": 142016, "epoch": 845} {"train_loss": -10.862752914428711, "global_step": 142017, "epoch": 845} {"train_loss": -10.652482986450195, "global_step": 142018, "epoch": 845} {"train_loss": -11.006906509399414, "global_step": 142019, "epoch": 845} {"train_loss": -11.051619529724121, "global_step": 142020, "epoch": 845} {"train_loss": -10.892692565917969, "global_step": 142021, "epoch": 845} {"train_loss": -10.299391746520996, "global_step": 142022, "epoch": 845} {"train_loss": -10.94016170501709, "global_step": 142023, "epoch": 845} {"train_loss": -10.553506851196289, "global_step": 142024, "epoch": 845} {"train_loss": -10.997296333312988, "global_step": 142025, "epoch": 845} {"train_loss": -10.768306732177734, "global_step": 142026, "epoch": 845} {"train_loss": -10.798501014709473, "global_step": 142027, "epoch": 845} {"train_loss": -10.521717071533203, "global_step": 142028, "epoch": 845} {"train_loss": -10.808334350585938, "global_step": 142029, "epoch": 845} {"train_loss": -10.719022750854492, "global_step": 142030, "epoch": 845} {"train_loss": -10.940837860107422, "global_step": 142031, "epoch": 845} {"train_loss": -10.821808815002441, "global_step": 142032, "epoch": 845} {"train_loss": -11.052963256835938, "global_step": 142033, "epoch": 845} {"train_loss": -10.627498626708984, "global_step": 142034, "epoch": 845} {"train_loss": -10.641201972961426, "global_step": 142035, "epoch": 845} {"train_loss": -10.788358688354492, "global_step": 142036, "epoch": 845} {"train_loss": -10.383646011352539, "global_step": 142037, "epoch": 845} {"train_loss": -11.014668464660645, "global_step": 142038, "epoch": 845} {"train_loss": -10.825443267822266, "global_step": 142039, "epoch": 845} {"train_loss": -10.82055950164795, "global_step": 142040, "epoch": 845} {"train_loss": -10.859634399414062, "global_step": 142041, "epoch": 845} {"train_loss": -10.657550811767578, "global_step": 142042, "epoch": 845} {"train_loss": -10.919454574584961, "global_step": 142043, "epoch": 845} {"train_loss": -10.458219528198242, "global_step": 142044, "epoch": 845} {"train_loss": -10.799507141113281, "global_step": 142045, "epoch": 845} {"train_loss": -10.313817977905273, "global_step": 142046, "epoch": 845} {"train_loss": -10.459707260131836, "global_step": 142047, "epoch": 845} {"train_loss": -10.008472442626953, "global_step": 142048, "epoch": 845} {"train_loss": -9.666102409362793, "global_step": 142049, "epoch": 845} {"train_loss": -10.236507415771484, "global_step": 142050, "epoch": 845} {"train_loss": -9.855827331542969, "global_step": 142051, "epoch": 845} {"train_loss": -9.02269172668457, "global_step": 142052, "epoch": 845} {"train_loss": -8.752309799194336, "global_step": 142053, "epoch": 845} {"train_loss": -9.846991539001465, "global_step": 142054, "epoch": 845} {"train_loss": -9.363576889038086, "global_step": 142055, "epoch": 845} {"train_loss": -9.684544563293457, "global_step": 142056, "epoch": 845} {"train_loss": -9.323142051696777, "global_step": 142057, "epoch": 845} {"train_loss": -10.424905776977539, "global_step": 142058, "epoch": 845} {"train_loss": -9.523361206054688, "global_step": 142059, "epoch": 845} {"train_loss": -9.88347339630127, "global_step": 142060, "epoch": 845} {"train_loss": -10.06058120727539, "global_step": 142061, "epoch": 845} {"train_loss": -9.887931823730469, "global_step": 142062, "epoch": 845} {"train_loss": -10.203095436096191, "global_step": 142063, "epoch": 845} {"train_loss": -9.685770034790039, "global_step": 142064, "epoch": 845} {"train_loss": -10.098310470581055, "global_step": 142065, "epoch": 845} {"train_loss": -9.983816146850586, "global_step": 142066, "epoch": 845} {"train_loss": -9.453222274780273, "global_step": 142067, "epoch": 845} {"train_loss": -9.9967622756958, "global_step": 142068, "epoch": 845} {"train_loss": -10.35273551940918, "global_step": 142069, "epoch": 845} {"train_loss": -9.76710319519043, "global_step": 142070, "epoch": 845} {"train_loss": -10.080877304077148, "global_step": 142071, "epoch": 845} {"train_loss": -10.17861270904541, "global_step": 142072, "epoch": 845} {"train_loss": -10.232449531555176, "global_step": 142073, "epoch": 845} {"train_loss": -9.887237548828125, "global_step": 142074, "epoch": 845} {"train_loss": -10.287162780761719, "global_step": 142075, "epoch": 845} {"train_loss": -9.914695739746094, "global_step": 142076, "epoch": 845} {"train_loss": -10.271566390991211, "global_step": 142077, "epoch": 845} {"train_loss": -10.528650283813477, "global_step": 142078, "epoch": 845} {"train_loss": -10.37861156463623, "global_step": 142079, "epoch": 845} {"train_loss": -10.3186616897583, "global_step": 142080, "epoch": 845} {"train_loss": -10.488433837890625, "global_step": 142081, "epoch": 845} {"train_loss": -10.561829566955566, "global_step": 142082, "epoch": 845} {"train_loss": -10.423111915588379, "global_step": 142083, "epoch": 845} {"train_loss": -10.544546127319336, "global_step": 142084, "epoch": 845} {"train_loss": -10.50438117980957, "global_step": 142085, "epoch": 845} {"train_loss": -10.366229057312012, "global_step": 142086, "epoch": 845} {"train_loss": -10.375706672668457, "global_step": 142087, "epoch": 845} {"train_loss": -10.482464790344238, "global_step": 142088, "epoch": 845} {"train_loss": -10.534902572631836, "global_step": 142089, "epoch": 845} {"train_loss": -10.509288787841797, "global_step": 142090, "epoch": 845} {"train_loss": -10.658672332763672, "global_step": 142091, "epoch": 845} {"train_loss": -10.750956535339355, "global_step": 142092, "epoch": 845} {"train_loss": -10.785013198852539, "global_step": 142093, "epoch": 845} {"train_loss": -10.577825546264648, "global_step": 142094, "epoch": 845} {"train_loss": -10.875959396362305, "global_step": 142095, "epoch": 845} {"train_loss": -10.706974029541016, "global_step": 142096, "epoch": 845} {"train_loss": -10.800718307495117, "global_step": 142097, "epoch": 845} {"train_loss": -10.659200668334961, "global_step": 142098, "epoch": 845} {"train_loss": -10.848855018615723, "global_step": 142099, "epoch": 845} {"train_loss": -10.538657188415527, "global_step": 142100, "epoch": 845} {"train_loss": -10.62324333190918, "global_step": 142101, "epoch": 845} {"train_loss": -10.77655029296875, "global_step": 142102, "epoch": 845} {"train_loss": -10.646745681762695, "global_step": 142103, "epoch": 845} {"train_loss": -10.840517044067383, "global_step": 142104, "epoch": 845} {"train_loss": -10.685140609741211, "global_step": 142105, "epoch": 845} {"train_loss": -10.750089645385742, "global_step": 142106, "epoch": 845} {"train_loss": -10.825668334960938, "global_step": 142107, "epoch": 845} {"train_loss": -10.687747955322266, "global_step": 142108, "epoch": 845} {"train_loss": -10.607404708862305, "global_step": 142109, "epoch": 845} {"train_loss": -10.760746002197266, "global_step": 142110, "epoch": 845} {"train_loss": -10.548788070678711, "global_step": 142111, "epoch": 845} {"train_loss": -10.817627906799316, "global_step": 142112, "epoch": 845} {"train_loss": -10.653386116027832, "global_step": 142113, "epoch": 845} {"train_loss": -10.71109676361084, "global_step": 142114, "epoch": 845} {"train_loss": -10.80800724029541, "global_step": 142115, "epoch": 845} {"train_loss": -10.838263511657715, "global_step": 142116, "epoch": 845} {"train_loss": -10.487106323242188, "global_step": 142117, "epoch": 845} {"train_loss": -10.490842819213867, "global_step": 142118, "epoch": 845} {"train_loss": -10.94643783569336, "global_step": 142119, "epoch": 845} {"train_loss": -10.804713249206543, "global_step": 142120, "epoch": 845} {"train_loss": -10.900320053100586, "global_step": 142121, "epoch": 845} {"train_loss": -10.780162811279297, "global_step": 142122, "epoch": 845} {"train_loss": -10.915188789367676, "global_step": 142123, "epoch": 845} {"train_loss": -10.661498069763184, "global_step": 142124, "epoch": 845} {"train_loss": -11.146169662475586, "global_step": 142125, "epoch": 845} {"train_loss": -10.566917419433594, "global_step": 142126, "epoch": 845} {"train_loss": -10.482228636741638, "global_step": 142127, "epoch": 845, "val_loss": 215287.90625, "train_action_mse_error": 1.3611793518066406} {"train_loss": -10.709407806396484, "global_step": 142128, "epoch": 846} {"train_loss": -10.749398231506348, "global_step": 142129, "epoch": 846} {"train_loss": -10.7280855178833, "global_step": 142130, "epoch": 846} {"train_loss": -10.718700408935547, "global_step": 142131, "epoch": 846} {"train_loss": -10.893247604370117, "global_step": 142132, "epoch": 846} {"train_loss": -10.59500789642334, "global_step": 142133, "epoch": 846} {"train_loss": -10.805501937866211, "global_step": 142134, "epoch": 846} {"train_loss": -10.497661590576172, "global_step": 142135, "epoch": 846} {"train_loss": -10.789909362792969, "global_step": 142136, "epoch": 846} {"train_loss": -10.945818901062012, "global_step": 142137, "epoch": 846} {"train_loss": -10.633186340332031, "global_step": 142138, "epoch": 846} {"train_loss": -10.745203971862793, "global_step": 142139, "epoch": 846} {"train_loss": -10.717626571655273, "global_step": 142140, "epoch": 846} {"train_loss": -10.911806106567383, "global_step": 142141, "epoch": 846} {"train_loss": -10.501655578613281, "global_step": 142142, "epoch": 846} {"train_loss": -10.60249137878418, "global_step": 142143, "epoch": 846} {"train_loss": -10.318109512329102, "global_step": 142144, "epoch": 846} {"train_loss": -10.806398391723633, "global_step": 142145, "epoch": 846} {"train_loss": -10.591499328613281, "global_step": 142146, "epoch": 846} {"train_loss": -10.76019287109375, "global_step": 142147, "epoch": 846} {"train_loss": -10.341510772705078, "global_step": 142148, "epoch": 846} {"train_loss": -10.685012817382812, "global_step": 142149, "epoch": 846} {"train_loss": -10.537983894348145, "global_step": 142150, "epoch": 846} {"train_loss": -10.560842514038086, "global_step": 142151, "epoch": 846} {"train_loss": -10.546034812927246, "global_step": 142152, "epoch": 846} {"train_loss": -10.703853607177734, "global_step": 142153, "epoch": 846} {"train_loss": -10.320390701293945, "global_step": 142154, "epoch": 846} {"train_loss": -10.395005226135254, "global_step": 142155, "epoch": 846} {"train_loss": -10.425732612609863, "global_step": 142156, "epoch": 846} {"train_loss": -10.60851001739502, "global_step": 142157, "epoch": 846} {"train_loss": -10.450098037719727, "global_step": 142158, "epoch": 846} {"train_loss": -10.707427978515625, "global_step": 142159, "epoch": 846} {"train_loss": -10.515341758728027, "global_step": 142160, "epoch": 846} {"train_loss": -10.720829010009766, "global_step": 142161, "epoch": 846} {"train_loss": -10.61335563659668, "global_step": 142162, "epoch": 846} {"train_loss": -10.546663284301758, "global_step": 142163, "epoch": 846} {"train_loss": -10.911739349365234, "global_step": 142164, "epoch": 846} {"train_loss": -10.629732131958008, "global_step": 142165, "epoch": 846} {"train_loss": -10.46914291381836, "global_step": 142166, "epoch": 846} {"train_loss": -11.033547401428223, "global_step": 142167, "epoch": 846} {"train_loss": -10.674365997314453, "global_step": 142168, "epoch": 846} {"train_loss": -10.889084815979004, "global_step": 142169, "epoch": 846} {"train_loss": -10.773137092590332, "global_step": 142170, "epoch": 846} {"train_loss": -10.641570091247559, "global_step": 142171, "epoch": 846} {"train_loss": -10.789435386657715, "global_step": 142172, "epoch": 846} {"train_loss": -10.777304649353027, "global_step": 142173, "epoch": 846} {"train_loss": -10.615228652954102, "global_step": 142174, "epoch": 846} {"train_loss": -10.678573608398438, "global_step": 142175, "epoch": 846} {"train_loss": -10.623807907104492, "global_step": 142176, "epoch": 846} {"train_loss": -10.669418334960938, "global_step": 142177, "epoch": 846} {"train_loss": -10.68824577331543, "global_step": 142178, "epoch": 846} {"train_loss": -10.670337677001953, "global_step": 142179, "epoch": 846} {"train_loss": -10.35667610168457, "global_step": 142180, "epoch": 846} {"train_loss": -10.43461799621582, "global_step": 142181, "epoch": 846} {"train_loss": -10.709124565124512, "global_step": 142182, "epoch": 846} {"train_loss": -10.424887657165527, "global_step": 142183, "epoch": 846} {"train_loss": -10.707258224487305, "global_step": 142184, "epoch": 846} {"train_loss": -10.832332611083984, "global_step": 142185, "epoch": 846} {"train_loss": -10.626455307006836, "global_step": 142186, "epoch": 846} {"train_loss": -10.113683700561523, "global_step": 142187, "epoch": 846} {"train_loss": -10.505054473876953, "global_step": 142188, "epoch": 846} {"train_loss": -10.212207794189453, "global_step": 142189, "epoch": 846} {"train_loss": -9.78724479675293, "global_step": 142190, "epoch": 846} {"train_loss": -10.830789566040039, "global_step": 142191, "epoch": 846} {"train_loss": -9.421175003051758, "global_step": 142192, "epoch": 846} {"train_loss": -10.637821197509766, "global_step": 142193, "epoch": 846} {"train_loss": -9.861189842224121, "global_step": 142194, "epoch": 846} {"train_loss": -10.161108016967773, "global_step": 142195, "epoch": 846} {"train_loss": -9.910125732421875, "global_step": 142196, "epoch": 846} {"train_loss": -10.194367408752441, "global_step": 142197, "epoch": 846} {"train_loss": -10.104955673217773, "global_step": 142198, "epoch": 846} {"train_loss": -9.551947593688965, "global_step": 142199, "epoch": 846} {"train_loss": -10.288515090942383, "global_step": 142200, "epoch": 846} {"train_loss": -9.667362213134766, "global_step": 142201, "epoch": 846} {"train_loss": -10.424314498901367, "global_step": 142202, "epoch": 846} {"train_loss": -9.373004913330078, "global_step": 142203, "epoch": 846} {"train_loss": -10.727338790893555, "global_step": 142204, "epoch": 846} {"train_loss": -9.521308898925781, "global_step": 142205, "epoch": 846} {"train_loss": -10.349353790283203, "global_step": 142206, "epoch": 846} {"train_loss": -9.5857572555542, "global_step": 142207, "epoch": 846} {"train_loss": -10.455850601196289, "global_step": 142208, "epoch": 846} {"train_loss": -10.248968124389648, "global_step": 142209, "epoch": 846} {"train_loss": -10.42501449584961, "global_step": 142210, "epoch": 846} {"train_loss": -10.128580093383789, "global_step": 142211, "epoch": 846} {"train_loss": -10.431905746459961, "global_step": 142212, "epoch": 846} {"train_loss": -10.362312316894531, "global_step": 142213, "epoch": 846} {"train_loss": -10.630556106567383, "global_step": 142214, "epoch": 846} {"train_loss": -10.492915153503418, "global_step": 142215, "epoch": 846} {"train_loss": -10.693222999572754, "global_step": 142216, "epoch": 846} {"train_loss": -10.55746078491211, "global_step": 142217, "epoch": 846} {"train_loss": -10.59577751159668, "global_step": 142218, "epoch": 846} {"train_loss": -10.499360084533691, "global_step": 142219, "epoch": 846} {"train_loss": -10.509833335876465, "global_step": 142220, "epoch": 846} {"train_loss": -10.608344078063965, "global_step": 142221, "epoch": 846} {"train_loss": -10.444013595581055, "global_step": 142222, "epoch": 846} {"train_loss": -10.665055274963379, "global_step": 142223, "epoch": 846} {"train_loss": -10.44472599029541, "global_step": 142224, "epoch": 846} {"train_loss": -10.462642669677734, "global_step": 142225, "epoch": 846} {"train_loss": -10.558721542358398, "global_step": 142226, "epoch": 846} {"train_loss": -10.500347137451172, "global_step": 142227, "epoch": 846} {"train_loss": -10.553238868713379, "global_step": 142228, "epoch": 846} {"train_loss": -10.715608596801758, "global_step": 142229, "epoch": 846} {"train_loss": -10.610942840576172, "global_step": 142230, "epoch": 846} {"train_loss": -10.517232894897461, "global_step": 142231, "epoch": 846} {"train_loss": -10.892078399658203, "global_step": 142232, "epoch": 846} {"train_loss": -10.535834312438965, "global_step": 142233, "epoch": 846} {"train_loss": -10.755924224853516, "global_step": 142234, "epoch": 846} {"train_loss": -10.615931510925293, "global_step": 142235, "epoch": 846} {"train_loss": -10.661835670471191, "global_step": 142236, "epoch": 846} {"train_loss": -10.570390701293945, "global_step": 142237, "epoch": 846} {"train_loss": -10.628975868225098, "global_step": 142238, "epoch": 846} {"train_loss": -10.813000679016113, "global_step": 142239, "epoch": 846} {"train_loss": -10.748944282531738, "global_step": 142240, "epoch": 846} {"train_loss": -10.81519603729248, "global_step": 142241, "epoch": 846} {"train_loss": -10.770491600036621, "global_step": 142242, "epoch": 846} {"train_loss": -10.709146499633789, "global_step": 142243, "epoch": 846} {"train_loss": -10.593437194824219, "global_step": 142244, "epoch": 846} {"train_loss": -10.816925048828125, "global_step": 142245, "epoch": 846} {"train_loss": -10.770639419555664, "global_step": 142246, "epoch": 846} {"train_loss": -10.606050491333008, "global_step": 142247, "epoch": 846} {"train_loss": -10.917369842529297, "global_step": 142248, "epoch": 846} {"train_loss": -10.45379638671875, "global_step": 142249, "epoch": 846} {"train_loss": -10.851445198059082, "global_step": 142250, "epoch": 846} {"train_loss": -10.139867782592773, "global_step": 142251, "epoch": 846} {"train_loss": -10.558858871459961, "global_step": 142252, "epoch": 846} {"train_loss": -10.42515754699707, "global_step": 142253, "epoch": 846} {"train_loss": -10.38496208190918, "global_step": 142254, "epoch": 846} {"train_loss": -10.205093383789062, "global_step": 142255, "epoch": 846} {"train_loss": -10.292245864868164, "global_step": 142256, "epoch": 846} {"train_loss": -10.315838813781738, "global_step": 142257, "epoch": 846} {"train_loss": -9.878236770629883, "global_step": 142258, "epoch": 846} {"train_loss": -10.286532402038574, "global_step": 142259, "epoch": 846} {"train_loss": -9.844979286193848, "global_step": 142260, "epoch": 846} {"train_loss": -10.12013053894043, "global_step": 142261, "epoch": 846} {"train_loss": -10.432600975036621, "global_step": 142262, "epoch": 846} {"train_loss": -10.581296920776367, "global_step": 142263, "epoch": 846} {"train_loss": -10.297231674194336, "global_step": 142264, "epoch": 846} {"train_loss": -10.285184860229492, "global_step": 142265, "epoch": 846} {"train_loss": -10.464351654052734, "global_step": 142266, "epoch": 846} {"train_loss": -10.179443359375, "global_step": 142267, "epoch": 846} {"train_loss": -10.403397560119629, "global_step": 142268, "epoch": 846} {"train_loss": -10.50794506072998, "global_step": 142269, "epoch": 846} {"train_loss": -10.294527053833008, "global_step": 142270, "epoch": 846} {"train_loss": -10.466623306274414, "global_step": 142271, "epoch": 846} {"train_loss": -10.37612533569336, "global_step": 142272, "epoch": 846} {"train_loss": -10.30290412902832, "global_step": 142273, "epoch": 846} {"train_loss": -10.48194694519043, "global_step": 142274, "epoch": 846} {"train_loss": -10.2748384475708, "global_step": 142275, "epoch": 846} {"train_loss": -10.085241317749023, "global_step": 142276, "epoch": 846} {"train_loss": -10.504409790039062, "global_step": 142277, "epoch": 846} {"train_loss": -10.636727333068848, "global_step": 142278, "epoch": 846} {"train_loss": -10.513166427612305, "global_step": 142279, "epoch": 846} {"train_loss": -10.631048202514648, "global_step": 142280, "epoch": 846} {"train_loss": -10.049592971801758, "global_step": 142281, "epoch": 846} {"train_loss": -10.43619441986084, "global_step": 142282, "epoch": 846} {"train_loss": -10.548309326171875, "global_step": 142283, "epoch": 846} {"train_loss": -10.33841323852539, "global_step": 142284, "epoch": 846} {"train_loss": -10.790164947509766, "global_step": 142285, "epoch": 846} {"train_loss": -10.344758033752441, "global_step": 142286, "epoch": 846} {"train_loss": -10.554122924804688, "global_step": 142287, "epoch": 846} {"train_loss": -10.31707763671875, "global_step": 142288, "epoch": 846} {"train_loss": -10.22526741027832, "global_step": 142289, "epoch": 846} {"train_loss": -10.26968002319336, "global_step": 142290, "epoch": 846} {"train_loss": -10.17707633972168, "global_step": 142291, "epoch": 846} {"train_loss": -10.513740539550781, "global_step": 142292, "epoch": 846} {"train_loss": -10.289758682250977, "global_step": 142293, "epoch": 846} {"train_loss": -10.230783462524414, "global_step": 142294, "epoch": 846} {"train_loss": -10.480411682810102, "global_step": 142295, "epoch": 846, "val_loss": 219658.046875} {"train_loss": -9.994009971618652, "global_step": 142296, "epoch": 847} {"train_loss": -10.633123397827148, "global_step": 142297, "epoch": 847} {"train_loss": -10.013381958007812, "global_step": 142298, "epoch": 847} {"train_loss": -10.617359161376953, "global_step": 142299, "epoch": 847} {"train_loss": -10.476492881774902, "global_step": 142300, "epoch": 847} {"train_loss": -10.512959480285645, "global_step": 142301, "epoch": 847} {"train_loss": -9.911359786987305, "global_step": 142302, "epoch": 847} {"train_loss": -10.349448204040527, "global_step": 142303, "epoch": 847} {"train_loss": -10.367255210876465, "global_step": 142304, "epoch": 847} {"train_loss": -10.50328540802002, "global_step": 142305, "epoch": 847} {"train_loss": -10.15638542175293, "global_step": 142306, "epoch": 847} {"train_loss": -10.17576789855957, "global_step": 142307, "epoch": 847} {"train_loss": -10.384716033935547, "global_step": 142308, "epoch": 847} {"train_loss": -10.078388214111328, "global_step": 142309, "epoch": 847} {"train_loss": -10.562581062316895, "global_step": 142310, "epoch": 847} {"train_loss": -10.034186363220215, "global_step": 142311, "epoch": 847} {"train_loss": -10.26506519317627, "global_step": 142312, "epoch": 847} {"train_loss": -10.5317964553833, "global_step": 142313, "epoch": 847} {"train_loss": -10.504894256591797, "global_step": 142314, "epoch": 847} {"train_loss": -10.477363586425781, "global_step": 142315, "epoch": 847} {"train_loss": -10.496042251586914, "global_step": 142316, "epoch": 847} {"train_loss": -10.265389442443848, "global_step": 142317, "epoch": 847} {"train_loss": -10.583389282226562, "global_step": 142318, "epoch": 847} {"train_loss": -10.583008766174316, "global_step": 142319, "epoch": 847} {"train_loss": -10.56993293762207, "global_step": 142320, "epoch": 847} {"train_loss": -10.687745094299316, "global_step": 142321, "epoch": 847} {"train_loss": -10.72083854675293, "global_step": 142322, "epoch": 847} {"train_loss": -10.806732177734375, "global_step": 142323, "epoch": 847} {"train_loss": -10.757417678833008, "global_step": 142324, "epoch": 847} {"train_loss": -10.854530334472656, "global_step": 142325, "epoch": 847} {"train_loss": -10.717615127563477, "global_step": 142326, "epoch": 847} {"train_loss": -10.479391098022461, "global_step": 142327, "epoch": 847} {"train_loss": -10.93314266204834, "global_step": 142328, "epoch": 847} {"train_loss": -10.65861988067627, "global_step": 142329, "epoch": 847} {"train_loss": -11.00660514831543, "global_step": 142330, "epoch": 847} {"train_loss": -10.779834747314453, "global_step": 142331, "epoch": 847} {"train_loss": -10.860143661499023, "global_step": 142332, "epoch": 847} {"train_loss": -10.89258098602295, "global_step": 142333, "epoch": 847} {"train_loss": -10.701542854309082, "global_step": 142334, "epoch": 847} {"train_loss": -10.815228462219238, "global_step": 142335, "epoch": 847} {"train_loss": -10.575331687927246, "global_step": 142336, "epoch": 847} {"train_loss": -10.755029678344727, "global_step": 142337, "epoch": 847} {"train_loss": -10.624957084655762, "global_step": 142338, "epoch": 847} {"train_loss": -10.47530460357666, "global_step": 142339, "epoch": 847} {"train_loss": -10.603241920471191, "global_step": 142340, "epoch": 847} {"train_loss": -10.595379829406738, "global_step": 142341, "epoch": 847} {"train_loss": -10.24798583984375, "global_step": 142342, "epoch": 847} {"train_loss": -10.856801986694336, "global_step": 142343, "epoch": 847} {"train_loss": -9.923645973205566, "global_step": 142344, "epoch": 847} {"train_loss": -10.76662540435791, "global_step": 142345, "epoch": 847} {"train_loss": -11.026158332824707, "global_step": 142346, "epoch": 847} {"train_loss": -10.387628555297852, "global_step": 142347, "epoch": 847} {"train_loss": -10.446784973144531, "global_step": 142348, "epoch": 847} {"train_loss": -10.659646987915039, "global_step": 142349, "epoch": 847} {"train_loss": -10.395687103271484, "global_step": 142350, "epoch": 847} {"train_loss": -10.453333854675293, "global_step": 142351, "epoch": 847} {"train_loss": -10.9556884765625, "global_step": 142352, "epoch": 847} {"train_loss": -10.410811424255371, "global_step": 142353, "epoch": 847} {"train_loss": -10.70178508758545, "global_step": 142354, "epoch": 847} {"train_loss": -10.403169631958008, "global_step": 142355, "epoch": 847} {"train_loss": -10.063604354858398, "global_step": 142356, "epoch": 847} {"train_loss": -10.510976791381836, "global_step": 142357, "epoch": 847} {"train_loss": -10.380571365356445, "global_step": 142358, "epoch": 847} {"train_loss": -10.635515213012695, "global_step": 142359, "epoch": 847} {"train_loss": -10.702188491821289, "global_step": 142360, "epoch": 847} {"train_loss": -9.644492149353027, "global_step": 142361, "epoch": 847} {"train_loss": -10.248838424682617, "global_step": 142362, "epoch": 847} {"train_loss": -10.297319412231445, "global_step": 142363, "epoch": 847} {"train_loss": -10.040424346923828, "global_step": 142364, "epoch": 847} {"train_loss": -10.905863761901855, "global_step": 142365, "epoch": 847} {"train_loss": -10.13104248046875, "global_step": 142366, "epoch": 847} {"train_loss": -10.429154396057129, "global_step": 142367, "epoch": 847} {"train_loss": -10.32569694519043, "global_step": 142368, "epoch": 847} {"train_loss": -10.008925437927246, "global_step": 142369, "epoch": 847} {"train_loss": -10.845084190368652, "global_step": 142370, "epoch": 847} {"train_loss": -10.102599143981934, "global_step": 142371, "epoch": 847} {"train_loss": -10.64736270904541, "global_step": 142372, "epoch": 847} {"train_loss": -10.304620742797852, "global_step": 142373, "epoch": 847} {"train_loss": -10.451738357543945, "global_step": 142374, "epoch": 847} {"train_loss": -10.343572616577148, "global_step": 142375, "epoch": 847} {"train_loss": -10.55009651184082, "global_step": 142376, "epoch": 847} {"train_loss": -10.565226554870605, "global_step": 142377, "epoch": 847} {"train_loss": -10.63634967803955, "global_step": 142378, "epoch": 847} {"train_loss": -10.566245079040527, "global_step": 142379, "epoch": 847} {"train_loss": -10.725725173950195, "global_step": 142380, "epoch": 847} {"train_loss": -10.569986343383789, "global_step": 142381, "epoch": 847} {"train_loss": -10.681541442871094, "global_step": 142382, "epoch": 847} {"train_loss": -10.486066818237305, "global_step": 142383, "epoch": 847} {"train_loss": -10.46653938293457, "global_step": 142384, "epoch": 847} {"train_loss": -10.780803680419922, "global_step": 142385, "epoch": 847} {"train_loss": -10.542671203613281, "global_step": 142386, "epoch": 847} {"train_loss": -10.129190444946289, "global_step": 142387, "epoch": 847} {"train_loss": -10.545160293579102, "global_step": 142388, "epoch": 847} {"train_loss": -10.2186918258667, "global_step": 142389, "epoch": 847} {"train_loss": -10.30318546295166, "global_step": 142390, "epoch": 847} {"train_loss": -10.565354347229004, "global_step": 142391, "epoch": 847} {"train_loss": -10.681997299194336, "global_step": 142392, "epoch": 847} {"train_loss": -10.856538772583008, "global_step": 142393, "epoch": 847} {"train_loss": -10.70016860961914, "global_step": 142394, "epoch": 847} {"train_loss": -10.552824020385742, "global_step": 142395, "epoch": 847} {"train_loss": -10.763001441955566, "global_step": 142396, "epoch": 847} {"train_loss": -10.282182693481445, "global_step": 142397, "epoch": 847} {"train_loss": -10.643033981323242, "global_step": 142398, "epoch": 847} {"train_loss": -10.379989624023438, "global_step": 142399, "epoch": 847} {"train_loss": -10.682892799377441, "global_step": 142400, "epoch": 847} {"train_loss": -10.662534713745117, "global_step": 142401, "epoch": 847} {"train_loss": -10.685286521911621, "global_step": 142402, "epoch": 847} {"train_loss": -10.863147735595703, "global_step": 142403, "epoch": 847} {"train_loss": -10.509805679321289, "global_step": 142404, "epoch": 847} {"train_loss": -10.787117958068848, "global_step": 142405, "epoch": 847} {"train_loss": -10.7145357131958, "global_step": 142406, "epoch": 847} {"train_loss": -10.741081237792969, "global_step": 142407, "epoch": 847} {"train_loss": -10.720033645629883, "global_step": 142408, "epoch": 847} {"train_loss": -10.458672523498535, "global_step": 142409, "epoch": 847} {"train_loss": -10.619064331054688, "global_step": 142410, "epoch": 847} {"train_loss": -10.590616226196289, "global_step": 142411, "epoch": 847} {"train_loss": -10.890106201171875, "global_step": 142412, "epoch": 847} {"train_loss": -10.807796478271484, "global_step": 142413, "epoch": 847} {"train_loss": -10.505988121032715, "global_step": 142414, "epoch": 847} {"train_loss": -10.799139976501465, "global_step": 142415, "epoch": 847} {"train_loss": -10.57965087890625, "global_step": 142416, "epoch": 847} {"train_loss": -10.831960678100586, "global_step": 142417, "epoch": 847} {"train_loss": -10.65110969543457, "global_step": 142418, "epoch": 847} {"train_loss": -10.393231391906738, "global_step": 142419, "epoch": 847} {"train_loss": -10.646163940429688, "global_step": 142420, "epoch": 847} {"train_loss": -10.667313575744629, "global_step": 142421, "epoch": 847} {"train_loss": -10.636330604553223, "global_step": 142422, "epoch": 847} {"train_loss": -10.342037200927734, "global_step": 142423, "epoch": 847} {"train_loss": -10.834543228149414, "global_step": 142424, "epoch": 847} {"train_loss": -10.440821647644043, "global_step": 142425, "epoch": 847} {"train_loss": -10.614556312561035, "global_step": 142426, "epoch": 847} {"train_loss": -10.524736404418945, "global_step": 142427, "epoch": 847} {"train_loss": -10.137219429016113, "global_step": 142428, "epoch": 847} {"train_loss": -10.585655212402344, "global_step": 142429, "epoch": 847} {"train_loss": -10.385575294494629, "global_step": 142430, "epoch": 847} {"train_loss": -10.550589561462402, "global_step": 142431, "epoch": 847} {"train_loss": -10.532194137573242, "global_step": 142432, "epoch": 847} {"train_loss": -10.21407699584961, "global_step": 142433, "epoch": 847} {"train_loss": -10.815055847167969, "global_step": 142434, "epoch": 847} {"train_loss": -10.754280090332031, "global_step": 142435, "epoch": 847} {"train_loss": -10.740520477294922, "global_step": 142436, "epoch": 847} {"train_loss": -10.810276985168457, "global_step": 142437, "epoch": 847} {"train_loss": -10.583880424499512, "global_step": 142438, "epoch": 847} {"train_loss": -10.608485221862793, "global_step": 142439, "epoch": 847} {"train_loss": -10.838289260864258, "global_step": 142440, "epoch": 847} {"train_loss": -10.492392539978027, "global_step": 142441, "epoch": 847} {"train_loss": -10.70842456817627, "global_step": 142442, "epoch": 847} {"train_loss": -10.680795669555664, "global_step": 142443, "epoch": 847} {"train_loss": -10.708330154418945, "global_step": 142444, "epoch": 847} {"train_loss": -10.959622383117676, "global_step": 142445, "epoch": 847} {"train_loss": -10.733041763305664, "global_step": 142446, "epoch": 847} {"train_loss": -10.753959655761719, "global_step": 142447, "epoch": 847} {"train_loss": -10.77818489074707, "global_step": 142448, "epoch": 847} {"train_loss": -10.73921012878418, "global_step": 142449, "epoch": 847} {"train_loss": -10.846860885620117, "global_step": 142450, "epoch": 847} {"train_loss": -10.914102554321289, "global_step": 142451, "epoch": 847} {"train_loss": -10.70594596862793, "global_step": 142452, "epoch": 847} {"train_loss": -10.930158615112305, "global_step": 142453, "epoch": 847} {"train_loss": -10.937128067016602, "global_step": 142454, "epoch": 847} {"train_loss": -10.604891777038574, "global_step": 142455, "epoch": 847} {"train_loss": -10.709298133850098, "global_step": 142456, "epoch": 847} {"train_loss": -10.895689010620117, "global_step": 142457, "epoch": 847} {"train_loss": -10.648229598999023, "global_step": 142458, "epoch": 847} {"train_loss": -10.58289909362793, "global_step": 142459, "epoch": 847} {"train_loss": -10.571240425109863, "global_step": 142460, "epoch": 847} {"train_loss": -10.375005722045898, "global_step": 142461, "epoch": 847} {"train_loss": -10.781124114990234, "global_step": 142462, "epoch": 847} {"train_loss": -10.564200202624003, "global_step": 142463, "epoch": 847, "val_loss": 223947.703125} {"train_loss": -11.075153350830078, "global_step": 142464, "epoch": 848} {"train_loss": -10.839920043945312, "global_step": 142465, "epoch": 848} {"train_loss": -10.73417854309082, "global_step": 142466, "epoch": 848} {"train_loss": -10.886842727661133, "global_step": 142467, "epoch": 848} {"train_loss": -10.853057861328125, "global_step": 142468, "epoch": 848} {"train_loss": -10.941608428955078, "global_step": 142469, "epoch": 848} {"train_loss": -10.956380844116211, "global_step": 142470, "epoch": 848} {"train_loss": -10.922140121459961, "global_step": 142471, "epoch": 848} {"train_loss": -11.150138854980469, "global_step": 142472, "epoch": 848} {"train_loss": -10.921651840209961, "global_step": 142473, "epoch": 848} {"train_loss": -10.97022819519043, "global_step": 142474, "epoch": 848} {"train_loss": -10.920119285583496, "global_step": 142475, "epoch": 848} {"train_loss": -10.844819068908691, "global_step": 142476, "epoch": 848} {"train_loss": -10.690988540649414, "global_step": 142477, "epoch": 848} {"train_loss": -10.406371116638184, "global_step": 142478, "epoch": 848} {"train_loss": -10.558619499206543, "global_step": 142479, "epoch": 848} {"train_loss": -10.901172637939453, "global_step": 142480, "epoch": 848} {"train_loss": -10.758108139038086, "global_step": 142481, "epoch": 848} {"train_loss": -10.141162872314453, "global_step": 142482, "epoch": 848} {"train_loss": -10.845670700073242, "global_step": 142483, "epoch": 848} {"train_loss": -10.607962608337402, "global_step": 142484, "epoch": 848} {"train_loss": -10.509068489074707, "global_step": 142485, "epoch": 848} {"train_loss": -10.554645538330078, "global_step": 142486, "epoch": 848} {"train_loss": -10.46754264831543, "global_step": 142487, "epoch": 848} {"train_loss": -9.630025863647461, "global_step": 142488, "epoch": 848} {"train_loss": -10.604220390319824, "global_step": 142489, "epoch": 848} {"train_loss": -8.551202774047852, "global_step": 142490, "epoch": 848} {"train_loss": -9.22624397277832, "global_step": 142491, "epoch": 848} {"train_loss": -10.11536979675293, "global_step": 142492, "epoch": 848} {"train_loss": -8.452503204345703, "global_step": 142493, "epoch": 848} {"train_loss": -9.344989776611328, "global_step": 142494, "epoch": 848} {"train_loss": -8.954636573791504, "global_step": 142495, "epoch": 848} {"train_loss": -9.749260902404785, "global_step": 142496, "epoch": 848} {"train_loss": -8.496309280395508, "global_step": 142497, "epoch": 848} {"train_loss": -10.074392318725586, "global_step": 142498, "epoch": 848} {"train_loss": -9.025891304016113, "global_step": 142499, "epoch": 848} {"train_loss": -10.007218360900879, "global_step": 142500, "epoch": 848} {"train_loss": -10.07585334777832, "global_step": 142501, "epoch": 848} {"train_loss": -10.03101921081543, "global_step": 142502, "epoch": 848} {"train_loss": -10.138801574707031, "global_step": 142503, "epoch": 848} {"train_loss": -10.131810188293457, "global_step": 142504, "epoch": 848} {"train_loss": -10.011817932128906, "global_step": 142505, "epoch": 848} {"train_loss": -9.897808074951172, "global_step": 142506, "epoch": 848} {"train_loss": -9.854565620422363, "global_step": 142507, "epoch": 848} {"train_loss": -10.334392547607422, "global_step": 142508, "epoch": 848} {"train_loss": -10.155077934265137, "global_step": 142509, "epoch": 848} {"train_loss": -10.17477035522461, "global_step": 142510, "epoch": 848} {"train_loss": -10.566740989685059, "global_step": 142511, "epoch": 848} {"train_loss": -10.51176929473877, "global_step": 142512, "epoch": 848} {"train_loss": -10.18683910369873, "global_step": 142513, "epoch": 848} {"train_loss": -10.174283981323242, "global_step": 142514, "epoch": 848} {"train_loss": -10.267748832702637, "global_step": 142515, "epoch": 848} {"train_loss": -10.191811561584473, "global_step": 142516, "epoch": 848} {"train_loss": -10.627561569213867, "global_step": 142517, "epoch": 848} {"train_loss": -10.26058578491211, "global_step": 142518, "epoch": 848} {"train_loss": -10.24624252319336, "global_step": 142519, "epoch": 848} {"train_loss": -10.197089195251465, "global_step": 142520, "epoch": 848} {"train_loss": -10.243473052978516, "global_step": 142521, "epoch": 848} {"train_loss": -10.42237663269043, "global_step": 142522, "epoch": 848} {"train_loss": -10.42799186706543, "global_step": 142523, "epoch": 848} {"train_loss": -10.403564453125, "global_step": 142524, "epoch": 848} {"train_loss": -10.315689086914062, "global_step": 142525, "epoch": 848} {"train_loss": -10.553215026855469, "global_step": 142526, "epoch": 848} {"train_loss": -10.639646530151367, "global_step": 142527, "epoch": 848} {"train_loss": -10.51930046081543, "global_step": 142528, "epoch": 848} {"train_loss": -10.594221115112305, "global_step": 142529, "epoch": 848} {"train_loss": -10.539546966552734, "global_step": 142530, "epoch": 848} {"train_loss": -10.43616771697998, "global_step": 142531, "epoch": 848} {"train_loss": -10.710075378417969, "global_step": 142532, "epoch": 848} {"train_loss": -10.42230224609375, "global_step": 142533, "epoch": 848} {"train_loss": -10.336094856262207, "global_step": 142534, "epoch": 848} {"train_loss": -10.572527885437012, "global_step": 142535, "epoch": 848} {"train_loss": -10.672935485839844, "global_step": 142536, "epoch": 848} {"train_loss": -10.414168357849121, "global_step": 142537, "epoch": 848} {"train_loss": -10.768593788146973, "global_step": 142538, "epoch": 848} {"train_loss": -10.526947021484375, "global_step": 142539, "epoch": 848} {"train_loss": -10.843971252441406, "global_step": 142540, "epoch": 848} {"train_loss": -10.545019149780273, "global_step": 142541, "epoch": 848} {"train_loss": -10.692723274230957, "global_step": 142542, "epoch": 848} {"train_loss": -10.531464576721191, "global_step": 142543, "epoch": 848} {"train_loss": -10.67097282409668, "global_step": 142544, "epoch": 848} {"train_loss": -10.971471786499023, "global_step": 142545, "epoch": 848} {"train_loss": -10.85914134979248, "global_step": 142546, "epoch": 848} {"train_loss": -10.77704906463623, "global_step": 142547, "epoch": 848} {"train_loss": -10.64799976348877, "global_step": 142548, "epoch": 848} {"train_loss": -10.8524169921875, "global_step": 142549, "epoch": 848} {"train_loss": -10.56747817993164, "global_step": 142550, "epoch": 848} {"train_loss": -10.969542503356934, "global_step": 142551, "epoch": 848} {"train_loss": -10.840272903442383, "global_step": 142552, "epoch": 848} {"train_loss": -10.543782234191895, "global_step": 142553, "epoch": 848} {"train_loss": -10.676055908203125, "global_step": 142554, "epoch": 848} {"train_loss": -11.003898620605469, "global_step": 142555, "epoch": 848} {"train_loss": -10.707765579223633, "global_step": 142556, "epoch": 848} {"train_loss": -10.673782348632812, "global_step": 142557, "epoch": 848} {"train_loss": -10.954570770263672, "global_step": 142558, "epoch": 848} {"train_loss": -10.455923080444336, "global_step": 142559, "epoch": 848} {"train_loss": -10.729565620422363, "global_step": 142560, "epoch": 848} {"train_loss": -10.530091285705566, "global_step": 142561, "epoch": 848} {"train_loss": -9.939720153808594, "global_step": 142562, "epoch": 848} {"train_loss": -10.770198822021484, "global_step": 142563, "epoch": 848} {"train_loss": -10.092849731445312, "global_step": 142564, "epoch": 848} {"train_loss": -10.482547760009766, "global_step": 142565, "epoch": 848} {"train_loss": -10.786888122558594, "global_step": 142566, "epoch": 848} {"train_loss": -10.34461784362793, "global_step": 142567, "epoch": 848} {"train_loss": -10.803675651550293, "global_step": 142568, "epoch": 848} {"train_loss": -10.248292922973633, "global_step": 142569, "epoch": 848} {"train_loss": -10.275794982910156, "global_step": 142570, "epoch": 848} {"train_loss": -10.592032432556152, "global_step": 142571, "epoch": 848} {"train_loss": -10.408411979675293, "global_step": 142572, "epoch": 848} {"train_loss": -10.345136642456055, "global_step": 142573, "epoch": 848} {"train_loss": -10.42622184753418, "global_step": 142574, "epoch": 848} {"train_loss": -10.52001667022705, "global_step": 142575, "epoch": 848} {"train_loss": -10.167523384094238, "global_step": 142576, "epoch": 848} {"train_loss": -10.410432815551758, "global_step": 142577, "epoch": 848} {"train_loss": -10.246225357055664, "global_step": 142578, "epoch": 848} {"train_loss": -10.400205612182617, "global_step": 142579, "epoch": 848} {"train_loss": -10.621794700622559, "global_step": 142580, "epoch": 848} {"train_loss": -9.935806274414062, "global_step": 142581, "epoch": 848} {"train_loss": -10.005041122436523, "global_step": 142582, "epoch": 848} {"train_loss": -10.066352844238281, "global_step": 142583, "epoch": 848} {"train_loss": -9.964266777038574, "global_step": 142584, "epoch": 848} {"train_loss": -10.503830909729004, "global_step": 142585, "epoch": 848} {"train_loss": -9.885351181030273, "global_step": 142586, "epoch": 848} {"train_loss": -10.77392864227295, "global_step": 142587, "epoch": 848} {"train_loss": -10.396714210510254, "global_step": 142588, "epoch": 848} {"train_loss": -10.34670639038086, "global_step": 142589, "epoch": 848} {"train_loss": -10.277656555175781, "global_step": 142590, "epoch": 848} {"train_loss": -10.63963794708252, "global_step": 142591, "epoch": 848} {"train_loss": -10.31562614440918, "global_step": 142592, "epoch": 848} {"train_loss": -10.352707862854004, "global_step": 142593, "epoch": 848} {"train_loss": -10.618749618530273, "global_step": 142594, "epoch": 848} {"train_loss": -10.37739372253418, "global_step": 142595, "epoch": 848} {"train_loss": -10.231897354125977, "global_step": 142596, "epoch": 848} {"train_loss": -10.606236457824707, "global_step": 142597, "epoch": 848} {"train_loss": -10.156620025634766, "global_step": 142598, "epoch": 848} {"train_loss": -10.289259910583496, "global_step": 142599, "epoch": 848} {"train_loss": -10.439104080200195, "global_step": 142600, "epoch": 848} {"train_loss": -10.426746368408203, "global_step": 142601, "epoch": 848} {"train_loss": -10.275182723999023, "global_step": 142602, "epoch": 848} {"train_loss": -10.765460968017578, "global_step": 142603, "epoch": 848} {"train_loss": -10.367803573608398, "global_step": 142604, "epoch": 848} {"train_loss": -10.251657485961914, "global_step": 142605, "epoch": 848} {"train_loss": -10.839834213256836, "global_step": 142606, "epoch": 848} {"train_loss": -10.567571640014648, "global_step": 142607, "epoch": 848} {"train_loss": -10.367197036743164, "global_step": 142608, "epoch": 848} {"train_loss": -10.794182777404785, "global_step": 142609, "epoch": 848} {"train_loss": -10.512516021728516, "global_step": 142610, "epoch": 848} {"train_loss": -10.43136215209961, "global_step": 142611, "epoch": 848} {"train_loss": -10.53548812866211, "global_step": 142612, "epoch": 848} {"train_loss": -10.520606994628906, "global_step": 142613, "epoch": 848} {"train_loss": -10.385873794555664, "global_step": 142614, "epoch": 848} {"train_loss": -10.469402313232422, "global_step": 142615, "epoch": 848} {"train_loss": -10.424236297607422, "global_step": 142616, "epoch": 848} {"train_loss": -10.594614028930664, "global_step": 142617, "epoch": 848} {"train_loss": -10.752732276916504, "global_step": 142618, "epoch": 848} {"train_loss": -10.875761032104492, "global_step": 142619, "epoch": 848} {"train_loss": -10.669408798217773, "global_step": 142620, "epoch": 848} {"train_loss": -10.699623107910156, "global_step": 142621, "epoch": 848} {"train_loss": -10.783018112182617, "global_step": 142622, "epoch": 848} {"train_loss": -10.676153182983398, "global_step": 142623, "epoch": 848} {"train_loss": -10.930146217346191, "global_step": 142624, "epoch": 848} {"train_loss": -10.92185115814209, "global_step": 142625, "epoch": 848} {"train_loss": -10.69515609741211, "global_step": 142626, "epoch": 848} {"train_loss": -10.754499435424805, "global_step": 142627, "epoch": 848} {"train_loss": -10.822422981262207, "global_step": 142628, "epoch": 848} {"train_loss": -10.654935836791992, "global_step": 142629, "epoch": 848} {"train_loss": -10.987837791442871, "global_step": 142630, "epoch": 848} {"train_loss": -10.439878997348604, "global_step": 142631, "epoch": 848, "val_loss": 223166.125} {"train_loss": -10.907787322998047, "global_step": 142632, "epoch": 849} {"train_loss": -10.55868148803711, "global_step": 142633, "epoch": 849} {"train_loss": -10.71725082397461, "global_step": 142634, "epoch": 849} {"train_loss": -10.457955360412598, "global_step": 142635, "epoch": 849} {"train_loss": -10.727582931518555, "global_step": 142636, "epoch": 849} {"train_loss": -10.701122283935547, "global_step": 142637, "epoch": 849} {"train_loss": -10.460216522216797, "global_step": 142638, "epoch": 849} {"train_loss": -10.797223091125488, "global_step": 142639, "epoch": 849} {"train_loss": -10.721697807312012, "global_step": 142640, "epoch": 849} {"train_loss": -10.429891586303711, "global_step": 142641, "epoch": 849} {"train_loss": -10.540826797485352, "global_step": 142642, "epoch": 849} {"train_loss": -10.534154891967773, "global_step": 142643, "epoch": 849} {"train_loss": -10.803567886352539, "global_step": 142644, "epoch": 849} {"train_loss": -10.28592586517334, "global_step": 142645, "epoch": 849} {"train_loss": -10.745246887207031, "global_step": 142646, "epoch": 849} {"train_loss": -10.4525728225708, "global_step": 142647, "epoch": 849} {"train_loss": -10.793220520019531, "global_step": 142648, "epoch": 849} {"train_loss": -9.102394104003906, "global_step": 142649, "epoch": 849} {"train_loss": -10.291213035583496, "global_step": 142650, "epoch": 849} {"train_loss": -10.37596321105957, "global_step": 142651, "epoch": 849} {"train_loss": -9.894231796264648, "global_step": 142652, "epoch": 849} {"train_loss": -9.95678424835205, "global_step": 142653, "epoch": 849} {"train_loss": -9.762226104736328, "global_step": 142654, "epoch": 849} {"train_loss": -8.480436325073242, "global_step": 142655, "epoch": 849} {"train_loss": -8.535043716430664, "global_step": 142656, "epoch": 849} {"train_loss": -9.897236824035645, "global_step": 142657, "epoch": 849} {"train_loss": -9.276363372802734, "global_step": 142658, "epoch": 849} {"train_loss": -8.98351001739502, "global_step": 142659, "epoch": 849} {"train_loss": -9.23508071899414, "global_step": 142660, "epoch": 849} {"train_loss": -9.677311897277832, "global_step": 142661, "epoch": 849} {"train_loss": -9.100576400756836, "global_step": 142662, "epoch": 849} {"train_loss": -9.658113479614258, "global_step": 142663, "epoch": 849} {"train_loss": -10.022936820983887, "global_step": 142664, "epoch": 849} {"train_loss": -9.772218704223633, "global_step": 142665, "epoch": 849} {"train_loss": -10.138094902038574, "global_step": 142666, "epoch": 849} {"train_loss": -9.697744369506836, "global_step": 142667, "epoch": 849} {"train_loss": -10.276455879211426, "global_step": 142668, "epoch": 849} {"train_loss": -10.29925537109375, "global_step": 142669, "epoch": 849} {"train_loss": -10.259939193725586, "global_step": 142670, "epoch": 849} {"train_loss": -10.245226860046387, "global_step": 142671, "epoch": 849} {"train_loss": -10.233859062194824, "global_step": 142672, "epoch": 849} {"train_loss": -10.381566047668457, "global_step": 142673, "epoch": 849} {"train_loss": -10.092792510986328, "global_step": 142674, "epoch": 849} {"train_loss": -10.494670867919922, "global_step": 142675, "epoch": 849} {"train_loss": -10.403227806091309, "global_step": 142676, "epoch": 849} {"train_loss": -10.4978609085083, "global_step": 142677, "epoch": 849} {"train_loss": -10.380815505981445, "global_step": 142678, "epoch": 849} {"train_loss": -10.477468490600586, "global_step": 142679, "epoch": 849} {"train_loss": -10.23060417175293, "global_step": 142680, "epoch": 849} {"train_loss": -10.623983383178711, "global_step": 142681, "epoch": 849} {"train_loss": -10.613819122314453, "global_step": 142682, "epoch": 849} {"train_loss": -10.399274826049805, "global_step": 142683, "epoch": 849} {"train_loss": -10.465778350830078, "global_step": 142684, "epoch": 849} {"train_loss": -10.557048797607422, "global_step": 142685, "epoch": 849} {"train_loss": -10.570426940917969, "global_step": 142686, "epoch": 849} {"train_loss": -10.511103630065918, "global_step": 142687, "epoch": 849} {"train_loss": -10.553468704223633, "global_step": 142688, "epoch": 849} {"train_loss": -10.702210426330566, "global_step": 142689, "epoch": 849} {"train_loss": -10.517206192016602, "global_step": 142690, "epoch": 849} {"train_loss": -10.644351959228516, "global_step": 142691, "epoch": 849} {"train_loss": -10.654764175415039, "global_step": 142692, "epoch": 849} {"train_loss": -10.68370246887207, "global_step": 142693, "epoch": 849} {"train_loss": -10.555217742919922, "global_step": 142694, "epoch": 849} {"train_loss": -10.806290626525879, "global_step": 142695, "epoch": 849} {"train_loss": -10.560759544372559, "global_step": 142696, "epoch": 849} {"train_loss": -10.82817268371582, "global_step": 142697, "epoch": 849} {"train_loss": -10.720084190368652, "global_step": 142698, "epoch": 849} {"train_loss": -10.860962867736816, "global_step": 142699, "epoch": 849} {"train_loss": -10.787761688232422, "global_step": 142700, "epoch": 849} {"train_loss": -10.641422271728516, "global_step": 142701, "epoch": 849} {"train_loss": -10.8263521194458, "global_step": 142702, "epoch": 849} {"train_loss": -10.781475067138672, "global_step": 142703, "epoch": 849} {"train_loss": -10.71544075012207, "global_step": 142704, "epoch": 849} {"train_loss": -10.761371612548828, "global_step": 142705, "epoch": 849} {"train_loss": -10.602336883544922, "global_step": 142706, "epoch": 849} {"train_loss": -10.66718864440918, "global_step": 142707, "epoch": 849} {"train_loss": -10.792972564697266, "global_step": 142708, "epoch": 849} {"train_loss": -10.53565788269043, "global_step": 142709, "epoch": 849} {"train_loss": -10.132265090942383, "global_step": 142710, "epoch": 849} {"train_loss": -10.703113555908203, "global_step": 142711, "epoch": 849} {"train_loss": -10.703433990478516, "global_step": 142712, "epoch": 849} {"train_loss": -10.601969718933105, "global_step": 142713, "epoch": 849} {"train_loss": -10.935359954833984, "global_step": 142714, "epoch": 849} {"train_loss": -10.758084297180176, "global_step": 142715, "epoch": 849} {"train_loss": -10.99223518371582, "global_step": 142716, "epoch": 849} {"train_loss": -10.57090950012207, "global_step": 142717, "epoch": 849} {"train_loss": -10.570489883422852, "global_step": 142718, "epoch": 849} {"train_loss": -10.671829223632812, "global_step": 142719, "epoch": 849} {"train_loss": -10.486949920654297, "global_step": 142720, "epoch": 849} {"train_loss": -10.905963897705078, "global_step": 142721, "epoch": 849} {"train_loss": -10.418909072875977, "global_step": 142722, "epoch": 849} {"train_loss": -9.901276588439941, "global_step": 142723, "epoch": 849} {"train_loss": -10.529621124267578, "global_step": 142724, "epoch": 849} {"train_loss": -10.657074928283691, "global_step": 142725, "epoch": 849} {"train_loss": -10.089319229125977, "global_step": 142726, "epoch": 849} {"train_loss": -10.671730041503906, "global_step": 142727, "epoch": 849} {"train_loss": -9.64271354675293, "global_step": 142728, "epoch": 849} {"train_loss": -10.344429016113281, "global_step": 142729, "epoch": 849} {"train_loss": -10.094858169555664, "global_step": 142730, "epoch": 849} {"train_loss": -10.504558563232422, "global_step": 142731, "epoch": 849} {"train_loss": -9.996110916137695, "global_step": 142732, "epoch": 849} {"train_loss": -10.734077453613281, "global_step": 142733, "epoch": 849} {"train_loss": -10.189249038696289, "global_step": 142734, "epoch": 849} {"train_loss": -10.379144668579102, "global_step": 142735, "epoch": 849} {"train_loss": -10.664642333984375, "global_step": 142736, "epoch": 849} {"train_loss": -10.30160903930664, "global_step": 142737, "epoch": 849} {"train_loss": -10.668704986572266, "global_step": 142738, "epoch": 849} {"train_loss": -10.338102340698242, "global_step": 142739, "epoch": 849} {"train_loss": -10.83535385131836, "global_step": 142740, "epoch": 849} {"train_loss": -10.642007827758789, "global_step": 142741, "epoch": 849} {"train_loss": -10.663705825805664, "global_step": 142742, "epoch": 849} {"train_loss": -10.681652069091797, "global_step": 142743, "epoch": 849} {"train_loss": -10.447311401367188, "global_step": 142744, "epoch": 849} {"train_loss": -10.770756721496582, "global_step": 142745, "epoch": 849} {"train_loss": -10.823005676269531, "global_step": 142746, "epoch": 849} {"train_loss": -10.78754997253418, "global_step": 142747, "epoch": 849} {"train_loss": -10.553333282470703, "global_step": 142748, "epoch": 849} {"train_loss": -10.739656448364258, "global_step": 142749, "epoch": 849} {"train_loss": -10.449212074279785, "global_step": 142750, "epoch": 849} {"train_loss": -10.67153263092041, "global_step": 142751, "epoch": 849} {"train_loss": -10.620856285095215, "global_step": 142752, "epoch": 849} {"train_loss": -10.450811386108398, "global_step": 142753, "epoch": 849} {"train_loss": -10.353353500366211, "global_step": 142754, "epoch": 849} {"train_loss": -10.436695098876953, "global_step": 142755, "epoch": 849} {"train_loss": -10.54067611694336, "global_step": 142756, "epoch": 849} {"train_loss": -10.517648696899414, "global_step": 142757, "epoch": 849} {"train_loss": -10.65466022491455, "global_step": 142758, "epoch": 849} {"train_loss": -10.71607780456543, "global_step": 142759, "epoch": 849} {"train_loss": -10.561264038085938, "global_step": 142760, "epoch": 849} {"train_loss": -10.752717971801758, "global_step": 142761, "epoch": 849} {"train_loss": -10.49350357055664, "global_step": 142762, "epoch": 849} {"train_loss": -10.509041786193848, "global_step": 142763, "epoch": 849} {"train_loss": -10.355132102966309, "global_step": 142764, "epoch": 849} {"train_loss": -9.931901931762695, "global_step": 142765, "epoch": 849} {"train_loss": -10.451377868652344, "global_step": 142766, "epoch": 849} {"train_loss": -9.889413833618164, "global_step": 142767, "epoch": 849} {"train_loss": -10.512205123901367, "global_step": 142768, "epoch": 849} {"train_loss": -9.87695598602295, "global_step": 142769, "epoch": 849} {"train_loss": -9.904342651367188, "global_step": 142770, "epoch": 849} {"train_loss": -10.574880599975586, "global_step": 142771, "epoch": 849} {"train_loss": -10.277266502380371, "global_step": 142772, "epoch": 849} {"train_loss": -10.579357147216797, "global_step": 142773, "epoch": 849} {"train_loss": -10.415216445922852, "global_step": 142774, "epoch": 849} {"train_loss": -10.44755744934082, "global_step": 142775, "epoch": 849} {"train_loss": -10.531187057495117, "global_step": 142776, "epoch": 849} {"train_loss": -10.41020393371582, "global_step": 142777, "epoch": 849} {"train_loss": -10.55077838897705, "global_step": 142778, "epoch": 849} {"train_loss": -10.71183967590332, "global_step": 142779, "epoch": 849} {"train_loss": -10.551811218261719, "global_step": 142780, "epoch": 849} {"train_loss": -10.826377868652344, "global_step": 142781, "epoch": 849} {"train_loss": -10.18481159210205, "global_step": 142782, "epoch": 849} {"train_loss": -10.398005485534668, "global_step": 142783, "epoch": 849} {"train_loss": -10.327981948852539, "global_step": 142784, "epoch": 849} {"train_loss": -10.52868938446045, "global_step": 142785, "epoch": 849} {"train_loss": -10.64143180847168, "global_step": 142786, "epoch": 849} {"train_loss": -10.531244277954102, "global_step": 142787, "epoch": 849} {"train_loss": -10.294954299926758, "global_step": 142788, "epoch": 849} {"train_loss": -10.601694107055664, "global_step": 142789, "epoch": 849} {"train_loss": -10.419093132019043, "global_step": 142790, "epoch": 849} {"train_loss": -10.677936553955078, "global_step": 142791, "epoch": 849} {"train_loss": -10.292106628417969, "global_step": 142792, "epoch": 849} {"train_loss": -10.581136703491211, "global_step": 142793, "epoch": 849} {"train_loss": -10.419182777404785, "global_step": 142794, "epoch": 849} {"train_loss": -10.749992370605469, "global_step": 142795, "epoch": 849} {"train_loss": -10.47327995300293, "global_step": 142796, "epoch": 849} {"train_loss": -10.699386596679688, "global_step": 142797, "epoch": 849} {"train_loss": -10.517367362976074, "global_step": 142798, "epoch": 849} {"train_loss": -10.420113955225263, "global_step": 142799, "epoch": 849, "val_loss": 225368.15625} {"train_loss": -10.696843147277832, "global_step": 142800, "epoch": 850} {"train_loss": -10.927650451660156, "global_step": 142801, "epoch": 850} {"train_loss": -10.460434913635254, "global_step": 142802, "epoch": 850} {"train_loss": -10.714921951293945, "global_step": 142803, "epoch": 850} {"train_loss": -11.033464431762695, "global_step": 142804, "epoch": 850} {"train_loss": -10.719371795654297, "global_step": 142805, "epoch": 850} {"train_loss": -10.759662628173828, "global_step": 142806, "epoch": 850} {"train_loss": -10.696630477905273, "global_step": 142807, "epoch": 850} {"train_loss": -10.537755966186523, "global_step": 142808, "epoch": 850} {"train_loss": -10.691987991333008, "global_step": 142809, "epoch": 850} {"train_loss": -10.760139465332031, "global_step": 142810, "epoch": 850} {"train_loss": -10.367462158203125, "global_step": 142811, "epoch": 850} {"train_loss": -10.839282989501953, "global_step": 142812, "epoch": 850} {"train_loss": -10.66031265258789, "global_step": 142813, "epoch": 850} {"train_loss": -10.824064254760742, "global_step": 142814, "epoch": 850} {"train_loss": -10.654821395874023, "global_step": 142815, "epoch": 850} {"train_loss": -10.602888107299805, "global_step": 142816, "epoch": 850} {"train_loss": -10.664383888244629, "global_step": 142817, "epoch": 850} {"train_loss": -10.807954788208008, "global_step": 142818, "epoch": 850} {"train_loss": -10.706220626831055, "global_step": 142819, "epoch": 850} {"train_loss": -10.776097297668457, "global_step": 142820, "epoch": 850} {"train_loss": -10.819543838500977, "global_step": 142821, "epoch": 850} {"train_loss": -10.877281188964844, "global_step": 142822, "epoch": 850} {"train_loss": -10.923250198364258, "global_step": 142823, "epoch": 850} {"train_loss": -10.756816864013672, "global_step": 142824, "epoch": 850} {"train_loss": -10.888449668884277, "global_step": 142825, "epoch": 850} {"train_loss": -10.788663864135742, "global_step": 142826, "epoch": 850} {"train_loss": -10.72245979309082, "global_step": 142827, "epoch": 850} {"train_loss": -10.787421226501465, "global_step": 142828, "epoch": 850} {"train_loss": -10.576053619384766, "global_step": 142829, "epoch": 850} {"train_loss": -10.618505477905273, "global_step": 142830, "epoch": 850} {"train_loss": -10.32359790802002, "global_step": 142831, "epoch": 850} {"train_loss": -10.794090270996094, "global_step": 142832, "epoch": 850} {"train_loss": -10.714439392089844, "global_step": 142833, "epoch": 850} {"train_loss": -10.539007186889648, "global_step": 142834, "epoch": 850} {"train_loss": -10.317253112792969, "global_step": 142835, "epoch": 850} {"train_loss": -11.054996490478516, "global_step": 142836, "epoch": 850} {"train_loss": -10.401954650878906, "global_step": 142837, "epoch": 850} {"train_loss": -10.703557014465332, "global_step": 142838, "epoch": 850} {"train_loss": -10.631057739257812, "global_step": 142839, "epoch": 850} {"train_loss": -10.403953552246094, "global_step": 142840, "epoch": 850} {"train_loss": -11.018729209899902, "global_step": 142841, "epoch": 850} {"train_loss": -9.88123607635498, "global_step": 142842, "epoch": 850} {"train_loss": -10.38247013092041, "global_step": 142843, "epoch": 850} {"train_loss": -10.377504348754883, "global_step": 142844, "epoch": 850} {"train_loss": -10.1300048828125, "global_step": 142845, "epoch": 850} {"train_loss": -10.38623046875, "global_step": 142846, "epoch": 850} {"train_loss": -10.262014389038086, "global_step": 142847, "epoch": 850} {"train_loss": -10.048186302185059, "global_step": 142848, "epoch": 850} {"train_loss": -10.464019775390625, "global_step": 142849, "epoch": 850} {"train_loss": -10.414525985717773, "global_step": 142850, "epoch": 850} {"train_loss": -10.321242332458496, "global_step": 142851, "epoch": 850} {"train_loss": -10.522056579589844, "global_step": 142852, "epoch": 850} {"train_loss": -10.4462308883667, "global_step": 142853, "epoch": 850} {"train_loss": -10.291290283203125, "global_step": 142854, "epoch": 850} {"train_loss": -10.72091007232666, "global_step": 142855, "epoch": 850} {"train_loss": -10.107097625732422, "global_step": 142856, "epoch": 850} {"train_loss": -10.607555389404297, "global_step": 142857, "epoch": 850} {"train_loss": -10.406936645507812, "global_step": 142858, "epoch": 850} {"train_loss": -10.380196571350098, "global_step": 142859, "epoch": 850} {"train_loss": -10.569035530090332, "global_step": 142860, "epoch": 850} {"train_loss": -10.254045486450195, "global_step": 142861, "epoch": 850} {"train_loss": -10.479347229003906, "global_step": 142862, "epoch": 850} {"train_loss": -9.97479248046875, "global_step": 142863, "epoch": 850} {"train_loss": -10.62613296508789, "global_step": 142864, "epoch": 850} {"train_loss": -10.044832229614258, "global_step": 142865, "epoch": 850} {"train_loss": -10.607458114624023, "global_step": 142866, "epoch": 850} {"train_loss": -10.562321662902832, "global_step": 142867, "epoch": 850} {"train_loss": -10.639410018920898, "global_step": 142868, "epoch": 850} {"train_loss": -10.711949348449707, "global_step": 142869, "epoch": 850} {"train_loss": -10.568944931030273, "global_step": 142870, "epoch": 850} {"train_loss": -10.549866676330566, "global_step": 142871, "epoch": 850} {"train_loss": -10.459399223327637, "global_step": 142872, "epoch": 850} {"train_loss": -10.680771827697754, "global_step": 142873, "epoch": 850} {"train_loss": -10.65217113494873, "global_step": 142874, "epoch": 850} {"train_loss": -10.747945785522461, "global_step": 142875, "epoch": 850} {"train_loss": -10.710230827331543, "global_step": 142876, "epoch": 850} {"train_loss": -10.876103401184082, "global_step": 142877, "epoch": 850} {"train_loss": -10.88037395477295, "global_step": 142878, "epoch": 850} {"train_loss": -10.805486679077148, "global_step": 142879, "epoch": 850} {"train_loss": -10.834813117980957, "global_step": 142880, "epoch": 850} {"train_loss": -10.824577331542969, "global_step": 142881, "epoch": 850} {"train_loss": -10.62724494934082, "global_step": 142882, "epoch": 850} {"train_loss": -10.745255470275879, "global_step": 142883, "epoch": 850} {"train_loss": -10.714277267456055, "global_step": 142884, "epoch": 850} {"train_loss": -10.737081527709961, "global_step": 142885, "epoch": 850} {"train_loss": -10.914281845092773, "global_step": 142886, "epoch": 850} {"train_loss": -10.540576934814453, "global_step": 142887, "epoch": 850} {"train_loss": -10.72204875946045, "global_step": 142888, "epoch": 850} {"train_loss": -10.680597305297852, "global_step": 142889, "epoch": 850} {"train_loss": -10.680322647094727, "global_step": 142890, "epoch": 850} {"train_loss": -10.595942497253418, "global_step": 142891, "epoch": 850} {"train_loss": -10.674388885498047, "global_step": 142892, "epoch": 850} {"train_loss": -10.875921249389648, "global_step": 142893, "epoch": 850} {"train_loss": -10.381941795349121, "global_step": 142894, "epoch": 850} {"train_loss": -10.19551944732666, "global_step": 142895, "epoch": 850} {"train_loss": -10.959197044372559, "global_step": 142896, "epoch": 850} {"train_loss": -10.699539184570312, "global_step": 142897, "epoch": 850} {"train_loss": -10.469404220581055, "global_step": 142898, "epoch": 850} {"train_loss": -10.830521583557129, "global_step": 142899, "epoch": 850} {"train_loss": -10.56596565246582, "global_step": 142900, "epoch": 850} {"train_loss": -10.522756576538086, "global_step": 142901, "epoch": 850} {"train_loss": -10.645273208618164, "global_step": 142902, "epoch": 850} {"train_loss": -10.95064926147461, "global_step": 142903, "epoch": 850} {"train_loss": -10.574182510375977, "global_step": 142904, "epoch": 850} {"train_loss": -10.295302391052246, "global_step": 142905, "epoch": 850} {"train_loss": -10.522733688354492, "global_step": 142906, "epoch": 850} {"train_loss": -10.61878776550293, "global_step": 142907, "epoch": 850} {"train_loss": -10.309271812438965, "global_step": 142908, "epoch": 850} {"train_loss": -10.529932022094727, "global_step": 142909, "epoch": 850} {"train_loss": -10.45932674407959, "global_step": 142910, "epoch": 850} {"train_loss": -10.716205596923828, "global_step": 142911, "epoch": 850} {"train_loss": -10.487699508666992, "global_step": 142912, "epoch": 850} {"train_loss": -10.6700439453125, "global_step": 142913, "epoch": 850} {"train_loss": -10.715999603271484, "global_step": 142914, "epoch": 850} {"train_loss": -10.679054260253906, "global_step": 142915, "epoch": 850} {"train_loss": -10.652788162231445, "global_step": 142916, "epoch": 850} {"train_loss": -10.667829513549805, "global_step": 142917, "epoch": 850} {"train_loss": -10.831555366516113, "global_step": 142918, "epoch": 850} {"train_loss": -10.730451583862305, "global_step": 142919, "epoch": 850} {"train_loss": -10.661657333374023, "global_step": 142920, "epoch": 850} {"train_loss": -10.690306663513184, "global_step": 142921, "epoch": 850} {"train_loss": -10.601175308227539, "global_step": 142922, "epoch": 850} {"train_loss": -10.963348388671875, "global_step": 142923, "epoch": 850} {"train_loss": -10.471236228942871, "global_step": 142924, "epoch": 850} {"train_loss": -10.689874649047852, "global_step": 142925, "epoch": 850} {"train_loss": -10.36569595336914, "global_step": 142926, "epoch": 850} {"train_loss": -10.46512222290039, "global_step": 142927, "epoch": 850} {"train_loss": -10.809516906738281, "global_step": 142928, "epoch": 850} {"train_loss": -10.5462646484375, "global_step": 142929, "epoch": 850} {"train_loss": -10.90837287902832, "global_step": 142930, "epoch": 850} {"train_loss": -10.57432746887207, "global_step": 142931, "epoch": 850} {"train_loss": -10.812100410461426, "global_step": 142932, "epoch": 850} {"train_loss": -10.498956680297852, "global_step": 142933, "epoch": 850} {"train_loss": -10.355688095092773, "global_step": 142934, "epoch": 850} {"train_loss": -10.749680519104004, "global_step": 142935, "epoch": 850} {"train_loss": -10.615747451782227, "global_step": 142936, "epoch": 850} {"train_loss": -10.683390617370605, "global_step": 142937, "epoch": 850} {"train_loss": -10.653377532958984, "global_step": 142938, "epoch": 850} {"train_loss": -10.752824783325195, "global_step": 142939, "epoch": 850} {"train_loss": -10.584511756896973, "global_step": 142940, "epoch": 850} {"train_loss": -10.868532180786133, "global_step": 142941, "epoch": 850} {"train_loss": -10.638789176940918, "global_step": 142942, "epoch": 850} {"train_loss": -10.91661262512207, "global_step": 142943, "epoch": 850} {"train_loss": -10.745147705078125, "global_step": 142944, "epoch": 850} {"train_loss": -10.768758773803711, "global_step": 142945, "epoch": 850} {"train_loss": -10.892465591430664, "global_step": 142946, "epoch": 850} {"train_loss": -10.768609046936035, "global_step": 142947, "epoch": 850} {"train_loss": -10.956941604614258, "global_step": 142948, "epoch": 850} {"train_loss": -10.593170166015625, "global_step": 142949, "epoch": 850} {"train_loss": -10.841283798217773, "global_step": 142950, "epoch": 850} {"train_loss": -10.817808151245117, "global_step": 142951, "epoch": 850} {"train_loss": -10.567282676696777, "global_step": 142952, "epoch": 850} {"train_loss": -10.72296142578125, "global_step": 142953, "epoch": 850} {"train_loss": -10.893930435180664, "global_step": 142954, "epoch": 850} {"train_loss": -10.810121536254883, "global_step": 142955, "epoch": 850} {"train_loss": -10.940810203552246, "global_step": 142956, "epoch": 850} {"train_loss": -10.846677780151367, "global_step": 142957, "epoch": 850} {"train_loss": -10.764457702636719, "global_step": 142958, "epoch": 850} {"train_loss": -10.646167755126953, "global_step": 142959, "epoch": 850} {"train_loss": -10.8148193359375, "global_step": 142960, "epoch": 850} {"train_loss": -10.755731582641602, "global_step": 142961, "epoch": 850} {"train_loss": -11.103511810302734, "global_step": 142962, "epoch": 850} {"train_loss": -10.71219253540039, "global_step": 142963, "epoch": 850} {"train_loss": -10.72142219543457, "global_step": 142964, "epoch": 850} {"train_loss": -10.682723999023438, "global_step": 142965, "epoch": 850} {"train_loss": -11.018928527832031, "global_step": 142966, "epoch": 850} {"train_loss": -10.643500997906639, "global_step": 142967, "epoch": 850, "train/sim_max_reward_0": 0.9516406557542547, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.0004049829700773399, "train/sim_max_reward_3": 0.41714674788381023, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.6719438952512237, "test/sim_max_reward_4400000": 0.24864401524419308, "test/sim_max_reward_4400001": 0.3254553345752006, "test/sim_max_reward_4400002": 0.17085287940723162, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.4076534658364656, "test/sim_max_reward_4400005": 0.9845621929717756, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.5206727764104945, "test/sim_max_reward_4400009": 0.3436009338020839, "test/sim_max_reward_4400010": 0.2529518510119154, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 0.8641318602337901, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.4773323232248494, "test/sim_max_reward_4400015": 0.7188558596730171, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 0.6272577727715827, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.6872959420903212, "test/sim_max_reward_4400022": 0.9800865695091503, "test/sim_max_reward_4400023": 1.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.07157180987699834, "test/sim_max_reward_4400027": 0.9864570209834322, "test/sim_max_reward_4400028": 0.6831288933226898, "test/sim_max_reward_4400029": 0.4523874743780121, "test/sim_max_reward_4400030": 0.9827499743723705, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.13009479837268406, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.4801278451049327, "test/sim_max_reward_4400036": 0.3672625033457593, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.07174900475782633, "test/sim_max_reward_4400042": 1.0, "test/sim_max_reward_4400043": 0.9531632523470094, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.278829760407302, "train/mean_score": 0.6735227136432277, "test/mean_score": 0.5667906686974399, "val_loss": 226916.203125, "train_action_mse_error": 1.255570888519287} {"train_loss": -10.324544906616211, "global_step": 142968, "epoch": 851} {"train_loss": -10.189733505249023, "global_step": 142969, "epoch": 851} {"train_loss": -10.632596015930176, "global_step": 142970, "epoch": 851} {"train_loss": -10.452240943908691, "global_step": 142971, "epoch": 851} {"train_loss": -10.34421157836914, "global_step": 142972, "epoch": 851} {"train_loss": -9.987425804138184, "global_step": 142973, "epoch": 851} {"train_loss": -10.339871406555176, "global_step": 142974, "epoch": 851} {"train_loss": -10.376986503601074, "global_step": 142975, "epoch": 851} {"train_loss": -9.225057601928711, "global_step": 142976, "epoch": 851} {"train_loss": -10.225728988647461, "global_step": 142977, "epoch": 851} {"train_loss": -9.513504981994629, "global_step": 142978, "epoch": 851} {"train_loss": -9.515942573547363, "global_step": 142979, "epoch": 851} {"train_loss": -9.948087692260742, "global_step": 142980, "epoch": 851} {"train_loss": -9.433698654174805, "global_step": 142981, "epoch": 851} {"train_loss": -10.391610145568848, "global_step": 142982, "epoch": 851} {"train_loss": -9.397504806518555, "global_step": 142983, "epoch": 851} {"train_loss": -10.44554328918457, "global_step": 142984, "epoch": 851} {"train_loss": -9.778284072875977, "global_step": 142985, "epoch": 851} {"train_loss": -10.360116958618164, "global_step": 142986, "epoch": 851} {"train_loss": -9.914400100708008, "global_step": 142987, "epoch": 851} {"train_loss": -9.901097297668457, "global_step": 142988, "epoch": 851} {"train_loss": -10.3445405960083, "global_step": 142989, "epoch": 851} {"train_loss": -9.931792259216309, "global_step": 142990, "epoch": 851} {"train_loss": -10.182236671447754, "global_step": 142991, "epoch": 851} {"train_loss": -10.020774841308594, "global_step": 142992, "epoch": 851} {"train_loss": -10.218863487243652, "global_step": 142993, "epoch": 851} {"train_loss": -10.456504821777344, "global_step": 142994, "epoch": 851} {"train_loss": -10.125783920288086, "global_step": 142995, "epoch": 851} {"train_loss": -10.077635765075684, "global_step": 142996, "epoch": 851} {"train_loss": -10.24927043914795, "global_step": 142997, "epoch": 851} {"train_loss": -10.276178359985352, "global_step": 142998, "epoch": 851} {"train_loss": -10.279277801513672, "global_step": 142999, "epoch": 851} {"train_loss": -10.364683151245117, "global_step": 143000, "epoch": 851} {"train_loss": -10.500667572021484, "global_step": 143001, "epoch": 851} {"train_loss": -9.892630577087402, "global_step": 143002, "epoch": 851} {"train_loss": -10.371699333190918, "global_step": 143003, "epoch": 851} {"train_loss": -10.261629104614258, "global_step": 143004, "epoch": 851} {"train_loss": -10.630736351013184, "global_step": 143005, "epoch": 851} {"train_loss": -10.388100624084473, "global_step": 143006, "epoch": 851} {"train_loss": -10.367924690246582, "global_step": 143007, "epoch": 851} {"train_loss": -10.719198226928711, "global_step": 143008, "epoch": 851} {"train_loss": -10.4152193069458, "global_step": 143009, "epoch": 851} {"train_loss": -10.540761947631836, "global_step": 143010, "epoch": 851} {"train_loss": -10.228592872619629, "global_step": 143011, "epoch": 851} {"train_loss": -10.6878662109375, "global_step": 143012, "epoch": 851} {"train_loss": -10.565038681030273, "global_step": 143013, "epoch": 851} {"train_loss": -10.71839714050293, "global_step": 143014, "epoch": 851} {"train_loss": -10.686145782470703, "global_step": 143015, "epoch": 851} {"train_loss": -10.644634246826172, "global_step": 143016, "epoch": 851} {"train_loss": -10.787267684936523, "global_step": 143017, "epoch": 851} {"train_loss": -10.716121673583984, "global_step": 143018, "epoch": 851} {"train_loss": -10.888669967651367, "global_step": 143019, "epoch": 851} {"train_loss": -10.751852035522461, "global_step": 143020, "epoch": 851} {"train_loss": -10.895090103149414, "global_step": 143021, "epoch": 851} {"train_loss": -10.876436233520508, "global_step": 143022, "epoch": 851} {"train_loss": -10.967554092407227, "global_step": 143023, "epoch": 851} {"train_loss": -10.770641326904297, "global_step": 143024, "epoch": 851} {"train_loss": -10.627260208129883, "global_step": 143025, "epoch": 851} {"train_loss": -11.08842658996582, "global_step": 143026, "epoch": 851} {"train_loss": -11.009689331054688, "global_step": 143027, "epoch": 851} {"train_loss": -10.694342613220215, "global_step": 143028, "epoch": 851} {"train_loss": -11.11054801940918, "global_step": 143029, "epoch": 851} {"train_loss": -11.056739807128906, "global_step": 143030, "epoch": 851} {"train_loss": -10.87293529510498, "global_step": 143031, "epoch": 851} {"train_loss": -10.968046188354492, "global_step": 143032, "epoch": 851} {"train_loss": -11.0911226272583, "global_step": 143033, "epoch": 851} {"train_loss": -10.618953704833984, "global_step": 143034, "epoch": 851} {"train_loss": -10.862399101257324, "global_step": 143035, "epoch": 851} {"train_loss": -10.949178695678711, "global_step": 143036, "epoch": 851} {"train_loss": -10.60964584350586, "global_step": 143037, "epoch": 851} {"train_loss": -11.072004318237305, "global_step": 143038, "epoch": 851} {"train_loss": -10.902339935302734, "global_step": 143039, "epoch": 851} {"train_loss": -10.801071166992188, "global_step": 143040, "epoch": 851} {"train_loss": -10.973404884338379, "global_step": 143041, "epoch": 851} {"train_loss": -10.682863235473633, "global_step": 143042, "epoch": 851} {"train_loss": -10.671174049377441, "global_step": 143043, "epoch": 851} {"train_loss": -10.785808563232422, "global_step": 143044, "epoch": 851} {"train_loss": -10.656917572021484, "global_step": 143045, "epoch": 851} {"train_loss": -10.836505889892578, "global_step": 143046, "epoch": 851} {"train_loss": -10.866690635681152, "global_step": 143047, "epoch": 851} {"train_loss": -10.768662452697754, "global_step": 143048, "epoch": 851} {"train_loss": -10.620994567871094, "global_step": 143049, "epoch": 851} {"train_loss": -10.74020004272461, "global_step": 143050, "epoch": 851} {"train_loss": -11.042314529418945, "global_step": 143051, "epoch": 851} {"train_loss": -10.677539825439453, "global_step": 143052, "epoch": 851} {"train_loss": -10.940255165100098, "global_step": 143053, "epoch": 851} {"train_loss": -10.861581802368164, "global_step": 143054, "epoch": 851} {"train_loss": -10.875405311584473, "global_step": 143055, "epoch": 851} {"train_loss": -10.478918075561523, "global_step": 143056, "epoch": 851} {"train_loss": -10.617965698242188, "global_step": 143057, "epoch": 851} {"train_loss": -10.217636108398438, "global_step": 143058, "epoch": 851} {"train_loss": -9.43865966796875, "global_step": 143059, "epoch": 851} {"train_loss": -9.366756439208984, "global_step": 143060, "epoch": 851} {"train_loss": -10.27029037475586, "global_step": 143061, "epoch": 851} {"train_loss": -10.066689491271973, "global_step": 143062, "epoch": 851} {"train_loss": -9.256572723388672, "global_step": 143063, "epoch": 851} {"train_loss": -10.294404983520508, "global_step": 143064, "epoch": 851} {"train_loss": -10.218315124511719, "global_step": 143065, "epoch": 851} {"train_loss": -9.891950607299805, "global_step": 143066, "epoch": 851} {"train_loss": -9.960453033447266, "global_step": 143067, "epoch": 851} {"train_loss": -10.004179000854492, "global_step": 143068, "epoch": 851} {"train_loss": -9.76754379272461, "global_step": 143069, "epoch": 851} {"train_loss": -9.921948432922363, "global_step": 143070, "epoch": 851} {"train_loss": -9.289815902709961, "global_step": 143071, "epoch": 851} {"train_loss": -10.290057182312012, "global_step": 143072, "epoch": 851} {"train_loss": -9.27345085144043, "global_step": 143073, "epoch": 851} {"train_loss": -9.812074661254883, "global_step": 143074, "epoch": 851} {"train_loss": -9.564472198486328, "global_step": 143075, "epoch": 851} {"train_loss": -10.242841720581055, "global_step": 143076, "epoch": 851} {"train_loss": -9.795354843139648, "global_step": 143077, "epoch": 851} {"train_loss": -10.233054161071777, "global_step": 143078, "epoch": 851} {"train_loss": -10.249136924743652, "global_step": 143079, "epoch": 851} {"train_loss": -10.577136993408203, "global_step": 143080, "epoch": 851} {"train_loss": -9.925726890563965, "global_step": 143081, "epoch": 851} {"train_loss": -10.52454662322998, "global_step": 143082, "epoch": 851} {"train_loss": -10.230326652526855, "global_step": 143083, "epoch": 851} {"train_loss": -10.316435813903809, "global_step": 143084, "epoch": 851} {"train_loss": -10.495658874511719, "global_step": 143085, "epoch": 851} {"train_loss": -10.339696884155273, "global_step": 143086, "epoch": 851} {"train_loss": -10.431233406066895, "global_step": 143087, "epoch": 851} {"train_loss": -10.229151725769043, "global_step": 143088, "epoch": 851} {"train_loss": -10.532882690429688, "global_step": 143089, "epoch": 851} {"train_loss": -10.331153869628906, "global_step": 143090, "epoch": 851} {"train_loss": -10.22520637512207, "global_step": 143091, "epoch": 851} {"train_loss": -10.527099609375, "global_step": 143092, "epoch": 851} {"train_loss": -10.560256958007812, "global_step": 143093, "epoch": 851} {"train_loss": -10.359243392944336, "global_step": 143094, "epoch": 851} {"train_loss": -10.423336029052734, "global_step": 143095, "epoch": 851} {"train_loss": -10.430803298950195, "global_step": 143096, "epoch": 851} {"train_loss": -10.698044776916504, "global_step": 143097, "epoch": 851} {"train_loss": -10.368742942810059, "global_step": 143098, "epoch": 851} {"train_loss": -10.508867263793945, "global_step": 143099, "epoch": 851} {"train_loss": -10.375349998474121, "global_step": 143100, "epoch": 851} {"train_loss": -10.737383842468262, "global_step": 143101, "epoch": 851} {"train_loss": -10.695379257202148, "global_step": 143102, "epoch": 851} {"train_loss": -10.540254592895508, "global_step": 143103, "epoch": 851} {"train_loss": -10.534343719482422, "global_step": 143104, "epoch": 851} {"train_loss": -10.504819869995117, "global_step": 143105, "epoch": 851} {"train_loss": -10.72939682006836, "global_step": 143106, "epoch": 851} {"train_loss": -10.746482849121094, "global_step": 143107, "epoch": 851} {"train_loss": -10.650900840759277, "global_step": 143108, "epoch": 851} {"train_loss": -10.359956741333008, "global_step": 143109, "epoch": 851} {"train_loss": -10.79600715637207, "global_step": 143110, "epoch": 851} {"train_loss": -10.9005126953125, "global_step": 143111, "epoch": 851} {"train_loss": -10.77682876586914, "global_step": 143112, "epoch": 851} {"train_loss": -10.942455291748047, "global_step": 143113, "epoch": 851} {"train_loss": -10.956207275390625, "global_step": 143114, "epoch": 851} {"train_loss": -10.801126480102539, "global_step": 143115, "epoch": 851} {"train_loss": -10.716044425964355, "global_step": 143116, "epoch": 851} {"train_loss": -10.693782806396484, "global_step": 143117, "epoch": 851} {"train_loss": -10.790325164794922, "global_step": 143118, "epoch": 851} {"train_loss": -10.918478012084961, "global_step": 143119, "epoch": 851} {"train_loss": -10.644991874694824, "global_step": 143120, "epoch": 851} {"train_loss": -10.832979202270508, "global_step": 143121, "epoch": 851} {"train_loss": -10.838905334472656, "global_step": 143122, "epoch": 851} {"train_loss": -10.802560806274414, "global_step": 143123, "epoch": 851} {"train_loss": -10.917150497436523, "global_step": 143124, "epoch": 851} {"train_loss": -10.762808799743652, "global_step": 143125, "epoch": 851} {"train_loss": -10.841535568237305, "global_step": 143126, "epoch": 851} {"train_loss": -10.632732391357422, "global_step": 143127, "epoch": 851} {"train_loss": -10.60561752319336, "global_step": 143128, "epoch": 851} {"train_loss": -10.468038558959961, "global_step": 143129, "epoch": 851} {"train_loss": -10.574630737304688, "global_step": 143130, "epoch": 851} {"train_loss": -10.853713989257812, "global_step": 143131, "epoch": 851} {"train_loss": -10.524761199951172, "global_step": 143132, "epoch": 851} {"train_loss": -10.51942253112793, "global_step": 143133, "epoch": 851} {"train_loss": -10.588590621948242, "global_step": 143134, "epoch": 851} {"train_loss": -10.450563782737369, "global_step": 143135, "epoch": 851, "val_loss": 225868.125} {"train_loss": -10.8636474609375, "global_step": 143136, "epoch": 852} {"train_loss": -10.751620292663574, "global_step": 143137, "epoch": 852} {"train_loss": -10.73901653289795, "global_step": 143138, "epoch": 852} {"train_loss": -10.66778564453125, "global_step": 143139, "epoch": 852} {"train_loss": -10.625690460205078, "global_step": 143140, "epoch": 852} {"train_loss": -10.807901382446289, "global_step": 143141, "epoch": 852} {"train_loss": -10.44991683959961, "global_step": 143142, "epoch": 852} {"train_loss": -10.548667907714844, "global_step": 143143, "epoch": 852} {"train_loss": -10.448102951049805, "global_step": 143144, "epoch": 852} {"train_loss": -10.396042823791504, "global_step": 143145, "epoch": 852} {"train_loss": -9.84470272064209, "global_step": 143146, "epoch": 852} {"train_loss": -10.227359771728516, "global_step": 143147, "epoch": 852} {"train_loss": -10.139422416687012, "global_step": 143148, "epoch": 852} {"train_loss": -9.989511489868164, "global_step": 143149, "epoch": 852} {"train_loss": -9.497404098510742, "global_step": 143150, "epoch": 852} {"train_loss": -10.252195358276367, "global_step": 143151, "epoch": 852} {"train_loss": -9.495609283447266, "global_step": 143152, "epoch": 852} {"train_loss": -10.0050687789917, "global_step": 143153, "epoch": 852} {"train_loss": -10.017274856567383, "global_step": 143154, "epoch": 852} {"train_loss": -9.615717887878418, "global_step": 143155, "epoch": 852} {"train_loss": -9.890777587890625, "global_step": 143156, "epoch": 852} {"train_loss": -9.808913230895996, "global_step": 143157, "epoch": 852} {"train_loss": -9.200162887573242, "global_step": 143158, "epoch": 852} {"train_loss": -9.801633834838867, "global_step": 143159, "epoch": 852} {"train_loss": -8.865692138671875, "global_step": 143160, "epoch": 852} {"train_loss": -9.778829574584961, "global_step": 143161, "epoch": 852} {"train_loss": -9.642631530761719, "global_step": 143162, "epoch": 852} {"train_loss": -9.609621047973633, "global_step": 143163, "epoch": 852} {"train_loss": -9.386306762695312, "global_step": 143164, "epoch": 852} {"train_loss": -9.914278030395508, "global_step": 143165, "epoch": 852} {"train_loss": -9.862161636352539, "global_step": 143166, "epoch": 852} {"train_loss": -9.192342758178711, "global_step": 143167, "epoch": 852} {"train_loss": -10.149365425109863, "global_step": 143168, "epoch": 852} {"train_loss": -9.198637008666992, "global_step": 143169, "epoch": 852} {"train_loss": -9.924018859863281, "global_step": 143170, "epoch": 852} {"train_loss": -9.974519729614258, "global_step": 143171, "epoch": 852} {"train_loss": -9.768507957458496, "global_step": 143172, "epoch": 852} {"train_loss": -9.512763023376465, "global_step": 143173, "epoch": 852} {"train_loss": -9.543939590454102, "global_step": 143174, "epoch": 852} {"train_loss": -10.350421905517578, "global_step": 143175, "epoch": 852} {"train_loss": -9.66240119934082, "global_step": 143176, "epoch": 852} {"train_loss": -10.028615951538086, "global_step": 143177, "epoch": 852} {"train_loss": -10.061885833740234, "global_step": 143178, "epoch": 852} {"train_loss": -9.755558013916016, "global_step": 143179, "epoch": 852} {"train_loss": -9.95828628540039, "global_step": 143180, "epoch": 852} {"train_loss": -9.955291748046875, "global_step": 143181, "epoch": 852} {"train_loss": -9.680191040039062, "global_step": 143182, "epoch": 852} {"train_loss": -10.153444290161133, "global_step": 143183, "epoch": 852} {"train_loss": -9.934247970581055, "global_step": 143184, "epoch": 852} {"train_loss": -10.054316520690918, "global_step": 143185, "epoch": 852} {"train_loss": -10.372447967529297, "global_step": 143186, "epoch": 852} {"train_loss": -9.943853378295898, "global_step": 143187, "epoch": 852} {"train_loss": -10.37984848022461, "global_step": 143188, "epoch": 852} {"train_loss": -10.221887588500977, "global_step": 143189, "epoch": 852} {"train_loss": -10.02017593383789, "global_step": 143190, "epoch": 852} {"train_loss": -10.420450210571289, "global_step": 143191, "epoch": 852} {"train_loss": -10.188268661499023, "global_step": 143192, "epoch": 852} {"train_loss": -10.125728607177734, "global_step": 143193, "epoch": 852} {"train_loss": -10.229531288146973, "global_step": 143194, "epoch": 852} {"train_loss": -10.426224708557129, "global_step": 143195, "epoch": 852} {"train_loss": -10.41693115234375, "global_step": 143196, "epoch": 852} {"train_loss": -10.096617698669434, "global_step": 143197, "epoch": 852} {"train_loss": -10.394432067871094, "global_step": 143198, "epoch": 852} {"train_loss": -10.539652824401855, "global_step": 143199, "epoch": 852} {"train_loss": -10.402091026306152, "global_step": 143200, "epoch": 852} {"train_loss": -10.412740707397461, "global_step": 143201, "epoch": 852} {"train_loss": -10.430389404296875, "global_step": 143202, "epoch": 852} {"train_loss": -10.464534759521484, "global_step": 143203, "epoch": 852} {"train_loss": -10.593295097351074, "global_step": 143204, "epoch": 852} {"train_loss": -10.335611343383789, "global_step": 143205, "epoch": 852} {"train_loss": -10.345243453979492, "global_step": 143206, "epoch": 852} {"train_loss": -10.556249618530273, "global_step": 143207, "epoch": 852} {"train_loss": -10.826062202453613, "global_step": 143208, "epoch": 852} {"train_loss": -10.786994934082031, "global_step": 143209, "epoch": 852} {"train_loss": -10.695025444030762, "global_step": 143210, "epoch": 852} {"train_loss": -10.606271743774414, "global_step": 143211, "epoch": 852} {"train_loss": -10.643438339233398, "global_step": 143212, "epoch": 852} {"train_loss": -10.697680473327637, "global_step": 143213, "epoch": 852} {"train_loss": -10.787384033203125, "global_step": 143214, "epoch": 852} {"train_loss": -10.757801055908203, "global_step": 143215, "epoch": 852} {"train_loss": -10.77010440826416, "global_step": 143216, "epoch": 852} {"train_loss": -10.861379623413086, "global_step": 143217, "epoch": 852} {"train_loss": -10.597766876220703, "global_step": 143218, "epoch": 852} {"train_loss": -10.769161224365234, "global_step": 143219, "epoch": 852} {"train_loss": -10.823179244995117, "global_step": 143220, "epoch": 852} {"train_loss": -11.11712646484375, "global_step": 143221, "epoch": 852} {"train_loss": -10.480539321899414, "global_step": 143222, "epoch": 852} {"train_loss": -10.88786506652832, "global_step": 143223, "epoch": 852} {"train_loss": -10.79011344909668, "global_step": 143224, "epoch": 852} {"train_loss": -10.669766426086426, "global_step": 143225, "epoch": 852} {"train_loss": -11.00381088256836, "global_step": 143226, "epoch": 852} {"train_loss": -11.00001335144043, "global_step": 143227, "epoch": 852} {"train_loss": -10.504402160644531, "global_step": 143228, "epoch": 852} {"train_loss": -10.997775077819824, "global_step": 143229, "epoch": 852} {"train_loss": -10.886184692382812, "global_step": 143230, "epoch": 852} {"train_loss": -11.061999320983887, "global_step": 143231, "epoch": 852} {"train_loss": -10.751177787780762, "global_step": 143232, "epoch": 852} {"train_loss": -11.024349212646484, "global_step": 143233, "epoch": 852} {"train_loss": -10.97085189819336, "global_step": 143234, "epoch": 852} {"train_loss": -10.77048110961914, "global_step": 143235, "epoch": 852} {"train_loss": -10.835853576660156, "global_step": 143236, "epoch": 852} {"train_loss": -10.925399780273438, "global_step": 143237, "epoch": 852} {"train_loss": -11.140846252441406, "global_step": 143238, "epoch": 852} {"train_loss": -10.669506072998047, "global_step": 143239, "epoch": 852} {"train_loss": -11.033596992492676, "global_step": 143240, "epoch": 852} {"train_loss": -10.414892196655273, "global_step": 143241, "epoch": 852} {"train_loss": -10.095134735107422, "global_step": 143242, "epoch": 852} {"train_loss": -10.340106964111328, "global_step": 143243, "epoch": 852} {"train_loss": -10.95438003540039, "global_step": 143244, "epoch": 852} {"train_loss": -10.81247329711914, "global_step": 143245, "epoch": 852} {"train_loss": -10.988073348999023, "global_step": 143246, "epoch": 852} {"train_loss": -10.59121322631836, "global_step": 143247, "epoch": 852} {"train_loss": -10.857126235961914, "global_step": 143248, "epoch": 852} {"train_loss": -10.476103782653809, "global_step": 143249, "epoch": 852} {"train_loss": -10.410211563110352, "global_step": 143250, "epoch": 852} {"train_loss": -9.837287902832031, "global_step": 143251, "epoch": 852} {"train_loss": -10.59366226196289, "global_step": 143252, "epoch": 852} {"train_loss": -10.394599914550781, "global_step": 143253, "epoch": 852} {"train_loss": -10.611455917358398, "global_step": 143254, "epoch": 852} {"train_loss": -10.625199317932129, "global_step": 143255, "epoch": 852} {"train_loss": -10.972509384155273, "global_step": 143256, "epoch": 852} {"train_loss": -10.565361022949219, "global_step": 143257, "epoch": 852} {"train_loss": -10.624163627624512, "global_step": 143258, "epoch": 852} {"train_loss": -10.266668319702148, "global_step": 143259, "epoch": 852} {"train_loss": -10.602240562438965, "global_step": 143260, "epoch": 852} {"train_loss": -10.43514633178711, "global_step": 143261, "epoch": 852} {"train_loss": -10.440570831298828, "global_step": 143262, "epoch": 852} {"train_loss": -9.866982460021973, "global_step": 143263, "epoch": 852} {"train_loss": -10.633893966674805, "global_step": 143264, "epoch": 852} {"train_loss": -9.984334945678711, "global_step": 143265, "epoch": 852} {"train_loss": -10.1362886428833, "global_step": 143266, "epoch": 852} {"train_loss": -10.195751190185547, "global_step": 143267, "epoch": 852} {"train_loss": -10.519035339355469, "global_step": 143268, "epoch": 852} {"train_loss": -10.722240447998047, "global_step": 143269, "epoch": 852} {"train_loss": -10.419413566589355, "global_step": 143270, "epoch": 852} {"train_loss": -10.49478816986084, "global_step": 143271, "epoch": 852} {"train_loss": -10.168575286865234, "global_step": 143272, "epoch": 852} {"train_loss": -10.54133415222168, "global_step": 143273, "epoch": 852} {"train_loss": -10.65285873413086, "global_step": 143274, "epoch": 852} {"train_loss": -10.236705780029297, "global_step": 143275, "epoch": 852} {"train_loss": -10.482868194580078, "global_step": 143276, "epoch": 852} {"train_loss": -10.420913696289062, "global_step": 143277, "epoch": 852} {"train_loss": -10.806636810302734, "global_step": 143278, "epoch": 852} {"train_loss": -10.764415740966797, "global_step": 143279, "epoch": 852} {"train_loss": -10.51327896118164, "global_step": 143280, "epoch": 852} {"train_loss": -10.721803665161133, "global_step": 143281, "epoch": 852} {"train_loss": -10.350561141967773, "global_step": 143282, "epoch": 852} {"train_loss": -10.70863151550293, "global_step": 143283, "epoch": 852} {"train_loss": -10.376714706420898, "global_step": 143284, "epoch": 852} {"train_loss": -10.680378913879395, "global_step": 143285, "epoch": 852} {"train_loss": -10.573517799377441, "global_step": 143286, "epoch": 852} {"train_loss": -10.638277053833008, "global_step": 143287, "epoch": 852} {"train_loss": -10.650253295898438, "global_step": 143288, "epoch": 852} {"train_loss": -10.64932918548584, "global_step": 143289, "epoch": 852} {"train_loss": -10.712640762329102, "global_step": 143290, "epoch": 852} {"train_loss": -10.63010311126709, "global_step": 143291, "epoch": 852} {"train_loss": -10.790400505065918, "global_step": 143292, "epoch": 852} {"train_loss": -10.625160217285156, "global_step": 143293, "epoch": 852} {"train_loss": -10.509489059448242, "global_step": 143294, "epoch": 852} {"train_loss": -10.714696884155273, "global_step": 143295, "epoch": 852} {"train_loss": -10.843111038208008, "global_step": 143296, "epoch": 852} {"train_loss": -10.704227447509766, "global_step": 143297, "epoch": 852} {"train_loss": -10.735342025756836, "global_step": 143298, "epoch": 852} {"train_loss": -10.945974349975586, "global_step": 143299, "epoch": 852} {"train_loss": -10.636640548706055, "global_step": 143300, "epoch": 852} {"train_loss": -10.924491882324219, "global_step": 143301, "epoch": 852} {"train_loss": -10.599414825439453, "global_step": 143302, "epoch": 852} {"train_loss": -10.402222593625387, "global_step": 143303, "epoch": 852, "val_loss": 226860.921875} {"train_loss": -10.646862030029297, "global_step": 143304, "epoch": 853} {"train_loss": -10.783743858337402, "global_step": 143305, "epoch": 853} {"train_loss": -10.776917457580566, "global_step": 143306, "epoch": 853} {"train_loss": -10.760698318481445, "global_step": 143307, "epoch": 853} {"train_loss": -10.813665390014648, "global_step": 143308, "epoch": 853} {"train_loss": -10.680800437927246, "global_step": 143309, "epoch": 853} {"train_loss": -11.079183578491211, "global_step": 143310, "epoch": 853} {"train_loss": -10.691780090332031, "global_step": 143311, "epoch": 853} {"train_loss": -10.997535705566406, "global_step": 143312, "epoch": 853} {"train_loss": -10.84261703491211, "global_step": 143313, "epoch": 853} {"train_loss": -10.936258316040039, "global_step": 143314, "epoch": 853} {"train_loss": -10.92849349975586, "global_step": 143315, "epoch": 853} {"train_loss": -10.967439651489258, "global_step": 143316, "epoch": 853} {"train_loss": -10.660470962524414, "global_step": 143317, "epoch": 853} {"train_loss": -10.598363876342773, "global_step": 143318, "epoch": 853} {"train_loss": -10.583879470825195, "global_step": 143319, "epoch": 853} {"train_loss": -10.336448669433594, "global_step": 143320, "epoch": 853} {"train_loss": -10.557099342346191, "global_step": 143321, "epoch": 853} {"train_loss": -10.862133026123047, "global_step": 143322, "epoch": 853} {"train_loss": -10.804166793823242, "global_step": 143323, "epoch": 853} {"train_loss": -10.407898902893066, "global_step": 143324, "epoch": 853} {"train_loss": -10.235601425170898, "global_step": 143325, "epoch": 853} {"train_loss": -10.529751777648926, "global_step": 143326, "epoch": 853} {"train_loss": -10.214421272277832, "global_step": 143327, "epoch": 853} {"train_loss": -9.85290813446045, "global_step": 143328, "epoch": 853} {"train_loss": -10.629931449890137, "global_step": 143329, "epoch": 853} {"train_loss": -9.575475692749023, "global_step": 143330, "epoch": 853} {"train_loss": -9.708687782287598, "global_step": 143331, "epoch": 853} {"train_loss": -10.371066093444824, "global_step": 143332, "epoch": 853} {"train_loss": -8.963804244995117, "global_step": 143333, "epoch": 853} {"train_loss": -9.699853897094727, "global_step": 143334, "epoch": 853} {"train_loss": -8.981481552124023, "global_step": 143335, "epoch": 853} {"train_loss": -9.091904640197754, "global_step": 143336, "epoch": 853} {"train_loss": -8.9849271774292, "global_step": 143337, "epoch": 853} {"train_loss": -9.959957122802734, "global_step": 143338, "epoch": 853} {"train_loss": -9.545358657836914, "global_step": 143339, "epoch": 853} {"train_loss": -9.901241302490234, "global_step": 143340, "epoch": 853} {"train_loss": -9.486003875732422, "global_step": 143341, "epoch": 853} {"train_loss": -10.074596405029297, "global_step": 143342, "epoch": 853} {"train_loss": -9.706717491149902, "global_step": 143343, "epoch": 853} {"train_loss": -10.429874420166016, "global_step": 143344, "epoch": 853} {"train_loss": -10.025674819946289, "global_step": 143345, "epoch": 853} {"train_loss": -10.009893417358398, "global_step": 143346, "epoch": 853} {"train_loss": -9.873451232910156, "global_step": 143347, "epoch": 853} {"train_loss": -10.095735549926758, "global_step": 143348, "epoch": 853} {"train_loss": -10.057565689086914, "global_step": 143349, "epoch": 853} {"train_loss": -10.240577697753906, "global_step": 143350, "epoch": 853} {"train_loss": -10.318742752075195, "global_step": 143351, "epoch": 853} {"train_loss": -10.035867691040039, "global_step": 143352, "epoch": 853} {"train_loss": -10.43791389465332, "global_step": 143353, "epoch": 853} {"train_loss": -10.218299865722656, "global_step": 143354, "epoch": 853} {"train_loss": -10.461923599243164, "global_step": 143355, "epoch": 853} {"train_loss": -10.319950103759766, "global_step": 143356, "epoch": 853} {"train_loss": -10.272902488708496, "global_step": 143357, "epoch": 853} {"train_loss": -10.576937675476074, "global_step": 143358, "epoch": 853} {"train_loss": -10.349994659423828, "global_step": 143359, "epoch": 853} {"train_loss": -10.170677185058594, "global_step": 143360, "epoch": 853} {"train_loss": -10.473382949829102, "global_step": 143361, "epoch": 853} {"train_loss": -10.269705772399902, "global_step": 143362, "epoch": 853} {"train_loss": -10.332642555236816, "global_step": 143363, "epoch": 853} {"train_loss": -10.348625183105469, "global_step": 143364, "epoch": 853} {"train_loss": -10.419551849365234, "global_step": 143365, "epoch": 853} {"train_loss": -10.282912254333496, "global_step": 143366, "epoch": 853} {"train_loss": -10.49841594696045, "global_step": 143367, "epoch": 853} {"train_loss": -10.373214721679688, "global_step": 143368, "epoch": 853} {"train_loss": -10.606585502624512, "global_step": 143369, "epoch": 853} {"train_loss": -10.450825691223145, "global_step": 143370, "epoch": 853} {"train_loss": -10.577932357788086, "global_step": 143371, "epoch": 853} {"train_loss": -10.47293758392334, "global_step": 143372, "epoch": 853} {"train_loss": -10.609819412231445, "global_step": 143373, "epoch": 853} {"train_loss": -10.68820571899414, "global_step": 143374, "epoch": 853} {"train_loss": -10.807900428771973, "global_step": 143375, "epoch": 853} {"train_loss": -10.813392639160156, "global_step": 143376, "epoch": 853} {"train_loss": -10.737668991088867, "global_step": 143377, "epoch": 853} {"train_loss": -10.898428916931152, "global_step": 143378, "epoch": 853} {"train_loss": -10.76758098602295, "global_step": 143379, "epoch": 853} {"train_loss": -10.909278869628906, "global_step": 143380, "epoch": 853} {"train_loss": -10.616558074951172, "global_step": 143381, "epoch": 853} {"train_loss": -10.935863494873047, "global_step": 143382, "epoch": 853} {"train_loss": -10.976296424865723, "global_step": 143383, "epoch": 853} {"train_loss": -10.956430435180664, "global_step": 143384, "epoch": 853} {"train_loss": -10.80827808380127, "global_step": 143385, "epoch": 853} {"train_loss": -10.855953216552734, "global_step": 143386, "epoch": 853} {"train_loss": -10.857155799865723, "global_step": 143387, "epoch": 853} {"train_loss": -10.929401397705078, "global_step": 143388, "epoch": 853} {"train_loss": -10.971539497375488, "global_step": 143389, "epoch": 853} {"train_loss": -10.692873001098633, "global_step": 143390, "epoch": 853} {"train_loss": -10.774431228637695, "global_step": 143391, "epoch": 853} {"train_loss": -10.977104187011719, "global_step": 143392, "epoch": 853} {"train_loss": -10.99079704284668, "global_step": 143393, "epoch": 853} {"train_loss": -10.738096237182617, "global_step": 143394, "epoch": 853} {"train_loss": -10.980587005615234, "global_step": 143395, "epoch": 853} {"train_loss": -10.704877853393555, "global_step": 143396, "epoch": 853} {"train_loss": -10.524256706237793, "global_step": 143397, "epoch": 853} {"train_loss": -10.978971481323242, "global_step": 143398, "epoch": 853} {"train_loss": -10.77351188659668, "global_step": 143399, "epoch": 853} {"train_loss": -10.514968872070312, "global_step": 143400, "epoch": 853} {"train_loss": -10.844707489013672, "global_step": 143401, "epoch": 853} {"train_loss": -10.581239700317383, "global_step": 143402, "epoch": 853} {"train_loss": -10.624086380004883, "global_step": 143403, "epoch": 853} {"train_loss": -10.385231018066406, "global_step": 143404, "epoch": 853} {"train_loss": -10.594715118408203, "global_step": 143405, "epoch": 853} {"train_loss": -10.686253547668457, "global_step": 143406, "epoch": 853} {"train_loss": -10.7884521484375, "global_step": 143407, "epoch": 853} {"train_loss": -10.418883323669434, "global_step": 143408, "epoch": 853} {"train_loss": -10.635902404785156, "global_step": 143409, "epoch": 853} {"train_loss": -10.312511444091797, "global_step": 143410, "epoch": 853} {"train_loss": -10.448087692260742, "global_step": 143411, "epoch": 853} {"train_loss": -10.20315933227539, "global_step": 143412, "epoch": 853} {"train_loss": -10.665566444396973, "global_step": 143413, "epoch": 853} {"train_loss": -9.654273986816406, "global_step": 143414, "epoch": 853} {"train_loss": -10.666069030761719, "global_step": 143415, "epoch": 853} {"train_loss": -10.049854278564453, "global_step": 143416, "epoch": 853} {"train_loss": -9.788894653320312, "global_step": 143417, "epoch": 853} {"train_loss": -9.99720573425293, "global_step": 143418, "epoch": 853} {"train_loss": -10.036362648010254, "global_step": 143419, "epoch": 853} {"train_loss": -10.154940605163574, "global_step": 143420, "epoch": 853} {"train_loss": -10.061874389648438, "global_step": 143421, "epoch": 853} {"train_loss": -10.371797561645508, "global_step": 143422, "epoch": 853} {"train_loss": -10.189289093017578, "global_step": 143423, "epoch": 853} {"train_loss": -10.566054344177246, "global_step": 143424, "epoch": 853} {"train_loss": -10.494750022888184, "global_step": 143425, "epoch": 853} {"train_loss": -10.378068923950195, "global_step": 143426, "epoch": 853} {"train_loss": -10.397703170776367, "global_step": 143427, "epoch": 853} {"train_loss": -10.451431274414062, "global_step": 143428, "epoch": 853} {"train_loss": -10.506715774536133, "global_step": 143429, "epoch": 853} {"train_loss": -10.610845565795898, "global_step": 143430, "epoch": 853} {"train_loss": -10.526839256286621, "global_step": 143431, "epoch": 853} {"train_loss": -10.484079360961914, "global_step": 143432, "epoch": 853} {"train_loss": -10.612812042236328, "global_step": 143433, "epoch": 853} {"train_loss": -10.829862594604492, "global_step": 143434, "epoch": 853} {"train_loss": -10.44265365600586, "global_step": 143435, "epoch": 853} {"train_loss": -10.338988304138184, "global_step": 143436, "epoch": 853} {"train_loss": -10.69028377532959, "global_step": 143437, "epoch": 853} {"train_loss": -10.135150909423828, "global_step": 143438, "epoch": 853} {"train_loss": -10.638703346252441, "global_step": 143439, "epoch": 853} {"train_loss": -10.564979553222656, "global_step": 143440, "epoch": 853} {"train_loss": -10.530197143554688, "global_step": 143441, "epoch": 853} {"train_loss": -10.607284545898438, "global_step": 143442, "epoch": 853} {"train_loss": -10.603532791137695, "global_step": 143443, "epoch": 853} {"train_loss": -10.690147399902344, "global_step": 143444, "epoch": 853} {"train_loss": -10.614290237426758, "global_step": 143445, "epoch": 853} {"train_loss": -10.51048469543457, "global_step": 143446, "epoch": 853} {"train_loss": -10.729290008544922, "global_step": 143447, "epoch": 853} {"train_loss": -10.663368225097656, "global_step": 143448, "epoch": 853} {"train_loss": -10.85245132446289, "global_step": 143449, "epoch": 853} {"train_loss": -10.88395881652832, "global_step": 143450, "epoch": 853} {"train_loss": -10.872967720031738, "global_step": 143451, "epoch": 853} {"train_loss": -10.740226745605469, "global_step": 143452, "epoch": 853} {"train_loss": -10.694544792175293, "global_step": 143453, "epoch": 853} {"train_loss": -10.783605575561523, "global_step": 143454, "epoch": 853} {"train_loss": -11.09262466430664, "global_step": 143455, "epoch": 853} {"train_loss": -10.661091804504395, "global_step": 143456, "epoch": 853} {"train_loss": -10.946771621704102, "global_step": 143457, "epoch": 853} {"train_loss": -10.685783386230469, "global_step": 143458, "epoch": 853} {"train_loss": -11.044916152954102, "global_step": 143459, "epoch": 853} {"train_loss": -10.904661178588867, "global_step": 143460, "epoch": 853} {"train_loss": -10.705816268920898, "global_step": 143461, "epoch": 853} {"train_loss": -10.865755081176758, "global_step": 143462, "epoch": 853} {"train_loss": -10.557418823242188, "global_step": 143463, "epoch": 853} {"train_loss": -9.993021965026855, "global_step": 143464, "epoch": 853} {"train_loss": -11.000324249267578, "global_step": 143465, "epoch": 853} {"train_loss": -10.242467880249023, "global_step": 143466, "epoch": 853} {"train_loss": -10.525405883789062, "global_step": 143467, "epoch": 853} {"train_loss": -10.515923500061035, "global_step": 143468, "epoch": 853} {"train_loss": -10.187561988830566, "global_step": 143469, "epoch": 853} {"train_loss": -10.553345680236816, "global_step": 143470, "epoch": 853} {"train_loss": -10.479777733484903, "global_step": 143471, "epoch": 853, "val_loss": 228212.28125} {"train_loss": -10.508403778076172, "global_step": 143472, "epoch": 854} {"train_loss": -10.779718399047852, "global_step": 143473, "epoch": 854} {"train_loss": -10.666358947753906, "global_step": 143474, "epoch": 854} {"train_loss": -10.477935791015625, "global_step": 143475, "epoch": 854} {"train_loss": -10.886003494262695, "global_step": 143476, "epoch": 854} {"train_loss": -10.453195571899414, "global_step": 143477, "epoch": 854} {"train_loss": -10.875242233276367, "global_step": 143478, "epoch": 854} {"train_loss": -10.520398139953613, "global_step": 143479, "epoch": 854} {"train_loss": -10.86038589477539, "global_step": 143480, "epoch": 854} {"train_loss": -10.640681266784668, "global_step": 143481, "epoch": 854} {"train_loss": -10.721471786499023, "global_step": 143482, "epoch": 854} {"train_loss": -10.87958812713623, "global_step": 143483, "epoch": 854} {"train_loss": -10.551579475402832, "global_step": 143484, "epoch": 854} {"train_loss": -10.992630004882812, "global_step": 143485, "epoch": 854} {"train_loss": -10.570039749145508, "global_step": 143486, "epoch": 854} {"train_loss": -10.602264404296875, "global_step": 143487, "epoch": 854} {"train_loss": -10.601754188537598, "global_step": 143488, "epoch": 854} {"train_loss": -10.684961318969727, "global_step": 143489, "epoch": 854} {"train_loss": -10.894655227661133, "global_step": 143490, "epoch": 854} {"train_loss": -10.440773963928223, "global_step": 143491, "epoch": 854} {"train_loss": -10.934707641601562, "global_step": 143492, "epoch": 854} {"train_loss": -10.75645923614502, "global_step": 143493, "epoch": 854} {"train_loss": -10.76789665222168, "global_step": 143494, "epoch": 854} {"train_loss": -10.689790725708008, "global_step": 143495, "epoch": 854} {"train_loss": -10.707367897033691, "global_step": 143496, "epoch": 854} {"train_loss": -10.871618270874023, "global_step": 143497, "epoch": 854} {"train_loss": -10.884506225585938, "global_step": 143498, "epoch": 854} {"train_loss": -10.845568656921387, "global_step": 143499, "epoch": 854} {"train_loss": -10.817176818847656, "global_step": 143500, "epoch": 854} {"train_loss": -10.465088844299316, "global_step": 143501, "epoch": 854} {"train_loss": -10.909974098205566, "global_step": 143502, "epoch": 854} {"train_loss": -10.375606536865234, "global_step": 143503, "epoch": 854} {"train_loss": -10.799968719482422, "global_step": 143504, "epoch": 854} {"train_loss": -10.75186824798584, "global_step": 143505, "epoch": 854} {"train_loss": -10.357440948486328, "global_step": 143506, "epoch": 854} {"train_loss": -10.412513732910156, "global_step": 143507, "epoch": 854} {"train_loss": -10.666891098022461, "global_step": 143508, "epoch": 854} {"train_loss": -10.607097625732422, "global_step": 143509, "epoch": 854} {"train_loss": -10.205245971679688, "global_step": 143510, "epoch": 854} {"train_loss": -10.731039047241211, "global_step": 143511, "epoch": 854} {"train_loss": -10.711697578430176, "global_step": 143512, "epoch": 854} {"train_loss": -10.492952346801758, "global_step": 143513, "epoch": 854} {"train_loss": -10.637096405029297, "global_step": 143514, "epoch": 854} {"train_loss": -10.374639511108398, "global_step": 143515, "epoch": 854} {"train_loss": -10.440730094909668, "global_step": 143516, "epoch": 854} {"train_loss": -10.346185684204102, "global_step": 143517, "epoch": 854} {"train_loss": -9.594881057739258, "global_step": 143518, "epoch": 854} {"train_loss": -10.242603302001953, "global_step": 143519, "epoch": 854} {"train_loss": -10.42601203918457, "global_step": 143520, "epoch": 854} {"train_loss": -10.114957809448242, "global_step": 143521, "epoch": 854} {"train_loss": -10.409013748168945, "global_step": 143522, "epoch": 854} {"train_loss": -9.984436988830566, "global_step": 143523, "epoch": 854} {"train_loss": -10.550888061523438, "global_step": 143524, "epoch": 854} {"train_loss": -10.002655982971191, "global_step": 143525, "epoch": 854} {"train_loss": -10.554418563842773, "global_step": 143526, "epoch": 854} {"train_loss": -10.239717483520508, "global_step": 143527, "epoch": 854} {"train_loss": -10.720878601074219, "global_step": 143528, "epoch": 854} {"train_loss": -10.149226188659668, "global_step": 143529, "epoch": 854} {"train_loss": -10.692696571350098, "global_step": 143530, "epoch": 854} {"train_loss": -10.437055587768555, "global_step": 143531, "epoch": 854} {"train_loss": -10.654067993164062, "global_step": 143532, "epoch": 854} {"train_loss": -10.663084030151367, "global_step": 143533, "epoch": 854} {"train_loss": -10.482544898986816, "global_step": 143534, "epoch": 854} {"train_loss": -10.53449535369873, "global_step": 143535, "epoch": 854} {"train_loss": -10.623640060424805, "global_step": 143536, "epoch": 854} {"train_loss": -10.527861595153809, "global_step": 143537, "epoch": 854} {"train_loss": -10.72390365600586, "global_step": 143538, "epoch": 854} {"train_loss": -10.747777938842773, "global_step": 143539, "epoch": 854} {"train_loss": -10.554964065551758, "global_step": 143540, "epoch": 854} {"train_loss": -10.701087951660156, "global_step": 143541, "epoch": 854} {"train_loss": -10.749268531799316, "global_step": 143542, "epoch": 854} {"train_loss": -10.455660820007324, "global_step": 143543, "epoch": 854} {"train_loss": -10.815132141113281, "global_step": 143544, "epoch": 854} {"train_loss": -10.722384452819824, "global_step": 143545, "epoch": 854} {"train_loss": -10.584104537963867, "global_step": 143546, "epoch": 854} {"train_loss": -10.698179244995117, "global_step": 143547, "epoch": 854} {"train_loss": -10.929464340209961, "global_step": 143548, "epoch": 854} {"train_loss": -10.294180870056152, "global_step": 143549, "epoch": 854} {"train_loss": -10.688915252685547, "global_step": 143550, "epoch": 854} {"train_loss": -10.20069694519043, "global_step": 143551, "epoch": 854} {"train_loss": -10.389291763305664, "global_step": 143552, "epoch": 854} {"train_loss": -10.438275337219238, "global_step": 143553, "epoch": 854} {"train_loss": -10.343137741088867, "global_step": 143554, "epoch": 854} {"train_loss": -10.683296203613281, "global_step": 143555, "epoch": 854} {"train_loss": -10.558950424194336, "global_step": 143556, "epoch": 854} {"train_loss": -10.411250114440918, "global_step": 143557, "epoch": 854} {"train_loss": -10.30157470703125, "global_step": 143558, "epoch": 854} {"train_loss": -10.067469596862793, "global_step": 143559, "epoch": 854} {"train_loss": -10.582671165466309, "global_step": 143560, "epoch": 854} {"train_loss": -10.50074577331543, "global_step": 143561, "epoch": 854} {"train_loss": -10.118602752685547, "global_step": 143562, "epoch": 854} {"train_loss": -10.5338716506958, "global_step": 143563, "epoch": 854} {"train_loss": -10.226662635803223, "global_step": 143564, "epoch": 854} {"train_loss": -10.755313873291016, "global_step": 143565, "epoch": 854} {"train_loss": -10.530017852783203, "global_step": 143566, "epoch": 854} {"train_loss": -10.480925559997559, "global_step": 143567, "epoch": 854} {"train_loss": -10.694562911987305, "global_step": 143568, "epoch": 854} {"train_loss": -10.509251594543457, "global_step": 143569, "epoch": 854} {"train_loss": -10.421126365661621, "global_step": 143570, "epoch": 854} {"train_loss": -10.383411407470703, "global_step": 143571, "epoch": 854} {"train_loss": -10.45966625213623, "global_step": 143572, "epoch": 854} {"train_loss": -10.307687759399414, "global_step": 143573, "epoch": 854} {"train_loss": -10.852742195129395, "global_step": 143574, "epoch": 854} {"train_loss": -10.368898391723633, "global_step": 143575, "epoch": 854} {"train_loss": -10.713888168334961, "global_step": 143576, "epoch": 854} {"train_loss": -10.492288589477539, "global_step": 143577, "epoch": 854} {"train_loss": -10.554912567138672, "global_step": 143578, "epoch": 854} {"train_loss": -10.690208435058594, "global_step": 143579, "epoch": 854} {"train_loss": -10.474987030029297, "global_step": 143580, "epoch": 854} {"train_loss": -10.658191680908203, "global_step": 143581, "epoch": 854} {"train_loss": -10.522544860839844, "global_step": 143582, "epoch": 854} {"train_loss": -10.002874374389648, "global_step": 143583, "epoch": 854} {"train_loss": -10.717802047729492, "global_step": 143584, "epoch": 854} {"train_loss": -10.426469802856445, "global_step": 143585, "epoch": 854} {"train_loss": -10.654500961303711, "global_step": 143586, "epoch": 854} {"train_loss": -10.613765716552734, "global_step": 143587, "epoch": 854} {"train_loss": -10.605562210083008, "global_step": 143588, "epoch": 854} {"train_loss": -10.764965057373047, "global_step": 143589, "epoch": 854} {"train_loss": -10.53709888458252, "global_step": 143590, "epoch": 854} {"train_loss": -10.576408386230469, "global_step": 143591, "epoch": 854} {"train_loss": -10.351566314697266, "global_step": 143592, "epoch": 854} {"train_loss": -10.446247100830078, "global_step": 143593, "epoch": 854} {"train_loss": -10.32843017578125, "global_step": 143594, "epoch": 854} {"train_loss": -10.64559555053711, "global_step": 143595, "epoch": 854} {"train_loss": -10.22238540649414, "global_step": 143596, "epoch": 854} {"train_loss": -10.53441333770752, "global_step": 143597, "epoch": 854} {"train_loss": -10.305274963378906, "global_step": 143598, "epoch": 854} {"train_loss": -10.194681167602539, "global_step": 143599, "epoch": 854} {"train_loss": -10.473240852355957, "global_step": 143600, "epoch": 854} {"train_loss": -10.589741706848145, "global_step": 143601, "epoch": 854} {"train_loss": -10.35891342163086, "global_step": 143602, "epoch": 854} {"train_loss": -10.326752662658691, "global_step": 143603, "epoch": 854} {"train_loss": -10.522497177124023, "global_step": 143604, "epoch": 854} {"train_loss": -10.673531532287598, "global_step": 143605, "epoch": 854} {"train_loss": -10.218168258666992, "global_step": 143606, "epoch": 854} {"train_loss": -10.700698852539062, "global_step": 143607, "epoch": 854} {"train_loss": -10.523994445800781, "global_step": 143608, "epoch": 854} {"train_loss": -10.384162902832031, "global_step": 143609, "epoch": 854} {"train_loss": -10.415892601013184, "global_step": 143610, "epoch": 854} {"train_loss": -10.445030212402344, "global_step": 143611, "epoch": 854} {"train_loss": -10.698470115661621, "global_step": 143612, "epoch": 854} {"train_loss": -10.450200080871582, "global_step": 143613, "epoch": 854} {"train_loss": -10.633342742919922, "global_step": 143614, "epoch": 854} {"train_loss": -10.70175552368164, "global_step": 143615, "epoch": 854} {"train_loss": -10.149471282958984, "global_step": 143616, "epoch": 854} {"train_loss": -10.935612678527832, "global_step": 143617, "epoch": 854} {"train_loss": -10.640277862548828, "global_step": 143618, "epoch": 854} {"train_loss": -10.645785331726074, "global_step": 143619, "epoch": 854} {"train_loss": -10.530156135559082, "global_step": 143620, "epoch": 854} {"train_loss": -10.890310287475586, "global_step": 143621, "epoch": 854} {"train_loss": -10.579107284545898, "global_step": 143622, "epoch": 854} {"train_loss": -10.549835205078125, "global_step": 143623, "epoch": 854} {"train_loss": -10.612113952636719, "global_step": 143624, "epoch": 854} {"train_loss": -10.870843887329102, "global_step": 143625, "epoch": 854} {"train_loss": -10.802846908569336, "global_step": 143626, "epoch": 854} {"train_loss": -10.953234672546387, "global_step": 143627, "epoch": 854} {"train_loss": -10.60481071472168, "global_step": 143628, "epoch": 854} {"train_loss": -10.843976974487305, "global_step": 143629, "epoch": 854} {"train_loss": -10.629069328308105, "global_step": 143630, "epoch": 854} {"train_loss": -10.766790390014648, "global_step": 143631, "epoch": 854} {"train_loss": -10.779895782470703, "global_step": 143632, "epoch": 854} {"train_loss": -10.675503730773926, "global_step": 143633, "epoch": 854} {"train_loss": -10.79220199584961, "global_step": 143634, "epoch": 854} {"train_loss": -10.815950393676758, "global_step": 143635, "epoch": 854} {"train_loss": -10.65698528289795, "global_step": 143636, "epoch": 854} {"train_loss": -10.938088417053223, "global_step": 143637, "epoch": 854} {"train_loss": -10.872658729553223, "global_step": 143638, "epoch": 854} {"train_loss": -10.566194772720337, "global_step": 143639, "epoch": 854, "val_loss": 227262.703125} {"train_loss": -10.913457870483398, "global_step": 143640, "epoch": 855} {"train_loss": -10.632009506225586, "global_step": 143641, "epoch": 855} {"train_loss": -10.567426681518555, "global_step": 143642, "epoch": 855} {"train_loss": -10.951711654663086, "global_step": 143643, "epoch": 855} {"train_loss": -10.474302291870117, "global_step": 143644, "epoch": 855} {"train_loss": -10.822303771972656, "global_step": 143645, "epoch": 855} {"train_loss": -10.593497276306152, "global_step": 143646, "epoch": 855} {"train_loss": -10.523836135864258, "global_step": 143647, "epoch": 855} {"train_loss": -10.731512069702148, "global_step": 143648, "epoch": 855} {"train_loss": -10.565094947814941, "global_step": 143649, "epoch": 855} {"train_loss": -10.776268005371094, "global_step": 143650, "epoch": 855} {"train_loss": -10.819005966186523, "global_step": 143651, "epoch": 855} {"train_loss": -10.87026596069336, "global_step": 143652, "epoch": 855} {"train_loss": -10.631335258483887, "global_step": 143653, "epoch": 855} {"train_loss": -10.69536018371582, "global_step": 143654, "epoch": 855} {"train_loss": -10.370628356933594, "global_step": 143655, "epoch": 855} {"train_loss": -10.985177993774414, "global_step": 143656, "epoch": 855} {"train_loss": -10.465919494628906, "global_step": 143657, "epoch": 855} {"train_loss": -10.442483901977539, "global_step": 143658, "epoch": 855} {"train_loss": -10.530450820922852, "global_step": 143659, "epoch": 855} {"train_loss": -10.255708694458008, "global_step": 143660, "epoch": 855} {"train_loss": -10.793329238891602, "global_step": 143661, "epoch": 855} {"train_loss": -10.314765930175781, "global_step": 143662, "epoch": 855} {"train_loss": -10.412858009338379, "global_step": 143663, "epoch": 855} {"train_loss": -10.59096908569336, "global_step": 143664, "epoch": 855} {"train_loss": -10.674437522888184, "global_step": 143665, "epoch": 855} {"train_loss": -10.425335884094238, "global_step": 143666, "epoch": 855} {"train_loss": -10.605212211608887, "global_step": 143667, "epoch": 855} {"train_loss": -10.698378562927246, "global_step": 143668, "epoch": 855} {"train_loss": -10.571131706237793, "global_step": 143669, "epoch": 855} {"train_loss": -10.924774169921875, "global_step": 143670, "epoch": 855} {"train_loss": -9.928245544433594, "global_step": 143671, "epoch": 855} {"train_loss": -10.524738311767578, "global_step": 143672, "epoch": 855} {"train_loss": -10.799235343933105, "global_step": 143673, "epoch": 855} {"train_loss": -10.388476371765137, "global_step": 143674, "epoch": 855} {"train_loss": -10.680211067199707, "global_step": 143675, "epoch": 855} {"train_loss": -10.599834442138672, "global_step": 143676, "epoch": 855} {"train_loss": -10.699070930480957, "global_step": 143677, "epoch": 855} {"train_loss": -10.471612930297852, "global_step": 143678, "epoch": 855} {"train_loss": -10.833114624023438, "global_step": 143679, "epoch": 855} {"train_loss": -10.80327033996582, "global_step": 143680, "epoch": 855} {"train_loss": -10.454769134521484, "global_step": 143681, "epoch": 855} {"train_loss": -10.622374534606934, "global_step": 143682, "epoch": 855} {"train_loss": -10.548314094543457, "global_step": 143683, "epoch": 855} {"train_loss": -10.716936111450195, "global_step": 143684, "epoch": 855} {"train_loss": -10.678028106689453, "global_step": 143685, "epoch": 855} {"train_loss": -10.835110664367676, "global_step": 143686, "epoch": 855} {"train_loss": -11.058920860290527, "global_step": 143687, "epoch": 855} {"train_loss": -10.604623794555664, "global_step": 143688, "epoch": 855} {"train_loss": -10.656292915344238, "global_step": 143689, "epoch": 855} {"train_loss": -10.721002578735352, "global_step": 143690, "epoch": 855} {"train_loss": -10.729440689086914, "global_step": 143691, "epoch": 855} {"train_loss": -10.508593559265137, "global_step": 143692, "epoch": 855} {"train_loss": -10.332632064819336, "global_step": 143693, "epoch": 855} {"train_loss": -10.593246459960938, "global_step": 143694, "epoch": 855} {"train_loss": -10.394025802612305, "global_step": 143695, "epoch": 855} {"train_loss": -10.891586303710938, "global_step": 143696, "epoch": 855} {"train_loss": -10.389106750488281, "global_step": 143697, "epoch": 855} {"train_loss": -10.82632827758789, "global_step": 143698, "epoch": 855} {"train_loss": -10.441688537597656, "global_step": 143699, "epoch": 855} {"train_loss": -10.301032066345215, "global_step": 143700, "epoch": 855} {"train_loss": -10.680763244628906, "global_step": 143701, "epoch": 855} {"train_loss": -10.498555183410645, "global_step": 143702, "epoch": 855} {"train_loss": -10.302790641784668, "global_step": 143703, "epoch": 855} {"train_loss": -10.71572494506836, "global_step": 143704, "epoch": 855} {"train_loss": -10.464031219482422, "global_step": 143705, "epoch": 855} {"train_loss": -10.637870788574219, "global_step": 143706, "epoch": 855} {"train_loss": -10.280482292175293, "global_step": 143707, "epoch": 855} {"train_loss": -10.418107986450195, "global_step": 143708, "epoch": 855} {"train_loss": -10.944229125976562, "global_step": 143709, "epoch": 855} {"train_loss": -10.502399444580078, "global_step": 143710, "epoch": 855} {"train_loss": -10.947263717651367, "global_step": 143711, "epoch": 855} {"train_loss": -10.45169448852539, "global_step": 143712, "epoch": 855} {"train_loss": -10.540107727050781, "global_step": 143713, "epoch": 855} {"train_loss": -10.600960731506348, "global_step": 143714, "epoch": 855} {"train_loss": -10.471760749816895, "global_step": 143715, "epoch": 855} {"train_loss": -10.749734878540039, "global_step": 143716, "epoch": 855} {"train_loss": -10.703620910644531, "global_step": 143717, "epoch": 855} {"train_loss": -10.535322189331055, "global_step": 143718, "epoch": 855} {"train_loss": -10.825488090515137, "global_step": 143719, "epoch": 855} {"train_loss": -10.340301513671875, "global_step": 143720, "epoch": 855} {"train_loss": -10.711034774780273, "global_step": 143721, "epoch": 855} {"train_loss": -10.820409774780273, "global_step": 143722, "epoch": 855} {"train_loss": -10.44682502746582, "global_step": 143723, "epoch": 855} {"train_loss": -10.522482872009277, "global_step": 143724, "epoch": 855} {"train_loss": -10.157328605651855, "global_step": 143725, "epoch": 855} {"train_loss": -10.238558769226074, "global_step": 143726, "epoch": 855} {"train_loss": -10.628091812133789, "global_step": 143727, "epoch": 855} {"train_loss": -10.404966354370117, "global_step": 143728, "epoch": 855} {"train_loss": -10.598296165466309, "global_step": 143729, "epoch": 855} {"train_loss": -10.787028312683105, "global_step": 143730, "epoch": 855} {"train_loss": -10.392247200012207, "global_step": 143731, "epoch": 855} {"train_loss": -10.342975616455078, "global_step": 143732, "epoch": 855} {"train_loss": -10.609472274780273, "global_step": 143733, "epoch": 855} {"train_loss": -10.036225318908691, "global_step": 143734, "epoch": 855} {"train_loss": -10.73282241821289, "global_step": 143735, "epoch": 855} {"train_loss": -10.235493659973145, "global_step": 143736, "epoch": 855} {"train_loss": -10.796845436096191, "global_step": 143737, "epoch": 855} {"train_loss": -10.731231689453125, "global_step": 143738, "epoch": 855} {"train_loss": -10.49437141418457, "global_step": 143739, "epoch": 855} {"train_loss": -10.735203742980957, "global_step": 143740, "epoch": 855} {"train_loss": -10.608145713806152, "global_step": 143741, "epoch": 855} {"train_loss": -10.431254386901855, "global_step": 143742, "epoch": 855} {"train_loss": -10.738161087036133, "global_step": 143743, "epoch": 855} {"train_loss": -10.456720352172852, "global_step": 143744, "epoch": 855} {"train_loss": -10.772315979003906, "global_step": 143745, "epoch": 855} {"train_loss": -10.588203430175781, "global_step": 143746, "epoch": 855} {"train_loss": -10.288745880126953, "global_step": 143747, "epoch": 855} {"train_loss": -10.756683349609375, "global_step": 143748, "epoch": 855} {"train_loss": -10.155920028686523, "global_step": 143749, "epoch": 855} {"train_loss": -10.604421615600586, "global_step": 143750, "epoch": 855} {"train_loss": -10.200535774230957, "global_step": 143751, "epoch": 855} {"train_loss": -10.499710083007812, "global_step": 143752, "epoch": 855} {"train_loss": -10.566393852233887, "global_step": 143753, "epoch": 855} {"train_loss": -10.676624298095703, "global_step": 143754, "epoch": 855} {"train_loss": -10.326379776000977, "global_step": 143755, "epoch": 855} {"train_loss": -10.448163986206055, "global_step": 143756, "epoch": 855} {"train_loss": -10.581421852111816, "global_step": 143757, "epoch": 855} {"train_loss": -10.375884056091309, "global_step": 143758, "epoch": 855} {"train_loss": -10.546995162963867, "global_step": 143759, "epoch": 855} {"train_loss": -10.19276237487793, "global_step": 143760, "epoch": 855} {"train_loss": -10.630435943603516, "global_step": 143761, "epoch": 855} {"train_loss": -10.264089584350586, "global_step": 143762, "epoch": 855} {"train_loss": -10.261529922485352, "global_step": 143763, "epoch": 855} {"train_loss": -9.891551971435547, "global_step": 143764, "epoch": 855} {"train_loss": -9.563239097595215, "global_step": 143765, "epoch": 855} {"train_loss": -10.103008270263672, "global_step": 143766, "epoch": 855} {"train_loss": -10.382134437561035, "global_step": 143767, "epoch": 855} {"train_loss": -10.424079895019531, "global_step": 143768, "epoch": 855} {"train_loss": -10.07774543762207, "global_step": 143769, "epoch": 855} {"train_loss": -10.429349899291992, "global_step": 143770, "epoch": 855} {"train_loss": -10.59164810180664, "global_step": 143771, "epoch": 855} {"train_loss": -10.40975284576416, "global_step": 143772, "epoch": 855} {"train_loss": -10.697282791137695, "global_step": 143773, "epoch": 855} {"train_loss": -10.589584350585938, "global_step": 143774, "epoch": 855} {"train_loss": -10.551576614379883, "global_step": 143775, "epoch": 855} {"train_loss": -10.570859909057617, "global_step": 143776, "epoch": 855} {"train_loss": -10.654342651367188, "global_step": 143777, "epoch": 855} {"train_loss": -10.705215454101562, "global_step": 143778, "epoch": 855} {"train_loss": -10.48271369934082, "global_step": 143779, "epoch": 855} {"train_loss": -10.626699447631836, "global_step": 143780, "epoch": 855} {"train_loss": -10.759284019470215, "global_step": 143781, "epoch": 855} {"train_loss": -10.540641784667969, "global_step": 143782, "epoch": 855} {"train_loss": -10.838560104370117, "global_step": 143783, "epoch": 855} {"train_loss": -10.68030071258545, "global_step": 143784, "epoch": 855} {"train_loss": -10.735734939575195, "global_step": 143785, "epoch": 855} {"train_loss": -10.883905410766602, "global_step": 143786, "epoch": 855} {"train_loss": -10.59161376953125, "global_step": 143787, "epoch": 855} {"train_loss": -10.52409553527832, "global_step": 143788, "epoch": 855} {"train_loss": -10.725915908813477, "global_step": 143789, "epoch": 855} {"train_loss": -10.395793914794922, "global_step": 143790, "epoch": 855} {"train_loss": -10.8651762008667, "global_step": 143791, "epoch": 855} {"train_loss": -10.48446273803711, "global_step": 143792, "epoch": 855} {"train_loss": -10.711236953735352, "global_step": 143793, "epoch": 855} {"train_loss": -10.731865882873535, "global_step": 143794, "epoch": 855} {"train_loss": -10.677753448486328, "global_step": 143795, "epoch": 855} {"train_loss": -10.508565902709961, "global_step": 143796, "epoch": 855} {"train_loss": -10.577062606811523, "global_step": 143797, "epoch": 855} {"train_loss": -10.916664123535156, "global_step": 143798, "epoch": 855} {"train_loss": -10.470196723937988, "global_step": 143799, "epoch": 855} {"train_loss": -10.968144416809082, "global_step": 143800, "epoch": 855} {"train_loss": -10.492636680603027, "global_step": 143801, "epoch": 855} {"train_loss": -10.920442581176758, "global_step": 143802, "epoch": 855} {"train_loss": -10.734307289123535, "global_step": 143803, "epoch": 855} {"train_loss": -10.61489486694336, "global_step": 143804, "epoch": 855} {"train_loss": -10.925357818603516, "global_step": 143805, "epoch": 855} {"train_loss": -10.399890899658203, "global_step": 143806, "epoch": 855} {"train_loss": -10.571119450387501, "global_step": 143807, "epoch": 855, "val_loss": 228367.671875, "train_action_mse_error": 1.5404318571090698} {"train_loss": -10.388139724731445, "global_step": 143808, "epoch": 856} {"train_loss": -10.54617977142334, "global_step": 143809, "epoch": 856} {"train_loss": -10.671367645263672, "global_step": 143810, "epoch": 856} {"train_loss": -10.083351135253906, "global_step": 143811, "epoch": 856} {"train_loss": -10.663117408752441, "global_step": 143812, "epoch": 856} {"train_loss": -10.321219444274902, "global_step": 143813, "epoch": 856} {"train_loss": -10.638704299926758, "global_step": 143814, "epoch": 856} {"train_loss": -10.624653816223145, "global_step": 143815, "epoch": 856} {"train_loss": -10.419706344604492, "global_step": 143816, "epoch": 856} {"train_loss": -10.689620971679688, "global_step": 143817, "epoch": 856} {"train_loss": -10.44176197052002, "global_step": 143818, "epoch": 856} {"train_loss": -10.552597045898438, "global_step": 143819, "epoch": 856} {"train_loss": -10.442825317382812, "global_step": 143820, "epoch": 856} {"train_loss": -10.39981460571289, "global_step": 143821, "epoch": 856} {"train_loss": -10.202766418457031, "global_step": 143822, "epoch": 856} {"train_loss": -9.679534912109375, "global_step": 143823, "epoch": 856} {"train_loss": -9.802923202514648, "global_step": 143824, "epoch": 856} {"train_loss": -10.450176239013672, "global_step": 143825, "epoch": 856} {"train_loss": -10.412382125854492, "global_step": 143826, "epoch": 856} {"train_loss": -10.281757354736328, "global_step": 143827, "epoch": 856} {"train_loss": -10.741842269897461, "global_step": 143828, "epoch": 856} {"train_loss": -10.201022148132324, "global_step": 143829, "epoch": 856} {"train_loss": -10.513921737670898, "global_step": 143830, "epoch": 856} {"train_loss": -10.353260040283203, "global_step": 143831, "epoch": 856} {"train_loss": -10.654926300048828, "global_step": 143832, "epoch": 856} {"train_loss": -10.260104179382324, "global_step": 143833, "epoch": 856} {"train_loss": -10.587878227233887, "global_step": 143834, "epoch": 856} {"train_loss": -10.08618450164795, "global_step": 143835, "epoch": 856} {"train_loss": -10.80839729309082, "global_step": 143836, "epoch": 856} {"train_loss": -10.318486213684082, "global_step": 143837, "epoch": 856} {"train_loss": -10.579368591308594, "global_step": 143838, "epoch": 856} {"train_loss": -10.28079605102539, "global_step": 143839, "epoch": 856} {"train_loss": -10.980953216552734, "global_step": 143840, "epoch": 856} {"train_loss": -10.497828483581543, "global_step": 143841, "epoch": 856} {"train_loss": -10.703956604003906, "global_step": 143842, "epoch": 856} {"train_loss": -10.480462074279785, "global_step": 143843, "epoch": 856} {"train_loss": -10.634855270385742, "global_step": 143844, "epoch": 856} {"train_loss": -10.325662612915039, "global_step": 143845, "epoch": 856} {"train_loss": -10.536989212036133, "global_step": 143846, "epoch": 856} {"train_loss": -10.619980812072754, "global_step": 143847, "epoch": 856} {"train_loss": -10.667885780334473, "global_step": 143848, "epoch": 856} {"train_loss": -10.606228828430176, "global_step": 143849, "epoch": 856} {"train_loss": -10.734889030456543, "global_step": 143850, "epoch": 856} {"train_loss": -10.862958908081055, "global_step": 143851, "epoch": 856} {"train_loss": -10.767045974731445, "global_step": 143852, "epoch": 856} {"train_loss": -10.706023216247559, "global_step": 143853, "epoch": 856} {"train_loss": -10.804378509521484, "global_step": 143854, "epoch": 856} {"train_loss": -10.933187484741211, "global_step": 143855, "epoch": 856} {"train_loss": -10.722206115722656, "global_step": 143856, "epoch": 856} {"train_loss": -10.845760345458984, "global_step": 143857, "epoch": 856} {"train_loss": -10.58620834350586, "global_step": 143858, "epoch": 856} {"train_loss": -10.729269027709961, "global_step": 143859, "epoch": 856} {"train_loss": -10.83401870727539, "global_step": 143860, "epoch": 856} {"train_loss": -10.720437049865723, "global_step": 143861, "epoch": 856} {"train_loss": -10.884230613708496, "global_step": 143862, "epoch": 856} {"train_loss": -10.825387001037598, "global_step": 143863, "epoch": 856} {"train_loss": -11.021340370178223, "global_step": 143864, "epoch": 856} {"train_loss": -10.66151237487793, "global_step": 143865, "epoch": 856} {"train_loss": -10.482821464538574, "global_step": 143866, "epoch": 856} {"train_loss": -10.74131965637207, "global_step": 143867, "epoch": 856} {"train_loss": -10.810861587524414, "global_step": 143868, "epoch": 856} {"train_loss": -10.788046836853027, "global_step": 143869, "epoch": 856} {"train_loss": -11.043627738952637, "global_step": 143870, "epoch": 856} {"train_loss": -10.631580352783203, "global_step": 143871, "epoch": 856} {"train_loss": -11.10898208618164, "global_step": 143872, "epoch": 856} {"train_loss": -10.600975036621094, "global_step": 143873, "epoch": 856} {"train_loss": -10.898372650146484, "global_step": 143874, "epoch": 856} {"train_loss": -10.522102355957031, "global_step": 143875, "epoch": 856} {"train_loss": -11.054485321044922, "global_step": 143876, "epoch": 856} {"train_loss": -10.58871841430664, "global_step": 143877, "epoch": 856} {"train_loss": -10.473796844482422, "global_step": 143878, "epoch": 856} {"train_loss": -9.652817726135254, "global_step": 143879, "epoch": 856} {"train_loss": -10.62988567352295, "global_step": 143880, "epoch": 856} {"train_loss": -10.088372230529785, "global_step": 143881, "epoch": 856} {"train_loss": -10.830216407775879, "global_step": 143882, "epoch": 856} {"train_loss": -10.50686264038086, "global_step": 143883, "epoch": 856} {"train_loss": -10.383938789367676, "global_step": 143884, "epoch": 856} {"train_loss": -10.452332496643066, "global_step": 143885, "epoch": 856} {"train_loss": -10.56257152557373, "global_step": 143886, "epoch": 856} {"train_loss": -10.239452362060547, "global_step": 143887, "epoch": 856} {"train_loss": -10.58232307434082, "global_step": 143888, "epoch": 856} {"train_loss": -10.18996810913086, "global_step": 143889, "epoch": 856} {"train_loss": -10.174927711486816, "global_step": 143890, "epoch": 856} {"train_loss": -10.277351379394531, "global_step": 143891, "epoch": 856} {"train_loss": -9.925174713134766, "global_step": 143892, "epoch": 856} {"train_loss": -8.810945510864258, "global_step": 143893, "epoch": 856} {"train_loss": -10.40230941772461, "global_step": 143894, "epoch": 856} {"train_loss": -10.077988624572754, "global_step": 143895, "epoch": 856} {"train_loss": -9.970807075500488, "global_step": 143896, "epoch": 856} {"train_loss": -10.306077003479004, "global_step": 143897, "epoch": 856} {"train_loss": -10.354307174682617, "global_step": 143898, "epoch": 856} {"train_loss": -10.425703048706055, "global_step": 143899, "epoch": 856} {"train_loss": -10.742170333862305, "global_step": 143900, "epoch": 856} {"train_loss": -10.296769142150879, "global_step": 143901, "epoch": 856} {"train_loss": -10.388648986816406, "global_step": 143902, "epoch": 856} {"train_loss": -10.446755409240723, "global_step": 143903, "epoch": 856} {"train_loss": -10.48853874206543, "global_step": 143904, "epoch": 856} {"train_loss": -10.358229637145996, "global_step": 143905, "epoch": 856} {"train_loss": -10.836874008178711, "global_step": 143906, "epoch": 856} {"train_loss": -10.229413986206055, "global_step": 143907, "epoch": 856} {"train_loss": -10.473846435546875, "global_step": 143908, "epoch": 856} {"train_loss": -10.598758697509766, "global_step": 143909, "epoch": 856} {"train_loss": -10.454183578491211, "global_step": 143910, "epoch": 856} {"train_loss": -10.486825942993164, "global_step": 143911, "epoch": 856} {"train_loss": -10.377058029174805, "global_step": 143912, "epoch": 856} {"train_loss": -10.54638671875, "global_step": 143913, "epoch": 856} {"train_loss": -10.251827239990234, "global_step": 143914, "epoch": 856} {"train_loss": -10.713539123535156, "global_step": 143915, "epoch": 856} {"train_loss": -10.501623153686523, "global_step": 143916, "epoch": 856} {"train_loss": -10.806217193603516, "global_step": 143917, "epoch": 856} {"train_loss": -10.721328735351562, "global_step": 143918, "epoch": 856} {"train_loss": -10.844748497009277, "global_step": 143919, "epoch": 856} {"train_loss": -10.471967697143555, "global_step": 143920, "epoch": 856} {"train_loss": -10.534062385559082, "global_step": 143921, "epoch": 856} {"train_loss": -10.75379753112793, "global_step": 143922, "epoch": 856} {"train_loss": -10.460693359375, "global_step": 143923, "epoch": 856} {"train_loss": -10.842826843261719, "global_step": 143924, "epoch": 856} {"train_loss": -10.332218170166016, "global_step": 143925, "epoch": 856} {"train_loss": -10.913338661193848, "global_step": 143926, "epoch": 856} {"train_loss": -10.445493698120117, "global_step": 143927, "epoch": 856} {"train_loss": -10.86046028137207, "global_step": 143928, "epoch": 856} {"train_loss": -10.742030143737793, "global_step": 143929, "epoch": 856} {"train_loss": -10.70786190032959, "global_step": 143930, "epoch": 856} {"train_loss": -10.732934951782227, "global_step": 143931, "epoch": 856} {"train_loss": -10.873950004577637, "global_step": 143932, "epoch": 856} {"train_loss": -10.836925506591797, "global_step": 143933, "epoch": 856} {"train_loss": -10.800729751586914, "global_step": 143934, "epoch": 856} {"train_loss": -10.870088577270508, "global_step": 143935, "epoch": 856} {"train_loss": -10.584538459777832, "global_step": 143936, "epoch": 856} {"train_loss": -10.722290992736816, "global_step": 143937, "epoch": 856} {"train_loss": -10.89566421508789, "global_step": 143938, "epoch": 856} {"train_loss": -10.613097190856934, "global_step": 143939, "epoch": 856} {"train_loss": -10.896280288696289, "global_step": 143940, "epoch": 856} {"train_loss": -10.545039176940918, "global_step": 143941, "epoch": 856} {"train_loss": -10.701702117919922, "global_step": 143942, "epoch": 856} {"train_loss": -10.891763687133789, "global_step": 143943, "epoch": 856} {"train_loss": -10.985944747924805, "global_step": 143944, "epoch": 856} {"train_loss": -10.5756254196167, "global_step": 143945, "epoch": 856} {"train_loss": -10.907450675964355, "global_step": 143946, "epoch": 856} {"train_loss": -10.288509368896484, "global_step": 143947, "epoch": 856} {"train_loss": -10.063222885131836, "global_step": 143948, "epoch": 856} {"train_loss": -10.72815990447998, "global_step": 143949, "epoch": 856} {"train_loss": -10.484376907348633, "global_step": 143950, "epoch": 856} {"train_loss": -10.556281089782715, "global_step": 143951, "epoch": 856} {"train_loss": -10.29389476776123, "global_step": 143952, "epoch": 856} {"train_loss": -10.629408836364746, "global_step": 143953, "epoch": 856} {"train_loss": -10.572179794311523, "global_step": 143954, "epoch": 856} {"train_loss": -10.512567520141602, "global_step": 143955, "epoch": 856} {"train_loss": -10.583769798278809, "global_step": 143956, "epoch": 856} {"train_loss": -10.572443008422852, "global_step": 143957, "epoch": 856} {"train_loss": -10.891570091247559, "global_step": 143958, "epoch": 856} {"train_loss": -10.50008487701416, "global_step": 143959, "epoch": 856} {"train_loss": -10.717607498168945, "global_step": 143960, "epoch": 856} {"train_loss": -10.853562355041504, "global_step": 143961, "epoch": 856} {"train_loss": -10.611586570739746, "global_step": 143962, "epoch": 856} {"train_loss": -10.836742401123047, "global_step": 143963, "epoch": 856} {"train_loss": -10.614727020263672, "global_step": 143964, "epoch": 856} {"train_loss": -10.451423645019531, "global_step": 143965, "epoch": 856} {"train_loss": -10.876022338867188, "global_step": 143966, "epoch": 856} {"train_loss": -10.640027046203613, "global_step": 143967, "epoch": 856} {"train_loss": -10.812347412109375, "global_step": 143968, "epoch": 856} {"train_loss": -10.42238712310791, "global_step": 143969, "epoch": 856} {"train_loss": -10.668015480041504, "global_step": 143970, "epoch": 856} {"train_loss": -10.635978698730469, "global_step": 143971, "epoch": 856} {"train_loss": -10.534637451171875, "global_step": 143972, "epoch": 856} {"train_loss": -11.046585083007812, "global_step": 143973, "epoch": 856} {"train_loss": -10.53037166595459, "global_step": 143974, "epoch": 856} {"train_loss": -10.558096976507278, "global_step": 143975, "epoch": 856, "val_loss": 228409.21875} {"train_loss": -10.705120086669922, "global_step": 143976, "epoch": 857} {"train_loss": -10.50267505645752, "global_step": 143977, "epoch": 857} {"train_loss": -10.73306655883789, "global_step": 143978, "epoch": 857} {"train_loss": -10.479715347290039, "global_step": 143979, "epoch": 857} {"train_loss": -10.80113410949707, "global_step": 143980, "epoch": 857} {"train_loss": -10.637646675109863, "global_step": 143981, "epoch": 857} {"train_loss": -10.668350219726562, "global_step": 143982, "epoch": 857} {"train_loss": -10.899412155151367, "global_step": 143983, "epoch": 857} {"train_loss": -10.718486785888672, "global_step": 143984, "epoch": 857} {"train_loss": -10.901494979858398, "global_step": 143985, "epoch": 857} {"train_loss": -10.34738540649414, "global_step": 143986, "epoch": 857} {"train_loss": -10.658699035644531, "global_step": 143987, "epoch": 857} {"train_loss": -10.855871200561523, "global_step": 143988, "epoch": 857} {"train_loss": -10.799312591552734, "global_step": 143989, "epoch": 857} {"train_loss": -10.588985443115234, "global_step": 143990, "epoch": 857} {"train_loss": -10.710813522338867, "global_step": 143991, "epoch": 857} {"train_loss": -10.831954956054688, "global_step": 143992, "epoch": 857} {"train_loss": -10.475240707397461, "global_step": 143993, "epoch": 857} {"train_loss": -10.760461807250977, "global_step": 143994, "epoch": 857} {"train_loss": -10.755041122436523, "global_step": 143995, "epoch": 857} {"train_loss": -10.800997734069824, "global_step": 143996, "epoch": 857} {"train_loss": -10.714824676513672, "global_step": 143997, "epoch": 857} {"train_loss": -10.597481727600098, "global_step": 143998, "epoch": 857} {"train_loss": -10.875944137573242, "global_step": 143999, "epoch": 857} {"train_loss": -10.794052124023438, "global_step": 144000, "epoch": 857} {"train_loss": -10.438926696777344, "global_step": 144001, "epoch": 857} {"train_loss": -10.756758689880371, "global_step": 144002, "epoch": 857} {"train_loss": -10.683704376220703, "global_step": 144003, "epoch": 857} {"train_loss": -10.896127700805664, "global_step": 144004, "epoch": 857} {"train_loss": -10.5595703125, "global_step": 144005, "epoch": 857} {"train_loss": -10.94428825378418, "global_step": 144006, "epoch": 857} {"train_loss": -10.722916603088379, "global_step": 144007, "epoch": 857} {"train_loss": -10.765392303466797, "global_step": 144008, "epoch": 857} {"train_loss": -10.667336463928223, "global_step": 144009, "epoch": 857} {"train_loss": -10.532102584838867, "global_step": 144010, "epoch": 857} {"train_loss": -10.52901554107666, "global_step": 144011, "epoch": 857} {"train_loss": -10.71103286743164, "global_step": 144012, "epoch": 857} {"train_loss": -10.645384788513184, "global_step": 144013, "epoch": 857} {"train_loss": -10.967443466186523, "global_step": 144014, "epoch": 857} {"train_loss": -10.84261417388916, "global_step": 144015, "epoch": 857} {"train_loss": -10.58538818359375, "global_step": 144016, "epoch": 857} {"train_loss": -10.336668014526367, "global_step": 144017, "epoch": 857} {"train_loss": -10.412839889526367, "global_step": 144018, "epoch": 857} {"train_loss": -9.911140441894531, "global_step": 144019, "epoch": 857} {"train_loss": -9.897222518920898, "global_step": 144020, "epoch": 857} {"train_loss": -10.048806190490723, "global_step": 144021, "epoch": 857} {"train_loss": -9.622523307800293, "global_step": 144022, "epoch": 857} {"train_loss": -10.328914642333984, "global_step": 144023, "epoch": 857} {"train_loss": -8.930747985839844, "global_step": 144024, "epoch": 857} {"train_loss": -9.970559120178223, "global_step": 144025, "epoch": 857} {"train_loss": -10.105886459350586, "global_step": 144026, "epoch": 857} {"train_loss": -9.673276901245117, "global_step": 144027, "epoch": 857} {"train_loss": -9.84790325164795, "global_step": 144028, "epoch": 857} {"train_loss": -9.4600830078125, "global_step": 144029, "epoch": 857} {"train_loss": -9.861303329467773, "global_step": 144030, "epoch": 857} {"train_loss": -9.997406959533691, "global_step": 144031, "epoch": 857} {"train_loss": -10.154056549072266, "global_step": 144032, "epoch": 857} {"train_loss": -10.32870864868164, "global_step": 144033, "epoch": 857} {"train_loss": -10.256158828735352, "global_step": 144034, "epoch": 857} {"train_loss": -10.15068244934082, "global_step": 144035, "epoch": 857} {"train_loss": -9.94723129272461, "global_step": 144036, "epoch": 857} {"train_loss": -10.410677909851074, "global_step": 144037, "epoch": 857} {"train_loss": -10.191400527954102, "global_step": 144038, "epoch": 857} {"train_loss": -10.44862174987793, "global_step": 144039, "epoch": 857} {"train_loss": -10.25589370727539, "global_step": 144040, "epoch": 857} {"train_loss": -10.146417617797852, "global_step": 144041, "epoch": 857} {"train_loss": -10.648393630981445, "global_step": 144042, "epoch": 857} {"train_loss": -10.454305648803711, "global_step": 144043, "epoch": 857} {"train_loss": -10.340194702148438, "global_step": 144044, "epoch": 857} {"train_loss": -10.447297096252441, "global_step": 144045, "epoch": 857} {"train_loss": -10.252433776855469, "global_step": 144046, "epoch": 857} {"train_loss": -10.426515579223633, "global_step": 144047, "epoch": 857} {"train_loss": -10.536333084106445, "global_step": 144048, "epoch": 857} {"train_loss": -10.51160717010498, "global_step": 144049, "epoch": 857} {"train_loss": -10.339128494262695, "global_step": 144050, "epoch": 857} {"train_loss": -10.482566833496094, "global_step": 144051, "epoch": 857} {"train_loss": -10.519392013549805, "global_step": 144052, "epoch": 857} {"train_loss": -10.529157638549805, "global_step": 144053, "epoch": 857} {"train_loss": -10.55573558807373, "global_step": 144054, "epoch": 857} {"train_loss": -10.277409553527832, "global_step": 144055, "epoch": 857} {"train_loss": -10.50943660736084, "global_step": 144056, "epoch": 857} {"train_loss": -10.603550910949707, "global_step": 144057, "epoch": 857} {"train_loss": -10.431805610656738, "global_step": 144058, "epoch": 857} {"train_loss": -10.549565315246582, "global_step": 144059, "epoch": 857} {"train_loss": -10.581796646118164, "global_step": 144060, "epoch": 857} {"train_loss": -10.666952133178711, "global_step": 144061, "epoch": 857} {"train_loss": -10.798501968383789, "global_step": 144062, "epoch": 857} {"train_loss": -10.705509185791016, "global_step": 144063, "epoch": 857} {"train_loss": -10.81019401550293, "global_step": 144064, "epoch": 857} {"train_loss": -10.599359512329102, "global_step": 144065, "epoch": 857} {"train_loss": -10.559406280517578, "global_step": 144066, "epoch": 857} {"train_loss": -10.589083671569824, "global_step": 144067, "epoch": 857} {"train_loss": -10.727104187011719, "global_step": 144068, "epoch": 857} {"train_loss": -10.77489948272705, "global_step": 144069, "epoch": 857} {"train_loss": -10.77145004272461, "global_step": 144070, "epoch": 857} {"train_loss": -10.648194313049316, "global_step": 144071, "epoch": 857} {"train_loss": -10.807816505432129, "global_step": 144072, "epoch": 857} {"train_loss": -10.765226364135742, "global_step": 144073, "epoch": 857} {"train_loss": -10.904022216796875, "global_step": 144074, "epoch": 857} {"train_loss": -10.876907348632812, "global_step": 144075, "epoch": 857} {"train_loss": -10.837028503417969, "global_step": 144076, "epoch": 857} {"train_loss": -10.977006912231445, "global_step": 144077, "epoch": 857} {"train_loss": -10.920936584472656, "global_step": 144078, "epoch": 857} {"train_loss": -11.110480308532715, "global_step": 144079, "epoch": 857} {"train_loss": -10.771029472351074, "global_step": 144080, "epoch": 857} {"train_loss": -11.088399887084961, "global_step": 144081, "epoch": 857} {"train_loss": -10.79050064086914, "global_step": 144082, "epoch": 857} {"train_loss": -11.168098449707031, "global_step": 144083, "epoch": 857} {"train_loss": -11.033848762512207, "global_step": 144084, "epoch": 857} {"train_loss": -10.829117774963379, "global_step": 144085, "epoch": 857} {"train_loss": -10.763615608215332, "global_step": 144086, "epoch": 857} {"train_loss": -10.893516540527344, "global_step": 144087, "epoch": 857} {"train_loss": -10.783748626708984, "global_step": 144088, "epoch": 857} {"train_loss": -11.052451133728027, "global_step": 144089, "epoch": 857} {"train_loss": -10.828985214233398, "global_step": 144090, "epoch": 857} {"train_loss": -11.032092094421387, "global_step": 144091, "epoch": 857} {"train_loss": -10.786260604858398, "global_step": 144092, "epoch": 857} {"train_loss": -10.723604202270508, "global_step": 144093, "epoch": 857} {"train_loss": -11.06951904296875, "global_step": 144094, "epoch": 857} {"train_loss": -10.72350025177002, "global_step": 144095, "epoch": 857} {"train_loss": -10.349931716918945, "global_step": 144096, "epoch": 857} {"train_loss": -10.38075065612793, "global_step": 144097, "epoch": 857} {"train_loss": -10.305044174194336, "global_step": 144098, "epoch": 857} {"train_loss": -10.37431526184082, "global_step": 144099, "epoch": 857} {"train_loss": -10.438982009887695, "global_step": 144100, "epoch": 857} {"train_loss": -10.41871452331543, "global_step": 144101, "epoch": 857} {"train_loss": -10.474203109741211, "global_step": 144102, "epoch": 857} {"train_loss": -10.732702255249023, "global_step": 144103, "epoch": 857} {"train_loss": -10.414517402648926, "global_step": 144104, "epoch": 857} {"train_loss": -10.352011680603027, "global_step": 144105, "epoch": 857} {"train_loss": -10.345765113830566, "global_step": 144106, "epoch": 857} {"train_loss": -10.778535842895508, "global_step": 144107, "epoch": 857} {"train_loss": -10.694937705993652, "global_step": 144108, "epoch": 857} {"train_loss": -10.061185836791992, "global_step": 144109, "epoch": 857} {"train_loss": -10.302972793579102, "global_step": 144110, "epoch": 857} {"train_loss": -10.323776245117188, "global_step": 144111, "epoch": 857} {"train_loss": -9.966327667236328, "global_step": 144112, "epoch": 857} {"train_loss": -10.108097076416016, "global_step": 144113, "epoch": 857} {"train_loss": -10.069831848144531, "global_step": 144114, "epoch": 857} {"train_loss": -10.017176628112793, "global_step": 144115, "epoch": 857} {"train_loss": -9.8604154586792, "global_step": 144116, "epoch": 857} {"train_loss": -10.132883071899414, "global_step": 144117, "epoch": 857} {"train_loss": -9.825037002563477, "global_step": 144118, "epoch": 857} {"train_loss": -9.961874961853027, "global_step": 144119, "epoch": 857} {"train_loss": -9.979560852050781, "global_step": 144120, "epoch": 857} {"train_loss": -9.368460655212402, "global_step": 144121, "epoch": 857} {"train_loss": -10.060622215270996, "global_step": 144122, "epoch": 857} {"train_loss": -9.609933853149414, "global_step": 144123, "epoch": 857} {"train_loss": -9.574577331542969, "global_step": 144124, "epoch": 857} {"train_loss": -9.80586051940918, "global_step": 144125, "epoch": 857} {"train_loss": -9.548288345336914, "global_step": 144126, "epoch": 857} {"train_loss": -9.880494117736816, "global_step": 144127, "epoch": 857} {"train_loss": -10.302755355834961, "global_step": 144128, "epoch": 857} {"train_loss": -9.687570571899414, "global_step": 144129, "epoch": 857} {"train_loss": -10.035770416259766, "global_step": 144130, "epoch": 857} {"train_loss": -10.625727653503418, "global_step": 144131, "epoch": 857} {"train_loss": -10.030252456665039, "global_step": 144132, "epoch": 857} {"train_loss": -10.103193283081055, "global_step": 144133, "epoch": 857} {"train_loss": -10.41807746887207, "global_step": 144134, "epoch": 857} {"train_loss": -10.124601364135742, "global_step": 144135, "epoch": 857} {"train_loss": -10.36876392364502, "global_step": 144136, "epoch": 857} {"train_loss": -10.349523544311523, "global_step": 144137, "epoch": 857} {"train_loss": -10.300132751464844, "global_step": 144138, "epoch": 857} {"train_loss": -9.985952377319336, "global_step": 144139, "epoch": 857} {"train_loss": -10.418192863464355, "global_step": 144140, "epoch": 857} {"train_loss": -10.231649398803711, "global_step": 144141, "epoch": 857} {"train_loss": -10.344297409057617, "global_step": 144142, "epoch": 857} {"train_loss": -10.453862343515668, "global_step": 144143, "epoch": 857, "val_loss": 230767.9375} {"train_loss": -10.370126724243164, "global_step": 144144, "epoch": 858} {"train_loss": -10.346494674682617, "global_step": 144145, "epoch": 858} {"train_loss": -10.412564277648926, "global_step": 144146, "epoch": 858} {"train_loss": -10.133943557739258, "global_step": 144147, "epoch": 858} {"train_loss": -10.430500984191895, "global_step": 144148, "epoch": 858} {"train_loss": -10.548816680908203, "global_step": 144149, "epoch": 858} {"train_loss": -10.508431434631348, "global_step": 144150, "epoch": 858} {"train_loss": -10.431568145751953, "global_step": 144151, "epoch": 858} {"train_loss": -10.662264823913574, "global_step": 144152, "epoch": 858} {"train_loss": -10.574604034423828, "global_step": 144153, "epoch": 858} {"train_loss": -10.521797180175781, "global_step": 144154, "epoch": 858} {"train_loss": -10.598474502563477, "global_step": 144155, "epoch": 858} {"train_loss": -10.598594665527344, "global_step": 144156, "epoch": 858} {"train_loss": -10.621404647827148, "global_step": 144157, "epoch": 858} {"train_loss": -10.551666259765625, "global_step": 144158, "epoch": 858} {"train_loss": -10.564592361450195, "global_step": 144159, "epoch": 858} {"train_loss": -10.453166961669922, "global_step": 144160, "epoch": 858} {"train_loss": -10.56126594543457, "global_step": 144161, "epoch": 858} {"train_loss": -10.797616004943848, "global_step": 144162, "epoch": 858} {"train_loss": -10.711686134338379, "global_step": 144163, "epoch": 858} {"train_loss": -10.894343376159668, "global_step": 144164, "epoch": 858} {"train_loss": -10.968799591064453, "global_step": 144165, "epoch": 858} {"train_loss": -10.795012474060059, "global_step": 144166, "epoch": 858} {"train_loss": -10.87321949005127, "global_step": 144167, "epoch": 858} {"train_loss": -10.883525848388672, "global_step": 144168, "epoch": 858} {"train_loss": -11.0261869430542, "global_step": 144169, "epoch": 858} {"train_loss": -10.96037483215332, "global_step": 144170, "epoch": 858} {"train_loss": -10.907466888427734, "global_step": 144171, "epoch": 858} {"train_loss": -10.851682662963867, "global_step": 144172, "epoch": 858} {"train_loss": -10.923047065734863, "global_step": 144173, "epoch": 858} {"train_loss": -10.802475929260254, "global_step": 144174, "epoch": 858} {"train_loss": -11.000782012939453, "global_step": 144175, "epoch": 858} {"train_loss": -10.925464630126953, "global_step": 144176, "epoch": 858} {"train_loss": -10.77501392364502, "global_step": 144177, "epoch": 858} {"train_loss": -10.64444351196289, "global_step": 144178, "epoch": 858} {"train_loss": -10.600753784179688, "global_step": 144179, "epoch": 858} {"train_loss": -10.294414520263672, "global_step": 144180, "epoch": 858} {"train_loss": -10.819902420043945, "global_step": 144181, "epoch": 858} {"train_loss": -10.482454299926758, "global_step": 144182, "epoch": 858} {"train_loss": -10.702154159545898, "global_step": 144183, "epoch": 858} {"train_loss": -10.848384857177734, "global_step": 144184, "epoch": 858} {"train_loss": -10.840851783752441, "global_step": 144185, "epoch": 858} {"train_loss": -10.951032638549805, "global_step": 144186, "epoch": 858} {"train_loss": -11.005105972290039, "global_step": 144187, "epoch": 858} {"train_loss": -10.653707504272461, "global_step": 144188, "epoch": 858} {"train_loss": -10.220203399658203, "global_step": 144189, "epoch": 858} {"train_loss": -10.862082481384277, "global_step": 144190, "epoch": 858} {"train_loss": -10.565016746520996, "global_step": 144191, "epoch": 858} {"train_loss": -10.945494651794434, "global_step": 144192, "epoch": 858} {"train_loss": -10.57807731628418, "global_step": 144193, "epoch": 858} {"train_loss": -10.868097305297852, "global_step": 144194, "epoch": 858} {"train_loss": -11.16450309753418, "global_step": 144195, "epoch": 858} {"train_loss": -10.884206771850586, "global_step": 144196, "epoch": 858} {"train_loss": -10.552480697631836, "global_step": 144197, "epoch": 858} {"train_loss": -10.950164794921875, "global_step": 144198, "epoch": 858} {"train_loss": -10.539617538452148, "global_step": 144199, "epoch": 858} {"train_loss": -10.71241569519043, "global_step": 144200, "epoch": 858} {"train_loss": -10.788396835327148, "global_step": 144201, "epoch": 858} {"train_loss": -10.712919235229492, "global_step": 144202, "epoch": 858} {"train_loss": -10.396529197692871, "global_step": 144203, "epoch": 858} {"train_loss": -9.828999519348145, "global_step": 144204, "epoch": 858} {"train_loss": -10.738924026489258, "global_step": 144205, "epoch": 858} {"train_loss": -10.16458797454834, "global_step": 144206, "epoch": 858} {"train_loss": -10.522140502929688, "global_step": 144207, "epoch": 858} {"train_loss": -10.731115341186523, "global_step": 144208, "epoch": 858} {"train_loss": -10.440958023071289, "global_step": 144209, "epoch": 858} {"train_loss": -10.716306686401367, "global_step": 144210, "epoch": 858} {"train_loss": -10.460206985473633, "global_step": 144211, "epoch": 858} {"train_loss": -10.323705673217773, "global_step": 144212, "epoch": 858} {"train_loss": -10.55864143371582, "global_step": 144213, "epoch": 858} {"train_loss": -10.553693771362305, "global_step": 144214, "epoch": 858} {"train_loss": -10.20595645904541, "global_step": 144215, "epoch": 858} {"train_loss": -10.901748657226562, "global_step": 144216, "epoch": 858} {"train_loss": -10.217531204223633, "global_step": 144217, "epoch": 858} {"train_loss": -10.176607131958008, "global_step": 144218, "epoch": 858} {"train_loss": -10.44357681274414, "global_step": 144219, "epoch": 858} {"train_loss": -10.373655319213867, "global_step": 144220, "epoch": 858} {"train_loss": -10.4428129196167, "global_step": 144221, "epoch": 858} {"train_loss": -10.63724136352539, "global_step": 144222, "epoch": 858} {"train_loss": -10.51164436340332, "global_step": 144223, "epoch": 858} {"train_loss": -10.56887149810791, "global_step": 144224, "epoch": 858} {"train_loss": -10.585421562194824, "global_step": 144225, "epoch": 858} {"train_loss": -10.669243812561035, "global_step": 144226, "epoch": 858} {"train_loss": -10.571417808532715, "global_step": 144227, "epoch": 858} {"train_loss": -10.80609130859375, "global_step": 144228, "epoch": 858} {"train_loss": -10.320125579833984, "global_step": 144229, "epoch": 858} {"train_loss": -10.450017929077148, "global_step": 144230, "epoch": 858} {"train_loss": -10.582653045654297, "global_step": 144231, "epoch": 858} {"train_loss": -10.67672348022461, "global_step": 144232, "epoch": 858} {"train_loss": -10.346023559570312, "global_step": 144233, "epoch": 858} {"train_loss": -10.240354537963867, "global_step": 144234, "epoch": 858} {"train_loss": -10.515789985656738, "global_step": 144235, "epoch": 858} {"train_loss": -10.106030464172363, "global_step": 144236, "epoch": 858} {"train_loss": -10.528759956359863, "global_step": 144237, "epoch": 858} {"train_loss": -10.298615455627441, "global_step": 144238, "epoch": 858} {"train_loss": -10.285172462463379, "global_step": 144239, "epoch": 858} {"train_loss": -10.5149564743042, "global_step": 144240, "epoch": 858} {"train_loss": -9.93405532836914, "global_step": 144241, "epoch": 858} {"train_loss": -10.356761932373047, "global_step": 144242, "epoch": 858} {"train_loss": -10.32406234741211, "global_step": 144243, "epoch": 858} {"train_loss": -10.44631576538086, "global_step": 144244, "epoch": 858} {"train_loss": -10.529449462890625, "global_step": 144245, "epoch": 858} {"train_loss": -10.364094734191895, "global_step": 144246, "epoch": 858} {"train_loss": -10.480254173278809, "global_step": 144247, "epoch": 858} {"train_loss": -10.57063102722168, "global_step": 144248, "epoch": 858} {"train_loss": -10.497148513793945, "global_step": 144249, "epoch": 858} {"train_loss": -10.697430610656738, "global_step": 144250, "epoch": 858} {"train_loss": -10.681045532226562, "global_step": 144251, "epoch": 858} {"train_loss": -10.504266738891602, "global_step": 144252, "epoch": 858} {"train_loss": -10.601670265197754, "global_step": 144253, "epoch": 858} {"train_loss": -10.410703659057617, "global_step": 144254, "epoch": 858} {"train_loss": -10.59768295288086, "global_step": 144255, "epoch": 858} {"train_loss": -10.647823333740234, "global_step": 144256, "epoch": 858} {"train_loss": -10.441699981689453, "global_step": 144257, "epoch": 858} {"train_loss": -10.73251724243164, "global_step": 144258, "epoch": 858} {"train_loss": -10.630122184753418, "global_step": 144259, "epoch": 858} {"train_loss": -10.733596801757812, "global_step": 144260, "epoch": 858} {"train_loss": -10.488037109375, "global_step": 144261, "epoch": 858} {"train_loss": -10.741368293762207, "global_step": 144262, "epoch": 858} {"train_loss": -10.42599868774414, "global_step": 144263, "epoch": 858} {"train_loss": -10.690543174743652, "global_step": 144264, "epoch": 858} {"train_loss": -10.586772918701172, "global_step": 144265, "epoch": 858} {"train_loss": -10.709648132324219, "global_step": 144266, "epoch": 858} {"train_loss": -10.676607131958008, "global_step": 144267, "epoch": 858} {"train_loss": -10.55624008178711, "global_step": 144268, "epoch": 858} {"train_loss": -10.765789985656738, "global_step": 144269, "epoch": 858} {"train_loss": -10.65931510925293, "global_step": 144270, "epoch": 858} {"train_loss": -10.713855743408203, "global_step": 144271, "epoch": 858} {"train_loss": -10.80229377746582, "global_step": 144272, "epoch": 858} {"train_loss": -10.4514799118042, "global_step": 144273, "epoch": 858} {"train_loss": -10.891918182373047, "global_step": 144274, "epoch": 858} {"train_loss": -10.501322746276855, "global_step": 144275, "epoch": 858} {"train_loss": -10.922368049621582, "global_step": 144276, "epoch": 858} {"train_loss": -10.773862838745117, "global_step": 144277, "epoch": 858} {"train_loss": -10.385000228881836, "global_step": 144278, "epoch": 858} {"train_loss": -10.766590118408203, "global_step": 144279, "epoch": 858} {"train_loss": -10.626352310180664, "global_step": 144280, "epoch": 858} {"train_loss": -10.705732345581055, "global_step": 144281, "epoch": 858} {"train_loss": -10.719715118408203, "global_step": 144282, "epoch": 858} {"train_loss": -10.410446166992188, "global_step": 144283, "epoch": 858} {"train_loss": -10.792895317077637, "global_step": 144284, "epoch": 858} {"train_loss": -10.269523620605469, "global_step": 144285, "epoch": 858} {"train_loss": -10.045782089233398, "global_step": 144286, "epoch": 858} {"train_loss": -10.689444541931152, "global_step": 144287, "epoch": 858} {"train_loss": -10.35649299621582, "global_step": 144288, "epoch": 858} {"train_loss": -10.422731399536133, "global_step": 144289, "epoch": 858} {"train_loss": -10.906649589538574, "global_step": 144290, "epoch": 858} {"train_loss": -10.31065559387207, "global_step": 144291, "epoch": 858} {"train_loss": -10.735563278198242, "global_step": 144292, "epoch": 858} {"train_loss": -10.415157318115234, "global_step": 144293, "epoch": 858} {"train_loss": -10.393732070922852, "global_step": 144294, "epoch": 858} {"train_loss": -10.69031810760498, "global_step": 144295, "epoch": 858} {"train_loss": -10.49255084991455, "global_step": 144296, "epoch": 858} {"train_loss": -10.813530921936035, "global_step": 144297, "epoch": 858} {"train_loss": -10.352663040161133, "global_step": 144298, "epoch": 858} {"train_loss": -10.851780891418457, "global_step": 144299, "epoch": 858} {"train_loss": -10.19797134399414, "global_step": 144300, "epoch": 858} {"train_loss": -10.706862449645996, "global_step": 144301, "epoch": 858} {"train_loss": -10.553606033325195, "global_step": 144302, "epoch": 858} {"train_loss": -10.38895320892334, "global_step": 144303, "epoch": 858} {"train_loss": -10.44772720336914, "global_step": 144304, "epoch": 858} {"train_loss": -10.249699592590332, "global_step": 144305, "epoch": 858} {"train_loss": -10.564403533935547, "global_step": 144306, "epoch": 858} {"train_loss": -10.4212064743042, "global_step": 144307, "epoch": 858} {"train_loss": -10.409821510314941, "global_step": 144308, "epoch": 858} {"train_loss": -10.692062377929688, "global_step": 144309, "epoch": 858} {"train_loss": -10.1959228515625, "global_step": 144310, "epoch": 858} {"train_loss": -10.580628139632088, "global_step": 144311, "epoch": 858, "val_loss": 228932.234375} {"train_loss": -10.427071571350098, "global_step": 144312, "epoch": 859} {"train_loss": -10.838478088378906, "global_step": 144313, "epoch": 859} {"train_loss": -10.497668266296387, "global_step": 144314, "epoch": 859} {"train_loss": -10.301188468933105, "global_step": 144315, "epoch": 859} {"train_loss": -10.551032066345215, "global_step": 144316, "epoch": 859} {"train_loss": -10.302667617797852, "global_step": 144317, "epoch": 859} {"train_loss": -10.319705963134766, "global_step": 144318, "epoch": 859} {"train_loss": -10.483563423156738, "global_step": 144319, "epoch": 859} {"train_loss": -10.631397247314453, "global_step": 144320, "epoch": 859} {"train_loss": -10.628667831420898, "global_step": 144321, "epoch": 859} {"train_loss": -10.341994285583496, "global_step": 144322, "epoch": 859} {"train_loss": -10.362946510314941, "global_step": 144323, "epoch": 859} {"train_loss": -10.50462532043457, "global_step": 144324, "epoch": 859} {"train_loss": -10.608059883117676, "global_step": 144325, "epoch": 859} {"train_loss": -10.588432312011719, "global_step": 144326, "epoch": 859} {"train_loss": -10.293147087097168, "global_step": 144327, "epoch": 859} {"train_loss": -10.882826805114746, "global_step": 144328, "epoch": 859} {"train_loss": -10.68497085571289, "global_step": 144329, "epoch": 859} {"train_loss": -10.720884323120117, "global_step": 144330, "epoch": 859} {"train_loss": -10.478166580200195, "global_step": 144331, "epoch": 859} {"train_loss": -10.876285552978516, "global_step": 144332, "epoch": 859} {"train_loss": -10.616523742675781, "global_step": 144333, "epoch": 859} {"train_loss": -10.676623344421387, "global_step": 144334, "epoch": 859} {"train_loss": -10.57441520690918, "global_step": 144335, "epoch": 859} {"train_loss": -10.768024444580078, "global_step": 144336, "epoch": 859} {"train_loss": -10.583284378051758, "global_step": 144337, "epoch": 859} {"train_loss": -10.729629516601562, "global_step": 144338, "epoch": 859} {"train_loss": -10.532852172851562, "global_step": 144339, "epoch": 859} {"train_loss": -10.621904373168945, "global_step": 144340, "epoch": 859} {"train_loss": -10.740663528442383, "global_step": 144341, "epoch": 859} {"train_loss": -10.085036277770996, "global_step": 144342, "epoch": 859} {"train_loss": -10.46240520477295, "global_step": 144343, "epoch": 859} {"train_loss": -10.458955764770508, "global_step": 144344, "epoch": 859} {"train_loss": -10.573051452636719, "global_step": 144345, "epoch": 859} {"train_loss": -10.766767501831055, "global_step": 144346, "epoch": 859} {"train_loss": -10.624008178710938, "global_step": 144347, "epoch": 859} {"train_loss": -10.53707504272461, "global_step": 144348, "epoch": 859} {"train_loss": -10.681095123291016, "global_step": 144349, "epoch": 859} {"train_loss": -10.517807006835938, "global_step": 144350, "epoch": 859} {"train_loss": -10.576403617858887, "global_step": 144351, "epoch": 859} {"train_loss": -10.578020095825195, "global_step": 144352, "epoch": 859} {"train_loss": -10.751199722290039, "global_step": 144353, "epoch": 859} {"train_loss": -10.33407974243164, "global_step": 144354, "epoch": 859} {"train_loss": -10.616900444030762, "global_step": 144355, "epoch": 859} {"train_loss": -10.71464729309082, "global_step": 144356, "epoch": 859} {"train_loss": -10.575308799743652, "global_step": 144357, "epoch": 859} {"train_loss": -10.329243659973145, "global_step": 144358, "epoch": 859} {"train_loss": -10.602621078491211, "global_step": 144359, "epoch": 859} {"train_loss": -10.144737243652344, "global_step": 144360, "epoch": 859} {"train_loss": -10.747733116149902, "global_step": 144361, "epoch": 859} {"train_loss": -9.63267707824707, "global_step": 144362, "epoch": 859} {"train_loss": -10.509125709533691, "global_step": 144363, "epoch": 859} {"train_loss": -10.743753433227539, "global_step": 144364, "epoch": 859} {"train_loss": -10.28346061706543, "global_step": 144365, "epoch": 859} {"train_loss": -10.699893951416016, "global_step": 144366, "epoch": 859} {"train_loss": -10.550790786743164, "global_step": 144367, "epoch": 859} {"train_loss": -10.366189002990723, "global_step": 144368, "epoch": 859} {"train_loss": -10.461648941040039, "global_step": 144369, "epoch": 859} {"train_loss": -10.262380599975586, "global_step": 144370, "epoch": 859} {"train_loss": -10.05296802520752, "global_step": 144371, "epoch": 859} {"train_loss": -10.639094352722168, "global_step": 144372, "epoch": 859} {"train_loss": -9.961583137512207, "global_step": 144373, "epoch": 859} {"train_loss": -10.419121742248535, "global_step": 144374, "epoch": 859} {"train_loss": -9.94974136352539, "global_step": 144375, "epoch": 859} {"train_loss": -10.237071990966797, "global_step": 144376, "epoch": 859} {"train_loss": -9.766546249389648, "global_step": 144377, "epoch": 859} {"train_loss": -10.407855987548828, "global_step": 144378, "epoch": 859} {"train_loss": -9.254335403442383, "global_step": 144379, "epoch": 859} {"train_loss": -10.068758010864258, "global_step": 144380, "epoch": 859} {"train_loss": -9.32773208618164, "global_step": 144381, "epoch": 859} {"train_loss": -9.288273811340332, "global_step": 144382, "epoch": 859} {"train_loss": -9.074339866638184, "global_step": 144383, "epoch": 859} {"train_loss": -10.110260009765625, "global_step": 144384, "epoch": 859} {"train_loss": -8.854496002197266, "global_step": 144385, "epoch": 859} {"train_loss": -9.652729034423828, "global_step": 144386, "epoch": 859} {"train_loss": -9.860292434692383, "global_step": 144387, "epoch": 859} {"train_loss": -9.837684631347656, "global_step": 144388, "epoch": 859} {"train_loss": -10.575257301330566, "global_step": 144389, "epoch": 859} {"train_loss": -9.193687438964844, "global_step": 144390, "epoch": 859} {"train_loss": -10.58761215209961, "global_step": 144391, "epoch": 859} {"train_loss": -9.823823928833008, "global_step": 144392, "epoch": 859} {"train_loss": -10.235713005065918, "global_step": 144393, "epoch": 859} {"train_loss": -10.069679260253906, "global_step": 144394, "epoch": 859} {"train_loss": -10.101875305175781, "global_step": 144395, "epoch": 859} {"train_loss": -10.435186386108398, "global_step": 144396, "epoch": 859} {"train_loss": -10.28742504119873, "global_step": 144397, "epoch": 859} {"train_loss": -10.559590339660645, "global_step": 144398, "epoch": 859} {"train_loss": -10.106651306152344, "global_step": 144399, "epoch": 859} {"train_loss": -10.323065757751465, "global_step": 144400, "epoch": 859} {"train_loss": -10.2919282913208, "global_step": 144401, "epoch": 859} {"train_loss": -10.253337860107422, "global_step": 144402, "epoch": 859} {"train_loss": -10.456548690795898, "global_step": 144403, "epoch": 859} {"train_loss": -10.38135814666748, "global_step": 144404, "epoch": 859} {"train_loss": -10.46109390258789, "global_step": 144405, "epoch": 859} {"train_loss": -10.534473419189453, "global_step": 144406, "epoch": 859} {"train_loss": -10.637260437011719, "global_step": 144407, "epoch": 859} {"train_loss": -10.47711181640625, "global_step": 144408, "epoch": 859} {"train_loss": -10.702085494995117, "global_step": 144409, "epoch": 859} {"train_loss": -10.54111385345459, "global_step": 144410, "epoch": 859} {"train_loss": -10.614206314086914, "global_step": 144411, "epoch": 859} {"train_loss": -10.527961730957031, "global_step": 144412, "epoch": 859} {"train_loss": -10.763324737548828, "global_step": 144413, "epoch": 859} {"train_loss": -10.352121353149414, "global_step": 144414, "epoch": 859} {"train_loss": -10.710267066955566, "global_step": 144415, "epoch": 859} {"train_loss": -10.468442916870117, "global_step": 144416, "epoch": 859} {"train_loss": -10.651323318481445, "global_step": 144417, "epoch": 859} {"train_loss": -10.919719696044922, "global_step": 144418, "epoch": 859} {"train_loss": -10.533105850219727, "global_step": 144419, "epoch": 859} {"train_loss": -10.604631423950195, "global_step": 144420, "epoch": 859} {"train_loss": -10.581178665161133, "global_step": 144421, "epoch": 859} {"train_loss": -10.859577178955078, "global_step": 144422, "epoch": 859} {"train_loss": -10.640012741088867, "global_step": 144423, "epoch": 859} {"train_loss": -10.912703514099121, "global_step": 144424, "epoch": 859} {"train_loss": -10.867767333984375, "global_step": 144425, "epoch": 859} {"train_loss": -10.716745376586914, "global_step": 144426, "epoch": 859} {"train_loss": -10.853955268859863, "global_step": 144427, "epoch": 859} {"train_loss": -10.962488174438477, "global_step": 144428, "epoch": 859} {"train_loss": -10.828544616699219, "global_step": 144429, "epoch": 859} {"train_loss": -11.006623268127441, "global_step": 144430, "epoch": 859} {"train_loss": -11.018251419067383, "global_step": 144431, "epoch": 859} {"train_loss": -10.879989624023438, "global_step": 144432, "epoch": 859} {"train_loss": -11.029655456542969, "global_step": 144433, "epoch": 859} {"train_loss": -10.842361450195312, "global_step": 144434, "epoch": 859} {"train_loss": -10.827672004699707, "global_step": 144435, "epoch": 859} {"train_loss": -10.923322677612305, "global_step": 144436, "epoch": 859} {"train_loss": -11.049127578735352, "global_step": 144437, "epoch": 859} {"train_loss": -10.570104598999023, "global_step": 144438, "epoch": 859} {"train_loss": -10.220588684082031, "global_step": 144439, "epoch": 859} {"train_loss": -10.505168914794922, "global_step": 144440, "epoch": 859} {"train_loss": -10.484630584716797, "global_step": 144441, "epoch": 859} {"train_loss": -10.926706314086914, "global_step": 144442, "epoch": 859} {"train_loss": -10.798250198364258, "global_step": 144443, "epoch": 859} {"train_loss": -10.421512603759766, "global_step": 144444, "epoch": 859} {"train_loss": -10.539825439453125, "global_step": 144445, "epoch": 859} {"train_loss": -9.727579116821289, "global_step": 144446, "epoch": 859} {"train_loss": -10.389469146728516, "global_step": 144447, "epoch": 859} {"train_loss": -9.847448348999023, "global_step": 144448, "epoch": 859} {"train_loss": -10.30938720703125, "global_step": 144449, "epoch": 859} {"train_loss": -9.702192306518555, "global_step": 144450, "epoch": 859} {"train_loss": -10.607735633850098, "global_step": 144451, "epoch": 859} {"train_loss": -10.096193313598633, "global_step": 144452, "epoch": 859} {"train_loss": -9.89785385131836, "global_step": 144453, "epoch": 859} {"train_loss": -10.256200790405273, "global_step": 144454, "epoch": 859} {"train_loss": -10.180217742919922, "global_step": 144455, "epoch": 859} {"train_loss": -10.110733032226562, "global_step": 144456, "epoch": 859} {"train_loss": -10.196402549743652, "global_step": 144457, "epoch": 859} {"train_loss": -10.029054641723633, "global_step": 144458, "epoch": 859} {"train_loss": -10.391143798828125, "global_step": 144459, "epoch": 859} {"train_loss": -10.461053848266602, "global_step": 144460, "epoch": 859} {"train_loss": -10.69687271118164, "global_step": 144461, "epoch": 859} {"train_loss": -10.325456619262695, "global_step": 144462, "epoch": 859} {"train_loss": -10.494378089904785, "global_step": 144463, "epoch": 859} {"train_loss": -10.80203628540039, "global_step": 144464, "epoch": 859} {"train_loss": -10.666069030761719, "global_step": 144465, "epoch": 859} {"train_loss": -10.416830062866211, "global_step": 144466, "epoch": 859} {"train_loss": -10.666618347167969, "global_step": 144467, "epoch": 859} {"train_loss": -10.856603622436523, "global_step": 144468, "epoch": 859} {"train_loss": -10.960731506347656, "global_step": 144469, "epoch": 859} {"train_loss": -10.68486213684082, "global_step": 144470, "epoch": 859} {"train_loss": -11.040843963623047, "global_step": 144471, "epoch": 859} {"train_loss": -10.832849502563477, "global_step": 144472, "epoch": 859} {"train_loss": -10.662068367004395, "global_step": 144473, "epoch": 859} {"train_loss": -10.925215721130371, "global_step": 144474, "epoch": 859} {"train_loss": -10.856788635253906, "global_step": 144475, "epoch": 859} {"train_loss": -10.85434341430664, "global_step": 144476, "epoch": 859} {"train_loss": -10.737394332885742, "global_step": 144477, "epoch": 859} {"train_loss": -10.893573760986328, "global_step": 144478, "epoch": 859} {"train_loss": -10.457610385758537, "global_step": 144479, "epoch": 859, "val_loss": 225536.015625} {"train_loss": -10.95175838470459, "global_step": 144480, "epoch": 860} {"train_loss": -10.658797264099121, "global_step": 144481, "epoch": 860} {"train_loss": -10.929316520690918, "global_step": 144482, "epoch": 860} {"train_loss": -10.84006118774414, "global_step": 144483, "epoch": 860} {"train_loss": -10.97193717956543, "global_step": 144484, "epoch": 860} {"train_loss": -10.86523151397705, "global_step": 144485, "epoch": 860} {"train_loss": -10.879985809326172, "global_step": 144486, "epoch": 860} {"train_loss": -10.664163589477539, "global_step": 144487, "epoch": 860} {"train_loss": -10.736858367919922, "global_step": 144488, "epoch": 860} {"train_loss": -10.860795974731445, "global_step": 144489, "epoch": 860} {"train_loss": -10.698407173156738, "global_step": 144490, "epoch": 860} {"train_loss": -11.06679630279541, "global_step": 144491, "epoch": 860} {"train_loss": -10.67037296295166, "global_step": 144492, "epoch": 860} {"train_loss": -10.63581371307373, "global_step": 144493, "epoch": 860} {"train_loss": -10.785682678222656, "global_step": 144494, "epoch": 860} {"train_loss": -10.426704406738281, "global_step": 144495, "epoch": 860} {"train_loss": -10.795355796813965, "global_step": 144496, "epoch": 860} {"train_loss": -10.15092658996582, "global_step": 144497, "epoch": 860} {"train_loss": -10.46288776397705, "global_step": 144498, "epoch": 860} {"train_loss": -10.599004745483398, "global_step": 144499, "epoch": 860} {"train_loss": -10.73946762084961, "global_step": 144500, "epoch": 860} {"train_loss": -9.856316566467285, "global_step": 144501, "epoch": 860} {"train_loss": -10.622432708740234, "global_step": 144502, "epoch": 860} {"train_loss": -9.327584266662598, "global_step": 144503, "epoch": 860} {"train_loss": -10.413870811462402, "global_step": 144504, "epoch": 860} {"train_loss": -10.406267166137695, "global_step": 144505, "epoch": 860} {"train_loss": -10.388710021972656, "global_step": 144506, "epoch": 860} {"train_loss": -10.180618286132812, "global_step": 144507, "epoch": 860} {"train_loss": -10.617820739746094, "global_step": 144508, "epoch": 860} {"train_loss": -10.113641738891602, "global_step": 144509, "epoch": 860} {"train_loss": -10.071346282958984, "global_step": 144510, "epoch": 860} {"train_loss": -10.373588562011719, "global_step": 144511, "epoch": 860} {"train_loss": -9.72085952758789, "global_step": 144512, "epoch": 860} {"train_loss": -10.403496742248535, "global_step": 144513, "epoch": 860} {"train_loss": -10.034202575683594, "global_step": 144514, "epoch": 860} {"train_loss": -10.40955924987793, "global_step": 144515, "epoch": 860} {"train_loss": -10.553083419799805, "global_step": 144516, "epoch": 860} {"train_loss": -10.312786102294922, "global_step": 144517, "epoch": 860} {"train_loss": -10.165456771850586, "global_step": 144518, "epoch": 860} {"train_loss": -10.194531440734863, "global_step": 144519, "epoch": 860} {"train_loss": -10.51461124420166, "global_step": 144520, "epoch": 860} {"train_loss": -10.095935821533203, "global_step": 144521, "epoch": 860} {"train_loss": -10.58523178100586, "global_step": 144522, "epoch": 860} {"train_loss": -9.987991333007812, "global_step": 144523, "epoch": 860} {"train_loss": -10.64482307434082, "global_step": 144524, "epoch": 860} {"train_loss": -10.499363899230957, "global_step": 144525, "epoch": 860} {"train_loss": -10.766899108886719, "global_step": 144526, "epoch": 860} {"train_loss": -10.767377853393555, "global_step": 144527, "epoch": 860} {"train_loss": -10.598230361938477, "global_step": 144528, "epoch": 860} {"train_loss": -10.72070598602295, "global_step": 144529, "epoch": 860} {"train_loss": -10.67221450805664, "global_step": 144530, "epoch": 860} {"train_loss": -10.847087860107422, "global_step": 144531, "epoch": 860} {"train_loss": -10.771888732910156, "global_step": 144532, "epoch": 860} {"train_loss": -10.750544548034668, "global_step": 144533, "epoch": 860} {"train_loss": -10.662120819091797, "global_step": 144534, "epoch": 860} {"train_loss": -10.879508972167969, "global_step": 144535, "epoch": 860} {"train_loss": -10.74917984008789, "global_step": 144536, "epoch": 860} {"train_loss": -10.836080551147461, "global_step": 144537, "epoch": 860} {"train_loss": -10.605396270751953, "global_step": 144538, "epoch": 860} {"train_loss": -10.882783889770508, "global_step": 144539, "epoch": 860} {"train_loss": -10.830537796020508, "global_step": 144540, "epoch": 860} {"train_loss": -10.694948196411133, "global_step": 144541, "epoch": 860} {"train_loss": -10.956016540527344, "global_step": 144542, "epoch": 860} {"train_loss": -10.796377182006836, "global_step": 144543, "epoch": 860} {"train_loss": -10.920966148376465, "global_step": 144544, "epoch": 860} {"train_loss": -10.864809036254883, "global_step": 144545, "epoch": 860} {"train_loss": -10.846474647521973, "global_step": 144546, "epoch": 860} {"train_loss": -10.959051132202148, "global_step": 144547, "epoch": 860} {"train_loss": -10.77383041381836, "global_step": 144548, "epoch": 860} {"train_loss": -10.84703254699707, "global_step": 144549, "epoch": 860} {"train_loss": -10.860406875610352, "global_step": 144550, "epoch": 860} {"train_loss": -10.633779525756836, "global_step": 144551, "epoch": 860} {"train_loss": -10.65241813659668, "global_step": 144552, "epoch": 860} {"train_loss": -11.019018173217773, "global_step": 144553, "epoch": 860} {"train_loss": -10.869376182556152, "global_step": 144554, "epoch": 860} {"train_loss": -11.081624031066895, "global_step": 144555, "epoch": 860} {"train_loss": -11.010025024414062, "global_step": 144556, "epoch": 860} {"train_loss": -10.915102005004883, "global_step": 144557, "epoch": 860} {"train_loss": -10.807846069335938, "global_step": 144558, "epoch": 860} {"train_loss": -10.711255073547363, "global_step": 144559, "epoch": 860} {"train_loss": -10.813828468322754, "global_step": 144560, "epoch": 860} {"train_loss": -11.043224334716797, "global_step": 144561, "epoch": 860} {"train_loss": -10.769631385803223, "global_step": 144562, "epoch": 860} {"train_loss": -10.591026306152344, "global_step": 144563, "epoch": 860} {"train_loss": -10.572604179382324, "global_step": 144564, "epoch": 860} {"train_loss": -10.908447265625, "global_step": 144565, "epoch": 860} {"train_loss": -10.890626907348633, "global_step": 144566, "epoch": 860} {"train_loss": -10.920431137084961, "global_step": 144567, "epoch": 860} {"train_loss": -10.844121932983398, "global_step": 144568, "epoch": 860} {"train_loss": -10.652458190917969, "global_step": 144569, "epoch": 860} {"train_loss": -10.360081672668457, "global_step": 144570, "epoch": 860} {"train_loss": -9.859079360961914, "global_step": 144571, "epoch": 860} {"train_loss": -10.789567947387695, "global_step": 144572, "epoch": 860} {"train_loss": -10.096656799316406, "global_step": 144573, "epoch": 860} {"train_loss": -9.590599060058594, "global_step": 144574, "epoch": 860} {"train_loss": -10.763517379760742, "global_step": 144575, "epoch": 860} {"train_loss": -9.733589172363281, "global_step": 144576, "epoch": 860} {"train_loss": -9.576208114624023, "global_step": 144577, "epoch": 860} {"train_loss": -10.422769546508789, "global_step": 144578, "epoch": 860} {"train_loss": -8.382024765014648, "global_step": 144579, "epoch": 860} {"train_loss": -9.615804672241211, "global_step": 144580, "epoch": 860} {"train_loss": -9.290489196777344, "global_step": 144581, "epoch": 860} {"train_loss": -9.10458755493164, "global_step": 144582, "epoch": 860} {"train_loss": -9.580633163452148, "global_step": 144583, "epoch": 860} {"train_loss": -9.950736999511719, "global_step": 144584, "epoch": 860} {"train_loss": -10.092161178588867, "global_step": 144585, "epoch": 860} {"train_loss": -9.917736053466797, "global_step": 144586, "epoch": 860} {"train_loss": -10.021702766418457, "global_step": 144587, "epoch": 860} {"train_loss": -10.474897384643555, "global_step": 144588, "epoch": 860} {"train_loss": -10.158365249633789, "global_step": 144589, "epoch": 860} {"train_loss": -10.456624984741211, "global_step": 144590, "epoch": 860} {"train_loss": -10.254030227661133, "global_step": 144591, "epoch": 860} {"train_loss": -10.215677261352539, "global_step": 144592, "epoch": 860} {"train_loss": -10.000579833984375, "global_step": 144593, "epoch": 860} {"train_loss": -10.480493545532227, "global_step": 144594, "epoch": 860} {"train_loss": -10.252033233642578, "global_step": 144595, "epoch": 860} {"train_loss": -10.090414047241211, "global_step": 144596, "epoch": 860} {"train_loss": -10.073014259338379, "global_step": 144597, "epoch": 860} {"train_loss": -10.107437133789062, "global_step": 144598, "epoch": 860} {"train_loss": -10.458169937133789, "global_step": 144599, "epoch": 860} {"train_loss": -9.951255798339844, "global_step": 144600, "epoch": 860} {"train_loss": -10.349239349365234, "global_step": 144601, "epoch": 860} {"train_loss": -10.307835578918457, "global_step": 144602, "epoch": 860} {"train_loss": -10.18069839477539, "global_step": 144603, "epoch": 860} {"train_loss": -10.36467170715332, "global_step": 144604, "epoch": 860} {"train_loss": -10.21946907043457, "global_step": 144605, "epoch": 860} {"train_loss": -10.346571922302246, "global_step": 144606, "epoch": 860} {"train_loss": -10.369858741760254, "global_step": 144607, "epoch": 860} {"train_loss": -10.158547401428223, "global_step": 144608, "epoch": 860} {"train_loss": -10.355216979980469, "global_step": 144609, "epoch": 860} {"train_loss": -10.287654876708984, "global_step": 144610, "epoch": 860} {"train_loss": -10.569761276245117, "global_step": 144611, "epoch": 860} {"train_loss": -10.399120330810547, "global_step": 144612, "epoch": 860} {"train_loss": -10.416568756103516, "global_step": 144613, "epoch": 860} {"train_loss": -10.679891586303711, "global_step": 144614, "epoch": 860} {"train_loss": -10.42853832244873, "global_step": 144615, "epoch": 860} {"train_loss": -10.591391563415527, "global_step": 144616, "epoch": 860} {"train_loss": -10.44621467590332, "global_step": 144617, "epoch": 860} {"train_loss": -10.725112915039062, "global_step": 144618, "epoch": 860} {"train_loss": -10.596657752990723, "global_step": 144619, "epoch": 860} {"train_loss": -10.557720184326172, "global_step": 144620, "epoch": 860} {"train_loss": -10.591287612915039, "global_step": 144621, "epoch": 860} {"train_loss": -10.618234634399414, "global_step": 144622, "epoch": 860} {"train_loss": -10.671712875366211, "global_step": 144623, "epoch": 860} {"train_loss": -10.341079711914062, "global_step": 144624, "epoch": 860} {"train_loss": -10.708681106567383, "global_step": 144625, "epoch": 860} {"train_loss": -10.778093338012695, "global_step": 144626, "epoch": 860} {"train_loss": -10.363775253295898, "global_step": 144627, "epoch": 860} {"train_loss": -10.640335083007812, "global_step": 144628, "epoch": 860} {"train_loss": -10.581912994384766, "global_step": 144629, "epoch": 860} {"train_loss": -10.587799072265625, "global_step": 144630, "epoch": 860} {"train_loss": -10.637615203857422, "global_step": 144631, "epoch": 860} {"train_loss": -10.787240028381348, "global_step": 144632, "epoch": 860} {"train_loss": -10.817728042602539, "global_step": 144633, "epoch": 860} {"train_loss": -10.681428909301758, "global_step": 144634, "epoch": 860} {"train_loss": -10.411172866821289, "global_step": 144635, "epoch": 860} {"train_loss": -10.715316772460938, "global_step": 144636, "epoch": 860} {"train_loss": -10.514759063720703, "global_step": 144637, "epoch": 860} {"train_loss": -10.707757949829102, "global_step": 144638, "epoch": 860} {"train_loss": -10.34086799621582, "global_step": 144639, "epoch": 860} {"train_loss": -10.667718887329102, "global_step": 144640, "epoch": 860} {"train_loss": -10.787500381469727, "global_step": 144641, "epoch": 860} {"train_loss": -10.524872779846191, "global_step": 144642, "epoch": 860} {"train_loss": -10.920069694519043, "global_step": 144643, "epoch": 860} {"train_loss": -10.761395454406738, "global_step": 144644, "epoch": 860} {"train_loss": -10.852275848388672, "global_step": 144645, "epoch": 860} {"train_loss": -10.615396499633789, "global_step": 144646, "epoch": 860} {"train_loss": -10.494742739768256, "global_step": 144647, "epoch": 860, "val_loss": 225132.65625, "train_action_mse_error": 1.8052918910980225} {"train_loss": -10.916566848754883, "global_step": 144648, "epoch": 861} {"train_loss": -10.429130554199219, "global_step": 144649, "epoch": 861} {"train_loss": -10.914459228515625, "global_step": 144650, "epoch": 861} {"train_loss": -10.871270179748535, "global_step": 144651, "epoch": 861} {"train_loss": -10.77371597290039, "global_step": 144652, "epoch": 861} {"train_loss": -11.008113861083984, "global_step": 144653, "epoch": 861} {"train_loss": -10.986225128173828, "global_step": 144654, "epoch": 861} {"train_loss": -10.915630340576172, "global_step": 144655, "epoch": 861} {"train_loss": -10.792448043823242, "global_step": 144656, "epoch": 861} {"train_loss": -10.886938095092773, "global_step": 144657, "epoch": 861} {"train_loss": -10.898795127868652, "global_step": 144658, "epoch": 861} {"train_loss": -10.94497013092041, "global_step": 144659, "epoch": 861} {"train_loss": -10.880414009094238, "global_step": 144660, "epoch": 861} {"train_loss": -10.941664695739746, "global_step": 144661, "epoch": 861} {"train_loss": -11.107230186462402, "global_step": 144662, "epoch": 861} {"train_loss": -10.660541534423828, "global_step": 144663, "epoch": 861} {"train_loss": -11.038835525512695, "global_step": 144664, "epoch": 861} {"train_loss": -11.161091804504395, "global_step": 144665, "epoch": 861} {"train_loss": -10.883199691772461, "global_step": 144666, "epoch": 861} {"train_loss": -10.94347095489502, "global_step": 144667, "epoch": 861} {"train_loss": -10.78058910369873, "global_step": 144668, "epoch": 861} {"train_loss": -11.057502746582031, "global_step": 144669, "epoch": 861} {"train_loss": -10.713835716247559, "global_step": 144670, "epoch": 861} {"train_loss": -10.859821319580078, "global_step": 144671, "epoch": 861} {"train_loss": -10.591597557067871, "global_step": 144672, "epoch": 861} {"train_loss": -10.663934707641602, "global_step": 144673, "epoch": 861} {"train_loss": -10.844795227050781, "global_step": 144674, "epoch": 861} {"train_loss": -11.129631042480469, "global_step": 144675, "epoch": 861} {"train_loss": -10.909245491027832, "global_step": 144676, "epoch": 861} {"train_loss": -10.903670310974121, "global_step": 144677, "epoch": 861} {"train_loss": -10.984579086303711, "global_step": 144678, "epoch": 861} {"train_loss": -10.877095222473145, "global_step": 144679, "epoch": 861} {"train_loss": -10.669748306274414, "global_step": 144680, "epoch": 861} {"train_loss": -10.91913890838623, "global_step": 144681, "epoch": 861} {"train_loss": -10.849759101867676, "global_step": 144682, "epoch": 861} {"train_loss": -10.4470796585083, "global_step": 144683, "epoch": 861} {"train_loss": -10.586445808410645, "global_step": 144684, "epoch": 861} {"train_loss": -10.98945426940918, "global_step": 144685, "epoch": 861} {"train_loss": -10.811635971069336, "global_step": 144686, "epoch": 861} {"train_loss": -10.485847473144531, "global_step": 144687, "epoch": 861} {"train_loss": -10.837610244750977, "global_step": 144688, "epoch": 861} {"train_loss": -10.465927124023438, "global_step": 144689, "epoch": 861} {"train_loss": -10.66099739074707, "global_step": 144690, "epoch": 861} {"train_loss": -10.791833877563477, "global_step": 144691, "epoch": 861} {"train_loss": -10.543041229248047, "global_step": 144692, "epoch": 861} {"train_loss": -10.799025535583496, "global_step": 144693, "epoch": 861} {"train_loss": -10.68382453918457, "global_step": 144694, "epoch": 861} {"train_loss": -10.596263885498047, "global_step": 144695, "epoch": 861} {"train_loss": -10.498992919921875, "global_step": 144696, "epoch": 861} {"train_loss": -10.881845474243164, "global_step": 144697, "epoch": 861} {"train_loss": -10.33473014831543, "global_step": 144698, "epoch": 861} {"train_loss": -10.69565200805664, "global_step": 144699, "epoch": 861} {"train_loss": -10.639659881591797, "global_step": 144700, "epoch": 861} {"train_loss": -10.15157699584961, "global_step": 144701, "epoch": 861} {"train_loss": -10.225919723510742, "global_step": 144702, "epoch": 861} {"train_loss": -10.852099418640137, "global_step": 144703, "epoch": 861} {"train_loss": -10.281264305114746, "global_step": 144704, "epoch": 861} {"train_loss": -10.811723709106445, "global_step": 144705, "epoch": 861} {"train_loss": -10.450279235839844, "global_step": 144706, "epoch": 861} {"train_loss": -10.699605941772461, "global_step": 144707, "epoch": 861} {"train_loss": -10.252904891967773, "global_step": 144708, "epoch": 861} {"train_loss": -10.766109466552734, "global_step": 144709, "epoch": 861} {"train_loss": -10.350855827331543, "global_step": 144710, "epoch": 861} {"train_loss": -10.843338966369629, "global_step": 144711, "epoch": 861} {"train_loss": -10.473695755004883, "global_step": 144712, "epoch": 861} {"train_loss": -10.364336967468262, "global_step": 144713, "epoch": 861} {"train_loss": -10.652546882629395, "global_step": 144714, "epoch": 861} {"train_loss": -9.986781120300293, "global_step": 144715, "epoch": 861} {"train_loss": -10.609451293945312, "global_step": 144716, "epoch": 861} {"train_loss": -10.014381408691406, "global_step": 144717, "epoch": 861} {"train_loss": -10.346260070800781, "global_step": 144718, "epoch": 861} {"train_loss": -10.463733673095703, "global_step": 144719, "epoch": 861} {"train_loss": -10.209606170654297, "global_step": 144720, "epoch": 861} {"train_loss": -10.387109756469727, "global_step": 144721, "epoch": 861} {"train_loss": -10.315152168273926, "global_step": 144722, "epoch": 861} {"train_loss": -10.697131156921387, "global_step": 144723, "epoch": 861} {"train_loss": -10.561746597290039, "global_step": 144724, "epoch": 861} {"train_loss": -10.296422958374023, "global_step": 144725, "epoch": 861} {"train_loss": -10.62618637084961, "global_step": 144726, "epoch": 861} {"train_loss": -10.702001571655273, "global_step": 144727, "epoch": 861} {"train_loss": -10.404038429260254, "global_step": 144728, "epoch": 861} {"train_loss": -10.800683975219727, "global_step": 144729, "epoch": 861} {"train_loss": -10.45814323425293, "global_step": 144730, "epoch": 861} {"train_loss": -10.647994995117188, "global_step": 144731, "epoch": 861} {"train_loss": -10.519892692565918, "global_step": 144732, "epoch": 861} {"train_loss": -10.116861343383789, "global_step": 144733, "epoch": 861} {"train_loss": -10.681427001953125, "global_step": 144734, "epoch": 861} {"train_loss": -10.381245613098145, "global_step": 144735, "epoch": 861} {"train_loss": -10.50051212310791, "global_step": 144736, "epoch": 861} {"train_loss": -10.650222778320312, "global_step": 144737, "epoch": 861} {"train_loss": -10.417203903198242, "global_step": 144738, "epoch": 861} {"train_loss": -10.294116973876953, "global_step": 144739, "epoch": 861} {"train_loss": -10.597664833068848, "global_step": 144740, "epoch": 861} {"train_loss": -10.51489543914795, "global_step": 144741, "epoch": 861} {"train_loss": -10.585017204284668, "global_step": 144742, "epoch": 861} {"train_loss": -10.62515640258789, "global_step": 144743, "epoch": 861} {"train_loss": -10.219213485717773, "global_step": 144744, "epoch": 861} {"train_loss": -10.675042152404785, "global_step": 144745, "epoch": 861} {"train_loss": -10.330320358276367, "global_step": 144746, "epoch": 861} {"train_loss": -10.10823917388916, "global_step": 144747, "epoch": 861} {"train_loss": -9.795419692993164, "global_step": 144748, "epoch": 861} {"train_loss": -10.10696792602539, "global_step": 144749, "epoch": 861} {"train_loss": -10.276230812072754, "global_step": 144750, "epoch": 861} {"train_loss": -10.024070739746094, "global_step": 144751, "epoch": 861} {"train_loss": -10.410602569580078, "global_step": 144752, "epoch": 861} {"train_loss": -10.45075798034668, "global_step": 144753, "epoch": 861} {"train_loss": -10.325004577636719, "global_step": 144754, "epoch": 861} {"train_loss": -10.202277183532715, "global_step": 144755, "epoch": 861} {"train_loss": -10.63231086730957, "global_step": 144756, "epoch": 861} {"train_loss": -10.909685134887695, "global_step": 144757, "epoch": 861} {"train_loss": -10.349822044372559, "global_step": 144758, "epoch": 861} {"train_loss": -10.798046112060547, "global_step": 144759, "epoch": 861} {"train_loss": -10.328737258911133, "global_step": 144760, "epoch": 861} {"train_loss": -10.43829345703125, "global_step": 144761, "epoch": 861} {"train_loss": -10.672933578491211, "global_step": 144762, "epoch": 861} {"train_loss": -10.699272155761719, "global_step": 144763, "epoch": 861} {"train_loss": -10.537790298461914, "global_step": 144764, "epoch": 861} {"train_loss": -10.23556137084961, "global_step": 144765, "epoch": 861} {"train_loss": -10.729394912719727, "global_step": 144766, "epoch": 861} {"train_loss": -10.533788681030273, "global_step": 144767, "epoch": 861} {"train_loss": -10.807920455932617, "global_step": 144768, "epoch": 861} {"train_loss": -10.835819244384766, "global_step": 144769, "epoch": 861} {"train_loss": -10.712455749511719, "global_step": 144770, "epoch": 861} {"train_loss": -10.887327194213867, "global_step": 144771, "epoch": 861} {"train_loss": -10.625244140625, "global_step": 144772, "epoch": 861} {"train_loss": -10.870830535888672, "global_step": 144773, "epoch": 861} {"train_loss": -10.664603233337402, "global_step": 144774, "epoch": 861} {"train_loss": -10.917848587036133, "global_step": 144775, "epoch": 861} {"train_loss": -10.704952239990234, "global_step": 144776, "epoch": 861} {"train_loss": -11.001288414001465, "global_step": 144777, "epoch": 861} {"train_loss": -10.997742652893066, "global_step": 144778, "epoch": 861} {"train_loss": -10.882893562316895, "global_step": 144779, "epoch": 861} {"train_loss": -10.778505325317383, "global_step": 144780, "epoch": 861} {"train_loss": -10.97813892364502, "global_step": 144781, "epoch": 861} {"train_loss": -10.953584671020508, "global_step": 144782, "epoch": 861} {"train_loss": -11.136253356933594, "global_step": 144783, "epoch": 861} {"train_loss": -10.81760025024414, "global_step": 144784, "epoch": 861} {"train_loss": -11.082290649414062, "global_step": 144785, "epoch": 861} {"train_loss": -10.839615821838379, "global_step": 144786, "epoch": 861} {"train_loss": -10.848075866699219, "global_step": 144787, "epoch": 861} {"train_loss": -10.891474723815918, "global_step": 144788, "epoch": 861} {"train_loss": -11.014263153076172, "global_step": 144789, "epoch": 861} {"train_loss": -10.7462739944458, "global_step": 144790, "epoch": 861} {"train_loss": -10.930059432983398, "global_step": 144791, "epoch": 861} {"train_loss": -10.884251594543457, "global_step": 144792, "epoch": 861} {"train_loss": -10.88754653930664, "global_step": 144793, "epoch": 861} {"train_loss": -10.892091751098633, "global_step": 144794, "epoch": 861} {"train_loss": -10.598864555358887, "global_step": 144795, "epoch": 861} {"train_loss": -10.840654373168945, "global_step": 144796, "epoch": 861} {"train_loss": -10.934951782226562, "global_step": 144797, "epoch": 861} {"train_loss": -10.836098670959473, "global_step": 144798, "epoch": 861} {"train_loss": -10.62905502319336, "global_step": 144799, "epoch": 861} {"train_loss": -10.893396377563477, "global_step": 144800, "epoch": 861} {"train_loss": -11.06422233581543, "global_step": 144801, "epoch": 861} {"train_loss": -10.436159133911133, "global_step": 144802, "epoch": 861} {"train_loss": -10.51703929901123, "global_step": 144803, "epoch": 861} {"train_loss": -10.105645179748535, "global_step": 144804, "epoch": 861} {"train_loss": -10.8734130859375, "global_step": 144805, "epoch": 861} {"train_loss": -10.643610954284668, "global_step": 144806, "epoch": 861} {"train_loss": -10.486461639404297, "global_step": 144807, "epoch": 861} {"train_loss": -10.048864364624023, "global_step": 144808, "epoch": 861} {"train_loss": -10.868670463562012, "global_step": 144809, "epoch": 861} {"train_loss": -10.323660850524902, "global_step": 144810, "epoch": 861} {"train_loss": -10.372684478759766, "global_step": 144811, "epoch": 861} {"train_loss": -10.789144515991211, "global_step": 144812, "epoch": 861} {"train_loss": -10.056636810302734, "global_step": 144813, "epoch": 861} {"train_loss": -10.453125953674316, "global_step": 144814, "epoch": 861} {"train_loss": -10.647093892097473, "global_step": 144815, "epoch": 861, "val_loss": 228444.5} {"train_loss": -10.391036987304688, "global_step": 144816, "epoch": 862} {"train_loss": -10.661012649536133, "global_step": 144817, "epoch": 862} {"train_loss": -10.447319030761719, "global_step": 144818, "epoch": 862} {"train_loss": -10.684160232543945, "global_step": 144819, "epoch": 862} {"train_loss": -10.759537696838379, "global_step": 144820, "epoch": 862} {"train_loss": -10.530385971069336, "global_step": 144821, "epoch": 862} {"train_loss": -10.455682754516602, "global_step": 144822, "epoch": 862} {"train_loss": -10.194942474365234, "global_step": 144823, "epoch": 862} {"train_loss": -10.840940475463867, "global_step": 144824, "epoch": 862} {"train_loss": -10.189413070678711, "global_step": 144825, "epoch": 862} {"train_loss": -10.629201889038086, "global_step": 144826, "epoch": 862} {"train_loss": -10.70697021484375, "global_step": 144827, "epoch": 862} {"train_loss": -10.649998664855957, "global_step": 144828, "epoch": 862} {"train_loss": -10.611268997192383, "global_step": 144829, "epoch": 862} {"train_loss": -10.474750518798828, "global_step": 144830, "epoch": 862} {"train_loss": -10.527214050292969, "global_step": 144831, "epoch": 862} {"train_loss": -10.738941192626953, "global_step": 144832, "epoch": 862} {"train_loss": -10.500804901123047, "global_step": 144833, "epoch": 862} {"train_loss": -10.563945770263672, "global_step": 144834, "epoch": 862} {"train_loss": -10.519519805908203, "global_step": 144835, "epoch": 862} {"train_loss": -10.635095596313477, "global_step": 144836, "epoch": 862} {"train_loss": -10.290314674377441, "global_step": 144837, "epoch": 862} {"train_loss": -10.620489120483398, "global_step": 144838, "epoch": 862} {"train_loss": -10.67538070678711, "global_step": 144839, "epoch": 862} {"train_loss": -10.357940673828125, "global_step": 144840, "epoch": 862} {"train_loss": -10.690239906311035, "global_step": 144841, "epoch": 862} {"train_loss": -10.553596496582031, "global_step": 144842, "epoch": 862} {"train_loss": -10.477218627929688, "global_step": 144843, "epoch": 862} {"train_loss": -10.790607452392578, "global_step": 144844, "epoch": 862} {"train_loss": -10.635305404663086, "global_step": 144845, "epoch": 862} {"train_loss": -10.728536605834961, "global_step": 144846, "epoch": 862} {"train_loss": -10.305623054504395, "global_step": 144847, "epoch": 862} {"train_loss": -10.708385467529297, "global_step": 144848, "epoch": 862} {"train_loss": -10.824811935424805, "global_step": 144849, "epoch": 862} {"train_loss": -10.631330490112305, "global_step": 144850, "epoch": 862} {"train_loss": -11.016390800476074, "global_step": 144851, "epoch": 862} {"train_loss": -10.664095878601074, "global_step": 144852, "epoch": 862} {"train_loss": -10.743671417236328, "global_step": 144853, "epoch": 862} {"train_loss": -10.252405166625977, "global_step": 144854, "epoch": 862} {"train_loss": -10.886103630065918, "global_step": 144855, "epoch": 862} {"train_loss": -10.396984100341797, "global_step": 144856, "epoch": 862} {"train_loss": -10.357914924621582, "global_step": 144857, "epoch": 862} {"train_loss": -10.662288665771484, "global_step": 144858, "epoch": 862} {"train_loss": -10.466038703918457, "global_step": 144859, "epoch": 862} {"train_loss": -10.913055419921875, "global_step": 144860, "epoch": 862} {"train_loss": -10.652849197387695, "global_step": 144861, "epoch": 862} {"train_loss": -10.724740982055664, "global_step": 144862, "epoch": 862} {"train_loss": -10.350285530090332, "global_step": 144863, "epoch": 862} {"train_loss": -10.822271347045898, "global_step": 144864, "epoch": 862} {"train_loss": -10.666242599487305, "global_step": 144865, "epoch": 862} {"train_loss": -10.537765502929688, "global_step": 144866, "epoch": 862} {"train_loss": -10.394195556640625, "global_step": 144867, "epoch": 862} {"train_loss": -10.573477745056152, "global_step": 144868, "epoch": 862} {"train_loss": -10.84268569946289, "global_step": 144869, "epoch": 862} {"train_loss": -10.393133163452148, "global_step": 144870, "epoch": 862} {"train_loss": -10.690861701965332, "global_step": 144871, "epoch": 862} {"train_loss": -10.878479957580566, "global_step": 144872, "epoch": 862} {"train_loss": -10.826187133789062, "global_step": 144873, "epoch": 862} {"train_loss": -10.92081356048584, "global_step": 144874, "epoch": 862} {"train_loss": -10.343720436096191, "global_step": 144875, "epoch": 862} {"train_loss": -10.809343338012695, "global_step": 144876, "epoch": 862} {"train_loss": -10.739704132080078, "global_step": 144877, "epoch": 862} {"train_loss": -10.798698425292969, "global_step": 144878, "epoch": 862} {"train_loss": -10.802408218383789, "global_step": 144879, "epoch": 862} {"train_loss": -10.746512413024902, "global_step": 144880, "epoch": 862} {"train_loss": -10.616352081298828, "global_step": 144881, "epoch": 862} {"train_loss": -11.001198768615723, "global_step": 144882, "epoch": 862} {"train_loss": -10.820944786071777, "global_step": 144883, "epoch": 862} {"train_loss": -10.703866958618164, "global_step": 144884, "epoch": 862} {"train_loss": -10.755666732788086, "global_step": 144885, "epoch": 862} {"train_loss": -10.328412055969238, "global_step": 144886, "epoch": 862} {"train_loss": -10.666457176208496, "global_step": 144887, "epoch": 862} {"train_loss": -10.668664932250977, "global_step": 144888, "epoch": 862} {"train_loss": -9.929793357849121, "global_step": 144889, "epoch": 862} {"train_loss": -10.65235710144043, "global_step": 144890, "epoch": 862} {"train_loss": -10.538232803344727, "global_step": 144891, "epoch": 862} {"train_loss": -10.589363098144531, "global_step": 144892, "epoch": 862} {"train_loss": -10.825150489807129, "global_step": 144893, "epoch": 862} {"train_loss": -10.592355728149414, "global_step": 144894, "epoch": 862} {"train_loss": -10.653554916381836, "global_step": 144895, "epoch": 862} {"train_loss": -10.620695114135742, "global_step": 144896, "epoch": 862} {"train_loss": -10.645386695861816, "global_step": 144897, "epoch": 862} {"train_loss": -10.400857925415039, "global_step": 144898, "epoch": 862} {"train_loss": -10.59223461151123, "global_step": 144899, "epoch": 862} {"train_loss": -10.649126052856445, "global_step": 144900, "epoch": 862} {"train_loss": -10.877111434936523, "global_step": 144901, "epoch": 862} {"train_loss": -10.552047729492188, "global_step": 144902, "epoch": 862} {"train_loss": -10.526914596557617, "global_step": 144903, "epoch": 862} {"train_loss": -10.418354034423828, "global_step": 144904, "epoch": 862} {"train_loss": -10.612290382385254, "global_step": 144905, "epoch": 862} {"train_loss": -10.755453109741211, "global_step": 144906, "epoch": 862} {"train_loss": -10.734176635742188, "global_step": 144907, "epoch": 862} {"train_loss": -10.65962028503418, "global_step": 144908, "epoch": 862} {"train_loss": -10.250951766967773, "global_step": 144909, "epoch": 862} {"train_loss": -10.486865997314453, "global_step": 144910, "epoch": 862} {"train_loss": -10.521820068359375, "global_step": 144911, "epoch": 862} {"train_loss": -10.372213363647461, "global_step": 144912, "epoch": 862} {"train_loss": -10.92906665802002, "global_step": 144913, "epoch": 862} {"train_loss": -10.449174880981445, "global_step": 144914, "epoch": 862} {"train_loss": -10.436431884765625, "global_step": 144915, "epoch": 862} {"train_loss": -10.82088851928711, "global_step": 144916, "epoch": 862} {"train_loss": -10.59895133972168, "global_step": 144917, "epoch": 862} {"train_loss": -10.52865219116211, "global_step": 144918, "epoch": 862} {"train_loss": -10.46082592010498, "global_step": 144919, "epoch": 862} {"train_loss": -10.684114456176758, "global_step": 144920, "epoch": 862} {"train_loss": -10.280344009399414, "global_step": 144921, "epoch": 862} {"train_loss": -10.569000244140625, "global_step": 144922, "epoch": 862} {"train_loss": -10.261999130249023, "global_step": 144923, "epoch": 862} {"train_loss": -10.32145881652832, "global_step": 144924, "epoch": 862} {"train_loss": -10.237460136413574, "global_step": 144925, "epoch": 862} {"train_loss": -10.379263877868652, "global_step": 144926, "epoch": 862} {"train_loss": -10.535669326782227, "global_step": 144927, "epoch": 862} {"train_loss": -10.499641418457031, "global_step": 144928, "epoch": 862} {"train_loss": -10.524473190307617, "global_step": 144929, "epoch": 862} {"train_loss": -10.636220932006836, "global_step": 144930, "epoch": 862} {"train_loss": -10.532408714294434, "global_step": 144931, "epoch": 862} {"train_loss": -10.427882194519043, "global_step": 144932, "epoch": 862} {"train_loss": -10.517818450927734, "global_step": 144933, "epoch": 862} {"train_loss": -10.279888153076172, "global_step": 144934, "epoch": 862} {"train_loss": -10.774861335754395, "global_step": 144935, "epoch": 862} {"train_loss": -10.27568244934082, "global_step": 144936, "epoch": 862} {"train_loss": -10.576967239379883, "global_step": 144937, "epoch": 862} {"train_loss": -10.374958992004395, "global_step": 144938, "epoch": 862} {"train_loss": -10.875279426574707, "global_step": 144939, "epoch": 862} {"train_loss": -10.311691284179688, "global_step": 144940, "epoch": 862} {"train_loss": -10.637002944946289, "global_step": 144941, "epoch": 862} {"train_loss": -10.399065017700195, "global_step": 144942, "epoch": 862} {"train_loss": -10.73234748840332, "global_step": 144943, "epoch": 862} {"train_loss": -10.140825271606445, "global_step": 144944, "epoch": 862} {"train_loss": -10.263142585754395, "global_step": 144945, "epoch": 862} {"train_loss": -10.332630157470703, "global_step": 144946, "epoch": 862} {"train_loss": -10.628026008605957, "global_step": 144947, "epoch": 862} {"train_loss": -10.722487449645996, "global_step": 144948, "epoch": 862} {"train_loss": -10.445259094238281, "global_step": 144949, "epoch": 862} {"train_loss": -10.459515571594238, "global_step": 144950, "epoch": 862} {"train_loss": -10.554162979125977, "global_step": 144951, "epoch": 862} {"train_loss": -10.532503128051758, "global_step": 144952, "epoch": 862} {"train_loss": -10.712786674499512, "global_step": 144953, "epoch": 862} {"train_loss": -10.79847526550293, "global_step": 144954, "epoch": 862} {"train_loss": -10.59850788116455, "global_step": 144955, "epoch": 862} {"train_loss": -10.652742385864258, "global_step": 144956, "epoch": 862} {"train_loss": -10.925142288208008, "global_step": 144957, "epoch": 862} {"train_loss": -10.844541549682617, "global_step": 144958, "epoch": 862} {"train_loss": -10.773598670959473, "global_step": 144959, "epoch": 862} {"train_loss": -10.545978546142578, "global_step": 144960, "epoch": 862} {"train_loss": -10.747146606445312, "global_step": 144961, "epoch": 862} {"train_loss": -10.782448768615723, "global_step": 144962, "epoch": 862} {"train_loss": -10.708189010620117, "global_step": 144963, "epoch": 862} {"train_loss": -10.777939796447754, "global_step": 144964, "epoch": 862} {"train_loss": -10.44041633605957, "global_step": 144965, "epoch": 862} {"train_loss": -10.501367568969727, "global_step": 144966, "epoch": 862} {"train_loss": -10.715841293334961, "global_step": 144967, "epoch": 862} {"train_loss": -10.390436172485352, "global_step": 144968, "epoch": 862} {"train_loss": -10.531286239624023, "global_step": 144969, "epoch": 862} {"train_loss": -10.190315246582031, "global_step": 144970, "epoch": 862} {"train_loss": -10.661867141723633, "global_step": 144971, "epoch": 862} {"train_loss": -10.040534973144531, "global_step": 144972, "epoch": 862} {"train_loss": -10.602957725524902, "global_step": 144973, "epoch": 862} {"train_loss": -10.109421730041504, "global_step": 144974, "epoch": 862} {"train_loss": -10.53874397277832, "global_step": 144975, "epoch": 862} {"train_loss": -10.439315795898438, "global_step": 144976, "epoch": 862} {"train_loss": -10.50908374786377, "global_step": 144977, "epoch": 862} {"train_loss": -10.687649726867676, "global_step": 144978, "epoch": 862} {"train_loss": -10.667327880859375, "global_step": 144979, "epoch": 862} {"train_loss": -10.871498107910156, "global_step": 144980, "epoch": 862} {"train_loss": -10.599405288696289, "global_step": 144981, "epoch": 862} {"train_loss": -10.796881675720215, "global_step": 144982, "epoch": 862} {"train_loss": -10.580358828817095, "global_step": 144983, "epoch": 862, "val_loss": 229713.59375} {"train_loss": -10.623780250549316, "global_step": 144984, "epoch": 863} {"train_loss": -10.528542518615723, "global_step": 144985, "epoch": 863} {"train_loss": -10.573902130126953, "global_step": 144986, "epoch": 863} {"train_loss": -10.277316093444824, "global_step": 144987, "epoch": 863} {"train_loss": -10.88311767578125, "global_step": 144988, "epoch": 863} {"train_loss": -10.723122596740723, "global_step": 144989, "epoch": 863} {"train_loss": -10.655179977416992, "global_step": 144990, "epoch": 863} {"train_loss": -10.774256706237793, "global_step": 144991, "epoch": 863} {"train_loss": -10.659398078918457, "global_step": 144992, "epoch": 863} {"train_loss": -10.719779968261719, "global_step": 144993, "epoch": 863} {"train_loss": -10.744462966918945, "global_step": 144994, "epoch": 863} {"train_loss": -10.778665542602539, "global_step": 144995, "epoch": 863} {"train_loss": -11.069347381591797, "global_step": 144996, "epoch": 863} {"train_loss": -10.728020668029785, "global_step": 144997, "epoch": 863} {"train_loss": -10.73231029510498, "global_step": 144998, "epoch": 863} {"train_loss": -10.537853240966797, "global_step": 144999, "epoch": 863} {"train_loss": -9.944940567016602, "global_step": 145000, "epoch": 863} {"train_loss": -10.849888801574707, "global_step": 145001, "epoch": 863} {"train_loss": -10.097074508666992, "global_step": 145002, "epoch": 863} {"train_loss": -10.226329803466797, "global_step": 145003, "epoch": 863} {"train_loss": -10.698034286499023, "global_step": 145004, "epoch": 863} {"train_loss": -10.544574737548828, "global_step": 145005, "epoch": 863} {"train_loss": -10.64439582824707, "global_step": 145006, "epoch": 863} {"train_loss": -10.324568748474121, "global_step": 145007, "epoch": 863} {"train_loss": -10.749591827392578, "global_step": 145008, "epoch": 863} {"train_loss": -10.74794864654541, "global_step": 145009, "epoch": 863} {"train_loss": -10.280170440673828, "global_step": 145010, "epoch": 863} {"train_loss": -10.853769302368164, "global_step": 145011, "epoch": 863} {"train_loss": -10.299419403076172, "global_step": 145012, "epoch": 863} {"train_loss": -10.499004364013672, "global_step": 145013, "epoch": 863} {"train_loss": -10.02302360534668, "global_step": 145014, "epoch": 863} {"train_loss": -10.567872047424316, "global_step": 145015, "epoch": 863} {"train_loss": -10.375614166259766, "global_step": 145016, "epoch": 863} {"train_loss": -10.388477325439453, "global_step": 145017, "epoch": 863} {"train_loss": -10.461749076843262, "global_step": 145018, "epoch": 863} {"train_loss": -10.640118598937988, "global_step": 145019, "epoch": 863} {"train_loss": -10.264167785644531, "global_step": 145020, "epoch": 863} {"train_loss": -10.80406379699707, "global_step": 145021, "epoch": 863} {"train_loss": -10.270052909851074, "global_step": 145022, "epoch": 863} {"train_loss": -10.968595504760742, "global_step": 145023, "epoch": 863} {"train_loss": -10.634502410888672, "global_step": 145024, "epoch": 863} {"train_loss": -10.559171676635742, "global_step": 145025, "epoch": 863} {"train_loss": -10.661896705627441, "global_step": 145026, "epoch": 863} {"train_loss": -10.068314552307129, "global_step": 145027, "epoch": 863} {"train_loss": -10.476411819458008, "global_step": 145028, "epoch": 863} {"train_loss": -10.12545108795166, "global_step": 145029, "epoch": 863} {"train_loss": -10.38121509552002, "global_step": 145030, "epoch": 863} {"train_loss": -10.729545593261719, "global_step": 145031, "epoch": 863} {"train_loss": -10.68266487121582, "global_step": 145032, "epoch": 863} {"train_loss": -10.48453140258789, "global_step": 145033, "epoch": 863} {"train_loss": -10.525971412658691, "global_step": 145034, "epoch": 863} {"train_loss": -10.505645751953125, "global_step": 145035, "epoch": 863} {"train_loss": -10.343677520751953, "global_step": 145036, "epoch": 863} {"train_loss": -10.398857116699219, "global_step": 145037, "epoch": 863} {"train_loss": -10.581228256225586, "global_step": 145038, "epoch": 863} {"train_loss": -10.26593017578125, "global_step": 145039, "epoch": 863} {"train_loss": -10.537907600402832, "global_step": 145040, "epoch": 863} {"train_loss": -10.407302856445312, "global_step": 145041, "epoch": 863} {"train_loss": -10.353397369384766, "global_step": 145042, "epoch": 863} {"train_loss": -10.385924339294434, "global_step": 145043, "epoch": 863} {"train_loss": -10.879138946533203, "global_step": 145044, "epoch": 863} {"train_loss": -10.101106643676758, "global_step": 145045, "epoch": 863} {"train_loss": -10.649497032165527, "global_step": 145046, "epoch": 863} {"train_loss": -10.231369972229004, "global_step": 145047, "epoch": 863} {"train_loss": -10.479368209838867, "global_step": 145048, "epoch": 863} {"train_loss": -10.385574340820312, "global_step": 145049, "epoch": 863} {"train_loss": -10.330254554748535, "global_step": 145050, "epoch": 863} {"train_loss": -10.420181274414062, "global_step": 145051, "epoch": 863} {"train_loss": -10.322607040405273, "global_step": 145052, "epoch": 863} {"train_loss": -10.483484268188477, "global_step": 145053, "epoch": 863} {"train_loss": -10.215890884399414, "global_step": 145054, "epoch": 863} {"train_loss": -10.41832160949707, "global_step": 145055, "epoch": 863} {"train_loss": -10.608872413635254, "global_step": 145056, "epoch": 863} {"train_loss": -10.459695816040039, "global_step": 145057, "epoch": 863} {"train_loss": -10.221187591552734, "global_step": 145058, "epoch": 863} {"train_loss": -10.698587417602539, "global_step": 145059, "epoch": 863} {"train_loss": -10.48178768157959, "global_step": 145060, "epoch": 863} {"train_loss": -10.679953575134277, "global_step": 145061, "epoch": 863} {"train_loss": -10.543390274047852, "global_step": 145062, "epoch": 863} {"train_loss": -10.505131721496582, "global_step": 145063, "epoch": 863} {"train_loss": -10.548440933227539, "global_step": 145064, "epoch": 863} {"train_loss": -10.56527328491211, "global_step": 145065, "epoch": 863} {"train_loss": -10.833873748779297, "global_step": 145066, "epoch": 863} {"train_loss": -10.855914115905762, "global_step": 145067, "epoch": 863} {"train_loss": -10.827737808227539, "global_step": 145068, "epoch": 863} {"train_loss": -10.919775009155273, "global_step": 145069, "epoch": 863} {"train_loss": -10.932988166809082, "global_step": 145070, "epoch": 863} {"train_loss": -10.53971004486084, "global_step": 145071, "epoch": 863} {"train_loss": -10.551424980163574, "global_step": 145072, "epoch": 863} {"train_loss": -10.921334266662598, "global_step": 145073, "epoch": 863} {"train_loss": -10.63233757019043, "global_step": 145074, "epoch": 863} {"train_loss": -10.656180381774902, "global_step": 145075, "epoch": 863} {"train_loss": -10.850198745727539, "global_step": 145076, "epoch": 863} {"train_loss": -10.658387184143066, "global_step": 145077, "epoch": 863} {"train_loss": -10.74304485321045, "global_step": 145078, "epoch": 863} {"train_loss": -10.909594535827637, "global_step": 145079, "epoch": 863} {"train_loss": -10.843306541442871, "global_step": 145080, "epoch": 863} {"train_loss": -10.935657501220703, "global_step": 145081, "epoch": 863} {"train_loss": -10.645748138427734, "global_step": 145082, "epoch": 863} {"train_loss": -10.861621856689453, "global_step": 145083, "epoch": 863} {"train_loss": -10.829245567321777, "global_step": 145084, "epoch": 863} {"train_loss": -10.876151084899902, "global_step": 145085, "epoch": 863} {"train_loss": -10.841245651245117, "global_step": 145086, "epoch": 863} {"train_loss": -10.990792274475098, "global_step": 145087, "epoch": 863} {"train_loss": -10.676918029785156, "global_step": 145088, "epoch": 863} {"train_loss": -10.802087783813477, "global_step": 145089, "epoch": 863} {"train_loss": -10.462762832641602, "global_step": 145090, "epoch": 863} {"train_loss": -10.866214752197266, "global_step": 145091, "epoch": 863} {"train_loss": -10.358612060546875, "global_step": 145092, "epoch": 863} {"train_loss": -10.709966659545898, "global_step": 145093, "epoch": 863} {"train_loss": -10.756023406982422, "global_step": 145094, "epoch": 863} {"train_loss": -10.647454261779785, "global_step": 145095, "epoch": 863} {"train_loss": -10.805130004882812, "global_step": 145096, "epoch": 863} {"train_loss": -10.966413497924805, "global_step": 145097, "epoch": 863} {"train_loss": -10.778533935546875, "global_step": 145098, "epoch": 863} {"train_loss": -10.675359725952148, "global_step": 145099, "epoch": 863} {"train_loss": -11.15749454498291, "global_step": 145100, "epoch": 863} {"train_loss": -10.529500961303711, "global_step": 145101, "epoch": 863} {"train_loss": -10.907234191894531, "global_step": 145102, "epoch": 863} {"train_loss": -10.735580444335938, "global_step": 145103, "epoch": 863} {"train_loss": -10.986323356628418, "global_step": 145104, "epoch": 863} {"train_loss": -10.735333442687988, "global_step": 145105, "epoch": 863} {"train_loss": -10.325878143310547, "global_step": 145106, "epoch": 863} {"train_loss": -10.794178009033203, "global_step": 145107, "epoch": 863} {"train_loss": -10.628981590270996, "global_step": 145108, "epoch": 863} {"train_loss": -9.683509826660156, "global_step": 145109, "epoch": 863} {"train_loss": -10.953177452087402, "global_step": 145110, "epoch": 863} {"train_loss": -10.380189895629883, "global_step": 145111, "epoch": 863} {"train_loss": -10.3666353225708, "global_step": 145112, "epoch": 863} {"train_loss": -10.462363243103027, "global_step": 145113, "epoch": 863} {"train_loss": -9.930756568908691, "global_step": 145114, "epoch": 863} {"train_loss": -9.950052261352539, "global_step": 145115, "epoch": 863} {"train_loss": -10.105376243591309, "global_step": 145116, "epoch": 863} {"train_loss": -10.459149360656738, "global_step": 145117, "epoch": 863} {"train_loss": -10.294170379638672, "global_step": 145118, "epoch": 863} {"train_loss": -10.239508628845215, "global_step": 145119, "epoch": 863} {"train_loss": -10.387205123901367, "global_step": 145120, "epoch": 863} {"train_loss": -10.445451736450195, "global_step": 145121, "epoch": 863} {"train_loss": -10.345113754272461, "global_step": 145122, "epoch": 863} {"train_loss": -10.395498275756836, "global_step": 145123, "epoch": 863} {"train_loss": -10.568721771240234, "global_step": 145124, "epoch": 863} {"train_loss": -10.491850852966309, "global_step": 145125, "epoch": 863} {"train_loss": -10.655967712402344, "global_step": 145126, "epoch": 863} {"train_loss": -10.271615028381348, "global_step": 145127, "epoch": 863} {"train_loss": -10.249231338500977, "global_step": 145128, "epoch": 863} {"train_loss": -10.514678001403809, "global_step": 145129, "epoch": 863} {"train_loss": -10.506633758544922, "global_step": 145130, "epoch": 863} {"train_loss": -10.476673126220703, "global_step": 145131, "epoch": 863} {"train_loss": -10.394720077514648, "global_step": 145132, "epoch": 863} {"train_loss": -10.485797882080078, "global_step": 145133, "epoch": 863} {"train_loss": -10.570387840270996, "global_step": 145134, "epoch": 863} {"train_loss": -10.608551025390625, "global_step": 145135, "epoch": 863} {"train_loss": -10.665499687194824, "global_step": 145136, "epoch": 863} {"train_loss": -10.691926956176758, "global_step": 145137, "epoch": 863} {"train_loss": -10.66267204284668, "global_step": 145138, "epoch": 863} {"train_loss": -10.600566864013672, "global_step": 145139, "epoch": 863} {"train_loss": -10.340065956115723, "global_step": 145140, "epoch": 863} {"train_loss": -10.576803207397461, "global_step": 145141, "epoch": 863} {"train_loss": -10.271085739135742, "global_step": 145142, "epoch": 863} {"train_loss": -10.855995178222656, "global_step": 145143, "epoch": 863} {"train_loss": -10.728723526000977, "global_step": 145144, "epoch": 863} {"train_loss": -10.521966934204102, "global_step": 145145, "epoch": 863} {"train_loss": -10.689441680908203, "global_step": 145146, "epoch": 863} {"train_loss": -10.628870010375977, "global_step": 145147, "epoch": 863} {"train_loss": -10.830953598022461, "global_step": 145148, "epoch": 863} {"train_loss": -10.70360279083252, "global_step": 145149, "epoch": 863} {"train_loss": -10.559173583984375, "global_step": 145150, "epoch": 863} {"train_loss": -10.567535343624296, "global_step": 145151, "epoch": 863, "val_loss": 226523.40625} {"train_loss": -10.716178894042969, "global_step": 145152, "epoch": 864} {"train_loss": -10.849909782409668, "global_step": 145153, "epoch": 864} {"train_loss": -10.726208686828613, "global_step": 145154, "epoch": 864} {"train_loss": -10.579931259155273, "global_step": 145155, "epoch": 864} {"train_loss": -10.887614250183105, "global_step": 145156, "epoch": 864} {"train_loss": -10.411323547363281, "global_step": 145157, "epoch": 864} {"train_loss": -10.700929641723633, "global_step": 145158, "epoch": 864} {"train_loss": -11.04324722290039, "global_step": 145159, "epoch": 864} {"train_loss": -10.44636344909668, "global_step": 145160, "epoch": 864} {"train_loss": -10.963266372680664, "global_step": 145161, "epoch": 864} {"train_loss": -10.7720308303833, "global_step": 145162, "epoch": 864} {"train_loss": -10.891485214233398, "global_step": 145163, "epoch": 864} {"train_loss": -10.80253791809082, "global_step": 145164, "epoch": 864} {"train_loss": -10.928444862365723, "global_step": 145165, "epoch": 864} {"train_loss": -11.08017349243164, "global_step": 145166, "epoch": 864} {"train_loss": -10.66281509399414, "global_step": 145167, "epoch": 864} {"train_loss": -10.976927757263184, "global_step": 145168, "epoch": 864} {"train_loss": -10.877462387084961, "global_step": 145169, "epoch": 864} {"train_loss": -10.945903778076172, "global_step": 145170, "epoch": 864} {"train_loss": -10.469277381896973, "global_step": 145171, "epoch": 864} {"train_loss": -10.77145004272461, "global_step": 145172, "epoch": 864} {"train_loss": -10.517722129821777, "global_step": 145173, "epoch": 864} {"train_loss": -10.358163833618164, "global_step": 145174, "epoch": 864} {"train_loss": -9.94229507446289, "global_step": 145175, "epoch": 864} {"train_loss": -10.960882186889648, "global_step": 145176, "epoch": 864} {"train_loss": -10.073846817016602, "global_step": 145177, "epoch": 864} {"train_loss": -10.620302200317383, "global_step": 145178, "epoch": 864} {"train_loss": -10.529808044433594, "global_step": 145179, "epoch": 864} {"train_loss": -9.85317611694336, "global_step": 145180, "epoch": 864} {"train_loss": -10.880805015563965, "global_step": 145181, "epoch": 864} {"train_loss": -10.024559020996094, "global_step": 145182, "epoch": 864} {"train_loss": -10.584056854248047, "global_step": 145183, "epoch": 864} {"train_loss": -10.310995101928711, "global_step": 145184, "epoch": 864} {"train_loss": -10.77674674987793, "global_step": 145185, "epoch": 864} {"train_loss": -10.965740203857422, "global_step": 145186, "epoch": 864} {"train_loss": -10.65666389465332, "global_step": 145187, "epoch": 864} {"train_loss": -10.827442169189453, "global_step": 145188, "epoch": 864} {"train_loss": -10.320560455322266, "global_step": 145189, "epoch": 864} {"train_loss": -10.603599548339844, "global_step": 145190, "epoch": 864} {"train_loss": -10.78293228149414, "global_step": 145191, "epoch": 864} {"train_loss": -10.37544059753418, "global_step": 145192, "epoch": 864} {"train_loss": -10.662250518798828, "global_step": 145193, "epoch": 864} {"train_loss": -10.576507568359375, "global_step": 145194, "epoch": 864} {"train_loss": -10.906839370727539, "global_step": 145195, "epoch": 864} {"train_loss": -10.262018203735352, "global_step": 145196, "epoch": 864} {"train_loss": -10.52386474609375, "global_step": 145197, "epoch": 864} {"train_loss": -10.118053436279297, "global_step": 145198, "epoch": 864} {"train_loss": -10.486984252929688, "global_step": 145199, "epoch": 864} {"train_loss": -10.543206214904785, "global_step": 145200, "epoch": 864} {"train_loss": -10.339601516723633, "global_step": 145201, "epoch": 864} {"train_loss": -10.145098686218262, "global_step": 145202, "epoch": 864} {"train_loss": -10.26053237915039, "global_step": 145203, "epoch": 864} {"train_loss": -10.448220252990723, "global_step": 145204, "epoch": 864} {"train_loss": -10.782222747802734, "global_step": 145205, "epoch": 864} {"train_loss": -10.392507553100586, "global_step": 145206, "epoch": 864} {"train_loss": -10.321795463562012, "global_step": 145207, "epoch": 864} {"train_loss": -10.343123435974121, "global_step": 145208, "epoch": 864} {"train_loss": -10.252246856689453, "global_step": 145209, "epoch": 864} {"train_loss": -10.430330276489258, "global_step": 145210, "epoch": 864} {"train_loss": -9.889932632446289, "global_step": 145211, "epoch": 864} {"train_loss": -10.520922660827637, "global_step": 145212, "epoch": 864} {"train_loss": -10.164359092712402, "global_step": 145213, "epoch": 864} {"train_loss": -10.364349365234375, "global_step": 145214, "epoch": 864} {"train_loss": -10.266677856445312, "global_step": 145215, "epoch": 864} {"train_loss": -10.598793029785156, "global_step": 145216, "epoch": 864} {"train_loss": -10.059487342834473, "global_step": 145217, "epoch": 864} {"train_loss": -10.32253646850586, "global_step": 145218, "epoch": 864} {"train_loss": -10.052217483520508, "global_step": 145219, "epoch": 864} {"train_loss": -10.453446388244629, "global_step": 145220, "epoch": 864} {"train_loss": -10.2879056930542, "global_step": 145221, "epoch": 864} {"train_loss": -10.040544509887695, "global_step": 145222, "epoch": 864} {"train_loss": -10.379676818847656, "global_step": 145223, "epoch": 864} {"train_loss": -10.61391830444336, "global_step": 145224, "epoch": 864} {"train_loss": -10.550987243652344, "global_step": 145225, "epoch": 864} {"train_loss": -10.527250289916992, "global_step": 145226, "epoch": 864} {"train_loss": -10.41478157043457, "global_step": 145227, "epoch": 864} {"train_loss": -10.583169937133789, "global_step": 145228, "epoch": 864} {"train_loss": -10.376640319824219, "global_step": 145229, "epoch": 864} {"train_loss": -10.540887832641602, "global_step": 145230, "epoch": 864} {"train_loss": -10.516571044921875, "global_step": 145231, "epoch": 864} {"train_loss": -10.663381576538086, "global_step": 145232, "epoch": 864} {"train_loss": -10.530329704284668, "global_step": 145233, "epoch": 864} {"train_loss": -10.564634323120117, "global_step": 145234, "epoch": 864} {"train_loss": -10.577781677246094, "global_step": 145235, "epoch": 864} {"train_loss": -10.604104995727539, "global_step": 145236, "epoch": 864} {"train_loss": -10.60610580444336, "global_step": 145237, "epoch": 864} {"train_loss": -10.654935836791992, "global_step": 145238, "epoch": 864} {"train_loss": -10.879232406616211, "global_step": 145239, "epoch": 864} {"train_loss": -10.681726455688477, "global_step": 145240, "epoch": 864} {"train_loss": -10.751768112182617, "global_step": 145241, "epoch": 864} {"train_loss": -10.565698623657227, "global_step": 145242, "epoch": 864} {"train_loss": -10.574697494506836, "global_step": 145243, "epoch": 864} {"train_loss": -10.769508361816406, "global_step": 145244, "epoch": 864} {"train_loss": -10.702128410339355, "global_step": 145245, "epoch": 864} {"train_loss": -10.530623435974121, "global_step": 145246, "epoch": 864} {"train_loss": -10.684917449951172, "global_step": 145247, "epoch": 864} {"train_loss": -10.485288619995117, "global_step": 145248, "epoch": 864} {"train_loss": -10.679325103759766, "global_step": 145249, "epoch": 864} {"train_loss": -10.545858383178711, "global_step": 145250, "epoch": 864} {"train_loss": -10.8893404006958, "global_step": 145251, "epoch": 864} {"train_loss": -10.840864181518555, "global_step": 145252, "epoch": 864} {"train_loss": -10.836697578430176, "global_step": 145253, "epoch": 864} {"train_loss": -10.740779876708984, "global_step": 145254, "epoch": 864} {"train_loss": -10.555015563964844, "global_step": 145255, "epoch": 864} {"train_loss": -10.78421401977539, "global_step": 145256, "epoch": 864} {"train_loss": -10.574729919433594, "global_step": 145257, "epoch": 864} {"train_loss": -10.804004669189453, "global_step": 145258, "epoch": 864} {"train_loss": -10.633222579956055, "global_step": 145259, "epoch": 864} {"train_loss": -10.731077194213867, "global_step": 145260, "epoch": 864} {"train_loss": -10.772974967956543, "global_step": 145261, "epoch": 864} {"train_loss": -10.944839477539062, "global_step": 145262, "epoch": 864} {"train_loss": -10.538558959960938, "global_step": 145263, "epoch": 864} {"train_loss": -10.350046157836914, "global_step": 145264, "epoch": 864} {"train_loss": -10.440008163452148, "global_step": 145265, "epoch": 864} {"train_loss": -10.45660400390625, "global_step": 145266, "epoch": 864} {"train_loss": -10.49370288848877, "global_step": 145267, "epoch": 864} {"train_loss": -10.315170288085938, "global_step": 145268, "epoch": 864} {"train_loss": -10.434133529663086, "global_step": 145269, "epoch": 864} {"train_loss": -10.089726448059082, "global_step": 145270, "epoch": 864} {"train_loss": -10.208419799804688, "global_step": 145271, "epoch": 864} {"train_loss": -10.533234596252441, "global_step": 145272, "epoch": 864} {"train_loss": -10.432280540466309, "global_step": 145273, "epoch": 864} {"train_loss": -10.425847053527832, "global_step": 145274, "epoch": 864} {"train_loss": -10.158880233764648, "global_step": 145275, "epoch": 864} {"train_loss": -10.04025936126709, "global_step": 145276, "epoch": 864} {"train_loss": -9.99267578125, "global_step": 145277, "epoch": 864} {"train_loss": -10.629210472106934, "global_step": 145278, "epoch": 864} {"train_loss": -10.389877319335938, "global_step": 145279, "epoch": 864} {"train_loss": -10.43843936920166, "global_step": 145280, "epoch": 864} {"train_loss": -10.283590316772461, "global_step": 145281, "epoch": 864} {"train_loss": -10.794242858886719, "global_step": 145282, "epoch": 864} {"train_loss": -10.361205101013184, "global_step": 145283, "epoch": 864} {"train_loss": -10.494847297668457, "global_step": 145284, "epoch": 864} {"train_loss": -10.410691261291504, "global_step": 145285, "epoch": 864} {"train_loss": -10.71970272064209, "global_step": 145286, "epoch": 864} {"train_loss": -10.444461822509766, "global_step": 145287, "epoch": 864} {"train_loss": -10.461625099182129, "global_step": 145288, "epoch": 864} {"train_loss": -10.424966812133789, "global_step": 145289, "epoch": 864} {"train_loss": -10.633129119873047, "global_step": 145290, "epoch": 864} {"train_loss": -10.685945510864258, "global_step": 145291, "epoch": 864} {"train_loss": -10.429311752319336, "global_step": 145292, "epoch": 864} {"train_loss": -10.619277954101562, "global_step": 145293, "epoch": 864} {"train_loss": -10.563294410705566, "global_step": 145294, "epoch": 864} {"train_loss": -10.382494926452637, "global_step": 145295, "epoch": 864} {"train_loss": -10.787859916687012, "global_step": 145296, "epoch": 864} {"train_loss": -10.725661277770996, "global_step": 145297, "epoch": 864} {"train_loss": -10.664854049682617, "global_step": 145298, "epoch": 864} {"train_loss": -10.889339447021484, "global_step": 145299, "epoch": 864} {"train_loss": -10.858226776123047, "global_step": 145300, "epoch": 864} {"train_loss": -10.858932495117188, "global_step": 145301, "epoch": 864} {"train_loss": -10.869362831115723, "global_step": 145302, "epoch": 864} {"train_loss": -10.847199440002441, "global_step": 145303, "epoch": 864} {"train_loss": -10.816595077514648, "global_step": 145304, "epoch": 864} {"train_loss": -10.950819969177246, "global_step": 145305, "epoch": 864} {"train_loss": -10.712483406066895, "global_step": 145306, "epoch": 864} {"train_loss": -10.928747177124023, "global_step": 145307, "epoch": 864} {"train_loss": -10.72974967956543, "global_step": 145308, "epoch": 864} {"train_loss": -10.335994720458984, "global_step": 145309, "epoch": 864} {"train_loss": -10.707284927368164, "global_step": 145310, "epoch": 864} {"train_loss": -10.400888442993164, "global_step": 145311, "epoch": 864} {"train_loss": -10.417306900024414, "global_step": 145312, "epoch": 864} {"train_loss": -10.660982131958008, "global_step": 145313, "epoch": 864} {"train_loss": -10.553382873535156, "global_step": 145314, "epoch": 864} {"train_loss": -10.923837661743164, "global_step": 145315, "epoch": 864} {"train_loss": -10.698877334594727, "global_step": 145316, "epoch": 864} {"train_loss": -10.615760803222656, "global_step": 145317, "epoch": 864} {"train_loss": -10.701505661010742, "global_step": 145318, "epoch": 864} {"train_loss": -10.562835176785788, "global_step": 145319, "epoch": 864, "val_loss": 228662.953125} {"train_loss": -10.614374160766602, "global_step": 145320, "epoch": 865} {"train_loss": -10.545859336853027, "global_step": 145321, "epoch": 865} {"train_loss": -10.594359397888184, "global_step": 145322, "epoch": 865} {"train_loss": -10.803075790405273, "global_step": 145323, "epoch": 865} {"train_loss": -11.04160213470459, "global_step": 145324, "epoch": 865} {"train_loss": -10.478322982788086, "global_step": 145325, "epoch": 865} {"train_loss": -10.813647270202637, "global_step": 145326, "epoch": 865} {"train_loss": -10.871789932250977, "global_step": 145327, "epoch": 865} {"train_loss": -10.758523941040039, "global_step": 145328, "epoch": 865} {"train_loss": -11.083523750305176, "global_step": 145329, "epoch": 865} {"train_loss": -11.05477523803711, "global_step": 145330, "epoch": 865} {"train_loss": -10.841361999511719, "global_step": 145331, "epoch": 865} {"train_loss": -10.998086929321289, "global_step": 145332, "epoch": 865} {"train_loss": -11.055140495300293, "global_step": 145333, "epoch": 865} {"train_loss": -11.148530960083008, "global_step": 145334, "epoch": 865} {"train_loss": -10.714412689208984, "global_step": 145335, "epoch": 865} {"train_loss": -10.938615798950195, "global_step": 145336, "epoch": 865} {"train_loss": -11.052267074584961, "global_step": 145337, "epoch": 865} {"train_loss": -10.882111549377441, "global_step": 145338, "epoch": 865} {"train_loss": -10.858505249023438, "global_step": 145339, "epoch": 865} {"train_loss": -10.901092529296875, "global_step": 145340, "epoch": 865} {"train_loss": -10.811141014099121, "global_step": 145341, "epoch": 865} {"train_loss": -10.853835105895996, "global_step": 145342, "epoch": 865} {"train_loss": -10.564213752746582, "global_step": 145343, "epoch": 865} {"train_loss": -10.839683532714844, "global_step": 145344, "epoch": 865} {"train_loss": -10.528173446655273, "global_step": 145345, "epoch": 865} {"train_loss": -10.552854537963867, "global_step": 145346, "epoch": 865} {"train_loss": -10.970914840698242, "global_step": 145347, "epoch": 865} {"train_loss": -9.970942497253418, "global_step": 145348, "epoch": 865} {"train_loss": -10.722625732421875, "global_step": 145349, "epoch": 865} {"train_loss": -10.003137588500977, "global_step": 145350, "epoch": 865} {"train_loss": -10.736557006835938, "global_step": 145351, "epoch": 865} {"train_loss": -10.671636581420898, "global_step": 145352, "epoch": 865} {"train_loss": -10.740331649780273, "global_step": 145353, "epoch": 865} {"train_loss": -10.546371459960938, "global_step": 145354, "epoch": 865} {"train_loss": -10.985025405883789, "global_step": 145355, "epoch": 865} {"train_loss": -10.518852233886719, "global_step": 145356, "epoch": 865} {"train_loss": -10.729716300964355, "global_step": 145357, "epoch": 865} {"train_loss": -10.892929077148438, "global_step": 145358, "epoch": 865} {"train_loss": -10.612958908081055, "global_step": 145359, "epoch": 865} {"train_loss": -10.19900894165039, "global_step": 145360, "epoch": 865} {"train_loss": -10.626321792602539, "global_step": 145361, "epoch": 865} {"train_loss": -10.725772857666016, "global_step": 145362, "epoch": 865} {"train_loss": -10.457145690917969, "global_step": 145363, "epoch": 865} {"train_loss": -10.833517074584961, "global_step": 145364, "epoch": 865} {"train_loss": -10.838995933532715, "global_step": 145365, "epoch": 865} {"train_loss": -10.610980033874512, "global_step": 145366, "epoch": 865} {"train_loss": -10.611380577087402, "global_step": 145367, "epoch": 865} {"train_loss": -10.898238182067871, "global_step": 145368, "epoch": 865} {"train_loss": -10.30483627319336, "global_step": 145369, "epoch": 865} {"train_loss": -10.722084045410156, "global_step": 145370, "epoch": 865} {"train_loss": -10.186193466186523, "global_step": 145371, "epoch": 865} {"train_loss": -10.400150299072266, "global_step": 145372, "epoch": 865} {"train_loss": -10.474822998046875, "global_step": 145373, "epoch": 865} {"train_loss": -9.85812759399414, "global_step": 145374, "epoch": 865} {"train_loss": -10.597220420837402, "global_step": 145375, "epoch": 865} {"train_loss": -10.23653793334961, "global_step": 145376, "epoch": 865} {"train_loss": -10.088981628417969, "global_step": 145377, "epoch": 865} {"train_loss": -10.225963592529297, "global_step": 145378, "epoch": 865} {"train_loss": -10.383649826049805, "global_step": 145379, "epoch": 865} {"train_loss": -10.53993034362793, "global_step": 145380, "epoch": 865} {"train_loss": -10.576435089111328, "global_step": 145381, "epoch": 865} {"train_loss": -10.200082778930664, "global_step": 145382, "epoch": 865} {"train_loss": -10.577570915222168, "global_step": 145383, "epoch": 865} {"train_loss": -10.545548439025879, "global_step": 145384, "epoch": 865} {"train_loss": -10.211169242858887, "global_step": 145385, "epoch": 865} {"train_loss": -10.728193283081055, "global_step": 145386, "epoch": 865} {"train_loss": -10.519397735595703, "global_step": 145387, "epoch": 865} {"train_loss": -10.718618392944336, "global_step": 145388, "epoch": 865} {"train_loss": -10.681974411010742, "global_step": 145389, "epoch": 865} {"train_loss": -10.652190208435059, "global_step": 145390, "epoch": 865} {"train_loss": -10.635663986206055, "global_step": 145391, "epoch": 865} {"train_loss": -10.61029052734375, "global_step": 145392, "epoch": 865} {"train_loss": -10.67713737487793, "global_step": 145393, "epoch": 865} {"train_loss": -10.614437103271484, "global_step": 145394, "epoch": 865} {"train_loss": -10.790759086608887, "global_step": 145395, "epoch": 865} {"train_loss": -10.48484992980957, "global_step": 145396, "epoch": 865} {"train_loss": -10.71611499786377, "global_step": 145397, "epoch": 865} {"train_loss": -10.291216850280762, "global_step": 145398, "epoch": 865} {"train_loss": -10.510139465332031, "global_step": 145399, "epoch": 865} {"train_loss": -9.77072525024414, "global_step": 145400, "epoch": 865} {"train_loss": -10.491687774658203, "global_step": 145401, "epoch": 865} {"train_loss": -10.266336441040039, "global_step": 145402, "epoch": 865} {"train_loss": -9.981121063232422, "global_step": 145403, "epoch": 865} {"train_loss": -10.452560424804688, "global_step": 145404, "epoch": 865} {"train_loss": -10.33049488067627, "global_step": 145405, "epoch": 865} {"train_loss": -10.077096939086914, "global_step": 145406, "epoch": 865} {"train_loss": -10.564796447753906, "global_step": 145407, "epoch": 865} {"train_loss": -10.05502986907959, "global_step": 145408, "epoch": 865} {"train_loss": -10.045347213745117, "global_step": 145409, "epoch": 865} {"train_loss": -10.284805297851562, "global_step": 145410, "epoch": 865} {"train_loss": -10.346759796142578, "global_step": 145411, "epoch": 865} {"train_loss": -10.20521068572998, "global_step": 145412, "epoch": 865} {"train_loss": -10.405945777893066, "global_step": 145413, "epoch": 865} {"train_loss": -10.41479778289795, "global_step": 145414, "epoch": 865} {"train_loss": -10.404258728027344, "global_step": 145415, "epoch": 865} {"train_loss": -10.588724136352539, "global_step": 145416, "epoch": 865} {"train_loss": -10.384857177734375, "global_step": 145417, "epoch": 865} {"train_loss": -10.512197494506836, "global_step": 145418, "epoch": 865} {"train_loss": -10.620672225952148, "global_step": 145419, "epoch": 865} {"train_loss": -10.451188087463379, "global_step": 145420, "epoch": 865} {"train_loss": -10.733634948730469, "global_step": 145421, "epoch": 865} {"train_loss": -10.584519386291504, "global_step": 145422, "epoch": 865} {"train_loss": -10.426228523254395, "global_step": 145423, "epoch": 865} {"train_loss": -10.613853454589844, "global_step": 145424, "epoch": 865} {"train_loss": -10.863306045532227, "global_step": 145425, "epoch": 865} {"train_loss": -10.607699394226074, "global_step": 145426, "epoch": 865} {"train_loss": -10.631402969360352, "global_step": 145427, "epoch": 865} {"train_loss": -10.81339168548584, "global_step": 145428, "epoch": 865} {"train_loss": -10.922252655029297, "global_step": 145429, "epoch": 865} {"train_loss": -10.510108947753906, "global_step": 145430, "epoch": 865} {"train_loss": -10.89889144897461, "global_step": 145431, "epoch": 865} {"train_loss": -10.766571044921875, "global_step": 145432, "epoch": 865} {"train_loss": -10.827580451965332, "global_step": 145433, "epoch": 865} {"train_loss": -10.773855209350586, "global_step": 145434, "epoch": 865} {"train_loss": -10.906024932861328, "global_step": 145435, "epoch": 865} {"train_loss": -10.633295059204102, "global_step": 145436, "epoch": 865} {"train_loss": -10.962721824645996, "global_step": 145437, "epoch": 865} {"train_loss": -10.641036987304688, "global_step": 145438, "epoch": 865} {"train_loss": -10.841596603393555, "global_step": 145439, "epoch": 865} {"train_loss": -10.943431854248047, "global_step": 145440, "epoch": 865} {"train_loss": -10.733842849731445, "global_step": 145441, "epoch": 865} {"train_loss": -11.023099899291992, "global_step": 145442, "epoch": 865} {"train_loss": -11.11645793914795, "global_step": 145443, "epoch": 865} {"train_loss": -10.843314170837402, "global_step": 145444, "epoch": 865} {"train_loss": -10.877958297729492, "global_step": 145445, "epoch": 865} {"train_loss": -10.957703590393066, "global_step": 145446, "epoch": 865} {"train_loss": -10.771489143371582, "global_step": 145447, "epoch": 865} {"train_loss": -10.810461044311523, "global_step": 145448, "epoch": 865} {"train_loss": -10.854758262634277, "global_step": 145449, "epoch": 865} {"train_loss": -10.981832504272461, "global_step": 145450, "epoch": 865} {"train_loss": -10.79571533203125, "global_step": 145451, "epoch": 865} {"train_loss": -11.129476547241211, "global_step": 145452, "epoch": 865} {"train_loss": -10.938175201416016, "global_step": 145453, "epoch": 865} {"train_loss": -10.846162796020508, "global_step": 145454, "epoch": 865} {"train_loss": -11.0652494430542, "global_step": 145455, "epoch": 865} {"train_loss": -10.314477920532227, "global_step": 145456, "epoch": 865} {"train_loss": -10.549806594848633, "global_step": 145457, "epoch": 865} {"train_loss": -10.65390682220459, "global_step": 145458, "epoch": 865} {"train_loss": -10.712979316711426, "global_step": 145459, "epoch": 865} {"train_loss": -10.945234298706055, "global_step": 145460, "epoch": 865} {"train_loss": -10.6741304397583, "global_step": 145461, "epoch": 865} {"train_loss": -10.66789436340332, "global_step": 145462, "epoch": 865} {"train_loss": -11.109611511230469, "global_step": 145463, "epoch": 865} {"train_loss": -10.622185707092285, "global_step": 145464, "epoch": 865} {"train_loss": -10.437337875366211, "global_step": 145465, "epoch": 865} {"train_loss": -10.479960441589355, "global_step": 145466, "epoch": 865} {"train_loss": -9.534021377563477, "global_step": 145467, "epoch": 865} {"train_loss": -10.13180160522461, "global_step": 145468, "epoch": 865} {"train_loss": -10.73975658416748, "global_step": 145469, "epoch": 865} {"train_loss": -10.524589538574219, "global_step": 145470, "epoch": 865} {"train_loss": -10.067346572875977, "global_step": 145471, "epoch": 865} {"train_loss": -9.83773136138916, "global_step": 145472, "epoch": 865} {"train_loss": -10.992450714111328, "global_step": 145473, "epoch": 865} {"train_loss": -9.66619873046875, "global_step": 145474, "epoch": 865} {"train_loss": -10.550687789916992, "global_step": 145475, "epoch": 865} {"train_loss": -9.686602592468262, "global_step": 145476, "epoch": 865} {"train_loss": -9.968910217285156, "global_step": 145477, "epoch": 865} {"train_loss": -10.630794525146484, "global_step": 145478, "epoch": 865} {"train_loss": -9.845537185668945, "global_step": 145479, "epoch": 865} {"train_loss": -10.231433868408203, "global_step": 145480, "epoch": 865} {"train_loss": -10.178504943847656, "global_step": 145481, "epoch": 865} {"train_loss": -10.34596061706543, "global_step": 145482, "epoch": 865} {"train_loss": -10.414976119995117, "global_step": 145483, "epoch": 865} {"train_loss": -9.777002334594727, "global_step": 145484, "epoch": 865} {"train_loss": -10.875045776367188, "global_step": 145485, "epoch": 865} {"train_loss": -10.688359260559082, "global_step": 145486, "epoch": 865} {"train_loss": -10.584325029736473, "global_step": 145487, "epoch": 865, "val_loss": 224064.265625, "train_action_mse_error": 1.995357871055603} {"train_loss": -10.623907089233398, "global_step": 145488, "epoch": 866} {"train_loss": -10.080792427062988, "global_step": 145489, "epoch": 866} {"train_loss": -10.738874435424805, "global_step": 145490, "epoch": 866} {"train_loss": -10.470474243164062, "global_step": 145491, "epoch": 866} {"train_loss": -10.470492362976074, "global_step": 145492, "epoch": 866} {"train_loss": -10.560314178466797, "global_step": 145493, "epoch": 866} {"train_loss": -10.440881729125977, "global_step": 145494, "epoch": 866} {"train_loss": -10.524410247802734, "global_step": 145495, "epoch": 866} {"train_loss": -10.623943328857422, "global_step": 145496, "epoch": 866} {"train_loss": -10.621620178222656, "global_step": 145497, "epoch": 866} {"train_loss": -10.36082649230957, "global_step": 145498, "epoch": 866} {"train_loss": -10.449934005737305, "global_step": 145499, "epoch": 866} {"train_loss": -10.187697410583496, "global_step": 145500, "epoch": 866} {"train_loss": -10.295616149902344, "global_step": 145501, "epoch": 866} {"train_loss": -10.230546951293945, "global_step": 145502, "epoch": 866} {"train_loss": -10.724620819091797, "global_step": 145503, "epoch": 866} {"train_loss": -10.830835342407227, "global_step": 145504, "epoch": 866} {"train_loss": -10.76089096069336, "global_step": 145505, "epoch": 866} {"train_loss": -10.782179832458496, "global_step": 145506, "epoch": 866} {"train_loss": -10.812763214111328, "global_step": 145507, "epoch": 866} {"train_loss": -10.560505867004395, "global_step": 145508, "epoch": 866} {"train_loss": -10.870904922485352, "global_step": 145509, "epoch": 866} {"train_loss": -10.783944129943848, "global_step": 145510, "epoch": 866} {"train_loss": -10.783319473266602, "global_step": 145511, "epoch": 866} {"train_loss": -10.690990447998047, "global_step": 145512, "epoch": 866} {"train_loss": -10.805608749389648, "global_step": 145513, "epoch": 866} {"train_loss": -10.70503044128418, "global_step": 145514, "epoch": 866} {"train_loss": -10.463348388671875, "global_step": 145515, "epoch": 866} {"train_loss": -10.73304557800293, "global_step": 145516, "epoch": 866} {"train_loss": -10.608377456665039, "global_step": 145517, "epoch": 866} {"train_loss": -10.917692184448242, "global_step": 145518, "epoch": 866} {"train_loss": -10.139703750610352, "global_step": 145519, "epoch": 866} {"train_loss": -10.74216079711914, "global_step": 145520, "epoch": 866} {"train_loss": -10.318147659301758, "global_step": 145521, "epoch": 866} {"train_loss": -10.751843452453613, "global_step": 145522, "epoch": 866} {"train_loss": -10.361413955688477, "global_step": 145523, "epoch": 866} {"train_loss": -10.31410026550293, "global_step": 145524, "epoch": 866} {"train_loss": -10.462240219116211, "global_step": 145525, "epoch": 866} {"train_loss": -9.694926261901855, "global_step": 145526, "epoch": 866} {"train_loss": -10.437131881713867, "global_step": 145527, "epoch": 866} {"train_loss": -9.785360336303711, "global_step": 145528, "epoch": 866} {"train_loss": -10.342026710510254, "global_step": 145529, "epoch": 866} {"train_loss": -10.257568359375, "global_step": 145530, "epoch": 866} {"train_loss": -10.372629165649414, "global_step": 145531, "epoch": 866} {"train_loss": -10.201292991638184, "global_step": 145532, "epoch": 866} {"train_loss": -10.743285179138184, "global_step": 145533, "epoch": 866} {"train_loss": -10.187385559082031, "global_step": 145534, "epoch": 866} {"train_loss": -10.330883026123047, "global_step": 145535, "epoch": 866} {"train_loss": -10.319738388061523, "global_step": 145536, "epoch": 866} {"train_loss": -10.30018138885498, "global_step": 145537, "epoch": 866} {"train_loss": -9.992057800292969, "global_step": 145538, "epoch": 866} {"train_loss": -10.526176452636719, "global_step": 145539, "epoch": 866} {"train_loss": -10.279376983642578, "global_step": 145540, "epoch": 866} {"train_loss": -10.622368812561035, "global_step": 145541, "epoch": 866} {"train_loss": -10.543964385986328, "global_step": 145542, "epoch": 866} {"train_loss": -10.566137313842773, "global_step": 145543, "epoch": 866} {"train_loss": -10.457381248474121, "global_step": 145544, "epoch": 866} {"train_loss": -10.494437217712402, "global_step": 145545, "epoch": 866} {"train_loss": -10.616863250732422, "global_step": 145546, "epoch": 866} {"train_loss": -10.579354286193848, "global_step": 145547, "epoch": 866} {"train_loss": -10.112160682678223, "global_step": 145548, "epoch": 866} {"train_loss": -10.394725799560547, "global_step": 145549, "epoch": 866} {"train_loss": -10.447622299194336, "global_step": 145550, "epoch": 866} {"train_loss": -10.551058769226074, "global_step": 145551, "epoch": 866} {"train_loss": -10.448230743408203, "global_step": 145552, "epoch": 866} {"train_loss": -10.12451171875, "global_step": 145553, "epoch": 866} {"train_loss": -10.730005264282227, "global_step": 145554, "epoch": 866} {"train_loss": -10.05821418762207, "global_step": 145555, "epoch": 866} {"train_loss": -11.008277893066406, "global_step": 145556, "epoch": 866} {"train_loss": -9.760421752929688, "global_step": 145557, "epoch": 866} {"train_loss": -10.840900421142578, "global_step": 145558, "epoch": 866} {"train_loss": -10.611238479614258, "global_step": 145559, "epoch": 866} {"train_loss": -10.31212043762207, "global_step": 145560, "epoch": 866} {"train_loss": -10.341939926147461, "global_step": 145561, "epoch": 866} {"train_loss": -10.576923370361328, "global_step": 145562, "epoch": 866} {"train_loss": -10.836384773254395, "global_step": 145563, "epoch": 866} {"train_loss": -10.686981201171875, "global_step": 145564, "epoch": 866} {"train_loss": -10.736763000488281, "global_step": 145565, "epoch": 866} {"train_loss": -10.722963333129883, "global_step": 145566, "epoch": 866} {"train_loss": -10.752923011779785, "global_step": 145567, "epoch": 866} {"train_loss": -10.481797218322754, "global_step": 145568, "epoch": 866} {"train_loss": -10.772037506103516, "global_step": 145569, "epoch": 866} {"train_loss": -10.403287887573242, "global_step": 145570, "epoch": 866} {"train_loss": -10.51507568359375, "global_step": 145571, "epoch": 866} {"train_loss": -10.667465209960938, "global_step": 145572, "epoch": 866} {"train_loss": -10.946555137634277, "global_step": 145573, "epoch": 866} {"train_loss": -10.483495712280273, "global_step": 145574, "epoch": 866} {"train_loss": -10.588613510131836, "global_step": 145575, "epoch": 866} {"train_loss": -10.63554573059082, "global_step": 145576, "epoch": 866} {"train_loss": -10.991711616516113, "global_step": 145577, "epoch": 866} {"train_loss": -10.56049919128418, "global_step": 145578, "epoch": 866} {"train_loss": -10.664016723632812, "global_step": 145579, "epoch": 866} {"train_loss": -10.328649520874023, "global_step": 145580, "epoch": 866} {"train_loss": -10.617863655090332, "global_step": 145581, "epoch": 866} {"train_loss": -10.637308120727539, "global_step": 145582, "epoch": 866} {"train_loss": -10.497308731079102, "global_step": 145583, "epoch": 866} {"train_loss": -10.672887802124023, "global_step": 145584, "epoch": 866} {"train_loss": -10.961990356445312, "global_step": 145585, "epoch": 866} {"train_loss": -10.883903503417969, "global_step": 145586, "epoch": 866} {"train_loss": -10.781074523925781, "global_step": 145587, "epoch": 866} {"train_loss": -10.619623184204102, "global_step": 145588, "epoch": 866} {"train_loss": -10.52847671508789, "global_step": 145589, "epoch": 866} {"train_loss": -10.419296264648438, "global_step": 145590, "epoch": 866} {"train_loss": -10.769110679626465, "global_step": 145591, "epoch": 866} {"train_loss": -10.56087875366211, "global_step": 145592, "epoch": 866} {"train_loss": -10.873228073120117, "global_step": 145593, "epoch": 866} {"train_loss": -10.793319702148438, "global_step": 145594, "epoch": 866} {"train_loss": -10.731109619140625, "global_step": 145595, "epoch": 866} {"train_loss": -10.8699312210083, "global_step": 145596, "epoch": 866} {"train_loss": -11.025415420532227, "global_step": 145597, "epoch": 866} {"train_loss": -10.851993560791016, "global_step": 145598, "epoch": 866} {"train_loss": -10.795797348022461, "global_step": 145599, "epoch": 866} {"train_loss": -10.861474990844727, "global_step": 145600, "epoch": 866} {"train_loss": -11.165761947631836, "global_step": 145601, "epoch": 866} {"train_loss": -11.042781829833984, "global_step": 145602, "epoch": 866} {"train_loss": -11.083329200744629, "global_step": 145603, "epoch": 866} {"train_loss": -10.91390609741211, "global_step": 145604, "epoch": 866} {"train_loss": -11.16286849975586, "global_step": 145605, "epoch": 866} {"train_loss": -11.135747909545898, "global_step": 145606, "epoch": 866} {"train_loss": -10.877403259277344, "global_step": 145607, "epoch": 866} {"train_loss": -11.221175193786621, "global_step": 145608, "epoch": 866} {"train_loss": -10.854976654052734, "global_step": 145609, "epoch": 866} {"train_loss": -10.999587059020996, "global_step": 145610, "epoch": 866} {"train_loss": -10.942886352539062, "global_step": 145611, "epoch": 866} {"train_loss": -10.92924690246582, "global_step": 145612, "epoch": 866} {"train_loss": -10.832178115844727, "global_step": 145613, "epoch": 866} {"train_loss": -10.605237007141113, "global_step": 145614, "epoch": 866} {"train_loss": -10.911576271057129, "global_step": 145615, "epoch": 866} {"train_loss": -10.633262634277344, "global_step": 145616, "epoch": 866} {"train_loss": -10.662728309631348, "global_step": 145617, "epoch": 866} {"train_loss": -10.820602416992188, "global_step": 145618, "epoch": 866} {"train_loss": -10.450189590454102, "global_step": 145619, "epoch": 866} {"train_loss": -10.989753723144531, "global_step": 145620, "epoch": 866} {"train_loss": -10.607391357421875, "global_step": 145621, "epoch": 866} {"train_loss": -10.48192024230957, "global_step": 145622, "epoch": 866} {"train_loss": -10.584561347961426, "global_step": 145623, "epoch": 866} {"train_loss": -10.544126510620117, "global_step": 145624, "epoch": 866} {"train_loss": -10.257909774780273, "global_step": 145625, "epoch": 866} {"train_loss": -10.625616073608398, "global_step": 145626, "epoch": 866} {"train_loss": -10.680318832397461, "global_step": 145627, "epoch": 866} {"train_loss": -10.533300399780273, "global_step": 145628, "epoch": 866} {"train_loss": -10.4054594039917, "global_step": 145629, "epoch": 866} {"train_loss": -10.128284454345703, "global_step": 145630, "epoch": 866} {"train_loss": -10.162187576293945, "global_step": 145631, "epoch": 866} {"train_loss": -10.017659187316895, "global_step": 145632, "epoch": 866} {"train_loss": -10.51579475402832, "global_step": 145633, "epoch": 866} {"train_loss": -10.503457069396973, "global_step": 145634, "epoch": 866} {"train_loss": -9.886293411254883, "global_step": 145635, "epoch": 866} {"train_loss": -10.02221393585205, "global_step": 145636, "epoch": 866} {"train_loss": -9.462955474853516, "global_step": 145637, "epoch": 866} {"train_loss": -10.37065315246582, "global_step": 145638, "epoch": 866} {"train_loss": -9.809343338012695, "global_step": 145639, "epoch": 866} {"train_loss": -10.473583221435547, "global_step": 145640, "epoch": 866} {"train_loss": -9.821281433105469, "global_step": 145641, "epoch": 866} {"train_loss": -10.485107421875, "global_step": 145642, "epoch": 866} {"train_loss": -9.974370002746582, "global_step": 145643, "epoch": 866} {"train_loss": -10.651469230651855, "global_step": 145644, "epoch": 866} {"train_loss": -10.237183570861816, "global_step": 145645, "epoch": 866} {"train_loss": -10.829565048217773, "global_step": 145646, "epoch": 866} {"train_loss": -10.298110961914062, "global_step": 145647, "epoch": 866} {"train_loss": -10.656843185424805, "global_step": 145648, "epoch": 866} {"train_loss": -10.25042724609375, "global_step": 145649, "epoch": 866} {"train_loss": -10.670525550842285, "global_step": 145650, "epoch": 866} {"train_loss": -10.214120864868164, "global_step": 145651, "epoch": 866} {"train_loss": -10.531363487243652, "global_step": 145652, "epoch": 866} {"train_loss": -9.950065612792969, "global_step": 145653, "epoch": 866} {"train_loss": -10.498296737670898, "global_step": 145654, "epoch": 866} {"train_loss": -10.546189018658229, "global_step": 145655, "epoch": 866, "val_loss": 228362.109375} {"train_loss": -9.993345260620117, "global_step": 145656, "epoch": 867} {"train_loss": -10.375970840454102, "global_step": 145657, "epoch": 867} {"train_loss": -10.320363998413086, "global_step": 145658, "epoch": 867} {"train_loss": -10.492643356323242, "global_step": 145659, "epoch": 867} {"train_loss": -10.603504180908203, "global_step": 145660, "epoch": 867} {"train_loss": -10.542892456054688, "global_step": 145661, "epoch": 867} {"train_loss": -10.453569412231445, "global_step": 145662, "epoch": 867} {"train_loss": -10.482831954956055, "global_step": 145663, "epoch": 867} {"train_loss": -10.400505065917969, "global_step": 145664, "epoch": 867} {"train_loss": -10.513187408447266, "global_step": 145665, "epoch": 867} {"train_loss": -10.622015953063965, "global_step": 145666, "epoch": 867} {"train_loss": -10.592094421386719, "global_step": 145667, "epoch": 867} {"train_loss": -10.582974433898926, "global_step": 145668, "epoch": 867} {"train_loss": -10.526433944702148, "global_step": 145669, "epoch": 867} {"train_loss": -10.820720672607422, "global_step": 145670, "epoch": 867} {"train_loss": -10.637287139892578, "global_step": 145671, "epoch": 867} {"train_loss": -10.676237106323242, "global_step": 145672, "epoch": 867} {"train_loss": -10.773735046386719, "global_step": 145673, "epoch": 867} {"train_loss": -10.71065616607666, "global_step": 145674, "epoch": 867} {"train_loss": -10.654003143310547, "global_step": 145675, "epoch": 867} {"train_loss": -10.719776153564453, "global_step": 145676, "epoch": 867} {"train_loss": -10.815979957580566, "global_step": 145677, "epoch": 867} {"train_loss": -10.411970138549805, "global_step": 145678, "epoch": 867} {"train_loss": -10.861769676208496, "global_step": 145679, "epoch": 867} {"train_loss": -10.797447204589844, "global_step": 145680, "epoch": 867} {"train_loss": -10.81974983215332, "global_step": 145681, "epoch": 867} {"train_loss": -10.786502838134766, "global_step": 145682, "epoch": 867} {"train_loss": -10.734169960021973, "global_step": 145683, "epoch": 867} {"train_loss": -10.790849685668945, "global_step": 145684, "epoch": 867} {"train_loss": -10.838662147521973, "global_step": 145685, "epoch": 867} {"train_loss": -10.576044082641602, "global_step": 145686, "epoch": 867} {"train_loss": -10.864002227783203, "global_step": 145687, "epoch": 867} {"train_loss": -11.04289436340332, "global_step": 145688, "epoch": 867} {"train_loss": -10.848785400390625, "global_step": 145689, "epoch": 867} {"train_loss": -10.86536979675293, "global_step": 145690, "epoch": 867} {"train_loss": -10.95539665222168, "global_step": 145691, "epoch": 867} {"train_loss": -10.691998481750488, "global_step": 145692, "epoch": 867} {"train_loss": -10.661523818969727, "global_step": 145693, "epoch": 867} {"train_loss": -10.791553497314453, "global_step": 145694, "epoch": 867} {"train_loss": -10.944847106933594, "global_step": 145695, "epoch": 867} {"train_loss": -10.892168045043945, "global_step": 145696, "epoch": 867} {"train_loss": -10.737470626831055, "global_step": 145697, "epoch": 867} {"train_loss": -10.972347259521484, "global_step": 145698, "epoch": 867} {"train_loss": -10.876365661621094, "global_step": 145699, "epoch": 867} {"train_loss": -10.889434814453125, "global_step": 145700, "epoch": 867} {"train_loss": -10.68156623840332, "global_step": 145701, "epoch": 867} {"train_loss": -10.873483657836914, "global_step": 145702, "epoch": 867} {"train_loss": -10.469157218933105, "global_step": 145703, "epoch": 867} {"train_loss": -10.44387435913086, "global_step": 145704, "epoch": 867} {"train_loss": -10.357173919677734, "global_step": 145705, "epoch": 867} {"train_loss": -11.032892227172852, "global_step": 145706, "epoch": 867} {"train_loss": -10.213201522827148, "global_step": 145707, "epoch": 867} {"train_loss": -9.530248641967773, "global_step": 145708, "epoch": 867} {"train_loss": -8.924337387084961, "global_step": 145709, "epoch": 867} {"train_loss": -10.815376281738281, "global_step": 145710, "epoch": 867} {"train_loss": -8.983028411865234, "global_step": 145711, "epoch": 867} {"train_loss": -10.09164810180664, "global_step": 145712, "epoch": 867} {"train_loss": -10.01668930053711, "global_step": 145713, "epoch": 867} {"train_loss": -9.621070861816406, "global_step": 145714, "epoch": 867} {"train_loss": -9.095684051513672, "global_step": 145715, "epoch": 867} {"train_loss": -9.96966552734375, "global_step": 145716, "epoch": 867} {"train_loss": -9.491120338439941, "global_step": 145717, "epoch": 867} {"train_loss": -9.197240829467773, "global_step": 145718, "epoch": 867} {"train_loss": -10.5288667678833, "global_step": 145719, "epoch": 867} {"train_loss": -9.432421684265137, "global_step": 145720, "epoch": 867} {"train_loss": -10.011699676513672, "global_step": 145721, "epoch": 867} {"train_loss": -10.03271770477295, "global_step": 145722, "epoch": 867} {"train_loss": -9.906294822692871, "global_step": 145723, "epoch": 867} {"train_loss": -10.174661636352539, "global_step": 145724, "epoch": 867} {"train_loss": -10.368322372436523, "global_step": 145725, "epoch": 867} {"train_loss": -10.141914367675781, "global_step": 145726, "epoch": 867} {"train_loss": -9.913585662841797, "global_step": 145727, "epoch": 867} {"train_loss": -10.467992782592773, "global_step": 145728, "epoch": 867} {"train_loss": -10.174495697021484, "global_step": 145729, "epoch": 867} {"train_loss": -9.826009750366211, "global_step": 145730, "epoch": 867} {"train_loss": -10.41262149810791, "global_step": 145731, "epoch": 867} {"train_loss": -10.266165733337402, "global_step": 145732, "epoch": 867} {"train_loss": -10.099684715270996, "global_step": 145733, "epoch": 867} {"train_loss": -10.363300323486328, "global_step": 145734, "epoch": 867} {"train_loss": -10.368138313293457, "global_step": 145735, "epoch": 867} {"train_loss": -10.238541603088379, "global_step": 145736, "epoch": 867} {"train_loss": -10.417083740234375, "global_step": 145737, "epoch": 867} {"train_loss": -10.76328182220459, "global_step": 145738, "epoch": 867} {"train_loss": -10.573497772216797, "global_step": 145739, "epoch": 867} {"train_loss": -10.43606948852539, "global_step": 145740, "epoch": 867} {"train_loss": -10.207691192626953, "global_step": 145741, "epoch": 867} {"train_loss": -10.430886268615723, "global_step": 145742, "epoch": 867} {"train_loss": -10.512096405029297, "global_step": 145743, "epoch": 867} {"train_loss": -10.403894424438477, "global_step": 145744, "epoch": 867} {"train_loss": -10.456766128540039, "global_step": 145745, "epoch": 867} {"train_loss": -10.515630722045898, "global_step": 145746, "epoch": 867} {"train_loss": -10.37027359008789, "global_step": 145747, "epoch": 867} {"train_loss": -10.494356155395508, "global_step": 145748, "epoch": 867} {"train_loss": -10.414379119873047, "global_step": 145749, "epoch": 867} {"train_loss": -10.561843872070312, "global_step": 145750, "epoch": 867} {"train_loss": -10.519189834594727, "global_step": 145751, "epoch": 867} {"train_loss": -10.710466384887695, "global_step": 145752, "epoch": 867} {"train_loss": -10.601594924926758, "global_step": 145753, "epoch": 867} {"train_loss": -10.626749992370605, "global_step": 145754, "epoch": 867} {"train_loss": -10.558279037475586, "global_step": 145755, "epoch": 867} {"train_loss": -10.769464492797852, "global_step": 145756, "epoch": 867} {"train_loss": -10.719852447509766, "global_step": 145757, "epoch": 867} {"train_loss": -10.686341285705566, "global_step": 145758, "epoch": 867} {"train_loss": -10.748581886291504, "global_step": 145759, "epoch": 867} {"train_loss": -10.783040046691895, "global_step": 145760, "epoch": 867} {"train_loss": -10.734434127807617, "global_step": 145761, "epoch": 867} {"train_loss": -10.705048561096191, "global_step": 145762, "epoch": 867} {"train_loss": -10.829202651977539, "global_step": 145763, "epoch": 867} {"train_loss": -10.544991493225098, "global_step": 145764, "epoch": 867} {"train_loss": -10.754294395446777, "global_step": 145765, "epoch": 867} {"train_loss": -10.70545768737793, "global_step": 145766, "epoch": 867} {"train_loss": -10.885215759277344, "global_step": 145767, "epoch": 867} {"train_loss": -10.450186729431152, "global_step": 145768, "epoch": 867} {"train_loss": -10.632741928100586, "global_step": 145769, "epoch": 867} {"train_loss": -10.442903518676758, "global_step": 145770, "epoch": 867} {"train_loss": -10.528907775878906, "global_step": 145771, "epoch": 867} {"train_loss": -10.825336456298828, "global_step": 145772, "epoch": 867} {"train_loss": -10.62955093383789, "global_step": 145773, "epoch": 867} {"train_loss": -10.870561599731445, "global_step": 145774, "epoch": 867} {"train_loss": -10.596247673034668, "global_step": 145775, "epoch": 867} {"train_loss": -10.8018217086792, "global_step": 145776, "epoch": 867} {"train_loss": -10.680274963378906, "global_step": 145777, "epoch": 867} {"train_loss": -10.561487197875977, "global_step": 145778, "epoch": 867} {"train_loss": -10.900081634521484, "global_step": 145779, "epoch": 867} {"train_loss": -11.03200626373291, "global_step": 145780, "epoch": 867} {"train_loss": -10.821585655212402, "global_step": 145781, "epoch": 867} {"train_loss": -10.832962036132812, "global_step": 145782, "epoch": 867} {"train_loss": -10.86903190612793, "global_step": 145783, "epoch": 867} {"train_loss": -10.809417724609375, "global_step": 145784, "epoch": 867} {"train_loss": -10.88662052154541, "global_step": 145785, "epoch": 867} {"train_loss": -10.63995361328125, "global_step": 145786, "epoch": 867} {"train_loss": -10.119657516479492, "global_step": 145787, "epoch": 867} {"train_loss": -10.469619750976562, "global_step": 145788, "epoch": 867} {"train_loss": -10.572010040283203, "global_step": 145789, "epoch": 867} {"train_loss": -10.75265121459961, "global_step": 145790, "epoch": 867} {"train_loss": -10.768386840820312, "global_step": 145791, "epoch": 867} {"train_loss": -10.520973205566406, "global_step": 145792, "epoch": 867} {"train_loss": -10.691123962402344, "global_step": 145793, "epoch": 867} {"train_loss": -10.380422592163086, "global_step": 145794, "epoch": 867} {"train_loss": -10.909152030944824, "global_step": 145795, "epoch": 867} {"train_loss": -10.621926307678223, "global_step": 145796, "epoch": 867} {"train_loss": -10.626288414001465, "global_step": 145797, "epoch": 867} {"train_loss": -10.525243759155273, "global_step": 145798, "epoch": 867} {"train_loss": -9.842060089111328, "global_step": 145799, "epoch": 867} {"train_loss": -10.936186790466309, "global_step": 145800, "epoch": 867} {"train_loss": -10.71190071105957, "global_step": 145801, "epoch": 867} {"train_loss": -10.209026336669922, "global_step": 145802, "epoch": 867} {"train_loss": -10.934094429016113, "global_step": 145803, "epoch": 867} {"train_loss": -10.660639762878418, "global_step": 145804, "epoch": 867} {"train_loss": -10.64068603515625, "global_step": 145805, "epoch": 867} {"train_loss": -9.966794967651367, "global_step": 145806, "epoch": 867} {"train_loss": -10.286867141723633, "global_step": 145807, "epoch": 867} {"train_loss": -10.574583053588867, "global_step": 145808, "epoch": 867} {"train_loss": -10.245227813720703, "global_step": 145809, "epoch": 867} {"train_loss": -10.276662826538086, "global_step": 145810, "epoch": 867} {"train_loss": -10.577371597290039, "global_step": 145811, "epoch": 867} {"train_loss": -10.590788841247559, "global_step": 145812, "epoch": 867} {"train_loss": -10.523039817810059, "global_step": 145813, "epoch": 867} {"train_loss": -10.636040687561035, "global_step": 145814, "epoch": 867} {"train_loss": -9.940343856811523, "global_step": 145815, "epoch": 867} {"train_loss": -10.517868041992188, "global_step": 145816, "epoch": 867} {"train_loss": -10.306255340576172, "global_step": 145817, "epoch": 867} {"train_loss": -9.814159393310547, "global_step": 145818, "epoch": 867} {"train_loss": -10.075803756713867, "global_step": 145819, "epoch": 867} {"train_loss": -10.529712677001953, "global_step": 145820, "epoch": 867} {"train_loss": -9.68197250366211, "global_step": 145821, "epoch": 867} {"train_loss": -10.620956420898438, "global_step": 145822, "epoch": 867} {"train_loss": -10.487381174450828, "global_step": 145823, "epoch": 867, "val_loss": 220505.578125} {"train_loss": -10.50179672241211, "global_step": 145824, "epoch": 868} {"train_loss": -10.302327156066895, "global_step": 145825, "epoch": 868} {"train_loss": -10.55252456665039, "global_step": 145826, "epoch": 868} {"train_loss": -10.115751266479492, "global_step": 145827, "epoch": 868} {"train_loss": -10.494314193725586, "global_step": 145828, "epoch": 868} {"train_loss": -10.43493938446045, "global_step": 145829, "epoch": 868} {"train_loss": -10.398048400878906, "global_step": 145830, "epoch": 868} {"train_loss": -10.234336853027344, "global_step": 145831, "epoch": 868} {"train_loss": -10.261475563049316, "global_step": 145832, "epoch": 868} {"train_loss": -10.830738067626953, "global_step": 145833, "epoch": 868} {"train_loss": -10.244078636169434, "global_step": 145834, "epoch": 868} {"train_loss": -10.535926818847656, "global_step": 145835, "epoch": 868} {"train_loss": -10.573111534118652, "global_step": 145836, "epoch": 868} {"train_loss": -10.442462921142578, "global_step": 145837, "epoch": 868} {"train_loss": -10.564603805541992, "global_step": 145838, "epoch": 868} {"train_loss": -10.676485061645508, "global_step": 145839, "epoch": 868} {"train_loss": -10.71563720703125, "global_step": 145840, "epoch": 868} {"train_loss": -10.56299877166748, "global_step": 145841, "epoch": 868} {"train_loss": -10.672632217407227, "global_step": 145842, "epoch": 868} {"train_loss": -10.15743637084961, "global_step": 145843, "epoch": 868} {"train_loss": -10.590597152709961, "global_step": 145844, "epoch": 868} {"train_loss": -10.508262634277344, "global_step": 145845, "epoch": 868} {"train_loss": -10.806121826171875, "global_step": 145846, "epoch": 868} {"train_loss": -10.449907302856445, "global_step": 145847, "epoch": 868} {"train_loss": -10.235179901123047, "global_step": 145848, "epoch": 868} {"train_loss": -10.439011573791504, "global_step": 145849, "epoch": 868} {"train_loss": -10.707491874694824, "global_step": 145850, "epoch": 868} {"train_loss": -10.525890350341797, "global_step": 145851, "epoch": 868} {"train_loss": -10.543405532836914, "global_step": 145852, "epoch": 868} {"train_loss": -10.526021003723145, "global_step": 145853, "epoch": 868} {"train_loss": -10.791204452514648, "global_step": 145854, "epoch": 868} {"train_loss": -10.568704605102539, "global_step": 145855, "epoch": 868} {"train_loss": -10.91970157623291, "global_step": 145856, "epoch": 868} {"train_loss": -10.791258811950684, "global_step": 145857, "epoch": 868} {"train_loss": -11.010725021362305, "global_step": 145858, "epoch": 868} {"train_loss": -10.698888778686523, "global_step": 145859, "epoch": 868} {"train_loss": -10.49252986907959, "global_step": 145860, "epoch": 868} {"train_loss": -10.916812896728516, "global_step": 145861, "epoch": 868} {"train_loss": -10.693158149719238, "global_step": 145862, "epoch": 868} {"train_loss": -10.94278335571289, "global_step": 145863, "epoch": 868} {"train_loss": -10.525047302246094, "global_step": 145864, "epoch": 868} {"train_loss": -10.687006950378418, "global_step": 145865, "epoch": 868} {"train_loss": -10.264528274536133, "global_step": 145866, "epoch": 868} {"train_loss": -10.771867752075195, "global_step": 145867, "epoch": 868} {"train_loss": -10.500577926635742, "global_step": 145868, "epoch": 868} {"train_loss": -10.515653610229492, "global_step": 145869, "epoch": 868} {"train_loss": -10.341290473937988, "global_step": 145870, "epoch": 868} {"train_loss": -10.602649688720703, "global_step": 145871, "epoch": 868} {"train_loss": -10.429752349853516, "global_step": 145872, "epoch": 868} {"train_loss": -10.636058807373047, "global_step": 145873, "epoch": 868} {"train_loss": -10.535710334777832, "global_step": 145874, "epoch": 868} {"train_loss": -10.728147506713867, "global_step": 145875, "epoch": 868} {"train_loss": -10.407316207885742, "global_step": 145876, "epoch": 868} {"train_loss": -10.631153106689453, "global_step": 145877, "epoch": 868} {"train_loss": -10.518489837646484, "global_step": 145878, "epoch": 868} {"train_loss": -10.522260665893555, "global_step": 145879, "epoch": 868} {"train_loss": -10.494836807250977, "global_step": 145880, "epoch": 868} {"train_loss": -10.603604316711426, "global_step": 145881, "epoch": 868} {"train_loss": -10.440034866333008, "global_step": 145882, "epoch": 868} {"train_loss": -10.542625427246094, "global_step": 145883, "epoch": 868} {"train_loss": -10.24234390258789, "global_step": 145884, "epoch": 868} {"train_loss": -10.508381843566895, "global_step": 145885, "epoch": 868} {"train_loss": -10.44867992401123, "global_step": 145886, "epoch": 868} {"train_loss": -10.302509307861328, "global_step": 145887, "epoch": 868} {"train_loss": -10.805004119873047, "global_step": 145888, "epoch": 868} {"train_loss": -9.81960678100586, "global_step": 145889, "epoch": 868} {"train_loss": -10.878202438354492, "global_step": 145890, "epoch": 868} {"train_loss": -10.445798873901367, "global_step": 145891, "epoch": 868} {"train_loss": -10.554777145385742, "global_step": 145892, "epoch": 868} {"train_loss": -10.199544906616211, "global_step": 145893, "epoch": 868} {"train_loss": -10.670015335083008, "global_step": 145894, "epoch": 868} {"train_loss": -10.29057502746582, "global_step": 145895, "epoch": 868} {"train_loss": -10.31601619720459, "global_step": 145896, "epoch": 868} {"train_loss": -10.273696899414062, "global_step": 145897, "epoch": 868} {"train_loss": -10.360215187072754, "global_step": 145898, "epoch": 868} {"train_loss": -10.51986026763916, "global_step": 145899, "epoch": 868} {"train_loss": -9.962701797485352, "global_step": 145900, "epoch": 868} {"train_loss": -10.064589500427246, "global_step": 145901, "epoch": 868} {"train_loss": -9.669297218322754, "global_step": 145902, "epoch": 868} {"train_loss": -10.394877433776855, "global_step": 145903, "epoch": 868} {"train_loss": -9.741710662841797, "global_step": 145904, "epoch": 868} {"train_loss": -10.426469802856445, "global_step": 145905, "epoch": 868} {"train_loss": -10.149316787719727, "global_step": 145906, "epoch": 868} {"train_loss": -10.14068603515625, "global_step": 145907, "epoch": 868} {"train_loss": -10.135175704956055, "global_step": 145908, "epoch": 868} {"train_loss": -10.018037796020508, "global_step": 145909, "epoch": 868} {"train_loss": -10.143543243408203, "global_step": 145910, "epoch": 868} {"train_loss": -10.159916877746582, "global_step": 145911, "epoch": 868} {"train_loss": -10.324316024780273, "global_step": 145912, "epoch": 868} {"train_loss": -9.979545593261719, "global_step": 145913, "epoch": 868} {"train_loss": -10.684308052062988, "global_step": 145914, "epoch": 868} {"train_loss": -10.215956687927246, "global_step": 145915, "epoch": 868} {"train_loss": -10.45222282409668, "global_step": 145916, "epoch": 868} {"train_loss": -10.589553833007812, "global_step": 145917, "epoch": 868} {"train_loss": -10.565433502197266, "global_step": 145918, "epoch": 868} {"train_loss": -9.910289764404297, "global_step": 145919, "epoch": 868} {"train_loss": -10.643062591552734, "global_step": 145920, "epoch": 868} {"train_loss": -10.297536849975586, "global_step": 145921, "epoch": 868} {"train_loss": -10.560357093811035, "global_step": 145922, "epoch": 868} {"train_loss": -10.461064338684082, "global_step": 145923, "epoch": 868} {"train_loss": -10.616222381591797, "global_step": 145924, "epoch": 868} {"train_loss": -10.548303604125977, "global_step": 145925, "epoch": 868} {"train_loss": -10.765841484069824, "global_step": 145926, "epoch": 868} {"train_loss": -10.426985740661621, "global_step": 145927, "epoch": 868} {"train_loss": -10.468219757080078, "global_step": 145928, "epoch": 868} {"train_loss": -10.503515243530273, "global_step": 145929, "epoch": 868} {"train_loss": -10.678693771362305, "global_step": 145930, "epoch": 868} {"train_loss": -10.474044799804688, "global_step": 145931, "epoch": 868} {"train_loss": -10.513561248779297, "global_step": 145932, "epoch": 868} {"train_loss": -10.670446395874023, "global_step": 145933, "epoch": 868} {"train_loss": -10.622062683105469, "global_step": 145934, "epoch": 868} {"train_loss": -10.749153137207031, "global_step": 145935, "epoch": 868} {"train_loss": -10.453588485717773, "global_step": 145936, "epoch": 868} {"train_loss": -10.53062629699707, "global_step": 145937, "epoch": 868} {"train_loss": -10.307794570922852, "global_step": 145938, "epoch": 868} {"train_loss": -10.79224967956543, "global_step": 145939, "epoch": 868} {"train_loss": -10.616146087646484, "global_step": 145940, "epoch": 868} {"train_loss": -10.721334457397461, "global_step": 145941, "epoch": 868} {"train_loss": -10.55160903930664, "global_step": 145942, "epoch": 868} {"train_loss": -10.570478439331055, "global_step": 145943, "epoch": 868} {"train_loss": -10.740816116333008, "global_step": 145944, "epoch": 868} {"train_loss": -10.695287704467773, "global_step": 145945, "epoch": 868} {"train_loss": -10.659927368164062, "global_step": 145946, "epoch": 868} {"train_loss": -10.730766296386719, "global_step": 145947, "epoch": 868} {"train_loss": -10.727272033691406, "global_step": 145948, "epoch": 868} {"train_loss": -10.378281593322754, "global_step": 145949, "epoch": 868} {"train_loss": -10.880008697509766, "global_step": 145950, "epoch": 868} {"train_loss": -10.65456485748291, "global_step": 145951, "epoch": 868} {"train_loss": -10.847472190856934, "global_step": 145952, "epoch": 868} {"train_loss": -10.451044082641602, "global_step": 145953, "epoch": 868} {"train_loss": -10.63731575012207, "global_step": 145954, "epoch": 868} {"train_loss": -10.550769805908203, "global_step": 145955, "epoch": 868} {"train_loss": -10.546619415283203, "global_step": 145956, "epoch": 868} {"train_loss": -10.630876541137695, "global_step": 145957, "epoch": 868} {"train_loss": -10.964042663574219, "global_step": 145958, "epoch": 868} {"train_loss": -10.758962631225586, "global_step": 145959, "epoch": 868} {"train_loss": -10.839759826660156, "global_step": 145960, "epoch": 868} {"train_loss": -11.020557403564453, "global_step": 145961, "epoch": 868} {"train_loss": -11.02403736114502, "global_step": 145962, "epoch": 868} {"train_loss": -11.045893669128418, "global_step": 145963, "epoch": 868} {"train_loss": -10.736980438232422, "global_step": 145964, "epoch": 868} {"train_loss": -10.723836898803711, "global_step": 145965, "epoch": 868} {"train_loss": -10.966068267822266, "global_step": 145966, "epoch": 868} {"train_loss": -10.606782913208008, "global_step": 145967, "epoch": 868} {"train_loss": -10.932705879211426, "global_step": 145968, "epoch": 868} {"train_loss": -11.048059463500977, "global_step": 145969, "epoch": 868} {"train_loss": -10.53924560546875, "global_step": 145970, "epoch": 868} {"train_loss": -10.60258674621582, "global_step": 145971, "epoch": 868} {"train_loss": -10.664011001586914, "global_step": 145972, "epoch": 868} {"train_loss": -10.554642677307129, "global_step": 145973, "epoch": 868} {"train_loss": -11.02519702911377, "global_step": 145974, "epoch": 868} {"train_loss": -10.79239273071289, "global_step": 145975, "epoch": 868} {"train_loss": -10.788026809692383, "global_step": 145976, "epoch": 868} {"train_loss": -10.673776626586914, "global_step": 145977, "epoch": 868} {"train_loss": -10.592580795288086, "global_step": 145978, "epoch": 868} {"train_loss": -10.675111770629883, "global_step": 145979, "epoch": 868} {"train_loss": -10.574851036071777, "global_step": 145980, "epoch": 868} {"train_loss": -10.537389755249023, "global_step": 145981, "epoch": 868} {"train_loss": -10.660282135009766, "global_step": 145982, "epoch": 868} {"train_loss": -10.860746383666992, "global_step": 145983, "epoch": 868} {"train_loss": -10.722505569458008, "global_step": 145984, "epoch": 868} {"train_loss": -10.796242713928223, "global_step": 145985, "epoch": 868} {"train_loss": -10.587945938110352, "global_step": 145986, "epoch": 868} {"train_loss": -10.573798179626465, "global_step": 145987, "epoch": 868} {"train_loss": -9.861420631408691, "global_step": 145988, "epoch": 868} {"train_loss": -10.464116096496582, "global_step": 145989, "epoch": 868} {"train_loss": -10.35651969909668, "global_step": 145990, "epoch": 868} {"train_loss": -10.536956350008646, "global_step": 145991, "epoch": 868, "val_loss": 218563.484375} {"train_loss": -10.545628547668457, "global_step": 145992, "epoch": 869} {"train_loss": -9.849066734313965, "global_step": 145993, "epoch": 869} {"train_loss": -10.145890235900879, "global_step": 145994, "epoch": 869} {"train_loss": -10.110176086425781, "global_step": 145995, "epoch": 869} {"train_loss": -10.110901832580566, "global_step": 145996, "epoch": 869} {"train_loss": -9.381269454956055, "global_step": 145997, "epoch": 869} {"train_loss": -10.51297664642334, "global_step": 145998, "epoch": 869} {"train_loss": -10.191777229309082, "global_step": 145999, "epoch": 869} {"train_loss": -10.120067596435547, "global_step": 146000, "epoch": 869} {"train_loss": -10.371672630310059, "global_step": 146001, "epoch": 869} {"train_loss": -10.357236862182617, "global_step": 146002, "epoch": 869} {"train_loss": -10.55236530303955, "global_step": 146003, "epoch": 869} {"train_loss": -10.594247817993164, "global_step": 146004, "epoch": 869} {"train_loss": -10.454607963562012, "global_step": 146005, "epoch": 869} {"train_loss": -10.604756355285645, "global_step": 146006, "epoch": 869} {"train_loss": -10.689444541931152, "global_step": 146007, "epoch": 869} {"train_loss": -10.657819747924805, "global_step": 146008, "epoch": 869} {"train_loss": -10.29733943939209, "global_step": 146009, "epoch": 869} {"train_loss": -10.6217679977417, "global_step": 146010, "epoch": 869} {"train_loss": -10.280280113220215, "global_step": 146011, "epoch": 869} {"train_loss": -10.535748481750488, "global_step": 146012, "epoch": 869} {"train_loss": -10.628610610961914, "global_step": 146013, "epoch": 869} {"train_loss": -10.47715950012207, "global_step": 146014, "epoch": 869} {"train_loss": -10.658753395080566, "global_step": 146015, "epoch": 869} {"train_loss": -10.280043601989746, "global_step": 146016, "epoch": 869} {"train_loss": -10.421697616577148, "global_step": 146017, "epoch": 869} {"train_loss": -10.453375816345215, "global_step": 146018, "epoch": 869} {"train_loss": -10.475914001464844, "global_step": 146019, "epoch": 869} {"train_loss": -10.766966819763184, "global_step": 146020, "epoch": 869} {"train_loss": -10.558753967285156, "global_step": 146021, "epoch": 869} {"train_loss": -10.352071762084961, "global_step": 146022, "epoch": 869} {"train_loss": -10.273866653442383, "global_step": 146023, "epoch": 869} {"train_loss": -10.602258682250977, "global_step": 146024, "epoch": 869} {"train_loss": -10.4221830368042, "global_step": 146025, "epoch": 869} {"train_loss": -10.584909439086914, "global_step": 146026, "epoch": 869} {"train_loss": -10.322800636291504, "global_step": 146027, "epoch": 869} {"train_loss": -10.649238586425781, "global_step": 146028, "epoch": 869} {"train_loss": -10.505191802978516, "global_step": 146029, "epoch": 869} {"train_loss": -10.49423599243164, "global_step": 146030, "epoch": 869} {"train_loss": -10.650601387023926, "global_step": 146031, "epoch": 869} {"train_loss": -10.727338790893555, "global_step": 146032, "epoch": 869} {"train_loss": -10.398017883300781, "global_step": 146033, "epoch": 869} {"train_loss": -10.495613098144531, "global_step": 146034, "epoch": 869} {"train_loss": -10.703235626220703, "global_step": 146035, "epoch": 869} {"train_loss": -10.438615798950195, "global_step": 146036, "epoch": 869} {"train_loss": -10.450457572937012, "global_step": 146037, "epoch": 869} {"train_loss": -10.570741653442383, "global_step": 146038, "epoch": 869} {"train_loss": -10.478191375732422, "global_step": 146039, "epoch": 869} {"train_loss": -10.799171447753906, "global_step": 146040, "epoch": 869} {"train_loss": -10.58381175994873, "global_step": 146041, "epoch": 869} {"train_loss": -10.573833465576172, "global_step": 146042, "epoch": 869} {"train_loss": -10.346497535705566, "global_step": 146043, "epoch": 869} {"train_loss": -10.384660720825195, "global_step": 146044, "epoch": 869} {"train_loss": -10.717021942138672, "global_step": 146045, "epoch": 869} {"train_loss": -10.60016918182373, "global_step": 146046, "epoch": 869} {"train_loss": -10.704715728759766, "global_step": 146047, "epoch": 869} {"train_loss": -10.354248046875, "global_step": 146048, "epoch": 869} {"train_loss": -10.38317584991455, "global_step": 146049, "epoch": 869} {"train_loss": -10.697395324707031, "global_step": 146050, "epoch": 869} {"train_loss": -10.448603630065918, "global_step": 146051, "epoch": 869} {"train_loss": -10.73794937133789, "global_step": 146052, "epoch": 869} {"train_loss": -10.77750015258789, "global_step": 146053, "epoch": 869} {"train_loss": -10.801220893859863, "global_step": 146054, "epoch": 869} {"train_loss": -10.842737197875977, "global_step": 146055, "epoch": 869} {"train_loss": -10.647544860839844, "global_step": 146056, "epoch": 869} {"train_loss": -10.480382919311523, "global_step": 146057, "epoch": 869} {"train_loss": -10.353489875793457, "global_step": 146058, "epoch": 869} {"train_loss": -10.63436222076416, "global_step": 146059, "epoch": 869} {"train_loss": -10.259641647338867, "global_step": 146060, "epoch": 869} {"train_loss": -10.809081077575684, "global_step": 146061, "epoch": 869} {"train_loss": -10.683073997497559, "global_step": 146062, "epoch": 869} {"train_loss": -10.81525707244873, "global_step": 146063, "epoch": 869} {"train_loss": -10.83655071258545, "global_step": 146064, "epoch": 869} {"train_loss": -10.726189613342285, "global_step": 146065, "epoch": 869} {"train_loss": -10.648445129394531, "global_step": 146066, "epoch": 869} {"train_loss": -10.725281715393066, "global_step": 146067, "epoch": 869} {"train_loss": -10.511625289916992, "global_step": 146068, "epoch": 869} {"train_loss": -10.781961441040039, "global_step": 146069, "epoch": 869} {"train_loss": -10.908628463745117, "global_step": 146070, "epoch": 869} {"train_loss": -10.658611297607422, "global_step": 146071, "epoch": 869} {"train_loss": -10.719398498535156, "global_step": 146072, "epoch": 869} {"train_loss": -10.61274528503418, "global_step": 146073, "epoch": 869} {"train_loss": -10.660163879394531, "global_step": 146074, "epoch": 869} {"train_loss": -10.668692588806152, "global_step": 146075, "epoch": 869} {"train_loss": -10.982568740844727, "global_step": 146076, "epoch": 869} {"train_loss": -10.718080520629883, "global_step": 146077, "epoch": 869} {"train_loss": -10.640786170959473, "global_step": 146078, "epoch": 869} {"train_loss": -11.056696891784668, "global_step": 146079, "epoch": 869} {"train_loss": -10.894425392150879, "global_step": 146080, "epoch": 869} {"train_loss": -10.753328323364258, "global_step": 146081, "epoch": 869} {"train_loss": -11.006848335266113, "global_step": 146082, "epoch": 869} {"train_loss": -10.556356430053711, "global_step": 146083, "epoch": 869} {"train_loss": -10.484574317932129, "global_step": 146084, "epoch": 869} {"train_loss": -10.806443214416504, "global_step": 146085, "epoch": 869} {"train_loss": -10.445778846740723, "global_step": 146086, "epoch": 869} {"train_loss": -10.694572448730469, "global_step": 146087, "epoch": 869} {"train_loss": -10.971219062805176, "global_step": 146088, "epoch": 869} {"train_loss": -10.900936126708984, "global_step": 146089, "epoch": 869} {"train_loss": -10.95036506652832, "global_step": 146090, "epoch": 869} {"train_loss": -10.679983139038086, "global_step": 146091, "epoch": 869} {"train_loss": -10.803993225097656, "global_step": 146092, "epoch": 869} {"train_loss": -10.938678741455078, "global_step": 146093, "epoch": 869} {"train_loss": -10.829523086547852, "global_step": 146094, "epoch": 869} {"train_loss": -10.638995170593262, "global_step": 146095, "epoch": 869} {"train_loss": -10.907455444335938, "global_step": 146096, "epoch": 869} {"train_loss": -10.673994064331055, "global_step": 146097, "epoch": 869} {"train_loss": -10.718647003173828, "global_step": 146098, "epoch": 869} {"train_loss": -11.00607681274414, "global_step": 146099, "epoch": 869} {"train_loss": -11.14371109008789, "global_step": 146100, "epoch": 869} {"train_loss": -11.079201698303223, "global_step": 146101, "epoch": 869} {"train_loss": -10.706887245178223, "global_step": 146102, "epoch": 869} {"train_loss": -11.03117847442627, "global_step": 146103, "epoch": 869} {"train_loss": -10.860113143920898, "global_step": 146104, "epoch": 869} {"train_loss": -11.100447654724121, "global_step": 146105, "epoch": 869} {"train_loss": -10.67379379272461, "global_step": 146106, "epoch": 869} {"train_loss": -10.991449356079102, "global_step": 146107, "epoch": 869} {"train_loss": -10.692506790161133, "global_step": 146108, "epoch": 869} {"train_loss": -11.013530731201172, "global_step": 146109, "epoch": 869} {"train_loss": -10.58614730834961, "global_step": 146110, "epoch": 869} {"train_loss": -10.762815475463867, "global_step": 146111, "epoch": 869} {"train_loss": -10.878011703491211, "global_step": 146112, "epoch": 869} {"train_loss": -11.010488510131836, "global_step": 146113, "epoch": 869} {"train_loss": -10.895040512084961, "global_step": 146114, "epoch": 869} {"train_loss": -10.646137237548828, "global_step": 146115, "epoch": 869} {"train_loss": -10.66552448272705, "global_step": 146116, "epoch": 869} {"train_loss": -10.952740669250488, "global_step": 146117, "epoch": 869} {"train_loss": -9.950130462646484, "global_step": 146118, "epoch": 869} {"train_loss": -10.700157165527344, "global_step": 146119, "epoch": 869} {"train_loss": -10.629226684570312, "global_step": 146120, "epoch": 869} {"train_loss": -11.055105209350586, "global_step": 146121, "epoch": 869} {"train_loss": -10.574760437011719, "global_step": 146122, "epoch": 869} {"train_loss": -10.591693878173828, "global_step": 146123, "epoch": 869} {"train_loss": -10.636470794677734, "global_step": 146124, "epoch": 869} {"train_loss": -10.551248550415039, "global_step": 146125, "epoch": 869} {"train_loss": -10.408886909484863, "global_step": 146126, "epoch": 869} {"train_loss": -10.251888275146484, "global_step": 146127, "epoch": 869} {"train_loss": -10.003600120544434, "global_step": 146128, "epoch": 869} {"train_loss": -9.162773132324219, "global_step": 146129, "epoch": 869} {"train_loss": -9.123005867004395, "global_step": 146130, "epoch": 869} {"train_loss": -9.573168754577637, "global_step": 146131, "epoch": 869} {"train_loss": -9.213469505310059, "global_step": 146132, "epoch": 869} {"train_loss": -9.272378921508789, "global_step": 146133, "epoch": 869} {"train_loss": -9.684968948364258, "global_step": 146134, "epoch": 869} {"train_loss": -9.092948913574219, "global_step": 146135, "epoch": 869} {"train_loss": -9.092957496643066, "global_step": 146136, "epoch": 869} {"train_loss": -9.7969331741333, "global_step": 146137, "epoch": 869} {"train_loss": -9.278732299804688, "global_step": 146138, "epoch": 869} {"train_loss": -9.757478713989258, "global_step": 146139, "epoch": 869} {"train_loss": -9.666669845581055, "global_step": 146140, "epoch": 869} {"train_loss": -9.83734130859375, "global_step": 146141, "epoch": 869} {"train_loss": -9.89441967010498, "global_step": 146142, "epoch": 869} {"train_loss": -9.90046501159668, "global_step": 146143, "epoch": 869} {"train_loss": -10.291313171386719, "global_step": 146144, "epoch": 869} {"train_loss": -9.627557754516602, "global_step": 146145, "epoch": 869} {"train_loss": -10.366911888122559, "global_step": 146146, "epoch": 869} {"train_loss": -10.041654586791992, "global_step": 146147, "epoch": 869} {"train_loss": -10.032167434692383, "global_step": 146148, "epoch": 869} {"train_loss": -10.009779930114746, "global_step": 146149, "epoch": 869} {"train_loss": -9.925567626953125, "global_step": 146150, "epoch": 869} {"train_loss": -9.93313980102539, "global_step": 146151, "epoch": 869} {"train_loss": -10.063558578491211, "global_step": 146152, "epoch": 869} {"train_loss": -9.898130416870117, "global_step": 146153, "epoch": 869} {"train_loss": -10.2988920211792, "global_step": 146154, "epoch": 869} {"train_loss": -9.889260292053223, "global_step": 146155, "epoch": 869} {"train_loss": -10.205208778381348, "global_step": 146156, "epoch": 869} {"train_loss": -10.401824951171875, "global_step": 146157, "epoch": 869} {"train_loss": -10.263233184814453, "global_step": 146158, "epoch": 869} {"train_loss": -10.461901119777135, "global_step": 146159, "epoch": 869, "val_loss": 222894.1875} {"train_loss": -10.304475784301758, "global_step": 146160, "epoch": 870} {"train_loss": -10.159820556640625, "global_step": 146161, "epoch": 870} {"train_loss": -10.534680366516113, "global_step": 146162, "epoch": 870} {"train_loss": -10.516363143920898, "global_step": 146163, "epoch": 870} {"train_loss": -10.172000885009766, "global_step": 146164, "epoch": 870} {"train_loss": -10.505656242370605, "global_step": 146165, "epoch": 870} {"train_loss": -10.143930435180664, "global_step": 146166, "epoch": 870} {"train_loss": -10.347829818725586, "global_step": 146167, "epoch": 870} {"train_loss": -10.600407600402832, "global_step": 146168, "epoch": 870} {"train_loss": -10.528576850891113, "global_step": 146169, "epoch": 870} {"train_loss": -10.649015426635742, "global_step": 146170, "epoch": 870} {"train_loss": -10.505481719970703, "global_step": 146171, "epoch": 870} {"train_loss": -10.447281837463379, "global_step": 146172, "epoch": 870} {"train_loss": -10.606740951538086, "global_step": 146173, "epoch": 870} {"train_loss": -10.542882919311523, "global_step": 146174, "epoch": 870} {"train_loss": -10.70317554473877, "global_step": 146175, "epoch": 870} {"train_loss": -10.68946647644043, "global_step": 146176, "epoch": 870} {"train_loss": -10.670247077941895, "global_step": 146177, "epoch": 870} {"train_loss": -10.572542190551758, "global_step": 146178, "epoch": 870} {"train_loss": -10.682336807250977, "global_step": 146179, "epoch": 870} {"train_loss": -10.651328086853027, "global_step": 146180, "epoch": 870} {"train_loss": -10.694499969482422, "global_step": 146181, "epoch": 870} {"train_loss": -10.724021911621094, "global_step": 146182, "epoch": 870} {"train_loss": -10.754806518554688, "global_step": 146183, "epoch": 870} {"train_loss": -10.69411563873291, "global_step": 146184, "epoch": 870} {"train_loss": -10.85158920288086, "global_step": 146185, "epoch": 870} {"train_loss": -10.724767684936523, "global_step": 146186, "epoch": 870} {"train_loss": -10.888551712036133, "global_step": 146187, "epoch": 870} {"train_loss": -10.6842041015625, "global_step": 146188, "epoch": 870} {"train_loss": -10.721513748168945, "global_step": 146189, "epoch": 870} {"train_loss": -10.920345306396484, "global_step": 146190, "epoch": 870} {"train_loss": -10.822184562683105, "global_step": 146191, "epoch": 870} {"train_loss": -10.820487976074219, "global_step": 146192, "epoch": 870} {"train_loss": -10.661947250366211, "global_step": 146193, "epoch": 870} {"train_loss": -10.795775413513184, "global_step": 146194, "epoch": 870} {"train_loss": -10.634767532348633, "global_step": 146195, "epoch": 870} {"train_loss": -10.611804962158203, "global_step": 146196, "epoch": 870} {"train_loss": -10.676178932189941, "global_step": 146197, "epoch": 870} {"train_loss": -10.783523559570312, "global_step": 146198, "epoch": 870} {"train_loss": -10.891383171081543, "global_step": 146199, "epoch": 870} {"train_loss": -10.609212875366211, "global_step": 146200, "epoch": 870} {"train_loss": -10.38003921508789, "global_step": 146201, "epoch": 870} {"train_loss": -11.081071853637695, "global_step": 146202, "epoch": 870} {"train_loss": -10.41974925994873, "global_step": 146203, "epoch": 870} {"train_loss": -10.643417358398438, "global_step": 146204, "epoch": 870} {"train_loss": -11.013350486755371, "global_step": 146205, "epoch": 870} {"train_loss": -10.519399642944336, "global_step": 146206, "epoch": 870} {"train_loss": -10.828165054321289, "global_step": 146207, "epoch": 870} {"train_loss": -10.518708229064941, "global_step": 146208, "epoch": 870} {"train_loss": -10.320552825927734, "global_step": 146209, "epoch": 870} {"train_loss": -10.411659240722656, "global_step": 146210, "epoch": 870} {"train_loss": -10.879220008850098, "global_step": 146211, "epoch": 870} {"train_loss": -10.29656982421875, "global_step": 146212, "epoch": 870} {"train_loss": -10.853493690490723, "global_step": 146213, "epoch": 870} {"train_loss": -10.401606559753418, "global_step": 146214, "epoch": 870} {"train_loss": -10.54951286315918, "global_step": 146215, "epoch": 870} {"train_loss": -10.833311080932617, "global_step": 146216, "epoch": 870} {"train_loss": -10.262500762939453, "global_step": 146217, "epoch": 870} {"train_loss": -10.090311050415039, "global_step": 146218, "epoch": 870} {"train_loss": -10.69709300994873, "global_step": 146219, "epoch": 870} {"train_loss": -10.602286338806152, "global_step": 146220, "epoch": 870} {"train_loss": -10.819343566894531, "global_step": 146221, "epoch": 870} {"train_loss": -10.377593994140625, "global_step": 146222, "epoch": 870} {"train_loss": -10.790356636047363, "global_step": 146223, "epoch": 870} {"train_loss": -10.71783447265625, "global_step": 146224, "epoch": 870} {"train_loss": -10.545541763305664, "global_step": 146225, "epoch": 870} {"train_loss": -10.971491813659668, "global_step": 146226, "epoch": 870} {"train_loss": -10.534543991088867, "global_step": 146227, "epoch": 870} {"train_loss": -10.771631240844727, "global_step": 146228, "epoch": 870} {"train_loss": -10.697663307189941, "global_step": 146229, "epoch": 870} {"train_loss": -10.836353302001953, "global_step": 146230, "epoch": 870} {"train_loss": -10.832221984863281, "global_step": 146231, "epoch": 870} {"train_loss": -10.735549926757812, "global_step": 146232, "epoch": 870} {"train_loss": -10.965179443359375, "global_step": 146233, "epoch": 870} {"train_loss": -10.571954727172852, "global_step": 146234, "epoch": 870} {"train_loss": -10.801536560058594, "global_step": 146235, "epoch": 870} {"train_loss": -10.760520935058594, "global_step": 146236, "epoch": 870} {"train_loss": -10.764904022216797, "global_step": 146237, "epoch": 870} {"train_loss": -10.855684280395508, "global_step": 146238, "epoch": 870} {"train_loss": -10.906881332397461, "global_step": 146239, "epoch": 870} {"train_loss": -10.90560531616211, "global_step": 146240, "epoch": 870} {"train_loss": -10.76353645324707, "global_step": 146241, "epoch": 870} {"train_loss": -10.848706245422363, "global_step": 146242, "epoch": 870} {"train_loss": -10.913642883300781, "global_step": 146243, "epoch": 870} {"train_loss": -11.034933090209961, "global_step": 146244, "epoch": 870} {"train_loss": -10.940478324890137, "global_step": 146245, "epoch": 870} {"train_loss": -10.954100608825684, "global_step": 146246, "epoch": 870} {"train_loss": -11.094717025756836, "global_step": 146247, "epoch": 870} {"train_loss": -10.822819709777832, "global_step": 146248, "epoch": 870} {"train_loss": -10.884032249450684, "global_step": 146249, "epoch": 870} {"train_loss": -10.84571647644043, "global_step": 146250, "epoch": 870} {"train_loss": -10.842536926269531, "global_step": 146251, "epoch": 870} {"train_loss": -10.68583869934082, "global_step": 146252, "epoch": 870} {"train_loss": -10.77375316619873, "global_step": 146253, "epoch": 870} {"train_loss": -10.409164428710938, "global_step": 146254, "epoch": 870} {"train_loss": -10.808963775634766, "global_step": 146255, "epoch": 870} {"train_loss": -10.426544189453125, "global_step": 146256, "epoch": 870} {"train_loss": -10.583242416381836, "global_step": 146257, "epoch": 870} {"train_loss": -10.341972351074219, "global_step": 146258, "epoch": 870} {"train_loss": -10.61529541015625, "global_step": 146259, "epoch": 870} {"train_loss": -10.32313060760498, "global_step": 146260, "epoch": 870} {"train_loss": -10.991122245788574, "global_step": 146261, "epoch": 870} {"train_loss": -10.285955429077148, "global_step": 146262, "epoch": 870} {"train_loss": -10.81177043914795, "global_step": 146263, "epoch": 870} {"train_loss": -10.773589134216309, "global_step": 146264, "epoch": 870} {"train_loss": -10.85732650756836, "global_step": 146265, "epoch": 870} {"train_loss": -10.852270126342773, "global_step": 146266, "epoch": 870} {"train_loss": -10.498327255249023, "global_step": 146267, "epoch": 870} {"train_loss": -10.71420955657959, "global_step": 146268, "epoch": 870} {"train_loss": -10.467870712280273, "global_step": 146269, "epoch": 870} {"train_loss": -10.875353813171387, "global_step": 146270, "epoch": 870} {"train_loss": -10.66408634185791, "global_step": 146271, "epoch": 870} {"train_loss": -10.540990829467773, "global_step": 146272, "epoch": 870} {"train_loss": -10.583133697509766, "global_step": 146273, "epoch": 870} {"train_loss": -10.78152084350586, "global_step": 146274, "epoch": 870} {"train_loss": -10.945361137390137, "global_step": 146275, "epoch": 870} {"train_loss": -10.858641624450684, "global_step": 146276, "epoch": 870} {"train_loss": -10.447278022766113, "global_step": 146277, "epoch": 870} {"train_loss": -10.700578689575195, "global_step": 146278, "epoch": 870} {"train_loss": -10.894071578979492, "global_step": 146279, "epoch": 870} {"train_loss": -10.546947479248047, "global_step": 146280, "epoch": 870} {"train_loss": -10.938374519348145, "global_step": 146281, "epoch": 870} {"train_loss": -10.403830528259277, "global_step": 146282, "epoch": 870} {"train_loss": -10.8126802444458, "global_step": 146283, "epoch": 870} {"train_loss": -10.841554641723633, "global_step": 146284, "epoch": 870} {"train_loss": -10.827080726623535, "global_step": 146285, "epoch": 870} {"train_loss": -10.82390022277832, "global_step": 146286, "epoch": 870} {"train_loss": -10.586584091186523, "global_step": 146287, "epoch": 870} {"train_loss": -10.715343475341797, "global_step": 146288, "epoch": 870} {"train_loss": -10.649251937866211, "global_step": 146289, "epoch": 870} {"train_loss": -10.640191078186035, "global_step": 146290, "epoch": 870} {"train_loss": -10.803241729736328, "global_step": 146291, "epoch": 870} {"train_loss": -10.423151016235352, "global_step": 146292, "epoch": 870} {"train_loss": -10.884692192077637, "global_step": 146293, "epoch": 870} {"train_loss": -10.523025512695312, "global_step": 146294, "epoch": 870} {"train_loss": -10.94217300415039, "global_step": 146295, "epoch": 870} {"train_loss": -10.897216796875, "global_step": 146296, "epoch": 870} {"train_loss": -10.877927780151367, "global_step": 146297, "epoch": 870} {"train_loss": -10.897956848144531, "global_step": 146298, "epoch": 870} {"train_loss": -10.757122039794922, "global_step": 146299, "epoch": 870} {"train_loss": -10.895503044128418, "global_step": 146300, "epoch": 870} {"train_loss": -10.683695793151855, "global_step": 146301, "epoch": 870} {"train_loss": -10.722831726074219, "global_step": 146302, "epoch": 870} {"train_loss": -10.880866050720215, "global_step": 146303, "epoch": 870} {"train_loss": -10.72521686553955, "global_step": 146304, "epoch": 870} {"train_loss": -10.562519073486328, "global_step": 146305, "epoch": 870} {"train_loss": -10.49621295928955, "global_step": 146306, "epoch": 870} {"train_loss": -10.261449813842773, "global_step": 146307, "epoch": 870} {"train_loss": -10.227521896362305, "global_step": 146308, "epoch": 870} {"train_loss": -10.662592887878418, "global_step": 146309, "epoch": 870} {"train_loss": -9.878899574279785, "global_step": 146310, "epoch": 870} {"train_loss": -10.44992733001709, "global_step": 146311, "epoch": 870} {"train_loss": -10.536693572998047, "global_step": 146312, "epoch": 870} {"train_loss": -10.42965316772461, "global_step": 146313, "epoch": 870} {"train_loss": -10.660347938537598, "global_step": 146314, "epoch": 870} {"train_loss": -10.704593658447266, "global_step": 146315, "epoch": 870} {"train_loss": -10.346961975097656, "global_step": 146316, "epoch": 870} {"train_loss": -10.678192138671875, "global_step": 146317, "epoch": 870} {"train_loss": -10.096847534179688, "global_step": 146318, "epoch": 870} {"train_loss": -10.464896202087402, "global_step": 146319, "epoch": 870} {"train_loss": -10.412033081054688, "global_step": 146320, "epoch": 870} {"train_loss": -10.192098617553711, "global_step": 146321, "epoch": 870} {"train_loss": -10.500126838684082, "global_step": 146322, "epoch": 870} {"train_loss": -10.213815689086914, "global_step": 146323, "epoch": 870} {"train_loss": -10.582451820373535, "global_step": 146324, "epoch": 870} {"train_loss": -10.242067337036133, "global_step": 146325, "epoch": 870} {"train_loss": -10.846844673156738, "global_step": 146326, "epoch": 870} {"train_loss": -10.650796492894491, "global_step": 146327, "epoch": 870, "val_loss": 227788.515625, "train_action_mse_error": 1.1594438552856445} {"train_loss": -10.741373062133789, "global_step": 146328, "epoch": 871} {"train_loss": -10.547685623168945, "global_step": 146329, "epoch": 871} {"train_loss": -10.72873306274414, "global_step": 146330, "epoch": 871} {"train_loss": -10.61158561706543, "global_step": 146331, "epoch": 871} {"train_loss": -10.482683181762695, "global_step": 146332, "epoch": 871} {"train_loss": -10.449453353881836, "global_step": 146333, "epoch": 871} {"train_loss": -10.631746292114258, "global_step": 146334, "epoch": 871} {"train_loss": -10.833901405334473, "global_step": 146335, "epoch": 871} {"train_loss": -10.56320571899414, "global_step": 146336, "epoch": 871} {"train_loss": -10.8068208694458, "global_step": 146337, "epoch": 871} {"train_loss": -10.696697235107422, "global_step": 146338, "epoch": 871} {"train_loss": -10.504730224609375, "global_step": 146339, "epoch": 871} {"train_loss": -10.756567001342773, "global_step": 146340, "epoch": 871} {"train_loss": -10.56607437133789, "global_step": 146341, "epoch": 871} {"train_loss": -10.675410270690918, "global_step": 146342, "epoch": 871} {"train_loss": -10.837657928466797, "global_step": 146343, "epoch": 871} {"train_loss": -10.365153312683105, "global_step": 146344, "epoch": 871} {"train_loss": -10.7554349899292, "global_step": 146345, "epoch": 871} {"train_loss": -10.805527687072754, "global_step": 146346, "epoch": 871} {"train_loss": -10.719549179077148, "global_step": 146347, "epoch": 871} {"train_loss": -10.756312370300293, "global_step": 146348, "epoch": 871} {"train_loss": -10.729658126831055, "global_step": 146349, "epoch": 871} {"train_loss": -10.660865783691406, "global_step": 146350, "epoch": 871} {"train_loss": -10.66141128540039, "global_step": 146351, "epoch": 871} {"train_loss": -10.898712158203125, "global_step": 146352, "epoch": 871} {"train_loss": -10.934547424316406, "global_step": 146353, "epoch": 871} {"train_loss": -10.384576797485352, "global_step": 146354, "epoch": 871} {"train_loss": -10.791337966918945, "global_step": 146355, "epoch": 871} {"train_loss": -10.619317054748535, "global_step": 146356, "epoch": 871} {"train_loss": -10.512951850891113, "global_step": 146357, "epoch": 871} {"train_loss": -10.8754243850708, "global_step": 146358, "epoch": 871} {"train_loss": -10.376036643981934, "global_step": 146359, "epoch": 871} {"train_loss": -11.070302963256836, "global_step": 146360, "epoch": 871} {"train_loss": -10.850733757019043, "global_step": 146361, "epoch": 871} {"train_loss": -10.970721244812012, "global_step": 146362, "epoch": 871} {"train_loss": -11.012609481811523, "global_step": 146363, "epoch": 871} {"train_loss": -10.944278717041016, "global_step": 146364, "epoch": 871} {"train_loss": -10.956918716430664, "global_step": 146365, "epoch": 871} {"train_loss": -10.584100723266602, "global_step": 146366, "epoch": 871} {"train_loss": -10.655935287475586, "global_step": 146367, "epoch": 871} {"train_loss": -10.81307601928711, "global_step": 146368, "epoch": 871} {"train_loss": -10.733572959899902, "global_step": 146369, "epoch": 871} {"train_loss": -10.787365913391113, "global_step": 146370, "epoch": 871} {"train_loss": -10.389663696289062, "global_step": 146371, "epoch": 871} {"train_loss": -10.758010864257812, "global_step": 146372, "epoch": 871} {"train_loss": -10.527904510498047, "global_step": 146373, "epoch": 871} {"train_loss": -10.776844024658203, "global_step": 146374, "epoch": 871} {"train_loss": -10.386587142944336, "global_step": 146375, "epoch": 871} {"train_loss": -9.642768859863281, "global_step": 146376, "epoch": 871} {"train_loss": -10.585100173950195, "global_step": 146377, "epoch": 871} {"train_loss": -10.006168365478516, "global_step": 146378, "epoch": 871} {"train_loss": -9.646873474121094, "global_step": 146379, "epoch": 871} {"train_loss": -10.286979675292969, "global_step": 146380, "epoch": 871} {"train_loss": -9.60987377166748, "global_step": 146381, "epoch": 871} {"train_loss": -10.194297790527344, "global_step": 146382, "epoch": 871} {"train_loss": -9.365453720092773, "global_step": 146383, "epoch": 871} {"train_loss": -10.152377128601074, "global_step": 146384, "epoch": 871} {"train_loss": -9.875728607177734, "global_step": 146385, "epoch": 871} {"train_loss": -10.096349716186523, "global_step": 146386, "epoch": 871} {"train_loss": -10.331538200378418, "global_step": 146387, "epoch": 871} {"train_loss": -9.726923942565918, "global_step": 146388, "epoch": 871} {"train_loss": -10.29981517791748, "global_step": 146389, "epoch": 871} {"train_loss": -10.219141006469727, "global_step": 146390, "epoch": 871} {"train_loss": -10.391324043273926, "global_step": 146391, "epoch": 871} {"train_loss": -10.156986236572266, "global_step": 146392, "epoch": 871} {"train_loss": -10.276888847351074, "global_step": 146393, "epoch": 871} {"train_loss": -10.583698272705078, "global_step": 146394, "epoch": 871} {"train_loss": -10.26606559753418, "global_step": 146395, "epoch": 871} {"train_loss": -10.549421310424805, "global_step": 146396, "epoch": 871} {"train_loss": -10.654630661010742, "global_step": 146397, "epoch": 871} {"train_loss": -10.167280197143555, "global_step": 146398, "epoch": 871} {"train_loss": -10.533605575561523, "global_step": 146399, "epoch": 871} {"train_loss": -10.571759223937988, "global_step": 146400, "epoch": 871} {"train_loss": -10.508543014526367, "global_step": 146401, "epoch": 871} {"train_loss": -10.579952239990234, "global_step": 146402, "epoch": 871} {"train_loss": -10.519561767578125, "global_step": 146403, "epoch": 871} {"train_loss": -10.456777572631836, "global_step": 146404, "epoch": 871} {"train_loss": -10.76566219329834, "global_step": 146405, "epoch": 871} {"train_loss": -10.653059005737305, "global_step": 146406, "epoch": 871} {"train_loss": -10.85078239440918, "global_step": 146407, "epoch": 871} {"train_loss": -10.597529411315918, "global_step": 146408, "epoch": 871} {"train_loss": -10.634449005126953, "global_step": 146409, "epoch": 871} {"train_loss": -10.601669311523438, "global_step": 146410, "epoch": 871} {"train_loss": -10.86988639831543, "global_step": 146411, "epoch": 871} {"train_loss": -10.558670043945312, "global_step": 146412, "epoch": 871} {"train_loss": -10.60009765625, "global_step": 146413, "epoch": 871} {"train_loss": -10.594721794128418, "global_step": 146414, "epoch": 871} {"train_loss": -10.761935234069824, "global_step": 146415, "epoch": 871} {"train_loss": -10.761001586914062, "global_step": 146416, "epoch": 871} {"train_loss": -10.659979820251465, "global_step": 146417, "epoch": 871} {"train_loss": -10.636237144470215, "global_step": 146418, "epoch": 871} {"train_loss": -10.647211074829102, "global_step": 146419, "epoch": 871} {"train_loss": -10.57469654083252, "global_step": 146420, "epoch": 871} {"train_loss": -10.649176597595215, "global_step": 146421, "epoch": 871} {"train_loss": -10.497295379638672, "global_step": 146422, "epoch": 871} {"train_loss": -11.00058650970459, "global_step": 146423, "epoch": 871} {"train_loss": -10.875743865966797, "global_step": 146424, "epoch": 871} {"train_loss": -10.787393569946289, "global_step": 146425, "epoch": 871} {"train_loss": -11.001299858093262, "global_step": 146426, "epoch": 871} {"train_loss": -10.77920913696289, "global_step": 146427, "epoch": 871} {"train_loss": -10.863180160522461, "global_step": 146428, "epoch": 871} {"train_loss": -10.98697566986084, "global_step": 146429, "epoch": 871} {"train_loss": -10.859762191772461, "global_step": 146430, "epoch": 871} {"train_loss": -11.006072998046875, "global_step": 146431, "epoch": 871} {"train_loss": -10.813753128051758, "global_step": 146432, "epoch": 871} {"train_loss": -10.865460395812988, "global_step": 146433, "epoch": 871} {"train_loss": -11.19390869140625, "global_step": 146434, "epoch": 871} {"train_loss": -10.893448829650879, "global_step": 146435, "epoch": 871} {"train_loss": -10.829479217529297, "global_step": 146436, "epoch": 871} {"train_loss": -10.919363021850586, "global_step": 146437, "epoch": 871} {"train_loss": -10.865083694458008, "global_step": 146438, "epoch": 871} {"train_loss": -11.026491165161133, "global_step": 146439, "epoch": 871} {"train_loss": -10.593936920166016, "global_step": 146440, "epoch": 871} {"train_loss": -10.741211891174316, "global_step": 146441, "epoch": 871} {"train_loss": -11.10228443145752, "global_step": 146442, "epoch": 871} {"train_loss": -10.895547866821289, "global_step": 146443, "epoch": 871} {"train_loss": -10.842172622680664, "global_step": 146444, "epoch": 871} {"train_loss": -11.149575233459473, "global_step": 146445, "epoch": 871} {"train_loss": -10.635517120361328, "global_step": 146446, "epoch": 871} {"train_loss": -10.721803665161133, "global_step": 146447, "epoch": 871} {"train_loss": -10.876102447509766, "global_step": 146448, "epoch": 871} {"train_loss": -10.756919860839844, "global_step": 146449, "epoch": 871} {"train_loss": -10.64853286743164, "global_step": 146450, "epoch": 871} {"train_loss": -11.018087387084961, "global_step": 146451, "epoch": 871} {"train_loss": -10.823198318481445, "global_step": 146452, "epoch": 871} {"train_loss": -10.25799560546875, "global_step": 146453, "epoch": 871} {"train_loss": -10.280712127685547, "global_step": 146454, "epoch": 871} {"train_loss": -10.41508674621582, "global_step": 146455, "epoch": 871} {"train_loss": -9.963552474975586, "global_step": 146456, "epoch": 871} {"train_loss": -10.515205383300781, "global_step": 146457, "epoch": 871} {"train_loss": -10.480338096618652, "global_step": 146458, "epoch": 871} {"train_loss": -8.828985214233398, "global_step": 146459, "epoch": 871} {"train_loss": -10.463647842407227, "global_step": 146460, "epoch": 871} {"train_loss": -9.983406066894531, "global_step": 146461, "epoch": 871} {"train_loss": -9.504209518432617, "global_step": 146462, "epoch": 871} {"train_loss": -10.348051071166992, "global_step": 146463, "epoch": 871} {"train_loss": -10.075101852416992, "global_step": 146464, "epoch": 871} {"train_loss": -10.142208099365234, "global_step": 146465, "epoch": 871} {"train_loss": -9.896522521972656, "global_step": 146466, "epoch": 871} {"train_loss": -10.470752716064453, "global_step": 146467, "epoch": 871} {"train_loss": -10.089523315429688, "global_step": 146468, "epoch": 871} {"train_loss": -10.71569538116455, "global_step": 146469, "epoch": 871} {"train_loss": -9.994807243347168, "global_step": 146470, "epoch": 871} {"train_loss": -10.393072128295898, "global_step": 146471, "epoch": 871} {"train_loss": -9.930632591247559, "global_step": 146472, "epoch": 871} {"train_loss": -10.012613296508789, "global_step": 146473, "epoch": 871} {"train_loss": -10.36500358581543, "global_step": 146474, "epoch": 871} {"train_loss": -10.16533088684082, "global_step": 146475, "epoch": 871} {"train_loss": -10.5743989944458, "global_step": 146476, "epoch": 871} {"train_loss": -10.578241348266602, "global_step": 146477, "epoch": 871} {"train_loss": -10.215051651000977, "global_step": 146478, "epoch": 871} {"train_loss": -10.332247734069824, "global_step": 146479, "epoch": 871} {"train_loss": -10.261735916137695, "global_step": 146480, "epoch": 871} {"train_loss": -10.211986541748047, "global_step": 146481, "epoch": 871} {"train_loss": -10.266949653625488, "global_step": 146482, "epoch": 871} {"train_loss": -10.440469741821289, "global_step": 146483, "epoch": 871} {"train_loss": -10.239848136901855, "global_step": 146484, "epoch": 871} {"train_loss": -10.101083755493164, "global_step": 146485, "epoch": 871} {"train_loss": -10.46658706665039, "global_step": 146486, "epoch": 871} {"train_loss": -10.04102611541748, "global_step": 146487, "epoch": 871} {"train_loss": -10.610599517822266, "global_step": 146488, "epoch": 871} {"train_loss": -10.03792953491211, "global_step": 146489, "epoch": 871} {"train_loss": -10.122274398803711, "global_step": 146490, "epoch": 871} {"train_loss": -10.105697631835938, "global_step": 146491, "epoch": 871} {"train_loss": -10.527908325195312, "global_step": 146492, "epoch": 871} {"train_loss": -10.305580139160156, "global_step": 146493, "epoch": 871} {"train_loss": -9.777521133422852, "global_step": 146494, "epoch": 871} {"train_loss": -10.517299067406427, "global_step": 146495, "epoch": 871, "val_loss": 227158.96875} {"train_loss": -10.526435852050781, "global_step": 146496, "epoch": 872} {"train_loss": -10.025968551635742, "global_step": 146497, "epoch": 872} {"train_loss": -10.613975524902344, "global_step": 146498, "epoch": 872} {"train_loss": -10.316326141357422, "global_step": 146499, "epoch": 872} {"train_loss": -10.492353439331055, "global_step": 146500, "epoch": 872} {"train_loss": -10.758472442626953, "global_step": 146501, "epoch": 872} {"train_loss": -10.456021308898926, "global_step": 146502, "epoch": 872} {"train_loss": -10.468287467956543, "global_step": 146503, "epoch": 872} {"train_loss": -10.604068756103516, "global_step": 146504, "epoch": 872} {"train_loss": -10.577499389648438, "global_step": 146505, "epoch": 872} {"train_loss": -10.719566345214844, "global_step": 146506, "epoch": 872} {"train_loss": -10.670881271362305, "global_step": 146507, "epoch": 872} {"train_loss": -10.521982192993164, "global_step": 146508, "epoch": 872} {"train_loss": -10.691011428833008, "global_step": 146509, "epoch": 872} {"train_loss": -10.7633056640625, "global_step": 146510, "epoch": 872} {"train_loss": -10.775240898132324, "global_step": 146511, "epoch": 872} {"train_loss": -10.79714584350586, "global_step": 146512, "epoch": 872} {"train_loss": -10.910985946655273, "global_step": 146513, "epoch": 872} {"train_loss": -10.715871810913086, "global_step": 146514, "epoch": 872} {"train_loss": -10.87822151184082, "global_step": 146515, "epoch": 872} {"train_loss": -10.852632522583008, "global_step": 146516, "epoch": 872} {"train_loss": -10.766469955444336, "global_step": 146517, "epoch": 872} {"train_loss": -10.818028450012207, "global_step": 146518, "epoch": 872} {"train_loss": -10.791260719299316, "global_step": 146519, "epoch": 872} {"train_loss": -10.843573570251465, "global_step": 146520, "epoch": 872} {"train_loss": -10.974359512329102, "global_step": 146521, "epoch": 872} {"train_loss": -10.957012176513672, "global_step": 146522, "epoch": 872} {"train_loss": -10.900110244750977, "global_step": 146523, "epoch": 872} {"train_loss": -10.970596313476562, "global_step": 146524, "epoch": 872} {"train_loss": -10.908873558044434, "global_step": 146525, "epoch": 872} {"train_loss": -10.949214935302734, "global_step": 146526, "epoch": 872} {"train_loss": -11.051591873168945, "global_step": 146527, "epoch": 872} {"train_loss": -10.975958824157715, "global_step": 146528, "epoch": 872} {"train_loss": -11.055179595947266, "global_step": 146529, "epoch": 872} {"train_loss": -11.133355140686035, "global_step": 146530, "epoch": 872} {"train_loss": -11.10946273803711, "global_step": 146531, "epoch": 872} {"train_loss": -10.994072914123535, "global_step": 146532, "epoch": 872} {"train_loss": -10.968111991882324, "global_step": 146533, "epoch": 872} {"train_loss": -11.05251407623291, "global_step": 146534, "epoch": 872} {"train_loss": -10.765754699707031, "global_step": 146535, "epoch": 872} {"train_loss": -10.687847137451172, "global_step": 146536, "epoch": 872} {"train_loss": -11.054143905639648, "global_step": 146537, "epoch": 872} {"train_loss": -11.07091236114502, "global_step": 146538, "epoch": 872} {"train_loss": -10.765936851501465, "global_step": 146539, "epoch": 872} {"train_loss": -11.004608154296875, "global_step": 146540, "epoch": 872} {"train_loss": -10.906034469604492, "global_step": 146541, "epoch": 872} {"train_loss": -11.075484275817871, "global_step": 146542, "epoch": 872} {"train_loss": -10.610411643981934, "global_step": 146543, "epoch": 872} {"train_loss": -10.439672470092773, "global_step": 146544, "epoch": 872} {"train_loss": -10.803927421569824, "global_step": 146545, "epoch": 872} {"train_loss": -10.006465911865234, "global_step": 146546, "epoch": 872} {"train_loss": -9.26905632019043, "global_step": 146547, "epoch": 872} {"train_loss": -10.76188850402832, "global_step": 146548, "epoch": 872} {"train_loss": -10.934343338012695, "global_step": 146549, "epoch": 872} {"train_loss": -10.016716003417969, "global_step": 146550, "epoch": 872} {"train_loss": -10.65684986114502, "global_step": 146551, "epoch": 872} {"train_loss": -10.013216018676758, "global_step": 146552, "epoch": 872} {"train_loss": -10.144634246826172, "global_step": 146553, "epoch": 872} {"train_loss": -10.545137405395508, "global_step": 146554, "epoch": 872} {"train_loss": -10.376691818237305, "global_step": 146555, "epoch": 872} {"train_loss": -10.380796432495117, "global_step": 146556, "epoch": 872} {"train_loss": -10.992137908935547, "global_step": 146557, "epoch": 872} {"train_loss": -10.670053482055664, "global_step": 146558, "epoch": 872} {"train_loss": -10.143092155456543, "global_step": 146559, "epoch": 872} {"train_loss": -10.451335906982422, "global_step": 146560, "epoch": 872} {"train_loss": -10.455263137817383, "global_step": 146561, "epoch": 872} {"train_loss": -10.413534164428711, "global_step": 146562, "epoch": 872} {"train_loss": -10.579923629760742, "global_step": 146563, "epoch": 872} {"train_loss": -10.252429008483887, "global_step": 146564, "epoch": 872} {"train_loss": -10.393415451049805, "global_step": 146565, "epoch": 872} {"train_loss": -9.729181289672852, "global_step": 146566, "epoch": 872} {"train_loss": -10.125072479248047, "global_step": 146567, "epoch": 872} {"train_loss": -9.151062965393066, "global_step": 146568, "epoch": 872} {"train_loss": -9.773551940917969, "global_step": 146569, "epoch": 872} {"train_loss": -9.731136322021484, "global_step": 146570, "epoch": 872} {"train_loss": -9.724145889282227, "global_step": 146571, "epoch": 872} {"train_loss": -9.913681030273438, "global_step": 146572, "epoch": 872} {"train_loss": -9.943985939025879, "global_step": 146573, "epoch": 872} {"train_loss": -10.179529190063477, "global_step": 146574, "epoch": 872} {"train_loss": -10.703197479248047, "global_step": 146575, "epoch": 872} {"train_loss": -10.092960357666016, "global_step": 146576, "epoch": 872} {"train_loss": -10.249859809875488, "global_step": 146577, "epoch": 872} {"train_loss": -10.26093864440918, "global_step": 146578, "epoch": 872} {"train_loss": -10.447223663330078, "global_step": 146579, "epoch": 872} {"train_loss": -10.238037109375, "global_step": 146580, "epoch": 872} {"train_loss": -10.382922172546387, "global_step": 146581, "epoch": 872} {"train_loss": -10.40716552734375, "global_step": 146582, "epoch": 872} {"train_loss": -10.22654914855957, "global_step": 146583, "epoch": 872} {"train_loss": -10.524954795837402, "global_step": 146584, "epoch": 872} {"train_loss": -10.477531433105469, "global_step": 146585, "epoch": 872} {"train_loss": -10.694499969482422, "global_step": 146586, "epoch": 872} {"train_loss": -10.465085983276367, "global_step": 146587, "epoch": 872} {"train_loss": -10.558780670166016, "global_step": 146588, "epoch": 872} {"train_loss": -10.91453742980957, "global_step": 146589, "epoch": 872} {"train_loss": -10.676285743713379, "global_step": 146590, "epoch": 872} {"train_loss": -10.802593231201172, "global_step": 146591, "epoch": 872} {"train_loss": -10.667696952819824, "global_step": 146592, "epoch": 872} {"train_loss": -10.668415069580078, "global_step": 146593, "epoch": 872} {"train_loss": -10.718255996704102, "global_step": 146594, "epoch": 872} {"train_loss": -10.759599685668945, "global_step": 146595, "epoch": 872} {"train_loss": -10.627522468566895, "global_step": 146596, "epoch": 872} {"train_loss": -10.791637420654297, "global_step": 146597, "epoch": 872} {"train_loss": -10.646862030029297, "global_step": 146598, "epoch": 872} {"train_loss": -10.873781204223633, "global_step": 146599, "epoch": 872} {"train_loss": -10.776592254638672, "global_step": 146600, "epoch": 872} {"train_loss": -10.850286483764648, "global_step": 146601, "epoch": 872} {"train_loss": -10.814144134521484, "global_step": 146602, "epoch": 872} {"train_loss": -10.943852424621582, "global_step": 146603, "epoch": 872} {"train_loss": -10.532899856567383, "global_step": 146604, "epoch": 872} {"train_loss": -10.91156005859375, "global_step": 146605, "epoch": 872} {"train_loss": -10.916733741760254, "global_step": 146606, "epoch": 872} {"train_loss": -10.964963912963867, "global_step": 146607, "epoch": 872} {"train_loss": -10.946157455444336, "global_step": 146608, "epoch": 872} {"train_loss": -10.781393051147461, "global_step": 146609, "epoch": 872} {"train_loss": -10.84992790222168, "global_step": 146610, "epoch": 872} {"train_loss": -10.829116821289062, "global_step": 146611, "epoch": 872} {"train_loss": -10.94324016571045, "global_step": 146612, "epoch": 872} {"train_loss": -10.864858627319336, "global_step": 146613, "epoch": 872} {"train_loss": -11.181022644042969, "global_step": 146614, "epoch": 872} {"train_loss": -10.982585906982422, "global_step": 146615, "epoch": 872} {"train_loss": -10.798501014709473, "global_step": 146616, "epoch": 872} {"train_loss": -11.036941528320312, "global_step": 146617, "epoch": 872} {"train_loss": -10.857887268066406, "global_step": 146618, "epoch": 872} {"train_loss": -10.809791564941406, "global_step": 146619, "epoch": 872} {"train_loss": -10.728259086608887, "global_step": 146620, "epoch": 872} {"train_loss": -10.909112930297852, "global_step": 146621, "epoch": 872} {"train_loss": -10.654875755310059, "global_step": 146622, "epoch": 872} {"train_loss": -10.881853103637695, "global_step": 146623, "epoch": 872} {"train_loss": -10.492794036865234, "global_step": 146624, "epoch": 872} {"train_loss": -10.958027839660645, "global_step": 146625, "epoch": 872} {"train_loss": -10.828879356384277, "global_step": 146626, "epoch": 872} {"train_loss": -10.67854118347168, "global_step": 146627, "epoch": 872} {"train_loss": -10.768450736999512, "global_step": 146628, "epoch": 872} {"train_loss": -10.269831657409668, "global_step": 146629, "epoch": 872} {"train_loss": -9.92177963256836, "global_step": 146630, "epoch": 872} {"train_loss": -10.448260307312012, "global_step": 146631, "epoch": 872} {"train_loss": -10.320026397705078, "global_step": 146632, "epoch": 872} {"train_loss": -10.15284252166748, "global_step": 146633, "epoch": 872} {"train_loss": -10.433286666870117, "global_step": 146634, "epoch": 872} {"train_loss": -10.327701568603516, "global_step": 146635, "epoch": 872} {"train_loss": -9.581212997436523, "global_step": 146636, "epoch": 872} {"train_loss": -9.984378814697266, "global_step": 146637, "epoch": 872} {"train_loss": -9.869929313659668, "global_step": 146638, "epoch": 872} {"train_loss": -9.75450325012207, "global_step": 146639, "epoch": 872} {"train_loss": -10.320135116577148, "global_step": 146640, "epoch": 872} {"train_loss": -9.870981216430664, "global_step": 146641, "epoch": 872} {"train_loss": -10.204215049743652, "global_step": 146642, "epoch": 872} {"train_loss": -9.694604873657227, "global_step": 146643, "epoch": 872} {"train_loss": -10.374002456665039, "global_step": 146644, "epoch": 872} {"train_loss": -10.163460731506348, "global_step": 146645, "epoch": 872} {"train_loss": -10.282297134399414, "global_step": 146646, "epoch": 872} {"train_loss": -10.036725997924805, "global_step": 146647, "epoch": 872} {"train_loss": -10.12811279296875, "global_step": 146648, "epoch": 872} {"train_loss": -10.097306251525879, "global_step": 146649, "epoch": 872} {"train_loss": -10.452731132507324, "global_step": 146650, "epoch": 872} {"train_loss": -10.200206756591797, "global_step": 146651, "epoch": 872} {"train_loss": -10.392011642456055, "global_step": 146652, "epoch": 872} {"train_loss": -10.398285865783691, "global_step": 146653, "epoch": 872} {"train_loss": -10.243653297424316, "global_step": 146654, "epoch": 872} {"train_loss": -10.514212608337402, "global_step": 146655, "epoch": 872} {"train_loss": -10.526952743530273, "global_step": 146656, "epoch": 872} {"train_loss": -10.337026596069336, "global_step": 146657, "epoch": 872} {"train_loss": -10.505096435546875, "global_step": 146658, "epoch": 872} {"train_loss": -10.542146682739258, "global_step": 146659, "epoch": 872} {"train_loss": -10.619562149047852, "global_step": 146660, "epoch": 872} {"train_loss": -10.553131103515625, "global_step": 146661, "epoch": 872} {"train_loss": -10.836702346801758, "global_step": 146662, "epoch": 872} {"train_loss": -10.551895431109838, "global_step": 146663, "epoch": 872, "val_loss": 228803.28125} {"train_loss": -10.73843002319336, "global_step": 146664, "epoch": 873} {"train_loss": -10.55282974243164, "global_step": 146665, "epoch": 873} {"train_loss": -10.732315063476562, "global_step": 146666, "epoch": 873} {"train_loss": -10.911922454833984, "global_step": 146667, "epoch": 873} {"train_loss": -10.793295860290527, "global_step": 146668, "epoch": 873} {"train_loss": -10.786624908447266, "global_step": 146669, "epoch": 873} {"train_loss": -10.807943344116211, "global_step": 146670, "epoch": 873} {"train_loss": -10.790830612182617, "global_step": 146671, "epoch": 873} {"train_loss": -10.694881439208984, "global_step": 146672, "epoch": 873} {"train_loss": -10.597265243530273, "global_step": 146673, "epoch": 873} {"train_loss": -10.650158882141113, "global_step": 146674, "epoch": 873} {"train_loss": -10.73231315612793, "global_step": 146675, "epoch": 873} {"train_loss": -10.868793487548828, "global_step": 146676, "epoch": 873} {"train_loss": -10.748836517333984, "global_step": 146677, "epoch": 873} {"train_loss": -10.83604621887207, "global_step": 146678, "epoch": 873} {"train_loss": -10.805854797363281, "global_step": 146679, "epoch": 873} {"train_loss": -10.468255043029785, "global_step": 146680, "epoch": 873} {"train_loss": -10.820568084716797, "global_step": 146681, "epoch": 873} {"train_loss": -10.859569549560547, "global_step": 146682, "epoch": 873} {"train_loss": -10.481595993041992, "global_step": 146683, "epoch": 873} {"train_loss": -11.008443832397461, "global_step": 146684, "epoch": 873} {"train_loss": -11.027318000793457, "global_step": 146685, "epoch": 873} {"train_loss": -10.717560768127441, "global_step": 146686, "epoch": 873} {"train_loss": -11.159419059753418, "global_step": 146687, "epoch": 873} {"train_loss": -10.90775203704834, "global_step": 146688, "epoch": 873} {"train_loss": -11.01243782043457, "global_step": 146689, "epoch": 873} {"train_loss": -10.991752624511719, "global_step": 146690, "epoch": 873} {"train_loss": -11.005050659179688, "global_step": 146691, "epoch": 873} {"train_loss": -10.835970878601074, "global_step": 146692, "epoch": 873} {"train_loss": -11.219389915466309, "global_step": 146693, "epoch": 873} {"train_loss": -10.872901916503906, "global_step": 146694, "epoch": 873} {"train_loss": -10.66563892364502, "global_step": 146695, "epoch": 873} {"train_loss": -11.023938179016113, "global_step": 146696, "epoch": 873} {"train_loss": -10.955375671386719, "global_step": 146697, "epoch": 873} {"train_loss": -10.904644966125488, "global_step": 146698, "epoch": 873} {"train_loss": -11.081324577331543, "global_step": 146699, "epoch": 873} {"train_loss": -10.861228942871094, "global_step": 146700, "epoch": 873} {"train_loss": -10.737642288208008, "global_step": 146701, "epoch": 873} {"train_loss": -11.111818313598633, "global_step": 146702, "epoch": 873} {"train_loss": -11.020346641540527, "global_step": 146703, "epoch": 873} {"train_loss": -10.989463806152344, "global_step": 146704, "epoch": 873} {"train_loss": -10.773276329040527, "global_step": 146705, "epoch": 873} {"train_loss": -10.757604598999023, "global_step": 146706, "epoch": 873} {"train_loss": -11.044759750366211, "global_step": 146707, "epoch": 873} {"train_loss": -10.613195419311523, "global_step": 146708, "epoch": 873} {"train_loss": -10.888312339782715, "global_step": 146709, "epoch": 873} {"train_loss": -10.761175155639648, "global_step": 146710, "epoch": 873} {"train_loss": -10.615886688232422, "global_step": 146711, "epoch": 873} {"train_loss": -10.519371032714844, "global_step": 146712, "epoch": 873} {"train_loss": -10.932024955749512, "global_step": 146713, "epoch": 873} {"train_loss": -10.711758613586426, "global_step": 146714, "epoch": 873} {"train_loss": -10.72326374053955, "global_step": 146715, "epoch": 873} {"train_loss": -10.876489639282227, "global_step": 146716, "epoch": 873} {"train_loss": -10.996851921081543, "global_step": 146717, "epoch": 873} {"train_loss": -10.74494743347168, "global_step": 146718, "epoch": 873} {"train_loss": -10.715612411499023, "global_step": 146719, "epoch": 873} {"train_loss": -10.491823196411133, "global_step": 146720, "epoch": 873} {"train_loss": -10.643336296081543, "global_step": 146721, "epoch": 873} {"train_loss": -10.805131912231445, "global_step": 146722, "epoch": 873} {"train_loss": -10.528101921081543, "global_step": 146723, "epoch": 873} {"train_loss": -10.509382247924805, "global_step": 146724, "epoch": 873} {"train_loss": -10.471696853637695, "global_step": 146725, "epoch": 873} {"train_loss": -10.857267379760742, "global_step": 146726, "epoch": 873} {"train_loss": -10.794301986694336, "global_step": 146727, "epoch": 873} {"train_loss": -10.602605819702148, "global_step": 146728, "epoch": 873} {"train_loss": -10.547369003295898, "global_step": 146729, "epoch": 873} {"train_loss": -10.047174453735352, "global_step": 146730, "epoch": 873} {"train_loss": -10.497398376464844, "global_step": 146731, "epoch": 873} {"train_loss": -10.17076301574707, "global_step": 146732, "epoch": 873} {"train_loss": -10.54732894897461, "global_step": 146733, "epoch": 873} {"train_loss": -10.301671981811523, "global_step": 146734, "epoch": 873} {"train_loss": -10.155466079711914, "global_step": 146735, "epoch": 873} {"train_loss": -10.396352767944336, "global_step": 146736, "epoch": 873} {"train_loss": -10.287542343139648, "global_step": 146737, "epoch": 873} {"train_loss": -9.670523643493652, "global_step": 146738, "epoch": 873} {"train_loss": -10.248225212097168, "global_step": 146739, "epoch": 873} {"train_loss": -9.728414535522461, "global_step": 146740, "epoch": 873} {"train_loss": -10.211559295654297, "global_step": 146741, "epoch": 873} {"train_loss": -10.120828628540039, "global_step": 146742, "epoch": 873} {"train_loss": -9.913858413696289, "global_step": 146743, "epoch": 873} {"train_loss": -10.265380859375, "global_step": 146744, "epoch": 873} {"train_loss": -9.179248809814453, "global_step": 146745, "epoch": 873} {"train_loss": -10.299783706665039, "global_step": 146746, "epoch": 873} {"train_loss": -10.100177764892578, "global_step": 146747, "epoch": 873} {"train_loss": -9.7014799118042, "global_step": 146748, "epoch": 873} {"train_loss": -10.37133502960205, "global_step": 146749, "epoch": 873} {"train_loss": -10.370152473449707, "global_step": 146750, "epoch": 873} {"train_loss": -10.067218780517578, "global_step": 146751, "epoch": 873} {"train_loss": -10.643665313720703, "global_step": 146752, "epoch": 873} {"train_loss": -10.017422676086426, "global_step": 146753, "epoch": 873} {"train_loss": -10.5359525680542, "global_step": 146754, "epoch": 873} {"train_loss": -10.596779823303223, "global_step": 146755, "epoch": 873} {"train_loss": -10.343143463134766, "global_step": 146756, "epoch": 873} {"train_loss": -10.689942359924316, "global_step": 146757, "epoch": 873} {"train_loss": -10.67603874206543, "global_step": 146758, "epoch": 873} {"train_loss": -10.600101470947266, "global_step": 146759, "epoch": 873} {"train_loss": -10.448156356811523, "global_step": 146760, "epoch": 873} {"train_loss": -10.270153999328613, "global_step": 146761, "epoch": 873} {"train_loss": -10.707986831665039, "global_step": 146762, "epoch": 873} {"train_loss": -10.664227485656738, "global_step": 146763, "epoch": 873} {"train_loss": -10.402616500854492, "global_step": 146764, "epoch": 873} {"train_loss": -10.693099975585938, "global_step": 146765, "epoch": 873} {"train_loss": -10.581016540527344, "global_step": 146766, "epoch": 873} {"train_loss": -10.56347370147705, "global_step": 146767, "epoch": 873} {"train_loss": -10.508100509643555, "global_step": 146768, "epoch": 873} {"train_loss": -10.416963577270508, "global_step": 146769, "epoch": 873} {"train_loss": -10.653402328491211, "global_step": 146770, "epoch": 873} {"train_loss": -10.62846851348877, "global_step": 146771, "epoch": 873} {"train_loss": -10.616888046264648, "global_step": 146772, "epoch": 873} {"train_loss": -10.561075210571289, "global_step": 146773, "epoch": 873} {"train_loss": -10.694452285766602, "global_step": 146774, "epoch": 873} {"train_loss": -10.474292755126953, "global_step": 146775, "epoch": 873} {"train_loss": -10.698807716369629, "global_step": 146776, "epoch": 873} {"train_loss": -10.543539047241211, "global_step": 146777, "epoch": 873} {"train_loss": -10.648292541503906, "global_step": 146778, "epoch": 873} {"train_loss": -10.663101196289062, "global_step": 146779, "epoch": 873} {"train_loss": -10.867975234985352, "global_step": 146780, "epoch": 873} {"train_loss": -10.746310234069824, "global_step": 146781, "epoch": 873} {"train_loss": -10.780611038208008, "global_step": 146782, "epoch": 873} {"train_loss": -10.562114715576172, "global_step": 146783, "epoch": 873} {"train_loss": -10.807867050170898, "global_step": 146784, "epoch": 873} {"train_loss": -10.859851837158203, "global_step": 146785, "epoch": 873} {"train_loss": -10.67431640625, "global_step": 146786, "epoch": 873} {"train_loss": -10.774493217468262, "global_step": 146787, "epoch": 873} {"train_loss": -10.981389045715332, "global_step": 146788, "epoch": 873} {"train_loss": -10.776411056518555, "global_step": 146789, "epoch": 873} {"train_loss": -10.990741729736328, "global_step": 146790, "epoch": 873} {"train_loss": -10.737442016601562, "global_step": 146791, "epoch": 873} {"train_loss": -10.728728294372559, "global_step": 146792, "epoch": 873} {"train_loss": -10.876236915588379, "global_step": 146793, "epoch": 873} {"train_loss": -10.840841293334961, "global_step": 146794, "epoch": 873} {"train_loss": -10.73915958404541, "global_step": 146795, "epoch": 873} {"train_loss": -10.765145301818848, "global_step": 146796, "epoch": 873} {"train_loss": -10.668861389160156, "global_step": 146797, "epoch": 873} {"train_loss": -10.61050033569336, "global_step": 146798, "epoch": 873} {"train_loss": -10.556407928466797, "global_step": 146799, "epoch": 873} {"train_loss": -10.419842720031738, "global_step": 146800, "epoch": 873} {"train_loss": -10.13633918762207, "global_step": 146801, "epoch": 873} {"train_loss": -10.513339042663574, "global_step": 146802, "epoch": 873} {"train_loss": -10.316645622253418, "global_step": 146803, "epoch": 873} {"train_loss": -10.224395751953125, "global_step": 146804, "epoch": 873} {"train_loss": -10.689838409423828, "global_step": 146805, "epoch": 873} {"train_loss": -9.75207233428955, "global_step": 146806, "epoch": 873} {"train_loss": -9.98843002319336, "global_step": 146807, "epoch": 873} {"train_loss": -9.748062133789062, "global_step": 146808, "epoch": 873} {"train_loss": -9.721009254455566, "global_step": 146809, "epoch": 873} {"train_loss": -10.417003631591797, "global_step": 146810, "epoch": 873} {"train_loss": -10.000299453735352, "global_step": 146811, "epoch": 873} {"train_loss": -10.087457656860352, "global_step": 146812, "epoch": 873} {"train_loss": -9.833980560302734, "global_step": 146813, "epoch": 873} {"train_loss": -10.142047882080078, "global_step": 146814, "epoch": 873} {"train_loss": -10.524349212646484, "global_step": 146815, "epoch": 873} {"train_loss": -9.685267448425293, "global_step": 146816, "epoch": 873} {"train_loss": -10.452936172485352, "global_step": 146817, "epoch": 873} {"train_loss": -10.259937286376953, "global_step": 146818, "epoch": 873} {"train_loss": -9.806720733642578, "global_step": 146819, "epoch": 873} {"train_loss": -10.628584861755371, "global_step": 146820, "epoch": 873} {"train_loss": -9.922454833984375, "global_step": 146821, "epoch": 873} {"train_loss": -10.680488586425781, "global_step": 146822, "epoch": 873} {"train_loss": -10.515199661254883, "global_step": 146823, "epoch": 873} {"train_loss": -10.168858528137207, "global_step": 146824, "epoch": 873} {"train_loss": -10.667896270751953, "global_step": 146825, "epoch": 873} {"train_loss": -10.389318466186523, "global_step": 146826, "epoch": 873} {"train_loss": -10.49767017364502, "global_step": 146827, "epoch": 873} {"train_loss": -10.72119140625, "global_step": 146828, "epoch": 873} {"train_loss": -10.566125869750977, "global_step": 146829, "epoch": 873} {"train_loss": -10.458364486694336, "global_step": 146830, "epoch": 873} {"train_loss": -10.564051054772877, "global_step": 146831, "epoch": 873, "val_loss": 229440.78125} {"train_loss": -10.297260284423828, "global_step": 146832, "epoch": 874} {"train_loss": -10.553802490234375, "global_step": 146833, "epoch": 874} {"train_loss": -10.63671875, "global_step": 146834, "epoch": 874} {"train_loss": -10.556262969970703, "global_step": 146835, "epoch": 874} {"train_loss": -10.334839820861816, "global_step": 146836, "epoch": 874} {"train_loss": -10.379674911499023, "global_step": 146837, "epoch": 874} {"train_loss": -10.431112289428711, "global_step": 146838, "epoch": 874} {"train_loss": -10.608421325683594, "global_step": 146839, "epoch": 874} {"train_loss": -10.666805267333984, "global_step": 146840, "epoch": 874} {"train_loss": -10.6563138961792, "global_step": 146841, "epoch": 874} {"train_loss": -10.554054260253906, "global_step": 146842, "epoch": 874} {"train_loss": -10.760588645935059, "global_step": 146843, "epoch": 874} {"train_loss": -10.56883716583252, "global_step": 146844, "epoch": 874} {"train_loss": -10.899131774902344, "global_step": 146845, "epoch": 874} {"train_loss": -10.729629516601562, "global_step": 146846, "epoch": 874} {"train_loss": -10.821316719055176, "global_step": 146847, "epoch": 874} {"train_loss": -10.702159881591797, "global_step": 146848, "epoch": 874} {"train_loss": -10.782205581665039, "global_step": 146849, "epoch": 874} {"train_loss": -10.796113967895508, "global_step": 146850, "epoch": 874} {"train_loss": -10.712320327758789, "global_step": 146851, "epoch": 874} {"train_loss": -10.629111289978027, "global_step": 146852, "epoch": 874} {"train_loss": -10.682196617126465, "global_step": 146853, "epoch": 874} {"train_loss": -10.382720947265625, "global_step": 146854, "epoch": 874} {"train_loss": -10.970250129699707, "global_step": 146855, "epoch": 874} {"train_loss": -10.475119590759277, "global_step": 146856, "epoch": 874} {"train_loss": -10.73551082611084, "global_step": 146857, "epoch": 874} {"train_loss": -10.537140846252441, "global_step": 146858, "epoch": 874} {"train_loss": -11.031129837036133, "global_step": 146859, "epoch": 874} {"train_loss": -10.212766647338867, "global_step": 146860, "epoch": 874} {"train_loss": -10.955732345581055, "global_step": 146861, "epoch": 874} {"train_loss": -10.323616027832031, "global_step": 146862, "epoch": 874} {"train_loss": -10.760958671569824, "global_step": 146863, "epoch": 874} {"train_loss": -10.465604782104492, "global_step": 146864, "epoch": 874} {"train_loss": -10.835701942443848, "global_step": 146865, "epoch": 874} {"train_loss": -10.805553436279297, "global_step": 146866, "epoch": 874} {"train_loss": -10.788171768188477, "global_step": 146867, "epoch": 874} {"train_loss": -10.509153366088867, "global_step": 146868, "epoch": 874} {"train_loss": -10.574663162231445, "global_step": 146869, "epoch": 874} {"train_loss": -10.540756225585938, "global_step": 146870, "epoch": 874} {"train_loss": -10.84187126159668, "global_step": 146871, "epoch": 874} {"train_loss": -10.291439056396484, "global_step": 146872, "epoch": 874} {"train_loss": -10.404716491699219, "global_step": 146873, "epoch": 874} {"train_loss": -10.458492279052734, "global_step": 146874, "epoch": 874} {"train_loss": -10.67698860168457, "global_step": 146875, "epoch": 874} {"train_loss": -10.10799789428711, "global_step": 146876, "epoch": 874} {"train_loss": -10.77031135559082, "global_step": 146877, "epoch": 874} {"train_loss": -10.376497268676758, "global_step": 146878, "epoch": 874} {"train_loss": -10.604856491088867, "global_step": 146879, "epoch": 874} {"train_loss": -10.564752578735352, "global_step": 146880, "epoch": 874} {"train_loss": -10.422454833984375, "global_step": 146881, "epoch": 874} {"train_loss": -10.758278846740723, "global_step": 146882, "epoch": 874} {"train_loss": -10.69382381439209, "global_step": 146883, "epoch": 874} {"train_loss": -10.477409362792969, "global_step": 146884, "epoch": 874} {"train_loss": -10.60215950012207, "global_step": 146885, "epoch": 874} {"train_loss": -10.414125442504883, "global_step": 146886, "epoch": 874} {"train_loss": -10.627019882202148, "global_step": 146887, "epoch": 874} {"train_loss": -10.747745513916016, "global_step": 146888, "epoch": 874} {"train_loss": -10.782478332519531, "global_step": 146889, "epoch": 874} {"train_loss": -10.682108879089355, "global_step": 146890, "epoch": 874} {"train_loss": -10.386968612670898, "global_step": 146891, "epoch": 874} {"train_loss": -10.451520919799805, "global_step": 146892, "epoch": 874} {"train_loss": -10.648069381713867, "global_step": 146893, "epoch": 874} {"train_loss": -10.82075309753418, "global_step": 146894, "epoch": 874} {"train_loss": -10.697834014892578, "global_step": 146895, "epoch": 874} {"train_loss": -10.543571472167969, "global_step": 146896, "epoch": 874} {"train_loss": -10.269027709960938, "global_step": 146897, "epoch": 874} {"train_loss": -10.890661239624023, "global_step": 146898, "epoch": 874} {"train_loss": -10.595626831054688, "global_step": 146899, "epoch": 874} {"train_loss": -10.677663803100586, "global_step": 146900, "epoch": 874} {"train_loss": -10.712570190429688, "global_step": 146901, "epoch": 874} {"train_loss": -10.453666687011719, "global_step": 146902, "epoch": 874} {"train_loss": -10.758325576782227, "global_step": 146903, "epoch": 874} {"train_loss": -10.706788063049316, "global_step": 146904, "epoch": 874} {"train_loss": -10.746368408203125, "global_step": 146905, "epoch": 874} {"train_loss": -10.666426658630371, "global_step": 146906, "epoch": 874} {"train_loss": -10.868220329284668, "global_step": 146907, "epoch": 874} {"train_loss": -10.580541610717773, "global_step": 146908, "epoch": 874} {"train_loss": -10.164015769958496, "global_step": 146909, "epoch": 874} {"train_loss": -10.747176170349121, "global_step": 146910, "epoch": 874} {"train_loss": -10.040376663208008, "global_step": 146911, "epoch": 874} {"train_loss": -10.62016773223877, "global_step": 146912, "epoch": 874} {"train_loss": -10.365242004394531, "global_step": 146913, "epoch": 874} {"train_loss": -10.272529602050781, "global_step": 146914, "epoch": 874} {"train_loss": -10.434066772460938, "global_step": 146915, "epoch": 874} {"train_loss": -10.137350082397461, "global_step": 146916, "epoch": 874} {"train_loss": -10.64749526977539, "global_step": 146917, "epoch": 874} {"train_loss": -10.15674877166748, "global_step": 146918, "epoch": 874} {"train_loss": -10.409826278686523, "global_step": 146919, "epoch": 874} {"train_loss": -10.63328742980957, "global_step": 146920, "epoch": 874} {"train_loss": -10.203315734863281, "global_step": 146921, "epoch": 874} {"train_loss": -10.441638946533203, "global_step": 146922, "epoch": 874} {"train_loss": -10.307823181152344, "global_step": 146923, "epoch": 874} {"train_loss": -10.421646118164062, "global_step": 146924, "epoch": 874} {"train_loss": -10.577885627746582, "global_step": 146925, "epoch": 874} {"train_loss": -10.523189544677734, "global_step": 146926, "epoch": 874} {"train_loss": -10.588517189025879, "global_step": 146927, "epoch": 874} {"train_loss": -10.420305252075195, "global_step": 146928, "epoch": 874} {"train_loss": -10.476461410522461, "global_step": 146929, "epoch": 874} {"train_loss": -10.671489715576172, "global_step": 146930, "epoch": 874} {"train_loss": -10.534601211547852, "global_step": 146931, "epoch": 874} {"train_loss": -10.690408706665039, "global_step": 146932, "epoch": 874} {"train_loss": -10.611781120300293, "global_step": 146933, "epoch": 874} {"train_loss": -10.675827026367188, "global_step": 146934, "epoch": 874} {"train_loss": -10.746254920959473, "global_step": 146935, "epoch": 874} {"train_loss": -10.806326866149902, "global_step": 146936, "epoch": 874} {"train_loss": -10.663839340209961, "global_step": 146937, "epoch": 874} {"train_loss": -10.690232276916504, "global_step": 146938, "epoch": 874} {"train_loss": -10.666360855102539, "global_step": 146939, "epoch": 874} {"train_loss": -10.792150497436523, "global_step": 146940, "epoch": 874} {"train_loss": -10.693546295166016, "global_step": 146941, "epoch": 874} {"train_loss": -10.717016220092773, "global_step": 146942, "epoch": 874} {"train_loss": -10.725846290588379, "global_step": 146943, "epoch": 874} {"train_loss": -10.740922927856445, "global_step": 146944, "epoch": 874} {"train_loss": -10.515083312988281, "global_step": 146945, "epoch": 874} {"train_loss": -10.765254974365234, "global_step": 146946, "epoch": 874} {"train_loss": -10.33177375793457, "global_step": 146947, "epoch": 874} {"train_loss": -10.885554313659668, "global_step": 146948, "epoch": 874} {"train_loss": -10.715539932250977, "global_step": 146949, "epoch": 874} {"train_loss": -10.877300262451172, "global_step": 146950, "epoch": 874} {"train_loss": -10.625677108764648, "global_step": 146951, "epoch": 874} {"train_loss": -10.337215423583984, "global_step": 146952, "epoch": 874} {"train_loss": -10.728784561157227, "global_step": 146953, "epoch": 874} {"train_loss": -10.82103443145752, "global_step": 146954, "epoch": 874} {"train_loss": -10.601177215576172, "global_step": 146955, "epoch": 874} {"train_loss": -10.809486389160156, "global_step": 146956, "epoch": 874} {"train_loss": -10.662639617919922, "global_step": 146957, "epoch": 874} {"train_loss": -10.8145112991333, "global_step": 146958, "epoch": 874} {"train_loss": -10.889928817749023, "global_step": 146959, "epoch": 874} {"train_loss": -10.468181610107422, "global_step": 146960, "epoch": 874} {"train_loss": -10.797782897949219, "global_step": 146961, "epoch": 874} {"train_loss": -10.699636459350586, "global_step": 146962, "epoch": 874} {"train_loss": -10.482047080993652, "global_step": 146963, "epoch": 874} {"train_loss": -10.980501174926758, "global_step": 146964, "epoch": 874} {"train_loss": -10.787464141845703, "global_step": 146965, "epoch": 874} {"train_loss": -10.935646057128906, "global_step": 146966, "epoch": 874} {"train_loss": -10.679497718811035, "global_step": 146967, "epoch": 874} {"train_loss": -11.039205551147461, "global_step": 146968, "epoch": 874} {"train_loss": -10.791717529296875, "global_step": 146969, "epoch": 874} {"train_loss": -10.82331657409668, "global_step": 146970, "epoch": 874} {"train_loss": -10.823020935058594, "global_step": 146971, "epoch": 874} {"train_loss": -10.836345672607422, "global_step": 146972, "epoch": 874} {"train_loss": -10.903632164001465, "global_step": 146973, "epoch": 874} {"train_loss": -10.645323753356934, "global_step": 146974, "epoch": 874} {"train_loss": -10.472112655639648, "global_step": 146975, "epoch": 874} {"train_loss": -10.859699249267578, "global_step": 146976, "epoch": 874} {"train_loss": -10.887096405029297, "global_step": 146977, "epoch": 874} {"train_loss": -10.931510925292969, "global_step": 146978, "epoch": 874} {"train_loss": -10.858030319213867, "global_step": 146979, "epoch": 874} {"train_loss": -10.899426460266113, "global_step": 146980, "epoch": 874} {"train_loss": -10.822750091552734, "global_step": 146981, "epoch": 874} {"train_loss": -10.757612228393555, "global_step": 146982, "epoch": 874} {"train_loss": -10.816883087158203, "global_step": 146983, "epoch": 874} {"train_loss": -10.797250747680664, "global_step": 146984, "epoch": 874} {"train_loss": -10.482561111450195, "global_step": 146985, "epoch": 874} {"train_loss": -10.776204109191895, "global_step": 146986, "epoch": 874} {"train_loss": -10.767754554748535, "global_step": 146987, "epoch": 874} {"train_loss": -10.913074493408203, "global_step": 146988, "epoch": 874} {"train_loss": -10.88379955291748, "global_step": 146989, "epoch": 874} {"train_loss": -10.911218643188477, "global_step": 146990, "epoch": 874} {"train_loss": -10.822864532470703, "global_step": 146991, "epoch": 874} {"train_loss": -10.880772590637207, "global_step": 146992, "epoch": 874} {"train_loss": -10.71051025390625, "global_step": 146993, "epoch": 874} {"train_loss": -11.107735633850098, "global_step": 146994, "epoch": 874} {"train_loss": -10.865427017211914, "global_step": 146995, "epoch": 874} {"train_loss": -11.104578018188477, "global_step": 146996, "epoch": 874} {"train_loss": -10.766508102416992, "global_step": 146997, "epoch": 874} {"train_loss": -10.723382949829102, "global_step": 146998, "epoch": 874} {"train_loss": -10.649485037440346, "global_step": 146999, "epoch": 874, "val_loss": 229015.203125} {"train_loss": -10.853509902954102, "global_step": 147000, "epoch": 875} {"train_loss": -11.02599811553955, "global_step": 147001, "epoch": 875} {"train_loss": -10.736723899841309, "global_step": 147002, "epoch": 875} {"train_loss": -10.729702949523926, "global_step": 147003, "epoch": 875} {"train_loss": -11.016932487487793, "global_step": 147004, "epoch": 875} {"train_loss": -10.636556625366211, "global_step": 147005, "epoch": 875} {"train_loss": -10.518810272216797, "global_step": 147006, "epoch": 875} {"train_loss": -10.756651878356934, "global_step": 147007, "epoch": 875} {"train_loss": -10.645075798034668, "global_step": 147008, "epoch": 875} {"train_loss": -10.592292785644531, "global_step": 147009, "epoch": 875} {"train_loss": -10.608635902404785, "global_step": 147010, "epoch": 875} {"train_loss": -11.01006031036377, "global_step": 147011, "epoch": 875} {"train_loss": -10.587841987609863, "global_step": 147012, "epoch": 875} {"train_loss": -10.916377067565918, "global_step": 147013, "epoch": 875} {"train_loss": -10.884721755981445, "global_step": 147014, "epoch": 875} {"train_loss": -10.574895858764648, "global_step": 147015, "epoch": 875} {"train_loss": -10.430741310119629, "global_step": 147016, "epoch": 875} {"train_loss": -10.36555004119873, "global_step": 147017, "epoch": 875} {"train_loss": -10.594686508178711, "global_step": 147018, "epoch": 875} {"train_loss": -10.842817306518555, "global_step": 147019, "epoch": 875} {"train_loss": -9.915498733520508, "global_step": 147020, "epoch": 875} {"train_loss": -10.442537307739258, "global_step": 147021, "epoch": 875} {"train_loss": -10.682000160217285, "global_step": 147022, "epoch": 875} {"train_loss": -10.651899337768555, "global_step": 147023, "epoch": 875} {"train_loss": -10.726284980773926, "global_step": 147024, "epoch": 875} {"train_loss": -10.794111251831055, "global_step": 147025, "epoch": 875} {"train_loss": -10.661345481872559, "global_step": 147026, "epoch": 875} {"train_loss": -10.860982894897461, "global_step": 147027, "epoch": 875} {"train_loss": -10.568205833435059, "global_step": 147028, "epoch": 875} {"train_loss": -10.858449935913086, "global_step": 147029, "epoch": 875} {"train_loss": -10.772806167602539, "global_step": 147030, "epoch": 875} {"train_loss": -10.21752643585205, "global_step": 147031, "epoch": 875} {"train_loss": -10.773128509521484, "global_step": 147032, "epoch": 875} {"train_loss": -10.404452323913574, "global_step": 147033, "epoch": 875} {"train_loss": -10.401850700378418, "global_step": 147034, "epoch": 875} {"train_loss": -10.349193572998047, "global_step": 147035, "epoch": 875} {"train_loss": -10.790958404541016, "global_step": 147036, "epoch": 875} {"train_loss": -10.551603317260742, "global_step": 147037, "epoch": 875} {"train_loss": -10.357027053833008, "global_step": 147038, "epoch": 875} {"train_loss": -10.676790237426758, "global_step": 147039, "epoch": 875} {"train_loss": -10.386423110961914, "global_step": 147040, "epoch": 875} {"train_loss": -10.729608535766602, "global_step": 147041, "epoch": 875} {"train_loss": -10.259902000427246, "global_step": 147042, "epoch": 875} {"train_loss": -10.599761009216309, "global_step": 147043, "epoch": 875} {"train_loss": -10.730112075805664, "global_step": 147044, "epoch": 875} {"train_loss": -10.359865188598633, "global_step": 147045, "epoch": 875} {"train_loss": -10.809898376464844, "global_step": 147046, "epoch": 875} {"train_loss": -10.822696685791016, "global_step": 147047, "epoch": 875} {"train_loss": -10.681478500366211, "global_step": 147048, "epoch": 875} {"train_loss": -10.745129585266113, "global_step": 147049, "epoch": 875} {"train_loss": -10.560750007629395, "global_step": 147050, "epoch": 875} {"train_loss": -10.590038299560547, "global_step": 147051, "epoch": 875} {"train_loss": -10.634187698364258, "global_step": 147052, "epoch": 875} {"train_loss": -10.823307037353516, "global_step": 147053, "epoch": 875} {"train_loss": -10.778017044067383, "global_step": 147054, "epoch": 875} {"train_loss": -10.559541702270508, "global_step": 147055, "epoch": 875} {"train_loss": -10.764808654785156, "global_step": 147056, "epoch": 875} {"train_loss": -10.544706344604492, "global_step": 147057, "epoch": 875} {"train_loss": -10.774088859558105, "global_step": 147058, "epoch": 875} {"train_loss": -10.758504867553711, "global_step": 147059, "epoch": 875} {"train_loss": -10.804478645324707, "global_step": 147060, "epoch": 875} {"train_loss": -10.739036560058594, "global_step": 147061, "epoch": 875} {"train_loss": -10.846807479858398, "global_step": 147062, "epoch": 875} {"train_loss": -10.781518936157227, "global_step": 147063, "epoch": 875} {"train_loss": -10.890592575073242, "global_step": 147064, "epoch": 875} {"train_loss": -10.979377746582031, "global_step": 147065, "epoch": 875} {"train_loss": -10.580642700195312, "global_step": 147066, "epoch": 875} {"train_loss": -10.680235862731934, "global_step": 147067, "epoch": 875} {"train_loss": -10.30993938446045, "global_step": 147068, "epoch": 875} {"train_loss": -10.21330451965332, "global_step": 147069, "epoch": 875} {"train_loss": -10.748827934265137, "global_step": 147070, "epoch": 875} {"train_loss": -10.256696701049805, "global_step": 147071, "epoch": 875} {"train_loss": -10.786638259887695, "global_step": 147072, "epoch": 875} {"train_loss": -10.44087028503418, "global_step": 147073, "epoch": 875} {"train_loss": -10.331550598144531, "global_step": 147074, "epoch": 875} {"train_loss": -11.003650665283203, "global_step": 147075, "epoch": 875} {"train_loss": -10.754390716552734, "global_step": 147076, "epoch": 875} {"train_loss": -10.685982704162598, "global_step": 147077, "epoch": 875} {"train_loss": -10.961406707763672, "global_step": 147078, "epoch": 875} {"train_loss": -10.785255432128906, "global_step": 147079, "epoch": 875} {"train_loss": -10.699474334716797, "global_step": 147080, "epoch": 875} {"train_loss": -10.979948997497559, "global_step": 147081, "epoch": 875} {"train_loss": -10.801130294799805, "global_step": 147082, "epoch": 875} {"train_loss": -10.512968063354492, "global_step": 147083, "epoch": 875} {"train_loss": -10.797481536865234, "global_step": 147084, "epoch": 875} {"train_loss": -10.62542724609375, "global_step": 147085, "epoch": 875} {"train_loss": -10.490324020385742, "global_step": 147086, "epoch": 875} {"train_loss": -9.970780372619629, "global_step": 147087, "epoch": 875} {"train_loss": -10.595571517944336, "global_step": 147088, "epoch": 875} {"train_loss": -10.686162948608398, "global_step": 147089, "epoch": 875} {"train_loss": -10.4717435836792, "global_step": 147090, "epoch": 875} {"train_loss": -10.78555679321289, "global_step": 147091, "epoch": 875} {"train_loss": -10.562908172607422, "global_step": 147092, "epoch": 875} {"train_loss": -10.840662956237793, "global_step": 147093, "epoch": 875} {"train_loss": -10.688477516174316, "global_step": 147094, "epoch": 875} {"train_loss": -10.573227882385254, "global_step": 147095, "epoch": 875} {"train_loss": -10.744833946228027, "global_step": 147096, "epoch": 875} {"train_loss": -10.685382843017578, "global_step": 147097, "epoch": 875} {"train_loss": -10.815760612487793, "global_step": 147098, "epoch": 875} {"train_loss": -10.700733184814453, "global_step": 147099, "epoch": 875} {"train_loss": -10.92215347290039, "global_step": 147100, "epoch": 875} {"train_loss": -10.660848617553711, "global_step": 147101, "epoch": 875} {"train_loss": -10.75185775756836, "global_step": 147102, "epoch": 875} {"train_loss": -10.443815231323242, "global_step": 147103, "epoch": 875} {"train_loss": -10.757299423217773, "global_step": 147104, "epoch": 875} {"train_loss": -10.815929412841797, "global_step": 147105, "epoch": 875} {"train_loss": -10.731250762939453, "global_step": 147106, "epoch": 875} {"train_loss": -10.851224899291992, "global_step": 147107, "epoch": 875} {"train_loss": -10.840843200683594, "global_step": 147108, "epoch": 875} {"train_loss": -10.68697452545166, "global_step": 147109, "epoch": 875} {"train_loss": -10.594326972961426, "global_step": 147110, "epoch": 875} {"train_loss": -10.80810546875, "global_step": 147111, "epoch": 875} {"train_loss": -10.841812133789062, "global_step": 147112, "epoch": 875} {"train_loss": -10.427438735961914, "global_step": 147113, "epoch": 875} {"train_loss": -10.704496383666992, "global_step": 147114, "epoch": 875} {"train_loss": -10.872594833374023, "global_step": 147115, "epoch": 875} {"train_loss": -10.420330047607422, "global_step": 147116, "epoch": 875} {"train_loss": -10.83161735534668, "global_step": 147117, "epoch": 875} {"train_loss": -10.53385066986084, "global_step": 147118, "epoch": 875} {"train_loss": -10.943475723266602, "global_step": 147119, "epoch": 875} {"train_loss": -10.906816482543945, "global_step": 147120, "epoch": 875} {"train_loss": -10.683536529541016, "global_step": 147121, "epoch": 875} {"train_loss": -10.668974876403809, "global_step": 147122, "epoch": 875} {"train_loss": -10.316214561462402, "global_step": 147123, "epoch": 875} {"train_loss": -10.637392044067383, "global_step": 147124, "epoch": 875} {"train_loss": -10.473226547241211, "global_step": 147125, "epoch": 875} {"train_loss": -10.740765571594238, "global_step": 147126, "epoch": 875} {"train_loss": -9.949674606323242, "global_step": 147127, "epoch": 875} {"train_loss": -10.6256103515625, "global_step": 147128, "epoch": 875} {"train_loss": -10.415295600891113, "global_step": 147129, "epoch": 875} {"train_loss": -10.043477058410645, "global_step": 147130, "epoch": 875} {"train_loss": -10.525872230529785, "global_step": 147131, "epoch": 875} {"train_loss": -9.77370834350586, "global_step": 147132, "epoch": 875} {"train_loss": -9.898680686950684, "global_step": 147133, "epoch": 875} {"train_loss": -10.523317337036133, "global_step": 147134, "epoch": 875} {"train_loss": -10.025257110595703, "global_step": 147135, "epoch": 875} {"train_loss": -10.242642402648926, "global_step": 147136, "epoch": 875} {"train_loss": -9.467599868774414, "global_step": 147137, "epoch": 875} {"train_loss": -10.299662590026855, "global_step": 147138, "epoch": 875} {"train_loss": -10.42027473449707, "global_step": 147139, "epoch": 875} {"train_loss": -10.440905570983887, "global_step": 147140, "epoch": 875} {"train_loss": -10.807226181030273, "global_step": 147141, "epoch": 875} {"train_loss": -10.512474060058594, "global_step": 147142, "epoch": 875} {"train_loss": -10.324261665344238, "global_step": 147143, "epoch": 875} {"train_loss": -10.253003120422363, "global_step": 147144, "epoch": 875} {"train_loss": -10.622148513793945, "global_step": 147145, "epoch": 875} {"train_loss": -10.465544700622559, "global_step": 147146, "epoch": 875} {"train_loss": -10.63320541381836, "global_step": 147147, "epoch": 875} {"train_loss": -10.747293472290039, "global_step": 147148, "epoch": 875} {"train_loss": -10.515299797058105, "global_step": 147149, "epoch": 875} {"train_loss": -10.668743133544922, "global_step": 147150, "epoch": 875} {"train_loss": -10.506539344787598, "global_step": 147151, "epoch": 875} {"train_loss": -10.378721237182617, "global_step": 147152, "epoch": 875} {"train_loss": -10.528779983520508, "global_step": 147153, "epoch": 875} {"train_loss": -10.463489532470703, "global_step": 147154, "epoch": 875} {"train_loss": -10.787727355957031, "global_step": 147155, "epoch": 875} {"train_loss": -10.399005889892578, "global_step": 147156, "epoch": 875} {"train_loss": -10.788843154907227, "global_step": 147157, "epoch": 875} {"train_loss": -10.447105407714844, "global_step": 147158, "epoch": 875} {"train_loss": -10.75510311126709, "global_step": 147159, "epoch": 875} {"train_loss": -10.364843368530273, "global_step": 147160, "epoch": 875} {"train_loss": -10.541862487792969, "global_step": 147161, "epoch": 875} {"train_loss": -10.419017791748047, "global_step": 147162, "epoch": 875} {"train_loss": -10.564332008361816, "global_step": 147163, "epoch": 875} {"train_loss": -10.500597953796387, "global_step": 147164, "epoch": 875} {"train_loss": -10.212440490722656, "global_step": 147165, "epoch": 875} {"train_loss": -10.466019630432129, "global_step": 147166, "epoch": 875} {"train_loss": -10.601326550756182, "global_step": 147167, "epoch": 875, "val_loss": 228640.28125, "train_action_mse_error": 0.8148704171180725} {"train_loss": -10.460953712463379, "global_step": 147168, "epoch": 876} {"train_loss": -9.947800636291504, "global_step": 147169, "epoch": 876} {"train_loss": -10.552303314208984, "global_step": 147170, "epoch": 876} {"train_loss": -9.810015678405762, "global_step": 147171, "epoch": 876} {"train_loss": -10.415040969848633, "global_step": 147172, "epoch": 876} {"train_loss": -10.287282943725586, "global_step": 147173, "epoch": 876} {"train_loss": -10.168160438537598, "global_step": 147174, "epoch": 876} {"train_loss": -10.502218246459961, "global_step": 147175, "epoch": 876} {"train_loss": -10.096851348876953, "global_step": 147176, "epoch": 876} {"train_loss": -10.499813079833984, "global_step": 147177, "epoch": 876} {"train_loss": -10.149364471435547, "global_step": 147178, "epoch": 876} {"train_loss": -10.419816970825195, "global_step": 147179, "epoch": 876} {"train_loss": -10.505186080932617, "global_step": 147180, "epoch": 876} {"train_loss": -10.21786117553711, "global_step": 147181, "epoch": 876} {"train_loss": -10.546577453613281, "global_step": 147182, "epoch": 876} {"train_loss": -10.263171195983887, "global_step": 147183, "epoch": 876} {"train_loss": -10.592438697814941, "global_step": 147184, "epoch": 876} {"train_loss": -10.61341381072998, "global_step": 147185, "epoch": 876} {"train_loss": -10.659856796264648, "global_step": 147186, "epoch": 876} {"train_loss": -10.871283531188965, "global_step": 147187, "epoch": 876} {"train_loss": -10.73141860961914, "global_step": 147188, "epoch": 876} {"train_loss": -10.79281234741211, "global_step": 147189, "epoch": 876} {"train_loss": -10.726284980773926, "global_step": 147190, "epoch": 876} {"train_loss": -10.805603981018066, "global_step": 147191, "epoch": 876} {"train_loss": -10.976936340332031, "global_step": 147192, "epoch": 876} {"train_loss": -10.734197616577148, "global_step": 147193, "epoch": 876} {"train_loss": -10.911917686462402, "global_step": 147194, "epoch": 876} {"train_loss": -10.927124977111816, "global_step": 147195, "epoch": 876} {"train_loss": -10.81254768371582, "global_step": 147196, "epoch": 876} {"train_loss": -10.944392204284668, "global_step": 147197, "epoch": 876} {"train_loss": -10.96365737915039, "global_step": 147198, "epoch": 876} {"train_loss": -10.828598976135254, "global_step": 147199, "epoch": 876} {"train_loss": -10.993310928344727, "global_step": 147200, "epoch": 876} {"train_loss": -10.951188087463379, "global_step": 147201, "epoch": 876} {"train_loss": -11.220354080200195, "global_step": 147202, "epoch": 876} {"train_loss": -10.832719802856445, "global_step": 147203, "epoch": 876} {"train_loss": -10.993046760559082, "global_step": 147204, "epoch": 876} {"train_loss": -11.049285888671875, "global_step": 147205, "epoch": 876} {"train_loss": -11.13494873046875, "global_step": 147206, "epoch": 876} {"train_loss": -10.799934387207031, "global_step": 147207, "epoch": 876} {"train_loss": -11.204564094543457, "global_step": 147208, "epoch": 876} {"train_loss": -10.843719482421875, "global_step": 147209, "epoch": 876} {"train_loss": -10.889092445373535, "global_step": 147210, "epoch": 876} {"train_loss": -10.934032440185547, "global_step": 147211, "epoch": 876} {"train_loss": -10.98324203491211, "global_step": 147212, "epoch": 876} {"train_loss": -11.076047897338867, "global_step": 147213, "epoch": 876} {"train_loss": -10.967742919921875, "global_step": 147214, "epoch": 876} {"train_loss": -10.988523483276367, "global_step": 147215, "epoch": 876} {"train_loss": -10.994401931762695, "global_step": 147216, "epoch": 876} {"train_loss": -11.08247184753418, "global_step": 147217, "epoch": 876} {"train_loss": -10.825492858886719, "global_step": 147218, "epoch": 876} {"train_loss": -11.196636199951172, "global_step": 147219, "epoch": 876} {"train_loss": -10.943469047546387, "global_step": 147220, "epoch": 876} {"train_loss": -10.85478401184082, "global_step": 147221, "epoch": 876} {"train_loss": -10.625019073486328, "global_step": 147222, "epoch": 876} {"train_loss": -10.798131942749023, "global_step": 147223, "epoch": 876} {"train_loss": -10.6350736618042, "global_step": 147224, "epoch": 876} {"train_loss": -10.96363639831543, "global_step": 147225, "epoch": 876} {"train_loss": -10.51760482788086, "global_step": 147226, "epoch": 876} {"train_loss": -9.87804889678955, "global_step": 147227, "epoch": 876} {"train_loss": -10.902064323425293, "global_step": 147228, "epoch": 876} {"train_loss": -10.567659378051758, "global_step": 147229, "epoch": 876} {"train_loss": -10.609162330627441, "global_step": 147230, "epoch": 876} {"train_loss": -10.51183032989502, "global_step": 147231, "epoch": 876} {"train_loss": -11.012396812438965, "global_step": 147232, "epoch": 876} {"train_loss": -10.533673286437988, "global_step": 147233, "epoch": 876} {"train_loss": -10.506856918334961, "global_step": 147234, "epoch": 876} {"train_loss": -10.757627487182617, "global_step": 147235, "epoch": 876} {"train_loss": -10.80363941192627, "global_step": 147236, "epoch": 876} {"train_loss": -9.319053649902344, "global_step": 147237, "epoch": 876} {"train_loss": -10.226173400878906, "global_step": 147238, "epoch": 876} {"train_loss": -10.526962280273438, "global_step": 147239, "epoch": 876} {"train_loss": -8.886625289916992, "global_step": 147240, "epoch": 876} {"train_loss": -10.452823638916016, "global_step": 147241, "epoch": 876} {"train_loss": -9.83323860168457, "global_step": 147242, "epoch": 876} {"train_loss": -8.899173736572266, "global_step": 147243, "epoch": 876} {"train_loss": -9.530179977416992, "global_step": 147244, "epoch": 876} {"train_loss": -9.199520111083984, "global_step": 147245, "epoch": 876} {"train_loss": -10.398263931274414, "global_step": 147246, "epoch": 876} {"train_loss": -9.199821472167969, "global_step": 147247, "epoch": 876} {"train_loss": -10.285937309265137, "global_step": 147248, "epoch": 876} {"train_loss": -8.892192840576172, "global_step": 147249, "epoch": 876} {"train_loss": -10.387511253356934, "global_step": 147250, "epoch": 876} {"train_loss": -9.500228881835938, "global_step": 147251, "epoch": 876} {"train_loss": -9.967409133911133, "global_step": 147252, "epoch": 876} {"train_loss": -9.408639907836914, "global_step": 147253, "epoch": 876} {"train_loss": -9.594724655151367, "global_step": 147254, "epoch": 876} {"train_loss": -9.677019119262695, "global_step": 147255, "epoch": 876} {"train_loss": -9.81492805480957, "global_step": 147256, "epoch": 876} {"train_loss": -9.95501708984375, "global_step": 147257, "epoch": 876} {"train_loss": -10.363938331604004, "global_step": 147258, "epoch": 876} {"train_loss": -9.880685806274414, "global_step": 147259, "epoch": 876} {"train_loss": -10.102161407470703, "global_step": 147260, "epoch": 876} {"train_loss": -9.945520401000977, "global_step": 147261, "epoch": 876} {"train_loss": -10.36118221282959, "global_step": 147262, "epoch": 876} {"train_loss": -10.110857009887695, "global_step": 147263, "epoch": 876} {"train_loss": -10.093746185302734, "global_step": 147264, "epoch": 876} {"train_loss": -10.338844299316406, "global_step": 147265, "epoch": 876} {"train_loss": -10.172388076782227, "global_step": 147266, "epoch": 876} {"train_loss": -10.258810043334961, "global_step": 147267, "epoch": 876} {"train_loss": -10.094435691833496, "global_step": 147268, "epoch": 876} {"train_loss": -10.37558650970459, "global_step": 147269, "epoch": 876} {"train_loss": -10.304651260375977, "global_step": 147270, "epoch": 876} {"train_loss": -10.102343559265137, "global_step": 147271, "epoch": 876} {"train_loss": -10.525802612304688, "global_step": 147272, "epoch": 876} {"train_loss": -10.446377754211426, "global_step": 147273, "epoch": 876} {"train_loss": -10.33352279663086, "global_step": 147274, "epoch": 876} {"train_loss": -10.56788444519043, "global_step": 147275, "epoch": 876} {"train_loss": -10.459016799926758, "global_step": 147276, "epoch": 876} {"train_loss": -10.403322219848633, "global_step": 147277, "epoch": 876} {"train_loss": -10.428442001342773, "global_step": 147278, "epoch": 876} {"train_loss": -10.389823913574219, "global_step": 147279, "epoch": 876} {"train_loss": -10.498422622680664, "global_step": 147280, "epoch": 876} {"train_loss": -10.328810691833496, "global_step": 147281, "epoch": 876} {"train_loss": -10.408089637756348, "global_step": 147282, "epoch": 876} {"train_loss": -10.657480239868164, "global_step": 147283, "epoch": 876} {"train_loss": -10.352239608764648, "global_step": 147284, "epoch": 876} {"train_loss": -10.576292991638184, "global_step": 147285, "epoch": 876} {"train_loss": -10.735228538513184, "global_step": 147286, "epoch": 876} {"train_loss": -10.617773056030273, "global_step": 147287, "epoch": 876} {"train_loss": -10.730555534362793, "global_step": 147288, "epoch": 876} {"train_loss": -10.515898704528809, "global_step": 147289, "epoch": 876} {"train_loss": -10.687271118164062, "global_step": 147290, "epoch": 876} {"train_loss": -10.757976531982422, "global_step": 147291, "epoch": 876} {"train_loss": -10.75285530090332, "global_step": 147292, "epoch": 876} {"train_loss": -10.786836624145508, "global_step": 147293, "epoch": 876} {"train_loss": -10.745058059692383, "global_step": 147294, "epoch": 876} {"train_loss": -10.982013702392578, "global_step": 147295, "epoch": 876} {"train_loss": -10.971881866455078, "global_step": 147296, "epoch": 876} {"train_loss": -11.020984649658203, "global_step": 147297, "epoch": 876} {"train_loss": -10.846399307250977, "global_step": 147298, "epoch": 876} {"train_loss": -10.764875411987305, "global_step": 147299, "epoch": 876} {"train_loss": -10.81450080871582, "global_step": 147300, "epoch": 876} {"train_loss": -10.948522567749023, "global_step": 147301, "epoch": 876} {"train_loss": -10.717975616455078, "global_step": 147302, "epoch": 876} {"train_loss": -10.943592071533203, "global_step": 147303, "epoch": 876} {"train_loss": -10.826911926269531, "global_step": 147304, "epoch": 876} {"train_loss": -10.653389930725098, "global_step": 147305, "epoch": 876} {"train_loss": -10.896831512451172, "global_step": 147306, "epoch": 876} {"train_loss": -10.805154800415039, "global_step": 147307, "epoch": 876} {"train_loss": -11.032398223876953, "global_step": 147308, "epoch": 876} {"train_loss": -10.87503433227539, "global_step": 147309, "epoch": 876} {"train_loss": -10.781999588012695, "global_step": 147310, "epoch": 876} {"train_loss": -11.009615898132324, "global_step": 147311, "epoch": 876} {"train_loss": -10.922195434570312, "global_step": 147312, "epoch": 876} {"train_loss": -10.969388961791992, "global_step": 147313, "epoch": 876} {"train_loss": -10.591333389282227, "global_step": 147314, "epoch": 876} {"train_loss": -10.90599536895752, "global_step": 147315, "epoch": 876} {"train_loss": -10.79287338256836, "global_step": 147316, "epoch": 876} {"train_loss": -10.416641235351562, "global_step": 147317, "epoch": 876} {"train_loss": -10.63736343383789, "global_step": 147318, "epoch": 876} {"train_loss": -11.075419425964355, "global_step": 147319, "epoch": 876} {"train_loss": -10.592913627624512, "global_step": 147320, "epoch": 876} {"train_loss": -10.776226043701172, "global_step": 147321, "epoch": 876} {"train_loss": -10.624211311340332, "global_step": 147322, "epoch": 876} {"train_loss": -10.513998031616211, "global_step": 147323, "epoch": 876} {"train_loss": -10.176048278808594, "global_step": 147324, "epoch": 876} {"train_loss": -10.884931564331055, "global_step": 147325, "epoch": 876} {"train_loss": -10.466513633728027, "global_step": 147326, "epoch": 876} {"train_loss": -10.561750411987305, "global_step": 147327, "epoch": 876} {"train_loss": -10.754642486572266, "global_step": 147328, "epoch": 876} {"train_loss": -10.46296501159668, "global_step": 147329, "epoch": 876} {"train_loss": -10.931159019470215, "global_step": 147330, "epoch": 876} {"train_loss": -10.849864959716797, "global_step": 147331, "epoch": 876} {"train_loss": -10.65169906616211, "global_step": 147332, "epoch": 876} {"train_loss": -10.892229080200195, "global_step": 147333, "epoch": 876} {"train_loss": -10.513219833374023, "global_step": 147334, "epoch": 876} {"train_loss": -10.5334693250202, "global_step": 147335, "epoch": 876, "val_loss": 225844.078125} {"train_loss": -10.562898635864258, "global_step": 147336, "epoch": 877} {"train_loss": -9.878498077392578, "global_step": 147337, "epoch": 877} {"train_loss": -10.572098731994629, "global_step": 147338, "epoch": 877} {"train_loss": -10.014909744262695, "global_step": 147339, "epoch": 877} {"train_loss": -9.782415390014648, "global_step": 147340, "epoch": 877} {"train_loss": -10.427176475524902, "global_step": 147341, "epoch": 877} {"train_loss": -9.66073226928711, "global_step": 147342, "epoch": 877} {"train_loss": -10.289142608642578, "global_step": 147343, "epoch": 877} {"train_loss": -9.686758041381836, "global_step": 147344, "epoch": 877} {"train_loss": -10.34448528289795, "global_step": 147345, "epoch": 877} {"train_loss": -9.979880332946777, "global_step": 147346, "epoch": 877} {"train_loss": -10.356258392333984, "global_step": 147347, "epoch": 877} {"train_loss": -10.097970962524414, "global_step": 147348, "epoch": 877} {"train_loss": -10.309080123901367, "global_step": 147349, "epoch": 877} {"train_loss": -10.326231002807617, "global_step": 147350, "epoch": 877} {"train_loss": -10.36551284790039, "global_step": 147351, "epoch": 877} {"train_loss": -10.121984481811523, "global_step": 147352, "epoch": 877} {"train_loss": -10.362275123596191, "global_step": 147353, "epoch": 877} {"train_loss": -10.29504108428955, "global_step": 147354, "epoch": 877} {"train_loss": -10.338054656982422, "global_step": 147355, "epoch": 877} {"train_loss": -9.988658905029297, "global_step": 147356, "epoch": 877} {"train_loss": -10.255874633789062, "global_step": 147357, "epoch": 877} {"train_loss": -10.356719970703125, "global_step": 147358, "epoch": 877} {"train_loss": -10.258755683898926, "global_step": 147359, "epoch": 877} {"train_loss": -10.391212463378906, "global_step": 147360, "epoch": 877} {"train_loss": -10.348398208618164, "global_step": 147361, "epoch": 877} {"train_loss": -10.43415641784668, "global_step": 147362, "epoch": 877} {"train_loss": -10.401752471923828, "global_step": 147363, "epoch": 877} {"train_loss": -10.60600471496582, "global_step": 147364, "epoch": 877} {"train_loss": -10.168877601623535, "global_step": 147365, "epoch": 877} {"train_loss": -10.424365043640137, "global_step": 147366, "epoch": 877} {"train_loss": -10.502023696899414, "global_step": 147367, "epoch": 877} {"train_loss": -10.55862808227539, "global_step": 147368, "epoch": 877} {"train_loss": -10.686655044555664, "global_step": 147369, "epoch": 877} {"train_loss": -10.801889419555664, "global_step": 147370, "epoch": 877} {"train_loss": -10.786619186401367, "global_step": 147371, "epoch": 877} {"train_loss": -10.453554153442383, "global_step": 147372, "epoch": 877} {"train_loss": -10.556623458862305, "global_step": 147373, "epoch": 877} {"train_loss": -10.488770484924316, "global_step": 147374, "epoch": 877} {"train_loss": -10.56374740600586, "global_step": 147375, "epoch": 877} {"train_loss": -10.763479232788086, "global_step": 147376, "epoch": 877} {"train_loss": -10.724087715148926, "global_step": 147377, "epoch": 877} {"train_loss": -10.839151382446289, "global_step": 147378, "epoch": 877} {"train_loss": -10.649080276489258, "global_step": 147379, "epoch": 877} {"train_loss": -10.9227294921875, "global_step": 147380, "epoch": 877} {"train_loss": -10.493073463439941, "global_step": 147381, "epoch": 877} {"train_loss": -10.73383903503418, "global_step": 147382, "epoch": 877} {"train_loss": -10.649100303649902, "global_step": 147383, "epoch": 877} {"train_loss": -10.708964347839355, "global_step": 147384, "epoch": 877} {"train_loss": -10.840126037597656, "global_step": 147385, "epoch": 877} {"train_loss": -10.702850341796875, "global_step": 147386, "epoch": 877} {"train_loss": -10.674344062805176, "global_step": 147387, "epoch": 877} {"train_loss": -10.587895393371582, "global_step": 147388, "epoch": 877} {"train_loss": -10.833984375, "global_step": 147389, "epoch": 877} {"train_loss": -10.98201847076416, "global_step": 147390, "epoch": 877} {"train_loss": -10.802511215209961, "global_step": 147391, "epoch": 877} {"train_loss": -10.896900177001953, "global_step": 147392, "epoch": 877} {"train_loss": -10.834997177124023, "global_step": 147393, "epoch": 877} {"train_loss": -10.752382278442383, "global_step": 147394, "epoch": 877} {"train_loss": -10.909015655517578, "global_step": 147395, "epoch": 877} {"train_loss": -11.075210571289062, "global_step": 147396, "epoch": 877} {"train_loss": -10.823911666870117, "global_step": 147397, "epoch": 877} {"train_loss": -10.915447235107422, "global_step": 147398, "epoch": 877} {"train_loss": -10.730315208435059, "global_step": 147399, "epoch": 877} {"train_loss": -10.709171295166016, "global_step": 147400, "epoch": 877} {"train_loss": -10.851873397827148, "global_step": 147401, "epoch": 877} {"train_loss": -10.599082946777344, "global_step": 147402, "epoch": 877} {"train_loss": -10.964618682861328, "global_step": 147403, "epoch": 877} {"train_loss": -10.923294067382812, "global_step": 147404, "epoch": 877} {"train_loss": -10.867342948913574, "global_step": 147405, "epoch": 877} {"train_loss": -10.91765022277832, "global_step": 147406, "epoch": 877} {"train_loss": -11.056928634643555, "global_step": 147407, "epoch": 877} {"train_loss": -10.808303833007812, "global_step": 147408, "epoch": 877} {"train_loss": -10.9337797164917, "global_step": 147409, "epoch": 877} {"train_loss": -11.081913948059082, "global_step": 147410, "epoch": 877} {"train_loss": -10.905797958374023, "global_step": 147411, "epoch": 877} {"train_loss": -10.902607917785645, "global_step": 147412, "epoch": 877} {"train_loss": -10.965241432189941, "global_step": 147413, "epoch": 877} {"train_loss": -10.828734397888184, "global_step": 147414, "epoch": 877} {"train_loss": -10.630168914794922, "global_step": 147415, "epoch": 877} {"train_loss": -10.85130786895752, "global_step": 147416, "epoch": 877} {"train_loss": -10.782515525817871, "global_step": 147417, "epoch": 877} {"train_loss": -10.532597541809082, "global_step": 147418, "epoch": 877} {"train_loss": -10.75308609008789, "global_step": 147419, "epoch": 877} {"train_loss": -10.815214157104492, "global_step": 147420, "epoch": 877} {"train_loss": -10.629541397094727, "global_step": 147421, "epoch": 877} {"train_loss": -11.094337463378906, "global_step": 147422, "epoch": 877} {"train_loss": -10.84434700012207, "global_step": 147423, "epoch": 877} {"train_loss": -10.412150382995605, "global_step": 147424, "epoch": 877} {"train_loss": -10.019926071166992, "global_step": 147425, "epoch": 877} {"train_loss": -10.875631332397461, "global_step": 147426, "epoch": 877} {"train_loss": -9.986459732055664, "global_step": 147427, "epoch": 877} {"train_loss": -10.059648513793945, "global_step": 147428, "epoch": 877} {"train_loss": -10.548674583435059, "global_step": 147429, "epoch": 877} {"train_loss": -9.226825714111328, "global_step": 147430, "epoch": 877} {"train_loss": -10.10799503326416, "global_step": 147431, "epoch": 877} {"train_loss": -10.86029052734375, "global_step": 147432, "epoch": 877} {"train_loss": -10.164205551147461, "global_step": 147433, "epoch": 877} {"train_loss": -10.50606632232666, "global_step": 147434, "epoch": 877} {"train_loss": -10.252874374389648, "global_step": 147435, "epoch": 877} {"train_loss": -10.196670532226562, "global_step": 147436, "epoch": 877} {"train_loss": -10.220782279968262, "global_step": 147437, "epoch": 877} {"train_loss": -10.474530220031738, "global_step": 147438, "epoch": 877} {"train_loss": -10.043329238891602, "global_step": 147439, "epoch": 877} {"train_loss": -10.417808532714844, "global_step": 147440, "epoch": 877} {"train_loss": -10.461552619934082, "global_step": 147441, "epoch": 877} {"train_loss": -10.272186279296875, "global_step": 147442, "epoch": 877} {"train_loss": -10.13315200805664, "global_step": 147443, "epoch": 877} {"train_loss": -10.623991012573242, "global_step": 147444, "epoch": 877} {"train_loss": -10.362834930419922, "global_step": 147445, "epoch": 877} {"train_loss": -10.711463928222656, "global_step": 147446, "epoch": 877} {"train_loss": -10.409648895263672, "global_step": 147447, "epoch": 877} {"train_loss": -10.708951950073242, "global_step": 147448, "epoch": 877} {"train_loss": -10.576236724853516, "global_step": 147449, "epoch": 877} {"train_loss": -10.371099472045898, "global_step": 147450, "epoch": 877} {"train_loss": -10.523126602172852, "global_step": 147451, "epoch": 877} {"train_loss": -10.452156066894531, "global_step": 147452, "epoch": 877} {"train_loss": -10.340044021606445, "global_step": 147453, "epoch": 877} {"train_loss": -10.526275634765625, "global_step": 147454, "epoch": 877} {"train_loss": -10.705400466918945, "global_step": 147455, "epoch": 877} {"train_loss": -10.251859664916992, "global_step": 147456, "epoch": 877} {"train_loss": -10.695597648620605, "global_step": 147457, "epoch": 877} {"train_loss": -10.343952178955078, "global_step": 147458, "epoch": 877} {"train_loss": -10.537206649780273, "global_step": 147459, "epoch": 877} {"train_loss": -10.390873908996582, "global_step": 147460, "epoch": 877} {"train_loss": -10.59846019744873, "global_step": 147461, "epoch": 877} {"train_loss": -10.504121780395508, "global_step": 147462, "epoch": 877} {"train_loss": -10.682588577270508, "global_step": 147463, "epoch": 877} {"train_loss": -10.7278413772583, "global_step": 147464, "epoch": 877} {"train_loss": -10.655095100402832, "global_step": 147465, "epoch": 877} {"train_loss": -10.65064525604248, "global_step": 147466, "epoch": 877} {"train_loss": -10.731316566467285, "global_step": 147467, "epoch": 877} {"train_loss": -10.755691528320312, "global_step": 147468, "epoch": 877} {"train_loss": -10.969036102294922, "global_step": 147469, "epoch": 877} {"train_loss": -10.50899600982666, "global_step": 147470, "epoch": 877} {"train_loss": -10.863076210021973, "global_step": 147471, "epoch": 877} {"train_loss": -10.722481727600098, "global_step": 147472, "epoch": 877} {"train_loss": -10.752388000488281, "global_step": 147473, "epoch": 877} {"train_loss": -10.770242691040039, "global_step": 147474, "epoch": 877} {"train_loss": -10.77833366394043, "global_step": 147475, "epoch": 877} {"train_loss": -11.004203796386719, "global_step": 147476, "epoch": 877} {"train_loss": -10.84720230102539, "global_step": 147477, "epoch": 877} {"train_loss": -10.721955299377441, "global_step": 147478, "epoch": 877} {"train_loss": -10.730995178222656, "global_step": 147479, "epoch": 877} {"train_loss": -10.850800514221191, "global_step": 147480, "epoch": 877} {"train_loss": -10.717344284057617, "global_step": 147481, "epoch": 877} {"train_loss": -10.868597984313965, "global_step": 147482, "epoch": 877} {"train_loss": -10.664281845092773, "global_step": 147483, "epoch": 877} {"train_loss": -10.729799270629883, "global_step": 147484, "epoch": 877} {"train_loss": -10.864757537841797, "global_step": 147485, "epoch": 877} {"train_loss": -10.854125022888184, "global_step": 147486, "epoch": 877} {"train_loss": -11.068743705749512, "global_step": 147487, "epoch": 877} {"train_loss": -10.844730377197266, "global_step": 147488, "epoch": 877} {"train_loss": -10.908893585205078, "global_step": 147489, "epoch": 877} {"train_loss": -11.122576713562012, "global_step": 147490, "epoch": 877} {"train_loss": -10.930440902709961, "global_step": 147491, "epoch": 877} {"train_loss": -10.912636756896973, "global_step": 147492, "epoch": 877} {"train_loss": -11.047426223754883, "global_step": 147493, "epoch": 877} {"train_loss": -10.597138404846191, "global_step": 147494, "epoch": 877} {"train_loss": -10.600366592407227, "global_step": 147495, "epoch": 877} {"train_loss": -10.471433639526367, "global_step": 147496, "epoch": 877} {"train_loss": -10.869930267333984, "global_step": 147497, "epoch": 877} {"train_loss": -10.920820236206055, "global_step": 147498, "epoch": 877} {"train_loss": -11.064102172851562, "global_step": 147499, "epoch": 877} {"train_loss": -10.81546401977539, "global_step": 147500, "epoch": 877} {"train_loss": -10.959942817687988, "global_step": 147501, "epoch": 877} {"train_loss": -10.828929901123047, "global_step": 147502, "epoch": 877} {"train_loss": -10.593926588694254, "global_step": 147503, "epoch": 877, "val_loss": 227959.1875} {"train_loss": -10.875358581542969, "global_step": 147504, "epoch": 878} {"train_loss": -10.835262298583984, "global_step": 147505, "epoch": 878} {"train_loss": -10.553351402282715, "global_step": 147506, "epoch": 878} {"train_loss": -11.06629753112793, "global_step": 147507, "epoch": 878} {"train_loss": -10.337408065795898, "global_step": 147508, "epoch": 878} {"train_loss": -10.837517738342285, "global_step": 147509, "epoch": 878} {"train_loss": -10.807958602905273, "global_step": 147510, "epoch": 878} {"train_loss": -10.740926742553711, "global_step": 147511, "epoch": 878} {"train_loss": -10.664680480957031, "global_step": 147512, "epoch": 878} {"train_loss": -10.684322357177734, "global_step": 147513, "epoch": 878} {"train_loss": -10.482519149780273, "global_step": 147514, "epoch": 878} {"train_loss": -10.844017028808594, "global_step": 147515, "epoch": 878} {"train_loss": -10.582761764526367, "global_step": 147516, "epoch": 878} {"train_loss": -9.749073028564453, "global_step": 147517, "epoch": 878} {"train_loss": -10.519875526428223, "global_step": 147518, "epoch": 878} {"train_loss": -10.214274406433105, "global_step": 147519, "epoch": 878} {"train_loss": -10.352559089660645, "global_step": 147520, "epoch": 878} {"train_loss": -10.098968505859375, "global_step": 147521, "epoch": 878} {"train_loss": -10.709567070007324, "global_step": 147522, "epoch": 878} {"train_loss": -10.102840423583984, "global_step": 147523, "epoch": 878} {"train_loss": -10.314420700073242, "global_step": 147524, "epoch": 878} {"train_loss": -10.718631744384766, "global_step": 147525, "epoch": 878} {"train_loss": -10.061063766479492, "global_step": 147526, "epoch": 878} {"train_loss": -10.551810264587402, "global_step": 147527, "epoch": 878} {"train_loss": -9.364049911499023, "global_step": 147528, "epoch": 878} {"train_loss": -10.454991340637207, "global_step": 147529, "epoch": 878} {"train_loss": -10.422212600708008, "global_step": 147530, "epoch": 878} {"train_loss": -10.32158088684082, "global_step": 147531, "epoch": 878} {"train_loss": -10.547660827636719, "global_step": 147532, "epoch": 878} {"train_loss": -10.238604545593262, "global_step": 147533, "epoch": 878} {"train_loss": -10.506978034973145, "global_step": 147534, "epoch": 878} {"train_loss": -10.263452529907227, "global_step": 147535, "epoch": 878} {"train_loss": -10.259861946105957, "global_step": 147536, "epoch": 878} {"train_loss": -10.595123291015625, "global_step": 147537, "epoch": 878} {"train_loss": -10.50550651550293, "global_step": 147538, "epoch": 878} {"train_loss": -10.676961898803711, "global_step": 147539, "epoch": 878} {"train_loss": -10.377978324890137, "global_step": 147540, "epoch": 878} {"train_loss": -10.724807739257812, "global_step": 147541, "epoch": 878} {"train_loss": -10.416925430297852, "global_step": 147542, "epoch": 878} {"train_loss": -10.781862258911133, "global_step": 147543, "epoch": 878} {"train_loss": -10.394275665283203, "global_step": 147544, "epoch": 878} {"train_loss": -10.697155952453613, "global_step": 147545, "epoch": 878} {"train_loss": -10.719143867492676, "global_step": 147546, "epoch": 878} {"train_loss": -10.666788101196289, "global_step": 147547, "epoch": 878} {"train_loss": -10.617729187011719, "global_step": 147548, "epoch": 878} {"train_loss": -10.496659278869629, "global_step": 147549, "epoch": 878} {"train_loss": -10.38235855102539, "global_step": 147550, "epoch": 878} {"train_loss": -10.034782409667969, "global_step": 147551, "epoch": 878} {"train_loss": -10.291430473327637, "global_step": 147552, "epoch": 878} {"train_loss": -10.297515869140625, "global_step": 147553, "epoch": 878} {"train_loss": -10.629837036132812, "global_step": 147554, "epoch": 878} {"train_loss": -10.269968032836914, "global_step": 147555, "epoch": 878} {"train_loss": -10.789592742919922, "global_step": 147556, "epoch": 878} {"train_loss": -10.474912643432617, "global_step": 147557, "epoch": 878} {"train_loss": -10.758800506591797, "global_step": 147558, "epoch": 878} {"train_loss": -10.443527221679688, "global_step": 147559, "epoch": 878} {"train_loss": -10.890222549438477, "global_step": 147560, "epoch": 878} {"train_loss": -10.622688293457031, "global_step": 147561, "epoch": 878} {"train_loss": -10.50732707977295, "global_step": 147562, "epoch": 878} {"train_loss": -10.905974388122559, "global_step": 147563, "epoch": 878} {"train_loss": -10.62427806854248, "global_step": 147564, "epoch": 878} {"train_loss": -10.608626365661621, "global_step": 147565, "epoch": 878} {"train_loss": -10.309539794921875, "global_step": 147566, "epoch": 878} {"train_loss": -10.72244930267334, "global_step": 147567, "epoch": 878} {"train_loss": -10.391944885253906, "global_step": 147568, "epoch": 878} {"train_loss": -11.009784698486328, "global_step": 147569, "epoch": 878} {"train_loss": -10.341485977172852, "global_step": 147570, "epoch": 878} {"train_loss": -10.900875091552734, "global_step": 147571, "epoch": 878} {"train_loss": -10.388678550720215, "global_step": 147572, "epoch": 878} {"train_loss": -10.624984741210938, "global_step": 147573, "epoch": 878} {"train_loss": -10.690423965454102, "global_step": 147574, "epoch": 878} {"train_loss": -10.806026458740234, "global_step": 147575, "epoch": 878} {"train_loss": -11.02090072631836, "global_step": 147576, "epoch": 878} {"train_loss": -10.617152214050293, "global_step": 147577, "epoch": 878} {"train_loss": -10.915385246276855, "global_step": 147578, "epoch": 878} {"train_loss": -10.7667236328125, "global_step": 147579, "epoch": 878} {"train_loss": -10.724390029907227, "global_step": 147580, "epoch": 878} {"train_loss": -10.578962326049805, "global_step": 147581, "epoch": 878} {"train_loss": -10.900993347167969, "global_step": 147582, "epoch": 878} {"train_loss": -10.652606010437012, "global_step": 147583, "epoch": 878} {"train_loss": -10.20578670501709, "global_step": 147584, "epoch": 878} {"train_loss": -10.952335357666016, "global_step": 147585, "epoch": 878} {"train_loss": -10.356840133666992, "global_step": 147586, "epoch": 878} {"train_loss": -10.654045104980469, "global_step": 147587, "epoch": 878} {"train_loss": -10.931896209716797, "global_step": 147588, "epoch": 878} {"train_loss": -10.493897438049316, "global_step": 147589, "epoch": 878} {"train_loss": -11.032880783081055, "global_step": 147590, "epoch": 878} {"train_loss": -10.55091667175293, "global_step": 147591, "epoch": 878} {"train_loss": -10.857722282409668, "global_step": 147592, "epoch": 878} {"train_loss": -10.571222305297852, "global_step": 147593, "epoch": 878} {"train_loss": -10.71242904663086, "global_step": 147594, "epoch": 878} {"train_loss": -10.618988037109375, "global_step": 147595, "epoch": 878} {"train_loss": -10.600261688232422, "global_step": 147596, "epoch": 878} {"train_loss": -10.720819473266602, "global_step": 147597, "epoch": 878} {"train_loss": -10.50042724609375, "global_step": 147598, "epoch": 878} {"train_loss": -10.360082626342773, "global_step": 147599, "epoch": 878} {"train_loss": -10.264284133911133, "global_step": 147600, "epoch": 878} {"train_loss": -10.440423965454102, "global_step": 147601, "epoch": 878} {"train_loss": -10.636100769042969, "global_step": 147602, "epoch": 878} {"train_loss": -10.396347045898438, "global_step": 147603, "epoch": 878} {"train_loss": -10.519264221191406, "global_step": 147604, "epoch": 878} {"train_loss": -10.424371719360352, "global_step": 147605, "epoch": 878} {"train_loss": -10.163552284240723, "global_step": 147606, "epoch": 878} {"train_loss": -10.496358871459961, "global_step": 147607, "epoch": 878} {"train_loss": -9.876701354980469, "global_step": 147608, "epoch": 878} {"train_loss": -10.729432106018066, "global_step": 147609, "epoch": 878} {"train_loss": -10.282594680786133, "global_step": 147610, "epoch": 878} {"train_loss": -10.782588958740234, "global_step": 147611, "epoch": 878} {"train_loss": -10.258838653564453, "global_step": 147612, "epoch": 878} {"train_loss": -10.550186157226562, "global_step": 147613, "epoch": 878} {"train_loss": -10.592611312866211, "global_step": 147614, "epoch": 878} {"train_loss": -10.627092361450195, "global_step": 147615, "epoch": 878} {"train_loss": -10.566665649414062, "global_step": 147616, "epoch": 878} {"train_loss": -10.812814712524414, "global_step": 147617, "epoch": 878} {"train_loss": -10.688328742980957, "global_step": 147618, "epoch": 878} {"train_loss": -10.828174591064453, "global_step": 147619, "epoch": 878} {"train_loss": -10.794790267944336, "global_step": 147620, "epoch": 878} {"train_loss": -10.767610549926758, "global_step": 147621, "epoch": 878} {"train_loss": -10.88846492767334, "global_step": 147622, "epoch": 878} {"train_loss": -10.867746353149414, "global_step": 147623, "epoch": 878} {"train_loss": -11.09655475616455, "global_step": 147624, "epoch": 878} {"train_loss": -10.760797500610352, "global_step": 147625, "epoch": 878} {"train_loss": -10.876220703125, "global_step": 147626, "epoch": 878} {"train_loss": -10.949798583984375, "global_step": 147627, "epoch": 878} {"train_loss": -10.941383361816406, "global_step": 147628, "epoch": 878} {"train_loss": -10.867036819458008, "global_step": 147629, "epoch": 878} {"train_loss": -10.927738189697266, "global_step": 147630, "epoch": 878} {"train_loss": -10.633760452270508, "global_step": 147631, "epoch": 878} {"train_loss": -10.65503978729248, "global_step": 147632, "epoch": 878} {"train_loss": -11.011866569519043, "global_step": 147633, "epoch": 878} {"train_loss": -10.69884967803955, "global_step": 147634, "epoch": 878} {"train_loss": -10.59127426147461, "global_step": 147635, "epoch": 878} {"train_loss": -10.731337547302246, "global_step": 147636, "epoch": 878} {"train_loss": -10.435230255126953, "global_step": 147637, "epoch": 878} {"train_loss": -10.752519607543945, "global_step": 147638, "epoch": 878} {"train_loss": -10.423701286315918, "global_step": 147639, "epoch": 878} {"train_loss": -10.666006088256836, "global_step": 147640, "epoch": 878} {"train_loss": -10.646639823913574, "global_step": 147641, "epoch": 878} {"train_loss": -10.505995750427246, "global_step": 147642, "epoch": 878} {"train_loss": -10.562551498413086, "global_step": 147643, "epoch": 878} {"train_loss": -10.500569343566895, "global_step": 147644, "epoch": 878} {"train_loss": -10.661591529846191, "global_step": 147645, "epoch": 878} {"train_loss": -11.102140426635742, "global_step": 147646, "epoch": 878} {"train_loss": -10.844090461730957, "global_step": 147647, "epoch": 878} {"train_loss": -10.893266677856445, "global_step": 147648, "epoch": 878} {"train_loss": -10.798530578613281, "global_step": 147649, "epoch": 878} {"train_loss": -10.941710472106934, "global_step": 147650, "epoch": 878} {"train_loss": -10.74098014831543, "global_step": 147651, "epoch": 878} {"train_loss": -10.9544038772583, "global_step": 147652, "epoch": 878} {"train_loss": -10.834752082824707, "global_step": 147653, "epoch": 878} {"train_loss": -10.846857070922852, "global_step": 147654, "epoch": 878} {"train_loss": -10.533742904663086, "global_step": 147655, "epoch": 878} {"train_loss": -11.095244407653809, "global_step": 147656, "epoch": 878} {"train_loss": -10.361124038696289, "global_step": 147657, "epoch": 878} {"train_loss": -10.723634719848633, "global_step": 147658, "epoch": 878} {"train_loss": -10.77069091796875, "global_step": 147659, "epoch": 878} {"train_loss": -10.629257202148438, "global_step": 147660, "epoch": 878} {"train_loss": -10.619222640991211, "global_step": 147661, "epoch": 878} {"train_loss": -11.050044059753418, "global_step": 147662, "epoch": 878} {"train_loss": -10.611326217651367, "global_step": 147663, "epoch": 878} {"train_loss": -10.744308471679688, "global_step": 147664, "epoch": 878} {"train_loss": -10.766761779785156, "global_step": 147665, "epoch": 878} {"train_loss": -11.083166122436523, "global_step": 147666, "epoch": 878} {"train_loss": -10.898887634277344, "global_step": 147667, "epoch": 878} {"train_loss": -10.921174049377441, "global_step": 147668, "epoch": 878} {"train_loss": -10.657529830932617, "global_step": 147669, "epoch": 878} {"train_loss": -11.022112846374512, "global_step": 147670, "epoch": 878} {"train_loss": -10.619802276293436, "global_step": 147671, "epoch": 878, "val_loss": 227966.5625} {"train_loss": -10.948601722717285, "global_step": 147672, "epoch": 879} {"train_loss": -10.642404556274414, "global_step": 147673, "epoch": 879} {"train_loss": -10.639928817749023, "global_step": 147674, "epoch": 879} {"train_loss": -10.468673706054688, "global_step": 147675, "epoch": 879} {"train_loss": -10.614069938659668, "global_step": 147676, "epoch": 879} {"train_loss": -10.552163124084473, "global_step": 147677, "epoch": 879} {"train_loss": -10.777178764343262, "global_step": 147678, "epoch": 879} {"train_loss": -10.610713958740234, "global_step": 147679, "epoch": 879} {"train_loss": -10.677631378173828, "global_step": 147680, "epoch": 879} {"train_loss": -10.666084289550781, "global_step": 147681, "epoch": 879} {"train_loss": -10.350654602050781, "global_step": 147682, "epoch": 879} {"train_loss": -10.51774787902832, "global_step": 147683, "epoch": 879} {"train_loss": -10.777256965637207, "global_step": 147684, "epoch": 879} {"train_loss": -10.513711929321289, "global_step": 147685, "epoch": 879} {"train_loss": -10.79188346862793, "global_step": 147686, "epoch": 879} {"train_loss": -10.3792724609375, "global_step": 147687, "epoch": 879} {"train_loss": -10.20803451538086, "global_step": 147688, "epoch": 879} {"train_loss": -10.570623397827148, "global_step": 147689, "epoch": 879} {"train_loss": -10.487570762634277, "global_step": 147690, "epoch": 879} {"train_loss": -10.433788299560547, "global_step": 147691, "epoch": 879} {"train_loss": -10.709636688232422, "global_step": 147692, "epoch": 879} {"train_loss": -10.612591743469238, "global_step": 147693, "epoch": 879} {"train_loss": -10.770153999328613, "global_step": 147694, "epoch": 879} {"train_loss": -10.617338180541992, "global_step": 147695, "epoch": 879} {"train_loss": -10.74251651763916, "global_step": 147696, "epoch": 879} {"train_loss": -10.616649627685547, "global_step": 147697, "epoch": 879} {"train_loss": -10.644281387329102, "global_step": 147698, "epoch": 879} {"train_loss": -10.78817367553711, "global_step": 147699, "epoch": 879} {"train_loss": -10.746490478515625, "global_step": 147700, "epoch": 879} {"train_loss": -10.664701461791992, "global_step": 147701, "epoch": 879} {"train_loss": -10.564964294433594, "global_step": 147702, "epoch": 879} {"train_loss": -10.303878784179688, "global_step": 147703, "epoch": 879} {"train_loss": -10.692527770996094, "global_step": 147704, "epoch": 879} {"train_loss": -10.131688117980957, "global_step": 147705, "epoch": 879} {"train_loss": -10.663043022155762, "global_step": 147706, "epoch": 879} {"train_loss": -10.476691246032715, "global_step": 147707, "epoch": 879} {"train_loss": -10.294439315795898, "global_step": 147708, "epoch": 879} {"train_loss": -10.321861267089844, "global_step": 147709, "epoch": 879} {"train_loss": -10.5551176071167, "global_step": 147710, "epoch": 879} {"train_loss": -10.617647171020508, "global_step": 147711, "epoch": 879} {"train_loss": -10.680925369262695, "global_step": 147712, "epoch": 879} {"train_loss": -10.845420837402344, "global_step": 147713, "epoch": 879} {"train_loss": -10.28911018371582, "global_step": 147714, "epoch": 879} {"train_loss": -10.80984878540039, "global_step": 147715, "epoch": 879} {"train_loss": -10.276341438293457, "global_step": 147716, "epoch": 879} {"train_loss": -10.502010345458984, "global_step": 147717, "epoch": 879} {"train_loss": -10.281982421875, "global_step": 147718, "epoch": 879} {"train_loss": -10.25620174407959, "global_step": 147719, "epoch": 879} {"train_loss": -10.638703346252441, "global_step": 147720, "epoch": 879} {"train_loss": -10.739997863769531, "global_step": 147721, "epoch": 879} {"train_loss": -10.920382499694824, "global_step": 147722, "epoch": 879} {"train_loss": -10.419086456298828, "global_step": 147723, "epoch": 879} {"train_loss": -10.372034072875977, "global_step": 147724, "epoch": 879} {"train_loss": -10.30778694152832, "global_step": 147725, "epoch": 879} {"train_loss": -10.80907154083252, "global_step": 147726, "epoch": 879} {"train_loss": -10.688519477844238, "global_step": 147727, "epoch": 879} {"train_loss": -10.545003890991211, "global_step": 147728, "epoch": 879} {"train_loss": -10.787162780761719, "global_step": 147729, "epoch": 879} {"train_loss": -10.27183723449707, "global_step": 147730, "epoch": 879} {"train_loss": -10.38313102722168, "global_step": 147731, "epoch": 879} {"train_loss": -10.737085342407227, "global_step": 147732, "epoch": 879} {"train_loss": -10.492395401000977, "global_step": 147733, "epoch": 879} {"train_loss": -10.255633354187012, "global_step": 147734, "epoch": 879} {"train_loss": -10.445542335510254, "global_step": 147735, "epoch": 879} {"train_loss": -10.65839958190918, "global_step": 147736, "epoch": 879} {"train_loss": -10.545331954956055, "global_step": 147737, "epoch": 879} {"train_loss": -10.814419746398926, "global_step": 147738, "epoch": 879} {"train_loss": -10.547468185424805, "global_step": 147739, "epoch": 879} {"train_loss": -10.775497436523438, "global_step": 147740, "epoch": 879} {"train_loss": -10.455825805664062, "global_step": 147741, "epoch": 879} {"train_loss": -10.60315227508545, "global_step": 147742, "epoch": 879} {"train_loss": -10.645881652832031, "global_step": 147743, "epoch": 879} {"train_loss": -10.332479476928711, "global_step": 147744, "epoch": 879} {"train_loss": -10.678338050842285, "global_step": 147745, "epoch": 879} {"train_loss": -10.42154312133789, "global_step": 147746, "epoch": 879} {"train_loss": -10.69277572631836, "global_step": 147747, "epoch": 879} {"train_loss": -10.231393814086914, "global_step": 147748, "epoch": 879} {"train_loss": -9.938163757324219, "global_step": 147749, "epoch": 879} {"train_loss": -10.683982849121094, "global_step": 147750, "epoch": 879} {"train_loss": -10.589215278625488, "global_step": 147751, "epoch": 879} {"train_loss": -10.37095832824707, "global_step": 147752, "epoch": 879} {"train_loss": -10.827760696411133, "global_step": 147753, "epoch": 879} {"train_loss": -10.299251556396484, "global_step": 147754, "epoch": 879} {"train_loss": -10.812067031860352, "global_step": 147755, "epoch": 879} {"train_loss": -10.221151351928711, "global_step": 147756, "epoch": 879} {"train_loss": -10.451375007629395, "global_step": 147757, "epoch": 879} {"train_loss": -10.554832458496094, "global_step": 147758, "epoch": 879} {"train_loss": -10.155878067016602, "global_step": 147759, "epoch": 879} {"train_loss": -10.731146812438965, "global_step": 147760, "epoch": 879} {"train_loss": -10.122444152832031, "global_step": 147761, "epoch": 879} {"train_loss": -10.623870849609375, "global_step": 147762, "epoch": 879} {"train_loss": -10.271546363830566, "global_step": 147763, "epoch": 879} {"train_loss": -10.586458206176758, "global_step": 147764, "epoch": 879} {"train_loss": -10.631887435913086, "global_step": 147765, "epoch": 879} {"train_loss": -10.44404411315918, "global_step": 147766, "epoch": 879} {"train_loss": -10.733576774597168, "global_step": 147767, "epoch": 879} {"train_loss": -10.565444946289062, "global_step": 147768, "epoch": 879} {"train_loss": -10.63123893737793, "global_step": 147769, "epoch": 879} {"train_loss": -10.310111999511719, "global_step": 147770, "epoch": 879} {"train_loss": -10.670601844787598, "global_step": 147771, "epoch": 879} {"train_loss": -10.119318008422852, "global_step": 147772, "epoch": 879} {"train_loss": -10.347067832946777, "global_step": 147773, "epoch": 879} {"train_loss": -9.659873962402344, "global_step": 147774, "epoch": 879} {"train_loss": -10.43389892578125, "global_step": 147775, "epoch": 879} {"train_loss": -10.03880500793457, "global_step": 147776, "epoch": 879} {"train_loss": -10.293083190917969, "global_step": 147777, "epoch": 879} {"train_loss": -10.220600128173828, "global_step": 147778, "epoch": 879} {"train_loss": -10.029150009155273, "global_step": 147779, "epoch": 879} {"train_loss": -10.173307418823242, "global_step": 147780, "epoch": 879} {"train_loss": -10.371822357177734, "global_step": 147781, "epoch": 879} {"train_loss": -10.375141143798828, "global_step": 147782, "epoch": 879} {"train_loss": -10.53133773803711, "global_step": 147783, "epoch": 879} {"train_loss": -10.747199058532715, "global_step": 147784, "epoch": 879} {"train_loss": -10.519771575927734, "global_step": 147785, "epoch": 879} {"train_loss": -10.7935152053833, "global_step": 147786, "epoch": 879} {"train_loss": -10.815468788146973, "global_step": 147787, "epoch": 879} {"train_loss": -10.432592391967773, "global_step": 147788, "epoch": 879} {"train_loss": -10.871387481689453, "global_step": 147789, "epoch": 879} {"train_loss": -10.363398551940918, "global_step": 147790, "epoch": 879} {"train_loss": -10.511934280395508, "global_step": 147791, "epoch": 879} {"train_loss": -10.604829788208008, "global_step": 147792, "epoch": 879} {"train_loss": -10.668774604797363, "global_step": 147793, "epoch": 879} {"train_loss": -10.447080612182617, "global_step": 147794, "epoch": 879} {"train_loss": -10.872882843017578, "global_step": 147795, "epoch": 879} {"train_loss": -10.688045501708984, "global_step": 147796, "epoch": 879} {"train_loss": -10.422769546508789, "global_step": 147797, "epoch": 879} {"train_loss": -10.942472457885742, "global_step": 147798, "epoch": 879} {"train_loss": -10.689507484436035, "global_step": 147799, "epoch": 879} {"train_loss": -10.89388656616211, "global_step": 147800, "epoch": 879} {"train_loss": -10.902714729309082, "global_step": 147801, "epoch": 879} {"train_loss": -10.593350410461426, "global_step": 147802, "epoch": 879} {"train_loss": -10.951692581176758, "global_step": 147803, "epoch": 879} {"train_loss": -10.656978607177734, "global_step": 147804, "epoch": 879} {"train_loss": -10.53386402130127, "global_step": 147805, "epoch": 879} {"train_loss": -10.726442337036133, "global_step": 147806, "epoch": 879} {"train_loss": -10.921937942504883, "global_step": 147807, "epoch": 879} {"train_loss": -10.509896278381348, "global_step": 147808, "epoch": 879} {"train_loss": -10.917091369628906, "global_step": 147809, "epoch": 879} {"train_loss": -10.633256912231445, "global_step": 147810, "epoch": 879} {"train_loss": -10.894938468933105, "global_step": 147811, "epoch": 879} {"train_loss": -10.77145004272461, "global_step": 147812, "epoch": 879} {"train_loss": -10.854676246643066, "global_step": 147813, "epoch": 879} {"train_loss": -10.894954681396484, "global_step": 147814, "epoch": 879} {"train_loss": -10.843053817749023, "global_step": 147815, "epoch": 879} {"train_loss": -10.691619873046875, "global_step": 147816, "epoch": 879} {"train_loss": -11.079621315002441, "global_step": 147817, "epoch": 879} {"train_loss": -10.416290283203125, "global_step": 147818, "epoch": 879} {"train_loss": -10.943900108337402, "global_step": 147819, "epoch": 879} {"train_loss": -10.939569473266602, "global_step": 147820, "epoch": 879} {"train_loss": -10.979402542114258, "global_step": 147821, "epoch": 879} {"train_loss": -11.049352645874023, "global_step": 147822, "epoch": 879} {"train_loss": -11.06570816040039, "global_step": 147823, "epoch": 879} {"train_loss": -10.988082885742188, "global_step": 147824, "epoch": 879} {"train_loss": -10.883103370666504, "global_step": 147825, "epoch": 879} {"train_loss": -11.092708587646484, "global_step": 147826, "epoch": 879} {"train_loss": -10.72116756439209, "global_step": 147827, "epoch": 879} {"train_loss": -10.7786865234375, "global_step": 147828, "epoch": 879} {"train_loss": -10.295589447021484, "global_step": 147829, "epoch": 879} {"train_loss": -10.715370178222656, "global_step": 147830, "epoch": 879} {"train_loss": -10.992599487304688, "global_step": 147831, "epoch": 879} {"train_loss": -10.81001091003418, "global_step": 147832, "epoch": 879} {"train_loss": -10.904550552368164, "global_step": 147833, "epoch": 879} {"train_loss": -10.349920272827148, "global_step": 147834, "epoch": 879} {"train_loss": -10.554880142211914, "global_step": 147835, "epoch": 879} {"train_loss": -10.612920761108398, "global_step": 147836, "epoch": 879} {"train_loss": -10.747171401977539, "global_step": 147837, "epoch": 879} {"train_loss": -10.36672592163086, "global_step": 147838, "epoch": 879} {"train_loss": -10.58935949348268, "global_step": 147839, "epoch": 879, "val_loss": 227974.0625} {"train_loss": -10.686749458312988, "global_step": 147840, "epoch": 880} {"train_loss": -10.550140380859375, "global_step": 147841, "epoch": 880} {"train_loss": -10.677398681640625, "global_step": 147842, "epoch": 880} {"train_loss": -10.889108657836914, "global_step": 147843, "epoch": 880} {"train_loss": -10.530916213989258, "global_step": 147844, "epoch": 880} {"train_loss": -9.699291229248047, "global_step": 147845, "epoch": 880} {"train_loss": -9.902347564697266, "global_step": 147846, "epoch": 880} {"train_loss": -10.2507963180542, "global_step": 147847, "epoch": 880} {"train_loss": -10.203458786010742, "global_step": 147848, "epoch": 880} {"train_loss": -6.804441928863525, "global_step": 147849, "epoch": 880} {"train_loss": -9.937335968017578, "global_step": 147850, "epoch": 880} {"train_loss": -10.365850448608398, "global_step": 147851, "epoch": 880} {"train_loss": -9.463541030883789, "global_step": 147852, "epoch": 880} {"train_loss": -8.06755256652832, "global_step": 147853, "epoch": 880} {"train_loss": -9.021245956420898, "global_step": 147854, "epoch": 880} {"train_loss": -9.247737884521484, "global_step": 147855, "epoch": 880} {"train_loss": -8.845145225524902, "global_step": 147856, "epoch": 880} {"train_loss": -8.150514602661133, "global_step": 147857, "epoch": 880} {"train_loss": -9.169376373291016, "global_step": 147858, "epoch": 880} {"train_loss": -8.6688814163208, "global_step": 147859, "epoch": 880} {"train_loss": -9.055758476257324, "global_step": 147860, "epoch": 880} {"train_loss": -8.516135215759277, "global_step": 147861, "epoch": 880} {"train_loss": -9.320327758789062, "global_step": 147862, "epoch": 880} {"train_loss": -8.934383392333984, "global_step": 147863, "epoch": 880} {"train_loss": -9.004154205322266, "global_step": 147864, "epoch": 880} {"train_loss": -9.000219345092773, "global_step": 147865, "epoch": 880} {"train_loss": -9.464746475219727, "global_step": 147866, "epoch": 880} {"train_loss": -9.194604873657227, "global_step": 147867, "epoch": 880} {"train_loss": -8.806926727294922, "global_step": 147868, "epoch": 880} {"train_loss": -9.504289627075195, "global_step": 147869, "epoch": 880} {"train_loss": -9.064132690429688, "global_step": 147870, "epoch": 880} {"train_loss": -9.612030982971191, "global_step": 147871, "epoch": 880} {"train_loss": -9.137948989868164, "global_step": 147872, "epoch": 880} {"train_loss": -9.357261657714844, "global_step": 147873, "epoch": 880} {"train_loss": -9.840188026428223, "global_step": 147874, "epoch": 880} {"train_loss": -9.516777038574219, "global_step": 147875, "epoch": 880} {"train_loss": -9.513209342956543, "global_step": 147876, "epoch": 880} {"train_loss": -9.722257614135742, "global_step": 147877, "epoch": 880} {"train_loss": -9.18355941772461, "global_step": 147878, "epoch": 880} {"train_loss": -9.686046600341797, "global_step": 147879, "epoch": 880} {"train_loss": -9.778569221496582, "global_step": 147880, "epoch": 880} {"train_loss": -9.128901481628418, "global_step": 147881, "epoch": 880} {"train_loss": -9.345681190490723, "global_step": 147882, "epoch": 880} {"train_loss": -9.320606231689453, "global_step": 147883, "epoch": 880} {"train_loss": -9.704156875610352, "global_step": 147884, "epoch": 880} {"train_loss": -9.817333221435547, "global_step": 147885, "epoch": 880} {"train_loss": -9.903446197509766, "global_step": 147886, "epoch": 880} {"train_loss": -9.87488079071045, "global_step": 147887, "epoch": 880} {"train_loss": -9.892871856689453, "global_step": 147888, "epoch": 880} {"train_loss": -10.078737258911133, "global_step": 147889, "epoch": 880} {"train_loss": -9.692054748535156, "global_step": 147890, "epoch": 880} {"train_loss": -10.138751983642578, "global_step": 147891, "epoch": 880} {"train_loss": -10.129671096801758, "global_step": 147892, "epoch": 880} {"train_loss": -9.888463973999023, "global_step": 147893, "epoch": 880} {"train_loss": -9.854458808898926, "global_step": 147894, "epoch": 880} {"train_loss": -10.26678466796875, "global_step": 147895, "epoch": 880} {"train_loss": -9.994470596313477, "global_step": 147896, "epoch": 880} {"train_loss": -10.294424057006836, "global_step": 147897, "epoch": 880} {"train_loss": -10.282971382141113, "global_step": 147898, "epoch": 880} {"train_loss": -10.015411376953125, "global_step": 147899, "epoch": 880} {"train_loss": -10.281938552856445, "global_step": 147900, "epoch": 880} {"train_loss": -10.343544006347656, "global_step": 147901, "epoch": 880} {"train_loss": -10.166852951049805, "global_step": 147902, "epoch": 880} {"train_loss": -10.229341506958008, "global_step": 147903, "epoch": 880} {"train_loss": -10.296967506408691, "global_step": 147904, "epoch": 880} {"train_loss": -10.499095916748047, "global_step": 147905, "epoch": 880} {"train_loss": -10.212684631347656, "global_step": 147906, "epoch": 880} {"train_loss": -10.563163757324219, "global_step": 147907, "epoch": 880} {"train_loss": -10.347379684448242, "global_step": 147908, "epoch": 880} {"train_loss": -10.611457824707031, "global_step": 147909, "epoch": 880} {"train_loss": -10.133460998535156, "global_step": 147910, "epoch": 880} {"train_loss": -10.624688148498535, "global_step": 147911, "epoch": 880} {"train_loss": -10.534815788269043, "global_step": 147912, "epoch": 880} {"train_loss": -10.692588806152344, "global_step": 147913, "epoch": 880} {"train_loss": -10.609560012817383, "global_step": 147914, "epoch": 880} {"train_loss": -10.662795066833496, "global_step": 147915, "epoch": 880} {"train_loss": -10.457033157348633, "global_step": 147916, "epoch": 880} {"train_loss": -10.61340045928955, "global_step": 147917, "epoch": 880} {"train_loss": -10.468022346496582, "global_step": 147918, "epoch": 880} {"train_loss": -10.8494234085083, "global_step": 147919, "epoch": 880} {"train_loss": -10.98659896850586, "global_step": 147920, "epoch": 880} {"train_loss": -10.942887306213379, "global_step": 147921, "epoch": 880} {"train_loss": -10.692527770996094, "global_step": 147922, "epoch": 880} {"train_loss": -10.5665283203125, "global_step": 147923, "epoch": 880} {"train_loss": -10.52029037475586, "global_step": 147924, "epoch": 880} {"train_loss": -10.984882354736328, "global_step": 147925, "epoch": 880} {"train_loss": -10.773021697998047, "global_step": 147926, "epoch": 880} {"train_loss": -10.730688095092773, "global_step": 147927, "epoch": 880} {"train_loss": -10.9159574508667, "global_step": 147928, "epoch": 880} {"train_loss": -10.621969223022461, "global_step": 147929, "epoch": 880} {"train_loss": -10.829680442810059, "global_step": 147930, "epoch": 880} {"train_loss": -10.800734519958496, "global_step": 147931, "epoch": 880} {"train_loss": -10.90341567993164, "global_step": 147932, "epoch": 880} {"train_loss": -10.929176330566406, "global_step": 147933, "epoch": 880} {"train_loss": -10.833961486816406, "global_step": 147934, "epoch": 880} {"train_loss": -10.862005233764648, "global_step": 147935, "epoch": 880} {"train_loss": -10.859794616699219, "global_step": 147936, "epoch": 880} {"train_loss": -10.736003875732422, "global_step": 147937, "epoch": 880} {"train_loss": -10.187193870544434, "global_step": 147938, "epoch": 880} {"train_loss": -10.770414352416992, "global_step": 147939, "epoch": 880} {"train_loss": -10.628568649291992, "global_step": 147940, "epoch": 880} {"train_loss": -10.778244018554688, "global_step": 147941, "epoch": 880} {"train_loss": -10.81820297241211, "global_step": 147942, "epoch": 880} {"train_loss": -10.805020332336426, "global_step": 147943, "epoch": 880} {"train_loss": -10.633987426757812, "global_step": 147944, "epoch": 880} {"train_loss": -10.851253509521484, "global_step": 147945, "epoch": 880} {"train_loss": -10.242691040039062, "global_step": 147946, "epoch": 880} {"train_loss": -10.769906044006348, "global_step": 147947, "epoch": 880} {"train_loss": -10.393035888671875, "global_step": 147948, "epoch": 880} {"train_loss": -10.157416343688965, "global_step": 147949, "epoch": 880} {"train_loss": -9.977941513061523, "global_step": 147950, "epoch": 880} {"train_loss": -10.643625259399414, "global_step": 147951, "epoch": 880} {"train_loss": -10.464670181274414, "global_step": 147952, "epoch": 880} {"train_loss": -10.290135383605957, "global_step": 147953, "epoch": 880} {"train_loss": -10.463653564453125, "global_step": 147954, "epoch": 880} {"train_loss": -10.535758972167969, "global_step": 147955, "epoch": 880} {"train_loss": -10.490671157836914, "global_step": 147956, "epoch": 880} {"train_loss": -10.49498176574707, "global_step": 147957, "epoch": 880} {"train_loss": -10.573820114135742, "global_step": 147958, "epoch": 880} {"train_loss": -10.31022834777832, "global_step": 147959, "epoch": 880} {"train_loss": -10.45659065246582, "global_step": 147960, "epoch": 880} {"train_loss": -10.837586402893066, "global_step": 147961, "epoch": 880} {"train_loss": -10.204841613769531, "global_step": 147962, "epoch": 880} {"train_loss": -10.760735511779785, "global_step": 147963, "epoch": 880} {"train_loss": -10.696084976196289, "global_step": 147964, "epoch": 880} {"train_loss": -10.422260284423828, "global_step": 147965, "epoch": 880} {"train_loss": -10.76773738861084, "global_step": 147966, "epoch": 880} {"train_loss": -10.488712310791016, "global_step": 147967, "epoch": 880} {"train_loss": -10.739702224731445, "global_step": 147968, "epoch": 880} {"train_loss": -10.880380630493164, "global_step": 147969, "epoch": 880} {"train_loss": -10.06877326965332, "global_step": 147970, "epoch": 880} {"train_loss": -9.954267501831055, "global_step": 147971, "epoch": 880} {"train_loss": -10.356486320495605, "global_step": 147972, "epoch": 880} {"train_loss": -9.759035110473633, "global_step": 147973, "epoch": 880} {"train_loss": -10.812479019165039, "global_step": 147974, "epoch": 880} {"train_loss": -10.199085235595703, "global_step": 147975, "epoch": 880} {"train_loss": -10.453147888183594, "global_step": 147976, "epoch": 880} {"train_loss": -10.05042552947998, "global_step": 147977, "epoch": 880} {"train_loss": -10.268998146057129, "global_step": 147978, "epoch": 880} {"train_loss": -10.382598876953125, "global_step": 147979, "epoch": 880} {"train_loss": -10.385022163391113, "global_step": 147980, "epoch": 880} {"train_loss": -10.555164337158203, "global_step": 147981, "epoch": 880} {"train_loss": -10.669742584228516, "global_step": 147982, "epoch": 880} {"train_loss": -10.443624496459961, "global_step": 147983, "epoch": 880} {"train_loss": -10.718790054321289, "global_step": 147984, "epoch": 880} {"train_loss": -10.514533996582031, "global_step": 147985, "epoch": 880} {"train_loss": -9.879966735839844, "global_step": 147986, "epoch": 880} {"train_loss": -10.507148742675781, "global_step": 147987, "epoch": 880} {"train_loss": -10.548673629760742, "global_step": 147988, "epoch": 880} {"train_loss": -10.405235290527344, "global_step": 147989, "epoch": 880} {"train_loss": -10.305174827575684, "global_step": 147990, "epoch": 880} {"train_loss": -10.305500030517578, "global_step": 147991, "epoch": 880} {"train_loss": -10.436935424804688, "global_step": 147992, "epoch": 880} {"train_loss": -10.659452438354492, "global_step": 147993, "epoch": 880} {"train_loss": -10.539118766784668, "global_step": 147994, "epoch": 880} {"train_loss": -10.321687698364258, "global_step": 147995, "epoch": 880} {"train_loss": -10.466557502746582, "global_step": 147996, "epoch": 880} {"train_loss": -10.499713897705078, "global_step": 147997, "epoch": 880} {"train_loss": -10.307384490966797, "global_step": 147998, "epoch": 880} {"train_loss": -10.491710662841797, "global_step": 147999, "epoch": 880} {"train_loss": -10.365142822265625, "global_step": 148000, "epoch": 880} {"train_loss": -10.430231094360352, "global_step": 148001, "epoch": 880} {"train_loss": -10.45156192779541, "global_step": 148002, "epoch": 880} {"train_loss": -10.547353744506836, "global_step": 148003, "epoch": 880} {"train_loss": -10.159857749938965, "global_step": 148004, "epoch": 880} {"train_loss": -10.45749282836914, "global_step": 148005, "epoch": 880} {"train_loss": -10.56570053100586, "global_step": 148006, "epoch": 880} {"train_loss": -10.17326298497972, "global_step": 148007, "epoch": 880, "val_loss": 226933.84375, "train_action_mse_error": 8.039557456970215} {"train_loss": -9.813949584960938, "global_step": 148008, "epoch": 881} {"train_loss": -10.198141098022461, "global_step": 148009, "epoch": 881} {"train_loss": -10.062490463256836, "global_step": 148010, "epoch": 881} {"train_loss": -10.537397384643555, "global_step": 148011, "epoch": 881} {"train_loss": -10.147882461547852, "global_step": 148012, "epoch": 881} {"train_loss": -10.349604606628418, "global_step": 148013, "epoch": 881} {"train_loss": -10.362274169921875, "global_step": 148014, "epoch": 881} {"train_loss": -10.224202156066895, "global_step": 148015, "epoch": 881} {"train_loss": -9.981269836425781, "global_step": 148016, "epoch": 881} {"train_loss": -10.55467414855957, "global_step": 148017, "epoch": 881} {"train_loss": -9.646758079528809, "global_step": 148018, "epoch": 881} {"train_loss": -10.492720603942871, "global_step": 148019, "epoch": 881} {"train_loss": -10.142647743225098, "global_step": 148020, "epoch": 881} {"train_loss": -10.404539108276367, "global_step": 148021, "epoch": 881} {"train_loss": -10.649696350097656, "global_step": 148022, "epoch": 881} {"train_loss": -10.334101676940918, "global_step": 148023, "epoch": 881} {"train_loss": -10.393543243408203, "global_step": 148024, "epoch": 881} {"train_loss": -10.5302734375, "global_step": 148025, "epoch": 881} {"train_loss": -10.616158485412598, "global_step": 148026, "epoch": 881} {"train_loss": -10.233063697814941, "global_step": 148027, "epoch": 881} {"train_loss": -10.664681434631348, "global_step": 148028, "epoch": 881} {"train_loss": -10.3837308883667, "global_step": 148029, "epoch": 881} {"train_loss": -10.28927230834961, "global_step": 148030, "epoch": 881} {"train_loss": -10.520431518554688, "global_step": 148031, "epoch": 881} {"train_loss": -10.360113143920898, "global_step": 148032, "epoch": 881} {"train_loss": -10.269227981567383, "global_step": 148033, "epoch": 881} {"train_loss": -10.636686325073242, "global_step": 148034, "epoch": 881} {"train_loss": -10.718477249145508, "global_step": 148035, "epoch": 881} {"train_loss": -10.610235214233398, "global_step": 148036, "epoch": 881} {"train_loss": -10.549259185791016, "global_step": 148037, "epoch": 881} {"train_loss": -10.671241760253906, "global_step": 148038, "epoch": 881} {"train_loss": -10.944683074951172, "global_step": 148039, "epoch": 881} {"train_loss": -10.976456642150879, "global_step": 148040, "epoch": 881} {"train_loss": -10.858692169189453, "global_step": 148041, "epoch": 881} {"train_loss": -10.665059089660645, "global_step": 148042, "epoch": 881} {"train_loss": -10.85258674621582, "global_step": 148043, "epoch": 881} {"train_loss": -10.82054328918457, "global_step": 148044, "epoch": 881} {"train_loss": -10.790592193603516, "global_step": 148045, "epoch": 881} {"train_loss": -10.966592788696289, "global_step": 148046, "epoch": 881} {"train_loss": -10.97319221496582, "global_step": 148047, "epoch": 881} {"train_loss": -10.798166275024414, "global_step": 148048, "epoch": 881} {"train_loss": -10.949236869812012, "global_step": 148049, "epoch": 881} {"train_loss": -10.970222473144531, "global_step": 148050, "epoch": 881} {"train_loss": -11.01099967956543, "global_step": 148051, "epoch": 881} {"train_loss": -10.90463924407959, "global_step": 148052, "epoch": 881} {"train_loss": -10.786450386047363, "global_step": 148053, "epoch": 881} {"train_loss": -10.457696914672852, "global_step": 148054, "epoch": 881} {"train_loss": -10.533510208129883, "global_step": 148055, "epoch": 881} {"train_loss": -10.398837089538574, "global_step": 148056, "epoch": 881} {"train_loss": -10.745709419250488, "global_step": 148057, "epoch": 881} {"train_loss": -10.46396255493164, "global_step": 148058, "epoch": 881} {"train_loss": -11.076234817504883, "global_step": 148059, "epoch": 881} {"train_loss": -10.633630752563477, "global_step": 148060, "epoch": 881} {"train_loss": -10.826250076293945, "global_step": 148061, "epoch": 881} {"train_loss": -10.842172622680664, "global_step": 148062, "epoch": 881} {"train_loss": -10.646857261657715, "global_step": 148063, "epoch": 881} {"train_loss": -10.416412353515625, "global_step": 148064, "epoch": 881} {"train_loss": -10.220294952392578, "global_step": 148065, "epoch": 881} {"train_loss": -10.874631881713867, "global_step": 148066, "epoch": 881} {"train_loss": -10.451667785644531, "global_step": 148067, "epoch": 881} {"train_loss": -10.384004592895508, "global_step": 148068, "epoch": 881} {"train_loss": -10.673848152160645, "global_step": 148069, "epoch": 881} {"train_loss": -10.746066093444824, "global_step": 148070, "epoch": 881} {"train_loss": -10.585515975952148, "global_step": 148071, "epoch": 881} {"train_loss": -10.691157341003418, "global_step": 148072, "epoch": 881} {"train_loss": -10.447872161865234, "global_step": 148073, "epoch": 881} {"train_loss": -10.590556144714355, "global_step": 148074, "epoch": 881} {"train_loss": -10.675506591796875, "global_step": 148075, "epoch": 881} {"train_loss": -10.244536399841309, "global_step": 148076, "epoch": 881} {"train_loss": -9.953764915466309, "global_step": 148077, "epoch": 881} {"train_loss": -10.272010803222656, "global_step": 148078, "epoch": 881} {"train_loss": -9.394808769226074, "global_step": 148079, "epoch": 881} {"train_loss": -9.709049224853516, "global_step": 148080, "epoch": 881} {"train_loss": -10.304553985595703, "global_step": 148081, "epoch": 881} {"train_loss": -8.790837287902832, "global_step": 148082, "epoch": 881} {"train_loss": -9.289932250976562, "global_step": 148083, "epoch": 881} {"train_loss": -10.545461654663086, "global_step": 148084, "epoch": 881} {"train_loss": -9.45011043548584, "global_step": 148085, "epoch": 881} {"train_loss": -10.18882942199707, "global_step": 148086, "epoch": 881} {"train_loss": -10.248807907104492, "global_step": 148087, "epoch": 881} {"train_loss": -10.211390495300293, "global_step": 148088, "epoch": 881} {"train_loss": -10.180208206176758, "global_step": 148089, "epoch": 881} {"train_loss": -9.714554786682129, "global_step": 148090, "epoch": 881} {"train_loss": -10.05385684967041, "global_step": 148091, "epoch": 881} {"train_loss": -10.035625457763672, "global_step": 148092, "epoch": 881} {"train_loss": -10.430501937866211, "global_step": 148093, "epoch": 881} {"train_loss": -10.198488235473633, "global_step": 148094, "epoch": 881} {"train_loss": -10.622360229492188, "global_step": 148095, "epoch": 881} {"train_loss": -10.50864315032959, "global_step": 148096, "epoch": 881} {"train_loss": -10.435887336730957, "global_step": 148097, "epoch": 881} {"train_loss": -10.380640983581543, "global_step": 148098, "epoch": 881} {"train_loss": -10.644211769104004, "global_step": 148099, "epoch": 881} {"train_loss": -10.660070419311523, "global_step": 148100, "epoch": 881} {"train_loss": -10.434408187866211, "global_step": 148101, "epoch": 881} {"train_loss": -10.563562393188477, "global_step": 148102, "epoch": 881} {"train_loss": -10.325807571411133, "global_step": 148103, "epoch": 881} {"train_loss": -10.385507583618164, "global_step": 148104, "epoch": 881} {"train_loss": -10.236557006835938, "global_step": 148105, "epoch": 881} {"train_loss": -10.551603317260742, "global_step": 148106, "epoch": 881} {"train_loss": -10.107705116271973, "global_step": 148107, "epoch": 881} {"train_loss": -10.457157135009766, "global_step": 148108, "epoch": 881} {"train_loss": -10.42314338684082, "global_step": 148109, "epoch": 881} {"train_loss": -10.294231414794922, "global_step": 148110, "epoch": 881} {"train_loss": -10.675198554992676, "global_step": 148111, "epoch": 881} {"train_loss": -10.216331481933594, "global_step": 148112, "epoch": 881} {"train_loss": -10.574369430541992, "global_step": 148113, "epoch": 881} {"train_loss": -10.44524097442627, "global_step": 148114, "epoch": 881} {"train_loss": -10.601725578308105, "global_step": 148115, "epoch": 881} {"train_loss": -10.728034973144531, "global_step": 148116, "epoch": 881} {"train_loss": -10.446427345275879, "global_step": 148117, "epoch": 881} {"train_loss": -10.729808807373047, "global_step": 148118, "epoch": 881} {"train_loss": -10.580543518066406, "global_step": 148119, "epoch": 881} {"train_loss": -10.778210639953613, "global_step": 148120, "epoch": 881} {"train_loss": -10.590970993041992, "global_step": 148121, "epoch": 881} {"train_loss": -10.738731384277344, "global_step": 148122, "epoch": 881} {"train_loss": -10.7013578414917, "global_step": 148123, "epoch": 881} {"train_loss": -10.420791625976562, "global_step": 148124, "epoch": 881} {"train_loss": -10.733600616455078, "global_step": 148125, "epoch": 881} {"train_loss": -10.393732070922852, "global_step": 148126, "epoch": 881} {"train_loss": -10.660400390625, "global_step": 148127, "epoch": 881} {"train_loss": -10.526020050048828, "global_step": 148128, "epoch": 881} {"train_loss": -10.696794509887695, "global_step": 148129, "epoch": 881} {"train_loss": -10.57988166809082, "global_step": 148130, "epoch": 881} {"train_loss": -10.375029563903809, "global_step": 148131, "epoch": 881} {"train_loss": -10.370830535888672, "global_step": 148132, "epoch": 881} {"train_loss": -10.813867568969727, "global_step": 148133, "epoch": 881} {"train_loss": -10.520496368408203, "global_step": 148134, "epoch": 881} {"train_loss": -10.758010864257812, "global_step": 148135, "epoch": 881} {"train_loss": -10.754785537719727, "global_step": 148136, "epoch": 881} {"train_loss": -10.697240829467773, "global_step": 148137, "epoch": 881} {"train_loss": -10.786470413208008, "global_step": 148138, "epoch": 881} {"train_loss": -10.886027336120605, "global_step": 148139, "epoch": 881} {"train_loss": -10.747846603393555, "global_step": 148140, "epoch": 881} {"train_loss": -10.82634162902832, "global_step": 148141, "epoch": 881} {"train_loss": -10.808633804321289, "global_step": 148142, "epoch": 881} {"train_loss": -10.842872619628906, "global_step": 148143, "epoch": 881} {"train_loss": -10.437986373901367, "global_step": 148144, "epoch": 881} {"train_loss": -10.551593780517578, "global_step": 148145, "epoch": 881} {"train_loss": -10.745861053466797, "global_step": 148146, "epoch": 881} {"train_loss": -10.43580150604248, "global_step": 148147, "epoch": 881} {"train_loss": -10.459478378295898, "global_step": 148148, "epoch": 881} {"train_loss": -10.639058113098145, "global_step": 148149, "epoch": 881} {"train_loss": -10.099760055541992, "global_step": 148150, "epoch": 881} {"train_loss": -10.25261402130127, "global_step": 148151, "epoch": 881} {"train_loss": -10.785799980163574, "global_step": 148152, "epoch": 881} {"train_loss": -9.662038803100586, "global_step": 148153, "epoch": 881} {"train_loss": -10.726301193237305, "global_step": 148154, "epoch": 881} {"train_loss": -10.353605270385742, "global_step": 148155, "epoch": 881} {"train_loss": -10.460949897766113, "global_step": 148156, "epoch": 881} {"train_loss": -9.625764846801758, "global_step": 148157, "epoch": 881} {"train_loss": -10.297097206115723, "global_step": 148158, "epoch": 881} {"train_loss": -9.794472694396973, "global_step": 148159, "epoch": 881} {"train_loss": -10.091669082641602, "global_step": 148160, "epoch": 881} {"train_loss": -10.063941955566406, "global_step": 148161, "epoch": 881} {"train_loss": -9.585672378540039, "global_step": 148162, "epoch": 881} {"train_loss": -10.009027481079102, "global_step": 148163, "epoch": 881} {"train_loss": -10.263046264648438, "global_step": 148164, "epoch": 881} {"train_loss": -10.569306373596191, "global_step": 148165, "epoch": 881} {"train_loss": -10.224990844726562, "global_step": 148166, "epoch": 881} {"train_loss": -10.427862167358398, "global_step": 148167, "epoch": 881} {"train_loss": -10.427263259887695, "global_step": 148168, "epoch": 881} {"train_loss": -10.40220832824707, "global_step": 148169, "epoch": 881} {"train_loss": -10.292811393737793, "global_step": 148170, "epoch": 881} {"train_loss": -10.705764770507812, "global_step": 148171, "epoch": 881} {"train_loss": -10.409391403198242, "global_step": 148172, "epoch": 881} {"train_loss": -10.721510887145996, "global_step": 148173, "epoch": 881} {"train_loss": -10.710555076599121, "global_step": 148174, "epoch": 881} {"train_loss": -10.452143845104036, "global_step": 148175, "epoch": 881, "val_loss": 229049.609375} {"train_loss": -10.486992835998535, "global_step": 148176, "epoch": 882} {"train_loss": -10.56126594543457, "global_step": 148177, "epoch": 882} {"train_loss": -10.347188949584961, "global_step": 148178, "epoch": 882} {"train_loss": -10.846723556518555, "global_step": 148179, "epoch": 882} {"train_loss": -10.27314281463623, "global_step": 148180, "epoch": 882} {"train_loss": -10.670021057128906, "global_step": 148181, "epoch": 882} {"train_loss": -10.41899585723877, "global_step": 148182, "epoch": 882} {"train_loss": -10.811659812927246, "global_step": 148183, "epoch": 882} {"train_loss": -10.494054794311523, "global_step": 148184, "epoch": 882} {"train_loss": -10.622562408447266, "global_step": 148185, "epoch": 882} {"train_loss": -10.67101764678955, "global_step": 148186, "epoch": 882} {"train_loss": -10.773653984069824, "global_step": 148187, "epoch": 882} {"train_loss": -10.693008422851562, "global_step": 148188, "epoch": 882} {"train_loss": -10.837187767028809, "global_step": 148189, "epoch": 882} {"train_loss": -10.88174057006836, "global_step": 148190, "epoch": 882} {"train_loss": -10.680912017822266, "global_step": 148191, "epoch": 882} {"train_loss": -10.72146224975586, "global_step": 148192, "epoch": 882} {"train_loss": -10.333761215209961, "global_step": 148193, "epoch": 882} {"train_loss": -10.76597785949707, "global_step": 148194, "epoch": 882} {"train_loss": -10.422073364257812, "global_step": 148195, "epoch": 882} {"train_loss": -10.71265983581543, "global_step": 148196, "epoch": 882} {"train_loss": -10.570820808410645, "global_step": 148197, "epoch": 882} {"train_loss": -10.808938980102539, "global_step": 148198, "epoch": 882} {"train_loss": -10.624187469482422, "global_step": 148199, "epoch": 882} {"train_loss": -10.76673698425293, "global_step": 148200, "epoch": 882} {"train_loss": -10.646366119384766, "global_step": 148201, "epoch": 882} {"train_loss": -10.794790267944336, "global_step": 148202, "epoch": 882} {"train_loss": -10.840164184570312, "global_step": 148203, "epoch": 882} {"train_loss": -10.647518157958984, "global_step": 148204, "epoch": 882} {"train_loss": -10.596748352050781, "global_step": 148205, "epoch": 882} {"train_loss": -10.571134567260742, "global_step": 148206, "epoch": 882} {"train_loss": -10.680261611938477, "global_step": 148207, "epoch": 882} {"train_loss": -10.655478477478027, "global_step": 148208, "epoch": 882} {"train_loss": -10.984502792358398, "global_step": 148209, "epoch": 882} {"train_loss": -10.945512771606445, "global_step": 148210, "epoch": 882} {"train_loss": -10.90263557434082, "global_step": 148211, "epoch": 882} {"train_loss": -10.515687942504883, "global_step": 148212, "epoch": 882} {"train_loss": -10.822324752807617, "global_step": 148213, "epoch": 882} {"train_loss": -10.73681926727295, "global_step": 148214, "epoch": 882} {"train_loss": -10.453001022338867, "global_step": 148215, "epoch": 882} {"train_loss": -10.593018531799316, "global_step": 148216, "epoch": 882} {"train_loss": -10.081417083740234, "global_step": 148217, "epoch": 882} {"train_loss": -10.39596939086914, "global_step": 148218, "epoch": 882} {"train_loss": -9.956392288208008, "global_step": 148219, "epoch": 882} {"train_loss": -10.203210830688477, "global_step": 148220, "epoch": 882} {"train_loss": -10.245841979980469, "global_step": 148221, "epoch": 882} {"train_loss": -9.762150764465332, "global_step": 148222, "epoch": 882} {"train_loss": -10.316709518432617, "global_step": 148223, "epoch": 882} {"train_loss": -9.822785377502441, "global_step": 148224, "epoch": 882} {"train_loss": -10.025811195373535, "global_step": 148225, "epoch": 882} {"train_loss": -10.408439636230469, "global_step": 148226, "epoch": 882} {"train_loss": -10.219655990600586, "global_step": 148227, "epoch": 882} {"train_loss": -10.515630722045898, "global_step": 148228, "epoch": 882} {"train_loss": -10.254718780517578, "global_step": 148229, "epoch": 882} {"train_loss": -10.070413589477539, "global_step": 148230, "epoch": 882} {"train_loss": -9.925981521606445, "global_step": 148231, "epoch": 882} {"train_loss": -10.527047157287598, "global_step": 148232, "epoch": 882} {"train_loss": -10.110664367675781, "global_step": 148233, "epoch": 882} {"train_loss": -10.553378105163574, "global_step": 148234, "epoch": 882} {"train_loss": -10.3658447265625, "global_step": 148235, "epoch": 882} {"train_loss": -10.258970260620117, "global_step": 148236, "epoch": 882} {"train_loss": -10.676608085632324, "global_step": 148237, "epoch": 882} {"train_loss": -10.429916381835938, "global_step": 148238, "epoch": 882} {"train_loss": -10.231974601745605, "global_step": 148239, "epoch": 882} {"train_loss": -10.75042724609375, "global_step": 148240, "epoch": 882} {"train_loss": -10.157872200012207, "global_step": 148241, "epoch": 882} {"train_loss": -10.612403869628906, "global_step": 148242, "epoch": 882} {"train_loss": -10.77447509765625, "global_step": 148243, "epoch": 882} {"train_loss": -10.52847957611084, "global_step": 148244, "epoch": 882} {"train_loss": -10.925134658813477, "global_step": 148245, "epoch": 882} {"train_loss": -10.78931999206543, "global_step": 148246, "epoch": 882} {"train_loss": -10.64436149597168, "global_step": 148247, "epoch": 882} {"train_loss": -10.527532577514648, "global_step": 148248, "epoch": 882} {"train_loss": -10.834919929504395, "global_step": 148249, "epoch": 882} {"train_loss": -10.814458847045898, "global_step": 148250, "epoch": 882} {"train_loss": -10.686729431152344, "global_step": 148251, "epoch": 882} {"train_loss": -10.97169303894043, "global_step": 148252, "epoch": 882} {"train_loss": -10.603010177612305, "global_step": 148253, "epoch": 882} {"train_loss": -10.854726791381836, "global_step": 148254, "epoch": 882} {"train_loss": -10.710359573364258, "global_step": 148255, "epoch": 882} {"train_loss": -10.567829132080078, "global_step": 148256, "epoch": 882} {"train_loss": -10.793001174926758, "global_step": 148257, "epoch": 882} {"train_loss": -10.518080711364746, "global_step": 148258, "epoch": 882} {"train_loss": -10.742874145507812, "global_step": 148259, "epoch": 882} {"train_loss": -10.71528434753418, "global_step": 148260, "epoch": 882} {"train_loss": -10.569921493530273, "global_step": 148261, "epoch": 882} {"train_loss": -10.81550121307373, "global_step": 148262, "epoch": 882} {"train_loss": -10.770885467529297, "global_step": 148263, "epoch": 882} {"train_loss": -10.680784225463867, "global_step": 148264, "epoch": 882} {"train_loss": -10.95222282409668, "global_step": 148265, "epoch": 882} {"train_loss": -10.817744255065918, "global_step": 148266, "epoch": 882} {"train_loss": -11.052288055419922, "global_step": 148267, "epoch": 882} {"train_loss": -10.994112968444824, "global_step": 148268, "epoch": 882} {"train_loss": -11.03260612487793, "global_step": 148269, "epoch": 882} {"train_loss": -10.83944320678711, "global_step": 148270, "epoch": 882} {"train_loss": -10.756160736083984, "global_step": 148271, "epoch": 882} {"train_loss": -10.384281158447266, "global_step": 148272, "epoch": 882} {"train_loss": -10.742382049560547, "global_step": 148273, "epoch": 882} {"train_loss": -11.042654037475586, "global_step": 148274, "epoch": 882} {"train_loss": -11.072548866271973, "global_step": 148275, "epoch": 882} {"train_loss": -11.065065383911133, "global_step": 148276, "epoch": 882} {"train_loss": -10.906597137451172, "global_step": 148277, "epoch": 882} {"train_loss": -11.11454963684082, "global_step": 148278, "epoch": 882} {"train_loss": -10.813433647155762, "global_step": 148279, "epoch": 882} {"train_loss": -10.763723373413086, "global_step": 148280, "epoch": 882} {"train_loss": -10.79560661315918, "global_step": 148281, "epoch": 882} {"train_loss": -10.874589920043945, "global_step": 148282, "epoch": 882} {"train_loss": -10.660765647888184, "global_step": 148283, "epoch": 882} {"train_loss": -10.592874526977539, "global_step": 148284, "epoch": 882} {"train_loss": -10.677544593811035, "global_step": 148285, "epoch": 882} {"train_loss": -11.03837776184082, "global_step": 148286, "epoch": 882} {"train_loss": -10.808748245239258, "global_step": 148287, "epoch": 882} {"train_loss": -10.846343994140625, "global_step": 148288, "epoch": 882} {"train_loss": -10.720368385314941, "global_step": 148289, "epoch": 882} {"train_loss": -10.84373664855957, "global_step": 148290, "epoch": 882} {"train_loss": -10.54155158996582, "global_step": 148291, "epoch": 882} {"train_loss": -10.761921882629395, "global_step": 148292, "epoch": 882} {"train_loss": -10.945302963256836, "global_step": 148293, "epoch": 882} {"train_loss": -11.064815521240234, "global_step": 148294, "epoch": 882} {"train_loss": -10.835195541381836, "global_step": 148295, "epoch": 882} {"train_loss": -10.880069732666016, "global_step": 148296, "epoch": 882} {"train_loss": -10.9950532913208, "global_step": 148297, "epoch": 882} {"train_loss": -10.80970573425293, "global_step": 148298, "epoch": 882} {"train_loss": -10.740732192993164, "global_step": 148299, "epoch": 882} {"train_loss": -10.679067611694336, "global_step": 148300, "epoch": 882} {"train_loss": -10.426567077636719, "global_step": 148301, "epoch": 882} {"train_loss": -10.924468994140625, "global_step": 148302, "epoch": 882} {"train_loss": -10.20248794555664, "global_step": 148303, "epoch": 882} {"train_loss": -10.75936508178711, "global_step": 148304, "epoch": 882} {"train_loss": -10.507033348083496, "global_step": 148305, "epoch": 882} {"train_loss": -10.816740036010742, "global_step": 148306, "epoch": 882} {"train_loss": -10.32624626159668, "global_step": 148307, "epoch": 882} {"train_loss": -10.938231468200684, "global_step": 148308, "epoch": 882} {"train_loss": -10.006790161132812, "global_step": 148309, "epoch": 882} {"train_loss": -10.998310089111328, "global_step": 148310, "epoch": 882} {"train_loss": -10.024947166442871, "global_step": 148311, "epoch": 882} {"train_loss": -10.061372756958008, "global_step": 148312, "epoch": 882} {"train_loss": -10.370985984802246, "global_step": 148313, "epoch": 882} {"train_loss": -10.749824523925781, "global_step": 148314, "epoch": 882} {"train_loss": -10.3517484664917, "global_step": 148315, "epoch": 882} {"train_loss": -10.660704612731934, "global_step": 148316, "epoch": 882} {"train_loss": -9.815910339355469, "global_step": 148317, "epoch": 882} {"train_loss": -10.2393217086792, "global_step": 148318, "epoch": 882} {"train_loss": -10.075254440307617, "global_step": 148319, "epoch": 882} {"train_loss": -9.198331832885742, "global_step": 148320, "epoch": 882} {"train_loss": -10.657670021057129, "global_step": 148321, "epoch": 882} {"train_loss": -9.78587532043457, "global_step": 148322, "epoch": 882} {"train_loss": -10.470978736877441, "global_step": 148323, "epoch": 882} {"train_loss": -9.718302726745605, "global_step": 148324, "epoch": 882} {"train_loss": -9.706738471984863, "global_step": 148325, "epoch": 882} {"train_loss": -9.809043884277344, "global_step": 148326, "epoch": 882} {"train_loss": -9.876129150390625, "global_step": 148327, "epoch": 882} {"train_loss": -9.986272811889648, "global_step": 148328, "epoch": 882} {"train_loss": -9.915986061096191, "global_step": 148329, "epoch": 882} {"train_loss": -10.472823143005371, "global_step": 148330, "epoch": 882} {"train_loss": -9.97940731048584, "global_step": 148331, "epoch": 882} {"train_loss": -10.401679992675781, "global_step": 148332, "epoch": 882} {"train_loss": -10.168244361877441, "global_step": 148333, "epoch": 882} {"train_loss": -10.036090850830078, "global_step": 148334, "epoch": 882} {"train_loss": -10.604937553405762, "global_step": 148335, "epoch": 882} {"train_loss": -9.990732192993164, "global_step": 148336, "epoch": 882} {"train_loss": -10.532574653625488, "global_step": 148337, "epoch": 882} {"train_loss": -10.283374786376953, "global_step": 148338, "epoch": 882} {"train_loss": -10.376899719238281, "global_step": 148339, "epoch": 882} {"train_loss": -10.411515235900879, "global_step": 148340, "epoch": 882} {"train_loss": -10.181473731994629, "global_step": 148341, "epoch": 882} {"train_loss": -10.601821899414062, "global_step": 148342, "epoch": 882} {"train_loss": -10.54743132137117, "global_step": 148343, "epoch": 882, "val_loss": 228455.40625} {"train_loss": -10.497906684875488, "global_step": 148344, "epoch": 883} {"train_loss": -10.327524185180664, "global_step": 148345, "epoch": 883} {"train_loss": -10.404165267944336, "global_step": 148346, "epoch": 883} {"train_loss": -10.4176025390625, "global_step": 148347, "epoch": 883} {"train_loss": -10.263147354125977, "global_step": 148348, "epoch": 883} {"train_loss": -10.385774612426758, "global_step": 148349, "epoch": 883} {"train_loss": -10.245492935180664, "global_step": 148350, "epoch": 883} {"train_loss": -10.616296768188477, "global_step": 148351, "epoch": 883} {"train_loss": -10.476463317871094, "global_step": 148352, "epoch": 883} {"train_loss": -10.610023498535156, "global_step": 148353, "epoch": 883} {"train_loss": -10.62566089630127, "global_step": 148354, "epoch": 883} {"train_loss": -10.600086212158203, "global_step": 148355, "epoch": 883} {"train_loss": -10.390387535095215, "global_step": 148356, "epoch": 883} {"train_loss": -10.36169719696045, "global_step": 148357, "epoch": 883} {"train_loss": -10.679489135742188, "global_step": 148358, "epoch": 883} {"train_loss": -10.214288711547852, "global_step": 148359, "epoch": 883} {"train_loss": -10.692061424255371, "global_step": 148360, "epoch": 883} {"train_loss": -10.45413589477539, "global_step": 148361, "epoch": 883} {"train_loss": -10.751456260681152, "global_step": 148362, "epoch": 883} {"train_loss": -10.561466217041016, "global_step": 148363, "epoch": 883} {"train_loss": -10.363631248474121, "global_step": 148364, "epoch": 883} {"train_loss": -10.762303352355957, "global_step": 148365, "epoch": 883} {"train_loss": -10.400081634521484, "global_step": 148366, "epoch": 883} {"train_loss": -10.692526817321777, "global_step": 148367, "epoch": 883} {"train_loss": -10.559341430664062, "global_step": 148368, "epoch": 883} {"train_loss": -10.79071044921875, "global_step": 148369, "epoch": 883} {"train_loss": -10.58911418914795, "global_step": 148370, "epoch": 883} {"train_loss": -10.576568603515625, "global_step": 148371, "epoch": 883} {"train_loss": -10.446535110473633, "global_step": 148372, "epoch": 883} {"train_loss": -10.42280387878418, "global_step": 148373, "epoch": 883} {"train_loss": -10.837678909301758, "global_step": 148374, "epoch": 883} {"train_loss": -10.326740264892578, "global_step": 148375, "epoch": 883} {"train_loss": -10.744377136230469, "global_step": 148376, "epoch": 883} {"train_loss": -10.505081176757812, "global_step": 148377, "epoch": 883} {"train_loss": -10.704773902893066, "global_step": 148378, "epoch": 883} {"train_loss": -10.15732192993164, "global_step": 148379, "epoch": 883} {"train_loss": -10.800539016723633, "global_step": 148380, "epoch": 883} {"train_loss": -10.175053596496582, "global_step": 148381, "epoch": 883} {"train_loss": -10.664389610290527, "global_step": 148382, "epoch": 883} {"train_loss": -10.20254135131836, "global_step": 148383, "epoch": 883} {"train_loss": -10.37637710571289, "global_step": 148384, "epoch": 883} {"train_loss": -10.386662483215332, "global_step": 148385, "epoch": 883} {"train_loss": -10.18483829498291, "global_step": 148386, "epoch": 883} {"train_loss": -10.687437057495117, "global_step": 148387, "epoch": 883} {"train_loss": -10.218901634216309, "global_step": 148388, "epoch": 883} {"train_loss": -10.470743179321289, "global_step": 148389, "epoch": 883} {"train_loss": -10.226642608642578, "global_step": 148390, "epoch": 883} {"train_loss": -10.67781925201416, "global_step": 148391, "epoch": 883} {"train_loss": -10.598836898803711, "global_step": 148392, "epoch": 883} {"train_loss": -10.317298889160156, "global_step": 148393, "epoch": 883} {"train_loss": -10.798120498657227, "global_step": 148394, "epoch": 883} {"train_loss": -10.493266105651855, "global_step": 148395, "epoch": 883} {"train_loss": -10.804704666137695, "global_step": 148396, "epoch": 883} {"train_loss": -10.644935607910156, "global_step": 148397, "epoch": 883} {"train_loss": -10.65576171875, "global_step": 148398, "epoch": 883} {"train_loss": -10.918594360351562, "global_step": 148399, "epoch": 883} {"train_loss": -10.853998184204102, "global_step": 148400, "epoch": 883} {"train_loss": -10.721160888671875, "global_step": 148401, "epoch": 883} {"train_loss": -10.903043746948242, "global_step": 148402, "epoch": 883} {"train_loss": -10.494585037231445, "global_step": 148403, "epoch": 883} {"train_loss": -10.881738662719727, "global_step": 148404, "epoch": 883} {"train_loss": -10.748880386352539, "global_step": 148405, "epoch": 883} {"train_loss": -11.000944137573242, "global_step": 148406, "epoch": 883} {"train_loss": -10.87541389465332, "global_step": 148407, "epoch": 883} {"train_loss": -10.817654609680176, "global_step": 148408, "epoch": 883} {"train_loss": -10.909144401550293, "global_step": 148409, "epoch": 883} {"train_loss": -10.804681777954102, "global_step": 148410, "epoch": 883} {"train_loss": -10.875083923339844, "global_step": 148411, "epoch": 883} {"train_loss": -11.116771697998047, "global_step": 148412, "epoch": 883} {"train_loss": -11.006224632263184, "global_step": 148413, "epoch": 883} {"train_loss": -11.086475372314453, "global_step": 148414, "epoch": 883} {"train_loss": -11.072265625, "global_step": 148415, "epoch": 883} {"train_loss": -10.875106811523438, "global_step": 148416, "epoch": 883} {"train_loss": -10.729732513427734, "global_step": 148417, "epoch": 883} {"train_loss": -11.04392147064209, "global_step": 148418, "epoch": 883} {"train_loss": -10.869197845458984, "global_step": 148419, "epoch": 883} {"train_loss": -10.64187240600586, "global_step": 148420, "epoch": 883} {"train_loss": -10.898962020874023, "global_step": 148421, "epoch": 883} {"train_loss": -11.05357551574707, "global_step": 148422, "epoch": 883} {"train_loss": -10.850531578063965, "global_step": 148423, "epoch": 883} {"train_loss": -11.177497863769531, "global_step": 148424, "epoch": 883} {"train_loss": -11.04765796661377, "global_step": 148425, "epoch": 883} {"train_loss": -10.886879920959473, "global_step": 148426, "epoch": 883} {"train_loss": -10.813101768493652, "global_step": 148427, "epoch": 883} {"train_loss": -10.854490280151367, "global_step": 148428, "epoch": 883} {"train_loss": -10.76560115814209, "global_step": 148429, "epoch": 883} {"train_loss": -10.741948127746582, "global_step": 148430, "epoch": 883} {"train_loss": -10.899001121520996, "global_step": 148431, "epoch": 883} {"train_loss": -10.436408996582031, "global_step": 148432, "epoch": 883} {"train_loss": -10.591039657592773, "global_step": 148433, "epoch": 883} {"train_loss": -10.350801467895508, "global_step": 148434, "epoch": 883} {"train_loss": -10.519342422485352, "global_step": 148435, "epoch": 883} {"train_loss": -10.590587615966797, "global_step": 148436, "epoch": 883} {"train_loss": -11.10374641418457, "global_step": 148437, "epoch": 883} {"train_loss": -10.533349990844727, "global_step": 148438, "epoch": 883} {"train_loss": -11.003446578979492, "global_step": 148439, "epoch": 883} {"train_loss": -10.224743843078613, "global_step": 148440, "epoch": 883} {"train_loss": -10.690988540649414, "global_step": 148441, "epoch": 883} {"train_loss": -10.667710304260254, "global_step": 148442, "epoch": 883} {"train_loss": -10.710624694824219, "global_step": 148443, "epoch": 883} {"train_loss": -9.559671401977539, "global_step": 148444, "epoch": 883} {"train_loss": -10.32917594909668, "global_step": 148445, "epoch": 883} {"train_loss": -10.029474258422852, "global_step": 148446, "epoch": 883} {"train_loss": -9.898479461669922, "global_step": 148447, "epoch": 883} {"train_loss": -10.460619926452637, "global_step": 148448, "epoch": 883} {"train_loss": -10.51217269897461, "global_step": 148449, "epoch": 883} {"train_loss": -10.553871154785156, "global_step": 148450, "epoch": 883} {"train_loss": -10.654284477233887, "global_step": 148451, "epoch": 883} {"train_loss": -10.698175430297852, "global_step": 148452, "epoch": 883} {"train_loss": -10.700851440429688, "global_step": 148453, "epoch": 883} {"train_loss": -10.551322937011719, "global_step": 148454, "epoch": 883} {"train_loss": -10.523155212402344, "global_step": 148455, "epoch": 883} {"train_loss": -10.481637954711914, "global_step": 148456, "epoch": 883} {"train_loss": -10.303781509399414, "global_step": 148457, "epoch": 883} {"train_loss": -10.488994598388672, "global_step": 148458, "epoch": 883} {"train_loss": -10.612689971923828, "global_step": 148459, "epoch": 883} {"train_loss": -10.365137100219727, "global_step": 148460, "epoch": 883} {"train_loss": -10.422094345092773, "global_step": 148461, "epoch": 883} {"train_loss": -10.18043327331543, "global_step": 148462, "epoch": 883} {"train_loss": -10.419014930725098, "global_step": 148463, "epoch": 883} {"train_loss": -10.799847602844238, "global_step": 148464, "epoch": 883} {"train_loss": -10.557605743408203, "global_step": 148465, "epoch": 883} {"train_loss": -10.543127059936523, "global_step": 148466, "epoch": 883} {"train_loss": -10.807212829589844, "global_step": 148467, "epoch": 883} {"train_loss": -10.561506271362305, "global_step": 148468, "epoch": 883} {"train_loss": -10.732250213623047, "global_step": 148469, "epoch": 883} {"train_loss": -10.69862174987793, "global_step": 148470, "epoch": 883} {"train_loss": -10.861038208007812, "global_step": 148471, "epoch": 883} {"train_loss": -10.832193374633789, "global_step": 148472, "epoch": 883} {"train_loss": -10.728139877319336, "global_step": 148473, "epoch": 883} {"train_loss": -10.766143798828125, "global_step": 148474, "epoch": 883} {"train_loss": -10.741018295288086, "global_step": 148475, "epoch": 883} {"train_loss": -10.50937271118164, "global_step": 148476, "epoch": 883} {"train_loss": -10.324678421020508, "global_step": 148477, "epoch": 883} {"train_loss": -10.65180778503418, "global_step": 148478, "epoch": 883} {"train_loss": -10.364744186401367, "global_step": 148479, "epoch": 883} {"train_loss": -10.508567810058594, "global_step": 148480, "epoch": 883} {"train_loss": -10.730167388916016, "global_step": 148481, "epoch": 883} {"train_loss": -10.58492660522461, "global_step": 148482, "epoch": 883} {"train_loss": -10.887445449829102, "global_step": 148483, "epoch": 883} {"train_loss": -10.68945598602295, "global_step": 148484, "epoch": 883} {"train_loss": -10.433927536010742, "global_step": 148485, "epoch": 883} {"train_loss": -10.699525833129883, "global_step": 148486, "epoch": 883} {"train_loss": -10.123268127441406, "global_step": 148487, "epoch": 883} {"train_loss": -10.675994873046875, "global_step": 148488, "epoch": 883} {"train_loss": -10.54350471496582, "global_step": 148489, "epoch": 883} {"train_loss": -10.718175888061523, "global_step": 148490, "epoch": 883} {"train_loss": -10.69024658203125, "global_step": 148491, "epoch": 883} {"train_loss": -10.703483581542969, "global_step": 148492, "epoch": 883} {"train_loss": -10.901232719421387, "global_step": 148493, "epoch": 883} {"train_loss": -10.763688087463379, "global_step": 148494, "epoch": 883} {"train_loss": -10.696374893188477, "global_step": 148495, "epoch": 883} {"train_loss": -10.875704765319824, "global_step": 148496, "epoch": 883} {"train_loss": -10.713220596313477, "global_step": 148497, "epoch": 883} {"train_loss": -10.673504829406738, "global_step": 148498, "epoch": 883} {"train_loss": -10.796021461486816, "global_step": 148499, "epoch": 883} {"train_loss": -10.40176010131836, "global_step": 148500, "epoch": 883} {"train_loss": -10.871512413024902, "global_step": 148501, "epoch": 883} {"train_loss": -10.403834342956543, "global_step": 148502, "epoch": 883} {"train_loss": -10.422994613647461, "global_step": 148503, "epoch": 883} {"train_loss": -10.749858856201172, "global_step": 148504, "epoch": 883} {"train_loss": -10.597421646118164, "global_step": 148505, "epoch": 883} {"train_loss": -10.553054809570312, "global_step": 148506, "epoch": 883} {"train_loss": -10.64688491821289, "global_step": 148507, "epoch": 883} {"train_loss": -10.459205627441406, "global_step": 148508, "epoch": 883} {"train_loss": -10.834274291992188, "global_step": 148509, "epoch": 883} {"train_loss": -10.528722763061523, "global_step": 148510, "epoch": 883} {"train_loss": -10.613329524085636, "global_step": 148511, "epoch": 883, "val_loss": 228384.953125} {"train_loss": -10.506609916687012, "global_step": 148512, "epoch": 884} {"train_loss": -10.152626991271973, "global_step": 148513, "epoch": 884} {"train_loss": -10.777589797973633, "global_step": 148514, "epoch": 884} {"train_loss": -9.619220733642578, "global_step": 148515, "epoch": 884} {"train_loss": -10.713357925415039, "global_step": 148516, "epoch": 884} {"train_loss": -9.461403846740723, "global_step": 148517, "epoch": 884} {"train_loss": -10.621789932250977, "global_step": 148518, "epoch": 884} {"train_loss": -9.667022705078125, "global_step": 148519, "epoch": 884} {"train_loss": -9.884472846984863, "global_step": 148520, "epoch": 884} {"train_loss": -9.703158378601074, "global_step": 148521, "epoch": 884} {"train_loss": -10.361223220825195, "global_step": 148522, "epoch": 884} {"train_loss": -9.254571914672852, "global_step": 148523, "epoch": 884} {"train_loss": -10.79554557800293, "global_step": 148524, "epoch": 884} {"train_loss": -9.244794845581055, "global_step": 148525, "epoch": 884} {"train_loss": -10.413032531738281, "global_step": 148526, "epoch": 884} {"train_loss": -9.60922622680664, "global_step": 148527, "epoch": 884} {"train_loss": -10.241924285888672, "global_step": 148528, "epoch": 884} {"train_loss": -9.762518882751465, "global_step": 148529, "epoch": 884} {"train_loss": -10.19417953491211, "global_step": 148530, "epoch": 884} {"train_loss": -10.297843933105469, "global_step": 148531, "epoch": 884} {"train_loss": -10.500171661376953, "global_step": 148532, "epoch": 884} {"train_loss": -9.874435424804688, "global_step": 148533, "epoch": 884} {"train_loss": -10.70762825012207, "global_step": 148534, "epoch": 884} {"train_loss": -10.16933822631836, "global_step": 148535, "epoch": 884} {"train_loss": -10.38396167755127, "global_step": 148536, "epoch": 884} {"train_loss": -10.053837776184082, "global_step": 148537, "epoch": 884} {"train_loss": -10.639339447021484, "global_step": 148538, "epoch": 884} {"train_loss": -10.092470169067383, "global_step": 148539, "epoch": 884} {"train_loss": -10.652069091796875, "global_step": 148540, "epoch": 884} {"train_loss": -10.431865692138672, "global_step": 148541, "epoch": 884} {"train_loss": -10.319110870361328, "global_step": 148542, "epoch": 884} {"train_loss": -10.621932983398438, "global_step": 148543, "epoch": 884} {"train_loss": -10.677221298217773, "global_step": 148544, "epoch": 884} {"train_loss": -10.749334335327148, "global_step": 148545, "epoch": 884} {"train_loss": -10.8103666305542, "global_step": 148546, "epoch": 884} {"train_loss": -10.639654159545898, "global_step": 148547, "epoch": 884} {"train_loss": -10.653348922729492, "global_step": 148548, "epoch": 884} {"train_loss": -10.690343856811523, "global_step": 148549, "epoch": 884} {"train_loss": -10.778059959411621, "global_step": 148550, "epoch": 884} {"train_loss": -10.756643295288086, "global_step": 148551, "epoch": 884} {"train_loss": -10.695245742797852, "global_step": 148552, "epoch": 884} {"train_loss": -10.858887672424316, "global_step": 148553, "epoch": 884} {"train_loss": -10.540956497192383, "global_step": 148554, "epoch": 884} {"train_loss": -10.788919448852539, "global_step": 148555, "epoch": 884} {"train_loss": -10.556092262268066, "global_step": 148556, "epoch": 884} {"train_loss": -10.6864595413208, "global_step": 148557, "epoch": 884} {"train_loss": -10.575773239135742, "global_step": 148558, "epoch": 884} {"train_loss": -10.772153854370117, "global_step": 148559, "epoch": 884} {"train_loss": -10.760213851928711, "global_step": 148560, "epoch": 884} {"train_loss": -10.712355613708496, "global_step": 148561, "epoch": 884} {"train_loss": -10.902280807495117, "global_step": 148562, "epoch": 884} {"train_loss": -10.82185173034668, "global_step": 148563, "epoch": 884} {"train_loss": -10.709336280822754, "global_step": 148564, "epoch": 884} {"train_loss": -10.488077163696289, "global_step": 148565, "epoch": 884} {"train_loss": -10.79038143157959, "global_step": 148566, "epoch": 884} {"train_loss": -10.31386661529541, "global_step": 148567, "epoch": 884} {"train_loss": -10.901593208312988, "global_step": 148568, "epoch": 884} {"train_loss": -10.455416679382324, "global_step": 148569, "epoch": 884} {"train_loss": -10.800006866455078, "global_step": 148570, "epoch": 884} {"train_loss": -10.530990600585938, "global_step": 148571, "epoch": 884} {"train_loss": -10.726673126220703, "global_step": 148572, "epoch": 884} {"train_loss": -10.405387878417969, "global_step": 148573, "epoch": 884} {"train_loss": -10.758260726928711, "global_step": 148574, "epoch": 884} {"train_loss": -10.24119758605957, "global_step": 148575, "epoch": 884} {"train_loss": -9.529135704040527, "global_step": 148576, "epoch": 884} {"train_loss": -10.421724319458008, "global_step": 148577, "epoch": 884} {"train_loss": -10.26186752319336, "global_step": 148578, "epoch": 884} {"train_loss": -9.98577880859375, "global_step": 148579, "epoch": 884} {"train_loss": -10.589841842651367, "global_step": 148580, "epoch": 884} {"train_loss": -9.928570747375488, "global_step": 148581, "epoch": 884} {"train_loss": -9.833169937133789, "global_step": 148582, "epoch": 884} {"train_loss": -10.605064392089844, "global_step": 148583, "epoch": 884} {"train_loss": -9.897866249084473, "global_step": 148584, "epoch": 884} {"train_loss": -10.479012489318848, "global_step": 148585, "epoch": 884} {"train_loss": -10.221927642822266, "global_step": 148586, "epoch": 884} {"train_loss": -10.396729469299316, "global_step": 148587, "epoch": 884} {"train_loss": -10.339351654052734, "global_step": 148588, "epoch": 884} {"train_loss": -10.560233116149902, "global_step": 148589, "epoch": 884} {"train_loss": -10.39543628692627, "global_step": 148590, "epoch": 884} {"train_loss": -10.403594017028809, "global_step": 148591, "epoch": 884} {"train_loss": -10.50714111328125, "global_step": 148592, "epoch": 884} {"train_loss": -10.540351867675781, "global_step": 148593, "epoch": 884} {"train_loss": -10.578513145446777, "global_step": 148594, "epoch": 884} {"train_loss": -10.625612258911133, "global_step": 148595, "epoch": 884} {"train_loss": -10.903404235839844, "global_step": 148596, "epoch": 884} {"train_loss": -10.774749755859375, "global_step": 148597, "epoch": 884} {"train_loss": -10.683475494384766, "global_step": 148598, "epoch": 884} {"train_loss": -10.829044342041016, "global_step": 148599, "epoch": 884} {"train_loss": -10.72787094116211, "global_step": 148600, "epoch": 884} {"train_loss": -10.763734817504883, "global_step": 148601, "epoch": 884} {"train_loss": -10.916299819946289, "global_step": 148602, "epoch": 884} {"train_loss": -11.041544914245605, "global_step": 148603, "epoch": 884} {"train_loss": -10.799629211425781, "global_step": 148604, "epoch": 884} {"train_loss": -10.940755844116211, "global_step": 148605, "epoch": 884} {"train_loss": -10.805045127868652, "global_step": 148606, "epoch": 884} {"train_loss": -10.935691833496094, "global_step": 148607, "epoch": 884} {"train_loss": -10.700685501098633, "global_step": 148608, "epoch": 884} {"train_loss": -10.831750869750977, "global_step": 148609, "epoch": 884} {"train_loss": -10.977180480957031, "global_step": 148610, "epoch": 884} {"train_loss": -10.788755416870117, "global_step": 148611, "epoch": 884} {"train_loss": -10.858343124389648, "global_step": 148612, "epoch": 884} {"train_loss": -10.59248161315918, "global_step": 148613, "epoch": 884} {"train_loss": -11.071821212768555, "global_step": 148614, "epoch": 884} {"train_loss": -10.755694389343262, "global_step": 148615, "epoch": 884} {"train_loss": -11.019161224365234, "global_step": 148616, "epoch": 884} {"train_loss": -10.77665901184082, "global_step": 148617, "epoch": 884} {"train_loss": -10.90848159790039, "global_step": 148618, "epoch": 884} {"train_loss": -10.780477523803711, "global_step": 148619, "epoch": 884} {"train_loss": -10.647022247314453, "global_step": 148620, "epoch": 884} {"train_loss": -10.918392181396484, "global_step": 148621, "epoch": 884} {"train_loss": -10.832258224487305, "global_step": 148622, "epoch": 884} {"train_loss": -11.185404777526855, "global_step": 148623, "epoch": 884} {"train_loss": -10.708080291748047, "global_step": 148624, "epoch": 884} {"train_loss": -10.47265625, "global_step": 148625, "epoch": 884} {"train_loss": -10.8150634765625, "global_step": 148626, "epoch": 884} {"train_loss": -10.52495288848877, "global_step": 148627, "epoch": 884} {"train_loss": -10.500965118408203, "global_step": 148628, "epoch": 884} {"train_loss": -10.658939361572266, "global_step": 148629, "epoch": 884} {"train_loss": -10.710686683654785, "global_step": 148630, "epoch": 884} {"train_loss": -10.512033462524414, "global_step": 148631, "epoch": 884} {"train_loss": -10.566703796386719, "global_step": 148632, "epoch": 884} {"train_loss": -10.593517303466797, "global_step": 148633, "epoch": 884} {"train_loss": -10.748167991638184, "global_step": 148634, "epoch": 884} {"train_loss": -10.582254409790039, "global_step": 148635, "epoch": 884} {"train_loss": -10.552499771118164, "global_step": 148636, "epoch": 884} {"train_loss": -10.86894702911377, "global_step": 148637, "epoch": 884} {"train_loss": -11.013814926147461, "global_step": 148638, "epoch": 884} {"train_loss": -11.175342559814453, "global_step": 148639, "epoch": 884} {"train_loss": -10.697081565856934, "global_step": 148640, "epoch": 884} {"train_loss": -10.69235897064209, "global_step": 148641, "epoch": 884} {"train_loss": -10.791458129882812, "global_step": 148642, "epoch": 884} {"train_loss": -11.11669921875, "global_step": 148643, "epoch": 884} {"train_loss": -10.577155113220215, "global_step": 148644, "epoch": 884} {"train_loss": -11.05960464477539, "global_step": 148645, "epoch": 884} {"train_loss": -10.513866424560547, "global_step": 148646, "epoch": 884} {"train_loss": -10.606145858764648, "global_step": 148647, "epoch": 884} {"train_loss": -10.70512580871582, "global_step": 148648, "epoch": 884} {"train_loss": -10.626801490783691, "global_step": 148649, "epoch": 884} {"train_loss": -10.663166046142578, "global_step": 148650, "epoch": 884} {"train_loss": -10.027059555053711, "global_step": 148651, "epoch": 884} {"train_loss": -10.745125770568848, "global_step": 148652, "epoch": 884} {"train_loss": -10.132282257080078, "global_step": 148653, "epoch": 884} {"train_loss": -10.577402114868164, "global_step": 148654, "epoch": 884} {"train_loss": -10.41517448425293, "global_step": 148655, "epoch": 884} {"train_loss": -10.74471378326416, "global_step": 148656, "epoch": 884} {"train_loss": -10.637977600097656, "global_step": 148657, "epoch": 884} {"train_loss": -10.407781600952148, "global_step": 148658, "epoch": 884} {"train_loss": -11.07525634765625, "global_step": 148659, "epoch": 884} {"train_loss": -10.53430461883545, "global_step": 148660, "epoch": 884} {"train_loss": -10.526729583740234, "global_step": 148661, "epoch": 884} {"train_loss": -10.422143936157227, "global_step": 148662, "epoch": 884} {"train_loss": -10.750335693359375, "global_step": 148663, "epoch": 884} {"train_loss": -10.73883056640625, "global_step": 148664, "epoch": 884} {"train_loss": -10.435466766357422, "global_step": 148665, "epoch": 884} {"train_loss": -10.627633094787598, "global_step": 148666, "epoch": 884} {"train_loss": -10.411336898803711, "global_step": 148667, "epoch": 884} {"train_loss": -10.634157180786133, "global_step": 148668, "epoch": 884} {"train_loss": -10.75307846069336, "global_step": 148669, "epoch": 884} {"train_loss": -10.488946914672852, "global_step": 148670, "epoch": 884} {"train_loss": -10.826484680175781, "global_step": 148671, "epoch": 884} {"train_loss": -10.621101379394531, "global_step": 148672, "epoch": 884} {"train_loss": -10.70836067199707, "global_step": 148673, "epoch": 884} {"train_loss": -10.438745498657227, "global_step": 148674, "epoch": 884} {"train_loss": -10.61274528503418, "global_step": 148675, "epoch": 884} {"train_loss": -10.49540901184082, "global_step": 148676, "epoch": 884} {"train_loss": -10.471092224121094, "global_step": 148677, "epoch": 884} {"train_loss": -10.51304817199707, "global_step": 148678, "epoch": 884} {"train_loss": -10.550773859024048, "global_step": 148679, "epoch": 884, "val_loss": 227830.875} {"train_loss": -10.061637878417969, "global_step": 148680, "epoch": 885} {"train_loss": -10.386720657348633, "global_step": 148681, "epoch": 885} {"train_loss": -10.5565824508667, "global_step": 148682, "epoch": 885} {"train_loss": -10.5574951171875, "global_step": 148683, "epoch": 885} {"train_loss": -10.331171035766602, "global_step": 148684, "epoch": 885} {"train_loss": -10.027700424194336, "global_step": 148685, "epoch": 885} {"train_loss": -10.449472427368164, "global_step": 148686, "epoch": 885} {"train_loss": -10.258899688720703, "global_step": 148687, "epoch": 885} {"train_loss": -10.32475471496582, "global_step": 148688, "epoch": 885} {"train_loss": -10.442464828491211, "global_step": 148689, "epoch": 885} {"train_loss": -10.203147888183594, "global_step": 148690, "epoch": 885} {"train_loss": -10.477371215820312, "global_step": 148691, "epoch": 885} {"train_loss": -10.074661254882812, "global_step": 148692, "epoch": 885} {"train_loss": -10.933540344238281, "global_step": 148693, "epoch": 885} {"train_loss": -10.56187915802002, "global_step": 148694, "epoch": 885} {"train_loss": -11.079606056213379, "global_step": 148695, "epoch": 885} {"train_loss": -10.695503234863281, "global_step": 148696, "epoch": 885} {"train_loss": -10.91724967956543, "global_step": 148697, "epoch": 885} {"train_loss": -10.563460350036621, "global_step": 148698, "epoch": 885} {"train_loss": -10.762874603271484, "global_step": 148699, "epoch": 885} {"train_loss": -10.830081939697266, "global_step": 148700, "epoch": 885} {"train_loss": -10.941784858703613, "global_step": 148701, "epoch": 885} {"train_loss": -10.699161529541016, "global_step": 148702, "epoch": 885} {"train_loss": -10.693982124328613, "global_step": 148703, "epoch": 885} {"train_loss": -11.019874572753906, "global_step": 148704, "epoch": 885} {"train_loss": -10.793659210205078, "global_step": 148705, "epoch": 885} {"train_loss": -10.981966018676758, "global_step": 148706, "epoch": 885} {"train_loss": -10.695331573486328, "global_step": 148707, "epoch": 885} {"train_loss": -11.052990913391113, "global_step": 148708, "epoch": 885} {"train_loss": -10.853446960449219, "global_step": 148709, "epoch": 885} {"train_loss": -10.963045120239258, "global_step": 148710, "epoch": 885} {"train_loss": -10.768717765808105, "global_step": 148711, "epoch": 885} {"train_loss": -11.162891387939453, "global_step": 148712, "epoch": 885} {"train_loss": -10.883102416992188, "global_step": 148713, "epoch": 885} {"train_loss": -10.98969841003418, "global_step": 148714, "epoch": 885} {"train_loss": -11.05178451538086, "global_step": 148715, "epoch": 885} {"train_loss": -11.051590919494629, "global_step": 148716, "epoch": 885} {"train_loss": -11.009307861328125, "global_step": 148717, "epoch": 885} {"train_loss": -11.118732452392578, "global_step": 148718, "epoch": 885} {"train_loss": -10.933228492736816, "global_step": 148719, "epoch": 885} {"train_loss": -11.163801193237305, "global_step": 148720, "epoch": 885} {"train_loss": -10.994922637939453, "global_step": 148721, "epoch": 885} {"train_loss": -10.823348999023438, "global_step": 148722, "epoch": 885} {"train_loss": -10.497550964355469, "global_step": 148723, "epoch": 885} {"train_loss": -11.006471633911133, "global_step": 148724, "epoch": 885} {"train_loss": -10.721076965332031, "global_step": 148725, "epoch": 885} {"train_loss": -10.265764236450195, "global_step": 148726, "epoch": 885} {"train_loss": -10.811005592346191, "global_step": 148727, "epoch": 885} {"train_loss": -10.76315689086914, "global_step": 148728, "epoch": 885} {"train_loss": -10.8038330078125, "global_step": 148729, "epoch": 885} {"train_loss": -10.231535911560059, "global_step": 148730, "epoch": 885} {"train_loss": -9.830738067626953, "global_step": 148731, "epoch": 885} {"train_loss": -10.6857271194458, "global_step": 148732, "epoch": 885} {"train_loss": -10.930274963378906, "global_step": 148733, "epoch": 885} {"train_loss": -10.799795150756836, "global_step": 148734, "epoch": 885} {"train_loss": -10.480430603027344, "global_step": 148735, "epoch": 885} {"train_loss": -10.875804901123047, "global_step": 148736, "epoch": 885} {"train_loss": -10.899948120117188, "global_step": 148737, "epoch": 885} {"train_loss": -10.728133201599121, "global_step": 148738, "epoch": 885} {"train_loss": -11.01716136932373, "global_step": 148739, "epoch": 885} {"train_loss": -10.824448585510254, "global_step": 148740, "epoch": 885} {"train_loss": -10.829133987426758, "global_step": 148741, "epoch": 885} {"train_loss": -10.685708999633789, "global_step": 148742, "epoch": 885} {"train_loss": -10.812183380126953, "global_step": 148743, "epoch": 885} {"train_loss": -10.630537033081055, "global_step": 148744, "epoch": 885} {"train_loss": -11.099149703979492, "global_step": 148745, "epoch": 885} {"train_loss": -10.333972930908203, "global_step": 148746, "epoch": 885} {"train_loss": -10.625022888183594, "global_step": 148747, "epoch": 885} {"train_loss": -10.559242248535156, "global_step": 148748, "epoch": 885} {"train_loss": -10.88078498840332, "global_step": 148749, "epoch": 885} {"train_loss": -10.614550590515137, "global_step": 148750, "epoch": 885} {"train_loss": -10.853156089782715, "global_step": 148751, "epoch": 885} {"train_loss": -10.604944229125977, "global_step": 148752, "epoch": 885} {"train_loss": -10.708137512207031, "global_step": 148753, "epoch": 885} {"train_loss": -10.425275802612305, "global_step": 148754, "epoch": 885} {"train_loss": -10.633827209472656, "global_step": 148755, "epoch": 885} {"train_loss": -10.790372848510742, "global_step": 148756, "epoch": 885} {"train_loss": -10.384368896484375, "global_step": 148757, "epoch": 885} {"train_loss": -11.102354049682617, "global_step": 148758, "epoch": 885} {"train_loss": -10.384635925292969, "global_step": 148759, "epoch": 885} {"train_loss": -10.699081420898438, "global_step": 148760, "epoch": 885} {"train_loss": -10.676480293273926, "global_step": 148761, "epoch": 885} {"train_loss": -10.740949630737305, "global_step": 148762, "epoch": 885} {"train_loss": -10.470766067504883, "global_step": 148763, "epoch": 885} {"train_loss": -10.525885581970215, "global_step": 148764, "epoch": 885} {"train_loss": -10.607280731201172, "global_step": 148765, "epoch": 885} {"train_loss": -10.513426780700684, "global_step": 148766, "epoch": 885} {"train_loss": -10.416452407836914, "global_step": 148767, "epoch": 885} {"train_loss": -10.664344787597656, "global_step": 148768, "epoch": 885} {"train_loss": -10.650254249572754, "global_step": 148769, "epoch": 885} {"train_loss": -10.628708839416504, "global_step": 148770, "epoch": 885} {"train_loss": -10.775331497192383, "global_step": 148771, "epoch": 885} {"train_loss": -10.642762184143066, "global_step": 148772, "epoch": 885} {"train_loss": -10.786433219909668, "global_step": 148773, "epoch": 885} {"train_loss": -10.646320343017578, "global_step": 148774, "epoch": 885} {"train_loss": -10.738365173339844, "global_step": 148775, "epoch": 885} {"train_loss": -10.515454292297363, "global_step": 148776, "epoch": 885} {"train_loss": -10.236217498779297, "global_step": 148777, "epoch": 885} {"train_loss": -10.62409496307373, "global_step": 148778, "epoch": 885} {"train_loss": -10.104795455932617, "global_step": 148779, "epoch": 885} {"train_loss": -10.526860237121582, "global_step": 148780, "epoch": 885} {"train_loss": -9.55600357055664, "global_step": 148781, "epoch": 885} {"train_loss": -9.949697494506836, "global_step": 148782, "epoch": 885} {"train_loss": -10.016919136047363, "global_step": 148783, "epoch": 885} {"train_loss": -10.524417877197266, "global_step": 148784, "epoch": 885} {"train_loss": -10.317829132080078, "global_step": 148785, "epoch": 885} {"train_loss": -10.659975051879883, "global_step": 148786, "epoch": 885} {"train_loss": -10.181026458740234, "global_step": 148787, "epoch": 885} {"train_loss": -10.236004829406738, "global_step": 148788, "epoch": 885} {"train_loss": -10.217573165893555, "global_step": 148789, "epoch": 885} {"train_loss": -10.260845184326172, "global_step": 148790, "epoch": 885} {"train_loss": -10.31289291381836, "global_step": 148791, "epoch": 885} {"train_loss": -10.223519325256348, "global_step": 148792, "epoch": 885} {"train_loss": -10.35079288482666, "global_step": 148793, "epoch": 885} {"train_loss": -10.51050853729248, "global_step": 148794, "epoch": 885} {"train_loss": -9.708484649658203, "global_step": 148795, "epoch": 885} {"train_loss": -10.613855361938477, "global_step": 148796, "epoch": 885} {"train_loss": -10.186405181884766, "global_step": 148797, "epoch": 885} {"train_loss": -9.982138633728027, "global_step": 148798, "epoch": 885} {"train_loss": -10.527618408203125, "global_step": 148799, "epoch": 885} {"train_loss": -10.267662048339844, "global_step": 148800, "epoch": 885} {"train_loss": -9.995708465576172, "global_step": 148801, "epoch": 885} {"train_loss": -10.075549125671387, "global_step": 148802, "epoch": 885} {"train_loss": -10.558581352233887, "global_step": 148803, "epoch": 885} {"train_loss": -10.095752716064453, "global_step": 148804, "epoch": 885} {"train_loss": -10.630073547363281, "global_step": 148805, "epoch": 885} {"train_loss": -10.339540481567383, "global_step": 148806, "epoch": 885} {"train_loss": -10.496686935424805, "global_step": 148807, "epoch": 885} {"train_loss": -10.50107192993164, "global_step": 148808, "epoch": 885} {"train_loss": -10.456825256347656, "global_step": 148809, "epoch": 885} {"train_loss": -10.40082836151123, "global_step": 148810, "epoch": 885} {"train_loss": -10.374391555786133, "global_step": 148811, "epoch": 885} {"train_loss": -10.494373321533203, "global_step": 148812, "epoch": 885} {"train_loss": -10.52882194519043, "global_step": 148813, "epoch": 885} {"train_loss": -10.468482971191406, "global_step": 148814, "epoch": 885} {"train_loss": -10.509942054748535, "global_step": 148815, "epoch": 885} {"train_loss": -10.360780715942383, "global_step": 148816, "epoch": 885} {"train_loss": -10.562850952148438, "global_step": 148817, "epoch": 885} {"train_loss": -10.424919128417969, "global_step": 148818, "epoch": 885} {"train_loss": -10.597497940063477, "global_step": 148819, "epoch": 885} {"train_loss": -10.451727867126465, "global_step": 148820, "epoch": 885} {"train_loss": -10.727807998657227, "global_step": 148821, "epoch": 885} {"train_loss": -10.930521011352539, "global_step": 148822, "epoch": 885} {"train_loss": -10.598372459411621, "global_step": 148823, "epoch": 885} {"train_loss": -10.732812881469727, "global_step": 148824, "epoch": 885} {"train_loss": -10.629216194152832, "global_step": 148825, "epoch": 885} {"train_loss": -10.656906127929688, "global_step": 148826, "epoch": 885} {"train_loss": -10.695744514465332, "global_step": 148827, "epoch": 885} {"train_loss": -10.76839542388916, "global_step": 148828, "epoch": 885} {"train_loss": -10.523445129394531, "global_step": 148829, "epoch": 885} {"train_loss": -10.686847686767578, "global_step": 148830, "epoch": 885} {"train_loss": -10.407525062561035, "global_step": 148831, "epoch": 885} {"train_loss": -10.87169361114502, "global_step": 148832, "epoch": 885} {"train_loss": -10.13223648071289, "global_step": 148833, "epoch": 885} {"train_loss": -10.719398498535156, "global_step": 148834, "epoch": 885} {"train_loss": -10.533180236816406, "global_step": 148835, "epoch": 885} {"train_loss": -10.703554153442383, "global_step": 148836, "epoch": 885} {"train_loss": -10.682430267333984, "global_step": 148837, "epoch": 885} {"train_loss": -10.23974895477295, "global_step": 148838, "epoch": 885} {"train_loss": -10.790485382080078, "global_step": 148839, "epoch": 885} {"train_loss": -10.335456848144531, "global_step": 148840, "epoch": 885} {"train_loss": -10.02784538269043, "global_step": 148841, "epoch": 885} {"train_loss": -10.565174102783203, "global_step": 148842, "epoch": 885} {"train_loss": -10.666154861450195, "global_step": 148843, "epoch": 885} {"train_loss": -10.21190071105957, "global_step": 148844, "epoch": 885} {"train_loss": -10.534133911132812, "global_step": 148845, "epoch": 885} {"train_loss": -10.217634201049805, "global_step": 148846, "epoch": 885} {"train_loss": -10.574753551256089, "global_step": 148847, "epoch": 885, "val_loss": 230082.296875, "train_action_mse_error": 10.000646591186523} {"train_loss": -10.752588272094727, "global_step": 148848, "epoch": 886} {"train_loss": -10.491532325744629, "global_step": 148849, "epoch": 886} {"train_loss": -10.701414108276367, "global_step": 148850, "epoch": 886} {"train_loss": -10.339762687683105, "global_step": 148851, "epoch": 886} {"train_loss": -9.506185531616211, "global_step": 148852, "epoch": 886} {"train_loss": -10.475909233093262, "global_step": 148853, "epoch": 886} {"train_loss": -10.445009231567383, "global_step": 148854, "epoch": 886} {"train_loss": -10.164200782775879, "global_step": 148855, "epoch": 886} {"train_loss": -10.5847806930542, "global_step": 148856, "epoch": 886} {"train_loss": -10.455621719360352, "global_step": 148857, "epoch": 886} {"train_loss": -10.485809326171875, "global_step": 148858, "epoch": 886} {"train_loss": -10.48713493347168, "global_step": 148859, "epoch": 886} {"train_loss": -10.345470428466797, "global_step": 148860, "epoch": 886} {"train_loss": -10.758930206298828, "global_step": 148861, "epoch": 886} {"train_loss": -10.119511604309082, "global_step": 148862, "epoch": 886} {"train_loss": -10.553271293640137, "global_step": 148863, "epoch": 886} {"train_loss": -10.479785919189453, "global_step": 148864, "epoch": 886} {"train_loss": -10.705589294433594, "global_step": 148865, "epoch": 886} {"train_loss": -10.79690170288086, "global_step": 148866, "epoch": 886} {"train_loss": -10.623432159423828, "global_step": 148867, "epoch": 886} {"train_loss": -10.786920547485352, "global_step": 148868, "epoch": 886} {"train_loss": -10.8623628616333, "global_step": 148869, "epoch": 886} {"train_loss": -10.600944519042969, "global_step": 148870, "epoch": 886} {"train_loss": -10.88292407989502, "global_step": 148871, "epoch": 886} {"train_loss": -10.949433326721191, "global_step": 148872, "epoch": 886} {"train_loss": -10.604999542236328, "global_step": 148873, "epoch": 886} {"train_loss": -11.015607833862305, "global_step": 148874, "epoch": 886} {"train_loss": -10.947920799255371, "global_step": 148875, "epoch": 886} {"train_loss": -10.75993824005127, "global_step": 148876, "epoch": 886} {"train_loss": -10.75632381439209, "global_step": 148877, "epoch": 886} {"train_loss": -10.59460735321045, "global_step": 148878, "epoch": 886} {"train_loss": -10.960542678833008, "global_step": 148879, "epoch": 886} {"train_loss": -10.655027389526367, "global_step": 148880, "epoch": 886} {"train_loss": -10.545034408569336, "global_step": 148881, "epoch": 886} {"train_loss": -10.794804573059082, "global_step": 148882, "epoch": 886} {"train_loss": -10.562305450439453, "global_step": 148883, "epoch": 886} {"train_loss": -10.998649597167969, "global_step": 148884, "epoch": 886} {"train_loss": -10.640708923339844, "global_step": 148885, "epoch": 886} {"train_loss": -10.737617492675781, "global_step": 148886, "epoch": 886} {"train_loss": -10.637201309204102, "global_step": 148887, "epoch": 886} {"train_loss": -10.854576110839844, "global_step": 148888, "epoch": 886} {"train_loss": -10.700940132141113, "global_step": 148889, "epoch": 886} {"train_loss": -10.393339157104492, "global_step": 148890, "epoch": 886} {"train_loss": -11.013019561767578, "global_step": 148891, "epoch": 886} {"train_loss": -10.629154205322266, "global_step": 148892, "epoch": 886} {"train_loss": -10.957845687866211, "global_step": 148893, "epoch": 886} {"train_loss": -10.622472763061523, "global_step": 148894, "epoch": 886} {"train_loss": -10.477225303649902, "global_step": 148895, "epoch": 886} {"train_loss": -10.495529174804688, "global_step": 148896, "epoch": 886} {"train_loss": -10.172456741333008, "global_step": 148897, "epoch": 886} {"train_loss": -11.149882316589355, "global_step": 148898, "epoch": 886} {"train_loss": -9.843830108642578, "global_step": 148899, "epoch": 886} {"train_loss": -10.383955001831055, "global_step": 148900, "epoch": 886} {"train_loss": -10.021160125732422, "global_step": 148901, "epoch": 886} {"train_loss": -9.991199493408203, "global_step": 148902, "epoch": 886} {"train_loss": -10.820497512817383, "global_step": 148903, "epoch": 886} {"train_loss": -10.05207347869873, "global_step": 148904, "epoch": 886} {"train_loss": -10.524381637573242, "global_step": 148905, "epoch": 886} {"train_loss": -10.17058277130127, "global_step": 148906, "epoch": 886} {"train_loss": -10.337620735168457, "global_step": 148907, "epoch": 886} {"train_loss": -10.685977935791016, "global_step": 148908, "epoch": 886} {"train_loss": -10.266077995300293, "global_step": 148909, "epoch": 886} {"train_loss": -10.500564575195312, "global_step": 148910, "epoch": 886} {"train_loss": -10.512428283691406, "global_step": 148911, "epoch": 886} {"train_loss": -10.62598705291748, "global_step": 148912, "epoch": 886} {"train_loss": -10.37173843383789, "global_step": 148913, "epoch": 886} {"train_loss": -10.253745079040527, "global_step": 148914, "epoch": 886} {"train_loss": -10.725664138793945, "global_step": 148915, "epoch": 886} {"train_loss": -10.354978561401367, "global_step": 148916, "epoch": 886} {"train_loss": -10.558019638061523, "global_step": 148917, "epoch": 886} {"train_loss": -10.330863952636719, "global_step": 148918, "epoch": 886} {"train_loss": -10.336517333984375, "global_step": 148919, "epoch": 886} {"train_loss": -10.581140518188477, "global_step": 148920, "epoch": 886} {"train_loss": -10.148752212524414, "global_step": 148921, "epoch": 886} {"train_loss": -10.233762741088867, "global_step": 148922, "epoch": 886} {"train_loss": -10.405414581298828, "global_step": 148923, "epoch": 886} {"train_loss": -10.021428108215332, "global_step": 148924, "epoch": 886} {"train_loss": -10.454204559326172, "global_step": 148925, "epoch": 886} {"train_loss": -9.768014907836914, "global_step": 148926, "epoch": 886} {"train_loss": -10.500911712646484, "global_step": 148927, "epoch": 886} {"train_loss": -9.927284240722656, "global_step": 148928, "epoch": 886} {"train_loss": -10.51583194732666, "global_step": 148929, "epoch": 886} {"train_loss": -9.843025207519531, "global_step": 148930, "epoch": 886} {"train_loss": -10.304777145385742, "global_step": 148931, "epoch": 886} {"train_loss": -10.291616439819336, "global_step": 148932, "epoch": 886} {"train_loss": -10.676446914672852, "global_step": 148933, "epoch": 886} {"train_loss": -10.271276473999023, "global_step": 148934, "epoch": 886} {"train_loss": -10.63786506652832, "global_step": 148935, "epoch": 886} {"train_loss": -10.068361282348633, "global_step": 148936, "epoch": 886} {"train_loss": -10.122782707214355, "global_step": 148937, "epoch": 886} {"train_loss": -10.387947082519531, "global_step": 148938, "epoch": 886} {"train_loss": -10.335142135620117, "global_step": 148939, "epoch": 886} {"train_loss": -10.333459854125977, "global_step": 148940, "epoch": 886} {"train_loss": -10.194981575012207, "global_step": 148941, "epoch": 886} {"train_loss": -10.602327346801758, "global_step": 148942, "epoch": 886} {"train_loss": -10.146917343139648, "global_step": 148943, "epoch": 886} {"train_loss": -10.38223648071289, "global_step": 148944, "epoch": 886} {"train_loss": -10.401756286621094, "global_step": 148945, "epoch": 886} {"train_loss": -10.245722770690918, "global_step": 148946, "epoch": 886} {"train_loss": -10.6360502243042, "global_step": 148947, "epoch": 886} {"train_loss": -10.154083251953125, "global_step": 148948, "epoch": 886} {"train_loss": -10.648115158081055, "global_step": 148949, "epoch": 886} {"train_loss": -10.301027297973633, "global_step": 148950, "epoch": 886} {"train_loss": -10.503684997558594, "global_step": 148951, "epoch": 886} {"train_loss": -10.916271209716797, "global_step": 148952, "epoch": 886} {"train_loss": -10.346710205078125, "global_step": 148953, "epoch": 886} {"train_loss": -10.779975891113281, "global_step": 148954, "epoch": 886} {"train_loss": -10.612435340881348, "global_step": 148955, "epoch": 886} {"train_loss": -10.454267501831055, "global_step": 148956, "epoch": 886} {"train_loss": -10.6900053024292, "global_step": 148957, "epoch": 886} {"train_loss": -10.786566734313965, "global_step": 148958, "epoch": 886} {"train_loss": -10.648805618286133, "global_step": 148959, "epoch": 886} {"train_loss": -10.621763229370117, "global_step": 148960, "epoch": 886} {"train_loss": -10.591243743896484, "global_step": 148961, "epoch": 886} {"train_loss": -10.385454177856445, "global_step": 148962, "epoch": 886} {"train_loss": -10.70305061340332, "global_step": 148963, "epoch": 886} {"train_loss": -10.287489891052246, "global_step": 148964, "epoch": 886} {"train_loss": -10.658008575439453, "global_step": 148965, "epoch": 886} {"train_loss": -10.071001052856445, "global_step": 148966, "epoch": 886} {"train_loss": -10.66964340209961, "global_step": 148967, "epoch": 886} {"train_loss": -10.430816650390625, "global_step": 148968, "epoch": 886} {"train_loss": -10.07800006866455, "global_step": 148969, "epoch": 886} {"train_loss": -10.824525833129883, "global_step": 148970, "epoch": 886} {"train_loss": -10.493185997009277, "global_step": 148971, "epoch": 886} {"train_loss": -10.856508255004883, "global_step": 148972, "epoch": 886} {"train_loss": -10.352258682250977, "global_step": 148973, "epoch": 886} {"train_loss": -10.626254081726074, "global_step": 148974, "epoch": 886} {"train_loss": -10.396309852600098, "global_step": 148975, "epoch": 886} {"train_loss": -10.246006965637207, "global_step": 148976, "epoch": 886} {"train_loss": -10.672274589538574, "global_step": 148977, "epoch": 886} {"train_loss": -10.182284355163574, "global_step": 148978, "epoch": 886} {"train_loss": -10.8988037109375, "global_step": 148979, "epoch": 886} {"train_loss": -10.509116172790527, "global_step": 148980, "epoch": 886} {"train_loss": -10.689230918884277, "global_step": 148981, "epoch": 886} {"train_loss": -10.530426979064941, "global_step": 148982, "epoch": 886} {"train_loss": -10.85000228881836, "global_step": 148983, "epoch": 886} {"train_loss": -10.302964210510254, "global_step": 148984, "epoch": 886} {"train_loss": -10.743403434753418, "global_step": 148985, "epoch": 886} {"train_loss": -10.503374099731445, "global_step": 148986, "epoch": 886} {"train_loss": -10.281194686889648, "global_step": 148987, "epoch": 886} {"train_loss": -10.625502586364746, "global_step": 148988, "epoch": 886} {"train_loss": -10.2952299118042, "global_step": 148989, "epoch": 886} {"train_loss": -10.766962051391602, "global_step": 148990, "epoch": 886} {"train_loss": -10.635173797607422, "global_step": 148991, "epoch": 886} {"train_loss": -10.492210388183594, "global_step": 148992, "epoch": 886} {"train_loss": -10.819890975952148, "global_step": 148993, "epoch": 886} {"train_loss": -10.462114334106445, "global_step": 148994, "epoch": 886} {"train_loss": -10.560197830200195, "global_step": 148995, "epoch": 886} {"train_loss": -10.86740493774414, "global_step": 148996, "epoch": 886} {"train_loss": -10.473846435546875, "global_step": 148997, "epoch": 886} {"train_loss": -10.81129264831543, "global_step": 148998, "epoch": 886} {"train_loss": -10.772555351257324, "global_step": 148999, "epoch": 886} {"train_loss": -10.832218170166016, "global_step": 149000, "epoch": 886} {"train_loss": -10.88463306427002, "global_step": 149001, "epoch": 886} {"train_loss": -10.79591178894043, "global_step": 149002, "epoch": 886} {"train_loss": -10.898118019104004, "global_step": 149003, "epoch": 886} {"train_loss": -10.721633911132812, "global_step": 149004, "epoch": 886} {"train_loss": -10.921607971191406, "global_step": 149005, "epoch": 886} {"train_loss": -10.802989959716797, "global_step": 149006, "epoch": 886} {"train_loss": -10.910246849060059, "global_step": 149007, "epoch": 886} {"train_loss": -10.958450317382812, "global_step": 149008, "epoch": 886} {"train_loss": -10.990427017211914, "global_step": 149009, "epoch": 886} {"train_loss": -10.69578742980957, "global_step": 149010, "epoch": 886} {"train_loss": -10.940641403198242, "global_step": 149011, "epoch": 886} {"train_loss": -10.903803825378418, "global_step": 149012, "epoch": 886} {"train_loss": -11.104530334472656, "global_step": 149013, "epoch": 886} {"train_loss": -11.073147773742676, "global_step": 149014, "epoch": 886} {"train_loss": -10.54369824840909, "global_step": 149015, "epoch": 886, "val_loss": 228895.546875} {"train_loss": -10.84322452545166, "global_step": 149016, "epoch": 887} {"train_loss": -10.627201080322266, "global_step": 149017, "epoch": 887} {"train_loss": -10.981189727783203, "global_step": 149018, "epoch": 887} {"train_loss": -10.736152648925781, "global_step": 149019, "epoch": 887} {"train_loss": -10.836480140686035, "global_step": 149020, "epoch": 887} {"train_loss": -10.6426362991333, "global_step": 149021, "epoch": 887} {"train_loss": -11.0571870803833, "global_step": 149022, "epoch": 887} {"train_loss": -11.06678295135498, "global_step": 149023, "epoch": 887} {"train_loss": -10.54118537902832, "global_step": 149024, "epoch": 887} {"train_loss": -11.161510467529297, "global_step": 149025, "epoch": 887} {"train_loss": -10.755276679992676, "global_step": 149026, "epoch": 887} {"train_loss": -10.711433410644531, "global_step": 149027, "epoch": 887} {"train_loss": -10.747676849365234, "global_step": 149028, "epoch": 887} {"train_loss": -10.984755516052246, "global_step": 149029, "epoch": 887} {"train_loss": -10.428866386413574, "global_step": 149030, "epoch": 887} {"train_loss": -10.96928596496582, "global_step": 149031, "epoch": 887} {"train_loss": -11.01927375793457, "global_step": 149032, "epoch": 887} {"train_loss": -10.853473663330078, "global_step": 149033, "epoch": 887} {"train_loss": -10.330002784729004, "global_step": 149034, "epoch": 887} {"train_loss": -10.894737243652344, "global_step": 149035, "epoch": 887} {"train_loss": -10.63182544708252, "global_step": 149036, "epoch": 887} {"train_loss": -10.446268081665039, "global_step": 149037, "epoch": 887} {"train_loss": -10.08774185180664, "global_step": 149038, "epoch": 887} {"train_loss": -10.270614624023438, "global_step": 149039, "epoch": 887} {"train_loss": -10.916056632995605, "global_step": 149040, "epoch": 887} {"train_loss": -10.759572982788086, "global_step": 149041, "epoch": 887} {"train_loss": -10.264216423034668, "global_step": 149042, "epoch": 887} {"train_loss": -10.830266952514648, "global_step": 149043, "epoch": 887} {"train_loss": -10.650287628173828, "global_step": 149044, "epoch": 887} {"train_loss": -11.019746780395508, "global_step": 149045, "epoch": 887} {"train_loss": -10.703949928283691, "global_step": 149046, "epoch": 887} {"train_loss": -10.854488372802734, "global_step": 149047, "epoch": 887} {"train_loss": -10.795503616333008, "global_step": 149048, "epoch": 887} {"train_loss": -10.863960266113281, "global_step": 149049, "epoch": 887} {"train_loss": -11.022336959838867, "global_step": 149050, "epoch": 887} {"train_loss": -10.698556900024414, "global_step": 149051, "epoch": 887} {"train_loss": -10.800050735473633, "global_step": 149052, "epoch": 887} {"train_loss": -10.859617233276367, "global_step": 149053, "epoch": 887} {"train_loss": -10.619993209838867, "global_step": 149054, "epoch": 887} {"train_loss": -10.967942237854004, "global_step": 149055, "epoch": 887} {"train_loss": -10.690503120422363, "global_step": 149056, "epoch": 887} {"train_loss": -10.222625732421875, "global_step": 149057, "epoch": 887} {"train_loss": -10.871667861938477, "global_step": 149058, "epoch": 887} {"train_loss": -10.57295036315918, "global_step": 149059, "epoch": 887} {"train_loss": -10.336494445800781, "global_step": 149060, "epoch": 887} {"train_loss": -10.802486419677734, "global_step": 149061, "epoch": 887} {"train_loss": -10.828512191772461, "global_step": 149062, "epoch": 887} {"train_loss": -10.3189058303833, "global_step": 149063, "epoch": 887} {"train_loss": -10.660521507263184, "global_step": 149064, "epoch": 887} {"train_loss": -10.981607437133789, "global_step": 149065, "epoch": 887} {"train_loss": -10.647150039672852, "global_step": 149066, "epoch": 887} {"train_loss": -10.791357040405273, "global_step": 149067, "epoch": 887} {"train_loss": -10.968679428100586, "global_step": 149068, "epoch": 887} {"train_loss": -10.534696578979492, "global_step": 149069, "epoch": 887} {"train_loss": -10.5306396484375, "global_step": 149070, "epoch": 887} {"train_loss": -10.416109085083008, "global_step": 149071, "epoch": 887} {"train_loss": -10.798002243041992, "global_step": 149072, "epoch": 887} {"train_loss": -10.568044662475586, "global_step": 149073, "epoch": 887} {"train_loss": -10.666788101196289, "global_step": 149074, "epoch": 887} {"train_loss": -10.903815269470215, "global_step": 149075, "epoch": 887} {"train_loss": -10.663932800292969, "global_step": 149076, "epoch": 887} {"train_loss": -10.855788230895996, "global_step": 149077, "epoch": 887} {"train_loss": -10.054051399230957, "global_step": 149078, "epoch": 887} {"train_loss": -10.493975639343262, "global_step": 149079, "epoch": 887} {"train_loss": -10.66417121887207, "global_step": 149080, "epoch": 887} {"train_loss": -10.582233428955078, "global_step": 149081, "epoch": 887} {"train_loss": -10.938721656799316, "global_step": 149082, "epoch": 887} {"train_loss": -10.490781784057617, "global_step": 149083, "epoch": 887} {"train_loss": -10.839792251586914, "global_step": 149084, "epoch": 887} {"train_loss": -10.69052791595459, "global_step": 149085, "epoch": 887} {"train_loss": -10.625053405761719, "global_step": 149086, "epoch": 887} {"train_loss": -10.59895133972168, "global_step": 149087, "epoch": 887} {"train_loss": -10.675712585449219, "global_step": 149088, "epoch": 887} {"train_loss": -10.545312881469727, "global_step": 149089, "epoch": 887} {"train_loss": -10.857231140136719, "global_step": 149090, "epoch": 887} {"train_loss": -10.604524612426758, "global_step": 149091, "epoch": 887} {"train_loss": -10.964500427246094, "global_step": 149092, "epoch": 887} {"train_loss": -10.64016342163086, "global_step": 149093, "epoch": 887} {"train_loss": -10.854009628295898, "global_step": 149094, "epoch": 887} {"train_loss": -10.76706314086914, "global_step": 149095, "epoch": 887} {"train_loss": -10.642541885375977, "global_step": 149096, "epoch": 887} {"train_loss": -10.998329162597656, "global_step": 149097, "epoch": 887} {"train_loss": -10.569477081298828, "global_step": 149098, "epoch": 887} {"train_loss": -10.7406644821167, "global_step": 149099, "epoch": 887} {"train_loss": -10.851715087890625, "global_step": 149100, "epoch": 887} {"train_loss": -10.634867668151855, "global_step": 149101, "epoch": 887} {"train_loss": -10.851668357849121, "global_step": 149102, "epoch": 887} {"train_loss": -10.703980445861816, "global_step": 149103, "epoch": 887} {"train_loss": -10.93037223815918, "global_step": 149104, "epoch": 887} {"train_loss": -10.841550827026367, "global_step": 149105, "epoch": 887} {"train_loss": -10.763908386230469, "global_step": 149106, "epoch": 887} {"train_loss": -10.707189559936523, "global_step": 149107, "epoch": 887} {"train_loss": -10.838708877563477, "global_step": 149108, "epoch": 887} {"train_loss": -10.885604858398438, "global_step": 149109, "epoch": 887} {"train_loss": -10.805678367614746, "global_step": 149110, "epoch": 887} {"train_loss": -10.76545524597168, "global_step": 149111, "epoch": 887} {"train_loss": -10.966312408447266, "global_step": 149112, "epoch": 887} {"train_loss": -11.000560760498047, "global_step": 149113, "epoch": 887} {"train_loss": -10.725957870483398, "global_step": 149114, "epoch": 887} {"train_loss": -10.970253944396973, "global_step": 149115, "epoch": 887} {"train_loss": -10.882370948791504, "global_step": 149116, "epoch": 887} {"train_loss": -10.69968032836914, "global_step": 149117, "epoch": 887} {"train_loss": -10.822014808654785, "global_step": 149118, "epoch": 887} {"train_loss": -10.706727981567383, "global_step": 149119, "epoch": 887} {"train_loss": -10.392065048217773, "global_step": 149120, "epoch": 887} {"train_loss": -10.893457412719727, "global_step": 149121, "epoch": 887} {"train_loss": -10.401737213134766, "global_step": 149122, "epoch": 887} {"train_loss": -10.423494338989258, "global_step": 149123, "epoch": 887} {"train_loss": -11.001501083374023, "global_step": 149124, "epoch": 887} {"train_loss": -10.29446792602539, "global_step": 149125, "epoch": 887} {"train_loss": -10.311115264892578, "global_step": 149126, "epoch": 887} {"train_loss": -10.871208190917969, "global_step": 149127, "epoch": 887} {"train_loss": -10.069811820983887, "global_step": 149128, "epoch": 887} {"train_loss": -10.578256607055664, "global_step": 149129, "epoch": 887} {"train_loss": -10.529130935668945, "global_step": 149130, "epoch": 887} {"train_loss": -10.388803482055664, "global_step": 149131, "epoch": 887} {"train_loss": -10.808066368103027, "global_step": 149132, "epoch": 887} {"train_loss": -10.510004997253418, "global_step": 149133, "epoch": 887} {"train_loss": -10.238310813903809, "global_step": 149134, "epoch": 887} {"train_loss": -10.763191223144531, "global_step": 149135, "epoch": 887} {"train_loss": -10.23604965209961, "global_step": 149136, "epoch": 887} {"train_loss": -10.56109619140625, "global_step": 149137, "epoch": 887} {"train_loss": -10.531534194946289, "global_step": 149138, "epoch": 887} {"train_loss": -10.442441940307617, "global_step": 149139, "epoch": 887} {"train_loss": -10.508072853088379, "global_step": 149140, "epoch": 887} {"train_loss": -10.70610237121582, "global_step": 149141, "epoch": 887} {"train_loss": -10.198729515075684, "global_step": 149142, "epoch": 887} {"train_loss": -10.72005558013916, "global_step": 149143, "epoch": 887} {"train_loss": -10.571579933166504, "global_step": 149144, "epoch": 887} {"train_loss": -10.662007331848145, "global_step": 149145, "epoch": 887} {"train_loss": -10.677623748779297, "global_step": 149146, "epoch": 887} {"train_loss": -10.653066635131836, "global_step": 149147, "epoch": 887} {"train_loss": -10.896385192871094, "global_step": 149148, "epoch": 887} {"train_loss": -10.534605026245117, "global_step": 149149, "epoch": 887} {"train_loss": -10.95962142944336, "global_step": 149150, "epoch": 887} {"train_loss": -10.816588401794434, "global_step": 149151, "epoch": 887} {"train_loss": -10.942448616027832, "global_step": 149152, "epoch": 887} {"train_loss": -10.689345359802246, "global_step": 149153, "epoch": 887} {"train_loss": -10.789512634277344, "global_step": 149154, "epoch": 887} {"train_loss": -10.930335998535156, "global_step": 149155, "epoch": 887} {"train_loss": -10.780082702636719, "global_step": 149156, "epoch": 887} {"train_loss": -11.0963134765625, "global_step": 149157, "epoch": 887} {"train_loss": -10.898420333862305, "global_step": 149158, "epoch": 887} {"train_loss": -10.950881958007812, "global_step": 149159, "epoch": 887} {"train_loss": -10.928606986999512, "global_step": 149160, "epoch": 887} {"train_loss": -10.903520584106445, "global_step": 149161, "epoch": 887} {"train_loss": -11.016127586364746, "global_step": 149162, "epoch": 887} {"train_loss": -11.080554962158203, "global_step": 149163, "epoch": 887} {"train_loss": -10.947091102600098, "global_step": 149164, "epoch": 887} {"train_loss": -11.104154586791992, "global_step": 149165, "epoch": 887} {"train_loss": -10.859760284423828, "global_step": 149166, "epoch": 887} {"train_loss": -10.659759521484375, "global_step": 149167, "epoch": 887} {"train_loss": -10.943022727966309, "global_step": 149168, "epoch": 887} {"train_loss": -10.581239700317383, "global_step": 149169, "epoch": 887} {"train_loss": -10.967299461364746, "global_step": 149170, "epoch": 887} {"train_loss": -10.35716438293457, "global_step": 149171, "epoch": 887} {"train_loss": -10.952198028564453, "global_step": 149172, "epoch": 887} {"train_loss": -10.90271282196045, "global_step": 149173, "epoch": 887} {"train_loss": -10.755577087402344, "global_step": 149174, "epoch": 887} {"train_loss": -10.800222396850586, "global_step": 149175, "epoch": 887} {"train_loss": -11.21562385559082, "global_step": 149176, "epoch": 887} {"train_loss": -10.614827156066895, "global_step": 149177, "epoch": 887} {"train_loss": -10.80711555480957, "global_step": 149178, "epoch": 887} {"train_loss": -10.854969024658203, "global_step": 149179, "epoch": 887} {"train_loss": -10.951288223266602, "global_step": 149180, "epoch": 887} {"train_loss": -10.343446731567383, "global_step": 149181, "epoch": 887} {"train_loss": -10.323999404907227, "global_step": 149182, "epoch": 887} {"train_loss": -10.72138260092054, "global_step": 149183, "epoch": 887, "val_loss": 229651.46875} {"train_loss": -10.00986099243164, "global_step": 149184, "epoch": 888} {"train_loss": -10.427362442016602, "global_step": 149185, "epoch": 888} {"train_loss": -10.704259872436523, "global_step": 149186, "epoch": 888} {"train_loss": -10.152423858642578, "global_step": 149187, "epoch": 888} {"train_loss": -10.505581855773926, "global_step": 149188, "epoch": 888} {"train_loss": -10.903392791748047, "global_step": 149189, "epoch": 888} {"train_loss": -10.369525909423828, "global_step": 149190, "epoch": 888} {"train_loss": -10.150308609008789, "global_step": 149191, "epoch": 888} {"train_loss": -10.704458236694336, "global_step": 149192, "epoch": 888} {"train_loss": -10.424243927001953, "global_step": 149193, "epoch": 888} {"train_loss": -10.463699340820312, "global_step": 149194, "epoch": 888} {"train_loss": -10.524503707885742, "global_step": 149195, "epoch": 888} {"train_loss": -10.58380126953125, "global_step": 149196, "epoch": 888} {"train_loss": -10.25385570526123, "global_step": 149197, "epoch": 888} {"train_loss": -9.762840270996094, "global_step": 149198, "epoch": 888} {"train_loss": -10.220303535461426, "global_step": 149199, "epoch": 888} {"train_loss": -9.966720581054688, "global_step": 149200, "epoch": 888} {"train_loss": -9.7992582321167, "global_step": 149201, "epoch": 888} {"train_loss": -10.574222564697266, "global_step": 149202, "epoch": 888} {"train_loss": -9.606149673461914, "global_step": 149203, "epoch": 888} {"train_loss": -10.063454627990723, "global_step": 149204, "epoch": 888} {"train_loss": -10.331640243530273, "global_step": 149205, "epoch": 888} {"train_loss": -9.471364974975586, "global_step": 149206, "epoch": 888} {"train_loss": -10.544743537902832, "global_step": 149207, "epoch": 888} {"train_loss": -10.065608978271484, "global_step": 149208, "epoch": 888} {"train_loss": -9.97158432006836, "global_step": 149209, "epoch": 888} {"train_loss": -10.599971771240234, "global_step": 149210, "epoch": 888} {"train_loss": -10.27437973022461, "global_step": 149211, "epoch": 888} {"train_loss": -10.057861328125, "global_step": 149212, "epoch": 888} {"train_loss": -10.518692016601562, "global_step": 149213, "epoch": 888} {"train_loss": -10.066344261169434, "global_step": 149214, "epoch": 888} {"train_loss": -10.28246784210205, "global_step": 149215, "epoch": 888} {"train_loss": -10.63351821899414, "global_step": 149216, "epoch": 888} {"train_loss": -10.156379699707031, "global_step": 149217, "epoch": 888} {"train_loss": -10.515555381774902, "global_step": 149218, "epoch": 888} {"train_loss": -10.57783317565918, "global_step": 149219, "epoch": 888} {"train_loss": -10.200834274291992, "global_step": 149220, "epoch": 888} {"train_loss": -10.476238250732422, "global_step": 149221, "epoch": 888} {"train_loss": -10.822114944458008, "global_step": 149222, "epoch": 888} {"train_loss": -10.510808944702148, "global_step": 149223, "epoch": 888} {"train_loss": -10.956466674804688, "global_step": 149224, "epoch": 888} {"train_loss": -10.686552047729492, "global_step": 149225, "epoch": 888} {"train_loss": -10.746564865112305, "global_step": 149226, "epoch": 888} {"train_loss": -10.753755569458008, "global_step": 149227, "epoch": 888} {"train_loss": -10.753332138061523, "global_step": 149228, "epoch": 888} {"train_loss": -10.762557983398438, "global_step": 149229, "epoch": 888} {"train_loss": -10.864677429199219, "global_step": 149230, "epoch": 888} {"train_loss": -10.927743911743164, "global_step": 149231, "epoch": 888} {"train_loss": -10.644240379333496, "global_step": 149232, "epoch": 888} {"train_loss": -10.904394149780273, "global_step": 149233, "epoch": 888} {"train_loss": -10.723199844360352, "global_step": 149234, "epoch": 888} {"train_loss": -10.925569534301758, "global_step": 149235, "epoch": 888} {"train_loss": -10.8569917678833, "global_step": 149236, "epoch": 888} {"train_loss": -11.031688690185547, "global_step": 149237, "epoch": 888} {"train_loss": -10.982426643371582, "global_step": 149238, "epoch": 888} {"train_loss": -10.858606338500977, "global_step": 149239, "epoch": 888} {"train_loss": -11.004547119140625, "global_step": 149240, "epoch": 888} {"train_loss": -10.880831718444824, "global_step": 149241, "epoch": 888} {"train_loss": -10.9044771194458, "global_step": 149242, "epoch": 888} {"train_loss": -10.824453353881836, "global_step": 149243, "epoch": 888} {"train_loss": -10.914825439453125, "global_step": 149244, "epoch": 888} {"train_loss": -10.952733993530273, "global_step": 149245, "epoch": 888} {"train_loss": -11.018022537231445, "global_step": 149246, "epoch": 888} {"train_loss": -11.22482967376709, "global_step": 149247, "epoch": 888} {"train_loss": -11.031898498535156, "global_step": 149248, "epoch": 888} {"train_loss": -11.126948356628418, "global_step": 149249, "epoch": 888} {"train_loss": -10.83816909790039, "global_step": 149250, "epoch": 888} {"train_loss": -11.086155891418457, "global_step": 149251, "epoch": 888} {"train_loss": -10.890783309936523, "global_step": 149252, "epoch": 888} {"train_loss": -10.665727615356445, "global_step": 149253, "epoch": 888} {"train_loss": -10.91964054107666, "global_step": 149254, "epoch": 888} {"train_loss": -11.098105430603027, "global_step": 149255, "epoch": 888} {"train_loss": -10.697242736816406, "global_step": 149256, "epoch": 888} {"train_loss": -10.93101692199707, "global_step": 149257, "epoch": 888} {"train_loss": -10.535638809204102, "global_step": 149258, "epoch": 888} {"train_loss": -11.024624824523926, "global_step": 149259, "epoch": 888} {"train_loss": -10.98115348815918, "global_step": 149260, "epoch": 888} {"train_loss": -10.899142265319824, "global_step": 149261, "epoch": 888} {"train_loss": -10.855807304382324, "global_step": 149262, "epoch": 888} {"train_loss": -10.740849494934082, "global_step": 149263, "epoch": 888} {"train_loss": -9.945930480957031, "global_step": 149264, "epoch": 888} {"train_loss": -9.829429626464844, "global_step": 149265, "epoch": 888} {"train_loss": -10.872112274169922, "global_step": 149266, "epoch": 888} {"train_loss": -9.587430000305176, "global_step": 149267, "epoch": 888} {"train_loss": -10.302960395812988, "global_step": 149268, "epoch": 888} {"train_loss": -10.451345443725586, "global_step": 149269, "epoch": 888} {"train_loss": -10.562667846679688, "global_step": 149270, "epoch": 888} {"train_loss": -9.862499237060547, "global_step": 149271, "epoch": 888} {"train_loss": -10.090948104858398, "global_step": 149272, "epoch": 888} {"train_loss": -9.860357284545898, "global_step": 149273, "epoch": 888} {"train_loss": -9.03632640838623, "global_step": 149274, "epoch": 888} {"train_loss": -10.672330856323242, "global_step": 149275, "epoch": 888} {"train_loss": -8.781489372253418, "global_step": 149276, "epoch": 888} {"train_loss": -10.641600608825684, "global_step": 149277, "epoch": 888} {"train_loss": -9.172163009643555, "global_step": 149278, "epoch": 888} {"train_loss": -10.525976181030273, "global_step": 149279, "epoch": 888} {"train_loss": -9.863966941833496, "global_step": 149280, "epoch": 888} {"train_loss": -9.709335327148438, "global_step": 149281, "epoch": 888} {"train_loss": -10.506567001342773, "global_step": 149282, "epoch": 888} {"train_loss": -9.818865776062012, "global_step": 149283, "epoch": 888} {"train_loss": -10.090054512023926, "global_step": 149284, "epoch": 888} {"train_loss": -10.300498008728027, "global_step": 149285, "epoch": 888} {"train_loss": -10.047855377197266, "global_step": 149286, "epoch": 888} {"train_loss": -10.608417510986328, "global_step": 149287, "epoch": 888} {"train_loss": -10.143464088439941, "global_step": 149288, "epoch": 888} {"train_loss": -10.66491985321045, "global_step": 149289, "epoch": 888} {"train_loss": -10.092557907104492, "global_step": 149290, "epoch": 888} {"train_loss": -10.468430519104004, "global_step": 149291, "epoch": 888} {"train_loss": -10.270952224731445, "global_step": 149292, "epoch": 888} {"train_loss": -10.271173477172852, "global_step": 149293, "epoch": 888} {"train_loss": -10.254064559936523, "global_step": 149294, "epoch": 888} {"train_loss": -10.429313659667969, "global_step": 149295, "epoch": 888} {"train_loss": -10.424318313598633, "global_step": 149296, "epoch": 888} {"train_loss": -10.234346389770508, "global_step": 149297, "epoch": 888} {"train_loss": -10.573768615722656, "global_step": 149298, "epoch": 888} {"train_loss": -10.681903839111328, "global_step": 149299, "epoch": 888} {"train_loss": -10.63153076171875, "global_step": 149300, "epoch": 888} {"train_loss": -10.820070266723633, "global_step": 149301, "epoch": 888} {"train_loss": -10.630467414855957, "global_step": 149302, "epoch": 888} {"train_loss": -10.628934860229492, "global_step": 149303, "epoch": 888} {"train_loss": -10.54591178894043, "global_step": 149304, "epoch": 888} {"train_loss": -10.631281852722168, "global_step": 149305, "epoch": 888} {"train_loss": -10.572793960571289, "global_step": 149306, "epoch": 888} {"train_loss": -10.347450256347656, "global_step": 149307, "epoch": 888} {"train_loss": -10.708269119262695, "global_step": 149308, "epoch": 888} {"train_loss": -10.818384170532227, "global_step": 149309, "epoch": 888} {"train_loss": -10.777087211608887, "global_step": 149310, "epoch": 888} {"train_loss": -10.91705322265625, "global_step": 149311, "epoch": 888} {"train_loss": -10.79684066772461, "global_step": 149312, "epoch": 888} {"train_loss": -10.970417022705078, "global_step": 149313, "epoch": 888} {"train_loss": -10.978755950927734, "global_step": 149314, "epoch": 888} {"train_loss": -11.004612922668457, "global_step": 149315, "epoch": 888} {"train_loss": -10.896604537963867, "global_step": 149316, "epoch": 888} {"train_loss": -10.736771583557129, "global_step": 149317, "epoch": 888} {"train_loss": -10.84744644165039, "global_step": 149318, "epoch": 888} {"train_loss": -10.874002456665039, "global_step": 149319, "epoch": 888} {"train_loss": -10.852391242980957, "global_step": 149320, "epoch": 888} {"train_loss": -10.678953170776367, "global_step": 149321, "epoch": 888} {"train_loss": -10.894956588745117, "global_step": 149322, "epoch": 888} {"train_loss": -10.977404594421387, "global_step": 149323, "epoch": 888} {"train_loss": -10.662574768066406, "global_step": 149324, "epoch": 888} {"train_loss": -10.654314041137695, "global_step": 149325, "epoch": 888} {"train_loss": -10.467391014099121, "global_step": 149326, "epoch": 888} {"train_loss": -10.88825798034668, "global_step": 149327, "epoch": 888} {"train_loss": -10.8971529006958, "global_step": 149328, "epoch": 888} {"train_loss": -10.677413940429688, "global_step": 149329, "epoch": 888} {"train_loss": -10.907023429870605, "global_step": 149330, "epoch": 888} {"train_loss": -10.801280975341797, "global_step": 149331, "epoch": 888} {"train_loss": -10.993053436279297, "global_step": 149332, "epoch": 888} {"train_loss": -10.669830322265625, "global_step": 149333, "epoch": 888} {"train_loss": -10.773904800415039, "global_step": 149334, "epoch": 888} {"train_loss": -10.945993423461914, "global_step": 149335, "epoch": 888} {"train_loss": -10.928484916687012, "global_step": 149336, "epoch": 888} {"train_loss": -10.976320266723633, "global_step": 149337, "epoch": 888} {"train_loss": -11.120328903198242, "global_step": 149338, "epoch": 888} {"train_loss": -10.861446380615234, "global_step": 149339, "epoch": 888} {"train_loss": -10.996787071228027, "global_step": 149340, "epoch": 888} {"train_loss": -11.226167678833008, "global_step": 149341, "epoch": 888} {"train_loss": -10.840527534484863, "global_step": 149342, "epoch": 888} {"train_loss": -11.144429206848145, "global_step": 149343, "epoch": 888} {"train_loss": -10.764071464538574, "global_step": 149344, "epoch": 888} {"train_loss": -10.221051216125488, "global_step": 149345, "epoch": 888} {"train_loss": -10.185205459594727, "global_step": 149346, "epoch": 888} {"train_loss": -10.841468811035156, "global_step": 149347, "epoch": 888} {"train_loss": -9.332671165466309, "global_step": 149348, "epoch": 888} {"train_loss": -10.251046180725098, "global_step": 149349, "epoch": 888} {"train_loss": -10.572002410888672, "global_step": 149350, "epoch": 888} {"train_loss": -10.543147768293109, "global_step": 149351, "epoch": 888, "val_loss": 231168.15625} {"train_loss": -10.735245704650879, "global_step": 149352, "epoch": 889} {"train_loss": -9.721988677978516, "global_step": 149353, "epoch": 889} {"train_loss": -10.294892311096191, "global_step": 149354, "epoch": 889} {"train_loss": -9.55632209777832, "global_step": 149355, "epoch": 889} {"train_loss": -10.064119338989258, "global_step": 149356, "epoch": 889} {"train_loss": -9.918756484985352, "global_step": 149357, "epoch": 889} {"train_loss": -9.955514907836914, "global_step": 149358, "epoch": 889} {"train_loss": -10.720908164978027, "global_step": 149359, "epoch": 889} {"train_loss": -9.968231201171875, "global_step": 149360, "epoch": 889} {"train_loss": -10.346973419189453, "global_step": 149361, "epoch": 889} {"train_loss": -10.639389991760254, "global_step": 149362, "epoch": 889} {"train_loss": -10.746320724487305, "global_step": 149363, "epoch": 889} {"train_loss": -10.63758373260498, "global_step": 149364, "epoch": 889} {"train_loss": -10.672938346862793, "global_step": 149365, "epoch": 889} {"train_loss": -10.854508399963379, "global_step": 149366, "epoch": 889} {"train_loss": -10.553199768066406, "global_step": 149367, "epoch": 889} {"train_loss": -10.558773040771484, "global_step": 149368, "epoch": 889} {"train_loss": -10.556166648864746, "global_step": 149369, "epoch": 889} {"train_loss": -10.503154754638672, "global_step": 149370, "epoch": 889} {"train_loss": -10.701898574829102, "global_step": 149371, "epoch": 889} {"train_loss": -10.57897663116455, "global_step": 149372, "epoch": 889} {"train_loss": -10.572674751281738, "global_step": 149373, "epoch": 889} {"train_loss": -10.968037605285645, "global_step": 149374, "epoch": 889} {"train_loss": -10.57878589630127, "global_step": 149375, "epoch": 889} {"train_loss": -10.642852783203125, "global_step": 149376, "epoch": 889} {"train_loss": -10.6729736328125, "global_step": 149377, "epoch": 889} {"train_loss": -10.618897438049316, "global_step": 149378, "epoch": 889} {"train_loss": -10.832818984985352, "global_step": 149379, "epoch": 889} {"train_loss": -11.186016082763672, "global_step": 149380, "epoch": 889} {"train_loss": -10.66551685333252, "global_step": 149381, "epoch": 889} {"train_loss": -10.781988143920898, "global_step": 149382, "epoch": 889} {"train_loss": -10.93513011932373, "global_step": 149383, "epoch": 889} {"train_loss": -10.59787368774414, "global_step": 149384, "epoch": 889} {"train_loss": -11.02953052520752, "global_step": 149385, "epoch": 889} {"train_loss": -10.790051460266113, "global_step": 149386, "epoch": 889} {"train_loss": -10.700943946838379, "global_step": 149387, "epoch": 889} {"train_loss": -10.955387115478516, "global_step": 149388, "epoch": 889} {"train_loss": -10.885808944702148, "global_step": 149389, "epoch": 889} {"train_loss": -10.385927200317383, "global_step": 149390, "epoch": 889} {"train_loss": -10.898386001586914, "global_step": 149391, "epoch": 889} {"train_loss": -10.61569881439209, "global_step": 149392, "epoch": 889} {"train_loss": -10.727216720581055, "global_step": 149393, "epoch": 889} {"train_loss": -10.82795524597168, "global_step": 149394, "epoch": 889} {"train_loss": -10.625629425048828, "global_step": 149395, "epoch": 889} {"train_loss": -11.150306701660156, "global_step": 149396, "epoch": 889} {"train_loss": -10.687653541564941, "global_step": 149397, "epoch": 889} {"train_loss": -10.867136001586914, "global_step": 149398, "epoch": 889} {"train_loss": -11.069289207458496, "global_step": 149399, "epoch": 889} {"train_loss": -10.829286575317383, "global_step": 149400, "epoch": 889} {"train_loss": -10.789922714233398, "global_step": 149401, "epoch": 889} {"train_loss": -11.078603744506836, "global_step": 149402, "epoch": 889} {"train_loss": -11.113661766052246, "global_step": 149403, "epoch": 889} {"train_loss": -10.979691505432129, "global_step": 149404, "epoch": 889} {"train_loss": -11.127967834472656, "global_step": 149405, "epoch": 889} {"train_loss": -11.02326488494873, "global_step": 149406, "epoch": 889} {"train_loss": -11.002500534057617, "global_step": 149407, "epoch": 889} {"train_loss": -10.804737091064453, "global_step": 149408, "epoch": 889} {"train_loss": -10.702299118041992, "global_step": 149409, "epoch": 889} {"train_loss": -10.807411193847656, "global_step": 149410, "epoch": 889} {"train_loss": -10.958732604980469, "global_step": 149411, "epoch": 889} {"train_loss": -10.380806922912598, "global_step": 149412, "epoch": 889} {"train_loss": -10.542055130004883, "global_step": 149413, "epoch": 889} {"train_loss": -10.80488395690918, "global_step": 149414, "epoch": 889} {"train_loss": -10.333117485046387, "global_step": 149415, "epoch": 889} {"train_loss": -10.226139068603516, "global_step": 149416, "epoch": 889} {"train_loss": -10.33232307434082, "global_step": 149417, "epoch": 889} {"train_loss": -9.567955017089844, "global_step": 149418, "epoch": 889} {"train_loss": -10.226156234741211, "global_step": 149419, "epoch": 889} {"train_loss": -10.4913330078125, "global_step": 149420, "epoch": 889} {"train_loss": -9.916866302490234, "global_step": 149421, "epoch": 889} {"train_loss": -10.525224685668945, "global_step": 149422, "epoch": 889} {"train_loss": -10.250889778137207, "global_step": 149423, "epoch": 889} {"train_loss": -10.084495544433594, "global_step": 149424, "epoch": 889} {"train_loss": -10.311626434326172, "global_step": 149425, "epoch": 889} {"train_loss": -9.849326133728027, "global_step": 149426, "epoch": 889} {"train_loss": -10.27694034576416, "global_step": 149427, "epoch": 889} {"train_loss": -10.667919158935547, "global_step": 149428, "epoch": 889} {"train_loss": -10.470468521118164, "global_step": 149429, "epoch": 889} {"train_loss": -10.600536346435547, "global_step": 149430, "epoch": 889} {"train_loss": -10.453393936157227, "global_step": 149431, "epoch": 889} {"train_loss": -10.556949615478516, "global_step": 149432, "epoch": 889} {"train_loss": -10.461089134216309, "global_step": 149433, "epoch": 889} {"train_loss": -10.62747573852539, "global_step": 149434, "epoch": 889} {"train_loss": -10.60360336303711, "global_step": 149435, "epoch": 889} {"train_loss": -10.389002799987793, "global_step": 149436, "epoch": 889} {"train_loss": -10.538932800292969, "global_step": 149437, "epoch": 889} {"train_loss": -10.460113525390625, "global_step": 149438, "epoch": 889} {"train_loss": -10.069636344909668, "global_step": 149439, "epoch": 889} {"train_loss": -10.525806427001953, "global_step": 149440, "epoch": 889} {"train_loss": -10.1666841506958, "global_step": 149441, "epoch": 889} {"train_loss": -10.329590797424316, "global_step": 149442, "epoch": 889} {"train_loss": -10.48511028289795, "global_step": 149443, "epoch": 889} {"train_loss": -10.32699203491211, "global_step": 149444, "epoch": 889} {"train_loss": -10.444781303405762, "global_step": 149445, "epoch": 889} {"train_loss": -10.432718276977539, "global_step": 149446, "epoch": 889} {"train_loss": -10.609115600585938, "global_step": 149447, "epoch": 889} {"train_loss": -10.2933349609375, "global_step": 149448, "epoch": 889} {"train_loss": -10.64888858795166, "global_step": 149449, "epoch": 889} {"train_loss": -10.306663513183594, "global_step": 149450, "epoch": 889} {"train_loss": -10.63056755065918, "global_step": 149451, "epoch": 889} {"train_loss": -10.76342487335205, "global_step": 149452, "epoch": 889} {"train_loss": -10.676060676574707, "global_step": 149453, "epoch": 889} {"train_loss": -10.44930648803711, "global_step": 149454, "epoch": 889} {"train_loss": -10.752059936523438, "global_step": 149455, "epoch": 889} {"train_loss": -10.662551879882812, "global_step": 149456, "epoch": 889} {"train_loss": -10.79152774810791, "global_step": 149457, "epoch": 889} {"train_loss": -10.704928398132324, "global_step": 149458, "epoch": 889} {"train_loss": -10.675113677978516, "global_step": 149459, "epoch": 889} {"train_loss": -10.672135353088379, "global_step": 149460, "epoch": 889} {"train_loss": -10.807666778564453, "global_step": 149461, "epoch": 889} {"train_loss": -10.975419044494629, "global_step": 149462, "epoch": 889} {"train_loss": -10.947068214416504, "global_step": 149463, "epoch": 889} {"train_loss": -10.984457015991211, "global_step": 149464, "epoch": 889} {"train_loss": -10.619172096252441, "global_step": 149465, "epoch": 889} {"train_loss": -10.791950225830078, "global_step": 149466, "epoch": 889} {"train_loss": -10.82408332824707, "global_step": 149467, "epoch": 889} {"train_loss": -10.996814727783203, "global_step": 149468, "epoch": 889} {"train_loss": -10.648686408996582, "global_step": 149469, "epoch": 889} {"train_loss": -10.865575790405273, "global_step": 149470, "epoch": 889} {"train_loss": -10.608570098876953, "global_step": 149471, "epoch": 889} {"train_loss": -10.969499588012695, "global_step": 149472, "epoch": 889} {"train_loss": -10.498068809509277, "global_step": 149473, "epoch": 889} {"train_loss": -10.635902404785156, "global_step": 149474, "epoch": 889} {"train_loss": -10.777406692504883, "global_step": 149475, "epoch": 889} {"train_loss": -10.321990966796875, "global_step": 149476, "epoch": 889} {"train_loss": -10.721981048583984, "global_step": 149477, "epoch": 889} {"train_loss": -10.785726547241211, "global_step": 149478, "epoch": 889} {"train_loss": -10.543563842773438, "global_step": 149479, "epoch": 889} {"train_loss": -10.749265670776367, "global_step": 149480, "epoch": 889} {"train_loss": -10.44965648651123, "global_step": 149481, "epoch": 889} {"train_loss": -10.604576110839844, "global_step": 149482, "epoch": 889} {"train_loss": -10.340190887451172, "global_step": 149483, "epoch": 889} {"train_loss": -10.327096939086914, "global_step": 149484, "epoch": 889} {"train_loss": -10.740673065185547, "global_step": 149485, "epoch": 889} {"train_loss": -10.210358619689941, "global_step": 149486, "epoch": 889} {"train_loss": -10.931452751159668, "global_step": 149487, "epoch": 889} {"train_loss": -10.42563247680664, "global_step": 149488, "epoch": 889} {"train_loss": -10.54965591430664, "global_step": 149489, "epoch": 889} {"train_loss": -10.35622787475586, "global_step": 149490, "epoch": 889} {"train_loss": -11.032876968383789, "global_step": 149491, "epoch": 889} {"train_loss": -10.699081420898438, "global_step": 149492, "epoch": 889} {"train_loss": -10.734916687011719, "global_step": 149493, "epoch": 889} {"train_loss": -10.423229217529297, "global_step": 149494, "epoch": 889} {"train_loss": -10.582796096801758, "global_step": 149495, "epoch": 889} {"train_loss": -10.816360473632812, "global_step": 149496, "epoch": 889} {"train_loss": -10.763479232788086, "global_step": 149497, "epoch": 889} {"train_loss": -11.035219192504883, "global_step": 149498, "epoch": 889} {"train_loss": -10.888198852539062, "global_step": 149499, "epoch": 889} {"train_loss": -10.957277297973633, "global_step": 149500, "epoch": 889} {"train_loss": -10.803766250610352, "global_step": 149501, "epoch": 889} {"train_loss": -10.804905891418457, "global_step": 149502, "epoch": 889} {"train_loss": -11.016777038574219, "global_step": 149503, "epoch": 889} {"train_loss": -10.80041217803955, "global_step": 149504, "epoch": 889} {"train_loss": -11.028430938720703, "global_step": 149505, "epoch": 889} {"train_loss": -10.860212326049805, "global_step": 149506, "epoch": 889} {"train_loss": -10.93227767944336, "global_step": 149507, "epoch": 889} {"train_loss": -11.03709602355957, "global_step": 149508, "epoch": 889} {"train_loss": -10.751669883728027, "global_step": 149509, "epoch": 889} {"train_loss": -11.191106796264648, "global_step": 149510, "epoch": 889} {"train_loss": -10.959080696105957, "global_step": 149511, "epoch": 889} {"train_loss": -10.974920272827148, "global_step": 149512, "epoch": 889} {"train_loss": -10.85981559753418, "global_step": 149513, "epoch": 889} {"train_loss": -11.090095520019531, "global_step": 149514, "epoch": 889} {"train_loss": -10.742923736572266, "global_step": 149515, "epoch": 889} {"train_loss": -11.082817077636719, "global_step": 149516, "epoch": 889} {"train_loss": -10.885963439941406, "global_step": 149517, "epoch": 889} {"train_loss": -10.533163070678711, "global_step": 149518, "epoch": 889} {"train_loss": -10.63650371347155, "global_step": 149519, "epoch": 889, "val_loss": 231666.765625} {"train_loss": -11.227395057678223, "global_step": 149520, "epoch": 890} {"train_loss": -10.671908378601074, "global_step": 149521, "epoch": 890} {"train_loss": -11.000982284545898, "global_step": 149522, "epoch": 890} {"train_loss": -10.69278335571289, "global_step": 149523, "epoch": 890} {"train_loss": -9.803606033325195, "global_step": 149524, "epoch": 890} {"train_loss": -10.608085632324219, "global_step": 149525, "epoch": 890} {"train_loss": -10.113551139831543, "global_step": 149526, "epoch": 890} {"train_loss": -10.251920700073242, "global_step": 149527, "epoch": 890} {"train_loss": -10.26431655883789, "global_step": 149528, "epoch": 890} {"train_loss": -10.153079986572266, "global_step": 149529, "epoch": 890} {"train_loss": -10.76441764831543, "global_step": 149530, "epoch": 890} {"train_loss": -10.305758476257324, "global_step": 149531, "epoch": 890} {"train_loss": -9.958023071289062, "global_step": 149532, "epoch": 890} {"train_loss": -11.035083770751953, "global_step": 149533, "epoch": 890} {"train_loss": -10.000231742858887, "global_step": 149534, "epoch": 890} {"train_loss": -9.866294860839844, "global_step": 149535, "epoch": 890} {"train_loss": -11.015902519226074, "global_step": 149536, "epoch": 890} {"train_loss": -9.582483291625977, "global_step": 149537, "epoch": 890} {"train_loss": -10.829273223876953, "global_step": 149538, "epoch": 890} {"train_loss": -10.068719863891602, "global_step": 149539, "epoch": 890} {"train_loss": -10.602014541625977, "global_step": 149540, "epoch": 890} {"train_loss": -9.73599624633789, "global_step": 149541, "epoch": 890} {"train_loss": -9.974321365356445, "global_step": 149542, "epoch": 890} {"train_loss": -9.86290168762207, "global_step": 149543, "epoch": 890} {"train_loss": -10.00123119354248, "global_step": 149544, "epoch": 890} {"train_loss": -10.047245979309082, "global_step": 149545, "epoch": 890} {"train_loss": -9.780136108398438, "global_step": 149546, "epoch": 890} {"train_loss": -9.862985610961914, "global_step": 149547, "epoch": 890} {"train_loss": -9.912286758422852, "global_step": 149548, "epoch": 890} {"train_loss": -9.518506050109863, "global_step": 149549, "epoch": 890} {"train_loss": -9.787105560302734, "global_step": 149550, "epoch": 890} {"train_loss": -8.995634078979492, "global_step": 149551, "epoch": 890} {"train_loss": -10.675116539001465, "global_step": 149552, "epoch": 890} {"train_loss": -9.210596084594727, "global_step": 149553, "epoch": 890} {"train_loss": -10.224649429321289, "global_step": 149554, "epoch": 890} {"train_loss": -10.360995292663574, "global_step": 149555, "epoch": 890} {"train_loss": -10.125263214111328, "global_step": 149556, "epoch": 890} {"train_loss": -10.36485481262207, "global_step": 149557, "epoch": 890} {"train_loss": -10.432827949523926, "global_step": 149558, "epoch": 890} {"train_loss": -10.287134170532227, "global_step": 149559, "epoch": 890} {"train_loss": -10.355576515197754, "global_step": 149560, "epoch": 890} {"train_loss": -10.44484806060791, "global_step": 149561, "epoch": 890} {"train_loss": -10.331049919128418, "global_step": 149562, "epoch": 890} {"train_loss": -10.379409790039062, "global_step": 149563, "epoch": 890} {"train_loss": -10.700215339660645, "global_step": 149564, "epoch": 890} {"train_loss": -10.396652221679688, "global_step": 149565, "epoch": 890} {"train_loss": -10.470190048217773, "global_step": 149566, "epoch": 890} {"train_loss": -10.652107238769531, "global_step": 149567, "epoch": 890} {"train_loss": -10.325166702270508, "global_step": 149568, "epoch": 890} {"train_loss": -10.703330039978027, "global_step": 149569, "epoch": 890} {"train_loss": -10.61320972442627, "global_step": 149570, "epoch": 890} {"train_loss": -10.764071464538574, "global_step": 149571, "epoch": 890} {"train_loss": -10.660198211669922, "global_step": 149572, "epoch": 890} {"train_loss": -10.682536125183105, "global_step": 149573, "epoch": 890} {"train_loss": -10.728704452514648, "global_step": 149574, "epoch": 890} {"train_loss": -10.677578926086426, "global_step": 149575, "epoch": 890} {"train_loss": -10.652996063232422, "global_step": 149576, "epoch": 890} {"train_loss": -10.64963150024414, "global_step": 149577, "epoch": 890} {"train_loss": -10.764104843139648, "global_step": 149578, "epoch": 890} {"train_loss": -10.65893840789795, "global_step": 149579, "epoch": 890} {"train_loss": -10.86381721496582, "global_step": 149580, "epoch": 890} {"train_loss": -10.815216064453125, "global_step": 149581, "epoch": 890} {"train_loss": -10.738386154174805, "global_step": 149582, "epoch": 890} {"train_loss": -10.738723754882812, "global_step": 149583, "epoch": 890} {"train_loss": -10.761459350585938, "global_step": 149584, "epoch": 890} {"train_loss": -10.72998332977295, "global_step": 149585, "epoch": 890} {"train_loss": -10.686840057373047, "global_step": 149586, "epoch": 890} {"train_loss": -10.862865447998047, "global_step": 149587, "epoch": 890} {"train_loss": -10.991390228271484, "global_step": 149588, "epoch": 890} {"train_loss": -10.997443199157715, "global_step": 149589, "epoch": 890} {"train_loss": -11.034751892089844, "global_step": 149590, "epoch": 890} {"train_loss": -10.790040969848633, "global_step": 149591, "epoch": 890} {"train_loss": -10.862335205078125, "global_step": 149592, "epoch": 890} {"train_loss": -10.898201942443848, "global_step": 149593, "epoch": 890} {"train_loss": -10.799449920654297, "global_step": 149594, "epoch": 890} {"train_loss": -10.988706588745117, "global_step": 149595, "epoch": 890} {"train_loss": -10.985528945922852, "global_step": 149596, "epoch": 890} {"train_loss": -10.635929107666016, "global_step": 149597, "epoch": 890} {"train_loss": -10.992720603942871, "global_step": 149598, "epoch": 890} {"train_loss": -10.792425155639648, "global_step": 149599, "epoch": 890} {"train_loss": -10.591970443725586, "global_step": 149600, "epoch": 890} {"train_loss": -10.805696487426758, "global_step": 149601, "epoch": 890} {"train_loss": -11.195865631103516, "global_step": 149602, "epoch": 890} {"train_loss": -10.805224418640137, "global_step": 149603, "epoch": 890} {"train_loss": -10.951375961303711, "global_step": 149604, "epoch": 890} {"train_loss": -10.95074462890625, "global_step": 149605, "epoch": 890} {"train_loss": -10.649303436279297, "global_step": 149606, "epoch": 890} {"train_loss": -11.020984649658203, "global_step": 149607, "epoch": 890} {"train_loss": -10.682317733764648, "global_step": 149608, "epoch": 890} {"train_loss": -11.240805625915527, "global_step": 149609, "epoch": 890} {"train_loss": -10.878745079040527, "global_step": 149610, "epoch": 890} {"train_loss": -10.849853515625, "global_step": 149611, "epoch": 890} {"train_loss": -10.59061050415039, "global_step": 149612, "epoch": 890} {"train_loss": -10.987577438354492, "global_step": 149613, "epoch": 890} {"train_loss": -10.47724723815918, "global_step": 149614, "epoch": 890} {"train_loss": -10.825424194335938, "global_step": 149615, "epoch": 890} {"train_loss": -10.750310897827148, "global_step": 149616, "epoch": 890} {"train_loss": -10.814447402954102, "global_step": 149617, "epoch": 890} {"train_loss": -11.104790687561035, "global_step": 149618, "epoch": 890} {"train_loss": -10.215814590454102, "global_step": 149619, "epoch": 890} {"train_loss": -10.551481246948242, "global_step": 149620, "epoch": 890} {"train_loss": -10.416180610656738, "global_step": 149621, "epoch": 890} {"train_loss": -10.787545204162598, "global_step": 149622, "epoch": 890} {"train_loss": -10.616233825683594, "global_step": 149623, "epoch": 890} {"train_loss": -10.50455093383789, "global_step": 149624, "epoch": 890} {"train_loss": -11.168638229370117, "global_step": 149625, "epoch": 890} {"train_loss": -10.931661605834961, "global_step": 149626, "epoch": 890} {"train_loss": -10.800601959228516, "global_step": 149627, "epoch": 890} {"train_loss": -11.214645385742188, "global_step": 149628, "epoch": 890} {"train_loss": -10.777393341064453, "global_step": 149629, "epoch": 890} {"train_loss": -11.099367141723633, "global_step": 149630, "epoch": 890} {"train_loss": -10.969244003295898, "global_step": 149631, "epoch": 890} {"train_loss": -10.96402359008789, "global_step": 149632, "epoch": 890} {"train_loss": -10.861410140991211, "global_step": 149633, "epoch": 890} {"train_loss": -11.145453453063965, "global_step": 149634, "epoch": 890} {"train_loss": -10.495841979980469, "global_step": 149635, "epoch": 890} {"train_loss": -10.928301811218262, "global_step": 149636, "epoch": 890} {"train_loss": -11.04956340789795, "global_step": 149637, "epoch": 890} {"train_loss": -10.90743637084961, "global_step": 149638, "epoch": 890} {"train_loss": -10.812715530395508, "global_step": 149639, "epoch": 890} {"train_loss": -10.509317398071289, "global_step": 149640, "epoch": 890} {"train_loss": -10.431563377380371, "global_step": 149641, "epoch": 890} {"train_loss": -10.495040893554688, "global_step": 149642, "epoch": 890} {"train_loss": -10.31324577331543, "global_step": 149643, "epoch": 890} {"train_loss": -10.618278503417969, "global_step": 149644, "epoch": 890} {"train_loss": -10.57036018371582, "global_step": 149645, "epoch": 890} {"train_loss": -10.387504577636719, "global_step": 149646, "epoch": 890} {"train_loss": -10.266393661499023, "global_step": 149647, "epoch": 890} {"train_loss": -9.97866439819336, "global_step": 149648, "epoch": 890} {"train_loss": -10.581515312194824, "global_step": 149649, "epoch": 890} {"train_loss": -10.419488906860352, "global_step": 149650, "epoch": 890} {"train_loss": -10.473052978515625, "global_step": 149651, "epoch": 890} {"train_loss": -10.312555313110352, "global_step": 149652, "epoch": 890} {"train_loss": -10.133153915405273, "global_step": 149653, "epoch": 890} {"train_loss": -10.489046096801758, "global_step": 149654, "epoch": 890} {"train_loss": -10.211181640625, "global_step": 149655, "epoch": 890} {"train_loss": -10.942794799804688, "global_step": 149656, "epoch": 890} {"train_loss": -9.936384201049805, "global_step": 149657, "epoch": 890} {"train_loss": -10.369987487792969, "global_step": 149658, "epoch": 890} {"train_loss": -10.144144058227539, "global_step": 149659, "epoch": 890} {"train_loss": -10.25130844116211, "global_step": 149660, "epoch": 890} {"train_loss": -10.820764541625977, "global_step": 149661, "epoch": 890} {"train_loss": -9.966102600097656, "global_step": 149662, "epoch": 890} {"train_loss": -10.862932205200195, "global_step": 149663, "epoch": 890} {"train_loss": -10.183507919311523, "global_step": 149664, "epoch": 890} {"train_loss": -10.670354843139648, "global_step": 149665, "epoch": 890} {"train_loss": -10.633596420288086, "global_step": 149666, "epoch": 890} {"train_loss": -10.347762107849121, "global_step": 149667, "epoch": 890} {"train_loss": -10.363435745239258, "global_step": 149668, "epoch": 890} {"train_loss": -10.663784980773926, "global_step": 149669, "epoch": 890} {"train_loss": -10.387526512145996, "global_step": 149670, "epoch": 890} {"train_loss": -10.507490158081055, "global_step": 149671, "epoch": 890} {"train_loss": -10.350080490112305, "global_step": 149672, "epoch": 890} {"train_loss": -10.41274642944336, "global_step": 149673, "epoch": 890} {"train_loss": -10.560327529907227, "global_step": 149674, "epoch": 890} {"train_loss": -10.365474700927734, "global_step": 149675, "epoch": 890} {"train_loss": -10.83730697631836, "global_step": 149676, "epoch": 890} {"train_loss": -10.498366355895996, "global_step": 149677, "epoch": 890} {"train_loss": -10.841907501220703, "global_step": 149678, "epoch": 890} {"train_loss": -10.53265380859375, "global_step": 149679, "epoch": 890} {"train_loss": -10.535158157348633, "global_step": 149680, "epoch": 890} {"train_loss": -10.32770824432373, "global_step": 149681, "epoch": 890} {"train_loss": -10.52059555053711, "global_step": 149682, "epoch": 890} {"train_loss": -10.698358535766602, "global_step": 149683, "epoch": 890} {"train_loss": -10.936127662658691, "global_step": 149684, "epoch": 890} {"train_loss": -10.581079483032227, "global_step": 149685, "epoch": 890} {"train_loss": -10.618688583374023, "global_step": 149686, "epoch": 890} {"train_loss": -10.549622654914856, "global_step": 149687, "epoch": 890, "val_loss": 229060.78125, "train_action_mse_error": 4.487435817718506} {"train_loss": -10.193930625915527, "global_step": 149688, "epoch": 891} {"train_loss": -10.058795928955078, "global_step": 149689, "epoch": 891} {"train_loss": -10.182735443115234, "global_step": 149690, "epoch": 891} {"train_loss": -10.425884246826172, "global_step": 149691, "epoch": 891} {"train_loss": -10.463884353637695, "global_step": 149692, "epoch": 891} {"train_loss": -10.681861877441406, "global_step": 149693, "epoch": 891} {"train_loss": -10.443392753601074, "global_step": 149694, "epoch": 891} {"train_loss": -10.292675018310547, "global_step": 149695, "epoch": 891} {"train_loss": -10.65575122833252, "global_step": 149696, "epoch": 891} {"train_loss": -10.226640701293945, "global_step": 149697, "epoch": 891} {"train_loss": -11.007246017456055, "global_step": 149698, "epoch": 891} {"train_loss": -10.330911636352539, "global_step": 149699, "epoch": 891} {"train_loss": -10.778680801391602, "global_step": 149700, "epoch": 891} {"train_loss": -10.61793041229248, "global_step": 149701, "epoch": 891} {"train_loss": -10.576330184936523, "global_step": 149702, "epoch": 891} {"train_loss": -10.491804122924805, "global_step": 149703, "epoch": 891} {"train_loss": -11.010740280151367, "global_step": 149704, "epoch": 891} {"train_loss": -10.875137329101562, "global_step": 149705, "epoch": 891} {"train_loss": -10.941215515136719, "global_step": 149706, "epoch": 891} {"train_loss": -10.72877311706543, "global_step": 149707, "epoch": 891} {"train_loss": -10.74173641204834, "global_step": 149708, "epoch": 891} {"train_loss": -10.913605690002441, "global_step": 149709, "epoch": 891} {"train_loss": -10.817986488342285, "global_step": 149710, "epoch": 891} {"train_loss": -10.744863510131836, "global_step": 149711, "epoch": 891} {"train_loss": -10.84048843383789, "global_step": 149712, "epoch": 891} {"train_loss": -10.870405197143555, "global_step": 149713, "epoch": 891} {"train_loss": -11.053081512451172, "global_step": 149714, "epoch": 891} {"train_loss": -11.036787033081055, "global_step": 149715, "epoch": 891} {"train_loss": -11.092813491821289, "global_step": 149716, "epoch": 891} {"train_loss": -10.946211814880371, "global_step": 149717, "epoch": 891} {"train_loss": -10.912174224853516, "global_step": 149718, "epoch": 891} {"train_loss": -10.832066535949707, "global_step": 149719, "epoch": 891} {"train_loss": -11.024367332458496, "global_step": 149720, "epoch": 891} {"train_loss": -11.10379695892334, "global_step": 149721, "epoch": 891} {"train_loss": -11.096405029296875, "global_step": 149722, "epoch": 891} {"train_loss": -10.757060050964355, "global_step": 149723, "epoch": 891} {"train_loss": -10.91312313079834, "global_step": 149724, "epoch": 891} {"train_loss": -10.972212791442871, "global_step": 149725, "epoch": 891} {"train_loss": -11.057355880737305, "global_step": 149726, "epoch": 891} {"train_loss": -11.272470474243164, "global_step": 149727, "epoch": 891} {"train_loss": -10.982633590698242, "global_step": 149728, "epoch": 891} {"train_loss": -10.930749893188477, "global_step": 149729, "epoch": 891} {"train_loss": -10.96959400177002, "global_step": 149730, "epoch": 891} {"train_loss": -10.873685836791992, "global_step": 149731, "epoch": 891} {"train_loss": -10.98335075378418, "global_step": 149732, "epoch": 891} {"train_loss": -11.134672164916992, "global_step": 149733, "epoch": 891} {"train_loss": -10.735965728759766, "global_step": 149734, "epoch": 891} {"train_loss": -10.861928939819336, "global_step": 149735, "epoch": 891} {"train_loss": -10.961684226989746, "global_step": 149736, "epoch": 891} {"train_loss": -10.719761848449707, "global_step": 149737, "epoch": 891} {"train_loss": -10.78598690032959, "global_step": 149738, "epoch": 891} {"train_loss": -11.002164840698242, "global_step": 149739, "epoch": 891} {"train_loss": -10.973020553588867, "global_step": 149740, "epoch": 891} {"train_loss": -11.047246932983398, "global_step": 149741, "epoch": 891} {"train_loss": -10.99271011352539, "global_step": 149742, "epoch": 891} {"train_loss": -10.987737655639648, "global_step": 149743, "epoch": 891} {"train_loss": -10.477649688720703, "global_step": 149744, "epoch": 891} {"train_loss": -10.388299942016602, "global_step": 149745, "epoch": 891} {"train_loss": -10.478944778442383, "global_step": 149746, "epoch": 891} {"train_loss": -10.299995422363281, "global_step": 149747, "epoch": 891} {"train_loss": -10.067975997924805, "global_step": 149748, "epoch": 891} {"train_loss": -10.660322189331055, "global_step": 149749, "epoch": 891} {"train_loss": -10.7836275100708, "global_step": 149750, "epoch": 891} {"train_loss": -9.045072555541992, "global_step": 149751, "epoch": 891} {"train_loss": -9.62800407409668, "global_step": 149752, "epoch": 891} {"train_loss": -10.469242095947266, "global_step": 149753, "epoch": 891} {"train_loss": -9.988126754760742, "global_step": 149754, "epoch": 891} {"train_loss": -10.495984077453613, "global_step": 149755, "epoch": 891} {"train_loss": -10.545772552490234, "global_step": 149756, "epoch": 891} {"train_loss": -9.771379470825195, "global_step": 149757, "epoch": 891} {"train_loss": -10.044778823852539, "global_step": 149758, "epoch": 891} {"train_loss": -10.391298294067383, "global_step": 149759, "epoch": 891} {"train_loss": -10.294759750366211, "global_step": 149760, "epoch": 891} {"train_loss": -10.377605438232422, "global_step": 149761, "epoch": 891} {"train_loss": -10.824210166931152, "global_step": 149762, "epoch": 891} {"train_loss": -10.727383613586426, "global_step": 149763, "epoch": 891} {"train_loss": -10.695895195007324, "global_step": 149764, "epoch": 891} {"train_loss": -10.609421730041504, "global_step": 149765, "epoch": 891} {"train_loss": -10.637042999267578, "global_step": 149766, "epoch": 891} {"train_loss": -10.671260833740234, "global_step": 149767, "epoch": 891} {"train_loss": -10.691060066223145, "global_step": 149768, "epoch": 891} {"train_loss": -10.74040412902832, "global_step": 149769, "epoch": 891} {"train_loss": -10.781084060668945, "global_step": 149770, "epoch": 891} {"train_loss": -10.401803970336914, "global_step": 149771, "epoch": 891} {"train_loss": -10.630228042602539, "global_step": 149772, "epoch": 891} {"train_loss": -10.556968688964844, "global_step": 149773, "epoch": 891} {"train_loss": -10.487289428710938, "global_step": 149774, "epoch": 891} {"train_loss": -10.76247787475586, "global_step": 149775, "epoch": 891} {"train_loss": -10.596134185791016, "global_step": 149776, "epoch": 891} {"train_loss": -10.587198257446289, "global_step": 149777, "epoch": 891} {"train_loss": -10.79240894317627, "global_step": 149778, "epoch": 891} {"train_loss": -10.912803649902344, "global_step": 149779, "epoch": 891} {"train_loss": -10.48487663269043, "global_step": 149780, "epoch": 891} {"train_loss": -10.830154418945312, "global_step": 149781, "epoch": 891} {"train_loss": -10.913914680480957, "global_step": 149782, "epoch": 891} {"train_loss": -10.807633399963379, "global_step": 149783, "epoch": 891} {"train_loss": -11.021248817443848, "global_step": 149784, "epoch": 891} {"train_loss": -10.667699813842773, "global_step": 149785, "epoch": 891} {"train_loss": -10.957136154174805, "global_step": 149786, "epoch": 891} {"train_loss": -10.8744535446167, "global_step": 149787, "epoch": 891} {"train_loss": -10.879759788513184, "global_step": 149788, "epoch": 891} {"train_loss": -10.54781723022461, "global_step": 149789, "epoch": 891} {"train_loss": -11.00067138671875, "global_step": 149790, "epoch": 891} {"train_loss": -10.77700424194336, "global_step": 149791, "epoch": 891} {"train_loss": -10.740227699279785, "global_step": 149792, "epoch": 891} {"train_loss": -10.902015686035156, "global_step": 149793, "epoch": 891} {"train_loss": -10.73537826538086, "global_step": 149794, "epoch": 891} {"train_loss": -10.510025024414062, "global_step": 149795, "epoch": 891} {"train_loss": -10.947125434875488, "global_step": 149796, "epoch": 891} {"train_loss": -10.156021118164062, "global_step": 149797, "epoch": 891} {"train_loss": -10.7813138961792, "global_step": 149798, "epoch": 891} {"train_loss": -10.840631484985352, "global_step": 149799, "epoch": 891} {"train_loss": -10.815999984741211, "global_step": 149800, "epoch": 891} {"train_loss": -10.572394371032715, "global_step": 149801, "epoch": 891} {"train_loss": -10.569128036499023, "global_step": 149802, "epoch": 891} {"train_loss": -10.410390853881836, "global_step": 149803, "epoch": 891} {"train_loss": -10.883893013000488, "global_step": 149804, "epoch": 891} {"train_loss": -10.072802543640137, "global_step": 149805, "epoch": 891} {"train_loss": -10.295248985290527, "global_step": 149806, "epoch": 891} {"train_loss": -9.86358642578125, "global_step": 149807, "epoch": 891} {"train_loss": -10.056510925292969, "global_step": 149808, "epoch": 891} {"train_loss": -10.748703002929688, "global_step": 149809, "epoch": 891} {"train_loss": -10.157235145568848, "global_step": 149810, "epoch": 891} {"train_loss": -10.953817367553711, "global_step": 149811, "epoch": 891} {"train_loss": -9.999645233154297, "global_step": 149812, "epoch": 891} {"train_loss": -10.841312408447266, "global_step": 149813, "epoch": 891} {"train_loss": -10.037312507629395, "global_step": 149814, "epoch": 891} {"train_loss": -10.654088973999023, "global_step": 149815, "epoch": 891} {"train_loss": -9.883216857910156, "global_step": 149816, "epoch": 891} {"train_loss": -10.696523666381836, "global_step": 149817, "epoch": 891} {"train_loss": -10.101373672485352, "global_step": 149818, "epoch": 891} {"train_loss": -10.73552131652832, "global_step": 149819, "epoch": 891} {"train_loss": -10.399406433105469, "global_step": 149820, "epoch": 891} {"train_loss": -10.834152221679688, "global_step": 149821, "epoch": 891} {"train_loss": -10.596925735473633, "global_step": 149822, "epoch": 891} {"train_loss": -10.798629760742188, "global_step": 149823, "epoch": 891} {"train_loss": -10.719147682189941, "global_step": 149824, "epoch": 891} {"train_loss": -10.658180236816406, "global_step": 149825, "epoch": 891} {"train_loss": -10.432565689086914, "global_step": 149826, "epoch": 891} {"train_loss": -10.733976364135742, "global_step": 149827, "epoch": 891} {"train_loss": -10.636429786682129, "global_step": 149828, "epoch": 891} {"train_loss": -10.689699172973633, "global_step": 149829, "epoch": 891} {"train_loss": -10.451115608215332, "global_step": 149830, "epoch": 891} {"train_loss": -10.781780242919922, "global_step": 149831, "epoch": 891} {"train_loss": -10.154037475585938, "global_step": 149832, "epoch": 891} {"train_loss": -10.591318130493164, "global_step": 149833, "epoch": 891} {"train_loss": -10.604520797729492, "global_step": 149834, "epoch": 891} {"train_loss": -10.960676193237305, "global_step": 149835, "epoch": 891} {"train_loss": -10.634686470031738, "global_step": 149836, "epoch": 891} {"train_loss": -10.872920989990234, "global_step": 149837, "epoch": 891} {"train_loss": -10.797258377075195, "global_step": 149838, "epoch": 891} {"train_loss": -10.793923377990723, "global_step": 149839, "epoch": 891} {"train_loss": -10.718564987182617, "global_step": 149840, "epoch": 891} {"train_loss": -11.007636070251465, "global_step": 149841, "epoch": 891} {"train_loss": -10.675107955932617, "global_step": 149842, "epoch": 891} {"train_loss": -10.716294288635254, "global_step": 149843, "epoch": 891} {"train_loss": -10.826432228088379, "global_step": 149844, "epoch": 891} {"train_loss": -10.832386016845703, "global_step": 149845, "epoch": 891} {"train_loss": -10.863622665405273, "global_step": 149846, "epoch": 891} {"train_loss": -10.854153633117676, "global_step": 149847, "epoch": 891} {"train_loss": -10.774848937988281, "global_step": 149848, "epoch": 891} {"train_loss": -10.806941986083984, "global_step": 149849, "epoch": 891} {"train_loss": -10.939041137695312, "global_step": 149850, "epoch": 891} {"train_loss": -10.73429012298584, "global_step": 149851, "epoch": 891} {"train_loss": -11.13945198059082, "global_step": 149852, "epoch": 891} {"train_loss": -10.696063995361328, "global_step": 149853, "epoch": 891} {"train_loss": -10.975923538208008, "global_step": 149854, "epoch": 891} {"train_loss": -10.664105602673121, "global_step": 149855, "epoch": 891, "val_loss": 224413.671875} {"train_loss": -11.09762954711914, "global_step": 149856, "epoch": 892} {"train_loss": -10.687248229980469, "global_step": 149857, "epoch": 892} {"train_loss": -10.933954238891602, "global_step": 149858, "epoch": 892} {"train_loss": -10.80712890625, "global_step": 149859, "epoch": 892} {"train_loss": -10.79065990447998, "global_step": 149860, "epoch": 892} {"train_loss": -11.075918197631836, "global_step": 149861, "epoch": 892} {"train_loss": -10.932762145996094, "global_step": 149862, "epoch": 892} {"train_loss": -11.156697273254395, "global_step": 149863, "epoch": 892} {"train_loss": -10.819097518920898, "global_step": 149864, "epoch": 892} {"train_loss": -11.02794075012207, "global_step": 149865, "epoch": 892} {"train_loss": -11.145008087158203, "global_step": 149866, "epoch": 892} {"train_loss": -10.784454345703125, "global_step": 149867, "epoch": 892} {"train_loss": -10.909299850463867, "global_step": 149868, "epoch": 892} {"train_loss": -10.92314338684082, "global_step": 149869, "epoch": 892} {"train_loss": -10.483768463134766, "global_step": 149870, "epoch": 892} {"train_loss": -9.786378860473633, "global_step": 149871, "epoch": 892} {"train_loss": -10.842443466186523, "global_step": 149872, "epoch": 892} {"train_loss": -9.929966926574707, "global_step": 149873, "epoch": 892} {"train_loss": -9.165765762329102, "global_step": 149874, "epoch": 892} {"train_loss": -9.278532028198242, "global_step": 149875, "epoch": 892} {"train_loss": -8.279065132141113, "global_step": 149876, "epoch": 892} {"train_loss": -10.155790328979492, "global_step": 149877, "epoch": 892} {"train_loss": -9.137116432189941, "global_step": 149878, "epoch": 892} {"train_loss": -9.698711395263672, "global_step": 149879, "epoch": 892} {"train_loss": -8.247252464294434, "global_step": 149880, "epoch": 892} {"train_loss": -9.784151077270508, "global_step": 149881, "epoch": 892} {"train_loss": -8.761994361877441, "global_step": 149882, "epoch": 892} {"train_loss": -9.837799072265625, "global_step": 149883, "epoch": 892} {"train_loss": -9.017402648925781, "global_step": 149884, "epoch": 892} {"train_loss": -8.769632339477539, "global_step": 149885, "epoch": 892} {"train_loss": -10.092422485351562, "global_step": 149886, "epoch": 892} {"train_loss": -9.402379989624023, "global_step": 149887, "epoch": 892} {"train_loss": -10.105042457580566, "global_step": 149888, "epoch": 892} {"train_loss": -9.779975891113281, "global_step": 149889, "epoch": 892} {"train_loss": -10.100740432739258, "global_step": 149890, "epoch": 892} {"train_loss": -10.080041885375977, "global_step": 149891, "epoch": 892} {"train_loss": -9.508417129516602, "global_step": 149892, "epoch": 892} {"train_loss": -10.260908126831055, "global_step": 149893, "epoch": 892} {"train_loss": -9.893070220947266, "global_step": 149894, "epoch": 892} {"train_loss": -10.40588092803955, "global_step": 149895, "epoch": 892} {"train_loss": -10.052145004272461, "global_step": 149896, "epoch": 892} {"train_loss": -10.198802947998047, "global_step": 149897, "epoch": 892} {"train_loss": -10.420675277709961, "global_step": 149898, "epoch": 892} {"train_loss": -9.88232421875, "global_step": 149899, "epoch": 892} {"train_loss": -10.504463195800781, "global_step": 149900, "epoch": 892} {"train_loss": -10.314062118530273, "global_step": 149901, "epoch": 892} {"train_loss": -10.47695541381836, "global_step": 149902, "epoch": 892} {"train_loss": -10.306191444396973, "global_step": 149903, "epoch": 892} {"train_loss": -10.311290740966797, "global_step": 149904, "epoch": 892} {"train_loss": -10.43120002746582, "global_step": 149905, "epoch": 892} {"train_loss": -10.556763648986816, "global_step": 149906, "epoch": 892} {"train_loss": -10.689998626708984, "global_step": 149907, "epoch": 892} {"train_loss": -10.524738311767578, "global_step": 149908, "epoch": 892} {"train_loss": -10.448562622070312, "global_step": 149909, "epoch": 892} {"train_loss": -10.443723678588867, "global_step": 149910, "epoch": 892} {"train_loss": -10.55630874633789, "global_step": 149911, "epoch": 892} {"train_loss": -10.716958999633789, "global_step": 149912, "epoch": 892} {"train_loss": -10.678499221801758, "global_step": 149913, "epoch": 892} {"train_loss": -10.626736640930176, "global_step": 149914, "epoch": 892} {"train_loss": -10.604881286621094, "global_step": 149915, "epoch": 892} {"train_loss": -10.782281875610352, "global_step": 149916, "epoch": 892} {"train_loss": -10.566194534301758, "global_step": 149917, "epoch": 892} {"train_loss": -10.554801940917969, "global_step": 149918, "epoch": 892} {"train_loss": -10.609895706176758, "global_step": 149919, "epoch": 892} {"train_loss": -10.840093612670898, "global_step": 149920, "epoch": 892} {"train_loss": -10.473909378051758, "global_step": 149921, "epoch": 892} {"train_loss": -10.66518783569336, "global_step": 149922, "epoch": 892} {"train_loss": -10.658184051513672, "global_step": 149923, "epoch": 892} {"train_loss": -10.737164497375488, "global_step": 149924, "epoch": 892} {"train_loss": -10.776236534118652, "global_step": 149925, "epoch": 892} {"train_loss": -10.751298904418945, "global_step": 149926, "epoch": 892} {"train_loss": -10.615320205688477, "global_step": 149927, "epoch": 892} {"train_loss": -10.694486618041992, "global_step": 149928, "epoch": 892} {"train_loss": -10.629199981689453, "global_step": 149929, "epoch": 892} {"train_loss": -11.004212379455566, "global_step": 149930, "epoch": 892} {"train_loss": -10.664240837097168, "global_step": 149931, "epoch": 892} {"train_loss": -11.063857078552246, "global_step": 149932, "epoch": 892} {"train_loss": -10.9564208984375, "global_step": 149933, "epoch": 892} {"train_loss": -10.932583808898926, "global_step": 149934, "epoch": 892} {"train_loss": -10.821671485900879, "global_step": 149935, "epoch": 892} {"train_loss": -10.924517631530762, "global_step": 149936, "epoch": 892} {"train_loss": -10.903316497802734, "global_step": 149937, "epoch": 892} {"train_loss": -10.826173782348633, "global_step": 149938, "epoch": 892} {"train_loss": -10.501279830932617, "global_step": 149939, "epoch": 892} {"train_loss": -10.922374725341797, "global_step": 149940, "epoch": 892} {"train_loss": -10.735398292541504, "global_step": 149941, "epoch": 892} {"train_loss": -10.844100952148438, "global_step": 149942, "epoch": 892} {"train_loss": -10.755361557006836, "global_step": 149943, "epoch": 892} {"train_loss": -11.018522262573242, "global_step": 149944, "epoch": 892} {"train_loss": -10.766539573669434, "global_step": 149945, "epoch": 892} {"train_loss": -10.819077491760254, "global_step": 149946, "epoch": 892} {"train_loss": -10.950238227844238, "global_step": 149947, "epoch": 892} {"train_loss": -10.937321662902832, "global_step": 149948, "epoch": 892} {"train_loss": -10.517048835754395, "global_step": 149949, "epoch": 892} {"train_loss": -10.836901664733887, "global_step": 149950, "epoch": 892} {"train_loss": -10.631382942199707, "global_step": 149951, "epoch": 892} {"train_loss": -10.628249168395996, "global_step": 149952, "epoch": 892} {"train_loss": -10.678361892700195, "global_step": 149953, "epoch": 892} {"train_loss": -10.908713340759277, "global_step": 149954, "epoch": 892} {"train_loss": -10.702661514282227, "global_step": 149955, "epoch": 892} {"train_loss": -10.934642791748047, "global_step": 149956, "epoch": 892} {"train_loss": -11.073416709899902, "global_step": 149957, "epoch": 892} {"train_loss": -10.667179107666016, "global_step": 149958, "epoch": 892} {"train_loss": -10.88311767578125, "global_step": 149959, "epoch": 892} {"train_loss": -10.956575393676758, "global_step": 149960, "epoch": 892} {"train_loss": -10.820850372314453, "global_step": 149961, "epoch": 892} {"train_loss": -10.795904159545898, "global_step": 149962, "epoch": 892} {"train_loss": -10.85864543914795, "global_step": 149963, "epoch": 892} {"train_loss": -10.867666244506836, "global_step": 149964, "epoch": 892} {"train_loss": -10.67318344116211, "global_step": 149965, "epoch": 892} {"train_loss": -10.798727035522461, "global_step": 149966, "epoch": 892} {"train_loss": -10.519988059997559, "global_step": 149967, "epoch": 892} {"train_loss": -10.084392547607422, "global_step": 149968, "epoch": 892} {"train_loss": -10.72216796875, "global_step": 149969, "epoch": 892} {"train_loss": -10.229172706604004, "global_step": 149970, "epoch": 892} {"train_loss": -10.615073204040527, "global_step": 149971, "epoch": 892} {"train_loss": -10.570819854736328, "global_step": 149972, "epoch": 892} {"train_loss": -10.011086463928223, "global_step": 149973, "epoch": 892} {"train_loss": -10.142532348632812, "global_step": 149974, "epoch": 892} {"train_loss": -10.461782455444336, "global_step": 149975, "epoch": 892} {"train_loss": -10.432109832763672, "global_step": 149976, "epoch": 892} {"train_loss": -10.625844955444336, "global_step": 149977, "epoch": 892} {"train_loss": -10.692787170410156, "global_step": 149978, "epoch": 892} {"train_loss": -10.478540420532227, "global_step": 149979, "epoch": 892} {"train_loss": -10.483081817626953, "global_step": 149980, "epoch": 892} {"train_loss": -10.545835494995117, "global_step": 149981, "epoch": 892} {"train_loss": -10.618878364562988, "global_step": 149982, "epoch": 892} {"train_loss": -10.614521026611328, "global_step": 149983, "epoch": 892} {"train_loss": -10.530052185058594, "global_step": 149984, "epoch": 892} {"train_loss": -10.635292053222656, "global_step": 149985, "epoch": 892} {"train_loss": -10.59866714477539, "global_step": 149986, "epoch": 892} {"train_loss": -10.608171463012695, "global_step": 149987, "epoch": 892} {"train_loss": -10.426214218139648, "global_step": 149988, "epoch": 892} {"train_loss": -10.558135986328125, "global_step": 149989, "epoch": 892} {"train_loss": -10.674419403076172, "global_step": 149990, "epoch": 892} {"train_loss": -10.749555587768555, "global_step": 149991, "epoch": 892} {"train_loss": -10.423213958740234, "global_step": 149992, "epoch": 892} {"train_loss": -10.567704200744629, "global_step": 149993, "epoch": 892} {"train_loss": -10.766703605651855, "global_step": 149994, "epoch": 892} {"train_loss": -10.82728385925293, "global_step": 149995, "epoch": 892} {"train_loss": -11.0103120803833, "global_step": 149996, "epoch": 892} {"train_loss": -10.778192520141602, "global_step": 149997, "epoch": 892} {"train_loss": -11.05169677734375, "global_step": 149998, "epoch": 892} {"train_loss": -10.819496154785156, "global_step": 149999, "epoch": 892} {"train_loss": -10.893991470336914, "global_step": 150000, "epoch": 892} {"train_loss": -10.951082229614258, "global_step": 150001, "epoch": 892} {"train_loss": -10.784295082092285, "global_step": 150002, "epoch": 892} {"train_loss": -10.843997955322266, "global_step": 150003, "epoch": 892} {"train_loss": -10.758966445922852, "global_step": 150004, "epoch": 892} {"train_loss": -10.950126647949219, "global_step": 150005, "epoch": 892} {"train_loss": -10.884153366088867, "global_step": 150006, "epoch": 892} {"train_loss": -10.74614143371582, "global_step": 150007, "epoch": 892} {"train_loss": -10.972445487976074, "global_step": 150008, "epoch": 892} {"train_loss": -10.948257446289062, "global_step": 150009, "epoch": 892} {"train_loss": -10.820816040039062, "global_step": 150010, "epoch": 892} {"train_loss": -10.62816333770752, "global_step": 150011, "epoch": 892} {"train_loss": -10.644190788269043, "global_step": 150012, "epoch": 892} {"train_loss": -10.721589088439941, "global_step": 150013, "epoch": 892} {"train_loss": -10.454307556152344, "global_step": 150014, "epoch": 892} {"train_loss": -10.855903625488281, "global_step": 150015, "epoch": 892} {"train_loss": -10.174880027770996, "global_step": 150016, "epoch": 892} {"train_loss": -11.073552131652832, "global_step": 150017, "epoch": 892} {"train_loss": -10.485333442687988, "global_step": 150018, "epoch": 892} {"train_loss": -10.069178581237793, "global_step": 150019, "epoch": 892} {"train_loss": -10.946755409240723, "global_step": 150020, "epoch": 892} {"train_loss": -10.191694259643555, "global_step": 150021, "epoch": 892} {"train_loss": -10.849996566772461, "global_step": 150022, "epoch": 892} {"train_loss": -10.529139893395561, "global_step": 150023, "epoch": 892, "val_loss": 230995.203125} {"train_loss": -9.845399856567383, "global_step": 150024, "epoch": 893} {"train_loss": -10.585771560668945, "global_step": 150025, "epoch": 893} {"train_loss": -10.692617416381836, "global_step": 150026, "epoch": 893} {"train_loss": -10.28885269165039, "global_step": 150027, "epoch": 893} {"train_loss": -10.747835159301758, "global_step": 150028, "epoch": 893} {"train_loss": -10.417684555053711, "global_step": 150029, "epoch": 893} {"train_loss": -10.444999694824219, "global_step": 150030, "epoch": 893} {"train_loss": -10.57543659210205, "global_step": 150031, "epoch": 893} {"train_loss": -10.159492492675781, "global_step": 150032, "epoch": 893} {"train_loss": -10.685501098632812, "global_step": 150033, "epoch": 893} {"train_loss": -9.852081298828125, "global_step": 150034, "epoch": 893} {"train_loss": -10.423422813415527, "global_step": 150035, "epoch": 893} {"train_loss": -10.49826431274414, "global_step": 150036, "epoch": 893} {"train_loss": -10.364509582519531, "global_step": 150037, "epoch": 893} {"train_loss": -10.614644050598145, "global_step": 150038, "epoch": 893} {"train_loss": -10.490266799926758, "global_step": 150039, "epoch": 893} {"train_loss": -10.520987510681152, "global_step": 150040, "epoch": 893} {"train_loss": -10.855615615844727, "global_step": 150041, "epoch": 893} {"train_loss": -10.415497779846191, "global_step": 150042, "epoch": 893} {"train_loss": -10.863678932189941, "global_step": 150043, "epoch": 893} {"train_loss": -10.654829025268555, "global_step": 150044, "epoch": 893} {"train_loss": -11.000858306884766, "global_step": 150045, "epoch": 893} {"train_loss": -10.693866729736328, "global_step": 150046, "epoch": 893} {"train_loss": -10.771846771240234, "global_step": 150047, "epoch": 893} {"train_loss": -11.199480056762695, "global_step": 150048, "epoch": 893} {"train_loss": -10.664983749389648, "global_step": 150049, "epoch": 893} {"train_loss": -11.03201675415039, "global_step": 150050, "epoch": 893} {"train_loss": -10.806831359863281, "global_step": 150051, "epoch": 893} {"train_loss": -10.942476272583008, "global_step": 150052, "epoch": 893} {"train_loss": -10.651430130004883, "global_step": 150053, "epoch": 893} {"train_loss": -10.812235832214355, "global_step": 150054, "epoch": 893} {"train_loss": -10.921710968017578, "global_step": 150055, "epoch": 893} {"train_loss": -10.569353103637695, "global_step": 150056, "epoch": 893} {"train_loss": -10.785921096801758, "global_step": 150057, "epoch": 893} {"train_loss": -10.937021255493164, "global_step": 150058, "epoch": 893} {"train_loss": -10.570708274841309, "global_step": 150059, "epoch": 893} {"train_loss": -11.059799194335938, "global_step": 150060, "epoch": 893} {"train_loss": -10.597919464111328, "global_step": 150061, "epoch": 893} {"train_loss": -10.959800720214844, "global_step": 150062, "epoch": 893} {"train_loss": -10.729671478271484, "global_step": 150063, "epoch": 893} {"train_loss": -10.593655586242676, "global_step": 150064, "epoch": 893} {"train_loss": -10.470466613769531, "global_step": 150065, "epoch": 893} {"train_loss": -10.653924942016602, "global_step": 150066, "epoch": 893} {"train_loss": -10.805110931396484, "global_step": 150067, "epoch": 893} {"train_loss": -10.612040519714355, "global_step": 150068, "epoch": 893} {"train_loss": -11.026813507080078, "global_step": 150069, "epoch": 893} {"train_loss": -10.592597961425781, "global_step": 150070, "epoch": 893} {"train_loss": -10.880468368530273, "global_step": 150071, "epoch": 893} {"train_loss": -10.94433879852295, "global_step": 150072, "epoch": 893} {"train_loss": -10.926448822021484, "global_step": 150073, "epoch": 893} {"train_loss": -10.979194641113281, "global_step": 150074, "epoch": 893} {"train_loss": -10.849655151367188, "global_step": 150075, "epoch": 893} {"train_loss": -10.828203201293945, "global_step": 150076, "epoch": 893} {"train_loss": -11.07956314086914, "global_step": 150077, "epoch": 893} {"train_loss": -10.901274681091309, "global_step": 150078, "epoch": 893} {"train_loss": -10.870061874389648, "global_step": 150079, "epoch": 893} {"train_loss": -10.909854888916016, "global_step": 150080, "epoch": 893} {"train_loss": -10.947970390319824, "global_step": 150081, "epoch": 893} {"train_loss": -10.899182319641113, "global_step": 150082, "epoch": 893} {"train_loss": -10.96587085723877, "global_step": 150083, "epoch": 893} {"train_loss": -10.860244750976562, "global_step": 150084, "epoch": 893} {"train_loss": -10.533958435058594, "global_step": 150085, "epoch": 893} {"train_loss": -10.848224639892578, "global_step": 150086, "epoch": 893} {"train_loss": -11.11661434173584, "global_step": 150087, "epoch": 893} {"train_loss": -10.990234375, "global_step": 150088, "epoch": 893} {"train_loss": -10.978269577026367, "global_step": 150089, "epoch": 893} {"train_loss": -11.147576332092285, "global_step": 150090, "epoch": 893} {"train_loss": -10.5029296875, "global_step": 150091, "epoch": 893} {"train_loss": -9.73082160949707, "global_step": 150092, "epoch": 893} {"train_loss": -10.9054594039917, "global_step": 150093, "epoch": 893} {"train_loss": -10.312723159790039, "global_step": 150094, "epoch": 893} {"train_loss": -10.457459449768066, "global_step": 150095, "epoch": 893} {"train_loss": -11.005611419677734, "global_step": 150096, "epoch": 893} {"train_loss": -10.111549377441406, "global_step": 150097, "epoch": 893} {"train_loss": -10.001762390136719, "global_step": 150098, "epoch": 893} {"train_loss": -10.440790176391602, "global_step": 150099, "epoch": 893} {"train_loss": -10.445333480834961, "global_step": 150100, "epoch": 893} {"train_loss": -10.302364349365234, "global_step": 150101, "epoch": 893} {"train_loss": -10.276020050048828, "global_step": 150102, "epoch": 893} {"train_loss": -10.36589241027832, "global_step": 150103, "epoch": 893} {"train_loss": -10.605077743530273, "global_step": 150104, "epoch": 893} {"train_loss": -10.275718688964844, "global_step": 150105, "epoch": 893} {"train_loss": -10.127755165100098, "global_step": 150106, "epoch": 893} {"train_loss": -10.330713272094727, "global_step": 150107, "epoch": 893} {"train_loss": -10.142980575561523, "global_step": 150108, "epoch": 893} {"train_loss": -10.31493091583252, "global_step": 150109, "epoch": 893} {"train_loss": -10.498478889465332, "global_step": 150110, "epoch": 893} {"train_loss": -9.910270690917969, "global_step": 150111, "epoch": 893} {"train_loss": -10.697789192199707, "global_step": 150112, "epoch": 893} {"train_loss": -10.46458625793457, "global_step": 150113, "epoch": 893} {"train_loss": -10.54415225982666, "global_step": 150114, "epoch": 893} {"train_loss": -10.658903121948242, "global_step": 150115, "epoch": 893} {"train_loss": -10.210168838500977, "global_step": 150116, "epoch": 893} {"train_loss": -10.744199752807617, "global_step": 150117, "epoch": 893} {"train_loss": -10.614509582519531, "global_step": 150118, "epoch": 893} {"train_loss": -10.3443021774292, "global_step": 150119, "epoch": 893} {"train_loss": -10.876543045043945, "global_step": 150120, "epoch": 893} {"train_loss": -10.506301879882812, "global_step": 150121, "epoch": 893} {"train_loss": -10.396001815795898, "global_step": 150122, "epoch": 893} {"train_loss": -10.908058166503906, "global_step": 150123, "epoch": 893} {"train_loss": -10.495058059692383, "global_step": 150124, "epoch": 893} {"train_loss": -10.72717571258545, "global_step": 150125, "epoch": 893} {"train_loss": -10.605892181396484, "global_step": 150126, "epoch": 893} {"train_loss": -10.507538795471191, "global_step": 150127, "epoch": 893} {"train_loss": -10.825206756591797, "global_step": 150128, "epoch": 893} {"train_loss": -10.490256309509277, "global_step": 150129, "epoch": 893} {"train_loss": -10.546215057373047, "global_step": 150130, "epoch": 893} {"train_loss": -10.345320701599121, "global_step": 150131, "epoch": 893} {"train_loss": -10.761703491210938, "global_step": 150132, "epoch": 893} {"train_loss": -9.907045364379883, "global_step": 150133, "epoch": 893} {"train_loss": -10.426532745361328, "global_step": 150134, "epoch": 893} {"train_loss": -10.33465576171875, "global_step": 150135, "epoch": 893} {"train_loss": -10.455337524414062, "global_step": 150136, "epoch": 893} {"train_loss": -10.386713027954102, "global_step": 150137, "epoch": 893} {"train_loss": -10.090242385864258, "global_step": 150138, "epoch": 893} {"train_loss": -10.7916898727417, "global_step": 150139, "epoch": 893} {"train_loss": -9.978826522827148, "global_step": 150140, "epoch": 893} {"train_loss": -10.75464153289795, "global_step": 150141, "epoch": 893} {"train_loss": -10.413702011108398, "global_step": 150142, "epoch": 893} {"train_loss": -10.614198684692383, "global_step": 150143, "epoch": 893} {"train_loss": -10.777523040771484, "global_step": 150144, "epoch": 893} {"train_loss": -10.630241394042969, "global_step": 150145, "epoch": 893} {"train_loss": -10.395614624023438, "global_step": 150146, "epoch": 893} {"train_loss": -10.822004318237305, "global_step": 150147, "epoch": 893} {"train_loss": -10.236072540283203, "global_step": 150148, "epoch": 893} {"train_loss": -10.745380401611328, "global_step": 150149, "epoch": 893} {"train_loss": -10.580766677856445, "global_step": 150150, "epoch": 893} {"train_loss": -10.845901489257812, "global_step": 150151, "epoch": 893} {"train_loss": -10.641040802001953, "global_step": 150152, "epoch": 893} {"train_loss": -10.283284187316895, "global_step": 150153, "epoch": 893} {"train_loss": -10.43984317779541, "global_step": 150154, "epoch": 893} {"train_loss": -10.87612533569336, "global_step": 150155, "epoch": 893} {"train_loss": -10.771373748779297, "global_step": 150156, "epoch": 893} {"train_loss": -10.706676483154297, "global_step": 150157, "epoch": 893} {"train_loss": -10.722345352172852, "global_step": 150158, "epoch": 893} {"train_loss": -10.785228729248047, "global_step": 150159, "epoch": 893} {"train_loss": -10.136850357055664, "global_step": 150160, "epoch": 893} {"train_loss": -10.763362884521484, "global_step": 150161, "epoch": 893} {"train_loss": -10.089029312133789, "global_step": 150162, "epoch": 893} {"train_loss": -10.777534484863281, "global_step": 150163, "epoch": 893} {"train_loss": -10.367368698120117, "global_step": 150164, "epoch": 893} {"train_loss": -10.193412780761719, "global_step": 150165, "epoch": 893} {"train_loss": -10.872613906860352, "global_step": 150166, "epoch": 893} {"train_loss": -10.445009231567383, "global_step": 150167, "epoch": 893} {"train_loss": -10.396310806274414, "global_step": 150168, "epoch": 893} {"train_loss": -10.666258811950684, "global_step": 150169, "epoch": 893} {"train_loss": -10.944540023803711, "global_step": 150170, "epoch": 893} {"train_loss": -10.669309616088867, "global_step": 150171, "epoch": 893} {"train_loss": -10.650665283203125, "global_step": 150172, "epoch": 893} {"train_loss": -10.317943572998047, "global_step": 150173, "epoch": 893} {"train_loss": -10.782894134521484, "global_step": 150174, "epoch": 893} {"train_loss": -10.718709945678711, "global_step": 150175, "epoch": 893} {"train_loss": -10.797455787658691, "global_step": 150176, "epoch": 893} {"train_loss": -10.84223747253418, "global_step": 150177, "epoch": 893} {"train_loss": -10.908044815063477, "global_step": 150178, "epoch": 893} {"train_loss": -10.592158317565918, "global_step": 150179, "epoch": 893} {"train_loss": -10.966328620910645, "global_step": 150180, "epoch": 893} {"train_loss": -10.979244232177734, "global_step": 150181, "epoch": 893} {"train_loss": -10.801172256469727, "global_step": 150182, "epoch": 893} {"train_loss": -10.523083686828613, "global_step": 150183, "epoch": 893} {"train_loss": -10.706945419311523, "global_step": 150184, "epoch": 893} {"train_loss": -10.5906982421875, "global_step": 150185, "epoch": 893} {"train_loss": -10.294953346252441, "global_step": 150186, "epoch": 893} {"train_loss": -10.674050331115723, "global_step": 150187, "epoch": 893} {"train_loss": -9.954490661621094, "global_step": 150188, "epoch": 893} {"train_loss": -10.324028968811035, "global_step": 150189, "epoch": 893} {"train_loss": -10.057491302490234, "global_step": 150190, "epoch": 893} {"train_loss": -10.59847751117888, "global_step": 150191, "epoch": 893, "val_loss": 230016.28125} {"train_loss": -10.497061729431152, "global_step": 150192, "epoch": 894} {"train_loss": -10.281641006469727, "global_step": 150193, "epoch": 894} {"train_loss": -10.651729583740234, "global_step": 150194, "epoch": 894} {"train_loss": -10.419215202331543, "global_step": 150195, "epoch": 894} {"train_loss": -10.73868179321289, "global_step": 150196, "epoch": 894} {"train_loss": -10.344467163085938, "global_step": 150197, "epoch": 894} {"train_loss": -10.639293670654297, "global_step": 150198, "epoch": 894} {"train_loss": -10.434632301330566, "global_step": 150199, "epoch": 894} {"train_loss": -10.677027702331543, "global_step": 150200, "epoch": 894} {"train_loss": -10.63278579711914, "global_step": 150201, "epoch": 894} {"train_loss": -10.209244728088379, "global_step": 150202, "epoch": 894} {"train_loss": -10.38895320892334, "global_step": 150203, "epoch": 894} {"train_loss": -10.53945255279541, "global_step": 150204, "epoch": 894} {"train_loss": -9.764670372009277, "global_step": 150205, "epoch": 894} {"train_loss": -10.94025993347168, "global_step": 150206, "epoch": 894} {"train_loss": -9.94377326965332, "global_step": 150207, "epoch": 894} {"train_loss": -10.764127731323242, "global_step": 150208, "epoch": 894} {"train_loss": -10.657465934753418, "global_step": 150209, "epoch": 894} {"train_loss": -10.510432243347168, "global_step": 150210, "epoch": 894} {"train_loss": -10.49156665802002, "global_step": 150211, "epoch": 894} {"train_loss": -10.593790054321289, "global_step": 150212, "epoch": 894} {"train_loss": -10.399569511413574, "global_step": 150213, "epoch": 894} {"train_loss": -10.791786193847656, "global_step": 150214, "epoch": 894} {"train_loss": -10.378963470458984, "global_step": 150215, "epoch": 894} {"train_loss": -10.504202842712402, "global_step": 150216, "epoch": 894} {"train_loss": -10.748200416564941, "global_step": 150217, "epoch": 894} {"train_loss": -10.660917282104492, "global_step": 150218, "epoch": 894} {"train_loss": -10.803464889526367, "global_step": 150219, "epoch": 894} {"train_loss": -10.557666778564453, "global_step": 150220, "epoch": 894} {"train_loss": -10.671601295471191, "global_step": 150221, "epoch": 894} {"train_loss": -10.477487564086914, "global_step": 150222, "epoch": 894} {"train_loss": -10.71676254272461, "global_step": 150223, "epoch": 894} {"train_loss": -10.531201362609863, "global_step": 150224, "epoch": 894} {"train_loss": -10.804945945739746, "global_step": 150225, "epoch": 894} {"train_loss": -10.690138816833496, "global_step": 150226, "epoch": 894} {"train_loss": -10.60662841796875, "global_step": 150227, "epoch": 894} {"train_loss": -10.784689903259277, "global_step": 150228, "epoch": 894} {"train_loss": -10.884742736816406, "global_step": 150229, "epoch": 894} {"train_loss": -10.397008895874023, "global_step": 150230, "epoch": 894} {"train_loss": -10.60694408416748, "global_step": 150231, "epoch": 894} {"train_loss": -10.945759773254395, "global_step": 150232, "epoch": 894} {"train_loss": -10.460554122924805, "global_step": 150233, "epoch": 894} {"train_loss": -10.627143859863281, "global_step": 150234, "epoch": 894} {"train_loss": -10.273374557495117, "global_step": 150235, "epoch": 894} {"train_loss": -10.831062316894531, "global_step": 150236, "epoch": 894} {"train_loss": -10.457754135131836, "global_step": 150237, "epoch": 894} {"train_loss": -10.485177040100098, "global_step": 150238, "epoch": 894} {"train_loss": -10.502359390258789, "global_step": 150239, "epoch": 894} {"train_loss": -10.512011528015137, "global_step": 150240, "epoch": 894} {"train_loss": -10.695837020874023, "global_step": 150241, "epoch": 894} {"train_loss": -10.83750057220459, "global_step": 150242, "epoch": 894} {"train_loss": -10.711576461791992, "global_step": 150243, "epoch": 894} {"train_loss": -10.628621101379395, "global_step": 150244, "epoch": 894} {"train_loss": -10.858102798461914, "global_step": 150245, "epoch": 894} {"train_loss": -10.793800354003906, "global_step": 150246, "epoch": 894} {"train_loss": -10.778383255004883, "global_step": 150247, "epoch": 894} {"train_loss": -10.77344036102295, "global_step": 150248, "epoch": 894} {"train_loss": -10.559173583984375, "global_step": 150249, "epoch": 894} {"train_loss": -10.7698974609375, "global_step": 150250, "epoch": 894} {"train_loss": -10.661717414855957, "global_step": 150251, "epoch": 894} {"train_loss": -10.43263053894043, "global_step": 150252, "epoch": 894} {"train_loss": -10.69095230102539, "global_step": 150253, "epoch": 894} {"train_loss": -10.562849998474121, "global_step": 150254, "epoch": 894} {"train_loss": -10.344976425170898, "global_step": 150255, "epoch": 894} {"train_loss": -10.438464164733887, "global_step": 150256, "epoch": 894} {"train_loss": -10.60434341430664, "global_step": 150257, "epoch": 894} {"train_loss": -10.546863555908203, "global_step": 150258, "epoch": 894} {"train_loss": -10.722407341003418, "global_step": 150259, "epoch": 894} {"train_loss": -10.555912017822266, "global_step": 150260, "epoch": 894} {"train_loss": -10.246190071105957, "global_step": 150261, "epoch": 894} {"train_loss": -10.441497802734375, "global_step": 150262, "epoch": 894} {"train_loss": -9.937318801879883, "global_step": 150263, "epoch": 894} {"train_loss": -10.226261138916016, "global_step": 150264, "epoch": 894} {"train_loss": -10.384939193725586, "global_step": 150265, "epoch": 894} {"train_loss": -10.152617454528809, "global_step": 150266, "epoch": 894} {"train_loss": -10.60430908203125, "global_step": 150267, "epoch": 894} {"train_loss": -10.078803062438965, "global_step": 150268, "epoch": 894} {"train_loss": -10.230733871459961, "global_step": 150269, "epoch": 894} {"train_loss": -10.352017402648926, "global_step": 150270, "epoch": 894} {"train_loss": -10.452323913574219, "global_step": 150271, "epoch": 894} {"train_loss": -10.442281723022461, "global_step": 150272, "epoch": 894} {"train_loss": -10.722641944885254, "global_step": 150273, "epoch": 894} {"train_loss": -9.950599670410156, "global_step": 150274, "epoch": 894} {"train_loss": -10.609518051147461, "global_step": 150275, "epoch": 894} {"train_loss": -10.687612533569336, "global_step": 150276, "epoch": 894} {"train_loss": -9.694524765014648, "global_step": 150277, "epoch": 894} {"train_loss": -10.2445707321167, "global_step": 150278, "epoch": 894} {"train_loss": -10.341354370117188, "global_step": 150279, "epoch": 894} {"train_loss": -9.655208587646484, "global_step": 150280, "epoch": 894} {"train_loss": -10.074117660522461, "global_step": 150281, "epoch": 894} {"train_loss": -10.32361888885498, "global_step": 150282, "epoch": 894} {"train_loss": -10.162174224853516, "global_step": 150283, "epoch": 894} {"train_loss": -9.833688735961914, "global_step": 150284, "epoch": 894} {"train_loss": -10.086756706237793, "global_step": 150285, "epoch": 894} {"train_loss": -10.613727569580078, "global_step": 150286, "epoch": 894} {"train_loss": -10.211097717285156, "global_step": 150287, "epoch": 894} {"train_loss": -10.036164283752441, "global_step": 150288, "epoch": 894} {"train_loss": -10.751504898071289, "global_step": 150289, "epoch": 894} {"train_loss": -10.265403747558594, "global_step": 150290, "epoch": 894} {"train_loss": -10.13912582397461, "global_step": 150291, "epoch": 894} {"train_loss": -10.831271171569824, "global_step": 150292, "epoch": 894} {"train_loss": -10.770992279052734, "global_step": 150293, "epoch": 894} {"train_loss": -10.79758071899414, "global_step": 150294, "epoch": 894} {"train_loss": -10.559814453125, "global_step": 150295, "epoch": 894} {"train_loss": -10.704965591430664, "global_step": 150296, "epoch": 894} {"train_loss": -10.708943367004395, "global_step": 150297, "epoch": 894} {"train_loss": -10.762825012207031, "global_step": 150298, "epoch": 894} {"train_loss": -10.660969734191895, "global_step": 150299, "epoch": 894} {"train_loss": -10.787786483764648, "global_step": 150300, "epoch": 894} {"train_loss": -10.622817993164062, "global_step": 150301, "epoch": 894} {"train_loss": -10.914708137512207, "global_step": 150302, "epoch": 894} {"train_loss": -10.74836254119873, "global_step": 150303, "epoch": 894} {"train_loss": -10.838615417480469, "global_step": 150304, "epoch": 894} {"train_loss": -10.88398551940918, "global_step": 150305, "epoch": 894} {"train_loss": -10.672046661376953, "global_step": 150306, "epoch": 894} {"train_loss": -10.821157455444336, "global_step": 150307, "epoch": 894} {"train_loss": -10.96519660949707, "global_step": 150308, "epoch": 894} {"train_loss": -10.91169261932373, "global_step": 150309, "epoch": 894} {"train_loss": -10.960491180419922, "global_step": 150310, "epoch": 894} {"train_loss": -10.874682426452637, "global_step": 150311, "epoch": 894} {"train_loss": -10.789863586425781, "global_step": 150312, "epoch": 894} {"train_loss": -10.804679870605469, "global_step": 150313, "epoch": 894} {"train_loss": -10.746679306030273, "global_step": 150314, "epoch": 894} {"train_loss": -10.707757949829102, "global_step": 150315, "epoch": 894} {"train_loss": -10.714048385620117, "global_step": 150316, "epoch": 894} {"train_loss": -10.71155834197998, "global_step": 150317, "epoch": 894} {"train_loss": -10.708491325378418, "global_step": 150318, "epoch": 894} {"train_loss": -10.324014663696289, "global_step": 150319, "epoch": 894} {"train_loss": -10.851314544677734, "global_step": 150320, "epoch": 894} {"train_loss": -10.54574203491211, "global_step": 150321, "epoch": 894} {"train_loss": -11.137117385864258, "global_step": 150322, "epoch": 894} {"train_loss": -10.696587562561035, "global_step": 150323, "epoch": 894} {"train_loss": -10.379179954528809, "global_step": 150324, "epoch": 894} {"train_loss": -10.231163024902344, "global_step": 150325, "epoch": 894} {"train_loss": -10.428872108459473, "global_step": 150326, "epoch": 894} {"train_loss": -10.901548385620117, "global_step": 150327, "epoch": 894} {"train_loss": -10.346155166625977, "global_step": 150328, "epoch": 894} {"train_loss": -10.908281326293945, "global_step": 150329, "epoch": 894} {"train_loss": -10.639398574829102, "global_step": 150330, "epoch": 894} {"train_loss": -10.772174835205078, "global_step": 150331, "epoch": 894} {"train_loss": -10.723822593688965, "global_step": 150332, "epoch": 894} {"train_loss": -10.683916091918945, "global_step": 150333, "epoch": 894} {"train_loss": -10.676992416381836, "global_step": 150334, "epoch": 894} {"train_loss": -10.124799728393555, "global_step": 150335, "epoch": 894} {"train_loss": -10.580879211425781, "global_step": 150336, "epoch": 894} {"train_loss": -10.370918273925781, "global_step": 150337, "epoch": 894} {"train_loss": -10.846580505371094, "global_step": 150338, "epoch": 894} {"train_loss": -10.811166763305664, "global_step": 150339, "epoch": 894} {"train_loss": -10.636022567749023, "global_step": 150340, "epoch": 894} {"train_loss": -10.90396499633789, "global_step": 150341, "epoch": 894} {"train_loss": -10.474272727966309, "global_step": 150342, "epoch": 894} {"train_loss": -10.65109634399414, "global_step": 150343, "epoch": 894} {"train_loss": -10.285309791564941, "global_step": 150344, "epoch": 894} {"train_loss": -10.314104080200195, "global_step": 150345, "epoch": 894} {"train_loss": -10.606132507324219, "global_step": 150346, "epoch": 894} {"train_loss": -8.64526081085205, "global_step": 150347, "epoch": 894} {"train_loss": -10.040116310119629, "global_step": 150348, "epoch": 894} {"train_loss": -9.11825942993164, "global_step": 150349, "epoch": 894} {"train_loss": -8.936866760253906, "global_step": 150350, "epoch": 894} {"train_loss": -9.416183471679688, "global_step": 150351, "epoch": 894} {"train_loss": -9.640414237976074, "global_step": 150352, "epoch": 894} {"train_loss": -9.5684175491333, "global_step": 150353, "epoch": 894} {"train_loss": -10.198659896850586, "global_step": 150354, "epoch": 894} {"train_loss": -10.195866584777832, "global_step": 150355, "epoch": 894} {"train_loss": -9.534170150756836, "global_step": 150356, "epoch": 894} {"train_loss": -10.148216247558594, "global_step": 150357, "epoch": 894} {"train_loss": -9.818766593933105, "global_step": 150358, "epoch": 894} {"train_loss": -10.483990498951503, "global_step": 150359, "epoch": 894, "val_loss": 227919.90625} {"train_loss": -9.990761756896973, "global_step": 150360, "epoch": 895} {"train_loss": -9.796881675720215, "global_step": 150361, "epoch": 895} {"train_loss": -9.822685241699219, "global_step": 150362, "epoch": 895} {"train_loss": -10.050106048583984, "global_step": 150363, "epoch": 895} {"train_loss": -10.216813087463379, "global_step": 150364, "epoch": 895} {"train_loss": -9.885701179504395, "global_step": 150365, "epoch": 895} {"train_loss": -10.556519508361816, "global_step": 150366, "epoch": 895} {"train_loss": -10.119539260864258, "global_step": 150367, "epoch": 895} {"train_loss": -10.417633056640625, "global_step": 150368, "epoch": 895} {"train_loss": -10.409788131713867, "global_step": 150369, "epoch": 895} {"train_loss": -10.576803207397461, "global_step": 150370, "epoch": 895} {"train_loss": -10.706991195678711, "global_step": 150371, "epoch": 895} {"train_loss": -10.36109733581543, "global_step": 150372, "epoch": 895} {"train_loss": -10.670455932617188, "global_step": 150373, "epoch": 895} {"train_loss": -10.622241020202637, "global_step": 150374, "epoch": 895} {"train_loss": -10.513887405395508, "global_step": 150375, "epoch": 895} {"train_loss": -10.581888198852539, "global_step": 150376, "epoch": 895} {"train_loss": -10.706860542297363, "global_step": 150377, "epoch": 895} {"train_loss": -10.721153259277344, "global_step": 150378, "epoch": 895} {"train_loss": -10.859281539916992, "global_step": 150379, "epoch": 895} {"train_loss": -10.631603240966797, "global_step": 150380, "epoch": 895} {"train_loss": -10.781660079956055, "global_step": 150381, "epoch": 895} {"train_loss": -10.567804336547852, "global_step": 150382, "epoch": 895} {"train_loss": -10.708701133728027, "global_step": 150383, "epoch": 895} {"train_loss": -10.682787895202637, "global_step": 150384, "epoch": 895} {"train_loss": -10.786659240722656, "global_step": 150385, "epoch": 895} {"train_loss": -10.87269401550293, "global_step": 150386, "epoch": 895} {"train_loss": -10.858098983764648, "global_step": 150387, "epoch": 895} {"train_loss": -10.62929916381836, "global_step": 150388, "epoch": 895} {"train_loss": -10.904424667358398, "global_step": 150389, "epoch": 895} {"train_loss": -10.722782135009766, "global_step": 150390, "epoch": 895} {"train_loss": -10.807910919189453, "global_step": 150391, "epoch": 895} {"train_loss": -10.641155242919922, "global_step": 150392, "epoch": 895} {"train_loss": -10.698175430297852, "global_step": 150393, "epoch": 895} {"train_loss": -10.734283447265625, "global_step": 150394, "epoch": 895} {"train_loss": -10.997674942016602, "global_step": 150395, "epoch": 895} {"train_loss": -11.029075622558594, "global_step": 150396, "epoch": 895} {"train_loss": -10.840578079223633, "global_step": 150397, "epoch": 895} {"train_loss": -11.06058120727539, "global_step": 150398, "epoch": 895} {"train_loss": -11.04377555847168, "global_step": 150399, "epoch": 895} {"train_loss": -11.000904083251953, "global_step": 150400, "epoch": 895} {"train_loss": -11.053171157836914, "global_step": 150401, "epoch": 895} {"train_loss": -10.860442161560059, "global_step": 150402, "epoch": 895} {"train_loss": -10.926105499267578, "global_step": 150403, "epoch": 895} {"train_loss": -11.03457260131836, "global_step": 150404, "epoch": 895} {"train_loss": -11.242390632629395, "global_step": 150405, "epoch": 895} {"train_loss": -11.123547554016113, "global_step": 150406, "epoch": 895} {"train_loss": -11.108400344848633, "global_step": 150407, "epoch": 895} {"train_loss": -10.808353424072266, "global_step": 150408, "epoch": 895} {"train_loss": -11.123880386352539, "global_step": 150409, "epoch": 895} {"train_loss": -10.911449432373047, "global_step": 150410, "epoch": 895} {"train_loss": -11.031074523925781, "global_step": 150411, "epoch": 895} {"train_loss": -11.031530380249023, "global_step": 150412, "epoch": 895} {"train_loss": -11.105731964111328, "global_step": 150413, "epoch": 895} {"train_loss": -10.97004508972168, "global_step": 150414, "epoch": 895} {"train_loss": -10.998254776000977, "global_step": 150415, "epoch": 895} {"train_loss": -10.883405685424805, "global_step": 150416, "epoch": 895} {"train_loss": -10.724952697753906, "global_step": 150417, "epoch": 895} {"train_loss": -10.85048770904541, "global_step": 150418, "epoch": 895} {"train_loss": -10.592437744140625, "global_step": 150419, "epoch": 895} {"train_loss": -9.984320640563965, "global_step": 150420, "epoch": 895} {"train_loss": -10.386520385742188, "global_step": 150421, "epoch": 895} {"train_loss": -10.14786434173584, "global_step": 150422, "epoch": 895} {"train_loss": -10.333625793457031, "global_step": 150423, "epoch": 895} {"train_loss": -10.160476684570312, "global_step": 150424, "epoch": 895} {"train_loss": -9.413352966308594, "global_step": 150425, "epoch": 895} {"train_loss": -10.287300109863281, "global_step": 150426, "epoch": 895} {"train_loss": -9.687406539916992, "global_step": 150427, "epoch": 895} {"train_loss": -9.531364440917969, "global_step": 150428, "epoch": 895} {"train_loss": -10.302973747253418, "global_step": 150429, "epoch": 895} {"train_loss": -10.502510070800781, "global_step": 150430, "epoch": 895} {"train_loss": -10.315217971801758, "global_step": 150431, "epoch": 895} {"train_loss": -10.852521896362305, "global_step": 150432, "epoch": 895} {"train_loss": -9.938949584960938, "global_step": 150433, "epoch": 895} {"train_loss": -10.844720840454102, "global_step": 150434, "epoch": 895} {"train_loss": -10.819520950317383, "global_step": 150435, "epoch": 895} {"train_loss": -10.294321060180664, "global_step": 150436, "epoch": 895} {"train_loss": -10.830756187438965, "global_step": 150437, "epoch": 895} {"train_loss": -10.52965259552002, "global_step": 150438, "epoch": 895} {"train_loss": -10.54835033416748, "global_step": 150439, "epoch": 895} {"train_loss": -10.5173978805542, "global_step": 150440, "epoch": 895} {"train_loss": -10.460100173950195, "global_step": 150441, "epoch": 895} {"train_loss": -10.459277153015137, "global_step": 150442, "epoch": 895} {"train_loss": -10.760843276977539, "global_step": 150443, "epoch": 895} {"train_loss": -10.769830703735352, "global_step": 150444, "epoch": 895} {"train_loss": -10.865978240966797, "global_step": 150445, "epoch": 895} {"train_loss": -10.372774124145508, "global_step": 150446, "epoch": 895} {"train_loss": -10.680727005004883, "global_step": 150447, "epoch": 895} {"train_loss": -10.291467666625977, "global_step": 150448, "epoch": 895} {"train_loss": -10.760161399841309, "global_step": 150449, "epoch": 895} {"train_loss": -10.768402099609375, "global_step": 150450, "epoch": 895} {"train_loss": -10.505836486816406, "global_step": 150451, "epoch": 895} {"train_loss": -10.3120756149292, "global_step": 150452, "epoch": 895} {"train_loss": -10.684200286865234, "global_step": 150453, "epoch": 895} {"train_loss": -10.490133285522461, "global_step": 150454, "epoch": 895} {"train_loss": -10.745515823364258, "global_step": 150455, "epoch": 895} {"train_loss": -10.578765869140625, "global_step": 150456, "epoch": 895} {"train_loss": -10.450713157653809, "global_step": 150457, "epoch": 895} {"train_loss": -10.890019416809082, "global_step": 150458, "epoch": 895} {"train_loss": -10.476360321044922, "global_step": 150459, "epoch": 895} {"train_loss": -10.943421363830566, "global_step": 150460, "epoch": 895} {"train_loss": -10.62830924987793, "global_step": 150461, "epoch": 895} {"train_loss": -10.943000793457031, "global_step": 150462, "epoch": 895} {"train_loss": -10.597997665405273, "global_step": 150463, "epoch": 895} {"train_loss": -10.701156616210938, "global_step": 150464, "epoch": 895} {"train_loss": -10.529096603393555, "global_step": 150465, "epoch": 895} {"train_loss": -10.74374008178711, "global_step": 150466, "epoch": 895} {"train_loss": -10.41052532196045, "global_step": 150467, "epoch": 895} {"train_loss": -10.655658721923828, "global_step": 150468, "epoch": 895} {"train_loss": -10.655078887939453, "global_step": 150469, "epoch": 895} {"train_loss": -10.552631378173828, "global_step": 150470, "epoch": 895} {"train_loss": -10.848627090454102, "global_step": 150471, "epoch": 895} {"train_loss": -10.281439781188965, "global_step": 150472, "epoch": 895} {"train_loss": -10.927419662475586, "global_step": 150473, "epoch": 895} {"train_loss": -10.132696151733398, "global_step": 150474, "epoch": 895} {"train_loss": -10.788008689880371, "global_step": 150475, "epoch": 895} {"train_loss": -10.183819770812988, "global_step": 150476, "epoch": 895} {"train_loss": -10.680994033813477, "global_step": 150477, "epoch": 895} {"train_loss": -10.30673599243164, "global_step": 150478, "epoch": 895} {"train_loss": -10.954756736755371, "global_step": 150479, "epoch": 895} {"train_loss": -9.747754096984863, "global_step": 150480, "epoch": 895} {"train_loss": -10.803836822509766, "global_step": 150481, "epoch": 895} {"train_loss": -10.116537094116211, "global_step": 150482, "epoch": 895} {"train_loss": -10.691192626953125, "global_step": 150483, "epoch": 895} {"train_loss": -10.436126708984375, "global_step": 150484, "epoch": 895} {"train_loss": -10.545160293579102, "global_step": 150485, "epoch": 895} {"train_loss": -10.441747665405273, "global_step": 150486, "epoch": 895} {"train_loss": -10.574295043945312, "global_step": 150487, "epoch": 895} {"train_loss": -10.59574031829834, "global_step": 150488, "epoch": 895} {"train_loss": -10.407556533813477, "global_step": 150489, "epoch": 895} {"train_loss": -10.605247497558594, "global_step": 150490, "epoch": 895} {"train_loss": -10.428091049194336, "global_step": 150491, "epoch": 895} {"train_loss": -10.583259582519531, "global_step": 150492, "epoch": 895} {"train_loss": -10.647911071777344, "global_step": 150493, "epoch": 895} {"train_loss": -10.842443466186523, "global_step": 150494, "epoch": 895} {"train_loss": -10.773233413696289, "global_step": 150495, "epoch": 895} {"train_loss": -10.859416007995605, "global_step": 150496, "epoch": 895} {"train_loss": -10.600870132446289, "global_step": 150497, "epoch": 895} {"train_loss": -10.903249740600586, "global_step": 150498, "epoch": 895} {"train_loss": -11.04710865020752, "global_step": 150499, "epoch": 895} {"train_loss": -10.732820510864258, "global_step": 150500, "epoch": 895} {"train_loss": -10.80903148651123, "global_step": 150501, "epoch": 895} {"train_loss": -10.735081672668457, "global_step": 150502, "epoch": 895} {"train_loss": -10.868419647216797, "global_step": 150503, "epoch": 895} {"train_loss": -10.855578422546387, "global_step": 150504, "epoch": 895} {"train_loss": -10.791997909545898, "global_step": 150505, "epoch": 895} {"train_loss": -10.943418502807617, "global_step": 150506, "epoch": 895} {"train_loss": -10.277563095092773, "global_step": 150507, "epoch": 895} {"train_loss": -11.180864334106445, "global_step": 150508, "epoch": 895} {"train_loss": -10.45454216003418, "global_step": 150509, "epoch": 895} {"train_loss": -10.818086624145508, "global_step": 150510, "epoch": 895} {"train_loss": -10.68842887878418, "global_step": 150511, "epoch": 895} {"train_loss": -10.763967514038086, "global_step": 150512, "epoch": 895} {"train_loss": -10.892260551452637, "global_step": 150513, "epoch": 895} {"train_loss": -10.825307846069336, "global_step": 150514, "epoch": 895} {"train_loss": -10.661144256591797, "global_step": 150515, "epoch": 895} {"train_loss": -11.030794143676758, "global_step": 150516, "epoch": 895} {"train_loss": -11.178739547729492, "global_step": 150517, "epoch": 895} {"train_loss": -10.852034568786621, "global_step": 150518, "epoch": 895} {"train_loss": -10.857540130615234, "global_step": 150519, "epoch": 895} {"train_loss": -10.967096328735352, "global_step": 150520, "epoch": 895} {"train_loss": -10.93558120727539, "global_step": 150521, "epoch": 895} {"train_loss": -11.084362030029297, "global_step": 150522, "epoch": 895} {"train_loss": -10.930816650390625, "global_step": 150523, "epoch": 895} {"train_loss": -10.879112243652344, "global_step": 150524, "epoch": 895} {"train_loss": -11.105965614318848, "global_step": 150525, "epoch": 895} {"train_loss": -10.996988296508789, "global_step": 150526, "epoch": 895} {"train_loss": -10.647694076810565, "global_step": 150527, "epoch": 895, "val_loss": 231094.40625, "train_action_mse_error": 1.3307342529296875} {"train_loss": -10.827287673950195, "global_step": 150528, "epoch": 896} {"train_loss": -10.824844360351562, "global_step": 150529, "epoch": 896} {"train_loss": -10.604973793029785, "global_step": 150530, "epoch": 896} {"train_loss": -10.813356399536133, "global_step": 150531, "epoch": 896} {"train_loss": -10.45827865600586, "global_step": 150532, "epoch": 896} {"train_loss": -9.84571647644043, "global_step": 150533, "epoch": 896} {"train_loss": -9.821062088012695, "global_step": 150534, "epoch": 896} {"train_loss": -11.028173446655273, "global_step": 150535, "epoch": 896} {"train_loss": -10.599159240722656, "global_step": 150536, "epoch": 896} {"train_loss": -10.190250396728516, "global_step": 150537, "epoch": 896} {"train_loss": -9.393917083740234, "global_step": 150538, "epoch": 896} {"train_loss": -9.510214805603027, "global_step": 150539, "epoch": 896} {"train_loss": -7.605401992797852, "global_step": 150540, "epoch": 896} {"train_loss": -7.853382110595703, "global_step": 150541, "epoch": 896} {"train_loss": -9.23792552947998, "global_step": 150542, "epoch": 896} {"train_loss": -5.521332740783691, "global_step": 150543, "epoch": 896} {"train_loss": -8.628372192382812, "global_step": 150544, "epoch": 896} {"train_loss": -7.883530139923096, "global_step": 150545, "epoch": 896} {"train_loss": -10.022514343261719, "global_step": 150546, "epoch": 896} {"train_loss": -8.774422645568848, "global_step": 150547, "epoch": 896} {"train_loss": -10.327890396118164, "global_step": 150548, "epoch": 896} {"train_loss": -9.619001388549805, "global_step": 150549, "epoch": 896} {"train_loss": -9.256689071655273, "global_step": 150550, "epoch": 896} {"train_loss": -10.125115394592285, "global_step": 150551, "epoch": 896} {"train_loss": -9.743646621704102, "global_step": 150552, "epoch": 896} {"train_loss": -9.507564544677734, "global_step": 150553, "epoch": 896} {"train_loss": -10.108430862426758, "global_step": 150554, "epoch": 896} {"train_loss": -10.093297004699707, "global_step": 150555, "epoch": 896} {"train_loss": -10.117448806762695, "global_step": 150556, "epoch": 896} {"train_loss": -10.135612487792969, "global_step": 150557, "epoch": 896} {"train_loss": -10.256065368652344, "global_step": 150558, "epoch": 896} {"train_loss": -10.46912670135498, "global_step": 150559, "epoch": 896} {"train_loss": -9.946069717407227, "global_step": 150560, "epoch": 896} {"train_loss": -10.107160568237305, "global_step": 150561, "epoch": 896} {"train_loss": -10.293176651000977, "global_step": 150562, "epoch": 896} {"train_loss": -10.157175064086914, "global_step": 150563, "epoch": 896} {"train_loss": -10.037084579467773, "global_step": 150564, "epoch": 896} {"train_loss": -10.262664794921875, "global_step": 150565, "epoch": 896} {"train_loss": -10.215456008911133, "global_step": 150566, "epoch": 896} {"train_loss": -10.545345306396484, "global_step": 150567, "epoch": 896} {"train_loss": -10.289140701293945, "global_step": 150568, "epoch": 896} {"train_loss": -10.18974494934082, "global_step": 150569, "epoch": 896} {"train_loss": -10.603504180908203, "global_step": 150570, "epoch": 896} {"train_loss": -10.436614990234375, "global_step": 150571, "epoch": 896} {"train_loss": -10.479873657226562, "global_step": 150572, "epoch": 896} {"train_loss": -10.719070434570312, "global_step": 150573, "epoch": 896} {"train_loss": -10.593520164489746, "global_step": 150574, "epoch": 896} {"train_loss": -10.548273086547852, "global_step": 150575, "epoch": 896} {"train_loss": -10.684282302856445, "global_step": 150576, "epoch": 896} {"train_loss": -10.772699356079102, "global_step": 150577, "epoch": 896} {"train_loss": -10.841553688049316, "global_step": 150578, "epoch": 896} {"train_loss": -10.515035629272461, "global_step": 150579, "epoch": 896} {"train_loss": -10.583869934082031, "global_step": 150580, "epoch": 896} {"train_loss": -10.885001182556152, "global_step": 150581, "epoch": 896} {"train_loss": -10.677759170532227, "global_step": 150582, "epoch": 896} {"train_loss": -10.759684562683105, "global_step": 150583, "epoch": 896} {"train_loss": -10.76972770690918, "global_step": 150584, "epoch": 896} {"train_loss": -10.701284408569336, "global_step": 150585, "epoch": 896} {"train_loss": -10.905050277709961, "global_step": 150586, "epoch": 896} {"train_loss": -10.912302017211914, "global_step": 150587, "epoch": 896} {"train_loss": -10.640645980834961, "global_step": 150588, "epoch": 896} {"train_loss": -10.947080612182617, "global_step": 150589, "epoch": 896} {"train_loss": -10.767681121826172, "global_step": 150590, "epoch": 896} {"train_loss": -10.917492866516113, "global_step": 150591, "epoch": 896} {"train_loss": -10.705511093139648, "global_step": 150592, "epoch": 896} {"train_loss": -10.908087730407715, "global_step": 150593, "epoch": 896} {"train_loss": -10.978900909423828, "global_step": 150594, "epoch": 896} {"train_loss": -10.783090591430664, "global_step": 150595, "epoch": 896} {"train_loss": -10.849034309387207, "global_step": 150596, "epoch": 896} {"train_loss": -10.895896911621094, "global_step": 150597, "epoch": 896} {"train_loss": -11.197961807250977, "global_step": 150598, "epoch": 896} {"train_loss": -10.845799446105957, "global_step": 150599, "epoch": 896} {"train_loss": -10.975605010986328, "global_step": 150600, "epoch": 896} {"train_loss": -10.99653434753418, "global_step": 150601, "epoch": 896} {"train_loss": -11.148924827575684, "global_step": 150602, "epoch": 896} {"train_loss": -11.075380325317383, "global_step": 150603, "epoch": 896} {"train_loss": -11.02322769165039, "global_step": 150604, "epoch": 896} {"train_loss": -11.217046737670898, "global_step": 150605, "epoch": 896} {"train_loss": -11.110958099365234, "global_step": 150606, "epoch": 896} {"train_loss": -11.000748634338379, "global_step": 150607, "epoch": 896} {"train_loss": -10.942720413208008, "global_step": 150608, "epoch": 896} {"train_loss": -10.910829544067383, "global_step": 150609, "epoch": 896} {"train_loss": -10.961145401000977, "global_step": 150610, "epoch": 896} {"train_loss": -10.88869857788086, "global_step": 150611, "epoch": 896} {"train_loss": -11.190552711486816, "global_step": 150612, "epoch": 896} {"train_loss": -10.894451141357422, "global_step": 150613, "epoch": 896} {"train_loss": -10.855667114257812, "global_step": 150614, "epoch": 896} {"train_loss": -10.141439437866211, "global_step": 150615, "epoch": 896} {"train_loss": -9.992637634277344, "global_step": 150616, "epoch": 896} {"train_loss": -10.86235237121582, "global_step": 150617, "epoch": 896} {"train_loss": -10.907432556152344, "global_step": 150618, "epoch": 896} {"train_loss": -10.871511459350586, "global_step": 150619, "epoch": 896} {"train_loss": -10.226625442504883, "global_step": 150620, "epoch": 896} {"train_loss": -10.412784576416016, "global_step": 150621, "epoch": 896} {"train_loss": -10.3090238571167, "global_step": 150622, "epoch": 896} {"train_loss": -10.722713470458984, "global_step": 150623, "epoch": 896} {"train_loss": -11.102882385253906, "global_step": 150624, "epoch": 896} {"train_loss": -10.572183609008789, "global_step": 150625, "epoch": 896} {"train_loss": -10.826608657836914, "global_step": 150626, "epoch": 896} {"train_loss": -10.635035514831543, "global_step": 150627, "epoch": 896} {"train_loss": -10.842682838439941, "global_step": 150628, "epoch": 896} {"train_loss": -10.797569274902344, "global_step": 150629, "epoch": 896} {"train_loss": -10.984952926635742, "global_step": 150630, "epoch": 896} {"train_loss": -10.846108436584473, "global_step": 150631, "epoch": 896} {"train_loss": -10.705971717834473, "global_step": 150632, "epoch": 896} {"train_loss": -10.899188041687012, "global_step": 150633, "epoch": 896} {"train_loss": -10.439773559570312, "global_step": 150634, "epoch": 896} {"train_loss": -10.965740203857422, "global_step": 150635, "epoch": 896} {"train_loss": -10.348950386047363, "global_step": 150636, "epoch": 896} {"train_loss": -10.51417064666748, "global_step": 150637, "epoch": 896} {"train_loss": -10.263187408447266, "global_step": 150638, "epoch": 896} {"train_loss": -10.117471694946289, "global_step": 150639, "epoch": 896} {"train_loss": -10.105911254882812, "global_step": 150640, "epoch": 896} {"train_loss": -10.555395126342773, "global_step": 150641, "epoch": 896} {"train_loss": -9.88896369934082, "global_step": 150642, "epoch": 896} {"train_loss": -10.634515762329102, "global_step": 150643, "epoch": 896} {"train_loss": -10.29471206665039, "global_step": 150644, "epoch": 896} {"train_loss": -10.553302764892578, "global_step": 150645, "epoch": 896} {"train_loss": -10.836480140686035, "global_step": 150646, "epoch": 896} {"train_loss": -10.413934707641602, "global_step": 150647, "epoch": 896} {"train_loss": -10.540326118469238, "global_step": 150648, "epoch": 896} {"train_loss": -10.75314712524414, "global_step": 150649, "epoch": 896} {"train_loss": -10.329761505126953, "global_step": 150650, "epoch": 896} {"train_loss": -10.102090835571289, "global_step": 150651, "epoch": 896} {"train_loss": -10.346651077270508, "global_step": 150652, "epoch": 896} {"train_loss": -9.46849250793457, "global_step": 150653, "epoch": 896} {"train_loss": -10.56135368347168, "global_step": 150654, "epoch": 896} {"train_loss": -9.47402572631836, "global_step": 150655, "epoch": 896} {"train_loss": -10.227829933166504, "global_step": 150656, "epoch": 896} {"train_loss": -10.727986335754395, "global_step": 150657, "epoch": 896} {"train_loss": -9.992897033691406, "global_step": 150658, "epoch": 896} {"train_loss": -10.617210388183594, "global_step": 150659, "epoch": 896} {"train_loss": -10.563640594482422, "global_step": 150660, "epoch": 896} {"train_loss": -10.390326499938965, "global_step": 150661, "epoch": 896} {"train_loss": -10.580795288085938, "global_step": 150662, "epoch": 896} {"train_loss": -10.714085578918457, "global_step": 150663, "epoch": 896} {"train_loss": -10.152128219604492, "global_step": 150664, "epoch": 896} {"train_loss": -10.592979431152344, "global_step": 150665, "epoch": 896} {"train_loss": -10.297323226928711, "global_step": 150666, "epoch": 896} {"train_loss": -10.636088371276855, "global_step": 150667, "epoch": 896} {"train_loss": -10.617389678955078, "global_step": 150668, "epoch": 896} {"train_loss": -10.464571952819824, "global_step": 150669, "epoch": 896} {"train_loss": -10.523347854614258, "global_step": 150670, "epoch": 896} {"train_loss": -10.574518203735352, "global_step": 150671, "epoch": 896} {"train_loss": -10.600471496582031, "global_step": 150672, "epoch": 896} {"train_loss": -10.791215896606445, "global_step": 150673, "epoch": 896} {"train_loss": -10.524537086486816, "global_step": 150674, "epoch": 896} {"train_loss": -10.730621337890625, "global_step": 150675, "epoch": 896} {"train_loss": -10.709064483642578, "global_step": 150676, "epoch": 896} {"train_loss": -10.763046264648438, "global_step": 150677, "epoch": 896} {"train_loss": -10.67734146118164, "global_step": 150678, "epoch": 896} {"train_loss": -10.910100936889648, "global_step": 150679, "epoch": 896} {"train_loss": -10.778711318969727, "global_step": 150680, "epoch": 896} {"train_loss": -10.435026168823242, "global_step": 150681, "epoch": 896} {"train_loss": -10.81020450592041, "global_step": 150682, "epoch": 896} {"train_loss": -10.700725555419922, "global_step": 150683, "epoch": 896} {"train_loss": -10.88187313079834, "global_step": 150684, "epoch": 896} {"train_loss": -10.696562767028809, "global_step": 150685, "epoch": 896} {"train_loss": -10.831632614135742, "global_step": 150686, "epoch": 896} {"train_loss": -10.818675994873047, "global_step": 150687, "epoch": 896} {"train_loss": -10.736198425292969, "global_step": 150688, "epoch": 896} {"train_loss": -10.889091491699219, "global_step": 150689, "epoch": 896} {"train_loss": -10.566455841064453, "global_step": 150690, "epoch": 896} {"train_loss": -10.858989715576172, "global_step": 150691, "epoch": 896} {"train_loss": -10.844490051269531, "global_step": 150692, "epoch": 896} {"train_loss": -10.922103881835938, "global_step": 150693, "epoch": 896} {"train_loss": -10.897808074951172, "global_step": 150694, "epoch": 896} {"train_loss": -10.448188495068322, "global_step": 150695, "epoch": 896, "val_loss": 222529.125} {"train_loss": -11.207902908325195, "global_step": 150696, "epoch": 897} {"train_loss": -10.712457656860352, "global_step": 150697, "epoch": 897} {"train_loss": -10.905694961547852, "global_step": 150698, "epoch": 897} {"train_loss": -10.451136589050293, "global_step": 150699, "epoch": 897} {"train_loss": -10.969014167785645, "global_step": 150700, "epoch": 897} {"train_loss": -10.359068870544434, "global_step": 150701, "epoch": 897} {"train_loss": -10.963472366333008, "global_step": 150702, "epoch": 897} {"train_loss": -10.943929672241211, "global_step": 150703, "epoch": 897} {"train_loss": -10.708656311035156, "global_step": 150704, "epoch": 897} {"train_loss": -10.892991065979004, "global_step": 150705, "epoch": 897} {"train_loss": -10.547828674316406, "global_step": 150706, "epoch": 897} {"train_loss": -10.643362998962402, "global_step": 150707, "epoch": 897} {"train_loss": -10.697427749633789, "global_step": 150708, "epoch": 897} {"train_loss": -10.828977584838867, "global_step": 150709, "epoch": 897} {"train_loss": -10.872539520263672, "global_step": 150710, "epoch": 897} {"train_loss": -10.654034614562988, "global_step": 150711, "epoch": 897} {"train_loss": -10.65388298034668, "global_step": 150712, "epoch": 897} {"train_loss": -10.666143417358398, "global_step": 150713, "epoch": 897} {"train_loss": -10.470993041992188, "global_step": 150714, "epoch": 897} {"train_loss": -10.647281646728516, "global_step": 150715, "epoch": 897} {"train_loss": -9.839581489562988, "global_step": 150716, "epoch": 897} {"train_loss": -10.704383850097656, "global_step": 150717, "epoch": 897} {"train_loss": -10.561887741088867, "global_step": 150718, "epoch": 897} {"train_loss": -10.416468620300293, "global_step": 150719, "epoch": 897} {"train_loss": -10.699014663696289, "global_step": 150720, "epoch": 897} {"train_loss": -10.2440185546875, "global_step": 150721, "epoch": 897} {"train_loss": -10.716588973999023, "global_step": 150722, "epoch": 897} {"train_loss": -10.475939750671387, "global_step": 150723, "epoch": 897} {"train_loss": -10.536584854125977, "global_step": 150724, "epoch": 897} {"train_loss": -10.919061660766602, "global_step": 150725, "epoch": 897} {"train_loss": -10.407318115234375, "global_step": 150726, "epoch": 897} {"train_loss": -10.68195915222168, "global_step": 150727, "epoch": 897} {"train_loss": -10.740982055664062, "global_step": 150728, "epoch": 897} {"train_loss": -10.458526611328125, "global_step": 150729, "epoch": 897} {"train_loss": -10.59153938293457, "global_step": 150730, "epoch": 897} {"train_loss": -10.555256843566895, "global_step": 150731, "epoch": 897} {"train_loss": -10.772176742553711, "global_step": 150732, "epoch": 897} {"train_loss": -10.505845069885254, "global_step": 150733, "epoch": 897} {"train_loss": -10.889842987060547, "global_step": 150734, "epoch": 897} {"train_loss": -10.70075798034668, "global_step": 150735, "epoch": 897} {"train_loss": -10.756275177001953, "global_step": 150736, "epoch": 897} {"train_loss": -10.655113220214844, "global_step": 150737, "epoch": 897} {"train_loss": -10.469919204711914, "global_step": 150738, "epoch": 897} {"train_loss": -10.991748809814453, "global_step": 150739, "epoch": 897} {"train_loss": -10.553534507751465, "global_step": 150740, "epoch": 897} {"train_loss": -10.379629135131836, "global_step": 150741, "epoch": 897} {"train_loss": -10.58989143371582, "global_step": 150742, "epoch": 897} {"train_loss": -10.5888090133667, "global_step": 150743, "epoch": 897} {"train_loss": -10.955562591552734, "global_step": 150744, "epoch": 897} {"train_loss": -10.759087562561035, "global_step": 150745, "epoch": 897} {"train_loss": -10.95870590209961, "global_step": 150746, "epoch": 897} {"train_loss": -10.664054870605469, "global_step": 150747, "epoch": 897} {"train_loss": -10.360251426696777, "global_step": 150748, "epoch": 897} {"train_loss": -10.744070053100586, "global_step": 150749, "epoch": 897} {"train_loss": -10.55860424041748, "global_step": 150750, "epoch": 897} {"train_loss": -10.723358154296875, "global_step": 150751, "epoch": 897} {"train_loss": -10.593353271484375, "global_step": 150752, "epoch": 897} {"train_loss": -10.921989440917969, "global_step": 150753, "epoch": 897} {"train_loss": -10.594616889953613, "global_step": 150754, "epoch": 897} {"train_loss": -10.765257835388184, "global_step": 150755, "epoch": 897} {"train_loss": -10.681218147277832, "global_step": 150756, "epoch": 897} {"train_loss": -10.92114543914795, "global_step": 150757, "epoch": 897} {"train_loss": -10.722746849060059, "global_step": 150758, "epoch": 897} {"train_loss": -10.778830528259277, "global_step": 150759, "epoch": 897} {"train_loss": -10.928452491760254, "global_step": 150760, "epoch": 897} {"train_loss": -10.79665756225586, "global_step": 150761, "epoch": 897} {"train_loss": -10.920321464538574, "global_step": 150762, "epoch": 897} {"train_loss": -11.012248992919922, "global_step": 150763, "epoch": 897} {"train_loss": -10.935099601745605, "global_step": 150764, "epoch": 897} {"train_loss": -10.947973251342773, "global_step": 150765, "epoch": 897} {"train_loss": -10.763740539550781, "global_step": 150766, "epoch": 897} {"train_loss": -10.902276039123535, "global_step": 150767, "epoch": 897} {"train_loss": -10.851856231689453, "global_step": 150768, "epoch": 897} {"train_loss": -10.92222785949707, "global_step": 150769, "epoch": 897} {"train_loss": -10.91627025604248, "global_step": 150770, "epoch": 897} {"train_loss": -10.791093826293945, "global_step": 150771, "epoch": 897} {"train_loss": -10.908232688903809, "global_step": 150772, "epoch": 897} {"train_loss": -11.006662368774414, "global_step": 150773, "epoch": 897} {"train_loss": -10.810699462890625, "global_step": 150774, "epoch": 897} {"train_loss": -10.987668991088867, "global_step": 150775, "epoch": 897} {"train_loss": -10.974370956420898, "global_step": 150776, "epoch": 897} {"train_loss": -10.89097785949707, "global_step": 150777, "epoch": 897} {"train_loss": -10.812597274780273, "global_step": 150778, "epoch": 897} {"train_loss": -10.778382301330566, "global_step": 150779, "epoch": 897} {"train_loss": -10.710895538330078, "global_step": 150780, "epoch": 897} {"train_loss": -10.894173622131348, "global_step": 150781, "epoch": 897} {"train_loss": -10.894918441772461, "global_step": 150782, "epoch": 897} {"train_loss": -10.729949951171875, "global_step": 150783, "epoch": 897} {"train_loss": -10.866151809692383, "global_step": 150784, "epoch": 897} {"train_loss": -10.945012092590332, "global_step": 150785, "epoch": 897} {"train_loss": -10.638930320739746, "global_step": 150786, "epoch": 897} {"train_loss": -10.76760482788086, "global_step": 150787, "epoch": 897} {"train_loss": -11.113804817199707, "global_step": 150788, "epoch": 897} {"train_loss": -10.446476936340332, "global_step": 150789, "epoch": 897} {"train_loss": -10.496976852416992, "global_step": 150790, "epoch": 897} {"train_loss": -10.691629409790039, "global_step": 150791, "epoch": 897} {"train_loss": -10.742891311645508, "global_step": 150792, "epoch": 897} {"train_loss": -8.961372375488281, "global_step": 150793, "epoch": 897} {"train_loss": -9.735942840576172, "global_step": 150794, "epoch": 897} {"train_loss": -10.253532409667969, "global_step": 150795, "epoch": 897} {"train_loss": -8.76494026184082, "global_step": 150796, "epoch": 897} {"train_loss": -10.426582336425781, "global_step": 150797, "epoch": 897} {"train_loss": -9.467866897583008, "global_step": 150798, "epoch": 897} {"train_loss": -9.938961029052734, "global_step": 150799, "epoch": 897} {"train_loss": -10.327340126037598, "global_step": 150800, "epoch": 897} {"train_loss": -9.920490264892578, "global_step": 150801, "epoch": 897} {"train_loss": -10.62750244140625, "global_step": 150802, "epoch": 897} {"train_loss": -10.22165298461914, "global_step": 150803, "epoch": 897} {"train_loss": -10.27275276184082, "global_step": 150804, "epoch": 897} {"train_loss": -10.283487319946289, "global_step": 150805, "epoch": 897} {"train_loss": -10.373279571533203, "global_step": 150806, "epoch": 897} {"train_loss": -10.141288757324219, "global_step": 150807, "epoch": 897} {"train_loss": -10.663265228271484, "global_step": 150808, "epoch": 897} {"train_loss": -10.300010681152344, "global_step": 150809, "epoch": 897} {"train_loss": -10.397665977478027, "global_step": 150810, "epoch": 897} {"train_loss": -10.496572494506836, "global_step": 150811, "epoch": 897} {"train_loss": -10.57093334197998, "global_step": 150812, "epoch": 897} {"train_loss": -10.536808013916016, "global_step": 150813, "epoch": 897} {"train_loss": -10.618399620056152, "global_step": 150814, "epoch": 897} {"train_loss": -10.719056129455566, "global_step": 150815, "epoch": 897} {"train_loss": -10.579874992370605, "global_step": 150816, "epoch": 897} {"train_loss": -10.644990921020508, "global_step": 150817, "epoch": 897} {"train_loss": -10.79580307006836, "global_step": 150818, "epoch": 897} {"train_loss": -10.701881408691406, "global_step": 150819, "epoch": 897} {"train_loss": -10.767074584960938, "global_step": 150820, "epoch": 897} {"train_loss": -10.69961166381836, "global_step": 150821, "epoch": 897} {"train_loss": -10.631868362426758, "global_step": 150822, "epoch": 897} {"train_loss": -10.81877326965332, "global_step": 150823, "epoch": 897} {"train_loss": -10.819013595581055, "global_step": 150824, "epoch": 897} {"train_loss": -10.793106079101562, "global_step": 150825, "epoch": 897} {"train_loss": -10.782959938049316, "global_step": 150826, "epoch": 897} {"train_loss": -10.64531135559082, "global_step": 150827, "epoch": 897} {"train_loss": -10.833823204040527, "global_step": 150828, "epoch": 897} {"train_loss": -10.812457084655762, "global_step": 150829, "epoch": 897} {"train_loss": -10.740096092224121, "global_step": 150830, "epoch": 897} {"train_loss": -10.94471263885498, "global_step": 150831, "epoch": 897} {"train_loss": -10.671165466308594, "global_step": 150832, "epoch": 897} {"train_loss": -10.976848602294922, "global_step": 150833, "epoch": 897} {"train_loss": -10.356558799743652, "global_step": 150834, "epoch": 897} {"train_loss": -10.803243637084961, "global_step": 150835, "epoch": 897} {"train_loss": -10.78607177734375, "global_step": 150836, "epoch": 897} {"train_loss": -10.389646530151367, "global_step": 150837, "epoch": 897} {"train_loss": -10.841326713562012, "global_step": 150838, "epoch": 897} {"train_loss": -10.954099655151367, "global_step": 150839, "epoch": 897} {"train_loss": -10.53567123413086, "global_step": 150840, "epoch": 897} {"train_loss": -10.968537330627441, "global_step": 150841, "epoch": 897} {"train_loss": -10.535255432128906, "global_step": 150842, "epoch": 897} {"train_loss": -10.719858169555664, "global_step": 150843, "epoch": 897} {"train_loss": -10.846907615661621, "global_step": 150844, "epoch": 897} {"train_loss": -10.798739433288574, "global_step": 150845, "epoch": 897} {"train_loss": -11.053739547729492, "global_step": 150846, "epoch": 897} {"train_loss": -10.717184066772461, "global_step": 150847, "epoch": 897} {"train_loss": -11.035116195678711, "global_step": 150848, "epoch": 897} {"train_loss": -10.359640121459961, "global_step": 150849, "epoch": 897} {"train_loss": -10.676719665527344, "global_step": 150850, "epoch": 897} {"train_loss": -10.971805572509766, "global_step": 150851, "epoch": 897} {"train_loss": -10.625539779663086, "global_step": 150852, "epoch": 897} {"train_loss": -10.487306594848633, "global_step": 150853, "epoch": 897} {"train_loss": -10.940864562988281, "global_step": 150854, "epoch": 897} {"train_loss": -10.593121528625488, "global_step": 150855, "epoch": 897} {"train_loss": -10.918556213378906, "global_step": 150856, "epoch": 897} {"train_loss": -10.83460807800293, "global_step": 150857, "epoch": 897} {"train_loss": -10.870546340942383, "global_step": 150858, "epoch": 897} {"train_loss": -10.723541259765625, "global_step": 150859, "epoch": 897} {"train_loss": -10.9444580078125, "global_step": 150860, "epoch": 897} {"train_loss": -10.844278335571289, "global_step": 150861, "epoch": 897} {"train_loss": -10.959754943847656, "global_step": 150862, "epoch": 897} {"train_loss": -10.66305851368677, "global_step": 150863, "epoch": 897, "val_loss": 225358.96875} {"train_loss": -10.654777526855469, "global_step": 150864, "epoch": 898} {"train_loss": -10.788383483886719, "global_step": 150865, "epoch": 898} {"train_loss": -10.707382202148438, "global_step": 150866, "epoch": 898} {"train_loss": -10.930286407470703, "global_step": 150867, "epoch": 898} {"train_loss": -10.78292465209961, "global_step": 150868, "epoch": 898} {"train_loss": -10.787995338439941, "global_step": 150869, "epoch": 898} {"train_loss": -10.732906341552734, "global_step": 150870, "epoch": 898} {"train_loss": -10.737756729125977, "global_step": 150871, "epoch": 898} {"train_loss": -10.622692108154297, "global_step": 150872, "epoch": 898} {"train_loss": -10.7807035446167, "global_step": 150873, "epoch": 898} {"train_loss": -10.467620849609375, "global_step": 150874, "epoch": 898} {"train_loss": -10.79556655883789, "global_step": 150875, "epoch": 898} {"train_loss": -10.555665016174316, "global_step": 150876, "epoch": 898} {"train_loss": -10.945072174072266, "global_step": 150877, "epoch": 898} {"train_loss": -10.432567596435547, "global_step": 150878, "epoch": 898} {"train_loss": -10.747272491455078, "global_step": 150879, "epoch": 898} {"train_loss": -10.142271041870117, "global_step": 150880, "epoch": 898} {"train_loss": -9.818949699401855, "global_step": 150881, "epoch": 898} {"train_loss": -9.699880599975586, "global_step": 150882, "epoch": 898} {"train_loss": -9.087311744689941, "global_step": 150883, "epoch": 898} {"train_loss": -9.22723388671875, "global_step": 150884, "epoch": 898} {"train_loss": -9.859643936157227, "global_step": 150885, "epoch": 898} {"train_loss": -9.387418746948242, "global_step": 150886, "epoch": 898} {"train_loss": -10.163596153259277, "global_step": 150887, "epoch": 898} {"train_loss": -9.958427429199219, "global_step": 150888, "epoch": 898} {"train_loss": -9.813753128051758, "global_step": 150889, "epoch": 898} {"train_loss": -10.231829643249512, "global_step": 150890, "epoch": 898} {"train_loss": -9.494638442993164, "global_step": 150891, "epoch": 898} {"train_loss": -9.258926391601562, "global_step": 150892, "epoch": 898} {"train_loss": -10.372127532958984, "global_step": 150893, "epoch": 898} {"train_loss": -8.750711441040039, "global_step": 150894, "epoch": 898} {"train_loss": -9.278090476989746, "global_step": 150895, "epoch": 898} {"train_loss": -10.269989013671875, "global_step": 150896, "epoch": 898} {"train_loss": -9.695660591125488, "global_step": 150897, "epoch": 898} {"train_loss": -9.00027084350586, "global_step": 150898, "epoch": 898} {"train_loss": -10.350469589233398, "global_step": 150899, "epoch": 898} {"train_loss": -10.01815414428711, "global_step": 150900, "epoch": 898} {"train_loss": -9.444072723388672, "global_step": 150901, "epoch": 898} {"train_loss": -10.345861434936523, "global_step": 150902, "epoch": 898} {"train_loss": -9.930498123168945, "global_step": 150903, "epoch": 898} {"train_loss": -9.860108375549316, "global_step": 150904, "epoch": 898} {"train_loss": -10.018420219421387, "global_step": 150905, "epoch": 898} {"train_loss": -10.277750015258789, "global_step": 150906, "epoch": 898} {"train_loss": -10.089178085327148, "global_step": 150907, "epoch": 898} {"train_loss": -10.124832153320312, "global_step": 150908, "epoch": 898} {"train_loss": -10.404787063598633, "global_step": 150909, "epoch": 898} {"train_loss": -10.090269088745117, "global_step": 150910, "epoch": 898} {"train_loss": -10.634597778320312, "global_step": 150911, "epoch": 898} {"train_loss": -10.020698547363281, "global_step": 150912, "epoch": 898} {"train_loss": -10.475879669189453, "global_step": 150913, "epoch": 898} {"train_loss": -10.450664520263672, "global_step": 150914, "epoch": 898} {"train_loss": -10.321674346923828, "global_step": 150915, "epoch": 898} {"train_loss": -10.41309928894043, "global_step": 150916, "epoch": 898} {"train_loss": -10.479818344116211, "global_step": 150917, "epoch": 898} {"train_loss": -10.450699806213379, "global_step": 150918, "epoch": 898} {"train_loss": -10.616334915161133, "global_step": 150919, "epoch": 898} {"train_loss": -10.558141708374023, "global_step": 150920, "epoch": 898} {"train_loss": -10.772909164428711, "global_step": 150921, "epoch": 898} {"train_loss": -10.690254211425781, "global_step": 150922, "epoch": 898} {"train_loss": -10.496025085449219, "global_step": 150923, "epoch": 898} {"train_loss": -10.67711353302002, "global_step": 150924, "epoch": 898} {"train_loss": -10.651433944702148, "global_step": 150925, "epoch": 898} {"train_loss": -10.669393539428711, "global_step": 150926, "epoch": 898} {"train_loss": -10.597662925720215, "global_step": 150927, "epoch": 898} {"train_loss": -10.46845817565918, "global_step": 150928, "epoch": 898} {"train_loss": -10.729419708251953, "global_step": 150929, "epoch": 898} {"train_loss": -10.736464500427246, "global_step": 150930, "epoch": 898} {"train_loss": -10.58456802368164, "global_step": 150931, "epoch": 898} {"train_loss": -10.833610534667969, "global_step": 150932, "epoch": 898} {"train_loss": -10.796926498413086, "global_step": 150933, "epoch": 898} {"train_loss": -10.752395629882812, "global_step": 150934, "epoch": 898} {"train_loss": -10.763080596923828, "global_step": 150935, "epoch": 898} {"train_loss": -10.888336181640625, "global_step": 150936, "epoch": 898} {"train_loss": -10.679521560668945, "global_step": 150937, "epoch": 898} {"train_loss": -10.937549591064453, "global_step": 150938, "epoch": 898} {"train_loss": -10.818193435668945, "global_step": 150939, "epoch": 898} {"train_loss": -10.777650833129883, "global_step": 150940, "epoch": 898} {"train_loss": -10.943580627441406, "global_step": 150941, "epoch": 898} {"train_loss": -10.857949256896973, "global_step": 150942, "epoch": 898} {"train_loss": -11.01125717163086, "global_step": 150943, "epoch": 898} {"train_loss": -11.071608543395996, "global_step": 150944, "epoch": 898} {"train_loss": -11.040019989013672, "global_step": 150945, "epoch": 898} {"train_loss": -10.956287384033203, "global_step": 150946, "epoch": 898} {"train_loss": -11.25898265838623, "global_step": 150947, "epoch": 898} {"train_loss": -11.051900863647461, "global_step": 150948, "epoch": 898} {"train_loss": -10.854650497436523, "global_step": 150949, "epoch": 898} {"train_loss": -11.006696701049805, "global_step": 150950, "epoch": 898} {"train_loss": -11.01430606842041, "global_step": 150951, "epoch": 898} {"train_loss": -10.952481269836426, "global_step": 150952, "epoch": 898} {"train_loss": -11.203533172607422, "global_step": 150953, "epoch": 898} {"train_loss": -11.067540168762207, "global_step": 150954, "epoch": 898} {"train_loss": -10.785351753234863, "global_step": 150955, "epoch": 898} {"train_loss": -11.230767250061035, "global_step": 150956, "epoch": 898} {"train_loss": -11.194721221923828, "global_step": 150957, "epoch": 898} {"train_loss": -10.885232925415039, "global_step": 150958, "epoch": 898} {"train_loss": -11.331491470336914, "global_step": 150959, "epoch": 898} {"train_loss": -11.306343078613281, "global_step": 150960, "epoch": 898} {"train_loss": -11.333674430847168, "global_step": 150961, "epoch": 898} {"train_loss": -10.942132949829102, "global_step": 150962, "epoch": 898} {"train_loss": -11.012895584106445, "global_step": 150963, "epoch": 898} {"train_loss": -11.057876586914062, "global_step": 150964, "epoch": 898} {"train_loss": -11.309319496154785, "global_step": 150965, "epoch": 898} {"train_loss": -11.191780090332031, "global_step": 150966, "epoch": 898} {"train_loss": -10.663307189941406, "global_step": 150967, "epoch": 898} {"train_loss": -9.964781761169434, "global_step": 150968, "epoch": 898} {"train_loss": -10.516633987426758, "global_step": 150969, "epoch": 898} {"train_loss": -9.49018669128418, "global_step": 150970, "epoch": 898} {"train_loss": -9.432548522949219, "global_step": 150971, "epoch": 898} {"train_loss": -10.06515121459961, "global_step": 150972, "epoch": 898} {"train_loss": -9.715333938598633, "global_step": 150973, "epoch": 898} {"train_loss": -9.42707633972168, "global_step": 150974, "epoch": 898} {"train_loss": -9.268659591674805, "global_step": 150975, "epoch": 898} {"train_loss": -10.088080406188965, "global_step": 150976, "epoch": 898} {"train_loss": -9.869115829467773, "global_step": 150977, "epoch": 898} {"train_loss": -10.315988540649414, "global_step": 150978, "epoch": 898} {"train_loss": -10.333314895629883, "global_step": 150979, "epoch": 898} {"train_loss": -9.793947219848633, "global_step": 150980, "epoch": 898} {"train_loss": -9.874313354492188, "global_step": 150981, "epoch": 898} {"train_loss": -9.857890129089355, "global_step": 150982, "epoch": 898} {"train_loss": -10.244354248046875, "global_step": 150983, "epoch": 898} {"train_loss": -10.106561660766602, "global_step": 150984, "epoch": 898} {"train_loss": -10.172281265258789, "global_step": 150985, "epoch": 898} {"train_loss": -10.226339340209961, "global_step": 150986, "epoch": 898} {"train_loss": -9.807415008544922, "global_step": 150987, "epoch": 898} {"train_loss": -10.382436752319336, "global_step": 150988, "epoch": 898} {"train_loss": -10.430889129638672, "global_step": 150989, "epoch": 898} {"train_loss": -10.402030944824219, "global_step": 150990, "epoch": 898} {"train_loss": -10.4934663772583, "global_step": 150991, "epoch": 898} {"train_loss": -10.185436248779297, "global_step": 150992, "epoch": 898} {"train_loss": -10.322354316711426, "global_step": 150993, "epoch": 898} {"train_loss": -9.976465225219727, "global_step": 150994, "epoch": 898} {"train_loss": -10.66750717163086, "global_step": 150995, "epoch": 898} {"train_loss": -9.91585922241211, "global_step": 150996, "epoch": 898} {"train_loss": -10.287983894348145, "global_step": 150997, "epoch": 898} {"train_loss": -10.764457702636719, "global_step": 150998, "epoch": 898} {"train_loss": -10.098101615905762, "global_step": 150999, "epoch": 898} {"train_loss": -10.310310363769531, "global_step": 151000, "epoch": 898} {"train_loss": -10.538127899169922, "global_step": 151001, "epoch": 898} {"train_loss": -10.316502571105957, "global_step": 151002, "epoch": 898} {"train_loss": -10.043675422668457, "global_step": 151003, "epoch": 898} {"train_loss": -10.803750038146973, "global_step": 151004, "epoch": 898} {"train_loss": -10.426528930664062, "global_step": 151005, "epoch": 898} {"train_loss": -10.138540267944336, "global_step": 151006, "epoch": 898} {"train_loss": -10.70596694946289, "global_step": 151007, "epoch": 898} {"train_loss": -10.489736557006836, "global_step": 151008, "epoch": 898} {"train_loss": -10.411216735839844, "global_step": 151009, "epoch": 898} {"train_loss": -10.383880615234375, "global_step": 151010, "epoch": 898} {"train_loss": -10.592796325683594, "global_step": 151011, "epoch": 898} {"train_loss": -10.430038452148438, "global_step": 151012, "epoch": 898} {"train_loss": -10.434591293334961, "global_step": 151013, "epoch": 898} {"train_loss": -10.775938034057617, "global_step": 151014, "epoch": 898} {"train_loss": -10.66499137878418, "global_step": 151015, "epoch": 898} {"train_loss": -10.712989807128906, "global_step": 151016, "epoch": 898} {"train_loss": -10.70599365234375, "global_step": 151017, "epoch": 898} {"train_loss": -10.551980972290039, "global_step": 151018, "epoch": 898} {"train_loss": -10.610860824584961, "global_step": 151019, "epoch": 898} {"train_loss": -10.749395370483398, "global_step": 151020, "epoch": 898} {"train_loss": -10.608606338500977, "global_step": 151021, "epoch": 898} {"train_loss": -10.909196853637695, "global_step": 151022, "epoch": 898} {"train_loss": -10.844411849975586, "global_step": 151023, "epoch": 898} {"train_loss": -10.803576469421387, "global_step": 151024, "epoch": 898} {"train_loss": -10.831947326660156, "global_step": 151025, "epoch": 898} {"train_loss": -10.849245071411133, "global_step": 151026, "epoch": 898} {"train_loss": -10.830001831054688, "global_step": 151027, "epoch": 898} {"train_loss": -10.81360149383545, "global_step": 151028, "epoch": 898} {"train_loss": -10.926200866699219, "global_step": 151029, "epoch": 898} {"train_loss": -10.756355285644531, "global_step": 151030, "epoch": 898} {"train_loss": -10.449865988322667, "global_step": 151031, "epoch": 898, "val_loss": 227949.765625} {"train_loss": -10.625249862670898, "global_step": 151032, "epoch": 899} {"train_loss": -10.882097244262695, "global_step": 151033, "epoch": 899} {"train_loss": -10.814458847045898, "global_step": 151034, "epoch": 899} {"train_loss": -10.903703689575195, "global_step": 151035, "epoch": 899} {"train_loss": -10.976521492004395, "global_step": 151036, "epoch": 899} {"train_loss": -10.759499549865723, "global_step": 151037, "epoch": 899} {"train_loss": -10.695280075073242, "global_step": 151038, "epoch": 899} {"train_loss": -10.88214111328125, "global_step": 151039, "epoch": 899} {"train_loss": -10.820075988769531, "global_step": 151040, "epoch": 899} {"train_loss": -10.801066398620605, "global_step": 151041, "epoch": 899} {"train_loss": -10.937095642089844, "global_step": 151042, "epoch": 899} {"train_loss": -10.584029197692871, "global_step": 151043, "epoch": 899} {"train_loss": -10.810463905334473, "global_step": 151044, "epoch": 899} {"train_loss": -10.585371017456055, "global_step": 151045, "epoch": 899} {"train_loss": -10.452962875366211, "global_step": 151046, "epoch": 899} {"train_loss": -10.922882080078125, "global_step": 151047, "epoch": 899} {"train_loss": -10.604997634887695, "global_step": 151048, "epoch": 899} {"train_loss": -10.811717987060547, "global_step": 151049, "epoch": 899} {"train_loss": -10.953569412231445, "global_step": 151050, "epoch": 899} {"train_loss": -10.647109985351562, "global_step": 151051, "epoch": 899} {"train_loss": -10.74549674987793, "global_step": 151052, "epoch": 899} {"train_loss": -10.840553283691406, "global_step": 151053, "epoch": 899} {"train_loss": -10.791853904724121, "global_step": 151054, "epoch": 899} {"train_loss": -10.880867004394531, "global_step": 151055, "epoch": 899} {"train_loss": -10.6727876663208, "global_step": 151056, "epoch": 899} {"train_loss": -10.968893051147461, "global_step": 151057, "epoch": 899} {"train_loss": -10.839893341064453, "global_step": 151058, "epoch": 899} {"train_loss": -10.443662643432617, "global_step": 151059, "epoch": 899} {"train_loss": -10.903620719909668, "global_step": 151060, "epoch": 899} {"train_loss": -10.546499252319336, "global_step": 151061, "epoch": 899} {"train_loss": -10.49226188659668, "global_step": 151062, "epoch": 899} {"train_loss": -10.477980613708496, "global_step": 151063, "epoch": 899} {"train_loss": -10.678443908691406, "global_step": 151064, "epoch": 899} {"train_loss": -10.853493690490723, "global_step": 151065, "epoch": 899} {"train_loss": -10.865900039672852, "global_step": 151066, "epoch": 899} {"train_loss": -10.787883758544922, "global_step": 151067, "epoch": 899} {"train_loss": -10.992239952087402, "global_step": 151068, "epoch": 899} {"train_loss": -10.760313034057617, "global_step": 151069, "epoch": 899} {"train_loss": -10.851987838745117, "global_step": 151070, "epoch": 899} {"train_loss": -10.97541618347168, "global_step": 151071, "epoch": 899} {"train_loss": -10.85191535949707, "global_step": 151072, "epoch": 899} {"train_loss": -10.5643310546875, "global_step": 151073, "epoch": 899} {"train_loss": -10.66438102722168, "global_step": 151074, "epoch": 899} {"train_loss": -10.664665222167969, "global_step": 151075, "epoch": 899} {"train_loss": -10.414674758911133, "global_step": 151076, "epoch": 899} {"train_loss": -10.86618423461914, "global_step": 151077, "epoch": 899} {"train_loss": -10.539438247680664, "global_step": 151078, "epoch": 899} {"train_loss": -10.896787643432617, "global_step": 151079, "epoch": 899} {"train_loss": -10.577125549316406, "global_step": 151080, "epoch": 899} {"train_loss": -10.71509838104248, "global_step": 151081, "epoch": 899} {"train_loss": -11.047691345214844, "global_step": 151082, "epoch": 899} {"train_loss": -10.756905555725098, "global_step": 151083, "epoch": 899} {"train_loss": -10.651676177978516, "global_step": 151084, "epoch": 899} {"train_loss": -10.822484970092773, "global_step": 151085, "epoch": 899} {"train_loss": -10.739912033081055, "global_step": 151086, "epoch": 899} {"train_loss": -10.841633796691895, "global_step": 151087, "epoch": 899} {"train_loss": -10.826921463012695, "global_step": 151088, "epoch": 899} {"train_loss": -10.800979614257812, "global_step": 151089, "epoch": 899} {"train_loss": -10.88257122039795, "global_step": 151090, "epoch": 899} {"train_loss": -10.737394332885742, "global_step": 151091, "epoch": 899} {"train_loss": -10.38532543182373, "global_step": 151092, "epoch": 899} {"train_loss": -10.645037651062012, "global_step": 151093, "epoch": 899} {"train_loss": -10.753707885742188, "global_step": 151094, "epoch": 899} {"train_loss": -10.799022674560547, "global_step": 151095, "epoch": 899} {"train_loss": -10.742575645446777, "global_step": 151096, "epoch": 899} {"train_loss": -10.659982681274414, "global_step": 151097, "epoch": 899} {"train_loss": -10.821386337280273, "global_step": 151098, "epoch": 899} {"train_loss": -10.796289443969727, "global_step": 151099, "epoch": 899} {"train_loss": -10.740821838378906, "global_step": 151100, "epoch": 899} {"train_loss": -10.755159378051758, "global_step": 151101, "epoch": 899} {"train_loss": -10.930549621582031, "global_step": 151102, "epoch": 899} {"train_loss": -10.726229667663574, "global_step": 151103, "epoch": 899} {"train_loss": -10.120497703552246, "global_step": 151104, "epoch": 899} {"train_loss": -10.458471298217773, "global_step": 151105, "epoch": 899} {"train_loss": -11.0084228515625, "global_step": 151106, "epoch": 899} {"train_loss": -10.644964218139648, "global_step": 151107, "epoch": 899} {"train_loss": -10.787046432495117, "global_step": 151108, "epoch": 899} {"train_loss": -10.889348983764648, "global_step": 151109, "epoch": 899} {"train_loss": -10.708454132080078, "global_step": 151110, "epoch": 899} {"train_loss": -10.641002655029297, "global_step": 151111, "epoch": 899} {"train_loss": -11.010171890258789, "global_step": 151112, "epoch": 899} {"train_loss": -10.604035377502441, "global_step": 151113, "epoch": 899} {"train_loss": -10.462228775024414, "global_step": 151114, "epoch": 899} {"train_loss": -10.58733081817627, "global_step": 151115, "epoch": 899} {"train_loss": -10.697848320007324, "global_step": 151116, "epoch": 899} {"train_loss": -10.805205345153809, "global_step": 151117, "epoch": 899} {"train_loss": -10.497365951538086, "global_step": 151118, "epoch": 899} {"train_loss": -11.19322395324707, "global_step": 151119, "epoch": 899} {"train_loss": -10.74209213256836, "global_step": 151120, "epoch": 899} {"train_loss": -10.82729721069336, "global_step": 151121, "epoch": 899} {"train_loss": -10.819671630859375, "global_step": 151122, "epoch": 899} {"train_loss": -10.70660400390625, "global_step": 151123, "epoch": 899} {"train_loss": -10.597837448120117, "global_step": 151124, "epoch": 899} {"train_loss": -10.79749870300293, "global_step": 151125, "epoch": 899} {"train_loss": -10.704130172729492, "global_step": 151126, "epoch": 899} {"train_loss": -10.92030143737793, "global_step": 151127, "epoch": 899} {"train_loss": -10.73364543914795, "global_step": 151128, "epoch": 899} {"train_loss": -10.534978866577148, "global_step": 151129, "epoch": 899} {"train_loss": -10.319355010986328, "global_step": 151130, "epoch": 899} {"train_loss": -10.853788375854492, "global_step": 151131, "epoch": 899} {"train_loss": -10.43536376953125, "global_step": 151132, "epoch": 899} {"train_loss": -10.419905662536621, "global_step": 151133, "epoch": 899} {"train_loss": -10.688922882080078, "global_step": 151134, "epoch": 899} {"train_loss": -10.444547653198242, "global_step": 151135, "epoch": 899} {"train_loss": -10.705450057983398, "global_step": 151136, "epoch": 899} {"train_loss": -10.968917846679688, "global_step": 151137, "epoch": 899} {"train_loss": -10.50407886505127, "global_step": 151138, "epoch": 899} {"train_loss": -11.016889572143555, "global_step": 151139, "epoch": 899} {"train_loss": -10.85300064086914, "global_step": 151140, "epoch": 899} {"train_loss": -10.487987518310547, "global_step": 151141, "epoch": 899} {"train_loss": -10.888277053833008, "global_step": 151142, "epoch": 899} {"train_loss": -10.731441497802734, "global_step": 151143, "epoch": 899} {"train_loss": -10.804132461547852, "global_step": 151144, "epoch": 899} {"train_loss": -11.03318977355957, "global_step": 151145, "epoch": 899} {"train_loss": -10.848628044128418, "global_step": 151146, "epoch": 899} {"train_loss": -10.925945281982422, "global_step": 151147, "epoch": 899} {"train_loss": -10.70264720916748, "global_step": 151148, "epoch": 899} {"train_loss": -10.827726364135742, "global_step": 151149, "epoch": 899} {"train_loss": -10.788406372070312, "global_step": 151150, "epoch": 899} {"train_loss": -10.863986015319824, "global_step": 151151, "epoch": 899} {"train_loss": -10.812676429748535, "global_step": 151152, "epoch": 899} {"train_loss": -10.86751937866211, "global_step": 151153, "epoch": 899} {"train_loss": -10.536218643188477, "global_step": 151154, "epoch": 899} {"train_loss": -11.055018424987793, "global_step": 151155, "epoch": 899} {"train_loss": -10.489690780639648, "global_step": 151156, "epoch": 899} {"train_loss": -10.96438980102539, "global_step": 151157, "epoch": 899} {"train_loss": -10.696501731872559, "global_step": 151158, "epoch": 899} {"train_loss": -10.803524017333984, "global_step": 151159, "epoch": 899} {"train_loss": -10.845277786254883, "global_step": 151160, "epoch": 899} {"train_loss": -10.669479370117188, "global_step": 151161, "epoch": 899} {"train_loss": -11.050511360168457, "global_step": 151162, "epoch": 899} {"train_loss": -10.438484191894531, "global_step": 151163, "epoch": 899} {"train_loss": -10.79586410522461, "global_step": 151164, "epoch": 899} {"train_loss": -10.789535522460938, "global_step": 151165, "epoch": 899} {"train_loss": -10.659224510192871, "global_step": 151166, "epoch": 899} {"train_loss": -11.094179153442383, "global_step": 151167, "epoch": 899} {"train_loss": -10.857085227966309, "global_step": 151168, "epoch": 899} {"train_loss": -10.80462646484375, "global_step": 151169, "epoch": 899} {"train_loss": -11.039093017578125, "global_step": 151170, "epoch": 899} {"train_loss": -10.616691589355469, "global_step": 151171, "epoch": 899} {"train_loss": -11.09422492980957, "global_step": 151172, "epoch": 899} {"train_loss": -10.651268005371094, "global_step": 151173, "epoch": 899} {"train_loss": -10.725249290466309, "global_step": 151174, "epoch": 899} {"train_loss": -11.011899948120117, "global_step": 151175, "epoch": 899} {"train_loss": -10.619498252868652, "global_step": 151176, "epoch": 899} {"train_loss": -10.53518009185791, "global_step": 151177, "epoch": 899} {"train_loss": -10.611283302307129, "global_step": 151178, "epoch": 899} {"train_loss": -10.798762321472168, "global_step": 151179, "epoch": 899} {"train_loss": -10.54348373413086, "global_step": 151180, "epoch": 899} {"train_loss": -10.920005798339844, "global_step": 151181, "epoch": 899} {"train_loss": -10.84644603729248, "global_step": 151182, "epoch": 899} {"train_loss": -10.78390121459961, "global_step": 151183, "epoch": 899} {"train_loss": -10.669692993164062, "global_step": 151184, "epoch": 899} {"train_loss": -11.087747573852539, "global_step": 151185, "epoch": 899} {"train_loss": -10.740362167358398, "global_step": 151186, "epoch": 899} {"train_loss": -10.74386215209961, "global_step": 151187, "epoch": 899} {"train_loss": -10.62741756439209, "global_step": 151188, "epoch": 899} {"train_loss": -10.65824031829834, "global_step": 151189, "epoch": 899} {"train_loss": -10.331255912780762, "global_step": 151190, "epoch": 899} {"train_loss": -10.598289489746094, "global_step": 151191, "epoch": 899} {"train_loss": -10.665553092956543, "global_step": 151192, "epoch": 899} {"train_loss": -10.346532821655273, "global_step": 151193, "epoch": 899} {"train_loss": -10.64111042022705, "global_step": 151194, "epoch": 899} {"train_loss": -10.766148567199707, "global_step": 151195, "epoch": 899} {"train_loss": -10.793721199035645, "global_step": 151196, "epoch": 899} {"train_loss": -10.873979568481445, "global_step": 151197, "epoch": 899} {"train_loss": -10.639327049255371, "global_step": 151198, "epoch": 899} {"train_loss": -10.744470130829583, "global_step": 151199, "epoch": 899, "val_loss": 229950.59375} {"train_loss": -10.592564582824707, "global_step": 151200, "epoch": 900} {"train_loss": -10.77224349975586, "global_step": 151201, "epoch": 900} {"train_loss": -10.6976318359375, "global_step": 151202, "epoch": 900} {"train_loss": -10.83671760559082, "global_step": 151203, "epoch": 900} {"train_loss": -10.956976890563965, "global_step": 151204, "epoch": 900} {"train_loss": -11.009286880493164, "global_step": 151205, "epoch": 900} {"train_loss": -10.913052558898926, "global_step": 151206, "epoch": 900} {"train_loss": -10.684713363647461, "global_step": 151207, "epoch": 900} {"train_loss": -10.907573699951172, "global_step": 151208, "epoch": 900} {"train_loss": -10.956239700317383, "global_step": 151209, "epoch": 900} {"train_loss": -10.83091926574707, "global_step": 151210, "epoch": 900} {"train_loss": -11.108602523803711, "global_step": 151211, "epoch": 900} {"train_loss": -10.785541534423828, "global_step": 151212, "epoch": 900} {"train_loss": -10.7833251953125, "global_step": 151213, "epoch": 900} {"train_loss": -10.974774360656738, "global_step": 151214, "epoch": 900} {"train_loss": -10.604249000549316, "global_step": 151215, "epoch": 900} {"train_loss": -10.93864917755127, "global_step": 151216, "epoch": 900} {"train_loss": -10.85859489440918, "global_step": 151217, "epoch": 900} {"train_loss": -10.83720874786377, "global_step": 151218, "epoch": 900} {"train_loss": -10.811036109924316, "global_step": 151219, "epoch": 900} {"train_loss": -10.204416275024414, "global_step": 151220, "epoch": 900} {"train_loss": -10.541332244873047, "global_step": 151221, "epoch": 900} {"train_loss": -10.58268928527832, "global_step": 151222, "epoch": 900} {"train_loss": -10.43542766571045, "global_step": 151223, "epoch": 900} {"train_loss": -10.759363174438477, "global_step": 151224, "epoch": 900} {"train_loss": -10.374336242675781, "global_step": 151225, "epoch": 900} {"train_loss": -10.889202117919922, "global_step": 151226, "epoch": 900} {"train_loss": -10.730815887451172, "global_step": 151227, "epoch": 900} {"train_loss": -10.736546516418457, "global_step": 151228, "epoch": 900} {"train_loss": -10.472443580627441, "global_step": 151229, "epoch": 900} {"train_loss": -10.764688491821289, "global_step": 151230, "epoch": 900} {"train_loss": -10.702821731567383, "global_step": 151231, "epoch": 900} {"train_loss": -10.982508659362793, "global_step": 151232, "epoch": 900} {"train_loss": -10.963912963867188, "global_step": 151233, "epoch": 900} {"train_loss": -10.799546241760254, "global_step": 151234, "epoch": 900} {"train_loss": -10.650118827819824, "global_step": 151235, "epoch": 900} {"train_loss": -10.706178665161133, "global_step": 151236, "epoch": 900} {"train_loss": -10.529916763305664, "global_step": 151237, "epoch": 900} {"train_loss": -10.795430183410645, "global_step": 151238, "epoch": 900} {"train_loss": -10.73044204711914, "global_step": 151239, "epoch": 900} {"train_loss": -9.895057678222656, "global_step": 151240, "epoch": 900} {"train_loss": -9.97527027130127, "global_step": 151241, "epoch": 900} {"train_loss": -9.864518165588379, "global_step": 151242, "epoch": 900} {"train_loss": -10.069564819335938, "global_step": 151243, "epoch": 900} {"train_loss": -9.977372169494629, "global_step": 151244, "epoch": 900} {"train_loss": -10.625401496887207, "global_step": 151245, "epoch": 900} {"train_loss": -10.024515151977539, "global_step": 151246, "epoch": 900} {"train_loss": -9.941092491149902, "global_step": 151247, "epoch": 900} {"train_loss": -10.585763931274414, "global_step": 151248, "epoch": 900} {"train_loss": -9.861457824707031, "global_step": 151249, "epoch": 900} {"train_loss": -10.34820556640625, "global_step": 151250, "epoch": 900} {"train_loss": -10.462722778320312, "global_step": 151251, "epoch": 900} {"train_loss": -10.313587188720703, "global_step": 151252, "epoch": 900} {"train_loss": -10.310274124145508, "global_step": 151253, "epoch": 900} {"train_loss": -10.161499977111816, "global_step": 151254, "epoch": 900} {"train_loss": -9.44400405883789, "global_step": 151255, "epoch": 900} {"train_loss": -10.511619567871094, "global_step": 151256, "epoch": 900} {"train_loss": -9.453302383422852, "global_step": 151257, "epoch": 900} {"train_loss": -10.213232040405273, "global_step": 151258, "epoch": 900} {"train_loss": -10.633176803588867, "global_step": 151259, "epoch": 900} {"train_loss": -9.70591926574707, "global_step": 151260, "epoch": 900} {"train_loss": -10.101883888244629, "global_step": 151261, "epoch": 900} {"train_loss": -10.245210647583008, "global_step": 151262, "epoch": 900} {"train_loss": -10.19470500946045, "global_step": 151263, "epoch": 900} {"train_loss": -10.077385902404785, "global_step": 151264, "epoch": 900} {"train_loss": -10.484814643859863, "global_step": 151265, "epoch": 900} {"train_loss": -9.913431167602539, "global_step": 151266, "epoch": 900} {"train_loss": -10.491493225097656, "global_step": 151267, "epoch": 900} {"train_loss": -10.21053695678711, "global_step": 151268, "epoch": 900} {"train_loss": -10.397950172424316, "global_step": 151269, "epoch": 900} {"train_loss": -10.10062313079834, "global_step": 151270, "epoch": 900} {"train_loss": -10.230123519897461, "global_step": 151271, "epoch": 900} {"train_loss": -10.25307559967041, "global_step": 151272, "epoch": 900} {"train_loss": -10.401729583740234, "global_step": 151273, "epoch": 900} {"train_loss": -10.265338897705078, "global_step": 151274, "epoch": 900} {"train_loss": -10.585460662841797, "global_step": 151275, "epoch": 900} {"train_loss": -10.437821388244629, "global_step": 151276, "epoch": 900} {"train_loss": -10.53541088104248, "global_step": 151277, "epoch": 900} {"train_loss": -10.38386058807373, "global_step": 151278, "epoch": 900} {"train_loss": -10.616557121276855, "global_step": 151279, "epoch": 900} {"train_loss": -10.784741401672363, "global_step": 151280, "epoch": 900} {"train_loss": -10.500137329101562, "global_step": 151281, "epoch": 900} {"train_loss": -10.82991886138916, "global_step": 151282, "epoch": 900} {"train_loss": -10.442787170410156, "global_step": 151283, "epoch": 900} {"train_loss": -10.34279727935791, "global_step": 151284, "epoch": 900} {"train_loss": -10.74621295928955, "global_step": 151285, "epoch": 900} {"train_loss": -10.682327270507812, "global_step": 151286, "epoch": 900} {"train_loss": -10.607730865478516, "global_step": 151287, "epoch": 900} {"train_loss": -10.705087661743164, "global_step": 151288, "epoch": 900} {"train_loss": -10.60832691192627, "global_step": 151289, "epoch": 900} {"train_loss": -10.556768417358398, "global_step": 151290, "epoch": 900} {"train_loss": -10.75078296661377, "global_step": 151291, "epoch": 900} {"train_loss": -10.651529312133789, "global_step": 151292, "epoch": 900} {"train_loss": -10.879911422729492, "global_step": 151293, "epoch": 900} {"train_loss": -11.018291473388672, "global_step": 151294, "epoch": 900} {"train_loss": -10.654976844787598, "global_step": 151295, "epoch": 900} {"train_loss": -10.713201522827148, "global_step": 151296, "epoch": 900} {"train_loss": -10.965686798095703, "global_step": 151297, "epoch": 900} {"train_loss": -10.747884750366211, "global_step": 151298, "epoch": 900} {"train_loss": -10.876863479614258, "global_step": 151299, "epoch": 900} {"train_loss": -11.021259307861328, "global_step": 151300, "epoch": 900} {"train_loss": -11.158857345581055, "global_step": 151301, "epoch": 900} {"train_loss": -10.873828887939453, "global_step": 151302, "epoch": 900} {"train_loss": -11.018655776977539, "global_step": 151303, "epoch": 900} {"train_loss": -11.009361267089844, "global_step": 151304, "epoch": 900} {"train_loss": -10.94950008392334, "global_step": 151305, "epoch": 900} {"train_loss": -11.058279037475586, "global_step": 151306, "epoch": 900} {"train_loss": -10.92329216003418, "global_step": 151307, "epoch": 900} {"train_loss": -11.047369956970215, "global_step": 151308, "epoch": 900} {"train_loss": -11.056741714477539, "global_step": 151309, "epoch": 900} {"train_loss": -11.015148162841797, "global_step": 151310, "epoch": 900} {"train_loss": -11.187381744384766, "global_step": 151311, "epoch": 900} {"train_loss": -11.054582595825195, "global_step": 151312, "epoch": 900} {"train_loss": -11.06132698059082, "global_step": 151313, "epoch": 900} {"train_loss": -11.120781898498535, "global_step": 151314, "epoch": 900} {"train_loss": -10.419763565063477, "global_step": 151315, "epoch": 900} {"train_loss": -11.211090087890625, "global_step": 151316, "epoch": 900} {"train_loss": -10.048563003540039, "global_step": 151317, "epoch": 900} {"train_loss": -9.827166557312012, "global_step": 151318, "epoch": 900} {"train_loss": -10.740377426147461, "global_step": 151319, "epoch": 900} {"train_loss": -10.927572250366211, "global_step": 151320, "epoch": 900} {"train_loss": -10.26583480834961, "global_step": 151321, "epoch": 900} {"train_loss": -10.713217735290527, "global_step": 151322, "epoch": 900} {"train_loss": -10.414363861083984, "global_step": 151323, "epoch": 900} {"train_loss": -10.435413360595703, "global_step": 151324, "epoch": 900} {"train_loss": -10.59109115600586, "global_step": 151325, "epoch": 900} {"train_loss": -10.695840835571289, "global_step": 151326, "epoch": 900} {"train_loss": -10.504741668701172, "global_step": 151327, "epoch": 900} {"train_loss": -10.808223724365234, "global_step": 151328, "epoch": 900} {"train_loss": -10.748952865600586, "global_step": 151329, "epoch": 900} {"train_loss": -10.836297988891602, "global_step": 151330, "epoch": 900} {"train_loss": -10.58901596069336, "global_step": 151331, "epoch": 900} {"train_loss": -10.088041305541992, "global_step": 151332, "epoch": 900} {"train_loss": -10.609660148620605, "global_step": 151333, "epoch": 900} {"train_loss": -10.503606796264648, "global_step": 151334, "epoch": 900} {"train_loss": -9.942329406738281, "global_step": 151335, "epoch": 900} {"train_loss": -10.250617980957031, "global_step": 151336, "epoch": 900} {"train_loss": -10.109293937683105, "global_step": 151337, "epoch": 900} {"train_loss": -10.542242050170898, "global_step": 151338, "epoch": 900} {"train_loss": -10.14175033569336, "global_step": 151339, "epoch": 900} {"train_loss": -10.719306945800781, "global_step": 151340, "epoch": 900} {"train_loss": -10.664509773254395, "global_step": 151341, "epoch": 900} {"train_loss": -10.014217376708984, "global_step": 151342, "epoch": 900} {"train_loss": -10.87990951538086, "global_step": 151343, "epoch": 900} {"train_loss": -10.180561065673828, "global_step": 151344, "epoch": 900} {"train_loss": -10.689291954040527, "global_step": 151345, "epoch": 900} {"train_loss": -10.019973754882812, "global_step": 151346, "epoch": 900} {"train_loss": -9.8920316696167, "global_step": 151347, "epoch": 900} {"train_loss": -10.207110404968262, "global_step": 151348, "epoch": 900} {"train_loss": -9.749536514282227, "global_step": 151349, "epoch": 900} {"train_loss": -10.06654167175293, "global_step": 151350, "epoch": 900} {"train_loss": -9.901260375976562, "global_step": 151351, "epoch": 900} {"train_loss": -10.185493469238281, "global_step": 151352, "epoch": 900} {"train_loss": -10.070101737976074, "global_step": 151353, "epoch": 900} {"train_loss": -10.505009651184082, "global_step": 151354, "epoch": 900} {"train_loss": -10.093284606933594, "global_step": 151355, "epoch": 900} {"train_loss": -10.689535140991211, "global_step": 151356, "epoch": 900} {"train_loss": -10.375265121459961, "global_step": 151357, "epoch": 900} {"train_loss": -10.304786682128906, "global_step": 151358, "epoch": 900} {"train_loss": -10.595782279968262, "global_step": 151359, "epoch": 900} {"train_loss": -10.56406021118164, "global_step": 151360, "epoch": 900} {"train_loss": -10.405284881591797, "global_step": 151361, "epoch": 900} {"train_loss": -10.667146682739258, "global_step": 151362, "epoch": 900} {"train_loss": -10.435934066772461, "global_step": 151363, "epoch": 900} {"train_loss": -10.545698165893555, "global_step": 151364, "epoch": 900} {"train_loss": -10.70263385772705, "global_step": 151365, "epoch": 900} {"train_loss": -10.658382415771484, "global_step": 151366, "epoch": 900} {"train_loss": -10.536910584994725, "global_step": 151367, "epoch": 900, "train/sim_max_reward_0": 0.6978829053846353, "train/sim_max_reward_1": 0.9303559551576747, "train/sim_max_reward_2": 0.0025880710534002607, "train/sim_max_reward_3": 0.4092199025454383, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.6060603333048284, "test/sim_max_reward_4400000": 0.943501167506887, "test/sim_max_reward_4400001": 0.5013458291018055, "test/sim_max_reward_4400002": 0.3830926638333893, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.7030337671737539, "test/sim_max_reward_4400005": 0.545928495212781, "test/sim_max_reward_4400006": 0.9924927642684557, "test/sim_max_reward_4400007": 0.3746912251200851, "test/sim_max_reward_4400008": 0.5337540508807206, "test/sim_max_reward_4400009": 0.4258486185805211, "test/sim_max_reward_4400010": 0.9527371373017927, "test/sim_max_reward_4400011": 0.9052644999105354, "test/sim_max_reward_4400012": 0.9850508495370668, "test/sim_max_reward_4400013": 0.9673708216399567, "test/sim_max_reward_4400014": 0.9878866087648434, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9785948244860271, "test/sim_max_reward_4400019": 0.5571032947794742, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 0.6820714363372322, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.979825250150993, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.5278727449993836, "test/sim_max_reward_4400026": 0.05119924696960886, "test/sim_max_reward_4400027": 1.0, "test/sim_max_reward_4400028": 0.9826515763408721, "test/sim_max_reward_4400029": 0.5634451767379163, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.4137263033918443, "test/sim_max_reward_4400033": 0.1516031290595102, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.9818420151722205, "test/sim_max_reward_4400036": 0.3750095616137531, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.165221925589658, "test/sim_max_reward_4400042": 0.02371452493172055, "test/sim_max_reward_4400043": 0.0426097770686025, "test/sim_max_reward_4400044": 0.9944343223468822, "test/sim_max_reward_4400045": 0.4046816280804956, "test/sim_max_reward_4400046": 0.3199091863852579, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6076845279076628, "test/mean_score": 0.6099164214019138, "val_loss": 232077.53125, "train_action_mse_error": 1.142057180404663} {"train_loss": -10.741065979003906, "global_step": 151368, "epoch": 901} {"train_loss": -10.693650245666504, "global_step": 151369, "epoch": 901} {"train_loss": -10.677605628967285, "global_step": 151370, "epoch": 901} {"train_loss": -10.560310363769531, "global_step": 151371, "epoch": 901} {"train_loss": -10.737640380859375, "global_step": 151372, "epoch": 901} {"train_loss": -10.698820114135742, "global_step": 151373, "epoch": 901} {"train_loss": -10.802103996276855, "global_step": 151374, "epoch": 901} {"train_loss": -10.714279174804688, "global_step": 151375, "epoch": 901} {"train_loss": -10.833357810974121, "global_step": 151376, "epoch": 901} {"train_loss": -10.900419235229492, "global_step": 151377, "epoch": 901} {"train_loss": -10.853158950805664, "global_step": 151378, "epoch": 901} {"train_loss": -10.765604019165039, "global_step": 151379, "epoch": 901} {"train_loss": -10.890780448913574, "global_step": 151380, "epoch": 901} {"train_loss": -10.632577896118164, "global_step": 151381, "epoch": 901} {"train_loss": -10.995159149169922, "global_step": 151382, "epoch": 901} {"train_loss": -10.393515586853027, "global_step": 151383, "epoch": 901} {"train_loss": -10.837959289550781, "global_step": 151384, "epoch": 901} {"train_loss": -10.756986618041992, "global_step": 151385, "epoch": 901} {"train_loss": -10.88388729095459, "global_step": 151386, "epoch": 901} {"train_loss": -10.749626159667969, "global_step": 151387, "epoch": 901} {"train_loss": -10.64462661743164, "global_step": 151388, "epoch": 901} {"train_loss": -10.767321586608887, "global_step": 151389, "epoch": 901} {"train_loss": -10.977725982666016, "global_step": 151390, "epoch": 901} {"train_loss": -10.976431846618652, "global_step": 151391, "epoch": 901} {"train_loss": -10.834312438964844, "global_step": 151392, "epoch": 901} {"train_loss": -10.839049339294434, "global_step": 151393, "epoch": 901} {"train_loss": -10.947736740112305, "global_step": 151394, "epoch": 901} {"train_loss": -10.986891746520996, "global_step": 151395, "epoch": 901} {"train_loss": -11.110641479492188, "global_step": 151396, "epoch": 901} {"train_loss": -10.948123931884766, "global_step": 151397, "epoch": 901} {"train_loss": -11.033272743225098, "global_step": 151398, "epoch": 901} {"train_loss": -11.022661209106445, "global_step": 151399, "epoch": 901} {"train_loss": -11.216243743896484, "global_step": 151400, "epoch": 901} {"train_loss": -10.891018867492676, "global_step": 151401, "epoch": 901} {"train_loss": -10.814353942871094, "global_step": 151402, "epoch": 901} {"train_loss": -11.008451461791992, "global_step": 151403, "epoch": 901} {"train_loss": -10.961935043334961, "global_step": 151404, "epoch": 901} {"train_loss": -10.981128692626953, "global_step": 151405, "epoch": 901} {"train_loss": -11.044342994689941, "global_step": 151406, "epoch": 901} {"train_loss": -10.848182678222656, "global_step": 151407, "epoch": 901} {"train_loss": -11.176309585571289, "global_step": 151408, "epoch": 901} {"train_loss": -10.87166976928711, "global_step": 151409, "epoch": 901} {"train_loss": -10.932262420654297, "global_step": 151410, "epoch": 901} {"train_loss": -11.091405868530273, "global_step": 151411, "epoch": 901} {"train_loss": -10.700187683105469, "global_step": 151412, "epoch": 901} {"train_loss": -10.795343399047852, "global_step": 151413, "epoch": 901} {"train_loss": -11.031449317932129, "global_step": 151414, "epoch": 901} {"train_loss": -11.11320686340332, "global_step": 151415, "epoch": 901} {"train_loss": -10.685150146484375, "global_step": 151416, "epoch": 901} {"train_loss": -11.10361385345459, "global_step": 151417, "epoch": 901} {"train_loss": -10.747085571289062, "global_step": 151418, "epoch": 901} {"train_loss": -11.049798965454102, "global_step": 151419, "epoch": 901} {"train_loss": -10.913439750671387, "global_step": 151420, "epoch": 901} {"train_loss": -10.704718589782715, "global_step": 151421, "epoch": 901} {"train_loss": -11.059675216674805, "global_step": 151422, "epoch": 901} {"train_loss": -10.963104248046875, "global_step": 151423, "epoch": 901} {"train_loss": -10.718486785888672, "global_step": 151424, "epoch": 901} {"train_loss": -11.148491859436035, "global_step": 151425, "epoch": 901} {"train_loss": -10.367996215820312, "global_step": 151426, "epoch": 901} {"train_loss": -10.831761360168457, "global_step": 151427, "epoch": 901} {"train_loss": -10.639188766479492, "global_step": 151428, "epoch": 901} {"train_loss": -10.442212104797363, "global_step": 151429, "epoch": 901} {"train_loss": -10.462682723999023, "global_step": 151430, "epoch": 901} {"train_loss": -10.10168743133545, "global_step": 151431, "epoch": 901} {"train_loss": -10.300873756408691, "global_step": 151432, "epoch": 901} {"train_loss": -10.536125183105469, "global_step": 151433, "epoch": 901} {"train_loss": -10.449342727661133, "global_step": 151434, "epoch": 901} {"train_loss": -10.531865119934082, "global_step": 151435, "epoch": 901} {"train_loss": -10.809854507446289, "global_step": 151436, "epoch": 901} {"train_loss": -10.77053451538086, "global_step": 151437, "epoch": 901} {"train_loss": -10.391297340393066, "global_step": 151438, "epoch": 901} {"train_loss": -10.558022499084473, "global_step": 151439, "epoch": 901} {"train_loss": -10.88333797454834, "global_step": 151440, "epoch": 901} {"train_loss": -10.495367050170898, "global_step": 151441, "epoch": 901} {"train_loss": -10.51912784576416, "global_step": 151442, "epoch": 901} {"train_loss": -10.377432823181152, "global_step": 151443, "epoch": 901} {"train_loss": -10.145505905151367, "global_step": 151444, "epoch": 901} {"train_loss": -10.4284029006958, "global_step": 151445, "epoch": 901} {"train_loss": -9.84511947631836, "global_step": 151446, "epoch": 901} {"train_loss": -10.45626449584961, "global_step": 151447, "epoch": 901} {"train_loss": -10.546698570251465, "global_step": 151448, "epoch": 901} {"train_loss": -10.438257217407227, "global_step": 151449, "epoch": 901} {"train_loss": -10.159111976623535, "global_step": 151450, "epoch": 901} {"train_loss": -10.477621078491211, "global_step": 151451, "epoch": 901} {"train_loss": -10.345218658447266, "global_step": 151452, "epoch": 901} {"train_loss": -10.261483192443848, "global_step": 151453, "epoch": 901} {"train_loss": -10.198562622070312, "global_step": 151454, "epoch": 901} {"train_loss": -10.642644882202148, "global_step": 151455, "epoch": 901} {"train_loss": -9.670467376708984, "global_step": 151456, "epoch": 901} {"train_loss": -10.434392929077148, "global_step": 151457, "epoch": 901} {"train_loss": -10.127950668334961, "global_step": 151458, "epoch": 901} {"train_loss": -9.421442031860352, "global_step": 151459, "epoch": 901} {"train_loss": -10.829261779785156, "global_step": 151460, "epoch": 901} {"train_loss": -9.341493606567383, "global_step": 151461, "epoch": 901} {"train_loss": -10.226333618164062, "global_step": 151462, "epoch": 901} {"train_loss": -10.083776473999023, "global_step": 151463, "epoch": 901} {"train_loss": -9.550973892211914, "global_step": 151464, "epoch": 901} {"train_loss": -9.970609664916992, "global_step": 151465, "epoch": 901} {"train_loss": -10.622357368469238, "global_step": 151466, "epoch": 901} {"train_loss": -9.479757308959961, "global_step": 151467, "epoch": 901} {"train_loss": -10.138493537902832, "global_step": 151468, "epoch": 901} {"train_loss": -10.395011901855469, "global_step": 151469, "epoch": 901} {"train_loss": -9.859100341796875, "global_step": 151470, "epoch": 901} {"train_loss": -10.41018295288086, "global_step": 151471, "epoch": 901} {"train_loss": -9.812267303466797, "global_step": 151472, "epoch": 901} {"train_loss": -10.15305233001709, "global_step": 151473, "epoch": 901} {"train_loss": -10.228983879089355, "global_step": 151474, "epoch": 901} {"train_loss": -10.09719467163086, "global_step": 151475, "epoch": 901} {"train_loss": -10.578102111816406, "global_step": 151476, "epoch": 901} {"train_loss": -10.153627395629883, "global_step": 151477, "epoch": 901} {"train_loss": -10.6223783493042, "global_step": 151478, "epoch": 901} {"train_loss": -9.968746185302734, "global_step": 151479, "epoch": 901} {"train_loss": -10.574658393859863, "global_step": 151480, "epoch": 901} {"train_loss": -10.095331192016602, "global_step": 151481, "epoch": 901} {"train_loss": -10.392014503479004, "global_step": 151482, "epoch": 901} {"train_loss": -10.65774154663086, "global_step": 151483, "epoch": 901} {"train_loss": -10.442416191101074, "global_step": 151484, "epoch": 901} {"train_loss": -10.274328231811523, "global_step": 151485, "epoch": 901} {"train_loss": -10.727579116821289, "global_step": 151486, "epoch": 901} {"train_loss": -10.357662200927734, "global_step": 151487, "epoch": 901} {"train_loss": -10.636628150939941, "global_step": 151488, "epoch": 901} {"train_loss": -10.568387031555176, "global_step": 151489, "epoch": 901} {"train_loss": -10.718832015991211, "global_step": 151490, "epoch": 901} {"train_loss": -10.532745361328125, "global_step": 151491, "epoch": 901} {"train_loss": -10.64266586303711, "global_step": 151492, "epoch": 901} {"train_loss": -10.587833404541016, "global_step": 151493, "epoch": 901} {"train_loss": -10.783740997314453, "global_step": 151494, "epoch": 901} {"train_loss": -10.604249000549316, "global_step": 151495, "epoch": 901} {"train_loss": -10.792218208312988, "global_step": 151496, "epoch": 901} {"train_loss": -10.693408966064453, "global_step": 151497, "epoch": 901} {"train_loss": -10.850343704223633, "global_step": 151498, "epoch": 901} {"train_loss": -10.887392044067383, "global_step": 151499, "epoch": 901} {"train_loss": -10.692424774169922, "global_step": 151500, "epoch": 901} {"train_loss": -10.870386123657227, "global_step": 151501, "epoch": 901} {"train_loss": -10.894617080688477, "global_step": 151502, "epoch": 901} {"train_loss": -10.975072860717773, "global_step": 151503, "epoch": 901} {"train_loss": -10.826809883117676, "global_step": 151504, "epoch": 901} {"train_loss": -10.723116874694824, "global_step": 151505, "epoch": 901} {"train_loss": -11.038006782531738, "global_step": 151506, "epoch": 901} {"train_loss": -10.9429292678833, "global_step": 151507, "epoch": 901} {"train_loss": -11.039501190185547, "global_step": 151508, "epoch": 901} {"train_loss": -10.906473159790039, "global_step": 151509, "epoch": 901} {"train_loss": -10.926088333129883, "global_step": 151510, "epoch": 901} {"train_loss": -10.981249809265137, "global_step": 151511, "epoch": 901} {"train_loss": -10.984121322631836, "global_step": 151512, "epoch": 901} {"train_loss": -11.100579261779785, "global_step": 151513, "epoch": 901} {"train_loss": -10.91192626953125, "global_step": 151514, "epoch": 901} {"train_loss": -10.951422691345215, "global_step": 151515, "epoch": 901} {"train_loss": -10.784843444824219, "global_step": 151516, "epoch": 901} {"train_loss": -10.6827974319458, "global_step": 151517, "epoch": 901} {"train_loss": -10.88116455078125, "global_step": 151518, "epoch": 901} {"train_loss": -10.980310440063477, "global_step": 151519, "epoch": 901} {"train_loss": -10.919967651367188, "global_step": 151520, "epoch": 901} {"train_loss": -10.967386245727539, "global_step": 151521, "epoch": 901} {"train_loss": -11.049274444580078, "global_step": 151522, "epoch": 901} {"train_loss": -11.140714645385742, "global_step": 151523, "epoch": 901} {"train_loss": -11.068052291870117, "global_step": 151524, "epoch": 901} {"train_loss": -10.993385314941406, "global_step": 151525, "epoch": 901} {"train_loss": -10.74462890625, "global_step": 151526, "epoch": 901} {"train_loss": -11.25631046295166, "global_step": 151527, "epoch": 901} {"train_loss": -11.050960540771484, "global_step": 151528, "epoch": 901} {"train_loss": -11.161977767944336, "global_step": 151529, "epoch": 901} {"train_loss": -10.985193252563477, "global_step": 151530, "epoch": 901} {"train_loss": -11.105579376220703, "global_step": 151531, "epoch": 901} {"train_loss": -10.862432479858398, "global_step": 151532, "epoch": 901} {"train_loss": -10.701465606689453, "global_step": 151533, "epoch": 901} {"train_loss": -10.686692237854004, "global_step": 151534, "epoch": 901} {"train_loss": -10.664978753952752, "global_step": 151535, "epoch": 901, "val_loss": 229143.375} {"train_loss": -10.347381591796875, "global_step": 151536, "epoch": 902} {"train_loss": -10.154550552368164, "global_step": 151537, "epoch": 902} {"train_loss": -10.979193687438965, "global_step": 151538, "epoch": 902} {"train_loss": -10.20341682434082, "global_step": 151539, "epoch": 902} {"train_loss": -10.144350051879883, "global_step": 151540, "epoch": 902} {"train_loss": -10.756745338439941, "global_step": 151541, "epoch": 902} {"train_loss": -10.745365142822266, "global_step": 151542, "epoch": 902} {"train_loss": -10.74041748046875, "global_step": 151543, "epoch": 902} {"train_loss": -10.536757469177246, "global_step": 151544, "epoch": 902} {"train_loss": -10.726095199584961, "global_step": 151545, "epoch": 902} {"train_loss": -10.858343124389648, "global_step": 151546, "epoch": 902} {"train_loss": -10.507265090942383, "global_step": 151547, "epoch": 902} {"train_loss": -10.819698333740234, "global_step": 151548, "epoch": 902} {"train_loss": -11.019476890563965, "global_step": 151549, "epoch": 902} {"train_loss": -10.725818634033203, "global_step": 151550, "epoch": 902} {"train_loss": -10.735212326049805, "global_step": 151551, "epoch": 902} {"train_loss": -10.949234008789062, "global_step": 151552, "epoch": 902} {"train_loss": -10.715866088867188, "global_step": 151553, "epoch": 902} {"train_loss": -10.703943252563477, "global_step": 151554, "epoch": 902} {"train_loss": -10.11422348022461, "global_step": 151555, "epoch": 902} {"train_loss": -10.616127014160156, "global_step": 151556, "epoch": 902} {"train_loss": -10.598512649536133, "global_step": 151557, "epoch": 902} {"train_loss": -10.503824234008789, "global_step": 151558, "epoch": 902} {"train_loss": -10.673393249511719, "global_step": 151559, "epoch": 902} {"train_loss": -10.715353012084961, "global_step": 151560, "epoch": 902} {"train_loss": -10.65245532989502, "global_step": 151561, "epoch": 902} {"train_loss": -10.38821792602539, "global_step": 151562, "epoch": 902} {"train_loss": -10.696813583374023, "global_step": 151563, "epoch": 902} {"train_loss": -10.576011657714844, "global_step": 151564, "epoch": 902} {"train_loss": -10.709898948669434, "global_step": 151565, "epoch": 902} {"train_loss": -10.620702743530273, "global_step": 151566, "epoch": 902} {"train_loss": -10.376897811889648, "global_step": 151567, "epoch": 902} {"train_loss": -10.799921035766602, "global_step": 151568, "epoch": 902} {"train_loss": -10.279890060424805, "global_step": 151569, "epoch": 902} {"train_loss": -10.710290908813477, "global_step": 151570, "epoch": 902} {"train_loss": -10.334972381591797, "global_step": 151571, "epoch": 902} {"train_loss": -10.951375961303711, "global_step": 151572, "epoch": 902} {"train_loss": -10.218856811523438, "global_step": 151573, "epoch": 902} {"train_loss": -10.484752655029297, "global_step": 151574, "epoch": 902} {"train_loss": -10.853878021240234, "global_step": 151575, "epoch": 902} {"train_loss": -10.649372100830078, "global_step": 151576, "epoch": 902} {"train_loss": -10.70865249633789, "global_step": 151577, "epoch": 902} {"train_loss": -10.89509391784668, "global_step": 151578, "epoch": 902} {"train_loss": -10.531797409057617, "global_step": 151579, "epoch": 902} {"train_loss": -11.068313598632812, "global_step": 151580, "epoch": 902} {"train_loss": -10.72597885131836, "global_step": 151581, "epoch": 902} {"train_loss": -10.846744537353516, "global_step": 151582, "epoch": 902} {"train_loss": -10.842327117919922, "global_step": 151583, "epoch": 902} {"train_loss": -10.75657844543457, "global_step": 151584, "epoch": 902} {"train_loss": -10.73145866394043, "global_step": 151585, "epoch": 902} {"train_loss": -10.522785186767578, "global_step": 151586, "epoch": 902} {"train_loss": -10.710506439208984, "global_step": 151587, "epoch": 902} {"train_loss": -10.629715919494629, "global_step": 151588, "epoch": 902} {"train_loss": -10.74979019165039, "global_step": 151589, "epoch": 902} {"train_loss": -10.60647201538086, "global_step": 151590, "epoch": 902} {"train_loss": -10.947805404663086, "global_step": 151591, "epoch": 902} {"train_loss": -10.60923957824707, "global_step": 151592, "epoch": 902} {"train_loss": -10.736732482910156, "global_step": 151593, "epoch": 902} {"train_loss": -10.72884750366211, "global_step": 151594, "epoch": 902} {"train_loss": -10.633556365966797, "global_step": 151595, "epoch": 902} {"train_loss": -10.788803100585938, "global_step": 151596, "epoch": 902} {"train_loss": -10.682324409484863, "global_step": 151597, "epoch": 902} {"train_loss": -10.423528671264648, "global_step": 151598, "epoch": 902} {"train_loss": -10.580678939819336, "global_step": 151599, "epoch": 902} {"train_loss": -10.752450942993164, "global_step": 151600, "epoch": 902} {"train_loss": -10.731886863708496, "global_step": 151601, "epoch": 902} {"train_loss": -10.483282089233398, "global_step": 151602, "epoch": 902} {"train_loss": -10.47360897064209, "global_step": 151603, "epoch": 902} {"train_loss": -10.285056114196777, "global_step": 151604, "epoch": 902} {"train_loss": -10.343622207641602, "global_step": 151605, "epoch": 902} {"train_loss": -10.323324203491211, "global_step": 151606, "epoch": 902} {"train_loss": -10.126818656921387, "global_step": 151607, "epoch": 902} {"train_loss": -10.479339599609375, "global_step": 151608, "epoch": 902} {"train_loss": -10.35795783996582, "global_step": 151609, "epoch": 902} {"train_loss": -10.087178230285645, "global_step": 151610, "epoch": 902} {"train_loss": -10.442037582397461, "global_step": 151611, "epoch": 902} {"train_loss": -10.708148956298828, "global_step": 151612, "epoch": 902} {"train_loss": -10.483783721923828, "global_step": 151613, "epoch": 902} {"train_loss": -10.42115592956543, "global_step": 151614, "epoch": 902} {"train_loss": -10.497312545776367, "global_step": 151615, "epoch": 902} {"train_loss": -10.348551750183105, "global_step": 151616, "epoch": 902} {"train_loss": -10.8956937789917, "global_step": 151617, "epoch": 902} {"train_loss": -10.001087188720703, "global_step": 151618, "epoch": 902} {"train_loss": -10.150505065917969, "global_step": 151619, "epoch": 902} {"train_loss": -10.09211254119873, "global_step": 151620, "epoch": 902} {"train_loss": -10.302058219909668, "global_step": 151621, "epoch": 902} {"train_loss": -10.111940383911133, "global_step": 151622, "epoch": 902} {"train_loss": -9.954257011413574, "global_step": 151623, "epoch": 902} {"train_loss": -9.104150772094727, "global_step": 151624, "epoch": 902} {"train_loss": -10.081523895263672, "global_step": 151625, "epoch": 902} {"train_loss": -9.356407165527344, "global_step": 151626, "epoch": 902} {"train_loss": -10.401031494140625, "global_step": 151627, "epoch": 902} {"train_loss": -9.835746765136719, "global_step": 151628, "epoch": 902} {"train_loss": -10.063817977905273, "global_step": 151629, "epoch": 902} {"train_loss": -10.4303617477417, "global_step": 151630, "epoch": 902} {"train_loss": -9.910989761352539, "global_step": 151631, "epoch": 902} {"train_loss": -10.239021301269531, "global_step": 151632, "epoch": 902} {"train_loss": -10.457866668701172, "global_step": 151633, "epoch": 902} {"train_loss": -10.170978546142578, "global_step": 151634, "epoch": 902} {"train_loss": -10.577858924865723, "global_step": 151635, "epoch": 902} {"train_loss": -10.543859481811523, "global_step": 151636, "epoch": 902} {"train_loss": -10.4244384765625, "global_step": 151637, "epoch": 902} {"train_loss": -10.400247573852539, "global_step": 151638, "epoch": 902} {"train_loss": -10.470087051391602, "global_step": 151639, "epoch": 902} {"train_loss": -10.617053985595703, "global_step": 151640, "epoch": 902} {"train_loss": -10.248291015625, "global_step": 151641, "epoch": 902} {"train_loss": -10.681112289428711, "global_step": 151642, "epoch": 902} {"train_loss": -10.408055305480957, "global_step": 151643, "epoch": 902} {"train_loss": -10.597076416015625, "global_step": 151644, "epoch": 902} {"train_loss": -10.709700584411621, "global_step": 151645, "epoch": 902} {"train_loss": -10.731701850891113, "global_step": 151646, "epoch": 902} {"train_loss": -10.840277671813965, "global_step": 151647, "epoch": 902} {"train_loss": -10.49653434753418, "global_step": 151648, "epoch": 902} {"train_loss": -10.849466323852539, "global_step": 151649, "epoch": 902} {"train_loss": -10.48130989074707, "global_step": 151650, "epoch": 902} {"train_loss": -10.611983299255371, "global_step": 151651, "epoch": 902} {"train_loss": -10.453335762023926, "global_step": 151652, "epoch": 902} {"train_loss": -10.767298698425293, "global_step": 151653, "epoch": 902} {"train_loss": -10.731547355651855, "global_step": 151654, "epoch": 902} {"train_loss": -10.812324523925781, "global_step": 151655, "epoch": 902} {"train_loss": -10.664939880371094, "global_step": 151656, "epoch": 902} {"train_loss": -10.88302230834961, "global_step": 151657, "epoch": 902} {"train_loss": -10.637748718261719, "global_step": 151658, "epoch": 902} {"train_loss": -11.13730525970459, "global_step": 151659, "epoch": 902} {"train_loss": -10.522899627685547, "global_step": 151660, "epoch": 902} {"train_loss": -10.831417083740234, "global_step": 151661, "epoch": 902} {"train_loss": -10.39083194732666, "global_step": 151662, "epoch": 902} {"train_loss": -10.840522766113281, "global_step": 151663, "epoch": 902} {"train_loss": -10.536165237426758, "global_step": 151664, "epoch": 902} {"train_loss": -10.940153121948242, "global_step": 151665, "epoch": 902} {"train_loss": -10.867937088012695, "global_step": 151666, "epoch": 902} {"train_loss": -10.894340515136719, "global_step": 151667, "epoch": 902} {"train_loss": -10.948519706726074, "global_step": 151668, "epoch": 902} {"train_loss": -10.896642684936523, "global_step": 151669, "epoch": 902} {"train_loss": -11.029327392578125, "global_step": 151670, "epoch": 902} {"train_loss": -10.975210189819336, "global_step": 151671, "epoch": 902} {"train_loss": -10.676322937011719, "global_step": 151672, "epoch": 902} {"train_loss": -10.936203002929688, "global_step": 151673, "epoch": 902} {"train_loss": -10.855077743530273, "global_step": 151674, "epoch": 902} {"train_loss": -10.693621635437012, "global_step": 151675, "epoch": 902} {"train_loss": -11.194278717041016, "global_step": 151676, "epoch": 902} {"train_loss": -10.771883964538574, "global_step": 151677, "epoch": 902} {"train_loss": -11.111248016357422, "global_step": 151678, "epoch": 902} {"train_loss": -10.866779327392578, "global_step": 151679, "epoch": 902} {"train_loss": -10.98874282836914, "global_step": 151680, "epoch": 902} {"train_loss": -11.021584510803223, "global_step": 151681, "epoch": 902} {"train_loss": -10.971923828125, "global_step": 151682, "epoch": 902} {"train_loss": -11.263319969177246, "global_step": 151683, "epoch": 902} {"train_loss": -10.709975242614746, "global_step": 151684, "epoch": 902} {"train_loss": -10.9178466796875, "global_step": 151685, "epoch": 902} {"train_loss": -10.967575073242188, "global_step": 151686, "epoch": 902} {"train_loss": -10.768531799316406, "global_step": 151687, "epoch": 902} {"train_loss": -10.922243118286133, "global_step": 151688, "epoch": 902} {"train_loss": -10.650632858276367, "global_step": 151689, "epoch": 902} {"train_loss": -9.66571044921875, "global_step": 151690, "epoch": 902} {"train_loss": -10.762861251831055, "global_step": 151691, "epoch": 902} {"train_loss": -10.84648323059082, "global_step": 151692, "epoch": 902} {"train_loss": -10.401386260986328, "global_step": 151693, "epoch": 902} {"train_loss": -10.965402603149414, "global_step": 151694, "epoch": 902} {"train_loss": -10.690202713012695, "global_step": 151695, "epoch": 902} {"train_loss": -10.646263122558594, "global_step": 151696, "epoch": 902} {"train_loss": -10.687237739562988, "global_step": 151697, "epoch": 902} {"train_loss": -10.792901039123535, "global_step": 151698, "epoch": 902} {"train_loss": -10.303120613098145, "global_step": 151699, "epoch": 902} {"train_loss": -10.633888244628906, "global_step": 151700, "epoch": 902} {"train_loss": -10.612846374511719, "global_step": 151701, "epoch": 902} {"train_loss": -10.479503631591797, "global_step": 151702, "epoch": 902} {"train_loss": -10.595946817171006, "global_step": 151703, "epoch": 902, "val_loss": 229869.84375} {"train_loss": -10.677982330322266, "global_step": 151704, "epoch": 903} {"train_loss": -10.714055061340332, "global_step": 151705, "epoch": 903} {"train_loss": -10.598979949951172, "global_step": 151706, "epoch": 903} {"train_loss": -10.540475845336914, "global_step": 151707, "epoch": 903} {"train_loss": -10.520828247070312, "global_step": 151708, "epoch": 903} {"train_loss": -10.827594757080078, "global_step": 151709, "epoch": 903} {"train_loss": -10.660591125488281, "global_step": 151710, "epoch": 903} {"train_loss": -10.437840461730957, "global_step": 151711, "epoch": 903} {"train_loss": -10.880866050720215, "global_step": 151712, "epoch": 903} {"train_loss": -10.497405052185059, "global_step": 151713, "epoch": 903} {"train_loss": -10.879678726196289, "global_step": 151714, "epoch": 903} {"train_loss": -10.479053497314453, "global_step": 151715, "epoch": 903} {"train_loss": -10.710086822509766, "global_step": 151716, "epoch": 903} {"train_loss": -10.774103164672852, "global_step": 151717, "epoch": 903} {"train_loss": -10.57547378540039, "global_step": 151718, "epoch": 903} {"train_loss": -10.564148902893066, "global_step": 151719, "epoch": 903} {"train_loss": -10.719696044921875, "global_step": 151720, "epoch": 903} {"train_loss": -10.61288070678711, "global_step": 151721, "epoch": 903} {"train_loss": -10.75993537902832, "global_step": 151722, "epoch": 903} {"train_loss": -10.963188171386719, "global_step": 151723, "epoch": 903} {"train_loss": -10.831216812133789, "global_step": 151724, "epoch": 903} {"train_loss": -10.75808334350586, "global_step": 151725, "epoch": 903} {"train_loss": -10.773046493530273, "global_step": 151726, "epoch": 903} {"train_loss": -10.624608993530273, "global_step": 151727, "epoch": 903} {"train_loss": -10.682421684265137, "global_step": 151728, "epoch": 903} {"train_loss": -10.695775032043457, "global_step": 151729, "epoch": 903} {"train_loss": -10.847597122192383, "global_step": 151730, "epoch": 903} {"train_loss": -10.519987106323242, "global_step": 151731, "epoch": 903} {"train_loss": -10.761970520019531, "global_step": 151732, "epoch": 903} {"train_loss": -10.737726211547852, "global_step": 151733, "epoch": 903} {"train_loss": -10.597553253173828, "global_step": 151734, "epoch": 903} {"train_loss": -10.954912185668945, "global_step": 151735, "epoch": 903} {"train_loss": -10.471185684204102, "global_step": 151736, "epoch": 903} {"train_loss": -10.777021408081055, "global_step": 151737, "epoch": 903} {"train_loss": -10.669601440429688, "global_step": 151738, "epoch": 903} {"train_loss": -10.698745727539062, "global_step": 151739, "epoch": 903} {"train_loss": -10.666682243347168, "global_step": 151740, "epoch": 903} {"train_loss": -10.591193199157715, "global_step": 151741, "epoch": 903} {"train_loss": -10.906574249267578, "global_step": 151742, "epoch": 903} {"train_loss": -10.709776878356934, "global_step": 151743, "epoch": 903} {"train_loss": -10.954191207885742, "global_step": 151744, "epoch": 903} {"train_loss": -10.771778106689453, "global_step": 151745, "epoch": 903} {"train_loss": -10.722911834716797, "global_step": 151746, "epoch": 903} {"train_loss": -11.120620727539062, "global_step": 151747, "epoch": 903} {"train_loss": -10.579660415649414, "global_step": 151748, "epoch": 903} {"train_loss": -11.100568771362305, "global_step": 151749, "epoch": 903} {"train_loss": -10.7069673538208, "global_step": 151750, "epoch": 903} {"train_loss": -10.98236083984375, "global_step": 151751, "epoch": 903} {"train_loss": -10.688837051391602, "global_step": 151752, "epoch": 903} {"train_loss": -10.736631393432617, "global_step": 151753, "epoch": 903} {"train_loss": -10.75537395477295, "global_step": 151754, "epoch": 903} {"train_loss": -10.414949417114258, "global_step": 151755, "epoch": 903} {"train_loss": -11.012611389160156, "global_step": 151756, "epoch": 903} {"train_loss": -10.599589347839355, "global_step": 151757, "epoch": 903} {"train_loss": -10.446695327758789, "global_step": 151758, "epoch": 903} {"train_loss": -10.783373832702637, "global_step": 151759, "epoch": 903} {"train_loss": -10.281136512756348, "global_step": 151760, "epoch": 903} {"train_loss": -10.846403121948242, "global_step": 151761, "epoch": 903} {"train_loss": -10.545001983642578, "global_step": 151762, "epoch": 903} {"train_loss": -10.333984375, "global_step": 151763, "epoch": 903} {"train_loss": -10.832011222839355, "global_step": 151764, "epoch": 903} {"train_loss": -10.233551979064941, "global_step": 151765, "epoch": 903} {"train_loss": -10.781773567199707, "global_step": 151766, "epoch": 903} {"train_loss": -9.74950885772705, "global_step": 151767, "epoch": 903} {"train_loss": -10.838590621948242, "global_step": 151768, "epoch": 903} {"train_loss": -10.592527389526367, "global_step": 151769, "epoch": 903} {"train_loss": -10.689558029174805, "global_step": 151770, "epoch": 903} {"train_loss": -10.64184856414795, "global_step": 151771, "epoch": 903} {"train_loss": -10.49191951751709, "global_step": 151772, "epoch": 903} {"train_loss": -10.876604080200195, "global_step": 151773, "epoch": 903} {"train_loss": -10.686275482177734, "global_step": 151774, "epoch": 903} {"train_loss": -10.767675399780273, "global_step": 151775, "epoch": 903} {"train_loss": -10.782880783081055, "global_step": 151776, "epoch": 903} {"train_loss": -10.890810012817383, "global_step": 151777, "epoch": 903} {"train_loss": -10.705114364624023, "global_step": 151778, "epoch": 903} {"train_loss": -10.853553771972656, "global_step": 151779, "epoch": 903} {"train_loss": -10.829267501831055, "global_step": 151780, "epoch": 903} {"train_loss": -10.91303825378418, "global_step": 151781, "epoch": 903} {"train_loss": -10.875812530517578, "global_step": 151782, "epoch": 903} {"train_loss": -10.779781341552734, "global_step": 151783, "epoch": 903} {"train_loss": -11.078012466430664, "global_step": 151784, "epoch": 903} {"train_loss": -10.772600173950195, "global_step": 151785, "epoch": 903} {"train_loss": -10.922450065612793, "global_step": 151786, "epoch": 903} {"train_loss": -10.943687438964844, "global_step": 151787, "epoch": 903} {"train_loss": -10.976303100585938, "global_step": 151788, "epoch": 903} {"train_loss": -10.8735933303833, "global_step": 151789, "epoch": 903} {"train_loss": -10.649333953857422, "global_step": 151790, "epoch": 903} {"train_loss": -10.493768692016602, "global_step": 151791, "epoch": 903} {"train_loss": -10.814403533935547, "global_step": 151792, "epoch": 903} {"train_loss": -10.803871154785156, "global_step": 151793, "epoch": 903} {"train_loss": -10.806058883666992, "global_step": 151794, "epoch": 903} {"train_loss": -10.745529174804688, "global_step": 151795, "epoch": 903} {"train_loss": -10.836515426635742, "global_step": 151796, "epoch": 903} {"train_loss": -10.692173957824707, "global_step": 151797, "epoch": 903} {"train_loss": -10.773369789123535, "global_step": 151798, "epoch": 903} {"train_loss": -10.91006088256836, "global_step": 151799, "epoch": 903} {"train_loss": -11.029912948608398, "global_step": 151800, "epoch": 903} {"train_loss": -10.825963973999023, "global_step": 151801, "epoch": 903} {"train_loss": -11.064249038696289, "global_step": 151802, "epoch": 903} {"train_loss": -11.055378913879395, "global_step": 151803, "epoch": 903} {"train_loss": -11.039520263671875, "global_step": 151804, "epoch": 903} {"train_loss": -10.97633171081543, "global_step": 151805, "epoch": 903} {"train_loss": -10.93746566772461, "global_step": 151806, "epoch": 903} {"train_loss": -11.127912521362305, "global_step": 151807, "epoch": 903} {"train_loss": -10.932326316833496, "global_step": 151808, "epoch": 903} {"train_loss": -10.949438095092773, "global_step": 151809, "epoch": 903} {"train_loss": -11.115276336669922, "global_step": 151810, "epoch": 903} {"train_loss": -10.667141914367676, "global_step": 151811, "epoch": 903} {"train_loss": -11.084281921386719, "global_step": 151812, "epoch": 903} {"train_loss": -10.671531677246094, "global_step": 151813, "epoch": 903} {"train_loss": -10.979812622070312, "global_step": 151814, "epoch": 903} {"train_loss": -10.969327926635742, "global_step": 151815, "epoch": 903} {"train_loss": -10.242072105407715, "global_step": 151816, "epoch": 903} {"train_loss": -9.464216232299805, "global_step": 151817, "epoch": 903} {"train_loss": -10.849761962890625, "global_step": 151818, "epoch": 903} {"train_loss": -8.91760540008545, "global_step": 151819, "epoch": 903} {"train_loss": -8.791437149047852, "global_step": 151820, "epoch": 903} {"train_loss": -10.44637680053711, "global_step": 151821, "epoch": 903} {"train_loss": -6.198758125305176, "global_step": 151822, "epoch": 903} {"train_loss": -8.521890640258789, "global_step": 151823, "epoch": 903} {"train_loss": -8.370086669921875, "global_step": 151824, "epoch": 903} {"train_loss": -10.529045104980469, "global_step": 151825, "epoch": 903} {"train_loss": -9.089666366577148, "global_step": 151826, "epoch": 903} {"train_loss": -9.960102081298828, "global_step": 151827, "epoch": 903} {"train_loss": -8.599955558776855, "global_step": 151828, "epoch": 903} {"train_loss": -9.07895278930664, "global_step": 151829, "epoch": 903} {"train_loss": -8.744009017944336, "global_step": 151830, "epoch": 903} {"train_loss": -9.637643814086914, "global_step": 151831, "epoch": 903} {"train_loss": -9.182283401489258, "global_step": 151832, "epoch": 903} {"train_loss": -9.606952667236328, "global_step": 151833, "epoch": 903} {"train_loss": -9.906608581542969, "global_step": 151834, "epoch": 903} {"train_loss": -8.552336692810059, "global_step": 151835, "epoch": 903} {"train_loss": -9.841008186340332, "global_step": 151836, "epoch": 903} {"train_loss": -9.663080215454102, "global_step": 151837, "epoch": 903} {"train_loss": -9.504081726074219, "global_step": 151838, "epoch": 903} {"train_loss": -10.219215393066406, "global_step": 151839, "epoch": 903} {"train_loss": -10.031204223632812, "global_step": 151840, "epoch": 903} {"train_loss": -10.037038803100586, "global_step": 151841, "epoch": 903} {"train_loss": -9.814693450927734, "global_step": 151842, "epoch": 903} {"train_loss": -9.784598350524902, "global_step": 151843, "epoch": 903} {"train_loss": -10.282806396484375, "global_step": 151844, "epoch": 903} {"train_loss": -9.896636009216309, "global_step": 151845, "epoch": 903} {"train_loss": -9.759380340576172, "global_step": 151846, "epoch": 903} {"train_loss": -10.288145065307617, "global_step": 151847, "epoch": 903} {"train_loss": -9.965850830078125, "global_step": 151848, "epoch": 903} {"train_loss": -10.33199691772461, "global_step": 151849, "epoch": 903} {"train_loss": -10.527368545532227, "global_step": 151850, "epoch": 903} {"train_loss": -10.26976203918457, "global_step": 151851, "epoch": 903} {"train_loss": -10.305147171020508, "global_step": 151852, "epoch": 903} {"train_loss": -10.212532043457031, "global_step": 151853, "epoch": 903} {"train_loss": -10.303714752197266, "global_step": 151854, "epoch": 903} {"train_loss": -10.484319686889648, "global_step": 151855, "epoch": 903} {"train_loss": -10.389785766601562, "global_step": 151856, "epoch": 903} {"train_loss": -10.427530288696289, "global_step": 151857, "epoch": 903} {"train_loss": -10.534648895263672, "global_step": 151858, "epoch": 903} {"train_loss": -10.295524597167969, "global_step": 151859, "epoch": 903} {"train_loss": -10.648154258728027, "global_step": 151860, "epoch": 903} {"train_loss": -10.493818283081055, "global_step": 151861, "epoch": 903} {"train_loss": -10.490715026855469, "global_step": 151862, "epoch": 903} {"train_loss": -10.719930648803711, "global_step": 151863, "epoch": 903} {"train_loss": -10.29782485961914, "global_step": 151864, "epoch": 903} {"train_loss": -10.507147789001465, "global_step": 151865, "epoch": 903} {"train_loss": -10.705010414123535, "global_step": 151866, "epoch": 903} {"train_loss": -10.602499008178711, "global_step": 151867, "epoch": 903} {"train_loss": -10.682483673095703, "global_step": 151868, "epoch": 903} {"train_loss": -10.580206871032715, "global_step": 151869, "epoch": 903} {"train_loss": -10.676013946533203, "global_step": 151870, "epoch": 903} {"train_loss": -10.472046886171613, "global_step": 151871, "epoch": 903, "val_loss": 219696.53125} {"train_loss": -10.828510284423828, "global_step": 151872, "epoch": 904} {"train_loss": -10.723337173461914, "global_step": 151873, "epoch": 904} {"train_loss": -10.652511596679688, "global_step": 151874, "epoch": 904} {"train_loss": -10.964265823364258, "global_step": 151875, "epoch": 904} {"train_loss": -10.768463134765625, "global_step": 151876, "epoch": 904} {"train_loss": -10.802701950073242, "global_step": 151877, "epoch": 904} {"train_loss": -10.842252731323242, "global_step": 151878, "epoch": 904} {"train_loss": -10.920404434204102, "global_step": 151879, "epoch": 904} {"train_loss": -10.806404113769531, "global_step": 151880, "epoch": 904} {"train_loss": -10.834932327270508, "global_step": 151881, "epoch": 904} {"train_loss": -10.546807289123535, "global_step": 151882, "epoch": 904} {"train_loss": -11.018465042114258, "global_step": 151883, "epoch": 904} {"train_loss": -10.981025695800781, "global_step": 151884, "epoch": 904} {"train_loss": -10.76673698425293, "global_step": 151885, "epoch": 904} {"train_loss": -10.876520156860352, "global_step": 151886, "epoch": 904} {"train_loss": -10.713826179504395, "global_step": 151887, "epoch": 904} {"train_loss": -10.775640487670898, "global_step": 151888, "epoch": 904} {"train_loss": -11.151148796081543, "global_step": 151889, "epoch": 904} {"train_loss": -10.809235572814941, "global_step": 151890, "epoch": 904} {"train_loss": -10.822982788085938, "global_step": 151891, "epoch": 904} {"train_loss": -11.060761451721191, "global_step": 151892, "epoch": 904} {"train_loss": -11.106598854064941, "global_step": 151893, "epoch": 904} {"train_loss": -11.151895523071289, "global_step": 151894, "epoch": 904} {"train_loss": -11.095552444458008, "global_step": 151895, "epoch": 904} {"train_loss": -10.744444847106934, "global_step": 151896, "epoch": 904} {"train_loss": -11.144246101379395, "global_step": 151897, "epoch": 904} {"train_loss": -10.955780029296875, "global_step": 151898, "epoch": 904} {"train_loss": -11.071809768676758, "global_step": 151899, "epoch": 904} {"train_loss": -11.058309555053711, "global_step": 151900, "epoch": 904} {"train_loss": -11.148778915405273, "global_step": 151901, "epoch": 904} {"train_loss": -11.090194702148438, "global_step": 151902, "epoch": 904} {"train_loss": -10.965140342712402, "global_step": 151903, "epoch": 904} {"train_loss": -10.896080017089844, "global_step": 151904, "epoch": 904} {"train_loss": -10.884822845458984, "global_step": 151905, "epoch": 904} {"train_loss": -11.17870807647705, "global_step": 151906, "epoch": 904} {"train_loss": -10.89858627319336, "global_step": 151907, "epoch": 904} {"train_loss": -10.75045394897461, "global_step": 151908, "epoch": 904} {"train_loss": -11.047704696655273, "global_step": 151909, "epoch": 904} {"train_loss": -10.901145935058594, "global_step": 151910, "epoch": 904} {"train_loss": -10.75596809387207, "global_step": 151911, "epoch": 904} {"train_loss": -9.259532928466797, "global_step": 151912, "epoch": 904} {"train_loss": -9.307951927185059, "global_step": 151913, "epoch": 904} {"train_loss": -10.42755126953125, "global_step": 151914, "epoch": 904} {"train_loss": -10.355096817016602, "global_step": 151915, "epoch": 904} {"train_loss": -9.9552001953125, "global_step": 151916, "epoch": 904} {"train_loss": -9.995153427124023, "global_step": 151917, "epoch": 904} {"train_loss": -9.739943504333496, "global_step": 151918, "epoch": 904} {"train_loss": -9.873542785644531, "global_step": 151919, "epoch": 904} {"train_loss": -9.038118362426758, "global_step": 151920, "epoch": 904} {"train_loss": -10.624772071838379, "global_step": 151921, "epoch": 904} {"train_loss": -9.41448974609375, "global_step": 151922, "epoch": 904} {"train_loss": -10.328239440917969, "global_step": 151923, "epoch": 904} {"train_loss": -9.83454704284668, "global_step": 151924, "epoch": 904} {"train_loss": -9.766799926757812, "global_step": 151925, "epoch": 904} {"train_loss": -10.360278129577637, "global_step": 151926, "epoch": 904} {"train_loss": -10.231622695922852, "global_step": 151927, "epoch": 904} {"train_loss": -10.2437744140625, "global_step": 151928, "epoch": 904} {"train_loss": -10.703886032104492, "global_step": 151929, "epoch": 904} {"train_loss": -10.333463668823242, "global_step": 151930, "epoch": 904} {"train_loss": -10.368160247802734, "global_step": 151931, "epoch": 904} {"train_loss": -10.41446304321289, "global_step": 151932, "epoch": 904} {"train_loss": -10.194095611572266, "global_step": 151933, "epoch": 904} {"train_loss": -10.143131256103516, "global_step": 151934, "epoch": 904} {"train_loss": -10.150158882141113, "global_step": 151935, "epoch": 904} {"train_loss": -10.254179000854492, "global_step": 151936, "epoch": 904} {"train_loss": -10.371806144714355, "global_step": 151937, "epoch": 904} {"train_loss": -10.447479248046875, "global_step": 151938, "epoch": 904} {"train_loss": -10.233471870422363, "global_step": 151939, "epoch": 904} {"train_loss": -10.545740127563477, "global_step": 151940, "epoch": 904} {"train_loss": -10.49041748046875, "global_step": 151941, "epoch": 904} {"train_loss": -10.218341827392578, "global_step": 151942, "epoch": 904} {"train_loss": -10.451770782470703, "global_step": 151943, "epoch": 904} {"train_loss": -10.472691535949707, "global_step": 151944, "epoch": 904} {"train_loss": -10.486358642578125, "global_step": 151945, "epoch": 904} {"train_loss": -10.702095031738281, "global_step": 151946, "epoch": 904} {"train_loss": -10.688600540161133, "global_step": 151947, "epoch": 904} {"train_loss": -10.464970588684082, "global_step": 151948, "epoch": 904} {"train_loss": -10.672581672668457, "global_step": 151949, "epoch": 904} {"train_loss": -10.687966346740723, "global_step": 151950, "epoch": 904} {"train_loss": -10.416152954101562, "global_step": 151951, "epoch": 904} {"train_loss": -10.870166778564453, "global_step": 151952, "epoch": 904} {"train_loss": -10.61977767944336, "global_step": 151953, "epoch": 904} {"train_loss": -10.78088092803955, "global_step": 151954, "epoch": 904} {"train_loss": -10.971656799316406, "global_step": 151955, "epoch": 904} {"train_loss": -10.814881324768066, "global_step": 151956, "epoch": 904} {"train_loss": -10.848286628723145, "global_step": 151957, "epoch": 904} {"train_loss": -10.902713775634766, "global_step": 151958, "epoch": 904} {"train_loss": -10.965904235839844, "global_step": 151959, "epoch": 904} {"train_loss": -10.807607650756836, "global_step": 151960, "epoch": 904} {"train_loss": -10.799427032470703, "global_step": 151961, "epoch": 904} {"train_loss": -10.907561302185059, "global_step": 151962, "epoch": 904} {"train_loss": -11.014669418334961, "global_step": 151963, "epoch": 904} {"train_loss": -10.709672927856445, "global_step": 151964, "epoch": 904} {"train_loss": -10.727258682250977, "global_step": 151965, "epoch": 904} {"train_loss": -10.95224666595459, "global_step": 151966, "epoch": 904} {"train_loss": -10.809946060180664, "global_step": 151967, "epoch": 904} {"train_loss": -11.006683349609375, "global_step": 151968, "epoch": 904} {"train_loss": -10.73398494720459, "global_step": 151969, "epoch": 904} {"train_loss": -11.120170593261719, "global_step": 151970, "epoch": 904} {"train_loss": -10.825294494628906, "global_step": 151971, "epoch": 904} {"train_loss": -10.982115745544434, "global_step": 151972, "epoch": 904} {"train_loss": -10.886454582214355, "global_step": 151973, "epoch": 904} {"train_loss": -10.912286758422852, "global_step": 151974, "epoch": 904} {"train_loss": -10.93932056427002, "global_step": 151975, "epoch": 904} {"train_loss": -10.973875045776367, "global_step": 151976, "epoch": 904} {"train_loss": -10.995275497436523, "global_step": 151977, "epoch": 904} {"train_loss": -10.820796966552734, "global_step": 151978, "epoch": 904} {"train_loss": -10.8136568069458, "global_step": 151979, "epoch": 904} {"train_loss": -11.013614654541016, "global_step": 151980, "epoch": 904} {"train_loss": -10.883298873901367, "global_step": 151981, "epoch": 904} {"train_loss": -11.227624893188477, "global_step": 151982, "epoch": 904} {"train_loss": -10.994989395141602, "global_step": 151983, "epoch": 904} {"train_loss": -11.168853759765625, "global_step": 151984, "epoch": 904} {"train_loss": -10.74284553527832, "global_step": 151985, "epoch": 904} {"train_loss": -11.041650772094727, "global_step": 151986, "epoch": 904} {"train_loss": -10.75914478302002, "global_step": 151987, "epoch": 904} {"train_loss": -10.94713020324707, "global_step": 151988, "epoch": 904} {"train_loss": -10.692209243774414, "global_step": 151989, "epoch": 904} {"train_loss": -11.165014266967773, "global_step": 151990, "epoch": 904} {"train_loss": -10.888266563415527, "global_step": 151991, "epoch": 904} {"train_loss": -11.169723510742188, "global_step": 151992, "epoch": 904} {"train_loss": -10.87091064453125, "global_step": 151993, "epoch": 904} {"train_loss": -11.005359649658203, "global_step": 151994, "epoch": 904} {"train_loss": -10.943836212158203, "global_step": 151995, "epoch": 904} {"train_loss": -11.014389038085938, "global_step": 151996, "epoch": 904} {"train_loss": -10.526790618896484, "global_step": 151997, "epoch": 904} {"train_loss": -10.671245574951172, "global_step": 151998, "epoch": 904} {"train_loss": -10.714658737182617, "global_step": 151999, "epoch": 904} {"train_loss": -10.85283088684082, "global_step": 152000, "epoch": 904} {"train_loss": -10.82960319519043, "global_step": 152001, "epoch": 904} {"train_loss": -10.13250732421875, "global_step": 152002, "epoch": 904} {"train_loss": -10.391758918762207, "global_step": 152003, "epoch": 904} {"train_loss": -10.67251968383789, "global_step": 152004, "epoch": 904} {"train_loss": -10.4987211227417, "global_step": 152005, "epoch": 904} {"train_loss": -10.074361801147461, "global_step": 152006, "epoch": 904} {"train_loss": -10.819769859313965, "global_step": 152007, "epoch": 904} {"train_loss": -10.30694580078125, "global_step": 152008, "epoch": 904} {"train_loss": -10.699967384338379, "global_step": 152009, "epoch": 904} {"train_loss": -10.715921401977539, "global_step": 152010, "epoch": 904} {"train_loss": -10.154895782470703, "global_step": 152011, "epoch": 904} {"train_loss": -10.50619125366211, "global_step": 152012, "epoch": 904} {"train_loss": -10.212032318115234, "global_step": 152013, "epoch": 904} {"train_loss": -10.400723457336426, "global_step": 152014, "epoch": 904} {"train_loss": -10.57448959350586, "global_step": 152015, "epoch": 904} {"train_loss": -10.121111869812012, "global_step": 152016, "epoch": 904} {"train_loss": -10.133527755737305, "global_step": 152017, "epoch": 904} {"train_loss": -9.702054977416992, "global_step": 152018, "epoch": 904} {"train_loss": -10.1903076171875, "global_step": 152019, "epoch": 904} {"train_loss": -10.08332633972168, "global_step": 152020, "epoch": 904} {"train_loss": -10.523359298706055, "global_step": 152021, "epoch": 904} {"train_loss": -10.019763946533203, "global_step": 152022, "epoch": 904} {"train_loss": -10.235660552978516, "global_step": 152023, "epoch": 904} {"train_loss": -10.374988555908203, "global_step": 152024, "epoch": 904} {"train_loss": -9.966591835021973, "global_step": 152025, "epoch": 904} {"train_loss": -10.265159606933594, "global_step": 152026, "epoch": 904} {"train_loss": -10.062911987304688, "global_step": 152027, "epoch": 904} {"train_loss": -9.78756332397461, "global_step": 152028, "epoch": 904} {"train_loss": -10.52929401397705, "global_step": 152029, "epoch": 904} {"train_loss": -9.758466720581055, "global_step": 152030, "epoch": 904} {"train_loss": -10.656292915344238, "global_step": 152031, "epoch": 904} {"train_loss": -10.130805969238281, "global_step": 152032, "epoch": 904} {"train_loss": -10.446237564086914, "global_step": 152033, "epoch": 904} {"train_loss": -10.321353912353516, "global_step": 152034, "epoch": 904} {"train_loss": -10.726445198059082, "global_step": 152035, "epoch": 904} {"train_loss": -10.31620979309082, "global_step": 152036, "epoch": 904} {"train_loss": -10.585126876831055, "global_step": 152037, "epoch": 904} {"train_loss": -10.551363945007324, "global_step": 152038, "epoch": 904} {"train_loss": -10.606096227963766, "global_step": 152039, "epoch": 904, "val_loss": 230227.625} {"train_loss": -10.182710647583008, "global_step": 152040, "epoch": 905} {"train_loss": -10.632747650146484, "global_step": 152041, "epoch": 905} {"train_loss": -10.35950756072998, "global_step": 152042, "epoch": 905} {"train_loss": -10.234939575195312, "global_step": 152043, "epoch": 905} {"train_loss": -10.162988662719727, "global_step": 152044, "epoch": 905} {"train_loss": -10.057732582092285, "global_step": 152045, "epoch": 905} {"train_loss": -9.94555377960205, "global_step": 152046, "epoch": 905} {"train_loss": -10.430978775024414, "global_step": 152047, "epoch": 905} {"train_loss": -10.14021110534668, "global_step": 152048, "epoch": 905} {"train_loss": -10.700502395629883, "global_step": 152049, "epoch": 905} {"train_loss": -10.047861099243164, "global_step": 152050, "epoch": 905} {"train_loss": -10.65986156463623, "global_step": 152051, "epoch": 905} {"train_loss": -10.359468460083008, "global_step": 152052, "epoch": 905} {"train_loss": -10.55740737915039, "global_step": 152053, "epoch": 905} {"train_loss": -10.625579833984375, "global_step": 152054, "epoch": 905} {"train_loss": -10.781414031982422, "global_step": 152055, "epoch": 905} {"train_loss": -10.466201782226562, "global_step": 152056, "epoch": 905} {"train_loss": -10.616776466369629, "global_step": 152057, "epoch": 905} {"train_loss": -10.63546085357666, "global_step": 152058, "epoch": 905} {"train_loss": -10.740142822265625, "global_step": 152059, "epoch": 905} {"train_loss": -10.391508102416992, "global_step": 152060, "epoch": 905} {"train_loss": -10.714158058166504, "global_step": 152061, "epoch": 905} {"train_loss": -10.503567695617676, "global_step": 152062, "epoch": 905} {"train_loss": -10.616741180419922, "global_step": 152063, "epoch": 905} {"train_loss": -10.712453842163086, "global_step": 152064, "epoch": 905} {"train_loss": -10.806707382202148, "global_step": 152065, "epoch": 905} {"train_loss": -10.489208221435547, "global_step": 152066, "epoch": 905} {"train_loss": -10.770295143127441, "global_step": 152067, "epoch": 905} {"train_loss": -10.65611743927002, "global_step": 152068, "epoch": 905} {"train_loss": -10.619439125061035, "global_step": 152069, "epoch": 905} {"train_loss": -10.854066848754883, "global_step": 152070, "epoch": 905} {"train_loss": -10.733383178710938, "global_step": 152071, "epoch": 905} {"train_loss": -10.846600532531738, "global_step": 152072, "epoch": 905} {"train_loss": -10.99635124206543, "global_step": 152073, "epoch": 905} {"train_loss": -10.836514472961426, "global_step": 152074, "epoch": 905} {"train_loss": -10.980890274047852, "global_step": 152075, "epoch": 905} {"train_loss": -10.767068862915039, "global_step": 152076, "epoch": 905} {"train_loss": -10.933382987976074, "global_step": 152077, "epoch": 905} {"train_loss": -11.126810073852539, "global_step": 152078, "epoch": 905} {"train_loss": -10.934932708740234, "global_step": 152079, "epoch": 905} {"train_loss": -10.999921798706055, "global_step": 152080, "epoch": 905} {"train_loss": -10.826737403869629, "global_step": 152081, "epoch": 905} {"train_loss": -10.642545700073242, "global_step": 152082, "epoch": 905} {"train_loss": -10.680761337280273, "global_step": 152083, "epoch": 905} {"train_loss": -10.51595401763916, "global_step": 152084, "epoch": 905} {"train_loss": -10.535072326660156, "global_step": 152085, "epoch": 905} {"train_loss": -10.677298545837402, "global_step": 152086, "epoch": 905} {"train_loss": -10.385538101196289, "global_step": 152087, "epoch": 905} {"train_loss": -10.7771577835083, "global_step": 152088, "epoch": 905} {"train_loss": -10.238412857055664, "global_step": 152089, "epoch": 905} {"train_loss": -10.455333709716797, "global_step": 152090, "epoch": 905} {"train_loss": -10.909832000732422, "global_step": 152091, "epoch": 905} {"train_loss": -10.366734504699707, "global_step": 152092, "epoch": 905} {"train_loss": -11.062395095825195, "global_step": 152093, "epoch": 905} {"train_loss": -10.090319633483887, "global_step": 152094, "epoch": 905} {"train_loss": -10.999749183654785, "global_step": 152095, "epoch": 905} {"train_loss": -10.374550819396973, "global_step": 152096, "epoch": 905} {"train_loss": -10.310291290283203, "global_step": 152097, "epoch": 905} {"train_loss": -10.893641471862793, "global_step": 152098, "epoch": 905} {"train_loss": -10.770444869995117, "global_step": 152099, "epoch": 905} {"train_loss": -10.787117958068848, "global_step": 152100, "epoch": 905} {"train_loss": -10.657901763916016, "global_step": 152101, "epoch": 905} {"train_loss": -11.038616180419922, "global_step": 152102, "epoch": 905} {"train_loss": -10.673040390014648, "global_step": 152103, "epoch": 905} {"train_loss": -10.619617462158203, "global_step": 152104, "epoch": 905} {"train_loss": -10.923033714294434, "global_step": 152105, "epoch": 905} {"train_loss": -10.618488311767578, "global_step": 152106, "epoch": 905} {"train_loss": -10.774380683898926, "global_step": 152107, "epoch": 905} {"train_loss": -10.649632453918457, "global_step": 152108, "epoch": 905} {"train_loss": -10.498299598693848, "global_step": 152109, "epoch": 905} {"train_loss": -10.950674057006836, "global_step": 152110, "epoch": 905} {"train_loss": -10.610034942626953, "global_step": 152111, "epoch": 905} {"train_loss": -10.900782585144043, "global_step": 152112, "epoch": 905} {"train_loss": -10.895963668823242, "global_step": 152113, "epoch": 905} {"train_loss": -10.677443504333496, "global_step": 152114, "epoch": 905} {"train_loss": -10.913256645202637, "global_step": 152115, "epoch": 905} {"train_loss": -10.50904655456543, "global_step": 152116, "epoch": 905} {"train_loss": -10.787384033203125, "global_step": 152117, "epoch": 905} {"train_loss": -10.755481719970703, "global_step": 152118, "epoch": 905} {"train_loss": -10.64057445526123, "global_step": 152119, "epoch": 905} {"train_loss": -10.846592903137207, "global_step": 152120, "epoch": 905} {"train_loss": -10.869450569152832, "global_step": 152121, "epoch": 905} {"train_loss": -10.834646224975586, "global_step": 152122, "epoch": 905} {"train_loss": -10.867512702941895, "global_step": 152123, "epoch": 905} {"train_loss": -10.669846534729004, "global_step": 152124, "epoch": 905} {"train_loss": -11.126031875610352, "global_step": 152125, "epoch": 905} {"train_loss": -10.970544815063477, "global_step": 152126, "epoch": 905} {"train_loss": -10.960397720336914, "global_step": 152127, "epoch": 905} {"train_loss": -10.88320255279541, "global_step": 152128, "epoch": 905} {"train_loss": -10.523615837097168, "global_step": 152129, "epoch": 905} {"train_loss": -10.880041122436523, "global_step": 152130, "epoch": 905} {"train_loss": -10.247047424316406, "global_step": 152131, "epoch": 905} {"train_loss": -10.212486267089844, "global_step": 152132, "epoch": 905} {"train_loss": -10.901212692260742, "global_step": 152133, "epoch": 905} {"train_loss": -10.04538345336914, "global_step": 152134, "epoch": 905} {"train_loss": -10.701944351196289, "global_step": 152135, "epoch": 905} {"train_loss": -10.483912467956543, "global_step": 152136, "epoch": 905} {"train_loss": -10.218127250671387, "global_step": 152137, "epoch": 905} {"train_loss": -10.883119583129883, "global_step": 152138, "epoch": 905} {"train_loss": -10.184664726257324, "global_step": 152139, "epoch": 905} {"train_loss": -10.412410736083984, "global_step": 152140, "epoch": 905} {"train_loss": -10.644530296325684, "global_step": 152141, "epoch": 905} {"train_loss": -10.372968673706055, "global_step": 152142, "epoch": 905} {"train_loss": -10.660468101501465, "global_step": 152143, "epoch": 905} {"train_loss": -10.459864616394043, "global_step": 152144, "epoch": 905} {"train_loss": -10.904212951660156, "global_step": 152145, "epoch": 905} {"train_loss": -10.423649787902832, "global_step": 152146, "epoch": 905} {"train_loss": -10.63461685180664, "global_step": 152147, "epoch": 905} {"train_loss": -10.437082290649414, "global_step": 152148, "epoch": 905} {"train_loss": -10.491145133972168, "global_step": 152149, "epoch": 905} {"train_loss": -10.36365032196045, "global_step": 152150, "epoch": 905} {"train_loss": -10.363592147827148, "global_step": 152151, "epoch": 905} {"train_loss": -10.332107543945312, "global_step": 152152, "epoch": 905} {"train_loss": -10.465412139892578, "global_step": 152153, "epoch": 905} {"train_loss": -10.323591232299805, "global_step": 152154, "epoch": 905} {"train_loss": -10.416223526000977, "global_step": 152155, "epoch": 905} {"train_loss": -10.476295471191406, "global_step": 152156, "epoch": 905} {"train_loss": -10.039579391479492, "global_step": 152157, "epoch": 905} {"train_loss": -10.855279922485352, "global_step": 152158, "epoch": 905} {"train_loss": -10.483530044555664, "global_step": 152159, "epoch": 905} {"train_loss": -10.885140419006348, "global_step": 152160, "epoch": 905} {"train_loss": -10.487442016601562, "global_step": 152161, "epoch": 905} {"train_loss": -10.394277572631836, "global_step": 152162, "epoch": 905} {"train_loss": -10.467880249023438, "global_step": 152163, "epoch": 905} {"train_loss": -10.555463790893555, "global_step": 152164, "epoch": 905} {"train_loss": -10.612403869628906, "global_step": 152165, "epoch": 905} {"train_loss": -10.522126197814941, "global_step": 152166, "epoch": 905} {"train_loss": -10.303709030151367, "global_step": 152167, "epoch": 905} {"train_loss": -10.629804611206055, "global_step": 152168, "epoch": 905} {"train_loss": -10.925341606140137, "global_step": 152169, "epoch": 905} {"train_loss": -10.54223918914795, "global_step": 152170, "epoch": 905} {"train_loss": -10.67191219329834, "global_step": 152171, "epoch": 905} {"train_loss": -10.645837783813477, "global_step": 152172, "epoch": 905} {"train_loss": -10.311856269836426, "global_step": 152173, "epoch": 905} {"train_loss": -10.905599594116211, "global_step": 152174, "epoch": 905} {"train_loss": -10.723577499389648, "global_step": 152175, "epoch": 905} {"train_loss": -10.894453048706055, "global_step": 152176, "epoch": 905} {"train_loss": -10.794492721557617, "global_step": 152177, "epoch": 905} {"train_loss": -10.820287704467773, "global_step": 152178, "epoch": 905} {"train_loss": -10.838088989257812, "global_step": 152179, "epoch": 905} {"train_loss": -10.913419723510742, "global_step": 152180, "epoch": 905} {"train_loss": -10.872184753417969, "global_step": 152181, "epoch": 905} {"train_loss": -10.821878433227539, "global_step": 152182, "epoch": 905} {"train_loss": -10.85015869140625, "global_step": 152183, "epoch": 905} {"train_loss": -11.033013343811035, "global_step": 152184, "epoch": 905} {"train_loss": -10.705820083618164, "global_step": 152185, "epoch": 905} {"train_loss": -10.73297119140625, "global_step": 152186, "epoch": 905} {"train_loss": -10.879858016967773, "global_step": 152187, "epoch": 905} {"train_loss": -10.887818336486816, "global_step": 152188, "epoch": 905} {"train_loss": -10.857110977172852, "global_step": 152189, "epoch": 905} {"train_loss": -10.70921516418457, "global_step": 152190, "epoch": 905} {"train_loss": -10.717083930969238, "global_step": 152191, "epoch": 905} {"train_loss": -10.879899978637695, "global_step": 152192, "epoch": 905} {"train_loss": -10.94743537902832, "global_step": 152193, "epoch": 905} {"train_loss": -10.771888732910156, "global_step": 152194, "epoch": 905} {"train_loss": -10.996625900268555, "global_step": 152195, "epoch": 905} {"train_loss": -10.690017700195312, "global_step": 152196, "epoch": 905} {"train_loss": -10.97297191619873, "global_step": 152197, "epoch": 905} {"train_loss": -10.73592472076416, "global_step": 152198, "epoch": 905} {"train_loss": -10.692461013793945, "global_step": 152199, "epoch": 905} {"train_loss": -10.87500286102295, "global_step": 152200, "epoch": 905} {"train_loss": -10.422245025634766, "global_step": 152201, "epoch": 905} {"train_loss": -10.528972625732422, "global_step": 152202, "epoch": 905} {"train_loss": -11.015769958496094, "global_step": 152203, "epoch": 905} {"train_loss": -10.566854476928711, "global_step": 152204, "epoch": 905} {"train_loss": -10.853578567504883, "global_step": 152205, "epoch": 905} {"train_loss": -10.798816680908203, "global_step": 152206, "epoch": 905} {"train_loss": -10.650597424734206, "global_step": 152207, "epoch": 905, "val_loss": 230662.0625, "train_action_mse_error": 1.7092193365097046} {"train_loss": -10.947015762329102, "global_step": 152208, "epoch": 906} {"train_loss": -10.979562759399414, "global_step": 152209, "epoch": 906} {"train_loss": -11.210968017578125, "global_step": 152210, "epoch": 906} {"train_loss": -10.890249252319336, "global_step": 152211, "epoch": 906} {"train_loss": -10.942645072937012, "global_step": 152212, "epoch": 906} {"train_loss": -11.009410858154297, "global_step": 152213, "epoch": 906} {"train_loss": -10.941349029541016, "global_step": 152214, "epoch": 906} {"train_loss": -11.042734146118164, "global_step": 152215, "epoch": 906} {"train_loss": -11.0224027633667, "global_step": 152216, "epoch": 906} {"train_loss": -10.873462677001953, "global_step": 152217, "epoch": 906} {"train_loss": -10.873307228088379, "global_step": 152218, "epoch": 906} {"train_loss": -10.92673397064209, "global_step": 152219, "epoch": 906} {"train_loss": -10.168248176574707, "global_step": 152220, "epoch": 906} {"train_loss": -10.812967300415039, "global_step": 152221, "epoch": 906} {"train_loss": -10.951913833618164, "global_step": 152222, "epoch": 906} {"train_loss": -10.236237525939941, "global_step": 152223, "epoch": 906} {"train_loss": -10.861486434936523, "global_step": 152224, "epoch": 906} {"train_loss": -10.817415237426758, "global_step": 152225, "epoch": 906} {"train_loss": -10.290634155273438, "global_step": 152226, "epoch": 906} {"train_loss": -10.647941589355469, "global_step": 152227, "epoch": 906} {"train_loss": -10.731008529663086, "global_step": 152228, "epoch": 906} {"train_loss": -10.944801330566406, "global_step": 152229, "epoch": 906} {"train_loss": -10.333288192749023, "global_step": 152230, "epoch": 906} {"train_loss": -11.114242553710938, "global_step": 152231, "epoch": 906} {"train_loss": -10.171686172485352, "global_step": 152232, "epoch": 906} {"train_loss": -10.575819969177246, "global_step": 152233, "epoch": 906} {"train_loss": -10.760910987854004, "global_step": 152234, "epoch": 906} {"train_loss": -10.691991806030273, "global_step": 152235, "epoch": 906} {"train_loss": -11.000444412231445, "global_step": 152236, "epoch": 906} {"train_loss": -10.03687858581543, "global_step": 152237, "epoch": 906} {"train_loss": -10.45020866394043, "global_step": 152238, "epoch": 906} {"train_loss": -10.59959602355957, "global_step": 152239, "epoch": 906} {"train_loss": -9.874130249023438, "global_step": 152240, "epoch": 906} {"train_loss": -10.4126558303833, "global_step": 152241, "epoch": 906} {"train_loss": -10.584871292114258, "global_step": 152242, "epoch": 906} {"train_loss": -10.117083549499512, "global_step": 152243, "epoch": 906} {"train_loss": -10.734636306762695, "global_step": 152244, "epoch": 906} {"train_loss": -10.828878402709961, "global_step": 152245, "epoch": 906} {"train_loss": -10.565053939819336, "global_step": 152246, "epoch": 906} {"train_loss": -10.592130661010742, "global_step": 152247, "epoch": 906} {"train_loss": -10.718374252319336, "global_step": 152248, "epoch": 906} {"train_loss": -10.848548889160156, "global_step": 152249, "epoch": 906} {"train_loss": -10.829972267150879, "global_step": 152250, "epoch": 906} {"train_loss": -10.298609733581543, "global_step": 152251, "epoch": 906} {"train_loss": -10.86147403717041, "global_step": 152252, "epoch": 906} {"train_loss": -10.767704010009766, "global_step": 152253, "epoch": 906} {"train_loss": -10.820324897766113, "global_step": 152254, "epoch": 906} {"train_loss": -10.504366874694824, "global_step": 152255, "epoch": 906} {"train_loss": -10.64573860168457, "global_step": 152256, "epoch": 906} {"train_loss": -10.562215805053711, "global_step": 152257, "epoch": 906} {"train_loss": -10.381694793701172, "global_step": 152258, "epoch": 906} {"train_loss": -10.834131240844727, "global_step": 152259, "epoch": 906} {"train_loss": -10.772303581237793, "global_step": 152260, "epoch": 906} {"train_loss": -10.76407527923584, "global_step": 152261, "epoch": 906} {"train_loss": -10.718297958374023, "global_step": 152262, "epoch": 906} {"train_loss": -10.818231582641602, "global_step": 152263, "epoch": 906} {"train_loss": -10.937251091003418, "global_step": 152264, "epoch": 906} {"train_loss": -10.901843070983887, "global_step": 152265, "epoch": 906} {"train_loss": -11.021909713745117, "global_step": 152266, "epoch": 906} {"train_loss": -10.953839302062988, "global_step": 152267, "epoch": 906} {"train_loss": -11.179344177246094, "global_step": 152268, "epoch": 906} {"train_loss": -11.008600234985352, "global_step": 152269, "epoch": 906} {"train_loss": -10.94514274597168, "global_step": 152270, "epoch": 906} {"train_loss": -11.198078155517578, "global_step": 152271, "epoch": 906} {"train_loss": -10.768082618713379, "global_step": 152272, "epoch": 906} {"train_loss": -11.058757781982422, "global_step": 152273, "epoch": 906} {"train_loss": -10.819225311279297, "global_step": 152274, "epoch": 906} {"train_loss": -10.850677490234375, "global_step": 152275, "epoch": 906} {"train_loss": -10.978538513183594, "global_step": 152276, "epoch": 906} {"train_loss": -10.694416999816895, "global_step": 152277, "epoch": 906} {"train_loss": -11.069914817810059, "global_step": 152278, "epoch": 906} {"train_loss": -10.904886245727539, "global_step": 152279, "epoch": 906} {"train_loss": -10.952062606811523, "global_step": 152280, "epoch": 906} {"train_loss": -11.049423217773438, "global_step": 152281, "epoch": 906} {"train_loss": -10.994247436523438, "global_step": 152282, "epoch": 906} {"train_loss": -11.261094093322754, "global_step": 152283, "epoch": 906} {"train_loss": -11.007896423339844, "global_step": 152284, "epoch": 906} {"train_loss": -11.067747116088867, "global_step": 152285, "epoch": 906} {"train_loss": -10.849766731262207, "global_step": 152286, "epoch": 906} {"train_loss": -11.039422988891602, "global_step": 152287, "epoch": 906} {"train_loss": -10.980329513549805, "global_step": 152288, "epoch": 906} {"train_loss": -11.06772232055664, "global_step": 152289, "epoch": 906} {"train_loss": -11.287232398986816, "global_step": 152290, "epoch": 906} {"train_loss": -11.14166259765625, "global_step": 152291, "epoch": 906} {"train_loss": -11.135640144348145, "global_step": 152292, "epoch": 906} {"train_loss": -10.953232765197754, "global_step": 152293, "epoch": 906} {"train_loss": -10.8037691116333, "global_step": 152294, "epoch": 906} {"train_loss": -10.922518730163574, "global_step": 152295, "epoch": 906} {"train_loss": -11.00606918334961, "global_step": 152296, "epoch": 906} {"train_loss": -10.090095520019531, "global_step": 152297, "epoch": 906} {"train_loss": -11.020270347595215, "global_step": 152298, "epoch": 906} {"train_loss": -10.099531173706055, "global_step": 152299, "epoch": 906} {"train_loss": -10.599540710449219, "global_step": 152300, "epoch": 906} {"train_loss": -10.617216110229492, "global_step": 152301, "epoch": 906} {"train_loss": -10.386842727661133, "global_step": 152302, "epoch": 906} {"train_loss": -10.296976089477539, "global_step": 152303, "epoch": 906} {"train_loss": -10.956997871398926, "global_step": 152304, "epoch": 906} {"train_loss": -10.469895362854004, "global_step": 152305, "epoch": 906} {"train_loss": -10.212217330932617, "global_step": 152306, "epoch": 906} {"train_loss": -10.275376319885254, "global_step": 152307, "epoch": 906} {"train_loss": -10.792960166931152, "global_step": 152308, "epoch": 906} {"train_loss": -10.299585342407227, "global_step": 152309, "epoch": 906} {"train_loss": -10.638895034790039, "global_step": 152310, "epoch": 906} {"train_loss": -10.582450866699219, "global_step": 152311, "epoch": 906} {"train_loss": -10.773994445800781, "global_step": 152312, "epoch": 906} {"train_loss": -10.839971542358398, "global_step": 152313, "epoch": 906} {"train_loss": -10.796647071838379, "global_step": 152314, "epoch": 906} {"train_loss": -10.78695011138916, "global_step": 152315, "epoch": 906} {"train_loss": -10.678055763244629, "global_step": 152316, "epoch": 906} {"train_loss": -10.513628959655762, "global_step": 152317, "epoch": 906} {"train_loss": -10.522262573242188, "global_step": 152318, "epoch": 906} {"train_loss": -10.900182723999023, "global_step": 152319, "epoch": 906} {"train_loss": -10.566466331481934, "global_step": 152320, "epoch": 906} {"train_loss": -10.859007835388184, "global_step": 152321, "epoch": 906} {"train_loss": -10.964359283447266, "global_step": 152322, "epoch": 906} {"train_loss": -10.650399208068848, "global_step": 152323, "epoch": 906} {"train_loss": -10.520844459533691, "global_step": 152324, "epoch": 906} {"train_loss": -10.907319068908691, "global_step": 152325, "epoch": 906} {"train_loss": -10.864982604980469, "global_step": 152326, "epoch": 906} {"train_loss": -10.985099792480469, "global_step": 152327, "epoch": 906} {"train_loss": -10.610130310058594, "global_step": 152328, "epoch": 906} {"train_loss": -10.7660551071167, "global_step": 152329, "epoch": 906} {"train_loss": -11.09556770324707, "global_step": 152330, "epoch": 906} {"train_loss": -10.85529613494873, "global_step": 152331, "epoch": 906} {"train_loss": -10.793805122375488, "global_step": 152332, "epoch": 906} {"train_loss": -10.822786331176758, "global_step": 152333, "epoch": 906} {"train_loss": -10.693963050842285, "global_step": 152334, "epoch": 906} {"train_loss": -10.906207084655762, "global_step": 152335, "epoch": 906} {"train_loss": -10.809589385986328, "global_step": 152336, "epoch": 906} {"train_loss": -10.597999572753906, "global_step": 152337, "epoch": 906} {"train_loss": -10.798076629638672, "global_step": 152338, "epoch": 906} {"train_loss": -10.874238967895508, "global_step": 152339, "epoch": 906} {"train_loss": -10.702320098876953, "global_step": 152340, "epoch": 906} {"train_loss": -10.912324905395508, "global_step": 152341, "epoch": 906} {"train_loss": -10.768546104431152, "global_step": 152342, "epoch": 906} {"train_loss": -11.145242691040039, "global_step": 152343, "epoch": 906} {"train_loss": -11.007170677185059, "global_step": 152344, "epoch": 906} {"train_loss": -10.899255752563477, "global_step": 152345, "epoch": 906} {"train_loss": -11.02524185180664, "global_step": 152346, "epoch": 906} {"train_loss": -10.762452125549316, "global_step": 152347, "epoch": 906} {"train_loss": -10.782991409301758, "global_step": 152348, "epoch": 906} {"train_loss": -10.816597938537598, "global_step": 152349, "epoch": 906} {"train_loss": -10.314104080200195, "global_step": 152350, "epoch": 906} {"train_loss": -10.69244384765625, "global_step": 152351, "epoch": 906} {"train_loss": -10.6616849899292, "global_step": 152352, "epoch": 906} {"train_loss": -10.202431678771973, "global_step": 152353, "epoch": 906} {"train_loss": -10.631872177124023, "global_step": 152354, "epoch": 906} {"train_loss": -10.224174499511719, "global_step": 152355, "epoch": 906} {"train_loss": -11.022300720214844, "global_step": 152356, "epoch": 906} {"train_loss": -10.457006454467773, "global_step": 152357, "epoch": 906} {"train_loss": -10.458032608032227, "global_step": 152358, "epoch": 906} {"train_loss": -10.715075492858887, "global_step": 152359, "epoch": 906} {"train_loss": -10.108949661254883, "global_step": 152360, "epoch": 906} {"train_loss": -10.594433784484863, "global_step": 152361, "epoch": 906} {"train_loss": -10.068647384643555, "global_step": 152362, "epoch": 906} {"train_loss": -10.751077651977539, "global_step": 152363, "epoch": 906} {"train_loss": -10.355905532836914, "global_step": 152364, "epoch": 906} {"train_loss": -10.499591827392578, "global_step": 152365, "epoch": 906} {"train_loss": -10.84745979309082, "global_step": 152366, "epoch": 906} {"train_loss": -10.513681411743164, "global_step": 152367, "epoch": 906} {"train_loss": -10.817239761352539, "global_step": 152368, "epoch": 906} {"train_loss": -10.461450576782227, "global_step": 152369, "epoch": 906} {"train_loss": -10.845118522644043, "global_step": 152370, "epoch": 906} {"train_loss": -10.652795791625977, "global_step": 152371, "epoch": 906} {"train_loss": -10.807619094848633, "global_step": 152372, "epoch": 906} {"train_loss": -10.797246932983398, "global_step": 152373, "epoch": 906} {"train_loss": -10.637964248657227, "global_step": 152374, "epoch": 906} {"train_loss": -10.737465427035378, "global_step": 152375, "epoch": 906, "val_loss": 233781.09375} {"train_loss": -10.703852653503418, "global_step": 152376, "epoch": 907} {"train_loss": -10.485623359680176, "global_step": 152377, "epoch": 907} {"train_loss": -10.413873672485352, "global_step": 152378, "epoch": 907} {"train_loss": -10.653711318969727, "global_step": 152379, "epoch": 907} {"train_loss": -10.469057083129883, "global_step": 152380, "epoch": 907} {"train_loss": -10.510604858398438, "global_step": 152381, "epoch": 907} {"train_loss": -10.736063003540039, "global_step": 152382, "epoch": 907} {"train_loss": -10.479507446289062, "global_step": 152383, "epoch": 907} {"train_loss": -10.993688583374023, "global_step": 152384, "epoch": 907} {"train_loss": -10.40329360961914, "global_step": 152385, "epoch": 907} {"train_loss": -10.911564826965332, "global_step": 152386, "epoch": 907} {"train_loss": -10.76971435546875, "global_step": 152387, "epoch": 907} {"train_loss": -10.522614479064941, "global_step": 152388, "epoch": 907} {"train_loss": -10.821867942810059, "global_step": 152389, "epoch": 907} {"train_loss": -10.693992614746094, "global_step": 152390, "epoch": 907} {"train_loss": -10.858017921447754, "global_step": 152391, "epoch": 907} {"train_loss": -10.914592742919922, "global_step": 152392, "epoch": 907} {"train_loss": -10.916610717773438, "global_step": 152393, "epoch": 907} {"train_loss": -10.741188049316406, "global_step": 152394, "epoch": 907} {"train_loss": -10.660479545593262, "global_step": 152395, "epoch": 907} {"train_loss": -10.514930725097656, "global_step": 152396, "epoch": 907} {"train_loss": -10.493940353393555, "global_step": 152397, "epoch": 907} {"train_loss": -10.84146785736084, "global_step": 152398, "epoch": 907} {"train_loss": -10.946479797363281, "global_step": 152399, "epoch": 907} {"train_loss": -10.924629211425781, "global_step": 152400, "epoch": 907} {"train_loss": -10.637639999389648, "global_step": 152401, "epoch": 907} {"train_loss": -10.428173065185547, "global_step": 152402, "epoch": 907} {"train_loss": -10.81721305847168, "global_step": 152403, "epoch": 907} {"train_loss": -10.177957534790039, "global_step": 152404, "epoch": 907} {"train_loss": -10.361127853393555, "global_step": 152405, "epoch": 907} {"train_loss": -10.718778610229492, "global_step": 152406, "epoch": 907} {"train_loss": -10.436744689941406, "global_step": 152407, "epoch": 907} {"train_loss": -10.908746719360352, "global_step": 152408, "epoch": 907} {"train_loss": -9.988140106201172, "global_step": 152409, "epoch": 907} {"train_loss": -10.726032257080078, "global_step": 152410, "epoch": 907} {"train_loss": -10.504878997802734, "global_step": 152411, "epoch": 907} {"train_loss": -10.53976821899414, "global_step": 152412, "epoch": 907} {"train_loss": -10.568739891052246, "global_step": 152413, "epoch": 907} {"train_loss": -10.736949920654297, "global_step": 152414, "epoch": 907} {"train_loss": -10.339635848999023, "global_step": 152415, "epoch": 907} {"train_loss": -10.557356834411621, "global_step": 152416, "epoch": 907} {"train_loss": -10.33525276184082, "global_step": 152417, "epoch": 907} {"train_loss": -10.985274314880371, "global_step": 152418, "epoch": 907} {"train_loss": -10.762775421142578, "global_step": 152419, "epoch": 907} {"train_loss": -11.045103073120117, "global_step": 152420, "epoch": 907} {"train_loss": -10.760017395019531, "global_step": 152421, "epoch": 907} {"train_loss": -10.650714874267578, "global_step": 152422, "epoch": 907} {"train_loss": -10.708761215209961, "global_step": 152423, "epoch": 907} {"train_loss": -10.801151275634766, "global_step": 152424, "epoch": 907} {"train_loss": -10.357196807861328, "global_step": 152425, "epoch": 907} {"train_loss": -10.645445823669434, "global_step": 152426, "epoch": 907} {"train_loss": -10.499602317810059, "global_step": 152427, "epoch": 907} {"train_loss": -11.016218185424805, "global_step": 152428, "epoch": 907} {"train_loss": -10.524928092956543, "global_step": 152429, "epoch": 907} {"train_loss": -10.446128845214844, "global_step": 152430, "epoch": 907} {"train_loss": -10.783124923706055, "global_step": 152431, "epoch": 907} {"train_loss": -10.318656921386719, "global_step": 152432, "epoch": 907} {"train_loss": -10.805437088012695, "global_step": 152433, "epoch": 907} {"train_loss": -10.540996551513672, "global_step": 152434, "epoch": 907} {"train_loss": -10.649503707885742, "global_step": 152435, "epoch": 907} {"train_loss": -10.89680290222168, "global_step": 152436, "epoch": 907} {"train_loss": -10.578125953674316, "global_step": 152437, "epoch": 907} {"train_loss": -10.628072738647461, "global_step": 152438, "epoch": 907} {"train_loss": -11.011709213256836, "global_step": 152439, "epoch": 907} {"train_loss": -10.635589599609375, "global_step": 152440, "epoch": 907} {"train_loss": -10.990073204040527, "global_step": 152441, "epoch": 907} {"train_loss": -10.573476791381836, "global_step": 152442, "epoch": 907} {"train_loss": -10.978926658630371, "global_step": 152443, "epoch": 907} {"train_loss": -11.161404609680176, "global_step": 152444, "epoch": 907} {"train_loss": -10.846761703491211, "global_step": 152445, "epoch": 907} {"train_loss": -10.855704307556152, "global_step": 152446, "epoch": 907} {"train_loss": -10.972749710083008, "global_step": 152447, "epoch": 907} {"train_loss": -10.823567390441895, "global_step": 152448, "epoch": 907} {"train_loss": -10.915205001831055, "global_step": 152449, "epoch": 907} {"train_loss": -10.91281795501709, "global_step": 152450, "epoch": 907} {"train_loss": -11.022726058959961, "global_step": 152451, "epoch": 907} {"train_loss": -11.052331924438477, "global_step": 152452, "epoch": 907} {"train_loss": -10.680684089660645, "global_step": 152453, "epoch": 907} {"train_loss": -11.103297233581543, "global_step": 152454, "epoch": 907} {"train_loss": -10.6431245803833, "global_step": 152455, "epoch": 907} {"train_loss": -10.942331314086914, "global_step": 152456, "epoch": 907} {"train_loss": -10.766304969787598, "global_step": 152457, "epoch": 907} {"train_loss": -10.722156524658203, "global_step": 152458, "epoch": 907} {"train_loss": -10.970263481140137, "global_step": 152459, "epoch": 907} {"train_loss": -10.752800941467285, "global_step": 152460, "epoch": 907} {"train_loss": -11.0360746383667, "global_step": 152461, "epoch": 907} {"train_loss": -11.054435729980469, "global_step": 152462, "epoch": 907} {"train_loss": -11.119141578674316, "global_step": 152463, "epoch": 907} {"train_loss": -10.784432411193848, "global_step": 152464, "epoch": 907} {"train_loss": -10.924541473388672, "global_step": 152465, "epoch": 907} {"train_loss": -11.08138656616211, "global_step": 152466, "epoch": 907} {"train_loss": -10.857503890991211, "global_step": 152467, "epoch": 907} {"train_loss": -11.252595901489258, "global_step": 152468, "epoch": 907} {"train_loss": -10.859889030456543, "global_step": 152469, "epoch": 907} {"train_loss": -10.992694854736328, "global_step": 152470, "epoch": 907} {"train_loss": -10.86888599395752, "global_step": 152471, "epoch": 907} {"train_loss": -11.128975868225098, "global_step": 152472, "epoch": 907} {"train_loss": -10.696370124816895, "global_step": 152473, "epoch": 907} {"train_loss": -10.815536499023438, "global_step": 152474, "epoch": 907} {"train_loss": -11.16573429107666, "global_step": 152475, "epoch": 907} {"train_loss": -11.069990158081055, "global_step": 152476, "epoch": 907} {"train_loss": -10.70508098602295, "global_step": 152477, "epoch": 907} {"train_loss": -9.804037094116211, "global_step": 152478, "epoch": 907} {"train_loss": -9.912118911743164, "global_step": 152479, "epoch": 907} {"train_loss": -10.377742767333984, "global_step": 152480, "epoch": 907} {"train_loss": -7.981984615325928, "global_step": 152481, "epoch": 907} {"train_loss": -9.960721969604492, "global_step": 152482, "epoch": 907} {"train_loss": -9.043960571289062, "global_step": 152483, "epoch": 907} {"train_loss": -8.619956016540527, "global_step": 152484, "epoch": 907} {"train_loss": -8.470848083496094, "global_step": 152485, "epoch": 907} {"train_loss": -9.116546630859375, "global_step": 152486, "epoch": 907} {"train_loss": -7.809307098388672, "global_step": 152487, "epoch": 907} {"train_loss": -8.995615005493164, "global_step": 152488, "epoch": 907} {"train_loss": -7.512248516082764, "global_step": 152489, "epoch": 907} {"train_loss": -9.183987617492676, "global_step": 152490, "epoch": 907} {"train_loss": -9.096097946166992, "global_step": 152491, "epoch": 907} {"train_loss": -9.442946434020996, "global_step": 152492, "epoch": 907} {"train_loss": -10.414590835571289, "global_step": 152493, "epoch": 907} {"train_loss": -9.60794448852539, "global_step": 152494, "epoch": 907} {"train_loss": -9.653799057006836, "global_step": 152495, "epoch": 907} {"train_loss": -10.05294418334961, "global_step": 152496, "epoch": 907} {"train_loss": -9.675418853759766, "global_step": 152497, "epoch": 907} {"train_loss": -10.311866760253906, "global_step": 152498, "epoch": 907} {"train_loss": -10.193741798400879, "global_step": 152499, "epoch": 907} {"train_loss": -9.861505508422852, "global_step": 152500, "epoch": 907} {"train_loss": -10.429909706115723, "global_step": 152501, "epoch": 907} {"train_loss": -9.659478187561035, "global_step": 152502, "epoch": 907} {"train_loss": -10.240167617797852, "global_step": 152503, "epoch": 907} {"train_loss": -10.278922080993652, "global_step": 152504, "epoch": 907} {"train_loss": -9.576343536376953, "global_step": 152505, "epoch": 907} {"train_loss": -10.205663681030273, "global_step": 152506, "epoch": 907} {"train_loss": -10.54414176940918, "global_step": 152507, "epoch": 907} {"train_loss": -10.000739097595215, "global_step": 152508, "epoch": 907} {"train_loss": -10.120535850524902, "global_step": 152509, "epoch": 907} {"train_loss": -10.475021362304688, "global_step": 152510, "epoch": 907} {"train_loss": -10.496278762817383, "global_step": 152511, "epoch": 907} {"train_loss": -10.285314559936523, "global_step": 152512, "epoch": 907} {"train_loss": -10.373405456542969, "global_step": 152513, "epoch": 907} {"train_loss": -10.18925952911377, "global_step": 152514, "epoch": 907} {"train_loss": -10.633378982543945, "global_step": 152515, "epoch": 907} {"train_loss": -10.588614463806152, "global_step": 152516, "epoch": 907} {"train_loss": -10.371137619018555, "global_step": 152517, "epoch": 907} {"train_loss": -10.383124351501465, "global_step": 152518, "epoch": 907} {"train_loss": -10.464214324951172, "global_step": 152519, "epoch": 907} {"train_loss": -10.600512504577637, "global_step": 152520, "epoch": 907} {"train_loss": -10.7113676071167, "global_step": 152521, "epoch": 907} {"train_loss": -10.535959243774414, "global_step": 152522, "epoch": 907} {"train_loss": -10.621667861938477, "global_step": 152523, "epoch": 907} {"train_loss": -10.674942970275879, "global_step": 152524, "epoch": 907} {"train_loss": -10.423078536987305, "global_step": 152525, "epoch": 907} {"train_loss": -10.7134370803833, "global_step": 152526, "epoch": 907} {"train_loss": -10.729326248168945, "global_step": 152527, "epoch": 907} {"train_loss": -10.515321731567383, "global_step": 152528, "epoch": 907} {"train_loss": -10.881537437438965, "global_step": 152529, "epoch": 907} {"train_loss": -10.767122268676758, "global_step": 152530, "epoch": 907} {"train_loss": -10.740499496459961, "global_step": 152531, "epoch": 907} {"train_loss": -10.867213249206543, "global_step": 152532, "epoch": 907} {"train_loss": -10.862987518310547, "global_step": 152533, "epoch": 907} {"train_loss": -10.722901344299316, "global_step": 152534, "epoch": 907} {"train_loss": -10.762954711914062, "global_step": 152535, "epoch": 907} {"train_loss": -11.010443687438965, "global_step": 152536, "epoch": 907} {"train_loss": -10.732080459594727, "global_step": 152537, "epoch": 907} {"train_loss": -10.994316101074219, "global_step": 152538, "epoch": 907} {"train_loss": -10.870820999145508, "global_step": 152539, "epoch": 907} {"train_loss": -10.80217170715332, "global_step": 152540, "epoch": 907} {"train_loss": -10.87872314453125, "global_step": 152541, "epoch": 907} {"train_loss": -10.752937316894531, "global_step": 152542, "epoch": 907} {"train_loss": -10.503450791041056, "global_step": 152543, "epoch": 907, "val_loss": 225205.59375} {"train_loss": -10.662908554077148, "global_step": 152544, "epoch": 908} {"train_loss": -10.452762603759766, "global_step": 152545, "epoch": 908} {"train_loss": -10.711334228515625, "global_step": 152546, "epoch": 908} {"train_loss": -10.963479995727539, "global_step": 152547, "epoch": 908} {"train_loss": -10.725593566894531, "global_step": 152548, "epoch": 908} {"train_loss": -10.988504409790039, "global_step": 152549, "epoch": 908} {"train_loss": -10.692315101623535, "global_step": 152550, "epoch": 908} {"train_loss": -10.879030227661133, "global_step": 152551, "epoch": 908} {"train_loss": -10.787395477294922, "global_step": 152552, "epoch": 908} {"train_loss": -10.997440338134766, "global_step": 152553, "epoch": 908} {"train_loss": -10.759871482849121, "global_step": 152554, "epoch": 908} {"train_loss": -10.809432029724121, "global_step": 152555, "epoch": 908} {"train_loss": -10.822528839111328, "global_step": 152556, "epoch": 908} {"train_loss": -10.52325439453125, "global_step": 152557, "epoch": 908} {"train_loss": -10.494775772094727, "global_step": 152558, "epoch": 908} {"train_loss": -10.814277648925781, "global_step": 152559, "epoch": 908} {"train_loss": -10.801504135131836, "global_step": 152560, "epoch": 908} {"train_loss": -10.358307838439941, "global_step": 152561, "epoch": 908} {"train_loss": -10.975013732910156, "global_step": 152562, "epoch": 908} {"train_loss": -10.796541213989258, "global_step": 152563, "epoch": 908} {"train_loss": -10.890420913696289, "global_step": 152564, "epoch": 908} {"train_loss": -10.750680923461914, "global_step": 152565, "epoch": 908} {"train_loss": -11.043660163879395, "global_step": 152566, "epoch": 908} {"train_loss": -10.639167785644531, "global_step": 152567, "epoch": 908} {"train_loss": -10.986780166625977, "global_step": 152568, "epoch": 908} {"train_loss": -10.710545539855957, "global_step": 152569, "epoch": 908} {"train_loss": -10.644184112548828, "global_step": 152570, "epoch": 908} {"train_loss": -10.936689376831055, "global_step": 152571, "epoch": 908} {"train_loss": -10.825922012329102, "global_step": 152572, "epoch": 908} {"train_loss": -10.809019088745117, "global_step": 152573, "epoch": 908} {"train_loss": -10.796908378601074, "global_step": 152574, "epoch": 908} {"train_loss": -11.05543327331543, "global_step": 152575, "epoch": 908} {"train_loss": -10.880024909973145, "global_step": 152576, "epoch": 908} {"train_loss": -10.702486991882324, "global_step": 152577, "epoch": 908} {"train_loss": -11.010860443115234, "global_step": 152578, "epoch": 908} {"train_loss": -10.974658012390137, "global_step": 152579, "epoch": 908} {"train_loss": -10.518596649169922, "global_step": 152580, "epoch": 908} {"train_loss": -10.693680763244629, "global_step": 152581, "epoch": 908} {"train_loss": -10.886632919311523, "global_step": 152582, "epoch": 908} {"train_loss": -10.960762977600098, "global_step": 152583, "epoch": 908} {"train_loss": -10.459142684936523, "global_step": 152584, "epoch": 908} {"train_loss": -10.672164916992188, "global_step": 152585, "epoch": 908} {"train_loss": -11.079520225524902, "global_step": 152586, "epoch": 908} {"train_loss": -10.249168395996094, "global_step": 152587, "epoch": 908} {"train_loss": -10.909361839294434, "global_step": 152588, "epoch": 908} {"train_loss": -10.495320320129395, "global_step": 152589, "epoch": 908} {"train_loss": -10.502974510192871, "global_step": 152590, "epoch": 908} {"train_loss": -10.677106857299805, "global_step": 152591, "epoch": 908} {"train_loss": -9.977436065673828, "global_step": 152592, "epoch": 908} {"train_loss": -10.779890060424805, "global_step": 152593, "epoch": 908} {"train_loss": -10.559200286865234, "global_step": 152594, "epoch": 908} {"train_loss": -9.66069221496582, "global_step": 152595, "epoch": 908} {"train_loss": -10.749109268188477, "global_step": 152596, "epoch": 908} {"train_loss": -10.662466049194336, "global_step": 152597, "epoch": 908} {"train_loss": -10.521703720092773, "global_step": 152598, "epoch": 908} {"train_loss": -10.579401016235352, "global_step": 152599, "epoch": 908} {"train_loss": -10.186789512634277, "global_step": 152600, "epoch": 908} {"train_loss": -10.096532821655273, "global_step": 152601, "epoch": 908} {"train_loss": -10.615827560424805, "global_step": 152602, "epoch": 908} {"train_loss": -10.31523323059082, "global_step": 152603, "epoch": 908} {"train_loss": -10.952544212341309, "global_step": 152604, "epoch": 908} {"train_loss": -10.716403007507324, "global_step": 152605, "epoch": 908} {"train_loss": -10.545249938964844, "global_step": 152606, "epoch": 908} {"train_loss": -10.66937255859375, "global_step": 152607, "epoch": 908} {"train_loss": -10.280052185058594, "global_step": 152608, "epoch": 908} {"train_loss": -10.542616844177246, "global_step": 152609, "epoch": 908} {"train_loss": -10.024423599243164, "global_step": 152610, "epoch": 908} {"train_loss": -10.32342529296875, "global_step": 152611, "epoch": 908} {"train_loss": -10.539721488952637, "global_step": 152612, "epoch": 908} {"train_loss": -9.953084945678711, "global_step": 152613, "epoch": 908} {"train_loss": -10.51607894897461, "global_step": 152614, "epoch": 908} {"train_loss": -10.381630897521973, "global_step": 152615, "epoch": 908} {"train_loss": -10.153437614440918, "global_step": 152616, "epoch": 908} {"train_loss": -10.560371398925781, "global_step": 152617, "epoch": 908} {"train_loss": -10.355752944946289, "global_step": 152618, "epoch": 908} {"train_loss": -10.389545440673828, "global_step": 152619, "epoch": 908} {"train_loss": -10.827814102172852, "global_step": 152620, "epoch": 908} {"train_loss": -10.239910125732422, "global_step": 152621, "epoch": 908} {"train_loss": -10.478346824645996, "global_step": 152622, "epoch": 908} {"train_loss": -10.644859313964844, "global_step": 152623, "epoch": 908} {"train_loss": -10.446426391601562, "global_step": 152624, "epoch": 908} {"train_loss": -10.131061553955078, "global_step": 152625, "epoch": 908} {"train_loss": -10.950961112976074, "global_step": 152626, "epoch": 908} {"train_loss": -10.286666870117188, "global_step": 152627, "epoch": 908} {"train_loss": -10.514810562133789, "global_step": 152628, "epoch": 908} {"train_loss": -10.596914291381836, "global_step": 152629, "epoch": 908} {"train_loss": -10.799019813537598, "global_step": 152630, "epoch": 908} {"train_loss": -10.433308601379395, "global_step": 152631, "epoch": 908} {"train_loss": -10.691747665405273, "global_step": 152632, "epoch": 908} {"train_loss": -10.538911819458008, "global_step": 152633, "epoch": 908} {"train_loss": -10.746896743774414, "global_step": 152634, "epoch": 908} {"train_loss": -10.620200157165527, "global_step": 152635, "epoch": 908} {"train_loss": -11.055646896362305, "global_step": 152636, "epoch": 908} {"train_loss": -10.670943260192871, "global_step": 152637, "epoch": 908} {"train_loss": -10.724462509155273, "global_step": 152638, "epoch": 908} {"train_loss": -10.788077354431152, "global_step": 152639, "epoch": 908} {"train_loss": -10.68319320678711, "global_step": 152640, "epoch": 908} {"train_loss": -10.793233871459961, "global_step": 152641, "epoch": 908} {"train_loss": -10.579570770263672, "global_step": 152642, "epoch": 908} {"train_loss": -10.953436851501465, "global_step": 152643, "epoch": 908} {"train_loss": -10.522294998168945, "global_step": 152644, "epoch": 908} {"train_loss": -10.708290100097656, "global_step": 152645, "epoch": 908} {"train_loss": -10.70560073852539, "global_step": 152646, "epoch": 908} {"train_loss": -10.73853874206543, "global_step": 152647, "epoch": 908} {"train_loss": -10.542268753051758, "global_step": 152648, "epoch": 908} {"train_loss": -10.98263168334961, "global_step": 152649, "epoch": 908} {"train_loss": -10.657917976379395, "global_step": 152650, "epoch": 908} {"train_loss": -11.07852554321289, "global_step": 152651, "epoch": 908} {"train_loss": -10.894841194152832, "global_step": 152652, "epoch": 908} {"train_loss": -10.94975471496582, "global_step": 152653, "epoch": 908} {"train_loss": -10.930840492248535, "global_step": 152654, "epoch": 908} {"train_loss": -11.246374130249023, "global_step": 152655, "epoch": 908} {"train_loss": -10.984149932861328, "global_step": 152656, "epoch": 908} {"train_loss": -10.921826362609863, "global_step": 152657, "epoch": 908} {"train_loss": -11.123486518859863, "global_step": 152658, "epoch": 908} {"train_loss": -10.943181037902832, "global_step": 152659, "epoch": 908} {"train_loss": -11.080689430236816, "global_step": 152660, "epoch": 908} {"train_loss": -11.137004852294922, "global_step": 152661, "epoch": 908} {"train_loss": -11.10263729095459, "global_step": 152662, "epoch": 908} {"train_loss": -10.980825424194336, "global_step": 152663, "epoch": 908} {"train_loss": -11.055215835571289, "global_step": 152664, "epoch": 908} {"train_loss": -11.203571319580078, "global_step": 152665, "epoch": 908} {"train_loss": -10.868976593017578, "global_step": 152666, "epoch": 908} {"train_loss": -11.132390022277832, "global_step": 152667, "epoch": 908} {"train_loss": -11.012008666992188, "global_step": 152668, "epoch": 908} {"train_loss": -11.323862075805664, "global_step": 152669, "epoch": 908} {"train_loss": -10.938016891479492, "global_step": 152670, "epoch": 908} {"train_loss": -11.004446029663086, "global_step": 152671, "epoch": 908} {"train_loss": -10.558797836303711, "global_step": 152672, "epoch": 908} {"train_loss": -11.044867515563965, "global_step": 152673, "epoch": 908} {"train_loss": -11.033859252929688, "global_step": 152674, "epoch": 908} {"train_loss": -10.539018630981445, "global_step": 152675, "epoch": 908} {"train_loss": -11.125361442565918, "global_step": 152676, "epoch": 908} {"train_loss": -11.015440940856934, "global_step": 152677, "epoch": 908} {"train_loss": -10.517524719238281, "global_step": 152678, "epoch": 908} {"train_loss": -10.805482864379883, "global_step": 152679, "epoch": 908} {"train_loss": -10.495246887207031, "global_step": 152680, "epoch": 908} {"train_loss": -10.862860679626465, "global_step": 152681, "epoch": 908} {"train_loss": -10.51481819152832, "global_step": 152682, "epoch": 908} {"train_loss": -10.352706909179688, "global_step": 152683, "epoch": 908} {"train_loss": -10.238638877868652, "global_step": 152684, "epoch": 908} {"train_loss": -9.815876007080078, "global_step": 152685, "epoch": 908} {"train_loss": -10.733718872070312, "global_step": 152686, "epoch": 908} {"train_loss": -10.789423942565918, "global_step": 152687, "epoch": 908} {"train_loss": -10.512588500976562, "global_step": 152688, "epoch": 908} {"train_loss": -10.752799987792969, "global_step": 152689, "epoch": 908} {"train_loss": -10.506719589233398, "global_step": 152690, "epoch": 908} {"train_loss": -10.701925277709961, "global_step": 152691, "epoch": 908} {"train_loss": -10.019607543945312, "global_step": 152692, "epoch": 908} {"train_loss": -10.47814655303955, "global_step": 152693, "epoch": 908} {"train_loss": -10.320558547973633, "global_step": 152694, "epoch": 908} {"train_loss": -10.206436157226562, "global_step": 152695, "epoch": 908} {"train_loss": -10.600919723510742, "global_step": 152696, "epoch": 908} {"train_loss": -9.94869613647461, "global_step": 152697, "epoch": 908} {"train_loss": -10.300504684448242, "global_step": 152698, "epoch": 908} {"train_loss": -10.66859245300293, "global_step": 152699, "epoch": 908} {"train_loss": -9.901309967041016, "global_step": 152700, "epoch": 908} {"train_loss": -10.863670349121094, "global_step": 152701, "epoch": 908} {"train_loss": -10.643563270568848, "global_step": 152702, "epoch": 908} {"train_loss": -10.531036376953125, "global_step": 152703, "epoch": 908} {"train_loss": -10.608880043029785, "global_step": 152704, "epoch": 908} {"train_loss": -10.605064392089844, "global_step": 152705, "epoch": 908} {"train_loss": -10.507433891296387, "global_step": 152706, "epoch": 908} {"train_loss": -10.330327987670898, "global_step": 152707, "epoch": 908} {"train_loss": -10.445328712463379, "global_step": 152708, "epoch": 908} {"train_loss": -10.241510391235352, "global_step": 152709, "epoch": 908} {"train_loss": -10.60842514038086, "global_step": 152710, "epoch": 908} {"train_loss": -10.66446578502655, "global_step": 152711, "epoch": 908, "val_loss": 233954.90625} {"train_loss": -10.572355270385742, "global_step": 152712, "epoch": 909} {"train_loss": -10.484216690063477, "global_step": 152713, "epoch": 909} {"train_loss": -10.682405471801758, "global_step": 152714, "epoch": 909} {"train_loss": -10.687345504760742, "global_step": 152715, "epoch": 909} {"train_loss": -10.792119979858398, "global_step": 152716, "epoch": 909} {"train_loss": -10.801046371459961, "global_step": 152717, "epoch": 909} {"train_loss": -10.73210334777832, "global_step": 152718, "epoch": 909} {"train_loss": -10.845858573913574, "global_step": 152719, "epoch": 909} {"train_loss": -10.75531005859375, "global_step": 152720, "epoch": 909} {"train_loss": -10.794936180114746, "global_step": 152721, "epoch": 909} {"train_loss": -10.487561225891113, "global_step": 152722, "epoch": 909} {"train_loss": -10.719257354736328, "global_step": 152723, "epoch": 909} {"train_loss": -10.527070999145508, "global_step": 152724, "epoch": 909} {"train_loss": -10.854442596435547, "global_step": 152725, "epoch": 909} {"train_loss": -10.384028434753418, "global_step": 152726, "epoch": 909} {"train_loss": -10.792651176452637, "global_step": 152727, "epoch": 909} {"train_loss": -10.553689956665039, "global_step": 152728, "epoch": 909} {"train_loss": -10.690583229064941, "global_step": 152729, "epoch": 909} {"train_loss": -10.63210678100586, "global_step": 152730, "epoch": 909} {"train_loss": -10.465866088867188, "global_step": 152731, "epoch": 909} {"train_loss": -10.809707641601562, "global_step": 152732, "epoch": 909} {"train_loss": -10.633624076843262, "global_step": 152733, "epoch": 909} {"train_loss": -10.811129570007324, "global_step": 152734, "epoch": 909} {"train_loss": -10.758306503295898, "global_step": 152735, "epoch": 909} {"train_loss": -10.83535099029541, "global_step": 152736, "epoch": 909} {"train_loss": -10.793365478515625, "global_step": 152737, "epoch": 909} {"train_loss": -10.78195858001709, "global_step": 152738, "epoch": 909} {"train_loss": -10.7268648147583, "global_step": 152739, "epoch": 909} {"train_loss": -10.90640640258789, "global_step": 152740, "epoch": 909} {"train_loss": -10.435322761535645, "global_step": 152741, "epoch": 909} {"train_loss": -10.719090461730957, "global_step": 152742, "epoch": 909} {"train_loss": -10.924901962280273, "global_step": 152743, "epoch": 909} {"train_loss": -10.4064359664917, "global_step": 152744, "epoch": 909} {"train_loss": -10.929914474487305, "global_step": 152745, "epoch": 909} {"train_loss": -11.005936622619629, "global_step": 152746, "epoch": 909} {"train_loss": -10.756006240844727, "global_step": 152747, "epoch": 909} {"train_loss": -10.732044219970703, "global_step": 152748, "epoch": 909} {"train_loss": -11.031976699829102, "global_step": 152749, "epoch": 909} {"train_loss": -10.957807540893555, "global_step": 152750, "epoch": 909} {"train_loss": -11.084888458251953, "global_step": 152751, "epoch": 909} {"train_loss": -10.808151245117188, "global_step": 152752, "epoch": 909} {"train_loss": -10.99691390991211, "global_step": 152753, "epoch": 909} {"train_loss": -11.007966995239258, "global_step": 152754, "epoch": 909} {"train_loss": -11.001054763793945, "global_step": 152755, "epoch": 909} {"train_loss": -10.938087463378906, "global_step": 152756, "epoch": 909} {"train_loss": -10.847143173217773, "global_step": 152757, "epoch": 909} {"train_loss": -11.150986671447754, "global_step": 152758, "epoch": 909} {"train_loss": -10.760972023010254, "global_step": 152759, "epoch": 909} {"train_loss": -11.167287826538086, "global_step": 152760, "epoch": 909} {"train_loss": -10.852285385131836, "global_step": 152761, "epoch": 909} {"train_loss": -10.83482551574707, "global_step": 152762, "epoch": 909} {"train_loss": -10.823335647583008, "global_step": 152763, "epoch": 909} {"train_loss": -10.644628524780273, "global_step": 152764, "epoch": 909} {"train_loss": -10.70163345336914, "global_step": 152765, "epoch": 909} {"train_loss": -11.333373069763184, "global_step": 152766, "epoch": 909} {"train_loss": -10.995477676391602, "global_step": 152767, "epoch": 909} {"train_loss": -11.09982681274414, "global_step": 152768, "epoch": 909} {"train_loss": -10.813468933105469, "global_step": 152769, "epoch": 909} {"train_loss": -10.999217987060547, "global_step": 152770, "epoch": 909} {"train_loss": -10.89448070526123, "global_step": 152771, "epoch": 909} {"train_loss": -10.936040878295898, "global_step": 152772, "epoch": 909} {"train_loss": -11.078145980834961, "global_step": 152773, "epoch": 909} {"train_loss": -10.970684051513672, "global_step": 152774, "epoch": 909} {"train_loss": -10.52511215209961, "global_step": 152775, "epoch": 909} {"train_loss": -10.623542785644531, "global_step": 152776, "epoch": 909} {"train_loss": -11.003398895263672, "global_step": 152777, "epoch": 909} {"train_loss": -10.96157455444336, "global_step": 152778, "epoch": 909} {"train_loss": -10.66817855834961, "global_step": 152779, "epoch": 909} {"train_loss": -11.067768096923828, "global_step": 152780, "epoch": 909} {"train_loss": -10.404315948486328, "global_step": 152781, "epoch": 909} {"train_loss": -10.723855018615723, "global_step": 152782, "epoch": 909} {"train_loss": -10.622884750366211, "global_step": 152783, "epoch": 909} {"train_loss": -11.131601333618164, "global_step": 152784, "epoch": 909} {"train_loss": -10.942182540893555, "global_step": 152785, "epoch": 909} {"train_loss": -10.529580116271973, "global_step": 152786, "epoch": 909} {"train_loss": -10.349289894104004, "global_step": 152787, "epoch": 909} {"train_loss": -11.046144485473633, "global_step": 152788, "epoch": 909} {"train_loss": -9.99946403503418, "global_step": 152789, "epoch": 909} {"train_loss": -10.185691833496094, "global_step": 152790, "epoch": 909} {"train_loss": -10.813800811767578, "global_step": 152791, "epoch": 909} {"train_loss": -9.983297348022461, "global_step": 152792, "epoch": 909} {"train_loss": -9.891555786132812, "global_step": 152793, "epoch": 909} {"train_loss": -9.980588912963867, "global_step": 152794, "epoch": 909} {"train_loss": -9.261213302612305, "global_step": 152795, "epoch": 909} {"train_loss": -9.891207695007324, "global_step": 152796, "epoch": 909} {"train_loss": -8.607728958129883, "global_step": 152797, "epoch": 909} {"train_loss": -9.512276649475098, "global_step": 152798, "epoch": 909} {"train_loss": -8.5428466796875, "global_step": 152799, "epoch": 909} {"train_loss": -9.628860473632812, "global_step": 152800, "epoch": 909} {"train_loss": -9.8572998046875, "global_step": 152801, "epoch": 909} {"train_loss": -9.881285667419434, "global_step": 152802, "epoch": 909} {"train_loss": -9.508563041687012, "global_step": 152803, "epoch": 909} {"train_loss": -9.936569213867188, "global_step": 152804, "epoch": 909} {"train_loss": -10.022317886352539, "global_step": 152805, "epoch": 909} {"train_loss": -8.568482398986816, "global_step": 152806, "epoch": 909} {"train_loss": -9.973760604858398, "global_step": 152807, "epoch": 909} {"train_loss": -9.443585395812988, "global_step": 152808, "epoch": 909} {"train_loss": -9.740973472595215, "global_step": 152809, "epoch": 909} {"train_loss": -9.33029556274414, "global_step": 152810, "epoch": 909} {"train_loss": -9.57848072052002, "global_step": 152811, "epoch": 909} {"train_loss": -9.804715156555176, "global_step": 152812, "epoch": 909} {"train_loss": -9.194442749023438, "global_step": 152813, "epoch": 909} {"train_loss": -10.101350784301758, "global_step": 152814, "epoch": 909} {"train_loss": -9.423748016357422, "global_step": 152815, "epoch": 909} {"train_loss": -10.048606872558594, "global_step": 152816, "epoch": 909} {"train_loss": -10.178196907043457, "global_step": 152817, "epoch": 909} {"train_loss": -9.688834190368652, "global_step": 152818, "epoch": 909} {"train_loss": -10.118927001953125, "global_step": 152819, "epoch": 909} {"train_loss": -10.378837585449219, "global_step": 152820, "epoch": 909} {"train_loss": -9.940882682800293, "global_step": 152821, "epoch": 909} {"train_loss": -10.045661926269531, "global_step": 152822, "epoch": 909} {"train_loss": -10.548681259155273, "global_step": 152823, "epoch": 909} {"train_loss": -10.228608131408691, "global_step": 152824, "epoch": 909} {"train_loss": -10.331991195678711, "global_step": 152825, "epoch": 909} {"train_loss": -10.16267204284668, "global_step": 152826, "epoch": 909} {"train_loss": -10.405667304992676, "global_step": 152827, "epoch": 909} {"train_loss": -10.248920440673828, "global_step": 152828, "epoch": 909} {"train_loss": -10.505640029907227, "global_step": 152829, "epoch": 909} {"train_loss": -10.555471420288086, "global_step": 152830, "epoch": 909} {"train_loss": -10.519726753234863, "global_step": 152831, "epoch": 909} {"train_loss": -10.559402465820312, "global_step": 152832, "epoch": 909} {"train_loss": -10.608118057250977, "global_step": 152833, "epoch": 909} {"train_loss": -10.547791481018066, "global_step": 152834, "epoch": 909} {"train_loss": -10.436416625976562, "global_step": 152835, "epoch": 909} {"train_loss": -10.531330108642578, "global_step": 152836, "epoch": 909} {"train_loss": -10.475227355957031, "global_step": 152837, "epoch": 909} {"train_loss": -10.603500366210938, "global_step": 152838, "epoch": 909} {"train_loss": -10.589313507080078, "global_step": 152839, "epoch": 909} {"train_loss": -10.29719352722168, "global_step": 152840, "epoch": 909} {"train_loss": -10.896598815917969, "global_step": 152841, "epoch": 909} {"train_loss": -10.697793960571289, "global_step": 152842, "epoch": 909} {"train_loss": -10.744483947753906, "global_step": 152843, "epoch": 909} {"train_loss": -10.606034278869629, "global_step": 152844, "epoch": 909} {"train_loss": -10.562320709228516, "global_step": 152845, "epoch": 909} {"train_loss": -10.604320526123047, "global_step": 152846, "epoch": 909} {"train_loss": -10.73597526550293, "global_step": 152847, "epoch": 909} {"train_loss": -10.88524055480957, "global_step": 152848, "epoch": 909} {"train_loss": -10.881027221679688, "global_step": 152849, "epoch": 909} {"train_loss": -10.848464965820312, "global_step": 152850, "epoch": 909} {"train_loss": -10.78653621673584, "global_step": 152851, "epoch": 909} {"train_loss": -10.805944442749023, "global_step": 152852, "epoch": 909} {"train_loss": -10.866241455078125, "global_step": 152853, "epoch": 909} {"train_loss": -11.006145477294922, "global_step": 152854, "epoch": 909} {"train_loss": -10.82182788848877, "global_step": 152855, "epoch": 909} {"train_loss": -11.079723358154297, "global_step": 152856, "epoch": 909} {"train_loss": -11.075115203857422, "global_step": 152857, "epoch": 909} {"train_loss": -11.157512664794922, "global_step": 152858, "epoch": 909} {"train_loss": -10.935789108276367, "global_step": 152859, "epoch": 909} {"train_loss": -11.15103530883789, "global_step": 152860, "epoch": 909} {"train_loss": -10.795324325561523, "global_step": 152861, "epoch": 909} {"train_loss": -10.936185836791992, "global_step": 152862, "epoch": 909} {"train_loss": -10.923673629760742, "global_step": 152863, "epoch": 909} {"train_loss": -10.924820899963379, "global_step": 152864, "epoch": 909} {"train_loss": -10.63888931274414, "global_step": 152865, "epoch": 909} {"train_loss": -11.129146575927734, "global_step": 152866, "epoch": 909} {"train_loss": -10.727607727050781, "global_step": 152867, "epoch": 909} {"train_loss": -10.765912055969238, "global_step": 152868, "epoch": 909} {"train_loss": -10.612504959106445, "global_step": 152869, "epoch": 909} {"train_loss": -10.9165678024292, "global_step": 152870, "epoch": 909} {"train_loss": -10.94761848449707, "global_step": 152871, "epoch": 909} {"train_loss": -10.776521682739258, "global_step": 152872, "epoch": 909} {"train_loss": -10.833355903625488, "global_step": 152873, "epoch": 909} {"train_loss": -11.116950988769531, "global_step": 152874, "epoch": 909} {"train_loss": -10.892557144165039, "global_step": 152875, "epoch": 909} {"train_loss": -10.792081832885742, "global_step": 152876, "epoch": 909} {"train_loss": -10.86870002746582, "global_step": 152877, "epoch": 909} {"train_loss": -10.687477111816406, "global_step": 152878, "epoch": 909} {"train_loss": -10.560869682402839, "global_step": 152879, "epoch": 909, "val_loss": 230572.25} {"train_loss": -10.918275833129883, "global_step": 152880, "epoch": 910} {"train_loss": -10.824647903442383, "global_step": 152881, "epoch": 910} {"train_loss": -11.036624908447266, "global_step": 152882, "epoch": 910} {"train_loss": -10.71694564819336, "global_step": 152883, "epoch": 910} {"train_loss": -10.660208702087402, "global_step": 152884, "epoch": 910} {"train_loss": -10.694772720336914, "global_step": 152885, "epoch": 910} {"train_loss": -10.855850219726562, "global_step": 152886, "epoch": 910} {"train_loss": -10.892921447753906, "global_step": 152887, "epoch": 910} {"train_loss": -10.878804206848145, "global_step": 152888, "epoch": 910} {"train_loss": -10.837602615356445, "global_step": 152889, "epoch": 910} {"train_loss": -10.885868072509766, "global_step": 152890, "epoch": 910} {"train_loss": -10.94239616394043, "global_step": 152891, "epoch": 910} {"train_loss": -10.809799194335938, "global_step": 152892, "epoch": 910} {"train_loss": -10.216400146484375, "global_step": 152893, "epoch": 910} {"train_loss": -10.873180389404297, "global_step": 152894, "epoch": 910} {"train_loss": -10.913093566894531, "global_step": 152895, "epoch": 910} {"train_loss": -10.677403450012207, "global_step": 152896, "epoch": 910} {"train_loss": -10.458944320678711, "global_step": 152897, "epoch": 910} {"train_loss": -11.103330612182617, "global_step": 152898, "epoch": 910} {"train_loss": -10.541955947875977, "global_step": 152899, "epoch": 910} {"train_loss": -10.8063325881958, "global_step": 152900, "epoch": 910} {"train_loss": -10.809446334838867, "global_step": 152901, "epoch": 910} {"train_loss": -10.401371002197266, "global_step": 152902, "epoch": 910} {"train_loss": -10.571483612060547, "global_step": 152903, "epoch": 910} {"train_loss": -10.48696231842041, "global_step": 152904, "epoch": 910} {"train_loss": -10.792508125305176, "global_step": 152905, "epoch": 910} {"train_loss": -10.314912796020508, "global_step": 152906, "epoch": 910} {"train_loss": -10.825390815734863, "global_step": 152907, "epoch": 910} {"train_loss": -10.190176010131836, "global_step": 152908, "epoch": 910} {"train_loss": -10.577239036560059, "global_step": 152909, "epoch": 910} {"train_loss": -9.186455726623535, "global_step": 152910, "epoch": 910} {"train_loss": -10.523752212524414, "global_step": 152911, "epoch": 910} {"train_loss": -9.384344100952148, "global_step": 152912, "epoch": 910} {"train_loss": -9.942520141601562, "global_step": 152913, "epoch": 910} {"train_loss": -9.858831405639648, "global_step": 152914, "epoch": 910} {"train_loss": -9.724123001098633, "global_step": 152915, "epoch": 910} {"train_loss": -10.568624496459961, "global_step": 152916, "epoch": 910} {"train_loss": -9.945854187011719, "global_step": 152917, "epoch": 910} {"train_loss": -10.282270431518555, "global_step": 152918, "epoch": 910} {"train_loss": -10.235400199890137, "global_step": 152919, "epoch": 910} {"train_loss": -9.981086730957031, "global_step": 152920, "epoch": 910} {"train_loss": -10.491311073303223, "global_step": 152921, "epoch": 910} {"train_loss": -10.421794891357422, "global_step": 152922, "epoch": 910} {"train_loss": -10.531333923339844, "global_step": 152923, "epoch": 910} {"train_loss": -10.564312934875488, "global_step": 152924, "epoch": 910} {"train_loss": -10.601755142211914, "global_step": 152925, "epoch": 910} {"train_loss": -10.357967376708984, "global_step": 152926, "epoch": 910} {"train_loss": -10.547896385192871, "global_step": 152927, "epoch": 910} {"train_loss": -10.539268493652344, "global_step": 152928, "epoch": 910} {"train_loss": -10.636672973632812, "global_step": 152929, "epoch": 910} {"train_loss": -10.56673812866211, "global_step": 152930, "epoch": 910} {"train_loss": -10.532110214233398, "global_step": 152931, "epoch": 910} {"train_loss": -10.398683547973633, "global_step": 152932, "epoch": 910} {"train_loss": -10.546113967895508, "global_step": 152933, "epoch": 910} {"train_loss": -10.339913368225098, "global_step": 152934, "epoch": 910} {"train_loss": -10.339048385620117, "global_step": 152935, "epoch": 910} {"train_loss": -10.617347717285156, "global_step": 152936, "epoch": 910} {"train_loss": -10.489900588989258, "global_step": 152937, "epoch": 910} {"train_loss": -10.684295654296875, "global_step": 152938, "epoch": 910} {"train_loss": -10.646512985229492, "global_step": 152939, "epoch": 910} {"train_loss": -10.750947952270508, "global_step": 152940, "epoch": 910} {"train_loss": -10.62106704711914, "global_step": 152941, "epoch": 910} {"train_loss": -10.895352363586426, "global_step": 152942, "epoch": 910} {"train_loss": -10.435197830200195, "global_step": 152943, "epoch": 910} {"train_loss": -10.455662727355957, "global_step": 152944, "epoch": 910} {"train_loss": -10.953678131103516, "global_step": 152945, "epoch": 910} {"train_loss": -10.754436492919922, "global_step": 152946, "epoch": 910} {"train_loss": -10.512434005737305, "global_step": 152947, "epoch": 910} {"train_loss": -11.054962158203125, "global_step": 152948, "epoch": 910} {"train_loss": -10.842039108276367, "global_step": 152949, "epoch": 910} {"train_loss": -10.47523021697998, "global_step": 152950, "epoch": 910} {"train_loss": -10.837953567504883, "global_step": 152951, "epoch": 910} {"train_loss": -10.610231399536133, "global_step": 152952, "epoch": 910} {"train_loss": -10.608729362487793, "global_step": 152953, "epoch": 910} {"train_loss": -10.670788764953613, "global_step": 152954, "epoch": 910} {"train_loss": -10.591110229492188, "global_step": 152955, "epoch": 910} {"train_loss": -10.850318908691406, "global_step": 152956, "epoch": 910} {"train_loss": -11.01642894744873, "global_step": 152957, "epoch": 910} {"train_loss": -10.353536605834961, "global_step": 152958, "epoch": 910} {"train_loss": -10.835063934326172, "global_step": 152959, "epoch": 910} {"train_loss": -10.622398376464844, "global_step": 152960, "epoch": 910} {"train_loss": -10.691995620727539, "global_step": 152961, "epoch": 910} {"train_loss": -10.871858596801758, "global_step": 152962, "epoch": 910} {"train_loss": -11.020700454711914, "global_step": 152963, "epoch": 910} {"train_loss": -10.943544387817383, "global_step": 152964, "epoch": 910} {"train_loss": -11.086949348449707, "global_step": 152965, "epoch": 910} {"train_loss": -11.146806716918945, "global_step": 152966, "epoch": 910} {"train_loss": -10.9852294921875, "global_step": 152967, "epoch": 910} {"train_loss": -10.916637420654297, "global_step": 152968, "epoch": 910} {"train_loss": -11.189533233642578, "global_step": 152969, "epoch": 910} {"train_loss": -10.854881286621094, "global_step": 152970, "epoch": 910} {"train_loss": -11.042283058166504, "global_step": 152971, "epoch": 910} {"train_loss": -11.092386245727539, "global_step": 152972, "epoch": 910} {"train_loss": -10.861398696899414, "global_step": 152973, "epoch": 910} {"train_loss": -10.694055557250977, "global_step": 152974, "epoch": 910} {"train_loss": -10.510974884033203, "global_step": 152975, "epoch": 910} {"train_loss": -10.045316696166992, "global_step": 152976, "epoch": 910} {"train_loss": -9.600975036621094, "global_step": 152977, "epoch": 910} {"train_loss": -10.776664733886719, "global_step": 152978, "epoch": 910} {"train_loss": -9.799790382385254, "global_step": 152979, "epoch": 910} {"train_loss": -9.915971755981445, "global_step": 152980, "epoch": 910} {"train_loss": -10.488231658935547, "global_step": 152981, "epoch": 910} {"train_loss": -9.924116134643555, "global_step": 152982, "epoch": 910} {"train_loss": -10.23419189453125, "global_step": 152983, "epoch": 910} {"train_loss": -10.688760757446289, "global_step": 152984, "epoch": 910} {"train_loss": -10.274344444274902, "global_step": 152985, "epoch": 910} {"train_loss": -10.279901504516602, "global_step": 152986, "epoch": 910} {"train_loss": -9.48896312713623, "global_step": 152987, "epoch": 910} {"train_loss": -10.476765632629395, "global_step": 152988, "epoch": 910} {"train_loss": -9.894275665283203, "global_step": 152989, "epoch": 910} {"train_loss": -9.584009170532227, "global_step": 152990, "epoch": 910} {"train_loss": -10.335210800170898, "global_step": 152991, "epoch": 910} {"train_loss": -9.463488578796387, "global_step": 152992, "epoch": 910} {"train_loss": -9.578298568725586, "global_step": 152993, "epoch": 910} {"train_loss": -10.550962448120117, "global_step": 152994, "epoch": 910} {"train_loss": -9.73979377746582, "global_step": 152995, "epoch": 910} {"train_loss": -10.336965560913086, "global_step": 152996, "epoch": 910} {"train_loss": -10.058290481567383, "global_step": 152997, "epoch": 910} {"train_loss": -9.565927505493164, "global_step": 152998, "epoch": 910} {"train_loss": -10.471376419067383, "global_step": 152999, "epoch": 910} {"train_loss": -10.237303733825684, "global_step": 153000, "epoch": 910} {"train_loss": -9.992425918579102, "global_step": 153001, "epoch": 910} {"train_loss": -10.526758193969727, "global_step": 153002, "epoch": 910} {"train_loss": -10.320151329040527, "global_step": 153003, "epoch": 910} {"train_loss": -10.265081405639648, "global_step": 153004, "epoch": 910} {"train_loss": -10.659769058227539, "global_step": 153005, "epoch": 910} {"train_loss": -10.34249496459961, "global_step": 153006, "epoch": 910} {"train_loss": -10.430644035339355, "global_step": 153007, "epoch": 910} {"train_loss": -10.616493225097656, "global_step": 153008, "epoch": 910} {"train_loss": -10.560999870300293, "global_step": 153009, "epoch": 910} {"train_loss": -10.293254852294922, "global_step": 153010, "epoch": 910} {"train_loss": -10.580568313598633, "global_step": 153011, "epoch": 910} {"train_loss": -10.420217514038086, "global_step": 153012, "epoch": 910} {"train_loss": -10.448708534240723, "global_step": 153013, "epoch": 910} {"train_loss": -10.48063850402832, "global_step": 153014, "epoch": 910} {"train_loss": -10.592706680297852, "global_step": 153015, "epoch": 910} {"train_loss": -10.656806945800781, "global_step": 153016, "epoch": 910} {"train_loss": -10.632390975952148, "global_step": 153017, "epoch": 910} {"train_loss": -10.585922241210938, "global_step": 153018, "epoch": 910} {"train_loss": -10.636682510375977, "global_step": 153019, "epoch": 910} {"train_loss": -10.682499885559082, "global_step": 153020, "epoch": 910} {"train_loss": -10.867974281311035, "global_step": 153021, "epoch": 910} {"train_loss": -10.794229507446289, "global_step": 153022, "epoch": 910} {"train_loss": -10.637874603271484, "global_step": 153023, "epoch": 910} {"train_loss": -10.859794616699219, "global_step": 153024, "epoch": 910} {"train_loss": -10.839134216308594, "global_step": 153025, "epoch": 910} {"train_loss": -10.742962837219238, "global_step": 153026, "epoch": 910} {"train_loss": -10.889217376708984, "global_step": 153027, "epoch": 910} {"train_loss": -11.00454044342041, "global_step": 153028, "epoch": 910} {"train_loss": -10.793436050415039, "global_step": 153029, "epoch": 910} {"train_loss": -11.02263069152832, "global_step": 153030, "epoch": 910} {"train_loss": -10.975298881530762, "global_step": 153031, "epoch": 910} {"train_loss": -10.990070343017578, "global_step": 153032, "epoch": 910} {"train_loss": -10.880683898925781, "global_step": 153033, "epoch": 910} {"train_loss": -11.069135665893555, "global_step": 153034, "epoch": 910} {"train_loss": -11.262829780578613, "global_step": 153035, "epoch": 910} {"train_loss": -11.111547470092773, "global_step": 153036, "epoch": 910} {"train_loss": -11.056331634521484, "global_step": 153037, "epoch": 910} {"train_loss": -11.035679817199707, "global_step": 153038, "epoch": 910} {"train_loss": -11.264800071716309, "global_step": 153039, "epoch": 910} {"train_loss": -11.041804313659668, "global_step": 153040, "epoch": 910} {"train_loss": -11.079706192016602, "global_step": 153041, "epoch": 910} {"train_loss": -11.022645950317383, "global_step": 153042, "epoch": 910} {"train_loss": -10.889944076538086, "global_step": 153043, "epoch": 910} {"train_loss": -11.134571075439453, "global_step": 153044, "epoch": 910} {"train_loss": -11.018850326538086, "global_step": 153045, "epoch": 910} {"train_loss": -11.197221755981445, "global_step": 153046, "epoch": 910} {"train_loss": -10.582785384995598, "global_step": 153047, "epoch": 910, "val_loss": 233416.953125, "train_action_mse_error": 1.6274784803390503} {"train_loss": -11.086616516113281, "global_step": 153048, "epoch": 911} {"train_loss": -11.30978012084961, "global_step": 153049, "epoch": 911} {"train_loss": -10.940055847167969, "global_step": 153050, "epoch": 911} {"train_loss": -10.923734664916992, "global_step": 153051, "epoch": 911} {"train_loss": -11.241096496582031, "global_step": 153052, "epoch": 911} {"train_loss": -11.084606170654297, "global_step": 153053, "epoch": 911} {"train_loss": -10.837467193603516, "global_step": 153054, "epoch": 911} {"train_loss": -11.053276062011719, "global_step": 153055, "epoch": 911} {"train_loss": -10.593833923339844, "global_step": 153056, "epoch": 911} {"train_loss": -11.13003921508789, "global_step": 153057, "epoch": 911} {"train_loss": -10.979851722717285, "global_step": 153058, "epoch": 911} {"train_loss": -10.799044609069824, "global_step": 153059, "epoch": 911} {"train_loss": -10.557779312133789, "global_step": 153060, "epoch": 911} {"train_loss": -10.611888885498047, "global_step": 153061, "epoch": 911} {"train_loss": -10.85232162475586, "global_step": 153062, "epoch": 911} {"train_loss": -10.435480117797852, "global_step": 153063, "epoch": 911} {"train_loss": -10.137264251708984, "global_step": 153064, "epoch": 911} {"train_loss": -10.451702117919922, "global_step": 153065, "epoch": 911} {"train_loss": -10.791524887084961, "global_step": 153066, "epoch": 911} {"train_loss": -9.986639022827148, "global_step": 153067, "epoch": 911} {"train_loss": -10.703155517578125, "global_step": 153068, "epoch": 911} {"train_loss": -10.698040008544922, "global_step": 153069, "epoch": 911} {"train_loss": -9.633037567138672, "global_step": 153070, "epoch": 911} {"train_loss": -10.438992500305176, "global_step": 153071, "epoch": 911} {"train_loss": -10.72870922088623, "global_step": 153072, "epoch": 911} {"train_loss": -10.081698417663574, "global_step": 153073, "epoch": 911} {"train_loss": -9.679134368896484, "global_step": 153074, "epoch": 911} {"train_loss": -10.523885726928711, "global_step": 153075, "epoch": 911} {"train_loss": -10.662544250488281, "global_step": 153076, "epoch": 911} {"train_loss": -9.836058616638184, "global_step": 153077, "epoch": 911} {"train_loss": -10.296797752380371, "global_step": 153078, "epoch": 911} {"train_loss": -9.332228660583496, "global_step": 153079, "epoch": 911} {"train_loss": -10.658628463745117, "global_step": 153080, "epoch": 911} {"train_loss": -10.312762260437012, "global_step": 153081, "epoch": 911} {"train_loss": -10.10107421875, "global_step": 153082, "epoch": 911} {"train_loss": -10.14686393737793, "global_step": 153083, "epoch": 911} {"train_loss": -9.966461181640625, "global_step": 153084, "epoch": 911} {"train_loss": -9.38437271118164, "global_step": 153085, "epoch": 911} {"train_loss": -9.900781631469727, "global_step": 153086, "epoch": 911} {"train_loss": -10.572920799255371, "global_step": 153087, "epoch": 911} {"train_loss": -9.506206512451172, "global_step": 153088, "epoch": 911} {"train_loss": -10.545194625854492, "global_step": 153089, "epoch": 911} {"train_loss": -10.024835586547852, "global_step": 153090, "epoch": 911} {"train_loss": -10.495999336242676, "global_step": 153091, "epoch": 911} {"train_loss": -10.433902740478516, "global_step": 153092, "epoch": 911} {"train_loss": -10.571075439453125, "global_step": 153093, "epoch": 911} {"train_loss": -10.635831832885742, "global_step": 153094, "epoch": 911} {"train_loss": -10.571683883666992, "global_step": 153095, "epoch": 911} {"train_loss": -10.636458396911621, "global_step": 153096, "epoch": 911} {"train_loss": -10.528505325317383, "global_step": 153097, "epoch": 911} {"train_loss": -10.684358596801758, "global_step": 153098, "epoch": 911} {"train_loss": -10.364494323730469, "global_step": 153099, "epoch": 911} {"train_loss": -10.690031051635742, "global_step": 153100, "epoch": 911} {"train_loss": -10.635087013244629, "global_step": 153101, "epoch": 911} {"train_loss": -10.628013610839844, "global_step": 153102, "epoch": 911} {"train_loss": -10.608312606811523, "global_step": 153103, "epoch": 911} {"train_loss": -10.564543724060059, "global_step": 153104, "epoch": 911} {"train_loss": -10.876311302185059, "global_step": 153105, "epoch": 911} {"train_loss": -10.689481735229492, "global_step": 153106, "epoch": 911} {"train_loss": -10.666860580444336, "global_step": 153107, "epoch": 911} {"train_loss": -10.474851608276367, "global_step": 153108, "epoch": 911} {"train_loss": -10.561640739440918, "global_step": 153109, "epoch": 911} {"train_loss": -10.742942810058594, "global_step": 153110, "epoch": 911} {"train_loss": -10.649295806884766, "global_step": 153111, "epoch": 911} {"train_loss": -10.585103988647461, "global_step": 153112, "epoch": 911} {"train_loss": -10.887591361999512, "global_step": 153113, "epoch": 911} {"train_loss": -10.856756210327148, "global_step": 153114, "epoch": 911} {"train_loss": -10.742212295532227, "global_step": 153115, "epoch": 911} {"train_loss": -10.856815338134766, "global_step": 153116, "epoch": 911} {"train_loss": -10.608579635620117, "global_step": 153117, "epoch": 911} {"train_loss": -10.759122848510742, "global_step": 153118, "epoch": 911} {"train_loss": -11.107053756713867, "global_step": 153119, "epoch": 911} {"train_loss": -10.909849166870117, "global_step": 153120, "epoch": 911} {"train_loss": -10.85189151763916, "global_step": 153121, "epoch": 911} {"train_loss": -11.030498504638672, "global_step": 153122, "epoch": 911} {"train_loss": -10.910037994384766, "global_step": 153123, "epoch": 911} {"train_loss": -10.939286231994629, "global_step": 153124, "epoch": 911} {"train_loss": -10.888774871826172, "global_step": 153125, "epoch": 911} {"train_loss": -10.958699226379395, "global_step": 153126, "epoch": 911} {"train_loss": -10.950958251953125, "global_step": 153127, "epoch": 911} {"train_loss": -10.778672218322754, "global_step": 153128, "epoch": 911} {"train_loss": -10.731401443481445, "global_step": 153129, "epoch": 911} {"train_loss": -10.832169532775879, "global_step": 153130, "epoch": 911} {"train_loss": -10.875658988952637, "global_step": 153131, "epoch": 911} {"train_loss": -10.911714553833008, "global_step": 153132, "epoch": 911} {"train_loss": -11.068809509277344, "global_step": 153133, "epoch": 911} {"train_loss": -10.8026704788208, "global_step": 153134, "epoch": 911} {"train_loss": -10.982623100280762, "global_step": 153135, "epoch": 911} {"train_loss": -10.93303108215332, "global_step": 153136, "epoch": 911} {"train_loss": -10.72166919708252, "global_step": 153137, "epoch": 911} {"train_loss": -11.157926559448242, "global_step": 153138, "epoch": 911} {"train_loss": -10.910025596618652, "global_step": 153139, "epoch": 911} {"train_loss": -11.00604248046875, "global_step": 153140, "epoch": 911} {"train_loss": -11.10896110534668, "global_step": 153141, "epoch": 911} {"train_loss": -10.706583023071289, "global_step": 153142, "epoch": 911} {"train_loss": -10.926897048950195, "global_step": 153143, "epoch": 911} {"train_loss": -10.800989151000977, "global_step": 153144, "epoch": 911} {"train_loss": -10.745081901550293, "global_step": 153145, "epoch": 911} {"train_loss": -10.9436674118042, "global_step": 153146, "epoch": 911} {"train_loss": -10.844108581542969, "global_step": 153147, "epoch": 911} {"train_loss": -10.437341690063477, "global_step": 153148, "epoch": 911} {"train_loss": -10.912578582763672, "global_step": 153149, "epoch": 911} {"train_loss": -10.911084175109863, "global_step": 153150, "epoch": 911} {"train_loss": -10.875444412231445, "global_step": 153151, "epoch": 911} {"train_loss": -10.655023574829102, "global_step": 153152, "epoch": 911} {"train_loss": -10.813097953796387, "global_step": 153153, "epoch": 911} {"train_loss": -10.923454284667969, "global_step": 153154, "epoch": 911} {"train_loss": -10.690374374389648, "global_step": 153155, "epoch": 911} {"train_loss": -10.695745468139648, "global_step": 153156, "epoch": 911} {"train_loss": -11.056396484375, "global_step": 153157, "epoch": 911} {"train_loss": -10.601801872253418, "global_step": 153158, "epoch": 911} {"train_loss": -10.475797653198242, "global_step": 153159, "epoch": 911} {"train_loss": -10.889708518981934, "global_step": 153160, "epoch": 911} {"train_loss": -10.584562301635742, "global_step": 153161, "epoch": 911} {"train_loss": -11.122156143188477, "global_step": 153162, "epoch": 911} {"train_loss": -10.764734268188477, "global_step": 153163, "epoch": 911} {"train_loss": -10.804243087768555, "global_step": 153164, "epoch": 911} {"train_loss": -10.690507888793945, "global_step": 153165, "epoch": 911} {"train_loss": -10.76019287109375, "global_step": 153166, "epoch": 911} {"train_loss": -11.170406341552734, "global_step": 153167, "epoch": 911} {"train_loss": -10.730428695678711, "global_step": 153168, "epoch": 911} {"train_loss": -10.909403800964355, "global_step": 153169, "epoch": 911} {"train_loss": -10.774085998535156, "global_step": 153170, "epoch": 911} {"train_loss": -10.982828140258789, "global_step": 153171, "epoch": 911} {"train_loss": -10.636649131774902, "global_step": 153172, "epoch": 911} {"train_loss": -10.998703002929688, "global_step": 153173, "epoch": 911} {"train_loss": -10.41000747680664, "global_step": 153174, "epoch": 911} {"train_loss": -10.804607391357422, "global_step": 153175, "epoch": 911} {"train_loss": -10.473021507263184, "global_step": 153176, "epoch": 911} {"train_loss": -10.506004333496094, "global_step": 153177, "epoch": 911} {"train_loss": -10.847265243530273, "global_step": 153178, "epoch": 911} {"train_loss": -10.57229995727539, "global_step": 153179, "epoch": 911} {"train_loss": -10.96159553527832, "global_step": 153180, "epoch": 911} {"train_loss": -10.535013198852539, "global_step": 153181, "epoch": 911} {"train_loss": -10.69127082824707, "global_step": 153182, "epoch": 911} {"train_loss": -10.434789657592773, "global_step": 153183, "epoch": 911} {"train_loss": -10.646293640136719, "global_step": 153184, "epoch": 911} {"train_loss": -10.909839630126953, "global_step": 153185, "epoch": 911} {"train_loss": -10.280118942260742, "global_step": 153186, "epoch": 911} {"train_loss": -10.795051574707031, "global_step": 153187, "epoch": 911} {"train_loss": -10.363597869873047, "global_step": 153188, "epoch": 911} {"train_loss": -10.23386287689209, "global_step": 153189, "epoch": 911} {"train_loss": -10.564085006713867, "global_step": 153190, "epoch": 911} {"train_loss": -10.5256986618042, "global_step": 153191, "epoch": 911} {"train_loss": -10.705358505249023, "global_step": 153192, "epoch": 911} {"train_loss": -10.46385383605957, "global_step": 153193, "epoch": 911} {"train_loss": -10.543919563293457, "global_step": 153194, "epoch": 911} {"train_loss": -10.239035606384277, "global_step": 153195, "epoch": 911} {"train_loss": -10.519207000732422, "global_step": 153196, "epoch": 911} {"train_loss": -10.542356491088867, "global_step": 153197, "epoch": 911} {"train_loss": -10.15499210357666, "global_step": 153198, "epoch": 911} {"train_loss": -10.644655227661133, "global_step": 153199, "epoch": 911} {"train_loss": -10.013978004455566, "global_step": 153200, "epoch": 911} {"train_loss": -10.560197830200195, "global_step": 153201, "epoch": 911} {"train_loss": -10.253097534179688, "global_step": 153202, "epoch": 911} {"train_loss": -10.658731460571289, "global_step": 153203, "epoch": 911} {"train_loss": -10.209664344787598, "global_step": 153204, "epoch": 911} {"train_loss": -10.680458068847656, "global_step": 153205, "epoch": 911} {"train_loss": -10.249395370483398, "global_step": 153206, "epoch": 911} {"train_loss": -10.932117462158203, "global_step": 153207, "epoch": 911} {"train_loss": -10.677276611328125, "global_step": 153208, "epoch": 911} {"train_loss": -10.740248680114746, "global_step": 153209, "epoch": 911} {"train_loss": -10.64454174041748, "global_step": 153210, "epoch": 911} {"train_loss": -11.009330749511719, "global_step": 153211, "epoch": 911} {"train_loss": -10.733287811279297, "global_step": 153212, "epoch": 911} {"train_loss": -10.427438735961914, "global_step": 153213, "epoch": 911} {"train_loss": -10.796717643737793, "global_step": 153214, "epoch": 911} {"train_loss": -10.645148816562834, "global_step": 153215, "epoch": 911, "val_loss": 227913.265625} {"train_loss": -10.817706108093262, "global_step": 153216, "epoch": 912} {"train_loss": -10.491838455200195, "global_step": 153217, "epoch": 912} {"train_loss": -10.916753768920898, "global_step": 153218, "epoch": 912} {"train_loss": -10.902637481689453, "global_step": 153219, "epoch": 912} {"train_loss": -10.911684036254883, "global_step": 153220, "epoch": 912} {"train_loss": -11.007243156433105, "global_step": 153221, "epoch": 912} {"train_loss": -10.938447952270508, "global_step": 153222, "epoch": 912} {"train_loss": -10.867599487304688, "global_step": 153223, "epoch": 912} {"train_loss": -10.89886474609375, "global_step": 153224, "epoch": 912} {"train_loss": -10.540632247924805, "global_step": 153225, "epoch": 912} {"train_loss": -11.051761627197266, "global_step": 153226, "epoch": 912} {"train_loss": -10.993302345275879, "global_step": 153227, "epoch": 912} {"train_loss": -10.795872688293457, "global_step": 153228, "epoch": 912} {"train_loss": -11.04644775390625, "global_step": 153229, "epoch": 912} {"train_loss": -11.041708946228027, "global_step": 153230, "epoch": 912} {"train_loss": -10.780075073242188, "global_step": 153231, "epoch": 912} {"train_loss": -10.796228408813477, "global_step": 153232, "epoch": 912} {"train_loss": -11.123538970947266, "global_step": 153233, "epoch": 912} {"train_loss": -10.926591873168945, "global_step": 153234, "epoch": 912} {"train_loss": -10.910150527954102, "global_step": 153235, "epoch": 912} {"train_loss": -11.00015640258789, "global_step": 153236, "epoch": 912} {"train_loss": -11.075594902038574, "global_step": 153237, "epoch": 912} {"train_loss": -10.820968627929688, "global_step": 153238, "epoch": 912} {"train_loss": -10.913251876831055, "global_step": 153239, "epoch": 912} {"train_loss": -11.180766105651855, "global_step": 153240, "epoch": 912} {"train_loss": -10.769771575927734, "global_step": 153241, "epoch": 912} {"train_loss": -11.138981819152832, "global_step": 153242, "epoch": 912} {"train_loss": -10.975040435791016, "global_step": 153243, "epoch": 912} {"train_loss": -11.1279878616333, "global_step": 153244, "epoch": 912} {"train_loss": -11.102513313293457, "global_step": 153245, "epoch": 912} {"train_loss": -11.033841133117676, "global_step": 153246, "epoch": 912} {"train_loss": -11.021355628967285, "global_step": 153247, "epoch": 912} {"train_loss": -10.923476219177246, "global_step": 153248, "epoch": 912} {"train_loss": -10.97195816040039, "global_step": 153249, "epoch": 912} {"train_loss": -10.85173225402832, "global_step": 153250, "epoch": 912} {"train_loss": -10.395492553710938, "global_step": 153251, "epoch": 912} {"train_loss": -11.105195999145508, "global_step": 153252, "epoch": 912} {"train_loss": -10.604713439941406, "global_step": 153253, "epoch": 912} {"train_loss": -10.565685272216797, "global_step": 153254, "epoch": 912} {"train_loss": -10.771455764770508, "global_step": 153255, "epoch": 912} {"train_loss": -11.065254211425781, "global_step": 153256, "epoch": 912} {"train_loss": -11.046677589416504, "global_step": 153257, "epoch": 912} {"train_loss": -11.09292221069336, "global_step": 153258, "epoch": 912} {"train_loss": -10.844125747680664, "global_step": 153259, "epoch": 912} {"train_loss": -10.954486846923828, "global_step": 153260, "epoch": 912} {"train_loss": -11.178787231445312, "global_step": 153261, "epoch": 912} {"train_loss": -11.072306632995605, "global_step": 153262, "epoch": 912} {"train_loss": -10.974491119384766, "global_step": 153263, "epoch": 912} {"train_loss": -10.866059303283691, "global_step": 153264, "epoch": 912} {"train_loss": -11.019244194030762, "global_step": 153265, "epoch": 912} {"train_loss": -11.095966339111328, "global_step": 153266, "epoch": 912} {"train_loss": -11.11898422241211, "global_step": 153267, "epoch": 912} {"train_loss": -10.847969055175781, "global_step": 153268, "epoch": 912} {"train_loss": -11.14873218536377, "global_step": 153269, "epoch": 912} {"train_loss": -10.97642993927002, "global_step": 153270, "epoch": 912} {"train_loss": -10.900755882263184, "global_step": 153271, "epoch": 912} {"train_loss": -10.9056396484375, "global_step": 153272, "epoch": 912} {"train_loss": -11.052273750305176, "global_step": 153273, "epoch": 912} {"train_loss": -10.979843139648438, "global_step": 153274, "epoch": 912} {"train_loss": -11.231663703918457, "global_step": 153275, "epoch": 912} {"train_loss": -10.789525985717773, "global_step": 153276, "epoch": 912} {"train_loss": -10.960088729858398, "global_step": 153277, "epoch": 912} {"train_loss": -11.025599479675293, "global_step": 153278, "epoch": 912} {"train_loss": -10.6307954788208, "global_step": 153279, "epoch": 912} {"train_loss": -10.08708381652832, "global_step": 153280, "epoch": 912} {"train_loss": -10.221502304077148, "global_step": 153281, "epoch": 912} {"train_loss": -10.311796188354492, "global_step": 153282, "epoch": 912} {"train_loss": -9.771967887878418, "global_step": 153283, "epoch": 912} {"train_loss": -10.741230010986328, "global_step": 153284, "epoch": 912} {"train_loss": -10.181678771972656, "global_step": 153285, "epoch": 912} {"train_loss": -9.780460357666016, "global_step": 153286, "epoch": 912} {"train_loss": -10.839473724365234, "global_step": 153287, "epoch": 912} {"train_loss": -9.528718948364258, "global_step": 153288, "epoch": 912} {"train_loss": -10.291030883789062, "global_step": 153289, "epoch": 912} {"train_loss": -10.227580070495605, "global_step": 153290, "epoch": 912} {"train_loss": -9.788463592529297, "global_step": 153291, "epoch": 912} {"train_loss": -10.897039413452148, "global_step": 153292, "epoch": 912} {"train_loss": -10.109624862670898, "global_step": 153293, "epoch": 912} {"train_loss": -10.628718376159668, "global_step": 153294, "epoch": 912} {"train_loss": -10.066709518432617, "global_step": 153295, "epoch": 912} {"train_loss": -10.388105392456055, "global_step": 153296, "epoch": 912} {"train_loss": -10.466391563415527, "global_step": 153297, "epoch": 912} {"train_loss": -9.879264831542969, "global_step": 153298, "epoch": 912} {"train_loss": -10.609527587890625, "global_step": 153299, "epoch": 912} {"train_loss": -9.729448318481445, "global_step": 153300, "epoch": 912} {"train_loss": -10.62246322631836, "global_step": 153301, "epoch": 912} {"train_loss": -10.37232494354248, "global_step": 153302, "epoch": 912} {"train_loss": -10.51763916015625, "global_step": 153303, "epoch": 912} {"train_loss": -10.318323135375977, "global_step": 153304, "epoch": 912} {"train_loss": -10.731470108032227, "global_step": 153305, "epoch": 912} {"train_loss": -10.55008602142334, "global_step": 153306, "epoch": 912} {"train_loss": -10.5972261428833, "global_step": 153307, "epoch": 912} {"train_loss": -10.77875804901123, "global_step": 153308, "epoch": 912} {"train_loss": -10.538705825805664, "global_step": 153309, "epoch": 912} {"train_loss": -10.17697811126709, "global_step": 153310, "epoch": 912} {"train_loss": -10.511894226074219, "global_step": 153311, "epoch": 912} {"train_loss": -10.670255661010742, "global_step": 153312, "epoch": 912} {"train_loss": -10.7506742477417, "global_step": 153313, "epoch": 912} {"train_loss": -10.727274894714355, "global_step": 153314, "epoch": 912} {"train_loss": -10.535367965698242, "global_step": 153315, "epoch": 912} {"train_loss": -10.835580825805664, "global_step": 153316, "epoch": 912} {"train_loss": -10.451897621154785, "global_step": 153317, "epoch": 912} {"train_loss": -10.820796012878418, "global_step": 153318, "epoch": 912} {"train_loss": -10.621524810791016, "global_step": 153319, "epoch": 912} {"train_loss": -10.823990821838379, "global_step": 153320, "epoch": 912} {"train_loss": -10.872587203979492, "global_step": 153321, "epoch": 912} {"train_loss": -10.735406875610352, "global_step": 153322, "epoch": 912} {"train_loss": -10.908171653747559, "global_step": 153323, "epoch": 912} {"train_loss": -10.68988037109375, "global_step": 153324, "epoch": 912} {"train_loss": -10.991898536682129, "global_step": 153325, "epoch": 912} {"train_loss": -10.818750381469727, "global_step": 153326, "epoch": 912} {"train_loss": -10.865792274475098, "global_step": 153327, "epoch": 912} {"train_loss": -10.950711250305176, "global_step": 153328, "epoch": 912} {"train_loss": -10.778148651123047, "global_step": 153329, "epoch": 912} {"train_loss": -10.999107360839844, "global_step": 153330, "epoch": 912} {"train_loss": -11.014505386352539, "global_step": 153331, "epoch": 912} {"train_loss": -10.682218551635742, "global_step": 153332, "epoch": 912} {"train_loss": -11.053826332092285, "global_step": 153333, "epoch": 912} {"train_loss": -10.644376754760742, "global_step": 153334, "epoch": 912} {"train_loss": -11.14329719543457, "global_step": 153335, "epoch": 912} {"train_loss": -10.927173614501953, "global_step": 153336, "epoch": 912} {"train_loss": -11.243459701538086, "global_step": 153337, "epoch": 912} {"train_loss": -10.84077262878418, "global_step": 153338, "epoch": 912} {"train_loss": -11.229470252990723, "global_step": 153339, "epoch": 912} {"train_loss": -10.858030319213867, "global_step": 153340, "epoch": 912} {"train_loss": -11.137325286865234, "global_step": 153341, "epoch": 912} {"train_loss": -10.630268096923828, "global_step": 153342, "epoch": 912} {"train_loss": -10.812518119812012, "global_step": 153343, "epoch": 912} {"train_loss": -10.924371719360352, "global_step": 153344, "epoch": 912} {"train_loss": -10.784481048583984, "global_step": 153345, "epoch": 912} {"train_loss": -11.029693603515625, "global_step": 153346, "epoch": 912} {"train_loss": -10.799310684204102, "global_step": 153347, "epoch": 912} {"train_loss": -10.594932556152344, "global_step": 153348, "epoch": 912} {"train_loss": -10.905315399169922, "global_step": 153349, "epoch": 912} {"train_loss": -10.724748611450195, "global_step": 153350, "epoch": 912} {"train_loss": -10.017332077026367, "global_step": 153351, "epoch": 912} {"train_loss": -10.940653800964355, "global_step": 153352, "epoch": 912} {"train_loss": -10.66796875, "global_step": 153353, "epoch": 912} {"train_loss": -10.544233322143555, "global_step": 153354, "epoch": 912} {"train_loss": -11.009212493896484, "global_step": 153355, "epoch": 912} {"train_loss": -10.633251190185547, "global_step": 153356, "epoch": 912} {"train_loss": -10.739645957946777, "global_step": 153357, "epoch": 912} {"train_loss": -10.539880752563477, "global_step": 153358, "epoch": 912} {"train_loss": -9.782512664794922, "global_step": 153359, "epoch": 912} {"train_loss": -10.509785652160645, "global_step": 153360, "epoch": 912} {"train_loss": -10.026920318603516, "global_step": 153361, "epoch": 912} {"train_loss": -9.192142486572266, "global_step": 153362, "epoch": 912} {"train_loss": -10.595921516418457, "global_step": 153363, "epoch": 912} {"train_loss": -10.521693229675293, "global_step": 153364, "epoch": 912} {"train_loss": -10.290201187133789, "global_step": 153365, "epoch": 912} {"train_loss": -10.340463638305664, "global_step": 153366, "epoch": 912} {"train_loss": -10.180049896240234, "global_step": 153367, "epoch": 912} {"train_loss": -10.39852523803711, "global_step": 153368, "epoch": 912} {"train_loss": -10.159130096435547, "global_step": 153369, "epoch": 912} {"train_loss": -9.473886489868164, "global_step": 153370, "epoch": 912} {"train_loss": -10.367359161376953, "global_step": 153371, "epoch": 912} {"train_loss": -9.970970153808594, "global_step": 153372, "epoch": 912} {"train_loss": -10.018821716308594, "global_step": 153373, "epoch": 912} {"train_loss": -10.32239818572998, "global_step": 153374, "epoch": 912} {"train_loss": -9.940229415893555, "global_step": 153375, "epoch": 912} {"train_loss": -10.018243789672852, "global_step": 153376, "epoch": 912} {"train_loss": -10.069368362426758, "global_step": 153377, "epoch": 912} {"train_loss": -9.725088119506836, "global_step": 153378, "epoch": 912} {"train_loss": -10.049463272094727, "global_step": 153379, "epoch": 912} {"train_loss": -9.977585792541504, "global_step": 153380, "epoch": 912} {"train_loss": -10.185979843139648, "global_step": 153381, "epoch": 912} {"train_loss": -10.21541690826416, "global_step": 153382, "epoch": 912} {"train_loss": -10.660505641074408, "global_step": 153383, "epoch": 912, "val_loss": 231693.25} {"train_loss": -9.684673309326172, "global_step": 153384, "epoch": 913} {"train_loss": -10.465733528137207, "global_step": 153385, "epoch": 913} {"train_loss": -10.345132827758789, "global_step": 153386, "epoch": 913} {"train_loss": -10.398130416870117, "global_step": 153387, "epoch": 913} {"train_loss": -10.430461883544922, "global_step": 153388, "epoch": 913} {"train_loss": -10.247465133666992, "global_step": 153389, "epoch": 913} {"train_loss": -10.650851249694824, "global_step": 153390, "epoch": 913} {"train_loss": -10.195320129394531, "global_step": 153391, "epoch": 913} {"train_loss": -10.220893859863281, "global_step": 153392, "epoch": 913} {"train_loss": -10.694929122924805, "global_step": 153393, "epoch": 913} {"train_loss": -10.069089889526367, "global_step": 153394, "epoch": 913} {"train_loss": -10.388410568237305, "global_step": 153395, "epoch": 913} {"train_loss": -10.609111785888672, "global_step": 153396, "epoch": 913} {"train_loss": -10.3680419921875, "global_step": 153397, "epoch": 913} {"train_loss": -10.582054138183594, "global_step": 153398, "epoch": 913} {"train_loss": -10.528097152709961, "global_step": 153399, "epoch": 913} {"train_loss": -10.423778533935547, "global_step": 153400, "epoch": 913} {"train_loss": -10.764469146728516, "global_step": 153401, "epoch": 913} {"train_loss": -10.59929084777832, "global_step": 153402, "epoch": 913} {"train_loss": -10.782392501831055, "global_step": 153403, "epoch": 913} {"train_loss": -10.71062183380127, "global_step": 153404, "epoch": 913} {"train_loss": -10.798834800720215, "global_step": 153405, "epoch": 913} {"train_loss": -10.685824394226074, "global_step": 153406, "epoch": 913} {"train_loss": -10.833616256713867, "global_step": 153407, "epoch": 913} {"train_loss": -10.881098747253418, "global_step": 153408, "epoch": 913} {"train_loss": -10.957618713378906, "global_step": 153409, "epoch": 913} {"train_loss": -10.983598709106445, "global_step": 153410, "epoch": 913} {"train_loss": -10.794761657714844, "global_step": 153411, "epoch": 913} {"train_loss": -11.131438255310059, "global_step": 153412, "epoch": 913} {"train_loss": -10.805032730102539, "global_step": 153413, "epoch": 913} {"train_loss": -11.081327438354492, "global_step": 153414, "epoch": 913} {"train_loss": -10.935235977172852, "global_step": 153415, "epoch": 913} {"train_loss": -11.000114440917969, "global_step": 153416, "epoch": 913} {"train_loss": -11.219258308410645, "global_step": 153417, "epoch": 913} {"train_loss": -11.038673400878906, "global_step": 153418, "epoch": 913} {"train_loss": -11.203511238098145, "global_step": 153419, "epoch": 913} {"train_loss": -10.915628433227539, "global_step": 153420, "epoch": 913} {"train_loss": -10.698784828186035, "global_step": 153421, "epoch": 913} {"train_loss": -10.888261795043945, "global_step": 153422, "epoch": 913} {"train_loss": -10.14715576171875, "global_step": 153423, "epoch": 913} {"train_loss": -11.040472030639648, "global_step": 153424, "epoch": 913} {"train_loss": -10.722352981567383, "global_step": 153425, "epoch": 913} {"train_loss": -10.023502349853516, "global_step": 153426, "epoch": 913} {"train_loss": -10.455056190490723, "global_step": 153427, "epoch": 913} {"train_loss": -10.614535331726074, "global_step": 153428, "epoch": 913} {"train_loss": -10.446385383605957, "global_step": 153429, "epoch": 913} {"train_loss": -10.497427940368652, "global_step": 153430, "epoch": 913} {"train_loss": -10.660343170166016, "global_step": 153431, "epoch": 913} {"train_loss": -10.580020904541016, "global_step": 153432, "epoch": 913} {"train_loss": -11.010488510131836, "global_step": 153433, "epoch": 913} {"train_loss": -10.76944351196289, "global_step": 153434, "epoch": 913} {"train_loss": -10.92441177368164, "global_step": 153435, "epoch": 913} {"train_loss": -10.851819038391113, "global_step": 153436, "epoch": 913} {"train_loss": -10.971525192260742, "global_step": 153437, "epoch": 913} {"train_loss": -11.030183792114258, "global_step": 153438, "epoch": 913} {"train_loss": -10.421243667602539, "global_step": 153439, "epoch": 913} {"train_loss": -10.938468933105469, "global_step": 153440, "epoch": 913} {"train_loss": -10.66790771484375, "global_step": 153441, "epoch": 913} {"train_loss": -10.967281341552734, "global_step": 153442, "epoch": 913} {"train_loss": -10.762760162353516, "global_step": 153443, "epoch": 913} {"train_loss": -10.898225784301758, "global_step": 153444, "epoch": 913} {"train_loss": -10.745257377624512, "global_step": 153445, "epoch": 913} {"train_loss": -10.874725341796875, "global_step": 153446, "epoch": 913} {"train_loss": -10.535215377807617, "global_step": 153447, "epoch": 913} {"train_loss": -10.572994232177734, "global_step": 153448, "epoch": 913} {"train_loss": -10.711699485778809, "global_step": 153449, "epoch": 913} {"train_loss": -10.698881149291992, "global_step": 153450, "epoch": 913} {"train_loss": -10.960204124450684, "global_step": 153451, "epoch": 913} {"train_loss": -10.387144088745117, "global_step": 153452, "epoch": 913} {"train_loss": -10.904754638671875, "global_step": 153453, "epoch": 913} {"train_loss": -10.362520217895508, "global_step": 153454, "epoch": 913} {"train_loss": -10.801458358764648, "global_step": 153455, "epoch": 913} {"train_loss": -10.68491268157959, "global_step": 153456, "epoch": 913} {"train_loss": -10.201045989990234, "global_step": 153457, "epoch": 913} {"train_loss": -11.084976196289062, "global_step": 153458, "epoch": 913} {"train_loss": -10.410712242126465, "global_step": 153459, "epoch": 913} {"train_loss": -10.517632484436035, "global_step": 153460, "epoch": 913} {"train_loss": -10.46957015991211, "global_step": 153461, "epoch": 913} {"train_loss": -10.461116790771484, "global_step": 153462, "epoch": 913} {"train_loss": -10.676895141601562, "global_step": 153463, "epoch": 913} {"train_loss": -10.252050399780273, "global_step": 153464, "epoch": 913} {"train_loss": -10.914861679077148, "global_step": 153465, "epoch": 913} {"train_loss": -10.874505996704102, "global_step": 153466, "epoch": 913} {"train_loss": -10.699188232421875, "global_step": 153467, "epoch": 913} {"train_loss": -10.836045265197754, "global_step": 153468, "epoch": 913} {"train_loss": -10.883939743041992, "global_step": 153469, "epoch": 913} {"train_loss": -10.6741361618042, "global_step": 153470, "epoch": 913} {"train_loss": -10.900339126586914, "global_step": 153471, "epoch": 913} {"train_loss": -10.953694343566895, "global_step": 153472, "epoch": 913} {"train_loss": -10.689451217651367, "global_step": 153473, "epoch": 913} {"train_loss": -10.764267921447754, "global_step": 153474, "epoch": 913} {"train_loss": -10.859025001525879, "global_step": 153475, "epoch": 913} {"train_loss": -11.00677490234375, "global_step": 153476, "epoch": 913} {"train_loss": -10.463529586791992, "global_step": 153477, "epoch": 913} {"train_loss": -11.01472282409668, "global_step": 153478, "epoch": 913} {"train_loss": -11.045137405395508, "global_step": 153479, "epoch": 913} {"train_loss": -10.632933616638184, "global_step": 153480, "epoch": 913} {"train_loss": -11.00212287902832, "global_step": 153481, "epoch": 913} {"train_loss": -10.839306831359863, "global_step": 153482, "epoch": 913} {"train_loss": -10.839202880859375, "global_step": 153483, "epoch": 913} {"train_loss": -10.688579559326172, "global_step": 153484, "epoch": 913} {"train_loss": -10.893631935119629, "global_step": 153485, "epoch": 913} {"train_loss": -10.808577537536621, "global_step": 153486, "epoch": 913} {"train_loss": -10.72811222076416, "global_step": 153487, "epoch": 913} {"train_loss": -10.641565322875977, "global_step": 153488, "epoch": 913} {"train_loss": -10.740617752075195, "global_step": 153489, "epoch": 913} {"train_loss": -10.635005950927734, "global_step": 153490, "epoch": 913} {"train_loss": -10.481596946716309, "global_step": 153491, "epoch": 913} {"train_loss": -10.831337928771973, "global_step": 153492, "epoch": 913} {"train_loss": -10.607945442199707, "global_step": 153493, "epoch": 913} {"train_loss": -10.875763893127441, "global_step": 153494, "epoch": 913} {"train_loss": -10.85399055480957, "global_step": 153495, "epoch": 913} {"train_loss": -10.486042022705078, "global_step": 153496, "epoch": 913} {"train_loss": -10.953451156616211, "global_step": 153497, "epoch": 913} {"train_loss": -10.565145492553711, "global_step": 153498, "epoch": 913} {"train_loss": -10.967893600463867, "global_step": 153499, "epoch": 913} {"train_loss": -10.930774688720703, "global_step": 153500, "epoch": 913} {"train_loss": -10.663496017456055, "global_step": 153501, "epoch": 913} {"train_loss": -11.037538528442383, "global_step": 153502, "epoch": 913} {"train_loss": -10.482927322387695, "global_step": 153503, "epoch": 913} {"train_loss": -10.92227554321289, "global_step": 153504, "epoch": 913} {"train_loss": -10.495780944824219, "global_step": 153505, "epoch": 913} {"train_loss": -10.262166023254395, "global_step": 153506, "epoch": 913} {"train_loss": -10.904635429382324, "global_step": 153507, "epoch": 913} {"train_loss": -10.894402503967285, "global_step": 153508, "epoch": 913} {"train_loss": -10.78785228729248, "global_step": 153509, "epoch": 913} {"train_loss": -11.06423568725586, "global_step": 153510, "epoch": 913} {"train_loss": -10.873634338378906, "global_step": 153511, "epoch": 913} {"train_loss": -10.867945671081543, "global_step": 153512, "epoch": 913} {"train_loss": -10.861778259277344, "global_step": 153513, "epoch": 913} {"train_loss": -11.19472599029541, "global_step": 153514, "epoch": 913} {"train_loss": -10.780363082885742, "global_step": 153515, "epoch": 913} {"train_loss": -10.960477828979492, "global_step": 153516, "epoch": 913} {"train_loss": -10.973669052124023, "global_step": 153517, "epoch": 913} {"train_loss": -10.800402641296387, "global_step": 153518, "epoch": 913} {"train_loss": -10.91247844696045, "global_step": 153519, "epoch": 913} {"train_loss": -10.969463348388672, "global_step": 153520, "epoch": 913} {"train_loss": -10.837165832519531, "global_step": 153521, "epoch": 913} {"train_loss": -10.971933364868164, "global_step": 153522, "epoch": 913} {"train_loss": -10.656417846679688, "global_step": 153523, "epoch": 913} {"train_loss": -10.152982711791992, "global_step": 153524, "epoch": 913} {"train_loss": -10.797126770019531, "global_step": 153525, "epoch": 913} {"train_loss": -10.524471282958984, "global_step": 153526, "epoch": 913} {"train_loss": -10.411476135253906, "global_step": 153527, "epoch": 913} {"train_loss": -10.673961639404297, "global_step": 153528, "epoch": 913} {"train_loss": -9.728337287902832, "global_step": 153529, "epoch": 913} {"train_loss": -10.800222396850586, "global_step": 153530, "epoch": 913} {"train_loss": -10.107691764831543, "global_step": 153531, "epoch": 913} {"train_loss": -10.151098251342773, "global_step": 153532, "epoch": 913} {"train_loss": -10.773649215698242, "global_step": 153533, "epoch": 913} {"train_loss": -9.74852180480957, "global_step": 153534, "epoch": 913} {"train_loss": -10.934441566467285, "global_step": 153535, "epoch": 913} {"train_loss": -10.471179962158203, "global_step": 153536, "epoch": 913} {"train_loss": -10.256492614746094, "global_step": 153537, "epoch": 913} {"train_loss": -10.57042121887207, "global_step": 153538, "epoch": 913} {"train_loss": -10.565519332885742, "global_step": 153539, "epoch": 913} {"train_loss": -10.670942306518555, "global_step": 153540, "epoch": 913} {"train_loss": -10.697893142700195, "global_step": 153541, "epoch": 913} {"train_loss": -10.261240005493164, "global_step": 153542, "epoch": 913} {"train_loss": -10.767004013061523, "global_step": 153543, "epoch": 913} {"train_loss": -10.082256317138672, "global_step": 153544, "epoch": 913} {"train_loss": -10.906664848327637, "global_step": 153545, "epoch": 913} {"train_loss": -10.72761058807373, "global_step": 153546, "epoch": 913} {"train_loss": -10.493207931518555, "global_step": 153547, "epoch": 913} {"train_loss": -10.707902908325195, "global_step": 153548, "epoch": 913} {"train_loss": -10.37661075592041, "global_step": 153549, "epoch": 913} {"train_loss": -10.792928695678711, "global_step": 153550, "epoch": 913} {"train_loss": -10.685730167797633, "global_step": 153551, "epoch": 913, "val_loss": 231734.0625} {"train_loss": -10.483724594116211, "global_step": 153552, "epoch": 914} {"train_loss": -10.570707321166992, "global_step": 153553, "epoch": 914} {"train_loss": -10.820327758789062, "global_step": 153554, "epoch": 914} {"train_loss": -10.478630065917969, "global_step": 153555, "epoch": 914} {"train_loss": -10.7752685546875, "global_step": 153556, "epoch": 914} {"train_loss": -10.53732681274414, "global_step": 153557, "epoch": 914} {"train_loss": -10.758947372436523, "global_step": 153558, "epoch": 914} {"train_loss": -10.898536682128906, "global_step": 153559, "epoch": 914} {"train_loss": -10.868890762329102, "global_step": 153560, "epoch": 914} {"train_loss": -10.914051055908203, "global_step": 153561, "epoch": 914} {"train_loss": -10.665855407714844, "global_step": 153562, "epoch": 914} {"train_loss": -10.833706855773926, "global_step": 153563, "epoch": 914} {"train_loss": -10.633097648620605, "global_step": 153564, "epoch": 914} {"train_loss": -11.100349426269531, "global_step": 153565, "epoch": 914} {"train_loss": -10.749317169189453, "global_step": 153566, "epoch": 914} {"train_loss": -10.851236343383789, "global_step": 153567, "epoch": 914} {"train_loss": -10.525699615478516, "global_step": 153568, "epoch": 914} {"train_loss": -10.864175796508789, "global_step": 153569, "epoch": 914} {"train_loss": -10.783740997314453, "global_step": 153570, "epoch": 914} {"train_loss": -10.787962913513184, "global_step": 153571, "epoch": 914} {"train_loss": -10.950652122497559, "global_step": 153572, "epoch": 914} {"train_loss": -10.780176162719727, "global_step": 153573, "epoch": 914} {"train_loss": -10.900602340698242, "global_step": 153574, "epoch": 914} {"train_loss": -10.851819038391113, "global_step": 153575, "epoch": 914} {"train_loss": -11.127013206481934, "global_step": 153576, "epoch": 914} {"train_loss": -10.842080116271973, "global_step": 153577, "epoch": 914} {"train_loss": -10.750617980957031, "global_step": 153578, "epoch": 914} {"train_loss": -10.954024314880371, "global_step": 153579, "epoch": 914} {"train_loss": -11.177014350891113, "global_step": 153580, "epoch": 914} {"train_loss": -10.837366104125977, "global_step": 153581, "epoch": 914} {"train_loss": -11.208060264587402, "global_step": 153582, "epoch": 914} {"train_loss": -10.951042175292969, "global_step": 153583, "epoch": 914} {"train_loss": -11.027514457702637, "global_step": 153584, "epoch": 914} {"train_loss": -11.116886138916016, "global_step": 153585, "epoch": 914} {"train_loss": -11.34174919128418, "global_step": 153586, "epoch": 914} {"train_loss": -10.757539749145508, "global_step": 153587, "epoch": 914} {"train_loss": -11.189018249511719, "global_step": 153588, "epoch": 914} {"train_loss": -11.131203651428223, "global_step": 153589, "epoch": 914} {"train_loss": -10.86397933959961, "global_step": 153590, "epoch": 914} {"train_loss": -10.818085670471191, "global_step": 153591, "epoch": 914} {"train_loss": -11.121368408203125, "global_step": 153592, "epoch": 914} {"train_loss": -11.127933502197266, "global_step": 153593, "epoch": 914} {"train_loss": -10.764004707336426, "global_step": 153594, "epoch": 914} {"train_loss": -10.944683074951172, "global_step": 153595, "epoch": 914} {"train_loss": -11.037939071655273, "global_step": 153596, "epoch": 914} {"train_loss": -10.397573471069336, "global_step": 153597, "epoch": 914} {"train_loss": -10.912153244018555, "global_step": 153598, "epoch": 914} {"train_loss": -10.448514938354492, "global_step": 153599, "epoch": 914} {"train_loss": -9.907867431640625, "global_step": 153600, "epoch": 914} {"train_loss": -10.69455337524414, "global_step": 153601, "epoch": 914} {"train_loss": -9.645933151245117, "global_step": 153602, "epoch": 914} {"train_loss": -9.889627456665039, "global_step": 153603, "epoch": 914} {"train_loss": -10.09376335144043, "global_step": 153604, "epoch": 914} {"train_loss": -9.302362442016602, "global_step": 153605, "epoch": 914} {"train_loss": -9.785490036010742, "global_step": 153606, "epoch": 914} {"train_loss": -10.12368106842041, "global_step": 153607, "epoch": 914} {"train_loss": -9.846217155456543, "global_step": 153608, "epoch": 914} {"train_loss": -10.71395492553711, "global_step": 153609, "epoch": 914} {"train_loss": -10.241276741027832, "global_step": 153610, "epoch": 914} {"train_loss": -10.395537376403809, "global_step": 153611, "epoch": 914} {"train_loss": -9.862114906311035, "global_step": 153612, "epoch": 914} {"train_loss": -10.330028533935547, "global_step": 153613, "epoch": 914} {"train_loss": -9.507766723632812, "global_step": 153614, "epoch": 914} {"train_loss": -10.55286979675293, "global_step": 153615, "epoch": 914} {"train_loss": -10.177513122558594, "global_step": 153616, "epoch": 914} {"train_loss": -10.165512084960938, "global_step": 153617, "epoch": 914} {"train_loss": -10.253301620483398, "global_step": 153618, "epoch": 914} {"train_loss": -10.242715835571289, "global_step": 153619, "epoch": 914} {"train_loss": -10.235223770141602, "global_step": 153620, "epoch": 914} {"train_loss": -10.742745399475098, "global_step": 153621, "epoch": 914} {"train_loss": -9.812684059143066, "global_step": 153622, "epoch": 914} {"train_loss": -10.368513107299805, "global_step": 153623, "epoch": 914} {"train_loss": -10.214279174804688, "global_step": 153624, "epoch": 914} {"train_loss": -10.404775619506836, "global_step": 153625, "epoch": 914} {"train_loss": -10.558584213256836, "global_step": 153626, "epoch": 914} {"train_loss": -10.351693153381348, "global_step": 153627, "epoch": 914} {"train_loss": -10.35552978515625, "global_step": 153628, "epoch": 914} {"train_loss": -10.407499313354492, "global_step": 153629, "epoch": 914} {"train_loss": -10.602694511413574, "global_step": 153630, "epoch": 914} {"train_loss": -10.121732711791992, "global_step": 153631, "epoch": 914} {"train_loss": -10.858137130737305, "global_step": 153632, "epoch": 914} {"train_loss": -10.6004638671875, "global_step": 153633, "epoch": 914} {"train_loss": -10.73114013671875, "global_step": 153634, "epoch": 914} {"train_loss": -10.824943542480469, "global_step": 153635, "epoch": 914} {"train_loss": -10.792228698730469, "global_step": 153636, "epoch": 914} {"train_loss": -10.815240859985352, "global_step": 153637, "epoch": 914} {"train_loss": -10.791116714477539, "global_step": 153638, "epoch": 914} {"train_loss": -10.798564910888672, "global_step": 153639, "epoch": 914} {"train_loss": -10.734661102294922, "global_step": 153640, "epoch": 914} {"train_loss": -11.014108657836914, "global_step": 153641, "epoch": 914} {"train_loss": -10.850564002990723, "global_step": 153642, "epoch": 914} {"train_loss": -11.055387496948242, "global_step": 153643, "epoch": 914} {"train_loss": -10.946346282958984, "global_step": 153644, "epoch": 914} {"train_loss": -10.769206047058105, "global_step": 153645, "epoch": 914} {"train_loss": -10.902135848999023, "global_step": 153646, "epoch": 914} {"train_loss": -11.072619438171387, "global_step": 153647, "epoch": 914} {"train_loss": -10.871434211730957, "global_step": 153648, "epoch": 914} {"train_loss": -10.706188201904297, "global_step": 153649, "epoch": 914} {"train_loss": -10.951560974121094, "global_step": 153650, "epoch": 914} {"train_loss": -10.88570785522461, "global_step": 153651, "epoch": 914} {"train_loss": -10.976043701171875, "global_step": 153652, "epoch": 914} {"train_loss": -10.738882064819336, "global_step": 153653, "epoch": 914} {"train_loss": -11.042341232299805, "global_step": 153654, "epoch": 914} {"train_loss": -10.55345344543457, "global_step": 153655, "epoch": 914} {"train_loss": -10.730179786682129, "global_step": 153656, "epoch": 914} {"train_loss": -11.161709785461426, "global_step": 153657, "epoch": 914} {"train_loss": -10.621859550476074, "global_step": 153658, "epoch": 914} {"train_loss": -11.111360549926758, "global_step": 153659, "epoch": 914} {"train_loss": -10.791202545166016, "global_step": 153660, "epoch": 914} {"train_loss": -10.855672836303711, "global_step": 153661, "epoch": 914} {"train_loss": -10.977957725524902, "global_step": 153662, "epoch": 914} {"train_loss": -11.188919067382812, "global_step": 153663, "epoch": 914} {"train_loss": -10.862884521484375, "global_step": 153664, "epoch": 914} {"train_loss": -10.92724609375, "global_step": 153665, "epoch": 914} {"train_loss": -10.905572891235352, "global_step": 153666, "epoch": 914} {"train_loss": -11.237527847290039, "global_step": 153667, "epoch": 914} {"train_loss": -10.72653579711914, "global_step": 153668, "epoch": 914} {"train_loss": -10.907369613647461, "global_step": 153669, "epoch": 914} {"train_loss": -11.130352020263672, "global_step": 153670, "epoch": 914} {"train_loss": -10.835333824157715, "global_step": 153671, "epoch": 914} {"train_loss": -10.830117225646973, "global_step": 153672, "epoch": 914} {"train_loss": -10.818510055541992, "global_step": 153673, "epoch": 914} {"train_loss": -10.964643478393555, "global_step": 153674, "epoch": 914} {"train_loss": -10.412138938903809, "global_step": 153675, "epoch": 914} {"train_loss": -10.375528335571289, "global_step": 153676, "epoch": 914} {"train_loss": -11.02845573425293, "global_step": 153677, "epoch": 914} {"train_loss": -10.613842010498047, "global_step": 153678, "epoch": 914} {"train_loss": -10.492740631103516, "global_step": 153679, "epoch": 914} {"train_loss": -10.828033447265625, "global_step": 153680, "epoch": 914} {"train_loss": -10.768780708312988, "global_step": 153681, "epoch": 914} {"train_loss": -10.623237609863281, "global_step": 153682, "epoch": 914} {"train_loss": -10.716939926147461, "global_step": 153683, "epoch": 914} {"train_loss": -10.772632598876953, "global_step": 153684, "epoch": 914} {"train_loss": -10.732303619384766, "global_step": 153685, "epoch": 914} {"train_loss": -10.563377380371094, "global_step": 153686, "epoch": 914} {"train_loss": -10.75870132446289, "global_step": 153687, "epoch": 914} {"train_loss": -10.626504898071289, "global_step": 153688, "epoch": 914} {"train_loss": -10.43157958984375, "global_step": 153689, "epoch": 914} {"train_loss": -10.114502906799316, "global_step": 153690, "epoch": 914} {"train_loss": -10.081332206726074, "global_step": 153691, "epoch": 914} {"train_loss": -10.671939849853516, "global_step": 153692, "epoch": 914} {"train_loss": -10.19554615020752, "global_step": 153693, "epoch": 914} {"train_loss": -9.921812057495117, "global_step": 153694, "epoch": 914} {"train_loss": -10.746124267578125, "global_step": 153695, "epoch": 914} {"train_loss": -9.316776275634766, "global_step": 153696, "epoch": 914} {"train_loss": -10.565135955810547, "global_step": 153697, "epoch": 914} {"train_loss": -10.133557319641113, "global_step": 153698, "epoch": 914} {"train_loss": -10.082134246826172, "global_step": 153699, "epoch": 914} {"train_loss": -10.729265213012695, "global_step": 153700, "epoch": 914} {"train_loss": -10.043010711669922, "global_step": 153701, "epoch": 914} {"train_loss": -10.747209548950195, "global_step": 153702, "epoch": 914} {"train_loss": -10.410383224487305, "global_step": 153703, "epoch": 914} {"train_loss": -10.534125328063965, "global_step": 153704, "epoch": 914} {"train_loss": -10.704146385192871, "global_step": 153705, "epoch": 914} {"train_loss": -10.583993911743164, "global_step": 153706, "epoch": 914} {"train_loss": -10.676429748535156, "global_step": 153707, "epoch": 914} {"train_loss": -10.751277923583984, "global_step": 153708, "epoch": 914} {"train_loss": -10.487142562866211, "global_step": 153709, "epoch": 914} {"train_loss": -10.641407012939453, "global_step": 153710, "epoch": 914} {"train_loss": -10.517672538757324, "global_step": 153711, "epoch": 914} {"train_loss": -10.559362411499023, "global_step": 153712, "epoch": 914} {"train_loss": -10.7347412109375, "global_step": 153713, "epoch": 914} {"train_loss": -10.472232818603516, "global_step": 153714, "epoch": 914} {"train_loss": -10.519768714904785, "global_step": 153715, "epoch": 914} {"train_loss": -10.521936416625977, "global_step": 153716, "epoch": 914} {"train_loss": -10.618606567382812, "global_step": 153717, "epoch": 914} {"train_loss": -10.638593673706055, "global_step": 153718, "epoch": 914} {"train_loss": -10.643571240561348, "global_step": 153719, "epoch": 914, "val_loss": 230763.828125} {"train_loss": -10.417776107788086, "global_step": 153720, "epoch": 915} {"train_loss": -10.735321998596191, "global_step": 153721, "epoch": 915} {"train_loss": -10.452217102050781, "global_step": 153722, "epoch": 915} {"train_loss": -10.834733963012695, "global_step": 153723, "epoch": 915} {"train_loss": -10.687112808227539, "global_step": 153724, "epoch": 915} {"train_loss": -10.855827331542969, "global_step": 153725, "epoch": 915} {"train_loss": -10.602997779846191, "global_step": 153726, "epoch": 915} {"train_loss": -10.911015510559082, "global_step": 153727, "epoch": 915} {"train_loss": -10.790106773376465, "global_step": 153728, "epoch": 915} {"train_loss": -10.76539421081543, "global_step": 153729, "epoch": 915} {"train_loss": -10.77760124206543, "global_step": 153730, "epoch": 915} {"train_loss": -10.48082447052002, "global_step": 153731, "epoch": 915} {"train_loss": -10.713799476623535, "global_step": 153732, "epoch": 915} {"train_loss": -10.880016326904297, "global_step": 153733, "epoch": 915} {"train_loss": -10.735057830810547, "global_step": 153734, "epoch": 915} {"train_loss": -10.964455604553223, "global_step": 153735, "epoch": 915} {"train_loss": -10.710086822509766, "global_step": 153736, "epoch": 915} {"train_loss": -10.544378280639648, "global_step": 153737, "epoch": 915} {"train_loss": -10.821139335632324, "global_step": 153738, "epoch": 915} {"train_loss": -10.437549591064453, "global_step": 153739, "epoch": 915} {"train_loss": -10.7941255569458, "global_step": 153740, "epoch": 915} {"train_loss": -10.576330184936523, "global_step": 153741, "epoch": 915} {"train_loss": -10.72085952758789, "global_step": 153742, "epoch": 915} {"train_loss": -10.833725929260254, "global_step": 153743, "epoch": 915} {"train_loss": -10.567484855651855, "global_step": 153744, "epoch": 915} {"train_loss": -10.829949378967285, "global_step": 153745, "epoch": 915} {"train_loss": -10.624741554260254, "global_step": 153746, "epoch": 915} {"train_loss": -10.781576156616211, "global_step": 153747, "epoch": 915} {"train_loss": -10.47552490234375, "global_step": 153748, "epoch": 915} {"train_loss": -10.775014877319336, "global_step": 153749, "epoch": 915} {"train_loss": -11.001313209533691, "global_step": 153750, "epoch": 915} {"train_loss": -10.929805755615234, "global_step": 153751, "epoch": 915} {"train_loss": -10.477866172790527, "global_step": 153752, "epoch": 915} {"train_loss": -10.826192855834961, "global_step": 153753, "epoch": 915} {"train_loss": -10.788735389709473, "global_step": 153754, "epoch": 915} {"train_loss": -10.213838577270508, "global_step": 153755, "epoch": 915} {"train_loss": -10.893733024597168, "global_step": 153756, "epoch": 915} {"train_loss": -10.754843711853027, "global_step": 153757, "epoch": 915} {"train_loss": -10.900169372558594, "global_step": 153758, "epoch": 915} {"train_loss": -10.822395324707031, "global_step": 153759, "epoch": 915} {"train_loss": -10.80925178527832, "global_step": 153760, "epoch": 915} {"train_loss": -10.923636436462402, "global_step": 153761, "epoch": 915} {"train_loss": -10.945867538452148, "global_step": 153762, "epoch": 915} {"train_loss": -10.904147148132324, "global_step": 153763, "epoch": 915} {"train_loss": -10.739211082458496, "global_step": 153764, "epoch": 915} {"train_loss": -10.931421279907227, "global_step": 153765, "epoch": 915} {"train_loss": -10.792616844177246, "global_step": 153766, "epoch": 915} {"train_loss": -10.731853485107422, "global_step": 153767, "epoch": 915} {"train_loss": -10.920160293579102, "global_step": 153768, "epoch": 915} {"train_loss": -10.874898910522461, "global_step": 153769, "epoch": 915} {"train_loss": -11.042182922363281, "global_step": 153770, "epoch": 915} {"train_loss": -10.885427474975586, "global_step": 153771, "epoch": 915} {"train_loss": -10.9097318649292, "global_step": 153772, "epoch": 915} {"train_loss": -11.048162460327148, "global_step": 153773, "epoch": 915} {"train_loss": -11.145076751708984, "global_step": 153774, "epoch": 915} {"train_loss": -10.795419692993164, "global_step": 153775, "epoch": 915} {"train_loss": -10.854439735412598, "global_step": 153776, "epoch": 915} {"train_loss": -11.101730346679688, "global_step": 153777, "epoch": 915} {"train_loss": -10.731915473937988, "global_step": 153778, "epoch": 915} {"train_loss": -10.593616485595703, "global_step": 153779, "epoch": 915} {"train_loss": -10.502612113952637, "global_step": 153780, "epoch": 915} {"train_loss": -10.175421714782715, "global_step": 153781, "epoch": 915} {"train_loss": -9.935827255249023, "global_step": 153782, "epoch": 915} {"train_loss": -9.949191093444824, "global_step": 153783, "epoch": 915} {"train_loss": -9.469335556030273, "global_step": 153784, "epoch": 915} {"train_loss": -9.897128105163574, "global_step": 153785, "epoch": 915} {"train_loss": -9.870363235473633, "global_step": 153786, "epoch": 915} {"train_loss": -10.587706565856934, "global_step": 153787, "epoch": 915} {"train_loss": -9.114879608154297, "global_step": 153788, "epoch": 915} {"train_loss": -10.936187744140625, "global_step": 153789, "epoch": 915} {"train_loss": -9.951929092407227, "global_step": 153790, "epoch": 915} {"train_loss": -10.536087036132812, "global_step": 153791, "epoch": 915} {"train_loss": -9.825959205627441, "global_step": 153792, "epoch": 915} {"train_loss": -10.638162612915039, "global_step": 153793, "epoch": 915} {"train_loss": -10.104534149169922, "global_step": 153794, "epoch": 915} {"train_loss": -10.689769744873047, "global_step": 153795, "epoch": 915} {"train_loss": -10.304527282714844, "global_step": 153796, "epoch": 915} {"train_loss": -10.290267944335938, "global_step": 153797, "epoch": 915} {"train_loss": -10.287044525146484, "global_step": 153798, "epoch": 915} {"train_loss": -10.753059387207031, "global_step": 153799, "epoch": 915} {"train_loss": -10.159382820129395, "global_step": 153800, "epoch": 915} {"train_loss": -10.480865478515625, "global_step": 153801, "epoch": 915} {"train_loss": -10.552886962890625, "global_step": 153802, "epoch": 915} {"train_loss": -10.071250915527344, "global_step": 153803, "epoch": 915} {"train_loss": -10.527061462402344, "global_step": 153804, "epoch": 915} {"train_loss": -10.412818908691406, "global_step": 153805, "epoch": 915} {"train_loss": -10.597800254821777, "global_step": 153806, "epoch": 915} {"train_loss": -10.516307830810547, "global_step": 153807, "epoch": 915} {"train_loss": -10.53347110748291, "global_step": 153808, "epoch": 915} {"train_loss": -10.565407752990723, "global_step": 153809, "epoch": 915} {"train_loss": -10.88395881652832, "global_step": 153810, "epoch": 915} {"train_loss": -10.262514114379883, "global_step": 153811, "epoch": 915} {"train_loss": -10.702266693115234, "global_step": 153812, "epoch": 915} {"train_loss": -10.479488372802734, "global_step": 153813, "epoch": 915} {"train_loss": -10.288150787353516, "global_step": 153814, "epoch": 915} {"train_loss": -10.451751708984375, "global_step": 153815, "epoch": 915} {"train_loss": -10.60798454284668, "global_step": 153816, "epoch": 915} {"train_loss": -10.657943725585938, "global_step": 153817, "epoch": 915} {"train_loss": -10.580253601074219, "global_step": 153818, "epoch": 915} {"train_loss": -10.727914810180664, "global_step": 153819, "epoch": 915} {"train_loss": -10.684534072875977, "global_step": 153820, "epoch": 915} {"train_loss": -10.470588684082031, "global_step": 153821, "epoch": 915} {"train_loss": -10.945863723754883, "global_step": 153822, "epoch": 915} {"train_loss": -10.772079467773438, "global_step": 153823, "epoch": 915} {"train_loss": -10.82766056060791, "global_step": 153824, "epoch": 915} {"train_loss": -10.8438720703125, "global_step": 153825, "epoch": 915} {"train_loss": -10.90357494354248, "global_step": 153826, "epoch": 915} {"train_loss": -10.558107376098633, "global_step": 153827, "epoch": 915} {"train_loss": -10.814034461975098, "global_step": 153828, "epoch": 915} {"train_loss": -10.923490524291992, "global_step": 153829, "epoch": 915} {"train_loss": -10.918384552001953, "global_step": 153830, "epoch": 915} {"train_loss": -10.906996726989746, "global_step": 153831, "epoch": 915} {"train_loss": -10.870002746582031, "global_step": 153832, "epoch": 915} {"train_loss": -10.978174209594727, "global_step": 153833, "epoch": 915} {"train_loss": -10.712617874145508, "global_step": 153834, "epoch": 915} {"train_loss": -10.957939147949219, "global_step": 153835, "epoch": 915} {"train_loss": -11.089120864868164, "global_step": 153836, "epoch": 915} {"train_loss": -10.877954483032227, "global_step": 153837, "epoch": 915} {"train_loss": -11.139181137084961, "global_step": 153838, "epoch": 915} {"train_loss": -10.857667922973633, "global_step": 153839, "epoch": 915} {"train_loss": -10.75516128540039, "global_step": 153840, "epoch": 915} {"train_loss": -11.155220985412598, "global_step": 153841, "epoch": 915} {"train_loss": -10.744223594665527, "global_step": 153842, "epoch": 915} {"train_loss": -11.061742782592773, "global_step": 153843, "epoch": 915} {"train_loss": -10.746224403381348, "global_step": 153844, "epoch": 915} {"train_loss": -10.88342571258545, "global_step": 153845, "epoch": 915} {"train_loss": -10.878345489501953, "global_step": 153846, "epoch": 915} {"train_loss": -10.882330894470215, "global_step": 153847, "epoch": 915} {"train_loss": -10.882429122924805, "global_step": 153848, "epoch": 915} {"train_loss": -11.044793128967285, "global_step": 153849, "epoch": 915} {"train_loss": -10.96148681640625, "global_step": 153850, "epoch": 915} {"train_loss": -10.992448806762695, "global_step": 153851, "epoch": 915} {"train_loss": -11.039387702941895, "global_step": 153852, "epoch": 915} {"train_loss": -10.883792877197266, "global_step": 153853, "epoch": 915} {"train_loss": -11.14554214477539, "global_step": 153854, "epoch": 915} {"train_loss": -10.938368797302246, "global_step": 153855, "epoch": 915} {"train_loss": -10.878878593444824, "global_step": 153856, "epoch": 915} {"train_loss": -9.909963607788086, "global_step": 153857, "epoch": 915} {"train_loss": -10.783230781555176, "global_step": 153858, "epoch": 915} {"train_loss": -10.60922908782959, "global_step": 153859, "epoch": 915} {"train_loss": -10.730239868164062, "global_step": 153860, "epoch": 915} {"train_loss": -10.942102432250977, "global_step": 153861, "epoch": 915} {"train_loss": -10.551186561584473, "global_step": 153862, "epoch": 915} {"train_loss": -10.589098930358887, "global_step": 153863, "epoch": 915} {"train_loss": -9.686662673950195, "global_step": 153864, "epoch": 915} {"train_loss": -10.509824752807617, "global_step": 153865, "epoch": 915} {"train_loss": -10.430588722229004, "global_step": 153866, "epoch": 915} {"train_loss": -10.688828468322754, "global_step": 153867, "epoch": 915} {"train_loss": -10.319572448730469, "global_step": 153868, "epoch": 915} {"train_loss": -10.488349914550781, "global_step": 153869, "epoch": 915} {"train_loss": -10.714365005493164, "global_step": 153870, "epoch": 915} {"train_loss": -10.779873847961426, "global_step": 153871, "epoch": 915} {"train_loss": -10.561378479003906, "global_step": 153872, "epoch": 915} {"train_loss": -10.57310676574707, "global_step": 153873, "epoch": 915} {"train_loss": -10.18936538696289, "global_step": 153874, "epoch": 915} {"train_loss": -10.3099365234375, "global_step": 153875, "epoch": 915} {"train_loss": -10.104304313659668, "global_step": 153876, "epoch": 915} {"train_loss": -10.312575340270996, "global_step": 153877, "epoch": 915} {"train_loss": -10.058350563049316, "global_step": 153878, "epoch": 915} {"train_loss": -10.629344940185547, "global_step": 153879, "epoch": 915} {"train_loss": -10.480684280395508, "global_step": 153880, "epoch": 915} {"train_loss": -10.318502426147461, "global_step": 153881, "epoch": 915} {"train_loss": -10.418478012084961, "global_step": 153882, "epoch": 915} {"train_loss": -10.796445846557617, "global_step": 153883, "epoch": 915} {"train_loss": -10.451154708862305, "global_step": 153884, "epoch": 915} {"train_loss": -10.582755088806152, "global_step": 153885, "epoch": 915} {"train_loss": -10.314848899841309, "global_step": 153886, "epoch": 915} {"train_loss": -10.640761869294304, "global_step": 153887, "epoch": 915, "val_loss": 234353.328125, "train_action_mse_error": 2.358168363571167} {"train_loss": -10.573270797729492, "global_step": 153888, "epoch": 916} {"train_loss": -10.56568717956543, "global_step": 153889, "epoch": 916} {"train_loss": -10.626811981201172, "global_step": 153890, "epoch": 916} {"train_loss": -10.579792976379395, "global_step": 153891, "epoch": 916} {"train_loss": -10.69974136352539, "global_step": 153892, "epoch": 916} {"train_loss": -10.527938842773438, "global_step": 153893, "epoch": 916} {"train_loss": -10.946891784667969, "global_step": 153894, "epoch": 916} {"train_loss": -10.798308372497559, "global_step": 153895, "epoch": 916} {"train_loss": -10.921432495117188, "global_step": 153896, "epoch": 916} {"train_loss": -10.873659133911133, "global_step": 153897, "epoch": 916} {"train_loss": -10.90253734588623, "global_step": 153898, "epoch": 916} {"train_loss": -10.92414665222168, "global_step": 153899, "epoch": 916} {"train_loss": -10.840927124023438, "global_step": 153900, "epoch": 916} {"train_loss": -11.011550903320312, "global_step": 153901, "epoch": 916} {"train_loss": -10.867887496948242, "global_step": 153902, "epoch": 916} {"train_loss": -10.604068756103516, "global_step": 153903, "epoch": 916} {"train_loss": -10.876121520996094, "global_step": 153904, "epoch": 916} {"train_loss": -10.965431213378906, "global_step": 153905, "epoch": 916} {"train_loss": -10.80118179321289, "global_step": 153906, "epoch": 916} {"train_loss": -11.077041625976562, "global_step": 153907, "epoch": 916} {"train_loss": -10.976262092590332, "global_step": 153908, "epoch": 916} {"train_loss": -10.949626922607422, "global_step": 153909, "epoch": 916} {"train_loss": -10.966941833496094, "global_step": 153910, "epoch": 916} {"train_loss": -10.896221160888672, "global_step": 153911, "epoch": 916} {"train_loss": -10.947436332702637, "global_step": 153912, "epoch": 916} {"train_loss": -10.973228454589844, "global_step": 153913, "epoch": 916} {"train_loss": -11.0806884765625, "global_step": 153914, "epoch": 916} {"train_loss": -11.032196044921875, "global_step": 153915, "epoch": 916} {"train_loss": -10.706615447998047, "global_step": 153916, "epoch": 916} {"train_loss": -11.008474349975586, "global_step": 153917, "epoch": 916} {"train_loss": -10.898612022399902, "global_step": 153918, "epoch": 916} {"train_loss": -11.113544464111328, "global_step": 153919, "epoch": 916} {"train_loss": -11.110397338867188, "global_step": 153920, "epoch": 916} {"train_loss": -10.890335083007812, "global_step": 153921, "epoch": 916} {"train_loss": -11.120512008666992, "global_step": 153922, "epoch": 916} {"train_loss": -10.999499320983887, "global_step": 153923, "epoch": 916} {"train_loss": -10.708328247070312, "global_step": 153924, "epoch": 916} {"train_loss": -11.04116439819336, "global_step": 153925, "epoch": 916} {"train_loss": -10.765703201293945, "global_step": 153926, "epoch": 916} {"train_loss": -11.17409896850586, "global_step": 153927, "epoch": 916} {"train_loss": -10.963229179382324, "global_step": 153928, "epoch": 916} {"train_loss": -10.646719932556152, "global_step": 153929, "epoch": 916} {"train_loss": -10.69428539276123, "global_step": 153930, "epoch": 916} {"train_loss": -10.967044830322266, "global_step": 153931, "epoch": 916} {"train_loss": -10.671932220458984, "global_step": 153932, "epoch": 916} {"train_loss": -10.744856834411621, "global_step": 153933, "epoch": 916} {"train_loss": -10.80504035949707, "global_step": 153934, "epoch": 916} {"train_loss": -11.130081176757812, "global_step": 153935, "epoch": 916} {"train_loss": -10.601109504699707, "global_step": 153936, "epoch": 916} {"train_loss": -10.501705169677734, "global_step": 153937, "epoch": 916} {"train_loss": -9.65022087097168, "global_step": 153938, "epoch": 916} {"train_loss": -10.783432006835938, "global_step": 153939, "epoch": 916} {"train_loss": -9.538797378540039, "global_step": 153940, "epoch": 916} {"train_loss": -10.160877227783203, "global_step": 153941, "epoch": 916} {"train_loss": -10.224760055541992, "global_step": 153942, "epoch": 916} {"train_loss": -9.751100540161133, "global_step": 153943, "epoch": 916} {"train_loss": -10.486356735229492, "global_step": 153944, "epoch": 916} {"train_loss": -9.841529846191406, "global_step": 153945, "epoch": 916} {"train_loss": -9.798738479614258, "global_step": 153946, "epoch": 916} {"train_loss": -10.283202171325684, "global_step": 153947, "epoch": 916} {"train_loss": -9.795036315917969, "global_step": 153948, "epoch": 916} {"train_loss": -10.488397598266602, "global_step": 153949, "epoch": 916} {"train_loss": -10.411714553833008, "global_step": 153950, "epoch": 916} {"train_loss": -10.276544570922852, "global_step": 153951, "epoch": 916} {"train_loss": -10.373119354248047, "global_step": 153952, "epoch": 916} {"train_loss": -10.323973655700684, "global_step": 153953, "epoch": 916} {"train_loss": -10.316415786743164, "global_step": 153954, "epoch": 916} {"train_loss": -10.140695571899414, "global_step": 153955, "epoch": 916} {"train_loss": -10.521635055541992, "global_step": 153956, "epoch": 916} {"train_loss": -10.4443359375, "global_step": 153957, "epoch": 916} {"train_loss": -10.515263557434082, "global_step": 153958, "epoch": 916} {"train_loss": -10.12710189819336, "global_step": 153959, "epoch": 916} {"train_loss": -10.606142044067383, "global_step": 153960, "epoch": 916} {"train_loss": -10.695380210876465, "global_step": 153961, "epoch": 916} {"train_loss": -10.729167938232422, "global_step": 153962, "epoch": 916} {"train_loss": -10.74246597290039, "global_step": 153963, "epoch": 916} {"train_loss": -10.747063636779785, "global_step": 153964, "epoch": 916} {"train_loss": -10.622793197631836, "global_step": 153965, "epoch": 916} {"train_loss": -10.848283767700195, "global_step": 153966, "epoch": 916} {"train_loss": -10.671177864074707, "global_step": 153967, "epoch": 916} {"train_loss": -10.817046165466309, "global_step": 153968, "epoch": 916} {"train_loss": -10.643142700195312, "global_step": 153969, "epoch": 916} {"train_loss": -10.481321334838867, "global_step": 153970, "epoch": 916} {"train_loss": -11.017367362976074, "global_step": 153971, "epoch": 916} {"train_loss": -10.805551528930664, "global_step": 153972, "epoch": 916} {"train_loss": -10.910286903381348, "global_step": 153973, "epoch": 916} {"train_loss": -10.723349571228027, "global_step": 153974, "epoch": 916} {"train_loss": -10.604838371276855, "global_step": 153975, "epoch": 916} {"train_loss": -11.061253547668457, "global_step": 153976, "epoch": 916} {"train_loss": -10.772880554199219, "global_step": 153977, "epoch": 916} {"train_loss": -10.741742134094238, "global_step": 153978, "epoch": 916} {"train_loss": -10.807723999023438, "global_step": 153979, "epoch": 916} {"train_loss": -10.883685111999512, "global_step": 153980, "epoch": 916} {"train_loss": -10.910929679870605, "global_step": 153981, "epoch": 916} {"train_loss": -10.952348709106445, "global_step": 153982, "epoch": 916} {"train_loss": -10.710522651672363, "global_step": 153983, "epoch": 916} {"train_loss": -11.016241073608398, "global_step": 153984, "epoch": 916} {"train_loss": -10.967918395996094, "global_step": 153985, "epoch": 916} {"train_loss": -10.656695365905762, "global_step": 153986, "epoch": 916} {"train_loss": -10.95798110961914, "global_step": 153987, "epoch": 916} {"train_loss": -10.93880844116211, "global_step": 153988, "epoch": 916} {"train_loss": -10.790594100952148, "global_step": 153989, "epoch": 916} {"train_loss": -10.695234298706055, "global_step": 153990, "epoch": 916} {"train_loss": -10.500455856323242, "global_step": 153991, "epoch": 916} {"train_loss": -10.750459671020508, "global_step": 153992, "epoch": 916} {"train_loss": -11.15872859954834, "global_step": 153993, "epoch": 916} {"train_loss": -10.969688415527344, "global_step": 153994, "epoch": 916} {"train_loss": -10.866230964660645, "global_step": 153995, "epoch": 916} {"train_loss": -10.66966438293457, "global_step": 153996, "epoch": 916} {"train_loss": -11.162601470947266, "global_step": 153997, "epoch": 916} {"train_loss": -10.762287139892578, "global_step": 153998, "epoch": 916} {"train_loss": -11.22490119934082, "global_step": 153999, "epoch": 916} {"train_loss": -10.936649322509766, "global_step": 154000, "epoch": 916} {"train_loss": -10.928905487060547, "global_step": 154001, "epoch": 916} {"train_loss": -11.14113712310791, "global_step": 154002, "epoch": 916} {"train_loss": -10.618309020996094, "global_step": 154003, "epoch": 916} {"train_loss": -10.870655059814453, "global_step": 154004, "epoch": 916} {"train_loss": -10.722391128540039, "global_step": 154005, "epoch": 916} {"train_loss": -10.903848648071289, "global_step": 154006, "epoch": 916} {"train_loss": -10.914873123168945, "global_step": 154007, "epoch": 916} {"train_loss": -10.976166725158691, "global_step": 154008, "epoch": 916} {"train_loss": -10.799842834472656, "global_step": 154009, "epoch": 916} {"train_loss": -10.922914505004883, "global_step": 154010, "epoch": 916} {"train_loss": -10.603038787841797, "global_step": 154011, "epoch": 916} {"train_loss": -10.976103782653809, "global_step": 154012, "epoch": 916} {"train_loss": -10.610564231872559, "global_step": 154013, "epoch": 916} {"train_loss": -11.17658519744873, "global_step": 154014, "epoch": 916} {"train_loss": -10.798931121826172, "global_step": 154015, "epoch": 916} {"train_loss": -10.612013816833496, "global_step": 154016, "epoch": 916} {"train_loss": -10.749053001403809, "global_step": 154017, "epoch": 916} {"train_loss": -10.345715522766113, "global_step": 154018, "epoch": 916} {"train_loss": -11.028443336486816, "global_step": 154019, "epoch": 916} {"train_loss": -10.5114107131958, "global_step": 154020, "epoch": 916} {"train_loss": -10.080446243286133, "global_step": 154021, "epoch": 916} {"train_loss": -10.70132064819336, "global_step": 154022, "epoch": 916} {"train_loss": -10.484325408935547, "global_step": 154023, "epoch": 916} {"train_loss": -10.978198051452637, "global_step": 154024, "epoch": 916} {"train_loss": -10.92456340789795, "global_step": 154025, "epoch": 916} {"train_loss": -10.595458984375, "global_step": 154026, "epoch": 916} {"train_loss": -10.309149742126465, "global_step": 154027, "epoch": 916} {"train_loss": -10.849052429199219, "global_step": 154028, "epoch": 916} {"train_loss": -10.791922569274902, "global_step": 154029, "epoch": 916} {"train_loss": -10.6454496383667, "global_step": 154030, "epoch": 916} {"train_loss": -10.918862342834473, "global_step": 154031, "epoch": 916} {"train_loss": -10.863632202148438, "global_step": 154032, "epoch": 916} {"train_loss": -10.692398071289062, "global_step": 154033, "epoch": 916} {"train_loss": -10.798521995544434, "global_step": 154034, "epoch": 916} {"train_loss": -10.897148132324219, "global_step": 154035, "epoch": 916} {"train_loss": -10.839902877807617, "global_step": 154036, "epoch": 916} {"train_loss": -10.774789810180664, "global_step": 154037, "epoch": 916} {"train_loss": -10.68651008605957, "global_step": 154038, "epoch": 916} {"train_loss": -10.866504669189453, "global_step": 154039, "epoch": 916} {"train_loss": -10.887744903564453, "global_step": 154040, "epoch": 916} {"train_loss": -10.79709529876709, "global_step": 154041, "epoch": 916} {"train_loss": -10.605890274047852, "global_step": 154042, "epoch": 916} {"train_loss": -10.701658248901367, "global_step": 154043, "epoch": 916} {"train_loss": -10.95255184173584, "global_step": 154044, "epoch": 916} {"train_loss": -10.851661682128906, "global_step": 154045, "epoch": 916} {"train_loss": -10.95610237121582, "global_step": 154046, "epoch": 916} {"train_loss": -11.012439727783203, "global_step": 154047, "epoch": 916} {"train_loss": -10.79452896118164, "global_step": 154048, "epoch": 916} {"train_loss": -10.986364364624023, "global_step": 154049, "epoch": 916} {"train_loss": -10.859223365783691, "global_step": 154050, "epoch": 916} {"train_loss": -10.604527473449707, "global_step": 154051, "epoch": 916} {"train_loss": -10.65196418762207, "global_step": 154052, "epoch": 916} {"train_loss": -10.763345718383789, "global_step": 154053, "epoch": 916} {"train_loss": -10.573143005371094, "global_step": 154054, "epoch": 916} {"train_loss": -10.731643966266088, "global_step": 154055, "epoch": 916, "val_loss": 232244.15625} {"train_loss": -10.579580307006836, "global_step": 154056, "epoch": 917} {"train_loss": -10.948394775390625, "global_step": 154057, "epoch": 917} {"train_loss": -10.319454193115234, "global_step": 154058, "epoch": 917} {"train_loss": -10.899808883666992, "global_step": 154059, "epoch": 917} {"train_loss": -9.938446044921875, "global_step": 154060, "epoch": 917} {"train_loss": -10.69024658203125, "global_step": 154061, "epoch": 917} {"train_loss": -10.642679214477539, "global_step": 154062, "epoch": 917} {"train_loss": -10.366313934326172, "global_step": 154063, "epoch": 917} {"train_loss": -10.472783088684082, "global_step": 154064, "epoch": 917} {"train_loss": -10.437850952148438, "global_step": 154065, "epoch": 917} {"train_loss": -10.291068077087402, "global_step": 154066, "epoch": 917} {"train_loss": -10.611930847167969, "global_step": 154067, "epoch": 917} {"train_loss": -10.215906143188477, "global_step": 154068, "epoch": 917} {"train_loss": -10.609676361083984, "global_step": 154069, "epoch": 917} {"train_loss": -10.368553161621094, "global_step": 154070, "epoch": 917} {"train_loss": -10.364809036254883, "global_step": 154071, "epoch": 917} {"train_loss": -10.589962005615234, "global_step": 154072, "epoch": 917} {"train_loss": -10.434894561767578, "global_step": 154073, "epoch": 917} {"train_loss": -10.442211151123047, "global_step": 154074, "epoch": 917} {"train_loss": -10.631948471069336, "global_step": 154075, "epoch": 917} {"train_loss": -10.86186695098877, "global_step": 154076, "epoch": 917} {"train_loss": -10.383506774902344, "global_step": 154077, "epoch": 917} {"train_loss": -10.382955551147461, "global_step": 154078, "epoch": 917} {"train_loss": -10.525453567504883, "global_step": 154079, "epoch": 917} {"train_loss": -10.754399299621582, "global_step": 154080, "epoch": 917} {"train_loss": -10.60319709777832, "global_step": 154081, "epoch": 917} {"train_loss": -10.568929672241211, "global_step": 154082, "epoch": 917} {"train_loss": -10.482873916625977, "global_step": 154083, "epoch": 917} {"train_loss": -10.67702865600586, "global_step": 154084, "epoch": 917} {"train_loss": -10.513347625732422, "global_step": 154085, "epoch": 917} {"train_loss": -10.738617897033691, "global_step": 154086, "epoch": 917} {"train_loss": -10.695128440856934, "global_step": 154087, "epoch": 917} {"train_loss": -10.592240333557129, "global_step": 154088, "epoch": 917} {"train_loss": -10.563484191894531, "global_step": 154089, "epoch": 917} {"train_loss": -10.803060531616211, "global_step": 154090, "epoch": 917} {"train_loss": -10.300847053527832, "global_step": 154091, "epoch": 917} {"train_loss": -10.400519371032715, "global_step": 154092, "epoch": 917} {"train_loss": -10.516096115112305, "global_step": 154093, "epoch": 917} {"train_loss": -10.705133438110352, "global_step": 154094, "epoch": 917} {"train_loss": -10.60047721862793, "global_step": 154095, "epoch": 917} {"train_loss": -10.504762649536133, "global_step": 154096, "epoch": 917} {"train_loss": -10.500231742858887, "global_step": 154097, "epoch": 917} {"train_loss": -10.647703170776367, "global_step": 154098, "epoch": 917} {"train_loss": -10.731049537658691, "global_step": 154099, "epoch": 917} {"train_loss": -10.595758438110352, "global_step": 154100, "epoch": 917} {"train_loss": -10.609216690063477, "global_step": 154101, "epoch": 917} {"train_loss": -10.527307510375977, "global_step": 154102, "epoch": 917} {"train_loss": -10.654281616210938, "global_step": 154103, "epoch": 917} {"train_loss": -10.984274864196777, "global_step": 154104, "epoch": 917} {"train_loss": -10.720446586608887, "global_step": 154105, "epoch": 917} {"train_loss": -10.743511199951172, "global_step": 154106, "epoch": 917} {"train_loss": -10.630010604858398, "global_step": 154107, "epoch": 917} {"train_loss": -10.695049285888672, "global_step": 154108, "epoch": 917} {"train_loss": -10.3385591506958, "global_step": 154109, "epoch": 917} {"train_loss": -10.994165420532227, "global_step": 154110, "epoch": 917} {"train_loss": -10.603727340698242, "global_step": 154111, "epoch": 917} {"train_loss": -10.747640609741211, "global_step": 154112, "epoch": 917} {"train_loss": -10.68443775177002, "global_step": 154113, "epoch": 917} {"train_loss": -10.309813499450684, "global_step": 154114, "epoch": 917} {"train_loss": -11.05356216430664, "global_step": 154115, "epoch": 917} {"train_loss": -10.382177352905273, "global_step": 154116, "epoch": 917} {"train_loss": -10.795981407165527, "global_step": 154117, "epoch": 917} {"train_loss": -10.69308090209961, "global_step": 154118, "epoch": 917} {"train_loss": -10.748558044433594, "global_step": 154119, "epoch": 917} {"train_loss": -10.914332389831543, "global_step": 154120, "epoch": 917} {"train_loss": -10.599599838256836, "global_step": 154121, "epoch": 917} {"train_loss": -10.866718292236328, "global_step": 154122, "epoch": 917} {"train_loss": -10.500931739807129, "global_step": 154123, "epoch": 917} {"train_loss": -10.604286193847656, "global_step": 154124, "epoch": 917} {"train_loss": -10.97037124633789, "global_step": 154125, "epoch": 917} {"train_loss": -10.880157470703125, "global_step": 154126, "epoch": 917} {"train_loss": -10.984136581420898, "global_step": 154127, "epoch": 917} {"train_loss": -11.023431777954102, "global_step": 154128, "epoch": 917} {"train_loss": -10.700155258178711, "global_step": 154129, "epoch": 917} {"train_loss": -10.820219993591309, "global_step": 154130, "epoch": 917} {"train_loss": -10.68763542175293, "global_step": 154131, "epoch": 917} {"train_loss": -10.667163848876953, "global_step": 154132, "epoch": 917} {"train_loss": -10.9173002243042, "global_step": 154133, "epoch": 917} {"train_loss": -10.796424865722656, "global_step": 154134, "epoch": 917} {"train_loss": -10.546041488647461, "global_step": 154135, "epoch": 917} {"train_loss": -10.925145149230957, "global_step": 154136, "epoch": 917} {"train_loss": -11.03061294555664, "global_step": 154137, "epoch": 917} {"train_loss": -10.603096008300781, "global_step": 154138, "epoch": 917} {"train_loss": -10.921453475952148, "global_step": 154139, "epoch": 917} {"train_loss": -10.753030776977539, "global_step": 154140, "epoch": 917} {"train_loss": -10.855833053588867, "global_step": 154141, "epoch": 917} {"train_loss": -10.920775413513184, "global_step": 154142, "epoch": 917} {"train_loss": -10.913753509521484, "global_step": 154143, "epoch": 917} {"train_loss": -10.83021354675293, "global_step": 154144, "epoch": 917} {"train_loss": -10.868630409240723, "global_step": 154145, "epoch": 917} {"train_loss": -10.97562026977539, "global_step": 154146, "epoch": 917} {"train_loss": -10.971636772155762, "global_step": 154147, "epoch": 917} {"train_loss": -10.726409912109375, "global_step": 154148, "epoch": 917} {"train_loss": -10.902134895324707, "global_step": 154149, "epoch": 917} {"train_loss": -10.918325424194336, "global_step": 154150, "epoch": 917} {"train_loss": -10.578709602355957, "global_step": 154151, "epoch": 917} {"train_loss": -11.197206497192383, "global_step": 154152, "epoch": 917} {"train_loss": -11.05272102355957, "global_step": 154153, "epoch": 917} {"train_loss": -10.78731918334961, "global_step": 154154, "epoch": 917} {"train_loss": -11.017829895019531, "global_step": 154155, "epoch": 917} {"train_loss": -11.351547241210938, "global_step": 154156, "epoch": 917} {"train_loss": -10.917875289916992, "global_step": 154157, "epoch": 917} {"train_loss": -11.07394790649414, "global_step": 154158, "epoch": 917} {"train_loss": -10.927923202514648, "global_step": 154159, "epoch": 917} {"train_loss": -11.045918464660645, "global_step": 154160, "epoch": 917} {"train_loss": -11.146015167236328, "global_step": 154161, "epoch": 917} {"train_loss": -10.814024925231934, "global_step": 154162, "epoch": 917} {"train_loss": -10.934316635131836, "global_step": 154163, "epoch": 917} {"train_loss": -10.696182250976562, "global_step": 154164, "epoch": 917} {"train_loss": -11.025775909423828, "global_step": 154165, "epoch": 917} {"train_loss": -10.414203643798828, "global_step": 154166, "epoch": 917} {"train_loss": -10.222883224487305, "global_step": 154167, "epoch": 917} {"train_loss": -9.589832305908203, "global_step": 154168, "epoch": 917} {"train_loss": -10.366060256958008, "global_step": 154169, "epoch": 917} {"train_loss": -10.562531471252441, "global_step": 154170, "epoch": 917} {"train_loss": -9.779483795166016, "global_step": 154171, "epoch": 917} {"train_loss": -9.663580894470215, "global_step": 154172, "epoch": 917} {"train_loss": -10.313783645629883, "global_step": 154173, "epoch": 917} {"train_loss": -10.356521606445312, "global_step": 154174, "epoch": 917} {"train_loss": -10.398477554321289, "global_step": 154175, "epoch": 917} {"train_loss": -10.261357307434082, "global_step": 154176, "epoch": 917} {"train_loss": -10.645824432373047, "global_step": 154177, "epoch": 917} {"train_loss": -10.51681137084961, "global_step": 154178, "epoch": 917} {"train_loss": -10.493927001953125, "global_step": 154179, "epoch": 917} {"train_loss": -10.836725234985352, "global_step": 154180, "epoch": 917} {"train_loss": -10.472898483276367, "global_step": 154181, "epoch": 917} {"train_loss": -10.942425727844238, "global_step": 154182, "epoch": 917} {"train_loss": -10.376096725463867, "global_step": 154183, "epoch": 917} {"train_loss": -10.755746841430664, "global_step": 154184, "epoch": 917} {"train_loss": -10.78964614868164, "global_step": 154185, "epoch": 917} {"train_loss": -10.615021705627441, "global_step": 154186, "epoch": 917} {"train_loss": -10.732219696044922, "global_step": 154187, "epoch": 917} {"train_loss": -10.701796531677246, "global_step": 154188, "epoch": 917} {"train_loss": -10.681455612182617, "global_step": 154189, "epoch": 917} {"train_loss": -10.875775337219238, "global_step": 154190, "epoch": 917} {"train_loss": -10.865896224975586, "global_step": 154191, "epoch": 917} {"train_loss": -10.554059982299805, "global_step": 154192, "epoch": 917} {"train_loss": -10.85783576965332, "global_step": 154193, "epoch": 917} {"train_loss": -10.110334396362305, "global_step": 154194, "epoch": 917} {"train_loss": -10.969091415405273, "global_step": 154195, "epoch": 917} {"train_loss": -10.301074981689453, "global_step": 154196, "epoch": 917} {"train_loss": -10.474567413330078, "global_step": 154197, "epoch": 917} {"train_loss": -10.704605102539062, "global_step": 154198, "epoch": 917} {"train_loss": -10.857837677001953, "global_step": 154199, "epoch": 917} {"train_loss": -10.70138168334961, "global_step": 154200, "epoch": 917} {"train_loss": -10.607938766479492, "global_step": 154201, "epoch": 917} {"train_loss": -10.241629600524902, "global_step": 154202, "epoch": 917} {"train_loss": -10.884035110473633, "global_step": 154203, "epoch": 917} {"train_loss": -10.722216606140137, "global_step": 154204, "epoch": 917} {"train_loss": -10.52302360534668, "global_step": 154205, "epoch": 917} {"train_loss": -10.887322425842285, "global_step": 154206, "epoch": 917} {"train_loss": -10.140382766723633, "global_step": 154207, "epoch": 917} {"train_loss": -10.982227325439453, "global_step": 154208, "epoch": 917} {"train_loss": -10.600861549377441, "global_step": 154209, "epoch": 917} {"train_loss": -10.6850004196167, "global_step": 154210, "epoch": 917} {"train_loss": -10.582088470458984, "global_step": 154211, "epoch": 917} {"train_loss": -10.93150520324707, "global_step": 154212, "epoch": 917} {"train_loss": -10.839899063110352, "global_step": 154213, "epoch": 917} {"train_loss": -10.736893653869629, "global_step": 154214, "epoch": 917} {"train_loss": -11.025971412658691, "global_step": 154215, "epoch": 917} {"train_loss": -10.139978408813477, "global_step": 154216, "epoch": 917} {"train_loss": -10.851630210876465, "global_step": 154217, "epoch": 917} {"train_loss": -10.209320068359375, "global_step": 154218, "epoch": 917} {"train_loss": -10.921127319335938, "global_step": 154219, "epoch": 917} {"train_loss": -10.320229530334473, "global_step": 154220, "epoch": 917} {"train_loss": -10.563392639160156, "global_step": 154221, "epoch": 917} {"train_loss": -10.437837600708008, "global_step": 154222, "epoch": 917} {"train_loss": -10.65235195841108, "global_step": 154223, "epoch": 917, "val_loss": 231032.296875} {"train_loss": -10.687742233276367, "global_step": 154224, "epoch": 918} {"train_loss": -10.432634353637695, "global_step": 154225, "epoch": 918} {"train_loss": -10.740567207336426, "global_step": 154226, "epoch": 918} {"train_loss": -10.390620231628418, "global_step": 154227, "epoch": 918} {"train_loss": -10.750341415405273, "global_step": 154228, "epoch": 918} {"train_loss": -10.243097305297852, "global_step": 154229, "epoch": 918} {"train_loss": -10.758060455322266, "global_step": 154230, "epoch": 918} {"train_loss": -10.271109580993652, "global_step": 154231, "epoch": 918} {"train_loss": -10.893245697021484, "global_step": 154232, "epoch": 918} {"train_loss": -10.413585662841797, "global_step": 154233, "epoch": 918} {"train_loss": -10.766627311706543, "global_step": 154234, "epoch": 918} {"train_loss": -10.32008171081543, "global_step": 154235, "epoch": 918} {"train_loss": -10.439136505126953, "global_step": 154236, "epoch": 918} {"train_loss": -9.613618850708008, "global_step": 154237, "epoch": 918} {"train_loss": -10.4645414352417, "global_step": 154238, "epoch": 918} {"train_loss": -9.701735496520996, "global_step": 154239, "epoch": 918} {"train_loss": -9.135455131530762, "global_step": 154240, "epoch": 918} {"train_loss": -10.780633926391602, "global_step": 154241, "epoch": 918} {"train_loss": -9.078195571899414, "global_step": 154242, "epoch": 918} {"train_loss": -10.45715045928955, "global_step": 154243, "epoch": 918} {"train_loss": -9.475443840026855, "global_step": 154244, "epoch": 918} {"train_loss": -10.34742546081543, "global_step": 154245, "epoch": 918} {"train_loss": -10.298978805541992, "global_step": 154246, "epoch": 918} {"train_loss": -9.967761039733887, "global_step": 154247, "epoch": 918} {"train_loss": -10.410569190979004, "global_step": 154248, "epoch": 918} {"train_loss": -9.948025703430176, "global_step": 154249, "epoch": 918} {"train_loss": -10.184814453125, "global_step": 154250, "epoch": 918} {"train_loss": -10.280497550964355, "global_step": 154251, "epoch": 918} {"train_loss": -10.3545503616333, "global_step": 154252, "epoch": 918} {"train_loss": -10.201240539550781, "global_step": 154253, "epoch": 918} {"train_loss": -10.269200325012207, "global_step": 154254, "epoch": 918} {"train_loss": -10.612140655517578, "global_step": 154255, "epoch": 918} {"train_loss": -10.271774291992188, "global_step": 154256, "epoch": 918} {"train_loss": -10.887884140014648, "global_step": 154257, "epoch": 918} {"train_loss": -10.631063461303711, "global_step": 154258, "epoch": 918} {"train_loss": -10.461828231811523, "global_step": 154259, "epoch": 918} {"train_loss": -10.788590431213379, "global_step": 154260, "epoch": 918} {"train_loss": -10.738325119018555, "global_step": 154261, "epoch": 918} {"train_loss": -10.791683197021484, "global_step": 154262, "epoch": 918} {"train_loss": -10.66850471496582, "global_step": 154263, "epoch": 918} {"train_loss": -10.675345420837402, "global_step": 154264, "epoch": 918} {"train_loss": -10.546371459960938, "global_step": 154265, "epoch": 918} {"train_loss": -10.47182846069336, "global_step": 154266, "epoch": 918} {"train_loss": -10.74909782409668, "global_step": 154267, "epoch": 918} {"train_loss": -10.65203857421875, "global_step": 154268, "epoch": 918} {"train_loss": -10.54417610168457, "global_step": 154269, "epoch": 918} {"train_loss": -10.817627906799316, "global_step": 154270, "epoch": 918} {"train_loss": -10.8973388671875, "global_step": 154271, "epoch": 918} {"train_loss": -10.572454452514648, "global_step": 154272, "epoch": 918} {"train_loss": -10.779687881469727, "global_step": 154273, "epoch": 918} {"train_loss": -10.933283805847168, "global_step": 154274, "epoch": 918} {"train_loss": -10.85919189453125, "global_step": 154275, "epoch": 918} {"train_loss": -10.94792366027832, "global_step": 154276, "epoch": 918} {"train_loss": -10.887845993041992, "global_step": 154277, "epoch": 918} {"train_loss": -11.009740829467773, "global_step": 154278, "epoch": 918} {"train_loss": -10.794873237609863, "global_step": 154279, "epoch": 918} {"train_loss": -10.860135078430176, "global_step": 154280, "epoch": 918} {"train_loss": -10.916010856628418, "global_step": 154281, "epoch": 918} {"train_loss": -11.072549819946289, "global_step": 154282, "epoch": 918} {"train_loss": -10.898719787597656, "global_step": 154283, "epoch": 918} {"train_loss": -11.204144477844238, "global_step": 154284, "epoch": 918} {"train_loss": -11.108331680297852, "global_step": 154285, "epoch": 918} {"train_loss": -10.854730606079102, "global_step": 154286, "epoch": 918} {"train_loss": -10.896709442138672, "global_step": 154287, "epoch": 918} {"train_loss": -10.880088806152344, "global_step": 154288, "epoch": 918} {"train_loss": -11.138206481933594, "global_step": 154289, "epoch": 918} {"train_loss": -10.951717376708984, "global_step": 154290, "epoch": 918} {"train_loss": -11.098409652709961, "global_step": 154291, "epoch": 918} {"train_loss": -11.16501235961914, "global_step": 154292, "epoch": 918} {"train_loss": -11.340341567993164, "global_step": 154293, "epoch": 918} {"train_loss": -11.191006660461426, "global_step": 154294, "epoch": 918} {"train_loss": -11.225011825561523, "global_step": 154295, "epoch": 918} {"train_loss": -11.112565994262695, "global_step": 154296, "epoch": 918} {"train_loss": -11.058150291442871, "global_step": 154297, "epoch": 918} {"train_loss": -10.510461807250977, "global_step": 154298, "epoch": 918} {"train_loss": -10.199105262756348, "global_step": 154299, "epoch": 918} {"train_loss": -10.91313362121582, "global_step": 154300, "epoch": 918} {"train_loss": -10.4575777053833, "global_step": 154301, "epoch": 918} {"train_loss": -9.80699634552002, "global_step": 154302, "epoch": 918} {"train_loss": -10.634078025817871, "global_step": 154303, "epoch": 918} {"train_loss": -10.637750625610352, "global_step": 154304, "epoch": 918} {"train_loss": -8.16810417175293, "global_step": 154305, "epoch": 918} {"train_loss": -10.586275100708008, "global_step": 154306, "epoch": 918} {"train_loss": -8.053210258483887, "global_step": 154307, "epoch": 918} {"train_loss": -10.030704498291016, "global_step": 154308, "epoch": 918} {"train_loss": -8.823264122009277, "global_step": 154309, "epoch": 918} {"train_loss": -8.541261672973633, "global_step": 154310, "epoch": 918} {"train_loss": -9.387106895446777, "global_step": 154311, "epoch": 918} {"train_loss": -7.9351301193237305, "global_step": 154312, "epoch": 918} {"train_loss": -9.570499420166016, "global_step": 154313, "epoch": 918} {"train_loss": -9.861116409301758, "global_step": 154314, "epoch": 918} {"train_loss": -10.302043914794922, "global_step": 154315, "epoch": 918} {"train_loss": -9.210229873657227, "global_step": 154316, "epoch": 918} {"train_loss": -10.253337860107422, "global_step": 154317, "epoch": 918} {"train_loss": -9.079005241394043, "global_step": 154318, "epoch": 918} {"train_loss": -10.150321960449219, "global_step": 154319, "epoch": 918} {"train_loss": -10.080991744995117, "global_step": 154320, "epoch": 918} {"train_loss": -9.499488830566406, "global_step": 154321, "epoch": 918} {"train_loss": -9.946561813354492, "global_step": 154322, "epoch": 918} {"train_loss": -10.173744201660156, "global_step": 154323, "epoch": 918} {"train_loss": -10.12297248840332, "global_step": 154324, "epoch": 918} {"train_loss": -10.063963890075684, "global_step": 154325, "epoch": 918} {"train_loss": -10.354408264160156, "global_step": 154326, "epoch": 918} {"train_loss": -10.219768524169922, "global_step": 154327, "epoch": 918} {"train_loss": -9.944403648376465, "global_step": 154328, "epoch": 918} {"train_loss": -10.57721996307373, "global_step": 154329, "epoch": 918} {"train_loss": -10.068872451782227, "global_step": 154330, "epoch": 918} {"train_loss": -10.255498886108398, "global_step": 154331, "epoch": 918} {"train_loss": -10.332497596740723, "global_step": 154332, "epoch": 918} {"train_loss": -10.205812454223633, "global_step": 154333, "epoch": 918} {"train_loss": -10.3947172164917, "global_step": 154334, "epoch": 918} {"train_loss": -10.32628059387207, "global_step": 154335, "epoch": 918} {"train_loss": -10.542596817016602, "global_step": 154336, "epoch": 918} {"train_loss": -10.268890380859375, "global_step": 154337, "epoch": 918} {"train_loss": -10.458385467529297, "global_step": 154338, "epoch": 918} {"train_loss": -10.383942604064941, "global_step": 154339, "epoch": 918} {"train_loss": -10.302952766418457, "global_step": 154340, "epoch": 918} {"train_loss": -10.559200286865234, "global_step": 154341, "epoch": 918} {"train_loss": -10.691537857055664, "global_step": 154342, "epoch": 918} {"train_loss": -10.549413681030273, "global_step": 154343, "epoch": 918} {"train_loss": -10.569548606872559, "global_step": 154344, "epoch": 918} {"train_loss": -10.60582160949707, "global_step": 154345, "epoch": 918} {"train_loss": -10.60913372039795, "global_step": 154346, "epoch": 918} {"train_loss": -10.713716506958008, "global_step": 154347, "epoch": 918} {"train_loss": -10.521303176879883, "global_step": 154348, "epoch": 918} {"train_loss": -10.542848587036133, "global_step": 154349, "epoch": 918} {"train_loss": -10.64346981048584, "global_step": 154350, "epoch": 918} {"train_loss": -10.609596252441406, "global_step": 154351, "epoch": 918} {"train_loss": -10.752671241760254, "global_step": 154352, "epoch": 918} {"train_loss": -10.666205406188965, "global_step": 154353, "epoch": 918} {"train_loss": -10.551289558410645, "global_step": 154354, "epoch": 918} {"train_loss": -10.787574768066406, "global_step": 154355, "epoch": 918} {"train_loss": -10.724300384521484, "global_step": 154356, "epoch": 918} {"train_loss": -10.78005599975586, "global_step": 154357, "epoch": 918} {"train_loss": -10.844430923461914, "global_step": 154358, "epoch": 918} {"train_loss": -10.88272476196289, "global_step": 154359, "epoch": 918} {"train_loss": -10.896587371826172, "global_step": 154360, "epoch": 918} {"train_loss": -11.113876342773438, "global_step": 154361, "epoch": 918} {"train_loss": -10.870223999023438, "global_step": 154362, "epoch": 918} {"train_loss": -10.683710098266602, "global_step": 154363, "epoch": 918} {"train_loss": -10.999353408813477, "global_step": 154364, "epoch": 918} {"train_loss": -11.002252578735352, "global_step": 154365, "epoch": 918} {"train_loss": -11.018688201904297, "global_step": 154366, "epoch": 918} {"train_loss": -11.148124694824219, "global_step": 154367, "epoch": 918} {"train_loss": -11.148443222045898, "global_step": 154368, "epoch": 918} {"train_loss": -11.077596664428711, "global_step": 154369, "epoch": 918} {"train_loss": -11.092765808105469, "global_step": 154370, "epoch": 918} {"train_loss": -11.14160442352295, "global_step": 154371, "epoch": 918} {"train_loss": -11.287154197692871, "global_step": 154372, "epoch": 918} {"train_loss": -11.260780334472656, "global_step": 154373, "epoch": 918} {"train_loss": -11.208866119384766, "global_step": 154374, "epoch": 918} {"train_loss": -11.18385124206543, "global_step": 154375, "epoch": 918} {"train_loss": -11.13999080657959, "global_step": 154376, "epoch": 918} {"train_loss": -11.172761917114258, "global_step": 154377, "epoch": 918} {"train_loss": -11.287813186645508, "global_step": 154378, "epoch": 918} {"train_loss": -11.205179214477539, "global_step": 154379, "epoch": 918} {"train_loss": -11.186065673828125, "global_step": 154380, "epoch": 918} {"train_loss": -11.100748062133789, "global_step": 154381, "epoch": 918} {"train_loss": -11.313749313354492, "global_step": 154382, "epoch": 918} {"train_loss": -10.839783668518066, "global_step": 154383, "epoch": 918} {"train_loss": -11.136792182922363, "global_step": 154384, "epoch": 918} {"train_loss": -11.19006061553955, "global_step": 154385, "epoch": 918} {"train_loss": -10.795812606811523, "global_step": 154386, "epoch": 918} {"train_loss": -10.97526741027832, "global_step": 154387, "epoch": 918} {"train_loss": -11.133247375488281, "global_step": 154388, "epoch": 918} {"train_loss": -10.948125839233398, "global_step": 154389, "epoch": 918} {"train_loss": -10.2216157913208, "global_step": 154390, "epoch": 918} {"train_loss": -10.530713563873654, "global_step": 154391, "epoch": 918, "val_loss": 232828.375} {"train_loss": -10.866300582885742, "global_step": 154392, "epoch": 919} {"train_loss": -10.49526596069336, "global_step": 154393, "epoch": 919} {"train_loss": -10.570062637329102, "global_step": 154394, "epoch": 919} {"train_loss": -10.934782981872559, "global_step": 154395, "epoch": 919} {"train_loss": -9.92097282409668, "global_step": 154396, "epoch": 919} {"train_loss": -10.623830795288086, "global_step": 154397, "epoch": 919} {"train_loss": -10.833431243896484, "global_step": 154398, "epoch": 919} {"train_loss": -9.907610893249512, "global_step": 154399, "epoch": 919} {"train_loss": -10.431264877319336, "global_step": 154400, "epoch": 919} {"train_loss": -9.620979309082031, "global_step": 154401, "epoch": 919} {"train_loss": -10.356670379638672, "global_step": 154402, "epoch": 919} {"train_loss": -9.143810272216797, "global_step": 154403, "epoch": 919} {"train_loss": -9.779884338378906, "global_step": 154404, "epoch": 919} {"train_loss": -9.352743148803711, "global_step": 154405, "epoch": 919} {"train_loss": -7.990722179412842, "global_step": 154406, "epoch": 919} {"train_loss": -7.801385879516602, "global_step": 154407, "epoch": 919} {"train_loss": -8.183100700378418, "global_step": 154408, "epoch": 919} {"train_loss": -9.75705623626709, "global_step": 154409, "epoch": 919} {"train_loss": -9.387086868286133, "global_step": 154410, "epoch": 919} {"train_loss": -8.909982681274414, "global_step": 154411, "epoch": 919} {"train_loss": -8.290498733520508, "global_step": 154412, "epoch": 919} {"train_loss": -9.825804710388184, "global_step": 154413, "epoch": 919} {"train_loss": -9.122209548950195, "global_step": 154414, "epoch": 919} {"train_loss": -9.493586540222168, "global_step": 154415, "epoch": 919} {"train_loss": -10.166842460632324, "global_step": 154416, "epoch": 919} {"train_loss": -9.592360496520996, "global_step": 154417, "epoch": 919} {"train_loss": -9.653364181518555, "global_step": 154418, "epoch": 919} {"train_loss": -10.094015121459961, "global_step": 154419, "epoch": 919} {"train_loss": -9.721521377563477, "global_step": 154420, "epoch": 919} {"train_loss": -9.662521362304688, "global_step": 154421, "epoch": 919} {"train_loss": -9.819597244262695, "global_step": 154422, "epoch": 919} {"train_loss": -10.032987594604492, "global_step": 154423, "epoch": 919} {"train_loss": -10.321441650390625, "global_step": 154424, "epoch": 919} {"train_loss": -9.845376014709473, "global_step": 154425, "epoch": 919} {"train_loss": -10.027585983276367, "global_step": 154426, "epoch": 919} {"train_loss": -10.247684478759766, "global_step": 154427, "epoch": 919} {"train_loss": -9.64480972290039, "global_step": 154428, "epoch": 919} {"train_loss": -10.275897026062012, "global_step": 154429, "epoch": 919} {"train_loss": -10.342924118041992, "global_step": 154430, "epoch": 919} {"train_loss": -10.250015258789062, "global_step": 154431, "epoch": 919} {"train_loss": -10.387898445129395, "global_step": 154432, "epoch": 919} {"train_loss": -10.290447235107422, "global_step": 154433, "epoch": 919} {"train_loss": -10.283317565917969, "global_step": 154434, "epoch": 919} {"train_loss": -10.26138973236084, "global_step": 154435, "epoch": 919} {"train_loss": -10.326105117797852, "global_step": 154436, "epoch": 919} {"train_loss": -10.395404815673828, "global_step": 154437, "epoch": 919} {"train_loss": -10.28160285949707, "global_step": 154438, "epoch": 919} {"train_loss": -10.426932334899902, "global_step": 154439, "epoch": 919} {"train_loss": -10.49643325805664, "global_step": 154440, "epoch": 919} {"train_loss": -10.468477249145508, "global_step": 154441, "epoch": 919} {"train_loss": -10.70612621307373, "global_step": 154442, "epoch": 919} {"train_loss": -10.352659225463867, "global_step": 154443, "epoch": 919} {"train_loss": -10.615678787231445, "global_step": 154444, "epoch": 919} {"train_loss": -10.677017211914062, "global_step": 154445, "epoch": 919} {"train_loss": -10.317943572998047, "global_step": 154446, "epoch": 919} {"train_loss": -10.61793041229248, "global_step": 154447, "epoch": 919} {"train_loss": -10.552794456481934, "global_step": 154448, "epoch": 919} {"train_loss": -10.626379013061523, "global_step": 154449, "epoch": 919} {"train_loss": -10.545555114746094, "global_step": 154450, "epoch": 919} {"train_loss": -10.659140586853027, "global_step": 154451, "epoch": 919} {"train_loss": -10.866498947143555, "global_step": 154452, "epoch": 919} {"train_loss": -10.862109184265137, "global_step": 154453, "epoch": 919} {"train_loss": -10.740394592285156, "global_step": 154454, "epoch": 919} {"train_loss": -10.894523620605469, "global_step": 154455, "epoch": 919} {"train_loss": -10.77786636352539, "global_step": 154456, "epoch": 919} {"train_loss": -10.660304069519043, "global_step": 154457, "epoch": 919} {"train_loss": -10.90282154083252, "global_step": 154458, "epoch": 919} {"train_loss": -10.751507759094238, "global_step": 154459, "epoch": 919} {"train_loss": -10.897217750549316, "global_step": 154460, "epoch": 919} {"train_loss": -10.98959732055664, "global_step": 154461, "epoch": 919} {"train_loss": -10.969179153442383, "global_step": 154462, "epoch": 919} {"train_loss": -10.908918380737305, "global_step": 154463, "epoch": 919} {"train_loss": -10.795452117919922, "global_step": 154464, "epoch": 919} {"train_loss": -11.081879615783691, "global_step": 154465, "epoch": 919} {"train_loss": -11.215047836303711, "global_step": 154466, "epoch": 919} {"train_loss": -10.809822082519531, "global_step": 154467, "epoch": 919} {"train_loss": -11.231673240661621, "global_step": 154468, "epoch": 919} {"train_loss": -11.244894027709961, "global_step": 154469, "epoch": 919} {"train_loss": -11.118946075439453, "global_step": 154470, "epoch": 919} {"train_loss": -11.174490928649902, "global_step": 154471, "epoch": 919} {"train_loss": -11.155058860778809, "global_step": 154472, "epoch": 919} {"train_loss": -11.042757987976074, "global_step": 154473, "epoch": 919} {"train_loss": -11.143936157226562, "global_step": 154474, "epoch": 919} {"train_loss": -11.121277809143066, "global_step": 154475, "epoch": 919} {"train_loss": -10.957568168640137, "global_step": 154476, "epoch": 919} {"train_loss": -11.000875473022461, "global_step": 154477, "epoch": 919} {"train_loss": -11.149866104125977, "global_step": 154478, "epoch": 919} {"train_loss": -10.989328384399414, "global_step": 154479, "epoch": 919} {"train_loss": -11.204622268676758, "global_step": 154480, "epoch": 919} {"train_loss": -11.213447570800781, "global_step": 154481, "epoch": 919} {"train_loss": -11.102219581604004, "global_step": 154482, "epoch": 919} {"train_loss": -11.067155838012695, "global_step": 154483, "epoch": 919} {"train_loss": -10.765695571899414, "global_step": 154484, "epoch": 919} {"train_loss": -11.02145767211914, "global_step": 154485, "epoch": 919} {"train_loss": -11.11630630493164, "global_step": 154486, "epoch": 919} {"train_loss": -10.92766284942627, "global_step": 154487, "epoch": 919} {"train_loss": -11.362091064453125, "global_step": 154488, "epoch": 919} {"train_loss": -10.866302490234375, "global_step": 154489, "epoch": 919} {"train_loss": -10.944156646728516, "global_step": 154490, "epoch": 919} {"train_loss": -10.93190860748291, "global_step": 154491, "epoch": 919} {"train_loss": -11.073273658752441, "global_step": 154492, "epoch": 919} {"train_loss": -10.963798522949219, "global_step": 154493, "epoch": 919} {"train_loss": -10.382291793823242, "global_step": 154494, "epoch": 919} {"train_loss": -11.098196983337402, "global_step": 154495, "epoch": 919} {"train_loss": -10.885456085205078, "global_step": 154496, "epoch": 919} {"train_loss": -10.009973526000977, "global_step": 154497, "epoch": 919} {"train_loss": -9.667654037475586, "global_step": 154498, "epoch": 919} {"train_loss": -10.736200332641602, "global_step": 154499, "epoch": 919} {"train_loss": -9.848405838012695, "global_step": 154500, "epoch": 919} {"train_loss": -9.534046173095703, "global_step": 154501, "epoch": 919} {"train_loss": -9.328437805175781, "global_step": 154502, "epoch": 919} {"train_loss": -10.146117210388184, "global_step": 154503, "epoch": 919} {"train_loss": -9.191679000854492, "global_step": 154504, "epoch": 919} {"train_loss": -9.859636306762695, "global_step": 154505, "epoch": 919} {"train_loss": -9.816896438598633, "global_step": 154506, "epoch": 919} {"train_loss": -10.042402267456055, "global_step": 154507, "epoch": 919} {"train_loss": -9.870000839233398, "global_step": 154508, "epoch": 919} {"train_loss": -9.852856636047363, "global_step": 154509, "epoch": 919} {"train_loss": -10.715754508972168, "global_step": 154510, "epoch": 919} {"train_loss": -9.612981796264648, "global_step": 154511, "epoch": 919} {"train_loss": -9.974868774414062, "global_step": 154512, "epoch": 919} {"train_loss": -9.988762855529785, "global_step": 154513, "epoch": 919} {"train_loss": -9.8564453125, "global_step": 154514, "epoch": 919} {"train_loss": -10.252359390258789, "global_step": 154515, "epoch": 919} {"train_loss": -10.37722110748291, "global_step": 154516, "epoch": 919} {"train_loss": -10.168757438659668, "global_step": 154517, "epoch": 919} {"train_loss": -10.2975435256958, "global_step": 154518, "epoch": 919} {"train_loss": -10.290016174316406, "global_step": 154519, "epoch": 919} {"train_loss": -10.238593101501465, "global_step": 154520, "epoch": 919} {"train_loss": -10.31785774230957, "global_step": 154521, "epoch": 919} {"train_loss": -10.243497848510742, "global_step": 154522, "epoch": 919} {"train_loss": -10.350458145141602, "global_step": 154523, "epoch": 919} {"train_loss": -10.414436340332031, "global_step": 154524, "epoch": 919} {"train_loss": -10.367990493774414, "global_step": 154525, "epoch": 919} {"train_loss": -10.411983489990234, "global_step": 154526, "epoch": 919} {"train_loss": -10.586678504943848, "global_step": 154527, "epoch": 919} {"train_loss": -10.530123710632324, "global_step": 154528, "epoch": 919} {"train_loss": -10.712486267089844, "global_step": 154529, "epoch": 919} {"train_loss": -10.63110637664795, "global_step": 154530, "epoch": 919} {"train_loss": -10.870550155639648, "global_step": 154531, "epoch": 919} {"train_loss": -10.365570068359375, "global_step": 154532, "epoch": 919} {"train_loss": -10.74267864227295, "global_step": 154533, "epoch": 919} {"train_loss": -10.581573486328125, "global_step": 154534, "epoch": 919} {"train_loss": -10.438228607177734, "global_step": 154535, "epoch": 919} {"train_loss": -10.49860668182373, "global_step": 154536, "epoch": 919} {"train_loss": -10.645751953125, "global_step": 154537, "epoch": 919} {"train_loss": -10.510932922363281, "global_step": 154538, "epoch": 919} {"train_loss": -10.522726058959961, "global_step": 154539, "epoch": 919} {"train_loss": -10.43708610534668, "global_step": 154540, "epoch": 919} {"train_loss": -10.427186965942383, "global_step": 154541, "epoch": 919} {"train_loss": -10.813776016235352, "global_step": 154542, "epoch": 919} {"train_loss": -10.22913646697998, "global_step": 154543, "epoch": 919} {"train_loss": -10.620209693908691, "global_step": 154544, "epoch": 919} {"train_loss": -10.363680839538574, "global_step": 154545, "epoch": 919} {"train_loss": -10.858556747436523, "global_step": 154546, "epoch": 919} {"train_loss": -10.463879585266113, "global_step": 154547, "epoch": 919} {"train_loss": -10.777900695800781, "global_step": 154548, "epoch": 919} {"train_loss": -10.46900749206543, "global_step": 154549, "epoch": 919} {"train_loss": -10.70434856414795, "global_step": 154550, "epoch": 919} {"train_loss": -10.929421424865723, "global_step": 154551, "epoch": 919} {"train_loss": -10.503677368164062, "global_step": 154552, "epoch": 919} {"train_loss": -10.744291305541992, "global_step": 154553, "epoch": 919} {"train_loss": -10.62736701965332, "global_step": 154554, "epoch": 919} {"train_loss": -10.958444595336914, "global_step": 154555, "epoch": 919} {"train_loss": -10.74740219116211, "global_step": 154556, "epoch": 919} {"train_loss": -11.093596458435059, "global_step": 154557, "epoch": 919} {"train_loss": -10.587461471557617, "global_step": 154558, "epoch": 919} {"train_loss": -10.401500988574256, "global_step": 154559, "epoch": 919, "val_loss": 225309.25} {"train_loss": -10.507015228271484, "global_step": 154560, "epoch": 920} {"train_loss": -10.923226356506348, "global_step": 154561, "epoch": 920} {"train_loss": -10.785449028015137, "global_step": 154562, "epoch": 920} {"train_loss": -10.780804634094238, "global_step": 154563, "epoch": 920} {"train_loss": -10.45364761352539, "global_step": 154564, "epoch": 920} {"train_loss": -10.710723876953125, "global_step": 154565, "epoch": 920} {"train_loss": -10.146661758422852, "global_step": 154566, "epoch": 920} {"train_loss": -10.156478881835938, "global_step": 154567, "epoch": 920} {"train_loss": -10.580900192260742, "global_step": 154568, "epoch": 920} {"train_loss": -10.69031047821045, "global_step": 154569, "epoch": 920} {"train_loss": -10.46828556060791, "global_step": 154570, "epoch": 920} {"train_loss": -10.908292770385742, "global_step": 154571, "epoch": 920} {"train_loss": -10.307876586914062, "global_step": 154572, "epoch": 920} {"train_loss": -10.854145050048828, "global_step": 154573, "epoch": 920} {"train_loss": -10.539447784423828, "global_step": 154574, "epoch": 920} {"train_loss": -10.85084342956543, "global_step": 154575, "epoch": 920} {"train_loss": -10.607278823852539, "global_step": 154576, "epoch": 920} {"train_loss": -10.689599990844727, "global_step": 154577, "epoch": 920} {"train_loss": -10.631162643432617, "global_step": 154578, "epoch": 920} {"train_loss": -10.745874404907227, "global_step": 154579, "epoch": 920} {"train_loss": -10.740434646606445, "global_step": 154580, "epoch": 920} {"train_loss": -10.785263061523438, "global_step": 154581, "epoch": 920} {"train_loss": -10.634316444396973, "global_step": 154582, "epoch": 920} {"train_loss": -10.608372688293457, "global_step": 154583, "epoch": 920} {"train_loss": -10.480939865112305, "global_step": 154584, "epoch": 920} {"train_loss": -10.792866706848145, "global_step": 154585, "epoch": 920} {"train_loss": -10.781726837158203, "global_step": 154586, "epoch": 920} {"train_loss": -10.441253662109375, "global_step": 154587, "epoch": 920} {"train_loss": -10.952975273132324, "global_step": 154588, "epoch": 920} {"train_loss": -10.761615753173828, "global_step": 154589, "epoch": 920} {"train_loss": -10.914498329162598, "global_step": 154590, "epoch": 920} {"train_loss": -10.796756744384766, "global_step": 154591, "epoch": 920} {"train_loss": -11.043834686279297, "global_step": 154592, "epoch": 920} {"train_loss": -10.961081504821777, "global_step": 154593, "epoch": 920} {"train_loss": -10.823507308959961, "global_step": 154594, "epoch": 920} {"train_loss": -11.010942459106445, "global_step": 154595, "epoch": 920} {"train_loss": -10.987789154052734, "global_step": 154596, "epoch": 920} {"train_loss": -10.975794792175293, "global_step": 154597, "epoch": 920} {"train_loss": -10.969390869140625, "global_step": 154598, "epoch": 920} {"train_loss": -11.150777816772461, "global_step": 154599, "epoch": 920} {"train_loss": -10.964508056640625, "global_step": 154600, "epoch": 920} {"train_loss": -10.917551040649414, "global_step": 154601, "epoch": 920} {"train_loss": -10.773067474365234, "global_step": 154602, "epoch": 920} {"train_loss": -10.921310424804688, "global_step": 154603, "epoch": 920} {"train_loss": -10.914934158325195, "global_step": 154604, "epoch": 920} {"train_loss": -11.007035255432129, "global_step": 154605, "epoch": 920} {"train_loss": -10.89635181427002, "global_step": 154606, "epoch": 920} {"train_loss": -11.054040908813477, "global_step": 154607, "epoch": 920} {"train_loss": -11.159219741821289, "global_step": 154608, "epoch": 920} {"train_loss": -10.954940795898438, "global_step": 154609, "epoch": 920} {"train_loss": -11.040681838989258, "global_step": 154610, "epoch": 920} {"train_loss": -10.806573867797852, "global_step": 154611, "epoch": 920} {"train_loss": -10.931938171386719, "global_step": 154612, "epoch": 920} {"train_loss": -11.048952102661133, "global_step": 154613, "epoch": 920} {"train_loss": -10.776788711547852, "global_step": 154614, "epoch": 920} {"train_loss": -11.097648620605469, "global_step": 154615, "epoch": 920} {"train_loss": -10.97718620300293, "global_step": 154616, "epoch": 920} {"train_loss": -11.243561744689941, "global_step": 154617, "epoch": 920} {"train_loss": -11.107948303222656, "global_step": 154618, "epoch": 920} {"train_loss": -11.124215126037598, "global_step": 154619, "epoch": 920} {"train_loss": -11.066041946411133, "global_step": 154620, "epoch": 920} {"train_loss": -10.839313507080078, "global_step": 154621, "epoch": 920} {"train_loss": -10.82974624633789, "global_step": 154622, "epoch": 920} {"train_loss": -10.805635452270508, "global_step": 154623, "epoch": 920} {"train_loss": -10.933316230773926, "global_step": 154624, "epoch": 920} {"train_loss": -10.640701293945312, "global_step": 154625, "epoch": 920} {"train_loss": -10.863449096679688, "global_step": 154626, "epoch": 920} {"train_loss": -10.844253540039062, "global_step": 154627, "epoch": 920} {"train_loss": -10.582401275634766, "global_step": 154628, "epoch": 920} {"train_loss": -10.706951141357422, "global_step": 154629, "epoch": 920} {"train_loss": -10.66625690460205, "global_step": 154630, "epoch": 920} {"train_loss": -10.284686088562012, "global_step": 154631, "epoch": 920} {"train_loss": -10.796009063720703, "global_step": 154632, "epoch": 920} {"train_loss": -10.551485061645508, "global_step": 154633, "epoch": 920} {"train_loss": -10.439632415771484, "global_step": 154634, "epoch": 920} {"train_loss": -10.505179405212402, "global_step": 154635, "epoch": 920} {"train_loss": -10.313722610473633, "global_step": 154636, "epoch": 920} {"train_loss": -10.043874740600586, "global_step": 154637, "epoch": 920} {"train_loss": -10.474237442016602, "global_step": 154638, "epoch": 920} {"train_loss": -9.789939880371094, "global_step": 154639, "epoch": 920} {"train_loss": -10.082064628601074, "global_step": 154640, "epoch": 920} {"train_loss": -10.381977081298828, "global_step": 154641, "epoch": 920} {"train_loss": -10.161884307861328, "global_step": 154642, "epoch": 920} {"train_loss": -10.569658279418945, "global_step": 154643, "epoch": 920} {"train_loss": -10.15283203125, "global_step": 154644, "epoch": 920} {"train_loss": -9.816976547241211, "global_step": 154645, "epoch": 920} {"train_loss": -10.354947090148926, "global_step": 154646, "epoch": 920} {"train_loss": -9.967802047729492, "global_step": 154647, "epoch": 920} {"train_loss": -10.235381126403809, "global_step": 154648, "epoch": 920} {"train_loss": -9.714834213256836, "global_step": 154649, "epoch": 920} {"train_loss": -10.325096130371094, "global_step": 154650, "epoch": 920} {"train_loss": -10.026715278625488, "global_step": 154651, "epoch": 920} {"train_loss": -10.151901245117188, "global_step": 154652, "epoch": 920} {"train_loss": -10.402608871459961, "global_step": 154653, "epoch": 920} {"train_loss": -10.162008285522461, "global_step": 154654, "epoch": 920} {"train_loss": -10.027715682983398, "global_step": 154655, "epoch": 920} {"train_loss": -9.413721084594727, "global_step": 154656, "epoch": 920} {"train_loss": -9.828407287597656, "global_step": 154657, "epoch": 920} {"train_loss": -9.004230499267578, "global_step": 154658, "epoch": 920} {"train_loss": -10.097481727600098, "global_step": 154659, "epoch": 920} {"train_loss": -9.247968673706055, "global_step": 154660, "epoch": 920} {"train_loss": -9.418767929077148, "global_step": 154661, "epoch": 920} {"train_loss": -10.427247047424316, "global_step": 154662, "epoch": 920} {"train_loss": -9.258577346801758, "global_step": 154663, "epoch": 920} {"train_loss": -10.479959487915039, "global_step": 154664, "epoch": 920} {"train_loss": -9.705684661865234, "global_step": 154665, "epoch": 920} {"train_loss": -10.022356033325195, "global_step": 154666, "epoch": 920} {"train_loss": -10.41733169555664, "global_step": 154667, "epoch": 920} {"train_loss": -9.725170135498047, "global_step": 154668, "epoch": 920} {"train_loss": -10.294401168823242, "global_step": 154669, "epoch": 920} {"train_loss": -10.42031192779541, "global_step": 154670, "epoch": 920} {"train_loss": -10.174680709838867, "global_step": 154671, "epoch": 920} {"train_loss": -10.447280883789062, "global_step": 154672, "epoch": 920} {"train_loss": -10.213584899902344, "global_step": 154673, "epoch": 920} {"train_loss": -10.476167678833008, "global_step": 154674, "epoch": 920} {"train_loss": -10.395147323608398, "global_step": 154675, "epoch": 920} {"train_loss": -10.446752548217773, "global_step": 154676, "epoch": 920} {"train_loss": -10.507272720336914, "global_step": 154677, "epoch": 920} {"train_loss": -10.606637954711914, "global_step": 154678, "epoch": 920} {"train_loss": -10.595830917358398, "global_step": 154679, "epoch": 920} {"train_loss": -10.6475830078125, "global_step": 154680, "epoch": 920} {"train_loss": -10.319902420043945, "global_step": 154681, "epoch": 920} {"train_loss": -10.571812629699707, "global_step": 154682, "epoch": 920} {"train_loss": -10.531143188476562, "global_step": 154683, "epoch": 920} {"train_loss": -10.76175308227539, "global_step": 154684, "epoch": 920} {"train_loss": -10.799894332885742, "global_step": 154685, "epoch": 920} {"train_loss": -10.628552436828613, "global_step": 154686, "epoch": 920} {"train_loss": -10.764772415161133, "global_step": 154687, "epoch": 920} {"train_loss": -10.541576385498047, "global_step": 154688, "epoch": 920} {"train_loss": -10.785243034362793, "global_step": 154689, "epoch": 920} {"train_loss": -11.003094673156738, "global_step": 154690, "epoch": 920} {"train_loss": -10.952310562133789, "global_step": 154691, "epoch": 920} {"train_loss": -10.68797492980957, "global_step": 154692, "epoch": 920} {"train_loss": -10.920082092285156, "global_step": 154693, "epoch": 920} {"train_loss": -10.93878173828125, "global_step": 154694, "epoch": 920} {"train_loss": -10.813621520996094, "global_step": 154695, "epoch": 920} {"train_loss": -10.841072082519531, "global_step": 154696, "epoch": 920} {"train_loss": -10.748174667358398, "global_step": 154697, "epoch": 920} {"train_loss": -10.812407493591309, "global_step": 154698, "epoch": 920} {"train_loss": -11.039915084838867, "global_step": 154699, "epoch": 920} {"train_loss": -10.973237037658691, "global_step": 154700, "epoch": 920} {"train_loss": -10.98226547241211, "global_step": 154701, "epoch": 920} {"train_loss": -10.788557052612305, "global_step": 154702, "epoch": 920} {"train_loss": -10.833983421325684, "global_step": 154703, "epoch": 920} {"train_loss": -11.08802604675293, "global_step": 154704, "epoch": 920} {"train_loss": -11.074886322021484, "global_step": 154705, "epoch": 920} {"train_loss": -11.14834213256836, "global_step": 154706, "epoch": 920} {"train_loss": -11.165766716003418, "global_step": 154707, "epoch": 920} {"train_loss": -11.056291580200195, "global_step": 154708, "epoch": 920} {"train_loss": -11.038589477539062, "global_step": 154709, "epoch": 920} {"train_loss": -11.11274528503418, "global_step": 154710, "epoch": 920} {"train_loss": -10.946967124938965, "global_step": 154711, "epoch": 920} {"train_loss": -11.070669174194336, "global_step": 154712, "epoch": 920} {"train_loss": -10.968696594238281, "global_step": 154713, "epoch": 920} {"train_loss": -11.032797813415527, "global_step": 154714, "epoch": 920} {"train_loss": -11.048507690429688, "global_step": 154715, "epoch": 920} {"train_loss": -11.017483711242676, "global_step": 154716, "epoch": 920} {"train_loss": -11.117663383483887, "global_step": 154717, "epoch": 920} {"train_loss": -10.973931312561035, "global_step": 154718, "epoch": 920} {"train_loss": -11.207633972167969, "global_step": 154719, "epoch": 920} {"train_loss": -10.572303771972656, "global_step": 154720, "epoch": 920} {"train_loss": -11.101591110229492, "global_step": 154721, "epoch": 920} {"train_loss": -11.010520935058594, "global_step": 154722, "epoch": 920} {"train_loss": -11.054027557373047, "global_step": 154723, "epoch": 920} {"train_loss": -11.04470443725586, "global_step": 154724, "epoch": 920} {"train_loss": -11.116368293762207, "global_step": 154725, "epoch": 920} {"train_loss": -11.01130485534668, "global_step": 154726, "epoch": 920} {"train_loss": -10.645949988138108, "global_step": 154727, "epoch": 920, "val_loss": 227719.28125, "train_action_mse_error": 1.6064496040344238} {"train_loss": -9.98773193359375, "global_step": 154728, "epoch": 921} {"train_loss": -10.555140495300293, "global_step": 154729, "epoch": 921} {"train_loss": -10.686864852905273, "global_step": 154730, "epoch": 921} {"train_loss": -10.322338104248047, "global_step": 154731, "epoch": 921} {"train_loss": -10.745112419128418, "global_step": 154732, "epoch": 921} {"train_loss": -11.018651962280273, "global_step": 154733, "epoch": 921} {"train_loss": -10.604244232177734, "global_step": 154734, "epoch": 921} {"train_loss": -10.958596229553223, "global_step": 154735, "epoch": 921} {"train_loss": -10.786066055297852, "global_step": 154736, "epoch": 921} {"train_loss": -10.718048095703125, "global_step": 154737, "epoch": 921} {"train_loss": -10.599946022033691, "global_step": 154738, "epoch": 921} {"train_loss": -10.458337783813477, "global_step": 154739, "epoch": 921} {"train_loss": -10.588235855102539, "global_step": 154740, "epoch": 921} {"train_loss": -10.674735069274902, "global_step": 154741, "epoch": 921} {"train_loss": -10.48709487915039, "global_step": 154742, "epoch": 921} {"train_loss": -10.931023597717285, "global_step": 154743, "epoch": 921} {"train_loss": -9.760855674743652, "global_step": 154744, "epoch": 921} {"train_loss": -10.50764274597168, "global_step": 154745, "epoch": 921} {"train_loss": -10.337396621704102, "global_step": 154746, "epoch": 921} {"train_loss": -10.197593688964844, "global_step": 154747, "epoch": 921} {"train_loss": -10.528495788574219, "global_step": 154748, "epoch": 921} {"train_loss": -10.681291580200195, "global_step": 154749, "epoch": 921} {"train_loss": -10.904989242553711, "global_step": 154750, "epoch": 921} {"train_loss": -10.549637794494629, "global_step": 154751, "epoch": 921} {"train_loss": -10.804407119750977, "global_step": 154752, "epoch": 921} {"train_loss": -10.661445617675781, "global_step": 154753, "epoch": 921} {"train_loss": -10.502357482910156, "global_step": 154754, "epoch": 921} {"train_loss": -10.965076446533203, "global_step": 154755, "epoch": 921} {"train_loss": -10.837788581848145, "global_step": 154756, "epoch": 921} {"train_loss": -10.308469772338867, "global_step": 154757, "epoch": 921} {"train_loss": -10.927842140197754, "global_step": 154758, "epoch": 921} {"train_loss": -10.334651947021484, "global_step": 154759, "epoch": 921} {"train_loss": -10.812716484069824, "global_step": 154760, "epoch": 921} {"train_loss": -10.395252227783203, "global_step": 154761, "epoch": 921} {"train_loss": -10.578069686889648, "global_step": 154762, "epoch": 921} {"train_loss": -10.137826919555664, "global_step": 154763, "epoch": 921} {"train_loss": -10.675769805908203, "global_step": 154764, "epoch": 921} {"train_loss": -10.428319931030273, "global_step": 154765, "epoch": 921} {"train_loss": -10.95862102508545, "global_step": 154766, "epoch": 921} {"train_loss": -10.532573699951172, "global_step": 154767, "epoch": 921} {"train_loss": -10.804969787597656, "global_step": 154768, "epoch": 921} {"train_loss": -10.86467170715332, "global_step": 154769, "epoch": 921} {"train_loss": -10.663785934448242, "global_step": 154770, "epoch": 921} {"train_loss": -10.946849822998047, "global_step": 154771, "epoch": 921} {"train_loss": -10.88100814819336, "global_step": 154772, "epoch": 921} {"train_loss": -10.85224723815918, "global_step": 154773, "epoch": 921} {"train_loss": -10.9412841796875, "global_step": 154774, "epoch": 921} {"train_loss": -10.66602897644043, "global_step": 154775, "epoch": 921} {"train_loss": -10.810014724731445, "global_step": 154776, "epoch": 921} {"train_loss": -10.92410659790039, "global_step": 154777, "epoch": 921} {"train_loss": -10.790264129638672, "global_step": 154778, "epoch": 921} {"train_loss": -10.988492965698242, "global_step": 154779, "epoch": 921} {"train_loss": -10.97097396850586, "global_step": 154780, "epoch": 921} {"train_loss": -10.864999771118164, "global_step": 154781, "epoch": 921} {"train_loss": -10.913684844970703, "global_step": 154782, "epoch": 921} {"train_loss": -10.568229675292969, "global_step": 154783, "epoch": 921} {"train_loss": -10.952356338500977, "global_step": 154784, "epoch": 921} {"train_loss": -10.74046516418457, "global_step": 154785, "epoch": 921} {"train_loss": -10.884602546691895, "global_step": 154786, "epoch": 921} {"train_loss": -10.860925674438477, "global_step": 154787, "epoch": 921} {"train_loss": -10.941216468811035, "global_step": 154788, "epoch": 921} {"train_loss": -11.201085090637207, "global_step": 154789, "epoch": 921} {"train_loss": -10.915679931640625, "global_step": 154790, "epoch": 921} {"train_loss": -10.87867546081543, "global_step": 154791, "epoch": 921} {"train_loss": -11.098252296447754, "global_step": 154792, "epoch": 921} {"train_loss": -11.017083168029785, "global_step": 154793, "epoch": 921} {"train_loss": -10.80133056640625, "global_step": 154794, "epoch": 921} {"train_loss": -10.976930618286133, "global_step": 154795, "epoch": 921} {"train_loss": -10.994258880615234, "global_step": 154796, "epoch": 921} {"train_loss": -10.957454681396484, "global_step": 154797, "epoch": 921} {"train_loss": -10.992195129394531, "global_step": 154798, "epoch": 921} {"train_loss": -10.90866470336914, "global_step": 154799, "epoch": 921} {"train_loss": -10.86266040802002, "global_step": 154800, "epoch": 921} {"train_loss": -10.864974975585938, "global_step": 154801, "epoch": 921} {"train_loss": -10.88255500793457, "global_step": 154802, "epoch": 921} {"train_loss": -10.816149711608887, "global_step": 154803, "epoch": 921} {"train_loss": -11.240041732788086, "global_step": 154804, "epoch": 921} {"train_loss": -10.840194702148438, "global_step": 154805, "epoch": 921} {"train_loss": -10.91477108001709, "global_step": 154806, "epoch": 921} {"train_loss": -10.957453727722168, "global_step": 154807, "epoch": 921} {"train_loss": -11.123537063598633, "global_step": 154808, "epoch": 921} {"train_loss": -10.917588233947754, "global_step": 154809, "epoch": 921} {"train_loss": -10.650978088378906, "global_step": 154810, "epoch": 921} {"train_loss": -11.00640869140625, "global_step": 154811, "epoch": 921} {"train_loss": -10.908267974853516, "global_step": 154812, "epoch": 921} {"train_loss": -10.770258903503418, "global_step": 154813, "epoch": 921} {"train_loss": -10.773652076721191, "global_step": 154814, "epoch": 921} {"train_loss": -10.903606414794922, "global_step": 154815, "epoch": 921} {"train_loss": -10.789734840393066, "global_step": 154816, "epoch": 921} {"train_loss": -10.907207489013672, "global_step": 154817, "epoch": 921} {"train_loss": -10.836074829101562, "global_step": 154818, "epoch": 921} {"train_loss": -10.802046775817871, "global_step": 154819, "epoch": 921} {"train_loss": -10.91446304321289, "global_step": 154820, "epoch": 921} {"train_loss": -10.496143341064453, "global_step": 154821, "epoch": 921} {"train_loss": -10.455118179321289, "global_step": 154822, "epoch": 921} {"train_loss": -9.860794067382812, "global_step": 154823, "epoch": 921} {"train_loss": -10.317164421081543, "global_step": 154824, "epoch": 921} {"train_loss": -9.724967956542969, "global_step": 154825, "epoch": 921} {"train_loss": -9.409682273864746, "global_step": 154826, "epoch": 921} {"train_loss": -9.614259719848633, "global_step": 154827, "epoch": 921} {"train_loss": -8.814861297607422, "global_step": 154828, "epoch": 921} {"train_loss": -8.863418579101562, "global_step": 154829, "epoch": 921} {"train_loss": -10.539480209350586, "global_step": 154830, "epoch": 921} {"train_loss": -9.331907272338867, "global_step": 154831, "epoch": 921} {"train_loss": -10.172961235046387, "global_step": 154832, "epoch": 921} {"train_loss": -9.699377059936523, "global_step": 154833, "epoch": 921} {"train_loss": -9.880620956420898, "global_step": 154834, "epoch": 921} {"train_loss": -10.086602210998535, "global_step": 154835, "epoch": 921} {"train_loss": -10.036913871765137, "global_step": 154836, "epoch": 921} {"train_loss": -9.694270133972168, "global_step": 154837, "epoch": 921} {"train_loss": -10.648524284362793, "global_step": 154838, "epoch": 921} {"train_loss": -9.80919075012207, "global_step": 154839, "epoch": 921} {"train_loss": -10.285261154174805, "global_step": 154840, "epoch": 921} {"train_loss": -9.456869125366211, "global_step": 154841, "epoch": 921} {"train_loss": -10.675500869750977, "global_step": 154842, "epoch": 921} {"train_loss": -9.864799499511719, "global_step": 154843, "epoch": 921} {"train_loss": -9.95944595336914, "global_step": 154844, "epoch": 921} {"train_loss": -10.172346115112305, "global_step": 154845, "epoch": 921} {"train_loss": -9.801191329956055, "global_step": 154846, "epoch": 921} {"train_loss": -10.564502716064453, "global_step": 154847, "epoch": 921} {"train_loss": -10.217390060424805, "global_step": 154848, "epoch": 921} {"train_loss": -10.15372085571289, "global_step": 154849, "epoch": 921} {"train_loss": -10.18147087097168, "global_step": 154850, "epoch": 921} {"train_loss": -9.808696746826172, "global_step": 154851, "epoch": 921} {"train_loss": -10.361894607543945, "global_step": 154852, "epoch": 921} {"train_loss": -10.269444465637207, "global_step": 154853, "epoch": 921} {"train_loss": -9.978994369506836, "global_step": 154854, "epoch": 921} {"train_loss": -10.596898078918457, "global_step": 154855, "epoch": 921} {"train_loss": -10.317455291748047, "global_step": 154856, "epoch": 921} {"train_loss": -10.089107513427734, "global_step": 154857, "epoch": 921} {"train_loss": -10.461499214172363, "global_step": 154858, "epoch": 921} {"train_loss": -10.48336410522461, "global_step": 154859, "epoch": 921} {"train_loss": -10.454421997070312, "global_step": 154860, "epoch": 921} {"train_loss": -10.504079818725586, "global_step": 154861, "epoch": 921} {"train_loss": -10.639287948608398, "global_step": 154862, "epoch": 921} {"train_loss": -10.471243858337402, "global_step": 154863, "epoch": 921} {"train_loss": -10.735372543334961, "global_step": 154864, "epoch": 921} {"train_loss": -10.489625930786133, "global_step": 154865, "epoch": 921} {"train_loss": -10.770095825195312, "global_step": 154866, "epoch": 921} {"train_loss": -10.502269744873047, "global_step": 154867, "epoch": 921} {"train_loss": -10.687638282775879, "global_step": 154868, "epoch": 921} {"train_loss": -10.488082885742188, "global_step": 154869, "epoch": 921} {"train_loss": -10.620330810546875, "global_step": 154870, "epoch": 921} {"train_loss": -10.675369262695312, "global_step": 154871, "epoch": 921} {"train_loss": -10.658830642700195, "global_step": 154872, "epoch": 921} {"train_loss": -10.88547134399414, "global_step": 154873, "epoch": 921} {"train_loss": -10.796440124511719, "global_step": 154874, "epoch": 921} {"train_loss": -10.92753791809082, "global_step": 154875, "epoch": 921} {"train_loss": -10.704894065856934, "global_step": 154876, "epoch": 921} {"train_loss": -10.867509841918945, "global_step": 154877, "epoch": 921} {"train_loss": -10.879804611206055, "global_step": 154878, "epoch": 921} {"train_loss": -10.812318801879883, "global_step": 154879, "epoch": 921} {"train_loss": -10.901203155517578, "global_step": 154880, "epoch": 921} {"train_loss": -10.935953140258789, "global_step": 154881, "epoch": 921} {"train_loss": -10.83747673034668, "global_step": 154882, "epoch": 921} {"train_loss": -10.811655044555664, "global_step": 154883, "epoch": 921} {"train_loss": -11.059176445007324, "global_step": 154884, "epoch": 921} {"train_loss": -10.87272834777832, "global_step": 154885, "epoch": 921} {"train_loss": -10.77261734008789, "global_step": 154886, "epoch": 921} {"train_loss": -10.948614120483398, "global_step": 154887, "epoch": 921} {"train_loss": -10.946564674377441, "global_step": 154888, "epoch": 921} {"train_loss": -10.9727144241333, "global_step": 154889, "epoch": 921} {"train_loss": -11.18378734588623, "global_step": 154890, "epoch": 921} {"train_loss": -11.110603332519531, "global_step": 154891, "epoch": 921} {"train_loss": -11.199320793151855, "global_step": 154892, "epoch": 921} {"train_loss": -11.069841384887695, "global_step": 154893, "epoch": 921} {"train_loss": -10.958503723144531, "global_step": 154894, "epoch": 921} {"train_loss": -10.601063285555158, "global_step": 154895, "epoch": 921, "val_loss": 231492.921875} {"train_loss": -11.22784423828125, "global_step": 154896, "epoch": 922} {"train_loss": -11.033337593078613, "global_step": 154897, "epoch": 922} {"train_loss": -11.095702171325684, "global_step": 154898, "epoch": 922} {"train_loss": -10.97978401184082, "global_step": 154899, "epoch": 922} {"train_loss": -10.897102355957031, "global_step": 154900, "epoch": 922} {"train_loss": -11.194198608398438, "global_step": 154901, "epoch": 922} {"train_loss": -10.841357231140137, "global_step": 154902, "epoch": 922} {"train_loss": -10.892023086547852, "global_step": 154903, "epoch": 922} {"train_loss": -10.986922264099121, "global_step": 154904, "epoch": 922} {"train_loss": -10.84847640991211, "global_step": 154905, "epoch": 922} {"train_loss": -10.550267219543457, "global_step": 154906, "epoch": 922} {"train_loss": -10.327798843383789, "global_step": 154907, "epoch": 922} {"train_loss": -10.793038368225098, "global_step": 154908, "epoch": 922} {"train_loss": -10.419364929199219, "global_step": 154909, "epoch": 922} {"train_loss": -10.671411514282227, "global_step": 154910, "epoch": 922} {"train_loss": -10.7662992477417, "global_step": 154911, "epoch": 922} {"train_loss": -10.741741180419922, "global_step": 154912, "epoch": 922} {"train_loss": -10.7357177734375, "global_step": 154913, "epoch": 922} {"train_loss": -11.051596641540527, "global_step": 154914, "epoch": 922} {"train_loss": -10.969252586364746, "global_step": 154915, "epoch": 922} {"train_loss": -11.102180480957031, "global_step": 154916, "epoch": 922} {"train_loss": -10.866744995117188, "global_step": 154917, "epoch": 922} {"train_loss": -10.7855224609375, "global_step": 154918, "epoch": 922} {"train_loss": -10.590815544128418, "global_step": 154919, "epoch": 922} {"train_loss": -10.924956321716309, "global_step": 154920, "epoch": 922} {"train_loss": -10.353835105895996, "global_step": 154921, "epoch": 922} {"train_loss": -10.713600158691406, "global_step": 154922, "epoch": 922} {"train_loss": -10.638062477111816, "global_step": 154923, "epoch": 922} {"train_loss": -10.590662002563477, "global_step": 154924, "epoch": 922} {"train_loss": -10.828950881958008, "global_step": 154925, "epoch": 922} {"train_loss": -10.222742080688477, "global_step": 154926, "epoch": 922} {"train_loss": -10.495959281921387, "global_step": 154927, "epoch": 922} {"train_loss": -10.622781753540039, "global_step": 154928, "epoch": 922} {"train_loss": -10.515729904174805, "global_step": 154929, "epoch": 922} {"train_loss": -10.659001350402832, "global_step": 154930, "epoch": 922} {"train_loss": -10.713976860046387, "global_step": 154931, "epoch": 922} {"train_loss": -10.975862503051758, "global_step": 154932, "epoch": 922} {"train_loss": -10.644508361816406, "global_step": 154933, "epoch": 922} {"train_loss": -10.701532363891602, "global_step": 154934, "epoch": 922} {"train_loss": -10.881637573242188, "global_step": 154935, "epoch": 922} {"train_loss": -10.726115226745605, "global_step": 154936, "epoch": 922} {"train_loss": -10.571453094482422, "global_step": 154937, "epoch": 922} {"train_loss": -10.923133850097656, "global_step": 154938, "epoch": 922} {"train_loss": -10.80374526977539, "global_step": 154939, "epoch": 922} {"train_loss": -10.824098587036133, "global_step": 154940, "epoch": 922} {"train_loss": -11.222031593322754, "global_step": 154941, "epoch": 922} {"train_loss": -10.845905303955078, "global_step": 154942, "epoch": 922} {"train_loss": -10.94070816040039, "global_step": 154943, "epoch": 922} {"train_loss": -11.073251724243164, "global_step": 154944, "epoch": 922} {"train_loss": -10.447206497192383, "global_step": 154945, "epoch": 922} {"train_loss": -10.962333679199219, "global_step": 154946, "epoch": 922} {"train_loss": -10.923425674438477, "global_step": 154947, "epoch": 922} {"train_loss": -10.664674758911133, "global_step": 154948, "epoch": 922} {"train_loss": -10.713737487792969, "global_step": 154949, "epoch": 922} {"train_loss": -11.113174438476562, "global_step": 154950, "epoch": 922} {"train_loss": -10.518518447875977, "global_step": 154951, "epoch": 922} {"train_loss": -10.918746948242188, "global_step": 154952, "epoch": 922} {"train_loss": -9.990621566772461, "global_step": 154953, "epoch": 922} {"train_loss": -10.84184741973877, "global_step": 154954, "epoch": 922} {"train_loss": -10.426515579223633, "global_step": 154955, "epoch": 922} {"train_loss": -10.296334266662598, "global_step": 154956, "epoch": 922} {"train_loss": -11.019685745239258, "global_step": 154957, "epoch": 922} {"train_loss": -10.387845039367676, "global_step": 154958, "epoch": 922} {"train_loss": -10.933773040771484, "global_step": 154959, "epoch": 922} {"train_loss": -10.370800971984863, "global_step": 154960, "epoch": 922} {"train_loss": -10.890775680541992, "global_step": 154961, "epoch": 922} {"train_loss": -10.426315307617188, "global_step": 154962, "epoch": 922} {"train_loss": -10.502182006835938, "global_step": 154963, "epoch": 922} {"train_loss": -10.747902870178223, "global_step": 154964, "epoch": 922} {"train_loss": -10.40633773803711, "global_step": 154965, "epoch": 922} {"train_loss": -10.98823356628418, "global_step": 154966, "epoch": 922} {"train_loss": -10.809623718261719, "global_step": 154967, "epoch": 922} {"train_loss": -10.84161376953125, "global_step": 154968, "epoch": 922} {"train_loss": -10.972410202026367, "global_step": 154969, "epoch": 922} {"train_loss": -10.639516830444336, "global_step": 154970, "epoch": 922} {"train_loss": -10.80116081237793, "global_step": 154971, "epoch": 922} {"train_loss": -10.70134449005127, "global_step": 154972, "epoch": 922} {"train_loss": -10.849458694458008, "global_step": 154973, "epoch": 922} {"train_loss": -10.73669719696045, "global_step": 154974, "epoch": 922} {"train_loss": -10.696712493896484, "global_step": 154975, "epoch": 922} {"train_loss": -10.583141326904297, "global_step": 154976, "epoch": 922} {"train_loss": -10.255840301513672, "global_step": 154977, "epoch": 922} {"train_loss": -10.701925277709961, "global_step": 154978, "epoch": 922} {"train_loss": -10.44993782043457, "global_step": 154979, "epoch": 922} {"train_loss": -10.884244918823242, "global_step": 154980, "epoch": 922} {"train_loss": -10.217348098754883, "global_step": 154981, "epoch": 922} {"train_loss": -10.85110092163086, "global_step": 154982, "epoch": 922} {"train_loss": -10.421093940734863, "global_step": 154983, "epoch": 922} {"train_loss": -10.818244934082031, "global_step": 154984, "epoch": 922} {"train_loss": -10.708657264709473, "global_step": 154985, "epoch": 922} {"train_loss": -10.715936660766602, "global_step": 154986, "epoch": 922} {"train_loss": -10.795745849609375, "global_step": 154987, "epoch": 922} {"train_loss": -10.785123825073242, "global_step": 154988, "epoch": 922} {"train_loss": -10.892778396606445, "global_step": 154989, "epoch": 922} {"train_loss": -10.79904556274414, "global_step": 154990, "epoch": 922} {"train_loss": -10.86521053314209, "global_step": 154991, "epoch": 922} {"train_loss": -10.682256698608398, "global_step": 154992, "epoch": 922} {"train_loss": -10.714399337768555, "global_step": 154993, "epoch": 922} {"train_loss": -10.692089080810547, "global_step": 154994, "epoch": 922} {"train_loss": -10.965831756591797, "global_step": 154995, "epoch": 922} {"train_loss": -10.450642585754395, "global_step": 154996, "epoch": 922} {"train_loss": -10.794597625732422, "global_step": 154997, "epoch": 922} {"train_loss": -10.792304992675781, "global_step": 154998, "epoch": 922} {"train_loss": -10.857803344726562, "global_step": 154999, "epoch": 922} {"train_loss": -10.636341094970703, "global_step": 155000, "epoch": 922} {"train_loss": -10.789619445800781, "global_step": 155001, "epoch": 922} {"train_loss": -10.970440864562988, "global_step": 155002, "epoch": 922} {"train_loss": -10.643173217773438, "global_step": 155003, "epoch": 922} {"train_loss": -10.798086166381836, "global_step": 155004, "epoch": 922} {"train_loss": -10.26414966583252, "global_step": 155005, "epoch": 922} {"train_loss": -10.870624542236328, "global_step": 155006, "epoch": 922} {"train_loss": -10.704753875732422, "global_step": 155007, "epoch": 922} {"train_loss": -10.853925704956055, "global_step": 155008, "epoch": 922} {"train_loss": -10.86758804321289, "global_step": 155009, "epoch": 922} {"train_loss": -10.719181060791016, "global_step": 155010, "epoch": 922} {"train_loss": -11.027128219604492, "global_step": 155011, "epoch": 922} {"train_loss": -10.958106994628906, "global_step": 155012, "epoch": 922} {"train_loss": -10.937925338745117, "global_step": 155013, "epoch": 922} {"train_loss": -10.83339786529541, "global_step": 155014, "epoch": 922} {"train_loss": -10.750982284545898, "global_step": 155015, "epoch": 922} {"train_loss": -11.01268196105957, "global_step": 155016, "epoch": 922} {"train_loss": -10.894134521484375, "global_step": 155017, "epoch": 922} {"train_loss": -10.931787490844727, "global_step": 155018, "epoch": 922} {"train_loss": -10.730955123901367, "global_step": 155019, "epoch": 922} {"train_loss": -10.642526626586914, "global_step": 155020, "epoch": 922} {"train_loss": -10.680948257446289, "global_step": 155021, "epoch": 922} {"train_loss": -10.768877029418945, "global_step": 155022, "epoch": 922} {"train_loss": -11.113189697265625, "global_step": 155023, "epoch": 922} {"train_loss": -10.43765640258789, "global_step": 155024, "epoch": 922} {"train_loss": -10.91657829284668, "global_step": 155025, "epoch": 922} {"train_loss": -10.294711112976074, "global_step": 155026, "epoch": 922} {"train_loss": -10.560726165771484, "global_step": 155027, "epoch": 922} {"train_loss": -10.92226505279541, "global_step": 155028, "epoch": 922} {"train_loss": -10.352149963378906, "global_step": 155029, "epoch": 922} {"train_loss": -10.837783813476562, "global_step": 155030, "epoch": 922} {"train_loss": -10.430550575256348, "global_step": 155031, "epoch": 922} {"train_loss": -10.678062438964844, "global_step": 155032, "epoch": 922} {"train_loss": -10.480514526367188, "global_step": 155033, "epoch": 922} {"train_loss": -10.375160217285156, "global_step": 155034, "epoch": 922} {"train_loss": -10.785392761230469, "global_step": 155035, "epoch": 922} {"train_loss": -10.099634170532227, "global_step": 155036, "epoch": 922} {"train_loss": -10.953173637390137, "global_step": 155037, "epoch": 922} {"train_loss": -10.643237113952637, "global_step": 155038, "epoch": 922} {"train_loss": -10.595680236816406, "global_step": 155039, "epoch": 922} {"train_loss": -10.695884704589844, "global_step": 155040, "epoch": 922} {"train_loss": -10.62714958190918, "global_step": 155041, "epoch": 922} {"train_loss": -10.777029037475586, "global_step": 155042, "epoch": 922} {"train_loss": -10.743797302246094, "global_step": 155043, "epoch": 922} {"train_loss": -10.715385437011719, "global_step": 155044, "epoch": 922} {"train_loss": -10.226905822753906, "global_step": 155045, "epoch": 922} {"train_loss": -10.649347305297852, "global_step": 155046, "epoch": 922} {"train_loss": -10.47147274017334, "global_step": 155047, "epoch": 922} {"train_loss": -10.434532165527344, "global_step": 155048, "epoch": 922} {"train_loss": -10.630632400512695, "global_step": 155049, "epoch": 922} {"train_loss": -10.56912612915039, "global_step": 155050, "epoch": 922} {"train_loss": -10.217764854431152, "global_step": 155051, "epoch": 922} {"train_loss": -10.055017471313477, "global_step": 155052, "epoch": 922} {"train_loss": -10.43558120727539, "global_step": 155053, "epoch": 922} {"train_loss": -10.600014686584473, "global_step": 155054, "epoch": 922} {"train_loss": -10.241559982299805, "global_step": 155055, "epoch": 922} {"train_loss": -11.031859397888184, "global_step": 155056, "epoch": 922} {"train_loss": -10.566561698913574, "global_step": 155057, "epoch": 922} {"train_loss": -10.891478538513184, "global_step": 155058, "epoch": 922} {"train_loss": -10.686412811279297, "global_step": 155059, "epoch": 922} {"train_loss": -10.71888542175293, "global_step": 155060, "epoch": 922} {"train_loss": -10.450387954711914, "global_step": 155061, "epoch": 922} {"train_loss": -10.81512451171875, "global_step": 155062, "epoch": 922} {"train_loss": -10.711619547435216, "global_step": 155063, "epoch": 922, "val_loss": 233029.296875} {"train_loss": -10.877640724182129, "global_step": 155064, "epoch": 923} {"train_loss": -10.930231094360352, "global_step": 155065, "epoch": 923} {"train_loss": -10.786656379699707, "global_step": 155066, "epoch": 923} {"train_loss": -10.592419624328613, "global_step": 155067, "epoch": 923} {"train_loss": -10.737649917602539, "global_step": 155068, "epoch": 923} {"train_loss": -10.783882141113281, "global_step": 155069, "epoch": 923} {"train_loss": -10.645938873291016, "global_step": 155070, "epoch": 923} {"train_loss": -10.846895217895508, "global_step": 155071, "epoch": 923} {"train_loss": -11.019927978515625, "global_step": 155072, "epoch": 923} {"train_loss": -10.724678039550781, "global_step": 155073, "epoch": 923} {"train_loss": -10.92628288269043, "global_step": 155074, "epoch": 923} {"train_loss": -10.917471885681152, "global_step": 155075, "epoch": 923} {"train_loss": -10.620445251464844, "global_step": 155076, "epoch": 923} {"train_loss": -11.0399169921875, "global_step": 155077, "epoch": 923} {"train_loss": -10.559810638427734, "global_step": 155078, "epoch": 923} {"train_loss": -10.783151626586914, "global_step": 155079, "epoch": 923} {"train_loss": -10.570388793945312, "global_step": 155080, "epoch": 923} {"train_loss": -10.686491966247559, "global_step": 155081, "epoch": 923} {"train_loss": -11.039665222167969, "global_step": 155082, "epoch": 923} {"train_loss": -10.963194847106934, "global_step": 155083, "epoch": 923} {"train_loss": -10.451221466064453, "global_step": 155084, "epoch": 923} {"train_loss": -10.631872177124023, "global_step": 155085, "epoch": 923} {"train_loss": -10.690502166748047, "global_step": 155086, "epoch": 923} {"train_loss": -10.481689453125, "global_step": 155087, "epoch": 923} {"train_loss": -10.408787727355957, "global_step": 155088, "epoch": 923} {"train_loss": -10.344270706176758, "global_step": 155089, "epoch": 923} {"train_loss": -10.440641403198242, "global_step": 155090, "epoch": 923} {"train_loss": -10.403818130493164, "global_step": 155091, "epoch": 923} {"train_loss": -10.468910217285156, "global_step": 155092, "epoch": 923} {"train_loss": -10.052763938903809, "global_step": 155093, "epoch": 923} {"train_loss": -10.062472343444824, "global_step": 155094, "epoch": 923} {"train_loss": -9.805013656616211, "global_step": 155095, "epoch": 923} {"train_loss": -9.495086669921875, "global_step": 155096, "epoch": 923} {"train_loss": -10.141143798828125, "global_step": 155097, "epoch": 923} {"train_loss": -8.817582130432129, "global_step": 155098, "epoch": 923} {"train_loss": -10.311184883117676, "global_step": 155099, "epoch": 923} {"train_loss": -8.824947357177734, "global_step": 155100, "epoch": 923} {"train_loss": -10.561798095703125, "global_step": 155101, "epoch": 923} {"train_loss": -9.16309928894043, "global_step": 155102, "epoch": 923} {"train_loss": -10.316734313964844, "global_step": 155103, "epoch": 923} {"train_loss": -9.893945693969727, "global_step": 155104, "epoch": 923} {"train_loss": -10.434555053710938, "global_step": 155105, "epoch": 923} {"train_loss": -10.51864242553711, "global_step": 155106, "epoch": 923} {"train_loss": -10.40735912322998, "global_step": 155107, "epoch": 923} {"train_loss": -10.46673583984375, "global_step": 155108, "epoch": 923} {"train_loss": -10.409727096557617, "global_step": 155109, "epoch": 923} {"train_loss": -10.692495346069336, "global_step": 155110, "epoch": 923} {"train_loss": -10.461236000061035, "global_step": 155111, "epoch": 923} {"train_loss": -10.602165222167969, "global_step": 155112, "epoch": 923} {"train_loss": -10.501376152038574, "global_step": 155113, "epoch": 923} {"train_loss": -10.441827774047852, "global_step": 155114, "epoch": 923} {"train_loss": -10.395322799682617, "global_step": 155115, "epoch": 923} {"train_loss": -10.55006217956543, "global_step": 155116, "epoch": 923} {"train_loss": -10.55352783203125, "global_step": 155117, "epoch": 923} {"train_loss": -10.42512035369873, "global_step": 155118, "epoch": 923} {"train_loss": -10.93984603881836, "global_step": 155119, "epoch": 923} {"train_loss": -10.420448303222656, "global_step": 155120, "epoch": 923} {"train_loss": -10.680220603942871, "global_step": 155121, "epoch": 923} {"train_loss": -10.688074111938477, "global_step": 155122, "epoch": 923} {"train_loss": -10.27957534790039, "global_step": 155123, "epoch": 923} {"train_loss": -10.571657180786133, "global_step": 155124, "epoch": 923} {"train_loss": -10.606813430786133, "global_step": 155125, "epoch": 923} {"train_loss": -10.843358993530273, "global_step": 155126, "epoch": 923} {"train_loss": -10.880434036254883, "global_step": 155127, "epoch": 923} {"train_loss": -10.762523651123047, "global_step": 155128, "epoch": 923} {"train_loss": -10.975872039794922, "global_step": 155129, "epoch": 923} {"train_loss": -10.667404174804688, "global_step": 155130, "epoch": 923} {"train_loss": -10.908899307250977, "global_step": 155131, "epoch": 923} {"train_loss": -10.771610260009766, "global_step": 155132, "epoch": 923} {"train_loss": -10.81307601928711, "global_step": 155133, "epoch": 923} {"train_loss": -10.753313064575195, "global_step": 155134, "epoch": 923} {"train_loss": -10.923383712768555, "global_step": 155135, "epoch": 923} {"train_loss": -10.891530990600586, "global_step": 155136, "epoch": 923} {"train_loss": -10.984060287475586, "global_step": 155137, "epoch": 923} {"train_loss": -10.894758224487305, "global_step": 155138, "epoch": 923} {"train_loss": -10.996131896972656, "global_step": 155139, "epoch": 923} {"train_loss": -11.11530590057373, "global_step": 155140, "epoch": 923} {"train_loss": -10.973182678222656, "global_step": 155141, "epoch": 923} {"train_loss": -11.042486190795898, "global_step": 155142, "epoch": 923} {"train_loss": -10.951356887817383, "global_step": 155143, "epoch": 923} {"train_loss": -11.099126815795898, "global_step": 155144, "epoch": 923} {"train_loss": -10.99718189239502, "global_step": 155145, "epoch": 923} {"train_loss": -11.214587211608887, "global_step": 155146, "epoch": 923} {"train_loss": -10.997588157653809, "global_step": 155147, "epoch": 923} {"train_loss": -11.24567985534668, "global_step": 155148, "epoch": 923} {"train_loss": -11.074703216552734, "global_step": 155149, "epoch": 923} {"train_loss": -11.183911323547363, "global_step": 155150, "epoch": 923} {"train_loss": -11.21506118774414, "global_step": 155151, "epoch": 923} {"train_loss": -11.261529922485352, "global_step": 155152, "epoch": 923} {"train_loss": -11.144065856933594, "global_step": 155153, "epoch": 923} {"train_loss": -11.283890724182129, "global_step": 155154, "epoch": 923} {"train_loss": -11.084857940673828, "global_step": 155155, "epoch": 923} {"train_loss": -10.899641036987305, "global_step": 155156, "epoch": 923} {"train_loss": -11.142122268676758, "global_step": 155157, "epoch": 923} {"train_loss": -11.044795989990234, "global_step": 155158, "epoch": 923} {"train_loss": -10.716676712036133, "global_step": 155159, "epoch": 923} {"train_loss": -11.037378311157227, "global_step": 155160, "epoch": 923} {"train_loss": -10.649136543273926, "global_step": 155161, "epoch": 923} {"train_loss": -10.557558059692383, "global_step": 155162, "epoch": 923} {"train_loss": -10.76340389251709, "global_step": 155163, "epoch": 923} {"train_loss": -10.924949645996094, "global_step": 155164, "epoch": 923} {"train_loss": -10.232866287231445, "global_step": 155165, "epoch": 923} {"train_loss": -10.320257186889648, "global_step": 155166, "epoch": 923} {"train_loss": -10.874898910522461, "global_step": 155167, "epoch": 923} {"train_loss": -10.708337783813477, "global_step": 155168, "epoch": 923} {"train_loss": -10.98823356628418, "global_step": 155169, "epoch": 923} {"train_loss": -10.927316665649414, "global_step": 155170, "epoch": 923} {"train_loss": -10.862495422363281, "global_step": 155171, "epoch": 923} {"train_loss": -10.74073600769043, "global_step": 155172, "epoch": 923} {"train_loss": -10.745529174804688, "global_step": 155173, "epoch": 923} {"train_loss": -10.933914184570312, "global_step": 155174, "epoch": 923} {"train_loss": -10.933837890625, "global_step": 155175, "epoch": 923} {"train_loss": -10.758848190307617, "global_step": 155176, "epoch": 923} {"train_loss": -10.544182777404785, "global_step": 155177, "epoch": 923} {"train_loss": -10.96115493774414, "global_step": 155178, "epoch": 923} {"train_loss": -10.833183288574219, "global_step": 155179, "epoch": 923} {"train_loss": -10.295780181884766, "global_step": 155180, "epoch": 923} {"train_loss": -10.85429573059082, "global_step": 155181, "epoch": 923} {"train_loss": -10.944780349731445, "global_step": 155182, "epoch": 923} {"train_loss": -10.288091659545898, "global_step": 155183, "epoch": 923} {"train_loss": -10.90461540222168, "global_step": 155184, "epoch": 923} {"train_loss": -10.954666137695312, "global_step": 155185, "epoch": 923} {"train_loss": -10.763786315917969, "global_step": 155186, "epoch": 923} {"train_loss": -10.899736404418945, "global_step": 155187, "epoch": 923} {"train_loss": -10.464115142822266, "global_step": 155188, "epoch": 923} {"train_loss": -10.877056121826172, "global_step": 155189, "epoch": 923} {"train_loss": -10.851323127746582, "global_step": 155190, "epoch": 923} {"train_loss": -10.377647399902344, "global_step": 155191, "epoch": 923} {"train_loss": -10.71091365814209, "global_step": 155192, "epoch": 923} {"train_loss": -10.932313919067383, "global_step": 155193, "epoch": 923} {"train_loss": -10.35536003112793, "global_step": 155194, "epoch": 923} {"train_loss": -10.74510383605957, "global_step": 155195, "epoch": 923} {"train_loss": -10.968588829040527, "global_step": 155196, "epoch": 923} {"train_loss": -10.5826997756958, "global_step": 155197, "epoch": 923} {"train_loss": -11.011571884155273, "global_step": 155198, "epoch": 923} {"train_loss": -10.691320419311523, "global_step": 155199, "epoch": 923} {"train_loss": -11.023999214172363, "global_step": 155200, "epoch": 923} {"train_loss": -10.766254425048828, "global_step": 155201, "epoch": 923} {"train_loss": -11.076662063598633, "global_step": 155202, "epoch": 923} {"train_loss": -11.074068069458008, "global_step": 155203, "epoch": 923} {"train_loss": -10.776139259338379, "global_step": 155204, "epoch": 923} {"train_loss": -10.989910125732422, "global_step": 155205, "epoch": 923} {"train_loss": -10.85033893585205, "global_step": 155206, "epoch": 923} {"train_loss": -11.081608772277832, "global_step": 155207, "epoch": 923} {"train_loss": -10.94924545288086, "global_step": 155208, "epoch": 923} {"train_loss": -10.96297836303711, "global_step": 155209, "epoch": 923} {"train_loss": -11.034475326538086, "global_step": 155210, "epoch": 923} {"train_loss": -10.8663969039917, "global_step": 155211, "epoch": 923} {"train_loss": -11.058026313781738, "global_step": 155212, "epoch": 923} {"train_loss": -11.01562213897705, "global_step": 155213, "epoch": 923} {"train_loss": -10.693716049194336, "global_step": 155214, "epoch": 923} {"train_loss": -10.91630744934082, "global_step": 155215, "epoch": 923} {"train_loss": -10.82311725616455, "global_step": 155216, "epoch": 923} {"train_loss": -10.57846450805664, "global_step": 155217, "epoch": 923} {"train_loss": -10.844852447509766, "global_step": 155218, "epoch": 923} {"train_loss": -10.916467666625977, "global_step": 155219, "epoch": 923} {"train_loss": -11.019378662109375, "global_step": 155220, "epoch": 923} {"train_loss": -10.752254486083984, "global_step": 155221, "epoch": 923} {"train_loss": -10.878469467163086, "global_step": 155222, "epoch": 923} {"train_loss": -10.444734573364258, "global_step": 155223, "epoch": 923} {"train_loss": -10.834489822387695, "global_step": 155224, "epoch": 923} {"train_loss": -10.801076889038086, "global_step": 155225, "epoch": 923} {"train_loss": -10.536989212036133, "global_step": 155226, "epoch": 923} {"train_loss": -10.930334091186523, "global_step": 155227, "epoch": 923} {"train_loss": -10.61435317993164, "global_step": 155228, "epoch": 923} {"train_loss": -10.851306915283203, "global_step": 155229, "epoch": 923} {"train_loss": -11.013132095336914, "global_step": 155230, "epoch": 923} {"train_loss": -10.714845509756179, "global_step": 155231, "epoch": 923, "val_loss": 231033.3125} {"train_loss": -10.858098030090332, "global_step": 155232, "epoch": 924} {"train_loss": -10.878823280334473, "global_step": 155233, "epoch": 924} {"train_loss": -10.67978286743164, "global_step": 155234, "epoch": 924} {"train_loss": -10.845619201660156, "global_step": 155235, "epoch": 924} {"train_loss": -10.550957679748535, "global_step": 155236, "epoch": 924} {"train_loss": -10.95414924621582, "global_step": 155237, "epoch": 924} {"train_loss": -10.815107345581055, "global_step": 155238, "epoch": 924} {"train_loss": -10.701489448547363, "global_step": 155239, "epoch": 924} {"train_loss": -11.162664413452148, "global_step": 155240, "epoch": 924} {"train_loss": -10.644063949584961, "global_step": 155241, "epoch": 924} {"train_loss": -10.864948272705078, "global_step": 155242, "epoch": 924} {"train_loss": -10.775579452514648, "global_step": 155243, "epoch": 924} {"train_loss": -10.92827033996582, "global_step": 155244, "epoch": 924} {"train_loss": -10.533044815063477, "global_step": 155245, "epoch": 924} {"train_loss": -10.43649959564209, "global_step": 155246, "epoch": 924} {"train_loss": -10.307624816894531, "global_step": 155247, "epoch": 924} {"train_loss": -10.434560775756836, "global_step": 155248, "epoch": 924} {"train_loss": -10.548398971557617, "global_step": 155249, "epoch": 924} {"train_loss": -10.397296905517578, "global_step": 155250, "epoch": 924} {"train_loss": -10.669905662536621, "global_step": 155251, "epoch": 924} {"train_loss": -9.900650978088379, "global_step": 155252, "epoch": 924} {"train_loss": -10.867822647094727, "global_step": 155253, "epoch": 924} {"train_loss": -10.525192260742188, "global_step": 155254, "epoch": 924} {"train_loss": -10.817703247070312, "global_step": 155255, "epoch": 924} {"train_loss": -10.864860534667969, "global_step": 155256, "epoch": 924} {"train_loss": -10.535806655883789, "global_step": 155257, "epoch": 924} {"train_loss": -10.441011428833008, "global_step": 155258, "epoch": 924} {"train_loss": -10.564393997192383, "global_step": 155259, "epoch": 924} {"train_loss": -10.622434616088867, "global_step": 155260, "epoch": 924} {"train_loss": -10.644052505493164, "global_step": 155261, "epoch": 924} {"train_loss": -10.684728622436523, "global_step": 155262, "epoch": 924} {"train_loss": -10.837569236755371, "global_step": 155263, "epoch": 924} {"train_loss": -10.758657455444336, "global_step": 155264, "epoch": 924} {"train_loss": -10.901290893554688, "global_step": 155265, "epoch": 924} {"train_loss": -10.842697143554688, "global_step": 155266, "epoch": 924} {"train_loss": -10.837814331054688, "global_step": 155267, "epoch": 924} {"train_loss": -10.772819519042969, "global_step": 155268, "epoch": 924} {"train_loss": -10.881719589233398, "global_step": 155269, "epoch": 924} {"train_loss": -10.893379211425781, "global_step": 155270, "epoch": 924} {"train_loss": -11.027936935424805, "global_step": 155271, "epoch": 924} {"train_loss": -11.190691947937012, "global_step": 155272, "epoch": 924} {"train_loss": -10.906821250915527, "global_step": 155273, "epoch": 924} {"train_loss": -11.001996994018555, "global_step": 155274, "epoch": 924} {"train_loss": -10.960409164428711, "global_step": 155275, "epoch": 924} {"train_loss": -10.987905502319336, "global_step": 155276, "epoch": 924} {"train_loss": -11.21073055267334, "global_step": 155277, "epoch": 924} {"train_loss": -10.590707778930664, "global_step": 155278, "epoch": 924} {"train_loss": -11.082130432128906, "global_step": 155279, "epoch": 924} {"train_loss": -10.901851654052734, "global_step": 155280, "epoch": 924} {"train_loss": -10.864889144897461, "global_step": 155281, "epoch": 924} {"train_loss": -11.02093505859375, "global_step": 155282, "epoch": 924} {"train_loss": -10.95984935760498, "global_step": 155283, "epoch": 924} {"train_loss": -11.080638885498047, "global_step": 155284, "epoch": 924} {"train_loss": -10.88873291015625, "global_step": 155285, "epoch": 924} {"train_loss": -10.880867004394531, "global_step": 155286, "epoch": 924} {"train_loss": -11.232101440429688, "global_step": 155287, "epoch": 924} {"train_loss": -10.733976364135742, "global_step": 155288, "epoch": 924} {"train_loss": -11.088735580444336, "global_step": 155289, "epoch": 924} {"train_loss": -11.086566925048828, "global_step": 155290, "epoch": 924} {"train_loss": -11.407355308532715, "global_step": 155291, "epoch": 924} {"train_loss": -11.029226303100586, "global_step": 155292, "epoch": 924} {"train_loss": -10.656890869140625, "global_step": 155293, "epoch": 924} {"train_loss": -10.698033332824707, "global_step": 155294, "epoch": 924} {"train_loss": -10.867592811584473, "global_step": 155295, "epoch": 924} {"train_loss": -11.231260299682617, "global_step": 155296, "epoch": 924} {"train_loss": -10.895750999450684, "global_step": 155297, "epoch": 924} {"train_loss": -11.171341896057129, "global_step": 155298, "epoch": 924} {"train_loss": -10.739667892456055, "global_step": 155299, "epoch": 924} {"train_loss": -10.76811695098877, "global_step": 155300, "epoch": 924} {"train_loss": -11.258240699768066, "global_step": 155301, "epoch": 924} {"train_loss": -11.000703811645508, "global_step": 155302, "epoch": 924} {"train_loss": -11.031684875488281, "global_step": 155303, "epoch": 924} {"train_loss": -11.002243995666504, "global_step": 155304, "epoch": 924} {"train_loss": -11.274299621582031, "global_step": 155305, "epoch": 924} {"train_loss": -11.029935836791992, "global_step": 155306, "epoch": 924} {"train_loss": -10.928544998168945, "global_step": 155307, "epoch": 924} {"train_loss": -11.105045318603516, "global_step": 155308, "epoch": 924} {"train_loss": -10.821964263916016, "global_step": 155309, "epoch": 924} {"train_loss": -11.022416114807129, "global_step": 155310, "epoch": 924} {"train_loss": -10.412673950195312, "global_step": 155311, "epoch": 924} {"train_loss": -10.950838088989258, "global_step": 155312, "epoch": 924} {"train_loss": -10.553260803222656, "global_step": 155313, "epoch": 924} {"train_loss": -10.973894119262695, "global_step": 155314, "epoch": 924} {"train_loss": -10.814236640930176, "global_step": 155315, "epoch": 924} {"train_loss": -10.871217727661133, "global_step": 155316, "epoch": 924} {"train_loss": -10.870136260986328, "global_step": 155317, "epoch": 924} {"train_loss": -10.861283302307129, "global_step": 155318, "epoch": 924} {"train_loss": -10.829103469848633, "global_step": 155319, "epoch": 924} {"train_loss": -10.722797393798828, "global_step": 155320, "epoch": 924} {"train_loss": -10.98706340789795, "global_step": 155321, "epoch": 924} {"train_loss": -10.83874797821045, "global_step": 155322, "epoch": 924} {"train_loss": -10.79737663269043, "global_step": 155323, "epoch": 924} {"train_loss": -10.662935256958008, "global_step": 155324, "epoch": 924} {"train_loss": -10.887155532836914, "global_step": 155325, "epoch": 924} {"train_loss": -10.500736236572266, "global_step": 155326, "epoch": 924} {"train_loss": -10.750381469726562, "global_step": 155327, "epoch": 924} {"train_loss": -10.999307632446289, "global_step": 155328, "epoch": 924} {"train_loss": -10.198508262634277, "global_step": 155329, "epoch": 924} {"train_loss": -10.547842025756836, "global_step": 155330, "epoch": 924} {"train_loss": -10.711709022521973, "global_step": 155331, "epoch": 924} {"train_loss": -10.412938117980957, "global_step": 155332, "epoch": 924} {"train_loss": -10.319477081298828, "global_step": 155333, "epoch": 924} {"train_loss": -10.837617874145508, "global_step": 155334, "epoch": 924} {"train_loss": -9.726991653442383, "global_step": 155335, "epoch": 924} {"train_loss": -10.682003021240234, "global_step": 155336, "epoch": 924} {"train_loss": -10.624309539794922, "global_step": 155337, "epoch": 924} {"train_loss": -10.344343185424805, "global_step": 155338, "epoch": 924} {"train_loss": -11.043188095092773, "global_step": 155339, "epoch": 924} {"train_loss": -10.597761154174805, "global_step": 155340, "epoch": 924} {"train_loss": -10.947687149047852, "global_step": 155341, "epoch": 924} {"train_loss": -10.774320602416992, "global_step": 155342, "epoch": 924} {"train_loss": -10.414546966552734, "global_step": 155343, "epoch": 924} {"train_loss": -10.556739807128906, "global_step": 155344, "epoch": 924} {"train_loss": -10.304969787597656, "global_step": 155345, "epoch": 924} {"train_loss": -10.590353965759277, "global_step": 155346, "epoch": 924} {"train_loss": -10.053810119628906, "global_step": 155347, "epoch": 924} {"train_loss": -10.963642120361328, "global_step": 155348, "epoch": 924} {"train_loss": -10.154513359069824, "global_step": 155349, "epoch": 924} {"train_loss": -10.664385795593262, "global_step": 155350, "epoch": 924} {"train_loss": -10.364173889160156, "global_step": 155351, "epoch": 924} {"train_loss": -10.385875701904297, "global_step": 155352, "epoch": 924} {"train_loss": -10.348217010498047, "global_step": 155353, "epoch": 924} {"train_loss": -10.568355560302734, "global_step": 155354, "epoch": 924} {"train_loss": -10.778556823730469, "global_step": 155355, "epoch": 924} {"train_loss": -10.6224365234375, "global_step": 155356, "epoch": 924} {"train_loss": -10.72597885131836, "global_step": 155357, "epoch": 924} {"train_loss": -10.521596908569336, "global_step": 155358, "epoch": 924} {"train_loss": -10.667486190795898, "global_step": 155359, "epoch": 924} {"train_loss": -10.759883880615234, "global_step": 155360, "epoch": 924} {"train_loss": -10.839364051818848, "global_step": 155361, "epoch": 924} {"train_loss": -10.800546646118164, "global_step": 155362, "epoch": 924} {"train_loss": -10.652885437011719, "global_step": 155363, "epoch": 924} {"train_loss": -10.71810245513916, "global_step": 155364, "epoch": 924} {"train_loss": -10.874457359313965, "global_step": 155365, "epoch": 924} {"train_loss": -10.79823112487793, "global_step": 155366, "epoch": 924} {"train_loss": -10.959880828857422, "global_step": 155367, "epoch": 924} {"train_loss": -10.662479400634766, "global_step": 155368, "epoch": 924} {"train_loss": -10.997644424438477, "global_step": 155369, "epoch": 924} {"train_loss": -10.887866973876953, "global_step": 155370, "epoch": 924} {"train_loss": -10.724544525146484, "global_step": 155371, "epoch": 924} {"train_loss": -10.561129570007324, "global_step": 155372, "epoch": 924} {"train_loss": -10.819124221801758, "global_step": 155373, "epoch": 924} {"train_loss": -10.902209281921387, "global_step": 155374, "epoch": 924} {"train_loss": -10.578258514404297, "global_step": 155375, "epoch": 924} {"train_loss": -10.820348739624023, "global_step": 155376, "epoch": 924} {"train_loss": -10.921773910522461, "global_step": 155377, "epoch": 924} {"train_loss": -10.85737419128418, "global_step": 155378, "epoch": 924} {"train_loss": -10.908842086791992, "global_step": 155379, "epoch": 924} {"train_loss": -10.468428611755371, "global_step": 155380, "epoch": 924} {"train_loss": -10.867559432983398, "global_step": 155381, "epoch": 924} {"train_loss": -10.704280853271484, "global_step": 155382, "epoch": 924} {"train_loss": -10.81318473815918, "global_step": 155383, "epoch": 924} {"train_loss": -10.943710327148438, "global_step": 155384, "epoch": 924} {"train_loss": -10.757942199707031, "global_step": 155385, "epoch": 924} {"train_loss": -10.949539184570312, "global_step": 155386, "epoch": 924} {"train_loss": -10.474124908447266, "global_step": 155387, "epoch": 924} {"train_loss": -10.999699592590332, "global_step": 155388, "epoch": 924} {"train_loss": -10.592508316040039, "global_step": 155389, "epoch": 924} {"train_loss": -10.967639923095703, "global_step": 155390, "epoch": 924} {"train_loss": -10.992387771606445, "global_step": 155391, "epoch": 924} {"train_loss": -10.234737396240234, "global_step": 155392, "epoch": 924} {"train_loss": -10.970460891723633, "global_step": 155393, "epoch": 924} {"train_loss": -10.712069511413574, "global_step": 155394, "epoch": 924} {"train_loss": -10.401784896850586, "global_step": 155395, "epoch": 924} {"train_loss": -10.97223949432373, "global_step": 155396, "epoch": 924} {"train_loss": -10.616470336914062, "global_step": 155397, "epoch": 924} {"train_loss": -10.827629089355469, "global_step": 155398, "epoch": 924} {"train_loss": -10.765550164949326, "global_step": 155399, "epoch": 924, "val_loss": 230141.65625} {"train_loss": -10.964868545532227, "global_step": 155400, "epoch": 925} {"train_loss": -10.959327697753906, "global_step": 155401, "epoch": 925} {"train_loss": -10.8026762008667, "global_step": 155402, "epoch": 925} {"train_loss": -11.278724670410156, "global_step": 155403, "epoch": 925} {"train_loss": -10.770061492919922, "global_step": 155404, "epoch": 925} {"train_loss": -10.750367164611816, "global_step": 155405, "epoch": 925} {"train_loss": -10.813283920288086, "global_step": 155406, "epoch": 925} {"train_loss": -10.287612915039062, "global_step": 155407, "epoch": 925} {"train_loss": -10.348808288574219, "global_step": 155408, "epoch": 925} {"train_loss": -10.568071365356445, "global_step": 155409, "epoch": 925} {"train_loss": -10.26082992553711, "global_step": 155410, "epoch": 925} {"train_loss": -10.52228832244873, "global_step": 155411, "epoch": 925} {"train_loss": -10.547513961791992, "global_step": 155412, "epoch": 925} {"train_loss": -10.289345741271973, "global_step": 155413, "epoch": 925} {"train_loss": -10.453907012939453, "global_step": 155414, "epoch": 925} {"train_loss": -9.947286605834961, "global_step": 155415, "epoch": 925} {"train_loss": -10.200323104858398, "global_step": 155416, "epoch": 925} {"train_loss": -10.819999694824219, "global_step": 155417, "epoch": 925} {"train_loss": -10.298315048217773, "global_step": 155418, "epoch": 925} {"train_loss": -10.879936218261719, "global_step": 155419, "epoch": 925} {"train_loss": -10.375248908996582, "global_step": 155420, "epoch": 925} {"train_loss": -10.599055290222168, "global_step": 155421, "epoch": 925} {"train_loss": -10.420796394348145, "global_step": 155422, "epoch": 925} {"train_loss": -10.911687850952148, "global_step": 155423, "epoch": 925} {"train_loss": -10.71524429321289, "global_step": 155424, "epoch": 925} {"train_loss": -10.828546524047852, "global_step": 155425, "epoch": 925} {"train_loss": -10.696273803710938, "global_step": 155426, "epoch": 925} {"train_loss": -10.684749603271484, "global_step": 155427, "epoch": 925} {"train_loss": -10.841485977172852, "global_step": 155428, "epoch": 925} {"train_loss": -10.883692741394043, "global_step": 155429, "epoch": 925} {"train_loss": -10.571945190429688, "global_step": 155430, "epoch": 925} {"train_loss": -10.800289154052734, "global_step": 155431, "epoch": 925} {"train_loss": -10.627692222595215, "global_step": 155432, "epoch": 925} {"train_loss": -11.033707618713379, "global_step": 155433, "epoch": 925} {"train_loss": -10.731144905090332, "global_step": 155434, "epoch": 925} {"train_loss": -11.092090606689453, "global_step": 155435, "epoch": 925} {"train_loss": -10.592561721801758, "global_step": 155436, "epoch": 925} {"train_loss": -11.009713172912598, "global_step": 155437, "epoch": 925} {"train_loss": -10.94882869720459, "global_step": 155438, "epoch": 925} {"train_loss": -11.153572082519531, "global_step": 155439, "epoch": 925} {"train_loss": -10.861621856689453, "global_step": 155440, "epoch": 925} {"train_loss": -11.175729751586914, "global_step": 155441, "epoch": 925} {"train_loss": -10.963400840759277, "global_step": 155442, "epoch": 925} {"train_loss": -10.98894214630127, "global_step": 155443, "epoch": 925} {"train_loss": -11.011749267578125, "global_step": 155444, "epoch": 925} {"train_loss": -10.916906356811523, "global_step": 155445, "epoch": 925} {"train_loss": -10.964847564697266, "global_step": 155446, "epoch": 925} {"train_loss": -10.670454025268555, "global_step": 155447, "epoch": 925} {"train_loss": -10.856613159179688, "global_step": 155448, "epoch": 925} {"train_loss": -10.882543563842773, "global_step": 155449, "epoch": 925} {"train_loss": -10.70707893371582, "global_step": 155450, "epoch": 925} {"train_loss": -11.125123977661133, "global_step": 155451, "epoch": 925} {"train_loss": -10.726570129394531, "global_step": 155452, "epoch": 925} {"train_loss": -10.82573127746582, "global_step": 155453, "epoch": 925} {"train_loss": -11.040961265563965, "global_step": 155454, "epoch": 925} {"train_loss": -10.994453430175781, "global_step": 155455, "epoch": 925} {"train_loss": -10.911794662475586, "global_step": 155456, "epoch": 925} {"train_loss": -10.964080810546875, "global_step": 155457, "epoch": 925} {"train_loss": -10.95622730255127, "global_step": 155458, "epoch": 925} {"train_loss": -11.032644271850586, "global_step": 155459, "epoch": 925} {"train_loss": -10.867015838623047, "global_step": 155460, "epoch": 925} {"train_loss": -10.54541301727295, "global_step": 155461, "epoch": 925} {"train_loss": -10.309551239013672, "global_step": 155462, "epoch": 925} {"train_loss": -10.833629608154297, "global_step": 155463, "epoch": 925} {"train_loss": -10.36528205871582, "global_step": 155464, "epoch": 925} {"train_loss": -10.912557601928711, "global_step": 155465, "epoch": 925} {"train_loss": -10.585351943969727, "global_step": 155466, "epoch": 925} {"train_loss": -11.161809921264648, "global_step": 155467, "epoch": 925} {"train_loss": -10.318658828735352, "global_step": 155468, "epoch": 925} {"train_loss": -10.588214874267578, "global_step": 155469, "epoch": 925} {"train_loss": -10.663101196289062, "global_step": 155470, "epoch": 925} {"train_loss": -10.421707153320312, "global_step": 155471, "epoch": 925} {"train_loss": -10.792348861694336, "global_step": 155472, "epoch": 925} {"train_loss": -9.745738983154297, "global_step": 155473, "epoch": 925} {"train_loss": -10.722329139709473, "global_step": 155474, "epoch": 925} {"train_loss": -10.302391052246094, "global_step": 155475, "epoch": 925} {"train_loss": -10.60162353515625, "global_step": 155476, "epoch": 925} {"train_loss": -10.688871383666992, "global_step": 155477, "epoch": 925} {"train_loss": -10.862080574035645, "global_step": 155478, "epoch": 925} {"train_loss": -10.560752868652344, "global_step": 155479, "epoch": 925} {"train_loss": -10.581313133239746, "global_step": 155480, "epoch": 925} {"train_loss": -10.753484725952148, "global_step": 155481, "epoch": 925} {"train_loss": -10.619857788085938, "global_step": 155482, "epoch": 925} {"train_loss": -10.550613403320312, "global_step": 155483, "epoch": 925} {"train_loss": -10.905106544494629, "global_step": 155484, "epoch": 925} {"train_loss": -10.461542129516602, "global_step": 155485, "epoch": 925} {"train_loss": -10.93966007232666, "global_step": 155486, "epoch": 925} {"train_loss": -10.66514778137207, "global_step": 155487, "epoch": 925} {"train_loss": -10.782020568847656, "global_step": 155488, "epoch": 925} {"train_loss": -10.877346992492676, "global_step": 155489, "epoch": 925} {"train_loss": -10.781442642211914, "global_step": 155490, "epoch": 925} {"train_loss": -10.793863296508789, "global_step": 155491, "epoch": 925} {"train_loss": -10.26559066772461, "global_step": 155492, "epoch": 925} {"train_loss": -10.775915145874023, "global_step": 155493, "epoch": 925} {"train_loss": -10.922719955444336, "global_step": 155494, "epoch": 925} {"train_loss": -10.820544242858887, "global_step": 155495, "epoch": 925} {"train_loss": -10.909599304199219, "global_step": 155496, "epoch": 925} {"train_loss": -10.754688262939453, "global_step": 155497, "epoch": 925} {"train_loss": -10.814953804016113, "global_step": 155498, "epoch": 925} {"train_loss": -10.771455764770508, "global_step": 155499, "epoch": 925} {"train_loss": -10.97239875793457, "global_step": 155500, "epoch": 925} {"train_loss": -10.828944206237793, "global_step": 155501, "epoch": 925} {"train_loss": -10.846117973327637, "global_step": 155502, "epoch": 925} {"train_loss": -10.607147216796875, "global_step": 155503, "epoch": 925} {"train_loss": -11.023720741271973, "global_step": 155504, "epoch": 925} {"train_loss": -10.709980964660645, "global_step": 155505, "epoch": 925} {"train_loss": -10.832145690917969, "global_step": 155506, "epoch": 925} {"train_loss": -10.462392807006836, "global_step": 155507, "epoch": 925} {"train_loss": -10.915528297424316, "global_step": 155508, "epoch": 925} {"train_loss": -10.720155715942383, "global_step": 155509, "epoch": 925} {"train_loss": -10.485939025878906, "global_step": 155510, "epoch": 925} {"train_loss": -10.914339065551758, "global_step": 155511, "epoch": 925} {"train_loss": -10.449987411499023, "global_step": 155512, "epoch": 925} {"train_loss": -10.570745468139648, "global_step": 155513, "epoch": 925} {"train_loss": -10.261842727661133, "global_step": 155514, "epoch": 925} {"train_loss": -10.703882217407227, "global_step": 155515, "epoch": 925} {"train_loss": -10.706657409667969, "global_step": 155516, "epoch": 925} {"train_loss": -10.2801513671875, "global_step": 155517, "epoch": 925} {"train_loss": -10.945552825927734, "global_step": 155518, "epoch": 925} {"train_loss": -10.588007926940918, "global_step": 155519, "epoch": 925} {"train_loss": -10.582491874694824, "global_step": 155520, "epoch": 925} {"train_loss": -10.868732452392578, "global_step": 155521, "epoch": 925} {"train_loss": -10.112960815429688, "global_step": 155522, "epoch": 925} {"train_loss": -10.993103981018066, "global_step": 155523, "epoch": 925} {"train_loss": -10.389688491821289, "global_step": 155524, "epoch": 925} {"train_loss": -10.671207427978516, "global_step": 155525, "epoch": 925} {"train_loss": -11.060065269470215, "global_step": 155526, "epoch": 925} {"train_loss": -10.459770202636719, "global_step": 155527, "epoch": 925} {"train_loss": -10.79796028137207, "global_step": 155528, "epoch": 925} {"train_loss": -10.547279357910156, "global_step": 155529, "epoch": 925} {"train_loss": -10.655790328979492, "global_step": 155530, "epoch": 925} {"train_loss": -10.701578140258789, "global_step": 155531, "epoch": 925} {"train_loss": -10.327945709228516, "global_step": 155532, "epoch": 925} {"train_loss": -10.289970397949219, "global_step": 155533, "epoch": 925} {"train_loss": -10.337968826293945, "global_step": 155534, "epoch": 925} {"train_loss": -10.161612510681152, "global_step": 155535, "epoch": 925} {"train_loss": -10.72639274597168, "global_step": 155536, "epoch": 925} {"train_loss": -9.683781623840332, "global_step": 155537, "epoch": 925} {"train_loss": -10.857765197753906, "global_step": 155538, "epoch": 925} {"train_loss": -10.226089477539062, "global_step": 155539, "epoch": 925} {"train_loss": -10.68215560913086, "global_step": 155540, "epoch": 925} {"train_loss": -10.358302116394043, "global_step": 155541, "epoch": 925} {"train_loss": -10.143892288208008, "global_step": 155542, "epoch": 925} {"train_loss": -10.660333633422852, "global_step": 155543, "epoch": 925} {"train_loss": -10.103368759155273, "global_step": 155544, "epoch": 925} {"train_loss": -10.638261795043945, "global_step": 155545, "epoch": 925} {"train_loss": -10.752603530883789, "global_step": 155546, "epoch": 925} {"train_loss": -10.288288116455078, "global_step": 155547, "epoch": 925} {"train_loss": -10.919655799865723, "global_step": 155548, "epoch": 925} {"train_loss": -10.333091735839844, "global_step": 155549, "epoch": 925} {"train_loss": -10.58096694946289, "global_step": 155550, "epoch": 925} {"train_loss": -10.460155487060547, "global_step": 155551, "epoch": 925} {"train_loss": -10.703581809997559, "global_step": 155552, "epoch": 925} {"train_loss": -10.722359657287598, "global_step": 155553, "epoch": 925} {"train_loss": -10.574195861816406, "global_step": 155554, "epoch": 925} {"train_loss": -10.768104553222656, "global_step": 155555, "epoch": 925} {"train_loss": -10.858525276184082, "global_step": 155556, "epoch": 925} {"train_loss": -10.66714096069336, "global_step": 155557, "epoch": 925} {"train_loss": -10.898153305053711, "global_step": 155558, "epoch": 925} {"train_loss": -10.447696685791016, "global_step": 155559, "epoch": 925} {"train_loss": -10.60073184967041, "global_step": 155560, "epoch": 925} {"train_loss": -10.810884475708008, "global_step": 155561, "epoch": 925} {"train_loss": -10.435287475585938, "global_step": 155562, "epoch": 925} {"train_loss": -11.048177719116211, "global_step": 155563, "epoch": 925} {"train_loss": -10.249122619628906, "global_step": 155564, "epoch": 925} {"train_loss": -10.894674301147461, "global_step": 155565, "epoch": 925} {"train_loss": -10.723088264465332, "global_step": 155566, "epoch": 925} {"train_loss": -10.67634554136367, "global_step": 155567, "epoch": 925, "val_loss": 232564.171875, "train_action_mse_error": 1.442600965499878} {"train_loss": -10.787985801696777, "global_step": 155568, "epoch": 926} {"train_loss": -10.627937316894531, "global_step": 155569, "epoch": 926} {"train_loss": -10.960567474365234, "global_step": 155570, "epoch": 926} {"train_loss": -10.4208402633667, "global_step": 155571, "epoch": 926} {"train_loss": -10.904150009155273, "global_step": 155572, "epoch": 926} {"train_loss": -10.528560638427734, "global_step": 155573, "epoch": 926} {"train_loss": -11.118581771850586, "global_step": 155574, "epoch": 926} {"train_loss": -11.115690231323242, "global_step": 155575, "epoch": 926} {"train_loss": -10.821584701538086, "global_step": 155576, "epoch": 926} {"train_loss": -10.912925720214844, "global_step": 155577, "epoch": 926} {"train_loss": -10.786012649536133, "global_step": 155578, "epoch": 926} {"train_loss": -11.138422012329102, "global_step": 155579, "epoch": 926} {"train_loss": -11.025035858154297, "global_step": 155580, "epoch": 926} {"train_loss": -10.917095184326172, "global_step": 155581, "epoch": 926} {"train_loss": -10.90023422241211, "global_step": 155582, "epoch": 926} {"train_loss": -10.939332962036133, "global_step": 155583, "epoch": 926} {"train_loss": -10.80120849609375, "global_step": 155584, "epoch": 926} {"train_loss": -11.064901351928711, "global_step": 155585, "epoch": 926} {"train_loss": -10.939065933227539, "global_step": 155586, "epoch": 926} {"train_loss": -11.063363075256348, "global_step": 155587, "epoch": 926} {"train_loss": -10.971654891967773, "global_step": 155588, "epoch": 926} {"train_loss": -11.162618637084961, "global_step": 155589, "epoch": 926} {"train_loss": -11.1268310546875, "global_step": 155590, "epoch": 926} {"train_loss": -11.212182998657227, "global_step": 155591, "epoch": 926} {"train_loss": -11.162216186523438, "global_step": 155592, "epoch": 926} {"train_loss": -10.941028594970703, "global_step": 155593, "epoch": 926} {"train_loss": -10.981084823608398, "global_step": 155594, "epoch": 926} {"train_loss": -11.085295677185059, "global_step": 155595, "epoch": 926} {"train_loss": -11.229974746704102, "global_step": 155596, "epoch": 926} {"train_loss": -10.996862411499023, "global_step": 155597, "epoch": 926} {"train_loss": -11.223442077636719, "global_step": 155598, "epoch": 926} {"train_loss": -11.034738540649414, "global_step": 155599, "epoch": 926} {"train_loss": -10.923592567443848, "global_step": 155600, "epoch": 926} {"train_loss": -10.753297805786133, "global_step": 155601, "epoch": 926} {"train_loss": -10.920888900756836, "global_step": 155602, "epoch": 926} {"train_loss": -10.445191383361816, "global_step": 155603, "epoch": 926} {"train_loss": -10.811504364013672, "global_step": 155604, "epoch": 926} {"train_loss": -11.032182693481445, "global_step": 155605, "epoch": 926} {"train_loss": -10.812907218933105, "global_step": 155606, "epoch": 926} {"train_loss": -10.317743301391602, "global_step": 155607, "epoch": 926} {"train_loss": -10.935559272766113, "global_step": 155608, "epoch": 926} {"train_loss": -10.382427215576172, "global_step": 155609, "epoch": 926} {"train_loss": -9.313203811645508, "global_step": 155610, "epoch": 926} {"train_loss": -10.760030746459961, "global_step": 155611, "epoch": 926} {"train_loss": -10.233497619628906, "global_step": 155612, "epoch": 926} {"train_loss": -9.915040969848633, "global_step": 155613, "epoch": 926} {"train_loss": -10.729467391967773, "global_step": 155614, "epoch": 926} {"train_loss": -10.135746955871582, "global_step": 155615, "epoch": 926} {"train_loss": -10.5466947555542, "global_step": 155616, "epoch": 926} {"train_loss": -10.45228099822998, "global_step": 155617, "epoch": 926} {"train_loss": -10.378942489624023, "global_step": 155618, "epoch": 926} {"train_loss": -10.581101417541504, "global_step": 155619, "epoch": 926} {"train_loss": -10.477813720703125, "global_step": 155620, "epoch": 926} {"train_loss": -10.673593521118164, "global_step": 155621, "epoch": 926} {"train_loss": -10.501107215881348, "global_step": 155622, "epoch": 926} {"train_loss": -10.78105354309082, "global_step": 155623, "epoch": 926} {"train_loss": -10.57707405090332, "global_step": 155624, "epoch": 926} {"train_loss": -10.613363265991211, "global_step": 155625, "epoch": 926} {"train_loss": -10.722879409790039, "global_step": 155626, "epoch": 926} {"train_loss": -10.46855354309082, "global_step": 155627, "epoch": 926} {"train_loss": -10.926742553710938, "global_step": 155628, "epoch": 926} {"train_loss": -10.447317123413086, "global_step": 155629, "epoch": 926} {"train_loss": -10.896757125854492, "global_step": 155630, "epoch": 926} {"train_loss": -10.136246681213379, "global_step": 155631, "epoch": 926} {"train_loss": -10.429351806640625, "global_step": 155632, "epoch": 926} {"train_loss": -10.772115707397461, "global_step": 155633, "epoch": 926} {"train_loss": -10.363174438476562, "global_step": 155634, "epoch": 926} {"train_loss": -10.75279712677002, "global_step": 155635, "epoch": 926} {"train_loss": -10.236879348754883, "global_step": 155636, "epoch": 926} {"train_loss": -10.850436210632324, "global_step": 155637, "epoch": 926} {"train_loss": -10.278200149536133, "global_step": 155638, "epoch": 926} {"train_loss": -10.432927131652832, "global_step": 155639, "epoch": 926} {"train_loss": -10.64213752746582, "global_step": 155640, "epoch": 926} {"train_loss": -10.496016502380371, "global_step": 155641, "epoch": 926} {"train_loss": -10.78068733215332, "global_step": 155642, "epoch": 926} {"train_loss": -10.973844528198242, "global_step": 155643, "epoch": 926} {"train_loss": -10.52120590209961, "global_step": 155644, "epoch": 926} {"train_loss": -10.802225112915039, "global_step": 155645, "epoch": 926} {"train_loss": -10.596585273742676, "global_step": 155646, "epoch": 926} {"train_loss": -10.97603988647461, "global_step": 155647, "epoch": 926} {"train_loss": -10.566499710083008, "global_step": 155648, "epoch": 926} {"train_loss": -10.692501068115234, "global_step": 155649, "epoch": 926} {"train_loss": -10.504671096801758, "global_step": 155650, "epoch": 926} {"train_loss": -10.860427856445312, "global_step": 155651, "epoch": 926} {"train_loss": -10.52773666381836, "global_step": 155652, "epoch": 926} {"train_loss": -11.189882278442383, "global_step": 155653, "epoch": 926} {"train_loss": -10.821283340454102, "global_step": 155654, "epoch": 926} {"train_loss": -11.016613960266113, "global_step": 155655, "epoch": 926} {"train_loss": -10.733266830444336, "global_step": 155656, "epoch": 926} {"train_loss": -10.636229515075684, "global_step": 155657, "epoch": 926} {"train_loss": -10.62150764465332, "global_step": 155658, "epoch": 926} {"train_loss": -10.750547409057617, "global_step": 155659, "epoch": 926} {"train_loss": -11.103866577148438, "global_step": 155660, "epoch": 926} {"train_loss": -11.004556655883789, "global_step": 155661, "epoch": 926} {"train_loss": -11.137924194335938, "global_step": 155662, "epoch": 926} {"train_loss": -11.0198392868042, "global_step": 155663, "epoch": 926} {"train_loss": -11.17890739440918, "global_step": 155664, "epoch": 926} {"train_loss": -10.847967147827148, "global_step": 155665, "epoch": 926} {"train_loss": -11.176362991333008, "global_step": 155666, "epoch": 926} {"train_loss": -11.063921928405762, "global_step": 155667, "epoch": 926} {"train_loss": -11.038235664367676, "global_step": 155668, "epoch": 926} {"train_loss": -10.817434310913086, "global_step": 155669, "epoch": 926} {"train_loss": -10.91319465637207, "global_step": 155670, "epoch": 926} {"train_loss": -10.858505249023438, "global_step": 155671, "epoch": 926} {"train_loss": -10.940193176269531, "global_step": 155672, "epoch": 926} {"train_loss": -10.750541687011719, "global_step": 155673, "epoch": 926} {"train_loss": -10.57750415802002, "global_step": 155674, "epoch": 926} {"train_loss": -10.914388656616211, "global_step": 155675, "epoch": 926} {"train_loss": -10.517696380615234, "global_step": 155676, "epoch": 926} {"train_loss": -10.618913650512695, "global_step": 155677, "epoch": 926} {"train_loss": -10.792901992797852, "global_step": 155678, "epoch": 926} {"train_loss": -10.593694686889648, "global_step": 155679, "epoch": 926} {"train_loss": -10.694652557373047, "global_step": 155680, "epoch": 926} {"train_loss": -10.635638236999512, "global_step": 155681, "epoch": 926} {"train_loss": -10.93370246887207, "global_step": 155682, "epoch": 926} {"train_loss": -10.69713306427002, "global_step": 155683, "epoch": 926} {"train_loss": -10.900535583496094, "global_step": 155684, "epoch": 926} {"train_loss": -10.252522468566895, "global_step": 155685, "epoch": 926} {"train_loss": -10.127631187438965, "global_step": 155686, "epoch": 926} {"train_loss": -10.180351257324219, "global_step": 155687, "epoch": 926} {"train_loss": -10.665918350219727, "global_step": 155688, "epoch": 926} {"train_loss": -9.244089126586914, "global_step": 155689, "epoch": 926} {"train_loss": -10.607409477233887, "global_step": 155690, "epoch": 926} {"train_loss": -10.308399200439453, "global_step": 155691, "epoch": 926} {"train_loss": -10.631523132324219, "global_step": 155692, "epoch": 926} {"train_loss": -10.315788269042969, "global_step": 155693, "epoch": 926} {"train_loss": -10.332573890686035, "global_step": 155694, "epoch": 926} {"train_loss": -10.505511283874512, "global_step": 155695, "epoch": 926} {"train_loss": -10.72308349609375, "global_step": 155696, "epoch": 926} {"train_loss": -10.568463325500488, "global_step": 155697, "epoch": 926} {"train_loss": -10.644111633300781, "global_step": 155698, "epoch": 926} {"train_loss": -10.295787811279297, "global_step": 155699, "epoch": 926} {"train_loss": -10.622812271118164, "global_step": 155700, "epoch": 926} {"train_loss": -10.79037857055664, "global_step": 155701, "epoch": 926} {"train_loss": -10.420174598693848, "global_step": 155702, "epoch": 926} {"train_loss": -10.6947021484375, "global_step": 155703, "epoch": 926} {"train_loss": -10.57540512084961, "global_step": 155704, "epoch": 926} {"train_loss": -10.643898010253906, "global_step": 155705, "epoch": 926} {"train_loss": -10.79999828338623, "global_step": 155706, "epoch": 926} {"train_loss": -10.692628860473633, "global_step": 155707, "epoch": 926} {"train_loss": -10.452424049377441, "global_step": 155708, "epoch": 926} {"train_loss": -10.544239044189453, "global_step": 155709, "epoch": 926} {"train_loss": -10.967527389526367, "global_step": 155710, "epoch": 926} {"train_loss": -10.66389274597168, "global_step": 155711, "epoch": 926} {"train_loss": -10.817075729370117, "global_step": 155712, "epoch": 926} {"train_loss": -10.62794303894043, "global_step": 155713, "epoch": 926} {"train_loss": -10.594521522521973, "global_step": 155714, "epoch": 926} {"train_loss": -11.009112358093262, "global_step": 155715, "epoch": 926} {"train_loss": -10.364171028137207, "global_step": 155716, "epoch": 926} {"train_loss": -10.857062339782715, "global_step": 155717, "epoch": 926} {"train_loss": -10.500577926635742, "global_step": 155718, "epoch": 926} {"train_loss": -10.729894638061523, "global_step": 155719, "epoch": 926} {"train_loss": -10.8084135055542, "global_step": 155720, "epoch": 926} {"train_loss": -10.960536003112793, "global_step": 155721, "epoch": 926} {"train_loss": -10.872476577758789, "global_step": 155722, "epoch": 926} {"train_loss": -10.871850967407227, "global_step": 155723, "epoch": 926} {"train_loss": -11.166306495666504, "global_step": 155724, "epoch": 926} {"train_loss": -10.828080177307129, "global_step": 155725, "epoch": 926} {"train_loss": -11.007013320922852, "global_step": 155726, "epoch": 926} {"train_loss": -10.937530517578125, "global_step": 155727, "epoch": 926} {"train_loss": -11.002729415893555, "global_step": 155728, "epoch": 926} {"train_loss": -11.01960563659668, "global_step": 155729, "epoch": 926} {"train_loss": -11.07601547241211, "global_step": 155730, "epoch": 926} {"train_loss": -10.930841445922852, "global_step": 155731, "epoch": 926} {"train_loss": -11.05612564086914, "global_step": 155732, "epoch": 926} {"train_loss": -11.065556526184082, "global_step": 155733, "epoch": 926} {"train_loss": -11.072484970092773, "global_step": 155734, "epoch": 926} {"train_loss": -10.735158982731047, "global_step": 155735, "epoch": 926, "val_loss": 233122.390625} {"train_loss": -11.00833511352539, "global_step": 155736, "epoch": 927} {"train_loss": -11.2234468460083, "global_step": 155737, "epoch": 927} {"train_loss": -11.00512409210205, "global_step": 155738, "epoch": 927} {"train_loss": -11.090167999267578, "global_step": 155739, "epoch": 927} {"train_loss": -11.02286434173584, "global_step": 155740, "epoch": 927} {"train_loss": -11.1111478805542, "global_step": 155741, "epoch": 927} {"train_loss": -11.093818664550781, "global_step": 155742, "epoch": 927} {"train_loss": -11.026880264282227, "global_step": 155743, "epoch": 927} {"train_loss": -11.171627044677734, "global_step": 155744, "epoch": 927} {"train_loss": -11.077330589294434, "global_step": 155745, "epoch": 927} {"train_loss": -11.236647605895996, "global_step": 155746, "epoch": 927} {"train_loss": -11.11473274230957, "global_step": 155747, "epoch": 927} {"train_loss": -11.013274192810059, "global_step": 155748, "epoch": 927} {"train_loss": -10.966651916503906, "global_step": 155749, "epoch": 927} {"train_loss": -10.945390701293945, "global_step": 155750, "epoch": 927} {"train_loss": -11.147684097290039, "global_step": 155751, "epoch": 927} {"train_loss": -11.048828125, "global_step": 155752, "epoch": 927} {"train_loss": -10.896240234375, "global_step": 155753, "epoch": 927} {"train_loss": -10.584823608398438, "global_step": 155754, "epoch": 927} {"train_loss": -10.825977325439453, "global_step": 155755, "epoch": 927} {"train_loss": -10.896961212158203, "global_step": 155756, "epoch": 927} {"train_loss": -11.15340805053711, "global_step": 155757, "epoch": 927} {"train_loss": -10.785865783691406, "global_step": 155758, "epoch": 927} {"train_loss": -10.178062438964844, "global_step": 155759, "epoch": 927} {"train_loss": -10.740297317504883, "global_step": 155760, "epoch": 927} {"train_loss": -10.694356918334961, "global_step": 155761, "epoch": 927} {"train_loss": -9.699637413024902, "global_step": 155762, "epoch": 927} {"train_loss": -10.938472747802734, "global_step": 155763, "epoch": 927} {"train_loss": -10.29593276977539, "global_step": 155764, "epoch": 927} {"train_loss": -10.472978591918945, "global_step": 155765, "epoch": 927} {"train_loss": -10.537040710449219, "global_step": 155766, "epoch": 927} {"train_loss": -10.475896835327148, "global_step": 155767, "epoch": 927} {"train_loss": -10.832257270812988, "global_step": 155768, "epoch": 927} {"train_loss": -10.198188781738281, "global_step": 155769, "epoch": 927} {"train_loss": -11.0174560546875, "global_step": 155770, "epoch": 927} {"train_loss": -10.647059440612793, "global_step": 155771, "epoch": 927} {"train_loss": -10.541004180908203, "global_step": 155772, "epoch": 927} {"train_loss": -10.460451126098633, "global_step": 155773, "epoch": 927} {"train_loss": -10.718883514404297, "global_step": 155774, "epoch": 927} {"train_loss": -10.236000061035156, "global_step": 155775, "epoch": 927} {"train_loss": -10.783002853393555, "global_step": 155776, "epoch": 927} {"train_loss": -10.664440155029297, "global_step": 155777, "epoch": 927} {"train_loss": -10.83489990234375, "global_step": 155778, "epoch": 927} {"train_loss": -10.800569534301758, "global_step": 155779, "epoch": 927} {"train_loss": -10.467660903930664, "global_step": 155780, "epoch": 927} {"train_loss": -10.722002029418945, "global_step": 155781, "epoch": 927} {"train_loss": -10.891871452331543, "global_step": 155782, "epoch": 927} {"train_loss": -10.363275527954102, "global_step": 155783, "epoch": 927} {"train_loss": -10.757064819335938, "global_step": 155784, "epoch": 927} {"train_loss": -10.876492500305176, "global_step": 155785, "epoch": 927} {"train_loss": -10.735723495483398, "global_step": 155786, "epoch": 927} {"train_loss": -10.57965087890625, "global_step": 155787, "epoch": 927} {"train_loss": -10.949163436889648, "global_step": 155788, "epoch": 927} {"train_loss": -10.94876480102539, "global_step": 155789, "epoch": 927} {"train_loss": -10.93582534790039, "global_step": 155790, "epoch": 927} {"train_loss": -10.890054702758789, "global_step": 155791, "epoch": 927} {"train_loss": -10.824020385742188, "global_step": 155792, "epoch": 927} {"train_loss": -10.750818252563477, "global_step": 155793, "epoch": 927} {"train_loss": -10.823579788208008, "global_step": 155794, "epoch": 927} {"train_loss": -10.819316864013672, "global_step": 155795, "epoch": 927} {"train_loss": -10.881765365600586, "global_step": 155796, "epoch": 927} {"train_loss": -10.893098831176758, "global_step": 155797, "epoch": 927} {"train_loss": -11.025453567504883, "global_step": 155798, "epoch": 927} {"train_loss": -11.26491641998291, "global_step": 155799, "epoch": 927} {"train_loss": -10.961104393005371, "global_step": 155800, "epoch": 927} {"train_loss": -10.997843742370605, "global_step": 155801, "epoch": 927} {"train_loss": -11.040428161621094, "global_step": 155802, "epoch": 927} {"train_loss": -10.884195327758789, "global_step": 155803, "epoch": 927} {"train_loss": -11.174644470214844, "global_step": 155804, "epoch": 927} {"train_loss": -10.980817794799805, "global_step": 155805, "epoch": 927} {"train_loss": -11.08975887298584, "global_step": 155806, "epoch": 927} {"train_loss": -11.088295936584473, "global_step": 155807, "epoch": 927} {"train_loss": -11.140678405761719, "global_step": 155808, "epoch": 927} {"train_loss": -10.843327522277832, "global_step": 155809, "epoch": 927} {"train_loss": -10.986637115478516, "global_step": 155810, "epoch": 927} {"train_loss": -10.928756713867188, "global_step": 155811, "epoch": 927} {"train_loss": -11.204265594482422, "global_step": 155812, "epoch": 927} {"train_loss": -11.1751070022583, "global_step": 155813, "epoch": 927} {"train_loss": -11.128597259521484, "global_step": 155814, "epoch": 927} {"train_loss": -11.329994201660156, "global_step": 155815, "epoch": 927} {"train_loss": -11.250431060791016, "global_step": 155816, "epoch": 927} {"train_loss": -11.143548965454102, "global_step": 155817, "epoch": 927} {"train_loss": -11.193403244018555, "global_step": 155818, "epoch": 927} {"train_loss": -11.490679740905762, "global_step": 155819, "epoch": 927} {"train_loss": -11.106292724609375, "global_step": 155820, "epoch": 927} {"train_loss": -11.342499732971191, "global_step": 155821, "epoch": 927} {"train_loss": -11.164632797241211, "global_step": 155822, "epoch": 927} {"train_loss": -11.126845359802246, "global_step": 155823, "epoch": 927} {"train_loss": -10.978229522705078, "global_step": 155824, "epoch": 927} {"train_loss": -10.833085060119629, "global_step": 155825, "epoch": 927} {"train_loss": -10.929561614990234, "global_step": 155826, "epoch": 927} {"train_loss": -11.069899559020996, "global_step": 155827, "epoch": 927} {"train_loss": -10.60014533996582, "global_step": 155828, "epoch": 927} {"train_loss": -10.06213665008545, "global_step": 155829, "epoch": 927} {"train_loss": -10.537456512451172, "global_step": 155830, "epoch": 927} {"train_loss": -10.656063079833984, "global_step": 155831, "epoch": 927} {"train_loss": -9.925880432128906, "global_step": 155832, "epoch": 927} {"train_loss": -10.657492637634277, "global_step": 155833, "epoch": 927} {"train_loss": -10.333608627319336, "global_step": 155834, "epoch": 927} {"train_loss": -10.659412384033203, "global_step": 155835, "epoch": 927} {"train_loss": -9.42922306060791, "global_step": 155836, "epoch": 927} {"train_loss": -10.66916275024414, "global_step": 155837, "epoch": 927} {"train_loss": -9.013669967651367, "global_step": 155838, "epoch": 927} {"train_loss": -8.949344635009766, "global_step": 155839, "epoch": 927} {"train_loss": -9.864631652832031, "global_step": 155840, "epoch": 927} {"train_loss": -9.681346893310547, "global_step": 155841, "epoch": 927} {"train_loss": -9.25526237487793, "global_step": 155842, "epoch": 927} {"train_loss": -10.79078483581543, "global_step": 155843, "epoch": 927} {"train_loss": -8.983016967773438, "global_step": 155844, "epoch": 927} {"train_loss": -9.750635147094727, "global_step": 155845, "epoch": 927} {"train_loss": -10.291058540344238, "global_step": 155846, "epoch": 927} {"train_loss": -10.158428192138672, "global_step": 155847, "epoch": 927} {"train_loss": -10.499496459960938, "global_step": 155848, "epoch": 927} {"train_loss": -9.497949600219727, "global_step": 155849, "epoch": 927} {"train_loss": -10.233757972717285, "global_step": 155850, "epoch": 927} {"train_loss": -10.544906616210938, "global_step": 155851, "epoch": 927} {"train_loss": -9.914362907409668, "global_step": 155852, "epoch": 927} {"train_loss": -10.63698673248291, "global_step": 155853, "epoch": 927} {"train_loss": -10.431532859802246, "global_step": 155854, "epoch": 927} {"train_loss": -9.936614036560059, "global_step": 155855, "epoch": 927} {"train_loss": -10.72578239440918, "global_step": 155856, "epoch": 927} {"train_loss": -10.398143768310547, "global_step": 155857, "epoch": 927} {"train_loss": -10.293960571289062, "global_step": 155858, "epoch": 927} {"train_loss": -10.302760124206543, "global_step": 155859, "epoch": 927} {"train_loss": -10.389748573303223, "global_step": 155860, "epoch": 927} {"train_loss": -10.077486991882324, "global_step": 155861, "epoch": 927} {"train_loss": -10.623798370361328, "global_step": 155862, "epoch": 927} {"train_loss": -10.37704849243164, "global_step": 155863, "epoch": 927} {"train_loss": -10.197569847106934, "global_step": 155864, "epoch": 927} {"train_loss": -10.398096084594727, "global_step": 155865, "epoch": 927} {"train_loss": -10.610360145568848, "global_step": 155866, "epoch": 927} {"train_loss": -10.460179328918457, "global_step": 155867, "epoch": 927} {"train_loss": -10.441845893859863, "global_step": 155868, "epoch": 927} {"train_loss": -10.818855285644531, "global_step": 155869, "epoch": 927} {"train_loss": -10.316055297851562, "global_step": 155870, "epoch": 927} {"train_loss": -10.524145126342773, "global_step": 155871, "epoch": 927} {"train_loss": -10.78642463684082, "global_step": 155872, "epoch": 927} {"train_loss": -10.752880096435547, "global_step": 155873, "epoch": 927} {"train_loss": -10.728415489196777, "global_step": 155874, "epoch": 927} {"train_loss": -10.668333053588867, "global_step": 155875, "epoch": 927} {"train_loss": -10.631278991699219, "global_step": 155876, "epoch": 927} {"train_loss": -10.70447826385498, "global_step": 155877, "epoch": 927} {"train_loss": -10.699724197387695, "global_step": 155878, "epoch": 927} {"train_loss": -10.768512725830078, "global_step": 155879, "epoch": 927} {"train_loss": -10.910323143005371, "global_step": 155880, "epoch": 927} {"train_loss": -10.928975105285645, "global_step": 155881, "epoch": 927} {"train_loss": -10.816886901855469, "global_step": 155882, "epoch": 927} {"train_loss": -11.000617980957031, "global_step": 155883, "epoch": 927} {"train_loss": -11.015336036682129, "global_step": 155884, "epoch": 927} {"train_loss": -10.89997673034668, "global_step": 155885, "epoch": 927} {"train_loss": -10.976673126220703, "global_step": 155886, "epoch": 927} {"train_loss": -10.887628555297852, "global_step": 155887, "epoch": 927} {"train_loss": -11.136117935180664, "global_step": 155888, "epoch": 927} {"train_loss": -11.024091720581055, "global_step": 155889, "epoch": 927} {"train_loss": -10.895763397216797, "global_step": 155890, "epoch": 927} {"train_loss": -10.703765869140625, "global_step": 155891, "epoch": 927} {"train_loss": -10.938087463378906, "global_step": 155892, "epoch": 927} {"train_loss": -10.77018928527832, "global_step": 155893, "epoch": 927} {"train_loss": -11.152759552001953, "global_step": 155894, "epoch": 927} {"train_loss": -10.935544967651367, "global_step": 155895, "epoch": 927} {"train_loss": -11.20315170288086, "global_step": 155896, "epoch": 927} {"train_loss": -11.073599815368652, "global_step": 155897, "epoch": 927} {"train_loss": -11.205970764160156, "global_step": 155898, "epoch": 927} {"train_loss": -11.074524879455566, "global_step": 155899, "epoch": 927} {"train_loss": -10.990989685058594, "global_step": 155900, "epoch": 927} {"train_loss": -10.921097755432129, "global_step": 155901, "epoch": 927} {"train_loss": -11.188024520874023, "global_step": 155902, "epoch": 927} {"train_loss": -10.717404291743325, "global_step": 155903, "epoch": 927, "val_loss": 226988.71875} {"train_loss": -11.253701210021973, "global_step": 155904, "epoch": 928} {"train_loss": -11.166986465454102, "global_step": 155905, "epoch": 928} {"train_loss": -11.216443061828613, "global_step": 155906, "epoch": 928} {"train_loss": -11.079683303833008, "global_step": 155907, "epoch": 928} {"train_loss": -11.02074909210205, "global_step": 155908, "epoch": 928} {"train_loss": -11.04699420928955, "global_step": 155909, "epoch": 928} {"train_loss": -10.969709396362305, "global_step": 155910, "epoch": 928} {"train_loss": -11.09345817565918, "global_step": 155911, "epoch": 928} {"train_loss": -10.752481460571289, "global_step": 155912, "epoch": 928} {"train_loss": -10.187881469726562, "global_step": 155913, "epoch": 928} {"train_loss": -10.989715576171875, "global_step": 155914, "epoch": 928} {"train_loss": -10.651447296142578, "global_step": 155915, "epoch": 928} {"train_loss": -10.282909393310547, "global_step": 155916, "epoch": 928} {"train_loss": -10.673505783081055, "global_step": 155917, "epoch": 928} {"train_loss": -9.932920455932617, "global_step": 155918, "epoch": 928} {"train_loss": -9.897356033325195, "global_step": 155919, "epoch": 928} {"train_loss": -10.352777481079102, "global_step": 155920, "epoch": 928} {"train_loss": -10.065454483032227, "global_step": 155921, "epoch": 928} {"train_loss": -9.927680969238281, "global_step": 155922, "epoch": 928} {"train_loss": -9.438249588012695, "global_step": 155923, "epoch": 928} {"train_loss": -10.271768569946289, "global_step": 155924, "epoch": 928} {"train_loss": -10.035013198852539, "global_step": 155925, "epoch": 928} {"train_loss": -9.222816467285156, "global_step": 155926, "epoch": 928} {"train_loss": -10.837444305419922, "global_step": 155927, "epoch": 928} {"train_loss": -9.947502136230469, "global_step": 155928, "epoch": 928} {"train_loss": -10.764103889465332, "global_step": 155929, "epoch": 928} {"train_loss": -10.330076217651367, "global_step": 155930, "epoch": 928} {"train_loss": -10.302949905395508, "global_step": 155931, "epoch": 928} {"train_loss": -10.551360130310059, "global_step": 155932, "epoch": 928} {"train_loss": -10.265031814575195, "global_step": 155933, "epoch": 928} {"train_loss": -10.608609199523926, "global_step": 155934, "epoch": 928} {"train_loss": -10.473642349243164, "global_step": 155935, "epoch": 928} {"train_loss": -10.392351150512695, "global_step": 155936, "epoch": 928} {"train_loss": -10.383495330810547, "global_step": 155937, "epoch": 928} {"train_loss": -10.751008987426758, "global_step": 155938, "epoch": 928} {"train_loss": -10.384540557861328, "global_step": 155939, "epoch": 928} {"train_loss": -10.794097900390625, "global_step": 155940, "epoch": 928} {"train_loss": -10.557425498962402, "global_step": 155941, "epoch": 928} {"train_loss": -10.998120307922363, "global_step": 155942, "epoch": 928} {"train_loss": -10.61642074584961, "global_step": 155943, "epoch": 928} {"train_loss": -10.721065521240234, "global_step": 155944, "epoch": 928} {"train_loss": -10.762994766235352, "global_step": 155945, "epoch": 928} {"train_loss": -10.499994277954102, "global_step": 155946, "epoch": 928} {"train_loss": -10.718687057495117, "global_step": 155947, "epoch": 928} {"train_loss": -10.755213737487793, "global_step": 155948, "epoch": 928} {"train_loss": -10.779695510864258, "global_step": 155949, "epoch": 928} {"train_loss": -10.6873197555542, "global_step": 155950, "epoch": 928} {"train_loss": -10.911519050598145, "global_step": 155951, "epoch": 928} {"train_loss": -10.825910568237305, "global_step": 155952, "epoch": 928} {"train_loss": -11.009247779846191, "global_step": 155953, "epoch": 928} {"train_loss": -10.815790176391602, "global_step": 155954, "epoch": 928} {"train_loss": -11.047771453857422, "global_step": 155955, "epoch": 928} {"train_loss": -10.955639839172363, "global_step": 155956, "epoch": 928} {"train_loss": -10.895334243774414, "global_step": 155957, "epoch": 928} {"train_loss": -10.93386459350586, "global_step": 155958, "epoch": 928} {"train_loss": -10.916105270385742, "global_step": 155959, "epoch": 928} {"train_loss": -10.972755432128906, "global_step": 155960, "epoch": 928} {"train_loss": -10.995328903198242, "global_step": 155961, "epoch": 928} {"train_loss": -10.960163116455078, "global_step": 155962, "epoch": 928} {"train_loss": -10.929729461669922, "global_step": 155963, "epoch": 928} {"train_loss": -10.84360122680664, "global_step": 155964, "epoch": 928} {"train_loss": -10.858114242553711, "global_step": 155965, "epoch": 928} {"train_loss": -11.05496597290039, "global_step": 155966, "epoch": 928} {"train_loss": -10.97330093383789, "global_step": 155967, "epoch": 928} {"train_loss": -10.884496688842773, "global_step": 155968, "epoch": 928} {"train_loss": -11.143501281738281, "global_step": 155969, "epoch": 928} {"train_loss": -10.931821823120117, "global_step": 155970, "epoch": 928} {"train_loss": -10.82590103149414, "global_step": 155971, "epoch": 928} {"train_loss": -10.868638038635254, "global_step": 155972, "epoch": 928} {"train_loss": -11.043384552001953, "global_step": 155973, "epoch": 928} {"train_loss": -10.766483306884766, "global_step": 155974, "epoch": 928} {"train_loss": -11.09528636932373, "global_step": 155975, "epoch": 928} {"train_loss": -10.907227516174316, "global_step": 155976, "epoch": 928} {"train_loss": -10.863932609558105, "global_step": 155977, "epoch": 928} {"train_loss": -11.0516996383667, "global_step": 155978, "epoch": 928} {"train_loss": -11.031293869018555, "global_step": 155979, "epoch": 928} {"train_loss": -10.917681694030762, "global_step": 155980, "epoch": 928} {"train_loss": -10.957956314086914, "global_step": 155981, "epoch": 928} {"train_loss": -11.091322898864746, "global_step": 155982, "epoch": 928} {"train_loss": -11.136709213256836, "global_step": 155983, "epoch": 928} {"train_loss": -11.030016899108887, "global_step": 155984, "epoch": 928} {"train_loss": -11.090901374816895, "global_step": 155985, "epoch": 928} {"train_loss": -10.891186714172363, "global_step": 155986, "epoch": 928} {"train_loss": -11.225079536437988, "global_step": 155987, "epoch": 928} {"train_loss": -11.107803344726562, "global_step": 155988, "epoch": 928} {"train_loss": -11.050615310668945, "global_step": 155989, "epoch": 928} {"train_loss": -10.94382095336914, "global_step": 155990, "epoch": 928} {"train_loss": -10.484992027282715, "global_step": 155991, "epoch": 928} {"train_loss": -9.831941604614258, "global_step": 155992, "epoch": 928} {"train_loss": -10.492843627929688, "global_step": 155993, "epoch": 928} {"train_loss": -10.780252456665039, "global_step": 155994, "epoch": 928} {"train_loss": -10.035440444946289, "global_step": 155995, "epoch": 928} {"train_loss": -9.010822296142578, "global_step": 155996, "epoch": 928} {"train_loss": -10.606996536254883, "global_step": 155997, "epoch": 928} {"train_loss": -9.151281356811523, "global_step": 155998, "epoch": 928} {"train_loss": -8.821484565734863, "global_step": 155999, "epoch": 928} {"train_loss": -8.765689849853516, "global_step": 156000, "epoch": 928} {"train_loss": -9.27216911315918, "global_step": 156001, "epoch": 928} {"train_loss": -8.864654541015625, "global_step": 156002, "epoch": 928} {"train_loss": -9.11110782623291, "global_step": 156003, "epoch": 928} {"train_loss": -8.983341217041016, "global_step": 156004, "epoch": 928} {"train_loss": -10.07888412475586, "global_step": 156005, "epoch": 928} {"train_loss": -8.766569137573242, "global_step": 156006, "epoch": 928} {"train_loss": -10.106682777404785, "global_step": 156007, "epoch": 928} {"train_loss": -9.284364700317383, "global_step": 156008, "epoch": 928} {"train_loss": -10.079017639160156, "global_step": 156009, "epoch": 928} {"train_loss": -9.839224815368652, "global_step": 156010, "epoch": 928} {"train_loss": -9.428316116333008, "global_step": 156011, "epoch": 928} {"train_loss": -9.999794960021973, "global_step": 156012, "epoch": 928} {"train_loss": -9.678903579711914, "global_step": 156013, "epoch": 928} {"train_loss": -10.071878433227539, "global_step": 156014, "epoch": 928} {"train_loss": -9.460382461547852, "global_step": 156015, "epoch": 928} {"train_loss": -10.340391159057617, "global_step": 156016, "epoch": 928} {"train_loss": -9.882554054260254, "global_step": 156017, "epoch": 928} {"train_loss": -9.747100830078125, "global_step": 156018, "epoch": 928} {"train_loss": -10.463571548461914, "global_step": 156019, "epoch": 928} {"train_loss": -9.8970365524292, "global_step": 156020, "epoch": 928} {"train_loss": -10.05688190460205, "global_step": 156021, "epoch": 928} {"train_loss": -10.417520523071289, "global_step": 156022, "epoch": 928} {"train_loss": -9.964192390441895, "global_step": 156023, "epoch": 928} {"train_loss": -10.398868560791016, "global_step": 156024, "epoch": 928} {"train_loss": -10.274009704589844, "global_step": 156025, "epoch": 928} {"train_loss": -10.505539894104004, "global_step": 156026, "epoch": 928} {"train_loss": -10.261747360229492, "global_step": 156027, "epoch": 928} {"train_loss": -10.318087577819824, "global_step": 156028, "epoch": 928} {"train_loss": -10.45144271850586, "global_step": 156029, "epoch": 928} {"train_loss": -10.462479591369629, "global_step": 156030, "epoch": 928} {"train_loss": -10.36648941040039, "global_step": 156031, "epoch": 928} {"train_loss": -10.588886260986328, "global_step": 156032, "epoch": 928} {"train_loss": -10.437737464904785, "global_step": 156033, "epoch": 928} {"train_loss": -10.553640365600586, "global_step": 156034, "epoch": 928} {"train_loss": -10.422531127929688, "global_step": 156035, "epoch": 928} {"train_loss": -10.64065933227539, "global_step": 156036, "epoch": 928} {"train_loss": -10.521770477294922, "global_step": 156037, "epoch": 928} {"train_loss": -10.649561882019043, "global_step": 156038, "epoch": 928} {"train_loss": -10.539649963378906, "global_step": 156039, "epoch": 928} {"train_loss": -10.783392906188965, "global_step": 156040, "epoch": 928} {"train_loss": -10.584229469299316, "global_step": 156041, "epoch": 928} {"train_loss": -10.721661567687988, "global_step": 156042, "epoch": 928} {"train_loss": -10.63232135772705, "global_step": 156043, "epoch": 928} {"train_loss": -10.30599308013916, "global_step": 156044, "epoch": 928} {"train_loss": -10.690214157104492, "global_step": 156045, "epoch": 928} {"train_loss": -10.750778198242188, "global_step": 156046, "epoch": 928} {"train_loss": -10.698543548583984, "global_step": 156047, "epoch": 928} {"train_loss": -10.885786056518555, "global_step": 156048, "epoch": 928} {"train_loss": -10.894279479980469, "global_step": 156049, "epoch": 928} {"train_loss": -10.687255859375, "global_step": 156050, "epoch": 928} {"train_loss": -10.927672386169434, "global_step": 156051, "epoch": 928} {"train_loss": -10.872023582458496, "global_step": 156052, "epoch": 928} {"train_loss": -11.003779411315918, "global_step": 156053, "epoch": 928} {"train_loss": -11.02355670928955, "global_step": 156054, "epoch": 928} {"train_loss": -10.927271842956543, "global_step": 156055, "epoch": 928} {"train_loss": -11.119049072265625, "global_step": 156056, "epoch": 928} {"train_loss": -10.967374801635742, "global_step": 156057, "epoch": 928} {"train_loss": -10.818769454956055, "global_step": 156058, "epoch": 928} {"train_loss": -10.945953369140625, "global_step": 156059, "epoch": 928} {"train_loss": -11.043512344360352, "global_step": 156060, "epoch": 928} {"train_loss": -11.186138153076172, "global_step": 156061, "epoch": 928} {"train_loss": -11.017475128173828, "global_step": 156062, "epoch": 928} {"train_loss": -11.099466323852539, "global_step": 156063, "epoch": 928} {"train_loss": -11.1182279586792, "global_step": 156064, "epoch": 928} {"train_loss": -10.962039947509766, "global_step": 156065, "epoch": 928} {"train_loss": -11.054533958435059, "global_step": 156066, "epoch": 928} {"train_loss": -10.965848922729492, "global_step": 156067, "epoch": 928} {"train_loss": -10.988886833190918, "global_step": 156068, "epoch": 928} {"train_loss": -10.897342681884766, "global_step": 156069, "epoch": 928} {"train_loss": -11.047452926635742, "global_step": 156070, "epoch": 928} {"train_loss": -10.544692930721101, "global_step": 156071, "epoch": 928, "val_loss": 225499.0} {"train_loss": -11.163492202758789, "global_step": 156072, "epoch": 929} {"train_loss": -10.781661987304688, "global_step": 156073, "epoch": 929} {"train_loss": -10.809428215026855, "global_step": 156074, "epoch": 929} {"train_loss": -11.254982948303223, "global_step": 156075, "epoch": 929} {"train_loss": -10.676040649414062, "global_step": 156076, "epoch": 929} {"train_loss": -11.00344467163086, "global_step": 156077, "epoch": 929} {"train_loss": -11.111333847045898, "global_step": 156078, "epoch": 929} {"train_loss": -10.517339706420898, "global_step": 156079, "epoch": 929} {"train_loss": -10.8526611328125, "global_step": 156080, "epoch": 929} {"train_loss": -10.86761474609375, "global_step": 156081, "epoch": 929} {"train_loss": -10.428443908691406, "global_step": 156082, "epoch": 929} {"train_loss": -10.866619110107422, "global_step": 156083, "epoch": 929} {"train_loss": -10.897415161132812, "global_step": 156084, "epoch": 929} {"train_loss": -10.855293273925781, "global_step": 156085, "epoch": 929} {"train_loss": -11.21658706665039, "global_step": 156086, "epoch": 929} {"train_loss": -10.923778533935547, "global_step": 156087, "epoch": 929} {"train_loss": -11.20889663696289, "global_step": 156088, "epoch": 929} {"train_loss": -10.809221267700195, "global_step": 156089, "epoch": 929} {"train_loss": -11.119029998779297, "global_step": 156090, "epoch": 929} {"train_loss": -10.887853622436523, "global_step": 156091, "epoch": 929} {"train_loss": -10.828392028808594, "global_step": 156092, "epoch": 929} {"train_loss": -10.926727294921875, "global_step": 156093, "epoch": 929} {"train_loss": -11.002599716186523, "global_step": 156094, "epoch": 929} {"train_loss": -10.952284812927246, "global_step": 156095, "epoch": 929} {"train_loss": -10.99332046508789, "global_step": 156096, "epoch": 929} {"train_loss": -10.958396911621094, "global_step": 156097, "epoch": 929} {"train_loss": -10.744403839111328, "global_step": 156098, "epoch": 929} {"train_loss": -10.965593338012695, "global_step": 156099, "epoch": 929} {"train_loss": -10.74970817565918, "global_step": 156100, "epoch": 929} {"train_loss": -10.877304077148438, "global_step": 156101, "epoch": 929} {"train_loss": -10.54342269897461, "global_step": 156102, "epoch": 929} {"train_loss": -10.579690933227539, "global_step": 156103, "epoch": 929} {"train_loss": -10.506040573120117, "global_step": 156104, "epoch": 929} {"train_loss": -10.780685424804688, "global_step": 156105, "epoch": 929} {"train_loss": -10.633777618408203, "global_step": 156106, "epoch": 929} {"train_loss": -10.662869453430176, "global_step": 156107, "epoch": 929} {"train_loss": -10.572036743164062, "global_step": 156108, "epoch": 929} {"train_loss": -10.849994659423828, "global_step": 156109, "epoch": 929} {"train_loss": -10.731517791748047, "global_step": 156110, "epoch": 929} {"train_loss": -10.53969955444336, "global_step": 156111, "epoch": 929} {"train_loss": -10.896696090698242, "global_step": 156112, "epoch": 929} {"train_loss": -10.594917297363281, "global_step": 156113, "epoch": 929} {"train_loss": -10.60487174987793, "global_step": 156114, "epoch": 929} {"train_loss": -10.380287170410156, "global_step": 156115, "epoch": 929} {"train_loss": -10.8402681350708, "global_step": 156116, "epoch": 929} {"train_loss": -10.594827651977539, "global_step": 156117, "epoch": 929} {"train_loss": -10.845510482788086, "global_step": 156118, "epoch": 929} {"train_loss": -10.698455810546875, "global_step": 156119, "epoch": 929} {"train_loss": -10.74690055847168, "global_step": 156120, "epoch": 929} {"train_loss": -10.991249084472656, "global_step": 156121, "epoch": 929} {"train_loss": -10.706544876098633, "global_step": 156122, "epoch": 929} {"train_loss": -10.858299255371094, "global_step": 156123, "epoch": 929} {"train_loss": -10.607646942138672, "global_step": 156124, "epoch": 929} {"train_loss": -11.066791534423828, "global_step": 156125, "epoch": 929} {"train_loss": -10.625384330749512, "global_step": 156126, "epoch": 929} {"train_loss": -10.973596572875977, "global_step": 156127, "epoch": 929} {"train_loss": -10.616264343261719, "global_step": 156128, "epoch": 929} {"train_loss": -10.914045333862305, "global_step": 156129, "epoch": 929} {"train_loss": -10.858036041259766, "global_step": 156130, "epoch": 929} {"train_loss": -10.854580879211426, "global_step": 156131, "epoch": 929} {"train_loss": -10.760523796081543, "global_step": 156132, "epoch": 929} {"train_loss": -11.065861701965332, "global_step": 156133, "epoch": 929} {"train_loss": -11.217145919799805, "global_step": 156134, "epoch": 929} {"train_loss": -10.996481895446777, "global_step": 156135, "epoch": 929} {"train_loss": -11.005495071411133, "global_step": 156136, "epoch": 929} {"train_loss": -10.909773826599121, "global_step": 156137, "epoch": 929} {"train_loss": -11.048852920532227, "global_step": 156138, "epoch": 929} {"train_loss": -11.084761619567871, "global_step": 156139, "epoch": 929} {"train_loss": -11.091470718383789, "global_step": 156140, "epoch": 929} {"train_loss": -10.83510971069336, "global_step": 156141, "epoch": 929} {"train_loss": -11.014142990112305, "global_step": 156142, "epoch": 929} {"train_loss": -10.888700485229492, "global_step": 156143, "epoch": 929} {"train_loss": -11.179277420043945, "global_step": 156144, "epoch": 929} {"train_loss": -10.992508888244629, "global_step": 156145, "epoch": 929} {"train_loss": -11.106413841247559, "global_step": 156146, "epoch": 929} {"train_loss": -10.969633102416992, "global_step": 156147, "epoch": 929} {"train_loss": -11.178281784057617, "global_step": 156148, "epoch": 929} {"train_loss": -11.014896392822266, "global_step": 156149, "epoch": 929} {"train_loss": -10.947464942932129, "global_step": 156150, "epoch": 929} {"train_loss": -11.231874465942383, "global_step": 156151, "epoch": 929} {"train_loss": -11.069025039672852, "global_step": 156152, "epoch": 929} {"train_loss": -11.38582992553711, "global_step": 156153, "epoch": 929} {"train_loss": -11.11629867553711, "global_step": 156154, "epoch": 929} {"train_loss": -11.038589477539062, "global_step": 156155, "epoch": 929} {"train_loss": -11.219557762145996, "global_step": 156156, "epoch": 929} {"train_loss": -11.155647277832031, "global_step": 156157, "epoch": 929} {"train_loss": -10.970198631286621, "global_step": 156158, "epoch": 929} {"train_loss": -10.960283279418945, "global_step": 156159, "epoch": 929} {"train_loss": -10.979107856750488, "global_step": 156160, "epoch": 929} {"train_loss": -11.186625480651855, "global_step": 156161, "epoch": 929} {"train_loss": -10.951233863830566, "global_step": 156162, "epoch": 929} {"train_loss": -10.857004165649414, "global_step": 156163, "epoch": 929} {"train_loss": -10.847246170043945, "global_step": 156164, "epoch": 929} {"train_loss": -11.095993041992188, "global_step": 156165, "epoch": 929} {"train_loss": -10.80497932434082, "global_step": 156166, "epoch": 929} {"train_loss": -10.916762351989746, "global_step": 156167, "epoch": 929} {"train_loss": -10.873391151428223, "global_step": 156168, "epoch": 929} {"train_loss": -10.714316368103027, "global_step": 156169, "epoch": 929} {"train_loss": -10.806648254394531, "global_step": 156170, "epoch": 929} {"train_loss": -10.542129516601562, "global_step": 156171, "epoch": 929} {"train_loss": -9.819438934326172, "global_step": 156172, "epoch": 929} {"train_loss": -10.764129638671875, "global_step": 156173, "epoch": 929} {"train_loss": -10.681273460388184, "global_step": 156174, "epoch": 929} {"train_loss": -10.207563400268555, "global_step": 156175, "epoch": 929} {"train_loss": -10.251544952392578, "global_step": 156176, "epoch": 929} {"train_loss": -10.824256896972656, "global_step": 156177, "epoch": 929} {"train_loss": -9.151384353637695, "global_step": 156178, "epoch": 929} {"train_loss": -11.025103569030762, "global_step": 156179, "epoch": 929} {"train_loss": -10.504992485046387, "global_step": 156180, "epoch": 929} {"train_loss": -10.618249893188477, "global_step": 156181, "epoch": 929} {"train_loss": -10.523518562316895, "global_step": 156182, "epoch": 929} {"train_loss": -10.230657577514648, "global_step": 156183, "epoch": 929} {"train_loss": -10.546232223510742, "global_step": 156184, "epoch": 929} {"train_loss": -9.90606689453125, "global_step": 156185, "epoch": 929} {"train_loss": -9.529741287231445, "global_step": 156186, "epoch": 929} {"train_loss": -10.35877799987793, "global_step": 156187, "epoch": 929} {"train_loss": -9.75136947631836, "global_step": 156188, "epoch": 929} {"train_loss": -10.648417472839355, "global_step": 156189, "epoch": 929} {"train_loss": -10.235162734985352, "global_step": 156190, "epoch": 929} {"train_loss": -10.50616455078125, "global_step": 156191, "epoch": 929} {"train_loss": -10.332172393798828, "global_step": 156192, "epoch": 929} {"train_loss": -10.492353439331055, "global_step": 156193, "epoch": 929} {"train_loss": -10.289592742919922, "global_step": 156194, "epoch": 929} {"train_loss": -10.668521881103516, "global_step": 156195, "epoch": 929} {"train_loss": -10.522485733032227, "global_step": 156196, "epoch": 929} {"train_loss": -10.69160270690918, "global_step": 156197, "epoch": 929} {"train_loss": -10.515715599060059, "global_step": 156198, "epoch": 929} {"train_loss": -10.768585205078125, "global_step": 156199, "epoch": 929} {"train_loss": -10.730462074279785, "global_step": 156200, "epoch": 929} {"train_loss": -10.486082077026367, "global_step": 156201, "epoch": 929} {"train_loss": -10.795884132385254, "global_step": 156202, "epoch": 929} {"train_loss": -10.414604187011719, "global_step": 156203, "epoch": 929} {"train_loss": -10.66640567779541, "global_step": 156204, "epoch": 929} {"train_loss": -10.503267288208008, "global_step": 156205, "epoch": 929} {"train_loss": -10.647436141967773, "global_step": 156206, "epoch": 929} {"train_loss": -10.806499481201172, "global_step": 156207, "epoch": 929} {"train_loss": -10.848991394042969, "global_step": 156208, "epoch": 929} {"train_loss": -10.601622581481934, "global_step": 156209, "epoch": 929} {"train_loss": -10.768148422241211, "global_step": 156210, "epoch": 929} {"train_loss": -10.839866638183594, "global_step": 156211, "epoch": 929} {"train_loss": -10.687662124633789, "global_step": 156212, "epoch": 929} {"train_loss": -10.630434036254883, "global_step": 156213, "epoch": 929} {"train_loss": -10.60844898223877, "global_step": 156214, "epoch": 929} {"train_loss": -10.903367042541504, "global_step": 156215, "epoch": 929} {"train_loss": -10.701692581176758, "global_step": 156216, "epoch": 929} {"train_loss": -10.871417999267578, "global_step": 156217, "epoch": 929} {"train_loss": -10.633064270019531, "global_step": 156218, "epoch": 929} {"train_loss": -10.825071334838867, "global_step": 156219, "epoch": 929} {"train_loss": -10.643511772155762, "global_step": 156220, "epoch": 929} {"train_loss": -10.722463607788086, "global_step": 156221, "epoch": 929} {"train_loss": -10.725335121154785, "global_step": 156222, "epoch": 929} {"train_loss": -11.016359329223633, "global_step": 156223, "epoch": 929} {"train_loss": -10.644807815551758, "global_step": 156224, "epoch": 929} {"train_loss": -10.711893081665039, "global_step": 156225, "epoch": 929} {"train_loss": -10.63305950164795, "global_step": 156226, "epoch": 929} {"train_loss": -10.483047485351562, "global_step": 156227, "epoch": 929} {"train_loss": -10.819787979125977, "global_step": 156228, "epoch": 929} {"train_loss": -10.089177131652832, "global_step": 156229, "epoch": 929} {"train_loss": -10.682575225830078, "global_step": 156230, "epoch": 929} {"train_loss": -10.765045166015625, "global_step": 156231, "epoch": 929} {"train_loss": -10.447556495666504, "global_step": 156232, "epoch": 929} {"train_loss": -11.133742332458496, "global_step": 156233, "epoch": 929} {"train_loss": -10.567875862121582, "global_step": 156234, "epoch": 929} {"train_loss": -10.592920303344727, "global_step": 156235, "epoch": 929} {"train_loss": -10.981534004211426, "global_step": 156236, "epoch": 929} {"train_loss": -10.875831604003906, "global_step": 156237, "epoch": 929} {"train_loss": -10.613628387451172, "global_step": 156238, "epoch": 929} {"train_loss": -10.756405614671253, "global_step": 156239, "epoch": 929, "val_loss": 234631.890625} {"train_loss": -10.823290824890137, "global_step": 156240, "epoch": 930} {"train_loss": -10.91086483001709, "global_step": 156241, "epoch": 930} {"train_loss": -10.527944564819336, "global_step": 156242, "epoch": 930} {"train_loss": -10.738201141357422, "global_step": 156243, "epoch": 930} {"train_loss": -10.992033958435059, "global_step": 156244, "epoch": 930} {"train_loss": -10.716930389404297, "global_step": 156245, "epoch": 930} {"train_loss": -11.006726264953613, "global_step": 156246, "epoch": 930} {"train_loss": -10.958900451660156, "global_step": 156247, "epoch": 930} {"train_loss": -10.859901428222656, "global_step": 156248, "epoch": 930} {"train_loss": -11.012992858886719, "global_step": 156249, "epoch": 930} {"train_loss": -10.856100082397461, "global_step": 156250, "epoch": 930} {"train_loss": -10.969961166381836, "global_step": 156251, "epoch": 930} {"train_loss": -11.009119033813477, "global_step": 156252, "epoch": 930} {"train_loss": -10.892145156860352, "global_step": 156253, "epoch": 930} {"train_loss": -10.825944900512695, "global_step": 156254, "epoch": 930} {"train_loss": -10.962482452392578, "global_step": 156255, "epoch": 930} {"train_loss": -10.31328010559082, "global_step": 156256, "epoch": 930} {"train_loss": -11.205524444580078, "global_step": 156257, "epoch": 930} {"train_loss": -10.389213562011719, "global_step": 156258, "epoch": 930} {"train_loss": -10.826539993286133, "global_step": 156259, "epoch": 930} {"train_loss": -10.71444320678711, "global_step": 156260, "epoch": 930} {"train_loss": -10.714176177978516, "global_step": 156261, "epoch": 930} {"train_loss": -10.8836669921875, "global_step": 156262, "epoch": 930} {"train_loss": -10.635088920593262, "global_step": 156263, "epoch": 930} {"train_loss": -10.709251403808594, "global_step": 156264, "epoch": 930} {"train_loss": -10.992380142211914, "global_step": 156265, "epoch": 930} {"train_loss": -11.088631629943848, "global_step": 156266, "epoch": 930} {"train_loss": -11.206277847290039, "global_step": 156267, "epoch": 930} {"train_loss": -11.063282012939453, "global_step": 156268, "epoch": 930} {"train_loss": -11.135878562927246, "global_step": 156269, "epoch": 930} {"train_loss": -11.101114273071289, "global_step": 156270, "epoch": 930} {"train_loss": -11.064020156860352, "global_step": 156271, "epoch": 930} {"train_loss": -11.14423656463623, "global_step": 156272, "epoch": 930} {"train_loss": -11.080058097839355, "global_step": 156273, "epoch": 930} {"train_loss": -10.979806900024414, "global_step": 156274, "epoch": 930} {"train_loss": -11.050936698913574, "global_step": 156275, "epoch": 930} {"train_loss": -11.095062255859375, "global_step": 156276, "epoch": 930} {"train_loss": -11.230605125427246, "global_step": 156277, "epoch": 930} {"train_loss": -11.199382781982422, "global_step": 156278, "epoch": 930} {"train_loss": -11.100537300109863, "global_step": 156279, "epoch": 930} {"train_loss": -10.96080207824707, "global_step": 156280, "epoch": 930} {"train_loss": -11.072145462036133, "global_step": 156281, "epoch": 930} {"train_loss": -10.950841903686523, "global_step": 156282, "epoch": 930} {"train_loss": -10.954174041748047, "global_step": 156283, "epoch": 930} {"train_loss": -11.093670845031738, "global_step": 156284, "epoch": 930} {"train_loss": -11.03544807434082, "global_step": 156285, "epoch": 930} {"train_loss": -11.09785270690918, "global_step": 156286, "epoch": 930} {"train_loss": -11.07959270477295, "global_step": 156287, "epoch": 930} {"train_loss": -11.072265625, "global_step": 156288, "epoch": 930} {"train_loss": -10.881851196289062, "global_step": 156289, "epoch": 930} {"train_loss": -10.611383438110352, "global_step": 156290, "epoch": 930} {"train_loss": -10.38101863861084, "global_step": 156291, "epoch": 930} {"train_loss": -10.37208080291748, "global_step": 156292, "epoch": 930} {"train_loss": -10.545893669128418, "global_step": 156293, "epoch": 930} {"train_loss": -10.774643898010254, "global_step": 156294, "epoch": 930} {"train_loss": -9.88382625579834, "global_step": 156295, "epoch": 930} {"train_loss": -10.521421432495117, "global_step": 156296, "epoch": 930} {"train_loss": -10.826894760131836, "global_step": 156297, "epoch": 930} {"train_loss": -10.531160354614258, "global_step": 156298, "epoch": 930} {"train_loss": -10.715856552124023, "global_step": 156299, "epoch": 930} {"train_loss": -10.471479415893555, "global_step": 156300, "epoch": 930} {"train_loss": -10.271857261657715, "global_step": 156301, "epoch": 930} {"train_loss": -10.964948654174805, "global_step": 156302, "epoch": 930} {"train_loss": -10.670510292053223, "global_step": 156303, "epoch": 930} {"train_loss": -10.670252799987793, "global_step": 156304, "epoch": 930} {"train_loss": -10.723358154296875, "global_step": 156305, "epoch": 930} {"train_loss": -10.461503982543945, "global_step": 156306, "epoch": 930} {"train_loss": -10.968608856201172, "global_step": 156307, "epoch": 930} {"train_loss": -10.375152587890625, "global_step": 156308, "epoch": 930} {"train_loss": -10.433666229248047, "global_step": 156309, "epoch": 930} {"train_loss": -10.459352493286133, "global_step": 156310, "epoch": 930} {"train_loss": -10.285672187805176, "global_step": 156311, "epoch": 930} {"train_loss": -10.680828094482422, "global_step": 156312, "epoch": 930} {"train_loss": -10.21369743347168, "global_step": 156313, "epoch": 930} {"train_loss": -10.639789581298828, "global_step": 156314, "epoch": 930} {"train_loss": -10.058893203735352, "global_step": 156315, "epoch": 930} {"train_loss": -10.571980476379395, "global_step": 156316, "epoch": 930} {"train_loss": -10.331419944763184, "global_step": 156317, "epoch": 930} {"train_loss": -10.781047821044922, "global_step": 156318, "epoch": 930} {"train_loss": -10.403099060058594, "global_step": 156319, "epoch": 930} {"train_loss": -10.728594779968262, "global_step": 156320, "epoch": 930} {"train_loss": -10.491113662719727, "global_step": 156321, "epoch": 930} {"train_loss": -10.850299835205078, "global_step": 156322, "epoch": 930} {"train_loss": -10.714754104614258, "global_step": 156323, "epoch": 930} {"train_loss": -10.638956069946289, "global_step": 156324, "epoch": 930} {"train_loss": -10.893571853637695, "global_step": 156325, "epoch": 930} {"train_loss": -10.796049118041992, "global_step": 156326, "epoch": 930} {"train_loss": -10.43020248413086, "global_step": 156327, "epoch": 930} {"train_loss": -10.815595626831055, "global_step": 156328, "epoch": 930} {"train_loss": -10.569122314453125, "global_step": 156329, "epoch": 930} {"train_loss": -10.693471908569336, "global_step": 156330, "epoch": 930} {"train_loss": -10.60604476928711, "global_step": 156331, "epoch": 930} {"train_loss": -11.0237455368042, "global_step": 156332, "epoch": 930} {"train_loss": -10.54885482788086, "global_step": 156333, "epoch": 930} {"train_loss": -10.792210578918457, "global_step": 156334, "epoch": 930} {"train_loss": -10.91053581237793, "global_step": 156335, "epoch": 930} {"train_loss": -10.617961883544922, "global_step": 156336, "epoch": 930} {"train_loss": -11.03154468536377, "global_step": 156337, "epoch": 930} {"train_loss": -10.911055564880371, "global_step": 156338, "epoch": 930} {"train_loss": -11.044158935546875, "global_step": 156339, "epoch": 930} {"train_loss": -10.855167388916016, "global_step": 156340, "epoch": 930} {"train_loss": -10.56382942199707, "global_step": 156341, "epoch": 930} {"train_loss": -10.659492492675781, "global_step": 156342, "epoch": 930} {"train_loss": -10.909638404846191, "global_step": 156343, "epoch": 930} {"train_loss": -10.863214492797852, "global_step": 156344, "epoch": 930} {"train_loss": -10.974268913269043, "global_step": 156345, "epoch": 930} {"train_loss": -10.930051803588867, "global_step": 156346, "epoch": 930} {"train_loss": -10.731182098388672, "global_step": 156347, "epoch": 930} {"train_loss": -11.036995887756348, "global_step": 156348, "epoch": 930} {"train_loss": -10.925397872924805, "global_step": 156349, "epoch": 930} {"train_loss": -10.863609313964844, "global_step": 156350, "epoch": 930} {"train_loss": -10.907291412353516, "global_step": 156351, "epoch": 930} {"train_loss": -10.623082160949707, "global_step": 156352, "epoch": 930} {"train_loss": -10.727209091186523, "global_step": 156353, "epoch": 930} {"train_loss": -10.956832885742188, "global_step": 156354, "epoch": 930} {"train_loss": -10.733285903930664, "global_step": 156355, "epoch": 930} {"train_loss": -11.140787124633789, "global_step": 156356, "epoch": 930} {"train_loss": -10.718721389770508, "global_step": 156357, "epoch": 930} {"train_loss": -10.902263641357422, "global_step": 156358, "epoch": 930} {"train_loss": -10.686345100402832, "global_step": 156359, "epoch": 930} {"train_loss": -11.175008773803711, "global_step": 156360, "epoch": 930} {"train_loss": -10.517732620239258, "global_step": 156361, "epoch": 930} {"train_loss": -10.948863983154297, "global_step": 156362, "epoch": 930} {"train_loss": -10.841142654418945, "global_step": 156363, "epoch": 930} {"train_loss": -10.89004898071289, "global_step": 156364, "epoch": 930} {"train_loss": -10.55034065246582, "global_step": 156365, "epoch": 930} {"train_loss": -10.032200813293457, "global_step": 156366, "epoch": 930} {"train_loss": -10.48044204711914, "global_step": 156367, "epoch": 930} {"train_loss": -9.0997314453125, "global_step": 156368, "epoch": 930} {"train_loss": -8.750869750976562, "global_step": 156369, "epoch": 930} {"train_loss": -10.157445907592773, "global_step": 156370, "epoch": 930} {"train_loss": -7.816717147827148, "global_step": 156371, "epoch": 930} {"train_loss": -10.11645793914795, "global_step": 156372, "epoch": 930} {"train_loss": -8.173078536987305, "global_step": 156373, "epoch": 930} {"train_loss": -9.70385456085205, "global_step": 156374, "epoch": 930} {"train_loss": -8.285009384155273, "global_step": 156375, "epoch": 930} {"train_loss": -8.491531372070312, "global_step": 156376, "epoch": 930} {"train_loss": -8.884464263916016, "global_step": 156377, "epoch": 930} {"train_loss": -9.263509750366211, "global_step": 156378, "epoch": 930} {"train_loss": -9.586320877075195, "global_step": 156379, "epoch": 930} {"train_loss": -8.998018264770508, "global_step": 156380, "epoch": 930} {"train_loss": -9.287909507751465, "global_step": 156381, "epoch": 930} {"train_loss": -8.902223587036133, "global_step": 156382, "epoch": 930} {"train_loss": -9.649637222290039, "global_step": 156383, "epoch": 930} {"train_loss": -9.497090339660645, "global_step": 156384, "epoch": 930} {"train_loss": -9.217864990234375, "global_step": 156385, "epoch": 930} {"train_loss": -10.233017921447754, "global_step": 156386, "epoch": 930} {"train_loss": -9.504549980163574, "global_step": 156387, "epoch": 930} {"train_loss": -10.002155303955078, "global_step": 156388, "epoch": 930} {"train_loss": -9.898658752441406, "global_step": 156389, "epoch": 930} {"train_loss": -9.910350799560547, "global_step": 156390, "epoch": 930} {"train_loss": -10.233512878417969, "global_step": 156391, "epoch": 930} {"train_loss": -10.419576644897461, "global_step": 156392, "epoch": 930} {"train_loss": -9.929099082946777, "global_step": 156393, "epoch": 930} {"train_loss": -10.3673095703125, "global_step": 156394, "epoch": 930} {"train_loss": -10.075187683105469, "global_step": 156395, "epoch": 930} {"train_loss": -10.307848930358887, "global_step": 156396, "epoch": 930} {"train_loss": -10.291299819946289, "global_step": 156397, "epoch": 930} {"train_loss": -10.432904243469238, "global_step": 156398, "epoch": 930} {"train_loss": -10.043193817138672, "global_step": 156399, "epoch": 930} {"train_loss": -10.318326950073242, "global_step": 156400, "epoch": 930} {"train_loss": -10.3224458694458, "global_step": 156401, "epoch": 930} {"train_loss": -10.316144943237305, "global_step": 156402, "epoch": 930} {"train_loss": -10.58267879486084, "global_step": 156403, "epoch": 930} {"train_loss": -10.610677719116211, "global_step": 156404, "epoch": 930} {"train_loss": -10.473241806030273, "global_step": 156405, "epoch": 930} {"train_loss": -10.541985511779785, "global_step": 156406, "epoch": 930} {"train_loss": -10.5324809721538, "global_step": 156407, "epoch": 930, "val_loss": 231864.96875, "train_action_mse_error": 2.654449701309204} {"train_loss": -10.561843872070312, "global_step": 156408, "epoch": 931} {"train_loss": -10.56747817993164, "global_step": 156409, "epoch": 931} {"train_loss": -10.64508056640625, "global_step": 156410, "epoch": 931} {"train_loss": -10.545778274536133, "global_step": 156411, "epoch": 931} {"train_loss": -10.885293960571289, "global_step": 156412, "epoch": 931} {"train_loss": -10.625852584838867, "global_step": 156413, "epoch": 931} {"train_loss": -10.546607971191406, "global_step": 156414, "epoch": 931} {"train_loss": -10.686788558959961, "global_step": 156415, "epoch": 931} {"train_loss": -10.753646850585938, "global_step": 156416, "epoch": 931} {"train_loss": -10.85135269165039, "global_step": 156417, "epoch": 931} {"train_loss": -10.995381355285645, "global_step": 156418, "epoch": 931} {"train_loss": -10.846677780151367, "global_step": 156419, "epoch": 931} {"train_loss": -10.955028533935547, "global_step": 156420, "epoch": 931} {"train_loss": -11.051067352294922, "global_step": 156421, "epoch": 931} {"train_loss": -10.801664352416992, "global_step": 156422, "epoch": 931} {"train_loss": -11.038410186767578, "global_step": 156423, "epoch": 931} {"train_loss": -11.00335693359375, "global_step": 156424, "epoch": 931} {"train_loss": -10.919841766357422, "global_step": 156425, "epoch": 931} {"train_loss": -10.98251724243164, "global_step": 156426, "epoch": 931} {"train_loss": -10.797025680541992, "global_step": 156427, "epoch": 931} {"train_loss": -11.030303955078125, "global_step": 156428, "epoch": 931} {"train_loss": -11.021207809448242, "global_step": 156429, "epoch": 931} {"train_loss": -10.949596405029297, "global_step": 156430, "epoch": 931} {"train_loss": -11.098922729492188, "global_step": 156431, "epoch": 931} {"train_loss": -10.932830810546875, "global_step": 156432, "epoch": 931} {"train_loss": -11.179056167602539, "global_step": 156433, "epoch": 931} {"train_loss": -11.088826179504395, "global_step": 156434, "epoch": 931} {"train_loss": -10.993016242980957, "global_step": 156435, "epoch": 931} {"train_loss": -11.027982711791992, "global_step": 156436, "epoch": 931} {"train_loss": -11.136076927185059, "global_step": 156437, "epoch": 931} {"train_loss": -10.938394546508789, "global_step": 156438, "epoch": 931} {"train_loss": -10.909448623657227, "global_step": 156439, "epoch": 931} {"train_loss": -10.988969802856445, "global_step": 156440, "epoch": 931} {"train_loss": -10.61172866821289, "global_step": 156441, "epoch": 931} {"train_loss": -11.288477897644043, "global_step": 156442, "epoch": 931} {"train_loss": -10.734920501708984, "global_step": 156443, "epoch": 931} {"train_loss": -10.93239974975586, "global_step": 156444, "epoch": 931} {"train_loss": -10.978731155395508, "global_step": 156445, "epoch": 931} {"train_loss": -11.146169662475586, "global_step": 156446, "epoch": 931} {"train_loss": -10.813663482666016, "global_step": 156447, "epoch": 931} {"train_loss": -11.11154556274414, "global_step": 156448, "epoch": 931} {"train_loss": -11.092042922973633, "global_step": 156449, "epoch": 931} {"train_loss": -10.865787506103516, "global_step": 156450, "epoch": 931} {"train_loss": -11.193639755249023, "global_step": 156451, "epoch": 931} {"train_loss": -11.253740310668945, "global_step": 156452, "epoch": 931} {"train_loss": -10.963113784790039, "global_step": 156453, "epoch": 931} {"train_loss": -10.969593048095703, "global_step": 156454, "epoch": 931} {"train_loss": -10.710023880004883, "global_step": 156455, "epoch": 931} {"train_loss": -11.12554931640625, "global_step": 156456, "epoch": 931} {"train_loss": -10.423168182373047, "global_step": 156457, "epoch": 931} {"train_loss": -10.847415924072266, "global_step": 156458, "epoch": 931} {"train_loss": -10.791729927062988, "global_step": 156459, "epoch": 931} {"train_loss": -9.935029029846191, "global_step": 156460, "epoch": 931} {"train_loss": -10.918428421020508, "global_step": 156461, "epoch": 931} {"train_loss": -9.690849304199219, "global_step": 156462, "epoch": 931} {"train_loss": -9.890491485595703, "global_step": 156463, "epoch": 931} {"train_loss": -10.662029266357422, "global_step": 156464, "epoch": 931} {"train_loss": -10.339771270751953, "global_step": 156465, "epoch": 931} {"train_loss": -9.885307312011719, "global_step": 156466, "epoch": 931} {"train_loss": -9.780757904052734, "global_step": 156467, "epoch": 931} {"train_loss": -9.455583572387695, "global_step": 156468, "epoch": 931} {"train_loss": -9.6044921875, "global_step": 156469, "epoch": 931} {"train_loss": -9.40798282623291, "global_step": 156470, "epoch": 931} {"train_loss": -9.491395950317383, "global_step": 156471, "epoch": 931} {"train_loss": -9.6556978225708, "global_step": 156472, "epoch": 931} {"train_loss": -9.766387939453125, "global_step": 156473, "epoch": 931} {"train_loss": -9.625720977783203, "global_step": 156474, "epoch": 931} {"train_loss": -10.258544921875, "global_step": 156475, "epoch": 931} {"train_loss": -9.905155181884766, "global_step": 156476, "epoch": 931} {"train_loss": -10.186275482177734, "global_step": 156477, "epoch": 931} {"train_loss": -10.093093872070312, "global_step": 156478, "epoch": 931} {"train_loss": -10.342297554016113, "global_step": 156479, "epoch": 931} {"train_loss": -10.352588653564453, "global_step": 156480, "epoch": 931} {"train_loss": -9.821434020996094, "global_step": 156481, "epoch": 931} {"train_loss": -10.194843292236328, "global_step": 156482, "epoch": 931} {"train_loss": -9.972516059875488, "global_step": 156483, "epoch": 931} {"train_loss": -10.253324508666992, "global_step": 156484, "epoch": 931} {"train_loss": -10.148719787597656, "global_step": 156485, "epoch": 931} {"train_loss": -10.304213523864746, "global_step": 156486, "epoch": 931} {"train_loss": -10.533613204956055, "global_step": 156487, "epoch": 931} {"train_loss": -10.652518272399902, "global_step": 156488, "epoch": 931} {"train_loss": -10.549795150756836, "global_step": 156489, "epoch": 931} {"train_loss": -10.721667289733887, "global_step": 156490, "epoch": 931} {"train_loss": -10.544200897216797, "global_step": 156491, "epoch": 931} {"train_loss": -10.724359512329102, "global_step": 156492, "epoch": 931} {"train_loss": -10.712516784667969, "global_step": 156493, "epoch": 931} {"train_loss": -10.806136131286621, "global_step": 156494, "epoch": 931} {"train_loss": -10.855033874511719, "global_step": 156495, "epoch": 931} {"train_loss": -10.699050903320312, "global_step": 156496, "epoch": 931} {"train_loss": -10.632291793823242, "global_step": 156497, "epoch": 931} {"train_loss": -10.621496200561523, "global_step": 156498, "epoch": 931} {"train_loss": -10.775426864624023, "global_step": 156499, "epoch": 931} {"train_loss": -10.925639152526855, "global_step": 156500, "epoch": 931} {"train_loss": -10.796709060668945, "global_step": 156501, "epoch": 931} {"train_loss": -10.806819915771484, "global_step": 156502, "epoch": 931} {"train_loss": -10.787637710571289, "global_step": 156503, "epoch": 931} {"train_loss": -11.035659790039062, "global_step": 156504, "epoch": 931} {"train_loss": -10.912613868713379, "global_step": 156505, "epoch": 931} {"train_loss": -10.890325546264648, "global_step": 156506, "epoch": 931} {"train_loss": -11.052660942077637, "global_step": 156507, "epoch": 931} {"train_loss": -10.857141494750977, "global_step": 156508, "epoch": 931} {"train_loss": -10.960752487182617, "global_step": 156509, "epoch": 931} {"train_loss": -11.1122465133667, "global_step": 156510, "epoch": 931} {"train_loss": -11.170188903808594, "global_step": 156511, "epoch": 931} {"train_loss": -11.064793586730957, "global_step": 156512, "epoch": 931} {"train_loss": -10.74412727355957, "global_step": 156513, "epoch": 931} {"train_loss": -10.922577857971191, "global_step": 156514, "epoch": 931} {"train_loss": -11.014156341552734, "global_step": 156515, "epoch": 931} {"train_loss": -11.00758171081543, "global_step": 156516, "epoch": 931} {"train_loss": -11.086038589477539, "global_step": 156517, "epoch": 931} {"train_loss": -10.840435028076172, "global_step": 156518, "epoch": 931} {"train_loss": -11.175174713134766, "global_step": 156519, "epoch": 931} {"train_loss": -11.020915985107422, "global_step": 156520, "epoch": 931} {"train_loss": -11.022734642028809, "global_step": 156521, "epoch": 931} {"train_loss": -11.070120811462402, "global_step": 156522, "epoch": 931} {"train_loss": -11.052775382995605, "global_step": 156523, "epoch": 931} {"train_loss": -10.517114639282227, "global_step": 156524, "epoch": 931} {"train_loss": -10.538299560546875, "global_step": 156525, "epoch": 931} {"train_loss": -10.957117080688477, "global_step": 156526, "epoch": 931} {"train_loss": -11.217353820800781, "global_step": 156527, "epoch": 931} {"train_loss": -10.797700881958008, "global_step": 156528, "epoch": 931} {"train_loss": -11.11706829071045, "global_step": 156529, "epoch": 931} {"train_loss": -10.912389755249023, "global_step": 156530, "epoch": 931} {"train_loss": -11.014948844909668, "global_step": 156531, "epoch": 931} {"train_loss": -11.194616317749023, "global_step": 156532, "epoch": 931} {"train_loss": -10.619678497314453, "global_step": 156533, "epoch": 931} {"train_loss": -10.392388343811035, "global_step": 156534, "epoch": 931} {"train_loss": -10.331992149353027, "global_step": 156535, "epoch": 931} {"train_loss": -11.13306999206543, "global_step": 156536, "epoch": 931} {"train_loss": -11.029753684997559, "global_step": 156537, "epoch": 931} {"train_loss": -10.52581787109375, "global_step": 156538, "epoch": 931} {"train_loss": -10.764582633972168, "global_step": 156539, "epoch": 931} {"train_loss": -10.661650657653809, "global_step": 156540, "epoch": 931} {"train_loss": -11.218761444091797, "global_step": 156541, "epoch": 931} {"train_loss": -11.035852432250977, "global_step": 156542, "epoch": 931} {"train_loss": -10.927377700805664, "global_step": 156543, "epoch": 931} {"train_loss": -10.866305351257324, "global_step": 156544, "epoch": 931} {"train_loss": -10.714159965515137, "global_step": 156545, "epoch": 931} {"train_loss": -11.168712615966797, "global_step": 156546, "epoch": 931} {"train_loss": -10.916054725646973, "global_step": 156547, "epoch": 931} {"train_loss": -11.056779861450195, "global_step": 156548, "epoch": 931} {"train_loss": -10.989866256713867, "global_step": 156549, "epoch": 931} {"train_loss": -10.503734588623047, "global_step": 156550, "epoch": 931} {"train_loss": -10.865428924560547, "global_step": 156551, "epoch": 931} {"train_loss": -11.085358619689941, "global_step": 156552, "epoch": 931} {"train_loss": -10.690558433532715, "global_step": 156553, "epoch": 931} {"train_loss": -10.871957778930664, "global_step": 156554, "epoch": 931} {"train_loss": -10.927499771118164, "global_step": 156555, "epoch": 931} {"train_loss": -10.617975234985352, "global_step": 156556, "epoch": 931} {"train_loss": -10.714024543762207, "global_step": 156557, "epoch": 931} {"train_loss": -10.922662734985352, "global_step": 156558, "epoch": 931} {"train_loss": -10.999032020568848, "global_step": 156559, "epoch": 931} {"train_loss": -10.682670593261719, "global_step": 156560, "epoch": 931} {"train_loss": -10.458850860595703, "global_step": 156561, "epoch": 931} {"train_loss": -10.37936019897461, "global_step": 156562, "epoch": 931} {"train_loss": -9.219486236572266, "global_step": 156563, "epoch": 931} {"train_loss": -10.581560134887695, "global_step": 156564, "epoch": 931} {"train_loss": -9.929210662841797, "global_step": 156565, "epoch": 931} {"train_loss": -8.968291282653809, "global_step": 156566, "epoch": 931} {"train_loss": -9.48265552520752, "global_step": 156567, "epoch": 931} {"train_loss": -9.132182121276855, "global_step": 156568, "epoch": 931} {"train_loss": -9.967676162719727, "global_step": 156569, "epoch": 931} {"train_loss": -9.335620880126953, "global_step": 156570, "epoch": 931} {"train_loss": -9.54054069519043, "global_step": 156571, "epoch": 931} {"train_loss": -8.578052520751953, "global_step": 156572, "epoch": 931} {"train_loss": -7.816983222961426, "global_step": 156573, "epoch": 931} {"train_loss": -9.149309158325195, "global_step": 156574, "epoch": 931} {"train_loss": -10.610929869470143, "global_step": 156575, "epoch": 931, "val_loss": 228142.953125} {"train_loss": -9.711796760559082, "global_step": 156576, "epoch": 932} {"train_loss": -9.439617156982422, "global_step": 156577, "epoch": 932} {"train_loss": -8.701090812683105, "global_step": 156578, "epoch": 932} {"train_loss": -9.886563301086426, "global_step": 156579, "epoch": 932} {"train_loss": -9.93825626373291, "global_step": 156580, "epoch": 932} {"train_loss": -8.67023754119873, "global_step": 156581, "epoch": 932} {"train_loss": -9.666644096374512, "global_step": 156582, "epoch": 932} {"train_loss": -9.662952423095703, "global_step": 156583, "epoch": 932} {"train_loss": -10.292547225952148, "global_step": 156584, "epoch": 932} {"train_loss": -9.639236450195312, "global_step": 156585, "epoch": 932} {"train_loss": -9.71603775024414, "global_step": 156586, "epoch": 932} {"train_loss": -10.387712478637695, "global_step": 156587, "epoch": 932} {"train_loss": -9.973358154296875, "global_step": 156588, "epoch": 932} {"train_loss": -9.992412567138672, "global_step": 156589, "epoch": 932} {"train_loss": -10.467968940734863, "global_step": 156590, "epoch": 932} {"train_loss": -10.407123565673828, "global_step": 156591, "epoch": 932} {"train_loss": -10.217738151550293, "global_step": 156592, "epoch": 932} {"train_loss": -9.976217269897461, "global_step": 156593, "epoch": 932} {"train_loss": -10.438194274902344, "global_step": 156594, "epoch": 932} {"train_loss": -10.470722198486328, "global_step": 156595, "epoch": 932} {"train_loss": -10.351086616516113, "global_step": 156596, "epoch": 932} {"train_loss": -10.432840347290039, "global_step": 156597, "epoch": 932} {"train_loss": -10.547521591186523, "global_step": 156598, "epoch": 932} {"train_loss": -10.582197189331055, "global_step": 156599, "epoch": 932} {"train_loss": -10.512123107910156, "global_step": 156600, "epoch": 932} {"train_loss": -10.31447982788086, "global_step": 156601, "epoch": 932} {"train_loss": -10.544205665588379, "global_step": 156602, "epoch": 932} {"train_loss": -10.842344284057617, "global_step": 156603, "epoch": 932} {"train_loss": -10.480964660644531, "global_step": 156604, "epoch": 932} {"train_loss": -10.657079696655273, "global_step": 156605, "epoch": 932} {"train_loss": -10.623645782470703, "global_step": 156606, "epoch": 932} {"train_loss": -10.70324993133545, "global_step": 156607, "epoch": 932} {"train_loss": -10.496194839477539, "global_step": 156608, "epoch": 932} {"train_loss": -10.644453048706055, "global_step": 156609, "epoch": 932} {"train_loss": -10.82625961303711, "global_step": 156610, "epoch": 932} {"train_loss": -10.837794303894043, "global_step": 156611, "epoch": 932} {"train_loss": -10.71224594116211, "global_step": 156612, "epoch": 932} {"train_loss": -10.748625755310059, "global_step": 156613, "epoch": 932} {"train_loss": -10.68054485321045, "global_step": 156614, "epoch": 932} {"train_loss": -10.919912338256836, "global_step": 156615, "epoch": 932} {"train_loss": -10.82364273071289, "global_step": 156616, "epoch": 932} {"train_loss": -10.96723461151123, "global_step": 156617, "epoch": 932} {"train_loss": -10.804853439331055, "global_step": 156618, "epoch": 932} {"train_loss": -10.901688575744629, "global_step": 156619, "epoch": 932} {"train_loss": -10.985841751098633, "global_step": 156620, "epoch": 932} {"train_loss": -10.85013198852539, "global_step": 156621, "epoch": 932} {"train_loss": -11.08022689819336, "global_step": 156622, "epoch": 932} {"train_loss": -11.075971603393555, "global_step": 156623, "epoch": 932} {"train_loss": -10.9684419631958, "global_step": 156624, "epoch": 932} {"train_loss": -10.954706192016602, "global_step": 156625, "epoch": 932} {"train_loss": -10.905786514282227, "global_step": 156626, "epoch": 932} {"train_loss": -11.08541202545166, "global_step": 156627, "epoch": 932} {"train_loss": -10.961884498596191, "global_step": 156628, "epoch": 932} {"train_loss": -11.148771286010742, "global_step": 156629, "epoch": 932} {"train_loss": -10.983098030090332, "global_step": 156630, "epoch": 932} {"train_loss": -11.142170906066895, "global_step": 156631, "epoch": 932} {"train_loss": -11.053038597106934, "global_step": 156632, "epoch": 932} {"train_loss": -10.747598648071289, "global_step": 156633, "epoch": 932} {"train_loss": -10.726479530334473, "global_step": 156634, "epoch": 932} {"train_loss": -10.950376510620117, "global_step": 156635, "epoch": 932} {"train_loss": -10.896434783935547, "global_step": 156636, "epoch": 932} {"train_loss": -10.254098892211914, "global_step": 156637, "epoch": 932} {"train_loss": -10.825885772705078, "global_step": 156638, "epoch": 932} {"train_loss": -10.999217987060547, "global_step": 156639, "epoch": 932} {"train_loss": -10.799935340881348, "global_step": 156640, "epoch": 932} {"train_loss": -11.137138366699219, "global_step": 156641, "epoch": 932} {"train_loss": -10.883302688598633, "global_step": 156642, "epoch": 932} {"train_loss": -10.913352966308594, "global_step": 156643, "epoch": 932} {"train_loss": -10.79609203338623, "global_step": 156644, "epoch": 932} {"train_loss": -11.107696533203125, "global_step": 156645, "epoch": 932} {"train_loss": -10.948724746704102, "global_step": 156646, "epoch": 932} {"train_loss": -10.432087898254395, "global_step": 156647, "epoch": 932} {"train_loss": -10.473403930664062, "global_step": 156648, "epoch": 932} {"train_loss": -10.74236011505127, "global_step": 156649, "epoch": 932} {"train_loss": -10.443565368652344, "global_step": 156650, "epoch": 932} {"train_loss": -10.3474702835083, "global_step": 156651, "epoch": 932} {"train_loss": -10.99487590789795, "global_step": 156652, "epoch": 932} {"train_loss": -10.763433456420898, "global_step": 156653, "epoch": 932} {"train_loss": -10.832036972045898, "global_step": 156654, "epoch": 932} {"train_loss": -10.672195434570312, "global_step": 156655, "epoch": 932} {"train_loss": -10.038379669189453, "global_step": 156656, "epoch": 932} {"train_loss": -10.62450885772705, "global_step": 156657, "epoch": 932} {"train_loss": -11.094675064086914, "global_step": 156658, "epoch": 932} {"train_loss": -11.002771377563477, "global_step": 156659, "epoch": 932} {"train_loss": -10.971298217773438, "global_step": 156660, "epoch": 932} {"train_loss": -10.982074737548828, "global_step": 156661, "epoch": 932} {"train_loss": -10.86426830291748, "global_step": 156662, "epoch": 932} {"train_loss": -11.095441818237305, "global_step": 156663, "epoch": 932} {"train_loss": -10.624421119689941, "global_step": 156664, "epoch": 932} {"train_loss": -10.828325271606445, "global_step": 156665, "epoch": 932} {"train_loss": -10.887431144714355, "global_step": 156666, "epoch": 932} {"train_loss": -11.179194450378418, "global_step": 156667, "epoch": 932} {"train_loss": -10.803693771362305, "global_step": 156668, "epoch": 932} {"train_loss": -10.763898849487305, "global_step": 156669, "epoch": 932} {"train_loss": -11.120779037475586, "global_step": 156670, "epoch": 932} {"train_loss": -10.794069290161133, "global_step": 156671, "epoch": 932} {"train_loss": -10.849437713623047, "global_step": 156672, "epoch": 932} {"train_loss": -10.913485527038574, "global_step": 156673, "epoch": 932} {"train_loss": -10.846302032470703, "global_step": 156674, "epoch": 932} {"train_loss": -10.860336303710938, "global_step": 156675, "epoch": 932} {"train_loss": -10.57477855682373, "global_step": 156676, "epoch": 932} {"train_loss": -10.706340789794922, "global_step": 156677, "epoch": 932} {"train_loss": -11.057323455810547, "global_step": 156678, "epoch": 932} {"train_loss": -10.340051651000977, "global_step": 156679, "epoch": 932} {"train_loss": -10.954934120178223, "global_step": 156680, "epoch": 932} {"train_loss": -10.525277137756348, "global_step": 156681, "epoch": 932} {"train_loss": -10.768333435058594, "global_step": 156682, "epoch": 932} {"train_loss": -10.40285873413086, "global_step": 156683, "epoch": 932} {"train_loss": -11.020228385925293, "global_step": 156684, "epoch": 932} {"train_loss": -10.712774276733398, "global_step": 156685, "epoch": 932} {"train_loss": -10.733675003051758, "global_step": 156686, "epoch": 932} {"train_loss": -10.895809173583984, "global_step": 156687, "epoch": 932} {"train_loss": -10.5433349609375, "global_step": 156688, "epoch": 932} {"train_loss": -10.634795188903809, "global_step": 156689, "epoch": 932} {"train_loss": -10.519987106323242, "global_step": 156690, "epoch": 932} {"train_loss": -11.012229919433594, "global_step": 156691, "epoch": 932} {"train_loss": -10.746265411376953, "global_step": 156692, "epoch": 932} {"train_loss": -10.780832290649414, "global_step": 156693, "epoch": 932} {"train_loss": -10.609421730041504, "global_step": 156694, "epoch": 932} {"train_loss": -10.851780891418457, "global_step": 156695, "epoch": 932} {"train_loss": -10.924741744995117, "global_step": 156696, "epoch": 932} {"train_loss": -10.598047256469727, "global_step": 156697, "epoch": 932} {"train_loss": -11.105865478515625, "global_step": 156698, "epoch": 932} {"train_loss": -10.35578727722168, "global_step": 156699, "epoch": 932} {"train_loss": -10.953176498413086, "global_step": 156700, "epoch": 932} {"train_loss": -10.385904312133789, "global_step": 156701, "epoch": 932} {"train_loss": -10.972026824951172, "global_step": 156702, "epoch": 932} {"train_loss": -11.02632999420166, "global_step": 156703, "epoch": 932} {"train_loss": -10.811349868774414, "global_step": 156704, "epoch": 932} {"train_loss": -11.027885437011719, "global_step": 156705, "epoch": 932} {"train_loss": -10.629890441894531, "global_step": 156706, "epoch": 932} {"train_loss": -10.965354919433594, "global_step": 156707, "epoch": 932} {"train_loss": -10.202723503112793, "global_step": 156708, "epoch": 932} {"train_loss": -10.738381385803223, "global_step": 156709, "epoch": 932} {"train_loss": -9.7357177734375, "global_step": 156710, "epoch": 932} {"train_loss": -10.420259475708008, "global_step": 156711, "epoch": 932} {"train_loss": -10.213069915771484, "global_step": 156712, "epoch": 932} {"train_loss": -10.279143333435059, "global_step": 156713, "epoch": 932} {"train_loss": -9.792383193969727, "global_step": 156714, "epoch": 932} {"train_loss": -9.886743545532227, "global_step": 156715, "epoch": 932} {"train_loss": -8.960949897766113, "global_step": 156716, "epoch": 932} {"train_loss": -10.311649322509766, "global_step": 156717, "epoch": 932} {"train_loss": -9.387866020202637, "global_step": 156718, "epoch": 932} {"train_loss": -10.448878288269043, "global_step": 156719, "epoch": 932} {"train_loss": -9.926610946655273, "global_step": 156720, "epoch": 932} {"train_loss": -10.342560768127441, "global_step": 156721, "epoch": 932} {"train_loss": -10.000686645507812, "global_step": 156722, "epoch": 932} {"train_loss": -10.628217697143555, "global_step": 156723, "epoch": 932} {"train_loss": -10.01038932800293, "global_step": 156724, "epoch": 932} {"train_loss": -10.657476425170898, "global_step": 156725, "epoch": 932} {"train_loss": -10.291040420532227, "global_step": 156726, "epoch": 932} {"train_loss": -10.7703218460083, "global_step": 156727, "epoch": 932} {"train_loss": -10.597026824951172, "global_step": 156728, "epoch": 932} {"train_loss": -10.52685546875, "global_step": 156729, "epoch": 932} {"train_loss": -10.597062110900879, "global_step": 156730, "epoch": 932} {"train_loss": -10.352763175964355, "global_step": 156731, "epoch": 932} {"train_loss": -10.706077575683594, "global_step": 156732, "epoch": 932} {"train_loss": -10.725309371948242, "global_step": 156733, "epoch": 932} {"train_loss": -10.675983428955078, "global_step": 156734, "epoch": 932} {"train_loss": -10.797374725341797, "global_step": 156735, "epoch": 932} {"train_loss": -10.590723037719727, "global_step": 156736, "epoch": 932} {"train_loss": -10.529229164123535, "global_step": 156737, "epoch": 932} {"train_loss": -10.761905670166016, "global_step": 156738, "epoch": 932} {"train_loss": -10.885128021240234, "global_step": 156739, "epoch": 932} {"train_loss": -10.837297439575195, "global_step": 156740, "epoch": 932} {"train_loss": -10.734484672546387, "global_step": 156741, "epoch": 932} {"train_loss": -10.792267799377441, "global_step": 156742, "epoch": 932} {"train_loss": -10.593449439321246, "global_step": 156743, "epoch": 932, "val_loss": 234874.125} {"train_loss": -10.860910415649414, "global_step": 156744, "epoch": 933} {"train_loss": -11.127452850341797, "global_step": 156745, "epoch": 933} {"train_loss": -10.9424409866333, "global_step": 156746, "epoch": 933} {"train_loss": -10.681989669799805, "global_step": 156747, "epoch": 933} {"train_loss": -10.978212356567383, "global_step": 156748, "epoch": 933} {"train_loss": -10.989361763000488, "global_step": 156749, "epoch": 933} {"train_loss": -10.779234886169434, "global_step": 156750, "epoch": 933} {"train_loss": -10.87085247039795, "global_step": 156751, "epoch": 933} {"train_loss": -11.028534889221191, "global_step": 156752, "epoch": 933} {"train_loss": -10.965553283691406, "global_step": 156753, "epoch": 933} {"train_loss": -10.981512069702148, "global_step": 156754, "epoch": 933} {"train_loss": -10.863823890686035, "global_step": 156755, "epoch": 933} {"train_loss": -10.881568908691406, "global_step": 156756, "epoch": 933} {"train_loss": -11.100227355957031, "global_step": 156757, "epoch": 933} {"train_loss": -10.953641891479492, "global_step": 156758, "epoch": 933} {"train_loss": -11.03989028930664, "global_step": 156759, "epoch": 933} {"train_loss": -11.298870086669922, "global_step": 156760, "epoch": 933} {"train_loss": -11.150634765625, "global_step": 156761, "epoch": 933} {"train_loss": -11.153308868408203, "global_step": 156762, "epoch": 933} {"train_loss": -11.169524192810059, "global_step": 156763, "epoch": 933} {"train_loss": -11.152791976928711, "global_step": 156764, "epoch": 933} {"train_loss": -10.994630813598633, "global_step": 156765, "epoch": 933} {"train_loss": -10.966373443603516, "global_step": 156766, "epoch": 933} {"train_loss": -11.092628479003906, "global_step": 156767, "epoch": 933} {"train_loss": -11.022710800170898, "global_step": 156768, "epoch": 933} {"train_loss": -11.040225982666016, "global_step": 156769, "epoch": 933} {"train_loss": -10.919370651245117, "global_step": 156770, "epoch": 933} {"train_loss": -11.002565383911133, "global_step": 156771, "epoch": 933} {"train_loss": -11.189424514770508, "global_step": 156772, "epoch": 933} {"train_loss": -10.969257354736328, "global_step": 156773, "epoch": 933} {"train_loss": -10.907529830932617, "global_step": 156774, "epoch": 933} {"train_loss": -10.527369499206543, "global_step": 156775, "epoch": 933} {"train_loss": -10.828325271606445, "global_step": 156776, "epoch": 933} {"train_loss": -10.63778305053711, "global_step": 156777, "epoch": 933} {"train_loss": -10.460614204406738, "global_step": 156778, "epoch": 933} {"train_loss": -10.983110427856445, "global_step": 156779, "epoch": 933} {"train_loss": -10.721908569335938, "global_step": 156780, "epoch": 933} {"train_loss": -10.538999557495117, "global_step": 156781, "epoch": 933} {"train_loss": -10.581006050109863, "global_step": 156782, "epoch": 933} {"train_loss": -10.784022331237793, "global_step": 156783, "epoch": 933} {"train_loss": -9.958426475524902, "global_step": 156784, "epoch": 933} {"train_loss": -10.880020141601562, "global_step": 156785, "epoch": 933} {"train_loss": -9.796092987060547, "global_step": 156786, "epoch": 933} {"train_loss": -9.910513877868652, "global_step": 156787, "epoch": 933} {"train_loss": -10.195446014404297, "global_step": 156788, "epoch": 933} {"train_loss": -10.63528823852539, "global_step": 156789, "epoch": 933} {"train_loss": -8.830608367919922, "global_step": 156790, "epoch": 933} {"train_loss": -9.893543243408203, "global_step": 156791, "epoch": 933} {"train_loss": -9.827322006225586, "global_step": 156792, "epoch": 933} {"train_loss": -10.522985458374023, "global_step": 156793, "epoch": 933} {"train_loss": -10.490779876708984, "global_step": 156794, "epoch": 933} {"train_loss": -10.219505310058594, "global_step": 156795, "epoch": 933} {"train_loss": -10.496124267578125, "global_step": 156796, "epoch": 933} {"train_loss": -10.700479507446289, "global_step": 156797, "epoch": 933} {"train_loss": -10.673067092895508, "global_step": 156798, "epoch": 933} {"train_loss": -10.912811279296875, "global_step": 156799, "epoch": 933} {"train_loss": -10.609490394592285, "global_step": 156800, "epoch": 933} {"train_loss": -10.84327220916748, "global_step": 156801, "epoch": 933} {"train_loss": -10.915058135986328, "global_step": 156802, "epoch": 933} {"train_loss": -10.633931159973145, "global_step": 156803, "epoch": 933} {"train_loss": -10.887054443359375, "global_step": 156804, "epoch": 933} {"train_loss": -10.620943069458008, "global_step": 156805, "epoch": 933} {"train_loss": -10.840689659118652, "global_step": 156806, "epoch": 933} {"train_loss": -10.646595001220703, "global_step": 156807, "epoch": 933} {"train_loss": -10.938538551330566, "global_step": 156808, "epoch": 933} {"train_loss": -10.859618186950684, "global_step": 156809, "epoch": 933} {"train_loss": -10.816125869750977, "global_step": 156810, "epoch": 933} {"train_loss": -10.779806137084961, "global_step": 156811, "epoch": 933} {"train_loss": -10.880294799804688, "global_step": 156812, "epoch": 933} {"train_loss": -11.080464363098145, "global_step": 156813, "epoch": 933} {"train_loss": -10.651613235473633, "global_step": 156814, "epoch": 933} {"train_loss": -11.11226749420166, "global_step": 156815, "epoch": 933} {"train_loss": -10.863431930541992, "global_step": 156816, "epoch": 933} {"train_loss": -11.036706924438477, "global_step": 156817, "epoch": 933} {"train_loss": -10.900125503540039, "global_step": 156818, "epoch": 933} {"train_loss": -10.887892723083496, "global_step": 156819, "epoch": 933} {"train_loss": -10.846420288085938, "global_step": 156820, "epoch": 933} {"train_loss": -10.903277397155762, "global_step": 156821, "epoch": 933} {"train_loss": -10.683021545410156, "global_step": 156822, "epoch": 933} {"train_loss": -10.849617004394531, "global_step": 156823, "epoch": 933} {"train_loss": -10.647104263305664, "global_step": 156824, "epoch": 933} {"train_loss": -11.038003921508789, "global_step": 156825, "epoch": 933} {"train_loss": -10.620590209960938, "global_step": 156826, "epoch": 933} {"train_loss": -10.661707878112793, "global_step": 156827, "epoch": 933} {"train_loss": -11.141788482666016, "global_step": 156828, "epoch": 933} {"train_loss": -10.982109069824219, "global_step": 156829, "epoch": 933} {"train_loss": -11.008989334106445, "global_step": 156830, "epoch": 933} {"train_loss": -10.83216381072998, "global_step": 156831, "epoch": 933} {"train_loss": -11.219573020935059, "global_step": 156832, "epoch": 933} {"train_loss": -10.640403747558594, "global_step": 156833, "epoch": 933} {"train_loss": -10.877521514892578, "global_step": 156834, "epoch": 933} {"train_loss": -10.94253921508789, "global_step": 156835, "epoch": 933} {"train_loss": -10.966869354248047, "global_step": 156836, "epoch": 933} {"train_loss": -10.923064231872559, "global_step": 156837, "epoch": 933} {"train_loss": -10.851999282836914, "global_step": 156838, "epoch": 933} {"train_loss": -10.928234100341797, "global_step": 156839, "epoch": 933} {"train_loss": -10.808865547180176, "global_step": 156840, "epoch": 933} {"train_loss": -11.031106948852539, "global_step": 156841, "epoch": 933} {"train_loss": -10.829560279846191, "global_step": 156842, "epoch": 933} {"train_loss": -11.112122535705566, "global_step": 156843, "epoch": 933} {"train_loss": -11.193653106689453, "global_step": 156844, "epoch": 933} {"train_loss": -10.855854034423828, "global_step": 156845, "epoch": 933} {"train_loss": -11.042612075805664, "global_step": 156846, "epoch": 933} {"train_loss": -10.808212280273438, "global_step": 156847, "epoch": 933} {"train_loss": -11.029081344604492, "global_step": 156848, "epoch": 933} {"train_loss": -11.06814193725586, "global_step": 156849, "epoch": 933} {"train_loss": -10.761201858520508, "global_step": 156850, "epoch": 933} {"train_loss": -10.62491226196289, "global_step": 156851, "epoch": 933} {"train_loss": -11.17082691192627, "global_step": 156852, "epoch": 933} {"train_loss": -10.752201080322266, "global_step": 156853, "epoch": 933} {"train_loss": -10.462783813476562, "global_step": 156854, "epoch": 933} {"train_loss": -11.083486557006836, "global_step": 156855, "epoch": 933} {"train_loss": -10.779864311218262, "global_step": 156856, "epoch": 933} {"train_loss": -11.195549011230469, "global_step": 156857, "epoch": 933} {"train_loss": -10.601058959960938, "global_step": 156858, "epoch": 933} {"train_loss": -10.743416786193848, "global_step": 156859, "epoch": 933} {"train_loss": -10.770532608032227, "global_step": 156860, "epoch": 933} {"train_loss": -10.810985565185547, "global_step": 156861, "epoch": 933} {"train_loss": -10.922040939331055, "global_step": 156862, "epoch": 933} {"train_loss": -10.799945831298828, "global_step": 156863, "epoch": 933} {"train_loss": -10.634024620056152, "global_step": 156864, "epoch": 933} {"train_loss": -10.93156623840332, "global_step": 156865, "epoch": 933} {"train_loss": -10.639348983764648, "global_step": 156866, "epoch": 933} {"train_loss": -10.894725799560547, "global_step": 156867, "epoch": 933} {"train_loss": -10.90591812133789, "global_step": 156868, "epoch": 933} {"train_loss": -10.719886779785156, "global_step": 156869, "epoch": 933} {"train_loss": -10.551485061645508, "global_step": 156870, "epoch": 933} {"train_loss": -10.913414001464844, "global_step": 156871, "epoch": 933} {"train_loss": -10.478473663330078, "global_step": 156872, "epoch": 933} {"train_loss": -10.794916152954102, "global_step": 156873, "epoch": 933} {"train_loss": -10.595624923706055, "global_step": 156874, "epoch": 933} {"train_loss": -10.672861099243164, "global_step": 156875, "epoch": 933} {"train_loss": -10.271455764770508, "global_step": 156876, "epoch": 933} {"train_loss": -10.368744850158691, "global_step": 156877, "epoch": 933} {"train_loss": -11.077975273132324, "global_step": 156878, "epoch": 933} {"train_loss": -10.078819274902344, "global_step": 156879, "epoch": 933} {"train_loss": -10.139168739318848, "global_step": 156880, "epoch": 933} {"train_loss": -10.59407901763916, "global_step": 156881, "epoch": 933} {"train_loss": -10.619718551635742, "global_step": 156882, "epoch": 933} {"train_loss": -9.96652603149414, "global_step": 156883, "epoch": 933} {"train_loss": -10.509757041931152, "global_step": 156884, "epoch": 933} {"train_loss": -10.715130805969238, "global_step": 156885, "epoch": 933} {"train_loss": -10.143135070800781, "global_step": 156886, "epoch": 933} {"train_loss": -10.810837745666504, "global_step": 156887, "epoch": 933} {"train_loss": -10.65351676940918, "global_step": 156888, "epoch": 933} {"train_loss": -10.623682022094727, "global_step": 156889, "epoch": 933} {"train_loss": -10.850910186767578, "global_step": 156890, "epoch": 933} {"train_loss": -10.558635711669922, "global_step": 156891, "epoch": 933} {"train_loss": -10.79772663116455, "global_step": 156892, "epoch": 933} {"train_loss": -10.736665725708008, "global_step": 156893, "epoch": 933} {"train_loss": -10.598651885986328, "global_step": 156894, "epoch": 933} {"train_loss": -10.965265274047852, "global_step": 156895, "epoch": 933} {"train_loss": -10.406864166259766, "global_step": 156896, "epoch": 933} {"train_loss": -11.004570007324219, "global_step": 156897, "epoch": 933} {"train_loss": -10.409984588623047, "global_step": 156898, "epoch": 933} {"train_loss": -10.986448287963867, "global_step": 156899, "epoch": 933} {"train_loss": -10.60617446899414, "global_step": 156900, "epoch": 933} {"train_loss": -10.985907554626465, "global_step": 156901, "epoch": 933} {"train_loss": -10.872060775756836, "global_step": 156902, "epoch": 933} {"train_loss": -10.91567611694336, "global_step": 156903, "epoch": 933} {"train_loss": -10.840616226196289, "global_step": 156904, "epoch": 933} {"train_loss": -11.114148139953613, "global_step": 156905, "epoch": 933} {"train_loss": -10.779560089111328, "global_step": 156906, "epoch": 933} {"train_loss": -11.1572265625, "global_step": 156907, "epoch": 933} {"train_loss": -10.891874313354492, "global_step": 156908, "epoch": 933} {"train_loss": -10.83271312713623, "global_step": 156909, "epoch": 933} {"train_loss": -10.867905616760254, "global_step": 156910, "epoch": 933} {"train_loss": -10.774165125120254, "global_step": 156911, "epoch": 933, "val_loss": 234675.75} {"train_loss": -10.969161987304688, "global_step": 156912, "epoch": 934} {"train_loss": -10.958358764648438, "global_step": 156913, "epoch": 934} {"train_loss": -11.019318580627441, "global_step": 156914, "epoch": 934} {"train_loss": -11.066295623779297, "global_step": 156915, "epoch": 934} {"train_loss": -11.185873031616211, "global_step": 156916, "epoch": 934} {"train_loss": -11.029932022094727, "global_step": 156917, "epoch": 934} {"train_loss": -11.151216506958008, "global_step": 156918, "epoch": 934} {"train_loss": -10.912849426269531, "global_step": 156919, "epoch": 934} {"train_loss": -11.127098083496094, "global_step": 156920, "epoch": 934} {"train_loss": -10.988237380981445, "global_step": 156921, "epoch": 934} {"train_loss": -11.19745922088623, "global_step": 156922, "epoch": 934} {"train_loss": -11.053970336914062, "global_step": 156923, "epoch": 934} {"train_loss": -10.998146057128906, "global_step": 156924, "epoch": 934} {"train_loss": -11.028091430664062, "global_step": 156925, "epoch": 934} {"train_loss": -11.047605514526367, "global_step": 156926, "epoch": 934} {"train_loss": -11.199102401733398, "global_step": 156927, "epoch": 934} {"train_loss": -11.172503471374512, "global_step": 156928, "epoch": 934} {"train_loss": -11.182881355285645, "global_step": 156929, "epoch": 934} {"train_loss": -10.99463176727295, "global_step": 156930, "epoch": 934} {"train_loss": -11.386075973510742, "global_step": 156931, "epoch": 934} {"train_loss": -10.790337562561035, "global_step": 156932, "epoch": 934} {"train_loss": -11.0526704788208, "global_step": 156933, "epoch": 934} {"train_loss": -10.921743392944336, "global_step": 156934, "epoch": 934} {"train_loss": -10.8851900100708, "global_step": 156935, "epoch": 934} {"train_loss": -10.86047649383545, "global_step": 156936, "epoch": 934} {"train_loss": -11.07255744934082, "global_step": 156937, "epoch": 934} {"train_loss": -10.90546703338623, "global_step": 156938, "epoch": 934} {"train_loss": -10.290145874023438, "global_step": 156939, "epoch": 934} {"train_loss": -10.659236907958984, "global_step": 156940, "epoch": 934} {"train_loss": -10.67623519897461, "global_step": 156941, "epoch": 934} {"train_loss": -10.768306732177734, "global_step": 156942, "epoch": 934} {"train_loss": -10.884543418884277, "global_step": 156943, "epoch": 934} {"train_loss": -10.362236022949219, "global_step": 156944, "epoch": 934} {"train_loss": -9.663103103637695, "global_step": 156945, "epoch": 934} {"train_loss": -10.56015396118164, "global_step": 156946, "epoch": 934} {"train_loss": -9.905017852783203, "global_step": 156947, "epoch": 934} {"train_loss": -9.588997840881348, "global_step": 156948, "epoch": 934} {"train_loss": -10.528508186340332, "global_step": 156949, "epoch": 934} {"train_loss": -10.372888565063477, "global_step": 156950, "epoch": 934} {"train_loss": -10.810108184814453, "global_step": 156951, "epoch": 934} {"train_loss": -10.623050689697266, "global_step": 156952, "epoch": 934} {"train_loss": -10.167531967163086, "global_step": 156953, "epoch": 934} {"train_loss": -10.222367286682129, "global_step": 156954, "epoch": 934} {"train_loss": -10.46298599243164, "global_step": 156955, "epoch": 934} {"train_loss": -10.099138259887695, "global_step": 156956, "epoch": 934} {"train_loss": -9.889490127563477, "global_step": 156957, "epoch": 934} {"train_loss": -9.646529197692871, "global_step": 156958, "epoch": 934} {"train_loss": -9.773324966430664, "global_step": 156959, "epoch": 934} {"train_loss": -10.605132102966309, "global_step": 156960, "epoch": 934} {"train_loss": -9.679176330566406, "global_step": 156961, "epoch": 934} {"train_loss": -10.677724838256836, "global_step": 156962, "epoch": 934} {"train_loss": -10.041462898254395, "global_step": 156963, "epoch": 934} {"train_loss": -10.3716402053833, "global_step": 156964, "epoch": 934} {"train_loss": -10.527471542358398, "global_step": 156965, "epoch": 934} {"train_loss": -10.676464080810547, "global_step": 156966, "epoch": 934} {"train_loss": -10.32546615600586, "global_step": 156967, "epoch": 934} {"train_loss": -10.730892181396484, "global_step": 156968, "epoch": 934} {"train_loss": -10.502660751342773, "global_step": 156969, "epoch": 934} {"train_loss": -10.705471992492676, "global_step": 156970, "epoch": 934} {"train_loss": -10.271657943725586, "global_step": 156971, "epoch": 934} {"train_loss": -10.347694396972656, "global_step": 156972, "epoch": 934} {"train_loss": -10.572013854980469, "global_step": 156973, "epoch": 934} {"train_loss": -10.51699447631836, "global_step": 156974, "epoch": 934} {"train_loss": -10.531351089477539, "global_step": 156975, "epoch": 934} {"train_loss": -11.038309097290039, "global_step": 156976, "epoch": 934} {"train_loss": -10.584771156311035, "global_step": 156977, "epoch": 934} {"train_loss": -10.40412425994873, "global_step": 156978, "epoch": 934} {"train_loss": -10.745147705078125, "global_step": 156979, "epoch": 934} {"train_loss": -10.555206298828125, "global_step": 156980, "epoch": 934} {"train_loss": -10.880549430847168, "global_step": 156981, "epoch": 934} {"train_loss": -10.866453170776367, "global_step": 156982, "epoch": 934} {"train_loss": -10.621528625488281, "global_step": 156983, "epoch": 934} {"train_loss": -10.981952667236328, "global_step": 156984, "epoch": 934} {"train_loss": -10.750700950622559, "global_step": 156985, "epoch": 934} {"train_loss": -10.789639472961426, "global_step": 156986, "epoch": 934} {"train_loss": -11.02170181274414, "global_step": 156987, "epoch": 934} {"train_loss": -10.891363143920898, "global_step": 156988, "epoch": 934} {"train_loss": -10.733453750610352, "global_step": 156989, "epoch": 934} {"train_loss": -10.941576957702637, "global_step": 156990, "epoch": 934} {"train_loss": -10.994304656982422, "global_step": 156991, "epoch": 934} {"train_loss": -10.695241928100586, "global_step": 156992, "epoch": 934} {"train_loss": -10.831537246704102, "global_step": 156993, "epoch": 934} {"train_loss": -10.903339385986328, "global_step": 156994, "epoch": 934} {"train_loss": -11.06826400756836, "global_step": 156995, "epoch": 934} {"train_loss": -11.015873908996582, "global_step": 156996, "epoch": 934} {"train_loss": -11.167147636413574, "global_step": 156997, "epoch": 934} {"train_loss": -10.861335754394531, "global_step": 156998, "epoch": 934} {"train_loss": -11.142457008361816, "global_step": 156999, "epoch": 934} {"train_loss": -10.896490097045898, "global_step": 157000, "epoch": 934} {"train_loss": -10.872234344482422, "global_step": 157001, "epoch": 934} {"train_loss": -11.19796371459961, "global_step": 157002, "epoch": 934} {"train_loss": -10.780158996582031, "global_step": 157003, "epoch": 934} {"train_loss": -11.093330383300781, "global_step": 157004, "epoch": 934} {"train_loss": -11.156000137329102, "global_step": 157005, "epoch": 934} {"train_loss": -10.841575622558594, "global_step": 157006, "epoch": 934} {"train_loss": -11.159748077392578, "global_step": 157007, "epoch": 934} {"train_loss": -11.029966354370117, "global_step": 157008, "epoch": 934} {"train_loss": -10.967262268066406, "global_step": 157009, "epoch": 934} {"train_loss": -10.860522270202637, "global_step": 157010, "epoch": 934} {"train_loss": -10.685726165771484, "global_step": 157011, "epoch": 934} {"train_loss": -10.44824504852295, "global_step": 157012, "epoch": 934} {"train_loss": -10.964003562927246, "global_step": 157013, "epoch": 934} {"train_loss": -10.718339920043945, "global_step": 157014, "epoch": 934} {"train_loss": -10.534019470214844, "global_step": 157015, "epoch": 934} {"train_loss": -10.660970687866211, "global_step": 157016, "epoch": 934} {"train_loss": -10.527106285095215, "global_step": 157017, "epoch": 934} {"train_loss": -10.93189811706543, "global_step": 157018, "epoch": 934} {"train_loss": -10.484899520874023, "global_step": 157019, "epoch": 934} {"train_loss": -10.957901954650879, "global_step": 157020, "epoch": 934} {"train_loss": -11.079255104064941, "global_step": 157021, "epoch": 934} {"train_loss": -11.027084350585938, "global_step": 157022, "epoch": 934} {"train_loss": -11.349440574645996, "global_step": 157023, "epoch": 934} {"train_loss": -10.977886199951172, "global_step": 157024, "epoch": 934} {"train_loss": -10.784664154052734, "global_step": 157025, "epoch": 934} {"train_loss": -11.183267593383789, "global_step": 157026, "epoch": 934} {"train_loss": -10.833338737487793, "global_step": 157027, "epoch": 934} {"train_loss": -11.288885116577148, "global_step": 157028, "epoch": 934} {"train_loss": -10.892645835876465, "global_step": 157029, "epoch": 934} {"train_loss": -10.908025741577148, "global_step": 157030, "epoch": 934} {"train_loss": -10.685428619384766, "global_step": 157031, "epoch": 934} {"train_loss": -10.90913200378418, "global_step": 157032, "epoch": 934} {"train_loss": -10.835329055786133, "global_step": 157033, "epoch": 934} {"train_loss": -11.336756706237793, "global_step": 157034, "epoch": 934} {"train_loss": -10.894617080688477, "global_step": 157035, "epoch": 934} {"train_loss": -10.888797760009766, "global_step": 157036, "epoch": 934} {"train_loss": -10.713241577148438, "global_step": 157037, "epoch": 934} {"train_loss": -11.100162506103516, "global_step": 157038, "epoch": 934} {"train_loss": -10.919878005981445, "global_step": 157039, "epoch": 934} {"train_loss": -10.818592071533203, "global_step": 157040, "epoch": 934} {"train_loss": -10.866077423095703, "global_step": 157041, "epoch": 934} {"train_loss": -10.927870750427246, "global_step": 157042, "epoch": 934} {"train_loss": -10.943270683288574, "global_step": 157043, "epoch": 934} {"train_loss": -11.124905586242676, "global_step": 157044, "epoch": 934} {"train_loss": -10.712392807006836, "global_step": 157045, "epoch": 934} {"train_loss": -10.785600662231445, "global_step": 157046, "epoch": 934} {"train_loss": -10.800399780273438, "global_step": 157047, "epoch": 934} {"train_loss": -10.568878173828125, "global_step": 157048, "epoch": 934} {"train_loss": -10.803075790405273, "global_step": 157049, "epoch": 934} {"train_loss": -10.564895629882812, "global_step": 157050, "epoch": 934} {"train_loss": -11.096885681152344, "global_step": 157051, "epoch": 934} {"train_loss": -10.646620750427246, "global_step": 157052, "epoch": 934} {"train_loss": -10.823158264160156, "global_step": 157053, "epoch": 934} {"train_loss": -10.799518585205078, "global_step": 157054, "epoch": 934} {"train_loss": -10.525955200195312, "global_step": 157055, "epoch": 934} {"train_loss": -10.914546966552734, "global_step": 157056, "epoch": 934} {"train_loss": -10.453688621520996, "global_step": 157057, "epoch": 934} {"train_loss": -11.006757736206055, "global_step": 157058, "epoch": 934} {"train_loss": -11.133077621459961, "global_step": 157059, "epoch": 934} {"train_loss": -10.944341659545898, "global_step": 157060, "epoch": 934} {"train_loss": -11.07887077331543, "global_step": 157061, "epoch": 934} {"train_loss": -11.073332786560059, "global_step": 157062, "epoch": 934} {"train_loss": -10.911362648010254, "global_step": 157063, "epoch": 934} {"train_loss": -11.057195663452148, "global_step": 157064, "epoch": 934} {"train_loss": -11.0526762008667, "global_step": 157065, "epoch": 934} {"train_loss": -11.083106994628906, "global_step": 157066, "epoch": 934} {"train_loss": -11.003630638122559, "global_step": 157067, "epoch": 934} {"train_loss": -10.961102485656738, "global_step": 157068, "epoch": 934} {"train_loss": -10.804922103881836, "global_step": 157069, "epoch": 934} {"train_loss": -10.777259826660156, "global_step": 157070, "epoch": 934} {"train_loss": -11.183431625366211, "global_step": 157071, "epoch": 934} {"train_loss": -11.003375053405762, "global_step": 157072, "epoch": 934} {"train_loss": -11.048867225646973, "global_step": 157073, "epoch": 934} {"train_loss": -11.06381607055664, "global_step": 157074, "epoch": 934} {"train_loss": -10.941213607788086, "global_step": 157075, "epoch": 934} {"train_loss": -10.902759552001953, "global_step": 157076, "epoch": 934} {"train_loss": -11.091711044311523, "global_step": 157077, "epoch": 934} {"train_loss": -10.968844413757324, "global_step": 157078, "epoch": 934} {"train_loss": -10.800442548025222, "global_step": 157079, "epoch": 934, "val_loss": 232849.296875} {"train_loss": -11.186054229736328, "global_step": 157080, "epoch": 935} {"train_loss": -10.909463882446289, "global_step": 157081, "epoch": 935} {"train_loss": -10.944628715515137, "global_step": 157082, "epoch": 935} {"train_loss": -11.100444793701172, "global_step": 157083, "epoch": 935} {"train_loss": -10.853789329528809, "global_step": 157084, "epoch": 935} {"train_loss": -10.78555679321289, "global_step": 157085, "epoch": 935} {"train_loss": -11.076221466064453, "global_step": 157086, "epoch": 935} {"train_loss": -11.117359161376953, "global_step": 157087, "epoch": 935} {"train_loss": -11.211231231689453, "global_step": 157088, "epoch": 935} {"train_loss": -11.13028335571289, "global_step": 157089, "epoch": 935} {"train_loss": -10.90904712677002, "global_step": 157090, "epoch": 935} {"train_loss": -10.886240005493164, "global_step": 157091, "epoch": 935} {"train_loss": -11.028450012207031, "global_step": 157092, "epoch": 935} {"train_loss": -10.67770004272461, "global_step": 157093, "epoch": 935} {"train_loss": -10.864925384521484, "global_step": 157094, "epoch": 935} {"train_loss": -11.021221160888672, "global_step": 157095, "epoch": 935} {"train_loss": -10.732398986816406, "global_step": 157096, "epoch": 935} {"train_loss": -10.60716724395752, "global_step": 157097, "epoch": 935} {"train_loss": -10.73147201538086, "global_step": 157098, "epoch": 935} {"train_loss": -10.075539588928223, "global_step": 157099, "epoch": 935} {"train_loss": -9.622894287109375, "global_step": 157100, "epoch": 935} {"train_loss": -10.711432456970215, "global_step": 157101, "epoch": 935} {"train_loss": -10.555925369262695, "global_step": 157102, "epoch": 935} {"train_loss": -9.890209197998047, "global_step": 157103, "epoch": 935} {"train_loss": -10.696643829345703, "global_step": 157104, "epoch": 935} {"train_loss": -10.476476669311523, "global_step": 157105, "epoch": 935} {"train_loss": -9.80693244934082, "global_step": 157106, "epoch": 935} {"train_loss": -10.762279510498047, "global_step": 157107, "epoch": 935} {"train_loss": -10.02895736694336, "global_step": 157108, "epoch": 935} {"train_loss": -9.755182266235352, "global_step": 157109, "epoch": 935} {"train_loss": -10.280085563659668, "global_step": 157110, "epoch": 935} {"train_loss": -9.518760681152344, "global_step": 157111, "epoch": 935} {"train_loss": -10.40770149230957, "global_step": 157112, "epoch": 935} {"train_loss": -10.422432899475098, "global_step": 157113, "epoch": 935} {"train_loss": -10.270953178405762, "global_step": 157114, "epoch": 935} {"train_loss": -10.242671966552734, "global_step": 157115, "epoch": 935} {"train_loss": -10.00088119506836, "global_step": 157116, "epoch": 935} {"train_loss": -10.66955280303955, "global_step": 157117, "epoch": 935} {"train_loss": -10.66530990600586, "global_step": 157118, "epoch": 935} {"train_loss": -10.74107551574707, "global_step": 157119, "epoch": 935} {"train_loss": -10.516464233398438, "global_step": 157120, "epoch": 935} {"train_loss": -10.842660903930664, "global_step": 157121, "epoch": 935} {"train_loss": -10.568599700927734, "global_step": 157122, "epoch": 935} {"train_loss": -10.847578048706055, "global_step": 157123, "epoch": 935} {"train_loss": -10.683204650878906, "global_step": 157124, "epoch": 935} {"train_loss": -10.314318656921387, "global_step": 157125, "epoch": 935} {"train_loss": -10.877944946289062, "global_step": 157126, "epoch": 935} {"train_loss": -10.333344459533691, "global_step": 157127, "epoch": 935} {"train_loss": -10.731045722961426, "global_step": 157128, "epoch": 935} {"train_loss": -10.54039478302002, "global_step": 157129, "epoch": 935} {"train_loss": -10.387699127197266, "global_step": 157130, "epoch": 935} {"train_loss": -10.56431770324707, "global_step": 157131, "epoch": 935} {"train_loss": -10.460378646850586, "global_step": 157132, "epoch": 935} {"train_loss": -10.54544448852539, "global_step": 157133, "epoch": 935} {"train_loss": -10.747759819030762, "global_step": 157134, "epoch": 935} {"train_loss": -10.578849792480469, "global_step": 157135, "epoch": 935} {"train_loss": -10.751008987426758, "global_step": 157136, "epoch": 935} {"train_loss": -10.829418182373047, "global_step": 157137, "epoch": 935} {"train_loss": -11.032403945922852, "global_step": 157138, "epoch": 935} {"train_loss": -10.63913631439209, "global_step": 157139, "epoch": 935} {"train_loss": -10.756948471069336, "global_step": 157140, "epoch": 935} {"train_loss": -10.84619140625, "global_step": 157141, "epoch": 935} {"train_loss": -11.00857162475586, "global_step": 157142, "epoch": 935} {"train_loss": -10.38545036315918, "global_step": 157143, "epoch": 935} {"train_loss": -10.938000679016113, "global_step": 157144, "epoch": 935} {"train_loss": -10.788731575012207, "global_step": 157145, "epoch": 935} {"train_loss": -10.593976020812988, "global_step": 157146, "epoch": 935} {"train_loss": -10.640222549438477, "global_step": 157147, "epoch": 935} {"train_loss": -10.908864974975586, "global_step": 157148, "epoch": 935} {"train_loss": -10.325098037719727, "global_step": 157149, "epoch": 935} {"train_loss": -11.249811172485352, "global_step": 157150, "epoch": 935} {"train_loss": -10.393092155456543, "global_step": 157151, "epoch": 935} {"train_loss": -10.882024765014648, "global_step": 157152, "epoch": 935} {"train_loss": -10.647189140319824, "global_step": 157153, "epoch": 935} {"train_loss": -10.895675659179688, "global_step": 157154, "epoch": 935} {"train_loss": -10.790033340454102, "global_step": 157155, "epoch": 935} {"train_loss": -10.731796264648438, "global_step": 157156, "epoch": 935} {"train_loss": -11.012896537780762, "global_step": 157157, "epoch": 935} {"train_loss": -10.723700523376465, "global_step": 157158, "epoch": 935} {"train_loss": -10.801860809326172, "global_step": 157159, "epoch": 935} {"train_loss": -10.992505073547363, "global_step": 157160, "epoch": 935} {"train_loss": -10.659015655517578, "global_step": 157161, "epoch": 935} {"train_loss": -10.987489700317383, "global_step": 157162, "epoch": 935} {"train_loss": -10.763967514038086, "global_step": 157163, "epoch": 935} {"train_loss": -10.822547912597656, "global_step": 157164, "epoch": 935} {"train_loss": -10.863110542297363, "global_step": 157165, "epoch": 935} {"train_loss": -10.525857925415039, "global_step": 157166, "epoch": 935} {"train_loss": -11.063804626464844, "global_step": 157167, "epoch": 935} {"train_loss": -10.337667465209961, "global_step": 157168, "epoch": 935} {"train_loss": -11.235599517822266, "global_step": 157169, "epoch": 935} {"train_loss": -10.864267349243164, "global_step": 157170, "epoch": 935} {"train_loss": -10.772245407104492, "global_step": 157171, "epoch": 935} {"train_loss": -11.045096397399902, "global_step": 157172, "epoch": 935} {"train_loss": -10.954680442810059, "global_step": 157173, "epoch": 935} {"train_loss": -11.179615020751953, "global_step": 157174, "epoch": 935} {"train_loss": -11.038522720336914, "global_step": 157175, "epoch": 935} {"train_loss": -11.002998352050781, "global_step": 157176, "epoch": 935} {"train_loss": -11.064126014709473, "global_step": 157177, "epoch": 935} {"train_loss": -10.829038619995117, "global_step": 157178, "epoch": 935} {"train_loss": -10.888139724731445, "global_step": 157179, "epoch": 935} {"train_loss": -11.021028518676758, "global_step": 157180, "epoch": 935} {"train_loss": -10.793296813964844, "global_step": 157181, "epoch": 935} {"train_loss": -11.086149215698242, "global_step": 157182, "epoch": 935} {"train_loss": -11.060218811035156, "global_step": 157183, "epoch": 935} {"train_loss": -11.206098556518555, "global_step": 157184, "epoch": 935} {"train_loss": -11.074414253234863, "global_step": 157185, "epoch": 935} {"train_loss": -11.216135025024414, "global_step": 157186, "epoch": 935} {"train_loss": -10.687121391296387, "global_step": 157187, "epoch": 935} {"train_loss": -10.69326114654541, "global_step": 157188, "epoch": 935} {"train_loss": -11.104549407958984, "global_step": 157189, "epoch": 935} {"train_loss": -10.75765609741211, "global_step": 157190, "epoch": 935} {"train_loss": -10.813163757324219, "global_step": 157191, "epoch": 935} {"train_loss": -11.003786087036133, "global_step": 157192, "epoch": 935} {"train_loss": -10.595442771911621, "global_step": 157193, "epoch": 935} {"train_loss": -10.451504707336426, "global_step": 157194, "epoch": 935} {"train_loss": -10.600266456604004, "global_step": 157195, "epoch": 935} {"train_loss": -9.88994312286377, "global_step": 157196, "epoch": 935} {"train_loss": -10.539674758911133, "global_step": 157197, "epoch": 935} {"train_loss": -10.270652770996094, "global_step": 157198, "epoch": 935} {"train_loss": -10.267026901245117, "global_step": 157199, "epoch": 935} {"train_loss": -10.411190032958984, "global_step": 157200, "epoch": 935} {"train_loss": -9.213933944702148, "global_step": 157201, "epoch": 935} {"train_loss": -10.472749710083008, "global_step": 157202, "epoch": 935} {"train_loss": -9.54820728302002, "global_step": 157203, "epoch": 935} {"train_loss": -9.563035011291504, "global_step": 157204, "epoch": 935} {"train_loss": -9.561986923217773, "global_step": 157205, "epoch": 935} {"train_loss": -9.809242248535156, "global_step": 157206, "epoch": 935} {"train_loss": -9.68539810180664, "global_step": 157207, "epoch": 935} {"train_loss": -10.027714729309082, "global_step": 157208, "epoch": 935} {"train_loss": -9.244494438171387, "global_step": 157209, "epoch": 935} {"train_loss": -10.06985855102539, "global_step": 157210, "epoch": 935} {"train_loss": -8.988892555236816, "global_step": 157211, "epoch": 935} {"train_loss": -10.121606826782227, "global_step": 157212, "epoch": 935} {"train_loss": -9.477920532226562, "global_step": 157213, "epoch": 935} {"train_loss": -10.00011920928955, "global_step": 157214, "epoch": 935} {"train_loss": -9.910776138305664, "global_step": 157215, "epoch": 935} {"train_loss": -10.114890098571777, "global_step": 157216, "epoch": 935} {"train_loss": -10.029000282287598, "global_step": 157217, "epoch": 935} {"train_loss": -10.19173812866211, "global_step": 157218, "epoch": 935} {"train_loss": -10.419456481933594, "global_step": 157219, "epoch": 935} {"train_loss": -10.373336791992188, "global_step": 157220, "epoch": 935} {"train_loss": -10.291238784790039, "global_step": 157221, "epoch": 935} {"train_loss": -10.52072525024414, "global_step": 157222, "epoch": 935} {"train_loss": -10.284965515136719, "global_step": 157223, "epoch": 935} {"train_loss": -10.524770736694336, "global_step": 157224, "epoch": 935} {"train_loss": -10.228632926940918, "global_step": 157225, "epoch": 935} {"train_loss": -10.530879020690918, "global_step": 157226, "epoch": 935} {"train_loss": -10.596853256225586, "global_step": 157227, "epoch": 935} {"train_loss": -10.516891479492188, "global_step": 157228, "epoch": 935} {"train_loss": -10.70862102508545, "global_step": 157229, "epoch": 935} {"train_loss": -10.605918884277344, "global_step": 157230, "epoch": 935} {"train_loss": -10.40789794921875, "global_step": 157231, "epoch": 935} {"train_loss": -10.605084419250488, "global_step": 157232, "epoch": 935} {"train_loss": -10.551519393920898, "global_step": 157233, "epoch": 935} {"train_loss": -10.80470085144043, "global_step": 157234, "epoch": 935} {"train_loss": -10.714329719543457, "global_step": 157235, "epoch": 935} {"train_loss": -10.655299186706543, "global_step": 157236, "epoch": 935} {"train_loss": -10.752107620239258, "global_step": 157237, "epoch": 935} {"train_loss": -10.897604942321777, "global_step": 157238, "epoch": 935} {"train_loss": -10.71023178100586, "global_step": 157239, "epoch": 935} {"train_loss": -10.857929229736328, "global_step": 157240, "epoch": 935} {"train_loss": -10.876897811889648, "global_step": 157241, "epoch": 935} {"train_loss": -10.980165481567383, "global_step": 157242, "epoch": 935} {"train_loss": -10.96241569519043, "global_step": 157243, "epoch": 935} {"train_loss": -10.677522659301758, "global_step": 157244, "epoch": 935} {"train_loss": -10.928903579711914, "global_step": 157245, "epoch": 935} {"train_loss": -10.997182846069336, "global_step": 157246, "epoch": 935} {"train_loss": -10.595681514058795, "global_step": 157247, "epoch": 935, "val_loss": 234383.890625, "train_action_mse_error": 1.8689148426055908} {"train_loss": -10.9215087890625, "global_step": 157248, "epoch": 936} {"train_loss": -10.651832580566406, "global_step": 157249, "epoch": 936} {"train_loss": -11.102287292480469, "global_step": 157250, "epoch": 936} {"train_loss": -10.930448532104492, "global_step": 157251, "epoch": 936} {"train_loss": -11.074359893798828, "global_step": 157252, "epoch": 936} {"train_loss": -11.056023597717285, "global_step": 157253, "epoch": 936} {"train_loss": -11.090304374694824, "global_step": 157254, "epoch": 936} {"train_loss": -11.020877838134766, "global_step": 157255, "epoch": 936} {"train_loss": -11.085436820983887, "global_step": 157256, "epoch": 936} {"train_loss": -10.837281227111816, "global_step": 157257, "epoch": 936} {"train_loss": -11.078788757324219, "global_step": 157258, "epoch": 936} {"train_loss": -10.814266204833984, "global_step": 157259, "epoch": 936} {"train_loss": -10.990327835083008, "global_step": 157260, "epoch": 936} {"train_loss": -11.157400131225586, "global_step": 157261, "epoch": 936} {"train_loss": -11.250929832458496, "global_step": 157262, "epoch": 936} {"train_loss": -11.282085418701172, "global_step": 157263, "epoch": 936} {"train_loss": -11.044734954833984, "global_step": 157264, "epoch": 936} {"train_loss": -11.178764343261719, "global_step": 157265, "epoch": 936} {"train_loss": -11.289623260498047, "global_step": 157266, "epoch": 936} {"train_loss": -11.136859893798828, "global_step": 157267, "epoch": 936} {"train_loss": -11.13824462890625, "global_step": 157268, "epoch": 936} {"train_loss": -11.144857406616211, "global_step": 157269, "epoch": 936} {"train_loss": -11.166887283325195, "global_step": 157270, "epoch": 936} {"train_loss": -11.233800888061523, "global_step": 157271, "epoch": 936} {"train_loss": -11.103962898254395, "global_step": 157272, "epoch": 936} {"train_loss": -10.970964431762695, "global_step": 157273, "epoch": 936} {"train_loss": -11.12651538848877, "global_step": 157274, "epoch": 936} {"train_loss": -10.968637466430664, "global_step": 157275, "epoch": 936} {"train_loss": -10.978763580322266, "global_step": 157276, "epoch": 936} {"train_loss": -11.108564376831055, "global_step": 157277, "epoch": 936} {"train_loss": -10.883150100708008, "global_step": 157278, "epoch": 936} {"train_loss": -10.997411727905273, "global_step": 157279, "epoch": 936} {"train_loss": -10.759566307067871, "global_step": 157280, "epoch": 936} {"train_loss": -10.673431396484375, "global_step": 157281, "epoch": 936} {"train_loss": -11.153331756591797, "global_step": 157282, "epoch": 936} {"train_loss": -10.963994026184082, "global_step": 157283, "epoch": 936} {"train_loss": -10.939038276672363, "global_step": 157284, "epoch": 936} {"train_loss": -10.946571350097656, "global_step": 157285, "epoch": 936} {"train_loss": -10.56155014038086, "global_step": 157286, "epoch": 936} {"train_loss": -11.149539947509766, "global_step": 157287, "epoch": 936} {"train_loss": -10.639842987060547, "global_step": 157288, "epoch": 936} {"train_loss": -9.925954818725586, "global_step": 157289, "epoch": 936} {"train_loss": -9.976285934448242, "global_step": 157290, "epoch": 936} {"train_loss": -10.46115779876709, "global_step": 157291, "epoch": 936} {"train_loss": -8.806112289428711, "global_step": 157292, "epoch": 936} {"train_loss": -9.834650039672852, "global_step": 157293, "epoch": 936} {"train_loss": -9.207687377929688, "global_step": 157294, "epoch": 936} {"train_loss": -10.332948684692383, "global_step": 157295, "epoch": 936} {"train_loss": -8.744365692138672, "global_step": 157296, "epoch": 936} {"train_loss": -10.163228988647461, "global_step": 157297, "epoch": 936} {"train_loss": -9.50838851928711, "global_step": 157298, "epoch": 936} {"train_loss": -10.22184944152832, "global_step": 157299, "epoch": 936} {"train_loss": -10.266145706176758, "global_step": 157300, "epoch": 936} {"train_loss": -10.01996898651123, "global_step": 157301, "epoch": 936} {"train_loss": -10.365326881408691, "global_step": 157302, "epoch": 936} {"train_loss": -10.453791618347168, "global_step": 157303, "epoch": 936} {"train_loss": -10.625677108764648, "global_step": 157304, "epoch": 936} {"train_loss": -10.39796257019043, "global_step": 157305, "epoch": 936} {"train_loss": -10.190999984741211, "global_step": 157306, "epoch": 936} {"train_loss": -10.262929916381836, "global_step": 157307, "epoch": 936} {"train_loss": -10.193151473999023, "global_step": 157308, "epoch": 936} {"train_loss": -10.59951400756836, "global_step": 157309, "epoch": 936} {"train_loss": -10.44182014465332, "global_step": 157310, "epoch": 936} {"train_loss": -10.51732349395752, "global_step": 157311, "epoch": 936} {"train_loss": -10.087905883789062, "global_step": 157312, "epoch": 936} {"train_loss": -10.560945510864258, "global_step": 157313, "epoch": 936} {"train_loss": -10.092386245727539, "global_step": 157314, "epoch": 936} {"train_loss": -10.082437515258789, "global_step": 157315, "epoch": 936} {"train_loss": -10.523246765136719, "global_step": 157316, "epoch": 936} {"train_loss": -9.856173515319824, "global_step": 157317, "epoch": 936} {"train_loss": -10.628586769104004, "global_step": 157318, "epoch": 936} {"train_loss": -9.936262130737305, "global_step": 157319, "epoch": 936} {"train_loss": -10.540332794189453, "global_step": 157320, "epoch": 936} {"train_loss": -10.4568452835083, "global_step": 157321, "epoch": 936} {"train_loss": -10.316730499267578, "global_step": 157322, "epoch": 936} {"train_loss": -10.587796211242676, "global_step": 157323, "epoch": 936} {"train_loss": -10.475146293640137, "global_step": 157324, "epoch": 936} {"train_loss": -10.171567916870117, "global_step": 157325, "epoch": 936} {"train_loss": -10.764730453491211, "global_step": 157326, "epoch": 936} {"train_loss": -10.29411792755127, "global_step": 157327, "epoch": 936} {"train_loss": -10.538833618164062, "global_step": 157328, "epoch": 936} {"train_loss": -10.51363468170166, "global_step": 157329, "epoch": 936} {"train_loss": -10.318208694458008, "global_step": 157330, "epoch": 936} {"train_loss": -10.708778381347656, "global_step": 157331, "epoch": 936} {"train_loss": -10.610427856445312, "global_step": 157332, "epoch": 936} {"train_loss": -10.41505241394043, "global_step": 157333, "epoch": 936} {"train_loss": -10.762027740478516, "global_step": 157334, "epoch": 936} {"train_loss": -10.55727767944336, "global_step": 157335, "epoch": 936} {"train_loss": -10.703873634338379, "global_step": 157336, "epoch": 936} {"train_loss": -10.78896713256836, "global_step": 157337, "epoch": 936} {"train_loss": -10.541881561279297, "global_step": 157338, "epoch": 936} {"train_loss": -10.810270309448242, "global_step": 157339, "epoch": 936} {"train_loss": -10.77347469329834, "global_step": 157340, "epoch": 936} {"train_loss": -10.7921724319458, "global_step": 157341, "epoch": 936} {"train_loss": -10.683573722839355, "global_step": 157342, "epoch": 936} {"train_loss": -10.779316902160645, "global_step": 157343, "epoch": 936} {"train_loss": -10.888062477111816, "global_step": 157344, "epoch": 936} {"train_loss": -11.04151725769043, "global_step": 157345, "epoch": 936} {"train_loss": -10.819318771362305, "global_step": 157346, "epoch": 936} {"train_loss": -10.838216781616211, "global_step": 157347, "epoch": 936} {"train_loss": -10.977479934692383, "global_step": 157348, "epoch": 936} {"train_loss": -10.522336959838867, "global_step": 157349, "epoch": 936} {"train_loss": -10.95695686340332, "global_step": 157350, "epoch": 936} {"train_loss": -10.776525497436523, "global_step": 157351, "epoch": 936} {"train_loss": -10.829547882080078, "global_step": 157352, "epoch": 936} {"train_loss": -10.940101623535156, "global_step": 157353, "epoch": 936} {"train_loss": -11.04084587097168, "global_step": 157354, "epoch": 936} {"train_loss": -10.491170883178711, "global_step": 157355, "epoch": 936} {"train_loss": -10.892256736755371, "global_step": 157356, "epoch": 936} {"train_loss": -10.766786575317383, "global_step": 157357, "epoch": 936} {"train_loss": -11.093311309814453, "global_step": 157358, "epoch": 936} {"train_loss": -10.71087646484375, "global_step": 157359, "epoch": 936} {"train_loss": -10.861062049865723, "global_step": 157360, "epoch": 936} {"train_loss": -11.155258178710938, "global_step": 157361, "epoch": 936} {"train_loss": -11.14178466796875, "global_step": 157362, "epoch": 936} {"train_loss": -11.005694389343262, "global_step": 157363, "epoch": 936} {"train_loss": -11.171061515808105, "global_step": 157364, "epoch": 936} {"train_loss": -11.132505416870117, "global_step": 157365, "epoch": 936} {"train_loss": -11.202003479003906, "global_step": 157366, "epoch": 936} {"train_loss": -11.094314575195312, "global_step": 157367, "epoch": 936} {"train_loss": -11.225414276123047, "global_step": 157368, "epoch": 936} {"train_loss": -11.062137603759766, "global_step": 157369, "epoch": 936} {"train_loss": -11.191583633422852, "global_step": 157370, "epoch": 936} {"train_loss": -11.13734245300293, "global_step": 157371, "epoch": 936} {"train_loss": -11.251614570617676, "global_step": 157372, "epoch": 936} {"train_loss": -11.155773162841797, "global_step": 157373, "epoch": 936} {"train_loss": -11.19504165649414, "global_step": 157374, "epoch": 936} {"train_loss": -11.216964721679688, "global_step": 157375, "epoch": 936} {"train_loss": -11.207823753356934, "global_step": 157376, "epoch": 936} {"train_loss": -11.034954071044922, "global_step": 157377, "epoch": 936} {"train_loss": -11.170215606689453, "global_step": 157378, "epoch": 936} {"train_loss": -11.20790958404541, "global_step": 157379, "epoch": 936} {"train_loss": -11.102594375610352, "global_step": 157380, "epoch": 936} {"train_loss": -10.98295783996582, "global_step": 157381, "epoch": 936} {"train_loss": -11.16506290435791, "global_step": 157382, "epoch": 936} {"train_loss": -11.19719123840332, "global_step": 157383, "epoch": 936} {"train_loss": -11.330483436584473, "global_step": 157384, "epoch": 936} {"train_loss": -11.256498336791992, "global_step": 157385, "epoch": 936} {"train_loss": -11.30891227722168, "global_step": 157386, "epoch": 936} {"train_loss": -11.024977684020996, "global_step": 157387, "epoch": 936} {"train_loss": -11.193473815917969, "global_step": 157388, "epoch": 936} {"train_loss": -11.063881874084473, "global_step": 157389, "epoch": 936} {"train_loss": -11.024385452270508, "global_step": 157390, "epoch": 936} {"train_loss": -11.146862030029297, "global_step": 157391, "epoch": 936} {"train_loss": -10.865853309631348, "global_step": 157392, "epoch": 936} {"train_loss": -11.149362564086914, "global_step": 157393, "epoch": 936} {"train_loss": -10.920953750610352, "global_step": 157394, "epoch": 936} {"train_loss": -11.007638931274414, "global_step": 157395, "epoch": 936} {"train_loss": -10.288869857788086, "global_step": 157396, "epoch": 936} {"train_loss": -9.9642333984375, "global_step": 157397, "epoch": 936} {"train_loss": -10.354514122009277, "global_step": 157398, "epoch": 936} {"train_loss": -10.840887069702148, "global_step": 157399, "epoch": 936} {"train_loss": -9.611607551574707, "global_step": 157400, "epoch": 936} {"train_loss": -9.375829696655273, "global_step": 157401, "epoch": 936} {"train_loss": -10.8851900100708, "global_step": 157402, "epoch": 936} {"train_loss": -9.046401977539062, "global_step": 157403, "epoch": 936} {"train_loss": -10.028165817260742, "global_step": 157404, "epoch": 936} {"train_loss": -10.00532341003418, "global_step": 157405, "epoch": 936} {"train_loss": -10.208536148071289, "global_step": 157406, "epoch": 936} {"train_loss": -10.037050247192383, "global_step": 157407, "epoch": 936} {"train_loss": -9.301902770996094, "global_step": 157408, "epoch": 936} {"train_loss": -10.37327766418457, "global_step": 157409, "epoch": 936} {"train_loss": -9.867393493652344, "global_step": 157410, "epoch": 936} {"train_loss": -10.18832015991211, "global_step": 157411, "epoch": 936} {"train_loss": -9.812315940856934, "global_step": 157412, "epoch": 936} {"train_loss": -10.169495582580566, "global_step": 157413, "epoch": 936} {"train_loss": -9.868867874145508, "global_step": 157414, "epoch": 936} {"train_loss": -10.670521781558083, "global_step": 157415, "epoch": 936, "val_loss": 233262.78125} {"train_loss": -10.178108215332031, "global_step": 157416, "epoch": 937} {"train_loss": -9.974742889404297, "global_step": 157417, "epoch": 937} {"train_loss": -9.981188774108887, "global_step": 157418, "epoch": 937} {"train_loss": -10.126246452331543, "global_step": 157419, "epoch": 937} {"train_loss": -10.288481712341309, "global_step": 157420, "epoch": 937} {"train_loss": -10.306604385375977, "global_step": 157421, "epoch": 937} {"train_loss": -9.972341537475586, "global_step": 157422, "epoch": 937} {"train_loss": -10.101217269897461, "global_step": 157423, "epoch": 937} {"train_loss": -9.802265167236328, "global_step": 157424, "epoch": 937} {"train_loss": -10.600775718688965, "global_step": 157425, "epoch": 937} {"train_loss": -10.378114700317383, "global_step": 157426, "epoch": 937} {"train_loss": -10.301273345947266, "global_step": 157427, "epoch": 937} {"train_loss": -10.499059677124023, "global_step": 157428, "epoch": 937} {"train_loss": -10.212688446044922, "global_step": 157429, "epoch": 937} {"train_loss": -10.571709632873535, "global_step": 157430, "epoch": 937} {"train_loss": -10.494169235229492, "global_step": 157431, "epoch": 937} {"train_loss": -10.426248550415039, "global_step": 157432, "epoch": 937} {"train_loss": -10.671753883361816, "global_step": 157433, "epoch": 937} {"train_loss": -10.542686462402344, "global_step": 157434, "epoch": 937} {"train_loss": -10.648124694824219, "global_step": 157435, "epoch": 937} {"train_loss": -10.446130752563477, "global_step": 157436, "epoch": 937} {"train_loss": -10.447961807250977, "global_step": 157437, "epoch": 937} {"train_loss": -10.666597366333008, "global_step": 157438, "epoch": 937} {"train_loss": -10.67624568939209, "global_step": 157439, "epoch": 937} {"train_loss": -10.714999198913574, "global_step": 157440, "epoch": 937} {"train_loss": -10.350643157958984, "global_step": 157441, "epoch": 937} {"train_loss": -10.444375991821289, "global_step": 157442, "epoch": 937} {"train_loss": -10.796478271484375, "global_step": 157443, "epoch": 937} {"train_loss": -10.716415405273438, "global_step": 157444, "epoch": 937} {"train_loss": -10.767040252685547, "global_step": 157445, "epoch": 937} {"train_loss": -10.823967933654785, "global_step": 157446, "epoch": 937} {"train_loss": -10.845826148986816, "global_step": 157447, "epoch": 937} {"train_loss": -10.705329895019531, "global_step": 157448, "epoch": 937} {"train_loss": -10.629569053649902, "global_step": 157449, "epoch": 937} {"train_loss": -10.982813835144043, "global_step": 157450, "epoch": 937} {"train_loss": -10.83901596069336, "global_step": 157451, "epoch": 937} {"train_loss": -10.802730560302734, "global_step": 157452, "epoch": 937} {"train_loss": -11.014144897460938, "global_step": 157453, "epoch": 937} {"train_loss": -10.811088562011719, "global_step": 157454, "epoch": 937} {"train_loss": -11.055733680725098, "global_step": 157455, "epoch": 937} {"train_loss": -11.095787048339844, "global_step": 157456, "epoch": 937} {"train_loss": -11.073972702026367, "global_step": 157457, "epoch": 937} {"train_loss": -11.044309616088867, "global_step": 157458, "epoch": 937} {"train_loss": -10.959053039550781, "global_step": 157459, "epoch": 937} {"train_loss": -11.046341896057129, "global_step": 157460, "epoch": 937} {"train_loss": -10.948047637939453, "global_step": 157461, "epoch": 937} {"train_loss": -11.061579704284668, "global_step": 157462, "epoch": 937} {"train_loss": -10.881470680236816, "global_step": 157463, "epoch": 937} {"train_loss": -11.028581619262695, "global_step": 157464, "epoch": 937} {"train_loss": -11.094789505004883, "global_step": 157465, "epoch": 937} {"train_loss": -11.082621574401855, "global_step": 157466, "epoch": 937} {"train_loss": -10.95823860168457, "global_step": 157467, "epoch": 937} {"train_loss": -11.102291107177734, "global_step": 157468, "epoch": 937} {"train_loss": -10.851231575012207, "global_step": 157469, "epoch": 937} {"train_loss": -10.740724563598633, "global_step": 157470, "epoch": 937} {"train_loss": -11.20840835571289, "global_step": 157471, "epoch": 937} {"train_loss": -10.684296607971191, "global_step": 157472, "epoch": 937} {"train_loss": -10.895853042602539, "global_step": 157473, "epoch": 937} {"train_loss": -11.094990730285645, "global_step": 157474, "epoch": 937} {"train_loss": -10.38726806640625, "global_step": 157475, "epoch": 937} {"train_loss": -10.720077514648438, "global_step": 157476, "epoch": 937} {"train_loss": -10.494056701660156, "global_step": 157477, "epoch": 937} {"train_loss": -10.268798828125, "global_step": 157478, "epoch": 937} {"train_loss": -10.864059448242188, "global_step": 157479, "epoch": 937} {"train_loss": -10.541635513305664, "global_step": 157480, "epoch": 937} {"train_loss": -10.371208190917969, "global_step": 157481, "epoch": 937} {"train_loss": -10.934457778930664, "global_step": 157482, "epoch": 937} {"train_loss": -10.445671081542969, "global_step": 157483, "epoch": 937} {"train_loss": -10.610879898071289, "global_step": 157484, "epoch": 937} {"train_loss": -10.513737678527832, "global_step": 157485, "epoch": 937} {"train_loss": -10.556907653808594, "global_step": 157486, "epoch": 937} {"train_loss": -9.910665512084961, "global_step": 157487, "epoch": 937} {"train_loss": -10.87387466430664, "global_step": 157488, "epoch": 937} {"train_loss": -10.478772163391113, "global_step": 157489, "epoch": 937} {"train_loss": -10.66729736328125, "global_step": 157490, "epoch": 937} {"train_loss": -10.241841316223145, "global_step": 157491, "epoch": 937} {"train_loss": -10.561363220214844, "global_step": 157492, "epoch": 937} {"train_loss": -10.671499252319336, "global_step": 157493, "epoch": 937} {"train_loss": -10.488049507141113, "global_step": 157494, "epoch": 937} {"train_loss": -10.644193649291992, "global_step": 157495, "epoch": 937} {"train_loss": -9.526430130004883, "global_step": 157496, "epoch": 937} {"train_loss": -10.741700172424316, "global_step": 157497, "epoch": 937} {"train_loss": -10.065988540649414, "global_step": 157498, "epoch": 937} {"train_loss": -10.78428840637207, "global_step": 157499, "epoch": 937} {"train_loss": -10.324712753295898, "global_step": 157500, "epoch": 937} {"train_loss": -9.853055953979492, "global_step": 157501, "epoch": 937} {"train_loss": -11.00636100769043, "global_step": 157502, "epoch": 937} {"train_loss": -10.112893104553223, "global_step": 157503, "epoch": 937} {"train_loss": -10.69192886352539, "global_step": 157504, "epoch": 937} {"train_loss": -10.813346862792969, "global_step": 157505, "epoch": 937} {"train_loss": -10.193076133728027, "global_step": 157506, "epoch": 937} {"train_loss": -10.751241683959961, "global_step": 157507, "epoch": 937} {"train_loss": -10.631576538085938, "global_step": 157508, "epoch": 937} {"train_loss": -10.765840530395508, "global_step": 157509, "epoch": 937} {"train_loss": -10.980064392089844, "global_step": 157510, "epoch": 937} {"train_loss": -10.515707015991211, "global_step": 157511, "epoch": 937} {"train_loss": -10.419337272644043, "global_step": 157512, "epoch": 937} {"train_loss": -10.624811172485352, "global_step": 157513, "epoch": 937} {"train_loss": -10.448296546936035, "global_step": 157514, "epoch": 937} {"train_loss": -10.615402221679688, "global_step": 157515, "epoch": 937} {"train_loss": -10.61162281036377, "global_step": 157516, "epoch": 937} {"train_loss": -10.45810317993164, "global_step": 157517, "epoch": 937} {"train_loss": -10.636877059936523, "global_step": 157518, "epoch": 937} {"train_loss": -10.64004135131836, "global_step": 157519, "epoch": 937} {"train_loss": -10.553498268127441, "global_step": 157520, "epoch": 937} {"train_loss": -10.793798446655273, "global_step": 157521, "epoch": 937} {"train_loss": -10.865734100341797, "global_step": 157522, "epoch": 937} {"train_loss": -10.711868286132812, "global_step": 157523, "epoch": 937} {"train_loss": -10.792770385742188, "global_step": 157524, "epoch": 937} {"train_loss": -10.583549499511719, "global_step": 157525, "epoch": 937} {"train_loss": -10.908905029296875, "global_step": 157526, "epoch": 937} {"train_loss": -10.631206512451172, "global_step": 157527, "epoch": 937} {"train_loss": -11.001480102539062, "global_step": 157528, "epoch": 937} {"train_loss": -11.032784461975098, "global_step": 157529, "epoch": 937} {"train_loss": -11.163994789123535, "global_step": 157530, "epoch": 937} {"train_loss": -10.9085111618042, "global_step": 157531, "epoch": 937} {"train_loss": -10.93118667602539, "global_step": 157532, "epoch": 937} {"train_loss": -10.955560684204102, "global_step": 157533, "epoch": 937} {"train_loss": -11.055776596069336, "global_step": 157534, "epoch": 937} {"train_loss": -11.083599090576172, "global_step": 157535, "epoch": 937} {"train_loss": -11.083515167236328, "global_step": 157536, "epoch": 937} {"train_loss": -11.08077621459961, "global_step": 157537, "epoch": 937} {"train_loss": -11.027113914489746, "global_step": 157538, "epoch": 937} {"train_loss": -11.081710815429688, "global_step": 157539, "epoch": 937} {"train_loss": -11.274781227111816, "global_step": 157540, "epoch": 937} {"train_loss": -11.162567138671875, "global_step": 157541, "epoch": 937} {"train_loss": -11.137849807739258, "global_step": 157542, "epoch": 937} {"train_loss": -10.814123153686523, "global_step": 157543, "epoch": 937} {"train_loss": -11.20602035522461, "global_step": 157544, "epoch": 937} {"train_loss": -11.104066848754883, "global_step": 157545, "epoch": 937} {"train_loss": -10.951836585998535, "global_step": 157546, "epoch": 937} {"train_loss": -10.94218635559082, "global_step": 157547, "epoch": 937} {"train_loss": -10.633132934570312, "global_step": 157548, "epoch": 937} {"train_loss": -11.050087928771973, "global_step": 157549, "epoch": 937} {"train_loss": -10.719066619873047, "global_step": 157550, "epoch": 937} {"train_loss": -10.987194061279297, "global_step": 157551, "epoch": 937} {"train_loss": -11.017457008361816, "global_step": 157552, "epoch": 937} {"train_loss": -11.14384937286377, "global_step": 157553, "epoch": 937} {"train_loss": -11.11530876159668, "global_step": 157554, "epoch": 937} {"train_loss": -11.351746559143066, "global_step": 157555, "epoch": 937} {"train_loss": -11.246206283569336, "global_step": 157556, "epoch": 937} {"train_loss": -11.144245147705078, "global_step": 157557, "epoch": 937} {"train_loss": -11.105690956115723, "global_step": 157558, "epoch": 937} {"train_loss": -11.279762268066406, "global_step": 157559, "epoch": 937} {"train_loss": -11.191679000854492, "global_step": 157560, "epoch": 937} {"train_loss": -11.1771240234375, "global_step": 157561, "epoch": 937} {"train_loss": -11.278738021850586, "global_step": 157562, "epoch": 937} {"train_loss": -11.027769088745117, "global_step": 157563, "epoch": 937} {"train_loss": -11.024134635925293, "global_step": 157564, "epoch": 937} {"train_loss": -11.310562133789062, "global_step": 157565, "epoch": 937} {"train_loss": -11.273309707641602, "global_step": 157566, "epoch": 937} {"train_loss": -11.241202354431152, "global_step": 157567, "epoch": 937} {"train_loss": -11.222661972045898, "global_step": 157568, "epoch": 937} {"train_loss": -11.450824737548828, "global_step": 157569, "epoch": 937} {"train_loss": -11.330266952514648, "global_step": 157570, "epoch": 937} {"train_loss": -11.149249076843262, "global_step": 157571, "epoch": 937} {"train_loss": -11.181817054748535, "global_step": 157572, "epoch": 937} {"train_loss": -11.499649047851562, "global_step": 157573, "epoch": 937} {"train_loss": -11.08005142211914, "global_step": 157574, "epoch": 937} {"train_loss": -10.938070297241211, "global_step": 157575, "epoch": 937} {"train_loss": -11.217397689819336, "global_step": 157576, "epoch": 937} {"train_loss": -11.291398048400879, "global_step": 157577, "epoch": 937} {"train_loss": -11.188557624816895, "global_step": 157578, "epoch": 937} {"train_loss": -11.237648963928223, "global_step": 157579, "epoch": 937} {"train_loss": -10.985321044921875, "global_step": 157580, "epoch": 937} {"train_loss": -10.565166473388672, "global_step": 157581, "epoch": 937} {"train_loss": -11.2132568359375, "global_step": 157582, "epoch": 937} {"train_loss": -10.769662096386863, "global_step": 157583, "epoch": 937, "val_loss": 233792.203125} {"train_loss": -9.665143966674805, "global_step": 157584, "epoch": 938} {"train_loss": -9.412653923034668, "global_step": 157585, "epoch": 938} {"train_loss": -9.626996994018555, "global_step": 157586, "epoch": 938} {"train_loss": -9.36662483215332, "global_step": 157587, "epoch": 938} {"train_loss": -8.455793380737305, "global_step": 157588, "epoch": 938} {"train_loss": -8.439502716064453, "global_step": 157589, "epoch": 938} {"train_loss": -9.501214981079102, "global_step": 157590, "epoch": 938} {"train_loss": -9.177450180053711, "global_step": 157591, "epoch": 938} {"train_loss": -9.481294631958008, "global_step": 157592, "epoch": 938} {"train_loss": -9.233978271484375, "global_step": 157593, "epoch": 938} {"train_loss": -9.580965042114258, "global_step": 157594, "epoch": 938} {"train_loss": -8.152450561523438, "global_step": 157595, "epoch": 938} {"train_loss": -9.12560749053955, "global_step": 157596, "epoch": 938} {"train_loss": -8.264307975769043, "global_step": 157597, "epoch": 938} {"train_loss": -9.97217082977295, "global_step": 157598, "epoch": 938} {"train_loss": -8.561684608459473, "global_step": 157599, "epoch": 938} {"train_loss": -9.81889533996582, "global_step": 157600, "epoch": 938} {"train_loss": -9.649612426757812, "global_step": 157601, "epoch": 938} {"train_loss": -9.726415634155273, "global_step": 157602, "epoch": 938} {"train_loss": -9.73671817779541, "global_step": 157603, "epoch": 938} {"train_loss": -9.953670501708984, "global_step": 157604, "epoch": 938} {"train_loss": -9.909011840820312, "global_step": 157605, "epoch": 938} {"train_loss": -9.866534233093262, "global_step": 157606, "epoch": 938} {"train_loss": -9.295289993286133, "global_step": 157607, "epoch": 938} {"train_loss": -10.022624015808105, "global_step": 157608, "epoch": 938} {"train_loss": -9.385712623596191, "global_step": 157609, "epoch": 938} {"train_loss": -9.53675651550293, "global_step": 157610, "epoch": 938} {"train_loss": -10.24432373046875, "global_step": 157611, "epoch": 938} {"train_loss": -9.689176559448242, "global_step": 157612, "epoch": 938} {"train_loss": -10.063989639282227, "global_step": 157613, "epoch": 938} {"train_loss": -10.145431518554688, "global_step": 157614, "epoch": 938} {"train_loss": -9.816949844360352, "global_step": 157615, "epoch": 938} {"train_loss": -9.918943405151367, "global_step": 157616, "epoch": 938} {"train_loss": -10.321813583374023, "global_step": 157617, "epoch": 938} {"train_loss": -10.078144073486328, "global_step": 157618, "epoch": 938} {"train_loss": -10.033330917358398, "global_step": 157619, "epoch": 938} {"train_loss": -10.355989456176758, "global_step": 157620, "epoch": 938} {"train_loss": -9.890586853027344, "global_step": 157621, "epoch": 938} {"train_loss": -10.238637924194336, "global_step": 157622, "epoch": 938} {"train_loss": -10.107049942016602, "global_step": 157623, "epoch": 938} {"train_loss": -10.198308944702148, "global_step": 157624, "epoch": 938} {"train_loss": -10.387916564941406, "global_step": 157625, "epoch": 938} {"train_loss": -10.207954406738281, "global_step": 157626, "epoch": 938} {"train_loss": -10.425934791564941, "global_step": 157627, "epoch": 938} {"train_loss": -10.642793655395508, "global_step": 157628, "epoch": 938} {"train_loss": -10.421924591064453, "global_step": 157629, "epoch": 938} {"train_loss": -10.44766902923584, "global_step": 157630, "epoch": 938} {"train_loss": -10.42862606048584, "global_step": 157631, "epoch": 938} {"train_loss": -10.452613830566406, "global_step": 157632, "epoch": 938} {"train_loss": -10.353280067443848, "global_step": 157633, "epoch": 938} {"train_loss": -10.513729095458984, "global_step": 157634, "epoch": 938} {"train_loss": -10.600433349609375, "global_step": 157635, "epoch": 938} {"train_loss": -10.540935516357422, "global_step": 157636, "epoch": 938} {"train_loss": -10.573530197143555, "global_step": 157637, "epoch": 938} {"train_loss": -10.548075675964355, "global_step": 157638, "epoch": 938} {"train_loss": -10.795976638793945, "global_step": 157639, "epoch": 938} {"train_loss": -10.615217208862305, "global_step": 157640, "epoch": 938} {"train_loss": -10.756373405456543, "global_step": 157641, "epoch": 938} {"train_loss": -10.692081451416016, "global_step": 157642, "epoch": 938} {"train_loss": -10.715686798095703, "global_step": 157643, "epoch": 938} {"train_loss": -10.868621826171875, "global_step": 157644, "epoch": 938} {"train_loss": -10.759899139404297, "global_step": 157645, "epoch": 938} {"train_loss": -10.879030227661133, "global_step": 157646, "epoch": 938} {"train_loss": -10.97449779510498, "global_step": 157647, "epoch": 938} {"train_loss": -10.752007484436035, "global_step": 157648, "epoch": 938} {"train_loss": -10.894475936889648, "global_step": 157649, "epoch": 938} {"train_loss": -10.965168952941895, "global_step": 157650, "epoch": 938} {"train_loss": -10.813844680786133, "global_step": 157651, "epoch": 938} {"train_loss": -10.731988906860352, "global_step": 157652, "epoch": 938} {"train_loss": -10.956138610839844, "global_step": 157653, "epoch": 938} {"train_loss": -11.038545608520508, "global_step": 157654, "epoch": 938} {"train_loss": -10.894737243652344, "global_step": 157655, "epoch": 938} {"train_loss": -11.061805725097656, "global_step": 157656, "epoch": 938} {"train_loss": -10.829131126403809, "global_step": 157657, "epoch": 938} {"train_loss": -10.894697189331055, "global_step": 157658, "epoch": 938} {"train_loss": -10.729728698730469, "global_step": 157659, "epoch": 938} {"train_loss": -11.186593055725098, "global_step": 157660, "epoch": 938} {"train_loss": -11.146407127380371, "global_step": 157661, "epoch": 938} {"train_loss": -10.864995002746582, "global_step": 157662, "epoch": 938} {"train_loss": -10.684150695800781, "global_step": 157663, "epoch": 938} {"train_loss": -10.792343139648438, "global_step": 157664, "epoch": 938} {"train_loss": -10.796123504638672, "global_step": 157665, "epoch": 938} {"train_loss": -10.376335144042969, "global_step": 157666, "epoch": 938} {"train_loss": -10.986396789550781, "global_step": 157667, "epoch": 938} {"train_loss": -10.779220581054688, "global_step": 157668, "epoch": 938} {"train_loss": -10.886590957641602, "global_step": 157669, "epoch": 938} {"train_loss": -10.95779037475586, "global_step": 157670, "epoch": 938} {"train_loss": -10.655498504638672, "global_step": 157671, "epoch": 938} {"train_loss": -11.01224136352539, "global_step": 157672, "epoch": 938} {"train_loss": -11.003313064575195, "global_step": 157673, "epoch": 938} {"train_loss": -11.11948299407959, "global_step": 157674, "epoch": 938} {"train_loss": -11.17922592163086, "global_step": 157675, "epoch": 938} {"train_loss": -10.995247840881348, "global_step": 157676, "epoch": 938} {"train_loss": -10.955242156982422, "global_step": 157677, "epoch": 938} {"train_loss": -10.974522590637207, "global_step": 157678, "epoch": 938} {"train_loss": -10.911371231079102, "global_step": 157679, "epoch": 938} {"train_loss": -11.000767707824707, "global_step": 157680, "epoch": 938} {"train_loss": -11.317727088928223, "global_step": 157681, "epoch": 938} {"train_loss": -11.064155578613281, "global_step": 157682, "epoch": 938} {"train_loss": -11.118488311767578, "global_step": 157683, "epoch": 938} {"train_loss": -11.061742782592773, "global_step": 157684, "epoch": 938} {"train_loss": -11.133909225463867, "global_step": 157685, "epoch": 938} {"train_loss": -10.930294036865234, "global_step": 157686, "epoch": 938} {"train_loss": -11.157404899597168, "global_step": 157687, "epoch": 938} {"train_loss": -11.263778686523438, "global_step": 157688, "epoch": 938} {"train_loss": -10.97951889038086, "global_step": 157689, "epoch": 938} {"train_loss": -11.224720001220703, "global_step": 157690, "epoch": 938} {"train_loss": -11.205965042114258, "global_step": 157691, "epoch": 938} {"train_loss": -11.192319869995117, "global_step": 157692, "epoch": 938} {"train_loss": -11.010644912719727, "global_step": 157693, "epoch": 938} {"train_loss": -10.960752487182617, "global_step": 157694, "epoch": 938} {"train_loss": -10.992185592651367, "global_step": 157695, "epoch": 938} {"train_loss": -11.337831497192383, "global_step": 157696, "epoch": 938} {"train_loss": -10.96666145324707, "global_step": 157697, "epoch": 938} {"train_loss": -10.85378646850586, "global_step": 157698, "epoch": 938} {"train_loss": -10.834611892700195, "global_step": 157699, "epoch": 938} {"train_loss": -9.916027069091797, "global_step": 157700, "epoch": 938} {"train_loss": -10.308691024780273, "global_step": 157701, "epoch": 938} {"train_loss": -11.239120483398438, "global_step": 157702, "epoch": 938} {"train_loss": -10.75672435760498, "global_step": 157703, "epoch": 938} {"train_loss": -10.785743713378906, "global_step": 157704, "epoch": 938} {"train_loss": -11.187590599060059, "global_step": 157705, "epoch": 938} {"train_loss": -10.54034423828125, "global_step": 157706, "epoch": 938} {"train_loss": -10.67392349243164, "global_step": 157707, "epoch": 938} {"train_loss": -10.940472602844238, "global_step": 157708, "epoch": 938} {"train_loss": -10.475737571716309, "global_step": 157709, "epoch": 938} {"train_loss": -10.663963317871094, "global_step": 157710, "epoch": 938} {"train_loss": -11.15123176574707, "global_step": 157711, "epoch": 938} {"train_loss": -10.40495491027832, "global_step": 157712, "epoch": 938} {"train_loss": -11.035061836242676, "global_step": 157713, "epoch": 938} {"train_loss": -10.83647346496582, "global_step": 157714, "epoch": 938} {"train_loss": -10.967294692993164, "global_step": 157715, "epoch": 938} {"train_loss": -11.05435562133789, "global_step": 157716, "epoch": 938} {"train_loss": -10.685023307800293, "global_step": 157717, "epoch": 938} {"train_loss": -10.793628692626953, "global_step": 157718, "epoch": 938} {"train_loss": -10.620223045349121, "global_step": 157719, "epoch": 938} {"train_loss": -10.829366683959961, "global_step": 157720, "epoch": 938} {"train_loss": -11.070932388305664, "global_step": 157721, "epoch": 938} {"train_loss": -10.806673049926758, "global_step": 157722, "epoch": 938} {"train_loss": -10.911595344543457, "global_step": 157723, "epoch": 938} {"train_loss": -10.909219741821289, "global_step": 157724, "epoch": 938} {"train_loss": -11.033845901489258, "global_step": 157725, "epoch": 938} {"train_loss": -11.067795753479004, "global_step": 157726, "epoch": 938} {"train_loss": -10.790407180786133, "global_step": 157727, "epoch": 938} {"train_loss": -10.784276008605957, "global_step": 157728, "epoch": 938} {"train_loss": -11.20229721069336, "global_step": 157729, "epoch": 938} {"train_loss": -11.027277946472168, "global_step": 157730, "epoch": 938} {"train_loss": -10.952173233032227, "global_step": 157731, "epoch": 938} {"train_loss": -10.754152297973633, "global_step": 157732, "epoch": 938} {"train_loss": -10.25343132019043, "global_step": 157733, "epoch": 938} {"train_loss": -10.305234909057617, "global_step": 157734, "epoch": 938} {"train_loss": -10.958657264709473, "global_step": 157735, "epoch": 938} {"train_loss": -10.690958976745605, "global_step": 157736, "epoch": 938} {"train_loss": -10.204179763793945, "global_step": 157737, "epoch": 938} {"train_loss": -10.90604305267334, "global_step": 157738, "epoch": 938} {"train_loss": -10.928627967834473, "global_step": 157739, "epoch": 938} {"train_loss": -10.703853607177734, "global_step": 157740, "epoch": 938} {"train_loss": -10.388197898864746, "global_step": 157741, "epoch": 938} {"train_loss": -10.289135932922363, "global_step": 157742, "epoch": 938} {"train_loss": -10.198431968688965, "global_step": 157743, "epoch": 938} {"train_loss": -8.915653228759766, "global_step": 157744, "epoch": 938} {"train_loss": -10.232709884643555, "global_step": 157745, "epoch": 938} {"train_loss": -9.167261123657227, "global_step": 157746, "epoch": 938} {"train_loss": -9.656020164489746, "global_step": 157747, "epoch": 938} {"train_loss": -10.3765230178833, "global_step": 157748, "epoch": 938} {"train_loss": -9.716939926147461, "global_step": 157749, "epoch": 938} {"train_loss": -9.577767372131348, "global_step": 157750, "epoch": 938} {"train_loss": -10.46833248365493, "global_step": 157751, "epoch": 938, "val_loss": 231443.296875} {"train_loss": -10.32302474975586, "global_step": 157752, "epoch": 939} {"train_loss": -9.938898086547852, "global_step": 157753, "epoch": 939} {"train_loss": -10.525724411010742, "global_step": 157754, "epoch": 939} {"train_loss": -9.468927383422852, "global_step": 157755, "epoch": 939} {"train_loss": -10.320821762084961, "global_step": 157756, "epoch": 939} {"train_loss": -10.294561386108398, "global_step": 157757, "epoch": 939} {"train_loss": -10.0894775390625, "global_step": 157758, "epoch": 939} {"train_loss": -10.133405685424805, "global_step": 157759, "epoch": 939} {"train_loss": -10.488594055175781, "global_step": 157760, "epoch": 939} {"train_loss": -10.064812660217285, "global_step": 157761, "epoch": 939} {"train_loss": -10.414945602416992, "global_step": 157762, "epoch": 939} {"train_loss": -10.564598083496094, "global_step": 157763, "epoch": 939} {"train_loss": -10.407691955566406, "global_step": 157764, "epoch": 939} {"train_loss": -10.372208595275879, "global_step": 157765, "epoch": 939} {"train_loss": -10.735864639282227, "global_step": 157766, "epoch": 939} {"train_loss": -10.700002670288086, "global_step": 157767, "epoch": 939} {"train_loss": -10.503629684448242, "global_step": 157768, "epoch": 939} {"train_loss": -10.479710578918457, "global_step": 157769, "epoch": 939} {"train_loss": -10.735898971557617, "global_step": 157770, "epoch": 939} {"train_loss": -10.266019821166992, "global_step": 157771, "epoch": 939} {"train_loss": -10.607622146606445, "global_step": 157772, "epoch": 939} {"train_loss": -10.826435089111328, "global_step": 157773, "epoch": 939} {"train_loss": -10.194832801818848, "global_step": 157774, "epoch": 939} {"train_loss": -10.567605972290039, "global_step": 157775, "epoch": 939} {"train_loss": -10.442741394042969, "global_step": 157776, "epoch": 939} {"train_loss": -10.625879287719727, "global_step": 157777, "epoch": 939} {"train_loss": -10.601476669311523, "global_step": 157778, "epoch": 939} {"train_loss": -10.743762016296387, "global_step": 157779, "epoch": 939} {"train_loss": -10.688846588134766, "global_step": 157780, "epoch": 939} {"train_loss": -10.79572868347168, "global_step": 157781, "epoch": 939} {"train_loss": -10.678322792053223, "global_step": 157782, "epoch": 939} {"train_loss": -10.705974578857422, "global_step": 157783, "epoch": 939} {"train_loss": -10.766595840454102, "global_step": 157784, "epoch": 939} {"train_loss": -10.848272323608398, "global_step": 157785, "epoch": 939} {"train_loss": -10.853910446166992, "global_step": 157786, "epoch": 939} {"train_loss": -10.923860549926758, "global_step": 157787, "epoch": 939} {"train_loss": -10.691868782043457, "global_step": 157788, "epoch": 939} {"train_loss": -10.665818214416504, "global_step": 157789, "epoch": 939} {"train_loss": -10.93882942199707, "global_step": 157790, "epoch": 939} {"train_loss": -10.743762016296387, "global_step": 157791, "epoch": 939} {"train_loss": -11.013099670410156, "global_step": 157792, "epoch": 939} {"train_loss": -10.905868530273438, "global_step": 157793, "epoch": 939} {"train_loss": -10.928333282470703, "global_step": 157794, "epoch": 939} {"train_loss": -11.067353248596191, "global_step": 157795, "epoch": 939} {"train_loss": -11.066680908203125, "global_step": 157796, "epoch": 939} {"train_loss": -10.943216323852539, "global_step": 157797, "epoch": 939} {"train_loss": -10.905230522155762, "global_step": 157798, "epoch": 939} {"train_loss": -11.13005256652832, "global_step": 157799, "epoch": 939} {"train_loss": -11.031393051147461, "global_step": 157800, "epoch": 939} {"train_loss": -11.126853942871094, "global_step": 157801, "epoch": 939} {"train_loss": -10.98045825958252, "global_step": 157802, "epoch": 939} {"train_loss": -10.973307609558105, "global_step": 157803, "epoch": 939} {"train_loss": -11.014788627624512, "global_step": 157804, "epoch": 939} {"train_loss": -11.10827350616455, "global_step": 157805, "epoch": 939} {"train_loss": -11.122264862060547, "global_step": 157806, "epoch": 939} {"train_loss": -11.111464500427246, "global_step": 157807, "epoch": 939} {"train_loss": -10.904112815856934, "global_step": 157808, "epoch": 939} {"train_loss": -10.842748641967773, "global_step": 157809, "epoch": 939} {"train_loss": -10.858036994934082, "global_step": 157810, "epoch": 939} {"train_loss": -11.06950855255127, "global_step": 157811, "epoch": 939} {"train_loss": -10.598421096801758, "global_step": 157812, "epoch": 939} {"train_loss": -10.457730293273926, "global_step": 157813, "epoch": 939} {"train_loss": -10.844354629516602, "global_step": 157814, "epoch": 939} {"train_loss": -10.69965934753418, "global_step": 157815, "epoch": 939} {"train_loss": -10.742914199829102, "global_step": 157816, "epoch": 939} {"train_loss": -11.029500961303711, "global_step": 157817, "epoch": 939} {"train_loss": -10.605438232421875, "global_step": 157818, "epoch": 939} {"train_loss": -10.784421920776367, "global_step": 157819, "epoch": 939} {"train_loss": -10.881959915161133, "global_step": 157820, "epoch": 939} {"train_loss": -10.261794090270996, "global_step": 157821, "epoch": 939} {"train_loss": -11.013303756713867, "global_step": 157822, "epoch": 939} {"train_loss": -10.357542991638184, "global_step": 157823, "epoch": 939} {"train_loss": -9.760042190551758, "global_step": 157824, "epoch": 939} {"train_loss": -10.817264556884766, "global_step": 157825, "epoch": 939} {"train_loss": -9.601165771484375, "global_step": 157826, "epoch": 939} {"train_loss": -9.803145408630371, "global_step": 157827, "epoch": 939} {"train_loss": -10.570446014404297, "global_step": 157828, "epoch": 939} {"train_loss": -10.032073020935059, "global_step": 157829, "epoch": 939} {"train_loss": -9.955883026123047, "global_step": 157830, "epoch": 939} {"train_loss": -10.858283042907715, "global_step": 157831, "epoch": 939} {"train_loss": -9.351593017578125, "global_step": 157832, "epoch": 939} {"train_loss": -10.709298133850098, "global_step": 157833, "epoch": 939} {"train_loss": -9.384489059448242, "global_step": 157834, "epoch": 939} {"train_loss": -10.59062385559082, "global_step": 157835, "epoch": 939} {"train_loss": -9.427915573120117, "global_step": 157836, "epoch": 939} {"train_loss": -10.330507278442383, "global_step": 157837, "epoch": 939} {"train_loss": -10.450607299804688, "global_step": 157838, "epoch": 939} {"train_loss": -10.22607135772705, "global_step": 157839, "epoch": 939} {"train_loss": -10.479097366333008, "global_step": 157840, "epoch": 939} {"train_loss": -10.891504287719727, "global_step": 157841, "epoch": 939} {"train_loss": -10.53620719909668, "global_step": 157842, "epoch": 939} {"train_loss": -10.846147537231445, "global_step": 157843, "epoch": 939} {"train_loss": -10.308998107910156, "global_step": 157844, "epoch": 939} {"train_loss": -10.646707534790039, "global_step": 157845, "epoch": 939} {"train_loss": -10.3629789352417, "global_step": 157846, "epoch": 939} {"train_loss": -10.491067886352539, "global_step": 157847, "epoch": 939} {"train_loss": -10.724525451660156, "global_step": 157848, "epoch": 939} {"train_loss": -10.791419982910156, "global_step": 157849, "epoch": 939} {"train_loss": -10.649072647094727, "global_step": 157850, "epoch": 939} {"train_loss": -10.846385955810547, "global_step": 157851, "epoch": 939} {"train_loss": -10.811501502990723, "global_step": 157852, "epoch": 939} {"train_loss": -10.912332534790039, "global_step": 157853, "epoch": 939} {"train_loss": -10.942892074584961, "global_step": 157854, "epoch": 939} {"train_loss": -10.870930671691895, "global_step": 157855, "epoch": 939} {"train_loss": -10.605145454406738, "global_step": 157856, "epoch": 939} {"train_loss": -10.855812072753906, "global_step": 157857, "epoch": 939} {"train_loss": -11.040844917297363, "global_step": 157858, "epoch": 939} {"train_loss": -10.896760940551758, "global_step": 157859, "epoch": 939} {"train_loss": -11.158870697021484, "global_step": 157860, "epoch": 939} {"train_loss": -10.59825611114502, "global_step": 157861, "epoch": 939} {"train_loss": -10.883378028869629, "global_step": 157862, "epoch": 939} {"train_loss": -10.755560874938965, "global_step": 157863, "epoch": 939} {"train_loss": -10.796941757202148, "global_step": 157864, "epoch": 939} {"train_loss": -10.920516014099121, "global_step": 157865, "epoch": 939} {"train_loss": -10.902608871459961, "global_step": 157866, "epoch": 939} {"train_loss": -10.994941711425781, "global_step": 157867, "epoch": 939} {"train_loss": -11.106266975402832, "global_step": 157868, "epoch": 939} {"train_loss": -11.00448226928711, "global_step": 157869, "epoch": 939} {"train_loss": -10.985260009765625, "global_step": 157870, "epoch": 939} {"train_loss": -10.967246055603027, "global_step": 157871, "epoch": 939} {"train_loss": -11.210908889770508, "global_step": 157872, "epoch": 939} {"train_loss": -11.079710006713867, "global_step": 157873, "epoch": 939} {"train_loss": -11.11454963684082, "global_step": 157874, "epoch": 939} {"train_loss": -11.022361755371094, "global_step": 157875, "epoch": 939} {"train_loss": -11.143407821655273, "global_step": 157876, "epoch": 939} {"train_loss": -11.126412391662598, "global_step": 157877, "epoch": 939} {"train_loss": -10.849214553833008, "global_step": 157878, "epoch": 939} {"train_loss": -11.233875274658203, "global_step": 157879, "epoch": 939} {"train_loss": -11.182462692260742, "global_step": 157880, "epoch": 939} {"train_loss": -10.874350547790527, "global_step": 157881, "epoch": 939} {"train_loss": -11.009634017944336, "global_step": 157882, "epoch": 939} {"train_loss": -10.746091842651367, "global_step": 157883, "epoch": 939} {"train_loss": -10.717217445373535, "global_step": 157884, "epoch": 939} {"train_loss": -10.874856948852539, "global_step": 157885, "epoch": 939} {"train_loss": -11.051836013793945, "global_step": 157886, "epoch": 939} {"train_loss": -10.427262306213379, "global_step": 157887, "epoch": 939} {"train_loss": -10.896051406860352, "global_step": 157888, "epoch": 939} {"train_loss": -10.047721862792969, "global_step": 157889, "epoch": 939} {"train_loss": -10.582024574279785, "global_step": 157890, "epoch": 939} {"train_loss": -10.270097732543945, "global_step": 157891, "epoch": 939} {"train_loss": -10.884370803833008, "global_step": 157892, "epoch": 939} {"train_loss": -10.722047805786133, "global_step": 157893, "epoch": 939} {"train_loss": -10.42831802368164, "global_step": 157894, "epoch": 939} {"train_loss": -10.655567169189453, "global_step": 157895, "epoch": 939} {"train_loss": -9.989859580993652, "global_step": 157896, "epoch": 939} {"train_loss": -10.923358917236328, "global_step": 157897, "epoch": 939} {"train_loss": -10.496322631835938, "global_step": 157898, "epoch": 939} {"train_loss": -10.7255277633667, "global_step": 157899, "epoch": 939} {"train_loss": -10.449440002441406, "global_step": 157900, "epoch": 939} {"train_loss": -10.484862327575684, "global_step": 157901, "epoch": 939} {"train_loss": -10.760709762573242, "global_step": 157902, "epoch": 939} {"train_loss": -10.263384819030762, "global_step": 157903, "epoch": 939} {"train_loss": -10.617209434509277, "global_step": 157904, "epoch": 939} {"train_loss": -9.743218421936035, "global_step": 157905, "epoch": 939} {"train_loss": -10.451021194458008, "global_step": 157906, "epoch": 939} {"train_loss": -10.115167617797852, "global_step": 157907, "epoch": 939} {"train_loss": -10.574416160583496, "global_step": 157908, "epoch": 939} {"train_loss": -9.809020042419434, "global_step": 157909, "epoch": 939} {"train_loss": -10.649545669555664, "global_step": 157910, "epoch": 939} {"train_loss": -9.73442554473877, "global_step": 157911, "epoch": 939} {"train_loss": -10.68289852142334, "global_step": 157912, "epoch": 939} {"train_loss": -10.065343856811523, "global_step": 157913, "epoch": 939} {"train_loss": -10.749090194702148, "global_step": 157914, "epoch": 939} {"train_loss": -10.489923477172852, "global_step": 157915, "epoch": 939} {"train_loss": -10.759905815124512, "global_step": 157916, "epoch": 939} {"train_loss": -10.581792831420898, "global_step": 157917, "epoch": 939} {"train_loss": -10.750085830688477, "global_step": 157918, "epoch": 939} {"train_loss": -10.63490190960112, "global_step": 157919, "epoch": 939, "val_loss": 231838.328125} {"train_loss": -10.785184860229492, "global_step": 157920, "epoch": 940} {"train_loss": -10.339361190795898, "global_step": 157921, "epoch": 940} {"train_loss": -10.610368728637695, "global_step": 157922, "epoch": 940} {"train_loss": -10.326461791992188, "global_step": 157923, "epoch": 940} {"train_loss": -10.39732551574707, "global_step": 157924, "epoch": 940} {"train_loss": -10.428403854370117, "global_step": 157925, "epoch": 940} {"train_loss": -10.514093399047852, "global_step": 157926, "epoch": 940} {"train_loss": -10.383369445800781, "global_step": 157927, "epoch": 940} {"train_loss": -10.700162887573242, "global_step": 157928, "epoch": 940} {"train_loss": -10.646865844726562, "global_step": 157929, "epoch": 940} {"train_loss": -10.707947731018066, "global_step": 157930, "epoch": 940} {"train_loss": -11.098034858703613, "global_step": 157931, "epoch": 940} {"train_loss": -10.649566650390625, "global_step": 157932, "epoch": 940} {"train_loss": -10.953760147094727, "global_step": 157933, "epoch": 940} {"train_loss": -10.953409194946289, "global_step": 157934, "epoch": 940} {"train_loss": -10.917945861816406, "global_step": 157935, "epoch": 940} {"train_loss": -10.848907470703125, "global_step": 157936, "epoch": 940} {"train_loss": -10.889551162719727, "global_step": 157937, "epoch": 940} {"train_loss": -11.038829803466797, "global_step": 157938, "epoch": 940} {"train_loss": -10.840499877929688, "global_step": 157939, "epoch": 940} {"train_loss": -10.915143013000488, "global_step": 157940, "epoch": 940} {"train_loss": -10.633947372436523, "global_step": 157941, "epoch": 940} {"train_loss": -11.073765754699707, "global_step": 157942, "epoch": 940} {"train_loss": -11.154009819030762, "global_step": 157943, "epoch": 940} {"train_loss": -11.042241096496582, "global_step": 157944, "epoch": 940} {"train_loss": -11.106414794921875, "global_step": 157945, "epoch": 940} {"train_loss": -11.03154182434082, "global_step": 157946, "epoch": 940} {"train_loss": -10.800392150878906, "global_step": 157947, "epoch": 940} {"train_loss": -10.840887069702148, "global_step": 157948, "epoch": 940} {"train_loss": -11.03286075592041, "global_step": 157949, "epoch": 940} {"train_loss": -10.96414566040039, "global_step": 157950, "epoch": 940} {"train_loss": -10.981285095214844, "global_step": 157951, "epoch": 940} {"train_loss": -11.036832809448242, "global_step": 157952, "epoch": 940} {"train_loss": -10.954751014709473, "global_step": 157953, "epoch": 940} {"train_loss": -11.349641799926758, "global_step": 157954, "epoch": 940} {"train_loss": -10.713578224182129, "global_step": 157955, "epoch": 940} {"train_loss": -10.918289184570312, "global_step": 157956, "epoch": 940} {"train_loss": -11.00955581665039, "global_step": 157957, "epoch": 940} {"train_loss": -10.705187797546387, "global_step": 157958, "epoch": 940} {"train_loss": -10.646631240844727, "global_step": 157959, "epoch": 940} {"train_loss": -11.07365608215332, "global_step": 157960, "epoch": 940} {"train_loss": -10.438016891479492, "global_step": 157961, "epoch": 940} {"train_loss": -10.45083236694336, "global_step": 157962, "epoch": 940} {"train_loss": -11.218683242797852, "global_step": 157963, "epoch": 940} {"train_loss": -10.230205535888672, "global_step": 157964, "epoch": 940} {"train_loss": -10.616673469543457, "global_step": 157965, "epoch": 940} {"train_loss": -11.128547668457031, "global_step": 157966, "epoch": 940} {"train_loss": -10.05490779876709, "global_step": 157967, "epoch": 940} {"train_loss": -11.128284454345703, "global_step": 157968, "epoch": 940} {"train_loss": -10.443710327148438, "global_step": 157969, "epoch": 940} {"train_loss": -10.182201385498047, "global_step": 157970, "epoch": 940} {"train_loss": -10.33926010131836, "global_step": 157971, "epoch": 940} {"train_loss": -10.589212417602539, "global_step": 157972, "epoch": 940} {"train_loss": -10.553201675415039, "global_step": 157973, "epoch": 940} {"train_loss": -10.775702476501465, "global_step": 157974, "epoch": 940} {"train_loss": -9.795689582824707, "global_step": 157975, "epoch": 940} {"train_loss": -10.876657485961914, "global_step": 157976, "epoch": 940} {"train_loss": -10.25126838684082, "global_step": 157977, "epoch": 940} {"train_loss": -10.708366394042969, "global_step": 157978, "epoch": 940} {"train_loss": -10.146588325500488, "global_step": 157979, "epoch": 940} {"train_loss": -10.383400917053223, "global_step": 157980, "epoch": 940} {"train_loss": -9.240620613098145, "global_step": 157981, "epoch": 940} {"train_loss": -10.644303321838379, "global_step": 157982, "epoch": 940} {"train_loss": -9.581687927246094, "global_step": 157983, "epoch": 940} {"train_loss": -10.805719375610352, "global_step": 157984, "epoch": 940} {"train_loss": -10.25395393371582, "global_step": 157985, "epoch": 940} {"train_loss": -11.065674781799316, "global_step": 157986, "epoch": 940} {"train_loss": -10.385786056518555, "global_step": 157987, "epoch": 940} {"train_loss": -10.663204193115234, "global_step": 157988, "epoch": 940} {"train_loss": -10.445979118347168, "global_step": 157989, "epoch": 940} {"train_loss": -10.58017635345459, "global_step": 157990, "epoch": 940} {"train_loss": -10.369827270507812, "global_step": 157991, "epoch": 940} {"train_loss": -10.783552169799805, "global_step": 157992, "epoch": 940} {"train_loss": -10.73360824584961, "global_step": 157993, "epoch": 940} {"train_loss": -10.63726806640625, "global_step": 157994, "epoch": 940} {"train_loss": -10.810720443725586, "global_step": 157995, "epoch": 940} {"train_loss": -10.748404502868652, "global_step": 157996, "epoch": 940} {"train_loss": -10.767959594726562, "global_step": 157997, "epoch": 940} {"train_loss": -10.740888595581055, "global_step": 157998, "epoch": 940} {"train_loss": -10.603959083557129, "global_step": 157999, "epoch": 940} {"train_loss": -10.43419075012207, "global_step": 158000, "epoch": 940} {"train_loss": -10.875574111938477, "global_step": 158001, "epoch": 940} {"train_loss": -10.586784362792969, "global_step": 158002, "epoch": 940} {"train_loss": -10.942665100097656, "global_step": 158003, "epoch": 940} {"train_loss": -10.913159370422363, "global_step": 158004, "epoch": 940} {"train_loss": -10.842127799987793, "global_step": 158005, "epoch": 940} {"train_loss": -10.955779075622559, "global_step": 158006, "epoch": 940} {"train_loss": -11.112330436706543, "global_step": 158007, "epoch": 940} {"train_loss": -10.865174293518066, "global_step": 158008, "epoch": 940} {"train_loss": -11.10962963104248, "global_step": 158009, "epoch": 940} {"train_loss": -11.180929183959961, "global_step": 158010, "epoch": 940} {"train_loss": -10.735326766967773, "global_step": 158011, "epoch": 940} {"train_loss": -10.804120063781738, "global_step": 158012, "epoch": 940} {"train_loss": -10.700684547424316, "global_step": 158013, "epoch": 940} {"train_loss": -10.584676742553711, "global_step": 158014, "epoch": 940} {"train_loss": -10.996073722839355, "global_step": 158015, "epoch": 940} {"train_loss": -10.936870574951172, "global_step": 158016, "epoch": 940} {"train_loss": -10.942697525024414, "global_step": 158017, "epoch": 940} {"train_loss": -11.045851707458496, "global_step": 158018, "epoch": 940} {"train_loss": -10.868605613708496, "global_step": 158019, "epoch": 940} {"train_loss": -10.88075065612793, "global_step": 158020, "epoch": 940} {"train_loss": -10.930949211120605, "global_step": 158021, "epoch": 940} {"train_loss": -11.071149826049805, "global_step": 158022, "epoch": 940} {"train_loss": -11.080766677856445, "global_step": 158023, "epoch": 940} {"train_loss": -10.871622085571289, "global_step": 158024, "epoch": 940} {"train_loss": -11.044675827026367, "global_step": 158025, "epoch": 940} {"train_loss": -11.161210060119629, "global_step": 158026, "epoch": 940} {"train_loss": -10.957620620727539, "global_step": 158027, "epoch": 940} {"train_loss": -11.061497688293457, "global_step": 158028, "epoch": 940} {"train_loss": -11.200517654418945, "global_step": 158029, "epoch": 940} {"train_loss": -10.839147567749023, "global_step": 158030, "epoch": 940} {"train_loss": -11.152923583984375, "global_step": 158031, "epoch": 940} {"train_loss": -10.943130493164062, "global_step": 158032, "epoch": 940} {"train_loss": -11.082881927490234, "global_step": 158033, "epoch": 940} {"train_loss": -11.227278709411621, "global_step": 158034, "epoch": 940} {"train_loss": -10.853191375732422, "global_step": 158035, "epoch": 940} {"train_loss": -11.145606994628906, "global_step": 158036, "epoch": 940} {"train_loss": -11.155776977539062, "global_step": 158037, "epoch": 940} {"train_loss": -11.009361267089844, "global_step": 158038, "epoch": 940} {"train_loss": -11.147207260131836, "global_step": 158039, "epoch": 940} {"train_loss": -11.231195449829102, "global_step": 158040, "epoch": 940} {"train_loss": -11.061798095703125, "global_step": 158041, "epoch": 940} {"train_loss": -11.157026290893555, "global_step": 158042, "epoch": 940} {"train_loss": -11.417099952697754, "global_step": 158043, "epoch": 940} {"train_loss": -11.124862670898438, "global_step": 158044, "epoch": 940} {"train_loss": -11.019155502319336, "global_step": 158045, "epoch": 940} {"train_loss": -11.204919815063477, "global_step": 158046, "epoch": 940} {"train_loss": -11.192375183105469, "global_step": 158047, "epoch": 940} {"train_loss": -10.319561004638672, "global_step": 158048, "epoch": 940} {"train_loss": -9.316631317138672, "global_step": 158049, "epoch": 940} {"train_loss": -10.820706367492676, "global_step": 158050, "epoch": 940} {"train_loss": -10.536245346069336, "global_step": 158051, "epoch": 940} {"train_loss": -9.54658317565918, "global_step": 158052, "epoch": 940} {"train_loss": -10.04025936126709, "global_step": 158053, "epoch": 940} {"train_loss": -10.422636032104492, "global_step": 158054, "epoch": 940} {"train_loss": -9.177613258361816, "global_step": 158055, "epoch": 940} {"train_loss": -9.60387134552002, "global_step": 158056, "epoch": 940} {"train_loss": -10.671623229980469, "global_step": 158057, "epoch": 940} {"train_loss": -9.783910751342773, "global_step": 158058, "epoch": 940} {"train_loss": -10.183355331420898, "global_step": 158059, "epoch": 940} {"train_loss": -10.389703750610352, "global_step": 158060, "epoch": 940} {"train_loss": -10.790046691894531, "global_step": 158061, "epoch": 940} {"train_loss": -10.52971076965332, "global_step": 158062, "epoch": 940} {"train_loss": -10.283439636230469, "global_step": 158063, "epoch": 940} {"train_loss": -10.669448852539062, "global_step": 158064, "epoch": 940} {"train_loss": -10.15856647491455, "global_step": 158065, "epoch": 940} {"train_loss": -10.476065635681152, "global_step": 158066, "epoch": 940} {"train_loss": -10.644819259643555, "global_step": 158067, "epoch": 940} {"train_loss": -10.491883277893066, "global_step": 158068, "epoch": 940} {"train_loss": -10.716228485107422, "global_step": 158069, "epoch": 940} {"train_loss": -10.629546165466309, "global_step": 158070, "epoch": 940} {"train_loss": -10.681528091430664, "global_step": 158071, "epoch": 940} {"train_loss": -10.59549331665039, "global_step": 158072, "epoch": 940} {"train_loss": -10.319113731384277, "global_step": 158073, "epoch": 940} {"train_loss": -10.499524116516113, "global_step": 158074, "epoch": 940} {"train_loss": -10.939691543579102, "global_step": 158075, "epoch": 940} {"train_loss": -10.552314758300781, "global_step": 158076, "epoch": 940} {"train_loss": -10.891368865966797, "global_step": 158077, "epoch": 940} {"train_loss": -10.610776901245117, "global_step": 158078, "epoch": 940} {"train_loss": -10.76177978515625, "global_step": 158079, "epoch": 940} {"train_loss": -10.7342529296875, "global_step": 158080, "epoch": 940} {"train_loss": -10.895835876464844, "global_step": 158081, "epoch": 940} {"train_loss": -10.744844436645508, "global_step": 158082, "epoch": 940} {"train_loss": -11.00936222076416, "global_step": 158083, "epoch": 940} {"train_loss": -10.732500076293945, "global_step": 158084, "epoch": 940} {"train_loss": -10.640481948852539, "global_step": 158085, "epoch": 940} {"train_loss": -10.870216369628906, "global_step": 158086, "epoch": 940} {"train_loss": -10.71790231409527, "global_step": 158087, "epoch": 940, "val_loss": 233549.328125, "train_action_mse_error": 1.4326035976409912} {"train_loss": -10.879987716674805, "global_step": 158088, "epoch": 941} {"train_loss": -10.9744873046875, "global_step": 158089, "epoch": 941} {"train_loss": -11.028421401977539, "global_step": 158090, "epoch": 941} {"train_loss": -11.096719741821289, "global_step": 158091, "epoch": 941} {"train_loss": -11.059319496154785, "global_step": 158092, "epoch": 941} {"train_loss": -10.663843154907227, "global_step": 158093, "epoch": 941} {"train_loss": -11.182060241699219, "global_step": 158094, "epoch": 941} {"train_loss": -10.823007583618164, "global_step": 158095, "epoch": 941} {"train_loss": -11.12622356414795, "global_step": 158096, "epoch": 941} {"train_loss": -10.974708557128906, "global_step": 158097, "epoch": 941} {"train_loss": -11.109874725341797, "global_step": 158098, "epoch": 941} {"train_loss": -11.157243728637695, "global_step": 158099, "epoch": 941} {"train_loss": -11.052634239196777, "global_step": 158100, "epoch": 941} {"train_loss": -11.101537704467773, "global_step": 158101, "epoch": 941} {"train_loss": -11.193302154541016, "global_step": 158102, "epoch": 941} {"train_loss": -11.11582088470459, "global_step": 158103, "epoch": 941} {"train_loss": -10.882862091064453, "global_step": 158104, "epoch": 941} {"train_loss": -11.066125869750977, "global_step": 158105, "epoch": 941} {"train_loss": -11.12009048461914, "global_step": 158106, "epoch": 941} {"train_loss": -10.866820335388184, "global_step": 158107, "epoch": 941} {"train_loss": -10.721105575561523, "global_step": 158108, "epoch": 941} {"train_loss": -11.024114608764648, "global_step": 158109, "epoch": 941} {"train_loss": -10.843856811523438, "global_step": 158110, "epoch": 941} {"train_loss": -10.797980308532715, "global_step": 158111, "epoch": 941} {"train_loss": -10.891267776489258, "global_step": 158112, "epoch": 941} {"train_loss": -10.845687866210938, "global_step": 158113, "epoch": 941} {"train_loss": -10.511449813842773, "global_step": 158114, "epoch": 941} {"train_loss": -10.497980117797852, "global_step": 158115, "epoch": 941} {"train_loss": -11.130653381347656, "global_step": 158116, "epoch": 941} {"train_loss": -10.291933059692383, "global_step": 158117, "epoch": 941} {"train_loss": -10.6564302444458, "global_step": 158118, "epoch": 941} {"train_loss": -10.856176376342773, "global_step": 158119, "epoch": 941} {"train_loss": -10.375926971435547, "global_step": 158120, "epoch": 941} {"train_loss": -10.828457832336426, "global_step": 158121, "epoch": 941} {"train_loss": -10.360152244567871, "global_step": 158122, "epoch": 941} {"train_loss": -10.797012329101562, "global_step": 158123, "epoch": 941} {"train_loss": -10.252540588378906, "global_step": 158124, "epoch": 941} {"train_loss": -10.732995986938477, "global_step": 158125, "epoch": 941} {"train_loss": -10.92043399810791, "global_step": 158126, "epoch": 941} {"train_loss": -10.401708602905273, "global_step": 158127, "epoch": 941} {"train_loss": -10.616695404052734, "global_step": 158128, "epoch": 941} {"train_loss": -10.622541427612305, "global_step": 158129, "epoch": 941} {"train_loss": -10.47800064086914, "global_step": 158130, "epoch": 941} {"train_loss": -10.787775993347168, "global_step": 158131, "epoch": 941} {"train_loss": -10.146932601928711, "global_step": 158132, "epoch": 941} {"train_loss": -10.933622360229492, "global_step": 158133, "epoch": 941} {"train_loss": -10.264141082763672, "global_step": 158134, "epoch": 941} {"train_loss": -10.184431076049805, "global_step": 158135, "epoch": 941} {"train_loss": -10.605409622192383, "global_step": 158136, "epoch": 941} {"train_loss": -10.731678009033203, "global_step": 158137, "epoch": 941} {"train_loss": -10.802665710449219, "global_step": 158138, "epoch": 941} {"train_loss": -10.591867446899414, "global_step": 158139, "epoch": 941} {"train_loss": -10.946795463562012, "global_step": 158140, "epoch": 941} {"train_loss": -10.546974182128906, "global_step": 158141, "epoch": 941} {"train_loss": -10.779211044311523, "global_step": 158142, "epoch": 941} {"train_loss": -10.799917221069336, "global_step": 158143, "epoch": 941} {"train_loss": -10.774503707885742, "global_step": 158144, "epoch": 941} {"train_loss": -10.614701271057129, "global_step": 158145, "epoch": 941} {"train_loss": -10.744121551513672, "global_step": 158146, "epoch": 941} {"train_loss": -10.72515869140625, "global_step": 158147, "epoch": 941} {"train_loss": -10.971939086914062, "global_step": 158148, "epoch": 941} {"train_loss": -10.782264709472656, "global_step": 158149, "epoch": 941} {"train_loss": -11.061407089233398, "global_step": 158150, "epoch": 941} {"train_loss": -10.842453956604004, "global_step": 158151, "epoch": 941} {"train_loss": -11.081624984741211, "global_step": 158152, "epoch": 941} {"train_loss": -11.00904655456543, "global_step": 158153, "epoch": 941} {"train_loss": -10.960397720336914, "global_step": 158154, "epoch": 941} {"train_loss": -10.95427131652832, "global_step": 158155, "epoch": 941} {"train_loss": -10.833555221557617, "global_step": 158156, "epoch": 941} {"train_loss": -10.85982894897461, "global_step": 158157, "epoch": 941} {"train_loss": -11.020674705505371, "global_step": 158158, "epoch": 941} {"train_loss": -10.825698852539062, "global_step": 158159, "epoch": 941} {"train_loss": -11.016985893249512, "global_step": 158160, "epoch": 941} {"train_loss": -10.927963256835938, "global_step": 158161, "epoch": 941} {"train_loss": -10.910027503967285, "global_step": 158162, "epoch": 941} {"train_loss": -10.87612247467041, "global_step": 158163, "epoch": 941} {"train_loss": -10.987848281860352, "global_step": 158164, "epoch": 941} {"train_loss": -11.217973709106445, "global_step": 158165, "epoch": 941} {"train_loss": -11.345196723937988, "global_step": 158166, "epoch": 941} {"train_loss": -11.001014709472656, "global_step": 158167, "epoch": 941} {"train_loss": -11.238880157470703, "global_step": 158168, "epoch": 941} {"train_loss": -10.778388977050781, "global_step": 158169, "epoch": 941} {"train_loss": -11.107038497924805, "global_step": 158170, "epoch": 941} {"train_loss": -11.066564559936523, "global_step": 158171, "epoch": 941} {"train_loss": -11.200185775756836, "global_step": 158172, "epoch": 941} {"train_loss": -10.885517120361328, "global_step": 158173, "epoch": 941} {"train_loss": -10.813035011291504, "global_step": 158174, "epoch": 941} {"train_loss": -11.23202133178711, "global_step": 158175, "epoch": 941} {"train_loss": -11.077274322509766, "global_step": 158176, "epoch": 941} {"train_loss": -11.083760261535645, "global_step": 158177, "epoch": 941} {"train_loss": -10.974588394165039, "global_step": 158178, "epoch": 941} {"train_loss": -10.984845161437988, "global_step": 158179, "epoch": 941} {"train_loss": -10.763486862182617, "global_step": 158180, "epoch": 941} {"train_loss": -10.804845809936523, "global_step": 158181, "epoch": 941} {"train_loss": -10.974821090698242, "global_step": 158182, "epoch": 941} {"train_loss": -11.029888153076172, "global_step": 158183, "epoch": 941} {"train_loss": -11.062479019165039, "global_step": 158184, "epoch": 941} {"train_loss": -11.27434253692627, "global_step": 158185, "epoch": 941} {"train_loss": -11.340847969055176, "global_step": 158186, "epoch": 941} {"train_loss": -11.239381790161133, "global_step": 158187, "epoch": 941} {"train_loss": -11.252439498901367, "global_step": 158188, "epoch": 941} {"train_loss": -11.099149703979492, "global_step": 158189, "epoch": 941} {"train_loss": -11.108863830566406, "global_step": 158190, "epoch": 941} {"train_loss": -10.632864952087402, "global_step": 158191, "epoch": 941} {"train_loss": -11.068183898925781, "global_step": 158192, "epoch": 941} {"train_loss": -11.116254806518555, "global_step": 158193, "epoch": 941} {"train_loss": -10.75332260131836, "global_step": 158194, "epoch": 941} {"train_loss": -10.47500991821289, "global_step": 158195, "epoch": 941} {"train_loss": -10.610045433044434, "global_step": 158196, "epoch": 941} {"train_loss": -10.78486442565918, "global_step": 158197, "epoch": 941} {"train_loss": -10.565605163574219, "global_step": 158198, "epoch": 941} {"train_loss": -10.83462142944336, "global_step": 158199, "epoch": 941} {"train_loss": -10.731375694274902, "global_step": 158200, "epoch": 941} {"train_loss": -10.157153129577637, "global_step": 158201, "epoch": 941} {"train_loss": -10.670621871948242, "global_step": 158202, "epoch": 941} {"train_loss": -10.42110824584961, "global_step": 158203, "epoch": 941} {"train_loss": -9.78079891204834, "global_step": 158204, "epoch": 941} {"train_loss": -9.294949531555176, "global_step": 158205, "epoch": 941} {"train_loss": -9.822602272033691, "global_step": 158206, "epoch": 941} {"train_loss": -7.724635124206543, "global_step": 158207, "epoch": 941} {"train_loss": -8.528816223144531, "global_step": 158208, "epoch": 941} {"train_loss": -9.264337539672852, "global_step": 158209, "epoch": 941} {"train_loss": -7.397158145904541, "global_step": 158210, "epoch": 941} {"train_loss": -8.041461944580078, "global_step": 158211, "epoch": 941} {"train_loss": -6.625419616699219, "global_step": 158212, "epoch": 941} {"train_loss": -8.13514232635498, "global_step": 158213, "epoch": 941} {"train_loss": -7.627837181091309, "global_step": 158214, "epoch": 941} {"train_loss": -8.466718673706055, "global_step": 158215, "epoch": 941} {"train_loss": -8.761783599853516, "global_step": 158216, "epoch": 941} {"train_loss": -8.325345039367676, "global_step": 158217, "epoch": 941} {"train_loss": -8.65365219116211, "global_step": 158218, "epoch": 941} {"train_loss": -9.841442108154297, "global_step": 158219, "epoch": 941} {"train_loss": -8.869564056396484, "global_step": 158220, "epoch": 941} {"train_loss": -8.804130554199219, "global_step": 158221, "epoch": 941} {"train_loss": -9.764297485351562, "global_step": 158222, "epoch": 941} {"train_loss": -9.431998252868652, "global_step": 158223, "epoch": 941} {"train_loss": -9.290288925170898, "global_step": 158224, "epoch": 941} {"train_loss": -10.084312438964844, "global_step": 158225, "epoch": 941} {"train_loss": -9.955368041992188, "global_step": 158226, "epoch": 941} {"train_loss": -9.537574768066406, "global_step": 158227, "epoch": 941} {"train_loss": -9.659217834472656, "global_step": 158228, "epoch": 941} {"train_loss": -10.022796630859375, "global_step": 158229, "epoch": 941} {"train_loss": -10.081119537353516, "global_step": 158230, "epoch": 941} {"train_loss": -9.964075088500977, "global_step": 158231, "epoch": 941} {"train_loss": -9.809157371520996, "global_step": 158232, "epoch": 941} {"train_loss": -9.780778884887695, "global_step": 158233, "epoch": 941} {"train_loss": -10.339242935180664, "global_step": 158234, "epoch": 941} {"train_loss": -10.045347213745117, "global_step": 158235, "epoch": 941} {"train_loss": -10.170722961425781, "global_step": 158236, "epoch": 941} {"train_loss": -10.287261962890625, "global_step": 158237, "epoch": 941} {"train_loss": -10.24654483795166, "global_step": 158238, "epoch": 941} {"train_loss": -10.122627258300781, "global_step": 158239, "epoch": 941} {"train_loss": -10.158029556274414, "global_step": 158240, "epoch": 941} {"train_loss": -10.376056671142578, "global_step": 158241, "epoch": 941} {"train_loss": -10.40682315826416, "global_step": 158242, "epoch": 941} {"train_loss": -10.46552848815918, "global_step": 158243, "epoch": 941} {"train_loss": -10.559131622314453, "global_step": 158244, "epoch": 941} {"train_loss": -10.356634140014648, "global_step": 158245, "epoch": 941} {"train_loss": -10.443059921264648, "global_step": 158246, "epoch": 941} {"train_loss": -10.531469345092773, "global_step": 158247, "epoch": 941} {"train_loss": -10.488381385803223, "global_step": 158248, "epoch": 941} {"train_loss": -10.562318801879883, "global_step": 158249, "epoch": 941} {"train_loss": -10.597221374511719, "global_step": 158250, "epoch": 941} {"train_loss": -10.673506736755371, "global_step": 158251, "epoch": 941} {"train_loss": -10.614396095275879, "global_step": 158252, "epoch": 941} {"train_loss": -10.624628067016602, "global_step": 158253, "epoch": 941} {"train_loss": -10.724417686462402, "global_step": 158254, "epoch": 941} {"train_loss": -10.478364027681804, "global_step": 158255, "epoch": 941, "val_loss": 224122.609375} {"train_loss": -10.748979568481445, "global_step": 158256, "epoch": 942} {"train_loss": -10.765007972717285, "global_step": 158257, "epoch": 942} {"train_loss": -10.752460479736328, "global_step": 158258, "epoch": 942} {"train_loss": -10.734187126159668, "global_step": 158259, "epoch": 942} {"train_loss": -10.865008354187012, "global_step": 158260, "epoch": 942} {"train_loss": -10.730472564697266, "global_step": 158261, "epoch": 942} {"train_loss": -10.962625503540039, "global_step": 158262, "epoch": 942} {"train_loss": -10.992130279541016, "global_step": 158263, "epoch": 942} {"train_loss": -10.886285781860352, "global_step": 158264, "epoch": 942} {"train_loss": -10.877421379089355, "global_step": 158265, "epoch": 942} {"train_loss": -10.75477409362793, "global_step": 158266, "epoch": 942} {"train_loss": -10.887242317199707, "global_step": 158267, "epoch": 942} {"train_loss": -10.904898643493652, "global_step": 158268, "epoch": 942} {"train_loss": -10.702152252197266, "global_step": 158269, "epoch": 942} {"train_loss": -10.886856079101562, "global_step": 158270, "epoch": 942} {"train_loss": -10.90570068359375, "global_step": 158271, "epoch": 942} {"train_loss": -11.015111923217773, "global_step": 158272, "epoch": 942} {"train_loss": -11.148446083068848, "global_step": 158273, "epoch": 942} {"train_loss": -10.998937606811523, "global_step": 158274, "epoch": 942} {"train_loss": -11.153007507324219, "global_step": 158275, "epoch": 942} {"train_loss": -10.897428512573242, "global_step": 158276, "epoch": 942} {"train_loss": -11.113351821899414, "global_step": 158277, "epoch": 942} {"train_loss": -11.139827728271484, "global_step": 158278, "epoch": 942} {"train_loss": -11.156332015991211, "global_step": 158279, "epoch": 942} {"train_loss": -11.035070419311523, "global_step": 158280, "epoch": 942} {"train_loss": -10.948724746704102, "global_step": 158281, "epoch": 942} {"train_loss": -11.16457462310791, "global_step": 158282, "epoch": 942} {"train_loss": -11.070623397827148, "global_step": 158283, "epoch": 942} {"train_loss": -11.109424591064453, "global_step": 158284, "epoch": 942} {"train_loss": -10.989503860473633, "global_step": 158285, "epoch": 942} {"train_loss": -11.02140998840332, "global_step": 158286, "epoch": 942} {"train_loss": -11.08119010925293, "global_step": 158287, "epoch": 942} {"train_loss": -11.006937026977539, "global_step": 158288, "epoch": 942} {"train_loss": -11.018224716186523, "global_step": 158289, "epoch": 942} {"train_loss": -10.884114265441895, "global_step": 158290, "epoch": 942} {"train_loss": -10.844435691833496, "global_step": 158291, "epoch": 942} {"train_loss": -11.456437110900879, "global_step": 158292, "epoch": 942} {"train_loss": -10.870702743530273, "global_step": 158293, "epoch": 942} {"train_loss": -11.115543365478516, "global_step": 158294, "epoch": 942} {"train_loss": -11.085067749023438, "global_step": 158295, "epoch": 942} {"train_loss": -11.224699020385742, "global_step": 158296, "epoch": 942} {"train_loss": -10.944230079650879, "global_step": 158297, "epoch": 942} {"train_loss": -10.474906921386719, "global_step": 158298, "epoch": 942} {"train_loss": -10.954231262207031, "global_step": 158299, "epoch": 942} {"train_loss": -11.20335865020752, "global_step": 158300, "epoch": 942} {"train_loss": -10.827357292175293, "global_step": 158301, "epoch": 942} {"train_loss": -10.628811836242676, "global_step": 158302, "epoch": 942} {"train_loss": -10.485639572143555, "global_step": 158303, "epoch": 942} {"train_loss": -10.16252613067627, "global_step": 158304, "epoch": 942} {"train_loss": -11.249052047729492, "global_step": 158305, "epoch": 942} {"train_loss": -10.33976936340332, "global_step": 158306, "epoch": 942} {"train_loss": -10.430763244628906, "global_step": 158307, "epoch": 942} {"train_loss": -10.479249954223633, "global_step": 158308, "epoch": 942} {"train_loss": -10.54619026184082, "global_step": 158309, "epoch": 942} {"train_loss": -10.456003189086914, "global_step": 158310, "epoch": 942} {"train_loss": -10.749916076660156, "global_step": 158311, "epoch": 942} {"train_loss": -10.608476638793945, "global_step": 158312, "epoch": 942} {"train_loss": -9.837785720825195, "global_step": 158313, "epoch": 942} {"train_loss": -10.930156707763672, "global_step": 158314, "epoch": 942} {"train_loss": -10.111228942871094, "global_step": 158315, "epoch": 942} {"train_loss": -10.986405372619629, "global_step": 158316, "epoch": 942} {"train_loss": -10.753734588623047, "global_step": 158317, "epoch": 942} {"train_loss": -9.927098274230957, "global_step": 158318, "epoch": 942} {"train_loss": -10.660253524780273, "global_step": 158319, "epoch": 942} {"train_loss": -10.326972961425781, "global_step": 158320, "epoch": 942} {"train_loss": -10.452616691589355, "global_step": 158321, "epoch": 942} {"train_loss": -10.237977027893066, "global_step": 158322, "epoch": 942} {"train_loss": -10.617331504821777, "global_step": 158323, "epoch": 942} {"train_loss": -10.565508842468262, "global_step": 158324, "epoch": 942} {"train_loss": -10.256227493286133, "global_step": 158325, "epoch": 942} {"train_loss": -10.9085111618042, "global_step": 158326, "epoch": 942} {"train_loss": -10.356803894042969, "global_step": 158327, "epoch": 942} {"train_loss": -10.680302619934082, "global_step": 158328, "epoch": 942} {"train_loss": -10.750551223754883, "global_step": 158329, "epoch": 942} {"train_loss": -10.753137588500977, "global_step": 158330, "epoch": 942} {"train_loss": -10.511676788330078, "global_step": 158331, "epoch": 942} {"train_loss": -10.765541076660156, "global_step": 158332, "epoch": 942} {"train_loss": -10.846014022827148, "global_step": 158333, "epoch": 942} {"train_loss": -10.778341293334961, "global_step": 158334, "epoch": 942} {"train_loss": -10.748035430908203, "global_step": 158335, "epoch": 942} {"train_loss": -10.82144546508789, "global_step": 158336, "epoch": 942} {"train_loss": -10.603036880493164, "global_step": 158337, "epoch": 942} {"train_loss": -11.093184471130371, "global_step": 158338, "epoch": 942} {"train_loss": -10.502821922302246, "global_step": 158339, "epoch": 942} {"train_loss": -10.807266235351562, "global_step": 158340, "epoch": 942} {"train_loss": -10.494833946228027, "global_step": 158341, "epoch": 942} {"train_loss": -10.822375297546387, "global_step": 158342, "epoch": 942} {"train_loss": -10.5594482421875, "global_step": 158343, "epoch": 942} {"train_loss": -10.89087200164795, "global_step": 158344, "epoch": 942} {"train_loss": -10.759681701660156, "global_step": 158345, "epoch": 942} {"train_loss": -10.821784019470215, "global_step": 158346, "epoch": 942} {"train_loss": -11.013648986816406, "global_step": 158347, "epoch": 942} {"train_loss": -10.68758773803711, "global_step": 158348, "epoch": 942} {"train_loss": -10.609281539916992, "global_step": 158349, "epoch": 942} {"train_loss": -10.853067398071289, "global_step": 158350, "epoch": 942} {"train_loss": -10.724752426147461, "global_step": 158351, "epoch": 942} {"train_loss": -11.091712951660156, "global_step": 158352, "epoch": 942} {"train_loss": -10.80974006652832, "global_step": 158353, "epoch": 942} {"train_loss": -10.923185348510742, "global_step": 158354, "epoch": 942} {"train_loss": -10.889307022094727, "global_step": 158355, "epoch": 942} {"train_loss": -10.802559852600098, "global_step": 158356, "epoch": 942} {"train_loss": -11.072443008422852, "global_step": 158357, "epoch": 942} {"train_loss": -10.900402069091797, "global_step": 158358, "epoch": 942} {"train_loss": -11.018155097961426, "global_step": 158359, "epoch": 942} {"train_loss": -10.887956619262695, "global_step": 158360, "epoch": 942} {"train_loss": -10.999669075012207, "global_step": 158361, "epoch": 942} {"train_loss": -10.734052658081055, "global_step": 158362, "epoch": 942} {"train_loss": -10.947147369384766, "global_step": 158363, "epoch": 942} {"train_loss": -10.605484008789062, "global_step": 158364, "epoch": 942} {"train_loss": -10.879655838012695, "global_step": 158365, "epoch": 942} {"train_loss": -10.442160606384277, "global_step": 158366, "epoch": 942} {"train_loss": -10.83734130859375, "global_step": 158367, "epoch": 942} {"train_loss": -10.656612396240234, "global_step": 158368, "epoch": 942} {"train_loss": -10.602851867675781, "global_step": 158369, "epoch": 942} {"train_loss": -10.710031509399414, "global_step": 158370, "epoch": 942} {"train_loss": -10.833541870117188, "global_step": 158371, "epoch": 942} {"train_loss": -10.975301742553711, "global_step": 158372, "epoch": 942} {"train_loss": -10.830528259277344, "global_step": 158373, "epoch": 942} {"train_loss": -10.928885459899902, "global_step": 158374, "epoch": 942} {"train_loss": -10.794452667236328, "global_step": 158375, "epoch": 942} {"train_loss": -10.776470184326172, "global_step": 158376, "epoch": 942} {"train_loss": -10.73094367980957, "global_step": 158377, "epoch": 942} {"train_loss": -10.881861686706543, "global_step": 158378, "epoch": 942} {"train_loss": -10.977533340454102, "global_step": 158379, "epoch": 942} {"train_loss": -11.101545333862305, "global_step": 158380, "epoch": 942} {"train_loss": -10.770669937133789, "global_step": 158381, "epoch": 942} {"train_loss": -10.744693756103516, "global_step": 158382, "epoch": 942} {"train_loss": -10.88284969329834, "global_step": 158383, "epoch": 942} {"train_loss": -10.091757774353027, "global_step": 158384, "epoch": 942} {"train_loss": -11.05978012084961, "global_step": 158385, "epoch": 942} {"train_loss": -10.667760848999023, "global_step": 158386, "epoch": 942} {"train_loss": -11.033232688903809, "global_step": 158387, "epoch": 942} {"train_loss": -10.64528751373291, "global_step": 158388, "epoch": 942} {"train_loss": -10.53421401977539, "global_step": 158389, "epoch": 942} {"train_loss": -10.602031707763672, "global_step": 158390, "epoch": 942} {"train_loss": -10.184662818908691, "global_step": 158391, "epoch": 942} {"train_loss": -10.116174697875977, "global_step": 158392, "epoch": 942} {"train_loss": -9.358179092407227, "global_step": 158393, "epoch": 942} {"train_loss": -10.116997718811035, "global_step": 158394, "epoch": 942} {"train_loss": -10.23477840423584, "global_step": 158395, "epoch": 942} {"train_loss": -9.825700759887695, "global_step": 158396, "epoch": 942} {"train_loss": -10.434167861938477, "global_step": 158397, "epoch": 942} {"train_loss": -10.260334014892578, "global_step": 158398, "epoch": 942} {"train_loss": -10.006847381591797, "global_step": 158399, "epoch": 942} {"train_loss": -10.909990310668945, "global_step": 158400, "epoch": 942} {"train_loss": -10.086686134338379, "global_step": 158401, "epoch": 942} {"train_loss": -10.67280101776123, "global_step": 158402, "epoch": 942} {"train_loss": -10.541744232177734, "global_step": 158403, "epoch": 942} {"train_loss": -10.105377197265625, "global_step": 158404, "epoch": 942} {"train_loss": -10.362955093383789, "global_step": 158405, "epoch": 942} {"train_loss": -10.389636993408203, "global_step": 158406, "epoch": 942} {"train_loss": -10.322835922241211, "global_step": 158407, "epoch": 942} {"train_loss": -10.774535179138184, "global_step": 158408, "epoch": 942} {"train_loss": -10.215338706970215, "global_step": 158409, "epoch": 942} {"train_loss": -10.504475593566895, "global_step": 158410, "epoch": 942} {"train_loss": -10.567614555358887, "global_step": 158411, "epoch": 942} {"train_loss": -10.366793632507324, "global_step": 158412, "epoch": 942} {"train_loss": -10.522941589355469, "global_step": 158413, "epoch": 942} {"train_loss": -10.634604454040527, "global_step": 158414, "epoch": 942} {"train_loss": -10.489126205444336, "global_step": 158415, "epoch": 942} {"train_loss": -10.599666595458984, "global_step": 158416, "epoch": 942} {"train_loss": -10.664040565490723, "global_step": 158417, "epoch": 942} {"train_loss": -10.403975486755371, "global_step": 158418, "epoch": 942} {"train_loss": -10.393885612487793, "global_step": 158419, "epoch": 942} {"train_loss": -10.221870422363281, "global_step": 158420, "epoch": 942} {"train_loss": -10.431312561035156, "global_step": 158421, "epoch": 942} {"train_loss": -10.508612632751465, "global_step": 158422, "epoch": 942} {"train_loss": -10.708553450448173, "global_step": 158423, "epoch": 942, "val_loss": 233886.734375} {"train_loss": -10.298945426940918, "global_step": 158424, "epoch": 943} {"train_loss": -10.637598037719727, "global_step": 158425, "epoch": 943} {"train_loss": -10.651334762573242, "global_step": 158426, "epoch": 943} {"train_loss": -10.856050491333008, "global_step": 158427, "epoch": 943} {"train_loss": -10.612772941589355, "global_step": 158428, "epoch": 943} {"train_loss": -10.495847702026367, "global_step": 158429, "epoch": 943} {"train_loss": -10.372664451599121, "global_step": 158430, "epoch": 943} {"train_loss": -10.74789047241211, "global_step": 158431, "epoch": 943} {"train_loss": -10.678818702697754, "global_step": 158432, "epoch": 943} {"train_loss": -10.372537612915039, "global_step": 158433, "epoch": 943} {"train_loss": -10.727982521057129, "global_step": 158434, "epoch": 943} {"train_loss": -10.877046585083008, "global_step": 158435, "epoch": 943} {"train_loss": -10.742424011230469, "global_step": 158436, "epoch": 943} {"train_loss": -11.05245304107666, "global_step": 158437, "epoch": 943} {"train_loss": -10.707160949707031, "global_step": 158438, "epoch": 943} {"train_loss": -10.741640090942383, "global_step": 158439, "epoch": 943} {"train_loss": -10.94333267211914, "global_step": 158440, "epoch": 943} {"train_loss": -10.593050003051758, "global_step": 158441, "epoch": 943} {"train_loss": -10.977521896362305, "global_step": 158442, "epoch": 943} {"train_loss": -10.971031188964844, "global_step": 158443, "epoch": 943} {"train_loss": -10.910808563232422, "global_step": 158444, "epoch": 943} {"train_loss": -11.16244888305664, "global_step": 158445, "epoch": 943} {"train_loss": -11.031896591186523, "global_step": 158446, "epoch": 943} {"train_loss": -10.844921112060547, "global_step": 158447, "epoch": 943} {"train_loss": -10.919898986816406, "global_step": 158448, "epoch": 943} {"train_loss": -10.811419486999512, "global_step": 158449, "epoch": 943} {"train_loss": -10.66332721710205, "global_step": 158450, "epoch": 943} {"train_loss": -10.867836952209473, "global_step": 158451, "epoch": 943} {"train_loss": -10.592878341674805, "global_step": 158452, "epoch": 943} {"train_loss": -10.60697078704834, "global_step": 158453, "epoch": 943} {"train_loss": -10.594474792480469, "global_step": 158454, "epoch": 943} {"train_loss": -10.731490135192871, "global_step": 158455, "epoch": 943} {"train_loss": -10.824983596801758, "global_step": 158456, "epoch": 943} {"train_loss": -10.624262809753418, "global_step": 158457, "epoch": 943} {"train_loss": -10.667890548706055, "global_step": 158458, "epoch": 943} {"train_loss": -10.287216186523438, "global_step": 158459, "epoch": 943} {"train_loss": -10.282011032104492, "global_step": 158460, "epoch": 943} {"train_loss": -10.88463020324707, "global_step": 158461, "epoch": 943} {"train_loss": -10.603612899780273, "global_step": 158462, "epoch": 943} {"train_loss": -11.005447387695312, "global_step": 158463, "epoch": 943} {"train_loss": -10.731813430786133, "global_step": 158464, "epoch": 943} {"train_loss": -10.855573654174805, "global_step": 158465, "epoch": 943} {"train_loss": -10.618095397949219, "global_step": 158466, "epoch": 943} {"train_loss": -11.101444244384766, "global_step": 158467, "epoch": 943} {"train_loss": -10.996419906616211, "global_step": 158468, "epoch": 943} {"train_loss": -10.801084518432617, "global_step": 158469, "epoch": 943} {"train_loss": -10.979436874389648, "global_step": 158470, "epoch": 943} {"train_loss": -10.985166549682617, "global_step": 158471, "epoch": 943} {"train_loss": -11.17486572265625, "global_step": 158472, "epoch": 943} {"train_loss": -10.988526344299316, "global_step": 158473, "epoch": 943} {"train_loss": -11.109437942504883, "global_step": 158474, "epoch": 943} {"train_loss": -11.179804801940918, "global_step": 158475, "epoch": 943} {"train_loss": -11.201231956481934, "global_step": 158476, "epoch": 943} {"train_loss": -11.104829788208008, "global_step": 158477, "epoch": 943} {"train_loss": -10.981687545776367, "global_step": 158478, "epoch": 943} {"train_loss": -10.996204376220703, "global_step": 158479, "epoch": 943} {"train_loss": -11.007915496826172, "global_step": 158480, "epoch": 943} {"train_loss": -10.826468467712402, "global_step": 158481, "epoch": 943} {"train_loss": -11.058183670043945, "global_step": 158482, "epoch": 943} {"train_loss": -10.979717254638672, "global_step": 158483, "epoch": 943} {"train_loss": -11.207904815673828, "global_step": 158484, "epoch": 943} {"train_loss": -11.17447280883789, "global_step": 158485, "epoch": 943} {"train_loss": -10.81462287902832, "global_step": 158486, "epoch": 943} {"train_loss": -11.067011833190918, "global_step": 158487, "epoch": 943} {"train_loss": -10.985980987548828, "global_step": 158488, "epoch": 943} {"train_loss": -11.111509323120117, "global_step": 158489, "epoch": 943} {"train_loss": -10.972408294677734, "global_step": 158490, "epoch": 943} {"train_loss": -11.105018615722656, "global_step": 158491, "epoch": 943} {"train_loss": -11.022850036621094, "global_step": 158492, "epoch": 943} {"train_loss": -11.081291198730469, "global_step": 158493, "epoch": 943} {"train_loss": -11.182165145874023, "global_step": 158494, "epoch": 943} {"train_loss": -10.898090362548828, "global_step": 158495, "epoch": 943} {"train_loss": -10.981168746948242, "global_step": 158496, "epoch": 943} {"train_loss": -11.03783893585205, "global_step": 158497, "epoch": 943} {"train_loss": -10.85561752319336, "global_step": 158498, "epoch": 943} {"train_loss": -10.872095108032227, "global_step": 158499, "epoch": 943} {"train_loss": -11.080699920654297, "global_step": 158500, "epoch": 943} {"train_loss": -10.860000610351562, "global_step": 158501, "epoch": 943} {"train_loss": -10.904751777648926, "global_step": 158502, "epoch": 943} {"train_loss": -11.135560989379883, "global_step": 158503, "epoch": 943} {"train_loss": -10.84830093383789, "global_step": 158504, "epoch": 943} {"train_loss": -11.357318878173828, "global_step": 158505, "epoch": 943} {"train_loss": -11.246210098266602, "global_step": 158506, "epoch": 943} {"train_loss": -11.1429443359375, "global_step": 158507, "epoch": 943} {"train_loss": -10.922311782836914, "global_step": 158508, "epoch": 943} {"train_loss": -11.10162353515625, "global_step": 158509, "epoch": 943} {"train_loss": -10.91547679901123, "global_step": 158510, "epoch": 943} {"train_loss": -11.093235969543457, "global_step": 158511, "epoch": 943} {"train_loss": -11.262940406799316, "global_step": 158512, "epoch": 943} {"train_loss": -11.030097007751465, "global_step": 158513, "epoch": 943} {"train_loss": -10.851852416992188, "global_step": 158514, "epoch": 943} {"train_loss": -10.541637420654297, "global_step": 158515, "epoch": 943} {"train_loss": -10.092181205749512, "global_step": 158516, "epoch": 943} {"train_loss": -10.218076705932617, "global_step": 158517, "epoch": 943} {"train_loss": -11.083906173706055, "global_step": 158518, "epoch": 943} {"train_loss": -9.931846618652344, "global_step": 158519, "epoch": 943} {"train_loss": -10.47556209564209, "global_step": 158520, "epoch": 943} {"train_loss": -10.47293472290039, "global_step": 158521, "epoch": 943} {"train_loss": -9.473918914794922, "global_step": 158522, "epoch": 943} {"train_loss": -10.697540283203125, "global_step": 158523, "epoch": 943} {"train_loss": -8.920787811279297, "global_step": 158524, "epoch": 943} {"train_loss": -10.54949951171875, "global_step": 158525, "epoch": 943} {"train_loss": -9.177350044250488, "global_step": 158526, "epoch": 943} {"train_loss": -10.136153221130371, "global_step": 158527, "epoch": 943} {"train_loss": -9.948456764221191, "global_step": 158528, "epoch": 943} {"train_loss": -10.318525314331055, "global_step": 158529, "epoch": 943} {"train_loss": -9.857076644897461, "global_step": 158530, "epoch": 943} {"train_loss": -10.223471641540527, "global_step": 158531, "epoch": 943} {"train_loss": -10.277406692504883, "global_step": 158532, "epoch": 943} {"train_loss": -10.515225410461426, "global_step": 158533, "epoch": 943} {"train_loss": -10.28191089630127, "global_step": 158534, "epoch": 943} {"train_loss": -10.237561225891113, "global_step": 158535, "epoch": 943} {"train_loss": -10.450028419494629, "global_step": 158536, "epoch": 943} {"train_loss": -10.428586959838867, "global_step": 158537, "epoch": 943} {"train_loss": -10.633007049560547, "global_step": 158538, "epoch": 943} {"train_loss": -10.672602653503418, "global_step": 158539, "epoch": 943} {"train_loss": -10.182402610778809, "global_step": 158540, "epoch": 943} {"train_loss": -10.792213439941406, "global_step": 158541, "epoch": 943} {"train_loss": -10.332722663879395, "global_step": 158542, "epoch": 943} {"train_loss": -10.68824577331543, "global_step": 158543, "epoch": 943} {"train_loss": -10.219451904296875, "global_step": 158544, "epoch": 943} {"train_loss": -10.632237434387207, "global_step": 158545, "epoch": 943} {"train_loss": -10.403264999389648, "global_step": 158546, "epoch": 943} {"train_loss": -10.93746280670166, "global_step": 158547, "epoch": 943} {"train_loss": -10.627376556396484, "global_step": 158548, "epoch": 943} {"train_loss": -10.777620315551758, "global_step": 158549, "epoch": 943} {"train_loss": -10.794846534729004, "global_step": 158550, "epoch": 943} {"train_loss": -10.781051635742188, "global_step": 158551, "epoch": 943} {"train_loss": -10.646831512451172, "global_step": 158552, "epoch": 943} {"train_loss": -10.519137382507324, "global_step": 158553, "epoch": 943} {"train_loss": -10.720353126525879, "global_step": 158554, "epoch": 943} {"train_loss": -10.874076843261719, "global_step": 158555, "epoch": 943} {"train_loss": -11.007840156555176, "global_step": 158556, "epoch": 943} {"train_loss": -10.343894958496094, "global_step": 158557, "epoch": 943} {"train_loss": -10.951683044433594, "global_step": 158558, "epoch": 943} {"train_loss": -10.674145698547363, "global_step": 158559, "epoch": 943} {"train_loss": -10.760910987854004, "global_step": 158560, "epoch": 943} {"train_loss": -10.834312438964844, "global_step": 158561, "epoch": 943} {"train_loss": -10.791364669799805, "global_step": 158562, "epoch": 943} {"train_loss": -10.477169036865234, "global_step": 158563, "epoch": 943} {"train_loss": -10.733893394470215, "global_step": 158564, "epoch": 943} {"train_loss": -10.677967071533203, "global_step": 158565, "epoch": 943} {"train_loss": -10.596549987792969, "global_step": 158566, "epoch": 943} {"train_loss": -10.46017837524414, "global_step": 158567, "epoch": 943} {"train_loss": -10.791947364807129, "global_step": 158568, "epoch": 943} {"train_loss": -10.538797378540039, "global_step": 158569, "epoch": 943} {"train_loss": -10.861061096191406, "global_step": 158570, "epoch": 943} {"train_loss": -10.629380226135254, "global_step": 158571, "epoch": 943} {"train_loss": -10.731772422790527, "global_step": 158572, "epoch": 943} {"train_loss": -10.638813018798828, "global_step": 158573, "epoch": 943} {"train_loss": -10.771292686462402, "global_step": 158574, "epoch": 943} {"train_loss": -10.699483871459961, "global_step": 158575, "epoch": 943} {"train_loss": -10.864324569702148, "global_step": 158576, "epoch": 943} {"train_loss": -10.899187088012695, "global_step": 158577, "epoch": 943} {"train_loss": -10.94741439819336, "global_step": 158578, "epoch": 943} {"train_loss": -10.723526954650879, "global_step": 158579, "epoch": 943} {"train_loss": -10.887561798095703, "global_step": 158580, "epoch": 943} {"train_loss": -10.833757400512695, "global_step": 158581, "epoch": 943} {"train_loss": -10.853662490844727, "global_step": 158582, "epoch": 943} {"train_loss": -11.088910102844238, "global_step": 158583, "epoch": 943} {"train_loss": -11.011054039001465, "global_step": 158584, "epoch": 943} {"train_loss": -11.084135055541992, "global_step": 158585, "epoch": 943} {"train_loss": -10.990214347839355, "global_step": 158586, "epoch": 943} {"train_loss": -11.011103630065918, "global_step": 158587, "epoch": 943} {"train_loss": -10.939196586608887, "global_step": 158588, "epoch": 943} {"train_loss": -11.191547393798828, "global_step": 158589, "epoch": 943} {"train_loss": -10.751749038696289, "global_step": 158590, "epoch": 943} {"train_loss": -10.747952682631356, "global_step": 158591, "epoch": 943, "val_loss": 233940.078125} {"train_loss": -10.981855392456055, "global_step": 158592, "epoch": 944} {"train_loss": -11.124706268310547, "global_step": 158593, "epoch": 944} {"train_loss": -11.062051773071289, "global_step": 158594, "epoch": 944} {"train_loss": -10.811708450317383, "global_step": 158595, "epoch": 944} {"train_loss": -10.94855785369873, "global_step": 158596, "epoch": 944} {"train_loss": -10.638360977172852, "global_step": 158597, "epoch": 944} {"train_loss": -11.064971923828125, "global_step": 158598, "epoch": 944} {"train_loss": -10.851007461547852, "global_step": 158599, "epoch": 944} {"train_loss": -11.184160232543945, "global_step": 158600, "epoch": 944} {"train_loss": -10.699463844299316, "global_step": 158601, "epoch": 944} {"train_loss": -10.999407768249512, "global_step": 158602, "epoch": 944} {"train_loss": -10.669598579406738, "global_step": 158603, "epoch": 944} {"train_loss": -10.899484634399414, "global_step": 158604, "epoch": 944} {"train_loss": -11.029678344726562, "global_step": 158605, "epoch": 944} {"train_loss": -10.74612045288086, "global_step": 158606, "epoch": 944} {"train_loss": -11.042322158813477, "global_step": 158607, "epoch": 944} {"train_loss": -10.492050170898438, "global_step": 158608, "epoch": 944} {"train_loss": -10.7623291015625, "global_step": 158609, "epoch": 944} {"train_loss": -10.20124340057373, "global_step": 158610, "epoch": 944} {"train_loss": -9.574241638183594, "global_step": 158611, "epoch": 944} {"train_loss": -10.09988021850586, "global_step": 158612, "epoch": 944} {"train_loss": -10.4029541015625, "global_step": 158613, "epoch": 944} {"train_loss": -10.36579418182373, "global_step": 158614, "epoch": 944} {"train_loss": -10.145989418029785, "global_step": 158615, "epoch": 944} {"train_loss": -10.044332504272461, "global_step": 158616, "epoch": 944} {"train_loss": -9.477930068969727, "global_step": 158617, "epoch": 944} {"train_loss": -10.171106338500977, "global_step": 158618, "epoch": 944} {"train_loss": -9.484355926513672, "global_step": 158619, "epoch": 944} {"train_loss": -10.53795337677002, "global_step": 158620, "epoch": 944} {"train_loss": -9.90194320678711, "global_step": 158621, "epoch": 944} {"train_loss": -10.104034423828125, "global_step": 158622, "epoch": 944} {"train_loss": -10.557518005371094, "global_step": 158623, "epoch": 944} {"train_loss": -10.39531135559082, "global_step": 158624, "epoch": 944} {"train_loss": -10.702478408813477, "global_step": 158625, "epoch": 944} {"train_loss": -10.704893112182617, "global_step": 158626, "epoch": 944} {"train_loss": -10.17855167388916, "global_step": 158627, "epoch": 944} {"train_loss": -10.425017356872559, "global_step": 158628, "epoch": 944} {"train_loss": -10.399345397949219, "global_step": 158629, "epoch": 944} {"train_loss": -9.993365287780762, "global_step": 158630, "epoch": 944} {"train_loss": -10.85896110534668, "global_step": 158631, "epoch": 944} {"train_loss": -10.205068588256836, "global_step": 158632, "epoch": 944} {"train_loss": -10.46068000793457, "global_step": 158633, "epoch": 944} {"train_loss": -10.494955062866211, "global_step": 158634, "epoch": 944} {"train_loss": -10.131683349609375, "global_step": 158635, "epoch": 944} {"train_loss": -10.60120677947998, "global_step": 158636, "epoch": 944} {"train_loss": -10.62697982788086, "global_step": 158637, "epoch": 944} {"train_loss": -10.512228965759277, "global_step": 158638, "epoch": 944} {"train_loss": -10.778620719909668, "global_step": 158639, "epoch": 944} {"train_loss": -10.673858642578125, "global_step": 158640, "epoch": 944} {"train_loss": -10.64829158782959, "global_step": 158641, "epoch": 944} {"train_loss": -10.848548889160156, "global_step": 158642, "epoch": 944} {"train_loss": -10.561589241027832, "global_step": 158643, "epoch": 944} {"train_loss": -10.719988822937012, "global_step": 158644, "epoch": 944} {"train_loss": -10.915998458862305, "global_step": 158645, "epoch": 944} {"train_loss": -10.519964218139648, "global_step": 158646, "epoch": 944} {"train_loss": -10.93419361114502, "global_step": 158647, "epoch": 944} {"train_loss": -10.805665969848633, "global_step": 158648, "epoch": 944} {"train_loss": -10.734601974487305, "global_step": 158649, "epoch": 944} {"train_loss": -10.806861877441406, "global_step": 158650, "epoch": 944} {"train_loss": -10.956504821777344, "global_step": 158651, "epoch": 944} {"train_loss": -10.971611022949219, "global_step": 158652, "epoch": 944} {"train_loss": -10.71358585357666, "global_step": 158653, "epoch": 944} {"train_loss": -11.128596305847168, "global_step": 158654, "epoch": 944} {"train_loss": -10.729351043701172, "global_step": 158655, "epoch": 944} {"train_loss": -10.942560195922852, "global_step": 158656, "epoch": 944} {"train_loss": -10.596883773803711, "global_step": 158657, "epoch": 944} {"train_loss": -10.972569465637207, "global_step": 158658, "epoch": 944} {"train_loss": -10.953348159790039, "global_step": 158659, "epoch": 944} {"train_loss": -10.996371269226074, "global_step": 158660, "epoch": 944} {"train_loss": -10.774995803833008, "global_step": 158661, "epoch": 944} {"train_loss": -11.164300918579102, "global_step": 158662, "epoch": 944} {"train_loss": -11.20801067352295, "global_step": 158663, "epoch": 944} {"train_loss": -11.118294715881348, "global_step": 158664, "epoch": 944} {"train_loss": -11.015018463134766, "global_step": 158665, "epoch": 944} {"train_loss": -11.171923637390137, "global_step": 158666, "epoch": 944} {"train_loss": -10.983497619628906, "global_step": 158667, "epoch": 944} {"train_loss": -11.309629440307617, "global_step": 158668, "epoch": 944} {"train_loss": -11.23841667175293, "global_step": 158669, "epoch": 944} {"train_loss": -11.135171890258789, "global_step": 158670, "epoch": 944} {"train_loss": -10.984291076660156, "global_step": 158671, "epoch": 944} {"train_loss": -11.30378532409668, "global_step": 158672, "epoch": 944} {"train_loss": -11.031148910522461, "global_step": 158673, "epoch": 944} {"train_loss": -11.161853790283203, "global_step": 158674, "epoch": 944} {"train_loss": -11.068353652954102, "global_step": 158675, "epoch": 944} {"train_loss": -11.246480941772461, "global_step": 158676, "epoch": 944} {"train_loss": -11.021671295166016, "global_step": 158677, "epoch": 944} {"train_loss": -10.904495239257812, "global_step": 158678, "epoch": 944} {"train_loss": -11.176063537597656, "global_step": 158679, "epoch": 944} {"train_loss": -10.76530933380127, "global_step": 158680, "epoch": 944} {"train_loss": -10.80072021484375, "global_step": 158681, "epoch": 944} {"train_loss": -10.895219802856445, "global_step": 158682, "epoch": 944} {"train_loss": -10.84084415435791, "global_step": 158683, "epoch": 944} {"train_loss": -10.44312858581543, "global_step": 158684, "epoch": 944} {"train_loss": -10.839075088500977, "global_step": 158685, "epoch": 944} {"train_loss": -10.686731338500977, "global_step": 158686, "epoch": 944} {"train_loss": -10.334403991699219, "global_step": 158687, "epoch": 944} {"train_loss": -10.378668785095215, "global_step": 158688, "epoch": 944} {"train_loss": -10.954545974731445, "global_step": 158689, "epoch": 944} {"train_loss": -10.435590744018555, "global_step": 158690, "epoch": 944} {"train_loss": -10.510110855102539, "global_step": 158691, "epoch": 944} {"train_loss": -10.823698043823242, "global_step": 158692, "epoch": 944} {"train_loss": -10.267792701721191, "global_step": 158693, "epoch": 944} {"train_loss": -10.257261276245117, "global_step": 158694, "epoch": 944} {"train_loss": -10.533727645874023, "global_step": 158695, "epoch": 944} {"train_loss": -9.981523513793945, "global_step": 158696, "epoch": 944} {"train_loss": -10.860241889953613, "global_step": 158697, "epoch": 944} {"train_loss": -10.465484619140625, "global_step": 158698, "epoch": 944} {"train_loss": -10.402807235717773, "global_step": 158699, "epoch": 944} {"train_loss": -10.598652839660645, "global_step": 158700, "epoch": 944} {"train_loss": -10.461357116699219, "global_step": 158701, "epoch": 944} {"train_loss": -10.49325180053711, "global_step": 158702, "epoch": 944} {"train_loss": -10.0557861328125, "global_step": 158703, "epoch": 944} {"train_loss": -10.550363540649414, "global_step": 158704, "epoch": 944} {"train_loss": -10.568504333496094, "global_step": 158705, "epoch": 944} {"train_loss": -10.709933280944824, "global_step": 158706, "epoch": 944} {"train_loss": -10.611373901367188, "global_step": 158707, "epoch": 944} {"train_loss": -10.211094856262207, "global_step": 158708, "epoch": 944} {"train_loss": -10.6783447265625, "global_step": 158709, "epoch": 944} {"train_loss": -10.536582946777344, "global_step": 158710, "epoch": 944} {"train_loss": -10.672943115234375, "global_step": 158711, "epoch": 944} {"train_loss": -10.504478454589844, "global_step": 158712, "epoch": 944} {"train_loss": -10.4246826171875, "global_step": 158713, "epoch": 944} {"train_loss": -10.692682266235352, "global_step": 158714, "epoch": 944} {"train_loss": -10.542144775390625, "global_step": 158715, "epoch": 944} {"train_loss": -10.669681549072266, "global_step": 158716, "epoch": 944} {"train_loss": -10.207047462463379, "global_step": 158717, "epoch": 944} {"train_loss": -10.793785095214844, "global_step": 158718, "epoch": 944} {"train_loss": -10.609334945678711, "global_step": 158719, "epoch": 944} {"train_loss": -10.726771354675293, "global_step": 158720, "epoch": 944} {"train_loss": -10.829132080078125, "global_step": 158721, "epoch": 944} {"train_loss": -10.813695907592773, "global_step": 158722, "epoch": 944} {"train_loss": -10.886054992675781, "global_step": 158723, "epoch": 944} {"train_loss": -10.912839889526367, "global_step": 158724, "epoch": 944} {"train_loss": -10.885808944702148, "global_step": 158725, "epoch": 944} {"train_loss": -10.808794975280762, "global_step": 158726, "epoch": 944} {"train_loss": -10.820730209350586, "global_step": 158727, "epoch": 944} {"train_loss": -10.68088436126709, "global_step": 158728, "epoch": 944} {"train_loss": -10.824514389038086, "global_step": 158729, "epoch": 944} {"train_loss": -10.91513442993164, "global_step": 158730, "epoch": 944} {"train_loss": -10.8049955368042, "global_step": 158731, "epoch": 944} {"train_loss": -10.954912185668945, "global_step": 158732, "epoch": 944} {"train_loss": -10.774138450622559, "global_step": 158733, "epoch": 944} {"train_loss": -10.929641723632812, "global_step": 158734, "epoch": 944} {"train_loss": -11.160937309265137, "global_step": 158735, "epoch": 944} {"train_loss": -10.896564483642578, "global_step": 158736, "epoch": 944} {"train_loss": -11.132613182067871, "global_step": 158737, "epoch": 944} {"train_loss": -10.858295440673828, "global_step": 158738, "epoch": 944} {"train_loss": -11.043403625488281, "global_step": 158739, "epoch": 944} {"train_loss": -10.732194900512695, "global_step": 158740, "epoch": 944} {"train_loss": -10.91007137298584, "global_step": 158741, "epoch": 944} {"train_loss": -10.909562110900879, "global_step": 158742, "epoch": 944} {"train_loss": -11.129985809326172, "global_step": 158743, "epoch": 944} {"train_loss": -10.891876220703125, "global_step": 158744, "epoch": 944} {"train_loss": -10.994901657104492, "global_step": 158745, "epoch": 944} {"train_loss": -10.893062591552734, "global_step": 158746, "epoch": 944} {"train_loss": -10.971223831176758, "global_step": 158747, "epoch": 944} {"train_loss": -11.068815231323242, "global_step": 158748, "epoch": 944} {"train_loss": -10.904178619384766, "global_step": 158749, "epoch": 944} {"train_loss": -11.08881950378418, "global_step": 158750, "epoch": 944} {"train_loss": -10.919975280761719, "global_step": 158751, "epoch": 944} {"train_loss": -11.067750930786133, "global_step": 158752, "epoch": 944} {"train_loss": -10.741026878356934, "global_step": 158753, "epoch": 944} {"train_loss": -11.004148483276367, "global_step": 158754, "epoch": 944} {"train_loss": -11.123507499694824, "global_step": 158755, "epoch": 944} {"train_loss": -10.832964897155762, "global_step": 158756, "epoch": 944} {"train_loss": -11.145627975463867, "global_step": 158757, "epoch": 944} {"train_loss": -10.870880126953125, "global_step": 158758, "epoch": 944} {"train_loss": -10.723730518704368, "global_step": 158759, "epoch": 944, "val_loss": 233906.421875} {"train_loss": -10.657719612121582, "global_step": 158760, "epoch": 945} {"train_loss": -10.306384086608887, "global_step": 158761, "epoch": 945} {"train_loss": -10.912630081176758, "global_step": 158762, "epoch": 945} {"train_loss": -10.588897705078125, "global_step": 158763, "epoch": 945} {"train_loss": -10.529502868652344, "global_step": 158764, "epoch": 945} {"train_loss": -10.537546157836914, "global_step": 158765, "epoch": 945} {"train_loss": -10.285079956054688, "global_step": 158766, "epoch": 945} {"train_loss": -10.960633277893066, "global_step": 158767, "epoch": 945} {"train_loss": -10.386685371398926, "global_step": 158768, "epoch": 945} {"train_loss": -10.136893272399902, "global_step": 158769, "epoch": 945} {"train_loss": -10.836904525756836, "global_step": 158770, "epoch": 945} {"train_loss": -9.90830135345459, "global_step": 158771, "epoch": 945} {"train_loss": -10.776346206665039, "global_step": 158772, "epoch": 945} {"train_loss": -10.372334480285645, "global_step": 158773, "epoch": 945} {"train_loss": -10.004767417907715, "global_step": 158774, "epoch": 945} {"train_loss": -10.009283065795898, "global_step": 158775, "epoch": 945} {"train_loss": -10.051373481750488, "global_step": 158776, "epoch": 945} {"train_loss": -10.428339004516602, "global_step": 158777, "epoch": 945} {"train_loss": -10.029884338378906, "global_step": 158778, "epoch": 945} {"train_loss": -10.376249313354492, "global_step": 158779, "epoch": 945} {"train_loss": -10.615056991577148, "global_step": 158780, "epoch": 945} {"train_loss": -10.781387329101562, "global_step": 158781, "epoch": 945} {"train_loss": -10.468713760375977, "global_step": 158782, "epoch": 945} {"train_loss": -10.482828140258789, "global_step": 158783, "epoch": 945} {"train_loss": -10.575754165649414, "global_step": 158784, "epoch": 945} {"train_loss": -10.408774375915527, "global_step": 158785, "epoch": 945} {"train_loss": -10.826033592224121, "global_step": 158786, "epoch": 945} {"train_loss": -10.731788635253906, "global_step": 158787, "epoch": 945} {"train_loss": -10.567243576049805, "global_step": 158788, "epoch": 945} {"train_loss": -10.551401138305664, "global_step": 158789, "epoch": 945} {"train_loss": -10.611242294311523, "global_step": 158790, "epoch": 945} {"train_loss": -10.635858535766602, "global_step": 158791, "epoch": 945} {"train_loss": -10.795197486877441, "global_step": 158792, "epoch": 945} {"train_loss": -10.894088745117188, "global_step": 158793, "epoch": 945} {"train_loss": -10.896512985229492, "global_step": 158794, "epoch": 945} {"train_loss": -10.777166366577148, "global_step": 158795, "epoch": 945} {"train_loss": -10.849365234375, "global_step": 158796, "epoch": 945} {"train_loss": -10.697260856628418, "global_step": 158797, "epoch": 945} {"train_loss": -10.946632385253906, "global_step": 158798, "epoch": 945} {"train_loss": -10.693928718566895, "global_step": 158799, "epoch": 945} {"train_loss": -10.938600540161133, "global_step": 158800, "epoch": 945} {"train_loss": -10.540013313293457, "global_step": 158801, "epoch": 945} {"train_loss": -10.69322395324707, "global_step": 158802, "epoch": 945} {"train_loss": -10.967540740966797, "global_step": 158803, "epoch": 945} {"train_loss": -10.712502479553223, "global_step": 158804, "epoch": 945} {"train_loss": -10.899317741394043, "global_step": 158805, "epoch": 945} {"train_loss": -11.067875862121582, "global_step": 158806, "epoch": 945} {"train_loss": -10.7330904006958, "global_step": 158807, "epoch": 945} {"train_loss": -10.957686424255371, "global_step": 158808, "epoch": 945} {"train_loss": -10.620035171508789, "global_step": 158809, "epoch": 945} {"train_loss": -11.136176109313965, "global_step": 158810, "epoch": 945} {"train_loss": -10.96983528137207, "global_step": 158811, "epoch": 945} {"train_loss": -11.104011535644531, "global_step": 158812, "epoch": 945} {"train_loss": -10.82094955444336, "global_step": 158813, "epoch": 945} {"train_loss": -10.789161682128906, "global_step": 158814, "epoch": 945} {"train_loss": -10.812214851379395, "global_step": 158815, "epoch": 945} {"train_loss": -11.079740524291992, "global_step": 158816, "epoch": 945} {"train_loss": -11.015108108520508, "global_step": 158817, "epoch": 945} {"train_loss": -11.157758712768555, "global_step": 158818, "epoch": 945} {"train_loss": -11.074529647827148, "global_step": 158819, "epoch": 945} {"train_loss": -11.30341911315918, "global_step": 158820, "epoch": 945} {"train_loss": -11.190820693969727, "global_step": 158821, "epoch": 945} {"train_loss": -11.174985885620117, "global_step": 158822, "epoch": 945} {"train_loss": -11.08155632019043, "global_step": 158823, "epoch": 945} {"train_loss": -11.107368469238281, "global_step": 158824, "epoch": 945} {"train_loss": -11.190286636352539, "global_step": 158825, "epoch": 945} {"train_loss": -11.150761604309082, "global_step": 158826, "epoch": 945} {"train_loss": -11.221797943115234, "global_step": 158827, "epoch": 945} {"train_loss": -11.174468994140625, "global_step": 158828, "epoch": 945} {"train_loss": -11.273218154907227, "global_step": 158829, "epoch": 945} {"train_loss": -11.1757173538208, "global_step": 158830, "epoch": 945} {"train_loss": -10.857669830322266, "global_step": 158831, "epoch": 945} {"train_loss": -11.177321434020996, "global_step": 158832, "epoch": 945} {"train_loss": -11.371582984924316, "global_step": 158833, "epoch": 945} {"train_loss": -10.822463989257812, "global_step": 158834, "epoch": 945} {"train_loss": -11.124502182006836, "global_step": 158835, "epoch": 945} {"train_loss": -11.149994850158691, "global_step": 158836, "epoch": 945} {"train_loss": -11.12173843383789, "global_step": 158837, "epoch": 945} {"train_loss": -11.002704620361328, "global_step": 158838, "epoch": 945} {"train_loss": -11.062044143676758, "global_step": 158839, "epoch": 945} {"train_loss": -11.219796180725098, "global_step": 158840, "epoch": 945} {"train_loss": -10.642814636230469, "global_step": 158841, "epoch": 945} {"train_loss": -10.64933967590332, "global_step": 158842, "epoch": 945} {"train_loss": -11.085817337036133, "global_step": 158843, "epoch": 945} {"train_loss": -11.297622680664062, "global_step": 158844, "epoch": 945} {"train_loss": -11.230687141418457, "global_step": 158845, "epoch": 945} {"train_loss": -10.938078880310059, "global_step": 158846, "epoch": 945} {"train_loss": -10.034425735473633, "global_step": 158847, "epoch": 945} {"train_loss": -10.406394958496094, "global_step": 158848, "epoch": 945} {"train_loss": -10.122501373291016, "global_step": 158849, "epoch": 945} {"train_loss": -11.120377540588379, "global_step": 158850, "epoch": 945} {"train_loss": -10.462900161743164, "global_step": 158851, "epoch": 945} {"train_loss": -11.081432342529297, "global_step": 158852, "epoch": 945} {"train_loss": -10.951311111450195, "global_step": 158853, "epoch": 945} {"train_loss": -10.877486228942871, "global_step": 158854, "epoch": 945} {"train_loss": -10.489638328552246, "global_step": 158855, "epoch": 945} {"train_loss": -10.434874534606934, "global_step": 158856, "epoch": 945} {"train_loss": -10.918989181518555, "global_step": 158857, "epoch": 945} {"train_loss": -10.264298439025879, "global_step": 158858, "epoch": 945} {"train_loss": -10.78384780883789, "global_step": 158859, "epoch": 945} {"train_loss": -10.01348876953125, "global_step": 158860, "epoch": 945} {"train_loss": -10.887079238891602, "global_step": 158861, "epoch": 945} {"train_loss": -9.890430450439453, "global_step": 158862, "epoch": 945} {"train_loss": -11.054363250732422, "global_step": 158863, "epoch": 945} {"train_loss": -10.267325401306152, "global_step": 158864, "epoch": 945} {"train_loss": -10.96870231628418, "global_step": 158865, "epoch": 945} {"train_loss": -10.520912170410156, "global_step": 158866, "epoch": 945} {"train_loss": -10.165910720825195, "global_step": 158867, "epoch": 945} {"train_loss": -10.834405899047852, "global_step": 158868, "epoch": 945} {"train_loss": -10.146339416503906, "global_step": 158869, "epoch": 945} {"train_loss": -10.913049697875977, "global_step": 158870, "epoch": 945} {"train_loss": -10.995261192321777, "global_step": 158871, "epoch": 945} {"train_loss": -10.663583755493164, "global_step": 158872, "epoch": 945} {"train_loss": -10.682064056396484, "global_step": 158873, "epoch": 945} {"train_loss": -10.680608749389648, "global_step": 158874, "epoch": 945} {"train_loss": -10.935262680053711, "global_step": 158875, "epoch": 945} {"train_loss": -10.387859344482422, "global_step": 158876, "epoch": 945} {"train_loss": -10.990230560302734, "global_step": 158877, "epoch": 945} {"train_loss": -10.507561683654785, "global_step": 158878, "epoch": 945} {"train_loss": -10.384620666503906, "global_step": 158879, "epoch": 945} {"train_loss": -10.89920711517334, "global_step": 158880, "epoch": 945} {"train_loss": -10.728618621826172, "global_step": 158881, "epoch": 945} {"train_loss": -10.526032447814941, "global_step": 158882, "epoch": 945} {"train_loss": -10.793283462524414, "global_step": 158883, "epoch": 945} {"train_loss": -10.882553100585938, "global_step": 158884, "epoch": 945} {"train_loss": -11.098167419433594, "global_step": 158885, "epoch": 945} {"train_loss": -10.736366271972656, "global_step": 158886, "epoch": 945} {"train_loss": -10.83806037902832, "global_step": 158887, "epoch": 945} {"train_loss": -10.750228881835938, "global_step": 158888, "epoch": 945} {"train_loss": -10.779333114624023, "global_step": 158889, "epoch": 945} {"train_loss": -10.94334602355957, "global_step": 158890, "epoch": 945} {"train_loss": -10.934489250183105, "global_step": 158891, "epoch": 945} {"train_loss": -10.78931713104248, "global_step": 158892, "epoch": 945} {"train_loss": -10.673206329345703, "global_step": 158893, "epoch": 945} {"train_loss": -10.887307167053223, "global_step": 158894, "epoch": 945} {"train_loss": -10.781759262084961, "global_step": 158895, "epoch": 945} {"train_loss": -10.62191104888916, "global_step": 158896, "epoch": 945} {"train_loss": -11.02144718170166, "global_step": 158897, "epoch": 945} {"train_loss": -10.747651100158691, "global_step": 158898, "epoch": 945} {"train_loss": -10.544658660888672, "global_step": 158899, "epoch": 945} {"train_loss": -10.899577140808105, "global_step": 158900, "epoch": 945} {"train_loss": -10.92463493347168, "global_step": 158901, "epoch": 945} {"train_loss": -11.204086303710938, "global_step": 158902, "epoch": 945} {"train_loss": -10.976198196411133, "global_step": 158903, "epoch": 945} {"train_loss": -10.92928695678711, "global_step": 158904, "epoch": 945} {"train_loss": -10.967681884765625, "global_step": 158905, "epoch": 945} {"train_loss": -10.757761001586914, "global_step": 158906, "epoch": 945} {"train_loss": -11.140619277954102, "global_step": 158907, "epoch": 945} {"train_loss": -10.752994537353516, "global_step": 158908, "epoch": 945} {"train_loss": -10.896095275878906, "global_step": 158909, "epoch": 945} {"train_loss": -11.125077247619629, "global_step": 158910, "epoch": 945} {"train_loss": -10.727446556091309, "global_step": 158911, "epoch": 945} {"train_loss": -11.262455940246582, "global_step": 158912, "epoch": 945} {"train_loss": -10.800575256347656, "global_step": 158913, "epoch": 945} {"train_loss": -11.116748809814453, "global_step": 158914, "epoch": 945} {"train_loss": -11.086262702941895, "global_step": 158915, "epoch": 945} {"train_loss": -11.163942337036133, "global_step": 158916, "epoch": 945} {"train_loss": -11.101330757141113, "global_step": 158917, "epoch": 945} {"train_loss": -11.185636520385742, "global_step": 158918, "epoch": 945} {"train_loss": -11.112403869628906, "global_step": 158919, "epoch": 945} {"train_loss": -11.00096321105957, "global_step": 158920, "epoch": 945} {"train_loss": -11.037881851196289, "global_step": 158921, "epoch": 945} {"train_loss": -10.957414627075195, "global_step": 158922, "epoch": 945} {"train_loss": -11.004225730895996, "global_step": 158923, "epoch": 945} {"train_loss": -10.968392372131348, "global_step": 158924, "epoch": 945} {"train_loss": -10.797113418579102, "global_step": 158925, "epoch": 945} {"train_loss": -11.08971881866455, "global_step": 158926, "epoch": 945} {"train_loss": -10.794214651698159, "global_step": 158927, "epoch": 945, "val_loss": 236158.421875, "train_action_mse_error": 2.163194417953491} {"train_loss": -11.088434219360352, "global_step": 158928, "epoch": 946} {"train_loss": -10.795228958129883, "global_step": 158929, "epoch": 946} {"train_loss": -10.796883583068848, "global_step": 158930, "epoch": 946} {"train_loss": -10.858997344970703, "global_step": 158931, "epoch": 946} {"train_loss": -11.132970809936523, "global_step": 158932, "epoch": 946} {"train_loss": -10.36705207824707, "global_step": 158933, "epoch": 946} {"train_loss": -10.503618240356445, "global_step": 158934, "epoch": 946} {"train_loss": -9.91038703918457, "global_step": 158935, "epoch": 946} {"train_loss": -10.959903717041016, "global_step": 158936, "epoch": 946} {"train_loss": -10.573196411132812, "global_step": 158937, "epoch": 946} {"train_loss": -10.737068176269531, "global_step": 158938, "epoch": 946} {"train_loss": -10.735851287841797, "global_step": 158939, "epoch": 946} {"train_loss": -10.761877059936523, "global_step": 158940, "epoch": 946} {"train_loss": -10.8323974609375, "global_step": 158941, "epoch": 946} {"train_loss": -10.80931282043457, "global_step": 158942, "epoch": 946} {"train_loss": -11.110568046569824, "global_step": 158943, "epoch": 946} {"train_loss": -10.997841835021973, "global_step": 158944, "epoch": 946} {"train_loss": -10.700071334838867, "global_step": 158945, "epoch": 946} {"train_loss": -11.039435386657715, "global_step": 158946, "epoch": 946} {"train_loss": -10.431995391845703, "global_step": 158947, "epoch": 946} {"train_loss": -10.644615173339844, "global_step": 158948, "epoch": 946} {"train_loss": -10.719175338745117, "global_step": 158949, "epoch": 946} {"train_loss": -10.871753692626953, "global_step": 158950, "epoch": 946} {"train_loss": -10.712442398071289, "global_step": 158951, "epoch": 946} {"train_loss": -10.45245361328125, "global_step": 158952, "epoch": 946} {"train_loss": -10.501214981079102, "global_step": 158953, "epoch": 946} {"train_loss": -10.468927383422852, "global_step": 158954, "epoch": 946} {"train_loss": -10.868090629577637, "global_step": 158955, "epoch": 946} {"train_loss": -10.529388427734375, "global_step": 158956, "epoch": 946} {"train_loss": -10.400765419006348, "global_step": 158957, "epoch": 946} {"train_loss": -10.622129440307617, "global_step": 158958, "epoch": 946} {"train_loss": -10.387466430664062, "global_step": 158959, "epoch": 946} {"train_loss": -10.387001037597656, "global_step": 158960, "epoch": 946} {"train_loss": -10.260181427001953, "global_step": 158961, "epoch": 946} {"train_loss": -10.866708755493164, "global_step": 158962, "epoch": 946} {"train_loss": -10.378985404968262, "global_step": 158963, "epoch": 946} {"train_loss": -10.741514205932617, "global_step": 158964, "epoch": 946} {"train_loss": -11.030132293701172, "global_step": 158965, "epoch": 946} {"train_loss": -10.880958557128906, "global_step": 158966, "epoch": 946} {"train_loss": -10.691661834716797, "global_step": 158967, "epoch": 946} {"train_loss": -10.91535758972168, "global_step": 158968, "epoch": 946} {"train_loss": -10.747274398803711, "global_step": 158969, "epoch": 946} {"train_loss": -10.738889694213867, "global_step": 158970, "epoch": 946} {"train_loss": -10.7455472946167, "global_step": 158971, "epoch": 946} {"train_loss": -10.981372833251953, "global_step": 158972, "epoch": 946} {"train_loss": -10.824579238891602, "global_step": 158973, "epoch": 946} {"train_loss": -10.990269660949707, "global_step": 158974, "epoch": 946} {"train_loss": -10.86115837097168, "global_step": 158975, "epoch": 946} {"train_loss": -10.616287231445312, "global_step": 158976, "epoch": 946} {"train_loss": -10.81280517578125, "global_step": 158977, "epoch": 946} {"train_loss": -11.182458877563477, "global_step": 158978, "epoch": 946} {"train_loss": -10.826576232910156, "global_step": 158979, "epoch": 946} {"train_loss": -11.095454216003418, "global_step": 158980, "epoch": 946} {"train_loss": -11.044180870056152, "global_step": 158981, "epoch": 946} {"train_loss": -10.896398544311523, "global_step": 158982, "epoch": 946} {"train_loss": -10.944967269897461, "global_step": 158983, "epoch": 946} {"train_loss": -10.948068618774414, "global_step": 158984, "epoch": 946} {"train_loss": -10.896020889282227, "global_step": 158985, "epoch": 946} {"train_loss": -11.145708084106445, "global_step": 158986, "epoch": 946} {"train_loss": -10.979043960571289, "global_step": 158987, "epoch": 946} {"train_loss": -10.823640823364258, "global_step": 158988, "epoch": 946} {"train_loss": -11.063758850097656, "global_step": 158989, "epoch": 946} {"train_loss": -10.873247146606445, "global_step": 158990, "epoch": 946} {"train_loss": -11.026432037353516, "global_step": 158991, "epoch": 946} {"train_loss": -10.941368103027344, "global_step": 158992, "epoch": 946} {"train_loss": -11.180126190185547, "global_step": 158993, "epoch": 946} {"train_loss": -11.13549518585205, "global_step": 158994, "epoch": 946} {"train_loss": -11.091123580932617, "global_step": 158995, "epoch": 946} {"train_loss": -11.16630744934082, "global_step": 158996, "epoch": 946} {"train_loss": -10.973020553588867, "global_step": 158997, "epoch": 946} {"train_loss": -11.163267135620117, "global_step": 158998, "epoch": 946} {"train_loss": -11.053182601928711, "global_step": 158999, "epoch": 946} {"train_loss": -11.31765079498291, "global_step": 159000, "epoch": 946} {"train_loss": -11.024412155151367, "global_step": 159001, "epoch": 946} {"train_loss": -11.140372276306152, "global_step": 159002, "epoch": 946} {"train_loss": -11.151874542236328, "global_step": 159003, "epoch": 946} {"train_loss": -11.045341491699219, "global_step": 159004, "epoch": 946} {"train_loss": -11.285589218139648, "global_step": 159005, "epoch": 946} {"train_loss": -10.963761329650879, "global_step": 159006, "epoch": 946} {"train_loss": -11.251946449279785, "global_step": 159007, "epoch": 946} {"train_loss": -10.904467582702637, "global_step": 159008, "epoch": 946} {"train_loss": -11.46923828125, "global_step": 159009, "epoch": 946} {"train_loss": -11.333759307861328, "global_step": 159010, "epoch": 946} {"train_loss": -11.234673500061035, "global_step": 159011, "epoch": 946} {"train_loss": -11.114755630493164, "global_step": 159012, "epoch": 946} {"train_loss": -11.275670051574707, "global_step": 159013, "epoch": 946} {"train_loss": -11.266569137573242, "global_step": 159014, "epoch": 946} {"train_loss": -11.102840423583984, "global_step": 159015, "epoch": 946} {"train_loss": -11.383136749267578, "global_step": 159016, "epoch": 946} {"train_loss": -11.220006942749023, "global_step": 159017, "epoch": 946} {"train_loss": -11.306567192077637, "global_step": 159018, "epoch": 946} {"train_loss": -11.048755645751953, "global_step": 159019, "epoch": 946} {"train_loss": -11.061534881591797, "global_step": 159020, "epoch": 946} {"train_loss": -10.936238288879395, "global_step": 159021, "epoch": 946} {"train_loss": -11.276423454284668, "global_step": 159022, "epoch": 946} {"train_loss": -10.722930908203125, "global_step": 159023, "epoch": 946} {"train_loss": -10.858013153076172, "global_step": 159024, "epoch": 946} {"train_loss": -11.080633163452148, "global_step": 159025, "epoch": 946} {"train_loss": -10.765680313110352, "global_step": 159026, "epoch": 946} {"train_loss": -10.233526229858398, "global_step": 159027, "epoch": 946} {"train_loss": -10.288751602172852, "global_step": 159028, "epoch": 946} {"train_loss": -10.775725364685059, "global_step": 159029, "epoch": 946} {"train_loss": -10.793603897094727, "global_step": 159030, "epoch": 946} {"train_loss": -9.561084747314453, "global_step": 159031, "epoch": 946} {"train_loss": -9.904654502868652, "global_step": 159032, "epoch": 946} {"train_loss": -9.968493461608887, "global_step": 159033, "epoch": 946} {"train_loss": -9.926248550415039, "global_step": 159034, "epoch": 946} {"train_loss": -9.683149337768555, "global_step": 159035, "epoch": 946} {"train_loss": -9.905275344848633, "global_step": 159036, "epoch": 946} {"train_loss": -9.617826461791992, "global_step": 159037, "epoch": 946} {"train_loss": -9.798504829406738, "global_step": 159038, "epoch": 946} {"train_loss": -9.818243026733398, "global_step": 159039, "epoch": 946} {"train_loss": -9.043612480163574, "global_step": 159040, "epoch": 946} {"train_loss": -9.561830520629883, "global_step": 159041, "epoch": 946} {"train_loss": -10.159570693969727, "global_step": 159042, "epoch": 946} {"train_loss": -9.754051208496094, "global_step": 159043, "epoch": 946} {"train_loss": -10.224262237548828, "global_step": 159044, "epoch": 946} {"train_loss": -10.228267669677734, "global_step": 159045, "epoch": 946} {"train_loss": -9.985100746154785, "global_step": 159046, "epoch": 946} {"train_loss": -10.137045860290527, "global_step": 159047, "epoch": 946} {"train_loss": -10.413156509399414, "global_step": 159048, "epoch": 946} {"train_loss": -10.307004928588867, "global_step": 159049, "epoch": 946} {"train_loss": -10.460418701171875, "global_step": 159050, "epoch": 946} {"train_loss": -10.212478637695312, "global_step": 159051, "epoch": 946} {"train_loss": -10.221799850463867, "global_step": 159052, "epoch": 946} {"train_loss": -10.297554016113281, "global_step": 159053, "epoch": 946} {"train_loss": -10.314931869506836, "global_step": 159054, "epoch": 946} {"train_loss": -10.600309371948242, "global_step": 159055, "epoch": 946} {"train_loss": -10.69741153717041, "global_step": 159056, "epoch": 946} {"train_loss": -10.696492195129395, "global_step": 159057, "epoch": 946} {"train_loss": -10.446918487548828, "global_step": 159058, "epoch": 946} {"train_loss": -10.821420669555664, "global_step": 159059, "epoch": 946} {"train_loss": -10.58515739440918, "global_step": 159060, "epoch": 946} {"train_loss": -10.607089042663574, "global_step": 159061, "epoch": 946} {"train_loss": -10.534004211425781, "global_step": 159062, "epoch": 946} {"train_loss": -10.745071411132812, "global_step": 159063, "epoch": 946} {"train_loss": -10.497888565063477, "global_step": 159064, "epoch": 946} {"train_loss": -10.690074920654297, "global_step": 159065, "epoch": 946} {"train_loss": -10.55546760559082, "global_step": 159066, "epoch": 946} {"train_loss": -10.736963272094727, "global_step": 159067, "epoch": 946} {"train_loss": -10.654499053955078, "global_step": 159068, "epoch": 946} {"train_loss": -10.759054183959961, "global_step": 159069, "epoch": 946} {"train_loss": -10.829120635986328, "global_step": 159070, "epoch": 946} {"train_loss": -10.7240629196167, "global_step": 159071, "epoch": 946} {"train_loss": -10.700551986694336, "global_step": 159072, "epoch": 946} {"train_loss": -11.024593353271484, "global_step": 159073, "epoch": 946} {"train_loss": -10.952609062194824, "global_step": 159074, "epoch": 946} {"train_loss": -10.66879940032959, "global_step": 159075, "epoch": 946} {"train_loss": -10.93414306640625, "global_step": 159076, "epoch": 946} {"train_loss": -10.863588333129883, "global_step": 159077, "epoch": 946} {"train_loss": -10.895121574401855, "global_step": 159078, "epoch": 946} {"train_loss": -10.931243896484375, "global_step": 159079, "epoch": 946} {"train_loss": -11.037872314453125, "global_step": 159080, "epoch": 946} {"train_loss": -10.936500549316406, "global_step": 159081, "epoch": 946} {"train_loss": -10.822750091552734, "global_step": 159082, "epoch": 946} {"train_loss": -10.85071086883545, "global_step": 159083, "epoch": 946} {"train_loss": -10.799585342407227, "global_step": 159084, "epoch": 946} {"train_loss": -11.049843788146973, "global_step": 159085, "epoch": 946} {"train_loss": -10.892330169677734, "global_step": 159086, "epoch": 946} {"train_loss": -10.953611373901367, "global_step": 159087, "epoch": 946} {"train_loss": -10.957765579223633, "global_step": 159088, "epoch": 946} {"train_loss": -10.83078670501709, "global_step": 159089, "epoch": 946} {"train_loss": -11.006563186645508, "global_step": 159090, "epoch": 946} {"train_loss": -10.701991081237793, "global_step": 159091, "epoch": 946} {"train_loss": -11.131677627563477, "global_step": 159092, "epoch": 946} {"train_loss": -11.011249542236328, "global_step": 159093, "epoch": 946} {"train_loss": -10.92447280883789, "global_step": 159094, "epoch": 946} {"train_loss": -10.734799952734084, "global_step": 159095, "epoch": 946, "val_loss": 235906.375} {"train_loss": -10.800745010375977, "global_step": 159096, "epoch": 947} {"train_loss": -11.014192581176758, "global_step": 159097, "epoch": 947} {"train_loss": -10.539104461669922, "global_step": 159098, "epoch": 947} {"train_loss": -11.196199417114258, "global_step": 159099, "epoch": 947} {"train_loss": -10.8814697265625, "global_step": 159100, "epoch": 947} {"train_loss": -10.943140029907227, "global_step": 159101, "epoch": 947} {"train_loss": -11.148174285888672, "global_step": 159102, "epoch": 947} {"train_loss": -11.100180625915527, "global_step": 159103, "epoch": 947} {"train_loss": -11.069171905517578, "global_step": 159104, "epoch": 947} {"train_loss": -11.139986991882324, "global_step": 159105, "epoch": 947} {"train_loss": -10.96615982055664, "global_step": 159106, "epoch": 947} {"train_loss": -11.095703125, "global_step": 159107, "epoch": 947} {"train_loss": -11.035916328430176, "global_step": 159108, "epoch": 947} {"train_loss": -11.438596725463867, "global_step": 159109, "epoch": 947} {"train_loss": -11.14013957977295, "global_step": 159110, "epoch": 947} {"train_loss": -10.91387939453125, "global_step": 159111, "epoch": 947} {"train_loss": -10.691439628601074, "global_step": 159112, "epoch": 947} {"train_loss": -11.138031005859375, "global_step": 159113, "epoch": 947} {"train_loss": -10.582796096801758, "global_step": 159114, "epoch": 947} {"train_loss": -9.910453796386719, "global_step": 159115, "epoch": 947} {"train_loss": -9.879969596862793, "global_step": 159116, "epoch": 947} {"train_loss": -10.90910530090332, "global_step": 159117, "epoch": 947} {"train_loss": -8.82054328918457, "global_step": 159118, "epoch": 947} {"train_loss": -10.884939193725586, "global_step": 159119, "epoch": 947} {"train_loss": -9.593193054199219, "global_step": 159120, "epoch": 947} {"train_loss": -10.17099380493164, "global_step": 159121, "epoch": 947} {"train_loss": -10.383105278015137, "global_step": 159122, "epoch": 947} {"train_loss": -9.787235260009766, "global_step": 159123, "epoch": 947} {"train_loss": -10.557498931884766, "global_step": 159124, "epoch": 947} {"train_loss": -10.447196960449219, "global_step": 159125, "epoch": 947} {"train_loss": -10.568397521972656, "global_step": 159126, "epoch": 947} {"train_loss": -10.64799976348877, "global_step": 159127, "epoch": 947} {"train_loss": -10.231527328491211, "global_step": 159128, "epoch": 947} {"train_loss": -10.744710922241211, "global_step": 159129, "epoch": 947} {"train_loss": -10.07011604309082, "global_step": 159130, "epoch": 947} {"train_loss": -10.78272819519043, "global_step": 159131, "epoch": 947} {"train_loss": -10.51954460144043, "global_step": 159132, "epoch": 947} {"train_loss": -10.840347290039062, "global_step": 159133, "epoch": 947} {"train_loss": -10.783527374267578, "global_step": 159134, "epoch": 947} {"train_loss": -10.499555587768555, "global_step": 159135, "epoch": 947} {"train_loss": -10.90261173248291, "global_step": 159136, "epoch": 947} {"train_loss": -10.617881774902344, "global_step": 159137, "epoch": 947} {"train_loss": -10.792948722839355, "global_step": 159138, "epoch": 947} {"train_loss": -10.634401321411133, "global_step": 159139, "epoch": 947} {"train_loss": -10.827118873596191, "global_step": 159140, "epoch": 947} {"train_loss": -10.648235321044922, "global_step": 159141, "epoch": 947} {"train_loss": -10.917464256286621, "global_step": 159142, "epoch": 947} {"train_loss": -10.386266708374023, "global_step": 159143, "epoch": 947} {"train_loss": -10.835394859313965, "global_step": 159144, "epoch": 947} {"train_loss": -10.638545036315918, "global_step": 159145, "epoch": 947} {"train_loss": -10.766727447509766, "global_step": 159146, "epoch": 947} {"train_loss": -10.674240112304688, "global_step": 159147, "epoch": 947} {"train_loss": -10.799285888671875, "global_step": 159148, "epoch": 947} {"train_loss": -10.871469497680664, "global_step": 159149, "epoch": 947} {"train_loss": -10.975057601928711, "global_step": 159150, "epoch": 947} {"train_loss": -10.671880722045898, "global_step": 159151, "epoch": 947} {"train_loss": -10.601421356201172, "global_step": 159152, "epoch": 947} {"train_loss": -10.861310958862305, "global_step": 159153, "epoch": 947} {"train_loss": -10.755128860473633, "global_step": 159154, "epoch": 947} {"train_loss": -10.77711296081543, "global_step": 159155, "epoch": 947} {"train_loss": -10.610248565673828, "global_step": 159156, "epoch": 947} {"train_loss": -10.670945167541504, "global_step": 159157, "epoch": 947} {"train_loss": -10.712114334106445, "global_step": 159158, "epoch": 947} {"train_loss": -10.730927467346191, "global_step": 159159, "epoch": 947} {"train_loss": -10.672109603881836, "global_step": 159160, "epoch": 947} {"train_loss": -10.70964241027832, "global_step": 159161, "epoch": 947} {"train_loss": -10.81760311126709, "global_step": 159162, "epoch": 947} {"train_loss": -10.982259750366211, "global_step": 159163, "epoch": 947} {"train_loss": -10.939801216125488, "global_step": 159164, "epoch": 947} {"train_loss": -11.029743194580078, "global_step": 159165, "epoch": 947} {"train_loss": -10.832761764526367, "global_step": 159166, "epoch": 947} {"train_loss": -10.937519073486328, "global_step": 159167, "epoch": 947} {"train_loss": -10.659829139709473, "global_step": 159168, "epoch": 947} {"train_loss": -11.192405700683594, "global_step": 159169, "epoch": 947} {"train_loss": -10.972999572753906, "global_step": 159170, "epoch": 947} {"train_loss": -11.022698402404785, "global_step": 159171, "epoch": 947} {"train_loss": -11.210613250732422, "global_step": 159172, "epoch": 947} {"train_loss": -11.025531768798828, "global_step": 159173, "epoch": 947} {"train_loss": -10.953509330749512, "global_step": 159174, "epoch": 947} {"train_loss": -11.123611450195312, "global_step": 159175, "epoch": 947} {"train_loss": -11.054521560668945, "global_step": 159176, "epoch": 947} {"train_loss": -11.106999397277832, "global_step": 159177, "epoch": 947} {"train_loss": -11.267518997192383, "global_step": 159178, "epoch": 947} {"train_loss": -11.226791381835938, "global_step": 159179, "epoch": 947} {"train_loss": -11.188077926635742, "global_step": 159180, "epoch": 947} {"train_loss": -11.177888870239258, "global_step": 159181, "epoch": 947} {"train_loss": -11.159017562866211, "global_step": 159182, "epoch": 947} {"train_loss": -11.078633308410645, "global_step": 159183, "epoch": 947} {"train_loss": -11.244325637817383, "global_step": 159184, "epoch": 947} {"train_loss": -11.305521965026855, "global_step": 159185, "epoch": 947} {"train_loss": -11.194591522216797, "global_step": 159186, "epoch": 947} {"train_loss": -11.213537216186523, "global_step": 159187, "epoch": 947} {"train_loss": -11.39763069152832, "global_step": 159188, "epoch": 947} {"train_loss": -11.274884223937988, "global_step": 159189, "epoch": 947} {"train_loss": -11.078256607055664, "global_step": 159190, "epoch": 947} {"train_loss": -11.188379287719727, "global_step": 159191, "epoch": 947} {"train_loss": -11.055231094360352, "global_step": 159192, "epoch": 947} {"train_loss": -11.431020736694336, "global_step": 159193, "epoch": 947} {"train_loss": -10.92403507232666, "global_step": 159194, "epoch": 947} {"train_loss": -11.072702407836914, "global_step": 159195, "epoch": 947} {"train_loss": -10.291834831237793, "global_step": 159196, "epoch": 947} {"train_loss": -11.308971405029297, "global_step": 159197, "epoch": 947} {"train_loss": -10.498686790466309, "global_step": 159198, "epoch": 947} {"train_loss": -10.871017456054688, "global_step": 159199, "epoch": 947} {"train_loss": -10.897764205932617, "global_step": 159200, "epoch": 947} {"train_loss": -11.008398056030273, "global_step": 159201, "epoch": 947} {"train_loss": -10.738256454467773, "global_step": 159202, "epoch": 947} {"train_loss": -9.928743362426758, "global_step": 159203, "epoch": 947} {"train_loss": -10.57922649383545, "global_step": 159204, "epoch": 947} {"train_loss": -10.918248176574707, "global_step": 159205, "epoch": 947} {"train_loss": -10.57231330871582, "global_step": 159206, "epoch": 947} {"train_loss": -10.549884796142578, "global_step": 159207, "epoch": 947} {"train_loss": -11.222787857055664, "global_step": 159208, "epoch": 947} {"train_loss": -10.69803237915039, "global_step": 159209, "epoch": 947} {"train_loss": -10.766036987304688, "global_step": 159210, "epoch": 947} {"train_loss": -10.975139617919922, "global_step": 159211, "epoch": 947} {"train_loss": -10.954950332641602, "global_step": 159212, "epoch": 947} {"train_loss": -11.037142753601074, "global_step": 159213, "epoch": 947} {"train_loss": -10.913681030273438, "global_step": 159214, "epoch": 947} {"train_loss": -10.984697341918945, "global_step": 159215, "epoch": 947} {"train_loss": -10.928498268127441, "global_step": 159216, "epoch": 947} {"train_loss": -11.081521987915039, "global_step": 159217, "epoch": 947} {"train_loss": -11.149124145507812, "global_step": 159218, "epoch": 947} {"train_loss": -10.827001571655273, "global_step": 159219, "epoch": 947} {"train_loss": -10.429410934448242, "global_step": 159220, "epoch": 947} {"train_loss": -10.58610725402832, "global_step": 159221, "epoch": 947} {"train_loss": -10.559755325317383, "global_step": 159222, "epoch": 947} {"train_loss": -10.394416809082031, "global_step": 159223, "epoch": 947} {"train_loss": -10.612302780151367, "global_step": 159224, "epoch": 947} {"train_loss": -10.716999053955078, "global_step": 159225, "epoch": 947} {"train_loss": -10.91374683380127, "global_step": 159226, "epoch": 947} {"train_loss": -10.663475036621094, "global_step": 159227, "epoch": 947} {"train_loss": -11.04971694946289, "global_step": 159228, "epoch": 947} {"train_loss": -10.689336776733398, "global_step": 159229, "epoch": 947} {"train_loss": -11.008617401123047, "global_step": 159230, "epoch": 947} {"train_loss": -10.518977165222168, "global_step": 159231, "epoch": 947} {"train_loss": -10.990280151367188, "global_step": 159232, "epoch": 947} {"train_loss": -10.347677230834961, "global_step": 159233, "epoch": 947} {"train_loss": -11.13485336303711, "global_step": 159234, "epoch": 947} {"train_loss": -10.776575088500977, "global_step": 159235, "epoch": 947} {"train_loss": -10.547603607177734, "global_step": 159236, "epoch": 947} {"train_loss": -10.786520004272461, "global_step": 159237, "epoch": 947} {"train_loss": -10.271785736083984, "global_step": 159238, "epoch": 947} {"train_loss": -10.95098876953125, "global_step": 159239, "epoch": 947} {"train_loss": -10.133101463317871, "global_step": 159240, "epoch": 947} {"train_loss": -10.856637001037598, "global_step": 159241, "epoch": 947} {"train_loss": -10.361684799194336, "global_step": 159242, "epoch": 947} {"train_loss": -10.749215126037598, "global_step": 159243, "epoch": 947} {"train_loss": -10.524046897888184, "global_step": 159244, "epoch": 947} {"train_loss": -10.694700241088867, "global_step": 159245, "epoch": 947} {"train_loss": -10.764973640441895, "global_step": 159246, "epoch": 947} {"train_loss": -10.206705093383789, "global_step": 159247, "epoch": 947} {"train_loss": -10.754963874816895, "global_step": 159248, "epoch": 947} {"train_loss": -10.770532608032227, "global_step": 159249, "epoch": 947} {"train_loss": -10.866053581237793, "global_step": 159250, "epoch": 947} {"train_loss": -10.879425048828125, "global_step": 159251, "epoch": 947} {"train_loss": -10.954316139221191, "global_step": 159252, "epoch": 947} {"train_loss": -10.416858673095703, "global_step": 159253, "epoch": 947} {"train_loss": -10.964009284973145, "global_step": 159254, "epoch": 947} {"train_loss": -10.909802436828613, "global_step": 159255, "epoch": 947} {"train_loss": -10.691598892211914, "global_step": 159256, "epoch": 947} {"train_loss": -10.938186645507812, "global_step": 159257, "epoch": 947} {"train_loss": -10.6993408203125, "global_step": 159258, "epoch": 947} {"train_loss": -10.81147575378418, "global_step": 159259, "epoch": 947} {"train_loss": -10.871384620666504, "global_step": 159260, "epoch": 947} {"train_loss": -10.844535827636719, "global_step": 159261, "epoch": 947} {"train_loss": -10.984376907348633, "global_step": 159262, "epoch": 947} {"train_loss": -10.795244534810385, "global_step": 159263, "epoch": 947, "val_loss": 235033.703125} {"train_loss": -10.818643569946289, "global_step": 159264, "epoch": 948} {"train_loss": -10.922592163085938, "global_step": 159265, "epoch": 948} {"train_loss": -11.025900840759277, "global_step": 159266, "epoch": 948} {"train_loss": -10.901025772094727, "global_step": 159267, "epoch": 948} {"train_loss": -11.05672836303711, "global_step": 159268, "epoch": 948} {"train_loss": -11.08340835571289, "global_step": 159269, "epoch": 948} {"train_loss": -11.285959243774414, "global_step": 159270, "epoch": 948} {"train_loss": -10.906013488769531, "global_step": 159271, "epoch": 948} {"train_loss": -10.980239868164062, "global_step": 159272, "epoch": 948} {"train_loss": -11.121737480163574, "global_step": 159273, "epoch": 948} {"train_loss": -11.118186950683594, "global_step": 159274, "epoch": 948} {"train_loss": -10.967254638671875, "global_step": 159275, "epoch": 948} {"train_loss": -10.914920806884766, "global_step": 159276, "epoch": 948} {"train_loss": -10.918325424194336, "global_step": 159277, "epoch": 948} {"train_loss": -10.767892837524414, "global_step": 159278, "epoch": 948} {"train_loss": -10.775739669799805, "global_step": 159279, "epoch": 948} {"train_loss": -11.131446838378906, "global_step": 159280, "epoch": 948} {"train_loss": -11.075459480285645, "global_step": 159281, "epoch": 948} {"train_loss": -11.155523300170898, "global_step": 159282, "epoch": 948} {"train_loss": -11.049036026000977, "global_step": 159283, "epoch": 948} {"train_loss": -11.050395011901855, "global_step": 159284, "epoch": 948} {"train_loss": -11.031984329223633, "global_step": 159285, "epoch": 948} {"train_loss": -11.173189163208008, "global_step": 159286, "epoch": 948} {"train_loss": -11.065940856933594, "global_step": 159287, "epoch": 948} {"train_loss": -11.039852142333984, "global_step": 159288, "epoch": 948} {"train_loss": -11.029642105102539, "global_step": 159289, "epoch": 948} {"train_loss": -11.07965087890625, "global_step": 159290, "epoch": 948} {"train_loss": -10.87481689453125, "global_step": 159291, "epoch": 948} {"train_loss": -11.12845230102539, "global_step": 159292, "epoch": 948} {"train_loss": -11.041038513183594, "global_step": 159293, "epoch": 948} {"train_loss": -10.631326675415039, "global_step": 159294, "epoch": 948} {"train_loss": -10.693464279174805, "global_step": 159295, "epoch": 948} {"train_loss": -10.53539752960205, "global_step": 159296, "epoch": 948} {"train_loss": -10.95162296295166, "global_step": 159297, "epoch": 948} {"train_loss": -10.812402725219727, "global_step": 159298, "epoch": 948} {"train_loss": -10.49474048614502, "global_step": 159299, "epoch": 948} {"train_loss": -10.58511734008789, "global_step": 159300, "epoch": 948} {"train_loss": -10.888169288635254, "global_step": 159301, "epoch": 948} {"train_loss": -10.307535171508789, "global_step": 159302, "epoch": 948} {"train_loss": -10.47034740447998, "global_step": 159303, "epoch": 948} {"train_loss": -10.73512077331543, "global_step": 159304, "epoch": 948} {"train_loss": -10.503792762756348, "global_step": 159305, "epoch": 948} {"train_loss": -10.532068252563477, "global_step": 159306, "epoch": 948} {"train_loss": -9.959843635559082, "global_step": 159307, "epoch": 948} {"train_loss": -9.995840072631836, "global_step": 159308, "epoch": 948} {"train_loss": -10.479955673217773, "global_step": 159309, "epoch": 948} {"train_loss": -10.27949333190918, "global_step": 159310, "epoch": 948} {"train_loss": -10.796808242797852, "global_step": 159311, "epoch": 948} {"train_loss": -10.811511993408203, "global_step": 159312, "epoch": 948} {"train_loss": -10.275153160095215, "global_step": 159313, "epoch": 948} {"train_loss": -10.758729934692383, "global_step": 159314, "epoch": 948} {"train_loss": -10.483068466186523, "global_step": 159315, "epoch": 948} {"train_loss": -10.606762886047363, "global_step": 159316, "epoch": 948} {"train_loss": -10.905888557434082, "global_step": 159317, "epoch": 948} {"train_loss": -10.652582168579102, "global_step": 159318, "epoch": 948} {"train_loss": -10.46265983581543, "global_step": 159319, "epoch": 948} {"train_loss": -10.590546607971191, "global_step": 159320, "epoch": 948} {"train_loss": -10.913339614868164, "global_step": 159321, "epoch": 948} {"train_loss": -10.534622192382812, "global_step": 159322, "epoch": 948} {"train_loss": -10.774650573730469, "global_step": 159323, "epoch": 948} {"train_loss": -10.322227478027344, "global_step": 159324, "epoch": 948} {"train_loss": -10.524845123291016, "global_step": 159325, "epoch": 948} {"train_loss": -11.171438217163086, "global_step": 159326, "epoch": 948} {"train_loss": -10.589305877685547, "global_step": 159327, "epoch": 948} {"train_loss": -11.172065734863281, "global_step": 159328, "epoch": 948} {"train_loss": -10.524779319763184, "global_step": 159329, "epoch": 948} {"train_loss": -10.909992218017578, "global_step": 159330, "epoch": 948} {"train_loss": -10.455708503723145, "global_step": 159331, "epoch": 948} {"train_loss": -10.786764144897461, "global_step": 159332, "epoch": 948} {"train_loss": -10.792684555053711, "global_step": 159333, "epoch": 948} {"train_loss": -10.922211647033691, "global_step": 159334, "epoch": 948} {"train_loss": -10.71150016784668, "global_step": 159335, "epoch": 948} {"train_loss": -10.646541595458984, "global_step": 159336, "epoch": 948} {"train_loss": -10.765954971313477, "global_step": 159337, "epoch": 948} {"train_loss": -10.872808456420898, "global_step": 159338, "epoch": 948} {"train_loss": -10.992179870605469, "global_step": 159339, "epoch": 948} {"train_loss": -10.791000366210938, "global_step": 159340, "epoch": 948} {"train_loss": -11.062581062316895, "global_step": 159341, "epoch": 948} {"train_loss": -10.888818740844727, "global_step": 159342, "epoch": 948} {"train_loss": -10.98556137084961, "global_step": 159343, "epoch": 948} {"train_loss": -10.933784484863281, "global_step": 159344, "epoch": 948} {"train_loss": -10.934776306152344, "global_step": 159345, "epoch": 948} {"train_loss": -10.854606628417969, "global_step": 159346, "epoch": 948} {"train_loss": -11.063238143920898, "global_step": 159347, "epoch": 948} {"train_loss": -10.733657836914062, "global_step": 159348, "epoch": 948} {"train_loss": -11.099578857421875, "global_step": 159349, "epoch": 948} {"train_loss": -10.587244987487793, "global_step": 159350, "epoch": 948} {"train_loss": -10.756043434143066, "global_step": 159351, "epoch": 948} {"train_loss": -10.71027660369873, "global_step": 159352, "epoch": 948} {"train_loss": -10.974565505981445, "global_step": 159353, "epoch": 948} {"train_loss": -11.11484146118164, "global_step": 159354, "epoch": 948} {"train_loss": -11.08462905883789, "global_step": 159355, "epoch": 948} {"train_loss": -10.773183822631836, "global_step": 159356, "epoch": 948} {"train_loss": -10.91468334197998, "global_step": 159357, "epoch": 948} {"train_loss": -10.913990020751953, "global_step": 159358, "epoch": 948} {"train_loss": -11.083561897277832, "global_step": 159359, "epoch": 948} {"train_loss": -11.096097946166992, "global_step": 159360, "epoch": 948} {"train_loss": -11.233221054077148, "global_step": 159361, "epoch": 948} {"train_loss": -11.127690315246582, "global_step": 159362, "epoch": 948} {"train_loss": -11.20254135131836, "global_step": 159363, "epoch": 948} {"train_loss": -11.259127616882324, "global_step": 159364, "epoch": 948} {"train_loss": -11.304967880249023, "global_step": 159365, "epoch": 948} {"train_loss": -11.361217498779297, "global_step": 159366, "epoch": 948} {"train_loss": -11.284290313720703, "global_step": 159367, "epoch": 948} {"train_loss": -11.175071716308594, "global_step": 159368, "epoch": 948} {"train_loss": -11.279427528381348, "global_step": 159369, "epoch": 948} {"train_loss": -11.397248268127441, "global_step": 159370, "epoch": 948} {"train_loss": -11.213661193847656, "global_step": 159371, "epoch": 948} {"train_loss": -11.278081893920898, "global_step": 159372, "epoch": 948} {"train_loss": -11.252687454223633, "global_step": 159373, "epoch": 948} {"train_loss": -10.887014389038086, "global_step": 159374, "epoch": 948} {"train_loss": -10.696625709533691, "global_step": 159375, "epoch": 948} {"train_loss": -10.736754417419434, "global_step": 159376, "epoch": 948} {"train_loss": -11.055397033691406, "global_step": 159377, "epoch": 948} {"train_loss": -10.844534873962402, "global_step": 159378, "epoch": 948} {"train_loss": -10.723661422729492, "global_step": 159379, "epoch": 948} {"train_loss": -11.162893295288086, "global_step": 159380, "epoch": 948} {"train_loss": -11.065860748291016, "global_step": 159381, "epoch": 948} {"train_loss": -11.264053344726562, "global_step": 159382, "epoch": 948} {"train_loss": -10.729028701782227, "global_step": 159383, "epoch": 948} {"train_loss": -11.278974533081055, "global_step": 159384, "epoch": 948} {"train_loss": -11.141092300415039, "global_step": 159385, "epoch": 948} {"train_loss": -11.094507217407227, "global_step": 159386, "epoch": 948} {"train_loss": -11.191366195678711, "global_step": 159387, "epoch": 948} {"train_loss": -10.717103004455566, "global_step": 159388, "epoch": 948} {"train_loss": -10.544364929199219, "global_step": 159389, "epoch": 948} {"train_loss": -10.694366455078125, "global_step": 159390, "epoch": 948} {"train_loss": -10.495119094848633, "global_step": 159391, "epoch": 948} {"train_loss": -9.852521896362305, "global_step": 159392, "epoch": 948} {"train_loss": -10.022579193115234, "global_step": 159393, "epoch": 948} {"train_loss": -11.129623413085938, "global_step": 159394, "epoch": 948} {"train_loss": -10.126039505004883, "global_step": 159395, "epoch": 948} {"train_loss": -11.260238647460938, "global_step": 159396, "epoch": 948} {"train_loss": -10.59637451171875, "global_step": 159397, "epoch": 948} {"train_loss": -9.51144790649414, "global_step": 159398, "epoch": 948} {"train_loss": -10.874592781066895, "global_step": 159399, "epoch": 948} {"train_loss": -9.461446762084961, "global_step": 159400, "epoch": 948} {"train_loss": -10.866739273071289, "global_step": 159401, "epoch": 948} {"train_loss": -9.860601425170898, "global_step": 159402, "epoch": 948} {"train_loss": -10.644516944885254, "global_step": 159403, "epoch": 948} {"train_loss": -9.840198516845703, "global_step": 159404, "epoch": 948} {"train_loss": -10.199567794799805, "global_step": 159405, "epoch": 948} {"train_loss": -10.491756439208984, "global_step": 159406, "epoch": 948} {"train_loss": -10.077431678771973, "global_step": 159407, "epoch": 948} {"train_loss": -10.399889945983887, "global_step": 159408, "epoch": 948} {"train_loss": -10.303061485290527, "global_step": 159409, "epoch": 948} {"train_loss": -10.771926879882812, "global_step": 159410, "epoch": 948} {"train_loss": -10.418352127075195, "global_step": 159411, "epoch": 948} {"train_loss": -10.590291023254395, "global_step": 159412, "epoch": 948} {"train_loss": -10.6640625, "global_step": 159413, "epoch": 948} {"train_loss": -10.716299057006836, "global_step": 159414, "epoch": 948} {"train_loss": -10.84800910949707, "global_step": 159415, "epoch": 948} {"train_loss": -10.569110870361328, "global_step": 159416, "epoch": 948} {"train_loss": -10.583932876586914, "global_step": 159417, "epoch": 948} {"train_loss": -10.626702308654785, "global_step": 159418, "epoch": 948} {"train_loss": -10.539133071899414, "global_step": 159419, "epoch": 948} {"train_loss": -10.81185245513916, "global_step": 159420, "epoch": 948} {"train_loss": -10.485798835754395, "global_step": 159421, "epoch": 948} {"train_loss": -10.972707748413086, "global_step": 159422, "epoch": 948} {"train_loss": -10.796592712402344, "global_step": 159423, "epoch": 948} {"train_loss": -10.698726654052734, "global_step": 159424, "epoch": 948} {"train_loss": -10.589095115661621, "global_step": 159425, "epoch": 948} {"train_loss": -10.7561616897583, "global_step": 159426, "epoch": 948} {"train_loss": -10.95357894897461, "global_step": 159427, "epoch": 948} {"train_loss": -10.77242660522461, "global_step": 159428, "epoch": 948} {"train_loss": -10.941213607788086, "global_step": 159429, "epoch": 948} {"train_loss": -10.790721893310547, "global_step": 159430, "epoch": 948} {"train_loss": -10.794306193079267, "global_step": 159431, "epoch": 948, "val_loss": 232358.484375} {"train_loss": -10.32978630065918, "global_step": 159432, "epoch": 949} {"train_loss": -11.003384590148926, "global_step": 159433, "epoch": 949} {"train_loss": -10.357251167297363, "global_step": 159434, "epoch": 949} {"train_loss": -10.928707122802734, "global_step": 159435, "epoch": 949} {"train_loss": -10.497712135314941, "global_step": 159436, "epoch": 949} {"train_loss": -11.097232818603516, "global_step": 159437, "epoch": 949} {"train_loss": -10.677679061889648, "global_step": 159438, "epoch": 949} {"train_loss": -11.024267196655273, "global_step": 159439, "epoch": 949} {"train_loss": -10.739559173583984, "global_step": 159440, "epoch": 949} {"train_loss": -10.820526123046875, "global_step": 159441, "epoch": 949} {"train_loss": -10.54112434387207, "global_step": 159442, "epoch": 949} {"train_loss": -10.596333503723145, "global_step": 159443, "epoch": 949} {"train_loss": -10.664606094360352, "global_step": 159444, "epoch": 949} {"train_loss": -10.722821235656738, "global_step": 159445, "epoch": 949} {"train_loss": -10.622139930725098, "global_step": 159446, "epoch": 949} {"train_loss": -10.524971008300781, "global_step": 159447, "epoch": 949} {"train_loss": -10.78953742980957, "global_step": 159448, "epoch": 949} {"train_loss": -10.520336151123047, "global_step": 159449, "epoch": 949} {"train_loss": -10.993648529052734, "global_step": 159450, "epoch": 949} {"train_loss": -10.742021560668945, "global_step": 159451, "epoch": 949} {"train_loss": -10.972003936767578, "global_step": 159452, "epoch": 949} {"train_loss": -10.877782821655273, "global_step": 159453, "epoch": 949} {"train_loss": -10.72283935546875, "global_step": 159454, "epoch": 949} {"train_loss": -10.952162742614746, "global_step": 159455, "epoch": 949} {"train_loss": -10.935678482055664, "global_step": 159456, "epoch": 949} {"train_loss": -10.713493347167969, "global_step": 159457, "epoch": 949} {"train_loss": -11.026126861572266, "global_step": 159458, "epoch": 949} {"train_loss": -10.51366901397705, "global_step": 159459, "epoch": 949} {"train_loss": -10.745845794677734, "global_step": 159460, "epoch": 949} {"train_loss": -10.998226165771484, "global_step": 159461, "epoch": 949} {"train_loss": -10.892520904541016, "global_step": 159462, "epoch": 949} {"train_loss": -11.300003051757812, "global_step": 159463, "epoch": 949} {"train_loss": -10.763566970825195, "global_step": 159464, "epoch": 949} {"train_loss": -10.969450950622559, "global_step": 159465, "epoch": 949} {"train_loss": -10.656137466430664, "global_step": 159466, "epoch": 949} {"train_loss": -11.275997161865234, "global_step": 159467, "epoch": 949} {"train_loss": -10.76662826538086, "global_step": 159468, "epoch": 949} {"train_loss": -10.930364608764648, "global_step": 159469, "epoch": 949} {"train_loss": -11.07236099243164, "global_step": 159470, "epoch": 949} {"train_loss": -10.796977996826172, "global_step": 159471, "epoch": 949} {"train_loss": -10.787446975708008, "global_step": 159472, "epoch": 949} {"train_loss": -10.810102462768555, "global_step": 159473, "epoch": 949} {"train_loss": -10.391898155212402, "global_step": 159474, "epoch": 949} {"train_loss": -10.65733528137207, "global_step": 159475, "epoch": 949} {"train_loss": -10.792295455932617, "global_step": 159476, "epoch": 949} {"train_loss": -10.685707092285156, "global_step": 159477, "epoch": 949} {"train_loss": -10.558494567871094, "global_step": 159478, "epoch": 949} {"train_loss": -10.948173522949219, "global_step": 159479, "epoch": 949} {"train_loss": -10.528427124023438, "global_step": 159480, "epoch": 949} {"train_loss": -10.900941848754883, "global_step": 159481, "epoch": 949} {"train_loss": -10.84848403930664, "global_step": 159482, "epoch": 949} {"train_loss": -10.349615097045898, "global_step": 159483, "epoch": 949} {"train_loss": -11.113346099853516, "global_step": 159484, "epoch": 949} {"train_loss": -10.331048965454102, "global_step": 159485, "epoch": 949} {"train_loss": -10.787646293640137, "global_step": 159486, "epoch": 949} {"train_loss": -10.581692695617676, "global_step": 159487, "epoch": 949} {"train_loss": -10.863935470581055, "global_step": 159488, "epoch": 949} {"train_loss": -10.55327033996582, "global_step": 159489, "epoch": 949} {"train_loss": -10.640864372253418, "global_step": 159490, "epoch": 949} {"train_loss": -10.507981300354004, "global_step": 159491, "epoch": 949} {"train_loss": -10.895238876342773, "global_step": 159492, "epoch": 949} {"train_loss": -10.792116165161133, "global_step": 159493, "epoch": 949} {"train_loss": -10.839040756225586, "global_step": 159494, "epoch": 949} {"train_loss": -10.574629783630371, "global_step": 159495, "epoch": 949} {"train_loss": -10.711231231689453, "global_step": 159496, "epoch": 949} {"train_loss": -11.004234313964844, "global_step": 159497, "epoch": 949} {"train_loss": -10.6909818649292, "global_step": 159498, "epoch": 949} {"train_loss": -10.731446266174316, "global_step": 159499, "epoch": 949} {"train_loss": -10.93079948425293, "global_step": 159500, "epoch": 949} {"train_loss": -10.716501235961914, "global_step": 159501, "epoch": 949} {"train_loss": -10.782875061035156, "global_step": 159502, "epoch": 949} {"train_loss": -10.90743637084961, "global_step": 159503, "epoch": 949} {"train_loss": -10.706748962402344, "global_step": 159504, "epoch": 949} {"train_loss": -10.838052749633789, "global_step": 159505, "epoch": 949} {"train_loss": -10.630667686462402, "global_step": 159506, "epoch": 949} {"train_loss": -11.184569358825684, "global_step": 159507, "epoch": 949} {"train_loss": -10.783807754516602, "global_step": 159508, "epoch": 949} {"train_loss": -11.139915466308594, "global_step": 159509, "epoch": 949} {"train_loss": -10.85255241394043, "global_step": 159510, "epoch": 949} {"train_loss": -11.184331893920898, "global_step": 159511, "epoch": 949} {"train_loss": -10.962087631225586, "global_step": 159512, "epoch": 949} {"train_loss": -11.152379989624023, "global_step": 159513, "epoch": 949} {"train_loss": -11.128250122070312, "global_step": 159514, "epoch": 949} {"train_loss": -10.922125816345215, "global_step": 159515, "epoch": 949} {"train_loss": -10.814697265625, "global_step": 159516, "epoch": 949} {"train_loss": -10.829102516174316, "global_step": 159517, "epoch": 949} {"train_loss": -10.986334800720215, "global_step": 159518, "epoch": 949} {"train_loss": -11.216512680053711, "global_step": 159519, "epoch": 949} {"train_loss": -10.666346549987793, "global_step": 159520, "epoch": 949} {"train_loss": -10.916095733642578, "global_step": 159521, "epoch": 949} {"train_loss": -10.51338005065918, "global_step": 159522, "epoch": 949} {"train_loss": -10.756159782409668, "global_step": 159523, "epoch": 949} {"train_loss": -10.475461959838867, "global_step": 159524, "epoch": 949} {"train_loss": -10.369171142578125, "global_step": 159525, "epoch": 949} {"train_loss": -10.151636123657227, "global_step": 159526, "epoch": 949} {"train_loss": -8.997392654418945, "global_step": 159527, "epoch": 949} {"train_loss": -10.479049682617188, "global_step": 159528, "epoch": 949} {"train_loss": -8.638923645019531, "global_step": 159529, "epoch": 949} {"train_loss": -9.922347068786621, "global_step": 159530, "epoch": 949} {"train_loss": -8.980491638183594, "global_step": 159531, "epoch": 949} {"train_loss": -10.329212188720703, "global_step": 159532, "epoch": 949} {"train_loss": -8.787726402282715, "global_step": 159533, "epoch": 949} {"train_loss": -9.945862770080566, "global_step": 159534, "epoch": 949} {"train_loss": -9.172779083251953, "global_step": 159535, "epoch": 949} {"train_loss": -9.654729843139648, "global_step": 159536, "epoch": 949} {"train_loss": -9.239770889282227, "global_step": 159537, "epoch": 949} {"train_loss": -9.073203086853027, "global_step": 159538, "epoch": 949} {"train_loss": -10.840224266052246, "global_step": 159539, "epoch": 949} {"train_loss": -9.27301025390625, "global_step": 159540, "epoch": 949} {"train_loss": -10.455621719360352, "global_step": 159541, "epoch": 949} {"train_loss": -9.510997772216797, "global_step": 159542, "epoch": 949} {"train_loss": -9.552946090698242, "global_step": 159543, "epoch": 949} {"train_loss": -10.307198524475098, "global_step": 159544, "epoch": 949} {"train_loss": -9.186147689819336, "global_step": 159545, "epoch": 949} {"train_loss": -10.321479797363281, "global_step": 159546, "epoch": 949} {"train_loss": -10.128973007202148, "global_step": 159547, "epoch": 949} {"train_loss": -9.762747764587402, "global_step": 159548, "epoch": 949} {"train_loss": -10.259883880615234, "global_step": 159549, "epoch": 949} {"train_loss": -9.674070358276367, "global_step": 159550, "epoch": 949} {"train_loss": -9.864311218261719, "global_step": 159551, "epoch": 949} {"train_loss": -10.375273704528809, "global_step": 159552, "epoch": 949} {"train_loss": -10.273321151733398, "global_step": 159553, "epoch": 949} {"train_loss": -10.339279174804688, "global_step": 159554, "epoch": 949} {"train_loss": -10.391759872436523, "global_step": 159555, "epoch": 949} {"train_loss": -10.313615798950195, "global_step": 159556, "epoch": 949} {"train_loss": -10.284065246582031, "global_step": 159557, "epoch": 949} {"train_loss": -10.561145782470703, "global_step": 159558, "epoch": 949} {"train_loss": -10.047577857971191, "global_step": 159559, "epoch": 949} {"train_loss": -10.129298210144043, "global_step": 159560, "epoch": 949} {"train_loss": -10.561186790466309, "global_step": 159561, "epoch": 949} {"train_loss": -10.410430908203125, "global_step": 159562, "epoch": 949} {"train_loss": -10.076589584350586, "global_step": 159563, "epoch": 949} {"train_loss": -10.706007957458496, "global_step": 159564, "epoch": 949} {"train_loss": -10.67330551147461, "global_step": 159565, "epoch": 949} {"train_loss": -10.555595397949219, "global_step": 159566, "epoch": 949} {"train_loss": -10.373310089111328, "global_step": 159567, "epoch": 949} {"train_loss": -10.364640235900879, "global_step": 159568, "epoch": 949} {"train_loss": -10.654592514038086, "global_step": 159569, "epoch": 949} {"train_loss": -10.517614364624023, "global_step": 159570, "epoch": 949} {"train_loss": -10.61678409576416, "global_step": 159571, "epoch": 949} {"train_loss": -10.743354797363281, "global_step": 159572, "epoch": 949} {"train_loss": -10.839125633239746, "global_step": 159573, "epoch": 949} {"train_loss": -10.779862403869629, "global_step": 159574, "epoch": 949} {"train_loss": -10.679498672485352, "global_step": 159575, "epoch": 949} {"train_loss": -10.831914901733398, "global_step": 159576, "epoch": 949} {"train_loss": -10.78990364074707, "global_step": 159577, "epoch": 949} {"train_loss": -10.806376457214355, "global_step": 159578, "epoch": 949} {"train_loss": -10.912957191467285, "global_step": 159579, "epoch": 949} {"train_loss": -10.937695503234863, "global_step": 159580, "epoch": 949} {"train_loss": -10.845827102661133, "global_step": 159581, "epoch": 949} {"train_loss": -10.995969772338867, "global_step": 159582, "epoch": 949} {"train_loss": -10.872188568115234, "global_step": 159583, "epoch": 949} {"train_loss": -10.895151138305664, "global_step": 159584, "epoch": 949} {"train_loss": -10.895489692687988, "global_step": 159585, "epoch": 949} {"train_loss": -10.909729957580566, "global_step": 159586, "epoch": 949} {"train_loss": -11.012426376342773, "global_step": 159587, "epoch": 949} {"train_loss": -10.902242660522461, "global_step": 159588, "epoch": 949} {"train_loss": -11.052936553955078, "global_step": 159589, "epoch": 949} {"train_loss": -11.018012046813965, "global_step": 159590, "epoch": 949} {"train_loss": -11.081932067871094, "global_step": 159591, "epoch": 949} {"train_loss": -11.007491111755371, "global_step": 159592, "epoch": 949} {"train_loss": -11.13520336151123, "global_step": 159593, "epoch": 949} {"train_loss": -11.016271591186523, "global_step": 159594, "epoch": 949} {"train_loss": -11.186056137084961, "global_step": 159595, "epoch": 949} {"train_loss": -11.035320281982422, "global_step": 159596, "epoch": 949} {"train_loss": -11.003763198852539, "global_step": 159597, "epoch": 949} {"train_loss": -11.203638076782227, "global_step": 159598, "epoch": 949} {"train_loss": -10.603969290142967, "global_step": 159599, "epoch": 949, "val_loss": 233615.28125} {"train_loss": -11.090509414672852, "global_step": 159600, "epoch": 950} {"train_loss": -11.11414909362793, "global_step": 159601, "epoch": 950} {"train_loss": -11.163217544555664, "global_step": 159602, "epoch": 950} {"train_loss": -11.25926399230957, "global_step": 159603, "epoch": 950} {"train_loss": -11.102749824523926, "global_step": 159604, "epoch": 950} {"train_loss": -10.799507141113281, "global_step": 159605, "epoch": 950} {"train_loss": -11.373311996459961, "global_step": 159606, "epoch": 950} {"train_loss": -10.706324577331543, "global_step": 159607, "epoch": 950} {"train_loss": -10.691181182861328, "global_step": 159608, "epoch": 950} {"train_loss": -11.103360176086426, "global_step": 159609, "epoch": 950} {"train_loss": -11.192262649536133, "global_step": 159610, "epoch": 950} {"train_loss": -11.042035102844238, "global_step": 159611, "epoch": 950} {"train_loss": -11.13433837890625, "global_step": 159612, "epoch": 950} {"train_loss": -10.994016647338867, "global_step": 159613, "epoch": 950} {"train_loss": -11.125007629394531, "global_step": 159614, "epoch": 950} {"train_loss": -11.054208755493164, "global_step": 159615, "epoch": 950} {"train_loss": -10.92943000793457, "global_step": 159616, "epoch": 950} {"train_loss": -11.32913875579834, "global_step": 159617, "epoch": 950} {"train_loss": -11.160011291503906, "global_step": 159618, "epoch": 950} {"train_loss": -10.828142166137695, "global_step": 159619, "epoch": 950} {"train_loss": -10.667608261108398, "global_step": 159620, "epoch": 950} {"train_loss": -11.196502685546875, "global_step": 159621, "epoch": 950} {"train_loss": -11.24720573425293, "global_step": 159622, "epoch": 950} {"train_loss": -11.035009384155273, "global_step": 159623, "epoch": 950} {"train_loss": -10.922171592712402, "global_step": 159624, "epoch": 950} {"train_loss": -11.052789688110352, "global_step": 159625, "epoch": 950} {"train_loss": -10.95040512084961, "global_step": 159626, "epoch": 950} {"train_loss": -10.507659912109375, "global_step": 159627, "epoch": 950} {"train_loss": -10.630151748657227, "global_step": 159628, "epoch": 950} {"train_loss": -11.187213897705078, "global_step": 159629, "epoch": 950} {"train_loss": -10.950030326843262, "global_step": 159630, "epoch": 950} {"train_loss": -11.138582229614258, "global_step": 159631, "epoch": 950} {"train_loss": -11.033620834350586, "global_step": 159632, "epoch": 950} {"train_loss": -10.956993103027344, "global_step": 159633, "epoch": 950} {"train_loss": -11.103025436401367, "global_step": 159634, "epoch": 950} {"train_loss": -11.22430419921875, "global_step": 159635, "epoch": 950} {"train_loss": -10.884285926818848, "global_step": 159636, "epoch": 950} {"train_loss": -10.879480361938477, "global_step": 159637, "epoch": 950} {"train_loss": -10.946773529052734, "global_step": 159638, "epoch": 950} {"train_loss": -11.0864839553833, "global_step": 159639, "epoch": 950} {"train_loss": -10.360183715820312, "global_step": 159640, "epoch": 950} {"train_loss": -10.249018669128418, "global_step": 159641, "epoch": 950} {"train_loss": -10.779120445251465, "global_step": 159642, "epoch": 950} {"train_loss": -10.477840423583984, "global_step": 159643, "epoch": 950} {"train_loss": -9.323112487792969, "global_step": 159644, "epoch": 950} {"train_loss": -10.656938552856445, "global_step": 159645, "epoch": 950} {"train_loss": -10.216291427612305, "global_step": 159646, "epoch": 950} {"train_loss": -10.409762382507324, "global_step": 159647, "epoch": 950} {"train_loss": -10.30723762512207, "global_step": 159648, "epoch": 950} {"train_loss": -10.83267593383789, "global_step": 159649, "epoch": 950} {"train_loss": -10.426925659179688, "global_step": 159650, "epoch": 950} {"train_loss": -10.827627182006836, "global_step": 159651, "epoch": 950} {"train_loss": -9.88886833190918, "global_step": 159652, "epoch": 950} {"train_loss": -10.35909652709961, "global_step": 159653, "epoch": 950} {"train_loss": -10.265644073486328, "global_step": 159654, "epoch": 950} {"train_loss": -10.27174186706543, "global_step": 159655, "epoch": 950} {"train_loss": -11.266759872436523, "global_step": 159656, "epoch": 950} {"train_loss": -10.428031921386719, "global_step": 159657, "epoch": 950} {"train_loss": -10.907119750976562, "global_step": 159658, "epoch": 950} {"train_loss": -10.153181076049805, "global_step": 159659, "epoch": 950} {"train_loss": -10.632274627685547, "global_step": 159660, "epoch": 950} {"train_loss": -10.593746185302734, "global_step": 159661, "epoch": 950} {"train_loss": -10.665498733520508, "global_step": 159662, "epoch": 950} {"train_loss": -11.017618179321289, "global_step": 159663, "epoch": 950} {"train_loss": -10.973396301269531, "global_step": 159664, "epoch": 950} {"train_loss": -11.044719696044922, "global_step": 159665, "epoch": 950} {"train_loss": -10.869787216186523, "global_step": 159666, "epoch": 950} {"train_loss": -10.785853385925293, "global_step": 159667, "epoch": 950} {"train_loss": -11.003633499145508, "global_step": 159668, "epoch": 950} {"train_loss": -10.701016426086426, "global_step": 159669, "epoch": 950} {"train_loss": -10.946407318115234, "global_step": 159670, "epoch": 950} {"train_loss": -10.66383171081543, "global_step": 159671, "epoch": 950} {"train_loss": -10.904004096984863, "global_step": 159672, "epoch": 950} {"train_loss": -10.814290046691895, "global_step": 159673, "epoch": 950} {"train_loss": -11.240669250488281, "global_step": 159674, "epoch": 950} {"train_loss": -11.084378242492676, "global_step": 159675, "epoch": 950} {"train_loss": -11.129806518554688, "global_step": 159676, "epoch": 950} {"train_loss": -11.20991325378418, "global_step": 159677, "epoch": 950} {"train_loss": -10.985876083374023, "global_step": 159678, "epoch": 950} {"train_loss": -10.85312557220459, "global_step": 159679, "epoch": 950} {"train_loss": -10.954663276672363, "global_step": 159680, "epoch": 950} {"train_loss": -11.181588172912598, "global_step": 159681, "epoch": 950} {"train_loss": -10.88852596282959, "global_step": 159682, "epoch": 950} {"train_loss": -11.292682647705078, "global_step": 159683, "epoch": 950} {"train_loss": -11.140599250793457, "global_step": 159684, "epoch": 950} {"train_loss": -11.134521484375, "global_step": 159685, "epoch": 950} {"train_loss": -11.094186782836914, "global_step": 159686, "epoch": 950} {"train_loss": -11.140689849853516, "global_step": 159687, "epoch": 950} {"train_loss": -11.052967071533203, "global_step": 159688, "epoch": 950} {"train_loss": -11.02313232421875, "global_step": 159689, "epoch": 950} {"train_loss": -10.973321914672852, "global_step": 159690, "epoch": 950} {"train_loss": -11.173333168029785, "global_step": 159691, "epoch": 950} {"train_loss": -11.021682739257812, "global_step": 159692, "epoch": 950} {"train_loss": -10.988592147827148, "global_step": 159693, "epoch": 950} {"train_loss": -11.157965660095215, "global_step": 159694, "epoch": 950} {"train_loss": -11.034675598144531, "global_step": 159695, "epoch": 950} {"train_loss": -11.012125015258789, "global_step": 159696, "epoch": 950} {"train_loss": -11.205659866333008, "global_step": 159697, "epoch": 950} {"train_loss": -10.907804489135742, "global_step": 159698, "epoch": 950} {"train_loss": -10.942667961120605, "global_step": 159699, "epoch": 950} {"train_loss": -11.113470077514648, "global_step": 159700, "epoch": 950} {"train_loss": -11.040618896484375, "global_step": 159701, "epoch": 950} {"train_loss": -11.065454483032227, "global_step": 159702, "epoch": 950} {"train_loss": -10.997490882873535, "global_step": 159703, "epoch": 950} {"train_loss": -10.196136474609375, "global_step": 159704, "epoch": 950} {"train_loss": -10.413826942443848, "global_step": 159705, "epoch": 950} {"train_loss": -10.912108421325684, "global_step": 159706, "epoch": 950} {"train_loss": -10.118907928466797, "global_step": 159707, "epoch": 950} {"train_loss": -9.787860870361328, "global_step": 159708, "epoch": 950} {"train_loss": -10.338598251342773, "global_step": 159709, "epoch": 950} {"train_loss": -8.462146759033203, "global_step": 159710, "epoch": 950} {"train_loss": -10.226417541503906, "global_step": 159711, "epoch": 950} {"train_loss": -8.213815689086914, "global_step": 159712, "epoch": 950} {"train_loss": -8.24095344543457, "global_step": 159713, "epoch": 950} {"train_loss": -8.563591003417969, "global_step": 159714, "epoch": 950} {"train_loss": -8.216802597045898, "global_step": 159715, "epoch": 950} {"train_loss": -10.499216079711914, "global_step": 159716, "epoch": 950} {"train_loss": -9.492219924926758, "global_step": 159717, "epoch": 950} {"train_loss": -10.051158905029297, "global_step": 159718, "epoch": 950} {"train_loss": -9.33609390258789, "global_step": 159719, "epoch": 950} {"train_loss": -10.034659385681152, "global_step": 159720, "epoch": 950} {"train_loss": -9.169687271118164, "global_step": 159721, "epoch": 950} {"train_loss": -9.482688903808594, "global_step": 159722, "epoch": 950} {"train_loss": -9.982599258422852, "global_step": 159723, "epoch": 950} {"train_loss": -9.854168891906738, "global_step": 159724, "epoch": 950} {"train_loss": -10.388862609863281, "global_step": 159725, "epoch": 950} {"train_loss": -10.491594314575195, "global_step": 159726, "epoch": 950} {"train_loss": -10.370853424072266, "global_step": 159727, "epoch": 950} {"train_loss": -10.191093444824219, "global_step": 159728, "epoch": 950} {"train_loss": -10.184648513793945, "global_step": 159729, "epoch": 950} {"train_loss": -10.466878890991211, "global_step": 159730, "epoch": 950} {"train_loss": -9.311912536621094, "global_step": 159731, "epoch": 950} {"train_loss": -10.511299133300781, "global_step": 159732, "epoch": 950} {"train_loss": -10.194664001464844, "global_step": 159733, "epoch": 950} {"train_loss": -9.94002914428711, "global_step": 159734, "epoch": 950} {"train_loss": -10.471902847290039, "global_step": 159735, "epoch": 950} {"train_loss": -10.577120780944824, "global_step": 159736, "epoch": 950} {"train_loss": -10.241647720336914, "global_step": 159737, "epoch": 950} {"train_loss": -10.406364440917969, "global_step": 159738, "epoch": 950} {"train_loss": -10.549043655395508, "global_step": 159739, "epoch": 950} {"train_loss": -10.44835090637207, "global_step": 159740, "epoch": 950} {"train_loss": -10.379348754882812, "global_step": 159741, "epoch": 950} {"train_loss": -10.56649398803711, "global_step": 159742, "epoch": 950} {"train_loss": -10.489458084106445, "global_step": 159743, "epoch": 950} {"train_loss": -10.344904899597168, "global_step": 159744, "epoch": 950} {"train_loss": -10.723335266113281, "global_step": 159745, "epoch": 950} {"train_loss": -10.67005729675293, "global_step": 159746, "epoch": 950} {"train_loss": -10.746087074279785, "global_step": 159747, "epoch": 950} {"train_loss": -10.812776565551758, "global_step": 159748, "epoch": 950} {"train_loss": -10.595497131347656, "global_step": 159749, "epoch": 950} {"train_loss": -10.538955688476562, "global_step": 159750, "epoch": 950} {"train_loss": -10.642583847045898, "global_step": 159751, "epoch": 950} {"train_loss": -10.683077812194824, "global_step": 159752, "epoch": 950} {"train_loss": -10.705116271972656, "global_step": 159753, "epoch": 950} {"train_loss": -10.719805717468262, "global_step": 159754, "epoch": 950} {"train_loss": -10.51630973815918, "global_step": 159755, "epoch": 950} {"train_loss": -10.738204956054688, "global_step": 159756, "epoch": 950} {"train_loss": -10.76780891418457, "global_step": 159757, "epoch": 950} {"train_loss": -10.581218719482422, "global_step": 159758, "epoch": 950} {"train_loss": -10.792366981506348, "global_step": 159759, "epoch": 950} {"train_loss": -10.598413467407227, "global_step": 159760, "epoch": 950} {"train_loss": -10.83034896850586, "global_step": 159761, "epoch": 950} {"train_loss": -10.951047897338867, "global_step": 159762, "epoch": 950} {"train_loss": -10.811393737792969, "global_step": 159763, "epoch": 950} {"train_loss": -10.717491149902344, "global_step": 159764, "epoch": 950} {"train_loss": -10.93228530883789, "global_step": 159765, "epoch": 950} {"train_loss": -10.82611083984375, "global_step": 159766, "epoch": 950} {"train_loss": -10.640625073796226, "global_step": 159767, "epoch": 950, "train/sim_max_reward_0": 0.573979841446635, "train/sim_max_reward_1": 0.9895872319235572, "train/sim_max_reward_2": 0.0029969291458238775, "train/sim_max_reward_3": 0.6425428823847464, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.4571865327368184, "test/sim_max_reward_4400002": 0.1628277555228391, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.40814071109869754, "test/sim_max_reward_4400005": 0.9583714955473247, "test/sim_max_reward_4400006": 0.26825213219862576, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.567653652884615, "test/sim_max_reward_4400009": 0.3991175952053837, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 0.9731514048648306, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.6036039754883554, "test/sim_max_reward_4400015": 0.9521203616690448, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.8930278162205075, "test/sim_max_reward_4400019": 0.19626037715622682, "test/sim_max_reward_4400020": 0.41652318828918256, "test/sim_max_reward_4400021": 0.5663729136700071, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.1356135359734134, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.9924273432115637, "test/sim_max_reward_4400026": 0.07816619646384944, "test/sim_max_reward_4400027": 0.9786295744235123, "test/sim_max_reward_4400028": 0.707909907171495, "test/sim_max_reward_4400029": 0.45464205747934094, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9887314190007382, "test/sim_max_reward_4400032": 0.04040707623084906, "test/sim_max_reward_4400033": 0.17238172397058038, "test/sim_max_reward_4400034": 0.9903689699464774, "test/sim_max_reward_4400035": 0.9592557789761414, "test/sim_max_reward_4400036": 0.36694891115854156, "test/sim_max_reward_4400037": 0.9468352003654759, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.14862008916973368, "test/sim_max_reward_4400042": 1.0, "test/sim_max_reward_4400043": 0.9981957817087616, "test/sim_max_reward_4400044": 0.9662125115768705, "test/sim_max_reward_4400045": 0.5247864718560478, "test/sim_max_reward_4400046": 0.33314568420183993, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.3448315390644214, "train/mean_score": 0.567015274043825, "test/mean_score": 0.5990143936900423, "val_loss": 231366.34375, "train_action_mse_error": 1.1497929096221924} {"train_loss": -10.958544731140137, "global_step": 159768, "epoch": 951} {"train_loss": -10.841154098510742, "global_step": 159769, "epoch": 951} {"train_loss": -11.022193908691406, "global_step": 159770, "epoch": 951} {"train_loss": -10.946599006652832, "global_step": 159771, "epoch": 951} {"train_loss": -10.848915100097656, "global_step": 159772, "epoch": 951} {"train_loss": -10.890556335449219, "global_step": 159773, "epoch": 951} {"train_loss": -11.015619277954102, "global_step": 159774, "epoch": 951} {"train_loss": -10.995779991149902, "global_step": 159775, "epoch": 951} {"train_loss": -11.26314926147461, "global_step": 159776, "epoch": 951} {"train_loss": -11.043660163879395, "global_step": 159777, "epoch": 951} {"train_loss": -10.801822662353516, "global_step": 159778, "epoch": 951} {"train_loss": -11.146583557128906, "global_step": 159779, "epoch": 951} {"train_loss": -10.854619026184082, "global_step": 159780, "epoch": 951} {"train_loss": -11.18063735961914, "global_step": 159781, "epoch": 951} {"train_loss": -11.16408920288086, "global_step": 159782, "epoch": 951} {"train_loss": -10.945112228393555, "global_step": 159783, "epoch": 951} {"train_loss": -11.015182495117188, "global_step": 159784, "epoch": 951} {"train_loss": -11.040595054626465, "global_step": 159785, "epoch": 951} {"train_loss": -10.874654769897461, "global_step": 159786, "epoch": 951} {"train_loss": -11.196479797363281, "global_step": 159787, "epoch": 951} {"train_loss": -11.06591510772705, "global_step": 159788, "epoch": 951} {"train_loss": -10.61819076538086, "global_step": 159789, "epoch": 951} {"train_loss": -10.93623161315918, "global_step": 159790, "epoch": 951} {"train_loss": -11.010408401489258, "global_step": 159791, "epoch": 951} {"train_loss": -10.868947982788086, "global_step": 159792, "epoch": 951} {"train_loss": -11.238229751586914, "global_step": 159793, "epoch": 951} {"train_loss": -11.009479522705078, "global_step": 159794, "epoch": 951} {"train_loss": -10.996383666992188, "global_step": 159795, "epoch": 951} {"train_loss": -10.911995887756348, "global_step": 159796, "epoch": 951} {"train_loss": -10.548843383789062, "global_step": 159797, "epoch": 951} {"train_loss": -11.279491424560547, "global_step": 159798, "epoch": 951} {"train_loss": -10.445932388305664, "global_step": 159799, "epoch": 951} {"train_loss": -9.748682975769043, "global_step": 159800, "epoch": 951} {"train_loss": -10.585098266601562, "global_step": 159801, "epoch": 951} {"train_loss": -10.73295783996582, "global_step": 159802, "epoch": 951} {"train_loss": -9.393636703491211, "global_step": 159803, "epoch": 951} {"train_loss": -10.976558685302734, "global_step": 159804, "epoch": 951} {"train_loss": -10.096912384033203, "global_step": 159805, "epoch": 951} {"train_loss": -9.588155746459961, "global_step": 159806, "epoch": 951} {"train_loss": -10.468240737915039, "global_step": 159807, "epoch": 951} {"train_loss": -9.09214973449707, "global_step": 159808, "epoch": 951} {"train_loss": -10.325382232666016, "global_step": 159809, "epoch": 951} {"train_loss": -10.161048889160156, "global_step": 159810, "epoch": 951} {"train_loss": -10.10324764251709, "global_step": 159811, "epoch": 951} {"train_loss": -9.897390365600586, "global_step": 159812, "epoch": 951} {"train_loss": -10.046594619750977, "global_step": 159813, "epoch": 951} {"train_loss": -9.696560859680176, "global_step": 159814, "epoch": 951} {"train_loss": -9.915689468383789, "global_step": 159815, "epoch": 951} {"train_loss": -9.798215866088867, "global_step": 159816, "epoch": 951} {"train_loss": -9.134340286254883, "global_step": 159817, "epoch": 951} {"train_loss": -10.013821601867676, "global_step": 159818, "epoch": 951} {"train_loss": -9.988073348999023, "global_step": 159819, "epoch": 951} {"train_loss": -9.9500150680542, "global_step": 159820, "epoch": 951} {"train_loss": -9.96362018585205, "global_step": 159821, "epoch": 951} {"train_loss": -9.899605751037598, "global_step": 159822, "epoch": 951} {"train_loss": -10.64189338684082, "global_step": 159823, "epoch": 951} {"train_loss": -10.202247619628906, "global_step": 159824, "epoch": 951} {"train_loss": -10.40439224243164, "global_step": 159825, "epoch": 951} {"train_loss": -10.702835083007812, "global_step": 159826, "epoch": 951} {"train_loss": -10.326526641845703, "global_step": 159827, "epoch": 951} {"train_loss": -10.556400299072266, "global_step": 159828, "epoch": 951} {"train_loss": -10.771772384643555, "global_step": 159829, "epoch": 951} {"train_loss": -10.04731559753418, "global_step": 159830, "epoch": 951} {"train_loss": -10.656172752380371, "global_step": 159831, "epoch": 951} {"train_loss": -10.593562126159668, "global_step": 159832, "epoch": 951} {"train_loss": -10.491691589355469, "global_step": 159833, "epoch": 951} {"train_loss": -10.67923355102539, "global_step": 159834, "epoch": 951} {"train_loss": -10.532825469970703, "global_step": 159835, "epoch": 951} {"train_loss": -10.661853790283203, "global_step": 159836, "epoch": 951} {"train_loss": -10.68006420135498, "global_step": 159837, "epoch": 951} {"train_loss": -10.847371101379395, "global_step": 159838, "epoch": 951} {"train_loss": -10.340622901916504, "global_step": 159839, "epoch": 951} {"train_loss": -10.847448348999023, "global_step": 159840, "epoch": 951} {"train_loss": -10.796133995056152, "global_step": 159841, "epoch": 951} {"train_loss": -10.899299621582031, "global_step": 159842, "epoch": 951} {"train_loss": -10.558107376098633, "global_step": 159843, "epoch": 951} {"train_loss": -10.748884201049805, "global_step": 159844, "epoch": 951} {"train_loss": -10.906982421875, "global_step": 159845, "epoch": 951} {"train_loss": -10.752717018127441, "global_step": 159846, "epoch": 951} {"train_loss": -10.896677017211914, "global_step": 159847, "epoch": 951} {"train_loss": -10.879326820373535, "global_step": 159848, "epoch": 951} {"train_loss": -10.852680206298828, "global_step": 159849, "epoch": 951} {"train_loss": -11.106904983520508, "global_step": 159850, "epoch": 951} {"train_loss": -11.02475357055664, "global_step": 159851, "epoch": 951} {"train_loss": -10.942750930786133, "global_step": 159852, "epoch": 951} {"train_loss": -10.906407356262207, "global_step": 159853, "epoch": 951} {"train_loss": -10.97269058227539, "global_step": 159854, "epoch": 951} {"train_loss": -11.158710479736328, "global_step": 159855, "epoch": 951} {"train_loss": -11.071797370910645, "global_step": 159856, "epoch": 951} {"train_loss": -10.93464183807373, "global_step": 159857, "epoch": 951} {"train_loss": -10.876829147338867, "global_step": 159858, "epoch": 951} {"train_loss": -11.069950103759766, "global_step": 159859, "epoch": 951} {"train_loss": -11.124752044677734, "global_step": 159860, "epoch": 951} {"train_loss": -11.168180465698242, "global_step": 159861, "epoch": 951} {"train_loss": -11.199723243713379, "global_step": 159862, "epoch": 951} {"train_loss": -11.222809791564941, "global_step": 159863, "epoch": 951} {"train_loss": -11.262134552001953, "global_step": 159864, "epoch": 951} {"train_loss": -10.99720573425293, "global_step": 159865, "epoch": 951} {"train_loss": -11.052244186401367, "global_step": 159866, "epoch": 951} {"train_loss": -11.182658195495605, "global_step": 159867, "epoch": 951} {"train_loss": -11.17034912109375, "global_step": 159868, "epoch": 951} {"train_loss": -11.03662109375, "global_step": 159869, "epoch": 951} {"train_loss": -11.293678283691406, "global_step": 159870, "epoch": 951} {"train_loss": -10.917619705200195, "global_step": 159871, "epoch": 951} {"train_loss": -11.052647590637207, "global_step": 159872, "epoch": 951} {"train_loss": -10.946318626403809, "global_step": 159873, "epoch": 951} {"train_loss": -11.069618225097656, "global_step": 159874, "epoch": 951} {"train_loss": -11.094366073608398, "global_step": 159875, "epoch": 951} {"train_loss": -11.097538948059082, "global_step": 159876, "epoch": 951} {"train_loss": -10.9895601272583, "global_step": 159877, "epoch": 951} {"train_loss": -11.177765846252441, "global_step": 159878, "epoch": 951} {"train_loss": -11.005746841430664, "global_step": 159879, "epoch": 951} {"train_loss": -10.812978744506836, "global_step": 159880, "epoch": 951} {"train_loss": -11.089075088500977, "global_step": 159881, "epoch": 951} {"train_loss": -11.123239517211914, "global_step": 159882, "epoch": 951} {"train_loss": -11.028143882751465, "global_step": 159883, "epoch": 951} {"train_loss": -11.150440216064453, "global_step": 159884, "epoch": 951} {"train_loss": -10.87106704711914, "global_step": 159885, "epoch": 951} {"train_loss": -11.287862777709961, "global_step": 159886, "epoch": 951} {"train_loss": -10.81650447845459, "global_step": 159887, "epoch": 951} {"train_loss": -10.379826545715332, "global_step": 159888, "epoch": 951} {"train_loss": -10.957906723022461, "global_step": 159889, "epoch": 951} {"train_loss": -10.945096969604492, "global_step": 159890, "epoch": 951} {"train_loss": -11.132944107055664, "global_step": 159891, "epoch": 951} {"train_loss": -10.816716194152832, "global_step": 159892, "epoch": 951} {"train_loss": -11.042953491210938, "global_step": 159893, "epoch": 951} {"train_loss": -10.634483337402344, "global_step": 159894, "epoch": 951} {"train_loss": -10.637731552124023, "global_step": 159895, "epoch": 951} {"train_loss": -10.732998847961426, "global_step": 159896, "epoch": 951} {"train_loss": -10.794881820678711, "global_step": 159897, "epoch": 951} {"train_loss": -10.333247184753418, "global_step": 159898, "epoch": 951} {"train_loss": -10.50248908996582, "global_step": 159899, "epoch": 951} {"train_loss": -9.858587265014648, "global_step": 159900, "epoch": 951} {"train_loss": -9.206228256225586, "global_step": 159901, "epoch": 951} {"train_loss": -10.00809097290039, "global_step": 159902, "epoch": 951} {"train_loss": -9.603168487548828, "global_step": 159903, "epoch": 951} {"train_loss": -10.223155975341797, "global_step": 159904, "epoch": 951} {"train_loss": -9.270748138427734, "global_step": 159905, "epoch": 951} {"train_loss": -10.32150936126709, "global_step": 159906, "epoch": 951} {"train_loss": -9.540332794189453, "global_step": 159907, "epoch": 951} {"train_loss": -10.331693649291992, "global_step": 159908, "epoch": 951} {"train_loss": -9.37437629699707, "global_step": 159909, "epoch": 951} {"train_loss": -9.311938285827637, "global_step": 159910, "epoch": 951} {"train_loss": -10.501798629760742, "global_step": 159911, "epoch": 951} {"train_loss": -9.907041549682617, "global_step": 159912, "epoch": 951} {"train_loss": -9.901726722717285, "global_step": 159913, "epoch": 951} {"train_loss": -10.376949310302734, "global_step": 159914, "epoch": 951} {"train_loss": -10.005291938781738, "global_step": 159915, "epoch": 951} {"train_loss": -10.3792724609375, "global_step": 159916, "epoch": 951} {"train_loss": -10.189168930053711, "global_step": 159917, "epoch": 951} {"train_loss": -10.436233520507812, "global_step": 159918, "epoch": 951} {"train_loss": -9.722955703735352, "global_step": 159919, "epoch": 951} {"train_loss": -10.601032257080078, "global_step": 159920, "epoch": 951} {"train_loss": -9.970836639404297, "global_step": 159921, "epoch": 951} {"train_loss": -9.99936294555664, "global_step": 159922, "epoch": 951} {"train_loss": -10.224237442016602, "global_step": 159923, "epoch": 951} {"train_loss": -9.874156951904297, "global_step": 159924, "epoch": 951} {"train_loss": -10.48971176147461, "global_step": 159925, "epoch": 951} {"train_loss": -10.257065773010254, "global_step": 159926, "epoch": 951} {"train_loss": -10.410195350646973, "global_step": 159927, "epoch": 951} {"train_loss": -10.313186645507812, "global_step": 159928, "epoch": 951} {"train_loss": -10.244863510131836, "global_step": 159929, "epoch": 951} {"train_loss": -10.506567001342773, "global_step": 159930, "epoch": 951} {"train_loss": -9.876909255981445, "global_step": 159931, "epoch": 951} {"train_loss": -10.924077033996582, "global_step": 159932, "epoch": 951} {"train_loss": -10.357406616210938, "global_step": 159933, "epoch": 951} {"train_loss": -10.4824857711792, "global_step": 159934, "epoch": 951} {"train_loss": -10.599344452222189, "global_step": 159935, "epoch": 951, "val_loss": 237112.15625} {"train_loss": -10.612588882446289, "global_step": 159936, "epoch": 952} {"train_loss": -10.641387939453125, "global_step": 159937, "epoch": 952} {"train_loss": -10.612561225891113, "global_step": 159938, "epoch": 952} {"train_loss": -10.813041687011719, "global_step": 159939, "epoch": 952} {"train_loss": -10.649312973022461, "global_step": 159940, "epoch": 952} {"train_loss": -10.664892196655273, "global_step": 159941, "epoch": 952} {"train_loss": -10.855650901794434, "global_step": 159942, "epoch": 952} {"train_loss": -10.759946823120117, "global_step": 159943, "epoch": 952} {"train_loss": -10.64881706237793, "global_step": 159944, "epoch": 952} {"train_loss": -10.910516738891602, "global_step": 159945, "epoch": 952} {"train_loss": -10.568746566772461, "global_step": 159946, "epoch": 952} {"train_loss": -10.987756729125977, "global_step": 159947, "epoch": 952} {"train_loss": -10.614442825317383, "global_step": 159948, "epoch": 952} {"train_loss": -10.76552963256836, "global_step": 159949, "epoch": 952} {"train_loss": -10.644981384277344, "global_step": 159950, "epoch": 952} {"train_loss": -11.038318634033203, "global_step": 159951, "epoch": 952} {"train_loss": -10.740684509277344, "global_step": 159952, "epoch": 952} {"train_loss": -10.714733123779297, "global_step": 159953, "epoch": 952} {"train_loss": -11.00516128540039, "global_step": 159954, "epoch": 952} {"train_loss": -11.014711380004883, "global_step": 159955, "epoch": 952} {"train_loss": -10.94354248046875, "global_step": 159956, "epoch": 952} {"train_loss": -11.009271621704102, "global_step": 159957, "epoch": 952} {"train_loss": -10.77131175994873, "global_step": 159958, "epoch": 952} {"train_loss": -10.859598159790039, "global_step": 159959, "epoch": 952} {"train_loss": -11.07387924194336, "global_step": 159960, "epoch": 952} {"train_loss": -11.13967514038086, "global_step": 159961, "epoch": 952} {"train_loss": -11.027200698852539, "global_step": 159962, "epoch": 952} {"train_loss": -11.014408111572266, "global_step": 159963, "epoch": 952} {"train_loss": -11.132601737976074, "global_step": 159964, "epoch": 952} {"train_loss": -10.924823760986328, "global_step": 159965, "epoch": 952} {"train_loss": -10.921252250671387, "global_step": 159966, "epoch": 952} {"train_loss": -11.106225967407227, "global_step": 159967, "epoch": 952} {"train_loss": -11.193391799926758, "global_step": 159968, "epoch": 952} {"train_loss": -11.18986701965332, "global_step": 159969, "epoch": 952} {"train_loss": -10.988424301147461, "global_step": 159970, "epoch": 952} {"train_loss": -11.13770580291748, "global_step": 159971, "epoch": 952} {"train_loss": -11.129789352416992, "global_step": 159972, "epoch": 952} {"train_loss": -11.299399375915527, "global_step": 159973, "epoch": 952} {"train_loss": -11.283140182495117, "global_step": 159974, "epoch": 952} {"train_loss": -11.270491600036621, "global_step": 159975, "epoch": 952} {"train_loss": -11.217572212219238, "global_step": 159976, "epoch": 952} {"train_loss": -11.301201820373535, "global_step": 159977, "epoch": 952} {"train_loss": -11.182659149169922, "global_step": 159978, "epoch": 952} {"train_loss": -11.208316802978516, "global_step": 159979, "epoch": 952} {"train_loss": -11.236007690429688, "global_step": 159980, "epoch": 952} {"train_loss": -10.98558235168457, "global_step": 159981, "epoch": 952} {"train_loss": -10.887147903442383, "global_step": 159982, "epoch": 952} {"train_loss": -10.912647247314453, "global_step": 159983, "epoch": 952} {"train_loss": -8.949238777160645, "global_step": 159984, "epoch": 952} {"train_loss": -9.913602828979492, "global_step": 159985, "epoch": 952} {"train_loss": -7.722530364990234, "global_step": 159986, "epoch": 952} {"train_loss": -9.713393211364746, "global_step": 159987, "epoch": 952} {"train_loss": -9.635163307189941, "global_step": 159988, "epoch": 952} {"train_loss": -9.174869537353516, "global_step": 159989, "epoch": 952} {"train_loss": -10.532718658447266, "global_step": 159990, "epoch": 952} {"train_loss": -10.170793533325195, "global_step": 159991, "epoch": 952} {"train_loss": -10.289942741394043, "global_step": 159992, "epoch": 952} {"train_loss": -10.05508041381836, "global_step": 159993, "epoch": 952} {"train_loss": -9.627513885498047, "global_step": 159994, "epoch": 952} {"train_loss": -9.970137596130371, "global_step": 159995, "epoch": 952} {"train_loss": -9.67113208770752, "global_step": 159996, "epoch": 952} {"train_loss": -10.02624797821045, "global_step": 159997, "epoch": 952} {"train_loss": -10.392629623413086, "global_step": 159998, "epoch": 952} {"train_loss": -9.812973022460938, "global_step": 159999, "epoch": 952} {"train_loss": -10.478532791137695, "global_step": 160000, "epoch": 952} {"train_loss": -10.009456634521484, "global_step": 160001, "epoch": 952} {"train_loss": -10.23933219909668, "global_step": 160002, "epoch": 952} {"train_loss": -9.989349365234375, "global_step": 160003, "epoch": 952} {"train_loss": -10.145585060119629, "global_step": 160004, "epoch": 952} {"train_loss": -10.26255989074707, "global_step": 160005, "epoch": 952} {"train_loss": -9.81303596496582, "global_step": 160006, "epoch": 952} {"train_loss": -9.933483123779297, "global_step": 160007, "epoch": 952} {"train_loss": -9.935745239257812, "global_step": 160008, "epoch": 952} {"train_loss": -9.847740173339844, "global_step": 160009, "epoch": 952} {"train_loss": -10.435714721679688, "global_step": 160010, "epoch": 952} {"train_loss": -10.43642807006836, "global_step": 160011, "epoch": 952} {"train_loss": -9.916885375976562, "global_step": 160012, "epoch": 952} {"train_loss": -10.641331672668457, "global_step": 160013, "epoch": 952} {"train_loss": -10.254660606384277, "global_step": 160014, "epoch": 952} {"train_loss": -10.437338829040527, "global_step": 160015, "epoch": 952} {"train_loss": -10.588418960571289, "global_step": 160016, "epoch": 952} {"train_loss": -10.351767539978027, "global_step": 160017, "epoch": 952} {"train_loss": -10.529125213623047, "global_step": 160018, "epoch": 952} {"train_loss": -10.509145736694336, "global_step": 160019, "epoch": 952} {"train_loss": -10.695682525634766, "global_step": 160020, "epoch": 952} {"train_loss": -10.432092666625977, "global_step": 160021, "epoch": 952} {"train_loss": -10.385416030883789, "global_step": 160022, "epoch": 952} {"train_loss": -10.703556060791016, "global_step": 160023, "epoch": 952} {"train_loss": -10.740705490112305, "global_step": 160024, "epoch": 952} {"train_loss": -10.703518867492676, "global_step": 160025, "epoch": 952} {"train_loss": -10.76774787902832, "global_step": 160026, "epoch": 952} {"train_loss": -10.609132766723633, "global_step": 160027, "epoch": 952} {"train_loss": -10.72701644897461, "global_step": 160028, "epoch": 952} {"train_loss": -10.715875625610352, "global_step": 160029, "epoch": 952} {"train_loss": -10.858782768249512, "global_step": 160030, "epoch": 952} {"train_loss": -10.723283767700195, "global_step": 160031, "epoch": 952} {"train_loss": -11.012834548950195, "global_step": 160032, "epoch": 952} {"train_loss": -10.628128051757812, "global_step": 160033, "epoch": 952} {"train_loss": -10.949682235717773, "global_step": 160034, "epoch": 952} {"train_loss": -10.954012870788574, "global_step": 160035, "epoch": 952} {"train_loss": -10.881744384765625, "global_step": 160036, "epoch": 952} {"train_loss": -10.833429336547852, "global_step": 160037, "epoch": 952} {"train_loss": -11.167665481567383, "global_step": 160038, "epoch": 952} {"train_loss": -10.957578659057617, "global_step": 160039, "epoch": 952} {"train_loss": -11.024855613708496, "global_step": 160040, "epoch": 952} {"train_loss": -11.099928855895996, "global_step": 160041, "epoch": 952} {"train_loss": -10.961405754089355, "global_step": 160042, "epoch": 952} {"train_loss": -11.031925201416016, "global_step": 160043, "epoch": 952} {"train_loss": -10.86125373840332, "global_step": 160044, "epoch": 952} {"train_loss": -11.22767448425293, "global_step": 160045, "epoch": 952} {"train_loss": -10.926308631896973, "global_step": 160046, "epoch": 952} {"train_loss": -11.054494857788086, "global_step": 160047, "epoch": 952} {"train_loss": -11.020073890686035, "global_step": 160048, "epoch": 952} {"train_loss": -11.12659740447998, "global_step": 160049, "epoch": 952} {"train_loss": -11.032562255859375, "global_step": 160050, "epoch": 952} {"train_loss": -11.133316993713379, "global_step": 160051, "epoch": 952} {"train_loss": -10.718048095703125, "global_step": 160052, "epoch": 952} {"train_loss": -10.865961074829102, "global_step": 160053, "epoch": 952} {"train_loss": -11.066863059997559, "global_step": 160054, "epoch": 952} {"train_loss": -11.025975227355957, "global_step": 160055, "epoch": 952} {"train_loss": -11.05026626586914, "global_step": 160056, "epoch": 952} {"train_loss": -11.237959861755371, "global_step": 160057, "epoch": 952} {"train_loss": -10.925516128540039, "global_step": 160058, "epoch": 952} {"train_loss": -11.302940368652344, "global_step": 160059, "epoch": 952} {"train_loss": -11.105520248413086, "global_step": 160060, "epoch": 952} {"train_loss": -11.358129501342773, "global_step": 160061, "epoch": 952} {"train_loss": -11.303359985351562, "global_step": 160062, "epoch": 952} {"train_loss": -11.168954849243164, "global_step": 160063, "epoch": 952} {"train_loss": -11.353313446044922, "global_step": 160064, "epoch": 952} {"train_loss": -11.21848201751709, "global_step": 160065, "epoch": 952} {"train_loss": -11.310905456542969, "global_step": 160066, "epoch": 952} {"train_loss": -11.201618194580078, "global_step": 160067, "epoch": 952} {"train_loss": -11.309662818908691, "global_step": 160068, "epoch": 952} {"train_loss": -11.128724098205566, "global_step": 160069, "epoch": 952} {"train_loss": -11.386167526245117, "global_step": 160070, "epoch": 952} {"train_loss": -11.044017791748047, "global_step": 160071, "epoch": 952} {"train_loss": -10.869831085205078, "global_step": 160072, "epoch": 952} {"train_loss": -11.022773742675781, "global_step": 160073, "epoch": 952} {"train_loss": -11.15776252746582, "global_step": 160074, "epoch": 952} {"train_loss": -11.20411491394043, "global_step": 160075, "epoch": 952} {"train_loss": -10.99249267578125, "global_step": 160076, "epoch": 952} {"train_loss": -11.103670120239258, "global_step": 160077, "epoch": 952} {"train_loss": -10.98164176940918, "global_step": 160078, "epoch": 952} {"train_loss": -10.884360313415527, "global_step": 160079, "epoch": 952} {"train_loss": -10.700898170471191, "global_step": 160080, "epoch": 952} {"train_loss": -10.174615859985352, "global_step": 160081, "epoch": 952} {"train_loss": -10.250229835510254, "global_step": 160082, "epoch": 952} {"train_loss": -11.332886695861816, "global_step": 160083, "epoch": 952} {"train_loss": -10.325088500976562, "global_step": 160084, "epoch": 952} {"train_loss": -10.321269989013672, "global_step": 160085, "epoch": 952} {"train_loss": -10.2281494140625, "global_step": 160086, "epoch": 952} {"train_loss": -10.004786491394043, "global_step": 160087, "epoch": 952} {"train_loss": -7.84710693359375, "global_step": 160088, "epoch": 952} {"train_loss": -8.483988761901855, "global_step": 160089, "epoch": 952} {"train_loss": -10.230396270751953, "global_step": 160090, "epoch": 952} {"train_loss": -8.777027130126953, "global_step": 160091, "epoch": 952} {"train_loss": -8.541519165039062, "global_step": 160092, "epoch": 952} {"train_loss": -9.164299011230469, "global_step": 160093, "epoch": 952} {"train_loss": -9.155752182006836, "global_step": 160094, "epoch": 952} {"train_loss": -9.040071487426758, "global_step": 160095, "epoch": 952} {"train_loss": -10.419893264770508, "global_step": 160096, "epoch": 952} {"train_loss": -9.783758163452148, "global_step": 160097, "epoch": 952} {"train_loss": -10.140349388122559, "global_step": 160098, "epoch": 952} {"train_loss": -10.246597290039062, "global_step": 160099, "epoch": 952} {"train_loss": -10.2389554977417, "global_step": 160100, "epoch": 952} {"train_loss": -9.950833320617676, "global_step": 160101, "epoch": 952} {"train_loss": -10.358369827270508, "global_step": 160102, "epoch": 952} {"train_loss": -10.599383655048552, "global_step": 160103, "epoch": 952, "val_loss": 221510.46875} {"train_loss": -10.417192459106445, "global_step": 160104, "epoch": 953} {"train_loss": -10.123777389526367, "global_step": 160105, "epoch": 953} {"train_loss": -10.542051315307617, "global_step": 160106, "epoch": 953} {"train_loss": -10.2135009765625, "global_step": 160107, "epoch": 953} {"train_loss": -10.600841522216797, "global_step": 160108, "epoch": 953} {"train_loss": -10.402231216430664, "global_step": 160109, "epoch": 953} {"train_loss": -10.330979347229004, "global_step": 160110, "epoch": 953} {"train_loss": -10.682085990905762, "global_step": 160111, "epoch": 953} {"train_loss": -10.748037338256836, "global_step": 160112, "epoch": 953} {"train_loss": -10.544815063476562, "global_step": 160113, "epoch": 953} {"train_loss": -10.578227043151855, "global_step": 160114, "epoch": 953} {"train_loss": -10.717484474182129, "global_step": 160115, "epoch": 953} {"train_loss": -10.801815032958984, "global_step": 160116, "epoch": 953} {"train_loss": -10.598688125610352, "global_step": 160117, "epoch": 953} {"train_loss": -10.705117225646973, "global_step": 160118, "epoch": 953} {"train_loss": -10.785783767700195, "global_step": 160119, "epoch": 953} {"train_loss": -10.923934936523438, "global_step": 160120, "epoch": 953} {"train_loss": -10.746357917785645, "global_step": 160121, "epoch": 953} {"train_loss": -10.714401245117188, "global_step": 160122, "epoch": 953} {"train_loss": -10.75713062286377, "global_step": 160123, "epoch": 953} {"train_loss": -10.730987548828125, "global_step": 160124, "epoch": 953} {"train_loss": -10.770086288452148, "global_step": 160125, "epoch": 953} {"train_loss": -11.10948371887207, "global_step": 160126, "epoch": 953} {"train_loss": -10.701372146606445, "global_step": 160127, "epoch": 953} {"train_loss": -10.753377914428711, "global_step": 160128, "epoch": 953} {"train_loss": -10.95608901977539, "global_step": 160129, "epoch": 953} {"train_loss": -10.840019226074219, "global_step": 160130, "epoch": 953} {"train_loss": -10.845687866210938, "global_step": 160131, "epoch": 953} {"train_loss": -10.840957641601562, "global_step": 160132, "epoch": 953} {"train_loss": -10.893294334411621, "global_step": 160133, "epoch": 953} {"train_loss": -10.774665832519531, "global_step": 160134, "epoch": 953} {"train_loss": -10.741802215576172, "global_step": 160135, "epoch": 953} {"train_loss": -10.842998504638672, "global_step": 160136, "epoch": 953} {"train_loss": -11.023826599121094, "global_step": 160137, "epoch": 953} {"train_loss": -10.852493286132812, "global_step": 160138, "epoch": 953} {"train_loss": -10.758560180664062, "global_step": 160139, "epoch": 953} {"train_loss": -11.017766952514648, "global_step": 160140, "epoch": 953} {"train_loss": -11.07416820526123, "global_step": 160141, "epoch": 953} {"train_loss": -11.094454765319824, "global_step": 160142, "epoch": 953} {"train_loss": -10.862030029296875, "global_step": 160143, "epoch": 953} {"train_loss": -10.79566764831543, "global_step": 160144, "epoch": 953} {"train_loss": -11.314237594604492, "global_step": 160145, "epoch": 953} {"train_loss": -10.981393814086914, "global_step": 160146, "epoch": 953} {"train_loss": -11.121564865112305, "global_step": 160147, "epoch": 953} {"train_loss": -11.139200210571289, "global_step": 160148, "epoch": 953} {"train_loss": -10.928472518920898, "global_step": 160149, "epoch": 953} {"train_loss": -11.103192329406738, "global_step": 160150, "epoch": 953} {"train_loss": -10.916463851928711, "global_step": 160151, "epoch": 953} {"train_loss": -11.033552169799805, "global_step": 160152, "epoch": 953} {"train_loss": -10.993001937866211, "global_step": 160153, "epoch": 953} {"train_loss": -10.95404052734375, "global_step": 160154, "epoch": 953} {"train_loss": -11.065642356872559, "global_step": 160155, "epoch": 953} {"train_loss": -10.702466011047363, "global_step": 160156, "epoch": 953} {"train_loss": -10.950835227966309, "global_step": 160157, "epoch": 953} {"train_loss": -10.90471076965332, "global_step": 160158, "epoch": 953} {"train_loss": -10.928024291992188, "global_step": 160159, "epoch": 953} {"train_loss": -10.488306999206543, "global_step": 160160, "epoch": 953} {"train_loss": -10.44681167602539, "global_step": 160161, "epoch": 953} {"train_loss": -10.599413871765137, "global_step": 160162, "epoch": 953} {"train_loss": -10.561769485473633, "global_step": 160163, "epoch": 953} {"train_loss": -10.83411979675293, "global_step": 160164, "epoch": 953} {"train_loss": -10.870779037475586, "global_step": 160165, "epoch": 953} {"train_loss": -10.458709716796875, "global_step": 160166, "epoch": 953} {"train_loss": -10.405942916870117, "global_step": 160167, "epoch": 953} {"train_loss": -10.306877136230469, "global_step": 160168, "epoch": 953} {"train_loss": -10.200215339660645, "global_step": 160169, "epoch": 953} {"train_loss": -9.458578109741211, "global_step": 160170, "epoch": 953} {"train_loss": -10.29286003112793, "global_step": 160171, "epoch": 953} {"train_loss": -10.634581565856934, "global_step": 160172, "epoch": 953} {"train_loss": -10.294569969177246, "global_step": 160173, "epoch": 953} {"train_loss": -10.35584831237793, "global_step": 160174, "epoch": 953} {"train_loss": -10.808876037597656, "global_step": 160175, "epoch": 953} {"train_loss": -10.117789268493652, "global_step": 160176, "epoch": 953} {"train_loss": -10.651815414428711, "global_step": 160177, "epoch": 953} {"train_loss": -10.511186599731445, "global_step": 160178, "epoch": 953} {"train_loss": -10.278960227966309, "global_step": 160179, "epoch": 953} {"train_loss": -10.487092971801758, "global_step": 160180, "epoch": 953} {"train_loss": -10.753728866577148, "global_step": 160181, "epoch": 953} {"train_loss": -10.761627197265625, "global_step": 160182, "epoch": 953} {"train_loss": -10.956674575805664, "global_step": 160183, "epoch": 953} {"train_loss": -10.833346366882324, "global_step": 160184, "epoch": 953} {"train_loss": -10.733405113220215, "global_step": 160185, "epoch": 953} {"train_loss": -10.851380348205566, "global_step": 160186, "epoch": 953} {"train_loss": -10.61945915222168, "global_step": 160187, "epoch": 953} {"train_loss": -10.895998001098633, "global_step": 160188, "epoch": 953} {"train_loss": -10.749181747436523, "global_step": 160189, "epoch": 953} {"train_loss": -10.607503890991211, "global_step": 160190, "epoch": 953} {"train_loss": -10.831398010253906, "global_step": 160191, "epoch": 953} {"train_loss": -10.8125581741333, "global_step": 160192, "epoch": 953} {"train_loss": -10.97862434387207, "global_step": 160193, "epoch": 953} {"train_loss": -10.657940864562988, "global_step": 160194, "epoch": 953} {"train_loss": -10.96876049041748, "global_step": 160195, "epoch": 953} {"train_loss": -11.182159423828125, "global_step": 160196, "epoch": 953} {"train_loss": -10.763078689575195, "global_step": 160197, "epoch": 953} {"train_loss": -10.763338088989258, "global_step": 160198, "epoch": 953} {"train_loss": -10.628118515014648, "global_step": 160199, "epoch": 953} {"train_loss": -11.068814277648926, "global_step": 160200, "epoch": 953} {"train_loss": -10.7210693359375, "global_step": 160201, "epoch": 953} {"train_loss": -10.645805358886719, "global_step": 160202, "epoch": 953} {"train_loss": -11.097578048706055, "global_step": 160203, "epoch": 953} {"train_loss": -10.659646987915039, "global_step": 160204, "epoch": 953} {"train_loss": -10.962387084960938, "global_step": 160205, "epoch": 953} {"train_loss": -10.695137023925781, "global_step": 160206, "epoch": 953} {"train_loss": -10.806857109069824, "global_step": 160207, "epoch": 953} {"train_loss": -10.784395217895508, "global_step": 160208, "epoch": 953} {"train_loss": -10.556074142456055, "global_step": 160209, "epoch": 953} {"train_loss": -10.421041488647461, "global_step": 160210, "epoch": 953} {"train_loss": -10.602400779724121, "global_step": 160211, "epoch": 953} {"train_loss": -10.753913879394531, "global_step": 160212, "epoch": 953} {"train_loss": -10.636404991149902, "global_step": 160213, "epoch": 953} {"train_loss": -10.766647338867188, "global_step": 160214, "epoch": 953} {"train_loss": -11.186182022094727, "global_step": 160215, "epoch": 953} {"train_loss": -11.003312110900879, "global_step": 160216, "epoch": 953} {"train_loss": -10.587971687316895, "global_step": 160217, "epoch": 953} {"train_loss": -10.7740478515625, "global_step": 160218, "epoch": 953} {"train_loss": -10.524465560913086, "global_step": 160219, "epoch": 953} {"train_loss": -10.891592979431152, "global_step": 160220, "epoch": 953} {"train_loss": -10.740449905395508, "global_step": 160221, "epoch": 953} {"train_loss": -10.666560173034668, "global_step": 160222, "epoch": 953} {"train_loss": -10.894943237304688, "global_step": 160223, "epoch": 953} {"train_loss": -10.506898880004883, "global_step": 160224, "epoch": 953} {"train_loss": -10.597705841064453, "global_step": 160225, "epoch": 953} {"train_loss": -10.704546928405762, "global_step": 160226, "epoch": 953} {"train_loss": -10.855224609375, "global_step": 160227, "epoch": 953} {"train_loss": -10.932072639465332, "global_step": 160228, "epoch": 953} {"train_loss": -11.030109405517578, "global_step": 160229, "epoch": 953} {"train_loss": -10.678525924682617, "global_step": 160230, "epoch": 953} {"train_loss": -10.68786907196045, "global_step": 160231, "epoch": 953} {"train_loss": -10.900375366210938, "global_step": 160232, "epoch": 953} {"train_loss": -10.629279136657715, "global_step": 160233, "epoch": 953} {"train_loss": -11.18738842010498, "global_step": 160234, "epoch": 953} {"train_loss": -11.081021308898926, "global_step": 160235, "epoch": 953} {"train_loss": -10.779901504516602, "global_step": 160236, "epoch": 953} {"train_loss": -11.096308708190918, "global_step": 160237, "epoch": 953} {"train_loss": -10.930855751037598, "global_step": 160238, "epoch": 953} {"train_loss": -11.14799976348877, "global_step": 160239, "epoch": 953} {"train_loss": -10.979515075683594, "global_step": 160240, "epoch": 953} {"train_loss": -11.120800018310547, "global_step": 160241, "epoch": 953} {"train_loss": -10.944358825683594, "global_step": 160242, "epoch": 953} {"train_loss": -11.039817810058594, "global_step": 160243, "epoch": 953} {"train_loss": -11.034589767456055, "global_step": 160244, "epoch": 953} {"train_loss": -11.138195037841797, "global_step": 160245, "epoch": 953} {"train_loss": -11.293906211853027, "global_step": 160246, "epoch": 953} {"train_loss": -11.078253746032715, "global_step": 160247, "epoch": 953} {"train_loss": -11.056260108947754, "global_step": 160248, "epoch": 953} {"train_loss": -11.040035247802734, "global_step": 160249, "epoch": 953} {"train_loss": -11.06755256652832, "global_step": 160250, "epoch": 953} {"train_loss": -11.18746566772461, "global_step": 160251, "epoch": 953} {"train_loss": -11.105486869812012, "global_step": 160252, "epoch": 953} {"train_loss": -11.167146682739258, "global_step": 160253, "epoch": 953} {"train_loss": -11.035781860351562, "global_step": 160254, "epoch": 953} {"train_loss": -11.127975463867188, "global_step": 160255, "epoch": 953} {"train_loss": -11.112272262573242, "global_step": 160256, "epoch": 953} {"train_loss": -11.129295349121094, "global_step": 160257, "epoch": 953} {"train_loss": -11.423774719238281, "global_step": 160258, "epoch": 953} {"train_loss": -11.104926109313965, "global_step": 160259, "epoch": 953} {"train_loss": -11.108702659606934, "global_step": 160260, "epoch": 953} {"train_loss": -11.202367782592773, "global_step": 160261, "epoch": 953} {"train_loss": -11.018770217895508, "global_step": 160262, "epoch": 953} {"train_loss": -11.07734203338623, "global_step": 160263, "epoch": 953} {"train_loss": -11.275093078613281, "global_step": 160264, "epoch": 953} {"train_loss": -11.137443542480469, "global_step": 160265, "epoch": 953} {"train_loss": -11.042680740356445, "global_step": 160266, "epoch": 953} {"train_loss": -11.004481315612793, "global_step": 160267, "epoch": 953} {"train_loss": -11.141592979431152, "global_step": 160268, "epoch": 953} {"train_loss": -10.862659454345703, "global_step": 160269, "epoch": 953} {"train_loss": -11.220196723937988, "global_step": 160270, "epoch": 953} {"train_loss": -10.814780751864115, "global_step": 160271, "epoch": 953, "val_loss": 233132.5} {"train_loss": -9.898529052734375, "global_step": 160272, "epoch": 954} {"train_loss": -10.307315826416016, "global_step": 160273, "epoch": 954} {"train_loss": -10.05908203125, "global_step": 160274, "epoch": 954} {"train_loss": -10.407245635986328, "global_step": 160275, "epoch": 954} {"train_loss": -10.494152069091797, "global_step": 160276, "epoch": 954} {"train_loss": -10.340080261230469, "global_step": 160277, "epoch": 954} {"train_loss": -10.022680282592773, "global_step": 160278, "epoch": 954} {"train_loss": -10.699649810791016, "global_step": 160279, "epoch": 954} {"train_loss": -9.792476654052734, "global_step": 160280, "epoch": 954} {"train_loss": -10.466758728027344, "global_step": 160281, "epoch": 954} {"train_loss": -10.373332977294922, "global_step": 160282, "epoch": 954} {"train_loss": -9.902040481567383, "global_step": 160283, "epoch": 954} {"train_loss": -10.661581039428711, "global_step": 160284, "epoch": 954} {"train_loss": -10.217815399169922, "global_step": 160285, "epoch": 954} {"train_loss": -10.495718002319336, "global_step": 160286, "epoch": 954} {"train_loss": -10.60856819152832, "global_step": 160287, "epoch": 954} {"train_loss": -10.378385543823242, "global_step": 160288, "epoch": 954} {"train_loss": -10.772157669067383, "global_step": 160289, "epoch": 954} {"train_loss": -10.463664054870605, "global_step": 160290, "epoch": 954} {"train_loss": -10.206469535827637, "global_step": 160291, "epoch": 954} {"train_loss": -10.63850212097168, "global_step": 160292, "epoch": 954} {"train_loss": -10.738774299621582, "global_step": 160293, "epoch": 954} {"train_loss": -10.799208641052246, "global_step": 160294, "epoch": 954} {"train_loss": -10.913625717163086, "global_step": 160295, "epoch": 954} {"train_loss": -10.58165168762207, "global_step": 160296, "epoch": 954} {"train_loss": -10.59846305847168, "global_step": 160297, "epoch": 954} {"train_loss": -10.849868774414062, "global_step": 160298, "epoch": 954} {"train_loss": -10.80597972869873, "global_step": 160299, "epoch": 954} {"train_loss": -10.647085189819336, "global_step": 160300, "epoch": 954} {"train_loss": -10.934770584106445, "global_step": 160301, "epoch": 954} {"train_loss": -10.932195663452148, "global_step": 160302, "epoch": 954} {"train_loss": -10.782782554626465, "global_step": 160303, "epoch": 954} {"train_loss": -10.61398696899414, "global_step": 160304, "epoch": 954} {"train_loss": -10.945053100585938, "global_step": 160305, "epoch": 954} {"train_loss": -10.49180793762207, "global_step": 160306, "epoch": 954} {"train_loss": -10.928564071655273, "global_step": 160307, "epoch": 954} {"train_loss": -10.748714447021484, "global_step": 160308, "epoch": 954} {"train_loss": -10.480386734008789, "global_step": 160309, "epoch": 954} {"train_loss": -10.665245056152344, "global_step": 160310, "epoch": 954} {"train_loss": -10.558834075927734, "global_step": 160311, "epoch": 954} {"train_loss": -11.0845947265625, "global_step": 160312, "epoch": 954} {"train_loss": -10.524460792541504, "global_step": 160313, "epoch": 954} {"train_loss": -10.738997459411621, "global_step": 160314, "epoch": 954} {"train_loss": -10.449722290039062, "global_step": 160315, "epoch": 954} {"train_loss": -10.332050323486328, "global_step": 160316, "epoch": 954} {"train_loss": -10.636449813842773, "global_step": 160317, "epoch": 954} {"train_loss": -10.490275382995605, "global_step": 160318, "epoch": 954} {"train_loss": -10.775398254394531, "global_step": 160319, "epoch": 954} {"train_loss": -10.55196762084961, "global_step": 160320, "epoch": 954} {"train_loss": -10.677453994750977, "global_step": 160321, "epoch": 954} {"train_loss": -10.54060173034668, "global_step": 160322, "epoch": 954} {"train_loss": -10.416292190551758, "global_step": 160323, "epoch": 954} {"train_loss": -10.933311462402344, "global_step": 160324, "epoch": 954} {"train_loss": -10.909099578857422, "global_step": 160325, "epoch": 954} {"train_loss": -10.489255905151367, "global_step": 160326, "epoch": 954} {"train_loss": -10.80825424194336, "global_step": 160327, "epoch": 954} {"train_loss": -10.9679536819458, "global_step": 160328, "epoch": 954} {"train_loss": -10.887362480163574, "global_step": 160329, "epoch": 954} {"train_loss": -10.80561637878418, "global_step": 160330, "epoch": 954} {"train_loss": -10.981537818908691, "global_step": 160331, "epoch": 954} {"train_loss": -10.791574478149414, "global_step": 160332, "epoch": 954} {"train_loss": -10.730457305908203, "global_step": 160333, "epoch": 954} {"train_loss": -10.876133918762207, "global_step": 160334, "epoch": 954} {"train_loss": -10.805391311645508, "global_step": 160335, "epoch": 954} {"train_loss": -11.009822845458984, "global_step": 160336, "epoch": 954} {"train_loss": -10.898488998413086, "global_step": 160337, "epoch": 954} {"train_loss": -10.904195785522461, "global_step": 160338, "epoch": 954} {"train_loss": -11.009047508239746, "global_step": 160339, "epoch": 954} {"train_loss": -10.848995208740234, "global_step": 160340, "epoch": 954} {"train_loss": -10.890776634216309, "global_step": 160341, "epoch": 954} {"train_loss": -10.936495780944824, "global_step": 160342, "epoch": 954} {"train_loss": -10.88093376159668, "global_step": 160343, "epoch": 954} {"train_loss": -10.850975036621094, "global_step": 160344, "epoch": 954} {"train_loss": -10.890214920043945, "global_step": 160345, "epoch": 954} {"train_loss": -10.780755996704102, "global_step": 160346, "epoch": 954} {"train_loss": -11.021602630615234, "global_step": 160347, "epoch": 954} {"train_loss": -10.97523307800293, "global_step": 160348, "epoch": 954} {"train_loss": -10.937736511230469, "global_step": 160349, "epoch": 954} {"train_loss": -11.10568618774414, "global_step": 160350, "epoch": 954} {"train_loss": -11.065465927124023, "global_step": 160351, "epoch": 954} {"train_loss": -11.228353500366211, "global_step": 160352, "epoch": 954} {"train_loss": -11.103889465332031, "global_step": 160353, "epoch": 954} {"train_loss": -11.273124694824219, "global_step": 160354, "epoch": 954} {"train_loss": -11.188557624816895, "global_step": 160355, "epoch": 954} {"train_loss": -10.914840698242188, "global_step": 160356, "epoch": 954} {"train_loss": -11.197314262390137, "global_step": 160357, "epoch": 954} {"train_loss": -11.02743911743164, "global_step": 160358, "epoch": 954} {"train_loss": -11.08126163482666, "global_step": 160359, "epoch": 954} {"train_loss": -11.264694213867188, "global_step": 160360, "epoch": 954} {"train_loss": -11.15493392944336, "global_step": 160361, "epoch": 954} {"train_loss": -11.100292205810547, "global_step": 160362, "epoch": 954} {"train_loss": -11.068602561950684, "global_step": 160363, "epoch": 954} {"train_loss": -11.117165565490723, "global_step": 160364, "epoch": 954} {"train_loss": -11.274436950683594, "global_step": 160365, "epoch": 954} {"train_loss": -10.81104850769043, "global_step": 160366, "epoch": 954} {"train_loss": -11.372335433959961, "global_step": 160367, "epoch": 954} {"train_loss": -11.023818969726562, "global_step": 160368, "epoch": 954} {"train_loss": -11.296036720275879, "global_step": 160369, "epoch": 954} {"train_loss": -11.419479370117188, "global_step": 160370, "epoch": 954} {"train_loss": -10.76645278930664, "global_step": 160371, "epoch": 954} {"train_loss": -11.341448783874512, "global_step": 160372, "epoch": 954} {"train_loss": -10.685145378112793, "global_step": 160373, "epoch": 954} {"train_loss": -10.694639205932617, "global_step": 160374, "epoch": 954} {"train_loss": -10.558149337768555, "global_step": 160375, "epoch": 954} {"train_loss": -10.831779479980469, "global_step": 160376, "epoch": 954} {"train_loss": -10.546525955200195, "global_step": 160377, "epoch": 954} {"train_loss": -10.798973083496094, "global_step": 160378, "epoch": 954} {"train_loss": -10.774024963378906, "global_step": 160379, "epoch": 954} {"train_loss": -11.019157409667969, "global_step": 160380, "epoch": 954} {"train_loss": -11.129891395568848, "global_step": 160381, "epoch": 954} {"train_loss": -10.394500732421875, "global_step": 160382, "epoch": 954} {"train_loss": -10.856385231018066, "global_step": 160383, "epoch": 954} {"train_loss": -10.58076286315918, "global_step": 160384, "epoch": 954} {"train_loss": -11.027090072631836, "global_step": 160385, "epoch": 954} {"train_loss": -10.404372215270996, "global_step": 160386, "epoch": 954} {"train_loss": -10.552892684936523, "global_step": 160387, "epoch": 954} {"train_loss": -10.249998092651367, "global_step": 160388, "epoch": 954} {"train_loss": -10.545156478881836, "global_step": 160389, "epoch": 954} {"train_loss": -10.724133491516113, "global_step": 160390, "epoch": 954} {"train_loss": -10.900707244873047, "global_step": 160391, "epoch": 954} {"train_loss": -10.982455253601074, "global_step": 160392, "epoch": 954} {"train_loss": -10.862750053405762, "global_step": 160393, "epoch": 954} {"train_loss": -11.194685935974121, "global_step": 160394, "epoch": 954} {"train_loss": -10.995265007019043, "global_step": 160395, "epoch": 954} {"train_loss": -10.925798416137695, "global_step": 160396, "epoch": 954} {"train_loss": -10.988120079040527, "global_step": 160397, "epoch": 954} {"train_loss": -10.49468994140625, "global_step": 160398, "epoch": 954} {"train_loss": -11.053321838378906, "global_step": 160399, "epoch": 954} {"train_loss": -10.589576721191406, "global_step": 160400, "epoch": 954} {"train_loss": -10.881123542785645, "global_step": 160401, "epoch": 954} {"train_loss": -10.850900650024414, "global_step": 160402, "epoch": 954} {"train_loss": -10.730441093444824, "global_step": 160403, "epoch": 954} {"train_loss": -11.125179290771484, "global_step": 160404, "epoch": 954} {"train_loss": -10.39615535736084, "global_step": 160405, "epoch": 954} {"train_loss": -11.030832290649414, "global_step": 160406, "epoch": 954} {"train_loss": -10.001850128173828, "global_step": 160407, "epoch": 954} {"train_loss": -10.662221908569336, "global_step": 160408, "epoch": 954} {"train_loss": -10.645940780639648, "global_step": 160409, "epoch": 954} {"train_loss": -10.473288536071777, "global_step": 160410, "epoch": 954} {"train_loss": -10.467118263244629, "global_step": 160411, "epoch": 954} {"train_loss": -10.49586296081543, "global_step": 160412, "epoch": 954} {"train_loss": -10.645350456237793, "global_step": 160413, "epoch": 954} {"train_loss": -10.869771957397461, "global_step": 160414, "epoch": 954} {"train_loss": -10.77298355102539, "global_step": 160415, "epoch": 954} {"train_loss": -10.658761024475098, "global_step": 160416, "epoch": 954} {"train_loss": -10.965197563171387, "global_step": 160417, "epoch": 954} {"train_loss": -10.552309036254883, "global_step": 160418, "epoch": 954} {"train_loss": -10.763702392578125, "global_step": 160419, "epoch": 954} {"train_loss": -10.500799179077148, "global_step": 160420, "epoch": 954} {"train_loss": -9.934102058410645, "global_step": 160421, "epoch": 954} {"train_loss": -10.79196548461914, "global_step": 160422, "epoch": 954} {"train_loss": -10.516218185424805, "global_step": 160423, "epoch": 954} {"train_loss": -10.530115127563477, "global_step": 160424, "epoch": 954} {"train_loss": -10.6455078125, "global_step": 160425, "epoch": 954} {"train_loss": -10.758460998535156, "global_step": 160426, "epoch": 954} {"train_loss": -11.013121604919434, "global_step": 160427, "epoch": 954} {"train_loss": -10.521191596984863, "global_step": 160428, "epoch": 954} {"train_loss": -10.9427490234375, "global_step": 160429, "epoch": 954} {"train_loss": -10.397972106933594, "global_step": 160430, "epoch": 954} {"train_loss": -10.954049110412598, "global_step": 160431, "epoch": 954} {"train_loss": -10.314932823181152, "global_step": 160432, "epoch": 954} {"train_loss": -10.476707458496094, "global_step": 160433, "epoch": 954} {"train_loss": -10.432692527770996, "global_step": 160434, "epoch": 954} {"train_loss": -10.759910583496094, "global_step": 160435, "epoch": 954} {"train_loss": -10.709564208984375, "global_step": 160436, "epoch": 954} {"train_loss": -10.92419147491455, "global_step": 160437, "epoch": 954} {"train_loss": -11.010595321655273, "global_step": 160438, "epoch": 954} {"train_loss": -10.743721854119073, "global_step": 160439, "epoch": 954, "val_loss": 236009.234375} {"train_loss": -10.736096382141113, "global_step": 160440, "epoch": 955} {"train_loss": -10.970532417297363, "global_step": 160441, "epoch": 955} {"train_loss": -10.945674896240234, "global_step": 160442, "epoch": 955} {"train_loss": -10.998210906982422, "global_step": 160443, "epoch": 955} {"train_loss": -11.031630516052246, "global_step": 160444, "epoch": 955} {"train_loss": -11.319225311279297, "global_step": 160445, "epoch": 955} {"train_loss": -11.202874183654785, "global_step": 160446, "epoch": 955} {"train_loss": -11.02707290649414, "global_step": 160447, "epoch": 955} {"train_loss": -11.150907516479492, "global_step": 160448, "epoch": 955} {"train_loss": -11.252354621887207, "global_step": 160449, "epoch": 955} {"train_loss": -11.255958557128906, "global_step": 160450, "epoch": 955} {"train_loss": -11.049382209777832, "global_step": 160451, "epoch": 955} {"train_loss": -11.026267051696777, "global_step": 160452, "epoch": 955} {"train_loss": -11.210552215576172, "global_step": 160453, "epoch": 955} {"train_loss": -10.974102973937988, "global_step": 160454, "epoch": 955} {"train_loss": -11.366242408752441, "global_step": 160455, "epoch": 955} {"train_loss": -11.206653594970703, "global_step": 160456, "epoch": 955} {"train_loss": -11.164973258972168, "global_step": 160457, "epoch": 955} {"train_loss": -11.069109916687012, "global_step": 160458, "epoch": 955} {"train_loss": -10.971759796142578, "global_step": 160459, "epoch": 955} {"train_loss": -11.0455322265625, "global_step": 160460, "epoch": 955} {"train_loss": -10.876623153686523, "global_step": 160461, "epoch": 955} {"train_loss": -11.340860366821289, "global_step": 160462, "epoch": 955} {"train_loss": -11.101522445678711, "global_step": 160463, "epoch": 955} {"train_loss": -10.934627532958984, "global_step": 160464, "epoch": 955} {"train_loss": -11.018997192382812, "global_step": 160465, "epoch": 955} {"train_loss": -10.75963306427002, "global_step": 160466, "epoch": 955} {"train_loss": -11.186836242675781, "global_step": 160467, "epoch": 955} {"train_loss": -11.15079402923584, "global_step": 160468, "epoch": 955} {"train_loss": -11.044395446777344, "global_step": 160469, "epoch": 955} {"train_loss": -11.233478546142578, "global_step": 160470, "epoch": 955} {"train_loss": -11.195640563964844, "global_step": 160471, "epoch": 955} {"train_loss": -10.972537994384766, "global_step": 160472, "epoch": 955} {"train_loss": -11.11392593383789, "global_step": 160473, "epoch": 955} {"train_loss": -11.140059471130371, "global_step": 160474, "epoch": 955} {"train_loss": -10.707537651062012, "global_step": 160475, "epoch": 955} {"train_loss": -11.01584529876709, "global_step": 160476, "epoch": 955} {"train_loss": -10.912337303161621, "global_step": 160477, "epoch": 955} {"train_loss": -10.613203048706055, "global_step": 160478, "epoch": 955} {"train_loss": -10.983631134033203, "global_step": 160479, "epoch": 955} {"train_loss": -11.269937515258789, "global_step": 160480, "epoch": 955} {"train_loss": -11.263870239257812, "global_step": 160481, "epoch": 955} {"train_loss": -10.767380714416504, "global_step": 160482, "epoch": 955} {"train_loss": -11.111217498779297, "global_step": 160483, "epoch": 955} {"train_loss": -11.449514389038086, "global_step": 160484, "epoch": 955} {"train_loss": -11.15312671661377, "global_step": 160485, "epoch": 955} {"train_loss": -10.795719146728516, "global_step": 160486, "epoch": 955} {"train_loss": -10.699995040893555, "global_step": 160487, "epoch": 955} {"train_loss": -10.731485366821289, "global_step": 160488, "epoch": 955} {"train_loss": -10.703231811523438, "global_step": 160489, "epoch": 955} {"train_loss": -11.134233474731445, "global_step": 160490, "epoch": 955} {"train_loss": -11.001119613647461, "global_step": 160491, "epoch": 955} {"train_loss": -10.881229400634766, "global_step": 160492, "epoch": 955} {"train_loss": -10.610343933105469, "global_step": 160493, "epoch": 955} {"train_loss": -10.803766250610352, "global_step": 160494, "epoch": 955} {"train_loss": -11.019983291625977, "global_step": 160495, "epoch": 955} {"train_loss": -10.850530624389648, "global_step": 160496, "epoch": 955} {"train_loss": -10.878113746643066, "global_step": 160497, "epoch": 955} {"train_loss": -10.840374946594238, "global_step": 160498, "epoch": 955} {"train_loss": -10.341176986694336, "global_step": 160499, "epoch": 955} {"train_loss": -10.46578311920166, "global_step": 160500, "epoch": 955} {"train_loss": -9.593628883361816, "global_step": 160501, "epoch": 955} {"train_loss": -10.844740867614746, "global_step": 160502, "epoch": 955} {"train_loss": -9.357735633850098, "global_step": 160503, "epoch": 955} {"train_loss": -10.682432174682617, "global_step": 160504, "epoch": 955} {"train_loss": -10.413427352905273, "global_step": 160505, "epoch": 955} {"train_loss": -10.39852523803711, "global_step": 160506, "epoch": 955} {"train_loss": -10.77865219116211, "global_step": 160507, "epoch": 955} {"train_loss": -10.292193412780762, "global_step": 160508, "epoch": 955} {"train_loss": -10.737311363220215, "global_step": 160509, "epoch": 955} {"train_loss": -9.89577579498291, "global_step": 160510, "epoch": 955} {"train_loss": -10.836370468139648, "global_step": 160511, "epoch": 955} {"train_loss": -10.553946495056152, "global_step": 160512, "epoch": 955} {"train_loss": -10.737114906311035, "global_step": 160513, "epoch": 955} {"train_loss": -10.468378067016602, "global_step": 160514, "epoch": 955} {"train_loss": -10.614090919494629, "global_step": 160515, "epoch": 955} {"train_loss": -10.9689302444458, "global_step": 160516, "epoch": 955} {"train_loss": -10.75112533569336, "global_step": 160517, "epoch": 955} {"train_loss": -10.780230522155762, "global_step": 160518, "epoch": 955} {"train_loss": -10.618395805358887, "global_step": 160519, "epoch": 955} {"train_loss": -10.79649543762207, "global_step": 160520, "epoch": 955} {"train_loss": -10.979316711425781, "global_step": 160521, "epoch": 955} {"train_loss": -10.723398208618164, "global_step": 160522, "epoch": 955} {"train_loss": -10.970922470092773, "global_step": 160523, "epoch": 955} {"train_loss": -10.764120101928711, "global_step": 160524, "epoch": 955} {"train_loss": -10.968775749206543, "global_step": 160525, "epoch": 955} {"train_loss": -10.74945068359375, "global_step": 160526, "epoch": 955} {"train_loss": -10.715075492858887, "global_step": 160527, "epoch": 955} {"train_loss": -10.669994354248047, "global_step": 160528, "epoch": 955} {"train_loss": -10.493935585021973, "global_step": 160529, "epoch": 955} {"train_loss": -10.305269241333008, "global_step": 160530, "epoch": 955} {"train_loss": -11.065155029296875, "global_step": 160531, "epoch": 955} {"train_loss": -10.59826946258545, "global_step": 160532, "epoch": 955} {"train_loss": -10.672063827514648, "global_step": 160533, "epoch": 955} {"train_loss": -10.579025268554688, "global_step": 160534, "epoch": 955} {"train_loss": -10.309120178222656, "global_step": 160535, "epoch": 955} {"train_loss": -10.69304084777832, "global_step": 160536, "epoch": 955} {"train_loss": -9.880359649658203, "global_step": 160537, "epoch": 955} {"train_loss": -10.349225044250488, "global_step": 160538, "epoch": 955} {"train_loss": -10.139464378356934, "global_step": 160539, "epoch": 955} {"train_loss": -10.491891860961914, "global_step": 160540, "epoch": 955} {"train_loss": -10.296558380126953, "global_step": 160541, "epoch": 955} {"train_loss": -10.170684814453125, "global_step": 160542, "epoch": 955} {"train_loss": -10.558778762817383, "global_step": 160543, "epoch": 955} {"train_loss": -10.324970245361328, "global_step": 160544, "epoch": 955} {"train_loss": -9.905698776245117, "global_step": 160545, "epoch": 955} {"train_loss": -10.620612144470215, "global_step": 160546, "epoch": 955} {"train_loss": -10.003204345703125, "global_step": 160547, "epoch": 955} {"train_loss": -10.171218872070312, "global_step": 160548, "epoch": 955} {"train_loss": -10.58706283569336, "global_step": 160549, "epoch": 955} {"train_loss": -10.459393501281738, "global_step": 160550, "epoch": 955} {"train_loss": -10.265570640563965, "global_step": 160551, "epoch": 955} {"train_loss": -10.957822799682617, "global_step": 160552, "epoch": 955} {"train_loss": -10.345049858093262, "global_step": 160553, "epoch": 955} {"train_loss": -10.249465942382812, "global_step": 160554, "epoch": 955} {"train_loss": -11.052204132080078, "global_step": 160555, "epoch": 955} {"train_loss": -10.626066207885742, "global_step": 160556, "epoch": 955} {"train_loss": -10.760708808898926, "global_step": 160557, "epoch": 955} {"train_loss": -10.873064041137695, "global_step": 160558, "epoch": 955} {"train_loss": -10.893594741821289, "global_step": 160559, "epoch": 955} {"train_loss": -10.68628215789795, "global_step": 160560, "epoch": 955} {"train_loss": -10.915342330932617, "global_step": 160561, "epoch": 955} {"train_loss": -10.531949043273926, "global_step": 160562, "epoch": 955} {"train_loss": -10.826041221618652, "global_step": 160563, "epoch": 955} {"train_loss": -10.930282592773438, "global_step": 160564, "epoch": 955} {"train_loss": -10.73597526550293, "global_step": 160565, "epoch": 955} {"train_loss": -10.713125228881836, "global_step": 160566, "epoch": 955} {"train_loss": -10.791933059692383, "global_step": 160567, "epoch": 955} {"train_loss": -11.061210632324219, "global_step": 160568, "epoch": 955} {"train_loss": -10.731184005737305, "global_step": 160569, "epoch": 955} {"train_loss": -11.072399139404297, "global_step": 160570, "epoch": 955} {"train_loss": -11.045126914978027, "global_step": 160571, "epoch": 955} {"train_loss": -11.048249244689941, "global_step": 160572, "epoch": 955} {"train_loss": -10.81757926940918, "global_step": 160573, "epoch": 955} {"train_loss": -10.930891036987305, "global_step": 160574, "epoch": 955} {"train_loss": -11.213768005371094, "global_step": 160575, "epoch": 955} {"train_loss": -11.011310577392578, "global_step": 160576, "epoch": 955} {"train_loss": -11.00648021697998, "global_step": 160577, "epoch": 955} {"train_loss": -10.867950439453125, "global_step": 160578, "epoch": 955} {"train_loss": -10.81421184539795, "global_step": 160579, "epoch": 955} {"train_loss": -10.814391136169434, "global_step": 160580, "epoch": 955} {"train_loss": -11.068758964538574, "global_step": 160581, "epoch": 955} {"train_loss": -10.660279273986816, "global_step": 160582, "epoch": 955} {"train_loss": -10.675758361816406, "global_step": 160583, "epoch": 955} {"train_loss": -10.807080268859863, "global_step": 160584, "epoch": 955} {"train_loss": -10.925450325012207, "global_step": 160585, "epoch": 955} {"train_loss": -11.08035945892334, "global_step": 160586, "epoch": 955} {"train_loss": -10.789429664611816, "global_step": 160587, "epoch": 955} {"train_loss": -10.893156051635742, "global_step": 160588, "epoch": 955} {"train_loss": -11.01643180847168, "global_step": 160589, "epoch": 955} {"train_loss": -11.085057258605957, "global_step": 160590, "epoch": 955} {"train_loss": -11.091705322265625, "global_step": 160591, "epoch": 955} {"train_loss": -10.610228538513184, "global_step": 160592, "epoch": 955} {"train_loss": -10.855257987976074, "global_step": 160593, "epoch": 955} {"train_loss": -11.170632362365723, "global_step": 160594, "epoch": 955} {"train_loss": -10.597475051879883, "global_step": 160595, "epoch": 955} {"train_loss": -11.165072441101074, "global_step": 160596, "epoch": 955} {"train_loss": -10.630529403686523, "global_step": 160597, "epoch": 955} {"train_loss": -11.102598190307617, "global_step": 160598, "epoch": 955} {"train_loss": -10.869743347167969, "global_step": 160599, "epoch": 955} {"train_loss": -10.621328353881836, "global_step": 160600, "epoch": 955} {"train_loss": -11.217691421508789, "global_step": 160601, "epoch": 955} {"train_loss": -10.51333236694336, "global_step": 160602, "epoch": 955} {"train_loss": -10.352853775024414, "global_step": 160603, "epoch": 955} {"train_loss": -10.980751037597656, "global_step": 160604, "epoch": 955} {"train_loss": -10.818166732788086, "global_step": 160605, "epoch": 955} {"train_loss": -10.590299606323242, "global_step": 160606, "epoch": 955} {"train_loss": -10.798751666432334, "global_step": 160607, "epoch": 955, "val_loss": 234845.03125, "train_action_mse_error": 2.2872354984283447} {"train_loss": -10.382966995239258, "global_step": 160608, "epoch": 956} {"train_loss": -10.901819229125977, "global_step": 160609, "epoch": 956} {"train_loss": -10.567113876342773, "global_step": 160610, "epoch": 956} {"train_loss": -10.772038459777832, "global_step": 160611, "epoch": 956} {"train_loss": -11.022805213928223, "global_step": 160612, "epoch": 956} {"train_loss": -10.485395431518555, "global_step": 160613, "epoch": 956} {"train_loss": -10.293551445007324, "global_step": 160614, "epoch": 956} {"train_loss": -10.908437728881836, "global_step": 160615, "epoch": 956} {"train_loss": -10.462618827819824, "global_step": 160616, "epoch": 956} {"train_loss": -10.835607528686523, "global_step": 160617, "epoch": 956} {"train_loss": -10.414308547973633, "global_step": 160618, "epoch": 956} {"train_loss": -10.58289909362793, "global_step": 160619, "epoch": 956} {"train_loss": -10.566679000854492, "global_step": 160620, "epoch": 956} {"train_loss": -10.52927303314209, "global_step": 160621, "epoch": 956} {"train_loss": -10.677961349487305, "global_step": 160622, "epoch": 956} {"train_loss": -10.387070655822754, "global_step": 160623, "epoch": 956} {"train_loss": -10.567214965820312, "global_step": 160624, "epoch": 956} {"train_loss": -10.775494575500488, "global_step": 160625, "epoch": 956} {"train_loss": -10.968294143676758, "global_step": 160626, "epoch": 956} {"train_loss": -10.955175399780273, "global_step": 160627, "epoch": 956} {"train_loss": -11.087236404418945, "global_step": 160628, "epoch": 956} {"train_loss": -10.838281631469727, "global_step": 160629, "epoch": 956} {"train_loss": -10.982696533203125, "global_step": 160630, "epoch": 956} {"train_loss": -10.690718650817871, "global_step": 160631, "epoch": 956} {"train_loss": -10.68464469909668, "global_step": 160632, "epoch": 956} {"train_loss": -10.965713500976562, "global_step": 160633, "epoch": 956} {"train_loss": -10.576082229614258, "global_step": 160634, "epoch": 956} {"train_loss": -10.797283172607422, "global_step": 160635, "epoch": 956} {"train_loss": -10.964126586914062, "global_step": 160636, "epoch": 956} {"train_loss": -10.9488525390625, "global_step": 160637, "epoch": 956} {"train_loss": -10.870880126953125, "global_step": 160638, "epoch": 956} {"train_loss": -10.939558982849121, "global_step": 160639, "epoch": 956} {"train_loss": -10.511678695678711, "global_step": 160640, "epoch": 956} {"train_loss": -10.756887435913086, "global_step": 160641, "epoch": 956} {"train_loss": -10.814128875732422, "global_step": 160642, "epoch": 956} {"train_loss": -10.785449981689453, "global_step": 160643, "epoch": 956} {"train_loss": -10.886699676513672, "global_step": 160644, "epoch": 956} {"train_loss": -11.067023277282715, "global_step": 160645, "epoch": 956} {"train_loss": -10.975472450256348, "global_step": 160646, "epoch": 956} {"train_loss": -10.743045806884766, "global_step": 160647, "epoch": 956} {"train_loss": -10.975337028503418, "global_step": 160648, "epoch": 956} {"train_loss": -10.66736125946045, "global_step": 160649, "epoch": 956} {"train_loss": -11.087955474853516, "global_step": 160650, "epoch": 956} {"train_loss": -11.167882919311523, "global_step": 160651, "epoch": 956} {"train_loss": -10.802011489868164, "global_step": 160652, "epoch": 956} {"train_loss": -11.08317756652832, "global_step": 160653, "epoch": 956} {"train_loss": -10.922809600830078, "global_step": 160654, "epoch": 956} {"train_loss": -11.049184799194336, "global_step": 160655, "epoch": 956} {"train_loss": -11.080180168151855, "global_step": 160656, "epoch": 956} {"train_loss": -10.88508415222168, "global_step": 160657, "epoch": 956} {"train_loss": -11.062246322631836, "global_step": 160658, "epoch": 956} {"train_loss": -11.115005493164062, "global_step": 160659, "epoch": 956} {"train_loss": -11.1759033203125, "global_step": 160660, "epoch": 956} {"train_loss": -11.242266654968262, "global_step": 160661, "epoch": 956} {"train_loss": -11.190784454345703, "global_step": 160662, "epoch": 956} {"train_loss": -11.225883483886719, "global_step": 160663, "epoch": 956} {"train_loss": -10.94904899597168, "global_step": 160664, "epoch": 956} {"train_loss": -11.137511253356934, "global_step": 160665, "epoch": 956} {"train_loss": -10.855859756469727, "global_step": 160666, "epoch": 956} {"train_loss": -11.145406723022461, "global_step": 160667, "epoch": 956} {"train_loss": -11.123641014099121, "global_step": 160668, "epoch": 956} {"train_loss": -11.005188941955566, "global_step": 160669, "epoch": 956} {"train_loss": -11.056123733520508, "global_step": 160670, "epoch": 956} {"train_loss": -11.116327285766602, "global_step": 160671, "epoch": 956} {"train_loss": -10.729095458984375, "global_step": 160672, "epoch": 956} {"train_loss": -11.215181350708008, "global_step": 160673, "epoch": 956} {"train_loss": -10.666213989257812, "global_step": 160674, "epoch": 956} {"train_loss": -10.855356216430664, "global_step": 160675, "epoch": 956} {"train_loss": -10.87228775024414, "global_step": 160676, "epoch": 956} {"train_loss": -11.109223365783691, "global_step": 160677, "epoch": 956} {"train_loss": -10.837632179260254, "global_step": 160678, "epoch": 956} {"train_loss": -10.884720802307129, "global_step": 160679, "epoch": 956} {"train_loss": -10.894684791564941, "global_step": 160680, "epoch": 956} {"train_loss": -10.57981014251709, "global_step": 160681, "epoch": 956} {"train_loss": -10.48663330078125, "global_step": 160682, "epoch": 956} {"train_loss": -10.616975784301758, "global_step": 160683, "epoch": 956} {"train_loss": -11.040140151977539, "global_step": 160684, "epoch": 956} {"train_loss": -10.408123016357422, "global_step": 160685, "epoch": 956} {"train_loss": -10.242966651916504, "global_step": 160686, "epoch": 956} {"train_loss": -11.197763442993164, "global_step": 160687, "epoch": 956} {"train_loss": -10.404621124267578, "global_step": 160688, "epoch": 956} {"train_loss": -10.866294860839844, "global_step": 160689, "epoch": 956} {"train_loss": -11.042359352111816, "global_step": 160690, "epoch": 956} {"train_loss": -10.641206741333008, "global_step": 160691, "epoch": 956} {"train_loss": -10.589912414550781, "global_step": 160692, "epoch": 956} {"train_loss": -10.690999984741211, "global_step": 160693, "epoch": 956} {"train_loss": -11.098997116088867, "global_step": 160694, "epoch": 956} {"train_loss": -10.731417655944824, "global_step": 160695, "epoch": 956} {"train_loss": -10.724693298339844, "global_step": 160696, "epoch": 956} {"train_loss": -10.766658782958984, "global_step": 160697, "epoch": 956} {"train_loss": -10.760032653808594, "global_step": 160698, "epoch": 956} {"train_loss": -10.851472854614258, "global_step": 160699, "epoch": 956} {"train_loss": -10.745193481445312, "global_step": 160700, "epoch": 956} {"train_loss": -10.735597610473633, "global_step": 160701, "epoch": 956} {"train_loss": -10.709638595581055, "global_step": 160702, "epoch": 956} {"train_loss": -10.380651473999023, "global_step": 160703, "epoch": 956} {"train_loss": -10.790071487426758, "global_step": 160704, "epoch": 956} {"train_loss": -11.020017623901367, "global_step": 160705, "epoch": 956} {"train_loss": -10.30640983581543, "global_step": 160706, "epoch": 956} {"train_loss": -10.718038558959961, "global_step": 160707, "epoch": 956} {"train_loss": -10.581487655639648, "global_step": 160708, "epoch": 956} {"train_loss": -11.061527252197266, "global_step": 160709, "epoch": 956} {"train_loss": -10.922004699707031, "global_step": 160710, "epoch": 956} {"train_loss": -11.091032981872559, "global_step": 160711, "epoch": 956} {"train_loss": -11.022321701049805, "global_step": 160712, "epoch": 956} {"train_loss": -10.755729675292969, "global_step": 160713, "epoch": 956} {"train_loss": -10.912562370300293, "global_step": 160714, "epoch": 956} {"train_loss": -10.965048789978027, "global_step": 160715, "epoch": 956} {"train_loss": -10.75822925567627, "global_step": 160716, "epoch": 956} {"train_loss": -11.195605278015137, "global_step": 160717, "epoch": 956} {"train_loss": -10.843987464904785, "global_step": 160718, "epoch": 956} {"train_loss": -11.140645980834961, "global_step": 160719, "epoch": 956} {"train_loss": -11.138971328735352, "global_step": 160720, "epoch": 956} {"train_loss": -10.971020698547363, "global_step": 160721, "epoch": 956} {"train_loss": -11.004501342773438, "global_step": 160722, "epoch": 956} {"train_loss": -11.156463623046875, "global_step": 160723, "epoch": 956} {"train_loss": -11.056079864501953, "global_step": 160724, "epoch": 956} {"train_loss": -10.924168586730957, "global_step": 160725, "epoch": 956} {"train_loss": -10.924156188964844, "global_step": 160726, "epoch": 956} {"train_loss": -10.671865463256836, "global_step": 160727, "epoch": 956} {"train_loss": -11.063997268676758, "global_step": 160728, "epoch": 956} {"train_loss": -10.686752319335938, "global_step": 160729, "epoch": 956} {"train_loss": -10.921551704406738, "global_step": 160730, "epoch": 956} {"train_loss": -10.893367767333984, "global_step": 160731, "epoch": 956} {"train_loss": -10.901067733764648, "global_step": 160732, "epoch": 956} {"train_loss": -11.005365371704102, "global_step": 160733, "epoch": 956} {"train_loss": -11.023222923278809, "global_step": 160734, "epoch": 956} {"train_loss": -11.013429641723633, "global_step": 160735, "epoch": 956} {"train_loss": -11.110488891601562, "global_step": 160736, "epoch": 956} {"train_loss": -10.965850830078125, "global_step": 160737, "epoch": 956} {"train_loss": -10.89190673828125, "global_step": 160738, "epoch": 956} {"train_loss": -11.12718391418457, "global_step": 160739, "epoch": 956} {"train_loss": -10.879776954650879, "global_step": 160740, "epoch": 956} {"train_loss": -11.030539512634277, "global_step": 160741, "epoch": 956} {"train_loss": -10.887134552001953, "global_step": 160742, "epoch": 956} {"train_loss": -11.117424011230469, "global_step": 160743, "epoch": 956} {"train_loss": -11.163039207458496, "global_step": 160744, "epoch": 956} {"train_loss": -10.929841995239258, "global_step": 160745, "epoch": 956} {"train_loss": -11.288470268249512, "global_step": 160746, "epoch": 956} {"train_loss": -10.817014694213867, "global_step": 160747, "epoch": 956} {"train_loss": -10.744058609008789, "global_step": 160748, "epoch": 956} {"train_loss": -10.960587501525879, "global_step": 160749, "epoch": 956} {"train_loss": -10.712783813476562, "global_step": 160750, "epoch": 956} {"train_loss": -10.88076400756836, "global_step": 160751, "epoch": 956} {"train_loss": -10.293268203735352, "global_step": 160752, "epoch": 956} {"train_loss": -11.279827117919922, "global_step": 160753, "epoch": 956} {"train_loss": -10.423049926757812, "global_step": 160754, "epoch": 956} {"train_loss": -10.870583534240723, "global_step": 160755, "epoch": 956} {"train_loss": -10.305052757263184, "global_step": 160756, "epoch": 956} {"train_loss": -10.442865371704102, "global_step": 160757, "epoch": 956} {"train_loss": -10.285526275634766, "global_step": 160758, "epoch": 956} {"train_loss": -10.506904602050781, "global_step": 160759, "epoch": 956} {"train_loss": -10.383260726928711, "global_step": 160760, "epoch": 956} {"train_loss": -9.601014137268066, "global_step": 160761, "epoch": 956} {"train_loss": -9.94827651977539, "global_step": 160762, "epoch": 956} {"train_loss": -9.506645202636719, "global_step": 160763, "epoch": 956} {"train_loss": -9.292741775512695, "global_step": 160764, "epoch": 956} {"train_loss": -10.18203353881836, "global_step": 160765, "epoch": 956} {"train_loss": -9.163494110107422, "global_step": 160766, "epoch": 956} {"train_loss": -8.99560546875, "global_step": 160767, "epoch": 956} {"train_loss": -10.05443000793457, "global_step": 160768, "epoch": 956} {"train_loss": -9.462116241455078, "global_step": 160769, "epoch": 956} {"train_loss": -10.300479888916016, "global_step": 160770, "epoch": 956} {"train_loss": -8.835514068603516, "global_step": 160771, "epoch": 956} {"train_loss": -8.50535774230957, "global_step": 160772, "epoch": 956} {"train_loss": -9.73696517944336, "global_step": 160773, "epoch": 956} {"train_loss": -10.153657913208008, "global_step": 160774, "epoch": 956} {"train_loss": -10.732811836969285, "global_step": 160775, "epoch": 956, "val_loss": 230883.359375} {"train_loss": -9.573912620544434, "global_step": 160776, "epoch": 957} {"train_loss": -9.748758316040039, "global_step": 160777, "epoch": 957} {"train_loss": -10.660531997680664, "global_step": 160778, "epoch": 957} {"train_loss": -9.652933120727539, "global_step": 160779, "epoch": 957} {"train_loss": -9.798391342163086, "global_step": 160780, "epoch": 957} {"train_loss": -10.676301002502441, "global_step": 160781, "epoch": 957} {"train_loss": -9.545541763305664, "global_step": 160782, "epoch": 957} {"train_loss": -10.168641090393066, "global_step": 160783, "epoch": 957} {"train_loss": -9.986696243286133, "global_step": 160784, "epoch": 957} {"train_loss": -10.298839569091797, "global_step": 160785, "epoch": 957} {"train_loss": -10.198505401611328, "global_step": 160786, "epoch": 957} {"train_loss": -10.14345932006836, "global_step": 160787, "epoch": 957} {"train_loss": -10.643967628479004, "global_step": 160788, "epoch": 957} {"train_loss": -10.154730796813965, "global_step": 160789, "epoch": 957} {"train_loss": -10.055326461791992, "global_step": 160790, "epoch": 957} {"train_loss": -10.550661087036133, "global_step": 160791, "epoch": 957} {"train_loss": -10.352978706359863, "global_step": 160792, "epoch": 957} {"train_loss": -10.461265563964844, "global_step": 160793, "epoch": 957} {"train_loss": -10.504081726074219, "global_step": 160794, "epoch": 957} {"train_loss": -10.389686584472656, "global_step": 160795, "epoch": 957} {"train_loss": -10.606744766235352, "global_step": 160796, "epoch": 957} {"train_loss": -10.6309814453125, "global_step": 160797, "epoch": 957} {"train_loss": -10.178909301757812, "global_step": 160798, "epoch": 957} {"train_loss": -10.772482872009277, "global_step": 160799, "epoch": 957} {"train_loss": -10.330320358276367, "global_step": 160800, "epoch": 957} {"train_loss": -10.547212600708008, "global_step": 160801, "epoch": 957} {"train_loss": -10.819565773010254, "global_step": 160802, "epoch": 957} {"train_loss": -10.303056716918945, "global_step": 160803, "epoch": 957} {"train_loss": -10.53227424621582, "global_step": 160804, "epoch": 957} {"train_loss": -10.823087692260742, "global_step": 160805, "epoch": 957} {"train_loss": -10.41141414642334, "global_step": 160806, "epoch": 957} {"train_loss": -10.71554183959961, "global_step": 160807, "epoch": 957} {"train_loss": -10.568851470947266, "global_step": 160808, "epoch": 957} {"train_loss": -10.58542251586914, "global_step": 160809, "epoch": 957} {"train_loss": -10.930573463439941, "global_step": 160810, "epoch": 957} {"train_loss": -10.317855834960938, "global_step": 160811, "epoch": 957} {"train_loss": -10.519484519958496, "global_step": 160812, "epoch": 957} {"train_loss": -10.783337593078613, "global_step": 160813, "epoch": 957} {"train_loss": -10.478578567504883, "global_step": 160814, "epoch": 957} {"train_loss": -10.66094970703125, "global_step": 160815, "epoch": 957} {"train_loss": -10.791333198547363, "global_step": 160816, "epoch": 957} {"train_loss": -10.618403434753418, "global_step": 160817, "epoch": 957} {"train_loss": -10.66850757598877, "global_step": 160818, "epoch": 957} {"train_loss": -10.811851501464844, "global_step": 160819, "epoch": 957} {"train_loss": -10.84807300567627, "global_step": 160820, "epoch": 957} {"train_loss": -10.648670196533203, "global_step": 160821, "epoch": 957} {"train_loss": -10.931395530700684, "global_step": 160822, "epoch": 957} {"train_loss": -10.975828170776367, "global_step": 160823, "epoch": 957} {"train_loss": -10.827677726745605, "global_step": 160824, "epoch": 957} {"train_loss": -10.988893508911133, "global_step": 160825, "epoch": 957} {"train_loss": -10.988667488098145, "global_step": 160826, "epoch": 957} {"train_loss": -10.98997688293457, "global_step": 160827, "epoch": 957} {"train_loss": -10.916330337524414, "global_step": 160828, "epoch": 957} {"train_loss": -11.111289978027344, "global_step": 160829, "epoch": 957} {"train_loss": -11.174092292785645, "global_step": 160830, "epoch": 957} {"train_loss": -11.038935661315918, "global_step": 160831, "epoch": 957} {"train_loss": -11.13385009765625, "global_step": 160832, "epoch": 957} {"train_loss": -11.127618789672852, "global_step": 160833, "epoch": 957} {"train_loss": -11.079009056091309, "global_step": 160834, "epoch": 957} {"train_loss": -10.997173309326172, "global_step": 160835, "epoch": 957} {"train_loss": -11.031509399414062, "global_step": 160836, "epoch": 957} {"train_loss": -10.953374862670898, "global_step": 160837, "epoch": 957} {"train_loss": -11.034371376037598, "global_step": 160838, "epoch": 957} {"train_loss": -10.852940559387207, "global_step": 160839, "epoch": 957} {"train_loss": -11.115379333496094, "global_step": 160840, "epoch": 957} {"train_loss": -10.996451377868652, "global_step": 160841, "epoch": 957} {"train_loss": -11.12364673614502, "global_step": 160842, "epoch": 957} {"train_loss": -10.873826026916504, "global_step": 160843, "epoch": 957} {"train_loss": -11.13862419128418, "global_step": 160844, "epoch": 957} {"train_loss": -10.888827323913574, "global_step": 160845, "epoch": 957} {"train_loss": -11.100896835327148, "global_step": 160846, "epoch": 957} {"train_loss": -11.120790481567383, "global_step": 160847, "epoch": 957} {"train_loss": -11.244829177856445, "global_step": 160848, "epoch": 957} {"train_loss": -10.913713455200195, "global_step": 160849, "epoch": 957} {"train_loss": -11.096484184265137, "global_step": 160850, "epoch": 957} {"train_loss": -11.006645202636719, "global_step": 160851, "epoch": 957} {"train_loss": -10.665224075317383, "global_step": 160852, "epoch": 957} {"train_loss": -9.64586067199707, "global_step": 160853, "epoch": 957} {"train_loss": -10.807790756225586, "global_step": 160854, "epoch": 957} {"train_loss": -10.323638916015625, "global_step": 160855, "epoch": 957} {"train_loss": -10.128984451293945, "global_step": 160856, "epoch": 957} {"train_loss": -9.192493438720703, "global_step": 160857, "epoch": 957} {"train_loss": -10.51180648803711, "global_step": 160858, "epoch": 957} {"train_loss": -9.733802795410156, "global_step": 160859, "epoch": 957} {"train_loss": -10.336771011352539, "global_step": 160860, "epoch": 957} {"train_loss": -9.56987476348877, "global_step": 160861, "epoch": 957} {"train_loss": -9.371901512145996, "global_step": 160862, "epoch": 957} {"train_loss": -10.924681663513184, "global_step": 160863, "epoch": 957} {"train_loss": -9.086028099060059, "global_step": 160864, "epoch": 957} {"train_loss": -10.00385856628418, "global_step": 160865, "epoch": 957} {"train_loss": -9.180084228515625, "global_step": 160866, "epoch": 957} {"train_loss": -9.410079956054688, "global_step": 160867, "epoch": 957} {"train_loss": -8.948135375976562, "global_step": 160868, "epoch": 957} {"train_loss": -9.676891326904297, "global_step": 160869, "epoch": 957} {"train_loss": -9.867865562438965, "global_step": 160870, "epoch": 957} {"train_loss": -8.5772705078125, "global_step": 160871, "epoch": 957} {"train_loss": -9.677806854248047, "global_step": 160872, "epoch": 957} {"train_loss": -9.564277648925781, "global_step": 160873, "epoch": 957} {"train_loss": -10.037607192993164, "global_step": 160874, "epoch": 957} {"train_loss": -9.707586288452148, "global_step": 160875, "epoch": 957} {"train_loss": -10.418545722961426, "global_step": 160876, "epoch": 957} {"train_loss": -9.488409042358398, "global_step": 160877, "epoch": 957} {"train_loss": -10.204926490783691, "global_step": 160878, "epoch": 957} {"train_loss": -10.03872299194336, "global_step": 160879, "epoch": 957} {"train_loss": -10.088597297668457, "global_step": 160880, "epoch": 957} {"train_loss": -10.217440605163574, "global_step": 160881, "epoch": 957} {"train_loss": -10.193132400512695, "global_step": 160882, "epoch": 957} {"train_loss": -10.351232528686523, "global_step": 160883, "epoch": 957} {"train_loss": -9.929847717285156, "global_step": 160884, "epoch": 957} {"train_loss": -9.985427856445312, "global_step": 160885, "epoch": 957} {"train_loss": -10.111608505249023, "global_step": 160886, "epoch": 957} {"train_loss": -10.064209938049316, "global_step": 160887, "epoch": 957} {"train_loss": -10.321632385253906, "global_step": 160888, "epoch": 957} {"train_loss": -9.927748680114746, "global_step": 160889, "epoch": 957} {"train_loss": -10.225919723510742, "global_step": 160890, "epoch": 957} {"train_loss": -10.090085983276367, "global_step": 160891, "epoch": 957} {"train_loss": -10.125308990478516, "global_step": 160892, "epoch": 957} {"train_loss": -10.284656524658203, "global_step": 160893, "epoch": 957} {"train_loss": -10.250993728637695, "global_step": 160894, "epoch": 957} {"train_loss": -10.421937942504883, "global_step": 160895, "epoch": 957} {"train_loss": -10.296270370483398, "global_step": 160896, "epoch": 957} {"train_loss": -10.48719310760498, "global_step": 160897, "epoch": 957} {"train_loss": -10.279367446899414, "global_step": 160898, "epoch": 957} {"train_loss": -10.646729469299316, "global_step": 160899, "epoch": 957} {"train_loss": -10.782774925231934, "global_step": 160900, "epoch": 957} {"train_loss": -10.658418655395508, "global_step": 160901, "epoch": 957} {"train_loss": -10.556215286254883, "global_step": 160902, "epoch": 957} {"train_loss": -10.590593338012695, "global_step": 160903, "epoch": 957} {"train_loss": -10.619560241699219, "global_step": 160904, "epoch": 957} {"train_loss": -10.577990531921387, "global_step": 160905, "epoch": 957} {"train_loss": -10.652128219604492, "global_step": 160906, "epoch": 957} {"train_loss": -10.651881217956543, "global_step": 160907, "epoch": 957} {"train_loss": -10.641739845275879, "global_step": 160908, "epoch": 957} {"train_loss": -10.749673843383789, "global_step": 160909, "epoch": 957} {"train_loss": -10.855204582214355, "global_step": 160910, "epoch": 957} {"train_loss": -10.835617065429688, "global_step": 160911, "epoch": 957} {"train_loss": -10.855672836303711, "global_step": 160912, "epoch": 957} {"train_loss": -11.016449928283691, "global_step": 160913, "epoch": 957} {"train_loss": -10.784343719482422, "global_step": 160914, "epoch": 957} {"train_loss": -10.923821449279785, "global_step": 160915, "epoch": 957} {"train_loss": -11.078994750976562, "global_step": 160916, "epoch": 957} {"train_loss": -11.17136001586914, "global_step": 160917, "epoch": 957} {"train_loss": -10.783122062683105, "global_step": 160918, "epoch": 957} {"train_loss": -11.027628898620605, "global_step": 160919, "epoch": 957} {"train_loss": -10.882346153259277, "global_step": 160920, "epoch": 957} {"train_loss": -10.883317947387695, "global_step": 160921, "epoch": 957} {"train_loss": -11.038768768310547, "global_step": 160922, "epoch": 957} {"train_loss": -11.146034240722656, "global_step": 160923, "epoch": 957} {"train_loss": -11.14371109008789, "global_step": 160924, "epoch": 957} {"train_loss": -11.13655948638916, "global_step": 160925, "epoch": 957} {"train_loss": -11.114009857177734, "global_step": 160926, "epoch": 957} {"train_loss": -11.114113807678223, "global_step": 160927, "epoch": 957} {"train_loss": -10.979702949523926, "global_step": 160928, "epoch": 957} {"train_loss": -11.070625305175781, "global_step": 160929, "epoch": 957} {"train_loss": -11.02646255493164, "global_step": 160930, "epoch": 957} {"train_loss": -11.110804557800293, "global_step": 160931, "epoch": 957} {"train_loss": -11.248258590698242, "global_step": 160932, "epoch": 957} {"train_loss": -10.796018600463867, "global_step": 160933, "epoch": 957} {"train_loss": -10.961465835571289, "global_step": 160934, "epoch": 957} {"train_loss": -10.814544677734375, "global_step": 160935, "epoch": 957} {"train_loss": -11.016931533813477, "global_step": 160936, "epoch": 957} {"train_loss": -11.251914978027344, "global_step": 160937, "epoch": 957} {"train_loss": -10.974956512451172, "global_step": 160938, "epoch": 957} {"train_loss": -11.030624389648438, "global_step": 160939, "epoch": 957} {"train_loss": -11.281471252441406, "global_step": 160940, "epoch": 957} {"train_loss": -10.947221755981445, "global_step": 160941, "epoch": 957} {"train_loss": -11.36859130859375, "global_step": 160942, "epoch": 957} {"train_loss": -10.540855367978414, "global_step": 160943, "epoch": 957, "val_loss": 235522.46875} {"train_loss": -11.341119766235352, "global_step": 160944, "epoch": 958} {"train_loss": -11.10222053527832, "global_step": 160945, "epoch": 958} {"train_loss": -11.180526733398438, "global_step": 160946, "epoch": 958} {"train_loss": -10.862205505371094, "global_step": 160947, "epoch": 958} {"train_loss": -11.353230476379395, "global_step": 160948, "epoch": 958} {"train_loss": -11.210793495178223, "global_step": 160949, "epoch": 958} {"train_loss": -11.051881790161133, "global_step": 160950, "epoch": 958} {"train_loss": -10.547795295715332, "global_step": 160951, "epoch": 958} {"train_loss": -11.19387435913086, "global_step": 160952, "epoch": 958} {"train_loss": -10.55581283569336, "global_step": 160953, "epoch": 958} {"train_loss": -10.92402172088623, "global_step": 160954, "epoch": 958} {"train_loss": -10.959375381469727, "global_step": 160955, "epoch": 958} {"train_loss": -10.96381664276123, "global_step": 160956, "epoch": 958} {"train_loss": -10.56710433959961, "global_step": 160957, "epoch": 958} {"train_loss": -10.873188018798828, "global_step": 160958, "epoch": 958} {"train_loss": -11.000007629394531, "global_step": 160959, "epoch": 958} {"train_loss": -11.071656227111816, "global_step": 160960, "epoch": 958} {"train_loss": -10.541252136230469, "global_step": 160961, "epoch": 958} {"train_loss": -10.829324722290039, "global_step": 160962, "epoch": 958} {"train_loss": -10.197731018066406, "global_step": 160963, "epoch": 958} {"train_loss": -10.35623550415039, "global_step": 160964, "epoch": 958} {"train_loss": -10.524805068969727, "global_step": 160965, "epoch": 958} {"train_loss": -10.350849151611328, "global_step": 160966, "epoch": 958} {"train_loss": -9.6357421875, "global_step": 160967, "epoch": 958} {"train_loss": -10.87083911895752, "global_step": 160968, "epoch": 958} {"train_loss": -9.57946491241455, "global_step": 160969, "epoch": 958} {"train_loss": -9.13441276550293, "global_step": 160970, "epoch": 958} {"train_loss": -10.278044700622559, "global_step": 160971, "epoch": 958} {"train_loss": -9.444456100463867, "global_step": 160972, "epoch": 958} {"train_loss": -10.317071914672852, "global_step": 160973, "epoch": 958} {"train_loss": -9.422601699829102, "global_step": 160974, "epoch": 958} {"train_loss": -10.245360374450684, "global_step": 160975, "epoch": 958} {"train_loss": -10.355779647827148, "global_step": 160976, "epoch": 958} {"train_loss": -10.438840866088867, "global_step": 160977, "epoch": 958} {"train_loss": -9.947967529296875, "global_step": 160978, "epoch": 958} {"train_loss": -10.513229370117188, "global_step": 160979, "epoch": 958} {"train_loss": -10.366114616394043, "global_step": 160980, "epoch": 958} {"train_loss": -10.546091079711914, "global_step": 160981, "epoch": 958} {"train_loss": -10.744826316833496, "global_step": 160982, "epoch": 958} {"train_loss": -10.621885299682617, "global_step": 160983, "epoch": 958} {"train_loss": -10.475530624389648, "global_step": 160984, "epoch": 958} {"train_loss": -10.712300300598145, "global_step": 160985, "epoch": 958} {"train_loss": -10.29251480102539, "global_step": 160986, "epoch": 958} {"train_loss": -10.271968841552734, "global_step": 160987, "epoch": 958} {"train_loss": -10.275675773620605, "global_step": 160988, "epoch": 958} {"train_loss": -10.457721710205078, "global_step": 160989, "epoch": 958} {"train_loss": -10.20928955078125, "global_step": 160990, "epoch": 958} {"train_loss": -10.686952590942383, "global_step": 160991, "epoch": 958} {"train_loss": -9.968082427978516, "global_step": 160992, "epoch": 958} {"train_loss": -10.612714767456055, "global_step": 160993, "epoch": 958} {"train_loss": -10.669950485229492, "global_step": 160994, "epoch": 958} {"train_loss": -10.498348236083984, "global_step": 160995, "epoch": 958} {"train_loss": -10.532743453979492, "global_step": 160996, "epoch": 958} {"train_loss": -10.750564575195312, "global_step": 160997, "epoch": 958} {"train_loss": -10.61311149597168, "global_step": 160998, "epoch": 958} {"train_loss": -10.835755348205566, "global_step": 160999, "epoch": 958} {"train_loss": -10.706239700317383, "global_step": 161000, "epoch": 958} {"train_loss": -10.695674896240234, "global_step": 161001, "epoch": 958} {"train_loss": -10.849023818969727, "global_step": 161002, "epoch": 958} {"train_loss": -10.853311538696289, "global_step": 161003, "epoch": 958} {"train_loss": -10.93892765045166, "global_step": 161004, "epoch": 958} {"train_loss": -10.71581745147705, "global_step": 161005, "epoch": 958} {"train_loss": -11.094673156738281, "global_step": 161006, "epoch": 958} {"train_loss": -10.850950241088867, "global_step": 161007, "epoch": 958} {"train_loss": -10.973072052001953, "global_step": 161008, "epoch": 958} {"train_loss": -11.027864456176758, "global_step": 161009, "epoch": 958} {"train_loss": -11.004034042358398, "global_step": 161010, "epoch": 958} {"train_loss": -11.082266807556152, "global_step": 161011, "epoch": 958} {"train_loss": -11.114297866821289, "global_step": 161012, "epoch": 958} {"train_loss": -11.082290649414062, "global_step": 161013, "epoch": 958} {"train_loss": -11.231487274169922, "global_step": 161014, "epoch": 958} {"train_loss": -11.226558685302734, "global_step": 161015, "epoch": 958} {"train_loss": -11.191581726074219, "global_step": 161016, "epoch": 958} {"train_loss": -10.93704605102539, "global_step": 161017, "epoch": 958} {"train_loss": -10.904772758483887, "global_step": 161018, "epoch": 958} {"train_loss": -11.176187515258789, "global_step": 161019, "epoch": 958} {"train_loss": -10.905117988586426, "global_step": 161020, "epoch": 958} {"train_loss": -11.199776649475098, "global_step": 161021, "epoch": 958} {"train_loss": -11.026331901550293, "global_step": 161022, "epoch": 958} {"train_loss": -11.131683349609375, "global_step": 161023, "epoch": 958} {"train_loss": -10.766658782958984, "global_step": 161024, "epoch": 958} {"train_loss": -11.207674026489258, "global_step": 161025, "epoch": 958} {"train_loss": -11.232369422912598, "global_step": 161026, "epoch": 958} {"train_loss": -10.999940872192383, "global_step": 161027, "epoch": 958} {"train_loss": -10.84672737121582, "global_step": 161028, "epoch": 958} {"train_loss": -11.018792152404785, "global_step": 161029, "epoch": 958} {"train_loss": -10.989476203918457, "global_step": 161030, "epoch": 958} {"train_loss": -11.29745864868164, "global_step": 161031, "epoch": 958} {"train_loss": -11.007551193237305, "global_step": 161032, "epoch": 958} {"train_loss": -11.267682075500488, "global_step": 161033, "epoch": 958} {"train_loss": -10.723483085632324, "global_step": 161034, "epoch": 958} {"train_loss": -11.294574737548828, "global_step": 161035, "epoch": 958} {"train_loss": -11.052970886230469, "global_step": 161036, "epoch": 958} {"train_loss": -11.443735122680664, "global_step": 161037, "epoch": 958} {"train_loss": -10.725831985473633, "global_step": 161038, "epoch": 958} {"train_loss": -11.18693733215332, "global_step": 161039, "epoch": 958} {"train_loss": -11.178284645080566, "global_step": 161040, "epoch": 958} {"train_loss": -11.344676971435547, "global_step": 161041, "epoch": 958} {"train_loss": -11.237221717834473, "global_step": 161042, "epoch": 958} {"train_loss": -11.284818649291992, "global_step": 161043, "epoch": 958} {"train_loss": -11.26984977722168, "global_step": 161044, "epoch": 958} {"train_loss": -11.130331039428711, "global_step": 161045, "epoch": 958} {"train_loss": -10.419137001037598, "global_step": 161046, "epoch": 958} {"train_loss": -11.257640838623047, "global_step": 161047, "epoch": 958} {"train_loss": -10.749931335449219, "global_step": 161048, "epoch": 958} {"train_loss": -11.031123161315918, "global_step": 161049, "epoch": 958} {"train_loss": -10.912564277648926, "global_step": 161050, "epoch": 958} {"train_loss": -10.974504470825195, "global_step": 161051, "epoch": 958} {"train_loss": -10.975372314453125, "global_step": 161052, "epoch": 958} {"train_loss": -10.84307861328125, "global_step": 161053, "epoch": 958} {"train_loss": -10.938849449157715, "global_step": 161054, "epoch": 958} {"train_loss": -11.137920379638672, "global_step": 161055, "epoch": 958} {"train_loss": -10.952417373657227, "global_step": 161056, "epoch": 958} {"train_loss": -10.7939453125, "global_step": 161057, "epoch": 958} {"train_loss": -11.3089017868042, "global_step": 161058, "epoch": 958} {"train_loss": -11.050086975097656, "global_step": 161059, "epoch": 958} {"train_loss": -11.241372108459473, "global_step": 161060, "epoch": 958} {"train_loss": -11.301024436950684, "global_step": 161061, "epoch": 958} {"train_loss": -10.919061660766602, "global_step": 161062, "epoch": 958} {"train_loss": -10.881922721862793, "global_step": 161063, "epoch": 958} {"train_loss": -11.298090934753418, "global_step": 161064, "epoch": 958} {"train_loss": -11.081645965576172, "global_step": 161065, "epoch": 958} {"train_loss": -11.12730884552002, "global_step": 161066, "epoch": 958} {"train_loss": -10.817699432373047, "global_step": 161067, "epoch": 958} {"train_loss": -10.912419319152832, "global_step": 161068, "epoch": 958} {"train_loss": -10.785085678100586, "global_step": 161069, "epoch": 958} {"train_loss": -10.68114948272705, "global_step": 161070, "epoch": 958} {"train_loss": -10.375125885009766, "global_step": 161071, "epoch": 958} {"train_loss": -10.978967666625977, "global_step": 161072, "epoch": 958} {"train_loss": -10.198667526245117, "global_step": 161073, "epoch": 958} {"train_loss": -10.617416381835938, "global_step": 161074, "epoch": 958} {"train_loss": -10.709620475769043, "global_step": 161075, "epoch": 958} {"train_loss": -10.820737838745117, "global_step": 161076, "epoch": 958} {"train_loss": -10.887052536010742, "global_step": 161077, "epoch": 958} {"train_loss": -10.20570182800293, "global_step": 161078, "epoch": 958} {"train_loss": -10.51349925994873, "global_step": 161079, "epoch": 958} {"train_loss": -9.867792129516602, "global_step": 161080, "epoch": 958} {"train_loss": -9.860025405883789, "global_step": 161081, "epoch": 958} {"train_loss": -10.797380447387695, "global_step": 161082, "epoch": 958} {"train_loss": -9.993903160095215, "global_step": 161083, "epoch": 958} {"train_loss": -10.346382141113281, "global_step": 161084, "epoch": 958} {"train_loss": -11.022598266601562, "global_step": 161085, "epoch": 958} {"train_loss": -10.418017387390137, "global_step": 161086, "epoch": 958} {"train_loss": -10.523950576782227, "global_step": 161087, "epoch": 958} {"train_loss": -10.521028518676758, "global_step": 161088, "epoch": 958} {"train_loss": -10.262540817260742, "global_step": 161089, "epoch": 958} {"train_loss": -10.698080062866211, "global_step": 161090, "epoch": 958} {"train_loss": -10.508750915527344, "global_step": 161091, "epoch": 958} {"train_loss": -10.01876449584961, "global_step": 161092, "epoch": 958} {"train_loss": -10.876947402954102, "global_step": 161093, "epoch": 958} {"train_loss": -10.376874923706055, "global_step": 161094, "epoch": 958} {"train_loss": -10.806846618652344, "global_step": 161095, "epoch": 958} {"train_loss": -10.758940696716309, "global_step": 161096, "epoch": 958} {"train_loss": -10.640155792236328, "global_step": 161097, "epoch": 958} {"train_loss": -10.678680419921875, "global_step": 161098, "epoch": 958} {"train_loss": -10.829207420349121, "global_step": 161099, "epoch": 958} {"train_loss": -10.629432678222656, "global_step": 161100, "epoch": 958} {"train_loss": -10.747056007385254, "global_step": 161101, "epoch": 958} {"train_loss": -10.66650390625, "global_step": 161102, "epoch": 958} {"train_loss": -11.007925033569336, "global_step": 161103, "epoch": 958} {"train_loss": -10.652366638183594, "global_step": 161104, "epoch": 958} {"train_loss": -10.888324737548828, "global_step": 161105, "epoch": 958} {"train_loss": -10.484214782714844, "global_step": 161106, "epoch": 958} {"train_loss": -10.616405487060547, "global_step": 161107, "epoch": 958} {"train_loss": -10.557814598083496, "global_step": 161108, "epoch": 958} {"train_loss": -10.731094360351562, "global_step": 161109, "epoch": 958} {"train_loss": -10.91494369506836, "global_step": 161110, "epoch": 958} {"train_loss": -10.751577167283921, "global_step": 161111, "epoch": 958, "val_loss": 233736.296875} {"train_loss": -10.787434577941895, "global_step": 161112, "epoch": 959} {"train_loss": -10.877056121826172, "global_step": 161113, "epoch": 959} {"train_loss": -10.403509140014648, "global_step": 161114, "epoch": 959} {"train_loss": -11.09647274017334, "global_step": 161115, "epoch": 959} {"train_loss": -10.949597358703613, "global_step": 161116, "epoch": 959} {"train_loss": -10.750171661376953, "global_step": 161117, "epoch": 959} {"train_loss": -10.890329360961914, "global_step": 161118, "epoch": 959} {"train_loss": -10.849915504455566, "global_step": 161119, "epoch": 959} {"train_loss": -10.761659622192383, "global_step": 161120, "epoch": 959} {"train_loss": -10.773981094360352, "global_step": 161121, "epoch": 959} {"train_loss": -10.94828987121582, "global_step": 161122, "epoch": 959} {"train_loss": -11.03654670715332, "global_step": 161123, "epoch": 959} {"train_loss": -10.795244216918945, "global_step": 161124, "epoch": 959} {"train_loss": -11.070024490356445, "global_step": 161125, "epoch": 959} {"train_loss": -10.934701919555664, "global_step": 161126, "epoch": 959} {"train_loss": -11.13399887084961, "global_step": 161127, "epoch": 959} {"train_loss": -10.89182186126709, "global_step": 161128, "epoch": 959} {"train_loss": -11.097885131835938, "global_step": 161129, "epoch": 959} {"train_loss": -11.185445785522461, "global_step": 161130, "epoch": 959} {"train_loss": -11.116243362426758, "global_step": 161131, "epoch": 959} {"train_loss": -11.41771125793457, "global_step": 161132, "epoch": 959} {"train_loss": -10.984296798706055, "global_step": 161133, "epoch": 959} {"train_loss": -11.347051620483398, "global_step": 161134, "epoch": 959} {"train_loss": -11.279773712158203, "global_step": 161135, "epoch": 959} {"train_loss": -11.193955421447754, "global_step": 161136, "epoch": 959} {"train_loss": -11.219625473022461, "global_step": 161137, "epoch": 959} {"train_loss": -11.06314468383789, "global_step": 161138, "epoch": 959} {"train_loss": -11.278360366821289, "global_step": 161139, "epoch": 959} {"train_loss": -10.933280944824219, "global_step": 161140, "epoch": 959} {"train_loss": -11.190563201904297, "global_step": 161141, "epoch": 959} {"train_loss": -11.245370864868164, "global_step": 161142, "epoch": 959} {"train_loss": -10.707381248474121, "global_step": 161143, "epoch": 959} {"train_loss": -10.883060455322266, "global_step": 161144, "epoch": 959} {"train_loss": -11.001459121704102, "global_step": 161145, "epoch": 959} {"train_loss": -10.888325691223145, "global_step": 161146, "epoch": 959} {"train_loss": -11.325540542602539, "global_step": 161147, "epoch": 959} {"train_loss": -10.531980514526367, "global_step": 161148, "epoch": 959} {"train_loss": -9.654792785644531, "global_step": 161149, "epoch": 959} {"train_loss": -11.183449745178223, "global_step": 161150, "epoch": 959} {"train_loss": -10.646515846252441, "global_step": 161151, "epoch": 959} {"train_loss": -10.744927406311035, "global_step": 161152, "epoch": 959} {"train_loss": -10.99954891204834, "global_step": 161153, "epoch": 959} {"train_loss": -10.405264854431152, "global_step": 161154, "epoch": 959} {"train_loss": -10.90068244934082, "global_step": 161155, "epoch": 959} {"train_loss": -10.539494514465332, "global_step": 161156, "epoch": 959} {"train_loss": -9.73288631439209, "global_step": 161157, "epoch": 959} {"train_loss": -10.828274726867676, "global_step": 161158, "epoch": 959} {"train_loss": -10.118734359741211, "global_step": 161159, "epoch": 959} {"train_loss": -9.891138076782227, "global_step": 161160, "epoch": 959} {"train_loss": -10.188013076782227, "global_step": 161161, "epoch": 959} {"train_loss": -9.100912094116211, "global_step": 161162, "epoch": 959} {"train_loss": -9.909101486206055, "global_step": 161163, "epoch": 959} {"train_loss": -9.362564086914062, "global_step": 161164, "epoch": 959} {"train_loss": -9.71639347076416, "global_step": 161165, "epoch": 959} {"train_loss": -10.263059616088867, "global_step": 161166, "epoch": 959} {"train_loss": -10.408211708068848, "global_step": 161167, "epoch": 959} {"train_loss": -9.78526496887207, "global_step": 161168, "epoch": 959} {"train_loss": -10.658954620361328, "global_step": 161169, "epoch": 959} {"train_loss": -10.387649536132812, "global_step": 161170, "epoch": 959} {"train_loss": -10.62969970703125, "global_step": 161171, "epoch": 959} {"train_loss": -10.014790534973145, "global_step": 161172, "epoch": 959} {"train_loss": -10.485515594482422, "global_step": 161173, "epoch": 959} {"train_loss": -10.526158332824707, "global_step": 161174, "epoch": 959} {"train_loss": -10.471004486083984, "global_step": 161175, "epoch": 959} {"train_loss": -10.68110466003418, "global_step": 161176, "epoch": 959} {"train_loss": -10.66258716583252, "global_step": 161177, "epoch": 959} {"train_loss": -10.668667793273926, "global_step": 161178, "epoch": 959} {"train_loss": -10.924701690673828, "global_step": 161179, "epoch": 959} {"train_loss": -10.813777923583984, "global_step": 161180, "epoch": 959} {"train_loss": -10.632209777832031, "global_step": 161181, "epoch": 959} {"train_loss": -10.879496574401855, "global_step": 161182, "epoch": 959} {"train_loss": -10.901905059814453, "global_step": 161183, "epoch": 959} {"train_loss": -10.897974967956543, "global_step": 161184, "epoch": 959} {"train_loss": -10.86131763458252, "global_step": 161185, "epoch": 959} {"train_loss": -10.645281791687012, "global_step": 161186, "epoch": 959} {"train_loss": -10.736804962158203, "global_step": 161187, "epoch": 959} {"train_loss": -10.95684814453125, "global_step": 161188, "epoch": 959} {"train_loss": -10.893974304199219, "global_step": 161189, "epoch": 959} {"train_loss": -10.870527267456055, "global_step": 161190, "epoch": 959} {"train_loss": -10.792202949523926, "global_step": 161191, "epoch": 959} {"train_loss": -10.8270263671875, "global_step": 161192, "epoch": 959} {"train_loss": -10.931337356567383, "global_step": 161193, "epoch": 959} {"train_loss": -10.869544982910156, "global_step": 161194, "epoch": 959} {"train_loss": -11.065608024597168, "global_step": 161195, "epoch": 959} {"train_loss": -11.051941871643066, "global_step": 161196, "epoch": 959} {"train_loss": -10.927579879760742, "global_step": 161197, "epoch": 959} {"train_loss": -10.850435256958008, "global_step": 161198, "epoch": 959} {"train_loss": -10.966943740844727, "global_step": 161199, "epoch": 959} {"train_loss": -11.056715965270996, "global_step": 161200, "epoch": 959} {"train_loss": -11.114758491516113, "global_step": 161201, "epoch": 959} {"train_loss": -11.135303497314453, "global_step": 161202, "epoch": 959} {"train_loss": -11.06879997253418, "global_step": 161203, "epoch": 959} {"train_loss": -10.999895095825195, "global_step": 161204, "epoch": 959} {"train_loss": -11.176630020141602, "global_step": 161205, "epoch": 959} {"train_loss": -11.138097763061523, "global_step": 161206, "epoch": 959} {"train_loss": -11.225303649902344, "global_step": 161207, "epoch": 959} {"train_loss": -11.501005172729492, "global_step": 161208, "epoch": 959} {"train_loss": -11.345134735107422, "global_step": 161209, "epoch": 959} {"train_loss": -11.250236511230469, "global_step": 161210, "epoch": 959} {"train_loss": -11.06823444366455, "global_step": 161211, "epoch": 959} {"train_loss": -11.290655136108398, "global_step": 161212, "epoch": 959} {"train_loss": -11.105691909790039, "global_step": 161213, "epoch": 959} {"train_loss": -11.296138763427734, "global_step": 161214, "epoch": 959} {"train_loss": -11.350902557373047, "global_step": 161215, "epoch": 959} {"train_loss": -11.043237686157227, "global_step": 161216, "epoch": 959} {"train_loss": -11.152462005615234, "global_step": 161217, "epoch": 959} {"train_loss": -10.939584732055664, "global_step": 161218, "epoch": 959} {"train_loss": -11.32559871673584, "global_step": 161219, "epoch": 959} {"train_loss": -11.092100143432617, "global_step": 161220, "epoch": 959} {"train_loss": -10.93758773803711, "global_step": 161221, "epoch": 959} {"train_loss": -10.863694190979004, "global_step": 161222, "epoch": 959} {"train_loss": -11.18890380859375, "global_step": 161223, "epoch": 959} {"train_loss": -11.012619018554688, "global_step": 161224, "epoch": 959} {"train_loss": -10.684783935546875, "global_step": 161225, "epoch": 959} {"train_loss": -11.09925651550293, "global_step": 161226, "epoch": 959} {"train_loss": -11.19210433959961, "global_step": 161227, "epoch": 959} {"train_loss": -10.850178718566895, "global_step": 161228, "epoch": 959} {"train_loss": -10.240970611572266, "global_step": 161229, "epoch": 959} {"train_loss": -11.117355346679688, "global_step": 161230, "epoch": 959} {"train_loss": -11.09189510345459, "global_step": 161231, "epoch": 959} {"train_loss": -9.780576705932617, "global_step": 161232, "epoch": 959} {"train_loss": -10.856252670288086, "global_step": 161233, "epoch": 959} {"train_loss": -10.954122543334961, "global_step": 161234, "epoch": 959} {"train_loss": -9.828043937683105, "global_step": 161235, "epoch": 959} {"train_loss": -10.086874961853027, "global_step": 161236, "epoch": 959} {"train_loss": -10.995555877685547, "global_step": 161237, "epoch": 959} {"train_loss": -10.530278205871582, "global_step": 161238, "epoch": 959} {"train_loss": -10.565013885498047, "global_step": 161239, "epoch": 959} {"train_loss": -10.60293197631836, "global_step": 161240, "epoch": 959} {"train_loss": -10.455450057983398, "global_step": 161241, "epoch": 959} {"train_loss": -10.382146835327148, "global_step": 161242, "epoch": 959} {"train_loss": -10.515436172485352, "global_step": 161243, "epoch": 959} {"train_loss": -10.395746231079102, "global_step": 161244, "epoch": 959} {"train_loss": -10.636493682861328, "global_step": 161245, "epoch": 959} {"train_loss": -9.69675350189209, "global_step": 161246, "epoch": 959} {"train_loss": -10.862686157226562, "global_step": 161247, "epoch": 959} {"train_loss": -9.806657791137695, "global_step": 161248, "epoch": 959} {"train_loss": -10.300814628601074, "global_step": 161249, "epoch": 959} {"train_loss": -9.048540115356445, "global_step": 161250, "epoch": 959} {"train_loss": -10.404173851013184, "global_step": 161251, "epoch": 959} {"train_loss": -9.081753730773926, "global_step": 161252, "epoch": 959} {"train_loss": -10.615065574645996, "global_step": 161253, "epoch": 959} {"train_loss": -9.26717758178711, "global_step": 161254, "epoch": 959} {"train_loss": -9.981670379638672, "global_step": 161255, "epoch": 959} {"train_loss": -9.479917526245117, "global_step": 161256, "epoch": 959} {"train_loss": -9.949675559997559, "global_step": 161257, "epoch": 959} {"train_loss": -9.927433013916016, "global_step": 161258, "epoch": 959} {"train_loss": -9.767704010009766, "global_step": 161259, "epoch": 959} {"train_loss": -9.873144149780273, "global_step": 161260, "epoch": 959} {"train_loss": -9.704160690307617, "global_step": 161261, "epoch": 959} {"train_loss": -10.029619216918945, "global_step": 161262, "epoch": 959} {"train_loss": -10.192602157592773, "global_step": 161263, "epoch": 959} {"train_loss": -9.875417709350586, "global_step": 161264, "epoch": 959} {"train_loss": -10.468199729919434, "global_step": 161265, "epoch": 959} {"train_loss": -10.191719055175781, "global_step": 161266, "epoch": 959} {"train_loss": -10.548868179321289, "global_step": 161267, "epoch": 959} {"train_loss": -10.27078628540039, "global_step": 161268, "epoch": 959} {"train_loss": -10.20942497253418, "global_step": 161269, "epoch": 959} {"train_loss": -10.477986335754395, "global_step": 161270, "epoch": 959} {"train_loss": -10.00679874420166, "global_step": 161271, "epoch": 959} {"train_loss": -10.64747428894043, "global_step": 161272, "epoch": 959} {"train_loss": -10.000494956970215, "global_step": 161273, "epoch": 959} {"train_loss": -10.175491333007812, "global_step": 161274, "epoch": 959} {"train_loss": -10.835409164428711, "global_step": 161275, "epoch": 959} {"train_loss": -10.031455993652344, "global_step": 161276, "epoch": 959} {"train_loss": -10.70746898651123, "global_step": 161277, "epoch": 959} {"train_loss": -10.468544006347656, "global_step": 161278, "epoch": 959} {"train_loss": -10.650635407084511, "global_step": 161279, "epoch": 959, "val_loss": 238061.796875} {"train_loss": -10.548989295959473, "global_step": 161280, "epoch": 960} {"train_loss": -10.384669303894043, "global_step": 161281, "epoch": 960} {"train_loss": -10.60949420928955, "global_step": 161282, "epoch": 960} {"train_loss": -10.612302780151367, "global_step": 161283, "epoch": 960} {"train_loss": -10.387791633605957, "global_step": 161284, "epoch": 960} {"train_loss": -10.749787330627441, "global_step": 161285, "epoch": 960} {"train_loss": -10.551931381225586, "global_step": 161286, "epoch": 960} {"train_loss": -10.78907299041748, "global_step": 161287, "epoch": 960} {"train_loss": -10.84532356262207, "global_step": 161288, "epoch": 960} {"train_loss": -10.697331428527832, "global_step": 161289, "epoch": 960} {"train_loss": -10.68162727355957, "global_step": 161290, "epoch": 960} {"train_loss": -11.031536102294922, "global_step": 161291, "epoch": 960} {"train_loss": -10.958669662475586, "global_step": 161292, "epoch": 960} {"train_loss": -10.874686241149902, "global_step": 161293, "epoch": 960} {"train_loss": -10.821292877197266, "global_step": 161294, "epoch": 960} {"train_loss": -10.854169845581055, "global_step": 161295, "epoch": 960} {"train_loss": -10.884315490722656, "global_step": 161296, "epoch": 960} {"train_loss": -10.932149887084961, "global_step": 161297, "epoch": 960} {"train_loss": -11.125547409057617, "global_step": 161298, "epoch": 960} {"train_loss": -10.95524787902832, "global_step": 161299, "epoch": 960} {"train_loss": -11.08868408203125, "global_step": 161300, "epoch": 960} {"train_loss": -11.013697624206543, "global_step": 161301, "epoch": 960} {"train_loss": -11.050732612609863, "global_step": 161302, "epoch": 960} {"train_loss": -10.892595291137695, "global_step": 161303, "epoch": 960} {"train_loss": -11.082572937011719, "global_step": 161304, "epoch": 960} {"train_loss": -10.981760025024414, "global_step": 161305, "epoch": 960} {"train_loss": -11.089515686035156, "global_step": 161306, "epoch": 960} {"train_loss": -11.1424560546875, "global_step": 161307, "epoch": 960} {"train_loss": -10.929300308227539, "global_step": 161308, "epoch": 960} {"train_loss": -11.096430778503418, "global_step": 161309, "epoch": 960} {"train_loss": -11.030855178833008, "global_step": 161310, "epoch": 960} {"train_loss": -11.016158103942871, "global_step": 161311, "epoch": 960} {"train_loss": -11.173069953918457, "global_step": 161312, "epoch": 960} {"train_loss": -11.19126033782959, "global_step": 161313, "epoch": 960} {"train_loss": -10.977399826049805, "global_step": 161314, "epoch": 960} {"train_loss": -11.132040023803711, "global_step": 161315, "epoch": 960} {"train_loss": -11.043754577636719, "global_step": 161316, "epoch": 960} {"train_loss": -11.293120384216309, "global_step": 161317, "epoch": 960} {"train_loss": -11.088029861450195, "global_step": 161318, "epoch": 960} {"train_loss": -11.444228172302246, "global_step": 161319, "epoch": 960} {"train_loss": -11.35097885131836, "global_step": 161320, "epoch": 960} {"train_loss": -11.011906623840332, "global_step": 161321, "epoch": 960} {"train_loss": -11.020606994628906, "global_step": 161322, "epoch": 960} {"train_loss": -11.226147651672363, "global_step": 161323, "epoch": 960} {"train_loss": -11.137380599975586, "global_step": 161324, "epoch": 960} {"train_loss": -11.085325241088867, "global_step": 161325, "epoch": 960} {"train_loss": -11.010687828063965, "global_step": 161326, "epoch": 960} {"train_loss": -11.366594314575195, "global_step": 161327, "epoch": 960} {"train_loss": -10.971892356872559, "global_step": 161328, "epoch": 960} {"train_loss": -11.22562313079834, "global_step": 161329, "epoch": 960} {"train_loss": -11.353507995605469, "global_step": 161330, "epoch": 960} {"train_loss": -11.135677337646484, "global_step": 161331, "epoch": 960} {"train_loss": -11.230436325073242, "global_step": 161332, "epoch": 960} {"train_loss": -11.493772506713867, "global_step": 161333, "epoch": 960} {"train_loss": -11.450331687927246, "global_step": 161334, "epoch": 960} {"train_loss": -11.228761672973633, "global_step": 161335, "epoch": 960} {"train_loss": -11.015094757080078, "global_step": 161336, "epoch": 960} {"train_loss": -11.086042404174805, "global_step": 161337, "epoch": 960} {"train_loss": -11.131643295288086, "global_step": 161338, "epoch": 960} {"train_loss": -11.0999174118042, "global_step": 161339, "epoch": 960} {"train_loss": -10.28261661529541, "global_step": 161340, "epoch": 960} {"train_loss": -10.51817512512207, "global_step": 161341, "epoch": 960} {"train_loss": -11.013884544372559, "global_step": 161342, "epoch": 960} {"train_loss": -10.296815872192383, "global_step": 161343, "epoch": 960} {"train_loss": -11.12728500366211, "global_step": 161344, "epoch": 960} {"train_loss": -10.836090087890625, "global_step": 161345, "epoch": 960} {"train_loss": -10.815628051757812, "global_step": 161346, "epoch": 960} {"train_loss": -10.67324161529541, "global_step": 161347, "epoch": 960} {"train_loss": -10.893804550170898, "global_step": 161348, "epoch": 960} {"train_loss": -9.86575698852539, "global_step": 161349, "epoch": 960} {"train_loss": -10.15185832977295, "global_step": 161350, "epoch": 960} {"train_loss": -10.284425735473633, "global_step": 161351, "epoch": 960} {"train_loss": -9.89785099029541, "global_step": 161352, "epoch": 960} {"train_loss": -10.616228103637695, "global_step": 161353, "epoch": 960} {"train_loss": -10.574540138244629, "global_step": 161354, "epoch": 960} {"train_loss": -10.397054672241211, "global_step": 161355, "epoch": 960} {"train_loss": -10.237676620483398, "global_step": 161356, "epoch": 960} {"train_loss": -10.568999290466309, "global_step": 161357, "epoch": 960} {"train_loss": -10.541043281555176, "global_step": 161358, "epoch": 960} {"train_loss": -10.567815780639648, "global_step": 161359, "epoch": 960} {"train_loss": -10.399046897888184, "global_step": 161360, "epoch": 960} {"train_loss": -10.229708671569824, "global_step": 161361, "epoch": 960} {"train_loss": -10.634364128112793, "global_step": 161362, "epoch": 960} {"train_loss": -10.602925300598145, "global_step": 161363, "epoch": 960} {"train_loss": -10.65118408203125, "global_step": 161364, "epoch": 960} {"train_loss": -10.771592140197754, "global_step": 161365, "epoch": 960} {"train_loss": -10.37629222869873, "global_step": 161366, "epoch": 960} {"train_loss": -10.788530349731445, "global_step": 161367, "epoch": 960} {"train_loss": -9.933952331542969, "global_step": 161368, "epoch": 960} {"train_loss": -10.828841209411621, "global_step": 161369, "epoch": 960} {"train_loss": -9.22302532196045, "global_step": 161370, "epoch": 960} {"train_loss": -10.223417282104492, "global_step": 161371, "epoch": 960} {"train_loss": -9.940996170043945, "global_step": 161372, "epoch": 960} {"train_loss": -10.572802543640137, "global_step": 161373, "epoch": 960} {"train_loss": -10.014810562133789, "global_step": 161374, "epoch": 960} {"train_loss": -10.506772994995117, "global_step": 161375, "epoch": 960} {"train_loss": -10.131407737731934, "global_step": 161376, "epoch": 960} {"train_loss": -10.306785583496094, "global_step": 161377, "epoch": 960} {"train_loss": -10.435514450073242, "global_step": 161378, "epoch": 960} {"train_loss": -9.978227615356445, "global_step": 161379, "epoch": 960} {"train_loss": -10.53851318359375, "global_step": 161380, "epoch": 960} {"train_loss": -10.256200790405273, "global_step": 161381, "epoch": 960} {"train_loss": -10.778425216674805, "global_step": 161382, "epoch": 960} {"train_loss": -10.21197509765625, "global_step": 161383, "epoch": 960} {"train_loss": -10.322956085205078, "global_step": 161384, "epoch": 960} {"train_loss": -10.265989303588867, "global_step": 161385, "epoch": 960} {"train_loss": -10.7716703414917, "global_step": 161386, "epoch": 960} {"train_loss": -10.163217544555664, "global_step": 161387, "epoch": 960} {"train_loss": -10.516679763793945, "global_step": 161388, "epoch": 960} {"train_loss": -10.636643409729004, "global_step": 161389, "epoch": 960} {"train_loss": -10.431453704833984, "global_step": 161390, "epoch": 960} {"train_loss": -10.536447525024414, "global_step": 161391, "epoch": 960} {"train_loss": -10.549053192138672, "global_step": 161392, "epoch": 960} {"train_loss": -10.441155433654785, "global_step": 161393, "epoch": 960} {"train_loss": -10.508418083190918, "global_step": 161394, "epoch": 960} {"train_loss": -10.804950714111328, "global_step": 161395, "epoch": 960} {"train_loss": -11.016294479370117, "global_step": 161396, "epoch": 960} {"train_loss": -10.6768798828125, "global_step": 161397, "epoch": 960} {"train_loss": -10.910160064697266, "global_step": 161398, "epoch": 960} {"train_loss": -10.79206371307373, "global_step": 161399, "epoch": 960} {"train_loss": -10.651657104492188, "global_step": 161400, "epoch": 960} {"train_loss": -10.731705665588379, "global_step": 161401, "epoch": 960} {"train_loss": -10.689176559448242, "global_step": 161402, "epoch": 960} {"train_loss": -10.89827823638916, "global_step": 161403, "epoch": 960} {"train_loss": -10.640142440795898, "global_step": 161404, "epoch": 960} {"train_loss": -10.88962173461914, "global_step": 161405, "epoch": 960} {"train_loss": -10.967948913574219, "global_step": 161406, "epoch": 960} {"train_loss": -10.973846435546875, "global_step": 161407, "epoch": 960} {"train_loss": -10.7565279006958, "global_step": 161408, "epoch": 960} {"train_loss": -10.647665023803711, "global_step": 161409, "epoch": 960} {"train_loss": -10.917604446411133, "global_step": 161410, "epoch": 960} {"train_loss": -11.039660453796387, "global_step": 161411, "epoch": 960} {"train_loss": -10.837970733642578, "global_step": 161412, "epoch": 960} {"train_loss": -10.938375473022461, "global_step": 161413, "epoch": 960} {"train_loss": -10.792803764343262, "global_step": 161414, "epoch": 960} {"train_loss": -10.99562931060791, "global_step": 161415, "epoch": 960} {"train_loss": -11.090946197509766, "global_step": 161416, "epoch": 960} {"train_loss": -10.923933982849121, "global_step": 161417, "epoch": 960} {"train_loss": -10.82418441772461, "global_step": 161418, "epoch": 960} {"train_loss": -10.870664596557617, "global_step": 161419, "epoch": 960} {"train_loss": -10.997900009155273, "global_step": 161420, "epoch": 960} {"train_loss": -10.762985229492188, "global_step": 161421, "epoch": 960} {"train_loss": -10.950695037841797, "global_step": 161422, "epoch": 960} {"train_loss": -10.95295524597168, "global_step": 161423, "epoch": 960} {"train_loss": -11.084321975708008, "global_step": 161424, "epoch": 960} {"train_loss": -10.998452186584473, "global_step": 161425, "epoch": 960} {"train_loss": -10.956031799316406, "global_step": 161426, "epoch": 960} {"train_loss": -10.805764198303223, "global_step": 161427, "epoch": 960} {"train_loss": -11.044452667236328, "global_step": 161428, "epoch": 960} {"train_loss": -10.566462516784668, "global_step": 161429, "epoch": 960} {"train_loss": -10.956941604614258, "global_step": 161430, "epoch": 960} {"train_loss": -10.605222702026367, "global_step": 161431, "epoch": 960} {"train_loss": -10.899770736694336, "global_step": 161432, "epoch": 960} {"train_loss": -10.534756660461426, "global_step": 161433, "epoch": 960} {"train_loss": -11.160774230957031, "global_step": 161434, "epoch": 960} {"train_loss": -10.726858139038086, "global_step": 161435, "epoch": 960} {"train_loss": -10.877119064331055, "global_step": 161436, "epoch": 960} {"train_loss": -10.847667694091797, "global_step": 161437, "epoch": 960} {"train_loss": -10.869547843933105, "global_step": 161438, "epoch": 960} {"train_loss": -10.796350479125977, "global_step": 161439, "epoch": 960} {"train_loss": -10.921182632446289, "global_step": 161440, "epoch": 960} {"train_loss": -10.651496887207031, "global_step": 161441, "epoch": 960} {"train_loss": -10.667200088500977, "global_step": 161442, "epoch": 960} {"train_loss": -11.156390190124512, "global_step": 161443, "epoch": 960} {"train_loss": -10.572675704956055, "global_step": 161444, "epoch": 960} {"train_loss": -11.126731872558594, "global_step": 161445, "epoch": 960} {"train_loss": -10.688154220581055, "global_step": 161446, "epoch": 960} {"train_loss": -10.77031683921814, "global_step": 161447, "epoch": 960, "val_loss": 236722.3125, "train_action_mse_error": 1.7471632957458496} {"train_loss": -10.868667602539062, "global_step": 161448, "epoch": 961} {"train_loss": -10.707212448120117, "global_step": 161449, "epoch": 961} {"train_loss": -10.808311462402344, "global_step": 161450, "epoch": 961} {"train_loss": -10.777860641479492, "global_step": 161451, "epoch": 961} {"train_loss": -10.894439697265625, "global_step": 161452, "epoch": 961} {"train_loss": -10.811990737915039, "global_step": 161453, "epoch": 961} {"train_loss": -10.96969223022461, "global_step": 161454, "epoch": 961} {"train_loss": -10.650991439819336, "global_step": 161455, "epoch": 961} {"train_loss": -10.892215728759766, "global_step": 161456, "epoch": 961} {"train_loss": -11.065591812133789, "global_step": 161457, "epoch": 961} {"train_loss": -11.017034530639648, "global_step": 161458, "epoch": 961} {"train_loss": -10.8802490234375, "global_step": 161459, "epoch": 961} {"train_loss": -11.269216537475586, "global_step": 161460, "epoch": 961} {"train_loss": -11.05913257598877, "global_step": 161461, "epoch": 961} {"train_loss": -11.286066055297852, "global_step": 161462, "epoch": 961} {"train_loss": -10.852896690368652, "global_step": 161463, "epoch": 961} {"train_loss": -11.113588333129883, "global_step": 161464, "epoch": 961} {"train_loss": -10.999641418457031, "global_step": 161465, "epoch": 961} {"train_loss": -11.084911346435547, "global_step": 161466, "epoch": 961} {"train_loss": -11.064051628112793, "global_step": 161467, "epoch": 961} {"train_loss": -10.782404899597168, "global_step": 161468, "epoch": 961} {"train_loss": -11.309096336364746, "global_step": 161469, "epoch": 961} {"train_loss": -10.876672744750977, "global_step": 161470, "epoch": 961} {"train_loss": -10.869463920593262, "global_step": 161471, "epoch": 961} {"train_loss": -11.046690940856934, "global_step": 161472, "epoch": 961} {"train_loss": -10.992427825927734, "global_step": 161473, "epoch": 961} {"train_loss": -10.52400016784668, "global_step": 161474, "epoch": 961} {"train_loss": -10.848912239074707, "global_step": 161475, "epoch": 961} {"train_loss": -10.122576713562012, "global_step": 161476, "epoch": 961} {"train_loss": -10.500057220458984, "global_step": 161477, "epoch": 961} {"train_loss": -11.021080017089844, "global_step": 161478, "epoch": 961} {"train_loss": -10.223804473876953, "global_step": 161479, "epoch": 961} {"train_loss": -10.956125259399414, "global_step": 161480, "epoch": 961} {"train_loss": -10.688446044921875, "global_step": 161481, "epoch": 961} {"train_loss": -10.17263126373291, "global_step": 161482, "epoch": 961} {"train_loss": -10.79199504852295, "global_step": 161483, "epoch": 961} {"train_loss": -10.573663711547852, "global_step": 161484, "epoch": 961} {"train_loss": -10.258949279785156, "global_step": 161485, "epoch": 961} {"train_loss": -10.980611801147461, "global_step": 161486, "epoch": 961} {"train_loss": -10.015188217163086, "global_step": 161487, "epoch": 961} {"train_loss": -10.81389045715332, "global_step": 161488, "epoch": 961} {"train_loss": -10.410087585449219, "global_step": 161489, "epoch": 961} {"train_loss": -10.110982894897461, "global_step": 161490, "epoch": 961} {"train_loss": -10.943157196044922, "global_step": 161491, "epoch": 961} {"train_loss": -10.07437801361084, "global_step": 161492, "epoch": 961} {"train_loss": -10.809057235717773, "global_step": 161493, "epoch": 961} {"train_loss": -10.145296096801758, "global_step": 161494, "epoch": 961} {"train_loss": -10.997214317321777, "global_step": 161495, "epoch": 961} {"train_loss": -10.289702415466309, "global_step": 161496, "epoch": 961} {"train_loss": -9.866321563720703, "global_step": 161497, "epoch": 961} {"train_loss": -10.79857063293457, "global_step": 161498, "epoch": 961} {"train_loss": -10.291966438293457, "global_step": 161499, "epoch": 961} {"train_loss": -10.355759620666504, "global_step": 161500, "epoch": 961} {"train_loss": -10.230424880981445, "global_step": 161501, "epoch": 961} {"train_loss": -10.447222709655762, "global_step": 161502, "epoch": 961} {"train_loss": -10.246343612670898, "global_step": 161503, "epoch": 961} {"train_loss": -10.49835205078125, "global_step": 161504, "epoch": 961} {"train_loss": -10.410369873046875, "global_step": 161505, "epoch": 961} {"train_loss": -10.367311477661133, "global_step": 161506, "epoch": 961} {"train_loss": -11.064912796020508, "global_step": 161507, "epoch": 961} {"train_loss": -10.466340065002441, "global_step": 161508, "epoch": 961} {"train_loss": -10.856724739074707, "global_step": 161509, "epoch": 961} {"train_loss": -10.738162994384766, "global_step": 161510, "epoch": 961} {"train_loss": -10.728569030761719, "global_step": 161511, "epoch": 961} {"train_loss": -10.752477645874023, "global_step": 161512, "epoch": 961} {"train_loss": -10.636129379272461, "global_step": 161513, "epoch": 961} {"train_loss": -10.890218734741211, "global_step": 161514, "epoch": 961} {"train_loss": -10.875418663024902, "global_step": 161515, "epoch": 961} {"train_loss": -10.765434265136719, "global_step": 161516, "epoch": 961} {"train_loss": -10.732259750366211, "global_step": 161517, "epoch": 961} {"train_loss": -11.120563507080078, "global_step": 161518, "epoch": 961} {"train_loss": -11.094184875488281, "global_step": 161519, "epoch": 961} {"train_loss": -10.888582229614258, "global_step": 161520, "epoch": 961} {"train_loss": -11.027074813842773, "global_step": 161521, "epoch": 961} {"train_loss": -11.193984985351562, "global_step": 161522, "epoch": 961} {"train_loss": -10.933324813842773, "global_step": 161523, "epoch": 961} {"train_loss": -11.014972686767578, "global_step": 161524, "epoch": 961} {"train_loss": -11.208264350891113, "global_step": 161525, "epoch": 961} {"train_loss": -10.933378219604492, "global_step": 161526, "epoch": 961} {"train_loss": -11.151455879211426, "global_step": 161527, "epoch": 961} {"train_loss": -11.122512817382812, "global_step": 161528, "epoch": 961} {"train_loss": -11.119937896728516, "global_step": 161529, "epoch": 961} {"train_loss": -11.100236892700195, "global_step": 161530, "epoch": 961} {"train_loss": -11.122102737426758, "global_step": 161531, "epoch": 961} {"train_loss": -11.200363159179688, "global_step": 161532, "epoch": 961} {"train_loss": -11.140153884887695, "global_step": 161533, "epoch": 961} {"train_loss": -11.259309768676758, "global_step": 161534, "epoch": 961} {"train_loss": -11.197938919067383, "global_step": 161535, "epoch": 961} {"train_loss": -11.098678588867188, "global_step": 161536, "epoch": 961} {"train_loss": -11.119241714477539, "global_step": 161537, "epoch": 961} {"train_loss": -11.315590858459473, "global_step": 161538, "epoch": 961} {"train_loss": -10.999520301818848, "global_step": 161539, "epoch": 961} {"train_loss": -11.1827392578125, "global_step": 161540, "epoch": 961} {"train_loss": -11.028170585632324, "global_step": 161541, "epoch": 961} {"train_loss": -10.918113708496094, "global_step": 161542, "epoch": 961} {"train_loss": -11.09492015838623, "global_step": 161543, "epoch": 961} {"train_loss": -11.195358276367188, "global_step": 161544, "epoch": 961} {"train_loss": -11.166624069213867, "global_step": 161545, "epoch": 961} {"train_loss": -10.966136932373047, "global_step": 161546, "epoch": 961} {"train_loss": -11.077754974365234, "global_step": 161547, "epoch": 961} {"train_loss": -11.102483749389648, "global_step": 161548, "epoch": 961} {"train_loss": -11.362974166870117, "global_step": 161549, "epoch": 961} {"train_loss": -11.207816123962402, "global_step": 161550, "epoch": 961} {"train_loss": -11.22341251373291, "global_step": 161551, "epoch": 961} {"train_loss": -11.211891174316406, "global_step": 161552, "epoch": 961} {"train_loss": -11.362472534179688, "global_step": 161553, "epoch": 961} {"train_loss": -11.328776359558105, "global_step": 161554, "epoch": 961} {"train_loss": -11.145965576171875, "global_step": 161555, "epoch": 961} {"train_loss": -11.187744140625, "global_step": 161556, "epoch": 961} {"train_loss": -11.348194122314453, "global_step": 161557, "epoch": 961} {"train_loss": -11.383066177368164, "global_step": 161558, "epoch": 961} {"train_loss": -11.249042510986328, "global_step": 161559, "epoch": 961} {"train_loss": -11.243108749389648, "global_step": 161560, "epoch": 961} {"train_loss": -11.212202072143555, "global_step": 161561, "epoch": 961} {"train_loss": -11.157075881958008, "global_step": 161562, "epoch": 961} {"train_loss": -11.233657836914062, "global_step": 161563, "epoch": 961} {"train_loss": -11.186258316040039, "global_step": 161564, "epoch": 961} {"train_loss": -11.033159255981445, "global_step": 161565, "epoch": 961} {"train_loss": -11.150976181030273, "global_step": 161566, "epoch": 961} {"train_loss": -11.201483726501465, "global_step": 161567, "epoch": 961} {"train_loss": -11.150074005126953, "global_step": 161568, "epoch": 961} {"train_loss": -11.158849716186523, "global_step": 161569, "epoch": 961} {"train_loss": -10.894153594970703, "global_step": 161570, "epoch": 961} {"train_loss": -11.168351173400879, "global_step": 161571, "epoch": 961} {"train_loss": -11.266471862792969, "global_step": 161572, "epoch": 961} {"train_loss": -10.838088989257812, "global_step": 161573, "epoch": 961} {"train_loss": -10.40254020690918, "global_step": 161574, "epoch": 961} {"train_loss": -11.172842025756836, "global_step": 161575, "epoch": 961} {"train_loss": -10.523992538452148, "global_step": 161576, "epoch": 961} {"train_loss": -10.530404090881348, "global_step": 161577, "epoch": 961} {"train_loss": -11.045188903808594, "global_step": 161578, "epoch": 961} {"train_loss": -10.461316108703613, "global_step": 161579, "epoch": 961} {"train_loss": -10.70025634765625, "global_step": 161580, "epoch": 961} {"train_loss": -10.701266288757324, "global_step": 161581, "epoch": 961} {"train_loss": -10.977585792541504, "global_step": 161582, "epoch": 961} {"train_loss": -10.2875394821167, "global_step": 161583, "epoch": 961} {"train_loss": -10.544307708740234, "global_step": 161584, "epoch": 961} {"train_loss": -10.919519424438477, "global_step": 161585, "epoch": 961} {"train_loss": -10.05601692199707, "global_step": 161586, "epoch": 961} {"train_loss": -10.076086044311523, "global_step": 161587, "epoch": 961} {"train_loss": -9.441082000732422, "global_step": 161588, "epoch": 961} {"train_loss": -9.903130531311035, "global_step": 161589, "epoch": 961} {"train_loss": -10.708213806152344, "global_step": 161590, "epoch": 961} {"train_loss": -9.804306983947754, "global_step": 161591, "epoch": 961} {"train_loss": -10.592056274414062, "global_step": 161592, "epoch": 961} {"train_loss": -10.000104904174805, "global_step": 161593, "epoch": 961} {"train_loss": -9.595849990844727, "global_step": 161594, "epoch": 961} {"train_loss": -10.170950889587402, "global_step": 161595, "epoch": 961} {"train_loss": -10.167518615722656, "global_step": 161596, "epoch": 961} {"train_loss": -10.152870178222656, "global_step": 161597, "epoch": 961} {"train_loss": -9.917510986328125, "global_step": 161598, "epoch": 961} {"train_loss": -10.15401840209961, "global_step": 161599, "epoch": 961} {"train_loss": -9.994422912597656, "global_step": 161600, "epoch": 961} {"train_loss": -10.254315376281738, "global_step": 161601, "epoch": 961} {"train_loss": -10.138124465942383, "global_step": 161602, "epoch": 961} {"train_loss": -10.415314674377441, "global_step": 161603, "epoch": 961} {"train_loss": -10.177611351013184, "global_step": 161604, "epoch": 961} {"train_loss": -10.438636779785156, "global_step": 161605, "epoch": 961} {"train_loss": -10.319753646850586, "global_step": 161606, "epoch": 961} {"train_loss": -10.657918930053711, "global_step": 161607, "epoch": 961} {"train_loss": -10.242317199707031, "global_step": 161608, "epoch": 961} {"train_loss": -10.501594543457031, "global_step": 161609, "epoch": 961} {"train_loss": -10.70385456085205, "global_step": 161610, "epoch": 961} {"train_loss": -10.689010620117188, "global_step": 161611, "epoch": 961} {"train_loss": -10.76543140411377, "global_step": 161612, "epoch": 961} {"train_loss": -10.430170059204102, "global_step": 161613, "epoch": 961} {"train_loss": -10.683972358703613, "global_step": 161614, "epoch": 961} {"train_loss": -10.76722796758016, "global_step": 161615, "epoch": 961, "val_loss": 236042.59375} {"train_loss": -10.560417175292969, "global_step": 161616, "epoch": 962} {"train_loss": -10.576568603515625, "global_step": 161617, "epoch": 962} {"train_loss": -10.4174222946167, "global_step": 161618, "epoch": 962} {"train_loss": -10.572916030883789, "global_step": 161619, "epoch": 962} {"train_loss": -10.711687088012695, "global_step": 161620, "epoch": 962} {"train_loss": -10.684703826904297, "global_step": 161621, "epoch": 962} {"train_loss": -10.733389854431152, "global_step": 161622, "epoch": 962} {"train_loss": -10.707523345947266, "global_step": 161623, "epoch": 962} {"train_loss": -10.761770248413086, "global_step": 161624, "epoch": 962} {"train_loss": -10.751605033874512, "global_step": 161625, "epoch": 962} {"train_loss": -10.810799598693848, "global_step": 161626, "epoch": 962} {"train_loss": -10.730550765991211, "global_step": 161627, "epoch": 962} {"train_loss": -10.564538955688477, "global_step": 161628, "epoch": 962} {"train_loss": -10.921503067016602, "global_step": 161629, "epoch": 962} {"train_loss": -10.497883796691895, "global_step": 161630, "epoch": 962} {"train_loss": -10.476893424987793, "global_step": 161631, "epoch": 962} {"train_loss": -10.859735488891602, "global_step": 161632, "epoch": 962} {"train_loss": -10.543807029724121, "global_step": 161633, "epoch": 962} {"train_loss": -10.637359619140625, "global_step": 161634, "epoch": 962} {"train_loss": -10.680383682250977, "global_step": 161635, "epoch": 962} {"train_loss": -10.727155685424805, "global_step": 161636, "epoch": 962} {"train_loss": -10.90402889251709, "global_step": 161637, "epoch": 962} {"train_loss": -10.763487815856934, "global_step": 161638, "epoch": 962} {"train_loss": -10.857067108154297, "global_step": 161639, "epoch": 962} {"train_loss": -10.72880744934082, "global_step": 161640, "epoch": 962} {"train_loss": -10.960775375366211, "global_step": 161641, "epoch": 962} {"train_loss": -10.957565307617188, "global_step": 161642, "epoch": 962} {"train_loss": -10.934944152832031, "global_step": 161643, "epoch": 962} {"train_loss": -10.75344467163086, "global_step": 161644, "epoch": 962} {"train_loss": -10.940046310424805, "global_step": 161645, "epoch": 962} {"train_loss": -10.559032440185547, "global_step": 161646, "epoch": 962} {"train_loss": -10.86131477355957, "global_step": 161647, "epoch": 962} {"train_loss": -10.606900215148926, "global_step": 161648, "epoch": 962} {"train_loss": -10.887033462524414, "global_step": 161649, "epoch": 962} {"train_loss": -10.577962875366211, "global_step": 161650, "epoch": 962} {"train_loss": -10.85983657836914, "global_step": 161651, "epoch": 962} {"train_loss": -10.581090927124023, "global_step": 161652, "epoch": 962} {"train_loss": -11.045827865600586, "global_step": 161653, "epoch": 962} {"train_loss": -10.508129119873047, "global_step": 161654, "epoch": 962} {"train_loss": -11.131121635437012, "global_step": 161655, "epoch": 962} {"train_loss": -10.64921760559082, "global_step": 161656, "epoch": 962} {"train_loss": -11.102642059326172, "global_step": 161657, "epoch": 962} {"train_loss": -10.612544059753418, "global_step": 161658, "epoch": 962} {"train_loss": -11.099102020263672, "global_step": 161659, "epoch": 962} {"train_loss": -10.831525802612305, "global_step": 161660, "epoch": 962} {"train_loss": -11.035271644592285, "global_step": 161661, "epoch": 962} {"train_loss": -11.000762939453125, "global_step": 161662, "epoch": 962} {"train_loss": -10.609831809997559, "global_step": 161663, "epoch": 962} {"train_loss": -11.062437057495117, "global_step": 161664, "epoch": 962} {"train_loss": -10.824691772460938, "global_step": 161665, "epoch": 962} {"train_loss": -10.908098220825195, "global_step": 161666, "epoch": 962} {"train_loss": -10.811544418334961, "global_step": 161667, "epoch": 962} {"train_loss": -10.798498153686523, "global_step": 161668, "epoch": 962} {"train_loss": -11.110345840454102, "global_step": 161669, "epoch": 962} {"train_loss": -10.905938148498535, "global_step": 161670, "epoch": 962} {"train_loss": -10.968876838684082, "global_step": 161671, "epoch": 962} {"train_loss": -10.753506660461426, "global_step": 161672, "epoch": 962} {"train_loss": -11.041326522827148, "global_step": 161673, "epoch": 962} {"train_loss": -10.846409797668457, "global_step": 161674, "epoch": 962} {"train_loss": -11.091777801513672, "global_step": 161675, "epoch": 962} {"train_loss": -11.074933052062988, "global_step": 161676, "epoch": 962} {"train_loss": -10.943496704101562, "global_step": 161677, "epoch": 962} {"train_loss": -11.264452934265137, "global_step": 161678, "epoch": 962} {"train_loss": -11.247549057006836, "global_step": 161679, "epoch": 962} {"train_loss": -11.216521263122559, "global_step": 161680, "epoch": 962} {"train_loss": -11.098770141601562, "global_step": 161681, "epoch": 962} {"train_loss": -11.068826675415039, "global_step": 161682, "epoch": 962} {"train_loss": -11.048860549926758, "global_step": 161683, "epoch": 962} {"train_loss": -11.181187629699707, "global_step": 161684, "epoch": 962} {"train_loss": -11.211527824401855, "global_step": 161685, "epoch": 962} {"train_loss": -10.965229034423828, "global_step": 161686, "epoch": 962} {"train_loss": -11.070670127868652, "global_step": 161687, "epoch": 962} {"train_loss": -10.841150283813477, "global_step": 161688, "epoch": 962} {"train_loss": -11.264999389648438, "global_step": 161689, "epoch": 962} {"train_loss": -11.287667274475098, "global_step": 161690, "epoch": 962} {"train_loss": -11.068267822265625, "global_step": 161691, "epoch": 962} {"train_loss": -11.279220581054688, "global_step": 161692, "epoch": 962} {"train_loss": -10.876019477844238, "global_step": 161693, "epoch": 962} {"train_loss": -11.086738586425781, "global_step": 161694, "epoch": 962} {"train_loss": -11.145058631896973, "global_step": 161695, "epoch": 962} {"train_loss": -11.230484008789062, "global_step": 161696, "epoch": 962} {"train_loss": -10.978546142578125, "global_step": 161697, "epoch": 962} {"train_loss": -11.09959602355957, "global_step": 161698, "epoch": 962} {"train_loss": -11.119467735290527, "global_step": 161699, "epoch": 962} {"train_loss": -11.262258529663086, "global_step": 161700, "epoch": 962} {"train_loss": -10.786312103271484, "global_step": 161701, "epoch": 962} {"train_loss": -10.849748611450195, "global_step": 161702, "epoch": 962} {"train_loss": -10.764888763427734, "global_step": 161703, "epoch": 962} {"train_loss": -10.395386695861816, "global_step": 161704, "epoch": 962} {"train_loss": -10.555264472961426, "global_step": 161705, "epoch": 962} {"train_loss": -10.87416934967041, "global_step": 161706, "epoch": 962} {"train_loss": -10.547121047973633, "global_step": 161707, "epoch": 962} {"train_loss": -10.660262107849121, "global_step": 161708, "epoch": 962} {"train_loss": -10.577629089355469, "global_step": 161709, "epoch": 962} {"train_loss": -10.32175064086914, "global_step": 161710, "epoch": 962} {"train_loss": -10.918976783752441, "global_step": 161711, "epoch": 962} {"train_loss": -10.332108497619629, "global_step": 161712, "epoch": 962} {"train_loss": -10.379928588867188, "global_step": 161713, "epoch": 962} {"train_loss": -11.125945091247559, "global_step": 161714, "epoch": 962} {"train_loss": -9.918144226074219, "global_step": 161715, "epoch": 962} {"train_loss": -11.000030517578125, "global_step": 161716, "epoch": 962} {"train_loss": -10.376461029052734, "global_step": 161717, "epoch": 962} {"train_loss": -10.735980987548828, "global_step": 161718, "epoch": 962} {"train_loss": -10.75684642791748, "global_step": 161719, "epoch": 962} {"train_loss": -10.479767799377441, "global_step": 161720, "epoch": 962} {"train_loss": -10.687806129455566, "global_step": 161721, "epoch": 962} {"train_loss": -10.585567474365234, "global_step": 161722, "epoch": 962} {"train_loss": -10.475777626037598, "global_step": 161723, "epoch": 962} {"train_loss": -10.434152603149414, "global_step": 161724, "epoch": 962} {"train_loss": -10.513713836669922, "global_step": 161725, "epoch": 962} {"train_loss": -10.67613410949707, "global_step": 161726, "epoch": 962} {"train_loss": -10.451278686523438, "global_step": 161727, "epoch": 962} {"train_loss": -10.448585510253906, "global_step": 161728, "epoch": 962} {"train_loss": -10.367500305175781, "global_step": 161729, "epoch": 962} {"train_loss": -10.743968963623047, "global_step": 161730, "epoch": 962} {"train_loss": -10.729934692382812, "global_step": 161731, "epoch": 962} {"train_loss": -10.562716484069824, "global_step": 161732, "epoch": 962} {"train_loss": -10.515329360961914, "global_step": 161733, "epoch": 962} {"train_loss": -10.357829093933105, "global_step": 161734, "epoch": 962} {"train_loss": -10.282783508300781, "global_step": 161735, "epoch": 962} {"train_loss": -10.732535362243652, "global_step": 161736, "epoch": 962} {"train_loss": -10.212913513183594, "global_step": 161737, "epoch": 962} {"train_loss": -10.388202667236328, "global_step": 161738, "epoch": 962} {"train_loss": -9.584554672241211, "global_step": 161739, "epoch": 962} {"train_loss": -10.180315017700195, "global_step": 161740, "epoch": 962} {"train_loss": -10.033648490905762, "global_step": 161741, "epoch": 962} {"train_loss": -10.242161750793457, "global_step": 161742, "epoch": 962} {"train_loss": -10.480899810791016, "global_step": 161743, "epoch": 962} {"train_loss": -10.182748794555664, "global_step": 161744, "epoch": 962} {"train_loss": -10.773443222045898, "global_step": 161745, "epoch": 962} {"train_loss": -10.40936279296875, "global_step": 161746, "epoch": 962} {"train_loss": -10.60047721862793, "global_step": 161747, "epoch": 962} {"train_loss": -10.526708602905273, "global_step": 161748, "epoch": 962} {"train_loss": -10.672822952270508, "global_step": 161749, "epoch": 962} {"train_loss": -10.397443771362305, "global_step": 161750, "epoch": 962} {"train_loss": -10.629959106445312, "global_step": 161751, "epoch": 962} {"train_loss": -10.479388236999512, "global_step": 161752, "epoch": 962} {"train_loss": -10.758905410766602, "global_step": 161753, "epoch": 962} {"train_loss": -10.675433158874512, "global_step": 161754, "epoch": 962} {"train_loss": -10.618911743164062, "global_step": 161755, "epoch": 962} {"train_loss": -10.841010093688965, "global_step": 161756, "epoch": 962} {"train_loss": -10.458342552185059, "global_step": 161757, "epoch": 962} {"train_loss": -10.928914070129395, "global_step": 161758, "epoch": 962} {"train_loss": -10.679433822631836, "global_step": 161759, "epoch": 962} {"train_loss": -10.818975448608398, "global_step": 161760, "epoch": 962} {"train_loss": -10.59893798828125, "global_step": 161761, "epoch": 962} {"train_loss": -11.0626220703125, "global_step": 161762, "epoch": 962} {"train_loss": -10.787256240844727, "global_step": 161763, "epoch": 962} {"train_loss": -10.825613021850586, "global_step": 161764, "epoch": 962} {"train_loss": -10.880659103393555, "global_step": 161765, "epoch": 962} {"train_loss": -10.971715927124023, "global_step": 161766, "epoch": 962} {"train_loss": -10.857353210449219, "global_step": 161767, "epoch": 962} {"train_loss": -10.958373069763184, "global_step": 161768, "epoch": 962} {"train_loss": -10.821226119995117, "global_step": 161769, "epoch": 962} {"train_loss": -11.026629447937012, "global_step": 161770, "epoch": 962} {"train_loss": -10.890655517578125, "global_step": 161771, "epoch": 962} {"train_loss": -11.007803916931152, "global_step": 161772, "epoch": 962} {"train_loss": -11.078912734985352, "global_step": 161773, "epoch": 962} {"train_loss": -10.58939266204834, "global_step": 161774, "epoch": 962} {"train_loss": -11.127920150756836, "global_step": 161775, "epoch": 962} {"train_loss": -11.016626358032227, "global_step": 161776, "epoch": 962} {"train_loss": -11.130651473999023, "global_step": 161777, "epoch": 962} {"train_loss": -11.168313980102539, "global_step": 161778, "epoch": 962} {"train_loss": -11.01071548461914, "global_step": 161779, "epoch": 962} {"train_loss": -11.206998825073242, "global_step": 161780, "epoch": 962} {"train_loss": -11.012667655944824, "global_step": 161781, "epoch": 962} {"train_loss": -11.288263320922852, "global_step": 161782, "epoch": 962} {"train_loss": -10.775795879818144, "global_step": 161783, "epoch": 962, "val_loss": 235205.359375} {"train_loss": -11.17061710357666, "global_step": 161784, "epoch": 963} {"train_loss": -11.079195976257324, "global_step": 161785, "epoch": 963} {"train_loss": -11.25312614440918, "global_step": 161786, "epoch": 963} {"train_loss": -11.077299118041992, "global_step": 161787, "epoch": 963} {"train_loss": -11.206466674804688, "global_step": 161788, "epoch": 963} {"train_loss": -10.929332733154297, "global_step": 161789, "epoch": 963} {"train_loss": -11.157166481018066, "global_step": 161790, "epoch": 963} {"train_loss": -10.88463020324707, "global_step": 161791, "epoch": 963} {"train_loss": -11.07331657409668, "global_step": 161792, "epoch": 963} {"train_loss": -11.288558959960938, "global_step": 161793, "epoch": 963} {"train_loss": -10.900049209594727, "global_step": 161794, "epoch": 963} {"train_loss": -11.340998649597168, "global_step": 161795, "epoch": 963} {"train_loss": -10.359938621520996, "global_step": 161796, "epoch": 963} {"train_loss": -11.143020629882812, "global_step": 161797, "epoch": 963} {"train_loss": -10.605091094970703, "global_step": 161798, "epoch": 963} {"train_loss": -10.804031372070312, "global_step": 161799, "epoch": 963} {"train_loss": -11.168288230895996, "global_step": 161800, "epoch": 963} {"train_loss": -10.692394256591797, "global_step": 161801, "epoch": 963} {"train_loss": -10.945113182067871, "global_step": 161802, "epoch": 963} {"train_loss": -10.882041931152344, "global_step": 161803, "epoch": 963} {"train_loss": -10.474494934082031, "global_step": 161804, "epoch": 963} {"train_loss": -10.658222198486328, "global_step": 161805, "epoch": 963} {"train_loss": -10.551336288452148, "global_step": 161806, "epoch": 963} {"train_loss": -10.51941967010498, "global_step": 161807, "epoch": 963} {"train_loss": -10.798641204833984, "global_step": 161808, "epoch": 963} {"train_loss": -10.39921760559082, "global_step": 161809, "epoch": 963} {"train_loss": -10.695818901062012, "global_step": 161810, "epoch": 963} {"train_loss": -10.13616943359375, "global_step": 161811, "epoch": 963} {"train_loss": -9.346426010131836, "global_step": 161812, "epoch": 963} {"train_loss": -10.107343673706055, "global_step": 161813, "epoch": 963} {"train_loss": -9.575275421142578, "global_step": 161814, "epoch": 963} {"train_loss": -9.29463005065918, "global_step": 161815, "epoch": 963} {"train_loss": -9.798760414123535, "global_step": 161816, "epoch": 963} {"train_loss": -10.079683303833008, "global_step": 161817, "epoch": 963} {"train_loss": -8.342945098876953, "global_step": 161818, "epoch": 963} {"train_loss": -10.170469284057617, "global_step": 161819, "epoch": 963} {"train_loss": -10.160505294799805, "global_step": 161820, "epoch": 963} {"train_loss": -9.921953201293945, "global_step": 161821, "epoch": 963} {"train_loss": -10.124234199523926, "global_step": 161822, "epoch": 963} {"train_loss": -10.08991813659668, "global_step": 161823, "epoch": 963} {"train_loss": -10.332208633422852, "global_step": 161824, "epoch": 963} {"train_loss": -9.96357536315918, "global_step": 161825, "epoch": 963} {"train_loss": -10.48997688293457, "global_step": 161826, "epoch": 963} {"train_loss": -10.332541465759277, "global_step": 161827, "epoch": 963} {"train_loss": -10.666988372802734, "global_step": 161828, "epoch": 963} {"train_loss": -10.223197937011719, "global_step": 161829, "epoch": 963} {"train_loss": -10.302602767944336, "global_step": 161830, "epoch": 963} {"train_loss": -10.445093154907227, "global_step": 161831, "epoch": 963} {"train_loss": -10.529229164123535, "global_step": 161832, "epoch": 963} {"train_loss": -10.398655891418457, "global_step": 161833, "epoch": 963} {"train_loss": -10.52597427368164, "global_step": 161834, "epoch": 963} {"train_loss": -10.544807434082031, "global_step": 161835, "epoch": 963} {"train_loss": -10.429865837097168, "global_step": 161836, "epoch": 963} {"train_loss": -10.627290725708008, "global_step": 161837, "epoch": 963} {"train_loss": -10.510541915893555, "global_step": 161838, "epoch": 963} {"train_loss": -10.75179672241211, "global_step": 161839, "epoch": 963} {"train_loss": -10.516769409179688, "global_step": 161840, "epoch": 963} {"train_loss": -10.848091125488281, "global_step": 161841, "epoch": 963} {"train_loss": -10.77979850769043, "global_step": 161842, "epoch": 963} {"train_loss": -10.815969467163086, "global_step": 161843, "epoch": 963} {"train_loss": -10.814706802368164, "global_step": 161844, "epoch": 963} {"train_loss": -10.609870910644531, "global_step": 161845, "epoch": 963} {"train_loss": -10.857255935668945, "global_step": 161846, "epoch": 963} {"train_loss": -10.849369049072266, "global_step": 161847, "epoch": 963} {"train_loss": -10.621771812438965, "global_step": 161848, "epoch": 963} {"train_loss": -10.950851440429688, "global_step": 161849, "epoch": 963} {"train_loss": -10.726034164428711, "global_step": 161850, "epoch": 963} {"train_loss": -11.04720401763916, "global_step": 161851, "epoch": 963} {"train_loss": -10.814827919006348, "global_step": 161852, "epoch": 963} {"train_loss": -10.849420547485352, "global_step": 161853, "epoch": 963} {"train_loss": -10.845244407653809, "global_step": 161854, "epoch": 963} {"train_loss": -10.908855438232422, "global_step": 161855, "epoch": 963} {"train_loss": -11.103067398071289, "global_step": 161856, "epoch": 963} {"train_loss": -10.950898170471191, "global_step": 161857, "epoch": 963} {"train_loss": -10.983996391296387, "global_step": 161858, "epoch": 963} {"train_loss": -10.764317512512207, "global_step": 161859, "epoch": 963} {"train_loss": -10.670315742492676, "global_step": 161860, "epoch": 963} {"train_loss": -11.257865905761719, "global_step": 161861, "epoch": 963} {"train_loss": -11.03322982788086, "global_step": 161862, "epoch": 963} {"train_loss": -10.987394332885742, "global_step": 161863, "epoch": 963} {"train_loss": -11.000617980957031, "global_step": 161864, "epoch": 963} {"train_loss": -11.127670288085938, "global_step": 161865, "epoch": 963} {"train_loss": -10.899282455444336, "global_step": 161866, "epoch": 963} {"train_loss": -11.104982376098633, "global_step": 161867, "epoch": 963} {"train_loss": -11.074161529541016, "global_step": 161868, "epoch": 963} {"train_loss": -11.084504127502441, "global_step": 161869, "epoch": 963} {"train_loss": -11.021474838256836, "global_step": 161870, "epoch": 963} {"train_loss": -11.056529998779297, "global_step": 161871, "epoch": 963} {"train_loss": -10.949954986572266, "global_step": 161872, "epoch": 963} {"train_loss": -11.215622901916504, "global_step": 161873, "epoch": 963} {"train_loss": -11.095306396484375, "global_step": 161874, "epoch": 963} {"train_loss": -11.27777099609375, "global_step": 161875, "epoch": 963} {"train_loss": -11.194469451904297, "global_step": 161876, "epoch": 963} {"train_loss": -11.062435150146484, "global_step": 161877, "epoch": 963} {"train_loss": -11.014841079711914, "global_step": 161878, "epoch": 963} {"train_loss": -11.181910514831543, "global_step": 161879, "epoch": 963} {"train_loss": -11.261472702026367, "global_step": 161880, "epoch": 963} {"train_loss": -11.234110832214355, "global_step": 161881, "epoch": 963} {"train_loss": -11.219504356384277, "global_step": 161882, "epoch": 963} {"train_loss": -11.4450044631958, "global_step": 161883, "epoch": 963} {"train_loss": -11.427633285522461, "global_step": 161884, "epoch": 963} {"train_loss": -11.019797325134277, "global_step": 161885, "epoch": 963} {"train_loss": -11.019051551818848, "global_step": 161886, "epoch": 963} {"train_loss": -10.979279518127441, "global_step": 161887, "epoch": 963} {"train_loss": -11.121752738952637, "global_step": 161888, "epoch": 963} {"train_loss": -10.673023223876953, "global_step": 161889, "epoch": 963} {"train_loss": -10.730554580688477, "global_step": 161890, "epoch": 963} {"train_loss": -10.705909729003906, "global_step": 161891, "epoch": 963} {"train_loss": -11.2430419921875, "global_step": 161892, "epoch": 963} {"train_loss": -10.667335510253906, "global_step": 161893, "epoch": 963} {"train_loss": -10.448497772216797, "global_step": 161894, "epoch": 963} {"train_loss": -10.947755813598633, "global_step": 161895, "epoch": 963} {"train_loss": -11.103811264038086, "global_step": 161896, "epoch": 963} {"train_loss": -10.260828971862793, "global_step": 161897, "epoch": 963} {"train_loss": -10.821104049682617, "global_step": 161898, "epoch": 963} {"train_loss": -11.304803848266602, "global_step": 161899, "epoch": 963} {"train_loss": -10.810609817504883, "global_step": 161900, "epoch": 963} {"train_loss": -10.763701438903809, "global_step": 161901, "epoch": 963} {"train_loss": -11.035179138183594, "global_step": 161902, "epoch": 963} {"train_loss": -10.816518783569336, "global_step": 161903, "epoch": 963} {"train_loss": -10.979764938354492, "global_step": 161904, "epoch": 963} {"train_loss": -10.850565910339355, "global_step": 161905, "epoch": 963} {"train_loss": -10.928228378295898, "global_step": 161906, "epoch": 963} {"train_loss": -10.669919967651367, "global_step": 161907, "epoch": 963} {"train_loss": -10.566378593444824, "global_step": 161908, "epoch": 963} {"train_loss": -10.799459457397461, "global_step": 161909, "epoch": 963} {"train_loss": -10.858489990234375, "global_step": 161910, "epoch": 963} {"train_loss": -10.874065399169922, "global_step": 161911, "epoch": 963} {"train_loss": -10.726950645446777, "global_step": 161912, "epoch": 963} {"train_loss": -10.721450805664062, "global_step": 161913, "epoch": 963} {"train_loss": -10.655288696289062, "global_step": 161914, "epoch": 963} {"train_loss": -10.457037925720215, "global_step": 161915, "epoch": 963} {"train_loss": -10.337146759033203, "global_step": 161916, "epoch": 963} {"train_loss": -10.511507987976074, "global_step": 161917, "epoch": 963} {"train_loss": -10.005533218383789, "global_step": 161918, "epoch": 963} {"train_loss": -10.380334854125977, "global_step": 161919, "epoch": 963} {"train_loss": -10.305431365966797, "global_step": 161920, "epoch": 963} {"train_loss": -10.668618202209473, "global_step": 161921, "epoch": 963} {"train_loss": -9.99203872680664, "global_step": 161922, "epoch": 963} {"train_loss": -10.785015106201172, "global_step": 161923, "epoch": 963} {"train_loss": -10.053467750549316, "global_step": 161924, "epoch": 963} {"train_loss": -10.280139923095703, "global_step": 161925, "epoch": 963} {"train_loss": -10.399951934814453, "global_step": 161926, "epoch": 963} {"train_loss": -10.581295013427734, "global_step": 161927, "epoch": 963} {"train_loss": -10.534006118774414, "global_step": 161928, "epoch": 963} {"train_loss": -10.441326141357422, "global_step": 161929, "epoch": 963} {"train_loss": -10.485669136047363, "global_step": 161930, "epoch": 963} {"train_loss": -10.401641845703125, "global_step": 161931, "epoch": 963} {"train_loss": -9.997788429260254, "global_step": 161932, "epoch": 963} {"train_loss": -10.186042785644531, "global_step": 161933, "epoch": 963} {"train_loss": -10.446454048156738, "global_step": 161934, "epoch": 963} {"train_loss": -9.667746543884277, "global_step": 161935, "epoch": 963} {"train_loss": -10.556008338928223, "global_step": 161936, "epoch": 963} {"train_loss": -10.257177352905273, "global_step": 161937, "epoch": 963} {"train_loss": -9.893238067626953, "global_step": 161938, "epoch": 963} {"train_loss": -10.297172546386719, "global_step": 161939, "epoch": 963} {"train_loss": -10.198554039001465, "global_step": 161940, "epoch": 963} {"train_loss": -10.379931449890137, "global_step": 161941, "epoch": 963} {"train_loss": -10.339733123779297, "global_step": 161942, "epoch": 963} {"train_loss": -10.53011703491211, "global_step": 161943, "epoch": 963} {"train_loss": -10.02520751953125, "global_step": 161944, "epoch": 963} {"train_loss": -11.052055358886719, "global_step": 161945, "epoch": 963} {"train_loss": -10.48063850402832, "global_step": 161946, "epoch": 963} {"train_loss": -10.52301025390625, "global_step": 161947, "epoch": 963} {"train_loss": -10.45465087890625, "global_step": 161948, "epoch": 963} {"train_loss": -10.805397033691406, "global_step": 161949, "epoch": 963} {"train_loss": -10.563618659973145, "global_step": 161950, "epoch": 963} {"train_loss": -10.665526287896293, "global_step": 161951, "epoch": 963, "val_loss": 235478.328125} {"train_loss": -10.509905815124512, "global_step": 161952, "epoch": 964} {"train_loss": -10.719717025756836, "global_step": 161953, "epoch": 964} {"train_loss": -10.767318725585938, "global_step": 161954, "epoch": 964} {"train_loss": -10.807035446166992, "global_step": 161955, "epoch": 964} {"train_loss": -10.827343940734863, "global_step": 161956, "epoch": 964} {"train_loss": -10.858028411865234, "global_step": 161957, "epoch": 964} {"train_loss": -10.796707153320312, "global_step": 161958, "epoch": 964} {"train_loss": -10.906501770019531, "global_step": 161959, "epoch": 964} {"train_loss": -10.731295585632324, "global_step": 161960, "epoch": 964} {"train_loss": -11.069889068603516, "global_step": 161961, "epoch": 964} {"train_loss": -10.829244613647461, "global_step": 161962, "epoch": 964} {"train_loss": -10.988740921020508, "global_step": 161963, "epoch": 964} {"train_loss": -10.997897148132324, "global_step": 161964, "epoch": 964} {"train_loss": -10.710375785827637, "global_step": 161965, "epoch": 964} {"train_loss": -11.023233413696289, "global_step": 161966, "epoch": 964} {"train_loss": -10.870031356811523, "global_step": 161967, "epoch": 964} {"train_loss": -10.863316535949707, "global_step": 161968, "epoch": 964} {"train_loss": -10.9423828125, "global_step": 161969, "epoch": 964} {"train_loss": -10.842962265014648, "global_step": 161970, "epoch": 964} {"train_loss": -11.037120819091797, "global_step": 161971, "epoch": 964} {"train_loss": -11.017358779907227, "global_step": 161972, "epoch": 964} {"train_loss": -11.263132095336914, "global_step": 161973, "epoch": 964} {"train_loss": -10.96962833404541, "global_step": 161974, "epoch": 964} {"train_loss": -11.121501922607422, "global_step": 161975, "epoch": 964} {"train_loss": -11.093631744384766, "global_step": 161976, "epoch": 964} {"train_loss": -11.261006355285645, "global_step": 161977, "epoch": 964} {"train_loss": -11.173173904418945, "global_step": 161978, "epoch": 964} {"train_loss": -11.069662094116211, "global_step": 161979, "epoch": 964} {"train_loss": -11.125648498535156, "global_step": 161980, "epoch": 964} {"train_loss": -11.166204452514648, "global_step": 161981, "epoch": 964} {"train_loss": -11.132147789001465, "global_step": 161982, "epoch": 964} {"train_loss": -11.279622077941895, "global_step": 161983, "epoch": 964} {"train_loss": -11.327302932739258, "global_step": 161984, "epoch": 964} {"train_loss": -11.131293296813965, "global_step": 161985, "epoch": 964} {"train_loss": -11.31208610534668, "global_step": 161986, "epoch": 964} {"train_loss": -11.07383918762207, "global_step": 161987, "epoch": 964} {"train_loss": -11.192743301391602, "global_step": 161988, "epoch": 964} {"train_loss": -11.236688613891602, "global_step": 161989, "epoch": 964} {"train_loss": -11.203527450561523, "global_step": 161990, "epoch": 964} {"train_loss": -11.164466857910156, "global_step": 161991, "epoch": 964} {"train_loss": -11.24995231628418, "global_step": 161992, "epoch": 964} {"train_loss": -11.158670425415039, "global_step": 161993, "epoch": 964} {"train_loss": -11.24660587310791, "global_step": 161994, "epoch": 964} {"train_loss": -10.98824405670166, "global_step": 161995, "epoch": 964} {"train_loss": -10.573820114135742, "global_step": 161996, "epoch": 964} {"train_loss": -10.184785842895508, "global_step": 161997, "epoch": 964} {"train_loss": -10.783123970031738, "global_step": 161998, "epoch": 964} {"train_loss": -10.628981590270996, "global_step": 161999, "epoch": 964} {"train_loss": -9.696176528930664, "global_step": 162000, "epoch": 964} {"train_loss": -10.75436782836914, "global_step": 162001, "epoch": 964} {"train_loss": -10.509424209594727, "global_step": 162002, "epoch": 964} {"train_loss": -9.969866752624512, "global_step": 162003, "epoch": 964} {"train_loss": -10.666647911071777, "global_step": 162004, "epoch": 964} {"train_loss": -10.945247650146484, "global_step": 162005, "epoch": 964} {"train_loss": -10.816189765930176, "global_step": 162006, "epoch": 964} {"train_loss": -10.607048034667969, "global_step": 162007, "epoch": 964} {"train_loss": -10.11226749420166, "global_step": 162008, "epoch": 964} {"train_loss": -10.202086448669434, "global_step": 162009, "epoch": 964} {"train_loss": -10.779443740844727, "global_step": 162010, "epoch": 964} {"train_loss": -9.126737594604492, "global_step": 162011, "epoch": 964} {"train_loss": -10.591104507446289, "global_step": 162012, "epoch": 964} {"train_loss": -10.059053421020508, "global_step": 162013, "epoch": 964} {"train_loss": -11.011585235595703, "global_step": 162014, "epoch": 964} {"train_loss": -10.655059814453125, "global_step": 162015, "epoch": 964} {"train_loss": -10.458513259887695, "global_step": 162016, "epoch": 964} {"train_loss": -10.368524551391602, "global_step": 162017, "epoch": 964} {"train_loss": -10.555898666381836, "global_step": 162018, "epoch": 964} {"train_loss": -10.728060722351074, "global_step": 162019, "epoch": 964} {"train_loss": -11.115377426147461, "global_step": 162020, "epoch": 964} {"train_loss": -10.74543571472168, "global_step": 162021, "epoch": 964} {"train_loss": -10.885749816894531, "global_step": 162022, "epoch": 964} {"train_loss": -10.739500999450684, "global_step": 162023, "epoch": 964} {"train_loss": -10.768716812133789, "global_step": 162024, "epoch": 964} {"train_loss": -10.753640174865723, "global_step": 162025, "epoch": 964} {"train_loss": -10.747407913208008, "global_step": 162026, "epoch": 964} {"train_loss": -10.854069709777832, "global_step": 162027, "epoch": 964} {"train_loss": -10.959797859191895, "global_step": 162028, "epoch": 964} {"train_loss": -10.867268562316895, "global_step": 162029, "epoch": 964} {"train_loss": -10.852807998657227, "global_step": 162030, "epoch": 964} {"train_loss": -11.017024993896484, "global_step": 162031, "epoch": 964} {"train_loss": -11.09824275970459, "global_step": 162032, "epoch": 964} {"train_loss": -10.925637245178223, "global_step": 162033, "epoch": 964} {"train_loss": -11.233034133911133, "global_step": 162034, "epoch": 964} {"train_loss": -11.002395629882812, "global_step": 162035, "epoch": 964} {"train_loss": -10.9409818649292, "global_step": 162036, "epoch": 964} {"train_loss": -10.944849014282227, "global_step": 162037, "epoch": 964} {"train_loss": -10.97293472290039, "global_step": 162038, "epoch": 964} {"train_loss": -11.139060974121094, "global_step": 162039, "epoch": 964} {"train_loss": -10.922516822814941, "global_step": 162040, "epoch": 964} {"train_loss": -11.343757629394531, "global_step": 162041, "epoch": 964} {"train_loss": -11.018144607543945, "global_step": 162042, "epoch": 964} {"train_loss": -11.238129615783691, "global_step": 162043, "epoch": 964} {"train_loss": -11.352598190307617, "global_step": 162044, "epoch": 964} {"train_loss": -11.058300018310547, "global_step": 162045, "epoch": 964} {"train_loss": -10.966127395629883, "global_step": 162046, "epoch": 964} {"train_loss": -11.206160545349121, "global_step": 162047, "epoch": 964} {"train_loss": -10.978525161743164, "global_step": 162048, "epoch": 964} {"train_loss": -11.348600387573242, "global_step": 162049, "epoch": 964} {"train_loss": -11.098262786865234, "global_step": 162050, "epoch": 964} {"train_loss": -11.078851699829102, "global_step": 162051, "epoch": 964} {"train_loss": -11.05827522277832, "global_step": 162052, "epoch": 964} {"train_loss": -11.2603759765625, "global_step": 162053, "epoch": 964} {"train_loss": -11.289472579956055, "global_step": 162054, "epoch": 964} {"train_loss": -10.92059326171875, "global_step": 162055, "epoch": 964} {"train_loss": -11.029290199279785, "global_step": 162056, "epoch": 964} {"train_loss": -11.15881633758545, "global_step": 162057, "epoch": 964} {"train_loss": -11.045228004455566, "global_step": 162058, "epoch": 964} {"train_loss": -10.698188781738281, "global_step": 162059, "epoch": 964} {"train_loss": -11.161941528320312, "global_step": 162060, "epoch": 964} {"train_loss": -11.184175491333008, "global_step": 162061, "epoch": 964} {"train_loss": -11.278606414794922, "global_step": 162062, "epoch": 964} {"train_loss": -11.28411865234375, "global_step": 162063, "epoch": 964} {"train_loss": -11.403905868530273, "global_step": 162064, "epoch": 964} {"train_loss": -11.344907760620117, "global_step": 162065, "epoch": 964} {"train_loss": -11.048680305480957, "global_step": 162066, "epoch": 964} {"train_loss": -11.265434265136719, "global_step": 162067, "epoch": 964} {"train_loss": -11.241907119750977, "global_step": 162068, "epoch": 964} {"train_loss": -11.231911659240723, "global_step": 162069, "epoch": 964} {"train_loss": -11.126419067382812, "global_step": 162070, "epoch": 964} {"train_loss": -11.101968765258789, "global_step": 162071, "epoch": 964} {"train_loss": -11.477693557739258, "global_step": 162072, "epoch": 964} {"train_loss": -11.242443084716797, "global_step": 162073, "epoch": 964} {"train_loss": -10.70727825164795, "global_step": 162074, "epoch": 964} {"train_loss": -10.80872631072998, "global_step": 162075, "epoch": 964} {"train_loss": -10.659982681274414, "global_step": 162076, "epoch": 964} {"train_loss": -11.131366729736328, "global_step": 162077, "epoch": 964} {"train_loss": -10.4967679977417, "global_step": 162078, "epoch": 964} {"train_loss": -10.321219444274902, "global_step": 162079, "epoch": 964} {"train_loss": -10.660244941711426, "global_step": 162080, "epoch": 964} {"train_loss": -10.720621109008789, "global_step": 162081, "epoch": 964} {"train_loss": -10.408000946044922, "global_step": 162082, "epoch": 964} {"train_loss": -10.900742530822754, "global_step": 162083, "epoch": 964} {"train_loss": -10.754770278930664, "global_step": 162084, "epoch": 964} {"train_loss": -10.754864692687988, "global_step": 162085, "epoch": 964} {"train_loss": -10.748770713806152, "global_step": 162086, "epoch": 964} {"train_loss": -10.286757469177246, "global_step": 162087, "epoch": 964} {"train_loss": -10.691659927368164, "global_step": 162088, "epoch": 964} {"train_loss": -10.760462760925293, "global_step": 162089, "epoch": 964} {"train_loss": -10.867380142211914, "global_step": 162090, "epoch": 964} {"train_loss": -10.883975982666016, "global_step": 162091, "epoch": 964} {"train_loss": -10.638994216918945, "global_step": 162092, "epoch": 964} {"train_loss": -10.983053207397461, "global_step": 162093, "epoch": 964} {"train_loss": -10.697895050048828, "global_step": 162094, "epoch": 964} {"train_loss": -11.048452377319336, "global_step": 162095, "epoch": 964} {"train_loss": -11.058154106140137, "global_step": 162096, "epoch": 964} {"train_loss": -10.555639266967773, "global_step": 162097, "epoch": 964} {"train_loss": -10.810392379760742, "global_step": 162098, "epoch": 964} {"train_loss": -10.985122680664062, "global_step": 162099, "epoch": 964} {"train_loss": -10.973617553710938, "global_step": 162100, "epoch": 964} {"train_loss": -10.96438217163086, "global_step": 162101, "epoch": 964} {"train_loss": -10.801344871520996, "global_step": 162102, "epoch": 964} {"train_loss": -10.686441421508789, "global_step": 162103, "epoch": 964} {"train_loss": -10.731565475463867, "global_step": 162104, "epoch": 964} {"train_loss": -10.773672103881836, "global_step": 162105, "epoch": 964} {"train_loss": -10.432466506958008, "global_step": 162106, "epoch": 964} {"train_loss": -10.949141502380371, "global_step": 162107, "epoch": 964} {"train_loss": -10.516983985900879, "global_step": 162108, "epoch": 964} {"train_loss": -10.869840621948242, "global_step": 162109, "epoch": 964} {"train_loss": -10.89791202545166, "global_step": 162110, "epoch": 964} {"train_loss": -10.456382751464844, "global_step": 162111, "epoch": 964} {"train_loss": -10.995197296142578, "global_step": 162112, "epoch": 964} {"train_loss": -10.692877769470215, "global_step": 162113, "epoch": 964} {"train_loss": -10.88347339630127, "global_step": 162114, "epoch": 964} {"train_loss": -10.79023551940918, "global_step": 162115, "epoch": 964} {"train_loss": -10.479711532592773, "global_step": 162116, "epoch": 964} {"train_loss": -10.509224891662598, "global_step": 162117, "epoch": 964} {"train_loss": -10.488901138305664, "global_step": 162118, "epoch": 964} {"train_loss": -10.880837451843988, "global_step": 162119, "epoch": 964, "val_loss": 237554.96875} {"train_loss": -10.315912246704102, "global_step": 162120, "epoch": 965} {"train_loss": -11.259038925170898, "global_step": 162121, "epoch": 965} {"train_loss": -10.467475891113281, "global_step": 162122, "epoch": 965} {"train_loss": -10.807655334472656, "global_step": 162123, "epoch": 965} {"train_loss": -10.578471183776855, "global_step": 162124, "epoch": 965} {"train_loss": -10.462591171264648, "global_step": 162125, "epoch": 965} {"train_loss": -10.899368286132812, "global_step": 162126, "epoch": 965} {"train_loss": -10.611053466796875, "global_step": 162127, "epoch": 965} {"train_loss": -11.166482925415039, "global_step": 162128, "epoch": 965} {"train_loss": -10.907529830932617, "global_step": 162129, "epoch": 965} {"train_loss": -11.103322982788086, "global_step": 162130, "epoch": 965} {"train_loss": -10.843497276306152, "global_step": 162131, "epoch": 965} {"train_loss": -10.889925003051758, "global_step": 162132, "epoch": 965} {"train_loss": -11.085227966308594, "global_step": 162133, "epoch": 965} {"train_loss": -10.849925994873047, "global_step": 162134, "epoch": 965} {"train_loss": -10.927045822143555, "global_step": 162135, "epoch": 965} {"train_loss": -11.128040313720703, "global_step": 162136, "epoch": 965} {"train_loss": -11.076517105102539, "global_step": 162137, "epoch": 965} {"train_loss": -10.795553207397461, "global_step": 162138, "epoch": 965} {"train_loss": -11.199095726013184, "global_step": 162139, "epoch": 965} {"train_loss": -11.284282684326172, "global_step": 162140, "epoch": 965} {"train_loss": -10.965337753295898, "global_step": 162141, "epoch": 965} {"train_loss": -10.90160846710205, "global_step": 162142, "epoch": 965} {"train_loss": -11.207143783569336, "global_step": 162143, "epoch": 965} {"train_loss": -11.119384765625, "global_step": 162144, "epoch": 965} {"train_loss": -11.046401023864746, "global_step": 162145, "epoch": 965} {"train_loss": -11.059370994567871, "global_step": 162146, "epoch": 965} {"train_loss": -11.011589050292969, "global_step": 162147, "epoch": 965} {"train_loss": -11.102819442749023, "global_step": 162148, "epoch": 965} {"train_loss": -11.09245491027832, "global_step": 162149, "epoch": 965} {"train_loss": -10.90081787109375, "global_step": 162150, "epoch": 965} {"train_loss": -11.087353706359863, "global_step": 162151, "epoch": 965} {"train_loss": -11.245752334594727, "global_step": 162152, "epoch": 965} {"train_loss": -11.128436088562012, "global_step": 162153, "epoch": 965} {"train_loss": -11.290529251098633, "global_step": 162154, "epoch": 965} {"train_loss": -10.943318367004395, "global_step": 162155, "epoch": 965} {"train_loss": -11.284017562866211, "global_step": 162156, "epoch": 965} {"train_loss": -11.113640785217285, "global_step": 162157, "epoch": 965} {"train_loss": -11.278793334960938, "global_step": 162158, "epoch": 965} {"train_loss": -10.858434677124023, "global_step": 162159, "epoch": 965} {"train_loss": -10.991083145141602, "global_step": 162160, "epoch": 965} {"train_loss": -10.543623924255371, "global_step": 162161, "epoch": 965} {"train_loss": -10.901116371154785, "global_step": 162162, "epoch": 965} {"train_loss": -10.663694381713867, "global_step": 162163, "epoch": 965} {"train_loss": -10.943888664245605, "global_step": 162164, "epoch": 965} {"train_loss": -10.516672134399414, "global_step": 162165, "epoch": 965} {"train_loss": -10.63637924194336, "global_step": 162166, "epoch": 965} {"train_loss": -10.858682632446289, "global_step": 162167, "epoch": 965} {"train_loss": -10.12044620513916, "global_step": 162168, "epoch": 965} {"train_loss": -10.250682830810547, "global_step": 162169, "epoch": 965} {"train_loss": -10.81688117980957, "global_step": 162170, "epoch": 965} {"train_loss": -10.939070701599121, "global_step": 162171, "epoch": 965} {"train_loss": -10.468969345092773, "global_step": 162172, "epoch": 965} {"train_loss": -11.170486450195312, "global_step": 162173, "epoch": 965} {"train_loss": -10.65762710571289, "global_step": 162174, "epoch": 965} {"train_loss": -11.096549987792969, "global_step": 162175, "epoch": 965} {"train_loss": -10.638566970825195, "global_step": 162176, "epoch": 965} {"train_loss": -11.091511726379395, "global_step": 162177, "epoch": 965} {"train_loss": -10.728246688842773, "global_step": 162178, "epoch": 965} {"train_loss": -10.560723304748535, "global_step": 162179, "epoch": 965} {"train_loss": -11.06866455078125, "global_step": 162180, "epoch": 965} {"train_loss": -10.36000919342041, "global_step": 162181, "epoch": 965} {"train_loss": -10.744625091552734, "global_step": 162182, "epoch": 965} {"train_loss": -10.724811553955078, "global_step": 162183, "epoch": 965} {"train_loss": -10.494114875793457, "global_step": 162184, "epoch": 965} {"train_loss": -10.739388465881348, "global_step": 162185, "epoch": 965} {"train_loss": -10.697568893432617, "global_step": 162186, "epoch": 965} {"train_loss": -10.909943580627441, "global_step": 162187, "epoch": 965} {"train_loss": -10.718583106994629, "global_step": 162188, "epoch": 965} {"train_loss": -10.592958450317383, "global_step": 162189, "epoch": 965} {"train_loss": -10.626951217651367, "global_step": 162190, "epoch": 965} {"train_loss": -10.652320861816406, "global_step": 162191, "epoch": 965} {"train_loss": -10.826528549194336, "global_step": 162192, "epoch": 965} {"train_loss": -10.670906066894531, "global_step": 162193, "epoch": 965} {"train_loss": -10.474481582641602, "global_step": 162194, "epoch": 965} {"train_loss": -10.7875337600708, "global_step": 162195, "epoch": 965} {"train_loss": -10.781782150268555, "global_step": 162196, "epoch": 965} {"train_loss": -10.690645217895508, "global_step": 162197, "epoch": 965} {"train_loss": -10.29161548614502, "global_step": 162198, "epoch": 965} {"train_loss": -10.541614532470703, "global_step": 162199, "epoch": 965} {"train_loss": -10.748100280761719, "global_step": 162200, "epoch": 965} {"train_loss": -10.12730598449707, "global_step": 162201, "epoch": 965} {"train_loss": -10.75202465057373, "global_step": 162202, "epoch": 965} {"train_loss": -10.90720272064209, "global_step": 162203, "epoch": 965} {"train_loss": -10.381548881530762, "global_step": 162204, "epoch": 965} {"train_loss": -10.546972274780273, "global_step": 162205, "epoch": 965} {"train_loss": -10.045343399047852, "global_step": 162206, "epoch": 965} {"train_loss": -10.500036239624023, "global_step": 162207, "epoch": 965} {"train_loss": -10.424991607666016, "global_step": 162208, "epoch": 965} {"train_loss": -10.427310943603516, "global_step": 162209, "epoch": 965} {"train_loss": -10.72914981842041, "global_step": 162210, "epoch": 965} {"train_loss": -10.340120315551758, "global_step": 162211, "epoch": 965} {"train_loss": -10.795341491699219, "global_step": 162212, "epoch": 965} {"train_loss": -10.56817626953125, "global_step": 162213, "epoch": 965} {"train_loss": -10.892053604125977, "global_step": 162214, "epoch": 965} {"train_loss": -10.513786315917969, "global_step": 162215, "epoch": 965} {"train_loss": -10.800602912902832, "global_step": 162216, "epoch": 965} {"train_loss": -10.498103141784668, "global_step": 162217, "epoch": 965} {"train_loss": -10.63869857788086, "global_step": 162218, "epoch": 965} {"train_loss": -10.756925582885742, "global_step": 162219, "epoch": 965} {"train_loss": -10.555994033813477, "global_step": 162220, "epoch": 965} {"train_loss": -10.988300323486328, "global_step": 162221, "epoch": 965} {"train_loss": -10.359331130981445, "global_step": 162222, "epoch": 965} {"train_loss": -11.090632438659668, "global_step": 162223, "epoch": 965} {"train_loss": -10.83500862121582, "global_step": 162224, "epoch": 965} {"train_loss": -10.799381256103516, "global_step": 162225, "epoch": 965} {"train_loss": -10.820602416992188, "global_step": 162226, "epoch": 965} {"train_loss": -10.702823638916016, "global_step": 162227, "epoch": 965} {"train_loss": -10.7957124710083, "global_step": 162228, "epoch": 965} {"train_loss": -10.763307571411133, "global_step": 162229, "epoch": 965} {"train_loss": -10.915461540222168, "global_step": 162230, "epoch": 965} {"train_loss": -11.06057357788086, "global_step": 162231, "epoch": 965} {"train_loss": -10.863953590393066, "global_step": 162232, "epoch": 965} {"train_loss": -10.743510246276855, "global_step": 162233, "epoch": 965} {"train_loss": -10.913633346557617, "global_step": 162234, "epoch": 965} {"train_loss": -10.844463348388672, "global_step": 162235, "epoch": 965} {"train_loss": -11.207000732421875, "global_step": 162236, "epoch": 965} {"train_loss": -10.882589340209961, "global_step": 162237, "epoch": 965} {"train_loss": -10.978950500488281, "global_step": 162238, "epoch": 965} {"train_loss": -10.976577758789062, "global_step": 162239, "epoch": 965} {"train_loss": -11.020512580871582, "global_step": 162240, "epoch": 965} {"train_loss": -11.149820327758789, "global_step": 162241, "epoch": 965} {"train_loss": -10.904855728149414, "global_step": 162242, "epoch": 965} {"train_loss": -11.017675399780273, "global_step": 162243, "epoch": 965} {"train_loss": -10.875886917114258, "global_step": 162244, "epoch": 965} {"train_loss": -11.160255432128906, "global_step": 162245, "epoch": 965} {"train_loss": -10.892974853515625, "global_step": 162246, "epoch": 965} {"train_loss": -10.889168739318848, "global_step": 162247, "epoch": 965} {"train_loss": -10.97790813446045, "global_step": 162248, "epoch": 965} {"train_loss": -10.8994140625, "global_step": 162249, "epoch": 965} {"train_loss": -11.045169830322266, "global_step": 162250, "epoch": 965} {"train_loss": -11.174039840698242, "global_step": 162251, "epoch": 965} {"train_loss": -11.02175235748291, "global_step": 162252, "epoch": 965} {"train_loss": -10.956863403320312, "global_step": 162253, "epoch": 965} {"train_loss": -11.138157844543457, "global_step": 162254, "epoch": 965} {"train_loss": -11.102277755737305, "global_step": 162255, "epoch": 965} {"train_loss": -11.405258178710938, "global_step": 162256, "epoch": 965} {"train_loss": -10.96010971069336, "global_step": 162257, "epoch": 965} {"train_loss": -11.215553283691406, "global_step": 162258, "epoch": 965} {"train_loss": -11.138399124145508, "global_step": 162259, "epoch": 965} {"train_loss": -10.78236198425293, "global_step": 162260, "epoch": 965} {"train_loss": -10.854957580566406, "global_step": 162261, "epoch": 965} {"train_loss": -10.980598449707031, "global_step": 162262, "epoch": 965} {"train_loss": -10.647965431213379, "global_step": 162263, "epoch": 965} {"train_loss": -10.927289962768555, "global_step": 162264, "epoch": 965} {"train_loss": -11.045553207397461, "global_step": 162265, "epoch": 965} {"train_loss": -10.480785369873047, "global_step": 162266, "epoch": 965} {"train_loss": -10.512088775634766, "global_step": 162267, "epoch": 965} {"train_loss": -11.039216041564941, "global_step": 162268, "epoch": 965} {"train_loss": -10.34521484375, "global_step": 162269, "epoch": 965} {"train_loss": -10.629446029663086, "global_step": 162270, "epoch": 965} {"train_loss": -11.133888244628906, "global_step": 162271, "epoch": 965} {"train_loss": -10.4963960647583, "global_step": 162272, "epoch": 965} {"train_loss": -11.194364547729492, "global_step": 162273, "epoch": 965} {"train_loss": -10.386842727661133, "global_step": 162274, "epoch": 965} {"train_loss": -11.152704238891602, "global_step": 162275, "epoch": 965} {"train_loss": -10.837288856506348, "global_step": 162276, "epoch": 965} {"train_loss": -10.600189208984375, "global_step": 162277, "epoch": 965} {"train_loss": -10.761475563049316, "global_step": 162278, "epoch": 965} {"train_loss": -10.760612487792969, "global_step": 162279, "epoch": 965} {"train_loss": -10.801054954528809, "global_step": 162280, "epoch": 965} {"train_loss": -9.70378303527832, "global_step": 162281, "epoch": 965} {"train_loss": -10.789535522460938, "global_step": 162282, "epoch": 965} {"train_loss": -10.428703308105469, "global_step": 162283, "epoch": 965} {"train_loss": -10.971068382263184, "global_step": 162284, "epoch": 965} {"train_loss": -10.283656120300293, "global_step": 162285, "epoch": 965} {"train_loss": -10.151981353759766, "global_step": 162286, "epoch": 965} {"train_loss": -10.807967855816795, "global_step": 162287, "epoch": 965, "val_loss": 236629.21875, "train_action_mse_error": 2.764408588409424} {"train_loss": -9.696343421936035, "global_step": 162288, "epoch": 966} {"train_loss": -10.580568313598633, "global_step": 162289, "epoch": 966} {"train_loss": -10.34639835357666, "global_step": 162290, "epoch": 966} {"train_loss": -10.330673217773438, "global_step": 162291, "epoch": 966} {"train_loss": -10.420806884765625, "global_step": 162292, "epoch": 966} {"train_loss": -10.204122543334961, "global_step": 162293, "epoch": 966} {"train_loss": -10.314598083496094, "global_step": 162294, "epoch": 966} {"train_loss": -10.332106590270996, "global_step": 162295, "epoch": 966} {"train_loss": -10.201979637145996, "global_step": 162296, "epoch": 966} {"train_loss": -10.4132719039917, "global_step": 162297, "epoch": 966} {"train_loss": -10.427302360534668, "global_step": 162298, "epoch": 966} {"train_loss": -10.712221145629883, "global_step": 162299, "epoch": 966} {"train_loss": -10.542057037353516, "global_step": 162300, "epoch": 966} {"train_loss": -10.741785049438477, "global_step": 162301, "epoch": 966} {"train_loss": -10.562421798706055, "global_step": 162302, "epoch": 966} {"train_loss": -10.738879203796387, "global_step": 162303, "epoch": 966} {"train_loss": -10.917543411254883, "global_step": 162304, "epoch": 966} {"train_loss": -10.380956649780273, "global_step": 162305, "epoch": 966} {"train_loss": -10.822168350219727, "global_step": 162306, "epoch": 966} {"train_loss": -10.76909351348877, "global_step": 162307, "epoch": 966} {"train_loss": -10.53256893157959, "global_step": 162308, "epoch": 966} {"train_loss": -11.042200088500977, "global_step": 162309, "epoch": 966} {"train_loss": -10.691800117492676, "global_step": 162310, "epoch": 966} {"train_loss": -10.701536178588867, "global_step": 162311, "epoch": 966} {"train_loss": -10.782378196716309, "global_step": 162312, "epoch": 966} {"train_loss": -10.926315307617188, "global_step": 162313, "epoch": 966} {"train_loss": -11.112897872924805, "global_step": 162314, "epoch": 966} {"train_loss": -10.831573486328125, "global_step": 162315, "epoch": 966} {"train_loss": -10.81599235534668, "global_step": 162316, "epoch": 966} {"train_loss": -11.07082462310791, "global_step": 162317, "epoch": 966} {"train_loss": -10.936609268188477, "global_step": 162318, "epoch": 966} {"train_loss": -10.80146312713623, "global_step": 162319, "epoch": 966} {"train_loss": -10.961492538452148, "global_step": 162320, "epoch": 966} {"train_loss": -10.886726379394531, "global_step": 162321, "epoch": 966} {"train_loss": -11.01030158996582, "global_step": 162322, "epoch": 966} {"train_loss": -11.015010833740234, "global_step": 162323, "epoch": 966} {"train_loss": -11.018016815185547, "global_step": 162324, "epoch": 966} {"train_loss": -10.927075386047363, "global_step": 162325, "epoch": 966} {"train_loss": -11.020829200744629, "global_step": 162326, "epoch": 966} {"train_loss": -10.945940017700195, "global_step": 162327, "epoch": 966} {"train_loss": -10.945172309875488, "global_step": 162328, "epoch": 966} {"train_loss": -10.99227523803711, "global_step": 162329, "epoch": 966} {"train_loss": -10.706887245178223, "global_step": 162330, "epoch": 966} {"train_loss": -11.053570747375488, "global_step": 162331, "epoch": 966} {"train_loss": -10.965583801269531, "global_step": 162332, "epoch": 966} {"train_loss": -10.979736328125, "global_step": 162333, "epoch": 966} {"train_loss": -11.038475036621094, "global_step": 162334, "epoch": 966} {"train_loss": -11.183123588562012, "global_step": 162335, "epoch": 966} {"train_loss": -11.170215606689453, "global_step": 162336, "epoch": 966} {"train_loss": -11.130708694458008, "global_step": 162337, "epoch": 966} {"train_loss": -10.926210403442383, "global_step": 162338, "epoch": 966} {"train_loss": -11.13197135925293, "global_step": 162339, "epoch": 966} {"train_loss": -10.812963485717773, "global_step": 162340, "epoch": 966} {"train_loss": -11.23548412322998, "global_step": 162341, "epoch": 966} {"train_loss": -10.730836868286133, "global_step": 162342, "epoch": 966} {"train_loss": -11.171255111694336, "global_step": 162343, "epoch": 966} {"train_loss": -11.010120391845703, "global_step": 162344, "epoch": 966} {"train_loss": -11.054973602294922, "global_step": 162345, "epoch": 966} {"train_loss": -11.120918273925781, "global_step": 162346, "epoch": 966} {"train_loss": -11.252269744873047, "global_step": 162347, "epoch": 966} {"train_loss": -11.314868927001953, "global_step": 162348, "epoch": 966} {"train_loss": -11.28848934173584, "global_step": 162349, "epoch": 966} {"train_loss": -11.070218086242676, "global_step": 162350, "epoch": 966} {"train_loss": -11.29603385925293, "global_step": 162351, "epoch": 966} {"train_loss": -10.866146087646484, "global_step": 162352, "epoch": 966} {"train_loss": -11.336858749389648, "global_step": 162353, "epoch": 966} {"train_loss": -11.163116455078125, "global_step": 162354, "epoch": 966} {"train_loss": -10.994965553283691, "global_step": 162355, "epoch": 966} {"train_loss": -11.327924728393555, "global_step": 162356, "epoch": 966} {"train_loss": -11.144598007202148, "global_step": 162357, "epoch": 966} {"train_loss": -11.14303970336914, "global_step": 162358, "epoch": 966} {"train_loss": -11.39420223236084, "global_step": 162359, "epoch": 966} {"train_loss": -10.744852066040039, "global_step": 162360, "epoch": 966} {"train_loss": -11.21749496459961, "global_step": 162361, "epoch": 966} {"train_loss": -11.230417251586914, "global_step": 162362, "epoch": 966} {"train_loss": -10.801008224487305, "global_step": 162363, "epoch": 966} {"train_loss": -11.317829132080078, "global_step": 162364, "epoch": 966} {"train_loss": -10.808917999267578, "global_step": 162365, "epoch": 966} {"train_loss": -10.951791763305664, "global_step": 162366, "epoch": 966} {"train_loss": -10.941156387329102, "global_step": 162367, "epoch": 966} {"train_loss": -10.205607414245605, "global_step": 162368, "epoch": 966} {"train_loss": -9.928756713867188, "global_step": 162369, "epoch": 966} {"train_loss": -10.580678939819336, "global_step": 162370, "epoch": 966} {"train_loss": -10.268083572387695, "global_step": 162371, "epoch": 966} {"train_loss": -10.242876052856445, "global_step": 162372, "epoch": 966} {"train_loss": -9.903106689453125, "global_step": 162373, "epoch": 966} {"train_loss": -10.22031021118164, "global_step": 162374, "epoch": 966} {"train_loss": -10.666791915893555, "global_step": 162375, "epoch": 966} {"train_loss": -9.50274658203125, "global_step": 162376, "epoch": 966} {"train_loss": -10.55384635925293, "global_step": 162377, "epoch": 966} {"train_loss": -9.84427261352539, "global_step": 162378, "epoch": 966} {"train_loss": -9.87272834777832, "global_step": 162379, "epoch": 966} {"train_loss": -10.518352508544922, "global_step": 162380, "epoch": 966} {"train_loss": -10.66441535949707, "global_step": 162381, "epoch": 966} {"train_loss": -10.527928352355957, "global_step": 162382, "epoch": 966} {"train_loss": -10.50860595703125, "global_step": 162383, "epoch": 966} {"train_loss": -9.994108200073242, "global_step": 162384, "epoch": 966} {"train_loss": -10.744431495666504, "global_step": 162385, "epoch": 966} {"train_loss": -10.73202896118164, "global_step": 162386, "epoch": 966} {"train_loss": -10.915550231933594, "global_step": 162387, "epoch": 966} {"train_loss": -10.769380569458008, "global_step": 162388, "epoch": 966} {"train_loss": -10.550252914428711, "global_step": 162389, "epoch": 966} {"train_loss": -10.754432678222656, "global_step": 162390, "epoch": 966} {"train_loss": -10.664651870727539, "global_step": 162391, "epoch": 966} {"train_loss": -10.929925918579102, "global_step": 162392, "epoch": 966} {"train_loss": -10.65848159790039, "global_step": 162393, "epoch": 966} {"train_loss": -10.707487106323242, "global_step": 162394, "epoch": 966} {"train_loss": -10.651372909545898, "global_step": 162395, "epoch": 966} {"train_loss": -10.915532112121582, "global_step": 162396, "epoch": 966} {"train_loss": -10.332000732421875, "global_step": 162397, "epoch": 966} {"train_loss": -10.990755081176758, "global_step": 162398, "epoch": 966} {"train_loss": -10.194330215454102, "global_step": 162399, "epoch": 966} {"train_loss": -10.561338424682617, "global_step": 162400, "epoch": 966} {"train_loss": -10.640907287597656, "global_step": 162401, "epoch": 966} {"train_loss": -10.601089477539062, "global_step": 162402, "epoch": 966} {"train_loss": -10.693116188049316, "global_step": 162403, "epoch": 966} {"train_loss": -10.76560115814209, "global_step": 162404, "epoch": 966} {"train_loss": -10.560648918151855, "global_step": 162405, "epoch": 966} {"train_loss": -10.56190299987793, "global_step": 162406, "epoch": 966} {"train_loss": -10.90738582611084, "global_step": 162407, "epoch": 966} {"train_loss": -10.62820053100586, "global_step": 162408, "epoch": 966} {"train_loss": -10.680097579956055, "global_step": 162409, "epoch": 966} {"train_loss": -10.483190536499023, "global_step": 162410, "epoch": 966} {"train_loss": -10.735953330993652, "global_step": 162411, "epoch": 966} {"train_loss": -10.914934158325195, "global_step": 162412, "epoch": 966} {"train_loss": -10.619667053222656, "global_step": 162413, "epoch": 966} {"train_loss": -10.63025188446045, "global_step": 162414, "epoch": 966} {"train_loss": -10.753129959106445, "global_step": 162415, "epoch": 966} {"train_loss": -10.917295455932617, "global_step": 162416, "epoch": 966} {"train_loss": -10.681878089904785, "global_step": 162417, "epoch": 966} {"train_loss": -10.674796104431152, "global_step": 162418, "epoch": 966} {"train_loss": -10.765392303466797, "global_step": 162419, "epoch": 966} {"train_loss": -11.182411193847656, "global_step": 162420, "epoch": 966} {"train_loss": -11.05246639251709, "global_step": 162421, "epoch": 966} {"train_loss": -10.687496185302734, "global_step": 162422, "epoch": 966} {"train_loss": -10.866669654846191, "global_step": 162423, "epoch": 966} {"train_loss": -10.973995208740234, "global_step": 162424, "epoch": 966} {"train_loss": -10.569894790649414, "global_step": 162425, "epoch": 966} {"train_loss": -11.283148765563965, "global_step": 162426, "epoch": 966} {"train_loss": -10.71400260925293, "global_step": 162427, "epoch": 966} {"train_loss": -10.7049560546875, "global_step": 162428, "epoch": 966} {"train_loss": -11.0189208984375, "global_step": 162429, "epoch": 966} {"train_loss": -10.801356315612793, "global_step": 162430, "epoch": 966} {"train_loss": -11.039268493652344, "global_step": 162431, "epoch": 966} {"train_loss": -10.882999420166016, "global_step": 162432, "epoch": 966} {"train_loss": -11.066864013671875, "global_step": 162433, "epoch": 966} {"train_loss": -11.011215209960938, "global_step": 162434, "epoch": 966} {"train_loss": -10.862792015075684, "global_step": 162435, "epoch": 966} {"train_loss": -10.877519607543945, "global_step": 162436, "epoch": 966} {"train_loss": -11.058547019958496, "global_step": 162437, "epoch": 966} {"train_loss": -11.214649200439453, "global_step": 162438, "epoch": 966} {"train_loss": -11.254547119140625, "global_step": 162439, "epoch": 966} {"train_loss": -10.924571990966797, "global_step": 162440, "epoch": 966} {"train_loss": -10.982842445373535, "global_step": 162441, "epoch": 966} {"train_loss": -10.940483093261719, "global_step": 162442, "epoch": 966} {"train_loss": -10.975034713745117, "global_step": 162443, "epoch": 966} {"train_loss": -10.715152740478516, "global_step": 162444, "epoch": 966} {"train_loss": -11.175334930419922, "global_step": 162445, "epoch": 966} {"train_loss": -11.059707641601562, "global_step": 162446, "epoch": 966} {"train_loss": -10.922861099243164, "global_step": 162447, "epoch": 966} {"train_loss": -10.831502914428711, "global_step": 162448, "epoch": 966} {"train_loss": -11.014543533325195, "global_step": 162449, "epoch": 966} {"train_loss": -10.71945858001709, "global_step": 162450, "epoch": 966} {"train_loss": -10.698812484741211, "global_step": 162451, "epoch": 966} {"train_loss": -11.179058074951172, "global_step": 162452, "epoch": 966} {"train_loss": -10.646817207336426, "global_step": 162453, "epoch": 966} {"train_loss": -10.437103271484375, "global_step": 162454, "epoch": 966} {"train_loss": -10.784564245314826, "global_step": 162455, "epoch": 966, "val_loss": 234675.390625} {"train_loss": -11.042859077453613, "global_step": 162456, "epoch": 967} {"train_loss": -10.514715194702148, "global_step": 162457, "epoch": 967} {"train_loss": -11.159208297729492, "global_step": 162458, "epoch": 967} {"train_loss": -10.383176803588867, "global_step": 162459, "epoch": 967} {"train_loss": -10.85501480102539, "global_step": 162460, "epoch": 967} {"train_loss": -11.250028610229492, "global_step": 162461, "epoch": 967} {"train_loss": -10.36886215209961, "global_step": 162462, "epoch": 967} {"train_loss": -11.036197662353516, "global_step": 162463, "epoch": 967} {"train_loss": -10.933267593383789, "global_step": 162464, "epoch": 967} {"train_loss": -10.976438522338867, "global_step": 162465, "epoch": 967} {"train_loss": -10.945890426635742, "global_step": 162466, "epoch": 967} {"train_loss": -10.835660934448242, "global_step": 162467, "epoch": 967} {"train_loss": -10.528635025024414, "global_step": 162468, "epoch": 967} {"train_loss": -11.018982887268066, "global_step": 162469, "epoch": 967} {"train_loss": -10.714999198913574, "global_step": 162470, "epoch": 967} {"train_loss": -10.580133438110352, "global_step": 162471, "epoch": 967} {"train_loss": -10.250520706176758, "global_step": 162472, "epoch": 967} {"train_loss": -9.52853775024414, "global_step": 162473, "epoch": 967} {"train_loss": -10.592035293579102, "global_step": 162474, "epoch": 967} {"train_loss": -9.469738006591797, "global_step": 162475, "epoch": 967} {"train_loss": -10.778233528137207, "global_step": 162476, "epoch": 967} {"train_loss": -10.381979942321777, "global_step": 162477, "epoch": 967} {"train_loss": -10.22450065612793, "global_step": 162478, "epoch": 967} {"train_loss": -11.079183578491211, "global_step": 162479, "epoch": 967} {"train_loss": -10.183889389038086, "global_step": 162480, "epoch": 967} {"train_loss": -10.79212760925293, "global_step": 162481, "epoch": 967} {"train_loss": -10.838300704956055, "global_step": 162482, "epoch": 967} {"train_loss": -10.857224464416504, "global_step": 162483, "epoch": 967} {"train_loss": -10.733112335205078, "global_step": 162484, "epoch": 967} {"train_loss": -10.768150329589844, "global_step": 162485, "epoch": 967} {"train_loss": -10.789745330810547, "global_step": 162486, "epoch": 967} {"train_loss": -10.881071090698242, "global_step": 162487, "epoch": 967} {"train_loss": -10.7969388961792, "global_step": 162488, "epoch": 967} {"train_loss": -11.042622566223145, "global_step": 162489, "epoch": 967} {"train_loss": -10.779592514038086, "global_step": 162490, "epoch": 967} {"train_loss": -10.647665023803711, "global_step": 162491, "epoch": 967} {"train_loss": -10.817819595336914, "global_step": 162492, "epoch": 967} {"train_loss": -11.000411033630371, "global_step": 162493, "epoch": 967} {"train_loss": -10.933436393737793, "global_step": 162494, "epoch": 967} {"train_loss": -11.032089233398438, "global_step": 162495, "epoch": 967} {"train_loss": -10.733650207519531, "global_step": 162496, "epoch": 967} {"train_loss": -10.836912155151367, "global_step": 162497, "epoch": 967} {"train_loss": -10.734376907348633, "global_step": 162498, "epoch": 967} {"train_loss": -10.70997428894043, "global_step": 162499, "epoch": 967} {"train_loss": -10.731096267700195, "global_step": 162500, "epoch": 967} {"train_loss": -10.433538436889648, "global_step": 162501, "epoch": 967} {"train_loss": -10.478853225708008, "global_step": 162502, "epoch": 967} {"train_loss": -10.712617874145508, "global_step": 162503, "epoch": 967} {"train_loss": -10.729874610900879, "global_step": 162504, "epoch": 967} {"train_loss": -10.552560806274414, "global_step": 162505, "epoch": 967} {"train_loss": -10.977517127990723, "global_step": 162506, "epoch": 967} {"train_loss": -10.859352111816406, "global_step": 162507, "epoch": 967} {"train_loss": -10.49850845336914, "global_step": 162508, "epoch": 967} {"train_loss": -11.094564437866211, "global_step": 162509, "epoch": 967} {"train_loss": -10.752593040466309, "global_step": 162510, "epoch": 967} {"train_loss": -10.88685417175293, "global_step": 162511, "epoch": 967} {"train_loss": -10.91826057434082, "global_step": 162512, "epoch": 967} {"train_loss": -10.928668975830078, "global_step": 162513, "epoch": 967} {"train_loss": -11.052922248840332, "global_step": 162514, "epoch": 967} {"train_loss": -10.981014251708984, "global_step": 162515, "epoch": 967} {"train_loss": -11.021549224853516, "global_step": 162516, "epoch": 967} {"train_loss": -10.977398872375488, "global_step": 162517, "epoch": 967} {"train_loss": -11.013113021850586, "global_step": 162518, "epoch": 967} {"train_loss": -11.009471893310547, "global_step": 162519, "epoch": 967} {"train_loss": -11.151798248291016, "global_step": 162520, "epoch": 967} {"train_loss": -11.049302101135254, "global_step": 162521, "epoch": 967} {"train_loss": -11.185977935791016, "global_step": 162522, "epoch": 967} {"train_loss": -11.166473388671875, "global_step": 162523, "epoch": 967} {"train_loss": -10.888517379760742, "global_step": 162524, "epoch": 967} {"train_loss": -11.266799926757812, "global_step": 162525, "epoch": 967} {"train_loss": -11.253240585327148, "global_step": 162526, "epoch": 967} {"train_loss": -11.011690139770508, "global_step": 162527, "epoch": 967} {"train_loss": -11.433433532714844, "global_step": 162528, "epoch": 967} {"train_loss": -10.969752311706543, "global_step": 162529, "epoch": 967} {"train_loss": -11.012909889221191, "global_step": 162530, "epoch": 967} {"train_loss": -11.019769668579102, "global_step": 162531, "epoch": 967} {"train_loss": -11.142831802368164, "global_step": 162532, "epoch": 967} {"train_loss": -11.108999252319336, "global_step": 162533, "epoch": 967} {"train_loss": -11.340604782104492, "global_step": 162534, "epoch": 967} {"train_loss": -11.226581573486328, "global_step": 162535, "epoch": 967} {"train_loss": -11.173566818237305, "global_step": 162536, "epoch": 967} {"train_loss": -10.913171768188477, "global_step": 162537, "epoch": 967} {"train_loss": -11.121578216552734, "global_step": 162538, "epoch": 967} {"train_loss": -11.257902145385742, "global_step": 162539, "epoch": 967} {"train_loss": -11.18736457824707, "global_step": 162540, "epoch": 967} {"train_loss": -11.361109733581543, "global_step": 162541, "epoch": 967} {"train_loss": -11.316520690917969, "global_step": 162542, "epoch": 967} {"train_loss": -11.292993545532227, "global_step": 162543, "epoch": 967} {"train_loss": -11.011690139770508, "global_step": 162544, "epoch": 967} {"train_loss": -11.161580085754395, "global_step": 162545, "epoch": 967} {"train_loss": -10.724444389343262, "global_step": 162546, "epoch": 967} {"train_loss": -10.99055004119873, "global_step": 162547, "epoch": 967} {"train_loss": -11.181766510009766, "global_step": 162548, "epoch": 967} {"train_loss": -10.710664749145508, "global_step": 162549, "epoch": 967} {"train_loss": -10.768539428710938, "global_step": 162550, "epoch": 967} {"train_loss": -10.684211730957031, "global_step": 162551, "epoch": 967} {"train_loss": -10.848642349243164, "global_step": 162552, "epoch": 967} {"train_loss": -10.545646667480469, "global_step": 162553, "epoch": 967} {"train_loss": -10.915672302246094, "global_step": 162554, "epoch": 967} {"train_loss": -10.757768630981445, "global_step": 162555, "epoch": 967} {"train_loss": -10.934309005737305, "global_step": 162556, "epoch": 967} {"train_loss": -10.855437278747559, "global_step": 162557, "epoch": 967} {"train_loss": -10.662708282470703, "global_step": 162558, "epoch": 967} {"train_loss": -11.066732406616211, "global_step": 162559, "epoch": 967} {"train_loss": -10.910581588745117, "global_step": 162560, "epoch": 967} {"train_loss": -10.553753852844238, "global_step": 162561, "epoch": 967} {"train_loss": -10.416130065917969, "global_step": 162562, "epoch": 967} {"train_loss": -10.37321662902832, "global_step": 162563, "epoch": 967} {"train_loss": -10.020471572875977, "global_step": 162564, "epoch": 967} {"train_loss": -10.101380348205566, "global_step": 162565, "epoch": 967} {"train_loss": -10.535469055175781, "global_step": 162566, "epoch": 967} {"train_loss": -9.027196884155273, "global_step": 162567, "epoch": 967} {"train_loss": -9.559389114379883, "global_step": 162568, "epoch": 967} {"train_loss": -9.088616371154785, "global_step": 162569, "epoch": 967} {"train_loss": -9.647443771362305, "global_step": 162570, "epoch": 967} {"train_loss": -10.004277229309082, "global_step": 162571, "epoch": 967} {"train_loss": -10.153642654418945, "global_step": 162572, "epoch": 967} {"train_loss": -9.96879768371582, "global_step": 162573, "epoch": 967} {"train_loss": -10.576050758361816, "global_step": 162574, "epoch": 967} {"train_loss": -10.234070777893066, "global_step": 162575, "epoch": 967} {"train_loss": -10.391355514526367, "global_step": 162576, "epoch": 967} {"train_loss": -10.747112274169922, "global_step": 162577, "epoch": 967} {"train_loss": -10.363146781921387, "global_step": 162578, "epoch": 967} {"train_loss": -10.40634822845459, "global_step": 162579, "epoch": 967} {"train_loss": -10.98187255859375, "global_step": 162580, "epoch": 967} {"train_loss": -10.303730010986328, "global_step": 162581, "epoch": 967} {"train_loss": -10.084030151367188, "global_step": 162582, "epoch": 967} {"train_loss": -10.489513397216797, "global_step": 162583, "epoch": 967} {"train_loss": -10.308425903320312, "global_step": 162584, "epoch": 967} {"train_loss": -10.11172866821289, "global_step": 162585, "epoch": 967} {"train_loss": -10.187458992004395, "global_step": 162586, "epoch": 967} {"train_loss": -10.476487159729004, "global_step": 162587, "epoch": 967} {"train_loss": -9.484859466552734, "global_step": 162588, "epoch": 967} {"train_loss": -10.839445114135742, "global_step": 162589, "epoch": 967} {"train_loss": -10.13157844543457, "global_step": 162590, "epoch": 967} {"train_loss": -9.52155876159668, "global_step": 162591, "epoch": 967} {"train_loss": -10.688438415527344, "global_step": 162592, "epoch": 967} {"train_loss": -10.21870231628418, "global_step": 162593, "epoch": 967} {"train_loss": -10.418420791625977, "global_step": 162594, "epoch": 967} {"train_loss": -10.435994148254395, "global_step": 162595, "epoch": 967} {"train_loss": -10.584394454956055, "global_step": 162596, "epoch": 967} {"train_loss": -10.339130401611328, "global_step": 162597, "epoch": 967} {"train_loss": -10.827887535095215, "global_step": 162598, "epoch": 967} {"train_loss": -10.83620834350586, "global_step": 162599, "epoch": 967} {"train_loss": -10.520591735839844, "global_step": 162600, "epoch": 967} {"train_loss": -10.636930465698242, "global_step": 162601, "epoch": 967} {"train_loss": -10.62043285369873, "global_step": 162602, "epoch": 967} {"train_loss": -10.748154640197754, "global_step": 162603, "epoch": 967} {"train_loss": -10.531152725219727, "global_step": 162604, "epoch": 967} {"train_loss": -10.977216720581055, "global_step": 162605, "epoch": 967} {"train_loss": -10.776371002197266, "global_step": 162606, "epoch": 967} {"train_loss": -10.918855667114258, "global_step": 162607, "epoch": 967} {"train_loss": -10.717196464538574, "global_step": 162608, "epoch": 967} {"train_loss": -10.970802307128906, "global_step": 162609, "epoch": 967} {"train_loss": -10.746028900146484, "global_step": 162610, "epoch": 967} {"train_loss": -10.930670738220215, "global_step": 162611, "epoch": 967} {"train_loss": -10.953132629394531, "global_step": 162612, "epoch": 967} {"train_loss": -11.014023780822754, "global_step": 162613, "epoch": 967} {"train_loss": -10.977489471435547, "global_step": 162614, "epoch": 967} {"train_loss": -10.77955436706543, "global_step": 162615, "epoch": 967} {"train_loss": -11.023651123046875, "global_step": 162616, "epoch": 967} {"train_loss": -10.964073181152344, "global_step": 162617, "epoch": 967} {"train_loss": -11.003898620605469, "global_step": 162618, "epoch": 967} {"train_loss": -10.835999488830566, "global_step": 162619, "epoch": 967} {"train_loss": -11.113277435302734, "global_step": 162620, "epoch": 967} {"train_loss": -11.132208824157715, "global_step": 162621, "epoch": 967} {"train_loss": -10.9541015625, "global_step": 162622, "epoch": 967} {"train_loss": -10.720163850557237, "global_step": 162623, "epoch": 967, "val_loss": 235993.546875} {"train_loss": -10.880247116088867, "global_step": 162624, "epoch": 968} {"train_loss": -10.925909042358398, "global_step": 162625, "epoch": 968} {"train_loss": -10.894201278686523, "global_step": 162626, "epoch": 968} {"train_loss": -10.818594932556152, "global_step": 162627, "epoch": 968} {"train_loss": -10.874754905700684, "global_step": 162628, "epoch": 968} {"train_loss": -11.007118225097656, "global_step": 162629, "epoch": 968} {"train_loss": -10.75442123413086, "global_step": 162630, "epoch": 968} {"train_loss": -10.601396560668945, "global_step": 162631, "epoch": 968} {"train_loss": -10.902603149414062, "global_step": 162632, "epoch": 968} {"train_loss": -10.786874771118164, "global_step": 162633, "epoch": 968} {"train_loss": -11.178577423095703, "global_step": 162634, "epoch": 968} {"train_loss": -11.017019271850586, "global_step": 162635, "epoch": 968} {"train_loss": -10.753959655761719, "global_step": 162636, "epoch": 968} {"train_loss": -10.899988174438477, "global_step": 162637, "epoch": 968} {"train_loss": -10.970083236694336, "global_step": 162638, "epoch": 968} {"train_loss": -10.710921287536621, "global_step": 162639, "epoch": 968} {"train_loss": -10.457292556762695, "global_step": 162640, "epoch": 968} {"train_loss": -10.790969848632812, "global_step": 162641, "epoch": 968} {"train_loss": -10.204401016235352, "global_step": 162642, "epoch": 968} {"train_loss": -10.20792007446289, "global_step": 162643, "epoch": 968} {"train_loss": -11.032404899597168, "global_step": 162644, "epoch": 968} {"train_loss": -10.155531883239746, "global_step": 162645, "epoch": 968} {"train_loss": -10.800904273986816, "global_step": 162646, "epoch": 968} {"train_loss": -10.475882530212402, "global_step": 162647, "epoch": 968} {"train_loss": -10.522300720214844, "global_step": 162648, "epoch": 968} {"train_loss": -11.211614608764648, "global_step": 162649, "epoch": 968} {"train_loss": -10.314926147460938, "global_step": 162650, "epoch": 968} {"train_loss": -10.785626411437988, "global_step": 162651, "epoch": 968} {"train_loss": -10.24724006652832, "global_step": 162652, "epoch": 968} {"train_loss": -10.900565147399902, "global_step": 162653, "epoch": 968} {"train_loss": -10.199798583984375, "global_step": 162654, "epoch": 968} {"train_loss": -10.527690887451172, "global_step": 162655, "epoch": 968} {"train_loss": -10.784173965454102, "global_step": 162656, "epoch": 968} {"train_loss": -10.31308650970459, "global_step": 162657, "epoch": 968} {"train_loss": -10.456175804138184, "global_step": 162658, "epoch": 968} {"train_loss": -10.700153350830078, "global_step": 162659, "epoch": 968} {"train_loss": -10.294078826904297, "global_step": 162660, "epoch": 968} {"train_loss": -10.89988899230957, "global_step": 162661, "epoch": 968} {"train_loss": -10.454331398010254, "global_step": 162662, "epoch": 968} {"train_loss": -10.848345756530762, "global_step": 162663, "epoch": 968} {"train_loss": -10.363289833068848, "global_step": 162664, "epoch": 968} {"train_loss": -10.620660781860352, "global_step": 162665, "epoch": 968} {"train_loss": -10.252479553222656, "global_step": 162666, "epoch": 968} {"train_loss": -10.628334045410156, "global_step": 162667, "epoch": 968} {"train_loss": -10.226394653320312, "global_step": 162668, "epoch": 968} {"train_loss": -10.652427673339844, "global_step": 162669, "epoch": 968} {"train_loss": -10.324492454528809, "global_step": 162670, "epoch": 968} {"train_loss": -11.013934135437012, "global_step": 162671, "epoch": 968} {"train_loss": -10.621086120605469, "global_step": 162672, "epoch": 968} {"train_loss": -11.074660301208496, "global_step": 162673, "epoch": 968} {"train_loss": -10.684776306152344, "global_step": 162674, "epoch": 968} {"train_loss": -10.774612426757812, "global_step": 162675, "epoch": 968} {"train_loss": -10.651498794555664, "global_step": 162676, "epoch": 968} {"train_loss": -10.811830520629883, "global_step": 162677, "epoch": 968} {"train_loss": -10.708740234375, "global_step": 162678, "epoch": 968} {"train_loss": -10.812324523925781, "global_step": 162679, "epoch": 968} {"train_loss": -10.73659896850586, "global_step": 162680, "epoch": 968} {"train_loss": -10.809133529663086, "global_step": 162681, "epoch": 968} {"train_loss": -11.0089111328125, "global_step": 162682, "epoch": 968} {"train_loss": -10.799755096435547, "global_step": 162683, "epoch": 968} {"train_loss": -10.919896125793457, "global_step": 162684, "epoch": 968} {"train_loss": -10.684218406677246, "global_step": 162685, "epoch": 968} {"train_loss": -10.830890655517578, "global_step": 162686, "epoch": 968} {"train_loss": -10.972007751464844, "global_step": 162687, "epoch": 968} {"train_loss": -10.91357421875, "global_step": 162688, "epoch": 968} {"train_loss": -10.923250198364258, "global_step": 162689, "epoch": 968} {"train_loss": -10.977424621582031, "global_step": 162690, "epoch": 968} {"train_loss": -10.725601196289062, "global_step": 162691, "epoch": 968} {"train_loss": -11.063253402709961, "global_step": 162692, "epoch": 968} {"train_loss": -11.153757095336914, "global_step": 162693, "epoch": 968} {"train_loss": -10.820301055908203, "global_step": 162694, "epoch": 968} {"train_loss": -10.921300888061523, "global_step": 162695, "epoch": 968} {"train_loss": -11.033613204956055, "global_step": 162696, "epoch": 968} {"train_loss": -10.514693260192871, "global_step": 162697, "epoch": 968} {"train_loss": -11.106822967529297, "global_step": 162698, "epoch": 968} {"train_loss": -10.899894714355469, "global_step": 162699, "epoch": 968} {"train_loss": -10.7705078125, "global_step": 162700, "epoch": 968} {"train_loss": -11.214567184448242, "global_step": 162701, "epoch": 968} {"train_loss": -11.051700592041016, "global_step": 162702, "epoch": 968} {"train_loss": -11.086862564086914, "global_step": 162703, "epoch": 968} {"train_loss": -10.95218563079834, "global_step": 162704, "epoch": 968} {"train_loss": -11.168327331542969, "global_step": 162705, "epoch": 968} {"train_loss": -10.888980865478516, "global_step": 162706, "epoch": 968} {"train_loss": -11.221471786499023, "global_step": 162707, "epoch": 968} {"train_loss": -11.03817367553711, "global_step": 162708, "epoch": 968} {"train_loss": -11.198110580444336, "global_step": 162709, "epoch": 968} {"train_loss": -10.841541290283203, "global_step": 162710, "epoch": 968} {"train_loss": -11.139333724975586, "global_step": 162711, "epoch": 968} {"train_loss": -10.949806213378906, "global_step": 162712, "epoch": 968} {"train_loss": -10.59264850616455, "global_step": 162713, "epoch": 968} {"train_loss": -11.109416961669922, "global_step": 162714, "epoch": 968} {"train_loss": -11.035056114196777, "global_step": 162715, "epoch": 968} {"train_loss": -11.126749038696289, "global_step": 162716, "epoch": 968} {"train_loss": -10.968887329101562, "global_step": 162717, "epoch": 968} {"train_loss": -11.354570388793945, "global_step": 162718, "epoch": 968} {"train_loss": -10.904523849487305, "global_step": 162719, "epoch": 968} {"train_loss": -11.050374984741211, "global_step": 162720, "epoch": 968} {"train_loss": -11.161215782165527, "global_step": 162721, "epoch": 968} {"train_loss": -10.990091323852539, "global_step": 162722, "epoch": 968} {"train_loss": -11.135194778442383, "global_step": 162723, "epoch": 968} {"train_loss": -10.957197189331055, "global_step": 162724, "epoch": 968} {"train_loss": -10.771052360534668, "global_step": 162725, "epoch": 968} {"train_loss": -10.485468864440918, "global_step": 162726, "epoch": 968} {"train_loss": -11.054492950439453, "global_step": 162727, "epoch": 968} {"train_loss": -10.387746810913086, "global_step": 162728, "epoch": 968} {"train_loss": -10.101900100708008, "global_step": 162729, "epoch": 968} {"train_loss": -10.366515159606934, "global_step": 162730, "epoch": 968} {"train_loss": -10.000199317932129, "global_step": 162731, "epoch": 968} {"train_loss": -9.996786117553711, "global_step": 162732, "epoch": 968} {"train_loss": -10.541486740112305, "global_step": 162733, "epoch": 968} {"train_loss": -10.913694381713867, "global_step": 162734, "epoch": 968} {"train_loss": -10.112428665161133, "global_step": 162735, "epoch": 968} {"train_loss": -10.9099760055542, "global_step": 162736, "epoch": 968} {"train_loss": -10.466596603393555, "global_step": 162737, "epoch": 968} {"train_loss": -10.957027435302734, "global_step": 162738, "epoch": 968} {"train_loss": -10.789704322814941, "global_step": 162739, "epoch": 968} {"train_loss": -10.553033828735352, "global_step": 162740, "epoch": 968} {"train_loss": -11.033178329467773, "global_step": 162741, "epoch": 968} {"train_loss": -10.733633995056152, "global_step": 162742, "epoch": 968} {"train_loss": -11.042350769042969, "global_step": 162743, "epoch": 968} {"train_loss": -10.398866653442383, "global_step": 162744, "epoch": 968} {"train_loss": -10.953389167785645, "global_step": 162745, "epoch": 968} {"train_loss": -10.47776985168457, "global_step": 162746, "epoch": 968} {"train_loss": -10.95610237121582, "global_step": 162747, "epoch": 968} {"train_loss": -10.781346321105957, "global_step": 162748, "epoch": 968} {"train_loss": -10.742595672607422, "global_step": 162749, "epoch": 968} {"train_loss": -10.784460067749023, "global_step": 162750, "epoch": 968} {"train_loss": -10.824874877929688, "global_step": 162751, "epoch": 968} {"train_loss": -10.817984580993652, "global_step": 162752, "epoch": 968} {"train_loss": -10.713011741638184, "global_step": 162753, "epoch": 968} {"train_loss": -11.00523567199707, "global_step": 162754, "epoch": 968} {"train_loss": -11.069869995117188, "global_step": 162755, "epoch": 968} {"train_loss": -10.786371231079102, "global_step": 162756, "epoch": 968} {"train_loss": -11.027429580688477, "global_step": 162757, "epoch": 968} {"train_loss": -10.625907897949219, "global_step": 162758, "epoch": 968} {"train_loss": -10.717060089111328, "global_step": 162759, "epoch": 968} {"train_loss": -11.132062911987305, "global_step": 162760, "epoch": 968} {"train_loss": -10.839227676391602, "global_step": 162761, "epoch": 968} {"train_loss": -10.884427070617676, "global_step": 162762, "epoch": 968} {"train_loss": -10.892316818237305, "global_step": 162763, "epoch": 968} {"train_loss": -10.976699829101562, "global_step": 162764, "epoch": 968} {"train_loss": -10.816787719726562, "global_step": 162765, "epoch": 968} {"train_loss": -10.85647964477539, "global_step": 162766, "epoch": 968} {"train_loss": -11.13984489440918, "global_step": 162767, "epoch": 968} {"train_loss": -10.89429759979248, "global_step": 162768, "epoch": 968} {"train_loss": -10.8798828125, "global_step": 162769, "epoch": 968} {"train_loss": -10.972270965576172, "global_step": 162770, "epoch": 968} {"train_loss": -11.008864402770996, "global_step": 162771, "epoch": 968} {"train_loss": -11.199502944946289, "global_step": 162772, "epoch": 968} {"train_loss": -10.842214584350586, "global_step": 162773, "epoch": 968} {"train_loss": -10.918622016906738, "global_step": 162774, "epoch": 968} {"train_loss": -10.810080528259277, "global_step": 162775, "epoch": 968} {"train_loss": -10.874673843383789, "global_step": 162776, "epoch": 968} {"train_loss": -10.846695899963379, "global_step": 162777, "epoch": 968} {"train_loss": -10.714561462402344, "global_step": 162778, "epoch": 968} {"train_loss": -10.503324508666992, "global_step": 162779, "epoch": 968} {"train_loss": -10.73805046081543, "global_step": 162780, "epoch": 968} {"train_loss": -10.64217472076416, "global_step": 162781, "epoch": 968} {"train_loss": -10.678394317626953, "global_step": 162782, "epoch": 968} {"train_loss": -10.676976203918457, "global_step": 162783, "epoch": 968} {"train_loss": -10.545945167541504, "global_step": 162784, "epoch": 968} {"train_loss": -10.37000560760498, "global_step": 162785, "epoch": 968} {"train_loss": -10.384439468383789, "global_step": 162786, "epoch": 968} {"train_loss": -10.736014366149902, "global_step": 162787, "epoch": 968} {"train_loss": -10.53672981262207, "global_step": 162788, "epoch": 968} {"train_loss": -10.973289489746094, "global_step": 162789, "epoch": 968} {"train_loss": -10.684586524963379, "global_step": 162790, "epoch": 968} {"train_loss": -10.780188384510222, "global_step": 162791, "epoch": 968, "val_loss": 235348.8125} {"train_loss": -10.614897727966309, "global_step": 162792, "epoch": 969} {"train_loss": -10.955070495605469, "global_step": 162793, "epoch": 969} {"train_loss": -10.602804183959961, "global_step": 162794, "epoch": 969} {"train_loss": -10.9259033203125, "global_step": 162795, "epoch": 969} {"train_loss": -10.714921951293945, "global_step": 162796, "epoch": 969} {"train_loss": -10.63650894165039, "global_step": 162797, "epoch": 969} {"train_loss": -10.871843338012695, "global_step": 162798, "epoch": 969} {"train_loss": -10.415313720703125, "global_step": 162799, "epoch": 969} {"train_loss": -10.913325309753418, "global_step": 162800, "epoch": 969} {"train_loss": -10.982908248901367, "global_step": 162801, "epoch": 969} {"train_loss": -10.991621017456055, "global_step": 162802, "epoch": 969} {"train_loss": -10.806169509887695, "global_step": 162803, "epoch": 969} {"train_loss": -10.89480209350586, "global_step": 162804, "epoch": 969} {"train_loss": -10.928685188293457, "global_step": 162805, "epoch": 969} {"train_loss": -11.020929336547852, "global_step": 162806, "epoch": 969} {"train_loss": -10.833549499511719, "global_step": 162807, "epoch": 969} {"train_loss": -10.67227554321289, "global_step": 162808, "epoch": 969} {"train_loss": -10.274847030639648, "global_step": 162809, "epoch": 969} {"train_loss": -10.557991027832031, "global_step": 162810, "epoch": 969} {"train_loss": -11.009733200073242, "global_step": 162811, "epoch": 969} {"train_loss": -10.500866889953613, "global_step": 162812, "epoch": 969} {"train_loss": -11.037379264831543, "global_step": 162813, "epoch": 969} {"train_loss": -10.877534866333008, "global_step": 162814, "epoch": 969} {"train_loss": -11.086018562316895, "global_step": 162815, "epoch": 969} {"train_loss": -10.759757995605469, "global_step": 162816, "epoch": 969} {"train_loss": -10.109267234802246, "global_step": 162817, "epoch": 969} {"train_loss": -11.159337997436523, "global_step": 162818, "epoch": 969} {"train_loss": -10.404041290283203, "global_step": 162819, "epoch": 969} {"train_loss": -10.700416564941406, "global_step": 162820, "epoch": 969} {"train_loss": -11.113458633422852, "global_step": 162821, "epoch": 969} {"train_loss": -10.49959945678711, "global_step": 162822, "epoch": 969} {"train_loss": -11.148031234741211, "global_step": 162823, "epoch": 969} {"train_loss": -10.737220764160156, "global_step": 162824, "epoch": 969} {"train_loss": -11.009912490844727, "global_step": 162825, "epoch": 969} {"train_loss": -10.881589889526367, "global_step": 162826, "epoch": 969} {"train_loss": -10.482243537902832, "global_step": 162827, "epoch": 969} {"train_loss": -10.953590393066406, "global_step": 162828, "epoch": 969} {"train_loss": -10.696451187133789, "global_step": 162829, "epoch": 969} {"train_loss": -10.722965240478516, "global_step": 162830, "epoch": 969} {"train_loss": -10.847705841064453, "global_step": 162831, "epoch": 969} {"train_loss": -10.890660285949707, "global_step": 162832, "epoch": 969} {"train_loss": -11.144861221313477, "global_step": 162833, "epoch": 969} {"train_loss": -10.892553329467773, "global_step": 162834, "epoch": 969} {"train_loss": -10.989665985107422, "global_step": 162835, "epoch": 969} {"train_loss": -11.25379753112793, "global_step": 162836, "epoch": 969} {"train_loss": -10.802848815917969, "global_step": 162837, "epoch": 969} {"train_loss": -11.022001266479492, "global_step": 162838, "epoch": 969} {"train_loss": -10.94896411895752, "global_step": 162839, "epoch": 969} {"train_loss": -11.10322380065918, "global_step": 162840, "epoch": 969} {"train_loss": -11.14230728149414, "global_step": 162841, "epoch": 969} {"train_loss": -10.910154342651367, "global_step": 162842, "epoch": 969} {"train_loss": -10.878120422363281, "global_step": 162843, "epoch": 969} {"train_loss": -10.777900695800781, "global_step": 162844, "epoch": 969} {"train_loss": -10.775166511535645, "global_step": 162845, "epoch": 969} {"train_loss": -11.127985000610352, "global_step": 162846, "epoch": 969} {"train_loss": -10.555837631225586, "global_step": 162847, "epoch": 969} {"train_loss": -10.946209907531738, "global_step": 162848, "epoch": 969} {"train_loss": -10.686777114868164, "global_step": 162849, "epoch": 969} {"train_loss": -11.101263999938965, "global_step": 162850, "epoch": 969} {"train_loss": -10.892977714538574, "global_step": 162851, "epoch": 969} {"train_loss": -11.037803649902344, "global_step": 162852, "epoch": 969} {"train_loss": -10.794059753417969, "global_step": 162853, "epoch": 969} {"train_loss": -11.169046401977539, "global_step": 162854, "epoch": 969} {"train_loss": -11.012628555297852, "global_step": 162855, "epoch": 969} {"train_loss": -10.84709358215332, "global_step": 162856, "epoch": 969} {"train_loss": -11.35368824005127, "global_step": 162857, "epoch": 969} {"train_loss": -10.713600158691406, "global_step": 162858, "epoch": 969} {"train_loss": -11.107959747314453, "global_step": 162859, "epoch": 969} {"train_loss": -10.673019409179688, "global_step": 162860, "epoch": 969} {"train_loss": -10.872036933898926, "global_step": 162861, "epoch": 969} {"train_loss": -10.830665588378906, "global_step": 162862, "epoch": 969} {"train_loss": -10.0012788772583, "global_step": 162863, "epoch": 969} {"train_loss": -10.956695556640625, "global_step": 162864, "epoch": 969} {"train_loss": -10.374483108520508, "global_step": 162865, "epoch": 969} {"train_loss": -10.099032402038574, "global_step": 162866, "epoch": 969} {"train_loss": -10.372319221496582, "global_step": 162867, "epoch": 969} {"train_loss": -10.408485412597656, "global_step": 162868, "epoch": 969} {"train_loss": -9.753260612487793, "global_step": 162869, "epoch": 969} {"train_loss": -10.767960548400879, "global_step": 162870, "epoch": 969} {"train_loss": -9.866514205932617, "global_step": 162871, "epoch": 969} {"train_loss": -10.539413452148438, "global_step": 162872, "epoch": 969} {"train_loss": -10.651128768920898, "global_step": 162873, "epoch": 969} {"train_loss": -10.373513221740723, "global_step": 162874, "epoch": 969} {"train_loss": -10.7826509475708, "global_step": 162875, "epoch": 969} {"train_loss": -10.228649139404297, "global_step": 162876, "epoch": 969} {"train_loss": -10.734430313110352, "global_step": 162877, "epoch": 969} {"train_loss": -10.570083618164062, "global_step": 162878, "epoch": 969} {"train_loss": -10.686400413513184, "global_step": 162879, "epoch": 969} {"train_loss": -10.626407623291016, "global_step": 162880, "epoch": 969} {"train_loss": -10.72407054901123, "global_step": 162881, "epoch": 969} {"train_loss": -10.445594787597656, "global_step": 162882, "epoch": 969} {"train_loss": -10.878520965576172, "global_step": 162883, "epoch": 969} {"train_loss": -10.265029907226562, "global_step": 162884, "epoch": 969} {"train_loss": -10.558334350585938, "global_step": 162885, "epoch": 969} {"train_loss": -10.157472610473633, "global_step": 162886, "epoch": 969} {"train_loss": -10.451603889465332, "global_step": 162887, "epoch": 969} {"train_loss": -10.085929870605469, "global_step": 162888, "epoch": 969} {"train_loss": -10.595108032226562, "global_step": 162889, "epoch": 969} {"train_loss": -10.563592910766602, "global_step": 162890, "epoch": 969} {"train_loss": -9.748066902160645, "global_step": 162891, "epoch": 969} {"train_loss": -10.259499549865723, "global_step": 162892, "epoch": 969} {"train_loss": -10.3620023727417, "global_step": 162893, "epoch": 969} {"train_loss": -10.013428688049316, "global_step": 162894, "epoch": 969} {"train_loss": -10.364564895629883, "global_step": 162895, "epoch": 969} {"train_loss": -10.730424880981445, "global_step": 162896, "epoch": 969} {"train_loss": -10.513747215270996, "global_step": 162897, "epoch": 969} {"train_loss": -10.786249160766602, "global_step": 162898, "epoch": 969} {"train_loss": -10.771092414855957, "global_step": 162899, "epoch": 969} {"train_loss": -10.555692672729492, "global_step": 162900, "epoch": 969} {"train_loss": -10.882596969604492, "global_step": 162901, "epoch": 969} {"train_loss": -10.324522972106934, "global_step": 162902, "epoch": 969} {"train_loss": -10.603469848632812, "global_step": 162903, "epoch": 969} {"train_loss": -10.589460372924805, "global_step": 162904, "epoch": 969} {"train_loss": -10.937435150146484, "global_step": 162905, "epoch": 969} {"train_loss": -10.61479663848877, "global_step": 162906, "epoch": 969} {"train_loss": -10.979280471801758, "global_step": 162907, "epoch": 969} {"train_loss": -10.73808479309082, "global_step": 162908, "epoch": 969} {"train_loss": -10.743317604064941, "global_step": 162909, "epoch": 969} {"train_loss": -10.771272659301758, "global_step": 162910, "epoch": 969} {"train_loss": -10.83395004272461, "global_step": 162911, "epoch": 969} {"train_loss": -10.894638061523438, "global_step": 162912, "epoch": 969} {"train_loss": -11.202239036560059, "global_step": 162913, "epoch": 969} {"train_loss": -10.955543518066406, "global_step": 162914, "epoch": 969} {"train_loss": -11.059103012084961, "global_step": 162915, "epoch": 969} {"train_loss": -11.158409118652344, "global_step": 162916, "epoch": 969} {"train_loss": -10.983531951904297, "global_step": 162917, "epoch": 969} {"train_loss": -10.93768310546875, "global_step": 162918, "epoch": 969} {"train_loss": -11.106927871704102, "global_step": 162919, "epoch": 969} {"train_loss": -10.910197257995605, "global_step": 162920, "epoch": 969} {"train_loss": -11.0133695602417, "global_step": 162921, "epoch": 969} {"train_loss": -11.093913078308105, "global_step": 162922, "epoch": 969} {"train_loss": -11.025781631469727, "global_step": 162923, "epoch": 969} {"train_loss": -11.195905685424805, "global_step": 162924, "epoch": 969} {"train_loss": -11.11635684967041, "global_step": 162925, "epoch": 969} {"train_loss": -10.999821662902832, "global_step": 162926, "epoch": 969} {"train_loss": -11.31507396697998, "global_step": 162927, "epoch": 969} {"train_loss": -10.924152374267578, "global_step": 162928, "epoch": 969} {"train_loss": -11.394552230834961, "global_step": 162929, "epoch": 969} {"train_loss": -11.241166114807129, "global_step": 162930, "epoch": 969} {"train_loss": -11.295188903808594, "global_step": 162931, "epoch": 969} {"train_loss": -11.128110885620117, "global_step": 162932, "epoch": 969} {"train_loss": -11.28447151184082, "global_step": 162933, "epoch": 969} {"train_loss": -11.144758224487305, "global_step": 162934, "epoch": 969} {"train_loss": -11.217368125915527, "global_step": 162935, "epoch": 969} {"train_loss": -11.285645484924316, "global_step": 162936, "epoch": 969} {"train_loss": -11.259333610534668, "global_step": 162937, "epoch": 969} {"train_loss": -11.333285331726074, "global_step": 162938, "epoch": 969} {"train_loss": -11.170238494873047, "global_step": 162939, "epoch": 969} {"train_loss": -10.944995880126953, "global_step": 162940, "epoch": 969} {"train_loss": -11.149188995361328, "global_step": 162941, "epoch": 969} {"train_loss": -10.962897300720215, "global_step": 162942, "epoch": 969} {"train_loss": -11.004884719848633, "global_step": 162943, "epoch": 969} {"train_loss": -11.09704303741455, "global_step": 162944, "epoch": 969} {"train_loss": -10.860102653503418, "global_step": 162945, "epoch": 969} {"train_loss": -11.248835563659668, "global_step": 162946, "epoch": 969} {"train_loss": -10.864025115966797, "global_step": 162947, "epoch": 969} {"train_loss": -11.220396995544434, "global_step": 162948, "epoch": 969} {"train_loss": -11.119699478149414, "global_step": 162949, "epoch": 969} {"train_loss": -11.238103866577148, "global_step": 162950, "epoch": 969} {"train_loss": -10.46093463897705, "global_step": 162951, "epoch": 969} {"train_loss": -9.368722915649414, "global_step": 162952, "epoch": 969} {"train_loss": -10.52588176727295, "global_step": 162953, "epoch": 969} {"train_loss": -10.691399574279785, "global_step": 162954, "epoch": 969} {"train_loss": -10.689892768859863, "global_step": 162955, "epoch": 969} {"train_loss": -9.589716911315918, "global_step": 162956, "epoch": 969} {"train_loss": -10.656333923339844, "global_step": 162957, "epoch": 969} {"train_loss": -10.58537483215332, "global_step": 162958, "epoch": 969} {"train_loss": -10.78568202540988, "global_step": 162959, "epoch": 969, "val_loss": 234791.96875} {"train_loss": -9.920093536376953, "global_step": 162960, "epoch": 970} {"train_loss": -10.87319564819336, "global_step": 162961, "epoch": 970} {"train_loss": -10.48699951171875, "global_step": 162962, "epoch": 970} {"train_loss": -10.479671478271484, "global_step": 162963, "epoch": 970} {"train_loss": -10.876018524169922, "global_step": 162964, "epoch": 970} {"train_loss": -9.89122200012207, "global_step": 162965, "epoch": 970} {"train_loss": -10.550127983093262, "global_step": 162966, "epoch": 970} {"train_loss": -10.301332473754883, "global_step": 162967, "epoch": 970} {"train_loss": -10.171796798706055, "global_step": 162968, "epoch": 970} {"train_loss": -10.689363479614258, "global_step": 162969, "epoch": 970} {"train_loss": -9.934019088745117, "global_step": 162970, "epoch": 970} {"train_loss": -10.90615177154541, "global_step": 162971, "epoch": 970} {"train_loss": -10.427959442138672, "global_step": 162972, "epoch": 970} {"train_loss": -10.61460018157959, "global_step": 162973, "epoch": 970} {"train_loss": -10.824007034301758, "global_step": 162974, "epoch": 970} {"train_loss": -10.341485977172852, "global_step": 162975, "epoch": 970} {"train_loss": -10.800952911376953, "global_step": 162976, "epoch": 970} {"train_loss": -10.47041130065918, "global_step": 162977, "epoch": 970} {"train_loss": -10.742159843444824, "global_step": 162978, "epoch": 970} {"train_loss": -10.918194770812988, "global_step": 162979, "epoch": 970} {"train_loss": -10.856439590454102, "global_step": 162980, "epoch": 970} {"train_loss": -10.947320938110352, "global_step": 162981, "epoch": 970} {"train_loss": -10.960558891296387, "global_step": 162982, "epoch": 970} {"train_loss": -10.62891960144043, "global_step": 162983, "epoch": 970} {"train_loss": -10.676532745361328, "global_step": 162984, "epoch": 970} {"train_loss": -10.589164733886719, "global_step": 162985, "epoch": 970} {"train_loss": -10.664548873901367, "global_step": 162986, "epoch": 970} {"train_loss": -10.914987564086914, "global_step": 162987, "epoch": 970} {"train_loss": -10.955992698669434, "global_step": 162988, "epoch": 970} {"train_loss": -10.746805191040039, "global_step": 162989, "epoch": 970} {"train_loss": -10.638120651245117, "global_step": 162990, "epoch": 970} {"train_loss": -11.161489486694336, "global_step": 162991, "epoch": 970} {"train_loss": -10.838902473449707, "global_step": 162992, "epoch": 970} {"train_loss": -11.165074348449707, "global_step": 162993, "epoch": 970} {"train_loss": -10.89599609375, "global_step": 162994, "epoch": 970} {"train_loss": -11.03195571899414, "global_step": 162995, "epoch": 970} {"train_loss": -10.920239448547363, "global_step": 162996, "epoch": 970} {"train_loss": -11.111215591430664, "global_step": 162997, "epoch": 970} {"train_loss": -10.965047836303711, "global_step": 162998, "epoch": 970} {"train_loss": -11.092390060424805, "global_step": 162999, "epoch": 970} {"train_loss": -10.986970901489258, "global_step": 163000, "epoch": 970} {"train_loss": -11.033221244812012, "global_step": 163001, "epoch": 970} {"train_loss": -11.145071983337402, "global_step": 163002, "epoch": 970} {"train_loss": -11.036108016967773, "global_step": 163003, "epoch": 970} {"train_loss": -10.72317123413086, "global_step": 163004, "epoch": 970} {"train_loss": -11.2162504196167, "global_step": 163005, "epoch": 970} {"train_loss": -11.221002578735352, "global_step": 163006, "epoch": 970} {"train_loss": -11.100298881530762, "global_step": 163007, "epoch": 970} {"train_loss": -11.00680923461914, "global_step": 163008, "epoch": 970} {"train_loss": -10.9197998046875, "global_step": 163009, "epoch": 970} {"train_loss": -11.094051361083984, "global_step": 163010, "epoch": 970} {"train_loss": -11.126632690429688, "global_step": 163011, "epoch": 970} {"train_loss": -11.033060073852539, "global_step": 163012, "epoch": 970} {"train_loss": -10.817439079284668, "global_step": 163013, "epoch": 970} {"train_loss": -10.847124099731445, "global_step": 163014, "epoch": 970} {"train_loss": -11.034727096557617, "global_step": 163015, "epoch": 970} {"train_loss": -11.047765731811523, "global_step": 163016, "epoch": 970} {"train_loss": -10.705097198486328, "global_step": 163017, "epoch": 970} {"train_loss": -10.950068473815918, "global_step": 163018, "epoch": 970} {"train_loss": -10.903304100036621, "global_step": 163019, "epoch": 970} {"train_loss": -10.48690414428711, "global_step": 163020, "epoch": 970} {"train_loss": -11.383357048034668, "global_step": 163021, "epoch": 970} {"train_loss": -10.387531280517578, "global_step": 163022, "epoch": 970} {"train_loss": -10.762713432312012, "global_step": 163023, "epoch": 970} {"train_loss": -11.066181182861328, "global_step": 163024, "epoch": 970} {"train_loss": -10.658815383911133, "global_step": 163025, "epoch": 970} {"train_loss": -10.819714546203613, "global_step": 163026, "epoch": 970} {"train_loss": -10.986757278442383, "global_step": 163027, "epoch": 970} {"train_loss": -10.098817825317383, "global_step": 163028, "epoch": 970} {"train_loss": -11.054010391235352, "global_step": 163029, "epoch": 970} {"train_loss": -10.68738842010498, "global_step": 163030, "epoch": 970} {"train_loss": -10.696534156799316, "global_step": 163031, "epoch": 970} {"train_loss": -10.779257774353027, "global_step": 163032, "epoch": 970} {"train_loss": -9.577627182006836, "global_step": 163033, "epoch": 970} {"train_loss": -10.487916946411133, "global_step": 163034, "epoch": 970} {"train_loss": -9.162519454956055, "global_step": 163035, "epoch": 970} {"train_loss": -9.694079399108887, "global_step": 163036, "epoch": 970} {"train_loss": -11.120111465454102, "global_step": 163037, "epoch": 970} {"train_loss": -9.68939208984375, "global_step": 163038, "epoch": 970} {"train_loss": -10.983526229858398, "global_step": 163039, "epoch": 970} {"train_loss": -10.794876098632812, "global_step": 163040, "epoch": 970} {"train_loss": -10.806218147277832, "global_step": 163041, "epoch": 970} {"train_loss": -10.726825714111328, "global_step": 163042, "epoch": 970} {"train_loss": -10.791193962097168, "global_step": 163043, "epoch": 970} {"train_loss": -10.765962600708008, "global_step": 163044, "epoch": 970} {"train_loss": -10.566680908203125, "global_step": 163045, "epoch": 970} {"train_loss": -10.651632308959961, "global_step": 163046, "epoch": 970} {"train_loss": -10.577609062194824, "global_step": 163047, "epoch": 970} {"train_loss": -10.588497161865234, "global_step": 163048, "epoch": 970} {"train_loss": -10.934355735778809, "global_step": 163049, "epoch": 970} {"train_loss": -10.616039276123047, "global_step": 163050, "epoch": 970} {"train_loss": -10.562467575073242, "global_step": 163051, "epoch": 970} {"train_loss": -10.69698429107666, "global_step": 163052, "epoch": 970} {"train_loss": -10.75267219543457, "global_step": 163053, "epoch": 970} {"train_loss": -10.880712509155273, "global_step": 163054, "epoch": 970} {"train_loss": -10.707023620605469, "global_step": 163055, "epoch": 970} {"train_loss": -10.991796493530273, "global_step": 163056, "epoch": 970} {"train_loss": -10.642078399658203, "global_step": 163057, "epoch": 970} {"train_loss": -10.740276336669922, "global_step": 163058, "epoch": 970} {"train_loss": -10.901037216186523, "global_step": 163059, "epoch": 970} {"train_loss": -10.889091491699219, "global_step": 163060, "epoch": 970} {"train_loss": -10.911195755004883, "global_step": 163061, "epoch": 970} {"train_loss": -10.947967529296875, "global_step": 163062, "epoch": 970} {"train_loss": -11.080679893493652, "global_step": 163063, "epoch": 970} {"train_loss": -10.847524642944336, "global_step": 163064, "epoch": 970} {"train_loss": -10.865026473999023, "global_step": 163065, "epoch": 970} {"train_loss": -11.107295036315918, "global_step": 163066, "epoch": 970} {"train_loss": -10.763378143310547, "global_step": 163067, "epoch": 970} {"train_loss": -11.076543807983398, "global_step": 163068, "epoch": 970} {"train_loss": -11.10672378540039, "global_step": 163069, "epoch": 970} {"train_loss": -10.961015701293945, "global_step": 163070, "epoch": 970} {"train_loss": -11.134639739990234, "global_step": 163071, "epoch": 970} {"train_loss": -10.807299613952637, "global_step": 163072, "epoch": 970} {"train_loss": -11.005697250366211, "global_step": 163073, "epoch": 970} {"train_loss": -10.730788230895996, "global_step": 163074, "epoch": 970} {"train_loss": -11.20206069946289, "global_step": 163075, "epoch": 970} {"train_loss": -10.554752349853516, "global_step": 163076, "epoch": 970} {"train_loss": -10.974315643310547, "global_step": 163077, "epoch": 970} {"train_loss": -10.9191255569458, "global_step": 163078, "epoch": 970} {"train_loss": -10.790011405944824, "global_step": 163079, "epoch": 970} {"train_loss": -10.78524112701416, "global_step": 163080, "epoch": 970} {"train_loss": -10.484371185302734, "global_step": 163081, "epoch": 970} {"train_loss": -10.88593864440918, "global_step": 163082, "epoch": 970} {"train_loss": -10.589157104492188, "global_step": 163083, "epoch": 970} {"train_loss": -10.394886016845703, "global_step": 163084, "epoch": 970} {"train_loss": -10.893016815185547, "global_step": 163085, "epoch": 970} {"train_loss": -10.666010856628418, "global_step": 163086, "epoch": 970} {"train_loss": -10.58633804321289, "global_step": 163087, "epoch": 970} {"train_loss": -10.568510055541992, "global_step": 163088, "epoch": 970} {"train_loss": -10.561140060424805, "global_step": 163089, "epoch": 970} {"train_loss": -10.78885555267334, "global_step": 163090, "epoch": 970} {"train_loss": -10.938966751098633, "global_step": 163091, "epoch": 970} {"train_loss": -10.852865219116211, "global_step": 163092, "epoch": 970} {"train_loss": -11.063980102539062, "global_step": 163093, "epoch": 970} {"train_loss": -10.891539573669434, "global_step": 163094, "epoch": 970} {"train_loss": -10.792776107788086, "global_step": 163095, "epoch": 970} {"train_loss": -11.23138427734375, "global_step": 163096, "epoch": 970} {"train_loss": -10.83112907409668, "global_step": 163097, "epoch": 970} {"train_loss": -11.124995231628418, "global_step": 163098, "epoch": 970} {"train_loss": -10.89669418334961, "global_step": 163099, "epoch": 970} {"train_loss": -11.130353927612305, "global_step": 163100, "epoch": 970} {"train_loss": -10.656612396240234, "global_step": 163101, "epoch": 970} {"train_loss": -10.726028442382812, "global_step": 163102, "epoch": 970} {"train_loss": -11.141365051269531, "global_step": 163103, "epoch": 970} {"train_loss": -11.114645004272461, "global_step": 163104, "epoch": 970} {"train_loss": -10.825267791748047, "global_step": 163105, "epoch": 970} {"train_loss": -11.028213500976562, "global_step": 163106, "epoch": 970} {"train_loss": -10.923262596130371, "global_step": 163107, "epoch": 970} {"train_loss": -10.988070487976074, "global_step": 163108, "epoch": 970} {"train_loss": -10.795675277709961, "global_step": 163109, "epoch": 970} {"train_loss": -10.702555656433105, "global_step": 163110, "epoch": 970} {"train_loss": -10.868852615356445, "global_step": 163111, "epoch": 970} {"train_loss": -11.20557975769043, "global_step": 163112, "epoch": 970} {"train_loss": -10.860279083251953, "global_step": 163113, "epoch": 970} {"train_loss": -10.22669792175293, "global_step": 163114, "epoch": 970} {"train_loss": -10.716635704040527, "global_step": 163115, "epoch": 970} {"train_loss": -10.24079418182373, "global_step": 163116, "epoch": 970} {"train_loss": -10.55971622467041, "global_step": 163117, "epoch": 970} {"train_loss": -10.69480037689209, "global_step": 163118, "epoch": 970} {"train_loss": -9.95862865447998, "global_step": 163119, "epoch": 970} {"train_loss": -10.535634994506836, "global_step": 163120, "epoch": 970} {"train_loss": -10.705907821655273, "global_step": 163121, "epoch": 970} {"train_loss": -10.544133186340332, "global_step": 163122, "epoch": 970} {"train_loss": -10.46081256866455, "global_step": 163123, "epoch": 970} {"train_loss": -10.83922004699707, "global_step": 163124, "epoch": 970} {"train_loss": -10.759830474853516, "global_step": 163125, "epoch": 970} {"train_loss": -10.850349426269531, "global_step": 163126, "epoch": 970} {"train_loss": -10.764970626149859, "global_step": 163127, "epoch": 970, "val_loss": 238702.90625, "train_action_mse_error": 0.5813063383102417} {"train_loss": -10.832356452941895, "global_step": 163128, "epoch": 971} {"train_loss": -11.00673770904541, "global_step": 163129, "epoch": 971} {"train_loss": -10.518852233886719, "global_step": 163130, "epoch": 971} {"train_loss": -10.692989349365234, "global_step": 163131, "epoch": 971} {"train_loss": -10.522665977478027, "global_step": 163132, "epoch": 971} {"train_loss": -10.647579193115234, "global_step": 163133, "epoch": 971} {"train_loss": -10.611701965332031, "global_step": 163134, "epoch": 971} {"train_loss": -10.017939567565918, "global_step": 163135, "epoch": 971} {"train_loss": -10.928947448730469, "global_step": 163136, "epoch": 971} {"train_loss": -9.99661636352539, "global_step": 163137, "epoch": 971} {"train_loss": -10.421802520751953, "global_step": 163138, "epoch": 971} {"train_loss": -10.128927230834961, "global_step": 163139, "epoch": 971} {"train_loss": -9.736907005310059, "global_step": 163140, "epoch": 971} {"train_loss": -10.18153190612793, "global_step": 163141, "epoch": 971} {"train_loss": -9.443473815917969, "global_step": 163142, "epoch": 971} {"train_loss": -10.661382675170898, "global_step": 163143, "epoch": 971} {"train_loss": -8.848587989807129, "global_step": 163144, "epoch": 971} {"train_loss": -9.435853004455566, "global_step": 163145, "epoch": 971} {"train_loss": -10.206460952758789, "global_step": 163146, "epoch": 971} {"train_loss": -10.030230522155762, "global_step": 163147, "epoch": 971} {"train_loss": -9.741130828857422, "global_step": 163148, "epoch": 971} {"train_loss": -10.832704544067383, "global_step": 163149, "epoch": 971} {"train_loss": -10.112531661987305, "global_step": 163150, "epoch": 971} {"train_loss": -10.134683609008789, "global_step": 163151, "epoch": 971} {"train_loss": -10.668956756591797, "global_step": 163152, "epoch": 971} {"train_loss": -10.412702560424805, "global_step": 163153, "epoch": 971} {"train_loss": -10.569517135620117, "global_step": 163154, "epoch": 971} {"train_loss": -10.563584327697754, "global_step": 163155, "epoch": 971} {"train_loss": -10.649971961975098, "global_step": 163156, "epoch": 971} {"train_loss": -10.73059368133545, "global_step": 163157, "epoch": 971} {"train_loss": -10.815238952636719, "global_step": 163158, "epoch": 971} {"train_loss": -10.728888511657715, "global_step": 163159, "epoch": 971} {"train_loss": -10.62512493133545, "global_step": 163160, "epoch": 971} {"train_loss": -10.711459159851074, "global_step": 163161, "epoch": 971} {"train_loss": -10.8599214553833, "global_step": 163162, "epoch": 971} {"train_loss": -10.73553466796875, "global_step": 163163, "epoch": 971} {"train_loss": -10.487324714660645, "global_step": 163164, "epoch": 971} {"train_loss": -10.982172012329102, "global_step": 163165, "epoch": 971} {"train_loss": -10.977208137512207, "global_step": 163166, "epoch": 971} {"train_loss": -10.648613929748535, "global_step": 163167, "epoch": 971} {"train_loss": -11.048535346984863, "global_step": 163168, "epoch": 971} {"train_loss": -10.90627670288086, "global_step": 163169, "epoch": 971} {"train_loss": -10.59404182434082, "global_step": 163170, "epoch": 971} {"train_loss": -11.074581146240234, "global_step": 163171, "epoch": 971} {"train_loss": -10.759979248046875, "global_step": 163172, "epoch": 971} {"train_loss": -10.805496215820312, "global_step": 163173, "epoch": 971} {"train_loss": -10.971489906311035, "global_step": 163174, "epoch": 971} {"train_loss": -11.057565689086914, "global_step": 163175, "epoch": 971} {"train_loss": -10.98246955871582, "global_step": 163176, "epoch": 971} {"train_loss": -11.091609954833984, "global_step": 163177, "epoch": 971} {"train_loss": -11.200586318969727, "global_step": 163178, "epoch": 971} {"train_loss": -11.203147888183594, "global_step": 163179, "epoch": 971} {"train_loss": -10.858901977539062, "global_step": 163180, "epoch": 971} {"train_loss": -11.138233184814453, "global_step": 163181, "epoch": 971} {"train_loss": -11.068553924560547, "global_step": 163182, "epoch": 971} {"train_loss": -11.027591705322266, "global_step": 163183, "epoch": 971} {"train_loss": -10.996877670288086, "global_step": 163184, "epoch": 971} {"train_loss": -11.249000549316406, "global_step": 163185, "epoch": 971} {"train_loss": -11.147911071777344, "global_step": 163186, "epoch": 971} {"train_loss": -11.160898208618164, "global_step": 163187, "epoch": 971} {"train_loss": -11.198407173156738, "global_step": 163188, "epoch": 971} {"train_loss": -11.08818531036377, "global_step": 163189, "epoch": 971} {"train_loss": -11.213562965393066, "global_step": 163190, "epoch": 971} {"train_loss": -11.215633392333984, "global_step": 163191, "epoch": 971} {"train_loss": -11.079216003417969, "global_step": 163192, "epoch": 971} {"train_loss": -11.104728698730469, "global_step": 163193, "epoch": 971} {"train_loss": -11.221416473388672, "global_step": 163194, "epoch": 971} {"train_loss": -11.01823616027832, "global_step": 163195, "epoch": 971} {"train_loss": -11.2426176071167, "global_step": 163196, "epoch": 971} {"train_loss": -10.646275520324707, "global_step": 163197, "epoch": 971} {"train_loss": -10.463738441467285, "global_step": 163198, "epoch": 971} {"train_loss": -11.325060844421387, "global_step": 163199, "epoch": 971} {"train_loss": -10.58156681060791, "global_step": 163200, "epoch": 971} {"train_loss": -10.808920860290527, "global_step": 163201, "epoch": 971} {"train_loss": -11.082782745361328, "global_step": 163202, "epoch": 971} {"train_loss": -11.012207984924316, "global_step": 163203, "epoch": 971} {"train_loss": -10.36739444732666, "global_step": 163204, "epoch": 971} {"train_loss": -10.722739219665527, "global_step": 163205, "epoch": 971} {"train_loss": -11.201142311096191, "global_step": 163206, "epoch": 971} {"train_loss": -10.77246379852295, "global_step": 163207, "epoch": 971} {"train_loss": -11.370429039001465, "global_step": 163208, "epoch": 971} {"train_loss": -11.03635025024414, "global_step": 163209, "epoch": 971} {"train_loss": -11.230989456176758, "global_step": 163210, "epoch": 971} {"train_loss": -11.199261665344238, "global_step": 163211, "epoch": 971} {"train_loss": -11.27485466003418, "global_step": 163212, "epoch": 971} {"train_loss": -11.279922485351562, "global_step": 163213, "epoch": 971} {"train_loss": -10.877037048339844, "global_step": 163214, "epoch": 971} {"train_loss": -11.20302677154541, "global_step": 163215, "epoch": 971} {"train_loss": -11.14171028137207, "global_step": 163216, "epoch": 971} {"train_loss": -11.213491439819336, "global_step": 163217, "epoch": 971} {"train_loss": -10.901368141174316, "global_step": 163218, "epoch": 971} {"train_loss": -10.811971664428711, "global_step": 163219, "epoch": 971} {"train_loss": -10.953238487243652, "global_step": 163220, "epoch": 971} {"train_loss": -10.792900085449219, "global_step": 163221, "epoch": 971} {"train_loss": -10.425846099853516, "global_step": 163222, "epoch": 971} {"train_loss": -10.995996475219727, "global_step": 163223, "epoch": 971} {"train_loss": -10.344609260559082, "global_step": 163224, "epoch": 971} {"train_loss": -10.818678855895996, "global_step": 163225, "epoch": 971} {"train_loss": -10.50422191619873, "global_step": 163226, "epoch": 971} {"train_loss": -10.574817657470703, "global_step": 163227, "epoch": 971} {"train_loss": -10.824179649353027, "global_step": 163228, "epoch": 971} {"train_loss": -10.426974296569824, "global_step": 163229, "epoch": 971} {"train_loss": -10.846765518188477, "global_step": 163230, "epoch": 971} {"train_loss": -10.553766250610352, "global_step": 163231, "epoch": 971} {"train_loss": -9.829066276550293, "global_step": 163232, "epoch": 971} {"train_loss": -10.962896347045898, "global_step": 163233, "epoch": 971} {"train_loss": -10.291803359985352, "global_step": 163234, "epoch": 971} {"train_loss": -10.929859161376953, "global_step": 163235, "epoch": 971} {"train_loss": -10.26784896850586, "global_step": 163236, "epoch": 971} {"train_loss": -10.540249824523926, "global_step": 163237, "epoch": 971} {"train_loss": -10.708369255065918, "global_step": 163238, "epoch": 971} {"train_loss": -10.067699432373047, "global_step": 163239, "epoch": 971} {"train_loss": -10.94708251953125, "global_step": 163240, "epoch": 971} {"train_loss": -10.48816967010498, "global_step": 163241, "epoch": 971} {"train_loss": -10.777769088745117, "global_step": 163242, "epoch": 971} {"train_loss": -10.513235092163086, "global_step": 163243, "epoch": 971} {"train_loss": -10.941095352172852, "global_step": 163244, "epoch": 971} {"train_loss": -10.553668975830078, "global_step": 163245, "epoch": 971} {"train_loss": -11.092171669006348, "global_step": 163246, "epoch": 971} {"train_loss": -10.748031616210938, "global_step": 163247, "epoch": 971} {"train_loss": -10.423799514770508, "global_step": 163248, "epoch": 971} {"train_loss": -10.969819068908691, "global_step": 163249, "epoch": 971} {"train_loss": -10.766079902648926, "global_step": 163250, "epoch": 971} {"train_loss": -10.776612281799316, "global_step": 163251, "epoch": 971} {"train_loss": -10.637167930603027, "global_step": 163252, "epoch": 971} {"train_loss": -10.652287483215332, "global_step": 163253, "epoch": 971} {"train_loss": -11.046557426452637, "global_step": 163254, "epoch": 971} {"train_loss": -10.597912788391113, "global_step": 163255, "epoch": 971} {"train_loss": -10.98891544342041, "global_step": 163256, "epoch": 971} {"train_loss": -10.90810775756836, "global_step": 163257, "epoch": 971} {"train_loss": -10.822636604309082, "global_step": 163258, "epoch": 971} {"train_loss": -10.64059829711914, "global_step": 163259, "epoch": 971} {"train_loss": -10.838993072509766, "global_step": 163260, "epoch": 971} {"train_loss": -11.041300773620605, "global_step": 163261, "epoch": 971} {"train_loss": -10.712177276611328, "global_step": 163262, "epoch": 971} {"train_loss": -10.818984985351562, "global_step": 163263, "epoch": 971} {"train_loss": -10.199050903320312, "global_step": 163264, "epoch": 971} {"train_loss": -10.82827377319336, "global_step": 163265, "epoch": 971} {"train_loss": -10.698368072509766, "global_step": 163266, "epoch": 971} {"train_loss": -10.787741661071777, "global_step": 163267, "epoch": 971} {"train_loss": -10.586666107177734, "global_step": 163268, "epoch": 971} {"train_loss": -10.95151424407959, "global_step": 163269, "epoch": 971} {"train_loss": -10.597661972045898, "global_step": 163270, "epoch": 971} {"train_loss": -10.496664047241211, "global_step": 163271, "epoch": 971} {"train_loss": -10.85181999206543, "global_step": 163272, "epoch": 971} {"train_loss": -10.361474990844727, "global_step": 163273, "epoch": 971} {"train_loss": -10.922826766967773, "global_step": 163274, "epoch": 971} {"train_loss": -10.286114692687988, "global_step": 163275, "epoch": 971} {"train_loss": -11.051213264465332, "global_step": 163276, "epoch": 971} {"train_loss": -10.579385757446289, "global_step": 163277, "epoch": 971} {"train_loss": -10.789324760437012, "global_step": 163278, "epoch": 971} {"train_loss": -10.781585693359375, "global_step": 163279, "epoch": 971} {"train_loss": -10.60896110534668, "global_step": 163280, "epoch": 971} {"train_loss": -10.640911102294922, "global_step": 163281, "epoch": 971} {"train_loss": -10.850271224975586, "global_step": 163282, "epoch": 971} {"train_loss": -10.356529235839844, "global_step": 163283, "epoch": 971} {"train_loss": -10.670251846313477, "global_step": 163284, "epoch": 971} {"train_loss": -10.343576431274414, "global_step": 163285, "epoch": 971} {"train_loss": -10.90634822845459, "global_step": 163286, "epoch": 971} {"train_loss": -10.528660774230957, "global_step": 163287, "epoch": 971} {"train_loss": -10.70294189453125, "global_step": 163288, "epoch": 971} {"train_loss": -10.743173599243164, "global_step": 163289, "epoch": 971} {"train_loss": -10.757925033569336, "global_step": 163290, "epoch": 971} {"train_loss": -10.707207679748535, "global_step": 163291, "epoch": 971} {"train_loss": -10.715571403503418, "global_step": 163292, "epoch": 971} {"train_loss": -10.753792762756348, "global_step": 163293, "epoch": 971} {"train_loss": -10.934409141540527, "global_step": 163294, "epoch": 971} {"train_loss": -10.727455576260885, "global_step": 163295, "epoch": 971, "val_loss": 238958.9375} {"train_loss": -10.882129669189453, "global_step": 163296, "epoch": 972} {"train_loss": -10.937487602233887, "global_step": 163297, "epoch": 972} {"train_loss": -10.797245025634766, "global_step": 163298, "epoch": 972} {"train_loss": -11.082817077636719, "global_step": 163299, "epoch": 972} {"train_loss": -10.964620590209961, "global_step": 163300, "epoch": 972} {"train_loss": -10.761480331420898, "global_step": 163301, "epoch": 972} {"train_loss": -11.081535339355469, "global_step": 163302, "epoch": 972} {"train_loss": -11.080867767333984, "global_step": 163303, "epoch": 972} {"train_loss": -10.893101692199707, "global_step": 163304, "epoch": 972} {"train_loss": -10.73690128326416, "global_step": 163305, "epoch": 972} {"train_loss": -10.462198257446289, "global_step": 163306, "epoch": 972} {"train_loss": -10.78018569946289, "global_step": 163307, "epoch": 972} {"train_loss": -10.468910217285156, "global_step": 163308, "epoch": 972} {"train_loss": -11.088043212890625, "global_step": 163309, "epoch": 972} {"train_loss": -10.820459365844727, "global_step": 163310, "epoch": 972} {"train_loss": -10.995709419250488, "global_step": 163311, "epoch": 972} {"train_loss": -10.697587966918945, "global_step": 163312, "epoch": 972} {"train_loss": -10.539257049560547, "global_step": 163313, "epoch": 972} {"train_loss": -10.82138442993164, "global_step": 163314, "epoch": 972} {"train_loss": -10.160266876220703, "global_step": 163315, "epoch": 972} {"train_loss": -11.099970817565918, "global_step": 163316, "epoch": 972} {"train_loss": -9.86681079864502, "global_step": 163317, "epoch": 972} {"train_loss": -10.681480407714844, "global_step": 163318, "epoch": 972} {"train_loss": -10.643529891967773, "global_step": 163319, "epoch": 972} {"train_loss": -10.188238143920898, "global_step": 163320, "epoch": 972} {"train_loss": -10.735086441040039, "global_step": 163321, "epoch": 972} {"train_loss": -10.494367599487305, "global_step": 163322, "epoch": 972} {"train_loss": -10.404335021972656, "global_step": 163323, "epoch": 972} {"train_loss": -10.535816192626953, "global_step": 163324, "epoch": 972} {"train_loss": -10.512994766235352, "global_step": 163325, "epoch": 972} {"train_loss": -10.889768600463867, "global_step": 163326, "epoch": 972} {"train_loss": -10.821996688842773, "global_step": 163327, "epoch": 972} {"train_loss": -10.781335830688477, "global_step": 163328, "epoch": 972} {"train_loss": -10.752706527709961, "global_step": 163329, "epoch": 972} {"train_loss": -10.699607849121094, "global_step": 163330, "epoch": 972} {"train_loss": -10.792623519897461, "global_step": 163331, "epoch": 972} {"train_loss": -10.681303977966309, "global_step": 163332, "epoch": 972} {"train_loss": -10.677547454833984, "global_step": 163333, "epoch": 972} {"train_loss": -10.841604232788086, "global_step": 163334, "epoch": 972} {"train_loss": -10.634984970092773, "global_step": 163335, "epoch": 972} {"train_loss": -11.04812240600586, "global_step": 163336, "epoch": 972} {"train_loss": -10.581450462341309, "global_step": 163337, "epoch": 972} {"train_loss": -10.804183006286621, "global_step": 163338, "epoch": 972} {"train_loss": -10.4992036819458, "global_step": 163339, "epoch": 972} {"train_loss": -10.80405044555664, "global_step": 163340, "epoch": 972} {"train_loss": -10.04298210144043, "global_step": 163341, "epoch": 972} {"train_loss": -10.469398498535156, "global_step": 163342, "epoch": 972} {"train_loss": -10.67061710357666, "global_step": 163343, "epoch": 972} {"train_loss": -10.856220245361328, "global_step": 163344, "epoch": 972} {"train_loss": -10.677993774414062, "global_step": 163345, "epoch": 972} {"train_loss": -10.461088180541992, "global_step": 163346, "epoch": 972} {"train_loss": -10.90519905090332, "global_step": 163347, "epoch": 972} {"train_loss": -10.975767135620117, "global_step": 163348, "epoch": 972} {"train_loss": -10.640856742858887, "global_step": 163349, "epoch": 972} {"train_loss": -11.090846061706543, "global_step": 163350, "epoch": 972} {"train_loss": -10.776175498962402, "global_step": 163351, "epoch": 972} {"train_loss": -10.96021842956543, "global_step": 163352, "epoch": 972} {"train_loss": -10.824769973754883, "global_step": 163353, "epoch": 972} {"train_loss": -11.087146759033203, "global_step": 163354, "epoch": 972} {"train_loss": -10.965694427490234, "global_step": 163355, "epoch": 972} {"train_loss": -11.161835670471191, "global_step": 163356, "epoch": 972} {"train_loss": -11.141132354736328, "global_step": 163357, "epoch": 972} {"train_loss": -11.169174194335938, "global_step": 163358, "epoch": 972} {"train_loss": -11.115533828735352, "global_step": 163359, "epoch": 972} {"train_loss": -11.18305778503418, "global_step": 163360, "epoch": 972} {"train_loss": -11.026430130004883, "global_step": 163361, "epoch": 972} {"train_loss": -11.252127647399902, "global_step": 163362, "epoch": 972} {"train_loss": -11.244058609008789, "global_step": 163363, "epoch": 972} {"train_loss": -11.02157974243164, "global_step": 163364, "epoch": 972} {"train_loss": -11.227794647216797, "global_step": 163365, "epoch": 972} {"train_loss": -11.038274765014648, "global_step": 163366, "epoch": 972} {"train_loss": -10.907764434814453, "global_step": 163367, "epoch": 972} {"train_loss": -10.862338066101074, "global_step": 163368, "epoch": 972} {"train_loss": -10.996774673461914, "global_step": 163369, "epoch": 972} {"train_loss": -11.167004585266113, "global_step": 163370, "epoch": 972} {"train_loss": -11.183713912963867, "global_step": 163371, "epoch": 972} {"train_loss": -11.044910430908203, "global_step": 163372, "epoch": 972} {"train_loss": -10.995769500732422, "global_step": 163373, "epoch": 972} {"train_loss": -10.735904693603516, "global_step": 163374, "epoch": 972} {"train_loss": -10.569856643676758, "global_step": 163375, "epoch": 972} {"train_loss": -11.079177856445312, "global_step": 163376, "epoch": 972} {"train_loss": -10.96222972869873, "global_step": 163377, "epoch": 972} {"train_loss": -10.795818328857422, "global_step": 163378, "epoch": 972} {"train_loss": -11.12810230255127, "global_step": 163379, "epoch": 972} {"train_loss": -10.801762580871582, "global_step": 163380, "epoch": 972} {"train_loss": -10.760404586791992, "global_step": 163381, "epoch": 972} {"train_loss": -11.041346549987793, "global_step": 163382, "epoch": 972} {"train_loss": -9.887771606445312, "global_step": 163383, "epoch": 972} {"train_loss": -10.93222713470459, "global_step": 163384, "epoch": 972} {"train_loss": -11.194958686828613, "global_step": 163385, "epoch": 972} {"train_loss": -10.507425308227539, "global_step": 163386, "epoch": 972} {"train_loss": -11.09277057647705, "global_step": 163387, "epoch": 972} {"train_loss": -10.762571334838867, "global_step": 163388, "epoch": 972} {"train_loss": -10.772806167602539, "global_step": 163389, "epoch": 972} {"train_loss": -11.161772727966309, "global_step": 163390, "epoch": 972} {"train_loss": -10.88705062866211, "global_step": 163391, "epoch": 972} {"train_loss": -10.796998977661133, "global_step": 163392, "epoch": 972} {"train_loss": -10.46327018737793, "global_step": 163393, "epoch": 972} {"train_loss": -10.8712739944458, "global_step": 163394, "epoch": 972} {"train_loss": -10.434712409973145, "global_step": 163395, "epoch": 972} {"train_loss": -10.701485633850098, "global_step": 163396, "epoch": 972} {"train_loss": -10.45895767211914, "global_step": 163397, "epoch": 972} {"train_loss": -11.09903335571289, "global_step": 163398, "epoch": 972} {"train_loss": -10.306680679321289, "global_step": 163399, "epoch": 972} {"train_loss": -11.176652908325195, "global_step": 163400, "epoch": 972} {"train_loss": -10.472395896911621, "global_step": 163401, "epoch": 972} {"train_loss": -10.501649856567383, "global_step": 163402, "epoch": 972} {"train_loss": -10.982202529907227, "global_step": 163403, "epoch": 972} {"train_loss": -10.247941017150879, "global_step": 163404, "epoch": 972} {"train_loss": -11.081180572509766, "global_step": 163405, "epoch": 972} {"train_loss": -10.638002395629883, "global_step": 163406, "epoch": 972} {"train_loss": -10.972476959228516, "global_step": 163407, "epoch": 972} {"train_loss": -10.962668418884277, "global_step": 163408, "epoch": 972} {"train_loss": -10.779459953308105, "global_step": 163409, "epoch": 972} {"train_loss": -10.932626724243164, "global_step": 163410, "epoch": 972} {"train_loss": -11.159225463867188, "global_step": 163411, "epoch": 972} {"train_loss": -10.974502563476562, "global_step": 163412, "epoch": 972} {"train_loss": -10.854975700378418, "global_step": 163413, "epoch": 972} {"train_loss": -11.148599624633789, "global_step": 163414, "epoch": 972} {"train_loss": -11.040313720703125, "global_step": 163415, "epoch": 972} {"train_loss": -11.297937393188477, "global_step": 163416, "epoch": 972} {"train_loss": -10.727630615234375, "global_step": 163417, "epoch": 972} {"train_loss": -11.167110443115234, "global_step": 163418, "epoch": 972} {"train_loss": -10.76827621459961, "global_step": 163419, "epoch": 972} {"train_loss": -10.974790573120117, "global_step": 163420, "epoch": 972} {"train_loss": -10.706615447998047, "global_step": 163421, "epoch": 972} {"train_loss": -10.81093978881836, "global_step": 163422, "epoch": 972} {"train_loss": -10.8245210647583, "global_step": 163423, "epoch": 972} {"train_loss": -10.672633171081543, "global_step": 163424, "epoch": 972} {"train_loss": -11.13233757019043, "global_step": 163425, "epoch": 972} {"train_loss": -10.805608749389648, "global_step": 163426, "epoch": 972} {"train_loss": -11.025812149047852, "global_step": 163427, "epoch": 972} {"train_loss": -11.09027099609375, "global_step": 163428, "epoch": 972} {"train_loss": -11.164456367492676, "global_step": 163429, "epoch": 972} {"train_loss": -10.873649597167969, "global_step": 163430, "epoch": 972} {"train_loss": -11.267716407775879, "global_step": 163431, "epoch": 972} {"train_loss": -10.685705184936523, "global_step": 163432, "epoch": 972} {"train_loss": -11.15474796295166, "global_step": 163433, "epoch": 972} {"train_loss": -10.887571334838867, "global_step": 163434, "epoch": 972} {"train_loss": -11.199600219726562, "global_step": 163435, "epoch": 972} {"train_loss": -11.157990455627441, "global_step": 163436, "epoch": 972} {"train_loss": -10.620183944702148, "global_step": 163437, "epoch": 972} {"train_loss": -11.041783332824707, "global_step": 163438, "epoch": 972} {"train_loss": -10.231775283813477, "global_step": 163439, "epoch": 972} {"train_loss": -11.085041999816895, "global_step": 163440, "epoch": 972} {"train_loss": -10.299238204956055, "global_step": 163441, "epoch": 972} {"train_loss": -11.001152038574219, "global_step": 163442, "epoch": 972} {"train_loss": -10.413444519042969, "global_step": 163443, "epoch": 972} {"train_loss": -10.901590347290039, "global_step": 163444, "epoch": 972} {"train_loss": -10.530285835266113, "global_step": 163445, "epoch": 972} {"train_loss": -10.195714950561523, "global_step": 163446, "epoch": 972} {"train_loss": -11.037665367126465, "global_step": 163447, "epoch": 972} {"train_loss": -10.854449272155762, "global_step": 163448, "epoch": 972} {"train_loss": -10.793625831604004, "global_step": 163449, "epoch": 972} {"train_loss": -10.669851303100586, "global_step": 163450, "epoch": 972} {"train_loss": -10.943920135498047, "global_step": 163451, "epoch": 972} {"train_loss": -10.962142944335938, "global_step": 163452, "epoch": 972} {"train_loss": -10.518314361572266, "global_step": 163453, "epoch": 972} {"train_loss": -10.841536521911621, "global_step": 163454, "epoch": 972} {"train_loss": -10.79083251953125, "global_step": 163455, "epoch": 972} {"train_loss": -10.045587539672852, "global_step": 163456, "epoch": 972} {"train_loss": -10.94668197631836, "global_step": 163457, "epoch": 972} {"train_loss": -10.590333938598633, "global_step": 163458, "epoch": 972} {"train_loss": -10.559967041015625, "global_step": 163459, "epoch": 972} {"train_loss": -10.986734390258789, "global_step": 163460, "epoch": 972} {"train_loss": -10.511116981506348, "global_step": 163461, "epoch": 972} {"train_loss": -10.547853469848633, "global_step": 163462, "epoch": 972} {"train_loss": -10.815302786372957, "global_step": 163463, "epoch": 972, "val_loss": 238128.015625} {"train_loss": -10.134143829345703, "global_step": 163464, "epoch": 973} {"train_loss": -10.98995304107666, "global_step": 163465, "epoch": 973} {"train_loss": -10.76168155670166, "global_step": 163466, "epoch": 973} {"train_loss": -10.553400039672852, "global_step": 163467, "epoch": 973} {"train_loss": -10.633052825927734, "global_step": 163468, "epoch": 973} {"train_loss": -10.55255126953125, "global_step": 163469, "epoch": 973} {"train_loss": -10.604936599731445, "global_step": 163470, "epoch": 973} {"train_loss": -10.626413345336914, "global_step": 163471, "epoch": 973} {"train_loss": -10.51636791229248, "global_step": 163472, "epoch": 973} {"train_loss": -10.72824764251709, "global_step": 163473, "epoch": 973} {"train_loss": -10.36306095123291, "global_step": 163474, "epoch": 973} {"train_loss": -10.717880249023438, "global_step": 163475, "epoch": 973} {"train_loss": -10.536252975463867, "global_step": 163476, "epoch": 973} {"train_loss": -10.593118667602539, "global_step": 163477, "epoch": 973} {"train_loss": -10.715407371520996, "global_step": 163478, "epoch": 973} {"train_loss": -10.79588508605957, "global_step": 163479, "epoch": 973} {"train_loss": -10.787443161010742, "global_step": 163480, "epoch": 973} {"train_loss": -10.899800300598145, "global_step": 163481, "epoch": 973} {"train_loss": -10.442527770996094, "global_step": 163482, "epoch": 973} {"train_loss": -10.85896110534668, "global_step": 163483, "epoch": 973} {"train_loss": -10.657569885253906, "global_step": 163484, "epoch": 973} {"train_loss": -10.865859985351562, "global_step": 163485, "epoch": 973} {"train_loss": -10.793852806091309, "global_step": 163486, "epoch": 973} {"train_loss": -10.985823631286621, "global_step": 163487, "epoch": 973} {"train_loss": -10.905288696289062, "global_step": 163488, "epoch": 973} {"train_loss": -10.874290466308594, "global_step": 163489, "epoch": 973} {"train_loss": -10.826873779296875, "global_step": 163490, "epoch": 973} {"train_loss": -10.833030700683594, "global_step": 163491, "epoch": 973} {"train_loss": -11.030282974243164, "global_step": 163492, "epoch": 973} {"train_loss": -11.114025115966797, "global_step": 163493, "epoch": 973} {"train_loss": -10.89837646484375, "global_step": 163494, "epoch": 973} {"train_loss": -11.053343772888184, "global_step": 163495, "epoch": 973} {"train_loss": -10.976112365722656, "global_step": 163496, "epoch": 973} {"train_loss": -10.882752418518066, "global_step": 163497, "epoch": 973} {"train_loss": -10.994941711425781, "global_step": 163498, "epoch": 973} {"train_loss": -10.934724807739258, "global_step": 163499, "epoch": 973} {"train_loss": -10.803654670715332, "global_step": 163500, "epoch": 973} {"train_loss": -11.034296035766602, "global_step": 163501, "epoch": 973} {"train_loss": -11.033973693847656, "global_step": 163502, "epoch": 973} {"train_loss": -10.985523223876953, "global_step": 163503, "epoch": 973} {"train_loss": -11.032782554626465, "global_step": 163504, "epoch": 973} {"train_loss": -11.06695556640625, "global_step": 163505, "epoch": 973} {"train_loss": -10.967241287231445, "global_step": 163506, "epoch": 973} {"train_loss": -10.954058647155762, "global_step": 163507, "epoch": 973} {"train_loss": -11.123546600341797, "global_step": 163508, "epoch": 973} {"train_loss": -10.956469535827637, "global_step": 163509, "epoch": 973} {"train_loss": -10.990747451782227, "global_step": 163510, "epoch": 973} {"train_loss": -10.986990928649902, "global_step": 163511, "epoch": 973} {"train_loss": -10.764036178588867, "global_step": 163512, "epoch": 973} {"train_loss": -11.134271621704102, "global_step": 163513, "epoch": 973} {"train_loss": -11.094728469848633, "global_step": 163514, "epoch": 973} {"train_loss": -11.142696380615234, "global_step": 163515, "epoch": 973} {"train_loss": -11.122365951538086, "global_step": 163516, "epoch": 973} {"train_loss": -11.175747871398926, "global_step": 163517, "epoch": 973} {"train_loss": -11.145824432373047, "global_step": 163518, "epoch": 973} {"train_loss": -11.076773643493652, "global_step": 163519, "epoch": 973} {"train_loss": -11.090246200561523, "global_step": 163520, "epoch": 973} {"train_loss": -10.919130325317383, "global_step": 163521, "epoch": 973} {"train_loss": -11.078882217407227, "global_step": 163522, "epoch": 973} {"train_loss": -11.3740873336792, "global_step": 163523, "epoch": 973} {"train_loss": -11.37241268157959, "global_step": 163524, "epoch": 973} {"train_loss": -11.108742713928223, "global_step": 163525, "epoch": 973} {"train_loss": -10.67230224609375, "global_step": 163526, "epoch": 973} {"train_loss": -10.761602401733398, "global_step": 163527, "epoch": 973} {"train_loss": -10.841901779174805, "global_step": 163528, "epoch": 973} {"train_loss": -11.12919807434082, "global_step": 163529, "epoch": 973} {"train_loss": -10.49483871459961, "global_step": 163530, "epoch": 973} {"train_loss": -11.143082618713379, "global_step": 163531, "epoch": 973} {"train_loss": -10.643150329589844, "global_step": 163532, "epoch": 973} {"train_loss": -9.683906555175781, "global_step": 163533, "epoch": 973} {"train_loss": -10.279497146606445, "global_step": 163534, "epoch": 973} {"train_loss": -10.362258911132812, "global_step": 163535, "epoch": 973} {"train_loss": -9.618719100952148, "global_step": 163536, "epoch": 973} {"train_loss": -11.062482833862305, "global_step": 163537, "epoch": 973} {"train_loss": -10.051990509033203, "global_step": 163538, "epoch": 973} {"train_loss": -10.364230155944824, "global_step": 163539, "epoch": 973} {"train_loss": -11.042304039001465, "global_step": 163540, "epoch": 973} {"train_loss": -10.73137092590332, "global_step": 163541, "epoch": 973} {"train_loss": -11.006311416625977, "global_step": 163542, "epoch": 973} {"train_loss": -10.763517379760742, "global_step": 163543, "epoch": 973} {"train_loss": -10.585344314575195, "global_step": 163544, "epoch": 973} {"train_loss": -9.708303451538086, "global_step": 163545, "epoch": 973} {"train_loss": -10.236116409301758, "global_step": 163546, "epoch": 973} {"train_loss": -10.272322654724121, "global_step": 163547, "epoch": 973} {"train_loss": -10.757224082946777, "global_step": 163548, "epoch": 973} {"train_loss": -10.060086250305176, "global_step": 163549, "epoch": 973} {"train_loss": -10.407470703125, "global_step": 163550, "epoch": 973} {"train_loss": -10.266721725463867, "global_step": 163551, "epoch": 973} {"train_loss": -10.332077026367188, "global_step": 163552, "epoch": 973} {"train_loss": -10.819015502929688, "global_step": 163553, "epoch": 973} {"train_loss": -10.451578140258789, "global_step": 163554, "epoch": 973} {"train_loss": -10.728090286254883, "global_step": 163555, "epoch": 973} {"train_loss": -10.984989166259766, "global_step": 163556, "epoch": 973} {"train_loss": -10.29788875579834, "global_step": 163557, "epoch": 973} {"train_loss": -10.929611206054688, "global_step": 163558, "epoch": 973} {"train_loss": -10.642655372619629, "global_step": 163559, "epoch": 973} {"train_loss": -10.599376678466797, "global_step": 163560, "epoch": 973} {"train_loss": -10.959976196289062, "global_step": 163561, "epoch": 973} {"train_loss": -10.382657051086426, "global_step": 163562, "epoch": 973} {"train_loss": -10.667972564697266, "global_step": 163563, "epoch": 973} {"train_loss": -10.872096061706543, "global_step": 163564, "epoch": 973} {"train_loss": -10.36845588684082, "global_step": 163565, "epoch": 973} {"train_loss": -10.782613754272461, "global_step": 163566, "epoch": 973} {"train_loss": -10.177545547485352, "global_step": 163567, "epoch": 973} {"train_loss": -10.433904647827148, "global_step": 163568, "epoch": 973} {"train_loss": -10.7508544921875, "global_step": 163569, "epoch": 973} {"train_loss": -10.429222106933594, "global_step": 163570, "epoch": 973} {"train_loss": -10.878866195678711, "global_step": 163571, "epoch": 973} {"train_loss": -10.652374267578125, "global_step": 163572, "epoch": 973} {"train_loss": -10.49051284790039, "global_step": 163573, "epoch": 973} {"train_loss": -10.635708808898926, "global_step": 163574, "epoch": 973} {"train_loss": -10.774947166442871, "global_step": 163575, "epoch": 973} {"train_loss": -10.59227180480957, "global_step": 163576, "epoch": 973} {"train_loss": -10.959238052368164, "global_step": 163577, "epoch": 973} {"train_loss": -10.611324310302734, "global_step": 163578, "epoch": 973} {"train_loss": -10.814593315124512, "global_step": 163579, "epoch": 973} {"train_loss": -10.811891555786133, "global_step": 163580, "epoch": 973} {"train_loss": -10.950849533081055, "global_step": 163581, "epoch": 973} {"train_loss": -10.74998664855957, "global_step": 163582, "epoch": 973} {"train_loss": -11.140600204467773, "global_step": 163583, "epoch": 973} {"train_loss": -10.738109588623047, "global_step": 163584, "epoch": 973} {"train_loss": -10.835076332092285, "global_step": 163585, "epoch": 973} {"train_loss": -10.82789421081543, "global_step": 163586, "epoch": 973} {"train_loss": -10.892414093017578, "global_step": 163587, "epoch": 973} {"train_loss": -10.80636978149414, "global_step": 163588, "epoch": 973} {"train_loss": -10.908149719238281, "global_step": 163589, "epoch": 973} {"train_loss": -11.145271301269531, "global_step": 163590, "epoch": 973} {"train_loss": -11.015649795532227, "global_step": 163591, "epoch": 973} {"train_loss": -11.08193588256836, "global_step": 163592, "epoch": 973} {"train_loss": -10.78969955444336, "global_step": 163593, "epoch": 973} {"train_loss": -10.97330093383789, "global_step": 163594, "epoch": 973} {"train_loss": -10.943428993225098, "global_step": 163595, "epoch": 973} {"train_loss": -11.010684967041016, "global_step": 163596, "epoch": 973} {"train_loss": -11.06839370727539, "global_step": 163597, "epoch": 973} {"train_loss": -11.003910064697266, "global_step": 163598, "epoch": 973} {"train_loss": -11.046903610229492, "global_step": 163599, "epoch": 973} {"train_loss": -11.045063018798828, "global_step": 163600, "epoch": 973} {"train_loss": -11.151674270629883, "global_step": 163601, "epoch": 973} {"train_loss": -11.04376220703125, "global_step": 163602, "epoch": 973} {"train_loss": -10.967906951904297, "global_step": 163603, "epoch": 973} {"train_loss": -10.91218376159668, "global_step": 163604, "epoch": 973} {"train_loss": -10.956830024719238, "global_step": 163605, "epoch": 973} {"train_loss": -10.928133010864258, "global_step": 163606, "epoch": 973} {"train_loss": -11.119922637939453, "global_step": 163607, "epoch": 973} {"train_loss": -10.996435165405273, "global_step": 163608, "epoch": 973} {"train_loss": -11.1583833694458, "global_step": 163609, "epoch": 973} {"train_loss": -11.224160194396973, "global_step": 163610, "epoch": 973} {"train_loss": -11.149121284484863, "global_step": 163611, "epoch": 973} {"train_loss": -11.083267211914062, "global_step": 163612, "epoch": 973} {"train_loss": -11.087671279907227, "global_step": 163613, "epoch": 973} {"train_loss": -11.14891242980957, "global_step": 163614, "epoch": 973} {"train_loss": -11.218069076538086, "global_step": 163615, "epoch": 973} {"train_loss": -11.091385841369629, "global_step": 163616, "epoch": 973} {"train_loss": -10.994534492492676, "global_step": 163617, "epoch": 973} {"train_loss": -11.145106315612793, "global_step": 163618, "epoch": 973} {"train_loss": -10.685522079467773, "global_step": 163619, "epoch": 973} {"train_loss": -10.778682708740234, "global_step": 163620, "epoch": 973} {"train_loss": -10.752531051635742, "global_step": 163621, "epoch": 973} {"train_loss": -10.703648567199707, "global_step": 163622, "epoch": 973} {"train_loss": -11.101110458374023, "global_step": 163623, "epoch": 973} {"train_loss": -10.932209968566895, "global_step": 163624, "epoch": 973} {"train_loss": -10.715092658996582, "global_step": 163625, "epoch": 973} {"train_loss": -11.256660461425781, "global_step": 163626, "epoch": 973} {"train_loss": -10.946470260620117, "global_step": 163627, "epoch": 973} {"train_loss": -11.080491065979004, "global_step": 163628, "epoch": 973} {"train_loss": -10.62748908996582, "global_step": 163629, "epoch": 973} {"train_loss": -11.063539505004883, "global_step": 163630, "epoch": 973} {"train_loss": -10.81178693544297, "global_step": 163631, "epoch": 973, "val_loss": 236131.75} {"train_loss": -11.0510892868042, "global_step": 163632, "epoch": 974} {"train_loss": -10.908267974853516, "global_step": 163633, "epoch": 974} {"train_loss": -11.016841888427734, "global_step": 163634, "epoch": 974} {"train_loss": -10.6687593460083, "global_step": 163635, "epoch": 974} {"train_loss": -11.057526588439941, "global_step": 163636, "epoch": 974} {"train_loss": -10.914259910583496, "global_step": 163637, "epoch": 974} {"train_loss": -11.00031852722168, "global_step": 163638, "epoch": 974} {"train_loss": -11.140036582946777, "global_step": 163639, "epoch": 974} {"train_loss": -10.973925590515137, "global_step": 163640, "epoch": 974} {"train_loss": -11.206958770751953, "global_step": 163641, "epoch": 974} {"train_loss": -10.802291870117188, "global_step": 163642, "epoch": 974} {"train_loss": -10.907760620117188, "global_step": 163643, "epoch": 974} {"train_loss": -10.870217323303223, "global_step": 163644, "epoch": 974} {"train_loss": -10.565120697021484, "global_step": 163645, "epoch": 974} {"train_loss": -10.437085151672363, "global_step": 163646, "epoch": 974} {"train_loss": -10.882824897766113, "global_step": 163647, "epoch": 974} {"train_loss": -10.881845474243164, "global_step": 163648, "epoch": 974} {"train_loss": -10.051688194274902, "global_step": 163649, "epoch": 974} {"train_loss": -10.846378326416016, "global_step": 163650, "epoch": 974} {"train_loss": -10.814496040344238, "global_step": 163651, "epoch": 974} {"train_loss": -11.315123558044434, "global_step": 163652, "epoch": 974} {"train_loss": -11.030281066894531, "global_step": 163653, "epoch": 974} {"train_loss": -11.101066589355469, "global_step": 163654, "epoch": 974} {"train_loss": -10.860330581665039, "global_step": 163655, "epoch": 974} {"train_loss": -10.829654693603516, "global_step": 163656, "epoch": 974} {"train_loss": -10.681702613830566, "global_step": 163657, "epoch": 974} {"train_loss": -10.813329696655273, "global_step": 163658, "epoch": 974} {"train_loss": -10.75619888305664, "global_step": 163659, "epoch": 974} {"train_loss": -11.18454360961914, "global_step": 163660, "epoch": 974} {"train_loss": -10.839845657348633, "global_step": 163661, "epoch": 974} {"train_loss": -11.145059585571289, "global_step": 163662, "epoch": 974} {"train_loss": -11.0092134475708, "global_step": 163663, "epoch": 974} {"train_loss": -11.209844589233398, "global_step": 163664, "epoch": 974} {"train_loss": -10.9380464553833, "global_step": 163665, "epoch": 974} {"train_loss": -11.154716491699219, "global_step": 163666, "epoch": 974} {"train_loss": -10.877297401428223, "global_step": 163667, "epoch": 974} {"train_loss": -10.955007553100586, "global_step": 163668, "epoch": 974} {"train_loss": -11.160042762756348, "global_step": 163669, "epoch": 974} {"train_loss": -10.992839813232422, "global_step": 163670, "epoch": 974} {"train_loss": -10.85954475402832, "global_step": 163671, "epoch": 974} {"train_loss": -10.944021224975586, "global_step": 163672, "epoch": 974} {"train_loss": -10.874078750610352, "global_step": 163673, "epoch": 974} {"train_loss": -10.849184036254883, "global_step": 163674, "epoch": 974} {"train_loss": -10.657424926757812, "global_step": 163675, "epoch": 974} {"train_loss": -11.027989387512207, "global_step": 163676, "epoch": 974} {"train_loss": -10.760440826416016, "global_step": 163677, "epoch": 974} {"train_loss": -11.243359565734863, "global_step": 163678, "epoch": 974} {"train_loss": -10.805343627929688, "global_step": 163679, "epoch": 974} {"train_loss": -11.176790237426758, "global_step": 163680, "epoch": 974} {"train_loss": -11.19586181640625, "global_step": 163681, "epoch": 974} {"train_loss": -11.066234588623047, "global_step": 163682, "epoch": 974} {"train_loss": -11.092719078063965, "global_step": 163683, "epoch": 974} {"train_loss": -10.996767044067383, "global_step": 163684, "epoch": 974} {"train_loss": -11.212085723876953, "global_step": 163685, "epoch": 974} {"train_loss": -10.910308837890625, "global_step": 163686, "epoch": 974} {"train_loss": -10.926310539245605, "global_step": 163687, "epoch": 974} {"train_loss": -10.931821823120117, "global_step": 163688, "epoch": 974} {"train_loss": -10.814827919006348, "global_step": 163689, "epoch": 974} {"train_loss": -10.801005363464355, "global_step": 163690, "epoch": 974} {"train_loss": -10.966142654418945, "global_step": 163691, "epoch": 974} {"train_loss": -10.724973678588867, "global_step": 163692, "epoch": 974} {"train_loss": -10.722650527954102, "global_step": 163693, "epoch": 974} {"train_loss": -10.592653274536133, "global_step": 163694, "epoch": 974} {"train_loss": -10.727025985717773, "global_step": 163695, "epoch": 974} {"train_loss": -10.71322250366211, "global_step": 163696, "epoch": 974} {"train_loss": -10.887458801269531, "global_step": 163697, "epoch": 974} {"train_loss": -10.566340446472168, "global_step": 163698, "epoch": 974} {"train_loss": -10.753665924072266, "global_step": 163699, "epoch": 974} {"train_loss": -9.972587585449219, "global_step": 163700, "epoch": 974} {"train_loss": -10.72729778289795, "global_step": 163701, "epoch": 974} {"train_loss": -9.867781639099121, "global_step": 163702, "epoch": 974} {"train_loss": -10.773841857910156, "global_step": 163703, "epoch": 974} {"train_loss": -10.58895492553711, "global_step": 163704, "epoch": 974} {"train_loss": -10.776155471801758, "global_step": 163705, "epoch": 974} {"train_loss": -10.766928672790527, "global_step": 163706, "epoch": 974} {"train_loss": -10.712488174438477, "global_step": 163707, "epoch": 974} {"train_loss": -10.784845352172852, "global_step": 163708, "epoch": 974} {"train_loss": -10.32326602935791, "global_step": 163709, "epoch": 974} {"train_loss": -11.028604507446289, "global_step": 163710, "epoch": 974} {"train_loss": -10.608628273010254, "global_step": 163711, "epoch": 974} {"train_loss": -11.025384902954102, "global_step": 163712, "epoch": 974} {"train_loss": -10.894804954528809, "global_step": 163713, "epoch": 974} {"train_loss": -10.640113830566406, "global_step": 163714, "epoch": 974} {"train_loss": -11.075788497924805, "global_step": 163715, "epoch": 974} {"train_loss": -11.118045806884766, "global_step": 163716, "epoch": 974} {"train_loss": -10.774313926696777, "global_step": 163717, "epoch": 974} {"train_loss": -11.005889892578125, "global_step": 163718, "epoch": 974} {"train_loss": -10.795161247253418, "global_step": 163719, "epoch": 974} {"train_loss": -10.972021102905273, "global_step": 163720, "epoch": 974} {"train_loss": -10.9081449508667, "global_step": 163721, "epoch": 974} {"train_loss": -11.075685501098633, "global_step": 163722, "epoch": 974} {"train_loss": -11.060127258300781, "global_step": 163723, "epoch": 974} {"train_loss": -10.836420059204102, "global_step": 163724, "epoch": 974} {"train_loss": -10.85063362121582, "global_step": 163725, "epoch": 974} {"train_loss": -11.066551208496094, "global_step": 163726, "epoch": 974} {"train_loss": -10.975432395935059, "global_step": 163727, "epoch": 974} {"train_loss": -10.679431915283203, "global_step": 163728, "epoch": 974} {"train_loss": -11.308967590332031, "global_step": 163729, "epoch": 974} {"train_loss": -10.847536087036133, "global_step": 163730, "epoch": 974} {"train_loss": -11.14338493347168, "global_step": 163731, "epoch": 974} {"train_loss": -10.976424217224121, "global_step": 163732, "epoch": 974} {"train_loss": -11.138961791992188, "global_step": 163733, "epoch": 974} {"train_loss": -11.078765869140625, "global_step": 163734, "epoch": 974} {"train_loss": -11.036806106567383, "global_step": 163735, "epoch": 974} {"train_loss": -11.07646369934082, "global_step": 163736, "epoch": 974} {"train_loss": -10.950636863708496, "global_step": 163737, "epoch": 974} {"train_loss": -10.930145263671875, "global_step": 163738, "epoch": 974} {"train_loss": -11.22675895690918, "global_step": 163739, "epoch": 974} {"train_loss": -10.75792121887207, "global_step": 163740, "epoch": 974} {"train_loss": -10.807897567749023, "global_step": 163741, "epoch": 974} {"train_loss": -11.038305282592773, "global_step": 163742, "epoch": 974} {"train_loss": -10.803218841552734, "global_step": 163743, "epoch": 974} {"train_loss": -10.950267791748047, "global_step": 163744, "epoch": 974} {"train_loss": -10.961874008178711, "global_step": 163745, "epoch": 974} {"train_loss": -10.731180191040039, "global_step": 163746, "epoch": 974} {"train_loss": -10.473014831542969, "global_step": 163747, "epoch": 974} {"train_loss": -10.856801986694336, "global_step": 163748, "epoch": 974} {"train_loss": -11.153884887695312, "global_step": 163749, "epoch": 974} {"train_loss": -10.62282943725586, "global_step": 163750, "epoch": 974} {"train_loss": -11.179101943969727, "global_step": 163751, "epoch": 974} {"train_loss": -10.927583694458008, "global_step": 163752, "epoch": 974} {"train_loss": -10.72414493560791, "global_step": 163753, "epoch": 974} {"train_loss": -10.916061401367188, "global_step": 163754, "epoch": 974} {"train_loss": -10.950244903564453, "global_step": 163755, "epoch": 974} {"train_loss": -10.85617446899414, "global_step": 163756, "epoch": 974} {"train_loss": -10.980592727661133, "global_step": 163757, "epoch": 974} {"train_loss": -11.12150764465332, "global_step": 163758, "epoch": 974} {"train_loss": -10.928171157836914, "global_step": 163759, "epoch": 974} {"train_loss": -11.209842681884766, "global_step": 163760, "epoch": 974} {"train_loss": -11.248807907104492, "global_step": 163761, "epoch": 974} {"train_loss": -11.158926010131836, "global_step": 163762, "epoch": 974} {"train_loss": -11.102754592895508, "global_step": 163763, "epoch": 974} {"train_loss": -11.023447036743164, "global_step": 163764, "epoch": 974} {"train_loss": -10.711140632629395, "global_step": 163765, "epoch": 974} {"train_loss": -10.936055183410645, "global_step": 163766, "epoch": 974} {"train_loss": -10.876906394958496, "global_step": 163767, "epoch": 974} {"train_loss": -11.03414249420166, "global_step": 163768, "epoch": 974} {"train_loss": -11.14838695526123, "global_step": 163769, "epoch": 974} {"train_loss": -11.009611129760742, "global_step": 163770, "epoch": 974} {"train_loss": -10.852767944335938, "global_step": 163771, "epoch": 974} {"train_loss": -10.827335357666016, "global_step": 163772, "epoch": 974} {"train_loss": -10.708841323852539, "global_step": 163773, "epoch": 974} {"train_loss": -10.892898559570312, "global_step": 163774, "epoch": 974} {"train_loss": -10.583470344543457, "global_step": 163775, "epoch": 974} {"train_loss": -10.906295776367188, "global_step": 163776, "epoch": 974} {"train_loss": -11.086235046386719, "global_step": 163777, "epoch": 974} {"train_loss": -11.101554870605469, "global_step": 163778, "epoch": 974} {"train_loss": -11.075149536132812, "global_step": 163779, "epoch": 974} {"train_loss": -10.868168830871582, "global_step": 163780, "epoch": 974} {"train_loss": -11.14958381652832, "global_step": 163781, "epoch": 974} {"train_loss": -11.113712310791016, "global_step": 163782, "epoch": 974} {"train_loss": -11.015923500061035, "global_step": 163783, "epoch": 974} {"train_loss": -11.148180961608887, "global_step": 163784, "epoch": 974} {"train_loss": -11.08963680267334, "global_step": 163785, "epoch": 974} {"train_loss": -10.473155975341797, "global_step": 163786, "epoch": 974} {"train_loss": -10.58665657043457, "global_step": 163787, "epoch": 974} {"train_loss": -11.181912422180176, "global_step": 163788, "epoch": 974} {"train_loss": -10.790390968322754, "global_step": 163789, "epoch": 974} {"train_loss": -10.807815551757812, "global_step": 163790, "epoch": 974} {"train_loss": -10.621187210083008, "global_step": 163791, "epoch": 974} {"train_loss": -11.12506103515625, "global_step": 163792, "epoch": 974} {"train_loss": -10.447720527648926, "global_step": 163793, "epoch": 974} {"train_loss": -10.837913513183594, "global_step": 163794, "epoch": 974} {"train_loss": -10.940013885498047, "global_step": 163795, "epoch": 974} {"train_loss": -10.213957786560059, "global_step": 163796, "epoch": 974} {"train_loss": -10.65673828125, "global_step": 163797, "epoch": 974} {"train_loss": -10.712638854980469, "global_step": 163798, "epoch": 974} {"train_loss": -10.886078465552558, "global_step": 163799, "epoch": 974, "val_loss": 235552.234375} {"train_loss": -10.695135116577148, "global_step": 163800, "epoch": 975} {"train_loss": -10.32314682006836, "global_step": 163801, "epoch": 975} {"train_loss": -10.362232208251953, "global_step": 163802, "epoch": 975} {"train_loss": -10.45351505279541, "global_step": 163803, "epoch": 975} {"train_loss": -10.269673347473145, "global_step": 163804, "epoch": 975} {"train_loss": -10.537291526794434, "global_step": 163805, "epoch": 975} {"train_loss": -10.501582145690918, "global_step": 163806, "epoch": 975} {"train_loss": -10.244972229003906, "global_step": 163807, "epoch": 975} {"train_loss": -10.597918510437012, "global_step": 163808, "epoch": 975} {"train_loss": -10.551071166992188, "global_step": 163809, "epoch": 975} {"train_loss": -10.834782600402832, "global_step": 163810, "epoch": 975} {"train_loss": -10.751666069030762, "global_step": 163811, "epoch": 975} {"train_loss": -10.513769149780273, "global_step": 163812, "epoch": 975} {"train_loss": -10.911959648132324, "global_step": 163813, "epoch": 975} {"train_loss": -10.36848258972168, "global_step": 163814, "epoch": 975} {"train_loss": -10.878205299377441, "global_step": 163815, "epoch": 975} {"train_loss": -10.910733222961426, "global_step": 163816, "epoch": 975} {"train_loss": -10.647527694702148, "global_step": 163817, "epoch": 975} {"train_loss": -10.845020294189453, "global_step": 163818, "epoch": 975} {"train_loss": -11.014381408691406, "global_step": 163819, "epoch": 975} {"train_loss": -10.652657508850098, "global_step": 163820, "epoch": 975} {"train_loss": -10.574088096618652, "global_step": 163821, "epoch": 975} {"train_loss": -10.853433609008789, "global_step": 163822, "epoch": 975} {"train_loss": -10.660274505615234, "global_step": 163823, "epoch": 975} {"train_loss": -11.042888641357422, "global_step": 163824, "epoch": 975} {"train_loss": -11.003107070922852, "global_step": 163825, "epoch": 975} {"train_loss": -10.97652530670166, "global_step": 163826, "epoch": 975} {"train_loss": -10.927203178405762, "global_step": 163827, "epoch": 975} {"train_loss": -10.773634910583496, "global_step": 163828, "epoch": 975} {"train_loss": -10.84150505065918, "global_step": 163829, "epoch": 975} {"train_loss": -11.154747009277344, "global_step": 163830, "epoch": 975} {"train_loss": -11.207353591918945, "global_step": 163831, "epoch": 975} {"train_loss": -11.039163589477539, "global_step": 163832, "epoch": 975} {"train_loss": -10.765754699707031, "global_step": 163833, "epoch": 975} {"train_loss": -10.911480903625488, "global_step": 163834, "epoch": 975} {"train_loss": -10.8859224319458, "global_step": 163835, "epoch": 975} {"train_loss": -10.982786178588867, "global_step": 163836, "epoch": 975} {"train_loss": -11.120124816894531, "global_step": 163837, "epoch": 975} {"train_loss": -11.063173294067383, "global_step": 163838, "epoch": 975} {"train_loss": -10.854140281677246, "global_step": 163839, "epoch": 975} {"train_loss": -11.145257949829102, "global_step": 163840, "epoch": 975} {"train_loss": -10.797500610351562, "global_step": 163841, "epoch": 975} {"train_loss": -10.684161186218262, "global_step": 163842, "epoch": 975} {"train_loss": -10.871545791625977, "global_step": 163843, "epoch": 975} {"train_loss": -11.078451156616211, "global_step": 163844, "epoch": 975} {"train_loss": -11.049487113952637, "global_step": 163845, "epoch": 975} {"train_loss": -10.677675247192383, "global_step": 163846, "epoch": 975} {"train_loss": -11.180559158325195, "global_step": 163847, "epoch": 975} {"train_loss": -10.5653076171875, "global_step": 163848, "epoch": 975} {"train_loss": -10.92470645904541, "global_step": 163849, "epoch": 975} {"train_loss": -11.122733116149902, "global_step": 163850, "epoch": 975} {"train_loss": -10.543766975402832, "global_step": 163851, "epoch": 975} {"train_loss": -11.174894332885742, "global_step": 163852, "epoch": 975} {"train_loss": -10.749381065368652, "global_step": 163853, "epoch": 975} {"train_loss": -11.055059432983398, "global_step": 163854, "epoch": 975} {"train_loss": -10.974757194519043, "global_step": 163855, "epoch": 975} {"train_loss": -11.13748550415039, "global_step": 163856, "epoch": 975} {"train_loss": -10.91705322265625, "global_step": 163857, "epoch": 975} {"train_loss": -11.195575714111328, "global_step": 163858, "epoch": 975} {"train_loss": -11.090328216552734, "global_step": 163859, "epoch": 975} {"train_loss": -11.233203887939453, "global_step": 163860, "epoch": 975} {"train_loss": -11.112000465393066, "global_step": 163861, "epoch": 975} {"train_loss": -10.982592582702637, "global_step": 163862, "epoch": 975} {"train_loss": -11.34555435180664, "global_step": 163863, "epoch": 975} {"train_loss": -11.218347549438477, "global_step": 163864, "epoch": 975} {"train_loss": -11.205453872680664, "global_step": 163865, "epoch": 975} {"train_loss": -10.993043899536133, "global_step": 163866, "epoch": 975} {"train_loss": -11.391414642333984, "global_step": 163867, "epoch": 975} {"train_loss": -11.411264419555664, "global_step": 163868, "epoch": 975} {"train_loss": -10.912313461303711, "global_step": 163869, "epoch": 975} {"train_loss": -11.205259323120117, "global_step": 163870, "epoch": 975} {"train_loss": -11.098834991455078, "global_step": 163871, "epoch": 975} {"train_loss": -11.200399398803711, "global_step": 163872, "epoch": 975} {"train_loss": -11.02301025390625, "global_step": 163873, "epoch": 975} {"train_loss": -11.144830703735352, "global_step": 163874, "epoch": 975} {"train_loss": -11.06076431274414, "global_step": 163875, "epoch": 975} {"train_loss": -11.079080581665039, "global_step": 163876, "epoch": 975} {"train_loss": -11.350950241088867, "global_step": 163877, "epoch": 975} {"train_loss": -11.051095962524414, "global_step": 163878, "epoch": 975} {"train_loss": -10.79521369934082, "global_step": 163879, "epoch": 975} {"train_loss": -11.17165756225586, "global_step": 163880, "epoch": 975} {"train_loss": -11.296039581298828, "global_step": 163881, "epoch": 975} {"train_loss": -11.406604766845703, "global_step": 163882, "epoch": 975} {"train_loss": -11.302543640136719, "global_step": 163883, "epoch": 975} {"train_loss": -10.839786529541016, "global_step": 163884, "epoch": 975} {"train_loss": -10.915019035339355, "global_step": 163885, "epoch": 975} {"train_loss": -11.08681869506836, "global_step": 163886, "epoch": 975} {"train_loss": -11.144588470458984, "global_step": 163887, "epoch": 975} {"train_loss": -10.868549346923828, "global_step": 163888, "epoch": 975} {"train_loss": -11.065821647644043, "global_step": 163889, "epoch": 975} {"train_loss": -11.28989028930664, "global_step": 163890, "epoch": 975} {"train_loss": -10.72739028930664, "global_step": 163891, "epoch": 975} {"train_loss": -10.359031677246094, "global_step": 163892, "epoch": 975} {"train_loss": -10.465433120727539, "global_step": 163893, "epoch": 975} {"train_loss": -10.758874893188477, "global_step": 163894, "epoch": 975} {"train_loss": -10.830733299255371, "global_step": 163895, "epoch": 975} {"train_loss": -11.029684066772461, "global_step": 163896, "epoch": 975} {"train_loss": -10.424042701721191, "global_step": 163897, "epoch": 975} {"train_loss": -11.004209518432617, "global_step": 163898, "epoch": 975} {"train_loss": -11.029277801513672, "global_step": 163899, "epoch": 975} {"train_loss": -11.1612548828125, "global_step": 163900, "epoch": 975} {"train_loss": -10.94498348236084, "global_step": 163901, "epoch": 975} {"train_loss": -10.67812728881836, "global_step": 163902, "epoch": 975} {"train_loss": -11.055366516113281, "global_step": 163903, "epoch": 975} {"train_loss": -11.258064270019531, "global_step": 163904, "epoch": 975} {"train_loss": -11.045092582702637, "global_step": 163905, "epoch": 975} {"train_loss": -11.035285949707031, "global_step": 163906, "epoch": 975} {"train_loss": -11.244876861572266, "global_step": 163907, "epoch": 975} {"train_loss": -10.780061721801758, "global_step": 163908, "epoch": 975} {"train_loss": -11.101308822631836, "global_step": 163909, "epoch": 975} {"train_loss": -10.962152481079102, "global_step": 163910, "epoch": 975} {"train_loss": -10.851808547973633, "global_step": 163911, "epoch": 975} {"train_loss": -10.954400062561035, "global_step": 163912, "epoch": 975} {"train_loss": -11.119399070739746, "global_step": 163913, "epoch": 975} {"train_loss": -10.975787162780762, "global_step": 163914, "epoch": 975} {"train_loss": -11.002912521362305, "global_step": 163915, "epoch": 975} {"train_loss": -11.178406715393066, "global_step": 163916, "epoch": 975} {"train_loss": -11.27504825592041, "global_step": 163917, "epoch": 975} {"train_loss": -11.204280853271484, "global_step": 163918, "epoch": 975} {"train_loss": -10.8441801071167, "global_step": 163919, "epoch": 975} {"train_loss": -11.09908676147461, "global_step": 163920, "epoch": 975} {"train_loss": -10.903942108154297, "global_step": 163921, "epoch": 975} {"train_loss": -11.064920425415039, "global_step": 163922, "epoch": 975} {"train_loss": -10.922110557556152, "global_step": 163923, "epoch": 975} {"train_loss": -11.186729431152344, "global_step": 163924, "epoch": 975} {"train_loss": -10.856910705566406, "global_step": 163925, "epoch": 975} {"train_loss": -10.867471694946289, "global_step": 163926, "epoch": 975} {"train_loss": -11.017013549804688, "global_step": 163927, "epoch": 975} {"train_loss": -10.996831893920898, "global_step": 163928, "epoch": 975} {"train_loss": -10.858020782470703, "global_step": 163929, "epoch": 975} {"train_loss": -10.547040939331055, "global_step": 163930, "epoch": 975} {"train_loss": -9.92414665222168, "global_step": 163931, "epoch": 975} {"train_loss": -10.811407089233398, "global_step": 163932, "epoch": 975} {"train_loss": -9.16529655456543, "global_step": 163933, "epoch": 975} {"train_loss": -10.449101448059082, "global_step": 163934, "epoch": 975} {"train_loss": -9.19575309753418, "global_step": 163935, "epoch": 975} {"train_loss": -10.078325271606445, "global_step": 163936, "epoch": 975} {"train_loss": -9.981474876403809, "global_step": 163937, "epoch": 975} {"train_loss": -9.552077293395996, "global_step": 163938, "epoch": 975} {"train_loss": -9.00599479675293, "global_step": 163939, "epoch": 975} {"train_loss": -10.410526275634766, "global_step": 163940, "epoch": 975} {"train_loss": -9.764789581298828, "global_step": 163941, "epoch": 975} {"train_loss": -8.564105987548828, "global_step": 163942, "epoch": 975} {"train_loss": -10.416438102722168, "global_step": 163943, "epoch": 975} {"train_loss": -9.292800903320312, "global_step": 163944, "epoch": 975} {"train_loss": -9.91954517364502, "global_step": 163945, "epoch": 975} {"train_loss": -10.093575477600098, "global_step": 163946, "epoch": 975} {"train_loss": -10.647531509399414, "global_step": 163947, "epoch": 975} {"train_loss": -10.369901657104492, "global_step": 163948, "epoch": 975} {"train_loss": -9.958501815795898, "global_step": 163949, "epoch": 975} {"train_loss": -10.161834716796875, "global_step": 163950, "epoch": 975} {"train_loss": -10.173093795776367, "global_step": 163951, "epoch": 975} {"train_loss": -9.990472793579102, "global_step": 163952, "epoch": 975} {"train_loss": -10.674047470092773, "global_step": 163953, "epoch": 975} {"train_loss": -10.335805892944336, "global_step": 163954, "epoch": 975} {"train_loss": -10.44430160522461, "global_step": 163955, "epoch": 975} {"train_loss": -10.427013397216797, "global_step": 163956, "epoch": 975} {"train_loss": -10.510087966918945, "global_step": 163957, "epoch": 975} {"train_loss": -10.54796028137207, "global_step": 163958, "epoch": 975} {"train_loss": -10.358243942260742, "global_step": 163959, "epoch": 975} {"train_loss": -10.559385299682617, "global_step": 163960, "epoch": 975} {"train_loss": -10.531599044799805, "global_step": 163961, "epoch": 975} {"train_loss": -10.55482006072998, "global_step": 163962, "epoch": 975} {"train_loss": -10.602044105529785, "global_step": 163963, "epoch": 975} {"train_loss": -10.409095764160156, "global_step": 163964, "epoch": 975} {"train_loss": -10.844646453857422, "global_step": 163965, "epoch": 975} {"train_loss": -10.25130844116211, "global_step": 163966, "epoch": 975} {"train_loss": -10.760879999115353, "global_step": 163967, "epoch": 975, "val_loss": 233144.734375, "train_action_mse_error": 3.4353654384613037} {"train_loss": -10.648956298828125, "global_step": 163968, "epoch": 976} {"train_loss": -10.234740257263184, "global_step": 163969, "epoch": 976} {"train_loss": -10.352705001831055, "global_step": 163970, "epoch": 976} {"train_loss": -10.790742874145508, "global_step": 163971, "epoch": 976} {"train_loss": -10.576384544372559, "global_step": 163972, "epoch": 976} {"train_loss": -10.800895690917969, "global_step": 163973, "epoch": 976} {"train_loss": -10.58254623413086, "global_step": 163974, "epoch": 976} {"train_loss": -10.605554580688477, "global_step": 163975, "epoch": 976} {"train_loss": -10.868030548095703, "global_step": 163976, "epoch": 976} {"train_loss": -10.705629348754883, "global_step": 163977, "epoch": 976} {"train_loss": -10.922320365905762, "global_step": 163978, "epoch": 976} {"train_loss": -10.802581787109375, "global_step": 163979, "epoch": 976} {"train_loss": -10.592133522033691, "global_step": 163980, "epoch": 976} {"train_loss": -10.944051742553711, "global_step": 163981, "epoch": 976} {"train_loss": -10.805137634277344, "global_step": 163982, "epoch": 976} {"train_loss": -11.080578804016113, "global_step": 163983, "epoch": 976} {"train_loss": -10.911727905273438, "global_step": 163984, "epoch": 976} {"train_loss": -11.019258499145508, "global_step": 163985, "epoch": 976} {"train_loss": -11.00288200378418, "global_step": 163986, "epoch": 976} {"train_loss": -10.963838577270508, "global_step": 163987, "epoch": 976} {"train_loss": -10.935829162597656, "global_step": 163988, "epoch": 976} {"train_loss": -11.085136413574219, "global_step": 163989, "epoch": 976} {"train_loss": -11.126068115234375, "global_step": 163990, "epoch": 976} {"train_loss": -11.053163528442383, "global_step": 163991, "epoch": 976} {"train_loss": -11.051143646240234, "global_step": 163992, "epoch": 976} {"train_loss": -10.972503662109375, "global_step": 163993, "epoch": 976} {"train_loss": -11.115264892578125, "global_step": 163994, "epoch": 976} {"train_loss": -11.11284065246582, "global_step": 163995, "epoch": 976} {"train_loss": -11.225924491882324, "global_step": 163996, "epoch": 976} {"train_loss": -11.171343803405762, "global_step": 163997, "epoch": 976} {"train_loss": -10.997079849243164, "global_step": 163998, "epoch": 976} {"train_loss": -11.091758728027344, "global_step": 163999, "epoch": 976} {"train_loss": -11.085259437561035, "global_step": 164000, "epoch": 976} {"train_loss": -10.847187042236328, "global_step": 164001, "epoch": 976} {"train_loss": -10.909826278686523, "global_step": 164002, "epoch": 976} {"train_loss": -10.900022506713867, "global_step": 164003, "epoch": 976} {"train_loss": -10.845430374145508, "global_step": 164004, "epoch": 976} {"train_loss": -10.706756591796875, "global_step": 164005, "epoch": 976} {"train_loss": -11.073871612548828, "global_step": 164006, "epoch": 976} {"train_loss": -10.939549446105957, "global_step": 164007, "epoch": 976} {"train_loss": -11.066283226013184, "global_step": 164008, "epoch": 976} {"train_loss": -10.738792419433594, "global_step": 164009, "epoch": 976} {"train_loss": -10.993053436279297, "global_step": 164010, "epoch": 976} {"train_loss": -10.91852855682373, "global_step": 164011, "epoch": 976} {"train_loss": -10.8580904006958, "global_step": 164012, "epoch": 976} {"train_loss": -11.156045913696289, "global_step": 164013, "epoch": 976} {"train_loss": -10.732179641723633, "global_step": 164014, "epoch": 976} {"train_loss": -11.133277893066406, "global_step": 164015, "epoch": 976} {"train_loss": -10.446574211120605, "global_step": 164016, "epoch": 976} {"train_loss": -10.889074325561523, "global_step": 164017, "epoch": 976} {"train_loss": -10.836661338806152, "global_step": 164018, "epoch": 976} {"train_loss": -10.869284629821777, "global_step": 164019, "epoch": 976} {"train_loss": -10.904264450073242, "global_step": 164020, "epoch": 976} {"train_loss": -10.95792007446289, "global_step": 164021, "epoch": 976} {"train_loss": -10.794510841369629, "global_step": 164022, "epoch": 976} {"train_loss": -10.976086616516113, "global_step": 164023, "epoch": 976} {"train_loss": -10.785907745361328, "global_step": 164024, "epoch": 976} {"train_loss": -10.830255508422852, "global_step": 164025, "epoch": 976} {"train_loss": -11.00312614440918, "global_step": 164026, "epoch": 976} {"train_loss": -10.744937896728516, "global_step": 164027, "epoch": 976} {"train_loss": -11.141704559326172, "global_step": 164028, "epoch": 976} {"train_loss": -10.515196800231934, "global_step": 164029, "epoch": 976} {"train_loss": -10.967565536499023, "global_step": 164030, "epoch": 976} {"train_loss": -10.774628639221191, "global_step": 164031, "epoch": 976} {"train_loss": -10.931962013244629, "global_step": 164032, "epoch": 976} {"train_loss": -11.207901954650879, "global_step": 164033, "epoch": 976} {"train_loss": -10.799514770507812, "global_step": 164034, "epoch": 976} {"train_loss": -11.203620910644531, "global_step": 164035, "epoch": 976} {"train_loss": -11.030661582946777, "global_step": 164036, "epoch": 976} {"train_loss": -10.742598533630371, "global_step": 164037, "epoch": 976} {"train_loss": -11.000408172607422, "global_step": 164038, "epoch": 976} {"train_loss": -10.795164108276367, "global_step": 164039, "epoch": 976} {"train_loss": -11.006592750549316, "global_step": 164040, "epoch": 976} {"train_loss": -10.946944236755371, "global_step": 164041, "epoch": 976} {"train_loss": -10.698009490966797, "global_step": 164042, "epoch": 976} {"train_loss": -10.75333023071289, "global_step": 164043, "epoch": 976} {"train_loss": -10.92895793914795, "global_step": 164044, "epoch": 976} {"train_loss": -11.14074993133545, "global_step": 164045, "epoch": 976} {"train_loss": -10.810260772705078, "global_step": 164046, "epoch": 976} {"train_loss": -11.144744873046875, "global_step": 164047, "epoch": 976} {"train_loss": -11.048603057861328, "global_step": 164048, "epoch": 976} {"train_loss": -10.982492446899414, "global_step": 164049, "epoch": 976} {"train_loss": -11.169350624084473, "global_step": 164050, "epoch": 976} {"train_loss": -11.00075912475586, "global_step": 164051, "epoch": 976} {"train_loss": -11.154376983642578, "global_step": 164052, "epoch": 976} {"train_loss": -10.753791809082031, "global_step": 164053, "epoch": 976} {"train_loss": -10.958284378051758, "global_step": 164054, "epoch": 976} {"train_loss": -11.322224617004395, "global_step": 164055, "epoch": 976} {"train_loss": -10.922026634216309, "global_step": 164056, "epoch": 976} {"train_loss": -11.22359848022461, "global_step": 164057, "epoch": 976} {"train_loss": -10.9503173828125, "global_step": 164058, "epoch": 976} {"train_loss": -11.158856391906738, "global_step": 164059, "epoch": 976} {"train_loss": -10.74913215637207, "global_step": 164060, "epoch": 976} {"train_loss": -10.984249114990234, "global_step": 164061, "epoch": 976} {"train_loss": -11.2430419921875, "global_step": 164062, "epoch": 976} {"train_loss": -11.098274230957031, "global_step": 164063, "epoch": 976} {"train_loss": -11.119363784790039, "global_step": 164064, "epoch": 976} {"train_loss": -11.273977279663086, "global_step": 164065, "epoch": 976} {"train_loss": -11.196133613586426, "global_step": 164066, "epoch": 976} {"train_loss": -11.050880432128906, "global_step": 164067, "epoch": 976} {"train_loss": -11.027359962463379, "global_step": 164068, "epoch": 976} {"train_loss": -10.91772174835205, "global_step": 164069, "epoch": 976} {"train_loss": -10.608583450317383, "global_step": 164070, "epoch": 976} {"train_loss": -10.768489837646484, "global_step": 164071, "epoch": 976} {"train_loss": -10.356935501098633, "global_step": 164072, "epoch": 976} {"train_loss": -11.025416374206543, "global_step": 164073, "epoch": 976} {"train_loss": -10.59847640991211, "global_step": 164074, "epoch": 976} {"train_loss": -11.05594539642334, "global_step": 164075, "epoch": 976} {"train_loss": -10.271864891052246, "global_step": 164076, "epoch": 976} {"train_loss": -10.279572486877441, "global_step": 164077, "epoch": 976} {"train_loss": -10.426407814025879, "global_step": 164078, "epoch": 976} {"train_loss": -11.126602172851562, "global_step": 164079, "epoch": 976} {"train_loss": -10.662225723266602, "global_step": 164080, "epoch": 976} {"train_loss": -10.619729995727539, "global_step": 164081, "epoch": 976} {"train_loss": -9.185623168945312, "global_step": 164082, "epoch": 976} {"train_loss": -10.901627540588379, "global_step": 164083, "epoch": 976} {"train_loss": -10.104265213012695, "global_step": 164084, "epoch": 976} {"train_loss": -10.426398277282715, "global_step": 164085, "epoch": 976} {"train_loss": -10.759876251220703, "global_step": 164086, "epoch": 976} {"train_loss": -10.54068660736084, "global_step": 164087, "epoch": 976} {"train_loss": -10.964933395385742, "global_step": 164088, "epoch": 976} {"train_loss": -10.343086242675781, "global_step": 164089, "epoch": 976} {"train_loss": -10.96030330657959, "global_step": 164090, "epoch": 976} {"train_loss": -10.528703689575195, "global_step": 164091, "epoch": 976} {"train_loss": -10.963611602783203, "global_step": 164092, "epoch": 976} {"train_loss": -10.557472229003906, "global_step": 164093, "epoch": 976} {"train_loss": -10.923622131347656, "global_step": 164094, "epoch": 976} {"train_loss": -10.867822647094727, "global_step": 164095, "epoch": 976} {"train_loss": -10.680038452148438, "global_step": 164096, "epoch": 976} {"train_loss": -10.718511581420898, "global_step": 164097, "epoch": 976} {"train_loss": -10.995282173156738, "global_step": 164098, "epoch": 976} {"train_loss": -10.90396499633789, "global_step": 164099, "epoch": 976} {"train_loss": -11.063130378723145, "global_step": 164100, "epoch": 976} {"train_loss": -10.963958740234375, "global_step": 164101, "epoch": 976} {"train_loss": -10.97027587890625, "global_step": 164102, "epoch": 976} {"train_loss": -10.787580490112305, "global_step": 164103, "epoch": 976} {"train_loss": -11.005485534667969, "global_step": 164104, "epoch": 976} {"train_loss": -10.793607711791992, "global_step": 164105, "epoch": 976} {"train_loss": -11.148383140563965, "global_step": 164106, "epoch": 976} {"train_loss": -11.215906143188477, "global_step": 164107, "epoch": 976} {"train_loss": -10.942404747009277, "global_step": 164108, "epoch": 976} {"train_loss": -10.901180267333984, "global_step": 164109, "epoch": 976} {"train_loss": -10.879471778869629, "global_step": 164110, "epoch": 976} {"train_loss": -11.010643005371094, "global_step": 164111, "epoch": 976} {"train_loss": -11.04393196105957, "global_step": 164112, "epoch": 976} {"train_loss": -10.878337860107422, "global_step": 164113, "epoch": 976} {"train_loss": -11.164592742919922, "global_step": 164114, "epoch": 976} {"train_loss": -10.818451881408691, "global_step": 164115, "epoch": 976} {"train_loss": -11.094605445861816, "global_step": 164116, "epoch": 976} {"train_loss": -11.0733060836792, "global_step": 164117, "epoch": 976} {"train_loss": -10.912040710449219, "global_step": 164118, "epoch": 976} {"train_loss": -11.136570930480957, "global_step": 164119, "epoch": 976} {"train_loss": -10.797964096069336, "global_step": 164120, "epoch": 976} {"train_loss": -11.012707710266113, "global_step": 164121, "epoch": 976} {"train_loss": -10.761637687683105, "global_step": 164122, "epoch": 976} {"train_loss": -10.380599021911621, "global_step": 164123, "epoch": 976} {"train_loss": -11.18869400024414, "global_step": 164124, "epoch": 976} {"train_loss": -10.603048324584961, "global_step": 164125, "epoch": 976} {"train_loss": -10.954545974731445, "global_step": 164126, "epoch": 976} {"train_loss": -11.135299682617188, "global_step": 164127, "epoch": 976} {"train_loss": -10.98198127746582, "global_step": 164128, "epoch": 976} {"train_loss": -11.228099822998047, "global_step": 164129, "epoch": 976} {"train_loss": -10.870379447937012, "global_step": 164130, "epoch": 976} {"train_loss": -11.229440689086914, "global_step": 164131, "epoch": 976} {"train_loss": -11.133212089538574, "global_step": 164132, "epoch": 976} {"train_loss": -11.137638092041016, "global_step": 164133, "epoch": 976} {"train_loss": -11.282113075256348, "global_step": 164134, "epoch": 976} {"train_loss": -10.890825129690624, "global_step": 164135, "epoch": 976, "val_loss": 238178.84375} {"train_loss": -11.11639404296875, "global_step": 164136, "epoch": 977} {"train_loss": -11.280024528503418, "global_step": 164137, "epoch": 977} {"train_loss": -11.405740737915039, "global_step": 164138, "epoch": 977} {"train_loss": -11.084510803222656, "global_step": 164139, "epoch": 977} {"train_loss": -11.218172073364258, "global_step": 164140, "epoch": 977} {"train_loss": -11.095710754394531, "global_step": 164141, "epoch": 977} {"train_loss": -11.142484664916992, "global_step": 164142, "epoch": 977} {"train_loss": -11.225637435913086, "global_step": 164143, "epoch": 977} {"train_loss": -11.14540958404541, "global_step": 164144, "epoch": 977} {"train_loss": -11.468232154846191, "global_step": 164145, "epoch": 977} {"train_loss": -11.264605522155762, "global_step": 164146, "epoch": 977} {"train_loss": -11.285606384277344, "global_step": 164147, "epoch": 977} {"train_loss": -11.116206169128418, "global_step": 164148, "epoch": 977} {"train_loss": -11.508419036865234, "global_step": 164149, "epoch": 977} {"train_loss": -11.217309951782227, "global_step": 164150, "epoch": 977} {"train_loss": -11.298605918884277, "global_step": 164151, "epoch": 977} {"train_loss": -11.234106063842773, "global_step": 164152, "epoch": 977} {"train_loss": -11.261173248291016, "global_step": 164153, "epoch": 977} {"train_loss": -11.187179565429688, "global_step": 164154, "epoch": 977} {"train_loss": -11.05084228515625, "global_step": 164155, "epoch": 977} {"train_loss": -11.047998428344727, "global_step": 164156, "epoch": 977} {"train_loss": -10.989721298217773, "global_step": 164157, "epoch": 977} {"train_loss": -11.315055847167969, "global_step": 164158, "epoch": 977} {"train_loss": -11.289546966552734, "global_step": 164159, "epoch": 977} {"train_loss": -11.49147891998291, "global_step": 164160, "epoch": 977} {"train_loss": -11.021415710449219, "global_step": 164161, "epoch": 977} {"train_loss": -10.933018684387207, "global_step": 164162, "epoch": 977} {"train_loss": -10.896392822265625, "global_step": 164163, "epoch": 977} {"train_loss": -11.264678001403809, "global_step": 164164, "epoch": 977} {"train_loss": -10.796991348266602, "global_step": 164165, "epoch": 977} {"train_loss": -11.167867660522461, "global_step": 164166, "epoch": 977} {"train_loss": -11.156554222106934, "global_step": 164167, "epoch": 977} {"train_loss": -11.207599639892578, "global_step": 164168, "epoch": 977} {"train_loss": -10.706308364868164, "global_step": 164169, "epoch": 977} {"train_loss": -10.496438026428223, "global_step": 164170, "epoch": 977} {"train_loss": -10.396061897277832, "global_step": 164171, "epoch": 977} {"train_loss": -10.896879196166992, "global_step": 164172, "epoch": 977} {"train_loss": -11.106500625610352, "global_step": 164173, "epoch": 977} {"train_loss": -10.917001724243164, "global_step": 164174, "epoch": 977} {"train_loss": -11.354788780212402, "global_step": 164175, "epoch": 977} {"train_loss": -11.15084457397461, "global_step": 164176, "epoch": 977} {"train_loss": -11.05295181274414, "global_step": 164177, "epoch": 977} {"train_loss": -11.080662727355957, "global_step": 164178, "epoch": 977} {"train_loss": -11.443978309631348, "global_step": 164179, "epoch": 977} {"train_loss": -10.72622299194336, "global_step": 164180, "epoch": 977} {"train_loss": -10.842281341552734, "global_step": 164181, "epoch": 977} {"train_loss": -11.22492790222168, "global_step": 164182, "epoch": 977} {"train_loss": -11.20571231842041, "global_step": 164183, "epoch": 977} {"train_loss": -11.417831420898438, "global_step": 164184, "epoch": 977} {"train_loss": -11.245675086975098, "global_step": 164185, "epoch": 977} {"train_loss": -11.199743270874023, "global_step": 164186, "epoch": 977} {"train_loss": -11.313165664672852, "global_step": 164187, "epoch": 977} {"train_loss": -11.112150192260742, "global_step": 164188, "epoch": 977} {"train_loss": -11.114757537841797, "global_step": 164189, "epoch": 977} {"train_loss": -11.245013236999512, "global_step": 164190, "epoch": 977} {"train_loss": -10.88851547241211, "global_step": 164191, "epoch": 977} {"train_loss": -11.049480438232422, "global_step": 164192, "epoch": 977} {"train_loss": -11.262314796447754, "global_step": 164193, "epoch": 977} {"train_loss": -11.088838577270508, "global_step": 164194, "epoch": 977} {"train_loss": -10.855439186096191, "global_step": 164195, "epoch": 977} {"train_loss": -11.027579307556152, "global_step": 164196, "epoch": 977} {"train_loss": -11.39108657836914, "global_step": 164197, "epoch": 977} {"train_loss": -11.190404891967773, "global_step": 164198, "epoch": 977} {"train_loss": -11.18090534210205, "global_step": 164199, "epoch": 977} {"train_loss": -10.860700607299805, "global_step": 164200, "epoch": 977} {"train_loss": -10.624893188476562, "global_step": 164201, "epoch": 977} {"train_loss": -10.735546112060547, "global_step": 164202, "epoch": 977} {"train_loss": -10.98802661895752, "global_step": 164203, "epoch": 977} {"train_loss": -10.353996276855469, "global_step": 164204, "epoch": 977} {"train_loss": -10.145176887512207, "global_step": 164205, "epoch": 977} {"train_loss": -10.475095748901367, "global_step": 164206, "epoch": 977} {"train_loss": -10.535262107849121, "global_step": 164207, "epoch": 977} {"train_loss": -10.176868438720703, "global_step": 164208, "epoch": 977} {"train_loss": -10.582686424255371, "global_step": 164209, "epoch": 977} {"train_loss": -10.427375793457031, "global_step": 164210, "epoch": 977} {"train_loss": -10.194463729858398, "global_step": 164211, "epoch": 977} {"train_loss": -10.041905403137207, "global_step": 164212, "epoch": 977} {"train_loss": -10.99598503112793, "global_step": 164213, "epoch": 977} {"train_loss": -10.431453704833984, "global_step": 164214, "epoch": 977} {"train_loss": -9.841146469116211, "global_step": 164215, "epoch": 977} {"train_loss": -10.31500244140625, "global_step": 164216, "epoch": 977} {"train_loss": -10.056791305541992, "global_step": 164217, "epoch": 977} {"train_loss": -10.435918807983398, "global_step": 164218, "epoch": 977} {"train_loss": -9.522668838500977, "global_step": 164219, "epoch": 977} {"train_loss": -10.73193359375, "global_step": 164220, "epoch": 977} {"train_loss": -10.144235610961914, "global_step": 164221, "epoch": 977} {"train_loss": -9.956998825073242, "global_step": 164222, "epoch": 977} {"train_loss": -10.52005386352539, "global_step": 164223, "epoch": 977} {"train_loss": -10.222957611083984, "global_step": 164224, "epoch": 977} {"train_loss": -10.53538703918457, "global_step": 164225, "epoch": 977} {"train_loss": -10.415995597839355, "global_step": 164226, "epoch": 977} {"train_loss": -9.89910888671875, "global_step": 164227, "epoch": 977} {"train_loss": -10.662461280822754, "global_step": 164228, "epoch": 977} {"train_loss": -10.301741600036621, "global_step": 164229, "epoch": 977} {"train_loss": -10.042902946472168, "global_step": 164230, "epoch": 977} {"train_loss": -10.170040130615234, "global_step": 164231, "epoch": 977} {"train_loss": -10.38715934753418, "global_step": 164232, "epoch": 977} {"train_loss": -10.17807674407959, "global_step": 164233, "epoch": 977} {"train_loss": -10.855781555175781, "global_step": 164234, "epoch": 977} {"train_loss": -10.535640716552734, "global_step": 164235, "epoch": 977} {"train_loss": -10.61663818359375, "global_step": 164236, "epoch": 977} {"train_loss": -10.475414276123047, "global_step": 164237, "epoch": 977} {"train_loss": -10.695122718811035, "global_step": 164238, "epoch": 977} {"train_loss": -10.756851196289062, "global_step": 164239, "epoch": 977} {"train_loss": -10.948870658874512, "global_step": 164240, "epoch": 977} {"train_loss": -10.559869766235352, "global_step": 164241, "epoch": 977} {"train_loss": -10.712825775146484, "global_step": 164242, "epoch": 977} {"train_loss": -10.735450744628906, "global_step": 164243, "epoch": 977} {"train_loss": -10.561838150024414, "global_step": 164244, "epoch": 977} {"train_loss": -10.795791625976562, "global_step": 164245, "epoch": 977} {"train_loss": -10.83282470703125, "global_step": 164246, "epoch": 977} {"train_loss": -10.941780090332031, "global_step": 164247, "epoch": 977} {"train_loss": -10.949775695800781, "global_step": 164248, "epoch": 977} {"train_loss": -10.867810249328613, "global_step": 164249, "epoch": 977} {"train_loss": -10.913224220275879, "global_step": 164250, "epoch": 977} {"train_loss": -11.03068733215332, "global_step": 164251, "epoch": 977} {"train_loss": -11.044624328613281, "global_step": 164252, "epoch": 977} {"train_loss": -10.992838859558105, "global_step": 164253, "epoch": 977} {"train_loss": -11.104433059692383, "global_step": 164254, "epoch": 977} {"train_loss": -11.102663040161133, "global_step": 164255, "epoch": 977} {"train_loss": -11.091245651245117, "global_step": 164256, "epoch": 977} {"train_loss": -10.932729721069336, "global_step": 164257, "epoch": 977} {"train_loss": -10.994600296020508, "global_step": 164258, "epoch": 977} {"train_loss": -11.111919403076172, "global_step": 164259, "epoch": 977} {"train_loss": -11.113378524780273, "global_step": 164260, "epoch": 977} {"train_loss": -10.999762535095215, "global_step": 164261, "epoch": 977} {"train_loss": -11.145015716552734, "global_step": 164262, "epoch": 977} {"train_loss": -11.19028091430664, "global_step": 164263, "epoch": 977} {"train_loss": -11.249478340148926, "global_step": 164264, "epoch": 977} {"train_loss": -11.237703323364258, "global_step": 164265, "epoch": 977} {"train_loss": -11.268882751464844, "global_step": 164266, "epoch": 977} {"train_loss": -11.479361534118652, "global_step": 164267, "epoch": 977} {"train_loss": -11.169336318969727, "global_step": 164268, "epoch": 977} {"train_loss": -11.07243537902832, "global_step": 164269, "epoch": 977} {"train_loss": -11.450258255004883, "global_step": 164270, "epoch": 977} {"train_loss": -11.244682312011719, "global_step": 164271, "epoch": 977} {"train_loss": -11.450767517089844, "global_step": 164272, "epoch": 977} {"train_loss": -10.932985305786133, "global_step": 164273, "epoch": 977} {"train_loss": -11.401873588562012, "global_step": 164274, "epoch": 977} {"train_loss": -11.390802383422852, "global_step": 164275, "epoch": 977} {"train_loss": -11.378427505493164, "global_step": 164276, "epoch": 977} {"train_loss": -11.338197708129883, "global_step": 164277, "epoch": 977} {"train_loss": -11.421327590942383, "global_step": 164278, "epoch": 977} {"train_loss": -11.374958992004395, "global_step": 164279, "epoch": 977} {"train_loss": -11.242485046386719, "global_step": 164280, "epoch": 977} {"train_loss": -11.310927391052246, "global_step": 164281, "epoch": 977} {"train_loss": -11.337057113647461, "global_step": 164282, "epoch": 977} {"train_loss": -11.410603523254395, "global_step": 164283, "epoch": 977} {"train_loss": -11.532133102416992, "global_step": 164284, "epoch": 977} {"train_loss": -11.088964462280273, "global_step": 164285, "epoch": 977} {"train_loss": -11.205583572387695, "global_step": 164286, "epoch": 977} {"train_loss": -11.30295467376709, "global_step": 164287, "epoch": 977} {"train_loss": -11.544235229492188, "global_step": 164288, "epoch": 977} {"train_loss": -11.273353576660156, "global_step": 164289, "epoch": 977} {"train_loss": -11.21330451965332, "global_step": 164290, "epoch": 977} {"train_loss": -11.355082511901855, "global_step": 164291, "epoch": 977} {"train_loss": -11.413201332092285, "global_step": 164292, "epoch": 977} {"train_loss": -11.148113250732422, "global_step": 164293, "epoch": 977} {"train_loss": -11.077217102050781, "global_step": 164294, "epoch": 977} {"train_loss": -10.516051292419434, "global_step": 164295, "epoch": 977} {"train_loss": -10.101543426513672, "global_step": 164296, "epoch": 977} {"train_loss": -9.35669994354248, "global_step": 164297, "epoch": 977} {"train_loss": -9.82271957397461, "global_step": 164298, "epoch": 977} {"train_loss": -9.104710578918457, "global_step": 164299, "epoch": 977} {"train_loss": -8.979129791259766, "global_step": 164300, "epoch": 977} {"train_loss": -8.137842178344727, "global_step": 164301, "epoch": 977} {"train_loss": -9.142948150634766, "global_step": 164302, "epoch": 977} {"train_loss": -10.866971600623359, "global_step": 164303, "epoch": 977, "val_loss": 232380.015625} {"train_loss": -7.167934417724609, "global_step": 164304, "epoch": 978} {"train_loss": -7.610551357269287, "global_step": 164305, "epoch": 978} {"train_loss": -8.528112411499023, "global_step": 164306, "epoch": 978} {"train_loss": -8.042200088500977, "global_step": 164307, "epoch": 978} {"train_loss": -8.281624794006348, "global_step": 164308, "epoch": 978} {"train_loss": -7.35532808303833, "global_step": 164309, "epoch": 978} {"train_loss": -8.921173095703125, "global_step": 164310, "epoch": 978} {"train_loss": -8.418231964111328, "global_step": 164311, "epoch": 978} {"train_loss": -9.497203826904297, "global_step": 164312, "epoch": 978} {"train_loss": -8.835371017456055, "global_step": 164313, "epoch": 978} {"train_loss": -9.209485054016113, "global_step": 164314, "epoch": 978} {"train_loss": -9.370811462402344, "global_step": 164315, "epoch": 978} {"train_loss": -9.532777786254883, "global_step": 164316, "epoch": 978} {"train_loss": -9.33488655090332, "global_step": 164317, "epoch": 978} {"train_loss": -10.027331352233887, "global_step": 164318, "epoch": 978} {"train_loss": -9.435848236083984, "global_step": 164319, "epoch": 978} {"train_loss": -9.537164688110352, "global_step": 164320, "epoch": 978} {"train_loss": -10.068374633789062, "global_step": 164321, "epoch": 978} {"train_loss": -9.645268440246582, "global_step": 164322, "epoch": 978} {"train_loss": -9.888837814331055, "global_step": 164323, "epoch": 978} {"train_loss": -10.019598007202148, "global_step": 164324, "epoch": 978} {"train_loss": -9.942672729492188, "global_step": 164325, "epoch": 978} {"train_loss": -9.784513473510742, "global_step": 164326, "epoch": 978} {"train_loss": -10.212486267089844, "global_step": 164327, "epoch": 978} {"train_loss": -10.115604400634766, "global_step": 164328, "epoch": 978} {"train_loss": -10.066930770874023, "global_step": 164329, "epoch": 978} {"train_loss": -10.262330055236816, "global_step": 164330, "epoch": 978} {"train_loss": -10.145355224609375, "global_step": 164331, "epoch": 978} {"train_loss": -10.235733032226562, "global_step": 164332, "epoch": 978} {"train_loss": -9.988435745239258, "global_step": 164333, "epoch": 978} {"train_loss": -10.019285202026367, "global_step": 164334, "epoch": 978} {"train_loss": -10.0249605178833, "global_step": 164335, "epoch": 978} {"train_loss": -10.009649276733398, "global_step": 164336, "epoch": 978} {"train_loss": -10.145280838012695, "global_step": 164337, "epoch": 978} {"train_loss": -10.336281776428223, "global_step": 164338, "epoch": 978} {"train_loss": -10.11298942565918, "global_step": 164339, "epoch": 978} {"train_loss": -10.200944900512695, "global_step": 164340, "epoch": 978} {"train_loss": -10.50108528137207, "global_step": 164341, "epoch": 978} {"train_loss": -10.229342460632324, "global_step": 164342, "epoch": 978} {"train_loss": -10.088785171508789, "global_step": 164343, "epoch": 978} {"train_loss": -10.343473434448242, "global_step": 164344, "epoch": 978} {"train_loss": -10.393146514892578, "global_step": 164345, "epoch": 978} {"train_loss": -10.302915573120117, "global_step": 164346, "epoch": 978} {"train_loss": -10.309686660766602, "global_step": 164347, "epoch": 978} {"train_loss": -10.471576690673828, "global_step": 164348, "epoch": 978} {"train_loss": -10.474862098693848, "global_step": 164349, "epoch": 978} {"train_loss": -10.786503791809082, "global_step": 164350, "epoch": 978} {"train_loss": -10.342611312866211, "global_step": 164351, "epoch": 978} {"train_loss": -10.638161659240723, "global_step": 164352, "epoch": 978} {"train_loss": -10.478752136230469, "global_step": 164353, "epoch": 978} {"train_loss": -10.657861709594727, "global_step": 164354, "epoch": 978} {"train_loss": -10.585552215576172, "global_step": 164355, "epoch": 978} {"train_loss": -10.698505401611328, "global_step": 164356, "epoch": 978} {"train_loss": -10.741376876831055, "global_step": 164357, "epoch": 978} {"train_loss": -10.919303894042969, "global_step": 164358, "epoch": 978} {"train_loss": -10.733778953552246, "global_step": 164359, "epoch": 978} {"train_loss": -10.760817527770996, "global_step": 164360, "epoch": 978} {"train_loss": -10.70975112915039, "global_step": 164361, "epoch": 978} {"train_loss": -10.823646545410156, "global_step": 164362, "epoch": 978} {"train_loss": -10.730901718139648, "global_step": 164363, "epoch": 978} {"train_loss": -10.819297790527344, "global_step": 164364, "epoch": 978} {"train_loss": -10.891986846923828, "global_step": 164365, "epoch": 978} {"train_loss": -10.916646957397461, "global_step": 164366, "epoch": 978} {"train_loss": -11.023662567138672, "global_step": 164367, "epoch": 978} {"train_loss": -10.734888076782227, "global_step": 164368, "epoch": 978} {"train_loss": -11.023113250732422, "global_step": 164369, "epoch": 978} {"train_loss": -11.102773666381836, "global_step": 164370, "epoch": 978} {"train_loss": -10.957435607910156, "global_step": 164371, "epoch": 978} {"train_loss": -11.019510269165039, "global_step": 164372, "epoch": 978} {"train_loss": -10.750204086303711, "global_step": 164373, "epoch": 978} {"train_loss": -10.790609359741211, "global_step": 164374, "epoch": 978} {"train_loss": -11.080857276916504, "global_step": 164375, "epoch": 978} {"train_loss": -11.134190559387207, "global_step": 164376, "epoch": 978} {"train_loss": -11.053665161132812, "global_step": 164377, "epoch": 978} {"train_loss": -11.274420738220215, "global_step": 164378, "epoch": 978} {"train_loss": -10.96786117553711, "global_step": 164379, "epoch": 978} {"train_loss": -10.913003921508789, "global_step": 164380, "epoch": 978} {"train_loss": -11.025569915771484, "global_step": 164381, "epoch": 978} {"train_loss": -11.027392387390137, "global_step": 164382, "epoch": 978} {"train_loss": -10.876520156860352, "global_step": 164383, "epoch": 978} {"train_loss": -11.075681686401367, "global_step": 164384, "epoch": 978} {"train_loss": -11.033170700073242, "global_step": 164385, "epoch": 978} {"train_loss": -10.920160293579102, "global_step": 164386, "epoch": 978} {"train_loss": -11.033587455749512, "global_step": 164387, "epoch": 978} {"train_loss": -11.29625415802002, "global_step": 164388, "epoch": 978} {"train_loss": -10.997404098510742, "global_step": 164389, "epoch": 978} {"train_loss": -11.067337036132812, "global_step": 164390, "epoch": 978} {"train_loss": -11.278846740722656, "global_step": 164391, "epoch": 978} {"train_loss": -11.185171127319336, "global_step": 164392, "epoch": 978} {"train_loss": -11.232572555541992, "global_step": 164393, "epoch": 978} {"train_loss": -11.27602767944336, "global_step": 164394, "epoch": 978} {"train_loss": -11.396078109741211, "global_step": 164395, "epoch": 978} {"train_loss": -11.452978134155273, "global_step": 164396, "epoch": 978} {"train_loss": -11.167280197143555, "global_step": 164397, "epoch": 978} {"train_loss": -11.255035400390625, "global_step": 164398, "epoch": 978} {"train_loss": -11.32951545715332, "global_step": 164399, "epoch": 978} {"train_loss": -11.353360176086426, "global_step": 164400, "epoch": 978} {"train_loss": -11.354850769042969, "global_step": 164401, "epoch": 978} {"train_loss": -11.27139663696289, "global_step": 164402, "epoch": 978} {"train_loss": -11.05728530883789, "global_step": 164403, "epoch": 978} {"train_loss": -11.305374145507812, "global_step": 164404, "epoch": 978} {"train_loss": -11.24781608581543, "global_step": 164405, "epoch": 978} {"train_loss": -11.288238525390625, "global_step": 164406, "epoch": 978} {"train_loss": -11.222082138061523, "global_step": 164407, "epoch": 978} {"train_loss": -10.935855865478516, "global_step": 164408, "epoch": 978} {"train_loss": -11.45880126953125, "global_step": 164409, "epoch": 978} {"train_loss": -11.06330680847168, "global_step": 164410, "epoch": 978} {"train_loss": -11.247699737548828, "global_step": 164411, "epoch": 978} {"train_loss": -11.013179779052734, "global_step": 164412, "epoch": 978} {"train_loss": -11.495009422302246, "global_step": 164413, "epoch": 978} {"train_loss": -11.015666961669922, "global_step": 164414, "epoch": 978} {"train_loss": -11.353254318237305, "global_step": 164415, "epoch": 978} {"train_loss": -11.338401794433594, "global_step": 164416, "epoch": 978} {"train_loss": -11.329194068908691, "global_step": 164417, "epoch": 978} {"train_loss": -11.477497100830078, "global_step": 164418, "epoch": 978} {"train_loss": -11.25727653503418, "global_step": 164419, "epoch": 978} {"train_loss": -11.3828125, "global_step": 164420, "epoch": 978} {"train_loss": -11.067363739013672, "global_step": 164421, "epoch": 978} {"train_loss": -11.47053050994873, "global_step": 164422, "epoch": 978} {"train_loss": -11.407360076904297, "global_step": 164423, "epoch": 978} {"train_loss": -11.09504222869873, "global_step": 164424, "epoch": 978} {"train_loss": -10.995287895202637, "global_step": 164425, "epoch": 978} {"train_loss": -11.221729278564453, "global_step": 164426, "epoch": 978} {"train_loss": -11.208635330200195, "global_step": 164427, "epoch": 978} {"train_loss": -10.999137878417969, "global_step": 164428, "epoch": 978} {"train_loss": -10.15096664428711, "global_step": 164429, "epoch": 978} {"train_loss": -7.963037490844727, "global_step": 164430, "epoch": 978} {"train_loss": -9.403034210205078, "global_step": 164431, "epoch": 978} {"train_loss": -8.475851058959961, "global_step": 164432, "epoch": 978} {"train_loss": -10.429205894470215, "global_step": 164433, "epoch": 978} {"train_loss": -7.619612693786621, "global_step": 164434, "epoch": 978} {"train_loss": -9.478687286376953, "global_step": 164435, "epoch": 978} {"train_loss": -8.271707534790039, "global_step": 164436, "epoch": 978} {"train_loss": -9.106175422668457, "global_step": 164437, "epoch": 978} {"train_loss": -10.209732055664062, "global_step": 164438, "epoch": 978} {"train_loss": -8.460737228393555, "global_step": 164439, "epoch": 978} {"train_loss": -9.516761779785156, "global_step": 164440, "epoch": 978} {"train_loss": -8.576700210571289, "global_step": 164441, "epoch": 978} {"train_loss": -9.627786636352539, "global_step": 164442, "epoch": 978} {"train_loss": -9.186960220336914, "global_step": 164443, "epoch": 978} {"train_loss": -9.147737503051758, "global_step": 164444, "epoch": 978} {"train_loss": -9.79356575012207, "global_step": 164445, "epoch": 978} {"train_loss": -8.735217094421387, "global_step": 164446, "epoch": 978} {"train_loss": -9.56147289276123, "global_step": 164447, "epoch": 978} {"train_loss": -9.732120513916016, "global_step": 164448, "epoch": 978} {"train_loss": -8.956769943237305, "global_step": 164449, "epoch": 978} {"train_loss": -9.136124610900879, "global_step": 164450, "epoch": 978} {"train_loss": -9.13184928894043, "global_step": 164451, "epoch": 978} {"train_loss": -9.492438316345215, "global_step": 164452, "epoch": 978} {"train_loss": -10.073891639709473, "global_step": 164453, "epoch": 978} {"train_loss": -8.938467025756836, "global_step": 164454, "epoch": 978} {"train_loss": -10.136878967285156, "global_step": 164455, "epoch": 978} {"train_loss": -10.248750686645508, "global_step": 164456, "epoch": 978} {"train_loss": -9.39452838897705, "global_step": 164457, "epoch": 978} {"train_loss": -9.647438049316406, "global_step": 164458, "epoch": 978} {"train_loss": -9.978103637695312, "global_step": 164459, "epoch": 978} {"train_loss": -10.020550727844238, "global_step": 164460, "epoch": 978} {"train_loss": -10.077905654907227, "global_step": 164461, "epoch": 978} {"train_loss": -10.115431785583496, "global_step": 164462, "epoch": 978} {"train_loss": -10.321762084960938, "global_step": 164463, "epoch": 978} {"train_loss": -10.131864547729492, "global_step": 164464, "epoch": 978} {"train_loss": -9.771652221679688, "global_step": 164465, "epoch": 978} {"train_loss": -10.305831909179688, "global_step": 164466, "epoch": 978} {"train_loss": -10.412833213806152, "global_step": 164467, "epoch": 978} {"train_loss": -10.2489013671875, "global_step": 164468, "epoch": 978} {"train_loss": -10.232316970825195, "global_step": 164469, "epoch": 978} {"train_loss": -10.463747024536133, "global_step": 164470, "epoch": 978} {"train_loss": -10.289337385268439, "global_step": 164471, "epoch": 978, "val_loss": 237612.90625} {"train_loss": -10.256731033325195, "global_step": 164472, "epoch": 979} {"train_loss": -10.451229095458984, "global_step": 164473, "epoch": 979} {"train_loss": -10.339566230773926, "global_step": 164474, "epoch": 979} {"train_loss": -10.188518524169922, "global_step": 164475, "epoch": 979} {"train_loss": -10.371853828430176, "global_step": 164476, "epoch": 979} {"train_loss": -10.639793395996094, "global_step": 164477, "epoch": 979} {"train_loss": -10.656373977661133, "global_step": 164478, "epoch": 979} {"train_loss": -10.416419982910156, "global_step": 164479, "epoch": 979} {"train_loss": -10.666328430175781, "global_step": 164480, "epoch": 979} {"train_loss": -10.529887199401855, "global_step": 164481, "epoch": 979} {"train_loss": -10.655155181884766, "global_step": 164482, "epoch": 979} {"train_loss": -10.67515754699707, "global_step": 164483, "epoch": 979} {"train_loss": -10.686403274536133, "global_step": 164484, "epoch": 979} {"train_loss": -10.806489944458008, "global_step": 164485, "epoch": 979} {"train_loss": -10.891534805297852, "global_step": 164486, "epoch": 979} {"train_loss": -10.75319766998291, "global_step": 164487, "epoch": 979} {"train_loss": -10.702969551086426, "global_step": 164488, "epoch": 979} {"train_loss": -10.908206939697266, "global_step": 164489, "epoch": 979} {"train_loss": -10.812652587890625, "global_step": 164490, "epoch": 979} {"train_loss": -10.503190994262695, "global_step": 164491, "epoch": 979} {"train_loss": -10.763896942138672, "global_step": 164492, "epoch": 979} {"train_loss": -10.923693656921387, "global_step": 164493, "epoch": 979} {"train_loss": -10.873252868652344, "global_step": 164494, "epoch": 979} {"train_loss": -10.900798797607422, "global_step": 164495, "epoch": 979} {"train_loss": -10.96657943725586, "global_step": 164496, "epoch": 979} {"train_loss": -11.128026962280273, "global_step": 164497, "epoch": 979} {"train_loss": -10.84794807434082, "global_step": 164498, "epoch": 979} {"train_loss": -11.115275382995605, "global_step": 164499, "epoch": 979} {"train_loss": -11.06889533996582, "global_step": 164500, "epoch": 979} {"train_loss": -10.885209083557129, "global_step": 164501, "epoch": 979} {"train_loss": -11.038765907287598, "global_step": 164502, "epoch": 979} {"train_loss": -11.06200885772705, "global_step": 164503, "epoch": 979} {"train_loss": -11.175195693969727, "global_step": 164504, "epoch": 979} {"train_loss": -11.214296340942383, "global_step": 164505, "epoch": 979} {"train_loss": -10.839997291564941, "global_step": 164506, "epoch": 979} {"train_loss": -11.1031494140625, "global_step": 164507, "epoch": 979} {"train_loss": -11.303363800048828, "global_step": 164508, "epoch": 979} {"train_loss": -11.135296821594238, "global_step": 164509, "epoch": 979} {"train_loss": -10.97760009765625, "global_step": 164510, "epoch": 979} {"train_loss": -11.108144760131836, "global_step": 164511, "epoch": 979} {"train_loss": -11.314085006713867, "global_step": 164512, "epoch": 979} {"train_loss": -11.097663879394531, "global_step": 164513, "epoch": 979} {"train_loss": -11.402958869934082, "global_step": 164514, "epoch": 979} {"train_loss": -11.247782707214355, "global_step": 164515, "epoch": 979} {"train_loss": -11.155546188354492, "global_step": 164516, "epoch": 979} {"train_loss": -11.308280944824219, "global_step": 164517, "epoch": 979} {"train_loss": -11.107574462890625, "global_step": 164518, "epoch": 979} {"train_loss": -11.23092269897461, "global_step": 164519, "epoch": 979} {"train_loss": -11.406325340270996, "global_step": 164520, "epoch": 979} {"train_loss": -11.41914176940918, "global_step": 164521, "epoch": 979} {"train_loss": -11.089239120483398, "global_step": 164522, "epoch": 979} {"train_loss": -11.387784957885742, "global_step": 164523, "epoch": 979} {"train_loss": -11.455963134765625, "global_step": 164524, "epoch": 979} {"train_loss": -11.058401107788086, "global_step": 164525, "epoch": 979} {"train_loss": -11.05820083618164, "global_step": 164526, "epoch": 979} {"train_loss": -11.230976104736328, "global_step": 164527, "epoch": 979} {"train_loss": -11.125144958496094, "global_step": 164528, "epoch": 979} {"train_loss": -11.451311111450195, "global_step": 164529, "epoch": 979} {"train_loss": -11.096317291259766, "global_step": 164530, "epoch": 979} {"train_loss": -10.99144172668457, "global_step": 164531, "epoch": 979} {"train_loss": -11.079097747802734, "global_step": 164532, "epoch": 979} {"train_loss": -11.25423526763916, "global_step": 164533, "epoch": 979} {"train_loss": -11.024803161621094, "global_step": 164534, "epoch": 979} {"train_loss": -11.121674537658691, "global_step": 164535, "epoch": 979} {"train_loss": -11.056890487670898, "global_step": 164536, "epoch": 979} {"train_loss": -10.780885696411133, "global_step": 164537, "epoch": 979} {"train_loss": -10.921432495117188, "global_step": 164538, "epoch": 979} {"train_loss": -10.74848747253418, "global_step": 164539, "epoch": 979} {"train_loss": -10.912797927856445, "global_step": 164540, "epoch": 979} {"train_loss": -10.83853530883789, "global_step": 164541, "epoch": 979} {"train_loss": -11.016195297241211, "global_step": 164542, "epoch": 979} {"train_loss": -10.630391120910645, "global_step": 164543, "epoch": 979} {"train_loss": -11.059090614318848, "global_step": 164544, "epoch": 979} {"train_loss": -10.673601150512695, "global_step": 164545, "epoch": 979} {"train_loss": -10.654272079467773, "global_step": 164546, "epoch": 979} {"train_loss": -10.612614631652832, "global_step": 164547, "epoch": 979} {"train_loss": -11.081331253051758, "global_step": 164548, "epoch": 979} {"train_loss": -10.08427619934082, "global_step": 164549, "epoch": 979} {"train_loss": -11.207971572875977, "global_step": 164550, "epoch": 979} {"train_loss": -10.792701721191406, "global_step": 164551, "epoch": 979} {"train_loss": -11.019643783569336, "global_step": 164552, "epoch": 979} {"train_loss": -10.972545623779297, "global_step": 164553, "epoch": 979} {"train_loss": -11.124406814575195, "global_step": 164554, "epoch": 979} {"train_loss": -11.371423721313477, "global_step": 164555, "epoch": 979} {"train_loss": -11.101966857910156, "global_step": 164556, "epoch": 979} {"train_loss": -11.172805786132812, "global_step": 164557, "epoch": 979} {"train_loss": -11.054962158203125, "global_step": 164558, "epoch": 979} {"train_loss": -10.74687671661377, "global_step": 164559, "epoch": 979} {"train_loss": -10.810770034790039, "global_step": 164560, "epoch": 979} {"train_loss": -10.874347686767578, "global_step": 164561, "epoch": 979} {"train_loss": -10.963817596435547, "global_step": 164562, "epoch": 979} {"train_loss": -10.619288444519043, "global_step": 164563, "epoch": 979} {"train_loss": -10.8880615234375, "global_step": 164564, "epoch": 979} {"train_loss": -10.628928184509277, "global_step": 164565, "epoch": 979} {"train_loss": -10.921783447265625, "global_step": 164566, "epoch": 979} {"train_loss": -11.058083534240723, "global_step": 164567, "epoch": 979} {"train_loss": -10.900440216064453, "global_step": 164568, "epoch": 979} {"train_loss": -11.003772735595703, "global_step": 164569, "epoch": 979} {"train_loss": -10.88477897644043, "global_step": 164570, "epoch": 979} {"train_loss": -10.945342063903809, "global_step": 164571, "epoch": 979} {"train_loss": -10.840888977050781, "global_step": 164572, "epoch": 979} {"train_loss": -10.920740127563477, "global_step": 164573, "epoch": 979} {"train_loss": -11.07818603515625, "global_step": 164574, "epoch": 979} {"train_loss": -10.903522491455078, "global_step": 164575, "epoch": 979} {"train_loss": -11.222509384155273, "global_step": 164576, "epoch": 979} {"train_loss": -10.913408279418945, "global_step": 164577, "epoch": 979} {"train_loss": -10.457592010498047, "global_step": 164578, "epoch": 979} {"train_loss": -10.970001220703125, "global_step": 164579, "epoch": 979} {"train_loss": -11.152603149414062, "global_step": 164580, "epoch": 979} {"train_loss": -10.810413360595703, "global_step": 164581, "epoch": 979} {"train_loss": -10.985788345336914, "global_step": 164582, "epoch": 979} {"train_loss": -10.739879608154297, "global_step": 164583, "epoch": 979} {"train_loss": -10.205978393554688, "global_step": 164584, "epoch": 979} {"train_loss": -10.846721649169922, "global_step": 164585, "epoch": 979} {"train_loss": -10.406511306762695, "global_step": 164586, "epoch": 979} {"train_loss": -10.27098274230957, "global_step": 164587, "epoch": 979} {"train_loss": -10.874241828918457, "global_step": 164588, "epoch": 979} {"train_loss": -10.498025894165039, "global_step": 164589, "epoch": 979} {"train_loss": -10.799481391906738, "global_step": 164590, "epoch": 979} {"train_loss": -10.45289421081543, "global_step": 164591, "epoch": 979} {"train_loss": -10.303062438964844, "global_step": 164592, "epoch": 979} {"train_loss": -10.877482414245605, "global_step": 164593, "epoch": 979} {"train_loss": -10.452068328857422, "global_step": 164594, "epoch": 979} {"train_loss": -10.734736442565918, "global_step": 164595, "epoch": 979} {"train_loss": -10.691701889038086, "global_step": 164596, "epoch": 979} {"train_loss": -10.628015518188477, "global_step": 164597, "epoch": 979} {"train_loss": -10.627440452575684, "global_step": 164598, "epoch": 979} {"train_loss": -10.415054321289062, "global_step": 164599, "epoch": 979} {"train_loss": -9.830799102783203, "global_step": 164600, "epoch": 979} {"train_loss": -11.092233657836914, "global_step": 164601, "epoch": 979} {"train_loss": -9.928543090820312, "global_step": 164602, "epoch": 979} {"train_loss": -10.78204345703125, "global_step": 164603, "epoch": 979} {"train_loss": -10.033988952636719, "global_step": 164604, "epoch": 979} {"train_loss": -10.53423023223877, "global_step": 164605, "epoch": 979} {"train_loss": -10.765034675598145, "global_step": 164606, "epoch": 979} {"train_loss": -10.020550727844238, "global_step": 164607, "epoch": 979} {"train_loss": -10.616022109985352, "global_step": 164608, "epoch": 979} {"train_loss": -10.491305351257324, "global_step": 164609, "epoch": 979} {"train_loss": -10.582780838012695, "global_step": 164610, "epoch": 979} {"train_loss": -10.849862098693848, "global_step": 164611, "epoch": 979} {"train_loss": -10.356751441955566, "global_step": 164612, "epoch": 979} {"train_loss": -10.748697280883789, "global_step": 164613, "epoch": 979} {"train_loss": -10.833841323852539, "global_step": 164614, "epoch": 979} {"train_loss": -10.591289520263672, "global_step": 164615, "epoch": 979} {"train_loss": -11.017021179199219, "global_step": 164616, "epoch": 979} {"train_loss": -10.622915267944336, "global_step": 164617, "epoch": 979} {"train_loss": -10.707587242126465, "global_step": 164618, "epoch": 979} {"train_loss": -10.913698196411133, "global_step": 164619, "epoch": 979} {"train_loss": -10.771331787109375, "global_step": 164620, "epoch": 979} {"train_loss": -10.969154357910156, "global_step": 164621, "epoch": 979} {"train_loss": -10.863286972045898, "global_step": 164622, "epoch": 979} {"train_loss": -10.828339576721191, "global_step": 164623, "epoch": 979} {"train_loss": -11.142541885375977, "global_step": 164624, "epoch": 979} {"train_loss": -10.913505554199219, "global_step": 164625, "epoch": 979} {"train_loss": -10.985420227050781, "global_step": 164626, "epoch": 979} {"train_loss": -11.074432373046875, "global_step": 164627, "epoch": 979} {"train_loss": -10.886765480041504, "global_step": 164628, "epoch": 979} {"train_loss": -10.950855255126953, "global_step": 164629, "epoch": 979} {"train_loss": -10.783544540405273, "global_step": 164630, "epoch": 979} {"train_loss": -11.174907684326172, "global_step": 164631, "epoch": 979} {"train_loss": -11.012617111206055, "global_step": 164632, "epoch": 979} {"train_loss": -10.902263641357422, "global_step": 164633, "epoch": 979} {"train_loss": -11.01594352722168, "global_step": 164634, "epoch": 979} {"train_loss": -11.035223007202148, "global_step": 164635, "epoch": 979} {"train_loss": -10.864429473876953, "global_step": 164636, "epoch": 979} {"train_loss": -11.070533752441406, "global_step": 164637, "epoch": 979} {"train_loss": -11.105880737304688, "global_step": 164638, "epoch": 979} {"train_loss": -10.859974077769689, "global_step": 164639, "epoch": 979, "val_loss": 238359.1875} {"train_loss": -11.107190132141113, "global_step": 164640, "epoch": 980} {"train_loss": -11.157317161560059, "global_step": 164641, "epoch": 980} {"train_loss": -10.95553970336914, "global_step": 164642, "epoch": 980} {"train_loss": -10.937211990356445, "global_step": 164643, "epoch": 980} {"train_loss": -10.826898574829102, "global_step": 164644, "epoch": 980} {"train_loss": -11.14522933959961, "global_step": 164645, "epoch": 980} {"train_loss": -10.767154693603516, "global_step": 164646, "epoch": 980} {"train_loss": -10.974413871765137, "global_step": 164647, "epoch": 980} {"train_loss": -10.569637298583984, "global_step": 164648, "epoch": 980} {"train_loss": -10.740283012390137, "global_step": 164649, "epoch": 980} {"train_loss": -10.863301277160645, "global_step": 164650, "epoch": 980} {"train_loss": -10.582601547241211, "global_step": 164651, "epoch": 980} {"train_loss": -10.964033126831055, "global_step": 164652, "epoch": 980} {"train_loss": -10.390115737915039, "global_step": 164653, "epoch": 980} {"train_loss": -10.649381637573242, "global_step": 164654, "epoch": 980} {"train_loss": -10.957845687866211, "global_step": 164655, "epoch": 980} {"train_loss": -10.703609466552734, "global_step": 164656, "epoch": 980} {"train_loss": -11.03260612487793, "global_step": 164657, "epoch": 980} {"train_loss": -10.87228012084961, "global_step": 164658, "epoch": 980} {"train_loss": -11.057003021240234, "global_step": 164659, "epoch": 980} {"train_loss": -11.031139373779297, "global_step": 164660, "epoch": 980} {"train_loss": -10.966739654541016, "global_step": 164661, "epoch": 980} {"train_loss": -10.763630867004395, "global_step": 164662, "epoch": 980} {"train_loss": -10.61352252960205, "global_step": 164663, "epoch": 980} {"train_loss": -10.545767784118652, "global_step": 164664, "epoch": 980} {"train_loss": -10.936687469482422, "global_step": 164665, "epoch": 980} {"train_loss": -11.049939155578613, "global_step": 164666, "epoch": 980} {"train_loss": -10.76858139038086, "global_step": 164667, "epoch": 980} {"train_loss": -10.978076934814453, "global_step": 164668, "epoch": 980} {"train_loss": -10.75421142578125, "global_step": 164669, "epoch": 980} {"train_loss": -10.789742469787598, "global_step": 164670, "epoch": 980} {"train_loss": -10.67768669128418, "global_step": 164671, "epoch": 980} {"train_loss": -10.534003257751465, "global_step": 164672, "epoch": 980} {"train_loss": -10.915245056152344, "global_step": 164673, "epoch": 980} {"train_loss": -10.713342666625977, "global_step": 164674, "epoch": 980} {"train_loss": -10.86964225769043, "global_step": 164675, "epoch": 980} {"train_loss": -11.029969215393066, "global_step": 164676, "epoch": 980} {"train_loss": -10.965269088745117, "global_step": 164677, "epoch": 980} {"train_loss": -10.837516784667969, "global_step": 164678, "epoch": 980} {"train_loss": -11.008832931518555, "global_step": 164679, "epoch": 980} {"train_loss": -10.999109268188477, "global_step": 164680, "epoch": 980} {"train_loss": -10.820030212402344, "global_step": 164681, "epoch": 980} {"train_loss": -10.7972412109375, "global_step": 164682, "epoch": 980} {"train_loss": -11.163515090942383, "global_step": 164683, "epoch": 980} {"train_loss": -11.070927619934082, "global_step": 164684, "epoch": 980} {"train_loss": -11.267950057983398, "global_step": 164685, "epoch": 980} {"train_loss": -10.972920417785645, "global_step": 164686, "epoch": 980} {"train_loss": -11.178519248962402, "global_step": 164687, "epoch": 980} {"train_loss": -11.043456077575684, "global_step": 164688, "epoch": 980} {"train_loss": -11.4335298538208, "global_step": 164689, "epoch": 980} {"train_loss": -11.024664878845215, "global_step": 164690, "epoch": 980} {"train_loss": -10.950785636901855, "global_step": 164691, "epoch": 980} {"train_loss": -11.242300033569336, "global_step": 164692, "epoch": 980} {"train_loss": -10.668877601623535, "global_step": 164693, "epoch": 980} {"train_loss": -10.85479736328125, "global_step": 164694, "epoch": 980} {"train_loss": -11.205327987670898, "global_step": 164695, "epoch": 980} {"train_loss": -10.828916549682617, "global_step": 164696, "epoch": 980} {"train_loss": -11.084362030029297, "global_step": 164697, "epoch": 980} {"train_loss": -10.976438522338867, "global_step": 164698, "epoch": 980} {"train_loss": -10.73044490814209, "global_step": 164699, "epoch": 980} {"train_loss": -11.019277572631836, "global_step": 164700, "epoch": 980} {"train_loss": -10.678417205810547, "global_step": 164701, "epoch": 980} {"train_loss": -11.085716247558594, "global_step": 164702, "epoch": 980} {"train_loss": -10.909746170043945, "global_step": 164703, "epoch": 980} {"train_loss": -10.899866104125977, "global_step": 164704, "epoch": 980} {"train_loss": -11.080873489379883, "global_step": 164705, "epoch": 980} {"train_loss": -10.574616432189941, "global_step": 164706, "epoch": 980} {"train_loss": -11.035932540893555, "global_step": 164707, "epoch": 980} {"train_loss": -10.509798049926758, "global_step": 164708, "epoch": 980} {"train_loss": -11.44736099243164, "global_step": 164709, "epoch": 980} {"train_loss": -10.761364936828613, "global_step": 164710, "epoch": 980} {"train_loss": -10.943140029907227, "global_step": 164711, "epoch": 980} {"train_loss": -11.365474700927734, "global_step": 164712, "epoch": 980} {"train_loss": -10.90965461730957, "global_step": 164713, "epoch": 980} {"train_loss": -11.097600936889648, "global_step": 164714, "epoch": 980} {"train_loss": -10.741518020629883, "global_step": 164715, "epoch": 980} {"train_loss": -10.988037109375, "global_step": 164716, "epoch": 980} {"train_loss": -10.79005241394043, "global_step": 164717, "epoch": 980} {"train_loss": -10.909893035888672, "global_step": 164718, "epoch": 980} {"train_loss": -11.025174140930176, "global_step": 164719, "epoch": 980} {"train_loss": -10.737384796142578, "global_step": 164720, "epoch": 980} {"train_loss": -10.966736793518066, "global_step": 164721, "epoch": 980} {"train_loss": -10.92630672454834, "global_step": 164722, "epoch": 980} {"train_loss": -10.729057312011719, "global_step": 164723, "epoch": 980} {"train_loss": -11.175403594970703, "global_step": 164724, "epoch": 980} {"train_loss": -11.014114379882812, "global_step": 164725, "epoch": 980} {"train_loss": -11.306090354919434, "global_step": 164726, "epoch": 980} {"train_loss": -10.822785377502441, "global_step": 164727, "epoch": 980} {"train_loss": -10.922714233398438, "global_step": 164728, "epoch": 980} {"train_loss": -11.042762756347656, "global_step": 164729, "epoch": 980} {"train_loss": -10.641395568847656, "global_step": 164730, "epoch": 980} {"train_loss": -10.66130542755127, "global_step": 164731, "epoch": 980} {"train_loss": -10.839494705200195, "global_step": 164732, "epoch": 980} {"train_loss": -10.600162506103516, "global_step": 164733, "epoch": 980} {"train_loss": -10.485077857971191, "global_step": 164734, "epoch": 980} {"train_loss": -11.052237510681152, "global_step": 164735, "epoch": 980} {"train_loss": -10.87697696685791, "global_step": 164736, "epoch": 980} {"train_loss": -10.785621643066406, "global_step": 164737, "epoch": 980} {"train_loss": -10.713438987731934, "global_step": 164738, "epoch": 980} {"train_loss": -10.137674331665039, "global_step": 164739, "epoch": 980} {"train_loss": -11.077821731567383, "global_step": 164740, "epoch": 980} {"train_loss": -10.543172836303711, "global_step": 164741, "epoch": 980} {"train_loss": -10.444945335388184, "global_step": 164742, "epoch": 980} {"train_loss": -10.908787727355957, "global_step": 164743, "epoch": 980} {"train_loss": -10.293798446655273, "global_step": 164744, "epoch": 980} {"train_loss": -11.003349304199219, "global_step": 164745, "epoch": 980} {"train_loss": -10.277206420898438, "global_step": 164746, "epoch": 980} {"train_loss": -10.013457298278809, "global_step": 164747, "epoch": 980} {"train_loss": -10.98421573638916, "global_step": 164748, "epoch": 980} {"train_loss": -10.323973655700684, "global_step": 164749, "epoch": 980} {"train_loss": -10.520078659057617, "global_step": 164750, "epoch": 980} {"train_loss": -10.362516403198242, "global_step": 164751, "epoch": 980} {"train_loss": -10.907469749450684, "global_step": 164752, "epoch": 980} {"train_loss": -10.371431350708008, "global_step": 164753, "epoch": 980} {"train_loss": -11.017393112182617, "global_step": 164754, "epoch": 980} {"train_loss": -10.45573616027832, "global_step": 164755, "epoch": 980} {"train_loss": -10.583168029785156, "global_step": 164756, "epoch": 980} {"train_loss": -10.911092758178711, "global_step": 164757, "epoch": 980} {"train_loss": -10.484963417053223, "global_step": 164758, "epoch": 980} {"train_loss": -10.840323448181152, "global_step": 164759, "epoch": 980} {"train_loss": -10.753213882446289, "global_step": 164760, "epoch": 980} {"train_loss": -10.670639038085938, "global_step": 164761, "epoch": 980} {"train_loss": -10.814577102661133, "global_step": 164762, "epoch": 980} {"train_loss": -10.513046264648438, "global_step": 164763, "epoch": 980} {"train_loss": -10.833934783935547, "global_step": 164764, "epoch": 980} {"train_loss": -10.828516006469727, "global_step": 164765, "epoch": 980} {"train_loss": -10.71856689453125, "global_step": 164766, "epoch": 980} {"train_loss": -10.92426872253418, "global_step": 164767, "epoch": 980} {"train_loss": -10.901627540588379, "global_step": 164768, "epoch": 980} {"train_loss": -10.648527145385742, "global_step": 164769, "epoch": 980} {"train_loss": -10.55224323272705, "global_step": 164770, "epoch": 980} {"train_loss": -10.44184398651123, "global_step": 164771, "epoch": 980} {"train_loss": -10.654565811157227, "global_step": 164772, "epoch": 980} {"train_loss": -10.714948654174805, "global_step": 164773, "epoch": 980} {"train_loss": -10.733081817626953, "global_step": 164774, "epoch": 980} {"train_loss": -10.6132173538208, "global_step": 164775, "epoch": 980} {"train_loss": -10.84522819519043, "global_step": 164776, "epoch": 980} {"train_loss": -10.768648147583008, "global_step": 164777, "epoch": 980} {"train_loss": -10.775896072387695, "global_step": 164778, "epoch": 980} {"train_loss": -10.730010986328125, "global_step": 164779, "epoch": 980} {"train_loss": -10.579530715942383, "global_step": 164780, "epoch": 980} {"train_loss": -10.45931339263916, "global_step": 164781, "epoch": 980} {"train_loss": -11.071712493896484, "global_step": 164782, "epoch": 980} {"train_loss": -10.814363479614258, "global_step": 164783, "epoch": 980} {"train_loss": -10.906274795532227, "global_step": 164784, "epoch": 980} {"train_loss": -10.636817932128906, "global_step": 164785, "epoch": 980} {"train_loss": -11.052494049072266, "global_step": 164786, "epoch": 980} {"train_loss": -11.029438018798828, "global_step": 164787, "epoch": 980} {"train_loss": -11.148604393005371, "global_step": 164788, "epoch": 980} {"train_loss": -10.934440612792969, "global_step": 164789, "epoch": 980} {"train_loss": -11.124547004699707, "global_step": 164790, "epoch": 980} {"train_loss": -10.93752670288086, "global_step": 164791, "epoch": 980} {"train_loss": -11.162467002868652, "global_step": 164792, "epoch": 980} {"train_loss": -11.01496696472168, "global_step": 164793, "epoch": 980} {"train_loss": -10.992294311523438, "global_step": 164794, "epoch": 980} {"train_loss": -11.113374710083008, "global_step": 164795, "epoch": 980} {"train_loss": -11.243868827819824, "global_step": 164796, "epoch": 980} {"train_loss": -10.9169921875, "global_step": 164797, "epoch": 980} {"train_loss": -11.343721389770508, "global_step": 164798, "epoch": 980} {"train_loss": -11.095867156982422, "global_step": 164799, "epoch": 980} {"train_loss": -11.124463081359863, "global_step": 164800, "epoch": 980} {"train_loss": -11.056258201599121, "global_step": 164801, "epoch": 980} {"train_loss": -11.152420043945312, "global_step": 164802, "epoch": 980} {"train_loss": -11.36235237121582, "global_step": 164803, "epoch": 980} {"train_loss": -11.176839828491211, "global_step": 164804, "epoch": 980} {"train_loss": -11.327522277832031, "global_step": 164805, "epoch": 980} {"train_loss": -11.268277168273926, "global_step": 164806, "epoch": 980} {"train_loss": -10.86635130360013, "global_step": 164807, "epoch": 980, "val_loss": 238236.6875, "train_action_mse_error": 2.0180583000183105} {"train_loss": -11.10885238647461, "global_step": 164808, "epoch": 981} {"train_loss": -11.224336624145508, "global_step": 164809, "epoch": 981} {"train_loss": -11.167640686035156, "global_step": 164810, "epoch": 981} {"train_loss": -11.210087776184082, "global_step": 164811, "epoch": 981} {"train_loss": -11.357452392578125, "global_step": 164812, "epoch": 981} {"train_loss": -11.199100494384766, "global_step": 164813, "epoch": 981} {"train_loss": -11.34981632232666, "global_step": 164814, "epoch": 981} {"train_loss": -11.0169677734375, "global_step": 164815, "epoch": 981} {"train_loss": -11.336084365844727, "global_step": 164816, "epoch": 981} {"train_loss": -10.957670211791992, "global_step": 164817, "epoch": 981} {"train_loss": -11.248502731323242, "global_step": 164818, "epoch": 981} {"train_loss": -11.25018310546875, "global_step": 164819, "epoch": 981} {"train_loss": -11.15815258026123, "global_step": 164820, "epoch": 981} {"train_loss": -11.225968360900879, "global_step": 164821, "epoch": 981} {"train_loss": -11.330249786376953, "global_step": 164822, "epoch": 981} {"train_loss": -11.357267379760742, "global_step": 164823, "epoch": 981} {"train_loss": -11.395713806152344, "global_step": 164824, "epoch": 981} {"train_loss": -11.149749755859375, "global_step": 164825, "epoch": 981} {"train_loss": -11.207279205322266, "global_step": 164826, "epoch": 981} {"train_loss": -10.951102256774902, "global_step": 164827, "epoch": 981} {"train_loss": -10.718626022338867, "global_step": 164828, "epoch": 981} {"train_loss": -10.667619705200195, "global_step": 164829, "epoch": 981} {"train_loss": -11.020347595214844, "global_step": 164830, "epoch": 981} {"train_loss": -10.964088439941406, "global_step": 164831, "epoch": 981} {"train_loss": -11.166291236877441, "global_step": 164832, "epoch": 981} {"train_loss": -11.09953498840332, "global_step": 164833, "epoch": 981} {"train_loss": -11.031242370605469, "global_step": 164834, "epoch": 981} {"train_loss": -10.435779571533203, "global_step": 164835, "epoch": 981} {"train_loss": -10.946489334106445, "global_step": 164836, "epoch": 981} {"train_loss": -10.890220642089844, "global_step": 164837, "epoch": 981} {"train_loss": -11.193624496459961, "global_step": 164838, "epoch": 981} {"train_loss": -10.769231796264648, "global_step": 164839, "epoch": 981} {"train_loss": -10.420816421508789, "global_step": 164840, "epoch": 981} {"train_loss": -10.250828742980957, "global_step": 164841, "epoch": 981} {"train_loss": -10.344538688659668, "global_step": 164842, "epoch": 981} {"train_loss": -9.457793235778809, "global_step": 164843, "epoch": 981} {"train_loss": -9.915163040161133, "global_step": 164844, "epoch": 981} {"train_loss": -9.636748313903809, "global_step": 164845, "epoch": 981} {"train_loss": -9.982837677001953, "global_step": 164846, "epoch": 981} {"train_loss": -10.632001876831055, "global_step": 164847, "epoch": 981} {"train_loss": -10.354610443115234, "global_step": 164848, "epoch": 981} {"train_loss": -10.812124252319336, "global_step": 164849, "epoch": 981} {"train_loss": -10.471842765808105, "global_step": 164850, "epoch": 981} {"train_loss": -10.970379829406738, "global_step": 164851, "epoch": 981} {"train_loss": -10.595712661743164, "global_step": 164852, "epoch": 981} {"train_loss": -10.700154304504395, "global_step": 164853, "epoch": 981} {"train_loss": -10.78726577758789, "global_step": 164854, "epoch": 981} {"train_loss": -10.70091724395752, "global_step": 164855, "epoch": 981} {"train_loss": -10.759599685668945, "global_step": 164856, "epoch": 981} {"train_loss": -11.054304122924805, "global_step": 164857, "epoch": 981} {"train_loss": -10.465019226074219, "global_step": 164858, "epoch": 981} {"train_loss": -10.960134506225586, "global_step": 164859, "epoch": 981} {"train_loss": -10.606332778930664, "global_step": 164860, "epoch": 981} {"train_loss": -10.808349609375, "global_step": 164861, "epoch": 981} {"train_loss": -10.48478889465332, "global_step": 164862, "epoch": 981} {"train_loss": -10.934804916381836, "global_step": 164863, "epoch": 981} {"train_loss": -10.648743629455566, "global_step": 164864, "epoch": 981} {"train_loss": -10.650405883789062, "global_step": 164865, "epoch": 981} {"train_loss": -10.629827499389648, "global_step": 164866, "epoch": 981} {"train_loss": -10.64906120300293, "global_step": 164867, "epoch": 981} {"train_loss": -10.106500625610352, "global_step": 164868, "epoch": 981} {"train_loss": -10.66614818572998, "global_step": 164869, "epoch": 981} {"train_loss": -10.693580627441406, "global_step": 164870, "epoch": 981} {"train_loss": -9.545991897583008, "global_step": 164871, "epoch": 981} {"train_loss": -10.363594055175781, "global_step": 164872, "epoch": 981} {"train_loss": -9.676481246948242, "global_step": 164873, "epoch": 981} {"train_loss": -10.556568145751953, "global_step": 164874, "epoch": 981} {"train_loss": -9.594539642333984, "global_step": 164875, "epoch": 981} {"train_loss": -10.670944213867188, "global_step": 164876, "epoch": 981} {"train_loss": -9.587385177612305, "global_step": 164877, "epoch": 981} {"train_loss": -10.694015502929688, "global_step": 164878, "epoch": 981} {"train_loss": -10.441816329956055, "global_step": 164879, "epoch": 981} {"train_loss": -10.234919548034668, "global_step": 164880, "epoch": 981} {"train_loss": -10.333503723144531, "global_step": 164881, "epoch": 981} {"train_loss": -10.545294761657715, "global_step": 164882, "epoch": 981} {"train_loss": -10.14503288269043, "global_step": 164883, "epoch": 981} {"train_loss": -10.67971420288086, "global_step": 164884, "epoch": 981} {"train_loss": -10.926372528076172, "global_step": 164885, "epoch": 981} {"train_loss": -10.409135818481445, "global_step": 164886, "epoch": 981} {"train_loss": -10.221125602722168, "global_step": 164887, "epoch": 981} {"train_loss": -10.822403907775879, "global_step": 164888, "epoch": 981} {"train_loss": -10.408212661743164, "global_step": 164889, "epoch": 981} {"train_loss": -11.021482467651367, "global_step": 164890, "epoch": 981} {"train_loss": -10.499748229980469, "global_step": 164891, "epoch": 981} {"train_loss": -10.522867202758789, "global_step": 164892, "epoch": 981} {"train_loss": -10.588272094726562, "global_step": 164893, "epoch": 981} {"train_loss": -10.714550018310547, "global_step": 164894, "epoch": 981} {"train_loss": -10.58687973022461, "global_step": 164895, "epoch": 981} {"train_loss": -10.898387908935547, "global_step": 164896, "epoch": 981} {"train_loss": -10.581008911132812, "global_step": 164897, "epoch": 981} {"train_loss": -10.957087516784668, "global_step": 164898, "epoch": 981} {"train_loss": -10.876500129699707, "global_step": 164899, "epoch": 981} {"train_loss": -11.00667667388916, "global_step": 164900, "epoch": 981} {"train_loss": -10.597539901733398, "global_step": 164901, "epoch": 981} {"train_loss": -10.821700096130371, "global_step": 164902, "epoch": 981} {"train_loss": -10.745819091796875, "global_step": 164903, "epoch": 981} {"train_loss": -10.702404022216797, "global_step": 164904, "epoch": 981} {"train_loss": -10.968412399291992, "global_step": 164905, "epoch": 981} {"train_loss": -10.925325393676758, "global_step": 164906, "epoch": 981} {"train_loss": -11.033185005187988, "global_step": 164907, "epoch": 981} {"train_loss": -10.878042221069336, "global_step": 164908, "epoch": 981} {"train_loss": -10.845224380493164, "global_step": 164909, "epoch": 981} {"train_loss": -11.091718673706055, "global_step": 164910, "epoch": 981} {"train_loss": -11.00685977935791, "global_step": 164911, "epoch": 981} {"train_loss": -11.104694366455078, "global_step": 164912, "epoch": 981} {"train_loss": -10.892572402954102, "global_step": 164913, "epoch": 981} {"train_loss": -11.17055892944336, "global_step": 164914, "epoch": 981} {"train_loss": -11.059852600097656, "global_step": 164915, "epoch": 981} {"train_loss": -11.056458473205566, "global_step": 164916, "epoch": 981} {"train_loss": -11.042562484741211, "global_step": 164917, "epoch": 981} {"train_loss": -11.085136413574219, "global_step": 164918, "epoch": 981} {"train_loss": -11.102444648742676, "global_step": 164919, "epoch": 981} {"train_loss": -11.005544662475586, "global_step": 164920, "epoch": 981} {"train_loss": -11.219990730285645, "global_step": 164921, "epoch": 981} {"train_loss": -11.178422927856445, "global_step": 164922, "epoch": 981} {"train_loss": -11.356358528137207, "global_step": 164923, "epoch": 981} {"train_loss": -11.276875495910645, "global_step": 164924, "epoch": 981} {"train_loss": -11.209747314453125, "global_step": 164925, "epoch": 981} {"train_loss": -11.147272109985352, "global_step": 164926, "epoch": 981} {"train_loss": -11.213191986083984, "global_step": 164927, "epoch": 981} {"train_loss": -11.351759910583496, "global_step": 164928, "epoch": 981} {"train_loss": -11.460201263427734, "global_step": 164929, "epoch": 981} {"train_loss": -11.262359619140625, "global_step": 164930, "epoch": 981} {"train_loss": -11.40377426147461, "global_step": 164931, "epoch": 981} {"train_loss": -11.356407165527344, "global_step": 164932, "epoch": 981} {"train_loss": -11.37874984741211, "global_step": 164933, "epoch": 981} {"train_loss": -11.0447998046875, "global_step": 164934, "epoch": 981} {"train_loss": -11.162005424499512, "global_step": 164935, "epoch": 981} {"train_loss": -11.197256088256836, "global_step": 164936, "epoch": 981} {"train_loss": -11.334857940673828, "global_step": 164937, "epoch": 981} {"train_loss": -11.263782501220703, "global_step": 164938, "epoch": 981} {"train_loss": -11.360018730163574, "global_step": 164939, "epoch": 981} {"train_loss": -10.63535213470459, "global_step": 164940, "epoch": 981} {"train_loss": -11.035545349121094, "global_step": 164941, "epoch": 981} {"train_loss": -11.35400676727295, "global_step": 164942, "epoch": 981} {"train_loss": -10.894424438476562, "global_step": 164943, "epoch": 981} {"train_loss": -11.318020820617676, "global_step": 164944, "epoch": 981} {"train_loss": -11.338869094848633, "global_step": 164945, "epoch": 981} {"train_loss": -11.239192962646484, "global_step": 164946, "epoch": 981} {"train_loss": -10.61763858795166, "global_step": 164947, "epoch": 981} {"train_loss": -10.091259002685547, "global_step": 164948, "epoch": 981} {"train_loss": -11.296646118164062, "global_step": 164949, "epoch": 981} {"train_loss": -10.54223346710205, "global_step": 164950, "epoch": 981} {"train_loss": -10.61202621459961, "global_step": 164951, "epoch": 981} {"train_loss": -11.173620223999023, "global_step": 164952, "epoch": 981} {"train_loss": -10.005319595336914, "global_step": 164953, "epoch": 981} {"train_loss": -9.435134887695312, "global_step": 164954, "epoch": 981} {"train_loss": -10.967936515808105, "global_step": 164955, "epoch": 981} {"train_loss": -10.384883880615234, "global_step": 164956, "epoch": 981} {"train_loss": -9.240034103393555, "global_step": 164957, "epoch": 981} {"train_loss": -9.83942985534668, "global_step": 164958, "epoch": 981} {"train_loss": -10.848746299743652, "global_step": 164959, "epoch": 981} {"train_loss": -10.138181686401367, "global_step": 164960, "epoch": 981} {"train_loss": -10.140143394470215, "global_step": 164961, "epoch": 981} {"train_loss": -10.592952728271484, "global_step": 164962, "epoch": 981} {"train_loss": -10.352885246276855, "global_step": 164963, "epoch": 981} {"train_loss": -10.392141342163086, "global_step": 164964, "epoch": 981} {"train_loss": -10.702552795410156, "global_step": 164965, "epoch": 981} {"train_loss": -10.785280227661133, "global_step": 164966, "epoch": 981} {"train_loss": -10.816024780273438, "global_step": 164967, "epoch": 981} {"train_loss": -10.776046752929688, "global_step": 164968, "epoch": 981} {"train_loss": -10.944744110107422, "global_step": 164969, "epoch": 981} {"train_loss": -10.767951011657715, "global_step": 164970, "epoch": 981} {"train_loss": -10.794143676757812, "global_step": 164971, "epoch": 981} {"train_loss": -10.893641471862793, "global_step": 164972, "epoch": 981} {"train_loss": -11.104314804077148, "global_step": 164973, "epoch": 981} {"train_loss": -10.947277069091797, "global_step": 164974, "epoch": 981} {"train_loss": -10.787729427928017, "global_step": 164975, "epoch": 981, "val_loss": 235418.96875} {"train_loss": -10.97146987915039, "global_step": 164976, "epoch": 982} {"train_loss": -10.84400749206543, "global_step": 164977, "epoch": 982} {"train_loss": -10.975885391235352, "global_step": 164978, "epoch": 982} {"train_loss": -10.829225540161133, "global_step": 164979, "epoch": 982} {"train_loss": -10.903776168823242, "global_step": 164980, "epoch": 982} {"train_loss": -10.776561737060547, "global_step": 164981, "epoch": 982} {"train_loss": -10.94299602508545, "global_step": 164982, "epoch": 982} {"train_loss": -10.914436340332031, "global_step": 164983, "epoch": 982} {"train_loss": -11.099934577941895, "global_step": 164984, "epoch": 982} {"train_loss": -10.680612564086914, "global_step": 164985, "epoch": 982} {"train_loss": -10.796968460083008, "global_step": 164986, "epoch": 982} {"train_loss": -11.015298843383789, "global_step": 164987, "epoch": 982} {"train_loss": -10.56836223602295, "global_step": 164988, "epoch": 982} {"train_loss": -10.386667251586914, "global_step": 164989, "epoch": 982} {"train_loss": -10.962484359741211, "global_step": 164990, "epoch": 982} {"train_loss": -10.300592422485352, "global_step": 164991, "epoch": 982} {"train_loss": -9.970666885375977, "global_step": 164992, "epoch": 982} {"train_loss": -10.814413070678711, "global_step": 164993, "epoch": 982} {"train_loss": -10.347489356994629, "global_step": 164994, "epoch": 982} {"train_loss": -10.810659408569336, "global_step": 164995, "epoch": 982} {"train_loss": -10.212150573730469, "global_step": 164996, "epoch": 982} {"train_loss": -10.467211723327637, "global_step": 164997, "epoch": 982} {"train_loss": -10.595932960510254, "global_step": 164998, "epoch": 982} {"train_loss": -10.083263397216797, "global_step": 164999, "epoch": 982} {"train_loss": -10.241720199584961, "global_step": 165000, "epoch": 982} {"train_loss": -10.53758430480957, "global_step": 165001, "epoch": 982} {"train_loss": -10.422061920166016, "global_step": 165002, "epoch": 982} {"train_loss": -10.645752906799316, "global_step": 165003, "epoch": 982} {"train_loss": -10.223732948303223, "global_step": 165004, "epoch": 982} {"train_loss": -10.358081817626953, "global_step": 165005, "epoch": 982} {"train_loss": -10.499408721923828, "global_step": 165006, "epoch": 982} {"train_loss": -11.028524398803711, "global_step": 165007, "epoch": 982} {"train_loss": -9.579367637634277, "global_step": 165008, "epoch": 982} {"train_loss": -10.664901733398438, "global_step": 165009, "epoch": 982} {"train_loss": -9.886259078979492, "global_step": 165010, "epoch": 982} {"train_loss": -10.288724899291992, "global_step": 165011, "epoch": 982} {"train_loss": -10.48156452178955, "global_step": 165012, "epoch": 982} {"train_loss": -10.239518165588379, "global_step": 165013, "epoch": 982} {"train_loss": -10.643963813781738, "global_step": 165014, "epoch": 982} {"train_loss": -10.647285461425781, "global_step": 165015, "epoch": 982} {"train_loss": -10.741217613220215, "global_step": 165016, "epoch": 982} {"train_loss": -10.367050170898438, "global_step": 165017, "epoch": 982} {"train_loss": -10.76849365234375, "global_step": 165018, "epoch": 982} {"train_loss": -10.579447746276855, "global_step": 165019, "epoch": 982} {"train_loss": -10.622489929199219, "global_step": 165020, "epoch": 982} {"train_loss": -10.572595596313477, "global_step": 165021, "epoch": 982} {"train_loss": -10.944998741149902, "global_step": 165022, "epoch": 982} {"train_loss": -10.628371238708496, "global_step": 165023, "epoch": 982} {"train_loss": -10.798895835876465, "global_step": 165024, "epoch": 982} {"train_loss": -10.89552116394043, "global_step": 165025, "epoch": 982} {"train_loss": -10.564981460571289, "global_step": 165026, "epoch": 982} {"train_loss": -10.876035690307617, "global_step": 165027, "epoch": 982} {"train_loss": -10.853815078735352, "global_step": 165028, "epoch": 982} {"train_loss": -10.858707427978516, "global_step": 165029, "epoch": 982} {"train_loss": -10.881134033203125, "global_step": 165030, "epoch": 982} {"train_loss": -10.832623481750488, "global_step": 165031, "epoch": 982} {"train_loss": -10.896404266357422, "global_step": 165032, "epoch": 982} {"train_loss": -10.629119873046875, "global_step": 165033, "epoch": 982} {"train_loss": -10.898292541503906, "global_step": 165034, "epoch": 982} {"train_loss": -10.46468734741211, "global_step": 165035, "epoch": 982} {"train_loss": -10.882171630859375, "global_step": 165036, "epoch": 982} {"train_loss": -10.360228538513184, "global_step": 165037, "epoch": 982} {"train_loss": -11.07143783569336, "global_step": 165038, "epoch": 982} {"train_loss": -10.84816837310791, "global_step": 165039, "epoch": 982} {"train_loss": -11.007513046264648, "global_step": 165040, "epoch": 982} {"train_loss": -10.918600082397461, "global_step": 165041, "epoch": 982} {"train_loss": -10.808805465698242, "global_step": 165042, "epoch": 982} {"train_loss": -10.84268569946289, "global_step": 165043, "epoch": 982} {"train_loss": -11.04772663116455, "global_step": 165044, "epoch": 982} {"train_loss": -11.036139488220215, "global_step": 165045, "epoch": 982} {"train_loss": -11.030746459960938, "global_step": 165046, "epoch": 982} {"train_loss": -10.784831047058105, "global_step": 165047, "epoch": 982} {"train_loss": -11.180246353149414, "global_step": 165048, "epoch": 982} {"train_loss": -10.841205596923828, "global_step": 165049, "epoch": 982} {"train_loss": -10.869585037231445, "global_step": 165050, "epoch": 982} {"train_loss": -10.648685455322266, "global_step": 165051, "epoch": 982} {"train_loss": -11.100858688354492, "global_step": 165052, "epoch": 982} {"train_loss": -10.497063636779785, "global_step": 165053, "epoch": 982} {"train_loss": -10.831646919250488, "global_step": 165054, "epoch": 982} {"train_loss": -10.956107139587402, "global_step": 165055, "epoch": 982} {"train_loss": -10.832422256469727, "global_step": 165056, "epoch": 982} {"train_loss": -10.977167129516602, "global_step": 165057, "epoch": 982} {"train_loss": -10.93725299835205, "global_step": 165058, "epoch": 982} {"train_loss": -10.461448669433594, "global_step": 165059, "epoch": 982} {"train_loss": -11.071249008178711, "global_step": 165060, "epoch": 982} {"train_loss": -10.560303688049316, "global_step": 165061, "epoch": 982} {"train_loss": -10.884624481201172, "global_step": 165062, "epoch": 982} {"train_loss": -11.031635284423828, "global_step": 165063, "epoch": 982} {"train_loss": -10.884800910949707, "global_step": 165064, "epoch": 982} {"train_loss": -10.760299682617188, "global_step": 165065, "epoch": 982} {"train_loss": -11.119219779968262, "global_step": 165066, "epoch": 982} {"train_loss": -10.64553165435791, "global_step": 165067, "epoch": 982} {"train_loss": -11.038785934448242, "global_step": 165068, "epoch": 982} {"train_loss": -10.703859329223633, "global_step": 165069, "epoch": 982} {"train_loss": -11.061163902282715, "global_step": 165070, "epoch": 982} {"train_loss": -11.056889533996582, "global_step": 165071, "epoch": 982} {"train_loss": -11.087085723876953, "global_step": 165072, "epoch": 982} {"train_loss": -11.006739616394043, "global_step": 165073, "epoch": 982} {"train_loss": -11.299295425415039, "global_step": 165074, "epoch": 982} {"train_loss": -10.929216384887695, "global_step": 165075, "epoch": 982} {"train_loss": -11.1295166015625, "global_step": 165076, "epoch": 982} {"train_loss": -11.119950294494629, "global_step": 165077, "epoch": 982} {"train_loss": -11.010841369628906, "global_step": 165078, "epoch": 982} {"train_loss": -10.726441383361816, "global_step": 165079, "epoch": 982} {"train_loss": -11.065840721130371, "global_step": 165080, "epoch": 982} {"train_loss": -11.111576080322266, "global_step": 165081, "epoch": 982} {"train_loss": -10.979968070983887, "global_step": 165082, "epoch": 982} {"train_loss": -11.033254623413086, "global_step": 165083, "epoch": 982} {"train_loss": -10.816802978515625, "global_step": 165084, "epoch": 982} {"train_loss": -11.206855773925781, "global_step": 165085, "epoch": 982} {"train_loss": -11.16225528717041, "global_step": 165086, "epoch": 982} {"train_loss": -10.848498344421387, "global_step": 165087, "epoch": 982} {"train_loss": -11.163379669189453, "global_step": 165088, "epoch": 982} {"train_loss": -10.75460433959961, "global_step": 165089, "epoch": 982} {"train_loss": -11.375638008117676, "global_step": 165090, "epoch": 982} {"train_loss": -11.140109062194824, "global_step": 165091, "epoch": 982} {"train_loss": -11.281610488891602, "global_step": 165092, "epoch": 982} {"train_loss": -11.067911148071289, "global_step": 165093, "epoch": 982} {"train_loss": -11.35373306274414, "global_step": 165094, "epoch": 982} {"train_loss": -11.100994110107422, "global_step": 165095, "epoch": 982} {"train_loss": -11.254910469055176, "global_step": 165096, "epoch": 982} {"train_loss": -11.284477233886719, "global_step": 165097, "epoch": 982} {"train_loss": -11.358728408813477, "global_step": 165098, "epoch": 982} {"train_loss": -11.37657356262207, "global_step": 165099, "epoch": 982} {"train_loss": -11.428387641906738, "global_step": 165100, "epoch": 982} {"train_loss": -11.091983795166016, "global_step": 165101, "epoch": 982} {"train_loss": -11.041147232055664, "global_step": 165102, "epoch": 982} {"train_loss": -11.140920639038086, "global_step": 165103, "epoch": 982} {"train_loss": -11.11186695098877, "global_step": 165104, "epoch": 982} {"train_loss": -11.121759414672852, "global_step": 165105, "epoch": 982} {"train_loss": -10.406867027282715, "global_step": 165106, "epoch": 982} {"train_loss": -10.719377517700195, "global_step": 165107, "epoch": 982} {"train_loss": -10.953729629516602, "global_step": 165108, "epoch": 982} {"train_loss": -10.324209213256836, "global_step": 165109, "epoch": 982} {"train_loss": -10.180356979370117, "global_step": 165110, "epoch": 982} {"train_loss": -10.377923011779785, "global_step": 165111, "epoch": 982} {"train_loss": -11.141565322875977, "global_step": 165112, "epoch": 982} {"train_loss": -9.598413467407227, "global_step": 165113, "epoch": 982} {"train_loss": -10.264434814453125, "global_step": 165114, "epoch": 982} {"train_loss": -10.134134292602539, "global_step": 165115, "epoch": 982} {"train_loss": -8.607995986938477, "global_step": 165116, "epoch": 982} {"train_loss": -10.512141227722168, "global_step": 165117, "epoch": 982} {"train_loss": -7.501513481140137, "global_step": 165118, "epoch": 982} {"train_loss": -7.992895126342773, "global_step": 165119, "epoch": 982} {"train_loss": -8.869503021240234, "global_step": 165120, "epoch": 982} {"train_loss": -9.379231452941895, "global_step": 165121, "epoch": 982} {"train_loss": -8.454580307006836, "global_step": 165122, "epoch": 982} {"train_loss": -7.58711576461792, "global_step": 165123, "epoch": 982} {"train_loss": -9.842232704162598, "global_step": 165124, "epoch": 982} {"train_loss": -9.062395095825195, "global_step": 165125, "epoch": 982} {"train_loss": -8.413915634155273, "global_step": 165126, "epoch": 982} {"train_loss": -9.796905517578125, "global_step": 165127, "epoch": 982} {"train_loss": -9.744525909423828, "global_step": 165128, "epoch": 982} {"train_loss": -9.667390823364258, "global_step": 165129, "epoch": 982} {"train_loss": -9.927629470825195, "global_step": 165130, "epoch": 982} {"train_loss": -10.32502555847168, "global_step": 165131, "epoch": 982} {"train_loss": -10.149022102355957, "global_step": 165132, "epoch": 982} {"train_loss": -10.263071060180664, "global_step": 165133, "epoch": 982} {"train_loss": -10.330703735351562, "global_step": 165134, "epoch": 982} {"train_loss": -10.4144287109375, "global_step": 165135, "epoch": 982} {"train_loss": -10.551885604858398, "global_step": 165136, "epoch": 982} {"train_loss": -10.716448783874512, "global_step": 165137, "epoch": 982} {"train_loss": -10.460477828979492, "global_step": 165138, "epoch": 982} {"train_loss": -10.476462364196777, "global_step": 165139, "epoch": 982} {"train_loss": -10.59781551361084, "global_step": 165140, "epoch": 982} {"train_loss": -10.50620174407959, "global_step": 165141, "epoch": 982} {"train_loss": -10.466632843017578, "global_step": 165142, "epoch": 982} {"train_loss": -10.609352222510747, "global_step": 165143, "epoch": 982, "val_loss": 230906.609375} {"train_loss": -10.562715530395508, "global_step": 165144, "epoch": 983} {"train_loss": -10.580036163330078, "global_step": 165145, "epoch": 983} {"train_loss": -10.582000732421875, "global_step": 165146, "epoch": 983} {"train_loss": -10.481937408447266, "global_step": 165147, "epoch": 983} {"train_loss": -10.506423950195312, "global_step": 165148, "epoch": 983} {"train_loss": -10.333314895629883, "global_step": 165149, "epoch": 983} {"train_loss": -10.6497802734375, "global_step": 165150, "epoch": 983} {"train_loss": -10.833707809448242, "global_step": 165151, "epoch": 983} {"train_loss": -10.661457061767578, "global_step": 165152, "epoch": 983} {"train_loss": -10.76093864440918, "global_step": 165153, "epoch": 983} {"train_loss": -10.954971313476562, "global_step": 165154, "epoch": 983} {"train_loss": -10.573530197143555, "global_step": 165155, "epoch": 983} {"train_loss": -10.487892150878906, "global_step": 165156, "epoch": 983} {"train_loss": -10.796283721923828, "global_step": 165157, "epoch": 983} {"train_loss": -10.902209281921387, "global_step": 165158, "epoch": 983} {"train_loss": -10.66332721710205, "global_step": 165159, "epoch": 983} {"train_loss": -10.851633071899414, "global_step": 165160, "epoch": 983} {"train_loss": -10.826287269592285, "global_step": 165161, "epoch": 983} {"train_loss": -10.904847145080566, "global_step": 165162, "epoch": 983} {"train_loss": -10.832816123962402, "global_step": 165163, "epoch": 983} {"train_loss": -11.091238021850586, "global_step": 165164, "epoch": 983} {"train_loss": -10.954516410827637, "global_step": 165165, "epoch": 983} {"train_loss": -11.011128425598145, "global_step": 165166, "epoch": 983} {"train_loss": -10.970602035522461, "global_step": 165167, "epoch": 983} {"train_loss": -10.886109352111816, "global_step": 165168, "epoch": 983} {"train_loss": -11.054704666137695, "global_step": 165169, "epoch": 983} {"train_loss": -11.017366409301758, "global_step": 165170, "epoch": 983} {"train_loss": -11.153169631958008, "global_step": 165171, "epoch": 983} {"train_loss": -11.062688827514648, "global_step": 165172, "epoch": 983} {"train_loss": -11.197395324707031, "global_step": 165173, "epoch": 983} {"train_loss": -11.072376251220703, "global_step": 165174, "epoch": 983} {"train_loss": -11.035289764404297, "global_step": 165175, "epoch": 983} {"train_loss": -11.37187385559082, "global_step": 165176, "epoch": 983} {"train_loss": -11.126352310180664, "global_step": 165177, "epoch": 983} {"train_loss": -11.11124038696289, "global_step": 165178, "epoch": 983} {"train_loss": -11.096561431884766, "global_step": 165179, "epoch": 983} {"train_loss": -10.988672256469727, "global_step": 165180, "epoch": 983} {"train_loss": -11.205472946166992, "global_step": 165181, "epoch": 983} {"train_loss": -10.942730903625488, "global_step": 165182, "epoch": 983} {"train_loss": -11.105936050415039, "global_step": 165183, "epoch": 983} {"train_loss": -10.988672256469727, "global_step": 165184, "epoch": 983} {"train_loss": -11.022281646728516, "global_step": 165185, "epoch": 983} {"train_loss": -10.732036590576172, "global_step": 165186, "epoch": 983} {"train_loss": -10.345630645751953, "global_step": 165187, "epoch": 983} {"train_loss": -10.951034545898438, "global_step": 165188, "epoch": 983} {"train_loss": -10.6187105178833, "global_step": 165189, "epoch": 983} {"train_loss": -10.642866134643555, "global_step": 165190, "epoch": 983} {"train_loss": -10.574249267578125, "global_step": 165191, "epoch": 983} {"train_loss": -11.28478717803955, "global_step": 165192, "epoch": 983} {"train_loss": -10.46982192993164, "global_step": 165193, "epoch": 983} {"train_loss": -11.044634819030762, "global_step": 165194, "epoch": 983} {"train_loss": -10.765542984008789, "global_step": 165195, "epoch": 983} {"train_loss": -9.620403289794922, "global_step": 165196, "epoch": 983} {"train_loss": -10.818496704101562, "global_step": 165197, "epoch": 983} {"train_loss": -10.496006965637207, "global_step": 165198, "epoch": 983} {"train_loss": -10.169981002807617, "global_step": 165199, "epoch": 983} {"train_loss": -11.006847381591797, "global_step": 165200, "epoch": 983} {"train_loss": -10.916184425354004, "global_step": 165201, "epoch": 983} {"train_loss": -11.045434951782227, "global_step": 165202, "epoch": 983} {"train_loss": -10.884105682373047, "global_step": 165203, "epoch": 983} {"train_loss": -10.774256706237793, "global_step": 165204, "epoch": 983} {"train_loss": -10.045160293579102, "global_step": 165205, "epoch": 983} {"train_loss": -10.901172637939453, "global_step": 165206, "epoch": 983} {"train_loss": -10.536066055297852, "global_step": 165207, "epoch": 983} {"train_loss": -10.698232650756836, "global_step": 165208, "epoch": 983} {"train_loss": -10.399402618408203, "global_step": 165209, "epoch": 983} {"train_loss": -10.850557327270508, "global_step": 165210, "epoch": 983} {"train_loss": -10.662434577941895, "global_step": 165211, "epoch": 983} {"train_loss": -10.29537582397461, "global_step": 165212, "epoch": 983} {"train_loss": -10.944955825805664, "global_step": 165213, "epoch": 983} {"train_loss": -10.773609161376953, "global_step": 165214, "epoch": 983} {"train_loss": -11.0604887008667, "global_step": 165215, "epoch": 983} {"train_loss": -10.678993225097656, "global_step": 165216, "epoch": 983} {"train_loss": -11.166021347045898, "global_step": 165217, "epoch": 983} {"train_loss": -10.947307586669922, "global_step": 165218, "epoch": 983} {"train_loss": -10.832345962524414, "global_step": 165219, "epoch": 983} {"train_loss": -11.051460266113281, "global_step": 165220, "epoch": 983} {"train_loss": -10.915267944335938, "global_step": 165221, "epoch": 983} {"train_loss": -11.019180297851562, "global_step": 165222, "epoch": 983} {"train_loss": -11.063558578491211, "global_step": 165223, "epoch": 983} {"train_loss": -11.150769233703613, "global_step": 165224, "epoch": 983} {"train_loss": -11.031582832336426, "global_step": 165225, "epoch": 983} {"train_loss": -11.08875846862793, "global_step": 165226, "epoch": 983} {"train_loss": -11.026130676269531, "global_step": 165227, "epoch": 983} {"train_loss": -11.014741897583008, "global_step": 165228, "epoch": 983} {"train_loss": -11.167886734008789, "global_step": 165229, "epoch": 983} {"train_loss": -10.985669136047363, "global_step": 165230, "epoch": 983} {"train_loss": -10.901701927185059, "global_step": 165231, "epoch": 983} {"train_loss": -10.729461669921875, "global_step": 165232, "epoch": 983} {"train_loss": -11.178146362304688, "global_step": 165233, "epoch": 983} {"train_loss": -10.473482131958008, "global_step": 165234, "epoch": 983} {"train_loss": -10.976255416870117, "global_step": 165235, "epoch": 983} {"train_loss": -10.768593788146973, "global_step": 165236, "epoch": 983} {"train_loss": -10.668512344360352, "global_step": 165237, "epoch": 983} {"train_loss": -10.89535140991211, "global_step": 165238, "epoch": 983} {"train_loss": -10.881429672241211, "global_step": 165239, "epoch": 983} {"train_loss": -10.636155128479004, "global_step": 165240, "epoch": 983} {"train_loss": -10.932592391967773, "global_step": 165241, "epoch": 983} {"train_loss": -10.833145141601562, "global_step": 165242, "epoch": 983} {"train_loss": -10.779428482055664, "global_step": 165243, "epoch": 983} {"train_loss": -10.794456481933594, "global_step": 165244, "epoch": 983} {"train_loss": -10.651275634765625, "global_step": 165245, "epoch": 983} {"train_loss": -11.081558227539062, "global_step": 165246, "epoch": 983} {"train_loss": -10.956583023071289, "global_step": 165247, "epoch": 983} {"train_loss": -10.358336448669434, "global_step": 165248, "epoch": 983} {"train_loss": -10.952157020568848, "global_step": 165249, "epoch": 983} {"train_loss": -10.99284553527832, "global_step": 165250, "epoch": 983} {"train_loss": -10.974614143371582, "global_step": 165251, "epoch": 983} {"train_loss": -11.1036958694458, "global_step": 165252, "epoch": 983} {"train_loss": -11.168218612670898, "global_step": 165253, "epoch": 983} {"train_loss": -11.315229415893555, "global_step": 165254, "epoch": 983} {"train_loss": -10.803030014038086, "global_step": 165255, "epoch": 983} {"train_loss": -11.166716575622559, "global_step": 165256, "epoch": 983} {"train_loss": -11.152251243591309, "global_step": 165257, "epoch": 983} {"train_loss": -11.068565368652344, "global_step": 165258, "epoch": 983} {"train_loss": -11.060998916625977, "global_step": 165259, "epoch": 983} {"train_loss": -10.870214462280273, "global_step": 165260, "epoch": 983} {"train_loss": -11.271178245544434, "global_step": 165261, "epoch": 983} {"train_loss": -11.176345825195312, "global_step": 165262, "epoch": 983} {"train_loss": -11.047693252563477, "global_step": 165263, "epoch": 983} {"train_loss": -11.097991943359375, "global_step": 165264, "epoch": 983} {"train_loss": -11.145206451416016, "global_step": 165265, "epoch": 983} {"train_loss": -11.100198745727539, "global_step": 165266, "epoch": 983} {"train_loss": -11.181432723999023, "global_step": 165267, "epoch": 983} {"train_loss": -11.097131729125977, "global_step": 165268, "epoch": 983} {"train_loss": -11.241902351379395, "global_step": 165269, "epoch": 983} {"train_loss": -11.176276206970215, "global_step": 165270, "epoch": 983} {"train_loss": -10.98458480834961, "global_step": 165271, "epoch": 983} {"train_loss": -10.918224334716797, "global_step": 165272, "epoch": 983} {"train_loss": -11.128133773803711, "global_step": 165273, "epoch": 983} {"train_loss": -10.88014030456543, "global_step": 165274, "epoch": 983} {"train_loss": -11.341829299926758, "global_step": 165275, "epoch": 983} {"train_loss": -11.094844818115234, "global_step": 165276, "epoch": 983} {"train_loss": -10.477046966552734, "global_step": 165277, "epoch": 983} {"train_loss": -10.959123611450195, "global_step": 165278, "epoch": 983} {"train_loss": -11.216705322265625, "global_step": 165279, "epoch": 983} {"train_loss": -10.390402793884277, "global_step": 165280, "epoch": 983} {"train_loss": -10.944162368774414, "global_step": 165281, "epoch": 983} {"train_loss": -10.344518661499023, "global_step": 165282, "epoch": 983} {"train_loss": -9.909099578857422, "global_step": 165283, "epoch": 983} {"train_loss": -10.520450592041016, "global_step": 165284, "epoch": 983} {"train_loss": -10.672233581542969, "global_step": 165285, "epoch": 983} {"train_loss": -9.707590103149414, "global_step": 165286, "epoch": 983} {"train_loss": -10.968812942504883, "global_step": 165287, "epoch": 983} {"train_loss": -10.502813339233398, "global_step": 165288, "epoch": 983} {"train_loss": -10.739612579345703, "global_step": 165289, "epoch": 983} {"train_loss": -10.658546447753906, "global_step": 165290, "epoch": 983} {"train_loss": -10.299067497253418, "global_step": 165291, "epoch": 983} {"train_loss": -10.788286209106445, "global_step": 165292, "epoch": 983} {"train_loss": -10.21173095703125, "global_step": 165293, "epoch": 983} {"train_loss": -10.421622276306152, "global_step": 165294, "epoch": 983} {"train_loss": -10.580583572387695, "global_step": 165295, "epoch": 983} {"train_loss": -10.774060249328613, "global_step": 165296, "epoch": 983} {"train_loss": -10.390701293945312, "global_step": 165297, "epoch": 983} {"train_loss": -10.884183883666992, "global_step": 165298, "epoch": 983} {"train_loss": -10.561264038085938, "global_step": 165299, "epoch": 983} {"train_loss": -10.593022346496582, "global_step": 165300, "epoch": 983} {"train_loss": -10.618093490600586, "global_step": 165301, "epoch": 983} {"train_loss": -10.49789047241211, "global_step": 165302, "epoch": 983} {"train_loss": -10.810676574707031, "global_step": 165303, "epoch": 983} {"train_loss": -10.366782188415527, "global_step": 165304, "epoch": 983} {"train_loss": -10.821667671203613, "global_step": 165305, "epoch": 983} {"train_loss": -10.34549617767334, "global_step": 165306, "epoch": 983} {"train_loss": -11.017324447631836, "global_step": 165307, "epoch": 983} {"train_loss": -10.462625503540039, "global_step": 165308, "epoch": 983} {"train_loss": -11.032114028930664, "global_step": 165309, "epoch": 983} {"train_loss": -10.711158752441406, "global_step": 165310, "epoch": 983} {"train_loss": -10.82595579964774, "global_step": 165311, "epoch": 983, "val_loss": 233630.84375} {"train_loss": -10.829266548156738, "global_step": 165312, "epoch": 984} {"train_loss": -10.923219680786133, "global_step": 165313, "epoch": 984} {"train_loss": -10.717671394348145, "global_step": 165314, "epoch": 984} {"train_loss": -10.999045372009277, "global_step": 165315, "epoch": 984} {"train_loss": -10.959882736206055, "global_step": 165316, "epoch": 984} {"train_loss": -10.879499435424805, "global_step": 165317, "epoch": 984} {"train_loss": -10.93998908996582, "global_step": 165318, "epoch": 984} {"train_loss": -11.183891296386719, "global_step": 165319, "epoch": 984} {"train_loss": -10.86160945892334, "global_step": 165320, "epoch": 984} {"train_loss": -11.137269973754883, "global_step": 165321, "epoch": 984} {"train_loss": -11.145618438720703, "global_step": 165322, "epoch": 984} {"train_loss": -11.051980018615723, "global_step": 165323, "epoch": 984} {"train_loss": -11.08425521850586, "global_step": 165324, "epoch": 984} {"train_loss": -11.070266723632812, "global_step": 165325, "epoch": 984} {"train_loss": -11.001302719116211, "global_step": 165326, "epoch": 984} {"train_loss": -11.188470840454102, "global_step": 165327, "epoch": 984} {"train_loss": -11.071748733520508, "global_step": 165328, "epoch": 984} {"train_loss": -10.949810981750488, "global_step": 165329, "epoch": 984} {"train_loss": -11.21545124053955, "global_step": 165330, "epoch": 984} {"train_loss": -11.091503143310547, "global_step": 165331, "epoch": 984} {"train_loss": -11.179239273071289, "global_step": 165332, "epoch": 984} {"train_loss": -11.02618408203125, "global_step": 165333, "epoch": 984} {"train_loss": -11.047412872314453, "global_step": 165334, "epoch": 984} {"train_loss": -11.283844947814941, "global_step": 165335, "epoch": 984} {"train_loss": -11.051025390625, "global_step": 165336, "epoch": 984} {"train_loss": -11.213403701782227, "global_step": 165337, "epoch": 984} {"train_loss": -11.089242935180664, "global_step": 165338, "epoch": 984} {"train_loss": -11.158808708190918, "global_step": 165339, "epoch": 984} {"train_loss": -11.06645393371582, "global_step": 165340, "epoch": 984} {"train_loss": -11.09315013885498, "global_step": 165341, "epoch": 984} {"train_loss": -11.29611873626709, "global_step": 165342, "epoch": 984} {"train_loss": -10.979022979736328, "global_step": 165343, "epoch": 984} {"train_loss": -11.360865592956543, "global_step": 165344, "epoch": 984} {"train_loss": -11.009495735168457, "global_step": 165345, "epoch": 984} {"train_loss": -11.157776832580566, "global_step": 165346, "epoch": 984} {"train_loss": -11.200492858886719, "global_step": 165347, "epoch": 984} {"train_loss": -10.90079116821289, "global_step": 165348, "epoch": 984} {"train_loss": -10.774983406066895, "global_step": 165349, "epoch": 984} {"train_loss": -11.148176193237305, "global_step": 165350, "epoch": 984} {"train_loss": -10.98103141784668, "global_step": 165351, "epoch": 984} {"train_loss": -10.984511375427246, "global_step": 165352, "epoch": 984} {"train_loss": -11.443120002746582, "global_step": 165353, "epoch": 984} {"train_loss": -10.95370864868164, "global_step": 165354, "epoch": 984} {"train_loss": -11.233237266540527, "global_step": 165355, "epoch": 984} {"train_loss": -11.049196243286133, "global_step": 165356, "epoch": 984} {"train_loss": -11.057038307189941, "global_step": 165357, "epoch": 984} {"train_loss": -11.343122482299805, "global_step": 165358, "epoch": 984} {"train_loss": -11.056382179260254, "global_step": 165359, "epoch": 984} {"train_loss": -10.732406616210938, "global_step": 165360, "epoch": 984} {"train_loss": -11.152530670166016, "global_step": 165361, "epoch": 984} {"train_loss": -10.943551063537598, "global_step": 165362, "epoch": 984} {"train_loss": -10.252910614013672, "global_step": 165363, "epoch": 984} {"train_loss": -10.439582824707031, "global_step": 165364, "epoch": 984} {"train_loss": -10.087247848510742, "global_step": 165365, "epoch": 984} {"train_loss": -11.037986755371094, "global_step": 165366, "epoch": 984} {"train_loss": -11.02668571472168, "global_step": 165367, "epoch": 984} {"train_loss": -10.26708984375, "global_step": 165368, "epoch": 984} {"train_loss": -11.177286148071289, "global_step": 165369, "epoch": 984} {"train_loss": -10.420809745788574, "global_step": 165370, "epoch": 984} {"train_loss": -11.013803482055664, "global_step": 165371, "epoch": 984} {"train_loss": -10.510751724243164, "global_step": 165372, "epoch": 984} {"train_loss": -10.795469284057617, "global_step": 165373, "epoch": 984} {"train_loss": -10.17413330078125, "global_step": 165374, "epoch": 984} {"train_loss": -10.982640266418457, "global_step": 165375, "epoch": 984} {"train_loss": -10.940736770629883, "global_step": 165376, "epoch": 984} {"train_loss": -10.47560977935791, "global_step": 165377, "epoch": 984} {"train_loss": -10.875920295715332, "global_step": 165378, "epoch": 984} {"train_loss": -10.260896682739258, "global_step": 165379, "epoch": 984} {"train_loss": -10.854339599609375, "global_step": 165380, "epoch": 984} {"train_loss": -10.258478164672852, "global_step": 165381, "epoch": 984} {"train_loss": -10.786825180053711, "global_step": 165382, "epoch": 984} {"train_loss": -10.207578659057617, "global_step": 165383, "epoch": 984} {"train_loss": -10.282806396484375, "global_step": 165384, "epoch": 984} {"train_loss": -10.785860061645508, "global_step": 165385, "epoch": 984} {"train_loss": -10.477685928344727, "global_step": 165386, "epoch": 984} {"train_loss": -10.807527542114258, "global_step": 165387, "epoch": 984} {"train_loss": -10.238245964050293, "global_step": 165388, "epoch": 984} {"train_loss": -10.952703475952148, "global_step": 165389, "epoch": 984} {"train_loss": -10.739967346191406, "global_step": 165390, "epoch": 984} {"train_loss": -10.497915267944336, "global_step": 165391, "epoch": 984} {"train_loss": -10.630451202392578, "global_step": 165392, "epoch": 984} {"train_loss": -10.39136028289795, "global_step": 165393, "epoch": 984} {"train_loss": -10.633047103881836, "global_step": 165394, "epoch": 984} {"train_loss": -10.69430160522461, "global_step": 165395, "epoch": 984} {"train_loss": -11.037775993347168, "global_step": 165396, "epoch": 984} {"train_loss": -10.829683303833008, "global_step": 165397, "epoch": 984} {"train_loss": -11.048924446105957, "global_step": 165398, "epoch": 984} {"train_loss": -10.945871353149414, "global_step": 165399, "epoch": 984} {"train_loss": -11.059591293334961, "global_step": 165400, "epoch": 984} {"train_loss": -11.099209785461426, "global_step": 165401, "epoch": 984} {"train_loss": -11.118498802185059, "global_step": 165402, "epoch": 984} {"train_loss": -10.983552932739258, "global_step": 165403, "epoch": 984} {"train_loss": -10.99154281616211, "global_step": 165404, "epoch": 984} {"train_loss": -10.95224380493164, "global_step": 165405, "epoch": 984} {"train_loss": -11.092716217041016, "global_step": 165406, "epoch": 984} {"train_loss": -10.855874061584473, "global_step": 165407, "epoch": 984} {"train_loss": -11.182060241699219, "global_step": 165408, "epoch": 984} {"train_loss": -11.000728607177734, "global_step": 165409, "epoch": 984} {"train_loss": -10.822888374328613, "global_step": 165410, "epoch": 984} {"train_loss": -10.638629913330078, "global_step": 165411, "epoch": 984} {"train_loss": -11.031305313110352, "global_step": 165412, "epoch": 984} {"train_loss": -10.618420600891113, "global_step": 165413, "epoch": 984} {"train_loss": -10.999773025512695, "global_step": 165414, "epoch": 984} {"train_loss": -10.838325500488281, "global_step": 165415, "epoch": 984} {"train_loss": -10.762431144714355, "global_step": 165416, "epoch": 984} {"train_loss": -11.008586883544922, "global_step": 165417, "epoch": 984} {"train_loss": -10.93189811706543, "global_step": 165418, "epoch": 984} {"train_loss": -10.911749839782715, "global_step": 165419, "epoch": 984} {"train_loss": -10.67202377319336, "global_step": 165420, "epoch": 984} {"train_loss": -10.796921730041504, "global_step": 165421, "epoch": 984} {"train_loss": -10.559473991394043, "global_step": 165422, "epoch": 984} {"train_loss": -11.083200454711914, "global_step": 165423, "epoch": 984} {"train_loss": -10.92453384399414, "global_step": 165424, "epoch": 984} {"train_loss": -11.001678466796875, "global_step": 165425, "epoch": 984} {"train_loss": -10.94156265258789, "global_step": 165426, "epoch": 984} {"train_loss": -11.117598533630371, "global_step": 165427, "epoch": 984} {"train_loss": -10.842845916748047, "global_step": 165428, "epoch": 984} {"train_loss": -11.040180206298828, "global_step": 165429, "epoch": 984} {"train_loss": -10.612737655639648, "global_step": 165430, "epoch": 984} {"train_loss": -10.773195266723633, "global_step": 165431, "epoch": 984} {"train_loss": -10.843405723571777, "global_step": 165432, "epoch": 984} {"train_loss": -10.899604797363281, "global_step": 165433, "epoch": 984} {"train_loss": -10.9634370803833, "global_step": 165434, "epoch": 984} {"train_loss": -10.606953620910645, "global_step": 165435, "epoch": 984} {"train_loss": -10.8726167678833, "global_step": 165436, "epoch": 984} {"train_loss": -10.823962211608887, "global_step": 165437, "epoch": 984} {"train_loss": -11.131847381591797, "global_step": 165438, "epoch": 984} {"train_loss": -10.996124267578125, "global_step": 165439, "epoch": 984} {"train_loss": -11.073505401611328, "global_step": 165440, "epoch": 984} {"train_loss": -11.13320255279541, "global_step": 165441, "epoch": 984} {"train_loss": -11.091897964477539, "global_step": 165442, "epoch": 984} {"train_loss": -10.731303215026855, "global_step": 165443, "epoch": 984} {"train_loss": -10.869796752929688, "global_step": 165444, "epoch": 984} {"train_loss": -10.407464981079102, "global_step": 165445, "epoch": 984} {"train_loss": -10.742889404296875, "global_step": 165446, "epoch": 984} {"train_loss": -10.52763557434082, "global_step": 165447, "epoch": 984} {"train_loss": -10.347139358520508, "global_step": 165448, "epoch": 984} {"train_loss": -10.632880210876465, "global_step": 165449, "epoch": 984} {"train_loss": -10.026180267333984, "global_step": 165450, "epoch": 984} {"train_loss": -10.600664138793945, "global_step": 165451, "epoch": 984} {"train_loss": -9.87510871887207, "global_step": 165452, "epoch": 984} {"train_loss": -10.861978530883789, "global_step": 165453, "epoch": 984} {"train_loss": -10.460101127624512, "global_step": 165454, "epoch": 984} {"train_loss": -10.35501766204834, "global_step": 165455, "epoch": 984} {"train_loss": -10.340381622314453, "global_step": 165456, "epoch": 984} {"train_loss": -9.992979049682617, "global_step": 165457, "epoch": 984} {"train_loss": -10.40864372253418, "global_step": 165458, "epoch": 984} {"train_loss": -10.687642097473145, "global_step": 165459, "epoch": 984} {"train_loss": -10.093640327453613, "global_step": 165460, "epoch": 984} {"train_loss": -10.496171951293945, "global_step": 165461, "epoch": 984} {"train_loss": -10.330055236816406, "global_step": 165462, "epoch": 984} {"train_loss": -9.872079849243164, "global_step": 165463, "epoch": 984} {"train_loss": -10.427894592285156, "global_step": 165464, "epoch": 984} {"train_loss": -10.040742874145508, "global_step": 165465, "epoch": 984} {"train_loss": -10.855942726135254, "global_step": 165466, "epoch": 984} {"train_loss": -10.01164436340332, "global_step": 165467, "epoch": 984} {"train_loss": -11.000149726867676, "global_step": 165468, "epoch": 984} {"train_loss": -10.43759536743164, "global_step": 165469, "epoch": 984} {"train_loss": -10.858259201049805, "global_step": 165470, "epoch": 984} {"train_loss": -10.119014739990234, "global_step": 165471, "epoch": 984} {"train_loss": -10.726410865783691, "global_step": 165472, "epoch": 984} {"train_loss": -10.417177200317383, "global_step": 165473, "epoch": 984} {"train_loss": -10.74460220336914, "global_step": 165474, "epoch": 984} {"train_loss": -10.835077285766602, "global_step": 165475, "epoch": 984} {"train_loss": -10.937071800231934, "global_step": 165476, "epoch": 984} {"train_loss": -11.08464241027832, "global_step": 165477, "epoch": 984} {"train_loss": -11.000946044921875, "global_step": 165478, "epoch": 984} {"train_loss": -10.813824335734049, "global_step": 165479, "epoch": 984, "val_loss": 237223.65625} {"train_loss": -10.817140579223633, "global_step": 165480, "epoch": 985} {"train_loss": -10.958976745605469, "global_step": 165481, "epoch": 985} {"train_loss": -10.784714698791504, "global_step": 165482, "epoch": 985} {"train_loss": -10.974668502807617, "global_step": 165483, "epoch": 985} {"train_loss": -10.92343521118164, "global_step": 165484, "epoch": 985} {"train_loss": -10.671647071838379, "global_step": 165485, "epoch": 985} {"train_loss": -10.82032585144043, "global_step": 165486, "epoch": 985} {"train_loss": -10.990944862365723, "global_step": 165487, "epoch": 985} {"train_loss": -10.798980712890625, "global_step": 165488, "epoch": 985} {"train_loss": -11.032491683959961, "global_step": 165489, "epoch": 985} {"train_loss": -10.998381614685059, "global_step": 165490, "epoch": 985} {"train_loss": -10.920220375061035, "global_step": 165491, "epoch": 985} {"train_loss": -11.034693717956543, "global_step": 165492, "epoch": 985} {"train_loss": -10.993759155273438, "global_step": 165493, "epoch": 985} {"train_loss": -11.116532325744629, "global_step": 165494, "epoch": 985} {"train_loss": -11.071596145629883, "global_step": 165495, "epoch": 985} {"train_loss": -11.101171493530273, "global_step": 165496, "epoch": 985} {"train_loss": -11.005964279174805, "global_step": 165497, "epoch": 985} {"train_loss": -10.953035354614258, "global_step": 165498, "epoch": 985} {"train_loss": -10.998483657836914, "global_step": 165499, "epoch": 985} {"train_loss": -11.16503620147705, "global_step": 165500, "epoch": 985} {"train_loss": -11.069961547851562, "global_step": 165501, "epoch": 985} {"train_loss": -11.042296409606934, "global_step": 165502, "epoch": 985} {"train_loss": -11.085216522216797, "global_step": 165503, "epoch": 985} {"train_loss": -11.064929962158203, "global_step": 165504, "epoch": 985} {"train_loss": -11.174007415771484, "global_step": 165505, "epoch": 985} {"train_loss": -11.042726516723633, "global_step": 165506, "epoch": 985} {"train_loss": -10.82147216796875, "global_step": 165507, "epoch": 985} {"train_loss": -11.152822494506836, "global_step": 165508, "epoch": 985} {"train_loss": -10.550914764404297, "global_step": 165509, "epoch": 985} {"train_loss": -10.94062614440918, "global_step": 165510, "epoch": 985} {"train_loss": -10.956520080566406, "global_step": 165511, "epoch": 985} {"train_loss": -11.019529342651367, "global_step": 165512, "epoch": 985} {"train_loss": -11.116626739501953, "global_step": 165513, "epoch": 985} {"train_loss": -11.109979629516602, "global_step": 165514, "epoch": 985} {"train_loss": -11.077899932861328, "global_step": 165515, "epoch": 985} {"train_loss": -11.204602241516113, "global_step": 165516, "epoch": 985} {"train_loss": -10.929786682128906, "global_step": 165517, "epoch": 985} {"train_loss": -10.959259986877441, "global_step": 165518, "epoch": 985} {"train_loss": -10.82761287689209, "global_step": 165519, "epoch": 985} {"train_loss": -10.704437255859375, "global_step": 165520, "epoch": 985} {"train_loss": -11.403898239135742, "global_step": 165521, "epoch": 985} {"train_loss": -10.610299110412598, "global_step": 165522, "epoch": 985} {"train_loss": -11.182024002075195, "global_step": 165523, "epoch": 985} {"train_loss": -10.5360689163208, "global_step": 165524, "epoch": 985} {"train_loss": -11.056658744812012, "global_step": 165525, "epoch": 985} {"train_loss": -10.90869140625, "global_step": 165526, "epoch": 985} {"train_loss": -10.929484367370605, "global_step": 165527, "epoch": 985} {"train_loss": -11.345298767089844, "global_step": 165528, "epoch": 985} {"train_loss": -10.571698188781738, "global_step": 165529, "epoch": 985} {"train_loss": -11.077178955078125, "global_step": 165530, "epoch": 985} {"train_loss": -11.19708251953125, "global_step": 165531, "epoch": 985} {"train_loss": -11.169472694396973, "global_step": 165532, "epoch": 985} {"train_loss": -11.016414642333984, "global_step": 165533, "epoch": 985} {"train_loss": -11.086000442504883, "global_step": 165534, "epoch": 985} {"train_loss": -10.947717666625977, "global_step": 165535, "epoch": 985} {"train_loss": -11.059228897094727, "global_step": 165536, "epoch": 985} {"train_loss": -11.20503044128418, "global_step": 165537, "epoch": 985} {"train_loss": -10.911439895629883, "global_step": 165538, "epoch": 985} {"train_loss": -10.925933837890625, "global_step": 165539, "epoch": 985} {"train_loss": -10.90693187713623, "global_step": 165540, "epoch": 985} {"train_loss": -10.807241439819336, "global_step": 165541, "epoch": 985} {"train_loss": -10.971556663513184, "global_step": 165542, "epoch": 985} {"train_loss": -11.103666305541992, "global_step": 165543, "epoch": 985} {"train_loss": -11.029241561889648, "global_step": 165544, "epoch": 985} {"train_loss": -10.757347106933594, "global_step": 165545, "epoch": 985} {"train_loss": -11.191298484802246, "global_step": 165546, "epoch": 985} {"train_loss": -11.241602897644043, "global_step": 165547, "epoch": 985} {"train_loss": -10.83594799041748, "global_step": 165548, "epoch": 985} {"train_loss": -10.68011474609375, "global_step": 165549, "epoch": 985} {"train_loss": -11.084181785583496, "global_step": 165550, "epoch": 985} {"train_loss": -10.645698547363281, "global_step": 165551, "epoch": 985} {"train_loss": -11.315439224243164, "global_step": 165552, "epoch": 985} {"train_loss": -10.974781036376953, "global_step": 165553, "epoch": 985} {"train_loss": -10.944259643554688, "global_step": 165554, "epoch": 985} {"train_loss": -11.255025863647461, "global_step": 165555, "epoch": 985} {"train_loss": -10.971132278442383, "global_step": 165556, "epoch": 985} {"train_loss": -10.961821556091309, "global_step": 165557, "epoch": 985} {"train_loss": -10.548971176147461, "global_step": 165558, "epoch": 985} {"train_loss": -10.618207931518555, "global_step": 165559, "epoch": 985} {"train_loss": -11.035696983337402, "global_step": 165560, "epoch": 985} {"train_loss": -10.525586128234863, "global_step": 165561, "epoch": 985} {"train_loss": -10.889814376831055, "global_step": 165562, "epoch": 985} {"train_loss": -11.117311477661133, "global_step": 165563, "epoch": 985} {"train_loss": -11.054864883422852, "global_step": 165564, "epoch": 985} {"train_loss": -10.773796081542969, "global_step": 165565, "epoch": 985} {"train_loss": -10.940382957458496, "global_step": 165566, "epoch": 985} {"train_loss": -10.848590850830078, "global_step": 165567, "epoch": 985} {"train_loss": -10.775472640991211, "global_step": 165568, "epoch": 985} {"train_loss": -11.196260452270508, "global_step": 165569, "epoch": 985} {"train_loss": -10.938629150390625, "global_step": 165570, "epoch": 985} {"train_loss": -11.226221084594727, "global_step": 165571, "epoch": 985} {"train_loss": -11.141717910766602, "global_step": 165572, "epoch": 985} {"train_loss": -10.912392616271973, "global_step": 165573, "epoch": 985} {"train_loss": -11.153532028198242, "global_step": 165574, "epoch": 985} {"train_loss": -11.186721801757812, "global_step": 165575, "epoch": 985} {"train_loss": -11.263359069824219, "global_step": 165576, "epoch": 985} {"train_loss": -11.236015319824219, "global_step": 165577, "epoch": 985} {"train_loss": -11.232240676879883, "global_step": 165578, "epoch": 985} {"train_loss": -10.762079238891602, "global_step": 165579, "epoch": 985} {"train_loss": -10.912580490112305, "global_step": 165580, "epoch": 985} {"train_loss": -10.952696800231934, "global_step": 165581, "epoch": 985} {"train_loss": -11.269092559814453, "global_step": 165582, "epoch": 985} {"train_loss": -11.321395874023438, "global_step": 165583, "epoch": 985} {"train_loss": -11.245647430419922, "global_step": 165584, "epoch": 985} {"train_loss": -10.657384872436523, "global_step": 165585, "epoch": 985} {"train_loss": -10.983190536499023, "global_step": 165586, "epoch": 985} {"train_loss": -10.601099967956543, "global_step": 165587, "epoch": 985} {"train_loss": -10.933690071105957, "global_step": 165588, "epoch": 985} {"train_loss": -11.09309196472168, "global_step": 165589, "epoch": 985} {"train_loss": -11.066200256347656, "global_step": 165590, "epoch": 985} {"train_loss": -10.579095840454102, "global_step": 165591, "epoch": 985} {"train_loss": -11.160195350646973, "global_step": 165592, "epoch": 985} {"train_loss": -10.784358024597168, "global_step": 165593, "epoch": 985} {"train_loss": -10.777911186218262, "global_step": 165594, "epoch": 985} {"train_loss": -10.909401893615723, "global_step": 165595, "epoch": 985} {"train_loss": -10.552862167358398, "global_step": 165596, "epoch": 985} {"train_loss": -10.78257942199707, "global_step": 165597, "epoch": 985} {"train_loss": -10.510469436645508, "global_step": 165598, "epoch": 985} {"train_loss": -10.933740615844727, "global_step": 165599, "epoch": 985} {"train_loss": -10.655184745788574, "global_step": 165600, "epoch": 985} {"train_loss": -11.00932502746582, "global_step": 165601, "epoch": 985} {"train_loss": -10.75885009765625, "global_step": 165602, "epoch": 985} {"train_loss": -10.75686264038086, "global_step": 165603, "epoch": 985} {"train_loss": -10.807308197021484, "global_step": 165604, "epoch": 985} {"train_loss": -10.039708137512207, "global_step": 165605, "epoch": 985} {"train_loss": -11.053779602050781, "global_step": 165606, "epoch": 985} {"train_loss": -10.494918823242188, "global_step": 165607, "epoch": 985} {"train_loss": -10.563255310058594, "global_step": 165608, "epoch": 985} {"train_loss": -10.47612476348877, "global_step": 165609, "epoch": 985} {"train_loss": -10.46981430053711, "global_step": 165610, "epoch": 985} {"train_loss": -11.058782577514648, "global_step": 165611, "epoch": 985} {"train_loss": -10.454862594604492, "global_step": 165612, "epoch": 985} {"train_loss": -10.69010066986084, "global_step": 165613, "epoch": 985} {"train_loss": -10.599443435668945, "global_step": 165614, "epoch": 985} {"train_loss": -10.719993591308594, "global_step": 165615, "epoch": 985} {"train_loss": -10.55091381072998, "global_step": 165616, "epoch": 985} {"train_loss": -10.665124893188477, "global_step": 165617, "epoch": 985} {"train_loss": -10.86789608001709, "global_step": 165618, "epoch": 985} {"train_loss": -10.722145080566406, "global_step": 165619, "epoch": 985} {"train_loss": -10.908435821533203, "global_step": 165620, "epoch": 985} {"train_loss": -10.775710105895996, "global_step": 165621, "epoch": 985} {"train_loss": -10.779180526733398, "global_step": 165622, "epoch": 985} {"train_loss": -11.005168914794922, "global_step": 165623, "epoch": 985} {"train_loss": -10.26523208618164, "global_step": 165624, "epoch": 985} {"train_loss": -10.91545581817627, "global_step": 165625, "epoch": 985} {"train_loss": -10.321803092956543, "global_step": 165626, "epoch": 985} {"train_loss": -10.741016387939453, "global_step": 165627, "epoch": 985} {"train_loss": -10.248764991760254, "global_step": 165628, "epoch": 985} {"train_loss": -10.6823148727417, "global_step": 165629, "epoch": 985} {"train_loss": -10.21611213684082, "global_step": 165630, "epoch": 985} {"train_loss": -10.300496101379395, "global_step": 165631, "epoch": 985} {"train_loss": -10.47610092163086, "global_step": 165632, "epoch": 985} {"train_loss": -10.099920272827148, "global_step": 165633, "epoch": 985} {"train_loss": -10.658854484558105, "global_step": 165634, "epoch": 985} {"train_loss": -10.426125526428223, "global_step": 165635, "epoch": 985} {"train_loss": -10.681892395019531, "global_step": 165636, "epoch": 985} {"train_loss": -9.910297393798828, "global_step": 165637, "epoch": 985} {"train_loss": -10.741920471191406, "global_step": 165638, "epoch": 985} {"train_loss": -10.5460205078125, "global_step": 165639, "epoch": 985} {"train_loss": -10.28109359741211, "global_step": 165640, "epoch": 985} {"train_loss": -10.689516067504883, "global_step": 165641, "epoch": 985} {"train_loss": -10.054887771606445, "global_step": 165642, "epoch": 985} {"train_loss": -10.675222396850586, "global_step": 165643, "epoch": 985} {"train_loss": -9.991844177246094, "global_step": 165644, "epoch": 985} {"train_loss": -10.570084571838379, "global_step": 165645, "epoch": 985} {"train_loss": -10.376485824584961, "global_step": 165646, "epoch": 985} {"train_loss": -10.85563938390641, "global_step": 165647, "epoch": 985, "val_loss": 238066.109375, "train_action_mse_error": 0.8581658601760864} {"train_loss": -10.016777038574219, "global_step": 165648, "epoch": 986} {"train_loss": -10.620689392089844, "global_step": 165649, "epoch": 986} {"train_loss": -10.43284797668457, "global_step": 165650, "epoch": 986} {"train_loss": -10.810964584350586, "global_step": 165651, "epoch": 986} {"train_loss": -10.410694122314453, "global_step": 165652, "epoch": 986} {"train_loss": -10.624990463256836, "global_step": 165653, "epoch": 986} {"train_loss": -10.695152282714844, "global_step": 165654, "epoch": 986} {"train_loss": -10.705695152282715, "global_step": 165655, "epoch": 986} {"train_loss": -10.601080894470215, "global_step": 165656, "epoch": 986} {"train_loss": -11.052599906921387, "global_step": 165657, "epoch": 986} {"train_loss": -10.624237060546875, "global_step": 165658, "epoch": 986} {"train_loss": -10.880956649780273, "global_step": 165659, "epoch": 986} {"train_loss": -10.599625587463379, "global_step": 165660, "epoch": 986} {"train_loss": -10.933836936950684, "global_step": 165661, "epoch": 986} {"train_loss": -10.590576171875, "global_step": 165662, "epoch": 986} {"train_loss": -10.78908920288086, "global_step": 165663, "epoch": 986} {"train_loss": -10.698945999145508, "global_step": 165664, "epoch": 986} {"train_loss": -10.95687484741211, "global_step": 165665, "epoch": 986} {"train_loss": -10.783821105957031, "global_step": 165666, "epoch": 986} {"train_loss": -11.048736572265625, "global_step": 165667, "epoch": 986} {"train_loss": -11.084304809570312, "global_step": 165668, "epoch": 986} {"train_loss": -11.250659942626953, "global_step": 165669, "epoch": 986} {"train_loss": -11.000619888305664, "global_step": 165670, "epoch": 986} {"train_loss": -11.172562599182129, "global_step": 165671, "epoch": 986} {"train_loss": -10.749919891357422, "global_step": 165672, "epoch": 986} {"train_loss": -10.859302520751953, "global_step": 165673, "epoch": 986} {"train_loss": -10.999800682067871, "global_step": 165674, "epoch": 986} {"train_loss": -11.094173431396484, "global_step": 165675, "epoch": 986} {"train_loss": -11.12411880493164, "global_step": 165676, "epoch": 986} {"train_loss": -11.15323257446289, "global_step": 165677, "epoch": 986} {"train_loss": -11.051652908325195, "global_step": 165678, "epoch": 986} {"train_loss": -11.275785446166992, "global_step": 165679, "epoch": 986} {"train_loss": -11.287663459777832, "global_step": 165680, "epoch": 986} {"train_loss": -11.133520126342773, "global_step": 165681, "epoch": 986} {"train_loss": -11.281183242797852, "global_step": 165682, "epoch": 986} {"train_loss": -11.231391906738281, "global_step": 165683, "epoch": 986} {"train_loss": -11.024389266967773, "global_step": 165684, "epoch": 986} {"train_loss": -11.119645118713379, "global_step": 165685, "epoch": 986} {"train_loss": -11.32185173034668, "global_step": 165686, "epoch": 986} {"train_loss": -11.086714744567871, "global_step": 165687, "epoch": 986} {"train_loss": -11.25440788269043, "global_step": 165688, "epoch": 986} {"train_loss": -11.509418487548828, "global_step": 165689, "epoch": 986} {"train_loss": -11.252643585205078, "global_step": 165690, "epoch": 986} {"train_loss": -11.281954765319824, "global_step": 165691, "epoch": 986} {"train_loss": -11.248699188232422, "global_step": 165692, "epoch": 986} {"train_loss": -11.051496505737305, "global_step": 165693, "epoch": 986} {"train_loss": -11.379642486572266, "global_step": 165694, "epoch": 986} {"train_loss": -11.241531372070312, "global_step": 165695, "epoch": 986} {"train_loss": -11.496763229370117, "global_step": 165696, "epoch": 986} {"train_loss": -11.143023490905762, "global_step": 165697, "epoch": 986} {"train_loss": -11.402522087097168, "global_step": 165698, "epoch": 986} {"train_loss": -11.244154930114746, "global_step": 165699, "epoch": 986} {"train_loss": -11.454402923583984, "global_step": 165700, "epoch": 986} {"train_loss": -11.294015884399414, "global_step": 165701, "epoch": 986} {"train_loss": -11.366388320922852, "global_step": 165702, "epoch": 986} {"train_loss": -11.483207702636719, "global_step": 165703, "epoch": 986} {"train_loss": -11.65332317352295, "global_step": 165704, "epoch": 986} {"train_loss": -11.150383949279785, "global_step": 165705, "epoch": 986} {"train_loss": -11.321632385253906, "global_step": 165706, "epoch": 986} {"train_loss": -11.34882640838623, "global_step": 165707, "epoch": 986} {"train_loss": -11.239629745483398, "global_step": 165708, "epoch": 986} {"train_loss": -10.955472946166992, "global_step": 165709, "epoch": 986} {"train_loss": -11.003927230834961, "global_step": 165710, "epoch": 986} {"train_loss": -11.275876998901367, "global_step": 165711, "epoch": 986} {"train_loss": -9.55996036529541, "global_step": 165712, "epoch": 986} {"train_loss": -9.636800765991211, "global_step": 165713, "epoch": 986} {"train_loss": -9.727365493774414, "global_step": 165714, "epoch": 986} {"train_loss": -9.548282623291016, "global_step": 165715, "epoch": 986} {"train_loss": -10.877447128295898, "global_step": 165716, "epoch": 986} {"train_loss": -8.643672943115234, "global_step": 165717, "epoch": 986} {"train_loss": -9.14987564086914, "global_step": 165718, "epoch": 986} {"train_loss": -9.714334487915039, "global_step": 165719, "epoch": 986} {"train_loss": -8.961417198181152, "global_step": 165720, "epoch": 986} {"train_loss": -9.50158977508545, "global_step": 165721, "epoch": 986} {"train_loss": -9.11369514465332, "global_step": 165722, "epoch": 986} {"train_loss": -10.561118125915527, "global_step": 165723, "epoch": 986} {"train_loss": -9.926655769348145, "global_step": 165724, "epoch": 986} {"train_loss": -10.657657623291016, "global_step": 165725, "epoch": 986} {"train_loss": -10.232147216796875, "global_step": 165726, "epoch": 986} {"train_loss": -10.731715202331543, "global_step": 165727, "epoch": 986} {"train_loss": -10.495491027832031, "global_step": 165728, "epoch": 986} {"train_loss": -10.737753868103027, "global_step": 165729, "epoch": 986} {"train_loss": -9.894964218139648, "global_step": 165730, "epoch": 986} {"train_loss": -10.758983612060547, "global_step": 165731, "epoch": 986} {"train_loss": -10.081353187561035, "global_step": 165732, "epoch": 986} {"train_loss": -10.449725151062012, "global_step": 165733, "epoch": 986} {"train_loss": -10.455862045288086, "global_step": 165734, "epoch": 986} {"train_loss": -10.957361221313477, "global_step": 165735, "epoch": 986} {"train_loss": -10.633914947509766, "global_step": 165736, "epoch": 986} {"train_loss": -10.589570999145508, "global_step": 165737, "epoch": 986} {"train_loss": -10.548627853393555, "global_step": 165738, "epoch": 986} {"train_loss": -10.624380111694336, "global_step": 165739, "epoch": 986} {"train_loss": -11.008323669433594, "global_step": 165740, "epoch": 986} {"train_loss": -10.802875518798828, "global_step": 165741, "epoch": 986} {"train_loss": -10.78921890258789, "global_step": 165742, "epoch": 986} {"train_loss": -10.71256160736084, "global_step": 165743, "epoch": 986} {"train_loss": -10.950428009033203, "global_step": 165744, "epoch": 986} {"train_loss": -10.697427749633789, "global_step": 165745, "epoch": 986} {"train_loss": -10.752584457397461, "global_step": 165746, "epoch": 986} {"train_loss": -10.972123146057129, "global_step": 165747, "epoch": 986} {"train_loss": -10.889849662780762, "global_step": 165748, "epoch": 986} {"train_loss": -10.879244804382324, "global_step": 165749, "epoch": 986} {"train_loss": -10.897270202636719, "global_step": 165750, "epoch": 986} {"train_loss": -10.69581413269043, "global_step": 165751, "epoch": 986} {"train_loss": -10.95046329498291, "global_step": 165752, "epoch": 986} {"train_loss": -10.886284828186035, "global_step": 165753, "epoch": 986} {"train_loss": -11.027050018310547, "global_step": 165754, "epoch": 986} {"train_loss": -10.830920219421387, "global_step": 165755, "epoch": 986} {"train_loss": -11.018901824951172, "global_step": 165756, "epoch": 986} {"train_loss": -10.968515396118164, "global_step": 165757, "epoch": 986} {"train_loss": -11.145278930664062, "global_step": 165758, "epoch": 986} {"train_loss": -10.956368446350098, "global_step": 165759, "epoch": 986} {"train_loss": -11.058563232421875, "global_step": 165760, "epoch": 986} {"train_loss": -11.035333633422852, "global_step": 165761, "epoch": 986} {"train_loss": -10.876436233520508, "global_step": 165762, "epoch": 986} {"train_loss": -11.120716094970703, "global_step": 165763, "epoch": 986} {"train_loss": -11.142837524414062, "global_step": 165764, "epoch": 986} {"train_loss": -11.027538299560547, "global_step": 165765, "epoch": 986} {"train_loss": -11.169332504272461, "global_step": 165766, "epoch": 986} {"train_loss": -11.185256958007812, "global_step": 165767, "epoch": 986} {"train_loss": -11.091509819030762, "global_step": 165768, "epoch": 986} {"train_loss": -11.193205833435059, "global_step": 165769, "epoch": 986} {"train_loss": -11.293367385864258, "global_step": 165770, "epoch": 986} {"train_loss": -11.28532600402832, "global_step": 165771, "epoch": 986} {"train_loss": -11.161701202392578, "global_step": 165772, "epoch": 986} {"train_loss": -10.902328491210938, "global_step": 165773, "epoch": 986} {"train_loss": -11.212100982666016, "global_step": 165774, "epoch": 986} {"train_loss": -11.058446884155273, "global_step": 165775, "epoch": 986} {"train_loss": -11.233939170837402, "global_step": 165776, "epoch": 986} {"train_loss": -11.08779525756836, "global_step": 165777, "epoch": 986} {"train_loss": -11.273061752319336, "global_step": 165778, "epoch": 986} {"train_loss": -11.436498641967773, "global_step": 165779, "epoch": 986} {"train_loss": -11.182050704956055, "global_step": 165780, "epoch": 986} {"train_loss": -11.397756576538086, "global_step": 165781, "epoch": 986} {"train_loss": -11.135223388671875, "global_step": 165782, "epoch": 986} {"train_loss": -11.530364036560059, "global_step": 165783, "epoch": 986} {"train_loss": -11.267631530761719, "global_step": 165784, "epoch": 986} {"train_loss": -11.380727767944336, "global_step": 165785, "epoch": 986} {"train_loss": -11.109453201293945, "global_step": 165786, "epoch": 986} {"train_loss": -11.190595626831055, "global_step": 165787, "epoch": 986} {"train_loss": -11.439961433410645, "global_step": 165788, "epoch": 986} {"train_loss": -11.2921142578125, "global_step": 165789, "epoch": 986} {"train_loss": -11.406893730163574, "global_step": 165790, "epoch": 986} {"train_loss": -11.632888793945312, "global_step": 165791, "epoch": 986} {"train_loss": -10.770042419433594, "global_step": 165792, "epoch": 986} {"train_loss": -11.292688369750977, "global_step": 165793, "epoch": 986} {"train_loss": -11.188276290893555, "global_step": 165794, "epoch": 986} {"train_loss": -10.823192596435547, "global_step": 165795, "epoch": 986} {"train_loss": -11.114852905273438, "global_step": 165796, "epoch": 986} {"train_loss": -11.033256530761719, "global_step": 165797, "epoch": 986} {"train_loss": -11.026790618896484, "global_step": 165798, "epoch": 986} {"train_loss": -11.125965118408203, "global_step": 165799, "epoch": 986} {"train_loss": -10.71414566040039, "global_step": 165800, "epoch": 986} {"train_loss": -9.868892669677734, "global_step": 165801, "epoch": 986} {"train_loss": -10.624011993408203, "global_step": 165802, "epoch": 986} {"train_loss": -10.853776931762695, "global_step": 165803, "epoch": 986} {"train_loss": -10.800756454467773, "global_step": 165804, "epoch": 986} {"train_loss": -10.161809921264648, "global_step": 165805, "epoch": 986} {"train_loss": -10.471569061279297, "global_step": 165806, "epoch": 986} {"train_loss": -10.868362426757812, "global_step": 165807, "epoch": 986} {"train_loss": -10.90939998626709, "global_step": 165808, "epoch": 986} {"train_loss": -11.145952224731445, "global_step": 165809, "epoch": 986} {"train_loss": -10.597916603088379, "global_step": 165810, "epoch": 986} {"train_loss": -10.986875534057617, "global_step": 165811, "epoch": 986} {"train_loss": -10.619887351989746, "global_step": 165812, "epoch": 986} {"train_loss": -10.953924179077148, "global_step": 165813, "epoch": 986} {"train_loss": -10.603139877319336, "global_step": 165814, "epoch": 986} {"train_loss": -10.866444723946708, "global_step": 165815, "epoch": 986, "val_loss": 234915.375} {"train_loss": -9.4063138961792, "global_step": 165816, "epoch": 987} {"train_loss": -9.947419166564941, "global_step": 165817, "epoch": 987} {"train_loss": -9.105424880981445, "global_step": 165818, "epoch": 987} {"train_loss": -10.28256607055664, "global_step": 165819, "epoch": 987} {"train_loss": -8.863399505615234, "global_step": 165820, "epoch": 987} {"train_loss": -10.859429359436035, "global_step": 165821, "epoch": 987} {"train_loss": -9.274463653564453, "global_step": 165822, "epoch": 987} {"train_loss": -10.619583129882812, "global_step": 165823, "epoch": 987} {"train_loss": -9.902973175048828, "global_step": 165824, "epoch": 987} {"train_loss": -10.667662620544434, "global_step": 165825, "epoch": 987} {"train_loss": -10.252787590026855, "global_step": 165826, "epoch": 987} {"train_loss": -10.330886840820312, "global_step": 165827, "epoch": 987} {"train_loss": -10.51931095123291, "global_step": 165828, "epoch": 987} {"train_loss": -10.46357536315918, "global_step": 165829, "epoch": 987} {"train_loss": -10.475399017333984, "global_step": 165830, "epoch": 987} {"train_loss": -10.469583511352539, "global_step": 165831, "epoch": 987} {"train_loss": -10.410280227661133, "global_step": 165832, "epoch": 987} {"train_loss": -10.76243782043457, "global_step": 165833, "epoch": 987} {"train_loss": -10.468372344970703, "global_step": 165834, "epoch": 987} {"train_loss": -10.728897094726562, "global_step": 165835, "epoch": 987} {"train_loss": -10.465858459472656, "global_step": 165836, "epoch": 987} {"train_loss": -10.836074829101562, "global_step": 165837, "epoch": 987} {"train_loss": -10.435127258300781, "global_step": 165838, "epoch": 987} {"train_loss": -10.953113555908203, "global_step": 165839, "epoch": 987} {"train_loss": -10.479490280151367, "global_step": 165840, "epoch": 987} {"train_loss": -10.657265663146973, "global_step": 165841, "epoch": 987} {"train_loss": -10.745226860046387, "global_step": 165842, "epoch": 987} {"train_loss": -11.103845596313477, "global_step": 165843, "epoch": 987} {"train_loss": -10.763504028320312, "global_step": 165844, "epoch": 987} {"train_loss": -10.624737739562988, "global_step": 165845, "epoch": 987} {"train_loss": -10.810717582702637, "global_step": 165846, "epoch": 987} {"train_loss": -10.812769889831543, "global_step": 165847, "epoch": 987} {"train_loss": -10.795909881591797, "global_step": 165848, "epoch": 987} {"train_loss": -11.087753295898438, "global_step": 165849, "epoch": 987} {"train_loss": -10.937308311462402, "global_step": 165850, "epoch": 987} {"train_loss": -10.964984893798828, "global_step": 165851, "epoch": 987} {"train_loss": -10.822092056274414, "global_step": 165852, "epoch": 987} {"train_loss": -10.97743034362793, "global_step": 165853, "epoch": 987} {"train_loss": -11.111464500427246, "global_step": 165854, "epoch": 987} {"train_loss": -11.030509948730469, "global_step": 165855, "epoch": 987} {"train_loss": -11.057470321655273, "global_step": 165856, "epoch": 987} {"train_loss": -11.023283004760742, "global_step": 165857, "epoch": 987} {"train_loss": -11.083345413208008, "global_step": 165858, "epoch": 987} {"train_loss": -10.975631713867188, "global_step": 165859, "epoch": 987} {"train_loss": -11.073440551757812, "global_step": 165860, "epoch": 987} {"train_loss": -11.062385559082031, "global_step": 165861, "epoch": 987} {"train_loss": -11.11498737335205, "global_step": 165862, "epoch": 987} {"train_loss": -11.179295539855957, "global_step": 165863, "epoch": 987} {"train_loss": -11.256416320800781, "global_step": 165864, "epoch": 987} {"train_loss": -11.218177795410156, "global_step": 165865, "epoch": 987} {"train_loss": -11.15803050994873, "global_step": 165866, "epoch": 987} {"train_loss": -11.333427429199219, "global_step": 165867, "epoch": 987} {"train_loss": -11.348756790161133, "global_step": 165868, "epoch": 987} {"train_loss": -11.459186553955078, "global_step": 165869, "epoch": 987} {"train_loss": -11.294936180114746, "global_step": 165870, "epoch": 987} {"train_loss": -11.372269630432129, "global_step": 165871, "epoch": 987} {"train_loss": -11.374401092529297, "global_step": 165872, "epoch": 987} {"train_loss": -11.381217956542969, "global_step": 165873, "epoch": 987} {"train_loss": -11.209701538085938, "global_step": 165874, "epoch": 987} {"train_loss": -11.20045280456543, "global_step": 165875, "epoch": 987} {"train_loss": -11.457269668579102, "global_step": 165876, "epoch": 987} {"train_loss": -11.33798599243164, "global_step": 165877, "epoch": 987} {"train_loss": -11.343225479125977, "global_step": 165878, "epoch": 987} {"train_loss": -11.352262496948242, "global_step": 165879, "epoch": 987} {"train_loss": -11.197998046875, "global_step": 165880, "epoch": 987} {"train_loss": -11.295442581176758, "global_step": 165881, "epoch": 987} {"train_loss": -11.311361312866211, "global_step": 165882, "epoch": 987} {"train_loss": -11.15546989440918, "global_step": 165883, "epoch": 987} {"train_loss": -10.899406433105469, "global_step": 165884, "epoch": 987} {"train_loss": -11.038896560668945, "global_step": 165885, "epoch": 987} {"train_loss": -11.177438735961914, "global_step": 165886, "epoch": 987} {"train_loss": -10.959041595458984, "global_step": 165887, "epoch": 987} {"train_loss": -10.702588081359863, "global_step": 165888, "epoch": 987} {"train_loss": -11.026037216186523, "global_step": 165889, "epoch": 987} {"train_loss": -11.012772560119629, "global_step": 165890, "epoch": 987} {"train_loss": -11.16588306427002, "global_step": 165891, "epoch": 987} {"train_loss": -10.942667961120605, "global_step": 165892, "epoch": 987} {"train_loss": -11.299444198608398, "global_step": 165893, "epoch": 987} {"train_loss": -10.960402488708496, "global_step": 165894, "epoch": 987} {"train_loss": -11.393107414245605, "global_step": 165895, "epoch": 987} {"train_loss": -10.852547645568848, "global_step": 165896, "epoch": 987} {"train_loss": -11.109195709228516, "global_step": 165897, "epoch": 987} {"train_loss": -10.823711395263672, "global_step": 165898, "epoch": 987} {"train_loss": -10.453709602355957, "global_step": 165899, "epoch": 987} {"train_loss": -10.683820724487305, "global_step": 165900, "epoch": 987} {"train_loss": -11.152414321899414, "global_step": 165901, "epoch": 987} {"train_loss": -10.045616149902344, "global_step": 165902, "epoch": 987} {"train_loss": -11.312267303466797, "global_step": 165903, "epoch": 987} {"train_loss": -11.13840103149414, "global_step": 165904, "epoch": 987} {"train_loss": -10.999223709106445, "global_step": 165905, "epoch": 987} {"train_loss": -10.787313461303711, "global_step": 165906, "epoch": 987} {"train_loss": -10.973755836486816, "global_step": 165907, "epoch": 987} {"train_loss": -10.724493026733398, "global_step": 165908, "epoch": 987} {"train_loss": -10.584676742553711, "global_step": 165909, "epoch": 987} {"train_loss": -10.827420234680176, "global_step": 165910, "epoch": 987} {"train_loss": -11.011710166931152, "global_step": 165911, "epoch": 987} {"train_loss": -10.319219589233398, "global_step": 165912, "epoch": 987} {"train_loss": -10.840662002563477, "global_step": 165913, "epoch": 987} {"train_loss": -10.349142074584961, "global_step": 165914, "epoch": 987} {"train_loss": -10.028965950012207, "global_step": 165915, "epoch": 987} {"train_loss": -10.243549346923828, "global_step": 165916, "epoch": 987} {"train_loss": -10.62198543548584, "global_step": 165917, "epoch": 987} {"train_loss": -9.964049339294434, "global_step": 165918, "epoch": 987} {"train_loss": -10.89905834197998, "global_step": 165919, "epoch": 987} {"train_loss": -10.599773406982422, "global_step": 165920, "epoch": 987} {"train_loss": -10.623941421508789, "global_step": 165921, "epoch": 987} {"train_loss": -10.716812133789062, "global_step": 165922, "epoch": 987} {"train_loss": -10.58660888671875, "global_step": 165923, "epoch": 987} {"train_loss": -10.509965896606445, "global_step": 165924, "epoch": 987} {"train_loss": -10.5847749710083, "global_step": 165925, "epoch": 987} {"train_loss": -10.712428092956543, "global_step": 165926, "epoch": 987} {"train_loss": -10.854140281677246, "global_step": 165927, "epoch": 987} {"train_loss": -10.571027755737305, "global_step": 165928, "epoch": 987} {"train_loss": -10.591808319091797, "global_step": 165929, "epoch": 987} {"train_loss": -10.974180221557617, "global_step": 165930, "epoch": 987} {"train_loss": -10.179084777832031, "global_step": 165931, "epoch": 987} {"train_loss": -10.806157112121582, "global_step": 165932, "epoch": 987} {"train_loss": -10.457382202148438, "global_step": 165933, "epoch": 987} {"train_loss": -10.588594436645508, "global_step": 165934, "epoch": 987} {"train_loss": -10.861709594726562, "global_step": 165935, "epoch": 987} {"train_loss": -10.645347595214844, "global_step": 165936, "epoch": 987} {"train_loss": -10.65311050415039, "global_step": 165937, "epoch": 987} {"train_loss": -10.958809852600098, "global_step": 165938, "epoch": 987} {"train_loss": -10.469415664672852, "global_step": 165939, "epoch": 987} {"train_loss": -10.992415428161621, "global_step": 165940, "epoch": 987} {"train_loss": -10.828840255737305, "global_step": 165941, "epoch": 987} {"train_loss": -11.146954536437988, "global_step": 165942, "epoch": 987} {"train_loss": -10.651504516601562, "global_step": 165943, "epoch": 987} {"train_loss": -11.307683944702148, "global_step": 165944, "epoch": 987} {"train_loss": -10.803071975708008, "global_step": 165945, "epoch": 987} {"train_loss": -11.246288299560547, "global_step": 165946, "epoch": 987} {"train_loss": -11.076415061950684, "global_step": 165947, "epoch": 987} {"train_loss": -11.131689071655273, "global_step": 165948, "epoch": 987} {"train_loss": -11.109728813171387, "global_step": 165949, "epoch": 987} {"train_loss": -11.136127471923828, "global_step": 165950, "epoch": 987} {"train_loss": -11.095434188842773, "global_step": 165951, "epoch": 987} {"train_loss": -11.42021369934082, "global_step": 165952, "epoch": 987} {"train_loss": -11.101640701293945, "global_step": 165953, "epoch": 987} {"train_loss": -11.07425308227539, "global_step": 165954, "epoch": 987} {"train_loss": -11.124923706054688, "global_step": 165955, "epoch": 987} {"train_loss": -11.101568222045898, "global_step": 165956, "epoch": 987} {"train_loss": -11.206028938293457, "global_step": 165957, "epoch": 987} {"train_loss": -11.276691436767578, "global_step": 165958, "epoch": 987} {"train_loss": -11.328310012817383, "global_step": 165959, "epoch": 987} {"train_loss": -11.06568717956543, "global_step": 165960, "epoch": 987} {"train_loss": -11.226118087768555, "global_step": 165961, "epoch": 987} {"train_loss": -11.10912799835205, "global_step": 165962, "epoch": 987} {"train_loss": -11.2518310546875, "global_step": 165963, "epoch": 987} {"train_loss": -11.044519424438477, "global_step": 165964, "epoch": 987} {"train_loss": -11.015087127685547, "global_step": 165965, "epoch": 987} {"train_loss": -11.14549446105957, "global_step": 165966, "epoch": 987} {"train_loss": -10.859474182128906, "global_step": 165967, "epoch": 987} {"train_loss": -11.161218643188477, "global_step": 165968, "epoch": 987} {"train_loss": -11.285205841064453, "global_step": 165969, "epoch": 987} {"train_loss": -10.922317504882812, "global_step": 165970, "epoch": 987} {"train_loss": -11.148736953735352, "global_step": 165971, "epoch": 987} {"train_loss": -10.677857398986816, "global_step": 165972, "epoch": 987} {"train_loss": -11.269208908081055, "global_step": 165973, "epoch": 987} {"train_loss": -11.129633903503418, "global_step": 165974, "epoch": 987} {"train_loss": -11.296045303344727, "global_step": 165975, "epoch": 987} {"train_loss": -11.403564453125, "global_step": 165976, "epoch": 987} {"train_loss": -11.108487129211426, "global_step": 165977, "epoch": 987} {"train_loss": -11.315752029418945, "global_step": 165978, "epoch": 987} {"train_loss": -11.17685317993164, "global_step": 165979, "epoch": 987} {"train_loss": -11.290389060974121, "global_step": 165980, "epoch": 987} {"train_loss": -11.475919723510742, "global_step": 165981, "epoch": 987} {"train_loss": -11.298896789550781, "global_step": 165982, "epoch": 987} {"train_loss": -10.876941056478591, "global_step": 165983, "epoch": 987, "val_loss": 237240.34375} {"train_loss": -10.930374145507812, "global_step": 165984, "epoch": 988} {"train_loss": -11.298601150512695, "global_step": 165985, "epoch": 988} {"train_loss": -11.180266380310059, "global_step": 165986, "epoch": 988} {"train_loss": -11.452518463134766, "global_step": 165987, "epoch": 988} {"train_loss": -11.105981826782227, "global_step": 165988, "epoch": 988} {"train_loss": -11.087690353393555, "global_step": 165989, "epoch": 988} {"train_loss": -11.072760581970215, "global_step": 165990, "epoch": 988} {"train_loss": -11.490045547485352, "global_step": 165991, "epoch": 988} {"train_loss": -10.775165557861328, "global_step": 165992, "epoch": 988} {"train_loss": -10.010095596313477, "global_step": 165993, "epoch": 988} {"train_loss": -10.52995491027832, "global_step": 165994, "epoch": 988} {"train_loss": -10.690909385681152, "global_step": 165995, "epoch": 988} {"train_loss": -9.524641036987305, "global_step": 165996, "epoch": 988} {"train_loss": -11.28198528289795, "global_step": 165997, "epoch": 988} {"train_loss": -10.207927703857422, "global_step": 165998, "epoch": 988} {"train_loss": -10.249910354614258, "global_step": 165999, "epoch": 988} {"train_loss": -10.042118072509766, "global_step": 166000, "epoch": 988} {"train_loss": -10.795154571533203, "global_step": 166001, "epoch": 988} {"train_loss": -9.89809513092041, "global_step": 166002, "epoch": 988} {"train_loss": -10.599081039428711, "global_step": 166003, "epoch": 988} {"train_loss": -11.200028419494629, "global_step": 166004, "epoch": 988} {"train_loss": -9.907903671264648, "global_step": 166005, "epoch": 988} {"train_loss": -10.175375938415527, "global_step": 166006, "epoch": 988} {"train_loss": -10.448736190795898, "global_step": 166007, "epoch": 988} {"train_loss": -9.688486099243164, "global_step": 166008, "epoch": 988} {"train_loss": -10.90146541595459, "global_step": 166009, "epoch": 988} {"train_loss": -9.826717376708984, "global_step": 166010, "epoch": 988} {"train_loss": -10.21221923828125, "global_step": 166011, "epoch": 988} {"train_loss": -10.650764465332031, "global_step": 166012, "epoch": 988} {"train_loss": -9.637348175048828, "global_step": 166013, "epoch": 988} {"train_loss": -10.361201286315918, "global_step": 166014, "epoch": 988} {"train_loss": -9.295671463012695, "global_step": 166015, "epoch": 988} {"train_loss": -10.539487838745117, "global_step": 166016, "epoch": 988} {"train_loss": -9.877002716064453, "global_step": 166017, "epoch": 988} {"train_loss": -10.78182601928711, "global_step": 166018, "epoch": 988} {"train_loss": -9.052196502685547, "global_step": 166019, "epoch": 988} {"train_loss": -10.660943031311035, "global_step": 166020, "epoch": 988} {"train_loss": -9.726245880126953, "global_step": 166021, "epoch": 988} {"train_loss": -10.48565673828125, "global_step": 166022, "epoch": 988} {"train_loss": -9.894060134887695, "global_step": 166023, "epoch": 988} {"train_loss": -10.280975341796875, "global_step": 166024, "epoch": 988} {"train_loss": -10.03729248046875, "global_step": 166025, "epoch": 988} {"train_loss": -10.792346000671387, "global_step": 166026, "epoch": 988} {"train_loss": -10.378927230834961, "global_step": 166027, "epoch": 988} {"train_loss": -10.099014282226562, "global_step": 166028, "epoch": 988} {"train_loss": -10.581174850463867, "global_step": 166029, "epoch": 988} {"train_loss": -10.225502967834473, "global_step": 166030, "epoch": 988} {"train_loss": -10.297386169433594, "global_step": 166031, "epoch": 988} {"train_loss": -10.708759307861328, "global_step": 166032, "epoch": 988} {"train_loss": -10.434979438781738, "global_step": 166033, "epoch": 988} {"train_loss": -10.143081665039062, "global_step": 166034, "epoch": 988} {"train_loss": -10.669313430786133, "global_step": 166035, "epoch": 988} {"train_loss": -10.733890533447266, "global_step": 166036, "epoch": 988} {"train_loss": -10.265707969665527, "global_step": 166037, "epoch": 988} {"train_loss": -10.514490127563477, "global_step": 166038, "epoch": 988} {"train_loss": -10.57392692565918, "global_step": 166039, "epoch": 988} {"train_loss": -10.620966911315918, "global_step": 166040, "epoch": 988} {"train_loss": -10.901359558105469, "global_step": 166041, "epoch": 988} {"train_loss": -10.736994743347168, "global_step": 166042, "epoch": 988} {"train_loss": -10.70302963256836, "global_step": 166043, "epoch": 988} {"train_loss": -10.861477851867676, "global_step": 166044, "epoch": 988} {"train_loss": -10.946298599243164, "global_step": 166045, "epoch": 988} {"train_loss": -10.715010643005371, "global_step": 166046, "epoch": 988} {"train_loss": -10.783445358276367, "global_step": 166047, "epoch": 988} {"train_loss": -11.107953071594238, "global_step": 166048, "epoch": 988} {"train_loss": -10.713468551635742, "global_step": 166049, "epoch": 988} {"train_loss": -10.801614761352539, "global_step": 166050, "epoch": 988} {"train_loss": -10.842297554016113, "global_step": 166051, "epoch": 988} {"train_loss": -11.058517456054688, "global_step": 166052, "epoch": 988} {"train_loss": -10.919239044189453, "global_step": 166053, "epoch": 988} {"train_loss": -10.838211059570312, "global_step": 166054, "epoch": 988} {"train_loss": -10.96773910522461, "global_step": 166055, "epoch": 988} {"train_loss": -10.759967803955078, "global_step": 166056, "epoch": 988} {"train_loss": -11.177783966064453, "global_step": 166057, "epoch": 988} {"train_loss": -11.089353561401367, "global_step": 166058, "epoch": 988} {"train_loss": -11.044021606445312, "global_step": 166059, "epoch": 988} {"train_loss": -10.97774600982666, "global_step": 166060, "epoch": 988} {"train_loss": -11.093169212341309, "global_step": 166061, "epoch": 988} {"train_loss": -11.118814468383789, "global_step": 166062, "epoch": 988} {"train_loss": -11.222565650939941, "global_step": 166063, "epoch": 988} {"train_loss": -10.961835861206055, "global_step": 166064, "epoch": 988} {"train_loss": -11.149995803833008, "global_step": 166065, "epoch": 988} {"train_loss": -11.20566177368164, "global_step": 166066, "epoch": 988} {"train_loss": -11.121725082397461, "global_step": 166067, "epoch": 988} {"train_loss": -11.112274169921875, "global_step": 166068, "epoch": 988} {"train_loss": -11.096426010131836, "global_step": 166069, "epoch": 988} {"train_loss": -11.177995681762695, "global_step": 166070, "epoch": 988} {"train_loss": -11.22125244140625, "global_step": 166071, "epoch": 988} {"train_loss": -11.102595329284668, "global_step": 166072, "epoch": 988} {"train_loss": -11.123259544372559, "global_step": 166073, "epoch": 988} {"train_loss": -11.214174270629883, "global_step": 166074, "epoch": 988} {"train_loss": -11.26237964630127, "global_step": 166075, "epoch": 988} {"train_loss": -11.039304733276367, "global_step": 166076, "epoch": 988} {"train_loss": -11.284507751464844, "global_step": 166077, "epoch": 988} {"train_loss": -11.135919570922852, "global_step": 166078, "epoch": 988} {"train_loss": -11.329690933227539, "global_step": 166079, "epoch": 988} {"train_loss": -11.09688949584961, "global_step": 166080, "epoch": 988} {"train_loss": -11.269987106323242, "global_step": 166081, "epoch": 988} {"train_loss": -11.393436431884766, "global_step": 166082, "epoch": 988} {"train_loss": -11.286405563354492, "global_step": 166083, "epoch": 988} {"train_loss": -11.394561767578125, "global_step": 166084, "epoch": 988} {"train_loss": -11.385355949401855, "global_step": 166085, "epoch": 988} {"train_loss": -11.361237525939941, "global_step": 166086, "epoch": 988} {"train_loss": -11.124503135681152, "global_step": 166087, "epoch": 988} {"train_loss": -11.323097229003906, "global_step": 166088, "epoch": 988} {"train_loss": -11.37507438659668, "global_step": 166089, "epoch": 988} {"train_loss": -11.02499771118164, "global_step": 166090, "epoch": 988} {"train_loss": -10.415450096130371, "global_step": 166091, "epoch": 988} {"train_loss": -10.812383651733398, "global_step": 166092, "epoch": 988} {"train_loss": -10.862628936767578, "global_step": 166093, "epoch": 988} {"train_loss": -9.875235557556152, "global_step": 166094, "epoch": 988} {"train_loss": -10.68822193145752, "global_step": 166095, "epoch": 988} {"train_loss": -10.667825698852539, "global_step": 166096, "epoch": 988} {"train_loss": -10.584354400634766, "global_step": 166097, "epoch": 988} {"train_loss": -11.235549926757812, "global_step": 166098, "epoch": 988} {"train_loss": -10.683052062988281, "global_step": 166099, "epoch": 988} {"train_loss": -10.964592933654785, "global_step": 166100, "epoch": 988} {"train_loss": -11.004690170288086, "global_step": 166101, "epoch": 988} {"train_loss": -10.276440620422363, "global_step": 166102, "epoch": 988} {"train_loss": -9.26982307434082, "global_step": 166103, "epoch": 988} {"train_loss": -10.647758483886719, "global_step": 166104, "epoch": 988} {"train_loss": -9.891565322875977, "global_step": 166105, "epoch": 988} {"train_loss": -10.161236763000488, "global_step": 166106, "epoch": 988} {"train_loss": -10.769493103027344, "global_step": 166107, "epoch": 988} {"train_loss": -10.15570068359375, "global_step": 166108, "epoch": 988} {"train_loss": -10.959595680236816, "global_step": 166109, "epoch": 988} {"train_loss": -9.978018760681152, "global_step": 166110, "epoch": 988} {"train_loss": -10.91227912902832, "global_step": 166111, "epoch": 988} {"train_loss": -10.749441146850586, "global_step": 166112, "epoch": 988} {"train_loss": -10.652420997619629, "global_step": 166113, "epoch": 988} {"train_loss": -10.895115852355957, "global_step": 166114, "epoch": 988} {"train_loss": -10.626138687133789, "global_step": 166115, "epoch": 988} {"train_loss": -10.24864387512207, "global_step": 166116, "epoch": 988} {"train_loss": -10.734031677246094, "global_step": 166117, "epoch": 988} {"train_loss": -10.22793197631836, "global_step": 166118, "epoch": 988} {"train_loss": -11.050869941711426, "global_step": 166119, "epoch": 988} {"train_loss": -10.107732772827148, "global_step": 166120, "epoch": 988} {"train_loss": -10.679278373718262, "global_step": 166121, "epoch": 988} {"train_loss": -10.674619674682617, "global_step": 166122, "epoch": 988} {"train_loss": -10.399910926818848, "global_step": 166123, "epoch": 988} {"train_loss": -10.638747215270996, "global_step": 166124, "epoch": 988} {"train_loss": -10.561009407043457, "global_step": 166125, "epoch": 988} {"train_loss": -10.976746559143066, "global_step": 166126, "epoch": 988} {"train_loss": -10.530937194824219, "global_step": 166127, "epoch": 988} {"train_loss": -10.765716552734375, "global_step": 166128, "epoch": 988} {"train_loss": -10.580480575561523, "global_step": 166129, "epoch": 988} {"train_loss": -10.659239768981934, "global_step": 166130, "epoch": 988} {"train_loss": -10.316965103149414, "global_step": 166131, "epoch": 988} {"train_loss": -10.912033081054688, "global_step": 166132, "epoch": 988} {"train_loss": -10.657726287841797, "global_step": 166133, "epoch": 988} {"train_loss": -10.68923568725586, "global_step": 166134, "epoch": 988} {"train_loss": -10.92453670501709, "global_step": 166135, "epoch": 988} {"train_loss": -10.672762870788574, "global_step": 166136, "epoch": 988} {"train_loss": -10.559666633605957, "global_step": 166137, "epoch": 988} {"train_loss": -10.859271049499512, "global_step": 166138, "epoch": 988} {"train_loss": -10.689824104309082, "global_step": 166139, "epoch": 988} {"train_loss": -10.937570571899414, "global_step": 166140, "epoch": 988} {"train_loss": -10.949090003967285, "global_step": 166141, "epoch": 988} {"train_loss": -10.741239547729492, "global_step": 166142, "epoch": 988} {"train_loss": -11.236743927001953, "global_step": 166143, "epoch": 988} {"train_loss": -10.57589340209961, "global_step": 166144, "epoch": 988} {"train_loss": -10.566680908203125, "global_step": 166145, "epoch": 988} {"train_loss": -10.723845481872559, "global_step": 166146, "epoch": 988} {"train_loss": -10.609606742858887, "global_step": 166147, "epoch": 988} {"train_loss": -10.70331859588623, "global_step": 166148, "epoch": 988} {"train_loss": -10.729496955871582, "global_step": 166149, "epoch": 988} {"train_loss": -10.575481414794922, "global_step": 166150, "epoch": 988} {"train_loss": -10.693250207673936, "global_step": 166151, "epoch": 988, "val_loss": 239979.359375} {"train_loss": -11.060447692871094, "global_step": 166152, "epoch": 989} {"train_loss": -10.615108489990234, "global_step": 166153, "epoch": 989} {"train_loss": -11.023712158203125, "global_step": 166154, "epoch": 989} {"train_loss": -10.762662887573242, "global_step": 166155, "epoch": 989} {"train_loss": -10.815643310546875, "global_step": 166156, "epoch": 989} {"train_loss": -10.768255233764648, "global_step": 166157, "epoch": 989} {"train_loss": -10.663566589355469, "global_step": 166158, "epoch": 989} {"train_loss": -11.077285766601562, "global_step": 166159, "epoch": 989} {"train_loss": -10.958788871765137, "global_step": 166160, "epoch": 989} {"train_loss": -10.911388397216797, "global_step": 166161, "epoch": 989} {"train_loss": -11.065547943115234, "global_step": 166162, "epoch": 989} {"train_loss": -10.960878372192383, "global_step": 166163, "epoch": 989} {"train_loss": -10.74718952178955, "global_step": 166164, "epoch": 989} {"train_loss": -10.95535659790039, "global_step": 166165, "epoch": 989} {"train_loss": -10.980755805969238, "global_step": 166166, "epoch": 989} {"train_loss": -10.964452743530273, "global_step": 166167, "epoch": 989} {"train_loss": -11.176177024841309, "global_step": 166168, "epoch": 989} {"train_loss": -10.829357147216797, "global_step": 166169, "epoch": 989} {"train_loss": -10.8181734085083, "global_step": 166170, "epoch": 989} {"train_loss": -11.243611335754395, "global_step": 166171, "epoch": 989} {"train_loss": -10.974956512451172, "global_step": 166172, "epoch": 989} {"train_loss": -11.237140655517578, "global_step": 166173, "epoch": 989} {"train_loss": -10.984214782714844, "global_step": 166174, "epoch": 989} {"train_loss": -11.145586967468262, "global_step": 166175, "epoch": 989} {"train_loss": -11.102130889892578, "global_step": 166176, "epoch": 989} {"train_loss": -11.286761283874512, "global_step": 166177, "epoch": 989} {"train_loss": -11.32808780670166, "global_step": 166178, "epoch": 989} {"train_loss": -11.087675094604492, "global_step": 166179, "epoch": 989} {"train_loss": -11.313377380371094, "global_step": 166180, "epoch": 989} {"train_loss": -11.170642852783203, "global_step": 166181, "epoch": 989} {"train_loss": -11.38284683227539, "global_step": 166182, "epoch": 989} {"train_loss": -11.336219787597656, "global_step": 166183, "epoch": 989} {"train_loss": -11.032073974609375, "global_step": 166184, "epoch": 989} {"train_loss": -11.112743377685547, "global_step": 166185, "epoch": 989} {"train_loss": -11.139860153198242, "global_step": 166186, "epoch": 989} {"train_loss": -11.182977676391602, "global_step": 166187, "epoch": 989} {"train_loss": -10.964010238647461, "global_step": 166188, "epoch": 989} {"train_loss": -11.36538314819336, "global_step": 166189, "epoch": 989} {"train_loss": -10.576631546020508, "global_step": 166190, "epoch": 989} {"train_loss": -11.419139862060547, "global_step": 166191, "epoch": 989} {"train_loss": -11.216344833374023, "global_step": 166192, "epoch": 989} {"train_loss": -11.148170471191406, "global_step": 166193, "epoch": 989} {"train_loss": -11.131771087646484, "global_step": 166194, "epoch": 989} {"train_loss": -11.17132568359375, "global_step": 166195, "epoch": 989} {"train_loss": -11.348438262939453, "global_step": 166196, "epoch": 989} {"train_loss": -11.206212997436523, "global_step": 166197, "epoch": 989} {"train_loss": -11.388822555541992, "global_step": 166198, "epoch": 989} {"train_loss": -11.225176811218262, "global_step": 166199, "epoch": 989} {"train_loss": -11.348915100097656, "global_step": 166200, "epoch": 989} {"train_loss": -10.954044342041016, "global_step": 166201, "epoch": 989} {"train_loss": -11.255414962768555, "global_step": 166202, "epoch": 989} {"train_loss": -11.231512069702148, "global_step": 166203, "epoch": 989} {"train_loss": -11.19576358795166, "global_step": 166204, "epoch": 989} {"train_loss": -11.461355209350586, "global_step": 166205, "epoch": 989} {"train_loss": -11.036405563354492, "global_step": 166206, "epoch": 989} {"train_loss": -11.250459671020508, "global_step": 166207, "epoch": 989} {"train_loss": -10.50632381439209, "global_step": 166208, "epoch": 989} {"train_loss": -10.265462875366211, "global_step": 166209, "epoch": 989} {"train_loss": -10.035690307617188, "global_step": 166210, "epoch": 989} {"train_loss": -11.155891418457031, "global_step": 166211, "epoch": 989} {"train_loss": -9.453078269958496, "global_step": 166212, "epoch": 989} {"train_loss": -10.551156997680664, "global_step": 166213, "epoch": 989} {"train_loss": -10.486658096313477, "global_step": 166214, "epoch": 989} {"train_loss": -9.964208602905273, "global_step": 166215, "epoch": 989} {"train_loss": -10.545528411865234, "global_step": 166216, "epoch": 989} {"train_loss": -8.559249877929688, "global_step": 166217, "epoch": 989} {"train_loss": -10.745076179504395, "global_step": 166218, "epoch": 989} {"train_loss": -8.942479133605957, "global_step": 166219, "epoch": 989} {"train_loss": -10.13973617553711, "global_step": 166220, "epoch": 989} {"train_loss": -10.69367504119873, "global_step": 166221, "epoch": 989} {"train_loss": -9.629858016967773, "global_step": 166222, "epoch": 989} {"train_loss": -10.512467384338379, "global_step": 166223, "epoch": 989} {"train_loss": -10.12049674987793, "global_step": 166224, "epoch": 989} {"train_loss": -10.409388542175293, "global_step": 166225, "epoch": 989} {"train_loss": -10.156070709228516, "global_step": 166226, "epoch": 989} {"train_loss": -10.38957405090332, "global_step": 166227, "epoch": 989} {"train_loss": -10.829838752746582, "global_step": 166228, "epoch": 989} {"train_loss": -10.415316581726074, "global_step": 166229, "epoch": 989} {"train_loss": -10.529661178588867, "global_step": 166230, "epoch": 989} {"train_loss": -10.766559600830078, "global_step": 166231, "epoch": 989} {"train_loss": -10.556924819946289, "global_step": 166232, "epoch": 989} {"train_loss": -10.742279052734375, "global_step": 166233, "epoch": 989} {"train_loss": -10.711816787719727, "global_step": 166234, "epoch": 989} {"train_loss": -10.785516738891602, "global_step": 166235, "epoch": 989} {"train_loss": -11.107495307922363, "global_step": 166236, "epoch": 989} {"train_loss": -10.71778392791748, "global_step": 166237, "epoch": 989} {"train_loss": -10.987186431884766, "global_step": 166238, "epoch": 989} {"train_loss": -11.03558349609375, "global_step": 166239, "epoch": 989} {"train_loss": -10.766134262084961, "global_step": 166240, "epoch": 989} {"train_loss": -10.886153221130371, "global_step": 166241, "epoch": 989} {"train_loss": -10.71446704864502, "global_step": 166242, "epoch": 989} {"train_loss": -10.773853302001953, "global_step": 166243, "epoch": 989} {"train_loss": -10.757524490356445, "global_step": 166244, "epoch": 989} {"train_loss": -10.682356834411621, "global_step": 166245, "epoch": 989} {"train_loss": -10.901354789733887, "global_step": 166246, "epoch": 989} {"train_loss": -11.065225601196289, "global_step": 166247, "epoch": 989} {"train_loss": -10.702230453491211, "global_step": 166248, "epoch": 989} {"train_loss": -11.08143424987793, "global_step": 166249, "epoch": 989} {"train_loss": -10.645889282226562, "global_step": 166250, "epoch": 989} {"train_loss": -11.127699851989746, "global_step": 166251, "epoch": 989} {"train_loss": -10.751188278198242, "global_step": 166252, "epoch": 989} {"train_loss": -10.822219848632812, "global_step": 166253, "epoch": 989} {"train_loss": -10.779607772827148, "global_step": 166254, "epoch": 989} {"train_loss": -10.95372200012207, "global_step": 166255, "epoch": 989} {"train_loss": -11.016243934631348, "global_step": 166256, "epoch": 989} {"train_loss": -10.747966766357422, "global_step": 166257, "epoch": 989} {"train_loss": -11.127481460571289, "global_step": 166258, "epoch": 989} {"train_loss": -10.795395851135254, "global_step": 166259, "epoch": 989} {"train_loss": -11.220888137817383, "global_step": 166260, "epoch": 989} {"train_loss": -10.683658599853516, "global_step": 166261, "epoch": 989} {"train_loss": -11.165184020996094, "global_step": 166262, "epoch": 989} {"train_loss": -10.816657066345215, "global_step": 166263, "epoch": 989} {"train_loss": -11.263628959655762, "global_step": 166264, "epoch": 989} {"train_loss": -10.759480476379395, "global_step": 166265, "epoch": 989} {"train_loss": -11.172500610351562, "global_step": 166266, "epoch": 989} {"train_loss": -11.076109886169434, "global_step": 166267, "epoch": 989} {"train_loss": -11.21335220336914, "global_step": 166268, "epoch": 989} {"train_loss": -11.148465156555176, "global_step": 166269, "epoch": 989} {"train_loss": -11.381739616394043, "global_step": 166270, "epoch": 989} {"train_loss": -10.986833572387695, "global_step": 166271, "epoch": 989} {"train_loss": -10.94985580444336, "global_step": 166272, "epoch": 989} {"train_loss": -11.24897575378418, "global_step": 166273, "epoch": 989} {"train_loss": -11.304899215698242, "global_step": 166274, "epoch": 989} {"train_loss": -10.982999801635742, "global_step": 166275, "epoch": 989} {"train_loss": -11.1228609085083, "global_step": 166276, "epoch": 989} {"train_loss": -11.13453197479248, "global_step": 166277, "epoch": 989} {"train_loss": -11.060022354125977, "global_step": 166278, "epoch": 989} {"train_loss": -11.082956314086914, "global_step": 166279, "epoch": 989} {"train_loss": -11.214395523071289, "global_step": 166280, "epoch": 989} {"train_loss": -11.119955062866211, "global_step": 166281, "epoch": 989} {"train_loss": -11.21817398071289, "global_step": 166282, "epoch": 989} {"train_loss": -11.397915840148926, "global_step": 166283, "epoch": 989} {"train_loss": -11.201454162597656, "global_step": 166284, "epoch": 989} {"train_loss": -10.987752914428711, "global_step": 166285, "epoch": 989} {"train_loss": -11.274495124816895, "global_step": 166286, "epoch": 989} {"train_loss": -11.412805557250977, "global_step": 166287, "epoch": 989} {"train_loss": -11.202095031738281, "global_step": 166288, "epoch": 989} {"train_loss": -11.274876594543457, "global_step": 166289, "epoch": 989} {"train_loss": -11.385051727294922, "global_step": 166290, "epoch": 989} {"train_loss": -10.701335906982422, "global_step": 166291, "epoch": 989} {"train_loss": -11.438959121704102, "global_step": 166292, "epoch": 989} {"train_loss": -10.595388412475586, "global_step": 166293, "epoch": 989} {"train_loss": -10.556020736694336, "global_step": 166294, "epoch": 989} {"train_loss": -11.300331115722656, "global_step": 166295, "epoch": 989} {"train_loss": -10.840926170349121, "global_step": 166296, "epoch": 989} {"train_loss": -10.619647979736328, "global_step": 166297, "epoch": 989} {"train_loss": -11.329349517822266, "global_step": 166298, "epoch": 989} {"train_loss": -10.074728012084961, "global_step": 166299, "epoch": 989} {"train_loss": -10.805829048156738, "global_step": 166300, "epoch": 989} {"train_loss": -10.429472923278809, "global_step": 166301, "epoch": 989} {"train_loss": -10.33080768585205, "global_step": 166302, "epoch": 989} {"train_loss": -10.317281723022461, "global_step": 166303, "epoch": 989} {"train_loss": -10.781606674194336, "global_step": 166304, "epoch": 989} {"train_loss": -10.088367462158203, "global_step": 166305, "epoch": 989} {"train_loss": -10.446928024291992, "global_step": 166306, "epoch": 989} {"train_loss": -10.465595245361328, "global_step": 166307, "epoch": 989} {"train_loss": -10.288750648498535, "global_step": 166308, "epoch": 989} {"train_loss": -10.407249450683594, "global_step": 166309, "epoch": 989} {"train_loss": -8.552206039428711, "global_step": 166310, "epoch": 989} {"train_loss": -9.164491653442383, "global_step": 166311, "epoch": 989} {"train_loss": -10.200776100158691, "global_step": 166312, "epoch": 989} {"train_loss": -9.694443702697754, "global_step": 166313, "epoch": 989} {"train_loss": -10.044754028320312, "global_step": 166314, "epoch": 989} {"train_loss": -10.588421821594238, "global_step": 166315, "epoch": 989} {"train_loss": -10.209421157836914, "global_step": 166316, "epoch": 989} {"train_loss": -10.8147554397583, "global_step": 166317, "epoch": 989} {"train_loss": -10.274077415466309, "global_step": 166318, "epoch": 989} {"train_loss": -10.818892109961737, "global_step": 166319, "epoch": 989, "val_loss": 233435.203125} {"train_loss": -10.321361541748047, "global_step": 166320, "epoch": 990} {"train_loss": -9.931347846984863, "global_step": 166321, "epoch": 990} {"train_loss": -10.443244934082031, "global_step": 166322, "epoch": 990} {"train_loss": -10.838944435119629, "global_step": 166323, "epoch": 990} {"train_loss": -9.853313446044922, "global_step": 166324, "epoch": 990} {"train_loss": -10.841625213623047, "global_step": 166325, "epoch": 990} {"train_loss": -10.116132736206055, "global_step": 166326, "epoch": 990} {"train_loss": -10.745601654052734, "global_step": 166327, "epoch": 990} {"train_loss": -10.693781852722168, "global_step": 166328, "epoch": 990} {"train_loss": -10.579133987426758, "global_step": 166329, "epoch": 990} {"train_loss": -10.770273208618164, "global_step": 166330, "epoch": 990} {"train_loss": -10.812273979187012, "global_step": 166331, "epoch": 990} {"train_loss": -10.569414138793945, "global_step": 166332, "epoch": 990} {"train_loss": -10.86373519897461, "global_step": 166333, "epoch": 990} {"train_loss": -10.679816246032715, "global_step": 166334, "epoch": 990} {"train_loss": -10.817010879516602, "global_step": 166335, "epoch": 990} {"train_loss": -10.343204498291016, "global_step": 166336, "epoch": 990} {"train_loss": -10.897347450256348, "global_step": 166337, "epoch": 990} {"train_loss": -10.601053237915039, "global_step": 166338, "epoch": 990} {"train_loss": -10.8421630859375, "global_step": 166339, "epoch": 990} {"train_loss": -10.590855598449707, "global_step": 166340, "epoch": 990} {"train_loss": -10.5230712890625, "global_step": 166341, "epoch": 990} {"train_loss": -10.942560195922852, "global_step": 166342, "epoch": 990} {"train_loss": -10.575298309326172, "global_step": 166343, "epoch": 990} {"train_loss": -10.976747512817383, "global_step": 166344, "epoch": 990} {"train_loss": -10.782476425170898, "global_step": 166345, "epoch": 990} {"train_loss": -11.092118263244629, "global_step": 166346, "epoch": 990} {"train_loss": -10.856584548950195, "global_step": 166347, "epoch": 990} {"train_loss": -11.155475616455078, "global_step": 166348, "epoch": 990} {"train_loss": -10.944828033447266, "global_step": 166349, "epoch": 990} {"train_loss": -10.963293075561523, "global_step": 166350, "epoch": 990} {"train_loss": -11.101767539978027, "global_step": 166351, "epoch": 990} {"train_loss": -10.790897369384766, "global_step": 166352, "epoch": 990} {"train_loss": -11.306081771850586, "global_step": 166353, "epoch": 990} {"train_loss": -10.894529342651367, "global_step": 166354, "epoch": 990} {"train_loss": -11.145155906677246, "global_step": 166355, "epoch": 990} {"train_loss": -10.912036895751953, "global_step": 166356, "epoch": 990} {"train_loss": -10.804819107055664, "global_step": 166357, "epoch": 990} {"train_loss": -10.907903671264648, "global_step": 166358, "epoch": 990} {"train_loss": -11.228111267089844, "global_step": 166359, "epoch": 990} {"train_loss": -10.99402141571045, "global_step": 166360, "epoch": 990} {"train_loss": -11.241311073303223, "global_step": 166361, "epoch": 990} {"train_loss": -11.009639739990234, "global_step": 166362, "epoch": 990} {"train_loss": -11.259949684143066, "global_step": 166363, "epoch": 990} {"train_loss": -11.000597953796387, "global_step": 166364, "epoch": 990} {"train_loss": -11.273571014404297, "global_step": 166365, "epoch": 990} {"train_loss": -11.164127349853516, "global_step": 166366, "epoch": 990} {"train_loss": -11.17894458770752, "global_step": 166367, "epoch": 990} {"train_loss": -11.347702980041504, "global_step": 166368, "epoch": 990} {"train_loss": -11.301782608032227, "global_step": 166369, "epoch": 990} {"train_loss": -11.10078239440918, "global_step": 166370, "epoch": 990} {"train_loss": -11.095230102539062, "global_step": 166371, "epoch": 990} {"train_loss": -11.019761085510254, "global_step": 166372, "epoch": 990} {"train_loss": -11.12109088897705, "global_step": 166373, "epoch": 990} {"train_loss": -10.963114738464355, "global_step": 166374, "epoch": 990} {"train_loss": -11.118581771850586, "global_step": 166375, "epoch": 990} {"train_loss": -11.180061340332031, "global_step": 166376, "epoch": 990} {"train_loss": -11.247718811035156, "global_step": 166377, "epoch": 990} {"train_loss": -11.13726806640625, "global_step": 166378, "epoch": 990} {"train_loss": -10.549968719482422, "global_step": 166379, "epoch": 990} {"train_loss": -11.232746124267578, "global_step": 166380, "epoch": 990} {"train_loss": -11.158514022827148, "global_step": 166381, "epoch": 990} {"train_loss": -11.007912635803223, "global_step": 166382, "epoch": 990} {"train_loss": -11.118646621704102, "global_step": 166383, "epoch": 990} {"train_loss": -11.215347290039062, "global_step": 166384, "epoch": 990} {"train_loss": -11.391731262207031, "global_step": 166385, "epoch": 990} {"train_loss": -11.384419441223145, "global_step": 166386, "epoch": 990} {"train_loss": -11.041728973388672, "global_step": 166387, "epoch": 990} {"train_loss": -11.119926452636719, "global_step": 166388, "epoch": 990} {"train_loss": -11.043695449829102, "global_step": 166389, "epoch": 990} {"train_loss": -10.793166160583496, "global_step": 166390, "epoch": 990} {"train_loss": -10.990686416625977, "global_step": 166391, "epoch": 990} {"train_loss": -10.880731582641602, "global_step": 166392, "epoch": 990} {"train_loss": -11.220906257629395, "global_step": 166393, "epoch": 990} {"train_loss": -10.573461532592773, "global_step": 166394, "epoch": 990} {"train_loss": -11.210834503173828, "global_step": 166395, "epoch": 990} {"train_loss": -10.683786392211914, "global_step": 166396, "epoch": 990} {"train_loss": -10.451973915100098, "global_step": 166397, "epoch": 990} {"train_loss": -11.154523849487305, "global_step": 166398, "epoch": 990} {"train_loss": -10.91808032989502, "global_step": 166399, "epoch": 990} {"train_loss": -10.583812713623047, "global_step": 166400, "epoch": 990} {"train_loss": -10.555037498474121, "global_step": 166401, "epoch": 990} {"train_loss": -10.77542781829834, "global_step": 166402, "epoch": 990} {"train_loss": -11.11492919921875, "global_step": 166403, "epoch": 990} {"train_loss": -10.345331192016602, "global_step": 166404, "epoch": 990} {"train_loss": -11.055253982543945, "global_step": 166405, "epoch": 990} {"train_loss": -10.612960815429688, "global_step": 166406, "epoch": 990} {"train_loss": -10.900121688842773, "global_step": 166407, "epoch": 990} {"train_loss": -10.644376754760742, "global_step": 166408, "epoch": 990} {"train_loss": -10.663729667663574, "global_step": 166409, "epoch": 990} {"train_loss": -10.695281982421875, "global_step": 166410, "epoch": 990} {"train_loss": -10.087169647216797, "global_step": 166411, "epoch": 990} {"train_loss": -10.094114303588867, "global_step": 166412, "epoch": 990} {"train_loss": -10.529664039611816, "global_step": 166413, "epoch": 990} {"train_loss": -9.33515453338623, "global_step": 166414, "epoch": 990} {"train_loss": -10.601545333862305, "global_step": 166415, "epoch": 990} {"train_loss": -10.016595840454102, "global_step": 166416, "epoch": 990} {"train_loss": -9.731781005859375, "global_step": 166417, "epoch": 990} {"train_loss": -10.432056427001953, "global_step": 166418, "epoch": 990} {"train_loss": -10.040842056274414, "global_step": 166419, "epoch": 990} {"train_loss": -10.046248435974121, "global_step": 166420, "epoch": 990} {"train_loss": -10.127164840698242, "global_step": 166421, "epoch": 990} {"train_loss": -10.017274856567383, "global_step": 166422, "epoch": 990} {"train_loss": -10.573844909667969, "global_step": 166423, "epoch": 990} {"train_loss": -10.118335723876953, "global_step": 166424, "epoch": 990} {"train_loss": -10.21615982055664, "global_step": 166425, "epoch": 990} {"train_loss": -10.314237594604492, "global_step": 166426, "epoch": 990} {"train_loss": -10.423799514770508, "global_step": 166427, "epoch": 990} {"train_loss": -10.51312255859375, "global_step": 166428, "epoch": 990} {"train_loss": -10.531113624572754, "global_step": 166429, "epoch": 990} {"train_loss": -10.351622581481934, "global_step": 166430, "epoch": 990} {"train_loss": -10.977699279785156, "global_step": 166431, "epoch": 990} {"train_loss": -10.427889823913574, "global_step": 166432, "epoch": 990} {"train_loss": -10.643179893493652, "global_step": 166433, "epoch": 990} {"train_loss": -10.865701675415039, "global_step": 166434, "epoch": 990} {"train_loss": -10.479940414428711, "global_step": 166435, "epoch": 990} {"train_loss": -10.842352867126465, "global_step": 166436, "epoch": 990} {"train_loss": -10.597314834594727, "global_step": 166437, "epoch": 990} {"train_loss": -10.76611614227295, "global_step": 166438, "epoch": 990} {"train_loss": -10.802196502685547, "global_step": 166439, "epoch": 990} {"train_loss": -10.812880516052246, "global_step": 166440, "epoch": 990} {"train_loss": -10.859384536743164, "global_step": 166441, "epoch": 990} {"train_loss": -10.81090259552002, "global_step": 166442, "epoch": 990} {"train_loss": -10.902936935424805, "global_step": 166443, "epoch": 990} {"train_loss": -10.827926635742188, "global_step": 166444, "epoch": 990} {"train_loss": -10.924575805664062, "global_step": 166445, "epoch": 990} {"train_loss": -10.763642311096191, "global_step": 166446, "epoch": 990} {"train_loss": -10.993444442749023, "global_step": 166447, "epoch": 990} {"train_loss": -10.830389022827148, "global_step": 166448, "epoch": 990} {"train_loss": -10.955850601196289, "global_step": 166449, "epoch": 990} {"train_loss": -10.972127914428711, "global_step": 166450, "epoch": 990} {"train_loss": -10.930571556091309, "global_step": 166451, "epoch": 990} {"train_loss": -10.77795696258545, "global_step": 166452, "epoch": 990} {"train_loss": -11.071060180664062, "global_step": 166453, "epoch": 990} {"train_loss": -11.156225204467773, "global_step": 166454, "epoch": 990} {"train_loss": -11.043464660644531, "global_step": 166455, "epoch": 990} {"train_loss": -10.939050674438477, "global_step": 166456, "epoch": 990} {"train_loss": -11.055599212646484, "global_step": 166457, "epoch": 990} {"train_loss": -11.09988784790039, "global_step": 166458, "epoch": 990} {"train_loss": -10.975089073181152, "global_step": 166459, "epoch": 990} {"train_loss": -11.123737335205078, "global_step": 166460, "epoch": 990} {"train_loss": -10.998878479003906, "global_step": 166461, "epoch": 990} {"train_loss": -11.37322998046875, "global_step": 166462, "epoch": 990} {"train_loss": -11.02385139465332, "global_step": 166463, "epoch": 990} {"train_loss": -11.107540130615234, "global_step": 166464, "epoch": 990} {"train_loss": -11.073917388916016, "global_step": 166465, "epoch": 990} {"train_loss": -11.154024124145508, "global_step": 166466, "epoch": 990} {"train_loss": -10.92403793334961, "global_step": 166467, "epoch": 990} {"train_loss": -11.206066131591797, "global_step": 166468, "epoch": 990} {"train_loss": -11.060234069824219, "global_step": 166469, "epoch": 990} {"train_loss": -11.160252571105957, "global_step": 166470, "epoch": 990} {"train_loss": -11.114627838134766, "global_step": 166471, "epoch": 990} {"train_loss": -11.016944885253906, "global_step": 166472, "epoch": 990} {"train_loss": -11.297324180603027, "global_step": 166473, "epoch": 990} {"train_loss": -11.319640159606934, "global_step": 166474, "epoch": 990} {"train_loss": -11.2410306930542, "global_step": 166475, "epoch": 990} {"train_loss": -10.86176872253418, "global_step": 166476, "epoch": 990} {"train_loss": -11.030816078186035, "global_step": 166477, "epoch": 990} {"train_loss": -11.085723876953125, "global_step": 166478, "epoch": 990} {"train_loss": -11.011877059936523, "global_step": 166479, "epoch": 990} {"train_loss": -11.129955291748047, "global_step": 166480, "epoch": 990} {"train_loss": -11.168445587158203, "global_step": 166481, "epoch": 990} {"train_loss": -10.578620910644531, "global_step": 166482, "epoch": 990} {"train_loss": -11.19729232788086, "global_step": 166483, "epoch": 990} {"train_loss": -11.105415344238281, "global_step": 166484, "epoch": 990} {"train_loss": -10.404889106750488, "global_step": 166485, "epoch": 990} {"train_loss": -10.943004608154297, "global_step": 166486, "epoch": 990} {"train_loss": -10.830380468141465, "global_step": 166487, "epoch": 990, "val_loss": 241397.75, "train_action_mse_error": 3.514577865600586} {"train_loss": -10.775543212890625, "global_step": 166488, "epoch": 991} {"train_loss": -11.068009376525879, "global_step": 166489, "epoch": 991} {"train_loss": -11.181629180908203, "global_step": 166490, "epoch": 991} {"train_loss": -9.98422622680664, "global_step": 166491, "epoch": 991} {"train_loss": -11.09555721282959, "global_step": 166492, "epoch": 991} {"train_loss": -10.411508560180664, "global_step": 166493, "epoch": 991} {"train_loss": -9.922628402709961, "global_step": 166494, "epoch": 991} {"train_loss": -10.98161506652832, "global_step": 166495, "epoch": 991} {"train_loss": -10.281982421875, "global_step": 166496, "epoch": 991} {"train_loss": -11.146171569824219, "global_step": 166497, "epoch": 991} {"train_loss": -10.504573822021484, "global_step": 166498, "epoch": 991} {"train_loss": -11.032882690429688, "global_step": 166499, "epoch": 991} {"train_loss": -10.795615196228027, "global_step": 166500, "epoch": 991} {"train_loss": -10.752456665039062, "global_step": 166501, "epoch": 991} {"train_loss": -11.034454345703125, "global_step": 166502, "epoch": 991} {"train_loss": -10.677515983581543, "global_step": 166503, "epoch": 991} {"train_loss": -11.082784652709961, "global_step": 166504, "epoch": 991} {"train_loss": -10.288789749145508, "global_step": 166505, "epoch": 991} {"train_loss": -10.826242446899414, "global_step": 166506, "epoch": 991} {"train_loss": -10.877229690551758, "global_step": 166507, "epoch": 991} {"train_loss": -11.072465896606445, "global_step": 166508, "epoch": 991} {"train_loss": -11.020586013793945, "global_step": 166509, "epoch": 991} {"train_loss": -10.849992752075195, "global_step": 166510, "epoch": 991} {"train_loss": -11.073701858520508, "global_step": 166511, "epoch": 991} {"train_loss": -10.59554672241211, "global_step": 166512, "epoch": 991} {"train_loss": -10.861161231994629, "global_step": 166513, "epoch": 991} {"train_loss": -10.746170043945312, "global_step": 166514, "epoch": 991} {"train_loss": -10.433804512023926, "global_step": 166515, "epoch": 991} {"train_loss": -10.896761894226074, "global_step": 166516, "epoch": 991} {"train_loss": -10.49020004272461, "global_step": 166517, "epoch": 991} {"train_loss": -10.969106674194336, "global_step": 166518, "epoch": 991} {"train_loss": -10.561187744140625, "global_step": 166519, "epoch": 991} {"train_loss": -11.022419929504395, "global_step": 166520, "epoch": 991} {"train_loss": -10.777219772338867, "global_step": 166521, "epoch": 991} {"train_loss": -10.546860694885254, "global_step": 166522, "epoch": 991} {"train_loss": -11.052536010742188, "global_step": 166523, "epoch": 991} {"train_loss": -10.620451927185059, "global_step": 166524, "epoch": 991} {"train_loss": -10.78515338897705, "global_step": 166525, "epoch": 991} {"train_loss": -10.53940486907959, "global_step": 166526, "epoch": 991} {"train_loss": -10.980627059936523, "global_step": 166527, "epoch": 991} {"train_loss": -10.556573867797852, "global_step": 166528, "epoch": 991} {"train_loss": -10.880938529968262, "global_step": 166529, "epoch": 991} {"train_loss": -10.747138977050781, "global_step": 166530, "epoch": 991} {"train_loss": -11.063779830932617, "global_step": 166531, "epoch": 991} {"train_loss": -10.527534484863281, "global_step": 166532, "epoch": 991} {"train_loss": -11.101829528808594, "global_step": 166533, "epoch": 991} {"train_loss": -10.298978805541992, "global_step": 166534, "epoch": 991} {"train_loss": -11.065673828125, "global_step": 166535, "epoch": 991} {"train_loss": -10.280240058898926, "global_step": 166536, "epoch": 991} {"train_loss": -10.90821647644043, "global_step": 166537, "epoch": 991} {"train_loss": -10.232906341552734, "global_step": 166538, "epoch": 991} {"train_loss": -10.980138778686523, "global_step": 166539, "epoch": 991} {"train_loss": -10.765132904052734, "global_step": 166540, "epoch": 991} {"train_loss": -10.54500675201416, "global_step": 166541, "epoch": 991} {"train_loss": -10.720783233642578, "global_step": 166542, "epoch": 991} {"train_loss": -10.566539764404297, "global_step": 166543, "epoch": 991} {"train_loss": -10.955445289611816, "global_step": 166544, "epoch": 991} {"train_loss": -10.52204704284668, "global_step": 166545, "epoch": 991} {"train_loss": -10.950376510620117, "global_step": 166546, "epoch": 991} {"train_loss": -10.651849746704102, "global_step": 166547, "epoch": 991} {"train_loss": -10.69384765625, "global_step": 166548, "epoch": 991} {"train_loss": -10.862035751342773, "global_step": 166549, "epoch": 991} {"train_loss": -10.601494789123535, "global_step": 166550, "epoch": 991} {"train_loss": -11.168008804321289, "global_step": 166551, "epoch": 991} {"train_loss": -10.850005149841309, "global_step": 166552, "epoch": 991} {"train_loss": -10.943233489990234, "global_step": 166553, "epoch": 991} {"train_loss": -10.701517105102539, "global_step": 166554, "epoch": 991} {"train_loss": -10.851186752319336, "global_step": 166555, "epoch": 991} {"train_loss": -10.648406028747559, "global_step": 166556, "epoch": 991} {"train_loss": -10.884220123291016, "global_step": 166557, "epoch": 991} {"train_loss": -10.708884239196777, "global_step": 166558, "epoch": 991} {"train_loss": -10.819068908691406, "global_step": 166559, "epoch": 991} {"train_loss": -11.037734031677246, "global_step": 166560, "epoch": 991} {"train_loss": -11.06838607788086, "global_step": 166561, "epoch": 991} {"train_loss": -10.846712112426758, "global_step": 166562, "epoch": 991} {"train_loss": -10.78095817565918, "global_step": 166563, "epoch": 991} {"train_loss": -11.040544509887695, "global_step": 166564, "epoch": 991} {"train_loss": -10.981717109680176, "global_step": 166565, "epoch": 991} {"train_loss": -10.93548583984375, "global_step": 166566, "epoch": 991} {"train_loss": -11.203845977783203, "global_step": 166567, "epoch": 991} {"train_loss": -10.957958221435547, "global_step": 166568, "epoch": 991} {"train_loss": -11.079712867736816, "global_step": 166569, "epoch": 991} {"train_loss": -11.133811950683594, "global_step": 166570, "epoch": 991} {"train_loss": -10.933296203613281, "global_step": 166571, "epoch": 991} {"train_loss": -11.053777694702148, "global_step": 166572, "epoch": 991} {"train_loss": -10.896232604980469, "global_step": 166573, "epoch": 991} {"train_loss": -11.466110229492188, "global_step": 166574, "epoch": 991} {"train_loss": -11.036428451538086, "global_step": 166575, "epoch": 991} {"train_loss": -11.269240379333496, "global_step": 166576, "epoch": 991} {"train_loss": -11.130005836486816, "global_step": 166577, "epoch": 991} {"train_loss": -11.065698623657227, "global_step": 166578, "epoch": 991} {"train_loss": -11.31119155883789, "global_step": 166579, "epoch": 991} {"train_loss": -10.974327087402344, "global_step": 166580, "epoch": 991} {"train_loss": -11.329190254211426, "global_step": 166581, "epoch": 991} {"train_loss": -11.175997734069824, "global_step": 166582, "epoch": 991} {"train_loss": -11.371614456176758, "global_step": 166583, "epoch": 991} {"train_loss": -11.378541946411133, "global_step": 166584, "epoch": 991} {"train_loss": -11.406309127807617, "global_step": 166585, "epoch": 991} {"train_loss": -11.34490966796875, "global_step": 166586, "epoch": 991} {"train_loss": -11.174840927124023, "global_step": 166587, "epoch": 991} {"train_loss": -11.37310791015625, "global_step": 166588, "epoch": 991} {"train_loss": -11.184277534484863, "global_step": 166589, "epoch": 991} {"train_loss": -11.371895790100098, "global_step": 166590, "epoch": 991} {"train_loss": -11.307136535644531, "global_step": 166591, "epoch": 991} {"train_loss": -11.210763931274414, "global_step": 166592, "epoch": 991} {"train_loss": -10.937599182128906, "global_step": 166593, "epoch": 991} {"train_loss": -11.337833404541016, "global_step": 166594, "epoch": 991} {"train_loss": -11.26485824584961, "global_step": 166595, "epoch": 991} {"train_loss": -10.954233169555664, "global_step": 166596, "epoch": 991} {"train_loss": -11.293391227722168, "global_step": 166597, "epoch": 991} {"train_loss": -11.088740348815918, "global_step": 166598, "epoch": 991} {"train_loss": -10.457744598388672, "global_step": 166599, "epoch": 991} {"train_loss": -11.298260688781738, "global_step": 166600, "epoch": 991} {"train_loss": -11.111562728881836, "global_step": 166601, "epoch": 991} {"train_loss": -11.163717269897461, "global_step": 166602, "epoch": 991} {"train_loss": -10.449697494506836, "global_step": 166603, "epoch": 991} {"train_loss": -10.943391799926758, "global_step": 166604, "epoch": 991} {"train_loss": -10.736111640930176, "global_step": 166605, "epoch": 991} {"train_loss": -10.454444885253906, "global_step": 166606, "epoch": 991} {"train_loss": -10.610193252563477, "global_step": 166607, "epoch": 991} {"train_loss": -10.86662483215332, "global_step": 166608, "epoch": 991} {"train_loss": -10.67234992980957, "global_step": 166609, "epoch": 991} {"train_loss": -10.045100212097168, "global_step": 166610, "epoch": 991} {"train_loss": -10.801021575927734, "global_step": 166611, "epoch": 991} {"train_loss": -10.977906227111816, "global_step": 166612, "epoch": 991} {"train_loss": -10.244730949401855, "global_step": 166613, "epoch": 991} {"train_loss": -10.814535140991211, "global_step": 166614, "epoch": 991} {"train_loss": -10.710224151611328, "global_step": 166615, "epoch": 991} {"train_loss": -10.617427825927734, "global_step": 166616, "epoch": 991} {"train_loss": -11.052217483520508, "global_step": 166617, "epoch": 991} {"train_loss": -10.530755996704102, "global_step": 166618, "epoch": 991} {"train_loss": -10.51681137084961, "global_step": 166619, "epoch": 991} {"train_loss": -10.898637771606445, "global_step": 166620, "epoch": 991} {"train_loss": -10.599275588989258, "global_step": 166621, "epoch": 991} {"train_loss": -11.199336051940918, "global_step": 166622, "epoch": 991} {"train_loss": -10.456704139709473, "global_step": 166623, "epoch": 991} {"train_loss": -10.600969314575195, "global_step": 166624, "epoch": 991} {"train_loss": -10.902019500732422, "global_step": 166625, "epoch": 991} {"train_loss": -10.656295776367188, "global_step": 166626, "epoch": 991} {"train_loss": -10.87860107421875, "global_step": 166627, "epoch": 991} {"train_loss": -10.493587493896484, "global_step": 166628, "epoch": 991} {"train_loss": -10.969778060913086, "global_step": 166629, "epoch": 991} {"train_loss": -10.649214744567871, "global_step": 166630, "epoch": 991} {"train_loss": -10.550338745117188, "global_step": 166631, "epoch": 991} {"train_loss": -11.145008087158203, "global_step": 166632, "epoch": 991} {"train_loss": -10.989309310913086, "global_step": 166633, "epoch": 991} {"train_loss": -11.15744400024414, "global_step": 166634, "epoch": 991} {"train_loss": -10.850605010986328, "global_step": 166635, "epoch": 991} {"train_loss": -10.921360969543457, "global_step": 166636, "epoch": 991} {"train_loss": -11.052266120910645, "global_step": 166637, "epoch": 991} {"train_loss": -11.055009841918945, "global_step": 166638, "epoch": 991} {"train_loss": -11.054952621459961, "global_step": 166639, "epoch": 991} {"train_loss": -10.973733901977539, "global_step": 166640, "epoch": 991} {"train_loss": -11.055171012878418, "global_step": 166641, "epoch": 991} {"train_loss": -10.899706840515137, "global_step": 166642, "epoch": 991} {"train_loss": -10.865432739257812, "global_step": 166643, "epoch": 991} {"train_loss": -11.080656051635742, "global_step": 166644, "epoch": 991} {"train_loss": -10.940238952636719, "global_step": 166645, "epoch": 991} {"train_loss": -10.949435234069824, "global_step": 166646, "epoch": 991} {"train_loss": -11.229928970336914, "global_step": 166647, "epoch": 991} {"train_loss": -11.106916427612305, "global_step": 166648, "epoch": 991} {"train_loss": -11.29140853881836, "global_step": 166649, "epoch": 991} {"train_loss": -11.044745445251465, "global_step": 166650, "epoch": 991} {"train_loss": -11.149473190307617, "global_step": 166651, "epoch": 991} {"train_loss": -11.274274826049805, "global_step": 166652, "epoch": 991} {"train_loss": -11.199625015258789, "global_step": 166653, "epoch": 991} {"train_loss": -11.313642501831055, "global_step": 166654, "epoch": 991} {"train_loss": -10.887435385159083, "global_step": 166655, "epoch": 991, "val_loss": 238458.40625} {"train_loss": -11.202853202819824, "global_step": 166656, "epoch": 992} {"train_loss": -11.175262451171875, "global_step": 166657, "epoch": 992} {"train_loss": -11.299663543701172, "global_step": 166658, "epoch": 992} {"train_loss": -11.424919128417969, "global_step": 166659, "epoch": 992} {"train_loss": -11.117040634155273, "global_step": 166660, "epoch": 992} {"train_loss": -11.113973617553711, "global_step": 166661, "epoch": 992} {"train_loss": -11.17831802368164, "global_step": 166662, "epoch": 992} {"train_loss": -11.25094985961914, "global_step": 166663, "epoch": 992} {"train_loss": -11.242271423339844, "global_step": 166664, "epoch": 992} {"train_loss": -11.215991020202637, "global_step": 166665, "epoch": 992} {"train_loss": -11.204299926757812, "global_step": 166666, "epoch": 992} {"train_loss": -11.376065254211426, "global_step": 166667, "epoch": 992} {"train_loss": -11.294212341308594, "global_step": 166668, "epoch": 992} {"train_loss": -11.424982070922852, "global_step": 166669, "epoch": 992} {"train_loss": -11.18877124786377, "global_step": 166670, "epoch": 992} {"train_loss": -11.145395278930664, "global_step": 166671, "epoch": 992} {"train_loss": -11.161643981933594, "global_step": 166672, "epoch": 992} {"train_loss": -10.97215461730957, "global_step": 166673, "epoch": 992} {"train_loss": -10.538347244262695, "global_step": 166674, "epoch": 992} {"train_loss": -11.014204025268555, "global_step": 166675, "epoch": 992} {"train_loss": -10.972383499145508, "global_step": 166676, "epoch": 992} {"train_loss": -10.084412574768066, "global_step": 166677, "epoch": 992} {"train_loss": -10.948744773864746, "global_step": 166678, "epoch": 992} {"train_loss": -11.08621597290039, "global_step": 166679, "epoch": 992} {"train_loss": -10.368736267089844, "global_step": 166680, "epoch": 992} {"train_loss": -10.673895835876465, "global_step": 166681, "epoch": 992} {"train_loss": -10.604499816894531, "global_step": 166682, "epoch": 992} {"train_loss": -10.22374153137207, "global_step": 166683, "epoch": 992} {"train_loss": -10.37051010131836, "global_step": 166684, "epoch": 992} {"train_loss": -10.819231033325195, "global_step": 166685, "epoch": 992} {"train_loss": -10.0881929397583, "global_step": 166686, "epoch": 992} {"train_loss": -10.778185844421387, "global_step": 166687, "epoch": 992} {"train_loss": -10.479378700256348, "global_step": 166688, "epoch": 992} {"train_loss": -10.906233787536621, "global_step": 166689, "epoch": 992} {"train_loss": -10.910892486572266, "global_step": 166690, "epoch": 992} {"train_loss": -10.638486862182617, "global_step": 166691, "epoch": 992} {"train_loss": -11.129165649414062, "global_step": 166692, "epoch": 992} {"train_loss": -10.728153228759766, "global_step": 166693, "epoch": 992} {"train_loss": -10.658792495727539, "global_step": 166694, "epoch": 992} {"train_loss": -10.986978530883789, "global_step": 166695, "epoch": 992} {"train_loss": -10.770490646362305, "global_step": 166696, "epoch": 992} {"train_loss": -10.541971206665039, "global_step": 166697, "epoch": 992} {"train_loss": -10.578585624694824, "global_step": 166698, "epoch": 992} {"train_loss": -10.97973346710205, "global_step": 166699, "epoch": 992} {"train_loss": -10.631521224975586, "global_step": 166700, "epoch": 992} {"train_loss": -11.06347942352295, "global_step": 166701, "epoch": 992} {"train_loss": -10.86448860168457, "global_step": 166702, "epoch": 992} {"train_loss": -10.797304153442383, "global_step": 166703, "epoch": 992} {"train_loss": -10.994710922241211, "global_step": 166704, "epoch": 992} {"train_loss": -10.705394744873047, "global_step": 166705, "epoch": 992} {"train_loss": -10.813359260559082, "global_step": 166706, "epoch": 992} {"train_loss": -10.82559585571289, "global_step": 166707, "epoch": 992} {"train_loss": -11.01060676574707, "global_step": 166708, "epoch": 992} {"train_loss": -10.654237747192383, "global_step": 166709, "epoch": 992} {"train_loss": -10.950782775878906, "global_step": 166710, "epoch": 992} {"train_loss": -10.919885635375977, "global_step": 166711, "epoch": 992} {"train_loss": -10.918371200561523, "global_step": 166712, "epoch": 992} {"train_loss": -11.222654342651367, "global_step": 166713, "epoch": 992} {"train_loss": -11.175556182861328, "global_step": 166714, "epoch": 992} {"train_loss": -10.9091796875, "global_step": 166715, "epoch": 992} {"train_loss": -11.092596054077148, "global_step": 166716, "epoch": 992} {"train_loss": -11.040494918823242, "global_step": 166717, "epoch": 992} {"train_loss": -11.059209823608398, "global_step": 166718, "epoch": 992} {"train_loss": -10.993179321289062, "global_step": 166719, "epoch": 992} {"train_loss": -10.917637825012207, "global_step": 166720, "epoch": 992} {"train_loss": -11.030939102172852, "global_step": 166721, "epoch": 992} {"train_loss": -11.151044845581055, "global_step": 166722, "epoch": 992} {"train_loss": -10.731889724731445, "global_step": 166723, "epoch": 992} {"train_loss": -11.230777740478516, "global_step": 166724, "epoch": 992} {"train_loss": -11.163926124572754, "global_step": 166725, "epoch": 992} {"train_loss": -11.43467903137207, "global_step": 166726, "epoch": 992} {"train_loss": -11.294233322143555, "global_step": 166727, "epoch": 992} {"train_loss": -11.409050941467285, "global_step": 166728, "epoch": 992} {"train_loss": -11.22656536102295, "global_step": 166729, "epoch": 992} {"train_loss": -11.356094360351562, "global_step": 166730, "epoch": 992} {"train_loss": -11.2483491897583, "global_step": 166731, "epoch": 992} {"train_loss": -11.077085494995117, "global_step": 166732, "epoch": 992} {"train_loss": -11.349081993103027, "global_step": 166733, "epoch": 992} {"train_loss": -11.16122055053711, "global_step": 166734, "epoch": 992} {"train_loss": -11.247027397155762, "global_step": 166735, "epoch": 992} {"train_loss": -11.324134826660156, "global_step": 166736, "epoch": 992} {"train_loss": -11.143739700317383, "global_step": 166737, "epoch": 992} {"train_loss": -10.821621894836426, "global_step": 166738, "epoch": 992} {"train_loss": -11.256134986877441, "global_step": 166739, "epoch": 992} {"train_loss": -11.058280944824219, "global_step": 166740, "epoch": 992} {"train_loss": -11.281519889831543, "global_step": 166741, "epoch": 992} {"train_loss": -11.246708869934082, "global_step": 166742, "epoch": 992} {"train_loss": -11.005163192749023, "global_step": 166743, "epoch": 992} {"train_loss": -10.94690227508545, "global_step": 166744, "epoch": 992} {"train_loss": -10.81714916229248, "global_step": 166745, "epoch": 992} {"train_loss": -11.340706825256348, "global_step": 166746, "epoch": 992} {"train_loss": -11.242347717285156, "global_step": 166747, "epoch": 992} {"train_loss": -11.017475128173828, "global_step": 166748, "epoch": 992} {"train_loss": -11.380390167236328, "global_step": 166749, "epoch": 992} {"train_loss": -10.851871490478516, "global_step": 166750, "epoch": 992} {"train_loss": -10.80972957611084, "global_step": 166751, "epoch": 992} {"train_loss": -10.969019889831543, "global_step": 166752, "epoch": 992} {"train_loss": -11.136432647705078, "global_step": 166753, "epoch": 992} {"train_loss": -11.133197784423828, "global_step": 166754, "epoch": 992} {"train_loss": -11.064949035644531, "global_step": 166755, "epoch": 992} {"train_loss": -11.372320175170898, "global_step": 166756, "epoch": 992} {"train_loss": -10.708499908447266, "global_step": 166757, "epoch": 992} {"train_loss": -11.307843208312988, "global_step": 166758, "epoch": 992} {"train_loss": -11.172196388244629, "global_step": 166759, "epoch": 992} {"train_loss": -10.830755233764648, "global_step": 166760, "epoch": 992} {"train_loss": -11.051660537719727, "global_step": 166761, "epoch": 992} {"train_loss": -10.809078216552734, "global_step": 166762, "epoch": 992} {"train_loss": -10.602350234985352, "global_step": 166763, "epoch": 992} {"train_loss": -10.758995056152344, "global_step": 166764, "epoch": 992} {"train_loss": -10.772062301635742, "global_step": 166765, "epoch": 992} {"train_loss": -9.820198059082031, "global_step": 166766, "epoch": 992} {"train_loss": -11.059507369995117, "global_step": 166767, "epoch": 992} {"train_loss": -9.841508865356445, "global_step": 166768, "epoch": 992} {"train_loss": -10.953250885009766, "global_step": 166769, "epoch": 992} {"train_loss": -10.273212432861328, "global_step": 166770, "epoch": 992} {"train_loss": -10.229658126831055, "global_step": 166771, "epoch": 992} {"train_loss": -10.432653427124023, "global_step": 166772, "epoch": 992} {"train_loss": -10.339138984680176, "global_step": 166773, "epoch": 992} {"train_loss": -10.683279037475586, "global_step": 166774, "epoch": 992} {"train_loss": -10.338327407836914, "global_step": 166775, "epoch": 992} {"train_loss": -10.481460571289062, "global_step": 166776, "epoch": 992} {"train_loss": -10.548188209533691, "global_step": 166777, "epoch": 992} {"train_loss": -10.700109481811523, "global_step": 166778, "epoch": 992} {"train_loss": -10.554084777832031, "global_step": 166779, "epoch": 992} {"train_loss": -10.702898979187012, "global_step": 166780, "epoch": 992} {"train_loss": -10.411101341247559, "global_step": 166781, "epoch": 992} {"train_loss": -10.627437591552734, "global_step": 166782, "epoch": 992} {"train_loss": -9.875995635986328, "global_step": 166783, "epoch": 992} {"train_loss": -10.807318687438965, "global_step": 166784, "epoch": 992} {"train_loss": -10.001840591430664, "global_step": 166785, "epoch": 992} {"train_loss": -10.775032997131348, "global_step": 166786, "epoch": 992} {"train_loss": -10.558660507202148, "global_step": 166787, "epoch": 992} {"train_loss": -10.718330383300781, "global_step": 166788, "epoch": 992} {"train_loss": -10.944633483886719, "global_step": 166789, "epoch": 992} {"train_loss": -10.76115608215332, "global_step": 166790, "epoch": 992} {"train_loss": -11.025949478149414, "global_step": 166791, "epoch": 992} {"train_loss": -10.463651657104492, "global_step": 166792, "epoch": 992} {"train_loss": -10.797515869140625, "global_step": 166793, "epoch": 992} {"train_loss": -10.723098754882812, "global_step": 166794, "epoch": 992} {"train_loss": -10.866388320922852, "global_step": 166795, "epoch": 992} {"train_loss": -10.619962692260742, "global_step": 166796, "epoch": 992} {"train_loss": -10.641764640808105, "global_step": 166797, "epoch": 992} {"train_loss": -10.579687118530273, "global_step": 166798, "epoch": 992} {"train_loss": -10.954413414001465, "global_step": 166799, "epoch": 992} {"train_loss": -10.212899208068848, "global_step": 166800, "epoch": 992} {"train_loss": -11.027427673339844, "global_step": 166801, "epoch": 992} {"train_loss": -10.721818923950195, "global_step": 166802, "epoch": 992} {"train_loss": -10.831687927246094, "global_step": 166803, "epoch": 992} {"train_loss": -10.934328079223633, "global_step": 166804, "epoch": 992} {"train_loss": -10.947126388549805, "global_step": 166805, "epoch": 992} {"train_loss": -11.001157760620117, "global_step": 166806, "epoch": 992} {"train_loss": -10.950565338134766, "global_step": 166807, "epoch": 992} {"train_loss": -10.726582527160645, "global_step": 166808, "epoch": 992} {"train_loss": -10.915901184082031, "global_step": 166809, "epoch": 992} {"train_loss": -10.952796936035156, "global_step": 166810, "epoch": 992} {"train_loss": -10.886970520019531, "global_step": 166811, "epoch": 992} {"train_loss": -10.932480812072754, "global_step": 166812, "epoch": 992} {"train_loss": -10.799112319946289, "global_step": 166813, "epoch": 992} {"train_loss": -11.039692878723145, "global_step": 166814, "epoch": 992} {"train_loss": -10.91658878326416, "global_step": 166815, "epoch": 992} {"train_loss": -10.848442077636719, "global_step": 166816, "epoch": 992} {"train_loss": -10.87725830078125, "global_step": 166817, "epoch": 992} {"train_loss": -11.128522872924805, "global_step": 166818, "epoch": 992} {"train_loss": -11.053135871887207, "global_step": 166819, "epoch": 992} {"train_loss": -10.9603271484375, "global_step": 166820, "epoch": 992} {"train_loss": -11.181913375854492, "global_step": 166821, "epoch": 992} {"train_loss": -11.188385963439941, "global_step": 166822, "epoch": 992} {"train_loss": -10.894366769563584, "global_step": 166823, "epoch": 992, "val_loss": 237754.046875} {"train_loss": -11.216592788696289, "global_step": 166824, "epoch": 993} {"train_loss": -11.255046844482422, "global_step": 166825, "epoch": 993} {"train_loss": -11.288860321044922, "global_step": 166826, "epoch": 993} {"train_loss": -11.422531127929688, "global_step": 166827, "epoch": 993} {"train_loss": -11.361577987670898, "global_step": 166828, "epoch": 993} {"train_loss": -11.182487487792969, "global_step": 166829, "epoch": 993} {"train_loss": -10.926700592041016, "global_step": 166830, "epoch": 993} {"train_loss": -11.277122497558594, "global_step": 166831, "epoch": 993} {"train_loss": -11.239973068237305, "global_step": 166832, "epoch": 993} {"train_loss": -11.12639045715332, "global_step": 166833, "epoch": 993} {"train_loss": -11.376842498779297, "global_step": 166834, "epoch": 993} {"train_loss": -11.153482437133789, "global_step": 166835, "epoch": 993} {"train_loss": -10.897527694702148, "global_step": 166836, "epoch": 993} {"train_loss": -11.29958724975586, "global_step": 166837, "epoch": 993} {"train_loss": -10.863053321838379, "global_step": 166838, "epoch": 993} {"train_loss": -10.946877479553223, "global_step": 166839, "epoch": 993} {"train_loss": -11.000337600708008, "global_step": 166840, "epoch": 993} {"train_loss": -10.880879402160645, "global_step": 166841, "epoch": 993} {"train_loss": -11.02930736541748, "global_step": 166842, "epoch": 993} {"train_loss": -11.080841064453125, "global_step": 166843, "epoch": 993} {"train_loss": -11.354825973510742, "global_step": 166844, "epoch": 993} {"train_loss": -11.194843292236328, "global_step": 166845, "epoch": 993} {"train_loss": -11.238519668579102, "global_step": 166846, "epoch": 993} {"train_loss": -11.337072372436523, "global_step": 166847, "epoch": 993} {"train_loss": -11.089177131652832, "global_step": 166848, "epoch": 993} {"train_loss": -11.515212059020996, "global_step": 166849, "epoch": 993} {"train_loss": -11.366146087646484, "global_step": 166850, "epoch": 993} {"train_loss": -11.26319694519043, "global_step": 166851, "epoch": 993} {"train_loss": -11.548555374145508, "global_step": 166852, "epoch": 993} {"train_loss": -11.371655464172363, "global_step": 166853, "epoch": 993} {"train_loss": -11.33146858215332, "global_step": 166854, "epoch": 993} {"train_loss": -11.261181831359863, "global_step": 166855, "epoch": 993} {"train_loss": -11.23990249633789, "global_step": 166856, "epoch": 993} {"train_loss": -11.565326690673828, "global_step": 166857, "epoch": 993} {"train_loss": -11.22264575958252, "global_step": 166858, "epoch": 993} {"train_loss": -11.130517959594727, "global_step": 166859, "epoch": 993} {"train_loss": -11.29348087310791, "global_step": 166860, "epoch": 993} {"train_loss": -10.666162490844727, "global_step": 166861, "epoch": 993} {"train_loss": -10.465405464172363, "global_step": 166862, "epoch": 993} {"train_loss": -10.890849113464355, "global_step": 166863, "epoch": 993} {"train_loss": -11.011903762817383, "global_step": 166864, "epoch": 993} {"train_loss": -11.236854553222656, "global_step": 166865, "epoch": 993} {"train_loss": -10.87010669708252, "global_step": 166866, "epoch": 993} {"train_loss": -11.349311828613281, "global_step": 166867, "epoch": 993} {"train_loss": -10.98039436340332, "global_step": 166868, "epoch": 993} {"train_loss": -10.722883224487305, "global_step": 166869, "epoch": 993} {"train_loss": -10.470626831054688, "global_step": 166870, "epoch": 993} {"train_loss": -11.141119003295898, "global_step": 166871, "epoch": 993} {"train_loss": -10.983240127563477, "global_step": 166872, "epoch": 993} {"train_loss": -11.126480102539062, "global_step": 166873, "epoch": 993} {"train_loss": -11.038034439086914, "global_step": 166874, "epoch": 993} {"train_loss": -10.790412902832031, "global_step": 166875, "epoch": 993} {"train_loss": -10.453088760375977, "global_step": 166876, "epoch": 993} {"train_loss": -11.28361988067627, "global_step": 166877, "epoch": 993} {"train_loss": -10.625228881835938, "global_step": 166878, "epoch": 993} {"train_loss": -10.787322998046875, "global_step": 166879, "epoch": 993} {"train_loss": -11.089208602905273, "global_step": 166880, "epoch": 993} {"train_loss": -10.998103141784668, "global_step": 166881, "epoch": 993} {"train_loss": -11.126453399658203, "global_step": 166882, "epoch": 993} {"train_loss": -11.290125846862793, "global_step": 166883, "epoch": 993} {"train_loss": -10.87015151977539, "global_step": 166884, "epoch": 993} {"train_loss": -11.227712631225586, "global_step": 166885, "epoch": 993} {"train_loss": -10.537215232849121, "global_step": 166886, "epoch": 993} {"train_loss": -10.988425254821777, "global_step": 166887, "epoch": 993} {"train_loss": -10.472757339477539, "global_step": 166888, "epoch": 993} {"train_loss": -11.03113079071045, "global_step": 166889, "epoch": 993} {"train_loss": -10.827826499938965, "global_step": 166890, "epoch": 993} {"train_loss": -10.311342239379883, "global_step": 166891, "epoch": 993} {"train_loss": -11.187749862670898, "global_step": 166892, "epoch": 993} {"train_loss": -10.676018714904785, "global_step": 166893, "epoch": 993} {"train_loss": -11.3924560546875, "global_step": 166894, "epoch": 993} {"train_loss": -10.639455795288086, "global_step": 166895, "epoch": 993} {"train_loss": -10.921342849731445, "global_step": 166896, "epoch": 993} {"train_loss": -11.05171012878418, "global_step": 166897, "epoch": 993} {"train_loss": -10.756948471069336, "global_step": 166898, "epoch": 993} {"train_loss": -11.315276145935059, "global_step": 166899, "epoch": 993} {"train_loss": -10.84019947052002, "global_step": 166900, "epoch": 993} {"train_loss": -11.10238265991211, "global_step": 166901, "epoch": 993} {"train_loss": -10.640852928161621, "global_step": 166902, "epoch": 993} {"train_loss": -11.011333465576172, "global_step": 166903, "epoch": 993} {"train_loss": -11.03780746459961, "global_step": 166904, "epoch": 993} {"train_loss": -10.853201866149902, "global_step": 166905, "epoch": 993} {"train_loss": -10.807718276977539, "global_step": 166906, "epoch": 993} {"train_loss": -10.770475387573242, "global_step": 166907, "epoch": 993} {"train_loss": -11.080167770385742, "global_step": 166908, "epoch": 993} {"train_loss": -10.544422149658203, "global_step": 166909, "epoch": 993} {"train_loss": -11.17060661315918, "global_step": 166910, "epoch": 993} {"train_loss": -10.640494346618652, "global_step": 166911, "epoch": 993} {"train_loss": -11.232095718383789, "global_step": 166912, "epoch": 993} {"train_loss": -11.211772918701172, "global_step": 166913, "epoch": 993} {"train_loss": -11.163839340209961, "global_step": 166914, "epoch": 993} {"train_loss": -11.358627319335938, "global_step": 166915, "epoch": 993} {"train_loss": -11.11830997467041, "global_step": 166916, "epoch": 993} {"train_loss": -11.295598983764648, "global_step": 166917, "epoch": 993} {"train_loss": -11.230710983276367, "global_step": 166918, "epoch": 993} {"train_loss": -11.184520721435547, "global_step": 166919, "epoch": 993} {"train_loss": -11.222513198852539, "global_step": 166920, "epoch": 993} {"train_loss": -11.254462242126465, "global_step": 166921, "epoch": 993} {"train_loss": -11.222097396850586, "global_step": 166922, "epoch": 993} {"train_loss": -11.185883522033691, "global_step": 166923, "epoch": 993} {"train_loss": -11.131673812866211, "global_step": 166924, "epoch": 993} {"train_loss": -10.871906280517578, "global_step": 166925, "epoch": 993} {"train_loss": -11.476720809936523, "global_step": 166926, "epoch": 993} {"train_loss": -11.237369537353516, "global_step": 166927, "epoch": 993} {"train_loss": -10.853310585021973, "global_step": 166928, "epoch": 993} {"train_loss": -10.731921195983887, "global_step": 166929, "epoch": 993} {"train_loss": -11.09626579284668, "global_step": 166930, "epoch": 993} {"train_loss": -10.697246551513672, "global_step": 166931, "epoch": 993} {"train_loss": -11.364566802978516, "global_step": 166932, "epoch": 993} {"train_loss": -10.854228019714355, "global_step": 166933, "epoch": 993} {"train_loss": -10.846701622009277, "global_step": 166934, "epoch": 993} {"train_loss": -10.680299758911133, "global_step": 166935, "epoch": 993} {"train_loss": -10.997013092041016, "global_step": 166936, "epoch": 993} {"train_loss": -11.249247550964355, "global_step": 166937, "epoch": 993} {"train_loss": -11.181347846984863, "global_step": 166938, "epoch": 993} {"train_loss": -10.8846435546875, "global_step": 166939, "epoch": 993} {"train_loss": -10.767973899841309, "global_step": 166940, "epoch": 993} {"train_loss": -11.080097198486328, "global_step": 166941, "epoch": 993} {"train_loss": -10.937305450439453, "global_step": 166942, "epoch": 993} {"train_loss": -11.209480285644531, "global_step": 166943, "epoch": 993} {"train_loss": -11.279253005981445, "global_step": 166944, "epoch": 993} {"train_loss": -11.048362731933594, "global_step": 166945, "epoch": 993} {"train_loss": -11.272150993347168, "global_step": 166946, "epoch": 993} {"train_loss": -11.351533889770508, "global_step": 166947, "epoch": 993} {"train_loss": -11.175739288330078, "global_step": 166948, "epoch": 993} {"train_loss": -11.269816398620605, "global_step": 166949, "epoch": 993} {"train_loss": -10.778181076049805, "global_step": 166950, "epoch": 993} {"train_loss": -10.57856559753418, "global_step": 166951, "epoch": 993} {"train_loss": -10.797097206115723, "global_step": 166952, "epoch": 993} {"train_loss": -10.662725448608398, "global_step": 166953, "epoch": 993} {"train_loss": -11.02845573425293, "global_step": 166954, "epoch": 993} {"train_loss": -10.539848327636719, "global_step": 166955, "epoch": 993} {"train_loss": -11.195924758911133, "global_step": 166956, "epoch": 993} {"train_loss": -10.1970853805542, "global_step": 166957, "epoch": 993} {"train_loss": -10.928810119628906, "global_step": 166958, "epoch": 993} {"train_loss": -10.751129150390625, "global_step": 166959, "epoch": 993} {"train_loss": -10.773141860961914, "global_step": 166960, "epoch": 993} {"train_loss": -10.593377113342285, "global_step": 166961, "epoch": 993} {"train_loss": -10.880298614501953, "global_step": 166962, "epoch": 993} {"train_loss": -11.165562629699707, "global_step": 166963, "epoch": 993} {"train_loss": -10.782203674316406, "global_step": 166964, "epoch": 993} {"train_loss": -10.782649040222168, "global_step": 166965, "epoch": 993} {"train_loss": -10.929232597351074, "global_step": 166966, "epoch": 993} {"train_loss": -10.910051345825195, "global_step": 166967, "epoch": 993} {"train_loss": -11.11944580078125, "global_step": 166968, "epoch": 993} {"train_loss": -10.676523208618164, "global_step": 166969, "epoch": 993} {"train_loss": -10.41464614868164, "global_step": 166970, "epoch": 993} {"train_loss": -10.377364158630371, "global_step": 166971, "epoch": 993} {"train_loss": -10.531996726989746, "global_step": 166972, "epoch": 993} {"train_loss": -10.66464614868164, "global_step": 166973, "epoch": 993} {"train_loss": -10.405486106872559, "global_step": 166974, "epoch": 993} {"train_loss": -10.744464874267578, "global_step": 166975, "epoch": 993} {"train_loss": -10.09908676147461, "global_step": 166976, "epoch": 993} {"train_loss": -10.584127426147461, "global_step": 166977, "epoch": 993} {"train_loss": -9.560354232788086, "global_step": 166978, "epoch": 993} {"train_loss": -10.43604564666748, "global_step": 166979, "epoch": 993} {"train_loss": -9.336481094360352, "global_step": 166980, "epoch": 993} {"train_loss": -9.695165634155273, "global_step": 166981, "epoch": 993} {"train_loss": -9.468783378601074, "global_step": 166982, "epoch": 993} {"train_loss": -10.213644027709961, "global_step": 166983, "epoch": 993} {"train_loss": -9.274728775024414, "global_step": 166984, "epoch": 993} {"train_loss": -10.647281646728516, "global_step": 166985, "epoch": 993} {"train_loss": -10.229037284851074, "global_step": 166986, "epoch": 993} {"train_loss": -10.192089080810547, "global_step": 166987, "epoch": 993} {"train_loss": -10.877331733703613, "global_step": 166988, "epoch": 993} {"train_loss": -10.210237503051758, "global_step": 166989, "epoch": 993} {"train_loss": -10.437281608581543, "global_step": 166990, "epoch": 993} {"train_loss": -10.919237290109907, "global_step": 166991, "epoch": 993, "val_loss": 234358.46875} {"train_loss": -10.382366180419922, "global_step": 166992, "epoch": 994} {"train_loss": -9.345259666442871, "global_step": 166993, "epoch": 994} {"train_loss": -10.971867561340332, "global_step": 166994, "epoch": 994} {"train_loss": -10.815164566040039, "global_step": 166995, "epoch": 994} {"train_loss": -10.217348098754883, "global_step": 166996, "epoch": 994} {"train_loss": -11.030189514160156, "global_step": 166997, "epoch": 994} {"train_loss": -10.786704063415527, "global_step": 166998, "epoch": 994} {"train_loss": -10.509245872497559, "global_step": 166999, "epoch": 994} {"train_loss": -11.059320449829102, "global_step": 167000, "epoch": 994} {"train_loss": -10.718040466308594, "global_step": 167001, "epoch": 994} {"train_loss": -10.841473579406738, "global_step": 167002, "epoch": 994} {"train_loss": -10.5458984375, "global_step": 167003, "epoch": 994} {"train_loss": -10.817428588867188, "global_step": 167004, "epoch": 994} {"train_loss": -10.689679145812988, "global_step": 167005, "epoch": 994} {"train_loss": -11.005777359008789, "global_step": 167006, "epoch": 994} {"train_loss": -11.029581069946289, "global_step": 167007, "epoch": 994} {"train_loss": -10.768808364868164, "global_step": 167008, "epoch": 994} {"train_loss": -11.047319412231445, "global_step": 167009, "epoch": 994} {"train_loss": -11.011548042297363, "global_step": 167010, "epoch": 994} {"train_loss": -11.016670227050781, "global_step": 167011, "epoch": 994} {"train_loss": -10.987894058227539, "global_step": 167012, "epoch": 994} {"train_loss": -11.10978889465332, "global_step": 167013, "epoch": 994} {"train_loss": -11.115710258483887, "global_step": 167014, "epoch": 994} {"train_loss": -11.178239822387695, "global_step": 167015, "epoch": 994} {"train_loss": -10.83753776550293, "global_step": 167016, "epoch": 994} {"train_loss": -11.252827644348145, "global_step": 167017, "epoch": 994} {"train_loss": -11.108301162719727, "global_step": 167018, "epoch": 994} {"train_loss": -11.160430908203125, "global_step": 167019, "epoch": 994} {"train_loss": -11.003800392150879, "global_step": 167020, "epoch": 994} {"train_loss": -11.149737358093262, "global_step": 167021, "epoch": 994} {"train_loss": -11.143869400024414, "global_step": 167022, "epoch": 994} {"train_loss": -11.153969764709473, "global_step": 167023, "epoch": 994} {"train_loss": -11.07528305053711, "global_step": 167024, "epoch": 994} {"train_loss": -10.95109748840332, "global_step": 167025, "epoch": 994} {"train_loss": -11.233415603637695, "global_step": 167026, "epoch": 994} {"train_loss": -11.192630767822266, "global_step": 167027, "epoch": 994} {"train_loss": -10.99853515625, "global_step": 167028, "epoch": 994} {"train_loss": -11.378710746765137, "global_step": 167029, "epoch": 994} {"train_loss": -11.080968856811523, "global_step": 167030, "epoch": 994} {"train_loss": -11.008234024047852, "global_step": 167031, "epoch": 994} {"train_loss": -10.884300231933594, "global_step": 167032, "epoch": 994} {"train_loss": -11.070907592773438, "global_step": 167033, "epoch": 994} {"train_loss": -11.250715255737305, "global_step": 167034, "epoch": 994} {"train_loss": -11.054032325744629, "global_step": 167035, "epoch": 994} {"train_loss": -11.241125106811523, "global_step": 167036, "epoch": 994} {"train_loss": -11.008203506469727, "global_step": 167037, "epoch": 994} {"train_loss": -11.121976852416992, "global_step": 167038, "epoch": 994} {"train_loss": -11.133062362670898, "global_step": 167039, "epoch": 994} {"train_loss": -11.012510299682617, "global_step": 167040, "epoch": 994} {"train_loss": -11.351726531982422, "global_step": 167041, "epoch": 994} {"train_loss": -11.035774230957031, "global_step": 167042, "epoch": 994} {"train_loss": -10.953495025634766, "global_step": 167043, "epoch": 994} {"train_loss": -11.434407234191895, "global_step": 167044, "epoch": 994} {"train_loss": -11.105138778686523, "global_step": 167045, "epoch": 994} {"train_loss": -11.06196403503418, "global_step": 167046, "epoch": 994} {"train_loss": -11.307098388671875, "global_step": 167047, "epoch": 994} {"train_loss": -11.211052894592285, "global_step": 167048, "epoch": 994} {"train_loss": -11.416510581970215, "global_step": 167049, "epoch": 994} {"train_loss": -11.546772956848145, "global_step": 167050, "epoch": 994} {"train_loss": -11.389389038085938, "global_step": 167051, "epoch": 994} {"train_loss": -11.518655776977539, "global_step": 167052, "epoch": 994} {"train_loss": -11.625555038452148, "global_step": 167053, "epoch": 994} {"train_loss": -11.454910278320312, "global_step": 167054, "epoch": 994} {"train_loss": -11.353723526000977, "global_step": 167055, "epoch": 994} {"train_loss": -11.259087562561035, "global_step": 167056, "epoch": 994} {"train_loss": -11.191783905029297, "global_step": 167057, "epoch": 994} {"train_loss": -11.265422821044922, "global_step": 167058, "epoch": 994} {"train_loss": -11.19340705871582, "global_step": 167059, "epoch": 994} {"train_loss": -11.030354499816895, "global_step": 167060, "epoch": 994} {"train_loss": -10.983882904052734, "global_step": 167061, "epoch": 994} {"train_loss": -11.10026741027832, "global_step": 167062, "epoch": 994} {"train_loss": -11.199316024780273, "global_step": 167063, "epoch": 994} {"train_loss": -11.173506736755371, "global_step": 167064, "epoch": 994} {"train_loss": -10.348894119262695, "global_step": 167065, "epoch": 994} {"train_loss": -10.336259841918945, "global_step": 167066, "epoch": 994} {"train_loss": -10.706474304199219, "global_step": 167067, "epoch": 994} {"train_loss": -11.216026306152344, "global_step": 167068, "epoch": 994} {"train_loss": -10.35503101348877, "global_step": 167069, "epoch": 994} {"train_loss": -9.890514373779297, "global_step": 167070, "epoch": 994} {"train_loss": -10.665599822998047, "global_step": 167071, "epoch": 994} {"train_loss": -10.55868911743164, "global_step": 167072, "epoch": 994} {"train_loss": -10.420265197753906, "global_step": 167073, "epoch": 994} {"train_loss": -10.986178398132324, "global_step": 167074, "epoch": 994} {"train_loss": -10.711483001708984, "global_step": 167075, "epoch": 994} {"train_loss": -10.395355224609375, "global_step": 167076, "epoch": 994} {"train_loss": -10.220791816711426, "global_step": 167077, "epoch": 994} {"train_loss": -9.359846115112305, "global_step": 167078, "epoch": 994} {"train_loss": -10.750003814697266, "global_step": 167079, "epoch": 994} {"train_loss": -9.359294891357422, "global_step": 167080, "epoch": 994} {"train_loss": -9.544280052185059, "global_step": 167081, "epoch": 994} {"train_loss": -10.65951156616211, "global_step": 167082, "epoch": 994} {"train_loss": -10.105098724365234, "global_step": 167083, "epoch": 994} {"train_loss": -9.99087905883789, "global_step": 167084, "epoch": 994} {"train_loss": -10.442831039428711, "global_step": 167085, "epoch": 994} {"train_loss": -9.384101867675781, "global_step": 167086, "epoch": 994} {"train_loss": -10.57293701171875, "global_step": 167087, "epoch": 994} {"train_loss": -9.74736499786377, "global_step": 167088, "epoch": 994} {"train_loss": -10.384868621826172, "global_step": 167089, "epoch": 994} {"train_loss": -10.772138595581055, "global_step": 167090, "epoch": 994} {"train_loss": -10.060321807861328, "global_step": 167091, "epoch": 994} {"train_loss": -10.296814918518066, "global_step": 167092, "epoch": 994} {"train_loss": -10.205857276916504, "global_step": 167093, "epoch": 994} {"train_loss": -9.688758850097656, "global_step": 167094, "epoch": 994} {"train_loss": -10.439123153686523, "global_step": 167095, "epoch": 994} {"train_loss": -10.391626358032227, "global_step": 167096, "epoch": 994} {"train_loss": -9.913084983825684, "global_step": 167097, "epoch": 994} {"train_loss": -10.508920669555664, "global_step": 167098, "epoch": 994} {"train_loss": -10.210186004638672, "global_step": 167099, "epoch": 994} {"train_loss": -10.821588516235352, "global_step": 167100, "epoch": 994} {"train_loss": -10.746932029724121, "global_step": 167101, "epoch": 994} {"train_loss": -10.502252578735352, "global_step": 167102, "epoch": 994} {"train_loss": -10.33796501159668, "global_step": 167103, "epoch": 994} {"train_loss": -10.65565013885498, "global_step": 167104, "epoch": 994} {"train_loss": -10.863259315490723, "global_step": 167105, "epoch": 994} {"train_loss": -10.193706512451172, "global_step": 167106, "epoch": 994} {"train_loss": -10.818784713745117, "global_step": 167107, "epoch": 994} {"train_loss": -10.648097038269043, "global_step": 167108, "epoch": 994} {"train_loss": -10.491543769836426, "global_step": 167109, "epoch": 994} {"train_loss": -10.682832717895508, "global_step": 167110, "epoch": 994} {"train_loss": -10.70888900756836, "global_step": 167111, "epoch": 994} {"train_loss": -10.72852897644043, "global_step": 167112, "epoch": 994} {"train_loss": -10.731643676757812, "global_step": 167113, "epoch": 994} {"train_loss": -10.999756813049316, "global_step": 167114, "epoch": 994} {"train_loss": -10.808597564697266, "global_step": 167115, "epoch": 994} {"train_loss": -10.686117172241211, "global_step": 167116, "epoch": 994} {"train_loss": -11.047921180725098, "global_step": 167117, "epoch": 994} {"train_loss": -10.89207935333252, "global_step": 167118, "epoch": 994} {"train_loss": -10.822062492370605, "global_step": 167119, "epoch": 994} {"train_loss": -11.0317964553833, "global_step": 167120, "epoch": 994} {"train_loss": -11.005141258239746, "global_step": 167121, "epoch": 994} {"train_loss": -11.035581588745117, "global_step": 167122, "epoch": 994} {"train_loss": -11.028251647949219, "global_step": 167123, "epoch": 994} {"train_loss": -10.976865768432617, "global_step": 167124, "epoch": 994} {"train_loss": -10.878366470336914, "global_step": 167125, "epoch": 994} {"train_loss": -11.094528198242188, "global_step": 167126, "epoch": 994} {"train_loss": -11.163498878479004, "global_step": 167127, "epoch": 994} {"train_loss": -11.239280700683594, "global_step": 167128, "epoch": 994} {"train_loss": -11.075255393981934, "global_step": 167129, "epoch": 994} {"train_loss": -11.068502426147461, "global_step": 167130, "epoch": 994} {"train_loss": -10.917155265808105, "global_step": 167131, "epoch": 994} {"train_loss": -11.317869186401367, "global_step": 167132, "epoch": 994} {"train_loss": -11.141690254211426, "global_step": 167133, "epoch": 994} {"train_loss": -11.156638145446777, "global_step": 167134, "epoch": 994} {"train_loss": -11.140176773071289, "global_step": 167135, "epoch": 994} {"train_loss": -11.349634170532227, "global_step": 167136, "epoch": 994} {"train_loss": -11.226651191711426, "global_step": 167137, "epoch": 994} {"train_loss": -11.085838317871094, "global_step": 167138, "epoch": 994} {"train_loss": -11.134239196777344, "global_step": 167139, "epoch": 994} {"train_loss": -11.193583488464355, "global_step": 167140, "epoch": 994} {"train_loss": -11.370853424072266, "global_step": 167141, "epoch": 994} {"train_loss": -11.194018363952637, "global_step": 167142, "epoch": 994} {"train_loss": -11.371442794799805, "global_step": 167143, "epoch": 994} {"train_loss": -11.161872863769531, "global_step": 167144, "epoch": 994} {"train_loss": -11.088927268981934, "global_step": 167145, "epoch": 994} {"train_loss": -10.9821138381958, "global_step": 167146, "epoch": 994} {"train_loss": -10.899803161621094, "global_step": 167147, "epoch": 994} {"train_loss": -11.372772216796875, "global_step": 167148, "epoch": 994} {"train_loss": -11.024927139282227, "global_step": 167149, "epoch": 994} {"train_loss": -10.74278450012207, "global_step": 167150, "epoch": 994} {"train_loss": -11.15433120727539, "global_step": 167151, "epoch": 994} {"train_loss": -11.126276969909668, "global_step": 167152, "epoch": 994} {"train_loss": -11.030989646911621, "global_step": 167153, "epoch": 994} {"train_loss": -11.087105751037598, "global_step": 167154, "epoch": 994} {"train_loss": -11.045751571655273, "global_step": 167155, "epoch": 994} {"train_loss": -11.444430351257324, "global_step": 167156, "epoch": 994} {"train_loss": -11.09425163269043, "global_step": 167157, "epoch": 994} {"train_loss": -11.423967361450195, "global_step": 167158, "epoch": 994} {"train_loss": -10.867050080072312, "global_step": 167159, "epoch": 994, "val_loss": 239099.84375} {"train_loss": -11.296398162841797, "global_step": 167160, "epoch": 995} {"train_loss": -10.76269817352295, "global_step": 167161, "epoch": 995} {"train_loss": -11.239044189453125, "global_step": 167162, "epoch": 995} {"train_loss": -11.241296768188477, "global_step": 167163, "epoch": 995} {"train_loss": -11.076763153076172, "global_step": 167164, "epoch": 995} {"train_loss": -10.988194465637207, "global_step": 167165, "epoch": 995} {"train_loss": -11.0204439163208, "global_step": 167166, "epoch": 995} {"train_loss": -11.189343452453613, "global_step": 167167, "epoch": 995} {"train_loss": -11.183177947998047, "global_step": 167168, "epoch": 995} {"train_loss": -10.39249038696289, "global_step": 167169, "epoch": 995} {"train_loss": -10.521279335021973, "global_step": 167170, "epoch": 995} {"train_loss": -10.299392700195312, "global_step": 167171, "epoch": 995} {"train_loss": -11.2608642578125, "global_step": 167172, "epoch": 995} {"train_loss": -10.787459373474121, "global_step": 167173, "epoch": 995} {"train_loss": -10.033391952514648, "global_step": 167174, "epoch": 995} {"train_loss": -10.170310974121094, "global_step": 167175, "epoch": 995} {"train_loss": -10.958070755004883, "global_step": 167176, "epoch": 995} {"train_loss": -10.795509338378906, "global_step": 167177, "epoch": 995} {"train_loss": -9.786627769470215, "global_step": 167178, "epoch": 995} {"train_loss": -11.040396690368652, "global_step": 167179, "epoch": 995} {"train_loss": -10.483179092407227, "global_step": 167180, "epoch": 995} {"train_loss": -9.950166702270508, "global_step": 167181, "epoch": 995} {"train_loss": -10.718374252319336, "global_step": 167182, "epoch": 995} {"train_loss": -9.867384910583496, "global_step": 167183, "epoch": 995} {"train_loss": -10.541391372680664, "global_step": 167184, "epoch": 995} {"train_loss": -10.368690490722656, "global_step": 167185, "epoch": 995} {"train_loss": -10.789619445800781, "global_step": 167186, "epoch": 995} {"train_loss": -10.154394149780273, "global_step": 167187, "epoch": 995} {"train_loss": -10.308111190795898, "global_step": 167188, "epoch": 995} {"train_loss": -9.889859199523926, "global_step": 167189, "epoch": 995} {"train_loss": -9.999517440795898, "global_step": 167190, "epoch": 995} {"train_loss": -10.450096130371094, "global_step": 167191, "epoch": 995} {"train_loss": -9.220561981201172, "global_step": 167192, "epoch": 995} {"train_loss": -10.581692695617676, "global_step": 167193, "epoch": 995} {"train_loss": -9.661575317382812, "global_step": 167194, "epoch": 995} {"train_loss": -9.54272174835205, "global_step": 167195, "epoch": 995} {"train_loss": -10.112508773803711, "global_step": 167196, "epoch": 995} {"train_loss": -10.115391731262207, "global_step": 167197, "epoch": 995} {"train_loss": -9.981443405151367, "global_step": 167198, "epoch": 995} {"train_loss": -10.04430866241455, "global_step": 167199, "epoch": 995} {"train_loss": -9.978544235229492, "global_step": 167200, "epoch": 995} {"train_loss": -10.021141052246094, "global_step": 167201, "epoch": 995} {"train_loss": -10.464818954467773, "global_step": 167202, "epoch": 995} {"train_loss": -10.041454315185547, "global_step": 167203, "epoch": 995} {"train_loss": -10.377117156982422, "global_step": 167204, "epoch": 995} {"train_loss": -10.299694061279297, "global_step": 167205, "epoch": 995} {"train_loss": -9.999320983886719, "global_step": 167206, "epoch": 995} {"train_loss": -10.50407886505127, "global_step": 167207, "epoch": 995} {"train_loss": -10.303879737854004, "global_step": 167208, "epoch": 995} {"train_loss": -10.357329368591309, "global_step": 167209, "epoch": 995} {"train_loss": -10.246891975402832, "global_step": 167210, "epoch": 995} {"train_loss": -10.435347557067871, "global_step": 167211, "epoch": 995} {"train_loss": -10.749029159545898, "global_step": 167212, "epoch": 995} {"train_loss": -10.146478652954102, "global_step": 167213, "epoch": 995} {"train_loss": -10.534069061279297, "global_step": 167214, "epoch": 995} {"train_loss": -10.317230224609375, "global_step": 167215, "epoch": 995} {"train_loss": -10.634357452392578, "global_step": 167216, "epoch": 995} {"train_loss": -10.865140914916992, "global_step": 167217, "epoch": 995} {"train_loss": -10.483846664428711, "global_step": 167218, "epoch": 995} {"train_loss": -10.757001876831055, "global_step": 167219, "epoch": 995} {"train_loss": -10.443048477172852, "global_step": 167220, "epoch": 995} {"train_loss": -10.664586067199707, "global_step": 167221, "epoch": 995} {"train_loss": -10.769164085388184, "global_step": 167222, "epoch": 995} {"train_loss": -10.731998443603516, "global_step": 167223, "epoch": 995} {"train_loss": -10.914974212646484, "global_step": 167224, "epoch": 995} {"train_loss": -10.869159698486328, "global_step": 167225, "epoch": 995} {"train_loss": -10.971820831298828, "global_step": 167226, "epoch": 995} {"train_loss": -10.93313217163086, "global_step": 167227, "epoch": 995} {"train_loss": -10.918953895568848, "global_step": 167228, "epoch": 995} {"train_loss": -10.76884651184082, "global_step": 167229, "epoch": 995} {"train_loss": -10.947701454162598, "global_step": 167230, "epoch": 995} {"train_loss": -10.883407592773438, "global_step": 167231, "epoch": 995} {"train_loss": -10.984899520874023, "global_step": 167232, "epoch": 995} {"train_loss": -11.095258712768555, "global_step": 167233, "epoch": 995} {"train_loss": -11.046708106994629, "global_step": 167234, "epoch": 995} {"train_loss": -10.910465240478516, "global_step": 167235, "epoch": 995} {"train_loss": -10.937894821166992, "global_step": 167236, "epoch": 995} {"train_loss": -11.072942733764648, "global_step": 167237, "epoch": 995} {"train_loss": -11.148124694824219, "global_step": 167238, "epoch": 995} {"train_loss": -11.308815002441406, "global_step": 167239, "epoch": 995} {"train_loss": -11.204418182373047, "global_step": 167240, "epoch": 995} {"train_loss": -11.197675704956055, "global_step": 167241, "epoch": 995} {"train_loss": -10.97343635559082, "global_step": 167242, "epoch": 995} {"train_loss": -11.039703369140625, "global_step": 167243, "epoch": 995} {"train_loss": -10.988601684570312, "global_step": 167244, "epoch": 995} {"train_loss": -11.066299438476562, "global_step": 167245, "epoch": 995} {"train_loss": -11.281253814697266, "global_step": 167246, "epoch": 995} {"train_loss": -11.31100845336914, "global_step": 167247, "epoch": 995} {"train_loss": -11.347917556762695, "global_step": 167248, "epoch": 995} {"train_loss": -11.274648666381836, "global_step": 167249, "epoch": 995} {"train_loss": -11.228574752807617, "global_step": 167250, "epoch": 995} {"train_loss": -11.335859298706055, "global_step": 167251, "epoch": 995} {"train_loss": -11.347454071044922, "global_step": 167252, "epoch": 995} {"train_loss": -11.123368263244629, "global_step": 167253, "epoch": 995} {"train_loss": -11.523757934570312, "global_step": 167254, "epoch": 995} {"train_loss": -11.323432922363281, "global_step": 167255, "epoch": 995} {"train_loss": -11.34041976928711, "global_step": 167256, "epoch": 995} {"train_loss": -11.40250015258789, "global_step": 167257, "epoch": 995} {"train_loss": -11.147468566894531, "global_step": 167258, "epoch": 995} {"train_loss": -11.530660629272461, "global_step": 167259, "epoch": 995} {"train_loss": -11.442154884338379, "global_step": 167260, "epoch": 995} {"train_loss": -10.987683296203613, "global_step": 167261, "epoch": 995} {"train_loss": -10.818582534790039, "global_step": 167262, "epoch": 995} {"train_loss": -11.413358688354492, "global_step": 167263, "epoch": 995} {"train_loss": -10.923419952392578, "global_step": 167264, "epoch": 995} {"train_loss": -11.223051071166992, "global_step": 167265, "epoch": 995} {"train_loss": -11.235857009887695, "global_step": 167266, "epoch": 995} {"train_loss": -11.137411117553711, "global_step": 167267, "epoch": 995} {"train_loss": -11.05947494506836, "global_step": 167268, "epoch": 995} {"train_loss": -10.940640449523926, "global_step": 167269, "epoch": 995} {"train_loss": -10.683109283447266, "global_step": 167270, "epoch": 995} {"train_loss": -11.130346298217773, "global_step": 167271, "epoch": 995} {"train_loss": -10.939245223999023, "global_step": 167272, "epoch": 995} {"train_loss": -11.196381568908691, "global_step": 167273, "epoch": 995} {"train_loss": -10.725227355957031, "global_step": 167274, "epoch": 995} {"train_loss": -11.305503845214844, "global_step": 167275, "epoch": 995} {"train_loss": -10.982101440429688, "global_step": 167276, "epoch": 995} {"train_loss": -10.91774845123291, "global_step": 167277, "epoch": 995} {"train_loss": -10.841514587402344, "global_step": 167278, "epoch": 995} {"train_loss": -11.183439254760742, "global_step": 167279, "epoch": 995} {"train_loss": -10.866691589355469, "global_step": 167280, "epoch": 995} {"train_loss": -10.951910018920898, "global_step": 167281, "epoch": 995} {"train_loss": -11.42561149597168, "global_step": 167282, "epoch": 995} {"train_loss": -11.130607604980469, "global_step": 167283, "epoch": 995} {"train_loss": -11.10322380065918, "global_step": 167284, "epoch": 995} {"train_loss": -11.203317642211914, "global_step": 167285, "epoch": 995} {"train_loss": -11.28965950012207, "global_step": 167286, "epoch": 995} {"train_loss": -10.805683135986328, "global_step": 167287, "epoch": 995} {"train_loss": -11.236239433288574, "global_step": 167288, "epoch": 995} {"train_loss": -11.283378601074219, "global_step": 167289, "epoch": 995} {"train_loss": -11.024230003356934, "global_step": 167290, "epoch": 995} {"train_loss": -11.102028846740723, "global_step": 167291, "epoch": 995} {"train_loss": -11.423778533935547, "global_step": 167292, "epoch": 995} {"train_loss": -11.214048385620117, "global_step": 167293, "epoch": 995} {"train_loss": -11.18427848815918, "global_step": 167294, "epoch": 995} {"train_loss": -11.137591361999512, "global_step": 167295, "epoch": 995} {"train_loss": -11.296745300292969, "global_step": 167296, "epoch": 995} {"train_loss": -11.038063049316406, "global_step": 167297, "epoch": 995} {"train_loss": -10.828643798828125, "global_step": 167298, "epoch": 995} {"train_loss": -11.059257507324219, "global_step": 167299, "epoch": 995} {"train_loss": -10.570100784301758, "global_step": 167300, "epoch": 995} {"train_loss": -10.68411922454834, "global_step": 167301, "epoch": 995} {"train_loss": -10.710416793823242, "global_step": 167302, "epoch": 995} {"train_loss": -10.204032897949219, "global_step": 167303, "epoch": 995} {"train_loss": -10.045747756958008, "global_step": 167304, "epoch": 995} {"train_loss": -10.188230514526367, "global_step": 167305, "epoch": 995} {"train_loss": -9.279386520385742, "global_step": 167306, "epoch": 995} {"train_loss": -9.480851173400879, "global_step": 167307, "epoch": 995} {"train_loss": -10.561605453491211, "global_step": 167308, "epoch": 995} {"train_loss": -9.69163990020752, "global_step": 167309, "epoch": 995} {"train_loss": -9.890342712402344, "global_step": 167310, "epoch": 995} {"train_loss": -9.899085998535156, "global_step": 167311, "epoch": 995} {"train_loss": -9.721244812011719, "global_step": 167312, "epoch": 995} {"train_loss": -10.384469985961914, "global_step": 167313, "epoch": 995} {"train_loss": -9.459112167358398, "global_step": 167314, "epoch": 995} {"train_loss": -10.519857406616211, "global_step": 167315, "epoch": 995} {"train_loss": -9.73806381225586, "global_step": 167316, "epoch": 995} {"train_loss": -10.434389114379883, "global_step": 167317, "epoch": 995} {"train_loss": -10.02783203125, "global_step": 167318, "epoch": 995} {"train_loss": -10.720436096191406, "global_step": 167319, "epoch": 995} {"train_loss": -9.403934478759766, "global_step": 167320, "epoch": 995} {"train_loss": -10.55885124206543, "global_step": 167321, "epoch": 995} {"train_loss": -10.121759414672852, "global_step": 167322, "epoch": 995} {"train_loss": -9.932044982910156, "global_step": 167323, "epoch": 995} {"train_loss": -10.631126403808594, "global_step": 167324, "epoch": 995} {"train_loss": -10.29296588897705, "global_step": 167325, "epoch": 995} {"train_loss": -10.063117980957031, "global_step": 167326, "epoch": 995} {"train_loss": -10.697865230696541, "global_step": 167327, "epoch": 995, "val_loss": 235377.4375, "train_action_mse_error": 1.396528720855713} {"train_loss": -10.658151626586914, "global_step": 167328, "epoch": 996} {"train_loss": -10.616016387939453, "global_step": 167329, "epoch": 996} {"train_loss": -10.651737213134766, "global_step": 167330, "epoch": 996} {"train_loss": -10.43426513671875, "global_step": 167331, "epoch": 996} {"train_loss": -10.59719181060791, "global_step": 167332, "epoch": 996} {"train_loss": -10.890203475952148, "global_step": 167333, "epoch": 996} {"train_loss": -10.438034057617188, "global_step": 167334, "epoch": 996} {"train_loss": -10.833906173706055, "global_step": 167335, "epoch": 996} {"train_loss": -10.734987258911133, "global_step": 167336, "epoch": 996} {"train_loss": -10.849411964416504, "global_step": 167337, "epoch": 996} {"train_loss": -10.800865173339844, "global_step": 167338, "epoch": 996} {"train_loss": -10.961627960205078, "global_step": 167339, "epoch": 996} {"train_loss": -10.906497955322266, "global_step": 167340, "epoch": 996} {"train_loss": -10.899364471435547, "global_step": 167341, "epoch": 996} {"train_loss": -10.87747859954834, "global_step": 167342, "epoch": 996} {"train_loss": -10.863492965698242, "global_step": 167343, "epoch": 996} {"train_loss": -11.027153015136719, "global_step": 167344, "epoch": 996} {"train_loss": -10.825143814086914, "global_step": 167345, "epoch": 996} {"train_loss": -10.75697135925293, "global_step": 167346, "epoch": 996} {"train_loss": -11.077020645141602, "global_step": 167347, "epoch": 996} {"train_loss": -11.15997314453125, "global_step": 167348, "epoch": 996} {"train_loss": -10.887914657592773, "global_step": 167349, "epoch": 996} {"train_loss": -11.046171188354492, "global_step": 167350, "epoch": 996} {"train_loss": -10.987150192260742, "global_step": 167351, "epoch": 996} {"train_loss": -11.104804992675781, "global_step": 167352, "epoch": 996} {"train_loss": -11.04548454284668, "global_step": 167353, "epoch": 996} {"train_loss": -10.863897323608398, "global_step": 167354, "epoch": 996} {"train_loss": -11.157796859741211, "global_step": 167355, "epoch": 996} {"train_loss": -10.918754577636719, "global_step": 167356, "epoch": 996} {"train_loss": -11.229586601257324, "global_step": 167357, "epoch": 996} {"train_loss": -11.157487869262695, "global_step": 167358, "epoch": 996} {"train_loss": -11.145164489746094, "global_step": 167359, "epoch": 996} {"train_loss": -11.143771171569824, "global_step": 167360, "epoch": 996} {"train_loss": -11.20583438873291, "global_step": 167361, "epoch": 996} {"train_loss": -11.1817045211792, "global_step": 167362, "epoch": 996} {"train_loss": -11.159896850585938, "global_step": 167363, "epoch": 996} {"train_loss": -11.26370906829834, "global_step": 167364, "epoch": 996} {"train_loss": -11.199304580688477, "global_step": 167365, "epoch": 996} {"train_loss": -11.18874454498291, "global_step": 167366, "epoch": 996} {"train_loss": -11.300155639648438, "global_step": 167367, "epoch": 996} {"train_loss": -11.221855163574219, "global_step": 167368, "epoch": 996} {"train_loss": -11.229336738586426, "global_step": 167369, "epoch": 996} {"train_loss": -11.287666320800781, "global_step": 167370, "epoch": 996} {"train_loss": -11.158088684082031, "global_step": 167371, "epoch": 996} {"train_loss": -11.190059661865234, "global_step": 167372, "epoch": 996} {"train_loss": -10.801074981689453, "global_step": 167373, "epoch": 996} {"train_loss": -11.26514720916748, "global_step": 167374, "epoch": 996} {"train_loss": -11.199329376220703, "global_step": 167375, "epoch": 996} {"train_loss": -11.239500045776367, "global_step": 167376, "epoch": 996} {"train_loss": -10.886180877685547, "global_step": 167377, "epoch": 996} {"train_loss": -11.191667556762695, "global_step": 167378, "epoch": 996} {"train_loss": -11.318316459655762, "global_step": 167379, "epoch": 996} {"train_loss": -11.062816619873047, "global_step": 167380, "epoch": 996} {"train_loss": -11.210838317871094, "global_step": 167381, "epoch": 996} {"train_loss": -11.170438766479492, "global_step": 167382, "epoch": 996} {"train_loss": -11.527849197387695, "global_step": 167383, "epoch": 996} {"train_loss": -10.822856903076172, "global_step": 167384, "epoch": 996} {"train_loss": -11.177705764770508, "global_step": 167385, "epoch": 996} {"train_loss": -11.189525604248047, "global_step": 167386, "epoch": 996} {"train_loss": -11.07959270477295, "global_step": 167387, "epoch": 996} {"train_loss": -10.982784271240234, "global_step": 167388, "epoch": 996} {"train_loss": -10.816551208496094, "global_step": 167389, "epoch": 996} {"train_loss": -11.129883766174316, "global_step": 167390, "epoch": 996} {"train_loss": -10.694965362548828, "global_step": 167391, "epoch": 996} {"train_loss": -11.312830924987793, "global_step": 167392, "epoch": 996} {"train_loss": -10.58616828918457, "global_step": 167393, "epoch": 996} {"train_loss": -10.998086929321289, "global_step": 167394, "epoch": 996} {"train_loss": -10.231416702270508, "global_step": 167395, "epoch": 996} {"train_loss": -10.544482231140137, "global_step": 167396, "epoch": 996} {"train_loss": -10.825883865356445, "global_step": 167397, "epoch": 996} {"train_loss": -10.603631019592285, "global_step": 167398, "epoch": 996} {"train_loss": -10.62912368774414, "global_step": 167399, "epoch": 996} {"train_loss": -11.07718276977539, "global_step": 167400, "epoch": 996} {"train_loss": -10.946626663208008, "global_step": 167401, "epoch": 996} {"train_loss": -11.183406829833984, "global_step": 167402, "epoch": 996} {"train_loss": -10.753825187683105, "global_step": 167403, "epoch": 996} {"train_loss": -11.214932441711426, "global_step": 167404, "epoch": 996} {"train_loss": -10.843572616577148, "global_step": 167405, "epoch": 996} {"train_loss": -11.050924301147461, "global_step": 167406, "epoch": 996} {"train_loss": -10.753580093383789, "global_step": 167407, "epoch": 996} {"train_loss": -10.807138442993164, "global_step": 167408, "epoch": 996} {"train_loss": -10.462217330932617, "global_step": 167409, "epoch": 996} {"train_loss": -10.860034942626953, "global_step": 167410, "epoch": 996} {"train_loss": -10.882884979248047, "global_step": 167411, "epoch": 996} {"train_loss": -11.119662284851074, "global_step": 167412, "epoch": 996} {"train_loss": -10.580099105834961, "global_step": 167413, "epoch": 996} {"train_loss": -10.505956649780273, "global_step": 167414, "epoch": 996} {"train_loss": -10.943506240844727, "global_step": 167415, "epoch": 996} {"train_loss": -10.41389274597168, "global_step": 167416, "epoch": 996} {"train_loss": -11.060537338256836, "global_step": 167417, "epoch": 996} {"train_loss": -10.613471031188965, "global_step": 167418, "epoch": 996} {"train_loss": -10.945507049560547, "global_step": 167419, "epoch": 996} {"train_loss": -10.816173553466797, "global_step": 167420, "epoch": 996} {"train_loss": -10.660350799560547, "global_step": 167421, "epoch": 996} {"train_loss": -10.551719665527344, "global_step": 167422, "epoch": 996} {"train_loss": -10.795564651489258, "global_step": 167423, "epoch": 996} {"train_loss": -10.349628448486328, "global_step": 167424, "epoch": 996} {"train_loss": -10.559865951538086, "global_step": 167425, "epoch": 996} {"train_loss": -10.664514541625977, "global_step": 167426, "epoch": 996} {"train_loss": -10.68098258972168, "global_step": 167427, "epoch": 996} {"train_loss": -10.434840202331543, "global_step": 167428, "epoch": 996} {"train_loss": -11.001765251159668, "global_step": 167429, "epoch": 996} {"train_loss": -9.869503021240234, "global_step": 167430, "epoch": 996} {"train_loss": -11.079669952392578, "global_step": 167431, "epoch": 996} {"train_loss": -10.586641311645508, "global_step": 167432, "epoch": 996} {"train_loss": -10.354652404785156, "global_step": 167433, "epoch": 996} {"train_loss": -10.798088073730469, "global_step": 167434, "epoch": 996} {"train_loss": -10.452323913574219, "global_step": 167435, "epoch": 996} {"train_loss": -10.828401565551758, "global_step": 167436, "epoch": 996} {"train_loss": -10.52419662475586, "global_step": 167437, "epoch": 996} {"train_loss": -10.923154830932617, "global_step": 167438, "epoch": 996} {"train_loss": -10.41378116607666, "global_step": 167439, "epoch": 996} {"train_loss": -10.69725227355957, "global_step": 167440, "epoch": 996} {"train_loss": -10.644610404968262, "global_step": 167441, "epoch": 996} {"train_loss": -10.851377487182617, "global_step": 167442, "epoch": 996} {"train_loss": -11.02880573272705, "global_step": 167443, "epoch": 996} {"train_loss": -10.781951904296875, "global_step": 167444, "epoch": 996} {"train_loss": -10.633759498596191, "global_step": 167445, "epoch": 996} {"train_loss": -10.898859024047852, "global_step": 167446, "epoch": 996} {"train_loss": -10.938453674316406, "global_step": 167447, "epoch": 996} {"train_loss": -11.189001083374023, "global_step": 167448, "epoch": 996} {"train_loss": -10.938389778137207, "global_step": 167449, "epoch": 996} {"train_loss": -11.016183853149414, "global_step": 167450, "epoch": 996} {"train_loss": -10.914031982421875, "global_step": 167451, "epoch": 996} {"train_loss": -10.986727714538574, "global_step": 167452, "epoch": 996} {"train_loss": -11.002317428588867, "global_step": 167453, "epoch": 996} {"train_loss": -11.134684562683105, "global_step": 167454, "epoch": 996} {"train_loss": -11.043144226074219, "global_step": 167455, "epoch": 996} {"train_loss": -11.310714721679688, "global_step": 167456, "epoch": 996} {"train_loss": -11.106781005859375, "global_step": 167457, "epoch": 996} {"train_loss": -11.162307739257812, "global_step": 167458, "epoch": 996} {"train_loss": -11.197093963623047, "global_step": 167459, "epoch": 996} {"train_loss": -11.104183197021484, "global_step": 167460, "epoch": 996} {"train_loss": -11.258158683776855, "global_step": 167461, "epoch": 996} {"train_loss": -11.072443008422852, "global_step": 167462, "epoch": 996} {"train_loss": -11.198356628417969, "global_step": 167463, "epoch": 996} {"train_loss": -11.131959915161133, "global_step": 167464, "epoch": 996} {"train_loss": -11.268030166625977, "global_step": 167465, "epoch": 996} {"train_loss": -11.309341430664062, "global_step": 167466, "epoch": 996} {"train_loss": -10.974967956542969, "global_step": 167467, "epoch": 996} {"train_loss": -11.213438034057617, "global_step": 167468, "epoch": 996} {"train_loss": -11.201053619384766, "global_step": 167469, "epoch": 996} {"train_loss": -11.041921615600586, "global_step": 167470, "epoch": 996} {"train_loss": -11.079246520996094, "global_step": 167471, "epoch": 996} {"train_loss": -11.191478729248047, "global_step": 167472, "epoch": 996} {"train_loss": -11.144245147705078, "global_step": 167473, "epoch": 996} {"train_loss": -11.104930877685547, "global_step": 167474, "epoch": 996} {"train_loss": -11.289016723632812, "global_step": 167475, "epoch": 996} {"train_loss": -11.194924354553223, "global_step": 167476, "epoch": 996} {"train_loss": -11.141998291015625, "global_step": 167477, "epoch": 996} {"train_loss": -11.18936538696289, "global_step": 167478, "epoch": 996} {"train_loss": -10.98015308380127, "global_step": 167479, "epoch": 996} {"train_loss": -11.133806228637695, "global_step": 167480, "epoch": 996} {"train_loss": -11.09457778930664, "global_step": 167481, "epoch": 996} {"train_loss": -11.24345874786377, "global_step": 167482, "epoch": 996} {"train_loss": -11.543781280517578, "global_step": 167483, "epoch": 996} {"train_loss": -11.108097076416016, "global_step": 167484, "epoch": 996} {"train_loss": -11.341282844543457, "global_step": 167485, "epoch": 996} {"train_loss": -11.06584358215332, "global_step": 167486, "epoch": 996} {"train_loss": -11.30111026763916, "global_step": 167487, "epoch": 996} {"train_loss": -11.240364074707031, "global_step": 167488, "epoch": 996} {"train_loss": -10.674142837524414, "global_step": 167489, "epoch": 996} {"train_loss": -10.688323020935059, "global_step": 167490, "epoch": 996} {"train_loss": -11.175688743591309, "global_step": 167491, "epoch": 996} {"train_loss": -10.75963306427002, "global_step": 167492, "epoch": 996} {"train_loss": -10.003154754638672, "global_step": 167493, "epoch": 996} {"train_loss": -11.198182106018066, "global_step": 167494, "epoch": 996} {"train_loss": -10.938270370165506, "global_step": 167495, "epoch": 996, "val_loss": 235491.03125} {"train_loss": -9.333551406860352, "global_step": 167496, "epoch": 997} {"train_loss": -10.654998779296875, "global_step": 167497, "epoch": 997} {"train_loss": -8.890020370483398, "global_step": 167498, "epoch": 997} {"train_loss": -10.885534286499023, "global_step": 167499, "epoch": 997} {"train_loss": -9.10350227355957, "global_step": 167500, "epoch": 997} {"train_loss": -11.02165412902832, "global_step": 167501, "epoch": 997} {"train_loss": -10.09592056274414, "global_step": 167502, "epoch": 997} {"train_loss": -10.794290542602539, "global_step": 167503, "epoch": 997} {"train_loss": -10.358088493347168, "global_step": 167504, "epoch": 997} {"train_loss": -10.609787940979004, "global_step": 167505, "epoch": 997} {"train_loss": -10.830084800720215, "global_step": 167506, "epoch": 997} {"train_loss": -10.755670547485352, "global_step": 167507, "epoch": 997} {"train_loss": -11.16041088104248, "global_step": 167508, "epoch": 997} {"train_loss": -10.723026275634766, "global_step": 167509, "epoch": 997} {"train_loss": -10.977815628051758, "global_step": 167510, "epoch": 997} {"train_loss": -11.006200790405273, "global_step": 167511, "epoch": 997} {"train_loss": -10.947504043579102, "global_step": 167512, "epoch": 997} {"train_loss": -11.149600982666016, "global_step": 167513, "epoch": 997} {"train_loss": -10.90866470336914, "global_step": 167514, "epoch": 997} {"train_loss": -10.941286087036133, "global_step": 167515, "epoch": 997} {"train_loss": -10.652505874633789, "global_step": 167516, "epoch": 997} {"train_loss": -10.66544246673584, "global_step": 167517, "epoch": 997} {"train_loss": -10.893277168273926, "global_step": 167518, "epoch": 997} {"train_loss": -10.855300903320312, "global_step": 167519, "epoch": 997} {"train_loss": -10.735700607299805, "global_step": 167520, "epoch": 997} {"train_loss": -11.164108276367188, "global_step": 167521, "epoch": 997} {"train_loss": -10.569028854370117, "global_step": 167522, "epoch": 997} {"train_loss": -10.826597213745117, "global_step": 167523, "epoch": 997} {"train_loss": -11.068085670471191, "global_step": 167524, "epoch": 997} {"train_loss": -10.556735038757324, "global_step": 167525, "epoch": 997} {"train_loss": -11.068707466125488, "global_step": 167526, "epoch": 997} {"train_loss": -10.706926345825195, "global_step": 167527, "epoch": 997} {"train_loss": -10.977813720703125, "global_step": 167528, "epoch": 997} {"train_loss": -10.892337799072266, "global_step": 167529, "epoch": 997} {"train_loss": -10.475706100463867, "global_step": 167530, "epoch": 997} {"train_loss": -10.623672485351562, "global_step": 167531, "epoch": 997} {"train_loss": -11.059703826904297, "global_step": 167532, "epoch": 997} {"train_loss": -10.832256317138672, "global_step": 167533, "epoch": 997} {"train_loss": -11.046164512634277, "global_step": 167534, "epoch": 997} {"train_loss": -10.977481842041016, "global_step": 167535, "epoch": 997} {"train_loss": -10.515748977661133, "global_step": 167536, "epoch": 997} {"train_loss": -11.088959693908691, "global_step": 167537, "epoch": 997} {"train_loss": -10.667459487915039, "global_step": 167538, "epoch": 997} {"train_loss": -11.087912559509277, "global_step": 167539, "epoch": 997} {"train_loss": -10.535425186157227, "global_step": 167540, "epoch": 997} {"train_loss": -10.898098945617676, "global_step": 167541, "epoch": 997} {"train_loss": -10.772976875305176, "global_step": 167542, "epoch": 997} {"train_loss": -11.187732696533203, "global_step": 167543, "epoch": 997} {"train_loss": -10.601868629455566, "global_step": 167544, "epoch": 997} {"train_loss": -10.880541801452637, "global_step": 167545, "epoch": 997} {"train_loss": -10.905385971069336, "global_step": 167546, "epoch": 997} {"train_loss": -10.864734649658203, "global_step": 167547, "epoch": 997} {"train_loss": -10.929729461669922, "global_step": 167548, "epoch": 997} {"train_loss": -10.661288261413574, "global_step": 167549, "epoch": 997} {"train_loss": -10.819536209106445, "global_step": 167550, "epoch": 997} {"train_loss": -10.844497680664062, "global_step": 167551, "epoch": 997} {"train_loss": -10.978164672851562, "global_step": 167552, "epoch": 997} {"train_loss": -10.785329818725586, "global_step": 167553, "epoch": 997} {"train_loss": -11.251762390136719, "global_step": 167554, "epoch": 997} {"train_loss": -10.852483749389648, "global_step": 167555, "epoch": 997} {"train_loss": -11.249918937683105, "global_step": 167556, "epoch": 997} {"train_loss": -10.802928924560547, "global_step": 167557, "epoch": 997} {"train_loss": -10.94704532623291, "global_step": 167558, "epoch": 997} {"train_loss": -11.225444793701172, "global_step": 167559, "epoch": 997} {"train_loss": -11.147360801696777, "global_step": 167560, "epoch": 997} {"train_loss": -11.194353103637695, "global_step": 167561, "epoch": 997} {"train_loss": -11.168209075927734, "global_step": 167562, "epoch": 997} {"train_loss": -11.195683479309082, "global_step": 167563, "epoch": 997} {"train_loss": -11.066222190856934, "global_step": 167564, "epoch": 997} {"train_loss": -11.251136779785156, "global_step": 167565, "epoch": 997} {"train_loss": -11.096142768859863, "global_step": 167566, "epoch": 997} {"train_loss": -11.123023986816406, "global_step": 167567, "epoch": 997} {"train_loss": -10.99463176727295, "global_step": 167568, "epoch": 997} {"train_loss": -11.093469619750977, "global_step": 167569, "epoch": 997} {"train_loss": -11.236982345581055, "global_step": 167570, "epoch": 997} {"train_loss": -11.264496803283691, "global_step": 167571, "epoch": 997} {"train_loss": -11.290512084960938, "global_step": 167572, "epoch": 997} {"train_loss": -11.126128196716309, "global_step": 167573, "epoch": 997} {"train_loss": -11.404956817626953, "global_step": 167574, "epoch": 997} {"train_loss": -11.417470932006836, "global_step": 167575, "epoch": 997} {"train_loss": -11.106141090393066, "global_step": 167576, "epoch": 997} {"train_loss": -11.207235336303711, "global_step": 167577, "epoch": 997} {"train_loss": -11.334961891174316, "global_step": 167578, "epoch": 997} {"train_loss": -10.97271728515625, "global_step": 167579, "epoch": 997} {"train_loss": -11.32189655303955, "global_step": 167580, "epoch": 997} {"train_loss": -11.133712768554688, "global_step": 167581, "epoch": 997} {"train_loss": -11.288381576538086, "global_step": 167582, "epoch": 997} {"train_loss": -11.179259300231934, "global_step": 167583, "epoch": 997} {"train_loss": -11.399847984313965, "global_step": 167584, "epoch": 997} {"train_loss": -11.457298278808594, "global_step": 167585, "epoch": 997} {"train_loss": -11.471088409423828, "global_step": 167586, "epoch": 997} {"train_loss": -11.290876388549805, "global_step": 167587, "epoch": 997} {"train_loss": -11.393410682678223, "global_step": 167588, "epoch": 997} {"train_loss": -11.322290420532227, "global_step": 167589, "epoch": 997} {"train_loss": -11.090929985046387, "global_step": 167590, "epoch": 997} {"train_loss": -11.37020492553711, "global_step": 167591, "epoch": 997} {"train_loss": -11.207603454589844, "global_step": 167592, "epoch": 997} {"train_loss": -11.214468002319336, "global_step": 167593, "epoch": 997} {"train_loss": -11.196320533752441, "global_step": 167594, "epoch": 997} {"train_loss": -11.29066276550293, "global_step": 167595, "epoch": 997} {"train_loss": -11.507343292236328, "global_step": 167596, "epoch": 997} {"train_loss": -10.82149887084961, "global_step": 167597, "epoch": 997} {"train_loss": -10.08350944519043, "global_step": 167598, "epoch": 997} {"train_loss": -10.125699996948242, "global_step": 167599, "epoch": 997} {"train_loss": -10.623708724975586, "global_step": 167600, "epoch": 997} {"train_loss": -10.252981185913086, "global_step": 167601, "epoch": 997} {"train_loss": -9.001554489135742, "global_step": 167602, "epoch": 997} {"train_loss": -10.293625831604004, "global_step": 167603, "epoch": 997} {"train_loss": -10.711145401000977, "global_step": 167604, "epoch": 997} {"train_loss": -10.841313362121582, "global_step": 167605, "epoch": 997} {"train_loss": -10.80527400970459, "global_step": 167606, "epoch": 997} {"train_loss": -10.878124237060547, "global_step": 167607, "epoch": 997} {"train_loss": -9.742260932922363, "global_step": 167608, "epoch": 997} {"train_loss": -11.15909194946289, "global_step": 167609, "epoch": 997} {"train_loss": -9.938486099243164, "global_step": 167610, "epoch": 997} {"train_loss": -9.970903396606445, "global_step": 167611, "epoch": 997} {"train_loss": -10.910213470458984, "global_step": 167612, "epoch": 997} {"train_loss": -9.934980392456055, "global_step": 167613, "epoch": 997} {"train_loss": -10.732791900634766, "global_step": 167614, "epoch": 997} {"train_loss": -10.606630325317383, "global_step": 167615, "epoch": 997} {"train_loss": -10.881750106811523, "global_step": 167616, "epoch": 997} {"train_loss": -11.04278564453125, "global_step": 167617, "epoch": 997} {"train_loss": -10.815336227416992, "global_step": 167618, "epoch": 997} {"train_loss": -10.722677230834961, "global_step": 167619, "epoch": 997} {"train_loss": -10.722578048706055, "global_step": 167620, "epoch": 997} {"train_loss": -10.908960342407227, "global_step": 167621, "epoch": 997} {"train_loss": -10.555587768554688, "global_step": 167622, "epoch": 997} {"train_loss": -10.983329772949219, "global_step": 167623, "epoch": 997} {"train_loss": -10.826078414916992, "global_step": 167624, "epoch": 997} {"train_loss": -10.793701171875, "global_step": 167625, "epoch": 997} {"train_loss": -10.99401569366455, "global_step": 167626, "epoch": 997} {"train_loss": -10.719226837158203, "global_step": 167627, "epoch": 997} {"train_loss": -10.828054428100586, "global_step": 167628, "epoch": 997} {"train_loss": -10.782073974609375, "global_step": 167629, "epoch": 997} {"train_loss": -10.95313835144043, "global_step": 167630, "epoch": 997} {"train_loss": -10.772727966308594, "global_step": 167631, "epoch": 997} {"train_loss": -11.145173072814941, "global_step": 167632, "epoch": 997} {"train_loss": -11.153087615966797, "global_step": 167633, "epoch": 997} {"train_loss": -10.895951271057129, "global_step": 167634, "epoch": 997} {"train_loss": -11.010229110717773, "global_step": 167635, "epoch": 997} {"train_loss": -10.970386505126953, "global_step": 167636, "epoch": 997} {"train_loss": -10.828563690185547, "global_step": 167637, "epoch": 997} {"train_loss": -10.768668174743652, "global_step": 167638, "epoch": 997} {"train_loss": -11.096805572509766, "global_step": 167639, "epoch": 997} {"train_loss": -11.038427352905273, "global_step": 167640, "epoch": 997} {"train_loss": -11.084794998168945, "global_step": 167641, "epoch": 997} {"train_loss": -10.91510009765625, "global_step": 167642, "epoch": 997} {"train_loss": -10.99752140045166, "global_step": 167643, "epoch": 997} {"train_loss": -10.461974143981934, "global_step": 167644, "epoch": 997} {"train_loss": -10.763162612915039, "global_step": 167645, "epoch": 997} {"train_loss": -11.050477981567383, "global_step": 167646, "epoch": 997} {"train_loss": -10.27121353149414, "global_step": 167647, "epoch": 997} {"train_loss": -11.134822845458984, "global_step": 167648, "epoch": 997} {"train_loss": -10.548959732055664, "global_step": 167649, "epoch": 997} {"train_loss": -11.196399688720703, "global_step": 167650, "epoch": 997} {"train_loss": -10.822555541992188, "global_step": 167651, "epoch": 997} {"train_loss": -10.960906028747559, "global_step": 167652, "epoch": 997} {"train_loss": -10.931537628173828, "global_step": 167653, "epoch": 997} {"train_loss": -10.955499649047852, "global_step": 167654, "epoch": 997} {"train_loss": -11.09284782409668, "global_step": 167655, "epoch": 997} {"train_loss": -11.065001487731934, "global_step": 167656, "epoch": 997} {"train_loss": -11.100343704223633, "global_step": 167657, "epoch": 997} {"train_loss": -11.178825378417969, "global_step": 167658, "epoch": 997} {"train_loss": -11.218969345092773, "global_step": 167659, "epoch": 997} {"train_loss": -11.224687576293945, "global_step": 167660, "epoch": 997} {"train_loss": -10.902647972106934, "global_step": 167661, "epoch": 997} {"train_loss": -11.15089225769043, "global_step": 167662, "epoch": 997} {"train_loss": -10.875214497248331, "global_step": 167663, "epoch": 997, "val_loss": 238724.5} {"train_loss": -11.045818328857422, "global_step": 167664, "epoch": 998} {"train_loss": -11.207988739013672, "global_step": 167665, "epoch": 998} {"train_loss": -11.291050910949707, "global_step": 167666, "epoch": 998} {"train_loss": -11.13870906829834, "global_step": 167667, "epoch": 998} {"train_loss": -11.158607482910156, "global_step": 167668, "epoch": 998} {"train_loss": -11.01683235168457, "global_step": 167669, "epoch": 998} {"train_loss": -11.120587348937988, "global_step": 167670, "epoch": 998} {"train_loss": -11.256597518920898, "global_step": 167671, "epoch": 998} {"train_loss": -10.821810722351074, "global_step": 167672, "epoch": 998} {"train_loss": -11.098389625549316, "global_step": 167673, "epoch": 998} {"train_loss": -11.045647621154785, "global_step": 167674, "epoch": 998} {"train_loss": -10.829046249389648, "global_step": 167675, "epoch": 998} {"train_loss": -11.160027503967285, "global_step": 167676, "epoch": 998} {"train_loss": -11.203877449035645, "global_step": 167677, "epoch": 998} {"train_loss": -11.0115385055542, "global_step": 167678, "epoch": 998} {"train_loss": -11.02823543548584, "global_step": 167679, "epoch": 998} {"train_loss": -10.74131965637207, "global_step": 167680, "epoch": 998} {"train_loss": -11.281227111816406, "global_step": 167681, "epoch": 998} {"train_loss": -11.185312271118164, "global_step": 167682, "epoch": 998} {"train_loss": -11.242706298828125, "global_step": 167683, "epoch": 998} {"train_loss": -11.257126808166504, "global_step": 167684, "epoch": 998} {"train_loss": -11.033927917480469, "global_step": 167685, "epoch": 998} {"train_loss": -11.306692123413086, "global_step": 167686, "epoch": 998} {"train_loss": -10.894482612609863, "global_step": 167687, "epoch": 998} {"train_loss": -11.247583389282227, "global_step": 167688, "epoch": 998} {"train_loss": -10.817911148071289, "global_step": 167689, "epoch": 998} {"train_loss": -11.0885648727417, "global_step": 167690, "epoch": 998} {"train_loss": -10.99310302734375, "global_step": 167691, "epoch": 998} {"train_loss": -10.413589477539062, "global_step": 167692, "epoch": 998} {"train_loss": -10.797773361206055, "global_step": 167693, "epoch": 998} {"train_loss": -10.94297981262207, "global_step": 167694, "epoch": 998} {"train_loss": -11.024348258972168, "global_step": 167695, "epoch": 998} {"train_loss": -11.076889038085938, "global_step": 167696, "epoch": 998} {"train_loss": -10.973592758178711, "global_step": 167697, "epoch": 998} {"train_loss": -10.940256118774414, "global_step": 167698, "epoch": 998} {"train_loss": -10.831338882446289, "global_step": 167699, "epoch": 998} {"train_loss": -11.350448608398438, "global_step": 167700, "epoch": 998} {"train_loss": -10.757585525512695, "global_step": 167701, "epoch": 998} {"train_loss": -10.945825576782227, "global_step": 167702, "epoch": 998} {"train_loss": -10.766419410705566, "global_step": 167703, "epoch": 998} {"train_loss": -11.126876831054688, "global_step": 167704, "epoch": 998} {"train_loss": -11.254135131835938, "global_step": 167705, "epoch": 998} {"train_loss": -11.230379104614258, "global_step": 167706, "epoch": 998} {"train_loss": -11.10837173461914, "global_step": 167707, "epoch": 998} {"train_loss": -11.301312446594238, "global_step": 167708, "epoch": 998} {"train_loss": -11.214838027954102, "global_step": 167709, "epoch": 998} {"train_loss": -11.033066749572754, "global_step": 167710, "epoch": 998} {"train_loss": -11.006889343261719, "global_step": 167711, "epoch": 998} {"train_loss": -11.154117584228516, "global_step": 167712, "epoch": 998} {"train_loss": -11.00072193145752, "global_step": 167713, "epoch": 998} {"train_loss": -11.094696044921875, "global_step": 167714, "epoch": 998} {"train_loss": -11.158697128295898, "global_step": 167715, "epoch": 998} {"train_loss": -11.118513107299805, "global_step": 167716, "epoch": 998} {"train_loss": -11.23287582397461, "global_step": 167717, "epoch": 998} {"train_loss": -11.36363410949707, "global_step": 167718, "epoch": 998} {"train_loss": -10.889875411987305, "global_step": 167719, "epoch": 998} {"train_loss": -10.911291122436523, "global_step": 167720, "epoch": 998} {"train_loss": -10.645328521728516, "global_step": 167721, "epoch": 998} {"train_loss": -10.915766716003418, "global_step": 167722, "epoch": 998} {"train_loss": -11.293877601623535, "global_step": 167723, "epoch": 998} {"train_loss": -10.91172981262207, "global_step": 167724, "epoch": 998} {"train_loss": -11.172362327575684, "global_step": 167725, "epoch": 998} {"train_loss": -10.942621231079102, "global_step": 167726, "epoch": 998} {"train_loss": -10.96413803100586, "global_step": 167727, "epoch": 998} {"train_loss": -11.166597366333008, "global_step": 167728, "epoch": 998} {"train_loss": -10.656978607177734, "global_step": 167729, "epoch": 998} {"train_loss": -10.243473052978516, "global_step": 167730, "epoch": 998} {"train_loss": -11.104232788085938, "global_step": 167731, "epoch": 998} {"train_loss": -10.299713134765625, "global_step": 167732, "epoch": 998} {"train_loss": -11.292683601379395, "global_step": 167733, "epoch": 998} {"train_loss": -10.576974868774414, "global_step": 167734, "epoch": 998} {"train_loss": -10.848001480102539, "global_step": 167735, "epoch": 998} {"train_loss": -11.047220230102539, "global_step": 167736, "epoch": 998} {"train_loss": -10.55057430267334, "global_step": 167737, "epoch": 998} {"train_loss": -11.082539558410645, "global_step": 167738, "epoch": 998} {"train_loss": -10.616065979003906, "global_step": 167739, "epoch": 998} {"train_loss": -10.21420955657959, "global_step": 167740, "epoch": 998} {"train_loss": -10.107829093933105, "global_step": 167741, "epoch": 998} {"train_loss": -9.678345680236816, "global_step": 167742, "epoch": 998} {"train_loss": -10.439987182617188, "global_step": 167743, "epoch": 998} {"train_loss": -9.759014129638672, "global_step": 167744, "epoch": 998} {"train_loss": -10.475131034851074, "global_step": 167745, "epoch": 998} {"train_loss": -10.044970512390137, "global_step": 167746, "epoch": 998} {"train_loss": -10.966692924499512, "global_step": 167747, "epoch": 998} {"train_loss": -10.217066764831543, "global_step": 167748, "epoch": 998} {"train_loss": -11.002717971801758, "global_step": 167749, "epoch": 998} {"train_loss": -10.536201477050781, "global_step": 167750, "epoch": 998} {"train_loss": -10.987224578857422, "global_step": 167751, "epoch": 998} {"train_loss": -10.489639282226562, "global_step": 167752, "epoch": 998} {"train_loss": -10.788786888122559, "global_step": 167753, "epoch": 998} {"train_loss": -10.783760070800781, "global_step": 167754, "epoch": 998} {"train_loss": -10.85167121887207, "global_step": 167755, "epoch": 998} {"train_loss": -10.900390625, "global_step": 167756, "epoch": 998} {"train_loss": -11.040144920349121, "global_step": 167757, "epoch": 998} {"train_loss": -10.874399185180664, "global_step": 167758, "epoch": 998} {"train_loss": -10.86562728881836, "global_step": 167759, "epoch": 998} {"train_loss": -11.008975982666016, "global_step": 167760, "epoch": 998} {"train_loss": -11.004803657531738, "global_step": 167761, "epoch": 998} {"train_loss": -11.05031967163086, "global_step": 167762, "epoch": 998} {"train_loss": -10.888319969177246, "global_step": 167763, "epoch": 998} {"train_loss": -11.173246383666992, "global_step": 167764, "epoch": 998} {"train_loss": -11.043718338012695, "global_step": 167765, "epoch": 998} {"train_loss": -10.851835250854492, "global_step": 167766, "epoch": 998} {"train_loss": -11.190673828125, "global_step": 167767, "epoch": 998} {"train_loss": -10.992513656616211, "global_step": 167768, "epoch": 998} {"train_loss": -10.841264724731445, "global_step": 167769, "epoch": 998} {"train_loss": -11.251670837402344, "global_step": 167770, "epoch": 998} {"train_loss": -11.383783340454102, "global_step": 167771, "epoch": 998} {"train_loss": -10.98611068725586, "global_step": 167772, "epoch": 998} {"train_loss": -11.141609191894531, "global_step": 167773, "epoch": 998} {"train_loss": -11.299638748168945, "global_step": 167774, "epoch": 998} {"train_loss": -11.221571922302246, "global_step": 167775, "epoch": 998} {"train_loss": -11.361612319946289, "global_step": 167776, "epoch": 998} {"train_loss": -11.2119140625, "global_step": 167777, "epoch": 998} {"train_loss": -11.416095733642578, "global_step": 167778, "epoch": 998} {"train_loss": -11.364724159240723, "global_step": 167779, "epoch": 998} {"train_loss": -11.36628246307373, "global_step": 167780, "epoch": 998} {"train_loss": -11.307503700256348, "global_step": 167781, "epoch": 998} {"train_loss": -11.320384979248047, "global_step": 167782, "epoch": 998} {"train_loss": -11.340324401855469, "global_step": 167783, "epoch": 998} {"train_loss": -11.475128173828125, "global_step": 167784, "epoch": 998} {"train_loss": -11.259933471679688, "global_step": 167785, "epoch": 998} {"train_loss": -11.428496360778809, "global_step": 167786, "epoch": 998} {"train_loss": -11.25462532043457, "global_step": 167787, "epoch": 998} {"train_loss": -10.982108116149902, "global_step": 167788, "epoch": 998} {"train_loss": -11.34859848022461, "global_step": 167789, "epoch": 998} {"train_loss": -11.257060050964355, "global_step": 167790, "epoch": 998} {"train_loss": -11.03161334991455, "global_step": 167791, "epoch": 998} {"train_loss": -11.114566802978516, "global_step": 167792, "epoch": 998} {"train_loss": -11.26905632019043, "global_step": 167793, "epoch": 998} {"train_loss": -11.324625968933105, "global_step": 167794, "epoch": 998} {"train_loss": -11.002447128295898, "global_step": 167795, "epoch": 998} {"train_loss": -10.545684814453125, "global_step": 167796, "epoch": 998} {"train_loss": -10.825704574584961, "global_step": 167797, "epoch": 998} {"train_loss": -11.001749038696289, "global_step": 167798, "epoch": 998} {"train_loss": -10.991222381591797, "global_step": 167799, "epoch": 998} {"train_loss": -10.217832565307617, "global_step": 167800, "epoch": 998} {"train_loss": -10.723932266235352, "global_step": 167801, "epoch": 998} {"train_loss": -10.461063385009766, "global_step": 167802, "epoch": 998} {"train_loss": -10.677024841308594, "global_step": 167803, "epoch": 998} {"train_loss": -9.659371376037598, "global_step": 167804, "epoch": 998} {"train_loss": -10.917325973510742, "global_step": 167805, "epoch": 998} {"train_loss": -8.673541069030762, "global_step": 167806, "epoch": 998} {"train_loss": -10.514887809753418, "global_step": 167807, "epoch": 998} {"train_loss": -8.78165340423584, "global_step": 167808, "epoch": 998} {"train_loss": -10.082602500915527, "global_step": 167809, "epoch": 998} {"train_loss": -10.268486022949219, "global_step": 167810, "epoch": 998} {"train_loss": -9.73238754272461, "global_step": 167811, "epoch": 998} {"train_loss": -10.749181747436523, "global_step": 167812, "epoch": 998} {"train_loss": -9.215773582458496, "global_step": 167813, "epoch": 998} {"train_loss": -10.62601375579834, "global_step": 167814, "epoch": 998} {"train_loss": -10.401012420654297, "global_step": 167815, "epoch": 998} {"train_loss": -10.754030227661133, "global_step": 167816, "epoch": 998} {"train_loss": -10.898193359375, "global_step": 167817, "epoch": 998} {"train_loss": -10.278986930847168, "global_step": 167818, "epoch": 998} {"train_loss": -10.808219909667969, "global_step": 167819, "epoch": 998} {"train_loss": -10.805240631103516, "global_step": 167820, "epoch": 998} {"train_loss": -10.958996772766113, "global_step": 167821, "epoch": 998} {"train_loss": -10.591470718383789, "global_step": 167822, "epoch": 998} {"train_loss": -10.589375495910645, "global_step": 167823, "epoch": 998} {"train_loss": -10.472051620483398, "global_step": 167824, "epoch": 998} {"train_loss": -10.618922233581543, "global_step": 167825, "epoch": 998} {"train_loss": -10.318577766418457, "global_step": 167826, "epoch": 998} {"train_loss": -10.828178405761719, "global_step": 167827, "epoch": 998} {"train_loss": -10.168134689331055, "global_step": 167828, "epoch": 998} {"train_loss": -10.774642944335938, "global_step": 167829, "epoch": 998} {"train_loss": -10.229846954345703, "global_step": 167830, "epoch": 998} {"train_loss": -10.86347344375792, "global_step": 167831, "epoch": 998, "val_loss": 237616.8125} {"train_loss": -10.972769737243652, "global_step": 167832, "epoch": 999} {"train_loss": -10.38479995727539, "global_step": 167833, "epoch": 999} {"train_loss": -10.834948539733887, "global_step": 167834, "epoch": 999} {"train_loss": -10.509584426879883, "global_step": 167835, "epoch": 999} {"train_loss": -10.278712272644043, "global_step": 167836, "epoch": 999} {"train_loss": -10.85611343383789, "global_step": 167837, "epoch": 999} {"train_loss": -10.862162590026855, "global_step": 167838, "epoch": 999} {"train_loss": -10.59414291381836, "global_step": 167839, "epoch": 999} {"train_loss": -10.985047340393066, "global_step": 167840, "epoch": 999} {"train_loss": -10.598346710205078, "global_step": 167841, "epoch": 999} {"train_loss": -10.922788619995117, "global_step": 167842, "epoch": 999} {"train_loss": -10.994254112243652, "global_step": 167843, "epoch": 999} {"train_loss": -10.572259902954102, "global_step": 167844, "epoch": 999} {"train_loss": -10.928268432617188, "global_step": 167845, "epoch": 999} {"train_loss": -11.084525108337402, "global_step": 167846, "epoch": 999} {"train_loss": -10.837991714477539, "global_step": 167847, "epoch": 999} {"train_loss": -11.18274211883545, "global_step": 167848, "epoch": 999} {"train_loss": -10.989084243774414, "global_step": 167849, "epoch": 999} {"train_loss": -11.243637084960938, "global_step": 167850, "epoch": 999} {"train_loss": -10.989198684692383, "global_step": 167851, "epoch": 999} {"train_loss": -10.901350021362305, "global_step": 167852, "epoch": 999} {"train_loss": -11.160972595214844, "global_step": 167853, "epoch": 999} {"train_loss": -10.77777099609375, "global_step": 167854, "epoch": 999} {"train_loss": -11.091390609741211, "global_step": 167855, "epoch": 999} {"train_loss": -11.135356903076172, "global_step": 167856, "epoch": 999} {"train_loss": -10.902217864990234, "global_step": 167857, "epoch": 999} {"train_loss": -11.16773796081543, "global_step": 167858, "epoch": 999} {"train_loss": -10.68213176727295, "global_step": 167859, "epoch": 999} {"train_loss": -11.091282844543457, "global_step": 167860, "epoch": 999} {"train_loss": -10.940524101257324, "global_step": 167861, "epoch": 999} {"train_loss": -11.059425354003906, "global_step": 167862, "epoch": 999} {"train_loss": -10.779492378234863, "global_step": 167863, "epoch": 999} {"train_loss": -11.340432167053223, "global_step": 167864, "epoch": 999} {"train_loss": -10.953187942504883, "global_step": 167865, "epoch": 999} {"train_loss": -11.030717849731445, "global_step": 167866, "epoch": 999} {"train_loss": -11.096065521240234, "global_step": 167867, "epoch": 999} {"train_loss": -10.968805313110352, "global_step": 167868, "epoch": 999} {"train_loss": -11.16104793548584, "global_step": 167869, "epoch": 999} {"train_loss": -10.892675399780273, "global_step": 167870, "epoch": 999} {"train_loss": -11.273252487182617, "global_step": 167871, "epoch": 999} {"train_loss": -11.053689956665039, "global_step": 167872, "epoch": 999} {"train_loss": -11.336225509643555, "global_step": 167873, "epoch": 999} {"train_loss": -10.915950775146484, "global_step": 167874, "epoch": 999} {"train_loss": -11.24409008026123, "global_step": 167875, "epoch": 999} {"train_loss": -11.390640258789062, "global_step": 167876, "epoch": 999} {"train_loss": -11.169143676757812, "global_step": 167877, "epoch": 999} {"train_loss": -11.180656433105469, "global_step": 167878, "epoch": 999} {"train_loss": -11.095926284790039, "global_step": 167879, "epoch": 999} {"train_loss": -11.180242538452148, "global_step": 167880, "epoch": 999} {"train_loss": -11.236724853515625, "global_step": 167881, "epoch": 999} {"train_loss": -11.459185600280762, "global_step": 167882, "epoch": 999} {"train_loss": -11.294670104980469, "global_step": 167883, "epoch": 999} {"train_loss": -11.2225923538208, "global_step": 167884, "epoch": 999} {"train_loss": -11.286898612976074, "global_step": 167885, "epoch": 999} {"train_loss": -11.506119728088379, "global_step": 167886, "epoch": 999} {"train_loss": -11.226705551147461, "global_step": 167887, "epoch": 999} {"train_loss": -11.523579597473145, "global_step": 167888, "epoch": 999} {"train_loss": -10.954729080200195, "global_step": 167889, "epoch": 999} {"train_loss": -10.808991432189941, "global_step": 167890, "epoch": 999} {"train_loss": -10.73483657836914, "global_step": 167891, "epoch": 999} {"train_loss": -11.185691833496094, "global_step": 167892, "epoch": 999} {"train_loss": -10.017928123474121, "global_step": 167893, "epoch": 999} {"train_loss": -10.43989086151123, "global_step": 167894, "epoch": 999} {"train_loss": -11.070892333984375, "global_step": 167895, "epoch": 999} {"train_loss": -10.770566940307617, "global_step": 167896, "epoch": 999} {"train_loss": -9.565298080444336, "global_step": 167897, "epoch": 999} {"train_loss": -11.176362991333008, "global_step": 167898, "epoch": 999} {"train_loss": -11.019759178161621, "global_step": 167899, "epoch": 999} {"train_loss": -10.638933181762695, "global_step": 167900, "epoch": 999} {"train_loss": -10.935970306396484, "global_step": 167901, "epoch": 999} {"train_loss": -10.736865997314453, "global_step": 167902, "epoch": 999} {"train_loss": -10.449494361877441, "global_step": 167903, "epoch": 999} {"train_loss": -11.168601989746094, "global_step": 167904, "epoch": 999} {"train_loss": -10.449442863464355, "global_step": 167905, "epoch": 999} {"train_loss": -10.907397270202637, "global_step": 167906, "epoch": 999} {"train_loss": -10.598793029785156, "global_step": 167907, "epoch": 999} {"train_loss": -10.60803508758545, "global_step": 167908, "epoch": 999} {"train_loss": -10.781238555908203, "global_step": 167909, "epoch": 999} {"train_loss": -10.870792388916016, "global_step": 167910, "epoch": 999} {"train_loss": -10.935308456420898, "global_step": 167911, "epoch": 999} {"train_loss": -10.895753860473633, "global_step": 167912, "epoch": 999} {"train_loss": -10.648871421813965, "global_step": 167913, "epoch": 999} {"train_loss": -10.976167678833008, "global_step": 167914, "epoch": 999} {"train_loss": -10.596555709838867, "global_step": 167915, "epoch": 999} {"train_loss": -10.972127914428711, "global_step": 167916, "epoch": 999} {"train_loss": -10.65074348449707, "global_step": 167917, "epoch": 999} {"train_loss": -10.575126647949219, "global_step": 167918, "epoch": 999} {"train_loss": -10.89765453338623, "global_step": 167919, "epoch": 999} {"train_loss": -10.787348747253418, "global_step": 167920, "epoch": 999} {"train_loss": -10.461207389831543, "global_step": 167921, "epoch": 999} {"train_loss": -10.476951599121094, "global_step": 167922, "epoch": 999} {"train_loss": -9.8536376953125, "global_step": 167923, "epoch": 999} {"train_loss": -10.48200798034668, "global_step": 167924, "epoch": 999} {"train_loss": -9.943977355957031, "global_step": 167925, "epoch": 999} {"train_loss": -10.78164291381836, "global_step": 167926, "epoch": 999} {"train_loss": -10.637124061584473, "global_step": 167927, "epoch": 999} {"train_loss": -10.432092666625977, "global_step": 167928, "epoch": 999} {"train_loss": -10.471946716308594, "global_step": 167929, "epoch": 999} {"train_loss": -10.277870178222656, "global_step": 167930, "epoch": 999} {"train_loss": -10.298016548156738, "global_step": 167931, "epoch": 999} {"train_loss": -10.659777641296387, "global_step": 167932, "epoch": 999} {"train_loss": -10.003732681274414, "global_step": 167933, "epoch": 999} {"train_loss": -10.805580139160156, "global_step": 167934, "epoch": 999} {"train_loss": -10.691198348999023, "global_step": 167935, "epoch": 999} {"train_loss": -10.577653884887695, "global_step": 167936, "epoch": 999} {"train_loss": -10.885549545288086, "global_step": 167937, "epoch": 999} {"train_loss": -10.56850814819336, "global_step": 167938, "epoch": 999} {"train_loss": -10.747081756591797, "global_step": 167939, "epoch": 999} {"train_loss": -10.685848236083984, "global_step": 167940, "epoch": 999} {"train_loss": -10.57960033416748, "global_step": 167941, "epoch": 999} {"train_loss": -10.899100303649902, "global_step": 167942, "epoch": 999} {"train_loss": -10.666086196899414, "global_step": 167943, "epoch": 999} {"train_loss": -10.893879890441895, "global_step": 167944, "epoch": 999} {"train_loss": -10.912012100219727, "global_step": 167945, "epoch": 999} {"train_loss": -10.96090316772461, "global_step": 167946, "epoch": 999} {"train_loss": -10.65818977355957, "global_step": 167947, "epoch": 999} {"train_loss": -11.129768371582031, "global_step": 167948, "epoch": 999} {"train_loss": -10.924076080322266, "global_step": 167949, "epoch": 999} {"train_loss": -10.470462799072266, "global_step": 167950, "epoch": 999} {"train_loss": -10.99693489074707, "global_step": 167951, "epoch": 999} {"train_loss": -10.79849624633789, "global_step": 167952, "epoch": 999} {"train_loss": -10.761320114135742, "global_step": 167953, "epoch": 999} {"train_loss": -11.094476699829102, "global_step": 167954, "epoch": 999} {"train_loss": -10.763589859008789, "global_step": 167955, "epoch": 999} {"train_loss": -11.05070686340332, "global_step": 167956, "epoch": 999} {"train_loss": -10.986860275268555, "global_step": 167957, "epoch": 999} {"train_loss": -11.035390853881836, "global_step": 167958, "epoch": 999} {"train_loss": -11.04391098022461, "global_step": 167959, "epoch": 999} {"train_loss": -11.015279769897461, "global_step": 167960, "epoch": 999} {"train_loss": -11.064204216003418, "global_step": 167961, "epoch": 999} {"train_loss": -11.127784729003906, "global_step": 167962, "epoch": 999} {"train_loss": -11.250137329101562, "global_step": 167963, "epoch": 999} {"train_loss": -10.737592697143555, "global_step": 167964, "epoch": 999} {"train_loss": -11.252449035644531, "global_step": 167965, "epoch": 999} {"train_loss": -11.207603454589844, "global_step": 167966, "epoch": 999} {"train_loss": -10.969698905944824, "global_step": 167967, "epoch": 999} {"train_loss": -11.134655952453613, "global_step": 167968, "epoch": 999} {"train_loss": -11.00190544128418, "global_step": 167969, "epoch": 999} {"train_loss": -11.39530086517334, "global_step": 167970, "epoch": 999} {"train_loss": -11.239208221435547, "global_step": 167971, "epoch": 999} {"train_loss": -11.195623397827148, "global_step": 167972, "epoch": 999} {"train_loss": -11.181564331054688, "global_step": 167973, "epoch": 999} {"train_loss": -11.360702514648438, "global_step": 167974, "epoch": 999} {"train_loss": -11.281496047973633, "global_step": 167975, "epoch": 999} {"train_loss": -11.28021240234375, "global_step": 167976, "epoch": 999} {"train_loss": -11.192136764526367, "global_step": 167977, "epoch": 999} {"train_loss": -11.319047927856445, "global_step": 167978, "epoch": 999} {"train_loss": -11.291370391845703, "global_step": 167979, "epoch": 999} {"train_loss": -11.229597091674805, "global_step": 167980, "epoch": 999} {"train_loss": -11.289012908935547, "global_step": 167981, "epoch": 999} {"train_loss": -11.402124404907227, "global_step": 167982, "epoch": 999} {"train_loss": -11.389507293701172, "global_step": 167983, "epoch": 999} {"train_loss": -11.309164047241211, "global_step": 167984, "epoch": 999} {"train_loss": -11.375593185424805, "global_step": 167985, "epoch": 999} {"train_loss": -11.39151382446289, "global_step": 167986, "epoch": 999} {"train_loss": -11.441757202148438, "global_step": 167987, "epoch": 999} {"train_loss": -11.199605941772461, "global_step": 167988, "epoch": 999} {"train_loss": -11.411087036132812, "global_step": 167989, "epoch": 999} {"train_loss": -11.288202285766602, "global_step": 167990, "epoch": 999} {"train_loss": -11.388740539550781, "global_step": 167991, "epoch": 999} {"train_loss": -11.484827041625977, "global_step": 167992, "epoch": 999} {"train_loss": -11.457897186279297, "global_step": 167993, "epoch": 999} {"train_loss": -11.591083526611328, "global_step": 167994, "epoch": 999} {"train_loss": -11.13746452331543, "global_step": 167995, "epoch": 999} {"train_loss": -11.0927734375, "global_step": 167996, "epoch": 999} {"train_loss": -11.194989204406738, "global_step": 167997, "epoch": 999} {"train_loss": -11.168062210083008, "global_step": 167998, "epoch": 999} {"train_loss": -10.946111565544491, "global_step": 167999, "epoch": 999, "val_loss": 241091.71875} {"train_loss": -11.221935272216797, "global_step": 168000, "epoch": 1000} {"train_loss": -10.504199981689453, "global_step": 168001, "epoch": 1000} {"train_loss": -10.175317764282227, "global_step": 168002, "epoch": 1000} {"train_loss": -10.975761413574219, "global_step": 168003, "epoch": 1000} {"train_loss": -10.016661643981934, "global_step": 168004, "epoch": 1000} {"train_loss": -10.225353240966797, "global_step": 168005, "epoch": 1000} {"train_loss": -10.20937728881836, "global_step": 168006, "epoch": 1000} {"train_loss": -9.555159568786621, "global_step": 168007, "epoch": 1000} {"train_loss": -10.169327735900879, "global_step": 168008, "epoch": 1000} {"train_loss": -10.525301933288574, "global_step": 168009, "epoch": 1000} {"train_loss": -10.368141174316406, "global_step": 168010, "epoch": 1000} {"train_loss": -9.50252914428711, "global_step": 168011, "epoch": 1000} {"train_loss": -10.398527145385742, "global_step": 168012, "epoch": 1000} {"train_loss": -10.339311599731445, "global_step": 168013, "epoch": 1000} {"train_loss": -9.786198616027832, "global_step": 168014, "epoch": 1000} {"train_loss": -10.727153778076172, "global_step": 168015, "epoch": 1000} {"train_loss": -8.470803260803223, "global_step": 168016, "epoch": 1000} {"train_loss": -10.212481498718262, "global_step": 168017, "epoch": 1000} {"train_loss": -9.257051467895508, "global_step": 168018, "epoch": 1000} {"train_loss": -9.739124298095703, "global_step": 168019, "epoch": 1000} {"train_loss": -10.393810272216797, "global_step": 168020, "epoch": 1000} {"train_loss": -9.975704193115234, "global_step": 168021, "epoch": 1000} {"train_loss": -10.540668487548828, "global_step": 168022, "epoch": 1000} {"train_loss": -9.921321868896484, "global_step": 168023, "epoch": 1000} {"train_loss": -10.426773071289062, "global_step": 168024, "epoch": 1000} {"train_loss": -10.51352310180664, "global_step": 168025, "epoch": 1000} {"train_loss": -10.7919340133667, "global_step": 168026, "epoch": 1000} {"train_loss": -10.438802719116211, "global_step": 168027, "epoch": 1000} {"train_loss": -10.858622550964355, "global_step": 168028, "epoch": 1000} {"train_loss": -10.647249221801758, "global_step": 168029, "epoch": 1000} {"train_loss": -10.767133712768555, "global_step": 168030, "epoch": 1000} {"train_loss": -10.707563400268555, "global_step": 168031, "epoch": 1000} {"train_loss": -10.75484848022461, "global_step": 168032, "epoch": 1000} {"train_loss": -10.884048461914062, "global_step": 168033, "epoch": 1000} {"train_loss": -10.969465255737305, "global_step": 168034, "epoch": 1000} {"train_loss": -10.837638854980469, "global_step": 168035, "epoch": 1000} {"train_loss": -10.681619644165039, "global_step": 168036, "epoch": 1000} {"train_loss": -11.199566841125488, "global_step": 168037, "epoch": 1000} {"train_loss": -10.791953086853027, "global_step": 168038, "epoch": 1000} {"train_loss": -10.913805961608887, "global_step": 168039, "epoch": 1000} {"train_loss": -10.989514350891113, "global_step": 168040, "epoch": 1000} {"train_loss": -10.807212829589844, "global_step": 168041, "epoch": 1000} {"train_loss": -10.899913787841797, "global_step": 168042, "epoch": 1000} {"train_loss": -10.917935371398926, "global_step": 168043, "epoch": 1000} {"train_loss": -11.02410888671875, "global_step": 168044, "epoch": 1000} {"train_loss": -10.883455276489258, "global_step": 168045, "epoch": 1000} {"train_loss": -10.90771484375, "global_step": 168046, "epoch": 1000} {"train_loss": -10.849776268005371, "global_step": 168047, "epoch": 1000} {"train_loss": -11.106071472167969, "global_step": 168048, "epoch": 1000} {"train_loss": -10.91595458984375, "global_step": 168049, "epoch": 1000} {"train_loss": -10.917924880981445, "global_step": 168050, "epoch": 1000} {"train_loss": -11.038348197937012, "global_step": 168051, "epoch": 1000} {"train_loss": -10.871304512023926, "global_step": 168052, "epoch": 1000} {"train_loss": -10.90903091430664, "global_step": 168053, "epoch": 1000} {"train_loss": -11.01321792602539, "global_step": 168054, "epoch": 1000} {"train_loss": -10.920228004455566, "global_step": 168055, "epoch": 1000} {"train_loss": -10.874185562133789, "global_step": 168056, "epoch": 1000} {"train_loss": -11.142681121826172, "global_step": 168057, "epoch": 1000} {"train_loss": -11.214208602905273, "global_step": 168058, "epoch": 1000} {"train_loss": -10.964622497558594, "global_step": 168059, "epoch": 1000} {"train_loss": -11.200370788574219, "global_step": 168060, "epoch": 1000} {"train_loss": -10.84520149230957, "global_step": 168061, "epoch": 1000} {"train_loss": -11.205965042114258, "global_step": 168062, "epoch": 1000} {"train_loss": -11.152385711669922, "global_step": 168063, "epoch": 1000} {"train_loss": -11.088850021362305, "global_step": 168064, "epoch": 1000} {"train_loss": -11.179286003112793, "global_step": 168065, "epoch": 1000} {"train_loss": -11.217561721801758, "global_step": 168066, "epoch": 1000} {"train_loss": -11.33517837524414, "global_step": 168067, "epoch": 1000} {"train_loss": -11.064154624938965, "global_step": 168068, "epoch": 1000} {"train_loss": -11.209413528442383, "global_step": 168069, "epoch": 1000} {"train_loss": -11.371293067932129, "global_step": 168070, "epoch": 1000} {"train_loss": -11.237712860107422, "global_step": 168071, "epoch": 1000} {"train_loss": -11.268409729003906, "global_step": 168072, "epoch": 1000} {"train_loss": -11.351306915283203, "global_step": 168073, "epoch": 1000} {"train_loss": -11.376554489135742, "global_step": 168074, "epoch": 1000} {"train_loss": -11.356853485107422, "global_step": 168075, "epoch": 1000} {"train_loss": -11.314567565917969, "global_step": 168076, "epoch": 1000} {"train_loss": -11.420150756835938, "global_step": 168077, "epoch": 1000} {"train_loss": -11.243510246276855, "global_step": 168078, "epoch": 1000} {"train_loss": -11.256235122680664, "global_step": 168079, "epoch": 1000} {"train_loss": -11.340089797973633, "global_step": 168080, "epoch": 1000} {"train_loss": -11.414571762084961, "global_step": 168081, "epoch": 1000} {"train_loss": -11.206920623779297, "global_step": 168082, "epoch": 1000} {"train_loss": -11.32061767578125, "global_step": 168083, "epoch": 1000} {"train_loss": -11.33132553100586, "global_step": 168084, "epoch": 1000} {"train_loss": -11.064765930175781, "global_step": 168085, "epoch": 1000} {"train_loss": -11.238935470581055, "global_step": 168086, "epoch": 1000} {"train_loss": -10.560504913330078, "global_step": 168087, "epoch": 1000} {"train_loss": -10.546452522277832, "global_step": 168088, "epoch": 1000} {"train_loss": -10.522197723388672, "global_step": 168089, "epoch": 1000} {"train_loss": -10.810636520385742, "global_step": 168090, "epoch": 1000} {"train_loss": -10.378755569458008, "global_step": 168091, "epoch": 1000} {"train_loss": -10.839759826660156, "global_step": 168092, "epoch": 1000} {"train_loss": -10.443103790283203, "global_step": 168093, "epoch": 1000} {"train_loss": -9.993067741394043, "global_step": 168094, "epoch": 1000} {"train_loss": -10.744237899780273, "global_step": 168095, "epoch": 1000} {"train_loss": -9.742959976196289, "global_step": 168096, "epoch": 1000} {"train_loss": -8.570779800415039, "global_step": 168097, "epoch": 1000} {"train_loss": -9.80721664428711, "global_step": 168098, "epoch": 1000} {"train_loss": -10.491588592529297, "global_step": 168099, "epoch": 1000} {"train_loss": -8.876754760742188, "global_step": 168100, "epoch": 1000} {"train_loss": -10.470474243164062, "global_step": 168101, "epoch": 1000} {"train_loss": -8.707023620605469, "global_step": 168102, "epoch": 1000} {"train_loss": -9.839014053344727, "global_step": 168103, "epoch": 1000} {"train_loss": -9.658112525939941, "global_step": 168104, "epoch": 1000} {"train_loss": -9.404870986938477, "global_step": 168105, "epoch": 1000} {"train_loss": -9.68661117553711, "global_step": 168106, "epoch": 1000} {"train_loss": -10.145160675048828, "global_step": 168107, "epoch": 1000} {"train_loss": -8.945419311523438, "global_step": 168108, "epoch": 1000} {"train_loss": -9.87032699584961, "global_step": 168109, "epoch": 1000} {"train_loss": -10.312692642211914, "global_step": 168110, "epoch": 1000} {"train_loss": -9.95149040222168, "global_step": 168111, "epoch": 1000} {"train_loss": -9.733989715576172, "global_step": 168112, "epoch": 1000} {"train_loss": -9.974223136901855, "global_step": 168113, "epoch": 1000} {"train_loss": -9.631200790405273, "global_step": 168114, "epoch": 1000} {"train_loss": -10.182701110839844, "global_step": 168115, "epoch": 1000} {"train_loss": -10.637588500976562, "global_step": 168116, "epoch": 1000} {"train_loss": -10.583640098571777, "global_step": 168117, "epoch": 1000} {"train_loss": -10.596627235412598, "global_step": 168118, "epoch": 1000} {"train_loss": -10.523880004882812, "global_step": 168119, "epoch": 1000} {"train_loss": -10.815908432006836, "global_step": 168120, "epoch": 1000} {"train_loss": -10.612688064575195, "global_step": 168121, "epoch": 1000} {"train_loss": -10.27864933013916, "global_step": 168122, "epoch": 1000} {"train_loss": -10.585801124572754, "global_step": 168123, "epoch": 1000} {"train_loss": -10.419208526611328, "global_step": 168124, "epoch": 1000} {"train_loss": -10.561315536499023, "global_step": 168125, "epoch": 1000} {"train_loss": -10.733851432800293, "global_step": 168126, "epoch": 1000} {"train_loss": -10.717738151550293, "global_step": 168127, "epoch": 1000} {"train_loss": -10.739078521728516, "global_step": 168128, "epoch": 1000} {"train_loss": -10.807053565979004, "global_step": 168129, "epoch": 1000} {"train_loss": -10.670965194702148, "global_step": 168130, "epoch": 1000} {"train_loss": -11.063897132873535, "global_step": 168131, "epoch": 1000} {"train_loss": -10.933065414428711, "global_step": 168132, "epoch": 1000} {"train_loss": -10.756841659545898, "global_step": 168133, "epoch": 1000} {"train_loss": -10.75476360321045, "global_step": 168134, "epoch": 1000} {"train_loss": -10.797574996948242, "global_step": 168135, "epoch": 1000} {"train_loss": -10.736982345581055, "global_step": 168136, "epoch": 1000} {"train_loss": -10.906399726867676, "global_step": 168137, "epoch": 1000} {"train_loss": -11.013710021972656, "global_step": 168138, "epoch": 1000} {"train_loss": -11.070019721984863, "global_step": 168139, "epoch": 1000} {"train_loss": -10.764734268188477, "global_step": 168140, "epoch": 1000} {"train_loss": -11.11961555480957, "global_step": 168141, "epoch": 1000} {"train_loss": -10.99612045288086, "global_step": 168142, "epoch": 1000} {"train_loss": -10.917047500610352, "global_step": 168143, "epoch": 1000} {"train_loss": -11.104751586914062, "global_step": 168144, "epoch": 1000} {"train_loss": -11.194171905517578, "global_step": 168145, "epoch": 1000} {"train_loss": -11.094667434692383, "global_step": 168146, "epoch": 1000} {"train_loss": -10.996026039123535, "global_step": 168147, "epoch": 1000} {"train_loss": -10.996339797973633, "global_step": 168148, "epoch": 1000} {"train_loss": -11.221098899841309, "global_step": 168149, "epoch": 1000} {"train_loss": -11.182087898254395, "global_step": 168150, "epoch": 1000} {"train_loss": -10.97030258178711, "global_step": 168151, "epoch": 1000} {"train_loss": -11.332950592041016, "global_step": 168152, "epoch": 1000} {"train_loss": -11.010242462158203, "global_step": 168153, "epoch": 1000} {"train_loss": -11.207517623901367, "global_step": 168154, "epoch": 1000} {"train_loss": -11.052224159240723, "global_step": 168155, "epoch": 1000} {"train_loss": -11.4292631149292, "global_step": 168156, "epoch": 1000} {"train_loss": -11.097935676574707, "global_step": 168157, "epoch": 1000} {"train_loss": -11.354047775268555, "global_step": 168158, "epoch": 1000} {"train_loss": -10.98748779296875, "global_step": 168159, "epoch": 1000} {"train_loss": -11.340736389160156, "global_step": 168160, "epoch": 1000} {"train_loss": -11.299684524536133, "global_step": 168161, "epoch": 1000} {"train_loss": -11.186233520507812, "global_step": 168162, "epoch": 1000} {"train_loss": -11.219375610351562, "global_step": 168163, "epoch": 1000} {"train_loss": -11.302473068237305, "global_step": 168164, "epoch": 1000} {"train_loss": -11.065778732299805, "global_step": 168165, "epoch": 1000} {"train_loss": -11.380704879760742, "global_step": 168166, "epoch": 1000} {"train_loss": -10.691411461148943, "global_step": 168167, "epoch": 1000, "train/sim_max_reward_0": 0.5032860928806826, "train/sim_max_reward_1": 0.9084017774907511, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.6532337277600182, "train/sim_max_reward_4": 0.03420504838247046, "train/sim_max_reward_5": 0.6314759671795821, "test/sim_max_reward_4400000": 0.9839731310302358, "test/sim_max_reward_4400001": 0.36410196591655064, "test/sim_max_reward_4400002": 0.06370394981487607, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.9394645934411335, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 0.26972539241140586, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.7165787155869648, "test/sim_max_reward_4400009": 0.3752433434780029, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 0.9962472099702273, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.953510556368557, "test/sim_max_reward_4400014": 0.6787210530138287, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9107512082138084, "test/sim_max_reward_4400019": 0.4950344796798975, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 1.0, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 1.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6039376016833723, "test/sim_max_reward_4400026": 0.05186311283631327, "test/sim_max_reward_4400027": 0.5604267590924903, "test/sim_max_reward_4400028": 1.0, "test/sim_max_reward_4400029": 0.6757784507360663, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9980901399324671, "test/sim_max_reward_4400032": 0.1623051927201185, "test/sim_max_reward_4400033": 0.6777778455841815, "test/sim_max_reward_4400034": 0.5273294011856833, "test/sim_max_reward_4400035": 1.0, "test/sim_max_reward_4400036": 0.37329132752935607, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.959007815806348, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.716081035245126, "test/sim_max_reward_4400042": 1.0, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.20565420780941668, "test/sim_max_reward_4400045": 0.4688764103992116, "test/sim_max_reward_4400046": 0.31625851470559585, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.4551004356155841, "test/mean_score": 0.6028450097323841, "val_loss": 236570.015625, "train_action_mse_error": 1.5465816259384155} {"train_loss": -11.291717529296875, "global_step": 168168, "epoch": 1001} {"train_loss": -10.996931076049805, "global_step": 168169, "epoch": 1001} {"train_loss": -11.32495403289795, "global_step": 168170, "epoch": 1001} {"train_loss": -11.231790542602539, "global_step": 168171, "epoch": 1001} {"train_loss": -11.416319847106934, "global_step": 168172, "epoch": 1001} {"train_loss": -11.180005073547363, "global_step": 168173, "epoch": 1001} {"train_loss": -11.034331321716309, "global_step": 168174, "epoch": 1001} {"train_loss": -11.19231128692627, "global_step": 168175, "epoch": 1001} {"train_loss": -10.937089920043945, "global_step": 168176, "epoch": 1001} {"train_loss": -11.267190933227539, "global_step": 168177, "epoch": 1001} {"train_loss": -11.220266342163086, "global_step": 168178, "epoch": 1001} {"train_loss": -11.045637130737305, "global_step": 168179, "epoch": 1001} {"train_loss": -11.447235107421875, "global_step": 168180, "epoch": 1001} {"train_loss": -10.826433181762695, "global_step": 168181, "epoch": 1001} {"train_loss": -11.317219734191895, "global_step": 168182, "epoch": 1001} {"train_loss": -11.164731979370117, "global_step": 168183, "epoch": 1001} {"train_loss": -11.330635070800781, "global_step": 168184, "epoch": 1001} {"train_loss": -11.442095756530762, "global_step": 168185, "epoch": 1001} {"train_loss": -10.820493698120117, "global_step": 168186, "epoch": 1001} {"train_loss": -10.852752685546875, "global_step": 168187, "epoch": 1001} {"train_loss": -11.146697998046875, "global_step": 168188, "epoch": 1001} {"train_loss": -10.676888465881348, "global_step": 168189, "epoch": 1001} {"train_loss": -10.103527069091797, "global_step": 168190, "epoch": 1001} {"train_loss": -10.707277297973633, "global_step": 168191, "epoch": 1001} {"train_loss": -10.737009048461914, "global_step": 168192, "epoch": 1001} {"train_loss": -10.613574981689453, "global_step": 168193, "epoch": 1001} {"train_loss": -9.44816780090332, "global_step": 168194, "epoch": 1001} {"train_loss": -10.534796714782715, "global_step": 168195, "epoch": 1001} {"train_loss": -10.543510437011719, "global_step": 168196, "epoch": 1001} {"train_loss": -10.372926712036133, "global_step": 168197, "epoch": 1001} {"train_loss": -10.51997184753418, "global_step": 168198, "epoch": 1001} {"train_loss": -10.472375869750977, "global_step": 168199, "epoch": 1001} {"train_loss": -10.896539688110352, "global_step": 168200, "epoch": 1001} {"train_loss": -10.288887023925781, "global_step": 168201, "epoch": 1001} {"train_loss": -10.656761169433594, "global_step": 168202, "epoch": 1001} {"train_loss": -10.311904907226562, "global_step": 168203, "epoch": 1001} {"train_loss": -10.689994812011719, "global_step": 168204, "epoch": 1001} {"train_loss": -10.742351531982422, "global_step": 168205, "epoch": 1001} {"train_loss": -10.674844741821289, "global_step": 168206, "epoch": 1001} {"train_loss": -11.175220489501953, "global_step": 168207, "epoch": 1001} {"train_loss": -10.8271484375, "global_step": 168208, "epoch": 1001} {"train_loss": -11.02135181427002, "global_step": 168209, "epoch": 1001} {"train_loss": -10.645263671875, "global_step": 168210, "epoch": 1001} {"train_loss": -10.833091735839844, "global_step": 168211, "epoch": 1001} {"train_loss": -10.9892578125, "global_step": 168212, "epoch": 1001} {"train_loss": -10.54611873626709, "global_step": 168213, "epoch": 1001} {"train_loss": -10.610370635986328, "global_step": 168214, "epoch": 1001} {"train_loss": -10.561630249023438, "global_step": 168215, "epoch": 1001} {"train_loss": -10.960663795471191, "global_step": 168216, "epoch": 1001} {"train_loss": -10.842782974243164, "global_step": 168217, "epoch": 1001} {"train_loss": -10.888561248779297, "global_step": 168218, "epoch": 1001} {"train_loss": -10.778732299804688, "global_step": 168219, "epoch": 1001} {"train_loss": -10.756041526794434, "global_step": 168220, "epoch": 1001} {"train_loss": -10.951692581176758, "global_step": 168221, "epoch": 1001} {"train_loss": -10.633857727050781, "global_step": 168222, "epoch": 1001} {"train_loss": -11.127817153930664, "global_step": 168223, "epoch": 1001} {"train_loss": -11.097050666809082, "global_step": 168224, "epoch": 1001} {"train_loss": -10.952765464782715, "global_step": 168225, "epoch": 1001} {"train_loss": -11.091148376464844, "global_step": 168226, "epoch": 1001} {"train_loss": -10.827692031860352, "global_step": 168227, "epoch": 1001} {"train_loss": -11.068916320800781, "global_step": 168228, "epoch": 1001} {"train_loss": -11.080756187438965, "global_step": 168229, "epoch": 1001} {"train_loss": -10.914741516113281, "global_step": 168230, "epoch": 1001} {"train_loss": -10.900423049926758, "global_step": 168231, "epoch": 1001} {"train_loss": -11.104613304138184, "global_step": 168232, "epoch": 1001} {"train_loss": -11.013368606567383, "global_step": 168233, "epoch": 1001} {"train_loss": -11.205132484436035, "global_step": 168234, "epoch": 1001} {"train_loss": -10.875244140625, "global_step": 168235, "epoch": 1001} {"train_loss": -11.198187828063965, "global_step": 168236, "epoch": 1001} {"train_loss": -11.116839408874512, "global_step": 168237, "epoch": 1001} {"train_loss": -11.119738578796387, "global_step": 168238, "epoch": 1001} {"train_loss": -11.139419555664062, "global_step": 168239, "epoch": 1001} {"train_loss": -11.13244915008545, "global_step": 168240, "epoch": 1001} {"train_loss": -11.143521308898926, "global_step": 168241, "epoch": 1001} {"train_loss": -10.966180801391602, "global_step": 168242, "epoch": 1001} {"train_loss": -11.03213119506836, "global_step": 168243, "epoch": 1001} {"train_loss": -10.803516387939453, "global_step": 168244, "epoch": 1001} {"train_loss": -11.067784309387207, "global_step": 168245, "epoch": 1001} {"train_loss": -10.729549407958984, "global_step": 168246, "epoch": 1001} {"train_loss": -10.515201568603516, "global_step": 168247, "epoch": 1001} {"train_loss": -10.953969955444336, "global_step": 168248, "epoch": 1001} {"train_loss": -10.517410278320312, "global_step": 168249, "epoch": 1001} {"train_loss": -10.583876609802246, "global_step": 168250, "epoch": 1001} {"train_loss": -10.774089813232422, "global_step": 168251, "epoch": 1001} {"train_loss": -10.850048065185547, "global_step": 168252, "epoch": 1001} {"train_loss": -10.98633861541748, "global_step": 168253, "epoch": 1001} {"train_loss": -10.556199073791504, "global_step": 168254, "epoch": 1001} {"train_loss": -10.686556816101074, "global_step": 168255, "epoch": 1001} {"train_loss": -10.387849807739258, "global_step": 168256, "epoch": 1001} {"train_loss": -10.777922630310059, "global_step": 168257, "epoch": 1001} {"train_loss": -10.93721866607666, "global_step": 168258, "epoch": 1001} {"train_loss": -10.787440299987793, "global_step": 168259, "epoch": 1001} {"train_loss": -10.745452880859375, "global_step": 168260, "epoch": 1001} {"train_loss": -10.580587387084961, "global_step": 168261, "epoch": 1001} {"train_loss": -10.647224426269531, "global_step": 168262, "epoch": 1001} {"train_loss": -10.987001419067383, "global_step": 168263, "epoch": 1001} {"train_loss": -10.654844284057617, "global_step": 168264, "epoch": 1001} {"train_loss": -10.645798683166504, "global_step": 168265, "epoch": 1001} {"train_loss": -10.384326934814453, "global_step": 168266, "epoch": 1001} {"train_loss": -10.865178108215332, "global_step": 168267, "epoch": 1001} {"train_loss": -10.588948249816895, "global_step": 168268, "epoch": 1001} {"train_loss": -11.167428016662598, "global_step": 168269, "epoch": 1001} {"train_loss": -11.018365859985352, "global_step": 168270, "epoch": 1001} {"train_loss": -10.976739883422852, "global_step": 168271, "epoch": 1001} {"train_loss": -11.19604778289795, "global_step": 168272, "epoch": 1001} {"train_loss": -10.711644172668457, "global_step": 168273, "epoch": 1001} {"train_loss": -11.14317798614502, "global_step": 168274, "epoch": 1001} {"train_loss": -10.786773681640625, "global_step": 168275, "epoch": 1001} {"train_loss": -11.150897026062012, "global_step": 168276, "epoch": 1001} {"train_loss": -10.875534057617188, "global_step": 168277, "epoch": 1001} {"train_loss": -11.137174606323242, "global_step": 168278, "epoch": 1001} {"train_loss": -10.878294944763184, "global_step": 168279, "epoch": 1001} {"train_loss": -11.097524642944336, "global_step": 168280, "epoch": 1001} {"train_loss": -10.797346115112305, "global_step": 168281, "epoch": 1001} {"train_loss": -11.168055534362793, "global_step": 168282, "epoch": 1001} {"train_loss": -10.886636734008789, "global_step": 168283, "epoch": 1001} {"train_loss": -10.7706880569458, "global_step": 168284, "epoch": 1001} {"train_loss": -10.79556655883789, "global_step": 168285, "epoch": 1001} {"train_loss": -11.313541412353516, "global_step": 168286, "epoch": 1001} {"train_loss": -10.515216827392578, "global_step": 168287, "epoch": 1001} {"train_loss": -11.30746841430664, "global_step": 168288, "epoch": 1001} {"train_loss": -11.01850700378418, "global_step": 168289, "epoch": 1001} {"train_loss": -10.908299446105957, "global_step": 168290, "epoch": 1001} {"train_loss": -11.256401062011719, "global_step": 168291, "epoch": 1001} {"train_loss": -11.015552520751953, "global_step": 168292, "epoch": 1001} {"train_loss": -10.704627990722656, "global_step": 168293, "epoch": 1001} {"train_loss": -11.208107948303223, "global_step": 168294, "epoch": 1001} {"train_loss": -10.672567367553711, "global_step": 168295, "epoch": 1001} {"train_loss": -10.847578048706055, "global_step": 168296, "epoch": 1001} {"train_loss": -11.100045204162598, "global_step": 168297, "epoch": 1001} {"train_loss": -10.917139053344727, "global_step": 168298, "epoch": 1001} {"train_loss": -11.094199180603027, "global_step": 168299, "epoch": 1001} {"train_loss": -11.02692985534668, "global_step": 168300, "epoch": 1001} {"train_loss": -11.00576114654541, "global_step": 168301, "epoch": 1001} {"train_loss": -11.067392349243164, "global_step": 168302, "epoch": 1001} {"train_loss": -10.905660629272461, "global_step": 168303, "epoch": 1001} {"train_loss": -11.079984664916992, "global_step": 168304, "epoch": 1001} {"train_loss": -11.23559284210205, "global_step": 168305, "epoch": 1001} {"train_loss": -11.038200378417969, "global_step": 168306, "epoch": 1001} {"train_loss": -11.195988655090332, "global_step": 168307, "epoch": 1001} {"train_loss": -11.243101119995117, "global_step": 168308, "epoch": 1001} {"train_loss": -11.190479278564453, "global_step": 168309, "epoch": 1001} {"train_loss": -11.057031631469727, "global_step": 168310, "epoch": 1001} {"train_loss": -11.156740188598633, "global_step": 168311, "epoch": 1001} {"train_loss": -11.147697448730469, "global_step": 168312, "epoch": 1001} {"train_loss": -11.030035018920898, "global_step": 168313, "epoch": 1001} {"train_loss": -11.265250205993652, "global_step": 168314, "epoch": 1001} {"train_loss": -10.981779098510742, "global_step": 168315, "epoch": 1001} {"train_loss": -11.16828441619873, "global_step": 168316, "epoch": 1001} {"train_loss": -10.747695922851562, "global_step": 168317, "epoch": 1001} {"train_loss": -11.317726135253906, "global_step": 168318, "epoch": 1001} {"train_loss": -10.806278228759766, "global_step": 168319, "epoch": 1001} {"train_loss": -10.799467086791992, "global_step": 168320, "epoch": 1001} {"train_loss": -11.180353164672852, "global_step": 168321, "epoch": 1001} {"train_loss": -10.854901313781738, "global_step": 168322, "epoch": 1001} {"train_loss": -11.172778129577637, "global_step": 168323, "epoch": 1001} {"train_loss": -11.237712860107422, "global_step": 168324, "epoch": 1001} {"train_loss": -10.620926856994629, "global_step": 168325, "epoch": 1001} {"train_loss": -11.118021011352539, "global_step": 168326, "epoch": 1001} {"train_loss": -11.124651908874512, "global_step": 168327, "epoch": 1001} {"train_loss": -10.855539321899414, "global_step": 168328, "epoch": 1001} {"train_loss": -11.183235168457031, "global_step": 168329, "epoch": 1001} {"train_loss": -10.471406936645508, "global_step": 168330, "epoch": 1001} {"train_loss": -11.26774787902832, "global_step": 168331, "epoch": 1001} {"train_loss": -11.061800956726074, "global_step": 168332, "epoch": 1001} {"train_loss": -11.366994857788086, "global_step": 168333, "epoch": 1001} {"train_loss": -11.006563186645508, "global_step": 168334, "epoch": 1001} {"train_loss": -10.925180599803017, "global_step": 168335, "epoch": 1001, "val_loss": 241041.1875} {"train_loss": -10.952638626098633, "global_step": 168336, "epoch": 1002} {"train_loss": -11.010250091552734, "global_step": 168337, "epoch": 1002} {"train_loss": -11.186640739440918, "global_step": 168338, "epoch": 1002} {"train_loss": -11.353485107421875, "global_step": 168339, "epoch": 1002} {"train_loss": -11.286399841308594, "global_step": 168340, "epoch": 1002} {"train_loss": -10.839381217956543, "global_step": 168341, "epoch": 1002} {"train_loss": -11.01121997833252, "global_step": 168342, "epoch": 1002} {"train_loss": -11.259315490722656, "global_step": 168343, "epoch": 1002} {"train_loss": -11.069087982177734, "global_step": 168344, "epoch": 1002} {"train_loss": -11.38090991973877, "global_step": 168345, "epoch": 1002} {"train_loss": -11.046116828918457, "global_step": 168346, "epoch": 1002} {"train_loss": -11.285516738891602, "global_step": 168347, "epoch": 1002} {"train_loss": -11.216451644897461, "global_step": 168348, "epoch": 1002} {"train_loss": -10.932744979858398, "global_step": 168349, "epoch": 1002} {"train_loss": -11.092305183410645, "global_step": 168350, "epoch": 1002} {"train_loss": -11.069948196411133, "global_step": 168351, "epoch": 1002} {"train_loss": -10.687703132629395, "global_step": 168352, "epoch": 1002} {"train_loss": -11.315058708190918, "global_step": 168353, "epoch": 1002} {"train_loss": -11.127154350280762, "global_step": 168354, "epoch": 1002} {"train_loss": -11.143404006958008, "global_step": 168355, "epoch": 1002} {"train_loss": -11.08171272277832, "global_step": 168356, "epoch": 1002} {"train_loss": -11.286394119262695, "global_step": 168357, "epoch": 1002} {"train_loss": -10.886089324951172, "global_step": 168358, "epoch": 1002} {"train_loss": -11.175912857055664, "global_step": 168359, "epoch": 1002} {"train_loss": -10.879922866821289, "global_step": 168360, "epoch": 1002} {"train_loss": -11.399544715881348, "global_step": 168361, "epoch": 1002} {"train_loss": -11.042375564575195, "global_step": 168362, "epoch": 1002} {"train_loss": -10.93759536743164, "global_step": 168363, "epoch": 1002} {"train_loss": -10.928775787353516, "global_step": 168364, "epoch": 1002} {"train_loss": -11.239404678344727, "global_step": 168365, "epoch": 1002} {"train_loss": -10.85002326965332, "global_step": 168366, "epoch": 1002} {"train_loss": -10.189502716064453, "global_step": 168367, "epoch": 1002} {"train_loss": -10.490962982177734, "global_step": 168368, "epoch": 1002} {"train_loss": -10.335427284240723, "global_step": 168369, "epoch": 1002} {"train_loss": -9.238452911376953, "global_step": 168370, "epoch": 1002} {"train_loss": -9.885294914245605, "global_step": 168371, "epoch": 1002} {"train_loss": -9.282732963562012, "global_step": 168372, "epoch": 1002} {"train_loss": -8.525888442993164, "global_step": 168373, "epoch": 1002} {"train_loss": -10.467275619506836, "global_step": 168374, "epoch": 1002} {"train_loss": -9.263293266296387, "global_step": 168375, "epoch": 1002} {"train_loss": -8.6409912109375, "global_step": 168376, "epoch": 1002} {"train_loss": -8.626962661743164, "global_step": 168377, "epoch": 1002} {"train_loss": -10.560468673706055, "global_step": 168378, "epoch": 1002} {"train_loss": -7.487543106079102, "global_step": 168379, "epoch": 1002} {"train_loss": -10.422351837158203, "global_step": 168380, "epoch": 1002} {"train_loss": -9.234329223632812, "global_step": 168381, "epoch": 1002} {"train_loss": -10.54959487915039, "global_step": 168382, "epoch": 1002} {"train_loss": -9.775792121887207, "global_step": 168383, "epoch": 1002} {"train_loss": -10.488264083862305, "global_step": 168384, "epoch": 1002} {"train_loss": -10.09830093383789, "global_step": 168385, "epoch": 1002} {"train_loss": -10.293822288513184, "global_step": 168386, "epoch": 1002} {"train_loss": -10.464226722717285, "global_step": 168387, "epoch": 1002} {"train_loss": -9.873376846313477, "global_step": 168388, "epoch": 1002} {"train_loss": -10.500720977783203, "global_step": 168389, "epoch": 1002} {"train_loss": -10.187161445617676, "global_step": 168390, "epoch": 1002} {"train_loss": -10.405454635620117, "global_step": 168391, "epoch": 1002} {"train_loss": -9.8287353515625, "global_step": 168392, "epoch": 1002} {"train_loss": -10.606555938720703, "global_step": 168393, "epoch": 1002} {"train_loss": -10.136738777160645, "global_step": 168394, "epoch": 1002} {"train_loss": -10.080848693847656, "global_step": 168395, "epoch": 1002} {"train_loss": -10.473014831542969, "global_step": 168396, "epoch": 1002} {"train_loss": -10.139860153198242, "global_step": 168397, "epoch": 1002} {"train_loss": -10.140494346618652, "global_step": 168398, "epoch": 1002} {"train_loss": -10.126044273376465, "global_step": 168399, "epoch": 1002} {"train_loss": -10.549449920654297, "global_step": 168400, "epoch": 1002} {"train_loss": -10.315624237060547, "global_step": 168401, "epoch": 1002} {"train_loss": -9.879746437072754, "global_step": 168402, "epoch": 1002} {"train_loss": -10.506036758422852, "global_step": 168403, "epoch": 1002} {"train_loss": -10.4044828414917, "global_step": 168404, "epoch": 1002} {"train_loss": -10.07422924041748, "global_step": 168405, "epoch": 1002} {"train_loss": -10.513113021850586, "global_step": 168406, "epoch": 1002} {"train_loss": -10.527205467224121, "global_step": 168407, "epoch": 1002} {"train_loss": -10.133654594421387, "global_step": 168408, "epoch": 1002} {"train_loss": -10.475273132324219, "global_step": 168409, "epoch": 1002} {"train_loss": -10.50490951538086, "global_step": 168410, "epoch": 1002} {"train_loss": -10.512633323669434, "global_step": 168411, "epoch": 1002} {"train_loss": -10.591856002807617, "global_step": 168412, "epoch": 1002} {"train_loss": -10.648472785949707, "global_step": 168413, "epoch": 1002} {"train_loss": -10.660663604736328, "global_step": 168414, "epoch": 1002} {"train_loss": -10.730260848999023, "global_step": 168415, "epoch": 1002} {"train_loss": -10.676580429077148, "global_step": 168416, "epoch": 1002} {"train_loss": -10.81237506866455, "global_step": 168417, "epoch": 1002} {"train_loss": -10.870020866394043, "global_step": 168418, "epoch": 1002} {"train_loss": -10.737447738647461, "global_step": 168419, "epoch": 1002} {"train_loss": -10.634758949279785, "global_step": 168420, "epoch": 1002} {"train_loss": -10.936966896057129, "global_step": 168421, "epoch": 1002} {"train_loss": -10.764595985412598, "global_step": 168422, "epoch": 1002} {"train_loss": -10.987147331237793, "global_step": 168423, "epoch": 1002} {"train_loss": -10.804224014282227, "global_step": 168424, "epoch": 1002} {"train_loss": -10.658916473388672, "global_step": 168425, "epoch": 1002} {"train_loss": -10.944446563720703, "global_step": 168426, "epoch": 1002} {"train_loss": -10.959585189819336, "global_step": 168427, "epoch": 1002} {"train_loss": -10.926813125610352, "global_step": 168428, "epoch": 1002} {"train_loss": -10.938526153564453, "global_step": 168429, "epoch": 1002} {"train_loss": -11.099926948547363, "global_step": 168430, "epoch": 1002} {"train_loss": -11.218700408935547, "global_step": 168431, "epoch": 1002} {"train_loss": -11.0300874710083, "global_step": 168432, "epoch": 1002} {"train_loss": -11.28016471862793, "global_step": 168433, "epoch": 1002} {"train_loss": -11.183696746826172, "global_step": 168434, "epoch": 1002} {"train_loss": -11.248766899108887, "global_step": 168435, "epoch": 1002} {"train_loss": -11.190265655517578, "global_step": 168436, "epoch": 1002} {"train_loss": -11.256102561950684, "global_step": 168437, "epoch": 1002} {"train_loss": -11.26435661315918, "global_step": 168438, "epoch": 1002} {"train_loss": -11.185386657714844, "global_step": 168439, "epoch": 1002} {"train_loss": -11.12966251373291, "global_step": 168440, "epoch": 1002} {"train_loss": -11.245661735534668, "global_step": 168441, "epoch": 1002} {"train_loss": -11.197378158569336, "global_step": 168442, "epoch": 1002} {"train_loss": -11.086040496826172, "global_step": 168443, "epoch": 1002} {"train_loss": -11.126338958740234, "global_step": 168444, "epoch": 1002} {"train_loss": -11.462028503417969, "global_step": 168445, "epoch": 1002} {"train_loss": -11.303587913513184, "global_step": 168446, "epoch": 1002} {"train_loss": -11.347363471984863, "global_step": 168447, "epoch": 1002} {"train_loss": -11.224123001098633, "global_step": 168448, "epoch": 1002} {"train_loss": -11.28443717956543, "global_step": 168449, "epoch": 1002} {"train_loss": -11.28365707397461, "global_step": 168450, "epoch": 1002} {"train_loss": -11.490152359008789, "global_step": 168451, "epoch": 1002} {"train_loss": -11.103425979614258, "global_step": 168452, "epoch": 1002} {"train_loss": -11.459012985229492, "global_step": 168453, "epoch": 1002} {"train_loss": -11.486151695251465, "global_step": 168454, "epoch": 1002} {"train_loss": -11.29364013671875, "global_step": 168455, "epoch": 1002} {"train_loss": -11.17220401763916, "global_step": 168456, "epoch": 1002} {"train_loss": -11.476177215576172, "global_step": 168457, "epoch": 1002} {"train_loss": -11.393987655639648, "global_step": 168458, "epoch": 1002} {"train_loss": -11.415721893310547, "global_step": 168459, "epoch": 1002} {"train_loss": -11.479608535766602, "global_step": 168460, "epoch": 1002} {"train_loss": -11.368406295776367, "global_step": 168461, "epoch": 1002} {"train_loss": -11.429401397705078, "global_step": 168462, "epoch": 1002} {"train_loss": -11.21383285522461, "global_step": 168463, "epoch": 1002} {"train_loss": -10.89393424987793, "global_step": 168464, "epoch": 1002} {"train_loss": -11.23392105102539, "global_step": 168465, "epoch": 1002} {"train_loss": -11.55003547668457, "global_step": 168466, "epoch": 1002} {"train_loss": -11.106809616088867, "global_step": 168467, "epoch": 1002} {"train_loss": -11.147035598754883, "global_step": 168468, "epoch": 1002} {"train_loss": -11.352998733520508, "global_step": 168469, "epoch": 1002} {"train_loss": -11.224594116210938, "global_step": 168470, "epoch": 1002} {"train_loss": -10.898754119873047, "global_step": 168471, "epoch": 1002} {"train_loss": -11.44332218170166, "global_step": 168472, "epoch": 1002} {"train_loss": -11.131324768066406, "global_step": 168473, "epoch": 1002} {"train_loss": -10.896282196044922, "global_step": 168474, "epoch": 1002} {"train_loss": -11.094659805297852, "global_step": 168475, "epoch": 1002} {"train_loss": -10.709924697875977, "global_step": 168476, "epoch": 1002} {"train_loss": -10.752374649047852, "global_step": 168477, "epoch": 1002} {"train_loss": -10.927295684814453, "global_step": 168478, "epoch": 1002} {"train_loss": -11.036808013916016, "global_step": 168479, "epoch": 1002} {"train_loss": -11.060665130615234, "global_step": 168480, "epoch": 1002} {"train_loss": -10.048277854919434, "global_step": 168481, "epoch": 1002} {"train_loss": -8.862298965454102, "global_step": 168482, "epoch": 1002} {"train_loss": -10.45098876953125, "global_step": 168483, "epoch": 1002} {"train_loss": -10.188918113708496, "global_step": 168484, "epoch": 1002} {"train_loss": -7.250088691711426, "global_step": 168485, "epoch": 1002} {"train_loss": -9.86695671081543, "global_step": 168486, "epoch": 1002} {"train_loss": -8.349873542785645, "global_step": 168487, "epoch": 1002} {"train_loss": -10.282660484313965, "global_step": 168488, "epoch": 1002} {"train_loss": -9.089814186096191, "global_step": 168489, "epoch": 1002} {"train_loss": -9.592351913452148, "global_step": 168490, "epoch": 1002} {"train_loss": -8.587892532348633, "global_step": 168491, "epoch": 1002} {"train_loss": -9.172224044799805, "global_step": 168492, "epoch": 1002} {"train_loss": -8.039617538452148, "global_step": 168493, "epoch": 1002} {"train_loss": -8.50685977935791, "global_step": 168494, "epoch": 1002} {"train_loss": -9.989469528198242, "global_step": 168495, "epoch": 1002} {"train_loss": -9.010528564453125, "global_step": 168496, "epoch": 1002} {"train_loss": -8.43970775604248, "global_step": 168497, "epoch": 1002} {"train_loss": -9.845279693603516, "global_step": 168498, "epoch": 1002} {"train_loss": -10.235698699951172, "global_step": 168499, "epoch": 1002} {"train_loss": -9.094018936157227, "global_step": 168500, "epoch": 1002} {"train_loss": -9.09338092803955, "global_step": 168501, "epoch": 1002} {"train_loss": -9.57009506225586, "global_step": 168502, "epoch": 1002} {"train_loss": -10.5653848250707, "global_step": 168503, "epoch": 1002, "val_loss": 234531.84375} {"train_loss": -9.031599044799805, "global_step": 168504, "epoch": 1003} {"train_loss": -10.086596488952637, "global_step": 168505, "epoch": 1003} {"train_loss": -10.043172836303711, "global_step": 168506, "epoch": 1003} {"train_loss": -9.924905776977539, "global_step": 168507, "epoch": 1003} {"train_loss": -9.6190767288208, "global_step": 168508, "epoch": 1003} {"train_loss": -9.885009765625, "global_step": 168509, "epoch": 1003} {"train_loss": -10.50721263885498, "global_step": 168510, "epoch": 1003} {"train_loss": -10.07887077331543, "global_step": 168511, "epoch": 1003} {"train_loss": -9.628616333007812, "global_step": 168512, "epoch": 1003} {"train_loss": -10.226293563842773, "global_step": 168513, "epoch": 1003} {"train_loss": -9.85976791381836, "global_step": 168514, "epoch": 1003} {"train_loss": -9.912827491760254, "global_step": 168515, "epoch": 1003} {"train_loss": -10.36691665649414, "global_step": 168516, "epoch": 1003} {"train_loss": -10.16025161743164, "global_step": 168517, "epoch": 1003} {"train_loss": -10.159706115722656, "global_step": 168518, "epoch": 1003} {"train_loss": -9.974876403808594, "global_step": 168519, "epoch": 1003} {"train_loss": -10.389947891235352, "global_step": 168520, "epoch": 1003} {"train_loss": -10.568114280700684, "global_step": 168521, "epoch": 1003} {"train_loss": -10.422192573547363, "global_step": 168522, "epoch": 1003} {"train_loss": -10.120170593261719, "global_step": 168523, "epoch": 1003} {"train_loss": -10.729681015014648, "global_step": 168524, "epoch": 1003} {"train_loss": -10.58366584777832, "global_step": 168525, "epoch": 1003} {"train_loss": -10.428119659423828, "global_step": 168526, "epoch": 1003} {"train_loss": -10.214981079101562, "global_step": 168527, "epoch": 1003} {"train_loss": -10.424367904663086, "global_step": 168528, "epoch": 1003} {"train_loss": -10.5966796875, "global_step": 168529, "epoch": 1003} {"train_loss": -10.55457878112793, "global_step": 168530, "epoch": 1003} {"train_loss": -10.583642959594727, "global_step": 168531, "epoch": 1003} {"train_loss": -10.717458724975586, "global_step": 168532, "epoch": 1003} {"train_loss": -10.379598617553711, "global_step": 168533, "epoch": 1003} {"train_loss": -10.433218955993652, "global_step": 168534, "epoch": 1003} {"train_loss": -10.611595153808594, "global_step": 168535, "epoch": 1003} {"train_loss": -10.628621101379395, "global_step": 168536, "epoch": 1003} {"train_loss": -10.726541519165039, "global_step": 168537, "epoch": 1003} {"train_loss": -10.851999282836914, "global_step": 168538, "epoch": 1003} {"train_loss": -10.667333602905273, "global_step": 168539, "epoch": 1003} {"train_loss": -10.899626731872559, "global_step": 168540, "epoch": 1003} {"train_loss": -10.659712791442871, "global_step": 168541, "epoch": 1003} {"train_loss": -10.8305025100708, "global_step": 168542, "epoch": 1003} {"train_loss": -10.686064720153809, "global_step": 168543, "epoch": 1003} {"train_loss": -10.844160079956055, "global_step": 168544, "epoch": 1003} {"train_loss": -10.860361099243164, "global_step": 168545, "epoch": 1003} {"train_loss": -10.943643569946289, "global_step": 168546, "epoch": 1003} {"train_loss": -10.69392204284668, "global_step": 168547, "epoch": 1003} {"train_loss": -10.795883178710938, "global_step": 168548, "epoch": 1003} {"train_loss": -10.789572715759277, "global_step": 168549, "epoch": 1003} {"train_loss": -10.908754348754883, "global_step": 168550, "epoch": 1003} {"train_loss": -11.08004379272461, "global_step": 168551, "epoch": 1003} {"train_loss": -11.007546424865723, "global_step": 168552, "epoch": 1003} {"train_loss": -11.162147521972656, "global_step": 168553, "epoch": 1003} {"train_loss": -10.886245727539062, "global_step": 168554, "epoch": 1003} {"train_loss": -11.158880233764648, "global_step": 168555, "epoch": 1003} {"train_loss": -10.884843826293945, "global_step": 168556, "epoch": 1003} {"train_loss": -11.121174812316895, "global_step": 168557, "epoch": 1003} {"train_loss": -11.099536895751953, "global_step": 168558, "epoch": 1003} {"train_loss": -11.060722351074219, "global_step": 168559, "epoch": 1003} {"train_loss": -11.041877746582031, "global_step": 168560, "epoch": 1003} {"train_loss": -11.235306739807129, "global_step": 168561, "epoch": 1003} {"train_loss": -10.80512523651123, "global_step": 168562, "epoch": 1003} {"train_loss": -11.07750129699707, "global_step": 168563, "epoch": 1003} {"train_loss": -11.270406723022461, "global_step": 168564, "epoch": 1003} {"train_loss": -11.29305362701416, "global_step": 168565, "epoch": 1003} {"train_loss": -11.277139663696289, "global_step": 168566, "epoch": 1003} {"train_loss": -11.112874031066895, "global_step": 168567, "epoch": 1003} {"train_loss": -11.036314964294434, "global_step": 168568, "epoch": 1003} {"train_loss": -11.24270248413086, "global_step": 168569, "epoch": 1003} {"train_loss": -10.80007266998291, "global_step": 168570, "epoch": 1003} {"train_loss": -11.45598030090332, "global_step": 168571, "epoch": 1003} {"train_loss": -11.258495330810547, "global_step": 168572, "epoch": 1003} {"train_loss": -11.131587982177734, "global_step": 168573, "epoch": 1003} {"train_loss": -11.274372100830078, "global_step": 168574, "epoch": 1003} {"train_loss": -11.21419906616211, "global_step": 168575, "epoch": 1003} {"train_loss": -11.182832717895508, "global_step": 168576, "epoch": 1003} {"train_loss": -10.967947006225586, "global_step": 168577, "epoch": 1003} {"train_loss": -11.012858390808105, "global_step": 168578, "epoch": 1003} {"train_loss": -11.139370918273926, "global_step": 168579, "epoch": 1003} {"train_loss": -10.837538719177246, "global_step": 168580, "epoch": 1003} {"train_loss": -11.009963989257812, "global_step": 168581, "epoch": 1003} {"train_loss": -11.236905097961426, "global_step": 168582, "epoch": 1003} {"train_loss": -11.165994644165039, "global_step": 168583, "epoch": 1003} {"train_loss": -11.255016326904297, "global_step": 168584, "epoch": 1003} {"train_loss": -11.156654357910156, "global_step": 168585, "epoch": 1003} {"train_loss": -11.20688247680664, "global_step": 168586, "epoch": 1003} {"train_loss": -11.078432083129883, "global_step": 168587, "epoch": 1003} {"train_loss": -11.23409652709961, "global_step": 168588, "epoch": 1003} {"train_loss": -10.934423446655273, "global_step": 168589, "epoch": 1003} {"train_loss": -11.426050186157227, "global_step": 168590, "epoch": 1003} {"train_loss": -11.313813209533691, "global_step": 168591, "epoch": 1003} {"train_loss": -11.40145492553711, "global_step": 168592, "epoch": 1003} {"train_loss": -11.353165626525879, "global_step": 168593, "epoch": 1003} {"train_loss": -11.092950820922852, "global_step": 168594, "epoch": 1003} {"train_loss": -11.033366203308105, "global_step": 168595, "epoch": 1003} {"train_loss": -11.195383071899414, "global_step": 168596, "epoch": 1003} {"train_loss": -11.29269027709961, "global_step": 168597, "epoch": 1003} {"train_loss": -11.3558349609375, "global_step": 168598, "epoch": 1003} {"train_loss": -11.43720817565918, "global_step": 168599, "epoch": 1003} {"train_loss": -11.035371780395508, "global_step": 168600, "epoch": 1003} {"train_loss": -11.31715202331543, "global_step": 168601, "epoch": 1003} {"train_loss": -11.028351783752441, "global_step": 168602, "epoch": 1003} {"train_loss": -11.3853759765625, "global_step": 168603, "epoch": 1003} {"train_loss": -11.338159561157227, "global_step": 168604, "epoch": 1003} {"train_loss": -10.2994384765625, "global_step": 168605, "epoch": 1003} {"train_loss": -10.535764694213867, "global_step": 168606, "epoch": 1003} {"train_loss": -11.000914573669434, "global_step": 168607, "epoch": 1003} {"train_loss": -10.797595977783203, "global_step": 168608, "epoch": 1003} {"train_loss": -10.344888687133789, "global_step": 168609, "epoch": 1003} {"train_loss": -11.189305305480957, "global_step": 168610, "epoch": 1003} {"train_loss": -11.080999374389648, "global_step": 168611, "epoch": 1003} {"train_loss": -10.901028633117676, "global_step": 168612, "epoch": 1003} {"train_loss": -11.055885314941406, "global_step": 168613, "epoch": 1003} {"train_loss": -10.237390518188477, "global_step": 168614, "epoch": 1003} {"train_loss": -10.62166976928711, "global_step": 168615, "epoch": 1003} {"train_loss": -11.005584716796875, "global_step": 168616, "epoch": 1003} {"train_loss": -9.94411849975586, "global_step": 168617, "epoch": 1003} {"train_loss": -10.087495803833008, "global_step": 168618, "epoch": 1003} {"train_loss": -9.868961334228516, "global_step": 168619, "epoch": 1003} {"train_loss": -9.995687484741211, "global_step": 168620, "epoch": 1003} {"train_loss": -10.610203742980957, "global_step": 168621, "epoch": 1003} {"train_loss": -10.435646057128906, "global_step": 168622, "epoch": 1003} {"train_loss": -10.140945434570312, "global_step": 168623, "epoch": 1003} {"train_loss": -10.178946495056152, "global_step": 168624, "epoch": 1003} {"train_loss": -10.23989200592041, "global_step": 168625, "epoch": 1003} {"train_loss": -10.12109088897705, "global_step": 168626, "epoch": 1003} {"train_loss": -9.739171028137207, "global_step": 168627, "epoch": 1003} {"train_loss": -9.523591995239258, "global_step": 168628, "epoch": 1003} {"train_loss": -10.303262710571289, "global_step": 168629, "epoch": 1003} {"train_loss": -9.983861923217773, "global_step": 168630, "epoch": 1003} {"train_loss": -9.703564643859863, "global_step": 168631, "epoch": 1003} {"train_loss": -10.227182388305664, "global_step": 168632, "epoch": 1003} {"train_loss": -9.287010192871094, "global_step": 168633, "epoch": 1003} {"train_loss": -9.872982025146484, "global_step": 168634, "epoch": 1003} {"train_loss": -10.260238647460938, "global_step": 168635, "epoch": 1003} {"train_loss": -10.0902099609375, "global_step": 168636, "epoch": 1003} {"train_loss": -10.527321815490723, "global_step": 168637, "epoch": 1003} {"train_loss": -10.417362213134766, "global_step": 168638, "epoch": 1003} {"train_loss": -10.356901168823242, "global_step": 168639, "epoch": 1003} {"train_loss": -10.326988220214844, "global_step": 168640, "epoch": 1003} {"train_loss": -10.384861946105957, "global_step": 168641, "epoch": 1003} {"train_loss": -10.478360176086426, "global_step": 168642, "epoch": 1003} {"train_loss": -10.420249938964844, "global_step": 168643, "epoch": 1003} {"train_loss": -10.613227844238281, "global_step": 168644, "epoch": 1003} {"train_loss": -10.3431396484375, "global_step": 168645, "epoch": 1003} {"train_loss": -10.384437561035156, "global_step": 168646, "epoch": 1003} {"train_loss": -10.756756782531738, "global_step": 168647, "epoch": 1003} {"train_loss": -10.518784523010254, "global_step": 168648, "epoch": 1003} {"train_loss": -10.39879322052002, "global_step": 168649, "epoch": 1003} {"train_loss": -10.793933868408203, "global_step": 168650, "epoch": 1003} {"train_loss": -10.502397537231445, "global_step": 168651, "epoch": 1003} {"train_loss": -10.771732330322266, "global_step": 168652, "epoch": 1003} {"train_loss": -10.654576301574707, "global_step": 168653, "epoch": 1003} {"train_loss": -10.85521125793457, "global_step": 168654, "epoch": 1003} {"train_loss": -10.698644638061523, "global_step": 168655, "epoch": 1003} {"train_loss": -10.803770065307617, "global_step": 168656, "epoch": 1003} {"train_loss": -11.041842460632324, "global_step": 168657, "epoch": 1003} {"train_loss": -10.759977340698242, "global_step": 168658, "epoch": 1003} {"train_loss": -10.732370376586914, "global_step": 168659, "epoch": 1003} {"train_loss": -10.67529582977295, "global_step": 168660, "epoch": 1003} {"train_loss": -10.949579238891602, "global_step": 168661, "epoch": 1003} {"train_loss": -11.025679588317871, "global_step": 168662, "epoch": 1003} {"train_loss": -10.76895523071289, "global_step": 168663, "epoch": 1003} {"train_loss": -10.83665943145752, "global_step": 168664, "epoch": 1003} {"train_loss": -10.709392547607422, "global_step": 168665, "epoch": 1003} {"train_loss": -11.158519744873047, "global_step": 168666, "epoch": 1003} {"train_loss": -10.672104835510254, "global_step": 168667, "epoch": 1003} {"train_loss": -10.996088027954102, "global_step": 168668, "epoch": 1003} {"train_loss": -11.062894821166992, "global_step": 168669, "epoch": 1003} {"train_loss": -11.099404335021973, "global_step": 168670, "epoch": 1003} {"train_loss": -10.687759722982134, "global_step": 168671, "epoch": 1003, "val_loss": 239215.796875} {"train_loss": -11.111952781677246, "global_step": 168672, "epoch": 1004} {"train_loss": -11.132097244262695, "global_step": 168673, "epoch": 1004} {"train_loss": -11.12778091430664, "global_step": 168674, "epoch": 1004} {"train_loss": -11.25900650024414, "global_step": 168675, "epoch": 1004} {"train_loss": -11.292972564697266, "global_step": 168676, "epoch": 1004} {"train_loss": -11.16151237487793, "global_step": 168677, "epoch": 1004} {"train_loss": -11.170352935791016, "global_step": 168678, "epoch": 1004} {"train_loss": -11.19896125793457, "global_step": 168679, "epoch": 1004} {"train_loss": -11.291720390319824, "global_step": 168680, "epoch": 1004} {"train_loss": -11.224483489990234, "global_step": 168681, "epoch": 1004} {"train_loss": -11.18967342376709, "global_step": 168682, "epoch": 1004} {"train_loss": -11.22158432006836, "global_step": 168683, "epoch": 1004} {"train_loss": -11.301385879516602, "global_step": 168684, "epoch": 1004} {"train_loss": -11.292534828186035, "global_step": 168685, "epoch": 1004} {"train_loss": -11.183150291442871, "global_step": 168686, "epoch": 1004} {"train_loss": -11.257559776306152, "global_step": 168687, "epoch": 1004} {"train_loss": -11.374761581420898, "global_step": 168688, "epoch": 1004} {"train_loss": -11.24955940246582, "global_step": 168689, "epoch": 1004} {"train_loss": -11.540338516235352, "global_step": 168690, "epoch": 1004} {"train_loss": -11.391385078430176, "global_step": 168691, "epoch": 1004} {"train_loss": -11.350521087646484, "global_step": 168692, "epoch": 1004} {"train_loss": -11.29166316986084, "global_step": 168693, "epoch": 1004} {"train_loss": -11.19791030883789, "global_step": 168694, "epoch": 1004} {"train_loss": -11.457940101623535, "global_step": 168695, "epoch": 1004} {"train_loss": -11.535116195678711, "global_step": 168696, "epoch": 1004} {"train_loss": -11.276055335998535, "global_step": 168697, "epoch": 1004} {"train_loss": -11.420557975769043, "global_step": 168698, "epoch": 1004} {"train_loss": -11.332767486572266, "global_step": 168699, "epoch": 1004} {"train_loss": -11.356010437011719, "global_step": 168700, "epoch": 1004} {"train_loss": -11.260990142822266, "global_step": 168701, "epoch": 1004} {"train_loss": -11.29134750366211, "global_step": 168702, "epoch": 1004} {"train_loss": -10.812387466430664, "global_step": 168703, "epoch": 1004} {"train_loss": -11.464043617248535, "global_step": 168704, "epoch": 1004} {"train_loss": -11.558317184448242, "global_step": 168705, "epoch": 1004} {"train_loss": -11.046463012695312, "global_step": 168706, "epoch": 1004} {"train_loss": -11.261531829833984, "global_step": 168707, "epoch": 1004} {"train_loss": -11.393316268920898, "global_step": 168708, "epoch": 1004} {"train_loss": -11.38996696472168, "global_step": 168709, "epoch": 1004} {"train_loss": -11.210336685180664, "global_step": 168710, "epoch": 1004} {"train_loss": -10.546998977661133, "global_step": 168711, "epoch": 1004} {"train_loss": -10.411722183227539, "global_step": 168712, "epoch": 1004} {"train_loss": -10.692171096801758, "global_step": 168713, "epoch": 1004} {"train_loss": -10.401786804199219, "global_step": 168714, "epoch": 1004} {"train_loss": -9.391003608703613, "global_step": 168715, "epoch": 1004} {"train_loss": -11.253707885742188, "global_step": 168716, "epoch": 1004} {"train_loss": -10.37657356262207, "global_step": 168717, "epoch": 1004} {"train_loss": -9.58387565612793, "global_step": 168718, "epoch": 1004} {"train_loss": -10.859845161437988, "global_step": 168719, "epoch": 1004} {"train_loss": -9.708080291748047, "global_step": 168720, "epoch": 1004} {"train_loss": -10.4676513671875, "global_step": 168721, "epoch": 1004} {"train_loss": -10.573486328125, "global_step": 168722, "epoch": 1004} {"train_loss": -9.87744426727295, "global_step": 168723, "epoch": 1004} {"train_loss": -10.758733749389648, "global_step": 168724, "epoch": 1004} {"train_loss": -10.641931533813477, "global_step": 168725, "epoch": 1004} {"train_loss": -10.763660430908203, "global_step": 168726, "epoch": 1004} {"train_loss": -10.91777229309082, "global_step": 168727, "epoch": 1004} {"train_loss": -10.412668228149414, "global_step": 168728, "epoch": 1004} {"train_loss": -10.84830379486084, "global_step": 168729, "epoch": 1004} {"train_loss": -10.723991394042969, "global_step": 168730, "epoch": 1004} {"train_loss": -10.965831756591797, "global_step": 168731, "epoch": 1004} {"train_loss": -10.795516967773438, "global_step": 168732, "epoch": 1004} {"train_loss": -10.92939567565918, "global_step": 168733, "epoch": 1004} {"train_loss": -11.027632713317871, "global_step": 168734, "epoch": 1004} {"train_loss": -10.751870155334473, "global_step": 168735, "epoch": 1004} {"train_loss": -10.57016372680664, "global_step": 168736, "epoch": 1004} {"train_loss": -10.921501159667969, "global_step": 168737, "epoch": 1004} {"train_loss": -10.189361572265625, "global_step": 168738, "epoch": 1004} {"train_loss": -10.657135009765625, "global_step": 168739, "epoch": 1004} {"train_loss": -10.75561809539795, "global_step": 168740, "epoch": 1004} {"train_loss": -10.683598518371582, "global_step": 168741, "epoch": 1004} {"train_loss": -10.728538513183594, "global_step": 168742, "epoch": 1004} {"train_loss": -10.1349458694458, "global_step": 168743, "epoch": 1004} {"train_loss": -10.716756820678711, "global_step": 168744, "epoch": 1004} {"train_loss": -10.745922088623047, "global_step": 168745, "epoch": 1004} {"train_loss": -10.785585403442383, "global_step": 168746, "epoch": 1004} {"train_loss": -10.702669143676758, "global_step": 168747, "epoch": 1004} {"train_loss": -10.906652450561523, "global_step": 168748, "epoch": 1004} {"train_loss": -10.84719467163086, "global_step": 168749, "epoch": 1004} {"train_loss": -11.098541259765625, "global_step": 168750, "epoch": 1004} {"train_loss": -10.857276916503906, "global_step": 168751, "epoch": 1004} {"train_loss": -10.913311958312988, "global_step": 168752, "epoch": 1004} {"train_loss": -11.009576797485352, "global_step": 168753, "epoch": 1004} {"train_loss": -11.104228019714355, "global_step": 168754, "epoch": 1004} {"train_loss": -10.925455093383789, "global_step": 168755, "epoch": 1004} {"train_loss": -10.942516326904297, "global_step": 168756, "epoch": 1004} {"train_loss": -11.103363990783691, "global_step": 168757, "epoch": 1004} {"train_loss": -11.206483840942383, "global_step": 168758, "epoch": 1004} {"train_loss": -10.994913101196289, "global_step": 168759, "epoch": 1004} {"train_loss": -11.216432571411133, "global_step": 168760, "epoch": 1004} {"train_loss": -11.16329574584961, "global_step": 168761, "epoch": 1004} {"train_loss": -11.00395393371582, "global_step": 168762, "epoch": 1004} {"train_loss": -11.259603500366211, "global_step": 168763, "epoch": 1004} {"train_loss": -11.174593925476074, "global_step": 168764, "epoch": 1004} {"train_loss": -11.252046585083008, "global_step": 168765, "epoch": 1004} {"train_loss": -11.126592636108398, "global_step": 168766, "epoch": 1004} {"train_loss": -11.004257202148438, "global_step": 168767, "epoch": 1004} {"train_loss": -11.108692169189453, "global_step": 168768, "epoch": 1004} {"train_loss": -11.31348705291748, "global_step": 168769, "epoch": 1004} {"train_loss": -11.082647323608398, "global_step": 168770, "epoch": 1004} {"train_loss": -11.330934524536133, "global_step": 168771, "epoch": 1004} {"train_loss": -11.219118118286133, "global_step": 168772, "epoch": 1004} {"train_loss": -11.388863563537598, "global_step": 168773, "epoch": 1004} {"train_loss": -11.179170608520508, "global_step": 168774, "epoch": 1004} {"train_loss": -11.170915603637695, "global_step": 168775, "epoch": 1004} {"train_loss": -11.376472473144531, "global_step": 168776, "epoch": 1004} {"train_loss": -11.314016342163086, "global_step": 168777, "epoch": 1004} {"train_loss": -11.203474044799805, "global_step": 168778, "epoch": 1004} {"train_loss": -11.487373352050781, "global_step": 168779, "epoch": 1004} {"train_loss": -11.420575141906738, "global_step": 168780, "epoch": 1004} {"train_loss": -11.268640518188477, "global_step": 168781, "epoch": 1004} {"train_loss": -11.34572696685791, "global_step": 168782, "epoch": 1004} {"train_loss": -11.470725059509277, "global_step": 168783, "epoch": 1004} {"train_loss": -11.274284362792969, "global_step": 168784, "epoch": 1004} {"train_loss": -11.33515739440918, "global_step": 168785, "epoch": 1004} {"train_loss": -11.143346786499023, "global_step": 168786, "epoch": 1004} {"train_loss": -11.549203872680664, "global_step": 168787, "epoch": 1004} {"train_loss": -11.362095832824707, "global_step": 168788, "epoch": 1004} {"train_loss": -11.296052932739258, "global_step": 168789, "epoch": 1004} {"train_loss": -11.111209869384766, "global_step": 168790, "epoch": 1004} {"train_loss": -11.332527160644531, "global_step": 168791, "epoch": 1004} {"train_loss": -10.641345977783203, "global_step": 168792, "epoch": 1004} {"train_loss": -11.047521591186523, "global_step": 168793, "epoch": 1004} {"train_loss": -11.042991638183594, "global_step": 168794, "epoch": 1004} {"train_loss": -10.715633392333984, "global_step": 168795, "epoch": 1004} {"train_loss": -10.711627960205078, "global_step": 168796, "epoch": 1004} {"train_loss": -10.465290069580078, "global_step": 168797, "epoch": 1004} {"train_loss": -10.158636093139648, "global_step": 168798, "epoch": 1004} {"train_loss": -8.956913948059082, "global_step": 168799, "epoch": 1004} {"train_loss": -9.674585342407227, "global_step": 168800, "epoch": 1004} {"train_loss": -10.602502822875977, "global_step": 168801, "epoch": 1004} {"train_loss": -10.221920013427734, "global_step": 168802, "epoch": 1004} {"train_loss": -10.109426498413086, "global_step": 168803, "epoch": 1004} {"train_loss": -10.864526748657227, "global_step": 168804, "epoch": 1004} {"train_loss": -10.83268928527832, "global_step": 168805, "epoch": 1004} {"train_loss": -10.76805305480957, "global_step": 168806, "epoch": 1004} {"train_loss": -10.433611869812012, "global_step": 168807, "epoch": 1004} {"train_loss": -11.031545639038086, "global_step": 168808, "epoch": 1004} {"train_loss": -10.489261627197266, "global_step": 168809, "epoch": 1004} {"train_loss": -10.087058067321777, "global_step": 168810, "epoch": 1004} {"train_loss": -10.09817886352539, "global_step": 168811, "epoch": 1004} {"train_loss": -10.931794166564941, "global_step": 168812, "epoch": 1004} {"train_loss": -10.990992546081543, "global_step": 168813, "epoch": 1004} {"train_loss": -10.88475227355957, "global_step": 168814, "epoch": 1004} {"train_loss": -10.942180633544922, "global_step": 168815, "epoch": 1004} {"train_loss": -10.761652946472168, "global_step": 168816, "epoch": 1004} {"train_loss": -10.714210510253906, "global_step": 168817, "epoch": 1004} {"train_loss": -10.793648719787598, "global_step": 168818, "epoch": 1004} {"train_loss": -10.602436065673828, "global_step": 168819, "epoch": 1004} {"train_loss": -10.974815368652344, "global_step": 168820, "epoch": 1004} {"train_loss": -10.850478172302246, "global_step": 168821, "epoch": 1004} {"train_loss": -10.70619010925293, "global_step": 168822, "epoch": 1004} {"train_loss": -10.03235149383545, "global_step": 168823, "epoch": 1004} {"train_loss": -10.017431259155273, "global_step": 168824, "epoch": 1004} {"train_loss": -10.73493480682373, "global_step": 168825, "epoch": 1004} {"train_loss": -10.402975082397461, "global_step": 168826, "epoch": 1004} {"train_loss": -10.647476196289062, "global_step": 168827, "epoch": 1004} {"train_loss": -9.958686828613281, "global_step": 168828, "epoch": 1004} {"train_loss": -10.60224723815918, "global_step": 168829, "epoch": 1004} {"train_loss": -9.807981491088867, "global_step": 168830, "epoch": 1004} {"train_loss": -10.284181594848633, "global_step": 168831, "epoch": 1004} {"train_loss": -9.565752029418945, "global_step": 168832, "epoch": 1004} {"train_loss": -10.446439743041992, "global_step": 168833, "epoch": 1004} {"train_loss": -9.365636825561523, "global_step": 168834, "epoch": 1004} {"train_loss": -10.511345863342285, "global_step": 168835, "epoch": 1004} {"train_loss": -9.927312850952148, "global_step": 168836, "epoch": 1004} {"train_loss": -10.10666275024414, "global_step": 168837, "epoch": 1004} {"train_loss": -9.79018497467041, "global_step": 168838, "epoch": 1004} {"train_loss": -10.857207133656456, "global_step": 168839, "epoch": 1004, "val_loss": 228607.640625} {"train_loss": -10.170671463012695, "global_step": 168840, "epoch": 1005} {"train_loss": -9.240697860717773, "global_step": 168841, "epoch": 1005} {"train_loss": -10.687603950500488, "global_step": 168842, "epoch": 1005} {"train_loss": -9.53813362121582, "global_step": 168843, "epoch": 1005} {"train_loss": -10.005287170410156, "global_step": 168844, "epoch": 1005} {"train_loss": -10.209691047668457, "global_step": 168845, "epoch": 1005} {"train_loss": -9.394491195678711, "global_step": 168846, "epoch": 1005} {"train_loss": -10.023384094238281, "global_step": 168847, "epoch": 1005} {"train_loss": -9.821887969970703, "global_step": 168848, "epoch": 1005} {"train_loss": -10.629074096679688, "global_step": 168849, "epoch": 1005} {"train_loss": -10.287727355957031, "global_step": 168850, "epoch": 1005} {"train_loss": -10.017396926879883, "global_step": 168851, "epoch": 1005} {"train_loss": -10.708457946777344, "global_step": 168852, "epoch": 1005} {"train_loss": -10.330181121826172, "global_step": 168853, "epoch": 1005} {"train_loss": -10.311704635620117, "global_step": 168854, "epoch": 1005} {"train_loss": -10.505104064941406, "global_step": 168855, "epoch": 1005} {"train_loss": -10.135309219360352, "global_step": 168856, "epoch": 1005} {"train_loss": -10.623601913452148, "global_step": 168857, "epoch": 1005} {"train_loss": -10.425360679626465, "global_step": 168858, "epoch": 1005} {"train_loss": -10.32598876953125, "global_step": 168859, "epoch": 1005} {"train_loss": -10.747020721435547, "global_step": 168860, "epoch": 1005} {"train_loss": -10.477948188781738, "global_step": 168861, "epoch": 1005} {"train_loss": -10.508684158325195, "global_step": 168862, "epoch": 1005} {"train_loss": -10.725744247436523, "global_step": 168863, "epoch": 1005} {"train_loss": -10.633489608764648, "global_step": 168864, "epoch": 1005} {"train_loss": -10.704524040222168, "global_step": 168865, "epoch": 1005} {"train_loss": -10.472311973571777, "global_step": 168866, "epoch": 1005} {"train_loss": -10.315471649169922, "global_step": 168867, "epoch": 1005} {"train_loss": -10.859062194824219, "global_step": 168868, "epoch": 1005} {"train_loss": -10.428616523742676, "global_step": 168869, "epoch": 1005} {"train_loss": -10.714367866516113, "global_step": 168870, "epoch": 1005} {"train_loss": -10.908387184143066, "global_step": 168871, "epoch": 1005} {"train_loss": -10.55162525177002, "global_step": 168872, "epoch": 1005} {"train_loss": -10.912221908569336, "global_step": 168873, "epoch": 1005} {"train_loss": -10.725217819213867, "global_step": 168874, "epoch": 1005} {"train_loss": -10.664986610412598, "global_step": 168875, "epoch": 1005} {"train_loss": -10.980167388916016, "global_step": 168876, "epoch": 1005} {"train_loss": -10.827384948730469, "global_step": 168877, "epoch": 1005} {"train_loss": -10.919408798217773, "global_step": 168878, "epoch": 1005} {"train_loss": -10.925701141357422, "global_step": 168879, "epoch": 1005} {"train_loss": -10.849205017089844, "global_step": 168880, "epoch": 1005} {"train_loss": -10.811867713928223, "global_step": 168881, "epoch": 1005} {"train_loss": -10.772357940673828, "global_step": 168882, "epoch": 1005} {"train_loss": -10.809398651123047, "global_step": 168883, "epoch": 1005} {"train_loss": -10.82273006439209, "global_step": 168884, "epoch": 1005} {"train_loss": -10.92674446105957, "global_step": 168885, "epoch": 1005} {"train_loss": -10.927128791809082, "global_step": 168886, "epoch": 1005} {"train_loss": -11.135541915893555, "global_step": 168887, "epoch": 1005} {"train_loss": -10.946024894714355, "global_step": 168888, "epoch": 1005} {"train_loss": -11.040637969970703, "global_step": 168889, "epoch": 1005} {"train_loss": -10.963688850402832, "global_step": 168890, "epoch": 1005} {"train_loss": -11.146920204162598, "global_step": 168891, "epoch": 1005} {"train_loss": -11.219276428222656, "global_step": 168892, "epoch": 1005} {"train_loss": -11.14533519744873, "global_step": 168893, "epoch": 1005} {"train_loss": -11.210524559020996, "global_step": 168894, "epoch": 1005} {"train_loss": -11.12491226196289, "global_step": 168895, "epoch": 1005} {"train_loss": -11.12038516998291, "global_step": 168896, "epoch": 1005} {"train_loss": -10.959196090698242, "global_step": 168897, "epoch": 1005} {"train_loss": -11.311124801635742, "global_step": 168898, "epoch": 1005} {"train_loss": -11.170698165893555, "global_step": 168899, "epoch": 1005} {"train_loss": -11.148872375488281, "global_step": 168900, "epoch": 1005} {"train_loss": -11.392068862915039, "global_step": 168901, "epoch": 1005} {"train_loss": -11.252697944641113, "global_step": 168902, "epoch": 1005} {"train_loss": -11.28559684753418, "global_step": 168903, "epoch": 1005} {"train_loss": -11.238781929016113, "global_step": 168904, "epoch": 1005} {"train_loss": -11.302413940429688, "global_step": 168905, "epoch": 1005} {"train_loss": -11.344964981079102, "global_step": 168906, "epoch": 1005} {"train_loss": -11.18869686126709, "global_step": 168907, "epoch": 1005} {"train_loss": -11.350597381591797, "global_step": 168908, "epoch": 1005} {"train_loss": -11.414130210876465, "global_step": 168909, "epoch": 1005} {"train_loss": -11.251373291015625, "global_step": 168910, "epoch": 1005} {"train_loss": -11.181661605834961, "global_step": 168911, "epoch": 1005} {"train_loss": -11.382329940795898, "global_step": 168912, "epoch": 1005} {"train_loss": -11.331348419189453, "global_step": 168913, "epoch": 1005} {"train_loss": -11.503499984741211, "global_step": 168914, "epoch": 1005} {"train_loss": -10.766960144042969, "global_step": 168915, "epoch": 1005} {"train_loss": -11.239107131958008, "global_step": 168916, "epoch": 1005} {"train_loss": -11.19552993774414, "global_step": 168917, "epoch": 1005} {"train_loss": -11.164285659790039, "global_step": 168918, "epoch": 1005} {"train_loss": -11.249410629272461, "global_step": 168919, "epoch": 1005} {"train_loss": -11.204019546508789, "global_step": 168920, "epoch": 1005} {"train_loss": -11.347070693969727, "global_step": 168921, "epoch": 1005} {"train_loss": -11.287128448486328, "global_step": 168922, "epoch": 1005} {"train_loss": -11.134262084960938, "global_step": 168923, "epoch": 1005} {"train_loss": -11.38663101196289, "global_step": 168924, "epoch": 1005} {"train_loss": -11.258248329162598, "global_step": 168925, "epoch": 1005} {"train_loss": -10.870572090148926, "global_step": 168926, "epoch": 1005} {"train_loss": -10.424840927124023, "global_step": 168927, "epoch": 1005} {"train_loss": -10.63262939453125, "global_step": 168928, "epoch": 1005} {"train_loss": -11.293709754943848, "global_step": 168929, "epoch": 1005} {"train_loss": -10.313505172729492, "global_step": 168930, "epoch": 1005} {"train_loss": -8.428378105163574, "global_step": 168931, "epoch": 1005} {"train_loss": -10.020164489746094, "global_step": 168932, "epoch": 1005} {"train_loss": -8.208023071289062, "global_step": 168933, "epoch": 1005} {"train_loss": -8.952812194824219, "global_step": 168934, "epoch": 1005} {"train_loss": -8.023856163024902, "global_step": 168935, "epoch": 1005} {"train_loss": -10.243334770202637, "global_step": 168936, "epoch": 1005} {"train_loss": -7.845830917358398, "global_step": 168937, "epoch": 1005} {"train_loss": -9.585002899169922, "global_step": 168938, "epoch": 1005} {"train_loss": -9.402481079101562, "global_step": 168939, "epoch": 1005} {"train_loss": -9.331472396850586, "global_step": 168940, "epoch": 1005} {"train_loss": -10.451047897338867, "global_step": 168941, "epoch": 1005} {"train_loss": -9.694635391235352, "global_step": 168942, "epoch": 1005} {"train_loss": -10.100933074951172, "global_step": 168943, "epoch": 1005} {"train_loss": -9.766093254089355, "global_step": 168944, "epoch": 1005} {"train_loss": -10.039968490600586, "global_step": 168945, "epoch": 1005} {"train_loss": -10.063257217407227, "global_step": 168946, "epoch": 1005} {"train_loss": -10.089742660522461, "global_step": 168947, "epoch": 1005} {"train_loss": -9.744894027709961, "global_step": 168948, "epoch": 1005} {"train_loss": -10.474146842956543, "global_step": 168949, "epoch": 1005} {"train_loss": -10.359678268432617, "global_step": 168950, "epoch": 1005} {"train_loss": -10.719191551208496, "global_step": 168951, "epoch": 1005} {"train_loss": -10.806638717651367, "global_step": 168952, "epoch": 1005} {"train_loss": -10.342554092407227, "global_step": 168953, "epoch": 1005} {"train_loss": -10.753423690795898, "global_step": 168954, "epoch": 1005} {"train_loss": -10.702564239501953, "global_step": 168955, "epoch": 1005} {"train_loss": -10.591936111450195, "global_step": 168956, "epoch": 1005} {"train_loss": -10.339959144592285, "global_step": 168957, "epoch": 1005} {"train_loss": -10.734715461730957, "global_step": 168958, "epoch": 1005} {"train_loss": -10.496858596801758, "global_step": 168959, "epoch": 1005} {"train_loss": -10.531013488769531, "global_step": 168960, "epoch": 1005} {"train_loss": -10.784388542175293, "global_step": 168961, "epoch": 1005} {"train_loss": -10.646774291992188, "global_step": 168962, "epoch": 1005} {"train_loss": -10.919455528259277, "global_step": 168963, "epoch": 1005} {"train_loss": -10.587985038757324, "global_step": 168964, "epoch": 1005} {"train_loss": -11.005722999572754, "global_step": 168965, "epoch": 1005} {"train_loss": -10.615531921386719, "global_step": 168966, "epoch": 1005} {"train_loss": -10.684305191040039, "global_step": 168967, "epoch": 1005} {"train_loss": -10.870553016662598, "global_step": 168968, "epoch": 1005} {"train_loss": -10.693745613098145, "global_step": 168969, "epoch": 1005} {"train_loss": -10.638853073120117, "global_step": 168970, "epoch": 1005} {"train_loss": -10.554948806762695, "global_step": 168971, "epoch": 1005} {"train_loss": -10.936528205871582, "global_step": 168972, "epoch": 1005} {"train_loss": -10.927249908447266, "global_step": 168973, "epoch": 1005} {"train_loss": -10.779919624328613, "global_step": 168974, "epoch": 1005} {"train_loss": -11.271642684936523, "global_step": 168975, "epoch": 1005} {"train_loss": -10.908136367797852, "global_step": 168976, "epoch": 1005} {"train_loss": -11.090141296386719, "global_step": 168977, "epoch": 1005} {"train_loss": -10.95882797241211, "global_step": 168978, "epoch": 1005} {"train_loss": -10.951628684997559, "global_step": 168979, "epoch": 1005} {"train_loss": -10.866207122802734, "global_step": 168980, "epoch": 1005} {"train_loss": -11.081183433532715, "global_step": 168981, "epoch": 1005} {"train_loss": -10.806253433227539, "global_step": 168982, "epoch": 1005} {"train_loss": -11.071310043334961, "global_step": 168983, "epoch": 1005} {"train_loss": -10.86335563659668, "global_step": 168984, "epoch": 1005} {"train_loss": -11.10464096069336, "global_step": 168985, "epoch": 1005} {"train_loss": -11.038501739501953, "global_step": 168986, "epoch": 1005} {"train_loss": -11.234601974487305, "global_step": 168987, "epoch": 1005} {"train_loss": -11.239810943603516, "global_step": 168988, "epoch": 1005} {"train_loss": -11.177431106567383, "global_step": 168989, "epoch": 1005} {"train_loss": -11.136246681213379, "global_step": 168990, "epoch": 1005} {"train_loss": -11.13166332244873, "global_step": 168991, "epoch": 1005} {"train_loss": -11.025742530822754, "global_step": 168992, "epoch": 1005} {"train_loss": -11.132146835327148, "global_step": 168993, "epoch": 1005} {"train_loss": -11.151796340942383, "global_step": 168994, "epoch": 1005} {"train_loss": -11.221395492553711, "global_step": 168995, "epoch": 1005} {"train_loss": -11.111366271972656, "global_step": 168996, "epoch": 1005} {"train_loss": -11.09872055053711, "global_step": 168997, "epoch": 1005} {"train_loss": -11.270416259765625, "global_step": 168998, "epoch": 1005} {"train_loss": -11.13784122467041, "global_step": 168999, "epoch": 1005} {"train_loss": -11.223318099975586, "global_step": 169000, "epoch": 1005} {"train_loss": -11.344669342041016, "global_step": 169001, "epoch": 1005} {"train_loss": -11.116609573364258, "global_step": 169002, "epoch": 1005} {"train_loss": -11.225770950317383, "global_step": 169003, "epoch": 1005} {"train_loss": -11.160353660583496, "global_step": 169004, "epoch": 1005} {"train_loss": -11.093137741088867, "global_step": 169005, "epoch": 1005} {"train_loss": -11.020790100097656, "global_step": 169006, "epoch": 1005} {"train_loss": -10.700357187361945, "global_step": 169007, "epoch": 1005, "val_loss": 235642.734375, "train_action_mse_error": 0.6419930458068848} {"train_loss": -11.015691757202148, "global_step": 169008, "epoch": 1006} {"train_loss": -10.924752235412598, "global_step": 169009, "epoch": 1006} {"train_loss": -11.342670440673828, "global_step": 169010, "epoch": 1006} {"train_loss": -10.752866744995117, "global_step": 169011, "epoch": 1006} {"train_loss": -10.963043212890625, "global_step": 169012, "epoch": 1006} {"train_loss": -11.080755233764648, "global_step": 169013, "epoch": 1006} {"train_loss": -11.058582305908203, "global_step": 169014, "epoch": 1006} {"train_loss": -11.25678539276123, "global_step": 169015, "epoch": 1006} {"train_loss": -11.175271987915039, "global_step": 169016, "epoch": 1006} {"train_loss": -10.55258846282959, "global_step": 169017, "epoch": 1006} {"train_loss": -11.089975357055664, "global_step": 169018, "epoch": 1006} {"train_loss": -10.595208168029785, "global_step": 169019, "epoch": 1006} {"train_loss": -10.795845031738281, "global_step": 169020, "epoch": 1006} {"train_loss": -11.080918312072754, "global_step": 169021, "epoch": 1006} {"train_loss": -10.860633850097656, "global_step": 169022, "epoch": 1006} {"train_loss": -11.389074325561523, "global_step": 169023, "epoch": 1006} {"train_loss": -10.918933868408203, "global_step": 169024, "epoch": 1006} {"train_loss": -10.551762580871582, "global_step": 169025, "epoch": 1006} {"train_loss": -10.748428344726562, "global_step": 169026, "epoch": 1006} {"train_loss": -10.545796394348145, "global_step": 169027, "epoch": 1006} {"train_loss": -11.159135818481445, "global_step": 169028, "epoch": 1006} {"train_loss": -10.836637496948242, "global_step": 169029, "epoch": 1006} {"train_loss": -10.768653869628906, "global_step": 169030, "epoch": 1006} {"train_loss": -10.992581367492676, "global_step": 169031, "epoch": 1006} {"train_loss": -10.823843002319336, "global_step": 169032, "epoch": 1006} {"train_loss": -10.918392181396484, "global_step": 169033, "epoch": 1006} {"train_loss": -10.973421096801758, "global_step": 169034, "epoch": 1006} {"train_loss": -10.389847755432129, "global_step": 169035, "epoch": 1006} {"train_loss": -10.853951454162598, "global_step": 169036, "epoch": 1006} {"train_loss": -10.478126525878906, "global_step": 169037, "epoch": 1006} {"train_loss": -10.38891887664795, "global_step": 169038, "epoch": 1006} {"train_loss": -11.114253997802734, "global_step": 169039, "epoch": 1006} {"train_loss": -10.772010803222656, "global_step": 169040, "epoch": 1006} {"train_loss": -11.00370979309082, "global_step": 169041, "epoch": 1006} {"train_loss": -11.123455047607422, "global_step": 169042, "epoch": 1006} {"train_loss": -11.040424346923828, "global_step": 169043, "epoch": 1006} {"train_loss": -11.18929672241211, "global_step": 169044, "epoch": 1006} {"train_loss": -11.00724983215332, "global_step": 169045, "epoch": 1006} {"train_loss": -11.058338165283203, "global_step": 169046, "epoch": 1006} {"train_loss": -11.00586986541748, "global_step": 169047, "epoch": 1006} {"train_loss": -11.350506782531738, "global_step": 169048, "epoch": 1006} {"train_loss": -11.279918670654297, "global_step": 169049, "epoch": 1006} {"train_loss": -11.421440124511719, "global_step": 169050, "epoch": 1006} {"train_loss": -10.920173645019531, "global_step": 169051, "epoch": 1006} {"train_loss": -10.989232063293457, "global_step": 169052, "epoch": 1006} {"train_loss": -11.10295581817627, "global_step": 169053, "epoch": 1006} {"train_loss": -10.764911651611328, "global_step": 169054, "epoch": 1006} {"train_loss": -11.204702377319336, "global_step": 169055, "epoch": 1006} {"train_loss": -11.146805763244629, "global_step": 169056, "epoch": 1006} {"train_loss": -11.065780639648438, "global_step": 169057, "epoch": 1006} {"train_loss": -11.235807418823242, "global_step": 169058, "epoch": 1006} {"train_loss": -11.193872451782227, "global_step": 169059, "epoch": 1006} {"train_loss": -11.061976432800293, "global_step": 169060, "epoch": 1006} {"train_loss": -10.851273536682129, "global_step": 169061, "epoch": 1006} {"train_loss": -10.647012710571289, "global_step": 169062, "epoch": 1006} {"train_loss": -10.759140014648438, "global_step": 169063, "epoch": 1006} {"train_loss": -10.852890014648438, "global_step": 169064, "epoch": 1006} {"train_loss": -10.419553756713867, "global_step": 169065, "epoch": 1006} {"train_loss": -11.036699295043945, "global_step": 169066, "epoch": 1006} {"train_loss": -10.542173385620117, "global_step": 169067, "epoch": 1006} {"train_loss": -10.664902687072754, "global_step": 169068, "epoch": 1006} {"train_loss": -10.747198104858398, "global_step": 169069, "epoch": 1006} {"train_loss": -10.958043098449707, "global_step": 169070, "epoch": 1006} {"train_loss": -10.559379577636719, "global_step": 169071, "epoch": 1006} {"train_loss": -10.918045997619629, "global_step": 169072, "epoch": 1006} {"train_loss": -10.395903587341309, "global_step": 169073, "epoch": 1006} {"train_loss": -11.003579139709473, "global_step": 169074, "epoch": 1006} {"train_loss": -10.866273880004883, "global_step": 169075, "epoch": 1006} {"train_loss": -11.191789627075195, "global_step": 169076, "epoch": 1006} {"train_loss": -11.009174346923828, "global_step": 169077, "epoch": 1006} {"train_loss": -10.911211013793945, "global_step": 169078, "epoch": 1006} {"train_loss": -10.84649658203125, "global_step": 169079, "epoch": 1006} {"train_loss": -11.118627548217773, "global_step": 169080, "epoch": 1006} {"train_loss": -10.747237205505371, "global_step": 169081, "epoch": 1006} {"train_loss": -10.915220260620117, "global_step": 169082, "epoch": 1006} {"train_loss": -10.992566108703613, "global_step": 169083, "epoch": 1006} {"train_loss": -10.968536376953125, "global_step": 169084, "epoch": 1006} {"train_loss": -10.949945449829102, "global_step": 169085, "epoch": 1006} {"train_loss": -10.932945251464844, "global_step": 169086, "epoch": 1006} {"train_loss": -10.790653228759766, "global_step": 169087, "epoch": 1006} {"train_loss": -10.764486312866211, "global_step": 169088, "epoch": 1006} {"train_loss": -10.998954772949219, "global_step": 169089, "epoch": 1006} {"train_loss": -10.790820121765137, "global_step": 169090, "epoch": 1006} {"train_loss": -10.700752258300781, "global_step": 169091, "epoch": 1006} {"train_loss": -10.861858367919922, "global_step": 169092, "epoch": 1006} {"train_loss": -10.746617317199707, "global_step": 169093, "epoch": 1006} {"train_loss": -11.212589263916016, "global_step": 169094, "epoch": 1006} {"train_loss": -10.704643249511719, "global_step": 169095, "epoch": 1006} {"train_loss": -10.778341293334961, "global_step": 169096, "epoch": 1006} {"train_loss": -10.770788192749023, "global_step": 169097, "epoch": 1006} {"train_loss": -10.622608184814453, "global_step": 169098, "epoch": 1006} {"train_loss": -11.124139785766602, "global_step": 169099, "epoch": 1006} {"train_loss": -11.034284591674805, "global_step": 169100, "epoch": 1006} {"train_loss": -10.91526985168457, "global_step": 169101, "epoch": 1006} {"train_loss": -10.86793041229248, "global_step": 169102, "epoch": 1006} {"train_loss": -10.815075874328613, "global_step": 169103, "epoch": 1006} {"train_loss": -11.114461898803711, "global_step": 169104, "epoch": 1006} {"train_loss": -11.076756477355957, "global_step": 169105, "epoch": 1006} {"train_loss": -11.04446792602539, "global_step": 169106, "epoch": 1006} {"train_loss": -10.882579803466797, "global_step": 169107, "epoch": 1006} {"train_loss": -10.824860572814941, "global_step": 169108, "epoch": 1006} {"train_loss": -11.174406051635742, "global_step": 169109, "epoch": 1006} {"train_loss": -11.29074478149414, "global_step": 169110, "epoch": 1006} {"train_loss": -10.941205024719238, "global_step": 169111, "epoch": 1006} {"train_loss": -11.263274192810059, "global_step": 169112, "epoch": 1006} {"train_loss": -11.021692276000977, "global_step": 169113, "epoch": 1006} {"train_loss": -11.100775718688965, "global_step": 169114, "epoch": 1006} {"train_loss": -11.197912216186523, "global_step": 169115, "epoch": 1006} {"train_loss": -11.34326171875, "global_step": 169116, "epoch": 1006} {"train_loss": -10.89836311340332, "global_step": 169117, "epoch": 1006} {"train_loss": -11.207817077636719, "global_step": 169118, "epoch": 1006} {"train_loss": -11.198600769042969, "global_step": 169119, "epoch": 1006} {"train_loss": -11.176774978637695, "global_step": 169120, "epoch": 1006} {"train_loss": -11.13853645324707, "global_step": 169121, "epoch": 1006} {"train_loss": -10.717514991760254, "global_step": 169122, "epoch": 1006} {"train_loss": -10.939634323120117, "global_step": 169123, "epoch": 1006} {"train_loss": -10.93341064453125, "global_step": 169124, "epoch": 1006} {"train_loss": -11.20866584777832, "global_step": 169125, "epoch": 1006} {"train_loss": -11.115547180175781, "global_step": 169126, "epoch": 1006} {"train_loss": -10.959968566894531, "global_step": 169127, "epoch": 1006} {"train_loss": -11.078951835632324, "global_step": 169128, "epoch": 1006} {"train_loss": -11.323563575744629, "global_step": 169129, "epoch": 1006} {"train_loss": -10.893028259277344, "global_step": 169130, "epoch": 1006} {"train_loss": -11.21395492553711, "global_step": 169131, "epoch": 1006} {"train_loss": -10.672635078430176, "global_step": 169132, "epoch": 1006} {"train_loss": -11.175199508666992, "global_step": 169133, "epoch": 1006} {"train_loss": -10.675680160522461, "global_step": 169134, "epoch": 1006} {"train_loss": -10.671882629394531, "global_step": 169135, "epoch": 1006} {"train_loss": -10.830941200256348, "global_step": 169136, "epoch": 1006} {"train_loss": -10.425331115722656, "global_step": 169137, "epoch": 1006} {"train_loss": -10.74654769897461, "global_step": 169138, "epoch": 1006} {"train_loss": -10.530986785888672, "global_step": 169139, "epoch": 1006} {"train_loss": -10.721501350402832, "global_step": 169140, "epoch": 1006} {"train_loss": -10.182596206665039, "global_step": 169141, "epoch": 1006} {"train_loss": -10.759883880615234, "global_step": 169142, "epoch": 1006} {"train_loss": -10.442628860473633, "global_step": 169143, "epoch": 1006} {"train_loss": -10.657981872558594, "global_step": 169144, "epoch": 1006} {"train_loss": -10.796897888183594, "global_step": 169145, "epoch": 1006} {"train_loss": -10.533207893371582, "global_step": 169146, "epoch": 1006} {"train_loss": -11.091499328613281, "global_step": 169147, "epoch": 1006} {"train_loss": -10.294166564941406, "global_step": 169148, "epoch": 1006} {"train_loss": -11.146963119506836, "global_step": 169149, "epoch": 1006} {"train_loss": -10.41845417022705, "global_step": 169150, "epoch": 1006} {"train_loss": -11.000617980957031, "global_step": 169151, "epoch": 1006} {"train_loss": -10.50983715057373, "global_step": 169152, "epoch": 1006} {"train_loss": -10.960685729980469, "global_step": 169153, "epoch": 1006} {"train_loss": -11.063240051269531, "global_step": 169154, "epoch": 1006} {"train_loss": -10.592771530151367, "global_step": 169155, "epoch": 1006} {"train_loss": -10.958625793457031, "global_step": 169156, "epoch": 1006} {"train_loss": -10.66767692565918, "global_step": 169157, "epoch": 1006} {"train_loss": -11.19257640838623, "global_step": 169158, "epoch": 1006} {"train_loss": -10.619793891906738, "global_step": 169159, "epoch": 1006} {"train_loss": -10.439562797546387, "global_step": 169160, "epoch": 1006} {"train_loss": -10.908065795898438, "global_step": 169161, "epoch": 1006} {"train_loss": -9.558002471923828, "global_step": 169162, "epoch": 1006} {"train_loss": -10.65411376953125, "global_step": 169163, "epoch": 1006} {"train_loss": -9.435855865478516, "global_step": 169164, "epoch": 1006} {"train_loss": -10.869543075561523, "global_step": 169165, "epoch": 1006} {"train_loss": -10.09912109375, "global_step": 169166, "epoch": 1006} {"train_loss": -10.296292304992676, "global_step": 169167, "epoch": 1006} {"train_loss": -10.849493980407715, "global_step": 169168, "epoch": 1006} {"train_loss": -10.293282508850098, "global_step": 169169, "epoch": 1006} {"train_loss": -10.589899063110352, "global_step": 169170, "epoch": 1006} {"train_loss": -10.738824844360352, "global_step": 169171, "epoch": 1006} {"train_loss": -10.25442123413086, "global_step": 169172, "epoch": 1006} {"train_loss": -10.729464530944824, "global_step": 169173, "epoch": 1006} {"train_loss": -10.432025909423828, "global_step": 169174, "epoch": 1006} {"train_loss": -10.863315729867844, "global_step": 169175, "epoch": 1006, "val_loss": 239013.265625} {"train_loss": -10.828025817871094, "global_step": 169176, "epoch": 1007} {"train_loss": -10.598814010620117, "global_step": 169177, "epoch": 1007} {"train_loss": -10.592178344726562, "global_step": 169178, "epoch": 1007} {"train_loss": -10.897912979125977, "global_step": 169179, "epoch": 1007} {"train_loss": -10.712642669677734, "global_step": 169180, "epoch": 1007} {"train_loss": -11.000919342041016, "global_step": 169181, "epoch": 1007} {"train_loss": -10.681130409240723, "global_step": 169182, "epoch": 1007} {"train_loss": -10.906253814697266, "global_step": 169183, "epoch": 1007} {"train_loss": -10.869585037231445, "global_step": 169184, "epoch": 1007} {"train_loss": -10.995233535766602, "global_step": 169185, "epoch": 1007} {"train_loss": -11.04063892364502, "global_step": 169186, "epoch": 1007} {"train_loss": -10.99034595489502, "global_step": 169187, "epoch": 1007} {"train_loss": -10.890802383422852, "global_step": 169188, "epoch": 1007} {"train_loss": -10.805220603942871, "global_step": 169189, "epoch": 1007} {"train_loss": -11.036492347717285, "global_step": 169190, "epoch": 1007} {"train_loss": -10.8076810836792, "global_step": 169191, "epoch": 1007} {"train_loss": -10.864629745483398, "global_step": 169192, "epoch": 1007} {"train_loss": -10.852274894714355, "global_step": 169193, "epoch": 1007} {"train_loss": -11.003761291503906, "global_step": 169194, "epoch": 1007} {"train_loss": -11.095523834228516, "global_step": 169195, "epoch": 1007} {"train_loss": -11.049529075622559, "global_step": 169196, "epoch": 1007} {"train_loss": -11.08365249633789, "global_step": 169197, "epoch": 1007} {"train_loss": -11.124004364013672, "global_step": 169198, "epoch": 1007} {"train_loss": -11.308442115783691, "global_step": 169199, "epoch": 1007} {"train_loss": -10.994414329528809, "global_step": 169200, "epoch": 1007} {"train_loss": -11.241156578063965, "global_step": 169201, "epoch": 1007} {"train_loss": -11.22819709777832, "global_step": 169202, "epoch": 1007} {"train_loss": -11.083338737487793, "global_step": 169203, "epoch": 1007} {"train_loss": -11.282032012939453, "global_step": 169204, "epoch": 1007} {"train_loss": -11.213695526123047, "global_step": 169205, "epoch": 1007} {"train_loss": -10.966379165649414, "global_step": 169206, "epoch": 1007} {"train_loss": -11.062397956848145, "global_step": 169207, "epoch": 1007} {"train_loss": -11.150196075439453, "global_step": 169208, "epoch": 1007} {"train_loss": -11.142985343933105, "global_step": 169209, "epoch": 1007} {"train_loss": -10.919421195983887, "global_step": 169210, "epoch": 1007} {"train_loss": -10.80910873413086, "global_step": 169211, "epoch": 1007} {"train_loss": -10.749293327331543, "global_step": 169212, "epoch": 1007} {"train_loss": -11.091476440429688, "global_step": 169213, "epoch": 1007} {"train_loss": -10.21029281616211, "global_step": 169214, "epoch": 1007} {"train_loss": -10.883039474487305, "global_step": 169215, "epoch": 1007} {"train_loss": -11.050209045410156, "global_step": 169216, "epoch": 1007} {"train_loss": -10.838973999023438, "global_step": 169217, "epoch": 1007} {"train_loss": -11.043366432189941, "global_step": 169218, "epoch": 1007} {"train_loss": -10.572662353515625, "global_step": 169219, "epoch": 1007} {"train_loss": -10.272555351257324, "global_step": 169220, "epoch": 1007} {"train_loss": -10.732450485229492, "global_step": 169221, "epoch": 1007} {"train_loss": -10.019378662109375, "global_step": 169222, "epoch": 1007} {"train_loss": -10.557613372802734, "global_step": 169223, "epoch": 1007} {"train_loss": -10.755768775939941, "global_step": 169224, "epoch": 1007} {"train_loss": -9.81429672241211, "global_step": 169225, "epoch": 1007} {"train_loss": -11.020256042480469, "global_step": 169226, "epoch": 1007} {"train_loss": -9.783933639526367, "global_step": 169227, "epoch": 1007} {"train_loss": -11.082468032836914, "global_step": 169228, "epoch": 1007} {"train_loss": -10.10213851928711, "global_step": 169229, "epoch": 1007} {"train_loss": -10.977643966674805, "global_step": 169230, "epoch": 1007} {"train_loss": -10.543094635009766, "global_step": 169231, "epoch": 1007} {"train_loss": -10.88206672668457, "global_step": 169232, "epoch": 1007} {"train_loss": -10.482720375061035, "global_step": 169233, "epoch": 1007} {"train_loss": -10.563238143920898, "global_step": 169234, "epoch": 1007} {"train_loss": -10.509593963623047, "global_step": 169235, "epoch": 1007} {"train_loss": -10.915169715881348, "global_step": 169236, "epoch": 1007} {"train_loss": -11.153079986572266, "global_step": 169237, "epoch": 1007} {"train_loss": -11.008764266967773, "global_step": 169238, "epoch": 1007} {"train_loss": -10.85999870300293, "global_step": 169239, "epoch": 1007} {"train_loss": -11.011608123779297, "global_step": 169240, "epoch": 1007} {"train_loss": -10.82581615447998, "global_step": 169241, "epoch": 1007} {"train_loss": -11.147370338439941, "global_step": 169242, "epoch": 1007} {"train_loss": -10.817635536193848, "global_step": 169243, "epoch": 1007} {"train_loss": -11.117136001586914, "global_step": 169244, "epoch": 1007} {"train_loss": -11.037614822387695, "global_step": 169245, "epoch": 1007} {"train_loss": -11.16415786743164, "global_step": 169246, "epoch": 1007} {"train_loss": -10.948217391967773, "global_step": 169247, "epoch": 1007} {"train_loss": -11.064292907714844, "global_step": 169248, "epoch": 1007} {"train_loss": -11.194955825805664, "global_step": 169249, "epoch": 1007} {"train_loss": -11.192378997802734, "global_step": 169250, "epoch": 1007} {"train_loss": -11.326921463012695, "global_step": 169251, "epoch": 1007} {"train_loss": -10.962337493896484, "global_step": 169252, "epoch": 1007} {"train_loss": -11.028541564941406, "global_step": 169253, "epoch": 1007} {"train_loss": -10.927244186401367, "global_step": 169254, "epoch": 1007} {"train_loss": -11.313474655151367, "global_step": 169255, "epoch": 1007} {"train_loss": -11.199117660522461, "global_step": 169256, "epoch": 1007} {"train_loss": -11.268486022949219, "global_step": 169257, "epoch": 1007} {"train_loss": -11.310745239257812, "global_step": 169258, "epoch": 1007} {"train_loss": -11.257204055786133, "global_step": 169259, "epoch": 1007} {"train_loss": -11.162487030029297, "global_step": 169260, "epoch": 1007} {"train_loss": -11.335138320922852, "global_step": 169261, "epoch": 1007} {"train_loss": -11.464924812316895, "global_step": 169262, "epoch": 1007} {"train_loss": -11.38404655456543, "global_step": 169263, "epoch": 1007} {"train_loss": -11.081296920776367, "global_step": 169264, "epoch": 1007} {"train_loss": -11.332910537719727, "global_step": 169265, "epoch": 1007} {"train_loss": -11.232036590576172, "global_step": 169266, "epoch": 1007} {"train_loss": -11.230816841125488, "global_step": 169267, "epoch": 1007} {"train_loss": -11.240467071533203, "global_step": 169268, "epoch": 1007} {"train_loss": -11.226390838623047, "global_step": 169269, "epoch": 1007} {"train_loss": -11.219547271728516, "global_step": 169270, "epoch": 1007} {"train_loss": -11.328826904296875, "global_step": 169271, "epoch": 1007} {"train_loss": -11.398468971252441, "global_step": 169272, "epoch": 1007} {"train_loss": -11.280160903930664, "global_step": 169273, "epoch": 1007} {"train_loss": -11.044543266296387, "global_step": 169274, "epoch": 1007} {"train_loss": -11.267908096313477, "global_step": 169275, "epoch": 1007} {"train_loss": -11.177067756652832, "global_step": 169276, "epoch": 1007} {"train_loss": -11.162055015563965, "global_step": 169277, "epoch": 1007} {"train_loss": -11.259904861450195, "global_step": 169278, "epoch": 1007} {"train_loss": -11.165342330932617, "global_step": 169279, "epoch": 1007} {"train_loss": -11.423883438110352, "global_step": 169280, "epoch": 1007} {"train_loss": -11.276994705200195, "global_step": 169281, "epoch": 1007} {"train_loss": -11.38534164428711, "global_step": 169282, "epoch": 1007} {"train_loss": -11.259394645690918, "global_step": 169283, "epoch": 1007} {"train_loss": -11.341710090637207, "global_step": 169284, "epoch": 1007} {"train_loss": -11.153646469116211, "global_step": 169285, "epoch": 1007} {"train_loss": -10.968316078186035, "global_step": 169286, "epoch": 1007} {"train_loss": -11.268526077270508, "global_step": 169287, "epoch": 1007} {"train_loss": -10.712627410888672, "global_step": 169288, "epoch": 1007} {"train_loss": -11.079200744628906, "global_step": 169289, "epoch": 1007} {"train_loss": -10.323719024658203, "global_step": 169290, "epoch": 1007} {"train_loss": -10.978225708007812, "global_step": 169291, "epoch": 1007} {"train_loss": -10.67298698425293, "global_step": 169292, "epoch": 1007} {"train_loss": -10.375831604003906, "global_step": 169293, "epoch": 1007} {"train_loss": -10.148994445800781, "global_step": 169294, "epoch": 1007} {"train_loss": -10.477968215942383, "global_step": 169295, "epoch": 1007} {"train_loss": -10.828631401062012, "global_step": 169296, "epoch": 1007} {"train_loss": -9.081548690795898, "global_step": 169297, "epoch": 1007} {"train_loss": -10.986404418945312, "global_step": 169298, "epoch": 1007} {"train_loss": -9.751062393188477, "global_step": 169299, "epoch": 1007} {"train_loss": -10.21432876586914, "global_step": 169300, "epoch": 1007} {"train_loss": -10.118141174316406, "global_step": 169301, "epoch": 1007} {"train_loss": -10.188610076904297, "global_step": 169302, "epoch": 1007} {"train_loss": -10.529770851135254, "global_step": 169303, "epoch": 1007} {"train_loss": -10.433026313781738, "global_step": 169304, "epoch": 1007} {"train_loss": -10.7385835647583, "global_step": 169305, "epoch": 1007} {"train_loss": -10.473648071289062, "global_step": 169306, "epoch": 1007} {"train_loss": -10.722874641418457, "global_step": 169307, "epoch": 1007} {"train_loss": -10.627869606018066, "global_step": 169308, "epoch": 1007} {"train_loss": -10.753700256347656, "global_step": 169309, "epoch": 1007} {"train_loss": -10.392013549804688, "global_step": 169310, "epoch": 1007} {"train_loss": -10.958988189697266, "global_step": 169311, "epoch": 1007} {"train_loss": -10.482608795166016, "global_step": 169312, "epoch": 1007} {"train_loss": -11.02297592163086, "global_step": 169313, "epoch": 1007} {"train_loss": -10.583467483520508, "global_step": 169314, "epoch": 1007} {"train_loss": -10.870403289794922, "global_step": 169315, "epoch": 1007} {"train_loss": -10.723816871643066, "global_step": 169316, "epoch": 1007} {"train_loss": -10.8756103515625, "global_step": 169317, "epoch": 1007} {"train_loss": -10.94654655456543, "global_step": 169318, "epoch": 1007} {"train_loss": -11.006136894226074, "global_step": 169319, "epoch": 1007} {"train_loss": -10.980932235717773, "global_step": 169320, "epoch": 1007} {"train_loss": -11.06942367553711, "global_step": 169321, "epoch": 1007} {"train_loss": -10.868965148925781, "global_step": 169322, "epoch": 1007} {"train_loss": -10.876428604125977, "global_step": 169323, "epoch": 1007} {"train_loss": -10.985965728759766, "global_step": 169324, "epoch": 1007} {"train_loss": -10.977720260620117, "global_step": 169325, "epoch": 1007} {"train_loss": -10.792457580566406, "global_step": 169326, "epoch": 1007} {"train_loss": -11.142417907714844, "global_step": 169327, "epoch": 1007} {"train_loss": -10.764032363891602, "global_step": 169328, "epoch": 1007} {"train_loss": -11.032323837280273, "global_step": 169329, "epoch": 1007} {"train_loss": -10.888233184814453, "global_step": 169330, "epoch": 1007} {"train_loss": -11.058429718017578, "global_step": 169331, "epoch": 1007} {"train_loss": -10.737716674804688, "global_step": 169332, "epoch": 1007} {"train_loss": -11.03620719909668, "global_step": 169333, "epoch": 1007} {"train_loss": -10.740140914916992, "global_step": 169334, "epoch": 1007} {"train_loss": -10.929486274719238, "global_step": 169335, "epoch": 1007} {"train_loss": -10.914361953735352, "global_step": 169336, "epoch": 1007} {"train_loss": -10.972555160522461, "global_step": 169337, "epoch": 1007} {"train_loss": -10.791587829589844, "global_step": 169338, "epoch": 1007} {"train_loss": -10.99079704284668, "global_step": 169339, "epoch": 1007} {"train_loss": -10.759002685546875, "global_step": 169340, "epoch": 1007} {"train_loss": -10.997912406921387, "global_step": 169341, "epoch": 1007} {"train_loss": -10.986137390136719, "global_step": 169342, "epoch": 1007} {"train_loss": -10.900950255848112, "global_step": 169343, "epoch": 1007, "val_loss": 238888.34375} {"train_loss": -11.021608352661133, "global_step": 169344, "epoch": 1008} {"train_loss": -10.98948860168457, "global_step": 169345, "epoch": 1008} {"train_loss": -11.098013877868652, "global_step": 169346, "epoch": 1008} {"train_loss": -10.98219108581543, "global_step": 169347, "epoch": 1008} {"train_loss": -11.128130912780762, "global_step": 169348, "epoch": 1008} {"train_loss": -11.091545104980469, "global_step": 169349, "epoch": 1008} {"train_loss": -11.279391288757324, "global_step": 169350, "epoch": 1008} {"train_loss": -11.162866592407227, "global_step": 169351, "epoch": 1008} {"train_loss": -11.466949462890625, "global_step": 169352, "epoch": 1008} {"train_loss": -11.163362503051758, "global_step": 169353, "epoch": 1008} {"train_loss": -11.124711990356445, "global_step": 169354, "epoch": 1008} {"train_loss": -11.076107025146484, "global_step": 169355, "epoch": 1008} {"train_loss": -11.137413024902344, "global_step": 169356, "epoch": 1008} {"train_loss": -10.930996894836426, "global_step": 169357, "epoch": 1008} {"train_loss": -11.133149147033691, "global_step": 169358, "epoch": 1008} {"train_loss": -10.896673202514648, "global_step": 169359, "epoch": 1008} {"train_loss": -10.921802520751953, "global_step": 169360, "epoch": 1008} {"train_loss": -10.99807071685791, "global_step": 169361, "epoch": 1008} {"train_loss": -11.027050018310547, "global_step": 169362, "epoch": 1008} {"train_loss": -10.861763000488281, "global_step": 169363, "epoch": 1008} {"train_loss": -11.313060760498047, "global_step": 169364, "epoch": 1008} {"train_loss": -11.136919021606445, "global_step": 169365, "epoch": 1008} {"train_loss": -10.763083457946777, "global_step": 169366, "epoch": 1008} {"train_loss": -11.28543472290039, "global_step": 169367, "epoch": 1008} {"train_loss": -10.974175453186035, "global_step": 169368, "epoch": 1008} {"train_loss": -10.721334457397461, "global_step": 169369, "epoch": 1008} {"train_loss": -11.376723289489746, "global_step": 169370, "epoch": 1008} {"train_loss": -11.044122695922852, "global_step": 169371, "epoch": 1008} {"train_loss": -10.696020126342773, "global_step": 169372, "epoch": 1008} {"train_loss": -10.594670295715332, "global_step": 169373, "epoch": 1008} {"train_loss": -11.438764572143555, "global_step": 169374, "epoch": 1008} {"train_loss": -11.001886367797852, "global_step": 169375, "epoch": 1008} {"train_loss": -10.606775283813477, "global_step": 169376, "epoch": 1008} {"train_loss": -10.782157897949219, "global_step": 169377, "epoch": 1008} {"train_loss": -11.186830520629883, "global_step": 169378, "epoch": 1008} {"train_loss": -11.27328109741211, "global_step": 169379, "epoch": 1008} {"train_loss": -11.337743759155273, "global_step": 169380, "epoch": 1008} {"train_loss": -11.265556335449219, "global_step": 169381, "epoch": 1008} {"train_loss": -10.973779678344727, "global_step": 169382, "epoch": 1008} {"train_loss": -11.095270156860352, "global_step": 169383, "epoch": 1008} {"train_loss": -11.20042610168457, "global_step": 169384, "epoch": 1008} {"train_loss": -10.844282150268555, "global_step": 169385, "epoch": 1008} {"train_loss": -10.728395462036133, "global_step": 169386, "epoch": 1008} {"train_loss": -10.605522155761719, "global_step": 169387, "epoch": 1008} {"train_loss": -10.824641227722168, "global_step": 169388, "epoch": 1008} {"train_loss": -10.330339431762695, "global_step": 169389, "epoch": 1008} {"train_loss": -10.65598201751709, "global_step": 169390, "epoch": 1008} {"train_loss": -10.445276260375977, "global_step": 169391, "epoch": 1008} {"train_loss": -9.514994621276855, "global_step": 169392, "epoch": 1008} {"train_loss": -9.076385498046875, "global_step": 169393, "epoch": 1008} {"train_loss": -10.510790824890137, "global_step": 169394, "epoch": 1008} {"train_loss": -9.650400161743164, "global_step": 169395, "epoch": 1008} {"train_loss": -10.993368148803711, "global_step": 169396, "epoch": 1008} {"train_loss": -9.720836639404297, "global_step": 169397, "epoch": 1008} {"train_loss": -10.515342712402344, "global_step": 169398, "epoch": 1008} {"train_loss": -10.529523849487305, "global_step": 169399, "epoch": 1008} {"train_loss": -10.504003524780273, "global_step": 169400, "epoch": 1008} {"train_loss": -10.722124099731445, "global_step": 169401, "epoch": 1008} {"train_loss": -10.17613410949707, "global_step": 169402, "epoch": 1008} {"train_loss": -10.657902717590332, "global_step": 169403, "epoch": 1008} {"train_loss": -10.424905776977539, "global_step": 169404, "epoch": 1008} {"train_loss": -10.844350814819336, "global_step": 169405, "epoch": 1008} {"train_loss": -10.393488883972168, "global_step": 169406, "epoch": 1008} {"train_loss": -10.92019271850586, "global_step": 169407, "epoch": 1008} {"train_loss": -10.733833312988281, "global_step": 169408, "epoch": 1008} {"train_loss": -10.502584457397461, "global_step": 169409, "epoch": 1008} {"train_loss": -10.89214038848877, "global_step": 169410, "epoch": 1008} {"train_loss": -10.845224380493164, "global_step": 169411, "epoch": 1008} {"train_loss": -10.819662094116211, "global_step": 169412, "epoch": 1008} {"train_loss": -10.954978942871094, "global_step": 169413, "epoch": 1008} {"train_loss": -10.559240341186523, "global_step": 169414, "epoch": 1008} {"train_loss": -10.682616233825684, "global_step": 169415, "epoch": 1008} {"train_loss": -10.818747520446777, "global_step": 169416, "epoch": 1008} {"train_loss": -10.855003356933594, "global_step": 169417, "epoch": 1008} {"train_loss": -10.598085403442383, "global_step": 169418, "epoch": 1008} {"train_loss": -10.618020057678223, "global_step": 169419, "epoch": 1008} {"train_loss": -10.766471862792969, "global_step": 169420, "epoch": 1008} {"train_loss": -10.348091125488281, "global_step": 169421, "epoch": 1008} {"train_loss": -10.934208869934082, "global_step": 169422, "epoch": 1008} {"train_loss": -10.068748474121094, "global_step": 169423, "epoch": 1008} {"train_loss": -10.801048278808594, "global_step": 169424, "epoch": 1008} {"train_loss": -10.91112995147705, "global_step": 169425, "epoch": 1008} {"train_loss": -10.69827651977539, "global_step": 169426, "epoch": 1008} {"train_loss": -10.858827590942383, "global_step": 169427, "epoch": 1008} {"train_loss": -10.79348087310791, "global_step": 169428, "epoch": 1008} {"train_loss": -10.877866744995117, "global_step": 169429, "epoch": 1008} {"train_loss": -11.029918670654297, "global_step": 169430, "epoch": 1008} {"train_loss": -10.92707633972168, "global_step": 169431, "epoch": 1008} {"train_loss": -10.796944618225098, "global_step": 169432, "epoch": 1008} {"train_loss": -10.889886856079102, "global_step": 169433, "epoch": 1008} {"train_loss": -10.776081085205078, "global_step": 169434, "epoch": 1008} {"train_loss": -11.088621139526367, "global_step": 169435, "epoch": 1008} {"train_loss": -11.069849014282227, "global_step": 169436, "epoch": 1008} {"train_loss": -11.235980987548828, "global_step": 169437, "epoch": 1008} {"train_loss": -11.01144790649414, "global_step": 169438, "epoch": 1008} {"train_loss": -11.075424194335938, "global_step": 169439, "epoch": 1008} {"train_loss": -10.85513687133789, "global_step": 169440, "epoch": 1008} {"train_loss": -11.10956859588623, "global_step": 169441, "epoch": 1008} {"train_loss": -11.258218765258789, "global_step": 169442, "epoch": 1008} {"train_loss": -10.85895824432373, "global_step": 169443, "epoch": 1008} {"train_loss": -11.21644401550293, "global_step": 169444, "epoch": 1008} {"train_loss": -10.945709228515625, "global_step": 169445, "epoch": 1008} {"train_loss": -11.189325332641602, "global_step": 169446, "epoch": 1008} {"train_loss": -10.940559387207031, "global_step": 169447, "epoch": 1008} {"train_loss": -11.01633071899414, "global_step": 169448, "epoch": 1008} {"train_loss": -11.27214241027832, "global_step": 169449, "epoch": 1008} {"train_loss": -11.041666030883789, "global_step": 169450, "epoch": 1008} {"train_loss": -11.383238792419434, "global_step": 169451, "epoch": 1008} {"train_loss": -11.266319274902344, "global_step": 169452, "epoch": 1008} {"train_loss": -11.24262809753418, "global_step": 169453, "epoch": 1008} {"train_loss": -11.196634292602539, "global_step": 169454, "epoch": 1008} {"train_loss": -11.293452262878418, "global_step": 169455, "epoch": 1008} {"train_loss": -11.179890632629395, "global_step": 169456, "epoch": 1008} {"train_loss": -10.963970184326172, "global_step": 169457, "epoch": 1008} {"train_loss": -11.24625015258789, "global_step": 169458, "epoch": 1008} {"train_loss": -11.255237579345703, "global_step": 169459, "epoch": 1008} {"train_loss": -11.125699996948242, "global_step": 169460, "epoch": 1008} {"train_loss": -11.489004135131836, "global_step": 169461, "epoch": 1008} {"train_loss": -11.025042533874512, "global_step": 169462, "epoch": 1008} {"train_loss": -11.242364883422852, "global_step": 169463, "epoch": 1008} {"train_loss": -11.054099082946777, "global_step": 169464, "epoch": 1008} {"train_loss": -11.111672401428223, "global_step": 169465, "epoch": 1008} {"train_loss": -11.0018310546875, "global_step": 169466, "epoch": 1008} {"train_loss": -10.935831069946289, "global_step": 169467, "epoch": 1008} {"train_loss": -10.890121459960938, "global_step": 169468, "epoch": 1008} {"train_loss": -11.232526779174805, "global_step": 169469, "epoch": 1008} {"train_loss": -11.088730812072754, "global_step": 169470, "epoch": 1008} {"train_loss": -10.699030876159668, "global_step": 169471, "epoch": 1008} {"train_loss": -11.282980918884277, "global_step": 169472, "epoch": 1008} {"train_loss": -11.009466171264648, "global_step": 169473, "epoch": 1008} {"train_loss": -10.935688018798828, "global_step": 169474, "epoch": 1008} {"train_loss": -10.928336143493652, "global_step": 169475, "epoch": 1008} {"train_loss": -10.785646438598633, "global_step": 169476, "epoch": 1008} {"train_loss": -11.252459526062012, "global_step": 169477, "epoch": 1008} {"train_loss": -11.128406524658203, "global_step": 169478, "epoch": 1008} {"train_loss": -11.335606575012207, "global_step": 169479, "epoch": 1008} {"train_loss": -11.178177833557129, "global_step": 169480, "epoch": 1008} {"train_loss": -11.231407165527344, "global_step": 169481, "epoch": 1008} {"train_loss": -11.138772010803223, "global_step": 169482, "epoch": 1008} {"train_loss": -11.017768859863281, "global_step": 169483, "epoch": 1008} {"train_loss": -10.860097885131836, "global_step": 169484, "epoch": 1008} {"train_loss": -11.289674758911133, "global_step": 169485, "epoch": 1008} {"train_loss": -11.281240463256836, "global_step": 169486, "epoch": 1008} {"train_loss": -11.321575164794922, "global_step": 169487, "epoch": 1008} {"train_loss": -11.063192367553711, "global_step": 169488, "epoch": 1008} {"train_loss": -11.340638160705566, "global_step": 169489, "epoch": 1008} {"train_loss": -11.32033920288086, "global_step": 169490, "epoch": 1008} {"train_loss": -11.099371910095215, "global_step": 169491, "epoch": 1008} {"train_loss": -11.328744888305664, "global_step": 169492, "epoch": 1008} {"train_loss": -11.127155303955078, "global_step": 169493, "epoch": 1008} {"train_loss": -11.359822273254395, "global_step": 169494, "epoch": 1008} {"train_loss": -11.283679962158203, "global_step": 169495, "epoch": 1008} {"train_loss": -11.343579292297363, "global_step": 169496, "epoch": 1008} {"train_loss": -11.341934204101562, "global_step": 169497, "epoch": 1008} {"train_loss": -11.34541130065918, "global_step": 169498, "epoch": 1008} {"train_loss": -11.0511474609375, "global_step": 169499, "epoch": 1008} {"train_loss": -11.166546821594238, "global_step": 169500, "epoch": 1008} {"train_loss": -11.00922679901123, "global_step": 169501, "epoch": 1008} {"train_loss": -10.98681640625, "global_step": 169502, "epoch": 1008} {"train_loss": -11.197564125061035, "global_step": 169503, "epoch": 1008} {"train_loss": -11.268823623657227, "global_step": 169504, "epoch": 1008} {"train_loss": -11.256643295288086, "global_step": 169505, "epoch": 1008} {"train_loss": -11.048755645751953, "global_step": 169506, "epoch": 1008} {"train_loss": -11.149499893188477, "global_step": 169507, "epoch": 1008} {"train_loss": -11.14944076538086, "global_step": 169508, "epoch": 1008} {"train_loss": -11.164704322814941, "global_step": 169509, "epoch": 1008} {"train_loss": -10.798355102539062, "global_step": 169510, "epoch": 1008} {"train_loss": -10.955858860697065, "global_step": 169511, "epoch": 1008, "val_loss": 236463.609375} {"train_loss": -10.50853443145752, "global_step": 169512, "epoch": 1009} {"train_loss": -10.693906784057617, "global_step": 169513, "epoch": 1009} {"train_loss": -11.308027267456055, "global_step": 169514, "epoch": 1009} {"train_loss": -10.67203426361084, "global_step": 169515, "epoch": 1009} {"train_loss": -11.106616973876953, "global_step": 169516, "epoch": 1009} {"train_loss": -11.018308639526367, "global_step": 169517, "epoch": 1009} {"train_loss": -11.007783889770508, "global_step": 169518, "epoch": 1009} {"train_loss": -11.035114288330078, "global_step": 169519, "epoch": 1009} {"train_loss": -11.230790138244629, "global_step": 169520, "epoch": 1009} {"train_loss": -10.999858856201172, "global_step": 169521, "epoch": 1009} {"train_loss": -11.195390701293945, "global_step": 169522, "epoch": 1009} {"train_loss": -10.979677200317383, "global_step": 169523, "epoch": 1009} {"train_loss": -10.804685592651367, "global_step": 169524, "epoch": 1009} {"train_loss": -11.030754089355469, "global_step": 169525, "epoch": 1009} {"train_loss": -11.164997100830078, "global_step": 169526, "epoch": 1009} {"train_loss": -10.461568832397461, "global_step": 169527, "epoch": 1009} {"train_loss": -11.359943389892578, "global_step": 169528, "epoch": 1009} {"train_loss": -10.31381607055664, "global_step": 169529, "epoch": 1009} {"train_loss": -11.310552597045898, "global_step": 169530, "epoch": 1009} {"train_loss": -10.200067520141602, "global_step": 169531, "epoch": 1009} {"train_loss": -10.584224700927734, "global_step": 169532, "epoch": 1009} {"train_loss": -10.651729583740234, "global_step": 169533, "epoch": 1009} {"train_loss": -10.852221488952637, "global_step": 169534, "epoch": 1009} {"train_loss": -10.63280963897705, "global_step": 169535, "epoch": 1009} {"train_loss": -10.547942161560059, "global_step": 169536, "epoch": 1009} {"train_loss": -10.886430740356445, "global_step": 169537, "epoch": 1009} {"train_loss": -10.936681747436523, "global_step": 169538, "epoch": 1009} {"train_loss": -10.744468688964844, "global_step": 169539, "epoch": 1009} {"train_loss": -11.168851852416992, "global_step": 169540, "epoch": 1009} {"train_loss": -10.870412826538086, "global_step": 169541, "epoch": 1009} {"train_loss": -10.614602088928223, "global_step": 169542, "epoch": 1009} {"train_loss": -10.712135314941406, "global_step": 169543, "epoch": 1009} {"train_loss": -10.671655654907227, "global_step": 169544, "epoch": 1009} {"train_loss": -10.397125244140625, "global_step": 169545, "epoch": 1009} {"train_loss": -10.841604232788086, "global_step": 169546, "epoch": 1009} {"train_loss": -10.06702709197998, "global_step": 169547, "epoch": 1009} {"train_loss": -10.788188934326172, "global_step": 169548, "epoch": 1009} {"train_loss": -10.498125076293945, "global_step": 169549, "epoch": 1009} {"train_loss": -10.698907852172852, "global_step": 169550, "epoch": 1009} {"train_loss": -10.2369966506958, "global_step": 169551, "epoch": 1009} {"train_loss": -10.100898742675781, "global_step": 169552, "epoch": 1009} {"train_loss": -10.4273042678833, "global_step": 169553, "epoch": 1009} {"train_loss": -10.180667877197266, "global_step": 169554, "epoch": 1009} {"train_loss": -10.235797882080078, "global_step": 169555, "epoch": 1009} {"train_loss": -10.464441299438477, "global_step": 169556, "epoch": 1009} {"train_loss": -10.668854713439941, "global_step": 169557, "epoch": 1009} {"train_loss": -10.005753517150879, "global_step": 169558, "epoch": 1009} {"train_loss": -10.80401611328125, "global_step": 169559, "epoch": 1009} {"train_loss": -10.41100788116455, "global_step": 169560, "epoch": 1009} {"train_loss": -10.595596313476562, "global_step": 169561, "epoch": 1009} {"train_loss": -10.612208366394043, "global_step": 169562, "epoch": 1009} {"train_loss": -10.932832717895508, "global_step": 169563, "epoch": 1009} {"train_loss": -10.915775299072266, "global_step": 169564, "epoch": 1009} {"train_loss": -10.684627532958984, "global_step": 169565, "epoch": 1009} {"train_loss": -10.921839714050293, "global_step": 169566, "epoch": 1009} {"train_loss": -11.011103630065918, "global_step": 169567, "epoch": 1009} {"train_loss": -10.542695045471191, "global_step": 169568, "epoch": 1009} {"train_loss": -10.838750839233398, "global_step": 169569, "epoch": 1009} {"train_loss": -11.178702354431152, "global_step": 169570, "epoch": 1009} {"train_loss": -10.59989070892334, "global_step": 169571, "epoch": 1009} {"train_loss": -10.934253692626953, "global_step": 169572, "epoch": 1009} {"train_loss": -10.629080772399902, "global_step": 169573, "epoch": 1009} {"train_loss": -10.946365356445312, "global_step": 169574, "epoch": 1009} {"train_loss": -10.77789306640625, "global_step": 169575, "epoch": 1009} {"train_loss": -10.886484146118164, "global_step": 169576, "epoch": 1009} {"train_loss": -10.710529327392578, "global_step": 169577, "epoch": 1009} {"train_loss": -10.963041305541992, "global_step": 169578, "epoch": 1009} {"train_loss": -10.755419731140137, "global_step": 169579, "epoch": 1009} {"train_loss": -11.000570297241211, "global_step": 169580, "epoch": 1009} {"train_loss": -10.830041885375977, "global_step": 169581, "epoch": 1009} {"train_loss": -10.78205680847168, "global_step": 169582, "epoch": 1009} {"train_loss": -10.812431335449219, "global_step": 169583, "epoch": 1009} {"train_loss": -11.30024242401123, "global_step": 169584, "epoch": 1009} {"train_loss": -10.766508102416992, "global_step": 169585, "epoch": 1009} {"train_loss": -11.000410079956055, "global_step": 169586, "epoch": 1009} {"train_loss": -11.049747467041016, "global_step": 169587, "epoch": 1009} {"train_loss": -11.167442321777344, "global_step": 169588, "epoch": 1009} {"train_loss": -10.921632766723633, "global_step": 169589, "epoch": 1009} {"train_loss": -11.079084396362305, "global_step": 169590, "epoch": 1009} {"train_loss": -11.137175559997559, "global_step": 169591, "epoch": 1009} {"train_loss": -11.22030258178711, "global_step": 169592, "epoch": 1009} {"train_loss": -11.226619720458984, "global_step": 169593, "epoch": 1009} {"train_loss": -11.10551643371582, "global_step": 169594, "epoch": 1009} {"train_loss": -11.035776138305664, "global_step": 169595, "epoch": 1009} {"train_loss": -11.12271499633789, "global_step": 169596, "epoch": 1009} {"train_loss": -11.183935165405273, "global_step": 169597, "epoch": 1009} {"train_loss": -11.212126731872559, "global_step": 169598, "epoch": 1009} {"train_loss": -11.037843704223633, "global_step": 169599, "epoch": 1009} {"train_loss": -11.124130249023438, "global_step": 169600, "epoch": 1009} {"train_loss": -11.157732009887695, "global_step": 169601, "epoch": 1009} {"train_loss": -11.087947845458984, "global_step": 169602, "epoch": 1009} {"train_loss": -10.999585151672363, "global_step": 169603, "epoch": 1009} {"train_loss": -11.336345672607422, "global_step": 169604, "epoch": 1009} {"train_loss": -11.011550903320312, "global_step": 169605, "epoch": 1009} {"train_loss": -10.756231307983398, "global_step": 169606, "epoch": 1009} {"train_loss": -11.319159507751465, "global_step": 169607, "epoch": 1009} {"train_loss": -10.910417556762695, "global_step": 169608, "epoch": 1009} {"train_loss": -11.359817504882812, "global_step": 169609, "epoch": 1009} {"train_loss": -10.942678451538086, "global_step": 169610, "epoch": 1009} {"train_loss": -11.207168579101562, "global_step": 169611, "epoch": 1009} {"train_loss": -11.123612403869629, "global_step": 169612, "epoch": 1009} {"train_loss": -10.896329879760742, "global_step": 169613, "epoch": 1009} {"train_loss": -11.009214401245117, "global_step": 169614, "epoch": 1009} {"train_loss": -11.062019348144531, "global_step": 169615, "epoch": 1009} {"train_loss": -11.236286163330078, "global_step": 169616, "epoch": 1009} {"train_loss": -10.813419342041016, "global_step": 169617, "epoch": 1009} {"train_loss": -11.120559692382812, "global_step": 169618, "epoch": 1009} {"train_loss": -11.363568305969238, "global_step": 169619, "epoch": 1009} {"train_loss": -11.196005821228027, "global_step": 169620, "epoch": 1009} {"train_loss": -10.93355941772461, "global_step": 169621, "epoch": 1009} {"train_loss": -11.040023803710938, "global_step": 169622, "epoch": 1009} {"train_loss": -10.912399291992188, "global_step": 169623, "epoch": 1009} {"train_loss": -10.729776382446289, "global_step": 169624, "epoch": 1009} {"train_loss": -11.005014419555664, "global_step": 169625, "epoch": 1009} {"train_loss": -11.25590705871582, "global_step": 169626, "epoch": 1009} {"train_loss": -11.149222373962402, "global_step": 169627, "epoch": 1009} {"train_loss": -11.084707260131836, "global_step": 169628, "epoch": 1009} {"train_loss": -10.91202163696289, "global_step": 169629, "epoch": 1009} {"train_loss": -11.100997924804688, "global_step": 169630, "epoch": 1009} {"train_loss": -11.249279022216797, "global_step": 169631, "epoch": 1009} {"train_loss": -11.202934265136719, "global_step": 169632, "epoch": 1009} {"train_loss": -11.13467788696289, "global_step": 169633, "epoch": 1009} {"train_loss": -11.236664772033691, "global_step": 169634, "epoch": 1009} {"train_loss": -10.925273895263672, "global_step": 169635, "epoch": 1009} {"train_loss": -10.935393333435059, "global_step": 169636, "epoch": 1009} {"train_loss": -11.009359359741211, "global_step": 169637, "epoch": 1009} {"train_loss": -10.916559219360352, "global_step": 169638, "epoch": 1009} {"train_loss": -10.956504821777344, "global_step": 169639, "epoch": 1009} {"train_loss": -10.466689109802246, "global_step": 169640, "epoch": 1009} {"train_loss": -10.747087478637695, "global_step": 169641, "epoch": 1009} {"train_loss": -11.121965408325195, "global_step": 169642, "epoch": 1009} {"train_loss": -10.765380859375, "global_step": 169643, "epoch": 1009} {"train_loss": -11.329912185668945, "global_step": 169644, "epoch": 1009} {"train_loss": -10.982653617858887, "global_step": 169645, "epoch": 1009} {"train_loss": -10.73403549194336, "global_step": 169646, "epoch": 1009} {"train_loss": -11.202098846435547, "global_step": 169647, "epoch": 1009} {"train_loss": -10.885110855102539, "global_step": 169648, "epoch": 1009} {"train_loss": -11.117376327514648, "global_step": 169649, "epoch": 1009} {"train_loss": -11.011080741882324, "global_step": 169650, "epoch": 1009} {"train_loss": -11.12844467163086, "global_step": 169651, "epoch": 1009} {"train_loss": -11.264735221862793, "global_step": 169652, "epoch": 1009} {"train_loss": -11.012813568115234, "global_step": 169653, "epoch": 1009} {"train_loss": -11.195780754089355, "global_step": 169654, "epoch": 1009} {"train_loss": -10.860239028930664, "global_step": 169655, "epoch": 1009} {"train_loss": -10.930557250976562, "global_step": 169656, "epoch": 1009} {"train_loss": -10.732795715332031, "global_step": 169657, "epoch": 1009} {"train_loss": -10.86046314239502, "global_step": 169658, "epoch": 1009} {"train_loss": -10.96029281616211, "global_step": 169659, "epoch": 1009} {"train_loss": -10.606456756591797, "global_step": 169660, "epoch": 1009} {"train_loss": -10.70787239074707, "global_step": 169661, "epoch": 1009} {"train_loss": -11.00688648223877, "global_step": 169662, "epoch": 1009} {"train_loss": -11.228622436523438, "global_step": 169663, "epoch": 1009} {"train_loss": -10.844091415405273, "global_step": 169664, "epoch": 1009} {"train_loss": -11.018885612487793, "global_step": 169665, "epoch": 1009} {"train_loss": -11.168078422546387, "global_step": 169666, "epoch": 1009} {"train_loss": -10.978790283203125, "global_step": 169667, "epoch": 1009} {"train_loss": -10.66128921508789, "global_step": 169668, "epoch": 1009} {"train_loss": -11.117958068847656, "global_step": 169669, "epoch": 1009} {"train_loss": -10.91240119934082, "global_step": 169670, "epoch": 1009} {"train_loss": -10.053406715393066, "global_step": 169671, "epoch": 1009} {"train_loss": -10.126752853393555, "global_step": 169672, "epoch": 1009} {"train_loss": -10.562091827392578, "global_step": 169673, "epoch": 1009} {"train_loss": -9.24924087524414, "global_step": 169674, "epoch": 1009} {"train_loss": -10.934797286987305, "global_step": 169675, "epoch": 1009} {"train_loss": -10.242513656616211, "global_step": 169676, "epoch": 1009} {"train_loss": -10.520027160644531, "global_step": 169677, "epoch": 1009} {"train_loss": -10.499147415161133, "global_step": 169678, "epoch": 1009} {"train_loss": -10.871903396788097, "global_step": 169679, "epoch": 1009, "val_loss": 241052.4375} {"train_loss": -10.609827995300293, "global_step": 169680, "epoch": 1010} {"train_loss": -10.37234878540039, "global_step": 169681, "epoch": 1010} {"train_loss": -10.82691764831543, "global_step": 169682, "epoch": 1010} {"train_loss": -10.23858642578125, "global_step": 169683, "epoch": 1010} {"train_loss": -10.907855033874512, "global_step": 169684, "epoch": 1010} {"train_loss": -10.614500045776367, "global_step": 169685, "epoch": 1010} {"train_loss": -10.759101867675781, "global_step": 169686, "epoch": 1010} {"train_loss": -10.220494270324707, "global_step": 169687, "epoch": 1010} {"train_loss": -10.440244674682617, "global_step": 169688, "epoch": 1010} {"train_loss": -10.628969192504883, "global_step": 169689, "epoch": 1010} {"train_loss": -10.556163787841797, "global_step": 169690, "epoch": 1010} {"train_loss": -10.89507007598877, "global_step": 169691, "epoch": 1010} {"train_loss": -10.701727867126465, "global_step": 169692, "epoch": 1010} {"train_loss": -10.740942001342773, "global_step": 169693, "epoch": 1010} {"train_loss": -10.763964653015137, "global_step": 169694, "epoch": 1010} {"train_loss": -10.614227294921875, "global_step": 169695, "epoch": 1010} {"train_loss": -10.519161224365234, "global_step": 169696, "epoch": 1010} {"train_loss": -10.835142135620117, "global_step": 169697, "epoch": 1010} {"train_loss": -10.677534103393555, "global_step": 169698, "epoch": 1010} {"train_loss": -10.962308883666992, "global_step": 169699, "epoch": 1010} {"train_loss": -10.926614761352539, "global_step": 169700, "epoch": 1010} {"train_loss": -10.735944747924805, "global_step": 169701, "epoch": 1010} {"train_loss": -10.929952621459961, "global_step": 169702, "epoch": 1010} {"train_loss": -10.832904815673828, "global_step": 169703, "epoch": 1010} {"train_loss": -10.851824760437012, "global_step": 169704, "epoch": 1010} {"train_loss": -11.12851333618164, "global_step": 169705, "epoch": 1010} {"train_loss": -10.897432327270508, "global_step": 169706, "epoch": 1010} {"train_loss": -11.0973539352417, "global_step": 169707, "epoch": 1010} {"train_loss": -10.746023178100586, "global_step": 169708, "epoch": 1010} {"train_loss": -11.127285957336426, "global_step": 169709, "epoch": 1010} {"train_loss": -11.248482704162598, "global_step": 169710, "epoch": 1010} {"train_loss": -11.111320495605469, "global_step": 169711, "epoch": 1010} {"train_loss": -10.926753997802734, "global_step": 169712, "epoch": 1010} {"train_loss": -10.989187240600586, "global_step": 169713, "epoch": 1010} {"train_loss": -11.072977066040039, "global_step": 169714, "epoch": 1010} {"train_loss": -11.147283554077148, "global_step": 169715, "epoch": 1010} {"train_loss": -11.171831130981445, "global_step": 169716, "epoch": 1010} {"train_loss": -11.163397789001465, "global_step": 169717, "epoch": 1010} {"train_loss": -11.323053359985352, "global_step": 169718, "epoch": 1010} {"train_loss": -10.959653854370117, "global_step": 169719, "epoch": 1010} {"train_loss": -11.265204429626465, "global_step": 169720, "epoch": 1010} {"train_loss": -11.046728134155273, "global_step": 169721, "epoch": 1010} {"train_loss": -11.197420120239258, "global_step": 169722, "epoch": 1010} {"train_loss": -11.286151885986328, "global_step": 169723, "epoch": 1010} {"train_loss": -11.121682167053223, "global_step": 169724, "epoch": 1010} {"train_loss": -11.129659652709961, "global_step": 169725, "epoch": 1010} {"train_loss": -11.332350730895996, "global_step": 169726, "epoch": 1010} {"train_loss": -11.44089126586914, "global_step": 169727, "epoch": 1010} {"train_loss": -11.462257385253906, "global_step": 169728, "epoch": 1010} {"train_loss": -11.387012481689453, "global_step": 169729, "epoch": 1010} {"train_loss": -11.361356735229492, "global_step": 169730, "epoch": 1010} {"train_loss": -11.148937225341797, "global_step": 169731, "epoch": 1010} {"train_loss": -11.35693073272705, "global_step": 169732, "epoch": 1010} {"train_loss": -11.350942611694336, "global_step": 169733, "epoch": 1010} {"train_loss": -10.918814659118652, "global_step": 169734, "epoch": 1010} {"train_loss": -11.208257675170898, "global_step": 169735, "epoch": 1010} {"train_loss": -11.534515380859375, "global_step": 169736, "epoch": 1010} {"train_loss": -11.057868003845215, "global_step": 169737, "epoch": 1010} {"train_loss": -11.260226249694824, "global_step": 169738, "epoch": 1010} {"train_loss": -11.169597625732422, "global_step": 169739, "epoch": 1010} {"train_loss": -10.92786979675293, "global_step": 169740, "epoch": 1010} {"train_loss": -11.120899200439453, "global_step": 169741, "epoch": 1010} {"train_loss": -11.134697914123535, "global_step": 169742, "epoch": 1010} {"train_loss": -10.734147071838379, "global_step": 169743, "epoch": 1010} {"train_loss": -10.616820335388184, "global_step": 169744, "epoch": 1010} {"train_loss": -11.124223709106445, "global_step": 169745, "epoch": 1010} {"train_loss": -10.602447509765625, "global_step": 169746, "epoch": 1010} {"train_loss": -10.786077499389648, "global_step": 169747, "epoch": 1010} {"train_loss": -11.064231872558594, "global_step": 169748, "epoch": 1010} {"train_loss": -10.832642555236816, "global_step": 169749, "epoch": 1010} {"train_loss": -10.944731712341309, "global_step": 169750, "epoch": 1010} {"train_loss": -10.927801132202148, "global_step": 169751, "epoch": 1010} {"train_loss": -11.114219665527344, "global_step": 169752, "epoch": 1010} {"train_loss": -10.895383834838867, "global_step": 169753, "epoch": 1010} {"train_loss": -11.088171005249023, "global_step": 169754, "epoch": 1010} {"train_loss": -10.311891555786133, "global_step": 169755, "epoch": 1010} {"train_loss": -11.267877578735352, "global_step": 169756, "epoch": 1010} {"train_loss": -10.606983184814453, "global_step": 169757, "epoch": 1010} {"train_loss": -11.215154647827148, "global_step": 169758, "epoch": 1010} {"train_loss": -10.58761215209961, "global_step": 169759, "epoch": 1010} {"train_loss": -11.100648880004883, "global_step": 169760, "epoch": 1010} {"train_loss": -10.413787841796875, "global_step": 169761, "epoch": 1010} {"train_loss": -10.590924263000488, "global_step": 169762, "epoch": 1010} {"train_loss": -11.020875930786133, "global_step": 169763, "epoch": 1010} {"train_loss": -10.755670547485352, "global_step": 169764, "epoch": 1010} {"train_loss": -10.435982704162598, "global_step": 169765, "epoch": 1010} {"train_loss": -10.046165466308594, "global_step": 169766, "epoch": 1010} {"train_loss": -9.925714492797852, "global_step": 169767, "epoch": 1010} {"train_loss": -10.188960075378418, "global_step": 169768, "epoch": 1010} {"train_loss": -10.283594131469727, "global_step": 169769, "epoch": 1010} {"train_loss": -10.23784351348877, "global_step": 169770, "epoch": 1010} {"train_loss": -10.571002960205078, "global_step": 169771, "epoch": 1010} {"train_loss": -10.236801147460938, "global_step": 169772, "epoch": 1010} {"train_loss": -10.388357162475586, "global_step": 169773, "epoch": 1010} {"train_loss": -9.797887802124023, "global_step": 169774, "epoch": 1010} {"train_loss": -10.020078659057617, "global_step": 169775, "epoch": 1010} {"train_loss": -10.192293167114258, "global_step": 169776, "epoch": 1010} {"train_loss": -10.055436134338379, "global_step": 169777, "epoch": 1010} {"train_loss": -10.565326690673828, "global_step": 169778, "epoch": 1010} {"train_loss": -10.640433311462402, "global_step": 169779, "epoch": 1010} {"train_loss": -10.718339920043945, "global_step": 169780, "epoch": 1010} {"train_loss": -10.38027572631836, "global_step": 169781, "epoch": 1010} {"train_loss": -10.694058418273926, "global_step": 169782, "epoch": 1010} {"train_loss": -9.991998672485352, "global_step": 169783, "epoch": 1010} {"train_loss": -10.965494155883789, "global_step": 169784, "epoch": 1010} {"train_loss": -10.390195846557617, "global_step": 169785, "epoch": 1010} {"train_loss": -10.573081016540527, "global_step": 169786, "epoch": 1010} {"train_loss": -10.6919527053833, "global_step": 169787, "epoch": 1010} {"train_loss": -10.778482437133789, "global_step": 169788, "epoch": 1010} {"train_loss": -10.836463928222656, "global_step": 169789, "epoch": 1010} {"train_loss": -10.788192749023438, "global_step": 169790, "epoch": 1010} {"train_loss": -10.684040069580078, "global_step": 169791, "epoch": 1010} {"train_loss": -10.919843673706055, "global_step": 169792, "epoch": 1010} {"train_loss": -10.45570182800293, "global_step": 169793, "epoch": 1010} {"train_loss": -11.10372543334961, "global_step": 169794, "epoch": 1010} {"train_loss": -10.722885131835938, "global_step": 169795, "epoch": 1010} {"train_loss": -10.845064163208008, "global_step": 169796, "epoch": 1010} {"train_loss": -10.982189178466797, "global_step": 169797, "epoch": 1010} {"train_loss": -10.683156967163086, "global_step": 169798, "epoch": 1010} {"train_loss": -11.050806045532227, "global_step": 169799, "epoch": 1010} {"train_loss": -10.938056945800781, "global_step": 169800, "epoch": 1010} {"train_loss": -10.9346284866333, "global_step": 169801, "epoch": 1010} {"train_loss": -10.876917839050293, "global_step": 169802, "epoch": 1010} {"train_loss": -10.90102481842041, "global_step": 169803, "epoch": 1010} {"train_loss": -10.823378562927246, "global_step": 169804, "epoch": 1010} {"train_loss": -11.101724624633789, "global_step": 169805, "epoch": 1010} {"train_loss": -10.820423126220703, "global_step": 169806, "epoch": 1010} {"train_loss": -11.077035903930664, "global_step": 169807, "epoch": 1010} {"train_loss": -11.26170539855957, "global_step": 169808, "epoch": 1010} {"train_loss": -11.140815734863281, "global_step": 169809, "epoch": 1010} {"train_loss": -11.005104064941406, "global_step": 169810, "epoch": 1010} {"train_loss": -11.201480865478516, "global_step": 169811, "epoch": 1010} {"train_loss": -10.91172981262207, "global_step": 169812, "epoch": 1010} {"train_loss": -11.077207565307617, "global_step": 169813, "epoch": 1010} {"train_loss": -10.609721183776855, "global_step": 169814, "epoch": 1010} {"train_loss": -10.744640350341797, "global_step": 169815, "epoch": 1010} {"train_loss": -10.675065994262695, "global_step": 169816, "epoch": 1010} {"train_loss": -10.246192932128906, "global_step": 169817, "epoch": 1010} {"train_loss": -11.22433853149414, "global_step": 169818, "epoch": 1010} {"train_loss": -10.13958740234375, "global_step": 169819, "epoch": 1010} {"train_loss": -11.135769844055176, "global_step": 169820, "epoch": 1010} {"train_loss": -10.016013145446777, "global_step": 169821, "epoch": 1010} {"train_loss": -10.81093692779541, "global_step": 169822, "epoch": 1010} {"train_loss": -10.766904830932617, "global_step": 169823, "epoch": 1010} {"train_loss": -10.640694618225098, "global_step": 169824, "epoch": 1010} {"train_loss": -11.143720626831055, "global_step": 169825, "epoch": 1010} {"train_loss": -10.594892501831055, "global_step": 169826, "epoch": 1010} {"train_loss": -10.589128494262695, "global_step": 169827, "epoch": 1010} {"train_loss": -11.040142059326172, "global_step": 169828, "epoch": 1010} {"train_loss": -10.959070205688477, "global_step": 169829, "epoch": 1010} {"train_loss": -11.02156925201416, "global_step": 169830, "epoch": 1010} {"train_loss": -11.177011489868164, "global_step": 169831, "epoch": 1010} {"train_loss": -10.939203262329102, "global_step": 169832, "epoch": 1010} {"train_loss": -10.958316802978516, "global_step": 169833, "epoch": 1010} {"train_loss": -11.30507755279541, "global_step": 169834, "epoch": 1010} {"train_loss": -10.853546142578125, "global_step": 169835, "epoch": 1010} {"train_loss": -11.004170417785645, "global_step": 169836, "epoch": 1010} {"train_loss": -11.09771728515625, "global_step": 169837, "epoch": 1010} {"train_loss": -11.09162712097168, "global_step": 169838, "epoch": 1010} {"train_loss": -11.069448471069336, "global_step": 169839, "epoch": 1010} {"train_loss": -11.263433456420898, "global_step": 169840, "epoch": 1010} {"train_loss": -11.232025146484375, "global_step": 169841, "epoch": 1010} {"train_loss": -11.088109016418457, "global_step": 169842, "epoch": 1010} {"train_loss": -11.094545364379883, "global_step": 169843, "epoch": 1010} {"train_loss": -10.930802345275879, "global_step": 169844, "epoch": 1010} {"train_loss": -11.259876251220703, "global_step": 169845, "epoch": 1010} {"train_loss": -10.835646629333496, "global_step": 169846, "epoch": 1010} {"train_loss": -10.849727011862255, "global_step": 169847, "epoch": 1010, "val_loss": 241269.515625, "train_action_mse_error": 1.4225515127182007} {"train_loss": -10.719453811645508, "global_step": 169848, "epoch": 1011} {"train_loss": -11.100634574890137, "global_step": 169849, "epoch": 1011} {"train_loss": -11.245967864990234, "global_step": 169850, "epoch": 1011} {"train_loss": -11.161277770996094, "global_step": 169851, "epoch": 1011} {"train_loss": -11.143009185791016, "global_step": 169852, "epoch": 1011} {"train_loss": -11.180290222167969, "global_step": 169853, "epoch": 1011} {"train_loss": -11.203142166137695, "global_step": 169854, "epoch": 1011} {"train_loss": -11.176237106323242, "global_step": 169855, "epoch": 1011} {"train_loss": -11.429140090942383, "global_step": 169856, "epoch": 1011} {"train_loss": -11.368313789367676, "global_step": 169857, "epoch": 1011} {"train_loss": -11.096036911010742, "global_step": 169858, "epoch": 1011} {"train_loss": -11.455825805664062, "global_step": 169859, "epoch": 1011} {"train_loss": -11.298161506652832, "global_step": 169860, "epoch": 1011} {"train_loss": -11.205242156982422, "global_step": 169861, "epoch": 1011} {"train_loss": -11.304102897644043, "global_step": 169862, "epoch": 1011} {"train_loss": -11.578559875488281, "global_step": 169863, "epoch": 1011} {"train_loss": -11.096878051757812, "global_step": 169864, "epoch": 1011} {"train_loss": -11.579429626464844, "global_step": 169865, "epoch": 1011} {"train_loss": -11.24911117553711, "global_step": 169866, "epoch": 1011} {"train_loss": -11.412854194641113, "global_step": 169867, "epoch": 1011} {"train_loss": -11.501370429992676, "global_step": 169868, "epoch": 1011} {"train_loss": -11.375882148742676, "global_step": 169869, "epoch": 1011} {"train_loss": -11.33610725402832, "global_step": 169870, "epoch": 1011} {"train_loss": -11.577079772949219, "global_step": 169871, "epoch": 1011} {"train_loss": -11.14596939086914, "global_step": 169872, "epoch": 1011} {"train_loss": -11.480924606323242, "global_step": 169873, "epoch": 1011} {"train_loss": -11.547500610351562, "global_step": 169874, "epoch": 1011} {"train_loss": -11.447749137878418, "global_step": 169875, "epoch": 1011} {"train_loss": -11.025094985961914, "global_step": 169876, "epoch": 1011} {"train_loss": -11.28449821472168, "global_step": 169877, "epoch": 1011} {"train_loss": -11.315901756286621, "global_step": 169878, "epoch": 1011} {"train_loss": -11.020975112915039, "global_step": 169879, "epoch": 1011} {"train_loss": -11.2965087890625, "global_step": 169880, "epoch": 1011} {"train_loss": -11.389033317565918, "global_step": 169881, "epoch": 1011} {"train_loss": -11.291387557983398, "global_step": 169882, "epoch": 1011} {"train_loss": -11.140464782714844, "global_step": 169883, "epoch": 1011} {"train_loss": -10.888004302978516, "global_step": 169884, "epoch": 1011} {"train_loss": -10.39045238494873, "global_step": 169885, "epoch": 1011} {"train_loss": -10.752525329589844, "global_step": 169886, "epoch": 1011} {"train_loss": -11.028142929077148, "global_step": 169887, "epoch": 1011} {"train_loss": -10.874168395996094, "global_step": 169888, "epoch": 1011} {"train_loss": -10.76742172241211, "global_step": 169889, "epoch": 1011} {"train_loss": -10.640400886535645, "global_step": 169890, "epoch": 1011} {"train_loss": -11.074378967285156, "global_step": 169891, "epoch": 1011} {"train_loss": -10.648584365844727, "global_step": 169892, "epoch": 1011} {"train_loss": -10.75218391418457, "global_step": 169893, "epoch": 1011} {"train_loss": -10.218189239501953, "global_step": 169894, "epoch": 1011} {"train_loss": -10.997310638427734, "global_step": 169895, "epoch": 1011} {"train_loss": -10.076857566833496, "global_step": 169896, "epoch": 1011} {"train_loss": -10.85931396484375, "global_step": 169897, "epoch": 1011} {"train_loss": -10.733129501342773, "global_step": 169898, "epoch": 1011} {"train_loss": -11.23742961883545, "global_step": 169899, "epoch": 1011} {"train_loss": -10.136283874511719, "global_step": 169900, "epoch": 1011} {"train_loss": -11.270845413208008, "global_step": 169901, "epoch": 1011} {"train_loss": -10.835905075073242, "global_step": 169902, "epoch": 1011} {"train_loss": -10.379319190979004, "global_step": 169903, "epoch": 1011} {"train_loss": -10.70871353149414, "global_step": 169904, "epoch": 1011} {"train_loss": -10.724245071411133, "global_step": 169905, "epoch": 1011} {"train_loss": -10.543693542480469, "global_step": 169906, "epoch": 1011} {"train_loss": -10.7476224899292, "global_step": 169907, "epoch": 1011} {"train_loss": -10.512466430664062, "global_step": 169908, "epoch": 1011} {"train_loss": -10.878819465637207, "global_step": 169909, "epoch": 1011} {"train_loss": -10.149455070495605, "global_step": 169910, "epoch": 1011} {"train_loss": -10.94853401184082, "global_step": 169911, "epoch": 1011} {"train_loss": -9.946707725524902, "global_step": 169912, "epoch": 1011} {"train_loss": -10.861804962158203, "global_step": 169913, "epoch": 1011} {"train_loss": -10.412004470825195, "global_step": 169914, "epoch": 1011} {"train_loss": -10.439024925231934, "global_step": 169915, "epoch": 1011} {"train_loss": -10.496023178100586, "global_step": 169916, "epoch": 1011} {"train_loss": -9.78689956665039, "global_step": 169917, "epoch": 1011} {"train_loss": -10.729063034057617, "global_step": 169918, "epoch": 1011} {"train_loss": -9.465310096740723, "global_step": 169919, "epoch": 1011} {"train_loss": -10.439279556274414, "global_step": 169920, "epoch": 1011} {"train_loss": -10.053658485412598, "global_step": 169921, "epoch": 1011} {"train_loss": -10.612422943115234, "global_step": 169922, "epoch": 1011} {"train_loss": -10.080350875854492, "global_step": 169923, "epoch": 1011} {"train_loss": -10.950959205627441, "global_step": 169924, "epoch": 1011} {"train_loss": -10.106365203857422, "global_step": 169925, "epoch": 1011} {"train_loss": -10.417787551879883, "global_step": 169926, "epoch": 1011} {"train_loss": -10.220346450805664, "global_step": 169927, "epoch": 1011} {"train_loss": -10.539007186889648, "global_step": 169928, "epoch": 1011} {"train_loss": -10.668937683105469, "global_step": 169929, "epoch": 1011} {"train_loss": -10.430203437805176, "global_step": 169930, "epoch": 1011} {"train_loss": -10.95878791809082, "global_step": 169931, "epoch": 1011} {"train_loss": -10.358976364135742, "global_step": 169932, "epoch": 1011} {"train_loss": -10.846126556396484, "global_step": 169933, "epoch": 1011} {"train_loss": -10.539915084838867, "global_step": 169934, "epoch": 1011} {"train_loss": -10.98291015625, "global_step": 169935, "epoch": 1011} {"train_loss": -10.619842529296875, "global_step": 169936, "epoch": 1011} {"train_loss": -11.015478134155273, "global_step": 169937, "epoch": 1011} {"train_loss": -10.8233642578125, "global_step": 169938, "epoch": 1011} {"train_loss": -10.868898391723633, "global_step": 169939, "epoch": 1011} {"train_loss": -10.773900985717773, "global_step": 169940, "epoch": 1011} {"train_loss": -11.047347068786621, "global_step": 169941, "epoch": 1011} {"train_loss": -10.791723251342773, "global_step": 169942, "epoch": 1011} {"train_loss": -10.891409873962402, "global_step": 169943, "epoch": 1011} {"train_loss": -11.011710166931152, "global_step": 169944, "epoch": 1011} {"train_loss": -11.046016693115234, "global_step": 169945, "epoch": 1011} {"train_loss": -10.760334014892578, "global_step": 169946, "epoch": 1011} {"train_loss": -11.13204288482666, "global_step": 169947, "epoch": 1011} {"train_loss": -11.047094345092773, "global_step": 169948, "epoch": 1011} {"train_loss": -11.274818420410156, "global_step": 169949, "epoch": 1011} {"train_loss": -10.932722091674805, "global_step": 169950, "epoch": 1011} {"train_loss": -11.02255630493164, "global_step": 169951, "epoch": 1011} {"train_loss": -11.124773025512695, "global_step": 169952, "epoch": 1011} {"train_loss": -11.157743453979492, "global_step": 169953, "epoch": 1011} {"train_loss": -11.198236465454102, "global_step": 169954, "epoch": 1011} {"train_loss": -11.222396850585938, "global_step": 169955, "epoch": 1011} {"train_loss": -11.101966857910156, "global_step": 169956, "epoch": 1011} {"train_loss": -11.349923133850098, "global_step": 169957, "epoch": 1011} {"train_loss": -11.062461853027344, "global_step": 169958, "epoch": 1011} {"train_loss": -11.169787406921387, "global_step": 169959, "epoch": 1011} {"train_loss": -11.114740371704102, "global_step": 169960, "epoch": 1011} {"train_loss": -11.222652435302734, "global_step": 169961, "epoch": 1011} {"train_loss": -11.286430358886719, "global_step": 169962, "epoch": 1011} {"train_loss": -11.390890121459961, "global_step": 169963, "epoch": 1011} {"train_loss": -11.093839645385742, "global_step": 169964, "epoch": 1011} {"train_loss": -11.301671028137207, "global_step": 169965, "epoch": 1011} {"train_loss": -11.417825698852539, "global_step": 169966, "epoch": 1011} {"train_loss": -11.132973670959473, "global_step": 169967, "epoch": 1011} {"train_loss": -11.218796730041504, "global_step": 169968, "epoch": 1011} {"train_loss": -11.028600692749023, "global_step": 169969, "epoch": 1011} {"train_loss": -11.424468994140625, "global_step": 169970, "epoch": 1011} {"train_loss": -11.172101974487305, "global_step": 169971, "epoch": 1011} {"train_loss": -11.38077163696289, "global_step": 169972, "epoch": 1011} {"train_loss": -11.324499130249023, "global_step": 169973, "epoch": 1011} {"train_loss": -11.180098533630371, "global_step": 169974, "epoch": 1011} {"train_loss": -11.455591201782227, "global_step": 169975, "epoch": 1011} {"train_loss": -11.182413101196289, "global_step": 169976, "epoch": 1011} {"train_loss": -11.476309776306152, "global_step": 169977, "epoch": 1011} {"train_loss": -11.385686874389648, "global_step": 169978, "epoch": 1011} {"train_loss": -11.598810195922852, "global_step": 169979, "epoch": 1011} {"train_loss": -11.263959884643555, "global_step": 169980, "epoch": 1011} {"train_loss": -11.38504695892334, "global_step": 169981, "epoch": 1011} {"train_loss": -11.407989501953125, "global_step": 169982, "epoch": 1011} {"train_loss": -11.533931732177734, "global_step": 169983, "epoch": 1011} {"train_loss": -10.955039024353027, "global_step": 169984, "epoch": 1011} {"train_loss": -11.48339557647705, "global_step": 169985, "epoch": 1011} {"train_loss": -11.217225074768066, "global_step": 169986, "epoch": 1011} {"train_loss": -10.619100570678711, "global_step": 169987, "epoch": 1011} {"train_loss": -10.962074279785156, "global_step": 169988, "epoch": 1011} {"train_loss": -10.70361328125, "global_step": 169989, "epoch": 1011} {"train_loss": -10.609243392944336, "global_step": 169990, "epoch": 1011} {"train_loss": -10.805373191833496, "global_step": 169991, "epoch": 1011} {"train_loss": -10.322994232177734, "global_step": 169992, "epoch": 1011} {"train_loss": -9.73524284362793, "global_step": 169993, "epoch": 1011} {"train_loss": -7.897513389587402, "global_step": 169994, "epoch": 1011} {"train_loss": -8.952442169189453, "global_step": 169995, "epoch": 1011} {"train_loss": -8.390071868896484, "global_step": 169996, "epoch": 1011} {"train_loss": -10.776698112487793, "global_step": 169997, "epoch": 1011} {"train_loss": -9.082275390625, "global_step": 169998, "epoch": 1011} {"train_loss": -10.233317375183105, "global_step": 169999, "epoch": 1011} {"train_loss": -8.996963500976562, "global_step": 170000, "epoch": 1011} {"train_loss": -9.456157684326172, "global_step": 170001, "epoch": 1011} {"train_loss": -9.964040756225586, "global_step": 170002, "epoch": 1011} {"train_loss": -10.001272201538086, "global_step": 170003, "epoch": 1011} {"train_loss": -9.381597518920898, "global_step": 170004, "epoch": 1011} {"train_loss": -10.612637519836426, "global_step": 170005, "epoch": 1011} {"train_loss": -9.699953079223633, "global_step": 170006, "epoch": 1011} {"train_loss": -10.514541625976562, "global_step": 170007, "epoch": 1011} {"train_loss": -10.326360702514648, "global_step": 170008, "epoch": 1011} {"train_loss": -10.101850509643555, "global_step": 170009, "epoch": 1011} {"train_loss": -10.319095611572266, "global_step": 170010, "epoch": 1011} {"train_loss": -10.599602699279785, "global_step": 170011, "epoch": 1011} {"train_loss": -9.974761009216309, "global_step": 170012, "epoch": 1011} {"train_loss": -10.660955429077148, "global_step": 170013, "epoch": 1011} {"train_loss": -9.996063232421875, "global_step": 170014, "epoch": 1011} {"train_loss": -10.80823272182828, "global_step": 170015, "epoch": 1011, "val_loss": 229700.53125} {"train_loss": -10.074206352233887, "global_step": 170016, "epoch": 1012} {"train_loss": -10.1846923828125, "global_step": 170017, "epoch": 1012} {"train_loss": -10.58728313446045, "global_step": 170018, "epoch": 1012} {"train_loss": -10.417622566223145, "global_step": 170019, "epoch": 1012} {"train_loss": -10.389461517333984, "global_step": 170020, "epoch": 1012} {"train_loss": -10.56329345703125, "global_step": 170021, "epoch": 1012} {"train_loss": -10.497486114501953, "global_step": 170022, "epoch": 1012} {"train_loss": -10.490331649780273, "global_step": 170023, "epoch": 1012} {"train_loss": -10.347545623779297, "global_step": 170024, "epoch": 1012} {"train_loss": -10.661214828491211, "global_step": 170025, "epoch": 1012} {"train_loss": -10.702078819274902, "global_step": 170026, "epoch": 1012} {"train_loss": -10.352499008178711, "global_step": 170027, "epoch": 1012} {"train_loss": -10.463390350341797, "global_step": 170028, "epoch": 1012} {"train_loss": -10.746363639831543, "global_step": 170029, "epoch": 1012} {"train_loss": -10.339516639709473, "global_step": 170030, "epoch": 1012} {"train_loss": -10.680328369140625, "global_step": 170031, "epoch": 1012} {"train_loss": -10.666756629943848, "global_step": 170032, "epoch": 1012} {"train_loss": -10.700092315673828, "global_step": 170033, "epoch": 1012} {"train_loss": -10.752019882202148, "global_step": 170034, "epoch": 1012} {"train_loss": -10.694217681884766, "global_step": 170035, "epoch": 1012} {"train_loss": -10.685654640197754, "global_step": 170036, "epoch": 1012} {"train_loss": -10.974902153015137, "global_step": 170037, "epoch": 1012} {"train_loss": -10.872159957885742, "global_step": 170038, "epoch": 1012} {"train_loss": -10.983470916748047, "global_step": 170039, "epoch": 1012} {"train_loss": -11.061042785644531, "global_step": 170040, "epoch": 1012} {"train_loss": -10.961956977844238, "global_step": 170041, "epoch": 1012} {"train_loss": -11.090900421142578, "global_step": 170042, "epoch": 1012} {"train_loss": -10.939445495605469, "global_step": 170043, "epoch": 1012} {"train_loss": -11.102384567260742, "global_step": 170044, "epoch": 1012} {"train_loss": -10.990427017211914, "global_step": 170045, "epoch": 1012} {"train_loss": -10.644996643066406, "global_step": 170046, "epoch": 1012} {"train_loss": -10.92592716217041, "global_step": 170047, "epoch": 1012} {"train_loss": -11.091039657592773, "global_step": 170048, "epoch": 1012} {"train_loss": -11.201315879821777, "global_step": 170049, "epoch": 1012} {"train_loss": -11.09705924987793, "global_step": 170050, "epoch": 1012} {"train_loss": -11.070659637451172, "global_step": 170051, "epoch": 1012} {"train_loss": -11.04068374633789, "global_step": 170052, "epoch": 1012} {"train_loss": -11.326107025146484, "global_step": 170053, "epoch": 1012} {"train_loss": -11.22938346862793, "global_step": 170054, "epoch": 1012} {"train_loss": -10.92529582977295, "global_step": 170055, "epoch": 1012} {"train_loss": -11.107527732849121, "global_step": 170056, "epoch": 1012} {"train_loss": -11.108724594116211, "global_step": 170057, "epoch": 1012} {"train_loss": -11.110325813293457, "global_step": 170058, "epoch": 1012} {"train_loss": -11.351228713989258, "global_step": 170059, "epoch": 1012} {"train_loss": -11.18071174621582, "global_step": 170060, "epoch": 1012} {"train_loss": -11.309398651123047, "global_step": 170061, "epoch": 1012} {"train_loss": -11.090914726257324, "global_step": 170062, "epoch": 1012} {"train_loss": -11.317249298095703, "global_step": 170063, "epoch": 1012} {"train_loss": -10.996514320373535, "global_step": 170064, "epoch": 1012} {"train_loss": -11.120370864868164, "global_step": 170065, "epoch": 1012} {"train_loss": -10.909786224365234, "global_step": 170066, "epoch": 1012} {"train_loss": -10.970073699951172, "global_step": 170067, "epoch": 1012} {"train_loss": -10.823537826538086, "global_step": 170068, "epoch": 1012} {"train_loss": -11.102143287658691, "global_step": 170069, "epoch": 1012} {"train_loss": -11.190300941467285, "global_step": 170070, "epoch": 1012} {"train_loss": -11.2086181640625, "global_step": 170071, "epoch": 1012} {"train_loss": -11.14502239227295, "global_step": 170072, "epoch": 1012} {"train_loss": -11.298097610473633, "global_step": 170073, "epoch": 1012} {"train_loss": -11.09935188293457, "global_step": 170074, "epoch": 1012} {"train_loss": -11.330541610717773, "global_step": 170075, "epoch": 1012} {"train_loss": -11.17691421508789, "global_step": 170076, "epoch": 1012} {"train_loss": -11.395874977111816, "global_step": 170077, "epoch": 1012} {"train_loss": -11.229677200317383, "global_step": 170078, "epoch": 1012} {"train_loss": -11.381851196289062, "global_step": 170079, "epoch": 1012} {"train_loss": -11.340950965881348, "global_step": 170080, "epoch": 1012} {"train_loss": -11.518880844116211, "global_step": 170081, "epoch": 1012} {"train_loss": -10.98239803314209, "global_step": 170082, "epoch": 1012} {"train_loss": -11.57654094696045, "global_step": 170083, "epoch": 1012} {"train_loss": -11.465389251708984, "global_step": 170084, "epoch": 1012} {"train_loss": -11.389410972595215, "global_step": 170085, "epoch": 1012} {"train_loss": -11.492530822753906, "global_step": 170086, "epoch": 1012} {"train_loss": -11.391658782958984, "global_step": 170087, "epoch": 1012} {"train_loss": -11.212226867675781, "global_step": 170088, "epoch": 1012} {"train_loss": -11.298624038696289, "global_step": 170089, "epoch": 1012} {"train_loss": -11.219669342041016, "global_step": 170090, "epoch": 1012} {"train_loss": -11.061840057373047, "global_step": 170091, "epoch": 1012} {"train_loss": -10.810037612915039, "global_step": 170092, "epoch": 1012} {"train_loss": -10.673219680786133, "global_step": 170093, "epoch": 1012} {"train_loss": -11.222640991210938, "global_step": 170094, "epoch": 1012} {"train_loss": -10.870197296142578, "global_step": 170095, "epoch": 1012} {"train_loss": -10.94858169555664, "global_step": 170096, "epoch": 1012} {"train_loss": -9.471338272094727, "global_step": 170097, "epoch": 1012} {"train_loss": -9.240859985351562, "global_step": 170098, "epoch": 1012} {"train_loss": -10.484861373901367, "global_step": 170099, "epoch": 1012} {"train_loss": -9.187322616577148, "global_step": 170100, "epoch": 1012} {"train_loss": -8.040520668029785, "global_step": 170101, "epoch": 1012} {"train_loss": -7.817049503326416, "global_step": 170102, "epoch": 1012} {"train_loss": -9.991703033447266, "global_step": 170103, "epoch": 1012} {"train_loss": -7.637651443481445, "global_step": 170104, "epoch": 1012} {"train_loss": -7.009808540344238, "global_step": 170105, "epoch": 1012} {"train_loss": -7.534295558929443, "global_step": 170106, "epoch": 1012} {"train_loss": -6.6042962074279785, "global_step": 170107, "epoch": 1012} {"train_loss": -7.251555442810059, "global_step": 170108, "epoch": 1012} {"train_loss": -8.498778343200684, "global_step": 170109, "epoch": 1012} {"train_loss": -8.961464881896973, "global_step": 170110, "epoch": 1012} {"train_loss": -9.195809364318848, "global_step": 170111, "epoch": 1012} {"train_loss": -8.401545524597168, "global_step": 170112, "epoch": 1012} {"train_loss": -8.57634162902832, "global_step": 170113, "epoch": 1012} {"train_loss": -9.618890762329102, "global_step": 170114, "epoch": 1012} {"train_loss": -9.967029571533203, "global_step": 170115, "epoch": 1012} {"train_loss": -9.890436172485352, "global_step": 170116, "epoch": 1012} {"train_loss": -9.873733520507812, "global_step": 170117, "epoch": 1012} {"train_loss": -10.258129119873047, "global_step": 170118, "epoch": 1012} {"train_loss": -9.974857330322266, "global_step": 170119, "epoch": 1012} {"train_loss": -9.035812377929688, "global_step": 170120, "epoch": 1012} {"train_loss": -9.758967399597168, "global_step": 170121, "epoch": 1012} {"train_loss": -9.90681266784668, "global_step": 170122, "epoch": 1012} {"train_loss": -9.199586868286133, "global_step": 170123, "epoch": 1012} {"train_loss": -10.077192306518555, "global_step": 170124, "epoch": 1012} {"train_loss": -10.178693771362305, "global_step": 170125, "epoch": 1012} {"train_loss": -10.055597305297852, "global_step": 170126, "epoch": 1012} {"train_loss": -9.818007469177246, "global_step": 170127, "epoch": 1012} {"train_loss": -10.094403266906738, "global_step": 170128, "epoch": 1012} {"train_loss": -10.083715438842773, "global_step": 170129, "epoch": 1012} {"train_loss": -10.491264343261719, "global_step": 170130, "epoch": 1012} {"train_loss": -10.428142547607422, "global_step": 170131, "epoch": 1012} {"train_loss": -10.426803588867188, "global_step": 170132, "epoch": 1012} {"train_loss": -10.531885147094727, "global_step": 170133, "epoch": 1012} {"train_loss": -10.457330703735352, "global_step": 170134, "epoch": 1012} {"train_loss": -10.457487106323242, "global_step": 170135, "epoch": 1012} {"train_loss": -10.382060050964355, "global_step": 170136, "epoch": 1012} {"train_loss": -10.320428848266602, "global_step": 170137, "epoch": 1012} {"train_loss": -10.61058235168457, "global_step": 170138, "epoch": 1012} {"train_loss": -10.490116119384766, "global_step": 170139, "epoch": 1012} {"train_loss": -10.433120727539062, "global_step": 170140, "epoch": 1012} {"train_loss": -10.551630020141602, "global_step": 170141, "epoch": 1012} {"train_loss": -10.586811065673828, "global_step": 170142, "epoch": 1012} {"train_loss": -10.522845268249512, "global_step": 170143, "epoch": 1012} {"train_loss": -10.631446838378906, "global_step": 170144, "epoch": 1012} {"train_loss": -10.859413146972656, "global_step": 170145, "epoch": 1012} {"train_loss": -10.523370742797852, "global_step": 170146, "epoch": 1012} {"train_loss": -10.666308403015137, "global_step": 170147, "epoch": 1012} {"train_loss": -10.978540420532227, "global_step": 170148, "epoch": 1012} {"train_loss": -10.691622734069824, "global_step": 170149, "epoch": 1012} {"train_loss": -10.863080024719238, "global_step": 170150, "epoch": 1012} {"train_loss": -10.72900676727295, "global_step": 170151, "epoch": 1012} {"train_loss": -10.983020782470703, "global_step": 170152, "epoch": 1012} {"train_loss": -10.963613510131836, "global_step": 170153, "epoch": 1012} {"train_loss": -11.040937423706055, "global_step": 170154, "epoch": 1012} {"train_loss": -10.91940689086914, "global_step": 170155, "epoch": 1012} {"train_loss": -10.83222484588623, "global_step": 170156, "epoch": 1012} {"train_loss": -10.973112106323242, "global_step": 170157, "epoch": 1012} {"train_loss": -10.897875785827637, "global_step": 170158, "epoch": 1012} {"train_loss": -11.03561019897461, "global_step": 170159, "epoch": 1012} {"train_loss": -11.007662773132324, "global_step": 170160, "epoch": 1012} {"train_loss": -11.138288497924805, "global_step": 170161, "epoch": 1012} {"train_loss": -10.937544822692871, "global_step": 170162, "epoch": 1012} {"train_loss": -10.988424301147461, "global_step": 170163, "epoch": 1012} {"train_loss": -10.93518352508545, "global_step": 170164, "epoch": 1012} {"train_loss": -11.08413028717041, "global_step": 170165, "epoch": 1012} {"train_loss": -11.037596702575684, "global_step": 170166, "epoch": 1012} {"train_loss": -11.179258346557617, "global_step": 170167, "epoch": 1012} {"train_loss": -11.015653610229492, "global_step": 170168, "epoch": 1012} {"train_loss": -11.251124382019043, "global_step": 170169, "epoch": 1012} {"train_loss": -11.054778099060059, "global_step": 170170, "epoch": 1012} {"train_loss": -11.25422477722168, "global_step": 170171, "epoch": 1012} {"train_loss": -11.193653106689453, "global_step": 170172, "epoch": 1012} {"train_loss": -11.159117698669434, "global_step": 170173, "epoch": 1012} {"train_loss": -11.318534851074219, "global_step": 170174, "epoch": 1012} {"train_loss": -11.331514358520508, "global_step": 170175, "epoch": 1012} {"train_loss": -11.224958419799805, "global_step": 170176, "epoch": 1012} {"train_loss": -11.163830757141113, "global_step": 170177, "epoch": 1012} {"train_loss": -11.392059326171875, "global_step": 170178, "epoch": 1012} {"train_loss": -11.25473403930664, "global_step": 170179, "epoch": 1012} {"train_loss": -11.3260498046875, "global_step": 170180, "epoch": 1012} {"train_loss": -11.32998275756836, "global_step": 170181, "epoch": 1012} {"train_loss": -11.376026153564453, "global_step": 170182, "epoch": 1012} {"train_loss": -10.590260803699493, "global_step": 170183, "epoch": 1012, "val_loss": 233261.546875} {"train_loss": -11.15479850769043, "global_step": 170184, "epoch": 1013} {"train_loss": -11.232939720153809, "global_step": 170185, "epoch": 1013} {"train_loss": -10.982539176940918, "global_step": 170186, "epoch": 1013} {"train_loss": -11.284740447998047, "global_step": 170187, "epoch": 1013} {"train_loss": -11.019207954406738, "global_step": 170188, "epoch": 1013} {"train_loss": -11.072619438171387, "global_step": 170189, "epoch": 1013} {"train_loss": -11.464652061462402, "global_step": 170190, "epoch": 1013} {"train_loss": -11.298025131225586, "global_step": 170191, "epoch": 1013} {"train_loss": -11.179378509521484, "global_step": 170192, "epoch": 1013} {"train_loss": -11.254446029663086, "global_step": 170193, "epoch": 1013} {"train_loss": -11.10957145690918, "global_step": 170194, "epoch": 1013} {"train_loss": -11.101791381835938, "global_step": 170195, "epoch": 1013} {"train_loss": -11.161033630371094, "global_step": 170196, "epoch": 1013} {"train_loss": -11.189725875854492, "global_step": 170197, "epoch": 1013} {"train_loss": -11.256418228149414, "global_step": 170198, "epoch": 1013} {"train_loss": -11.197755813598633, "global_step": 170199, "epoch": 1013} {"train_loss": -11.134500503540039, "global_step": 170200, "epoch": 1013} {"train_loss": -10.815311431884766, "global_step": 170201, "epoch": 1013} {"train_loss": -10.794116020202637, "global_step": 170202, "epoch": 1013} {"train_loss": -10.477067947387695, "global_step": 170203, "epoch": 1013} {"train_loss": -9.997982025146484, "global_step": 170204, "epoch": 1013} {"train_loss": -10.796432495117188, "global_step": 170205, "epoch": 1013} {"train_loss": -10.887939453125, "global_step": 170206, "epoch": 1013} {"train_loss": -9.88228988647461, "global_step": 170207, "epoch": 1013} {"train_loss": -10.82176685333252, "global_step": 170208, "epoch": 1013} {"train_loss": -10.540962219238281, "global_step": 170209, "epoch": 1013} {"train_loss": -9.63122844696045, "global_step": 170210, "epoch": 1013} {"train_loss": -10.864876747131348, "global_step": 170211, "epoch": 1013} {"train_loss": -9.880722045898438, "global_step": 170212, "epoch": 1013} {"train_loss": -10.440479278564453, "global_step": 170213, "epoch": 1013} {"train_loss": -10.505155563354492, "global_step": 170214, "epoch": 1013} {"train_loss": -9.935251235961914, "global_step": 170215, "epoch": 1013} {"train_loss": -10.367422103881836, "global_step": 170216, "epoch": 1013} {"train_loss": -10.812948226928711, "global_step": 170217, "epoch": 1013} {"train_loss": -10.198423385620117, "global_step": 170218, "epoch": 1013} {"train_loss": -11.007661819458008, "global_step": 170219, "epoch": 1013} {"train_loss": -10.824808120727539, "global_step": 170220, "epoch": 1013} {"train_loss": -10.504558563232422, "global_step": 170221, "epoch": 1013} {"train_loss": -10.965288162231445, "global_step": 170222, "epoch": 1013} {"train_loss": -10.379114151000977, "global_step": 170223, "epoch": 1013} {"train_loss": -10.572834968566895, "global_step": 170224, "epoch": 1013} {"train_loss": -10.766788482666016, "global_step": 170225, "epoch": 1013} {"train_loss": -10.489139556884766, "global_step": 170226, "epoch": 1013} {"train_loss": -11.029132843017578, "global_step": 170227, "epoch": 1013} {"train_loss": -10.930410385131836, "global_step": 170228, "epoch": 1013} {"train_loss": -10.786523818969727, "global_step": 170229, "epoch": 1013} {"train_loss": -10.845305442810059, "global_step": 170230, "epoch": 1013} {"train_loss": -10.7794189453125, "global_step": 170231, "epoch": 1013} {"train_loss": -10.93106460571289, "global_step": 170232, "epoch": 1013} {"train_loss": -10.708372116088867, "global_step": 170233, "epoch": 1013} {"train_loss": -11.0667142868042, "global_step": 170234, "epoch": 1013} {"train_loss": -11.174457550048828, "global_step": 170235, "epoch": 1013} {"train_loss": -11.067851066589355, "global_step": 170236, "epoch": 1013} {"train_loss": -11.057474136352539, "global_step": 170237, "epoch": 1013} {"train_loss": -10.860675811767578, "global_step": 170238, "epoch": 1013} {"train_loss": -10.905619621276855, "global_step": 170239, "epoch": 1013} {"train_loss": -10.937522888183594, "global_step": 170240, "epoch": 1013} {"train_loss": -10.900569915771484, "global_step": 170241, "epoch": 1013} {"train_loss": -11.048528671264648, "global_step": 170242, "epoch": 1013} {"train_loss": -10.926671981811523, "global_step": 170243, "epoch": 1013} {"train_loss": -11.15833568572998, "global_step": 170244, "epoch": 1013} {"train_loss": -10.874273300170898, "global_step": 170245, "epoch": 1013} {"train_loss": -11.279340744018555, "global_step": 170246, "epoch": 1013} {"train_loss": -11.18629264831543, "global_step": 170247, "epoch": 1013} {"train_loss": -11.112367630004883, "global_step": 170248, "epoch": 1013} {"train_loss": -11.275215148925781, "global_step": 170249, "epoch": 1013} {"train_loss": -11.22636604309082, "global_step": 170250, "epoch": 1013} {"train_loss": -11.250642776489258, "global_step": 170251, "epoch": 1013} {"train_loss": -11.365437507629395, "global_step": 170252, "epoch": 1013} {"train_loss": -11.103864669799805, "global_step": 170253, "epoch": 1013} {"train_loss": -11.493212699890137, "global_step": 170254, "epoch": 1013} {"train_loss": -11.033509254455566, "global_step": 170255, "epoch": 1013} {"train_loss": -11.403053283691406, "global_step": 170256, "epoch": 1013} {"train_loss": -11.380212783813477, "global_step": 170257, "epoch": 1013} {"train_loss": -11.377347946166992, "global_step": 170258, "epoch": 1013} {"train_loss": -11.33674430847168, "global_step": 170259, "epoch": 1013} {"train_loss": -11.118391036987305, "global_step": 170260, "epoch": 1013} {"train_loss": -11.211299896240234, "global_step": 170261, "epoch": 1013} {"train_loss": -11.216242790222168, "global_step": 170262, "epoch": 1013} {"train_loss": -11.500746726989746, "global_step": 170263, "epoch": 1013} {"train_loss": -11.342048645019531, "global_step": 170264, "epoch": 1013} {"train_loss": -11.165127754211426, "global_step": 170265, "epoch": 1013} {"train_loss": -11.359123229980469, "global_step": 170266, "epoch": 1013} {"train_loss": -11.050623893737793, "global_step": 170267, "epoch": 1013} {"train_loss": -11.485136032104492, "global_step": 170268, "epoch": 1013} {"train_loss": -11.105722427368164, "global_step": 170269, "epoch": 1013} {"train_loss": -11.347529411315918, "global_step": 170270, "epoch": 1013} {"train_loss": -11.435898780822754, "global_step": 170271, "epoch": 1013} {"train_loss": -11.471155166625977, "global_step": 170272, "epoch": 1013} {"train_loss": -11.298870086669922, "global_step": 170273, "epoch": 1013} {"train_loss": -11.478523254394531, "global_step": 170274, "epoch": 1013} {"train_loss": -11.489994049072266, "global_step": 170275, "epoch": 1013} {"train_loss": -11.215782165527344, "global_step": 170276, "epoch": 1013} {"train_loss": -10.982833862304688, "global_step": 170277, "epoch": 1013} {"train_loss": -11.211727142333984, "global_step": 170278, "epoch": 1013} {"train_loss": -11.227253913879395, "global_step": 170279, "epoch": 1013} {"train_loss": -11.315484046936035, "global_step": 170280, "epoch": 1013} {"train_loss": -11.30213451385498, "global_step": 170281, "epoch": 1013} {"train_loss": -11.193315505981445, "global_step": 170282, "epoch": 1013} {"train_loss": -11.060750961303711, "global_step": 170283, "epoch": 1013} {"train_loss": -10.975955963134766, "global_step": 170284, "epoch": 1013} {"train_loss": -11.30919075012207, "global_step": 170285, "epoch": 1013} {"train_loss": -10.80007553100586, "global_step": 170286, "epoch": 1013} {"train_loss": -10.24928092956543, "global_step": 170287, "epoch": 1013} {"train_loss": -9.913009643554688, "global_step": 170288, "epoch": 1013} {"train_loss": -10.198110580444336, "global_step": 170289, "epoch": 1013} {"train_loss": -8.129129409790039, "global_step": 170290, "epoch": 1013} {"train_loss": -10.550167083740234, "global_step": 170291, "epoch": 1013} {"train_loss": -9.220293998718262, "global_step": 170292, "epoch": 1013} {"train_loss": -9.838512420654297, "global_step": 170293, "epoch": 1013} {"train_loss": -10.450254440307617, "global_step": 170294, "epoch": 1013} {"train_loss": -8.298600196838379, "global_step": 170295, "epoch": 1013} {"train_loss": -10.742410659790039, "global_step": 170296, "epoch": 1013} {"train_loss": -9.876593589782715, "global_step": 170297, "epoch": 1013} {"train_loss": -8.890190124511719, "global_step": 170298, "epoch": 1013} {"train_loss": -9.231460571289062, "global_step": 170299, "epoch": 1013} {"train_loss": -9.896305084228516, "global_step": 170300, "epoch": 1013} {"train_loss": -9.39915657043457, "global_step": 170301, "epoch": 1013} {"train_loss": -9.595451354980469, "global_step": 170302, "epoch": 1013} {"train_loss": -9.581624984741211, "global_step": 170303, "epoch": 1013} {"train_loss": -10.370187759399414, "global_step": 170304, "epoch": 1013} {"train_loss": -9.57992172241211, "global_step": 170305, "epoch": 1013} {"train_loss": -10.261198997497559, "global_step": 170306, "epoch": 1013} {"train_loss": -9.9141263961792, "global_step": 170307, "epoch": 1013} {"train_loss": -10.620157241821289, "global_step": 170308, "epoch": 1013} {"train_loss": -10.424064636230469, "global_step": 170309, "epoch": 1013} {"train_loss": -9.918943405151367, "global_step": 170310, "epoch": 1013} {"train_loss": -10.464445114135742, "global_step": 170311, "epoch": 1013} {"train_loss": -9.807828903198242, "global_step": 170312, "epoch": 1013} {"train_loss": -10.197994232177734, "global_step": 170313, "epoch": 1013} {"train_loss": -10.69263744354248, "global_step": 170314, "epoch": 1013} {"train_loss": -10.472543716430664, "global_step": 170315, "epoch": 1013} {"train_loss": -10.647150039672852, "global_step": 170316, "epoch": 1013} {"train_loss": -10.586204528808594, "global_step": 170317, "epoch": 1013} {"train_loss": -10.50814437866211, "global_step": 170318, "epoch": 1013} {"train_loss": -10.669133186340332, "global_step": 170319, "epoch": 1013} {"train_loss": -10.531347274780273, "global_step": 170320, "epoch": 1013} {"train_loss": -10.723947525024414, "global_step": 170321, "epoch": 1013} {"train_loss": -10.591503143310547, "global_step": 170322, "epoch": 1013} {"train_loss": -10.677255630493164, "global_step": 170323, "epoch": 1013} {"train_loss": -10.970414161682129, "global_step": 170324, "epoch": 1013} {"train_loss": -10.597780227661133, "global_step": 170325, "epoch": 1013} {"train_loss": -10.7509765625, "global_step": 170326, "epoch": 1013} {"train_loss": -10.790414810180664, "global_step": 170327, "epoch": 1013} {"train_loss": -10.816424369812012, "global_step": 170328, "epoch": 1013} {"train_loss": -10.714231491088867, "global_step": 170329, "epoch": 1013} {"train_loss": -11.08764362335205, "global_step": 170330, "epoch": 1013} {"train_loss": -10.713663101196289, "global_step": 170331, "epoch": 1013} {"train_loss": -10.816251754760742, "global_step": 170332, "epoch": 1013} {"train_loss": -10.945045471191406, "global_step": 170333, "epoch": 1013} {"train_loss": -11.018860816955566, "global_step": 170334, "epoch": 1013} {"train_loss": -10.916666030883789, "global_step": 170335, "epoch": 1013} {"train_loss": -11.0325927734375, "global_step": 170336, "epoch": 1013} {"train_loss": -10.78353500366211, "global_step": 170337, "epoch": 1013} {"train_loss": -10.96230697631836, "global_step": 170338, "epoch": 1013} {"train_loss": -11.046075820922852, "global_step": 170339, "epoch": 1013} {"train_loss": -10.958537101745605, "global_step": 170340, "epoch": 1013} {"train_loss": -11.038884162902832, "global_step": 170341, "epoch": 1013} {"train_loss": -10.852632522583008, "global_step": 170342, "epoch": 1013} {"train_loss": -11.050929069519043, "global_step": 170343, "epoch": 1013} {"train_loss": -10.966596603393555, "global_step": 170344, "epoch": 1013} {"train_loss": -11.155526161193848, "global_step": 170345, "epoch": 1013} {"train_loss": -11.098974227905273, "global_step": 170346, "epoch": 1013} {"train_loss": -11.053129196166992, "global_step": 170347, "epoch": 1013} {"train_loss": -11.182053565979004, "global_step": 170348, "epoch": 1013} {"train_loss": -11.150397300720215, "global_step": 170349, "epoch": 1013} {"train_loss": -11.012214660644531, "global_step": 170350, "epoch": 1013} {"train_loss": -10.77984825202397, "global_step": 170351, "epoch": 1013, "val_loss": 237392.609375} {"train_loss": -11.313880920410156, "global_step": 170352, "epoch": 1014} {"train_loss": -11.188793182373047, "global_step": 170353, "epoch": 1014} {"train_loss": -11.104961395263672, "global_step": 170354, "epoch": 1014} {"train_loss": -11.277647018432617, "global_step": 170355, "epoch": 1014} {"train_loss": -11.238399505615234, "global_step": 170356, "epoch": 1014} {"train_loss": -11.38657283782959, "global_step": 170357, "epoch": 1014} {"train_loss": -11.364887237548828, "global_step": 170358, "epoch": 1014} {"train_loss": -11.250316619873047, "global_step": 170359, "epoch": 1014} {"train_loss": -11.167445182800293, "global_step": 170360, "epoch": 1014} {"train_loss": -11.404870986938477, "global_step": 170361, "epoch": 1014} {"train_loss": -11.133596420288086, "global_step": 170362, "epoch": 1014} {"train_loss": -11.034687042236328, "global_step": 170363, "epoch": 1014} {"train_loss": -11.243377685546875, "global_step": 170364, "epoch": 1014} {"train_loss": -11.229400634765625, "global_step": 170365, "epoch": 1014} {"train_loss": -11.544329643249512, "global_step": 170366, "epoch": 1014} {"train_loss": -11.273466110229492, "global_step": 170367, "epoch": 1014} {"train_loss": -11.219791412353516, "global_step": 170368, "epoch": 1014} {"train_loss": -11.266891479492188, "global_step": 170369, "epoch": 1014} {"train_loss": -11.272937774658203, "global_step": 170370, "epoch": 1014} {"train_loss": -11.060979843139648, "global_step": 170371, "epoch": 1014} {"train_loss": -11.273168563842773, "global_step": 170372, "epoch": 1014} {"train_loss": -11.277366638183594, "global_step": 170373, "epoch": 1014} {"train_loss": -11.07088851928711, "global_step": 170374, "epoch": 1014} {"train_loss": -11.50377082824707, "global_step": 170375, "epoch": 1014} {"train_loss": -11.1854887008667, "global_step": 170376, "epoch": 1014} {"train_loss": -11.384235382080078, "global_step": 170377, "epoch": 1014} {"train_loss": -11.166271209716797, "global_step": 170378, "epoch": 1014} {"train_loss": -11.246971130371094, "global_step": 170379, "epoch": 1014} {"train_loss": -11.149303436279297, "global_step": 170380, "epoch": 1014} {"train_loss": -11.06094741821289, "global_step": 170381, "epoch": 1014} {"train_loss": -11.554550170898438, "global_step": 170382, "epoch": 1014} {"train_loss": -11.19106674194336, "global_step": 170383, "epoch": 1014} {"train_loss": -11.108199119567871, "global_step": 170384, "epoch": 1014} {"train_loss": -11.255790710449219, "global_step": 170385, "epoch": 1014} {"train_loss": -11.427851676940918, "global_step": 170386, "epoch": 1014} {"train_loss": -10.716109275817871, "global_step": 170387, "epoch": 1014} {"train_loss": -10.94581127166748, "global_step": 170388, "epoch": 1014} {"train_loss": -11.517756462097168, "global_step": 170389, "epoch": 1014} {"train_loss": -10.915229797363281, "global_step": 170390, "epoch": 1014} {"train_loss": -11.121400833129883, "global_step": 170391, "epoch": 1014} {"train_loss": -11.50759220123291, "global_step": 170392, "epoch": 1014} {"train_loss": -11.210332870483398, "global_step": 170393, "epoch": 1014} {"train_loss": -11.228242874145508, "global_step": 170394, "epoch": 1014} {"train_loss": -11.093040466308594, "global_step": 170395, "epoch": 1014} {"train_loss": -10.956448554992676, "global_step": 170396, "epoch": 1014} {"train_loss": -11.315038681030273, "global_step": 170397, "epoch": 1014} {"train_loss": -11.249763488769531, "global_step": 170398, "epoch": 1014} {"train_loss": -10.845992088317871, "global_step": 170399, "epoch": 1014} {"train_loss": -11.27729320526123, "global_step": 170400, "epoch": 1014} {"train_loss": -11.052361488342285, "global_step": 170401, "epoch": 1014} {"train_loss": -11.243753433227539, "global_step": 170402, "epoch": 1014} {"train_loss": -11.079317092895508, "global_step": 170403, "epoch": 1014} {"train_loss": -11.282639503479004, "global_step": 170404, "epoch": 1014} {"train_loss": -11.243444442749023, "global_step": 170405, "epoch": 1014} {"train_loss": -11.41096305847168, "global_step": 170406, "epoch": 1014} {"train_loss": -10.950414657592773, "global_step": 170407, "epoch": 1014} {"train_loss": -11.02700424194336, "global_step": 170408, "epoch": 1014} {"train_loss": -11.065279006958008, "global_step": 170409, "epoch": 1014} {"train_loss": -11.006814002990723, "global_step": 170410, "epoch": 1014} {"train_loss": -11.121024131774902, "global_step": 170411, "epoch": 1014} {"train_loss": -11.19171142578125, "global_step": 170412, "epoch": 1014} {"train_loss": -10.867326736450195, "global_step": 170413, "epoch": 1014} {"train_loss": -10.674253463745117, "global_step": 170414, "epoch": 1014} {"train_loss": -10.924922943115234, "global_step": 170415, "epoch": 1014} {"train_loss": -10.835975646972656, "global_step": 170416, "epoch": 1014} {"train_loss": -11.251194953918457, "global_step": 170417, "epoch": 1014} {"train_loss": -10.597103118896484, "global_step": 170418, "epoch": 1014} {"train_loss": -10.732471466064453, "global_step": 170419, "epoch": 1014} {"train_loss": -10.978161811828613, "global_step": 170420, "epoch": 1014} {"train_loss": -10.555727005004883, "global_step": 170421, "epoch": 1014} {"train_loss": -11.316650390625, "global_step": 170422, "epoch": 1014} {"train_loss": -11.020491600036621, "global_step": 170423, "epoch": 1014} {"train_loss": -10.953283309936523, "global_step": 170424, "epoch": 1014} {"train_loss": -11.200732231140137, "global_step": 170425, "epoch": 1014} {"train_loss": -11.101713180541992, "global_step": 170426, "epoch": 1014} {"train_loss": -10.998756408691406, "global_step": 170427, "epoch": 1014} {"train_loss": -11.058246612548828, "global_step": 170428, "epoch": 1014} {"train_loss": -10.97637939453125, "global_step": 170429, "epoch": 1014} {"train_loss": -10.818611145019531, "global_step": 170430, "epoch": 1014} {"train_loss": -11.08392333984375, "global_step": 170431, "epoch": 1014} {"train_loss": -10.419084548950195, "global_step": 170432, "epoch": 1014} {"train_loss": -10.282301902770996, "global_step": 170433, "epoch": 1014} {"train_loss": -11.000442504882812, "global_step": 170434, "epoch": 1014} {"train_loss": -9.847380638122559, "global_step": 170435, "epoch": 1014} {"train_loss": -9.71077823638916, "global_step": 170436, "epoch": 1014} {"train_loss": -10.323952674865723, "global_step": 170437, "epoch": 1014} {"train_loss": -9.024953842163086, "global_step": 170438, "epoch": 1014} {"train_loss": -10.24457836151123, "global_step": 170439, "epoch": 1014} {"train_loss": -10.244386672973633, "global_step": 170440, "epoch": 1014} {"train_loss": -9.435030937194824, "global_step": 170441, "epoch": 1014} {"train_loss": -9.604433059692383, "global_step": 170442, "epoch": 1014} {"train_loss": -9.03769302368164, "global_step": 170443, "epoch": 1014} {"train_loss": -8.934389114379883, "global_step": 170444, "epoch": 1014} {"train_loss": -9.757610321044922, "global_step": 170445, "epoch": 1014} {"train_loss": -10.023262977600098, "global_step": 170446, "epoch": 1014} {"train_loss": -9.09333610534668, "global_step": 170447, "epoch": 1014} {"train_loss": -10.300568580627441, "global_step": 170448, "epoch": 1014} {"train_loss": -9.966355323791504, "global_step": 170449, "epoch": 1014} {"train_loss": -10.19131851196289, "global_step": 170450, "epoch": 1014} {"train_loss": -10.279754638671875, "global_step": 170451, "epoch": 1014} {"train_loss": -10.510848045349121, "global_step": 170452, "epoch": 1014} {"train_loss": -10.29592514038086, "global_step": 170453, "epoch": 1014} {"train_loss": -10.156377792358398, "global_step": 170454, "epoch": 1014} {"train_loss": -10.312413215637207, "global_step": 170455, "epoch": 1014} {"train_loss": -10.33773422241211, "global_step": 170456, "epoch": 1014} {"train_loss": -10.471946716308594, "global_step": 170457, "epoch": 1014} {"train_loss": -10.639562606811523, "global_step": 170458, "epoch": 1014} {"train_loss": -10.478166580200195, "global_step": 170459, "epoch": 1014} {"train_loss": -10.74290943145752, "global_step": 170460, "epoch": 1014} {"train_loss": -10.759336471557617, "global_step": 170461, "epoch": 1014} {"train_loss": -10.825855255126953, "global_step": 170462, "epoch": 1014} {"train_loss": -10.751222610473633, "global_step": 170463, "epoch": 1014} {"train_loss": -10.815025329589844, "global_step": 170464, "epoch": 1014} {"train_loss": -10.92459487915039, "global_step": 170465, "epoch": 1014} {"train_loss": -10.899232864379883, "global_step": 170466, "epoch": 1014} {"train_loss": -11.174306869506836, "global_step": 170467, "epoch": 1014} {"train_loss": -10.950582504272461, "global_step": 170468, "epoch": 1014} {"train_loss": -10.979424476623535, "global_step": 170469, "epoch": 1014} {"train_loss": -10.906232833862305, "global_step": 170470, "epoch": 1014} {"train_loss": -10.914819717407227, "global_step": 170471, "epoch": 1014} {"train_loss": -11.148360252380371, "global_step": 170472, "epoch": 1014} {"train_loss": -11.099959373474121, "global_step": 170473, "epoch": 1014} {"train_loss": -10.981405258178711, "global_step": 170474, "epoch": 1014} {"train_loss": -10.966157913208008, "global_step": 170475, "epoch": 1014} {"train_loss": -10.900068283081055, "global_step": 170476, "epoch": 1014} {"train_loss": -10.908656120300293, "global_step": 170477, "epoch": 1014} {"train_loss": -11.182525634765625, "global_step": 170478, "epoch": 1014} {"train_loss": -11.209745407104492, "global_step": 170479, "epoch": 1014} {"train_loss": -11.103737831115723, "global_step": 170480, "epoch": 1014} {"train_loss": -11.208846092224121, "global_step": 170481, "epoch": 1014} {"train_loss": -11.206279754638672, "global_step": 170482, "epoch": 1014} {"train_loss": -11.085880279541016, "global_step": 170483, "epoch": 1014} {"train_loss": -11.159961700439453, "global_step": 170484, "epoch": 1014} {"train_loss": -11.217477798461914, "global_step": 170485, "epoch": 1014} {"train_loss": -11.152165412902832, "global_step": 170486, "epoch": 1014} {"train_loss": -11.316438674926758, "global_step": 170487, "epoch": 1014} {"train_loss": -11.269243240356445, "global_step": 170488, "epoch": 1014} {"train_loss": -11.262243270874023, "global_step": 170489, "epoch": 1014} {"train_loss": -11.234106063842773, "global_step": 170490, "epoch": 1014} {"train_loss": -11.15636157989502, "global_step": 170491, "epoch": 1014} {"train_loss": -11.31199836730957, "global_step": 170492, "epoch": 1014} {"train_loss": -11.30984878540039, "global_step": 170493, "epoch": 1014} {"train_loss": -11.327128410339355, "global_step": 170494, "epoch": 1014} {"train_loss": -11.234543800354004, "global_step": 170495, "epoch": 1014} {"train_loss": -11.141847610473633, "global_step": 170496, "epoch": 1014} {"train_loss": -11.32257080078125, "global_step": 170497, "epoch": 1014} {"train_loss": -11.370410919189453, "global_step": 170498, "epoch": 1014} {"train_loss": -11.032727241516113, "global_step": 170499, "epoch": 1014} {"train_loss": -11.326193809509277, "global_step": 170500, "epoch": 1014} {"train_loss": -10.807104110717773, "global_step": 170501, "epoch": 1014} {"train_loss": -11.100959777832031, "global_step": 170502, "epoch": 1014} {"train_loss": -11.451761245727539, "global_step": 170503, "epoch": 1014} {"train_loss": -11.017522811889648, "global_step": 170504, "epoch": 1014} {"train_loss": -11.09640884399414, "global_step": 170505, "epoch": 1014} {"train_loss": -11.424560546875, "global_step": 170506, "epoch": 1014} {"train_loss": -10.94996452331543, "global_step": 170507, "epoch": 1014} {"train_loss": -10.568017959594727, "global_step": 170508, "epoch": 1014} {"train_loss": -11.40413761138916, "global_step": 170509, "epoch": 1014} {"train_loss": -11.325397491455078, "global_step": 170510, "epoch": 1014} {"train_loss": -10.933662414550781, "global_step": 170511, "epoch": 1014} {"train_loss": -11.280984878540039, "global_step": 170512, "epoch": 1014} {"train_loss": -11.325772285461426, "global_step": 170513, "epoch": 1014} {"train_loss": -11.040748596191406, "global_step": 170514, "epoch": 1014} {"train_loss": -11.184016227722168, "global_step": 170515, "epoch": 1014} {"train_loss": -11.1670503616333, "global_step": 170516, "epoch": 1014} {"train_loss": -11.198539733886719, "global_step": 170517, "epoch": 1014} {"train_loss": -10.849578857421875, "global_step": 170518, "epoch": 1014} {"train_loss": -10.943148351850963, "global_step": 170519, "epoch": 1014, "val_loss": 238175.21875} {"train_loss": -10.773503303527832, "global_step": 170520, "epoch": 1015} {"train_loss": -10.583166122436523, "global_step": 170521, "epoch": 1015} {"train_loss": -10.891379356384277, "global_step": 170522, "epoch": 1015} {"train_loss": -10.755343437194824, "global_step": 170523, "epoch": 1015} {"train_loss": -10.678954124450684, "global_step": 170524, "epoch": 1015} {"train_loss": -10.476480484008789, "global_step": 170525, "epoch": 1015} {"train_loss": -10.418990135192871, "global_step": 170526, "epoch": 1015} {"train_loss": -10.857866287231445, "global_step": 170527, "epoch": 1015} {"train_loss": -10.358612060546875, "global_step": 170528, "epoch": 1015} {"train_loss": -10.533587455749512, "global_step": 170529, "epoch": 1015} {"train_loss": -10.634880065917969, "global_step": 170530, "epoch": 1015} {"train_loss": -9.964454650878906, "global_step": 170531, "epoch": 1015} {"train_loss": -10.975564956665039, "global_step": 170532, "epoch": 1015} {"train_loss": -9.757537841796875, "global_step": 170533, "epoch": 1015} {"train_loss": -9.837051391601562, "global_step": 170534, "epoch": 1015} {"train_loss": -10.71237564086914, "global_step": 170535, "epoch": 1015} {"train_loss": -9.883800506591797, "global_step": 170536, "epoch": 1015} {"train_loss": -10.486017227172852, "global_step": 170537, "epoch": 1015} {"train_loss": -10.209615707397461, "global_step": 170538, "epoch": 1015} {"train_loss": -10.353957176208496, "global_step": 170539, "epoch": 1015} {"train_loss": -10.274492263793945, "global_step": 170540, "epoch": 1015} {"train_loss": -9.988994598388672, "global_step": 170541, "epoch": 1015} {"train_loss": -10.661977767944336, "global_step": 170542, "epoch": 1015} {"train_loss": -9.70016098022461, "global_step": 170543, "epoch": 1015} {"train_loss": -10.807769775390625, "global_step": 170544, "epoch": 1015} {"train_loss": -10.71490478515625, "global_step": 170545, "epoch": 1015} {"train_loss": -10.367073059082031, "global_step": 170546, "epoch": 1015} {"train_loss": -11.03628158569336, "global_step": 170547, "epoch": 1015} {"train_loss": -10.566595077514648, "global_step": 170548, "epoch": 1015} {"train_loss": -10.880315780639648, "global_step": 170549, "epoch": 1015} {"train_loss": -10.509796142578125, "global_step": 170550, "epoch": 1015} {"train_loss": -10.970466613769531, "global_step": 170551, "epoch": 1015} {"train_loss": -11.052156448364258, "global_step": 170552, "epoch": 1015} {"train_loss": -10.567947387695312, "global_step": 170553, "epoch": 1015} {"train_loss": -11.01453971862793, "global_step": 170554, "epoch": 1015} {"train_loss": -10.660836219787598, "global_step": 170555, "epoch": 1015} {"train_loss": -10.432195663452148, "global_step": 170556, "epoch": 1015} {"train_loss": -11.04212760925293, "global_step": 170557, "epoch": 1015} {"train_loss": -10.587813377380371, "global_step": 170558, "epoch": 1015} {"train_loss": -10.965681076049805, "global_step": 170559, "epoch": 1015} {"train_loss": -10.962545394897461, "global_step": 170560, "epoch": 1015} {"train_loss": -10.925056457519531, "global_step": 170561, "epoch": 1015} {"train_loss": -10.766486167907715, "global_step": 170562, "epoch": 1015} {"train_loss": -11.131068229675293, "global_step": 170563, "epoch": 1015} {"train_loss": -10.849580764770508, "global_step": 170564, "epoch": 1015} {"train_loss": -10.882533073425293, "global_step": 170565, "epoch": 1015} {"train_loss": -10.97811508178711, "global_step": 170566, "epoch": 1015} {"train_loss": -11.22898006439209, "global_step": 170567, "epoch": 1015} {"train_loss": -11.084112167358398, "global_step": 170568, "epoch": 1015} {"train_loss": -11.110109329223633, "global_step": 170569, "epoch": 1015} {"train_loss": -11.206548690795898, "global_step": 170570, "epoch": 1015} {"train_loss": -11.407875061035156, "global_step": 170571, "epoch": 1015} {"train_loss": -11.251835823059082, "global_step": 170572, "epoch": 1015} {"train_loss": -11.11460018157959, "global_step": 170573, "epoch": 1015} {"train_loss": -11.314641952514648, "global_step": 170574, "epoch": 1015} {"train_loss": -11.17020034790039, "global_step": 170575, "epoch": 1015} {"train_loss": -11.164899826049805, "global_step": 170576, "epoch": 1015} {"train_loss": -11.256304740905762, "global_step": 170577, "epoch": 1015} {"train_loss": -11.44225788116455, "global_step": 170578, "epoch": 1015} {"train_loss": -11.252613067626953, "global_step": 170579, "epoch": 1015} {"train_loss": -11.377378463745117, "global_step": 170580, "epoch": 1015} {"train_loss": -11.247514724731445, "global_step": 170581, "epoch": 1015} {"train_loss": -11.036945343017578, "global_step": 170582, "epoch": 1015} {"train_loss": -11.399391174316406, "global_step": 170583, "epoch": 1015} {"train_loss": -11.275504112243652, "global_step": 170584, "epoch": 1015} {"train_loss": -11.219621658325195, "global_step": 170585, "epoch": 1015} {"train_loss": -11.394269943237305, "global_step": 170586, "epoch": 1015} {"train_loss": -11.289098739624023, "global_step": 170587, "epoch": 1015} {"train_loss": -11.147706985473633, "global_step": 170588, "epoch": 1015} {"train_loss": -11.276199340820312, "global_step": 170589, "epoch": 1015} {"train_loss": -11.518973350524902, "global_step": 170590, "epoch": 1015} {"train_loss": -11.454753875732422, "global_step": 170591, "epoch": 1015} {"train_loss": -11.369341850280762, "global_step": 170592, "epoch": 1015} {"train_loss": -11.44482421875, "global_step": 170593, "epoch": 1015} {"train_loss": -11.374011993408203, "global_step": 170594, "epoch": 1015} {"train_loss": -11.559891700744629, "global_step": 170595, "epoch": 1015} {"train_loss": -11.370287895202637, "global_step": 170596, "epoch": 1015} {"train_loss": -11.256656646728516, "global_step": 170597, "epoch": 1015} {"train_loss": -11.270594596862793, "global_step": 170598, "epoch": 1015} {"train_loss": -11.287038803100586, "global_step": 170599, "epoch": 1015} {"train_loss": -11.21939468383789, "global_step": 170600, "epoch": 1015} {"train_loss": -11.358731269836426, "global_step": 170601, "epoch": 1015} {"train_loss": -11.21646785736084, "global_step": 170602, "epoch": 1015} {"train_loss": -11.22221851348877, "global_step": 170603, "epoch": 1015} {"train_loss": -11.444990158081055, "global_step": 170604, "epoch": 1015} {"train_loss": -11.333720207214355, "global_step": 170605, "epoch": 1015} {"train_loss": -11.079061508178711, "global_step": 170606, "epoch": 1015} {"train_loss": -11.267492294311523, "global_step": 170607, "epoch": 1015} {"train_loss": -11.2797212600708, "global_step": 170608, "epoch": 1015} {"train_loss": -10.664463996887207, "global_step": 170609, "epoch": 1015} {"train_loss": -10.09537124633789, "global_step": 170610, "epoch": 1015} {"train_loss": -10.61566162109375, "global_step": 170611, "epoch": 1015} {"train_loss": -11.064126968383789, "global_step": 170612, "epoch": 1015} {"train_loss": -10.386357307434082, "global_step": 170613, "epoch": 1015} {"train_loss": -10.6163330078125, "global_step": 170614, "epoch": 1015} {"train_loss": -10.650894165039062, "global_step": 170615, "epoch": 1015} {"train_loss": -10.768014907836914, "global_step": 170616, "epoch": 1015} {"train_loss": -10.38584041595459, "global_step": 170617, "epoch": 1015} {"train_loss": -9.917160034179688, "global_step": 170618, "epoch": 1015} {"train_loss": -10.517829895019531, "global_step": 170619, "epoch": 1015} {"train_loss": -9.552252769470215, "global_step": 170620, "epoch": 1015} {"train_loss": -9.961847305297852, "global_step": 170621, "epoch": 1015} {"train_loss": -10.881786346435547, "global_step": 170622, "epoch": 1015} {"train_loss": -10.138357162475586, "global_step": 170623, "epoch": 1015} {"train_loss": -10.883503913879395, "global_step": 170624, "epoch": 1015} {"train_loss": -10.783315658569336, "global_step": 170625, "epoch": 1015} {"train_loss": -10.911606788635254, "global_step": 170626, "epoch": 1015} {"train_loss": -10.22361946105957, "global_step": 170627, "epoch": 1015} {"train_loss": -10.413650512695312, "global_step": 170628, "epoch": 1015} {"train_loss": -10.802654266357422, "global_step": 170629, "epoch": 1015} {"train_loss": -10.283385276794434, "global_step": 170630, "epoch": 1015} {"train_loss": -10.698772430419922, "global_step": 170631, "epoch": 1015} {"train_loss": -9.9111909866333, "global_step": 170632, "epoch": 1015} {"train_loss": -10.834808349609375, "global_step": 170633, "epoch": 1015} {"train_loss": -10.153364181518555, "global_step": 170634, "epoch": 1015} {"train_loss": -10.944082260131836, "global_step": 170635, "epoch": 1015} {"train_loss": -9.802988052368164, "global_step": 170636, "epoch": 1015} {"train_loss": -10.899933815002441, "global_step": 170637, "epoch": 1015} {"train_loss": -10.456533432006836, "global_step": 170638, "epoch": 1015} {"train_loss": -10.873266220092773, "global_step": 170639, "epoch": 1015} {"train_loss": -10.777996063232422, "global_step": 170640, "epoch": 1015} {"train_loss": -10.621313095092773, "global_step": 170641, "epoch": 1015} {"train_loss": -10.465576171875, "global_step": 170642, "epoch": 1015} {"train_loss": -10.779060363769531, "global_step": 170643, "epoch": 1015} {"train_loss": -10.46457290649414, "global_step": 170644, "epoch": 1015} {"train_loss": -11.070880889892578, "global_step": 170645, "epoch": 1015} {"train_loss": -10.700604438781738, "global_step": 170646, "epoch": 1015} {"train_loss": -10.965875625610352, "global_step": 170647, "epoch": 1015} {"train_loss": -10.927570343017578, "global_step": 170648, "epoch": 1015} {"train_loss": -11.148661613464355, "global_step": 170649, "epoch": 1015} {"train_loss": -10.700679779052734, "global_step": 170650, "epoch": 1015} {"train_loss": -10.894776344299316, "global_step": 170651, "epoch": 1015} {"train_loss": -10.846029281616211, "global_step": 170652, "epoch": 1015} {"train_loss": -11.09656047821045, "global_step": 170653, "epoch": 1015} {"train_loss": -10.960972785949707, "global_step": 170654, "epoch": 1015} {"train_loss": -10.998800277709961, "global_step": 170655, "epoch": 1015} {"train_loss": -10.939552307128906, "global_step": 170656, "epoch": 1015} {"train_loss": -11.094734191894531, "global_step": 170657, "epoch": 1015} {"train_loss": -10.817839622497559, "global_step": 170658, "epoch": 1015} {"train_loss": -10.963705062866211, "global_step": 170659, "epoch": 1015} {"train_loss": -11.114728927612305, "global_step": 170660, "epoch": 1015} {"train_loss": -10.945348739624023, "global_step": 170661, "epoch": 1015} {"train_loss": -11.06224250793457, "global_step": 170662, "epoch": 1015} {"train_loss": -11.18075942993164, "global_step": 170663, "epoch": 1015} {"train_loss": -11.22899055480957, "global_step": 170664, "epoch": 1015} {"train_loss": -11.142723083496094, "global_step": 170665, "epoch": 1015} {"train_loss": -11.160274505615234, "global_step": 170666, "epoch": 1015} {"train_loss": -11.24547004699707, "global_step": 170667, "epoch": 1015} {"train_loss": -11.265584945678711, "global_step": 170668, "epoch": 1015} {"train_loss": -11.091071128845215, "global_step": 170669, "epoch": 1015} {"train_loss": -11.187174797058105, "global_step": 170670, "epoch": 1015} {"train_loss": -11.14753246307373, "global_step": 170671, "epoch": 1015} {"train_loss": -11.101320266723633, "global_step": 170672, "epoch": 1015} {"train_loss": -11.311595916748047, "global_step": 170673, "epoch": 1015} {"train_loss": -11.207789421081543, "global_step": 170674, "epoch": 1015} {"train_loss": -11.10461711883545, "global_step": 170675, "epoch": 1015} {"train_loss": -11.255322456359863, "global_step": 170676, "epoch": 1015} {"train_loss": -10.909454345703125, "global_step": 170677, "epoch": 1015} {"train_loss": -11.51722526550293, "global_step": 170678, "epoch": 1015} {"train_loss": -10.944295883178711, "global_step": 170679, "epoch": 1015} {"train_loss": -11.326460838317871, "global_step": 170680, "epoch": 1015} {"train_loss": -10.919054985046387, "global_step": 170681, "epoch": 1015} {"train_loss": -11.185628890991211, "global_step": 170682, "epoch": 1015} {"train_loss": -11.138065338134766, "global_step": 170683, "epoch": 1015} {"train_loss": -11.337228775024414, "global_step": 170684, "epoch": 1015} {"train_loss": -11.071802139282227, "global_step": 170685, "epoch": 1015} {"train_loss": -11.180364608764648, "global_step": 170686, "epoch": 1015} {"train_loss": -10.878188343275161, "global_step": 170687, "epoch": 1015, "val_loss": 239235.84375, "train_action_mse_error": 1.4173940420150757} {"train_loss": -11.164742469787598, "global_step": 170688, "epoch": 1016} {"train_loss": -11.342626571655273, "global_step": 170689, "epoch": 1016} {"train_loss": -11.109870910644531, "global_step": 170690, "epoch": 1016} {"train_loss": -11.31740665435791, "global_step": 170691, "epoch": 1016} {"train_loss": -11.268556594848633, "global_step": 170692, "epoch": 1016} {"train_loss": -11.20516586303711, "global_step": 170693, "epoch": 1016} {"train_loss": -11.332244873046875, "global_step": 170694, "epoch": 1016} {"train_loss": -11.310303688049316, "global_step": 170695, "epoch": 1016} {"train_loss": -11.381464004516602, "global_step": 170696, "epoch": 1016} {"train_loss": -11.571200370788574, "global_step": 170697, "epoch": 1016} {"train_loss": -11.399848937988281, "global_step": 170698, "epoch": 1016} {"train_loss": -11.166181564331055, "global_step": 170699, "epoch": 1016} {"train_loss": -11.49322509765625, "global_step": 170700, "epoch": 1016} {"train_loss": -11.439068794250488, "global_step": 170701, "epoch": 1016} {"train_loss": -11.068968772888184, "global_step": 170702, "epoch": 1016} {"train_loss": -11.127761840820312, "global_step": 170703, "epoch": 1016} {"train_loss": -11.467541694641113, "global_step": 170704, "epoch": 1016} {"train_loss": -11.237009048461914, "global_step": 170705, "epoch": 1016} {"train_loss": -11.444311141967773, "global_step": 170706, "epoch": 1016} {"train_loss": -10.93674087524414, "global_step": 170707, "epoch": 1016} {"train_loss": -10.661861419677734, "global_step": 170708, "epoch": 1016} {"train_loss": -11.389801025390625, "global_step": 170709, "epoch": 1016} {"train_loss": -10.9342041015625, "global_step": 170710, "epoch": 1016} {"train_loss": -10.687143325805664, "global_step": 170711, "epoch": 1016} {"train_loss": -10.776769638061523, "global_step": 170712, "epoch": 1016} {"train_loss": -10.971155166625977, "global_step": 170713, "epoch": 1016} {"train_loss": -10.602168083190918, "global_step": 170714, "epoch": 1016} {"train_loss": -10.86354923248291, "global_step": 170715, "epoch": 1016} {"train_loss": -10.792760848999023, "global_step": 170716, "epoch": 1016} {"train_loss": -10.796030044555664, "global_step": 170717, "epoch": 1016} {"train_loss": -10.697490692138672, "global_step": 170718, "epoch": 1016} {"train_loss": -10.78764533996582, "global_step": 170719, "epoch": 1016} {"train_loss": -10.87480640411377, "global_step": 170720, "epoch": 1016} {"train_loss": -10.896330833435059, "global_step": 170721, "epoch": 1016} {"train_loss": -10.784078598022461, "global_step": 170722, "epoch": 1016} {"train_loss": -10.661819458007812, "global_step": 170723, "epoch": 1016} {"train_loss": -11.078412055969238, "global_step": 170724, "epoch": 1016} {"train_loss": -10.611186981201172, "global_step": 170725, "epoch": 1016} {"train_loss": -10.2278413772583, "global_step": 170726, "epoch": 1016} {"train_loss": -10.775690078735352, "global_step": 170727, "epoch": 1016} {"train_loss": -10.893848419189453, "global_step": 170728, "epoch": 1016} {"train_loss": -10.46584701538086, "global_step": 170729, "epoch": 1016} {"train_loss": -10.653003692626953, "global_step": 170730, "epoch": 1016} {"train_loss": -10.825350761413574, "global_step": 170731, "epoch": 1016} {"train_loss": -10.387625694274902, "global_step": 170732, "epoch": 1016} {"train_loss": -10.517478942871094, "global_step": 170733, "epoch": 1016} {"train_loss": -10.497058868408203, "global_step": 170734, "epoch": 1016} {"train_loss": -9.951332092285156, "global_step": 170735, "epoch": 1016} {"train_loss": -10.93028450012207, "global_step": 170736, "epoch": 1016} {"train_loss": -9.796613693237305, "global_step": 170737, "epoch": 1016} {"train_loss": -10.420452117919922, "global_step": 170738, "epoch": 1016} {"train_loss": -9.958145141601562, "global_step": 170739, "epoch": 1016} {"train_loss": -10.341278076171875, "global_step": 170740, "epoch": 1016} {"train_loss": -10.12276840209961, "global_step": 170741, "epoch": 1016} {"train_loss": -10.332828521728516, "global_step": 170742, "epoch": 1016} {"train_loss": -10.597723007202148, "global_step": 170743, "epoch": 1016} {"train_loss": -10.221763610839844, "global_step": 170744, "epoch": 1016} {"train_loss": -10.55929946899414, "global_step": 170745, "epoch": 1016} {"train_loss": -10.23274040222168, "global_step": 170746, "epoch": 1016} {"train_loss": -10.807147026062012, "global_step": 170747, "epoch": 1016} {"train_loss": -10.246740341186523, "global_step": 170748, "epoch": 1016} {"train_loss": -10.683581352233887, "global_step": 170749, "epoch": 1016} {"train_loss": -10.770668029785156, "global_step": 170750, "epoch": 1016} {"train_loss": -9.90850830078125, "global_step": 170751, "epoch": 1016} {"train_loss": -10.844097137451172, "global_step": 170752, "epoch": 1016} {"train_loss": -10.56814193725586, "global_step": 170753, "epoch": 1016} {"train_loss": -10.54992389678955, "global_step": 170754, "epoch": 1016} {"train_loss": -10.656379699707031, "global_step": 170755, "epoch": 1016} {"train_loss": -10.815532684326172, "global_step": 170756, "epoch": 1016} {"train_loss": -10.490567207336426, "global_step": 170757, "epoch": 1016} {"train_loss": -11.035072326660156, "global_step": 170758, "epoch": 1016} {"train_loss": -10.929756164550781, "global_step": 170759, "epoch": 1016} {"train_loss": -10.910041809082031, "global_step": 170760, "epoch": 1016} {"train_loss": -10.763866424560547, "global_step": 170761, "epoch": 1016} {"train_loss": -11.15601634979248, "global_step": 170762, "epoch": 1016} {"train_loss": -10.828386306762695, "global_step": 170763, "epoch": 1016} {"train_loss": -10.950467109680176, "global_step": 170764, "epoch": 1016} {"train_loss": -10.958712577819824, "global_step": 170765, "epoch": 1016} {"train_loss": -11.115753173828125, "global_step": 170766, "epoch": 1016} {"train_loss": -10.969850540161133, "global_step": 170767, "epoch": 1016} {"train_loss": -11.054159164428711, "global_step": 170768, "epoch": 1016} {"train_loss": -10.917048454284668, "global_step": 170769, "epoch": 1016} {"train_loss": -10.999138832092285, "global_step": 170770, "epoch": 1016} {"train_loss": -10.70168399810791, "global_step": 170771, "epoch": 1016} {"train_loss": -11.160945892333984, "global_step": 170772, "epoch": 1016} {"train_loss": -10.559807777404785, "global_step": 170773, "epoch": 1016} {"train_loss": -11.157217025756836, "global_step": 170774, "epoch": 1016} {"train_loss": -11.064268112182617, "global_step": 170775, "epoch": 1016} {"train_loss": -11.188183784484863, "global_step": 170776, "epoch": 1016} {"train_loss": -10.941997528076172, "global_step": 170777, "epoch": 1016} {"train_loss": -11.050359725952148, "global_step": 170778, "epoch": 1016} {"train_loss": -10.829717636108398, "global_step": 170779, "epoch": 1016} {"train_loss": -11.073261260986328, "global_step": 170780, "epoch": 1016} {"train_loss": -10.992166519165039, "global_step": 170781, "epoch": 1016} {"train_loss": -11.147823333740234, "global_step": 170782, "epoch": 1016} {"train_loss": -11.178239822387695, "global_step": 170783, "epoch": 1016} {"train_loss": -10.875646591186523, "global_step": 170784, "epoch": 1016} {"train_loss": -11.30780029296875, "global_step": 170785, "epoch": 1016} {"train_loss": -11.186132431030273, "global_step": 170786, "epoch": 1016} {"train_loss": -11.16583251953125, "global_step": 170787, "epoch": 1016} {"train_loss": -11.338418960571289, "global_step": 170788, "epoch": 1016} {"train_loss": -11.229406356811523, "global_step": 170789, "epoch": 1016} {"train_loss": -11.249383926391602, "global_step": 170790, "epoch": 1016} {"train_loss": -11.387995719909668, "global_step": 170791, "epoch": 1016} {"train_loss": -11.224610328674316, "global_step": 170792, "epoch": 1016} {"train_loss": -11.441604614257812, "global_step": 170793, "epoch": 1016} {"train_loss": -11.419194221496582, "global_step": 170794, "epoch": 1016} {"train_loss": -11.332853317260742, "global_step": 170795, "epoch": 1016} {"train_loss": -11.305376052856445, "global_step": 170796, "epoch": 1016} {"train_loss": -11.319742202758789, "global_step": 170797, "epoch": 1016} {"train_loss": -11.248392105102539, "global_step": 170798, "epoch": 1016} {"train_loss": -11.330814361572266, "global_step": 170799, "epoch": 1016} {"train_loss": -11.356430053710938, "global_step": 170800, "epoch": 1016} {"train_loss": -11.423103332519531, "global_step": 170801, "epoch": 1016} {"train_loss": -11.184395790100098, "global_step": 170802, "epoch": 1016} {"train_loss": -11.362984657287598, "global_step": 170803, "epoch": 1016} {"train_loss": -11.454826354980469, "global_step": 170804, "epoch": 1016} {"train_loss": -11.37628173828125, "global_step": 170805, "epoch": 1016} {"train_loss": -11.383451461791992, "global_step": 170806, "epoch": 1016} {"train_loss": -11.350914001464844, "global_step": 170807, "epoch": 1016} {"train_loss": -11.278203964233398, "global_step": 170808, "epoch": 1016} {"train_loss": -11.519784927368164, "global_step": 170809, "epoch": 1016} {"train_loss": -11.226032257080078, "global_step": 170810, "epoch": 1016} {"train_loss": -11.354814529418945, "global_step": 170811, "epoch": 1016} {"train_loss": -11.39831829071045, "global_step": 170812, "epoch": 1016} {"train_loss": -11.164566993713379, "global_step": 170813, "epoch": 1016} {"train_loss": -11.365884780883789, "global_step": 170814, "epoch": 1016} {"train_loss": -11.35440731048584, "global_step": 170815, "epoch": 1016} {"train_loss": -11.278983116149902, "global_step": 170816, "epoch": 1016} {"train_loss": -11.271587371826172, "global_step": 170817, "epoch": 1016} {"train_loss": -11.284384727478027, "global_step": 170818, "epoch": 1016} {"train_loss": -11.120986938476562, "global_step": 170819, "epoch": 1016} {"train_loss": -11.112117767333984, "global_step": 170820, "epoch": 1016} {"train_loss": -11.34771728515625, "global_step": 170821, "epoch": 1016} {"train_loss": -11.374300956726074, "global_step": 170822, "epoch": 1016} {"train_loss": -11.031177520751953, "global_step": 170823, "epoch": 1016} {"train_loss": -11.504936218261719, "global_step": 170824, "epoch": 1016} {"train_loss": -11.367847442626953, "global_step": 170825, "epoch": 1016} {"train_loss": -11.497759819030762, "global_step": 170826, "epoch": 1016} {"train_loss": -11.353172302246094, "global_step": 170827, "epoch": 1016} {"train_loss": -11.171751976013184, "global_step": 170828, "epoch": 1016} {"train_loss": -11.152294158935547, "global_step": 170829, "epoch": 1016} {"train_loss": -11.483259201049805, "global_step": 170830, "epoch": 1016} {"train_loss": -11.387467384338379, "global_step": 170831, "epoch": 1016} {"train_loss": -11.099024772644043, "global_step": 170832, "epoch": 1016} {"train_loss": -11.073837280273438, "global_step": 170833, "epoch": 1016} {"train_loss": -10.854856491088867, "global_step": 170834, "epoch": 1016} {"train_loss": -10.817479133605957, "global_step": 170835, "epoch": 1016} {"train_loss": -11.157869338989258, "global_step": 170836, "epoch": 1016} {"train_loss": -10.897940635681152, "global_step": 170837, "epoch": 1016} {"train_loss": -10.990008354187012, "global_step": 170838, "epoch": 1016} {"train_loss": -10.516681671142578, "global_step": 170839, "epoch": 1016} {"train_loss": -10.615534782409668, "global_step": 170840, "epoch": 1016} {"train_loss": -11.314974784851074, "global_step": 170841, "epoch": 1016} {"train_loss": -9.692587852478027, "global_step": 170842, "epoch": 1016} {"train_loss": -8.842620849609375, "global_step": 170843, "epoch": 1016} {"train_loss": -10.660820007324219, "global_step": 170844, "epoch": 1016} {"train_loss": -6.669835567474365, "global_step": 170845, "epoch": 1016} {"train_loss": -9.872690200805664, "global_step": 170846, "epoch": 1016} {"train_loss": -6.314117431640625, "global_step": 170847, "epoch": 1016} {"train_loss": -7.443865776062012, "global_step": 170848, "epoch": 1016} {"train_loss": -8.261556625366211, "global_step": 170849, "epoch": 1016} {"train_loss": -7.369891166687012, "global_step": 170850, "epoch": 1016} {"train_loss": -9.691253662109375, "global_step": 170851, "epoch": 1016} {"train_loss": -8.16057014465332, "global_step": 170852, "epoch": 1016} {"train_loss": -10.038782119750977, "global_step": 170853, "epoch": 1016} {"train_loss": -9.765059471130371, "global_step": 170854, "epoch": 1016} {"train_loss": -10.809272388617197, "global_step": 170855, "epoch": 1016, "val_loss": 231997.765625} {"train_loss": -10.228822708129883, "global_step": 170856, "epoch": 1017} {"train_loss": -10.336359024047852, "global_step": 170857, "epoch": 1017} {"train_loss": -9.992948532104492, "global_step": 170858, "epoch": 1017} {"train_loss": -10.36562442779541, "global_step": 170859, "epoch": 1017} {"train_loss": -10.567886352539062, "global_step": 170860, "epoch": 1017} {"train_loss": -10.331478118896484, "global_step": 170861, "epoch": 1017} {"train_loss": -10.17401123046875, "global_step": 170862, "epoch": 1017} {"train_loss": -10.638301849365234, "global_step": 170863, "epoch": 1017} {"train_loss": -9.991857528686523, "global_step": 170864, "epoch": 1017} {"train_loss": -10.453286170959473, "global_step": 170865, "epoch": 1017} {"train_loss": -10.554698944091797, "global_step": 170866, "epoch": 1017} {"train_loss": -10.149581909179688, "global_step": 170867, "epoch": 1017} {"train_loss": -10.620573043823242, "global_step": 170868, "epoch": 1017} {"train_loss": -10.505626678466797, "global_step": 170869, "epoch": 1017} {"train_loss": -10.497408866882324, "global_step": 170870, "epoch": 1017} {"train_loss": -10.693327903747559, "global_step": 170871, "epoch": 1017} {"train_loss": -10.69778823852539, "global_step": 170872, "epoch": 1017} {"train_loss": -10.610885620117188, "global_step": 170873, "epoch": 1017} {"train_loss": -10.573901176452637, "global_step": 170874, "epoch": 1017} {"train_loss": -10.654293060302734, "global_step": 170875, "epoch": 1017} {"train_loss": -10.668821334838867, "global_step": 170876, "epoch": 1017} {"train_loss": -10.840639114379883, "global_step": 170877, "epoch": 1017} {"train_loss": -10.834928512573242, "global_step": 170878, "epoch": 1017} {"train_loss": -10.550036430358887, "global_step": 170879, "epoch": 1017} {"train_loss": -10.946115493774414, "global_step": 170880, "epoch": 1017} {"train_loss": -10.930749893188477, "global_step": 170881, "epoch": 1017} {"train_loss": -10.819413185119629, "global_step": 170882, "epoch": 1017} {"train_loss": -10.749639511108398, "global_step": 170883, "epoch": 1017} {"train_loss": -11.013493537902832, "global_step": 170884, "epoch": 1017} {"train_loss": -10.815461158752441, "global_step": 170885, "epoch": 1017} {"train_loss": -10.875821113586426, "global_step": 170886, "epoch": 1017} {"train_loss": -10.645615577697754, "global_step": 170887, "epoch": 1017} {"train_loss": -10.709360122680664, "global_step": 170888, "epoch": 1017} {"train_loss": -10.841343879699707, "global_step": 170889, "epoch": 1017} {"train_loss": -10.930432319641113, "global_step": 170890, "epoch": 1017} {"train_loss": -11.171531677246094, "global_step": 170891, "epoch": 1017} {"train_loss": -10.966226577758789, "global_step": 170892, "epoch": 1017} {"train_loss": -10.865302085876465, "global_step": 170893, "epoch": 1017} {"train_loss": -10.844520568847656, "global_step": 170894, "epoch": 1017} {"train_loss": -11.067164421081543, "global_step": 170895, "epoch": 1017} {"train_loss": -11.027063369750977, "global_step": 170896, "epoch": 1017} {"train_loss": -11.27119255065918, "global_step": 170897, "epoch": 1017} {"train_loss": -10.832451820373535, "global_step": 170898, "epoch": 1017} {"train_loss": -11.191129684448242, "global_step": 170899, "epoch": 1017} {"train_loss": -11.02098274230957, "global_step": 170900, "epoch": 1017} {"train_loss": -11.013847351074219, "global_step": 170901, "epoch": 1017} {"train_loss": -10.935032844543457, "global_step": 170902, "epoch": 1017} {"train_loss": -10.977275848388672, "global_step": 170903, "epoch": 1017} {"train_loss": -11.105295181274414, "global_step": 170904, "epoch": 1017} {"train_loss": -11.095114707946777, "global_step": 170905, "epoch": 1017} {"train_loss": -11.126022338867188, "global_step": 170906, "epoch": 1017} {"train_loss": -11.056119918823242, "global_step": 170907, "epoch": 1017} {"train_loss": -11.064620971679688, "global_step": 170908, "epoch": 1017} {"train_loss": -11.168313980102539, "global_step": 170909, "epoch": 1017} {"train_loss": -11.284097671508789, "global_step": 170910, "epoch": 1017} {"train_loss": -11.279645919799805, "global_step": 170911, "epoch": 1017} {"train_loss": -11.003385543823242, "global_step": 170912, "epoch": 1017} {"train_loss": -11.051168441772461, "global_step": 170913, "epoch": 1017} {"train_loss": -11.085443496704102, "global_step": 170914, "epoch": 1017} {"train_loss": -10.979299545288086, "global_step": 170915, "epoch": 1017} {"train_loss": -11.17300033569336, "global_step": 170916, "epoch": 1017} {"train_loss": -11.144037246704102, "global_step": 170917, "epoch": 1017} {"train_loss": -10.968377113342285, "global_step": 170918, "epoch": 1017} {"train_loss": -11.133342742919922, "global_step": 170919, "epoch": 1017} {"train_loss": -11.343522071838379, "global_step": 170920, "epoch": 1017} {"train_loss": -11.146519660949707, "global_step": 170921, "epoch": 1017} {"train_loss": -11.050804138183594, "global_step": 170922, "epoch": 1017} {"train_loss": -11.16240119934082, "global_step": 170923, "epoch": 1017} {"train_loss": -10.787797927856445, "global_step": 170924, "epoch": 1017} {"train_loss": -10.948002815246582, "global_step": 170925, "epoch": 1017} {"train_loss": -11.311223030090332, "global_step": 170926, "epoch": 1017} {"train_loss": -11.28648567199707, "global_step": 170927, "epoch": 1017} {"train_loss": -10.929924011230469, "global_step": 170928, "epoch": 1017} {"train_loss": -11.099483489990234, "global_step": 170929, "epoch": 1017} {"train_loss": -11.510319709777832, "global_step": 170930, "epoch": 1017} {"train_loss": -11.146930694580078, "global_step": 170931, "epoch": 1017} {"train_loss": -11.269889831542969, "global_step": 170932, "epoch": 1017} {"train_loss": -11.214751243591309, "global_step": 170933, "epoch": 1017} {"train_loss": -11.28297233581543, "global_step": 170934, "epoch": 1017} {"train_loss": -11.423080444335938, "global_step": 170935, "epoch": 1017} {"train_loss": -11.320333480834961, "global_step": 170936, "epoch": 1017} {"train_loss": -11.538010597229004, "global_step": 170937, "epoch": 1017} {"train_loss": -11.339982032775879, "global_step": 170938, "epoch": 1017} {"train_loss": -11.509075164794922, "global_step": 170939, "epoch": 1017} {"train_loss": -11.197296142578125, "global_step": 170940, "epoch": 1017} {"train_loss": -11.448918342590332, "global_step": 170941, "epoch": 1017} {"train_loss": -11.47993278503418, "global_step": 170942, "epoch": 1017} {"train_loss": -11.239866256713867, "global_step": 170943, "epoch": 1017} {"train_loss": -11.455202102661133, "global_step": 170944, "epoch": 1017} {"train_loss": -11.237688064575195, "global_step": 170945, "epoch": 1017} {"train_loss": -11.378129005432129, "global_step": 170946, "epoch": 1017} {"train_loss": -11.366104125976562, "global_step": 170947, "epoch": 1017} {"train_loss": -11.150918960571289, "global_step": 170948, "epoch": 1017} {"train_loss": -11.152475357055664, "global_step": 170949, "epoch": 1017} {"train_loss": -10.834052085876465, "global_step": 170950, "epoch": 1017} {"train_loss": -10.923667907714844, "global_step": 170951, "epoch": 1017} {"train_loss": -11.320108413696289, "global_step": 170952, "epoch": 1017} {"train_loss": -10.702240943908691, "global_step": 170953, "epoch": 1017} {"train_loss": -10.794081687927246, "global_step": 170954, "epoch": 1017} {"train_loss": -11.173600196838379, "global_step": 170955, "epoch": 1017} {"train_loss": -11.248913764953613, "global_step": 170956, "epoch": 1017} {"train_loss": -11.280797004699707, "global_step": 170957, "epoch": 1017} {"train_loss": -11.265365600585938, "global_step": 170958, "epoch": 1017} {"train_loss": -10.936002731323242, "global_step": 170959, "epoch": 1017} {"train_loss": -11.0114107131958, "global_step": 170960, "epoch": 1017} {"train_loss": -11.333081245422363, "global_step": 170961, "epoch": 1017} {"train_loss": -11.099893569946289, "global_step": 170962, "epoch": 1017} {"train_loss": -10.970139503479004, "global_step": 170963, "epoch": 1017} {"train_loss": -11.163370132446289, "global_step": 170964, "epoch": 1017} {"train_loss": -10.501489639282227, "global_step": 170965, "epoch": 1017} {"train_loss": -11.258973121643066, "global_step": 170966, "epoch": 1017} {"train_loss": -10.786136627197266, "global_step": 170967, "epoch": 1017} {"train_loss": -10.787737846374512, "global_step": 170968, "epoch": 1017} {"train_loss": -10.632551193237305, "global_step": 170969, "epoch": 1017} {"train_loss": -11.399234771728516, "global_step": 170970, "epoch": 1017} {"train_loss": -10.911934852600098, "global_step": 170971, "epoch": 1017} {"train_loss": -11.085271835327148, "global_step": 170972, "epoch": 1017} {"train_loss": -11.193907737731934, "global_step": 170973, "epoch": 1017} {"train_loss": -11.174015998840332, "global_step": 170974, "epoch": 1017} {"train_loss": -9.816651344299316, "global_step": 170975, "epoch": 1017} {"train_loss": -10.504865646362305, "global_step": 170976, "epoch": 1017} {"train_loss": -10.927871704101562, "global_step": 170977, "epoch": 1017} {"train_loss": -10.751766204833984, "global_step": 170978, "epoch": 1017} {"train_loss": -11.173646926879883, "global_step": 170979, "epoch": 1017} {"train_loss": -10.832133293151855, "global_step": 170980, "epoch": 1017} {"train_loss": -10.939014434814453, "global_step": 170981, "epoch": 1017} {"train_loss": -11.317229270935059, "global_step": 170982, "epoch": 1017} {"train_loss": -10.987530708312988, "global_step": 170983, "epoch": 1017} {"train_loss": -11.154516220092773, "global_step": 170984, "epoch": 1017} {"train_loss": -11.035534858703613, "global_step": 170985, "epoch": 1017} {"train_loss": -11.03116226196289, "global_step": 170986, "epoch": 1017} {"train_loss": -11.145578384399414, "global_step": 170987, "epoch": 1017} {"train_loss": -11.213305473327637, "global_step": 170988, "epoch": 1017} {"train_loss": -11.063630104064941, "global_step": 170989, "epoch": 1017} {"train_loss": -11.088651657104492, "global_step": 170990, "epoch": 1017} {"train_loss": -11.21308708190918, "global_step": 170991, "epoch": 1017} {"train_loss": -10.82901382446289, "global_step": 170992, "epoch": 1017} {"train_loss": -11.241813659667969, "global_step": 170993, "epoch": 1017} {"train_loss": -11.027320861816406, "global_step": 170994, "epoch": 1017} {"train_loss": -10.812774658203125, "global_step": 170995, "epoch": 1017} {"train_loss": -10.910874366760254, "global_step": 170996, "epoch": 1017} {"train_loss": -10.199159622192383, "global_step": 170997, "epoch": 1017} {"train_loss": -9.403371810913086, "global_step": 170998, "epoch": 1017} {"train_loss": -10.47469711303711, "global_step": 170999, "epoch": 1017} {"train_loss": -10.87038803100586, "global_step": 171000, "epoch": 1017} {"train_loss": -10.025367736816406, "global_step": 171001, "epoch": 1017} {"train_loss": -10.970989227294922, "global_step": 171002, "epoch": 1017} {"train_loss": -10.427725791931152, "global_step": 171003, "epoch": 1017} {"train_loss": -10.975555419921875, "global_step": 171004, "epoch": 1017} {"train_loss": -10.656312942504883, "global_step": 171005, "epoch": 1017} {"train_loss": -10.935354232788086, "global_step": 171006, "epoch": 1017} {"train_loss": -10.539495468139648, "global_step": 171007, "epoch": 1017} {"train_loss": -10.911540031433105, "global_step": 171008, "epoch": 1017} {"train_loss": -10.817678451538086, "global_step": 171009, "epoch": 1017} {"train_loss": -10.818467140197754, "global_step": 171010, "epoch": 1017} {"train_loss": -10.98705005645752, "global_step": 171011, "epoch": 1017} {"train_loss": -11.047131538391113, "global_step": 171012, "epoch": 1017} {"train_loss": -10.567829132080078, "global_step": 171013, "epoch": 1017} {"train_loss": -11.115111351013184, "global_step": 171014, "epoch": 1017} {"train_loss": -10.999580383300781, "global_step": 171015, "epoch": 1017} {"train_loss": -11.217029571533203, "global_step": 171016, "epoch": 1017} {"train_loss": -10.936141014099121, "global_step": 171017, "epoch": 1017} {"train_loss": -10.960546493530273, "global_step": 171018, "epoch": 1017} {"train_loss": -11.209997177124023, "global_step": 171019, "epoch": 1017} {"train_loss": -10.986689567565918, "global_step": 171020, "epoch": 1017} {"train_loss": -10.888429641723633, "global_step": 171021, "epoch": 1017} {"train_loss": -11.144024848937988, "global_step": 171022, "epoch": 1017} {"train_loss": -10.935810367266336, "global_step": 171023, "epoch": 1017, "val_loss": 235296.109375} {"train_loss": -10.887551307678223, "global_step": 171024, "epoch": 1018} {"train_loss": -11.269362449645996, "global_step": 171025, "epoch": 1018} {"train_loss": -11.138311386108398, "global_step": 171026, "epoch": 1018} {"train_loss": -11.084348678588867, "global_step": 171027, "epoch": 1018} {"train_loss": -11.098368644714355, "global_step": 171028, "epoch": 1018} {"train_loss": -11.243518829345703, "global_step": 171029, "epoch": 1018} {"train_loss": -10.89283561706543, "global_step": 171030, "epoch": 1018} {"train_loss": -11.24110221862793, "global_step": 171031, "epoch": 1018} {"train_loss": -10.859621047973633, "global_step": 171032, "epoch": 1018} {"train_loss": -11.301887512207031, "global_step": 171033, "epoch": 1018} {"train_loss": -10.830303192138672, "global_step": 171034, "epoch": 1018} {"train_loss": -11.258164405822754, "global_step": 171035, "epoch": 1018} {"train_loss": -11.222556114196777, "global_step": 171036, "epoch": 1018} {"train_loss": -10.871010780334473, "global_step": 171037, "epoch": 1018} {"train_loss": -11.34204387664795, "global_step": 171038, "epoch": 1018} {"train_loss": -10.6031494140625, "global_step": 171039, "epoch": 1018} {"train_loss": -11.116548538208008, "global_step": 171040, "epoch": 1018} {"train_loss": -10.933242797851562, "global_step": 171041, "epoch": 1018} {"train_loss": -10.782855987548828, "global_step": 171042, "epoch": 1018} {"train_loss": -11.248868942260742, "global_step": 171043, "epoch": 1018} {"train_loss": -11.07415771484375, "global_step": 171044, "epoch": 1018} {"train_loss": -11.097677230834961, "global_step": 171045, "epoch": 1018} {"train_loss": -11.320024490356445, "global_step": 171046, "epoch": 1018} {"train_loss": -11.008365631103516, "global_step": 171047, "epoch": 1018} {"train_loss": -11.053987503051758, "global_step": 171048, "epoch": 1018} {"train_loss": -10.943159103393555, "global_step": 171049, "epoch": 1018} {"train_loss": -10.734151840209961, "global_step": 171050, "epoch": 1018} {"train_loss": -11.237014770507812, "global_step": 171051, "epoch": 1018} {"train_loss": -10.877337455749512, "global_step": 171052, "epoch": 1018} {"train_loss": -11.028703689575195, "global_step": 171053, "epoch": 1018} {"train_loss": -10.789726257324219, "global_step": 171054, "epoch": 1018} {"train_loss": -10.978715896606445, "global_step": 171055, "epoch": 1018} {"train_loss": -10.984594345092773, "global_step": 171056, "epoch": 1018} {"train_loss": -11.227680206298828, "global_step": 171057, "epoch": 1018} {"train_loss": -11.391193389892578, "global_step": 171058, "epoch": 1018} {"train_loss": -11.162824630737305, "global_step": 171059, "epoch": 1018} {"train_loss": -11.352763175964355, "global_step": 171060, "epoch": 1018} {"train_loss": -11.240079879760742, "global_step": 171061, "epoch": 1018} {"train_loss": -11.520329475402832, "global_step": 171062, "epoch": 1018} {"train_loss": -10.871538162231445, "global_step": 171063, "epoch": 1018} {"train_loss": -10.775165557861328, "global_step": 171064, "epoch": 1018} {"train_loss": -11.011909484863281, "global_step": 171065, "epoch": 1018} {"train_loss": -10.71933364868164, "global_step": 171066, "epoch": 1018} {"train_loss": -10.770870208740234, "global_step": 171067, "epoch": 1018} {"train_loss": -10.818217277526855, "global_step": 171068, "epoch": 1018} {"train_loss": -10.812566757202148, "global_step": 171069, "epoch": 1018} {"train_loss": -10.756455421447754, "global_step": 171070, "epoch": 1018} {"train_loss": -10.71319580078125, "global_step": 171071, "epoch": 1018} {"train_loss": -10.804073333740234, "global_step": 171072, "epoch": 1018} {"train_loss": -11.117044448852539, "global_step": 171073, "epoch": 1018} {"train_loss": -10.785420417785645, "global_step": 171074, "epoch": 1018} {"train_loss": -11.10749340057373, "global_step": 171075, "epoch": 1018} {"train_loss": -10.689414978027344, "global_step": 171076, "epoch": 1018} {"train_loss": -10.602252006530762, "global_step": 171077, "epoch": 1018} {"train_loss": -10.810445785522461, "global_step": 171078, "epoch": 1018} {"train_loss": -10.74130630493164, "global_step": 171079, "epoch": 1018} {"train_loss": -11.099885940551758, "global_step": 171080, "epoch": 1018} {"train_loss": -10.76317024230957, "global_step": 171081, "epoch": 1018} {"train_loss": -10.99457836151123, "global_step": 171082, "epoch": 1018} {"train_loss": -11.109475135803223, "global_step": 171083, "epoch": 1018} {"train_loss": -11.008185386657715, "global_step": 171084, "epoch": 1018} {"train_loss": -10.806456565856934, "global_step": 171085, "epoch": 1018} {"train_loss": -10.997945785522461, "global_step": 171086, "epoch": 1018} {"train_loss": -10.779363632202148, "global_step": 171087, "epoch": 1018} {"train_loss": -11.007207870483398, "global_step": 171088, "epoch": 1018} {"train_loss": -10.98236083984375, "global_step": 171089, "epoch": 1018} {"train_loss": -10.702934265136719, "global_step": 171090, "epoch": 1018} {"train_loss": -11.219465255737305, "global_step": 171091, "epoch": 1018} {"train_loss": -10.804384231567383, "global_step": 171092, "epoch": 1018} {"train_loss": -10.69101333618164, "global_step": 171093, "epoch": 1018} {"train_loss": -11.391180992126465, "global_step": 171094, "epoch": 1018} {"train_loss": -11.062859535217285, "global_step": 171095, "epoch": 1018} {"train_loss": -11.031210899353027, "global_step": 171096, "epoch": 1018} {"train_loss": -11.119564056396484, "global_step": 171097, "epoch": 1018} {"train_loss": -11.168842315673828, "global_step": 171098, "epoch": 1018} {"train_loss": -10.880439758300781, "global_step": 171099, "epoch": 1018} {"train_loss": -11.020132064819336, "global_step": 171100, "epoch": 1018} {"train_loss": -10.540947914123535, "global_step": 171101, "epoch": 1018} {"train_loss": -10.47586441040039, "global_step": 171102, "epoch": 1018} {"train_loss": -10.967700004577637, "global_step": 171103, "epoch": 1018} {"train_loss": -9.99409008026123, "global_step": 171104, "epoch": 1018} {"train_loss": -11.235400199890137, "global_step": 171105, "epoch": 1018} {"train_loss": -10.506333351135254, "global_step": 171106, "epoch": 1018} {"train_loss": -10.603267669677734, "global_step": 171107, "epoch": 1018} {"train_loss": -11.075305938720703, "global_step": 171108, "epoch": 1018} {"train_loss": -10.64675521850586, "global_step": 171109, "epoch": 1018} {"train_loss": -10.867103576660156, "global_step": 171110, "epoch": 1018} {"train_loss": -10.910956382751465, "global_step": 171111, "epoch": 1018} {"train_loss": -10.940055847167969, "global_step": 171112, "epoch": 1018} {"train_loss": -11.13170051574707, "global_step": 171113, "epoch": 1018} {"train_loss": -10.883377075195312, "global_step": 171114, "epoch": 1018} {"train_loss": -11.026571273803711, "global_step": 171115, "epoch": 1018} {"train_loss": -11.134628295898438, "global_step": 171116, "epoch": 1018} {"train_loss": -11.05084228515625, "global_step": 171117, "epoch": 1018} {"train_loss": -11.21853256225586, "global_step": 171118, "epoch": 1018} {"train_loss": -11.104019165039062, "global_step": 171119, "epoch": 1018} {"train_loss": -11.040451049804688, "global_step": 171120, "epoch": 1018} {"train_loss": -11.230987548828125, "global_step": 171121, "epoch": 1018} {"train_loss": -11.248054504394531, "global_step": 171122, "epoch": 1018} {"train_loss": -11.106576919555664, "global_step": 171123, "epoch": 1018} {"train_loss": -11.374740600585938, "global_step": 171124, "epoch": 1018} {"train_loss": -11.173044204711914, "global_step": 171125, "epoch": 1018} {"train_loss": -11.253576278686523, "global_step": 171126, "epoch": 1018} {"train_loss": -11.281829833984375, "global_step": 171127, "epoch": 1018} {"train_loss": -11.418069839477539, "global_step": 171128, "epoch": 1018} {"train_loss": -11.341676712036133, "global_step": 171129, "epoch": 1018} {"train_loss": -11.313379287719727, "global_step": 171130, "epoch": 1018} {"train_loss": -11.022153854370117, "global_step": 171131, "epoch": 1018} {"train_loss": -11.499370574951172, "global_step": 171132, "epoch": 1018} {"train_loss": -11.195545196533203, "global_step": 171133, "epoch": 1018} {"train_loss": -11.26679801940918, "global_step": 171134, "epoch": 1018} {"train_loss": -11.141975402832031, "global_step": 171135, "epoch": 1018} {"train_loss": -11.294157028198242, "global_step": 171136, "epoch": 1018} {"train_loss": -11.359009742736816, "global_step": 171137, "epoch": 1018} {"train_loss": -11.359100341796875, "global_step": 171138, "epoch": 1018} {"train_loss": -11.501630783081055, "global_step": 171139, "epoch": 1018} {"train_loss": -11.364048957824707, "global_step": 171140, "epoch": 1018} {"train_loss": -10.964864730834961, "global_step": 171141, "epoch": 1018} {"train_loss": -11.585832595825195, "global_step": 171142, "epoch": 1018} {"train_loss": -11.493056297302246, "global_step": 171143, "epoch": 1018} {"train_loss": -11.402114868164062, "global_step": 171144, "epoch": 1018} {"train_loss": -11.336105346679688, "global_step": 171145, "epoch": 1018} {"train_loss": -11.292887687683105, "global_step": 171146, "epoch": 1018} {"train_loss": -11.426007270812988, "global_step": 171147, "epoch": 1018} {"train_loss": -11.220603942871094, "global_step": 171148, "epoch": 1018} {"train_loss": -11.344533920288086, "global_step": 171149, "epoch": 1018} {"train_loss": -11.421134948730469, "global_step": 171150, "epoch": 1018} {"train_loss": -11.319727897644043, "global_step": 171151, "epoch": 1018} {"train_loss": -11.269025802612305, "global_step": 171152, "epoch": 1018} {"train_loss": -11.362117767333984, "global_step": 171153, "epoch": 1018} {"train_loss": -11.091784477233887, "global_step": 171154, "epoch": 1018} {"train_loss": -11.406057357788086, "global_step": 171155, "epoch": 1018} {"train_loss": -11.408695220947266, "global_step": 171156, "epoch": 1018} {"train_loss": -10.39299488067627, "global_step": 171157, "epoch": 1018} {"train_loss": -10.405420303344727, "global_step": 171158, "epoch": 1018} {"train_loss": -10.686017990112305, "global_step": 171159, "epoch": 1018} {"train_loss": -9.662915229797363, "global_step": 171160, "epoch": 1018} {"train_loss": -10.102721214294434, "global_step": 171161, "epoch": 1018} {"train_loss": -10.930974006652832, "global_step": 171162, "epoch": 1018} {"train_loss": -9.370237350463867, "global_step": 171163, "epoch": 1018} {"train_loss": -9.595142364501953, "global_step": 171164, "epoch": 1018} {"train_loss": -10.104447364807129, "global_step": 171165, "epoch": 1018} {"train_loss": -10.25442886352539, "global_step": 171166, "epoch": 1018} {"train_loss": -8.737080574035645, "global_step": 171167, "epoch": 1018} {"train_loss": -8.830703735351562, "global_step": 171168, "epoch": 1018} {"train_loss": -9.062466621398926, "global_step": 171169, "epoch": 1018} {"train_loss": -9.582967758178711, "global_step": 171170, "epoch": 1018} {"train_loss": -8.880138397216797, "global_step": 171171, "epoch": 1018} {"train_loss": -9.29271125793457, "global_step": 171172, "epoch": 1018} {"train_loss": -9.336008071899414, "global_step": 171173, "epoch": 1018} {"train_loss": -8.996786117553711, "global_step": 171174, "epoch": 1018} {"train_loss": -8.749757766723633, "global_step": 171175, "epoch": 1018} {"train_loss": -9.334844589233398, "global_step": 171176, "epoch": 1018} {"train_loss": -9.111539840698242, "global_step": 171177, "epoch": 1018} {"train_loss": -8.491861343383789, "global_step": 171178, "epoch": 1018} {"train_loss": -9.353328704833984, "global_step": 171179, "epoch": 1018} {"train_loss": -10.474113464355469, "global_step": 171180, "epoch": 1018} {"train_loss": -9.650772094726562, "global_step": 171181, "epoch": 1018} {"train_loss": -8.940553665161133, "global_step": 171182, "epoch": 1018} {"train_loss": -9.87228775024414, "global_step": 171183, "epoch": 1018} {"train_loss": -10.279434204101562, "global_step": 171184, "epoch": 1018} {"train_loss": -10.075157165527344, "global_step": 171185, "epoch": 1018} {"train_loss": -9.86140251159668, "global_step": 171186, "epoch": 1018} {"train_loss": -10.154867172241211, "global_step": 171187, "epoch": 1018} {"train_loss": -10.755878448486328, "global_step": 171188, "epoch": 1018} {"train_loss": -9.653263092041016, "global_step": 171189, "epoch": 1018} {"train_loss": -9.951065063476562, "global_step": 171190, "epoch": 1018} {"train_loss": -10.778356398854937, "global_step": 171191, "epoch": 1018, "val_loss": 237684.0} {"train_loss": -10.342737197875977, "global_step": 171192, "epoch": 1019} {"train_loss": -10.190582275390625, "global_step": 171193, "epoch": 1019} {"train_loss": -10.291613578796387, "global_step": 171194, "epoch": 1019} {"train_loss": -10.627700805664062, "global_step": 171195, "epoch": 1019} {"train_loss": -10.583708763122559, "global_step": 171196, "epoch": 1019} {"train_loss": -10.200945854187012, "global_step": 171197, "epoch": 1019} {"train_loss": -10.451155662536621, "global_step": 171198, "epoch": 1019} {"train_loss": -10.665058135986328, "global_step": 171199, "epoch": 1019} {"train_loss": -10.51091194152832, "global_step": 171200, "epoch": 1019} {"train_loss": -10.40328311920166, "global_step": 171201, "epoch": 1019} {"train_loss": -10.658333778381348, "global_step": 171202, "epoch": 1019} {"train_loss": -10.706802368164062, "global_step": 171203, "epoch": 1019} {"train_loss": -10.521944046020508, "global_step": 171204, "epoch": 1019} {"train_loss": -10.6334867477417, "global_step": 171205, "epoch": 1019} {"train_loss": -10.825202941894531, "global_step": 171206, "epoch": 1019} {"train_loss": -10.961784362792969, "global_step": 171207, "epoch": 1019} {"train_loss": -10.702869415283203, "global_step": 171208, "epoch": 1019} {"train_loss": -10.706809997558594, "global_step": 171209, "epoch": 1019} {"train_loss": -10.679298400878906, "global_step": 171210, "epoch": 1019} {"train_loss": -10.891361236572266, "global_step": 171211, "epoch": 1019} {"train_loss": -10.834389686584473, "global_step": 171212, "epoch": 1019} {"train_loss": -10.78687858581543, "global_step": 171213, "epoch": 1019} {"train_loss": -10.899245262145996, "global_step": 171214, "epoch": 1019} {"train_loss": -10.906791687011719, "global_step": 171215, "epoch": 1019} {"train_loss": -10.975019454956055, "global_step": 171216, "epoch": 1019} {"train_loss": -11.042201042175293, "global_step": 171217, "epoch": 1019} {"train_loss": -11.188688278198242, "global_step": 171218, "epoch": 1019} {"train_loss": -10.877957344055176, "global_step": 171219, "epoch": 1019} {"train_loss": -11.06603717803955, "global_step": 171220, "epoch": 1019} {"train_loss": -11.082359313964844, "global_step": 171221, "epoch": 1019} {"train_loss": -11.02488899230957, "global_step": 171222, "epoch": 1019} {"train_loss": -11.063880920410156, "global_step": 171223, "epoch": 1019} {"train_loss": -11.0614595413208, "global_step": 171224, "epoch": 1019} {"train_loss": -11.021339416503906, "global_step": 171225, "epoch": 1019} {"train_loss": -11.189737319946289, "global_step": 171226, "epoch": 1019} {"train_loss": -11.089200973510742, "global_step": 171227, "epoch": 1019} {"train_loss": -11.24669361114502, "global_step": 171228, "epoch": 1019} {"train_loss": -11.026559829711914, "global_step": 171229, "epoch": 1019} {"train_loss": -11.098294258117676, "global_step": 171230, "epoch": 1019} {"train_loss": -11.184842109680176, "global_step": 171231, "epoch": 1019} {"train_loss": -11.18838119506836, "global_step": 171232, "epoch": 1019} {"train_loss": -10.996101379394531, "global_step": 171233, "epoch": 1019} {"train_loss": -11.313447952270508, "global_step": 171234, "epoch": 1019} {"train_loss": -11.227278709411621, "global_step": 171235, "epoch": 1019} {"train_loss": -11.017741203308105, "global_step": 171236, "epoch": 1019} {"train_loss": -11.31412410736084, "global_step": 171237, "epoch": 1019} {"train_loss": -11.080766677856445, "global_step": 171238, "epoch": 1019} {"train_loss": -11.351116180419922, "global_step": 171239, "epoch": 1019} {"train_loss": -11.088897705078125, "global_step": 171240, "epoch": 1019} {"train_loss": -11.272964477539062, "global_step": 171241, "epoch": 1019} {"train_loss": -11.19313907623291, "global_step": 171242, "epoch": 1019} {"train_loss": -11.3138427734375, "global_step": 171243, "epoch": 1019} {"train_loss": -11.362098693847656, "global_step": 171244, "epoch": 1019} {"train_loss": -11.318704605102539, "global_step": 171245, "epoch": 1019} {"train_loss": -11.286030769348145, "global_step": 171246, "epoch": 1019} {"train_loss": -11.283892631530762, "global_step": 171247, "epoch": 1019} {"train_loss": -11.302878379821777, "global_step": 171248, "epoch": 1019} {"train_loss": -11.242687225341797, "global_step": 171249, "epoch": 1019} {"train_loss": -11.319812774658203, "global_step": 171250, "epoch": 1019} {"train_loss": -11.306840896606445, "global_step": 171251, "epoch": 1019} {"train_loss": -11.510761260986328, "global_step": 171252, "epoch": 1019} {"train_loss": -11.366443634033203, "global_step": 171253, "epoch": 1019} {"train_loss": -11.389415740966797, "global_step": 171254, "epoch": 1019} {"train_loss": -11.357492446899414, "global_step": 171255, "epoch": 1019} {"train_loss": -11.198827743530273, "global_step": 171256, "epoch": 1019} {"train_loss": -11.195310592651367, "global_step": 171257, "epoch": 1019} {"train_loss": -11.180339813232422, "global_step": 171258, "epoch": 1019} {"train_loss": -11.07365608215332, "global_step": 171259, "epoch": 1019} {"train_loss": -11.137771606445312, "global_step": 171260, "epoch": 1019} {"train_loss": -10.420970916748047, "global_step": 171261, "epoch": 1019} {"train_loss": -9.535758018493652, "global_step": 171262, "epoch": 1019} {"train_loss": -10.465351104736328, "global_step": 171263, "epoch": 1019} {"train_loss": -11.053150177001953, "global_step": 171264, "epoch": 1019} {"train_loss": -10.035117149353027, "global_step": 171265, "epoch": 1019} {"train_loss": -9.88065242767334, "global_step": 171266, "epoch": 1019} {"train_loss": -11.186979293823242, "global_step": 171267, "epoch": 1019} {"train_loss": -8.957294464111328, "global_step": 171268, "epoch": 1019} {"train_loss": -10.303159713745117, "global_step": 171269, "epoch": 1019} {"train_loss": -10.582889556884766, "global_step": 171270, "epoch": 1019} {"train_loss": -8.88691234588623, "global_step": 171271, "epoch": 1019} {"train_loss": -10.727922439575195, "global_step": 171272, "epoch": 1019} {"train_loss": -8.309986114501953, "global_step": 171273, "epoch": 1019} {"train_loss": -9.974630355834961, "global_step": 171274, "epoch": 1019} {"train_loss": -8.221612930297852, "global_step": 171275, "epoch": 1019} {"train_loss": -8.36120319366455, "global_step": 171276, "epoch": 1019} {"train_loss": -8.955812454223633, "global_step": 171277, "epoch": 1019} {"train_loss": -7.146143913269043, "global_step": 171278, "epoch": 1019} {"train_loss": -8.740917205810547, "global_step": 171279, "epoch": 1019} {"train_loss": -7.4437150955200195, "global_step": 171280, "epoch": 1019} {"train_loss": -7.58992862701416, "global_step": 171281, "epoch": 1019} {"train_loss": -10.21941089630127, "global_step": 171282, "epoch": 1019} {"train_loss": -9.244739532470703, "global_step": 171283, "epoch": 1019} {"train_loss": -9.591226577758789, "global_step": 171284, "epoch": 1019} {"train_loss": -9.822580337524414, "global_step": 171285, "epoch": 1019} {"train_loss": -9.713043212890625, "global_step": 171286, "epoch": 1019} {"train_loss": -9.910178184509277, "global_step": 171287, "epoch": 1019} {"train_loss": -9.77907943725586, "global_step": 171288, "epoch": 1019} {"train_loss": -10.548351287841797, "global_step": 171289, "epoch": 1019} {"train_loss": -9.598176002502441, "global_step": 171290, "epoch": 1019} {"train_loss": -10.025230407714844, "global_step": 171291, "epoch": 1019} {"train_loss": -10.242773056030273, "global_step": 171292, "epoch": 1019} {"train_loss": -10.331252098083496, "global_step": 171293, "epoch": 1019} {"train_loss": -10.479337692260742, "global_step": 171294, "epoch": 1019} {"train_loss": -10.864734649658203, "global_step": 171295, "epoch": 1019} {"train_loss": -10.579763412475586, "global_step": 171296, "epoch": 1019} {"train_loss": -10.43165111541748, "global_step": 171297, "epoch": 1019} {"train_loss": -10.753995895385742, "global_step": 171298, "epoch": 1019} {"train_loss": -10.581095695495605, "global_step": 171299, "epoch": 1019} {"train_loss": -10.709846496582031, "global_step": 171300, "epoch": 1019} {"train_loss": -10.812883377075195, "global_step": 171301, "epoch": 1019} {"train_loss": -10.906588554382324, "global_step": 171302, "epoch": 1019} {"train_loss": -10.708066940307617, "global_step": 171303, "epoch": 1019} {"train_loss": -10.775346755981445, "global_step": 171304, "epoch": 1019} {"train_loss": -10.718473434448242, "global_step": 171305, "epoch": 1019} {"train_loss": -10.934183120727539, "global_step": 171306, "epoch": 1019} {"train_loss": -10.595589637756348, "global_step": 171307, "epoch": 1019} {"train_loss": -10.606544494628906, "global_step": 171308, "epoch": 1019} {"train_loss": -10.922561645507812, "global_step": 171309, "epoch": 1019} {"train_loss": -10.715463638305664, "global_step": 171310, "epoch": 1019} {"train_loss": -10.852823257446289, "global_step": 171311, "epoch": 1019} {"train_loss": -10.662599563598633, "global_step": 171312, "epoch": 1019} {"train_loss": -11.02589225769043, "global_step": 171313, "epoch": 1019} {"train_loss": -10.940227508544922, "global_step": 171314, "epoch": 1019} {"train_loss": -11.01851749420166, "global_step": 171315, "epoch": 1019} {"train_loss": -10.875551223754883, "global_step": 171316, "epoch": 1019} {"train_loss": -10.989557266235352, "global_step": 171317, "epoch": 1019} {"train_loss": -10.78620719909668, "global_step": 171318, "epoch": 1019} {"train_loss": -10.935955047607422, "global_step": 171319, "epoch": 1019} {"train_loss": -10.929195404052734, "global_step": 171320, "epoch": 1019} {"train_loss": -11.099056243896484, "global_step": 171321, "epoch": 1019} {"train_loss": -10.893226623535156, "global_step": 171322, "epoch": 1019} {"train_loss": -11.189635276794434, "global_step": 171323, "epoch": 1019} {"train_loss": -11.12625503540039, "global_step": 171324, "epoch": 1019} {"train_loss": -10.959010124206543, "global_step": 171325, "epoch": 1019} {"train_loss": -10.97744369506836, "global_step": 171326, "epoch": 1019} {"train_loss": -11.056695938110352, "global_step": 171327, "epoch": 1019} {"train_loss": -11.178525924682617, "global_step": 171328, "epoch": 1019} {"train_loss": -11.206722259521484, "global_step": 171329, "epoch": 1019} {"train_loss": -11.049467086791992, "global_step": 171330, "epoch": 1019} {"train_loss": -11.192856788635254, "global_step": 171331, "epoch": 1019} {"train_loss": -10.954835891723633, "global_step": 171332, "epoch": 1019} {"train_loss": -11.186697959899902, "global_step": 171333, "epoch": 1019} {"train_loss": -10.869792938232422, "global_step": 171334, "epoch": 1019} {"train_loss": -11.22500228881836, "global_step": 171335, "epoch": 1019} {"train_loss": -11.164153099060059, "global_step": 171336, "epoch": 1019} {"train_loss": -11.165889739990234, "global_step": 171337, "epoch": 1019} {"train_loss": -11.142566680908203, "global_step": 171338, "epoch": 1019} {"train_loss": -10.91975212097168, "global_step": 171339, "epoch": 1019} {"train_loss": -11.170778274536133, "global_step": 171340, "epoch": 1019} {"train_loss": -10.83957290649414, "global_step": 171341, "epoch": 1019} {"train_loss": -11.099289894104004, "global_step": 171342, "epoch": 1019} {"train_loss": -10.966943740844727, "global_step": 171343, "epoch": 1019} {"train_loss": -10.994752883911133, "global_step": 171344, "epoch": 1019} {"train_loss": -10.910039901733398, "global_step": 171345, "epoch": 1019} {"train_loss": -11.388847351074219, "global_step": 171346, "epoch": 1019} {"train_loss": -10.504243850708008, "global_step": 171347, "epoch": 1019} {"train_loss": -11.353654861450195, "global_step": 171348, "epoch": 1019} {"train_loss": -10.934526443481445, "global_step": 171349, "epoch": 1019} {"train_loss": -10.991483688354492, "global_step": 171350, "epoch": 1019} {"train_loss": -11.044533729553223, "global_step": 171351, "epoch": 1019} {"train_loss": -10.936483383178711, "global_step": 171352, "epoch": 1019} {"train_loss": -11.0087890625, "global_step": 171353, "epoch": 1019} {"train_loss": -11.257261276245117, "global_step": 171354, "epoch": 1019} {"train_loss": -10.918100357055664, "global_step": 171355, "epoch": 1019} {"train_loss": -11.016960144042969, "global_step": 171356, "epoch": 1019} {"train_loss": -11.111563682556152, "global_step": 171357, "epoch": 1019} {"train_loss": -11.185514450073242, "global_step": 171358, "epoch": 1019} {"train_loss": -10.696022516205197, "global_step": 171359, "epoch": 1019, "val_loss": 231654.953125} {"train_loss": -11.209098815917969, "global_step": 171360, "epoch": 1020} {"train_loss": -11.092918395996094, "global_step": 171361, "epoch": 1020} {"train_loss": -10.963340759277344, "global_step": 171362, "epoch": 1020} {"train_loss": -11.209273338317871, "global_step": 171363, "epoch": 1020} {"train_loss": -11.293292999267578, "global_step": 171364, "epoch": 1020} {"train_loss": -10.968353271484375, "global_step": 171365, "epoch": 1020} {"train_loss": -11.272913932800293, "global_step": 171366, "epoch": 1020} {"train_loss": -10.898222923278809, "global_step": 171367, "epoch": 1020} {"train_loss": -11.212505340576172, "global_step": 171368, "epoch": 1020} {"train_loss": -10.492780685424805, "global_step": 171369, "epoch": 1020} {"train_loss": -10.883354187011719, "global_step": 171370, "epoch": 1020} {"train_loss": -10.995734214782715, "global_step": 171371, "epoch": 1020} {"train_loss": -11.179288864135742, "global_step": 171372, "epoch": 1020} {"train_loss": -10.835234642028809, "global_step": 171373, "epoch": 1020} {"train_loss": -11.025161743164062, "global_step": 171374, "epoch": 1020} {"train_loss": -10.563156127929688, "global_step": 171375, "epoch": 1020} {"train_loss": -11.26763916015625, "global_step": 171376, "epoch": 1020} {"train_loss": -10.91137981414795, "global_step": 171377, "epoch": 1020} {"train_loss": -11.03004264831543, "global_step": 171378, "epoch": 1020} {"train_loss": -10.480484008789062, "global_step": 171379, "epoch": 1020} {"train_loss": -10.257105827331543, "global_step": 171380, "epoch": 1020} {"train_loss": -10.738015174865723, "global_step": 171381, "epoch": 1020} {"train_loss": -10.26416015625, "global_step": 171382, "epoch": 1020} {"train_loss": -9.594746589660645, "global_step": 171383, "epoch": 1020} {"train_loss": -10.89391803741455, "global_step": 171384, "epoch": 1020} {"train_loss": -10.614654541015625, "global_step": 171385, "epoch": 1020} {"train_loss": -10.543513298034668, "global_step": 171386, "epoch": 1020} {"train_loss": -10.965054512023926, "global_step": 171387, "epoch": 1020} {"train_loss": -10.67255973815918, "global_step": 171388, "epoch": 1020} {"train_loss": -10.636472702026367, "global_step": 171389, "epoch": 1020} {"train_loss": -11.030618667602539, "global_step": 171390, "epoch": 1020} {"train_loss": -10.77297592163086, "global_step": 171391, "epoch": 1020} {"train_loss": -10.696256637573242, "global_step": 171392, "epoch": 1020} {"train_loss": -10.580564498901367, "global_step": 171393, "epoch": 1020} {"train_loss": -10.763358116149902, "global_step": 171394, "epoch": 1020} {"train_loss": -10.591760635375977, "global_step": 171395, "epoch": 1020} {"train_loss": -10.458746910095215, "global_step": 171396, "epoch": 1020} {"train_loss": -10.432339668273926, "global_step": 171397, "epoch": 1020} {"train_loss": -10.579965591430664, "global_step": 171398, "epoch": 1020} {"train_loss": -10.29159164428711, "global_step": 171399, "epoch": 1020} {"train_loss": -10.732925415039062, "global_step": 171400, "epoch": 1020} {"train_loss": -10.047046661376953, "global_step": 171401, "epoch": 1020} {"train_loss": -10.700996398925781, "global_step": 171402, "epoch": 1020} {"train_loss": -10.669499397277832, "global_step": 171403, "epoch": 1020} {"train_loss": -10.374778747558594, "global_step": 171404, "epoch": 1020} {"train_loss": -10.719171524047852, "global_step": 171405, "epoch": 1020} {"train_loss": -10.60103988647461, "global_step": 171406, "epoch": 1020} {"train_loss": -10.541011810302734, "global_step": 171407, "epoch": 1020} {"train_loss": -10.77735424041748, "global_step": 171408, "epoch": 1020} {"train_loss": -10.48824405670166, "global_step": 171409, "epoch": 1020} {"train_loss": -10.766006469726562, "global_step": 171410, "epoch": 1020} {"train_loss": -10.81731128692627, "global_step": 171411, "epoch": 1020} {"train_loss": -10.671985626220703, "global_step": 171412, "epoch": 1020} {"train_loss": -10.708881378173828, "global_step": 171413, "epoch": 1020} {"train_loss": -10.81379508972168, "global_step": 171414, "epoch": 1020} {"train_loss": -10.67129135131836, "global_step": 171415, "epoch": 1020} {"train_loss": -10.749099731445312, "global_step": 171416, "epoch": 1020} {"train_loss": -10.677694320678711, "global_step": 171417, "epoch": 1020} {"train_loss": -10.843799591064453, "global_step": 171418, "epoch": 1020} {"train_loss": -10.58427906036377, "global_step": 171419, "epoch": 1020} {"train_loss": -10.789525985717773, "global_step": 171420, "epoch": 1020} {"train_loss": -11.049356460571289, "global_step": 171421, "epoch": 1020} {"train_loss": -10.532280921936035, "global_step": 171422, "epoch": 1020} {"train_loss": -10.959188461303711, "global_step": 171423, "epoch": 1020} {"train_loss": -10.405576705932617, "global_step": 171424, "epoch": 1020} {"train_loss": -10.895843505859375, "global_step": 171425, "epoch": 1020} {"train_loss": -10.452131271362305, "global_step": 171426, "epoch": 1020} {"train_loss": -10.695348739624023, "global_step": 171427, "epoch": 1020} {"train_loss": -10.799215316772461, "global_step": 171428, "epoch": 1020} {"train_loss": -10.793144226074219, "global_step": 171429, "epoch": 1020} {"train_loss": -10.738454818725586, "global_step": 171430, "epoch": 1020} {"train_loss": -10.866212844848633, "global_step": 171431, "epoch": 1020} {"train_loss": -10.71420955657959, "global_step": 171432, "epoch": 1020} {"train_loss": -10.744804382324219, "global_step": 171433, "epoch": 1020} {"train_loss": -10.631977081298828, "global_step": 171434, "epoch": 1020} {"train_loss": -10.895613670349121, "global_step": 171435, "epoch": 1020} {"train_loss": -10.890724182128906, "global_step": 171436, "epoch": 1020} {"train_loss": -11.159358978271484, "global_step": 171437, "epoch": 1020} {"train_loss": -10.790170669555664, "global_step": 171438, "epoch": 1020} {"train_loss": -10.880739212036133, "global_step": 171439, "epoch": 1020} {"train_loss": -10.547945976257324, "global_step": 171440, "epoch": 1020} {"train_loss": -10.935657501220703, "global_step": 171441, "epoch": 1020} {"train_loss": -10.978342056274414, "global_step": 171442, "epoch": 1020} {"train_loss": -10.994363784790039, "global_step": 171443, "epoch": 1020} {"train_loss": -10.978950500488281, "global_step": 171444, "epoch": 1020} {"train_loss": -11.13088321685791, "global_step": 171445, "epoch": 1020} {"train_loss": -11.170120239257812, "global_step": 171446, "epoch": 1020} {"train_loss": -10.839250564575195, "global_step": 171447, "epoch": 1020} {"train_loss": -11.051100730895996, "global_step": 171448, "epoch": 1020} {"train_loss": -11.097555160522461, "global_step": 171449, "epoch": 1020} {"train_loss": -11.100004196166992, "global_step": 171450, "epoch": 1020} {"train_loss": -11.203222274780273, "global_step": 171451, "epoch": 1020} {"train_loss": -11.075531005859375, "global_step": 171452, "epoch": 1020} {"train_loss": -11.177156448364258, "global_step": 171453, "epoch": 1020} {"train_loss": -10.906099319458008, "global_step": 171454, "epoch": 1020} {"train_loss": -10.803096771240234, "global_step": 171455, "epoch": 1020} {"train_loss": -11.083572387695312, "global_step": 171456, "epoch": 1020} {"train_loss": -11.23298454284668, "global_step": 171457, "epoch": 1020} {"train_loss": -10.675140380859375, "global_step": 171458, "epoch": 1020} {"train_loss": -10.955854415893555, "global_step": 171459, "epoch": 1020} {"train_loss": -10.74189281463623, "global_step": 171460, "epoch": 1020} {"train_loss": -10.783998489379883, "global_step": 171461, "epoch": 1020} {"train_loss": -11.173713684082031, "global_step": 171462, "epoch": 1020} {"train_loss": -10.737672805786133, "global_step": 171463, "epoch": 1020} {"train_loss": -11.173094749450684, "global_step": 171464, "epoch": 1020} {"train_loss": -10.938850402832031, "global_step": 171465, "epoch": 1020} {"train_loss": -10.974565505981445, "global_step": 171466, "epoch": 1020} {"train_loss": -10.52072811126709, "global_step": 171467, "epoch": 1020} {"train_loss": -11.438301086425781, "global_step": 171468, "epoch": 1020} {"train_loss": -10.57394027709961, "global_step": 171469, "epoch": 1020} {"train_loss": -11.13717269897461, "global_step": 171470, "epoch": 1020} {"train_loss": -10.425310134887695, "global_step": 171471, "epoch": 1020} {"train_loss": -10.68511962890625, "global_step": 171472, "epoch": 1020} {"train_loss": -10.990713119506836, "global_step": 171473, "epoch": 1020} {"train_loss": -10.546133995056152, "global_step": 171474, "epoch": 1020} {"train_loss": -10.17469310760498, "global_step": 171475, "epoch": 1020} {"train_loss": -10.843027114868164, "global_step": 171476, "epoch": 1020} {"train_loss": -10.345881462097168, "global_step": 171477, "epoch": 1020} {"train_loss": -11.016671180725098, "global_step": 171478, "epoch": 1020} {"train_loss": -10.961785316467285, "global_step": 171479, "epoch": 1020} {"train_loss": -10.948443412780762, "global_step": 171480, "epoch": 1020} {"train_loss": -10.9710054397583, "global_step": 171481, "epoch": 1020} {"train_loss": -11.335659980773926, "global_step": 171482, "epoch": 1020} {"train_loss": -10.895669937133789, "global_step": 171483, "epoch": 1020} {"train_loss": -10.927892684936523, "global_step": 171484, "epoch": 1020} {"train_loss": -10.774707794189453, "global_step": 171485, "epoch": 1020} {"train_loss": -10.88104248046875, "global_step": 171486, "epoch": 1020} {"train_loss": -11.27849292755127, "global_step": 171487, "epoch": 1020} {"train_loss": -10.683979034423828, "global_step": 171488, "epoch": 1020} {"train_loss": -11.00787353515625, "global_step": 171489, "epoch": 1020} {"train_loss": -10.545341491699219, "global_step": 171490, "epoch": 1020} {"train_loss": -10.942007064819336, "global_step": 171491, "epoch": 1020} {"train_loss": -10.78645133972168, "global_step": 171492, "epoch": 1020} {"train_loss": -10.601879119873047, "global_step": 171493, "epoch": 1020} {"train_loss": -10.609525680541992, "global_step": 171494, "epoch": 1020} {"train_loss": -10.785345077514648, "global_step": 171495, "epoch": 1020} {"train_loss": -10.850341796875, "global_step": 171496, "epoch": 1020} {"train_loss": -10.963085174560547, "global_step": 171497, "epoch": 1020} {"train_loss": -10.811214447021484, "global_step": 171498, "epoch": 1020} {"train_loss": -11.292318344116211, "global_step": 171499, "epoch": 1020} {"train_loss": -10.673027038574219, "global_step": 171500, "epoch": 1020} {"train_loss": -11.151050567626953, "global_step": 171501, "epoch": 1020} {"train_loss": -10.911040306091309, "global_step": 171502, "epoch": 1020} {"train_loss": -11.256103515625, "global_step": 171503, "epoch": 1020} {"train_loss": -10.871665000915527, "global_step": 171504, "epoch": 1020} {"train_loss": -10.823196411132812, "global_step": 171505, "epoch": 1020} {"train_loss": -11.196341514587402, "global_step": 171506, "epoch": 1020} {"train_loss": -10.709983825683594, "global_step": 171507, "epoch": 1020} {"train_loss": -11.26197624206543, "global_step": 171508, "epoch": 1020} {"train_loss": -11.09937572479248, "global_step": 171509, "epoch": 1020} {"train_loss": -11.23582935333252, "global_step": 171510, "epoch": 1020} {"train_loss": -11.170360565185547, "global_step": 171511, "epoch": 1020} {"train_loss": -11.079692840576172, "global_step": 171512, "epoch": 1020} {"train_loss": -11.258780479431152, "global_step": 171513, "epoch": 1020} {"train_loss": -10.962631225585938, "global_step": 171514, "epoch": 1020} {"train_loss": -11.1848783493042, "global_step": 171515, "epoch": 1020} {"train_loss": -11.050789833068848, "global_step": 171516, "epoch": 1020} {"train_loss": -11.23482894897461, "global_step": 171517, "epoch": 1020} {"train_loss": -11.256780624389648, "global_step": 171518, "epoch": 1020} {"train_loss": -11.240031242370605, "global_step": 171519, "epoch": 1020} {"train_loss": -11.305832862854004, "global_step": 171520, "epoch": 1020} {"train_loss": -11.204259872436523, "global_step": 171521, "epoch": 1020} {"train_loss": -11.237594604492188, "global_step": 171522, "epoch": 1020} {"train_loss": -10.969539642333984, "global_step": 171523, "epoch": 1020} {"train_loss": -10.845887184143066, "global_step": 171524, "epoch": 1020} {"train_loss": -11.129356384277344, "global_step": 171525, "epoch": 1020} {"train_loss": -10.826423645019531, "global_step": 171526, "epoch": 1020} {"train_loss": -10.857704957326254, "global_step": 171527, "epoch": 1020, "val_loss": 236314.640625, "train_action_mse_error": 0.3226850628852844} {"train_loss": -10.689252853393555, "global_step": 171528, "epoch": 1021} {"train_loss": -10.9412260055542, "global_step": 171529, "epoch": 1021} {"train_loss": -10.818355560302734, "global_step": 171530, "epoch": 1021} {"train_loss": -11.010740280151367, "global_step": 171531, "epoch": 1021} {"train_loss": -11.090484619140625, "global_step": 171532, "epoch": 1021} {"train_loss": -10.701669692993164, "global_step": 171533, "epoch": 1021} {"train_loss": -11.33298397064209, "global_step": 171534, "epoch": 1021} {"train_loss": -10.627765655517578, "global_step": 171535, "epoch": 1021} {"train_loss": -10.969548225402832, "global_step": 171536, "epoch": 1021} {"train_loss": -10.663373947143555, "global_step": 171537, "epoch": 1021} {"train_loss": -10.64535140991211, "global_step": 171538, "epoch": 1021} {"train_loss": -10.96992301940918, "global_step": 171539, "epoch": 1021} {"train_loss": -10.901265144348145, "global_step": 171540, "epoch": 1021} {"train_loss": -10.96546459197998, "global_step": 171541, "epoch": 1021} {"train_loss": -10.497907638549805, "global_step": 171542, "epoch": 1021} {"train_loss": -11.387163162231445, "global_step": 171543, "epoch": 1021} {"train_loss": -10.827723503112793, "global_step": 171544, "epoch": 1021} {"train_loss": -11.280423164367676, "global_step": 171545, "epoch": 1021} {"train_loss": -10.762453079223633, "global_step": 171546, "epoch": 1021} {"train_loss": -10.860687255859375, "global_step": 171547, "epoch": 1021} {"train_loss": -10.912694931030273, "global_step": 171548, "epoch": 1021} {"train_loss": -10.792011260986328, "global_step": 171549, "epoch": 1021} {"train_loss": -11.068781852722168, "global_step": 171550, "epoch": 1021} {"train_loss": -10.708879470825195, "global_step": 171551, "epoch": 1021} {"train_loss": -10.785344123840332, "global_step": 171552, "epoch": 1021} {"train_loss": -11.08988094329834, "global_step": 171553, "epoch": 1021} {"train_loss": -10.893049240112305, "global_step": 171554, "epoch": 1021} {"train_loss": -11.230610847473145, "global_step": 171555, "epoch": 1021} {"train_loss": -10.811822891235352, "global_step": 171556, "epoch": 1021} {"train_loss": -10.856081008911133, "global_step": 171557, "epoch": 1021} {"train_loss": -11.403593063354492, "global_step": 171558, "epoch": 1021} {"train_loss": -10.815513610839844, "global_step": 171559, "epoch": 1021} {"train_loss": -10.990830421447754, "global_step": 171560, "epoch": 1021} {"train_loss": -10.872634887695312, "global_step": 171561, "epoch": 1021} {"train_loss": -10.659676551818848, "global_step": 171562, "epoch": 1021} {"train_loss": -10.668506622314453, "global_step": 171563, "epoch": 1021} {"train_loss": -10.962684631347656, "global_step": 171564, "epoch": 1021} {"train_loss": -10.636960983276367, "global_step": 171565, "epoch": 1021} {"train_loss": -11.004555702209473, "global_step": 171566, "epoch": 1021} {"train_loss": -10.603856086730957, "global_step": 171567, "epoch": 1021} {"train_loss": -10.827642440795898, "global_step": 171568, "epoch": 1021} {"train_loss": -11.041152954101562, "global_step": 171569, "epoch": 1021} {"train_loss": -10.495831489562988, "global_step": 171570, "epoch": 1021} {"train_loss": -11.02579116821289, "global_step": 171571, "epoch": 1021} {"train_loss": -10.740118980407715, "global_step": 171572, "epoch": 1021} {"train_loss": -11.014493942260742, "global_step": 171573, "epoch": 1021} {"train_loss": -10.866634368896484, "global_step": 171574, "epoch": 1021} {"train_loss": -11.128971099853516, "global_step": 171575, "epoch": 1021} {"train_loss": -11.01876449584961, "global_step": 171576, "epoch": 1021} {"train_loss": -10.858770370483398, "global_step": 171577, "epoch": 1021} {"train_loss": -11.229703903198242, "global_step": 171578, "epoch": 1021} {"train_loss": -11.05571174621582, "global_step": 171579, "epoch": 1021} {"train_loss": -11.170125961303711, "global_step": 171580, "epoch": 1021} {"train_loss": -11.027729034423828, "global_step": 171581, "epoch": 1021} {"train_loss": -11.236116409301758, "global_step": 171582, "epoch": 1021} {"train_loss": -11.199793815612793, "global_step": 171583, "epoch": 1021} {"train_loss": -11.045218467712402, "global_step": 171584, "epoch": 1021} {"train_loss": -11.217817306518555, "global_step": 171585, "epoch": 1021} {"train_loss": -11.353976249694824, "global_step": 171586, "epoch": 1021} {"train_loss": -11.27486801147461, "global_step": 171587, "epoch": 1021} {"train_loss": -11.1505126953125, "global_step": 171588, "epoch": 1021} {"train_loss": -11.059076309204102, "global_step": 171589, "epoch": 1021} {"train_loss": -11.22317886352539, "global_step": 171590, "epoch": 1021} {"train_loss": -11.071704864501953, "global_step": 171591, "epoch": 1021} {"train_loss": -11.053861618041992, "global_step": 171592, "epoch": 1021} {"train_loss": -11.267057418823242, "global_step": 171593, "epoch": 1021} {"train_loss": -11.19196605682373, "global_step": 171594, "epoch": 1021} {"train_loss": -11.135964393615723, "global_step": 171595, "epoch": 1021} {"train_loss": -11.392609596252441, "global_step": 171596, "epoch": 1021} {"train_loss": -11.137350082397461, "global_step": 171597, "epoch": 1021} {"train_loss": -10.014841079711914, "global_step": 171598, "epoch": 1021} {"train_loss": -11.087770462036133, "global_step": 171599, "epoch": 1021} {"train_loss": -11.152820587158203, "global_step": 171600, "epoch": 1021} {"train_loss": -10.480507850646973, "global_step": 171601, "epoch": 1021} {"train_loss": -10.949056625366211, "global_step": 171602, "epoch": 1021} {"train_loss": -10.511722564697266, "global_step": 171603, "epoch": 1021} {"train_loss": -10.44442367553711, "global_step": 171604, "epoch": 1021} {"train_loss": -10.879219055175781, "global_step": 171605, "epoch": 1021} {"train_loss": -10.807662963867188, "global_step": 171606, "epoch": 1021} {"train_loss": -10.655399322509766, "global_step": 171607, "epoch": 1021} {"train_loss": -10.966825485229492, "global_step": 171608, "epoch": 1021} {"train_loss": -10.90991497039795, "global_step": 171609, "epoch": 1021} {"train_loss": -10.81513786315918, "global_step": 171610, "epoch": 1021} {"train_loss": -10.367151260375977, "global_step": 171611, "epoch": 1021} {"train_loss": -11.136590957641602, "global_step": 171612, "epoch": 1021} {"train_loss": -11.209400177001953, "global_step": 171613, "epoch": 1021} {"train_loss": -10.740691184997559, "global_step": 171614, "epoch": 1021} {"train_loss": -11.172257423400879, "global_step": 171615, "epoch": 1021} {"train_loss": -10.903614044189453, "global_step": 171616, "epoch": 1021} {"train_loss": -11.062811851501465, "global_step": 171617, "epoch": 1021} {"train_loss": -11.041210174560547, "global_step": 171618, "epoch": 1021} {"train_loss": -10.985648155212402, "global_step": 171619, "epoch": 1021} {"train_loss": -10.716863632202148, "global_step": 171620, "epoch": 1021} {"train_loss": -11.1598482131958, "global_step": 171621, "epoch": 1021} {"train_loss": -11.05887508392334, "global_step": 171622, "epoch": 1021} {"train_loss": -10.999195098876953, "global_step": 171623, "epoch": 1021} {"train_loss": -11.093193054199219, "global_step": 171624, "epoch": 1021} {"train_loss": -10.979461669921875, "global_step": 171625, "epoch": 1021} {"train_loss": -11.388418197631836, "global_step": 171626, "epoch": 1021} {"train_loss": -11.195831298828125, "global_step": 171627, "epoch": 1021} {"train_loss": -11.10103988647461, "global_step": 171628, "epoch": 1021} {"train_loss": -11.210299491882324, "global_step": 171629, "epoch": 1021} {"train_loss": -11.03573226928711, "global_step": 171630, "epoch": 1021} {"train_loss": -10.876901626586914, "global_step": 171631, "epoch": 1021} {"train_loss": -11.113809585571289, "global_step": 171632, "epoch": 1021} {"train_loss": -11.086023330688477, "global_step": 171633, "epoch": 1021} {"train_loss": -10.969426155090332, "global_step": 171634, "epoch": 1021} {"train_loss": -10.822893142700195, "global_step": 171635, "epoch": 1021} {"train_loss": -11.025358200073242, "global_step": 171636, "epoch": 1021} {"train_loss": -11.068574905395508, "global_step": 171637, "epoch": 1021} {"train_loss": -10.91979694366455, "global_step": 171638, "epoch": 1021} {"train_loss": -10.865827560424805, "global_step": 171639, "epoch": 1021} {"train_loss": -10.946208953857422, "global_step": 171640, "epoch": 1021} {"train_loss": -10.571901321411133, "global_step": 171641, "epoch": 1021} {"train_loss": -10.982866287231445, "global_step": 171642, "epoch": 1021} {"train_loss": -9.919831275939941, "global_step": 171643, "epoch": 1021} {"train_loss": -10.655439376831055, "global_step": 171644, "epoch": 1021} {"train_loss": -11.049382209777832, "global_step": 171645, "epoch": 1021} {"train_loss": -9.992164611816406, "global_step": 171646, "epoch": 1021} {"train_loss": -10.82891845703125, "global_step": 171647, "epoch": 1021} {"train_loss": -10.558712005615234, "global_step": 171648, "epoch": 1021} {"train_loss": -10.92827320098877, "global_step": 171649, "epoch": 1021} {"train_loss": -11.211994171142578, "global_step": 171650, "epoch": 1021} {"train_loss": -10.587849617004395, "global_step": 171651, "epoch": 1021} {"train_loss": -11.269079208374023, "global_step": 171652, "epoch": 1021} {"train_loss": -10.728216171264648, "global_step": 171653, "epoch": 1021} {"train_loss": -11.204535484313965, "global_step": 171654, "epoch": 1021} {"train_loss": -10.824108123779297, "global_step": 171655, "epoch": 1021} {"train_loss": -11.196741104125977, "global_step": 171656, "epoch": 1021} {"train_loss": -10.87588119506836, "global_step": 171657, "epoch": 1021} {"train_loss": -11.249198913574219, "global_step": 171658, "epoch": 1021} {"train_loss": -10.921660423278809, "global_step": 171659, "epoch": 1021} {"train_loss": -11.22149658203125, "global_step": 171660, "epoch": 1021} {"train_loss": -11.241125106811523, "global_step": 171661, "epoch": 1021} {"train_loss": -11.035263061523438, "global_step": 171662, "epoch": 1021} {"train_loss": -11.200130462646484, "global_step": 171663, "epoch": 1021} {"train_loss": -11.253559112548828, "global_step": 171664, "epoch": 1021} {"train_loss": -11.005823135375977, "global_step": 171665, "epoch": 1021} {"train_loss": -11.08323860168457, "global_step": 171666, "epoch": 1021} {"train_loss": -11.2884521484375, "global_step": 171667, "epoch": 1021} {"train_loss": -11.313155174255371, "global_step": 171668, "epoch": 1021} {"train_loss": -11.176591873168945, "global_step": 171669, "epoch": 1021} {"train_loss": -11.125005722045898, "global_step": 171670, "epoch": 1021} {"train_loss": -11.173835754394531, "global_step": 171671, "epoch": 1021} {"train_loss": -11.392585754394531, "global_step": 171672, "epoch": 1021} {"train_loss": -11.259984970092773, "global_step": 171673, "epoch": 1021} {"train_loss": -11.244367599487305, "global_step": 171674, "epoch": 1021} {"train_loss": -11.140646934509277, "global_step": 171675, "epoch": 1021} {"train_loss": -11.047342300415039, "global_step": 171676, "epoch": 1021} {"train_loss": -11.455223083496094, "global_step": 171677, "epoch": 1021} {"train_loss": -10.697851181030273, "global_step": 171678, "epoch": 1021} {"train_loss": -10.936440467834473, "global_step": 171679, "epoch": 1021} {"train_loss": -11.23725700378418, "global_step": 171680, "epoch": 1021} {"train_loss": -11.07705307006836, "global_step": 171681, "epoch": 1021} {"train_loss": -11.330516815185547, "global_step": 171682, "epoch": 1021} {"train_loss": -10.896799087524414, "global_step": 171683, "epoch": 1021} {"train_loss": -10.98331356048584, "global_step": 171684, "epoch": 1021} {"train_loss": -11.003337860107422, "global_step": 171685, "epoch": 1021} {"train_loss": -11.242252349853516, "global_step": 171686, "epoch": 1021} {"train_loss": -11.1514892578125, "global_step": 171687, "epoch": 1021} {"train_loss": -11.309104919433594, "global_step": 171688, "epoch": 1021} {"train_loss": -11.187137603759766, "global_step": 171689, "epoch": 1021} {"train_loss": -10.81899642944336, "global_step": 171690, "epoch": 1021} {"train_loss": -11.044407844543457, "global_step": 171691, "epoch": 1021} {"train_loss": -11.177024841308594, "global_step": 171692, "epoch": 1021} {"train_loss": -11.000373840332031, "global_step": 171693, "epoch": 1021} {"train_loss": -11.268228530883789, "global_step": 171694, "epoch": 1021} {"train_loss": -10.98233001005082, "global_step": 171695, "epoch": 1021, "val_loss": 237566.578125} {"train_loss": -11.216032028198242, "global_step": 171696, "epoch": 1022} {"train_loss": -11.179641723632812, "global_step": 171697, "epoch": 1022} {"train_loss": -10.871417999267578, "global_step": 171698, "epoch": 1022} {"train_loss": -11.125027656555176, "global_step": 171699, "epoch": 1022} {"train_loss": -11.295445442199707, "global_step": 171700, "epoch": 1022} {"train_loss": -10.770503997802734, "global_step": 171701, "epoch": 1022} {"train_loss": -11.165889739990234, "global_step": 171702, "epoch": 1022} {"train_loss": -11.131380081176758, "global_step": 171703, "epoch": 1022} {"train_loss": -11.115340232849121, "global_step": 171704, "epoch": 1022} {"train_loss": -11.19727897644043, "global_step": 171705, "epoch": 1022} {"train_loss": -11.397176742553711, "global_step": 171706, "epoch": 1022} {"train_loss": -10.998255729675293, "global_step": 171707, "epoch": 1022} {"train_loss": -11.41944694519043, "global_step": 171708, "epoch": 1022} {"train_loss": -11.350461959838867, "global_step": 171709, "epoch": 1022} {"train_loss": -11.240440368652344, "global_step": 171710, "epoch": 1022} {"train_loss": -11.040167808532715, "global_step": 171711, "epoch": 1022} {"train_loss": -11.200455665588379, "global_step": 171712, "epoch": 1022} {"train_loss": -11.365026473999023, "global_step": 171713, "epoch": 1022} {"train_loss": -11.194578170776367, "global_step": 171714, "epoch": 1022} {"train_loss": -11.597237586975098, "global_step": 171715, "epoch": 1022} {"train_loss": -11.608169555664062, "global_step": 171716, "epoch": 1022} {"train_loss": -11.248123168945312, "global_step": 171717, "epoch": 1022} {"train_loss": -11.249269485473633, "global_step": 171718, "epoch": 1022} {"train_loss": -11.577583312988281, "global_step": 171719, "epoch": 1022} {"train_loss": -11.498220443725586, "global_step": 171720, "epoch": 1022} {"train_loss": -11.372190475463867, "global_step": 171721, "epoch": 1022} {"train_loss": -11.296051979064941, "global_step": 171722, "epoch": 1022} {"train_loss": -11.302241325378418, "global_step": 171723, "epoch": 1022} {"train_loss": -11.380340576171875, "global_step": 171724, "epoch": 1022} {"train_loss": -10.992694854736328, "global_step": 171725, "epoch": 1022} {"train_loss": -11.242877960205078, "global_step": 171726, "epoch": 1022} {"train_loss": -11.220331192016602, "global_step": 171727, "epoch": 1022} {"train_loss": -10.101463317871094, "global_step": 171728, "epoch": 1022} {"train_loss": -11.009197235107422, "global_step": 171729, "epoch": 1022} {"train_loss": -10.911336898803711, "global_step": 171730, "epoch": 1022} {"train_loss": -9.832371711730957, "global_step": 171731, "epoch": 1022} {"train_loss": -9.716840744018555, "global_step": 171732, "epoch": 1022} {"train_loss": -11.192596435546875, "global_step": 171733, "epoch": 1022} {"train_loss": -10.545188903808594, "global_step": 171734, "epoch": 1022} {"train_loss": -10.485873222351074, "global_step": 171735, "epoch": 1022} {"train_loss": -10.70201301574707, "global_step": 171736, "epoch": 1022} {"train_loss": -9.823763847351074, "global_step": 171737, "epoch": 1022} {"train_loss": -10.717456817626953, "global_step": 171738, "epoch": 1022} {"train_loss": -8.77420425415039, "global_step": 171739, "epoch": 1022} {"train_loss": -10.835983276367188, "global_step": 171740, "epoch": 1022} {"train_loss": -9.32353401184082, "global_step": 171741, "epoch": 1022} {"train_loss": -10.916114807128906, "global_step": 171742, "epoch": 1022} {"train_loss": -10.407187461853027, "global_step": 171743, "epoch": 1022} {"train_loss": -11.036161422729492, "global_step": 171744, "epoch": 1022} {"train_loss": -10.435503005981445, "global_step": 171745, "epoch": 1022} {"train_loss": -11.01943588256836, "global_step": 171746, "epoch": 1022} {"train_loss": -11.130685806274414, "global_step": 171747, "epoch": 1022} {"train_loss": -10.80589485168457, "global_step": 171748, "epoch": 1022} {"train_loss": -11.029520034790039, "global_step": 171749, "epoch": 1022} {"train_loss": -10.73559284210205, "global_step": 171750, "epoch": 1022} {"train_loss": -11.126653671264648, "global_step": 171751, "epoch": 1022} {"train_loss": -10.875175476074219, "global_step": 171752, "epoch": 1022} {"train_loss": -11.178424835205078, "global_step": 171753, "epoch": 1022} {"train_loss": -10.890186309814453, "global_step": 171754, "epoch": 1022} {"train_loss": -10.808571815490723, "global_step": 171755, "epoch": 1022} {"train_loss": -11.10930061340332, "global_step": 171756, "epoch": 1022} {"train_loss": -10.835762023925781, "global_step": 171757, "epoch": 1022} {"train_loss": -11.002849578857422, "global_step": 171758, "epoch": 1022} {"train_loss": -10.656515121459961, "global_step": 171759, "epoch": 1022} {"train_loss": -10.6113862991333, "global_step": 171760, "epoch": 1022} {"train_loss": -10.806097030639648, "global_step": 171761, "epoch": 1022} {"train_loss": -10.736591339111328, "global_step": 171762, "epoch": 1022} {"train_loss": -11.088516235351562, "global_step": 171763, "epoch": 1022} {"train_loss": -11.049076080322266, "global_step": 171764, "epoch": 1022} {"train_loss": -11.047471046447754, "global_step": 171765, "epoch": 1022} {"train_loss": -10.89415168762207, "global_step": 171766, "epoch": 1022} {"train_loss": -10.877281188964844, "global_step": 171767, "epoch": 1022} {"train_loss": -10.98032283782959, "global_step": 171768, "epoch": 1022} {"train_loss": -10.519615173339844, "global_step": 171769, "epoch": 1022} {"train_loss": -10.68048095703125, "global_step": 171770, "epoch": 1022} {"train_loss": -10.874399185180664, "global_step": 171771, "epoch": 1022} {"train_loss": -11.242305755615234, "global_step": 171772, "epoch": 1022} {"train_loss": -11.15890884399414, "global_step": 171773, "epoch": 1022} {"train_loss": -11.188156127929688, "global_step": 171774, "epoch": 1022} {"train_loss": -11.123771667480469, "global_step": 171775, "epoch": 1022} {"train_loss": -11.083128929138184, "global_step": 171776, "epoch": 1022} {"train_loss": -10.830782890319824, "global_step": 171777, "epoch": 1022} {"train_loss": -11.188295364379883, "global_step": 171778, "epoch": 1022} {"train_loss": -11.040085792541504, "global_step": 171779, "epoch": 1022} {"train_loss": -11.340753555297852, "global_step": 171780, "epoch": 1022} {"train_loss": -11.05160903930664, "global_step": 171781, "epoch": 1022} {"train_loss": -10.941041946411133, "global_step": 171782, "epoch": 1022} {"train_loss": -11.000049591064453, "global_step": 171783, "epoch": 1022} {"train_loss": -11.06480598449707, "global_step": 171784, "epoch": 1022} {"train_loss": -10.691230773925781, "global_step": 171785, "epoch": 1022} {"train_loss": -10.817703247070312, "global_step": 171786, "epoch": 1022} {"train_loss": -11.070878982543945, "global_step": 171787, "epoch": 1022} {"train_loss": -10.500328063964844, "global_step": 171788, "epoch": 1022} {"train_loss": -11.252212524414062, "global_step": 171789, "epoch": 1022} {"train_loss": -10.736251831054688, "global_step": 171790, "epoch": 1022} {"train_loss": -10.708106994628906, "global_step": 171791, "epoch": 1022} {"train_loss": -11.298059463500977, "global_step": 171792, "epoch": 1022} {"train_loss": -10.709470748901367, "global_step": 171793, "epoch": 1022} {"train_loss": -11.2162446975708, "global_step": 171794, "epoch": 1022} {"train_loss": -11.077486038208008, "global_step": 171795, "epoch": 1022} {"train_loss": -11.101239204406738, "global_step": 171796, "epoch": 1022} {"train_loss": -10.97330093383789, "global_step": 171797, "epoch": 1022} {"train_loss": -11.128084182739258, "global_step": 171798, "epoch": 1022} {"train_loss": -10.856584548950195, "global_step": 171799, "epoch": 1022} {"train_loss": -10.783088684082031, "global_step": 171800, "epoch": 1022} {"train_loss": -10.463611602783203, "global_step": 171801, "epoch": 1022} {"train_loss": -10.56098747253418, "global_step": 171802, "epoch": 1022} {"train_loss": -10.838750839233398, "global_step": 171803, "epoch": 1022} {"train_loss": -10.117019653320312, "global_step": 171804, "epoch": 1022} {"train_loss": -10.384428024291992, "global_step": 171805, "epoch": 1022} {"train_loss": -10.912328720092773, "global_step": 171806, "epoch": 1022} {"train_loss": -10.440947532653809, "global_step": 171807, "epoch": 1022} {"train_loss": -9.47716236114502, "global_step": 171808, "epoch": 1022} {"train_loss": -10.996706008911133, "global_step": 171809, "epoch": 1022} {"train_loss": -9.558509826660156, "global_step": 171810, "epoch": 1022} {"train_loss": -10.70926284790039, "global_step": 171811, "epoch": 1022} {"train_loss": -9.482023239135742, "global_step": 171812, "epoch": 1022} {"train_loss": -10.355587005615234, "global_step": 171813, "epoch": 1022} {"train_loss": -10.630023956298828, "global_step": 171814, "epoch": 1022} {"train_loss": -10.39741325378418, "global_step": 171815, "epoch": 1022} {"train_loss": -10.702585220336914, "global_step": 171816, "epoch": 1022} {"train_loss": -10.692939758300781, "global_step": 171817, "epoch": 1022} {"train_loss": -10.939144134521484, "global_step": 171818, "epoch": 1022} {"train_loss": -10.23686695098877, "global_step": 171819, "epoch": 1022} {"train_loss": -10.741411209106445, "global_step": 171820, "epoch": 1022} {"train_loss": -10.170221328735352, "global_step": 171821, "epoch": 1022} {"train_loss": -10.473095893859863, "global_step": 171822, "epoch": 1022} {"train_loss": -10.204166412353516, "global_step": 171823, "epoch": 1022} {"train_loss": -10.426419258117676, "global_step": 171824, "epoch": 1022} {"train_loss": -10.457564353942871, "global_step": 171825, "epoch": 1022} {"train_loss": -10.528400421142578, "global_step": 171826, "epoch": 1022} {"train_loss": -10.311765670776367, "global_step": 171827, "epoch": 1022} {"train_loss": -10.862080574035645, "global_step": 171828, "epoch": 1022} {"train_loss": -10.787330627441406, "global_step": 171829, "epoch": 1022} {"train_loss": -10.914728164672852, "global_step": 171830, "epoch": 1022} {"train_loss": -10.978715896606445, "global_step": 171831, "epoch": 1022} {"train_loss": -10.810700416564941, "global_step": 171832, "epoch": 1022} {"train_loss": -11.107671737670898, "global_step": 171833, "epoch": 1022} {"train_loss": -11.069832801818848, "global_step": 171834, "epoch": 1022} {"train_loss": -10.68045425415039, "global_step": 171835, "epoch": 1022} {"train_loss": -10.92951774597168, "global_step": 171836, "epoch": 1022} {"train_loss": -10.642558097839355, "global_step": 171837, "epoch": 1022} {"train_loss": -10.862852096557617, "global_step": 171838, "epoch": 1022} {"train_loss": -11.009472846984863, "global_step": 171839, "epoch": 1022} {"train_loss": -10.766834259033203, "global_step": 171840, "epoch": 1022} {"train_loss": -10.922971725463867, "global_step": 171841, "epoch": 1022} {"train_loss": -10.965999603271484, "global_step": 171842, "epoch": 1022} {"train_loss": -10.98185920715332, "global_step": 171843, "epoch": 1022} {"train_loss": -10.97637939453125, "global_step": 171844, "epoch": 1022} {"train_loss": -11.067503929138184, "global_step": 171845, "epoch": 1022} {"train_loss": -10.715347290039062, "global_step": 171846, "epoch": 1022} {"train_loss": -10.973821640014648, "global_step": 171847, "epoch": 1022} {"train_loss": -11.073430061340332, "global_step": 171848, "epoch": 1022} {"train_loss": -11.058248519897461, "global_step": 171849, "epoch": 1022} {"train_loss": -11.055534362792969, "global_step": 171850, "epoch": 1022} {"train_loss": -11.032614707946777, "global_step": 171851, "epoch": 1022} {"train_loss": -10.712465286254883, "global_step": 171852, "epoch": 1022} {"train_loss": -11.360021591186523, "global_step": 171853, "epoch": 1022} {"train_loss": -10.826643943786621, "global_step": 171854, "epoch": 1022} {"train_loss": -11.299552917480469, "global_step": 171855, "epoch": 1022} {"train_loss": -10.81415843963623, "global_step": 171856, "epoch": 1022} {"train_loss": -11.206000328063965, "global_step": 171857, "epoch": 1022} {"train_loss": -10.991908073425293, "global_step": 171858, "epoch": 1022} {"train_loss": -10.840644836425781, "global_step": 171859, "epoch": 1022} {"train_loss": -11.320255279541016, "global_step": 171860, "epoch": 1022} {"train_loss": -10.719478607177734, "global_step": 171861, "epoch": 1022} {"train_loss": -11.157159805297852, "global_step": 171862, "epoch": 1022} {"train_loss": -10.863713746979123, "global_step": 171863, "epoch": 1022, "val_loss": 239272.703125} {"train_loss": -10.830385208129883, "global_step": 171864, "epoch": 1023} {"train_loss": -11.29145622253418, "global_step": 171865, "epoch": 1023} {"train_loss": -10.559301376342773, "global_step": 171866, "epoch": 1023} {"train_loss": -10.899134635925293, "global_step": 171867, "epoch": 1023} {"train_loss": -10.951088905334473, "global_step": 171868, "epoch": 1023} {"train_loss": -10.978131294250488, "global_step": 171869, "epoch": 1023} {"train_loss": -11.085453033447266, "global_step": 171870, "epoch": 1023} {"train_loss": -10.983797073364258, "global_step": 171871, "epoch": 1023} {"train_loss": -11.302745819091797, "global_step": 171872, "epoch": 1023} {"train_loss": -11.120658874511719, "global_step": 171873, "epoch": 1023} {"train_loss": -10.814248085021973, "global_step": 171874, "epoch": 1023} {"train_loss": -11.158830642700195, "global_step": 171875, "epoch": 1023} {"train_loss": -10.452592849731445, "global_step": 171876, "epoch": 1023} {"train_loss": -11.148561477661133, "global_step": 171877, "epoch": 1023} {"train_loss": -10.687111854553223, "global_step": 171878, "epoch": 1023} {"train_loss": -11.198046684265137, "global_step": 171879, "epoch": 1023} {"train_loss": -10.862077713012695, "global_step": 171880, "epoch": 1023} {"train_loss": -10.771800994873047, "global_step": 171881, "epoch": 1023} {"train_loss": -11.00350284576416, "global_step": 171882, "epoch": 1023} {"train_loss": -11.168609619140625, "global_step": 171883, "epoch": 1023} {"train_loss": -11.398980140686035, "global_step": 171884, "epoch": 1023} {"train_loss": -11.102306365966797, "global_step": 171885, "epoch": 1023} {"train_loss": -10.812383651733398, "global_step": 171886, "epoch": 1023} {"train_loss": -10.715938568115234, "global_step": 171887, "epoch": 1023} {"train_loss": -10.939647674560547, "global_step": 171888, "epoch": 1023} {"train_loss": -11.041557312011719, "global_step": 171889, "epoch": 1023} {"train_loss": -10.443655014038086, "global_step": 171890, "epoch": 1023} {"train_loss": -11.179048538208008, "global_step": 171891, "epoch": 1023} {"train_loss": -10.36468505859375, "global_step": 171892, "epoch": 1023} {"train_loss": -11.210895538330078, "global_step": 171893, "epoch": 1023} {"train_loss": -10.3164644241333, "global_step": 171894, "epoch": 1023} {"train_loss": -11.151137351989746, "global_step": 171895, "epoch": 1023} {"train_loss": -10.59621810913086, "global_step": 171896, "epoch": 1023} {"train_loss": -11.10400676727295, "global_step": 171897, "epoch": 1023} {"train_loss": -10.526285171508789, "global_step": 171898, "epoch": 1023} {"train_loss": -10.527471542358398, "global_step": 171899, "epoch": 1023} {"train_loss": -10.67558765411377, "global_step": 171900, "epoch": 1023} {"train_loss": -10.77441120147705, "global_step": 171901, "epoch": 1023} {"train_loss": -10.895200729370117, "global_step": 171902, "epoch": 1023} {"train_loss": -10.970136642456055, "global_step": 171903, "epoch": 1023} {"train_loss": -10.872797966003418, "global_step": 171904, "epoch": 1023} {"train_loss": -10.966146469116211, "global_step": 171905, "epoch": 1023} {"train_loss": -10.889001846313477, "global_step": 171906, "epoch": 1023} {"train_loss": -10.714527130126953, "global_step": 171907, "epoch": 1023} {"train_loss": -10.796329498291016, "global_step": 171908, "epoch": 1023} {"train_loss": -11.279267311096191, "global_step": 171909, "epoch": 1023} {"train_loss": -10.816801071166992, "global_step": 171910, "epoch": 1023} {"train_loss": -11.27178955078125, "global_step": 171911, "epoch": 1023} {"train_loss": -10.929220199584961, "global_step": 171912, "epoch": 1023} {"train_loss": -11.14073657989502, "global_step": 171913, "epoch": 1023} {"train_loss": -10.651856422424316, "global_step": 171914, "epoch": 1023} {"train_loss": -10.839492797851562, "global_step": 171915, "epoch": 1023} {"train_loss": -10.948955535888672, "global_step": 171916, "epoch": 1023} {"train_loss": -11.043514251708984, "global_step": 171917, "epoch": 1023} {"train_loss": -11.0, "global_step": 171918, "epoch": 1023} {"train_loss": -11.18592643737793, "global_step": 171919, "epoch": 1023} {"train_loss": -10.95138168334961, "global_step": 171920, "epoch": 1023} {"train_loss": -11.184638977050781, "global_step": 171921, "epoch": 1023} {"train_loss": -10.985819816589355, "global_step": 171922, "epoch": 1023} {"train_loss": -10.845667839050293, "global_step": 171923, "epoch": 1023} {"train_loss": -10.818031311035156, "global_step": 171924, "epoch": 1023} {"train_loss": -10.702728271484375, "global_step": 171925, "epoch": 1023} {"train_loss": -11.067676544189453, "global_step": 171926, "epoch": 1023} {"train_loss": -11.03675651550293, "global_step": 171927, "epoch": 1023} {"train_loss": -11.011787414550781, "global_step": 171928, "epoch": 1023} {"train_loss": -11.20543098449707, "global_step": 171929, "epoch": 1023} {"train_loss": -10.775306701660156, "global_step": 171930, "epoch": 1023} {"train_loss": -10.85395336151123, "global_step": 171931, "epoch": 1023} {"train_loss": -10.9105806350708, "global_step": 171932, "epoch": 1023} {"train_loss": -11.104558944702148, "global_step": 171933, "epoch": 1023} {"train_loss": -11.038267135620117, "global_step": 171934, "epoch": 1023} {"train_loss": -11.083925247192383, "global_step": 171935, "epoch": 1023} {"train_loss": -11.104650497436523, "global_step": 171936, "epoch": 1023} {"train_loss": -10.911754608154297, "global_step": 171937, "epoch": 1023} {"train_loss": -11.156152725219727, "global_step": 171938, "epoch": 1023} {"train_loss": -11.251131057739258, "global_step": 171939, "epoch": 1023} {"train_loss": -10.97234058380127, "global_step": 171940, "epoch": 1023} {"train_loss": -10.825654029846191, "global_step": 171941, "epoch": 1023} {"train_loss": -11.112680435180664, "global_step": 171942, "epoch": 1023} {"train_loss": -11.055252075195312, "global_step": 171943, "epoch": 1023} {"train_loss": -11.191189765930176, "global_step": 171944, "epoch": 1023} {"train_loss": -11.129096984863281, "global_step": 171945, "epoch": 1023} {"train_loss": -11.191524505615234, "global_step": 171946, "epoch": 1023} {"train_loss": -10.864103317260742, "global_step": 171947, "epoch": 1023} {"train_loss": -11.067441940307617, "global_step": 171948, "epoch": 1023} {"train_loss": -11.150257110595703, "global_step": 171949, "epoch": 1023} {"train_loss": -11.294181823730469, "global_step": 171950, "epoch": 1023} {"train_loss": -11.226866722106934, "global_step": 171951, "epoch": 1023} {"train_loss": -11.199811935424805, "global_step": 171952, "epoch": 1023} {"train_loss": -11.29911994934082, "global_step": 171953, "epoch": 1023} {"train_loss": -10.915103912353516, "global_step": 171954, "epoch": 1023} {"train_loss": -11.19235610961914, "global_step": 171955, "epoch": 1023} {"train_loss": -11.098234176635742, "global_step": 171956, "epoch": 1023} {"train_loss": -11.153411865234375, "global_step": 171957, "epoch": 1023} {"train_loss": -11.035550117492676, "global_step": 171958, "epoch": 1023} {"train_loss": -11.127561569213867, "global_step": 171959, "epoch": 1023} {"train_loss": -11.06261920928955, "global_step": 171960, "epoch": 1023} {"train_loss": -10.836694717407227, "global_step": 171961, "epoch": 1023} {"train_loss": -11.015979766845703, "global_step": 171962, "epoch": 1023} {"train_loss": -10.896464347839355, "global_step": 171963, "epoch": 1023} {"train_loss": -11.2889986038208, "global_step": 171964, "epoch": 1023} {"train_loss": -10.995031356811523, "global_step": 171965, "epoch": 1023} {"train_loss": -11.119430541992188, "global_step": 171966, "epoch": 1023} {"train_loss": -10.90146255493164, "global_step": 171967, "epoch": 1023} {"train_loss": -11.179443359375, "global_step": 171968, "epoch": 1023} {"train_loss": -11.034340858459473, "global_step": 171969, "epoch": 1023} {"train_loss": -11.115859985351562, "global_step": 171970, "epoch": 1023} {"train_loss": -11.260213851928711, "global_step": 171971, "epoch": 1023} {"train_loss": -10.57127857208252, "global_step": 171972, "epoch": 1023} {"train_loss": -10.769256591796875, "global_step": 171973, "epoch": 1023} {"train_loss": -11.01051139831543, "global_step": 171974, "epoch": 1023} {"train_loss": -10.421491622924805, "global_step": 171975, "epoch": 1023} {"train_loss": -10.72054672241211, "global_step": 171976, "epoch": 1023} {"train_loss": -10.837187767028809, "global_step": 171977, "epoch": 1023} {"train_loss": -10.373302459716797, "global_step": 171978, "epoch": 1023} {"train_loss": -10.671422958374023, "global_step": 171979, "epoch": 1023} {"train_loss": -10.41391372680664, "global_step": 171980, "epoch": 1023} {"train_loss": -9.165247917175293, "global_step": 171981, "epoch": 1023} {"train_loss": -10.178367614746094, "global_step": 171982, "epoch": 1023} {"train_loss": -9.73353385925293, "global_step": 171983, "epoch": 1023} {"train_loss": -9.493703842163086, "global_step": 171984, "epoch": 1023} {"train_loss": -10.008326530456543, "global_step": 171985, "epoch": 1023} {"train_loss": -9.052366256713867, "global_step": 171986, "epoch": 1023} {"train_loss": -11.053424835205078, "global_step": 171987, "epoch": 1023} {"train_loss": -9.622337341308594, "global_step": 171988, "epoch": 1023} {"train_loss": -10.372650146484375, "global_step": 171989, "epoch": 1023} {"train_loss": -10.425064086914062, "global_step": 171990, "epoch": 1023} {"train_loss": -10.234708786010742, "global_step": 171991, "epoch": 1023} {"train_loss": -10.73960018157959, "global_step": 171992, "epoch": 1023} {"train_loss": -10.62257194519043, "global_step": 171993, "epoch": 1023} {"train_loss": -10.460393905639648, "global_step": 171994, "epoch": 1023} {"train_loss": -10.733948707580566, "global_step": 171995, "epoch": 1023} {"train_loss": -10.526211738586426, "global_step": 171996, "epoch": 1023} {"train_loss": -10.651298522949219, "global_step": 171997, "epoch": 1023} {"train_loss": -10.683845520019531, "global_step": 171998, "epoch": 1023} {"train_loss": -10.752708435058594, "global_step": 171999, "epoch": 1023} {"train_loss": -10.622811317443848, "global_step": 172000, "epoch": 1023} {"train_loss": -10.973884582519531, "global_step": 172001, "epoch": 1023} {"train_loss": -10.735150337219238, "global_step": 172002, "epoch": 1023} {"train_loss": -10.91754150390625, "global_step": 172003, "epoch": 1023} {"train_loss": -10.870025634765625, "global_step": 172004, "epoch": 1023} {"train_loss": -10.879928588867188, "global_step": 172005, "epoch": 1023} {"train_loss": -11.127918243408203, "global_step": 172006, "epoch": 1023} {"train_loss": -10.938179969787598, "global_step": 172007, "epoch": 1023} {"train_loss": -11.016603469848633, "global_step": 172008, "epoch": 1023} {"train_loss": -11.021186828613281, "global_step": 172009, "epoch": 1023} {"train_loss": -11.035402297973633, "global_step": 172010, "epoch": 1023} {"train_loss": -11.169034957885742, "global_step": 172011, "epoch": 1023} {"train_loss": -11.213129997253418, "global_step": 172012, "epoch": 1023} {"train_loss": -11.147438049316406, "global_step": 172013, "epoch": 1023} {"train_loss": -11.107196807861328, "global_step": 172014, "epoch": 1023} {"train_loss": -11.046245574951172, "global_step": 172015, "epoch": 1023} {"train_loss": -11.040938377380371, "global_step": 172016, "epoch": 1023} {"train_loss": -11.11806583404541, "global_step": 172017, "epoch": 1023} {"train_loss": -11.073134422302246, "global_step": 172018, "epoch": 1023} {"train_loss": -11.071638107299805, "global_step": 172019, "epoch": 1023} {"train_loss": -11.35599136352539, "global_step": 172020, "epoch": 1023} {"train_loss": -11.098949432373047, "global_step": 172021, "epoch": 1023} {"train_loss": -11.030734062194824, "global_step": 172022, "epoch": 1023} {"train_loss": -11.097790718078613, "global_step": 172023, "epoch": 1023} {"train_loss": -11.050657272338867, "global_step": 172024, "epoch": 1023} {"train_loss": -11.26500129699707, "global_step": 172025, "epoch": 1023} {"train_loss": -11.181640625, "global_step": 172026, "epoch": 1023} {"train_loss": -11.397970199584961, "global_step": 172027, "epoch": 1023} {"train_loss": -11.300386428833008, "global_step": 172028, "epoch": 1023} {"train_loss": -11.44064712524414, "global_step": 172029, "epoch": 1023} {"train_loss": -11.143891334533691, "global_step": 172030, "epoch": 1023} {"train_loss": -10.899880630629402, "global_step": 172031, "epoch": 1023, "val_loss": 241895.90625} {"train_loss": -11.217310905456543, "global_step": 172032, "epoch": 1024} {"train_loss": -11.222187995910645, "global_step": 172033, "epoch": 1024} {"train_loss": -11.228147506713867, "global_step": 172034, "epoch": 1024} {"train_loss": -11.122358322143555, "global_step": 172035, "epoch": 1024} {"train_loss": -11.277580261230469, "global_step": 172036, "epoch": 1024} {"train_loss": -11.085739135742188, "global_step": 172037, "epoch": 1024} {"train_loss": -11.507181167602539, "global_step": 172038, "epoch": 1024} {"train_loss": -10.988533020019531, "global_step": 172039, "epoch": 1024} {"train_loss": -11.32449722290039, "global_step": 172040, "epoch": 1024} {"train_loss": -11.413267135620117, "global_step": 172041, "epoch": 1024} {"train_loss": -11.241618156433105, "global_step": 172042, "epoch": 1024} {"train_loss": -11.367485046386719, "global_step": 172043, "epoch": 1024} {"train_loss": -11.380226135253906, "global_step": 172044, "epoch": 1024} {"train_loss": -11.451704025268555, "global_step": 172045, "epoch": 1024} {"train_loss": -11.499216079711914, "global_step": 172046, "epoch": 1024} {"train_loss": -11.091350555419922, "global_step": 172047, "epoch": 1024} {"train_loss": -11.147645950317383, "global_step": 172048, "epoch": 1024} {"train_loss": -11.36129379272461, "global_step": 172049, "epoch": 1024} {"train_loss": -11.417494773864746, "global_step": 172050, "epoch": 1024} {"train_loss": -11.27688980102539, "global_step": 172051, "epoch": 1024} {"train_loss": -11.277984619140625, "global_step": 172052, "epoch": 1024} {"train_loss": -10.94561767578125, "global_step": 172053, "epoch": 1024} {"train_loss": -11.45176887512207, "global_step": 172054, "epoch": 1024} {"train_loss": -10.333023071289062, "global_step": 172055, "epoch": 1024} {"train_loss": -11.204113006591797, "global_step": 172056, "epoch": 1024} {"train_loss": -10.97576904296875, "global_step": 172057, "epoch": 1024} {"train_loss": -10.6495361328125, "global_step": 172058, "epoch": 1024} {"train_loss": -11.30981731414795, "global_step": 172059, "epoch": 1024} {"train_loss": -11.060050964355469, "global_step": 172060, "epoch": 1024} {"train_loss": -10.377132415771484, "global_step": 172061, "epoch": 1024} {"train_loss": -11.171415328979492, "global_step": 172062, "epoch": 1024} {"train_loss": -11.490663528442383, "global_step": 172063, "epoch": 1024} {"train_loss": -11.030754089355469, "global_step": 172064, "epoch": 1024} {"train_loss": -10.942158699035645, "global_step": 172065, "epoch": 1024} {"train_loss": -11.411009788513184, "global_step": 172066, "epoch": 1024} {"train_loss": -10.611940383911133, "global_step": 172067, "epoch": 1024} {"train_loss": -11.242087364196777, "global_step": 172068, "epoch": 1024} {"train_loss": -11.148544311523438, "global_step": 172069, "epoch": 1024} {"train_loss": -11.001821517944336, "global_step": 172070, "epoch": 1024} {"train_loss": -11.162885665893555, "global_step": 172071, "epoch": 1024} {"train_loss": -11.185023307800293, "global_step": 172072, "epoch": 1024} {"train_loss": -10.37559700012207, "global_step": 172073, "epoch": 1024} {"train_loss": -10.346736907958984, "global_step": 172074, "epoch": 1024} {"train_loss": -11.05202579498291, "global_step": 172075, "epoch": 1024} {"train_loss": -10.483556747436523, "global_step": 172076, "epoch": 1024} {"train_loss": -11.251916885375977, "global_step": 172077, "epoch": 1024} {"train_loss": -10.188966751098633, "global_step": 172078, "epoch": 1024} {"train_loss": -10.546551704406738, "global_step": 172079, "epoch": 1024} {"train_loss": -10.739256858825684, "global_step": 172080, "epoch": 1024} {"train_loss": -10.075986862182617, "global_step": 172081, "epoch": 1024} {"train_loss": -10.60579776763916, "global_step": 172082, "epoch": 1024} {"train_loss": -10.520320892333984, "global_step": 172083, "epoch": 1024} {"train_loss": -10.581409454345703, "global_step": 172084, "epoch": 1024} {"train_loss": -10.753536224365234, "global_step": 172085, "epoch": 1024} {"train_loss": -10.031621932983398, "global_step": 172086, "epoch": 1024} {"train_loss": -10.510498046875, "global_step": 172087, "epoch": 1024} {"train_loss": -10.950596809387207, "global_step": 172088, "epoch": 1024} {"train_loss": -10.448902130126953, "global_step": 172089, "epoch": 1024} {"train_loss": -10.953693389892578, "global_step": 172090, "epoch": 1024} {"train_loss": -10.04417610168457, "global_step": 172091, "epoch": 1024} {"train_loss": -10.580825805664062, "global_step": 172092, "epoch": 1024} {"train_loss": -10.941394805908203, "global_step": 172093, "epoch": 1024} {"train_loss": -10.649087905883789, "global_step": 172094, "epoch": 1024} {"train_loss": -10.97347640991211, "global_step": 172095, "epoch": 1024} {"train_loss": -10.543343544006348, "global_step": 172096, "epoch": 1024} {"train_loss": -10.415874481201172, "global_step": 172097, "epoch": 1024} {"train_loss": -10.801246643066406, "global_step": 172098, "epoch": 1024} {"train_loss": -10.56148624420166, "global_step": 172099, "epoch": 1024} {"train_loss": -10.715932846069336, "global_step": 172100, "epoch": 1024} {"train_loss": -10.704538345336914, "global_step": 172101, "epoch": 1024} {"train_loss": -10.609674453735352, "global_step": 172102, "epoch": 1024} {"train_loss": -10.57598876953125, "global_step": 172103, "epoch": 1024} {"train_loss": -10.833176612854004, "global_step": 172104, "epoch": 1024} {"train_loss": -10.310686111450195, "global_step": 172105, "epoch": 1024} {"train_loss": -10.984562873840332, "global_step": 172106, "epoch": 1024} {"train_loss": -10.531240463256836, "global_step": 172107, "epoch": 1024} {"train_loss": -10.950114250183105, "global_step": 172108, "epoch": 1024} {"train_loss": -10.64189338684082, "global_step": 172109, "epoch": 1024} {"train_loss": -10.71446418762207, "global_step": 172110, "epoch": 1024} {"train_loss": -10.46904182434082, "global_step": 172111, "epoch": 1024} {"train_loss": -10.778854370117188, "global_step": 172112, "epoch": 1024} {"train_loss": -10.579780578613281, "global_step": 172113, "epoch": 1024} {"train_loss": -10.751904487609863, "global_step": 172114, "epoch": 1024} {"train_loss": -10.757684707641602, "global_step": 172115, "epoch": 1024} {"train_loss": -10.584589004516602, "global_step": 172116, "epoch": 1024} {"train_loss": -10.250713348388672, "global_step": 172117, "epoch": 1024} {"train_loss": -10.472541809082031, "global_step": 172118, "epoch": 1024} {"train_loss": -9.990371704101562, "global_step": 172119, "epoch": 1024} {"train_loss": -11.013885498046875, "global_step": 172120, "epoch": 1024} {"train_loss": -10.138511657714844, "global_step": 172121, "epoch": 1024} {"train_loss": -10.879369735717773, "global_step": 172122, "epoch": 1024} {"train_loss": -10.511054992675781, "global_step": 172123, "epoch": 1024} {"train_loss": -10.427436828613281, "global_step": 172124, "epoch": 1024} {"train_loss": -10.762828826904297, "global_step": 172125, "epoch": 1024} {"train_loss": -10.862356185913086, "global_step": 172126, "epoch": 1024} {"train_loss": -10.376405715942383, "global_step": 172127, "epoch": 1024} {"train_loss": -10.863420486450195, "global_step": 172128, "epoch": 1024} {"train_loss": -10.542624473571777, "global_step": 172129, "epoch": 1024} {"train_loss": -10.772475242614746, "global_step": 172130, "epoch": 1024} {"train_loss": -10.94129467010498, "global_step": 172131, "epoch": 1024} {"train_loss": -10.617731094360352, "global_step": 172132, "epoch": 1024} {"train_loss": -10.894158363342285, "global_step": 172133, "epoch": 1024} {"train_loss": -10.709354400634766, "global_step": 172134, "epoch": 1024} {"train_loss": -11.04443645477295, "global_step": 172135, "epoch": 1024} {"train_loss": -10.899871826171875, "global_step": 172136, "epoch": 1024} {"train_loss": -10.805000305175781, "global_step": 172137, "epoch": 1024} {"train_loss": -11.107610702514648, "global_step": 172138, "epoch": 1024} {"train_loss": -10.874950408935547, "global_step": 172139, "epoch": 1024} {"train_loss": -11.06760311126709, "global_step": 172140, "epoch": 1024} {"train_loss": -11.017502784729004, "global_step": 172141, "epoch": 1024} {"train_loss": -11.041898727416992, "global_step": 172142, "epoch": 1024} {"train_loss": -11.135732650756836, "global_step": 172143, "epoch": 1024} {"train_loss": -11.135658264160156, "global_step": 172144, "epoch": 1024} {"train_loss": -11.12736701965332, "global_step": 172145, "epoch": 1024} {"train_loss": -11.161489486694336, "global_step": 172146, "epoch": 1024} {"train_loss": -11.140047073364258, "global_step": 172147, "epoch": 1024} {"train_loss": -11.2565336227417, "global_step": 172148, "epoch": 1024} {"train_loss": -11.139825820922852, "global_step": 172149, "epoch": 1024} {"train_loss": -11.142568588256836, "global_step": 172150, "epoch": 1024} {"train_loss": -11.061623573303223, "global_step": 172151, "epoch": 1024} {"train_loss": -11.340859413146973, "global_step": 172152, "epoch": 1024} {"train_loss": -11.05645751953125, "global_step": 172153, "epoch": 1024} {"train_loss": -11.296220779418945, "global_step": 172154, "epoch": 1024} {"train_loss": -11.10290813446045, "global_step": 172155, "epoch": 1024} {"train_loss": -11.277438163757324, "global_step": 172156, "epoch": 1024} {"train_loss": -11.230676651000977, "global_step": 172157, "epoch": 1024} {"train_loss": -11.253458023071289, "global_step": 172158, "epoch": 1024} {"train_loss": -11.386077880859375, "global_step": 172159, "epoch": 1024} {"train_loss": -11.273499488830566, "global_step": 172160, "epoch": 1024} {"train_loss": -11.156393051147461, "global_step": 172161, "epoch": 1024} {"train_loss": -11.374409675598145, "global_step": 172162, "epoch": 1024} {"train_loss": -11.17300796508789, "global_step": 172163, "epoch": 1024} {"train_loss": -11.317798614501953, "global_step": 172164, "epoch": 1024} {"train_loss": -11.373760223388672, "global_step": 172165, "epoch": 1024} {"train_loss": -11.04511833190918, "global_step": 172166, "epoch": 1024} {"train_loss": -11.293232917785645, "global_step": 172167, "epoch": 1024} {"train_loss": -11.04454231262207, "global_step": 172168, "epoch": 1024} {"train_loss": -10.743391036987305, "global_step": 172169, "epoch": 1024} {"train_loss": -11.059690475463867, "global_step": 172170, "epoch": 1024} {"train_loss": -11.496953964233398, "global_step": 172171, "epoch": 1024} {"train_loss": -10.702917098999023, "global_step": 172172, "epoch": 1024} {"train_loss": -11.122138023376465, "global_step": 172173, "epoch": 1024} {"train_loss": -11.115644454956055, "global_step": 172174, "epoch": 1024} {"train_loss": -10.81411361694336, "global_step": 172175, "epoch": 1024} {"train_loss": -10.41688346862793, "global_step": 172176, "epoch": 1024} {"train_loss": -11.414957046508789, "global_step": 172177, "epoch": 1024} {"train_loss": -10.609624862670898, "global_step": 172178, "epoch": 1024} {"train_loss": -11.057502746582031, "global_step": 172179, "epoch": 1024} {"train_loss": -11.20966625213623, "global_step": 172180, "epoch": 1024} {"train_loss": -11.103704452514648, "global_step": 172181, "epoch": 1024} {"train_loss": -10.91091251373291, "global_step": 172182, "epoch": 1024} {"train_loss": -10.890233039855957, "global_step": 172183, "epoch": 1024} {"train_loss": -11.395721435546875, "global_step": 172184, "epoch": 1024} {"train_loss": -10.678008079528809, "global_step": 172185, "epoch": 1024} {"train_loss": -11.344812393188477, "global_step": 172186, "epoch": 1024} {"train_loss": -11.212132453918457, "global_step": 172187, "epoch": 1024} {"train_loss": -10.518905639648438, "global_step": 172188, "epoch": 1024} {"train_loss": -11.326419830322266, "global_step": 172189, "epoch": 1024} {"train_loss": -10.984746932983398, "global_step": 172190, "epoch": 1024} {"train_loss": -10.243227005004883, "global_step": 172191, "epoch": 1024} {"train_loss": -10.366745948791504, "global_step": 172192, "epoch": 1024} {"train_loss": -9.899551391601562, "global_step": 172193, "epoch": 1024} {"train_loss": -10.756957054138184, "global_step": 172194, "epoch": 1024} {"train_loss": -10.513187408447266, "global_step": 172195, "epoch": 1024} {"train_loss": -10.822050094604492, "global_step": 172196, "epoch": 1024} {"train_loss": -10.453372955322266, "global_step": 172197, "epoch": 1024} {"train_loss": -10.981138229370117, "global_step": 172198, "epoch": 1024} {"train_loss": -10.90554568313417, "global_step": 172199, "epoch": 1024, "val_loss": 242020.078125} {"train_loss": -10.797740936279297, "global_step": 172200, "epoch": 1025} {"train_loss": -10.59726333618164, "global_step": 172201, "epoch": 1025} {"train_loss": -10.700631141662598, "global_step": 172202, "epoch": 1025} {"train_loss": -10.55052375793457, "global_step": 172203, "epoch": 1025} {"train_loss": -10.72386360168457, "global_step": 172204, "epoch": 1025} {"train_loss": -10.538154602050781, "global_step": 172205, "epoch": 1025} {"train_loss": -11.08036994934082, "global_step": 172206, "epoch": 1025} {"train_loss": -10.941680908203125, "global_step": 172207, "epoch": 1025} {"train_loss": -10.76097297668457, "global_step": 172208, "epoch": 1025} {"train_loss": -10.854835510253906, "global_step": 172209, "epoch": 1025} {"train_loss": -10.615348815917969, "global_step": 172210, "epoch": 1025} {"train_loss": -11.219388961791992, "global_step": 172211, "epoch": 1025} {"train_loss": -10.936293601989746, "global_step": 172212, "epoch": 1025} {"train_loss": -11.070718765258789, "global_step": 172213, "epoch": 1025} {"train_loss": -10.945602416992188, "global_step": 172214, "epoch": 1025} {"train_loss": -11.134382247924805, "global_step": 172215, "epoch": 1025} {"train_loss": -11.078667640686035, "global_step": 172216, "epoch": 1025} {"train_loss": -10.948299407958984, "global_step": 172217, "epoch": 1025} {"train_loss": -11.004612922668457, "global_step": 172218, "epoch": 1025} {"train_loss": -11.180337905883789, "global_step": 172219, "epoch": 1025} {"train_loss": -11.021560668945312, "global_step": 172220, "epoch": 1025} {"train_loss": -10.856267929077148, "global_step": 172221, "epoch": 1025} {"train_loss": -10.71059799194336, "global_step": 172222, "epoch": 1025} {"train_loss": -11.25350570678711, "global_step": 172223, "epoch": 1025} {"train_loss": -10.787979125976562, "global_step": 172224, "epoch": 1025} {"train_loss": -11.23243522644043, "global_step": 172225, "epoch": 1025} {"train_loss": -11.219156265258789, "global_step": 172226, "epoch": 1025} {"train_loss": -11.118240356445312, "global_step": 172227, "epoch": 1025} {"train_loss": -11.29517936706543, "global_step": 172228, "epoch": 1025} {"train_loss": -11.16147232055664, "global_step": 172229, "epoch": 1025} {"train_loss": -11.408809661865234, "global_step": 172230, "epoch": 1025} {"train_loss": -11.381508827209473, "global_step": 172231, "epoch": 1025} {"train_loss": -11.060577392578125, "global_step": 172232, "epoch": 1025} {"train_loss": -11.240453720092773, "global_step": 172233, "epoch": 1025} {"train_loss": -11.1695556640625, "global_step": 172234, "epoch": 1025} {"train_loss": -11.254833221435547, "global_step": 172235, "epoch": 1025} {"train_loss": -11.252703666687012, "global_step": 172236, "epoch": 1025} {"train_loss": -11.22107219696045, "global_step": 172237, "epoch": 1025} {"train_loss": -11.137375831604004, "global_step": 172238, "epoch": 1025} {"train_loss": -11.045188903808594, "global_step": 172239, "epoch": 1025} {"train_loss": -11.306739807128906, "global_step": 172240, "epoch": 1025} {"train_loss": -11.428775787353516, "global_step": 172241, "epoch": 1025} {"train_loss": -11.244707107543945, "global_step": 172242, "epoch": 1025} {"train_loss": -11.39004135131836, "global_step": 172243, "epoch": 1025} {"train_loss": -11.199508666992188, "global_step": 172244, "epoch": 1025} {"train_loss": -11.432585716247559, "global_step": 172245, "epoch": 1025} {"train_loss": -11.270238876342773, "global_step": 172246, "epoch": 1025} {"train_loss": -11.23794937133789, "global_step": 172247, "epoch": 1025} {"train_loss": -11.01289176940918, "global_step": 172248, "epoch": 1025} {"train_loss": -11.455012321472168, "global_step": 172249, "epoch": 1025} {"train_loss": -11.42934513092041, "global_step": 172250, "epoch": 1025} {"train_loss": -11.50029182434082, "global_step": 172251, "epoch": 1025} {"train_loss": -11.459434509277344, "global_step": 172252, "epoch": 1025} {"train_loss": -11.467920303344727, "global_step": 172253, "epoch": 1025} {"train_loss": -11.283613204956055, "global_step": 172254, "epoch": 1025} {"train_loss": -11.262428283691406, "global_step": 172255, "epoch": 1025} {"train_loss": -11.330676078796387, "global_step": 172256, "epoch": 1025} {"train_loss": -11.364351272583008, "global_step": 172257, "epoch": 1025} {"train_loss": -11.226127624511719, "global_step": 172258, "epoch": 1025} {"train_loss": -10.940498352050781, "global_step": 172259, "epoch": 1025} {"train_loss": -11.38455581665039, "global_step": 172260, "epoch": 1025} {"train_loss": -11.237509727478027, "global_step": 172261, "epoch": 1025} {"train_loss": -11.20463752746582, "global_step": 172262, "epoch": 1025} {"train_loss": -11.374247550964355, "global_step": 172263, "epoch": 1025} {"train_loss": -11.231792449951172, "global_step": 172264, "epoch": 1025} {"train_loss": -11.198736190795898, "global_step": 172265, "epoch": 1025} {"train_loss": -11.306058883666992, "global_step": 172266, "epoch": 1025} {"train_loss": -11.35557746887207, "global_step": 172267, "epoch": 1025} {"train_loss": -11.191611289978027, "global_step": 172268, "epoch": 1025} {"train_loss": -10.863481521606445, "global_step": 172269, "epoch": 1025} {"train_loss": -10.616865158081055, "global_step": 172270, "epoch": 1025} {"train_loss": -10.969572067260742, "global_step": 172271, "epoch": 1025} {"train_loss": -10.767559051513672, "global_step": 172272, "epoch": 1025} {"train_loss": -10.738588333129883, "global_step": 172273, "epoch": 1025} {"train_loss": -9.64065170288086, "global_step": 172274, "epoch": 1025} {"train_loss": -9.727376937866211, "global_step": 172275, "epoch": 1025} {"train_loss": -9.141096115112305, "global_step": 172276, "epoch": 1025} {"train_loss": -9.411337852478027, "global_step": 172277, "epoch": 1025} {"train_loss": -10.66363525390625, "global_step": 172278, "epoch": 1025} {"train_loss": -9.204480171203613, "global_step": 172279, "epoch": 1025} {"train_loss": -10.595829010009766, "global_step": 172280, "epoch": 1025} {"train_loss": -9.22799301147461, "global_step": 172281, "epoch": 1025} {"train_loss": -10.51573371887207, "global_step": 172282, "epoch": 1025} {"train_loss": -10.263656616210938, "global_step": 172283, "epoch": 1025} {"train_loss": -10.144990921020508, "global_step": 172284, "epoch": 1025} {"train_loss": -10.588411331176758, "global_step": 172285, "epoch": 1025} {"train_loss": -10.29327392578125, "global_step": 172286, "epoch": 1025} {"train_loss": -10.833476066589355, "global_step": 172287, "epoch": 1025} {"train_loss": -10.298928260803223, "global_step": 172288, "epoch": 1025} {"train_loss": -10.68905258178711, "global_step": 172289, "epoch": 1025} {"train_loss": -10.39776611328125, "global_step": 172290, "epoch": 1025} {"train_loss": -10.781664848327637, "global_step": 172291, "epoch": 1025} {"train_loss": -10.880985260009766, "global_step": 172292, "epoch": 1025} {"train_loss": -10.501264572143555, "global_step": 172293, "epoch": 1025} {"train_loss": -10.754350662231445, "global_step": 172294, "epoch": 1025} {"train_loss": -10.859382629394531, "global_step": 172295, "epoch": 1025} {"train_loss": -10.728165626525879, "global_step": 172296, "epoch": 1025} {"train_loss": -11.110260009765625, "global_step": 172297, "epoch": 1025} {"train_loss": -10.66680908203125, "global_step": 172298, "epoch": 1025} {"train_loss": -10.857187271118164, "global_step": 172299, "epoch": 1025} {"train_loss": -11.051788330078125, "global_step": 172300, "epoch": 1025} {"train_loss": -10.828189849853516, "global_step": 172301, "epoch": 1025} {"train_loss": -11.252274513244629, "global_step": 172302, "epoch": 1025} {"train_loss": -11.04399299621582, "global_step": 172303, "epoch": 1025} {"train_loss": -10.939903259277344, "global_step": 172304, "epoch": 1025} {"train_loss": -10.941463470458984, "global_step": 172305, "epoch": 1025} {"train_loss": -11.091649055480957, "global_step": 172306, "epoch": 1025} {"train_loss": -11.138886451721191, "global_step": 172307, "epoch": 1025} {"train_loss": -10.998501777648926, "global_step": 172308, "epoch": 1025} {"train_loss": -11.151838302612305, "global_step": 172309, "epoch": 1025} {"train_loss": -11.267531394958496, "global_step": 172310, "epoch": 1025} {"train_loss": -10.965619087219238, "global_step": 172311, "epoch": 1025} {"train_loss": -11.038543701171875, "global_step": 172312, "epoch": 1025} {"train_loss": -11.262088775634766, "global_step": 172313, "epoch": 1025} {"train_loss": -11.056095123291016, "global_step": 172314, "epoch": 1025} {"train_loss": -11.079710006713867, "global_step": 172315, "epoch": 1025} {"train_loss": -10.975117683410645, "global_step": 172316, "epoch": 1025} {"train_loss": -11.184026718139648, "global_step": 172317, "epoch": 1025} {"train_loss": -11.24950122833252, "global_step": 172318, "epoch": 1025} {"train_loss": -11.178752899169922, "global_step": 172319, "epoch": 1025} {"train_loss": -10.948314666748047, "global_step": 172320, "epoch": 1025} {"train_loss": -11.281867027282715, "global_step": 172321, "epoch": 1025} {"train_loss": -11.242376327514648, "global_step": 172322, "epoch": 1025} {"train_loss": -11.158241271972656, "global_step": 172323, "epoch": 1025} {"train_loss": -11.298734664916992, "global_step": 172324, "epoch": 1025} {"train_loss": -11.22063159942627, "global_step": 172325, "epoch": 1025} {"train_loss": -11.328418731689453, "global_step": 172326, "epoch": 1025} {"train_loss": -11.486377716064453, "global_step": 172327, "epoch": 1025} {"train_loss": -11.290852546691895, "global_step": 172328, "epoch": 1025} {"train_loss": -11.228240966796875, "global_step": 172329, "epoch": 1025} {"train_loss": -11.331904411315918, "global_step": 172330, "epoch": 1025} {"train_loss": -11.312881469726562, "global_step": 172331, "epoch": 1025} {"train_loss": -11.276817321777344, "global_step": 172332, "epoch": 1025} {"train_loss": -11.339630126953125, "global_step": 172333, "epoch": 1025} {"train_loss": -11.4483060836792, "global_step": 172334, "epoch": 1025} {"train_loss": -11.504977226257324, "global_step": 172335, "epoch": 1025} {"train_loss": -11.36636734008789, "global_step": 172336, "epoch": 1025} {"train_loss": -11.307555198669434, "global_step": 172337, "epoch": 1025} {"train_loss": -11.494559288024902, "global_step": 172338, "epoch": 1025} {"train_loss": -11.269554138183594, "global_step": 172339, "epoch": 1025} {"train_loss": -11.09072494506836, "global_step": 172340, "epoch": 1025} {"train_loss": -10.921592712402344, "global_step": 172341, "epoch": 1025} {"train_loss": -11.041389465332031, "global_step": 172342, "epoch": 1025} {"train_loss": -11.2252779006958, "global_step": 172343, "epoch": 1025} {"train_loss": -11.303380966186523, "global_step": 172344, "epoch": 1025} {"train_loss": -10.715747833251953, "global_step": 172345, "epoch": 1025} {"train_loss": -10.727714538574219, "global_step": 172346, "epoch": 1025} {"train_loss": -11.014713287353516, "global_step": 172347, "epoch": 1025} {"train_loss": -10.923213958740234, "global_step": 172348, "epoch": 1025} {"train_loss": -10.609075546264648, "global_step": 172349, "epoch": 1025} {"train_loss": -10.54509162902832, "global_step": 172350, "epoch": 1025} {"train_loss": -11.22281551361084, "global_step": 172351, "epoch": 1025} {"train_loss": -10.742170333862305, "global_step": 172352, "epoch": 1025} {"train_loss": -10.818916320800781, "global_step": 172353, "epoch": 1025} {"train_loss": -10.837404251098633, "global_step": 172354, "epoch": 1025} {"train_loss": -10.638811111450195, "global_step": 172355, "epoch": 1025} {"train_loss": -10.399995803833008, "global_step": 172356, "epoch": 1025} {"train_loss": -11.43327522277832, "global_step": 172357, "epoch": 1025} {"train_loss": -11.222214698791504, "global_step": 172358, "epoch": 1025} {"train_loss": -11.355348587036133, "global_step": 172359, "epoch": 1025} {"train_loss": -11.262075424194336, "global_step": 172360, "epoch": 1025} {"train_loss": -10.970512390136719, "global_step": 172361, "epoch": 1025} {"train_loss": -11.239044189453125, "global_step": 172362, "epoch": 1025} {"train_loss": -10.976619720458984, "global_step": 172363, "epoch": 1025} {"train_loss": -11.13254451751709, "global_step": 172364, "epoch": 1025} {"train_loss": -11.057769775390625, "global_step": 172365, "epoch": 1025} {"train_loss": -10.304279327392578, "global_step": 172366, "epoch": 1025} {"train_loss": -10.983822816894168, "global_step": 172367, "epoch": 1025, "val_loss": 240930.578125, "train_action_mse_error": 1.4054689407348633} {"train_loss": -10.84853458404541, "global_step": 172368, "epoch": 1026} {"train_loss": -10.141962051391602, "global_step": 172369, "epoch": 1026} {"train_loss": -11.073433876037598, "global_step": 172370, "epoch": 1026} {"train_loss": -10.559648513793945, "global_step": 172371, "epoch": 1026} {"train_loss": -10.707738876342773, "global_step": 172372, "epoch": 1026} {"train_loss": -10.746971130371094, "global_step": 172373, "epoch": 1026} {"train_loss": -10.370588302612305, "global_step": 172374, "epoch": 1026} {"train_loss": -11.058351516723633, "global_step": 172375, "epoch": 1026} {"train_loss": -10.735727310180664, "global_step": 172376, "epoch": 1026} {"train_loss": -11.02026653289795, "global_step": 172377, "epoch": 1026} {"train_loss": -10.788710594177246, "global_step": 172378, "epoch": 1026} {"train_loss": -11.152266502380371, "global_step": 172379, "epoch": 1026} {"train_loss": -10.599750518798828, "global_step": 172380, "epoch": 1026} {"train_loss": -10.98449420928955, "global_step": 172381, "epoch": 1026} {"train_loss": -10.98421573638916, "global_step": 172382, "epoch": 1026} {"train_loss": -11.07210636138916, "global_step": 172383, "epoch": 1026} {"train_loss": -10.713705062866211, "global_step": 172384, "epoch": 1026} {"train_loss": -10.594955444335938, "global_step": 172385, "epoch": 1026} {"train_loss": -10.69677734375, "global_step": 172386, "epoch": 1026} {"train_loss": -10.677249908447266, "global_step": 172387, "epoch": 1026} {"train_loss": -10.40981674194336, "global_step": 172388, "epoch": 1026} {"train_loss": -11.030205726623535, "global_step": 172389, "epoch": 1026} {"train_loss": -10.880393981933594, "global_step": 172390, "epoch": 1026} {"train_loss": -10.856806755065918, "global_step": 172391, "epoch": 1026} {"train_loss": -11.284767150878906, "global_step": 172392, "epoch": 1026} {"train_loss": -10.755485534667969, "global_step": 172393, "epoch": 1026} {"train_loss": -11.049718856811523, "global_step": 172394, "epoch": 1026} {"train_loss": -11.408490180969238, "global_step": 172395, "epoch": 1026} {"train_loss": -11.050613403320312, "global_step": 172396, "epoch": 1026} {"train_loss": -10.790628433227539, "global_step": 172397, "epoch": 1026} {"train_loss": -10.861093521118164, "global_step": 172398, "epoch": 1026} {"train_loss": -10.672739028930664, "global_step": 172399, "epoch": 1026} {"train_loss": -10.994476318359375, "global_step": 172400, "epoch": 1026} {"train_loss": -10.824254989624023, "global_step": 172401, "epoch": 1026} {"train_loss": -11.001222610473633, "global_step": 172402, "epoch": 1026} {"train_loss": -10.844171524047852, "global_step": 172403, "epoch": 1026} {"train_loss": -10.84595012664795, "global_step": 172404, "epoch": 1026} {"train_loss": -11.088940620422363, "global_step": 172405, "epoch": 1026} {"train_loss": -11.061487197875977, "global_step": 172406, "epoch": 1026} {"train_loss": -11.004414558410645, "global_step": 172407, "epoch": 1026} {"train_loss": -11.224550247192383, "global_step": 172408, "epoch": 1026} {"train_loss": -10.807636260986328, "global_step": 172409, "epoch": 1026} {"train_loss": -11.309732437133789, "global_step": 172410, "epoch": 1026} {"train_loss": -11.218058586120605, "global_step": 172411, "epoch": 1026} {"train_loss": -10.950867652893066, "global_step": 172412, "epoch": 1026} {"train_loss": -11.477132797241211, "global_step": 172413, "epoch": 1026} {"train_loss": -11.25074577331543, "global_step": 172414, "epoch": 1026} {"train_loss": -11.326108932495117, "global_step": 172415, "epoch": 1026} {"train_loss": -11.306270599365234, "global_step": 172416, "epoch": 1026} {"train_loss": -11.027780532836914, "global_step": 172417, "epoch": 1026} {"train_loss": -11.320883750915527, "global_step": 172418, "epoch": 1026} {"train_loss": -11.214824676513672, "global_step": 172419, "epoch": 1026} {"train_loss": -10.937149047851562, "global_step": 172420, "epoch": 1026} {"train_loss": -11.311140060424805, "global_step": 172421, "epoch": 1026} {"train_loss": -11.25374984741211, "global_step": 172422, "epoch": 1026} {"train_loss": -11.11916732788086, "global_step": 172423, "epoch": 1026} {"train_loss": -11.34429931640625, "global_step": 172424, "epoch": 1026} {"train_loss": -11.544729232788086, "global_step": 172425, "epoch": 1026} {"train_loss": -11.039041519165039, "global_step": 172426, "epoch": 1026} {"train_loss": -11.34251594543457, "global_step": 172427, "epoch": 1026} {"train_loss": -11.366528511047363, "global_step": 172428, "epoch": 1026} {"train_loss": -11.269454956054688, "global_step": 172429, "epoch": 1026} {"train_loss": -11.181624412536621, "global_step": 172430, "epoch": 1026} {"train_loss": -11.109969139099121, "global_step": 172431, "epoch": 1026} {"train_loss": -10.55415153503418, "global_step": 172432, "epoch": 1026} {"train_loss": -11.133627891540527, "global_step": 172433, "epoch": 1026} {"train_loss": -10.57684326171875, "global_step": 172434, "epoch": 1026} {"train_loss": -10.945959091186523, "global_step": 172435, "epoch": 1026} {"train_loss": -11.344964027404785, "global_step": 172436, "epoch": 1026} {"train_loss": -11.139581680297852, "global_step": 172437, "epoch": 1026} {"train_loss": -11.158796310424805, "global_step": 172438, "epoch": 1026} {"train_loss": -11.177919387817383, "global_step": 172439, "epoch": 1026} {"train_loss": -11.539056777954102, "global_step": 172440, "epoch": 1026} {"train_loss": -11.448458671569824, "global_step": 172441, "epoch": 1026} {"train_loss": -11.170387268066406, "global_step": 172442, "epoch": 1026} {"train_loss": -11.340961456298828, "global_step": 172443, "epoch": 1026} {"train_loss": -10.89807415008545, "global_step": 172444, "epoch": 1026} {"train_loss": -10.345259666442871, "global_step": 172445, "epoch": 1026} {"train_loss": -11.373411178588867, "global_step": 172446, "epoch": 1026} {"train_loss": -10.809347152709961, "global_step": 172447, "epoch": 1026} {"train_loss": -10.429679870605469, "global_step": 172448, "epoch": 1026} {"train_loss": -11.161497116088867, "global_step": 172449, "epoch": 1026} {"train_loss": -10.893747329711914, "global_step": 172450, "epoch": 1026} {"train_loss": -10.721733093261719, "global_step": 172451, "epoch": 1026} {"train_loss": -11.178544998168945, "global_step": 172452, "epoch": 1026} {"train_loss": -11.266095161437988, "global_step": 172453, "epoch": 1026} {"train_loss": -11.1600923538208, "global_step": 172454, "epoch": 1026} {"train_loss": -11.124481201171875, "global_step": 172455, "epoch": 1026} {"train_loss": -10.976917266845703, "global_step": 172456, "epoch": 1026} {"train_loss": -11.184075355529785, "global_step": 172457, "epoch": 1026} {"train_loss": -11.302742004394531, "global_step": 172458, "epoch": 1026} {"train_loss": -10.997882843017578, "global_step": 172459, "epoch": 1026} {"train_loss": -11.137380599975586, "global_step": 172460, "epoch": 1026} {"train_loss": -10.64093017578125, "global_step": 172461, "epoch": 1026} {"train_loss": -11.260932922363281, "global_step": 172462, "epoch": 1026} {"train_loss": -10.072917938232422, "global_step": 172463, "epoch": 1026} {"train_loss": -10.732932090759277, "global_step": 172464, "epoch": 1026} {"train_loss": -10.735611915588379, "global_step": 172465, "epoch": 1026} {"train_loss": -10.938117980957031, "global_step": 172466, "epoch": 1026} {"train_loss": -10.324935913085938, "global_step": 172467, "epoch": 1026} {"train_loss": -10.978153228759766, "global_step": 172468, "epoch": 1026} {"train_loss": -10.100370407104492, "global_step": 172469, "epoch": 1026} {"train_loss": -10.730066299438477, "global_step": 172470, "epoch": 1026} {"train_loss": -10.92097282409668, "global_step": 172471, "epoch": 1026} {"train_loss": -10.476654052734375, "global_step": 172472, "epoch": 1026} {"train_loss": -11.324975967407227, "global_step": 172473, "epoch": 1026} {"train_loss": -10.86559772491455, "global_step": 172474, "epoch": 1026} {"train_loss": -10.763761520385742, "global_step": 172475, "epoch": 1026} {"train_loss": -10.746797561645508, "global_step": 172476, "epoch": 1026} {"train_loss": -11.015932083129883, "global_step": 172477, "epoch": 1026} {"train_loss": -11.169635772705078, "global_step": 172478, "epoch": 1026} {"train_loss": -10.786855697631836, "global_step": 172479, "epoch": 1026} {"train_loss": -10.959410667419434, "global_step": 172480, "epoch": 1026} {"train_loss": -10.959724426269531, "global_step": 172481, "epoch": 1026} {"train_loss": -11.427103042602539, "global_step": 172482, "epoch": 1026} {"train_loss": -11.092702865600586, "global_step": 172483, "epoch": 1026} {"train_loss": -11.373538970947266, "global_step": 172484, "epoch": 1026} {"train_loss": -11.118490219116211, "global_step": 172485, "epoch": 1026} {"train_loss": -11.23326587677002, "global_step": 172486, "epoch": 1026} {"train_loss": -11.102184295654297, "global_step": 172487, "epoch": 1026} {"train_loss": -11.069580078125, "global_step": 172488, "epoch": 1026} {"train_loss": -11.31533432006836, "global_step": 172489, "epoch": 1026} {"train_loss": -10.874687194824219, "global_step": 172490, "epoch": 1026} {"train_loss": -11.384804725646973, "global_step": 172491, "epoch": 1026} {"train_loss": -11.048069953918457, "global_step": 172492, "epoch": 1026} {"train_loss": -11.07573413848877, "global_step": 172493, "epoch": 1026} {"train_loss": -11.037306785583496, "global_step": 172494, "epoch": 1026} {"train_loss": -11.016826629638672, "global_step": 172495, "epoch": 1026} {"train_loss": -11.067461013793945, "global_step": 172496, "epoch": 1026} {"train_loss": -10.942331314086914, "global_step": 172497, "epoch": 1026} {"train_loss": -10.819671630859375, "global_step": 172498, "epoch": 1026} {"train_loss": -10.717719078063965, "global_step": 172499, "epoch": 1026} {"train_loss": -11.035123825073242, "global_step": 172500, "epoch": 1026} {"train_loss": -10.802820205688477, "global_step": 172501, "epoch": 1026} {"train_loss": -10.543703079223633, "global_step": 172502, "epoch": 1026} {"train_loss": -10.972393035888672, "global_step": 172503, "epoch": 1026} {"train_loss": -10.632356643676758, "global_step": 172504, "epoch": 1026} {"train_loss": -10.913545608520508, "global_step": 172505, "epoch": 1026} {"train_loss": -10.97146224975586, "global_step": 172506, "epoch": 1026} {"train_loss": -10.545125007629395, "global_step": 172507, "epoch": 1026} {"train_loss": -11.074604034423828, "global_step": 172508, "epoch": 1026} {"train_loss": -10.837047576904297, "global_step": 172509, "epoch": 1026} {"train_loss": -11.053651809692383, "global_step": 172510, "epoch": 1026} {"train_loss": -11.078628540039062, "global_step": 172511, "epoch": 1026} {"train_loss": -10.075550079345703, "global_step": 172512, "epoch": 1026} {"train_loss": -11.052413940429688, "global_step": 172513, "epoch": 1026} {"train_loss": -10.736778259277344, "global_step": 172514, "epoch": 1026} {"train_loss": -10.999749183654785, "global_step": 172515, "epoch": 1026} {"train_loss": -10.935011863708496, "global_step": 172516, "epoch": 1026} {"train_loss": -10.968846321105957, "global_step": 172517, "epoch": 1026} {"train_loss": -11.06537914276123, "global_step": 172518, "epoch": 1026} {"train_loss": -10.886823654174805, "global_step": 172519, "epoch": 1026} {"train_loss": -11.13172721862793, "global_step": 172520, "epoch": 1026} {"train_loss": -10.902650833129883, "global_step": 172521, "epoch": 1026} {"train_loss": -11.136234283447266, "global_step": 172522, "epoch": 1026} {"train_loss": -11.030290603637695, "global_step": 172523, "epoch": 1026} {"train_loss": -11.141387939453125, "global_step": 172524, "epoch": 1026} {"train_loss": -10.611934661865234, "global_step": 172525, "epoch": 1026} {"train_loss": -11.30640983581543, "global_step": 172526, "epoch": 1026} {"train_loss": -11.216796875, "global_step": 172527, "epoch": 1026} {"train_loss": -10.957569122314453, "global_step": 172528, "epoch": 1026} {"train_loss": -11.337373733520508, "global_step": 172529, "epoch": 1026} {"train_loss": -11.087711334228516, "global_step": 172530, "epoch": 1026} {"train_loss": -11.330764770507812, "global_step": 172531, "epoch": 1026} {"train_loss": -11.304956436157227, "global_step": 172532, "epoch": 1026} {"train_loss": -11.38237190246582, "global_step": 172533, "epoch": 1026} {"train_loss": -11.060648918151855, "global_step": 172534, "epoch": 1026} {"train_loss": -10.985026115462894, "global_step": 172535, "epoch": 1026, "val_loss": 243527.359375} {"train_loss": -11.138742446899414, "global_step": 172536, "epoch": 1027} {"train_loss": -11.316605567932129, "global_step": 172537, "epoch": 1027} {"train_loss": -11.223348617553711, "global_step": 172538, "epoch": 1027} {"train_loss": -11.131985664367676, "global_step": 172539, "epoch": 1027} {"train_loss": -11.153564453125, "global_step": 172540, "epoch": 1027} {"train_loss": -11.310797691345215, "global_step": 172541, "epoch": 1027} {"train_loss": -10.95097541809082, "global_step": 172542, "epoch": 1027} {"train_loss": -11.275815963745117, "global_step": 172543, "epoch": 1027} {"train_loss": -11.141769409179688, "global_step": 172544, "epoch": 1027} {"train_loss": -11.27546501159668, "global_step": 172545, "epoch": 1027} {"train_loss": -11.075075149536133, "global_step": 172546, "epoch": 1027} {"train_loss": -11.327095985412598, "global_step": 172547, "epoch": 1027} {"train_loss": -11.18655014038086, "global_step": 172548, "epoch": 1027} {"train_loss": -10.979244232177734, "global_step": 172549, "epoch": 1027} {"train_loss": -11.068981170654297, "global_step": 172550, "epoch": 1027} {"train_loss": -10.807442665100098, "global_step": 172551, "epoch": 1027} {"train_loss": -10.311946868896484, "global_step": 172552, "epoch": 1027} {"train_loss": -10.679914474487305, "global_step": 172553, "epoch": 1027} {"train_loss": -10.292951583862305, "global_step": 172554, "epoch": 1027} {"train_loss": -10.884950637817383, "global_step": 172555, "epoch": 1027} {"train_loss": -10.871091842651367, "global_step": 172556, "epoch": 1027} {"train_loss": -10.847094535827637, "global_step": 172557, "epoch": 1027} {"train_loss": -10.891085624694824, "global_step": 172558, "epoch": 1027} {"train_loss": -10.77918815612793, "global_step": 172559, "epoch": 1027} {"train_loss": -10.967704772949219, "global_step": 172560, "epoch": 1027} {"train_loss": -10.908716201782227, "global_step": 172561, "epoch": 1027} {"train_loss": -11.09019660949707, "global_step": 172562, "epoch": 1027} {"train_loss": -11.163064956665039, "global_step": 172563, "epoch": 1027} {"train_loss": -10.938804626464844, "global_step": 172564, "epoch": 1027} {"train_loss": -11.15446662902832, "global_step": 172565, "epoch": 1027} {"train_loss": -10.957966804504395, "global_step": 172566, "epoch": 1027} {"train_loss": -10.755107879638672, "global_step": 172567, "epoch": 1027} {"train_loss": -10.600296020507812, "global_step": 172568, "epoch": 1027} {"train_loss": -10.842022895812988, "global_step": 172569, "epoch": 1027} {"train_loss": -11.044468879699707, "global_step": 172570, "epoch": 1027} {"train_loss": -10.868183135986328, "global_step": 172571, "epoch": 1027} {"train_loss": -10.932575225830078, "global_step": 172572, "epoch": 1027} {"train_loss": -10.750941276550293, "global_step": 172573, "epoch": 1027} {"train_loss": -10.811811447143555, "global_step": 172574, "epoch": 1027} {"train_loss": -10.476346015930176, "global_step": 172575, "epoch": 1027} {"train_loss": -10.952936172485352, "global_step": 172576, "epoch": 1027} {"train_loss": -10.47086238861084, "global_step": 172577, "epoch": 1027} {"train_loss": -11.107912063598633, "global_step": 172578, "epoch": 1027} {"train_loss": -10.806953430175781, "global_step": 172579, "epoch": 1027} {"train_loss": -11.018928527832031, "global_step": 172580, "epoch": 1027} {"train_loss": -10.985240936279297, "global_step": 172581, "epoch": 1027} {"train_loss": -10.968422889709473, "global_step": 172582, "epoch": 1027} {"train_loss": -11.223334312438965, "global_step": 172583, "epoch": 1027} {"train_loss": -10.931087493896484, "global_step": 172584, "epoch": 1027} {"train_loss": -10.785778999328613, "global_step": 172585, "epoch": 1027} {"train_loss": -10.846871376037598, "global_step": 172586, "epoch": 1027} {"train_loss": -11.23057746887207, "global_step": 172587, "epoch": 1027} {"train_loss": -10.822660446166992, "global_step": 172588, "epoch": 1027} {"train_loss": -11.006795883178711, "global_step": 172589, "epoch": 1027} {"train_loss": -10.967307090759277, "global_step": 172590, "epoch": 1027} {"train_loss": -10.76768684387207, "global_step": 172591, "epoch": 1027} {"train_loss": -11.408792495727539, "global_step": 172592, "epoch": 1027} {"train_loss": -10.72256851196289, "global_step": 172593, "epoch": 1027} {"train_loss": -11.240474700927734, "global_step": 172594, "epoch": 1027} {"train_loss": -11.004058837890625, "global_step": 172595, "epoch": 1027} {"train_loss": -11.101836204528809, "global_step": 172596, "epoch": 1027} {"train_loss": -11.07608699798584, "global_step": 172597, "epoch": 1027} {"train_loss": -11.095161437988281, "global_step": 172598, "epoch": 1027} {"train_loss": -11.179515838623047, "global_step": 172599, "epoch": 1027} {"train_loss": -10.639589309692383, "global_step": 172600, "epoch": 1027} {"train_loss": -11.14750862121582, "global_step": 172601, "epoch": 1027} {"train_loss": -11.13090991973877, "global_step": 172602, "epoch": 1027} {"train_loss": -11.068870544433594, "global_step": 172603, "epoch": 1027} {"train_loss": -10.541736602783203, "global_step": 172604, "epoch": 1027} {"train_loss": -11.127547264099121, "global_step": 172605, "epoch": 1027} {"train_loss": -10.912739753723145, "global_step": 172606, "epoch": 1027} {"train_loss": -11.09534740447998, "global_step": 172607, "epoch": 1027} {"train_loss": -11.038724899291992, "global_step": 172608, "epoch": 1027} {"train_loss": -11.065300941467285, "global_step": 172609, "epoch": 1027} {"train_loss": -11.067583084106445, "global_step": 172610, "epoch": 1027} {"train_loss": -10.913394927978516, "global_step": 172611, "epoch": 1027} {"train_loss": -10.98686695098877, "global_step": 172612, "epoch": 1027} {"train_loss": -11.202071189880371, "global_step": 172613, "epoch": 1027} {"train_loss": -11.304471969604492, "global_step": 172614, "epoch": 1027} {"train_loss": -10.957869529724121, "global_step": 172615, "epoch": 1027} {"train_loss": -11.307430267333984, "global_step": 172616, "epoch": 1027} {"train_loss": -11.20361614227295, "global_step": 172617, "epoch": 1027} {"train_loss": -11.183837890625, "global_step": 172618, "epoch": 1027} {"train_loss": -11.13105583190918, "global_step": 172619, "epoch": 1027} {"train_loss": -11.077641487121582, "global_step": 172620, "epoch": 1027} {"train_loss": -11.012381553649902, "global_step": 172621, "epoch": 1027} {"train_loss": -11.174505233764648, "global_step": 172622, "epoch": 1027} {"train_loss": -10.857553482055664, "global_step": 172623, "epoch": 1027} {"train_loss": -10.929068565368652, "global_step": 172624, "epoch": 1027} {"train_loss": -11.054622650146484, "global_step": 172625, "epoch": 1027} {"train_loss": -10.42544937133789, "global_step": 172626, "epoch": 1027} {"train_loss": -11.365910530090332, "global_step": 172627, "epoch": 1027} {"train_loss": -10.601912498474121, "global_step": 172628, "epoch": 1027} {"train_loss": -11.211048126220703, "global_step": 172629, "epoch": 1027} {"train_loss": -10.737832069396973, "global_step": 172630, "epoch": 1027} {"train_loss": -10.822403907775879, "global_step": 172631, "epoch": 1027} {"train_loss": -11.042230606079102, "global_step": 172632, "epoch": 1027} {"train_loss": -10.694466590881348, "global_step": 172633, "epoch": 1027} {"train_loss": -10.749043464660645, "global_step": 172634, "epoch": 1027} {"train_loss": -10.657276153564453, "global_step": 172635, "epoch": 1027} {"train_loss": -10.893672943115234, "global_step": 172636, "epoch": 1027} {"train_loss": -10.68478775024414, "global_step": 172637, "epoch": 1027} {"train_loss": -10.827767372131348, "global_step": 172638, "epoch": 1027} {"train_loss": -10.383532524108887, "global_step": 172639, "epoch": 1027} {"train_loss": -10.955533981323242, "global_step": 172640, "epoch": 1027} {"train_loss": -10.054169654846191, "global_step": 172641, "epoch": 1027} {"train_loss": -9.912969589233398, "global_step": 172642, "epoch": 1027} {"train_loss": -10.63074779510498, "global_step": 172643, "epoch": 1027} {"train_loss": -10.314860343933105, "global_step": 172644, "epoch": 1027} {"train_loss": -10.786014556884766, "global_step": 172645, "epoch": 1027} {"train_loss": -9.499878883361816, "global_step": 172646, "epoch": 1027} {"train_loss": -10.56383991241455, "global_step": 172647, "epoch": 1027} {"train_loss": -10.005435943603516, "global_step": 172648, "epoch": 1027} {"train_loss": -10.501960754394531, "global_step": 172649, "epoch": 1027} {"train_loss": -10.588374137878418, "global_step": 172650, "epoch": 1027} {"train_loss": -10.842279434204102, "global_step": 172651, "epoch": 1027} {"train_loss": -10.307854652404785, "global_step": 172652, "epoch": 1027} {"train_loss": -11.031874656677246, "global_step": 172653, "epoch": 1027} {"train_loss": -10.368237495422363, "global_step": 172654, "epoch": 1027} {"train_loss": -10.560983657836914, "global_step": 172655, "epoch": 1027} {"train_loss": -10.72977352142334, "global_step": 172656, "epoch": 1027} {"train_loss": -10.833635330200195, "global_step": 172657, "epoch": 1027} {"train_loss": -10.433079719543457, "global_step": 172658, "epoch": 1027} {"train_loss": -11.043164253234863, "global_step": 172659, "epoch": 1027} {"train_loss": -10.53321647644043, "global_step": 172660, "epoch": 1027} {"train_loss": -10.925100326538086, "global_step": 172661, "epoch": 1027} {"train_loss": -10.664376258850098, "global_step": 172662, "epoch": 1027} {"train_loss": -10.812686920166016, "global_step": 172663, "epoch": 1027} {"train_loss": -10.966422080993652, "global_step": 172664, "epoch": 1027} {"train_loss": -10.897168159484863, "global_step": 172665, "epoch": 1027} {"train_loss": -11.21116828918457, "global_step": 172666, "epoch": 1027} {"train_loss": -10.755661010742188, "global_step": 172667, "epoch": 1027} {"train_loss": -11.09303092956543, "global_step": 172668, "epoch": 1027} {"train_loss": -10.873740196228027, "global_step": 172669, "epoch": 1027} {"train_loss": -10.95429515838623, "global_step": 172670, "epoch": 1027} {"train_loss": -11.172054290771484, "global_step": 172671, "epoch": 1027} {"train_loss": -10.753253936767578, "global_step": 172672, "epoch": 1027} {"train_loss": -10.992096900939941, "global_step": 172673, "epoch": 1027} {"train_loss": -11.108325958251953, "global_step": 172674, "epoch": 1027} {"train_loss": -11.274694442749023, "global_step": 172675, "epoch": 1027} {"train_loss": -11.135313034057617, "global_step": 172676, "epoch": 1027} {"train_loss": -11.085001945495605, "global_step": 172677, "epoch": 1027} {"train_loss": -11.257096290588379, "global_step": 172678, "epoch": 1027} {"train_loss": -11.004805564880371, "global_step": 172679, "epoch": 1027} {"train_loss": -11.315852165222168, "global_step": 172680, "epoch": 1027} {"train_loss": -11.120136260986328, "global_step": 172681, "epoch": 1027} {"train_loss": -11.048263549804688, "global_step": 172682, "epoch": 1027} {"train_loss": -11.037202835083008, "global_step": 172683, "epoch": 1027} {"train_loss": -11.29806137084961, "global_step": 172684, "epoch": 1027} {"train_loss": -11.403133392333984, "global_step": 172685, "epoch": 1027} {"train_loss": -11.145050048828125, "global_step": 172686, "epoch": 1027} {"train_loss": -11.065061569213867, "global_step": 172687, "epoch": 1027} {"train_loss": -11.256671905517578, "global_step": 172688, "epoch": 1027} {"train_loss": -11.302728652954102, "global_step": 172689, "epoch": 1027} {"train_loss": -11.247282028198242, "global_step": 172690, "epoch": 1027} {"train_loss": -11.422147750854492, "global_step": 172691, "epoch": 1027} {"train_loss": -11.27128791809082, "global_step": 172692, "epoch": 1027} {"train_loss": -11.324341773986816, "global_step": 172693, "epoch": 1027} {"train_loss": -11.08277702331543, "global_step": 172694, "epoch": 1027} {"train_loss": -11.335761070251465, "global_step": 172695, "epoch": 1027} {"train_loss": -11.01156997680664, "global_step": 172696, "epoch": 1027} {"train_loss": -11.156935691833496, "global_step": 172697, "epoch": 1027} {"train_loss": -11.104889869689941, "global_step": 172698, "epoch": 1027} {"train_loss": -11.239317893981934, "global_step": 172699, "epoch": 1027} {"train_loss": -11.355306625366211, "global_step": 172700, "epoch": 1027} {"train_loss": -11.339398384094238, "global_step": 172701, "epoch": 1027} {"train_loss": -11.015121459960938, "global_step": 172702, "epoch": 1027} {"train_loss": -10.944299141565958, "global_step": 172703, "epoch": 1027, "val_loss": 240931.046875} {"train_loss": -11.343757629394531, "global_step": 172704, "epoch": 1028} {"train_loss": -10.979143142700195, "global_step": 172705, "epoch": 1028} {"train_loss": -11.614246368408203, "global_step": 172706, "epoch": 1028} {"train_loss": -10.940434455871582, "global_step": 172707, "epoch": 1028} {"train_loss": -11.100927352905273, "global_step": 172708, "epoch": 1028} {"train_loss": -11.482101440429688, "global_step": 172709, "epoch": 1028} {"train_loss": -10.965816497802734, "global_step": 172710, "epoch": 1028} {"train_loss": -10.843099594116211, "global_step": 172711, "epoch": 1028} {"train_loss": -11.190845489501953, "global_step": 172712, "epoch": 1028} {"train_loss": -11.65778923034668, "global_step": 172713, "epoch": 1028} {"train_loss": -11.559820175170898, "global_step": 172714, "epoch": 1028} {"train_loss": -11.285712242126465, "global_step": 172715, "epoch": 1028} {"train_loss": -11.361457824707031, "global_step": 172716, "epoch": 1028} {"train_loss": -11.353717803955078, "global_step": 172717, "epoch": 1028} {"train_loss": -11.13652229309082, "global_step": 172718, "epoch": 1028} {"train_loss": -11.245862007141113, "global_step": 172719, "epoch": 1028} {"train_loss": -11.29847526550293, "global_step": 172720, "epoch": 1028} {"train_loss": -11.11075210571289, "global_step": 172721, "epoch": 1028} {"train_loss": -10.789438247680664, "global_step": 172722, "epoch": 1028} {"train_loss": -11.087181091308594, "global_step": 172723, "epoch": 1028} {"train_loss": -10.998981475830078, "global_step": 172724, "epoch": 1028} {"train_loss": -10.826187133789062, "global_step": 172725, "epoch": 1028} {"train_loss": -11.243300437927246, "global_step": 172726, "epoch": 1028} {"train_loss": -11.088479995727539, "global_step": 172727, "epoch": 1028} {"train_loss": -11.203601837158203, "global_step": 172728, "epoch": 1028} {"train_loss": -10.860954284667969, "global_step": 172729, "epoch": 1028} {"train_loss": -11.377786636352539, "global_step": 172730, "epoch": 1028} {"train_loss": -11.259906768798828, "global_step": 172731, "epoch": 1028} {"train_loss": -10.554095268249512, "global_step": 172732, "epoch": 1028} {"train_loss": -10.669394493103027, "global_step": 172733, "epoch": 1028} {"train_loss": -10.341525077819824, "global_step": 172734, "epoch": 1028} {"train_loss": -9.802364349365234, "global_step": 172735, "epoch": 1028} {"train_loss": -10.769356727600098, "global_step": 172736, "epoch": 1028} {"train_loss": -9.545267105102539, "global_step": 172737, "epoch": 1028} {"train_loss": -9.806768417358398, "global_step": 172738, "epoch": 1028} {"train_loss": -10.47449016571045, "global_step": 172739, "epoch": 1028} {"train_loss": -9.325254440307617, "global_step": 172740, "epoch": 1028} {"train_loss": -10.742330551147461, "global_step": 172741, "epoch": 1028} {"train_loss": -9.7777681350708, "global_step": 172742, "epoch": 1028} {"train_loss": -10.045079231262207, "global_step": 172743, "epoch": 1028} {"train_loss": -10.7166109085083, "global_step": 172744, "epoch": 1028} {"train_loss": -9.37164306640625, "global_step": 172745, "epoch": 1028} {"train_loss": -9.862446784973145, "global_step": 172746, "epoch": 1028} {"train_loss": -9.987424850463867, "global_step": 172747, "epoch": 1028} {"train_loss": -9.880167007446289, "global_step": 172748, "epoch": 1028} {"train_loss": -10.368444442749023, "global_step": 172749, "epoch": 1028} {"train_loss": -9.933082580566406, "global_step": 172750, "epoch": 1028} {"train_loss": -9.725204467773438, "global_step": 172751, "epoch": 1028} {"train_loss": -10.371718406677246, "global_step": 172752, "epoch": 1028} {"train_loss": -10.356258392333984, "global_step": 172753, "epoch": 1028} {"train_loss": -9.703664779663086, "global_step": 172754, "epoch": 1028} {"train_loss": -10.033584594726562, "global_step": 172755, "epoch": 1028} {"train_loss": -10.40672779083252, "global_step": 172756, "epoch": 1028} {"train_loss": -9.727705001831055, "global_step": 172757, "epoch": 1028} {"train_loss": -10.665694236755371, "global_step": 172758, "epoch": 1028} {"train_loss": -10.631872177124023, "global_step": 172759, "epoch": 1028} {"train_loss": -10.526281356811523, "global_step": 172760, "epoch": 1028} {"train_loss": -10.598945617675781, "global_step": 172761, "epoch": 1028} {"train_loss": -10.67489242553711, "global_step": 172762, "epoch": 1028} {"train_loss": -10.421531677246094, "global_step": 172763, "epoch": 1028} {"train_loss": -10.720739364624023, "global_step": 172764, "epoch": 1028} {"train_loss": -10.756139755249023, "global_step": 172765, "epoch": 1028} {"train_loss": -10.507516860961914, "global_step": 172766, "epoch": 1028} {"train_loss": -11.023416519165039, "global_step": 172767, "epoch": 1028} {"train_loss": -10.924367904663086, "global_step": 172768, "epoch": 1028} {"train_loss": -10.978452682495117, "global_step": 172769, "epoch": 1028} {"train_loss": -10.718530654907227, "global_step": 172770, "epoch": 1028} {"train_loss": -10.81313705444336, "global_step": 172771, "epoch": 1028} {"train_loss": -10.989105224609375, "global_step": 172772, "epoch": 1028} {"train_loss": -10.899304389953613, "global_step": 172773, "epoch": 1028} {"train_loss": -11.074583053588867, "global_step": 172774, "epoch": 1028} {"train_loss": -10.946939468383789, "global_step": 172775, "epoch": 1028} {"train_loss": -11.021615028381348, "global_step": 172776, "epoch": 1028} {"train_loss": -11.055497169494629, "global_step": 172777, "epoch": 1028} {"train_loss": -10.792688369750977, "global_step": 172778, "epoch": 1028} {"train_loss": -10.932491302490234, "global_step": 172779, "epoch": 1028} {"train_loss": -10.969552040100098, "global_step": 172780, "epoch": 1028} {"train_loss": -10.12763500213623, "global_step": 172781, "epoch": 1028} {"train_loss": -11.246325492858887, "global_step": 172782, "epoch": 1028} {"train_loss": -10.550697326660156, "global_step": 172783, "epoch": 1028} {"train_loss": -10.924493789672852, "global_step": 172784, "epoch": 1028} {"train_loss": -11.097735404968262, "global_step": 172785, "epoch": 1028} {"train_loss": -10.855844497680664, "global_step": 172786, "epoch": 1028} {"train_loss": -10.847149848937988, "global_step": 172787, "epoch": 1028} {"train_loss": -11.018404006958008, "global_step": 172788, "epoch": 1028} {"train_loss": -10.856203079223633, "global_step": 172789, "epoch": 1028} {"train_loss": -10.971176147460938, "global_step": 172790, "epoch": 1028} {"train_loss": -10.978473663330078, "global_step": 172791, "epoch": 1028} {"train_loss": -10.89597225189209, "global_step": 172792, "epoch": 1028} {"train_loss": -11.114222526550293, "global_step": 172793, "epoch": 1028} {"train_loss": -11.227505683898926, "global_step": 172794, "epoch": 1028} {"train_loss": -10.972702026367188, "global_step": 172795, "epoch": 1028} {"train_loss": -10.984679222106934, "global_step": 172796, "epoch": 1028} {"train_loss": -11.230972290039062, "global_step": 172797, "epoch": 1028} {"train_loss": -11.228700637817383, "global_step": 172798, "epoch": 1028} {"train_loss": -11.310754776000977, "global_step": 172799, "epoch": 1028} {"train_loss": -11.127994537353516, "global_step": 172800, "epoch": 1028} {"train_loss": -11.070758819580078, "global_step": 172801, "epoch": 1028} {"train_loss": -11.374500274658203, "global_step": 172802, "epoch": 1028} {"train_loss": -11.170511245727539, "global_step": 172803, "epoch": 1028} {"train_loss": -11.265146255493164, "global_step": 172804, "epoch": 1028} {"train_loss": -11.408404350280762, "global_step": 172805, "epoch": 1028} {"train_loss": -11.287543296813965, "global_step": 172806, "epoch": 1028} {"train_loss": -11.3218355178833, "global_step": 172807, "epoch": 1028} {"train_loss": -11.358240127563477, "global_step": 172808, "epoch": 1028} {"train_loss": -11.065396308898926, "global_step": 172809, "epoch": 1028} {"train_loss": -11.17133617401123, "global_step": 172810, "epoch": 1028} {"train_loss": -11.364083290100098, "global_step": 172811, "epoch": 1028} {"train_loss": -11.259109497070312, "global_step": 172812, "epoch": 1028} {"train_loss": -11.4892578125, "global_step": 172813, "epoch": 1028} {"train_loss": -11.2616548538208, "global_step": 172814, "epoch": 1028} {"train_loss": -11.326324462890625, "global_step": 172815, "epoch": 1028} {"train_loss": -11.344493865966797, "global_step": 172816, "epoch": 1028} {"train_loss": -11.268743515014648, "global_step": 172817, "epoch": 1028} {"train_loss": -11.408404350280762, "global_step": 172818, "epoch": 1028} {"train_loss": -11.089021682739258, "global_step": 172819, "epoch": 1028} {"train_loss": -11.39210033416748, "global_step": 172820, "epoch": 1028} {"train_loss": -11.45833969116211, "global_step": 172821, "epoch": 1028} {"train_loss": -11.134305000305176, "global_step": 172822, "epoch": 1028} {"train_loss": -11.23473072052002, "global_step": 172823, "epoch": 1028} {"train_loss": -10.879120826721191, "global_step": 172824, "epoch": 1028} {"train_loss": -11.054193496704102, "global_step": 172825, "epoch": 1028} {"train_loss": -11.072197914123535, "global_step": 172826, "epoch": 1028} {"train_loss": -10.235788345336914, "global_step": 172827, "epoch": 1028} {"train_loss": -11.452127456665039, "global_step": 172828, "epoch": 1028} {"train_loss": -10.439800262451172, "global_step": 172829, "epoch": 1028} {"train_loss": -10.758049011230469, "global_step": 172830, "epoch": 1028} {"train_loss": -10.947041511535645, "global_step": 172831, "epoch": 1028} {"train_loss": -10.653032302856445, "global_step": 172832, "epoch": 1028} {"train_loss": -10.825258255004883, "global_step": 172833, "epoch": 1028} {"train_loss": -10.764833450317383, "global_step": 172834, "epoch": 1028} {"train_loss": -9.756002426147461, "global_step": 172835, "epoch": 1028} {"train_loss": -10.676456451416016, "global_step": 172836, "epoch": 1028} {"train_loss": -11.096030235290527, "global_step": 172837, "epoch": 1028} {"train_loss": -10.63910961151123, "global_step": 172838, "epoch": 1028} {"train_loss": -11.171868324279785, "global_step": 172839, "epoch": 1028} {"train_loss": -10.76585578918457, "global_step": 172840, "epoch": 1028} {"train_loss": -11.07373332977295, "global_step": 172841, "epoch": 1028} {"train_loss": -10.925460815429688, "global_step": 172842, "epoch": 1028} {"train_loss": -10.765575408935547, "global_step": 172843, "epoch": 1028} {"train_loss": -11.165288925170898, "global_step": 172844, "epoch": 1028} {"train_loss": -11.116004943847656, "global_step": 172845, "epoch": 1028} {"train_loss": -10.892558097839355, "global_step": 172846, "epoch": 1028} {"train_loss": -10.811887741088867, "global_step": 172847, "epoch": 1028} {"train_loss": -10.68984317779541, "global_step": 172848, "epoch": 1028} {"train_loss": -10.75739860534668, "global_step": 172849, "epoch": 1028} {"train_loss": -10.8536376953125, "global_step": 172850, "epoch": 1028} {"train_loss": -10.539923667907715, "global_step": 172851, "epoch": 1028} {"train_loss": -11.221384048461914, "global_step": 172852, "epoch": 1028} {"train_loss": -10.839176177978516, "global_step": 172853, "epoch": 1028} {"train_loss": -11.005895614624023, "global_step": 172854, "epoch": 1028} {"train_loss": -11.196512222290039, "global_step": 172855, "epoch": 1028} {"train_loss": -11.122404098510742, "global_step": 172856, "epoch": 1028} {"train_loss": -10.935888290405273, "global_step": 172857, "epoch": 1028} {"train_loss": -11.160888671875, "global_step": 172858, "epoch": 1028} {"train_loss": -11.208868980407715, "global_step": 172859, "epoch": 1028} {"train_loss": -10.925655364990234, "global_step": 172860, "epoch": 1028} {"train_loss": -10.98880672454834, "global_step": 172861, "epoch": 1028} {"train_loss": -10.935365676879883, "global_step": 172862, "epoch": 1028} {"train_loss": -10.779229164123535, "global_step": 172863, "epoch": 1028} {"train_loss": -10.984942436218262, "global_step": 172864, "epoch": 1028} {"train_loss": -10.955142974853516, "global_step": 172865, "epoch": 1028} {"train_loss": -11.141778945922852, "global_step": 172866, "epoch": 1028} {"train_loss": -10.614297866821289, "global_step": 172867, "epoch": 1028} {"train_loss": -11.075708389282227, "global_step": 172868, "epoch": 1028} {"train_loss": -10.893146514892578, "global_step": 172869, "epoch": 1028} {"train_loss": -11.036519050598145, "global_step": 172870, "epoch": 1028} {"train_loss": -10.868705187525068, "global_step": 172871, "epoch": 1028, "val_loss": 240514.15625} {"train_loss": -10.893508911132812, "global_step": 172872, "epoch": 1029} {"train_loss": -11.377021789550781, "global_step": 172873, "epoch": 1029} {"train_loss": -11.054587364196777, "global_step": 172874, "epoch": 1029} {"train_loss": -11.058313369750977, "global_step": 172875, "epoch": 1029} {"train_loss": -11.269498825073242, "global_step": 172876, "epoch": 1029} {"train_loss": -11.012471199035645, "global_step": 172877, "epoch": 1029} {"train_loss": -11.442793846130371, "global_step": 172878, "epoch": 1029} {"train_loss": -10.973543167114258, "global_step": 172879, "epoch": 1029} {"train_loss": -11.435935020446777, "global_step": 172880, "epoch": 1029} {"train_loss": -11.13530158996582, "global_step": 172881, "epoch": 1029} {"train_loss": -11.069671630859375, "global_step": 172882, "epoch": 1029} {"train_loss": -11.328693389892578, "global_step": 172883, "epoch": 1029} {"train_loss": -11.168858528137207, "global_step": 172884, "epoch": 1029} {"train_loss": -11.321188926696777, "global_step": 172885, "epoch": 1029} {"train_loss": -11.192922592163086, "global_step": 172886, "epoch": 1029} {"train_loss": -11.326017379760742, "global_step": 172887, "epoch": 1029} {"train_loss": -10.93643856048584, "global_step": 172888, "epoch": 1029} {"train_loss": -11.421184539794922, "global_step": 172889, "epoch": 1029} {"train_loss": -11.034649848937988, "global_step": 172890, "epoch": 1029} {"train_loss": -11.202255249023438, "global_step": 172891, "epoch": 1029} {"train_loss": -11.105246543884277, "global_step": 172892, "epoch": 1029} {"train_loss": -11.210186004638672, "global_step": 172893, "epoch": 1029} {"train_loss": -10.705080032348633, "global_step": 172894, "epoch": 1029} {"train_loss": -10.944974899291992, "global_step": 172895, "epoch": 1029} {"train_loss": -11.041862487792969, "global_step": 172896, "epoch": 1029} {"train_loss": -10.653963088989258, "global_step": 172897, "epoch": 1029} {"train_loss": -11.06677532196045, "global_step": 172898, "epoch": 1029} {"train_loss": -10.867748260498047, "global_step": 172899, "epoch": 1029} {"train_loss": -10.886041641235352, "global_step": 172900, "epoch": 1029} {"train_loss": -10.323917388916016, "global_step": 172901, "epoch": 1029} {"train_loss": -10.868831634521484, "global_step": 172902, "epoch": 1029} {"train_loss": -10.938667297363281, "global_step": 172903, "epoch": 1029} {"train_loss": -10.427228927612305, "global_step": 172904, "epoch": 1029} {"train_loss": -11.135154724121094, "global_step": 172905, "epoch": 1029} {"train_loss": -10.395065307617188, "global_step": 172906, "epoch": 1029} {"train_loss": -11.05941104888916, "global_step": 172907, "epoch": 1029} {"train_loss": -10.940329551696777, "global_step": 172908, "epoch": 1029} {"train_loss": -10.503045082092285, "global_step": 172909, "epoch": 1029} {"train_loss": -10.921529769897461, "global_step": 172910, "epoch": 1029} {"train_loss": -10.809487342834473, "global_step": 172911, "epoch": 1029} {"train_loss": -10.80246353149414, "global_step": 172912, "epoch": 1029} {"train_loss": -10.882625579833984, "global_step": 172913, "epoch": 1029} {"train_loss": -11.028453826904297, "global_step": 172914, "epoch": 1029} {"train_loss": -10.707728385925293, "global_step": 172915, "epoch": 1029} {"train_loss": -11.42829704284668, "global_step": 172916, "epoch": 1029} {"train_loss": -10.553275108337402, "global_step": 172917, "epoch": 1029} {"train_loss": -11.074033737182617, "global_step": 172918, "epoch": 1029} {"train_loss": -10.286149024963379, "global_step": 172919, "epoch": 1029} {"train_loss": -11.261155128479004, "global_step": 172920, "epoch": 1029} {"train_loss": -10.333100318908691, "global_step": 172921, "epoch": 1029} {"train_loss": -10.676572799682617, "global_step": 172922, "epoch": 1029} {"train_loss": -10.880681991577148, "global_step": 172923, "epoch": 1029} {"train_loss": -10.860818862915039, "global_step": 172924, "epoch": 1029} {"train_loss": -10.868988037109375, "global_step": 172925, "epoch": 1029} {"train_loss": -11.045865058898926, "global_step": 172926, "epoch": 1029} {"train_loss": -10.285338401794434, "global_step": 172927, "epoch": 1029} {"train_loss": -11.159061431884766, "global_step": 172928, "epoch": 1029} {"train_loss": -10.738523483276367, "global_step": 172929, "epoch": 1029} {"train_loss": -10.722396850585938, "global_step": 172930, "epoch": 1029} {"train_loss": -10.863697052001953, "global_step": 172931, "epoch": 1029} {"train_loss": -10.973861694335938, "global_step": 172932, "epoch": 1029} {"train_loss": -10.614265441894531, "global_step": 172933, "epoch": 1029} {"train_loss": -10.90163516998291, "global_step": 172934, "epoch": 1029} {"train_loss": -10.635051727294922, "global_step": 172935, "epoch": 1029} {"train_loss": -10.662019729614258, "global_step": 172936, "epoch": 1029} {"train_loss": -10.889472961425781, "global_step": 172937, "epoch": 1029} {"train_loss": -10.98773193359375, "global_step": 172938, "epoch": 1029} {"train_loss": -10.848081588745117, "global_step": 172939, "epoch": 1029} {"train_loss": -11.051225662231445, "global_step": 172940, "epoch": 1029} {"train_loss": -10.949807167053223, "global_step": 172941, "epoch": 1029} {"train_loss": -11.241018295288086, "global_step": 172942, "epoch": 1029} {"train_loss": -11.199910163879395, "global_step": 172943, "epoch": 1029} {"train_loss": -11.012594223022461, "global_step": 172944, "epoch": 1029} {"train_loss": -11.103830337524414, "global_step": 172945, "epoch": 1029} {"train_loss": -10.9791841506958, "global_step": 172946, "epoch": 1029} {"train_loss": -11.263568878173828, "global_step": 172947, "epoch": 1029} {"train_loss": -10.881807327270508, "global_step": 172948, "epoch": 1029} {"train_loss": -11.08115291595459, "global_step": 172949, "epoch": 1029} {"train_loss": -11.076297760009766, "global_step": 172950, "epoch": 1029} {"train_loss": -11.072065353393555, "global_step": 172951, "epoch": 1029} {"train_loss": -10.976936340332031, "global_step": 172952, "epoch": 1029} {"train_loss": -11.078733444213867, "global_step": 172953, "epoch": 1029} {"train_loss": -11.214235305786133, "global_step": 172954, "epoch": 1029} {"train_loss": -10.989400863647461, "global_step": 172955, "epoch": 1029} {"train_loss": -11.074583053588867, "global_step": 172956, "epoch": 1029} {"train_loss": -11.124067306518555, "global_step": 172957, "epoch": 1029} {"train_loss": -11.110696792602539, "global_step": 172958, "epoch": 1029} {"train_loss": -11.004535675048828, "global_step": 172959, "epoch": 1029} {"train_loss": -11.070985794067383, "global_step": 172960, "epoch": 1029} {"train_loss": -11.099325180053711, "global_step": 172961, "epoch": 1029} {"train_loss": -11.130494117736816, "global_step": 172962, "epoch": 1029} {"train_loss": -10.749605178833008, "global_step": 172963, "epoch": 1029} {"train_loss": -11.07489013671875, "global_step": 172964, "epoch": 1029} {"train_loss": -11.341974258422852, "global_step": 172965, "epoch": 1029} {"train_loss": -11.146080017089844, "global_step": 172966, "epoch": 1029} {"train_loss": -10.888355255126953, "global_step": 172967, "epoch": 1029} {"train_loss": -11.456799507141113, "global_step": 172968, "epoch": 1029} {"train_loss": -11.060846328735352, "global_step": 172969, "epoch": 1029} {"train_loss": -11.124078750610352, "global_step": 172970, "epoch": 1029} {"train_loss": -11.044672012329102, "global_step": 172971, "epoch": 1029} {"train_loss": -10.827695846557617, "global_step": 172972, "epoch": 1029} {"train_loss": -10.991189956665039, "global_step": 172973, "epoch": 1029} {"train_loss": -11.127429962158203, "global_step": 172974, "epoch": 1029} {"train_loss": -11.282076835632324, "global_step": 172975, "epoch": 1029} {"train_loss": -10.987442016601562, "global_step": 172976, "epoch": 1029} {"train_loss": -11.074172019958496, "global_step": 172977, "epoch": 1029} {"train_loss": -11.047966003417969, "global_step": 172978, "epoch": 1029} {"train_loss": -11.228614807128906, "global_step": 172979, "epoch": 1029} {"train_loss": -11.061847686767578, "global_step": 172980, "epoch": 1029} {"train_loss": -11.19425106048584, "global_step": 172981, "epoch": 1029} {"train_loss": -11.013935089111328, "global_step": 172982, "epoch": 1029} {"train_loss": -11.169182777404785, "global_step": 172983, "epoch": 1029} {"train_loss": -11.262107849121094, "global_step": 172984, "epoch": 1029} {"train_loss": -11.09478759765625, "global_step": 172985, "epoch": 1029} {"train_loss": -11.283421516418457, "global_step": 172986, "epoch": 1029} {"train_loss": -11.16789436340332, "global_step": 172987, "epoch": 1029} {"train_loss": -11.20830249786377, "global_step": 172988, "epoch": 1029} {"train_loss": -11.230554580688477, "global_step": 172989, "epoch": 1029} {"train_loss": -11.258909225463867, "global_step": 172990, "epoch": 1029} {"train_loss": -11.34038257598877, "global_step": 172991, "epoch": 1029} {"train_loss": -11.06077766418457, "global_step": 172992, "epoch": 1029} {"train_loss": -11.450529098510742, "global_step": 172993, "epoch": 1029} {"train_loss": -11.265934944152832, "global_step": 172994, "epoch": 1029} {"train_loss": -11.33529281616211, "global_step": 172995, "epoch": 1029} {"train_loss": -11.012676239013672, "global_step": 172996, "epoch": 1029} {"train_loss": -10.967191696166992, "global_step": 172997, "epoch": 1029} {"train_loss": -11.280241966247559, "global_step": 172998, "epoch": 1029} {"train_loss": -11.282228469848633, "global_step": 172999, "epoch": 1029} {"train_loss": -11.263383865356445, "global_step": 173000, "epoch": 1029} {"train_loss": -11.300189971923828, "global_step": 173001, "epoch": 1029} {"train_loss": -11.114660263061523, "global_step": 173002, "epoch": 1029} {"train_loss": -11.281519889831543, "global_step": 173003, "epoch": 1029} {"train_loss": -10.94399642944336, "global_step": 173004, "epoch": 1029} {"train_loss": -11.261127471923828, "global_step": 173005, "epoch": 1029} {"train_loss": -11.083236694335938, "global_step": 173006, "epoch": 1029} {"train_loss": -11.202729225158691, "global_step": 173007, "epoch": 1029} {"train_loss": -9.884927749633789, "global_step": 173008, "epoch": 1029} {"train_loss": -10.057031631469727, "global_step": 173009, "epoch": 1029} {"train_loss": -10.069385528564453, "global_step": 173010, "epoch": 1029} {"train_loss": -11.27342700958252, "global_step": 173011, "epoch": 1029} {"train_loss": -10.352667808532715, "global_step": 173012, "epoch": 1029} {"train_loss": -10.289036750793457, "global_step": 173013, "epoch": 1029} {"train_loss": -10.808850288391113, "global_step": 173014, "epoch": 1029} {"train_loss": -9.240784645080566, "global_step": 173015, "epoch": 1029} {"train_loss": -10.755599975585938, "global_step": 173016, "epoch": 1029} {"train_loss": -10.627763748168945, "global_step": 173017, "epoch": 1029} {"train_loss": -9.481260299682617, "global_step": 173018, "epoch": 1029} {"train_loss": -10.41714096069336, "global_step": 173019, "epoch": 1029} {"train_loss": -10.331562042236328, "global_step": 173020, "epoch": 1029} {"train_loss": -10.680776596069336, "global_step": 173021, "epoch": 1029} {"train_loss": -10.08499813079834, "global_step": 173022, "epoch": 1029} {"train_loss": -10.309259414672852, "global_step": 173023, "epoch": 1029} {"train_loss": -9.969100952148438, "global_step": 173024, "epoch": 1029} {"train_loss": -10.354284286499023, "global_step": 173025, "epoch": 1029} {"train_loss": -9.068930625915527, "global_step": 173026, "epoch": 1029} {"train_loss": -10.552156448364258, "global_step": 173027, "epoch": 1029} {"train_loss": -10.028923034667969, "global_step": 173028, "epoch": 1029} {"train_loss": -10.94813060760498, "global_step": 173029, "epoch": 1029} {"train_loss": -10.058767318725586, "global_step": 173030, "epoch": 1029} {"train_loss": -10.528167724609375, "global_step": 173031, "epoch": 1029} {"train_loss": -10.289300918579102, "global_step": 173032, "epoch": 1029} {"train_loss": -10.144103050231934, "global_step": 173033, "epoch": 1029} {"train_loss": -10.692889213562012, "global_step": 173034, "epoch": 1029} {"train_loss": -10.527965545654297, "global_step": 173035, "epoch": 1029} {"train_loss": -10.837132453918457, "global_step": 173036, "epoch": 1029} {"train_loss": -10.703407287597656, "global_step": 173037, "epoch": 1029} {"train_loss": -10.793882369995117, "global_step": 173038, "epoch": 1029} {"train_loss": -10.89939536367144, "global_step": 173039, "epoch": 1029, "val_loss": 237947.453125} {"train_loss": -10.650186538696289, "global_step": 173040, "epoch": 1030} {"train_loss": -10.752931594848633, "global_step": 173041, "epoch": 1030} {"train_loss": -10.826692581176758, "global_step": 173042, "epoch": 1030} {"train_loss": -10.780563354492188, "global_step": 173043, "epoch": 1030} {"train_loss": -10.753002166748047, "global_step": 173044, "epoch": 1030} {"train_loss": -10.916460037231445, "global_step": 173045, "epoch": 1030} {"train_loss": -10.726020812988281, "global_step": 173046, "epoch": 1030} {"train_loss": -10.843313217163086, "global_step": 173047, "epoch": 1030} {"train_loss": -10.840109825134277, "global_step": 173048, "epoch": 1030} {"train_loss": -10.885552406311035, "global_step": 173049, "epoch": 1030} {"train_loss": -10.969386100769043, "global_step": 173050, "epoch": 1030} {"train_loss": -10.808882713317871, "global_step": 173051, "epoch": 1030} {"train_loss": -10.878807067871094, "global_step": 173052, "epoch": 1030} {"train_loss": -11.008312225341797, "global_step": 173053, "epoch": 1030} {"train_loss": -11.082075119018555, "global_step": 173054, "epoch": 1030} {"train_loss": -11.100442886352539, "global_step": 173055, "epoch": 1030} {"train_loss": -11.294519424438477, "global_step": 173056, "epoch": 1030} {"train_loss": -10.780025482177734, "global_step": 173057, "epoch": 1030} {"train_loss": -11.157258987426758, "global_step": 173058, "epoch": 1030} {"train_loss": -11.313618659973145, "global_step": 173059, "epoch": 1030} {"train_loss": -11.199014663696289, "global_step": 173060, "epoch": 1030} {"train_loss": -11.155569076538086, "global_step": 173061, "epoch": 1030} {"train_loss": -11.092172622680664, "global_step": 173062, "epoch": 1030} {"train_loss": -11.203102111816406, "global_step": 173063, "epoch": 1030} {"train_loss": -11.115091323852539, "global_step": 173064, "epoch": 1030} {"train_loss": -11.310369491577148, "global_step": 173065, "epoch": 1030} {"train_loss": -11.10588264465332, "global_step": 173066, "epoch": 1030} {"train_loss": -10.96693229675293, "global_step": 173067, "epoch": 1030} {"train_loss": -11.225493431091309, "global_step": 173068, "epoch": 1030} {"train_loss": -11.198270797729492, "global_step": 173069, "epoch": 1030} {"train_loss": -11.126750946044922, "global_step": 173070, "epoch": 1030} {"train_loss": -11.262292861938477, "global_step": 173071, "epoch": 1030} {"train_loss": -11.163297653198242, "global_step": 173072, "epoch": 1030} {"train_loss": -11.241244316101074, "global_step": 173073, "epoch": 1030} {"train_loss": -11.297274589538574, "global_step": 173074, "epoch": 1030} {"train_loss": -11.294499397277832, "global_step": 173075, "epoch": 1030} {"train_loss": -11.31619930267334, "global_step": 173076, "epoch": 1030} {"train_loss": -11.648733139038086, "global_step": 173077, "epoch": 1030} {"train_loss": -11.555780410766602, "global_step": 173078, "epoch": 1030} {"train_loss": -11.282491683959961, "global_step": 173079, "epoch": 1030} {"train_loss": -11.238138198852539, "global_step": 173080, "epoch": 1030} {"train_loss": -11.10288143157959, "global_step": 173081, "epoch": 1030} {"train_loss": -11.398991584777832, "global_step": 173082, "epoch": 1030} {"train_loss": -11.188892364501953, "global_step": 173083, "epoch": 1030} {"train_loss": -11.134744644165039, "global_step": 173084, "epoch": 1030} {"train_loss": -11.348991394042969, "global_step": 173085, "epoch": 1030} {"train_loss": -11.440914154052734, "global_step": 173086, "epoch": 1030} {"train_loss": -11.283733367919922, "global_step": 173087, "epoch": 1030} {"train_loss": -11.330270767211914, "global_step": 173088, "epoch": 1030} {"train_loss": -11.144065856933594, "global_step": 173089, "epoch": 1030} {"train_loss": -11.374523162841797, "global_step": 173090, "epoch": 1030} {"train_loss": -11.55945110321045, "global_step": 173091, "epoch": 1030} {"train_loss": -11.553180694580078, "global_step": 173092, "epoch": 1030} {"train_loss": -11.566291809082031, "global_step": 173093, "epoch": 1030} {"train_loss": -11.398048400878906, "global_step": 173094, "epoch": 1030} {"train_loss": -11.245172500610352, "global_step": 173095, "epoch": 1030} {"train_loss": -11.363189697265625, "global_step": 173096, "epoch": 1030} {"train_loss": -11.52137565612793, "global_step": 173097, "epoch": 1030} {"train_loss": -11.113298416137695, "global_step": 173098, "epoch": 1030} {"train_loss": -11.016226768493652, "global_step": 173099, "epoch": 1030} {"train_loss": -11.519902229309082, "global_step": 173100, "epoch": 1030} {"train_loss": -11.402703285217285, "global_step": 173101, "epoch": 1030} {"train_loss": -11.095603942871094, "global_step": 173102, "epoch": 1030} {"train_loss": -11.304425239562988, "global_step": 173103, "epoch": 1030} {"train_loss": -11.29100227355957, "global_step": 173104, "epoch": 1030} {"train_loss": -11.324328422546387, "global_step": 173105, "epoch": 1030} {"train_loss": -11.21573257446289, "global_step": 173106, "epoch": 1030} {"train_loss": -11.274566650390625, "global_step": 173107, "epoch": 1030} {"train_loss": -11.156440734863281, "global_step": 173108, "epoch": 1030} {"train_loss": -11.0698881149292, "global_step": 173109, "epoch": 1030} {"train_loss": -11.318243026733398, "global_step": 173110, "epoch": 1030} {"train_loss": -11.169296264648438, "global_step": 173111, "epoch": 1030} {"train_loss": -11.078516006469727, "global_step": 173112, "epoch": 1030} {"train_loss": -11.270890235900879, "global_step": 173113, "epoch": 1030} {"train_loss": -10.620161056518555, "global_step": 173114, "epoch": 1030} {"train_loss": -10.918536186218262, "global_step": 173115, "epoch": 1030} {"train_loss": -10.919881820678711, "global_step": 173116, "epoch": 1030} {"train_loss": -11.439070701599121, "global_step": 173117, "epoch": 1030} {"train_loss": -10.997486114501953, "global_step": 173118, "epoch": 1030} {"train_loss": -11.251276969909668, "global_step": 173119, "epoch": 1030} {"train_loss": -11.327498435974121, "global_step": 173120, "epoch": 1030} {"train_loss": -11.505552291870117, "global_step": 173121, "epoch": 1030} {"train_loss": -11.11141300201416, "global_step": 173122, "epoch": 1030} {"train_loss": -10.167455673217773, "global_step": 173123, "epoch": 1030} {"train_loss": -10.342635154724121, "global_step": 173124, "epoch": 1030} {"train_loss": -10.79144287109375, "global_step": 173125, "epoch": 1030} {"train_loss": -10.50819206237793, "global_step": 173126, "epoch": 1030} {"train_loss": -9.539262771606445, "global_step": 173127, "epoch": 1030} {"train_loss": -10.51294994354248, "global_step": 173128, "epoch": 1030} {"train_loss": -8.814192771911621, "global_step": 173129, "epoch": 1030} {"train_loss": -10.616632461547852, "global_step": 173130, "epoch": 1030} {"train_loss": -9.583559036254883, "global_step": 173131, "epoch": 1030} {"train_loss": -10.400871276855469, "global_step": 173132, "epoch": 1030} {"train_loss": -9.546445846557617, "global_step": 173133, "epoch": 1030} {"train_loss": -9.029001235961914, "global_step": 173134, "epoch": 1030} {"train_loss": -10.13442611694336, "global_step": 173135, "epoch": 1030} {"train_loss": -9.00783920288086, "global_step": 173136, "epoch": 1030} {"train_loss": -10.438172340393066, "global_step": 173137, "epoch": 1030} {"train_loss": -8.897575378417969, "global_step": 173138, "epoch": 1030} {"train_loss": -10.20422077178955, "global_step": 173139, "epoch": 1030} {"train_loss": -9.069751739501953, "global_step": 173140, "epoch": 1030} {"train_loss": -9.945533752441406, "global_step": 173141, "epoch": 1030} {"train_loss": -9.251686096191406, "global_step": 173142, "epoch": 1030} {"train_loss": -10.52124309539795, "global_step": 173143, "epoch": 1030} {"train_loss": -9.643780708312988, "global_step": 173144, "epoch": 1030} {"train_loss": -10.37630844116211, "global_step": 173145, "epoch": 1030} {"train_loss": -9.91937255859375, "global_step": 173146, "epoch": 1030} {"train_loss": -10.718911170959473, "global_step": 173147, "epoch": 1030} {"train_loss": -9.856405258178711, "global_step": 173148, "epoch": 1030} {"train_loss": -10.72958755493164, "global_step": 173149, "epoch": 1030} {"train_loss": -9.53902816772461, "global_step": 173150, "epoch": 1030} {"train_loss": -10.416778564453125, "global_step": 173151, "epoch": 1030} {"train_loss": -10.2796630859375, "global_step": 173152, "epoch": 1030} {"train_loss": -9.984861373901367, "global_step": 173153, "epoch": 1030} {"train_loss": -10.238510131835938, "global_step": 173154, "epoch": 1030} {"train_loss": -9.495015144348145, "global_step": 173155, "epoch": 1030} {"train_loss": -10.686766624450684, "global_step": 173156, "epoch": 1030} {"train_loss": -9.702802658081055, "global_step": 173157, "epoch": 1030} {"train_loss": -10.283560752868652, "global_step": 173158, "epoch": 1030} {"train_loss": -10.434656143188477, "global_step": 173159, "epoch": 1030} {"train_loss": -9.951502799987793, "global_step": 173160, "epoch": 1030} {"train_loss": -10.548593521118164, "global_step": 173161, "epoch": 1030} {"train_loss": -10.215166091918945, "global_step": 173162, "epoch": 1030} {"train_loss": -10.367131233215332, "global_step": 173163, "epoch": 1030} {"train_loss": -10.739364624023438, "global_step": 173164, "epoch": 1030} {"train_loss": -10.351661682128906, "global_step": 173165, "epoch": 1030} {"train_loss": -10.581123352050781, "global_step": 173166, "epoch": 1030} {"train_loss": -10.187223434448242, "global_step": 173167, "epoch": 1030} {"train_loss": -10.662820816040039, "global_step": 173168, "epoch": 1030} {"train_loss": -10.513099670410156, "global_step": 173169, "epoch": 1030} {"train_loss": -10.675214767456055, "global_step": 173170, "epoch": 1030} {"train_loss": -10.846763610839844, "global_step": 173171, "epoch": 1030} {"train_loss": -10.54321002960205, "global_step": 173172, "epoch": 1030} {"train_loss": -10.911778450012207, "global_step": 173173, "epoch": 1030} {"train_loss": -10.672196388244629, "global_step": 173174, "epoch": 1030} {"train_loss": -10.882486343383789, "global_step": 173175, "epoch": 1030} {"train_loss": -10.80671501159668, "global_step": 173176, "epoch": 1030} {"train_loss": -10.777790069580078, "global_step": 173177, "epoch": 1030} {"train_loss": -11.102203369140625, "global_step": 173178, "epoch": 1030} {"train_loss": -10.864381790161133, "global_step": 173179, "epoch": 1030} {"train_loss": -10.9593505859375, "global_step": 173180, "epoch": 1030} {"train_loss": -10.89563274383545, "global_step": 173181, "epoch": 1030} {"train_loss": -10.907108306884766, "global_step": 173182, "epoch": 1030} {"train_loss": -11.13251781463623, "global_step": 173183, "epoch": 1030} {"train_loss": -10.9609375, "global_step": 173184, "epoch": 1030} {"train_loss": -11.15629768371582, "global_step": 173185, "epoch": 1030} {"train_loss": -11.22389030456543, "global_step": 173186, "epoch": 1030} {"train_loss": -11.095029830932617, "global_step": 173187, "epoch": 1030} {"train_loss": -11.134763717651367, "global_step": 173188, "epoch": 1030} {"train_loss": -11.223302841186523, "global_step": 173189, "epoch": 1030} {"train_loss": -11.161642074584961, "global_step": 173190, "epoch": 1030} {"train_loss": -11.281566619873047, "global_step": 173191, "epoch": 1030} {"train_loss": -11.166959762573242, "global_step": 173192, "epoch": 1030} {"train_loss": -11.228721618652344, "global_step": 173193, "epoch": 1030} {"train_loss": -11.32929801940918, "global_step": 173194, "epoch": 1030} {"train_loss": -11.259108543395996, "global_step": 173195, "epoch": 1030} {"train_loss": -11.204854965209961, "global_step": 173196, "epoch": 1030} {"train_loss": -11.25570297241211, "global_step": 173197, "epoch": 1030} {"train_loss": -11.214998245239258, "global_step": 173198, "epoch": 1030} {"train_loss": -11.029939651489258, "global_step": 173199, "epoch": 1030} {"train_loss": -11.249226570129395, "global_step": 173200, "epoch": 1030} {"train_loss": -11.427852630615234, "global_step": 173201, "epoch": 1030} {"train_loss": -11.279762268066406, "global_step": 173202, "epoch": 1030} {"train_loss": -11.314459800720215, "global_step": 173203, "epoch": 1030} {"train_loss": -11.096128463745117, "global_step": 173204, "epoch": 1030} {"train_loss": -11.326888084411621, "global_step": 173205, "epoch": 1030} {"train_loss": -11.479399681091309, "global_step": 173206, "epoch": 1030} {"train_loss": -10.846767743428549, "global_step": 173207, "epoch": 1030, "val_loss": 239230.828125, "train_action_mse_error": 1.869854211807251} {"train_loss": -11.218973159790039, "global_step": 173208, "epoch": 1031} {"train_loss": -11.518258094787598, "global_step": 173209, "epoch": 1031} {"train_loss": -11.395255088806152, "global_step": 173210, "epoch": 1031} {"train_loss": -11.408452033996582, "global_step": 173211, "epoch": 1031} {"train_loss": -11.443408966064453, "global_step": 173212, "epoch": 1031} {"train_loss": -11.440359115600586, "global_step": 173213, "epoch": 1031} {"train_loss": -11.710634231567383, "global_step": 173214, "epoch": 1031} {"train_loss": -11.4281005859375, "global_step": 173215, "epoch": 1031} {"train_loss": -11.41506576538086, "global_step": 173216, "epoch": 1031} {"train_loss": -11.431188583374023, "global_step": 173217, "epoch": 1031} {"train_loss": -11.398350715637207, "global_step": 173218, "epoch": 1031} {"train_loss": -11.226367950439453, "global_step": 173219, "epoch": 1031} {"train_loss": -11.584732055664062, "global_step": 173220, "epoch": 1031} {"train_loss": -11.325998306274414, "global_step": 173221, "epoch": 1031} {"train_loss": -11.569787979125977, "global_step": 173222, "epoch": 1031} {"train_loss": -11.528924942016602, "global_step": 173223, "epoch": 1031} {"train_loss": -11.30363655090332, "global_step": 173224, "epoch": 1031} {"train_loss": -11.32990837097168, "global_step": 173225, "epoch": 1031} {"train_loss": -11.365427017211914, "global_step": 173226, "epoch": 1031} {"train_loss": -11.465361595153809, "global_step": 173227, "epoch": 1031} {"train_loss": -11.276653289794922, "global_step": 173228, "epoch": 1031} {"train_loss": -11.55685806274414, "global_step": 173229, "epoch": 1031} {"train_loss": -10.802750587463379, "global_step": 173230, "epoch": 1031} {"train_loss": -11.073091506958008, "global_step": 173231, "epoch": 1031} {"train_loss": -11.337355613708496, "global_step": 173232, "epoch": 1031} {"train_loss": -11.523021697998047, "global_step": 173233, "epoch": 1031} {"train_loss": -11.218835830688477, "global_step": 173234, "epoch": 1031} {"train_loss": -10.9697265625, "global_step": 173235, "epoch": 1031} {"train_loss": -11.196710586547852, "global_step": 173236, "epoch": 1031} {"train_loss": -11.34177303314209, "global_step": 173237, "epoch": 1031} {"train_loss": -10.880075454711914, "global_step": 173238, "epoch": 1031} {"train_loss": -11.036067008972168, "global_step": 173239, "epoch": 1031} {"train_loss": -10.83070182800293, "global_step": 173240, "epoch": 1031} {"train_loss": -10.275516510009766, "global_step": 173241, "epoch": 1031} {"train_loss": -10.490120887756348, "global_step": 173242, "epoch": 1031} {"train_loss": -10.801631927490234, "global_step": 173243, "epoch": 1031} {"train_loss": -10.818777084350586, "global_step": 173244, "epoch": 1031} {"train_loss": -10.924728393554688, "global_step": 173245, "epoch": 1031} {"train_loss": -11.346771240234375, "global_step": 173246, "epoch": 1031} {"train_loss": -10.970172882080078, "global_step": 173247, "epoch": 1031} {"train_loss": -11.038101196289062, "global_step": 173248, "epoch": 1031} {"train_loss": -10.933375358581543, "global_step": 173249, "epoch": 1031} {"train_loss": -11.094188690185547, "global_step": 173250, "epoch": 1031} {"train_loss": -10.430440902709961, "global_step": 173251, "epoch": 1031} {"train_loss": -11.187227249145508, "global_step": 173252, "epoch": 1031} {"train_loss": -10.630584716796875, "global_step": 173253, "epoch": 1031} {"train_loss": -11.198911666870117, "global_step": 173254, "epoch": 1031} {"train_loss": -11.013051986694336, "global_step": 173255, "epoch": 1031} {"train_loss": -11.082067489624023, "global_step": 173256, "epoch": 1031} {"train_loss": -10.820284843444824, "global_step": 173257, "epoch": 1031} {"train_loss": -10.885669708251953, "global_step": 173258, "epoch": 1031} {"train_loss": -10.329839706420898, "global_step": 173259, "epoch": 1031} {"train_loss": -10.685998916625977, "global_step": 173260, "epoch": 1031} {"train_loss": -10.949411392211914, "global_step": 173261, "epoch": 1031} {"train_loss": -10.391617774963379, "global_step": 173262, "epoch": 1031} {"train_loss": -10.55081558227539, "global_step": 173263, "epoch": 1031} {"train_loss": -11.16147232055664, "global_step": 173264, "epoch": 1031} {"train_loss": -9.898664474487305, "global_step": 173265, "epoch": 1031} {"train_loss": -9.821043014526367, "global_step": 173266, "epoch": 1031} {"train_loss": -10.572368621826172, "global_step": 173267, "epoch": 1031} {"train_loss": -9.416448593139648, "global_step": 173268, "epoch": 1031} {"train_loss": -10.400794982910156, "global_step": 173269, "epoch": 1031} {"train_loss": -10.584213256835938, "global_step": 173270, "epoch": 1031} {"train_loss": -10.575432777404785, "global_step": 173271, "epoch": 1031} {"train_loss": -9.948220252990723, "global_step": 173272, "epoch": 1031} {"train_loss": -10.828937530517578, "global_step": 173273, "epoch": 1031} {"train_loss": -10.210734367370605, "global_step": 173274, "epoch": 1031} {"train_loss": -10.802844047546387, "global_step": 173275, "epoch": 1031} {"train_loss": -10.95372200012207, "global_step": 173276, "epoch": 1031} {"train_loss": -10.410019874572754, "global_step": 173277, "epoch": 1031} {"train_loss": -11.034347534179688, "global_step": 173278, "epoch": 1031} {"train_loss": -10.69179630279541, "global_step": 173279, "epoch": 1031} {"train_loss": -10.565715789794922, "global_step": 173280, "epoch": 1031} {"train_loss": -10.930801391601562, "global_step": 173281, "epoch": 1031} {"train_loss": -10.591777801513672, "global_step": 173282, "epoch": 1031} {"train_loss": -10.854070663452148, "global_step": 173283, "epoch": 1031} {"train_loss": -10.636772155761719, "global_step": 173284, "epoch": 1031} {"train_loss": -10.911478996276855, "global_step": 173285, "epoch": 1031} {"train_loss": -10.515523910522461, "global_step": 173286, "epoch": 1031} {"train_loss": -10.929529190063477, "global_step": 173287, "epoch": 1031} {"train_loss": -10.904586791992188, "global_step": 173288, "epoch": 1031} {"train_loss": -10.687233924865723, "global_step": 173289, "epoch": 1031} {"train_loss": -11.203182220458984, "global_step": 173290, "epoch": 1031} {"train_loss": -10.624555587768555, "global_step": 173291, "epoch": 1031} {"train_loss": -11.027219772338867, "global_step": 173292, "epoch": 1031} {"train_loss": -10.767881393432617, "global_step": 173293, "epoch": 1031} {"train_loss": -10.907245635986328, "global_step": 173294, "epoch": 1031} {"train_loss": -10.703008651733398, "global_step": 173295, "epoch": 1031} {"train_loss": -11.003442764282227, "global_step": 173296, "epoch": 1031} {"train_loss": -11.071483612060547, "global_step": 173297, "epoch": 1031} {"train_loss": -11.112510681152344, "global_step": 173298, "epoch": 1031} {"train_loss": -11.093015670776367, "global_step": 173299, "epoch": 1031} {"train_loss": -11.225400924682617, "global_step": 173300, "epoch": 1031} {"train_loss": -11.015527725219727, "global_step": 173301, "epoch": 1031} {"train_loss": -11.181855201721191, "global_step": 173302, "epoch": 1031} {"train_loss": -11.186775207519531, "global_step": 173303, "epoch": 1031} {"train_loss": -10.968127250671387, "global_step": 173304, "epoch": 1031} {"train_loss": -11.378124237060547, "global_step": 173305, "epoch": 1031} {"train_loss": -11.268365859985352, "global_step": 173306, "epoch": 1031} {"train_loss": -11.157907485961914, "global_step": 173307, "epoch": 1031} {"train_loss": -11.292095184326172, "global_step": 173308, "epoch": 1031} {"train_loss": -11.03028392791748, "global_step": 173309, "epoch": 1031} {"train_loss": -11.121953964233398, "global_step": 173310, "epoch": 1031} {"train_loss": -11.135719299316406, "global_step": 173311, "epoch": 1031} {"train_loss": -11.161986351013184, "global_step": 173312, "epoch": 1031} {"train_loss": -11.307348251342773, "global_step": 173313, "epoch": 1031} {"train_loss": -11.254880905151367, "global_step": 173314, "epoch": 1031} {"train_loss": -11.182112693786621, "global_step": 173315, "epoch": 1031} {"train_loss": -11.144477844238281, "global_step": 173316, "epoch": 1031} {"train_loss": -10.948598861694336, "global_step": 173317, "epoch": 1031} {"train_loss": -11.307449340820312, "global_step": 173318, "epoch": 1031} {"train_loss": -11.031881332397461, "global_step": 173319, "epoch": 1031} {"train_loss": -11.427000045776367, "global_step": 173320, "epoch": 1031} {"train_loss": -11.103726387023926, "global_step": 173321, "epoch": 1031} {"train_loss": -11.324638366699219, "global_step": 173322, "epoch": 1031} {"train_loss": -10.893840789794922, "global_step": 173323, "epoch": 1031} {"train_loss": -11.007259368896484, "global_step": 173324, "epoch": 1031} {"train_loss": -10.912775039672852, "global_step": 173325, "epoch": 1031} {"train_loss": -10.608501434326172, "global_step": 173326, "epoch": 1031} {"train_loss": -10.55910873413086, "global_step": 173327, "epoch": 1031} {"train_loss": -11.039775848388672, "global_step": 173328, "epoch": 1031} {"train_loss": -10.641645431518555, "global_step": 173329, "epoch": 1031} {"train_loss": -10.836929321289062, "global_step": 173330, "epoch": 1031} {"train_loss": -10.768918991088867, "global_step": 173331, "epoch": 1031} {"train_loss": -10.188194274902344, "global_step": 173332, "epoch": 1031} {"train_loss": -11.386148452758789, "global_step": 173333, "epoch": 1031} {"train_loss": -10.56955337524414, "global_step": 173334, "epoch": 1031} {"train_loss": -10.925115585327148, "global_step": 173335, "epoch": 1031} {"train_loss": -11.108124732971191, "global_step": 173336, "epoch": 1031} {"train_loss": -10.323646545410156, "global_step": 173337, "epoch": 1031} {"train_loss": -10.900899887084961, "global_step": 173338, "epoch": 1031} {"train_loss": -10.357534408569336, "global_step": 173339, "epoch": 1031} {"train_loss": -10.661030769348145, "global_step": 173340, "epoch": 1031} {"train_loss": -10.67152214050293, "global_step": 173341, "epoch": 1031} {"train_loss": -10.236851692199707, "global_step": 173342, "epoch": 1031} {"train_loss": -11.205638885498047, "global_step": 173343, "epoch": 1031} {"train_loss": -10.141525268554688, "global_step": 173344, "epoch": 1031} {"train_loss": -11.173941612243652, "global_step": 173345, "epoch": 1031} {"train_loss": -10.259376525878906, "global_step": 173346, "epoch": 1031} {"train_loss": -10.80588436126709, "global_step": 173347, "epoch": 1031} {"train_loss": -10.891290664672852, "global_step": 173348, "epoch": 1031} {"train_loss": -10.254781723022461, "global_step": 173349, "epoch": 1031} {"train_loss": -11.074485778808594, "global_step": 173350, "epoch": 1031} {"train_loss": -10.359554290771484, "global_step": 173351, "epoch": 1031} {"train_loss": -10.88435173034668, "global_step": 173352, "epoch": 1031} {"train_loss": -10.549617767333984, "global_step": 173353, "epoch": 1031} {"train_loss": -11.014883041381836, "global_step": 173354, "epoch": 1031} {"train_loss": -10.382715225219727, "global_step": 173355, "epoch": 1031} {"train_loss": -11.044185638427734, "global_step": 173356, "epoch": 1031} {"train_loss": -10.331371307373047, "global_step": 173357, "epoch": 1031} {"train_loss": -11.001733779907227, "global_step": 173358, "epoch": 1031} {"train_loss": -10.439004898071289, "global_step": 173359, "epoch": 1031} {"train_loss": -10.958772659301758, "global_step": 173360, "epoch": 1031} {"train_loss": -10.915966033935547, "global_step": 173361, "epoch": 1031} {"train_loss": -10.866065979003906, "global_step": 173362, "epoch": 1031} {"train_loss": -10.965459823608398, "global_step": 173363, "epoch": 1031} {"train_loss": -11.024552345275879, "global_step": 173364, "epoch": 1031} {"train_loss": -10.905233383178711, "global_step": 173365, "epoch": 1031} {"train_loss": -11.08798599243164, "global_step": 173366, "epoch": 1031} {"train_loss": -11.15256118774414, "global_step": 173367, "epoch": 1031} {"train_loss": -11.114479064941406, "global_step": 173368, "epoch": 1031} {"train_loss": -10.879284858703613, "global_step": 173369, "epoch": 1031} {"train_loss": -11.014345169067383, "global_step": 173370, "epoch": 1031} {"train_loss": -10.995952606201172, "global_step": 173371, "epoch": 1031} {"train_loss": -11.004161834716797, "global_step": 173372, "epoch": 1031} {"train_loss": -11.18244743347168, "global_step": 173373, "epoch": 1031} {"train_loss": -10.737224578857422, "global_step": 173374, "epoch": 1031} {"train_loss": -10.928589139665876, "global_step": 173375, "epoch": 1031, "val_loss": 242632.59375} {"train_loss": -10.628922462463379, "global_step": 173376, "epoch": 1032} {"train_loss": -10.203478813171387, "global_step": 173377, "epoch": 1032} {"train_loss": -10.786443710327148, "global_step": 173378, "epoch": 1032} {"train_loss": -10.093786239624023, "global_step": 173379, "epoch": 1032} {"train_loss": -10.39686393737793, "global_step": 173380, "epoch": 1032} {"train_loss": -10.452929496765137, "global_step": 173381, "epoch": 1032} {"train_loss": -10.287446975708008, "global_step": 173382, "epoch": 1032} {"train_loss": -11.005924224853516, "global_step": 173383, "epoch": 1032} {"train_loss": -10.514578819274902, "global_step": 173384, "epoch": 1032} {"train_loss": -10.489995956420898, "global_step": 173385, "epoch": 1032} {"train_loss": -11.03061580657959, "global_step": 173386, "epoch": 1032} {"train_loss": -10.697308540344238, "global_step": 173387, "epoch": 1032} {"train_loss": -10.98906135559082, "global_step": 173388, "epoch": 1032} {"train_loss": -10.816158294677734, "global_step": 173389, "epoch": 1032} {"train_loss": -10.856058120727539, "global_step": 173390, "epoch": 1032} {"train_loss": -10.8603515625, "global_step": 173391, "epoch": 1032} {"train_loss": -10.834321975708008, "global_step": 173392, "epoch": 1032} {"train_loss": -11.02226448059082, "global_step": 173393, "epoch": 1032} {"train_loss": -11.195621490478516, "global_step": 173394, "epoch": 1032} {"train_loss": -10.976766586303711, "global_step": 173395, "epoch": 1032} {"train_loss": -11.088037490844727, "global_step": 173396, "epoch": 1032} {"train_loss": -11.104717254638672, "global_step": 173397, "epoch": 1032} {"train_loss": -10.744611740112305, "global_step": 173398, "epoch": 1032} {"train_loss": -11.383485794067383, "global_step": 173399, "epoch": 1032} {"train_loss": -11.085527420043945, "global_step": 173400, "epoch": 1032} {"train_loss": -11.245482444763184, "global_step": 173401, "epoch": 1032} {"train_loss": -11.344663619995117, "global_step": 173402, "epoch": 1032} {"train_loss": -11.122711181640625, "global_step": 173403, "epoch": 1032} {"train_loss": -11.281644821166992, "global_step": 173404, "epoch": 1032} {"train_loss": -11.143482208251953, "global_step": 173405, "epoch": 1032} {"train_loss": -11.139307022094727, "global_step": 173406, "epoch": 1032} {"train_loss": -11.226638793945312, "global_step": 173407, "epoch": 1032} {"train_loss": -10.981294631958008, "global_step": 173408, "epoch": 1032} {"train_loss": -10.965428352355957, "global_step": 173409, "epoch": 1032} {"train_loss": -11.300324440002441, "global_step": 173410, "epoch": 1032} {"train_loss": -10.997541427612305, "global_step": 173411, "epoch": 1032} {"train_loss": -11.024394989013672, "global_step": 173412, "epoch": 1032} {"train_loss": -11.328937530517578, "global_step": 173413, "epoch": 1032} {"train_loss": -11.23080825805664, "global_step": 173414, "epoch": 1032} {"train_loss": -11.220983505249023, "global_step": 173415, "epoch": 1032} {"train_loss": -11.289533615112305, "global_step": 173416, "epoch": 1032} {"train_loss": -11.059483528137207, "global_step": 173417, "epoch": 1032} {"train_loss": -11.250740051269531, "global_step": 173418, "epoch": 1032} {"train_loss": -11.125753402709961, "global_step": 173419, "epoch": 1032} {"train_loss": -11.302505493164062, "global_step": 173420, "epoch": 1032} {"train_loss": -11.356122970581055, "global_step": 173421, "epoch": 1032} {"train_loss": -11.029440879821777, "global_step": 173422, "epoch": 1032} {"train_loss": -11.281606674194336, "global_step": 173423, "epoch": 1032} {"train_loss": -11.292001724243164, "global_step": 173424, "epoch": 1032} {"train_loss": -11.305638313293457, "global_step": 173425, "epoch": 1032} {"train_loss": -10.460201263427734, "global_step": 173426, "epoch": 1032} {"train_loss": -11.141874313354492, "global_step": 173427, "epoch": 1032} {"train_loss": -10.961833953857422, "global_step": 173428, "epoch": 1032} {"train_loss": -10.221134185791016, "global_step": 173429, "epoch": 1032} {"train_loss": -10.454593658447266, "global_step": 173430, "epoch": 1032} {"train_loss": -11.252304077148438, "global_step": 173431, "epoch": 1032} {"train_loss": -9.768057823181152, "global_step": 173432, "epoch": 1032} {"train_loss": -10.661466598510742, "global_step": 173433, "epoch": 1032} {"train_loss": -10.94962215423584, "global_step": 173434, "epoch": 1032} {"train_loss": -9.91972541809082, "global_step": 173435, "epoch": 1032} {"train_loss": -11.10029125213623, "global_step": 173436, "epoch": 1032} {"train_loss": -9.780793190002441, "global_step": 173437, "epoch": 1032} {"train_loss": -10.79360580444336, "global_step": 173438, "epoch": 1032} {"train_loss": -11.081390380859375, "global_step": 173439, "epoch": 1032} {"train_loss": -10.245218276977539, "global_step": 173440, "epoch": 1032} {"train_loss": -10.828523635864258, "global_step": 173441, "epoch": 1032} {"train_loss": -10.016845703125, "global_step": 173442, "epoch": 1032} {"train_loss": -11.045980453491211, "global_step": 173443, "epoch": 1032} {"train_loss": -9.873403549194336, "global_step": 173444, "epoch": 1032} {"train_loss": -10.784414291381836, "global_step": 173445, "epoch": 1032} {"train_loss": -10.71155834197998, "global_step": 173446, "epoch": 1032} {"train_loss": -10.077314376831055, "global_step": 173447, "epoch": 1032} {"train_loss": -11.250351905822754, "global_step": 173448, "epoch": 1032} {"train_loss": -9.755573272705078, "global_step": 173449, "epoch": 1032} {"train_loss": -10.820257186889648, "global_step": 173450, "epoch": 1032} {"train_loss": -10.039600372314453, "global_step": 173451, "epoch": 1032} {"train_loss": -11.092663764953613, "global_step": 173452, "epoch": 1032} {"train_loss": -10.271785736083984, "global_step": 173453, "epoch": 1032} {"train_loss": -11.003063201904297, "global_step": 173454, "epoch": 1032} {"train_loss": -10.610960006713867, "global_step": 173455, "epoch": 1032} {"train_loss": -11.109916687011719, "global_step": 173456, "epoch": 1032} {"train_loss": -10.617391586303711, "global_step": 173457, "epoch": 1032} {"train_loss": -11.204187393188477, "global_step": 173458, "epoch": 1032} {"train_loss": -10.620861053466797, "global_step": 173459, "epoch": 1032} {"train_loss": -11.20433235168457, "global_step": 173460, "epoch": 1032} {"train_loss": -10.64964771270752, "global_step": 173461, "epoch": 1032} {"train_loss": -11.094438552856445, "global_step": 173462, "epoch": 1032} {"train_loss": -10.930353164672852, "global_step": 173463, "epoch": 1032} {"train_loss": -10.851795196533203, "global_step": 173464, "epoch": 1032} {"train_loss": -11.116735458374023, "global_step": 173465, "epoch": 1032} {"train_loss": -10.916152954101562, "global_step": 173466, "epoch": 1032} {"train_loss": -11.301451683044434, "global_step": 173467, "epoch": 1032} {"train_loss": -10.941168785095215, "global_step": 173468, "epoch": 1032} {"train_loss": -11.222900390625, "global_step": 173469, "epoch": 1032} {"train_loss": -10.915499687194824, "global_step": 173470, "epoch": 1032} {"train_loss": -11.3093843460083, "global_step": 173471, "epoch": 1032} {"train_loss": -11.19519329071045, "global_step": 173472, "epoch": 1032} {"train_loss": -11.016908645629883, "global_step": 173473, "epoch": 1032} {"train_loss": -10.99453353881836, "global_step": 173474, "epoch": 1032} {"train_loss": -11.323370933532715, "global_step": 173475, "epoch": 1032} {"train_loss": -10.989431381225586, "global_step": 173476, "epoch": 1032} {"train_loss": -11.359312057495117, "global_step": 173477, "epoch": 1032} {"train_loss": -10.944026947021484, "global_step": 173478, "epoch": 1032} {"train_loss": -10.93647575378418, "global_step": 173479, "epoch": 1032} {"train_loss": -11.106450080871582, "global_step": 173480, "epoch": 1032} {"train_loss": -11.40072250366211, "global_step": 173481, "epoch": 1032} {"train_loss": -11.233125686645508, "global_step": 173482, "epoch": 1032} {"train_loss": -11.335569381713867, "global_step": 173483, "epoch": 1032} {"train_loss": -11.098618507385254, "global_step": 173484, "epoch": 1032} {"train_loss": -11.092330932617188, "global_step": 173485, "epoch": 1032} {"train_loss": -11.49445915222168, "global_step": 173486, "epoch": 1032} {"train_loss": -11.223974227905273, "global_step": 173487, "epoch": 1032} {"train_loss": -11.214921951293945, "global_step": 173488, "epoch": 1032} {"train_loss": -11.13502311706543, "global_step": 173489, "epoch": 1032} {"train_loss": -11.169511795043945, "global_step": 173490, "epoch": 1032} {"train_loss": -11.167781829833984, "global_step": 173491, "epoch": 1032} {"train_loss": -10.895146369934082, "global_step": 173492, "epoch": 1032} {"train_loss": -11.081856727600098, "global_step": 173493, "epoch": 1032} {"train_loss": -11.191150665283203, "global_step": 173494, "epoch": 1032} {"train_loss": -11.189650535583496, "global_step": 173495, "epoch": 1032} {"train_loss": -10.757393836975098, "global_step": 173496, "epoch": 1032} {"train_loss": -11.300487518310547, "global_step": 173497, "epoch": 1032} {"train_loss": -10.941757202148438, "global_step": 173498, "epoch": 1032} {"train_loss": -10.885573387145996, "global_step": 173499, "epoch": 1032} {"train_loss": -11.02584457397461, "global_step": 173500, "epoch": 1032} {"train_loss": -11.179502487182617, "global_step": 173501, "epoch": 1032} {"train_loss": -11.388345718383789, "global_step": 173502, "epoch": 1032} {"train_loss": -11.395414352416992, "global_step": 173503, "epoch": 1032} {"train_loss": -11.101890563964844, "global_step": 173504, "epoch": 1032} {"train_loss": -10.994941711425781, "global_step": 173505, "epoch": 1032} {"train_loss": -11.176471710205078, "global_step": 173506, "epoch": 1032} {"train_loss": -10.96137809753418, "global_step": 173507, "epoch": 1032} {"train_loss": -11.305686950683594, "global_step": 173508, "epoch": 1032} {"train_loss": -10.756414413452148, "global_step": 173509, "epoch": 1032} {"train_loss": -10.896961212158203, "global_step": 173510, "epoch": 1032} {"train_loss": -11.066047668457031, "global_step": 173511, "epoch": 1032} {"train_loss": -11.275333404541016, "global_step": 173512, "epoch": 1032} {"train_loss": -11.136909484863281, "global_step": 173513, "epoch": 1032} {"train_loss": -11.247944831848145, "global_step": 173514, "epoch": 1032} {"train_loss": -11.280415534973145, "global_step": 173515, "epoch": 1032} {"train_loss": -10.997991561889648, "global_step": 173516, "epoch": 1032} {"train_loss": -11.231050491333008, "global_step": 173517, "epoch": 1032} {"train_loss": -11.317586898803711, "global_step": 173518, "epoch": 1032} {"train_loss": -11.112205505371094, "global_step": 173519, "epoch": 1032} {"train_loss": -11.356975555419922, "global_step": 173520, "epoch": 1032} {"train_loss": -10.524700164794922, "global_step": 173521, "epoch": 1032} {"train_loss": -11.417503356933594, "global_step": 173522, "epoch": 1032} {"train_loss": -10.725200653076172, "global_step": 173523, "epoch": 1032} {"train_loss": -11.126372337341309, "global_step": 173524, "epoch": 1032} {"train_loss": -10.598152160644531, "global_step": 173525, "epoch": 1032} {"train_loss": -11.102794647216797, "global_step": 173526, "epoch": 1032} {"train_loss": -10.893058776855469, "global_step": 173527, "epoch": 1032} {"train_loss": -10.938282012939453, "global_step": 173528, "epoch": 1032} {"train_loss": -10.96084976196289, "global_step": 173529, "epoch": 1032} {"train_loss": -10.944182395935059, "global_step": 173530, "epoch": 1032} {"train_loss": -10.674939155578613, "global_step": 173531, "epoch": 1032} {"train_loss": -10.627634048461914, "global_step": 173532, "epoch": 1032} {"train_loss": -10.256446838378906, "global_step": 173533, "epoch": 1032} {"train_loss": -11.09360122680664, "global_step": 173534, "epoch": 1032} {"train_loss": -10.504196166992188, "global_step": 173535, "epoch": 1032} {"train_loss": -11.164543151855469, "global_step": 173536, "epoch": 1032} {"train_loss": -10.670316696166992, "global_step": 173537, "epoch": 1032} {"train_loss": -10.79555606842041, "global_step": 173538, "epoch": 1032} {"train_loss": -10.636552810668945, "global_step": 173539, "epoch": 1032} {"train_loss": -10.241996765136719, "global_step": 173540, "epoch": 1032} {"train_loss": -11.064720153808594, "global_step": 173541, "epoch": 1032} {"train_loss": -9.618549346923828, "global_step": 173542, "epoch": 1032} {"train_loss": -10.925327352115087, "global_step": 173543, "epoch": 1032, "val_loss": 241847.203125} {"train_loss": -10.52374267578125, "global_step": 173544, "epoch": 1033} {"train_loss": -10.754143714904785, "global_step": 173545, "epoch": 1033} {"train_loss": -10.545526504516602, "global_step": 173546, "epoch": 1033} {"train_loss": -10.7074613571167, "global_step": 173547, "epoch": 1033} {"train_loss": -10.673654556274414, "global_step": 173548, "epoch": 1033} {"train_loss": -10.800725936889648, "global_step": 173549, "epoch": 1033} {"train_loss": -10.509571075439453, "global_step": 173550, "epoch": 1033} {"train_loss": -10.950515747070312, "global_step": 173551, "epoch": 1033} {"train_loss": -10.46273422241211, "global_step": 173552, "epoch": 1033} {"train_loss": -9.632734298706055, "global_step": 173553, "epoch": 1033} {"train_loss": -10.92961311340332, "global_step": 173554, "epoch": 1033} {"train_loss": -9.33464241027832, "global_step": 173555, "epoch": 1033} {"train_loss": -10.590584754943848, "global_step": 173556, "epoch": 1033} {"train_loss": -9.953056335449219, "global_step": 173557, "epoch": 1033} {"train_loss": -10.668684005737305, "global_step": 173558, "epoch": 1033} {"train_loss": -10.677257537841797, "global_step": 173559, "epoch": 1033} {"train_loss": -10.377510070800781, "global_step": 173560, "epoch": 1033} {"train_loss": -10.990524291992188, "global_step": 173561, "epoch": 1033} {"train_loss": -10.304226875305176, "global_step": 173562, "epoch": 1033} {"train_loss": -10.781288146972656, "global_step": 173563, "epoch": 1033} {"train_loss": -10.407833099365234, "global_step": 173564, "epoch": 1033} {"train_loss": -10.98790454864502, "global_step": 173565, "epoch": 1033} {"train_loss": -10.519392013549805, "global_step": 173566, "epoch": 1033} {"train_loss": -11.076095581054688, "global_step": 173567, "epoch": 1033} {"train_loss": -10.508321762084961, "global_step": 173568, "epoch": 1033} {"train_loss": -10.987480163574219, "global_step": 173569, "epoch": 1033} {"train_loss": -10.575347900390625, "global_step": 173570, "epoch": 1033} {"train_loss": -11.15099048614502, "global_step": 173571, "epoch": 1033} {"train_loss": -10.641225814819336, "global_step": 173572, "epoch": 1033} {"train_loss": -10.786592483520508, "global_step": 173573, "epoch": 1033} {"train_loss": -10.860234260559082, "global_step": 173574, "epoch": 1033} {"train_loss": -10.435587882995605, "global_step": 173575, "epoch": 1033} {"train_loss": -10.81375503540039, "global_step": 173576, "epoch": 1033} {"train_loss": -10.765296936035156, "global_step": 173577, "epoch": 1033} {"train_loss": -11.067390441894531, "global_step": 173578, "epoch": 1033} {"train_loss": -10.796574592590332, "global_step": 173579, "epoch": 1033} {"train_loss": -11.161327362060547, "global_step": 173580, "epoch": 1033} {"train_loss": -10.846071243286133, "global_step": 173581, "epoch": 1033} {"train_loss": -10.829446792602539, "global_step": 173582, "epoch": 1033} {"train_loss": -10.83398151397705, "global_step": 173583, "epoch": 1033} {"train_loss": -11.08993148803711, "global_step": 173584, "epoch": 1033} {"train_loss": -11.124678611755371, "global_step": 173585, "epoch": 1033} {"train_loss": -11.154090881347656, "global_step": 173586, "epoch": 1033} {"train_loss": -11.26229476928711, "global_step": 173587, "epoch": 1033} {"train_loss": -11.254755973815918, "global_step": 173588, "epoch": 1033} {"train_loss": -11.283465385437012, "global_step": 173589, "epoch": 1033} {"train_loss": -11.185800552368164, "global_step": 173590, "epoch": 1033} {"train_loss": -11.304445266723633, "global_step": 173591, "epoch": 1033} {"train_loss": -11.162527084350586, "global_step": 173592, "epoch": 1033} {"train_loss": -11.380168914794922, "global_step": 173593, "epoch": 1033} {"train_loss": -11.430316925048828, "global_step": 173594, "epoch": 1033} {"train_loss": -11.517848014831543, "global_step": 173595, "epoch": 1033} {"train_loss": -11.40169620513916, "global_step": 173596, "epoch": 1033} {"train_loss": -11.198064804077148, "global_step": 173597, "epoch": 1033} {"train_loss": -11.361226081848145, "global_step": 173598, "epoch": 1033} {"train_loss": -11.309639930725098, "global_step": 173599, "epoch": 1033} {"train_loss": -11.31895637512207, "global_step": 173600, "epoch": 1033} {"train_loss": -11.205735206604004, "global_step": 173601, "epoch": 1033} {"train_loss": -11.54705810546875, "global_step": 173602, "epoch": 1033} {"train_loss": -11.140397071838379, "global_step": 173603, "epoch": 1033} {"train_loss": -11.151328086853027, "global_step": 173604, "epoch": 1033} {"train_loss": -11.287870407104492, "global_step": 173605, "epoch": 1033} {"train_loss": -11.311702728271484, "global_step": 173606, "epoch": 1033} {"train_loss": -11.482555389404297, "global_step": 173607, "epoch": 1033} {"train_loss": -11.245296478271484, "global_step": 173608, "epoch": 1033} {"train_loss": -11.297721862792969, "global_step": 173609, "epoch": 1033} {"train_loss": -11.426549911499023, "global_step": 173610, "epoch": 1033} {"train_loss": -11.329620361328125, "global_step": 173611, "epoch": 1033} {"train_loss": -11.436944961547852, "global_step": 173612, "epoch": 1033} {"train_loss": -11.504429817199707, "global_step": 173613, "epoch": 1033} {"train_loss": -11.409764289855957, "global_step": 173614, "epoch": 1033} {"train_loss": -11.459968566894531, "global_step": 173615, "epoch": 1033} {"train_loss": -11.36628532409668, "global_step": 173616, "epoch": 1033} {"train_loss": -11.364971160888672, "global_step": 173617, "epoch": 1033} {"train_loss": -11.260875701904297, "global_step": 173618, "epoch": 1033} {"train_loss": -11.55793571472168, "global_step": 173619, "epoch": 1033} {"train_loss": -11.232643127441406, "global_step": 173620, "epoch": 1033} {"train_loss": -11.504287719726562, "global_step": 173621, "epoch": 1033} {"train_loss": -11.327478408813477, "global_step": 173622, "epoch": 1033} {"train_loss": -11.490079879760742, "global_step": 173623, "epoch": 1033} {"train_loss": -11.44345474243164, "global_step": 173624, "epoch": 1033} {"train_loss": -11.232278823852539, "global_step": 173625, "epoch": 1033} {"train_loss": -10.914536476135254, "global_step": 173626, "epoch": 1033} {"train_loss": -10.844406127929688, "global_step": 173627, "epoch": 1033} {"train_loss": -11.210277557373047, "global_step": 173628, "epoch": 1033} {"train_loss": -10.815265655517578, "global_step": 173629, "epoch": 1033} {"train_loss": -10.844308853149414, "global_step": 173630, "epoch": 1033} {"train_loss": -10.771700859069824, "global_step": 173631, "epoch": 1033} {"train_loss": -11.160128593444824, "global_step": 173632, "epoch": 1033} {"train_loss": -10.827156066894531, "global_step": 173633, "epoch": 1033} {"train_loss": -10.78266716003418, "global_step": 173634, "epoch": 1033} {"train_loss": -10.83830738067627, "global_step": 173635, "epoch": 1033} {"train_loss": -10.053146362304688, "global_step": 173636, "epoch": 1033} {"train_loss": -10.368577003479004, "global_step": 173637, "epoch": 1033} {"train_loss": -10.57658576965332, "global_step": 173638, "epoch": 1033} {"train_loss": -11.105314254760742, "global_step": 173639, "epoch": 1033} {"train_loss": -10.257962226867676, "global_step": 173640, "epoch": 1033} {"train_loss": -10.81326675415039, "global_step": 173641, "epoch": 1033} {"train_loss": -10.729618072509766, "global_step": 173642, "epoch": 1033} {"train_loss": -10.291202545166016, "global_step": 173643, "epoch": 1033} {"train_loss": -10.727837562561035, "global_step": 173644, "epoch": 1033} {"train_loss": -11.099274635314941, "global_step": 173645, "epoch": 1033} {"train_loss": -10.764111518859863, "global_step": 173646, "epoch": 1033} {"train_loss": -10.79476261138916, "global_step": 173647, "epoch": 1033} {"train_loss": -10.684548377990723, "global_step": 173648, "epoch": 1033} {"train_loss": -10.47391128540039, "global_step": 173649, "epoch": 1033} {"train_loss": -11.046537399291992, "global_step": 173650, "epoch": 1033} {"train_loss": -11.085394859313965, "global_step": 173651, "epoch": 1033} {"train_loss": -10.58243179321289, "global_step": 173652, "epoch": 1033} {"train_loss": -10.805931091308594, "global_step": 173653, "epoch": 1033} {"train_loss": -11.043901443481445, "global_step": 173654, "epoch": 1033} {"train_loss": -10.91622543334961, "global_step": 173655, "epoch": 1033} {"train_loss": -11.15423583984375, "global_step": 173656, "epoch": 1033} {"train_loss": -11.126256942749023, "global_step": 173657, "epoch": 1033} {"train_loss": -10.879203796386719, "global_step": 173658, "epoch": 1033} {"train_loss": -10.825352668762207, "global_step": 173659, "epoch": 1033} {"train_loss": -10.583898544311523, "global_step": 173660, "epoch": 1033} {"train_loss": -10.8704195022583, "global_step": 173661, "epoch": 1033} {"train_loss": -11.064409255981445, "global_step": 173662, "epoch": 1033} {"train_loss": -10.666431427001953, "global_step": 173663, "epoch": 1033} {"train_loss": -11.113937377929688, "global_step": 173664, "epoch": 1033} {"train_loss": -10.85389232635498, "global_step": 173665, "epoch": 1033} {"train_loss": -11.05734634399414, "global_step": 173666, "epoch": 1033} {"train_loss": -10.864362716674805, "global_step": 173667, "epoch": 1033} {"train_loss": -10.967950820922852, "global_step": 173668, "epoch": 1033} {"train_loss": -10.965219497680664, "global_step": 173669, "epoch": 1033} {"train_loss": -10.765762329101562, "global_step": 173670, "epoch": 1033} {"train_loss": -11.161094665527344, "global_step": 173671, "epoch": 1033} {"train_loss": -10.954191207885742, "global_step": 173672, "epoch": 1033} {"train_loss": -10.935547828674316, "global_step": 173673, "epoch": 1033} {"train_loss": -10.92120361328125, "global_step": 173674, "epoch": 1033} {"train_loss": -10.968013763427734, "global_step": 173675, "epoch": 1033} {"train_loss": -11.032108306884766, "global_step": 173676, "epoch": 1033} {"train_loss": -11.063392639160156, "global_step": 173677, "epoch": 1033} {"train_loss": -10.772424697875977, "global_step": 173678, "epoch": 1033} {"train_loss": -11.237337112426758, "global_step": 173679, "epoch": 1033} {"train_loss": -10.828834533691406, "global_step": 173680, "epoch": 1033} {"train_loss": -11.229569435119629, "global_step": 173681, "epoch": 1033} {"train_loss": -10.894268035888672, "global_step": 173682, "epoch": 1033} {"train_loss": -11.274858474731445, "global_step": 173683, "epoch": 1033} {"train_loss": -10.97789192199707, "global_step": 173684, "epoch": 1033} {"train_loss": -10.981151580810547, "global_step": 173685, "epoch": 1033} {"train_loss": -11.02128791809082, "global_step": 173686, "epoch": 1033} {"train_loss": -10.818452835083008, "global_step": 173687, "epoch": 1033} {"train_loss": -11.02409839630127, "global_step": 173688, "epoch": 1033} {"train_loss": -10.796318054199219, "global_step": 173689, "epoch": 1033} {"train_loss": -11.148536682128906, "global_step": 173690, "epoch": 1033} {"train_loss": -10.557645797729492, "global_step": 173691, "epoch": 1033} {"train_loss": -11.042000770568848, "global_step": 173692, "epoch": 1033} {"train_loss": -10.740516662597656, "global_step": 173693, "epoch": 1033} {"train_loss": -10.524921417236328, "global_step": 173694, "epoch": 1033} {"train_loss": -11.045721054077148, "global_step": 173695, "epoch": 1033} {"train_loss": -10.309181213378906, "global_step": 173696, "epoch": 1033} {"train_loss": -10.90008544921875, "global_step": 173697, "epoch": 1033} {"train_loss": -10.680376052856445, "global_step": 173698, "epoch": 1033} {"train_loss": -10.86482048034668, "global_step": 173699, "epoch": 1033} {"train_loss": -10.728238105773926, "global_step": 173700, "epoch": 1033} {"train_loss": -11.013374328613281, "global_step": 173701, "epoch": 1033} {"train_loss": -10.905786514282227, "global_step": 173702, "epoch": 1033} {"train_loss": -10.843194007873535, "global_step": 173703, "epoch": 1033} {"train_loss": -10.853482246398926, "global_step": 173704, "epoch": 1033} {"train_loss": -10.532450675964355, "global_step": 173705, "epoch": 1033} {"train_loss": -10.451242446899414, "global_step": 173706, "epoch": 1033} {"train_loss": -10.715819358825684, "global_step": 173707, "epoch": 1033} {"train_loss": -11.107940673828125, "global_step": 173708, "epoch": 1033} {"train_loss": -10.510724067687988, "global_step": 173709, "epoch": 1033} {"train_loss": -10.991449356079102, "global_step": 173710, "epoch": 1033} {"train_loss": -10.92371516000657, "global_step": 173711, "epoch": 1033, "val_loss": 240123.546875} {"train_loss": -10.901182174682617, "global_step": 173712, "epoch": 1034} {"train_loss": -10.999876022338867, "global_step": 173713, "epoch": 1034} {"train_loss": -10.864538192749023, "global_step": 173714, "epoch": 1034} {"train_loss": -11.039505004882812, "global_step": 173715, "epoch": 1034} {"train_loss": -11.208520889282227, "global_step": 173716, "epoch": 1034} {"train_loss": -11.143292427062988, "global_step": 173717, "epoch": 1034} {"train_loss": -11.229171752929688, "global_step": 173718, "epoch": 1034} {"train_loss": -11.08626937866211, "global_step": 173719, "epoch": 1034} {"train_loss": -11.234519958496094, "global_step": 173720, "epoch": 1034} {"train_loss": -10.948610305786133, "global_step": 173721, "epoch": 1034} {"train_loss": -11.123882293701172, "global_step": 173722, "epoch": 1034} {"train_loss": -10.986172676086426, "global_step": 173723, "epoch": 1034} {"train_loss": -11.322500228881836, "global_step": 173724, "epoch": 1034} {"train_loss": -11.258394241333008, "global_step": 173725, "epoch": 1034} {"train_loss": -11.163949012756348, "global_step": 173726, "epoch": 1034} {"train_loss": -11.450641632080078, "global_step": 173727, "epoch": 1034} {"train_loss": -11.216937065124512, "global_step": 173728, "epoch": 1034} {"train_loss": -11.075749397277832, "global_step": 173729, "epoch": 1034} {"train_loss": -11.305699348449707, "global_step": 173730, "epoch": 1034} {"train_loss": -10.94325065612793, "global_step": 173731, "epoch": 1034} {"train_loss": -11.387784957885742, "global_step": 173732, "epoch": 1034} {"train_loss": -11.219669342041016, "global_step": 173733, "epoch": 1034} {"train_loss": -11.257041931152344, "global_step": 173734, "epoch": 1034} {"train_loss": -11.288188934326172, "global_step": 173735, "epoch": 1034} {"train_loss": -11.1204833984375, "global_step": 173736, "epoch": 1034} {"train_loss": -11.220130920410156, "global_step": 173737, "epoch": 1034} {"train_loss": -11.119967460632324, "global_step": 173738, "epoch": 1034} {"train_loss": -11.413307189941406, "global_step": 173739, "epoch": 1034} {"train_loss": -11.17300033569336, "global_step": 173740, "epoch": 1034} {"train_loss": -11.055208206176758, "global_step": 173741, "epoch": 1034} {"train_loss": -11.210176467895508, "global_step": 173742, "epoch": 1034} {"train_loss": -10.826726913452148, "global_step": 173743, "epoch": 1034} {"train_loss": -11.195347785949707, "global_step": 173744, "epoch": 1034} {"train_loss": -11.048645973205566, "global_step": 173745, "epoch": 1034} {"train_loss": -11.258209228515625, "global_step": 173746, "epoch": 1034} {"train_loss": -11.381589889526367, "global_step": 173747, "epoch": 1034} {"train_loss": -11.27772331237793, "global_step": 173748, "epoch": 1034} {"train_loss": -11.248523712158203, "global_step": 173749, "epoch": 1034} {"train_loss": -11.30065631866455, "global_step": 173750, "epoch": 1034} {"train_loss": -11.169692993164062, "global_step": 173751, "epoch": 1034} {"train_loss": -11.0286865234375, "global_step": 173752, "epoch": 1034} {"train_loss": -11.309412956237793, "global_step": 173753, "epoch": 1034} {"train_loss": -11.099952697753906, "global_step": 173754, "epoch": 1034} {"train_loss": -11.025957107543945, "global_step": 173755, "epoch": 1034} {"train_loss": -11.261280059814453, "global_step": 173756, "epoch": 1034} {"train_loss": -10.75617790222168, "global_step": 173757, "epoch": 1034} {"train_loss": -11.278249740600586, "global_step": 173758, "epoch": 1034} {"train_loss": -10.49794864654541, "global_step": 173759, "epoch": 1034} {"train_loss": -10.267803192138672, "global_step": 173760, "epoch": 1034} {"train_loss": -10.644547462463379, "global_step": 173761, "epoch": 1034} {"train_loss": -10.911163330078125, "global_step": 173762, "epoch": 1034} {"train_loss": -10.133198738098145, "global_step": 173763, "epoch": 1034} {"train_loss": -10.9968900680542, "global_step": 173764, "epoch": 1034} {"train_loss": -10.517729759216309, "global_step": 173765, "epoch": 1034} {"train_loss": -10.332719802856445, "global_step": 173766, "epoch": 1034} {"train_loss": -10.946624755859375, "global_step": 173767, "epoch": 1034} {"train_loss": -10.420904159545898, "global_step": 173768, "epoch": 1034} {"train_loss": -10.48277759552002, "global_step": 173769, "epoch": 1034} {"train_loss": -10.321290016174316, "global_step": 173770, "epoch": 1034} {"train_loss": -10.269652366638184, "global_step": 173771, "epoch": 1034} {"train_loss": -11.0706205368042, "global_step": 173772, "epoch": 1034} {"train_loss": -10.720746040344238, "global_step": 173773, "epoch": 1034} {"train_loss": -10.77000617980957, "global_step": 173774, "epoch": 1034} {"train_loss": -10.720060348510742, "global_step": 173775, "epoch": 1034} {"train_loss": -10.876710891723633, "global_step": 173776, "epoch": 1034} {"train_loss": -11.074329376220703, "global_step": 173777, "epoch": 1034} {"train_loss": -10.574052810668945, "global_step": 173778, "epoch": 1034} {"train_loss": -11.111865043640137, "global_step": 173779, "epoch": 1034} {"train_loss": -10.99339485168457, "global_step": 173780, "epoch": 1034} {"train_loss": -10.72518539428711, "global_step": 173781, "epoch": 1034} {"train_loss": -11.200623512268066, "global_step": 173782, "epoch": 1034} {"train_loss": -10.705236434936523, "global_step": 173783, "epoch": 1034} {"train_loss": -10.945115089416504, "global_step": 173784, "epoch": 1034} {"train_loss": -11.051921844482422, "global_step": 173785, "epoch": 1034} {"train_loss": -11.012373924255371, "global_step": 173786, "epoch": 1034} {"train_loss": -10.95073127746582, "global_step": 173787, "epoch": 1034} {"train_loss": -11.091123580932617, "global_step": 173788, "epoch": 1034} {"train_loss": -10.738162994384766, "global_step": 173789, "epoch": 1034} {"train_loss": -10.929773330688477, "global_step": 173790, "epoch": 1034} {"train_loss": -10.887701034545898, "global_step": 173791, "epoch": 1034} {"train_loss": -11.30046558380127, "global_step": 173792, "epoch": 1034} {"train_loss": -11.068087577819824, "global_step": 173793, "epoch": 1034} {"train_loss": -11.255971908569336, "global_step": 173794, "epoch": 1034} {"train_loss": -10.897337913513184, "global_step": 173795, "epoch": 1034} {"train_loss": -11.322137832641602, "global_step": 173796, "epoch": 1034} {"train_loss": -10.716651916503906, "global_step": 173797, "epoch": 1034} {"train_loss": -10.641777038574219, "global_step": 173798, "epoch": 1034} {"train_loss": -11.130215644836426, "global_step": 173799, "epoch": 1034} {"train_loss": -10.105376243591309, "global_step": 173800, "epoch": 1034} {"train_loss": -11.134157180786133, "global_step": 173801, "epoch": 1034} {"train_loss": -10.516216278076172, "global_step": 173802, "epoch": 1034} {"train_loss": -11.142099380493164, "global_step": 173803, "epoch": 1034} {"train_loss": -10.785694122314453, "global_step": 173804, "epoch": 1034} {"train_loss": -11.066770553588867, "global_step": 173805, "epoch": 1034} {"train_loss": -11.270572662353516, "global_step": 173806, "epoch": 1034} {"train_loss": -10.891871452331543, "global_step": 173807, "epoch": 1034} {"train_loss": -11.257173538208008, "global_step": 173808, "epoch": 1034} {"train_loss": -11.100807189941406, "global_step": 173809, "epoch": 1034} {"train_loss": -11.238388061523438, "global_step": 173810, "epoch": 1034} {"train_loss": -11.203554153442383, "global_step": 173811, "epoch": 1034} {"train_loss": -10.721866607666016, "global_step": 173812, "epoch": 1034} {"train_loss": -11.200540542602539, "global_step": 173813, "epoch": 1034} {"train_loss": -11.063892364501953, "global_step": 173814, "epoch": 1034} {"train_loss": -11.120580673217773, "global_step": 173815, "epoch": 1034} {"train_loss": -11.453603744506836, "global_step": 173816, "epoch": 1034} {"train_loss": -11.221161842346191, "global_step": 173817, "epoch": 1034} {"train_loss": -11.363622665405273, "global_step": 173818, "epoch": 1034} {"train_loss": -11.08749008178711, "global_step": 173819, "epoch": 1034} {"train_loss": -11.445735931396484, "global_step": 173820, "epoch": 1034} {"train_loss": -10.875943183898926, "global_step": 173821, "epoch": 1034} {"train_loss": -11.130411148071289, "global_step": 173822, "epoch": 1034} {"train_loss": -11.029106140136719, "global_step": 173823, "epoch": 1034} {"train_loss": -11.140482902526855, "global_step": 173824, "epoch": 1034} {"train_loss": -11.121241569519043, "global_step": 173825, "epoch": 1034} {"train_loss": -11.282136917114258, "global_step": 173826, "epoch": 1034} {"train_loss": -11.186592102050781, "global_step": 173827, "epoch": 1034} {"train_loss": -11.279317855834961, "global_step": 173828, "epoch": 1034} {"train_loss": -11.108236312866211, "global_step": 173829, "epoch": 1034} {"train_loss": -11.068106651306152, "global_step": 173830, "epoch": 1034} {"train_loss": -10.655416488647461, "global_step": 173831, "epoch": 1034} {"train_loss": -10.741844177246094, "global_step": 173832, "epoch": 1034} {"train_loss": -11.006521224975586, "global_step": 173833, "epoch": 1034} {"train_loss": -10.720823287963867, "global_step": 173834, "epoch": 1034} {"train_loss": -11.065277099609375, "global_step": 173835, "epoch": 1034} {"train_loss": -10.480962753295898, "global_step": 173836, "epoch": 1034} {"train_loss": -11.178001403808594, "global_step": 173837, "epoch": 1034} {"train_loss": -10.516616821289062, "global_step": 173838, "epoch": 1034} {"train_loss": -11.339178085327148, "global_step": 173839, "epoch": 1034} {"train_loss": -10.615055084228516, "global_step": 173840, "epoch": 1034} {"train_loss": -10.572888374328613, "global_step": 173841, "epoch": 1034} {"train_loss": -11.291622161865234, "global_step": 173842, "epoch": 1034} {"train_loss": -10.703824043273926, "global_step": 173843, "epoch": 1034} {"train_loss": -10.996660232543945, "global_step": 173844, "epoch": 1034} {"train_loss": -10.710527420043945, "global_step": 173845, "epoch": 1034} {"train_loss": -11.092878341674805, "global_step": 173846, "epoch": 1034} {"train_loss": -10.886517524719238, "global_step": 173847, "epoch": 1034} {"train_loss": -11.19972038269043, "global_step": 173848, "epoch": 1034} {"train_loss": -11.065776824951172, "global_step": 173849, "epoch": 1034} {"train_loss": -11.204465866088867, "global_step": 173850, "epoch": 1034} {"train_loss": -11.249641418457031, "global_step": 173851, "epoch": 1034} {"train_loss": -11.134265899658203, "global_step": 173852, "epoch": 1034} {"train_loss": -11.222575187683105, "global_step": 173853, "epoch": 1034} {"train_loss": -11.174897193908691, "global_step": 173854, "epoch": 1034} {"train_loss": -10.925798416137695, "global_step": 173855, "epoch": 1034} {"train_loss": -10.771276473999023, "global_step": 173856, "epoch": 1034} {"train_loss": -10.679893493652344, "global_step": 173857, "epoch": 1034} {"train_loss": -10.231629371643066, "global_step": 173858, "epoch": 1034} {"train_loss": -10.928815841674805, "global_step": 173859, "epoch": 1034} {"train_loss": -9.84979248046875, "global_step": 173860, "epoch": 1034} {"train_loss": -10.428709983825684, "global_step": 173861, "epoch": 1034} {"train_loss": -10.8223876953125, "global_step": 173862, "epoch": 1034} {"train_loss": -10.37863826751709, "global_step": 173863, "epoch": 1034} {"train_loss": -11.037528991699219, "global_step": 173864, "epoch": 1034} {"train_loss": -10.067626953125, "global_step": 173865, "epoch": 1034} {"train_loss": -10.8746337890625, "global_step": 173866, "epoch": 1034} {"train_loss": -10.522237777709961, "global_step": 173867, "epoch": 1034} {"train_loss": -10.875629425048828, "global_step": 173868, "epoch": 1034} {"train_loss": -10.584598541259766, "global_step": 173869, "epoch": 1034} {"train_loss": -10.428373336791992, "global_step": 173870, "epoch": 1034} {"train_loss": -10.434432983398438, "global_step": 173871, "epoch": 1034} {"train_loss": -10.085733413696289, "global_step": 173872, "epoch": 1034} {"train_loss": -10.632638931274414, "global_step": 173873, "epoch": 1034} {"train_loss": -9.71536636352539, "global_step": 173874, "epoch": 1034} {"train_loss": -10.7225341796875, "global_step": 173875, "epoch": 1034} {"train_loss": -9.90108871459961, "global_step": 173876, "epoch": 1034} {"train_loss": -10.90522575378418, "global_step": 173877, "epoch": 1034} {"train_loss": -10.159884452819824, "global_step": 173878, "epoch": 1034} {"train_loss": -10.930393871806917, "global_step": 173879, "epoch": 1034, "val_loss": 241372.390625} {"train_loss": -10.429101943969727, "global_step": 173880, "epoch": 1035} {"train_loss": -10.260414123535156, "global_step": 173881, "epoch": 1035} {"train_loss": -10.333749771118164, "global_step": 173882, "epoch": 1035} {"train_loss": -10.790305137634277, "global_step": 173883, "epoch": 1035} {"train_loss": -9.942094802856445, "global_step": 173884, "epoch": 1035} {"train_loss": -10.406448364257812, "global_step": 173885, "epoch": 1035} {"train_loss": -10.713151931762695, "global_step": 173886, "epoch": 1035} {"train_loss": -10.693135261535645, "global_step": 173887, "epoch": 1035} {"train_loss": -10.414056777954102, "global_step": 173888, "epoch": 1035} {"train_loss": -10.896745681762695, "global_step": 173889, "epoch": 1035} {"train_loss": -10.454740524291992, "global_step": 173890, "epoch": 1035} {"train_loss": -10.896347045898438, "global_step": 173891, "epoch": 1035} {"train_loss": -10.956578254699707, "global_step": 173892, "epoch": 1035} {"train_loss": -10.549694061279297, "global_step": 173893, "epoch": 1035} {"train_loss": -10.913707733154297, "global_step": 173894, "epoch": 1035} {"train_loss": -10.615726470947266, "global_step": 173895, "epoch": 1035} {"train_loss": -10.998335838317871, "global_step": 173896, "epoch": 1035} {"train_loss": -10.805578231811523, "global_step": 173897, "epoch": 1035} {"train_loss": -10.692326545715332, "global_step": 173898, "epoch": 1035} {"train_loss": -10.878299713134766, "global_step": 173899, "epoch": 1035} {"train_loss": -11.073446273803711, "global_step": 173900, "epoch": 1035} {"train_loss": -10.812850952148438, "global_step": 173901, "epoch": 1035} {"train_loss": -11.087358474731445, "global_step": 173902, "epoch": 1035} {"train_loss": -10.96989631652832, "global_step": 173903, "epoch": 1035} {"train_loss": -11.01171588897705, "global_step": 173904, "epoch": 1035} {"train_loss": -11.217777252197266, "global_step": 173905, "epoch": 1035} {"train_loss": -10.880081176757812, "global_step": 173906, "epoch": 1035} {"train_loss": -11.025527954101562, "global_step": 173907, "epoch": 1035} {"train_loss": -11.049644470214844, "global_step": 173908, "epoch": 1035} {"train_loss": -10.934988021850586, "global_step": 173909, "epoch": 1035} {"train_loss": -10.973075866699219, "global_step": 173910, "epoch": 1035} {"train_loss": -11.090173721313477, "global_step": 173911, "epoch": 1035} {"train_loss": -10.911993026733398, "global_step": 173912, "epoch": 1035} {"train_loss": -11.116212844848633, "global_step": 173913, "epoch": 1035} {"train_loss": -11.203216552734375, "global_step": 173914, "epoch": 1035} {"train_loss": -11.082381248474121, "global_step": 173915, "epoch": 1035} {"train_loss": -10.960042953491211, "global_step": 173916, "epoch": 1035} {"train_loss": -11.138091087341309, "global_step": 173917, "epoch": 1035} {"train_loss": -10.869998931884766, "global_step": 173918, "epoch": 1035} {"train_loss": -11.44516658782959, "global_step": 173919, "epoch": 1035} {"train_loss": -10.708213806152344, "global_step": 173920, "epoch": 1035} {"train_loss": -11.223371505737305, "global_step": 173921, "epoch": 1035} {"train_loss": -10.766359329223633, "global_step": 173922, "epoch": 1035} {"train_loss": -11.312772750854492, "global_step": 173923, "epoch": 1035} {"train_loss": -10.840702056884766, "global_step": 173924, "epoch": 1035} {"train_loss": -11.275715827941895, "global_step": 173925, "epoch": 1035} {"train_loss": -10.84958553314209, "global_step": 173926, "epoch": 1035} {"train_loss": -10.721134185791016, "global_step": 173927, "epoch": 1035} {"train_loss": -11.259544372558594, "global_step": 173928, "epoch": 1035} {"train_loss": -11.068914413452148, "global_step": 173929, "epoch": 1035} {"train_loss": -11.026573181152344, "global_step": 173930, "epoch": 1035} {"train_loss": -11.2963228225708, "global_step": 173931, "epoch": 1035} {"train_loss": -10.989360809326172, "global_step": 173932, "epoch": 1035} {"train_loss": -11.375457763671875, "global_step": 173933, "epoch": 1035} {"train_loss": -11.188337326049805, "global_step": 173934, "epoch": 1035} {"train_loss": -11.371906280517578, "global_step": 173935, "epoch": 1035} {"train_loss": -11.30681324005127, "global_step": 173936, "epoch": 1035} {"train_loss": -11.119016647338867, "global_step": 173937, "epoch": 1035} {"train_loss": -11.417264938354492, "global_step": 173938, "epoch": 1035} {"train_loss": -11.131267547607422, "global_step": 173939, "epoch": 1035} {"train_loss": -11.332889556884766, "global_step": 173940, "epoch": 1035} {"train_loss": -11.402490615844727, "global_step": 173941, "epoch": 1035} {"train_loss": -11.50752067565918, "global_step": 173942, "epoch": 1035} {"train_loss": -11.468694686889648, "global_step": 173943, "epoch": 1035} {"train_loss": -11.343572616577148, "global_step": 173944, "epoch": 1035} {"train_loss": -11.497271537780762, "global_step": 173945, "epoch": 1035} {"train_loss": -11.2822265625, "global_step": 173946, "epoch": 1035} {"train_loss": -11.571686744689941, "global_step": 173947, "epoch": 1035} {"train_loss": -11.29544448852539, "global_step": 173948, "epoch": 1035} {"train_loss": -11.401491165161133, "global_step": 173949, "epoch": 1035} {"train_loss": -11.319622039794922, "global_step": 173950, "epoch": 1035} {"train_loss": -11.219770431518555, "global_step": 173951, "epoch": 1035} {"train_loss": -11.338485717773438, "global_step": 173952, "epoch": 1035} {"train_loss": -11.162883758544922, "global_step": 173953, "epoch": 1035} {"train_loss": -11.52072525024414, "global_step": 173954, "epoch": 1035} {"train_loss": -11.139930725097656, "global_step": 173955, "epoch": 1035} {"train_loss": -11.252915382385254, "global_step": 173956, "epoch": 1035} {"train_loss": -11.155332565307617, "global_step": 173957, "epoch": 1035} {"train_loss": -11.221303939819336, "global_step": 173958, "epoch": 1035} {"train_loss": -10.865535736083984, "global_step": 173959, "epoch": 1035} {"train_loss": -11.096912384033203, "global_step": 173960, "epoch": 1035} {"train_loss": -10.95150375366211, "global_step": 173961, "epoch": 1035} {"train_loss": -11.506265640258789, "global_step": 173962, "epoch": 1035} {"train_loss": -11.292960166931152, "global_step": 173963, "epoch": 1035} {"train_loss": -11.353574752807617, "global_step": 173964, "epoch": 1035} {"train_loss": -11.178384780883789, "global_step": 173965, "epoch": 1035} {"train_loss": -11.303360939025879, "global_step": 173966, "epoch": 1035} {"train_loss": -10.983431816101074, "global_step": 173967, "epoch": 1035} {"train_loss": -11.192987442016602, "global_step": 173968, "epoch": 1035} {"train_loss": -11.488465309143066, "global_step": 173969, "epoch": 1035} {"train_loss": -10.461759567260742, "global_step": 173970, "epoch": 1035} {"train_loss": -10.810205459594727, "global_step": 173971, "epoch": 1035} {"train_loss": -11.18887710571289, "global_step": 173972, "epoch": 1035} {"train_loss": -11.092833518981934, "global_step": 173973, "epoch": 1035} {"train_loss": -10.989492416381836, "global_step": 173974, "epoch": 1035} {"train_loss": -11.52234935760498, "global_step": 173975, "epoch": 1035} {"train_loss": -11.400955200195312, "global_step": 173976, "epoch": 1035} {"train_loss": -11.08841323852539, "global_step": 173977, "epoch": 1035} {"train_loss": -11.101954460144043, "global_step": 173978, "epoch": 1035} {"train_loss": -11.242959976196289, "global_step": 173979, "epoch": 1035} {"train_loss": -10.926788330078125, "global_step": 173980, "epoch": 1035} {"train_loss": -11.387195587158203, "global_step": 173981, "epoch": 1035} {"train_loss": -11.28905200958252, "global_step": 173982, "epoch": 1035} {"train_loss": -10.928167343139648, "global_step": 173983, "epoch": 1035} {"train_loss": -11.382606506347656, "global_step": 173984, "epoch": 1035} {"train_loss": -10.61734390258789, "global_step": 173985, "epoch": 1035} {"train_loss": -11.102325439453125, "global_step": 173986, "epoch": 1035} {"train_loss": -10.896883010864258, "global_step": 173987, "epoch": 1035} {"train_loss": -10.970904350280762, "global_step": 173988, "epoch": 1035} {"train_loss": -11.139516830444336, "global_step": 173989, "epoch": 1035} {"train_loss": -10.849111557006836, "global_step": 173990, "epoch": 1035} {"train_loss": -10.941454887390137, "global_step": 173991, "epoch": 1035} {"train_loss": -11.228035926818848, "global_step": 173992, "epoch": 1035} {"train_loss": -11.232525825500488, "global_step": 173993, "epoch": 1035} {"train_loss": -10.974617004394531, "global_step": 173994, "epoch": 1035} {"train_loss": -10.939153671264648, "global_step": 173995, "epoch": 1035} {"train_loss": -10.781425476074219, "global_step": 173996, "epoch": 1035} {"train_loss": -10.329814910888672, "global_step": 173997, "epoch": 1035} {"train_loss": -11.137306213378906, "global_step": 173998, "epoch": 1035} {"train_loss": -10.860344886779785, "global_step": 173999, "epoch": 1035} {"train_loss": -10.983461380004883, "global_step": 174000, "epoch": 1035} {"train_loss": -10.721162796020508, "global_step": 174001, "epoch": 1035} {"train_loss": -10.592914581298828, "global_step": 174002, "epoch": 1035} {"train_loss": -8.540267944335938, "global_step": 174003, "epoch": 1035} {"train_loss": -11.28941535949707, "global_step": 174004, "epoch": 1035} {"train_loss": -10.212045669555664, "global_step": 174005, "epoch": 1035} {"train_loss": -9.828093528747559, "global_step": 174006, "epoch": 1035} {"train_loss": -10.943929672241211, "global_step": 174007, "epoch": 1035} {"train_loss": -8.776668548583984, "global_step": 174008, "epoch": 1035} {"train_loss": -9.841968536376953, "global_step": 174009, "epoch": 1035} {"train_loss": -10.821672439575195, "global_step": 174010, "epoch": 1035} {"train_loss": -9.582171440124512, "global_step": 174011, "epoch": 1035} {"train_loss": -10.507331848144531, "global_step": 174012, "epoch": 1035} {"train_loss": -10.44206428527832, "global_step": 174013, "epoch": 1035} {"train_loss": -9.93045711517334, "global_step": 174014, "epoch": 1035} {"train_loss": -10.226827621459961, "global_step": 174015, "epoch": 1035} {"train_loss": -9.23387336730957, "global_step": 174016, "epoch": 1035} {"train_loss": -9.772553443908691, "global_step": 174017, "epoch": 1035} {"train_loss": -9.621369361877441, "global_step": 174018, "epoch": 1035} {"train_loss": -10.152729034423828, "global_step": 174019, "epoch": 1035} {"train_loss": -9.842388153076172, "global_step": 174020, "epoch": 1035} {"train_loss": -10.43159008026123, "global_step": 174021, "epoch": 1035} {"train_loss": -10.238008499145508, "global_step": 174022, "epoch": 1035} {"train_loss": -10.74625301361084, "global_step": 174023, "epoch": 1035} {"train_loss": -11.087204933166504, "global_step": 174024, "epoch": 1035} {"train_loss": -10.39938735961914, "global_step": 174025, "epoch": 1035} {"train_loss": -10.60534381866455, "global_step": 174026, "epoch": 1035} {"train_loss": -10.665254592895508, "global_step": 174027, "epoch": 1035} {"train_loss": -10.537214279174805, "global_step": 174028, "epoch": 1035} {"train_loss": -10.862325668334961, "global_step": 174029, "epoch": 1035} {"train_loss": -10.739686965942383, "global_step": 174030, "epoch": 1035} {"train_loss": -10.614991188049316, "global_step": 174031, "epoch": 1035} {"train_loss": -10.991573333740234, "global_step": 174032, "epoch": 1035} {"train_loss": -10.861620903015137, "global_step": 174033, "epoch": 1035} {"train_loss": -11.022167205810547, "global_step": 174034, "epoch": 1035} {"train_loss": -10.76241397857666, "global_step": 174035, "epoch": 1035} {"train_loss": -10.957986831665039, "global_step": 174036, "epoch": 1035} {"train_loss": -11.018326759338379, "global_step": 174037, "epoch": 1035} {"train_loss": -10.864789009094238, "global_step": 174038, "epoch": 1035} {"train_loss": -10.898807525634766, "global_step": 174039, "epoch": 1035} {"train_loss": -10.863042831420898, "global_step": 174040, "epoch": 1035} {"train_loss": -11.056999206542969, "global_step": 174041, "epoch": 1035} {"train_loss": -11.000850677490234, "global_step": 174042, "epoch": 1035} {"train_loss": -11.00307559967041, "global_step": 174043, "epoch": 1035} {"train_loss": -10.975648880004883, "global_step": 174044, "epoch": 1035} {"train_loss": -11.286659240722656, "global_step": 174045, "epoch": 1035} {"train_loss": -10.94396686553955, "global_step": 174046, "epoch": 1035} {"train_loss": -10.890922137669154, "global_step": 174047, "epoch": 1035, "val_loss": 229516.234375, "train_action_mse_error": 2.098525047302246} {"train_loss": -11.134862899780273, "global_step": 174048, "epoch": 1036} {"train_loss": -10.732280731201172, "global_step": 174049, "epoch": 1036} {"train_loss": -10.926008224487305, "global_step": 174050, "epoch": 1036} {"train_loss": -11.016918182373047, "global_step": 174051, "epoch": 1036} {"train_loss": -11.276089668273926, "global_step": 174052, "epoch": 1036} {"train_loss": -11.113887786865234, "global_step": 174053, "epoch": 1036} {"train_loss": -11.260292053222656, "global_step": 174054, "epoch": 1036} {"train_loss": -10.971694946289062, "global_step": 174055, "epoch": 1036} {"train_loss": -11.240161895751953, "global_step": 174056, "epoch": 1036} {"train_loss": -11.092070579528809, "global_step": 174057, "epoch": 1036} {"train_loss": -11.129352569580078, "global_step": 174058, "epoch": 1036} {"train_loss": -11.122559547424316, "global_step": 174059, "epoch": 1036} {"train_loss": -11.277140617370605, "global_step": 174060, "epoch": 1036} {"train_loss": -11.141255378723145, "global_step": 174061, "epoch": 1036} {"train_loss": -11.143239974975586, "global_step": 174062, "epoch": 1036} {"train_loss": -11.359896659851074, "global_step": 174063, "epoch": 1036} {"train_loss": -11.248125076293945, "global_step": 174064, "epoch": 1036} {"train_loss": -11.239015579223633, "global_step": 174065, "epoch": 1036} {"train_loss": -11.328058242797852, "global_step": 174066, "epoch": 1036} {"train_loss": -11.18033218383789, "global_step": 174067, "epoch": 1036} {"train_loss": -11.109071731567383, "global_step": 174068, "epoch": 1036} {"train_loss": -11.010109901428223, "global_step": 174069, "epoch": 1036} {"train_loss": -11.324070930480957, "global_step": 174070, "epoch": 1036} {"train_loss": -11.115795135498047, "global_step": 174071, "epoch": 1036} {"train_loss": -11.423946380615234, "global_step": 174072, "epoch": 1036} {"train_loss": -11.122802734375, "global_step": 174073, "epoch": 1036} {"train_loss": -11.076416015625, "global_step": 174074, "epoch": 1036} {"train_loss": -11.155860900878906, "global_step": 174075, "epoch": 1036} {"train_loss": -11.21474838256836, "global_step": 174076, "epoch": 1036} {"train_loss": -11.290426254272461, "global_step": 174077, "epoch": 1036} {"train_loss": -11.514677047729492, "global_step": 174078, "epoch": 1036} {"train_loss": -11.37929630279541, "global_step": 174079, "epoch": 1036} {"train_loss": -10.993505477905273, "global_step": 174080, "epoch": 1036} {"train_loss": -11.246004104614258, "global_step": 174081, "epoch": 1036} {"train_loss": -11.00582504272461, "global_step": 174082, "epoch": 1036} {"train_loss": -10.839653015136719, "global_step": 174083, "epoch": 1036} {"train_loss": -10.594502449035645, "global_step": 174084, "epoch": 1036} {"train_loss": -11.167073249816895, "global_step": 174085, "epoch": 1036} {"train_loss": -11.105327606201172, "global_step": 174086, "epoch": 1036} {"train_loss": -11.110538482666016, "global_step": 174087, "epoch": 1036} {"train_loss": -11.12974739074707, "global_step": 174088, "epoch": 1036} {"train_loss": -11.300954818725586, "global_step": 174089, "epoch": 1036} {"train_loss": -11.313915252685547, "global_step": 174090, "epoch": 1036} {"train_loss": -11.064170837402344, "global_step": 174091, "epoch": 1036} {"train_loss": -10.777402877807617, "global_step": 174092, "epoch": 1036} {"train_loss": -11.202494621276855, "global_step": 174093, "epoch": 1036} {"train_loss": -10.748884201049805, "global_step": 174094, "epoch": 1036} {"train_loss": -10.603157043457031, "global_step": 174095, "epoch": 1036} {"train_loss": -9.174545288085938, "global_step": 174096, "epoch": 1036} {"train_loss": -10.635936737060547, "global_step": 174097, "epoch": 1036} {"train_loss": -9.27645492553711, "global_step": 174098, "epoch": 1036} {"train_loss": -8.433725357055664, "global_step": 174099, "epoch": 1036} {"train_loss": -9.545509338378906, "global_step": 174100, "epoch": 1036} {"train_loss": -9.446617126464844, "global_step": 174101, "epoch": 1036} {"train_loss": -9.598590850830078, "global_step": 174102, "epoch": 1036} {"train_loss": -10.00196647644043, "global_step": 174103, "epoch": 1036} {"train_loss": -10.324432373046875, "global_step": 174104, "epoch": 1036} {"train_loss": -10.024209976196289, "global_step": 174105, "epoch": 1036} {"train_loss": -10.664133071899414, "global_step": 174106, "epoch": 1036} {"train_loss": -9.832690238952637, "global_step": 174107, "epoch": 1036} {"train_loss": -10.405996322631836, "global_step": 174108, "epoch": 1036} {"train_loss": -9.775188446044922, "global_step": 174109, "epoch": 1036} {"train_loss": -10.403034210205078, "global_step": 174110, "epoch": 1036} {"train_loss": -10.513550758361816, "global_step": 174111, "epoch": 1036} {"train_loss": -10.116596221923828, "global_step": 174112, "epoch": 1036} {"train_loss": -10.76572036743164, "global_step": 174113, "epoch": 1036} {"train_loss": -10.361438751220703, "global_step": 174114, "epoch": 1036} {"train_loss": -10.246302604675293, "global_step": 174115, "epoch": 1036} {"train_loss": -10.927386283874512, "global_step": 174116, "epoch": 1036} {"train_loss": -10.817747116088867, "global_step": 174117, "epoch": 1036} {"train_loss": -10.69765853881836, "global_step": 174118, "epoch": 1036} {"train_loss": -10.79395866394043, "global_step": 174119, "epoch": 1036} {"train_loss": -10.365133285522461, "global_step": 174120, "epoch": 1036} {"train_loss": -10.640403747558594, "global_step": 174121, "epoch": 1036} {"train_loss": -10.845434188842773, "global_step": 174122, "epoch": 1036} {"train_loss": -10.549540519714355, "global_step": 174123, "epoch": 1036} {"train_loss": -10.686609268188477, "global_step": 174124, "epoch": 1036} {"train_loss": -10.225107192993164, "global_step": 174125, "epoch": 1036} {"train_loss": -10.729840278625488, "global_step": 174126, "epoch": 1036} {"train_loss": -10.935527801513672, "global_step": 174127, "epoch": 1036} {"train_loss": -10.693904876708984, "global_step": 174128, "epoch": 1036} {"train_loss": -10.760311126708984, "global_step": 174129, "epoch": 1036} {"train_loss": -10.691617965698242, "global_step": 174130, "epoch": 1036} {"train_loss": -10.796004295349121, "global_step": 174131, "epoch": 1036} {"train_loss": -10.506721496582031, "global_step": 174132, "epoch": 1036} {"train_loss": -10.88123893737793, "global_step": 174133, "epoch": 1036} {"train_loss": -10.781044960021973, "global_step": 174134, "epoch": 1036} {"train_loss": -10.990789413452148, "global_step": 174135, "epoch": 1036} {"train_loss": -10.761335372924805, "global_step": 174136, "epoch": 1036} {"train_loss": -11.269512176513672, "global_step": 174137, "epoch": 1036} {"train_loss": -10.787965774536133, "global_step": 174138, "epoch": 1036} {"train_loss": -10.905994415283203, "global_step": 174139, "epoch": 1036} {"train_loss": -10.981841087341309, "global_step": 174140, "epoch": 1036} {"train_loss": -10.93751335144043, "global_step": 174141, "epoch": 1036} {"train_loss": -10.921506881713867, "global_step": 174142, "epoch": 1036} {"train_loss": -10.964869499206543, "global_step": 174143, "epoch": 1036} {"train_loss": -11.047088623046875, "global_step": 174144, "epoch": 1036} {"train_loss": -10.882536888122559, "global_step": 174145, "epoch": 1036} {"train_loss": -11.125765800476074, "global_step": 174146, "epoch": 1036} {"train_loss": -10.995744705200195, "global_step": 174147, "epoch": 1036} {"train_loss": -11.163276672363281, "global_step": 174148, "epoch": 1036} {"train_loss": -11.035558700561523, "global_step": 174149, "epoch": 1036} {"train_loss": -11.206127166748047, "global_step": 174150, "epoch": 1036} {"train_loss": -11.186417579650879, "global_step": 174151, "epoch": 1036} {"train_loss": -11.063934326171875, "global_step": 174152, "epoch": 1036} {"train_loss": -11.232681274414062, "global_step": 174153, "epoch": 1036} {"train_loss": -11.252504348754883, "global_step": 174154, "epoch": 1036} {"train_loss": -10.955345153808594, "global_step": 174155, "epoch": 1036} {"train_loss": -11.449609756469727, "global_step": 174156, "epoch": 1036} {"train_loss": -11.231302261352539, "global_step": 174157, "epoch": 1036} {"train_loss": -11.34115219116211, "global_step": 174158, "epoch": 1036} {"train_loss": -11.3255615234375, "global_step": 174159, "epoch": 1036} {"train_loss": -11.150705337524414, "global_step": 174160, "epoch": 1036} {"train_loss": -11.34202766418457, "global_step": 174161, "epoch": 1036} {"train_loss": -11.341590881347656, "global_step": 174162, "epoch": 1036} {"train_loss": -11.367749214172363, "global_step": 174163, "epoch": 1036} {"train_loss": -11.410562515258789, "global_step": 174164, "epoch": 1036} {"train_loss": -11.18947982788086, "global_step": 174165, "epoch": 1036} {"train_loss": -11.126029014587402, "global_step": 174166, "epoch": 1036} {"train_loss": -11.432012557983398, "global_step": 174167, "epoch": 1036} {"train_loss": -11.098138809204102, "global_step": 174168, "epoch": 1036} {"train_loss": -11.487570762634277, "global_step": 174169, "epoch": 1036} {"train_loss": -11.09585952758789, "global_step": 174170, "epoch": 1036} {"train_loss": -11.340609550476074, "global_step": 174171, "epoch": 1036} {"train_loss": -11.498827934265137, "global_step": 174172, "epoch": 1036} {"train_loss": -11.419429779052734, "global_step": 174173, "epoch": 1036} {"train_loss": -11.434507369995117, "global_step": 174174, "epoch": 1036} {"train_loss": -11.373468399047852, "global_step": 174175, "epoch": 1036} {"train_loss": -11.345714569091797, "global_step": 174176, "epoch": 1036} {"train_loss": -11.310641288757324, "global_step": 174177, "epoch": 1036} {"train_loss": -11.264835357666016, "global_step": 174178, "epoch": 1036} {"train_loss": -11.452205657958984, "global_step": 174179, "epoch": 1036} {"train_loss": -11.354394912719727, "global_step": 174180, "epoch": 1036} {"train_loss": -10.990036964416504, "global_step": 174181, "epoch": 1036} {"train_loss": -11.342367172241211, "global_step": 174182, "epoch": 1036} {"train_loss": -11.141483306884766, "global_step": 174183, "epoch": 1036} {"train_loss": -10.915542602539062, "global_step": 174184, "epoch": 1036} {"train_loss": -10.59173583984375, "global_step": 174185, "epoch": 1036} {"train_loss": -11.42558765411377, "global_step": 174186, "epoch": 1036} {"train_loss": -10.79949951171875, "global_step": 174187, "epoch": 1036} {"train_loss": -11.048345565795898, "global_step": 174188, "epoch": 1036} {"train_loss": -11.323078155517578, "global_step": 174189, "epoch": 1036} {"train_loss": -10.513574600219727, "global_step": 174190, "epoch": 1036} {"train_loss": -9.577554702758789, "global_step": 174191, "epoch": 1036} {"train_loss": -9.406972885131836, "global_step": 174192, "epoch": 1036} {"train_loss": -10.821812629699707, "global_step": 174193, "epoch": 1036} {"train_loss": -9.014715194702148, "global_step": 174194, "epoch": 1036} {"train_loss": -10.161856651306152, "global_step": 174195, "epoch": 1036} {"train_loss": -9.037429809570312, "global_step": 174196, "epoch": 1036} {"train_loss": -9.543952941894531, "global_step": 174197, "epoch": 1036} {"train_loss": -10.477361679077148, "global_step": 174198, "epoch": 1036} {"train_loss": -9.262663841247559, "global_step": 174199, "epoch": 1036} {"train_loss": -9.380197525024414, "global_step": 174200, "epoch": 1036} {"train_loss": -10.085233688354492, "global_step": 174201, "epoch": 1036} {"train_loss": -9.45353889465332, "global_step": 174202, "epoch": 1036} {"train_loss": -9.585491180419922, "global_step": 174203, "epoch": 1036} {"train_loss": -10.79544448852539, "global_step": 174204, "epoch": 1036} {"train_loss": -9.698213577270508, "global_step": 174205, "epoch": 1036} {"train_loss": -9.76374340057373, "global_step": 174206, "epoch": 1036} {"train_loss": -10.226497650146484, "global_step": 174207, "epoch": 1036} {"train_loss": -9.749119758605957, "global_step": 174208, "epoch": 1036} {"train_loss": -10.287069320678711, "global_step": 174209, "epoch": 1036} {"train_loss": -10.585962295532227, "global_step": 174210, "epoch": 1036} {"train_loss": -10.334823608398438, "global_step": 174211, "epoch": 1036} {"train_loss": -10.223298072814941, "global_step": 174212, "epoch": 1036} {"train_loss": -10.816482543945312, "global_step": 174213, "epoch": 1036} {"train_loss": -10.000836372375488, "global_step": 174214, "epoch": 1036} {"train_loss": -10.773515241486686, "global_step": 174215, "epoch": 1036, "val_loss": 242396.53125} {"train_loss": -10.584909439086914, "global_step": 174216, "epoch": 1037} {"train_loss": -10.002422332763672, "global_step": 174217, "epoch": 1037} {"train_loss": -10.475711822509766, "global_step": 174218, "epoch": 1037} {"train_loss": -10.523510932922363, "global_step": 174219, "epoch": 1037} {"train_loss": -10.668785095214844, "global_step": 174220, "epoch": 1037} {"train_loss": -10.811468124389648, "global_step": 174221, "epoch": 1037} {"train_loss": -10.270648956298828, "global_step": 174222, "epoch": 1037} {"train_loss": -10.599557876586914, "global_step": 174223, "epoch": 1037} {"train_loss": -10.806713104248047, "global_step": 174224, "epoch": 1037} {"train_loss": -10.33251953125, "global_step": 174225, "epoch": 1037} {"train_loss": -10.516406059265137, "global_step": 174226, "epoch": 1037} {"train_loss": -10.92034912109375, "global_step": 174227, "epoch": 1037} {"train_loss": -10.623360633850098, "global_step": 174228, "epoch": 1037} {"train_loss": -10.544698715209961, "global_step": 174229, "epoch": 1037} {"train_loss": -10.491307258605957, "global_step": 174230, "epoch": 1037} {"train_loss": -10.65510082244873, "global_step": 174231, "epoch": 1037} {"train_loss": -10.863931655883789, "global_step": 174232, "epoch": 1037} {"train_loss": -10.581786155700684, "global_step": 174233, "epoch": 1037} {"train_loss": -10.860799789428711, "global_step": 174234, "epoch": 1037} {"train_loss": -11.070030212402344, "global_step": 174235, "epoch": 1037} {"train_loss": -10.876335144042969, "global_step": 174236, "epoch": 1037} {"train_loss": -10.991249084472656, "global_step": 174237, "epoch": 1037} {"train_loss": -10.993269920349121, "global_step": 174238, "epoch": 1037} {"train_loss": -11.039665222167969, "global_step": 174239, "epoch": 1037} {"train_loss": -10.885143280029297, "global_step": 174240, "epoch": 1037} {"train_loss": -11.038849830627441, "global_step": 174241, "epoch": 1037} {"train_loss": -10.938127517700195, "global_step": 174242, "epoch": 1037} {"train_loss": -11.07494831085205, "global_step": 174243, "epoch": 1037} {"train_loss": -11.103811264038086, "global_step": 174244, "epoch": 1037} {"train_loss": -11.224546432495117, "global_step": 174245, "epoch": 1037} {"train_loss": -10.846829414367676, "global_step": 174246, "epoch": 1037} {"train_loss": -10.873028755187988, "global_step": 174247, "epoch": 1037} {"train_loss": -11.053306579589844, "global_step": 174248, "epoch": 1037} {"train_loss": -10.907140731811523, "global_step": 174249, "epoch": 1037} {"train_loss": -10.904245376586914, "global_step": 174250, "epoch": 1037} {"train_loss": -11.189651489257812, "global_step": 174251, "epoch": 1037} {"train_loss": -11.005613327026367, "global_step": 174252, "epoch": 1037} {"train_loss": -11.324762344360352, "global_step": 174253, "epoch": 1037} {"train_loss": -11.074152946472168, "global_step": 174254, "epoch": 1037} {"train_loss": -11.061569213867188, "global_step": 174255, "epoch": 1037} {"train_loss": -11.158571243286133, "global_step": 174256, "epoch": 1037} {"train_loss": -11.319924354553223, "global_step": 174257, "epoch": 1037} {"train_loss": -11.24105453491211, "global_step": 174258, "epoch": 1037} {"train_loss": -11.230981826782227, "global_step": 174259, "epoch": 1037} {"train_loss": -11.318815231323242, "global_step": 174260, "epoch": 1037} {"train_loss": -11.284384727478027, "global_step": 174261, "epoch": 1037} {"train_loss": -11.29440689086914, "global_step": 174262, "epoch": 1037} {"train_loss": -11.297538757324219, "global_step": 174263, "epoch": 1037} {"train_loss": -11.206330299377441, "global_step": 174264, "epoch": 1037} {"train_loss": -11.228809356689453, "global_step": 174265, "epoch": 1037} {"train_loss": -11.286294937133789, "global_step": 174266, "epoch": 1037} {"train_loss": -11.25597095489502, "global_step": 174267, "epoch": 1037} {"train_loss": -11.444690704345703, "global_step": 174268, "epoch": 1037} {"train_loss": -11.390207290649414, "global_step": 174269, "epoch": 1037} {"train_loss": -11.172388076782227, "global_step": 174270, "epoch": 1037} {"train_loss": -11.343849182128906, "global_step": 174271, "epoch": 1037} {"train_loss": -11.462907791137695, "global_step": 174272, "epoch": 1037} {"train_loss": -11.394590377807617, "global_step": 174273, "epoch": 1037} {"train_loss": -11.01541519165039, "global_step": 174274, "epoch": 1037} {"train_loss": -11.505142211914062, "global_step": 174275, "epoch": 1037} {"train_loss": -11.120014190673828, "global_step": 174276, "epoch": 1037} {"train_loss": -11.380901336669922, "global_step": 174277, "epoch": 1037} {"train_loss": -11.166391372680664, "global_step": 174278, "epoch": 1037} {"train_loss": -11.136935234069824, "global_step": 174279, "epoch": 1037} {"train_loss": -10.864404678344727, "global_step": 174280, "epoch": 1037} {"train_loss": -10.838120460510254, "global_step": 174281, "epoch": 1037} {"train_loss": -11.403989791870117, "global_step": 174282, "epoch": 1037} {"train_loss": -11.217924118041992, "global_step": 174283, "epoch": 1037} {"train_loss": -11.535356521606445, "global_step": 174284, "epoch": 1037} {"train_loss": -11.438817024230957, "global_step": 174285, "epoch": 1037} {"train_loss": -10.670087814331055, "global_step": 174286, "epoch": 1037} {"train_loss": -10.826387405395508, "global_step": 174287, "epoch": 1037} {"train_loss": -11.30329704284668, "global_step": 174288, "epoch": 1037} {"train_loss": -11.318737030029297, "global_step": 174289, "epoch": 1037} {"train_loss": -11.319076538085938, "global_step": 174290, "epoch": 1037} {"train_loss": -10.716666221618652, "global_step": 174291, "epoch": 1037} {"train_loss": -11.258174896240234, "global_step": 174292, "epoch": 1037} {"train_loss": -9.833066940307617, "global_step": 174293, "epoch": 1037} {"train_loss": -10.008577346801758, "global_step": 174294, "epoch": 1037} {"train_loss": -10.241600036621094, "global_step": 174295, "epoch": 1037} {"train_loss": -8.857656478881836, "global_step": 174296, "epoch": 1037} {"train_loss": -9.552112579345703, "global_step": 174297, "epoch": 1037} {"train_loss": -9.772217750549316, "global_step": 174298, "epoch": 1037} {"train_loss": -10.021234512329102, "global_step": 174299, "epoch": 1037} {"train_loss": -10.757542610168457, "global_step": 174300, "epoch": 1037} {"train_loss": -9.863653182983398, "global_step": 174301, "epoch": 1037} {"train_loss": -10.896800994873047, "global_step": 174302, "epoch": 1037} {"train_loss": -10.602398872375488, "global_step": 174303, "epoch": 1037} {"train_loss": -10.963557243347168, "global_step": 174304, "epoch": 1037} {"train_loss": -10.572830200195312, "global_step": 174305, "epoch": 1037} {"train_loss": -11.042449951171875, "global_step": 174306, "epoch": 1037} {"train_loss": -10.639440536499023, "global_step": 174307, "epoch": 1037} {"train_loss": -10.631668090820312, "global_step": 174308, "epoch": 1037} {"train_loss": -11.026378631591797, "global_step": 174309, "epoch": 1037} {"train_loss": -10.980274200439453, "global_step": 174310, "epoch": 1037} {"train_loss": -10.501150131225586, "global_step": 174311, "epoch": 1037} {"train_loss": -10.956786155700684, "global_step": 174312, "epoch": 1037} {"train_loss": -10.88650894165039, "global_step": 174313, "epoch": 1037} {"train_loss": -11.08764362335205, "global_step": 174314, "epoch": 1037} {"train_loss": -10.708066940307617, "global_step": 174315, "epoch": 1037} {"train_loss": -10.771796226501465, "global_step": 174316, "epoch": 1037} {"train_loss": -11.241655349731445, "global_step": 174317, "epoch": 1037} {"train_loss": -10.608040809631348, "global_step": 174318, "epoch": 1037} {"train_loss": -10.973230361938477, "global_step": 174319, "epoch": 1037} {"train_loss": -10.600114822387695, "global_step": 174320, "epoch": 1037} {"train_loss": -10.913637161254883, "global_step": 174321, "epoch": 1037} {"train_loss": -10.769041061401367, "global_step": 174322, "epoch": 1037} {"train_loss": -10.723489761352539, "global_step": 174323, "epoch": 1037} {"train_loss": -10.612180709838867, "global_step": 174324, "epoch": 1037} {"train_loss": -10.827543258666992, "global_step": 174325, "epoch": 1037} {"train_loss": -10.160333633422852, "global_step": 174326, "epoch": 1037} {"train_loss": -10.790689468383789, "global_step": 174327, "epoch": 1037} {"train_loss": -10.370477676391602, "global_step": 174328, "epoch": 1037} {"train_loss": -10.51954460144043, "global_step": 174329, "epoch": 1037} {"train_loss": -10.641141891479492, "global_step": 174330, "epoch": 1037} {"train_loss": -10.948375701904297, "global_step": 174331, "epoch": 1037} {"train_loss": -10.415349960327148, "global_step": 174332, "epoch": 1037} {"train_loss": -10.854558944702148, "global_step": 174333, "epoch": 1037} {"train_loss": -10.919187545776367, "global_step": 174334, "epoch": 1037} {"train_loss": -10.379264831542969, "global_step": 174335, "epoch": 1037} {"train_loss": -11.081354141235352, "global_step": 174336, "epoch": 1037} {"train_loss": -10.36518669128418, "global_step": 174337, "epoch": 1037} {"train_loss": -10.98326301574707, "global_step": 174338, "epoch": 1037} {"train_loss": -11.08195686340332, "global_step": 174339, "epoch": 1037} {"train_loss": -10.628238677978516, "global_step": 174340, "epoch": 1037} {"train_loss": -11.078774452209473, "global_step": 174341, "epoch": 1037} {"train_loss": -10.649917602539062, "global_step": 174342, "epoch": 1037} {"train_loss": -10.294588088989258, "global_step": 174343, "epoch": 1037} {"train_loss": -11.057116508483887, "global_step": 174344, "epoch": 1037} {"train_loss": -10.71009635925293, "global_step": 174345, "epoch": 1037} {"train_loss": -11.103898048400879, "global_step": 174346, "epoch": 1037} {"train_loss": -11.101505279541016, "global_step": 174347, "epoch": 1037} {"train_loss": -10.818357467651367, "global_step": 174348, "epoch": 1037} {"train_loss": -11.005024909973145, "global_step": 174349, "epoch": 1037} {"train_loss": -11.218245506286621, "global_step": 174350, "epoch": 1037} {"train_loss": -10.96602725982666, "global_step": 174351, "epoch": 1037} {"train_loss": -11.227434158325195, "global_step": 174352, "epoch": 1037} {"train_loss": -11.005451202392578, "global_step": 174353, "epoch": 1037} {"train_loss": -11.189180374145508, "global_step": 174354, "epoch": 1037} {"train_loss": -11.428348541259766, "global_step": 174355, "epoch": 1037} {"train_loss": -11.155374526977539, "global_step": 174356, "epoch": 1037} {"train_loss": -11.251739501953125, "global_step": 174357, "epoch": 1037} {"train_loss": -11.213043212890625, "global_step": 174358, "epoch": 1037} {"train_loss": -11.261775970458984, "global_step": 174359, "epoch": 1037} {"train_loss": -11.32727336883545, "global_step": 174360, "epoch": 1037} {"train_loss": -11.256948471069336, "global_step": 174361, "epoch": 1037} {"train_loss": -11.174059867858887, "global_step": 174362, "epoch": 1037} {"train_loss": -11.322053909301758, "global_step": 174363, "epoch": 1037} {"train_loss": -10.88375186920166, "global_step": 174364, "epoch": 1037} {"train_loss": -11.163755416870117, "global_step": 174365, "epoch": 1037} {"train_loss": -11.233855247497559, "global_step": 174366, "epoch": 1037} {"train_loss": -11.136648178100586, "global_step": 174367, "epoch": 1037} {"train_loss": -11.292848587036133, "global_step": 174368, "epoch": 1037} {"train_loss": -11.282072067260742, "global_step": 174369, "epoch": 1037} {"train_loss": -11.063789367675781, "global_step": 174370, "epoch": 1037} {"train_loss": -11.142932891845703, "global_step": 174371, "epoch": 1037} {"train_loss": -11.202415466308594, "global_step": 174372, "epoch": 1037} {"train_loss": -10.979772567749023, "global_step": 174373, "epoch": 1037} {"train_loss": -11.208992004394531, "global_step": 174374, "epoch": 1037} {"train_loss": -11.21954345703125, "global_step": 174375, "epoch": 1037} {"train_loss": -11.128952026367188, "global_step": 174376, "epoch": 1037} {"train_loss": -11.305444717407227, "global_step": 174377, "epoch": 1037} {"train_loss": -11.301921844482422, "global_step": 174378, "epoch": 1037} {"train_loss": -10.962194442749023, "global_step": 174379, "epoch": 1037} {"train_loss": -11.28664779663086, "global_step": 174380, "epoch": 1037} {"train_loss": -11.299152374267578, "global_step": 174381, "epoch": 1037} {"train_loss": -11.351409912109375, "global_step": 174382, "epoch": 1037} {"train_loss": -10.919848061743236, "global_step": 174383, "epoch": 1037, "val_loss": 240734.1875} {"train_loss": -11.075695037841797, "global_step": 174384, "epoch": 1038} {"train_loss": -10.381217002868652, "global_step": 174385, "epoch": 1038} {"train_loss": -10.269718170166016, "global_step": 174386, "epoch": 1038} {"train_loss": -10.344087600708008, "global_step": 174387, "epoch": 1038} {"train_loss": -10.964599609375, "global_step": 174388, "epoch": 1038} {"train_loss": -10.458965301513672, "global_step": 174389, "epoch": 1038} {"train_loss": -9.311975479125977, "global_step": 174390, "epoch": 1038} {"train_loss": -10.579203605651855, "global_step": 174391, "epoch": 1038} {"train_loss": -10.196550369262695, "global_step": 174392, "epoch": 1038} {"train_loss": -9.007993698120117, "global_step": 174393, "epoch": 1038} {"train_loss": -9.528951644897461, "global_step": 174394, "epoch": 1038} {"train_loss": -10.316162109375, "global_step": 174395, "epoch": 1038} {"train_loss": -10.302226066589355, "global_step": 174396, "epoch": 1038} {"train_loss": -10.227299690246582, "global_step": 174397, "epoch": 1038} {"train_loss": -10.740671157836914, "global_step": 174398, "epoch": 1038} {"train_loss": -9.786966323852539, "global_step": 174399, "epoch": 1038} {"train_loss": -10.983617782592773, "global_step": 174400, "epoch": 1038} {"train_loss": -9.858272552490234, "global_step": 174401, "epoch": 1038} {"train_loss": -10.590185165405273, "global_step": 174402, "epoch": 1038} {"train_loss": -10.508316040039062, "global_step": 174403, "epoch": 1038} {"train_loss": -10.835543632507324, "global_step": 174404, "epoch": 1038} {"train_loss": -10.52202033996582, "global_step": 174405, "epoch": 1038} {"train_loss": -11.257858276367188, "global_step": 174406, "epoch": 1038} {"train_loss": -10.701810836791992, "global_step": 174407, "epoch": 1038} {"train_loss": -11.073291778564453, "global_step": 174408, "epoch": 1038} {"train_loss": -10.610774040222168, "global_step": 174409, "epoch": 1038} {"train_loss": -11.006644248962402, "global_step": 174410, "epoch": 1038} {"train_loss": -10.975448608398438, "global_step": 174411, "epoch": 1038} {"train_loss": -10.745294570922852, "global_step": 174412, "epoch": 1038} {"train_loss": -11.107787132263184, "global_step": 174413, "epoch": 1038} {"train_loss": -11.06814956665039, "global_step": 174414, "epoch": 1038} {"train_loss": -10.972570419311523, "global_step": 174415, "epoch": 1038} {"train_loss": -11.035243034362793, "global_step": 174416, "epoch": 1038} {"train_loss": -11.239288330078125, "global_step": 174417, "epoch": 1038} {"train_loss": -11.09044075012207, "global_step": 174418, "epoch": 1038} {"train_loss": -10.932348251342773, "global_step": 174419, "epoch": 1038} {"train_loss": -10.823783874511719, "global_step": 174420, "epoch": 1038} {"train_loss": -11.166065216064453, "global_step": 174421, "epoch": 1038} {"train_loss": -10.520256042480469, "global_step": 174422, "epoch": 1038} {"train_loss": -10.880475997924805, "global_step": 174423, "epoch": 1038} {"train_loss": -10.347942352294922, "global_step": 174424, "epoch": 1038} {"train_loss": -10.987249374389648, "global_step": 174425, "epoch": 1038} {"train_loss": -10.725586891174316, "global_step": 174426, "epoch": 1038} {"train_loss": -10.607949256896973, "global_step": 174427, "epoch": 1038} {"train_loss": -10.845205307006836, "global_step": 174428, "epoch": 1038} {"train_loss": -10.540688514709473, "global_step": 174429, "epoch": 1038} {"train_loss": -10.8051176071167, "global_step": 174430, "epoch": 1038} {"train_loss": -11.152015686035156, "global_step": 174431, "epoch": 1038} {"train_loss": -10.587921142578125, "global_step": 174432, "epoch": 1038} {"train_loss": -10.986817359924316, "global_step": 174433, "epoch": 1038} {"train_loss": -10.8048677444458, "global_step": 174434, "epoch": 1038} {"train_loss": -10.999798774719238, "global_step": 174435, "epoch": 1038} {"train_loss": -10.959559440612793, "global_step": 174436, "epoch": 1038} {"train_loss": -10.637128829956055, "global_step": 174437, "epoch": 1038} {"train_loss": -10.758763313293457, "global_step": 174438, "epoch": 1038} {"train_loss": -10.941953659057617, "global_step": 174439, "epoch": 1038} {"train_loss": -10.654277801513672, "global_step": 174440, "epoch": 1038} {"train_loss": -11.085268020629883, "global_step": 174441, "epoch": 1038} {"train_loss": -10.861295700073242, "global_step": 174442, "epoch": 1038} {"train_loss": -10.830759048461914, "global_step": 174443, "epoch": 1038} {"train_loss": -11.298351287841797, "global_step": 174444, "epoch": 1038} {"train_loss": -10.894926071166992, "global_step": 174445, "epoch": 1038} {"train_loss": -11.121777534484863, "global_step": 174446, "epoch": 1038} {"train_loss": -10.777843475341797, "global_step": 174447, "epoch": 1038} {"train_loss": -11.128973960876465, "global_step": 174448, "epoch": 1038} {"train_loss": -11.045011520385742, "global_step": 174449, "epoch": 1038} {"train_loss": -11.292559623718262, "global_step": 174450, "epoch": 1038} {"train_loss": -11.211837768554688, "global_step": 174451, "epoch": 1038} {"train_loss": -11.01346492767334, "global_step": 174452, "epoch": 1038} {"train_loss": -11.294532775878906, "global_step": 174453, "epoch": 1038} {"train_loss": -11.129812240600586, "global_step": 174454, "epoch": 1038} {"train_loss": -11.121785163879395, "global_step": 174455, "epoch": 1038} {"train_loss": -11.332611083984375, "global_step": 174456, "epoch": 1038} {"train_loss": -11.279245376586914, "global_step": 174457, "epoch": 1038} {"train_loss": -11.417211532592773, "global_step": 174458, "epoch": 1038} {"train_loss": -11.255908966064453, "global_step": 174459, "epoch": 1038} {"train_loss": -11.364489555358887, "global_step": 174460, "epoch": 1038} {"train_loss": -11.451961517333984, "global_step": 174461, "epoch": 1038} {"train_loss": -11.366401672363281, "global_step": 174462, "epoch": 1038} {"train_loss": -11.158442497253418, "global_step": 174463, "epoch": 1038} {"train_loss": -11.188957214355469, "global_step": 174464, "epoch": 1038} {"train_loss": -11.223430633544922, "global_step": 174465, "epoch": 1038} {"train_loss": -11.230762481689453, "global_step": 174466, "epoch": 1038} {"train_loss": -11.530379295349121, "global_step": 174467, "epoch": 1038} {"train_loss": -11.216089248657227, "global_step": 174468, "epoch": 1038} {"train_loss": -11.490804672241211, "global_step": 174469, "epoch": 1038} {"train_loss": -11.487676620483398, "global_step": 174470, "epoch": 1038} {"train_loss": -11.519576072692871, "global_step": 174471, "epoch": 1038} {"train_loss": -11.474183082580566, "global_step": 174472, "epoch": 1038} {"train_loss": -11.237208366394043, "global_step": 174473, "epoch": 1038} {"train_loss": -11.386268615722656, "global_step": 174474, "epoch": 1038} {"train_loss": -11.080292701721191, "global_step": 174475, "epoch": 1038} {"train_loss": -11.256125450134277, "global_step": 174476, "epoch": 1038} {"train_loss": -11.26725959777832, "global_step": 174477, "epoch": 1038} {"train_loss": -11.026477813720703, "global_step": 174478, "epoch": 1038} {"train_loss": -11.166202545166016, "global_step": 174479, "epoch": 1038} {"train_loss": -11.58082389831543, "global_step": 174480, "epoch": 1038} {"train_loss": -11.577251434326172, "global_step": 174481, "epoch": 1038} {"train_loss": -11.480194091796875, "global_step": 174482, "epoch": 1038} {"train_loss": -11.477439880371094, "global_step": 174483, "epoch": 1038} {"train_loss": -11.570991516113281, "global_step": 174484, "epoch": 1038} {"train_loss": -11.266136169433594, "global_step": 174485, "epoch": 1038} {"train_loss": -11.465150833129883, "global_step": 174486, "epoch": 1038} {"train_loss": -11.601386070251465, "global_step": 174487, "epoch": 1038} {"train_loss": -11.460580825805664, "global_step": 174488, "epoch": 1038} {"train_loss": -11.490876197814941, "global_step": 174489, "epoch": 1038} {"train_loss": -11.343084335327148, "global_step": 174490, "epoch": 1038} {"train_loss": -11.402436256408691, "global_step": 174491, "epoch": 1038} {"train_loss": -11.158642768859863, "global_step": 174492, "epoch": 1038} {"train_loss": -11.160039901733398, "global_step": 174493, "epoch": 1038} {"train_loss": -10.651588439941406, "global_step": 174494, "epoch": 1038} {"train_loss": -11.339512825012207, "global_step": 174495, "epoch": 1038} {"train_loss": -10.58804702758789, "global_step": 174496, "epoch": 1038} {"train_loss": -10.134834289550781, "global_step": 174497, "epoch": 1038} {"train_loss": -9.89309310913086, "global_step": 174498, "epoch": 1038} {"train_loss": -10.57402229309082, "global_step": 174499, "epoch": 1038} {"train_loss": -7.3147382736206055, "global_step": 174500, "epoch": 1038} {"train_loss": -9.793846130371094, "global_step": 174501, "epoch": 1038} {"train_loss": -8.778608322143555, "global_step": 174502, "epoch": 1038} {"train_loss": -8.69943618774414, "global_step": 174503, "epoch": 1038} {"train_loss": -10.342920303344727, "global_step": 174504, "epoch": 1038} {"train_loss": -9.361720085144043, "global_step": 174505, "epoch": 1038} {"train_loss": -9.370341300964355, "global_step": 174506, "epoch": 1038} {"train_loss": -10.319296836853027, "global_step": 174507, "epoch": 1038} {"train_loss": -9.775136947631836, "global_step": 174508, "epoch": 1038} {"train_loss": -10.04330825805664, "global_step": 174509, "epoch": 1038} {"train_loss": -10.271753311157227, "global_step": 174510, "epoch": 1038} {"train_loss": -10.097335815429688, "global_step": 174511, "epoch": 1038} {"train_loss": -10.634808540344238, "global_step": 174512, "epoch": 1038} {"train_loss": -10.354981422424316, "global_step": 174513, "epoch": 1038} {"train_loss": -9.930164337158203, "global_step": 174514, "epoch": 1038} {"train_loss": -10.568146705627441, "global_step": 174515, "epoch": 1038} {"train_loss": -10.229120254516602, "global_step": 174516, "epoch": 1038} {"train_loss": -10.322868347167969, "global_step": 174517, "epoch": 1038} {"train_loss": -10.174534797668457, "global_step": 174518, "epoch": 1038} {"train_loss": -10.780922889709473, "global_step": 174519, "epoch": 1038} {"train_loss": -9.77663803100586, "global_step": 174520, "epoch": 1038} {"train_loss": -10.695056915283203, "global_step": 174521, "epoch": 1038} {"train_loss": -10.29098892211914, "global_step": 174522, "epoch": 1038} {"train_loss": -9.9652681350708, "global_step": 174523, "epoch": 1038} {"train_loss": -10.29773235321045, "global_step": 174524, "epoch": 1038} {"train_loss": -10.668663024902344, "global_step": 174525, "epoch": 1038} {"train_loss": -10.099372863769531, "global_step": 174526, "epoch": 1038} {"train_loss": -10.626409530639648, "global_step": 174527, "epoch": 1038} {"train_loss": -10.558401107788086, "global_step": 174528, "epoch": 1038} {"train_loss": -10.57386589050293, "global_step": 174529, "epoch": 1038} {"train_loss": -10.611315727233887, "global_step": 174530, "epoch": 1038} {"train_loss": -10.751824378967285, "global_step": 174531, "epoch": 1038} {"train_loss": -10.39521598815918, "global_step": 174532, "epoch": 1038} {"train_loss": -10.425020217895508, "global_step": 174533, "epoch": 1038} {"train_loss": -10.806039810180664, "global_step": 174534, "epoch": 1038} {"train_loss": -10.558624267578125, "global_step": 174535, "epoch": 1038} {"train_loss": -10.74848461151123, "global_step": 174536, "epoch": 1038} {"train_loss": -11.031620025634766, "global_step": 174537, "epoch": 1038} {"train_loss": -10.649574279785156, "global_step": 174538, "epoch": 1038} {"train_loss": -10.797924041748047, "global_step": 174539, "epoch": 1038} {"train_loss": -10.840536117553711, "global_step": 174540, "epoch": 1038} {"train_loss": -10.906585693359375, "global_step": 174541, "epoch": 1038} {"train_loss": -10.848129272460938, "global_step": 174542, "epoch": 1038} {"train_loss": -11.033434867858887, "global_step": 174543, "epoch": 1038} {"train_loss": -10.829916000366211, "global_step": 174544, "epoch": 1038} {"train_loss": -10.961742401123047, "global_step": 174545, "epoch": 1038} {"train_loss": -10.967775344848633, "global_step": 174546, "epoch": 1038} {"train_loss": -10.937744140625, "global_step": 174547, "epoch": 1038} {"train_loss": -11.09350872039795, "global_step": 174548, "epoch": 1038} {"train_loss": -10.84278392791748, "global_step": 174549, "epoch": 1038} {"train_loss": -11.10205078125, "global_step": 174550, "epoch": 1038} {"train_loss": -10.754461572283791, "global_step": 174551, "epoch": 1038, "val_loss": 228674.0625} {"train_loss": -11.033336639404297, "global_step": 174552, "epoch": 1039} {"train_loss": -11.008333206176758, "global_step": 174553, "epoch": 1039} {"train_loss": -11.067750930786133, "global_step": 174554, "epoch": 1039} {"train_loss": -11.092151641845703, "global_step": 174555, "epoch": 1039} {"train_loss": -11.282462120056152, "global_step": 174556, "epoch": 1039} {"train_loss": -10.939831733703613, "global_step": 174557, "epoch": 1039} {"train_loss": -11.068033218383789, "global_step": 174558, "epoch": 1039} {"train_loss": -11.317695617675781, "global_step": 174559, "epoch": 1039} {"train_loss": -11.293917655944824, "global_step": 174560, "epoch": 1039} {"train_loss": -11.17941665649414, "global_step": 174561, "epoch": 1039} {"train_loss": -11.309612274169922, "global_step": 174562, "epoch": 1039} {"train_loss": -11.310569763183594, "global_step": 174563, "epoch": 1039} {"train_loss": -11.371511459350586, "global_step": 174564, "epoch": 1039} {"train_loss": -11.425829887390137, "global_step": 174565, "epoch": 1039} {"train_loss": -11.471258163452148, "global_step": 174566, "epoch": 1039} {"train_loss": -11.164131164550781, "global_step": 174567, "epoch": 1039} {"train_loss": -11.417293548583984, "global_step": 174568, "epoch": 1039} {"train_loss": -11.19890022277832, "global_step": 174569, "epoch": 1039} {"train_loss": -11.132776260375977, "global_step": 174570, "epoch": 1039} {"train_loss": -11.396733283996582, "global_step": 174571, "epoch": 1039} {"train_loss": -11.351469039916992, "global_step": 174572, "epoch": 1039} {"train_loss": -11.476768493652344, "global_step": 174573, "epoch": 1039} {"train_loss": -11.285697937011719, "global_step": 174574, "epoch": 1039} {"train_loss": -11.429956436157227, "global_step": 174575, "epoch": 1039} {"train_loss": -11.101852416992188, "global_step": 174576, "epoch": 1039} {"train_loss": -11.377435684204102, "global_step": 174577, "epoch": 1039} {"train_loss": -11.34487533569336, "global_step": 174578, "epoch": 1039} {"train_loss": -11.50656795501709, "global_step": 174579, "epoch": 1039} {"train_loss": -11.469964981079102, "global_step": 174580, "epoch": 1039} {"train_loss": -11.390061378479004, "global_step": 174581, "epoch": 1039} {"train_loss": -11.325078964233398, "global_step": 174582, "epoch": 1039} {"train_loss": -11.513996124267578, "global_step": 174583, "epoch": 1039} {"train_loss": -11.493175506591797, "global_step": 174584, "epoch": 1039} {"train_loss": -11.536781311035156, "global_step": 174585, "epoch": 1039} {"train_loss": -11.41885757446289, "global_step": 174586, "epoch": 1039} {"train_loss": -11.504430770874023, "global_step": 174587, "epoch": 1039} {"train_loss": -11.600448608398438, "global_step": 174588, "epoch": 1039} {"train_loss": -11.251344680786133, "global_step": 174589, "epoch": 1039} {"train_loss": -11.343400001525879, "global_step": 174590, "epoch": 1039} {"train_loss": -11.216085433959961, "global_step": 174591, "epoch": 1039} {"train_loss": -11.27922534942627, "global_step": 174592, "epoch": 1039} {"train_loss": -11.523712158203125, "global_step": 174593, "epoch": 1039} {"train_loss": -11.34469223022461, "global_step": 174594, "epoch": 1039} {"train_loss": -11.369671821594238, "global_step": 174595, "epoch": 1039} {"train_loss": -10.746227264404297, "global_step": 174596, "epoch": 1039} {"train_loss": -11.509849548339844, "global_step": 174597, "epoch": 1039} {"train_loss": -10.651975631713867, "global_step": 174598, "epoch": 1039} {"train_loss": -10.364035606384277, "global_step": 174599, "epoch": 1039} {"train_loss": -9.973431587219238, "global_step": 174600, "epoch": 1039} {"train_loss": -11.174376487731934, "global_step": 174601, "epoch": 1039} {"train_loss": -11.28724479675293, "global_step": 174602, "epoch": 1039} {"train_loss": -10.820724487304688, "global_step": 174603, "epoch": 1039} {"train_loss": -10.921161651611328, "global_step": 174604, "epoch": 1039} {"train_loss": -11.149003982543945, "global_step": 174605, "epoch": 1039} {"train_loss": -10.935084342956543, "global_step": 174606, "epoch": 1039} {"train_loss": -10.913249969482422, "global_step": 174607, "epoch": 1039} {"train_loss": -11.260110855102539, "global_step": 174608, "epoch": 1039} {"train_loss": -11.240964889526367, "global_step": 174609, "epoch": 1039} {"train_loss": -11.068986892700195, "global_step": 174610, "epoch": 1039} {"train_loss": -11.255330085754395, "global_step": 174611, "epoch": 1039} {"train_loss": -10.67424201965332, "global_step": 174612, "epoch": 1039} {"train_loss": -11.266729354858398, "global_step": 174613, "epoch": 1039} {"train_loss": -11.260629653930664, "global_step": 174614, "epoch": 1039} {"train_loss": -10.707669258117676, "global_step": 174615, "epoch": 1039} {"train_loss": -10.978570938110352, "global_step": 174616, "epoch": 1039} {"train_loss": -11.222433090209961, "global_step": 174617, "epoch": 1039} {"train_loss": -10.819168090820312, "global_step": 174618, "epoch": 1039} {"train_loss": -10.844847679138184, "global_step": 174619, "epoch": 1039} {"train_loss": -11.194350242614746, "global_step": 174620, "epoch": 1039} {"train_loss": -10.67689323425293, "global_step": 174621, "epoch": 1039} {"train_loss": -10.76107120513916, "global_step": 174622, "epoch": 1039} {"train_loss": -9.903796195983887, "global_step": 174623, "epoch": 1039} {"train_loss": -10.988359451293945, "global_step": 174624, "epoch": 1039} {"train_loss": -10.32922649383545, "global_step": 174625, "epoch": 1039} {"train_loss": -11.00784683227539, "global_step": 174626, "epoch": 1039} {"train_loss": -11.245609283447266, "global_step": 174627, "epoch": 1039} {"train_loss": -11.394632339477539, "global_step": 174628, "epoch": 1039} {"train_loss": -10.774395942687988, "global_step": 174629, "epoch": 1039} {"train_loss": -11.03029727935791, "global_step": 174630, "epoch": 1039} {"train_loss": -11.379796981811523, "global_step": 174631, "epoch": 1039} {"train_loss": -11.257671356201172, "global_step": 174632, "epoch": 1039} {"train_loss": -10.971883773803711, "global_step": 174633, "epoch": 1039} {"train_loss": -11.129570007324219, "global_step": 174634, "epoch": 1039} {"train_loss": -11.302976608276367, "global_step": 174635, "epoch": 1039} {"train_loss": -11.202411651611328, "global_step": 174636, "epoch": 1039} {"train_loss": -11.344989776611328, "global_step": 174637, "epoch": 1039} {"train_loss": -11.181585311889648, "global_step": 174638, "epoch": 1039} {"train_loss": -11.325763702392578, "global_step": 174639, "epoch": 1039} {"train_loss": -11.274288177490234, "global_step": 174640, "epoch": 1039} {"train_loss": -11.475727081298828, "global_step": 174641, "epoch": 1039} {"train_loss": -11.360307693481445, "global_step": 174642, "epoch": 1039} {"train_loss": -11.369525909423828, "global_step": 174643, "epoch": 1039} {"train_loss": -11.191905975341797, "global_step": 174644, "epoch": 1039} {"train_loss": -11.516104698181152, "global_step": 174645, "epoch": 1039} {"train_loss": -10.933666229248047, "global_step": 174646, "epoch": 1039} {"train_loss": -11.22265625, "global_step": 174647, "epoch": 1039} {"train_loss": -10.987504959106445, "global_step": 174648, "epoch": 1039} {"train_loss": -11.443020820617676, "global_step": 174649, "epoch": 1039} {"train_loss": -11.06933879852295, "global_step": 174650, "epoch": 1039} {"train_loss": -10.910325050354004, "global_step": 174651, "epoch": 1039} {"train_loss": -11.303487777709961, "global_step": 174652, "epoch": 1039} {"train_loss": -11.199939727783203, "global_step": 174653, "epoch": 1039} {"train_loss": -11.254166603088379, "global_step": 174654, "epoch": 1039} {"train_loss": -11.292500495910645, "global_step": 174655, "epoch": 1039} {"train_loss": -11.30557918548584, "global_step": 174656, "epoch": 1039} {"train_loss": -11.157238006591797, "global_step": 174657, "epoch": 1039} {"train_loss": -11.137223243713379, "global_step": 174658, "epoch": 1039} {"train_loss": -11.523457527160645, "global_step": 174659, "epoch": 1039} {"train_loss": -11.373592376708984, "global_step": 174660, "epoch": 1039} {"train_loss": -11.192468643188477, "global_step": 174661, "epoch": 1039} {"train_loss": -11.31757640838623, "global_step": 174662, "epoch": 1039} {"train_loss": -11.191913604736328, "global_step": 174663, "epoch": 1039} {"train_loss": -11.195823669433594, "global_step": 174664, "epoch": 1039} {"train_loss": -11.39378547668457, "global_step": 174665, "epoch": 1039} {"train_loss": -11.240705490112305, "global_step": 174666, "epoch": 1039} {"train_loss": -11.108991622924805, "global_step": 174667, "epoch": 1039} {"train_loss": -10.538471221923828, "global_step": 174668, "epoch": 1039} {"train_loss": -10.945608139038086, "global_step": 174669, "epoch": 1039} {"train_loss": -10.429910659790039, "global_step": 174670, "epoch": 1039} {"train_loss": -9.89364242553711, "global_step": 174671, "epoch": 1039} {"train_loss": -10.936423301696777, "global_step": 174672, "epoch": 1039} {"train_loss": -10.67985725402832, "global_step": 174673, "epoch": 1039} {"train_loss": -9.510133743286133, "global_step": 174674, "epoch": 1039} {"train_loss": -11.016782760620117, "global_step": 174675, "epoch": 1039} {"train_loss": -10.13943862915039, "global_step": 174676, "epoch": 1039} {"train_loss": -10.534494400024414, "global_step": 174677, "epoch": 1039} {"train_loss": -11.258302688598633, "global_step": 174678, "epoch": 1039} {"train_loss": -10.793806076049805, "global_step": 174679, "epoch": 1039} {"train_loss": -11.156980514526367, "global_step": 174680, "epoch": 1039} {"train_loss": -10.98219108581543, "global_step": 174681, "epoch": 1039} {"train_loss": -10.449005126953125, "global_step": 174682, "epoch": 1039} {"train_loss": -10.342679023742676, "global_step": 174683, "epoch": 1039} {"train_loss": -11.048868179321289, "global_step": 174684, "epoch": 1039} {"train_loss": -10.642566680908203, "global_step": 174685, "epoch": 1039} {"train_loss": -11.035455703735352, "global_step": 174686, "epoch": 1039} {"train_loss": -10.870401382446289, "global_step": 174687, "epoch": 1039} {"train_loss": -11.281892776489258, "global_step": 174688, "epoch": 1039} {"train_loss": -10.99972152709961, "global_step": 174689, "epoch": 1039} {"train_loss": -11.15742301940918, "global_step": 174690, "epoch": 1039} {"train_loss": -11.195999145507812, "global_step": 174691, "epoch": 1039} {"train_loss": -10.986291885375977, "global_step": 174692, "epoch": 1039} {"train_loss": -10.853294372558594, "global_step": 174693, "epoch": 1039} {"train_loss": -10.899211883544922, "global_step": 174694, "epoch": 1039} {"train_loss": -11.16651439666748, "global_step": 174695, "epoch": 1039} {"train_loss": -10.960983276367188, "global_step": 174696, "epoch": 1039} {"train_loss": -11.16788387298584, "global_step": 174697, "epoch": 1039} {"train_loss": -10.774487495422363, "global_step": 174698, "epoch": 1039} {"train_loss": -11.25206470489502, "global_step": 174699, "epoch": 1039} {"train_loss": -11.084554672241211, "global_step": 174700, "epoch": 1039} {"train_loss": -11.205286979675293, "global_step": 174701, "epoch": 1039} {"train_loss": -11.326583862304688, "global_step": 174702, "epoch": 1039} {"train_loss": -11.157052993774414, "global_step": 174703, "epoch": 1039} {"train_loss": -11.299827575683594, "global_step": 174704, "epoch": 1039} {"train_loss": -10.976232528686523, "global_step": 174705, "epoch": 1039} {"train_loss": -11.160764694213867, "global_step": 174706, "epoch": 1039} {"train_loss": -10.981560707092285, "global_step": 174707, "epoch": 1039} {"train_loss": -11.239569664001465, "global_step": 174708, "epoch": 1039} {"train_loss": -11.301689147949219, "global_step": 174709, "epoch": 1039} {"train_loss": -11.246783256530762, "global_step": 174710, "epoch": 1039} {"train_loss": -11.337567329406738, "global_step": 174711, "epoch": 1039} {"train_loss": -11.298482894897461, "global_step": 174712, "epoch": 1039} {"train_loss": -11.523019790649414, "global_step": 174713, "epoch": 1039} {"train_loss": -11.006547927856445, "global_step": 174714, "epoch": 1039} {"train_loss": -11.224980354309082, "global_step": 174715, "epoch": 1039} {"train_loss": -11.360441207885742, "global_step": 174716, "epoch": 1039} {"train_loss": -11.480767250061035, "global_step": 174717, "epoch": 1039} {"train_loss": -11.049689292907715, "global_step": 174718, "epoch": 1039} {"train_loss": -11.112258843013219, "global_step": 174719, "epoch": 1039, "val_loss": 240971.5} {"train_loss": -11.413395881652832, "global_step": 174720, "epoch": 1040} {"train_loss": -11.200468063354492, "global_step": 174721, "epoch": 1040} {"train_loss": -11.293136596679688, "global_step": 174722, "epoch": 1040} {"train_loss": -11.319405555725098, "global_step": 174723, "epoch": 1040} {"train_loss": -11.55252456665039, "global_step": 174724, "epoch": 1040} {"train_loss": -11.41070556640625, "global_step": 174725, "epoch": 1040} {"train_loss": -11.49710750579834, "global_step": 174726, "epoch": 1040} {"train_loss": -11.384420394897461, "global_step": 174727, "epoch": 1040} {"train_loss": -11.557456016540527, "global_step": 174728, "epoch": 1040} {"train_loss": -11.053616523742676, "global_step": 174729, "epoch": 1040} {"train_loss": -10.793014526367188, "global_step": 174730, "epoch": 1040} {"train_loss": -11.473442077636719, "global_step": 174731, "epoch": 1040} {"train_loss": -11.528165817260742, "global_step": 174732, "epoch": 1040} {"train_loss": -11.314901351928711, "global_step": 174733, "epoch": 1040} {"train_loss": -11.123610496520996, "global_step": 174734, "epoch": 1040} {"train_loss": -11.421701431274414, "global_step": 174735, "epoch": 1040} {"train_loss": -11.320777893066406, "global_step": 174736, "epoch": 1040} {"train_loss": -11.21519660949707, "global_step": 174737, "epoch": 1040} {"train_loss": -11.302011489868164, "global_step": 174738, "epoch": 1040} {"train_loss": -11.24276351928711, "global_step": 174739, "epoch": 1040} {"train_loss": -11.141298294067383, "global_step": 174740, "epoch": 1040} {"train_loss": -11.623361587524414, "global_step": 174741, "epoch": 1040} {"train_loss": -11.08993148803711, "global_step": 174742, "epoch": 1040} {"train_loss": -10.60452651977539, "global_step": 174743, "epoch": 1040} {"train_loss": -11.352272033691406, "global_step": 174744, "epoch": 1040} {"train_loss": -10.513507843017578, "global_step": 174745, "epoch": 1040} {"train_loss": -11.348735809326172, "global_step": 174746, "epoch": 1040} {"train_loss": -11.180559158325195, "global_step": 174747, "epoch": 1040} {"train_loss": -10.25344467163086, "global_step": 174748, "epoch": 1040} {"train_loss": -11.222606658935547, "global_step": 174749, "epoch": 1040} {"train_loss": -11.088666915893555, "global_step": 174750, "epoch": 1040} {"train_loss": -10.743063926696777, "global_step": 174751, "epoch": 1040} {"train_loss": -10.628250122070312, "global_step": 174752, "epoch": 1040} {"train_loss": -11.120363235473633, "global_step": 174753, "epoch": 1040} {"train_loss": -9.089521408081055, "global_step": 174754, "epoch": 1040} {"train_loss": -11.278425216674805, "global_step": 174755, "epoch": 1040} {"train_loss": -10.007472038269043, "global_step": 174756, "epoch": 1040} {"train_loss": -9.659112930297852, "global_step": 174757, "epoch": 1040} {"train_loss": -11.011093139648438, "global_step": 174758, "epoch": 1040} {"train_loss": -10.588805198669434, "global_step": 174759, "epoch": 1040} {"train_loss": -10.753314018249512, "global_step": 174760, "epoch": 1040} {"train_loss": -11.052776336669922, "global_step": 174761, "epoch": 1040} {"train_loss": -10.438338279724121, "global_step": 174762, "epoch": 1040} {"train_loss": -10.828643798828125, "global_step": 174763, "epoch": 1040} {"train_loss": -10.25714111328125, "global_step": 174764, "epoch": 1040} {"train_loss": -10.781248092651367, "global_step": 174765, "epoch": 1040} {"train_loss": -10.990134239196777, "global_step": 174766, "epoch": 1040} {"train_loss": -10.50080394744873, "global_step": 174767, "epoch": 1040} {"train_loss": -11.02769947052002, "global_step": 174768, "epoch": 1040} {"train_loss": -10.806076049804688, "global_step": 174769, "epoch": 1040} {"train_loss": -10.81531047821045, "global_step": 174770, "epoch": 1040} {"train_loss": -10.753766059875488, "global_step": 174771, "epoch": 1040} {"train_loss": -10.8469877243042, "global_step": 174772, "epoch": 1040} {"train_loss": -11.070539474487305, "global_step": 174773, "epoch": 1040} {"train_loss": -11.222747802734375, "global_step": 174774, "epoch": 1040} {"train_loss": -11.046388626098633, "global_step": 174775, "epoch": 1040} {"train_loss": -11.03823471069336, "global_step": 174776, "epoch": 1040} {"train_loss": -10.951467514038086, "global_step": 174777, "epoch": 1040} {"train_loss": -11.022468566894531, "global_step": 174778, "epoch": 1040} {"train_loss": -11.157191276550293, "global_step": 174779, "epoch": 1040} {"train_loss": -11.048355102539062, "global_step": 174780, "epoch": 1040} {"train_loss": -11.033260345458984, "global_step": 174781, "epoch": 1040} {"train_loss": -11.009673118591309, "global_step": 174782, "epoch": 1040} {"train_loss": -11.078754425048828, "global_step": 174783, "epoch": 1040} {"train_loss": -11.118847846984863, "global_step": 174784, "epoch": 1040} {"train_loss": -10.937777519226074, "global_step": 174785, "epoch": 1040} {"train_loss": -10.954505920410156, "global_step": 174786, "epoch": 1040} {"train_loss": -11.179133415222168, "global_step": 174787, "epoch": 1040} {"train_loss": -10.952733993530273, "global_step": 174788, "epoch": 1040} {"train_loss": -10.58668327331543, "global_step": 174789, "epoch": 1040} {"train_loss": -11.121498107910156, "global_step": 174790, "epoch": 1040} {"train_loss": -10.792173385620117, "global_step": 174791, "epoch": 1040} {"train_loss": -10.969038009643555, "global_step": 174792, "epoch": 1040} {"train_loss": -10.828348159790039, "global_step": 174793, "epoch": 1040} {"train_loss": -10.656421661376953, "global_step": 174794, "epoch": 1040} {"train_loss": -11.037263870239258, "global_step": 174795, "epoch": 1040} {"train_loss": -10.846456527709961, "global_step": 174796, "epoch": 1040} {"train_loss": -11.052175521850586, "global_step": 174797, "epoch": 1040} {"train_loss": -10.986696243286133, "global_step": 174798, "epoch": 1040} {"train_loss": -10.745962142944336, "global_step": 174799, "epoch": 1040} {"train_loss": -10.891316413879395, "global_step": 174800, "epoch": 1040} {"train_loss": -11.00823974609375, "global_step": 174801, "epoch": 1040} {"train_loss": -10.73556900024414, "global_step": 174802, "epoch": 1040} {"train_loss": -11.15915298461914, "global_step": 174803, "epoch": 1040} {"train_loss": -11.079526901245117, "global_step": 174804, "epoch": 1040} {"train_loss": -11.190069198608398, "global_step": 174805, "epoch": 1040} {"train_loss": -10.990595817565918, "global_step": 174806, "epoch": 1040} {"train_loss": -11.235015869140625, "global_step": 174807, "epoch": 1040} {"train_loss": -10.850202560424805, "global_step": 174808, "epoch": 1040} {"train_loss": -11.143747329711914, "global_step": 174809, "epoch": 1040} {"train_loss": -11.208789825439453, "global_step": 174810, "epoch": 1040} {"train_loss": -11.193670272827148, "global_step": 174811, "epoch": 1040} {"train_loss": -11.098836898803711, "global_step": 174812, "epoch": 1040} {"train_loss": -10.800946235656738, "global_step": 174813, "epoch": 1040} {"train_loss": -10.905915260314941, "global_step": 174814, "epoch": 1040} {"train_loss": -10.934566497802734, "global_step": 174815, "epoch": 1040} {"train_loss": -10.803834915161133, "global_step": 174816, "epoch": 1040} {"train_loss": -10.798026084899902, "global_step": 174817, "epoch": 1040} {"train_loss": -11.05472469329834, "global_step": 174818, "epoch": 1040} {"train_loss": -10.860549926757812, "global_step": 174819, "epoch": 1040} {"train_loss": -10.863531112670898, "global_step": 174820, "epoch": 1040} {"train_loss": -11.069686889648438, "global_step": 174821, "epoch": 1040} {"train_loss": -11.004541397094727, "global_step": 174822, "epoch": 1040} {"train_loss": -11.160744667053223, "global_step": 174823, "epoch": 1040} {"train_loss": -11.284818649291992, "global_step": 174824, "epoch": 1040} {"train_loss": -11.185563087463379, "global_step": 174825, "epoch": 1040} {"train_loss": -11.050760269165039, "global_step": 174826, "epoch": 1040} {"train_loss": -11.27907943725586, "global_step": 174827, "epoch": 1040} {"train_loss": -11.17595100402832, "global_step": 174828, "epoch": 1040} {"train_loss": -11.076871871948242, "global_step": 174829, "epoch": 1040} {"train_loss": -11.254676818847656, "global_step": 174830, "epoch": 1040} {"train_loss": -11.209064483642578, "global_step": 174831, "epoch": 1040} {"train_loss": -11.236492156982422, "global_step": 174832, "epoch": 1040} {"train_loss": -11.330903053283691, "global_step": 174833, "epoch": 1040} {"train_loss": -11.011398315429688, "global_step": 174834, "epoch": 1040} {"train_loss": -11.36846923828125, "global_step": 174835, "epoch": 1040} {"train_loss": -10.919431686401367, "global_step": 174836, "epoch": 1040} {"train_loss": -11.429200172424316, "global_step": 174837, "epoch": 1040} {"train_loss": -11.411874771118164, "global_step": 174838, "epoch": 1040} {"train_loss": -11.074930191040039, "global_step": 174839, "epoch": 1040} {"train_loss": -11.169252395629883, "global_step": 174840, "epoch": 1040} {"train_loss": -11.172980308532715, "global_step": 174841, "epoch": 1040} {"train_loss": -11.22264575958252, "global_step": 174842, "epoch": 1040} {"train_loss": -11.28268814086914, "global_step": 174843, "epoch": 1040} {"train_loss": -11.246749877929688, "global_step": 174844, "epoch": 1040} {"train_loss": -11.178150177001953, "global_step": 174845, "epoch": 1040} {"train_loss": -11.151640892028809, "global_step": 174846, "epoch": 1040} {"train_loss": -10.798139572143555, "global_step": 174847, "epoch": 1040} {"train_loss": -11.035737991333008, "global_step": 174848, "epoch": 1040} {"train_loss": -10.378190994262695, "global_step": 174849, "epoch": 1040} {"train_loss": -11.204313278198242, "global_step": 174850, "epoch": 1040} {"train_loss": -10.590351104736328, "global_step": 174851, "epoch": 1040} {"train_loss": -10.945291519165039, "global_step": 174852, "epoch": 1040} {"train_loss": -10.652721405029297, "global_step": 174853, "epoch": 1040} {"train_loss": -10.959708213806152, "global_step": 174854, "epoch": 1040} {"train_loss": -10.94804573059082, "global_step": 174855, "epoch": 1040} {"train_loss": -11.150872230529785, "global_step": 174856, "epoch": 1040} {"train_loss": -10.881328582763672, "global_step": 174857, "epoch": 1040} {"train_loss": -11.287873268127441, "global_step": 174858, "epoch": 1040} {"train_loss": -10.998313903808594, "global_step": 174859, "epoch": 1040} {"train_loss": -11.127071380615234, "global_step": 174860, "epoch": 1040} {"train_loss": -10.832310676574707, "global_step": 174861, "epoch": 1040} {"train_loss": -11.218840599060059, "global_step": 174862, "epoch": 1040} {"train_loss": -11.14908504486084, "global_step": 174863, "epoch": 1040} {"train_loss": -10.954930305480957, "global_step": 174864, "epoch": 1040} {"train_loss": -10.887450218200684, "global_step": 174865, "epoch": 1040} {"train_loss": -10.514445304870605, "global_step": 174866, "epoch": 1040} {"train_loss": -11.316594123840332, "global_step": 174867, "epoch": 1040} {"train_loss": -10.899232864379883, "global_step": 174868, "epoch": 1040} {"train_loss": -11.215675354003906, "global_step": 174869, "epoch": 1040} {"train_loss": -11.123006820678711, "global_step": 174870, "epoch": 1040} {"train_loss": -11.005637168884277, "global_step": 174871, "epoch": 1040} {"train_loss": -11.098806381225586, "global_step": 174872, "epoch": 1040} {"train_loss": -11.388187408447266, "global_step": 174873, "epoch": 1040} {"train_loss": -11.107090950012207, "global_step": 174874, "epoch": 1040} {"train_loss": -11.224390029907227, "global_step": 174875, "epoch": 1040} {"train_loss": -11.133352279663086, "global_step": 174876, "epoch": 1040} {"train_loss": -11.281820297241211, "global_step": 174877, "epoch": 1040} {"train_loss": -11.112564086914062, "global_step": 174878, "epoch": 1040} {"train_loss": -11.335345268249512, "global_step": 174879, "epoch": 1040} {"train_loss": -11.203218460083008, "global_step": 174880, "epoch": 1040} {"train_loss": -11.079338073730469, "global_step": 174881, "epoch": 1040} {"train_loss": -11.320585250854492, "global_step": 174882, "epoch": 1040} {"train_loss": -11.035913467407227, "global_step": 174883, "epoch": 1040} {"train_loss": -11.1649751663208, "global_step": 174884, "epoch": 1040} {"train_loss": -11.452611923217773, "global_step": 174885, "epoch": 1040} {"train_loss": -11.051206588745117, "global_step": 174886, "epoch": 1040} {"train_loss": -11.030959350722176, "global_step": 174887, "epoch": 1040, "val_loss": 242829.484375, "train_action_mse_error": 2.0545871257781982} {"train_loss": -11.18974494934082, "global_step": 174888, "epoch": 1041} {"train_loss": -11.176502227783203, "global_step": 174889, "epoch": 1041} {"train_loss": -11.176244735717773, "global_step": 174890, "epoch": 1041} {"train_loss": -11.443475723266602, "global_step": 174891, "epoch": 1041} {"train_loss": -11.111082077026367, "global_step": 174892, "epoch": 1041} {"train_loss": -11.14256477355957, "global_step": 174893, "epoch": 1041} {"train_loss": -11.136129379272461, "global_step": 174894, "epoch": 1041} {"train_loss": -11.130780220031738, "global_step": 174895, "epoch": 1041} {"train_loss": -10.9326753616333, "global_step": 174896, "epoch": 1041} {"train_loss": -11.197038650512695, "global_step": 174897, "epoch": 1041} {"train_loss": -11.427946090698242, "global_step": 174898, "epoch": 1041} {"train_loss": -11.031000137329102, "global_step": 174899, "epoch": 1041} {"train_loss": -10.981494903564453, "global_step": 174900, "epoch": 1041} {"train_loss": -11.016020774841309, "global_step": 174901, "epoch": 1041} {"train_loss": -11.318581581115723, "global_step": 174902, "epoch": 1041} {"train_loss": -11.516538619995117, "global_step": 174903, "epoch": 1041} {"train_loss": -11.113615036010742, "global_step": 174904, "epoch": 1041} {"train_loss": -10.951436996459961, "global_step": 174905, "epoch": 1041} {"train_loss": -11.286492347717285, "global_step": 174906, "epoch": 1041} {"train_loss": -10.884057998657227, "global_step": 174907, "epoch": 1041} {"train_loss": -11.324308395385742, "global_step": 174908, "epoch": 1041} {"train_loss": -11.097715377807617, "global_step": 174909, "epoch": 1041} {"train_loss": -10.958783149719238, "global_step": 174910, "epoch": 1041} {"train_loss": -10.21890640258789, "global_step": 174911, "epoch": 1041} {"train_loss": -10.562797546386719, "global_step": 174912, "epoch": 1041} {"train_loss": -9.88491439819336, "global_step": 174913, "epoch": 1041} {"train_loss": -8.709146499633789, "global_step": 174914, "epoch": 1041} {"train_loss": -7.672146797180176, "global_step": 174915, "epoch": 1041} {"train_loss": -9.291961669921875, "global_step": 174916, "epoch": 1041} {"train_loss": -9.061272621154785, "global_step": 174917, "epoch": 1041} {"train_loss": -8.625055313110352, "global_step": 174918, "epoch": 1041} {"train_loss": -8.373942375183105, "global_step": 174919, "epoch": 1041} {"train_loss": -8.8289794921875, "global_step": 174920, "epoch": 1041} {"train_loss": -9.259263038635254, "global_step": 174921, "epoch": 1041} {"train_loss": -9.354493141174316, "global_step": 174922, "epoch": 1041} {"train_loss": -9.30630111694336, "global_step": 174923, "epoch": 1041} {"train_loss": -8.430856704711914, "global_step": 174924, "epoch": 1041} {"train_loss": -9.167064666748047, "global_step": 174925, "epoch": 1041} {"train_loss": -9.158217430114746, "global_step": 174926, "epoch": 1041} {"train_loss": -8.049041748046875, "global_step": 174927, "epoch": 1041} {"train_loss": -10.020129203796387, "global_step": 174928, "epoch": 1041} {"train_loss": -8.973803520202637, "global_step": 174929, "epoch": 1041} {"train_loss": -10.228497505187988, "global_step": 174930, "epoch": 1041} {"train_loss": -9.622682571411133, "global_step": 174931, "epoch": 1041} {"train_loss": -10.744598388671875, "global_step": 174932, "epoch": 1041} {"train_loss": -9.9452486038208, "global_step": 174933, "epoch": 1041} {"train_loss": -9.985432624816895, "global_step": 174934, "epoch": 1041} {"train_loss": -10.485832214355469, "global_step": 174935, "epoch": 1041} {"train_loss": -10.215433120727539, "global_step": 174936, "epoch": 1041} {"train_loss": -10.663533210754395, "global_step": 174937, "epoch": 1041} {"train_loss": -10.488079071044922, "global_step": 174938, "epoch": 1041} {"train_loss": -10.794391632080078, "global_step": 174939, "epoch": 1041} {"train_loss": -10.62099552154541, "global_step": 174940, "epoch": 1041} {"train_loss": -10.525761604309082, "global_step": 174941, "epoch": 1041} {"train_loss": -10.761070251464844, "global_step": 174942, "epoch": 1041} {"train_loss": -10.877401351928711, "global_step": 174943, "epoch": 1041} {"train_loss": -10.511506080627441, "global_step": 174944, "epoch": 1041} {"train_loss": -10.67765998840332, "global_step": 174945, "epoch": 1041} {"train_loss": -10.846292495727539, "global_step": 174946, "epoch": 1041} {"train_loss": -10.584358215332031, "global_step": 174947, "epoch": 1041} {"train_loss": -10.765560150146484, "global_step": 174948, "epoch": 1041} {"train_loss": -10.827069282531738, "global_step": 174949, "epoch": 1041} {"train_loss": -10.746967315673828, "global_step": 174950, "epoch": 1041} {"train_loss": -10.927255630493164, "global_step": 174951, "epoch": 1041} {"train_loss": -10.798080444335938, "global_step": 174952, "epoch": 1041} {"train_loss": -10.834115982055664, "global_step": 174953, "epoch": 1041} {"train_loss": -10.900032043457031, "global_step": 174954, "epoch": 1041} {"train_loss": -10.837681770324707, "global_step": 174955, "epoch": 1041} {"train_loss": -10.933484077453613, "global_step": 174956, "epoch": 1041} {"train_loss": -10.901100158691406, "global_step": 174957, "epoch": 1041} {"train_loss": -10.809089660644531, "global_step": 174958, "epoch": 1041} {"train_loss": -11.139606475830078, "global_step": 174959, "epoch": 1041} {"train_loss": -10.905840873718262, "global_step": 174960, "epoch": 1041} {"train_loss": -11.10319709777832, "global_step": 174961, "epoch": 1041} {"train_loss": -11.048698425292969, "global_step": 174962, "epoch": 1041} {"train_loss": -10.937088012695312, "global_step": 174963, "epoch": 1041} {"train_loss": -11.172626495361328, "global_step": 174964, "epoch": 1041} {"train_loss": -10.783651351928711, "global_step": 174965, "epoch": 1041} {"train_loss": -11.153996467590332, "global_step": 174966, "epoch": 1041} {"train_loss": -11.08888053894043, "global_step": 174967, "epoch": 1041} {"train_loss": -11.11174201965332, "global_step": 174968, "epoch": 1041} {"train_loss": -11.225851058959961, "global_step": 174969, "epoch": 1041} {"train_loss": -11.094654083251953, "global_step": 174970, "epoch": 1041} {"train_loss": -11.280139923095703, "global_step": 174971, "epoch": 1041} {"train_loss": -11.278118133544922, "global_step": 174972, "epoch": 1041} {"train_loss": -11.124156951904297, "global_step": 174973, "epoch": 1041} {"train_loss": -11.298161506652832, "global_step": 174974, "epoch": 1041} {"train_loss": -11.241472244262695, "global_step": 174975, "epoch": 1041} {"train_loss": -11.236034393310547, "global_step": 174976, "epoch": 1041} {"train_loss": -11.255098342895508, "global_step": 174977, "epoch": 1041} {"train_loss": -11.271854400634766, "global_step": 174978, "epoch": 1041} {"train_loss": -11.372551918029785, "global_step": 174979, "epoch": 1041} {"train_loss": -11.335819244384766, "global_step": 174980, "epoch": 1041} {"train_loss": -11.070503234863281, "global_step": 174981, "epoch": 1041} {"train_loss": -11.394195556640625, "global_step": 174982, "epoch": 1041} {"train_loss": -11.062145233154297, "global_step": 174983, "epoch": 1041} {"train_loss": -11.109260559082031, "global_step": 174984, "epoch": 1041} {"train_loss": -11.278827667236328, "global_step": 174985, "epoch": 1041} {"train_loss": -11.306730270385742, "global_step": 174986, "epoch": 1041} {"train_loss": -11.12846851348877, "global_step": 174987, "epoch": 1041} {"train_loss": -11.192035675048828, "global_step": 174988, "epoch": 1041} {"train_loss": -11.214994430541992, "global_step": 174989, "epoch": 1041} {"train_loss": -11.287664413452148, "global_step": 174990, "epoch": 1041} {"train_loss": -11.4667387008667, "global_step": 174991, "epoch": 1041} {"train_loss": -11.323473930358887, "global_step": 174992, "epoch": 1041} {"train_loss": -11.22873592376709, "global_step": 174993, "epoch": 1041} {"train_loss": -10.885242462158203, "global_step": 174994, "epoch": 1041} {"train_loss": -11.079683303833008, "global_step": 174995, "epoch": 1041} {"train_loss": -11.31254768371582, "global_step": 174996, "epoch": 1041} {"train_loss": -10.638525009155273, "global_step": 174997, "epoch": 1041} {"train_loss": -9.92291259765625, "global_step": 174998, "epoch": 1041} {"train_loss": -11.14286994934082, "global_step": 174999, "epoch": 1041} {"train_loss": -10.845725059509277, "global_step": 175000, "epoch": 1041} {"train_loss": -10.984685897827148, "global_step": 175001, "epoch": 1041} {"train_loss": -11.121480941772461, "global_step": 175002, "epoch": 1041} {"train_loss": -11.311901092529297, "global_step": 175003, "epoch": 1041} {"train_loss": -11.115119934082031, "global_step": 175004, "epoch": 1041} {"train_loss": -11.498979568481445, "global_step": 175005, "epoch": 1041} {"train_loss": -10.995834350585938, "global_step": 175006, "epoch": 1041} {"train_loss": -11.4509859085083, "global_step": 175007, "epoch": 1041} {"train_loss": -11.32593822479248, "global_step": 175008, "epoch": 1041} {"train_loss": -11.294888496398926, "global_step": 175009, "epoch": 1041} {"train_loss": -11.327014923095703, "global_step": 175010, "epoch": 1041} {"train_loss": -11.227310180664062, "global_step": 175011, "epoch": 1041} {"train_loss": -11.211264610290527, "global_step": 175012, "epoch": 1041} {"train_loss": -11.25466537475586, "global_step": 175013, "epoch": 1041} {"train_loss": -11.149599075317383, "global_step": 175014, "epoch": 1041} {"train_loss": -11.084493637084961, "global_step": 175015, "epoch": 1041} {"train_loss": -11.38946533203125, "global_step": 175016, "epoch": 1041} {"train_loss": -11.190279006958008, "global_step": 175017, "epoch": 1041} {"train_loss": -11.250877380371094, "global_step": 175018, "epoch": 1041} {"train_loss": -11.184778213500977, "global_step": 175019, "epoch": 1041} {"train_loss": -10.793489456176758, "global_step": 175020, "epoch": 1041} {"train_loss": -11.218742370605469, "global_step": 175021, "epoch": 1041} {"train_loss": -10.813063621520996, "global_step": 175022, "epoch": 1041} {"train_loss": -10.84492301940918, "global_step": 175023, "epoch": 1041} {"train_loss": -11.230350494384766, "global_step": 175024, "epoch": 1041} {"train_loss": -10.012275695800781, "global_step": 175025, "epoch": 1041} {"train_loss": -10.432981491088867, "global_step": 175026, "epoch": 1041} {"train_loss": -10.906042098999023, "global_step": 175027, "epoch": 1041} {"train_loss": -10.730568885803223, "global_step": 175028, "epoch": 1041} {"train_loss": -10.880847930908203, "global_step": 175029, "epoch": 1041} {"train_loss": -10.97576904296875, "global_step": 175030, "epoch": 1041} {"train_loss": -11.063756942749023, "global_step": 175031, "epoch": 1041} {"train_loss": -10.608226776123047, "global_step": 175032, "epoch": 1041} {"train_loss": -11.115694046020508, "global_step": 175033, "epoch": 1041} {"train_loss": -10.633878707885742, "global_step": 175034, "epoch": 1041} {"train_loss": -11.079048156738281, "global_step": 175035, "epoch": 1041} {"train_loss": -10.64150619506836, "global_step": 175036, "epoch": 1041} {"train_loss": -10.89914608001709, "global_step": 175037, "epoch": 1041} {"train_loss": -10.673773765563965, "global_step": 175038, "epoch": 1041} {"train_loss": -10.72546100616455, "global_step": 175039, "epoch": 1041} {"train_loss": -10.195037841796875, "global_step": 175040, "epoch": 1041} {"train_loss": -10.86573314666748, "global_step": 175041, "epoch": 1041} {"train_loss": -10.637090682983398, "global_step": 175042, "epoch": 1041} {"train_loss": -10.71477222442627, "global_step": 175043, "epoch": 1041} {"train_loss": -11.195173263549805, "global_step": 175044, "epoch": 1041} {"train_loss": -10.575467109680176, "global_step": 175045, "epoch": 1041} {"train_loss": -11.070079803466797, "global_step": 175046, "epoch": 1041} {"train_loss": -10.849772453308105, "global_step": 175047, "epoch": 1041} {"train_loss": -10.4100341796875, "global_step": 175048, "epoch": 1041} {"train_loss": -10.873188018798828, "global_step": 175049, "epoch": 1041} {"train_loss": -10.410635948181152, "global_step": 175050, "epoch": 1041} {"train_loss": -10.549707412719727, "global_step": 175051, "epoch": 1041} {"train_loss": -10.463499069213867, "global_step": 175052, "epoch": 1041} {"train_loss": -10.671854019165039, "global_step": 175053, "epoch": 1041} {"train_loss": -10.662033081054688, "global_step": 175054, "epoch": 1041} {"train_loss": -10.743439555168152, "global_step": 175055, "epoch": 1041, "val_loss": 241960.875} {"train_loss": -10.514446258544922, "global_step": 175056, "epoch": 1042} {"train_loss": -10.905691146850586, "global_step": 175057, "epoch": 1042} {"train_loss": -10.673248291015625, "global_step": 175058, "epoch": 1042} {"train_loss": -11.257182121276855, "global_step": 175059, "epoch": 1042} {"train_loss": -11.079057693481445, "global_step": 175060, "epoch": 1042} {"train_loss": -11.062301635742188, "global_step": 175061, "epoch": 1042} {"train_loss": -10.879210472106934, "global_step": 175062, "epoch": 1042} {"train_loss": -10.845932960510254, "global_step": 175063, "epoch": 1042} {"train_loss": -10.81873893737793, "global_step": 175064, "epoch": 1042} {"train_loss": -11.159195899963379, "global_step": 175065, "epoch": 1042} {"train_loss": -10.666356086730957, "global_step": 175066, "epoch": 1042} {"train_loss": -11.3142728805542, "global_step": 175067, "epoch": 1042} {"train_loss": -10.493634223937988, "global_step": 175068, "epoch": 1042} {"train_loss": -11.148109436035156, "global_step": 175069, "epoch": 1042} {"train_loss": -11.0060453414917, "global_step": 175070, "epoch": 1042} {"train_loss": -11.218820571899414, "global_step": 175071, "epoch": 1042} {"train_loss": -11.025638580322266, "global_step": 175072, "epoch": 1042} {"train_loss": -11.313894271850586, "global_step": 175073, "epoch": 1042} {"train_loss": -10.979547500610352, "global_step": 175074, "epoch": 1042} {"train_loss": -11.3554105758667, "global_step": 175075, "epoch": 1042} {"train_loss": -10.981451988220215, "global_step": 175076, "epoch": 1042} {"train_loss": -11.21491527557373, "global_step": 175077, "epoch": 1042} {"train_loss": -11.127281188964844, "global_step": 175078, "epoch": 1042} {"train_loss": -11.190411567687988, "global_step": 175079, "epoch": 1042} {"train_loss": -11.207782745361328, "global_step": 175080, "epoch": 1042} {"train_loss": -11.279955863952637, "global_step": 175081, "epoch": 1042} {"train_loss": -11.389505386352539, "global_step": 175082, "epoch": 1042} {"train_loss": -11.255494117736816, "global_step": 175083, "epoch": 1042} {"train_loss": -11.176370620727539, "global_step": 175084, "epoch": 1042} {"train_loss": -11.173955917358398, "global_step": 175085, "epoch": 1042} {"train_loss": -11.32571029663086, "global_step": 175086, "epoch": 1042} {"train_loss": -11.209309577941895, "global_step": 175087, "epoch": 1042} {"train_loss": -11.263795852661133, "global_step": 175088, "epoch": 1042} {"train_loss": -11.029996871948242, "global_step": 175089, "epoch": 1042} {"train_loss": -11.282510757446289, "global_step": 175090, "epoch": 1042} {"train_loss": -11.181512832641602, "global_step": 175091, "epoch": 1042} {"train_loss": -11.25820541381836, "global_step": 175092, "epoch": 1042} {"train_loss": -11.429121017456055, "global_step": 175093, "epoch": 1042} {"train_loss": -11.321938514709473, "global_step": 175094, "epoch": 1042} {"train_loss": -11.099567413330078, "global_step": 175095, "epoch": 1042} {"train_loss": -10.911941528320312, "global_step": 175096, "epoch": 1042} {"train_loss": -11.313177108764648, "global_step": 175097, "epoch": 1042} {"train_loss": -10.918761253356934, "global_step": 175098, "epoch": 1042} {"train_loss": -10.882513046264648, "global_step": 175099, "epoch": 1042} {"train_loss": -11.162325859069824, "global_step": 175100, "epoch": 1042} {"train_loss": -11.413283348083496, "global_step": 175101, "epoch": 1042} {"train_loss": -10.968647003173828, "global_step": 175102, "epoch": 1042} {"train_loss": -11.400165557861328, "global_step": 175103, "epoch": 1042} {"train_loss": -10.81931209564209, "global_step": 175104, "epoch": 1042} {"train_loss": -11.175143241882324, "global_step": 175105, "epoch": 1042} {"train_loss": -11.117050170898438, "global_step": 175106, "epoch": 1042} {"train_loss": -11.114495277404785, "global_step": 175107, "epoch": 1042} {"train_loss": -10.990951538085938, "global_step": 175108, "epoch": 1042} {"train_loss": -11.089644432067871, "global_step": 175109, "epoch": 1042} {"train_loss": -10.749713897705078, "global_step": 175110, "epoch": 1042} {"train_loss": -11.347288131713867, "global_step": 175111, "epoch": 1042} {"train_loss": -11.053744316101074, "global_step": 175112, "epoch": 1042} {"train_loss": -11.168633460998535, "global_step": 175113, "epoch": 1042} {"train_loss": -11.32404899597168, "global_step": 175114, "epoch": 1042} {"train_loss": -11.49460506439209, "global_step": 175115, "epoch": 1042} {"train_loss": -11.13366985321045, "global_step": 175116, "epoch": 1042} {"train_loss": -10.9073486328125, "global_step": 175117, "epoch": 1042} {"train_loss": -10.728952407836914, "global_step": 175118, "epoch": 1042} {"train_loss": -10.18593978881836, "global_step": 175119, "epoch": 1042} {"train_loss": -10.679289817810059, "global_step": 175120, "epoch": 1042} {"train_loss": -10.709755897521973, "global_step": 175121, "epoch": 1042} {"train_loss": -9.415840148925781, "global_step": 175122, "epoch": 1042} {"train_loss": -10.043254852294922, "global_step": 175123, "epoch": 1042} {"train_loss": -9.57552719116211, "global_step": 175124, "epoch": 1042} {"train_loss": -10.778701782226562, "global_step": 175125, "epoch": 1042} {"train_loss": -9.388222694396973, "global_step": 175126, "epoch": 1042} {"train_loss": -10.55871868133545, "global_step": 175127, "epoch": 1042} {"train_loss": -10.35431957244873, "global_step": 175128, "epoch": 1042} {"train_loss": -10.572694778442383, "global_step": 175129, "epoch": 1042} {"train_loss": -10.512596130371094, "global_step": 175130, "epoch": 1042} {"train_loss": -10.597057342529297, "global_step": 175131, "epoch": 1042} {"train_loss": -10.616811752319336, "global_step": 175132, "epoch": 1042} {"train_loss": -10.54014778137207, "global_step": 175133, "epoch": 1042} {"train_loss": -10.299413681030273, "global_step": 175134, "epoch": 1042} {"train_loss": -10.922599792480469, "global_step": 175135, "epoch": 1042} {"train_loss": -10.61860179901123, "global_step": 175136, "epoch": 1042} {"train_loss": -10.920918464660645, "global_step": 175137, "epoch": 1042} {"train_loss": -10.502041816711426, "global_step": 175138, "epoch": 1042} {"train_loss": -10.597810745239258, "global_step": 175139, "epoch": 1042} {"train_loss": -10.515216827392578, "global_step": 175140, "epoch": 1042} {"train_loss": -10.965681076049805, "global_step": 175141, "epoch": 1042} {"train_loss": -10.89678955078125, "global_step": 175142, "epoch": 1042} {"train_loss": -10.755399703979492, "global_step": 175143, "epoch": 1042} {"train_loss": -10.739486694335938, "global_step": 175144, "epoch": 1042} {"train_loss": -10.757994651794434, "global_step": 175145, "epoch": 1042} {"train_loss": -10.598877906799316, "global_step": 175146, "epoch": 1042} {"train_loss": -11.04310131072998, "global_step": 175147, "epoch": 1042} {"train_loss": -10.831329345703125, "global_step": 175148, "epoch": 1042} {"train_loss": -10.966079711914062, "global_step": 175149, "epoch": 1042} {"train_loss": -10.420823097229004, "global_step": 175150, "epoch": 1042} {"train_loss": -10.662178039550781, "global_step": 175151, "epoch": 1042} {"train_loss": -10.703149795532227, "global_step": 175152, "epoch": 1042} {"train_loss": -10.76905345916748, "global_step": 175153, "epoch": 1042} {"train_loss": -10.797246932983398, "global_step": 175154, "epoch": 1042} {"train_loss": -10.79193115234375, "global_step": 175155, "epoch": 1042} {"train_loss": -10.768929481506348, "global_step": 175156, "epoch": 1042} {"train_loss": -10.497498512268066, "global_step": 175157, "epoch": 1042} {"train_loss": -10.901521682739258, "global_step": 175158, "epoch": 1042} {"train_loss": -11.211589813232422, "global_step": 175159, "epoch": 1042} {"train_loss": -10.561177253723145, "global_step": 175160, "epoch": 1042} {"train_loss": -10.926421165466309, "global_step": 175161, "epoch": 1042} {"train_loss": -11.115633010864258, "global_step": 175162, "epoch": 1042} {"train_loss": -11.069507598876953, "global_step": 175163, "epoch": 1042} {"train_loss": -11.115477561950684, "global_step": 175164, "epoch": 1042} {"train_loss": -10.965463638305664, "global_step": 175165, "epoch": 1042} {"train_loss": -11.356130599975586, "global_step": 175166, "epoch": 1042} {"train_loss": -10.920881271362305, "global_step": 175167, "epoch": 1042} {"train_loss": -11.07962703704834, "global_step": 175168, "epoch": 1042} {"train_loss": -11.149412155151367, "global_step": 175169, "epoch": 1042} {"train_loss": -11.07154655456543, "global_step": 175170, "epoch": 1042} {"train_loss": -11.147454261779785, "global_step": 175171, "epoch": 1042} {"train_loss": -11.025115966796875, "global_step": 175172, "epoch": 1042} {"train_loss": -10.972475051879883, "global_step": 175173, "epoch": 1042} {"train_loss": -10.921238899230957, "global_step": 175174, "epoch": 1042} {"train_loss": -11.03649616241455, "global_step": 175175, "epoch": 1042} {"train_loss": -11.222238540649414, "global_step": 175176, "epoch": 1042} {"train_loss": -11.39983081817627, "global_step": 175177, "epoch": 1042} {"train_loss": -11.070966720581055, "global_step": 175178, "epoch": 1042} {"train_loss": -11.31379508972168, "global_step": 175179, "epoch": 1042} {"train_loss": -11.361804008483887, "global_step": 175180, "epoch": 1042} {"train_loss": -11.33100414276123, "global_step": 175181, "epoch": 1042} {"train_loss": -11.399505615234375, "global_step": 175182, "epoch": 1042} {"train_loss": -11.140535354614258, "global_step": 175183, "epoch": 1042} {"train_loss": -11.29780387878418, "global_step": 175184, "epoch": 1042} {"train_loss": -11.308225631713867, "global_step": 175185, "epoch": 1042} {"train_loss": -11.407890319824219, "global_step": 175186, "epoch": 1042} {"train_loss": -11.61924934387207, "global_step": 175187, "epoch": 1042} {"train_loss": -11.13000202178955, "global_step": 175188, "epoch": 1042} {"train_loss": -11.198671340942383, "global_step": 175189, "epoch": 1042} {"train_loss": -11.423925399780273, "global_step": 175190, "epoch": 1042} {"train_loss": -11.391424179077148, "global_step": 175191, "epoch": 1042} {"train_loss": -11.374314308166504, "global_step": 175192, "epoch": 1042} {"train_loss": -11.309582710266113, "global_step": 175193, "epoch": 1042} {"train_loss": -11.46743392944336, "global_step": 175194, "epoch": 1042} {"train_loss": -11.550128936767578, "global_step": 175195, "epoch": 1042} {"train_loss": -11.330696105957031, "global_step": 175196, "epoch": 1042} {"train_loss": -11.48432731628418, "global_step": 175197, "epoch": 1042} {"train_loss": -11.262157440185547, "global_step": 175198, "epoch": 1042} {"train_loss": -11.490671157836914, "global_step": 175199, "epoch": 1042} {"train_loss": -11.337013244628906, "global_step": 175200, "epoch": 1042} {"train_loss": -11.561542510986328, "global_step": 175201, "epoch": 1042} {"train_loss": -11.40745735168457, "global_step": 175202, "epoch": 1042} {"train_loss": -11.522915840148926, "global_step": 175203, "epoch": 1042} {"train_loss": -11.315387725830078, "global_step": 175204, "epoch": 1042} {"train_loss": -11.236175537109375, "global_step": 175205, "epoch": 1042} {"train_loss": -11.48107624053955, "global_step": 175206, "epoch": 1042} {"train_loss": -11.460700988769531, "global_step": 175207, "epoch": 1042} {"train_loss": -11.409080505371094, "global_step": 175208, "epoch": 1042} {"train_loss": -11.286819458007812, "global_step": 175209, "epoch": 1042} {"train_loss": -10.758906364440918, "global_step": 175210, "epoch": 1042} {"train_loss": -11.541574478149414, "global_step": 175211, "epoch": 1042} {"train_loss": -11.218360900878906, "global_step": 175212, "epoch": 1042} {"train_loss": -11.017097473144531, "global_step": 175213, "epoch": 1042} {"train_loss": -11.251850128173828, "global_step": 175214, "epoch": 1042} {"train_loss": -11.32754898071289, "global_step": 175215, "epoch": 1042} {"train_loss": -11.315681457519531, "global_step": 175216, "epoch": 1042} {"train_loss": -11.09179401397705, "global_step": 175217, "epoch": 1042} {"train_loss": -11.235218048095703, "global_step": 175218, "epoch": 1042} {"train_loss": -10.375981330871582, "global_step": 175219, "epoch": 1042} {"train_loss": -10.83613395690918, "global_step": 175220, "epoch": 1042} {"train_loss": -11.150349617004395, "global_step": 175221, "epoch": 1042} {"train_loss": -10.873640060424805, "global_step": 175222, "epoch": 1042} {"train_loss": -11.019138597306751, "global_step": 175223, "epoch": 1042, "val_loss": 241381.390625} {"train_loss": -10.639108657836914, "global_step": 175224, "epoch": 1043} {"train_loss": -10.084318161010742, "global_step": 175225, "epoch": 1043} {"train_loss": -11.073735237121582, "global_step": 175226, "epoch": 1043} {"train_loss": -10.453319549560547, "global_step": 175227, "epoch": 1043} {"train_loss": -10.199668884277344, "global_step": 175228, "epoch": 1043} {"train_loss": -10.591419219970703, "global_step": 175229, "epoch": 1043} {"train_loss": -9.540130615234375, "global_step": 175230, "epoch": 1043} {"train_loss": -9.078620910644531, "global_step": 175231, "epoch": 1043} {"train_loss": -10.265514373779297, "global_step": 175232, "epoch": 1043} {"train_loss": -10.001127243041992, "global_step": 175233, "epoch": 1043} {"train_loss": -10.225613594055176, "global_step": 175234, "epoch": 1043} {"train_loss": -10.39764404296875, "global_step": 175235, "epoch": 1043} {"train_loss": -10.351011276245117, "global_step": 175236, "epoch": 1043} {"train_loss": -10.484746932983398, "global_step": 175237, "epoch": 1043} {"train_loss": -10.670156478881836, "global_step": 175238, "epoch": 1043} {"train_loss": -10.392919540405273, "global_step": 175239, "epoch": 1043} {"train_loss": -11.092498779296875, "global_step": 175240, "epoch": 1043} {"train_loss": -10.886869430541992, "global_step": 175241, "epoch": 1043} {"train_loss": -10.959357261657715, "global_step": 175242, "epoch": 1043} {"train_loss": -10.601767539978027, "global_step": 175243, "epoch": 1043} {"train_loss": -10.499597549438477, "global_step": 175244, "epoch": 1043} {"train_loss": -10.870155334472656, "global_step": 175245, "epoch": 1043} {"train_loss": -10.73483943939209, "global_step": 175246, "epoch": 1043} {"train_loss": -10.909390449523926, "global_step": 175247, "epoch": 1043} {"train_loss": -10.725879669189453, "global_step": 175248, "epoch": 1043} {"train_loss": -10.535268783569336, "global_step": 175249, "epoch": 1043} {"train_loss": -10.752230644226074, "global_step": 175250, "epoch": 1043} {"train_loss": -10.587992668151855, "global_step": 175251, "epoch": 1043} {"train_loss": -10.664666175842285, "global_step": 175252, "epoch": 1043} {"train_loss": -10.967584609985352, "global_step": 175253, "epoch": 1043} {"train_loss": -10.739236831665039, "global_step": 175254, "epoch": 1043} {"train_loss": -10.794151306152344, "global_step": 175255, "epoch": 1043} {"train_loss": -10.83060359954834, "global_step": 175256, "epoch": 1043} {"train_loss": -10.76870059967041, "global_step": 175257, "epoch": 1043} {"train_loss": -10.697349548339844, "global_step": 175258, "epoch": 1043} {"train_loss": -10.940628051757812, "global_step": 175259, "epoch": 1043} {"train_loss": -10.80528736114502, "global_step": 175260, "epoch": 1043} {"train_loss": -11.101089477539062, "global_step": 175261, "epoch": 1043} {"train_loss": -10.713798522949219, "global_step": 175262, "epoch": 1043} {"train_loss": -11.07132339477539, "global_step": 175263, "epoch": 1043} {"train_loss": -10.738713264465332, "global_step": 175264, "epoch": 1043} {"train_loss": -10.926891326904297, "global_step": 175265, "epoch": 1043} {"train_loss": -11.022943496704102, "global_step": 175266, "epoch": 1043} {"train_loss": -11.138404846191406, "global_step": 175267, "epoch": 1043} {"train_loss": -11.228723526000977, "global_step": 175268, "epoch": 1043} {"train_loss": -10.788915634155273, "global_step": 175269, "epoch": 1043} {"train_loss": -10.888547897338867, "global_step": 175270, "epoch": 1043} {"train_loss": -10.873537063598633, "global_step": 175271, "epoch": 1043} {"train_loss": -10.990483283996582, "global_step": 175272, "epoch": 1043} {"train_loss": -10.967782020568848, "global_step": 175273, "epoch": 1043} {"train_loss": -11.070969581604004, "global_step": 175274, "epoch": 1043} {"train_loss": -10.876869201660156, "global_step": 175275, "epoch": 1043} {"train_loss": -11.115592002868652, "global_step": 175276, "epoch": 1043} {"train_loss": -10.70008659362793, "global_step": 175277, "epoch": 1043} {"train_loss": -11.176165580749512, "global_step": 175278, "epoch": 1043} {"train_loss": -10.728487968444824, "global_step": 175279, "epoch": 1043} {"train_loss": -11.02583122253418, "global_step": 175280, "epoch": 1043} {"train_loss": -10.639914512634277, "global_step": 175281, "epoch": 1043} {"train_loss": -11.17818832397461, "global_step": 175282, "epoch": 1043} {"train_loss": -10.652181625366211, "global_step": 175283, "epoch": 1043} {"train_loss": -11.434450149536133, "global_step": 175284, "epoch": 1043} {"train_loss": -10.773427963256836, "global_step": 175285, "epoch": 1043} {"train_loss": -11.151257514953613, "global_step": 175286, "epoch": 1043} {"train_loss": -10.832305908203125, "global_step": 175287, "epoch": 1043} {"train_loss": -10.65092945098877, "global_step": 175288, "epoch": 1043} {"train_loss": -11.124202728271484, "global_step": 175289, "epoch": 1043} {"train_loss": -10.398584365844727, "global_step": 175290, "epoch": 1043} {"train_loss": -10.823463439941406, "global_step": 175291, "epoch": 1043} {"train_loss": -11.128704071044922, "global_step": 175292, "epoch": 1043} {"train_loss": -9.493982315063477, "global_step": 175293, "epoch": 1043} {"train_loss": -11.173416137695312, "global_step": 175294, "epoch": 1043} {"train_loss": -10.436445236206055, "global_step": 175295, "epoch": 1043} {"train_loss": -11.006619453430176, "global_step": 175296, "epoch": 1043} {"train_loss": -10.27153491973877, "global_step": 175297, "epoch": 1043} {"train_loss": -10.667119026184082, "global_step": 175298, "epoch": 1043} {"train_loss": -10.808513641357422, "global_step": 175299, "epoch": 1043} {"train_loss": -10.279745101928711, "global_step": 175300, "epoch": 1043} {"train_loss": -10.758056640625, "global_step": 175301, "epoch": 1043} {"train_loss": -10.502281188964844, "global_step": 175302, "epoch": 1043} {"train_loss": -10.896312713623047, "global_step": 175303, "epoch": 1043} {"train_loss": -10.620505332946777, "global_step": 175304, "epoch": 1043} {"train_loss": -11.196115493774414, "global_step": 175305, "epoch": 1043} {"train_loss": -10.516424179077148, "global_step": 175306, "epoch": 1043} {"train_loss": -10.918906211853027, "global_step": 175307, "epoch": 1043} {"train_loss": -10.45875358581543, "global_step": 175308, "epoch": 1043} {"train_loss": -10.70894718170166, "global_step": 175309, "epoch": 1043} {"train_loss": -10.837882041931152, "global_step": 175310, "epoch": 1043} {"train_loss": -10.821953773498535, "global_step": 175311, "epoch": 1043} {"train_loss": -10.705421447753906, "global_step": 175312, "epoch": 1043} {"train_loss": -10.356245994567871, "global_step": 175313, "epoch": 1043} {"train_loss": -10.910356521606445, "global_step": 175314, "epoch": 1043} {"train_loss": -10.140323638916016, "global_step": 175315, "epoch": 1043} {"train_loss": -10.806180953979492, "global_step": 175316, "epoch": 1043} {"train_loss": -10.442909240722656, "global_step": 175317, "epoch": 1043} {"train_loss": -11.08427619934082, "global_step": 175318, "epoch": 1043} {"train_loss": -10.610408782958984, "global_step": 175319, "epoch": 1043} {"train_loss": -11.007369995117188, "global_step": 175320, "epoch": 1043} {"train_loss": -10.793869018554688, "global_step": 175321, "epoch": 1043} {"train_loss": -10.976431846618652, "global_step": 175322, "epoch": 1043} {"train_loss": -10.674314498901367, "global_step": 175323, "epoch": 1043} {"train_loss": -11.08671760559082, "global_step": 175324, "epoch": 1043} {"train_loss": -11.015260696411133, "global_step": 175325, "epoch": 1043} {"train_loss": -11.127793312072754, "global_step": 175326, "epoch": 1043} {"train_loss": -11.03751277923584, "global_step": 175327, "epoch": 1043} {"train_loss": -10.719030380249023, "global_step": 175328, "epoch": 1043} {"train_loss": -10.841794967651367, "global_step": 175329, "epoch": 1043} {"train_loss": -10.78257942199707, "global_step": 175330, "epoch": 1043} {"train_loss": -10.892374038696289, "global_step": 175331, "epoch": 1043} {"train_loss": -10.909059524536133, "global_step": 175332, "epoch": 1043} {"train_loss": -11.049997329711914, "global_step": 175333, "epoch": 1043} {"train_loss": -10.734821319580078, "global_step": 175334, "epoch": 1043} {"train_loss": -10.883737564086914, "global_step": 175335, "epoch": 1043} {"train_loss": -10.85603141784668, "global_step": 175336, "epoch": 1043} {"train_loss": -10.921412467956543, "global_step": 175337, "epoch": 1043} {"train_loss": -10.831304550170898, "global_step": 175338, "epoch": 1043} {"train_loss": -11.091429710388184, "global_step": 175339, "epoch": 1043} {"train_loss": -11.109295845031738, "global_step": 175340, "epoch": 1043} {"train_loss": -11.178678512573242, "global_step": 175341, "epoch": 1043} {"train_loss": -11.030282974243164, "global_step": 175342, "epoch": 1043} {"train_loss": -11.160747528076172, "global_step": 175343, "epoch": 1043} {"train_loss": -11.386961936950684, "global_step": 175344, "epoch": 1043} {"train_loss": -11.232076644897461, "global_step": 175345, "epoch": 1043} {"train_loss": -11.180876731872559, "global_step": 175346, "epoch": 1043} {"train_loss": -10.989278793334961, "global_step": 175347, "epoch": 1043} {"train_loss": -10.914108276367188, "global_step": 175348, "epoch": 1043} {"train_loss": -10.957845687866211, "global_step": 175349, "epoch": 1043} {"train_loss": -11.052633285522461, "global_step": 175350, "epoch": 1043} {"train_loss": -11.023933410644531, "global_step": 175351, "epoch": 1043} {"train_loss": -10.966079711914062, "global_step": 175352, "epoch": 1043} {"train_loss": -10.706840515136719, "global_step": 175353, "epoch": 1043} {"train_loss": -11.297783851623535, "global_step": 175354, "epoch": 1043} {"train_loss": -11.213964462280273, "global_step": 175355, "epoch": 1043} {"train_loss": -11.147161483764648, "global_step": 175356, "epoch": 1043} {"train_loss": -11.277143478393555, "global_step": 175357, "epoch": 1043} {"train_loss": -11.284196853637695, "global_step": 175358, "epoch": 1043} {"train_loss": -11.208625793457031, "global_step": 175359, "epoch": 1043} {"train_loss": -11.249031066894531, "global_step": 175360, "epoch": 1043} {"train_loss": -11.373147964477539, "global_step": 175361, "epoch": 1043} {"train_loss": -11.096556663513184, "global_step": 175362, "epoch": 1043} {"train_loss": -11.227911949157715, "global_step": 175363, "epoch": 1043} {"train_loss": -11.389533042907715, "global_step": 175364, "epoch": 1043} {"train_loss": -11.077259063720703, "global_step": 175365, "epoch": 1043} {"train_loss": -11.339864730834961, "global_step": 175366, "epoch": 1043} {"train_loss": -10.949892044067383, "global_step": 175367, "epoch": 1043} {"train_loss": -11.093133926391602, "global_step": 175368, "epoch": 1043} {"train_loss": -11.1572904586792, "global_step": 175369, "epoch": 1043} {"train_loss": -11.063915252685547, "global_step": 175370, "epoch": 1043} {"train_loss": -11.188006401062012, "global_step": 175371, "epoch": 1043} {"train_loss": -11.386892318725586, "global_step": 175372, "epoch": 1043} {"train_loss": -11.069236755371094, "global_step": 175373, "epoch": 1043} {"train_loss": -11.207969665527344, "global_step": 175374, "epoch": 1043} {"train_loss": -11.494787216186523, "global_step": 175375, "epoch": 1043} {"train_loss": -11.435842514038086, "global_step": 175376, "epoch": 1043} {"train_loss": -11.30174732208252, "global_step": 175377, "epoch": 1043} {"train_loss": -11.131731986999512, "global_step": 175378, "epoch": 1043} {"train_loss": -11.356822967529297, "global_step": 175379, "epoch": 1043} {"train_loss": -11.44815444946289, "global_step": 175380, "epoch": 1043} {"train_loss": -11.243108749389648, "global_step": 175381, "epoch": 1043} {"train_loss": -11.261930465698242, "global_step": 175382, "epoch": 1043} {"train_loss": -11.309680938720703, "global_step": 175383, "epoch": 1043} {"train_loss": -10.9219970703125, "global_step": 175384, "epoch": 1043} {"train_loss": -11.371145248413086, "global_step": 175385, "epoch": 1043} {"train_loss": -11.038177490234375, "global_step": 175386, "epoch": 1043} {"train_loss": -10.921616554260254, "global_step": 175387, "epoch": 1043} {"train_loss": -11.38231086730957, "global_step": 175388, "epoch": 1043} {"train_loss": -10.852559089660645, "global_step": 175389, "epoch": 1043} {"train_loss": -11.277920722961426, "global_step": 175390, "epoch": 1043} {"train_loss": -10.879460306394668, "global_step": 175391, "epoch": 1043, "val_loss": 242843.234375} {"train_loss": -10.96042251586914, "global_step": 175392, "epoch": 1044} {"train_loss": -11.286520004272461, "global_step": 175393, "epoch": 1044} {"train_loss": -11.16713809967041, "global_step": 175394, "epoch": 1044} {"train_loss": -11.269939422607422, "global_step": 175395, "epoch": 1044} {"train_loss": -10.949553489685059, "global_step": 175396, "epoch": 1044} {"train_loss": -11.362881660461426, "global_step": 175397, "epoch": 1044} {"train_loss": -11.177563667297363, "global_step": 175398, "epoch": 1044} {"train_loss": -11.160057067871094, "global_step": 175399, "epoch": 1044} {"train_loss": -11.479288101196289, "global_step": 175400, "epoch": 1044} {"train_loss": -11.18443489074707, "global_step": 175401, "epoch": 1044} {"train_loss": -11.063323974609375, "global_step": 175402, "epoch": 1044} {"train_loss": -11.134815216064453, "global_step": 175403, "epoch": 1044} {"train_loss": -10.991561889648438, "global_step": 175404, "epoch": 1044} {"train_loss": -10.969310760498047, "global_step": 175405, "epoch": 1044} {"train_loss": -11.053349494934082, "global_step": 175406, "epoch": 1044} {"train_loss": -11.263029098510742, "global_step": 175407, "epoch": 1044} {"train_loss": -10.923486709594727, "global_step": 175408, "epoch": 1044} {"train_loss": -10.819177627563477, "global_step": 175409, "epoch": 1044} {"train_loss": -11.459037780761719, "global_step": 175410, "epoch": 1044} {"train_loss": -10.911523818969727, "global_step": 175411, "epoch": 1044} {"train_loss": -11.490621566772461, "global_step": 175412, "epoch": 1044} {"train_loss": -11.129247665405273, "global_step": 175413, "epoch": 1044} {"train_loss": -10.583919525146484, "global_step": 175414, "epoch": 1044} {"train_loss": -11.152175903320312, "global_step": 175415, "epoch": 1044} {"train_loss": -10.748865127563477, "global_step": 175416, "epoch": 1044} {"train_loss": -10.862058639526367, "global_step": 175417, "epoch": 1044} {"train_loss": -11.07563591003418, "global_step": 175418, "epoch": 1044} {"train_loss": -10.285367012023926, "global_step": 175419, "epoch": 1044} {"train_loss": -11.241907119750977, "global_step": 175420, "epoch": 1044} {"train_loss": -11.043756484985352, "global_step": 175421, "epoch": 1044} {"train_loss": -10.550853729248047, "global_step": 175422, "epoch": 1044} {"train_loss": -11.34473991394043, "global_step": 175423, "epoch": 1044} {"train_loss": -10.784747123718262, "global_step": 175424, "epoch": 1044} {"train_loss": -11.073287010192871, "global_step": 175425, "epoch": 1044} {"train_loss": -10.684162139892578, "global_step": 175426, "epoch": 1044} {"train_loss": -10.667844772338867, "global_step": 175427, "epoch": 1044} {"train_loss": -11.188133239746094, "global_step": 175428, "epoch": 1044} {"train_loss": -10.204248428344727, "global_step": 175429, "epoch": 1044} {"train_loss": -10.745168685913086, "global_step": 175430, "epoch": 1044} {"train_loss": -10.147806167602539, "global_step": 175431, "epoch": 1044} {"train_loss": -9.914627075195312, "global_step": 175432, "epoch": 1044} {"train_loss": -10.349228858947754, "global_step": 175433, "epoch": 1044} {"train_loss": -11.192167282104492, "global_step": 175434, "epoch": 1044} {"train_loss": -10.495559692382812, "global_step": 175435, "epoch": 1044} {"train_loss": -10.729098320007324, "global_step": 175436, "epoch": 1044} {"train_loss": -10.478029251098633, "global_step": 175437, "epoch": 1044} {"train_loss": -10.51144790649414, "global_step": 175438, "epoch": 1044} {"train_loss": -10.65278434753418, "global_step": 175439, "epoch": 1044} {"train_loss": -10.460041046142578, "global_step": 175440, "epoch": 1044} {"train_loss": -10.545120239257812, "global_step": 175441, "epoch": 1044} {"train_loss": -10.454544067382812, "global_step": 175442, "epoch": 1044} {"train_loss": -10.236212730407715, "global_step": 175443, "epoch": 1044} {"train_loss": -10.443180084228516, "global_step": 175444, "epoch": 1044} {"train_loss": -10.711698532104492, "global_step": 175445, "epoch": 1044} {"train_loss": -10.373181343078613, "global_step": 175446, "epoch": 1044} {"train_loss": -10.725990295410156, "global_step": 175447, "epoch": 1044} {"train_loss": -10.506064414978027, "global_step": 175448, "epoch": 1044} {"train_loss": -10.873146057128906, "global_step": 175449, "epoch": 1044} {"train_loss": -10.568134307861328, "global_step": 175450, "epoch": 1044} {"train_loss": -10.649653434753418, "global_step": 175451, "epoch": 1044} {"train_loss": -10.877391815185547, "global_step": 175452, "epoch": 1044} {"train_loss": -10.882905960083008, "global_step": 175453, "epoch": 1044} {"train_loss": -10.738645553588867, "global_step": 175454, "epoch": 1044} {"train_loss": -11.067985534667969, "global_step": 175455, "epoch": 1044} {"train_loss": -10.805309295654297, "global_step": 175456, "epoch": 1044} {"train_loss": -10.934274673461914, "global_step": 175457, "epoch": 1044} {"train_loss": -10.773550033569336, "global_step": 175458, "epoch": 1044} {"train_loss": -11.023269653320312, "global_step": 175459, "epoch": 1044} {"train_loss": -10.85378646850586, "global_step": 175460, "epoch": 1044} {"train_loss": -10.886138916015625, "global_step": 175461, "epoch": 1044} {"train_loss": -10.879980087280273, "global_step": 175462, "epoch": 1044} {"train_loss": -11.08155632019043, "global_step": 175463, "epoch": 1044} {"train_loss": -11.229862213134766, "global_step": 175464, "epoch": 1044} {"train_loss": -11.212902069091797, "global_step": 175465, "epoch": 1044} {"train_loss": -10.973556518554688, "global_step": 175466, "epoch": 1044} {"train_loss": -11.148258209228516, "global_step": 175467, "epoch": 1044} {"train_loss": -11.054215431213379, "global_step": 175468, "epoch": 1044} {"train_loss": -11.092575073242188, "global_step": 175469, "epoch": 1044} {"train_loss": -11.270768165588379, "global_step": 175470, "epoch": 1044} {"train_loss": -11.06646728515625, "global_step": 175471, "epoch": 1044} {"train_loss": -11.397296905517578, "global_step": 175472, "epoch": 1044} {"train_loss": -11.254749298095703, "global_step": 175473, "epoch": 1044} {"train_loss": -11.318669319152832, "global_step": 175474, "epoch": 1044} {"train_loss": -10.918779373168945, "global_step": 175475, "epoch": 1044} {"train_loss": -11.093475341796875, "global_step": 175476, "epoch": 1044} {"train_loss": -11.257245063781738, "global_step": 175477, "epoch": 1044} {"train_loss": -11.085626602172852, "global_step": 175478, "epoch": 1044} {"train_loss": -11.199432373046875, "global_step": 175479, "epoch": 1044} {"train_loss": -11.138420104980469, "global_step": 175480, "epoch": 1044} {"train_loss": -11.251829147338867, "global_step": 175481, "epoch": 1044} {"train_loss": -11.308551788330078, "global_step": 175482, "epoch": 1044} {"train_loss": -11.406872749328613, "global_step": 175483, "epoch": 1044} {"train_loss": -11.14234447479248, "global_step": 175484, "epoch": 1044} {"train_loss": -11.332852363586426, "global_step": 175485, "epoch": 1044} {"train_loss": -11.2124605178833, "global_step": 175486, "epoch": 1044} {"train_loss": -11.080584526062012, "global_step": 175487, "epoch": 1044} {"train_loss": -11.328964233398438, "global_step": 175488, "epoch": 1044} {"train_loss": -11.182624816894531, "global_step": 175489, "epoch": 1044} {"train_loss": -11.256187438964844, "global_step": 175490, "epoch": 1044} {"train_loss": -11.176435470581055, "global_step": 175491, "epoch": 1044} {"train_loss": -10.805864334106445, "global_step": 175492, "epoch": 1044} {"train_loss": -11.41262435913086, "global_step": 175493, "epoch": 1044} {"train_loss": -10.797990798950195, "global_step": 175494, "epoch": 1044} {"train_loss": -11.265250205993652, "global_step": 175495, "epoch": 1044} {"train_loss": -10.703104019165039, "global_step": 175496, "epoch": 1044} {"train_loss": -11.3797025680542, "global_step": 175497, "epoch": 1044} {"train_loss": -11.06036376953125, "global_step": 175498, "epoch": 1044} {"train_loss": -10.868854522705078, "global_step": 175499, "epoch": 1044} {"train_loss": -10.95195198059082, "global_step": 175500, "epoch": 1044} {"train_loss": -10.920077323913574, "global_step": 175501, "epoch": 1044} {"train_loss": -11.172529220581055, "global_step": 175502, "epoch": 1044} {"train_loss": -11.052865982055664, "global_step": 175503, "epoch": 1044} {"train_loss": -11.215957641601562, "global_step": 175504, "epoch": 1044} {"train_loss": -11.316590309143066, "global_step": 175505, "epoch": 1044} {"train_loss": -10.888908386230469, "global_step": 175506, "epoch": 1044} {"train_loss": -11.221736907958984, "global_step": 175507, "epoch": 1044} {"train_loss": -11.154550552368164, "global_step": 175508, "epoch": 1044} {"train_loss": -11.382913589477539, "global_step": 175509, "epoch": 1044} {"train_loss": -11.094887733459473, "global_step": 175510, "epoch": 1044} {"train_loss": -11.00157356262207, "global_step": 175511, "epoch": 1044} {"train_loss": -11.077722549438477, "global_step": 175512, "epoch": 1044} {"train_loss": -10.555085182189941, "global_step": 175513, "epoch": 1044} {"train_loss": -10.399042129516602, "global_step": 175514, "epoch": 1044} {"train_loss": -10.881854057312012, "global_step": 175515, "epoch": 1044} {"train_loss": -10.277021408081055, "global_step": 175516, "epoch": 1044} {"train_loss": -10.656344413757324, "global_step": 175517, "epoch": 1044} {"train_loss": -10.764610290527344, "global_step": 175518, "epoch": 1044} {"train_loss": -10.464250564575195, "global_step": 175519, "epoch": 1044} {"train_loss": -10.647537231445312, "global_step": 175520, "epoch": 1044} {"train_loss": -10.737570762634277, "global_step": 175521, "epoch": 1044} {"train_loss": -10.068241119384766, "global_step": 175522, "epoch": 1044} {"train_loss": -10.804804801940918, "global_step": 175523, "epoch": 1044} {"train_loss": -10.468128204345703, "global_step": 175524, "epoch": 1044} {"train_loss": -10.866606712341309, "global_step": 175525, "epoch": 1044} {"train_loss": -10.562414169311523, "global_step": 175526, "epoch": 1044} {"train_loss": -10.93535041809082, "global_step": 175527, "epoch": 1044} {"train_loss": -10.447718620300293, "global_step": 175528, "epoch": 1044} {"train_loss": -10.819476127624512, "global_step": 175529, "epoch": 1044} {"train_loss": -10.892007827758789, "global_step": 175530, "epoch": 1044} {"train_loss": -10.869173049926758, "global_step": 175531, "epoch": 1044} {"train_loss": -10.656537055969238, "global_step": 175532, "epoch": 1044} {"train_loss": -11.247976303100586, "global_step": 175533, "epoch": 1044} {"train_loss": -10.805278778076172, "global_step": 175534, "epoch": 1044} {"train_loss": -11.071505546569824, "global_step": 175535, "epoch": 1044} {"train_loss": -11.359054565429688, "global_step": 175536, "epoch": 1044} {"train_loss": -11.182029724121094, "global_step": 175537, "epoch": 1044} {"train_loss": -11.158111572265625, "global_step": 175538, "epoch": 1044} {"train_loss": -11.236085891723633, "global_step": 175539, "epoch": 1044} {"train_loss": -11.05974006652832, "global_step": 175540, "epoch": 1044} {"train_loss": -11.448713302612305, "global_step": 175541, "epoch": 1044} {"train_loss": -11.275321006774902, "global_step": 175542, "epoch": 1044} {"train_loss": -11.125679969787598, "global_step": 175543, "epoch": 1044} {"train_loss": -11.355087280273438, "global_step": 175544, "epoch": 1044} {"train_loss": -11.179681777954102, "global_step": 175545, "epoch": 1044} {"train_loss": -11.29915714263916, "global_step": 175546, "epoch": 1044} {"train_loss": -11.349066734313965, "global_step": 175547, "epoch": 1044} {"train_loss": -11.237037658691406, "global_step": 175548, "epoch": 1044} {"train_loss": -11.28744888305664, "global_step": 175549, "epoch": 1044} {"train_loss": -11.24711799621582, "global_step": 175550, "epoch": 1044} {"train_loss": -11.303311347961426, "global_step": 175551, "epoch": 1044} {"train_loss": -11.279340744018555, "global_step": 175552, "epoch": 1044} {"train_loss": -11.26933479309082, "global_step": 175553, "epoch": 1044} {"train_loss": -11.178922653198242, "global_step": 175554, "epoch": 1044} {"train_loss": -11.262359619140625, "global_step": 175555, "epoch": 1044} {"train_loss": -11.245871543884277, "global_step": 175556, "epoch": 1044} {"train_loss": -11.2559232711792, "global_step": 175557, "epoch": 1044} {"train_loss": -11.477198600769043, "global_step": 175558, "epoch": 1044} {"train_loss": -10.97406618368058, "global_step": 175559, "epoch": 1044, "val_loss": 245519.171875} {"train_loss": -11.195655822753906, "global_step": 175560, "epoch": 1045} {"train_loss": -11.357311248779297, "global_step": 175561, "epoch": 1045} {"train_loss": -10.686027526855469, "global_step": 175562, "epoch": 1045} {"train_loss": -11.004066467285156, "global_step": 175563, "epoch": 1045} {"train_loss": -10.45242691040039, "global_step": 175564, "epoch": 1045} {"train_loss": -10.554179191589355, "global_step": 175565, "epoch": 1045} {"train_loss": -10.751544952392578, "global_step": 175566, "epoch": 1045} {"train_loss": -10.581965446472168, "global_step": 175567, "epoch": 1045} {"train_loss": -10.943334579467773, "global_step": 175568, "epoch": 1045} {"train_loss": -10.075859069824219, "global_step": 175569, "epoch": 1045} {"train_loss": -10.360607147216797, "global_step": 175570, "epoch": 1045} {"train_loss": -10.092426300048828, "global_step": 175571, "epoch": 1045} {"train_loss": -10.477849960327148, "global_step": 175572, "epoch": 1045} {"train_loss": -11.046711921691895, "global_step": 175573, "epoch": 1045} {"train_loss": -9.609360694885254, "global_step": 175574, "epoch": 1045} {"train_loss": -10.35218334197998, "global_step": 175575, "epoch": 1045} {"train_loss": -9.465984344482422, "global_step": 175576, "epoch": 1045} {"train_loss": -9.413166046142578, "global_step": 175577, "epoch": 1045} {"train_loss": -10.888431549072266, "global_step": 175578, "epoch": 1045} {"train_loss": -9.17261791229248, "global_step": 175579, "epoch": 1045} {"train_loss": -10.612354278564453, "global_step": 175580, "epoch": 1045} {"train_loss": -9.720207214355469, "global_step": 175581, "epoch": 1045} {"train_loss": -10.384600639343262, "global_step": 175582, "epoch": 1045} {"train_loss": -10.608631134033203, "global_step": 175583, "epoch": 1045} {"train_loss": -10.46995735168457, "global_step": 175584, "epoch": 1045} {"train_loss": -10.992975234985352, "global_step": 175585, "epoch": 1045} {"train_loss": -10.410552024841309, "global_step": 175586, "epoch": 1045} {"train_loss": -10.70217227935791, "global_step": 175587, "epoch": 1045} {"train_loss": -10.739962577819824, "global_step": 175588, "epoch": 1045} {"train_loss": -11.000192642211914, "global_step": 175589, "epoch": 1045} {"train_loss": -10.979373931884766, "global_step": 175590, "epoch": 1045} {"train_loss": -11.046342849731445, "global_step": 175591, "epoch": 1045} {"train_loss": -10.953023910522461, "global_step": 175592, "epoch": 1045} {"train_loss": -10.970929145812988, "global_step": 175593, "epoch": 1045} {"train_loss": -10.807974815368652, "global_step": 175594, "epoch": 1045} {"train_loss": -10.990525245666504, "global_step": 175595, "epoch": 1045} {"train_loss": -10.877555847167969, "global_step": 175596, "epoch": 1045} {"train_loss": -11.176374435424805, "global_step": 175597, "epoch": 1045} {"train_loss": -11.079185485839844, "global_step": 175598, "epoch": 1045} {"train_loss": -11.136299133300781, "global_step": 175599, "epoch": 1045} {"train_loss": -11.20653247833252, "global_step": 175600, "epoch": 1045} {"train_loss": -10.969318389892578, "global_step": 175601, "epoch": 1045} {"train_loss": -11.245274543762207, "global_step": 175602, "epoch": 1045} {"train_loss": -11.143251419067383, "global_step": 175603, "epoch": 1045} {"train_loss": -11.34947681427002, "global_step": 175604, "epoch": 1045} {"train_loss": -11.198474884033203, "global_step": 175605, "epoch": 1045} {"train_loss": -11.236580848693848, "global_step": 175606, "epoch": 1045} {"train_loss": -11.209421157836914, "global_step": 175607, "epoch": 1045} {"train_loss": -11.10394287109375, "global_step": 175608, "epoch": 1045} {"train_loss": -11.266462326049805, "global_step": 175609, "epoch": 1045} {"train_loss": -11.063451766967773, "global_step": 175610, "epoch": 1045} {"train_loss": -11.129786491394043, "global_step": 175611, "epoch": 1045} {"train_loss": -11.37728500366211, "global_step": 175612, "epoch": 1045} {"train_loss": -11.35460090637207, "global_step": 175613, "epoch": 1045} {"train_loss": -11.153160095214844, "global_step": 175614, "epoch": 1045} {"train_loss": -11.254091262817383, "global_step": 175615, "epoch": 1045} {"train_loss": -11.180079460144043, "global_step": 175616, "epoch": 1045} {"train_loss": -11.342041015625, "global_step": 175617, "epoch": 1045} {"train_loss": -11.193168640136719, "global_step": 175618, "epoch": 1045} {"train_loss": -11.182060241699219, "global_step": 175619, "epoch": 1045} {"train_loss": -11.36220645904541, "global_step": 175620, "epoch": 1045} {"train_loss": -11.322957038879395, "global_step": 175621, "epoch": 1045} {"train_loss": -11.330955505371094, "global_step": 175622, "epoch": 1045} {"train_loss": -11.350828170776367, "global_step": 175623, "epoch": 1045} {"train_loss": -11.373409271240234, "global_step": 175624, "epoch": 1045} {"train_loss": -11.230754852294922, "global_step": 175625, "epoch": 1045} {"train_loss": -11.271769523620605, "global_step": 175626, "epoch": 1045} {"train_loss": -11.36784553527832, "global_step": 175627, "epoch": 1045} {"train_loss": -11.436136245727539, "global_step": 175628, "epoch": 1045} {"train_loss": -11.386310577392578, "global_step": 175629, "epoch": 1045} {"train_loss": -11.044710159301758, "global_step": 175630, "epoch": 1045} {"train_loss": -11.25187873840332, "global_step": 175631, "epoch": 1045} {"train_loss": -11.265804290771484, "global_step": 175632, "epoch": 1045} {"train_loss": -11.2570161819458, "global_step": 175633, "epoch": 1045} {"train_loss": -11.352685928344727, "global_step": 175634, "epoch": 1045} {"train_loss": -11.117231369018555, "global_step": 175635, "epoch": 1045} {"train_loss": -10.747361183166504, "global_step": 175636, "epoch": 1045} {"train_loss": -11.185359954833984, "global_step": 175637, "epoch": 1045} {"train_loss": -11.163166046142578, "global_step": 175638, "epoch": 1045} {"train_loss": -11.28637409210205, "global_step": 175639, "epoch": 1045} {"train_loss": -11.001251220703125, "global_step": 175640, "epoch": 1045} {"train_loss": -11.226768493652344, "global_step": 175641, "epoch": 1045} {"train_loss": -11.065115928649902, "global_step": 175642, "epoch": 1045} {"train_loss": -11.334159851074219, "global_step": 175643, "epoch": 1045} {"train_loss": -11.12420654296875, "global_step": 175644, "epoch": 1045} {"train_loss": -11.27069091796875, "global_step": 175645, "epoch": 1045} {"train_loss": -11.147830963134766, "global_step": 175646, "epoch": 1045} {"train_loss": -10.927197456359863, "global_step": 175647, "epoch": 1045} {"train_loss": -11.310566902160645, "global_step": 175648, "epoch": 1045} {"train_loss": -11.349258422851562, "global_step": 175649, "epoch": 1045} {"train_loss": -11.36788558959961, "global_step": 175650, "epoch": 1045} {"train_loss": -11.206790924072266, "global_step": 175651, "epoch": 1045} {"train_loss": -11.588886260986328, "global_step": 175652, "epoch": 1045} {"train_loss": -11.077618598937988, "global_step": 175653, "epoch": 1045} {"train_loss": -11.247156143188477, "global_step": 175654, "epoch": 1045} {"train_loss": -11.309797286987305, "global_step": 175655, "epoch": 1045} {"train_loss": -10.609305381774902, "global_step": 175656, "epoch": 1045} {"train_loss": -11.290782928466797, "global_step": 175657, "epoch": 1045} {"train_loss": -11.20994758605957, "global_step": 175658, "epoch": 1045} {"train_loss": -10.778509140014648, "global_step": 175659, "epoch": 1045} {"train_loss": -10.66258716583252, "global_step": 175660, "epoch": 1045} {"train_loss": -11.091024398803711, "global_step": 175661, "epoch": 1045} {"train_loss": -10.569204330444336, "global_step": 175662, "epoch": 1045} {"train_loss": -11.263654708862305, "global_step": 175663, "epoch": 1045} {"train_loss": -10.347977638244629, "global_step": 175664, "epoch": 1045} {"train_loss": -11.09764289855957, "global_step": 175665, "epoch": 1045} {"train_loss": -11.213581085205078, "global_step": 175666, "epoch": 1045} {"train_loss": -11.08967399597168, "global_step": 175667, "epoch": 1045} {"train_loss": -10.485767364501953, "global_step": 175668, "epoch": 1045} {"train_loss": -11.33026123046875, "global_step": 175669, "epoch": 1045} {"train_loss": -10.777408599853516, "global_step": 175670, "epoch": 1045} {"train_loss": -11.271608352661133, "global_step": 175671, "epoch": 1045} {"train_loss": -10.826278686523438, "global_step": 175672, "epoch": 1045} {"train_loss": -11.061868667602539, "global_step": 175673, "epoch": 1045} {"train_loss": -11.240049362182617, "global_step": 175674, "epoch": 1045} {"train_loss": -11.121357917785645, "global_step": 175675, "epoch": 1045} {"train_loss": -11.368611335754395, "global_step": 175676, "epoch": 1045} {"train_loss": -11.316564559936523, "global_step": 175677, "epoch": 1045} {"train_loss": -11.084789276123047, "global_step": 175678, "epoch": 1045} {"train_loss": -11.417226791381836, "global_step": 175679, "epoch": 1045} {"train_loss": -11.045893669128418, "global_step": 175680, "epoch": 1045} {"train_loss": -11.149003982543945, "global_step": 175681, "epoch": 1045} {"train_loss": -10.715473175048828, "global_step": 175682, "epoch": 1045} {"train_loss": -11.045324325561523, "global_step": 175683, "epoch": 1045} {"train_loss": -11.127270698547363, "global_step": 175684, "epoch": 1045} {"train_loss": -10.428031921386719, "global_step": 175685, "epoch": 1045} {"train_loss": -11.217758178710938, "global_step": 175686, "epoch": 1045} {"train_loss": -10.931686401367188, "global_step": 175687, "epoch": 1045} {"train_loss": -11.105084419250488, "global_step": 175688, "epoch": 1045} {"train_loss": -10.695661544799805, "global_step": 175689, "epoch": 1045} {"train_loss": -10.107105255126953, "global_step": 175690, "epoch": 1045} {"train_loss": -11.457056045532227, "global_step": 175691, "epoch": 1045} {"train_loss": -10.626995086669922, "global_step": 175692, "epoch": 1045} {"train_loss": -11.174005508422852, "global_step": 175693, "epoch": 1045} {"train_loss": -11.216781616210938, "global_step": 175694, "epoch": 1045} {"train_loss": -11.064306259155273, "global_step": 175695, "epoch": 1045} {"train_loss": -11.167381286621094, "global_step": 175696, "epoch": 1045} {"train_loss": -10.84005355834961, "global_step": 175697, "epoch": 1045} {"train_loss": -11.072280883789062, "global_step": 175698, "epoch": 1045} {"train_loss": -11.271495819091797, "global_step": 175699, "epoch": 1045} {"train_loss": -11.188015937805176, "global_step": 175700, "epoch": 1045} {"train_loss": -11.215166091918945, "global_step": 175701, "epoch": 1045} {"train_loss": -11.170724868774414, "global_step": 175702, "epoch": 1045} {"train_loss": -11.196008682250977, "global_step": 175703, "epoch": 1045} {"train_loss": -11.361749649047852, "global_step": 175704, "epoch": 1045} {"train_loss": -11.236117362976074, "global_step": 175705, "epoch": 1045} {"train_loss": -11.378182411193848, "global_step": 175706, "epoch": 1045} {"train_loss": -11.17521858215332, "global_step": 175707, "epoch": 1045} {"train_loss": -11.416949272155762, "global_step": 175708, "epoch": 1045} {"train_loss": -11.164802551269531, "global_step": 175709, "epoch": 1045} {"train_loss": -11.398025512695312, "global_step": 175710, "epoch": 1045} {"train_loss": -11.25658130645752, "global_step": 175711, "epoch": 1045} {"train_loss": -11.312849044799805, "global_step": 175712, "epoch": 1045} {"train_loss": -11.407276153564453, "global_step": 175713, "epoch": 1045} {"train_loss": -11.093252182006836, "global_step": 175714, "epoch": 1045} {"train_loss": -11.40653133392334, "global_step": 175715, "epoch": 1045} {"train_loss": -11.080232620239258, "global_step": 175716, "epoch": 1045} {"train_loss": -11.304689407348633, "global_step": 175717, "epoch": 1045} {"train_loss": -11.597759246826172, "global_step": 175718, "epoch": 1045} {"train_loss": -11.108173370361328, "global_step": 175719, "epoch": 1045} {"train_loss": -11.27680778503418, "global_step": 175720, "epoch": 1045} {"train_loss": -11.2391939163208, "global_step": 175721, "epoch": 1045} {"train_loss": -11.300981521606445, "global_step": 175722, "epoch": 1045} {"train_loss": -11.002998352050781, "global_step": 175723, "epoch": 1045} {"train_loss": -11.270453453063965, "global_step": 175724, "epoch": 1045} {"train_loss": -11.307289123535156, "global_step": 175725, "epoch": 1045} {"train_loss": -11.32101058959961, "global_step": 175726, "epoch": 1045} {"train_loss": -11.023006166730609, "global_step": 175727, "epoch": 1045, "val_loss": 243198.109375, "train_action_mse_error": 0.39789068698883057} {"train_loss": -11.351306915283203, "global_step": 175728, "epoch": 1046} {"train_loss": -10.953750610351562, "global_step": 175729, "epoch": 1046} {"train_loss": -10.841740608215332, "global_step": 175730, "epoch": 1046} {"train_loss": -11.024700164794922, "global_step": 175731, "epoch": 1046} {"train_loss": -11.20462417602539, "global_step": 175732, "epoch": 1046} {"train_loss": -10.873211860656738, "global_step": 175733, "epoch": 1046} {"train_loss": -10.159233093261719, "global_step": 175734, "epoch": 1046} {"train_loss": -10.656013488769531, "global_step": 175735, "epoch": 1046} {"train_loss": -11.085179328918457, "global_step": 175736, "epoch": 1046} {"train_loss": -9.751371383666992, "global_step": 175737, "epoch": 1046} {"train_loss": -10.956022262573242, "global_step": 175738, "epoch": 1046} {"train_loss": -10.905097961425781, "global_step": 175739, "epoch": 1046} {"train_loss": -10.567728042602539, "global_step": 175740, "epoch": 1046} {"train_loss": -10.859752655029297, "global_step": 175741, "epoch": 1046} {"train_loss": -10.518182754516602, "global_step": 175742, "epoch": 1046} {"train_loss": -10.790461540222168, "global_step": 175743, "epoch": 1046} {"train_loss": -10.501083374023438, "global_step": 175744, "epoch": 1046} {"train_loss": -10.845682144165039, "global_step": 175745, "epoch": 1046} {"train_loss": -10.140512466430664, "global_step": 175746, "epoch": 1046} {"train_loss": -11.034324645996094, "global_step": 175747, "epoch": 1046} {"train_loss": -10.57974624633789, "global_step": 175748, "epoch": 1046} {"train_loss": -11.147058486938477, "global_step": 175749, "epoch": 1046} {"train_loss": -10.699352264404297, "global_step": 175750, "epoch": 1046} {"train_loss": -11.01667594909668, "global_step": 175751, "epoch": 1046} {"train_loss": -10.640129089355469, "global_step": 175752, "epoch": 1046} {"train_loss": -10.937089920043945, "global_step": 175753, "epoch": 1046} {"train_loss": -11.04861831665039, "global_step": 175754, "epoch": 1046} {"train_loss": -10.384256362915039, "global_step": 175755, "epoch": 1046} {"train_loss": -11.067656517028809, "global_step": 175756, "epoch": 1046} {"train_loss": -10.550564765930176, "global_step": 175757, "epoch": 1046} {"train_loss": -11.132049560546875, "global_step": 175758, "epoch": 1046} {"train_loss": -10.406290054321289, "global_step": 175759, "epoch": 1046} {"train_loss": -11.00516414642334, "global_step": 175760, "epoch": 1046} {"train_loss": -10.464794158935547, "global_step": 175761, "epoch": 1046} {"train_loss": -10.911581039428711, "global_step": 175762, "epoch": 1046} {"train_loss": -10.684967041015625, "global_step": 175763, "epoch": 1046} {"train_loss": -10.867103576660156, "global_step": 175764, "epoch": 1046} {"train_loss": -10.489097595214844, "global_step": 175765, "epoch": 1046} {"train_loss": -10.995967864990234, "global_step": 175766, "epoch": 1046} {"train_loss": -10.168804168701172, "global_step": 175767, "epoch": 1046} {"train_loss": -11.076250076293945, "global_step": 175768, "epoch": 1046} {"train_loss": -10.391457557678223, "global_step": 175769, "epoch": 1046} {"train_loss": -10.782122611999512, "global_step": 175770, "epoch": 1046} {"train_loss": -10.836501121520996, "global_step": 175771, "epoch": 1046} {"train_loss": -10.815573692321777, "global_step": 175772, "epoch": 1046} {"train_loss": -10.747734069824219, "global_step": 175773, "epoch": 1046} {"train_loss": -10.883975982666016, "global_step": 175774, "epoch": 1046} {"train_loss": -10.987369537353516, "global_step": 175775, "epoch": 1046} {"train_loss": -11.25317096710205, "global_step": 175776, "epoch": 1046} {"train_loss": -10.90138053894043, "global_step": 175777, "epoch": 1046} {"train_loss": -11.260290145874023, "global_step": 175778, "epoch": 1046} {"train_loss": -11.073488235473633, "global_step": 175779, "epoch": 1046} {"train_loss": -11.280056953430176, "global_step": 175780, "epoch": 1046} {"train_loss": -11.243563652038574, "global_step": 175781, "epoch": 1046} {"train_loss": -11.263053894042969, "global_step": 175782, "epoch": 1046} {"train_loss": -11.05763053894043, "global_step": 175783, "epoch": 1046} {"train_loss": -11.000113487243652, "global_step": 175784, "epoch": 1046} {"train_loss": -11.250791549682617, "global_step": 175785, "epoch": 1046} {"train_loss": -11.20370864868164, "global_step": 175786, "epoch": 1046} {"train_loss": -10.99815559387207, "global_step": 175787, "epoch": 1046} {"train_loss": -11.338973999023438, "global_step": 175788, "epoch": 1046} {"train_loss": -11.278047561645508, "global_step": 175789, "epoch": 1046} {"train_loss": -11.042421340942383, "global_step": 175790, "epoch": 1046} {"train_loss": -11.087573051452637, "global_step": 175791, "epoch": 1046} {"train_loss": -11.170639991760254, "global_step": 175792, "epoch": 1046} {"train_loss": -11.292677879333496, "global_step": 175793, "epoch": 1046} {"train_loss": -11.226808547973633, "global_step": 175794, "epoch": 1046} {"train_loss": -11.06431770324707, "global_step": 175795, "epoch": 1046} {"train_loss": -11.158231735229492, "global_step": 175796, "epoch": 1046} {"train_loss": -11.296009063720703, "global_step": 175797, "epoch": 1046} {"train_loss": -11.150981903076172, "global_step": 175798, "epoch": 1046} {"train_loss": -11.392352104187012, "global_step": 175799, "epoch": 1046} {"train_loss": -11.235612869262695, "global_step": 175800, "epoch": 1046} {"train_loss": -11.161961555480957, "global_step": 175801, "epoch": 1046} {"train_loss": -11.36538314819336, "global_step": 175802, "epoch": 1046} {"train_loss": -11.283772468566895, "global_step": 175803, "epoch": 1046} {"train_loss": -11.27398681640625, "global_step": 175804, "epoch": 1046} {"train_loss": -11.004671096801758, "global_step": 175805, "epoch": 1046} {"train_loss": -11.313350677490234, "global_step": 175806, "epoch": 1046} {"train_loss": -11.213083267211914, "global_step": 175807, "epoch": 1046} {"train_loss": -11.358125686645508, "global_step": 175808, "epoch": 1046} {"train_loss": -11.166747093200684, "global_step": 175809, "epoch": 1046} {"train_loss": -11.357057571411133, "global_step": 175810, "epoch": 1046} {"train_loss": -11.104873657226562, "global_step": 175811, "epoch": 1046} {"train_loss": -11.179388999938965, "global_step": 175812, "epoch": 1046} {"train_loss": -11.030806541442871, "global_step": 175813, "epoch": 1046} {"train_loss": -11.430595397949219, "global_step": 175814, "epoch": 1046} {"train_loss": -11.149112701416016, "global_step": 175815, "epoch": 1046} {"train_loss": -11.409324645996094, "global_step": 175816, "epoch": 1046} {"train_loss": -11.396656036376953, "global_step": 175817, "epoch": 1046} {"train_loss": -11.257019996643066, "global_step": 175818, "epoch": 1046} {"train_loss": -11.493767738342285, "global_step": 175819, "epoch": 1046} {"train_loss": -10.40005111694336, "global_step": 175820, "epoch": 1046} {"train_loss": -11.270176887512207, "global_step": 175821, "epoch": 1046} {"train_loss": -11.133756637573242, "global_step": 175822, "epoch": 1046} {"train_loss": -11.02686882019043, "global_step": 175823, "epoch": 1046} {"train_loss": -10.974380493164062, "global_step": 175824, "epoch": 1046} {"train_loss": -11.095165252685547, "global_step": 175825, "epoch": 1046} {"train_loss": -11.33987808227539, "global_step": 175826, "epoch": 1046} {"train_loss": -11.200804710388184, "global_step": 175827, "epoch": 1046} {"train_loss": -11.056655883789062, "global_step": 175828, "epoch": 1046} {"train_loss": -11.111223220825195, "global_step": 175829, "epoch": 1046} {"train_loss": -10.976357460021973, "global_step": 175830, "epoch": 1046} {"train_loss": -11.148313522338867, "global_step": 175831, "epoch": 1046} {"train_loss": -11.193885803222656, "global_step": 175832, "epoch": 1046} {"train_loss": -11.251131057739258, "global_step": 175833, "epoch": 1046} {"train_loss": -11.20188045501709, "global_step": 175834, "epoch": 1046} {"train_loss": -10.228344917297363, "global_step": 175835, "epoch": 1046} {"train_loss": -11.101683616638184, "global_step": 175836, "epoch": 1046} {"train_loss": -10.621538162231445, "global_step": 175837, "epoch": 1046} {"train_loss": -10.770828247070312, "global_step": 175838, "epoch": 1046} {"train_loss": -10.82242202758789, "global_step": 175839, "epoch": 1046} {"train_loss": -10.622431755065918, "global_step": 175840, "epoch": 1046} {"train_loss": -10.86262321472168, "global_step": 175841, "epoch": 1046} {"train_loss": -10.923956871032715, "global_step": 175842, "epoch": 1046} {"train_loss": -10.928613662719727, "global_step": 175843, "epoch": 1046} {"train_loss": -10.841992378234863, "global_step": 175844, "epoch": 1046} {"train_loss": -10.908205032348633, "global_step": 175845, "epoch": 1046} {"train_loss": -11.11613941192627, "global_step": 175846, "epoch": 1046} {"train_loss": -10.716790199279785, "global_step": 175847, "epoch": 1046} {"train_loss": -11.020868301391602, "global_step": 175848, "epoch": 1046} {"train_loss": -11.095354080200195, "global_step": 175849, "epoch": 1046} {"train_loss": -10.783477783203125, "global_step": 175850, "epoch": 1046} {"train_loss": -10.989206314086914, "global_step": 175851, "epoch": 1046} {"train_loss": -11.153861999511719, "global_step": 175852, "epoch": 1046} {"train_loss": -11.070375442504883, "global_step": 175853, "epoch": 1046} {"train_loss": -10.958866119384766, "global_step": 175854, "epoch": 1046} {"train_loss": -10.694865226745605, "global_step": 175855, "epoch": 1046} {"train_loss": -10.91352367401123, "global_step": 175856, "epoch": 1046} {"train_loss": -11.16775131225586, "global_step": 175857, "epoch": 1046} {"train_loss": -10.863409042358398, "global_step": 175858, "epoch": 1046} {"train_loss": -11.133781433105469, "global_step": 175859, "epoch": 1046} {"train_loss": -10.982436180114746, "global_step": 175860, "epoch": 1046} {"train_loss": -11.276073455810547, "global_step": 175861, "epoch": 1046} {"train_loss": -10.920938491821289, "global_step": 175862, "epoch": 1046} {"train_loss": -11.207460403442383, "global_step": 175863, "epoch": 1046} {"train_loss": -10.938756942749023, "global_step": 175864, "epoch": 1046} {"train_loss": -10.883621215820312, "global_step": 175865, "epoch": 1046} {"train_loss": -11.080968856811523, "global_step": 175866, "epoch": 1046} {"train_loss": -11.147475242614746, "global_step": 175867, "epoch": 1046} {"train_loss": -11.23253059387207, "global_step": 175868, "epoch": 1046} {"train_loss": -11.031173706054688, "global_step": 175869, "epoch": 1046} {"train_loss": -10.99842643737793, "global_step": 175870, "epoch": 1046} {"train_loss": -11.117046356201172, "global_step": 175871, "epoch": 1046} {"train_loss": -11.316119194030762, "global_step": 175872, "epoch": 1046} {"train_loss": -11.272201538085938, "global_step": 175873, "epoch": 1046} {"train_loss": -11.243425369262695, "global_step": 175874, "epoch": 1046} {"train_loss": -11.355754852294922, "global_step": 175875, "epoch": 1046} {"train_loss": -11.476350784301758, "global_step": 175876, "epoch": 1046} {"train_loss": -11.482059478759766, "global_step": 175877, "epoch": 1046} {"train_loss": -11.314363479614258, "global_step": 175878, "epoch": 1046} {"train_loss": -11.400733947753906, "global_step": 175879, "epoch": 1046} {"train_loss": -11.076541900634766, "global_step": 175880, "epoch": 1046} {"train_loss": -11.449853897094727, "global_step": 175881, "epoch": 1046} {"train_loss": -11.32501220703125, "global_step": 175882, "epoch": 1046} {"train_loss": -11.279260635375977, "global_step": 175883, "epoch": 1046} {"train_loss": -11.250419616699219, "global_step": 175884, "epoch": 1046} {"train_loss": -11.383575439453125, "global_step": 175885, "epoch": 1046} {"train_loss": -11.244203567504883, "global_step": 175886, "epoch": 1046} {"train_loss": -11.197364807128906, "global_step": 175887, "epoch": 1046} {"train_loss": -11.601461410522461, "global_step": 175888, "epoch": 1046} {"train_loss": -11.299506187438965, "global_step": 175889, "epoch": 1046} {"train_loss": -11.178318977355957, "global_step": 175890, "epoch": 1046} {"train_loss": -11.641670227050781, "global_step": 175891, "epoch": 1046} {"train_loss": -11.251424789428711, "global_step": 175892, "epoch": 1046} {"train_loss": -11.098947525024414, "global_step": 175893, "epoch": 1046} {"train_loss": -11.414607048034668, "global_step": 175894, "epoch": 1046} {"train_loss": -11.032337676911126, "global_step": 175895, "epoch": 1046, "val_loss": 243774.59375} {"train_loss": -11.392027854919434, "global_step": 175896, "epoch": 1047} {"train_loss": -11.271926879882812, "global_step": 175897, "epoch": 1047} {"train_loss": -11.227560043334961, "global_step": 175898, "epoch": 1047} {"train_loss": -10.741880416870117, "global_step": 175899, "epoch": 1047} {"train_loss": -11.342246055603027, "global_step": 175900, "epoch": 1047} {"train_loss": -10.218393325805664, "global_step": 175901, "epoch": 1047} {"train_loss": -10.569934844970703, "global_step": 175902, "epoch": 1047} {"train_loss": -10.732427597045898, "global_step": 175903, "epoch": 1047} {"train_loss": -11.232666015625, "global_step": 175904, "epoch": 1047} {"train_loss": -10.24530029296875, "global_step": 175905, "epoch": 1047} {"train_loss": -10.480712890625, "global_step": 175906, "epoch": 1047} {"train_loss": -11.25716781616211, "global_step": 175907, "epoch": 1047} {"train_loss": -10.432778358459473, "global_step": 175908, "epoch": 1047} {"train_loss": -10.996231079101562, "global_step": 175909, "epoch": 1047} {"train_loss": -10.906949996948242, "global_step": 175910, "epoch": 1047} {"train_loss": -10.744632720947266, "global_step": 175911, "epoch": 1047} {"train_loss": -11.190783500671387, "global_step": 175912, "epoch": 1047} {"train_loss": -10.858681678771973, "global_step": 175913, "epoch": 1047} {"train_loss": -10.888935089111328, "global_step": 175914, "epoch": 1047} {"train_loss": -11.203353881835938, "global_step": 175915, "epoch": 1047} {"train_loss": -11.042180061340332, "global_step": 175916, "epoch": 1047} {"train_loss": -10.898809432983398, "global_step": 175917, "epoch": 1047} {"train_loss": -11.139058113098145, "global_step": 175918, "epoch": 1047} {"train_loss": -11.09251594543457, "global_step": 175919, "epoch": 1047} {"train_loss": -11.311153411865234, "global_step": 175920, "epoch": 1047} {"train_loss": -11.114436149597168, "global_step": 175921, "epoch": 1047} {"train_loss": -11.105157852172852, "global_step": 175922, "epoch": 1047} {"train_loss": -11.115012168884277, "global_step": 175923, "epoch": 1047} {"train_loss": -11.47992992401123, "global_step": 175924, "epoch": 1047} {"train_loss": -11.03697395324707, "global_step": 175925, "epoch": 1047} {"train_loss": -10.775476455688477, "global_step": 175926, "epoch": 1047} {"train_loss": -10.873502731323242, "global_step": 175927, "epoch": 1047} {"train_loss": -10.767047882080078, "global_step": 175928, "epoch": 1047} {"train_loss": -11.142411231994629, "global_step": 175929, "epoch": 1047} {"train_loss": -10.757061958312988, "global_step": 175930, "epoch": 1047} {"train_loss": -10.690549850463867, "global_step": 175931, "epoch": 1047} {"train_loss": -10.732015609741211, "global_step": 175932, "epoch": 1047} {"train_loss": -10.297767639160156, "global_step": 175933, "epoch": 1047} {"train_loss": -11.266597747802734, "global_step": 175934, "epoch": 1047} {"train_loss": -10.838258743286133, "global_step": 175935, "epoch": 1047} {"train_loss": -10.269210815429688, "global_step": 175936, "epoch": 1047} {"train_loss": -11.207198143005371, "global_step": 175937, "epoch": 1047} {"train_loss": -10.53996753692627, "global_step": 175938, "epoch": 1047} {"train_loss": -11.08745002746582, "global_step": 175939, "epoch": 1047} {"train_loss": -10.545757293701172, "global_step": 175940, "epoch": 1047} {"train_loss": -10.557605743408203, "global_step": 175941, "epoch": 1047} {"train_loss": -10.95926284790039, "global_step": 175942, "epoch": 1047} {"train_loss": -10.643261909484863, "global_step": 175943, "epoch": 1047} {"train_loss": -11.322157859802246, "global_step": 175944, "epoch": 1047} {"train_loss": -10.457906723022461, "global_step": 175945, "epoch": 1047} {"train_loss": -11.00711441040039, "global_step": 175946, "epoch": 1047} {"train_loss": -10.772710800170898, "global_step": 175947, "epoch": 1047} {"train_loss": -11.17072868347168, "global_step": 175948, "epoch": 1047} {"train_loss": -10.513853073120117, "global_step": 175949, "epoch": 1047} {"train_loss": -11.093606948852539, "global_step": 175950, "epoch": 1047} {"train_loss": -10.346456527709961, "global_step": 175951, "epoch": 1047} {"train_loss": -10.7017183303833, "global_step": 175952, "epoch": 1047} {"train_loss": -10.65388298034668, "global_step": 175953, "epoch": 1047} {"train_loss": -11.034109115600586, "global_step": 175954, "epoch": 1047} {"train_loss": -10.67841625213623, "global_step": 175955, "epoch": 1047} {"train_loss": -10.747320175170898, "global_step": 175956, "epoch": 1047} {"train_loss": -11.063241004943848, "global_step": 175957, "epoch": 1047} {"train_loss": -11.01767349243164, "global_step": 175958, "epoch": 1047} {"train_loss": -10.854522705078125, "global_step": 175959, "epoch": 1047} {"train_loss": -11.165290832519531, "global_step": 175960, "epoch": 1047} {"train_loss": -10.85578441619873, "global_step": 175961, "epoch": 1047} {"train_loss": -10.744876861572266, "global_step": 175962, "epoch": 1047} {"train_loss": -10.669734954833984, "global_step": 175963, "epoch": 1047} {"train_loss": -10.908414840698242, "global_step": 175964, "epoch": 1047} {"train_loss": -10.772910118103027, "global_step": 175965, "epoch": 1047} {"train_loss": -10.877204895019531, "global_step": 175966, "epoch": 1047} {"train_loss": -11.159305572509766, "global_step": 175967, "epoch": 1047} {"train_loss": -10.817596435546875, "global_step": 175968, "epoch": 1047} {"train_loss": -11.130610466003418, "global_step": 175969, "epoch": 1047} {"train_loss": -10.840814590454102, "global_step": 175970, "epoch": 1047} {"train_loss": -11.373106002807617, "global_step": 175971, "epoch": 1047} {"train_loss": -10.918221473693848, "global_step": 175972, "epoch": 1047} {"train_loss": -11.09181022644043, "global_step": 175973, "epoch": 1047} {"train_loss": -11.278404235839844, "global_step": 175974, "epoch": 1047} {"train_loss": -11.137587547302246, "global_step": 175975, "epoch": 1047} {"train_loss": -11.173905372619629, "global_step": 175976, "epoch": 1047} {"train_loss": -11.325881004333496, "global_step": 175977, "epoch": 1047} {"train_loss": -11.25661849975586, "global_step": 175978, "epoch": 1047} {"train_loss": -11.380603790283203, "global_step": 175979, "epoch": 1047} {"train_loss": -11.274913787841797, "global_step": 175980, "epoch": 1047} {"train_loss": -11.39577865600586, "global_step": 175981, "epoch": 1047} {"train_loss": -11.512194633483887, "global_step": 175982, "epoch": 1047} {"train_loss": -11.229766845703125, "global_step": 175983, "epoch": 1047} {"train_loss": -11.057097434997559, "global_step": 175984, "epoch": 1047} {"train_loss": -11.002701759338379, "global_step": 175985, "epoch": 1047} {"train_loss": -11.312813758850098, "global_step": 175986, "epoch": 1047} {"train_loss": -11.495233535766602, "global_step": 175987, "epoch": 1047} {"train_loss": -11.303890228271484, "global_step": 175988, "epoch": 1047} {"train_loss": -11.454360961914062, "global_step": 175989, "epoch": 1047} {"train_loss": -11.31686019897461, "global_step": 175990, "epoch": 1047} {"train_loss": -10.816055297851562, "global_step": 175991, "epoch": 1047} {"train_loss": -11.42915153503418, "global_step": 175992, "epoch": 1047} {"train_loss": -10.856094360351562, "global_step": 175993, "epoch": 1047} {"train_loss": -11.06126594543457, "global_step": 175994, "epoch": 1047} {"train_loss": -11.422723770141602, "global_step": 175995, "epoch": 1047} {"train_loss": -10.663515090942383, "global_step": 175996, "epoch": 1047} {"train_loss": -11.271190643310547, "global_step": 175997, "epoch": 1047} {"train_loss": -11.27270793914795, "global_step": 175998, "epoch": 1047} {"train_loss": -11.312296867370605, "global_step": 175999, "epoch": 1047} {"train_loss": -11.25776195526123, "global_step": 176000, "epoch": 1047} {"train_loss": -11.20543384552002, "global_step": 176001, "epoch": 1047} {"train_loss": -10.955148696899414, "global_step": 176002, "epoch": 1047} {"train_loss": -10.909313201904297, "global_step": 176003, "epoch": 1047} {"train_loss": -11.193662643432617, "global_step": 176004, "epoch": 1047} {"train_loss": -10.549352645874023, "global_step": 176005, "epoch": 1047} {"train_loss": -10.898111343383789, "global_step": 176006, "epoch": 1047} {"train_loss": -11.144370079040527, "global_step": 176007, "epoch": 1047} {"train_loss": -10.564247131347656, "global_step": 176008, "epoch": 1047} {"train_loss": -10.848925590515137, "global_step": 176009, "epoch": 1047} {"train_loss": -10.768659591674805, "global_step": 176010, "epoch": 1047} {"train_loss": -11.321218490600586, "global_step": 176011, "epoch": 1047} {"train_loss": -10.858478546142578, "global_step": 176012, "epoch": 1047} {"train_loss": -11.407023429870605, "global_step": 176013, "epoch": 1047} {"train_loss": -11.135738372802734, "global_step": 176014, "epoch": 1047} {"train_loss": -11.30229377746582, "global_step": 176015, "epoch": 1047} {"train_loss": -11.600629806518555, "global_step": 176016, "epoch": 1047} {"train_loss": -11.089056968688965, "global_step": 176017, "epoch": 1047} {"train_loss": -11.181912422180176, "global_step": 176018, "epoch": 1047} {"train_loss": -11.18514633178711, "global_step": 176019, "epoch": 1047} {"train_loss": -11.439929962158203, "global_step": 176020, "epoch": 1047} {"train_loss": -11.31678581237793, "global_step": 176021, "epoch": 1047} {"train_loss": -11.36619758605957, "global_step": 176022, "epoch": 1047} {"train_loss": -11.259522438049316, "global_step": 176023, "epoch": 1047} {"train_loss": -11.173662185668945, "global_step": 176024, "epoch": 1047} {"train_loss": -11.239145278930664, "global_step": 176025, "epoch": 1047} {"train_loss": -11.239266395568848, "global_step": 176026, "epoch": 1047} {"train_loss": -11.159027099609375, "global_step": 176027, "epoch": 1047} {"train_loss": -11.078105926513672, "global_step": 176028, "epoch": 1047} {"train_loss": -10.509103775024414, "global_step": 176029, "epoch": 1047} {"train_loss": -11.317219734191895, "global_step": 176030, "epoch": 1047} {"train_loss": -10.433359146118164, "global_step": 176031, "epoch": 1047} {"train_loss": -10.861932754516602, "global_step": 176032, "epoch": 1047} {"train_loss": -10.616086959838867, "global_step": 176033, "epoch": 1047} {"train_loss": -10.649250030517578, "global_step": 176034, "epoch": 1047} {"train_loss": -11.419774055480957, "global_step": 176035, "epoch": 1047} {"train_loss": -10.584897994995117, "global_step": 176036, "epoch": 1047} {"train_loss": -11.354262351989746, "global_step": 176037, "epoch": 1047} {"train_loss": -10.7044677734375, "global_step": 176038, "epoch": 1047} {"train_loss": -11.522459030151367, "global_step": 176039, "epoch": 1047} {"train_loss": -11.136970520019531, "global_step": 176040, "epoch": 1047} {"train_loss": -11.273271560668945, "global_step": 176041, "epoch": 1047} {"train_loss": -11.185542106628418, "global_step": 176042, "epoch": 1047} {"train_loss": -10.982418060302734, "global_step": 176043, "epoch": 1047} {"train_loss": -11.404060363769531, "global_step": 176044, "epoch": 1047} {"train_loss": -10.95889949798584, "global_step": 176045, "epoch": 1047} {"train_loss": -10.709997177124023, "global_step": 176046, "epoch": 1047} {"train_loss": -11.253506660461426, "global_step": 176047, "epoch": 1047} {"train_loss": -10.860139846801758, "global_step": 176048, "epoch": 1047} {"train_loss": -11.157388687133789, "global_step": 176049, "epoch": 1047} {"train_loss": -10.816057205200195, "global_step": 176050, "epoch": 1047} {"train_loss": -10.730911254882812, "global_step": 176051, "epoch": 1047} {"train_loss": -11.223577499389648, "global_step": 176052, "epoch": 1047} {"train_loss": -10.575295448303223, "global_step": 176053, "epoch": 1047} {"train_loss": -11.203497886657715, "global_step": 176054, "epoch": 1047} {"train_loss": -10.789260864257812, "global_step": 176055, "epoch": 1047} {"train_loss": -10.864134788513184, "global_step": 176056, "epoch": 1047} {"train_loss": -11.038593292236328, "global_step": 176057, "epoch": 1047} {"train_loss": -11.056713104248047, "global_step": 176058, "epoch": 1047} {"train_loss": -10.838150024414062, "global_step": 176059, "epoch": 1047} {"train_loss": -10.77663803100586, "global_step": 176060, "epoch": 1047} {"train_loss": -10.750054359436035, "global_step": 176061, "epoch": 1047} {"train_loss": -10.83392333984375, "global_step": 176062, "epoch": 1047} {"train_loss": -11.001936503819056, "global_step": 176063, "epoch": 1047, "val_loss": 244069.75} {"train_loss": -11.079278945922852, "global_step": 176064, "epoch": 1048} {"train_loss": -11.179883003234863, "global_step": 176065, "epoch": 1048} {"train_loss": -10.943163871765137, "global_step": 176066, "epoch": 1048} {"train_loss": -11.206212043762207, "global_step": 176067, "epoch": 1048} {"train_loss": -11.461424827575684, "global_step": 176068, "epoch": 1048} {"train_loss": -11.504776000976562, "global_step": 176069, "epoch": 1048} {"train_loss": -11.141867637634277, "global_step": 176070, "epoch": 1048} {"train_loss": -11.178200721740723, "global_step": 176071, "epoch": 1048} {"train_loss": -10.806164741516113, "global_step": 176072, "epoch": 1048} {"train_loss": -11.204910278320312, "global_step": 176073, "epoch": 1048} {"train_loss": -11.110800743103027, "global_step": 176074, "epoch": 1048} {"train_loss": -10.660301208496094, "global_step": 176075, "epoch": 1048} {"train_loss": -11.16497802734375, "global_step": 176076, "epoch": 1048} {"train_loss": -10.9683256149292, "global_step": 176077, "epoch": 1048} {"train_loss": -10.817039489746094, "global_step": 176078, "epoch": 1048} {"train_loss": -11.163469314575195, "global_step": 176079, "epoch": 1048} {"train_loss": -10.940171241760254, "global_step": 176080, "epoch": 1048} {"train_loss": -10.978139877319336, "global_step": 176081, "epoch": 1048} {"train_loss": -11.164080619812012, "global_step": 176082, "epoch": 1048} {"train_loss": -10.99644660949707, "global_step": 176083, "epoch": 1048} {"train_loss": -11.395194053649902, "global_step": 176084, "epoch": 1048} {"train_loss": -11.039899826049805, "global_step": 176085, "epoch": 1048} {"train_loss": -10.843791961669922, "global_step": 176086, "epoch": 1048} {"train_loss": -10.9008207321167, "global_step": 176087, "epoch": 1048} {"train_loss": -9.901505470275879, "global_step": 176088, "epoch": 1048} {"train_loss": -10.686009407043457, "global_step": 176089, "epoch": 1048} {"train_loss": -11.099882125854492, "global_step": 176090, "epoch": 1048} {"train_loss": -10.671247482299805, "global_step": 176091, "epoch": 1048} {"train_loss": -11.378520965576172, "global_step": 176092, "epoch": 1048} {"train_loss": -10.52358341217041, "global_step": 176093, "epoch": 1048} {"train_loss": -10.683035850524902, "global_step": 176094, "epoch": 1048} {"train_loss": -11.23570728302002, "global_step": 176095, "epoch": 1048} {"train_loss": -11.163252830505371, "global_step": 176096, "epoch": 1048} {"train_loss": -11.272359848022461, "global_step": 176097, "epoch": 1048} {"train_loss": -11.075126647949219, "global_step": 176098, "epoch": 1048} {"train_loss": -11.1229248046875, "global_step": 176099, "epoch": 1048} {"train_loss": -11.342232704162598, "global_step": 176100, "epoch": 1048} {"train_loss": -10.916162490844727, "global_step": 176101, "epoch": 1048} {"train_loss": -11.021137237548828, "global_step": 176102, "epoch": 1048} {"train_loss": -10.98187255859375, "global_step": 176103, "epoch": 1048} {"train_loss": -11.181425094604492, "global_step": 176104, "epoch": 1048} {"train_loss": -10.667545318603516, "global_step": 176105, "epoch": 1048} {"train_loss": -11.260038375854492, "global_step": 176106, "epoch": 1048} {"train_loss": -11.214329719543457, "global_step": 176107, "epoch": 1048} {"train_loss": -11.14341926574707, "global_step": 176108, "epoch": 1048} {"train_loss": -10.984029769897461, "global_step": 176109, "epoch": 1048} {"train_loss": -10.825704574584961, "global_step": 176110, "epoch": 1048} {"train_loss": -11.297012329101562, "global_step": 176111, "epoch": 1048} {"train_loss": -11.103853225708008, "global_step": 176112, "epoch": 1048} {"train_loss": -11.157220840454102, "global_step": 176113, "epoch": 1048} {"train_loss": -11.23705005645752, "global_step": 176114, "epoch": 1048} {"train_loss": -10.851046562194824, "global_step": 176115, "epoch": 1048} {"train_loss": -11.370697021484375, "global_step": 176116, "epoch": 1048} {"train_loss": -10.84864616394043, "global_step": 176117, "epoch": 1048} {"train_loss": -11.193010330200195, "global_step": 176118, "epoch": 1048} {"train_loss": -11.288846969604492, "global_step": 176119, "epoch": 1048} {"train_loss": -11.380586624145508, "global_step": 176120, "epoch": 1048} {"train_loss": -11.10853099822998, "global_step": 176121, "epoch": 1048} {"train_loss": -11.320615768432617, "global_step": 176122, "epoch": 1048} {"train_loss": -11.19582748413086, "global_step": 176123, "epoch": 1048} {"train_loss": -11.104181289672852, "global_step": 176124, "epoch": 1048} {"train_loss": -11.51321029663086, "global_step": 176125, "epoch": 1048} {"train_loss": -10.823596000671387, "global_step": 176126, "epoch": 1048} {"train_loss": -11.116761207580566, "global_step": 176127, "epoch": 1048} {"train_loss": -11.404309272766113, "global_step": 176128, "epoch": 1048} {"train_loss": -10.93415641784668, "global_step": 176129, "epoch": 1048} {"train_loss": -11.317656517028809, "global_step": 176130, "epoch": 1048} {"train_loss": -11.25326156616211, "global_step": 176131, "epoch": 1048} {"train_loss": -11.034457206726074, "global_step": 176132, "epoch": 1048} {"train_loss": -11.418773651123047, "global_step": 176133, "epoch": 1048} {"train_loss": -11.232786178588867, "global_step": 176134, "epoch": 1048} {"train_loss": -11.42646598815918, "global_step": 176135, "epoch": 1048} {"train_loss": -11.303518295288086, "global_step": 176136, "epoch": 1048} {"train_loss": -11.152904510498047, "global_step": 176137, "epoch": 1048} {"train_loss": -11.258049011230469, "global_step": 176138, "epoch": 1048} {"train_loss": -11.35129165649414, "global_step": 176139, "epoch": 1048} {"train_loss": -10.99828052520752, "global_step": 176140, "epoch": 1048} {"train_loss": -11.113197326660156, "global_step": 176141, "epoch": 1048} {"train_loss": -11.000273704528809, "global_step": 176142, "epoch": 1048} {"train_loss": -10.79946231842041, "global_step": 176143, "epoch": 1048} {"train_loss": -10.958093643188477, "global_step": 176144, "epoch": 1048} {"train_loss": -11.013267517089844, "global_step": 176145, "epoch": 1048} {"train_loss": -10.7593994140625, "global_step": 176146, "epoch": 1048} {"train_loss": -11.218239784240723, "global_step": 176147, "epoch": 1048} {"train_loss": -10.400468826293945, "global_step": 176148, "epoch": 1048} {"train_loss": -10.497987747192383, "global_step": 176149, "epoch": 1048} {"train_loss": -11.226208686828613, "global_step": 176150, "epoch": 1048} {"train_loss": -10.826845169067383, "global_step": 176151, "epoch": 1048} {"train_loss": -11.241854667663574, "global_step": 176152, "epoch": 1048} {"train_loss": -11.016340255737305, "global_step": 176153, "epoch": 1048} {"train_loss": -10.485147476196289, "global_step": 176154, "epoch": 1048} {"train_loss": -11.234919548034668, "global_step": 176155, "epoch": 1048} {"train_loss": -10.78692626953125, "global_step": 176156, "epoch": 1048} {"train_loss": -11.022672653198242, "global_step": 176157, "epoch": 1048} {"train_loss": -11.326923370361328, "global_step": 176158, "epoch": 1048} {"train_loss": -10.831438064575195, "global_step": 176159, "epoch": 1048} {"train_loss": -10.982534408569336, "global_step": 176160, "epoch": 1048} {"train_loss": -10.700511932373047, "global_step": 176161, "epoch": 1048} {"train_loss": -11.103241920471191, "global_step": 176162, "epoch": 1048} {"train_loss": -10.890192031860352, "global_step": 176163, "epoch": 1048} {"train_loss": -10.638387680053711, "global_step": 176164, "epoch": 1048} {"train_loss": -11.184277534484863, "global_step": 176165, "epoch": 1048} {"train_loss": -10.275785446166992, "global_step": 176166, "epoch": 1048} {"train_loss": -10.797687530517578, "global_step": 176167, "epoch": 1048} {"train_loss": -10.766060829162598, "global_step": 176168, "epoch": 1048} {"train_loss": -9.813886642456055, "global_step": 176169, "epoch": 1048} {"train_loss": -11.15048885345459, "global_step": 176170, "epoch": 1048} {"train_loss": -10.438193321228027, "global_step": 176171, "epoch": 1048} {"train_loss": -10.984626770019531, "global_step": 176172, "epoch": 1048} {"train_loss": -10.857657432556152, "global_step": 176173, "epoch": 1048} {"train_loss": -10.754652976989746, "global_step": 176174, "epoch": 1048} {"train_loss": -10.830774307250977, "global_step": 176175, "epoch": 1048} {"train_loss": -11.185283660888672, "global_step": 176176, "epoch": 1048} {"train_loss": -11.130241394042969, "global_step": 176177, "epoch": 1048} {"train_loss": -10.756266593933105, "global_step": 176178, "epoch": 1048} {"train_loss": -11.245844841003418, "global_step": 176179, "epoch": 1048} {"train_loss": -11.27833366394043, "global_step": 176180, "epoch": 1048} {"train_loss": -11.03399658203125, "global_step": 176181, "epoch": 1048} {"train_loss": -11.107095718383789, "global_step": 176182, "epoch": 1048} {"train_loss": -10.93615436553955, "global_step": 176183, "epoch": 1048} {"train_loss": -10.926193237304688, "global_step": 176184, "epoch": 1048} {"train_loss": -10.920096397399902, "global_step": 176185, "epoch": 1048} {"train_loss": -10.53087043762207, "global_step": 176186, "epoch": 1048} {"train_loss": -10.953929901123047, "global_step": 176187, "epoch": 1048} {"train_loss": -10.645716667175293, "global_step": 176188, "epoch": 1048} {"train_loss": -11.169102668762207, "global_step": 176189, "epoch": 1048} {"train_loss": -10.801925659179688, "global_step": 176190, "epoch": 1048} {"train_loss": -10.986427307128906, "global_step": 176191, "epoch": 1048} {"train_loss": -11.315753936767578, "global_step": 176192, "epoch": 1048} {"train_loss": -10.802657127380371, "global_step": 176193, "epoch": 1048} {"train_loss": -10.86080265045166, "global_step": 176194, "epoch": 1048} {"train_loss": -10.671794891357422, "global_step": 176195, "epoch": 1048} {"train_loss": -10.524297714233398, "global_step": 176196, "epoch": 1048} {"train_loss": -10.899551391601562, "global_step": 176197, "epoch": 1048} {"train_loss": -10.716800689697266, "global_step": 176198, "epoch": 1048} {"train_loss": -10.743743896484375, "global_step": 176199, "epoch": 1048} {"train_loss": -10.82990837097168, "global_step": 176200, "epoch": 1048} {"train_loss": -10.994325637817383, "global_step": 176201, "epoch": 1048} {"train_loss": -10.849501609802246, "global_step": 176202, "epoch": 1048} {"train_loss": -11.176240921020508, "global_step": 176203, "epoch": 1048} {"train_loss": -10.953361511230469, "global_step": 176204, "epoch": 1048} {"train_loss": -10.930957794189453, "global_step": 176205, "epoch": 1048} {"train_loss": -10.705684661865234, "global_step": 176206, "epoch": 1048} {"train_loss": -10.832975387573242, "global_step": 176207, "epoch": 1048} {"train_loss": -11.11790943145752, "global_step": 176208, "epoch": 1048} {"train_loss": -10.89899730682373, "global_step": 176209, "epoch": 1048} {"train_loss": -11.195487976074219, "global_step": 176210, "epoch": 1048} {"train_loss": -10.897306442260742, "global_step": 176211, "epoch": 1048} {"train_loss": -10.904142379760742, "global_step": 176212, "epoch": 1048} {"train_loss": -11.17735481262207, "global_step": 176213, "epoch": 1048} {"train_loss": -11.054675102233887, "global_step": 176214, "epoch": 1048} {"train_loss": -11.332427024841309, "global_step": 176215, "epoch": 1048} {"train_loss": -10.955955505371094, "global_step": 176216, "epoch": 1048} {"train_loss": -11.38128662109375, "global_step": 176217, "epoch": 1048} {"train_loss": -11.102089881896973, "global_step": 176218, "epoch": 1048} {"train_loss": -11.286503791809082, "global_step": 176219, "epoch": 1048} {"train_loss": -11.016641616821289, "global_step": 176220, "epoch": 1048} {"train_loss": -11.319637298583984, "global_step": 176221, "epoch": 1048} {"train_loss": -11.048095703125, "global_step": 176222, "epoch": 1048} {"train_loss": -11.14619255065918, "global_step": 176223, "epoch": 1048} {"train_loss": -11.191237449645996, "global_step": 176224, "epoch": 1048} {"train_loss": -11.043346405029297, "global_step": 176225, "epoch": 1048} {"train_loss": -11.266766548156738, "global_step": 176226, "epoch": 1048} {"train_loss": -11.050910949707031, "global_step": 176227, "epoch": 1048} {"train_loss": -11.293773651123047, "global_step": 176228, "epoch": 1048} {"train_loss": -11.075984954833984, "global_step": 176229, "epoch": 1048} {"train_loss": -11.23997974395752, "global_step": 176230, "epoch": 1048} {"train_loss": -11.014746597834996, "global_step": 176231, "epoch": 1048, "val_loss": 242832.28125} {"train_loss": -11.22110652923584, "global_step": 176232, "epoch": 1049} {"train_loss": -11.32737922668457, "global_step": 176233, "epoch": 1049} {"train_loss": -11.064048767089844, "global_step": 176234, "epoch": 1049} {"train_loss": -11.122020721435547, "global_step": 176235, "epoch": 1049} {"train_loss": -11.111709594726562, "global_step": 176236, "epoch": 1049} {"train_loss": -11.082139015197754, "global_step": 176237, "epoch": 1049} {"train_loss": -11.317045211791992, "global_step": 176238, "epoch": 1049} {"train_loss": -11.203598976135254, "global_step": 176239, "epoch": 1049} {"train_loss": -11.152149200439453, "global_step": 176240, "epoch": 1049} {"train_loss": -11.091080665588379, "global_step": 176241, "epoch": 1049} {"train_loss": -11.390582084655762, "global_step": 176242, "epoch": 1049} {"train_loss": -10.773442268371582, "global_step": 176243, "epoch": 1049} {"train_loss": -10.903472900390625, "global_step": 176244, "epoch": 1049} {"train_loss": -11.124162673950195, "global_step": 176245, "epoch": 1049} {"train_loss": -10.35715103149414, "global_step": 176246, "epoch": 1049} {"train_loss": -10.495920181274414, "global_step": 176247, "epoch": 1049} {"train_loss": -11.22068977355957, "global_step": 176248, "epoch": 1049} {"train_loss": -10.702554702758789, "global_step": 176249, "epoch": 1049} {"train_loss": -10.421371459960938, "global_step": 176250, "epoch": 1049} {"train_loss": -9.850606918334961, "global_step": 176251, "epoch": 1049} {"train_loss": -9.082286834716797, "global_step": 176252, "epoch": 1049} {"train_loss": -9.420953750610352, "global_step": 176253, "epoch": 1049} {"train_loss": -10.287952423095703, "global_step": 176254, "epoch": 1049} {"train_loss": -9.50599479675293, "global_step": 176255, "epoch": 1049} {"train_loss": -8.310691833496094, "global_step": 176256, "epoch": 1049} {"train_loss": -10.331912994384766, "global_step": 176257, "epoch": 1049} {"train_loss": -10.543634414672852, "global_step": 176258, "epoch": 1049} {"train_loss": -9.885990142822266, "global_step": 176259, "epoch": 1049} {"train_loss": -10.785470962524414, "global_step": 176260, "epoch": 1049} {"train_loss": -10.15926742553711, "global_step": 176261, "epoch": 1049} {"train_loss": -10.464675903320312, "global_step": 176262, "epoch": 1049} {"train_loss": -10.694473266601562, "global_step": 176263, "epoch": 1049} {"train_loss": -10.651594161987305, "global_step": 176264, "epoch": 1049} {"train_loss": -10.694059371948242, "global_step": 176265, "epoch": 1049} {"train_loss": -10.96374225616455, "global_step": 176266, "epoch": 1049} {"train_loss": -10.640625, "global_step": 176267, "epoch": 1049} {"train_loss": -10.737865447998047, "global_step": 176268, "epoch": 1049} {"train_loss": -10.830365180969238, "global_step": 176269, "epoch": 1049} {"train_loss": -10.7536039352417, "global_step": 176270, "epoch": 1049} {"train_loss": -10.861832618713379, "global_step": 176271, "epoch": 1049} {"train_loss": -10.926115036010742, "global_step": 176272, "epoch": 1049} {"train_loss": -10.476757049560547, "global_step": 176273, "epoch": 1049} {"train_loss": -10.827377319335938, "global_step": 176274, "epoch": 1049} {"train_loss": -10.484352111816406, "global_step": 176275, "epoch": 1049} {"train_loss": -10.32144546508789, "global_step": 176276, "epoch": 1049} {"train_loss": -10.673135757446289, "global_step": 176277, "epoch": 1049} {"train_loss": -10.965774536132812, "global_step": 176278, "epoch": 1049} {"train_loss": -10.333694458007812, "global_step": 176279, "epoch": 1049} {"train_loss": -10.87699031829834, "global_step": 176280, "epoch": 1049} {"train_loss": -10.71063232421875, "global_step": 176281, "epoch": 1049} {"train_loss": -10.708794593811035, "global_step": 176282, "epoch": 1049} {"train_loss": -10.739033699035645, "global_step": 176283, "epoch": 1049} {"train_loss": -10.872644424438477, "global_step": 176284, "epoch": 1049} {"train_loss": -10.790668487548828, "global_step": 176285, "epoch": 1049} {"train_loss": -10.983080863952637, "global_step": 176286, "epoch": 1049} {"train_loss": -10.8670072555542, "global_step": 176287, "epoch": 1049} {"train_loss": -11.086177825927734, "global_step": 176288, "epoch": 1049} {"train_loss": -11.074787139892578, "global_step": 176289, "epoch": 1049} {"train_loss": -10.99679183959961, "global_step": 176290, "epoch": 1049} {"train_loss": -11.092291831970215, "global_step": 176291, "epoch": 1049} {"train_loss": -10.931172370910645, "global_step": 176292, "epoch": 1049} {"train_loss": -10.680360794067383, "global_step": 176293, "epoch": 1049} {"train_loss": -11.23431396484375, "global_step": 176294, "epoch": 1049} {"train_loss": -10.694023132324219, "global_step": 176295, "epoch": 1049} {"train_loss": -11.148168563842773, "global_step": 176296, "epoch": 1049} {"train_loss": -10.78612995147705, "global_step": 176297, "epoch": 1049} {"train_loss": -11.159860610961914, "global_step": 176298, "epoch": 1049} {"train_loss": -10.883895874023438, "global_step": 176299, "epoch": 1049} {"train_loss": -11.102685928344727, "global_step": 176300, "epoch": 1049} {"train_loss": -11.04702377319336, "global_step": 176301, "epoch": 1049} {"train_loss": -10.918511390686035, "global_step": 176302, "epoch": 1049} {"train_loss": -10.997631072998047, "global_step": 176303, "epoch": 1049} {"train_loss": -10.788471221923828, "global_step": 176304, "epoch": 1049} {"train_loss": -10.938501358032227, "global_step": 176305, "epoch": 1049} {"train_loss": -10.978096008300781, "global_step": 176306, "epoch": 1049} {"train_loss": -11.046767234802246, "global_step": 176307, "epoch": 1049} {"train_loss": -11.09880542755127, "global_step": 176308, "epoch": 1049} {"train_loss": -11.193992614746094, "global_step": 176309, "epoch": 1049} {"train_loss": -11.10584831237793, "global_step": 176310, "epoch": 1049} {"train_loss": -11.246831893920898, "global_step": 176311, "epoch": 1049} {"train_loss": -11.246238708496094, "global_step": 176312, "epoch": 1049} {"train_loss": -11.037118911743164, "global_step": 176313, "epoch": 1049} {"train_loss": -11.289772033691406, "global_step": 176314, "epoch": 1049} {"train_loss": -11.084173202514648, "global_step": 176315, "epoch": 1049} {"train_loss": -11.209905624389648, "global_step": 176316, "epoch": 1049} {"train_loss": -11.016143798828125, "global_step": 176317, "epoch": 1049} {"train_loss": -11.409303665161133, "global_step": 176318, "epoch": 1049} {"train_loss": -10.933524131774902, "global_step": 176319, "epoch": 1049} {"train_loss": -11.351226806640625, "global_step": 176320, "epoch": 1049} {"train_loss": -11.03778076171875, "global_step": 176321, "epoch": 1049} {"train_loss": -11.347053527832031, "global_step": 176322, "epoch": 1049} {"train_loss": -11.131043434143066, "global_step": 176323, "epoch": 1049} {"train_loss": -11.01228141784668, "global_step": 176324, "epoch": 1049} {"train_loss": -11.36395263671875, "global_step": 176325, "epoch": 1049} {"train_loss": -11.17323112487793, "global_step": 176326, "epoch": 1049} {"train_loss": -11.363177299499512, "global_step": 176327, "epoch": 1049} {"train_loss": -11.232714653015137, "global_step": 176328, "epoch": 1049} {"train_loss": -11.330894470214844, "global_step": 176329, "epoch": 1049} {"train_loss": -11.195871353149414, "global_step": 176330, "epoch": 1049} {"train_loss": -11.323282241821289, "global_step": 176331, "epoch": 1049} {"train_loss": -11.121200561523438, "global_step": 176332, "epoch": 1049} {"train_loss": -11.333030700683594, "global_step": 176333, "epoch": 1049} {"train_loss": -10.939398765563965, "global_step": 176334, "epoch": 1049} {"train_loss": -11.51087760925293, "global_step": 176335, "epoch": 1049} {"train_loss": -11.157588958740234, "global_step": 176336, "epoch": 1049} {"train_loss": -11.50601577758789, "global_step": 176337, "epoch": 1049} {"train_loss": -11.235898971557617, "global_step": 176338, "epoch": 1049} {"train_loss": -11.25156021118164, "global_step": 176339, "epoch": 1049} {"train_loss": -11.117973327636719, "global_step": 176340, "epoch": 1049} {"train_loss": -10.879873275756836, "global_step": 176341, "epoch": 1049} {"train_loss": -11.232503890991211, "global_step": 176342, "epoch": 1049} {"train_loss": -10.937719345092773, "global_step": 176343, "epoch": 1049} {"train_loss": -11.39484977722168, "global_step": 176344, "epoch": 1049} {"train_loss": -10.98643684387207, "global_step": 176345, "epoch": 1049} {"train_loss": -10.936659812927246, "global_step": 176346, "epoch": 1049} {"train_loss": -10.785950660705566, "global_step": 176347, "epoch": 1049} {"train_loss": -10.82550048828125, "global_step": 176348, "epoch": 1049} {"train_loss": -11.043628692626953, "global_step": 176349, "epoch": 1049} {"train_loss": -10.732307434082031, "global_step": 176350, "epoch": 1049} {"train_loss": -11.106678009033203, "global_step": 176351, "epoch": 1049} {"train_loss": -10.77157974243164, "global_step": 176352, "epoch": 1049} {"train_loss": -11.332923889160156, "global_step": 176353, "epoch": 1049} {"train_loss": -11.072834014892578, "global_step": 176354, "epoch": 1049} {"train_loss": -11.009672164916992, "global_step": 176355, "epoch": 1049} {"train_loss": -11.148544311523438, "global_step": 176356, "epoch": 1049} {"train_loss": -10.740062713623047, "global_step": 176357, "epoch": 1049} {"train_loss": -11.08554744720459, "global_step": 176358, "epoch": 1049} {"train_loss": -10.677253723144531, "global_step": 176359, "epoch": 1049} {"train_loss": -11.044382095336914, "global_step": 176360, "epoch": 1049} {"train_loss": -11.142250061035156, "global_step": 176361, "epoch": 1049} {"train_loss": -11.019937515258789, "global_step": 176362, "epoch": 1049} {"train_loss": -11.230630874633789, "global_step": 176363, "epoch": 1049} {"train_loss": -11.115446090698242, "global_step": 176364, "epoch": 1049} {"train_loss": -10.87221908569336, "global_step": 176365, "epoch": 1049} {"train_loss": -10.315166473388672, "global_step": 176366, "epoch": 1049} {"train_loss": -10.771109580993652, "global_step": 176367, "epoch": 1049} {"train_loss": -11.215691566467285, "global_step": 176368, "epoch": 1049} {"train_loss": -10.41089916229248, "global_step": 176369, "epoch": 1049} {"train_loss": -10.231626510620117, "global_step": 176370, "epoch": 1049} {"train_loss": -11.14211368560791, "global_step": 176371, "epoch": 1049} {"train_loss": -10.416946411132812, "global_step": 176372, "epoch": 1049} {"train_loss": -10.351947784423828, "global_step": 176373, "epoch": 1049} {"train_loss": -11.154802322387695, "global_step": 176374, "epoch": 1049} {"train_loss": -10.766058921813965, "global_step": 176375, "epoch": 1049} {"train_loss": -10.81269645690918, "global_step": 176376, "epoch": 1049} {"train_loss": -10.975556373596191, "global_step": 176377, "epoch": 1049} {"train_loss": -10.988138198852539, "global_step": 176378, "epoch": 1049} {"train_loss": -11.183395385742188, "global_step": 176379, "epoch": 1049} {"train_loss": -10.73654842376709, "global_step": 176380, "epoch": 1049} {"train_loss": -11.168140411376953, "global_step": 176381, "epoch": 1049} {"train_loss": -11.037198066711426, "global_step": 176382, "epoch": 1049} {"train_loss": -11.143290519714355, "global_step": 176383, "epoch": 1049} {"train_loss": -10.970447540283203, "global_step": 176384, "epoch": 1049} {"train_loss": -10.998283386230469, "global_step": 176385, "epoch": 1049} {"train_loss": -10.935049057006836, "global_step": 176386, "epoch": 1049} {"train_loss": -10.981451034545898, "global_step": 176387, "epoch": 1049} {"train_loss": -11.174893379211426, "global_step": 176388, "epoch": 1049} {"train_loss": -11.2193021774292, "global_step": 176389, "epoch": 1049} {"train_loss": -10.83652114868164, "global_step": 176390, "epoch": 1049} {"train_loss": -11.03809642791748, "global_step": 176391, "epoch": 1049} {"train_loss": -11.148759841918945, "global_step": 176392, "epoch": 1049} {"train_loss": -11.114335060119629, "global_step": 176393, "epoch": 1049} {"train_loss": -11.255292892456055, "global_step": 176394, "epoch": 1049} {"train_loss": -11.215632438659668, "global_step": 176395, "epoch": 1049} {"train_loss": -11.184803009033203, "global_step": 176396, "epoch": 1049} {"train_loss": -11.116519927978516, "global_step": 176397, "epoch": 1049} {"train_loss": -11.167917251586914, "global_step": 176398, "epoch": 1049} {"train_loss": -10.911332647005716, "global_step": 176399, "epoch": 1049, "val_loss": 235668.703125} {"train_loss": -10.970693588256836, "global_step": 176400, "epoch": 1050} {"train_loss": -11.100759506225586, "global_step": 176401, "epoch": 1050} {"train_loss": -11.08952522277832, "global_step": 176402, "epoch": 1050} {"train_loss": -11.139432907104492, "global_step": 176403, "epoch": 1050} {"train_loss": -11.002274513244629, "global_step": 176404, "epoch": 1050} {"train_loss": -10.895002365112305, "global_step": 176405, "epoch": 1050} {"train_loss": -11.286531448364258, "global_step": 176406, "epoch": 1050} {"train_loss": -11.29136848449707, "global_step": 176407, "epoch": 1050} {"train_loss": -11.230653762817383, "global_step": 176408, "epoch": 1050} {"train_loss": -11.193793296813965, "global_step": 176409, "epoch": 1050} {"train_loss": -10.716899871826172, "global_step": 176410, "epoch": 1050} {"train_loss": -10.72789192199707, "global_step": 176411, "epoch": 1050} {"train_loss": -11.198896408081055, "global_step": 176412, "epoch": 1050} {"train_loss": -10.462264060974121, "global_step": 176413, "epoch": 1050} {"train_loss": -10.180026054382324, "global_step": 176414, "epoch": 1050} {"train_loss": -10.94601058959961, "global_step": 176415, "epoch": 1050} {"train_loss": -10.697001457214355, "global_step": 176416, "epoch": 1050} {"train_loss": -10.829261779785156, "global_step": 176417, "epoch": 1050} {"train_loss": -11.108687400817871, "global_step": 176418, "epoch": 1050} {"train_loss": -10.957389831542969, "global_step": 176419, "epoch": 1050} {"train_loss": -11.202430725097656, "global_step": 176420, "epoch": 1050} {"train_loss": -11.11071491241455, "global_step": 176421, "epoch": 1050} {"train_loss": -11.136959075927734, "global_step": 176422, "epoch": 1050} {"train_loss": -11.035905838012695, "global_step": 176423, "epoch": 1050} {"train_loss": -11.12997055053711, "global_step": 176424, "epoch": 1050} {"train_loss": -11.238908767700195, "global_step": 176425, "epoch": 1050} {"train_loss": -11.183757781982422, "global_step": 176426, "epoch": 1050} {"train_loss": -11.335834503173828, "global_step": 176427, "epoch": 1050} {"train_loss": -11.143190383911133, "global_step": 176428, "epoch": 1050} {"train_loss": -11.110639572143555, "global_step": 176429, "epoch": 1050} {"train_loss": -11.333272933959961, "global_step": 176430, "epoch": 1050} {"train_loss": -11.329988479614258, "global_step": 176431, "epoch": 1050} {"train_loss": -11.120410919189453, "global_step": 176432, "epoch": 1050} {"train_loss": -11.169957160949707, "global_step": 176433, "epoch": 1050} {"train_loss": -11.316437721252441, "global_step": 176434, "epoch": 1050} {"train_loss": -11.197667121887207, "global_step": 176435, "epoch": 1050} {"train_loss": -11.275955200195312, "global_step": 176436, "epoch": 1050} {"train_loss": -10.97596263885498, "global_step": 176437, "epoch": 1050} {"train_loss": -11.032776832580566, "global_step": 176438, "epoch": 1050} {"train_loss": -10.934778213500977, "global_step": 176439, "epoch": 1050} {"train_loss": -10.834016799926758, "global_step": 176440, "epoch": 1050} {"train_loss": -10.947490692138672, "global_step": 176441, "epoch": 1050} {"train_loss": -10.985696792602539, "global_step": 176442, "epoch": 1050} {"train_loss": -10.953636169433594, "global_step": 176443, "epoch": 1050} {"train_loss": -10.491661071777344, "global_step": 176444, "epoch": 1050} {"train_loss": -10.909965515136719, "global_step": 176445, "epoch": 1050} {"train_loss": -10.019617080688477, "global_step": 176446, "epoch": 1050} {"train_loss": -10.761236190795898, "global_step": 176447, "epoch": 1050} {"train_loss": -10.050519943237305, "global_step": 176448, "epoch": 1050} {"train_loss": -11.00056266784668, "global_step": 176449, "epoch": 1050} {"train_loss": -10.242719650268555, "global_step": 176450, "epoch": 1050} {"train_loss": -10.853100776672363, "global_step": 176451, "epoch": 1050} {"train_loss": -10.750093460083008, "global_step": 176452, "epoch": 1050} {"train_loss": -10.861614227294922, "global_step": 176453, "epoch": 1050} {"train_loss": -10.53866195678711, "global_step": 176454, "epoch": 1050} {"train_loss": -10.967134475708008, "global_step": 176455, "epoch": 1050} {"train_loss": -10.861902236938477, "global_step": 176456, "epoch": 1050} {"train_loss": -10.848505020141602, "global_step": 176457, "epoch": 1050} {"train_loss": -10.70316219329834, "global_step": 176458, "epoch": 1050} {"train_loss": -10.780755043029785, "global_step": 176459, "epoch": 1050} {"train_loss": -10.57274341583252, "global_step": 176460, "epoch": 1050} {"train_loss": -10.826513290405273, "global_step": 176461, "epoch": 1050} {"train_loss": -10.952104568481445, "global_step": 176462, "epoch": 1050} {"train_loss": -11.00330638885498, "global_step": 176463, "epoch": 1050} {"train_loss": -10.368803024291992, "global_step": 176464, "epoch": 1050} {"train_loss": -11.019357681274414, "global_step": 176465, "epoch": 1050} {"train_loss": -10.648194313049316, "global_step": 176466, "epoch": 1050} {"train_loss": -10.555567741394043, "global_step": 176467, "epoch": 1050} {"train_loss": -11.1118803024292, "global_step": 176468, "epoch": 1050} {"train_loss": -10.55645751953125, "global_step": 176469, "epoch": 1050} {"train_loss": -11.051004409790039, "global_step": 176470, "epoch": 1050} {"train_loss": -10.704305648803711, "global_step": 176471, "epoch": 1050} {"train_loss": -11.107193946838379, "global_step": 176472, "epoch": 1050} {"train_loss": -10.879351615905762, "global_step": 176473, "epoch": 1050} {"train_loss": -10.976029396057129, "global_step": 176474, "epoch": 1050} {"train_loss": -11.031391143798828, "global_step": 176475, "epoch": 1050} {"train_loss": -10.76606559753418, "global_step": 176476, "epoch": 1050} {"train_loss": -11.256868362426758, "global_step": 176477, "epoch": 1050} {"train_loss": -10.707273483276367, "global_step": 176478, "epoch": 1050} {"train_loss": -11.127522468566895, "global_step": 176479, "epoch": 1050} {"train_loss": -11.119693756103516, "global_step": 176480, "epoch": 1050} {"train_loss": -10.936748504638672, "global_step": 176481, "epoch": 1050} {"train_loss": -10.429346084594727, "global_step": 176482, "epoch": 1050} {"train_loss": -11.17357349395752, "global_step": 176483, "epoch": 1050} {"train_loss": -10.788267135620117, "global_step": 176484, "epoch": 1050} {"train_loss": -11.257020950317383, "global_step": 176485, "epoch": 1050} {"train_loss": -11.325183868408203, "global_step": 176486, "epoch": 1050} {"train_loss": -10.985925674438477, "global_step": 176487, "epoch": 1050} {"train_loss": -11.13952350616455, "global_step": 176488, "epoch": 1050} {"train_loss": -11.131546020507812, "global_step": 176489, "epoch": 1050} {"train_loss": -10.947680473327637, "global_step": 176490, "epoch": 1050} {"train_loss": -11.445396423339844, "global_step": 176491, "epoch": 1050} {"train_loss": -11.134363174438477, "global_step": 176492, "epoch": 1050} {"train_loss": -11.421623229980469, "global_step": 176493, "epoch": 1050} {"train_loss": -11.07205867767334, "global_step": 176494, "epoch": 1050} {"train_loss": -11.377141952514648, "global_step": 176495, "epoch": 1050} {"train_loss": -11.114295959472656, "global_step": 176496, "epoch": 1050} {"train_loss": -11.166460037231445, "global_step": 176497, "epoch": 1050} {"train_loss": -11.202707290649414, "global_step": 176498, "epoch": 1050} {"train_loss": -11.257068634033203, "global_step": 176499, "epoch": 1050} {"train_loss": -11.571916580200195, "global_step": 176500, "epoch": 1050} {"train_loss": -11.297460556030273, "global_step": 176501, "epoch": 1050} {"train_loss": -11.176925659179688, "global_step": 176502, "epoch": 1050} {"train_loss": -11.21501350402832, "global_step": 176503, "epoch": 1050} {"train_loss": -11.404048919677734, "global_step": 176504, "epoch": 1050} {"train_loss": -11.194390296936035, "global_step": 176505, "epoch": 1050} {"train_loss": -11.452045440673828, "global_step": 176506, "epoch": 1050} {"train_loss": -11.425609588623047, "global_step": 176507, "epoch": 1050} {"train_loss": -11.232929229736328, "global_step": 176508, "epoch": 1050} {"train_loss": -11.404987335205078, "global_step": 176509, "epoch": 1050} {"train_loss": -11.244711875915527, "global_step": 176510, "epoch": 1050} {"train_loss": -11.385017395019531, "global_step": 176511, "epoch": 1050} {"train_loss": -11.322677612304688, "global_step": 176512, "epoch": 1050} {"train_loss": -11.482604026794434, "global_step": 176513, "epoch": 1050} {"train_loss": -11.312261581420898, "global_step": 176514, "epoch": 1050} {"train_loss": -11.227986335754395, "global_step": 176515, "epoch": 1050} {"train_loss": -11.471952438354492, "global_step": 176516, "epoch": 1050} {"train_loss": -11.494115829467773, "global_step": 176517, "epoch": 1050} {"train_loss": -11.241848945617676, "global_step": 176518, "epoch": 1050} {"train_loss": -11.404809951782227, "global_step": 176519, "epoch": 1050} {"train_loss": -11.283468246459961, "global_step": 176520, "epoch": 1050} {"train_loss": -11.262368202209473, "global_step": 176521, "epoch": 1050} {"train_loss": -11.445976257324219, "global_step": 176522, "epoch": 1050} {"train_loss": -11.242867469787598, "global_step": 176523, "epoch": 1050} {"train_loss": -10.696858406066895, "global_step": 176524, "epoch": 1050} {"train_loss": -10.816779136657715, "global_step": 176525, "epoch": 1050} {"train_loss": -10.713882446289062, "global_step": 176526, "epoch": 1050} {"train_loss": -11.254419326782227, "global_step": 176527, "epoch": 1050} {"train_loss": -10.66309642791748, "global_step": 176528, "epoch": 1050} {"train_loss": -11.18263053894043, "global_step": 176529, "epoch": 1050} {"train_loss": -10.562438011169434, "global_step": 176530, "epoch": 1050} {"train_loss": -10.531420707702637, "global_step": 176531, "epoch": 1050} {"train_loss": -11.134540557861328, "global_step": 176532, "epoch": 1050} {"train_loss": -10.495305061340332, "global_step": 176533, "epoch": 1050} {"train_loss": -11.216361999511719, "global_step": 176534, "epoch": 1050} {"train_loss": -10.797266960144043, "global_step": 176535, "epoch": 1050} {"train_loss": -10.530782699584961, "global_step": 176536, "epoch": 1050} {"train_loss": -11.274871826171875, "global_step": 176537, "epoch": 1050} {"train_loss": -11.196685791015625, "global_step": 176538, "epoch": 1050} {"train_loss": -11.106122016906738, "global_step": 176539, "epoch": 1050} {"train_loss": -11.07778263092041, "global_step": 176540, "epoch": 1050} {"train_loss": -10.878128051757812, "global_step": 176541, "epoch": 1050} {"train_loss": -11.32841682434082, "global_step": 176542, "epoch": 1050} {"train_loss": -11.271051406860352, "global_step": 176543, "epoch": 1050} {"train_loss": -11.079069137573242, "global_step": 176544, "epoch": 1050} {"train_loss": -11.082940101623535, "global_step": 176545, "epoch": 1050} {"train_loss": -11.344377517700195, "global_step": 176546, "epoch": 1050} {"train_loss": -11.190378189086914, "global_step": 176547, "epoch": 1050} {"train_loss": -11.176493644714355, "global_step": 176548, "epoch": 1050} {"train_loss": -11.153069496154785, "global_step": 176549, "epoch": 1050} {"train_loss": -11.472474098205566, "global_step": 176550, "epoch": 1050} {"train_loss": -11.122894287109375, "global_step": 176551, "epoch": 1050} {"train_loss": -11.42287826538086, "global_step": 176552, "epoch": 1050} {"train_loss": -11.332329750061035, "global_step": 176553, "epoch": 1050} {"train_loss": -11.27022933959961, "global_step": 176554, "epoch": 1050} {"train_loss": -11.420616149902344, "global_step": 176555, "epoch": 1050} {"train_loss": -11.464052200317383, "global_step": 176556, "epoch": 1050} {"train_loss": -11.328324317932129, "global_step": 176557, "epoch": 1050} {"train_loss": -11.387470245361328, "global_step": 176558, "epoch": 1050} {"train_loss": -11.515161514282227, "global_step": 176559, "epoch": 1050} {"train_loss": -11.225619316101074, "global_step": 176560, "epoch": 1050} {"train_loss": -11.28113842010498, "global_step": 176561, "epoch": 1050} {"train_loss": -10.567185401916504, "global_step": 176562, "epoch": 1050} {"train_loss": -10.850330352783203, "global_step": 176563, "epoch": 1050} {"train_loss": -10.922225952148438, "global_step": 176564, "epoch": 1050} {"train_loss": -10.637840270996094, "global_step": 176565, "epoch": 1050} {"train_loss": -10.858377456665039, "global_step": 176566, "epoch": 1050} {"train_loss": -11.042256139573597, "global_step": 176567, "epoch": 1050, "train/sim_max_reward_0": 0.7058140152359585, "train/sim_max_reward_1": 0.946667704634238, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.977479632746017, "train/sim_max_reward_5": 0.5355923654728834, "test/sim_max_reward_4400000": 0.28175326047576305, "test/sim_max_reward_4400001": 0.364932942673326, "test/sim_max_reward_4400002": 0.9973379527420058, "test/sim_max_reward_4400003": 0.06357807717109666, "test/sim_max_reward_4400004": 0.5536329669904398, "test/sim_max_reward_4400005": 0.9728353120452424, "test/sim_max_reward_4400006": 0.536207122758185, "test/sim_max_reward_4400007": 0.9813413744230727, "test/sim_max_reward_4400008": 0.5383711153914227, "test/sim_max_reward_4400009": 0.030719245219636905, "test/sim_max_reward_4400010": 0.9949365281137841, "test/sim_max_reward_4400011": 0.988513043115253, "test/sim_max_reward_4400012": 0.9582294922894831, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.994685311426148, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.41169696133425343, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.5175708178631364, "test/sim_max_reward_4400021": 0.5537346816804123, "test/sim_max_reward_4400022": 0.9863337976132397, "test/sim_max_reward_4400023": 0.1318632772526034, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.5992585544021667, "test/sim_max_reward_4400026": 0.05854271404182818, "test/sim_max_reward_4400027": 0.9812537531200077, "test/sim_max_reward_4400028": 1.0, "test/sim_max_reward_4400029": 0.45962323607590205, "test/sim_max_reward_4400030": 0.9625692710239838, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.17302002754822962, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 1.0, "test/sim_max_reward_4400036": 0.4927157020376689, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.9869428507433281, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.17213107967474614, "test/sim_max_reward_4400042": 0.04074093812777559, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.991886617023709, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6942589530148494, "test/mean_score": 0.5975052934243898, "val_loss": 239914.3125, "train_action_mse_error": 1.3472957611083984} {"train_loss": -11.092233657836914, "global_step": 176568, "epoch": 1051} {"train_loss": -10.915261268615723, "global_step": 176569, "epoch": 1051} {"train_loss": -10.776925086975098, "global_step": 176570, "epoch": 1051} {"train_loss": -10.523115158081055, "global_step": 176571, "epoch": 1051} {"train_loss": -11.130512237548828, "global_step": 176572, "epoch": 1051} {"train_loss": -9.996423721313477, "global_step": 176573, "epoch": 1051} {"train_loss": -11.045339584350586, "global_step": 176574, "epoch": 1051} {"train_loss": -9.878751754760742, "global_step": 176575, "epoch": 1051} {"train_loss": -8.643512725830078, "global_step": 176576, "epoch": 1051} {"train_loss": -10.657608032226562, "global_step": 176577, "epoch": 1051} {"train_loss": -9.071584701538086, "global_step": 176578, "epoch": 1051} {"train_loss": -10.150590896606445, "global_step": 176579, "epoch": 1051} {"train_loss": -9.058372497558594, "global_step": 176580, "epoch": 1051} {"train_loss": -9.925005912780762, "global_step": 176581, "epoch": 1051} {"train_loss": -9.266308784484863, "global_step": 176582, "epoch": 1051} {"train_loss": -10.37428092956543, "global_step": 176583, "epoch": 1051} {"train_loss": -9.25436782836914, "global_step": 176584, "epoch": 1051} {"train_loss": -9.80282211303711, "global_step": 176585, "epoch": 1051} {"train_loss": -9.805045127868652, "global_step": 176586, "epoch": 1051} {"train_loss": -10.209136962890625, "global_step": 176587, "epoch": 1051} {"train_loss": -10.222482681274414, "global_step": 176588, "epoch": 1051} {"train_loss": -10.596134185791016, "global_step": 176589, "epoch": 1051} {"train_loss": -10.310160636901855, "global_step": 176590, "epoch": 1051} {"train_loss": -10.088414192199707, "global_step": 176591, "epoch": 1051} {"train_loss": -10.83459186553955, "global_step": 176592, "epoch": 1051} {"train_loss": -9.96817398071289, "global_step": 176593, "epoch": 1051} {"train_loss": -10.718779563903809, "global_step": 176594, "epoch": 1051} {"train_loss": -9.819563865661621, "global_step": 176595, "epoch": 1051} {"train_loss": -10.462393760681152, "global_step": 176596, "epoch": 1051} {"train_loss": -10.509556770324707, "global_step": 176597, "epoch": 1051} {"train_loss": -10.546110153198242, "global_step": 176598, "epoch": 1051} {"train_loss": -10.674337387084961, "global_step": 176599, "epoch": 1051} {"train_loss": -10.486446380615234, "global_step": 176600, "epoch": 1051} {"train_loss": -10.971963882446289, "global_step": 176601, "epoch": 1051} {"train_loss": -11.01451301574707, "global_step": 176602, "epoch": 1051} {"train_loss": -10.627144813537598, "global_step": 176603, "epoch": 1051} {"train_loss": -10.78775405883789, "global_step": 176604, "epoch": 1051} {"train_loss": -10.754377365112305, "global_step": 176605, "epoch": 1051} {"train_loss": -10.730428695678711, "global_step": 176606, "epoch": 1051} {"train_loss": -10.835773468017578, "global_step": 176607, "epoch": 1051} {"train_loss": -10.999786376953125, "global_step": 176608, "epoch": 1051} {"train_loss": -10.86838150024414, "global_step": 176609, "epoch": 1051} {"train_loss": -10.961950302124023, "global_step": 176610, "epoch": 1051} {"train_loss": -11.168075561523438, "global_step": 176611, "epoch": 1051} {"train_loss": -10.897449493408203, "global_step": 176612, "epoch": 1051} {"train_loss": -11.192963600158691, "global_step": 176613, "epoch": 1051} {"train_loss": -10.934013366699219, "global_step": 176614, "epoch": 1051} {"train_loss": -11.138566017150879, "global_step": 176615, "epoch": 1051} {"train_loss": -11.044100761413574, "global_step": 176616, "epoch": 1051} {"train_loss": -11.17380142211914, "global_step": 176617, "epoch": 1051} {"train_loss": -11.070137023925781, "global_step": 176618, "epoch": 1051} {"train_loss": -11.345478057861328, "global_step": 176619, "epoch": 1051} {"train_loss": -11.142822265625, "global_step": 176620, "epoch": 1051} {"train_loss": -11.225410461425781, "global_step": 176621, "epoch": 1051} {"train_loss": -11.072511672973633, "global_step": 176622, "epoch": 1051} {"train_loss": -11.20930290222168, "global_step": 176623, "epoch": 1051} {"train_loss": -11.059576988220215, "global_step": 176624, "epoch": 1051} {"train_loss": -11.25568962097168, "global_step": 176625, "epoch": 1051} {"train_loss": -10.978822708129883, "global_step": 176626, "epoch": 1051} {"train_loss": -11.287483215332031, "global_step": 176627, "epoch": 1051} {"train_loss": -11.11270809173584, "global_step": 176628, "epoch": 1051} {"train_loss": -11.155477523803711, "global_step": 176629, "epoch": 1051} {"train_loss": -11.271705627441406, "global_step": 176630, "epoch": 1051} {"train_loss": -11.338544845581055, "global_step": 176631, "epoch": 1051} {"train_loss": -11.169455528259277, "global_step": 176632, "epoch": 1051} {"train_loss": -11.381683349609375, "global_step": 176633, "epoch": 1051} {"train_loss": -11.274473190307617, "global_step": 176634, "epoch": 1051} {"train_loss": -11.296161651611328, "global_step": 176635, "epoch": 1051} {"train_loss": -11.159786224365234, "global_step": 176636, "epoch": 1051} {"train_loss": -11.441566467285156, "global_step": 176637, "epoch": 1051} {"train_loss": -11.20925521850586, "global_step": 176638, "epoch": 1051} {"train_loss": -11.535090446472168, "global_step": 176639, "epoch": 1051} {"train_loss": -11.188825607299805, "global_step": 176640, "epoch": 1051} {"train_loss": -11.314817428588867, "global_step": 176641, "epoch": 1051} {"train_loss": -11.39406681060791, "global_step": 176642, "epoch": 1051} {"train_loss": -11.153324127197266, "global_step": 176643, "epoch": 1051} {"train_loss": -11.086788177490234, "global_step": 176644, "epoch": 1051} {"train_loss": -11.107808113098145, "global_step": 176645, "epoch": 1051} {"train_loss": -11.42086410522461, "global_step": 176646, "epoch": 1051} {"train_loss": -11.444781303405762, "global_step": 176647, "epoch": 1051} {"train_loss": -11.285146713256836, "global_step": 176648, "epoch": 1051} {"train_loss": -11.316911697387695, "global_step": 176649, "epoch": 1051} {"train_loss": -11.302608489990234, "global_step": 176650, "epoch": 1051} {"train_loss": -11.46180248260498, "global_step": 176651, "epoch": 1051} {"train_loss": -11.635778427124023, "global_step": 176652, "epoch": 1051} {"train_loss": -11.036466598510742, "global_step": 176653, "epoch": 1051} {"train_loss": -10.843303680419922, "global_step": 176654, "epoch": 1051} {"train_loss": -11.497600555419922, "global_step": 176655, "epoch": 1051} {"train_loss": -11.300867080688477, "global_step": 176656, "epoch": 1051} {"train_loss": -10.602232933044434, "global_step": 176657, "epoch": 1051} {"train_loss": -10.593351364135742, "global_step": 176658, "epoch": 1051} {"train_loss": -10.941784858703613, "global_step": 176659, "epoch": 1051} {"train_loss": -11.175222396850586, "global_step": 176660, "epoch": 1051} {"train_loss": -10.296846389770508, "global_step": 176661, "epoch": 1051} {"train_loss": -10.504538536071777, "global_step": 176662, "epoch": 1051} {"train_loss": -11.452900886535645, "global_step": 176663, "epoch": 1051} {"train_loss": -11.283082008361816, "global_step": 176664, "epoch": 1051} {"train_loss": -11.364690780639648, "global_step": 176665, "epoch": 1051} {"train_loss": -11.004890441894531, "global_step": 176666, "epoch": 1051} {"train_loss": -11.135148048400879, "global_step": 176667, "epoch": 1051} {"train_loss": -11.266056060791016, "global_step": 176668, "epoch": 1051} {"train_loss": -11.0777006149292, "global_step": 176669, "epoch": 1051} {"train_loss": -10.732242584228516, "global_step": 176670, "epoch": 1051} {"train_loss": -11.316619873046875, "global_step": 176671, "epoch": 1051} {"train_loss": -10.892818450927734, "global_step": 176672, "epoch": 1051} {"train_loss": -10.437583923339844, "global_step": 176673, "epoch": 1051} {"train_loss": -11.230307579040527, "global_step": 176674, "epoch": 1051} {"train_loss": -10.888713836669922, "global_step": 176675, "epoch": 1051} {"train_loss": -10.816768646240234, "global_step": 176676, "epoch": 1051} {"train_loss": -10.560897827148438, "global_step": 176677, "epoch": 1051} {"train_loss": -11.13704776763916, "global_step": 176678, "epoch": 1051} {"train_loss": -11.018310546875, "global_step": 176679, "epoch": 1051} {"train_loss": -10.799450874328613, "global_step": 176680, "epoch": 1051} {"train_loss": -10.897712707519531, "global_step": 176681, "epoch": 1051} {"train_loss": -10.878935813903809, "global_step": 176682, "epoch": 1051} {"train_loss": -10.711246490478516, "global_step": 176683, "epoch": 1051} {"train_loss": -11.406366348266602, "global_step": 176684, "epoch": 1051} {"train_loss": -10.629652976989746, "global_step": 176685, "epoch": 1051} {"train_loss": -11.141481399536133, "global_step": 176686, "epoch": 1051} {"train_loss": -10.985249519348145, "global_step": 176687, "epoch": 1051} {"train_loss": -10.700441360473633, "global_step": 176688, "epoch": 1051} {"train_loss": -10.948441505432129, "global_step": 176689, "epoch": 1051} {"train_loss": -10.883539199829102, "global_step": 176690, "epoch": 1051} {"train_loss": -10.937434196472168, "global_step": 176691, "epoch": 1051} {"train_loss": -10.46760082244873, "global_step": 176692, "epoch": 1051} {"train_loss": -10.923059463500977, "global_step": 176693, "epoch": 1051} {"train_loss": -10.960033416748047, "global_step": 176694, "epoch": 1051} {"train_loss": -10.70095157623291, "global_step": 176695, "epoch": 1051} {"train_loss": -10.121005058288574, "global_step": 176696, "epoch": 1051} {"train_loss": -10.381979942321777, "global_step": 176697, "epoch": 1051} {"train_loss": -10.196791648864746, "global_step": 176698, "epoch": 1051} {"train_loss": -9.994099617004395, "global_step": 176699, "epoch": 1051} {"train_loss": -11.119316101074219, "global_step": 176700, "epoch": 1051} {"train_loss": -9.823492050170898, "global_step": 176701, "epoch": 1051} {"train_loss": -10.84011459350586, "global_step": 176702, "epoch": 1051} {"train_loss": -11.092660903930664, "global_step": 176703, "epoch": 1051} {"train_loss": -10.858353614807129, "global_step": 176704, "epoch": 1051} {"train_loss": -10.955562591552734, "global_step": 176705, "epoch": 1051} {"train_loss": -10.8104829788208, "global_step": 176706, "epoch": 1051} {"train_loss": -10.828795433044434, "global_step": 176707, "epoch": 1051} {"train_loss": -10.98035717010498, "global_step": 176708, "epoch": 1051} {"train_loss": -11.045734405517578, "global_step": 176709, "epoch": 1051} {"train_loss": -11.188138008117676, "global_step": 176710, "epoch": 1051} {"train_loss": -11.020031929016113, "global_step": 176711, "epoch": 1051} {"train_loss": -10.919719696044922, "global_step": 176712, "epoch": 1051} {"train_loss": -10.848636627197266, "global_step": 176713, "epoch": 1051} {"train_loss": -11.101716041564941, "global_step": 176714, "epoch": 1051} {"train_loss": -10.827909469604492, "global_step": 176715, "epoch": 1051} {"train_loss": -11.036958694458008, "global_step": 176716, "epoch": 1051} {"train_loss": -11.00336742401123, "global_step": 176717, "epoch": 1051} {"train_loss": -11.217079162597656, "global_step": 176718, "epoch": 1051} {"train_loss": -11.108633041381836, "global_step": 176719, "epoch": 1051} {"train_loss": -11.19874382019043, "global_step": 176720, "epoch": 1051} {"train_loss": -11.04813003540039, "global_step": 176721, "epoch": 1051} {"train_loss": -11.288592338562012, "global_step": 176722, "epoch": 1051} {"train_loss": -11.180137634277344, "global_step": 176723, "epoch": 1051} {"train_loss": -11.036520004272461, "global_step": 176724, "epoch": 1051} {"train_loss": -11.062938690185547, "global_step": 176725, "epoch": 1051} {"train_loss": -11.014994621276855, "global_step": 176726, "epoch": 1051} {"train_loss": -11.3029203414917, "global_step": 176727, "epoch": 1051} {"train_loss": -10.863409042358398, "global_step": 176728, "epoch": 1051} {"train_loss": -11.142016410827637, "global_step": 176729, "epoch": 1051} {"train_loss": -11.214614868164062, "global_step": 176730, "epoch": 1051} {"train_loss": -11.142576217651367, "global_step": 176731, "epoch": 1051} {"train_loss": -11.37855052947998, "global_step": 176732, "epoch": 1051} {"train_loss": -11.052328109741211, "global_step": 176733, "epoch": 1051} {"train_loss": -11.341898918151855, "global_step": 176734, "epoch": 1051} {"train_loss": -10.864028266498021, "global_step": 176735, "epoch": 1051, "val_loss": 243866.46875} {"train_loss": -11.318815231323242, "global_step": 176736, "epoch": 1052} {"train_loss": -11.477217674255371, "global_step": 176737, "epoch": 1052} {"train_loss": -11.17810344696045, "global_step": 176738, "epoch": 1052} {"train_loss": -11.474980354309082, "global_step": 176739, "epoch": 1052} {"train_loss": -11.41165542602539, "global_step": 176740, "epoch": 1052} {"train_loss": -11.300468444824219, "global_step": 176741, "epoch": 1052} {"train_loss": -11.373564720153809, "global_step": 176742, "epoch": 1052} {"train_loss": -11.28568172454834, "global_step": 176743, "epoch": 1052} {"train_loss": -11.604765892028809, "global_step": 176744, "epoch": 1052} {"train_loss": -11.220785140991211, "global_step": 176745, "epoch": 1052} {"train_loss": -11.451777458190918, "global_step": 176746, "epoch": 1052} {"train_loss": -11.338586807250977, "global_step": 176747, "epoch": 1052} {"train_loss": -11.121416091918945, "global_step": 176748, "epoch": 1052} {"train_loss": -11.4050874710083, "global_step": 176749, "epoch": 1052} {"train_loss": -11.519762992858887, "global_step": 176750, "epoch": 1052} {"train_loss": -10.711931228637695, "global_step": 176751, "epoch": 1052} {"train_loss": -10.835641860961914, "global_step": 176752, "epoch": 1052} {"train_loss": -11.403671264648438, "global_step": 176753, "epoch": 1052} {"train_loss": -10.63869571685791, "global_step": 176754, "epoch": 1052} {"train_loss": -11.110158920288086, "global_step": 176755, "epoch": 1052} {"train_loss": -11.20979118347168, "global_step": 176756, "epoch": 1052} {"train_loss": -10.135889053344727, "global_step": 176757, "epoch": 1052} {"train_loss": -10.940840721130371, "global_step": 176758, "epoch": 1052} {"train_loss": -10.422975540161133, "global_step": 176759, "epoch": 1052} {"train_loss": -9.961030960083008, "global_step": 176760, "epoch": 1052} {"train_loss": -10.781779289245605, "global_step": 176761, "epoch": 1052} {"train_loss": -10.70714282989502, "global_step": 176762, "epoch": 1052} {"train_loss": -10.913244247436523, "global_step": 176763, "epoch": 1052} {"train_loss": -10.702484130859375, "global_step": 176764, "epoch": 1052} {"train_loss": -10.561652183532715, "global_step": 176765, "epoch": 1052} {"train_loss": -10.177305221557617, "global_step": 176766, "epoch": 1052} {"train_loss": -9.823874473571777, "global_step": 176767, "epoch": 1052} {"train_loss": -9.821378707885742, "global_step": 176768, "epoch": 1052} {"train_loss": -9.900447845458984, "global_step": 176769, "epoch": 1052} {"train_loss": -9.878263473510742, "global_step": 176770, "epoch": 1052} {"train_loss": -9.623635292053223, "global_step": 176771, "epoch": 1052} {"train_loss": -10.138628005981445, "global_step": 176772, "epoch": 1052} {"train_loss": -10.14326000213623, "global_step": 176773, "epoch": 1052} {"train_loss": -10.269388198852539, "global_step": 176774, "epoch": 1052} {"train_loss": -10.106433868408203, "global_step": 176775, "epoch": 1052} {"train_loss": -10.224254608154297, "global_step": 176776, "epoch": 1052} {"train_loss": -9.278366088867188, "global_step": 176777, "epoch": 1052} {"train_loss": -10.408855438232422, "global_step": 176778, "epoch": 1052} {"train_loss": -9.850933074951172, "global_step": 176779, "epoch": 1052} {"train_loss": -9.916934967041016, "global_step": 176780, "epoch": 1052} {"train_loss": -10.56403636932373, "global_step": 176781, "epoch": 1052} {"train_loss": -9.803937911987305, "global_step": 176782, "epoch": 1052} {"train_loss": -10.429617881774902, "global_step": 176783, "epoch": 1052} {"train_loss": -10.271190643310547, "global_step": 176784, "epoch": 1052} {"train_loss": -10.266769409179688, "global_step": 176785, "epoch": 1052} {"train_loss": -9.91331672668457, "global_step": 176786, "epoch": 1052} {"train_loss": -10.804605484008789, "global_step": 176787, "epoch": 1052} {"train_loss": -10.125584602355957, "global_step": 176788, "epoch": 1052} {"train_loss": -10.591819763183594, "global_step": 176789, "epoch": 1052} {"train_loss": -10.636566162109375, "global_step": 176790, "epoch": 1052} {"train_loss": -10.701349258422852, "global_step": 176791, "epoch": 1052} {"train_loss": -10.604280471801758, "global_step": 176792, "epoch": 1052} {"train_loss": -10.455507278442383, "global_step": 176793, "epoch": 1052} {"train_loss": -10.907732963562012, "global_step": 176794, "epoch": 1052} {"train_loss": -10.550479888916016, "global_step": 176795, "epoch": 1052} {"train_loss": -10.75291633605957, "global_step": 176796, "epoch": 1052} {"train_loss": -10.74087905883789, "global_step": 176797, "epoch": 1052} {"train_loss": -10.714350700378418, "global_step": 176798, "epoch": 1052} {"train_loss": -10.44941520690918, "global_step": 176799, "epoch": 1052} {"train_loss": -10.920831680297852, "global_step": 176800, "epoch": 1052} {"train_loss": -10.761703491210938, "global_step": 176801, "epoch": 1052} {"train_loss": -10.714366912841797, "global_step": 176802, "epoch": 1052} {"train_loss": -11.041227340698242, "global_step": 176803, "epoch": 1052} {"train_loss": -10.846916198730469, "global_step": 176804, "epoch": 1052} {"train_loss": -10.803678512573242, "global_step": 176805, "epoch": 1052} {"train_loss": -10.696152687072754, "global_step": 176806, "epoch": 1052} {"train_loss": -10.79726791381836, "global_step": 176807, "epoch": 1052} {"train_loss": -10.95266056060791, "global_step": 176808, "epoch": 1052} {"train_loss": -11.03321361541748, "global_step": 176809, "epoch": 1052} {"train_loss": -10.815078735351562, "global_step": 176810, "epoch": 1052} {"train_loss": -11.097960472106934, "global_step": 176811, "epoch": 1052} {"train_loss": -10.765926361083984, "global_step": 176812, "epoch": 1052} {"train_loss": -10.844545364379883, "global_step": 176813, "epoch": 1052} {"train_loss": -11.283443450927734, "global_step": 176814, "epoch": 1052} {"train_loss": -10.603893280029297, "global_step": 176815, "epoch": 1052} {"train_loss": -11.074796676635742, "global_step": 176816, "epoch": 1052} {"train_loss": -11.09404182434082, "global_step": 176817, "epoch": 1052} {"train_loss": -11.012630462646484, "global_step": 176818, "epoch": 1052} {"train_loss": -11.142505645751953, "global_step": 176819, "epoch": 1052} {"train_loss": -11.089585304260254, "global_step": 176820, "epoch": 1052} {"train_loss": -11.041082382202148, "global_step": 176821, "epoch": 1052} {"train_loss": -11.007530212402344, "global_step": 176822, "epoch": 1052} {"train_loss": -11.245400428771973, "global_step": 176823, "epoch": 1052} {"train_loss": -11.22704792022705, "global_step": 176824, "epoch": 1052} {"train_loss": -11.334209442138672, "global_step": 176825, "epoch": 1052} {"train_loss": -11.056681632995605, "global_step": 176826, "epoch": 1052} {"train_loss": -11.278172492980957, "global_step": 176827, "epoch": 1052} {"train_loss": -11.295011520385742, "global_step": 176828, "epoch": 1052} {"train_loss": -11.069316864013672, "global_step": 176829, "epoch": 1052} {"train_loss": -11.346061706542969, "global_step": 176830, "epoch": 1052} {"train_loss": -11.24349594116211, "global_step": 176831, "epoch": 1052} {"train_loss": -11.401342391967773, "global_step": 176832, "epoch": 1052} {"train_loss": -11.389379501342773, "global_step": 176833, "epoch": 1052} {"train_loss": -11.267143249511719, "global_step": 176834, "epoch": 1052} {"train_loss": -11.425506591796875, "global_step": 176835, "epoch": 1052} {"train_loss": -11.312774658203125, "global_step": 176836, "epoch": 1052} {"train_loss": -11.276787757873535, "global_step": 176837, "epoch": 1052} {"train_loss": -11.2498197555542, "global_step": 176838, "epoch": 1052} {"train_loss": -11.219234466552734, "global_step": 176839, "epoch": 1052} {"train_loss": -11.182735443115234, "global_step": 176840, "epoch": 1052} {"train_loss": -10.782820701599121, "global_step": 176841, "epoch": 1052} {"train_loss": -11.292049407958984, "global_step": 176842, "epoch": 1052} {"train_loss": -11.26518440246582, "global_step": 176843, "epoch": 1052} {"train_loss": -11.135257720947266, "global_step": 176844, "epoch": 1052} {"train_loss": -11.515752792358398, "global_step": 176845, "epoch": 1052} {"train_loss": -11.233474731445312, "global_step": 176846, "epoch": 1052} {"train_loss": -11.106708526611328, "global_step": 176847, "epoch": 1052} {"train_loss": -11.210373878479004, "global_step": 176848, "epoch": 1052} {"train_loss": -11.302010536193848, "global_step": 176849, "epoch": 1052} {"train_loss": -11.090618133544922, "global_step": 176850, "epoch": 1052} {"train_loss": -11.146440505981445, "global_step": 176851, "epoch": 1052} {"train_loss": -11.312997817993164, "global_step": 176852, "epoch": 1052} {"train_loss": -11.063884735107422, "global_step": 176853, "epoch": 1052} {"train_loss": -11.465335845947266, "global_step": 176854, "epoch": 1052} {"train_loss": -11.058394432067871, "global_step": 176855, "epoch": 1052} {"train_loss": -11.492311477661133, "global_step": 176856, "epoch": 1052} {"train_loss": -11.135868072509766, "global_step": 176857, "epoch": 1052} {"train_loss": -11.420745849609375, "global_step": 176858, "epoch": 1052} {"train_loss": -11.204471588134766, "global_step": 176859, "epoch": 1052} {"train_loss": -10.90554428100586, "global_step": 176860, "epoch": 1052} {"train_loss": -10.938677787780762, "global_step": 176861, "epoch": 1052} {"train_loss": -11.196836471557617, "global_step": 176862, "epoch": 1052} {"train_loss": -10.820886611938477, "global_step": 176863, "epoch": 1052} {"train_loss": -9.419124603271484, "global_step": 176864, "epoch": 1052} {"train_loss": -11.185630798339844, "global_step": 176865, "epoch": 1052} {"train_loss": -9.66578483581543, "global_step": 176866, "epoch": 1052} {"train_loss": -10.31396484375, "global_step": 176867, "epoch": 1052} {"train_loss": -10.49443244934082, "global_step": 176868, "epoch": 1052} {"train_loss": -8.827142715454102, "global_step": 176869, "epoch": 1052} {"train_loss": -9.375962257385254, "global_step": 176870, "epoch": 1052} {"train_loss": -9.916555404663086, "global_step": 176871, "epoch": 1052} {"train_loss": -9.23923110961914, "global_step": 176872, "epoch": 1052} {"train_loss": -9.336235046386719, "global_step": 176873, "epoch": 1052} {"train_loss": -9.959686279296875, "global_step": 176874, "epoch": 1052} {"train_loss": -9.045175552368164, "global_step": 176875, "epoch": 1052} {"train_loss": -10.725227355957031, "global_step": 176876, "epoch": 1052} {"train_loss": -9.657217979431152, "global_step": 176877, "epoch": 1052} {"train_loss": -9.711347579956055, "global_step": 176878, "epoch": 1052} {"train_loss": -10.472997665405273, "global_step": 176879, "epoch": 1052} {"train_loss": -9.842281341552734, "global_step": 176880, "epoch": 1052} {"train_loss": -9.858205795288086, "global_step": 176881, "epoch": 1052} {"train_loss": -10.260587692260742, "global_step": 176882, "epoch": 1052} {"train_loss": -10.583581924438477, "global_step": 176883, "epoch": 1052} {"train_loss": -10.42322063446045, "global_step": 176884, "epoch": 1052} {"train_loss": -10.699438095092773, "global_step": 176885, "epoch": 1052} {"train_loss": -10.535685539245605, "global_step": 176886, "epoch": 1052} {"train_loss": -10.755348205566406, "global_step": 176887, "epoch": 1052} {"train_loss": -10.27833080291748, "global_step": 176888, "epoch": 1052} {"train_loss": -10.647729873657227, "global_step": 176889, "epoch": 1052} {"train_loss": -10.84123420715332, "global_step": 176890, "epoch": 1052} {"train_loss": -10.625835418701172, "global_step": 176891, "epoch": 1052} {"train_loss": -10.752584457397461, "global_step": 176892, "epoch": 1052} {"train_loss": -10.877363204956055, "global_step": 176893, "epoch": 1052} {"train_loss": -10.855213165283203, "global_step": 176894, "epoch": 1052} {"train_loss": -10.592214584350586, "global_step": 176895, "epoch": 1052} {"train_loss": -10.966264724731445, "global_step": 176896, "epoch": 1052} {"train_loss": -10.916553497314453, "global_step": 176897, "epoch": 1052} {"train_loss": -10.592121124267578, "global_step": 176898, "epoch": 1052} {"train_loss": -10.915058135986328, "global_step": 176899, "epoch": 1052} {"train_loss": -10.981910705566406, "global_step": 176900, "epoch": 1052} {"train_loss": -10.626851081848145, "global_step": 176901, "epoch": 1052} {"train_loss": -11.291497230529785, "global_step": 176902, "epoch": 1052} {"train_loss": -10.741230720565433, "global_step": 176903, "epoch": 1052, "val_loss": 236881.296875} {"train_loss": -11.099628448486328, "global_step": 176904, "epoch": 1053} {"train_loss": -11.079442024230957, "global_step": 176905, "epoch": 1053} {"train_loss": -11.1505126953125, "global_step": 176906, "epoch": 1053} {"train_loss": -11.028810501098633, "global_step": 176907, "epoch": 1053} {"train_loss": -11.163818359375, "global_step": 176908, "epoch": 1053} {"train_loss": -10.831056594848633, "global_step": 176909, "epoch": 1053} {"train_loss": -11.20511245727539, "global_step": 176910, "epoch": 1053} {"train_loss": -10.930365562438965, "global_step": 176911, "epoch": 1053} {"train_loss": -11.236515998840332, "global_step": 176912, "epoch": 1053} {"train_loss": -11.193815231323242, "global_step": 176913, "epoch": 1053} {"train_loss": -11.272858619689941, "global_step": 176914, "epoch": 1053} {"train_loss": -11.198183059692383, "global_step": 176915, "epoch": 1053} {"train_loss": -11.272342681884766, "global_step": 176916, "epoch": 1053} {"train_loss": -11.206704139709473, "global_step": 176917, "epoch": 1053} {"train_loss": -11.34531021118164, "global_step": 176918, "epoch": 1053} {"train_loss": -11.432600975036621, "global_step": 176919, "epoch": 1053} {"train_loss": -11.23220157623291, "global_step": 176920, "epoch": 1053} {"train_loss": -11.324298858642578, "global_step": 176921, "epoch": 1053} {"train_loss": -11.372516632080078, "global_step": 176922, "epoch": 1053} {"train_loss": -11.175861358642578, "global_step": 176923, "epoch": 1053} {"train_loss": -11.242685317993164, "global_step": 176924, "epoch": 1053} {"train_loss": -11.3345308303833, "global_step": 176925, "epoch": 1053} {"train_loss": -11.379375457763672, "global_step": 176926, "epoch": 1053} {"train_loss": -11.404010772705078, "global_step": 176927, "epoch": 1053} {"train_loss": -11.238256454467773, "global_step": 176928, "epoch": 1053} {"train_loss": -11.43317699432373, "global_step": 176929, "epoch": 1053} {"train_loss": -11.451604843139648, "global_step": 176930, "epoch": 1053} {"train_loss": -11.279884338378906, "global_step": 176931, "epoch": 1053} {"train_loss": -11.508645057678223, "global_step": 176932, "epoch": 1053} {"train_loss": -11.4071044921875, "global_step": 176933, "epoch": 1053} {"train_loss": -11.099985122680664, "global_step": 176934, "epoch": 1053} {"train_loss": -11.46605396270752, "global_step": 176935, "epoch": 1053} {"train_loss": -11.244869232177734, "global_step": 176936, "epoch": 1053} {"train_loss": -11.110763549804688, "global_step": 176937, "epoch": 1053} {"train_loss": -11.355387687683105, "global_step": 176938, "epoch": 1053} {"train_loss": -10.996814727783203, "global_step": 176939, "epoch": 1053} {"train_loss": -11.178984642028809, "global_step": 176940, "epoch": 1053} {"train_loss": -11.451892852783203, "global_step": 176941, "epoch": 1053} {"train_loss": -11.069722175598145, "global_step": 176942, "epoch": 1053} {"train_loss": -11.208196640014648, "global_step": 176943, "epoch": 1053} {"train_loss": -11.511119842529297, "global_step": 176944, "epoch": 1053} {"train_loss": -11.079630851745605, "global_step": 176945, "epoch": 1053} {"train_loss": -11.004209518432617, "global_step": 176946, "epoch": 1053} {"train_loss": -11.539780616760254, "global_step": 176947, "epoch": 1053} {"train_loss": -11.202274322509766, "global_step": 176948, "epoch": 1053} {"train_loss": -11.312784194946289, "global_step": 176949, "epoch": 1053} {"train_loss": -11.456228256225586, "global_step": 176950, "epoch": 1053} {"train_loss": -11.107748031616211, "global_step": 176951, "epoch": 1053} {"train_loss": -11.519438743591309, "global_step": 176952, "epoch": 1053} {"train_loss": -11.123565673828125, "global_step": 176953, "epoch": 1053} {"train_loss": -11.363759994506836, "global_step": 176954, "epoch": 1053} {"train_loss": -11.33438491821289, "global_step": 176955, "epoch": 1053} {"train_loss": -11.36046028137207, "global_step": 176956, "epoch": 1053} {"train_loss": -11.376838684082031, "global_step": 176957, "epoch": 1053} {"train_loss": -11.553749084472656, "global_step": 176958, "epoch": 1053} {"train_loss": -11.168293952941895, "global_step": 176959, "epoch": 1053} {"train_loss": -11.37537956237793, "global_step": 176960, "epoch": 1053} {"train_loss": -11.148030281066895, "global_step": 176961, "epoch": 1053} {"train_loss": -10.999991416931152, "global_step": 176962, "epoch": 1053} {"train_loss": -11.344026565551758, "global_step": 176963, "epoch": 1053} {"train_loss": -11.123798370361328, "global_step": 176964, "epoch": 1053} {"train_loss": -11.471660614013672, "global_step": 176965, "epoch": 1053} {"train_loss": -10.89785385131836, "global_step": 176966, "epoch": 1053} {"train_loss": -11.285215377807617, "global_step": 176967, "epoch": 1053} {"train_loss": -11.438913345336914, "global_step": 176968, "epoch": 1053} {"train_loss": -11.415738105773926, "global_step": 176969, "epoch": 1053} {"train_loss": -11.281285285949707, "global_step": 176970, "epoch": 1053} {"train_loss": -11.389623641967773, "global_step": 176971, "epoch": 1053} {"train_loss": -11.575252532958984, "global_step": 176972, "epoch": 1053} {"train_loss": -11.612361907958984, "global_step": 176973, "epoch": 1053} {"train_loss": -11.283151626586914, "global_step": 176974, "epoch": 1053} {"train_loss": -11.34255599975586, "global_step": 176975, "epoch": 1053} {"train_loss": -11.024749755859375, "global_step": 176976, "epoch": 1053} {"train_loss": -11.292062759399414, "global_step": 176977, "epoch": 1053} {"train_loss": -11.113351821899414, "global_step": 176978, "epoch": 1053} {"train_loss": -11.173755645751953, "global_step": 176979, "epoch": 1053} {"train_loss": -11.217964172363281, "global_step": 176980, "epoch": 1053} {"train_loss": -11.188095092773438, "global_step": 176981, "epoch": 1053} {"train_loss": -10.861238479614258, "global_step": 176982, "epoch": 1053} {"train_loss": -11.252425193786621, "global_step": 176983, "epoch": 1053} {"train_loss": -11.088090896606445, "global_step": 176984, "epoch": 1053} {"train_loss": -10.827323913574219, "global_step": 176985, "epoch": 1053} {"train_loss": -10.277363777160645, "global_step": 176986, "epoch": 1053} {"train_loss": -10.377365112304688, "global_step": 176987, "epoch": 1053} {"train_loss": -10.578936576843262, "global_step": 176988, "epoch": 1053} {"train_loss": -10.445449829101562, "global_step": 176989, "epoch": 1053} {"train_loss": -10.618159294128418, "global_step": 176990, "epoch": 1053} {"train_loss": -10.8469820022583, "global_step": 176991, "epoch": 1053} {"train_loss": -10.954352378845215, "global_step": 176992, "epoch": 1053} {"train_loss": -10.79496955871582, "global_step": 176993, "epoch": 1053} {"train_loss": -11.180389404296875, "global_step": 176994, "epoch": 1053} {"train_loss": -11.001343727111816, "global_step": 176995, "epoch": 1053} {"train_loss": -10.738358497619629, "global_step": 176996, "epoch": 1053} {"train_loss": -10.727188110351562, "global_step": 176997, "epoch": 1053} {"train_loss": -10.948458671569824, "global_step": 176998, "epoch": 1053} {"train_loss": -10.85217571258545, "global_step": 176999, "epoch": 1053} {"train_loss": -10.736722946166992, "global_step": 177000, "epoch": 1053} {"train_loss": -10.903639793395996, "global_step": 177001, "epoch": 1053} {"train_loss": -9.956865310668945, "global_step": 177002, "epoch": 1053} {"train_loss": -10.862838745117188, "global_step": 177003, "epoch": 1053} {"train_loss": -9.963495254516602, "global_step": 177004, "epoch": 1053} {"train_loss": -10.818869590759277, "global_step": 177005, "epoch": 1053} {"train_loss": -10.433269500732422, "global_step": 177006, "epoch": 1053} {"train_loss": -10.472640037536621, "global_step": 177007, "epoch": 1053} {"train_loss": -10.693607330322266, "global_step": 177008, "epoch": 1053} {"train_loss": -10.153450965881348, "global_step": 177009, "epoch": 1053} {"train_loss": -10.774906158447266, "global_step": 177010, "epoch": 1053} {"train_loss": -10.803465843200684, "global_step": 177011, "epoch": 1053} {"train_loss": -10.603751182556152, "global_step": 177012, "epoch": 1053} {"train_loss": -10.997780799865723, "global_step": 177013, "epoch": 1053} {"train_loss": -10.503564834594727, "global_step": 177014, "epoch": 1053} {"train_loss": -10.529447555541992, "global_step": 177015, "epoch": 1053} {"train_loss": -10.575834274291992, "global_step": 177016, "epoch": 1053} {"train_loss": -10.69826889038086, "global_step": 177017, "epoch": 1053} {"train_loss": -10.782325744628906, "global_step": 177018, "epoch": 1053} {"train_loss": -10.333348274230957, "global_step": 177019, "epoch": 1053} {"train_loss": -10.981124877929688, "global_step": 177020, "epoch": 1053} {"train_loss": -10.871463775634766, "global_step": 177021, "epoch": 1053} {"train_loss": -10.8885498046875, "global_step": 177022, "epoch": 1053} {"train_loss": -10.900019645690918, "global_step": 177023, "epoch": 1053} {"train_loss": -10.861106872558594, "global_step": 177024, "epoch": 1053} {"train_loss": -10.948995590209961, "global_step": 177025, "epoch": 1053} {"train_loss": -10.893428802490234, "global_step": 177026, "epoch": 1053} {"train_loss": -10.991336822509766, "global_step": 177027, "epoch": 1053} {"train_loss": -10.82349967956543, "global_step": 177028, "epoch": 1053} {"train_loss": -10.843533515930176, "global_step": 177029, "epoch": 1053} {"train_loss": -11.24681282043457, "global_step": 177030, "epoch": 1053} {"train_loss": -11.017016410827637, "global_step": 177031, "epoch": 1053} {"train_loss": -11.04163646697998, "global_step": 177032, "epoch": 1053} {"train_loss": -10.969186782836914, "global_step": 177033, "epoch": 1053} {"train_loss": -11.12005615234375, "global_step": 177034, "epoch": 1053} {"train_loss": -10.86009407043457, "global_step": 177035, "epoch": 1053} {"train_loss": -11.108473777770996, "global_step": 177036, "epoch": 1053} {"train_loss": -10.892850875854492, "global_step": 177037, "epoch": 1053} {"train_loss": -11.032720565795898, "global_step": 177038, "epoch": 1053} {"train_loss": -11.180530548095703, "global_step": 177039, "epoch": 1053} {"train_loss": -10.87171745300293, "global_step": 177040, "epoch": 1053} {"train_loss": -11.110420227050781, "global_step": 177041, "epoch": 1053} {"train_loss": -11.262417793273926, "global_step": 177042, "epoch": 1053} {"train_loss": -11.096485137939453, "global_step": 177043, "epoch": 1053} {"train_loss": -10.891511917114258, "global_step": 177044, "epoch": 1053} {"train_loss": -11.344066619873047, "global_step": 177045, "epoch": 1053} {"train_loss": -10.983352661132812, "global_step": 177046, "epoch": 1053} {"train_loss": -11.30317497253418, "global_step": 177047, "epoch": 1053} {"train_loss": -11.188812255859375, "global_step": 177048, "epoch": 1053} {"train_loss": -11.067306518554688, "global_step": 177049, "epoch": 1053} {"train_loss": -11.27595043182373, "global_step": 177050, "epoch": 1053} {"train_loss": -11.060218811035156, "global_step": 177051, "epoch": 1053} {"train_loss": -11.133905410766602, "global_step": 177052, "epoch": 1053} {"train_loss": -11.04248046875, "global_step": 177053, "epoch": 1053} {"train_loss": -11.418594360351562, "global_step": 177054, "epoch": 1053} {"train_loss": -11.229541778564453, "global_step": 177055, "epoch": 1053} {"train_loss": -11.137683868408203, "global_step": 177056, "epoch": 1053} {"train_loss": -10.84273910522461, "global_step": 177057, "epoch": 1053} {"train_loss": -11.422598838806152, "global_step": 177058, "epoch": 1053} {"train_loss": -11.341886520385742, "global_step": 177059, "epoch": 1053} {"train_loss": -11.415448188781738, "global_step": 177060, "epoch": 1053} {"train_loss": -11.357820510864258, "global_step": 177061, "epoch": 1053} {"train_loss": -11.09904670715332, "global_step": 177062, "epoch": 1053} {"train_loss": -11.323159217834473, "global_step": 177063, "epoch": 1053} {"train_loss": -11.28415298461914, "global_step": 177064, "epoch": 1053} {"train_loss": -10.877065658569336, "global_step": 177065, "epoch": 1053} {"train_loss": -11.142143249511719, "global_step": 177066, "epoch": 1053} {"train_loss": -11.247135162353516, "global_step": 177067, "epoch": 1053} {"train_loss": -11.470499992370605, "global_step": 177068, "epoch": 1053} {"train_loss": -11.289226531982422, "global_step": 177069, "epoch": 1053} {"train_loss": -11.416255950927734, "global_step": 177070, "epoch": 1053} {"train_loss": -11.085767501876468, "global_step": 177071, "epoch": 1053, "val_loss": 242086.234375} {"train_loss": -11.041618347167969, "global_step": 177072, "epoch": 1054} {"train_loss": -11.552693367004395, "global_step": 177073, "epoch": 1054} {"train_loss": -11.41864013671875, "global_step": 177074, "epoch": 1054} {"train_loss": -11.442032814025879, "global_step": 177075, "epoch": 1054} {"train_loss": -11.210329055786133, "global_step": 177076, "epoch": 1054} {"train_loss": -11.17432975769043, "global_step": 177077, "epoch": 1054} {"train_loss": -10.85753059387207, "global_step": 177078, "epoch": 1054} {"train_loss": -11.060989379882812, "global_step": 177079, "epoch": 1054} {"train_loss": -11.027885437011719, "global_step": 177080, "epoch": 1054} {"train_loss": -10.483170509338379, "global_step": 177081, "epoch": 1054} {"train_loss": -10.398460388183594, "global_step": 177082, "epoch": 1054} {"train_loss": -11.332006454467773, "global_step": 177083, "epoch": 1054} {"train_loss": -10.404467582702637, "global_step": 177084, "epoch": 1054} {"train_loss": -10.719728469848633, "global_step": 177085, "epoch": 1054} {"train_loss": -10.754547119140625, "global_step": 177086, "epoch": 1054} {"train_loss": -10.973490715026855, "global_step": 177087, "epoch": 1054} {"train_loss": -10.76148796081543, "global_step": 177088, "epoch": 1054} {"train_loss": -11.254121780395508, "global_step": 177089, "epoch": 1054} {"train_loss": -11.003568649291992, "global_step": 177090, "epoch": 1054} {"train_loss": -11.291509628295898, "global_step": 177091, "epoch": 1054} {"train_loss": -11.397878646850586, "global_step": 177092, "epoch": 1054} {"train_loss": -10.889331817626953, "global_step": 177093, "epoch": 1054} {"train_loss": -11.12601089477539, "global_step": 177094, "epoch": 1054} {"train_loss": -11.221868515014648, "global_step": 177095, "epoch": 1054} {"train_loss": -11.507515907287598, "global_step": 177096, "epoch": 1054} {"train_loss": -11.187505722045898, "global_step": 177097, "epoch": 1054} {"train_loss": -10.511510848999023, "global_step": 177098, "epoch": 1054} {"train_loss": -11.024517059326172, "global_step": 177099, "epoch": 1054} {"train_loss": -10.804204940795898, "global_step": 177100, "epoch": 1054} {"train_loss": -11.211246490478516, "global_step": 177101, "epoch": 1054} {"train_loss": -10.89866828918457, "global_step": 177102, "epoch": 1054} {"train_loss": -10.815298080444336, "global_step": 177103, "epoch": 1054} {"train_loss": -11.167057037353516, "global_step": 177104, "epoch": 1054} {"train_loss": -11.034351348876953, "global_step": 177105, "epoch": 1054} {"train_loss": -10.571066856384277, "global_step": 177106, "epoch": 1054} {"train_loss": -10.674474716186523, "global_step": 177107, "epoch": 1054} {"train_loss": -11.082866668701172, "global_step": 177108, "epoch": 1054} {"train_loss": -10.4266357421875, "global_step": 177109, "epoch": 1054} {"train_loss": -11.264348983764648, "global_step": 177110, "epoch": 1054} {"train_loss": -10.705022811889648, "global_step": 177111, "epoch": 1054} {"train_loss": -10.891399383544922, "global_step": 177112, "epoch": 1054} {"train_loss": -11.150847434997559, "global_step": 177113, "epoch": 1054} {"train_loss": -10.82778549194336, "global_step": 177114, "epoch": 1054} {"train_loss": -11.255514144897461, "global_step": 177115, "epoch": 1054} {"train_loss": -10.883419036865234, "global_step": 177116, "epoch": 1054} {"train_loss": -10.98617172241211, "global_step": 177117, "epoch": 1054} {"train_loss": -11.099458694458008, "global_step": 177118, "epoch": 1054} {"train_loss": -10.840728759765625, "global_step": 177119, "epoch": 1054} {"train_loss": -10.713868141174316, "global_step": 177120, "epoch": 1054} {"train_loss": -11.190271377563477, "global_step": 177121, "epoch": 1054} {"train_loss": -10.742730140686035, "global_step": 177122, "epoch": 1054} {"train_loss": -11.327260971069336, "global_step": 177123, "epoch": 1054} {"train_loss": -10.931182861328125, "global_step": 177124, "epoch": 1054} {"train_loss": -11.220518112182617, "global_step": 177125, "epoch": 1054} {"train_loss": -10.473884582519531, "global_step": 177126, "epoch": 1054} {"train_loss": -10.747103691101074, "global_step": 177127, "epoch": 1054} {"train_loss": -10.19415283203125, "global_step": 177128, "epoch": 1054} {"train_loss": -10.807340621948242, "global_step": 177129, "epoch": 1054} {"train_loss": -9.345821380615234, "global_step": 177130, "epoch": 1054} {"train_loss": -10.412131309509277, "global_step": 177131, "epoch": 1054} {"train_loss": -10.231078147888184, "global_step": 177132, "epoch": 1054} {"train_loss": -9.969512939453125, "global_step": 177133, "epoch": 1054} {"train_loss": -9.80699348449707, "global_step": 177134, "epoch": 1054} {"train_loss": -10.344239234924316, "global_step": 177135, "epoch": 1054} {"train_loss": -10.555058479309082, "global_step": 177136, "epoch": 1054} {"train_loss": -9.466540336608887, "global_step": 177137, "epoch": 1054} {"train_loss": -10.473627090454102, "global_step": 177138, "epoch": 1054} {"train_loss": -9.880721092224121, "global_step": 177139, "epoch": 1054} {"train_loss": -10.784460067749023, "global_step": 177140, "epoch": 1054} {"train_loss": -10.025642395019531, "global_step": 177141, "epoch": 1054} {"train_loss": -10.539045333862305, "global_step": 177142, "epoch": 1054} {"train_loss": -9.911209106445312, "global_step": 177143, "epoch": 1054} {"train_loss": -10.738485336303711, "global_step": 177144, "epoch": 1054} {"train_loss": -10.146318435668945, "global_step": 177145, "epoch": 1054} {"train_loss": -10.683860778808594, "global_step": 177146, "epoch": 1054} {"train_loss": -10.272624969482422, "global_step": 177147, "epoch": 1054} {"train_loss": -10.695085525512695, "global_step": 177148, "epoch": 1054} {"train_loss": -10.464086532592773, "global_step": 177149, "epoch": 1054} {"train_loss": -9.928319931030273, "global_step": 177150, "epoch": 1054} {"train_loss": -10.846900939941406, "global_step": 177151, "epoch": 1054} {"train_loss": -9.892959594726562, "global_step": 177152, "epoch": 1054} {"train_loss": -10.72724723815918, "global_step": 177153, "epoch": 1054} {"train_loss": -10.468342781066895, "global_step": 177154, "epoch": 1054} {"train_loss": -10.777996063232422, "global_step": 177155, "epoch": 1054} {"train_loss": -10.82441520690918, "global_step": 177156, "epoch": 1054} {"train_loss": -10.890480995178223, "global_step": 177157, "epoch": 1054} {"train_loss": -10.523287773132324, "global_step": 177158, "epoch": 1054} {"train_loss": -10.680970191955566, "global_step": 177159, "epoch": 1054} {"train_loss": -10.853667259216309, "global_step": 177160, "epoch": 1054} {"train_loss": -10.621517181396484, "global_step": 177161, "epoch": 1054} {"train_loss": -10.770844459533691, "global_step": 177162, "epoch": 1054} {"train_loss": -11.087484359741211, "global_step": 177163, "epoch": 1054} {"train_loss": -10.7354736328125, "global_step": 177164, "epoch": 1054} {"train_loss": -11.08914852142334, "global_step": 177165, "epoch": 1054} {"train_loss": -10.8807373046875, "global_step": 177166, "epoch": 1054} {"train_loss": -10.93648624420166, "global_step": 177167, "epoch": 1054} {"train_loss": -11.02639389038086, "global_step": 177168, "epoch": 1054} {"train_loss": -11.180220603942871, "global_step": 177169, "epoch": 1054} {"train_loss": -11.05348014831543, "global_step": 177170, "epoch": 1054} {"train_loss": -11.160258293151855, "global_step": 177171, "epoch": 1054} {"train_loss": -11.119465827941895, "global_step": 177172, "epoch": 1054} {"train_loss": -11.04442024230957, "global_step": 177173, "epoch": 1054} {"train_loss": -11.213237762451172, "global_step": 177174, "epoch": 1054} {"train_loss": -10.983352661132812, "global_step": 177175, "epoch": 1054} {"train_loss": -11.106775283813477, "global_step": 177176, "epoch": 1054} {"train_loss": -11.07455062866211, "global_step": 177177, "epoch": 1054} {"train_loss": -11.166601181030273, "global_step": 177178, "epoch": 1054} {"train_loss": -10.917742729187012, "global_step": 177179, "epoch": 1054} {"train_loss": -11.334442138671875, "global_step": 177180, "epoch": 1054} {"train_loss": -11.129507064819336, "global_step": 177181, "epoch": 1054} {"train_loss": -11.190210342407227, "global_step": 177182, "epoch": 1054} {"train_loss": -11.185306549072266, "global_step": 177183, "epoch": 1054} {"train_loss": -11.08523941040039, "global_step": 177184, "epoch": 1054} {"train_loss": -11.336493492126465, "global_step": 177185, "epoch": 1054} {"train_loss": -11.102277755737305, "global_step": 177186, "epoch": 1054} {"train_loss": -11.032461166381836, "global_step": 177187, "epoch": 1054} {"train_loss": -11.152924537658691, "global_step": 177188, "epoch": 1054} {"train_loss": -10.974882125854492, "global_step": 177189, "epoch": 1054} {"train_loss": -11.146103858947754, "global_step": 177190, "epoch": 1054} {"train_loss": -10.983314514160156, "global_step": 177191, "epoch": 1054} {"train_loss": -11.068571090698242, "global_step": 177192, "epoch": 1054} {"train_loss": -11.123955726623535, "global_step": 177193, "epoch": 1054} {"train_loss": -11.068058013916016, "global_step": 177194, "epoch": 1054} {"train_loss": -11.136466979980469, "global_step": 177195, "epoch": 1054} {"train_loss": -11.112646102905273, "global_step": 177196, "epoch": 1054} {"train_loss": -11.121408462524414, "global_step": 177197, "epoch": 1054} {"train_loss": -11.217809677124023, "global_step": 177198, "epoch": 1054} {"train_loss": -11.062089920043945, "global_step": 177199, "epoch": 1054} {"train_loss": -11.594985961914062, "global_step": 177200, "epoch": 1054} {"train_loss": -10.995038986206055, "global_step": 177201, "epoch": 1054} {"train_loss": -11.047428131103516, "global_step": 177202, "epoch": 1054} {"train_loss": -11.16304874420166, "global_step": 177203, "epoch": 1054} {"train_loss": -10.9909029006958, "global_step": 177204, "epoch": 1054} {"train_loss": -11.41815185546875, "global_step": 177205, "epoch": 1054} {"train_loss": -10.889479637145996, "global_step": 177206, "epoch": 1054} {"train_loss": -11.102213859558105, "global_step": 177207, "epoch": 1054} {"train_loss": -11.198795318603516, "global_step": 177208, "epoch": 1054} {"train_loss": -11.394240379333496, "global_step": 177209, "epoch": 1054} {"train_loss": -11.300788879394531, "global_step": 177210, "epoch": 1054} {"train_loss": -11.000711441040039, "global_step": 177211, "epoch": 1054} {"train_loss": -11.047330856323242, "global_step": 177212, "epoch": 1054} {"train_loss": -11.404403686523438, "global_step": 177213, "epoch": 1054} {"train_loss": -11.491313934326172, "global_step": 177214, "epoch": 1054} {"train_loss": -10.952703475952148, "global_step": 177215, "epoch": 1054} {"train_loss": -11.226259231567383, "global_step": 177216, "epoch": 1054} {"train_loss": -11.019509315490723, "global_step": 177217, "epoch": 1054} {"train_loss": -11.423467636108398, "global_step": 177218, "epoch": 1054} {"train_loss": -11.053970336914062, "global_step": 177219, "epoch": 1054} {"train_loss": -11.322837829589844, "global_step": 177220, "epoch": 1054} {"train_loss": -11.363030433654785, "global_step": 177221, "epoch": 1054} {"train_loss": -11.155933380126953, "global_step": 177222, "epoch": 1054} {"train_loss": -11.379205703735352, "global_step": 177223, "epoch": 1054} {"train_loss": -11.094399452209473, "global_step": 177224, "epoch": 1054} {"train_loss": -11.381233215332031, "global_step": 177225, "epoch": 1054} {"train_loss": -11.127608299255371, "global_step": 177226, "epoch": 1054} {"train_loss": -11.484983444213867, "global_step": 177227, "epoch": 1054} {"train_loss": -11.209576606750488, "global_step": 177228, "epoch": 1054} {"train_loss": -11.106986999511719, "global_step": 177229, "epoch": 1054} {"train_loss": -10.929786682128906, "global_step": 177230, "epoch": 1054} {"train_loss": -11.014876365661621, "global_step": 177231, "epoch": 1054} {"train_loss": -10.976659774780273, "global_step": 177232, "epoch": 1054} {"train_loss": -11.187541961669922, "global_step": 177233, "epoch": 1054} {"train_loss": -11.02028751373291, "global_step": 177234, "epoch": 1054} {"train_loss": -10.274953842163086, "global_step": 177235, "epoch": 1054} {"train_loss": -10.96269416809082, "global_step": 177236, "epoch": 1054} {"train_loss": -10.718871116638184, "global_step": 177237, "epoch": 1054} {"train_loss": -10.074202537536621, "global_step": 177238, "epoch": 1054} {"train_loss": -10.913766804195586, "global_step": 177239, "epoch": 1054, "val_loss": 242042.375} {"train_loss": -9.492361068725586, "global_step": 177240, "epoch": 1055} {"train_loss": -10.757351875305176, "global_step": 177241, "epoch": 1055} {"train_loss": -10.066402435302734, "global_step": 177242, "epoch": 1055} {"train_loss": -10.017317771911621, "global_step": 177243, "epoch": 1055} {"train_loss": -10.375531196594238, "global_step": 177244, "epoch": 1055} {"train_loss": -9.094487190246582, "global_step": 177245, "epoch": 1055} {"train_loss": -11.058342933654785, "global_step": 177246, "epoch": 1055} {"train_loss": -9.462553024291992, "global_step": 177247, "epoch": 1055} {"train_loss": -10.721342086791992, "global_step": 177248, "epoch": 1055} {"train_loss": -10.589425086975098, "global_step": 177249, "epoch": 1055} {"train_loss": -9.836313247680664, "global_step": 177250, "epoch": 1055} {"train_loss": -11.077730178833008, "global_step": 177251, "epoch": 1055} {"train_loss": -10.347225189208984, "global_step": 177252, "epoch": 1055} {"train_loss": -10.904282569885254, "global_step": 177253, "epoch": 1055} {"train_loss": -10.746450424194336, "global_step": 177254, "epoch": 1055} {"train_loss": -11.013469696044922, "global_step": 177255, "epoch": 1055} {"train_loss": -10.312914848327637, "global_step": 177256, "epoch": 1055} {"train_loss": -11.124552726745605, "global_step": 177257, "epoch": 1055} {"train_loss": -10.197595596313477, "global_step": 177258, "epoch": 1055} {"train_loss": -10.825521469116211, "global_step": 177259, "epoch": 1055} {"train_loss": -10.672805786132812, "global_step": 177260, "epoch": 1055} {"train_loss": -10.793073654174805, "global_step": 177261, "epoch": 1055} {"train_loss": -10.867790222167969, "global_step": 177262, "epoch": 1055} {"train_loss": -10.994569778442383, "global_step": 177263, "epoch": 1055} {"train_loss": -10.92524242401123, "global_step": 177264, "epoch": 1055} {"train_loss": -10.930537223815918, "global_step": 177265, "epoch": 1055} {"train_loss": -11.122027397155762, "global_step": 177266, "epoch": 1055} {"train_loss": -11.044511795043945, "global_step": 177267, "epoch": 1055} {"train_loss": -11.137584686279297, "global_step": 177268, "epoch": 1055} {"train_loss": -11.169770240783691, "global_step": 177269, "epoch": 1055} {"train_loss": -11.011430740356445, "global_step": 177270, "epoch": 1055} {"train_loss": -10.936100006103516, "global_step": 177271, "epoch": 1055} {"train_loss": -11.093006134033203, "global_step": 177272, "epoch": 1055} {"train_loss": -11.156601905822754, "global_step": 177273, "epoch": 1055} {"train_loss": -11.112117767333984, "global_step": 177274, "epoch": 1055} {"train_loss": -11.298885345458984, "global_step": 177275, "epoch": 1055} {"train_loss": -11.037160873413086, "global_step": 177276, "epoch": 1055} {"train_loss": -11.175017356872559, "global_step": 177277, "epoch": 1055} {"train_loss": -11.252494812011719, "global_step": 177278, "epoch": 1055} {"train_loss": -11.125391006469727, "global_step": 177279, "epoch": 1055} {"train_loss": -11.106500625610352, "global_step": 177280, "epoch": 1055} {"train_loss": -11.063743591308594, "global_step": 177281, "epoch": 1055} {"train_loss": -11.3499755859375, "global_step": 177282, "epoch": 1055} {"train_loss": -11.145708084106445, "global_step": 177283, "epoch": 1055} {"train_loss": -11.256965637207031, "global_step": 177284, "epoch": 1055} {"train_loss": -11.29645824432373, "global_step": 177285, "epoch": 1055} {"train_loss": -11.232932090759277, "global_step": 177286, "epoch": 1055} {"train_loss": -11.429474830627441, "global_step": 177287, "epoch": 1055} {"train_loss": -11.269561767578125, "global_step": 177288, "epoch": 1055} {"train_loss": -11.069487571716309, "global_step": 177289, "epoch": 1055} {"train_loss": -11.105364799499512, "global_step": 177290, "epoch": 1055} {"train_loss": -11.091747283935547, "global_step": 177291, "epoch": 1055} {"train_loss": -11.016997337341309, "global_step": 177292, "epoch": 1055} {"train_loss": -11.302694320678711, "global_step": 177293, "epoch": 1055} {"train_loss": -11.190635681152344, "global_step": 177294, "epoch": 1055} {"train_loss": -11.106908798217773, "global_step": 177295, "epoch": 1055} {"train_loss": -11.317763328552246, "global_step": 177296, "epoch": 1055} {"train_loss": -11.533889770507812, "global_step": 177297, "epoch": 1055} {"train_loss": -11.283323287963867, "global_step": 177298, "epoch": 1055} {"train_loss": -11.30758285522461, "global_step": 177299, "epoch": 1055} {"train_loss": -11.269660949707031, "global_step": 177300, "epoch": 1055} {"train_loss": -11.223913192749023, "global_step": 177301, "epoch": 1055} {"train_loss": -11.370563507080078, "global_step": 177302, "epoch": 1055} {"train_loss": -11.59848403930664, "global_step": 177303, "epoch": 1055} {"train_loss": -11.291054725646973, "global_step": 177304, "epoch": 1055} {"train_loss": -11.448748588562012, "global_step": 177305, "epoch": 1055} {"train_loss": -11.178016662597656, "global_step": 177306, "epoch": 1055} {"train_loss": -11.37594985961914, "global_step": 177307, "epoch": 1055} {"train_loss": -11.406761169433594, "global_step": 177308, "epoch": 1055} {"train_loss": -11.305879592895508, "global_step": 177309, "epoch": 1055} {"train_loss": -11.448312759399414, "global_step": 177310, "epoch": 1055} {"train_loss": -11.340600967407227, "global_step": 177311, "epoch": 1055} {"train_loss": -11.408021926879883, "global_step": 177312, "epoch": 1055} {"train_loss": -11.190074920654297, "global_step": 177313, "epoch": 1055} {"train_loss": -11.427502632141113, "global_step": 177314, "epoch": 1055} {"train_loss": -11.459979057312012, "global_step": 177315, "epoch": 1055} {"train_loss": -11.388090133666992, "global_step": 177316, "epoch": 1055} {"train_loss": -11.360815048217773, "global_step": 177317, "epoch": 1055} {"train_loss": -11.42308235168457, "global_step": 177318, "epoch": 1055} {"train_loss": -11.265019416809082, "global_step": 177319, "epoch": 1055} {"train_loss": -11.076444625854492, "global_step": 177320, "epoch": 1055} {"train_loss": -10.551652908325195, "global_step": 177321, "epoch": 1055} {"train_loss": -10.962690353393555, "global_step": 177322, "epoch": 1055} {"train_loss": -11.04774284362793, "global_step": 177323, "epoch": 1055} {"train_loss": -10.528553009033203, "global_step": 177324, "epoch": 1055} {"train_loss": -10.896108627319336, "global_step": 177325, "epoch": 1055} {"train_loss": -11.130205154418945, "global_step": 177326, "epoch": 1055} {"train_loss": -9.646308898925781, "global_step": 177327, "epoch": 1055} {"train_loss": -10.25583267211914, "global_step": 177328, "epoch": 1055} {"train_loss": -10.744922637939453, "global_step": 177329, "epoch": 1055} {"train_loss": -10.710694313049316, "global_step": 177330, "epoch": 1055} {"train_loss": -10.812483787536621, "global_step": 177331, "epoch": 1055} {"train_loss": -10.962653160095215, "global_step": 177332, "epoch": 1055} {"train_loss": -11.388631820678711, "global_step": 177333, "epoch": 1055} {"train_loss": -10.767642974853516, "global_step": 177334, "epoch": 1055} {"train_loss": -10.924973487854004, "global_step": 177335, "epoch": 1055} {"train_loss": -10.565223693847656, "global_step": 177336, "epoch": 1055} {"train_loss": -9.846673965454102, "global_step": 177337, "epoch": 1055} {"train_loss": -10.806182861328125, "global_step": 177338, "epoch": 1055} {"train_loss": -9.616759300231934, "global_step": 177339, "epoch": 1055} {"train_loss": -10.307878494262695, "global_step": 177340, "epoch": 1055} {"train_loss": -10.085602760314941, "global_step": 177341, "epoch": 1055} {"train_loss": -9.973225593566895, "global_step": 177342, "epoch": 1055} {"train_loss": -10.618629455566406, "global_step": 177343, "epoch": 1055} {"train_loss": -8.851455688476562, "global_step": 177344, "epoch": 1055} {"train_loss": -10.598906517028809, "global_step": 177345, "epoch": 1055} {"train_loss": -9.289932250976562, "global_step": 177346, "epoch": 1055} {"train_loss": -10.679706573486328, "global_step": 177347, "epoch": 1055} {"train_loss": -9.274128913879395, "global_step": 177348, "epoch": 1055} {"train_loss": -10.738048553466797, "global_step": 177349, "epoch": 1055} {"train_loss": -9.072492599487305, "global_step": 177350, "epoch": 1055} {"train_loss": -10.632277488708496, "global_step": 177351, "epoch": 1055} {"train_loss": -9.788881301879883, "global_step": 177352, "epoch": 1055} {"train_loss": -10.738425254821777, "global_step": 177353, "epoch": 1055} {"train_loss": -9.56704330444336, "global_step": 177354, "epoch": 1055} {"train_loss": -10.460916519165039, "global_step": 177355, "epoch": 1055} {"train_loss": -10.570478439331055, "global_step": 177356, "epoch": 1055} {"train_loss": -10.329668998718262, "global_step": 177357, "epoch": 1055} {"train_loss": -10.367687225341797, "global_step": 177358, "epoch": 1055} {"train_loss": -10.689931869506836, "global_step": 177359, "epoch": 1055} {"train_loss": -10.618131637573242, "global_step": 177360, "epoch": 1055} {"train_loss": -10.217957496643066, "global_step": 177361, "epoch": 1055} {"train_loss": -10.653055191040039, "global_step": 177362, "epoch": 1055} {"train_loss": -10.569563865661621, "global_step": 177363, "epoch": 1055} {"train_loss": -10.080793380737305, "global_step": 177364, "epoch": 1055} {"train_loss": -11.048097610473633, "global_step": 177365, "epoch": 1055} {"train_loss": -10.659879684448242, "global_step": 177366, "epoch": 1055} {"train_loss": -10.505108833312988, "global_step": 177367, "epoch": 1055} {"train_loss": -10.87574577331543, "global_step": 177368, "epoch": 1055} {"train_loss": -10.385324478149414, "global_step": 177369, "epoch": 1055} {"train_loss": -10.783674240112305, "global_step": 177370, "epoch": 1055} {"train_loss": -10.828975677490234, "global_step": 177371, "epoch": 1055} {"train_loss": -11.035297393798828, "global_step": 177372, "epoch": 1055} {"train_loss": -10.621528625488281, "global_step": 177373, "epoch": 1055} {"train_loss": -10.608835220336914, "global_step": 177374, "epoch": 1055} {"train_loss": -11.034192085266113, "global_step": 177375, "epoch": 1055} {"train_loss": -10.59239673614502, "global_step": 177376, "epoch": 1055} {"train_loss": -10.989023208618164, "global_step": 177377, "epoch": 1055} {"train_loss": -10.971057891845703, "global_step": 177378, "epoch": 1055} {"train_loss": -10.79699420928955, "global_step": 177379, "epoch": 1055} {"train_loss": -11.149920463562012, "global_step": 177380, "epoch": 1055} {"train_loss": -11.122550964355469, "global_step": 177381, "epoch": 1055} {"train_loss": -10.976680755615234, "global_step": 177382, "epoch": 1055} {"train_loss": -11.056947708129883, "global_step": 177383, "epoch": 1055} {"train_loss": -11.152956008911133, "global_step": 177384, "epoch": 1055} {"train_loss": -11.047262191772461, "global_step": 177385, "epoch": 1055} {"train_loss": -10.915916442871094, "global_step": 177386, "epoch": 1055} {"train_loss": -11.176079750061035, "global_step": 177387, "epoch": 1055} {"train_loss": -11.025152206420898, "global_step": 177388, "epoch": 1055} {"train_loss": -11.030176162719727, "global_step": 177389, "epoch": 1055} {"train_loss": -11.237019538879395, "global_step": 177390, "epoch": 1055} {"train_loss": -11.336523056030273, "global_step": 177391, "epoch": 1055} {"train_loss": -11.26587963104248, "global_step": 177392, "epoch": 1055} {"train_loss": -11.128864288330078, "global_step": 177393, "epoch": 1055} {"train_loss": -11.248429298400879, "global_step": 177394, "epoch": 1055} {"train_loss": -11.255353927612305, "global_step": 177395, "epoch": 1055} {"train_loss": -11.19509220123291, "global_step": 177396, "epoch": 1055} {"train_loss": -11.270109176635742, "global_step": 177397, "epoch": 1055} {"train_loss": -11.225765228271484, "global_step": 177398, "epoch": 1055} {"train_loss": -11.389949798583984, "global_step": 177399, "epoch": 1055} {"train_loss": -11.408583641052246, "global_step": 177400, "epoch": 1055} {"train_loss": -11.352367401123047, "global_step": 177401, "epoch": 1055} {"train_loss": -11.138799667358398, "global_step": 177402, "epoch": 1055} {"train_loss": -11.287432670593262, "global_step": 177403, "epoch": 1055} {"train_loss": -11.460354804992676, "global_step": 177404, "epoch": 1055} {"train_loss": -11.386240005493164, "global_step": 177405, "epoch": 1055} {"train_loss": -11.332807540893555, "global_step": 177406, "epoch": 1055} {"train_loss": -10.859020306950523, "global_step": 177407, "epoch": 1055, "val_loss": 241192.375, "train_action_mse_error": 2.438239574432373} {"train_loss": -11.289275169372559, "global_step": 177408, "epoch": 1056} {"train_loss": -11.413856506347656, "global_step": 177409, "epoch": 1056} {"train_loss": -11.157356262207031, "global_step": 177410, "epoch": 1056} {"train_loss": -11.542215347290039, "global_step": 177411, "epoch": 1056} {"train_loss": -11.416996955871582, "global_step": 177412, "epoch": 1056} {"train_loss": -11.467704772949219, "global_step": 177413, "epoch": 1056} {"train_loss": -11.524821281433105, "global_step": 177414, "epoch": 1056} {"train_loss": -11.500253677368164, "global_step": 177415, "epoch": 1056} {"train_loss": -11.387115478515625, "global_step": 177416, "epoch": 1056} {"train_loss": -11.567239761352539, "global_step": 177417, "epoch": 1056} {"train_loss": -11.573984146118164, "global_step": 177418, "epoch": 1056} {"train_loss": -11.740715980529785, "global_step": 177419, "epoch": 1056} {"train_loss": -11.680469512939453, "global_step": 177420, "epoch": 1056} {"train_loss": -11.436522483825684, "global_step": 177421, "epoch": 1056} {"train_loss": -11.610413551330566, "global_step": 177422, "epoch": 1056} {"train_loss": -11.819686889648438, "global_step": 177423, "epoch": 1056} {"train_loss": -11.411515235900879, "global_step": 177424, "epoch": 1056} {"train_loss": -11.285112380981445, "global_step": 177425, "epoch": 1056} {"train_loss": -11.150053024291992, "global_step": 177426, "epoch": 1056} {"train_loss": -11.215143203735352, "global_step": 177427, "epoch": 1056} {"train_loss": -10.97937297821045, "global_step": 177428, "epoch": 1056} {"train_loss": -10.757650375366211, "global_step": 177429, "epoch": 1056} {"train_loss": -10.977347373962402, "global_step": 177430, "epoch": 1056} {"train_loss": -11.210832595825195, "global_step": 177431, "epoch": 1056} {"train_loss": -11.578519821166992, "global_step": 177432, "epoch": 1056} {"train_loss": -11.247529029846191, "global_step": 177433, "epoch": 1056} {"train_loss": -10.663817405700684, "global_step": 177434, "epoch": 1056} {"train_loss": -10.797046661376953, "global_step": 177435, "epoch": 1056} {"train_loss": -11.013126373291016, "global_step": 177436, "epoch": 1056} {"train_loss": -10.649825096130371, "global_step": 177437, "epoch": 1056} {"train_loss": -10.457110404968262, "global_step": 177438, "epoch": 1056} {"train_loss": -10.885909080505371, "global_step": 177439, "epoch": 1056} {"train_loss": -11.740748405456543, "global_step": 177440, "epoch": 1056} {"train_loss": -11.334746360778809, "global_step": 177441, "epoch": 1056} {"train_loss": -11.282692909240723, "global_step": 177442, "epoch": 1056} {"train_loss": -11.214653015136719, "global_step": 177443, "epoch": 1056} {"train_loss": -11.333137512207031, "global_step": 177444, "epoch": 1056} {"train_loss": -10.965036392211914, "global_step": 177445, "epoch": 1056} {"train_loss": -11.376500129699707, "global_step": 177446, "epoch": 1056} {"train_loss": -11.319965362548828, "global_step": 177447, "epoch": 1056} {"train_loss": -11.144468307495117, "global_step": 177448, "epoch": 1056} {"train_loss": -11.164079666137695, "global_step": 177449, "epoch": 1056} {"train_loss": -11.516648292541504, "global_step": 177450, "epoch": 1056} {"train_loss": -10.759488105773926, "global_step": 177451, "epoch": 1056} {"train_loss": -11.202717781066895, "global_step": 177452, "epoch": 1056} {"train_loss": -11.155216217041016, "global_step": 177453, "epoch": 1056} {"train_loss": -11.010930061340332, "global_step": 177454, "epoch": 1056} {"train_loss": -10.86481761932373, "global_step": 177455, "epoch": 1056} {"train_loss": -10.711528778076172, "global_step": 177456, "epoch": 1056} {"train_loss": -10.399018287658691, "global_step": 177457, "epoch": 1056} {"train_loss": -11.25006103515625, "global_step": 177458, "epoch": 1056} {"train_loss": -10.746816635131836, "global_step": 177459, "epoch": 1056} {"train_loss": -10.415552139282227, "global_step": 177460, "epoch": 1056} {"train_loss": -10.69159984588623, "global_step": 177461, "epoch": 1056} {"train_loss": -10.607924461364746, "global_step": 177462, "epoch": 1056} {"train_loss": -9.506540298461914, "global_step": 177463, "epoch": 1056} {"train_loss": -11.014177322387695, "global_step": 177464, "epoch": 1056} {"train_loss": -9.969350814819336, "global_step": 177465, "epoch": 1056} {"train_loss": -9.895404815673828, "global_step": 177466, "epoch": 1056} {"train_loss": -10.510523796081543, "global_step": 177467, "epoch": 1056} {"train_loss": -10.48881721496582, "global_step": 177468, "epoch": 1056} {"train_loss": -9.547107696533203, "global_step": 177469, "epoch": 1056} {"train_loss": -9.411535263061523, "global_step": 177470, "epoch": 1056} {"train_loss": -10.28259563446045, "global_step": 177471, "epoch": 1056} {"train_loss": -9.792753219604492, "global_step": 177472, "epoch": 1056} {"train_loss": -10.326530456542969, "global_step": 177473, "epoch": 1056} {"train_loss": -10.53563404083252, "global_step": 177474, "epoch": 1056} {"train_loss": -9.328874588012695, "global_step": 177475, "epoch": 1056} {"train_loss": -10.739934921264648, "global_step": 177476, "epoch": 1056} {"train_loss": -9.551753997802734, "global_step": 177477, "epoch": 1056} {"train_loss": -10.248584747314453, "global_step": 177478, "epoch": 1056} {"train_loss": -10.48183822631836, "global_step": 177479, "epoch": 1056} {"train_loss": -9.882308006286621, "global_step": 177480, "epoch": 1056} {"train_loss": -10.922077178955078, "global_step": 177481, "epoch": 1056} {"train_loss": -10.329596519470215, "global_step": 177482, "epoch": 1056} {"train_loss": -10.55075740814209, "global_step": 177483, "epoch": 1056} {"train_loss": -10.775020599365234, "global_step": 177484, "epoch": 1056} {"train_loss": -10.922388076782227, "global_step": 177485, "epoch": 1056} {"train_loss": -10.900191307067871, "global_step": 177486, "epoch": 1056} {"train_loss": -10.822259902954102, "global_step": 177487, "epoch": 1056} {"train_loss": -11.00700569152832, "global_step": 177488, "epoch": 1056} {"train_loss": -10.803935050964355, "global_step": 177489, "epoch": 1056} {"train_loss": -10.956953048706055, "global_step": 177490, "epoch": 1056} {"train_loss": -10.854167938232422, "global_step": 177491, "epoch": 1056} {"train_loss": -11.00791072845459, "global_step": 177492, "epoch": 1056} {"train_loss": -11.037093162536621, "global_step": 177493, "epoch": 1056} {"train_loss": -10.927116394042969, "global_step": 177494, "epoch": 1056} {"train_loss": -10.904441833496094, "global_step": 177495, "epoch": 1056} {"train_loss": -10.873090744018555, "global_step": 177496, "epoch": 1056} {"train_loss": -11.151016235351562, "global_step": 177497, "epoch": 1056} {"train_loss": -10.837544441223145, "global_step": 177498, "epoch": 1056} {"train_loss": -11.122896194458008, "global_step": 177499, "epoch": 1056} {"train_loss": -11.120490074157715, "global_step": 177500, "epoch": 1056} {"train_loss": -10.963054656982422, "global_step": 177501, "epoch": 1056} {"train_loss": -11.005401611328125, "global_step": 177502, "epoch": 1056} {"train_loss": -11.084916114807129, "global_step": 177503, "epoch": 1056} {"train_loss": -11.203781127929688, "global_step": 177504, "epoch": 1056} {"train_loss": -11.256145477294922, "global_step": 177505, "epoch": 1056} {"train_loss": -11.271175384521484, "global_step": 177506, "epoch": 1056} {"train_loss": -11.222299575805664, "global_step": 177507, "epoch": 1056} {"train_loss": -11.21976375579834, "global_step": 177508, "epoch": 1056} {"train_loss": -11.41551685333252, "global_step": 177509, "epoch": 1056} {"train_loss": -11.278421401977539, "global_step": 177510, "epoch": 1056} {"train_loss": -11.272149085998535, "global_step": 177511, "epoch": 1056} {"train_loss": -11.237642288208008, "global_step": 177512, "epoch": 1056} {"train_loss": -11.231809616088867, "global_step": 177513, "epoch": 1056} {"train_loss": -11.382783889770508, "global_step": 177514, "epoch": 1056} {"train_loss": -11.54002571105957, "global_step": 177515, "epoch": 1056} {"train_loss": -11.515671730041504, "global_step": 177516, "epoch": 1056} {"train_loss": -11.10690689086914, "global_step": 177517, "epoch": 1056} {"train_loss": -11.322835922241211, "global_step": 177518, "epoch": 1056} {"train_loss": -11.209553718566895, "global_step": 177519, "epoch": 1056} {"train_loss": -11.26356315612793, "global_step": 177520, "epoch": 1056} {"train_loss": -11.294060707092285, "global_step": 177521, "epoch": 1056} {"train_loss": -11.341830253601074, "global_step": 177522, "epoch": 1056} {"train_loss": -11.403057098388672, "global_step": 177523, "epoch": 1056} {"train_loss": -11.371788024902344, "global_step": 177524, "epoch": 1056} {"train_loss": -11.25735092163086, "global_step": 177525, "epoch": 1056} {"train_loss": -11.401329040527344, "global_step": 177526, "epoch": 1056} {"train_loss": -11.519472122192383, "global_step": 177527, "epoch": 1056} {"train_loss": -11.457578659057617, "global_step": 177528, "epoch": 1056} {"train_loss": -11.303216934204102, "global_step": 177529, "epoch": 1056} {"train_loss": -11.349613189697266, "global_step": 177530, "epoch": 1056} {"train_loss": -11.266345024108887, "global_step": 177531, "epoch": 1056} {"train_loss": -11.097932815551758, "global_step": 177532, "epoch": 1056} {"train_loss": -11.364673614501953, "global_step": 177533, "epoch": 1056} {"train_loss": -11.335214614868164, "global_step": 177534, "epoch": 1056} {"train_loss": -11.510226249694824, "global_step": 177535, "epoch": 1056} {"train_loss": -11.120115280151367, "global_step": 177536, "epoch": 1056} {"train_loss": -11.345928192138672, "global_step": 177537, "epoch": 1056} {"train_loss": -11.423544883728027, "global_step": 177538, "epoch": 1056} {"train_loss": -11.339678764343262, "global_step": 177539, "epoch": 1056} {"train_loss": -11.216833114624023, "global_step": 177540, "epoch": 1056} {"train_loss": -11.001035690307617, "global_step": 177541, "epoch": 1056} {"train_loss": -11.085610389709473, "global_step": 177542, "epoch": 1056} {"train_loss": -11.309576034545898, "global_step": 177543, "epoch": 1056} {"train_loss": -11.206518173217773, "global_step": 177544, "epoch": 1056} {"train_loss": -10.855256080627441, "global_step": 177545, "epoch": 1056} {"train_loss": -11.137093544006348, "global_step": 177546, "epoch": 1056} {"train_loss": -10.506830215454102, "global_step": 177547, "epoch": 1056} {"train_loss": -10.403352737426758, "global_step": 177548, "epoch": 1056} {"train_loss": -11.019960403442383, "global_step": 177549, "epoch": 1056} {"train_loss": -10.761945724487305, "global_step": 177550, "epoch": 1056} {"train_loss": -10.278416633605957, "global_step": 177551, "epoch": 1056} {"train_loss": -11.395965576171875, "global_step": 177552, "epoch": 1056} {"train_loss": -10.461833953857422, "global_step": 177553, "epoch": 1056} {"train_loss": -10.736831665039062, "global_step": 177554, "epoch": 1056} {"train_loss": -10.839239120483398, "global_step": 177555, "epoch": 1056} {"train_loss": -10.867828369140625, "global_step": 177556, "epoch": 1056} {"train_loss": -10.816099166870117, "global_step": 177557, "epoch": 1056} {"train_loss": -10.830787658691406, "global_step": 177558, "epoch": 1056} {"train_loss": -11.057738304138184, "global_step": 177559, "epoch": 1056} {"train_loss": -11.183517456054688, "global_step": 177560, "epoch": 1056} {"train_loss": -11.190649032592773, "global_step": 177561, "epoch": 1056} {"train_loss": -10.775640487670898, "global_step": 177562, "epoch": 1056} {"train_loss": -10.8485689163208, "global_step": 177563, "epoch": 1056} {"train_loss": -11.167479515075684, "global_step": 177564, "epoch": 1056} {"train_loss": -11.069684982299805, "global_step": 177565, "epoch": 1056} {"train_loss": -11.318204879760742, "global_step": 177566, "epoch": 1056} {"train_loss": -11.421388626098633, "global_step": 177567, "epoch": 1056} {"train_loss": -10.686861991882324, "global_step": 177568, "epoch": 1056} {"train_loss": -10.911001205444336, "global_step": 177569, "epoch": 1056} {"train_loss": -10.543191909790039, "global_step": 177570, "epoch": 1056} {"train_loss": -10.740431785583496, "global_step": 177571, "epoch": 1056} {"train_loss": -10.782485008239746, "global_step": 177572, "epoch": 1056} {"train_loss": -10.676628112792969, "global_step": 177573, "epoch": 1056} {"train_loss": -10.538284301757812, "global_step": 177574, "epoch": 1056} {"train_loss": -10.992096441132682, "global_step": 177575, "epoch": 1056, "val_loss": 241164.171875} {"train_loss": -10.673761367797852, "global_step": 177576, "epoch": 1057} {"train_loss": -10.393909454345703, "global_step": 177577, "epoch": 1057} {"train_loss": -10.835960388183594, "global_step": 177578, "epoch": 1057} {"train_loss": -10.471650123596191, "global_step": 177579, "epoch": 1057} {"train_loss": -10.855679512023926, "global_step": 177580, "epoch": 1057} {"train_loss": -10.955808639526367, "global_step": 177581, "epoch": 1057} {"train_loss": -11.011781692504883, "global_step": 177582, "epoch": 1057} {"train_loss": -10.770336151123047, "global_step": 177583, "epoch": 1057} {"train_loss": -10.989896774291992, "global_step": 177584, "epoch": 1057} {"train_loss": -10.913318634033203, "global_step": 177585, "epoch": 1057} {"train_loss": -10.908329010009766, "global_step": 177586, "epoch": 1057} {"train_loss": -10.891725540161133, "global_step": 177587, "epoch": 1057} {"train_loss": -10.810541152954102, "global_step": 177588, "epoch": 1057} {"train_loss": -10.714546203613281, "global_step": 177589, "epoch": 1057} {"train_loss": -11.183985710144043, "global_step": 177590, "epoch": 1057} {"train_loss": -10.954357147216797, "global_step": 177591, "epoch": 1057} {"train_loss": -11.287866592407227, "global_step": 177592, "epoch": 1057} {"train_loss": -11.103239059448242, "global_step": 177593, "epoch": 1057} {"train_loss": -10.922292709350586, "global_step": 177594, "epoch": 1057} {"train_loss": -11.402464866638184, "global_step": 177595, "epoch": 1057} {"train_loss": -10.920417785644531, "global_step": 177596, "epoch": 1057} {"train_loss": -11.214728355407715, "global_step": 177597, "epoch": 1057} {"train_loss": -11.234026908874512, "global_step": 177598, "epoch": 1057} {"train_loss": -11.115758895874023, "global_step": 177599, "epoch": 1057} {"train_loss": -10.918264389038086, "global_step": 177600, "epoch": 1057} {"train_loss": -11.237631797790527, "global_step": 177601, "epoch": 1057} {"train_loss": -11.221856117248535, "global_step": 177602, "epoch": 1057} {"train_loss": -11.180377006530762, "global_step": 177603, "epoch": 1057} {"train_loss": -10.874737739562988, "global_step": 177604, "epoch": 1057} {"train_loss": -10.996949195861816, "global_step": 177605, "epoch": 1057} {"train_loss": -10.794687271118164, "global_step": 177606, "epoch": 1057} {"train_loss": -10.947649955749512, "global_step": 177607, "epoch": 1057} {"train_loss": -10.916589736938477, "global_step": 177608, "epoch": 1057} {"train_loss": -10.979597091674805, "global_step": 177609, "epoch": 1057} {"train_loss": -10.905752182006836, "global_step": 177610, "epoch": 1057} {"train_loss": -11.300331115722656, "global_step": 177611, "epoch": 1057} {"train_loss": -10.86867904663086, "global_step": 177612, "epoch": 1057} {"train_loss": -10.925615310668945, "global_step": 177613, "epoch": 1057} {"train_loss": -11.094344139099121, "global_step": 177614, "epoch": 1057} {"train_loss": -10.472264289855957, "global_step": 177615, "epoch": 1057} {"train_loss": -10.796951293945312, "global_step": 177616, "epoch": 1057} {"train_loss": -11.42534065246582, "global_step": 177617, "epoch": 1057} {"train_loss": -11.125046730041504, "global_step": 177618, "epoch": 1057} {"train_loss": -11.412907600402832, "global_step": 177619, "epoch": 1057} {"train_loss": -11.147533416748047, "global_step": 177620, "epoch": 1057} {"train_loss": -11.442375183105469, "global_step": 177621, "epoch": 1057} {"train_loss": -11.291731834411621, "global_step": 177622, "epoch": 1057} {"train_loss": -11.171363830566406, "global_step": 177623, "epoch": 1057} {"train_loss": -11.346797943115234, "global_step": 177624, "epoch": 1057} {"train_loss": -11.17162036895752, "global_step": 177625, "epoch": 1057} {"train_loss": -11.291677474975586, "global_step": 177626, "epoch": 1057} {"train_loss": -11.482024192810059, "global_step": 177627, "epoch": 1057} {"train_loss": -11.078776359558105, "global_step": 177628, "epoch": 1057} {"train_loss": -11.308425903320312, "global_step": 177629, "epoch": 1057} {"train_loss": -11.238240242004395, "global_step": 177630, "epoch": 1057} {"train_loss": -11.378202438354492, "global_step": 177631, "epoch": 1057} {"train_loss": -11.49081802368164, "global_step": 177632, "epoch": 1057} {"train_loss": -11.001410484313965, "global_step": 177633, "epoch": 1057} {"train_loss": -11.524179458618164, "global_step": 177634, "epoch": 1057} {"train_loss": -11.174735069274902, "global_step": 177635, "epoch": 1057} {"train_loss": -11.60354995727539, "global_step": 177636, "epoch": 1057} {"train_loss": -11.341012954711914, "global_step": 177637, "epoch": 1057} {"train_loss": -11.45116901397705, "global_step": 177638, "epoch": 1057} {"train_loss": -11.09433650970459, "global_step": 177639, "epoch": 1057} {"train_loss": -11.211662292480469, "global_step": 177640, "epoch": 1057} {"train_loss": -11.317997932434082, "global_step": 177641, "epoch": 1057} {"train_loss": -11.438507080078125, "global_step": 177642, "epoch": 1057} {"train_loss": -11.244333267211914, "global_step": 177643, "epoch": 1057} {"train_loss": -11.402612686157227, "global_step": 177644, "epoch": 1057} {"train_loss": -11.201366424560547, "global_step": 177645, "epoch": 1057} {"train_loss": -11.586235046386719, "global_step": 177646, "epoch": 1057} {"train_loss": -11.411273956298828, "global_step": 177647, "epoch": 1057} {"train_loss": -11.011785507202148, "global_step": 177648, "epoch": 1057} {"train_loss": -11.265348434448242, "global_step": 177649, "epoch": 1057} {"train_loss": -11.503667831420898, "global_step": 177650, "epoch": 1057} {"train_loss": -10.692224502563477, "global_step": 177651, "epoch": 1057} {"train_loss": -10.85453987121582, "global_step": 177652, "epoch": 1057} {"train_loss": -11.520418167114258, "global_step": 177653, "epoch": 1057} {"train_loss": -10.925871849060059, "global_step": 177654, "epoch": 1057} {"train_loss": -10.873573303222656, "global_step": 177655, "epoch": 1057} {"train_loss": -11.566847801208496, "global_step": 177656, "epoch": 1057} {"train_loss": -10.767040252685547, "global_step": 177657, "epoch": 1057} {"train_loss": -10.570394515991211, "global_step": 177658, "epoch": 1057} {"train_loss": -11.030619621276855, "global_step": 177659, "epoch": 1057} {"train_loss": -11.166374206542969, "global_step": 177660, "epoch": 1057} {"train_loss": -11.325773239135742, "global_step": 177661, "epoch": 1057} {"train_loss": -11.301412582397461, "global_step": 177662, "epoch": 1057} {"train_loss": -10.83487319946289, "global_step": 177663, "epoch": 1057} {"train_loss": -11.366846084594727, "global_step": 177664, "epoch": 1057} {"train_loss": -10.615850448608398, "global_step": 177665, "epoch": 1057} {"train_loss": -11.014287948608398, "global_step": 177666, "epoch": 1057} {"train_loss": -10.474037170410156, "global_step": 177667, "epoch": 1057} {"train_loss": -9.290077209472656, "global_step": 177668, "epoch": 1057} {"train_loss": -9.147699356079102, "global_step": 177669, "epoch": 1057} {"train_loss": -10.570878028869629, "global_step": 177670, "epoch": 1057} {"train_loss": -8.529632568359375, "global_step": 177671, "epoch": 1057} {"train_loss": -7.879602909088135, "global_step": 177672, "epoch": 1057} {"train_loss": -9.278525352478027, "global_step": 177673, "epoch": 1057} {"train_loss": -8.690242767333984, "global_step": 177674, "epoch": 1057} {"train_loss": -9.392576217651367, "global_step": 177675, "epoch": 1057} {"train_loss": -10.006277084350586, "global_step": 177676, "epoch": 1057} {"train_loss": -9.195599555969238, "global_step": 177677, "epoch": 1057} {"train_loss": -9.634599685668945, "global_step": 177678, "epoch": 1057} {"train_loss": -9.423962593078613, "global_step": 177679, "epoch": 1057} {"train_loss": -8.222817420959473, "global_step": 177680, "epoch": 1057} {"train_loss": -8.711175918579102, "global_step": 177681, "epoch": 1057} {"train_loss": -9.342241287231445, "global_step": 177682, "epoch": 1057} {"train_loss": -8.403280258178711, "global_step": 177683, "epoch": 1057} {"train_loss": -7.908478736877441, "global_step": 177684, "epoch": 1057} {"train_loss": -10.551457405090332, "global_step": 177685, "epoch": 1057} {"train_loss": -9.412814140319824, "global_step": 177686, "epoch": 1057} {"train_loss": -9.349433898925781, "global_step": 177687, "epoch": 1057} {"train_loss": -9.710172653198242, "global_step": 177688, "epoch": 1057} {"train_loss": -9.702880859375, "global_step": 177689, "epoch": 1057} {"train_loss": -8.563228607177734, "global_step": 177690, "epoch": 1057} {"train_loss": -9.152506828308105, "global_step": 177691, "epoch": 1057} {"train_loss": -10.664742469787598, "global_step": 177692, "epoch": 1057} {"train_loss": -9.618127822875977, "global_step": 177693, "epoch": 1057} {"train_loss": -8.854511260986328, "global_step": 177694, "epoch": 1057} {"train_loss": -10.409835815429688, "global_step": 177695, "epoch": 1057} {"train_loss": -10.395282745361328, "global_step": 177696, "epoch": 1057} {"train_loss": -9.881175994873047, "global_step": 177697, "epoch": 1057} {"train_loss": -9.535886764526367, "global_step": 177698, "epoch": 1057} {"train_loss": -10.474004745483398, "global_step": 177699, "epoch": 1057} {"train_loss": -10.351820945739746, "global_step": 177700, "epoch": 1057} {"train_loss": -10.04344367980957, "global_step": 177701, "epoch": 1057} {"train_loss": -9.8897705078125, "global_step": 177702, "epoch": 1057} {"train_loss": -10.512039184570312, "global_step": 177703, "epoch": 1057} {"train_loss": -10.418813705444336, "global_step": 177704, "epoch": 1057} {"train_loss": -10.36812686920166, "global_step": 177705, "epoch": 1057} {"train_loss": -10.289332389831543, "global_step": 177706, "epoch": 1057} {"train_loss": -10.50369644165039, "global_step": 177707, "epoch": 1057} {"train_loss": -10.676628112792969, "global_step": 177708, "epoch": 1057} {"train_loss": -10.599048614501953, "global_step": 177709, "epoch": 1057} {"train_loss": -10.53809642791748, "global_step": 177710, "epoch": 1057} {"train_loss": -10.519412994384766, "global_step": 177711, "epoch": 1057} {"train_loss": -10.596884727478027, "global_step": 177712, "epoch": 1057} {"train_loss": -10.807353973388672, "global_step": 177713, "epoch": 1057} {"train_loss": -10.350774765014648, "global_step": 177714, "epoch": 1057} {"train_loss": -10.653396606445312, "global_step": 177715, "epoch": 1057} {"train_loss": -10.681645393371582, "global_step": 177716, "epoch": 1057} {"train_loss": -10.569490432739258, "global_step": 177717, "epoch": 1057} {"train_loss": -10.637491226196289, "global_step": 177718, "epoch": 1057} {"train_loss": -10.729392051696777, "global_step": 177719, "epoch": 1057} {"train_loss": -10.674150466918945, "global_step": 177720, "epoch": 1057} {"train_loss": -10.754378318786621, "global_step": 177721, "epoch": 1057} {"train_loss": -10.73200798034668, "global_step": 177722, "epoch": 1057} {"train_loss": -10.844715118408203, "global_step": 177723, "epoch": 1057} {"train_loss": -10.782093048095703, "global_step": 177724, "epoch": 1057} {"train_loss": -10.980836868286133, "global_step": 177725, "epoch": 1057} {"train_loss": -10.883171081542969, "global_step": 177726, "epoch": 1057} {"train_loss": -10.850778579711914, "global_step": 177727, "epoch": 1057} {"train_loss": -10.965213775634766, "global_step": 177728, "epoch": 1057} {"train_loss": -10.877347946166992, "global_step": 177729, "epoch": 1057} {"train_loss": -10.995561599731445, "global_step": 177730, "epoch": 1057} {"train_loss": -11.030397415161133, "global_step": 177731, "epoch": 1057} {"train_loss": -10.838611602783203, "global_step": 177732, "epoch": 1057} {"train_loss": -11.057966232299805, "global_step": 177733, "epoch": 1057} {"train_loss": -11.204198837280273, "global_step": 177734, "epoch": 1057} {"train_loss": -11.302485466003418, "global_step": 177735, "epoch": 1057} {"train_loss": -11.093788146972656, "global_step": 177736, "epoch": 1057} {"train_loss": -10.99996566772461, "global_step": 177737, "epoch": 1057} {"train_loss": -11.208718299865723, "global_step": 177738, "epoch": 1057} {"train_loss": -11.160584449768066, "global_step": 177739, "epoch": 1057} {"train_loss": -11.193174362182617, "global_step": 177740, "epoch": 1057} {"train_loss": -11.20640754699707, "global_step": 177741, "epoch": 1057} {"train_loss": -11.197072982788086, "global_step": 177742, "epoch": 1057} {"train_loss": -10.678291794799623, "global_step": 177743, "epoch": 1057, "val_loss": 236389.078125} {"train_loss": -11.32178020477295, "global_step": 177744, "epoch": 1058} {"train_loss": -11.25049877166748, "global_step": 177745, "epoch": 1058} {"train_loss": -11.246440887451172, "global_step": 177746, "epoch": 1058} {"train_loss": -11.203104019165039, "global_step": 177747, "epoch": 1058} {"train_loss": -11.177591323852539, "global_step": 177748, "epoch": 1058} {"train_loss": -11.287701606750488, "global_step": 177749, "epoch": 1058} {"train_loss": -11.258466720581055, "global_step": 177750, "epoch": 1058} {"train_loss": -11.252523422241211, "global_step": 177751, "epoch": 1058} {"train_loss": -11.32344913482666, "global_step": 177752, "epoch": 1058} {"train_loss": -11.237344741821289, "global_step": 177753, "epoch": 1058} {"train_loss": -11.245172500610352, "global_step": 177754, "epoch": 1058} {"train_loss": -11.26182746887207, "global_step": 177755, "epoch": 1058} {"train_loss": -11.145223617553711, "global_step": 177756, "epoch": 1058} {"train_loss": -11.40868854522705, "global_step": 177757, "epoch": 1058} {"train_loss": -11.434441566467285, "global_step": 177758, "epoch": 1058} {"train_loss": -11.397697448730469, "global_step": 177759, "epoch": 1058} {"train_loss": -11.245500564575195, "global_step": 177760, "epoch": 1058} {"train_loss": -11.417434692382812, "global_step": 177761, "epoch": 1058} {"train_loss": -11.138138771057129, "global_step": 177762, "epoch": 1058} {"train_loss": -11.399134635925293, "global_step": 177763, "epoch": 1058} {"train_loss": -11.392358779907227, "global_step": 177764, "epoch": 1058} {"train_loss": -11.262331008911133, "global_step": 177765, "epoch": 1058} {"train_loss": -11.349420547485352, "global_step": 177766, "epoch": 1058} {"train_loss": -11.378429412841797, "global_step": 177767, "epoch": 1058} {"train_loss": -11.355157852172852, "global_step": 177768, "epoch": 1058} {"train_loss": -11.347197532653809, "global_step": 177769, "epoch": 1058} {"train_loss": -11.284732818603516, "global_step": 177770, "epoch": 1058} {"train_loss": -11.46129035949707, "global_step": 177771, "epoch": 1058} {"train_loss": -11.248774528503418, "global_step": 177772, "epoch": 1058} {"train_loss": -11.304625511169434, "global_step": 177773, "epoch": 1058} {"train_loss": -11.413233757019043, "global_step": 177774, "epoch": 1058} {"train_loss": -11.157771110534668, "global_step": 177775, "epoch": 1058} {"train_loss": -11.251749992370605, "global_step": 177776, "epoch": 1058} {"train_loss": -11.250099182128906, "global_step": 177777, "epoch": 1058} {"train_loss": -11.256954193115234, "global_step": 177778, "epoch": 1058} {"train_loss": -11.147369384765625, "global_step": 177779, "epoch": 1058} {"train_loss": -10.920206069946289, "global_step": 177780, "epoch": 1058} {"train_loss": -10.928884506225586, "global_step": 177781, "epoch": 1058} {"train_loss": -10.295892715454102, "global_step": 177782, "epoch": 1058} {"train_loss": -10.575937271118164, "global_step": 177783, "epoch": 1058} {"train_loss": -10.370596885681152, "global_step": 177784, "epoch": 1058} {"train_loss": -11.24927043914795, "global_step": 177785, "epoch": 1058} {"train_loss": -10.983071327209473, "global_step": 177786, "epoch": 1058} {"train_loss": -11.24777603149414, "global_step": 177787, "epoch": 1058} {"train_loss": -11.089179992675781, "global_step": 177788, "epoch": 1058} {"train_loss": -11.314955711364746, "global_step": 177789, "epoch": 1058} {"train_loss": -11.160440444946289, "global_step": 177790, "epoch": 1058} {"train_loss": -11.259967803955078, "global_step": 177791, "epoch": 1058} {"train_loss": -11.192663192749023, "global_step": 177792, "epoch": 1058} {"train_loss": -10.995564460754395, "global_step": 177793, "epoch": 1058} {"train_loss": -11.370407104492188, "global_step": 177794, "epoch": 1058} {"train_loss": -11.237703323364258, "global_step": 177795, "epoch": 1058} {"train_loss": -11.23337459564209, "global_step": 177796, "epoch": 1058} {"train_loss": -11.449702262878418, "global_step": 177797, "epoch": 1058} {"train_loss": -11.363967895507812, "global_step": 177798, "epoch": 1058} {"train_loss": -11.184654235839844, "global_step": 177799, "epoch": 1058} {"train_loss": -11.276753425598145, "global_step": 177800, "epoch": 1058} {"train_loss": -11.19582748413086, "global_step": 177801, "epoch": 1058} {"train_loss": -11.450944900512695, "global_step": 177802, "epoch": 1058} {"train_loss": -10.971757888793945, "global_step": 177803, "epoch": 1058} {"train_loss": -11.093320846557617, "global_step": 177804, "epoch": 1058} {"train_loss": -11.130302429199219, "global_step": 177805, "epoch": 1058} {"train_loss": -11.035058975219727, "global_step": 177806, "epoch": 1058} {"train_loss": -11.415645599365234, "global_step": 177807, "epoch": 1058} {"train_loss": -11.317960739135742, "global_step": 177808, "epoch": 1058} {"train_loss": -11.426114082336426, "global_step": 177809, "epoch": 1058} {"train_loss": -11.231136322021484, "global_step": 177810, "epoch": 1058} {"train_loss": -10.981779098510742, "global_step": 177811, "epoch": 1058} {"train_loss": -11.29637336730957, "global_step": 177812, "epoch": 1058} {"train_loss": -10.697427749633789, "global_step": 177813, "epoch": 1058} {"train_loss": -10.307279586791992, "global_step": 177814, "epoch": 1058} {"train_loss": -10.782734870910645, "global_step": 177815, "epoch": 1058} {"train_loss": -10.771949768066406, "global_step": 177816, "epoch": 1058} {"train_loss": -10.717781066894531, "global_step": 177817, "epoch": 1058} {"train_loss": -10.350202560424805, "global_step": 177818, "epoch": 1058} {"train_loss": -10.811964988708496, "global_step": 177819, "epoch": 1058} {"train_loss": -10.29045295715332, "global_step": 177820, "epoch": 1058} {"train_loss": -10.3694429397583, "global_step": 177821, "epoch": 1058} {"train_loss": -10.049633026123047, "global_step": 177822, "epoch": 1058} {"train_loss": -10.507539749145508, "global_step": 177823, "epoch": 1058} {"train_loss": -10.561922073364258, "global_step": 177824, "epoch": 1058} {"train_loss": -10.330978393554688, "global_step": 177825, "epoch": 1058} {"train_loss": -10.58638858795166, "global_step": 177826, "epoch": 1058} {"train_loss": -10.261248588562012, "global_step": 177827, "epoch": 1058} {"train_loss": -10.489617347717285, "global_step": 177828, "epoch": 1058} {"train_loss": -10.800056457519531, "global_step": 177829, "epoch": 1058} {"train_loss": -10.443424224853516, "global_step": 177830, "epoch": 1058} {"train_loss": -10.737913131713867, "global_step": 177831, "epoch": 1058} {"train_loss": -10.64148998260498, "global_step": 177832, "epoch": 1058} {"train_loss": -10.382783889770508, "global_step": 177833, "epoch": 1058} {"train_loss": -10.680543899536133, "global_step": 177834, "epoch": 1058} {"train_loss": -10.462308883666992, "global_step": 177835, "epoch": 1058} {"train_loss": -10.917298316955566, "global_step": 177836, "epoch": 1058} {"train_loss": -10.44316291809082, "global_step": 177837, "epoch": 1058} {"train_loss": -10.656702995300293, "global_step": 177838, "epoch": 1058} {"train_loss": -10.794004440307617, "global_step": 177839, "epoch": 1058} {"train_loss": -10.775033950805664, "global_step": 177840, "epoch": 1058} {"train_loss": -10.569269180297852, "global_step": 177841, "epoch": 1058} {"train_loss": -10.949727058410645, "global_step": 177842, "epoch": 1058} {"train_loss": -10.38343620300293, "global_step": 177843, "epoch": 1058} {"train_loss": -10.860807418823242, "global_step": 177844, "epoch": 1058} {"train_loss": -10.888351440429688, "global_step": 177845, "epoch": 1058} {"train_loss": -10.707296371459961, "global_step": 177846, "epoch": 1058} {"train_loss": -10.858150482177734, "global_step": 177847, "epoch": 1058} {"train_loss": -10.67005729675293, "global_step": 177848, "epoch": 1058} {"train_loss": -10.716870307922363, "global_step": 177849, "epoch": 1058} {"train_loss": -10.789530754089355, "global_step": 177850, "epoch": 1058} {"train_loss": -10.761012077331543, "global_step": 177851, "epoch": 1058} {"train_loss": -10.599420547485352, "global_step": 177852, "epoch": 1058} {"train_loss": -10.938741683959961, "global_step": 177853, "epoch": 1058} {"train_loss": -10.54178524017334, "global_step": 177854, "epoch": 1058} {"train_loss": -10.608413696289062, "global_step": 177855, "epoch": 1058} {"train_loss": -10.970926284790039, "global_step": 177856, "epoch": 1058} {"train_loss": -10.75059700012207, "global_step": 177857, "epoch": 1058} {"train_loss": -10.780621528625488, "global_step": 177858, "epoch": 1058} {"train_loss": -11.143829345703125, "global_step": 177859, "epoch": 1058} {"train_loss": -10.606779098510742, "global_step": 177860, "epoch": 1058} {"train_loss": -10.967193603515625, "global_step": 177861, "epoch": 1058} {"train_loss": -10.806446075439453, "global_step": 177862, "epoch": 1058} {"train_loss": -11.180364608764648, "global_step": 177863, "epoch": 1058} {"train_loss": -11.112401962280273, "global_step": 177864, "epoch": 1058} {"train_loss": -10.892558097839355, "global_step": 177865, "epoch": 1058} {"train_loss": -10.902349472045898, "global_step": 177866, "epoch": 1058} {"train_loss": -11.202948570251465, "global_step": 177867, "epoch": 1058} {"train_loss": -10.924087524414062, "global_step": 177868, "epoch": 1058} {"train_loss": -11.04115104675293, "global_step": 177869, "epoch": 1058} {"train_loss": -11.118006706237793, "global_step": 177870, "epoch": 1058} {"train_loss": -10.964818954467773, "global_step": 177871, "epoch": 1058} {"train_loss": -11.36177921295166, "global_step": 177872, "epoch": 1058} {"train_loss": -10.854063034057617, "global_step": 177873, "epoch": 1058} {"train_loss": -11.284326553344727, "global_step": 177874, "epoch": 1058} {"train_loss": -11.241569519042969, "global_step": 177875, "epoch": 1058} {"train_loss": -11.18725299835205, "global_step": 177876, "epoch": 1058} {"train_loss": -11.366409301757812, "global_step": 177877, "epoch": 1058} {"train_loss": -11.030509948730469, "global_step": 177878, "epoch": 1058} {"train_loss": -11.407303810119629, "global_step": 177879, "epoch": 1058} {"train_loss": -11.210797309875488, "global_step": 177880, "epoch": 1058} {"train_loss": -11.438044548034668, "global_step": 177881, "epoch": 1058} {"train_loss": -11.372353553771973, "global_step": 177882, "epoch": 1058} {"train_loss": -11.334506034851074, "global_step": 177883, "epoch": 1058} {"train_loss": -11.246038436889648, "global_step": 177884, "epoch": 1058} {"train_loss": -11.274605751037598, "global_step": 177885, "epoch": 1058} {"train_loss": -11.616065979003906, "global_step": 177886, "epoch": 1058} {"train_loss": -11.198511123657227, "global_step": 177887, "epoch": 1058} {"train_loss": -11.534191131591797, "global_step": 177888, "epoch": 1058} {"train_loss": -10.996978759765625, "global_step": 177889, "epoch": 1058} {"train_loss": -11.483217239379883, "global_step": 177890, "epoch": 1058} {"train_loss": -11.313669204711914, "global_step": 177891, "epoch": 1058} {"train_loss": -11.079139709472656, "global_step": 177892, "epoch": 1058} {"train_loss": -11.409381866455078, "global_step": 177893, "epoch": 1058} {"train_loss": -10.557475090026855, "global_step": 177894, "epoch": 1058} {"train_loss": -10.802082061767578, "global_step": 177895, "epoch": 1058} {"train_loss": -11.401988983154297, "global_step": 177896, "epoch": 1058} {"train_loss": -10.61508846282959, "global_step": 177897, "epoch": 1058} {"train_loss": -11.286635398864746, "global_step": 177898, "epoch": 1058} {"train_loss": -11.072433471679688, "global_step": 177899, "epoch": 1058} {"train_loss": -10.88857650756836, "global_step": 177900, "epoch": 1058} {"train_loss": -11.367658615112305, "global_step": 177901, "epoch": 1058} {"train_loss": -10.308392524719238, "global_step": 177902, "epoch": 1058} {"train_loss": -11.22525405883789, "global_step": 177903, "epoch": 1058} {"train_loss": -10.840641975402832, "global_step": 177904, "epoch": 1058} {"train_loss": -10.545062065124512, "global_step": 177905, "epoch": 1058} {"train_loss": -10.885629653930664, "global_step": 177906, "epoch": 1058} {"train_loss": -10.740432739257812, "global_step": 177907, "epoch": 1058} {"train_loss": -10.799951553344727, "global_step": 177908, "epoch": 1058} {"train_loss": -11.276576042175293, "global_step": 177909, "epoch": 1058} {"train_loss": -11.06412410736084, "global_step": 177910, "epoch": 1058} {"train_loss": -11.016580746287392, "global_step": 177911, "epoch": 1058, "val_loss": 244856.796875} {"train_loss": -11.448036193847656, "global_step": 177912, "epoch": 1059} {"train_loss": -10.993159294128418, "global_step": 177913, "epoch": 1059} {"train_loss": -11.147330284118652, "global_step": 177914, "epoch": 1059} {"train_loss": -11.28622055053711, "global_step": 177915, "epoch": 1059} {"train_loss": -11.071956634521484, "global_step": 177916, "epoch": 1059} {"train_loss": -11.379894256591797, "global_step": 177917, "epoch": 1059} {"train_loss": -10.94044303894043, "global_step": 177918, "epoch": 1059} {"train_loss": -11.251932144165039, "global_step": 177919, "epoch": 1059} {"train_loss": -11.189857482910156, "global_step": 177920, "epoch": 1059} {"train_loss": -11.041345596313477, "global_step": 177921, "epoch": 1059} {"train_loss": -11.281867980957031, "global_step": 177922, "epoch": 1059} {"train_loss": -11.065130233764648, "global_step": 177923, "epoch": 1059} {"train_loss": -11.450063705444336, "global_step": 177924, "epoch": 1059} {"train_loss": -11.251388549804688, "global_step": 177925, "epoch": 1059} {"train_loss": -11.154898643493652, "global_step": 177926, "epoch": 1059} {"train_loss": -11.588505744934082, "global_step": 177927, "epoch": 1059} {"train_loss": -11.255385398864746, "global_step": 177928, "epoch": 1059} {"train_loss": -11.50002670288086, "global_step": 177929, "epoch": 1059} {"train_loss": -11.30052375793457, "global_step": 177930, "epoch": 1059} {"train_loss": -11.045668601989746, "global_step": 177931, "epoch": 1059} {"train_loss": -11.282222747802734, "global_step": 177932, "epoch": 1059} {"train_loss": -11.119081497192383, "global_step": 177933, "epoch": 1059} {"train_loss": -11.114952087402344, "global_step": 177934, "epoch": 1059} {"train_loss": -11.135711669921875, "global_step": 177935, "epoch": 1059} {"train_loss": -10.884031295776367, "global_step": 177936, "epoch": 1059} {"train_loss": -10.843446731567383, "global_step": 177937, "epoch": 1059} {"train_loss": -10.949548721313477, "global_step": 177938, "epoch": 1059} {"train_loss": -10.547941207885742, "global_step": 177939, "epoch": 1059} {"train_loss": -10.733699798583984, "global_step": 177940, "epoch": 1059} {"train_loss": -11.017129898071289, "global_step": 177941, "epoch": 1059} {"train_loss": -10.247516632080078, "global_step": 177942, "epoch": 1059} {"train_loss": -11.248672485351562, "global_step": 177943, "epoch": 1059} {"train_loss": -10.477858543395996, "global_step": 177944, "epoch": 1059} {"train_loss": -9.951249122619629, "global_step": 177945, "epoch": 1059} {"train_loss": -11.010902404785156, "global_step": 177946, "epoch": 1059} {"train_loss": -10.7451171875, "global_step": 177947, "epoch": 1059} {"train_loss": -10.571032524108887, "global_step": 177948, "epoch": 1059} {"train_loss": -10.847646713256836, "global_step": 177949, "epoch": 1059} {"train_loss": -10.403470993041992, "global_step": 177950, "epoch": 1059} {"train_loss": -11.217605590820312, "global_step": 177951, "epoch": 1059} {"train_loss": -10.69588565826416, "global_step": 177952, "epoch": 1059} {"train_loss": -10.811747550964355, "global_step": 177953, "epoch": 1059} {"train_loss": -11.063084602355957, "global_step": 177954, "epoch": 1059} {"train_loss": -10.438870429992676, "global_step": 177955, "epoch": 1059} {"train_loss": -10.33820915222168, "global_step": 177956, "epoch": 1059} {"train_loss": -10.439325332641602, "global_step": 177957, "epoch": 1059} {"train_loss": -9.913482666015625, "global_step": 177958, "epoch": 1059} {"train_loss": -10.573308944702148, "global_step": 177959, "epoch": 1059} {"train_loss": -10.408271789550781, "global_step": 177960, "epoch": 1059} {"train_loss": -10.696910858154297, "global_step": 177961, "epoch": 1059} {"train_loss": -10.248590469360352, "global_step": 177962, "epoch": 1059} {"train_loss": -10.474641799926758, "global_step": 177963, "epoch": 1059} {"train_loss": -10.125067710876465, "global_step": 177964, "epoch": 1059} {"train_loss": -11.046574592590332, "global_step": 177965, "epoch": 1059} {"train_loss": -10.069906234741211, "global_step": 177966, "epoch": 1059} {"train_loss": -10.957524299621582, "global_step": 177967, "epoch": 1059} {"train_loss": -11.011345863342285, "global_step": 177968, "epoch": 1059} {"train_loss": -10.639190673828125, "global_step": 177969, "epoch": 1059} {"train_loss": -10.796142578125, "global_step": 177970, "epoch": 1059} {"train_loss": -10.722589492797852, "global_step": 177971, "epoch": 1059} {"train_loss": -11.170894622802734, "global_step": 177972, "epoch": 1059} {"train_loss": -10.807857513427734, "global_step": 177973, "epoch": 1059} {"train_loss": -11.06110954284668, "global_step": 177974, "epoch": 1059} {"train_loss": -11.070537567138672, "global_step": 177975, "epoch": 1059} {"train_loss": -10.638368606567383, "global_step": 177976, "epoch": 1059} {"train_loss": -11.256495475769043, "global_step": 177977, "epoch": 1059} {"train_loss": -10.918874740600586, "global_step": 177978, "epoch": 1059} {"train_loss": -10.859539985656738, "global_step": 177979, "epoch": 1059} {"train_loss": -11.158613204956055, "global_step": 177980, "epoch": 1059} {"train_loss": -10.960470199584961, "global_step": 177981, "epoch": 1059} {"train_loss": -11.103389739990234, "global_step": 177982, "epoch": 1059} {"train_loss": -11.075244903564453, "global_step": 177983, "epoch": 1059} {"train_loss": -11.055647850036621, "global_step": 177984, "epoch": 1059} {"train_loss": -11.09518051147461, "global_step": 177985, "epoch": 1059} {"train_loss": -11.25643253326416, "global_step": 177986, "epoch": 1059} {"train_loss": -11.132575988769531, "global_step": 177987, "epoch": 1059} {"train_loss": -11.24173355102539, "global_step": 177988, "epoch": 1059} {"train_loss": -11.251617431640625, "global_step": 177989, "epoch": 1059} {"train_loss": -11.194709777832031, "global_step": 177990, "epoch": 1059} {"train_loss": -11.366491317749023, "global_step": 177991, "epoch": 1059} {"train_loss": -11.217047691345215, "global_step": 177992, "epoch": 1059} {"train_loss": -11.065742492675781, "global_step": 177993, "epoch": 1059} {"train_loss": -11.280654907226562, "global_step": 177994, "epoch": 1059} {"train_loss": -11.13310718536377, "global_step": 177995, "epoch": 1059} {"train_loss": -11.507516860961914, "global_step": 177996, "epoch": 1059} {"train_loss": -11.217276573181152, "global_step": 177997, "epoch": 1059} {"train_loss": -11.347639083862305, "global_step": 177998, "epoch": 1059} {"train_loss": -11.229415893554688, "global_step": 177999, "epoch": 1059} {"train_loss": -11.228449821472168, "global_step": 178000, "epoch": 1059} {"train_loss": -11.443550109863281, "global_step": 178001, "epoch": 1059} {"train_loss": -11.275625228881836, "global_step": 178002, "epoch": 1059} {"train_loss": -11.568928718566895, "global_step": 178003, "epoch": 1059} {"train_loss": -11.33334732055664, "global_step": 178004, "epoch": 1059} {"train_loss": -11.023519515991211, "global_step": 178005, "epoch": 1059} {"train_loss": -11.362674713134766, "global_step": 178006, "epoch": 1059} {"train_loss": -11.549020767211914, "global_step": 178007, "epoch": 1059} {"train_loss": -11.182323455810547, "global_step": 178008, "epoch": 1059} {"train_loss": -11.245721817016602, "global_step": 178009, "epoch": 1059} {"train_loss": -11.321409225463867, "global_step": 178010, "epoch": 1059} {"train_loss": -11.374509811401367, "global_step": 178011, "epoch": 1059} {"train_loss": -11.396976470947266, "global_step": 178012, "epoch": 1059} {"train_loss": -11.424152374267578, "global_step": 178013, "epoch": 1059} {"train_loss": -11.225529670715332, "global_step": 178014, "epoch": 1059} {"train_loss": -11.406002044677734, "global_step": 178015, "epoch": 1059} {"train_loss": -11.63770866394043, "global_step": 178016, "epoch": 1059} {"train_loss": -11.339094161987305, "global_step": 178017, "epoch": 1059} {"train_loss": -11.422185897827148, "global_step": 178018, "epoch": 1059} {"train_loss": -11.428466796875, "global_step": 178019, "epoch": 1059} {"train_loss": -11.34201431274414, "global_step": 178020, "epoch": 1059} {"train_loss": -11.162867546081543, "global_step": 178021, "epoch": 1059} {"train_loss": -11.342767715454102, "global_step": 178022, "epoch": 1059} {"train_loss": -11.01012897491455, "global_step": 178023, "epoch": 1059} {"train_loss": -11.590628623962402, "global_step": 178024, "epoch": 1059} {"train_loss": -11.14990234375, "global_step": 178025, "epoch": 1059} {"train_loss": -11.630474090576172, "global_step": 178026, "epoch": 1059} {"train_loss": -11.313211441040039, "global_step": 178027, "epoch": 1059} {"train_loss": -11.395668029785156, "global_step": 178028, "epoch": 1059} {"train_loss": -11.476513862609863, "global_step": 178029, "epoch": 1059} {"train_loss": -11.242791175842285, "global_step": 178030, "epoch": 1059} {"train_loss": -11.392189979553223, "global_step": 178031, "epoch": 1059} {"train_loss": -11.367324829101562, "global_step": 178032, "epoch": 1059} {"train_loss": -11.033038139343262, "global_step": 178033, "epoch": 1059} {"train_loss": -11.419057846069336, "global_step": 178034, "epoch": 1059} {"train_loss": -11.0606107711792, "global_step": 178035, "epoch": 1059} {"train_loss": -10.909305572509766, "global_step": 178036, "epoch": 1059} {"train_loss": -10.825000762939453, "global_step": 178037, "epoch": 1059} {"train_loss": -10.642257690429688, "global_step": 178038, "epoch": 1059} {"train_loss": -9.787961959838867, "global_step": 178039, "epoch": 1059} {"train_loss": -10.444910049438477, "global_step": 178040, "epoch": 1059} {"train_loss": -10.210796356201172, "global_step": 178041, "epoch": 1059} {"train_loss": -8.907336235046387, "global_step": 178042, "epoch": 1059} {"train_loss": -10.852445602416992, "global_step": 178043, "epoch": 1059} {"train_loss": -9.899942398071289, "global_step": 178044, "epoch": 1059} {"train_loss": -10.425222396850586, "global_step": 178045, "epoch": 1059} {"train_loss": -9.561040878295898, "global_step": 178046, "epoch": 1059} {"train_loss": -10.88450813293457, "global_step": 178047, "epoch": 1059} {"train_loss": -9.67203140258789, "global_step": 178048, "epoch": 1059} {"train_loss": -9.70754337310791, "global_step": 178049, "epoch": 1059} {"train_loss": -10.009377479553223, "global_step": 178050, "epoch": 1059} {"train_loss": -9.980449676513672, "global_step": 178051, "epoch": 1059} {"train_loss": -10.396533966064453, "global_step": 178052, "epoch": 1059} {"train_loss": -9.117874145507812, "global_step": 178053, "epoch": 1059} {"train_loss": -10.545377731323242, "global_step": 178054, "epoch": 1059} {"train_loss": -10.104255676269531, "global_step": 178055, "epoch": 1059} {"train_loss": -9.98747444152832, "global_step": 178056, "epoch": 1059} {"train_loss": -10.80103874206543, "global_step": 178057, "epoch": 1059} {"train_loss": -10.423271179199219, "global_step": 178058, "epoch": 1059} {"train_loss": -10.173187255859375, "global_step": 178059, "epoch": 1059} {"train_loss": -10.542058944702148, "global_step": 178060, "epoch": 1059} {"train_loss": -10.569315910339355, "global_step": 178061, "epoch": 1059} {"train_loss": -10.858855247497559, "global_step": 178062, "epoch": 1059} {"train_loss": -10.795562744140625, "global_step": 178063, "epoch": 1059} {"train_loss": -10.56629467010498, "global_step": 178064, "epoch": 1059} {"train_loss": -10.88408374786377, "global_step": 178065, "epoch": 1059} {"train_loss": -10.991476058959961, "global_step": 178066, "epoch": 1059} {"train_loss": -10.974720001220703, "global_step": 178067, "epoch": 1059} {"train_loss": -11.03654670715332, "global_step": 178068, "epoch": 1059} {"train_loss": -10.91806411743164, "global_step": 178069, "epoch": 1059} {"train_loss": -11.089494705200195, "global_step": 178070, "epoch": 1059} {"train_loss": -10.860372543334961, "global_step": 178071, "epoch": 1059} {"train_loss": -11.053609848022461, "global_step": 178072, "epoch": 1059} {"train_loss": -10.943412780761719, "global_step": 178073, "epoch": 1059} {"train_loss": -11.127420425415039, "global_step": 178074, "epoch": 1059} {"train_loss": -11.1429443359375, "global_step": 178075, "epoch": 1059} {"train_loss": -11.180525779724121, "global_step": 178076, "epoch": 1059} {"train_loss": -11.214696884155273, "global_step": 178077, "epoch": 1059} {"train_loss": -11.126969337463379, "global_step": 178078, "epoch": 1059} {"train_loss": -10.926090728668939, "global_step": 178079, "epoch": 1059, "val_loss": 239012.640625} {"train_loss": -11.180370330810547, "global_step": 178080, "epoch": 1060} {"train_loss": -11.201578140258789, "global_step": 178081, "epoch": 1060} {"train_loss": -11.253750801086426, "global_step": 178082, "epoch": 1060} {"train_loss": -11.17191219329834, "global_step": 178083, "epoch": 1060} {"train_loss": -11.090473175048828, "global_step": 178084, "epoch": 1060} {"train_loss": -11.369384765625, "global_step": 178085, "epoch": 1060} {"train_loss": -11.320579528808594, "global_step": 178086, "epoch": 1060} {"train_loss": -11.343208312988281, "global_step": 178087, "epoch": 1060} {"train_loss": -11.38183879852295, "global_step": 178088, "epoch": 1060} {"train_loss": -11.154000282287598, "global_step": 178089, "epoch": 1060} {"train_loss": -11.079755783081055, "global_step": 178090, "epoch": 1060} {"train_loss": -11.272554397583008, "global_step": 178091, "epoch": 1060} {"train_loss": -11.335836410522461, "global_step": 178092, "epoch": 1060} {"train_loss": -11.056314468383789, "global_step": 178093, "epoch": 1060} {"train_loss": -11.334065437316895, "global_step": 178094, "epoch": 1060} {"train_loss": -11.116411209106445, "global_step": 178095, "epoch": 1060} {"train_loss": -11.204303741455078, "global_step": 178096, "epoch": 1060} {"train_loss": -11.1373929977417, "global_step": 178097, "epoch": 1060} {"train_loss": -11.255722045898438, "global_step": 178098, "epoch": 1060} {"train_loss": -11.217507362365723, "global_step": 178099, "epoch": 1060} {"train_loss": -11.36870002746582, "global_step": 178100, "epoch": 1060} {"train_loss": -11.071954727172852, "global_step": 178101, "epoch": 1060} {"train_loss": -11.54397201538086, "global_step": 178102, "epoch": 1060} {"train_loss": -11.241423606872559, "global_step": 178103, "epoch": 1060} {"train_loss": -11.552960395812988, "global_step": 178104, "epoch": 1060} {"train_loss": -11.387479782104492, "global_step": 178105, "epoch": 1060} {"train_loss": -11.116262435913086, "global_step": 178106, "epoch": 1060} {"train_loss": -11.300819396972656, "global_step": 178107, "epoch": 1060} {"train_loss": -11.121618270874023, "global_step": 178108, "epoch": 1060} {"train_loss": -11.186409950256348, "global_step": 178109, "epoch": 1060} {"train_loss": -11.214902877807617, "global_step": 178110, "epoch": 1060} {"train_loss": -11.021657943725586, "global_step": 178111, "epoch": 1060} {"train_loss": -11.276151657104492, "global_step": 178112, "epoch": 1060} {"train_loss": -11.262184143066406, "global_step": 178113, "epoch": 1060} {"train_loss": -10.814810752868652, "global_step": 178114, "epoch": 1060} {"train_loss": -11.268916130065918, "global_step": 178115, "epoch": 1060} {"train_loss": -11.096012115478516, "global_step": 178116, "epoch": 1060} {"train_loss": -10.9882173538208, "global_step": 178117, "epoch": 1060} {"train_loss": -11.509525299072266, "global_step": 178118, "epoch": 1060} {"train_loss": -11.066728591918945, "global_step": 178119, "epoch": 1060} {"train_loss": -11.287161827087402, "global_step": 178120, "epoch": 1060} {"train_loss": -11.239786148071289, "global_step": 178121, "epoch": 1060} {"train_loss": -11.111028671264648, "global_step": 178122, "epoch": 1060} {"train_loss": -11.548147201538086, "global_step": 178123, "epoch": 1060} {"train_loss": -10.683584213256836, "global_step": 178124, "epoch": 1060} {"train_loss": -10.509940147399902, "global_step": 178125, "epoch": 1060} {"train_loss": -11.304718971252441, "global_step": 178126, "epoch": 1060} {"train_loss": -10.177245140075684, "global_step": 178127, "epoch": 1060} {"train_loss": -9.556741714477539, "global_step": 178128, "epoch": 1060} {"train_loss": -11.039316177368164, "global_step": 178129, "epoch": 1060} {"train_loss": -9.867053985595703, "global_step": 178130, "epoch": 1060} {"train_loss": -10.947068214416504, "global_step": 178131, "epoch": 1060} {"train_loss": -10.603507995605469, "global_step": 178132, "epoch": 1060} {"train_loss": -10.261516571044922, "global_step": 178133, "epoch": 1060} {"train_loss": -10.554084777832031, "global_step": 178134, "epoch": 1060} {"train_loss": -10.361129760742188, "global_step": 178135, "epoch": 1060} {"train_loss": -11.021944046020508, "global_step": 178136, "epoch": 1060} {"train_loss": -10.669231414794922, "global_step": 178137, "epoch": 1060} {"train_loss": -10.694826126098633, "global_step": 178138, "epoch": 1060} {"train_loss": -10.87990951538086, "global_step": 178139, "epoch": 1060} {"train_loss": -10.448066711425781, "global_step": 178140, "epoch": 1060} {"train_loss": -11.059478759765625, "global_step": 178141, "epoch": 1060} {"train_loss": -10.575372695922852, "global_step": 178142, "epoch": 1060} {"train_loss": -11.143117904663086, "global_step": 178143, "epoch": 1060} {"train_loss": -10.782060623168945, "global_step": 178144, "epoch": 1060} {"train_loss": -10.72745418548584, "global_step": 178145, "epoch": 1060} {"train_loss": -10.986541748046875, "global_step": 178146, "epoch": 1060} {"train_loss": -10.813934326171875, "global_step": 178147, "epoch": 1060} {"train_loss": -10.774144172668457, "global_step": 178148, "epoch": 1060} {"train_loss": -10.799338340759277, "global_step": 178149, "epoch": 1060} {"train_loss": -11.16727066040039, "global_step": 178150, "epoch": 1060} {"train_loss": -11.079010009765625, "global_step": 178151, "epoch": 1060} {"train_loss": -11.144182205200195, "global_step": 178152, "epoch": 1060} {"train_loss": -10.91534423828125, "global_step": 178153, "epoch": 1060} {"train_loss": -11.299753189086914, "global_step": 178154, "epoch": 1060} {"train_loss": -11.04857063293457, "global_step": 178155, "epoch": 1060} {"train_loss": -11.259546279907227, "global_step": 178156, "epoch": 1060} {"train_loss": -11.154542922973633, "global_step": 178157, "epoch": 1060} {"train_loss": -11.266121864318848, "global_step": 178158, "epoch": 1060} {"train_loss": -10.945952415466309, "global_step": 178159, "epoch": 1060} {"train_loss": -11.187609672546387, "global_step": 178160, "epoch": 1060} {"train_loss": -11.107560157775879, "global_step": 178161, "epoch": 1060} {"train_loss": -11.332528114318848, "global_step": 178162, "epoch": 1060} {"train_loss": -11.042110443115234, "global_step": 178163, "epoch": 1060} {"train_loss": -11.313868522644043, "global_step": 178164, "epoch": 1060} {"train_loss": -11.316998481750488, "global_step": 178165, "epoch": 1060} {"train_loss": -10.892618179321289, "global_step": 178166, "epoch": 1060} {"train_loss": -10.682418823242188, "global_step": 178167, "epoch": 1060} {"train_loss": -10.906354904174805, "global_step": 178168, "epoch": 1060} {"train_loss": -11.065179824829102, "global_step": 178169, "epoch": 1060} {"train_loss": -11.29101276397705, "global_step": 178170, "epoch": 1060} {"train_loss": -10.862377166748047, "global_step": 178171, "epoch": 1060} {"train_loss": -11.281207084655762, "global_step": 178172, "epoch": 1060} {"train_loss": -11.208425521850586, "global_step": 178173, "epoch": 1060} {"train_loss": -11.389388084411621, "global_step": 178174, "epoch": 1060} {"train_loss": -11.270670890808105, "global_step": 178175, "epoch": 1060} {"train_loss": -11.40566635131836, "global_step": 178176, "epoch": 1060} {"train_loss": -11.391996383666992, "global_step": 178177, "epoch": 1060} {"train_loss": -11.487346649169922, "global_step": 178178, "epoch": 1060} {"train_loss": -11.300559997558594, "global_step": 178179, "epoch": 1060} {"train_loss": -11.44465446472168, "global_step": 178180, "epoch": 1060} {"train_loss": -11.348834991455078, "global_step": 178181, "epoch": 1060} {"train_loss": -11.496807098388672, "global_step": 178182, "epoch": 1060} {"train_loss": -11.000064849853516, "global_step": 178183, "epoch": 1060} {"train_loss": -11.446168899536133, "global_step": 178184, "epoch": 1060} {"train_loss": -11.379800796508789, "global_step": 178185, "epoch": 1060} {"train_loss": -11.45754623413086, "global_step": 178186, "epoch": 1060} {"train_loss": -11.395486831665039, "global_step": 178187, "epoch": 1060} {"train_loss": -11.378993034362793, "global_step": 178188, "epoch": 1060} {"train_loss": -11.322486877441406, "global_step": 178189, "epoch": 1060} {"train_loss": -11.590412139892578, "global_step": 178190, "epoch": 1060} {"train_loss": -11.274518013000488, "global_step": 178191, "epoch": 1060} {"train_loss": -11.458268165588379, "global_step": 178192, "epoch": 1060} {"train_loss": -11.107168197631836, "global_step": 178193, "epoch": 1060} {"train_loss": -11.216445922851562, "global_step": 178194, "epoch": 1060} {"train_loss": -11.178308486938477, "global_step": 178195, "epoch": 1060} {"train_loss": -11.628535270690918, "global_step": 178196, "epoch": 1060} {"train_loss": -11.52210807800293, "global_step": 178197, "epoch": 1060} {"train_loss": -11.16678237915039, "global_step": 178198, "epoch": 1060} {"train_loss": -11.139284133911133, "global_step": 178199, "epoch": 1060} {"train_loss": -11.228309631347656, "global_step": 178200, "epoch": 1060} {"train_loss": -11.282373428344727, "global_step": 178201, "epoch": 1060} {"train_loss": -10.895406723022461, "global_step": 178202, "epoch": 1060} {"train_loss": -11.206087112426758, "global_step": 178203, "epoch": 1060} {"train_loss": -10.996149063110352, "global_step": 178204, "epoch": 1060} {"train_loss": -11.270523071289062, "global_step": 178205, "epoch": 1060} {"train_loss": -10.516960144042969, "global_step": 178206, "epoch": 1060} {"train_loss": -10.437543869018555, "global_step": 178207, "epoch": 1060} {"train_loss": -10.340970993041992, "global_step": 178208, "epoch": 1060} {"train_loss": -10.863082885742188, "global_step": 178209, "epoch": 1060} {"train_loss": -10.824941635131836, "global_step": 178210, "epoch": 1060} {"train_loss": -9.253170013427734, "global_step": 178211, "epoch": 1060} {"train_loss": -10.024840354919434, "global_step": 178212, "epoch": 1060} {"train_loss": -11.106999397277832, "global_step": 178213, "epoch": 1060} {"train_loss": -9.519460678100586, "global_step": 178214, "epoch": 1060} {"train_loss": -9.436833381652832, "global_step": 178215, "epoch": 1060} {"train_loss": -10.124604225158691, "global_step": 178216, "epoch": 1060} {"train_loss": -8.568014144897461, "global_step": 178217, "epoch": 1060} {"train_loss": -8.906731605529785, "global_step": 178218, "epoch": 1060} {"train_loss": -7.604464054107666, "global_step": 178219, "epoch": 1060} {"train_loss": -9.172769546508789, "global_step": 178220, "epoch": 1060} {"train_loss": -10.130077362060547, "global_step": 178221, "epoch": 1060} {"train_loss": -8.080414772033691, "global_step": 178222, "epoch": 1060} {"train_loss": -9.42673110961914, "global_step": 178223, "epoch": 1060} {"train_loss": -9.425066947937012, "global_step": 178224, "epoch": 1060} {"train_loss": -9.22274112701416, "global_step": 178225, "epoch": 1060} {"train_loss": -8.616800308227539, "global_step": 178226, "epoch": 1060} {"train_loss": -10.161561965942383, "global_step": 178227, "epoch": 1060} {"train_loss": -8.711531639099121, "global_step": 178228, "epoch": 1060} {"train_loss": -9.735791206359863, "global_step": 178229, "epoch": 1060} {"train_loss": -10.223286628723145, "global_step": 178230, "epoch": 1060} {"train_loss": -8.5792236328125, "global_step": 178231, "epoch": 1060} {"train_loss": -9.650040626525879, "global_step": 178232, "epoch": 1060} {"train_loss": -10.351932525634766, "global_step": 178233, "epoch": 1060} {"train_loss": -9.894415855407715, "global_step": 178234, "epoch": 1060} {"train_loss": -9.413740158081055, "global_step": 178235, "epoch": 1060} {"train_loss": -10.338579177856445, "global_step": 178236, "epoch": 1060} {"train_loss": -10.449790954589844, "global_step": 178237, "epoch": 1060} {"train_loss": -9.607810974121094, "global_step": 178238, "epoch": 1060} {"train_loss": -9.629796981811523, "global_step": 178239, "epoch": 1060} {"train_loss": -10.244528770446777, "global_step": 178240, "epoch": 1060} {"train_loss": -9.959177017211914, "global_step": 178241, "epoch": 1060} {"train_loss": -9.735650062561035, "global_step": 178242, "epoch": 1060} {"train_loss": -10.13326644897461, "global_step": 178243, "epoch": 1060} {"train_loss": -10.342390060424805, "global_step": 178244, "epoch": 1060} {"train_loss": -10.22991943359375, "global_step": 178245, "epoch": 1060} {"train_loss": -10.156805992126465, "global_step": 178246, "epoch": 1060} {"train_loss": -10.772137309823718, "global_step": 178247, "epoch": 1060, "val_loss": 243973.5, "train_action_mse_error": 8.572504997253418} {"train_loss": -10.156991958618164, "global_step": 178248, "epoch": 1061} {"train_loss": -10.202494621276855, "global_step": 178249, "epoch": 1061} {"train_loss": -10.330543518066406, "global_step": 178250, "epoch": 1061} {"train_loss": -10.661975860595703, "global_step": 178251, "epoch": 1061} {"train_loss": -10.496868133544922, "global_step": 178252, "epoch": 1061} {"train_loss": -10.450770378112793, "global_step": 178253, "epoch": 1061} {"train_loss": -10.620316505432129, "global_step": 178254, "epoch": 1061} {"train_loss": -10.184572219848633, "global_step": 178255, "epoch": 1061} {"train_loss": -10.37169075012207, "global_step": 178256, "epoch": 1061} {"train_loss": -10.404969215393066, "global_step": 178257, "epoch": 1061} {"train_loss": -10.600288391113281, "global_step": 178258, "epoch": 1061} {"train_loss": -10.701028823852539, "global_step": 178259, "epoch": 1061} {"train_loss": -10.77324104309082, "global_step": 178260, "epoch": 1061} {"train_loss": -10.591131210327148, "global_step": 178261, "epoch": 1061} {"train_loss": -10.815144538879395, "global_step": 178262, "epoch": 1061} {"train_loss": -10.803642272949219, "global_step": 178263, "epoch": 1061} {"train_loss": -10.680923461914062, "global_step": 178264, "epoch": 1061} {"train_loss": -10.730181694030762, "global_step": 178265, "epoch": 1061} {"train_loss": -10.51762580871582, "global_step": 178266, "epoch": 1061} {"train_loss": -10.724151611328125, "global_step": 178267, "epoch": 1061} {"train_loss": -10.753291130065918, "global_step": 178268, "epoch": 1061} {"train_loss": -10.824989318847656, "global_step": 178269, "epoch": 1061} {"train_loss": -10.682188987731934, "global_step": 178270, "epoch": 1061} {"train_loss": -10.827874183654785, "global_step": 178271, "epoch": 1061} {"train_loss": -10.906098365783691, "global_step": 178272, "epoch": 1061} {"train_loss": -10.85577392578125, "global_step": 178273, "epoch": 1061} {"train_loss": -10.938409805297852, "global_step": 178274, "epoch": 1061} {"train_loss": -10.911474227905273, "global_step": 178275, "epoch": 1061} {"train_loss": -10.973228454589844, "global_step": 178276, "epoch": 1061} {"train_loss": -10.912965774536133, "global_step": 178277, "epoch": 1061} {"train_loss": -11.038835525512695, "global_step": 178278, "epoch": 1061} {"train_loss": -11.119115829467773, "global_step": 178279, "epoch": 1061} {"train_loss": -11.002458572387695, "global_step": 178280, "epoch": 1061} {"train_loss": -11.136675834655762, "global_step": 178281, "epoch": 1061} {"train_loss": -11.056000709533691, "global_step": 178282, "epoch": 1061} {"train_loss": -11.21756362915039, "global_step": 178283, "epoch": 1061} {"train_loss": -11.342412948608398, "global_step": 178284, "epoch": 1061} {"train_loss": -11.252038955688477, "global_step": 178285, "epoch": 1061} {"train_loss": -11.486380577087402, "global_step": 178286, "epoch": 1061} {"train_loss": -11.141550064086914, "global_step": 178287, "epoch": 1061} {"train_loss": -11.227657318115234, "global_step": 178288, "epoch": 1061} {"train_loss": -11.469796180725098, "global_step": 178289, "epoch": 1061} {"train_loss": -11.238668441772461, "global_step": 178290, "epoch": 1061} {"train_loss": -11.314828872680664, "global_step": 178291, "epoch": 1061} {"train_loss": -11.1961030960083, "global_step": 178292, "epoch": 1061} {"train_loss": -11.29211711883545, "global_step": 178293, "epoch": 1061} {"train_loss": -11.487725257873535, "global_step": 178294, "epoch": 1061} {"train_loss": -11.298017501831055, "global_step": 178295, "epoch": 1061} {"train_loss": -11.250675201416016, "global_step": 178296, "epoch": 1061} {"train_loss": -11.343151092529297, "global_step": 178297, "epoch": 1061} {"train_loss": -11.256229400634766, "global_step": 178298, "epoch": 1061} {"train_loss": -11.425191879272461, "global_step": 178299, "epoch": 1061} {"train_loss": -11.295574188232422, "global_step": 178300, "epoch": 1061} {"train_loss": -11.611837387084961, "global_step": 178301, "epoch": 1061} {"train_loss": -11.382085800170898, "global_step": 178302, "epoch": 1061} {"train_loss": -11.512096405029297, "global_step": 178303, "epoch": 1061} {"train_loss": -11.374886512756348, "global_step": 178304, "epoch": 1061} {"train_loss": -11.570196151733398, "global_step": 178305, "epoch": 1061} {"train_loss": -11.265558242797852, "global_step": 178306, "epoch": 1061} {"train_loss": -11.216964721679688, "global_step": 178307, "epoch": 1061} {"train_loss": -11.494963645935059, "global_step": 178308, "epoch": 1061} {"train_loss": -11.377655982971191, "global_step": 178309, "epoch": 1061} {"train_loss": -11.655231475830078, "global_step": 178310, "epoch": 1061} {"train_loss": -11.530976295471191, "global_step": 178311, "epoch": 1061} {"train_loss": -11.375763893127441, "global_step": 178312, "epoch": 1061} {"train_loss": -11.249475479125977, "global_step": 178313, "epoch": 1061} {"train_loss": -11.319562911987305, "global_step": 178314, "epoch": 1061} {"train_loss": -11.497589111328125, "global_step": 178315, "epoch": 1061} {"train_loss": -11.513544082641602, "global_step": 178316, "epoch": 1061} {"train_loss": -11.44775390625, "global_step": 178317, "epoch": 1061} {"train_loss": -11.53091812133789, "global_step": 178318, "epoch": 1061} {"train_loss": -11.364068984985352, "global_step": 178319, "epoch": 1061} {"train_loss": -11.15687370300293, "global_step": 178320, "epoch": 1061} {"train_loss": -11.473878860473633, "global_step": 178321, "epoch": 1061} {"train_loss": -11.227219581604004, "global_step": 178322, "epoch": 1061} {"train_loss": -11.0246000289917, "global_step": 178323, "epoch": 1061} {"train_loss": -10.170166015625, "global_step": 178324, "epoch": 1061} {"train_loss": -9.259109497070312, "global_step": 178325, "epoch": 1061} {"train_loss": -9.119115829467773, "global_step": 178326, "epoch": 1061} {"train_loss": -10.859100341796875, "global_step": 178327, "epoch": 1061} {"train_loss": -9.005943298339844, "global_step": 178328, "epoch": 1061} {"train_loss": -9.566240310668945, "global_step": 178329, "epoch": 1061} {"train_loss": -9.658285140991211, "global_step": 178330, "epoch": 1061} {"train_loss": -10.585052490234375, "global_step": 178331, "epoch": 1061} {"train_loss": -10.560321807861328, "global_step": 178332, "epoch": 1061} {"train_loss": -8.942245483398438, "global_step": 178333, "epoch": 1061} {"train_loss": -10.592862129211426, "global_step": 178334, "epoch": 1061} {"train_loss": -9.808687210083008, "global_step": 178335, "epoch": 1061} {"train_loss": -9.695595741271973, "global_step": 178336, "epoch": 1061} {"train_loss": -10.61211109161377, "global_step": 178337, "epoch": 1061} {"train_loss": -9.95525074005127, "global_step": 178338, "epoch": 1061} {"train_loss": -10.015462875366211, "global_step": 178339, "epoch": 1061} {"train_loss": -10.853433609008789, "global_step": 178340, "epoch": 1061} {"train_loss": -10.072301864624023, "global_step": 178341, "epoch": 1061} {"train_loss": -10.905940055847168, "global_step": 178342, "epoch": 1061} {"train_loss": -10.01675796508789, "global_step": 178343, "epoch": 1061} {"train_loss": -10.88180923461914, "global_step": 178344, "epoch": 1061} {"train_loss": -10.912590980529785, "global_step": 178345, "epoch": 1061} {"train_loss": -10.764671325683594, "global_step": 178346, "epoch": 1061} {"train_loss": -10.55660629272461, "global_step": 178347, "epoch": 1061} {"train_loss": -10.482904434204102, "global_step": 178348, "epoch": 1061} {"train_loss": -10.75996208190918, "global_step": 178349, "epoch": 1061} {"train_loss": -10.814924240112305, "global_step": 178350, "epoch": 1061} {"train_loss": -10.134686470031738, "global_step": 178351, "epoch": 1061} {"train_loss": -10.979446411132812, "global_step": 178352, "epoch": 1061} {"train_loss": -10.767752647399902, "global_step": 178353, "epoch": 1061} {"train_loss": -10.848367691040039, "global_step": 178354, "epoch": 1061} {"train_loss": -11.052863121032715, "global_step": 178355, "epoch": 1061} {"train_loss": -10.679227828979492, "global_step": 178356, "epoch": 1061} {"train_loss": -10.792858123779297, "global_step": 178357, "epoch": 1061} {"train_loss": -11.030609130859375, "global_step": 178358, "epoch": 1061} {"train_loss": -11.131868362426758, "global_step": 178359, "epoch": 1061} {"train_loss": -11.144420623779297, "global_step": 178360, "epoch": 1061} {"train_loss": -11.257576942443848, "global_step": 178361, "epoch": 1061} {"train_loss": -11.326461791992188, "global_step": 178362, "epoch": 1061} {"train_loss": -11.114800453186035, "global_step": 178363, "epoch": 1061} {"train_loss": -11.220134735107422, "global_step": 178364, "epoch": 1061} {"train_loss": -10.932646751403809, "global_step": 178365, "epoch": 1061} {"train_loss": -11.311636924743652, "global_step": 178366, "epoch": 1061} {"train_loss": -11.141639709472656, "global_step": 178367, "epoch": 1061} {"train_loss": -11.107636451721191, "global_step": 178368, "epoch": 1061} {"train_loss": -11.12119197845459, "global_step": 178369, "epoch": 1061} {"train_loss": -11.314382553100586, "global_step": 178370, "epoch": 1061} {"train_loss": -11.256138801574707, "global_step": 178371, "epoch": 1061} {"train_loss": -11.217779159545898, "global_step": 178372, "epoch": 1061} {"train_loss": -11.442893981933594, "global_step": 178373, "epoch": 1061} {"train_loss": -11.2138032913208, "global_step": 178374, "epoch": 1061} {"train_loss": -11.344528198242188, "global_step": 178375, "epoch": 1061} {"train_loss": -11.225156784057617, "global_step": 178376, "epoch": 1061} {"train_loss": -11.283402442932129, "global_step": 178377, "epoch": 1061} {"train_loss": -11.36383056640625, "global_step": 178378, "epoch": 1061} {"train_loss": -11.036495208740234, "global_step": 178379, "epoch": 1061} {"train_loss": -11.183168411254883, "global_step": 178380, "epoch": 1061} {"train_loss": -11.277107238769531, "global_step": 178381, "epoch": 1061} {"train_loss": -10.960915565490723, "global_step": 178382, "epoch": 1061} {"train_loss": -11.235893249511719, "global_step": 178383, "epoch": 1061} {"train_loss": -11.215835571289062, "global_step": 178384, "epoch": 1061} {"train_loss": -11.271553039550781, "global_step": 178385, "epoch": 1061} {"train_loss": -11.281099319458008, "global_step": 178386, "epoch": 1061} {"train_loss": -11.356045722961426, "global_step": 178387, "epoch": 1061} {"train_loss": -11.428665161132812, "global_step": 178388, "epoch": 1061} {"train_loss": -11.348504066467285, "global_step": 178389, "epoch": 1061} {"train_loss": -11.16542911529541, "global_step": 178390, "epoch": 1061} {"train_loss": -11.331389427185059, "global_step": 178391, "epoch": 1061} {"train_loss": -11.365036964416504, "global_step": 178392, "epoch": 1061} {"train_loss": -11.167736053466797, "global_step": 178393, "epoch": 1061} {"train_loss": -11.330951690673828, "global_step": 178394, "epoch": 1061} {"train_loss": -11.05230712890625, "global_step": 178395, "epoch": 1061} {"train_loss": -11.344573974609375, "global_step": 178396, "epoch": 1061} {"train_loss": -11.1451997756958, "global_step": 178397, "epoch": 1061} {"train_loss": -11.503787994384766, "global_step": 178398, "epoch": 1061} {"train_loss": -10.918636322021484, "global_step": 178399, "epoch": 1061} {"train_loss": -10.726861953735352, "global_step": 178400, "epoch": 1061} {"train_loss": -11.086114883422852, "global_step": 178401, "epoch": 1061} {"train_loss": -11.239457130432129, "global_step": 178402, "epoch": 1061} {"train_loss": -10.44123363494873, "global_step": 178403, "epoch": 1061} {"train_loss": -9.869684219360352, "global_step": 178404, "epoch": 1061} {"train_loss": -10.87307071685791, "global_step": 178405, "epoch": 1061} {"train_loss": -9.714263916015625, "global_step": 178406, "epoch": 1061} {"train_loss": -8.997064590454102, "global_step": 178407, "epoch": 1061} {"train_loss": -10.835762977600098, "global_step": 178408, "epoch": 1061} {"train_loss": -8.86241340637207, "global_step": 178409, "epoch": 1061} {"train_loss": -9.637903213500977, "global_step": 178410, "epoch": 1061} {"train_loss": -9.419395446777344, "global_step": 178411, "epoch": 1061} {"train_loss": -9.941535949707031, "global_step": 178412, "epoch": 1061} {"train_loss": -9.271353721618652, "global_step": 178413, "epoch": 1061} {"train_loss": -10.051338195800781, "global_step": 178414, "epoch": 1061} {"train_loss": -10.85540627297901, "global_step": 178415, "epoch": 1061, "val_loss": 239405.453125} {"train_loss": -9.421552658081055, "global_step": 178416, "epoch": 1062} {"train_loss": -10.20203685760498, "global_step": 178417, "epoch": 1062} {"train_loss": -9.519905090332031, "global_step": 178418, "epoch": 1062} {"train_loss": -9.413339614868164, "global_step": 178419, "epoch": 1062} {"train_loss": -10.660400390625, "global_step": 178420, "epoch": 1062} {"train_loss": -9.431343078613281, "global_step": 178421, "epoch": 1062} {"train_loss": -10.113183975219727, "global_step": 178422, "epoch": 1062} {"train_loss": -10.380870819091797, "global_step": 178423, "epoch": 1062} {"train_loss": -9.715648651123047, "global_step": 178424, "epoch": 1062} {"train_loss": -10.46213436126709, "global_step": 178425, "epoch": 1062} {"train_loss": -10.613107681274414, "global_step": 178426, "epoch": 1062} {"train_loss": -10.067490577697754, "global_step": 178427, "epoch": 1062} {"train_loss": -10.737642288208008, "global_step": 178428, "epoch": 1062} {"train_loss": -10.697834014892578, "global_step": 178429, "epoch": 1062} {"train_loss": -10.414390563964844, "global_step": 178430, "epoch": 1062} {"train_loss": -10.604598045349121, "global_step": 178431, "epoch": 1062} {"train_loss": -10.883926391601562, "global_step": 178432, "epoch": 1062} {"train_loss": -10.471466064453125, "global_step": 178433, "epoch": 1062} {"train_loss": -10.758832931518555, "global_step": 178434, "epoch": 1062} {"train_loss": -10.910572052001953, "global_step": 178435, "epoch": 1062} {"train_loss": -10.527425765991211, "global_step": 178436, "epoch": 1062} {"train_loss": -10.788493156433105, "global_step": 178437, "epoch": 1062} {"train_loss": -10.971027374267578, "global_step": 178438, "epoch": 1062} {"train_loss": -10.798370361328125, "global_step": 178439, "epoch": 1062} {"train_loss": -10.937110900878906, "global_step": 178440, "epoch": 1062} {"train_loss": -10.832098007202148, "global_step": 178441, "epoch": 1062} {"train_loss": -11.046072959899902, "global_step": 178442, "epoch": 1062} {"train_loss": -11.003344535827637, "global_step": 178443, "epoch": 1062} {"train_loss": -10.936543464660645, "global_step": 178444, "epoch": 1062} {"train_loss": -11.03602409362793, "global_step": 178445, "epoch": 1062} {"train_loss": -10.996007919311523, "global_step": 178446, "epoch": 1062} {"train_loss": -10.841221809387207, "global_step": 178447, "epoch": 1062} {"train_loss": -10.90097427368164, "global_step": 178448, "epoch": 1062} {"train_loss": -11.291349411010742, "global_step": 178449, "epoch": 1062} {"train_loss": -11.129297256469727, "global_step": 178450, "epoch": 1062} {"train_loss": -11.147302627563477, "global_step": 178451, "epoch": 1062} {"train_loss": -11.01466178894043, "global_step": 178452, "epoch": 1062} {"train_loss": -11.005250930786133, "global_step": 178453, "epoch": 1062} {"train_loss": -11.043638229370117, "global_step": 178454, "epoch": 1062} {"train_loss": -11.09697151184082, "global_step": 178455, "epoch": 1062} {"train_loss": -11.17589282989502, "global_step": 178456, "epoch": 1062} {"train_loss": -11.114484786987305, "global_step": 178457, "epoch": 1062} {"train_loss": -11.23621654510498, "global_step": 178458, "epoch": 1062} {"train_loss": -11.115741729736328, "global_step": 178459, "epoch": 1062} {"train_loss": -11.138327598571777, "global_step": 178460, "epoch": 1062} {"train_loss": -11.238420486450195, "global_step": 178461, "epoch": 1062} {"train_loss": -11.328222274780273, "global_step": 178462, "epoch": 1062} {"train_loss": -11.294321060180664, "global_step": 178463, "epoch": 1062} {"train_loss": -11.369613647460938, "global_step": 178464, "epoch": 1062} {"train_loss": -11.354545593261719, "global_step": 178465, "epoch": 1062} {"train_loss": -11.197122573852539, "global_step": 178466, "epoch": 1062} {"train_loss": -11.458369255065918, "global_step": 178467, "epoch": 1062} {"train_loss": -11.15145492553711, "global_step": 178468, "epoch": 1062} {"train_loss": -11.282970428466797, "global_step": 178469, "epoch": 1062} {"train_loss": -11.371495246887207, "global_step": 178470, "epoch": 1062} {"train_loss": -11.276686668395996, "global_step": 178471, "epoch": 1062} {"train_loss": -11.352031707763672, "global_step": 178472, "epoch": 1062} {"train_loss": -11.364028930664062, "global_step": 178473, "epoch": 1062} {"train_loss": -11.283045768737793, "global_step": 178474, "epoch": 1062} {"train_loss": -11.506475448608398, "global_step": 178475, "epoch": 1062} {"train_loss": -11.388175964355469, "global_step": 178476, "epoch": 1062} {"train_loss": -11.432120323181152, "global_step": 178477, "epoch": 1062} {"train_loss": -11.424060821533203, "global_step": 178478, "epoch": 1062} {"train_loss": -11.498459815979004, "global_step": 178479, "epoch": 1062} {"train_loss": -11.237489700317383, "global_step": 178480, "epoch": 1062} {"train_loss": -11.259295463562012, "global_step": 178481, "epoch": 1062} {"train_loss": -11.456448554992676, "global_step": 178482, "epoch": 1062} {"train_loss": -11.463241577148438, "global_step": 178483, "epoch": 1062} {"train_loss": -11.511411666870117, "global_step": 178484, "epoch": 1062} {"train_loss": -11.522231101989746, "global_step": 178485, "epoch": 1062} {"train_loss": -11.474884986877441, "global_step": 178486, "epoch": 1062} {"train_loss": -11.538883209228516, "global_step": 178487, "epoch": 1062} {"train_loss": -11.557714462280273, "global_step": 178488, "epoch": 1062} {"train_loss": -11.600650787353516, "global_step": 178489, "epoch": 1062} {"train_loss": -11.334035873413086, "global_step": 178490, "epoch": 1062} {"train_loss": -11.149877548217773, "global_step": 178491, "epoch": 1062} {"train_loss": -11.530515670776367, "global_step": 178492, "epoch": 1062} {"train_loss": -10.907516479492188, "global_step": 178493, "epoch": 1062} {"train_loss": -10.995828628540039, "global_step": 178494, "epoch": 1062} {"train_loss": -11.518123626708984, "global_step": 178495, "epoch": 1062} {"train_loss": -11.539745330810547, "global_step": 178496, "epoch": 1062} {"train_loss": -11.327384948730469, "global_step": 178497, "epoch": 1062} {"train_loss": -11.434731483459473, "global_step": 178498, "epoch": 1062} {"train_loss": -11.643407821655273, "global_step": 178499, "epoch": 1062} {"train_loss": -11.513681411743164, "global_step": 178500, "epoch": 1062} {"train_loss": -11.421979904174805, "global_step": 178501, "epoch": 1062} {"train_loss": -11.07614517211914, "global_step": 178502, "epoch": 1062} {"train_loss": -10.716314315795898, "global_step": 178503, "epoch": 1062} {"train_loss": -11.275777816772461, "global_step": 178504, "epoch": 1062} {"train_loss": -10.666637420654297, "global_step": 178505, "epoch": 1062} {"train_loss": -10.201837539672852, "global_step": 178506, "epoch": 1062} {"train_loss": -11.437005996704102, "global_step": 178507, "epoch": 1062} {"train_loss": -11.122926712036133, "global_step": 178508, "epoch": 1062} {"train_loss": -10.54761791229248, "global_step": 178509, "epoch": 1062} {"train_loss": -10.72688102722168, "global_step": 178510, "epoch": 1062} {"train_loss": -11.279645919799805, "global_step": 178511, "epoch": 1062} {"train_loss": -10.936185836791992, "global_step": 178512, "epoch": 1062} {"train_loss": -11.03372859954834, "global_step": 178513, "epoch": 1062} {"train_loss": -10.67843246459961, "global_step": 178514, "epoch": 1062} {"train_loss": -10.809141159057617, "global_step": 178515, "epoch": 1062} {"train_loss": -10.284124374389648, "global_step": 178516, "epoch": 1062} {"train_loss": -10.49627685546875, "global_step": 178517, "epoch": 1062} {"train_loss": -9.703718185424805, "global_step": 178518, "epoch": 1062} {"train_loss": -10.349889755249023, "global_step": 178519, "epoch": 1062} {"train_loss": -10.113471984863281, "global_step": 178520, "epoch": 1062} {"train_loss": -10.008150100708008, "global_step": 178521, "epoch": 1062} {"train_loss": -10.831403732299805, "global_step": 178522, "epoch": 1062} {"train_loss": -9.530593872070312, "global_step": 178523, "epoch": 1062} {"train_loss": -11.110929489135742, "global_step": 178524, "epoch": 1062} {"train_loss": -10.442255020141602, "global_step": 178525, "epoch": 1062} {"train_loss": -10.506284713745117, "global_step": 178526, "epoch": 1062} {"train_loss": -10.698272705078125, "global_step": 178527, "epoch": 1062} {"train_loss": -10.068384170532227, "global_step": 178528, "epoch": 1062} {"train_loss": -10.818742752075195, "global_step": 178529, "epoch": 1062} {"train_loss": -9.788042068481445, "global_step": 178530, "epoch": 1062} {"train_loss": -11.19641399383545, "global_step": 178531, "epoch": 1062} {"train_loss": -10.347296714782715, "global_step": 178532, "epoch": 1062} {"train_loss": -10.985227584838867, "global_step": 178533, "epoch": 1062} {"train_loss": -10.718782424926758, "global_step": 178534, "epoch": 1062} {"train_loss": -10.784662246704102, "global_step": 178535, "epoch": 1062} {"train_loss": -10.750965118408203, "global_step": 178536, "epoch": 1062} {"train_loss": -11.058283805847168, "global_step": 178537, "epoch": 1062} {"train_loss": -10.90880012512207, "global_step": 178538, "epoch": 1062} {"train_loss": -10.781968116760254, "global_step": 178539, "epoch": 1062} {"train_loss": -11.150016784667969, "global_step": 178540, "epoch": 1062} {"train_loss": -10.901859283447266, "global_step": 178541, "epoch": 1062} {"train_loss": -11.130302429199219, "global_step": 178542, "epoch": 1062} {"train_loss": -10.891054153442383, "global_step": 178543, "epoch": 1062} {"train_loss": -11.05514907836914, "global_step": 178544, "epoch": 1062} {"train_loss": -11.050113677978516, "global_step": 178545, "epoch": 1062} {"train_loss": -10.896270751953125, "global_step": 178546, "epoch": 1062} {"train_loss": -10.972311973571777, "global_step": 178547, "epoch": 1062} {"train_loss": -11.110615730285645, "global_step": 178548, "epoch": 1062} {"train_loss": -11.031181335449219, "global_step": 178549, "epoch": 1062} {"train_loss": -11.287517547607422, "global_step": 178550, "epoch": 1062} {"train_loss": -11.082706451416016, "global_step": 178551, "epoch": 1062} {"train_loss": -11.141218185424805, "global_step": 178552, "epoch": 1062} {"train_loss": -11.203910827636719, "global_step": 178553, "epoch": 1062} {"train_loss": -11.172490119934082, "global_step": 178554, "epoch": 1062} {"train_loss": -11.274967193603516, "global_step": 178555, "epoch": 1062} {"train_loss": -11.243602752685547, "global_step": 178556, "epoch": 1062} {"train_loss": -11.25441837310791, "global_step": 178557, "epoch": 1062} {"train_loss": -11.19935417175293, "global_step": 178558, "epoch": 1062} {"train_loss": -11.30941104888916, "global_step": 178559, "epoch": 1062} {"train_loss": -11.261398315429688, "global_step": 178560, "epoch": 1062} {"train_loss": -11.3453950881958, "global_step": 178561, "epoch": 1062} {"train_loss": -11.345222473144531, "global_step": 178562, "epoch": 1062} {"train_loss": -11.27171802520752, "global_step": 178563, "epoch": 1062} {"train_loss": -11.345707893371582, "global_step": 178564, "epoch": 1062} {"train_loss": -11.419530868530273, "global_step": 178565, "epoch": 1062} {"train_loss": -11.496102333068848, "global_step": 178566, "epoch": 1062} {"train_loss": -11.492289543151855, "global_step": 178567, "epoch": 1062} {"train_loss": -11.25639820098877, "global_step": 178568, "epoch": 1062} {"train_loss": -11.114790916442871, "global_step": 178569, "epoch": 1062} {"train_loss": -11.464217185974121, "global_step": 178570, "epoch": 1062} {"train_loss": -11.215615272521973, "global_step": 178571, "epoch": 1062} {"train_loss": -11.426019668579102, "global_step": 178572, "epoch": 1062} {"train_loss": -11.182872772216797, "global_step": 178573, "epoch": 1062} {"train_loss": -11.19141960144043, "global_step": 178574, "epoch": 1062} {"train_loss": -11.175277709960938, "global_step": 178575, "epoch": 1062} {"train_loss": -11.479562759399414, "global_step": 178576, "epoch": 1062} {"train_loss": -11.005586624145508, "global_step": 178577, "epoch": 1062} {"train_loss": -11.270630836486816, "global_step": 178578, "epoch": 1062} {"train_loss": -11.334526062011719, "global_step": 178579, "epoch": 1062} {"train_loss": -11.146921157836914, "global_step": 178580, "epoch": 1062} {"train_loss": -11.30099105834961, "global_step": 178581, "epoch": 1062} {"train_loss": -11.041598320007324, "global_step": 178582, "epoch": 1062} {"train_loss": -10.984545684996105, "global_step": 178583, "epoch": 1062, "val_loss": 245863.078125} {"train_loss": -11.216476440429688, "global_step": 178584, "epoch": 1063} {"train_loss": -10.9700345993042, "global_step": 178585, "epoch": 1063} {"train_loss": -11.273935317993164, "global_step": 178586, "epoch": 1063} {"train_loss": -11.16016960144043, "global_step": 178587, "epoch": 1063} {"train_loss": -11.09676742553711, "global_step": 178588, "epoch": 1063} {"train_loss": -11.618647575378418, "global_step": 178589, "epoch": 1063} {"train_loss": -11.369136810302734, "global_step": 178590, "epoch": 1063} {"train_loss": -11.1441650390625, "global_step": 178591, "epoch": 1063} {"train_loss": -11.414474487304688, "global_step": 178592, "epoch": 1063} {"train_loss": -11.378715515136719, "global_step": 178593, "epoch": 1063} {"train_loss": -11.181600570678711, "global_step": 178594, "epoch": 1063} {"train_loss": -11.137046813964844, "global_step": 178595, "epoch": 1063} {"train_loss": -10.979759216308594, "global_step": 178596, "epoch": 1063} {"train_loss": -10.892078399658203, "global_step": 178597, "epoch": 1063} {"train_loss": -10.917638778686523, "global_step": 178598, "epoch": 1063} {"train_loss": -11.214427947998047, "global_step": 178599, "epoch": 1063} {"train_loss": -10.891155242919922, "global_step": 178600, "epoch": 1063} {"train_loss": -10.613349914550781, "global_step": 178601, "epoch": 1063} {"train_loss": -11.256452560424805, "global_step": 178602, "epoch": 1063} {"train_loss": -11.050761222839355, "global_step": 178603, "epoch": 1063} {"train_loss": -10.460216522216797, "global_step": 178604, "epoch": 1063} {"train_loss": -10.956765174865723, "global_step": 178605, "epoch": 1063} {"train_loss": -10.583353996276855, "global_step": 178606, "epoch": 1063} {"train_loss": -10.548450469970703, "global_step": 178607, "epoch": 1063} {"train_loss": -10.366899490356445, "global_step": 178608, "epoch": 1063} {"train_loss": -11.3329439163208, "global_step": 178609, "epoch": 1063} {"train_loss": -10.766000747680664, "global_step": 178610, "epoch": 1063} {"train_loss": -11.16150951385498, "global_step": 178611, "epoch": 1063} {"train_loss": -11.168376922607422, "global_step": 178612, "epoch": 1063} {"train_loss": -11.104379653930664, "global_step": 178613, "epoch": 1063} {"train_loss": -11.07807731628418, "global_step": 178614, "epoch": 1063} {"train_loss": -11.169483184814453, "global_step": 178615, "epoch": 1063} {"train_loss": -10.959495544433594, "global_step": 178616, "epoch": 1063} {"train_loss": -11.412671089172363, "global_step": 178617, "epoch": 1063} {"train_loss": -11.28748893737793, "global_step": 178618, "epoch": 1063} {"train_loss": -11.319459915161133, "global_step": 178619, "epoch": 1063} {"train_loss": -11.238480567932129, "global_step": 178620, "epoch": 1063} {"train_loss": -11.167886734008789, "global_step": 178621, "epoch": 1063} {"train_loss": -10.999471664428711, "global_step": 178622, "epoch": 1063} {"train_loss": -11.340826988220215, "global_step": 178623, "epoch": 1063} {"train_loss": -11.053138732910156, "global_step": 178624, "epoch": 1063} {"train_loss": -11.186738967895508, "global_step": 178625, "epoch": 1063} {"train_loss": -11.124802589416504, "global_step": 178626, "epoch": 1063} {"train_loss": -11.364675521850586, "global_step": 178627, "epoch": 1063} {"train_loss": -11.264860153198242, "global_step": 178628, "epoch": 1063} {"train_loss": -11.396357536315918, "global_step": 178629, "epoch": 1063} {"train_loss": -11.51954460144043, "global_step": 178630, "epoch": 1063} {"train_loss": -11.233845710754395, "global_step": 178631, "epoch": 1063} {"train_loss": -11.530485153198242, "global_step": 178632, "epoch": 1063} {"train_loss": -11.155780792236328, "global_step": 178633, "epoch": 1063} {"train_loss": -11.345102310180664, "global_step": 178634, "epoch": 1063} {"train_loss": -11.380056381225586, "global_step": 178635, "epoch": 1063} {"train_loss": -11.2689790725708, "global_step": 178636, "epoch": 1063} {"train_loss": -11.134542465209961, "global_step": 178637, "epoch": 1063} {"train_loss": -11.297898292541504, "global_step": 178638, "epoch": 1063} {"train_loss": -11.271313667297363, "global_step": 178639, "epoch": 1063} {"train_loss": -11.495368003845215, "global_step": 178640, "epoch": 1063} {"train_loss": -11.349833488464355, "global_step": 178641, "epoch": 1063} {"train_loss": -11.515022277832031, "global_step": 178642, "epoch": 1063} {"train_loss": -11.522624969482422, "global_step": 178643, "epoch": 1063} {"train_loss": -11.518829345703125, "global_step": 178644, "epoch": 1063} {"train_loss": -11.364940643310547, "global_step": 178645, "epoch": 1063} {"train_loss": -11.477682113647461, "global_step": 178646, "epoch": 1063} {"train_loss": -11.469304084777832, "global_step": 178647, "epoch": 1063} {"train_loss": -11.617477416992188, "global_step": 178648, "epoch": 1063} {"train_loss": -11.72006607055664, "global_step": 178649, "epoch": 1063} {"train_loss": -11.318047523498535, "global_step": 178650, "epoch": 1063} {"train_loss": -11.475421905517578, "global_step": 178651, "epoch": 1063} {"train_loss": -11.300395965576172, "global_step": 178652, "epoch": 1063} {"train_loss": -11.439142227172852, "global_step": 178653, "epoch": 1063} {"train_loss": -11.63791275024414, "global_step": 178654, "epoch": 1063} {"train_loss": -11.443305969238281, "global_step": 178655, "epoch": 1063} {"train_loss": -11.58431625366211, "global_step": 178656, "epoch": 1063} {"train_loss": -11.605328559875488, "global_step": 178657, "epoch": 1063} {"train_loss": -11.541845321655273, "global_step": 178658, "epoch": 1063} {"train_loss": -11.448445320129395, "global_step": 178659, "epoch": 1063} {"train_loss": -11.605560302734375, "global_step": 178660, "epoch": 1063} {"train_loss": -11.38277816772461, "global_step": 178661, "epoch": 1063} {"train_loss": -10.94221305847168, "global_step": 178662, "epoch": 1063} {"train_loss": -10.856054306030273, "global_step": 178663, "epoch": 1063} {"train_loss": -10.791755676269531, "global_step": 178664, "epoch": 1063} {"train_loss": -10.71735954284668, "global_step": 178665, "epoch": 1063} {"train_loss": -10.322412490844727, "global_step": 178666, "epoch": 1063} {"train_loss": -11.38008975982666, "global_step": 178667, "epoch": 1063} {"train_loss": -10.535123825073242, "global_step": 178668, "epoch": 1063} {"train_loss": -11.510900497436523, "global_step": 178669, "epoch": 1063} {"train_loss": -10.637493133544922, "global_step": 178670, "epoch": 1063} {"train_loss": -11.352497100830078, "global_step": 178671, "epoch": 1063} {"train_loss": -10.293044090270996, "global_step": 178672, "epoch": 1063} {"train_loss": -11.005346298217773, "global_step": 178673, "epoch": 1063} {"train_loss": -11.075506210327148, "global_step": 178674, "epoch": 1063} {"train_loss": -10.90259838104248, "global_step": 178675, "epoch": 1063} {"train_loss": -10.125974655151367, "global_step": 178676, "epoch": 1063} {"train_loss": -10.625263214111328, "global_step": 178677, "epoch": 1063} {"train_loss": -10.331235885620117, "global_step": 178678, "epoch": 1063} {"train_loss": -10.426901817321777, "global_step": 178679, "epoch": 1063} {"train_loss": -11.175833702087402, "global_step": 178680, "epoch": 1063} {"train_loss": -9.930065155029297, "global_step": 178681, "epoch": 1063} {"train_loss": -10.27447509765625, "global_step": 178682, "epoch": 1063} {"train_loss": -10.918171882629395, "global_step": 178683, "epoch": 1063} {"train_loss": -10.729557991027832, "global_step": 178684, "epoch": 1063} {"train_loss": -10.18432331085205, "global_step": 178685, "epoch": 1063} {"train_loss": -10.63990592956543, "global_step": 178686, "epoch": 1063} {"train_loss": -10.335243225097656, "global_step": 178687, "epoch": 1063} {"train_loss": -10.210354804992676, "global_step": 178688, "epoch": 1063} {"train_loss": -10.890741348266602, "global_step": 178689, "epoch": 1063} {"train_loss": -10.125917434692383, "global_step": 178690, "epoch": 1063} {"train_loss": -10.797714233398438, "global_step": 178691, "epoch": 1063} {"train_loss": -10.914161682128906, "global_step": 178692, "epoch": 1063} {"train_loss": -10.654889106750488, "global_step": 178693, "epoch": 1063} {"train_loss": -10.69887924194336, "global_step": 178694, "epoch": 1063} {"train_loss": -10.596332550048828, "global_step": 178695, "epoch": 1063} {"train_loss": -10.900545120239258, "global_step": 178696, "epoch": 1063} {"train_loss": -10.323904037475586, "global_step": 178697, "epoch": 1063} {"train_loss": -10.751723289489746, "global_step": 178698, "epoch": 1063} {"train_loss": -10.390556335449219, "global_step": 178699, "epoch": 1063} {"train_loss": -11.019737243652344, "global_step": 178700, "epoch": 1063} {"train_loss": -10.42064094543457, "global_step": 178701, "epoch": 1063} {"train_loss": -10.73298454284668, "global_step": 178702, "epoch": 1063} {"train_loss": -10.354560852050781, "global_step": 178703, "epoch": 1063} {"train_loss": -10.711349487304688, "global_step": 178704, "epoch": 1063} {"train_loss": -10.777514457702637, "global_step": 178705, "epoch": 1063} {"train_loss": -10.82728385925293, "global_step": 178706, "epoch": 1063} {"train_loss": -10.80726432800293, "global_step": 178707, "epoch": 1063} {"train_loss": -10.579435348510742, "global_step": 178708, "epoch": 1063} {"train_loss": -10.643088340759277, "global_step": 178709, "epoch": 1063} {"train_loss": -10.875699996948242, "global_step": 178710, "epoch": 1063} {"train_loss": -10.8589448928833, "global_step": 178711, "epoch": 1063} {"train_loss": -10.934900283813477, "global_step": 178712, "epoch": 1063} {"train_loss": -10.802568435668945, "global_step": 178713, "epoch": 1063} {"train_loss": -10.874361038208008, "global_step": 178714, "epoch": 1063} {"train_loss": -10.983654975891113, "global_step": 178715, "epoch": 1063} {"train_loss": -10.965259552001953, "global_step": 178716, "epoch": 1063} {"train_loss": -11.090314865112305, "global_step": 178717, "epoch": 1063} {"train_loss": -11.106069564819336, "global_step": 178718, "epoch": 1063} {"train_loss": -11.357460021972656, "global_step": 178719, "epoch": 1063} {"train_loss": -10.979687690734863, "global_step": 178720, "epoch": 1063} {"train_loss": -11.178169250488281, "global_step": 178721, "epoch": 1063} {"train_loss": -11.080942153930664, "global_step": 178722, "epoch": 1063} {"train_loss": -10.922163009643555, "global_step": 178723, "epoch": 1063} {"train_loss": -11.04612922668457, "global_step": 178724, "epoch": 1063} {"train_loss": -10.8038911819458, "global_step": 178725, "epoch": 1063} {"train_loss": -10.959550857543945, "global_step": 178726, "epoch": 1063} {"train_loss": -11.273550033569336, "global_step": 178727, "epoch": 1063} {"train_loss": -10.884832382202148, "global_step": 178728, "epoch": 1063} {"train_loss": -11.10738754272461, "global_step": 178729, "epoch": 1063} {"train_loss": -10.721040725708008, "global_step": 178730, "epoch": 1063} {"train_loss": -10.843766212463379, "global_step": 178731, "epoch": 1063} {"train_loss": -11.107885360717773, "global_step": 178732, "epoch": 1063} {"train_loss": -11.012482643127441, "global_step": 178733, "epoch": 1063} {"train_loss": -11.144604682922363, "global_step": 178734, "epoch": 1063} {"train_loss": -11.066205024719238, "global_step": 178735, "epoch": 1063} {"train_loss": -11.033838272094727, "global_step": 178736, "epoch": 1063} {"train_loss": -11.269777297973633, "global_step": 178737, "epoch": 1063} {"train_loss": -11.077211380004883, "global_step": 178738, "epoch": 1063} {"train_loss": -11.380783081054688, "global_step": 178739, "epoch": 1063} {"train_loss": -11.173831939697266, "global_step": 178740, "epoch": 1063} {"train_loss": -11.3251953125, "global_step": 178741, "epoch": 1063} {"train_loss": -11.188993453979492, "global_step": 178742, "epoch": 1063} {"train_loss": -11.158289909362793, "global_step": 178743, "epoch": 1063} {"train_loss": -11.077713012695312, "global_step": 178744, "epoch": 1063} {"train_loss": -10.8753662109375, "global_step": 178745, "epoch": 1063} {"train_loss": -11.245214462280273, "global_step": 178746, "epoch": 1063} {"train_loss": -11.369022369384766, "global_step": 178747, "epoch": 1063} {"train_loss": -11.355342864990234, "global_step": 178748, "epoch": 1063} {"train_loss": -11.338586807250977, "global_step": 178749, "epoch": 1063} {"train_loss": -11.137435913085938, "global_step": 178750, "epoch": 1063} {"train_loss": -11.037034982726688, "global_step": 178751, "epoch": 1063, "val_loss": 246378.859375} {"train_loss": -11.263765335083008, "global_step": 178752, "epoch": 1064} {"train_loss": -11.398582458496094, "global_step": 178753, "epoch": 1064} {"train_loss": -11.156089782714844, "global_step": 178754, "epoch": 1064} {"train_loss": -11.464791297912598, "global_step": 178755, "epoch": 1064} {"train_loss": -11.198906898498535, "global_step": 178756, "epoch": 1064} {"train_loss": -11.439050674438477, "global_step": 178757, "epoch": 1064} {"train_loss": -11.400218963623047, "global_step": 178758, "epoch": 1064} {"train_loss": -11.387702941894531, "global_step": 178759, "epoch": 1064} {"train_loss": -11.26244068145752, "global_step": 178760, "epoch": 1064} {"train_loss": -11.368425369262695, "global_step": 178761, "epoch": 1064} {"train_loss": -11.380313873291016, "global_step": 178762, "epoch": 1064} {"train_loss": -11.059381484985352, "global_step": 178763, "epoch": 1064} {"train_loss": -11.54568862915039, "global_step": 178764, "epoch": 1064} {"train_loss": -11.2353515625, "global_step": 178765, "epoch": 1064} {"train_loss": -11.43824577331543, "global_step": 178766, "epoch": 1064} {"train_loss": -11.438523292541504, "global_step": 178767, "epoch": 1064} {"train_loss": -11.553610801696777, "global_step": 178768, "epoch": 1064} {"train_loss": -11.442928314208984, "global_step": 178769, "epoch": 1064} {"train_loss": -11.365032196044922, "global_step": 178770, "epoch": 1064} {"train_loss": -11.195512771606445, "global_step": 178771, "epoch": 1064} {"train_loss": -11.215564727783203, "global_step": 178772, "epoch": 1064} {"train_loss": -11.552287101745605, "global_step": 178773, "epoch": 1064} {"train_loss": -11.32448959350586, "global_step": 178774, "epoch": 1064} {"train_loss": -11.454553604125977, "global_step": 178775, "epoch": 1064} {"train_loss": -10.886475563049316, "global_step": 178776, "epoch": 1064} {"train_loss": -11.544458389282227, "global_step": 178777, "epoch": 1064} {"train_loss": -10.905366897583008, "global_step": 178778, "epoch": 1064} {"train_loss": -10.92774486541748, "global_step": 178779, "epoch": 1064} {"train_loss": -10.942255973815918, "global_step": 178780, "epoch": 1064} {"train_loss": -11.257091522216797, "global_step": 178781, "epoch": 1064} {"train_loss": -11.1719970703125, "global_step": 178782, "epoch": 1064} {"train_loss": -11.121938705444336, "global_step": 178783, "epoch": 1064} {"train_loss": -10.759767532348633, "global_step": 178784, "epoch": 1064} {"train_loss": -10.43865966796875, "global_step": 178785, "epoch": 1064} {"train_loss": -10.935981750488281, "global_step": 178786, "epoch": 1064} {"train_loss": -10.95399284362793, "global_step": 178787, "epoch": 1064} {"train_loss": -10.339521408081055, "global_step": 178788, "epoch": 1064} {"train_loss": -10.724394798278809, "global_step": 178789, "epoch": 1064} {"train_loss": -11.125181198120117, "global_step": 178790, "epoch": 1064} {"train_loss": -11.108142852783203, "global_step": 178791, "epoch": 1064} {"train_loss": -10.909690856933594, "global_step": 178792, "epoch": 1064} {"train_loss": -11.214960098266602, "global_step": 178793, "epoch": 1064} {"train_loss": -10.695630073547363, "global_step": 178794, "epoch": 1064} {"train_loss": -11.316555976867676, "global_step": 178795, "epoch": 1064} {"train_loss": -11.090917587280273, "global_step": 178796, "epoch": 1064} {"train_loss": -11.27369213104248, "global_step": 178797, "epoch": 1064} {"train_loss": -11.063495635986328, "global_step": 178798, "epoch": 1064} {"train_loss": -11.535808563232422, "global_step": 178799, "epoch": 1064} {"train_loss": -11.087263107299805, "global_step": 178800, "epoch": 1064} {"train_loss": -10.862188339233398, "global_step": 178801, "epoch": 1064} {"train_loss": -11.46728515625, "global_step": 178802, "epoch": 1064} {"train_loss": -11.277823448181152, "global_step": 178803, "epoch": 1064} {"train_loss": -11.3201322555542, "global_step": 178804, "epoch": 1064} {"train_loss": -11.328454971313477, "global_step": 178805, "epoch": 1064} {"train_loss": -10.86716079711914, "global_step": 178806, "epoch": 1064} {"train_loss": -11.21544075012207, "global_step": 178807, "epoch": 1064} {"train_loss": -11.247300148010254, "global_step": 178808, "epoch": 1064} {"train_loss": -11.054658889770508, "global_step": 178809, "epoch": 1064} {"train_loss": -10.390670776367188, "global_step": 178810, "epoch": 1064} {"train_loss": -11.218669891357422, "global_step": 178811, "epoch": 1064} {"train_loss": -9.793588638305664, "global_step": 178812, "epoch": 1064} {"train_loss": -10.682977676391602, "global_step": 178813, "epoch": 1064} {"train_loss": -10.615959167480469, "global_step": 178814, "epoch": 1064} {"train_loss": -10.398853302001953, "global_step": 178815, "epoch": 1064} {"train_loss": -10.358283996582031, "global_step": 178816, "epoch": 1064} {"train_loss": -9.166379928588867, "global_step": 178817, "epoch": 1064} {"train_loss": -10.591142654418945, "global_step": 178818, "epoch": 1064} {"train_loss": -10.125168800354004, "global_step": 178819, "epoch": 1064} {"train_loss": -9.746502876281738, "global_step": 178820, "epoch": 1064} {"train_loss": -10.917207717895508, "global_step": 178821, "epoch": 1064} {"train_loss": -10.105173110961914, "global_step": 178822, "epoch": 1064} {"train_loss": -10.858489990234375, "global_step": 178823, "epoch": 1064} {"train_loss": -10.391100883483887, "global_step": 178824, "epoch": 1064} {"train_loss": -10.332342147827148, "global_step": 178825, "epoch": 1064} {"train_loss": -10.071853637695312, "global_step": 178826, "epoch": 1064} {"train_loss": -9.874003410339355, "global_step": 178827, "epoch": 1064} {"train_loss": -10.509286880493164, "global_step": 178828, "epoch": 1064} {"train_loss": -9.884899139404297, "global_step": 178829, "epoch": 1064} {"train_loss": -10.63502311706543, "global_step": 178830, "epoch": 1064} {"train_loss": -10.337638854980469, "global_step": 178831, "epoch": 1064} {"train_loss": -10.860554695129395, "global_step": 178832, "epoch": 1064} {"train_loss": -10.2911376953125, "global_step": 178833, "epoch": 1064} {"train_loss": -10.9135103225708, "global_step": 178834, "epoch": 1064} {"train_loss": -10.138463973999023, "global_step": 178835, "epoch": 1064} {"train_loss": -10.331436157226562, "global_step": 178836, "epoch": 1064} {"train_loss": -10.004023551940918, "global_step": 178837, "epoch": 1064} {"train_loss": -9.850717544555664, "global_step": 178838, "epoch": 1064} {"train_loss": -10.12271499633789, "global_step": 178839, "epoch": 1064} {"train_loss": -10.83942699432373, "global_step": 178840, "epoch": 1064} {"train_loss": -10.047431945800781, "global_step": 178841, "epoch": 1064} {"train_loss": -10.616752624511719, "global_step": 178842, "epoch": 1064} {"train_loss": -10.712926864624023, "global_step": 178843, "epoch": 1064} {"train_loss": -9.935108184814453, "global_step": 178844, "epoch": 1064} {"train_loss": -10.933287620544434, "global_step": 178845, "epoch": 1064} {"train_loss": -10.275888442993164, "global_step": 178846, "epoch": 1064} {"train_loss": -10.8175687789917, "global_step": 178847, "epoch": 1064} {"train_loss": -10.443086624145508, "global_step": 178848, "epoch": 1064} {"train_loss": -10.918465614318848, "global_step": 178849, "epoch": 1064} {"train_loss": -10.394444465637207, "global_step": 178850, "epoch": 1064} {"train_loss": -10.872039794921875, "global_step": 178851, "epoch": 1064} {"train_loss": -10.798362731933594, "global_step": 178852, "epoch": 1064} {"train_loss": -10.565755844116211, "global_step": 178853, "epoch": 1064} {"train_loss": -10.75966739654541, "global_step": 178854, "epoch": 1064} {"train_loss": -10.303680419921875, "global_step": 178855, "epoch": 1064} {"train_loss": -10.97200870513916, "global_step": 178856, "epoch": 1064} {"train_loss": -10.512077331542969, "global_step": 178857, "epoch": 1064} {"train_loss": -10.73724365234375, "global_step": 178858, "epoch": 1064} {"train_loss": -10.705011367797852, "global_step": 178859, "epoch": 1064} {"train_loss": -10.637106895446777, "global_step": 178860, "epoch": 1064} {"train_loss": -11.179434776306152, "global_step": 178861, "epoch": 1064} {"train_loss": -10.946807861328125, "global_step": 178862, "epoch": 1064} {"train_loss": -11.167150497436523, "global_step": 178863, "epoch": 1064} {"train_loss": -10.685942649841309, "global_step": 178864, "epoch": 1064} {"train_loss": -10.937238693237305, "global_step": 178865, "epoch": 1064} {"train_loss": -10.53304672241211, "global_step": 178866, "epoch": 1064} {"train_loss": -10.914843559265137, "global_step": 178867, "epoch": 1064} {"train_loss": -11.184478759765625, "global_step": 178868, "epoch": 1064} {"train_loss": -10.843131065368652, "global_step": 178869, "epoch": 1064} {"train_loss": -11.25094985961914, "global_step": 178870, "epoch": 1064} {"train_loss": -11.127049446105957, "global_step": 178871, "epoch": 1064} {"train_loss": -11.168684005737305, "global_step": 178872, "epoch": 1064} {"train_loss": -11.238268852233887, "global_step": 178873, "epoch": 1064} {"train_loss": -11.137660026550293, "global_step": 178874, "epoch": 1064} {"train_loss": -11.29574966430664, "global_step": 178875, "epoch": 1064} {"train_loss": -11.20244312286377, "global_step": 178876, "epoch": 1064} {"train_loss": -11.402021408081055, "global_step": 178877, "epoch": 1064} {"train_loss": -11.460918426513672, "global_step": 178878, "epoch": 1064} {"train_loss": -11.464381217956543, "global_step": 178879, "epoch": 1064} {"train_loss": -11.282849311828613, "global_step": 178880, "epoch": 1064} {"train_loss": -11.123635292053223, "global_step": 178881, "epoch": 1064} {"train_loss": -11.500438690185547, "global_step": 178882, "epoch": 1064} {"train_loss": -11.285065650939941, "global_step": 178883, "epoch": 1064} {"train_loss": -11.336029052734375, "global_step": 178884, "epoch": 1064} {"train_loss": -11.497808456420898, "global_step": 178885, "epoch": 1064} {"train_loss": -11.386276245117188, "global_step": 178886, "epoch": 1064} {"train_loss": -11.269437789916992, "global_step": 178887, "epoch": 1064} {"train_loss": -11.453688621520996, "global_step": 178888, "epoch": 1064} {"train_loss": -11.438695907592773, "global_step": 178889, "epoch": 1064} {"train_loss": -11.30300521850586, "global_step": 178890, "epoch": 1064} {"train_loss": -11.361786842346191, "global_step": 178891, "epoch": 1064} {"train_loss": -11.446636199951172, "global_step": 178892, "epoch": 1064} {"train_loss": -11.464035034179688, "global_step": 178893, "epoch": 1064} {"train_loss": -11.33204174041748, "global_step": 178894, "epoch": 1064} {"train_loss": -11.362730979919434, "global_step": 178895, "epoch": 1064} {"train_loss": -11.285274505615234, "global_step": 178896, "epoch": 1064} {"train_loss": -11.39062786102295, "global_step": 178897, "epoch": 1064} {"train_loss": -11.127752304077148, "global_step": 178898, "epoch": 1064} {"train_loss": -11.317362785339355, "global_step": 178899, "epoch": 1064} {"train_loss": -11.232402801513672, "global_step": 178900, "epoch": 1064} {"train_loss": -11.234106063842773, "global_step": 178901, "epoch": 1064} {"train_loss": -11.45650577545166, "global_step": 178902, "epoch": 1064} {"train_loss": -11.533777236938477, "global_step": 178903, "epoch": 1064} {"train_loss": -10.963913917541504, "global_step": 178904, "epoch": 1064} {"train_loss": -11.274051666259766, "global_step": 178905, "epoch": 1064} {"train_loss": -11.250436782836914, "global_step": 178906, "epoch": 1064} {"train_loss": -11.554489135742188, "global_step": 178907, "epoch": 1064} {"train_loss": -11.430356979370117, "global_step": 178908, "epoch": 1064} {"train_loss": -11.312362670898438, "global_step": 178909, "epoch": 1064} {"train_loss": -11.435431480407715, "global_step": 178910, "epoch": 1064} {"train_loss": -11.309000015258789, "global_step": 178911, "epoch": 1064} {"train_loss": -11.315455436706543, "global_step": 178912, "epoch": 1064} {"train_loss": -11.336380004882812, "global_step": 178913, "epoch": 1064} {"train_loss": -11.097137451171875, "global_step": 178914, "epoch": 1064} {"train_loss": -10.975761413574219, "global_step": 178915, "epoch": 1064} {"train_loss": -11.103813171386719, "global_step": 178916, "epoch": 1064} {"train_loss": -11.137295722961426, "global_step": 178917, "epoch": 1064} {"train_loss": -11.456377029418945, "global_step": 178918, "epoch": 1064} {"train_loss": -10.979069352149963, "global_step": 178919, "epoch": 1064, "val_loss": 243579.484375} {"train_loss": -11.369443893432617, "global_step": 178920, "epoch": 1065} {"train_loss": -10.971001625061035, "global_step": 178921, "epoch": 1065} {"train_loss": -11.1583890914917, "global_step": 178922, "epoch": 1065} {"train_loss": -10.972804069519043, "global_step": 178923, "epoch": 1065} {"train_loss": -11.057753562927246, "global_step": 178924, "epoch": 1065} {"train_loss": -11.205831527709961, "global_step": 178925, "epoch": 1065} {"train_loss": -10.958051681518555, "global_step": 178926, "epoch": 1065} {"train_loss": -11.141275405883789, "global_step": 178927, "epoch": 1065} {"train_loss": -10.852204322814941, "global_step": 178928, "epoch": 1065} {"train_loss": -11.131734848022461, "global_step": 178929, "epoch": 1065} {"train_loss": -10.965278625488281, "global_step": 178930, "epoch": 1065} {"train_loss": -11.206047058105469, "global_step": 178931, "epoch": 1065} {"train_loss": -10.95118522644043, "global_step": 178932, "epoch": 1065} {"train_loss": -10.970712661743164, "global_step": 178933, "epoch": 1065} {"train_loss": -10.741066932678223, "global_step": 178934, "epoch": 1065} {"train_loss": -10.436712265014648, "global_step": 178935, "epoch": 1065} {"train_loss": -10.647367477416992, "global_step": 178936, "epoch": 1065} {"train_loss": -10.554377555847168, "global_step": 178937, "epoch": 1065} {"train_loss": -9.58233642578125, "global_step": 178938, "epoch": 1065} {"train_loss": -10.396893501281738, "global_step": 178939, "epoch": 1065} {"train_loss": -10.990984916687012, "global_step": 178940, "epoch": 1065} {"train_loss": -10.457662582397461, "global_step": 178941, "epoch": 1065} {"train_loss": -10.779712677001953, "global_step": 178942, "epoch": 1065} {"train_loss": -10.493480682373047, "global_step": 178943, "epoch": 1065} {"train_loss": -9.826711654663086, "global_step": 178944, "epoch": 1065} {"train_loss": -11.230154037475586, "global_step": 178945, "epoch": 1065} {"train_loss": -9.99022102355957, "global_step": 178946, "epoch": 1065} {"train_loss": -10.634464263916016, "global_step": 178947, "epoch": 1065} {"train_loss": -10.386646270751953, "global_step": 178948, "epoch": 1065} {"train_loss": -10.46195125579834, "global_step": 178949, "epoch": 1065} {"train_loss": -11.023075103759766, "global_step": 178950, "epoch": 1065} {"train_loss": -10.296009063720703, "global_step": 178951, "epoch": 1065} {"train_loss": -10.137499809265137, "global_step": 178952, "epoch": 1065} {"train_loss": -10.860177993774414, "global_step": 178953, "epoch": 1065} {"train_loss": -10.353704452514648, "global_step": 178954, "epoch": 1065} {"train_loss": -10.449808120727539, "global_step": 178955, "epoch": 1065} {"train_loss": -10.88322639465332, "global_step": 178956, "epoch": 1065} {"train_loss": -10.530938148498535, "global_step": 178957, "epoch": 1065} {"train_loss": -10.932907104492188, "global_step": 178958, "epoch": 1065} {"train_loss": -10.633529663085938, "global_step": 178959, "epoch": 1065} {"train_loss": -10.64146614074707, "global_step": 178960, "epoch": 1065} {"train_loss": -11.071516990661621, "global_step": 178961, "epoch": 1065} {"train_loss": -10.598941802978516, "global_step": 178962, "epoch": 1065} {"train_loss": -10.763984680175781, "global_step": 178963, "epoch": 1065} {"train_loss": -10.842867851257324, "global_step": 178964, "epoch": 1065} {"train_loss": -10.902791023254395, "global_step": 178965, "epoch": 1065} {"train_loss": -10.857780456542969, "global_step": 178966, "epoch": 1065} {"train_loss": -11.067037582397461, "global_step": 178967, "epoch": 1065} {"train_loss": -10.70551872253418, "global_step": 178968, "epoch": 1065} {"train_loss": -10.838706970214844, "global_step": 178969, "epoch": 1065} {"train_loss": -10.85042953491211, "global_step": 178970, "epoch": 1065} {"train_loss": -10.93203353881836, "global_step": 178971, "epoch": 1065} {"train_loss": -10.780101776123047, "global_step": 178972, "epoch": 1065} {"train_loss": -11.012619018554688, "global_step": 178973, "epoch": 1065} {"train_loss": -10.68303108215332, "global_step": 178974, "epoch": 1065} {"train_loss": -11.126871109008789, "global_step": 178975, "epoch": 1065} {"train_loss": -11.173462867736816, "global_step": 178976, "epoch": 1065} {"train_loss": -11.244874954223633, "global_step": 178977, "epoch": 1065} {"train_loss": -11.187593460083008, "global_step": 178978, "epoch": 1065} {"train_loss": -11.090645790100098, "global_step": 178979, "epoch": 1065} {"train_loss": -10.941222190856934, "global_step": 178980, "epoch": 1065} {"train_loss": -11.0171537399292, "global_step": 178981, "epoch": 1065} {"train_loss": -11.083879470825195, "global_step": 178982, "epoch": 1065} {"train_loss": -11.215949058532715, "global_step": 178983, "epoch": 1065} {"train_loss": -11.320534706115723, "global_step": 178984, "epoch": 1065} {"train_loss": -11.048688888549805, "global_step": 178985, "epoch": 1065} {"train_loss": -11.213882446289062, "global_step": 178986, "epoch": 1065} {"train_loss": -11.192373275756836, "global_step": 178987, "epoch": 1065} {"train_loss": -11.491894721984863, "global_step": 178988, "epoch": 1065} {"train_loss": -11.063526153564453, "global_step": 178989, "epoch": 1065} {"train_loss": -11.27020263671875, "global_step": 178990, "epoch": 1065} {"train_loss": -10.882732391357422, "global_step": 178991, "epoch": 1065} {"train_loss": -10.91364860534668, "global_step": 178992, "epoch": 1065} {"train_loss": -11.004480361938477, "global_step": 178993, "epoch": 1065} {"train_loss": -10.835082054138184, "global_step": 178994, "epoch": 1065} {"train_loss": -10.650482177734375, "global_step": 178995, "epoch": 1065} {"train_loss": -11.094437599182129, "global_step": 178996, "epoch": 1065} {"train_loss": -10.658111572265625, "global_step": 178997, "epoch": 1065} {"train_loss": -10.742528915405273, "global_step": 178998, "epoch": 1065} {"train_loss": -10.09136962890625, "global_step": 178999, "epoch": 1065} {"train_loss": -10.96045207977295, "global_step": 179000, "epoch": 1065} {"train_loss": -10.85926342010498, "global_step": 179001, "epoch": 1065} {"train_loss": -10.909421920776367, "global_step": 179002, "epoch": 1065} {"train_loss": -10.713434219360352, "global_step": 179003, "epoch": 1065} {"train_loss": -10.528112411499023, "global_step": 179004, "epoch": 1065} {"train_loss": -10.974434852600098, "global_step": 179005, "epoch": 1065} {"train_loss": -10.442020416259766, "global_step": 179006, "epoch": 1065} {"train_loss": -11.372430801391602, "global_step": 179007, "epoch": 1065} {"train_loss": -10.503510475158691, "global_step": 179008, "epoch": 1065} {"train_loss": -11.187705993652344, "global_step": 179009, "epoch": 1065} {"train_loss": -10.891609191894531, "global_step": 179010, "epoch": 1065} {"train_loss": -10.911849975585938, "global_step": 179011, "epoch": 1065} {"train_loss": -11.017112731933594, "global_step": 179012, "epoch": 1065} {"train_loss": -10.860940933227539, "global_step": 179013, "epoch": 1065} {"train_loss": -11.32046890258789, "global_step": 179014, "epoch": 1065} {"train_loss": -11.299006462097168, "global_step": 179015, "epoch": 1065} {"train_loss": -11.193277359008789, "global_step": 179016, "epoch": 1065} {"train_loss": -11.212082862854004, "global_step": 179017, "epoch": 1065} {"train_loss": -11.150026321411133, "global_step": 179018, "epoch": 1065} {"train_loss": -11.20553207397461, "global_step": 179019, "epoch": 1065} {"train_loss": -11.145284652709961, "global_step": 179020, "epoch": 1065} {"train_loss": -11.11720085144043, "global_step": 179021, "epoch": 1065} {"train_loss": -11.108940124511719, "global_step": 179022, "epoch": 1065} {"train_loss": -11.45128059387207, "global_step": 179023, "epoch": 1065} {"train_loss": -11.219255447387695, "global_step": 179024, "epoch": 1065} {"train_loss": -11.249430656433105, "global_step": 179025, "epoch": 1065} {"train_loss": -11.436140060424805, "global_step": 179026, "epoch": 1065} {"train_loss": -10.93924331665039, "global_step": 179027, "epoch": 1065} {"train_loss": -11.170381546020508, "global_step": 179028, "epoch": 1065} {"train_loss": -11.37076187133789, "global_step": 179029, "epoch": 1065} {"train_loss": -11.06259822845459, "global_step": 179030, "epoch": 1065} {"train_loss": -11.05010986328125, "global_step": 179031, "epoch": 1065} {"train_loss": -11.284563064575195, "global_step": 179032, "epoch": 1065} {"train_loss": -11.180930137634277, "global_step": 179033, "epoch": 1065} {"train_loss": -11.167490005493164, "global_step": 179034, "epoch": 1065} {"train_loss": -11.358879089355469, "global_step": 179035, "epoch": 1065} {"train_loss": -11.219510078430176, "global_step": 179036, "epoch": 1065} {"train_loss": -11.536731719970703, "global_step": 179037, "epoch": 1065} {"train_loss": -11.273713111877441, "global_step": 179038, "epoch": 1065} {"train_loss": -11.325126647949219, "global_step": 179039, "epoch": 1065} {"train_loss": -11.278434753417969, "global_step": 179040, "epoch": 1065} {"train_loss": -11.510198593139648, "global_step": 179041, "epoch": 1065} {"train_loss": -11.502832412719727, "global_step": 179042, "epoch": 1065} {"train_loss": -11.32841968536377, "global_step": 179043, "epoch": 1065} {"train_loss": -11.171991348266602, "global_step": 179044, "epoch": 1065} {"train_loss": -11.04904556274414, "global_step": 179045, "epoch": 1065} {"train_loss": -11.042179107666016, "global_step": 179046, "epoch": 1065} {"train_loss": -10.685922622680664, "global_step": 179047, "epoch": 1065} {"train_loss": -11.46082592010498, "global_step": 179048, "epoch": 1065} {"train_loss": -10.539769172668457, "global_step": 179049, "epoch": 1065} {"train_loss": -11.173295021057129, "global_step": 179050, "epoch": 1065} {"train_loss": -11.161483764648438, "global_step": 179051, "epoch": 1065} {"train_loss": -11.123844146728516, "global_step": 179052, "epoch": 1065} {"train_loss": -10.282125473022461, "global_step": 179053, "epoch": 1065} {"train_loss": -10.9111967086792, "global_step": 179054, "epoch": 1065} {"train_loss": -11.180509567260742, "global_step": 179055, "epoch": 1065} {"train_loss": -10.108325958251953, "global_step": 179056, "epoch": 1065} {"train_loss": -11.351395606994629, "global_step": 179057, "epoch": 1065} {"train_loss": -9.716346740722656, "global_step": 179058, "epoch": 1065} {"train_loss": -10.905431747436523, "global_step": 179059, "epoch": 1065} {"train_loss": -9.982339859008789, "global_step": 179060, "epoch": 1065} {"train_loss": -10.559442520141602, "global_step": 179061, "epoch": 1065} {"train_loss": -11.114279747009277, "global_step": 179062, "epoch": 1065} {"train_loss": -10.248970031738281, "global_step": 179063, "epoch": 1065} {"train_loss": -10.856352806091309, "global_step": 179064, "epoch": 1065} {"train_loss": -10.295686721801758, "global_step": 179065, "epoch": 1065} {"train_loss": -9.858785629272461, "global_step": 179066, "epoch": 1065} {"train_loss": -10.893497467041016, "global_step": 179067, "epoch": 1065} {"train_loss": -10.630180358886719, "global_step": 179068, "epoch": 1065} {"train_loss": -10.744208335876465, "global_step": 179069, "epoch": 1065} {"train_loss": -10.373091697692871, "global_step": 179070, "epoch": 1065} {"train_loss": -10.898212432861328, "global_step": 179071, "epoch": 1065} {"train_loss": -11.036706924438477, "global_step": 179072, "epoch": 1065} {"train_loss": -10.562422752380371, "global_step": 179073, "epoch": 1065} {"train_loss": -10.63974380493164, "global_step": 179074, "epoch": 1065} {"train_loss": -10.839515686035156, "global_step": 179075, "epoch": 1065} {"train_loss": -10.544109344482422, "global_step": 179076, "epoch": 1065} {"train_loss": -10.646306991577148, "global_step": 179077, "epoch": 1065} {"train_loss": -10.27574348449707, "global_step": 179078, "epoch": 1065} {"train_loss": -10.661542892456055, "global_step": 179079, "epoch": 1065} {"train_loss": -10.704256057739258, "global_step": 179080, "epoch": 1065} {"train_loss": -10.379037857055664, "global_step": 179081, "epoch": 1065} {"train_loss": -11.022165298461914, "global_step": 179082, "epoch": 1065} {"train_loss": -10.412858009338379, "global_step": 179083, "epoch": 1065} {"train_loss": -10.624738693237305, "global_step": 179084, "epoch": 1065} {"train_loss": -10.857149124145508, "global_step": 179085, "epoch": 1065} {"train_loss": -10.579748153686523, "global_step": 179086, "epoch": 1065} {"train_loss": -10.877530058224997, "global_step": 179087, "epoch": 1065, "val_loss": 242262.34375, "train_action_mse_error": 0.7747131586074829} {"train_loss": -11.196917533874512, "global_step": 179088, "epoch": 1066} {"train_loss": -10.88037109375, "global_step": 179089, "epoch": 1066} {"train_loss": -11.002487182617188, "global_step": 179090, "epoch": 1066} {"train_loss": -11.180936813354492, "global_step": 179091, "epoch": 1066} {"train_loss": -10.70890998840332, "global_step": 179092, "epoch": 1066} {"train_loss": -11.164565086364746, "global_step": 179093, "epoch": 1066} {"train_loss": -11.066123962402344, "global_step": 179094, "epoch": 1066} {"train_loss": -11.070891380310059, "global_step": 179095, "epoch": 1066} {"train_loss": -11.092693328857422, "global_step": 179096, "epoch": 1066} {"train_loss": -11.136205673217773, "global_step": 179097, "epoch": 1066} {"train_loss": -11.026308059692383, "global_step": 179098, "epoch": 1066} {"train_loss": -10.99708080291748, "global_step": 179099, "epoch": 1066} {"train_loss": -10.664400100708008, "global_step": 179100, "epoch": 1066} {"train_loss": -11.029741287231445, "global_step": 179101, "epoch": 1066} {"train_loss": -11.174442291259766, "global_step": 179102, "epoch": 1066} {"train_loss": -11.143394470214844, "global_step": 179103, "epoch": 1066} {"train_loss": -11.018770217895508, "global_step": 179104, "epoch": 1066} {"train_loss": -11.402961730957031, "global_step": 179105, "epoch": 1066} {"train_loss": -11.247428894042969, "global_step": 179106, "epoch": 1066} {"train_loss": -11.393953323364258, "global_step": 179107, "epoch": 1066} {"train_loss": -11.079286575317383, "global_step": 179108, "epoch": 1066} {"train_loss": -11.472892761230469, "global_step": 179109, "epoch": 1066} {"train_loss": -11.186554908752441, "global_step": 179110, "epoch": 1066} {"train_loss": -11.347014427185059, "global_step": 179111, "epoch": 1066} {"train_loss": -11.11198616027832, "global_step": 179112, "epoch": 1066} {"train_loss": -11.225536346435547, "global_step": 179113, "epoch": 1066} {"train_loss": -11.02963638305664, "global_step": 179114, "epoch": 1066} {"train_loss": -11.395959854125977, "global_step": 179115, "epoch": 1066} {"train_loss": -11.060159683227539, "global_step": 179116, "epoch": 1066} {"train_loss": -11.470504760742188, "global_step": 179117, "epoch": 1066} {"train_loss": -11.35196590423584, "global_step": 179118, "epoch": 1066} {"train_loss": -11.181390762329102, "global_step": 179119, "epoch": 1066} {"train_loss": -11.15019416809082, "global_step": 179120, "epoch": 1066} {"train_loss": -11.256464004516602, "global_step": 179121, "epoch": 1066} {"train_loss": -11.38251781463623, "global_step": 179122, "epoch": 1066} {"train_loss": -11.211238861083984, "global_step": 179123, "epoch": 1066} {"train_loss": -11.61181926727295, "global_step": 179124, "epoch": 1066} {"train_loss": -11.377628326416016, "global_step": 179125, "epoch": 1066} {"train_loss": -11.068868637084961, "global_step": 179126, "epoch": 1066} {"train_loss": -11.316178321838379, "global_step": 179127, "epoch": 1066} {"train_loss": -11.501444816589355, "global_step": 179128, "epoch": 1066} {"train_loss": -11.018067359924316, "global_step": 179129, "epoch": 1066} {"train_loss": -11.707125663757324, "global_step": 179130, "epoch": 1066} {"train_loss": -11.130664825439453, "global_step": 179131, "epoch": 1066} {"train_loss": -11.318635940551758, "global_step": 179132, "epoch": 1066} {"train_loss": -11.421088218688965, "global_step": 179133, "epoch": 1066} {"train_loss": -11.389179229736328, "global_step": 179134, "epoch": 1066} {"train_loss": -11.706947326660156, "global_step": 179135, "epoch": 1066} {"train_loss": -11.343472480773926, "global_step": 179136, "epoch": 1066} {"train_loss": -11.522860527038574, "global_step": 179137, "epoch": 1066} {"train_loss": -11.587235450744629, "global_step": 179138, "epoch": 1066} {"train_loss": -11.310787200927734, "global_step": 179139, "epoch": 1066} {"train_loss": -11.685225486755371, "global_step": 179140, "epoch": 1066} {"train_loss": -11.620986938476562, "global_step": 179141, "epoch": 1066} {"train_loss": -11.58881950378418, "global_step": 179142, "epoch": 1066} {"train_loss": -11.47385025024414, "global_step": 179143, "epoch": 1066} {"train_loss": -11.574861526489258, "global_step": 179144, "epoch": 1066} {"train_loss": -11.275635719299316, "global_step": 179145, "epoch": 1066} {"train_loss": -11.29902458190918, "global_step": 179146, "epoch": 1066} {"train_loss": -11.438343048095703, "global_step": 179147, "epoch": 1066} {"train_loss": -11.061595916748047, "global_step": 179148, "epoch": 1066} {"train_loss": -10.323355674743652, "global_step": 179149, "epoch": 1066} {"train_loss": -10.129446983337402, "global_step": 179150, "epoch": 1066} {"train_loss": -10.631412506103516, "global_step": 179151, "epoch": 1066} {"train_loss": -9.830954551696777, "global_step": 179152, "epoch": 1066} {"train_loss": -10.718368530273438, "global_step": 179153, "epoch": 1066} {"train_loss": -9.841894149780273, "global_step": 179154, "epoch": 1066} {"train_loss": -10.409384727478027, "global_step": 179155, "epoch": 1066} {"train_loss": -9.323817253112793, "global_step": 179156, "epoch": 1066} {"train_loss": -7.816530704498291, "global_step": 179157, "epoch": 1066} {"train_loss": -8.959602355957031, "global_step": 179158, "epoch": 1066} {"train_loss": -8.269320487976074, "global_step": 179159, "epoch": 1066} {"train_loss": -9.56871509552002, "global_step": 179160, "epoch": 1066} {"train_loss": -8.984870910644531, "global_step": 179161, "epoch": 1066} {"train_loss": -10.519425392150879, "global_step": 179162, "epoch": 1066} {"train_loss": -9.660460472106934, "global_step": 179163, "epoch": 1066} {"train_loss": -11.011775970458984, "global_step": 179164, "epoch": 1066} {"train_loss": -9.995771408081055, "global_step": 179165, "epoch": 1066} {"train_loss": -10.336814880371094, "global_step": 179166, "epoch": 1066} {"train_loss": -10.774827003479004, "global_step": 179167, "epoch": 1066} {"train_loss": -10.439436912536621, "global_step": 179168, "epoch": 1066} {"train_loss": -10.616312026977539, "global_step": 179169, "epoch": 1066} {"train_loss": -10.152389526367188, "global_step": 179170, "epoch": 1066} {"train_loss": -10.648405075073242, "global_step": 179171, "epoch": 1066} {"train_loss": -10.88807487487793, "global_step": 179172, "epoch": 1066} {"train_loss": -10.465021133422852, "global_step": 179173, "epoch": 1066} {"train_loss": -10.850093841552734, "global_step": 179174, "epoch": 1066} {"train_loss": -10.734442710876465, "global_step": 179175, "epoch": 1066} {"train_loss": -10.622541427612305, "global_step": 179176, "epoch": 1066} {"train_loss": -10.798463821411133, "global_step": 179177, "epoch": 1066} {"train_loss": -10.715435028076172, "global_step": 179178, "epoch": 1066} {"train_loss": -10.910218238830566, "global_step": 179179, "epoch": 1066} {"train_loss": -10.886722564697266, "global_step": 179180, "epoch": 1066} {"train_loss": -10.829298973083496, "global_step": 179181, "epoch": 1066} {"train_loss": -10.856130599975586, "global_step": 179182, "epoch": 1066} {"train_loss": -11.121444702148438, "global_step": 179183, "epoch": 1066} {"train_loss": -10.673768043518066, "global_step": 179184, "epoch": 1066} {"train_loss": -10.954166412353516, "global_step": 179185, "epoch": 1066} {"train_loss": -10.980206489562988, "global_step": 179186, "epoch": 1066} {"train_loss": -10.715110778808594, "global_step": 179187, "epoch": 1066} {"train_loss": -10.96394157409668, "global_step": 179188, "epoch": 1066} {"train_loss": -10.836533546447754, "global_step": 179189, "epoch": 1066} {"train_loss": -10.808646202087402, "global_step": 179190, "epoch": 1066} {"train_loss": -11.1117525100708, "global_step": 179191, "epoch": 1066} {"train_loss": -10.981565475463867, "global_step": 179192, "epoch": 1066} {"train_loss": -10.980391502380371, "global_step": 179193, "epoch": 1066} {"train_loss": -10.935844421386719, "global_step": 179194, "epoch": 1066} {"train_loss": -11.061885833740234, "global_step": 179195, "epoch": 1066} {"train_loss": -11.131933212280273, "global_step": 179196, "epoch": 1066} {"train_loss": -11.242156028747559, "global_step": 179197, "epoch": 1066} {"train_loss": -11.179656982421875, "global_step": 179198, "epoch": 1066} {"train_loss": -11.03665542602539, "global_step": 179199, "epoch": 1066} {"train_loss": -11.174285888671875, "global_step": 179200, "epoch": 1066} {"train_loss": -11.061798095703125, "global_step": 179201, "epoch": 1066} {"train_loss": -11.178393363952637, "global_step": 179202, "epoch": 1066} {"train_loss": -11.098695755004883, "global_step": 179203, "epoch": 1066} {"train_loss": -10.925594329833984, "global_step": 179204, "epoch": 1066} {"train_loss": -11.142389297485352, "global_step": 179205, "epoch": 1066} {"train_loss": -11.319829940795898, "global_step": 179206, "epoch": 1066} {"train_loss": -11.281789779663086, "global_step": 179207, "epoch": 1066} {"train_loss": -11.390947341918945, "global_step": 179208, "epoch": 1066} {"train_loss": -11.329923629760742, "global_step": 179209, "epoch": 1066} {"train_loss": -11.469305038452148, "global_step": 179210, "epoch": 1066} {"train_loss": -11.26302433013916, "global_step": 179211, "epoch": 1066} {"train_loss": -11.287925720214844, "global_step": 179212, "epoch": 1066} {"train_loss": -11.450185775756836, "global_step": 179213, "epoch": 1066} {"train_loss": -11.241552352905273, "global_step": 179214, "epoch": 1066} {"train_loss": -11.129167556762695, "global_step": 179215, "epoch": 1066} {"train_loss": -11.302871704101562, "global_step": 179216, "epoch": 1066} {"train_loss": -11.36552619934082, "global_step": 179217, "epoch": 1066} {"train_loss": -11.611977577209473, "global_step": 179218, "epoch": 1066} {"train_loss": -11.230628967285156, "global_step": 179219, "epoch": 1066} {"train_loss": -11.456684112548828, "global_step": 179220, "epoch": 1066} {"train_loss": -11.276620864868164, "global_step": 179221, "epoch": 1066} {"train_loss": -11.435131072998047, "global_step": 179222, "epoch": 1066} {"train_loss": -11.513521194458008, "global_step": 179223, "epoch": 1066} {"train_loss": -11.62358283996582, "global_step": 179224, "epoch": 1066} {"train_loss": -11.388162612915039, "global_step": 179225, "epoch": 1066} {"train_loss": -11.606250762939453, "global_step": 179226, "epoch": 1066} {"train_loss": -11.141020774841309, "global_step": 179227, "epoch": 1066} {"train_loss": -11.468040466308594, "global_step": 179228, "epoch": 1066} {"train_loss": -11.549243927001953, "global_step": 179229, "epoch": 1066} {"train_loss": -11.309532165527344, "global_step": 179230, "epoch": 1066} {"train_loss": -11.617330551147461, "global_step": 179231, "epoch": 1066} {"train_loss": -11.098392486572266, "global_step": 179232, "epoch": 1066} {"train_loss": -11.07726764678955, "global_step": 179233, "epoch": 1066} {"train_loss": -11.474932670593262, "global_step": 179234, "epoch": 1066} {"train_loss": -10.526244163513184, "global_step": 179235, "epoch": 1066} {"train_loss": -10.856888771057129, "global_step": 179236, "epoch": 1066} {"train_loss": -11.25656509399414, "global_step": 179237, "epoch": 1066} {"train_loss": -11.136743545532227, "global_step": 179238, "epoch": 1066} {"train_loss": -10.419891357421875, "global_step": 179239, "epoch": 1066} {"train_loss": -10.895406723022461, "global_step": 179240, "epoch": 1066} {"train_loss": -11.473065376281738, "global_step": 179241, "epoch": 1066} {"train_loss": -10.896913528442383, "global_step": 179242, "epoch": 1066} {"train_loss": -11.056421279907227, "global_step": 179243, "epoch": 1066} {"train_loss": -11.039112091064453, "global_step": 179244, "epoch": 1066} {"train_loss": -10.581567764282227, "global_step": 179245, "epoch": 1066} {"train_loss": -11.108772277832031, "global_step": 179246, "epoch": 1066} {"train_loss": -11.155268669128418, "global_step": 179247, "epoch": 1066} {"train_loss": -11.058889389038086, "global_step": 179248, "epoch": 1066} {"train_loss": -11.551326751708984, "global_step": 179249, "epoch": 1066} {"train_loss": -11.132816314697266, "global_step": 179250, "epoch": 1066} {"train_loss": -11.461687088012695, "global_step": 179251, "epoch": 1066} {"train_loss": -11.130437850952148, "global_step": 179252, "epoch": 1066} {"train_loss": -11.172148704528809, "global_step": 179253, "epoch": 1066} {"train_loss": -10.997659683227539, "global_step": 179254, "epoch": 1066} {"train_loss": -11.008284452415648, "global_step": 179255, "epoch": 1066, "val_loss": 245311.9375} {"train_loss": -11.443178176879883, "global_step": 179256, "epoch": 1067} {"train_loss": -11.038168907165527, "global_step": 179257, "epoch": 1067} {"train_loss": -11.47899055480957, "global_step": 179258, "epoch": 1067} {"train_loss": -11.209108352661133, "global_step": 179259, "epoch": 1067} {"train_loss": -10.634730339050293, "global_step": 179260, "epoch": 1067} {"train_loss": -11.249540328979492, "global_step": 179261, "epoch": 1067} {"train_loss": -11.365438461303711, "global_step": 179262, "epoch": 1067} {"train_loss": -11.176309585571289, "global_step": 179263, "epoch": 1067} {"train_loss": -11.07590389251709, "global_step": 179264, "epoch": 1067} {"train_loss": -11.222015380859375, "global_step": 179265, "epoch": 1067} {"train_loss": -10.905929565429688, "global_step": 179266, "epoch": 1067} {"train_loss": -11.04887580871582, "global_step": 179267, "epoch": 1067} {"train_loss": -11.074217796325684, "global_step": 179268, "epoch": 1067} {"train_loss": -11.33798885345459, "global_step": 179269, "epoch": 1067} {"train_loss": -10.824928283691406, "global_step": 179270, "epoch": 1067} {"train_loss": -10.784736633300781, "global_step": 179271, "epoch": 1067} {"train_loss": -10.818672180175781, "global_step": 179272, "epoch": 1067} {"train_loss": -10.859240531921387, "global_step": 179273, "epoch": 1067} {"train_loss": -11.013833999633789, "global_step": 179274, "epoch": 1067} {"train_loss": -10.53158950805664, "global_step": 179275, "epoch": 1067} {"train_loss": -11.267045974731445, "global_step": 179276, "epoch": 1067} {"train_loss": -11.117111206054688, "global_step": 179277, "epoch": 1067} {"train_loss": -10.373495101928711, "global_step": 179278, "epoch": 1067} {"train_loss": -11.480179786682129, "global_step": 179279, "epoch": 1067} {"train_loss": -10.63821029663086, "global_step": 179280, "epoch": 1067} {"train_loss": -11.209238052368164, "global_step": 179281, "epoch": 1067} {"train_loss": -10.998540878295898, "global_step": 179282, "epoch": 1067} {"train_loss": -10.485132217407227, "global_step": 179283, "epoch": 1067} {"train_loss": -11.152231216430664, "global_step": 179284, "epoch": 1067} {"train_loss": -10.60012435913086, "global_step": 179285, "epoch": 1067} {"train_loss": -10.880494117736816, "global_step": 179286, "epoch": 1067} {"train_loss": -10.726670265197754, "global_step": 179287, "epoch": 1067} {"train_loss": -10.873394012451172, "global_step": 179288, "epoch": 1067} {"train_loss": -11.068968772888184, "global_step": 179289, "epoch": 1067} {"train_loss": -11.014512062072754, "global_step": 179290, "epoch": 1067} {"train_loss": -11.41356372833252, "global_step": 179291, "epoch": 1067} {"train_loss": -11.039714813232422, "global_step": 179292, "epoch": 1067} {"train_loss": -11.367785453796387, "global_step": 179293, "epoch": 1067} {"train_loss": -11.032609939575195, "global_step": 179294, "epoch": 1067} {"train_loss": -10.946980476379395, "global_step": 179295, "epoch": 1067} {"train_loss": -11.170465469360352, "global_step": 179296, "epoch": 1067} {"train_loss": -11.098312377929688, "global_step": 179297, "epoch": 1067} {"train_loss": -11.303827285766602, "global_step": 179298, "epoch": 1067} {"train_loss": -11.203179359436035, "global_step": 179299, "epoch": 1067} {"train_loss": -11.413564682006836, "global_step": 179300, "epoch": 1067} {"train_loss": -11.093795776367188, "global_step": 179301, "epoch": 1067} {"train_loss": -10.805599212646484, "global_step": 179302, "epoch": 1067} {"train_loss": -11.108125686645508, "global_step": 179303, "epoch": 1067} {"train_loss": -11.225266456604004, "global_step": 179304, "epoch": 1067} {"train_loss": -11.048959732055664, "global_step": 179305, "epoch": 1067} {"train_loss": -11.062332153320312, "global_step": 179306, "epoch": 1067} {"train_loss": -11.176734924316406, "global_step": 179307, "epoch": 1067} {"train_loss": -10.801515579223633, "global_step": 179308, "epoch": 1067} {"train_loss": -11.096691131591797, "global_step": 179309, "epoch": 1067} {"train_loss": -11.193016052246094, "global_step": 179310, "epoch": 1067} {"train_loss": -11.223043441772461, "global_step": 179311, "epoch": 1067} {"train_loss": -11.352283477783203, "global_step": 179312, "epoch": 1067} {"train_loss": -11.294892311096191, "global_step": 179313, "epoch": 1067} {"train_loss": -11.080938339233398, "global_step": 179314, "epoch": 1067} {"train_loss": -11.229118347167969, "global_step": 179315, "epoch": 1067} {"train_loss": -11.147943496704102, "global_step": 179316, "epoch": 1067} {"train_loss": -11.249947547912598, "global_step": 179317, "epoch": 1067} {"train_loss": -11.329719543457031, "global_step": 179318, "epoch": 1067} {"train_loss": -11.207551956176758, "global_step": 179319, "epoch": 1067} {"train_loss": -11.311525344848633, "global_step": 179320, "epoch": 1067} {"train_loss": -11.021551132202148, "global_step": 179321, "epoch": 1067} {"train_loss": -10.92041015625, "global_step": 179322, "epoch": 1067} {"train_loss": -11.341201782226562, "global_step": 179323, "epoch": 1067} {"train_loss": -11.1561279296875, "global_step": 179324, "epoch": 1067} {"train_loss": -10.524591445922852, "global_step": 179325, "epoch": 1067} {"train_loss": -11.455902099609375, "global_step": 179326, "epoch": 1067} {"train_loss": -11.350111961364746, "global_step": 179327, "epoch": 1067} {"train_loss": -11.299339294433594, "global_step": 179328, "epoch": 1067} {"train_loss": -11.388980865478516, "global_step": 179329, "epoch": 1067} {"train_loss": -11.442813873291016, "global_step": 179330, "epoch": 1067} {"train_loss": -11.556018829345703, "global_step": 179331, "epoch": 1067} {"train_loss": -11.423665046691895, "global_step": 179332, "epoch": 1067} {"train_loss": -11.343198776245117, "global_step": 179333, "epoch": 1067} {"train_loss": -11.382410049438477, "global_step": 179334, "epoch": 1067} {"train_loss": -11.517412185668945, "global_step": 179335, "epoch": 1067} {"train_loss": -11.126117706298828, "global_step": 179336, "epoch": 1067} {"train_loss": -11.608601570129395, "global_step": 179337, "epoch": 1067} {"train_loss": -11.339027404785156, "global_step": 179338, "epoch": 1067} {"train_loss": -11.119817733764648, "global_step": 179339, "epoch": 1067} {"train_loss": -11.040559768676758, "global_step": 179340, "epoch": 1067} {"train_loss": -11.22691535949707, "global_step": 179341, "epoch": 1067} {"train_loss": -10.96324634552002, "global_step": 179342, "epoch": 1067} {"train_loss": -11.174398422241211, "global_step": 179343, "epoch": 1067} {"train_loss": -11.343622207641602, "global_step": 179344, "epoch": 1067} {"train_loss": -11.520082473754883, "global_step": 179345, "epoch": 1067} {"train_loss": -11.471511840820312, "global_step": 179346, "epoch": 1067} {"train_loss": -11.530539512634277, "global_step": 179347, "epoch": 1067} {"train_loss": -11.236227035522461, "global_step": 179348, "epoch": 1067} {"train_loss": -11.33492660522461, "global_step": 179349, "epoch": 1067} {"train_loss": -11.150467872619629, "global_step": 179350, "epoch": 1067} {"train_loss": -11.530035018920898, "global_step": 179351, "epoch": 1067} {"train_loss": -11.401605606079102, "global_step": 179352, "epoch": 1067} {"train_loss": -11.57558536529541, "global_step": 179353, "epoch": 1067} {"train_loss": -11.255953788757324, "global_step": 179354, "epoch": 1067} {"train_loss": -11.121689796447754, "global_step": 179355, "epoch": 1067} {"train_loss": -11.340279579162598, "global_step": 179356, "epoch": 1067} {"train_loss": -11.257394790649414, "global_step": 179357, "epoch": 1067} {"train_loss": -11.517534255981445, "global_step": 179358, "epoch": 1067} {"train_loss": -11.30991268157959, "global_step": 179359, "epoch": 1067} {"train_loss": -11.49907112121582, "global_step": 179360, "epoch": 1067} {"train_loss": -11.27601432800293, "global_step": 179361, "epoch": 1067} {"train_loss": -11.165385246276855, "global_step": 179362, "epoch": 1067} {"train_loss": -11.699929237365723, "global_step": 179363, "epoch": 1067} {"train_loss": -11.377924919128418, "global_step": 179364, "epoch": 1067} {"train_loss": -11.156572341918945, "global_step": 179365, "epoch": 1067} {"train_loss": -11.46379566192627, "global_step": 179366, "epoch": 1067} {"train_loss": -11.020421981811523, "global_step": 179367, "epoch": 1067} {"train_loss": -11.164026260375977, "global_step": 179368, "epoch": 1067} {"train_loss": -11.388982772827148, "global_step": 179369, "epoch": 1067} {"train_loss": -11.474992752075195, "global_step": 179370, "epoch": 1067} {"train_loss": -10.68547248840332, "global_step": 179371, "epoch": 1067} {"train_loss": -9.707619667053223, "global_step": 179372, "epoch": 1067} {"train_loss": -10.541622161865234, "global_step": 179373, "epoch": 1067} {"train_loss": -10.698637008666992, "global_step": 179374, "epoch": 1067} {"train_loss": -9.155797004699707, "global_step": 179375, "epoch": 1067} {"train_loss": -10.649321556091309, "global_step": 179376, "epoch": 1067} {"train_loss": -9.739623069763184, "global_step": 179377, "epoch": 1067} {"train_loss": -10.148490905761719, "global_step": 179378, "epoch": 1067} {"train_loss": -10.405176162719727, "global_step": 179379, "epoch": 1067} {"train_loss": -10.019951820373535, "global_step": 179380, "epoch": 1067} {"train_loss": -10.97637939453125, "global_step": 179381, "epoch": 1067} {"train_loss": -10.553644180297852, "global_step": 179382, "epoch": 1067} {"train_loss": -10.956098556518555, "global_step": 179383, "epoch": 1067} {"train_loss": -10.743934631347656, "global_step": 179384, "epoch": 1067} {"train_loss": -10.70516586303711, "global_step": 179385, "epoch": 1067} {"train_loss": -11.057415008544922, "global_step": 179386, "epoch": 1067} {"train_loss": -10.617925643920898, "global_step": 179387, "epoch": 1067} {"train_loss": -10.849651336669922, "global_step": 179388, "epoch": 1067} {"train_loss": -10.89631462097168, "global_step": 179389, "epoch": 1067} {"train_loss": -10.931412696838379, "global_step": 179390, "epoch": 1067} {"train_loss": -11.063705444335938, "global_step": 179391, "epoch": 1067} {"train_loss": -10.623319625854492, "global_step": 179392, "epoch": 1067} {"train_loss": -10.908127784729004, "global_step": 179393, "epoch": 1067} {"train_loss": -10.039192199707031, "global_step": 179394, "epoch": 1067} {"train_loss": -10.76229476928711, "global_step": 179395, "epoch": 1067} {"train_loss": -10.821794509887695, "global_step": 179396, "epoch": 1067} {"train_loss": -10.99891471862793, "global_step": 179397, "epoch": 1067} {"train_loss": -10.717927932739258, "global_step": 179398, "epoch": 1067} {"train_loss": -10.59774398803711, "global_step": 179399, "epoch": 1067} {"train_loss": -10.659576416015625, "global_step": 179400, "epoch": 1067} {"train_loss": -9.861261367797852, "global_step": 179401, "epoch": 1067} {"train_loss": -10.950973510742188, "global_step": 179402, "epoch": 1067} {"train_loss": -9.5408935546875, "global_step": 179403, "epoch": 1067} {"train_loss": -10.701562881469727, "global_step": 179404, "epoch": 1067} {"train_loss": -10.107357025146484, "global_step": 179405, "epoch": 1067} {"train_loss": -10.707255363464355, "global_step": 179406, "epoch": 1067} {"train_loss": -10.466520309448242, "global_step": 179407, "epoch": 1067} {"train_loss": -10.77373218536377, "global_step": 179408, "epoch": 1067} {"train_loss": -10.521543502807617, "global_step": 179409, "epoch": 1067} {"train_loss": -10.395647048950195, "global_step": 179410, "epoch": 1067} {"train_loss": -10.279196739196777, "global_step": 179411, "epoch": 1067} {"train_loss": -11.12656307220459, "global_step": 179412, "epoch": 1067} {"train_loss": -10.489654541015625, "global_step": 179413, "epoch": 1067} {"train_loss": -10.82802963256836, "global_step": 179414, "epoch": 1067} {"train_loss": -10.449953079223633, "global_step": 179415, "epoch": 1067} {"train_loss": -10.695647239685059, "global_step": 179416, "epoch": 1067} {"train_loss": -10.523384094238281, "global_step": 179417, "epoch": 1067} {"train_loss": -10.746646881103516, "global_step": 179418, "epoch": 1067} {"train_loss": -10.731830596923828, "global_step": 179419, "epoch": 1067} {"train_loss": -10.368717193603516, "global_step": 179420, "epoch": 1067} {"train_loss": -10.982800483703613, "global_step": 179421, "epoch": 1067} {"train_loss": -10.55813980102539, "global_step": 179422, "epoch": 1067} {"train_loss": -10.985114194097973, "global_step": 179423, "epoch": 1067, "val_loss": 246161.921875} {"train_loss": -10.9625244140625, "global_step": 179424, "epoch": 1068} {"train_loss": -11.067700386047363, "global_step": 179425, "epoch": 1068} {"train_loss": -10.610589981079102, "global_step": 179426, "epoch": 1068} {"train_loss": -11.015217781066895, "global_step": 179427, "epoch": 1068} {"train_loss": -10.819106101989746, "global_step": 179428, "epoch": 1068} {"train_loss": -11.101874351501465, "global_step": 179429, "epoch": 1068} {"train_loss": -10.890802383422852, "global_step": 179430, "epoch": 1068} {"train_loss": -11.207380294799805, "global_step": 179431, "epoch": 1068} {"train_loss": -10.869253158569336, "global_step": 179432, "epoch": 1068} {"train_loss": -10.942167282104492, "global_step": 179433, "epoch": 1068} {"train_loss": -11.121376037597656, "global_step": 179434, "epoch": 1068} {"train_loss": -11.092155456542969, "global_step": 179435, "epoch": 1068} {"train_loss": -11.23107624053955, "global_step": 179436, "epoch": 1068} {"train_loss": -11.116817474365234, "global_step": 179437, "epoch": 1068} {"train_loss": -11.019243240356445, "global_step": 179438, "epoch": 1068} {"train_loss": -11.034744262695312, "global_step": 179439, "epoch": 1068} {"train_loss": -11.093870162963867, "global_step": 179440, "epoch": 1068} {"train_loss": -11.131359100341797, "global_step": 179441, "epoch": 1068} {"train_loss": -11.258007049560547, "global_step": 179442, "epoch": 1068} {"train_loss": -11.088114738464355, "global_step": 179443, "epoch": 1068} {"train_loss": -11.396514892578125, "global_step": 179444, "epoch": 1068} {"train_loss": -11.339208602905273, "global_step": 179445, "epoch": 1068} {"train_loss": -11.255415916442871, "global_step": 179446, "epoch": 1068} {"train_loss": -11.270162582397461, "global_step": 179447, "epoch": 1068} {"train_loss": -11.051102638244629, "global_step": 179448, "epoch": 1068} {"train_loss": -11.278868675231934, "global_step": 179449, "epoch": 1068} {"train_loss": -11.151790618896484, "global_step": 179450, "epoch": 1068} {"train_loss": -11.495221138000488, "global_step": 179451, "epoch": 1068} {"train_loss": -11.575376510620117, "global_step": 179452, "epoch": 1068} {"train_loss": -11.381298065185547, "global_step": 179453, "epoch": 1068} {"train_loss": -11.359567642211914, "global_step": 179454, "epoch": 1068} {"train_loss": -11.354528427124023, "global_step": 179455, "epoch": 1068} {"train_loss": -11.360298156738281, "global_step": 179456, "epoch": 1068} {"train_loss": -11.611708641052246, "global_step": 179457, "epoch": 1068} {"train_loss": -11.70009994506836, "global_step": 179458, "epoch": 1068} {"train_loss": -11.453694343566895, "global_step": 179459, "epoch": 1068} {"train_loss": -11.481762886047363, "global_step": 179460, "epoch": 1068} {"train_loss": -11.429052352905273, "global_step": 179461, "epoch": 1068} {"train_loss": -11.590700149536133, "global_step": 179462, "epoch": 1068} {"train_loss": -11.378556251525879, "global_step": 179463, "epoch": 1068} {"train_loss": -11.670096397399902, "global_step": 179464, "epoch": 1068} {"train_loss": -11.381842613220215, "global_step": 179465, "epoch": 1068} {"train_loss": -11.712708473205566, "global_step": 179466, "epoch": 1068} {"train_loss": -11.563094139099121, "global_step": 179467, "epoch": 1068} {"train_loss": -11.727070808410645, "global_step": 179468, "epoch": 1068} {"train_loss": -11.609426498413086, "global_step": 179469, "epoch": 1068} {"train_loss": -11.734528541564941, "global_step": 179470, "epoch": 1068} {"train_loss": -11.595686912536621, "global_step": 179471, "epoch": 1068} {"train_loss": -11.384925842285156, "global_step": 179472, "epoch": 1068} {"train_loss": -11.704854965209961, "global_step": 179473, "epoch": 1068} {"train_loss": -11.620037078857422, "global_step": 179474, "epoch": 1068} {"train_loss": -11.36721420288086, "global_step": 179475, "epoch": 1068} {"train_loss": -11.638967514038086, "global_step": 179476, "epoch": 1068} {"train_loss": -11.530780792236328, "global_step": 179477, "epoch": 1068} {"train_loss": -11.077584266662598, "global_step": 179478, "epoch": 1068} {"train_loss": -10.265901565551758, "global_step": 179479, "epoch": 1068} {"train_loss": -10.913392066955566, "global_step": 179480, "epoch": 1068} {"train_loss": -11.16132926940918, "global_step": 179481, "epoch": 1068} {"train_loss": -11.130382537841797, "global_step": 179482, "epoch": 1068} {"train_loss": -10.434447288513184, "global_step": 179483, "epoch": 1068} {"train_loss": -8.958351135253906, "global_step": 179484, "epoch": 1068} {"train_loss": -11.02623176574707, "global_step": 179485, "epoch": 1068} {"train_loss": -9.66873836517334, "global_step": 179486, "epoch": 1068} {"train_loss": -8.640899658203125, "global_step": 179487, "epoch": 1068} {"train_loss": -9.048643112182617, "global_step": 179488, "epoch": 1068} {"train_loss": -9.16230583190918, "global_step": 179489, "epoch": 1068} {"train_loss": -10.870208740234375, "global_step": 179490, "epoch": 1068} {"train_loss": -8.519370079040527, "global_step": 179491, "epoch": 1068} {"train_loss": -9.358383178710938, "global_step": 179492, "epoch": 1068} {"train_loss": -8.879348754882812, "global_step": 179493, "epoch": 1068} {"train_loss": -10.056660652160645, "global_step": 179494, "epoch": 1068} {"train_loss": -8.762374877929688, "global_step": 179495, "epoch": 1068} {"train_loss": -9.721785545349121, "global_step": 179496, "epoch": 1068} {"train_loss": -9.641341209411621, "global_step": 179497, "epoch": 1068} {"train_loss": -10.0714111328125, "global_step": 179498, "epoch": 1068} {"train_loss": -10.287609100341797, "global_step": 179499, "epoch": 1068} {"train_loss": -10.081831932067871, "global_step": 179500, "epoch": 1068} {"train_loss": -9.552027702331543, "global_step": 179501, "epoch": 1068} {"train_loss": -10.645076751708984, "global_step": 179502, "epoch": 1068} {"train_loss": -10.263720512390137, "global_step": 179503, "epoch": 1068} {"train_loss": -9.757070541381836, "global_step": 179504, "epoch": 1068} {"train_loss": -10.501359939575195, "global_step": 179505, "epoch": 1068} {"train_loss": -10.42569351196289, "global_step": 179506, "epoch": 1068} {"train_loss": -10.29644775390625, "global_step": 179507, "epoch": 1068} {"train_loss": -10.547000885009766, "global_step": 179508, "epoch": 1068} {"train_loss": -10.673885345458984, "global_step": 179509, "epoch": 1068} {"train_loss": -10.509012222290039, "global_step": 179510, "epoch": 1068} {"train_loss": -10.54411792755127, "global_step": 179511, "epoch": 1068} {"train_loss": -10.23128604888916, "global_step": 179512, "epoch": 1068} {"train_loss": -10.431349754333496, "global_step": 179513, "epoch": 1068} {"train_loss": -10.914708137512207, "global_step": 179514, "epoch": 1068} {"train_loss": -10.795199394226074, "global_step": 179515, "epoch": 1068} {"train_loss": -10.53235912322998, "global_step": 179516, "epoch": 1068} {"train_loss": -10.83868408203125, "global_step": 179517, "epoch": 1068} {"train_loss": -10.972799301147461, "global_step": 179518, "epoch": 1068} {"train_loss": -10.673389434814453, "global_step": 179519, "epoch": 1068} {"train_loss": -10.741315841674805, "global_step": 179520, "epoch": 1068} {"train_loss": -10.794804573059082, "global_step": 179521, "epoch": 1068} {"train_loss": -10.572996139526367, "global_step": 179522, "epoch": 1068} {"train_loss": -10.883552551269531, "global_step": 179523, "epoch": 1068} {"train_loss": -10.79212474822998, "global_step": 179524, "epoch": 1068} {"train_loss": -10.831039428710938, "global_step": 179525, "epoch": 1068} {"train_loss": -10.927240371704102, "global_step": 179526, "epoch": 1068} {"train_loss": -11.094054222106934, "global_step": 179527, "epoch": 1068} {"train_loss": -11.063567161560059, "global_step": 179528, "epoch": 1068} {"train_loss": -11.054424285888672, "global_step": 179529, "epoch": 1068} {"train_loss": -11.145353317260742, "global_step": 179530, "epoch": 1068} {"train_loss": -11.097657203674316, "global_step": 179531, "epoch": 1068} {"train_loss": -11.142170906066895, "global_step": 179532, "epoch": 1068} {"train_loss": -10.890172958374023, "global_step": 179533, "epoch": 1068} {"train_loss": -10.849257469177246, "global_step": 179534, "epoch": 1068} {"train_loss": -11.156620025634766, "global_step": 179535, "epoch": 1068} {"train_loss": -11.14367961883545, "global_step": 179536, "epoch": 1068} {"train_loss": -11.227025985717773, "global_step": 179537, "epoch": 1068} {"train_loss": -11.287140846252441, "global_step": 179538, "epoch": 1068} {"train_loss": -11.265558242797852, "global_step": 179539, "epoch": 1068} {"train_loss": -11.223434448242188, "global_step": 179540, "epoch": 1068} {"train_loss": -11.401153564453125, "global_step": 179541, "epoch": 1068} {"train_loss": -11.206039428710938, "global_step": 179542, "epoch": 1068} {"train_loss": -11.199262619018555, "global_step": 179543, "epoch": 1068} {"train_loss": -11.266362190246582, "global_step": 179544, "epoch": 1068} {"train_loss": -10.994375228881836, "global_step": 179545, "epoch": 1068} {"train_loss": -11.295122146606445, "global_step": 179546, "epoch": 1068} {"train_loss": -11.13221263885498, "global_step": 179547, "epoch": 1068} {"train_loss": -11.354966163635254, "global_step": 179548, "epoch": 1068} {"train_loss": -11.033722877502441, "global_step": 179549, "epoch": 1068} {"train_loss": -11.255240440368652, "global_step": 179550, "epoch": 1068} {"train_loss": -11.520896911621094, "global_step": 179551, "epoch": 1068} {"train_loss": -11.385797500610352, "global_step": 179552, "epoch": 1068} {"train_loss": -11.409241676330566, "global_step": 179553, "epoch": 1068} {"train_loss": -11.248722076416016, "global_step": 179554, "epoch": 1068} {"train_loss": -11.269981384277344, "global_step": 179555, "epoch": 1068} {"train_loss": -11.216753005981445, "global_step": 179556, "epoch": 1068} {"train_loss": -11.461952209472656, "global_step": 179557, "epoch": 1068} {"train_loss": -11.302331924438477, "global_step": 179558, "epoch": 1068} {"train_loss": -11.485300064086914, "global_step": 179559, "epoch": 1068} {"train_loss": -11.315225601196289, "global_step": 179560, "epoch": 1068} {"train_loss": -11.29620361328125, "global_step": 179561, "epoch": 1068} {"train_loss": -11.366598129272461, "global_step": 179562, "epoch": 1068} {"train_loss": -11.508007049560547, "global_step": 179563, "epoch": 1068} {"train_loss": -11.665512084960938, "global_step": 179564, "epoch": 1068} {"train_loss": -11.50535774230957, "global_step": 179565, "epoch": 1068} {"train_loss": -11.349081993103027, "global_step": 179566, "epoch": 1068} {"train_loss": -11.531805992126465, "global_step": 179567, "epoch": 1068} {"train_loss": -11.479191780090332, "global_step": 179568, "epoch": 1068} {"train_loss": -11.491191864013672, "global_step": 179569, "epoch": 1068} {"train_loss": -11.552574157714844, "global_step": 179570, "epoch": 1068} {"train_loss": -11.592008590698242, "global_step": 179571, "epoch": 1068} {"train_loss": -11.460733413696289, "global_step": 179572, "epoch": 1068} {"train_loss": -11.678861618041992, "global_step": 179573, "epoch": 1068} {"train_loss": -11.682106018066406, "global_step": 179574, "epoch": 1068} {"train_loss": -11.450690269470215, "global_step": 179575, "epoch": 1068} {"train_loss": -11.483787536621094, "global_step": 179576, "epoch": 1068} {"train_loss": -11.680112838745117, "global_step": 179577, "epoch": 1068} {"train_loss": -11.38677978515625, "global_step": 179578, "epoch": 1068} {"train_loss": -11.288933753967285, "global_step": 179579, "epoch": 1068} {"train_loss": -11.159534454345703, "global_step": 179580, "epoch": 1068} {"train_loss": -11.484139442443848, "global_step": 179581, "epoch": 1068} {"train_loss": -11.319368362426758, "global_step": 179582, "epoch": 1068} {"train_loss": -10.649659156799316, "global_step": 179583, "epoch": 1068} {"train_loss": -10.356801986694336, "global_step": 179584, "epoch": 1068} {"train_loss": -11.402531623840332, "global_step": 179585, "epoch": 1068} {"train_loss": -10.959615707397461, "global_step": 179586, "epoch": 1068} {"train_loss": -9.320600509643555, "global_step": 179587, "epoch": 1068} {"train_loss": -10.569025039672852, "global_step": 179588, "epoch": 1068} {"train_loss": -10.803348541259766, "global_step": 179589, "epoch": 1068} {"train_loss": -9.93709659576416, "global_step": 179590, "epoch": 1068} {"train_loss": -10.96446144580841, "global_step": 179591, "epoch": 1068, "val_loss": 244698.75} {"train_loss": -10.565408706665039, "global_step": 179592, "epoch": 1069} {"train_loss": -10.96029281616211, "global_step": 179593, "epoch": 1069} {"train_loss": -10.42177963256836, "global_step": 179594, "epoch": 1069} {"train_loss": -11.171932220458984, "global_step": 179595, "epoch": 1069} {"train_loss": -10.215621948242188, "global_step": 179596, "epoch": 1069} {"train_loss": -10.854351043701172, "global_step": 179597, "epoch": 1069} {"train_loss": -10.495102882385254, "global_step": 179598, "epoch": 1069} {"train_loss": -9.759490013122559, "global_step": 179599, "epoch": 1069} {"train_loss": -10.724285125732422, "global_step": 179600, "epoch": 1069} {"train_loss": -10.637687683105469, "global_step": 179601, "epoch": 1069} {"train_loss": -10.822962760925293, "global_step": 179602, "epoch": 1069} {"train_loss": -11.257978439331055, "global_step": 179603, "epoch": 1069} {"train_loss": -10.583931922912598, "global_step": 179604, "epoch": 1069} {"train_loss": -10.586220741271973, "global_step": 179605, "epoch": 1069} {"train_loss": -10.707111358642578, "global_step": 179606, "epoch": 1069} {"train_loss": -10.610208511352539, "global_step": 179607, "epoch": 1069} {"train_loss": -10.88381576538086, "global_step": 179608, "epoch": 1069} {"train_loss": -10.910823822021484, "global_step": 179609, "epoch": 1069} {"train_loss": -10.985700607299805, "global_step": 179610, "epoch": 1069} {"train_loss": -11.068754196166992, "global_step": 179611, "epoch": 1069} {"train_loss": -10.846179962158203, "global_step": 179612, "epoch": 1069} {"train_loss": -11.106024742126465, "global_step": 179613, "epoch": 1069} {"train_loss": -10.657346725463867, "global_step": 179614, "epoch": 1069} {"train_loss": -10.655289649963379, "global_step": 179615, "epoch": 1069} {"train_loss": -10.362168312072754, "global_step": 179616, "epoch": 1069} {"train_loss": -9.848352432250977, "global_step": 179617, "epoch": 1069} {"train_loss": -10.687297821044922, "global_step": 179618, "epoch": 1069} {"train_loss": -9.93419361114502, "global_step": 179619, "epoch": 1069} {"train_loss": -11.075363159179688, "global_step": 179620, "epoch": 1069} {"train_loss": -10.761800765991211, "global_step": 179621, "epoch": 1069} {"train_loss": -10.994619369506836, "global_step": 179622, "epoch": 1069} {"train_loss": -10.77222728729248, "global_step": 179623, "epoch": 1069} {"train_loss": -11.063339233398438, "global_step": 179624, "epoch": 1069} {"train_loss": -10.584830284118652, "global_step": 179625, "epoch": 1069} {"train_loss": -11.137557983398438, "global_step": 179626, "epoch": 1069} {"train_loss": -10.800891876220703, "global_step": 179627, "epoch": 1069} {"train_loss": -11.082834243774414, "global_step": 179628, "epoch": 1069} {"train_loss": -10.606657028198242, "global_step": 179629, "epoch": 1069} {"train_loss": -10.99924087524414, "global_step": 179630, "epoch": 1069} {"train_loss": -10.681915283203125, "global_step": 179631, "epoch": 1069} {"train_loss": -11.192142486572266, "global_step": 179632, "epoch": 1069} {"train_loss": -10.902861595153809, "global_step": 179633, "epoch": 1069} {"train_loss": -10.936029434204102, "global_step": 179634, "epoch": 1069} {"train_loss": -10.985076904296875, "global_step": 179635, "epoch": 1069} {"train_loss": -10.87744426727295, "global_step": 179636, "epoch": 1069} {"train_loss": -11.275910377502441, "global_step": 179637, "epoch": 1069} {"train_loss": -10.937821388244629, "global_step": 179638, "epoch": 1069} {"train_loss": -11.20230484008789, "global_step": 179639, "epoch": 1069} {"train_loss": -11.307010650634766, "global_step": 179640, "epoch": 1069} {"train_loss": -11.25489616394043, "global_step": 179641, "epoch": 1069} {"train_loss": -11.21379566192627, "global_step": 179642, "epoch": 1069} {"train_loss": -11.24658203125, "global_step": 179643, "epoch": 1069} {"train_loss": -11.344858169555664, "global_step": 179644, "epoch": 1069} {"train_loss": -11.29831600189209, "global_step": 179645, "epoch": 1069} {"train_loss": -11.365835189819336, "global_step": 179646, "epoch": 1069} {"train_loss": -11.208517074584961, "global_step": 179647, "epoch": 1069} {"train_loss": -11.252235412597656, "global_step": 179648, "epoch": 1069} {"train_loss": -11.251220703125, "global_step": 179649, "epoch": 1069} {"train_loss": -11.207684516906738, "global_step": 179650, "epoch": 1069} {"train_loss": -11.456063270568848, "global_step": 179651, "epoch": 1069} {"train_loss": -11.446734428405762, "global_step": 179652, "epoch": 1069} {"train_loss": -11.460737228393555, "global_step": 179653, "epoch": 1069} {"train_loss": -11.64410400390625, "global_step": 179654, "epoch": 1069} {"train_loss": -11.437594413757324, "global_step": 179655, "epoch": 1069} {"train_loss": -11.481176376342773, "global_step": 179656, "epoch": 1069} {"train_loss": -11.254209518432617, "global_step": 179657, "epoch": 1069} {"train_loss": -11.383720397949219, "global_step": 179658, "epoch": 1069} {"train_loss": -11.526185989379883, "global_step": 179659, "epoch": 1069} {"train_loss": -11.582822799682617, "global_step": 179660, "epoch": 1069} {"train_loss": -11.614625930786133, "global_step": 179661, "epoch": 1069} {"train_loss": -11.460363388061523, "global_step": 179662, "epoch": 1069} {"train_loss": -11.57390308380127, "global_step": 179663, "epoch": 1069} {"train_loss": -11.526354789733887, "global_step": 179664, "epoch": 1069} {"train_loss": -11.642037391662598, "global_step": 179665, "epoch": 1069} {"train_loss": -11.59863567352295, "global_step": 179666, "epoch": 1069} {"train_loss": -11.668703079223633, "global_step": 179667, "epoch": 1069} {"train_loss": -11.711235046386719, "global_step": 179668, "epoch": 1069} {"train_loss": -11.47030258178711, "global_step": 179669, "epoch": 1069} {"train_loss": -11.34644889831543, "global_step": 179670, "epoch": 1069} {"train_loss": -11.743415832519531, "global_step": 179671, "epoch": 1069} {"train_loss": -11.63501262664795, "global_step": 179672, "epoch": 1069} {"train_loss": -11.332793235778809, "global_step": 179673, "epoch": 1069} {"train_loss": -11.545259475708008, "global_step": 179674, "epoch": 1069} {"train_loss": -11.405635833740234, "global_step": 179675, "epoch": 1069} {"train_loss": -11.38886547088623, "global_step": 179676, "epoch": 1069} {"train_loss": -11.700094223022461, "global_step": 179677, "epoch": 1069} {"train_loss": -11.437591552734375, "global_step": 179678, "epoch": 1069} {"train_loss": -11.233052253723145, "global_step": 179679, "epoch": 1069} {"train_loss": -10.90911865234375, "global_step": 179680, "epoch": 1069} {"train_loss": -11.01906967163086, "global_step": 179681, "epoch": 1069} {"train_loss": -11.441183090209961, "global_step": 179682, "epoch": 1069} {"train_loss": -10.986289978027344, "global_step": 179683, "epoch": 1069} {"train_loss": -10.895566940307617, "global_step": 179684, "epoch": 1069} {"train_loss": -11.412932395935059, "global_step": 179685, "epoch": 1069} {"train_loss": -10.796244621276855, "global_step": 179686, "epoch": 1069} {"train_loss": -10.107690811157227, "global_step": 179687, "epoch": 1069} {"train_loss": -10.233779907226562, "global_step": 179688, "epoch": 1069} {"train_loss": -10.48243236541748, "global_step": 179689, "epoch": 1069} {"train_loss": -10.50497055053711, "global_step": 179690, "epoch": 1069} {"train_loss": -10.537936210632324, "global_step": 179691, "epoch": 1069} {"train_loss": -10.552297592163086, "global_step": 179692, "epoch": 1069} {"train_loss": -8.99406623840332, "global_step": 179693, "epoch": 1069} {"train_loss": -10.170049667358398, "global_step": 179694, "epoch": 1069} {"train_loss": -10.550348281860352, "global_step": 179695, "epoch": 1069} {"train_loss": -9.597702026367188, "global_step": 179696, "epoch": 1069} {"train_loss": -10.749829292297363, "global_step": 179697, "epoch": 1069} {"train_loss": -10.081335067749023, "global_step": 179698, "epoch": 1069} {"train_loss": -10.408872604370117, "global_step": 179699, "epoch": 1069} {"train_loss": -10.05866813659668, "global_step": 179700, "epoch": 1069} {"train_loss": -10.417450904846191, "global_step": 179701, "epoch": 1069} {"train_loss": -9.927874565124512, "global_step": 179702, "epoch": 1069} {"train_loss": -10.413551330566406, "global_step": 179703, "epoch": 1069} {"train_loss": -10.604207038879395, "global_step": 179704, "epoch": 1069} {"train_loss": -10.122953414916992, "global_step": 179705, "epoch": 1069} {"train_loss": -9.303136825561523, "global_step": 179706, "epoch": 1069} {"train_loss": -11.069780349731445, "global_step": 179707, "epoch": 1069} {"train_loss": -9.635079383850098, "global_step": 179708, "epoch": 1069} {"train_loss": -10.621667861938477, "global_step": 179709, "epoch": 1069} {"train_loss": -9.902839660644531, "global_step": 179710, "epoch": 1069} {"train_loss": -10.979771614074707, "global_step": 179711, "epoch": 1069} {"train_loss": -10.133686065673828, "global_step": 179712, "epoch": 1069} {"train_loss": -10.765996932983398, "global_step": 179713, "epoch": 1069} {"train_loss": -10.68571662902832, "global_step": 179714, "epoch": 1069} {"train_loss": -10.900501251220703, "global_step": 179715, "epoch": 1069} {"train_loss": -10.817484855651855, "global_step": 179716, "epoch": 1069} {"train_loss": -11.028816223144531, "global_step": 179717, "epoch": 1069} {"train_loss": -10.771641731262207, "global_step": 179718, "epoch": 1069} {"train_loss": -10.860280990600586, "global_step": 179719, "epoch": 1069} {"train_loss": -10.889961242675781, "global_step": 179720, "epoch": 1069} {"train_loss": -10.998427391052246, "global_step": 179721, "epoch": 1069} {"train_loss": -10.721651077270508, "global_step": 179722, "epoch": 1069} {"train_loss": -11.15255355834961, "global_step": 179723, "epoch": 1069} {"train_loss": -10.966239929199219, "global_step": 179724, "epoch": 1069} {"train_loss": -10.571083068847656, "global_step": 179725, "epoch": 1069} {"train_loss": -10.941518783569336, "global_step": 179726, "epoch": 1069} {"train_loss": -10.6613187789917, "global_step": 179727, "epoch": 1069} {"train_loss": -10.500865936279297, "global_step": 179728, "epoch": 1069} {"train_loss": -11.100519180297852, "global_step": 179729, "epoch": 1069} {"train_loss": -10.78713607788086, "global_step": 179730, "epoch": 1069} {"train_loss": -10.785850524902344, "global_step": 179731, "epoch": 1069} {"train_loss": -11.075517654418945, "global_step": 179732, "epoch": 1069} {"train_loss": -10.821985244750977, "global_step": 179733, "epoch": 1069} {"train_loss": -10.994401931762695, "global_step": 179734, "epoch": 1069} {"train_loss": -11.071073532104492, "global_step": 179735, "epoch": 1069} {"train_loss": -10.979119300842285, "global_step": 179736, "epoch": 1069} {"train_loss": -11.043037414550781, "global_step": 179737, "epoch": 1069} {"train_loss": -10.688037872314453, "global_step": 179738, "epoch": 1069} {"train_loss": -10.882808685302734, "global_step": 179739, "epoch": 1069} {"train_loss": -11.163576126098633, "global_step": 179740, "epoch": 1069} {"train_loss": -11.065788269042969, "global_step": 179741, "epoch": 1069} {"train_loss": -11.313718795776367, "global_step": 179742, "epoch": 1069} {"train_loss": -10.928908348083496, "global_step": 179743, "epoch": 1069} {"train_loss": -11.299417495727539, "global_step": 179744, "epoch": 1069} {"train_loss": -11.2134370803833, "global_step": 179745, "epoch": 1069} {"train_loss": -11.206842422485352, "global_step": 179746, "epoch": 1069} {"train_loss": -11.15414810180664, "global_step": 179747, "epoch": 1069} {"train_loss": -11.040214538574219, "global_step": 179748, "epoch": 1069} {"train_loss": -11.144052505493164, "global_step": 179749, "epoch": 1069} {"train_loss": -11.289337158203125, "global_step": 179750, "epoch": 1069} {"train_loss": -11.454763412475586, "global_step": 179751, "epoch": 1069} {"train_loss": -11.33519172668457, "global_step": 179752, "epoch": 1069} {"train_loss": -11.402490615844727, "global_step": 179753, "epoch": 1069} {"train_loss": -11.429657936096191, "global_step": 179754, "epoch": 1069} {"train_loss": -11.506175994873047, "global_step": 179755, "epoch": 1069} {"train_loss": -11.536846160888672, "global_step": 179756, "epoch": 1069} {"train_loss": -11.311453819274902, "global_step": 179757, "epoch": 1069} {"train_loss": -11.487123489379883, "global_step": 179758, "epoch": 1069} {"train_loss": -10.937625408172607, "global_step": 179759, "epoch": 1069, "val_loss": 244863.890625} {"train_loss": -11.242762565612793, "global_step": 179760, "epoch": 1070} {"train_loss": -11.231245040893555, "global_step": 179761, "epoch": 1070} {"train_loss": -11.295318603515625, "global_step": 179762, "epoch": 1070} {"train_loss": -11.127357482910156, "global_step": 179763, "epoch": 1070} {"train_loss": -11.48494815826416, "global_step": 179764, "epoch": 1070} {"train_loss": -11.029919624328613, "global_step": 179765, "epoch": 1070} {"train_loss": -11.298727035522461, "global_step": 179766, "epoch": 1070} {"train_loss": -11.012228965759277, "global_step": 179767, "epoch": 1070} {"train_loss": -11.285378456115723, "global_step": 179768, "epoch": 1070} {"train_loss": -10.608807563781738, "global_step": 179769, "epoch": 1070} {"train_loss": -10.437578201293945, "global_step": 179770, "epoch": 1070} {"train_loss": -9.074880599975586, "global_step": 179771, "epoch": 1070} {"train_loss": -10.093467712402344, "global_step": 179772, "epoch": 1070} {"train_loss": -9.915255546569824, "global_step": 179773, "epoch": 1070} {"train_loss": -10.16678237915039, "global_step": 179774, "epoch": 1070} {"train_loss": -9.970929145812988, "global_step": 179775, "epoch": 1070} {"train_loss": -10.05441665649414, "global_step": 179776, "epoch": 1070} {"train_loss": -8.706581115722656, "global_step": 179777, "epoch": 1070} {"train_loss": -10.550600051879883, "global_step": 179778, "epoch": 1070} {"train_loss": -9.724052429199219, "global_step": 179779, "epoch": 1070} {"train_loss": -11.022680282592773, "global_step": 179780, "epoch": 1070} {"train_loss": -9.941278457641602, "global_step": 179781, "epoch": 1070} {"train_loss": -11.111946105957031, "global_step": 179782, "epoch": 1070} {"train_loss": -10.155570030212402, "global_step": 179783, "epoch": 1070} {"train_loss": -10.678293228149414, "global_step": 179784, "epoch": 1070} {"train_loss": -10.781216621398926, "global_step": 179785, "epoch": 1070} {"train_loss": -10.68708324432373, "global_step": 179786, "epoch": 1070} {"train_loss": -10.672468185424805, "global_step": 179787, "epoch": 1070} {"train_loss": -10.964703559875488, "global_step": 179788, "epoch": 1070} {"train_loss": -10.52839469909668, "global_step": 179789, "epoch": 1070} {"train_loss": -10.793737411499023, "global_step": 179790, "epoch": 1070} {"train_loss": -10.95523452758789, "global_step": 179791, "epoch": 1070} {"train_loss": -10.673007011413574, "global_step": 179792, "epoch": 1070} {"train_loss": -10.97551441192627, "global_step": 179793, "epoch": 1070} {"train_loss": -10.378005981445312, "global_step": 179794, "epoch": 1070} {"train_loss": -10.95799446105957, "global_step": 179795, "epoch": 1070} {"train_loss": -10.515002250671387, "global_step": 179796, "epoch": 1070} {"train_loss": -10.92739486694336, "global_step": 179797, "epoch": 1070} {"train_loss": -10.714143753051758, "global_step": 179798, "epoch": 1070} {"train_loss": -10.993086814880371, "global_step": 179799, "epoch": 1070} {"train_loss": -10.892068862915039, "global_step": 179800, "epoch": 1070} {"train_loss": -10.865023612976074, "global_step": 179801, "epoch": 1070} {"train_loss": -11.168771743774414, "global_step": 179802, "epoch": 1070} {"train_loss": -11.003007888793945, "global_step": 179803, "epoch": 1070} {"train_loss": -11.062602996826172, "global_step": 179804, "epoch": 1070} {"train_loss": -11.110627174377441, "global_step": 179805, "epoch": 1070} {"train_loss": -11.08610725402832, "global_step": 179806, "epoch": 1070} {"train_loss": -10.997919082641602, "global_step": 179807, "epoch": 1070} {"train_loss": -11.061246871948242, "global_step": 179808, "epoch": 1070} {"train_loss": -11.304527282714844, "global_step": 179809, "epoch": 1070} {"train_loss": -11.053177833557129, "global_step": 179810, "epoch": 1070} {"train_loss": -10.7882719039917, "global_step": 179811, "epoch": 1070} {"train_loss": -11.197952270507812, "global_step": 179812, "epoch": 1070} {"train_loss": -10.857624053955078, "global_step": 179813, "epoch": 1070} {"train_loss": -11.215810775756836, "global_step": 179814, "epoch": 1070} {"train_loss": -11.267759323120117, "global_step": 179815, "epoch": 1070} {"train_loss": -11.226985931396484, "global_step": 179816, "epoch": 1070} {"train_loss": -11.236220359802246, "global_step": 179817, "epoch": 1070} {"train_loss": -11.155112266540527, "global_step": 179818, "epoch": 1070} {"train_loss": -11.314151763916016, "global_step": 179819, "epoch": 1070} {"train_loss": -11.115279197692871, "global_step": 179820, "epoch": 1070} {"train_loss": -10.946379661560059, "global_step": 179821, "epoch": 1070} {"train_loss": -10.96068000793457, "global_step": 179822, "epoch": 1070} {"train_loss": -11.271377563476562, "global_step": 179823, "epoch": 1070} {"train_loss": -11.233785629272461, "global_step": 179824, "epoch": 1070} {"train_loss": -11.439130783081055, "global_step": 179825, "epoch": 1070} {"train_loss": -11.241591453552246, "global_step": 179826, "epoch": 1070} {"train_loss": -11.434782981872559, "global_step": 179827, "epoch": 1070} {"train_loss": -11.152420043945312, "global_step": 179828, "epoch": 1070} {"train_loss": -11.516830444335938, "global_step": 179829, "epoch": 1070} {"train_loss": -11.420509338378906, "global_step": 179830, "epoch": 1070} {"train_loss": -11.195383071899414, "global_step": 179831, "epoch": 1070} {"train_loss": -11.325237274169922, "global_step": 179832, "epoch": 1070} {"train_loss": -11.251075744628906, "global_step": 179833, "epoch": 1070} {"train_loss": -11.304706573486328, "global_step": 179834, "epoch": 1070} {"train_loss": -11.456289291381836, "global_step": 179835, "epoch": 1070} {"train_loss": -11.311042785644531, "global_step": 179836, "epoch": 1070} {"train_loss": -11.26120662689209, "global_step": 179837, "epoch": 1070} {"train_loss": -11.310583114624023, "global_step": 179838, "epoch": 1070} {"train_loss": -11.399114608764648, "global_step": 179839, "epoch": 1070} {"train_loss": -11.144207954406738, "global_step": 179840, "epoch": 1070} {"train_loss": -11.453177452087402, "global_step": 179841, "epoch": 1070} {"train_loss": -11.268630981445312, "global_step": 179842, "epoch": 1070} {"train_loss": -11.1937255859375, "global_step": 179843, "epoch": 1070} {"train_loss": -11.548501968383789, "global_step": 179844, "epoch": 1070} {"train_loss": -11.609297752380371, "global_step": 179845, "epoch": 1070} {"train_loss": -11.321889877319336, "global_step": 179846, "epoch": 1070} {"train_loss": -11.51103401184082, "global_step": 179847, "epoch": 1070} {"train_loss": -11.370540618896484, "global_step": 179848, "epoch": 1070} {"train_loss": -11.315422058105469, "global_step": 179849, "epoch": 1070} {"train_loss": -11.33045482635498, "global_step": 179850, "epoch": 1070} {"train_loss": -11.523710250854492, "global_step": 179851, "epoch": 1070} {"train_loss": -11.51854133605957, "global_step": 179852, "epoch": 1070} {"train_loss": -11.411232948303223, "global_step": 179853, "epoch": 1070} {"train_loss": -11.462289810180664, "global_step": 179854, "epoch": 1070} {"train_loss": -11.07464599609375, "global_step": 179855, "epoch": 1070} {"train_loss": -11.219306945800781, "global_step": 179856, "epoch": 1070} {"train_loss": -11.346104621887207, "global_step": 179857, "epoch": 1070} {"train_loss": -11.170929908752441, "global_step": 179858, "epoch": 1070} {"train_loss": -10.833425521850586, "global_step": 179859, "epoch": 1070} {"train_loss": -11.274312973022461, "global_step": 179860, "epoch": 1070} {"train_loss": -9.884307861328125, "global_step": 179861, "epoch": 1070} {"train_loss": -11.134210586547852, "global_step": 179862, "epoch": 1070} {"train_loss": -10.68428897857666, "global_step": 179863, "epoch": 1070} {"train_loss": -11.102596282958984, "global_step": 179864, "epoch": 1070} {"train_loss": -11.02869987487793, "global_step": 179865, "epoch": 1070} {"train_loss": -11.237577438354492, "global_step": 179866, "epoch": 1070} {"train_loss": -11.009672164916992, "global_step": 179867, "epoch": 1070} {"train_loss": -10.76579475402832, "global_step": 179868, "epoch": 1070} {"train_loss": -11.311405181884766, "global_step": 179869, "epoch": 1070} {"train_loss": -11.00058650970459, "global_step": 179870, "epoch": 1070} {"train_loss": -11.012722969055176, "global_step": 179871, "epoch": 1070} {"train_loss": -11.379007339477539, "global_step": 179872, "epoch": 1070} {"train_loss": -10.881543159484863, "global_step": 179873, "epoch": 1070} {"train_loss": -11.02505111694336, "global_step": 179874, "epoch": 1070} {"train_loss": -11.162727355957031, "global_step": 179875, "epoch": 1070} {"train_loss": -11.030292510986328, "global_step": 179876, "epoch": 1070} {"train_loss": -11.07328987121582, "global_step": 179877, "epoch": 1070} {"train_loss": -11.345174789428711, "global_step": 179878, "epoch": 1070} {"train_loss": -11.383804321289062, "global_step": 179879, "epoch": 1070} {"train_loss": -11.347993850708008, "global_step": 179880, "epoch": 1070} {"train_loss": -11.2940673828125, "global_step": 179881, "epoch": 1070} {"train_loss": -11.508318901062012, "global_step": 179882, "epoch": 1070} {"train_loss": -11.355527877807617, "global_step": 179883, "epoch": 1070} {"train_loss": -11.434154510498047, "global_step": 179884, "epoch": 1070} {"train_loss": -11.361233711242676, "global_step": 179885, "epoch": 1070} {"train_loss": -11.226836204528809, "global_step": 179886, "epoch": 1070} {"train_loss": -11.427273750305176, "global_step": 179887, "epoch": 1070} {"train_loss": -11.045124053955078, "global_step": 179888, "epoch": 1070} {"train_loss": -10.853679656982422, "global_step": 179889, "epoch": 1070} {"train_loss": -11.000846862792969, "global_step": 179890, "epoch": 1070} {"train_loss": -10.589109420776367, "global_step": 179891, "epoch": 1070} {"train_loss": -11.084146499633789, "global_step": 179892, "epoch": 1070} {"train_loss": -11.105003356933594, "global_step": 179893, "epoch": 1070} {"train_loss": -10.223490715026855, "global_step": 179894, "epoch": 1070} {"train_loss": -10.689533233642578, "global_step": 179895, "epoch": 1070} {"train_loss": -11.07359504699707, "global_step": 179896, "epoch": 1070} {"train_loss": -10.391822814941406, "global_step": 179897, "epoch": 1070} {"train_loss": -10.989086151123047, "global_step": 179898, "epoch": 1070} {"train_loss": -10.304953575134277, "global_step": 179899, "epoch": 1070} {"train_loss": -10.399296760559082, "global_step": 179900, "epoch": 1070} {"train_loss": -11.140329360961914, "global_step": 179901, "epoch": 1070} {"train_loss": -10.83137035369873, "global_step": 179902, "epoch": 1070} {"train_loss": -10.304082870483398, "global_step": 179903, "epoch": 1070} {"train_loss": -11.314949989318848, "global_step": 179904, "epoch": 1070} {"train_loss": -10.57660961151123, "global_step": 179905, "epoch": 1070} {"train_loss": -10.985967636108398, "global_step": 179906, "epoch": 1070} {"train_loss": -10.17689037322998, "global_step": 179907, "epoch": 1070} {"train_loss": -9.821307182312012, "global_step": 179908, "epoch": 1070} {"train_loss": -10.58108139038086, "global_step": 179909, "epoch": 1070} {"train_loss": -8.943197250366211, "global_step": 179910, "epoch": 1070} {"train_loss": -9.937763214111328, "global_step": 179911, "epoch": 1070} {"train_loss": -9.309810638427734, "global_step": 179912, "epoch": 1070} {"train_loss": -10.009035110473633, "global_step": 179913, "epoch": 1070} {"train_loss": -9.257768630981445, "global_step": 179914, "epoch": 1070} {"train_loss": -10.691750526428223, "global_step": 179915, "epoch": 1070} {"train_loss": -10.519754409790039, "global_step": 179916, "epoch": 1070} {"train_loss": -9.795462608337402, "global_step": 179917, "epoch": 1070} {"train_loss": -10.553098678588867, "global_step": 179918, "epoch": 1070} {"train_loss": -10.138612747192383, "global_step": 179919, "epoch": 1070} {"train_loss": -10.202447891235352, "global_step": 179920, "epoch": 1070} {"train_loss": -10.81871223449707, "global_step": 179921, "epoch": 1070} {"train_loss": -10.822019577026367, "global_step": 179922, "epoch": 1070} {"train_loss": -10.438108444213867, "global_step": 179923, "epoch": 1070} {"train_loss": -11.00086784362793, "global_step": 179924, "epoch": 1070} {"train_loss": -10.514558792114258, "global_step": 179925, "epoch": 1070} {"train_loss": -10.839452743530273, "global_step": 179926, "epoch": 1070} {"train_loss": -10.89554108324505, "global_step": 179927, "epoch": 1070, "val_loss": 240944.4375, "train_action_mse_error": 2.66983962059021} {"train_loss": -10.855883598327637, "global_step": 179928, "epoch": 1071} {"train_loss": -11.135343551635742, "global_step": 179929, "epoch": 1071} {"train_loss": -10.838356971740723, "global_step": 179930, "epoch": 1071} {"train_loss": -10.349212646484375, "global_step": 179931, "epoch": 1071} {"train_loss": -10.529775619506836, "global_step": 179932, "epoch": 1071} {"train_loss": -11.008661270141602, "global_step": 179933, "epoch": 1071} {"train_loss": -10.454103469848633, "global_step": 179934, "epoch": 1071} {"train_loss": -10.824477195739746, "global_step": 179935, "epoch": 1071} {"train_loss": -10.68734359741211, "global_step": 179936, "epoch": 1071} {"train_loss": -10.43610668182373, "global_step": 179937, "epoch": 1071} {"train_loss": -10.926466941833496, "global_step": 179938, "epoch": 1071} {"train_loss": -10.553621292114258, "global_step": 179939, "epoch": 1071} {"train_loss": -11.112848281860352, "global_step": 179940, "epoch": 1071} {"train_loss": -10.843896865844727, "global_step": 179941, "epoch": 1071} {"train_loss": -11.0388822555542, "global_step": 179942, "epoch": 1071} {"train_loss": -11.16566276550293, "global_step": 179943, "epoch": 1071} {"train_loss": -10.66407585144043, "global_step": 179944, "epoch": 1071} {"train_loss": -11.072617530822754, "global_step": 179945, "epoch": 1071} {"train_loss": -10.64927864074707, "global_step": 179946, "epoch": 1071} {"train_loss": -11.011043548583984, "global_step": 179947, "epoch": 1071} {"train_loss": -10.899247169494629, "global_step": 179948, "epoch": 1071} {"train_loss": -11.028141021728516, "global_step": 179949, "epoch": 1071} {"train_loss": -11.112388610839844, "global_step": 179950, "epoch": 1071} {"train_loss": -10.905689239501953, "global_step": 179951, "epoch": 1071} {"train_loss": -11.006781578063965, "global_step": 179952, "epoch": 1071} {"train_loss": -10.94416618347168, "global_step": 179953, "epoch": 1071} {"train_loss": -11.065174102783203, "global_step": 179954, "epoch": 1071} {"train_loss": -11.212836265563965, "global_step": 179955, "epoch": 1071} {"train_loss": -11.047886848449707, "global_step": 179956, "epoch": 1071} {"train_loss": -11.030596733093262, "global_step": 179957, "epoch": 1071} {"train_loss": -11.089888572692871, "global_step": 179958, "epoch": 1071} {"train_loss": -11.240259170532227, "global_step": 179959, "epoch": 1071} {"train_loss": -11.179576873779297, "global_step": 179960, "epoch": 1071} {"train_loss": -11.122401237487793, "global_step": 179961, "epoch": 1071} {"train_loss": -11.42974853515625, "global_step": 179962, "epoch": 1071} {"train_loss": -11.28223991394043, "global_step": 179963, "epoch": 1071} {"train_loss": -11.23867130279541, "global_step": 179964, "epoch": 1071} {"train_loss": -11.432363510131836, "global_step": 179965, "epoch": 1071} {"train_loss": -11.122512817382812, "global_step": 179966, "epoch": 1071} {"train_loss": -11.273663520812988, "global_step": 179967, "epoch": 1071} {"train_loss": -10.884349822998047, "global_step": 179968, "epoch": 1071} {"train_loss": -11.234277725219727, "global_step": 179969, "epoch": 1071} {"train_loss": -11.3480224609375, "global_step": 179970, "epoch": 1071} {"train_loss": -11.418405532836914, "global_step": 179971, "epoch": 1071} {"train_loss": -11.349723815917969, "global_step": 179972, "epoch": 1071} {"train_loss": -11.452789306640625, "global_step": 179973, "epoch": 1071} {"train_loss": -11.364846229553223, "global_step": 179974, "epoch": 1071} {"train_loss": -11.058289527893066, "global_step": 179975, "epoch": 1071} {"train_loss": -11.166448593139648, "global_step": 179976, "epoch": 1071} {"train_loss": -11.279277801513672, "global_step": 179977, "epoch": 1071} {"train_loss": -11.629889488220215, "global_step": 179978, "epoch": 1071} {"train_loss": -11.233441352844238, "global_step": 179979, "epoch": 1071} {"train_loss": -11.376277923583984, "global_step": 179980, "epoch": 1071} {"train_loss": -11.396876335144043, "global_step": 179981, "epoch": 1071} {"train_loss": -11.244207382202148, "global_step": 179982, "epoch": 1071} {"train_loss": -11.611412048339844, "global_step": 179983, "epoch": 1071} {"train_loss": -11.597599029541016, "global_step": 179984, "epoch": 1071} {"train_loss": -11.474462509155273, "global_step": 179985, "epoch": 1071} {"train_loss": -11.737265586853027, "global_step": 179986, "epoch": 1071} {"train_loss": -11.472928047180176, "global_step": 179987, "epoch": 1071} {"train_loss": -11.461973190307617, "global_step": 179988, "epoch": 1071} {"train_loss": -11.504505157470703, "global_step": 179989, "epoch": 1071} {"train_loss": -11.505228042602539, "global_step": 179990, "epoch": 1071} {"train_loss": -11.595745086669922, "global_step": 179991, "epoch": 1071} {"train_loss": -11.533235549926758, "global_step": 179992, "epoch": 1071} {"train_loss": -11.57954216003418, "global_step": 179993, "epoch": 1071} {"train_loss": -11.503817558288574, "global_step": 179994, "epoch": 1071} {"train_loss": -11.398921966552734, "global_step": 179995, "epoch": 1071} {"train_loss": -11.626925468444824, "global_step": 179996, "epoch": 1071} {"train_loss": -11.70093822479248, "global_step": 179997, "epoch": 1071} {"train_loss": -11.824094772338867, "global_step": 179998, "epoch": 1071} {"train_loss": -11.664676666259766, "global_step": 179999, "epoch": 1071} {"train_loss": -11.538461685180664, "global_step": 180000, "epoch": 1071} {"train_loss": -11.430937767028809, "global_step": 180001, "epoch": 1071} {"train_loss": -11.67747688293457, "global_step": 180002, "epoch": 1071} {"train_loss": -11.760354995727539, "global_step": 180003, "epoch": 1071} {"train_loss": -11.747047424316406, "global_step": 180004, "epoch": 1071} {"train_loss": -11.626567840576172, "global_step": 180005, "epoch": 1071} {"train_loss": -11.50249195098877, "global_step": 180006, "epoch": 1071} {"train_loss": -11.625243186950684, "global_step": 180007, "epoch": 1071} {"train_loss": -11.702020645141602, "global_step": 180008, "epoch": 1071} {"train_loss": -11.567119598388672, "global_step": 180009, "epoch": 1071} {"train_loss": -11.504066467285156, "global_step": 180010, "epoch": 1071} {"train_loss": -11.46906852722168, "global_step": 180011, "epoch": 1071} {"train_loss": -11.171171188354492, "global_step": 180012, "epoch": 1071} {"train_loss": -11.44735050201416, "global_step": 180013, "epoch": 1071} {"train_loss": -11.044637680053711, "global_step": 180014, "epoch": 1071} {"train_loss": -9.835811614990234, "global_step": 180015, "epoch": 1071} {"train_loss": -9.07581901550293, "global_step": 180016, "epoch": 1071} {"train_loss": -10.273407936096191, "global_step": 180017, "epoch": 1071} {"train_loss": -10.603537559509277, "global_step": 180018, "epoch": 1071} {"train_loss": -10.901819229125977, "global_step": 180019, "epoch": 1071} {"train_loss": -10.603334426879883, "global_step": 180020, "epoch": 1071} {"train_loss": -10.045601844787598, "global_step": 180021, "epoch": 1071} {"train_loss": -9.381701469421387, "global_step": 180022, "epoch": 1071} {"train_loss": -10.907478332519531, "global_step": 180023, "epoch": 1071} {"train_loss": -9.320270538330078, "global_step": 180024, "epoch": 1071} {"train_loss": -9.90776252746582, "global_step": 180025, "epoch": 1071} {"train_loss": -10.170038223266602, "global_step": 180026, "epoch": 1071} {"train_loss": -9.449376106262207, "global_step": 180027, "epoch": 1071} {"train_loss": -9.93519401550293, "global_step": 180028, "epoch": 1071} {"train_loss": -10.97506046295166, "global_step": 180029, "epoch": 1071} {"train_loss": -9.99248218536377, "global_step": 180030, "epoch": 1071} {"train_loss": -10.855266571044922, "global_step": 180031, "epoch": 1071} {"train_loss": -10.453092575073242, "global_step": 180032, "epoch": 1071} {"train_loss": -10.959663391113281, "global_step": 180033, "epoch": 1071} {"train_loss": -10.807979583740234, "global_step": 180034, "epoch": 1071} {"train_loss": -10.752283096313477, "global_step": 180035, "epoch": 1071} {"train_loss": -10.76664924621582, "global_step": 180036, "epoch": 1071} {"train_loss": -10.963370323181152, "global_step": 180037, "epoch": 1071} {"train_loss": -10.96192455291748, "global_step": 180038, "epoch": 1071} {"train_loss": -10.840051651000977, "global_step": 180039, "epoch": 1071} {"train_loss": -11.033241271972656, "global_step": 180040, "epoch": 1071} {"train_loss": -10.733860969543457, "global_step": 180041, "epoch": 1071} {"train_loss": -11.049264907836914, "global_step": 180042, "epoch": 1071} {"train_loss": -10.967527389526367, "global_step": 180043, "epoch": 1071} {"train_loss": -10.711847305297852, "global_step": 180044, "epoch": 1071} {"train_loss": -10.962685585021973, "global_step": 180045, "epoch": 1071} {"train_loss": -11.026335716247559, "global_step": 180046, "epoch": 1071} {"train_loss": -10.858260154724121, "global_step": 180047, "epoch": 1071} {"train_loss": -10.994993209838867, "global_step": 180048, "epoch": 1071} {"train_loss": -10.832993507385254, "global_step": 180049, "epoch": 1071} {"train_loss": -11.07667350769043, "global_step": 180050, "epoch": 1071} {"train_loss": -10.973444938659668, "global_step": 180051, "epoch": 1071} {"train_loss": -10.625740051269531, "global_step": 180052, "epoch": 1071} {"train_loss": -11.288175582885742, "global_step": 180053, "epoch": 1071} {"train_loss": -10.998873710632324, "global_step": 180054, "epoch": 1071} {"train_loss": -11.1248779296875, "global_step": 180055, "epoch": 1071} {"train_loss": -11.023065567016602, "global_step": 180056, "epoch": 1071} {"train_loss": -11.343635559082031, "global_step": 180057, "epoch": 1071} {"train_loss": -11.386507034301758, "global_step": 180058, "epoch": 1071} {"train_loss": -11.136406898498535, "global_step": 180059, "epoch": 1071} {"train_loss": -11.077483177185059, "global_step": 180060, "epoch": 1071} {"train_loss": -11.455926895141602, "global_step": 180061, "epoch": 1071} {"train_loss": -11.315489768981934, "global_step": 180062, "epoch": 1071} {"train_loss": -11.124981880187988, "global_step": 180063, "epoch": 1071} {"train_loss": -11.42188835144043, "global_step": 180064, "epoch": 1071} {"train_loss": -11.304983139038086, "global_step": 180065, "epoch": 1071} {"train_loss": -11.195409774780273, "global_step": 180066, "epoch": 1071} {"train_loss": -11.456491470336914, "global_step": 180067, "epoch": 1071} {"train_loss": -11.350691795349121, "global_step": 180068, "epoch": 1071} {"train_loss": -11.346637725830078, "global_step": 180069, "epoch": 1071} {"train_loss": -11.384122848510742, "global_step": 180070, "epoch": 1071} {"train_loss": -11.63150405883789, "global_step": 180071, "epoch": 1071} {"train_loss": -11.543243408203125, "global_step": 180072, "epoch": 1071} {"train_loss": -11.471552848815918, "global_step": 180073, "epoch": 1071} {"train_loss": -11.487491607666016, "global_step": 180074, "epoch": 1071} {"train_loss": -11.280149459838867, "global_step": 180075, "epoch": 1071} {"train_loss": -11.604628562927246, "global_step": 180076, "epoch": 1071} {"train_loss": -11.460604667663574, "global_step": 180077, "epoch": 1071} {"train_loss": -11.435441970825195, "global_step": 180078, "epoch": 1071} {"train_loss": -11.504522323608398, "global_step": 180079, "epoch": 1071} {"train_loss": -11.26080322265625, "global_step": 180080, "epoch": 1071} {"train_loss": -11.350234985351562, "global_step": 180081, "epoch": 1071} {"train_loss": -11.26986312866211, "global_step": 180082, "epoch": 1071} {"train_loss": -11.334733963012695, "global_step": 180083, "epoch": 1071} {"train_loss": -11.333312034606934, "global_step": 180084, "epoch": 1071} {"train_loss": -11.41347885131836, "global_step": 180085, "epoch": 1071} {"train_loss": -11.212717056274414, "global_step": 180086, "epoch": 1071} {"train_loss": -11.627815246582031, "global_step": 180087, "epoch": 1071} {"train_loss": -11.391523361206055, "global_step": 180088, "epoch": 1071} {"train_loss": -11.360851287841797, "global_step": 180089, "epoch": 1071} {"train_loss": -11.50668716430664, "global_step": 180090, "epoch": 1071} {"train_loss": -11.394367218017578, "global_step": 180091, "epoch": 1071} {"train_loss": -11.136234283447266, "global_step": 180092, "epoch": 1071} {"train_loss": -11.076484680175781, "global_step": 180093, "epoch": 1071} {"train_loss": -11.718282699584961, "global_step": 180094, "epoch": 1071} {"train_loss": -11.10854112534296, "global_step": 180095, "epoch": 1071, "val_loss": 243546.390625} {"train_loss": -11.033181190490723, "global_step": 180096, "epoch": 1072} {"train_loss": -11.185519218444824, "global_step": 180097, "epoch": 1072} {"train_loss": -11.239450454711914, "global_step": 180098, "epoch": 1072} {"train_loss": -10.653106689453125, "global_step": 180099, "epoch": 1072} {"train_loss": -10.533302307128906, "global_step": 180100, "epoch": 1072} {"train_loss": -11.608474731445312, "global_step": 180101, "epoch": 1072} {"train_loss": -11.306511878967285, "global_step": 180102, "epoch": 1072} {"train_loss": -11.286407470703125, "global_step": 180103, "epoch": 1072} {"train_loss": -11.107654571533203, "global_step": 180104, "epoch": 1072} {"train_loss": -11.292068481445312, "global_step": 180105, "epoch": 1072} {"train_loss": -10.805582046508789, "global_step": 180106, "epoch": 1072} {"train_loss": -10.870694160461426, "global_step": 180107, "epoch": 1072} {"train_loss": -10.963855743408203, "global_step": 180108, "epoch": 1072} {"train_loss": -11.455632209777832, "global_step": 180109, "epoch": 1072} {"train_loss": -10.93592643737793, "global_step": 180110, "epoch": 1072} {"train_loss": -11.097505569458008, "global_step": 180111, "epoch": 1072} {"train_loss": -10.877364158630371, "global_step": 180112, "epoch": 1072} {"train_loss": -10.547894477844238, "global_step": 180113, "epoch": 1072} {"train_loss": -10.975746154785156, "global_step": 180114, "epoch": 1072} {"train_loss": -11.051141738891602, "global_step": 180115, "epoch": 1072} {"train_loss": -10.849411010742188, "global_step": 180116, "epoch": 1072} {"train_loss": -11.39798355102539, "global_step": 180117, "epoch": 1072} {"train_loss": -10.998502731323242, "global_step": 180118, "epoch": 1072} {"train_loss": -10.140585899353027, "global_step": 180119, "epoch": 1072} {"train_loss": -11.32440185546875, "global_step": 180120, "epoch": 1072} {"train_loss": -10.436588287353516, "global_step": 180121, "epoch": 1072} {"train_loss": -11.01882553100586, "global_step": 180122, "epoch": 1072} {"train_loss": -10.855120658874512, "global_step": 180123, "epoch": 1072} {"train_loss": -10.763989448547363, "global_step": 180124, "epoch": 1072} {"train_loss": -10.815506935119629, "global_step": 180125, "epoch": 1072} {"train_loss": -10.658649444580078, "global_step": 180126, "epoch": 1072} {"train_loss": -10.518404006958008, "global_step": 180127, "epoch": 1072} {"train_loss": -10.634655952453613, "global_step": 180128, "epoch": 1072} {"train_loss": -10.514413833618164, "global_step": 180129, "epoch": 1072} {"train_loss": -10.993468284606934, "global_step": 180130, "epoch": 1072} {"train_loss": -10.550756454467773, "global_step": 180131, "epoch": 1072} {"train_loss": -10.52810287475586, "global_step": 180132, "epoch": 1072} {"train_loss": -10.454561233520508, "global_step": 180133, "epoch": 1072} {"train_loss": -10.173988342285156, "global_step": 180134, "epoch": 1072} {"train_loss": -9.555255889892578, "global_step": 180135, "epoch": 1072} {"train_loss": -9.882465362548828, "global_step": 180136, "epoch": 1072} {"train_loss": -10.042895317077637, "global_step": 180137, "epoch": 1072} {"train_loss": -9.7761869430542, "global_step": 180138, "epoch": 1072} {"train_loss": -10.345354080200195, "global_step": 180139, "epoch": 1072} {"train_loss": -10.67807388305664, "global_step": 180140, "epoch": 1072} {"train_loss": -10.42182731628418, "global_step": 180141, "epoch": 1072} {"train_loss": -10.217816352844238, "global_step": 180142, "epoch": 1072} {"train_loss": -10.02046012878418, "global_step": 180143, "epoch": 1072} {"train_loss": -10.490445137023926, "global_step": 180144, "epoch": 1072} {"train_loss": -9.931203842163086, "global_step": 180145, "epoch": 1072} {"train_loss": -10.421163558959961, "global_step": 180146, "epoch": 1072} {"train_loss": -10.662850379943848, "global_step": 180147, "epoch": 1072} {"train_loss": -10.25081729888916, "global_step": 180148, "epoch": 1072} {"train_loss": -10.486251831054688, "global_step": 180149, "epoch": 1072} {"train_loss": -10.452795028686523, "global_step": 180150, "epoch": 1072} {"train_loss": -10.611391067504883, "global_step": 180151, "epoch": 1072} {"train_loss": -10.825063705444336, "global_step": 180152, "epoch": 1072} {"train_loss": -10.872000694274902, "global_step": 180153, "epoch": 1072} {"train_loss": -10.813507080078125, "global_step": 180154, "epoch": 1072} {"train_loss": -10.977481842041016, "global_step": 180155, "epoch": 1072} {"train_loss": -10.707326889038086, "global_step": 180156, "epoch": 1072} {"train_loss": -10.892127990722656, "global_step": 180157, "epoch": 1072} {"train_loss": -10.937379837036133, "global_step": 180158, "epoch": 1072} {"train_loss": -10.942303657531738, "global_step": 180159, "epoch": 1072} {"train_loss": -11.1069974899292, "global_step": 180160, "epoch": 1072} {"train_loss": -10.57963752746582, "global_step": 180161, "epoch": 1072} {"train_loss": -11.004672050476074, "global_step": 180162, "epoch": 1072} {"train_loss": -10.992477416992188, "global_step": 180163, "epoch": 1072} {"train_loss": -10.926794052124023, "global_step": 180164, "epoch": 1072} {"train_loss": -11.220264434814453, "global_step": 180165, "epoch": 1072} {"train_loss": -10.917969703674316, "global_step": 180166, "epoch": 1072} {"train_loss": -11.226678848266602, "global_step": 180167, "epoch": 1072} {"train_loss": -11.11387825012207, "global_step": 180168, "epoch": 1072} {"train_loss": -11.072410583496094, "global_step": 180169, "epoch": 1072} {"train_loss": -11.189630508422852, "global_step": 180170, "epoch": 1072} {"train_loss": -11.02816390991211, "global_step": 180171, "epoch": 1072} {"train_loss": -11.08531379699707, "global_step": 180172, "epoch": 1072} {"train_loss": -11.241093635559082, "global_step": 180173, "epoch": 1072} {"train_loss": -11.137659072875977, "global_step": 180174, "epoch": 1072} {"train_loss": -11.163710594177246, "global_step": 180175, "epoch": 1072} {"train_loss": -11.413190841674805, "global_step": 180176, "epoch": 1072} {"train_loss": -11.383394241333008, "global_step": 180177, "epoch": 1072} {"train_loss": -11.09570026397705, "global_step": 180178, "epoch": 1072} {"train_loss": -11.445820808410645, "global_step": 180179, "epoch": 1072} {"train_loss": -11.185525894165039, "global_step": 180180, "epoch": 1072} {"train_loss": -11.388059616088867, "global_step": 180181, "epoch": 1072} {"train_loss": -11.267264366149902, "global_step": 180182, "epoch": 1072} {"train_loss": -11.437786102294922, "global_step": 180183, "epoch": 1072} {"train_loss": -11.190603256225586, "global_step": 180184, "epoch": 1072} {"train_loss": -11.445184707641602, "global_step": 180185, "epoch": 1072} {"train_loss": -11.270301818847656, "global_step": 180186, "epoch": 1072} {"train_loss": -11.405558586120605, "global_step": 180187, "epoch": 1072} {"train_loss": -11.313456535339355, "global_step": 180188, "epoch": 1072} {"train_loss": -11.228192329406738, "global_step": 180189, "epoch": 1072} {"train_loss": -11.461828231811523, "global_step": 180190, "epoch": 1072} {"train_loss": -11.409360885620117, "global_step": 180191, "epoch": 1072} {"train_loss": -11.493650436401367, "global_step": 180192, "epoch": 1072} {"train_loss": -11.48446273803711, "global_step": 180193, "epoch": 1072} {"train_loss": -11.489986419677734, "global_step": 180194, "epoch": 1072} {"train_loss": -11.443330764770508, "global_step": 180195, "epoch": 1072} {"train_loss": -11.338094711303711, "global_step": 180196, "epoch": 1072} {"train_loss": -11.702435493469238, "global_step": 180197, "epoch": 1072} {"train_loss": -11.425920486450195, "global_step": 180198, "epoch": 1072} {"train_loss": -11.455995559692383, "global_step": 180199, "epoch": 1072} {"train_loss": -11.472665786743164, "global_step": 180200, "epoch": 1072} {"train_loss": -11.579486846923828, "global_step": 180201, "epoch": 1072} {"train_loss": -11.176370620727539, "global_step": 180202, "epoch": 1072} {"train_loss": -11.54822063446045, "global_step": 180203, "epoch": 1072} {"train_loss": -11.515533447265625, "global_step": 180204, "epoch": 1072} {"train_loss": -11.329019546508789, "global_step": 180205, "epoch": 1072} {"train_loss": -11.42872428894043, "global_step": 180206, "epoch": 1072} {"train_loss": -11.199899673461914, "global_step": 180207, "epoch": 1072} {"train_loss": -10.356758117675781, "global_step": 180208, "epoch": 1072} {"train_loss": -9.563634872436523, "global_step": 180209, "epoch": 1072} {"train_loss": -11.20176887512207, "global_step": 180210, "epoch": 1072} {"train_loss": -8.879054069519043, "global_step": 180211, "epoch": 1072} {"train_loss": -9.39023208618164, "global_step": 180212, "epoch": 1072} {"train_loss": -8.272863388061523, "global_step": 180213, "epoch": 1072} {"train_loss": -8.823031425476074, "global_step": 180214, "epoch": 1072} {"train_loss": -6.873026371002197, "global_step": 180215, "epoch": 1072} {"train_loss": -6.645914077758789, "global_step": 180216, "epoch": 1072} {"train_loss": -8.075972557067871, "global_step": 180217, "epoch": 1072} {"train_loss": -7.931051254272461, "global_step": 180218, "epoch": 1072} {"train_loss": -8.487462043762207, "global_step": 180219, "epoch": 1072} {"train_loss": -9.575883865356445, "global_step": 180220, "epoch": 1072} {"train_loss": -8.707746505737305, "global_step": 180221, "epoch": 1072} {"train_loss": -9.80901050567627, "global_step": 180222, "epoch": 1072} {"train_loss": -10.3452787399292, "global_step": 180223, "epoch": 1072} {"train_loss": -10.140340805053711, "global_step": 180224, "epoch": 1072} {"train_loss": -9.9713716506958, "global_step": 180225, "epoch": 1072} {"train_loss": -10.17544937133789, "global_step": 180226, "epoch": 1072} {"train_loss": -9.440534591674805, "global_step": 180227, "epoch": 1072} {"train_loss": -9.768705368041992, "global_step": 180228, "epoch": 1072} {"train_loss": -9.758270263671875, "global_step": 180229, "epoch": 1072} {"train_loss": -9.26748275756836, "global_step": 180230, "epoch": 1072} {"train_loss": -9.856155395507812, "global_step": 180231, "epoch": 1072} {"train_loss": -10.130796432495117, "global_step": 180232, "epoch": 1072} {"train_loss": -9.464345932006836, "global_step": 180233, "epoch": 1072} {"train_loss": -10.615364074707031, "global_step": 180234, "epoch": 1072} {"train_loss": -10.492976188659668, "global_step": 180235, "epoch": 1072} {"train_loss": -9.632575988769531, "global_step": 180236, "epoch": 1072} {"train_loss": -10.106799125671387, "global_step": 180237, "epoch": 1072} {"train_loss": -10.685054779052734, "global_step": 180238, "epoch": 1072} {"train_loss": -9.656244277954102, "global_step": 180239, "epoch": 1072} {"train_loss": -10.403846740722656, "global_step": 180240, "epoch": 1072} {"train_loss": -10.847539901733398, "global_step": 180241, "epoch": 1072} {"train_loss": -10.368453025817871, "global_step": 180242, "epoch": 1072} {"train_loss": -10.638442993164062, "global_step": 180243, "epoch": 1072} {"train_loss": -10.383487701416016, "global_step": 180244, "epoch": 1072} {"train_loss": -10.51156234741211, "global_step": 180245, "epoch": 1072} {"train_loss": -10.360727310180664, "global_step": 180246, "epoch": 1072} {"train_loss": -10.679244995117188, "global_step": 180247, "epoch": 1072} {"train_loss": -10.913928985595703, "global_step": 180248, "epoch": 1072} {"train_loss": -10.75972843170166, "global_step": 180249, "epoch": 1072} {"train_loss": -10.702128410339355, "global_step": 180250, "epoch": 1072} {"train_loss": -10.940120697021484, "global_step": 180251, "epoch": 1072} {"train_loss": -10.812402725219727, "global_step": 180252, "epoch": 1072} {"train_loss": -10.629478454589844, "global_step": 180253, "epoch": 1072} {"train_loss": -10.795893669128418, "global_step": 180254, "epoch": 1072} {"train_loss": -10.72944164276123, "global_step": 180255, "epoch": 1072} {"train_loss": -10.998444557189941, "global_step": 180256, "epoch": 1072} {"train_loss": -10.971118927001953, "global_step": 180257, "epoch": 1072} {"train_loss": -11.070866584777832, "global_step": 180258, "epoch": 1072} {"train_loss": -11.197980880737305, "global_step": 180259, "epoch": 1072} {"train_loss": -11.007827758789062, "global_step": 180260, "epoch": 1072} {"train_loss": -11.191827774047852, "global_step": 180261, "epoch": 1072} {"train_loss": -11.153736114501953, "global_step": 180262, "epoch": 1072} {"train_loss": -10.644437367007846, "global_step": 180263, "epoch": 1072, "val_loss": 239022.21875} {"train_loss": -11.052846908569336, "global_step": 180264, "epoch": 1073} {"train_loss": -10.968564987182617, "global_step": 180265, "epoch": 1073} {"train_loss": -10.949047088623047, "global_step": 180266, "epoch": 1073} {"train_loss": -11.188911437988281, "global_step": 180267, "epoch": 1073} {"train_loss": -11.133146286010742, "global_step": 180268, "epoch": 1073} {"train_loss": -11.293978691101074, "global_step": 180269, "epoch": 1073} {"train_loss": -11.255426406860352, "global_step": 180270, "epoch": 1073} {"train_loss": -11.390216827392578, "global_step": 180271, "epoch": 1073} {"train_loss": -11.297320365905762, "global_step": 180272, "epoch": 1073} {"train_loss": -11.214825630187988, "global_step": 180273, "epoch": 1073} {"train_loss": -11.313735961914062, "global_step": 180274, "epoch": 1073} {"train_loss": -11.153791427612305, "global_step": 180275, "epoch": 1073} {"train_loss": -11.153818130493164, "global_step": 180276, "epoch": 1073} {"train_loss": -11.082174301147461, "global_step": 180277, "epoch": 1073} {"train_loss": -11.505008697509766, "global_step": 180278, "epoch": 1073} {"train_loss": -11.412739753723145, "global_step": 180279, "epoch": 1073} {"train_loss": -11.43904972076416, "global_step": 180280, "epoch": 1073} {"train_loss": -11.1729154586792, "global_step": 180281, "epoch": 1073} {"train_loss": -11.31161117553711, "global_step": 180282, "epoch": 1073} {"train_loss": -11.245002746582031, "global_step": 180283, "epoch": 1073} {"train_loss": -11.310304641723633, "global_step": 180284, "epoch": 1073} {"train_loss": -11.07251262664795, "global_step": 180285, "epoch": 1073} {"train_loss": -11.439508438110352, "global_step": 180286, "epoch": 1073} {"train_loss": -11.300527572631836, "global_step": 180287, "epoch": 1073} {"train_loss": -11.31346321105957, "global_step": 180288, "epoch": 1073} {"train_loss": -11.380060195922852, "global_step": 180289, "epoch": 1073} {"train_loss": -11.366838455200195, "global_step": 180290, "epoch": 1073} {"train_loss": -11.361104965209961, "global_step": 180291, "epoch": 1073} {"train_loss": -11.557526588439941, "global_step": 180292, "epoch": 1073} {"train_loss": -11.475163459777832, "global_step": 180293, "epoch": 1073} {"train_loss": -11.28196907043457, "global_step": 180294, "epoch": 1073} {"train_loss": -11.44608211517334, "global_step": 180295, "epoch": 1073} {"train_loss": -11.423942565917969, "global_step": 180296, "epoch": 1073} {"train_loss": -11.222347259521484, "global_step": 180297, "epoch": 1073} {"train_loss": -11.342496871948242, "global_step": 180298, "epoch": 1073} {"train_loss": -11.157824516296387, "global_step": 180299, "epoch": 1073} {"train_loss": -11.059975624084473, "global_step": 180300, "epoch": 1073} {"train_loss": -11.120063781738281, "global_step": 180301, "epoch": 1073} {"train_loss": -11.245893478393555, "global_step": 180302, "epoch": 1073} {"train_loss": -11.11460018157959, "global_step": 180303, "epoch": 1073} {"train_loss": -11.15001392364502, "global_step": 180304, "epoch": 1073} {"train_loss": -11.400969505310059, "global_step": 180305, "epoch": 1073} {"train_loss": -11.098430633544922, "global_step": 180306, "epoch": 1073} {"train_loss": -10.748513221740723, "global_step": 180307, "epoch": 1073} {"train_loss": -10.947458267211914, "global_step": 180308, "epoch": 1073} {"train_loss": -11.093717575073242, "global_step": 180309, "epoch": 1073} {"train_loss": -10.973207473754883, "global_step": 180310, "epoch": 1073} {"train_loss": -11.192066192626953, "global_step": 180311, "epoch": 1073} {"train_loss": -11.130966186523438, "global_step": 180312, "epoch": 1073} {"train_loss": -11.216169357299805, "global_step": 180313, "epoch": 1073} {"train_loss": -11.232978820800781, "global_step": 180314, "epoch": 1073} {"train_loss": -10.798835754394531, "global_step": 180315, "epoch": 1073} {"train_loss": -11.185686111450195, "global_step": 180316, "epoch": 1073} {"train_loss": -10.871143341064453, "global_step": 180317, "epoch": 1073} {"train_loss": -10.690242767333984, "global_step": 180318, "epoch": 1073} {"train_loss": -11.18126392364502, "global_step": 180319, "epoch": 1073} {"train_loss": -10.806697845458984, "global_step": 180320, "epoch": 1073} {"train_loss": -10.916687965393066, "global_step": 180321, "epoch": 1073} {"train_loss": -11.132611274719238, "global_step": 180322, "epoch": 1073} {"train_loss": -11.147079467773438, "global_step": 180323, "epoch": 1073} {"train_loss": -11.319999694824219, "global_step": 180324, "epoch": 1073} {"train_loss": -11.056109428405762, "global_step": 180325, "epoch": 1073} {"train_loss": -11.17828369140625, "global_step": 180326, "epoch": 1073} {"train_loss": -11.215269088745117, "global_step": 180327, "epoch": 1073} {"train_loss": -11.03219985961914, "global_step": 180328, "epoch": 1073} {"train_loss": -11.319765090942383, "global_step": 180329, "epoch": 1073} {"train_loss": -10.925494194030762, "global_step": 180330, "epoch": 1073} {"train_loss": -10.402860641479492, "global_step": 180331, "epoch": 1073} {"train_loss": -11.020030975341797, "global_step": 180332, "epoch": 1073} {"train_loss": -10.595830917358398, "global_step": 180333, "epoch": 1073} {"train_loss": -9.860662460327148, "global_step": 180334, "epoch": 1073} {"train_loss": -10.971794128417969, "global_step": 180335, "epoch": 1073} {"train_loss": -9.299420356750488, "global_step": 180336, "epoch": 1073} {"train_loss": -10.708145141601562, "global_step": 180337, "epoch": 1073} {"train_loss": -9.72981071472168, "global_step": 180338, "epoch": 1073} {"train_loss": -10.724893569946289, "global_step": 180339, "epoch": 1073} {"train_loss": -10.298603057861328, "global_step": 180340, "epoch": 1073} {"train_loss": -10.056821823120117, "global_step": 180341, "epoch": 1073} {"train_loss": -10.049260139465332, "global_step": 180342, "epoch": 1073} {"train_loss": -10.03364372253418, "global_step": 180343, "epoch": 1073} {"train_loss": -10.479799270629883, "global_step": 180344, "epoch": 1073} {"train_loss": -10.10389518737793, "global_step": 180345, "epoch": 1073} {"train_loss": -10.718683242797852, "global_step": 180346, "epoch": 1073} {"train_loss": -10.338488578796387, "global_step": 180347, "epoch": 1073} {"train_loss": -10.91596794128418, "global_step": 180348, "epoch": 1073} {"train_loss": -10.64279556274414, "global_step": 180349, "epoch": 1073} {"train_loss": -11.02001953125, "global_step": 180350, "epoch": 1073} {"train_loss": -10.872859954833984, "global_step": 180351, "epoch": 1073} {"train_loss": -11.072755813598633, "global_step": 180352, "epoch": 1073} {"train_loss": -10.66862678527832, "global_step": 180353, "epoch": 1073} {"train_loss": -11.180197715759277, "global_step": 180354, "epoch": 1073} {"train_loss": -10.672380447387695, "global_step": 180355, "epoch": 1073} {"train_loss": -11.103440284729004, "global_step": 180356, "epoch": 1073} {"train_loss": -10.964954376220703, "global_step": 180357, "epoch": 1073} {"train_loss": -11.169649124145508, "global_step": 180358, "epoch": 1073} {"train_loss": -11.00658893585205, "global_step": 180359, "epoch": 1073} {"train_loss": -11.119124412536621, "global_step": 180360, "epoch": 1073} {"train_loss": -11.311275482177734, "global_step": 180361, "epoch": 1073} {"train_loss": -11.257150650024414, "global_step": 180362, "epoch": 1073} {"train_loss": -10.957998275756836, "global_step": 180363, "epoch": 1073} {"train_loss": -11.019342422485352, "global_step": 180364, "epoch": 1073} {"train_loss": -10.781522750854492, "global_step": 180365, "epoch": 1073} {"train_loss": -11.25235366821289, "global_step": 180366, "epoch": 1073} {"train_loss": -10.850173950195312, "global_step": 180367, "epoch": 1073} {"train_loss": -10.869016647338867, "global_step": 180368, "epoch": 1073} {"train_loss": -10.92119026184082, "global_step": 180369, "epoch": 1073} {"train_loss": -11.250299453735352, "global_step": 180370, "epoch": 1073} {"train_loss": -10.953649520874023, "global_step": 180371, "epoch": 1073} {"train_loss": -11.10194206237793, "global_step": 180372, "epoch": 1073} {"train_loss": -11.116299629211426, "global_step": 180373, "epoch": 1073} {"train_loss": -11.150160789489746, "global_step": 180374, "epoch": 1073} {"train_loss": -11.254030227661133, "global_step": 180375, "epoch": 1073} {"train_loss": -11.056411743164062, "global_step": 180376, "epoch": 1073} {"train_loss": -11.261009216308594, "global_step": 180377, "epoch": 1073} {"train_loss": -11.014091491699219, "global_step": 180378, "epoch": 1073} {"train_loss": -11.202899932861328, "global_step": 180379, "epoch": 1073} {"train_loss": -11.273908615112305, "global_step": 180380, "epoch": 1073} {"train_loss": -11.145838737487793, "global_step": 180381, "epoch": 1073} {"train_loss": -11.176156044006348, "global_step": 180382, "epoch": 1073} {"train_loss": -11.072178840637207, "global_step": 180383, "epoch": 1073} {"train_loss": -11.376620292663574, "global_step": 180384, "epoch": 1073} {"train_loss": -11.265454292297363, "global_step": 180385, "epoch": 1073} {"train_loss": -11.317819595336914, "global_step": 180386, "epoch": 1073} {"train_loss": -11.333535194396973, "global_step": 180387, "epoch": 1073} {"train_loss": -11.317649841308594, "global_step": 180388, "epoch": 1073} {"train_loss": -11.500892639160156, "global_step": 180389, "epoch": 1073} {"train_loss": -11.213766098022461, "global_step": 180390, "epoch": 1073} {"train_loss": -11.517715454101562, "global_step": 180391, "epoch": 1073} {"train_loss": -11.372417449951172, "global_step": 180392, "epoch": 1073} {"train_loss": -11.407718658447266, "global_step": 180393, "epoch": 1073} {"train_loss": -11.301603317260742, "global_step": 180394, "epoch": 1073} {"train_loss": -11.450372695922852, "global_step": 180395, "epoch": 1073} {"train_loss": -11.452249526977539, "global_step": 180396, "epoch": 1073} {"train_loss": -11.232025146484375, "global_step": 180397, "epoch": 1073} {"train_loss": -11.127458572387695, "global_step": 180398, "epoch": 1073} {"train_loss": -11.533194541931152, "global_step": 180399, "epoch": 1073} {"train_loss": -11.157380104064941, "global_step": 180400, "epoch": 1073} {"train_loss": -11.366922378540039, "global_step": 180401, "epoch": 1073} {"train_loss": -11.297676086425781, "global_step": 180402, "epoch": 1073} {"train_loss": -11.381038665771484, "global_step": 180403, "epoch": 1073} {"train_loss": -11.569463729858398, "global_step": 180404, "epoch": 1073} {"train_loss": -11.387018203735352, "global_step": 180405, "epoch": 1073} {"train_loss": -11.563811302185059, "global_step": 180406, "epoch": 1073} {"train_loss": -11.054540634155273, "global_step": 180407, "epoch": 1073} {"train_loss": -11.485549926757812, "global_step": 180408, "epoch": 1073} {"train_loss": -10.65518569946289, "global_step": 180409, "epoch": 1073} {"train_loss": -11.259788513183594, "global_step": 180410, "epoch": 1073} {"train_loss": -11.38415241241455, "global_step": 180411, "epoch": 1073} {"train_loss": -10.731978416442871, "global_step": 180412, "epoch": 1073} {"train_loss": -10.990619659423828, "global_step": 180413, "epoch": 1073} {"train_loss": -10.620562553405762, "global_step": 180414, "epoch": 1073} {"train_loss": -10.589688301086426, "global_step": 180415, "epoch": 1073} {"train_loss": -11.092605590820312, "global_step": 180416, "epoch": 1073} {"train_loss": -10.74375057220459, "global_step": 180417, "epoch": 1073} {"train_loss": -10.695697784423828, "global_step": 180418, "epoch": 1073} {"train_loss": -10.642099380493164, "global_step": 180419, "epoch": 1073} {"train_loss": -9.920295715332031, "global_step": 180420, "epoch": 1073} {"train_loss": -10.806242942810059, "global_step": 180421, "epoch": 1073} {"train_loss": -9.829719543457031, "global_step": 180422, "epoch": 1073} {"train_loss": -10.818500518798828, "global_step": 180423, "epoch": 1073} {"train_loss": -10.273971557617188, "global_step": 180424, "epoch": 1073} {"train_loss": -11.04694938659668, "global_step": 180425, "epoch": 1073} {"train_loss": -10.654984474182129, "global_step": 180426, "epoch": 1073} {"train_loss": -10.775529861450195, "global_step": 180427, "epoch": 1073} {"train_loss": -10.36427116394043, "global_step": 180428, "epoch": 1073} {"train_loss": -10.514459609985352, "global_step": 180429, "epoch": 1073} {"train_loss": -11.268584251403809, "global_step": 180430, "epoch": 1073} {"train_loss": -11.027219062759762, "global_step": 180431, "epoch": 1073, "val_loss": 243832.03125} {"train_loss": -10.855539321899414, "global_step": 180432, "epoch": 1074} {"train_loss": -9.805826187133789, "global_step": 180433, "epoch": 1074} {"train_loss": -10.84736156463623, "global_step": 180434, "epoch": 1074} {"train_loss": -10.068256378173828, "global_step": 180435, "epoch": 1074} {"train_loss": -10.55118179321289, "global_step": 180436, "epoch": 1074} {"train_loss": -10.193255424499512, "global_step": 180437, "epoch": 1074} {"train_loss": -10.780941009521484, "global_step": 180438, "epoch": 1074} {"train_loss": -10.509530067443848, "global_step": 180439, "epoch": 1074} {"train_loss": -10.263383865356445, "global_step": 180440, "epoch": 1074} {"train_loss": -10.651043891906738, "global_step": 180441, "epoch": 1074} {"train_loss": -10.579475402832031, "global_step": 180442, "epoch": 1074} {"train_loss": -10.610824584960938, "global_step": 180443, "epoch": 1074} {"train_loss": -10.744085311889648, "global_step": 180444, "epoch": 1074} {"train_loss": -10.632669448852539, "global_step": 180445, "epoch": 1074} {"train_loss": -10.63235855102539, "global_step": 180446, "epoch": 1074} {"train_loss": -10.907337188720703, "global_step": 180447, "epoch": 1074} {"train_loss": -10.904571533203125, "global_step": 180448, "epoch": 1074} {"train_loss": -11.056072235107422, "global_step": 180449, "epoch": 1074} {"train_loss": -10.926219940185547, "global_step": 180450, "epoch": 1074} {"train_loss": -10.93690299987793, "global_step": 180451, "epoch": 1074} {"train_loss": -11.087909698486328, "global_step": 180452, "epoch": 1074} {"train_loss": -11.224910736083984, "global_step": 180453, "epoch": 1074} {"train_loss": -10.996077537536621, "global_step": 180454, "epoch": 1074} {"train_loss": -11.05518913269043, "global_step": 180455, "epoch": 1074} {"train_loss": -11.103267669677734, "global_step": 180456, "epoch": 1074} {"train_loss": -11.217939376831055, "global_step": 180457, "epoch": 1074} {"train_loss": -11.11886215209961, "global_step": 180458, "epoch": 1074} {"train_loss": -11.009769439697266, "global_step": 180459, "epoch": 1074} {"train_loss": -11.306431770324707, "global_step": 180460, "epoch": 1074} {"train_loss": -11.0614595413208, "global_step": 180461, "epoch": 1074} {"train_loss": -11.0437650680542, "global_step": 180462, "epoch": 1074} {"train_loss": -11.10311222076416, "global_step": 180463, "epoch": 1074} {"train_loss": -11.23749828338623, "global_step": 180464, "epoch": 1074} {"train_loss": -11.353837966918945, "global_step": 180465, "epoch": 1074} {"train_loss": -11.345807075500488, "global_step": 180466, "epoch": 1074} {"train_loss": -11.048702239990234, "global_step": 180467, "epoch": 1074} {"train_loss": -11.252957344055176, "global_step": 180468, "epoch": 1074} {"train_loss": -11.465302467346191, "global_step": 180469, "epoch": 1074} {"train_loss": -11.38753604888916, "global_step": 180470, "epoch": 1074} {"train_loss": -11.237956047058105, "global_step": 180471, "epoch": 1074} {"train_loss": -11.407148361206055, "global_step": 180472, "epoch": 1074} {"train_loss": -11.35761547088623, "global_step": 180473, "epoch": 1074} {"train_loss": -11.149205207824707, "global_step": 180474, "epoch": 1074} {"train_loss": -11.452098846435547, "global_step": 180475, "epoch": 1074} {"train_loss": -11.156508445739746, "global_step": 180476, "epoch": 1074} {"train_loss": -11.4932861328125, "global_step": 180477, "epoch": 1074} {"train_loss": -11.283745765686035, "global_step": 180478, "epoch": 1074} {"train_loss": -11.46867847442627, "global_step": 180479, "epoch": 1074} {"train_loss": -11.441900253295898, "global_step": 180480, "epoch": 1074} {"train_loss": -11.411702156066895, "global_step": 180481, "epoch": 1074} {"train_loss": -11.403030395507812, "global_step": 180482, "epoch": 1074} {"train_loss": -11.529809951782227, "global_step": 180483, "epoch": 1074} {"train_loss": -11.264780044555664, "global_step": 180484, "epoch": 1074} {"train_loss": -11.327275276184082, "global_step": 180485, "epoch": 1074} {"train_loss": -11.474538803100586, "global_step": 180486, "epoch": 1074} {"train_loss": -11.231964111328125, "global_step": 180487, "epoch": 1074} {"train_loss": -11.115234375, "global_step": 180488, "epoch": 1074} {"train_loss": -11.554350852966309, "global_step": 180489, "epoch": 1074} {"train_loss": -11.146491050720215, "global_step": 180490, "epoch": 1074} {"train_loss": -11.121465682983398, "global_step": 180491, "epoch": 1074} {"train_loss": -11.314769744873047, "global_step": 180492, "epoch": 1074} {"train_loss": -11.119893074035645, "global_step": 180493, "epoch": 1074} {"train_loss": -11.18287467956543, "global_step": 180494, "epoch": 1074} {"train_loss": -11.22397518157959, "global_step": 180495, "epoch": 1074} {"train_loss": -11.214615821838379, "global_step": 180496, "epoch": 1074} {"train_loss": -10.742713928222656, "global_step": 180497, "epoch": 1074} {"train_loss": -9.653261184692383, "global_step": 180498, "epoch": 1074} {"train_loss": -10.891934394836426, "global_step": 180499, "epoch": 1074} {"train_loss": -11.005266189575195, "global_step": 180500, "epoch": 1074} {"train_loss": -10.623046875, "global_step": 180501, "epoch": 1074} {"train_loss": -11.62771987915039, "global_step": 180502, "epoch": 1074} {"train_loss": -10.534948348999023, "global_step": 180503, "epoch": 1074} {"train_loss": -10.915207862854004, "global_step": 180504, "epoch": 1074} {"train_loss": -10.532092094421387, "global_step": 180505, "epoch": 1074} {"train_loss": -10.44509506225586, "global_step": 180506, "epoch": 1074} {"train_loss": -11.080361366271973, "global_step": 180507, "epoch": 1074} {"train_loss": -10.788671493530273, "global_step": 180508, "epoch": 1074} {"train_loss": -10.348457336425781, "global_step": 180509, "epoch": 1074} {"train_loss": -11.012913703918457, "global_step": 180510, "epoch": 1074} {"train_loss": -10.779065132141113, "global_step": 180511, "epoch": 1074} {"train_loss": -10.543318748474121, "global_step": 180512, "epoch": 1074} {"train_loss": -11.04030990600586, "global_step": 180513, "epoch": 1074} {"train_loss": -10.896275520324707, "global_step": 180514, "epoch": 1074} {"train_loss": -11.089606285095215, "global_step": 180515, "epoch": 1074} {"train_loss": -10.775199890136719, "global_step": 180516, "epoch": 1074} {"train_loss": -11.158793449401855, "global_step": 180517, "epoch": 1074} {"train_loss": -10.947113037109375, "global_step": 180518, "epoch": 1074} {"train_loss": -10.980589866638184, "global_step": 180519, "epoch": 1074} {"train_loss": -11.09909439086914, "global_step": 180520, "epoch": 1074} {"train_loss": -11.25056266784668, "global_step": 180521, "epoch": 1074} {"train_loss": -11.236774444580078, "global_step": 180522, "epoch": 1074} {"train_loss": -11.26840591430664, "global_step": 180523, "epoch": 1074} {"train_loss": -11.198652267456055, "global_step": 180524, "epoch": 1074} {"train_loss": -11.199302673339844, "global_step": 180525, "epoch": 1074} {"train_loss": -11.035204887390137, "global_step": 180526, "epoch": 1074} {"train_loss": -11.479047775268555, "global_step": 180527, "epoch": 1074} {"train_loss": -11.51407241821289, "global_step": 180528, "epoch": 1074} {"train_loss": -11.010459899902344, "global_step": 180529, "epoch": 1074} {"train_loss": -11.34449291229248, "global_step": 180530, "epoch": 1074} {"train_loss": -10.62434196472168, "global_step": 180531, "epoch": 1074} {"train_loss": -11.265127182006836, "global_step": 180532, "epoch": 1074} {"train_loss": -10.898689270019531, "global_step": 180533, "epoch": 1074} {"train_loss": -10.927562713623047, "global_step": 180534, "epoch": 1074} {"train_loss": -10.762325286865234, "global_step": 180535, "epoch": 1074} {"train_loss": -10.944563865661621, "global_step": 180536, "epoch": 1074} {"train_loss": -10.977804183959961, "global_step": 180537, "epoch": 1074} {"train_loss": -11.02757740020752, "global_step": 180538, "epoch": 1074} {"train_loss": -11.103507995605469, "global_step": 180539, "epoch": 1074} {"train_loss": -11.011697769165039, "global_step": 180540, "epoch": 1074} {"train_loss": -10.934272766113281, "global_step": 180541, "epoch": 1074} {"train_loss": -10.985725402832031, "global_step": 180542, "epoch": 1074} {"train_loss": -11.071109771728516, "global_step": 180543, "epoch": 1074} {"train_loss": -11.166187286376953, "global_step": 180544, "epoch": 1074} {"train_loss": -11.346308708190918, "global_step": 180545, "epoch": 1074} {"train_loss": -11.112019538879395, "global_step": 180546, "epoch": 1074} {"train_loss": -11.31096076965332, "global_step": 180547, "epoch": 1074} {"train_loss": -11.498180389404297, "global_step": 180548, "epoch": 1074} {"train_loss": -11.179227828979492, "global_step": 180549, "epoch": 1074} {"train_loss": -11.251907348632812, "global_step": 180550, "epoch": 1074} {"train_loss": -11.023959159851074, "global_step": 180551, "epoch": 1074} {"train_loss": -10.971427917480469, "global_step": 180552, "epoch": 1074} {"train_loss": -10.997495651245117, "global_step": 180553, "epoch": 1074} {"train_loss": -11.340694427490234, "global_step": 180554, "epoch": 1074} {"train_loss": -11.160346984863281, "global_step": 180555, "epoch": 1074} {"train_loss": -10.514735221862793, "global_step": 180556, "epoch": 1074} {"train_loss": -10.267803192138672, "global_step": 180557, "epoch": 1074} {"train_loss": -10.08940315246582, "global_step": 180558, "epoch": 1074} {"train_loss": -9.004507064819336, "global_step": 180559, "epoch": 1074} {"train_loss": -10.599114418029785, "global_step": 180560, "epoch": 1074} {"train_loss": -10.195466041564941, "global_step": 180561, "epoch": 1074} {"train_loss": -10.14599895477295, "global_step": 180562, "epoch": 1074} {"train_loss": -10.842439651489258, "global_step": 180563, "epoch": 1074} {"train_loss": -10.386106491088867, "global_step": 180564, "epoch": 1074} {"train_loss": -10.826183319091797, "global_step": 180565, "epoch": 1074} {"train_loss": -10.08066177368164, "global_step": 180566, "epoch": 1074} {"train_loss": -10.426223754882812, "global_step": 180567, "epoch": 1074} {"train_loss": -10.538473129272461, "global_step": 180568, "epoch": 1074} {"train_loss": -10.377867698669434, "global_step": 180569, "epoch": 1074} {"train_loss": -11.05654525756836, "global_step": 180570, "epoch": 1074} {"train_loss": -10.641427993774414, "global_step": 180571, "epoch": 1074} {"train_loss": -10.077472686767578, "global_step": 180572, "epoch": 1074} {"train_loss": -10.931819915771484, "global_step": 180573, "epoch": 1074} {"train_loss": -10.597612380981445, "global_step": 180574, "epoch": 1074} {"train_loss": -10.621305465698242, "global_step": 180575, "epoch": 1074} {"train_loss": -10.859108924865723, "global_step": 180576, "epoch": 1074} {"train_loss": -10.714035034179688, "global_step": 180577, "epoch": 1074} {"train_loss": -10.800525665283203, "global_step": 180578, "epoch": 1074} {"train_loss": -10.982876777648926, "global_step": 180579, "epoch": 1074} {"train_loss": -10.736316680908203, "global_step": 180580, "epoch": 1074} {"train_loss": -10.907112121582031, "global_step": 180581, "epoch": 1074} {"train_loss": -10.76939868927002, "global_step": 180582, "epoch": 1074} {"train_loss": -11.023210525512695, "global_step": 180583, "epoch": 1074} {"train_loss": -11.104366302490234, "global_step": 180584, "epoch": 1074} {"train_loss": -10.950713157653809, "global_step": 180585, "epoch": 1074} {"train_loss": -11.123976707458496, "global_step": 180586, "epoch": 1074} {"train_loss": -11.022501945495605, "global_step": 180587, "epoch": 1074} {"train_loss": -11.165169715881348, "global_step": 180588, "epoch": 1074} {"train_loss": -10.779023170471191, "global_step": 180589, "epoch": 1074} {"train_loss": -11.030843734741211, "global_step": 180590, "epoch": 1074} {"train_loss": -11.124059677124023, "global_step": 180591, "epoch": 1074} {"train_loss": -11.265046119689941, "global_step": 180592, "epoch": 1074} {"train_loss": -11.087148666381836, "global_step": 180593, "epoch": 1074} {"train_loss": -11.155197143554688, "global_step": 180594, "epoch": 1074} {"train_loss": -10.993990898132324, "global_step": 180595, "epoch": 1074} {"train_loss": -11.282153129577637, "global_step": 180596, "epoch": 1074} {"train_loss": -10.988749504089355, "global_step": 180597, "epoch": 1074} {"train_loss": -11.228546142578125, "global_step": 180598, "epoch": 1074} {"train_loss": -10.955559344518752, "global_step": 180599, "epoch": 1074, "val_loss": 246684.921875} {"train_loss": -11.209750175476074, "global_step": 180600, "epoch": 1075} {"train_loss": -11.235523223876953, "global_step": 180601, "epoch": 1075} {"train_loss": -11.175870895385742, "global_step": 180602, "epoch": 1075} {"train_loss": -11.073650360107422, "global_step": 180603, "epoch": 1075} {"train_loss": -11.369543075561523, "global_step": 180604, "epoch": 1075} {"train_loss": -11.089120864868164, "global_step": 180605, "epoch": 1075} {"train_loss": -11.373978614807129, "global_step": 180606, "epoch": 1075} {"train_loss": -11.108053207397461, "global_step": 180607, "epoch": 1075} {"train_loss": -11.461515426635742, "global_step": 180608, "epoch": 1075} {"train_loss": -11.210748672485352, "global_step": 180609, "epoch": 1075} {"train_loss": -11.429180145263672, "global_step": 180610, "epoch": 1075} {"train_loss": -11.512514114379883, "global_step": 180611, "epoch": 1075} {"train_loss": -11.343767166137695, "global_step": 180612, "epoch": 1075} {"train_loss": -11.521541595458984, "global_step": 180613, "epoch": 1075} {"train_loss": -11.390138626098633, "global_step": 180614, "epoch": 1075} {"train_loss": -11.351846694946289, "global_step": 180615, "epoch": 1075} {"train_loss": -11.296451568603516, "global_step": 180616, "epoch": 1075} {"train_loss": -11.22429084777832, "global_step": 180617, "epoch": 1075} {"train_loss": -11.211481094360352, "global_step": 180618, "epoch": 1075} {"train_loss": -11.34044361114502, "global_step": 180619, "epoch": 1075} {"train_loss": -10.946283340454102, "global_step": 180620, "epoch": 1075} {"train_loss": -11.508686065673828, "global_step": 180621, "epoch": 1075} {"train_loss": -10.779916763305664, "global_step": 180622, "epoch": 1075} {"train_loss": -11.431661605834961, "global_step": 180623, "epoch": 1075} {"train_loss": -11.202820777893066, "global_step": 180624, "epoch": 1075} {"train_loss": -11.297341346740723, "global_step": 180625, "epoch": 1075} {"train_loss": -11.183295249938965, "global_step": 180626, "epoch": 1075} {"train_loss": -11.422987937927246, "global_step": 180627, "epoch": 1075} {"train_loss": -11.385469436645508, "global_step": 180628, "epoch": 1075} {"train_loss": -11.169137954711914, "global_step": 180629, "epoch": 1075} {"train_loss": -11.334129333496094, "global_step": 180630, "epoch": 1075} {"train_loss": -11.32379150390625, "global_step": 180631, "epoch": 1075} {"train_loss": -11.470974922180176, "global_step": 180632, "epoch": 1075} {"train_loss": -11.186899185180664, "global_step": 180633, "epoch": 1075} {"train_loss": -11.350274085998535, "global_step": 180634, "epoch": 1075} {"train_loss": -10.98586654663086, "global_step": 180635, "epoch": 1075} {"train_loss": -11.337985038757324, "global_step": 180636, "epoch": 1075} {"train_loss": -11.484268188476562, "global_step": 180637, "epoch": 1075} {"train_loss": -11.404305458068848, "global_step": 180638, "epoch": 1075} {"train_loss": -11.324910163879395, "global_step": 180639, "epoch": 1075} {"train_loss": -11.127641677856445, "global_step": 180640, "epoch": 1075} {"train_loss": -11.342754364013672, "global_step": 180641, "epoch": 1075} {"train_loss": -11.629905700683594, "global_step": 180642, "epoch": 1075} {"train_loss": -11.430228233337402, "global_step": 180643, "epoch": 1075} {"train_loss": -11.535213470458984, "global_step": 180644, "epoch": 1075} {"train_loss": -11.421144485473633, "global_step": 180645, "epoch": 1075} {"train_loss": -11.37783432006836, "global_step": 180646, "epoch": 1075} {"train_loss": -11.429769515991211, "global_step": 180647, "epoch": 1075} {"train_loss": -11.516403198242188, "global_step": 180648, "epoch": 1075} {"train_loss": -11.310361862182617, "global_step": 180649, "epoch": 1075} {"train_loss": -11.573725700378418, "global_step": 180650, "epoch": 1075} {"train_loss": -11.210046768188477, "global_step": 180651, "epoch": 1075} {"train_loss": -10.986539840698242, "global_step": 180652, "epoch": 1075} {"train_loss": -11.436678886413574, "global_step": 180653, "epoch": 1075} {"train_loss": -11.392838478088379, "global_step": 180654, "epoch": 1075} {"train_loss": -11.216692924499512, "global_step": 180655, "epoch": 1075} {"train_loss": -11.250112533569336, "global_step": 180656, "epoch": 1075} {"train_loss": -11.174631118774414, "global_step": 180657, "epoch": 1075} {"train_loss": -11.196122169494629, "global_step": 180658, "epoch": 1075} {"train_loss": -11.524197578430176, "global_step": 180659, "epoch": 1075} {"train_loss": -11.573534965515137, "global_step": 180660, "epoch": 1075} {"train_loss": -11.4464693069458, "global_step": 180661, "epoch": 1075} {"train_loss": -11.495635986328125, "global_step": 180662, "epoch": 1075} {"train_loss": -11.247854232788086, "global_step": 180663, "epoch": 1075} {"train_loss": -11.292940139770508, "global_step": 180664, "epoch": 1075} {"train_loss": -11.50295639038086, "global_step": 180665, "epoch": 1075} {"train_loss": -11.104881286621094, "global_step": 180666, "epoch": 1075} {"train_loss": -11.380131721496582, "global_step": 180667, "epoch": 1075} {"train_loss": -11.539498329162598, "global_step": 180668, "epoch": 1075} {"train_loss": -11.672005653381348, "global_step": 180669, "epoch": 1075} {"train_loss": -11.554248809814453, "global_step": 180670, "epoch": 1075} {"train_loss": -11.707101821899414, "global_step": 180671, "epoch": 1075} {"train_loss": -11.53270435333252, "global_step": 180672, "epoch": 1075} {"train_loss": -11.680166244506836, "global_step": 180673, "epoch": 1075} {"train_loss": -11.128862380981445, "global_step": 180674, "epoch": 1075} {"train_loss": -11.389015197753906, "global_step": 180675, "epoch": 1075} {"train_loss": -10.34091854095459, "global_step": 180676, "epoch": 1075} {"train_loss": -9.71939468383789, "global_step": 180677, "epoch": 1075} {"train_loss": -11.425397872924805, "global_step": 180678, "epoch": 1075} {"train_loss": -10.48460865020752, "global_step": 180679, "epoch": 1075} {"train_loss": -9.172658920288086, "global_step": 180680, "epoch": 1075} {"train_loss": -9.930082321166992, "global_step": 180681, "epoch": 1075} {"train_loss": -10.052940368652344, "global_step": 180682, "epoch": 1075} {"train_loss": -9.37177848815918, "global_step": 180683, "epoch": 1075} {"train_loss": -10.27707290649414, "global_step": 180684, "epoch": 1075} {"train_loss": -6.0202789306640625, "global_step": 180685, "epoch": 1075} {"train_loss": -6.663421154022217, "global_step": 180686, "epoch": 1075} {"train_loss": -6.369930744171143, "global_step": 180687, "epoch": 1075} {"train_loss": -7.773343563079834, "global_step": 180688, "epoch": 1075} {"train_loss": -9.075448989868164, "global_step": 180689, "epoch": 1075} {"train_loss": -9.15087890625, "global_step": 180690, "epoch": 1075} {"train_loss": -7.963486671447754, "global_step": 180691, "epoch": 1075} {"train_loss": -7.546327590942383, "global_step": 180692, "epoch": 1075} {"train_loss": -8.925346374511719, "global_step": 180693, "epoch": 1075} {"train_loss": -9.215032577514648, "global_step": 180694, "epoch": 1075} {"train_loss": -7.813436985015869, "global_step": 180695, "epoch": 1075} {"train_loss": -9.339333534240723, "global_step": 180696, "epoch": 1075} {"train_loss": -8.58955192565918, "global_step": 180697, "epoch": 1075} {"train_loss": -9.69087028503418, "global_step": 180698, "epoch": 1075} {"train_loss": -9.86323356628418, "global_step": 180699, "epoch": 1075} {"train_loss": -9.305534362792969, "global_step": 180700, "epoch": 1075} {"train_loss": -9.361823081970215, "global_step": 180701, "epoch": 1075} {"train_loss": -9.094894409179688, "global_step": 180702, "epoch": 1075} {"train_loss": -10.123619079589844, "global_step": 180703, "epoch": 1075} {"train_loss": -9.950366020202637, "global_step": 180704, "epoch": 1075} {"train_loss": -10.298993110656738, "global_step": 180705, "epoch": 1075} {"train_loss": -10.0216064453125, "global_step": 180706, "epoch": 1075} {"train_loss": -10.327876091003418, "global_step": 180707, "epoch": 1075} {"train_loss": -10.380842208862305, "global_step": 180708, "epoch": 1075} {"train_loss": -10.556215286254883, "global_step": 180709, "epoch": 1075} {"train_loss": -10.099929809570312, "global_step": 180710, "epoch": 1075} {"train_loss": -10.684504508972168, "global_step": 180711, "epoch": 1075} {"train_loss": -10.36384391784668, "global_step": 180712, "epoch": 1075} {"train_loss": -10.15660572052002, "global_step": 180713, "epoch": 1075} {"train_loss": -10.49465560913086, "global_step": 180714, "epoch": 1075} {"train_loss": -10.516728401184082, "global_step": 180715, "epoch": 1075} {"train_loss": -10.340686798095703, "global_step": 180716, "epoch": 1075} {"train_loss": -10.434162139892578, "global_step": 180717, "epoch": 1075} {"train_loss": -10.760846138000488, "global_step": 180718, "epoch": 1075} {"train_loss": -10.390707015991211, "global_step": 180719, "epoch": 1075} {"train_loss": -10.231977462768555, "global_step": 180720, "epoch": 1075} {"train_loss": -10.596879959106445, "global_step": 180721, "epoch": 1075} {"train_loss": -10.497030258178711, "global_step": 180722, "epoch": 1075} {"train_loss": -10.90156364440918, "global_step": 180723, "epoch": 1075} {"train_loss": -10.789934158325195, "global_step": 180724, "epoch": 1075} {"train_loss": -10.969442367553711, "global_step": 180725, "epoch": 1075} {"train_loss": -10.656517028808594, "global_step": 180726, "epoch": 1075} {"train_loss": -10.674488067626953, "global_step": 180727, "epoch": 1075} {"train_loss": -10.999533653259277, "global_step": 180728, "epoch": 1075} {"train_loss": -11.01807689666748, "global_step": 180729, "epoch": 1075} {"train_loss": -11.053107261657715, "global_step": 180730, "epoch": 1075} {"train_loss": -10.999166488647461, "global_step": 180731, "epoch": 1075} {"train_loss": -10.960406303405762, "global_step": 180732, "epoch": 1075} {"train_loss": -10.924309730529785, "global_step": 180733, "epoch": 1075} {"train_loss": -11.022632598876953, "global_step": 180734, "epoch": 1075} {"train_loss": -10.912044525146484, "global_step": 180735, "epoch": 1075} {"train_loss": -10.952234268188477, "global_step": 180736, "epoch": 1075} {"train_loss": -10.932485580444336, "global_step": 180737, "epoch": 1075} {"train_loss": -10.906946182250977, "global_step": 180738, "epoch": 1075} {"train_loss": -11.01980209350586, "global_step": 180739, "epoch": 1075} {"train_loss": -11.019412994384766, "global_step": 180740, "epoch": 1075} {"train_loss": -11.071466445922852, "global_step": 180741, "epoch": 1075} {"train_loss": -11.129892349243164, "global_step": 180742, "epoch": 1075} {"train_loss": -11.048633575439453, "global_step": 180743, "epoch": 1075} {"train_loss": -11.301055908203125, "global_step": 180744, "epoch": 1075} {"train_loss": -11.244549751281738, "global_step": 180745, "epoch": 1075} {"train_loss": -11.186814308166504, "global_step": 180746, "epoch": 1075} {"train_loss": -11.17663860321045, "global_step": 180747, "epoch": 1075} {"train_loss": -11.048040390014648, "global_step": 180748, "epoch": 1075} {"train_loss": -11.31144905090332, "global_step": 180749, "epoch": 1075} {"train_loss": -11.264753341674805, "global_step": 180750, "epoch": 1075} {"train_loss": -11.20429801940918, "global_step": 180751, "epoch": 1075} {"train_loss": -11.206992149353027, "global_step": 180752, "epoch": 1075} {"train_loss": -11.393082618713379, "global_step": 180753, "epoch": 1075} {"train_loss": -11.290645599365234, "global_step": 180754, "epoch": 1075} {"train_loss": -11.343746185302734, "global_step": 180755, "epoch": 1075} {"train_loss": -11.30693244934082, "global_step": 180756, "epoch": 1075} {"train_loss": -11.515426635742188, "global_step": 180757, "epoch": 1075} {"train_loss": -11.523874282836914, "global_step": 180758, "epoch": 1075} {"train_loss": -11.494958877563477, "global_step": 180759, "epoch": 1075} {"train_loss": -11.12500286102295, "global_step": 180760, "epoch": 1075} {"train_loss": -11.309545516967773, "global_step": 180761, "epoch": 1075} {"train_loss": -11.368271827697754, "global_step": 180762, "epoch": 1075} {"train_loss": -11.416756629943848, "global_step": 180763, "epoch": 1075} {"train_loss": -11.495494842529297, "global_step": 180764, "epoch": 1075} {"train_loss": -11.397665023803711, "global_step": 180765, "epoch": 1075} {"train_loss": -11.288394927978516, "global_step": 180766, "epoch": 1075} {"train_loss": -10.792259392284212, "global_step": 180767, "epoch": 1075, "val_loss": 233752.53125, "train_action_mse_error": 0.17587798833847046} {"train_loss": -11.416869163513184, "global_step": 180768, "epoch": 1076} {"train_loss": -11.311691284179688, "global_step": 180769, "epoch": 1076} {"train_loss": -11.296772956848145, "global_step": 180770, "epoch": 1076} {"train_loss": -11.35385513305664, "global_step": 180771, "epoch": 1076} {"train_loss": -11.018386840820312, "global_step": 180772, "epoch": 1076} {"train_loss": -11.178293228149414, "global_step": 180773, "epoch": 1076} {"train_loss": -11.308767318725586, "global_step": 180774, "epoch": 1076} {"train_loss": -10.247148513793945, "global_step": 180775, "epoch": 1076} {"train_loss": -10.732322692871094, "global_step": 180776, "epoch": 1076} {"train_loss": -11.212084770202637, "global_step": 180777, "epoch": 1076} {"train_loss": -10.227394104003906, "global_step": 180778, "epoch": 1076} {"train_loss": -10.291189193725586, "global_step": 180779, "epoch": 1076} {"train_loss": -10.978170394897461, "global_step": 180780, "epoch": 1076} {"train_loss": -10.355720520019531, "global_step": 180781, "epoch": 1076} {"train_loss": -11.039551734924316, "global_step": 180782, "epoch": 1076} {"train_loss": -11.327988624572754, "global_step": 180783, "epoch": 1076} {"train_loss": -10.765941619873047, "global_step": 180784, "epoch": 1076} {"train_loss": -11.324017524719238, "global_step": 180785, "epoch": 1076} {"train_loss": -10.5599946975708, "global_step": 180786, "epoch": 1076} {"train_loss": -10.914436340332031, "global_step": 180787, "epoch": 1076} {"train_loss": -11.010181427001953, "global_step": 180788, "epoch": 1076} {"train_loss": -10.063358306884766, "global_step": 180789, "epoch": 1076} {"train_loss": -10.179420471191406, "global_step": 180790, "epoch": 1076} {"train_loss": -10.99628734588623, "global_step": 180791, "epoch": 1076} {"train_loss": -10.595447540283203, "global_step": 180792, "epoch": 1076} {"train_loss": -11.386926651000977, "global_step": 180793, "epoch": 1076} {"train_loss": -10.70264720916748, "global_step": 180794, "epoch": 1076} {"train_loss": -10.987762451171875, "global_step": 180795, "epoch": 1076} {"train_loss": -10.87289047241211, "global_step": 180796, "epoch": 1076} {"train_loss": -10.581317901611328, "global_step": 180797, "epoch": 1076} {"train_loss": -10.926759719848633, "global_step": 180798, "epoch": 1076} {"train_loss": -10.534135818481445, "global_step": 180799, "epoch": 1076} {"train_loss": -10.883929252624512, "global_step": 180800, "epoch": 1076} {"train_loss": -10.120122909545898, "global_step": 180801, "epoch": 1076} {"train_loss": -10.84310531616211, "global_step": 180802, "epoch": 1076} {"train_loss": -10.38729190826416, "global_step": 180803, "epoch": 1076} {"train_loss": -9.990747451782227, "global_step": 180804, "epoch": 1076} {"train_loss": -10.46896743774414, "global_step": 180805, "epoch": 1076} {"train_loss": -10.184236526489258, "global_step": 180806, "epoch": 1076} {"train_loss": -10.726730346679688, "global_step": 180807, "epoch": 1076} {"train_loss": -10.783018112182617, "global_step": 180808, "epoch": 1076} {"train_loss": -10.235932350158691, "global_step": 180809, "epoch": 1076} {"train_loss": -11.12036418914795, "global_step": 180810, "epoch": 1076} {"train_loss": -10.346430778503418, "global_step": 180811, "epoch": 1076} {"train_loss": -10.704099655151367, "global_step": 180812, "epoch": 1076} {"train_loss": -10.788232803344727, "global_step": 180813, "epoch": 1076} {"train_loss": -10.703117370605469, "global_step": 180814, "epoch": 1076} {"train_loss": -10.689050674438477, "global_step": 180815, "epoch": 1076} {"train_loss": -11.032238006591797, "global_step": 180816, "epoch": 1076} {"train_loss": -10.663126945495605, "global_step": 180817, "epoch": 1076} {"train_loss": -11.234238624572754, "global_step": 180818, "epoch": 1076} {"train_loss": -10.93823528289795, "global_step": 180819, "epoch": 1076} {"train_loss": -10.901866912841797, "global_step": 180820, "epoch": 1076} {"train_loss": -10.90945053100586, "global_step": 180821, "epoch": 1076} {"train_loss": -10.977617263793945, "global_step": 180822, "epoch": 1076} {"train_loss": -10.948698043823242, "global_step": 180823, "epoch": 1076} {"train_loss": -11.062067985534668, "global_step": 180824, "epoch": 1076} {"train_loss": -11.182141304016113, "global_step": 180825, "epoch": 1076} {"train_loss": -10.922622680664062, "global_step": 180826, "epoch": 1076} {"train_loss": -11.141493797302246, "global_step": 180827, "epoch": 1076} {"train_loss": -11.285268783569336, "global_step": 180828, "epoch": 1076} {"train_loss": -11.012864112854004, "global_step": 180829, "epoch": 1076} {"train_loss": -11.150720596313477, "global_step": 180830, "epoch": 1076} {"train_loss": -11.345422744750977, "global_step": 180831, "epoch": 1076} {"train_loss": -11.095197677612305, "global_step": 180832, "epoch": 1076} {"train_loss": -11.114736557006836, "global_step": 180833, "epoch": 1076} {"train_loss": -11.116083145141602, "global_step": 180834, "epoch": 1076} {"train_loss": -11.022174835205078, "global_step": 180835, "epoch": 1076} {"train_loss": -11.19965934753418, "global_step": 180836, "epoch": 1076} {"train_loss": -11.246326446533203, "global_step": 180837, "epoch": 1076} {"train_loss": -10.97454833984375, "global_step": 180838, "epoch": 1076} {"train_loss": -11.28623104095459, "global_step": 180839, "epoch": 1076} {"train_loss": -11.143415451049805, "global_step": 180840, "epoch": 1076} {"train_loss": -11.398624420166016, "global_step": 180841, "epoch": 1076} {"train_loss": -11.140788078308105, "global_step": 180842, "epoch": 1076} {"train_loss": -11.230690002441406, "global_step": 180843, "epoch": 1076} {"train_loss": -11.482620239257812, "global_step": 180844, "epoch": 1076} {"train_loss": -11.168542861938477, "global_step": 180845, "epoch": 1076} {"train_loss": -11.300357818603516, "global_step": 180846, "epoch": 1076} {"train_loss": -11.166982650756836, "global_step": 180847, "epoch": 1076} {"train_loss": -11.214292526245117, "global_step": 180848, "epoch": 1076} {"train_loss": -11.188800811767578, "global_step": 180849, "epoch": 1076} {"train_loss": -11.3579683303833, "global_step": 180850, "epoch": 1076} {"train_loss": -11.227104187011719, "global_step": 180851, "epoch": 1076} {"train_loss": -11.424371719360352, "global_step": 180852, "epoch": 1076} {"train_loss": -11.24789047241211, "global_step": 180853, "epoch": 1076} {"train_loss": -11.248953819274902, "global_step": 180854, "epoch": 1076} {"train_loss": -11.461413383483887, "global_step": 180855, "epoch": 1076} {"train_loss": -11.587583541870117, "global_step": 180856, "epoch": 1076} {"train_loss": -11.349481582641602, "global_step": 180857, "epoch": 1076} {"train_loss": -11.358750343322754, "global_step": 180858, "epoch": 1076} {"train_loss": -11.312573432922363, "global_step": 180859, "epoch": 1076} {"train_loss": -11.289146423339844, "global_step": 180860, "epoch": 1076} {"train_loss": -11.316120147705078, "global_step": 180861, "epoch": 1076} {"train_loss": -11.578024864196777, "global_step": 180862, "epoch": 1076} {"train_loss": -11.429290771484375, "global_step": 180863, "epoch": 1076} {"train_loss": -11.527403831481934, "global_step": 180864, "epoch": 1076} {"train_loss": -11.390711784362793, "global_step": 180865, "epoch": 1076} {"train_loss": -11.232429504394531, "global_step": 180866, "epoch": 1076} {"train_loss": -11.43317985534668, "global_step": 180867, "epoch": 1076} {"train_loss": -11.190794944763184, "global_step": 180868, "epoch": 1076} {"train_loss": -11.599038124084473, "global_step": 180869, "epoch": 1076} {"train_loss": -11.366869926452637, "global_step": 180870, "epoch": 1076} {"train_loss": -11.472879409790039, "global_step": 180871, "epoch": 1076} {"train_loss": -11.272112846374512, "global_step": 180872, "epoch": 1076} {"train_loss": -11.15982437133789, "global_step": 180873, "epoch": 1076} {"train_loss": -10.551575660705566, "global_step": 180874, "epoch": 1076} {"train_loss": -8.686151504516602, "global_step": 180875, "epoch": 1076} {"train_loss": -11.422272682189941, "global_step": 180876, "epoch": 1076} {"train_loss": -10.076581954956055, "global_step": 180877, "epoch": 1076} {"train_loss": -10.440930366516113, "global_step": 180878, "epoch": 1076} {"train_loss": -10.097881317138672, "global_step": 180879, "epoch": 1076} {"train_loss": -9.523248672485352, "global_step": 180880, "epoch": 1076} {"train_loss": -7.677630424499512, "global_step": 180881, "epoch": 1076} {"train_loss": -7.051418304443359, "global_step": 180882, "epoch": 1076} {"train_loss": -7.022061347961426, "global_step": 180883, "epoch": 1076} {"train_loss": -7.60440731048584, "global_step": 180884, "epoch": 1076} {"train_loss": -8.772911071777344, "global_step": 180885, "epoch": 1076} {"train_loss": -8.540727615356445, "global_step": 180886, "epoch": 1076} {"train_loss": -8.740439414978027, "global_step": 180887, "epoch": 1076} {"train_loss": -7.485562324523926, "global_step": 180888, "epoch": 1076} {"train_loss": -7.448821544647217, "global_step": 180889, "epoch": 1076} {"train_loss": -8.39126968383789, "global_step": 180890, "epoch": 1076} {"train_loss": -7.81333065032959, "global_step": 180891, "epoch": 1076} {"train_loss": -8.209319114685059, "global_step": 180892, "epoch": 1076} {"train_loss": -9.187276840209961, "global_step": 180893, "epoch": 1076} {"train_loss": -8.752707481384277, "global_step": 180894, "epoch": 1076} {"train_loss": -8.266351699829102, "global_step": 180895, "epoch": 1076} {"train_loss": -9.223917007446289, "global_step": 180896, "epoch": 1076} {"train_loss": -8.97804069519043, "global_step": 180897, "epoch": 1076} {"train_loss": -9.209511756896973, "global_step": 180898, "epoch": 1076} {"train_loss": -9.582216262817383, "global_step": 180899, "epoch": 1076} {"train_loss": -9.418008804321289, "global_step": 180900, "epoch": 1076} {"train_loss": -10.241581916809082, "global_step": 180901, "epoch": 1076} {"train_loss": -9.821249008178711, "global_step": 180902, "epoch": 1076} {"train_loss": -9.987540245056152, "global_step": 180903, "epoch": 1076} {"train_loss": -10.50474739074707, "global_step": 180904, "epoch": 1076} {"train_loss": -10.313912391662598, "global_step": 180905, "epoch": 1076} {"train_loss": -10.274572372436523, "global_step": 180906, "epoch": 1076} {"train_loss": -10.464001655578613, "global_step": 180907, "epoch": 1076} {"train_loss": -10.5955810546875, "global_step": 180908, "epoch": 1076} {"train_loss": -10.34876537322998, "global_step": 180909, "epoch": 1076} {"train_loss": -10.519432067871094, "global_step": 180910, "epoch": 1076} {"train_loss": -10.691688537597656, "global_step": 180911, "epoch": 1076} {"train_loss": -10.736692428588867, "global_step": 180912, "epoch": 1076} {"train_loss": -10.421977996826172, "global_step": 180913, "epoch": 1076} {"train_loss": -10.586885452270508, "global_step": 180914, "epoch": 1076} {"train_loss": -10.39112663269043, "global_step": 180915, "epoch": 1076} {"train_loss": -10.5916109085083, "global_step": 180916, "epoch": 1076} {"train_loss": -10.660689353942871, "global_step": 180917, "epoch": 1076} {"train_loss": -10.70785140991211, "global_step": 180918, "epoch": 1076} {"train_loss": -10.653581619262695, "global_step": 180919, "epoch": 1076} {"train_loss": -10.487354278564453, "global_step": 180920, "epoch": 1076} {"train_loss": -10.695446014404297, "global_step": 180921, "epoch": 1076} {"train_loss": -10.660390853881836, "global_step": 180922, "epoch": 1076} {"train_loss": -10.76675033569336, "global_step": 180923, "epoch": 1076} {"train_loss": -10.76379680633545, "global_step": 180924, "epoch": 1076} {"train_loss": -11.175243377685547, "global_step": 180925, "epoch": 1076} {"train_loss": -10.792439460754395, "global_step": 180926, "epoch": 1076} {"train_loss": -10.866291046142578, "global_step": 180927, "epoch": 1076} {"train_loss": -10.831502914428711, "global_step": 180928, "epoch": 1076} {"train_loss": -10.786952018737793, "global_step": 180929, "epoch": 1076} {"train_loss": -10.80296516418457, "global_step": 180930, "epoch": 1076} {"train_loss": -11.213362693786621, "global_step": 180931, "epoch": 1076} {"train_loss": -11.114700317382812, "global_step": 180932, "epoch": 1076} {"train_loss": -11.134742736816406, "global_step": 180933, "epoch": 1076} {"train_loss": -10.986202239990234, "global_step": 180934, "epoch": 1076} {"train_loss": -10.587392395450955, "global_step": 180935, "epoch": 1076, "val_loss": 244390.5625} {"train_loss": -11.116572380065918, "global_step": 180936, "epoch": 1077} {"train_loss": -11.024654388427734, "global_step": 180937, "epoch": 1077} {"train_loss": -11.11551284790039, "global_step": 180938, "epoch": 1077} {"train_loss": -11.367206573486328, "global_step": 180939, "epoch": 1077} {"train_loss": -11.359262466430664, "global_step": 180940, "epoch": 1077} {"train_loss": -11.268415451049805, "global_step": 180941, "epoch": 1077} {"train_loss": -11.524334907531738, "global_step": 180942, "epoch": 1077} {"train_loss": -11.241958618164062, "global_step": 180943, "epoch": 1077} {"train_loss": -11.307302474975586, "global_step": 180944, "epoch": 1077} {"train_loss": -11.468015670776367, "global_step": 180945, "epoch": 1077} {"train_loss": -11.438835144042969, "global_step": 180946, "epoch": 1077} {"train_loss": -11.459479331970215, "global_step": 180947, "epoch": 1077} {"train_loss": -11.249507904052734, "global_step": 180948, "epoch": 1077} {"train_loss": -11.108108520507812, "global_step": 180949, "epoch": 1077} {"train_loss": -11.458037376403809, "global_step": 180950, "epoch": 1077} {"train_loss": -11.441574096679688, "global_step": 180951, "epoch": 1077} {"train_loss": -11.50065803527832, "global_step": 180952, "epoch": 1077} {"train_loss": -11.503496170043945, "global_step": 180953, "epoch": 1077} {"train_loss": -11.389630317687988, "global_step": 180954, "epoch": 1077} {"train_loss": -11.45620346069336, "global_step": 180955, "epoch": 1077} {"train_loss": -11.413764953613281, "global_step": 180956, "epoch": 1077} {"train_loss": -11.471820831298828, "global_step": 180957, "epoch": 1077} {"train_loss": -11.340936660766602, "global_step": 180958, "epoch": 1077} {"train_loss": -11.254793167114258, "global_step": 180959, "epoch": 1077} {"train_loss": -11.458480834960938, "global_step": 180960, "epoch": 1077} {"train_loss": -11.409603118896484, "global_step": 180961, "epoch": 1077} {"train_loss": -10.822953224182129, "global_step": 180962, "epoch": 1077} {"train_loss": -10.864324569702148, "global_step": 180963, "epoch": 1077} {"train_loss": -11.350406646728516, "global_step": 180964, "epoch": 1077} {"train_loss": -10.58382797241211, "global_step": 180965, "epoch": 1077} {"train_loss": -10.896991729736328, "global_step": 180966, "epoch": 1077} {"train_loss": -10.811380386352539, "global_step": 180967, "epoch": 1077} {"train_loss": -11.278585433959961, "global_step": 180968, "epoch": 1077} {"train_loss": -11.022069931030273, "global_step": 180969, "epoch": 1077} {"train_loss": -10.321497917175293, "global_step": 180970, "epoch": 1077} {"train_loss": -11.09827709197998, "global_step": 180971, "epoch": 1077} {"train_loss": -10.9143705368042, "global_step": 180972, "epoch": 1077} {"train_loss": -11.142187118530273, "global_step": 180973, "epoch": 1077} {"train_loss": -10.924696922302246, "global_step": 180974, "epoch": 1077} {"train_loss": -11.200427055358887, "global_step": 180975, "epoch": 1077} {"train_loss": -11.136367797851562, "global_step": 180976, "epoch": 1077} {"train_loss": -11.260525703430176, "global_step": 180977, "epoch": 1077} {"train_loss": -11.19392204284668, "global_step": 180978, "epoch": 1077} {"train_loss": -11.06212043762207, "global_step": 180979, "epoch": 1077} {"train_loss": -10.971565246582031, "global_step": 180980, "epoch": 1077} {"train_loss": -11.379215240478516, "global_step": 180981, "epoch": 1077} {"train_loss": -10.677356719970703, "global_step": 180982, "epoch": 1077} {"train_loss": -11.264935493469238, "global_step": 180983, "epoch": 1077} {"train_loss": -11.152555465698242, "global_step": 180984, "epoch": 1077} {"train_loss": -11.116877555847168, "global_step": 180985, "epoch": 1077} {"train_loss": -11.116604804992676, "global_step": 180986, "epoch": 1077} {"train_loss": -11.21208667755127, "global_step": 180987, "epoch": 1077} {"train_loss": -11.405009269714355, "global_step": 180988, "epoch": 1077} {"train_loss": -11.47578239440918, "global_step": 180989, "epoch": 1077} {"train_loss": -11.420221328735352, "global_step": 180990, "epoch": 1077} {"train_loss": -11.35737133026123, "global_step": 180991, "epoch": 1077} {"train_loss": -11.398191452026367, "global_step": 180992, "epoch": 1077} {"train_loss": -11.211334228515625, "global_step": 180993, "epoch": 1077} {"train_loss": -11.149248123168945, "global_step": 180994, "epoch": 1077} {"train_loss": -11.191905975341797, "global_step": 180995, "epoch": 1077} {"train_loss": -11.413566589355469, "global_step": 180996, "epoch": 1077} {"train_loss": -11.396039962768555, "global_step": 180997, "epoch": 1077} {"train_loss": -11.541847229003906, "global_step": 180998, "epoch": 1077} {"train_loss": -11.258980751037598, "global_step": 180999, "epoch": 1077} {"train_loss": -11.50094985961914, "global_step": 181000, "epoch": 1077} {"train_loss": -10.947434425354004, "global_step": 181001, "epoch": 1077} {"train_loss": -11.369544982910156, "global_step": 181002, "epoch": 1077} {"train_loss": -10.919876098632812, "global_step": 181003, "epoch": 1077} {"train_loss": -10.886281967163086, "global_step": 181004, "epoch": 1077} {"train_loss": -10.571552276611328, "global_step": 181005, "epoch": 1077} {"train_loss": -11.25478458404541, "global_step": 181006, "epoch": 1077} {"train_loss": -9.364992141723633, "global_step": 181007, "epoch": 1077} {"train_loss": -11.33108139038086, "global_step": 181008, "epoch": 1077} {"train_loss": -9.88461685180664, "global_step": 181009, "epoch": 1077} {"train_loss": -9.461207389831543, "global_step": 181010, "epoch": 1077} {"train_loss": -10.591697692871094, "global_step": 181011, "epoch": 1077} {"train_loss": -8.915193557739258, "global_step": 181012, "epoch": 1077} {"train_loss": -10.935654640197754, "global_step": 181013, "epoch": 1077} {"train_loss": -10.050914764404297, "global_step": 181014, "epoch": 1077} {"train_loss": -10.637651443481445, "global_step": 181015, "epoch": 1077} {"train_loss": -10.771804809570312, "global_step": 181016, "epoch": 1077} {"train_loss": -10.038246154785156, "global_step": 181017, "epoch": 1077} {"train_loss": -11.235268592834473, "global_step": 181018, "epoch": 1077} {"train_loss": -10.284358024597168, "global_step": 181019, "epoch": 1077} {"train_loss": -11.063640594482422, "global_step": 181020, "epoch": 1077} {"train_loss": -10.39480972290039, "global_step": 181021, "epoch": 1077} {"train_loss": -10.969048500061035, "global_step": 181022, "epoch": 1077} {"train_loss": -10.692174911499023, "global_step": 181023, "epoch": 1077} {"train_loss": -10.87713623046875, "global_step": 181024, "epoch": 1077} {"train_loss": -10.87582015991211, "global_step": 181025, "epoch": 1077} {"train_loss": -11.166360855102539, "global_step": 181026, "epoch": 1077} {"train_loss": -10.713823318481445, "global_step": 181027, "epoch": 1077} {"train_loss": -10.917181015014648, "global_step": 181028, "epoch": 1077} {"train_loss": -10.98837661743164, "global_step": 181029, "epoch": 1077} {"train_loss": -10.85110855102539, "global_step": 181030, "epoch": 1077} {"train_loss": -10.833154678344727, "global_step": 181031, "epoch": 1077} {"train_loss": -10.87518310546875, "global_step": 181032, "epoch": 1077} {"train_loss": -11.021284103393555, "global_step": 181033, "epoch": 1077} {"train_loss": -10.903656005859375, "global_step": 181034, "epoch": 1077} {"train_loss": -11.085382461547852, "global_step": 181035, "epoch": 1077} {"train_loss": -11.060229301452637, "global_step": 181036, "epoch": 1077} {"train_loss": -11.070659637451172, "global_step": 181037, "epoch": 1077} {"train_loss": -11.172897338867188, "global_step": 181038, "epoch": 1077} {"train_loss": -10.980794906616211, "global_step": 181039, "epoch": 1077} {"train_loss": -11.264842987060547, "global_step": 181040, "epoch": 1077} {"train_loss": -11.014455795288086, "global_step": 181041, "epoch": 1077} {"train_loss": -11.367732048034668, "global_step": 181042, "epoch": 1077} {"train_loss": -11.078060150146484, "global_step": 181043, "epoch": 1077} {"train_loss": -11.133248329162598, "global_step": 181044, "epoch": 1077} {"train_loss": -11.119544982910156, "global_step": 181045, "epoch": 1077} {"train_loss": -11.15999984741211, "global_step": 181046, "epoch": 1077} {"train_loss": -11.302802085876465, "global_step": 181047, "epoch": 1077} {"train_loss": -11.207050323486328, "global_step": 181048, "epoch": 1077} {"train_loss": -11.30813217163086, "global_step": 181049, "epoch": 1077} {"train_loss": -11.245208740234375, "global_step": 181050, "epoch": 1077} {"train_loss": -11.34802532196045, "global_step": 181051, "epoch": 1077} {"train_loss": -11.321436882019043, "global_step": 181052, "epoch": 1077} {"train_loss": -11.395706176757812, "global_step": 181053, "epoch": 1077} {"train_loss": -11.373351097106934, "global_step": 181054, "epoch": 1077} {"train_loss": -11.552042007446289, "global_step": 181055, "epoch": 1077} {"train_loss": -11.227773666381836, "global_step": 181056, "epoch": 1077} {"train_loss": -11.414093017578125, "global_step": 181057, "epoch": 1077} {"train_loss": -11.27851676940918, "global_step": 181058, "epoch": 1077} {"train_loss": -11.26197624206543, "global_step": 181059, "epoch": 1077} {"train_loss": -11.376599311828613, "global_step": 181060, "epoch": 1077} {"train_loss": -11.139107704162598, "global_step": 181061, "epoch": 1077} {"train_loss": -11.439554214477539, "global_step": 181062, "epoch": 1077} {"train_loss": -11.313798904418945, "global_step": 181063, "epoch": 1077} {"train_loss": -11.650196075439453, "global_step": 181064, "epoch": 1077} {"train_loss": -11.445292472839355, "global_step": 181065, "epoch": 1077} {"train_loss": -11.462114334106445, "global_step": 181066, "epoch": 1077} {"train_loss": -10.928781509399414, "global_step": 181067, "epoch": 1077} {"train_loss": -11.32435417175293, "global_step": 181068, "epoch": 1077} {"train_loss": -11.154314041137695, "global_step": 181069, "epoch": 1077} {"train_loss": -11.144208908081055, "global_step": 181070, "epoch": 1077} {"train_loss": -10.986434936523438, "global_step": 181071, "epoch": 1077} {"train_loss": -11.445985794067383, "global_step": 181072, "epoch": 1077} {"train_loss": -11.369651794433594, "global_step": 181073, "epoch": 1077} {"train_loss": -10.986543655395508, "global_step": 181074, "epoch": 1077} {"train_loss": -10.41148567199707, "global_step": 181075, "epoch": 1077} {"train_loss": -11.005571365356445, "global_step": 181076, "epoch": 1077} {"train_loss": -9.860437393188477, "global_step": 181077, "epoch": 1077} {"train_loss": -10.357158660888672, "global_step": 181078, "epoch": 1077} {"train_loss": -10.751554489135742, "global_step": 181079, "epoch": 1077} {"train_loss": -10.158454895019531, "global_step": 181080, "epoch": 1077} {"train_loss": -10.57431697845459, "global_step": 181081, "epoch": 1077} {"train_loss": -10.252768516540527, "global_step": 181082, "epoch": 1077} {"train_loss": -10.804807662963867, "global_step": 181083, "epoch": 1077} {"train_loss": -10.337864875793457, "global_step": 181084, "epoch": 1077} {"train_loss": -10.396174430847168, "global_step": 181085, "epoch": 1077} {"train_loss": -8.84930419921875, "global_step": 181086, "epoch": 1077} {"train_loss": -10.758602142333984, "global_step": 181087, "epoch": 1077} {"train_loss": -9.594467163085938, "global_step": 181088, "epoch": 1077} {"train_loss": -10.408863067626953, "global_step": 181089, "epoch": 1077} {"train_loss": -9.732161521911621, "global_step": 181090, "epoch": 1077} {"train_loss": -9.830739974975586, "global_step": 181091, "epoch": 1077} {"train_loss": -10.641412734985352, "global_step": 181092, "epoch": 1077} {"train_loss": -10.321584701538086, "global_step": 181093, "epoch": 1077} {"train_loss": -10.626272201538086, "global_step": 181094, "epoch": 1077} {"train_loss": -10.16098403930664, "global_step": 181095, "epoch": 1077} {"train_loss": -10.890619277954102, "global_step": 181096, "epoch": 1077} {"train_loss": -10.399678230285645, "global_step": 181097, "epoch": 1077} {"train_loss": -10.632481575012207, "global_step": 181098, "epoch": 1077} {"train_loss": -10.579906463623047, "global_step": 181099, "epoch": 1077} {"train_loss": -10.480555534362793, "global_step": 181100, "epoch": 1077} {"train_loss": -10.905985832214355, "global_step": 181101, "epoch": 1077} {"train_loss": -10.889982223510742, "global_step": 181102, "epoch": 1077} {"train_loss": -10.97324375879197, "global_step": 181103, "epoch": 1077, "val_loss": 245001.6875} {"train_loss": -10.902904510498047, "global_step": 181104, "epoch": 1078} {"train_loss": -10.542045593261719, "global_step": 181105, "epoch": 1078} {"train_loss": -10.840269088745117, "global_step": 181106, "epoch": 1078} {"train_loss": -10.743820190429688, "global_step": 181107, "epoch": 1078} {"train_loss": -10.406262397766113, "global_step": 181108, "epoch": 1078} {"train_loss": -11.064201354980469, "global_step": 181109, "epoch": 1078} {"train_loss": -10.665691375732422, "global_step": 181110, "epoch": 1078} {"train_loss": -11.04920768737793, "global_step": 181111, "epoch": 1078} {"train_loss": -10.949606895446777, "global_step": 181112, "epoch": 1078} {"train_loss": -10.776772499084473, "global_step": 181113, "epoch": 1078} {"train_loss": -11.313992500305176, "global_step": 181114, "epoch": 1078} {"train_loss": -11.272208213806152, "global_step": 181115, "epoch": 1078} {"train_loss": -10.928301811218262, "global_step": 181116, "epoch": 1078} {"train_loss": -11.055791854858398, "global_step": 181117, "epoch": 1078} {"train_loss": -10.87436580657959, "global_step": 181118, "epoch": 1078} {"train_loss": -10.775853157043457, "global_step": 181119, "epoch": 1078} {"train_loss": -11.35174560546875, "global_step": 181120, "epoch": 1078} {"train_loss": -10.984296798706055, "global_step": 181121, "epoch": 1078} {"train_loss": -11.093452453613281, "global_step": 181122, "epoch": 1078} {"train_loss": -11.086808204650879, "global_step": 181123, "epoch": 1078} {"train_loss": -11.039848327636719, "global_step": 181124, "epoch": 1078} {"train_loss": -11.125306129455566, "global_step": 181125, "epoch": 1078} {"train_loss": -11.247188568115234, "global_step": 181126, "epoch": 1078} {"train_loss": -11.382621765136719, "global_step": 181127, "epoch": 1078} {"train_loss": -11.366236686706543, "global_step": 181128, "epoch": 1078} {"train_loss": -11.238008499145508, "global_step": 181129, "epoch": 1078} {"train_loss": -11.31838607788086, "global_step": 181130, "epoch": 1078} {"train_loss": -11.168829917907715, "global_step": 181131, "epoch": 1078} {"train_loss": -11.185100555419922, "global_step": 181132, "epoch": 1078} {"train_loss": -11.273006439208984, "global_step": 181133, "epoch": 1078} {"train_loss": -11.396929740905762, "global_step": 181134, "epoch": 1078} {"train_loss": -11.495720863342285, "global_step": 181135, "epoch": 1078} {"train_loss": -11.315115928649902, "global_step": 181136, "epoch": 1078} {"train_loss": -11.306560516357422, "global_step": 181137, "epoch": 1078} {"train_loss": -11.47407341003418, "global_step": 181138, "epoch": 1078} {"train_loss": -11.27925968170166, "global_step": 181139, "epoch": 1078} {"train_loss": -11.462947845458984, "global_step": 181140, "epoch": 1078} {"train_loss": -11.338619232177734, "global_step": 181141, "epoch": 1078} {"train_loss": -11.526695251464844, "global_step": 181142, "epoch": 1078} {"train_loss": -11.33414077758789, "global_step": 181143, "epoch": 1078} {"train_loss": -11.488880157470703, "global_step": 181144, "epoch": 1078} {"train_loss": -11.441346168518066, "global_step": 181145, "epoch": 1078} {"train_loss": -11.648763656616211, "global_step": 181146, "epoch": 1078} {"train_loss": -11.409431457519531, "global_step": 181147, "epoch": 1078} {"train_loss": -11.560233116149902, "global_step": 181148, "epoch": 1078} {"train_loss": -11.437721252441406, "global_step": 181149, "epoch": 1078} {"train_loss": -11.306434631347656, "global_step": 181150, "epoch": 1078} {"train_loss": -11.417319297790527, "global_step": 181151, "epoch": 1078} {"train_loss": -11.399200439453125, "global_step": 181152, "epoch": 1078} {"train_loss": -11.484506607055664, "global_step": 181153, "epoch": 1078} {"train_loss": -10.921382904052734, "global_step": 181154, "epoch": 1078} {"train_loss": -11.1729736328125, "global_step": 181155, "epoch": 1078} {"train_loss": -11.290288925170898, "global_step": 181156, "epoch": 1078} {"train_loss": -10.436614990234375, "global_step": 181157, "epoch": 1078} {"train_loss": -11.016899108886719, "global_step": 181158, "epoch": 1078} {"train_loss": -11.544477462768555, "global_step": 181159, "epoch": 1078} {"train_loss": -10.725175857543945, "global_step": 181160, "epoch": 1078} {"train_loss": -10.80367660522461, "global_step": 181161, "epoch": 1078} {"train_loss": -11.17166519165039, "global_step": 181162, "epoch": 1078} {"train_loss": -10.56151008605957, "global_step": 181163, "epoch": 1078} {"train_loss": -10.788732528686523, "global_step": 181164, "epoch": 1078} {"train_loss": -10.859783172607422, "global_step": 181165, "epoch": 1078} {"train_loss": -10.471031188964844, "global_step": 181166, "epoch": 1078} {"train_loss": -10.814107894897461, "global_step": 181167, "epoch": 1078} {"train_loss": -10.793914794921875, "global_step": 181168, "epoch": 1078} {"train_loss": -10.205175399780273, "global_step": 181169, "epoch": 1078} {"train_loss": -11.074578285217285, "global_step": 181170, "epoch": 1078} {"train_loss": -9.96038818359375, "global_step": 181171, "epoch": 1078} {"train_loss": -11.233997344970703, "global_step": 181172, "epoch": 1078} {"train_loss": -10.377513885498047, "global_step": 181173, "epoch": 1078} {"train_loss": -10.975448608398438, "global_step": 181174, "epoch": 1078} {"train_loss": -10.700369834899902, "global_step": 181175, "epoch": 1078} {"train_loss": -9.996767044067383, "global_step": 181176, "epoch": 1078} {"train_loss": -11.034404754638672, "global_step": 181177, "epoch": 1078} {"train_loss": -10.432994842529297, "global_step": 181178, "epoch": 1078} {"train_loss": -11.066171646118164, "global_step": 181179, "epoch": 1078} {"train_loss": -10.84632682800293, "global_step": 181180, "epoch": 1078} {"train_loss": -11.123140335083008, "global_step": 181181, "epoch": 1078} {"train_loss": -10.854475021362305, "global_step": 181182, "epoch": 1078} {"train_loss": -10.920602798461914, "global_step": 181183, "epoch": 1078} {"train_loss": -11.132339477539062, "global_step": 181184, "epoch": 1078} {"train_loss": -11.119763374328613, "global_step": 181185, "epoch": 1078} {"train_loss": -10.602190017700195, "global_step": 181186, "epoch": 1078} {"train_loss": -10.71829605102539, "global_step": 181187, "epoch": 1078} {"train_loss": -10.093547821044922, "global_step": 181188, "epoch": 1078} {"train_loss": -11.250019073486328, "global_step": 181189, "epoch": 1078} {"train_loss": -10.021629333496094, "global_step": 181190, "epoch": 1078} {"train_loss": -10.804571151733398, "global_step": 181191, "epoch": 1078} {"train_loss": -10.645572662353516, "global_step": 181192, "epoch": 1078} {"train_loss": -10.557973861694336, "global_step": 181193, "epoch": 1078} {"train_loss": -10.928884506225586, "global_step": 181194, "epoch": 1078} {"train_loss": -10.401171684265137, "global_step": 181195, "epoch": 1078} {"train_loss": -10.701677322387695, "global_step": 181196, "epoch": 1078} {"train_loss": -10.70063591003418, "global_step": 181197, "epoch": 1078} {"train_loss": -10.148235321044922, "global_step": 181198, "epoch": 1078} {"train_loss": -11.122137069702148, "global_step": 181199, "epoch": 1078} {"train_loss": -9.835203170776367, "global_step": 181200, "epoch": 1078} {"train_loss": -10.986124992370605, "global_step": 181201, "epoch": 1078} {"train_loss": -10.39006519317627, "global_step": 181202, "epoch": 1078} {"train_loss": -11.10767936706543, "global_step": 181203, "epoch": 1078} {"train_loss": -10.711663246154785, "global_step": 181204, "epoch": 1078} {"train_loss": -11.082645416259766, "global_step": 181205, "epoch": 1078} {"train_loss": -10.920504570007324, "global_step": 181206, "epoch": 1078} {"train_loss": -11.03962516784668, "global_step": 181207, "epoch": 1078} {"train_loss": -9.731948852539062, "global_step": 181208, "epoch": 1078} {"train_loss": -11.21731948852539, "global_step": 181209, "epoch": 1078} {"train_loss": -10.122457504272461, "global_step": 181210, "epoch": 1078} {"train_loss": -11.151678085327148, "global_step": 181211, "epoch": 1078} {"train_loss": -10.574024200439453, "global_step": 181212, "epoch": 1078} {"train_loss": -10.752396583557129, "global_step": 181213, "epoch": 1078} {"train_loss": -10.699662208557129, "global_step": 181214, "epoch": 1078} {"train_loss": -11.013914108276367, "global_step": 181215, "epoch": 1078} {"train_loss": -10.507829666137695, "global_step": 181216, "epoch": 1078} {"train_loss": -11.172100067138672, "global_step": 181217, "epoch": 1078} {"train_loss": -10.746253967285156, "global_step": 181218, "epoch": 1078} {"train_loss": -10.92756175994873, "global_step": 181219, "epoch": 1078} {"train_loss": -10.77092170715332, "global_step": 181220, "epoch": 1078} {"train_loss": -11.131509780883789, "global_step": 181221, "epoch": 1078} {"train_loss": -10.809697151184082, "global_step": 181222, "epoch": 1078} {"train_loss": -11.080045700073242, "global_step": 181223, "epoch": 1078} {"train_loss": -10.923696517944336, "global_step": 181224, "epoch": 1078} {"train_loss": -11.219295501708984, "global_step": 181225, "epoch": 1078} {"train_loss": -11.212813377380371, "global_step": 181226, "epoch": 1078} {"train_loss": -11.049163818359375, "global_step": 181227, "epoch": 1078} {"train_loss": -11.12954044342041, "global_step": 181228, "epoch": 1078} {"train_loss": -11.18175983428955, "global_step": 181229, "epoch": 1078} {"train_loss": -11.162235260009766, "global_step": 181230, "epoch": 1078} {"train_loss": -11.279382705688477, "global_step": 181231, "epoch": 1078} {"train_loss": -11.309475898742676, "global_step": 181232, "epoch": 1078} {"train_loss": -11.154777526855469, "global_step": 181233, "epoch": 1078} {"train_loss": -11.152090072631836, "global_step": 181234, "epoch": 1078} {"train_loss": -11.460701942443848, "global_step": 181235, "epoch": 1078} {"train_loss": -11.274568557739258, "global_step": 181236, "epoch": 1078} {"train_loss": -11.441089630126953, "global_step": 181237, "epoch": 1078} {"train_loss": -11.366485595703125, "global_step": 181238, "epoch": 1078} {"train_loss": -11.18244743347168, "global_step": 181239, "epoch": 1078} {"train_loss": -11.35421371459961, "global_step": 181240, "epoch": 1078} {"train_loss": -11.259672164916992, "global_step": 181241, "epoch": 1078} {"train_loss": -11.476053237915039, "global_step": 181242, "epoch": 1078} {"train_loss": -11.193297386169434, "global_step": 181243, "epoch": 1078} {"train_loss": -11.341487884521484, "global_step": 181244, "epoch": 1078} {"train_loss": -11.287080764770508, "global_step": 181245, "epoch": 1078} {"train_loss": -11.360393524169922, "global_step": 181246, "epoch": 1078} {"train_loss": -11.645637512207031, "global_step": 181247, "epoch": 1078} {"train_loss": -11.139751434326172, "global_step": 181248, "epoch": 1078} {"train_loss": -11.398605346679688, "global_step": 181249, "epoch": 1078} {"train_loss": -11.356954574584961, "global_step": 181250, "epoch": 1078} {"train_loss": -11.402156829833984, "global_step": 181251, "epoch": 1078} {"train_loss": -11.345952987670898, "global_step": 181252, "epoch": 1078} {"train_loss": -11.687122344970703, "global_step": 181253, "epoch": 1078} {"train_loss": -11.054950714111328, "global_step": 181254, "epoch": 1078} {"train_loss": -11.674093246459961, "global_step": 181255, "epoch": 1078} {"train_loss": -11.093294143676758, "global_step": 181256, "epoch": 1078} {"train_loss": -11.12668228149414, "global_step": 181257, "epoch": 1078} {"train_loss": -11.34003734588623, "global_step": 181258, "epoch": 1078} {"train_loss": -11.105183601379395, "global_step": 181259, "epoch": 1078} {"train_loss": -11.258021354675293, "global_step": 181260, "epoch": 1078} {"train_loss": -11.457523345947266, "global_step": 181261, "epoch": 1078} {"train_loss": -10.483393669128418, "global_step": 181262, "epoch": 1078} {"train_loss": -11.54785442352295, "global_step": 181263, "epoch": 1078} {"train_loss": -10.941825866699219, "global_step": 181264, "epoch": 1078} {"train_loss": -10.576299667358398, "global_step": 181265, "epoch": 1078} {"train_loss": -11.47085189819336, "global_step": 181266, "epoch": 1078} {"train_loss": -11.175636291503906, "global_step": 181267, "epoch": 1078} {"train_loss": -10.994880676269531, "global_step": 181268, "epoch": 1078} {"train_loss": -11.344280242919922, "global_step": 181269, "epoch": 1078} {"train_loss": -11.158863067626953, "global_step": 181270, "epoch": 1078} {"train_loss": -11.028639492534456, "global_step": 181271, "epoch": 1078, "val_loss": 245349.140625} {"train_loss": -11.516547203063965, "global_step": 181272, "epoch": 1079} {"train_loss": -11.247722625732422, "global_step": 181273, "epoch": 1079} {"train_loss": -10.78181266784668, "global_step": 181274, "epoch": 1079} {"train_loss": -11.193246841430664, "global_step": 181275, "epoch": 1079} {"train_loss": -10.893468856811523, "global_step": 181276, "epoch": 1079} {"train_loss": -11.11643123626709, "global_step": 181277, "epoch": 1079} {"train_loss": -11.055068969726562, "global_step": 181278, "epoch": 1079} {"train_loss": -11.040979385375977, "global_step": 181279, "epoch": 1079} {"train_loss": -11.17325210571289, "global_step": 181280, "epoch": 1079} {"train_loss": -11.153900146484375, "global_step": 181281, "epoch": 1079} {"train_loss": -10.669075012207031, "global_step": 181282, "epoch": 1079} {"train_loss": -11.140291213989258, "global_step": 181283, "epoch": 1079} {"train_loss": -10.897441864013672, "global_step": 181284, "epoch": 1079} {"train_loss": -10.86069107055664, "global_step": 181285, "epoch": 1079} {"train_loss": -11.099821090698242, "global_step": 181286, "epoch": 1079} {"train_loss": -10.175907135009766, "global_step": 181287, "epoch": 1079} {"train_loss": -10.378841400146484, "global_step": 181288, "epoch": 1079} {"train_loss": -10.766716003417969, "global_step": 181289, "epoch": 1079} {"train_loss": -10.582908630371094, "global_step": 181290, "epoch": 1079} {"train_loss": -11.15542221069336, "global_step": 181291, "epoch": 1079} {"train_loss": -10.424020767211914, "global_step": 181292, "epoch": 1079} {"train_loss": -11.122947692871094, "global_step": 181293, "epoch": 1079} {"train_loss": -10.67996883392334, "global_step": 181294, "epoch": 1079} {"train_loss": -10.314136505126953, "global_step": 181295, "epoch": 1079} {"train_loss": -10.92921257019043, "global_step": 181296, "epoch": 1079} {"train_loss": -10.594018936157227, "global_step": 181297, "epoch": 1079} {"train_loss": -11.161152839660645, "global_step": 181298, "epoch": 1079} {"train_loss": -10.531384468078613, "global_step": 181299, "epoch": 1079} {"train_loss": -11.11423110961914, "global_step": 181300, "epoch": 1079} {"train_loss": -10.739392280578613, "global_step": 181301, "epoch": 1079} {"train_loss": -10.72750186920166, "global_step": 181302, "epoch": 1079} {"train_loss": -10.832589149475098, "global_step": 181303, "epoch": 1079} {"train_loss": -10.884088516235352, "global_step": 181304, "epoch": 1079} {"train_loss": -10.916654586791992, "global_step": 181305, "epoch": 1079} {"train_loss": -10.933396339416504, "global_step": 181306, "epoch": 1079} {"train_loss": -10.475275039672852, "global_step": 181307, "epoch": 1079} {"train_loss": -11.032023429870605, "global_step": 181308, "epoch": 1079} {"train_loss": -10.673484802246094, "global_step": 181309, "epoch": 1079} {"train_loss": -11.15652084350586, "global_step": 181310, "epoch": 1079} {"train_loss": -10.635641098022461, "global_step": 181311, "epoch": 1079} {"train_loss": -10.987194061279297, "global_step": 181312, "epoch": 1079} {"train_loss": -11.028650283813477, "global_step": 181313, "epoch": 1079} {"train_loss": -10.666107177734375, "global_step": 181314, "epoch": 1079} {"train_loss": -11.18149185180664, "global_step": 181315, "epoch": 1079} {"train_loss": -10.655475616455078, "global_step": 181316, "epoch": 1079} {"train_loss": -10.291977882385254, "global_step": 181317, "epoch": 1079} {"train_loss": -10.951805114746094, "global_step": 181318, "epoch": 1079} {"train_loss": -9.945823669433594, "global_step": 181319, "epoch": 1079} {"train_loss": -10.651570320129395, "global_step": 181320, "epoch": 1079} {"train_loss": -10.935545921325684, "global_step": 181321, "epoch": 1079} {"train_loss": -10.503971099853516, "global_step": 181322, "epoch": 1079} {"train_loss": -11.394693374633789, "global_step": 181323, "epoch": 1079} {"train_loss": -10.535116195678711, "global_step": 181324, "epoch": 1079} {"train_loss": -11.149179458618164, "global_step": 181325, "epoch": 1079} {"train_loss": -11.041236877441406, "global_step": 181326, "epoch": 1079} {"train_loss": -10.722801208496094, "global_step": 181327, "epoch": 1079} {"train_loss": -10.865219116210938, "global_step": 181328, "epoch": 1079} {"train_loss": -10.934205055236816, "global_step": 181329, "epoch": 1079} {"train_loss": -11.066807746887207, "global_step": 181330, "epoch": 1079} {"train_loss": -10.904613494873047, "global_step": 181331, "epoch": 1079} {"train_loss": -11.21263313293457, "global_step": 181332, "epoch": 1079} {"train_loss": -10.911027908325195, "global_step": 181333, "epoch": 1079} {"train_loss": -11.22955322265625, "global_step": 181334, "epoch": 1079} {"train_loss": -10.916550636291504, "global_step": 181335, "epoch": 1079} {"train_loss": -10.678720474243164, "global_step": 181336, "epoch": 1079} {"train_loss": -10.89103889465332, "global_step": 181337, "epoch": 1079} {"train_loss": -10.969228744506836, "global_step": 181338, "epoch": 1079} {"train_loss": -11.2598876953125, "global_step": 181339, "epoch": 1079} {"train_loss": -11.227182388305664, "global_step": 181340, "epoch": 1079} {"train_loss": -11.254467964172363, "global_step": 181341, "epoch": 1079} {"train_loss": -11.074490547180176, "global_step": 181342, "epoch": 1079} {"train_loss": -11.564355850219727, "global_step": 181343, "epoch": 1079} {"train_loss": -11.08547592163086, "global_step": 181344, "epoch": 1079} {"train_loss": -11.407611846923828, "global_step": 181345, "epoch": 1079} {"train_loss": -11.15112590789795, "global_step": 181346, "epoch": 1079} {"train_loss": -11.333208084106445, "global_step": 181347, "epoch": 1079} {"train_loss": -11.417539596557617, "global_step": 181348, "epoch": 1079} {"train_loss": -11.139200210571289, "global_step": 181349, "epoch": 1079} {"train_loss": -11.03219985961914, "global_step": 181350, "epoch": 1079} {"train_loss": -11.367240905761719, "global_step": 181351, "epoch": 1079} {"train_loss": -11.257367134094238, "global_step": 181352, "epoch": 1079} {"train_loss": -11.227852821350098, "global_step": 181353, "epoch": 1079} {"train_loss": -11.274820327758789, "global_step": 181354, "epoch": 1079} {"train_loss": -11.192768096923828, "global_step": 181355, "epoch": 1079} {"train_loss": -11.467131614685059, "global_step": 181356, "epoch": 1079} {"train_loss": -11.358466148376465, "global_step": 181357, "epoch": 1079} {"train_loss": -11.532533645629883, "global_step": 181358, "epoch": 1079} {"train_loss": -11.249446868896484, "global_step": 181359, "epoch": 1079} {"train_loss": -11.412428855895996, "global_step": 181360, "epoch": 1079} {"train_loss": -11.107841491699219, "global_step": 181361, "epoch": 1079} {"train_loss": -11.028691291809082, "global_step": 181362, "epoch": 1079} {"train_loss": -11.019190788269043, "global_step": 181363, "epoch": 1079} {"train_loss": -10.77447509765625, "global_step": 181364, "epoch": 1079} {"train_loss": -11.129831314086914, "global_step": 181365, "epoch": 1079} {"train_loss": -11.079816818237305, "global_step": 181366, "epoch": 1079} {"train_loss": -11.042811393737793, "global_step": 181367, "epoch": 1079} {"train_loss": -10.679125785827637, "global_step": 181368, "epoch": 1079} {"train_loss": -11.372446060180664, "global_step": 181369, "epoch": 1079} {"train_loss": -10.355949401855469, "global_step": 181370, "epoch": 1079} {"train_loss": -10.778970718383789, "global_step": 181371, "epoch": 1079} {"train_loss": -11.421144485473633, "global_step": 181372, "epoch": 1079} {"train_loss": -11.278980255126953, "global_step": 181373, "epoch": 1079} {"train_loss": -11.362083435058594, "global_step": 181374, "epoch": 1079} {"train_loss": -11.499333381652832, "global_step": 181375, "epoch": 1079} {"train_loss": -11.203681945800781, "global_step": 181376, "epoch": 1079} {"train_loss": -11.025237083435059, "global_step": 181377, "epoch": 1079} {"train_loss": -11.388293266296387, "global_step": 181378, "epoch": 1079} {"train_loss": -10.957442283630371, "global_step": 181379, "epoch": 1079} {"train_loss": -10.758641242980957, "global_step": 181380, "epoch": 1079} {"train_loss": -11.457783699035645, "global_step": 181381, "epoch": 1079} {"train_loss": -10.812437057495117, "global_step": 181382, "epoch": 1079} {"train_loss": -11.223245620727539, "global_step": 181383, "epoch": 1079} {"train_loss": -11.236459732055664, "global_step": 181384, "epoch": 1079} {"train_loss": -11.22708511352539, "global_step": 181385, "epoch": 1079} {"train_loss": -11.13464641571045, "global_step": 181386, "epoch": 1079} {"train_loss": -10.626518249511719, "global_step": 181387, "epoch": 1079} {"train_loss": -11.2389554977417, "global_step": 181388, "epoch": 1079} {"train_loss": -10.749730110168457, "global_step": 181389, "epoch": 1079} {"train_loss": -10.969688415527344, "global_step": 181390, "epoch": 1079} {"train_loss": -10.922737121582031, "global_step": 181391, "epoch": 1079} {"train_loss": -10.935158729553223, "global_step": 181392, "epoch": 1079} {"train_loss": -11.194853782653809, "global_step": 181393, "epoch": 1079} {"train_loss": -11.080076217651367, "global_step": 181394, "epoch": 1079} {"train_loss": -10.363334655761719, "global_step": 181395, "epoch": 1079} {"train_loss": -11.330631256103516, "global_step": 181396, "epoch": 1079} {"train_loss": -10.483983993530273, "global_step": 181397, "epoch": 1079} {"train_loss": -10.692248344421387, "global_step": 181398, "epoch": 1079} {"train_loss": -11.38691520690918, "global_step": 181399, "epoch": 1079} {"train_loss": -10.780023574829102, "global_step": 181400, "epoch": 1079} {"train_loss": -10.715500831604004, "global_step": 181401, "epoch": 1079} {"train_loss": -11.362686157226562, "global_step": 181402, "epoch": 1079} {"train_loss": -10.899084091186523, "global_step": 181403, "epoch": 1079} {"train_loss": -10.981815338134766, "global_step": 181404, "epoch": 1079} {"train_loss": -11.361275672912598, "global_step": 181405, "epoch": 1079} {"train_loss": -10.432865142822266, "global_step": 181406, "epoch": 1079} {"train_loss": -11.320329666137695, "global_step": 181407, "epoch": 1079} {"train_loss": -10.263984680175781, "global_step": 181408, "epoch": 1079} {"train_loss": -11.039285659790039, "global_step": 181409, "epoch": 1079} {"train_loss": -10.541011810302734, "global_step": 181410, "epoch": 1079} {"train_loss": -11.071688652038574, "global_step": 181411, "epoch": 1079} {"train_loss": -10.814708709716797, "global_step": 181412, "epoch": 1079} {"train_loss": -10.967673301696777, "global_step": 181413, "epoch": 1079} {"train_loss": -10.924385070800781, "global_step": 181414, "epoch": 1079} {"train_loss": -10.717447280883789, "global_step": 181415, "epoch": 1079} {"train_loss": -10.971745491027832, "global_step": 181416, "epoch": 1079} {"train_loss": -10.83474349975586, "global_step": 181417, "epoch": 1079} {"train_loss": -11.049566268920898, "global_step": 181418, "epoch": 1079} {"train_loss": -11.062005043029785, "global_step": 181419, "epoch": 1079} {"train_loss": -11.196032524108887, "global_step": 181420, "epoch": 1079} {"train_loss": -11.09838581085205, "global_step": 181421, "epoch": 1079} {"train_loss": -11.428348541259766, "global_step": 181422, "epoch": 1079} {"train_loss": -11.263463020324707, "global_step": 181423, "epoch": 1079} {"train_loss": -11.174514770507812, "global_step": 181424, "epoch": 1079} {"train_loss": -11.256380081176758, "global_step": 181425, "epoch": 1079} {"train_loss": -11.093690872192383, "global_step": 181426, "epoch": 1079} {"train_loss": -11.2781343460083, "global_step": 181427, "epoch": 1079} {"train_loss": -11.385414123535156, "global_step": 181428, "epoch": 1079} {"train_loss": -11.160722732543945, "global_step": 181429, "epoch": 1079} {"train_loss": -11.379185676574707, "global_step": 181430, "epoch": 1079} {"train_loss": -11.203230857849121, "global_step": 181431, "epoch": 1079} {"train_loss": -11.347528457641602, "global_step": 181432, "epoch": 1079} {"train_loss": -11.497635841369629, "global_step": 181433, "epoch": 1079} {"train_loss": -11.26005744934082, "global_step": 181434, "epoch": 1079} {"train_loss": -11.636191368103027, "global_step": 181435, "epoch": 1079} {"train_loss": -11.118947982788086, "global_step": 181436, "epoch": 1079} {"train_loss": -11.18067741394043, "global_step": 181437, "epoch": 1079} {"train_loss": -11.345627784729004, "global_step": 181438, "epoch": 1079} {"train_loss": -11.014071612131028, "global_step": 181439, "epoch": 1079, "val_loss": 245323.921875} {"train_loss": -11.215733528137207, "global_step": 181440, "epoch": 1080} {"train_loss": -11.286815643310547, "global_step": 181441, "epoch": 1080} {"train_loss": -11.189691543579102, "global_step": 181442, "epoch": 1080} {"train_loss": -10.999987602233887, "global_step": 181443, "epoch": 1080} {"train_loss": -11.084661483764648, "global_step": 181444, "epoch": 1080} {"train_loss": -11.355229377746582, "global_step": 181445, "epoch": 1080} {"train_loss": -10.754613876342773, "global_step": 181446, "epoch": 1080} {"train_loss": -11.323275566101074, "global_step": 181447, "epoch": 1080} {"train_loss": -11.225818634033203, "global_step": 181448, "epoch": 1080} {"train_loss": -11.228677749633789, "global_step": 181449, "epoch": 1080} {"train_loss": -11.484800338745117, "global_step": 181450, "epoch": 1080} {"train_loss": -11.045921325683594, "global_step": 181451, "epoch": 1080} {"train_loss": -11.307905197143555, "global_step": 181452, "epoch": 1080} {"train_loss": -11.34596061706543, "global_step": 181453, "epoch": 1080} {"train_loss": -11.496792793273926, "global_step": 181454, "epoch": 1080} {"train_loss": -11.360978126525879, "global_step": 181455, "epoch": 1080} {"train_loss": -11.326661109924316, "global_step": 181456, "epoch": 1080} {"train_loss": -11.671080589294434, "global_step": 181457, "epoch": 1080} {"train_loss": -11.477189064025879, "global_step": 181458, "epoch": 1080} {"train_loss": -11.413106918334961, "global_step": 181459, "epoch": 1080} {"train_loss": -11.377935409545898, "global_step": 181460, "epoch": 1080} {"train_loss": -11.512191772460938, "global_step": 181461, "epoch": 1080} {"train_loss": -11.291919708251953, "global_step": 181462, "epoch": 1080} {"train_loss": -11.521415710449219, "global_step": 181463, "epoch": 1080} {"train_loss": -11.320850372314453, "global_step": 181464, "epoch": 1080} {"train_loss": -11.466827392578125, "global_step": 181465, "epoch": 1080} {"train_loss": -11.563636779785156, "global_step": 181466, "epoch": 1080} {"train_loss": -11.29698371887207, "global_step": 181467, "epoch": 1080} {"train_loss": -11.479814529418945, "global_step": 181468, "epoch": 1080} {"train_loss": -11.276965141296387, "global_step": 181469, "epoch": 1080} {"train_loss": -11.361114501953125, "global_step": 181470, "epoch": 1080} {"train_loss": -11.276782035827637, "global_step": 181471, "epoch": 1080} {"train_loss": -11.43820571899414, "global_step": 181472, "epoch": 1080} {"train_loss": -11.205995559692383, "global_step": 181473, "epoch": 1080} {"train_loss": -11.245742797851562, "global_step": 181474, "epoch": 1080} {"train_loss": -11.4713134765625, "global_step": 181475, "epoch": 1080} {"train_loss": -11.155086517333984, "global_step": 181476, "epoch": 1080} {"train_loss": -11.257493019104004, "global_step": 181477, "epoch": 1080} {"train_loss": -11.613489151000977, "global_step": 181478, "epoch": 1080} {"train_loss": -10.92093276977539, "global_step": 181479, "epoch": 1080} {"train_loss": -11.16510009765625, "global_step": 181480, "epoch": 1080} {"train_loss": -11.324003219604492, "global_step": 181481, "epoch": 1080} {"train_loss": -11.174759864807129, "global_step": 181482, "epoch": 1080} {"train_loss": -11.234088897705078, "global_step": 181483, "epoch": 1080} {"train_loss": -10.401494026184082, "global_step": 181484, "epoch": 1080} {"train_loss": -11.28329086303711, "global_step": 181485, "epoch": 1080} {"train_loss": -11.099468231201172, "global_step": 181486, "epoch": 1080} {"train_loss": -10.805719375610352, "global_step": 181487, "epoch": 1080} {"train_loss": -10.290956497192383, "global_step": 181488, "epoch": 1080} {"train_loss": -10.257477760314941, "global_step": 181489, "epoch": 1080} {"train_loss": -11.139123916625977, "global_step": 181490, "epoch": 1080} {"train_loss": -10.401911735534668, "global_step": 181491, "epoch": 1080} {"train_loss": -10.611209869384766, "global_step": 181492, "epoch": 1080} {"train_loss": -10.289604187011719, "global_step": 181493, "epoch": 1080} {"train_loss": -10.942359924316406, "global_step": 181494, "epoch": 1080} {"train_loss": -10.064927101135254, "global_step": 181495, "epoch": 1080} {"train_loss": -11.053383827209473, "global_step": 181496, "epoch": 1080} {"train_loss": -10.786079406738281, "global_step": 181497, "epoch": 1080} {"train_loss": -11.160867691040039, "global_step": 181498, "epoch": 1080} {"train_loss": -10.70016098022461, "global_step": 181499, "epoch": 1080} {"train_loss": -11.052886962890625, "global_step": 181500, "epoch": 1080} {"train_loss": -10.929885864257812, "global_step": 181501, "epoch": 1080} {"train_loss": -10.968250274658203, "global_step": 181502, "epoch": 1080} {"train_loss": -10.964893341064453, "global_step": 181503, "epoch": 1080} {"train_loss": -10.798823356628418, "global_step": 181504, "epoch": 1080} {"train_loss": -11.220199584960938, "global_step": 181505, "epoch": 1080} {"train_loss": -10.69351577758789, "global_step": 181506, "epoch": 1080} {"train_loss": -11.024152755737305, "global_step": 181507, "epoch": 1080} {"train_loss": -10.726764678955078, "global_step": 181508, "epoch": 1080} {"train_loss": -10.796613693237305, "global_step": 181509, "epoch": 1080} {"train_loss": -10.501873016357422, "global_step": 181510, "epoch": 1080} {"train_loss": -10.83627986907959, "global_step": 181511, "epoch": 1080} {"train_loss": -10.909799575805664, "global_step": 181512, "epoch": 1080} {"train_loss": -10.697124481201172, "global_step": 181513, "epoch": 1080} {"train_loss": -10.68928337097168, "global_step": 181514, "epoch": 1080} {"train_loss": -10.813653945922852, "global_step": 181515, "epoch": 1080} {"train_loss": -10.710025787353516, "global_step": 181516, "epoch": 1080} {"train_loss": -11.079802513122559, "global_step": 181517, "epoch": 1080} {"train_loss": -11.040031433105469, "global_step": 181518, "epoch": 1080} {"train_loss": -11.043977737426758, "global_step": 181519, "epoch": 1080} {"train_loss": -11.186595916748047, "global_step": 181520, "epoch": 1080} {"train_loss": -11.21754264831543, "global_step": 181521, "epoch": 1080} {"train_loss": -11.082281112670898, "global_step": 181522, "epoch": 1080} {"train_loss": -11.301115989685059, "global_step": 181523, "epoch": 1080} {"train_loss": -11.044219970703125, "global_step": 181524, "epoch": 1080} {"train_loss": -11.289688110351562, "global_step": 181525, "epoch": 1080} {"train_loss": -10.93166732788086, "global_step": 181526, "epoch": 1080} {"train_loss": -11.18038558959961, "global_step": 181527, "epoch": 1080} {"train_loss": -10.956409454345703, "global_step": 181528, "epoch": 1080} {"train_loss": -11.20395278930664, "global_step": 181529, "epoch": 1080} {"train_loss": -10.93467903137207, "global_step": 181530, "epoch": 1080} {"train_loss": -11.062830924987793, "global_step": 181531, "epoch": 1080} {"train_loss": -11.156058311462402, "global_step": 181532, "epoch": 1080} {"train_loss": -10.888080596923828, "global_step": 181533, "epoch": 1080} {"train_loss": -11.06601619720459, "global_step": 181534, "epoch": 1080} {"train_loss": -11.256929397583008, "global_step": 181535, "epoch": 1080} {"train_loss": -10.85599422454834, "global_step": 181536, "epoch": 1080} {"train_loss": -10.815471649169922, "global_step": 181537, "epoch": 1080} {"train_loss": -11.10347843170166, "global_step": 181538, "epoch": 1080} {"train_loss": -10.721494674682617, "global_step": 181539, "epoch": 1080} {"train_loss": -11.407588958740234, "global_step": 181540, "epoch": 1080} {"train_loss": -10.649578094482422, "global_step": 181541, "epoch": 1080} {"train_loss": -10.861198425292969, "global_step": 181542, "epoch": 1080} {"train_loss": -11.116342544555664, "global_step": 181543, "epoch": 1080} {"train_loss": -11.322752952575684, "global_step": 181544, "epoch": 1080} {"train_loss": -11.204856872558594, "global_step": 181545, "epoch": 1080} {"train_loss": -11.24212646484375, "global_step": 181546, "epoch": 1080} {"train_loss": -11.119976997375488, "global_step": 181547, "epoch": 1080} {"train_loss": -11.469154357910156, "global_step": 181548, "epoch": 1080} {"train_loss": -11.21119213104248, "global_step": 181549, "epoch": 1080} {"train_loss": -11.402214050292969, "global_step": 181550, "epoch": 1080} {"train_loss": -11.200157165527344, "global_step": 181551, "epoch": 1080} {"train_loss": -11.173432350158691, "global_step": 181552, "epoch": 1080} {"train_loss": -11.32209587097168, "global_step": 181553, "epoch": 1080} {"train_loss": -11.344976425170898, "global_step": 181554, "epoch": 1080} {"train_loss": -11.312704086303711, "global_step": 181555, "epoch": 1080} {"train_loss": -11.300399780273438, "global_step": 181556, "epoch": 1080} {"train_loss": -11.528769493103027, "global_step": 181557, "epoch": 1080} {"train_loss": -11.343046188354492, "global_step": 181558, "epoch": 1080} {"train_loss": -11.222379684448242, "global_step": 181559, "epoch": 1080} {"train_loss": -11.435920715332031, "global_step": 181560, "epoch": 1080} {"train_loss": -11.169686317443848, "global_step": 181561, "epoch": 1080} {"train_loss": -11.696846008300781, "global_step": 181562, "epoch": 1080} {"train_loss": -11.22928237915039, "global_step": 181563, "epoch": 1080} {"train_loss": -11.218229293823242, "global_step": 181564, "epoch": 1080} {"train_loss": -11.360589981079102, "global_step": 181565, "epoch": 1080} {"train_loss": -11.106498718261719, "global_step": 181566, "epoch": 1080} {"train_loss": -11.365795135498047, "global_step": 181567, "epoch": 1080} {"train_loss": -11.055887222290039, "global_step": 181568, "epoch": 1080} {"train_loss": -11.045445442199707, "global_step": 181569, "epoch": 1080} {"train_loss": -11.495487213134766, "global_step": 181570, "epoch": 1080} {"train_loss": -11.142444610595703, "global_step": 181571, "epoch": 1080} {"train_loss": -11.253631591796875, "global_step": 181572, "epoch": 1080} {"train_loss": -11.311872482299805, "global_step": 181573, "epoch": 1080} {"train_loss": -11.606155395507812, "global_step": 181574, "epoch": 1080} {"train_loss": -11.216453552246094, "global_step": 181575, "epoch": 1080} {"train_loss": -11.63121509552002, "global_step": 181576, "epoch": 1080} {"train_loss": -11.271737098693848, "global_step": 181577, "epoch": 1080} {"train_loss": -11.491724014282227, "global_step": 181578, "epoch": 1080} {"train_loss": -11.009773254394531, "global_step": 181579, "epoch": 1080} {"train_loss": -11.417755126953125, "global_step": 181580, "epoch": 1080} {"train_loss": -10.475385665893555, "global_step": 181581, "epoch": 1080} {"train_loss": -11.14361572265625, "global_step": 181582, "epoch": 1080} {"train_loss": -10.737406730651855, "global_step": 181583, "epoch": 1080} {"train_loss": -10.32441520690918, "global_step": 181584, "epoch": 1080} {"train_loss": -11.320594787597656, "global_step": 181585, "epoch": 1080} {"train_loss": -9.971717834472656, "global_step": 181586, "epoch": 1080} {"train_loss": -11.243165016174316, "global_step": 181587, "epoch": 1080} {"train_loss": -10.756609916687012, "global_step": 181588, "epoch": 1080} {"train_loss": -11.343247413635254, "global_step": 181589, "epoch": 1080} {"train_loss": -11.241061210632324, "global_step": 181590, "epoch": 1080} {"train_loss": -11.3709716796875, "global_step": 181591, "epoch": 1080} {"train_loss": -11.190624237060547, "global_step": 181592, "epoch": 1080} {"train_loss": -10.715033531188965, "global_step": 181593, "epoch": 1080} {"train_loss": -11.312931060791016, "global_step": 181594, "epoch": 1080} {"train_loss": -10.597765922546387, "global_step": 181595, "epoch": 1080} {"train_loss": -10.784769058227539, "global_step": 181596, "epoch": 1080} {"train_loss": -10.857890129089355, "global_step": 181597, "epoch": 1080} {"train_loss": -10.708267211914062, "global_step": 181598, "epoch": 1080} {"train_loss": -10.719714164733887, "global_step": 181599, "epoch": 1080} {"train_loss": -10.744478225708008, "global_step": 181600, "epoch": 1080} {"train_loss": -10.51978874206543, "global_step": 181601, "epoch": 1080} {"train_loss": -11.264263153076172, "global_step": 181602, "epoch": 1080} {"train_loss": -9.756280899047852, "global_step": 181603, "epoch": 1080} {"train_loss": -10.930663108825684, "global_step": 181604, "epoch": 1080} {"train_loss": -10.391068458557129, "global_step": 181605, "epoch": 1080} {"train_loss": -10.792596817016602, "global_step": 181606, "epoch": 1080} {"train_loss": -11.083729051408314, "global_step": 181607, "epoch": 1080, "val_loss": 247139.96875, "train_action_mse_error": 1.336652159690857} {"train_loss": -10.259564399719238, "global_step": 181608, "epoch": 1081} {"train_loss": -11.024372100830078, "global_step": 181609, "epoch": 1081} {"train_loss": -10.386518478393555, "global_step": 181610, "epoch": 1081} {"train_loss": -10.862242698669434, "global_step": 181611, "epoch": 1081} {"train_loss": -10.81534194946289, "global_step": 181612, "epoch": 1081} {"train_loss": -10.505340576171875, "global_step": 181613, "epoch": 1081} {"train_loss": -10.90286636352539, "global_step": 181614, "epoch": 1081} {"train_loss": -10.574874877929688, "global_step": 181615, "epoch": 1081} {"train_loss": -10.975069046020508, "global_step": 181616, "epoch": 1081} {"train_loss": -10.780694007873535, "global_step": 181617, "epoch": 1081} {"train_loss": -10.667631149291992, "global_step": 181618, "epoch": 1081} {"train_loss": -11.211702346801758, "global_step": 181619, "epoch": 1081} {"train_loss": -10.766176223754883, "global_step": 181620, "epoch": 1081} {"train_loss": -10.943010330200195, "global_step": 181621, "epoch": 1081} {"train_loss": -11.175519943237305, "global_step": 181622, "epoch": 1081} {"train_loss": -10.858951568603516, "global_step": 181623, "epoch": 1081} {"train_loss": -11.086929321289062, "global_step": 181624, "epoch": 1081} {"train_loss": -11.09195327758789, "global_step": 181625, "epoch": 1081} {"train_loss": -11.095951080322266, "global_step": 181626, "epoch": 1081} {"train_loss": -11.040321350097656, "global_step": 181627, "epoch": 1081} {"train_loss": -10.958871841430664, "global_step": 181628, "epoch": 1081} {"train_loss": -11.190849304199219, "global_step": 181629, "epoch": 1081} {"train_loss": -11.005210876464844, "global_step": 181630, "epoch": 1081} {"train_loss": -11.039098739624023, "global_step": 181631, "epoch": 1081} {"train_loss": -11.131218910217285, "global_step": 181632, "epoch": 1081} {"train_loss": -11.207393646240234, "global_step": 181633, "epoch": 1081} {"train_loss": -10.98952865600586, "global_step": 181634, "epoch": 1081} {"train_loss": -10.904058456420898, "global_step": 181635, "epoch": 1081} {"train_loss": -11.009084701538086, "global_step": 181636, "epoch": 1081} {"train_loss": -10.53610610961914, "global_step": 181637, "epoch": 1081} {"train_loss": -10.962198257446289, "global_step": 181638, "epoch": 1081} {"train_loss": -10.882183074951172, "global_step": 181639, "epoch": 1081} {"train_loss": -11.013921737670898, "global_step": 181640, "epoch": 1081} {"train_loss": -11.265979766845703, "global_step": 181641, "epoch": 1081} {"train_loss": -10.91932487487793, "global_step": 181642, "epoch": 1081} {"train_loss": -11.21859359741211, "global_step": 181643, "epoch": 1081} {"train_loss": -10.816864013671875, "global_step": 181644, "epoch": 1081} {"train_loss": -11.255535125732422, "global_step": 181645, "epoch": 1081} {"train_loss": -10.895318984985352, "global_step": 181646, "epoch": 1081} {"train_loss": -11.13807487487793, "global_step": 181647, "epoch": 1081} {"train_loss": -11.485149383544922, "global_step": 181648, "epoch": 1081} {"train_loss": -11.201815605163574, "global_step": 181649, "epoch": 1081} {"train_loss": -11.165094375610352, "global_step": 181650, "epoch": 1081} {"train_loss": -11.365660667419434, "global_step": 181651, "epoch": 1081} {"train_loss": -11.080348014831543, "global_step": 181652, "epoch": 1081} {"train_loss": -11.223541259765625, "global_step": 181653, "epoch": 1081} {"train_loss": -11.35611629486084, "global_step": 181654, "epoch": 1081} {"train_loss": -11.215374946594238, "global_step": 181655, "epoch": 1081} {"train_loss": -11.28183364868164, "global_step": 181656, "epoch": 1081} {"train_loss": -11.4259672164917, "global_step": 181657, "epoch": 1081} {"train_loss": -11.281383514404297, "global_step": 181658, "epoch": 1081} {"train_loss": -11.242908477783203, "global_step": 181659, "epoch": 1081} {"train_loss": -11.17750358581543, "global_step": 181660, "epoch": 1081} {"train_loss": -11.348605155944824, "global_step": 181661, "epoch": 1081} {"train_loss": -11.414819717407227, "global_step": 181662, "epoch": 1081} {"train_loss": -11.350804328918457, "global_step": 181663, "epoch": 1081} {"train_loss": -11.527059555053711, "global_step": 181664, "epoch": 1081} {"train_loss": -11.2713041305542, "global_step": 181665, "epoch": 1081} {"train_loss": -11.437211990356445, "global_step": 181666, "epoch": 1081} {"train_loss": -11.069424629211426, "global_step": 181667, "epoch": 1081} {"train_loss": -11.28354263305664, "global_step": 181668, "epoch": 1081} {"train_loss": -11.401281356811523, "global_step": 181669, "epoch": 1081} {"train_loss": -11.419694900512695, "global_step": 181670, "epoch": 1081} {"train_loss": -11.332088470458984, "global_step": 181671, "epoch": 1081} {"train_loss": -11.266202926635742, "global_step": 181672, "epoch": 1081} {"train_loss": -11.21420669555664, "global_step": 181673, "epoch": 1081} {"train_loss": -11.334896087646484, "global_step": 181674, "epoch": 1081} {"train_loss": -11.437196731567383, "global_step": 181675, "epoch": 1081} {"train_loss": -11.256356239318848, "global_step": 181676, "epoch": 1081} {"train_loss": -11.225608825683594, "global_step": 181677, "epoch": 1081} {"train_loss": -11.382179260253906, "global_step": 181678, "epoch": 1081} {"train_loss": -11.380911827087402, "global_step": 181679, "epoch": 1081} {"train_loss": -11.000923156738281, "global_step": 181680, "epoch": 1081} {"train_loss": -11.395071029663086, "global_step": 181681, "epoch": 1081} {"train_loss": -11.026443481445312, "global_step": 181682, "epoch": 1081} {"train_loss": -11.339483261108398, "global_step": 181683, "epoch": 1081} {"train_loss": -11.174134254455566, "global_step": 181684, "epoch": 1081} {"train_loss": -11.488527297973633, "global_step": 181685, "epoch": 1081} {"train_loss": -11.267915725708008, "global_step": 181686, "epoch": 1081} {"train_loss": -11.593194961547852, "global_step": 181687, "epoch": 1081} {"train_loss": -11.26485824584961, "global_step": 181688, "epoch": 1081} {"train_loss": -11.4979829788208, "global_step": 181689, "epoch": 1081} {"train_loss": -10.779230117797852, "global_step": 181690, "epoch": 1081} {"train_loss": -10.386747360229492, "global_step": 181691, "epoch": 1081} {"train_loss": -11.531780242919922, "global_step": 181692, "epoch": 1081} {"train_loss": -11.247970581054688, "global_step": 181693, "epoch": 1081} {"train_loss": -11.03569221496582, "global_step": 181694, "epoch": 1081} {"train_loss": -11.481748580932617, "global_step": 181695, "epoch": 1081} {"train_loss": -11.356674194335938, "global_step": 181696, "epoch": 1081} {"train_loss": -11.501590728759766, "global_step": 181697, "epoch": 1081} {"train_loss": -11.299530982971191, "global_step": 181698, "epoch": 1081} {"train_loss": -10.528400421142578, "global_step": 181699, "epoch": 1081} {"train_loss": -10.82155990600586, "global_step": 181700, "epoch": 1081} {"train_loss": -11.219964981079102, "global_step": 181701, "epoch": 1081} {"train_loss": -11.13753890991211, "global_step": 181702, "epoch": 1081} {"train_loss": -11.134626388549805, "global_step": 181703, "epoch": 1081} {"train_loss": -10.830655097961426, "global_step": 181704, "epoch": 1081} {"train_loss": -11.497516632080078, "global_step": 181705, "epoch": 1081} {"train_loss": -10.830767631530762, "global_step": 181706, "epoch": 1081} {"train_loss": -11.349479675292969, "global_step": 181707, "epoch": 1081} {"train_loss": -10.88005256652832, "global_step": 181708, "epoch": 1081} {"train_loss": -11.078339576721191, "global_step": 181709, "epoch": 1081} {"train_loss": -10.82931137084961, "global_step": 181710, "epoch": 1081} {"train_loss": -11.221736907958984, "global_step": 181711, "epoch": 1081} {"train_loss": -10.951627731323242, "global_step": 181712, "epoch": 1081} {"train_loss": -11.049259185791016, "global_step": 181713, "epoch": 1081} {"train_loss": -10.981446266174316, "global_step": 181714, "epoch": 1081} {"train_loss": -10.931663513183594, "global_step": 181715, "epoch": 1081} {"train_loss": -11.093632698059082, "global_step": 181716, "epoch": 1081} {"train_loss": -11.434398651123047, "global_step": 181717, "epoch": 1081} {"train_loss": -10.752155303955078, "global_step": 181718, "epoch": 1081} {"train_loss": -10.696593284606934, "global_step": 181719, "epoch": 1081} {"train_loss": -11.086339950561523, "global_step": 181720, "epoch": 1081} {"train_loss": -10.345027923583984, "global_step": 181721, "epoch": 1081} {"train_loss": -11.168651580810547, "global_step": 181722, "epoch": 1081} {"train_loss": -10.877359390258789, "global_step": 181723, "epoch": 1081} {"train_loss": -10.796077728271484, "global_step": 181724, "epoch": 1081} {"train_loss": -11.1796875, "global_step": 181725, "epoch": 1081} {"train_loss": -10.872642517089844, "global_step": 181726, "epoch": 1081} {"train_loss": -11.438356399536133, "global_step": 181727, "epoch": 1081} {"train_loss": -10.853116989135742, "global_step": 181728, "epoch": 1081} {"train_loss": -11.525753021240234, "global_step": 181729, "epoch": 1081} {"train_loss": -11.267642974853516, "global_step": 181730, "epoch": 1081} {"train_loss": -11.21759033203125, "global_step": 181731, "epoch": 1081} {"train_loss": -11.008514404296875, "global_step": 181732, "epoch": 1081} {"train_loss": -11.49052906036377, "global_step": 181733, "epoch": 1081} {"train_loss": -11.367557525634766, "global_step": 181734, "epoch": 1081} {"train_loss": -11.363751411437988, "global_step": 181735, "epoch": 1081} {"train_loss": -11.371980667114258, "global_step": 181736, "epoch": 1081} {"train_loss": -11.325479507446289, "global_step": 181737, "epoch": 1081} {"train_loss": -11.236970901489258, "global_step": 181738, "epoch": 1081} {"train_loss": -11.229052543640137, "global_step": 181739, "epoch": 1081} {"train_loss": -11.414857864379883, "global_step": 181740, "epoch": 1081} {"train_loss": -11.457681655883789, "global_step": 181741, "epoch": 1081} {"train_loss": -11.212265014648438, "global_step": 181742, "epoch": 1081} {"train_loss": -11.287178993225098, "global_step": 181743, "epoch": 1081} {"train_loss": -11.396642684936523, "global_step": 181744, "epoch": 1081} {"train_loss": -11.255353927612305, "global_step": 181745, "epoch": 1081} {"train_loss": -11.28478717803955, "global_step": 181746, "epoch": 1081} {"train_loss": -11.397818565368652, "global_step": 181747, "epoch": 1081} {"train_loss": -11.358878135681152, "global_step": 181748, "epoch": 1081} {"train_loss": -11.126581192016602, "global_step": 181749, "epoch": 1081} {"train_loss": -11.31106948852539, "global_step": 181750, "epoch": 1081} {"train_loss": -11.307100296020508, "global_step": 181751, "epoch": 1081} {"train_loss": -11.167469024658203, "global_step": 181752, "epoch": 1081} {"train_loss": -11.203563690185547, "global_step": 181753, "epoch": 1081} {"train_loss": -11.355655670166016, "global_step": 181754, "epoch": 1081} {"train_loss": -11.641403198242188, "global_step": 181755, "epoch": 1081} {"train_loss": -11.192279815673828, "global_step": 181756, "epoch": 1081} {"train_loss": -11.214396476745605, "global_step": 181757, "epoch": 1081} {"train_loss": -11.505130767822266, "global_step": 181758, "epoch": 1081} {"train_loss": -11.31706428527832, "global_step": 181759, "epoch": 1081} {"train_loss": -11.286018371582031, "global_step": 181760, "epoch": 1081} {"train_loss": -11.240057945251465, "global_step": 181761, "epoch": 1081} {"train_loss": -11.346508026123047, "global_step": 181762, "epoch": 1081} {"train_loss": -11.399087905883789, "global_step": 181763, "epoch": 1081} {"train_loss": -11.541460990905762, "global_step": 181764, "epoch": 1081} {"train_loss": -11.29570198059082, "global_step": 181765, "epoch": 1081} {"train_loss": -11.377340316772461, "global_step": 181766, "epoch": 1081} {"train_loss": -11.4586763381958, "global_step": 181767, "epoch": 1081} {"train_loss": -10.645025253295898, "global_step": 181768, "epoch": 1081} {"train_loss": -10.164541244506836, "global_step": 181769, "epoch": 1081} {"train_loss": -11.039576530456543, "global_step": 181770, "epoch": 1081} {"train_loss": -10.910884857177734, "global_step": 181771, "epoch": 1081} {"train_loss": -9.095684051513672, "global_step": 181772, "epoch": 1081} {"train_loss": -10.763496398925781, "global_step": 181773, "epoch": 1081} {"train_loss": -9.873502731323242, "global_step": 181774, "epoch": 1081} {"train_loss": -11.120597828002204, "global_step": 181775, "epoch": 1081, "val_loss": 245106.328125} {"train_loss": -10.427140235900879, "global_step": 181776, "epoch": 1082} {"train_loss": -10.823840141296387, "global_step": 181777, "epoch": 1082} {"train_loss": -10.92263126373291, "global_step": 181778, "epoch": 1082} {"train_loss": -10.404451370239258, "global_step": 181779, "epoch": 1082} {"train_loss": -10.987382888793945, "global_step": 181780, "epoch": 1082} {"train_loss": -10.476591110229492, "global_step": 181781, "epoch": 1082} {"train_loss": -10.946935653686523, "global_step": 181782, "epoch": 1082} {"train_loss": -11.093344688415527, "global_step": 181783, "epoch": 1082} {"train_loss": -10.937870025634766, "global_step": 181784, "epoch": 1082} {"train_loss": -11.158397674560547, "global_step": 181785, "epoch": 1082} {"train_loss": -11.127197265625, "global_step": 181786, "epoch": 1082} {"train_loss": -10.992086410522461, "global_step": 181787, "epoch": 1082} {"train_loss": -11.457656860351562, "global_step": 181788, "epoch": 1082} {"train_loss": -11.067343711853027, "global_step": 181789, "epoch": 1082} {"train_loss": -11.389606475830078, "global_step": 181790, "epoch": 1082} {"train_loss": -11.079079627990723, "global_step": 181791, "epoch": 1082} {"train_loss": -11.32719612121582, "global_step": 181792, "epoch": 1082} {"train_loss": -11.073221206665039, "global_step": 181793, "epoch": 1082} {"train_loss": -11.196415901184082, "global_step": 181794, "epoch": 1082} {"train_loss": -11.419988632202148, "global_step": 181795, "epoch": 1082} {"train_loss": -11.027599334716797, "global_step": 181796, "epoch": 1082} {"train_loss": -11.036092758178711, "global_step": 181797, "epoch": 1082} {"train_loss": -11.014418601989746, "global_step": 181798, "epoch": 1082} {"train_loss": -11.306912422180176, "global_step": 181799, "epoch": 1082} {"train_loss": -10.90165901184082, "global_step": 181800, "epoch": 1082} {"train_loss": -10.766692161560059, "global_step": 181801, "epoch": 1082} {"train_loss": -11.001727104187012, "global_step": 181802, "epoch": 1082} {"train_loss": -11.23399829864502, "global_step": 181803, "epoch": 1082} {"train_loss": -11.166269302368164, "global_step": 181804, "epoch": 1082} {"train_loss": -11.233221054077148, "global_step": 181805, "epoch": 1082} {"train_loss": -11.37161922454834, "global_step": 181806, "epoch": 1082} {"train_loss": -11.286965370178223, "global_step": 181807, "epoch": 1082} {"train_loss": -11.422394752502441, "global_step": 181808, "epoch": 1082} {"train_loss": -11.380729675292969, "global_step": 181809, "epoch": 1082} {"train_loss": -11.077682495117188, "global_step": 181810, "epoch": 1082} {"train_loss": -11.493322372436523, "global_step": 181811, "epoch": 1082} {"train_loss": -10.993114471435547, "global_step": 181812, "epoch": 1082} {"train_loss": -11.167074203491211, "global_step": 181813, "epoch": 1082} {"train_loss": -11.174306869506836, "global_step": 181814, "epoch": 1082} {"train_loss": -11.080883026123047, "global_step": 181815, "epoch": 1082} {"train_loss": -11.113103866577148, "global_step": 181816, "epoch": 1082} {"train_loss": -11.329782485961914, "global_step": 181817, "epoch": 1082} {"train_loss": -11.124757766723633, "global_step": 181818, "epoch": 1082} {"train_loss": -11.43966007232666, "global_step": 181819, "epoch": 1082} {"train_loss": -11.038314819335938, "global_step": 181820, "epoch": 1082} {"train_loss": -11.421684265136719, "global_step": 181821, "epoch": 1082} {"train_loss": -11.384624481201172, "global_step": 181822, "epoch": 1082} {"train_loss": -11.048839569091797, "global_step": 181823, "epoch": 1082} {"train_loss": -11.364184379577637, "global_step": 181824, "epoch": 1082} {"train_loss": -11.36661148071289, "global_step": 181825, "epoch": 1082} {"train_loss": -11.063364028930664, "global_step": 181826, "epoch": 1082} {"train_loss": -11.384407997131348, "global_step": 181827, "epoch": 1082} {"train_loss": -10.691349983215332, "global_step": 181828, "epoch": 1082} {"train_loss": -11.268324851989746, "global_step": 181829, "epoch": 1082} {"train_loss": -11.063362121582031, "global_step": 181830, "epoch": 1082} {"train_loss": -11.110882759094238, "global_step": 181831, "epoch": 1082} {"train_loss": -11.145669937133789, "global_step": 181832, "epoch": 1082} {"train_loss": -11.33270263671875, "global_step": 181833, "epoch": 1082} {"train_loss": -11.189080238342285, "global_step": 181834, "epoch": 1082} {"train_loss": -10.884435653686523, "global_step": 181835, "epoch": 1082} {"train_loss": -11.362391471862793, "global_step": 181836, "epoch": 1082} {"train_loss": -10.79241943359375, "global_step": 181837, "epoch": 1082} {"train_loss": -11.046213150024414, "global_step": 181838, "epoch": 1082} {"train_loss": -11.226153373718262, "global_step": 181839, "epoch": 1082} {"train_loss": -11.192502975463867, "global_step": 181840, "epoch": 1082} {"train_loss": -10.717169761657715, "global_step": 181841, "epoch": 1082} {"train_loss": -11.25275707244873, "global_step": 181842, "epoch": 1082} {"train_loss": -11.138118743896484, "global_step": 181843, "epoch": 1082} {"train_loss": -11.094501495361328, "global_step": 181844, "epoch": 1082} {"train_loss": -10.999034881591797, "global_step": 181845, "epoch": 1082} {"train_loss": -10.475582122802734, "global_step": 181846, "epoch": 1082} {"train_loss": -11.503085136413574, "global_step": 181847, "epoch": 1082} {"train_loss": -9.867996215820312, "global_step": 181848, "epoch": 1082} {"train_loss": -10.594586372375488, "global_step": 181849, "epoch": 1082} {"train_loss": -10.750795364379883, "global_step": 181850, "epoch": 1082} {"train_loss": -10.169530868530273, "global_step": 181851, "epoch": 1082} {"train_loss": -10.114367485046387, "global_step": 181852, "epoch": 1082} {"train_loss": -10.493040084838867, "global_step": 181853, "epoch": 1082} {"train_loss": -9.532575607299805, "global_step": 181854, "epoch": 1082} {"train_loss": -9.52690315246582, "global_step": 181855, "epoch": 1082} {"train_loss": -11.05843734741211, "global_step": 181856, "epoch": 1082} {"train_loss": -9.442659378051758, "global_step": 181857, "epoch": 1082} {"train_loss": -10.047243118286133, "global_step": 181858, "epoch": 1082} {"train_loss": -10.77679443359375, "global_step": 181859, "epoch": 1082} {"train_loss": -10.237090110778809, "global_step": 181860, "epoch": 1082} {"train_loss": -10.449156761169434, "global_step": 181861, "epoch": 1082} {"train_loss": -10.126696586608887, "global_step": 181862, "epoch": 1082} {"train_loss": -10.281448364257812, "global_step": 181863, "epoch": 1082} {"train_loss": -11.094419479370117, "global_step": 181864, "epoch": 1082} {"train_loss": -10.45833969116211, "global_step": 181865, "epoch": 1082} {"train_loss": -10.814922332763672, "global_step": 181866, "epoch": 1082} {"train_loss": -10.638734817504883, "global_step": 181867, "epoch": 1082} {"train_loss": -9.772270202636719, "global_step": 181868, "epoch": 1082} {"train_loss": -10.608190536499023, "global_step": 181869, "epoch": 1082} {"train_loss": -10.070484161376953, "global_step": 181870, "epoch": 1082} {"train_loss": -10.69500732421875, "global_step": 181871, "epoch": 1082} {"train_loss": -10.69968318939209, "global_step": 181872, "epoch": 1082} {"train_loss": -10.568046569824219, "global_step": 181873, "epoch": 1082} {"train_loss": -11.011823654174805, "global_step": 181874, "epoch": 1082} {"train_loss": -11.004823684692383, "global_step": 181875, "epoch": 1082} {"train_loss": -11.107439041137695, "global_step": 181876, "epoch": 1082} {"train_loss": -10.917303085327148, "global_step": 181877, "epoch": 1082} {"train_loss": -10.903396606445312, "global_step": 181878, "epoch": 1082} {"train_loss": -11.1070556640625, "global_step": 181879, "epoch": 1082} {"train_loss": -11.141937255859375, "global_step": 181880, "epoch": 1082} {"train_loss": -11.156266212463379, "global_step": 181881, "epoch": 1082} {"train_loss": -11.251405715942383, "global_step": 181882, "epoch": 1082} {"train_loss": -11.345808982849121, "global_step": 181883, "epoch": 1082} {"train_loss": -11.210848808288574, "global_step": 181884, "epoch": 1082} {"train_loss": -11.339296340942383, "global_step": 181885, "epoch": 1082} {"train_loss": -11.29556655883789, "global_step": 181886, "epoch": 1082} {"train_loss": -11.353559494018555, "global_step": 181887, "epoch": 1082} {"train_loss": -11.117874145507812, "global_step": 181888, "epoch": 1082} {"train_loss": -11.375686645507812, "global_step": 181889, "epoch": 1082} {"train_loss": -11.160240173339844, "global_step": 181890, "epoch": 1082} {"train_loss": -11.263336181640625, "global_step": 181891, "epoch": 1082} {"train_loss": -11.075571060180664, "global_step": 181892, "epoch": 1082} {"train_loss": -11.421085357666016, "global_step": 181893, "epoch": 1082} {"train_loss": -11.166925430297852, "global_step": 181894, "epoch": 1082} {"train_loss": -11.148666381835938, "global_step": 181895, "epoch": 1082} {"train_loss": -11.285943984985352, "global_step": 181896, "epoch": 1082} {"train_loss": -11.396645545959473, "global_step": 181897, "epoch": 1082} {"train_loss": -11.478851318359375, "global_step": 181898, "epoch": 1082} {"train_loss": -11.374147415161133, "global_step": 181899, "epoch": 1082} {"train_loss": -11.333555221557617, "global_step": 181900, "epoch": 1082} {"train_loss": -11.288679122924805, "global_step": 181901, "epoch": 1082} {"train_loss": -11.492652893066406, "global_step": 181902, "epoch": 1082} {"train_loss": -11.274267196655273, "global_step": 181903, "epoch": 1082} {"train_loss": -11.439350128173828, "global_step": 181904, "epoch": 1082} {"train_loss": -11.396408081054688, "global_step": 181905, "epoch": 1082} {"train_loss": -11.493972778320312, "global_step": 181906, "epoch": 1082} {"train_loss": -11.236916542053223, "global_step": 181907, "epoch": 1082} {"train_loss": -11.441638946533203, "global_step": 181908, "epoch": 1082} {"train_loss": -11.425600051879883, "global_step": 181909, "epoch": 1082} {"train_loss": -11.085466384887695, "global_step": 181910, "epoch": 1082} {"train_loss": -11.572792053222656, "global_step": 181911, "epoch": 1082} {"train_loss": -11.234743118286133, "global_step": 181912, "epoch": 1082} {"train_loss": -11.420654296875, "global_step": 181913, "epoch": 1082} {"train_loss": -11.365802764892578, "global_step": 181914, "epoch": 1082} {"train_loss": -11.381900787353516, "global_step": 181915, "epoch": 1082} {"train_loss": -11.331764221191406, "global_step": 181916, "epoch": 1082} {"train_loss": -11.575651168823242, "global_step": 181917, "epoch": 1082} {"train_loss": -11.370882034301758, "global_step": 181918, "epoch": 1082} {"train_loss": -11.59923267364502, "global_step": 181919, "epoch": 1082} {"train_loss": -11.44420337677002, "global_step": 181920, "epoch": 1082} {"train_loss": -11.534746170043945, "global_step": 181921, "epoch": 1082} {"train_loss": -11.517974853515625, "global_step": 181922, "epoch": 1082} {"train_loss": -11.423700332641602, "global_step": 181923, "epoch": 1082} {"train_loss": -11.331125259399414, "global_step": 181924, "epoch": 1082} {"train_loss": -11.291501998901367, "global_step": 181925, "epoch": 1082} {"train_loss": -11.294706344604492, "global_step": 181926, "epoch": 1082} {"train_loss": -11.31358528137207, "global_step": 181927, "epoch": 1082} {"train_loss": -11.245473861694336, "global_step": 181928, "epoch": 1082} {"train_loss": -10.62386703491211, "global_step": 181929, "epoch": 1082} {"train_loss": -11.226232528686523, "global_step": 181930, "epoch": 1082} {"train_loss": -10.800946235656738, "global_step": 181931, "epoch": 1082} {"train_loss": -11.27364730834961, "global_step": 181932, "epoch": 1082} {"train_loss": -9.953630447387695, "global_step": 181933, "epoch": 1082} {"train_loss": -11.484736442565918, "global_step": 181934, "epoch": 1082} {"train_loss": -10.60069465637207, "global_step": 181935, "epoch": 1082} {"train_loss": -10.462562561035156, "global_step": 181936, "epoch": 1082} {"train_loss": -10.759881973266602, "global_step": 181937, "epoch": 1082} {"train_loss": -11.05538558959961, "global_step": 181938, "epoch": 1082} {"train_loss": -10.498111724853516, "global_step": 181939, "epoch": 1082} {"train_loss": -11.32249641418457, "global_step": 181940, "epoch": 1082} {"train_loss": -10.707233428955078, "global_step": 181941, "epoch": 1082} {"train_loss": -10.402629852294922, "global_step": 181942, "epoch": 1082} {"train_loss": -11.028603741100856, "global_step": 181943, "epoch": 1082, "val_loss": 245972.96875} {"train_loss": -10.256837844848633, "global_step": 181944, "epoch": 1083} {"train_loss": -8.554824829101562, "global_step": 181945, "epoch": 1083} {"train_loss": -8.604728698730469, "global_step": 181946, "epoch": 1083} {"train_loss": -7.828084945678711, "global_step": 181947, "epoch": 1083} {"train_loss": -9.780855178833008, "global_step": 181948, "epoch": 1083} {"train_loss": -10.213663101196289, "global_step": 181949, "epoch": 1083} {"train_loss": -9.036575317382812, "global_step": 181950, "epoch": 1083} {"train_loss": -10.08626937866211, "global_step": 181951, "epoch": 1083} {"train_loss": -10.409869194030762, "global_step": 181952, "epoch": 1083} {"train_loss": -9.517513275146484, "global_step": 181953, "epoch": 1083} {"train_loss": -10.153936386108398, "global_step": 181954, "epoch": 1083} {"train_loss": -10.464576721191406, "global_step": 181955, "epoch": 1083} {"train_loss": -9.788249015808105, "global_step": 181956, "epoch": 1083} {"train_loss": -10.100482940673828, "global_step": 181957, "epoch": 1083} {"train_loss": -10.410724639892578, "global_step": 181958, "epoch": 1083} {"train_loss": -10.084562301635742, "global_step": 181959, "epoch": 1083} {"train_loss": -9.555473327636719, "global_step": 181960, "epoch": 1083} {"train_loss": -10.614896774291992, "global_step": 181961, "epoch": 1083} {"train_loss": -10.578306198120117, "global_step": 181962, "epoch": 1083} {"train_loss": -10.39832878112793, "global_step": 181963, "epoch": 1083} {"train_loss": -10.860648155212402, "global_step": 181964, "epoch": 1083} {"train_loss": -10.470284461975098, "global_step": 181965, "epoch": 1083} {"train_loss": -10.503520965576172, "global_step": 181966, "epoch": 1083} {"train_loss": -10.908533096313477, "global_step": 181967, "epoch": 1083} {"train_loss": -10.627963066101074, "global_step": 181968, "epoch": 1083} {"train_loss": -10.532958030700684, "global_step": 181969, "epoch": 1083} {"train_loss": -10.792051315307617, "global_step": 181970, "epoch": 1083} {"train_loss": -10.65931510925293, "global_step": 181971, "epoch": 1083} {"train_loss": -10.773151397705078, "global_step": 181972, "epoch": 1083} {"train_loss": -10.814973831176758, "global_step": 181973, "epoch": 1083} {"train_loss": -10.709329605102539, "global_step": 181974, "epoch": 1083} {"train_loss": -10.712870597839355, "global_step": 181975, "epoch": 1083} {"train_loss": -10.848821640014648, "global_step": 181976, "epoch": 1083} {"train_loss": -10.32022476196289, "global_step": 181977, "epoch": 1083} {"train_loss": -10.89551067352295, "global_step": 181978, "epoch": 1083} {"train_loss": -10.65579605102539, "global_step": 181979, "epoch": 1083} {"train_loss": -10.656333923339844, "global_step": 181980, "epoch": 1083} {"train_loss": -10.891206741333008, "global_step": 181981, "epoch": 1083} {"train_loss": -10.811416625976562, "global_step": 181982, "epoch": 1083} {"train_loss": -10.76845645904541, "global_step": 181983, "epoch": 1083} {"train_loss": -10.840316772460938, "global_step": 181984, "epoch": 1083} {"train_loss": -11.125526428222656, "global_step": 181985, "epoch": 1083} {"train_loss": -10.808563232421875, "global_step": 181986, "epoch": 1083} {"train_loss": -10.78679084777832, "global_step": 181987, "epoch": 1083} {"train_loss": -11.03972053527832, "global_step": 181988, "epoch": 1083} {"train_loss": -10.923897743225098, "global_step": 181989, "epoch": 1083} {"train_loss": -11.140498161315918, "global_step": 181990, "epoch": 1083} {"train_loss": -11.136079788208008, "global_step": 181991, "epoch": 1083} {"train_loss": -11.163553237915039, "global_step": 181992, "epoch": 1083} {"train_loss": -11.09201431274414, "global_step": 181993, "epoch": 1083} {"train_loss": -11.154922485351562, "global_step": 181994, "epoch": 1083} {"train_loss": -11.11793327331543, "global_step": 181995, "epoch": 1083} {"train_loss": -11.121394157409668, "global_step": 181996, "epoch": 1083} {"train_loss": -11.365764617919922, "global_step": 181997, "epoch": 1083} {"train_loss": -11.088621139526367, "global_step": 181998, "epoch": 1083} {"train_loss": -11.288777351379395, "global_step": 181999, "epoch": 1083} {"train_loss": -11.361358642578125, "global_step": 182000, "epoch": 1083} {"train_loss": -11.164657592773438, "global_step": 182001, "epoch": 1083} {"train_loss": -11.224679946899414, "global_step": 182002, "epoch": 1083} {"train_loss": -11.160615921020508, "global_step": 182003, "epoch": 1083} {"train_loss": -11.268791198730469, "global_step": 182004, "epoch": 1083} {"train_loss": -11.344633102416992, "global_step": 182005, "epoch": 1083} {"train_loss": -11.329264640808105, "global_step": 182006, "epoch": 1083} {"train_loss": -11.445399284362793, "global_step": 182007, "epoch": 1083} {"train_loss": -11.499139785766602, "global_step": 182008, "epoch": 1083} {"train_loss": -11.305471420288086, "global_step": 182009, "epoch": 1083} {"train_loss": -11.418197631835938, "global_step": 182010, "epoch": 1083} {"train_loss": -11.318580627441406, "global_step": 182011, "epoch": 1083} {"train_loss": -11.403087615966797, "global_step": 182012, "epoch": 1083} {"train_loss": -11.39793586730957, "global_step": 182013, "epoch": 1083} {"train_loss": -11.409965515136719, "global_step": 182014, "epoch": 1083} {"train_loss": -11.110982894897461, "global_step": 182015, "epoch": 1083} {"train_loss": -11.418876647949219, "global_step": 182016, "epoch": 1083} {"train_loss": -11.337419509887695, "global_step": 182017, "epoch": 1083} {"train_loss": -10.754354476928711, "global_step": 182018, "epoch": 1083} {"train_loss": -11.107189178466797, "global_step": 182019, "epoch": 1083} {"train_loss": -11.089754104614258, "global_step": 182020, "epoch": 1083} {"train_loss": -10.85074234008789, "global_step": 182021, "epoch": 1083} {"train_loss": -11.62588119506836, "global_step": 182022, "epoch": 1083} {"train_loss": -11.157604217529297, "global_step": 182023, "epoch": 1083} {"train_loss": -10.897820472717285, "global_step": 182024, "epoch": 1083} {"train_loss": -11.451262474060059, "global_step": 182025, "epoch": 1083} {"train_loss": -11.075092315673828, "global_step": 182026, "epoch": 1083} {"train_loss": -10.780743598937988, "global_step": 182027, "epoch": 1083} {"train_loss": -11.22838306427002, "global_step": 182028, "epoch": 1083} {"train_loss": -10.936878204345703, "global_step": 182029, "epoch": 1083} {"train_loss": -10.691330909729004, "global_step": 182030, "epoch": 1083} {"train_loss": -10.724376678466797, "global_step": 182031, "epoch": 1083} {"train_loss": -9.376747131347656, "global_step": 182032, "epoch": 1083} {"train_loss": -10.92708683013916, "global_step": 182033, "epoch": 1083} {"train_loss": -10.405747413635254, "global_step": 182034, "epoch": 1083} {"train_loss": -9.383792877197266, "global_step": 182035, "epoch": 1083} {"train_loss": -10.920841217041016, "global_step": 182036, "epoch": 1083} {"train_loss": -10.57272720336914, "global_step": 182037, "epoch": 1083} {"train_loss": -10.55227279663086, "global_step": 182038, "epoch": 1083} {"train_loss": -11.069578170776367, "global_step": 182039, "epoch": 1083} {"train_loss": -10.317193984985352, "global_step": 182040, "epoch": 1083} {"train_loss": -10.992927551269531, "global_step": 182041, "epoch": 1083} {"train_loss": -10.806578636169434, "global_step": 182042, "epoch": 1083} {"train_loss": -11.368577003479004, "global_step": 182043, "epoch": 1083} {"train_loss": -11.103872299194336, "global_step": 182044, "epoch": 1083} {"train_loss": -11.401168823242188, "global_step": 182045, "epoch": 1083} {"train_loss": -11.136899948120117, "global_step": 182046, "epoch": 1083} {"train_loss": -10.840938568115234, "global_step": 182047, "epoch": 1083} {"train_loss": -11.071939468383789, "global_step": 182048, "epoch": 1083} {"train_loss": -10.867691993713379, "global_step": 182049, "epoch": 1083} {"train_loss": -11.23509407043457, "global_step": 182050, "epoch": 1083} {"train_loss": -11.276025772094727, "global_step": 182051, "epoch": 1083} {"train_loss": -10.964540481567383, "global_step": 182052, "epoch": 1083} {"train_loss": -11.449041366577148, "global_step": 182053, "epoch": 1083} {"train_loss": -11.26712417602539, "global_step": 182054, "epoch": 1083} {"train_loss": -10.965076446533203, "global_step": 182055, "epoch": 1083} {"train_loss": -11.236852645874023, "global_step": 182056, "epoch": 1083} {"train_loss": -11.552526473999023, "global_step": 182057, "epoch": 1083} {"train_loss": -11.137763977050781, "global_step": 182058, "epoch": 1083} {"train_loss": -11.267202377319336, "global_step": 182059, "epoch": 1083} {"train_loss": -11.400411605834961, "global_step": 182060, "epoch": 1083} {"train_loss": -11.386716842651367, "global_step": 182061, "epoch": 1083} {"train_loss": -11.445110321044922, "global_step": 182062, "epoch": 1083} {"train_loss": -11.329463005065918, "global_step": 182063, "epoch": 1083} {"train_loss": -11.543368339538574, "global_step": 182064, "epoch": 1083} {"train_loss": -11.230110168457031, "global_step": 182065, "epoch": 1083} {"train_loss": -11.457104682922363, "global_step": 182066, "epoch": 1083} {"train_loss": -11.48617935180664, "global_step": 182067, "epoch": 1083} {"train_loss": -11.489383697509766, "global_step": 182068, "epoch": 1083} {"train_loss": -11.441118240356445, "global_step": 182069, "epoch": 1083} {"train_loss": -11.514307022094727, "global_step": 182070, "epoch": 1083} {"train_loss": -11.520015716552734, "global_step": 182071, "epoch": 1083} {"train_loss": -11.734246253967285, "global_step": 182072, "epoch": 1083} {"train_loss": -11.359790802001953, "global_step": 182073, "epoch": 1083} {"train_loss": -11.521656036376953, "global_step": 182074, "epoch": 1083} {"train_loss": -11.491111755371094, "global_step": 182075, "epoch": 1083} {"train_loss": -11.371572494506836, "global_step": 182076, "epoch": 1083} {"train_loss": -11.470064163208008, "global_step": 182077, "epoch": 1083} {"train_loss": -11.625223159790039, "global_step": 182078, "epoch": 1083} {"train_loss": -10.955348014831543, "global_step": 182079, "epoch": 1083} {"train_loss": -11.6406888961792, "global_step": 182080, "epoch": 1083} {"train_loss": -11.372810363769531, "global_step": 182081, "epoch": 1083} {"train_loss": -11.043739318847656, "global_step": 182082, "epoch": 1083} {"train_loss": -11.198923110961914, "global_step": 182083, "epoch": 1083} {"train_loss": -11.333383560180664, "global_step": 182084, "epoch": 1083} {"train_loss": -10.955955505371094, "global_step": 182085, "epoch": 1083} {"train_loss": -11.19070053100586, "global_step": 182086, "epoch": 1083} {"train_loss": -11.426340103149414, "global_step": 182087, "epoch": 1083} {"train_loss": -10.866033554077148, "global_step": 182088, "epoch": 1083} {"train_loss": -11.150444030761719, "global_step": 182089, "epoch": 1083} {"train_loss": -10.866900444030762, "global_step": 182090, "epoch": 1083} {"train_loss": -10.41622543334961, "global_step": 182091, "epoch": 1083} {"train_loss": -11.041563034057617, "global_step": 182092, "epoch": 1083} {"train_loss": -10.991600036621094, "global_step": 182093, "epoch": 1083} {"train_loss": -10.027393341064453, "global_step": 182094, "epoch": 1083} {"train_loss": -10.238128662109375, "global_step": 182095, "epoch": 1083} {"train_loss": -11.310672760009766, "global_step": 182096, "epoch": 1083} {"train_loss": -11.183677673339844, "global_step": 182097, "epoch": 1083} {"train_loss": -10.527673721313477, "global_step": 182098, "epoch": 1083} {"train_loss": -10.88115119934082, "global_step": 182099, "epoch": 1083} {"train_loss": -10.759074211120605, "global_step": 182100, "epoch": 1083} {"train_loss": -10.941494941711426, "global_step": 182101, "epoch": 1083} {"train_loss": -10.912919998168945, "global_step": 182102, "epoch": 1083} {"train_loss": -10.619997024536133, "global_step": 182103, "epoch": 1083} {"train_loss": -11.307899475097656, "global_step": 182104, "epoch": 1083} {"train_loss": -10.199495315551758, "global_step": 182105, "epoch": 1083} {"train_loss": -10.857027053833008, "global_step": 182106, "epoch": 1083} {"train_loss": -10.755644798278809, "global_step": 182107, "epoch": 1083} {"train_loss": -10.657297134399414, "global_step": 182108, "epoch": 1083} {"train_loss": -10.730632781982422, "global_step": 182109, "epoch": 1083} {"train_loss": -10.841779708862305, "global_step": 182110, "epoch": 1083} {"train_loss": -10.890806311652774, "global_step": 182111, "epoch": 1083, "val_loss": 239665.046875} {"train_loss": -11.001049041748047, "global_step": 182112, "epoch": 1084} {"train_loss": -10.928497314453125, "global_step": 182113, "epoch": 1084} {"train_loss": -11.162403106689453, "global_step": 182114, "epoch": 1084} {"train_loss": -10.797809600830078, "global_step": 182115, "epoch": 1084} {"train_loss": -11.1315279006958, "global_step": 182116, "epoch": 1084} {"train_loss": -10.81618595123291, "global_step": 182117, "epoch": 1084} {"train_loss": -11.000238418579102, "global_step": 182118, "epoch": 1084} {"train_loss": -10.985462188720703, "global_step": 182119, "epoch": 1084} {"train_loss": -10.910696983337402, "global_step": 182120, "epoch": 1084} {"train_loss": -10.563344955444336, "global_step": 182121, "epoch": 1084} {"train_loss": -10.657258033752441, "global_step": 182122, "epoch": 1084} {"train_loss": -10.484261512756348, "global_step": 182123, "epoch": 1084} {"train_loss": -11.183573722839355, "global_step": 182124, "epoch": 1084} {"train_loss": -10.719192504882812, "global_step": 182125, "epoch": 1084} {"train_loss": -11.251977920532227, "global_step": 182126, "epoch": 1084} {"train_loss": -10.717355728149414, "global_step": 182127, "epoch": 1084} {"train_loss": -10.936182022094727, "global_step": 182128, "epoch": 1084} {"train_loss": -11.121732711791992, "global_step": 182129, "epoch": 1084} {"train_loss": -10.939451217651367, "global_step": 182130, "epoch": 1084} {"train_loss": -11.226280212402344, "global_step": 182131, "epoch": 1084} {"train_loss": -10.882100105285645, "global_step": 182132, "epoch": 1084} {"train_loss": -11.187490463256836, "global_step": 182133, "epoch": 1084} {"train_loss": -11.04920768737793, "global_step": 182134, "epoch": 1084} {"train_loss": -10.996133804321289, "global_step": 182135, "epoch": 1084} {"train_loss": -11.234153747558594, "global_step": 182136, "epoch": 1084} {"train_loss": -11.290428161621094, "global_step": 182137, "epoch": 1084} {"train_loss": -10.862295150756836, "global_step": 182138, "epoch": 1084} {"train_loss": -11.27552318572998, "global_step": 182139, "epoch": 1084} {"train_loss": -10.969449043273926, "global_step": 182140, "epoch": 1084} {"train_loss": -11.4951810836792, "global_step": 182141, "epoch": 1084} {"train_loss": -11.103250503540039, "global_step": 182142, "epoch": 1084} {"train_loss": -11.189765930175781, "global_step": 182143, "epoch": 1084} {"train_loss": -10.9949312210083, "global_step": 182144, "epoch": 1084} {"train_loss": -11.467942237854004, "global_step": 182145, "epoch": 1084} {"train_loss": -11.31375503540039, "global_step": 182146, "epoch": 1084} {"train_loss": -11.223984718322754, "global_step": 182147, "epoch": 1084} {"train_loss": -11.25044059753418, "global_step": 182148, "epoch": 1084} {"train_loss": -11.410703659057617, "global_step": 182149, "epoch": 1084} {"train_loss": -11.301873207092285, "global_step": 182150, "epoch": 1084} {"train_loss": -11.352127075195312, "global_step": 182151, "epoch": 1084} {"train_loss": -11.416022300720215, "global_step": 182152, "epoch": 1084} {"train_loss": -11.480765342712402, "global_step": 182153, "epoch": 1084} {"train_loss": -11.482231140136719, "global_step": 182154, "epoch": 1084} {"train_loss": -11.228628158569336, "global_step": 182155, "epoch": 1084} {"train_loss": -11.543140411376953, "global_step": 182156, "epoch": 1084} {"train_loss": -11.236128807067871, "global_step": 182157, "epoch": 1084} {"train_loss": -11.19048023223877, "global_step": 182158, "epoch": 1084} {"train_loss": -11.314088821411133, "global_step": 182159, "epoch": 1084} {"train_loss": -11.350448608398438, "global_step": 182160, "epoch": 1084} {"train_loss": -11.331816673278809, "global_step": 182161, "epoch": 1084} {"train_loss": -11.205364227294922, "global_step": 182162, "epoch": 1084} {"train_loss": -11.657846450805664, "global_step": 182163, "epoch": 1084} {"train_loss": -11.397515296936035, "global_step": 182164, "epoch": 1084} {"train_loss": -11.1218900680542, "global_step": 182165, "epoch": 1084} {"train_loss": -11.408815383911133, "global_step": 182166, "epoch": 1084} {"train_loss": -10.940134048461914, "global_step": 182167, "epoch": 1084} {"train_loss": -11.521549224853516, "global_step": 182168, "epoch": 1084} {"train_loss": -10.672541618347168, "global_step": 182169, "epoch": 1084} {"train_loss": -10.973308563232422, "global_step": 182170, "epoch": 1084} {"train_loss": -11.038183212280273, "global_step": 182171, "epoch": 1084} {"train_loss": -11.271194458007812, "global_step": 182172, "epoch": 1084} {"train_loss": -11.107223510742188, "global_step": 182173, "epoch": 1084} {"train_loss": -11.11915111541748, "global_step": 182174, "epoch": 1084} {"train_loss": -10.905618667602539, "global_step": 182175, "epoch": 1084} {"train_loss": -11.300344467163086, "global_step": 182176, "epoch": 1084} {"train_loss": -10.980183601379395, "global_step": 182177, "epoch": 1084} {"train_loss": -11.564765930175781, "global_step": 182178, "epoch": 1084} {"train_loss": -10.531213760375977, "global_step": 182179, "epoch": 1084} {"train_loss": -11.391706466674805, "global_step": 182180, "epoch": 1084} {"train_loss": -10.764171600341797, "global_step": 182181, "epoch": 1084} {"train_loss": -10.449527740478516, "global_step": 182182, "epoch": 1084} {"train_loss": -10.984695434570312, "global_step": 182183, "epoch": 1084} {"train_loss": -10.53994369506836, "global_step": 182184, "epoch": 1084} {"train_loss": -10.873208999633789, "global_step": 182185, "epoch": 1084} {"train_loss": -9.912830352783203, "global_step": 182186, "epoch": 1084} {"train_loss": -11.238119125366211, "global_step": 182187, "epoch": 1084} {"train_loss": -9.104809761047363, "global_step": 182188, "epoch": 1084} {"train_loss": -10.608878135681152, "global_step": 182189, "epoch": 1084} {"train_loss": -10.755887031555176, "global_step": 182190, "epoch": 1084} {"train_loss": -9.679695129394531, "global_step": 182191, "epoch": 1084} {"train_loss": -10.251994132995605, "global_step": 182192, "epoch": 1084} {"train_loss": -10.556398391723633, "global_step": 182193, "epoch": 1084} {"train_loss": -10.759086608886719, "global_step": 182194, "epoch": 1084} {"train_loss": -10.52522087097168, "global_step": 182195, "epoch": 1084} {"train_loss": -11.084081649780273, "global_step": 182196, "epoch": 1084} {"train_loss": -10.572303771972656, "global_step": 182197, "epoch": 1084} {"train_loss": -11.188713073730469, "global_step": 182198, "epoch": 1084} {"train_loss": -10.87369155883789, "global_step": 182199, "epoch": 1084} {"train_loss": -10.844121932983398, "global_step": 182200, "epoch": 1084} {"train_loss": -11.149686813354492, "global_step": 182201, "epoch": 1084} {"train_loss": -10.937103271484375, "global_step": 182202, "epoch": 1084} {"train_loss": -11.240097045898438, "global_step": 182203, "epoch": 1084} {"train_loss": -11.166994094848633, "global_step": 182204, "epoch": 1084} {"train_loss": -11.14317512512207, "global_step": 182205, "epoch": 1084} {"train_loss": -11.032828330993652, "global_step": 182206, "epoch": 1084} {"train_loss": -11.075644493103027, "global_step": 182207, "epoch": 1084} {"train_loss": -10.777438163757324, "global_step": 182208, "epoch": 1084} {"train_loss": -11.1468505859375, "global_step": 182209, "epoch": 1084} {"train_loss": -11.139262199401855, "global_step": 182210, "epoch": 1084} {"train_loss": -10.915752410888672, "global_step": 182211, "epoch": 1084} {"train_loss": -10.980375289916992, "global_step": 182212, "epoch": 1084} {"train_loss": -11.07733154296875, "global_step": 182213, "epoch": 1084} {"train_loss": -10.967144012451172, "global_step": 182214, "epoch": 1084} {"train_loss": -11.221731185913086, "global_step": 182215, "epoch": 1084} {"train_loss": -10.748477935791016, "global_step": 182216, "epoch": 1084} {"train_loss": -11.028749465942383, "global_step": 182217, "epoch": 1084} {"train_loss": -11.017833709716797, "global_step": 182218, "epoch": 1084} {"train_loss": -10.995951652526855, "global_step": 182219, "epoch": 1084} {"train_loss": -10.716374397277832, "global_step": 182220, "epoch": 1084} {"train_loss": -10.333946228027344, "global_step": 182221, "epoch": 1084} {"train_loss": -10.6669340133667, "global_step": 182222, "epoch": 1084} {"train_loss": -10.239307403564453, "global_step": 182223, "epoch": 1084} {"train_loss": -11.111568450927734, "global_step": 182224, "epoch": 1084} {"train_loss": -10.460884094238281, "global_step": 182225, "epoch": 1084} {"train_loss": -10.420828819274902, "global_step": 182226, "epoch": 1084} {"train_loss": -10.665672302246094, "global_step": 182227, "epoch": 1084} {"train_loss": -10.6868257522583, "global_step": 182228, "epoch": 1084} {"train_loss": -10.815485000610352, "global_step": 182229, "epoch": 1084} {"train_loss": -10.535894393920898, "global_step": 182230, "epoch": 1084} {"train_loss": -10.362565994262695, "global_step": 182231, "epoch": 1084} {"train_loss": -10.81436538696289, "global_step": 182232, "epoch": 1084} {"train_loss": -10.46468734741211, "global_step": 182233, "epoch": 1084} {"train_loss": -10.896262168884277, "global_step": 182234, "epoch": 1084} {"train_loss": -10.777477264404297, "global_step": 182235, "epoch": 1084} {"train_loss": -10.77999210357666, "global_step": 182236, "epoch": 1084} {"train_loss": -11.311861038208008, "global_step": 182237, "epoch": 1084} {"train_loss": -10.911848068237305, "global_step": 182238, "epoch": 1084} {"train_loss": -11.184576034545898, "global_step": 182239, "epoch": 1084} {"train_loss": -11.09294319152832, "global_step": 182240, "epoch": 1084} {"train_loss": -11.142108917236328, "global_step": 182241, "epoch": 1084} {"train_loss": -11.120561599731445, "global_step": 182242, "epoch": 1084} {"train_loss": -11.19893741607666, "global_step": 182243, "epoch": 1084} {"train_loss": -11.296347618103027, "global_step": 182244, "epoch": 1084} {"train_loss": -11.171107292175293, "global_step": 182245, "epoch": 1084} {"train_loss": -11.109509468078613, "global_step": 182246, "epoch": 1084} {"train_loss": -11.365665435791016, "global_step": 182247, "epoch": 1084} {"train_loss": -11.060565948486328, "global_step": 182248, "epoch": 1084} {"train_loss": -10.992172241210938, "global_step": 182249, "epoch": 1084} {"train_loss": -11.174200057983398, "global_step": 182250, "epoch": 1084} {"train_loss": -11.275572776794434, "global_step": 182251, "epoch": 1084} {"train_loss": -11.029024124145508, "global_step": 182252, "epoch": 1084} {"train_loss": -11.296792030334473, "global_step": 182253, "epoch": 1084} {"train_loss": -11.199156761169434, "global_step": 182254, "epoch": 1084} {"train_loss": -11.348319053649902, "global_step": 182255, "epoch": 1084} {"train_loss": -11.19973373413086, "global_step": 182256, "epoch": 1084} {"train_loss": -11.382699966430664, "global_step": 182257, "epoch": 1084} {"train_loss": -11.159570693969727, "global_step": 182258, "epoch": 1084} {"train_loss": -11.325590133666992, "global_step": 182259, "epoch": 1084} {"train_loss": -11.288579940795898, "global_step": 182260, "epoch": 1084} {"train_loss": -11.287923812866211, "global_step": 182261, "epoch": 1084} {"train_loss": -11.257850646972656, "global_step": 182262, "epoch": 1084} {"train_loss": -11.295089721679688, "global_step": 182263, "epoch": 1084} {"train_loss": -11.535419464111328, "global_step": 182264, "epoch": 1084} {"train_loss": -11.314779281616211, "global_step": 182265, "epoch": 1084} {"train_loss": -11.340034484863281, "global_step": 182266, "epoch": 1084} {"train_loss": -11.46681022644043, "global_step": 182267, "epoch": 1084} {"train_loss": -11.22060775756836, "global_step": 182268, "epoch": 1084} {"train_loss": -11.46515941619873, "global_step": 182269, "epoch": 1084} {"train_loss": -11.232658386230469, "global_step": 182270, "epoch": 1084} {"train_loss": -11.658347129821777, "global_step": 182271, "epoch": 1084} {"train_loss": -11.387645721435547, "global_step": 182272, "epoch": 1084} {"train_loss": -11.381659507751465, "global_step": 182273, "epoch": 1084} {"train_loss": -11.58539867401123, "global_step": 182274, "epoch": 1084} {"train_loss": -11.305514335632324, "global_step": 182275, "epoch": 1084} {"train_loss": -11.526199340820312, "global_step": 182276, "epoch": 1084} {"train_loss": -11.610345840454102, "global_step": 182277, "epoch": 1084} {"train_loss": -11.054000854492188, "global_step": 182278, "epoch": 1084} {"train_loss": -11.041707901727586, "global_step": 182279, "epoch": 1084, "val_loss": 242408.015625} {"train_loss": -10.363089561462402, "global_step": 182280, "epoch": 1085} {"train_loss": -10.50302505493164, "global_step": 182281, "epoch": 1085} {"train_loss": -10.880270957946777, "global_step": 182282, "epoch": 1085} {"train_loss": -11.007156372070312, "global_step": 182283, "epoch": 1085} {"train_loss": -10.71354866027832, "global_step": 182284, "epoch": 1085} {"train_loss": -11.247835159301758, "global_step": 182285, "epoch": 1085} {"train_loss": -10.583259582519531, "global_step": 182286, "epoch": 1085} {"train_loss": -11.480359077453613, "global_step": 182287, "epoch": 1085} {"train_loss": -10.54826545715332, "global_step": 182288, "epoch": 1085} {"train_loss": -11.271703720092773, "global_step": 182289, "epoch": 1085} {"train_loss": -10.691268920898438, "global_step": 182290, "epoch": 1085} {"train_loss": -11.31226634979248, "global_step": 182291, "epoch": 1085} {"train_loss": -10.903852462768555, "global_step": 182292, "epoch": 1085} {"train_loss": -11.23484992980957, "global_step": 182293, "epoch": 1085} {"train_loss": -11.106422424316406, "global_step": 182294, "epoch": 1085} {"train_loss": -10.95418930053711, "global_step": 182295, "epoch": 1085} {"train_loss": -11.131255149841309, "global_step": 182296, "epoch": 1085} {"train_loss": -10.565324783325195, "global_step": 182297, "epoch": 1085} {"train_loss": -10.77722454071045, "global_step": 182298, "epoch": 1085} {"train_loss": -11.132741928100586, "global_step": 182299, "epoch": 1085} {"train_loss": -10.74953842163086, "global_step": 182300, "epoch": 1085} {"train_loss": -11.09061050415039, "global_step": 182301, "epoch": 1085} {"train_loss": -10.889175415039062, "global_step": 182302, "epoch": 1085} {"train_loss": -11.240436553955078, "global_step": 182303, "epoch": 1085} {"train_loss": -10.538745880126953, "global_step": 182304, "epoch": 1085} {"train_loss": -10.771060943603516, "global_step": 182305, "epoch": 1085} {"train_loss": -11.039104461669922, "global_step": 182306, "epoch": 1085} {"train_loss": -10.451032638549805, "global_step": 182307, "epoch": 1085} {"train_loss": -11.1089448928833, "global_step": 182308, "epoch": 1085} {"train_loss": -10.142879486083984, "global_step": 182309, "epoch": 1085} {"train_loss": -10.680791854858398, "global_step": 182310, "epoch": 1085} {"train_loss": -10.835561752319336, "global_step": 182311, "epoch": 1085} {"train_loss": -9.717299461364746, "global_step": 182312, "epoch": 1085} {"train_loss": -10.912321090698242, "global_step": 182313, "epoch": 1085} {"train_loss": -10.011638641357422, "global_step": 182314, "epoch": 1085} {"train_loss": -10.450515747070312, "global_step": 182315, "epoch": 1085} {"train_loss": -10.800150871276855, "global_step": 182316, "epoch": 1085} {"train_loss": -10.156858444213867, "global_step": 182317, "epoch": 1085} {"train_loss": -11.28004264831543, "global_step": 182318, "epoch": 1085} {"train_loss": -9.777283668518066, "global_step": 182319, "epoch": 1085} {"train_loss": -10.920280456542969, "global_step": 182320, "epoch": 1085} {"train_loss": -11.036283493041992, "global_step": 182321, "epoch": 1085} {"train_loss": -10.859517097473145, "global_step": 182322, "epoch": 1085} {"train_loss": -11.185831069946289, "global_step": 182323, "epoch": 1085} {"train_loss": -11.019325256347656, "global_step": 182324, "epoch": 1085} {"train_loss": -10.902613639831543, "global_step": 182325, "epoch": 1085} {"train_loss": -10.973997116088867, "global_step": 182326, "epoch": 1085} {"train_loss": -11.17538833618164, "global_step": 182327, "epoch": 1085} {"train_loss": -10.837759017944336, "global_step": 182328, "epoch": 1085} {"train_loss": -11.435975074768066, "global_step": 182329, "epoch": 1085} {"train_loss": -10.92332649230957, "global_step": 182330, "epoch": 1085} {"train_loss": -11.22219181060791, "global_step": 182331, "epoch": 1085} {"train_loss": -11.292932510375977, "global_step": 182332, "epoch": 1085} {"train_loss": -11.1609468460083, "global_step": 182333, "epoch": 1085} {"train_loss": -11.386957168579102, "global_step": 182334, "epoch": 1085} {"train_loss": -11.308841705322266, "global_step": 182335, "epoch": 1085} {"train_loss": -11.251066207885742, "global_step": 182336, "epoch": 1085} {"train_loss": -11.295943260192871, "global_step": 182337, "epoch": 1085} {"train_loss": -11.298273086547852, "global_step": 182338, "epoch": 1085} {"train_loss": -11.283464431762695, "global_step": 182339, "epoch": 1085} {"train_loss": -10.90490436553955, "global_step": 182340, "epoch": 1085} {"train_loss": -11.193344116210938, "global_step": 182341, "epoch": 1085} {"train_loss": -11.167816162109375, "global_step": 182342, "epoch": 1085} {"train_loss": -11.030098915100098, "global_step": 182343, "epoch": 1085} {"train_loss": -11.391830444335938, "global_step": 182344, "epoch": 1085} {"train_loss": -11.222250938415527, "global_step": 182345, "epoch": 1085} {"train_loss": -11.438478469848633, "global_step": 182346, "epoch": 1085} {"train_loss": -11.129585266113281, "global_step": 182347, "epoch": 1085} {"train_loss": -11.022655487060547, "global_step": 182348, "epoch": 1085} {"train_loss": -11.43387222290039, "global_step": 182349, "epoch": 1085} {"train_loss": -11.326156616210938, "global_step": 182350, "epoch": 1085} {"train_loss": -11.303627014160156, "global_step": 182351, "epoch": 1085} {"train_loss": -11.410332679748535, "global_step": 182352, "epoch": 1085} {"train_loss": -11.436655044555664, "global_step": 182353, "epoch": 1085} {"train_loss": -11.304490089416504, "global_step": 182354, "epoch": 1085} {"train_loss": -11.318914413452148, "global_step": 182355, "epoch": 1085} {"train_loss": -11.342642784118652, "global_step": 182356, "epoch": 1085} {"train_loss": -11.057313919067383, "global_step": 182357, "epoch": 1085} {"train_loss": -11.317424774169922, "global_step": 182358, "epoch": 1085} {"train_loss": -11.547945022583008, "global_step": 182359, "epoch": 1085} {"train_loss": -11.3002347946167, "global_step": 182360, "epoch": 1085} {"train_loss": -11.485538482666016, "global_step": 182361, "epoch": 1085} {"train_loss": -11.195131301879883, "global_step": 182362, "epoch": 1085} {"train_loss": -11.360172271728516, "global_step": 182363, "epoch": 1085} {"train_loss": -11.350423812866211, "global_step": 182364, "epoch": 1085} {"train_loss": -11.656631469726562, "global_step": 182365, "epoch": 1085} {"train_loss": -10.964198112487793, "global_step": 182366, "epoch": 1085} {"train_loss": -10.672733306884766, "global_step": 182367, "epoch": 1085} {"train_loss": -11.274343490600586, "global_step": 182368, "epoch": 1085} {"train_loss": -11.221699714660645, "global_step": 182369, "epoch": 1085} {"train_loss": -10.688727378845215, "global_step": 182370, "epoch": 1085} {"train_loss": -11.254831314086914, "global_step": 182371, "epoch": 1085} {"train_loss": -11.1071195602417, "global_step": 182372, "epoch": 1085} {"train_loss": -10.936639785766602, "global_step": 182373, "epoch": 1085} {"train_loss": -11.067699432373047, "global_step": 182374, "epoch": 1085} {"train_loss": -11.310239791870117, "global_step": 182375, "epoch": 1085} {"train_loss": -10.233440399169922, "global_step": 182376, "epoch": 1085} {"train_loss": -10.896405220031738, "global_step": 182377, "epoch": 1085} {"train_loss": -11.015466690063477, "global_step": 182378, "epoch": 1085} {"train_loss": -9.738197326660156, "global_step": 182379, "epoch": 1085} {"train_loss": -11.10610580444336, "global_step": 182380, "epoch": 1085} {"train_loss": -10.529212951660156, "global_step": 182381, "epoch": 1085} {"train_loss": -10.638227462768555, "global_step": 182382, "epoch": 1085} {"train_loss": -11.060955047607422, "global_step": 182383, "epoch": 1085} {"train_loss": -10.730175018310547, "global_step": 182384, "epoch": 1085} {"train_loss": -11.248686790466309, "global_step": 182385, "epoch": 1085} {"train_loss": -11.094732284545898, "global_step": 182386, "epoch": 1085} {"train_loss": -11.033493995666504, "global_step": 182387, "epoch": 1085} {"train_loss": -11.085025787353516, "global_step": 182388, "epoch": 1085} {"train_loss": -11.08345890045166, "global_step": 182389, "epoch": 1085} {"train_loss": -10.826738357543945, "global_step": 182390, "epoch": 1085} {"train_loss": -10.701672554016113, "global_step": 182391, "epoch": 1085} {"train_loss": -10.196144104003906, "global_step": 182392, "epoch": 1085} {"train_loss": -10.921674728393555, "global_step": 182393, "epoch": 1085} {"train_loss": -9.882569313049316, "global_step": 182394, "epoch": 1085} {"train_loss": -11.160455703735352, "global_step": 182395, "epoch": 1085} {"train_loss": -9.993606567382812, "global_step": 182396, "epoch": 1085} {"train_loss": -10.641227722167969, "global_step": 182397, "epoch": 1085} {"train_loss": -10.407830238342285, "global_step": 182398, "epoch": 1085} {"train_loss": -10.42579174041748, "global_step": 182399, "epoch": 1085} {"train_loss": -10.908626556396484, "global_step": 182400, "epoch": 1085} {"train_loss": -10.351689338684082, "global_step": 182401, "epoch": 1085} {"train_loss": -10.92760181427002, "global_step": 182402, "epoch": 1085} {"train_loss": -10.758966445922852, "global_step": 182403, "epoch": 1085} {"train_loss": -10.714118957519531, "global_step": 182404, "epoch": 1085} {"train_loss": -10.98735523223877, "global_step": 182405, "epoch": 1085} {"train_loss": -10.980731010437012, "global_step": 182406, "epoch": 1085} {"train_loss": -11.04649543762207, "global_step": 182407, "epoch": 1085} {"train_loss": -10.723475456237793, "global_step": 182408, "epoch": 1085} {"train_loss": -10.9830322265625, "global_step": 182409, "epoch": 1085} {"train_loss": -11.052175521850586, "global_step": 182410, "epoch": 1085} {"train_loss": -10.948521614074707, "global_step": 182411, "epoch": 1085} {"train_loss": -10.85028076171875, "global_step": 182412, "epoch": 1085} {"train_loss": -10.780138969421387, "global_step": 182413, "epoch": 1085} {"train_loss": -10.953702926635742, "global_step": 182414, "epoch": 1085} {"train_loss": -10.946527481079102, "global_step": 182415, "epoch": 1085} {"train_loss": -11.253456115722656, "global_step": 182416, "epoch": 1085} {"train_loss": -11.033905982971191, "global_step": 182417, "epoch": 1085} {"train_loss": -11.028182983398438, "global_step": 182418, "epoch": 1085} {"train_loss": -10.727656364440918, "global_step": 182419, "epoch": 1085} {"train_loss": -11.082316398620605, "global_step": 182420, "epoch": 1085} {"train_loss": -11.287017822265625, "global_step": 182421, "epoch": 1085} {"train_loss": -11.166417121887207, "global_step": 182422, "epoch": 1085} {"train_loss": -11.27418327331543, "global_step": 182423, "epoch": 1085} {"train_loss": -11.044546127319336, "global_step": 182424, "epoch": 1085} {"train_loss": -10.761067390441895, "global_step": 182425, "epoch": 1085} {"train_loss": -11.170175552368164, "global_step": 182426, "epoch": 1085} {"train_loss": -11.065223693847656, "global_step": 182427, "epoch": 1085} {"train_loss": -11.127511024475098, "global_step": 182428, "epoch": 1085} {"train_loss": -11.098623275756836, "global_step": 182429, "epoch": 1085} {"train_loss": -11.269875526428223, "global_step": 182430, "epoch": 1085} {"train_loss": -11.202058792114258, "global_step": 182431, "epoch": 1085} {"train_loss": -11.0177001953125, "global_step": 182432, "epoch": 1085} {"train_loss": -11.122740745544434, "global_step": 182433, "epoch": 1085} {"train_loss": -11.095171928405762, "global_step": 182434, "epoch": 1085} {"train_loss": -11.066161155700684, "global_step": 182435, "epoch": 1085} {"train_loss": -10.712581634521484, "global_step": 182436, "epoch": 1085} {"train_loss": -10.60174560546875, "global_step": 182437, "epoch": 1085} {"train_loss": -11.273913383483887, "global_step": 182438, "epoch": 1085} {"train_loss": -10.801898956298828, "global_step": 182439, "epoch": 1085} {"train_loss": -11.111198425292969, "global_step": 182440, "epoch": 1085} {"train_loss": -11.226621627807617, "global_step": 182441, "epoch": 1085} {"train_loss": -10.869141578674316, "global_step": 182442, "epoch": 1085} {"train_loss": -11.192412376403809, "global_step": 182443, "epoch": 1085} {"train_loss": -11.04499626159668, "global_step": 182444, "epoch": 1085} {"train_loss": -11.057157516479492, "global_step": 182445, "epoch": 1085} {"train_loss": -10.859030723571777, "global_step": 182446, "epoch": 1085} {"train_loss": -10.96714447225843, "global_step": 182447, "epoch": 1085, "val_loss": 244876.546875, "train_action_mse_error": 1.6866159439086914} {"train_loss": -10.67593765258789, "global_step": 182448, "epoch": 1086} {"train_loss": -11.206476211547852, "global_step": 182449, "epoch": 1086} {"train_loss": -10.705475807189941, "global_step": 182450, "epoch": 1086} {"train_loss": -11.19767951965332, "global_step": 182451, "epoch": 1086} {"train_loss": -10.599971771240234, "global_step": 182452, "epoch": 1086} {"train_loss": -10.994823455810547, "global_step": 182453, "epoch": 1086} {"train_loss": -10.998568534851074, "global_step": 182454, "epoch": 1086} {"train_loss": -11.101631164550781, "global_step": 182455, "epoch": 1086} {"train_loss": -10.947306632995605, "global_step": 182456, "epoch": 1086} {"train_loss": -11.24023151397705, "global_step": 182457, "epoch": 1086} {"train_loss": -10.637636184692383, "global_step": 182458, "epoch": 1086} {"train_loss": -11.228352546691895, "global_step": 182459, "epoch": 1086} {"train_loss": -10.884729385375977, "global_step": 182460, "epoch": 1086} {"train_loss": -11.299318313598633, "global_step": 182461, "epoch": 1086} {"train_loss": -11.157703399658203, "global_step": 182462, "epoch": 1086} {"train_loss": -11.243846893310547, "global_step": 182463, "epoch": 1086} {"train_loss": -11.098878860473633, "global_step": 182464, "epoch": 1086} {"train_loss": -11.141797065734863, "global_step": 182465, "epoch": 1086} {"train_loss": -11.196901321411133, "global_step": 182466, "epoch": 1086} {"train_loss": -10.879589080810547, "global_step": 182467, "epoch": 1086} {"train_loss": -11.307830810546875, "global_step": 182468, "epoch": 1086} {"train_loss": -10.947303771972656, "global_step": 182469, "epoch": 1086} {"train_loss": -11.449470520019531, "global_step": 182470, "epoch": 1086} {"train_loss": -11.017046928405762, "global_step": 182471, "epoch": 1086} {"train_loss": -11.27095890045166, "global_step": 182472, "epoch": 1086} {"train_loss": -11.321608543395996, "global_step": 182473, "epoch": 1086} {"train_loss": -11.273506164550781, "global_step": 182474, "epoch": 1086} {"train_loss": -11.277835845947266, "global_step": 182475, "epoch": 1086} {"train_loss": -11.233843803405762, "global_step": 182476, "epoch": 1086} {"train_loss": -11.20448112487793, "global_step": 182477, "epoch": 1086} {"train_loss": -11.372186660766602, "global_step": 182478, "epoch": 1086} {"train_loss": -11.515148162841797, "global_step": 182479, "epoch": 1086} {"train_loss": -11.253549575805664, "global_step": 182480, "epoch": 1086} {"train_loss": -11.416000366210938, "global_step": 182481, "epoch": 1086} {"train_loss": -11.242622375488281, "global_step": 182482, "epoch": 1086} {"train_loss": -11.26885986328125, "global_step": 182483, "epoch": 1086} {"train_loss": -11.147151947021484, "global_step": 182484, "epoch": 1086} {"train_loss": -10.941095352172852, "global_step": 182485, "epoch": 1086} {"train_loss": -11.521003723144531, "global_step": 182486, "epoch": 1086} {"train_loss": -10.8714017868042, "global_step": 182487, "epoch": 1086} {"train_loss": -11.436046600341797, "global_step": 182488, "epoch": 1086} {"train_loss": -11.407831192016602, "global_step": 182489, "epoch": 1086} {"train_loss": -11.373541831970215, "global_step": 182490, "epoch": 1086} {"train_loss": -11.547758102416992, "global_step": 182491, "epoch": 1086} {"train_loss": -11.317638397216797, "global_step": 182492, "epoch": 1086} {"train_loss": -11.577217102050781, "global_step": 182493, "epoch": 1086} {"train_loss": -11.41744327545166, "global_step": 182494, "epoch": 1086} {"train_loss": -11.402200698852539, "global_step": 182495, "epoch": 1086} {"train_loss": -11.677536010742188, "global_step": 182496, "epoch": 1086} {"train_loss": -11.584836959838867, "global_step": 182497, "epoch": 1086} {"train_loss": -11.092275619506836, "global_step": 182498, "epoch": 1086} {"train_loss": -11.406600952148438, "global_step": 182499, "epoch": 1086} {"train_loss": -11.36606502532959, "global_step": 182500, "epoch": 1086} {"train_loss": -11.377817153930664, "global_step": 182501, "epoch": 1086} {"train_loss": -11.57049560546875, "global_step": 182502, "epoch": 1086} {"train_loss": -11.494362831115723, "global_step": 182503, "epoch": 1086} {"train_loss": -11.636444091796875, "global_step": 182504, "epoch": 1086} {"train_loss": -11.375411987304688, "global_step": 182505, "epoch": 1086} {"train_loss": -11.426828384399414, "global_step": 182506, "epoch": 1086} {"train_loss": -11.293754577636719, "global_step": 182507, "epoch": 1086} {"train_loss": -11.349647521972656, "global_step": 182508, "epoch": 1086} {"train_loss": -11.527033805847168, "global_step": 182509, "epoch": 1086} {"train_loss": -11.401787757873535, "global_step": 182510, "epoch": 1086} {"train_loss": -11.50466537475586, "global_step": 182511, "epoch": 1086} {"train_loss": -11.347558975219727, "global_step": 182512, "epoch": 1086} {"train_loss": -11.400028228759766, "global_step": 182513, "epoch": 1086} {"train_loss": -11.146140098571777, "global_step": 182514, "epoch": 1086} {"train_loss": -11.3298921585083, "global_step": 182515, "epoch": 1086} {"train_loss": -11.23072624206543, "global_step": 182516, "epoch": 1086} {"train_loss": -11.007071495056152, "global_step": 182517, "epoch": 1086} {"train_loss": -11.32524585723877, "global_step": 182518, "epoch": 1086} {"train_loss": -11.448912620544434, "global_step": 182519, "epoch": 1086} {"train_loss": -10.665574073791504, "global_step": 182520, "epoch": 1086} {"train_loss": -11.093490600585938, "global_step": 182521, "epoch": 1086} {"train_loss": -11.266355514526367, "global_step": 182522, "epoch": 1086} {"train_loss": -10.241439819335938, "global_step": 182523, "epoch": 1086} {"train_loss": -10.88885498046875, "global_step": 182524, "epoch": 1086} {"train_loss": -10.213041305541992, "global_step": 182525, "epoch": 1086} {"train_loss": -10.664323806762695, "global_step": 182526, "epoch": 1086} {"train_loss": -10.476299285888672, "global_step": 182527, "epoch": 1086} {"train_loss": -11.242411613464355, "global_step": 182528, "epoch": 1086} {"train_loss": -9.936424255371094, "global_step": 182529, "epoch": 1086} {"train_loss": -10.935309410095215, "global_step": 182530, "epoch": 1086} {"train_loss": -10.766220092773438, "global_step": 182531, "epoch": 1086} {"train_loss": -10.565816879272461, "global_step": 182532, "epoch": 1086} {"train_loss": -10.73477840423584, "global_step": 182533, "epoch": 1086} {"train_loss": -10.252052307128906, "global_step": 182534, "epoch": 1086} {"train_loss": -10.518375396728516, "global_step": 182535, "epoch": 1086} {"train_loss": -10.130210876464844, "global_step": 182536, "epoch": 1086} {"train_loss": -10.38640022277832, "global_step": 182537, "epoch": 1086} {"train_loss": -10.232522964477539, "global_step": 182538, "epoch": 1086} {"train_loss": -10.588159561157227, "global_step": 182539, "epoch": 1086} {"train_loss": -11.051912307739258, "global_step": 182540, "epoch": 1086} {"train_loss": -10.271974563598633, "global_step": 182541, "epoch": 1086} {"train_loss": -10.409687042236328, "global_step": 182542, "epoch": 1086} {"train_loss": -10.86075496673584, "global_step": 182543, "epoch": 1086} {"train_loss": -10.340777397155762, "global_step": 182544, "epoch": 1086} {"train_loss": -11.109734535217285, "global_step": 182545, "epoch": 1086} {"train_loss": -10.59598159790039, "global_step": 182546, "epoch": 1086} {"train_loss": -10.600234985351562, "global_step": 182547, "epoch": 1086} {"train_loss": -10.918961524963379, "global_step": 182548, "epoch": 1086} {"train_loss": -10.464405059814453, "global_step": 182549, "epoch": 1086} {"train_loss": -10.984436988830566, "global_step": 182550, "epoch": 1086} {"train_loss": -10.783758163452148, "global_step": 182551, "epoch": 1086} {"train_loss": -10.883184432983398, "global_step": 182552, "epoch": 1086} {"train_loss": -10.960163116455078, "global_step": 182553, "epoch": 1086} {"train_loss": -10.813218116760254, "global_step": 182554, "epoch": 1086} {"train_loss": -10.965295791625977, "global_step": 182555, "epoch": 1086} {"train_loss": -11.15932846069336, "global_step": 182556, "epoch": 1086} {"train_loss": -10.884221076965332, "global_step": 182557, "epoch": 1086} {"train_loss": -10.843704223632812, "global_step": 182558, "epoch": 1086} {"train_loss": -11.00149917602539, "global_step": 182559, "epoch": 1086} {"train_loss": -11.118133544921875, "global_step": 182560, "epoch": 1086} {"train_loss": -11.002978324890137, "global_step": 182561, "epoch": 1086} {"train_loss": -11.245227813720703, "global_step": 182562, "epoch": 1086} {"train_loss": -10.746038436889648, "global_step": 182563, "epoch": 1086} {"train_loss": -11.192171096801758, "global_step": 182564, "epoch": 1086} {"train_loss": -10.683300018310547, "global_step": 182565, "epoch": 1086} {"train_loss": -10.727578163146973, "global_step": 182566, "epoch": 1086} {"train_loss": -10.532754898071289, "global_step": 182567, "epoch": 1086} {"train_loss": -10.468256950378418, "global_step": 182568, "epoch": 1086} {"train_loss": -10.7686767578125, "global_step": 182569, "epoch": 1086} {"train_loss": -10.23689079284668, "global_step": 182570, "epoch": 1086} {"train_loss": -10.891338348388672, "global_step": 182571, "epoch": 1086} {"train_loss": -10.767513275146484, "global_step": 182572, "epoch": 1086} {"train_loss": -10.975593566894531, "global_step": 182573, "epoch": 1086} {"train_loss": -10.58806037902832, "global_step": 182574, "epoch": 1086} {"train_loss": -11.007612228393555, "global_step": 182575, "epoch": 1086} {"train_loss": -10.933171272277832, "global_step": 182576, "epoch": 1086} {"train_loss": -10.851582527160645, "global_step": 182577, "epoch": 1086} {"train_loss": -10.83302116394043, "global_step": 182578, "epoch": 1086} {"train_loss": -10.80921745300293, "global_step": 182579, "epoch": 1086} {"train_loss": -10.874551773071289, "global_step": 182580, "epoch": 1086} {"train_loss": -10.609918594360352, "global_step": 182581, "epoch": 1086} {"train_loss": -11.06503677368164, "global_step": 182582, "epoch": 1086} {"train_loss": -10.303884506225586, "global_step": 182583, "epoch": 1086} {"train_loss": -10.784571647644043, "global_step": 182584, "epoch": 1086} {"train_loss": -11.016874313354492, "global_step": 182585, "epoch": 1086} {"train_loss": -11.029409408569336, "global_step": 182586, "epoch": 1086} {"train_loss": -10.888246536254883, "global_step": 182587, "epoch": 1086} {"train_loss": -11.022281646728516, "global_step": 182588, "epoch": 1086} {"train_loss": -11.069616317749023, "global_step": 182589, "epoch": 1086} {"train_loss": -10.998859405517578, "global_step": 182590, "epoch": 1086} {"train_loss": -11.16974925994873, "global_step": 182591, "epoch": 1086} {"train_loss": -11.157885551452637, "global_step": 182592, "epoch": 1086} {"train_loss": -10.93731689453125, "global_step": 182593, "epoch": 1086} {"train_loss": -11.297296524047852, "global_step": 182594, "epoch": 1086} {"train_loss": -10.881959915161133, "global_step": 182595, "epoch": 1086} {"train_loss": -11.510164260864258, "global_step": 182596, "epoch": 1086} {"train_loss": -11.003466606140137, "global_step": 182597, "epoch": 1086} {"train_loss": -11.196788787841797, "global_step": 182598, "epoch": 1086} {"train_loss": -11.15151309967041, "global_step": 182599, "epoch": 1086} {"train_loss": -11.310279846191406, "global_step": 182600, "epoch": 1086} {"train_loss": -11.157525062561035, "global_step": 182601, "epoch": 1086} {"train_loss": -11.343884468078613, "global_step": 182602, "epoch": 1086} {"train_loss": -11.203868865966797, "global_step": 182603, "epoch": 1086} {"train_loss": -11.23519515991211, "global_step": 182604, "epoch": 1086} {"train_loss": -11.152721405029297, "global_step": 182605, "epoch": 1086} {"train_loss": -11.380393028259277, "global_step": 182606, "epoch": 1086} {"train_loss": -11.274996757507324, "global_step": 182607, "epoch": 1086} {"train_loss": -11.489877700805664, "global_step": 182608, "epoch": 1086} {"train_loss": -11.42554759979248, "global_step": 182609, "epoch": 1086} {"train_loss": -11.354710578918457, "global_step": 182610, "epoch": 1086} {"train_loss": -11.31788444519043, "global_step": 182611, "epoch": 1086} {"train_loss": -11.440526962280273, "global_step": 182612, "epoch": 1086} {"train_loss": -11.413787841796875, "global_step": 182613, "epoch": 1086} {"train_loss": -11.397114753723145, "global_step": 182614, "epoch": 1086} {"train_loss": -11.044212619463602, "global_step": 182615, "epoch": 1086, "val_loss": 245097.515625} {"train_loss": -11.447242736816406, "global_step": 182616, "epoch": 1087} {"train_loss": -11.293800354003906, "global_step": 182617, "epoch": 1087} {"train_loss": -11.359488487243652, "global_step": 182618, "epoch": 1087} {"train_loss": -11.47123908996582, "global_step": 182619, "epoch": 1087} {"train_loss": -11.189106941223145, "global_step": 182620, "epoch": 1087} {"train_loss": -11.276189804077148, "global_step": 182621, "epoch": 1087} {"train_loss": -11.245595932006836, "global_step": 182622, "epoch": 1087} {"train_loss": -11.110310554504395, "global_step": 182623, "epoch": 1087} {"train_loss": -11.245109558105469, "global_step": 182624, "epoch": 1087} {"train_loss": -11.117527961730957, "global_step": 182625, "epoch": 1087} {"train_loss": -11.224991798400879, "global_step": 182626, "epoch": 1087} {"train_loss": -10.508344650268555, "global_step": 182627, "epoch": 1087} {"train_loss": -11.541746139526367, "global_step": 182628, "epoch": 1087} {"train_loss": -10.881651878356934, "global_step": 182629, "epoch": 1087} {"train_loss": -11.220928192138672, "global_step": 182630, "epoch": 1087} {"train_loss": -11.266633987426758, "global_step": 182631, "epoch": 1087} {"train_loss": -10.451361656188965, "global_step": 182632, "epoch": 1087} {"train_loss": -11.22232723236084, "global_step": 182633, "epoch": 1087} {"train_loss": -10.709939956665039, "global_step": 182634, "epoch": 1087} {"train_loss": -10.880492210388184, "global_step": 182635, "epoch": 1087} {"train_loss": -10.902730941772461, "global_step": 182636, "epoch": 1087} {"train_loss": -11.065178871154785, "global_step": 182637, "epoch": 1087} {"train_loss": -11.217218399047852, "global_step": 182638, "epoch": 1087} {"train_loss": -11.114689826965332, "global_step": 182639, "epoch": 1087} {"train_loss": -11.134976387023926, "global_step": 182640, "epoch": 1087} {"train_loss": -10.855024337768555, "global_step": 182641, "epoch": 1087} {"train_loss": -11.031536102294922, "global_step": 182642, "epoch": 1087} {"train_loss": -10.145724296569824, "global_step": 182643, "epoch": 1087} {"train_loss": -10.730711936950684, "global_step": 182644, "epoch": 1087} {"train_loss": -10.43569278717041, "global_step": 182645, "epoch": 1087} {"train_loss": -10.581307411193848, "global_step": 182646, "epoch": 1087} {"train_loss": -10.845393180847168, "global_step": 182647, "epoch": 1087} {"train_loss": -9.928666114807129, "global_step": 182648, "epoch": 1087} {"train_loss": -11.184013366699219, "global_step": 182649, "epoch": 1087} {"train_loss": -9.762699127197266, "global_step": 182650, "epoch": 1087} {"train_loss": -10.869365692138672, "global_step": 182651, "epoch": 1087} {"train_loss": -10.01781940460205, "global_step": 182652, "epoch": 1087} {"train_loss": -10.008251190185547, "global_step": 182653, "epoch": 1087} {"train_loss": -9.185504913330078, "global_step": 182654, "epoch": 1087} {"train_loss": -10.799664497375488, "global_step": 182655, "epoch": 1087} {"train_loss": -9.20919418334961, "global_step": 182656, "epoch": 1087} {"train_loss": -10.194477081298828, "global_step": 182657, "epoch": 1087} {"train_loss": -9.965936660766602, "global_step": 182658, "epoch": 1087} {"train_loss": -10.575684547424316, "global_step": 182659, "epoch": 1087} {"train_loss": -9.81529426574707, "global_step": 182660, "epoch": 1087} {"train_loss": -10.696002960205078, "global_step": 182661, "epoch": 1087} {"train_loss": -9.964727401733398, "global_step": 182662, "epoch": 1087} {"train_loss": -10.03669548034668, "global_step": 182663, "epoch": 1087} {"train_loss": -10.880067825317383, "global_step": 182664, "epoch": 1087} {"train_loss": -9.857444763183594, "global_step": 182665, "epoch": 1087} {"train_loss": -11.02342414855957, "global_step": 182666, "epoch": 1087} {"train_loss": -10.320850372314453, "global_step": 182667, "epoch": 1087} {"train_loss": -11.013649940490723, "global_step": 182668, "epoch": 1087} {"train_loss": -10.512543678283691, "global_step": 182669, "epoch": 1087} {"train_loss": -10.665132522583008, "global_step": 182670, "epoch": 1087} {"train_loss": -10.748786926269531, "global_step": 182671, "epoch": 1087} {"train_loss": -10.89278507232666, "global_step": 182672, "epoch": 1087} {"train_loss": -10.945868492126465, "global_step": 182673, "epoch": 1087} {"train_loss": -10.845535278320312, "global_step": 182674, "epoch": 1087} {"train_loss": -10.65681266784668, "global_step": 182675, "epoch": 1087} {"train_loss": -10.78598690032959, "global_step": 182676, "epoch": 1087} {"train_loss": -10.234513282775879, "global_step": 182677, "epoch": 1087} {"train_loss": -10.527856826782227, "global_step": 182678, "epoch": 1087} {"train_loss": -10.137481689453125, "global_step": 182679, "epoch": 1087} {"train_loss": -10.61996078491211, "global_step": 182680, "epoch": 1087} {"train_loss": -10.64704418182373, "global_step": 182681, "epoch": 1087} {"train_loss": -10.175053596496582, "global_step": 182682, "epoch": 1087} {"train_loss": -11.176453590393066, "global_step": 182683, "epoch": 1087} {"train_loss": -10.596231460571289, "global_step": 182684, "epoch": 1087} {"train_loss": -10.968268394470215, "global_step": 182685, "epoch": 1087} {"train_loss": -10.674829483032227, "global_step": 182686, "epoch": 1087} {"train_loss": -11.071194648742676, "global_step": 182687, "epoch": 1087} {"train_loss": -10.762493133544922, "global_step": 182688, "epoch": 1087} {"train_loss": -10.86093521118164, "global_step": 182689, "epoch": 1087} {"train_loss": -10.96316146850586, "global_step": 182690, "epoch": 1087} {"train_loss": -10.727746963500977, "global_step": 182691, "epoch": 1087} {"train_loss": -11.175134658813477, "global_step": 182692, "epoch": 1087} {"train_loss": -11.035238265991211, "global_step": 182693, "epoch": 1087} {"train_loss": -11.284658432006836, "global_step": 182694, "epoch": 1087} {"train_loss": -11.0361909866333, "global_step": 182695, "epoch": 1087} {"train_loss": -11.126543045043945, "global_step": 182696, "epoch": 1087} {"train_loss": -11.048139572143555, "global_step": 182697, "epoch": 1087} {"train_loss": -11.116632461547852, "global_step": 182698, "epoch": 1087} {"train_loss": -11.099798202514648, "global_step": 182699, "epoch": 1087} {"train_loss": -11.31224250793457, "global_step": 182700, "epoch": 1087} {"train_loss": -11.265398979187012, "global_step": 182701, "epoch": 1087} {"train_loss": -11.115805625915527, "global_step": 182702, "epoch": 1087} {"train_loss": -11.165924072265625, "global_step": 182703, "epoch": 1087} {"train_loss": -11.378949165344238, "global_step": 182704, "epoch": 1087} {"train_loss": -11.181905746459961, "global_step": 182705, "epoch": 1087} {"train_loss": -11.329275131225586, "global_step": 182706, "epoch": 1087} {"train_loss": -11.33718204498291, "global_step": 182707, "epoch": 1087} {"train_loss": -11.424497604370117, "global_step": 182708, "epoch": 1087} {"train_loss": -11.257762908935547, "global_step": 182709, "epoch": 1087} {"train_loss": -11.192364692687988, "global_step": 182710, "epoch": 1087} {"train_loss": -11.263065338134766, "global_step": 182711, "epoch": 1087} {"train_loss": -11.382624626159668, "global_step": 182712, "epoch": 1087} {"train_loss": -11.255834579467773, "global_step": 182713, "epoch": 1087} {"train_loss": -11.4766845703125, "global_step": 182714, "epoch": 1087} {"train_loss": -11.440340995788574, "global_step": 182715, "epoch": 1087} {"train_loss": -11.423842430114746, "global_step": 182716, "epoch": 1087} {"train_loss": -11.373296737670898, "global_step": 182717, "epoch": 1087} {"train_loss": -11.600435256958008, "global_step": 182718, "epoch": 1087} {"train_loss": -11.126352310180664, "global_step": 182719, "epoch": 1087} {"train_loss": -11.404561996459961, "global_step": 182720, "epoch": 1087} {"train_loss": -11.448874473571777, "global_step": 182721, "epoch": 1087} {"train_loss": -11.637088775634766, "global_step": 182722, "epoch": 1087} {"train_loss": -11.460037231445312, "global_step": 182723, "epoch": 1087} {"train_loss": -11.441946029663086, "global_step": 182724, "epoch": 1087} {"train_loss": -11.465810775756836, "global_step": 182725, "epoch": 1087} {"train_loss": -11.580169677734375, "global_step": 182726, "epoch": 1087} {"train_loss": -11.542881965637207, "global_step": 182727, "epoch": 1087} {"train_loss": -11.762190818786621, "global_step": 182728, "epoch": 1087} {"train_loss": -11.51833438873291, "global_step": 182729, "epoch": 1087} {"train_loss": -11.293705940246582, "global_step": 182730, "epoch": 1087} {"train_loss": -11.579676628112793, "global_step": 182731, "epoch": 1087} {"train_loss": -11.535489082336426, "global_step": 182732, "epoch": 1087} {"train_loss": -11.391772270202637, "global_step": 182733, "epoch": 1087} {"train_loss": -11.356550216674805, "global_step": 182734, "epoch": 1087} {"train_loss": -11.773019790649414, "global_step": 182735, "epoch": 1087} {"train_loss": -11.506233215332031, "global_step": 182736, "epoch": 1087} {"train_loss": -11.44608211517334, "global_step": 182737, "epoch": 1087} {"train_loss": -11.409804344177246, "global_step": 182738, "epoch": 1087} {"train_loss": -11.275266647338867, "global_step": 182739, "epoch": 1087} {"train_loss": -11.105245590209961, "global_step": 182740, "epoch": 1087} {"train_loss": -10.838401794433594, "global_step": 182741, "epoch": 1087} {"train_loss": -11.041971206665039, "global_step": 182742, "epoch": 1087} {"train_loss": -10.936464309692383, "global_step": 182743, "epoch": 1087} {"train_loss": -11.365423202514648, "global_step": 182744, "epoch": 1087} {"train_loss": -10.86589241027832, "global_step": 182745, "epoch": 1087} {"train_loss": -11.501224517822266, "global_step": 182746, "epoch": 1087} {"train_loss": -10.482573509216309, "global_step": 182747, "epoch": 1087} {"train_loss": -10.958877563476562, "global_step": 182748, "epoch": 1087} {"train_loss": -10.923774719238281, "global_step": 182749, "epoch": 1087} {"train_loss": -10.807056427001953, "global_step": 182750, "epoch": 1087} {"train_loss": -10.814079284667969, "global_step": 182751, "epoch": 1087} {"train_loss": -10.973384857177734, "global_step": 182752, "epoch": 1087} {"train_loss": -10.972498893737793, "global_step": 182753, "epoch": 1087} {"train_loss": -10.582504272460938, "global_step": 182754, "epoch": 1087} {"train_loss": -10.691747665405273, "global_step": 182755, "epoch": 1087} {"train_loss": -11.352645874023438, "global_step": 182756, "epoch": 1087} {"train_loss": -10.262517929077148, "global_step": 182757, "epoch": 1087} {"train_loss": -10.93839168548584, "global_step": 182758, "epoch": 1087} {"train_loss": -10.774550437927246, "global_step": 182759, "epoch": 1087} {"train_loss": -11.140487670898438, "global_step": 182760, "epoch": 1087} {"train_loss": -11.068443298339844, "global_step": 182761, "epoch": 1087} {"train_loss": -10.510499954223633, "global_step": 182762, "epoch": 1087} {"train_loss": -10.478632926940918, "global_step": 182763, "epoch": 1087} {"train_loss": -10.515718460083008, "global_step": 182764, "epoch": 1087} {"train_loss": -10.812761306762695, "global_step": 182765, "epoch": 1087} {"train_loss": -10.127403259277344, "global_step": 182766, "epoch": 1087} {"train_loss": -10.78466510772705, "global_step": 182767, "epoch": 1087} {"train_loss": -10.867490768432617, "global_step": 182768, "epoch": 1087} {"train_loss": -10.503263473510742, "global_step": 182769, "epoch": 1087} {"train_loss": -11.319196701049805, "global_step": 182770, "epoch": 1087} {"train_loss": -10.066032409667969, "global_step": 182771, "epoch": 1087} {"train_loss": -11.07448959350586, "global_step": 182772, "epoch": 1087} {"train_loss": -10.774040222167969, "global_step": 182773, "epoch": 1087} {"train_loss": -10.725061416625977, "global_step": 182774, "epoch": 1087} {"train_loss": -10.928560256958008, "global_step": 182775, "epoch": 1087} {"train_loss": -10.010910034179688, "global_step": 182776, "epoch": 1087} {"train_loss": -10.929542541503906, "global_step": 182777, "epoch": 1087} {"train_loss": -10.431462287902832, "global_step": 182778, "epoch": 1087} {"train_loss": -11.147223472595215, "global_step": 182779, "epoch": 1087} {"train_loss": -10.807747840881348, "global_step": 182780, "epoch": 1087} {"train_loss": -10.847444534301758, "global_step": 182781, "epoch": 1087} {"train_loss": -10.751375198364258, "global_step": 182782, "epoch": 1087} {"train_loss": -10.922639318874904, "global_step": 182783, "epoch": 1087, "val_loss": 247369.0} {"train_loss": -10.582939147949219, "global_step": 182784, "epoch": 1088} {"train_loss": -10.833047866821289, "global_step": 182785, "epoch": 1088} {"train_loss": -10.851868629455566, "global_step": 182786, "epoch": 1088} {"train_loss": -11.113314628601074, "global_step": 182787, "epoch": 1088} {"train_loss": -10.878350257873535, "global_step": 182788, "epoch": 1088} {"train_loss": -10.747715950012207, "global_step": 182789, "epoch": 1088} {"train_loss": -11.243289947509766, "global_step": 182790, "epoch": 1088} {"train_loss": -11.02068042755127, "global_step": 182791, "epoch": 1088} {"train_loss": -10.96371841430664, "global_step": 182792, "epoch": 1088} {"train_loss": -11.10521411895752, "global_step": 182793, "epoch": 1088} {"train_loss": -11.273054122924805, "global_step": 182794, "epoch": 1088} {"train_loss": -11.040632247924805, "global_step": 182795, "epoch": 1088} {"train_loss": -11.00837230682373, "global_step": 182796, "epoch": 1088} {"train_loss": -11.105588912963867, "global_step": 182797, "epoch": 1088} {"train_loss": -11.226962089538574, "global_step": 182798, "epoch": 1088} {"train_loss": -10.763879776000977, "global_step": 182799, "epoch": 1088} {"train_loss": -11.289239883422852, "global_step": 182800, "epoch": 1088} {"train_loss": -11.013601303100586, "global_step": 182801, "epoch": 1088} {"train_loss": -11.139206886291504, "global_step": 182802, "epoch": 1088} {"train_loss": -10.98727798461914, "global_step": 182803, "epoch": 1088} {"train_loss": -11.232528686523438, "global_step": 182804, "epoch": 1088} {"train_loss": -10.991130828857422, "global_step": 182805, "epoch": 1088} {"train_loss": -11.21664810180664, "global_step": 182806, "epoch": 1088} {"train_loss": -11.117143630981445, "global_step": 182807, "epoch": 1088} {"train_loss": -11.427700996398926, "global_step": 182808, "epoch": 1088} {"train_loss": -11.257589340209961, "global_step": 182809, "epoch": 1088} {"train_loss": -11.271491050720215, "global_step": 182810, "epoch": 1088} {"train_loss": -11.024078369140625, "global_step": 182811, "epoch": 1088} {"train_loss": -11.147520065307617, "global_step": 182812, "epoch": 1088} {"train_loss": -11.080779075622559, "global_step": 182813, "epoch": 1088} {"train_loss": -11.187475204467773, "global_step": 182814, "epoch": 1088} {"train_loss": -11.095499038696289, "global_step": 182815, "epoch": 1088} {"train_loss": -11.14976978302002, "global_step": 182816, "epoch": 1088} {"train_loss": -11.14748764038086, "global_step": 182817, "epoch": 1088} {"train_loss": -11.188889503479004, "global_step": 182818, "epoch": 1088} {"train_loss": -11.278005599975586, "global_step": 182819, "epoch": 1088} {"train_loss": -11.25866413116455, "global_step": 182820, "epoch": 1088} {"train_loss": -11.34778881072998, "global_step": 182821, "epoch": 1088} {"train_loss": -11.317330360412598, "global_step": 182822, "epoch": 1088} {"train_loss": -11.172117233276367, "global_step": 182823, "epoch": 1088} {"train_loss": -11.268987655639648, "global_step": 182824, "epoch": 1088} {"train_loss": -11.329902648925781, "global_step": 182825, "epoch": 1088} {"train_loss": -11.361217498779297, "global_step": 182826, "epoch": 1088} {"train_loss": -11.359776496887207, "global_step": 182827, "epoch": 1088} {"train_loss": -11.398078918457031, "global_step": 182828, "epoch": 1088} {"train_loss": -11.454920768737793, "global_step": 182829, "epoch": 1088} {"train_loss": -11.229009628295898, "global_step": 182830, "epoch": 1088} {"train_loss": -11.503400802612305, "global_step": 182831, "epoch": 1088} {"train_loss": -11.365506172180176, "global_step": 182832, "epoch": 1088} {"train_loss": -11.4796142578125, "global_step": 182833, "epoch": 1088} {"train_loss": -11.487831115722656, "global_step": 182834, "epoch": 1088} {"train_loss": -11.402542114257812, "global_step": 182835, "epoch": 1088} {"train_loss": -11.371988296508789, "global_step": 182836, "epoch": 1088} {"train_loss": -11.333952903747559, "global_step": 182837, "epoch": 1088} {"train_loss": -11.403829574584961, "global_step": 182838, "epoch": 1088} {"train_loss": -11.458944320678711, "global_step": 182839, "epoch": 1088} {"train_loss": -11.403703689575195, "global_step": 182840, "epoch": 1088} {"train_loss": -11.477004051208496, "global_step": 182841, "epoch": 1088} {"train_loss": -11.203311920166016, "global_step": 182842, "epoch": 1088} {"train_loss": -11.594551086425781, "global_step": 182843, "epoch": 1088} {"train_loss": -10.76557731628418, "global_step": 182844, "epoch": 1088} {"train_loss": -11.274651527404785, "global_step": 182845, "epoch": 1088} {"train_loss": -11.544267654418945, "global_step": 182846, "epoch": 1088} {"train_loss": -10.983755111694336, "global_step": 182847, "epoch": 1088} {"train_loss": -10.84820556640625, "global_step": 182848, "epoch": 1088} {"train_loss": -11.475627899169922, "global_step": 182849, "epoch": 1088} {"train_loss": -11.051509857177734, "global_step": 182850, "epoch": 1088} {"train_loss": -11.227495193481445, "global_step": 182851, "epoch": 1088} {"train_loss": -11.06430435180664, "global_step": 182852, "epoch": 1088} {"train_loss": -11.598304748535156, "global_step": 182853, "epoch": 1088} {"train_loss": -10.848241806030273, "global_step": 182854, "epoch": 1088} {"train_loss": -10.83894157409668, "global_step": 182855, "epoch": 1088} {"train_loss": -11.123289108276367, "global_step": 182856, "epoch": 1088} {"train_loss": -11.023080825805664, "global_step": 182857, "epoch": 1088} {"train_loss": -11.245826721191406, "global_step": 182858, "epoch": 1088} {"train_loss": -11.078542709350586, "global_step": 182859, "epoch": 1088} {"train_loss": -10.357137680053711, "global_step": 182860, "epoch": 1088} {"train_loss": -11.277435302734375, "global_step": 182861, "epoch": 1088} {"train_loss": -10.940540313720703, "global_step": 182862, "epoch": 1088} {"train_loss": -10.743216514587402, "global_step": 182863, "epoch": 1088} {"train_loss": -11.166839599609375, "global_step": 182864, "epoch": 1088} {"train_loss": -10.351167678833008, "global_step": 182865, "epoch": 1088} {"train_loss": -10.844598770141602, "global_step": 182866, "epoch": 1088} {"train_loss": -11.031387329101562, "global_step": 182867, "epoch": 1088} {"train_loss": -11.06667423248291, "global_step": 182868, "epoch": 1088} {"train_loss": -11.088016510009766, "global_step": 182869, "epoch": 1088} {"train_loss": -11.133270263671875, "global_step": 182870, "epoch": 1088} {"train_loss": -10.966781616210938, "global_step": 182871, "epoch": 1088} {"train_loss": -11.047916412353516, "global_step": 182872, "epoch": 1088} {"train_loss": -11.42194938659668, "global_step": 182873, "epoch": 1088} {"train_loss": -11.24347972869873, "global_step": 182874, "epoch": 1088} {"train_loss": -11.175018310546875, "global_step": 182875, "epoch": 1088} {"train_loss": -11.133392333984375, "global_step": 182876, "epoch": 1088} {"train_loss": -11.30278205871582, "global_step": 182877, "epoch": 1088} {"train_loss": -11.289653778076172, "global_step": 182878, "epoch": 1088} {"train_loss": -11.253564834594727, "global_step": 182879, "epoch": 1088} {"train_loss": -11.503547668457031, "global_step": 182880, "epoch": 1088} {"train_loss": -11.331242561340332, "global_step": 182881, "epoch": 1088} {"train_loss": -11.249532699584961, "global_step": 182882, "epoch": 1088} {"train_loss": -11.475483894348145, "global_step": 182883, "epoch": 1088} {"train_loss": -11.11417007446289, "global_step": 182884, "epoch": 1088} {"train_loss": -11.238845825195312, "global_step": 182885, "epoch": 1088} {"train_loss": -11.085529327392578, "global_step": 182886, "epoch": 1088} {"train_loss": -11.122944831848145, "global_step": 182887, "epoch": 1088} {"train_loss": -11.000518798828125, "global_step": 182888, "epoch": 1088} {"train_loss": -11.409236907958984, "global_step": 182889, "epoch": 1088} {"train_loss": -11.239723205566406, "global_step": 182890, "epoch": 1088} {"train_loss": -11.389678001403809, "global_step": 182891, "epoch": 1088} {"train_loss": -11.380792617797852, "global_step": 182892, "epoch": 1088} {"train_loss": -10.978937149047852, "global_step": 182893, "epoch": 1088} {"train_loss": -11.34960651397705, "global_step": 182894, "epoch": 1088} {"train_loss": -11.163848876953125, "global_step": 182895, "epoch": 1088} {"train_loss": -10.772480010986328, "global_step": 182896, "epoch": 1088} {"train_loss": -11.336801528930664, "global_step": 182897, "epoch": 1088} {"train_loss": -10.846465110778809, "global_step": 182898, "epoch": 1088} {"train_loss": -11.100643157958984, "global_step": 182899, "epoch": 1088} {"train_loss": -10.766477584838867, "global_step": 182900, "epoch": 1088} {"train_loss": -11.336061477661133, "global_step": 182901, "epoch": 1088} {"train_loss": -10.859370231628418, "global_step": 182902, "epoch": 1088} {"train_loss": -10.947883605957031, "global_step": 182903, "epoch": 1088} {"train_loss": -11.434803009033203, "global_step": 182904, "epoch": 1088} {"train_loss": -10.174373626708984, "global_step": 182905, "epoch": 1088} {"train_loss": -10.959834098815918, "global_step": 182906, "epoch": 1088} {"train_loss": -10.922395706176758, "global_step": 182907, "epoch": 1088} {"train_loss": -11.01523208618164, "global_step": 182908, "epoch": 1088} {"train_loss": -11.068148612976074, "global_step": 182909, "epoch": 1088} {"train_loss": -10.99698257446289, "global_step": 182910, "epoch": 1088} {"train_loss": -11.179180145263672, "global_step": 182911, "epoch": 1088} {"train_loss": -10.787717819213867, "global_step": 182912, "epoch": 1088} {"train_loss": -10.940404891967773, "global_step": 182913, "epoch": 1088} {"train_loss": -11.167976379394531, "global_step": 182914, "epoch": 1088} {"train_loss": -11.001522064208984, "global_step": 182915, "epoch": 1088} {"train_loss": -11.232048034667969, "global_step": 182916, "epoch": 1088} {"train_loss": -10.6072998046875, "global_step": 182917, "epoch": 1088} {"train_loss": -10.264178276062012, "global_step": 182918, "epoch": 1088} {"train_loss": -11.489684104919434, "global_step": 182919, "epoch": 1088} {"train_loss": -10.743905067443848, "global_step": 182920, "epoch": 1088} {"train_loss": -11.138858795166016, "global_step": 182921, "epoch": 1088} {"train_loss": -10.617164611816406, "global_step": 182922, "epoch": 1088} {"train_loss": -11.030298233032227, "global_step": 182923, "epoch": 1088} {"train_loss": -11.14720344543457, "global_step": 182924, "epoch": 1088} {"train_loss": -10.955349922180176, "global_step": 182925, "epoch": 1088} {"train_loss": -11.275646209716797, "global_step": 182926, "epoch": 1088} {"train_loss": -11.138330459594727, "global_step": 182927, "epoch": 1088} {"train_loss": -11.304536819458008, "global_step": 182928, "epoch": 1088} {"train_loss": -11.096073150634766, "global_step": 182929, "epoch": 1088} {"train_loss": -11.124603271484375, "global_step": 182930, "epoch": 1088} {"train_loss": -11.160856246948242, "global_step": 182931, "epoch": 1088} {"train_loss": -11.227688789367676, "global_step": 182932, "epoch": 1088} {"train_loss": -11.3522310256958, "global_step": 182933, "epoch": 1088} {"train_loss": -11.042211532592773, "global_step": 182934, "epoch": 1088} {"train_loss": -11.172005653381348, "global_step": 182935, "epoch": 1088} {"train_loss": -11.310582160949707, "global_step": 182936, "epoch": 1088} {"train_loss": -11.282035827636719, "global_step": 182937, "epoch": 1088} {"train_loss": -11.088153839111328, "global_step": 182938, "epoch": 1088} {"train_loss": -11.242419242858887, "global_step": 182939, "epoch": 1088} {"train_loss": -11.033750534057617, "global_step": 182940, "epoch": 1088} {"train_loss": -11.292662620544434, "global_step": 182941, "epoch": 1088} {"train_loss": -11.437105178833008, "global_step": 182942, "epoch": 1088} {"train_loss": -11.311084747314453, "global_step": 182943, "epoch": 1088} {"train_loss": -11.443870544433594, "global_step": 182944, "epoch": 1088} {"train_loss": -11.652905464172363, "global_step": 182945, "epoch": 1088} {"train_loss": -11.3970947265625, "global_step": 182946, "epoch": 1088} {"train_loss": -11.150446891784668, "global_step": 182947, "epoch": 1088} {"train_loss": -11.507272720336914, "global_step": 182948, "epoch": 1088} {"train_loss": -11.356388092041016, "global_step": 182949, "epoch": 1088} {"train_loss": -11.3530912399292, "global_step": 182950, "epoch": 1088} {"train_loss": -11.144186996278309, "global_step": 182951, "epoch": 1088, "val_loss": 248689.9375} {"train_loss": -11.402073860168457, "global_step": 182952, "epoch": 1089} {"train_loss": -11.321252822875977, "global_step": 182953, "epoch": 1089} {"train_loss": -11.019003868103027, "global_step": 182954, "epoch": 1089} {"train_loss": -11.451936721801758, "global_step": 182955, "epoch": 1089} {"train_loss": -11.55765151977539, "global_step": 182956, "epoch": 1089} {"train_loss": -11.080891609191895, "global_step": 182957, "epoch": 1089} {"train_loss": -11.33587646484375, "global_step": 182958, "epoch": 1089} {"train_loss": -11.222858428955078, "global_step": 182959, "epoch": 1089} {"train_loss": -11.161134719848633, "global_step": 182960, "epoch": 1089} {"train_loss": -11.105705261230469, "global_step": 182961, "epoch": 1089} {"train_loss": -11.408621788024902, "global_step": 182962, "epoch": 1089} {"train_loss": -11.339353561401367, "global_step": 182963, "epoch": 1089} {"train_loss": -11.612894058227539, "global_step": 182964, "epoch": 1089} {"train_loss": -11.46520709991455, "global_step": 182965, "epoch": 1089} {"train_loss": -11.673151969909668, "global_step": 182966, "epoch": 1089} {"train_loss": -11.164461135864258, "global_step": 182967, "epoch": 1089} {"train_loss": -11.459501266479492, "global_step": 182968, "epoch": 1089} {"train_loss": -11.369548797607422, "global_step": 182969, "epoch": 1089} {"train_loss": -11.545621871948242, "global_step": 182970, "epoch": 1089} {"train_loss": -11.461944580078125, "global_step": 182971, "epoch": 1089} {"train_loss": -11.232860565185547, "global_step": 182972, "epoch": 1089} {"train_loss": -11.451363563537598, "global_step": 182973, "epoch": 1089} {"train_loss": -11.321475982666016, "global_step": 182974, "epoch": 1089} {"train_loss": -11.041767120361328, "global_step": 182975, "epoch": 1089} {"train_loss": -11.297531127929688, "global_step": 182976, "epoch": 1089} {"train_loss": -11.211551666259766, "global_step": 182977, "epoch": 1089} {"train_loss": -11.42977523803711, "global_step": 182978, "epoch": 1089} {"train_loss": -10.656106948852539, "global_step": 182979, "epoch": 1089} {"train_loss": -11.31816577911377, "global_step": 182980, "epoch": 1089} {"train_loss": -9.539926528930664, "global_step": 182981, "epoch": 1089} {"train_loss": -10.270544052124023, "global_step": 182982, "epoch": 1089} {"train_loss": -10.940023422241211, "global_step": 182983, "epoch": 1089} {"train_loss": -10.393390655517578, "global_step": 182984, "epoch": 1089} {"train_loss": -10.953792572021484, "global_step": 182985, "epoch": 1089} {"train_loss": -11.078550338745117, "global_step": 182986, "epoch": 1089} {"train_loss": -10.03129768371582, "global_step": 182987, "epoch": 1089} {"train_loss": -10.866907119750977, "global_step": 182988, "epoch": 1089} {"train_loss": -11.11463737487793, "global_step": 182989, "epoch": 1089} {"train_loss": -10.546201705932617, "global_step": 182990, "epoch": 1089} {"train_loss": -11.044439315795898, "global_step": 182991, "epoch": 1089} {"train_loss": -10.982206344604492, "global_step": 182992, "epoch": 1089} {"train_loss": -11.236438751220703, "global_step": 182993, "epoch": 1089} {"train_loss": -11.171356201171875, "global_step": 182994, "epoch": 1089} {"train_loss": -11.34678840637207, "global_step": 182995, "epoch": 1089} {"train_loss": -11.365541458129883, "global_step": 182996, "epoch": 1089} {"train_loss": -11.27861213684082, "global_step": 182997, "epoch": 1089} {"train_loss": -11.300819396972656, "global_step": 182998, "epoch": 1089} {"train_loss": -11.424066543579102, "global_step": 182999, "epoch": 1089} {"train_loss": -11.0703706741333, "global_step": 183000, "epoch": 1089} {"train_loss": -11.165718078613281, "global_step": 183001, "epoch": 1089} {"train_loss": -10.95730972290039, "global_step": 183002, "epoch": 1089} {"train_loss": -11.144697189331055, "global_step": 183003, "epoch": 1089} {"train_loss": -11.235438346862793, "global_step": 183004, "epoch": 1089} {"train_loss": -11.208287239074707, "global_step": 183005, "epoch": 1089} {"train_loss": -11.055871963500977, "global_step": 183006, "epoch": 1089} {"train_loss": -11.382619857788086, "global_step": 183007, "epoch": 1089} {"train_loss": -11.291556358337402, "global_step": 183008, "epoch": 1089} {"train_loss": -10.743841171264648, "global_step": 183009, "epoch": 1089} {"train_loss": -11.580794334411621, "global_step": 183010, "epoch": 1089} {"train_loss": -10.980835914611816, "global_step": 183011, "epoch": 1089} {"train_loss": -11.565437316894531, "global_step": 183012, "epoch": 1089} {"train_loss": -10.84866714477539, "global_step": 183013, "epoch": 1089} {"train_loss": -11.233260154724121, "global_step": 183014, "epoch": 1089} {"train_loss": -11.3487548828125, "global_step": 183015, "epoch": 1089} {"train_loss": -10.940131187438965, "global_step": 183016, "epoch": 1089} {"train_loss": -11.290136337280273, "global_step": 183017, "epoch": 1089} {"train_loss": -10.925390243530273, "global_step": 183018, "epoch": 1089} {"train_loss": -10.685993194580078, "global_step": 183019, "epoch": 1089} {"train_loss": -11.110490798950195, "global_step": 183020, "epoch": 1089} {"train_loss": -10.800738334655762, "global_step": 183021, "epoch": 1089} {"train_loss": -10.877883911132812, "global_step": 183022, "epoch": 1089} {"train_loss": -11.23837661743164, "global_step": 183023, "epoch": 1089} {"train_loss": -11.037084579467773, "global_step": 183024, "epoch": 1089} {"train_loss": -11.030818939208984, "global_step": 183025, "epoch": 1089} {"train_loss": -11.169422149658203, "global_step": 183026, "epoch": 1089} {"train_loss": -11.073482513427734, "global_step": 183027, "epoch": 1089} {"train_loss": -10.553659439086914, "global_step": 183028, "epoch": 1089} {"train_loss": -10.860591888427734, "global_step": 183029, "epoch": 1089} {"train_loss": -11.121460914611816, "global_step": 183030, "epoch": 1089} {"train_loss": -10.697050094604492, "global_step": 183031, "epoch": 1089} {"train_loss": -10.744830131530762, "global_step": 183032, "epoch": 1089} {"train_loss": -11.063911437988281, "global_step": 183033, "epoch": 1089} {"train_loss": -10.918681144714355, "global_step": 183034, "epoch": 1089} {"train_loss": -10.850641250610352, "global_step": 183035, "epoch": 1089} {"train_loss": -10.983718872070312, "global_step": 183036, "epoch": 1089} {"train_loss": -10.899690628051758, "global_step": 183037, "epoch": 1089} {"train_loss": -11.118782997131348, "global_step": 183038, "epoch": 1089} {"train_loss": -10.794961929321289, "global_step": 183039, "epoch": 1089} {"train_loss": -11.038915634155273, "global_step": 183040, "epoch": 1089} {"train_loss": -11.37156867980957, "global_step": 183041, "epoch": 1089} {"train_loss": -11.342324256896973, "global_step": 183042, "epoch": 1089} {"train_loss": -11.188040733337402, "global_step": 183043, "epoch": 1089} {"train_loss": -11.300735473632812, "global_step": 183044, "epoch": 1089} {"train_loss": -11.33942699432373, "global_step": 183045, "epoch": 1089} {"train_loss": -10.972715377807617, "global_step": 183046, "epoch": 1089} {"train_loss": -11.168500900268555, "global_step": 183047, "epoch": 1089} {"train_loss": -11.019769668579102, "global_step": 183048, "epoch": 1089} {"train_loss": -11.16047477722168, "global_step": 183049, "epoch": 1089} {"train_loss": -10.913267135620117, "global_step": 183050, "epoch": 1089} {"train_loss": -11.101462364196777, "global_step": 183051, "epoch": 1089} {"train_loss": -10.941709518432617, "global_step": 183052, "epoch": 1089} {"train_loss": -10.993966102600098, "global_step": 183053, "epoch": 1089} {"train_loss": -10.957559585571289, "global_step": 183054, "epoch": 1089} {"train_loss": -11.210565567016602, "global_step": 183055, "epoch": 1089} {"train_loss": -11.139350891113281, "global_step": 183056, "epoch": 1089} {"train_loss": -11.070196151733398, "global_step": 183057, "epoch": 1089} {"train_loss": -10.995165824890137, "global_step": 183058, "epoch": 1089} {"train_loss": -10.803495407104492, "global_step": 183059, "epoch": 1089} {"train_loss": -11.294044494628906, "global_step": 183060, "epoch": 1089} {"train_loss": -11.030267715454102, "global_step": 183061, "epoch": 1089} {"train_loss": -11.467103958129883, "global_step": 183062, "epoch": 1089} {"train_loss": -11.0364351272583, "global_step": 183063, "epoch": 1089} {"train_loss": -11.386312484741211, "global_step": 183064, "epoch": 1089} {"train_loss": -11.220503807067871, "global_step": 183065, "epoch": 1089} {"train_loss": -11.230358123779297, "global_step": 183066, "epoch": 1089} {"train_loss": -11.05721378326416, "global_step": 183067, "epoch": 1089} {"train_loss": -11.241720199584961, "global_step": 183068, "epoch": 1089} {"train_loss": -10.761314392089844, "global_step": 183069, "epoch": 1089} {"train_loss": -11.244882583618164, "global_step": 183070, "epoch": 1089} {"train_loss": -11.313079833984375, "global_step": 183071, "epoch": 1089} {"train_loss": -10.933645248413086, "global_step": 183072, "epoch": 1089} {"train_loss": -11.05322551727295, "global_step": 183073, "epoch": 1089} {"train_loss": -11.036205291748047, "global_step": 183074, "epoch": 1089} {"train_loss": -11.28523063659668, "global_step": 183075, "epoch": 1089} {"train_loss": -10.689815521240234, "global_step": 183076, "epoch": 1089} {"train_loss": -11.393354415893555, "global_step": 183077, "epoch": 1089} {"train_loss": -11.064994812011719, "global_step": 183078, "epoch": 1089} {"train_loss": -10.838590621948242, "global_step": 183079, "epoch": 1089} {"train_loss": -11.168376922607422, "global_step": 183080, "epoch": 1089} {"train_loss": -11.029094696044922, "global_step": 183081, "epoch": 1089} {"train_loss": -11.397468566894531, "global_step": 183082, "epoch": 1089} {"train_loss": -11.088726043701172, "global_step": 183083, "epoch": 1089} {"train_loss": -11.221549987792969, "global_step": 183084, "epoch": 1089} {"train_loss": -11.297786712646484, "global_step": 183085, "epoch": 1089} {"train_loss": -10.931255340576172, "global_step": 183086, "epoch": 1089} {"train_loss": -11.415338516235352, "global_step": 183087, "epoch": 1089} {"train_loss": -10.996137619018555, "global_step": 183088, "epoch": 1089} {"train_loss": -11.290483474731445, "global_step": 183089, "epoch": 1089} {"train_loss": -10.929905891418457, "global_step": 183090, "epoch": 1089} {"train_loss": -11.453476905822754, "global_step": 183091, "epoch": 1089} {"train_loss": -11.05456829071045, "global_step": 183092, "epoch": 1089} {"train_loss": -11.334226608276367, "global_step": 183093, "epoch": 1089} {"train_loss": -11.072711944580078, "global_step": 183094, "epoch": 1089} {"train_loss": -11.434783935546875, "global_step": 183095, "epoch": 1089} {"train_loss": -11.26443862915039, "global_step": 183096, "epoch": 1089} {"train_loss": -11.139436721801758, "global_step": 183097, "epoch": 1089} {"train_loss": -11.42910385131836, "global_step": 183098, "epoch": 1089} {"train_loss": -11.17986011505127, "global_step": 183099, "epoch": 1089} {"train_loss": -11.301514625549316, "global_step": 183100, "epoch": 1089} {"train_loss": -11.394768714904785, "global_step": 183101, "epoch": 1089} {"train_loss": -11.295701026916504, "global_step": 183102, "epoch": 1089} {"train_loss": -11.25594711303711, "global_step": 183103, "epoch": 1089} {"train_loss": -11.425128936767578, "global_step": 183104, "epoch": 1089} {"train_loss": -11.326614379882812, "global_step": 183105, "epoch": 1089} {"train_loss": -11.112607955932617, "global_step": 183106, "epoch": 1089} {"train_loss": -10.77359390258789, "global_step": 183107, "epoch": 1089} {"train_loss": -10.665960311889648, "global_step": 183108, "epoch": 1089} {"train_loss": -10.38557243347168, "global_step": 183109, "epoch": 1089} {"train_loss": -10.972681045532227, "global_step": 183110, "epoch": 1089} {"train_loss": -10.742483139038086, "global_step": 183111, "epoch": 1089} {"train_loss": -9.838432312011719, "global_step": 183112, "epoch": 1089} {"train_loss": -9.756351470947266, "global_step": 183113, "epoch": 1089} {"train_loss": -10.955936431884766, "global_step": 183114, "epoch": 1089} {"train_loss": -10.208490371704102, "global_step": 183115, "epoch": 1089} {"train_loss": -10.989554405212402, "global_step": 183116, "epoch": 1089} {"train_loss": -10.866693496704102, "global_step": 183117, "epoch": 1089} {"train_loss": -10.72117805480957, "global_step": 183118, "epoch": 1089} {"train_loss": -11.086145338558016, "global_step": 183119, "epoch": 1089, "val_loss": 247480.265625} {"train_loss": -10.230690002441406, "global_step": 183120, "epoch": 1090} {"train_loss": -11.132347106933594, "global_step": 183121, "epoch": 1090} {"train_loss": -10.706733703613281, "global_step": 183122, "epoch": 1090} {"train_loss": -11.238296508789062, "global_step": 183123, "epoch": 1090} {"train_loss": -10.901802062988281, "global_step": 183124, "epoch": 1090} {"train_loss": -10.905452728271484, "global_step": 183125, "epoch": 1090} {"train_loss": -10.837008476257324, "global_step": 183126, "epoch": 1090} {"train_loss": -11.187440872192383, "global_step": 183127, "epoch": 1090} {"train_loss": -10.621315002441406, "global_step": 183128, "epoch": 1090} {"train_loss": -11.108165740966797, "global_step": 183129, "epoch": 1090} {"train_loss": -10.706539154052734, "global_step": 183130, "epoch": 1090} {"train_loss": -10.81685733795166, "global_step": 183131, "epoch": 1090} {"train_loss": -10.663324356079102, "global_step": 183132, "epoch": 1090} {"train_loss": -10.846195220947266, "global_step": 183133, "epoch": 1090} {"train_loss": -11.336621284484863, "global_step": 183134, "epoch": 1090} {"train_loss": -10.668909072875977, "global_step": 183135, "epoch": 1090} {"train_loss": -10.863517761230469, "global_step": 183136, "epoch": 1090} {"train_loss": -10.855196952819824, "global_step": 183137, "epoch": 1090} {"train_loss": -10.975830078125, "global_step": 183138, "epoch": 1090} {"train_loss": -11.195913314819336, "global_step": 183139, "epoch": 1090} {"train_loss": -11.033855438232422, "global_step": 183140, "epoch": 1090} {"train_loss": -11.191034317016602, "global_step": 183141, "epoch": 1090} {"train_loss": -10.896674156188965, "global_step": 183142, "epoch": 1090} {"train_loss": -11.027740478515625, "global_step": 183143, "epoch": 1090} {"train_loss": -11.197637557983398, "global_step": 183144, "epoch": 1090} {"train_loss": -10.861637115478516, "global_step": 183145, "epoch": 1090} {"train_loss": -11.37728214263916, "global_step": 183146, "epoch": 1090} {"train_loss": -11.173055648803711, "global_step": 183147, "epoch": 1090} {"train_loss": -11.09016227722168, "global_step": 183148, "epoch": 1090} {"train_loss": -10.96927261352539, "global_step": 183149, "epoch": 1090} {"train_loss": -11.235672950744629, "global_step": 183150, "epoch": 1090} {"train_loss": -11.302907943725586, "global_step": 183151, "epoch": 1090} {"train_loss": -11.454570770263672, "global_step": 183152, "epoch": 1090} {"train_loss": -11.358814239501953, "global_step": 183153, "epoch": 1090} {"train_loss": -10.98459243774414, "global_step": 183154, "epoch": 1090} {"train_loss": -11.433633804321289, "global_step": 183155, "epoch": 1090} {"train_loss": -11.127786636352539, "global_step": 183156, "epoch": 1090} {"train_loss": -11.407644271850586, "global_step": 183157, "epoch": 1090} {"train_loss": -11.111982345581055, "global_step": 183158, "epoch": 1090} {"train_loss": -11.278495788574219, "global_step": 183159, "epoch": 1090} {"train_loss": -11.605951309204102, "global_step": 183160, "epoch": 1090} {"train_loss": -11.32588005065918, "global_step": 183161, "epoch": 1090} {"train_loss": -11.492903709411621, "global_step": 183162, "epoch": 1090} {"train_loss": -11.303387641906738, "global_step": 183163, "epoch": 1090} {"train_loss": -11.46150016784668, "global_step": 183164, "epoch": 1090} {"train_loss": -11.392915725708008, "global_step": 183165, "epoch": 1090} {"train_loss": -11.415374755859375, "global_step": 183166, "epoch": 1090} {"train_loss": -11.579687118530273, "global_step": 183167, "epoch": 1090} {"train_loss": -11.299917221069336, "global_step": 183168, "epoch": 1090} {"train_loss": -11.349431037902832, "global_step": 183169, "epoch": 1090} {"train_loss": -11.295616149902344, "global_step": 183170, "epoch": 1090} {"train_loss": -11.207279205322266, "global_step": 183171, "epoch": 1090} {"train_loss": -11.61052131652832, "global_step": 183172, "epoch": 1090} {"train_loss": -11.377378463745117, "global_step": 183173, "epoch": 1090} {"train_loss": -11.298795700073242, "global_step": 183174, "epoch": 1090} {"train_loss": -11.286680221557617, "global_step": 183175, "epoch": 1090} {"train_loss": -11.134162902832031, "global_step": 183176, "epoch": 1090} {"train_loss": -11.501819610595703, "global_step": 183177, "epoch": 1090} {"train_loss": -10.756027221679688, "global_step": 183178, "epoch": 1090} {"train_loss": -11.571237564086914, "global_step": 183179, "epoch": 1090} {"train_loss": -10.853462219238281, "global_step": 183180, "epoch": 1090} {"train_loss": -10.985617637634277, "global_step": 183181, "epoch": 1090} {"train_loss": -11.133843421936035, "global_step": 183182, "epoch": 1090} {"train_loss": -11.500192642211914, "global_step": 183183, "epoch": 1090} {"train_loss": -11.062779426574707, "global_step": 183184, "epoch": 1090} {"train_loss": -11.497858047485352, "global_step": 183185, "epoch": 1090} {"train_loss": -10.926487922668457, "global_step": 183186, "epoch": 1090} {"train_loss": -11.632869720458984, "global_step": 183187, "epoch": 1090} {"train_loss": -10.966304779052734, "global_step": 183188, "epoch": 1090} {"train_loss": -10.710543632507324, "global_step": 183189, "epoch": 1090} {"train_loss": -11.614784240722656, "global_step": 183190, "epoch": 1090} {"train_loss": -11.083518981933594, "global_step": 183191, "epoch": 1090} {"train_loss": -11.242228507995605, "global_step": 183192, "epoch": 1090} {"train_loss": -10.794797897338867, "global_step": 183193, "epoch": 1090} {"train_loss": -11.330699920654297, "global_step": 183194, "epoch": 1090} {"train_loss": -10.764183044433594, "global_step": 183195, "epoch": 1090} {"train_loss": -11.253409385681152, "global_step": 183196, "epoch": 1090} {"train_loss": -11.377084732055664, "global_step": 183197, "epoch": 1090} {"train_loss": -11.278711318969727, "global_step": 183198, "epoch": 1090} {"train_loss": -11.276473045349121, "global_step": 183199, "epoch": 1090} {"train_loss": -11.122330665588379, "global_step": 183200, "epoch": 1090} {"train_loss": -10.931310653686523, "global_step": 183201, "epoch": 1090} {"train_loss": -11.399450302124023, "global_step": 183202, "epoch": 1090} {"train_loss": -11.217512130737305, "global_step": 183203, "epoch": 1090} {"train_loss": -11.323911666870117, "global_step": 183204, "epoch": 1090} {"train_loss": -10.989609718322754, "global_step": 183205, "epoch": 1090} {"train_loss": -11.067915916442871, "global_step": 183206, "epoch": 1090} {"train_loss": -9.873644828796387, "global_step": 183207, "epoch": 1090} {"train_loss": -10.931793212890625, "global_step": 183208, "epoch": 1090} {"train_loss": -10.841480255126953, "global_step": 183209, "epoch": 1090} {"train_loss": -10.272882461547852, "global_step": 183210, "epoch": 1090} {"train_loss": -11.366426467895508, "global_step": 183211, "epoch": 1090} {"train_loss": -9.857065200805664, "global_step": 183212, "epoch": 1090} {"train_loss": -10.431816101074219, "global_step": 183213, "epoch": 1090} {"train_loss": -11.347465515136719, "global_step": 183214, "epoch": 1090} {"train_loss": -10.350393295288086, "global_step": 183215, "epoch": 1090} {"train_loss": -11.305169105529785, "global_step": 183216, "epoch": 1090} {"train_loss": -11.029034614562988, "global_step": 183217, "epoch": 1090} {"train_loss": -10.669672012329102, "global_step": 183218, "epoch": 1090} {"train_loss": -11.522028923034668, "global_step": 183219, "epoch": 1090} {"train_loss": -11.238981246948242, "global_step": 183220, "epoch": 1090} {"train_loss": -11.406938552856445, "global_step": 183221, "epoch": 1090} {"train_loss": -11.167499542236328, "global_step": 183222, "epoch": 1090} {"train_loss": -11.311161041259766, "global_step": 183223, "epoch": 1090} {"train_loss": -11.26660442352295, "global_step": 183224, "epoch": 1090} {"train_loss": -11.462892532348633, "global_step": 183225, "epoch": 1090} {"train_loss": -11.128776550292969, "global_step": 183226, "epoch": 1090} {"train_loss": -11.377124786376953, "global_step": 183227, "epoch": 1090} {"train_loss": -11.203365325927734, "global_step": 183228, "epoch": 1090} {"train_loss": -11.573506355285645, "global_step": 183229, "epoch": 1090} {"train_loss": -11.216806411743164, "global_step": 183230, "epoch": 1090} {"train_loss": -11.147289276123047, "global_step": 183231, "epoch": 1090} {"train_loss": -11.284782409667969, "global_step": 183232, "epoch": 1090} {"train_loss": -11.082429885864258, "global_step": 183233, "epoch": 1090} {"train_loss": -11.137207984924316, "global_step": 183234, "epoch": 1090} {"train_loss": -11.0, "global_step": 183235, "epoch": 1090} {"train_loss": -11.543877601623535, "global_step": 183236, "epoch": 1090} {"train_loss": -11.123623847961426, "global_step": 183237, "epoch": 1090} {"train_loss": -11.45063304901123, "global_step": 183238, "epoch": 1090} {"train_loss": -11.35114860534668, "global_step": 183239, "epoch": 1090} {"train_loss": -11.453472137451172, "global_step": 183240, "epoch": 1090} {"train_loss": -11.477241516113281, "global_step": 183241, "epoch": 1090} {"train_loss": -11.343888282775879, "global_step": 183242, "epoch": 1090} {"train_loss": -11.498948097229004, "global_step": 183243, "epoch": 1090} {"train_loss": -11.354103088378906, "global_step": 183244, "epoch": 1090} {"train_loss": -11.66784954071045, "global_step": 183245, "epoch": 1090} {"train_loss": -11.428934097290039, "global_step": 183246, "epoch": 1090} {"train_loss": -11.641555786132812, "global_step": 183247, "epoch": 1090} {"train_loss": -11.312469482421875, "global_step": 183248, "epoch": 1090} {"train_loss": -11.593502044677734, "global_step": 183249, "epoch": 1090} {"train_loss": -11.683012008666992, "global_step": 183250, "epoch": 1090} {"train_loss": -11.475842475891113, "global_step": 183251, "epoch": 1090} {"train_loss": -11.656728744506836, "global_step": 183252, "epoch": 1090} {"train_loss": -11.411113739013672, "global_step": 183253, "epoch": 1090} {"train_loss": -11.385686874389648, "global_step": 183254, "epoch": 1090} {"train_loss": -11.5118408203125, "global_step": 183255, "epoch": 1090} {"train_loss": -11.286542892456055, "global_step": 183256, "epoch": 1090} {"train_loss": -11.54796028137207, "global_step": 183257, "epoch": 1090} {"train_loss": -11.236700057983398, "global_step": 183258, "epoch": 1090} {"train_loss": -11.379261016845703, "global_step": 183259, "epoch": 1090} {"train_loss": -11.280909538269043, "global_step": 183260, "epoch": 1090} {"train_loss": -11.238191604614258, "global_step": 183261, "epoch": 1090} {"train_loss": -11.077737808227539, "global_step": 183262, "epoch": 1090} {"train_loss": -11.537736892700195, "global_step": 183263, "epoch": 1090} {"train_loss": -11.33864974975586, "global_step": 183264, "epoch": 1090} {"train_loss": -11.327571868896484, "global_step": 183265, "epoch": 1090} {"train_loss": -11.427356719970703, "global_step": 183266, "epoch": 1090} {"train_loss": -11.140510559082031, "global_step": 183267, "epoch": 1090} {"train_loss": -11.350879669189453, "global_step": 183268, "epoch": 1090} {"train_loss": -11.454273223876953, "global_step": 183269, "epoch": 1090} {"train_loss": -11.286453247070312, "global_step": 183270, "epoch": 1090} {"train_loss": -10.971271514892578, "global_step": 183271, "epoch": 1090} {"train_loss": -11.253554344177246, "global_step": 183272, "epoch": 1090} {"train_loss": -10.99599838256836, "global_step": 183273, "epoch": 1090} {"train_loss": -11.094134330749512, "global_step": 183274, "epoch": 1090} {"train_loss": -11.058506965637207, "global_step": 183275, "epoch": 1090} {"train_loss": -10.810842514038086, "global_step": 183276, "epoch": 1090} {"train_loss": -11.158434867858887, "global_step": 183277, "epoch": 1090} {"train_loss": -10.791837692260742, "global_step": 183278, "epoch": 1090} {"train_loss": -10.370586395263672, "global_step": 183279, "epoch": 1090} {"train_loss": -10.56365966796875, "global_step": 183280, "epoch": 1090} {"train_loss": -11.39044189453125, "global_step": 183281, "epoch": 1090} {"train_loss": -9.925058364868164, "global_step": 183282, "epoch": 1090} {"train_loss": -10.36267375946045, "global_step": 183283, "epoch": 1090} {"train_loss": -11.233732223510742, "global_step": 183284, "epoch": 1090} {"train_loss": -10.904409408569336, "global_step": 183285, "epoch": 1090} {"train_loss": -10.633578300476074, "global_step": 183286, "epoch": 1090} {"train_loss": -11.152413589613777, "global_step": 183287, "epoch": 1090, "val_loss": 242302.75, "train_action_mse_error": 1.288682460784912} {"train_loss": -10.728014945983887, "global_step": 183288, "epoch": 1091} {"train_loss": -10.646273612976074, "global_step": 183289, "epoch": 1091} {"train_loss": -10.686003684997559, "global_step": 183290, "epoch": 1091} {"train_loss": -10.454303741455078, "global_step": 183291, "epoch": 1091} {"train_loss": -10.384208679199219, "global_step": 183292, "epoch": 1091} {"train_loss": -10.795513153076172, "global_step": 183293, "epoch": 1091} {"train_loss": -10.78029727935791, "global_step": 183294, "epoch": 1091} {"train_loss": -10.461125373840332, "global_step": 183295, "epoch": 1091} {"train_loss": -10.898490905761719, "global_step": 183296, "epoch": 1091} {"train_loss": -9.949943542480469, "global_step": 183297, "epoch": 1091} {"train_loss": -10.253908157348633, "global_step": 183298, "epoch": 1091} {"train_loss": -10.475532531738281, "global_step": 183299, "epoch": 1091} {"train_loss": -10.5440034866333, "global_step": 183300, "epoch": 1091} {"train_loss": -10.263134002685547, "global_step": 183301, "epoch": 1091} {"train_loss": -10.427170753479004, "global_step": 183302, "epoch": 1091} {"train_loss": -10.529037475585938, "global_step": 183303, "epoch": 1091} {"train_loss": -10.753181457519531, "global_step": 183304, "epoch": 1091} {"train_loss": -11.15222454071045, "global_step": 183305, "epoch": 1091} {"train_loss": -10.649858474731445, "global_step": 183306, "epoch": 1091} {"train_loss": -11.053065299987793, "global_step": 183307, "epoch": 1091} {"train_loss": -10.995244979858398, "global_step": 183308, "epoch": 1091} {"train_loss": -10.628812789916992, "global_step": 183309, "epoch": 1091} {"train_loss": -11.19973373413086, "global_step": 183310, "epoch": 1091} {"train_loss": -11.0082426071167, "global_step": 183311, "epoch": 1091} {"train_loss": -11.171892166137695, "global_step": 183312, "epoch": 1091} {"train_loss": -11.030357360839844, "global_step": 183313, "epoch": 1091} {"train_loss": -11.000556945800781, "global_step": 183314, "epoch": 1091} {"train_loss": -11.072275161743164, "global_step": 183315, "epoch": 1091} {"train_loss": -11.161368370056152, "global_step": 183316, "epoch": 1091} {"train_loss": -11.261242866516113, "global_step": 183317, "epoch": 1091} {"train_loss": -11.123739242553711, "global_step": 183318, "epoch": 1091} {"train_loss": -11.19797134399414, "global_step": 183319, "epoch": 1091} {"train_loss": -11.116981506347656, "global_step": 183320, "epoch": 1091} {"train_loss": -11.38744831085205, "global_step": 183321, "epoch": 1091} {"train_loss": -11.481515884399414, "global_step": 183322, "epoch": 1091} {"train_loss": -11.219314575195312, "global_step": 183323, "epoch": 1091} {"train_loss": -11.167926788330078, "global_step": 183324, "epoch": 1091} {"train_loss": -11.364557266235352, "global_step": 183325, "epoch": 1091} {"train_loss": -11.232888221740723, "global_step": 183326, "epoch": 1091} {"train_loss": -11.440481185913086, "global_step": 183327, "epoch": 1091} {"train_loss": -10.933059692382812, "global_step": 183328, "epoch": 1091} {"train_loss": -11.136083602905273, "global_step": 183329, "epoch": 1091} {"train_loss": -11.214385986328125, "global_step": 183330, "epoch": 1091} {"train_loss": -11.23336410522461, "global_step": 183331, "epoch": 1091} {"train_loss": -10.976493835449219, "global_step": 183332, "epoch": 1091} {"train_loss": -11.029569625854492, "global_step": 183333, "epoch": 1091} {"train_loss": -11.049225807189941, "global_step": 183334, "epoch": 1091} {"train_loss": -11.045291900634766, "global_step": 183335, "epoch": 1091} {"train_loss": -11.261306762695312, "global_step": 183336, "epoch": 1091} {"train_loss": -11.296089172363281, "global_step": 183337, "epoch": 1091} {"train_loss": -11.376348495483398, "global_step": 183338, "epoch": 1091} {"train_loss": -11.406063079833984, "global_step": 183339, "epoch": 1091} {"train_loss": -11.002408027648926, "global_step": 183340, "epoch": 1091} {"train_loss": -11.258994102478027, "global_step": 183341, "epoch": 1091} {"train_loss": -11.419777870178223, "global_step": 183342, "epoch": 1091} {"train_loss": -10.80347728729248, "global_step": 183343, "epoch": 1091} {"train_loss": -11.496343612670898, "global_step": 183344, "epoch": 1091} {"train_loss": -11.026083946228027, "global_step": 183345, "epoch": 1091} {"train_loss": -11.296870231628418, "global_step": 183346, "epoch": 1091} {"train_loss": -11.32534122467041, "global_step": 183347, "epoch": 1091} {"train_loss": -11.22111988067627, "global_step": 183348, "epoch": 1091} {"train_loss": -11.208090782165527, "global_step": 183349, "epoch": 1091} {"train_loss": -11.399792671203613, "global_step": 183350, "epoch": 1091} {"train_loss": -11.357240676879883, "global_step": 183351, "epoch": 1091} {"train_loss": -11.411365509033203, "global_step": 183352, "epoch": 1091} {"train_loss": -11.401641845703125, "global_step": 183353, "epoch": 1091} {"train_loss": -11.421880722045898, "global_step": 183354, "epoch": 1091} {"train_loss": -11.122447967529297, "global_step": 183355, "epoch": 1091} {"train_loss": -10.944357872009277, "global_step": 183356, "epoch": 1091} {"train_loss": -11.663151741027832, "global_step": 183357, "epoch": 1091} {"train_loss": -11.16649341583252, "global_step": 183358, "epoch": 1091} {"train_loss": -11.3203763961792, "global_step": 183359, "epoch": 1091} {"train_loss": -11.06879997253418, "global_step": 183360, "epoch": 1091} {"train_loss": -11.233278274536133, "global_step": 183361, "epoch": 1091} {"train_loss": -11.219789505004883, "global_step": 183362, "epoch": 1091} {"train_loss": -10.985057830810547, "global_step": 183363, "epoch": 1091} {"train_loss": -11.408170700073242, "global_step": 183364, "epoch": 1091} {"train_loss": -11.413670539855957, "global_step": 183365, "epoch": 1091} {"train_loss": -11.23398208618164, "global_step": 183366, "epoch": 1091} {"train_loss": -11.12201976776123, "global_step": 183367, "epoch": 1091} {"train_loss": -11.350740432739258, "global_step": 183368, "epoch": 1091} {"train_loss": -11.000990867614746, "global_step": 183369, "epoch": 1091} {"train_loss": -11.139154434204102, "global_step": 183370, "epoch": 1091} {"train_loss": -11.437593460083008, "global_step": 183371, "epoch": 1091} {"train_loss": -11.212946891784668, "global_step": 183372, "epoch": 1091} {"train_loss": -11.213815689086914, "global_step": 183373, "epoch": 1091} {"train_loss": -11.57507038116455, "global_step": 183374, "epoch": 1091} {"train_loss": -11.237065315246582, "global_step": 183375, "epoch": 1091} {"train_loss": -11.430217742919922, "global_step": 183376, "epoch": 1091} {"train_loss": -11.459465026855469, "global_step": 183377, "epoch": 1091} {"train_loss": -11.594688415527344, "global_step": 183378, "epoch": 1091} {"train_loss": -11.44650650024414, "global_step": 183379, "epoch": 1091} {"train_loss": -11.241371154785156, "global_step": 183380, "epoch": 1091} {"train_loss": -10.969829559326172, "global_step": 183381, "epoch": 1091} {"train_loss": -11.427783966064453, "global_step": 183382, "epoch": 1091} {"train_loss": -11.529918670654297, "global_step": 183383, "epoch": 1091} {"train_loss": -11.335214614868164, "global_step": 183384, "epoch": 1091} {"train_loss": -11.50123405456543, "global_step": 183385, "epoch": 1091} {"train_loss": -11.457588195800781, "global_step": 183386, "epoch": 1091} {"train_loss": -11.438822746276855, "global_step": 183387, "epoch": 1091} {"train_loss": -11.527044296264648, "global_step": 183388, "epoch": 1091} {"train_loss": -11.420151710510254, "global_step": 183389, "epoch": 1091} {"train_loss": -11.583351135253906, "global_step": 183390, "epoch": 1091} {"train_loss": -11.541757583618164, "global_step": 183391, "epoch": 1091} {"train_loss": -11.53157901763916, "global_step": 183392, "epoch": 1091} {"train_loss": -11.589584350585938, "global_step": 183393, "epoch": 1091} {"train_loss": -11.385032653808594, "global_step": 183394, "epoch": 1091} {"train_loss": -11.206958770751953, "global_step": 183395, "epoch": 1091} {"train_loss": -11.446893692016602, "global_step": 183396, "epoch": 1091} {"train_loss": -11.611702919006348, "global_step": 183397, "epoch": 1091} {"train_loss": -11.629190444946289, "global_step": 183398, "epoch": 1091} {"train_loss": -11.51022720336914, "global_step": 183399, "epoch": 1091} {"train_loss": -11.297647476196289, "global_step": 183400, "epoch": 1091} {"train_loss": -11.654420852661133, "global_step": 183401, "epoch": 1091} {"train_loss": -11.364155769348145, "global_step": 183402, "epoch": 1091} {"train_loss": -11.406208038330078, "global_step": 183403, "epoch": 1091} {"train_loss": -11.378886222839355, "global_step": 183404, "epoch": 1091} {"train_loss": -11.442567825317383, "global_step": 183405, "epoch": 1091} {"train_loss": -11.368995666503906, "global_step": 183406, "epoch": 1091} {"train_loss": -11.074396133422852, "global_step": 183407, "epoch": 1091} {"train_loss": -9.941417694091797, "global_step": 183408, "epoch": 1091} {"train_loss": -10.10228157043457, "global_step": 183409, "epoch": 1091} {"train_loss": -11.223340034484863, "global_step": 183410, "epoch": 1091} {"train_loss": -11.340295791625977, "global_step": 183411, "epoch": 1091} {"train_loss": -10.137514114379883, "global_step": 183412, "epoch": 1091} {"train_loss": -11.039875984191895, "global_step": 183413, "epoch": 1091} {"train_loss": -10.099897384643555, "global_step": 183414, "epoch": 1091} {"train_loss": -10.150262832641602, "global_step": 183415, "epoch": 1091} {"train_loss": -11.009571075439453, "global_step": 183416, "epoch": 1091} {"train_loss": -10.728751182556152, "global_step": 183417, "epoch": 1091} {"train_loss": -11.103045463562012, "global_step": 183418, "epoch": 1091} {"train_loss": -10.788667678833008, "global_step": 183419, "epoch": 1091} {"train_loss": -10.999507904052734, "global_step": 183420, "epoch": 1091} {"train_loss": -10.643536567687988, "global_step": 183421, "epoch": 1091} {"train_loss": -11.182437896728516, "global_step": 183422, "epoch": 1091} {"train_loss": -10.581413269042969, "global_step": 183423, "epoch": 1091} {"train_loss": -11.019981384277344, "global_step": 183424, "epoch": 1091} {"train_loss": -10.749252319335938, "global_step": 183425, "epoch": 1091} {"train_loss": -10.244024276733398, "global_step": 183426, "epoch": 1091} {"train_loss": -10.250450134277344, "global_step": 183427, "epoch": 1091} {"train_loss": -9.703242301940918, "global_step": 183428, "epoch": 1091} {"train_loss": -10.260917663574219, "global_step": 183429, "epoch": 1091} {"train_loss": -9.656084060668945, "global_step": 183430, "epoch": 1091} {"train_loss": -9.789012908935547, "global_step": 183431, "epoch": 1091} {"train_loss": -10.159443855285645, "global_step": 183432, "epoch": 1091} {"train_loss": -7.785741329193115, "global_step": 183433, "epoch": 1091} {"train_loss": -11.230304718017578, "global_step": 183434, "epoch": 1091} {"train_loss": -8.639227867126465, "global_step": 183435, "epoch": 1091} {"train_loss": -10.89260196685791, "global_step": 183436, "epoch": 1091} {"train_loss": -9.43832778930664, "global_step": 183437, "epoch": 1091} {"train_loss": -10.755826950073242, "global_step": 183438, "epoch": 1091} {"train_loss": -9.596445083618164, "global_step": 183439, "epoch": 1091} {"train_loss": -10.943107604980469, "global_step": 183440, "epoch": 1091} {"train_loss": -9.936174392700195, "global_step": 183441, "epoch": 1091} {"train_loss": -10.911136627197266, "global_step": 183442, "epoch": 1091} {"train_loss": -9.829389572143555, "global_step": 183443, "epoch": 1091} {"train_loss": -10.560176849365234, "global_step": 183444, "epoch": 1091} {"train_loss": -10.294379234313965, "global_step": 183445, "epoch": 1091} {"train_loss": -10.38009262084961, "global_step": 183446, "epoch": 1091} {"train_loss": -10.614049911499023, "global_step": 183447, "epoch": 1091} {"train_loss": -10.667251586914062, "global_step": 183448, "epoch": 1091} {"train_loss": -11.033435821533203, "global_step": 183449, "epoch": 1091} {"train_loss": -10.888357162475586, "global_step": 183450, "epoch": 1091} {"train_loss": -10.93532943725586, "global_step": 183451, "epoch": 1091} {"train_loss": -10.886577606201172, "global_step": 183452, "epoch": 1091} {"train_loss": -10.941679954528809, "global_step": 183453, "epoch": 1091} {"train_loss": -10.978543281555176, "global_step": 183454, "epoch": 1091} {"train_loss": -10.964329393137069, "global_step": 183455, "epoch": 1091, "val_loss": 240727.46875} {"train_loss": -10.824482917785645, "global_step": 183456, "epoch": 1092} {"train_loss": -11.213472366333008, "global_step": 183457, "epoch": 1092} {"train_loss": -10.992738723754883, "global_step": 183458, "epoch": 1092} {"train_loss": -11.166463851928711, "global_step": 183459, "epoch": 1092} {"train_loss": -11.098743438720703, "global_step": 183460, "epoch": 1092} {"train_loss": -11.275450706481934, "global_step": 183461, "epoch": 1092} {"train_loss": -11.131442070007324, "global_step": 183462, "epoch": 1092} {"train_loss": -11.244524002075195, "global_step": 183463, "epoch": 1092} {"train_loss": -11.24832534790039, "global_step": 183464, "epoch": 1092} {"train_loss": -11.224038124084473, "global_step": 183465, "epoch": 1092} {"train_loss": -11.1128511428833, "global_step": 183466, "epoch": 1092} {"train_loss": -11.300394058227539, "global_step": 183467, "epoch": 1092} {"train_loss": -11.231773376464844, "global_step": 183468, "epoch": 1092} {"train_loss": -11.066149711608887, "global_step": 183469, "epoch": 1092} {"train_loss": -11.092425346374512, "global_step": 183470, "epoch": 1092} {"train_loss": -11.017416000366211, "global_step": 183471, "epoch": 1092} {"train_loss": -11.26097297668457, "global_step": 183472, "epoch": 1092} {"train_loss": -11.458473205566406, "global_step": 183473, "epoch": 1092} {"train_loss": -11.50156021118164, "global_step": 183474, "epoch": 1092} {"train_loss": -11.523509979248047, "global_step": 183475, "epoch": 1092} {"train_loss": -11.379112243652344, "global_step": 183476, "epoch": 1092} {"train_loss": -11.36745548248291, "global_step": 183477, "epoch": 1092} {"train_loss": -11.303722381591797, "global_step": 183478, "epoch": 1092} {"train_loss": -11.543622970581055, "global_step": 183479, "epoch": 1092} {"train_loss": -11.22324275970459, "global_step": 183480, "epoch": 1092} {"train_loss": -11.538277626037598, "global_step": 183481, "epoch": 1092} {"train_loss": -11.213401794433594, "global_step": 183482, "epoch": 1092} {"train_loss": -11.47757339477539, "global_step": 183483, "epoch": 1092} {"train_loss": -11.374351501464844, "global_step": 183484, "epoch": 1092} {"train_loss": -11.32302474975586, "global_step": 183485, "epoch": 1092} {"train_loss": -11.359503746032715, "global_step": 183486, "epoch": 1092} {"train_loss": -11.385053634643555, "global_step": 183487, "epoch": 1092} {"train_loss": -11.163690567016602, "global_step": 183488, "epoch": 1092} {"train_loss": -11.476127624511719, "global_step": 183489, "epoch": 1092} {"train_loss": -11.20926284790039, "global_step": 183490, "epoch": 1092} {"train_loss": -11.27995491027832, "global_step": 183491, "epoch": 1092} {"train_loss": -11.446133613586426, "global_step": 183492, "epoch": 1092} {"train_loss": -11.305370330810547, "global_step": 183493, "epoch": 1092} {"train_loss": -11.356554985046387, "global_step": 183494, "epoch": 1092} {"train_loss": -11.540484428405762, "global_step": 183495, "epoch": 1092} {"train_loss": -11.323263168334961, "global_step": 183496, "epoch": 1092} {"train_loss": -10.88848876953125, "global_step": 183497, "epoch": 1092} {"train_loss": -11.449089050292969, "global_step": 183498, "epoch": 1092} {"train_loss": -11.273136138916016, "global_step": 183499, "epoch": 1092} {"train_loss": -11.101653099060059, "global_step": 183500, "epoch": 1092} {"train_loss": -10.671772003173828, "global_step": 183501, "epoch": 1092} {"train_loss": -11.021537780761719, "global_step": 183502, "epoch": 1092} {"train_loss": -10.903854370117188, "global_step": 183503, "epoch": 1092} {"train_loss": -11.160978317260742, "global_step": 183504, "epoch": 1092} {"train_loss": -10.728269577026367, "global_step": 183505, "epoch": 1092} {"train_loss": -11.387031555175781, "global_step": 183506, "epoch": 1092} {"train_loss": -11.137539863586426, "global_step": 183507, "epoch": 1092} {"train_loss": -11.182221412658691, "global_step": 183508, "epoch": 1092} {"train_loss": -11.207345962524414, "global_step": 183509, "epoch": 1092} {"train_loss": -10.514219284057617, "global_step": 183510, "epoch": 1092} {"train_loss": -10.373588562011719, "global_step": 183511, "epoch": 1092} {"train_loss": -11.076560974121094, "global_step": 183512, "epoch": 1092} {"train_loss": -10.563945770263672, "global_step": 183513, "epoch": 1092} {"train_loss": -10.471678733825684, "global_step": 183514, "epoch": 1092} {"train_loss": -10.621658325195312, "global_step": 183515, "epoch": 1092} {"train_loss": -9.004995346069336, "global_step": 183516, "epoch": 1092} {"train_loss": -9.711788177490234, "global_step": 183517, "epoch": 1092} {"train_loss": -10.263118743896484, "global_step": 183518, "epoch": 1092} {"train_loss": -9.857105255126953, "global_step": 183519, "epoch": 1092} {"train_loss": -9.998113632202148, "global_step": 183520, "epoch": 1092} {"train_loss": -10.675785064697266, "global_step": 183521, "epoch": 1092} {"train_loss": -10.082647323608398, "global_step": 183522, "epoch": 1092} {"train_loss": -10.267206192016602, "global_step": 183523, "epoch": 1092} {"train_loss": -10.573074340820312, "global_step": 183524, "epoch": 1092} {"train_loss": -10.362314224243164, "global_step": 183525, "epoch": 1092} {"train_loss": -10.087320327758789, "global_step": 183526, "epoch": 1092} {"train_loss": -10.773709297180176, "global_step": 183527, "epoch": 1092} {"train_loss": -10.379671096801758, "global_step": 183528, "epoch": 1092} {"train_loss": -11.120954513549805, "global_step": 183529, "epoch": 1092} {"train_loss": -10.26512336730957, "global_step": 183530, "epoch": 1092} {"train_loss": -10.92586612701416, "global_step": 183531, "epoch": 1092} {"train_loss": -10.704791069030762, "global_step": 183532, "epoch": 1092} {"train_loss": -11.031316757202148, "global_step": 183533, "epoch": 1092} {"train_loss": -10.892072677612305, "global_step": 183534, "epoch": 1092} {"train_loss": -10.80176830291748, "global_step": 183535, "epoch": 1092} {"train_loss": -10.876699447631836, "global_step": 183536, "epoch": 1092} {"train_loss": -10.833663940429688, "global_step": 183537, "epoch": 1092} {"train_loss": -10.85954475402832, "global_step": 183538, "epoch": 1092} {"train_loss": -11.081007957458496, "global_step": 183539, "epoch": 1092} {"train_loss": -11.013527870178223, "global_step": 183540, "epoch": 1092} {"train_loss": -10.512227058410645, "global_step": 183541, "epoch": 1092} {"train_loss": -10.831047058105469, "global_step": 183542, "epoch": 1092} {"train_loss": -10.608869552612305, "global_step": 183543, "epoch": 1092} {"train_loss": -10.542013168334961, "global_step": 183544, "epoch": 1092} {"train_loss": -11.04765796661377, "global_step": 183545, "epoch": 1092} {"train_loss": -10.667335510253906, "global_step": 183546, "epoch": 1092} {"train_loss": -10.952844619750977, "global_step": 183547, "epoch": 1092} {"train_loss": -10.949019432067871, "global_step": 183548, "epoch": 1092} {"train_loss": -11.12264633178711, "global_step": 183549, "epoch": 1092} {"train_loss": -11.121315002441406, "global_step": 183550, "epoch": 1092} {"train_loss": -11.077816009521484, "global_step": 183551, "epoch": 1092} {"train_loss": -10.983259201049805, "global_step": 183552, "epoch": 1092} {"train_loss": -11.193471908569336, "global_step": 183553, "epoch": 1092} {"train_loss": -10.826690673828125, "global_step": 183554, "epoch": 1092} {"train_loss": -11.179550170898438, "global_step": 183555, "epoch": 1092} {"train_loss": -11.2004976272583, "global_step": 183556, "epoch": 1092} {"train_loss": -11.070566177368164, "global_step": 183557, "epoch": 1092} {"train_loss": -11.232124328613281, "global_step": 183558, "epoch": 1092} {"train_loss": -11.356443405151367, "global_step": 183559, "epoch": 1092} {"train_loss": -11.057535171508789, "global_step": 183560, "epoch": 1092} {"train_loss": -11.282569885253906, "global_step": 183561, "epoch": 1092} {"train_loss": -11.380766868591309, "global_step": 183562, "epoch": 1092} {"train_loss": -11.277475357055664, "global_step": 183563, "epoch": 1092} {"train_loss": -11.241945266723633, "global_step": 183564, "epoch": 1092} {"train_loss": -11.199346542358398, "global_step": 183565, "epoch": 1092} {"train_loss": -11.164705276489258, "global_step": 183566, "epoch": 1092} {"train_loss": -11.457775115966797, "global_step": 183567, "epoch": 1092} {"train_loss": -11.091259956359863, "global_step": 183568, "epoch": 1092} {"train_loss": -11.448336601257324, "global_step": 183569, "epoch": 1092} {"train_loss": -11.58416748046875, "global_step": 183570, "epoch": 1092} {"train_loss": -11.51707649230957, "global_step": 183571, "epoch": 1092} {"train_loss": -11.375484466552734, "global_step": 183572, "epoch": 1092} {"train_loss": -11.399950981140137, "global_step": 183573, "epoch": 1092} {"train_loss": -11.475068092346191, "global_step": 183574, "epoch": 1092} {"train_loss": -11.432090759277344, "global_step": 183575, "epoch": 1092} {"train_loss": -11.596986770629883, "global_step": 183576, "epoch": 1092} {"train_loss": -11.535451889038086, "global_step": 183577, "epoch": 1092} {"train_loss": -11.500787734985352, "global_step": 183578, "epoch": 1092} {"train_loss": -11.579748153686523, "global_step": 183579, "epoch": 1092} {"train_loss": -11.545705795288086, "global_step": 183580, "epoch": 1092} {"train_loss": -11.369261741638184, "global_step": 183581, "epoch": 1092} {"train_loss": -11.681520462036133, "global_step": 183582, "epoch": 1092} {"train_loss": -11.556339263916016, "global_step": 183583, "epoch": 1092} {"train_loss": -11.683713912963867, "global_step": 183584, "epoch": 1092} {"train_loss": -11.241348266601562, "global_step": 183585, "epoch": 1092} {"train_loss": -11.755147933959961, "global_step": 183586, "epoch": 1092} {"train_loss": -11.478260040283203, "global_step": 183587, "epoch": 1092} {"train_loss": -11.678552627563477, "global_step": 183588, "epoch": 1092} {"train_loss": -11.223712921142578, "global_step": 183589, "epoch": 1092} {"train_loss": -11.111382484436035, "global_step": 183590, "epoch": 1092} {"train_loss": -11.6480131149292, "global_step": 183591, "epoch": 1092} {"train_loss": -11.38100814819336, "global_step": 183592, "epoch": 1092} {"train_loss": -11.45816421508789, "global_step": 183593, "epoch": 1092} {"train_loss": -11.098289489746094, "global_step": 183594, "epoch": 1092} {"train_loss": -11.307351112365723, "global_step": 183595, "epoch": 1092} {"train_loss": -10.514261245727539, "global_step": 183596, "epoch": 1092} {"train_loss": -10.029909133911133, "global_step": 183597, "epoch": 1092} {"train_loss": -11.284093856811523, "global_step": 183598, "epoch": 1092} {"train_loss": -10.522294044494629, "global_step": 183599, "epoch": 1092} {"train_loss": -10.824132919311523, "global_step": 183600, "epoch": 1092} {"train_loss": -11.253393173217773, "global_step": 183601, "epoch": 1092} {"train_loss": -11.030242919921875, "global_step": 183602, "epoch": 1092} {"train_loss": -10.911211013793945, "global_step": 183603, "epoch": 1092} {"train_loss": -11.237835884094238, "global_step": 183604, "epoch": 1092} {"train_loss": -10.864347457885742, "global_step": 183605, "epoch": 1092} {"train_loss": -10.98579216003418, "global_step": 183606, "epoch": 1092} {"train_loss": -11.498539924621582, "global_step": 183607, "epoch": 1092} {"train_loss": -10.868906021118164, "global_step": 183608, "epoch": 1092} {"train_loss": -11.460390090942383, "global_step": 183609, "epoch": 1092} {"train_loss": -10.94760799407959, "global_step": 183610, "epoch": 1092} {"train_loss": -10.9888916015625, "global_step": 183611, "epoch": 1092} {"train_loss": -11.033976554870605, "global_step": 183612, "epoch": 1092} {"train_loss": -10.790999412536621, "global_step": 183613, "epoch": 1092} {"train_loss": -11.098160743713379, "global_step": 183614, "epoch": 1092} {"train_loss": -10.302373886108398, "global_step": 183615, "epoch": 1092} {"train_loss": -10.854211807250977, "global_step": 183616, "epoch": 1092} {"train_loss": -10.665096282958984, "global_step": 183617, "epoch": 1092} {"train_loss": -10.879467010498047, "global_step": 183618, "epoch": 1092} {"train_loss": -10.292083740234375, "global_step": 183619, "epoch": 1092} {"train_loss": -10.168580055236816, "global_step": 183620, "epoch": 1092} {"train_loss": -10.669083595275879, "global_step": 183621, "epoch": 1092} {"train_loss": -10.404841423034668, "global_step": 183622, "epoch": 1092} {"train_loss": -11.041599381537665, "global_step": 183623, "epoch": 1092, "val_loss": 244851.046875} {"train_loss": -11.038448333740234, "global_step": 183624, "epoch": 1093} {"train_loss": -10.901723861694336, "global_step": 183625, "epoch": 1093} {"train_loss": -11.159125328063965, "global_step": 183626, "epoch": 1093} {"train_loss": -11.098382949829102, "global_step": 183627, "epoch": 1093} {"train_loss": -10.92756462097168, "global_step": 183628, "epoch": 1093} {"train_loss": -11.208797454833984, "global_step": 183629, "epoch": 1093} {"train_loss": -10.633604049682617, "global_step": 183630, "epoch": 1093} {"train_loss": -11.229406356811523, "global_step": 183631, "epoch": 1093} {"train_loss": -10.714847564697266, "global_step": 183632, "epoch": 1093} {"train_loss": -11.38822078704834, "global_step": 183633, "epoch": 1093} {"train_loss": -10.765878677368164, "global_step": 183634, "epoch": 1093} {"train_loss": -11.091667175292969, "global_step": 183635, "epoch": 1093} {"train_loss": -10.566886901855469, "global_step": 183636, "epoch": 1093} {"train_loss": -10.807546615600586, "global_step": 183637, "epoch": 1093} {"train_loss": -11.096132278442383, "global_step": 183638, "epoch": 1093} {"train_loss": -10.926130294799805, "global_step": 183639, "epoch": 1093} {"train_loss": -10.773286819458008, "global_step": 183640, "epoch": 1093} {"train_loss": -11.193830490112305, "global_step": 183641, "epoch": 1093} {"train_loss": -10.947153091430664, "global_step": 183642, "epoch": 1093} {"train_loss": -10.774456024169922, "global_step": 183643, "epoch": 1093} {"train_loss": -11.290716171264648, "global_step": 183644, "epoch": 1093} {"train_loss": -10.558164596557617, "global_step": 183645, "epoch": 1093} {"train_loss": -11.294422149658203, "global_step": 183646, "epoch": 1093} {"train_loss": -10.88269329071045, "global_step": 183647, "epoch": 1093} {"train_loss": -11.189664840698242, "global_step": 183648, "epoch": 1093} {"train_loss": -11.03179931640625, "global_step": 183649, "epoch": 1093} {"train_loss": -11.157109260559082, "global_step": 183650, "epoch": 1093} {"train_loss": -10.746824264526367, "global_step": 183651, "epoch": 1093} {"train_loss": -11.28306770324707, "global_step": 183652, "epoch": 1093} {"train_loss": -10.726369857788086, "global_step": 183653, "epoch": 1093} {"train_loss": -10.518867492675781, "global_step": 183654, "epoch": 1093} {"train_loss": -11.264698028564453, "global_step": 183655, "epoch": 1093} {"train_loss": -10.29275894165039, "global_step": 183656, "epoch": 1093} {"train_loss": -11.046104431152344, "global_step": 183657, "epoch": 1093} {"train_loss": -10.987081527709961, "global_step": 183658, "epoch": 1093} {"train_loss": -11.284268379211426, "global_step": 183659, "epoch": 1093} {"train_loss": -11.078864097595215, "global_step": 183660, "epoch": 1093} {"train_loss": -11.07088565826416, "global_step": 183661, "epoch": 1093} {"train_loss": -11.297672271728516, "global_step": 183662, "epoch": 1093} {"train_loss": -11.262821197509766, "global_step": 183663, "epoch": 1093} {"train_loss": -11.141469955444336, "global_step": 183664, "epoch": 1093} {"train_loss": -11.428482055664062, "global_step": 183665, "epoch": 1093} {"train_loss": -11.076318740844727, "global_step": 183666, "epoch": 1093} {"train_loss": -11.353178977966309, "global_step": 183667, "epoch": 1093} {"train_loss": -10.880388259887695, "global_step": 183668, "epoch": 1093} {"train_loss": -11.052413940429688, "global_step": 183669, "epoch": 1093} {"train_loss": -11.147722244262695, "global_step": 183670, "epoch": 1093} {"train_loss": -11.141386032104492, "global_step": 183671, "epoch": 1093} {"train_loss": -11.155954360961914, "global_step": 183672, "epoch": 1093} {"train_loss": -10.986315727233887, "global_step": 183673, "epoch": 1093} {"train_loss": -11.138635635375977, "global_step": 183674, "epoch": 1093} {"train_loss": -11.492067337036133, "global_step": 183675, "epoch": 1093} {"train_loss": -11.057223320007324, "global_step": 183676, "epoch": 1093} {"train_loss": -11.185810089111328, "global_step": 183677, "epoch": 1093} {"train_loss": -11.05062484741211, "global_step": 183678, "epoch": 1093} {"train_loss": -11.18018913269043, "global_step": 183679, "epoch": 1093} {"train_loss": -11.14688491821289, "global_step": 183680, "epoch": 1093} {"train_loss": -11.077670097351074, "global_step": 183681, "epoch": 1093} {"train_loss": -11.303678512573242, "global_step": 183682, "epoch": 1093} {"train_loss": -11.090885162353516, "global_step": 183683, "epoch": 1093} {"train_loss": -11.244735717773438, "global_step": 183684, "epoch": 1093} {"train_loss": -11.259984970092773, "global_step": 183685, "epoch": 1093} {"train_loss": -11.27151107788086, "global_step": 183686, "epoch": 1093} {"train_loss": -11.169784545898438, "global_step": 183687, "epoch": 1093} {"train_loss": -11.479292869567871, "global_step": 183688, "epoch": 1093} {"train_loss": -11.277379989624023, "global_step": 183689, "epoch": 1093} {"train_loss": -11.572980880737305, "global_step": 183690, "epoch": 1093} {"train_loss": -11.121644973754883, "global_step": 183691, "epoch": 1093} {"train_loss": -11.654006958007812, "global_step": 183692, "epoch": 1093} {"train_loss": -11.101760864257812, "global_step": 183693, "epoch": 1093} {"train_loss": -11.554411888122559, "global_step": 183694, "epoch": 1093} {"train_loss": -11.280679702758789, "global_step": 183695, "epoch": 1093} {"train_loss": -11.381295204162598, "global_step": 183696, "epoch": 1093} {"train_loss": -11.410896301269531, "global_step": 183697, "epoch": 1093} {"train_loss": -11.440810203552246, "global_step": 183698, "epoch": 1093} {"train_loss": -11.628494262695312, "global_step": 183699, "epoch": 1093} {"train_loss": -11.017894744873047, "global_step": 183700, "epoch": 1093} {"train_loss": -10.947729110717773, "global_step": 183701, "epoch": 1093} {"train_loss": -11.500818252563477, "global_step": 183702, "epoch": 1093} {"train_loss": -10.904966354370117, "global_step": 183703, "epoch": 1093} {"train_loss": -11.021129608154297, "global_step": 183704, "epoch": 1093} {"train_loss": -11.281951904296875, "global_step": 183705, "epoch": 1093} {"train_loss": -11.554370880126953, "global_step": 183706, "epoch": 1093} {"train_loss": -11.133798599243164, "global_step": 183707, "epoch": 1093} {"train_loss": -11.396586418151855, "global_step": 183708, "epoch": 1093} {"train_loss": -11.025355339050293, "global_step": 183709, "epoch": 1093} {"train_loss": -11.343679428100586, "global_step": 183710, "epoch": 1093} {"train_loss": -11.20543098449707, "global_step": 183711, "epoch": 1093} {"train_loss": -11.436845779418945, "global_step": 183712, "epoch": 1093} {"train_loss": -11.308029174804688, "global_step": 183713, "epoch": 1093} {"train_loss": -10.994187355041504, "global_step": 183714, "epoch": 1093} {"train_loss": -11.450955390930176, "global_step": 183715, "epoch": 1093} {"train_loss": -11.22751235961914, "global_step": 183716, "epoch": 1093} {"train_loss": -11.449588775634766, "global_step": 183717, "epoch": 1093} {"train_loss": -10.919898986816406, "global_step": 183718, "epoch": 1093} {"train_loss": -11.220654487609863, "global_step": 183719, "epoch": 1093} {"train_loss": -11.197502136230469, "global_step": 183720, "epoch": 1093} {"train_loss": -11.100311279296875, "global_step": 183721, "epoch": 1093} {"train_loss": -10.841646194458008, "global_step": 183722, "epoch": 1093} {"train_loss": -11.106161117553711, "global_step": 183723, "epoch": 1093} {"train_loss": -10.968990325927734, "global_step": 183724, "epoch": 1093} {"train_loss": -10.986528396606445, "global_step": 183725, "epoch": 1093} {"train_loss": -11.102821350097656, "global_step": 183726, "epoch": 1093} {"train_loss": -11.037496566772461, "global_step": 183727, "epoch": 1093} {"train_loss": -11.171306610107422, "global_step": 183728, "epoch": 1093} {"train_loss": -11.203094482421875, "global_step": 183729, "epoch": 1093} {"train_loss": -11.314678192138672, "global_step": 183730, "epoch": 1093} {"train_loss": -11.199822425842285, "global_step": 183731, "epoch": 1093} {"train_loss": -11.44718074798584, "global_step": 183732, "epoch": 1093} {"train_loss": -11.502412796020508, "global_step": 183733, "epoch": 1093} {"train_loss": -11.423828125, "global_step": 183734, "epoch": 1093} {"train_loss": -11.364704132080078, "global_step": 183735, "epoch": 1093} {"train_loss": -11.303768157958984, "global_step": 183736, "epoch": 1093} {"train_loss": -11.292749404907227, "global_step": 183737, "epoch": 1093} {"train_loss": -11.085683822631836, "global_step": 183738, "epoch": 1093} {"train_loss": -10.900636672973633, "global_step": 183739, "epoch": 1093} {"train_loss": -11.399173736572266, "global_step": 183740, "epoch": 1093} {"train_loss": -11.336849212646484, "global_step": 183741, "epoch": 1093} {"train_loss": -11.278202056884766, "global_step": 183742, "epoch": 1093} {"train_loss": -10.938733100891113, "global_step": 183743, "epoch": 1093} {"train_loss": -11.18612289428711, "global_step": 183744, "epoch": 1093} {"train_loss": -10.577369689941406, "global_step": 183745, "epoch": 1093} {"train_loss": -10.928752899169922, "global_step": 183746, "epoch": 1093} {"train_loss": -11.096328735351562, "global_step": 183747, "epoch": 1093} {"train_loss": -11.059152603149414, "global_step": 183748, "epoch": 1093} {"train_loss": -10.840866088867188, "global_step": 183749, "epoch": 1093} {"train_loss": -11.099321365356445, "global_step": 183750, "epoch": 1093} {"train_loss": -11.103340148925781, "global_step": 183751, "epoch": 1093} {"train_loss": -10.494903564453125, "global_step": 183752, "epoch": 1093} {"train_loss": -10.79879379272461, "global_step": 183753, "epoch": 1093} {"train_loss": -11.139165878295898, "global_step": 183754, "epoch": 1093} {"train_loss": -10.12141227722168, "global_step": 183755, "epoch": 1093} {"train_loss": -10.65143871307373, "global_step": 183756, "epoch": 1093} {"train_loss": -9.36690902709961, "global_step": 183757, "epoch": 1093} {"train_loss": -10.049842834472656, "global_step": 183758, "epoch": 1093} {"train_loss": -10.895054817199707, "global_step": 183759, "epoch": 1093} {"train_loss": -9.713817596435547, "global_step": 183760, "epoch": 1093} {"train_loss": -11.142471313476562, "global_step": 183761, "epoch": 1093} {"train_loss": -9.962522506713867, "global_step": 183762, "epoch": 1093} {"train_loss": -11.327136993408203, "global_step": 183763, "epoch": 1093} {"train_loss": -10.38129997253418, "global_step": 183764, "epoch": 1093} {"train_loss": -10.878607749938965, "global_step": 183765, "epoch": 1093} {"train_loss": -10.639405250549316, "global_step": 183766, "epoch": 1093} {"train_loss": -11.11738395690918, "global_step": 183767, "epoch": 1093} {"train_loss": -11.212818145751953, "global_step": 183768, "epoch": 1093} {"train_loss": -11.215728759765625, "global_step": 183769, "epoch": 1093} {"train_loss": -11.023750305175781, "global_step": 183770, "epoch": 1093} {"train_loss": -11.373908996582031, "global_step": 183771, "epoch": 1093} {"train_loss": -11.20595932006836, "global_step": 183772, "epoch": 1093} {"train_loss": -10.941337585449219, "global_step": 183773, "epoch": 1093} {"train_loss": -11.18471622467041, "global_step": 183774, "epoch": 1093} {"train_loss": -11.174018859863281, "global_step": 183775, "epoch": 1093} {"train_loss": -11.081647872924805, "global_step": 183776, "epoch": 1093} {"train_loss": -11.328371047973633, "global_step": 183777, "epoch": 1093} {"train_loss": -11.010063171386719, "global_step": 183778, "epoch": 1093} {"train_loss": -10.943439483642578, "global_step": 183779, "epoch": 1093} {"train_loss": -11.055912017822266, "global_step": 183780, "epoch": 1093} {"train_loss": -10.807260513305664, "global_step": 183781, "epoch": 1093} {"train_loss": -11.10575008392334, "global_step": 183782, "epoch": 1093} {"train_loss": -11.099287033081055, "global_step": 183783, "epoch": 1093} {"train_loss": -11.390941619873047, "global_step": 183784, "epoch": 1093} {"train_loss": -10.850500106811523, "global_step": 183785, "epoch": 1093} {"train_loss": -11.18088150024414, "global_step": 183786, "epoch": 1093} {"train_loss": -10.751399993896484, "global_step": 183787, "epoch": 1093} {"train_loss": -10.823945999145508, "global_step": 183788, "epoch": 1093} {"train_loss": -11.29018783569336, "global_step": 183789, "epoch": 1093} {"train_loss": -11.004119873046875, "global_step": 183790, "epoch": 1093} {"train_loss": -11.072915185065497, "global_step": 183791, "epoch": 1093, "val_loss": 247082.78125} {"train_loss": -10.685735702514648, "global_step": 183792, "epoch": 1094} {"train_loss": -11.279129981994629, "global_step": 183793, "epoch": 1094} {"train_loss": -11.324636459350586, "global_step": 183794, "epoch": 1094} {"train_loss": -11.261545181274414, "global_step": 183795, "epoch": 1094} {"train_loss": -11.33204460144043, "global_step": 183796, "epoch": 1094} {"train_loss": -11.191566467285156, "global_step": 183797, "epoch": 1094} {"train_loss": -11.393841743469238, "global_step": 183798, "epoch": 1094} {"train_loss": -11.042610168457031, "global_step": 183799, "epoch": 1094} {"train_loss": -11.223062515258789, "global_step": 183800, "epoch": 1094} {"train_loss": -10.917570114135742, "global_step": 183801, "epoch": 1094} {"train_loss": -10.55157470703125, "global_step": 183802, "epoch": 1094} {"train_loss": -11.422175407409668, "global_step": 183803, "epoch": 1094} {"train_loss": -10.802518844604492, "global_step": 183804, "epoch": 1094} {"train_loss": -11.390073776245117, "global_step": 183805, "epoch": 1094} {"train_loss": -10.591880798339844, "global_step": 183806, "epoch": 1094} {"train_loss": -11.302692413330078, "global_step": 183807, "epoch": 1094} {"train_loss": -10.920822143554688, "global_step": 183808, "epoch": 1094} {"train_loss": -11.113027572631836, "global_step": 183809, "epoch": 1094} {"train_loss": -11.15298080444336, "global_step": 183810, "epoch": 1094} {"train_loss": -11.061441421508789, "global_step": 183811, "epoch": 1094} {"train_loss": -11.306106567382812, "global_step": 183812, "epoch": 1094} {"train_loss": -11.048140525817871, "global_step": 183813, "epoch": 1094} {"train_loss": -10.980316162109375, "global_step": 183814, "epoch": 1094} {"train_loss": -11.362788200378418, "global_step": 183815, "epoch": 1094} {"train_loss": -10.882339477539062, "global_step": 183816, "epoch": 1094} {"train_loss": -11.173778533935547, "global_step": 183817, "epoch": 1094} {"train_loss": -10.630703926086426, "global_step": 183818, "epoch": 1094} {"train_loss": -10.78561019897461, "global_step": 183819, "epoch": 1094} {"train_loss": -11.050993919372559, "global_step": 183820, "epoch": 1094} {"train_loss": -10.662425994873047, "global_step": 183821, "epoch": 1094} {"train_loss": -11.007823944091797, "global_step": 183822, "epoch": 1094} {"train_loss": -10.425658226013184, "global_step": 183823, "epoch": 1094} {"train_loss": -10.82563304901123, "global_step": 183824, "epoch": 1094} {"train_loss": -10.512325286865234, "global_step": 183825, "epoch": 1094} {"train_loss": -11.298612594604492, "global_step": 183826, "epoch": 1094} {"train_loss": -10.729669570922852, "global_step": 183827, "epoch": 1094} {"train_loss": -11.238046646118164, "global_step": 183828, "epoch": 1094} {"train_loss": -10.864879608154297, "global_step": 183829, "epoch": 1094} {"train_loss": -11.098224639892578, "global_step": 183830, "epoch": 1094} {"train_loss": -10.633305549621582, "global_step": 183831, "epoch": 1094} {"train_loss": -10.966179847717285, "global_step": 183832, "epoch": 1094} {"train_loss": -10.87314224243164, "global_step": 183833, "epoch": 1094} {"train_loss": -11.068836212158203, "global_step": 183834, "epoch": 1094} {"train_loss": -11.224111557006836, "global_step": 183835, "epoch": 1094} {"train_loss": -10.823896408081055, "global_step": 183836, "epoch": 1094} {"train_loss": -11.176849365234375, "global_step": 183837, "epoch": 1094} {"train_loss": -10.996908187866211, "global_step": 183838, "epoch": 1094} {"train_loss": -11.388456344604492, "global_step": 183839, "epoch": 1094} {"train_loss": -10.765583992004395, "global_step": 183840, "epoch": 1094} {"train_loss": -11.416633605957031, "global_step": 183841, "epoch": 1094} {"train_loss": -10.76274299621582, "global_step": 183842, "epoch": 1094} {"train_loss": -11.572192192077637, "global_step": 183843, "epoch": 1094} {"train_loss": -11.07363224029541, "global_step": 183844, "epoch": 1094} {"train_loss": -11.538458824157715, "global_step": 183845, "epoch": 1094} {"train_loss": -11.194036483764648, "global_step": 183846, "epoch": 1094} {"train_loss": -11.344799041748047, "global_step": 183847, "epoch": 1094} {"train_loss": -11.198934555053711, "global_step": 183848, "epoch": 1094} {"train_loss": -11.422359466552734, "global_step": 183849, "epoch": 1094} {"train_loss": -11.315058708190918, "global_step": 183850, "epoch": 1094} {"train_loss": -11.59719467163086, "global_step": 183851, "epoch": 1094} {"train_loss": -11.301000595092773, "global_step": 183852, "epoch": 1094} {"train_loss": -11.78603744506836, "global_step": 183853, "epoch": 1094} {"train_loss": -11.338345527648926, "global_step": 183854, "epoch": 1094} {"train_loss": -11.318621635437012, "global_step": 183855, "epoch": 1094} {"train_loss": -11.26400089263916, "global_step": 183856, "epoch": 1094} {"train_loss": -11.458511352539062, "global_step": 183857, "epoch": 1094} {"train_loss": -11.254390716552734, "global_step": 183858, "epoch": 1094} {"train_loss": -11.323793411254883, "global_step": 183859, "epoch": 1094} {"train_loss": -11.122047424316406, "global_step": 183860, "epoch": 1094} {"train_loss": -11.415521621704102, "global_step": 183861, "epoch": 1094} {"train_loss": -11.281058311462402, "global_step": 183862, "epoch": 1094} {"train_loss": -11.456056594848633, "global_step": 183863, "epoch": 1094} {"train_loss": -11.434053421020508, "global_step": 183864, "epoch": 1094} {"train_loss": -11.71327018737793, "global_step": 183865, "epoch": 1094} {"train_loss": -11.53938102722168, "global_step": 183866, "epoch": 1094} {"train_loss": -11.525392532348633, "global_step": 183867, "epoch": 1094} {"train_loss": -11.655044555664062, "global_step": 183868, "epoch": 1094} {"train_loss": -11.562503814697266, "global_step": 183869, "epoch": 1094} {"train_loss": -11.503938674926758, "global_step": 183870, "epoch": 1094} {"train_loss": -11.341421127319336, "global_step": 183871, "epoch": 1094} {"train_loss": -11.61410903930664, "global_step": 183872, "epoch": 1094} {"train_loss": -11.301748275756836, "global_step": 183873, "epoch": 1094} {"train_loss": -11.48923397064209, "global_step": 183874, "epoch": 1094} {"train_loss": -11.747913360595703, "global_step": 183875, "epoch": 1094} {"train_loss": -11.3134765625, "global_step": 183876, "epoch": 1094} {"train_loss": -11.403076171875, "global_step": 183877, "epoch": 1094} {"train_loss": -11.367488861083984, "global_step": 183878, "epoch": 1094} {"train_loss": -10.993885040283203, "global_step": 183879, "epoch": 1094} {"train_loss": -11.094192504882812, "global_step": 183880, "epoch": 1094} {"train_loss": -10.962282180786133, "global_step": 183881, "epoch": 1094} {"train_loss": -11.408477783203125, "global_step": 183882, "epoch": 1094} {"train_loss": -11.22946548461914, "global_step": 183883, "epoch": 1094} {"train_loss": -11.286322593688965, "global_step": 183884, "epoch": 1094} {"train_loss": -11.643119812011719, "global_step": 183885, "epoch": 1094} {"train_loss": -11.388008117675781, "global_step": 183886, "epoch": 1094} {"train_loss": -11.13215160369873, "global_step": 183887, "epoch": 1094} {"train_loss": -11.084295272827148, "global_step": 183888, "epoch": 1094} {"train_loss": -10.864130020141602, "global_step": 183889, "epoch": 1094} {"train_loss": -10.83603286743164, "global_step": 183890, "epoch": 1094} {"train_loss": -10.948616981506348, "global_step": 183891, "epoch": 1094} {"train_loss": -10.978414535522461, "global_step": 183892, "epoch": 1094} {"train_loss": -9.744556427001953, "global_step": 183893, "epoch": 1094} {"train_loss": -10.950398445129395, "global_step": 183894, "epoch": 1094} {"train_loss": -10.262094497680664, "global_step": 183895, "epoch": 1094} {"train_loss": -10.672648429870605, "global_step": 183896, "epoch": 1094} {"train_loss": -10.123571395874023, "global_step": 183897, "epoch": 1094} {"train_loss": -11.038142204284668, "global_step": 183898, "epoch": 1094} {"train_loss": -10.5978422164917, "global_step": 183899, "epoch": 1094} {"train_loss": -10.823369979858398, "global_step": 183900, "epoch": 1094} {"train_loss": -10.464197158813477, "global_step": 183901, "epoch": 1094} {"train_loss": -10.520818710327148, "global_step": 183902, "epoch": 1094} {"train_loss": -10.719115257263184, "global_step": 183903, "epoch": 1094} {"train_loss": -10.313121795654297, "global_step": 183904, "epoch": 1094} {"train_loss": -11.184645652770996, "global_step": 183905, "epoch": 1094} {"train_loss": -10.342752456665039, "global_step": 183906, "epoch": 1094} {"train_loss": -11.123347282409668, "global_step": 183907, "epoch": 1094} {"train_loss": -10.212478637695312, "global_step": 183908, "epoch": 1094} {"train_loss": -10.431405067443848, "global_step": 183909, "epoch": 1094} {"train_loss": -10.647305488586426, "global_step": 183910, "epoch": 1094} {"train_loss": -10.509474754333496, "global_step": 183911, "epoch": 1094} {"train_loss": -10.949996948242188, "global_step": 183912, "epoch": 1094} {"train_loss": -10.53823471069336, "global_step": 183913, "epoch": 1094} {"train_loss": -10.931724548339844, "global_step": 183914, "epoch": 1094} {"train_loss": -10.547635078430176, "global_step": 183915, "epoch": 1094} {"train_loss": -10.296684265136719, "global_step": 183916, "epoch": 1094} {"train_loss": -10.896418571472168, "global_step": 183917, "epoch": 1094} {"train_loss": -10.555107116699219, "global_step": 183918, "epoch": 1094} {"train_loss": -11.038788795471191, "global_step": 183919, "epoch": 1094} {"train_loss": -10.468244552612305, "global_step": 183920, "epoch": 1094} {"train_loss": -11.202560424804688, "global_step": 183921, "epoch": 1094} {"train_loss": -10.302709579467773, "global_step": 183922, "epoch": 1094} {"train_loss": -11.008695602416992, "global_step": 183923, "epoch": 1094} {"train_loss": -10.611921310424805, "global_step": 183924, "epoch": 1094} {"train_loss": -10.884170532226562, "global_step": 183925, "epoch": 1094} {"train_loss": -10.539502143859863, "global_step": 183926, "epoch": 1094} {"train_loss": -11.074355125427246, "global_step": 183927, "epoch": 1094} {"train_loss": -10.90184211730957, "global_step": 183928, "epoch": 1094} {"train_loss": -11.043669700622559, "global_step": 183929, "epoch": 1094} {"train_loss": -10.97861099243164, "global_step": 183930, "epoch": 1094} {"train_loss": -11.164697647094727, "global_step": 183931, "epoch": 1094} {"train_loss": -11.058988571166992, "global_step": 183932, "epoch": 1094} {"train_loss": -11.128878593444824, "global_step": 183933, "epoch": 1094} {"train_loss": -11.050026893615723, "global_step": 183934, "epoch": 1094} {"train_loss": -11.178443908691406, "global_step": 183935, "epoch": 1094} {"train_loss": -11.359453201293945, "global_step": 183936, "epoch": 1094} {"train_loss": -11.031661987304688, "global_step": 183937, "epoch": 1094} {"train_loss": -11.301977157592773, "global_step": 183938, "epoch": 1094} {"train_loss": -11.131990432739258, "global_step": 183939, "epoch": 1094} {"train_loss": -11.053153991699219, "global_step": 183940, "epoch": 1094} {"train_loss": -11.147298812866211, "global_step": 183941, "epoch": 1094} {"train_loss": -10.964258193969727, "global_step": 183942, "epoch": 1094} {"train_loss": -11.351676940917969, "global_step": 183943, "epoch": 1094} {"train_loss": -11.200197219848633, "global_step": 183944, "epoch": 1094} {"train_loss": -11.477091789245605, "global_step": 183945, "epoch": 1094} {"train_loss": -11.403900146484375, "global_step": 183946, "epoch": 1094} {"train_loss": -11.157955169677734, "global_step": 183947, "epoch": 1094} {"train_loss": -11.438821792602539, "global_step": 183948, "epoch": 1094} {"train_loss": -11.287946701049805, "global_step": 183949, "epoch": 1094} {"train_loss": -11.394047737121582, "global_step": 183950, "epoch": 1094} {"train_loss": -11.284912109375, "global_step": 183951, "epoch": 1094} {"train_loss": -11.304473876953125, "global_step": 183952, "epoch": 1094} {"train_loss": -11.508459091186523, "global_step": 183953, "epoch": 1094} {"train_loss": -11.319703102111816, "global_step": 183954, "epoch": 1094} {"train_loss": -11.438982009887695, "global_step": 183955, "epoch": 1094} {"train_loss": -11.340357780456543, "global_step": 183956, "epoch": 1094} {"train_loss": -11.557669639587402, "global_step": 183957, "epoch": 1094} {"train_loss": -11.398696899414062, "global_step": 183958, "epoch": 1094} {"train_loss": -11.079131830306281, "global_step": 183959, "epoch": 1094, "val_loss": 248434.515625} {"train_loss": -11.487252235412598, "global_step": 183960, "epoch": 1095} {"train_loss": -11.328161239624023, "global_step": 183961, "epoch": 1095} {"train_loss": -11.484981536865234, "global_step": 183962, "epoch": 1095} {"train_loss": -11.401604652404785, "global_step": 183963, "epoch": 1095} {"train_loss": -11.147223472595215, "global_step": 183964, "epoch": 1095} {"train_loss": -11.72102165222168, "global_step": 183965, "epoch": 1095} {"train_loss": -11.363582611083984, "global_step": 183966, "epoch": 1095} {"train_loss": -11.47606086730957, "global_step": 183967, "epoch": 1095} {"train_loss": -11.257973670959473, "global_step": 183968, "epoch": 1095} {"train_loss": -11.591798782348633, "global_step": 183969, "epoch": 1095} {"train_loss": -11.470638275146484, "global_step": 183970, "epoch": 1095} {"train_loss": -11.3328218460083, "global_step": 183971, "epoch": 1095} {"train_loss": -11.58034610748291, "global_step": 183972, "epoch": 1095} {"train_loss": -11.429438591003418, "global_step": 183973, "epoch": 1095} {"train_loss": -11.436727523803711, "global_step": 183974, "epoch": 1095} {"train_loss": -11.420509338378906, "global_step": 183975, "epoch": 1095} {"train_loss": -11.59035873413086, "global_step": 183976, "epoch": 1095} {"train_loss": -11.21896743774414, "global_step": 183977, "epoch": 1095} {"train_loss": -11.48548698425293, "global_step": 183978, "epoch": 1095} {"train_loss": -10.957457542419434, "global_step": 183979, "epoch": 1095} {"train_loss": -11.358030319213867, "global_step": 183980, "epoch": 1095} {"train_loss": -10.918254852294922, "global_step": 183981, "epoch": 1095} {"train_loss": -11.313848495483398, "global_step": 183982, "epoch": 1095} {"train_loss": -11.501813888549805, "global_step": 183983, "epoch": 1095} {"train_loss": -10.823348045349121, "global_step": 183984, "epoch": 1095} {"train_loss": -10.545894622802734, "global_step": 183985, "epoch": 1095} {"train_loss": -11.524642944335938, "global_step": 183986, "epoch": 1095} {"train_loss": -9.871371269226074, "global_step": 183987, "epoch": 1095} {"train_loss": -10.428466796875, "global_step": 183988, "epoch": 1095} {"train_loss": -11.41066837310791, "global_step": 183989, "epoch": 1095} {"train_loss": -10.160093307495117, "global_step": 183990, "epoch": 1095} {"train_loss": -10.346311569213867, "global_step": 183991, "epoch": 1095} {"train_loss": -11.22236442565918, "global_step": 183992, "epoch": 1095} {"train_loss": -10.817622184753418, "global_step": 183993, "epoch": 1095} {"train_loss": -11.069768905639648, "global_step": 183994, "epoch": 1095} {"train_loss": -10.693563461303711, "global_step": 183995, "epoch": 1095} {"train_loss": -11.22588062286377, "global_step": 183996, "epoch": 1095} {"train_loss": -11.186710357666016, "global_step": 183997, "epoch": 1095} {"train_loss": -10.97354793548584, "global_step": 183998, "epoch": 1095} {"train_loss": -11.126561164855957, "global_step": 183999, "epoch": 1095} {"train_loss": -11.009689331054688, "global_step": 184000, "epoch": 1095} {"train_loss": -11.384248733520508, "global_step": 184001, "epoch": 1095} {"train_loss": -10.885326385498047, "global_step": 184002, "epoch": 1095} {"train_loss": -11.245899200439453, "global_step": 184003, "epoch": 1095} {"train_loss": -11.31786823272705, "global_step": 184004, "epoch": 1095} {"train_loss": -11.143571853637695, "global_step": 184005, "epoch": 1095} {"train_loss": -11.094059944152832, "global_step": 184006, "epoch": 1095} {"train_loss": -10.976264953613281, "global_step": 184007, "epoch": 1095} {"train_loss": -11.153165817260742, "global_step": 184008, "epoch": 1095} {"train_loss": -10.645450592041016, "global_step": 184009, "epoch": 1095} {"train_loss": -11.11836051940918, "global_step": 184010, "epoch": 1095} {"train_loss": -10.509124755859375, "global_step": 184011, "epoch": 1095} {"train_loss": -10.79808235168457, "global_step": 184012, "epoch": 1095} {"train_loss": -11.075687408447266, "global_step": 184013, "epoch": 1095} {"train_loss": -10.922323226928711, "global_step": 184014, "epoch": 1095} {"train_loss": -11.30760383605957, "global_step": 184015, "epoch": 1095} {"train_loss": -10.869718551635742, "global_step": 184016, "epoch": 1095} {"train_loss": -11.11032772064209, "global_step": 184017, "epoch": 1095} {"train_loss": -11.22852897644043, "global_step": 184018, "epoch": 1095} {"train_loss": -11.233311653137207, "global_step": 184019, "epoch": 1095} {"train_loss": -11.433095932006836, "global_step": 184020, "epoch": 1095} {"train_loss": -11.31505012512207, "global_step": 184021, "epoch": 1095} {"train_loss": -11.446977615356445, "global_step": 184022, "epoch": 1095} {"train_loss": -11.184368133544922, "global_step": 184023, "epoch": 1095} {"train_loss": -11.485677719116211, "global_step": 184024, "epoch": 1095} {"train_loss": -11.492776870727539, "global_step": 184025, "epoch": 1095} {"train_loss": -11.338825225830078, "global_step": 184026, "epoch": 1095} {"train_loss": -11.275899887084961, "global_step": 184027, "epoch": 1095} {"train_loss": -11.480031967163086, "global_step": 184028, "epoch": 1095} {"train_loss": -11.09246826171875, "global_step": 184029, "epoch": 1095} {"train_loss": -11.366244316101074, "global_step": 184030, "epoch": 1095} {"train_loss": -11.363191604614258, "global_step": 184031, "epoch": 1095} {"train_loss": -11.295252799987793, "global_step": 184032, "epoch": 1095} {"train_loss": -11.377147674560547, "global_step": 184033, "epoch": 1095} {"train_loss": -11.107937812805176, "global_step": 184034, "epoch": 1095} {"train_loss": -11.463884353637695, "global_step": 184035, "epoch": 1095} {"train_loss": -11.232734680175781, "global_step": 184036, "epoch": 1095} {"train_loss": -11.46804428100586, "global_step": 184037, "epoch": 1095} {"train_loss": -11.285810470581055, "global_step": 184038, "epoch": 1095} {"train_loss": -11.403739929199219, "global_step": 184039, "epoch": 1095} {"train_loss": -11.284971237182617, "global_step": 184040, "epoch": 1095} {"train_loss": -11.286971092224121, "global_step": 184041, "epoch": 1095} {"train_loss": -11.58979606628418, "global_step": 184042, "epoch": 1095} {"train_loss": -11.259520530700684, "global_step": 184043, "epoch": 1095} {"train_loss": -11.460355758666992, "global_step": 184044, "epoch": 1095} {"train_loss": -11.589863777160645, "global_step": 184045, "epoch": 1095} {"train_loss": -11.162739753723145, "global_step": 184046, "epoch": 1095} {"train_loss": -11.644536972045898, "global_step": 184047, "epoch": 1095} {"train_loss": -11.165407180786133, "global_step": 184048, "epoch": 1095} {"train_loss": -11.031274795532227, "global_step": 184049, "epoch": 1095} {"train_loss": -10.97633171081543, "global_step": 184050, "epoch": 1095} {"train_loss": -11.268733978271484, "global_step": 184051, "epoch": 1095} {"train_loss": -11.23641586303711, "global_step": 184052, "epoch": 1095} {"train_loss": -10.672303199768066, "global_step": 184053, "epoch": 1095} {"train_loss": -11.227987289428711, "global_step": 184054, "epoch": 1095} {"train_loss": -11.242708206176758, "global_step": 184055, "epoch": 1095} {"train_loss": -11.109861373901367, "global_step": 184056, "epoch": 1095} {"train_loss": -11.35366439819336, "global_step": 184057, "epoch": 1095} {"train_loss": -11.173866271972656, "global_step": 184058, "epoch": 1095} {"train_loss": -11.14112377166748, "global_step": 184059, "epoch": 1095} {"train_loss": -10.7830171585083, "global_step": 184060, "epoch": 1095} {"train_loss": -11.397027969360352, "global_step": 184061, "epoch": 1095} {"train_loss": -11.244245529174805, "global_step": 184062, "epoch": 1095} {"train_loss": -11.02031421661377, "global_step": 184063, "epoch": 1095} {"train_loss": -11.16572380065918, "global_step": 184064, "epoch": 1095} {"train_loss": -10.864090919494629, "global_step": 184065, "epoch": 1095} {"train_loss": -11.678570747375488, "global_step": 184066, "epoch": 1095} {"train_loss": -11.113792419433594, "global_step": 184067, "epoch": 1095} {"train_loss": -11.591604232788086, "global_step": 184068, "epoch": 1095} {"train_loss": -11.18563461303711, "global_step": 184069, "epoch": 1095} {"train_loss": -11.152612686157227, "global_step": 184070, "epoch": 1095} {"train_loss": -11.231538772583008, "global_step": 184071, "epoch": 1095} {"train_loss": -10.947257995605469, "global_step": 184072, "epoch": 1095} {"train_loss": -11.078468322753906, "global_step": 184073, "epoch": 1095} {"train_loss": -11.107351303100586, "global_step": 184074, "epoch": 1095} {"train_loss": -11.524450302124023, "global_step": 184075, "epoch": 1095} {"train_loss": -11.122137069702148, "global_step": 184076, "epoch": 1095} {"train_loss": -11.424646377563477, "global_step": 184077, "epoch": 1095} {"train_loss": -10.972805976867676, "global_step": 184078, "epoch": 1095} {"train_loss": -10.888992309570312, "global_step": 184079, "epoch": 1095} {"train_loss": -10.769576072692871, "global_step": 184080, "epoch": 1095} {"train_loss": -11.148249626159668, "global_step": 184081, "epoch": 1095} {"train_loss": -10.826851844787598, "global_step": 184082, "epoch": 1095} {"train_loss": -10.57481575012207, "global_step": 184083, "epoch": 1095} {"train_loss": -11.619446754455566, "global_step": 184084, "epoch": 1095} {"train_loss": -10.905014991760254, "global_step": 184085, "epoch": 1095} {"train_loss": -10.973699569702148, "global_step": 184086, "epoch": 1095} {"train_loss": -11.506797790527344, "global_step": 184087, "epoch": 1095} {"train_loss": -10.923827171325684, "global_step": 184088, "epoch": 1095} {"train_loss": -11.106502532958984, "global_step": 184089, "epoch": 1095} {"train_loss": -10.926319122314453, "global_step": 184090, "epoch": 1095} {"train_loss": -10.949209213256836, "global_step": 184091, "epoch": 1095} {"train_loss": -11.146627426147461, "global_step": 184092, "epoch": 1095} {"train_loss": -10.363508224487305, "global_step": 184093, "epoch": 1095} {"train_loss": -10.995603561401367, "global_step": 184094, "epoch": 1095} {"train_loss": -10.851447105407715, "global_step": 184095, "epoch": 1095} {"train_loss": -10.6080904006958, "global_step": 184096, "epoch": 1095} {"train_loss": -10.878990173339844, "global_step": 184097, "epoch": 1095} {"train_loss": -9.619585037231445, "global_step": 184098, "epoch": 1095} {"train_loss": -10.760696411132812, "global_step": 184099, "epoch": 1095} {"train_loss": -10.523092269897461, "global_step": 184100, "epoch": 1095} {"train_loss": -10.758066177368164, "global_step": 184101, "epoch": 1095} {"train_loss": -9.89091968536377, "global_step": 184102, "epoch": 1095} {"train_loss": -10.848956108093262, "global_step": 184103, "epoch": 1095} {"train_loss": -9.561084747314453, "global_step": 184104, "epoch": 1095} {"train_loss": -11.146817207336426, "global_step": 184105, "epoch": 1095} {"train_loss": -10.04631519317627, "global_step": 184106, "epoch": 1095} {"train_loss": -10.443355560302734, "global_step": 184107, "epoch": 1095} {"train_loss": -10.419763565063477, "global_step": 184108, "epoch": 1095} {"train_loss": -10.059722900390625, "global_step": 184109, "epoch": 1095} {"train_loss": -11.121790885925293, "global_step": 184110, "epoch": 1095} {"train_loss": -10.078729629516602, "global_step": 184111, "epoch": 1095} {"train_loss": -10.874776840209961, "global_step": 184112, "epoch": 1095} {"train_loss": -10.596050262451172, "global_step": 184113, "epoch": 1095} {"train_loss": -10.224407196044922, "global_step": 184114, "epoch": 1095} {"train_loss": -11.069511413574219, "global_step": 184115, "epoch": 1095} {"train_loss": -10.476216316223145, "global_step": 184116, "epoch": 1095} {"train_loss": -10.87678337097168, "global_step": 184117, "epoch": 1095} {"train_loss": -11.058854103088379, "global_step": 184118, "epoch": 1095} {"train_loss": -10.797447204589844, "global_step": 184119, "epoch": 1095} {"train_loss": -10.794171333312988, "global_step": 184120, "epoch": 1095} {"train_loss": -11.21221923828125, "global_step": 184121, "epoch": 1095} {"train_loss": -10.575300216674805, "global_step": 184122, "epoch": 1095} {"train_loss": -10.924118995666504, "global_step": 184123, "epoch": 1095} {"train_loss": -11.072866439819336, "global_step": 184124, "epoch": 1095} {"train_loss": -11.095651626586914, "global_step": 184125, "epoch": 1095} {"train_loss": -10.85881233215332, "global_step": 184126, "epoch": 1095} {"train_loss": -11.064883805456615, "global_step": 184127, "epoch": 1095, "val_loss": 245211.625, "train_action_mse_error": 0.368347704410553} {"train_loss": -10.975963592529297, "global_step": 184128, "epoch": 1096} {"train_loss": -10.913692474365234, "global_step": 184129, "epoch": 1096} {"train_loss": -11.16357135772705, "global_step": 184130, "epoch": 1096} {"train_loss": -10.83674144744873, "global_step": 184131, "epoch": 1096} {"train_loss": -11.130636215209961, "global_step": 184132, "epoch": 1096} {"train_loss": -10.694868087768555, "global_step": 184133, "epoch": 1096} {"train_loss": -10.98682689666748, "global_step": 184134, "epoch": 1096} {"train_loss": -11.187474250793457, "global_step": 184135, "epoch": 1096} {"train_loss": -11.155277252197266, "global_step": 184136, "epoch": 1096} {"train_loss": -10.971776962280273, "global_step": 184137, "epoch": 1096} {"train_loss": -11.147586822509766, "global_step": 184138, "epoch": 1096} {"train_loss": -11.118900299072266, "global_step": 184139, "epoch": 1096} {"train_loss": -10.965993881225586, "global_step": 184140, "epoch": 1096} {"train_loss": -11.305024147033691, "global_step": 184141, "epoch": 1096} {"train_loss": -10.680545806884766, "global_step": 184142, "epoch": 1096} {"train_loss": -11.084085464477539, "global_step": 184143, "epoch": 1096} {"train_loss": -10.985429763793945, "global_step": 184144, "epoch": 1096} {"train_loss": -10.808761596679688, "global_step": 184145, "epoch": 1096} {"train_loss": -11.306900978088379, "global_step": 184146, "epoch": 1096} {"train_loss": -11.011199951171875, "global_step": 184147, "epoch": 1096} {"train_loss": -11.166339874267578, "global_step": 184148, "epoch": 1096} {"train_loss": -11.259201049804688, "global_step": 184149, "epoch": 1096} {"train_loss": -11.259895324707031, "global_step": 184150, "epoch": 1096} {"train_loss": -11.172521591186523, "global_step": 184151, "epoch": 1096} {"train_loss": -11.26616382598877, "global_step": 184152, "epoch": 1096} {"train_loss": -11.373310089111328, "global_step": 184153, "epoch": 1096} {"train_loss": -11.401883125305176, "global_step": 184154, "epoch": 1096} {"train_loss": -11.488353729248047, "global_step": 184155, "epoch": 1096} {"train_loss": -11.588872909545898, "global_step": 184156, "epoch": 1096} {"train_loss": -11.407722473144531, "global_step": 184157, "epoch": 1096} {"train_loss": -11.553579330444336, "global_step": 184158, "epoch": 1096} {"train_loss": -11.58604621887207, "global_step": 184159, "epoch": 1096} {"train_loss": -11.37925910949707, "global_step": 184160, "epoch": 1096} {"train_loss": -11.579593658447266, "global_step": 184161, "epoch": 1096} {"train_loss": -11.499342918395996, "global_step": 184162, "epoch": 1096} {"train_loss": -11.552505493164062, "global_step": 184163, "epoch": 1096} {"train_loss": -11.5133056640625, "global_step": 184164, "epoch": 1096} {"train_loss": -11.37221908569336, "global_step": 184165, "epoch": 1096} {"train_loss": -11.476666450500488, "global_step": 184166, "epoch": 1096} {"train_loss": -11.469551086425781, "global_step": 184167, "epoch": 1096} {"train_loss": -11.44631576538086, "global_step": 184168, "epoch": 1096} {"train_loss": -11.43029499053955, "global_step": 184169, "epoch": 1096} {"train_loss": -11.648111343383789, "global_step": 184170, "epoch": 1096} {"train_loss": -11.369495391845703, "global_step": 184171, "epoch": 1096} {"train_loss": -11.432936668395996, "global_step": 184172, "epoch": 1096} {"train_loss": -11.517894744873047, "global_step": 184173, "epoch": 1096} {"train_loss": -11.608869552612305, "global_step": 184174, "epoch": 1096} {"train_loss": -11.542908668518066, "global_step": 184175, "epoch": 1096} {"train_loss": -11.347723007202148, "global_step": 184176, "epoch": 1096} {"train_loss": -11.644660949707031, "global_step": 184177, "epoch": 1096} {"train_loss": -11.619625091552734, "global_step": 184178, "epoch": 1096} {"train_loss": -11.580060005187988, "global_step": 184179, "epoch": 1096} {"train_loss": -11.57696533203125, "global_step": 184180, "epoch": 1096} {"train_loss": -11.593263626098633, "global_step": 184181, "epoch": 1096} {"train_loss": -11.627544403076172, "global_step": 184182, "epoch": 1096} {"train_loss": -11.361225128173828, "global_step": 184183, "epoch": 1096} {"train_loss": -11.418844223022461, "global_step": 184184, "epoch": 1096} {"train_loss": -11.040327072143555, "global_step": 184185, "epoch": 1096} {"train_loss": -11.054277420043945, "global_step": 184186, "epoch": 1096} {"train_loss": -11.21886920928955, "global_step": 184187, "epoch": 1096} {"train_loss": -9.800436019897461, "global_step": 184188, "epoch": 1096} {"train_loss": -10.19032096862793, "global_step": 184189, "epoch": 1096} {"train_loss": -10.050090789794922, "global_step": 184190, "epoch": 1096} {"train_loss": -10.681872367858887, "global_step": 184191, "epoch": 1096} {"train_loss": -10.748320579528809, "global_step": 184192, "epoch": 1096} {"train_loss": -10.489607810974121, "global_step": 184193, "epoch": 1096} {"train_loss": -10.489200592041016, "global_step": 184194, "epoch": 1096} {"train_loss": -9.730100631713867, "global_step": 184195, "epoch": 1096} {"train_loss": -10.093301773071289, "global_step": 184196, "epoch": 1096} {"train_loss": -10.129768371582031, "global_step": 184197, "epoch": 1096} {"train_loss": -10.025628089904785, "global_step": 184198, "epoch": 1096} {"train_loss": -10.289900779724121, "global_step": 184199, "epoch": 1096} {"train_loss": -10.046916961669922, "global_step": 184200, "epoch": 1096} {"train_loss": -9.748557090759277, "global_step": 184201, "epoch": 1096} {"train_loss": -9.846683502197266, "global_step": 184202, "epoch": 1096} {"train_loss": -10.658185958862305, "global_step": 184203, "epoch": 1096} {"train_loss": -10.551528930664062, "global_step": 184204, "epoch": 1096} {"train_loss": -10.83917236328125, "global_step": 184205, "epoch": 1096} {"train_loss": -10.771844863891602, "global_step": 184206, "epoch": 1096} {"train_loss": -10.52578353881836, "global_step": 184207, "epoch": 1096} {"train_loss": -10.908074378967285, "global_step": 184208, "epoch": 1096} {"train_loss": -10.467155456542969, "global_step": 184209, "epoch": 1096} {"train_loss": -10.681821823120117, "global_step": 184210, "epoch": 1096} {"train_loss": -10.786272048950195, "global_step": 184211, "epoch": 1096} {"train_loss": -10.374691009521484, "global_step": 184212, "epoch": 1096} {"train_loss": -10.950876235961914, "global_step": 184213, "epoch": 1096} {"train_loss": -10.62263298034668, "global_step": 184214, "epoch": 1096} {"train_loss": -10.79304313659668, "global_step": 184215, "epoch": 1096} {"train_loss": -10.781105041503906, "global_step": 184216, "epoch": 1096} {"train_loss": -10.685480117797852, "global_step": 184217, "epoch": 1096} {"train_loss": -10.711877822875977, "global_step": 184218, "epoch": 1096} {"train_loss": -10.99699592590332, "global_step": 184219, "epoch": 1096} {"train_loss": -10.959187507629395, "global_step": 184220, "epoch": 1096} {"train_loss": -10.748714447021484, "global_step": 184221, "epoch": 1096} {"train_loss": -10.926304817199707, "global_step": 184222, "epoch": 1096} {"train_loss": -11.082220077514648, "global_step": 184223, "epoch": 1096} {"train_loss": -10.954022407531738, "global_step": 184224, "epoch": 1096} {"train_loss": -11.103264808654785, "global_step": 184225, "epoch": 1096} {"train_loss": -10.949396133422852, "global_step": 184226, "epoch": 1096} {"train_loss": -11.17045783996582, "global_step": 184227, "epoch": 1096} {"train_loss": -10.964437484741211, "global_step": 184228, "epoch": 1096} {"train_loss": -11.034429550170898, "global_step": 184229, "epoch": 1096} {"train_loss": -11.271677017211914, "global_step": 184230, "epoch": 1096} {"train_loss": -10.777599334716797, "global_step": 184231, "epoch": 1096} {"train_loss": -11.184260368347168, "global_step": 184232, "epoch": 1096} {"train_loss": -11.110133171081543, "global_step": 184233, "epoch": 1096} {"train_loss": -11.126856803894043, "global_step": 184234, "epoch": 1096} {"train_loss": -10.813422203063965, "global_step": 184235, "epoch": 1096} {"train_loss": -11.0370454788208, "global_step": 184236, "epoch": 1096} {"train_loss": -10.839845657348633, "global_step": 184237, "epoch": 1096} {"train_loss": -10.743521690368652, "global_step": 184238, "epoch": 1096} {"train_loss": -10.85930061340332, "global_step": 184239, "epoch": 1096} {"train_loss": -10.637374877929688, "global_step": 184240, "epoch": 1096} {"train_loss": -11.338645935058594, "global_step": 184241, "epoch": 1096} {"train_loss": -10.79166030883789, "global_step": 184242, "epoch": 1096} {"train_loss": -11.109086990356445, "global_step": 184243, "epoch": 1096} {"train_loss": -10.908149719238281, "global_step": 184244, "epoch": 1096} {"train_loss": -11.117324829101562, "global_step": 184245, "epoch": 1096} {"train_loss": -11.210495948791504, "global_step": 184246, "epoch": 1096} {"train_loss": -11.123108863830566, "global_step": 184247, "epoch": 1096} {"train_loss": -11.046110153198242, "global_step": 184248, "epoch": 1096} {"train_loss": -11.193532943725586, "global_step": 184249, "epoch": 1096} {"train_loss": -11.273338317871094, "global_step": 184250, "epoch": 1096} {"train_loss": -11.366900444030762, "global_step": 184251, "epoch": 1096} {"train_loss": -11.010921478271484, "global_step": 184252, "epoch": 1096} {"train_loss": -11.120015144348145, "global_step": 184253, "epoch": 1096} {"train_loss": -11.108691215515137, "global_step": 184254, "epoch": 1096} {"train_loss": -11.046602249145508, "global_step": 184255, "epoch": 1096} {"train_loss": -11.133115768432617, "global_step": 184256, "epoch": 1096} {"train_loss": -11.244876861572266, "global_step": 184257, "epoch": 1096} {"train_loss": -11.271129608154297, "global_step": 184258, "epoch": 1096} {"train_loss": -11.251669883728027, "global_step": 184259, "epoch": 1096} {"train_loss": -11.225136756896973, "global_step": 184260, "epoch": 1096} {"train_loss": -11.378244400024414, "global_step": 184261, "epoch": 1096} {"train_loss": -11.162396430969238, "global_step": 184262, "epoch": 1096} {"train_loss": -11.214615821838379, "global_step": 184263, "epoch": 1096} {"train_loss": -10.701141357421875, "global_step": 184264, "epoch": 1096} {"train_loss": -11.40261459350586, "global_step": 184265, "epoch": 1096} {"train_loss": -10.977849960327148, "global_step": 184266, "epoch": 1096} {"train_loss": -11.41553020477295, "global_step": 184267, "epoch": 1096} {"train_loss": -11.412630081176758, "global_step": 184268, "epoch": 1096} {"train_loss": -11.43741226196289, "global_step": 184269, "epoch": 1096} {"train_loss": -11.443647384643555, "global_step": 184270, "epoch": 1096} {"train_loss": -11.295055389404297, "global_step": 184271, "epoch": 1096} {"train_loss": -11.108511924743652, "global_step": 184272, "epoch": 1096} {"train_loss": -11.373889923095703, "global_step": 184273, "epoch": 1096} {"train_loss": -11.521784782409668, "global_step": 184274, "epoch": 1096} {"train_loss": -11.458610534667969, "global_step": 184275, "epoch": 1096} {"train_loss": -11.361200332641602, "global_step": 184276, "epoch": 1096} {"train_loss": -11.336468696594238, "global_step": 184277, "epoch": 1096} {"train_loss": -11.369604110717773, "global_step": 184278, "epoch": 1096} {"train_loss": -11.495689392089844, "global_step": 184279, "epoch": 1096} {"train_loss": -11.523847579956055, "global_step": 184280, "epoch": 1096} {"train_loss": -11.46384048461914, "global_step": 184281, "epoch": 1096} {"train_loss": -11.559843063354492, "global_step": 184282, "epoch": 1096} {"train_loss": -11.637598037719727, "global_step": 184283, "epoch": 1096} {"train_loss": -11.593053817749023, "global_step": 184284, "epoch": 1096} {"train_loss": -11.517437934875488, "global_step": 184285, "epoch": 1096} {"train_loss": -11.559919357299805, "global_step": 184286, "epoch": 1096} {"train_loss": -11.656455993652344, "global_step": 184287, "epoch": 1096} {"train_loss": -11.70379638671875, "global_step": 184288, "epoch": 1096} {"train_loss": -11.519837379455566, "global_step": 184289, "epoch": 1096} {"train_loss": -11.609748840332031, "global_step": 184290, "epoch": 1096} {"train_loss": -11.304788589477539, "global_step": 184291, "epoch": 1096} {"train_loss": -10.512073516845703, "global_step": 184292, "epoch": 1096} {"train_loss": -10.58719253540039, "global_step": 184293, "epoch": 1096} {"train_loss": -11.53173828125, "global_step": 184294, "epoch": 1096} {"train_loss": -11.088448620977855, "global_step": 184295, "epoch": 1096, "val_loss": 245570.140625} {"train_loss": -10.154373168945312, "global_step": 184296, "epoch": 1097} {"train_loss": -10.538065910339355, "global_step": 184297, "epoch": 1097} {"train_loss": -10.670774459838867, "global_step": 184298, "epoch": 1097} {"train_loss": -11.381413459777832, "global_step": 184299, "epoch": 1097} {"train_loss": -11.271864891052246, "global_step": 184300, "epoch": 1097} {"train_loss": -11.193219184875488, "global_step": 184301, "epoch": 1097} {"train_loss": -11.462141990661621, "global_step": 184302, "epoch": 1097} {"train_loss": -11.156333923339844, "global_step": 184303, "epoch": 1097} {"train_loss": -11.137937545776367, "global_step": 184304, "epoch": 1097} {"train_loss": -10.860300064086914, "global_step": 184305, "epoch": 1097} {"train_loss": -11.107503890991211, "global_step": 184306, "epoch": 1097} {"train_loss": -11.256572723388672, "global_step": 184307, "epoch": 1097} {"train_loss": -11.120807647705078, "global_step": 184308, "epoch": 1097} {"train_loss": -11.379023551940918, "global_step": 184309, "epoch": 1097} {"train_loss": -11.126633644104004, "global_step": 184310, "epoch": 1097} {"train_loss": -11.233757019042969, "global_step": 184311, "epoch": 1097} {"train_loss": -11.118715286254883, "global_step": 184312, "epoch": 1097} {"train_loss": -11.453667640686035, "global_step": 184313, "epoch": 1097} {"train_loss": -11.109245300292969, "global_step": 184314, "epoch": 1097} {"train_loss": -11.077392578125, "global_step": 184315, "epoch": 1097} {"train_loss": -11.081823348999023, "global_step": 184316, "epoch": 1097} {"train_loss": -11.370040893554688, "global_step": 184317, "epoch": 1097} {"train_loss": -11.124736785888672, "global_step": 184318, "epoch": 1097} {"train_loss": -11.614508628845215, "global_step": 184319, "epoch": 1097} {"train_loss": -11.139636039733887, "global_step": 184320, "epoch": 1097} {"train_loss": -11.484800338745117, "global_step": 184321, "epoch": 1097} {"train_loss": -11.201545715332031, "global_step": 184322, "epoch": 1097} {"train_loss": -11.244708061218262, "global_step": 184323, "epoch": 1097} {"train_loss": -11.433691024780273, "global_step": 184324, "epoch": 1097} {"train_loss": -11.266274452209473, "global_step": 184325, "epoch": 1097} {"train_loss": -11.48263168334961, "global_step": 184326, "epoch": 1097} {"train_loss": -11.403251647949219, "global_step": 184327, "epoch": 1097} {"train_loss": -11.235918045043945, "global_step": 184328, "epoch": 1097} {"train_loss": -11.391218185424805, "global_step": 184329, "epoch": 1097} {"train_loss": -11.141935348510742, "global_step": 184330, "epoch": 1097} {"train_loss": -11.001069068908691, "global_step": 184331, "epoch": 1097} {"train_loss": -11.362615585327148, "global_step": 184332, "epoch": 1097} {"train_loss": -11.114435195922852, "global_step": 184333, "epoch": 1097} {"train_loss": -11.375972747802734, "global_step": 184334, "epoch": 1097} {"train_loss": -11.393539428710938, "global_step": 184335, "epoch": 1097} {"train_loss": -11.27885627746582, "global_step": 184336, "epoch": 1097} {"train_loss": -11.725109100341797, "global_step": 184337, "epoch": 1097} {"train_loss": -11.27121353149414, "global_step": 184338, "epoch": 1097} {"train_loss": -11.438127517700195, "global_step": 184339, "epoch": 1097} {"train_loss": -11.26386833190918, "global_step": 184340, "epoch": 1097} {"train_loss": -11.077646255493164, "global_step": 184341, "epoch": 1097} {"train_loss": -11.36036491394043, "global_step": 184342, "epoch": 1097} {"train_loss": -11.228848457336426, "global_step": 184343, "epoch": 1097} {"train_loss": -10.848994255065918, "global_step": 184344, "epoch": 1097} {"train_loss": -11.413765907287598, "global_step": 184345, "epoch": 1097} {"train_loss": -11.440391540527344, "global_step": 184346, "epoch": 1097} {"train_loss": -10.865793228149414, "global_step": 184347, "epoch": 1097} {"train_loss": -11.358147621154785, "global_step": 184348, "epoch": 1097} {"train_loss": -11.058910369873047, "global_step": 184349, "epoch": 1097} {"train_loss": -11.004840850830078, "global_step": 184350, "epoch": 1097} {"train_loss": -11.186464309692383, "global_step": 184351, "epoch": 1097} {"train_loss": -11.168859481811523, "global_step": 184352, "epoch": 1097} {"train_loss": -11.207060813903809, "global_step": 184353, "epoch": 1097} {"train_loss": -11.04816722869873, "global_step": 184354, "epoch": 1097} {"train_loss": -10.848217964172363, "global_step": 184355, "epoch": 1097} {"train_loss": -10.992860794067383, "global_step": 184356, "epoch": 1097} {"train_loss": -11.340864181518555, "global_step": 184357, "epoch": 1097} {"train_loss": -11.160903930664062, "global_step": 184358, "epoch": 1097} {"train_loss": -11.34392261505127, "global_step": 184359, "epoch": 1097} {"train_loss": -10.859254837036133, "global_step": 184360, "epoch": 1097} {"train_loss": -11.015081405639648, "global_step": 184361, "epoch": 1097} {"train_loss": -11.338813781738281, "global_step": 184362, "epoch": 1097} {"train_loss": -10.897940635681152, "global_step": 184363, "epoch": 1097} {"train_loss": -10.913159370422363, "global_step": 184364, "epoch": 1097} {"train_loss": -11.11845588684082, "global_step": 184365, "epoch": 1097} {"train_loss": -11.327862739562988, "global_step": 184366, "epoch": 1097} {"train_loss": -10.906423568725586, "global_step": 184367, "epoch": 1097} {"train_loss": -10.939619064331055, "global_step": 184368, "epoch": 1097} {"train_loss": -10.517072677612305, "global_step": 184369, "epoch": 1097} {"train_loss": -10.85834789276123, "global_step": 184370, "epoch": 1097} {"train_loss": -10.75987434387207, "global_step": 184371, "epoch": 1097} {"train_loss": -11.549261093139648, "global_step": 184372, "epoch": 1097} {"train_loss": -10.884004592895508, "global_step": 184373, "epoch": 1097} {"train_loss": -11.13393783569336, "global_step": 184374, "epoch": 1097} {"train_loss": -10.976638793945312, "global_step": 184375, "epoch": 1097} {"train_loss": -11.273356437683105, "global_step": 184376, "epoch": 1097} {"train_loss": -11.253376007080078, "global_step": 184377, "epoch": 1097} {"train_loss": -11.349770545959473, "global_step": 184378, "epoch": 1097} {"train_loss": -11.504034996032715, "global_step": 184379, "epoch": 1097} {"train_loss": -11.524211883544922, "global_step": 184380, "epoch": 1097} {"train_loss": -11.23194694519043, "global_step": 184381, "epoch": 1097} {"train_loss": -11.318033218383789, "global_step": 184382, "epoch": 1097} {"train_loss": -11.390336036682129, "global_step": 184383, "epoch": 1097} {"train_loss": -11.577407836914062, "global_step": 184384, "epoch": 1097} {"train_loss": -11.554640769958496, "global_step": 184385, "epoch": 1097} {"train_loss": -11.499551773071289, "global_step": 184386, "epoch": 1097} {"train_loss": -11.572921752929688, "global_step": 184387, "epoch": 1097} {"train_loss": -11.333133697509766, "global_step": 184388, "epoch": 1097} {"train_loss": -11.488375663757324, "global_step": 184389, "epoch": 1097} {"train_loss": -11.547591209411621, "global_step": 184390, "epoch": 1097} {"train_loss": -11.35853099822998, "global_step": 184391, "epoch": 1097} {"train_loss": -11.230535507202148, "global_step": 184392, "epoch": 1097} {"train_loss": -11.430073738098145, "global_step": 184393, "epoch": 1097} {"train_loss": -11.482558250427246, "global_step": 184394, "epoch": 1097} {"train_loss": -11.493370056152344, "global_step": 184395, "epoch": 1097} {"train_loss": -11.318039894104004, "global_step": 184396, "epoch": 1097} {"train_loss": -11.324146270751953, "global_step": 184397, "epoch": 1097} {"train_loss": -11.158578872680664, "global_step": 184398, "epoch": 1097} {"train_loss": -11.329505920410156, "global_step": 184399, "epoch": 1097} {"train_loss": -11.318967819213867, "global_step": 184400, "epoch": 1097} {"train_loss": -10.885893821716309, "global_step": 184401, "epoch": 1097} {"train_loss": -11.55763053894043, "global_step": 184402, "epoch": 1097} {"train_loss": -11.37350082397461, "global_step": 184403, "epoch": 1097} {"train_loss": -11.448841094970703, "global_step": 184404, "epoch": 1097} {"train_loss": -11.428757667541504, "global_step": 184405, "epoch": 1097} {"train_loss": -11.090291023254395, "global_step": 184406, "epoch": 1097} {"train_loss": -11.213829040527344, "global_step": 184407, "epoch": 1097} {"train_loss": -10.858506202697754, "global_step": 184408, "epoch": 1097} {"train_loss": -10.718668937683105, "global_step": 184409, "epoch": 1097} {"train_loss": -11.537055015563965, "global_step": 184410, "epoch": 1097} {"train_loss": -11.139055252075195, "global_step": 184411, "epoch": 1097} {"train_loss": -10.489157676696777, "global_step": 184412, "epoch": 1097} {"train_loss": -11.413429260253906, "global_step": 184413, "epoch": 1097} {"train_loss": -10.63071060180664, "global_step": 184414, "epoch": 1097} {"train_loss": -10.768220901489258, "global_step": 184415, "epoch": 1097} {"train_loss": -11.298413276672363, "global_step": 184416, "epoch": 1097} {"train_loss": -9.941045761108398, "global_step": 184417, "epoch": 1097} {"train_loss": -9.976682662963867, "global_step": 184418, "epoch": 1097} {"train_loss": -9.966278076171875, "global_step": 184419, "epoch": 1097} {"train_loss": -8.837940216064453, "global_step": 184420, "epoch": 1097} {"train_loss": -9.227802276611328, "global_step": 184421, "epoch": 1097} {"train_loss": -11.039548873901367, "global_step": 184422, "epoch": 1097} {"train_loss": -8.215499877929688, "global_step": 184423, "epoch": 1097} {"train_loss": -10.448968887329102, "global_step": 184424, "epoch": 1097} {"train_loss": -9.350090980529785, "global_step": 184425, "epoch": 1097} {"train_loss": -8.449548721313477, "global_step": 184426, "epoch": 1097} {"train_loss": -9.325538635253906, "global_step": 184427, "epoch": 1097} {"train_loss": -9.11228084564209, "global_step": 184428, "epoch": 1097} {"train_loss": -9.092109680175781, "global_step": 184429, "epoch": 1097} {"train_loss": -10.071310997009277, "global_step": 184430, "epoch": 1097} {"train_loss": -9.25089168548584, "global_step": 184431, "epoch": 1097} {"train_loss": -9.730956077575684, "global_step": 184432, "epoch": 1097} {"train_loss": -10.554107666015625, "global_step": 184433, "epoch": 1097} {"train_loss": -9.398676872253418, "global_step": 184434, "epoch": 1097} {"train_loss": -10.672769546508789, "global_step": 184435, "epoch": 1097} {"train_loss": -10.126514434814453, "global_step": 184436, "epoch": 1097} {"train_loss": -9.8014554977417, "global_step": 184437, "epoch": 1097} {"train_loss": -10.362574577331543, "global_step": 184438, "epoch": 1097} {"train_loss": -10.314799308776855, "global_step": 184439, "epoch": 1097} {"train_loss": -10.140103340148926, "global_step": 184440, "epoch": 1097} {"train_loss": -10.366661071777344, "global_step": 184441, "epoch": 1097} {"train_loss": -10.70893669128418, "global_step": 184442, "epoch": 1097} {"train_loss": -9.792566299438477, "global_step": 184443, "epoch": 1097} {"train_loss": -10.455623626708984, "global_step": 184444, "epoch": 1097} {"train_loss": -10.399152755737305, "global_step": 184445, "epoch": 1097} {"train_loss": -10.163579940795898, "global_step": 184446, "epoch": 1097} {"train_loss": -10.462738037109375, "global_step": 184447, "epoch": 1097} {"train_loss": -10.142156600952148, "global_step": 184448, "epoch": 1097} {"train_loss": -10.309551239013672, "global_step": 184449, "epoch": 1097} {"train_loss": -10.510128021240234, "global_step": 184450, "epoch": 1097} {"train_loss": -9.871187210083008, "global_step": 184451, "epoch": 1097} {"train_loss": -10.292457580566406, "global_step": 184452, "epoch": 1097} {"train_loss": -10.245950698852539, "global_step": 184453, "epoch": 1097} {"train_loss": -10.42802906036377, "global_step": 184454, "epoch": 1097} {"train_loss": -10.662216186523438, "global_step": 184455, "epoch": 1097} {"train_loss": -10.079811096191406, "global_step": 184456, "epoch": 1097} {"train_loss": -10.354333877563477, "global_step": 184457, "epoch": 1097} {"train_loss": -10.779067993164062, "global_step": 184458, "epoch": 1097} {"train_loss": -9.94856071472168, "global_step": 184459, "epoch": 1097} {"train_loss": -10.715221405029297, "global_step": 184460, "epoch": 1097} {"train_loss": -10.908133506774902, "global_step": 184461, "epoch": 1097} {"train_loss": -10.347869873046875, "global_step": 184462, "epoch": 1097} {"train_loss": -10.878087242444357, "global_step": 184463, "epoch": 1097, "val_loss": 241541.265625} {"train_loss": -10.658378601074219, "global_step": 184464, "epoch": 1098} {"train_loss": -10.732868194580078, "global_step": 184465, "epoch": 1098} {"train_loss": -10.761312484741211, "global_step": 184466, "epoch": 1098} {"train_loss": -10.43983268737793, "global_step": 184467, "epoch": 1098} {"train_loss": -10.937768936157227, "global_step": 184468, "epoch": 1098} {"train_loss": -10.79961109161377, "global_step": 184469, "epoch": 1098} {"train_loss": -10.819367408752441, "global_step": 184470, "epoch": 1098} {"train_loss": -10.89437198638916, "global_step": 184471, "epoch": 1098} {"train_loss": -10.723215103149414, "global_step": 184472, "epoch": 1098} {"train_loss": -10.894108772277832, "global_step": 184473, "epoch": 1098} {"train_loss": -10.687700271606445, "global_step": 184474, "epoch": 1098} {"train_loss": -10.84862995147705, "global_step": 184475, "epoch": 1098} {"train_loss": -10.955883026123047, "global_step": 184476, "epoch": 1098} {"train_loss": -10.914011001586914, "global_step": 184477, "epoch": 1098} {"train_loss": -11.077985763549805, "global_step": 184478, "epoch": 1098} {"train_loss": -10.80070972442627, "global_step": 184479, "epoch": 1098} {"train_loss": -11.163847923278809, "global_step": 184480, "epoch": 1098} {"train_loss": -11.057999610900879, "global_step": 184481, "epoch": 1098} {"train_loss": -11.00228214263916, "global_step": 184482, "epoch": 1098} {"train_loss": -11.061366081237793, "global_step": 184483, "epoch": 1098} {"train_loss": -11.18353271484375, "global_step": 184484, "epoch": 1098} {"train_loss": -11.26369571685791, "global_step": 184485, "epoch": 1098} {"train_loss": -11.098423957824707, "global_step": 184486, "epoch": 1098} {"train_loss": -11.233034133911133, "global_step": 184487, "epoch": 1098} {"train_loss": -11.159226417541504, "global_step": 184488, "epoch": 1098} {"train_loss": -11.352754592895508, "global_step": 184489, "epoch": 1098} {"train_loss": -11.246706008911133, "global_step": 184490, "epoch": 1098} {"train_loss": -11.279596328735352, "global_step": 184491, "epoch": 1098} {"train_loss": -11.399850845336914, "global_step": 184492, "epoch": 1098} {"train_loss": -11.281013488769531, "global_step": 184493, "epoch": 1098} {"train_loss": -11.354982376098633, "global_step": 184494, "epoch": 1098} {"train_loss": -11.238017082214355, "global_step": 184495, "epoch": 1098} {"train_loss": -11.444726943969727, "global_step": 184496, "epoch": 1098} {"train_loss": -11.33135986328125, "global_step": 184497, "epoch": 1098} {"train_loss": -11.40825080871582, "global_step": 184498, "epoch": 1098} {"train_loss": -11.500871658325195, "global_step": 184499, "epoch": 1098} {"train_loss": -11.531105995178223, "global_step": 184500, "epoch": 1098} {"train_loss": -11.324735641479492, "global_step": 184501, "epoch": 1098} {"train_loss": -11.444561004638672, "global_step": 184502, "epoch": 1098} {"train_loss": -11.532270431518555, "global_step": 184503, "epoch": 1098} {"train_loss": -11.588655471801758, "global_step": 184504, "epoch": 1098} {"train_loss": -11.290157318115234, "global_step": 184505, "epoch": 1098} {"train_loss": -11.321600914001465, "global_step": 184506, "epoch": 1098} {"train_loss": -11.507715225219727, "global_step": 184507, "epoch": 1098} {"train_loss": -11.478767395019531, "global_step": 184508, "epoch": 1098} {"train_loss": -11.488494873046875, "global_step": 184509, "epoch": 1098} {"train_loss": -11.463560104370117, "global_step": 184510, "epoch": 1098} {"train_loss": -11.586259841918945, "global_step": 184511, "epoch": 1098} {"train_loss": -11.401204109191895, "global_step": 184512, "epoch": 1098} {"train_loss": -11.636305809020996, "global_step": 184513, "epoch": 1098} {"train_loss": -11.646608352661133, "global_step": 184514, "epoch": 1098} {"train_loss": -11.720666885375977, "global_step": 184515, "epoch": 1098} {"train_loss": -11.702899932861328, "global_step": 184516, "epoch": 1098} {"train_loss": -11.745208740234375, "global_step": 184517, "epoch": 1098} {"train_loss": -11.706672668457031, "global_step": 184518, "epoch": 1098} {"train_loss": -11.77120304107666, "global_step": 184519, "epoch": 1098} {"train_loss": -11.789203643798828, "global_step": 184520, "epoch": 1098} {"train_loss": -11.48495864868164, "global_step": 184521, "epoch": 1098} {"train_loss": -11.477681159973145, "global_step": 184522, "epoch": 1098} {"train_loss": -11.401633262634277, "global_step": 184523, "epoch": 1098} {"train_loss": -11.622312545776367, "global_step": 184524, "epoch": 1098} {"train_loss": -11.594916343688965, "global_step": 184525, "epoch": 1098} {"train_loss": -11.46267318725586, "global_step": 184526, "epoch": 1098} {"train_loss": -11.339313507080078, "global_step": 184527, "epoch": 1098} {"train_loss": -11.707191467285156, "global_step": 184528, "epoch": 1098} {"train_loss": -11.347402572631836, "global_step": 184529, "epoch": 1098} {"train_loss": -11.448165893554688, "global_step": 184530, "epoch": 1098} {"train_loss": -11.514322280883789, "global_step": 184531, "epoch": 1098} {"train_loss": -11.02445125579834, "global_step": 184532, "epoch": 1098} {"train_loss": -9.929996490478516, "global_step": 184533, "epoch": 1098} {"train_loss": -11.397636413574219, "global_step": 184534, "epoch": 1098} {"train_loss": -10.425930976867676, "global_step": 184535, "epoch": 1098} {"train_loss": -10.563103675842285, "global_step": 184536, "epoch": 1098} {"train_loss": -10.814985275268555, "global_step": 184537, "epoch": 1098} {"train_loss": -8.623557090759277, "global_step": 184538, "epoch": 1098} {"train_loss": -10.749841690063477, "global_step": 184539, "epoch": 1098} {"train_loss": -8.752777099609375, "global_step": 184540, "epoch": 1098} {"train_loss": -9.558735847473145, "global_step": 184541, "epoch": 1098} {"train_loss": -9.896499633789062, "global_step": 184542, "epoch": 1098} {"train_loss": -9.686286926269531, "global_step": 184543, "epoch": 1098} {"train_loss": -10.154241561889648, "global_step": 184544, "epoch": 1098} {"train_loss": -8.760801315307617, "global_step": 184545, "epoch": 1098} {"train_loss": -10.539262771606445, "global_step": 184546, "epoch": 1098} {"train_loss": -9.413152694702148, "global_step": 184547, "epoch": 1098} {"train_loss": -9.190390586853027, "global_step": 184548, "epoch": 1098} {"train_loss": -10.331683158874512, "global_step": 184549, "epoch": 1098} {"train_loss": -9.4154691696167, "global_step": 184550, "epoch": 1098} {"train_loss": -9.900528907775879, "global_step": 184551, "epoch": 1098} {"train_loss": -10.26911735534668, "global_step": 184552, "epoch": 1098} {"train_loss": -10.111902236938477, "global_step": 184553, "epoch": 1098} {"train_loss": -9.832440376281738, "global_step": 184554, "epoch": 1098} {"train_loss": -10.555907249450684, "global_step": 184555, "epoch": 1098} {"train_loss": -10.25859260559082, "global_step": 184556, "epoch": 1098} {"train_loss": -10.328765869140625, "global_step": 184557, "epoch": 1098} {"train_loss": -10.54488754272461, "global_step": 184558, "epoch": 1098} {"train_loss": -10.366194725036621, "global_step": 184559, "epoch": 1098} {"train_loss": -10.253416061401367, "global_step": 184560, "epoch": 1098} {"train_loss": -10.736207008361816, "global_step": 184561, "epoch": 1098} {"train_loss": -10.619962692260742, "global_step": 184562, "epoch": 1098} {"train_loss": -10.651433944702148, "global_step": 184563, "epoch": 1098} {"train_loss": -10.544099807739258, "global_step": 184564, "epoch": 1098} {"train_loss": -10.456914901733398, "global_step": 184565, "epoch": 1098} {"train_loss": -10.768811225891113, "global_step": 184566, "epoch": 1098} {"train_loss": -10.441368103027344, "global_step": 184567, "epoch": 1098} {"train_loss": -10.553203582763672, "global_step": 184568, "epoch": 1098} {"train_loss": -10.856107711791992, "global_step": 184569, "epoch": 1098} {"train_loss": -10.74052906036377, "global_step": 184570, "epoch": 1098} {"train_loss": -10.497930526733398, "global_step": 184571, "epoch": 1098} {"train_loss": -11.110119819641113, "global_step": 184572, "epoch": 1098} {"train_loss": -10.789867401123047, "global_step": 184573, "epoch": 1098} {"train_loss": -10.791519165039062, "global_step": 184574, "epoch": 1098} {"train_loss": -10.765520095825195, "global_step": 184575, "epoch": 1098} {"train_loss": -11.016487121582031, "global_step": 184576, "epoch": 1098} {"train_loss": -10.792943000793457, "global_step": 184577, "epoch": 1098} {"train_loss": -10.751108169555664, "global_step": 184578, "epoch": 1098} {"train_loss": -11.031051635742188, "global_step": 184579, "epoch": 1098} {"train_loss": -11.005630493164062, "global_step": 184580, "epoch": 1098} {"train_loss": -10.875347137451172, "global_step": 184581, "epoch": 1098} {"train_loss": -11.119867324829102, "global_step": 184582, "epoch": 1098} {"train_loss": -11.21523666381836, "global_step": 184583, "epoch": 1098} {"train_loss": -10.920992851257324, "global_step": 184584, "epoch": 1098} {"train_loss": -11.234018325805664, "global_step": 184585, "epoch": 1098} {"train_loss": -11.136239051818848, "global_step": 184586, "epoch": 1098} {"train_loss": -11.055144309997559, "global_step": 184587, "epoch": 1098} {"train_loss": -11.033958435058594, "global_step": 184588, "epoch": 1098} {"train_loss": -11.100320816040039, "global_step": 184589, "epoch": 1098} {"train_loss": -11.228113174438477, "global_step": 184590, "epoch": 1098} {"train_loss": -11.022724151611328, "global_step": 184591, "epoch": 1098} {"train_loss": -11.14769172668457, "global_step": 184592, "epoch": 1098} {"train_loss": -11.279075622558594, "global_step": 184593, "epoch": 1098} {"train_loss": -11.298534393310547, "global_step": 184594, "epoch": 1098} {"train_loss": -11.23923110961914, "global_step": 184595, "epoch": 1098} {"train_loss": -11.41256332397461, "global_step": 184596, "epoch": 1098} {"train_loss": -11.346271514892578, "global_step": 184597, "epoch": 1098} {"train_loss": -11.342334747314453, "global_step": 184598, "epoch": 1098} {"train_loss": -11.426488876342773, "global_step": 184599, "epoch": 1098} {"train_loss": -11.352359771728516, "global_step": 184600, "epoch": 1098} {"train_loss": -11.418704986572266, "global_step": 184601, "epoch": 1098} {"train_loss": -11.164764404296875, "global_step": 184602, "epoch": 1098} {"train_loss": -11.217867851257324, "global_step": 184603, "epoch": 1098} {"train_loss": -11.54506778717041, "global_step": 184604, "epoch": 1098} {"train_loss": -11.480840682983398, "global_step": 184605, "epoch": 1098} {"train_loss": -11.387799263000488, "global_step": 184606, "epoch": 1098} {"train_loss": -11.633371353149414, "global_step": 184607, "epoch": 1098} {"train_loss": -11.414278030395508, "global_step": 184608, "epoch": 1098} {"train_loss": -11.602107048034668, "global_step": 184609, "epoch": 1098} {"train_loss": -11.426177024841309, "global_step": 184610, "epoch": 1098} {"train_loss": -11.322717666625977, "global_step": 184611, "epoch": 1098} {"train_loss": -11.422176361083984, "global_step": 184612, "epoch": 1098} {"train_loss": -11.43448257446289, "global_step": 184613, "epoch": 1098} {"train_loss": -11.096450805664062, "global_step": 184614, "epoch": 1098} {"train_loss": -11.392566680908203, "global_step": 184615, "epoch": 1098} {"train_loss": -11.417045593261719, "global_step": 184616, "epoch": 1098} {"train_loss": -11.643768310546875, "global_step": 184617, "epoch": 1098} {"train_loss": -11.352405548095703, "global_step": 184618, "epoch": 1098} {"train_loss": -11.151533126831055, "global_step": 184619, "epoch": 1098} {"train_loss": -11.144637107849121, "global_step": 184620, "epoch": 1098} {"train_loss": -11.592791557312012, "global_step": 184621, "epoch": 1098} {"train_loss": -11.526935577392578, "global_step": 184622, "epoch": 1098} {"train_loss": -11.181462287902832, "global_step": 184623, "epoch": 1098} {"train_loss": -11.274279594421387, "global_step": 184624, "epoch": 1098} {"train_loss": -11.48129653930664, "global_step": 184625, "epoch": 1098} {"train_loss": -11.35395622253418, "global_step": 184626, "epoch": 1098} {"train_loss": -11.47468376159668, "global_step": 184627, "epoch": 1098} {"train_loss": -10.567778587341309, "global_step": 184628, "epoch": 1098} {"train_loss": -10.779613494873047, "global_step": 184629, "epoch": 1098} {"train_loss": -10.711341857910156, "global_step": 184630, "epoch": 1098} {"train_loss": -10.999873740332466, "global_step": 184631, "epoch": 1098, "val_loss": 244932.890625} {"train_loss": -10.075895309448242, "global_step": 184632, "epoch": 1099} {"train_loss": -11.015954971313477, "global_step": 184633, "epoch": 1099} {"train_loss": -10.595708847045898, "global_step": 184634, "epoch": 1099} {"train_loss": -10.300003051757812, "global_step": 184635, "epoch": 1099} {"train_loss": -11.003196716308594, "global_step": 184636, "epoch": 1099} {"train_loss": -11.206193923950195, "global_step": 184637, "epoch": 1099} {"train_loss": -11.377537727355957, "global_step": 184638, "epoch": 1099} {"train_loss": -10.679636001586914, "global_step": 184639, "epoch": 1099} {"train_loss": -11.044822692871094, "global_step": 184640, "epoch": 1099} {"train_loss": -11.018655776977539, "global_step": 184641, "epoch": 1099} {"train_loss": -10.244314193725586, "global_step": 184642, "epoch": 1099} {"train_loss": -10.568574905395508, "global_step": 184643, "epoch": 1099} {"train_loss": -11.15489387512207, "global_step": 184644, "epoch": 1099} {"train_loss": -11.225505828857422, "global_step": 184645, "epoch": 1099} {"train_loss": -11.13255500793457, "global_step": 184646, "epoch": 1099} {"train_loss": -11.398112297058105, "global_step": 184647, "epoch": 1099} {"train_loss": -10.959895133972168, "global_step": 184648, "epoch": 1099} {"train_loss": -11.11701774597168, "global_step": 184649, "epoch": 1099} {"train_loss": -11.029330253601074, "global_step": 184650, "epoch": 1099} {"train_loss": -11.104068756103516, "global_step": 184651, "epoch": 1099} {"train_loss": -11.117805480957031, "global_step": 184652, "epoch": 1099} {"train_loss": -11.208578109741211, "global_step": 184653, "epoch": 1099} {"train_loss": -11.377701759338379, "global_step": 184654, "epoch": 1099} {"train_loss": -11.188867568969727, "global_step": 184655, "epoch": 1099} {"train_loss": -11.26926040649414, "global_step": 184656, "epoch": 1099} {"train_loss": -11.224802017211914, "global_step": 184657, "epoch": 1099} {"train_loss": -11.30595588684082, "global_step": 184658, "epoch": 1099} {"train_loss": -11.043864250183105, "global_step": 184659, "epoch": 1099} {"train_loss": -11.433284759521484, "global_step": 184660, "epoch": 1099} {"train_loss": -11.02380084991455, "global_step": 184661, "epoch": 1099} {"train_loss": -10.979391098022461, "global_step": 184662, "epoch": 1099} {"train_loss": -11.252681732177734, "global_step": 184663, "epoch": 1099} {"train_loss": -11.113929748535156, "global_step": 184664, "epoch": 1099} {"train_loss": -10.974100112915039, "global_step": 184665, "epoch": 1099} {"train_loss": -11.115510940551758, "global_step": 184666, "epoch": 1099} {"train_loss": -11.281354904174805, "global_step": 184667, "epoch": 1099} {"train_loss": -10.961682319641113, "global_step": 184668, "epoch": 1099} {"train_loss": -11.251191139221191, "global_step": 184669, "epoch": 1099} {"train_loss": -10.744229316711426, "global_step": 184670, "epoch": 1099} {"train_loss": -11.327085494995117, "global_step": 184671, "epoch": 1099} {"train_loss": -11.138179779052734, "global_step": 184672, "epoch": 1099} {"train_loss": -11.239853858947754, "global_step": 184673, "epoch": 1099} {"train_loss": -11.012421607971191, "global_step": 184674, "epoch": 1099} {"train_loss": -11.307453155517578, "global_step": 184675, "epoch": 1099} {"train_loss": -11.295287132263184, "global_step": 184676, "epoch": 1099} {"train_loss": -11.018749237060547, "global_step": 184677, "epoch": 1099} {"train_loss": -11.441609382629395, "global_step": 184678, "epoch": 1099} {"train_loss": -11.02354621887207, "global_step": 184679, "epoch": 1099} {"train_loss": -11.308815002441406, "global_step": 184680, "epoch": 1099} {"train_loss": -10.976099014282227, "global_step": 184681, "epoch": 1099} {"train_loss": -11.063258171081543, "global_step": 184682, "epoch": 1099} {"train_loss": -11.090925216674805, "global_step": 184683, "epoch": 1099} {"train_loss": -11.118988037109375, "global_step": 184684, "epoch": 1099} {"train_loss": -11.164299011230469, "global_step": 184685, "epoch": 1099} {"train_loss": -11.23676586151123, "global_step": 184686, "epoch": 1099} {"train_loss": -11.599786758422852, "global_step": 184687, "epoch": 1099} {"train_loss": -11.155525207519531, "global_step": 184688, "epoch": 1099} {"train_loss": -11.193315505981445, "global_step": 184689, "epoch": 1099} {"train_loss": -11.334131240844727, "global_step": 184690, "epoch": 1099} {"train_loss": -11.4424409866333, "global_step": 184691, "epoch": 1099} {"train_loss": -11.14546012878418, "global_step": 184692, "epoch": 1099} {"train_loss": -11.46445369720459, "global_step": 184693, "epoch": 1099} {"train_loss": -11.224044799804688, "global_step": 184694, "epoch": 1099} {"train_loss": -11.368175506591797, "global_step": 184695, "epoch": 1099} {"train_loss": -11.302602767944336, "global_step": 184696, "epoch": 1099} {"train_loss": -11.278054237365723, "global_step": 184697, "epoch": 1099} {"train_loss": -11.464268684387207, "global_step": 184698, "epoch": 1099} {"train_loss": -11.170492172241211, "global_step": 184699, "epoch": 1099} {"train_loss": -11.576969146728516, "global_step": 184700, "epoch": 1099} {"train_loss": -11.326652526855469, "global_step": 184701, "epoch": 1099} {"train_loss": -11.281070709228516, "global_step": 184702, "epoch": 1099} {"train_loss": -11.113239288330078, "global_step": 184703, "epoch": 1099} {"train_loss": -11.092432022094727, "global_step": 184704, "epoch": 1099} {"train_loss": -11.015109062194824, "global_step": 184705, "epoch": 1099} {"train_loss": -11.113826751708984, "global_step": 184706, "epoch": 1099} {"train_loss": -10.868852615356445, "global_step": 184707, "epoch": 1099} {"train_loss": -11.110563278198242, "global_step": 184708, "epoch": 1099} {"train_loss": -11.274344444274902, "global_step": 184709, "epoch": 1099} {"train_loss": -10.822528839111328, "global_step": 184710, "epoch": 1099} {"train_loss": -11.140213966369629, "global_step": 184711, "epoch": 1099} {"train_loss": -10.773573875427246, "global_step": 184712, "epoch": 1099} {"train_loss": -10.661784172058105, "global_step": 184713, "epoch": 1099} {"train_loss": -10.77863883972168, "global_step": 184714, "epoch": 1099} {"train_loss": -10.546372413635254, "global_step": 184715, "epoch": 1099} {"train_loss": -10.237337112426758, "global_step": 184716, "epoch": 1099} {"train_loss": -10.602670669555664, "global_step": 184717, "epoch": 1099} {"train_loss": -9.767507553100586, "global_step": 184718, "epoch": 1099} {"train_loss": -10.954459190368652, "global_step": 184719, "epoch": 1099} {"train_loss": -10.12675666809082, "global_step": 184720, "epoch": 1099} {"train_loss": -10.538232803344727, "global_step": 184721, "epoch": 1099} {"train_loss": -10.748613357543945, "global_step": 184722, "epoch": 1099} {"train_loss": -10.879638671875, "global_step": 184723, "epoch": 1099} {"train_loss": -10.494736671447754, "global_step": 184724, "epoch": 1099} {"train_loss": -11.06270980834961, "global_step": 184725, "epoch": 1099} {"train_loss": -10.88333797454834, "global_step": 184726, "epoch": 1099} {"train_loss": -11.016624450683594, "global_step": 184727, "epoch": 1099} {"train_loss": -11.029973030090332, "global_step": 184728, "epoch": 1099} {"train_loss": -11.120952606201172, "global_step": 184729, "epoch": 1099} {"train_loss": -11.093677520751953, "global_step": 184730, "epoch": 1099} {"train_loss": -11.002223014831543, "global_step": 184731, "epoch": 1099} {"train_loss": -11.333734512329102, "global_step": 184732, "epoch": 1099} {"train_loss": -11.076494216918945, "global_step": 184733, "epoch": 1099} {"train_loss": -11.267766952514648, "global_step": 184734, "epoch": 1099} {"train_loss": -11.304754257202148, "global_step": 184735, "epoch": 1099} {"train_loss": -11.05900764465332, "global_step": 184736, "epoch": 1099} {"train_loss": -11.081918716430664, "global_step": 184737, "epoch": 1099} {"train_loss": -11.08171272277832, "global_step": 184738, "epoch": 1099} {"train_loss": -11.186264991760254, "global_step": 184739, "epoch": 1099} {"train_loss": -11.334698677062988, "global_step": 184740, "epoch": 1099} {"train_loss": -11.191360473632812, "global_step": 184741, "epoch": 1099} {"train_loss": -11.156421661376953, "global_step": 184742, "epoch": 1099} {"train_loss": -10.82909870147705, "global_step": 184743, "epoch": 1099} {"train_loss": -11.590073585510254, "global_step": 184744, "epoch": 1099} {"train_loss": -10.571638107299805, "global_step": 184745, "epoch": 1099} {"train_loss": -11.163349151611328, "global_step": 184746, "epoch": 1099} {"train_loss": -10.695940017700195, "global_step": 184747, "epoch": 1099} {"train_loss": -11.3714017868042, "global_step": 184748, "epoch": 1099} {"train_loss": -11.107528686523438, "global_step": 184749, "epoch": 1099} {"train_loss": -11.141229629516602, "global_step": 184750, "epoch": 1099} {"train_loss": -10.805486679077148, "global_step": 184751, "epoch": 1099} {"train_loss": -11.145636558532715, "global_step": 184752, "epoch": 1099} {"train_loss": -10.949544906616211, "global_step": 184753, "epoch": 1099} {"train_loss": -11.22966480255127, "global_step": 184754, "epoch": 1099} {"train_loss": -11.100198745727539, "global_step": 184755, "epoch": 1099} {"train_loss": -11.094514846801758, "global_step": 184756, "epoch": 1099} {"train_loss": -11.378331184387207, "global_step": 184757, "epoch": 1099} {"train_loss": -11.403032302856445, "global_step": 184758, "epoch": 1099} {"train_loss": -11.169127464294434, "global_step": 184759, "epoch": 1099} {"train_loss": -11.306888580322266, "global_step": 184760, "epoch": 1099} {"train_loss": -11.166370391845703, "global_step": 184761, "epoch": 1099} {"train_loss": -11.02610969543457, "global_step": 184762, "epoch": 1099} {"train_loss": -11.131433486938477, "global_step": 184763, "epoch": 1099} {"train_loss": -11.318811416625977, "global_step": 184764, "epoch": 1099} {"train_loss": -11.42062759399414, "global_step": 184765, "epoch": 1099} {"train_loss": -11.516160011291504, "global_step": 184766, "epoch": 1099} {"train_loss": -11.32193374633789, "global_step": 184767, "epoch": 1099} {"train_loss": -11.494616508483887, "global_step": 184768, "epoch": 1099} {"train_loss": -11.241962432861328, "global_step": 184769, "epoch": 1099} {"train_loss": -10.985347747802734, "global_step": 184770, "epoch": 1099} {"train_loss": -11.405902862548828, "global_step": 184771, "epoch": 1099} {"train_loss": -11.58829116821289, "global_step": 184772, "epoch": 1099} {"train_loss": -11.032577514648438, "global_step": 184773, "epoch": 1099} {"train_loss": -11.520578384399414, "global_step": 184774, "epoch": 1099} {"train_loss": -11.217243194580078, "global_step": 184775, "epoch": 1099} {"train_loss": -11.254552841186523, "global_step": 184776, "epoch": 1099} {"train_loss": -11.564560890197754, "global_step": 184777, "epoch": 1099} {"train_loss": -11.564178466796875, "global_step": 184778, "epoch": 1099} {"train_loss": -11.185873985290527, "global_step": 184779, "epoch": 1099} {"train_loss": -11.270995140075684, "global_step": 184780, "epoch": 1099} {"train_loss": -11.430207252502441, "global_step": 184781, "epoch": 1099} {"train_loss": -11.207386016845703, "global_step": 184782, "epoch": 1099} {"train_loss": -11.386390686035156, "global_step": 184783, "epoch": 1099} {"train_loss": -10.985660552978516, "global_step": 184784, "epoch": 1099} {"train_loss": -11.508947372436523, "global_step": 184785, "epoch": 1099} {"train_loss": -11.405425071716309, "global_step": 184786, "epoch": 1099} {"train_loss": -11.584770202636719, "global_step": 184787, "epoch": 1099} {"train_loss": -11.260950088500977, "global_step": 184788, "epoch": 1099} {"train_loss": -11.710620880126953, "global_step": 184789, "epoch": 1099} {"train_loss": -11.316725730895996, "global_step": 184790, "epoch": 1099} {"train_loss": -11.713180541992188, "global_step": 184791, "epoch": 1099} {"train_loss": -11.38075065612793, "global_step": 184792, "epoch": 1099} {"train_loss": -11.444121360778809, "global_step": 184793, "epoch": 1099} {"train_loss": -11.562471389770508, "global_step": 184794, "epoch": 1099} {"train_loss": -11.49360466003418, "global_step": 184795, "epoch": 1099} {"train_loss": -11.51742172241211, "global_step": 184796, "epoch": 1099} {"train_loss": -11.314788818359375, "global_step": 184797, "epoch": 1099} {"train_loss": -11.287955284118652, "global_step": 184798, "epoch": 1099} {"train_loss": -11.134134758086432, "global_step": 184799, "epoch": 1099, "val_loss": 247301.96875} {"train_loss": -11.32553482055664, "global_step": 184800, "epoch": 1100} {"train_loss": -11.09479808807373, "global_step": 184801, "epoch": 1100} {"train_loss": -11.34305191040039, "global_step": 184802, "epoch": 1100} {"train_loss": -11.189454078674316, "global_step": 184803, "epoch": 1100} {"train_loss": -10.970772743225098, "global_step": 184804, "epoch": 1100} {"train_loss": -11.39080810546875, "global_step": 184805, "epoch": 1100} {"train_loss": -11.069183349609375, "global_step": 184806, "epoch": 1100} {"train_loss": -10.801139831542969, "global_step": 184807, "epoch": 1100} {"train_loss": -11.467207908630371, "global_step": 184808, "epoch": 1100} {"train_loss": -10.761323928833008, "global_step": 184809, "epoch": 1100} {"train_loss": -11.175227165222168, "global_step": 184810, "epoch": 1100} {"train_loss": -11.144100189208984, "global_step": 184811, "epoch": 1100} {"train_loss": -10.685253143310547, "global_step": 184812, "epoch": 1100} {"train_loss": -11.274280548095703, "global_step": 184813, "epoch": 1100} {"train_loss": -10.244553565979004, "global_step": 184814, "epoch": 1100} {"train_loss": -10.83596134185791, "global_step": 184815, "epoch": 1100} {"train_loss": -10.207941055297852, "global_step": 184816, "epoch": 1100} {"train_loss": -10.422013282775879, "global_step": 184817, "epoch": 1100} {"train_loss": -9.61097526550293, "global_step": 184818, "epoch": 1100} {"train_loss": -9.834335327148438, "global_step": 184819, "epoch": 1100} {"train_loss": -10.726787567138672, "global_step": 184820, "epoch": 1100} {"train_loss": -8.489163398742676, "global_step": 184821, "epoch": 1100} {"train_loss": -10.168241500854492, "global_step": 184822, "epoch": 1100} {"train_loss": -8.710519790649414, "global_step": 184823, "epoch": 1100} {"train_loss": -10.398481369018555, "global_step": 184824, "epoch": 1100} {"train_loss": -9.49468994140625, "global_step": 184825, "epoch": 1100} {"train_loss": -10.066693305969238, "global_step": 184826, "epoch": 1100} {"train_loss": -8.865193367004395, "global_step": 184827, "epoch": 1100} {"train_loss": -10.296500205993652, "global_step": 184828, "epoch": 1100} {"train_loss": -8.953134536743164, "global_step": 184829, "epoch": 1100} {"train_loss": -9.411155700683594, "global_step": 184830, "epoch": 1100} {"train_loss": -9.51052474975586, "global_step": 184831, "epoch": 1100} {"train_loss": -10.273360252380371, "global_step": 184832, "epoch": 1100} {"train_loss": -9.587918281555176, "global_step": 184833, "epoch": 1100} {"train_loss": -9.598109245300293, "global_step": 184834, "epoch": 1100} {"train_loss": -10.68625259399414, "global_step": 184835, "epoch": 1100} {"train_loss": -9.141738891601562, "global_step": 184836, "epoch": 1100} {"train_loss": -10.764232635498047, "global_step": 184837, "epoch": 1100} {"train_loss": -9.92947006225586, "global_step": 184838, "epoch": 1100} {"train_loss": -9.988147735595703, "global_step": 184839, "epoch": 1100} {"train_loss": -9.979715347290039, "global_step": 184840, "epoch": 1100} {"train_loss": -10.4586181640625, "global_step": 184841, "epoch": 1100} {"train_loss": -10.144719123840332, "global_step": 184842, "epoch": 1100} {"train_loss": -10.210420608520508, "global_step": 184843, "epoch": 1100} {"train_loss": -10.838265419006348, "global_step": 184844, "epoch": 1100} {"train_loss": -10.414556503295898, "global_step": 184845, "epoch": 1100} {"train_loss": -10.465977668762207, "global_step": 184846, "epoch": 1100} {"train_loss": -10.82813549041748, "global_step": 184847, "epoch": 1100} {"train_loss": -10.815204620361328, "global_step": 184848, "epoch": 1100} {"train_loss": -10.774864196777344, "global_step": 184849, "epoch": 1100} {"train_loss": -10.848274230957031, "global_step": 184850, "epoch": 1100} {"train_loss": -11.039416313171387, "global_step": 184851, "epoch": 1100} {"train_loss": -10.986419677734375, "global_step": 184852, "epoch": 1100} {"train_loss": -10.912618637084961, "global_step": 184853, "epoch": 1100} {"train_loss": -11.009618759155273, "global_step": 184854, "epoch": 1100} {"train_loss": -11.084827423095703, "global_step": 184855, "epoch": 1100} {"train_loss": -10.962596893310547, "global_step": 184856, "epoch": 1100} {"train_loss": -11.010799407958984, "global_step": 184857, "epoch": 1100} {"train_loss": -10.935404777526855, "global_step": 184858, "epoch": 1100} {"train_loss": -11.156960487365723, "global_step": 184859, "epoch": 1100} {"train_loss": -10.9514799118042, "global_step": 184860, "epoch": 1100} {"train_loss": -10.944272994995117, "global_step": 184861, "epoch": 1100} {"train_loss": -11.159610748291016, "global_step": 184862, "epoch": 1100} {"train_loss": -10.926383972167969, "global_step": 184863, "epoch": 1100} {"train_loss": -11.24007511138916, "global_step": 184864, "epoch": 1100} {"train_loss": -11.07282829284668, "global_step": 184865, "epoch": 1100} {"train_loss": -11.115026473999023, "global_step": 184866, "epoch": 1100} {"train_loss": -11.172250747680664, "global_step": 184867, "epoch": 1100} {"train_loss": -11.148091316223145, "global_step": 184868, "epoch": 1100} {"train_loss": -11.201539993286133, "global_step": 184869, "epoch": 1100} {"train_loss": -11.220529556274414, "global_step": 184870, "epoch": 1100} {"train_loss": -11.36978816986084, "global_step": 184871, "epoch": 1100} {"train_loss": -11.224544525146484, "global_step": 184872, "epoch": 1100} {"train_loss": -11.220903396606445, "global_step": 184873, "epoch": 1100} {"train_loss": -11.210073471069336, "global_step": 184874, "epoch": 1100} {"train_loss": -11.089799880981445, "global_step": 184875, "epoch": 1100} {"train_loss": -11.160768508911133, "global_step": 184876, "epoch": 1100} {"train_loss": -11.348182678222656, "global_step": 184877, "epoch": 1100} {"train_loss": -11.31829833984375, "global_step": 184878, "epoch": 1100} {"train_loss": -11.285091400146484, "global_step": 184879, "epoch": 1100} {"train_loss": -11.464176177978516, "global_step": 184880, "epoch": 1100} {"train_loss": -11.448434829711914, "global_step": 184881, "epoch": 1100} {"train_loss": -11.450557708740234, "global_step": 184882, "epoch": 1100} {"train_loss": -11.333358764648438, "global_step": 184883, "epoch": 1100} {"train_loss": -11.432125091552734, "global_step": 184884, "epoch": 1100} {"train_loss": -11.298768043518066, "global_step": 184885, "epoch": 1100} {"train_loss": -11.307699203491211, "global_step": 184886, "epoch": 1100} {"train_loss": -11.510499000549316, "global_step": 184887, "epoch": 1100} {"train_loss": -11.608882904052734, "global_step": 184888, "epoch": 1100} {"train_loss": -11.484947204589844, "global_step": 184889, "epoch": 1100} {"train_loss": -11.574478149414062, "global_step": 184890, "epoch": 1100} {"train_loss": -11.570877075195312, "global_step": 184891, "epoch": 1100} {"train_loss": -11.490157127380371, "global_step": 184892, "epoch": 1100} {"train_loss": -11.525871276855469, "global_step": 184893, "epoch": 1100} {"train_loss": -11.55709457397461, "global_step": 184894, "epoch": 1100} {"train_loss": -11.438592910766602, "global_step": 184895, "epoch": 1100} {"train_loss": -11.465676307678223, "global_step": 184896, "epoch": 1100} {"train_loss": -11.59784984588623, "global_step": 184897, "epoch": 1100} {"train_loss": -11.468010902404785, "global_step": 184898, "epoch": 1100} {"train_loss": -11.346521377563477, "global_step": 184899, "epoch": 1100} {"train_loss": -11.338784217834473, "global_step": 184900, "epoch": 1100} {"train_loss": -11.285383224487305, "global_step": 184901, "epoch": 1100} {"train_loss": -11.465337753295898, "global_step": 184902, "epoch": 1100} {"train_loss": -11.561235427856445, "global_step": 184903, "epoch": 1100} {"train_loss": -11.409137725830078, "global_step": 184904, "epoch": 1100} {"train_loss": -11.583751678466797, "global_step": 184905, "epoch": 1100} {"train_loss": -11.626041412353516, "global_step": 184906, "epoch": 1100} {"train_loss": -11.232669830322266, "global_step": 184907, "epoch": 1100} {"train_loss": -11.039970397949219, "global_step": 184908, "epoch": 1100} {"train_loss": -11.629013061523438, "global_step": 184909, "epoch": 1100} {"train_loss": -11.37282943725586, "global_step": 184910, "epoch": 1100} {"train_loss": -10.795183181762695, "global_step": 184911, "epoch": 1100} {"train_loss": -11.376415252685547, "global_step": 184912, "epoch": 1100} {"train_loss": -11.30163288116455, "global_step": 184913, "epoch": 1100} {"train_loss": -10.819868087768555, "global_step": 184914, "epoch": 1100} {"train_loss": -10.692387580871582, "global_step": 184915, "epoch": 1100} {"train_loss": -10.625349044799805, "global_step": 184916, "epoch": 1100} {"train_loss": -11.463380813598633, "global_step": 184917, "epoch": 1100} {"train_loss": -11.271883964538574, "global_step": 184918, "epoch": 1100} {"train_loss": -11.06313705444336, "global_step": 184919, "epoch": 1100} {"train_loss": -11.71013355255127, "global_step": 184920, "epoch": 1100} {"train_loss": -11.126585006713867, "global_step": 184921, "epoch": 1100} {"train_loss": -11.39453411102295, "global_step": 184922, "epoch": 1100} {"train_loss": -11.466449737548828, "global_step": 184923, "epoch": 1100} {"train_loss": -11.396892547607422, "global_step": 184924, "epoch": 1100} {"train_loss": -11.394701957702637, "global_step": 184925, "epoch": 1100} {"train_loss": -11.114669799804688, "global_step": 184926, "epoch": 1100} {"train_loss": -10.882635116577148, "global_step": 184927, "epoch": 1100} {"train_loss": -11.456482887268066, "global_step": 184928, "epoch": 1100} {"train_loss": -11.477167129516602, "global_step": 184929, "epoch": 1100} {"train_loss": -11.270303726196289, "global_step": 184930, "epoch": 1100} {"train_loss": -11.143798828125, "global_step": 184931, "epoch": 1100} {"train_loss": -11.437779426574707, "global_step": 184932, "epoch": 1100} {"train_loss": -11.404308319091797, "global_step": 184933, "epoch": 1100} {"train_loss": -11.259262084960938, "global_step": 184934, "epoch": 1100} {"train_loss": -11.287785530090332, "global_step": 184935, "epoch": 1100} {"train_loss": -11.118636131286621, "global_step": 184936, "epoch": 1100} {"train_loss": -10.174234390258789, "global_step": 184937, "epoch": 1100} {"train_loss": -11.00227165222168, "global_step": 184938, "epoch": 1100} {"train_loss": -10.736263275146484, "global_step": 184939, "epoch": 1100} {"train_loss": -11.347214698791504, "global_step": 184940, "epoch": 1100} {"train_loss": -10.841650009155273, "global_step": 184941, "epoch": 1100} {"train_loss": -11.36113166809082, "global_step": 184942, "epoch": 1100} {"train_loss": -11.260683059692383, "global_step": 184943, "epoch": 1100} {"train_loss": -11.277111053466797, "global_step": 184944, "epoch": 1100} {"train_loss": -11.008922576904297, "global_step": 184945, "epoch": 1100} {"train_loss": -11.496757507324219, "global_step": 184946, "epoch": 1100} {"train_loss": -11.08372688293457, "global_step": 184947, "epoch": 1100} {"train_loss": -11.306270599365234, "global_step": 184948, "epoch": 1100} {"train_loss": -11.017353057861328, "global_step": 184949, "epoch": 1100} {"train_loss": -11.162874221801758, "global_step": 184950, "epoch": 1100} {"train_loss": -10.847177505493164, "global_step": 184951, "epoch": 1100} {"train_loss": -11.612404823303223, "global_step": 184952, "epoch": 1100} {"train_loss": -10.923925399780273, "global_step": 184953, "epoch": 1100} {"train_loss": -11.132040977478027, "global_step": 184954, "epoch": 1100} {"train_loss": -11.111930847167969, "global_step": 184955, "epoch": 1100} {"train_loss": -10.984405517578125, "global_step": 184956, "epoch": 1100} {"train_loss": -11.50606632232666, "global_step": 184957, "epoch": 1100} {"train_loss": -11.17239761352539, "global_step": 184958, "epoch": 1100} {"train_loss": -10.796257019042969, "global_step": 184959, "epoch": 1100} {"train_loss": -11.109792709350586, "global_step": 184960, "epoch": 1100} {"train_loss": -11.377336502075195, "global_step": 184961, "epoch": 1100} {"train_loss": -11.079242706298828, "global_step": 184962, "epoch": 1100} {"train_loss": -11.189496040344238, "global_step": 184963, "epoch": 1100} {"train_loss": -11.190511703491211, "global_step": 184964, "epoch": 1100} {"train_loss": -11.348440170288086, "global_step": 184965, "epoch": 1100} {"train_loss": -11.263235092163086, "global_step": 184966, "epoch": 1100} {"train_loss": -10.961534505798703, "global_step": 184967, "epoch": 1100, "train/sim_max_reward_0": 0.9841852626683356, "train/sim_max_reward_1": 0.9845892714295738, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.7073746885641253, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.688968333919394, "test/sim_max_reward_4400000": 0.9929213433351756, "test/sim_max_reward_4400001": 0.34489646411047264, "test/sim_max_reward_4400002": 0.09354539605796308, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.8542507694924009, "test/sim_max_reward_4400005": 0.9533072701605865, "test/sim_max_reward_4400006": 0.2735914907606801, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 0.5690280811254868, "test/sim_max_reward_4400009": 0.3638049423281863, "test/sim_max_reward_4400010": 0.977090277598986, "test/sim_max_reward_4400011": 0.9090291677477659, "test/sim_max_reward_4400012": 0.9742815611204239, "test/sim_max_reward_4400013": 0.9725566011095088, "test/sim_max_reward_4400014": 0.5507776782173394, "test/sim_max_reward_4400015": 0.9612943684800968, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.7953188803424488, "test/sim_max_reward_4400019": 0.3470543459148832, "test/sim_max_reward_4400020": 8.943123583871446e-05, "test/sim_max_reward_4400021": 0.9560603450645891, "test/sim_max_reward_4400022": 0.9772672291180399, "test/sim_max_reward_4400023": 0.1498100815272488, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.591766328021657, "test/sim_max_reward_4400026": 0.09670774144238184, "test/sim_max_reward_4400027": 1.0, "test/sim_max_reward_4400028": 0.6531621734838846, "test/sim_max_reward_4400029": 0.9873034838647348, "test/sim_max_reward_4400030": 0.9997123343754327, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.14567620466336847, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 1.0, "test/sim_max_reward_4400036": 0.3765213863391456, "test/sim_max_reward_4400037": 0.9920501090286279, "test/sim_max_reward_4400038": 0.8827024388975893, "test/sim_max_reward_4400039": 0.9814929561029813, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.6425213736564447, "test/sim_max_reward_4400042": 1.0, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.9959703952811034, "test/sim_max_reward_4400045": 0.4672034457106083, "test/sim_max_reward_4400046": 0.3261025395994609, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.7275195927635715, "test/mean_score": 0.6050635056427437, "val_loss": 247938.078125, "train_action_mse_error": 1.280293345451355} {"train_loss": -11.354608535766602, "global_step": 184968, "epoch": 1101} {"train_loss": -11.015666007995605, "global_step": 184969, "epoch": 1101} {"train_loss": -10.892955780029297, "global_step": 184970, "epoch": 1101} {"train_loss": -11.337259292602539, "global_step": 184971, "epoch": 1101} {"train_loss": -10.399675369262695, "global_step": 184972, "epoch": 1101} {"train_loss": -10.996858596801758, "global_step": 184973, "epoch": 1101} {"train_loss": -11.16434383392334, "global_step": 184974, "epoch": 1101} {"train_loss": -11.092513084411621, "global_step": 184975, "epoch": 1101} {"train_loss": -11.270723342895508, "global_step": 184976, "epoch": 1101} {"train_loss": -10.979166030883789, "global_step": 184977, "epoch": 1101} {"train_loss": -11.100452423095703, "global_step": 184978, "epoch": 1101} {"train_loss": -11.04736042022705, "global_step": 184979, "epoch": 1101} {"train_loss": -11.171079635620117, "global_step": 184980, "epoch": 1101} {"train_loss": -11.477144241333008, "global_step": 184981, "epoch": 1101} {"train_loss": -10.803504943847656, "global_step": 184982, "epoch": 1101} {"train_loss": -11.307792663574219, "global_step": 184983, "epoch": 1101} {"train_loss": -11.0302095413208, "global_step": 184984, "epoch": 1101} {"train_loss": -10.961380004882812, "global_step": 184985, "epoch": 1101} {"train_loss": -11.256574630737305, "global_step": 184986, "epoch": 1101} {"train_loss": -10.82104206085205, "global_step": 184987, "epoch": 1101} {"train_loss": -11.215744972229004, "global_step": 184988, "epoch": 1101} {"train_loss": -11.064923286437988, "global_step": 184989, "epoch": 1101} {"train_loss": -11.127452850341797, "global_step": 184990, "epoch": 1101} {"train_loss": -11.342569351196289, "global_step": 184991, "epoch": 1101} {"train_loss": -11.241508483886719, "global_step": 184992, "epoch": 1101} {"train_loss": -11.327749252319336, "global_step": 184993, "epoch": 1101} {"train_loss": -11.169084548950195, "global_step": 184994, "epoch": 1101} {"train_loss": -11.169210433959961, "global_step": 184995, "epoch": 1101} {"train_loss": -11.308683395385742, "global_step": 184996, "epoch": 1101} {"train_loss": -11.507051467895508, "global_step": 184997, "epoch": 1101} {"train_loss": -11.240649223327637, "global_step": 184998, "epoch": 1101} {"train_loss": -11.302923202514648, "global_step": 184999, "epoch": 1101} {"train_loss": -10.95212173461914, "global_step": 185000, "epoch": 1101} {"train_loss": -11.167293548583984, "global_step": 185001, "epoch": 1101} {"train_loss": -11.10246753692627, "global_step": 185002, "epoch": 1101} {"train_loss": -10.81716537475586, "global_step": 185003, "epoch": 1101} {"train_loss": -10.986662864685059, "global_step": 185004, "epoch": 1101} {"train_loss": -10.923837661743164, "global_step": 185005, "epoch": 1101} {"train_loss": -11.134206771850586, "global_step": 185006, "epoch": 1101} {"train_loss": -11.056602478027344, "global_step": 185007, "epoch": 1101} {"train_loss": -10.553370475769043, "global_step": 185008, "epoch": 1101} {"train_loss": -11.09939956665039, "global_step": 185009, "epoch": 1101} {"train_loss": -10.907691955566406, "global_step": 185010, "epoch": 1101} {"train_loss": -10.934613227844238, "global_step": 185011, "epoch": 1101} {"train_loss": -10.692296981811523, "global_step": 185012, "epoch": 1101} {"train_loss": -10.6420316696167, "global_step": 185013, "epoch": 1101} {"train_loss": -10.90234375, "global_step": 185014, "epoch": 1101} {"train_loss": -11.095714569091797, "global_step": 185015, "epoch": 1101} {"train_loss": -11.13886547088623, "global_step": 185016, "epoch": 1101} {"train_loss": -10.962764739990234, "global_step": 185017, "epoch": 1101} {"train_loss": -11.046530723571777, "global_step": 185018, "epoch": 1101} {"train_loss": -11.127424240112305, "global_step": 185019, "epoch": 1101} {"train_loss": -11.037734985351562, "global_step": 185020, "epoch": 1101} {"train_loss": -10.796889305114746, "global_step": 185021, "epoch": 1101} {"train_loss": -10.679522514343262, "global_step": 185022, "epoch": 1101} {"train_loss": -10.716349601745605, "global_step": 185023, "epoch": 1101} {"train_loss": -10.801074028015137, "global_step": 185024, "epoch": 1101} {"train_loss": -10.773740768432617, "global_step": 185025, "epoch": 1101} {"train_loss": -10.703566551208496, "global_step": 185026, "epoch": 1101} {"train_loss": -11.286216735839844, "global_step": 185027, "epoch": 1101} {"train_loss": -10.915433883666992, "global_step": 185028, "epoch": 1101} {"train_loss": -10.686559677124023, "global_step": 185029, "epoch": 1101} {"train_loss": -10.788810729980469, "global_step": 185030, "epoch": 1101} {"train_loss": -10.695377349853516, "global_step": 185031, "epoch": 1101} {"train_loss": -11.125541687011719, "global_step": 185032, "epoch": 1101} {"train_loss": -10.873337745666504, "global_step": 185033, "epoch": 1101} {"train_loss": -11.294553756713867, "global_step": 185034, "epoch": 1101} {"train_loss": -11.130748748779297, "global_step": 185035, "epoch": 1101} {"train_loss": -11.173952102661133, "global_step": 185036, "epoch": 1101} {"train_loss": -11.288396835327148, "global_step": 185037, "epoch": 1101} {"train_loss": -11.026317596435547, "global_step": 185038, "epoch": 1101} {"train_loss": -11.133721351623535, "global_step": 185039, "epoch": 1101} {"train_loss": -10.882770538330078, "global_step": 185040, "epoch": 1101} {"train_loss": -11.298115730285645, "global_step": 185041, "epoch": 1101} {"train_loss": -10.98519229888916, "global_step": 185042, "epoch": 1101} {"train_loss": -11.43685531616211, "global_step": 185043, "epoch": 1101} {"train_loss": -11.267118453979492, "global_step": 185044, "epoch": 1101} {"train_loss": -11.200164794921875, "global_step": 185045, "epoch": 1101} {"train_loss": -11.305789947509766, "global_step": 185046, "epoch": 1101} {"train_loss": -11.145397186279297, "global_step": 185047, "epoch": 1101} {"train_loss": -11.429529190063477, "global_step": 185048, "epoch": 1101} {"train_loss": -11.251981735229492, "global_step": 185049, "epoch": 1101} {"train_loss": -11.155345916748047, "global_step": 185050, "epoch": 1101} {"train_loss": -11.483314514160156, "global_step": 185051, "epoch": 1101} {"train_loss": -11.248852729797363, "global_step": 185052, "epoch": 1101} {"train_loss": -11.518487930297852, "global_step": 185053, "epoch": 1101} {"train_loss": -11.262300491333008, "global_step": 185054, "epoch": 1101} {"train_loss": -11.33857536315918, "global_step": 185055, "epoch": 1101} {"train_loss": -11.526580810546875, "global_step": 185056, "epoch": 1101} {"train_loss": -11.367072105407715, "global_step": 185057, "epoch": 1101} {"train_loss": -11.562764167785645, "global_step": 185058, "epoch": 1101} {"train_loss": -11.235777854919434, "global_step": 185059, "epoch": 1101} {"train_loss": -11.497846603393555, "global_step": 185060, "epoch": 1101} {"train_loss": -11.475248336791992, "global_step": 185061, "epoch": 1101} {"train_loss": -11.1956787109375, "global_step": 185062, "epoch": 1101} {"train_loss": -11.584348678588867, "global_step": 185063, "epoch": 1101} {"train_loss": -11.109026908874512, "global_step": 185064, "epoch": 1101} {"train_loss": -11.470956802368164, "global_step": 185065, "epoch": 1101} {"train_loss": -11.184205055236816, "global_step": 185066, "epoch": 1101} {"train_loss": -11.078737258911133, "global_step": 185067, "epoch": 1101} {"train_loss": -11.531445503234863, "global_step": 185068, "epoch": 1101} {"train_loss": -11.410728454589844, "global_step": 185069, "epoch": 1101} {"train_loss": -11.124383926391602, "global_step": 185070, "epoch": 1101} {"train_loss": -11.619247436523438, "global_step": 185071, "epoch": 1101} {"train_loss": -11.161571502685547, "global_step": 185072, "epoch": 1101} {"train_loss": -10.955024719238281, "global_step": 185073, "epoch": 1101} {"train_loss": -11.312881469726562, "global_step": 185074, "epoch": 1101} {"train_loss": -10.471307754516602, "global_step": 185075, "epoch": 1101} {"train_loss": -11.435785293579102, "global_step": 185076, "epoch": 1101} {"train_loss": -10.433555603027344, "global_step": 185077, "epoch": 1101} {"train_loss": -10.195405960083008, "global_step": 185078, "epoch": 1101} {"train_loss": -11.022726058959961, "global_step": 185079, "epoch": 1101} {"train_loss": -9.819210052490234, "global_step": 185080, "epoch": 1101} {"train_loss": -10.816848754882812, "global_step": 185081, "epoch": 1101} {"train_loss": -10.635473251342773, "global_step": 185082, "epoch": 1101} {"train_loss": -9.61471939086914, "global_step": 185083, "epoch": 1101} {"train_loss": -11.120234489440918, "global_step": 185084, "epoch": 1101} {"train_loss": -9.910287857055664, "global_step": 185085, "epoch": 1101} {"train_loss": -11.115610122680664, "global_step": 185086, "epoch": 1101} {"train_loss": -10.176897048950195, "global_step": 185087, "epoch": 1101} {"train_loss": -10.982978820800781, "global_step": 185088, "epoch": 1101} {"train_loss": -10.704510688781738, "global_step": 185089, "epoch": 1101} {"train_loss": -11.09969711303711, "global_step": 185090, "epoch": 1101} {"train_loss": -10.945951461791992, "global_step": 185091, "epoch": 1101} {"train_loss": -10.981264114379883, "global_step": 185092, "epoch": 1101} {"train_loss": -11.138319969177246, "global_step": 185093, "epoch": 1101} {"train_loss": -11.228095054626465, "global_step": 185094, "epoch": 1101} {"train_loss": -10.913202285766602, "global_step": 185095, "epoch": 1101} {"train_loss": -11.246472358703613, "global_step": 185096, "epoch": 1101} {"train_loss": -11.166097640991211, "global_step": 185097, "epoch": 1101} {"train_loss": -11.063922882080078, "global_step": 185098, "epoch": 1101} {"train_loss": -11.07697582244873, "global_step": 185099, "epoch": 1101} {"train_loss": -11.088384628295898, "global_step": 185100, "epoch": 1101} {"train_loss": -11.156856536865234, "global_step": 185101, "epoch": 1101} {"train_loss": -11.100170135498047, "global_step": 185102, "epoch": 1101} {"train_loss": -11.445996284484863, "global_step": 185103, "epoch": 1101} {"train_loss": -11.175752639770508, "global_step": 185104, "epoch": 1101} {"train_loss": -11.294330596923828, "global_step": 185105, "epoch": 1101} {"train_loss": -11.357061386108398, "global_step": 185106, "epoch": 1101} {"train_loss": -11.395780563354492, "global_step": 185107, "epoch": 1101} {"train_loss": -11.26933479309082, "global_step": 185108, "epoch": 1101} {"train_loss": -11.520700454711914, "global_step": 185109, "epoch": 1101} {"train_loss": -11.426504135131836, "global_step": 185110, "epoch": 1101} {"train_loss": -11.008275985717773, "global_step": 185111, "epoch": 1101} {"train_loss": -11.157909393310547, "global_step": 185112, "epoch": 1101} {"train_loss": -11.012945175170898, "global_step": 185113, "epoch": 1101} {"train_loss": -11.506120681762695, "global_step": 185114, "epoch": 1101} {"train_loss": -11.368542671203613, "global_step": 185115, "epoch": 1101} {"train_loss": -11.366901397705078, "global_step": 185116, "epoch": 1101} {"train_loss": -11.288346290588379, "global_step": 185117, "epoch": 1101} {"train_loss": -11.2935791015625, "global_step": 185118, "epoch": 1101} {"train_loss": -11.220680236816406, "global_step": 185119, "epoch": 1101} {"train_loss": -11.432072639465332, "global_step": 185120, "epoch": 1101} {"train_loss": -11.456193923950195, "global_step": 185121, "epoch": 1101} {"train_loss": -11.538589477539062, "global_step": 185122, "epoch": 1101} {"train_loss": -11.659605979919434, "global_step": 185123, "epoch": 1101} {"train_loss": -11.414552688598633, "global_step": 185124, "epoch": 1101} {"train_loss": -11.470382690429688, "global_step": 185125, "epoch": 1101} {"train_loss": -11.238574028015137, "global_step": 185126, "epoch": 1101} {"train_loss": -11.610325813293457, "global_step": 185127, "epoch": 1101} {"train_loss": -11.703054428100586, "global_step": 185128, "epoch": 1101} {"train_loss": -11.369203567504883, "global_step": 185129, "epoch": 1101} {"train_loss": -11.56832504272461, "global_step": 185130, "epoch": 1101} {"train_loss": -11.469928741455078, "global_step": 185131, "epoch": 1101} {"train_loss": -11.723581314086914, "global_step": 185132, "epoch": 1101} {"train_loss": -11.547321319580078, "global_step": 185133, "epoch": 1101} {"train_loss": -11.587631225585938, "global_step": 185134, "epoch": 1101} {"train_loss": -11.12710398151761, "global_step": 185135, "epoch": 1101, "val_loss": 245032.734375} {"train_loss": -11.510486602783203, "global_step": 185136, "epoch": 1102} {"train_loss": -11.50892448425293, "global_step": 185137, "epoch": 1102} {"train_loss": -11.58832836151123, "global_step": 185138, "epoch": 1102} {"train_loss": -11.643165588378906, "global_step": 185139, "epoch": 1102} {"train_loss": -11.343743324279785, "global_step": 185140, "epoch": 1102} {"train_loss": -11.359602928161621, "global_step": 185141, "epoch": 1102} {"train_loss": -11.332405090332031, "global_step": 185142, "epoch": 1102} {"train_loss": -11.304502487182617, "global_step": 185143, "epoch": 1102} {"train_loss": -11.426895141601562, "global_step": 185144, "epoch": 1102} {"train_loss": -11.33762264251709, "global_step": 185145, "epoch": 1102} {"train_loss": -11.244991302490234, "global_step": 185146, "epoch": 1102} {"train_loss": -11.560247421264648, "global_step": 185147, "epoch": 1102} {"train_loss": -11.346675872802734, "global_step": 185148, "epoch": 1102} {"train_loss": -11.474984169006348, "global_step": 185149, "epoch": 1102} {"train_loss": -11.45042896270752, "global_step": 185150, "epoch": 1102} {"train_loss": -11.001106262207031, "global_step": 185151, "epoch": 1102} {"train_loss": -10.94163703918457, "global_step": 185152, "epoch": 1102} {"train_loss": -11.149487495422363, "global_step": 185153, "epoch": 1102} {"train_loss": -10.951969146728516, "global_step": 185154, "epoch": 1102} {"train_loss": -10.89239501953125, "global_step": 185155, "epoch": 1102} {"train_loss": -11.226032257080078, "global_step": 185156, "epoch": 1102} {"train_loss": -11.2298583984375, "global_step": 185157, "epoch": 1102} {"train_loss": -10.861705780029297, "global_step": 185158, "epoch": 1102} {"train_loss": -11.144628524780273, "global_step": 185159, "epoch": 1102} {"train_loss": -11.38615608215332, "global_step": 185160, "epoch": 1102} {"train_loss": -11.028972625732422, "global_step": 185161, "epoch": 1102} {"train_loss": -10.518943786621094, "global_step": 185162, "epoch": 1102} {"train_loss": -11.324063301086426, "global_step": 185163, "epoch": 1102} {"train_loss": -11.133567810058594, "global_step": 185164, "epoch": 1102} {"train_loss": -10.80722427368164, "global_step": 185165, "epoch": 1102} {"train_loss": -11.019735336303711, "global_step": 185166, "epoch": 1102} {"train_loss": -11.131195068359375, "global_step": 185167, "epoch": 1102} {"train_loss": -10.945610046386719, "global_step": 185168, "epoch": 1102} {"train_loss": -10.501514434814453, "global_step": 185169, "epoch": 1102} {"train_loss": -11.282464027404785, "global_step": 185170, "epoch": 1102} {"train_loss": -11.078389167785645, "global_step": 185171, "epoch": 1102} {"train_loss": -10.708888053894043, "global_step": 185172, "epoch": 1102} {"train_loss": -11.320866584777832, "global_step": 185173, "epoch": 1102} {"train_loss": -10.947542190551758, "global_step": 185174, "epoch": 1102} {"train_loss": -11.062894821166992, "global_step": 185175, "epoch": 1102} {"train_loss": -10.930543899536133, "global_step": 185176, "epoch": 1102} {"train_loss": -10.446626663208008, "global_step": 185177, "epoch": 1102} {"train_loss": -11.268489837646484, "global_step": 185178, "epoch": 1102} {"train_loss": -10.891653060913086, "global_step": 185179, "epoch": 1102} {"train_loss": -10.905879020690918, "global_step": 185180, "epoch": 1102} {"train_loss": -10.684511184692383, "global_step": 185181, "epoch": 1102} {"train_loss": -10.76527214050293, "global_step": 185182, "epoch": 1102} {"train_loss": -10.78079605102539, "global_step": 185183, "epoch": 1102} {"train_loss": -10.720333099365234, "global_step": 185184, "epoch": 1102} {"train_loss": -11.056631088256836, "global_step": 185185, "epoch": 1102} {"train_loss": -10.756834030151367, "global_step": 185186, "epoch": 1102} {"train_loss": -10.904278755187988, "global_step": 185187, "epoch": 1102} {"train_loss": -10.763242721557617, "global_step": 185188, "epoch": 1102} {"train_loss": -11.098161697387695, "global_step": 185189, "epoch": 1102} {"train_loss": -11.004645347595215, "global_step": 185190, "epoch": 1102} {"train_loss": -10.420124053955078, "global_step": 185191, "epoch": 1102} {"train_loss": -10.729477882385254, "global_step": 185192, "epoch": 1102} {"train_loss": -10.908281326293945, "global_step": 185193, "epoch": 1102} {"train_loss": -10.02261734008789, "global_step": 185194, "epoch": 1102} {"train_loss": -11.295970916748047, "global_step": 185195, "epoch": 1102} {"train_loss": -10.15742301940918, "global_step": 185196, "epoch": 1102} {"train_loss": -10.88438606262207, "global_step": 185197, "epoch": 1102} {"train_loss": -10.795469284057617, "global_step": 185198, "epoch": 1102} {"train_loss": -11.089305877685547, "global_step": 185199, "epoch": 1102} {"train_loss": -10.852243423461914, "global_step": 185200, "epoch": 1102} {"train_loss": -10.978879928588867, "global_step": 185201, "epoch": 1102} {"train_loss": -10.729002952575684, "global_step": 185202, "epoch": 1102} {"train_loss": -10.394157409667969, "global_step": 185203, "epoch": 1102} {"train_loss": -10.765703201293945, "global_step": 185204, "epoch": 1102} {"train_loss": -10.345154762268066, "global_step": 185205, "epoch": 1102} {"train_loss": -10.69894027709961, "global_step": 185206, "epoch": 1102} {"train_loss": -10.352252960205078, "global_step": 185207, "epoch": 1102} {"train_loss": -10.536402702331543, "global_step": 185208, "epoch": 1102} {"train_loss": -10.638240814208984, "global_step": 185209, "epoch": 1102} {"train_loss": -10.529672622680664, "global_step": 185210, "epoch": 1102} {"train_loss": -10.565760612487793, "global_step": 185211, "epoch": 1102} {"train_loss": -10.647013664245605, "global_step": 185212, "epoch": 1102} {"train_loss": -10.534711837768555, "global_step": 185213, "epoch": 1102} {"train_loss": -11.002768516540527, "global_step": 185214, "epoch": 1102} {"train_loss": -10.82766342163086, "global_step": 185215, "epoch": 1102} {"train_loss": -10.974660873413086, "global_step": 185216, "epoch": 1102} {"train_loss": -10.927739143371582, "global_step": 185217, "epoch": 1102} {"train_loss": -10.93819522857666, "global_step": 185218, "epoch": 1102} {"train_loss": -11.05333423614502, "global_step": 185219, "epoch": 1102} {"train_loss": -10.906497955322266, "global_step": 185220, "epoch": 1102} {"train_loss": -10.923133850097656, "global_step": 185221, "epoch": 1102} {"train_loss": -11.234527587890625, "global_step": 185222, "epoch": 1102} {"train_loss": -11.122465133666992, "global_step": 185223, "epoch": 1102} {"train_loss": -11.352949142456055, "global_step": 185224, "epoch": 1102} {"train_loss": -11.135180473327637, "global_step": 185225, "epoch": 1102} {"train_loss": -11.088143348693848, "global_step": 185226, "epoch": 1102} {"train_loss": -11.188122749328613, "global_step": 185227, "epoch": 1102} {"train_loss": -11.306747436523438, "global_step": 185228, "epoch": 1102} {"train_loss": -11.23177433013916, "global_step": 185229, "epoch": 1102} {"train_loss": -11.353429794311523, "global_step": 185230, "epoch": 1102} {"train_loss": -11.430662155151367, "global_step": 185231, "epoch": 1102} {"train_loss": -11.15787124633789, "global_step": 185232, "epoch": 1102} {"train_loss": -11.251811981201172, "global_step": 185233, "epoch": 1102} {"train_loss": -11.527261734008789, "global_step": 185234, "epoch": 1102} {"train_loss": -11.35107421875, "global_step": 185235, "epoch": 1102} {"train_loss": -11.334209442138672, "global_step": 185236, "epoch": 1102} {"train_loss": -11.46079158782959, "global_step": 185237, "epoch": 1102} {"train_loss": -11.335189819335938, "global_step": 185238, "epoch": 1102} {"train_loss": -11.467826843261719, "global_step": 185239, "epoch": 1102} {"train_loss": -11.358278274536133, "global_step": 185240, "epoch": 1102} {"train_loss": -11.491342544555664, "global_step": 185241, "epoch": 1102} {"train_loss": -11.48611831665039, "global_step": 185242, "epoch": 1102} {"train_loss": -11.403739929199219, "global_step": 185243, "epoch": 1102} {"train_loss": -11.517374992370605, "global_step": 185244, "epoch": 1102} {"train_loss": -11.473810195922852, "global_step": 185245, "epoch": 1102} {"train_loss": -11.278932571411133, "global_step": 185246, "epoch": 1102} {"train_loss": -11.444315910339355, "global_step": 185247, "epoch": 1102} {"train_loss": -11.401073455810547, "global_step": 185248, "epoch": 1102} {"train_loss": -11.72525405883789, "global_step": 185249, "epoch": 1102} {"train_loss": -11.523466110229492, "global_step": 185250, "epoch": 1102} {"train_loss": -11.782333374023438, "global_step": 185251, "epoch": 1102} {"train_loss": -11.56916618347168, "global_step": 185252, "epoch": 1102} {"train_loss": -11.690601348876953, "global_step": 185253, "epoch": 1102} {"train_loss": -11.760705947875977, "global_step": 185254, "epoch": 1102} {"train_loss": -11.70434856414795, "global_step": 185255, "epoch": 1102} {"train_loss": -11.621135711669922, "global_step": 185256, "epoch": 1102} {"train_loss": -11.722382545471191, "global_step": 185257, "epoch": 1102} {"train_loss": -11.71255111694336, "global_step": 185258, "epoch": 1102} {"train_loss": -11.653075218200684, "global_step": 185259, "epoch": 1102} {"train_loss": -11.690896987915039, "global_step": 185260, "epoch": 1102} {"train_loss": -11.522310256958008, "global_step": 185261, "epoch": 1102} {"train_loss": -11.746902465820312, "global_step": 185262, "epoch": 1102} {"train_loss": -11.704834938049316, "global_step": 185263, "epoch": 1102} {"train_loss": -11.659195899963379, "global_step": 185264, "epoch": 1102} {"train_loss": -11.914807319641113, "global_step": 185265, "epoch": 1102} {"train_loss": -11.66384506225586, "global_step": 185266, "epoch": 1102} {"train_loss": -11.534746170043945, "global_step": 185267, "epoch": 1102} {"train_loss": -11.758138656616211, "global_step": 185268, "epoch": 1102} {"train_loss": -11.555831909179688, "global_step": 185269, "epoch": 1102} {"train_loss": -11.664911270141602, "global_step": 185270, "epoch": 1102} {"train_loss": -11.150547981262207, "global_step": 185271, "epoch": 1102} {"train_loss": -11.241811752319336, "global_step": 185272, "epoch": 1102} {"train_loss": -10.453371047973633, "global_step": 185273, "epoch": 1102} {"train_loss": -10.302892684936523, "global_step": 185274, "epoch": 1102} {"train_loss": -10.205682754516602, "global_step": 185275, "epoch": 1102} {"train_loss": -9.907160758972168, "global_step": 185276, "epoch": 1102} {"train_loss": -7.759071350097656, "global_step": 185277, "epoch": 1102} {"train_loss": -9.465322494506836, "global_step": 185278, "epoch": 1102} {"train_loss": -7.673741340637207, "global_step": 185279, "epoch": 1102} {"train_loss": -8.642099380493164, "global_step": 185280, "epoch": 1102} {"train_loss": -8.156850814819336, "global_step": 185281, "epoch": 1102} {"train_loss": -9.656242370605469, "global_step": 185282, "epoch": 1102} {"train_loss": -7.325162887573242, "global_step": 185283, "epoch": 1102} {"train_loss": -8.665401458740234, "global_step": 185284, "epoch": 1102} {"train_loss": -8.380965232849121, "global_step": 185285, "epoch": 1102} {"train_loss": -9.482841491699219, "global_step": 185286, "epoch": 1102} {"train_loss": -10.45606803894043, "global_step": 185287, "epoch": 1102} {"train_loss": -8.498756408691406, "global_step": 185288, "epoch": 1102} {"train_loss": -10.675168991088867, "global_step": 185289, "epoch": 1102} {"train_loss": -9.005823135375977, "global_step": 185290, "epoch": 1102} {"train_loss": -10.529288291931152, "global_step": 185291, "epoch": 1102} {"train_loss": -9.730932235717773, "global_step": 185292, "epoch": 1102} {"train_loss": -10.429302215576172, "global_step": 185293, "epoch": 1102} {"train_loss": -10.520379066467285, "global_step": 185294, "epoch": 1102} {"train_loss": -10.310043334960938, "global_step": 185295, "epoch": 1102} {"train_loss": -10.739466667175293, "global_step": 185296, "epoch": 1102} {"train_loss": -9.823369026184082, "global_step": 185297, "epoch": 1102} {"train_loss": -10.487916946411133, "global_step": 185298, "epoch": 1102} {"train_loss": -10.827521324157715, "global_step": 185299, "epoch": 1102} {"train_loss": -10.430133819580078, "global_step": 185300, "epoch": 1102} {"train_loss": -10.821046829223633, "global_step": 185301, "epoch": 1102} {"train_loss": -10.842899322509766, "global_step": 185302, "epoch": 1102} {"train_loss": -10.886265737669808, "global_step": 185303, "epoch": 1102, "val_loss": 236199.984375} {"train_loss": -10.657392501831055, "global_step": 185304, "epoch": 1103} {"train_loss": -10.918375015258789, "global_step": 185305, "epoch": 1103} {"train_loss": -10.886171340942383, "global_step": 185306, "epoch": 1103} {"train_loss": -10.966654777526855, "global_step": 185307, "epoch": 1103} {"train_loss": -10.81826400756836, "global_step": 185308, "epoch": 1103} {"train_loss": -10.921026229858398, "global_step": 185309, "epoch": 1103} {"train_loss": -11.096647262573242, "global_step": 185310, "epoch": 1103} {"train_loss": -10.892120361328125, "global_step": 185311, "epoch": 1103} {"train_loss": -11.047657012939453, "global_step": 185312, "epoch": 1103} {"train_loss": -10.996161460876465, "global_step": 185313, "epoch": 1103} {"train_loss": -11.139915466308594, "global_step": 185314, "epoch": 1103} {"train_loss": -11.070772171020508, "global_step": 185315, "epoch": 1103} {"train_loss": -11.06273078918457, "global_step": 185316, "epoch": 1103} {"train_loss": -11.220415115356445, "global_step": 185317, "epoch": 1103} {"train_loss": -11.042520523071289, "global_step": 185318, "epoch": 1103} {"train_loss": -10.881731033325195, "global_step": 185319, "epoch": 1103} {"train_loss": -11.13393497467041, "global_step": 185320, "epoch": 1103} {"train_loss": -11.171895980834961, "global_step": 185321, "epoch": 1103} {"train_loss": -11.0617036819458, "global_step": 185322, "epoch": 1103} {"train_loss": -11.350897789001465, "global_step": 185323, "epoch": 1103} {"train_loss": -11.264076232910156, "global_step": 185324, "epoch": 1103} {"train_loss": -11.148002624511719, "global_step": 185325, "epoch": 1103} {"train_loss": -11.33462142944336, "global_step": 185326, "epoch": 1103} {"train_loss": -11.274919509887695, "global_step": 185327, "epoch": 1103} {"train_loss": -11.138742446899414, "global_step": 185328, "epoch": 1103} {"train_loss": -11.134771347045898, "global_step": 185329, "epoch": 1103} {"train_loss": -11.260589599609375, "global_step": 185330, "epoch": 1103} {"train_loss": -11.308238983154297, "global_step": 185331, "epoch": 1103} {"train_loss": -11.422857284545898, "global_step": 185332, "epoch": 1103} {"train_loss": -11.232054710388184, "global_step": 185333, "epoch": 1103} {"train_loss": -11.278299331665039, "global_step": 185334, "epoch": 1103} {"train_loss": -11.149721145629883, "global_step": 185335, "epoch": 1103} {"train_loss": -11.210063934326172, "global_step": 185336, "epoch": 1103} {"train_loss": -11.240196228027344, "global_step": 185337, "epoch": 1103} {"train_loss": -11.419178009033203, "global_step": 185338, "epoch": 1103} {"train_loss": -11.396337509155273, "global_step": 185339, "epoch": 1103} {"train_loss": -11.282567977905273, "global_step": 185340, "epoch": 1103} {"train_loss": -11.556755065917969, "global_step": 185341, "epoch": 1103} {"train_loss": -11.29830551147461, "global_step": 185342, "epoch": 1103} {"train_loss": -11.546253204345703, "global_step": 185343, "epoch": 1103} {"train_loss": -11.341035842895508, "global_step": 185344, "epoch": 1103} {"train_loss": -11.438969612121582, "global_step": 185345, "epoch": 1103} {"train_loss": -11.322132110595703, "global_step": 185346, "epoch": 1103} {"train_loss": -11.506860733032227, "global_step": 185347, "epoch": 1103} {"train_loss": -11.474014282226562, "global_step": 185348, "epoch": 1103} {"train_loss": -11.51384162902832, "global_step": 185349, "epoch": 1103} {"train_loss": -11.559774398803711, "global_step": 185350, "epoch": 1103} {"train_loss": -11.488962173461914, "global_step": 185351, "epoch": 1103} {"train_loss": -11.392873764038086, "global_step": 185352, "epoch": 1103} {"train_loss": -11.24703311920166, "global_step": 185353, "epoch": 1103} {"train_loss": -11.386704444885254, "global_step": 185354, "epoch": 1103} {"train_loss": -11.595147132873535, "global_step": 185355, "epoch": 1103} {"train_loss": -11.519432067871094, "global_step": 185356, "epoch": 1103} {"train_loss": -11.453539848327637, "global_step": 185357, "epoch": 1103} {"train_loss": -11.575529098510742, "global_step": 185358, "epoch": 1103} {"train_loss": -11.291646003723145, "global_step": 185359, "epoch": 1103} {"train_loss": -11.509968757629395, "global_step": 185360, "epoch": 1103} {"train_loss": -11.682262420654297, "global_step": 185361, "epoch": 1103} {"train_loss": -11.481647491455078, "global_step": 185362, "epoch": 1103} {"train_loss": -11.220996856689453, "global_step": 185363, "epoch": 1103} {"train_loss": -10.744848251342773, "global_step": 185364, "epoch": 1103} {"train_loss": -11.048922538757324, "global_step": 185365, "epoch": 1103} {"train_loss": -11.326045989990234, "global_step": 185366, "epoch": 1103} {"train_loss": -11.143450736999512, "global_step": 185367, "epoch": 1103} {"train_loss": -10.446362495422363, "global_step": 185368, "epoch": 1103} {"train_loss": -10.464739799499512, "global_step": 185369, "epoch": 1103} {"train_loss": -11.258885383605957, "global_step": 185370, "epoch": 1103} {"train_loss": -11.308771133422852, "global_step": 185371, "epoch": 1103} {"train_loss": -11.50440788269043, "global_step": 185372, "epoch": 1103} {"train_loss": -11.140336990356445, "global_step": 185373, "epoch": 1103} {"train_loss": -11.400957107543945, "global_step": 185374, "epoch": 1103} {"train_loss": -11.472623825073242, "global_step": 185375, "epoch": 1103} {"train_loss": -11.193169593811035, "global_step": 185376, "epoch": 1103} {"train_loss": -11.476256370544434, "global_step": 185377, "epoch": 1103} {"train_loss": -10.851669311523438, "global_step": 185378, "epoch": 1103} {"train_loss": -10.98029613494873, "global_step": 185379, "epoch": 1103} {"train_loss": -10.821720123291016, "global_step": 185380, "epoch": 1103} {"train_loss": -11.084602355957031, "global_step": 185381, "epoch": 1103} {"train_loss": -10.98371696472168, "global_step": 185382, "epoch": 1103} {"train_loss": -11.16093635559082, "global_step": 185383, "epoch": 1103} {"train_loss": -11.371466636657715, "global_step": 185384, "epoch": 1103} {"train_loss": -10.433969497680664, "global_step": 185385, "epoch": 1103} {"train_loss": -11.309515953063965, "global_step": 185386, "epoch": 1103} {"train_loss": -10.334558486938477, "global_step": 185387, "epoch": 1103} {"train_loss": -11.091377258300781, "global_step": 185388, "epoch": 1103} {"train_loss": -10.466609954833984, "global_step": 185389, "epoch": 1103} {"train_loss": -10.428167343139648, "global_step": 185390, "epoch": 1103} {"train_loss": -10.552433013916016, "global_step": 185391, "epoch": 1103} {"train_loss": -9.815683364868164, "global_step": 185392, "epoch": 1103} {"train_loss": -9.64206314086914, "global_step": 185393, "epoch": 1103} {"train_loss": -8.741409301757812, "global_step": 185394, "epoch": 1103} {"train_loss": -10.26112174987793, "global_step": 185395, "epoch": 1103} {"train_loss": -10.045429229736328, "global_step": 185396, "epoch": 1103} {"train_loss": -9.641945838928223, "global_step": 185397, "epoch": 1103} {"train_loss": -10.292054176330566, "global_step": 185398, "epoch": 1103} {"train_loss": -10.094945907592773, "global_step": 185399, "epoch": 1103} {"train_loss": -9.902362823486328, "global_step": 185400, "epoch": 1103} {"train_loss": -10.68867301940918, "global_step": 185401, "epoch": 1103} {"train_loss": -9.241471290588379, "global_step": 185402, "epoch": 1103} {"train_loss": -10.82514762878418, "global_step": 185403, "epoch": 1103} {"train_loss": -9.802571296691895, "global_step": 185404, "epoch": 1103} {"train_loss": -10.402807235717773, "global_step": 185405, "epoch": 1103} {"train_loss": -10.435053825378418, "global_step": 185406, "epoch": 1103} {"train_loss": -10.622126579284668, "global_step": 185407, "epoch": 1103} {"train_loss": -10.235539436340332, "global_step": 185408, "epoch": 1103} {"train_loss": -10.881593704223633, "global_step": 185409, "epoch": 1103} {"train_loss": -10.239611625671387, "global_step": 185410, "epoch": 1103} {"train_loss": -10.771363258361816, "global_step": 185411, "epoch": 1103} {"train_loss": -10.581798553466797, "global_step": 185412, "epoch": 1103} {"train_loss": -10.820764541625977, "global_step": 185413, "epoch": 1103} {"train_loss": -10.895273208618164, "global_step": 185414, "epoch": 1103} {"train_loss": -10.454263687133789, "global_step": 185415, "epoch": 1103} {"train_loss": -10.996925354003906, "global_step": 185416, "epoch": 1103} {"train_loss": -10.912421226501465, "global_step": 185417, "epoch": 1103} {"train_loss": -10.97262954711914, "global_step": 185418, "epoch": 1103} {"train_loss": -11.1727876663208, "global_step": 185419, "epoch": 1103} {"train_loss": -10.928643226623535, "global_step": 185420, "epoch": 1103} {"train_loss": -11.046407699584961, "global_step": 185421, "epoch": 1103} {"train_loss": -10.995477676391602, "global_step": 185422, "epoch": 1103} {"train_loss": -10.886099815368652, "global_step": 185423, "epoch": 1103} {"train_loss": -10.883247375488281, "global_step": 185424, "epoch": 1103} {"train_loss": -11.039823532104492, "global_step": 185425, "epoch": 1103} {"train_loss": -11.225271224975586, "global_step": 185426, "epoch": 1103} {"train_loss": -11.051794052124023, "global_step": 185427, "epoch": 1103} {"train_loss": -11.0247163772583, "global_step": 185428, "epoch": 1103} {"train_loss": -11.229516983032227, "global_step": 185429, "epoch": 1103} {"train_loss": -10.932836532592773, "global_step": 185430, "epoch": 1103} {"train_loss": -11.226292610168457, "global_step": 185431, "epoch": 1103} {"train_loss": -11.004534721374512, "global_step": 185432, "epoch": 1103} {"train_loss": -11.109365463256836, "global_step": 185433, "epoch": 1103} {"train_loss": -11.015926361083984, "global_step": 185434, "epoch": 1103} {"train_loss": -11.431551933288574, "global_step": 185435, "epoch": 1103} {"train_loss": -10.93997573852539, "global_step": 185436, "epoch": 1103} {"train_loss": -11.265966415405273, "global_step": 185437, "epoch": 1103} {"train_loss": -11.128326416015625, "global_step": 185438, "epoch": 1103} {"train_loss": -10.999129295349121, "global_step": 185439, "epoch": 1103} {"train_loss": -10.999201774597168, "global_step": 185440, "epoch": 1103} {"train_loss": -11.287712097167969, "global_step": 185441, "epoch": 1103} {"train_loss": -11.112726211547852, "global_step": 185442, "epoch": 1103} {"train_loss": -11.32797908782959, "global_step": 185443, "epoch": 1103} {"train_loss": -11.203019142150879, "global_step": 185444, "epoch": 1103} {"train_loss": -11.356462478637695, "global_step": 185445, "epoch": 1103} {"train_loss": -11.33365249633789, "global_step": 185446, "epoch": 1103} {"train_loss": -11.34665298461914, "global_step": 185447, "epoch": 1103} {"train_loss": -11.237713813781738, "global_step": 185448, "epoch": 1103} {"train_loss": -11.29971694946289, "global_step": 185449, "epoch": 1103} {"train_loss": -11.209440231323242, "global_step": 185450, "epoch": 1103} {"train_loss": -11.462870597839355, "global_step": 185451, "epoch": 1103} {"train_loss": -11.384185791015625, "global_step": 185452, "epoch": 1103} {"train_loss": -11.501508712768555, "global_step": 185453, "epoch": 1103} {"train_loss": -11.428030014038086, "global_step": 185454, "epoch": 1103} {"train_loss": -11.471881866455078, "global_step": 185455, "epoch": 1103} {"train_loss": -11.536650657653809, "global_step": 185456, "epoch": 1103} {"train_loss": -11.223650932312012, "global_step": 185457, "epoch": 1103} {"train_loss": -11.28519344329834, "global_step": 185458, "epoch": 1103} {"train_loss": -11.361064910888672, "global_step": 185459, "epoch": 1103} {"train_loss": -11.430400848388672, "global_step": 185460, "epoch": 1103} {"train_loss": -11.065580368041992, "global_step": 185461, "epoch": 1103} {"train_loss": -11.612183570861816, "global_step": 185462, "epoch": 1103} {"train_loss": -11.488218307495117, "global_step": 185463, "epoch": 1103} {"train_loss": -11.298654556274414, "global_step": 185464, "epoch": 1103} {"train_loss": -11.492697715759277, "global_step": 185465, "epoch": 1103} {"train_loss": -11.24537181854248, "global_step": 185466, "epoch": 1103} {"train_loss": -11.280304908752441, "global_step": 185467, "epoch": 1103} {"train_loss": -11.45142650604248, "global_step": 185468, "epoch": 1103} {"train_loss": -11.323589324951172, "global_step": 185469, "epoch": 1103} {"train_loss": -11.620033264160156, "global_step": 185470, "epoch": 1103} {"train_loss": -11.053458287602378, "global_step": 185471, "epoch": 1103, "val_loss": 250241.484375} {"train_loss": -11.386476516723633, "global_step": 185472, "epoch": 1104} {"train_loss": -11.447412490844727, "global_step": 185473, "epoch": 1104} {"train_loss": -11.200225830078125, "global_step": 185474, "epoch": 1104} {"train_loss": -11.574316024780273, "global_step": 185475, "epoch": 1104} {"train_loss": -11.441767692565918, "global_step": 185476, "epoch": 1104} {"train_loss": -11.488718032836914, "global_step": 185477, "epoch": 1104} {"train_loss": -11.432710647583008, "global_step": 185478, "epoch": 1104} {"train_loss": -11.401881217956543, "global_step": 185479, "epoch": 1104} {"train_loss": -11.630945205688477, "global_step": 185480, "epoch": 1104} {"train_loss": -11.59717082977295, "global_step": 185481, "epoch": 1104} {"train_loss": -11.653803825378418, "global_step": 185482, "epoch": 1104} {"train_loss": -11.729998588562012, "global_step": 185483, "epoch": 1104} {"train_loss": -11.860506057739258, "global_step": 185484, "epoch": 1104} {"train_loss": -11.626313209533691, "global_step": 185485, "epoch": 1104} {"train_loss": -11.382078170776367, "global_step": 185486, "epoch": 1104} {"train_loss": -11.389925003051758, "global_step": 185487, "epoch": 1104} {"train_loss": -11.418224334716797, "global_step": 185488, "epoch": 1104} {"train_loss": -11.657015800476074, "global_step": 185489, "epoch": 1104} {"train_loss": -11.614791870117188, "global_step": 185490, "epoch": 1104} {"train_loss": -11.056209564208984, "global_step": 185491, "epoch": 1104} {"train_loss": -11.311500549316406, "global_step": 185492, "epoch": 1104} {"train_loss": -11.452189445495605, "global_step": 185493, "epoch": 1104} {"train_loss": -11.159147262573242, "global_step": 185494, "epoch": 1104} {"train_loss": -11.537606239318848, "global_step": 185495, "epoch": 1104} {"train_loss": -11.224435806274414, "global_step": 185496, "epoch": 1104} {"train_loss": -10.813106536865234, "global_step": 185497, "epoch": 1104} {"train_loss": -10.765634536743164, "global_step": 185498, "epoch": 1104} {"train_loss": -11.222829818725586, "global_step": 185499, "epoch": 1104} {"train_loss": -10.171630859375, "global_step": 185500, "epoch": 1104} {"train_loss": -10.801966667175293, "global_step": 185501, "epoch": 1104} {"train_loss": -10.764181137084961, "global_step": 185502, "epoch": 1104} {"train_loss": -10.244462013244629, "global_step": 185503, "epoch": 1104} {"train_loss": -11.274648666381836, "global_step": 185504, "epoch": 1104} {"train_loss": -10.995207786560059, "global_step": 185505, "epoch": 1104} {"train_loss": -11.197624206542969, "global_step": 185506, "epoch": 1104} {"train_loss": -11.249506950378418, "global_step": 185507, "epoch": 1104} {"train_loss": -11.103973388671875, "global_step": 185508, "epoch": 1104} {"train_loss": -11.204822540283203, "global_step": 185509, "epoch": 1104} {"train_loss": -11.127573013305664, "global_step": 185510, "epoch": 1104} {"train_loss": -11.124911308288574, "global_step": 185511, "epoch": 1104} {"train_loss": -11.471552848815918, "global_step": 185512, "epoch": 1104} {"train_loss": -11.328397750854492, "global_step": 185513, "epoch": 1104} {"train_loss": -11.497520446777344, "global_step": 185514, "epoch": 1104} {"train_loss": -11.258054733276367, "global_step": 185515, "epoch": 1104} {"train_loss": -10.999565124511719, "global_step": 185516, "epoch": 1104} {"train_loss": -11.269684791564941, "global_step": 185517, "epoch": 1104} {"train_loss": -11.093782424926758, "global_step": 185518, "epoch": 1104} {"train_loss": -11.411998748779297, "global_step": 185519, "epoch": 1104} {"train_loss": -10.888174057006836, "global_step": 185520, "epoch": 1104} {"train_loss": -11.393436431884766, "global_step": 185521, "epoch": 1104} {"train_loss": -10.904363632202148, "global_step": 185522, "epoch": 1104} {"train_loss": -11.314228057861328, "global_step": 185523, "epoch": 1104} {"train_loss": -10.728423118591309, "global_step": 185524, "epoch": 1104} {"train_loss": -10.580366134643555, "global_step": 185525, "epoch": 1104} {"train_loss": -11.21957778930664, "global_step": 185526, "epoch": 1104} {"train_loss": -10.534126281738281, "global_step": 185527, "epoch": 1104} {"train_loss": -10.525251388549805, "global_step": 185528, "epoch": 1104} {"train_loss": -10.992401123046875, "global_step": 185529, "epoch": 1104} {"train_loss": -10.555303573608398, "global_step": 185530, "epoch": 1104} {"train_loss": -10.809109687805176, "global_step": 185531, "epoch": 1104} {"train_loss": -10.938843727111816, "global_step": 185532, "epoch": 1104} {"train_loss": -10.433147430419922, "global_step": 185533, "epoch": 1104} {"train_loss": -11.051492691040039, "global_step": 185534, "epoch": 1104} {"train_loss": -10.493560791015625, "global_step": 185535, "epoch": 1104} {"train_loss": -11.04630184173584, "global_step": 185536, "epoch": 1104} {"train_loss": -10.64773178100586, "global_step": 185537, "epoch": 1104} {"train_loss": -10.630496978759766, "global_step": 185538, "epoch": 1104} {"train_loss": -10.251524925231934, "global_step": 185539, "epoch": 1104} {"train_loss": -10.985591888427734, "global_step": 185540, "epoch": 1104} {"train_loss": -10.959598541259766, "global_step": 185541, "epoch": 1104} {"train_loss": -11.160669326782227, "global_step": 185542, "epoch": 1104} {"train_loss": -11.256473541259766, "global_step": 185543, "epoch": 1104} {"train_loss": -11.172778129577637, "global_step": 185544, "epoch": 1104} {"train_loss": -10.97765064239502, "global_step": 185545, "epoch": 1104} {"train_loss": -11.153888702392578, "global_step": 185546, "epoch": 1104} {"train_loss": -10.945947647094727, "global_step": 185547, "epoch": 1104} {"train_loss": -11.025224685668945, "global_step": 185548, "epoch": 1104} {"train_loss": -11.236538887023926, "global_step": 185549, "epoch": 1104} {"train_loss": -11.070450782775879, "global_step": 185550, "epoch": 1104} {"train_loss": -11.129189491271973, "global_step": 185551, "epoch": 1104} {"train_loss": -11.16988754272461, "global_step": 185552, "epoch": 1104} {"train_loss": -10.956607818603516, "global_step": 185553, "epoch": 1104} {"train_loss": -11.154898643493652, "global_step": 185554, "epoch": 1104} {"train_loss": -10.734573364257812, "global_step": 185555, "epoch": 1104} {"train_loss": -11.047504425048828, "global_step": 185556, "epoch": 1104} {"train_loss": -10.781094551086426, "global_step": 185557, "epoch": 1104} {"train_loss": -10.901556015014648, "global_step": 185558, "epoch": 1104} {"train_loss": -11.472475051879883, "global_step": 185559, "epoch": 1104} {"train_loss": -11.221227645874023, "global_step": 185560, "epoch": 1104} {"train_loss": -11.339882850646973, "global_step": 185561, "epoch": 1104} {"train_loss": -11.168599128723145, "global_step": 185562, "epoch": 1104} {"train_loss": -11.348560333251953, "global_step": 185563, "epoch": 1104} {"train_loss": -11.133901596069336, "global_step": 185564, "epoch": 1104} {"train_loss": -11.487031936645508, "global_step": 185565, "epoch": 1104} {"train_loss": -11.155223846435547, "global_step": 185566, "epoch": 1104} {"train_loss": -11.229324340820312, "global_step": 185567, "epoch": 1104} {"train_loss": -11.420802116394043, "global_step": 185568, "epoch": 1104} {"train_loss": -11.505696296691895, "global_step": 185569, "epoch": 1104} {"train_loss": -11.456790924072266, "global_step": 185570, "epoch": 1104} {"train_loss": -11.4901704788208, "global_step": 185571, "epoch": 1104} {"train_loss": -11.36314582824707, "global_step": 185572, "epoch": 1104} {"train_loss": -11.240045547485352, "global_step": 185573, "epoch": 1104} {"train_loss": -11.51764965057373, "global_step": 185574, "epoch": 1104} {"train_loss": -11.105854988098145, "global_step": 185575, "epoch": 1104} {"train_loss": -11.282297134399414, "global_step": 185576, "epoch": 1104} {"train_loss": -10.994271278381348, "global_step": 185577, "epoch": 1104} {"train_loss": -11.26577377319336, "global_step": 185578, "epoch": 1104} {"train_loss": -11.310136795043945, "global_step": 185579, "epoch": 1104} {"train_loss": -11.314167022705078, "global_step": 185580, "epoch": 1104} {"train_loss": -11.253652572631836, "global_step": 185581, "epoch": 1104} {"train_loss": -11.23583698272705, "global_step": 185582, "epoch": 1104} {"train_loss": -11.49807071685791, "global_step": 185583, "epoch": 1104} {"train_loss": -11.483731269836426, "global_step": 185584, "epoch": 1104} {"train_loss": -11.4537935256958, "global_step": 185585, "epoch": 1104} {"train_loss": -11.34511947631836, "global_step": 185586, "epoch": 1104} {"train_loss": -11.415329933166504, "global_step": 185587, "epoch": 1104} {"train_loss": -11.271791458129883, "global_step": 185588, "epoch": 1104} {"train_loss": -11.299427032470703, "global_step": 185589, "epoch": 1104} {"train_loss": -11.466670989990234, "global_step": 185590, "epoch": 1104} {"train_loss": -11.0247163772583, "global_step": 185591, "epoch": 1104} {"train_loss": -11.126510620117188, "global_step": 185592, "epoch": 1104} {"train_loss": -11.006898880004883, "global_step": 185593, "epoch": 1104} {"train_loss": -10.579416275024414, "global_step": 185594, "epoch": 1104} {"train_loss": -9.321052551269531, "global_step": 185595, "epoch": 1104} {"train_loss": -10.711282730102539, "global_step": 185596, "epoch": 1104} {"train_loss": -10.088335037231445, "global_step": 185597, "epoch": 1104} {"train_loss": -10.384819030761719, "global_step": 185598, "epoch": 1104} {"train_loss": -10.571098327636719, "global_step": 185599, "epoch": 1104} {"train_loss": -10.470012664794922, "global_step": 185600, "epoch": 1104} {"train_loss": -11.331449508666992, "global_step": 185601, "epoch": 1104} {"train_loss": -10.31978988647461, "global_step": 185602, "epoch": 1104} {"train_loss": -11.548120498657227, "global_step": 185603, "epoch": 1104} {"train_loss": -10.392189025878906, "global_step": 185604, "epoch": 1104} {"train_loss": -11.298847198486328, "global_step": 185605, "epoch": 1104} {"train_loss": -11.00424861907959, "global_step": 185606, "epoch": 1104} {"train_loss": -11.176919937133789, "global_step": 185607, "epoch": 1104} {"train_loss": -10.993147850036621, "global_step": 185608, "epoch": 1104} {"train_loss": -10.851107597351074, "global_step": 185609, "epoch": 1104} {"train_loss": -10.571000099182129, "global_step": 185610, "epoch": 1104} {"train_loss": -11.283334732055664, "global_step": 185611, "epoch": 1104} {"train_loss": -10.944046974182129, "global_step": 185612, "epoch": 1104} {"train_loss": -11.119343757629395, "global_step": 185613, "epoch": 1104} {"train_loss": -10.946197509765625, "global_step": 185614, "epoch": 1104} {"train_loss": -11.254961967468262, "global_step": 185615, "epoch": 1104} {"train_loss": -10.574156761169434, "global_step": 185616, "epoch": 1104} {"train_loss": -11.37122631072998, "global_step": 185617, "epoch": 1104} {"train_loss": -10.824431419372559, "global_step": 185618, "epoch": 1104} {"train_loss": -11.369073867797852, "global_step": 185619, "epoch": 1104} {"train_loss": -10.839133262634277, "global_step": 185620, "epoch": 1104} {"train_loss": -11.262659072875977, "global_step": 185621, "epoch": 1104} {"train_loss": -11.177602767944336, "global_step": 185622, "epoch": 1104} {"train_loss": -11.263720512390137, "global_step": 185623, "epoch": 1104} {"train_loss": -11.03879165649414, "global_step": 185624, "epoch": 1104} {"train_loss": -11.219409942626953, "global_step": 185625, "epoch": 1104} {"train_loss": -11.157167434692383, "global_step": 185626, "epoch": 1104} {"train_loss": -11.422548294067383, "global_step": 185627, "epoch": 1104} {"train_loss": -10.903755187988281, "global_step": 185628, "epoch": 1104} {"train_loss": -10.902750015258789, "global_step": 185629, "epoch": 1104} {"train_loss": -11.021540641784668, "global_step": 185630, "epoch": 1104} {"train_loss": -11.07498550415039, "global_step": 185631, "epoch": 1104} {"train_loss": -10.79010009765625, "global_step": 185632, "epoch": 1104} {"train_loss": -10.742654800415039, "global_step": 185633, "epoch": 1104} {"train_loss": -10.674988746643066, "global_step": 185634, "epoch": 1104} {"train_loss": -10.797372817993164, "global_step": 185635, "epoch": 1104} {"train_loss": -11.112279891967773, "global_step": 185636, "epoch": 1104} {"train_loss": -10.907468795776367, "global_step": 185637, "epoch": 1104} {"train_loss": -11.26473617553711, "global_step": 185638, "epoch": 1104} {"train_loss": -11.098226121493749, "global_step": 185639, "epoch": 1104, "val_loss": 248735.375} {"train_loss": -11.092679977416992, "global_step": 185640, "epoch": 1105} {"train_loss": -10.864265441894531, "global_step": 185641, "epoch": 1105} {"train_loss": -11.455472946166992, "global_step": 185642, "epoch": 1105} {"train_loss": -10.829562187194824, "global_step": 185643, "epoch": 1105} {"train_loss": -11.165802001953125, "global_step": 185644, "epoch": 1105} {"train_loss": -10.681593894958496, "global_step": 185645, "epoch": 1105} {"train_loss": -11.088813781738281, "global_step": 185646, "epoch": 1105} {"train_loss": -10.849543571472168, "global_step": 185647, "epoch": 1105} {"train_loss": -11.292545318603516, "global_step": 185648, "epoch": 1105} {"train_loss": -10.666690826416016, "global_step": 185649, "epoch": 1105} {"train_loss": -11.237815856933594, "global_step": 185650, "epoch": 1105} {"train_loss": -11.101678848266602, "global_step": 185651, "epoch": 1105} {"train_loss": -11.202986717224121, "global_step": 185652, "epoch": 1105} {"train_loss": -10.747674942016602, "global_step": 185653, "epoch": 1105} {"train_loss": -11.108148574829102, "global_step": 185654, "epoch": 1105} {"train_loss": -11.107518196105957, "global_step": 185655, "epoch": 1105} {"train_loss": -10.83090877532959, "global_step": 185656, "epoch": 1105} {"train_loss": -10.931670188903809, "global_step": 185657, "epoch": 1105} {"train_loss": -11.165355682373047, "global_step": 185658, "epoch": 1105} {"train_loss": -10.859299659729004, "global_step": 185659, "epoch": 1105} {"train_loss": -10.993513107299805, "global_step": 185660, "epoch": 1105} {"train_loss": -10.939754486083984, "global_step": 185661, "epoch": 1105} {"train_loss": -11.201098442077637, "global_step": 185662, "epoch": 1105} {"train_loss": -10.904036521911621, "global_step": 185663, "epoch": 1105} {"train_loss": -11.33441162109375, "global_step": 185664, "epoch": 1105} {"train_loss": -10.991731643676758, "global_step": 185665, "epoch": 1105} {"train_loss": -11.436009407043457, "global_step": 185666, "epoch": 1105} {"train_loss": -11.032777786254883, "global_step": 185667, "epoch": 1105} {"train_loss": -11.307406425476074, "global_step": 185668, "epoch": 1105} {"train_loss": -11.231017112731934, "global_step": 185669, "epoch": 1105} {"train_loss": -10.944366455078125, "global_step": 185670, "epoch": 1105} {"train_loss": -10.603821754455566, "global_step": 185671, "epoch": 1105} {"train_loss": -10.87763500213623, "global_step": 185672, "epoch": 1105} {"train_loss": -9.350987434387207, "global_step": 185673, "epoch": 1105} {"train_loss": -10.062334060668945, "global_step": 185674, "epoch": 1105} {"train_loss": -11.087165832519531, "global_step": 185675, "epoch": 1105} {"train_loss": -9.46257209777832, "global_step": 185676, "epoch": 1105} {"train_loss": -10.76450252532959, "global_step": 185677, "epoch": 1105} {"train_loss": -10.4000244140625, "global_step": 185678, "epoch": 1105} {"train_loss": -10.568632125854492, "global_step": 185679, "epoch": 1105} {"train_loss": -10.466440200805664, "global_step": 185680, "epoch": 1105} {"train_loss": -10.894458770751953, "global_step": 185681, "epoch": 1105} {"train_loss": -10.887016296386719, "global_step": 185682, "epoch": 1105} {"train_loss": -10.760359764099121, "global_step": 185683, "epoch": 1105} {"train_loss": -10.67916488647461, "global_step": 185684, "epoch": 1105} {"train_loss": -10.442073822021484, "global_step": 185685, "epoch": 1105} {"train_loss": -10.675114631652832, "global_step": 185686, "epoch": 1105} {"train_loss": -9.957099914550781, "global_step": 185687, "epoch": 1105} {"train_loss": -11.047863960266113, "global_step": 185688, "epoch": 1105} {"train_loss": -10.234670639038086, "global_step": 185689, "epoch": 1105} {"train_loss": -10.357250213623047, "global_step": 185690, "epoch": 1105} {"train_loss": -10.998437881469727, "global_step": 185691, "epoch": 1105} {"train_loss": -10.516494750976562, "global_step": 185692, "epoch": 1105} {"train_loss": -11.287643432617188, "global_step": 185693, "epoch": 1105} {"train_loss": -10.58147144317627, "global_step": 185694, "epoch": 1105} {"train_loss": -11.210575103759766, "global_step": 185695, "epoch": 1105} {"train_loss": -11.010963439941406, "global_step": 185696, "epoch": 1105} {"train_loss": -10.807849884033203, "global_step": 185697, "epoch": 1105} {"train_loss": -10.971302032470703, "global_step": 185698, "epoch": 1105} {"train_loss": -10.98016357421875, "global_step": 185699, "epoch": 1105} {"train_loss": -10.72290325164795, "global_step": 185700, "epoch": 1105} {"train_loss": -10.989923477172852, "global_step": 185701, "epoch": 1105} {"train_loss": -10.035524368286133, "global_step": 185702, "epoch": 1105} {"train_loss": -11.287469863891602, "global_step": 185703, "epoch": 1105} {"train_loss": -10.17434310913086, "global_step": 185704, "epoch": 1105} {"train_loss": -11.00096321105957, "global_step": 185705, "epoch": 1105} {"train_loss": -10.699755668640137, "global_step": 185706, "epoch": 1105} {"train_loss": -10.815025329589844, "global_step": 185707, "epoch": 1105} {"train_loss": -10.902055740356445, "global_step": 185708, "epoch": 1105} {"train_loss": -11.13010025024414, "global_step": 185709, "epoch": 1105} {"train_loss": -10.943714141845703, "global_step": 185710, "epoch": 1105} {"train_loss": -11.172307968139648, "global_step": 185711, "epoch": 1105} {"train_loss": -10.812374114990234, "global_step": 185712, "epoch": 1105} {"train_loss": -10.871338844299316, "global_step": 185713, "epoch": 1105} {"train_loss": -11.0919189453125, "global_step": 185714, "epoch": 1105} {"train_loss": -11.020795822143555, "global_step": 185715, "epoch": 1105} {"train_loss": -10.940428733825684, "global_step": 185716, "epoch": 1105} {"train_loss": -10.97352409362793, "global_step": 185717, "epoch": 1105} {"train_loss": -11.229994773864746, "global_step": 185718, "epoch": 1105} {"train_loss": -11.013601303100586, "global_step": 185719, "epoch": 1105} {"train_loss": -11.20020580291748, "global_step": 185720, "epoch": 1105} {"train_loss": -11.256702423095703, "global_step": 185721, "epoch": 1105} {"train_loss": -11.112354278564453, "global_step": 185722, "epoch": 1105} {"train_loss": -11.003936767578125, "global_step": 185723, "epoch": 1105} {"train_loss": -11.120410919189453, "global_step": 185724, "epoch": 1105} {"train_loss": -11.195940017700195, "global_step": 185725, "epoch": 1105} {"train_loss": -11.280431747436523, "global_step": 185726, "epoch": 1105} {"train_loss": -10.827409744262695, "global_step": 185727, "epoch": 1105} {"train_loss": -11.430423736572266, "global_step": 185728, "epoch": 1105} {"train_loss": -11.201064109802246, "global_step": 185729, "epoch": 1105} {"train_loss": -11.091827392578125, "global_step": 185730, "epoch": 1105} {"train_loss": -11.369133949279785, "global_step": 185731, "epoch": 1105} {"train_loss": -11.115721702575684, "global_step": 185732, "epoch": 1105} {"train_loss": -11.137506484985352, "global_step": 185733, "epoch": 1105} {"train_loss": -11.227472305297852, "global_step": 185734, "epoch": 1105} {"train_loss": -11.200593948364258, "global_step": 185735, "epoch": 1105} {"train_loss": -11.415002822875977, "global_step": 185736, "epoch": 1105} {"train_loss": -11.2814359664917, "global_step": 185737, "epoch": 1105} {"train_loss": -11.375354766845703, "global_step": 185738, "epoch": 1105} {"train_loss": -11.355656623840332, "global_step": 185739, "epoch": 1105} {"train_loss": -11.534273147583008, "global_step": 185740, "epoch": 1105} {"train_loss": -11.578624725341797, "global_step": 185741, "epoch": 1105} {"train_loss": -11.619677543640137, "global_step": 185742, "epoch": 1105} {"train_loss": -11.48153305053711, "global_step": 185743, "epoch": 1105} {"train_loss": -11.4136962890625, "global_step": 185744, "epoch": 1105} {"train_loss": -11.505121231079102, "global_step": 185745, "epoch": 1105} {"train_loss": -11.626623153686523, "global_step": 185746, "epoch": 1105} {"train_loss": -11.590437889099121, "global_step": 185747, "epoch": 1105} {"train_loss": -11.46524429321289, "global_step": 185748, "epoch": 1105} {"train_loss": -11.523460388183594, "global_step": 185749, "epoch": 1105} {"train_loss": -11.625261306762695, "global_step": 185750, "epoch": 1105} {"train_loss": -11.76364803314209, "global_step": 185751, "epoch": 1105} {"train_loss": -11.75184440612793, "global_step": 185752, "epoch": 1105} {"train_loss": -11.588360786437988, "global_step": 185753, "epoch": 1105} {"train_loss": -11.781171798706055, "global_step": 185754, "epoch": 1105} {"train_loss": -11.653618812561035, "global_step": 185755, "epoch": 1105} {"train_loss": -11.510540008544922, "global_step": 185756, "epoch": 1105} {"train_loss": -11.721742630004883, "global_step": 185757, "epoch": 1105} {"train_loss": -11.319881439208984, "global_step": 185758, "epoch": 1105} {"train_loss": -11.59701156616211, "global_step": 185759, "epoch": 1105} {"train_loss": -11.737131118774414, "global_step": 185760, "epoch": 1105} {"train_loss": -11.365516662597656, "global_step": 185761, "epoch": 1105} {"train_loss": -11.45425796508789, "global_step": 185762, "epoch": 1105} {"train_loss": -11.575910568237305, "global_step": 185763, "epoch": 1105} {"train_loss": -11.536161422729492, "global_step": 185764, "epoch": 1105} {"train_loss": -11.70752239227295, "global_step": 185765, "epoch": 1105} {"train_loss": -11.640646934509277, "global_step": 185766, "epoch": 1105} {"train_loss": -11.820170402526855, "global_step": 185767, "epoch": 1105} {"train_loss": -11.260826110839844, "global_step": 185768, "epoch": 1105} {"train_loss": -11.3802490234375, "global_step": 185769, "epoch": 1105} {"train_loss": -11.214435577392578, "global_step": 185770, "epoch": 1105} {"train_loss": -11.516998291015625, "global_step": 185771, "epoch": 1105} {"train_loss": -10.801435470581055, "global_step": 185772, "epoch": 1105} {"train_loss": -10.929343223571777, "global_step": 185773, "epoch": 1105} {"train_loss": -10.897307395935059, "global_step": 185774, "epoch": 1105} {"train_loss": -11.022771835327148, "global_step": 185775, "epoch": 1105} {"train_loss": -11.400455474853516, "global_step": 185776, "epoch": 1105} {"train_loss": -9.945889472961426, "global_step": 185777, "epoch": 1105} {"train_loss": -10.429973602294922, "global_step": 185778, "epoch": 1105} {"train_loss": -11.532988548278809, "global_step": 185779, "epoch": 1105} {"train_loss": -10.182974815368652, "global_step": 185780, "epoch": 1105} {"train_loss": -10.96487045288086, "global_step": 185781, "epoch": 1105} {"train_loss": -10.41649055480957, "global_step": 185782, "epoch": 1105} {"train_loss": -9.709466934204102, "global_step": 185783, "epoch": 1105} {"train_loss": -11.08113956451416, "global_step": 185784, "epoch": 1105} {"train_loss": -10.097332954406738, "global_step": 185785, "epoch": 1105} {"train_loss": -11.149377822875977, "global_step": 185786, "epoch": 1105} {"train_loss": -10.170879364013672, "global_step": 185787, "epoch": 1105} {"train_loss": -10.955110549926758, "global_step": 185788, "epoch": 1105} {"train_loss": -10.207714080810547, "global_step": 185789, "epoch": 1105} {"train_loss": -9.696176528930664, "global_step": 185790, "epoch": 1105} {"train_loss": -10.179455757141113, "global_step": 185791, "epoch": 1105} {"train_loss": -10.917801856994629, "global_step": 185792, "epoch": 1105} {"train_loss": -9.451663970947266, "global_step": 185793, "epoch": 1105} {"train_loss": -10.474586486816406, "global_step": 185794, "epoch": 1105} {"train_loss": -8.974448204040527, "global_step": 185795, "epoch": 1105} {"train_loss": -10.23041820526123, "global_step": 185796, "epoch": 1105} {"train_loss": -9.223325729370117, "global_step": 185797, "epoch": 1105} {"train_loss": -9.189857482910156, "global_step": 185798, "epoch": 1105} {"train_loss": -10.268292427062988, "global_step": 185799, "epoch": 1105} {"train_loss": -9.643840789794922, "global_step": 185800, "epoch": 1105} {"train_loss": -9.91707706451416, "global_step": 185801, "epoch": 1105} {"train_loss": -9.94217300415039, "global_step": 185802, "epoch": 1105} {"train_loss": -9.648036003112793, "global_step": 185803, "epoch": 1105} {"train_loss": -10.244187355041504, "global_step": 185804, "epoch": 1105} {"train_loss": -9.687154769897461, "global_step": 185805, "epoch": 1105} {"train_loss": -9.891297340393066, "global_step": 185806, "epoch": 1105} {"train_loss": -10.906578779220581, "global_step": 185807, "epoch": 1105, "val_loss": 243340.78125, "train_action_mse_error": 0.3930358588695526} {"train_loss": -9.469636917114258, "global_step": 185808, "epoch": 1106} {"train_loss": -9.872699737548828, "global_step": 185809, "epoch": 1106} {"train_loss": -9.740179061889648, "global_step": 185810, "epoch": 1106} {"train_loss": -9.619117736816406, "global_step": 185811, "epoch": 1106} {"train_loss": -10.02214241027832, "global_step": 185812, "epoch": 1106} {"train_loss": -9.783321380615234, "global_step": 185813, "epoch": 1106} {"train_loss": -10.304927825927734, "global_step": 185814, "epoch": 1106} {"train_loss": -10.33161449432373, "global_step": 185815, "epoch": 1106} {"train_loss": -9.764893531799316, "global_step": 185816, "epoch": 1106} {"train_loss": -10.72183609008789, "global_step": 185817, "epoch": 1106} {"train_loss": -10.431058883666992, "global_step": 185818, "epoch": 1106} {"train_loss": -10.151172637939453, "global_step": 185819, "epoch": 1106} {"train_loss": -10.529179573059082, "global_step": 185820, "epoch": 1106} {"train_loss": -10.406473159790039, "global_step": 185821, "epoch": 1106} {"train_loss": -10.563891410827637, "global_step": 185822, "epoch": 1106} {"train_loss": -10.79560375213623, "global_step": 185823, "epoch": 1106} {"train_loss": -10.632213592529297, "global_step": 185824, "epoch": 1106} {"train_loss": -10.557062149047852, "global_step": 185825, "epoch": 1106} {"train_loss": -10.956811904907227, "global_step": 185826, "epoch": 1106} {"train_loss": -10.797452926635742, "global_step": 185827, "epoch": 1106} {"train_loss": -10.766335487365723, "global_step": 185828, "epoch": 1106} {"train_loss": -10.919417381286621, "global_step": 185829, "epoch": 1106} {"train_loss": -10.901453018188477, "global_step": 185830, "epoch": 1106} {"train_loss": -10.810745239257812, "global_step": 185831, "epoch": 1106} {"train_loss": -10.951845169067383, "global_step": 185832, "epoch": 1106} {"train_loss": -11.085984230041504, "global_step": 185833, "epoch": 1106} {"train_loss": -10.979836463928223, "global_step": 185834, "epoch": 1106} {"train_loss": -11.157384872436523, "global_step": 185835, "epoch": 1106} {"train_loss": -11.118589401245117, "global_step": 185836, "epoch": 1106} {"train_loss": -11.088221549987793, "global_step": 185837, "epoch": 1106} {"train_loss": -11.225992202758789, "global_step": 185838, "epoch": 1106} {"train_loss": -11.126561164855957, "global_step": 185839, "epoch": 1106} {"train_loss": -11.151897430419922, "global_step": 185840, "epoch": 1106} {"train_loss": -11.089557647705078, "global_step": 185841, "epoch": 1106} {"train_loss": -11.242501258850098, "global_step": 185842, "epoch": 1106} {"train_loss": -11.129571914672852, "global_step": 185843, "epoch": 1106} {"train_loss": -11.016244888305664, "global_step": 185844, "epoch": 1106} {"train_loss": -11.030471801757812, "global_step": 185845, "epoch": 1106} {"train_loss": -11.288131713867188, "global_step": 185846, "epoch": 1106} {"train_loss": -11.08259105682373, "global_step": 185847, "epoch": 1106} {"train_loss": -11.13325309753418, "global_step": 185848, "epoch": 1106} {"train_loss": -11.080389976501465, "global_step": 185849, "epoch": 1106} {"train_loss": -11.355360984802246, "global_step": 185850, "epoch": 1106} {"train_loss": -11.100975036621094, "global_step": 185851, "epoch": 1106} {"train_loss": -11.437740325927734, "global_step": 185852, "epoch": 1106} {"train_loss": -11.454065322875977, "global_step": 185853, "epoch": 1106} {"train_loss": -11.228647232055664, "global_step": 185854, "epoch": 1106} {"train_loss": -11.387483596801758, "global_step": 185855, "epoch": 1106} {"train_loss": -11.31096076965332, "global_step": 185856, "epoch": 1106} {"train_loss": -11.444602966308594, "global_step": 185857, "epoch": 1106} {"train_loss": -11.398014068603516, "global_step": 185858, "epoch": 1106} {"train_loss": -11.38747787475586, "global_step": 185859, "epoch": 1106} {"train_loss": -11.508158683776855, "global_step": 185860, "epoch": 1106} {"train_loss": -11.568817138671875, "global_step": 185861, "epoch": 1106} {"train_loss": -11.425618171691895, "global_step": 185862, "epoch": 1106} {"train_loss": -11.520723342895508, "global_step": 185863, "epoch": 1106} {"train_loss": -11.213794708251953, "global_step": 185864, "epoch": 1106} {"train_loss": -11.455108642578125, "global_step": 185865, "epoch": 1106} {"train_loss": -11.4422025680542, "global_step": 185866, "epoch": 1106} {"train_loss": -11.302580833435059, "global_step": 185867, "epoch": 1106} {"train_loss": -11.526418685913086, "global_step": 185868, "epoch": 1106} {"train_loss": -11.553211212158203, "global_step": 185869, "epoch": 1106} {"train_loss": -11.454601287841797, "global_step": 185870, "epoch": 1106} {"train_loss": -11.426824569702148, "global_step": 185871, "epoch": 1106} {"train_loss": -11.67040729522705, "global_step": 185872, "epoch": 1106} {"train_loss": -11.656304359436035, "global_step": 185873, "epoch": 1106} {"train_loss": -11.726689338684082, "global_step": 185874, "epoch": 1106} {"train_loss": -11.45400619506836, "global_step": 185875, "epoch": 1106} {"train_loss": -11.503122329711914, "global_step": 185876, "epoch": 1106} {"train_loss": -11.613677024841309, "global_step": 185877, "epoch": 1106} {"train_loss": -11.641280174255371, "global_step": 185878, "epoch": 1106} {"train_loss": -11.5638427734375, "global_step": 185879, "epoch": 1106} {"train_loss": -11.683917999267578, "global_step": 185880, "epoch": 1106} {"train_loss": -11.434438705444336, "global_step": 185881, "epoch": 1106} {"train_loss": -11.310083389282227, "global_step": 185882, "epoch": 1106} {"train_loss": -11.740434646606445, "global_step": 185883, "epoch": 1106} {"train_loss": -11.651799201965332, "global_step": 185884, "epoch": 1106} {"train_loss": -11.686174392700195, "global_step": 185885, "epoch": 1106} {"train_loss": -10.913920402526855, "global_step": 185886, "epoch": 1106} {"train_loss": -10.244048118591309, "global_step": 185887, "epoch": 1106} {"train_loss": -10.28091049194336, "global_step": 185888, "epoch": 1106} {"train_loss": -11.090222358703613, "global_step": 185889, "epoch": 1106} {"train_loss": -11.527053833007812, "global_step": 185890, "epoch": 1106} {"train_loss": -10.961356163024902, "global_step": 185891, "epoch": 1106} {"train_loss": -10.109151840209961, "global_step": 185892, "epoch": 1106} {"train_loss": -10.168779373168945, "global_step": 185893, "epoch": 1106} {"train_loss": -10.825677871704102, "global_step": 185894, "epoch": 1106} {"train_loss": -9.010154724121094, "global_step": 185895, "epoch": 1106} {"train_loss": -9.746358871459961, "global_step": 185896, "epoch": 1106} {"train_loss": -7.999484062194824, "global_step": 185897, "epoch": 1106} {"train_loss": -8.623678207397461, "global_step": 185898, "epoch": 1106} {"train_loss": -7.966569900512695, "global_step": 185899, "epoch": 1106} {"train_loss": -8.516916275024414, "global_step": 185900, "epoch": 1106} {"train_loss": -9.97910213470459, "global_step": 185901, "epoch": 1106} {"train_loss": -8.324827194213867, "global_step": 185902, "epoch": 1106} {"train_loss": -8.257351875305176, "global_step": 185903, "epoch": 1106} {"train_loss": -8.201658248901367, "global_step": 185904, "epoch": 1106} {"train_loss": -10.163187026977539, "global_step": 185905, "epoch": 1106} {"train_loss": -9.14847469329834, "global_step": 185906, "epoch": 1106} {"train_loss": -10.753918647766113, "global_step": 185907, "epoch": 1106} {"train_loss": -9.598915100097656, "global_step": 185908, "epoch": 1106} {"train_loss": -9.942927360534668, "global_step": 185909, "epoch": 1106} {"train_loss": -10.194912910461426, "global_step": 185910, "epoch": 1106} {"train_loss": -10.341514587402344, "global_step": 185911, "epoch": 1106} {"train_loss": -10.215331077575684, "global_step": 185912, "epoch": 1106} {"train_loss": -10.742746353149414, "global_step": 185913, "epoch": 1106} {"train_loss": -10.662939071655273, "global_step": 185914, "epoch": 1106} {"train_loss": -10.838459014892578, "global_step": 185915, "epoch": 1106} {"train_loss": -10.624553680419922, "global_step": 185916, "epoch": 1106} {"train_loss": -10.956901550292969, "global_step": 185917, "epoch": 1106} {"train_loss": -10.74163818359375, "global_step": 185918, "epoch": 1106} {"train_loss": -10.80265998840332, "global_step": 185919, "epoch": 1106} {"train_loss": -10.875319480895996, "global_step": 185920, "epoch": 1106} {"train_loss": -10.753290176391602, "global_step": 185921, "epoch": 1106} {"train_loss": -10.748979568481445, "global_step": 185922, "epoch": 1106} {"train_loss": -10.719642639160156, "global_step": 185923, "epoch": 1106} {"train_loss": -10.846199035644531, "global_step": 185924, "epoch": 1106} {"train_loss": -10.664487838745117, "global_step": 185925, "epoch": 1106} {"train_loss": -10.924942970275879, "global_step": 185926, "epoch": 1106} {"train_loss": -11.030834197998047, "global_step": 185927, "epoch": 1106} {"train_loss": -10.769393920898438, "global_step": 185928, "epoch": 1106} {"train_loss": -10.834796905517578, "global_step": 185929, "epoch": 1106} {"train_loss": -10.935867309570312, "global_step": 185930, "epoch": 1106} {"train_loss": -10.806548118591309, "global_step": 185931, "epoch": 1106} {"train_loss": -10.993925094604492, "global_step": 185932, "epoch": 1106} {"train_loss": -11.226236343383789, "global_step": 185933, "epoch": 1106} {"train_loss": -11.011995315551758, "global_step": 185934, "epoch": 1106} {"train_loss": -11.042688369750977, "global_step": 185935, "epoch": 1106} {"train_loss": -10.924654006958008, "global_step": 185936, "epoch": 1106} {"train_loss": -10.991779327392578, "global_step": 185937, "epoch": 1106} {"train_loss": -11.266958236694336, "global_step": 185938, "epoch": 1106} {"train_loss": -11.099383354187012, "global_step": 185939, "epoch": 1106} {"train_loss": -11.268441200256348, "global_step": 185940, "epoch": 1106} {"train_loss": -11.180811882019043, "global_step": 185941, "epoch": 1106} {"train_loss": -11.087004661560059, "global_step": 185942, "epoch": 1106} {"train_loss": -11.175422668457031, "global_step": 185943, "epoch": 1106} {"train_loss": -11.292632102966309, "global_step": 185944, "epoch": 1106} {"train_loss": -11.034721374511719, "global_step": 185945, "epoch": 1106} {"train_loss": -11.275402069091797, "global_step": 185946, "epoch": 1106} {"train_loss": -11.335929870605469, "global_step": 185947, "epoch": 1106} {"train_loss": -11.253035545349121, "global_step": 185948, "epoch": 1106} {"train_loss": -11.473310470581055, "global_step": 185949, "epoch": 1106} {"train_loss": -11.313684463500977, "global_step": 185950, "epoch": 1106} {"train_loss": -11.392034530639648, "global_step": 185951, "epoch": 1106} {"train_loss": -11.315866470336914, "global_step": 185952, "epoch": 1106} {"train_loss": -11.24537467956543, "global_step": 185953, "epoch": 1106} {"train_loss": -11.450553894042969, "global_step": 185954, "epoch": 1106} {"train_loss": -11.323751449584961, "global_step": 185955, "epoch": 1106} {"train_loss": -11.326637268066406, "global_step": 185956, "epoch": 1106} {"train_loss": -11.515565872192383, "global_step": 185957, "epoch": 1106} {"train_loss": -11.347304344177246, "global_step": 185958, "epoch": 1106} {"train_loss": -11.434349060058594, "global_step": 185959, "epoch": 1106} {"train_loss": -11.517023086547852, "global_step": 185960, "epoch": 1106} {"train_loss": -11.52855396270752, "global_step": 185961, "epoch": 1106} {"train_loss": -11.466817855834961, "global_step": 185962, "epoch": 1106} {"train_loss": -11.432275772094727, "global_step": 185963, "epoch": 1106} {"train_loss": -11.684220314025879, "global_step": 185964, "epoch": 1106} {"train_loss": -11.316198348999023, "global_step": 185965, "epoch": 1106} {"train_loss": -11.311319351196289, "global_step": 185966, "epoch": 1106} {"train_loss": -11.253254890441895, "global_step": 185967, "epoch": 1106} {"train_loss": -11.29269027709961, "global_step": 185968, "epoch": 1106} {"train_loss": -11.365409851074219, "global_step": 185969, "epoch": 1106} {"train_loss": -11.187610626220703, "global_step": 185970, "epoch": 1106} {"train_loss": -11.409931182861328, "global_step": 185971, "epoch": 1106} {"train_loss": -11.064810752868652, "global_step": 185972, "epoch": 1106} {"train_loss": -11.103869438171387, "global_step": 185973, "epoch": 1106} {"train_loss": -11.253609657287598, "global_step": 185974, "epoch": 1106} {"train_loss": -10.871478398640951, "global_step": 185975, "epoch": 1106, "val_loss": 242787.078125} {"train_loss": -11.292672157287598, "global_step": 185976, "epoch": 1107} {"train_loss": -10.856539726257324, "global_step": 185977, "epoch": 1107} {"train_loss": -11.357040405273438, "global_step": 185978, "epoch": 1107} {"train_loss": -11.136129379272461, "global_step": 185979, "epoch": 1107} {"train_loss": -10.514739036560059, "global_step": 185980, "epoch": 1107} {"train_loss": -11.140493392944336, "global_step": 185981, "epoch": 1107} {"train_loss": -11.014337539672852, "global_step": 185982, "epoch": 1107} {"train_loss": -10.679056167602539, "global_step": 185983, "epoch": 1107} {"train_loss": -10.911388397216797, "global_step": 185984, "epoch": 1107} {"train_loss": -10.415987968444824, "global_step": 185985, "epoch": 1107} {"train_loss": -9.358489990234375, "global_step": 185986, "epoch": 1107} {"train_loss": -10.691729545593262, "global_step": 185987, "epoch": 1107} {"train_loss": -10.392169952392578, "global_step": 185988, "epoch": 1107} {"train_loss": -9.56718635559082, "global_step": 185989, "epoch": 1107} {"train_loss": -11.205304145812988, "global_step": 185990, "epoch": 1107} {"train_loss": -9.469972610473633, "global_step": 185991, "epoch": 1107} {"train_loss": -11.140108108520508, "global_step": 185992, "epoch": 1107} {"train_loss": -9.47164535522461, "global_step": 185993, "epoch": 1107} {"train_loss": -10.921655654907227, "global_step": 185994, "epoch": 1107} {"train_loss": -10.681985855102539, "global_step": 185995, "epoch": 1107} {"train_loss": -10.811566352844238, "global_step": 185996, "epoch": 1107} {"train_loss": -10.998539924621582, "global_step": 185997, "epoch": 1107} {"train_loss": -11.109100341796875, "global_step": 185998, "epoch": 1107} {"train_loss": -10.912700653076172, "global_step": 185999, "epoch": 1107} {"train_loss": -11.116183280944824, "global_step": 186000, "epoch": 1107} {"train_loss": -11.099286079406738, "global_step": 186001, "epoch": 1107} {"train_loss": -11.269566535949707, "global_step": 186002, "epoch": 1107} {"train_loss": -11.280332565307617, "global_step": 186003, "epoch": 1107} {"train_loss": -10.992756843566895, "global_step": 186004, "epoch": 1107} {"train_loss": -11.212017059326172, "global_step": 186005, "epoch": 1107} {"train_loss": -10.958780288696289, "global_step": 186006, "epoch": 1107} {"train_loss": -11.032526016235352, "global_step": 186007, "epoch": 1107} {"train_loss": -11.255073547363281, "global_step": 186008, "epoch": 1107} {"train_loss": -11.031580924987793, "global_step": 186009, "epoch": 1107} {"train_loss": -11.244329452514648, "global_step": 186010, "epoch": 1107} {"train_loss": -11.095029830932617, "global_step": 186011, "epoch": 1107} {"train_loss": -11.142518997192383, "global_step": 186012, "epoch": 1107} {"train_loss": -11.207916259765625, "global_step": 186013, "epoch": 1107} {"train_loss": -11.312969207763672, "global_step": 186014, "epoch": 1107} {"train_loss": -11.181819915771484, "global_step": 186015, "epoch": 1107} {"train_loss": -11.293530464172363, "global_step": 186016, "epoch": 1107} {"train_loss": -10.97824478149414, "global_step": 186017, "epoch": 1107} {"train_loss": -11.241251945495605, "global_step": 186018, "epoch": 1107} {"train_loss": -10.876750946044922, "global_step": 186019, "epoch": 1107} {"train_loss": -11.074621200561523, "global_step": 186020, "epoch": 1107} {"train_loss": -11.263425827026367, "global_step": 186021, "epoch": 1107} {"train_loss": -11.152045249938965, "global_step": 186022, "epoch": 1107} {"train_loss": -11.404335975646973, "global_step": 186023, "epoch": 1107} {"train_loss": -10.910764694213867, "global_step": 186024, "epoch": 1107} {"train_loss": -11.17858600616455, "global_step": 186025, "epoch": 1107} {"train_loss": -11.373241424560547, "global_step": 186026, "epoch": 1107} {"train_loss": -11.290456771850586, "global_step": 186027, "epoch": 1107} {"train_loss": -11.3407564163208, "global_step": 186028, "epoch": 1107} {"train_loss": -11.274913787841797, "global_step": 186029, "epoch": 1107} {"train_loss": -11.338451385498047, "global_step": 186030, "epoch": 1107} {"train_loss": -11.23858642578125, "global_step": 186031, "epoch": 1107} {"train_loss": -11.318185806274414, "global_step": 186032, "epoch": 1107} {"train_loss": -11.459403038024902, "global_step": 186033, "epoch": 1107} {"train_loss": -11.04400634765625, "global_step": 186034, "epoch": 1107} {"train_loss": -11.464405059814453, "global_step": 186035, "epoch": 1107} {"train_loss": -11.193265914916992, "global_step": 186036, "epoch": 1107} {"train_loss": -11.549043655395508, "global_step": 186037, "epoch": 1107} {"train_loss": -11.384845733642578, "global_step": 186038, "epoch": 1107} {"train_loss": -11.335084915161133, "global_step": 186039, "epoch": 1107} {"train_loss": -11.24982738494873, "global_step": 186040, "epoch": 1107} {"train_loss": -11.244728088378906, "global_step": 186041, "epoch": 1107} {"train_loss": -11.502424240112305, "global_step": 186042, "epoch": 1107} {"train_loss": -11.212251663208008, "global_step": 186043, "epoch": 1107} {"train_loss": -11.399763107299805, "global_step": 186044, "epoch": 1107} {"train_loss": -11.23245620727539, "global_step": 186045, "epoch": 1107} {"train_loss": -11.29958724975586, "global_step": 186046, "epoch": 1107} {"train_loss": -11.19204330444336, "global_step": 186047, "epoch": 1107} {"train_loss": -11.07396411895752, "global_step": 186048, "epoch": 1107} {"train_loss": -11.737503051757812, "global_step": 186049, "epoch": 1107} {"train_loss": -11.137616157531738, "global_step": 186050, "epoch": 1107} {"train_loss": -11.44044303894043, "global_step": 186051, "epoch": 1107} {"train_loss": -11.537120819091797, "global_step": 186052, "epoch": 1107} {"train_loss": -11.300970077514648, "global_step": 186053, "epoch": 1107} {"train_loss": -11.77863883972168, "global_step": 186054, "epoch": 1107} {"train_loss": -11.368013381958008, "global_step": 186055, "epoch": 1107} {"train_loss": -11.620696067810059, "global_step": 186056, "epoch": 1107} {"train_loss": -11.525065422058105, "global_step": 186057, "epoch": 1107} {"train_loss": -11.508737564086914, "global_step": 186058, "epoch": 1107} {"train_loss": -11.54061508178711, "global_step": 186059, "epoch": 1107} {"train_loss": -11.483121871948242, "global_step": 186060, "epoch": 1107} {"train_loss": -11.556741714477539, "global_step": 186061, "epoch": 1107} {"train_loss": -11.772165298461914, "global_step": 186062, "epoch": 1107} {"train_loss": -11.294866561889648, "global_step": 186063, "epoch": 1107} {"train_loss": -11.53314208984375, "global_step": 186064, "epoch": 1107} {"train_loss": -11.238385200500488, "global_step": 186065, "epoch": 1107} {"train_loss": -11.390571594238281, "global_step": 186066, "epoch": 1107} {"train_loss": -11.239712715148926, "global_step": 186067, "epoch": 1107} {"train_loss": -11.170316696166992, "global_step": 186068, "epoch": 1107} {"train_loss": -9.273134231567383, "global_step": 186069, "epoch": 1107} {"train_loss": -11.503009796142578, "global_step": 186070, "epoch": 1107} {"train_loss": -10.807861328125, "global_step": 186071, "epoch": 1107} {"train_loss": -11.264558792114258, "global_step": 186072, "epoch": 1107} {"train_loss": -11.203216552734375, "global_step": 186073, "epoch": 1107} {"train_loss": -11.594560623168945, "global_step": 186074, "epoch": 1107} {"train_loss": -10.883315086364746, "global_step": 186075, "epoch": 1107} {"train_loss": -11.208213806152344, "global_step": 186076, "epoch": 1107} {"train_loss": -10.593584060668945, "global_step": 186077, "epoch": 1107} {"train_loss": -10.98109245300293, "global_step": 186078, "epoch": 1107} {"train_loss": -11.033190727233887, "global_step": 186079, "epoch": 1107} {"train_loss": -11.307233810424805, "global_step": 186080, "epoch": 1107} {"train_loss": -10.787069320678711, "global_step": 186081, "epoch": 1107} {"train_loss": -10.908748626708984, "global_step": 186082, "epoch": 1107} {"train_loss": -10.501336097717285, "global_step": 186083, "epoch": 1107} {"train_loss": -11.28283405303955, "global_step": 186084, "epoch": 1107} {"train_loss": -11.56753158569336, "global_step": 186085, "epoch": 1107} {"train_loss": -11.2725830078125, "global_step": 186086, "epoch": 1107} {"train_loss": -11.182878494262695, "global_step": 186087, "epoch": 1107} {"train_loss": -11.197786331176758, "global_step": 186088, "epoch": 1107} {"train_loss": -11.138984680175781, "global_step": 186089, "epoch": 1107} {"train_loss": -11.27375602722168, "global_step": 186090, "epoch": 1107} {"train_loss": -11.355413436889648, "global_step": 186091, "epoch": 1107} {"train_loss": -11.23989200592041, "global_step": 186092, "epoch": 1107} {"train_loss": -11.103630065917969, "global_step": 186093, "epoch": 1107} {"train_loss": -11.310491561889648, "global_step": 186094, "epoch": 1107} {"train_loss": -11.142294883728027, "global_step": 186095, "epoch": 1107} {"train_loss": -11.199888229370117, "global_step": 186096, "epoch": 1107} {"train_loss": -11.013952255249023, "global_step": 186097, "epoch": 1107} {"train_loss": -11.035460472106934, "global_step": 186098, "epoch": 1107} {"train_loss": -11.28040885925293, "global_step": 186099, "epoch": 1107} {"train_loss": -10.851496696472168, "global_step": 186100, "epoch": 1107} {"train_loss": -11.080821990966797, "global_step": 186101, "epoch": 1107} {"train_loss": -11.124415397644043, "global_step": 186102, "epoch": 1107} {"train_loss": -10.734905242919922, "global_step": 186103, "epoch": 1107} {"train_loss": -11.177855491638184, "global_step": 186104, "epoch": 1107} {"train_loss": -10.609762191772461, "global_step": 186105, "epoch": 1107} {"train_loss": -10.979589462280273, "global_step": 186106, "epoch": 1107} {"train_loss": -11.0908203125, "global_step": 186107, "epoch": 1107} {"train_loss": -11.037904739379883, "global_step": 186108, "epoch": 1107} {"train_loss": -11.534370422363281, "global_step": 186109, "epoch": 1107} {"train_loss": -10.879374504089355, "global_step": 186110, "epoch": 1107} {"train_loss": -11.247828483581543, "global_step": 186111, "epoch": 1107} {"train_loss": -11.21337890625, "global_step": 186112, "epoch": 1107} {"train_loss": -11.243728637695312, "global_step": 186113, "epoch": 1107} {"train_loss": -11.504959106445312, "global_step": 186114, "epoch": 1107} {"train_loss": -11.204111099243164, "global_step": 186115, "epoch": 1107} {"train_loss": -11.349771499633789, "global_step": 186116, "epoch": 1107} {"train_loss": -10.958961486816406, "global_step": 186117, "epoch": 1107} {"train_loss": -11.247156143188477, "global_step": 186118, "epoch": 1107} {"train_loss": -11.06474494934082, "global_step": 186119, "epoch": 1107} {"train_loss": -11.321239471435547, "global_step": 186120, "epoch": 1107} {"train_loss": -11.330605506896973, "global_step": 186121, "epoch": 1107} {"train_loss": -11.004948616027832, "global_step": 186122, "epoch": 1107} {"train_loss": -11.22360610961914, "global_step": 186123, "epoch": 1107} {"train_loss": -11.09670639038086, "global_step": 186124, "epoch": 1107} {"train_loss": -11.12874698638916, "global_step": 186125, "epoch": 1107} {"train_loss": -11.254634857177734, "global_step": 186126, "epoch": 1107} {"train_loss": -11.042943000793457, "global_step": 186127, "epoch": 1107} {"train_loss": -11.310647010803223, "global_step": 186128, "epoch": 1107} {"train_loss": -10.690496444702148, "global_step": 186129, "epoch": 1107} {"train_loss": -10.14983081817627, "global_step": 186130, "epoch": 1107} {"train_loss": -11.239590644836426, "global_step": 186131, "epoch": 1107} {"train_loss": -10.829635620117188, "global_step": 186132, "epoch": 1107} {"train_loss": -10.778241157531738, "global_step": 186133, "epoch": 1107} {"train_loss": -11.102256774902344, "global_step": 186134, "epoch": 1107} {"train_loss": -10.847939491271973, "global_step": 186135, "epoch": 1107} {"train_loss": -10.710800170898438, "global_step": 186136, "epoch": 1107} {"train_loss": -10.914581298828125, "global_step": 186137, "epoch": 1107} {"train_loss": -10.229717254638672, "global_step": 186138, "epoch": 1107} {"train_loss": -11.09634017944336, "global_step": 186139, "epoch": 1107} {"train_loss": -11.032089233398438, "global_step": 186140, "epoch": 1107} {"train_loss": -11.052392959594727, "global_step": 186141, "epoch": 1107} {"train_loss": -10.81940746307373, "global_step": 186142, "epoch": 1107} {"train_loss": -11.094049896512713, "global_step": 186143, "epoch": 1107, "val_loss": 245169.21875} {"train_loss": -11.242112159729004, "global_step": 186144, "epoch": 1108} {"train_loss": -10.807659149169922, "global_step": 186145, "epoch": 1108} {"train_loss": -10.986797332763672, "global_step": 186146, "epoch": 1108} {"train_loss": -10.785652160644531, "global_step": 186147, "epoch": 1108} {"train_loss": -11.074378967285156, "global_step": 186148, "epoch": 1108} {"train_loss": -10.61805534362793, "global_step": 186149, "epoch": 1108} {"train_loss": -10.92264175415039, "global_step": 186150, "epoch": 1108} {"train_loss": -10.873031616210938, "global_step": 186151, "epoch": 1108} {"train_loss": -10.83576488494873, "global_step": 186152, "epoch": 1108} {"train_loss": -11.094104766845703, "global_step": 186153, "epoch": 1108} {"train_loss": -10.977383613586426, "global_step": 186154, "epoch": 1108} {"train_loss": -10.966521263122559, "global_step": 186155, "epoch": 1108} {"train_loss": -10.473869323730469, "global_step": 186156, "epoch": 1108} {"train_loss": -11.101387023925781, "global_step": 186157, "epoch": 1108} {"train_loss": -10.530834197998047, "global_step": 186158, "epoch": 1108} {"train_loss": -10.36059856414795, "global_step": 186159, "epoch": 1108} {"train_loss": -10.80330753326416, "global_step": 186160, "epoch": 1108} {"train_loss": -10.14117431640625, "global_step": 186161, "epoch": 1108} {"train_loss": -10.415047645568848, "global_step": 186162, "epoch": 1108} {"train_loss": -10.749052047729492, "global_step": 186163, "epoch": 1108} {"train_loss": -10.430276870727539, "global_step": 186164, "epoch": 1108} {"train_loss": -11.020120620727539, "global_step": 186165, "epoch": 1108} {"train_loss": -10.572509765625, "global_step": 186166, "epoch": 1108} {"train_loss": -11.150833129882812, "global_step": 186167, "epoch": 1108} {"train_loss": -10.705940246582031, "global_step": 186168, "epoch": 1108} {"train_loss": -11.029377937316895, "global_step": 186169, "epoch": 1108} {"train_loss": -10.650177001953125, "global_step": 186170, "epoch": 1108} {"train_loss": -11.215356826782227, "global_step": 186171, "epoch": 1108} {"train_loss": -10.831988334655762, "global_step": 186172, "epoch": 1108} {"train_loss": -10.531951904296875, "global_step": 186173, "epoch": 1108} {"train_loss": -11.262090682983398, "global_step": 186174, "epoch": 1108} {"train_loss": -10.635488510131836, "global_step": 186175, "epoch": 1108} {"train_loss": -11.15244197845459, "global_step": 186176, "epoch": 1108} {"train_loss": -10.772781372070312, "global_step": 186177, "epoch": 1108} {"train_loss": -10.882890701293945, "global_step": 186178, "epoch": 1108} {"train_loss": -10.851890563964844, "global_step": 186179, "epoch": 1108} {"train_loss": -11.123861312866211, "global_step": 186180, "epoch": 1108} {"train_loss": -10.817970275878906, "global_step": 186181, "epoch": 1108} {"train_loss": -11.001834869384766, "global_step": 186182, "epoch": 1108} {"train_loss": -10.808995246887207, "global_step": 186183, "epoch": 1108} {"train_loss": -11.148446083068848, "global_step": 186184, "epoch": 1108} {"train_loss": -11.194076538085938, "global_step": 186185, "epoch": 1108} {"train_loss": -11.062911033630371, "global_step": 186186, "epoch": 1108} {"train_loss": -11.120227813720703, "global_step": 186187, "epoch": 1108} {"train_loss": -11.289644241333008, "global_step": 186188, "epoch": 1108} {"train_loss": -11.255035400390625, "global_step": 186189, "epoch": 1108} {"train_loss": -11.012561798095703, "global_step": 186190, "epoch": 1108} {"train_loss": -11.049556732177734, "global_step": 186191, "epoch": 1108} {"train_loss": -11.096315383911133, "global_step": 186192, "epoch": 1108} {"train_loss": -11.036779403686523, "global_step": 186193, "epoch": 1108} {"train_loss": -10.688807487487793, "global_step": 186194, "epoch": 1108} {"train_loss": -11.187382698059082, "global_step": 186195, "epoch": 1108} {"train_loss": -10.879523277282715, "global_step": 186196, "epoch": 1108} {"train_loss": -11.021322250366211, "global_step": 186197, "epoch": 1108} {"train_loss": -11.211626052856445, "global_step": 186198, "epoch": 1108} {"train_loss": -10.669755935668945, "global_step": 186199, "epoch": 1108} {"train_loss": -11.180768966674805, "global_step": 186200, "epoch": 1108} {"train_loss": -11.208230972290039, "global_step": 186201, "epoch": 1108} {"train_loss": -11.068887710571289, "global_step": 186202, "epoch": 1108} {"train_loss": -11.205286026000977, "global_step": 186203, "epoch": 1108} {"train_loss": -11.10746955871582, "global_step": 186204, "epoch": 1108} {"train_loss": -11.269913673400879, "global_step": 186205, "epoch": 1108} {"train_loss": -11.271129608154297, "global_step": 186206, "epoch": 1108} {"train_loss": -11.077035903930664, "global_step": 186207, "epoch": 1108} {"train_loss": -11.383718490600586, "global_step": 186208, "epoch": 1108} {"train_loss": -11.039804458618164, "global_step": 186209, "epoch": 1108} {"train_loss": -11.317646980285645, "global_step": 186210, "epoch": 1108} {"train_loss": -11.40114974975586, "global_step": 186211, "epoch": 1108} {"train_loss": -11.186580657958984, "global_step": 186212, "epoch": 1108} {"train_loss": -11.496074676513672, "global_step": 186213, "epoch": 1108} {"train_loss": -11.280350685119629, "global_step": 186214, "epoch": 1108} {"train_loss": -11.186201095581055, "global_step": 186215, "epoch": 1108} {"train_loss": -11.17442512512207, "global_step": 186216, "epoch": 1108} {"train_loss": -11.627208709716797, "global_step": 186217, "epoch": 1108} {"train_loss": -11.212562561035156, "global_step": 186218, "epoch": 1108} {"train_loss": -11.51430892944336, "global_step": 186219, "epoch": 1108} {"train_loss": -11.386907577514648, "global_step": 186220, "epoch": 1108} {"train_loss": -11.368517875671387, "global_step": 186221, "epoch": 1108} {"train_loss": -11.468810081481934, "global_step": 186222, "epoch": 1108} {"train_loss": -11.479706764221191, "global_step": 186223, "epoch": 1108} {"train_loss": -11.623213768005371, "global_step": 186224, "epoch": 1108} {"train_loss": -11.276644706726074, "global_step": 186225, "epoch": 1108} {"train_loss": -11.465957641601562, "global_step": 186226, "epoch": 1108} {"train_loss": -11.354278564453125, "global_step": 186227, "epoch": 1108} {"train_loss": -11.595316886901855, "global_step": 186228, "epoch": 1108} {"train_loss": -11.177453994750977, "global_step": 186229, "epoch": 1108} {"train_loss": -11.320180892944336, "global_step": 186230, "epoch": 1108} {"train_loss": -11.494829177856445, "global_step": 186231, "epoch": 1108} {"train_loss": -11.416285514831543, "global_step": 186232, "epoch": 1108} {"train_loss": -11.39955997467041, "global_step": 186233, "epoch": 1108} {"train_loss": -11.452787399291992, "global_step": 186234, "epoch": 1108} {"train_loss": -11.30789566040039, "global_step": 186235, "epoch": 1108} {"train_loss": -11.576168060302734, "global_step": 186236, "epoch": 1108} {"train_loss": -11.520784378051758, "global_step": 186237, "epoch": 1108} {"train_loss": -11.491403579711914, "global_step": 186238, "epoch": 1108} {"train_loss": -11.599264144897461, "global_step": 186239, "epoch": 1108} {"train_loss": -11.44460678100586, "global_step": 186240, "epoch": 1108} {"train_loss": -11.584254264831543, "global_step": 186241, "epoch": 1108} {"train_loss": -11.575057029724121, "global_step": 186242, "epoch": 1108} {"train_loss": -11.227291107177734, "global_step": 186243, "epoch": 1108} {"train_loss": -11.655749320983887, "global_step": 186244, "epoch": 1108} {"train_loss": -11.280108451843262, "global_step": 186245, "epoch": 1108} {"train_loss": -11.479265213012695, "global_step": 186246, "epoch": 1108} {"train_loss": -11.353780746459961, "global_step": 186247, "epoch": 1108} {"train_loss": -11.382143020629883, "global_step": 186248, "epoch": 1108} {"train_loss": -11.28648567199707, "global_step": 186249, "epoch": 1108} {"train_loss": -11.201227188110352, "global_step": 186250, "epoch": 1108} {"train_loss": -10.852405548095703, "global_step": 186251, "epoch": 1108} {"train_loss": -10.914548873901367, "global_step": 186252, "epoch": 1108} {"train_loss": -10.290131568908691, "global_step": 186253, "epoch": 1108} {"train_loss": -11.392097473144531, "global_step": 186254, "epoch": 1108} {"train_loss": -10.517353057861328, "global_step": 186255, "epoch": 1108} {"train_loss": -10.125473022460938, "global_step": 186256, "epoch": 1108} {"train_loss": -10.176249504089355, "global_step": 186257, "epoch": 1108} {"train_loss": -10.128026008605957, "global_step": 186258, "epoch": 1108} {"train_loss": -9.823881149291992, "global_step": 186259, "epoch": 1108} {"train_loss": -9.66403579711914, "global_step": 186260, "epoch": 1108} {"train_loss": -10.01608657836914, "global_step": 186261, "epoch": 1108} {"train_loss": -10.814107894897461, "global_step": 186262, "epoch": 1108} {"train_loss": -10.41264533996582, "global_step": 186263, "epoch": 1108} {"train_loss": -10.410538673400879, "global_step": 186264, "epoch": 1108} {"train_loss": -11.138517379760742, "global_step": 186265, "epoch": 1108} {"train_loss": -11.095708847045898, "global_step": 186266, "epoch": 1108} {"train_loss": -11.084216117858887, "global_step": 186267, "epoch": 1108} {"train_loss": -11.085044860839844, "global_step": 186268, "epoch": 1108} {"train_loss": -11.085192680358887, "global_step": 186269, "epoch": 1108} {"train_loss": -10.738737106323242, "global_step": 186270, "epoch": 1108} {"train_loss": -10.96910285949707, "global_step": 186271, "epoch": 1108} {"train_loss": -10.826837539672852, "global_step": 186272, "epoch": 1108} {"train_loss": -11.311798095703125, "global_step": 186273, "epoch": 1108} {"train_loss": -11.041543960571289, "global_step": 186274, "epoch": 1108} {"train_loss": -11.345406532287598, "global_step": 186275, "epoch": 1108} {"train_loss": -11.15682601928711, "global_step": 186276, "epoch": 1108} {"train_loss": -11.363914489746094, "global_step": 186277, "epoch": 1108} {"train_loss": -11.349207878112793, "global_step": 186278, "epoch": 1108} {"train_loss": -11.332015037536621, "global_step": 186279, "epoch": 1108} {"train_loss": -11.324392318725586, "global_step": 186280, "epoch": 1108} {"train_loss": -11.084369659423828, "global_step": 186281, "epoch": 1108} {"train_loss": -11.318901062011719, "global_step": 186282, "epoch": 1108} {"train_loss": -11.152600288391113, "global_step": 186283, "epoch": 1108} {"train_loss": -11.112846374511719, "global_step": 186284, "epoch": 1108} {"train_loss": -11.11959457397461, "global_step": 186285, "epoch": 1108} {"train_loss": -11.26153564453125, "global_step": 186286, "epoch": 1108} {"train_loss": -11.28689193725586, "global_step": 186287, "epoch": 1108} {"train_loss": -11.389976501464844, "global_step": 186288, "epoch": 1108} {"train_loss": -11.328433990478516, "global_step": 186289, "epoch": 1108} {"train_loss": -11.41219711303711, "global_step": 186290, "epoch": 1108} {"train_loss": -11.424019813537598, "global_step": 186291, "epoch": 1108} {"train_loss": -11.279908180236816, "global_step": 186292, "epoch": 1108} {"train_loss": -11.535100936889648, "global_step": 186293, "epoch": 1108} {"train_loss": -11.275535583496094, "global_step": 186294, "epoch": 1108} {"train_loss": -11.348265647888184, "global_step": 186295, "epoch": 1108} {"train_loss": -11.353055953979492, "global_step": 186296, "epoch": 1108} {"train_loss": -11.410639762878418, "global_step": 186297, "epoch": 1108} {"train_loss": -11.543761253356934, "global_step": 186298, "epoch": 1108} {"train_loss": -11.212469100952148, "global_step": 186299, "epoch": 1108} {"train_loss": -11.411497116088867, "global_step": 186300, "epoch": 1108} {"train_loss": -11.232608795166016, "global_step": 186301, "epoch": 1108} {"train_loss": -10.88796615600586, "global_step": 186302, "epoch": 1108} {"train_loss": -11.568317413330078, "global_step": 186303, "epoch": 1108} {"train_loss": -10.703250885009766, "global_step": 186304, "epoch": 1108} {"train_loss": -11.201868057250977, "global_step": 186305, "epoch": 1108} {"train_loss": -10.820245742797852, "global_step": 186306, "epoch": 1108} {"train_loss": -10.549528121948242, "global_step": 186307, "epoch": 1108} {"train_loss": -10.456829071044922, "global_step": 186308, "epoch": 1108} {"train_loss": -10.513697624206543, "global_step": 186309, "epoch": 1108} {"train_loss": -10.45024299621582, "global_step": 186310, "epoch": 1108} {"train_loss": -11.061890244483948, "global_step": 186311, "epoch": 1108, "val_loss": 247524.6875} {"train_loss": -10.901728630065918, "global_step": 186312, "epoch": 1109} {"train_loss": -10.911685943603516, "global_step": 186313, "epoch": 1109} {"train_loss": -10.71440315246582, "global_step": 186314, "epoch": 1109} {"train_loss": -10.818233489990234, "global_step": 186315, "epoch": 1109} {"train_loss": -10.4678955078125, "global_step": 186316, "epoch": 1109} {"train_loss": -11.281030654907227, "global_step": 186317, "epoch": 1109} {"train_loss": -10.712974548339844, "global_step": 186318, "epoch": 1109} {"train_loss": -10.467857360839844, "global_step": 186319, "epoch": 1109} {"train_loss": -10.640524864196777, "global_step": 186320, "epoch": 1109} {"train_loss": -9.307306289672852, "global_step": 186321, "epoch": 1109} {"train_loss": -9.492177963256836, "global_step": 186322, "epoch": 1109} {"train_loss": -10.597000122070312, "global_step": 186323, "epoch": 1109} {"train_loss": -9.52124309539795, "global_step": 186324, "epoch": 1109} {"train_loss": -11.007780075073242, "global_step": 186325, "epoch": 1109} {"train_loss": -10.358516693115234, "global_step": 186326, "epoch": 1109} {"train_loss": -10.605939865112305, "global_step": 186327, "epoch": 1109} {"train_loss": -10.48369312286377, "global_step": 186328, "epoch": 1109} {"train_loss": -9.680566787719727, "global_step": 186329, "epoch": 1109} {"train_loss": -10.800551414489746, "global_step": 186330, "epoch": 1109} {"train_loss": -10.368133544921875, "global_step": 186331, "epoch": 1109} {"train_loss": -10.270750045776367, "global_step": 186332, "epoch": 1109} {"train_loss": -10.608707427978516, "global_step": 186333, "epoch": 1109} {"train_loss": -10.531147003173828, "global_step": 186334, "epoch": 1109} {"train_loss": -10.745542526245117, "global_step": 186335, "epoch": 1109} {"train_loss": -10.381505966186523, "global_step": 186336, "epoch": 1109} {"train_loss": -10.391029357910156, "global_step": 186337, "epoch": 1109} {"train_loss": -10.77027416229248, "global_step": 186338, "epoch": 1109} {"train_loss": -10.544389724731445, "global_step": 186339, "epoch": 1109} {"train_loss": -10.511871337890625, "global_step": 186340, "epoch": 1109} {"train_loss": -11.068334579467773, "global_step": 186341, "epoch": 1109} {"train_loss": -10.428839683532715, "global_step": 186342, "epoch": 1109} {"train_loss": -10.507303237915039, "global_step": 186343, "epoch": 1109} {"train_loss": -10.87573528289795, "global_step": 186344, "epoch": 1109} {"train_loss": -10.626626014709473, "global_step": 186345, "epoch": 1109} {"train_loss": -10.121435165405273, "global_step": 186346, "epoch": 1109} {"train_loss": -11.099518775939941, "global_step": 186347, "epoch": 1109} {"train_loss": -10.510249137878418, "global_step": 186348, "epoch": 1109} {"train_loss": -10.568166732788086, "global_step": 186349, "epoch": 1109} {"train_loss": -10.879952430725098, "global_step": 186350, "epoch": 1109} {"train_loss": -10.857550621032715, "global_step": 186351, "epoch": 1109} {"train_loss": -10.832086563110352, "global_step": 186352, "epoch": 1109} {"train_loss": -10.745038986206055, "global_step": 186353, "epoch": 1109} {"train_loss": -11.059195518493652, "global_step": 186354, "epoch": 1109} {"train_loss": -10.693365097045898, "global_step": 186355, "epoch": 1109} {"train_loss": -10.703410148620605, "global_step": 186356, "epoch": 1109} {"train_loss": -11.163554191589355, "global_step": 186357, "epoch": 1109} {"train_loss": -10.491382598876953, "global_step": 186358, "epoch": 1109} {"train_loss": -10.92875862121582, "global_step": 186359, "epoch": 1109} {"train_loss": -10.973601341247559, "global_step": 186360, "epoch": 1109} {"train_loss": -11.027007102966309, "global_step": 186361, "epoch": 1109} {"train_loss": -11.221220016479492, "global_step": 186362, "epoch": 1109} {"train_loss": -11.048312187194824, "global_step": 186363, "epoch": 1109} {"train_loss": -11.081274032592773, "global_step": 186364, "epoch": 1109} {"train_loss": -10.723884582519531, "global_step": 186365, "epoch": 1109} {"train_loss": -11.170259475708008, "global_step": 186366, "epoch": 1109} {"train_loss": -11.241045951843262, "global_step": 186367, "epoch": 1109} {"train_loss": -11.100430488586426, "global_step": 186368, "epoch": 1109} {"train_loss": -11.477794647216797, "global_step": 186369, "epoch": 1109} {"train_loss": -11.220491409301758, "global_step": 186370, "epoch": 1109} {"train_loss": -11.352029800415039, "global_step": 186371, "epoch": 1109} {"train_loss": -11.286417007446289, "global_step": 186372, "epoch": 1109} {"train_loss": -11.382272720336914, "global_step": 186373, "epoch": 1109} {"train_loss": -11.09207534790039, "global_step": 186374, "epoch": 1109} {"train_loss": -11.219413757324219, "global_step": 186375, "epoch": 1109} {"train_loss": -11.421405792236328, "global_step": 186376, "epoch": 1109} {"train_loss": -11.308168411254883, "global_step": 186377, "epoch": 1109} {"train_loss": -11.271339416503906, "global_step": 186378, "epoch": 1109} {"train_loss": -11.368200302124023, "global_step": 186379, "epoch": 1109} {"train_loss": -11.39794921875, "global_step": 186380, "epoch": 1109} {"train_loss": -11.139835357666016, "global_step": 186381, "epoch": 1109} {"train_loss": -11.354747772216797, "global_step": 186382, "epoch": 1109} {"train_loss": -11.500040054321289, "global_step": 186383, "epoch": 1109} {"train_loss": -11.256811141967773, "global_step": 186384, "epoch": 1109} {"train_loss": -11.424455642700195, "global_step": 186385, "epoch": 1109} {"train_loss": -11.301050186157227, "global_step": 186386, "epoch": 1109} {"train_loss": -11.166401863098145, "global_step": 186387, "epoch": 1109} {"train_loss": -11.450410842895508, "global_step": 186388, "epoch": 1109} {"train_loss": -11.312274932861328, "global_step": 186389, "epoch": 1109} {"train_loss": -11.050265312194824, "global_step": 186390, "epoch": 1109} {"train_loss": -11.51058578491211, "global_step": 186391, "epoch": 1109} {"train_loss": -11.39586067199707, "global_step": 186392, "epoch": 1109} {"train_loss": -11.566308975219727, "global_step": 186393, "epoch": 1109} {"train_loss": -11.502399444580078, "global_step": 186394, "epoch": 1109} {"train_loss": -11.424545288085938, "global_step": 186395, "epoch": 1109} {"train_loss": -11.447187423706055, "global_step": 186396, "epoch": 1109} {"train_loss": -11.46323299407959, "global_step": 186397, "epoch": 1109} {"train_loss": -11.45516586303711, "global_step": 186398, "epoch": 1109} {"train_loss": -11.514975547790527, "global_step": 186399, "epoch": 1109} {"train_loss": -11.01781177520752, "global_step": 186400, "epoch": 1109} {"train_loss": -11.256351470947266, "global_step": 186401, "epoch": 1109} {"train_loss": -11.358343124389648, "global_step": 186402, "epoch": 1109} {"train_loss": -11.476414680480957, "global_step": 186403, "epoch": 1109} {"train_loss": -11.358132362365723, "global_step": 186404, "epoch": 1109} {"train_loss": -11.374261856079102, "global_step": 186405, "epoch": 1109} {"train_loss": -11.139288902282715, "global_step": 186406, "epoch": 1109} {"train_loss": -9.876453399658203, "global_step": 186407, "epoch": 1109} {"train_loss": -11.15005111694336, "global_step": 186408, "epoch": 1109} {"train_loss": -11.117465019226074, "global_step": 186409, "epoch": 1109} {"train_loss": -11.25879192352295, "global_step": 186410, "epoch": 1109} {"train_loss": -11.165245056152344, "global_step": 186411, "epoch": 1109} {"train_loss": -11.363052368164062, "global_step": 186412, "epoch": 1109} {"train_loss": -10.583267211914062, "global_step": 186413, "epoch": 1109} {"train_loss": -9.015920639038086, "global_step": 186414, "epoch": 1109} {"train_loss": -10.804266929626465, "global_step": 186415, "epoch": 1109} {"train_loss": -10.018745422363281, "global_step": 186416, "epoch": 1109} {"train_loss": -9.570547103881836, "global_step": 186417, "epoch": 1109} {"train_loss": -9.942522048950195, "global_step": 186418, "epoch": 1109} {"train_loss": -10.395397186279297, "global_step": 186419, "epoch": 1109} {"train_loss": -7.969424724578857, "global_step": 186420, "epoch": 1109} {"train_loss": -8.457322120666504, "global_step": 186421, "epoch": 1109} {"train_loss": -10.384096145629883, "global_step": 186422, "epoch": 1109} {"train_loss": -8.698994636535645, "global_step": 186423, "epoch": 1109} {"train_loss": -9.297237396240234, "global_step": 186424, "epoch": 1109} {"train_loss": -8.948463439941406, "global_step": 186425, "epoch": 1109} {"train_loss": -10.348475456237793, "global_step": 186426, "epoch": 1109} {"train_loss": -8.697792053222656, "global_step": 186427, "epoch": 1109} {"train_loss": -10.36507797241211, "global_step": 186428, "epoch": 1109} {"train_loss": -9.537015914916992, "global_step": 186429, "epoch": 1109} {"train_loss": -9.680404663085938, "global_step": 186430, "epoch": 1109} {"train_loss": -9.645210266113281, "global_step": 186431, "epoch": 1109} {"train_loss": -10.046879768371582, "global_step": 186432, "epoch": 1109} {"train_loss": -10.223880767822266, "global_step": 186433, "epoch": 1109} {"train_loss": -9.824323654174805, "global_step": 186434, "epoch": 1109} {"train_loss": -10.879791259765625, "global_step": 186435, "epoch": 1109} {"train_loss": -10.117681503295898, "global_step": 186436, "epoch": 1109} {"train_loss": -10.170324325561523, "global_step": 186437, "epoch": 1109} {"train_loss": -9.891836166381836, "global_step": 186438, "epoch": 1109} {"train_loss": -10.737438201904297, "global_step": 186439, "epoch": 1109} {"train_loss": -10.30274486541748, "global_step": 186440, "epoch": 1109} {"train_loss": -10.290599822998047, "global_step": 186441, "epoch": 1109} {"train_loss": -10.766753196716309, "global_step": 186442, "epoch": 1109} {"train_loss": -10.452796936035156, "global_step": 186443, "epoch": 1109} {"train_loss": -10.166366577148438, "global_step": 186444, "epoch": 1109} {"train_loss": -10.665013313293457, "global_step": 186445, "epoch": 1109} {"train_loss": -10.772653579711914, "global_step": 186446, "epoch": 1109} {"train_loss": -10.853780746459961, "global_step": 186447, "epoch": 1109} {"train_loss": -10.755202293395996, "global_step": 186448, "epoch": 1109} {"train_loss": -10.751136779785156, "global_step": 186449, "epoch": 1109} {"train_loss": -11.018208503723145, "global_step": 186450, "epoch": 1109} {"train_loss": -10.873689651489258, "global_step": 186451, "epoch": 1109} {"train_loss": -10.89907455444336, "global_step": 186452, "epoch": 1109} {"train_loss": -10.833730697631836, "global_step": 186453, "epoch": 1109} {"train_loss": -10.874773025512695, "global_step": 186454, "epoch": 1109} {"train_loss": -10.974457740783691, "global_step": 186455, "epoch": 1109} {"train_loss": -10.775547981262207, "global_step": 186456, "epoch": 1109} {"train_loss": -10.891687393188477, "global_step": 186457, "epoch": 1109} {"train_loss": -10.631484985351562, "global_step": 186458, "epoch": 1109} {"train_loss": -10.879154205322266, "global_step": 186459, "epoch": 1109} {"train_loss": -11.155014991760254, "global_step": 186460, "epoch": 1109} {"train_loss": -10.907880783081055, "global_step": 186461, "epoch": 1109} {"train_loss": -11.268803596496582, "global_step": 186462, "epoch": 1109} {"train_loss": -10.962507247924805, "global_step": 186463, "epoch": 1109} {"train_loss": -11.013500213623047, "global_step": 186464, "epoch": 1109} {"train_loss": -11.090595245361328, "global_step": 186465, "epoch": 1109} {"train_loss": -11.273763656616211, "global_step": 186466, "epoch": 1109} {"train_loss": -10.999390602111816, "global_step": 186467, "epoch": 1109} {"train_loss": -10.985946655273438, "global_step": 186468, "epoch": 1109} {"train_loss": -11.081315994262695, "global_step": 186469, "epoch": 1109} {"train_loss": -11.215845108032227, "global_step": 186470, "epoch": 1109} {"train_loss": -11.16738510131836, "global_step": 186471, "epoch": 1109} {"train_loss": -10.936591148376465, "global_step": 186472, "epoch": 1109} {"train_loss": -11.077078819274902, "global_step": 186473, "epoch": 1109} {"train_loss": -10.895593643188477, "global_step": 186474, "epoch": 1109} {"train_loss": -11.256341934204102, "global_step": 186475, "epoch": 1109} {"train_loss": -11.007922172546387, "global_step": 186476, "epoch": 1109} {"train_loss": -11.040491104125977, "global_step": 186477, "epoch": 1109} {"train_loss": -11.00656509399414, "global_step": 186478, "epoch": 1109} {"train_loss": -10.742066045602163, "global_step": 186479, "epoch": 1109, "val_loss": 244536.6875} {"train_loss": -11.155080795288086, "global_step": 186480, "epoch": 1110} {"train_loss": -11.097017288208008, "global_step": 186481, "epoch": 1110} {"train_loss": -11.214611053466797, "global_step": 186482, "epoch": 1110} {"train_loss": -11.304788589477539, "global_step": 186483, "epoch": 1110} {"train_loss": -11.062450408935547, "global_step": 186484, "epoch": 1110} {"train_loss": -11.351954460144043, "global_step": 186485, "epoch": 1110} {"train_loss": -11.201648712158203, "global_step": 186486, "epoch": 1110} {"train_loss": -11.227922439575195, "global_step": 186487, "epoch": 1110} {"train_loss": -11.16402816772461, "global_step": 186488, "epoch": 1110} {"train_loss": -11.244888305664062, "global_step": 186489, "epoch": 1110} {"train_loss": -11.403284072875977, "global_step": 186490, "epoch": 1110} {"train_loss": -11.513808250427246, "global_step": 186491, "epoch": 1110} {"train_loss": -11.458795547485352, "global_step": 186492, "epoch": 1110} {"train_loss": -11.263525009155273, "global_step": 186493, "epoch": 1110} {"train_loss": -11.424212455749512, "global_step": 186494, "epoch": 1110} {"train_loss": -11.634794235229492, "global_step": 186495, "epoch": 1110} {"train_loss": -11.369256019592285, "global_step": 186496, "epoch": 1110} {"train_loss": -11.49962043762207, "global_step": 186497, "epoch": 1110} {"train_loss": -11.405149459838867, "global_step": 186498, "epoch": 1110} {"train_loss": -11.254182815551758, "global_step": 186499, "epoch": 1110} {"train_loss": -11.43414306640625, "global_step": 186500, "epoch": 1110} {"train_loss": -11.109590530395508, "global_step": 186501, "epoch": 1110} {"train_loss": -11.23902416229248, "global_step": 186502, "epoch": 1110} {"train_loss": -11.301370620727539, "global_step": 186503, "epoch": 1110} {"train_loss": -11.305675506591797, "global_step": 186504, "epoch": 1110} {"train_loss": -11.230685234069824, "global_step": 186505, "epoch": 1110} {"train_loss": -11.406974792480469, "global_step": 186506, "epoch": 1110} {"train_loss": -10.994236946105957, "global_step": 186507, "epoch": 1110} {"train_loss": -11.357185363769531, "global_step": 186508, "epoch": 1110} {"train_loss": -11.516242027282715, "global_step": 186509, "epoch": 1110} {"train_loss": -11.570257186889648, "global_step": 186510, "epoch": 1110} {"train_loss": -11.403460502624512, "global_step": 186511, "epoch": 1110} {"train_loss": -11.217588424682617, "global_step": 186512, "epoch": 1110} {"train_loss": -11.607603073120117, "global_step": 186513, "epoch": 1110} {"train_loss": -10.947881698608398, "global_step": 186514, "epoch": 1110} {"train_loss": -11.382132530212402, "global_step": 186515, "epoch": 1110} {"train_loss": -11.127528190612793, "global_step": 186516, "epoch": 1110} {"train_loss": -11.127708435058594, "global_step": 186517, "epoch": 1110} {"train_loss": -11.30879020690918, "global_step": 186518, "epoch": 1110} {"train_loss": -11.32929801940918, "global_step": 186519, "epoch": 1110} {"train_loss": -11.51837158203125, "global_step": 186520, "epoch": 1110} {"train_loss": -10.86916446685791, "global_step": 186521, "epoch": 1110} {"train_loss": -11.438594818115234, "global_step": 186522, "epoch": 1110} {"train_loss": -11.230937004089355, "global_step": 186523, "epoch": 1110} {"train_loss": -11.22844123840332, "global_step": 186524, "epoch": 1110} {"train_loss": -11.101255416870117, "global_step": 186525, "epoch": 1110} {"train_loss": -11.72311019897461, "global_step": 186526, "epoch": 1110} {"train_loss": -11.045324325561523, "global_step": 186527, "epoch": 1110} {"train_loss": -11.310535430908203, "global_step": 186528, "epoch": 1110} {"train_loss": -11.570966720581055, "global_step": 186529, "epoch": 1110} {"train_loss": -11.292726516723633, "global_step": 186530, "epoch": 1110} {"train_loss": -11.369073867797852, "global_step": 186531, "epoch": 1110} {"train_loss": -11.175472259521484, "global_step": 186532, "epoch": 1110} {"train_loss": -11.53594970703125, "global_step": 186533, "epoch": 1110} {"train_loss": -11.16961669921875, "global_step": 186534, "epoch": 1110} {"train_loss": -11.244647979736328, "global_step": 186535, "epoch": 1110} {"train_loss": -11.328510284423828, "global_step": 186536, "epoch": 1110} {"train_loss": -11.198784828186035, "global_step": 186537, "epoch": 1110} {"train_loss": -11.251627922058105, "global_step": 186538, "epoch": 1110} {"train_loss": -10.866639137268066, "global_step": 186539, "epoch": 1110} {"train_loss": -11.169273376464844, "global_step": 186540, "epoch": 1110} {"train_loss": -10.905256271362305, "global_step": 186541, "epoch": 1110} {"train_loss": -10.694602966308594, "global_step": 186542, "epoch": 1110} {"train_loss": -11.445415496826172, "global_step": 186543, "epoch": 1110} {"train_loss": -10.538122177124023, "global_step": 186544, "epoch": 1110} {"train_loss": -11.22585678100586, "global_step": 186545, "epoch": 1110} {"train_loss": -11.03946304321289, "global_step": 186546, "epoch": 1110} {"train_loss": -10.720260620117188, "global_step": 186547, "epoch": 1110} {"train_loss": -11.216212272644043, "global_step": 186548, "epoch": 1110} {"train_loss": -11.144147872924805, "global_step": 186549, "epoch": 1110} {"train_loss": -11.404869079589844, "global_step": 186550, "epoch": 1110} {"train_loss": -11.060619354248047, "global_step": 186551, "epoch": 1110} {"train_loss": -11.294084548950195, "global_step": 186552, "epoch": 1110} {"train_loss": -11.240255355834961, "global_step": 186553, "epoch": 1110} {"train_loss": -11.500848770141602, "global_step": 186554, "epoch": 1110} {"train_loss": -11.234640121459961, "global_step": 186555, "epoch": 1110} {"train_loss": -11.440740585327148, "global_step": 186556, "epoch": 1110} {"train_loss": -11.250911712646484, "global_step": 186557, "epoch": 1110} {"train_loss": -11.506538391113281, "global_step": 186558, "epoch": 1110} {"train_loss": -11.144195556640625, "global_step": 186559, "epoch": 1110} {"train_loss": -11.506328582763672, "global_step": 186560, "epoch": 1110} {"train_loss": -11.339225769042969, "global_step": 186561, "epoch": 1110} {"train_loss": -11.633556365966797, "global_step": 186562, "epoch": 1110} {"train_loss": -11.584540367126465, "global_step": 186563, "epoch": 1110} {"train_loss": -11.43083667755127, "global_step": 186564, "epoch": 1110} {"train_loss": -11.6512451171875, "global_step": 186565, "epoch": 1110} {"train_loss": -11.58267593383789, "global_step": 186566, "epoch": 1110} {"train_loss": -11.442919731140137, "global_step": 186567, "epoch": 1110} {"train_loss": -11.595671653747559, "global_step": 186568, "epoch": 1110} {"train_loss": -11.402804374694824, "global_step": 186569, "epoch": 1110} {"train_loss": -11.481554985046387, "global_step": 186570, "epoch": 1110} {"train_loss": -11.29631233215332, "global_step": 186571, "epoch": 1110} {"train_loss": -11.603153228759766, "global_step": 186572, "epoch": 1110} {"train_loss": -11.49662971496582, "global_step": 186573, "epoch": 1110} {"train_loss": -11.56966781616211, "global_step": 186574, "epoch": 1110} {"train_loss": -11.586244583129883, "global_step": 186575, "epoch": 1110} {"train_loss": -11.370028495788574, "global_step": 186576, "epoch": 1110} {"train_loss": -11.298516273498535, "global_step": 186577, "epoch": 1110} {"train_loss": -11.631482124328613, "global_step": 186578, "epoch": 1110} {"train_loss": -11.370882987976074, "global_step": 186579, "epoch": 1110} {"train_loss": -11.439823150634766, "global_step": 186580, "epoch": 1110} {"train_loss": -11.410762786865234, "global_step": 186581, "epoch": 1110} {"train_loss": -11.488101959228516, "global_step": 186582, "epoch": 1110} {"train_loss": -11.68149185180664, "global_step": 186583, "epoch": 1110} {"train_loss": -11.349495887756348, "global_step": 186584, "epoch": 1110} {"train_loss": -11.42251205444336, "global_step": 186585, "epoch": 1110} {"train_loss": -11.03834342956543, "global_step": 186586, "epoch": 1110} {"train_loss": -11.332615852355957, "global_step": 186587, "epoch": 1110} {"train_loss": -11.54684829711914, "global_step": 186588, "epoch": 1110} {"train_loss": -11.412235260009766, "global_step": 186589, "epoch": 1110} {"train_loss": -11.170644760131836, "global_step": 186590, "epoch": 1110} {"train_loss": -11.011493682861328, "global_step": 186591, "epoch": 1110} {"train_loss": -11.608888626098633, "global_step": 186592, "epoch": 1110} {"train_loss": -11.341987609863281, "global_step": 186593, "epoch": 1110} {"train_loss": -10.648391723632812, "global_step": 186594, "epoch": 1110} {"train_loss": -10.64605712890625, "global_step": 186595, "epoch": 1110} {"train_loss": -11.212626457214355, "global_step": 186596, "epoch": 1110} {"train_loss": -9.480585098266602, "global_step": 186597, "epoch": 1110} {"train_loss": -10.63619613647461, "global_step": 186598, "epoch": 1110} {"train_loss": -10.903213500976562, "global_step": 186599, "epoch": 1110} {"train_loss": -10.014252662658691, "global_step": 186600, "epoch": 1110} {"train_loss": -10.522825241088867, "global_step": 186601, "epoch": 1110} {"train_loss": -9.763381004333496, "global_step": 186602, "epoch": 1110} {"train_loss": -10.56454086303711, "global_step": 186603, "epoch": 1110} {"train_loss": -11.123408317565918, "global_step": 186604, "epoch": 1110} {"train_loss": -10.701356887817383, "global_step": 186605, "epoch": 1110} {"train_loss": -9.894920349121094, "global_step": 186606, "epoch": 1110} {"train_loss": -11.228861808776855, "global_step": 186607, "epoch": 1110} {"train_loss": -10.115728378295898, "global_step": 186608, "epoch": 1110} {"train_loss": -10.057119369506836, "global_step": 186609, "epoch": 1110} {"train_loss": -11.043428421020508, "global_step": 186610, "epoch": 1110} {"train_loss": -9.8758544921875, "global_step": 186611, "epoch": 1110} {"train_loss": -10.737372398376465, "global_step": 186612, "epoch": 1110} {"train_loss": -10.215009689331055, "global_step": 186613, "epoch": 1110} {"train_loss": -11.209465026855469, "global_step": 186614, "epoch": 1110} {"train_loss": -10.588111877441406, "global_step": 186615, "epoch": 1110} {"train_loss": -10.820161819458008, "global_step": 186616, "epoch": 1110} {"train_loss": -10.78020191192627, "global_step": 186617, "epoch": 1110} {"train_loss": -10.34445571899414, "global_step": 186618, "epoch": 1110} {"train_loss": -10.928596496582031, "global_step": 186619, "epoch": 1110} {"train_loss": -10.08128833770752, "global_step": 186620, "epoch": 1110} {"train_loss": -11.00556755065918, "global_step": 186621, "epoch": 1110} {"train_loss": -10.247072219848633, "global_step": 186622, "epoch": 1110} {"train_loss": -11.081995010375977, "global_step": 186623, "epoch": 1110} {"train_loss": -10.641490936279297, "global_step": 186624, "epoch": 1110} {"train_loss": -10.993766784667969, "global_step": 186625, "epoch": 1110} {"train_loss": -10.835091590881348, "global_step": 186626, "epoch": 1110} {"train_loss": -11.048905372619629, "global_step": 186627, "epoch": 1110} {"train_loss": -10.795848846435547, "global_step": 186628, "epoch": 1110} {"train_loss": -10.8733491897583, "global_step": 186629, "epoch": 1110} {"train_loss": -11.140890121459961, "global_step": 186630, "epoch": 1110} {"train_loss": -11.128937721252441, "global_step": 186631, "epoch": 1110} {"train_loss": -11.065032958984375, "global_step": 186632, "epoch": 1110} {"train_loss": -11.125322341918945, "global_step": 186633, "epoch": 1110} {"train_loss": -10.893259048461914, "global_step": 186634, "epoch": 1110} {"train_loss": -10.900146484375, "global_step": 186635, "epoch": 1110} {"train_loss": -11.339487075805664, "global_step": 186636, "epoch": 1110} {"train_loss": -10.973546028137207, "global_step": 186637, "epoch": 1110} {"train_loss": -11.143417358398438, "global_step": 186638, "epoch": 1110} {"train_loss": -11.112553596496582, "global_step": 186639, "epoch": 1110} {"train_loss": -11.174901008605957, "global_step": 186640, "epoch": 1110} {"train_loss": -11.012081146240234, "global_step": 186641, "epoch": 1110} {"train_loss": -11.399932861328125, "global_step": 186642, "epoch": 1110} {"train_loss": -10.958427429199219, "global_step": 186643, "epoch": 1110} {"train_loss": -11.316106796264648, "global_step": 186644, "epoch": 1110} {"train_loss": -11.2643404006958, "global_step": 186645, "epoch": 1110} {"train_loss": -11.360221862792969, "global_step": 186646, "epoch": 1110} {"train_loss": -11.14346078463963, "global_step": 186647, "epoch": 1110, "val_loss": 247834.34375, "train_action_mse_error": 0.30766940116882324} {"train_loss": -11.32198429107666, "global_step": 186648, "epoch": 1111} {"train_loss": -11.228503227233887, "global_step": 186649, "epoch": 1111} {"train_loss": -11.429317474365234, "global_step": 186650, "epoch": 1111} {"train_loss": -11.44578742980957, "global_step": 186651, "epoch": 1111} {"train_loss": -11.285009384155273, "global_step": 186652, "epoch": 1111} {"train_loss": -11.346155166625977, "global_step": 186653, "epoch": 1111} {"train_loss": -11.393836975097656, "global_step": 186654, "epoch": 1111} {"train_loss": -11.667375564575195, "global_step": 186655, "epoch": 1111} {"train_loss": -11.258514404296875, "global_step": 186656, "epoch": 1111} {"train_loss": -11.642786026000977, "global_step": 186657, "epoch": 1111} {"train_loss": -11.194710731506348, "global_step": 186658, "epoch": 1111} {"train_loss": -11.291200637817383, "global_step": 186659, "epoch": 1111} {"train_loss": -11.43079948425293, "global_step": 186660, "epoch": 1111} {"train_loss": -11.492897033691406, "global_step": 186661, "epoch": 1111} {"train_loss": -11.388696670532227, "global_step": 186662, "epoch": 1111} {"train_loss": -11.462177276611328, "global_step": 186663, "epoch": 1111} {"train_loss": -11.295917510986328, "global_step": 186664, "epoch": 1111} {"train_loss": -11.32942008972168, "global_step": 186665, "epoch": 1111} {"train_loss": -11.501835823059082, "global_step": 186666, "epoch": 1111} {"train_loss": -11.52774429321289, "global_step": 186667, "epoch": 1111} {"train_loss": -11.636850357055664, "global_step": 186668, "epoch": 1111} {"train_loss": -11.57425594329834, "global_step": 186669, "epoch": 1111} {"train_loss": -11.283258438110352, "global_step": 186670, "epoch": 1111} {"train_loss": -11.481937408447266, "global_step": 186671, "epoch": 1111} {"train_loss": -11.650405883789062, "global_step": 186672, "epoch": 1111} {"train_loss": -11.556110382080078, "global_step": 186673, "epoch": 1111} {"train_loss": -11.65829086303711, "global_step": 186674, "epoch": 1111} {"train_loss": -11.602616310119629, "global_step": 186675, "epoch": 1111} {"train_loss": -11.609686851501465, "global_step": 186676, "epoch": 1111} {"train_loss": -11.699127197265625, "global_step": 186677, "epoch": 1111} {"train_loss": -11.758673667907715, "global_step": 186678, "epoch": 1111} {"train_loss": -11.655142784118652, "global_step": 186679, "epoch": 1111} {"train_loss": -11.525242805480957, "global_step": 186680, "epoch": 1111} {"train_loss": -11.683656692504883, "global_step": 186681, "epoch": 1111} {"train_loss": -11.710121154785156, "global_step": 186682, "epoch": 1111} {"train_loss": -11.422812461853027, "global_step": 186683, "epoch": 1111} {"train_loss": -11.692249298095703, "global_step": 186684, "epoch": 1111} {"train_loss": -11.564665794372559, "global_step": 186685, "epoch": 1111} {"train_loss": -11.6980562210083, "global_step": 186686, "epoch": 1111} {"train_loss": -11.317914962768555, "global_step": 186687, "epoch": 1111} {"train_loss": -11.163215637207031, "global_step": 186688, "epoch": 1111} {"train_loss": -11.558503150939941, "global_step": 186689, "epoch": 1111} {"train_loss": -11.328178405761719, "global_step": 186690, "epoch": 1111} {"train_loss": -11.253181457519531, "global_step": 186691, "epoch": 1111} {"train_loss": -11.3359375, "global_step": 186692, "epoch": 1111} {"train_loss": -11.553003311157227, "global_step": 186693, "epoch": 1111} {"train_loss": -11.674699783325195, "global_step": 186694, "epoch": 1111} {"train_loss": -11.43798828125, "global_step": 186695, "epoch": 1111} {"train_loss": -11.322769165039062, "global_step": 186696, "epoch": 1111} {"train_loss": -11.120564460754395, "global_step": 186697, "epoch": 1111} {"train_loss": -11.375198364257812, "global_step": 186698, "epoch": 1111} {"train_loss": -10.276391983032227, "global_step": 186699, "epoch": 1111} {"train_loss": -10.789630889892578, "global_step": 186700, "epoch": 1111} {"train_loss": -11.419260025024414, "global_step": 186701, "epoch": 1111} {"train_loss": -11.516170501708984, "global_step": 186702, "epoch": 1111} {"train_loss": -11.352685928344727, "global_step": 186703, "epoch": 1111} {"train_loss": -11.456993103027344, "global_step": 186704, "epoch": 1111} {"train_loss": -11.334918975830078, "global_step": 186705, "epoch": 1111} {"train_loss": -11.638914108276367, "global_step": 186706, "epoch": 1111} {"train_loss": -11.516300201416016, "global_step": 186707, "epoch": 1111} {"train_loss": -11.736757278442383, "global_step": 186708, "epoch": 1111} {"train_loss": -11.728982925415039, "global_step": 186709, "epoch": 1111} {"train_loss": -11.40617847442627, "global_step": 186710, "epoch": 1111} {"train_loss": -11.463176727294922, "global_step": 186711, "epoch": 1111} {"train_loss": -11.213518142700195, "global_step": 186712, "epoch": 1111} {"train_loss": -11.22972583770752, "global_step": 186713, "epoch": 1111} {"train_loss": -11.33545207977295, "global_step": 186714, "epoch": 1111} {"train_loss": -11.360960006713867, "global_step": 186715, "epoch": 1111} {"train_loss": -10.425494194030762, "global_step": 186716, "epoch": 1111} {"train_loss": -10.0429105758667, "global_step": 186717, "epoch": 1111} {"train_loss": -11.384413719177246, "global_step": 186718, "epoch": 1111} {"train_loss": -11.1572904586792, "global_step": 186719, "epoch": 1111} {"train_loss": -10.690783500671387, "global_step": 186720, "epoch": 1111} {"train_loss": -10.976033210754395, "global_step": 186721, "epoch": 1111} {"train_loss": -11.206459045410156, "global_step": 186722, "epoch": 1111} {"train_loss": -10.407873153686523, "global_step": 186723, "epoch": 1111} {"train_loss": -11.170541763305664, "global_step": 186724, "epoch": 1111} {"train_loss": -11.169693946838379, "global_step": 186725, "epoch": 1111} {"train_loss": -11.483787536621094, "global_step": 186726, "epoch": 1111} {"train_loss": -11.02597427368164, "global_step": 186727, "epoch": 1111} {"train_loss": -10.835590362548828, "global_step": 186728, "epoch": 1111} {"train_loss": -10.213785171508789, "global_step": 186729, "epoch": 1111} {"train_loss": -10.860000610351562, "global_step": 186730, "epoch": 1111} {"train_loss": -11.110206604003906, "global_step": 186731, "epoch": 1111} {"train_loss": -10.374822616577148, "global_step": 186732, "epoch": 1111} {"train_loss": -10.806123733520508, "global_step": 186733, "epoch": 1111} {"train_loss": -10.846800804138184, "global_step": 186734, "epoch": 1111} {"train_loss": -10.30528450012207, "global_step": 186735, "epoch": 1111} {"train_loss": -10.304943084716797, "global_step": 186736, "epoch": 1111} {"train_loss": -10.53235149383545, "global_step": 186737, "epoch": 1111} {"train_loss": -8.646456718444824, "global_step": 186738, "epoch": 1111} {"train_loss": -9.779853820800781, "global_step": 186739, "epoch": 1111} {"train_loss": -8.221870422363281, "global_step": 186740, "epoch": 1111} {"train_loss": -9.765338897705078, "global_step": 186741, "epoch": 1111} {"train_loss": -8.503166198730469, "global_step": 186742, "epoch": 1111} {"train_loss": -10.040201187133789, "global_step": 186743, "epoch": 1111} {"train_loss": -8.86420726776123, "global_step": 186744, "epoch": 1111} {"train_loss": -10.373658180236816, "global_step": 186745, "epoch": 1111} {"train_loss": -9.12454605102539, "global_step": 186746, "epoch": 1111} {"train_loss": -10.338173866271973, "global_step": 186747, "epoch": 1111} {"train_loss": -9.257457733154297, "global_step": 186748, "epoch": 1111} {"train_loss": -9.615121841430664, "global_step": 186749, "epoch": 1111} {"train_loss": -8.991775512695312, "global_step": 186750, "epoch": 1111} {"train_loss": -9.767202377319336, "global_step": 186751, "epoch": 1111} {"train_loss": -10.185529708862305, "global_step": 186752, "epoch": 1111} {"train_loss": -10.242685317993164, "global_step": 186753, "epoch": 1111} {"train_loss": -10.050771713256836, "global_step": 186754, "epoch": 1111} {"train_loss": -9.943487167358398, "global_step": 186755, "epoch": 1111} {"train_loss": -10.460068702697754, "global_step": 186756, "epoch": 1111} {"train_loss": -10.380819320678711, "global_step": 186757, "epoch": 1111} {"train_loss": -10.375633239746094, "global_step": 186758, "epoch": 1111} {"train_loss": -10.466364860534668, "global_step": 186759, "epoch": 1111} {"train_loss": -10.705571174621582, "global_step": 186760, "epoch": 1111} {"train_loss": -10.43795394897461, "global_step": 186761, "epoch": 1111} {"train_loss": -10.38663387298584, "global_step": 186762, "epoch": 1111} {"train_loss": -10.681549072265625, "global_step": 186763, "epoch": 1111} {"train_loss": -10.491405487060547, "global_step": 186764, "epoch": 1111} {"train_loss": -10.41572380065918, "global_step": 186765, "epoch": 1111} {"train_loss": -10.821191787719727, "global_step": 186766, "epoch": 1111} {"train_loss": -10.816943168640137, "global_step": 186767, "epoch": 1111} {"train_loss": -10.495830535888672, "global_step": 186768, "epoch": 1111} {"train_loss": -10.598518371582031, "global_step": 186769, "epoch": 1111} {"train_loss": -10.7943696975708, "global_step": 186770, "epoch": 1111} {"train_loss": -10.719345092773438, "global_step": 186771, "epoch": 1111} {"train_loss": -10.66646957397461, "global_step": 186772, "epoch": 1111} {"train_loss": -10.795400619506836, "global_step": 186773, "epoch": 1111} {"train_loss": -10.910080909729004, "global_step": 186774, "epoch": 1111} {"train_loss": -10.83480453491211, "global_step": 186775, "epoch": 1111} {"train_loss": -10.907928466796875, "global_step": 186776, "epoch": 1111} {"train_loss": -10.996368408203125, "global_step": 186777, "epoch": 1111} {"train_loss": -11.102792739868164, "global_step": 186778, "epoch": 1111} {"train_loss": -11.072793960571289, "global_step": 186779, "epoch": 1111} {"train_loss": -11.037704467773438, "global_step": 186780, "epoch": 1111} {"train_loss": -11.098170280456543, "global_step": 186781, "epoch": 1111} {"train_loss": -11.050661087036133, "global_step": 186782, "epoch": 1111} {"train_loss": -10.971784591674805, "global_step": 186783, "epoch": 1111} {"train_loss": -11.09560775756836, "global_step": 186784, "epoch": 1111} {"train_loss": -10.891088485717773, "global_step": 186785, "epoch": 1111} {"train_loss": -11.091662406921387, "global_step": 186786, "epoch": 1111} {"train_loss": -11.135028839111328, "global_step": 186787, "epoch": 1111} {"train_loss": -11.228527069091797, "global_step": 186788, "epoch": 1111} {"train_loss": -11.200579643249512, "global_step": 186789, "epoch": 1111} {"train_loss": -11.250631332397461, "global_step": 186790, "epoch": 1111} {"train_loss": -11.33407211303711, "global_step": 186791, "epoch": 1111} {"train_loss": -10.952275276184082, "global_step": 186792, "epoch": 1111} {"train_loss": -11.246992111206055, "global_step": 186793, "epoch": 1111} {"train_loss": -11.300093650817871, "global_step": 186794, "epoch": 1111} {"train_loss": -11.19688606262207, "global_step": 186795, "epoch": 1111} {"train_loss": -11.388172149658203, "global_step": 186796, "epoch": 1111} {"train_loss": -11.09521484375, "global_step": 186797, "epoch": 1111} {"train_loss": -11.256528854370117, "global_step": 186798, "epoch": 1111} {"train_loss": -11.082992553710938, "global_step": 186799, "epoch": 1111} {"train_loss": -11.105798721313477, "global_step": 186800, "epoch": 1111} {"train_loss": -11.232629776000977, "global_step": 186801, "epoch": 1111} {"train_loss": -11.300373077392578, "global_step": 186802, "epoch": 1111} {"train_loss": -11.462053298950195, "global_step": 186803, "epoch": 1111} {"train_loss": -11.249157905578613, "global_step": 186804, "epoch": 1111} {"train_loss": -11.349726676940918, "global_step": 186805, "epoch": 1111} {"train_loss": -11.472896575927734, "global_step": 186806, "epoch": 1111} {"train_loss": -11.416365623474121, "global_step": 186807, "epoch": 1111} {"train_loss": -11.486427307128906, "global_step": 186808, "epoch": 1111} {"train_loss": -11.227349281311035, "global_step": 186809, "epoch": 1111} {"train_loss": -11.565864562988281, "global_step": 186810, "epoch": 1111} {"train_loss": -11.308183670043945, "global_step": 186811, "epoch": 1111} {"train_loss": -11.354972839355469, "global_step": 186812, "epoch": 1111} {"train_loss": -11.453553199768066, "global_step": 186813, "epoch": 1111} {"train_loss": -11.352893829345703, "global_step": 186814, "epoch": 1111} {"train_loss": -10.99904031412942, "global_step": 186815, "epoch": 1111, "val_loss": 247443.609375} {"train_loss": -11.710892677307129, "global_step": 186816, "epoch": 1112} {"train_loss": -11.476838111877441, "global_step": 186817, "epoch": 1112} {"train_loss": -11.673038482666016, "global_step": 186818, "epoch": 1112} {"train_loss": -11.657491683959961, "global_step": 186819, "epoch": 1112} {"train_loss": -11.669412612915039, "global_step": 186820, "epoch": 1112} {"train_loss": -11.664649963378906, "global_step": 186821, "epoch": 1112} {"train_loss": -11.536323547363281, "global_step": 186822, "epoch": 1112} {"train_loss": -11.612957000732422, "global_step": 186823, "epoch": 1112} {"train_loss": -11.760995864868164, "global_step": 186824, "epoch": 1112} {"train_loss": -11.544914245605469, "global_step": 186825, "epoch": 1112} {"train_loss": -11.648787498474121, "global_step": 186826, "epoch": 1112} {"train_loss": -11.556219100952148, "global_step": 186827, "epoch": 1112} {"train_loss": -11.65170955657959, "global_step": 186828, "epoch": 1112} {"train_loss": -11.458189010620117, "global_step": 186829, "epoch": 1112} {"train_loss": -11.470756530761719, "global_step": 186830, "epoch": 1112} {"train_loss": -11.441875457763672, "global_step": 186831, "epoch": 1112} {"train_loss": -11.542400360107422, "global_step": 186832, "epoch": 1112} {"train_loss": -11.624958992004395, "global_step": 186833, "epoch": 1112} {"train_loss": -11.283088684082031, "global_step": 186834, "epoch": 1112} {"train_loss": -11.208122253417969, "global_step": 186835, "epoch": 1112} {"train_loss": -11.132242202758789, "global_step": 186836, "epoch": 1112} {"train_loss": -11.384111404418945, "global_step": 186837, "epoch": 1112} {"train_loss": -10.935563087463379, "global_step": 186838, "epoch": 1112} {"train_loss": -11.217245101928711, "global_step": 186839, "epoch": 1112} {"train_loss": -11.442832946777344, "global_step": 186840, "epoch": 1112} {"train_loss": -11.330574035644531, "global_step": 186841, "epoch": 1112} {"train_loss": -11.415539741516113, "global_step": 186842, "epoch": 1112} {"train_loss": -11.17825698852539, "global_step": 186843, "epoch": 1112} {"train_loss": -11.147895812988281, "global_step": 186844, "epoch": 1112} {"train_loss": -10.83237075805664, "global_step": 186845, "epoch": 1112} {"train_loss": -11.423060417175293, "global_step": 186846, "epoch": 1112} {"train_loss": -11.247499465942383, "global_step": 186847, "epoch": 1112} {"train_loss": -11.299458503723145, "global_step": 186848, "epoch": 1112} {"train_loss": -10.950095176696777, "global_step": 186849, "epoch": 1112} {"train_loss": -11.512716293334961, "global_step": 186850, "epoch": 1112} {"train_loss": -11.375496864318848, "global_step": 186851, "epoch": 1112} {"train_loss": -11.454752922058105, "global_step": 186852, "epoch": 1112} {"train_loss": -11.53725528717041, "global_step": 186853, "epoch": 1112} {"train_loss": -11.081033706665039, "global_step": 186854, "epoch": 1112} {"train_loss": -11.474696159362793, "global_step": 186855, "epoch": 1112} {"train_loss": -11.041204452514648, "global_step": 186856, "epoch": 1112} {"train_loss": -10.766722679138184, "global_step": 186857, "epoch": 1112} {"train_loss": -11.504865646362305, "global_step": 186858, "epoch": 1112} {"train_loss": -10.196013450622559, "global_step": 186859, "epoch": 1112} {"train_loss": -10.241902351379395, "global_step": 186860, "epoch": 1112} {"train_loss": -11.020275115966797, "global_step": 186861, "epoch": 1112} {"train_loss": -11.016090393066406, "global_step": 186862, "epoch": 1112} {"train_loss": -11.510290145874023, "global_step": 186863, "epoch": 1112} {"train_loss": -11.008855819702148, "global_step": 186864, "epoch": 1112} {"train_loss": -11.193796157836914, "global_step": 186865, "epoch": 1112} {"train_loss": -10.413728713989258, "global_step": 186866, "epoch": 1112} {"train_loss": -11.122766494750977, "global_step": 186867, "epoch": 1112} {"train_loss": -10.847258567810059, "global_step": 186868, "epoch": 1112} {"train_loss": -11.108034133911133, "global_step": 186869, "epoch": 1112} {"train_loss": -10.954168319702148, "global_step": 186870, "epoch": 1112} {"train_loss": -10.624978065490723, "global_step": 186871, "epoch": 1112} {"train_loss": -11.277374267578125, "global_step": 186872, "epoch": 1112} {"train_loss": -10.376341819763184, "global_step": 186873, "epoch": 1112} {"train_loss": -11.207475662231445, "global_step": 186874, "epoch": 1112} {"train_loss": -10.69664192199707, "global_step": 186875, "epoch": 1112} {"train_loss": -10.78309440612793, "global_step": 186876, "epoch": 1112} {"train_loss": -11.437704086303711, "global_step": 186877, "epoch": 1112} {"train_loss": -10.457901000976562, "global_step": 186878, "epoch": 1112} {"train_loss": -11.356298446655273, "global_step": 186879, "epoch": 1112} {"train_loss": -10.785768508911133, "global_step": 186880, "epoch": 1112} {"train_loss": -11.275518417358398, "global_step": 186881, "epoch": 1112} {"train_loss": -10.76304817199707, "global_step": 186882, "epoch": 1112} {"train_loss": -11.397765159606934, "global_step": 186883, "epoch": 1112} {"train_loss": -11.245626449584961, "global_step": 186884, "epoch": 1112} {"train_loss": -10.999235153198242, "global_step": 186885, "epoch": 1112} {"train_loss": -11.068115234375, "global_step": 186886, "epoch": 1112} {"train_loss": -11.067306518554688, "global_step": 186887, "epoch": 1112} {"train_loss": -11.362956047058105, "global_step": 186888, "epoch": 1112} {"train_loss": -10.559059143066406, "global_step": 186889, "epoch": 1112} {"train_loss": -11.385568618774414, "global_step": 186890, "epoch": 1112} {"train_loss": -10.77256965637207, "global_step": 186891, "epoch": 1112} {"train_loss": -10.72150993347168, "global_step": 186892, "epoch": 1112} {"train_loss": -10.231670379638672, "global_step": 186893, "epoch": 1112} {"train_loss": -10.886606216430664, "global_step": 186894, "epoch": 1112} {"train_loss": -10.147380828857422, "global_step": 186895, "epoch": 1112} {"train_loss": -10.984756469726562, "global_step": 186896, "epoch": 1112} {"train_loss": -10.165257453918457, "global_step": 186897, "epoch": 1112} {"train_loss": -11.270994186401367, "global_step": 186898, "epoch": 1112} {"train_loss": -10.511825561523438, "global_step": 186899, "epoch": 1112} {"train_loss": -11.135896682739258, "global_step": 186900, "epoch": 1112} {"train_loss": -10.53236198425293, "global_step": 186901, "epoch": 1112} {"train_loss": -10.872025489807129, "global_step": 186902, "epoch": 1112} {"train_loss": -10.869336128234863, "global_step": 186903, "epoch": 1112} {"train_loss": -11.18263053894043, "global_step": 186904, "epoch": 1112} {"train_loss": -11.005674362182617, "global_step": 186905, "epoch": 1112} {"train_loss": -11.020193099975586, "global_step": 186906, "epoch": 1112} {"train_loss": -11.060356140136719, "global_step": 186907, "epoch": 1112} {"train_loss": -11.178112030029297, "global_step": 186908, "epoch": 1112} {"train_loss": -11.229340553283691, "global_step": 186909, "epoch": 1112} {"train_loss": -11.009679794311523, "global_step": 186910, "epoch": 1112} {"train_loss": -10.89046859741211, "global_step": 186911, "epoch": 1112} {"train_loss": -10.882157325744629, "global_step": 186912, "epoch": 1112} {"train_loss": -11.184921264648438, "global_step": 186913, "epoch": 1112} {"train_loss": -11.0691556930542, "global_step": 186914, "epoch": 1112} {"train_loss": -10.93420124053955, "global_step": 186915, "epoch": 1112} {"train_loss": -11.112674713134766, "global_step": 186916, "epoch": 1112} {"train_loss": -11.2942476272583, "global_step": 186917, "epoch": 1112} {"train_loss": -10.764130592346191, "global_step": 186918, "epoch": 1112} {"train_loss": -11.360174179077148, "global_step": 186919, "epoch": 1112} {"train_loss": -11.158050537109375, "global_step": 186920, "epoch": 1112} {"train_loss": -11.350069999694824, "global_step": 186921, "epoch": 1112} {"train_loss": -11.407074928283691, "global_step": 186922, "epoch": 1112} {"train_loss": -11.039669036865234, "global_step": 186923, "epoch": 1112} {"train_loss": -10.87509822845459, "global_step": 186924, "epoch": 1112} {"train_loss": -11.262969970703125, "global_step": 186925, "epoch": 1112} {"train_loss": -10.928886413574219, "global_step": 186926, "epoch": 1112} {"train_loss": -11.091119766235352, "global_step": 186927, "epoch": 1112} {"train_loss": -11.297499656677246, "global_step": 186928, "epoch": 1112} {"train_loss": -11.076982498168945, "global_step": 186929, "epoch": 1112} {"train_loss": -11.170951843261719, "global_step": 186930, "epoch": 1112} {"train_loss": -11.216865539550781, "global_step": 186931, "epoch": 1112} {"train_loss": -11.240405082702637, "global_step": 186932, "epoch": 1112} {"train_loss": -10.910813331604004, "global_step": 186933, "epoch": 1112} {"train_loss": -11.013250350952148, "global_step": 186934, "epoch": 1112} {"train_loss": -11.337127685546875, "global_step": 186935, "epoch": 1112} {"train_loss": -11.338370323181152, "global_step": 186936, "epoch": 1112} {"train_loss": -11.34168815612793, "global_step": 186937, "epoch": 1112} {"train_loss": -11.031072616577148, "global_step": 186938, "epoch": 1112} {"train_loss": -11.02584171295166, "global_step": 186939, "epoch": 1112} {"train_loss": -11.528911590576172, "global_step": 186940, "epoch": 1112} {"train_loss": -11.092613220214844, "global_step": 186941, "epoch": 1112} {"train_loss": -11.34043025970459, "global_step": 186942, "epoch": 1112} {"train_loss": -11.446295738220215, "global_step": 186943, "epoch": 1112} {"train_loss": -11.349546432495117, "global_step": 186944, "epoch": 1112} {"train_loss": -11.231093406677246, "global_step": 186945, "epoch": 1112} {"train_loss": -11.613571166992188, "global_step": 186946, "epoch": 1112} {"train_loss": -11.2845458984375, "global_step": 186947, "epoch": 1112} {"train_loss": -11.32436752319336, "global_step": 186948, "epoch": 1112} {"train_loss": -11.485432624816895, "global_step": 186949, "epoch": 1112} {"train_loss": -10.884441375732422, "global_step": 186950, "epoch": 1112} {"train_loss": -11.241247177124023, "global_step": 186951, "epoch": 1112} {"train_loss": -11.257013320922852, "global_step": 186952, "epoch": 1112} {"train_loss": -10.951780319213867, "global_step": 186953, "epoch": 1112} {"train_loss": -11.129830360412598, "global_step": 186954, "epoch": 1112} {"train_loss": -11.328093528747559, "global_step": 186955, "epoch": 1112} {"train_loss": -11.070899963378906, "global_step": 186956, "epoch": 1112} {"train_loss": -11.430946350097656, "global_step": 186957, "epoch": 1112} {"train_loss": -11.195388793945312, "global_step": 186958, "epoch": 1112} {"train_loss": -11.023689270019531, "global_step": 186959, "epoch": 1112} {"train_loss": -11.175289154052734, "global_step": 186960, "epoch": 1112} {"train_loss": -11.090919494628906, "global_step": 186961, "epoch": 1112} {"train_loss": -11.075324058532715, "global_step": 186962, "epoch": 1112} {"train_loss": -11.437103271484375, "global_step": 186963, "epoch": 1112} {"train_loss": -11.328958511352539, "global_step": 186964, "epoch": 1112} {"train_loss": -11.279681205749512, "global_step": 186965, "epoch": 1112} {"train_loss": -11.185903549194336, "global_step": 186966, "epoch": 1112} {"train_loss": -11.396317481994629, "global_step": 186967, "epoch": 1112} {"train_loss": -11.374826431274414, "global_step": 186968, "epoch": 1112} {"train_loss": -11.244340896606445, "global_step": 186969, "epoch": 1112} {"train_loss": -11.060909271240234, "global_step": 186970, "epoch": 1112} {"train_loss": -11.46099853515625, "global_step": 186971, "epoch": 1112} {"train_loss": -11.335121154785156, "global_step": 186972, "epoch": 1112} {"train_loss": -11.621133804321289, "global_step": 186973, "epoch": 1112} {"train_loss": -11.39649486541748, "global_step": 186974, "epoch": 1112} {"train_loss": -11.125722885131836, "global_step": 186975, "epoch": 1112} {"train_loss": -11.522936820983887, "global_step": 186976, "epoch": 1112} {"train_loss": -11.28676986694336, "global_step": 186977, "epoch": 1112} {"train_loss": -11.263238906860352, "global_step": 186978, "epoch": 1112} {"train_loss": -11.19776439666748, "global_step": 186979, "epoch": 1112} {"train_loss": -11.397071838378906, "global_step": 186980, "epoch": 1112} {"train_loss": -11.29202651977539, "global_step": 186981, "epoch": 1112} {"train_loss": -11.443379402160645, "global_step": 186982, "epoch": 1112} {"train_loss": -11.168964334896632, "global_step": 186983, "epoch": 1112, "val_loss": 250202.34375} {"train_loss": -10.900033950805664, "global_step": 186984, "epoch": 1113} {"train_loss": -10.864675521850586, "global_step": 186985, "epoch": 1113} {"train_loss": -11.091911315917969, "global_step": 186986, "epoch": 1113} {"train_loss": -11.152907371520996, "global_step": 186987, "epoch": 1113} {"train_loss": -11.268404006958008, "global_step": 186988, "epoch": 1113} {"train_loss": -11.524032592773438, "global_step": 186989, "epoch": 1113} {"train_loss": -11.132379531860352, "global_step": 186990, "epoch": 1113} {"train_loss": -10.909296035766602, "global_step": 186991, "epoch": 1113} {"train_loss": -10.903608322143555, "global_step": 186992, "epoch": 1113} {"train_loss": -11.364084243774414, "global_step": 186993, "epoch": 1113} {"train_loss": -11.080062866210938, "global_step": 186994, "epoch": 1113} {"train_loss": -11.307732582092285, "global_step": 186995, "epoch": 1113} {"train_loss": -10.311363220214844, "global_step": 186996, "epoch": 1113} {"train_loss": -10.819358825683594, "global_step": 186997, "epoch": 1113} {"train_loss": -11.11825180053711, "global_step": 186998, "epoch": 1113} {"train_loss": -11.257333755493164, "global_step": 186999, "epoch": 1113} {"train_loss": -10.92419719696045, "global_step": 187000, "epoch": 1113} {"train_loss": -11.534626007080078, "global_step": 187001, "epoch": 1113} {"train_loss": -11.083964347839355, "global_step": 187002, "epoch": 1113} {"train_loss": -11.18657112121582, "global_step": 187003, "epoch": 1113} {"train_loss": -11.338820457458496, "global_step": 187004, "epoch": 1113} {"train_loss": -10.593428611755371, "global_step": 187005, "epoch": 1113} {"train_loss": -11.104940414428711, "global_step": 187006, "epoch": 1113} {"train_loss": -11.045527458190918, "global_step": 187007, "epoch": 1113} {"train_loss": -11.071678161621094, "global_step": 187008, "epoch": 1113} {"train_loss": -10.621988296508789, "global_step": 187009, "epoch": 1113} {"train_loss": -10.993196487426758, "global_step": 187010, "epoch": 1113} {"train_loss": -10.319439888000488, "global_step": 187011, "epoch": 1113} {"train_loss": -10.634626388549805, "global_step": 187012, "epoch": 1113} {"train_loss": -10.329169273376465, "global_step": 187013, "epoch": 1113} {"train_loss": -10.27771282196045, "global_step": 187014, "epoch": 1113} {"train_loss": -10.661283493041992, "global_step": 187015, "epoch": 1113} {"train_loss": -9.200672149658203, "global_step": 187016, "epoch": 1113} {"train_loss": -10.966217994689941, "global_step": 187017, "epoch": 1113} {"train_loss": -9.75052261352539, "global_step": 187018, "epoch": 1113} {"train_loss": -10.32752799987793, "global_step": 187019, "epoch": 1113} {"train_loss": -9.744247436523438, "global_step": 187020, "epoch": 1113} {"train_loss": -10.29953384399414, "global_step": 187021, "epoch": 1113} {"train_loss": -9.513193130493164, "global_step": 187022, "epoch": 1113} {"train_loss": -10.52228832244873, "global_step": 187023, "epoch": 1113} {"train_loss": -9.63516902923584, "global_step": 187024, "epoch": 1113} {"train_loss": -10.909186363220215, "global_step": 187025, "epoch": 1113} {"train_loss": -9.893499374389648, "global_step": 187026, "epoch": 1113} {"train_loss": -10.525786399841309, "global_step": 187027, "epoch": 1113} {"train_loss": -10.160486221313477, "global_step": 187028, "epoch": 1113} {"train_loss": -10.603792190551758, "global_step": 187029, "epoch": 1113} {"train_loss": -9.979928970336914, "global_step": 187030, "epoch": 1113} {"train_loss": -11.140857696533203, "global_step": 187031, "epoch": 1113} {"train_loss": -10.771636962890625, "global_step": 187032, "epoch": 1113} {"train_loss": -10.996238708496094, "global_step": 187033, "epoch": 1113} {"train_loss": -10.933194160461426, "global_step": 187034, "epoch": 1113} {"train_loss": -10.869996070861816, "global_step": 187035, "epoch": 1113} {"train_loss": -10.467365264892578, "global_step": 187036, "epoch": 1113} {"train_loss": -10.889623641967773, "global_step": 187037, "epoch": 1113} {"train_loss": -10.979793548583984, "global_step": 187038, "epoch": 1113} {"train_loss": -10.864620208740234, "global_step": 187039, "epoch": 1113} {"train_loss": -10.992427825927734, "global_step": 187040, "epoch": 1113} {"train_loss": -11.13431453704834, "global_step": 187041, "epoch": 1113} {"train_loss": -11.041472434997559, "global_step": 187042, "epoch": 1113} {"train_loss": -11.140702247619629, "global_step": 187043, "epoch": 1113} {"train_loss": -10.883227348327637, "global_step": 187044, "epoch": 1113} {"train_loss": -11.110590934753418, "global_step": 187045, "epoch": 1113} {"train_loss": -11.109476089477539, "global_step": 187046, "epoch": 1113} {"train_loss": -11.239973068237305, "global_step": 187047, "epoch": 1113} {"train_loss": -11.0327787399292, "global_step": 187048, "epoch": 1113} {"train_loss": -11.2584810256958, "global_step": 187049, "epoch": 1113} {"train_loss": -11.138345718383789, "global_step": 187050, "epoch": 1113} {"train_loss": -11.34408187866211, "global_step": 187051, "epoch": 1113} {"train_loss": -11.391157150268555, "global_step": 187052, "epoch": 1113} {"train_loss": -11.35630989074707, "global_step": 187053, "epoch": 1113} {"train_loss": -11.217218399047852, "global_step": 187054, "epoch": 1113} {"train_loss": -11.274253845214844, "global_step": 187055, "epoch": 1113} {"train_loss": -11.358872413635254, "global_step": 187056, "epoch": 1113} {"train_loss": -11.492905616760254, "global_step": 187057, "epoch": 1113} {"train_loss": -11.196730613708496, "global_step": 187058, "epoch": 1113} {"train_loss": -11.404397010803223, "global_step": 187059, "epoch": 1113} {"train_loss": -11.452657699584961, "global_step": 187060, "epoch": 1113} {"train_loss": -11.473470687866211, "global_step": 187061, "epoch": 1113} {"train_loss": -11.234993934631348, "global_step": 187062, "epoch": 1113} {"train_loss": -11.299230575561523, "global_step": 187063, "epoch": 1113} {"train_loss": -11.481831550598145, "global_step": 187064, "epoch": 1113} {"train_loss": -11.454179763793945, "global_step": 187065, "epoch": 1113} {"train_loss": -11.406534194946289, "global_step": 187066, "epoch": 1113} {"train_loss": -11.365349769592285, "global_step": 187067, "epoch": 1113} {"train_loss": -11.4217529296875, "global_step": 187068, "epoch": 1113} {"train_loss": -11.565610885620117, "global_step": 187069, "epoch": 1113} {"train_loss": -11.375997543334961, "global_step": 187070, "epoch": 1113} {"train_loss": -11.567869186401367, "global_step": 187071, "epoch": 1113} {"train_loss": -11.324520111083984, "global_step": 187072, "epoch": 1113} {"train_loss": -11.349557876586914, "global_step": 187073, "epoch": 1113} {"train_loss": -11.68403434753418, "global_step": 187074, "epoch": 1113} {"train_loss": -11.202875137329102, "global_step": 187075, "epoch": 1113} {"train_loss": -11.451234817504883, "global_step": 187076, "epoch": 1113} {"train_loss": -11.360601425170898, "global_step": 187077, "epoch": 1113} {"train_loss": -11.574379920959473, "global_step": 187078, "epoch": 1113} {"train_loss": -11.385363578796387, "global_step": 187079, "epoch": 1113} {"train_loss": -11.442564010620117, "global_step": 187080, "epoch": 1113} {"train_loss": -11.522785186767578, "global_step": 187081, "epoch": 1113} {"train_loss": -11.571162223815918, "global_step": 187082, "epoch": 1113} {"train_loss": -11.505043983459473, "global_step": 187083, "epoch": 1113} {"train_loss": -11.258148193359375, "global_step": 187084, "epoch": 1113} {"train_loss": -11.38381576538086, "global_step": 187085, "epoch": 1113} {"train_loss": -11.29324722290039, "global_step": 187086, "epoch": 1113} {"train_loss": -11.198453903198242, "global_step": 187087, "epoch": 1113} {"train_loss": -11.009978294372559, "global_step": 187088, "epoch": 1113} {"train_loss": -10.958276748657227, "global_step": 187089, "epoch": 1113} {"train_loss": -11.218849182128906, "global_step": 187090, "epoch": 1113} {"train_loss": -11.312956809997559, "global_step": 187091, "epoch": 1113} {"train_loss": -11.261758804321289, "global_step": 187092, "epoch": 1113} {"train_loss": -11.265600204467773, "global_step": 187093, "epoch": 1113} {"train_loss": -11.278924942016602, "global_step": 187094, "epoch": 1113} {"train_loss": -10.1782808303833, "global_step": 187095, "epoch": 1113} {"train_loss": -11.337841033935547, "global_step": 187096, "epoch": 1113} {"train_loss": -11.480876922607422, "global_step": 187097, "epoch": 1113} {"train_loss": -11.265984535217285, "global_step": 187098, "epoch": 1113} {"train_loss": -11.525951385498047, "global_step": 187099, "epoch": 1113} {"train_loss": -11.52875804901123, "global_step": 187100, "epoch": 1113} {"train_loss": -11.580927848815918, "global_step": 187101, "epoch": 1113} {"train_loss": -11.229659080505371, "global_step": 187102, "epoch": 1113} {"train_loss": -11.19261360168457, "global_step": 187103, "epoch": 1113} {"train_loss": -11.439064979553223, "global_step": 187104, "epoch": 1113} {"train_loss": -11.619872093200684, "global_step": 187105, "epoch": 1113} {"train_loss": -11.12314510345459, "global_step": 187106, "epoch": 1113} {"train_loss": -10.769357681274414, "global_step": 187107, "epoch": 1113} {"train_loss": -10.758016586303711, "global_step": 187108, "epoch": 1113} {"train_loss": -11.162662506103516, "global_step": 187109, "epoch": 1113} {"train_loss": -10.226309776306152, "global_step": 187110, "epoch": 1113} {"train_loss": -11.256448745727539, "global_step": 187111, "epoch": 1113} {"train_loss": -11.168946266174316, "global_step": 187112, "epoch": 1113} {"train_loss": -11.041420936584473, "global_step": 187113, "epoch": 1113} {"train_loss": -11.214221954345703, "global_step": 187114, "epoch": 1113} {"train_loss": -11.098665237426758, "global_step": 187115, "epoch": 1113} {"train_loss": -10.925928115844727, "global_step": 187116, "epoch": 1113} {"train_loss": -11.322904586791992, "global_step": 187117, "epoch": 1113} {"train_loss": -11.326614379882812, "global_step": 187118, "epoch": 1113} {"train_loss": -11.195283889770508, "global_step": 187119, "epoch": 1113} {"train_loss": -11.437143325805664, "global_step": 187120, "epoch": 1113} {"train_loss": -11.287714958190918, "global_step": 187121, "epoch": 1113} {"train_loss": -11.05550479888916, "global_step": 187122, "epoch": 1113} {"train_loss": -11.220499038696289, "global_step": 187123, "epoch": 1113} {"train_loss": -11.255634307861328, "global_step": 187124, "epoch": 1113} {"train_loss": -11.30318546295166, "global_step": 187125, "epoch": 1113} {"train_loss": -11.10983943939209, "global_step": 187126, "epoch": 1113} {"train_loss": -11.271608352661133, "global_step": 187127, "epoch": 1113} {"train_loss": -11.293121337890625, "global_step": 187128, "epoch": 1113} {"train_loss": -11.083246231079102, "global_step": 187129, "epoch": 1113} {"train_loss": -11.205166816711426, "global_step": 187130, "epoch": 1113} {"train_loss": -11.10447883605957, "global_step": 187131, "epoch": 1113} {"train_loss": -11.131237983703613, "global_step": 187132, "epoch": 1113} {"train_loss": -10.838430404663086, "global_step": 187133, "epoch": 1113} {"train_loss": -11.558334350585938, "global_step": 187134, "epoch": 1113} {"train_loss": -11.232361793518066, "global_step": 187135, "epoch": 1113} {"train_loss": -11.61137866973877, "global_step": 187136, "epoch": 1113} {"train_loss": -11.225220680236816, "global_step": 187137, "epoch": 1113} {"train_loss": -11.120431900024414, "global_step": 187138, "epoch": 1113} {"train_loss": -11.564047813415527, "global_step": 187139, "epoch": 1113} {"train_loss": -11.188517570495605, "global_step": 187140, "epoch": 1113} {"train_loss": -11.193296432495117, "global_step": 187141, "epoch": 1113} {"train_loss": -11.276529312133789, "global_step": 187142, "epoch": 1113} {"train_loss": -11.464778900146484, "global_step": 187143, "epoch": 1113} {"train_loss": -11.186185836791992, "global_step": 187144, "epoch": 1113} {"train_loss": -11.670978546142578, "global_step": 187145, "epoch": 1113} {"train_loss": -11.297086715698242, "global_step": 187146, "epoch": 1113} {"train_loss": -11.611614227294922, "global_step": 187147, "epoch": 1113} {"train_loss": -11.394973754882812, "global_step": 187148, "epoch": 1113} {"train_loss": -11.21592903137207, "global_step": 187149, "epoch": 1113} {"train_loss": -11.071033477783203, "global_step": 187150, "epoch": 1113} {"train_loss": -11.084920485814413, "global_step": 187151, "epoch": 1113, "val_loss": 251315.171875} {"train_loss": -10.71619987487793, "global_step": 187152, "epoch": 1114} {"train_loss": -11.124462127685547, "global_step": 187153, "epoch": 1114} {"train_loss": -10.879265785217285, "global_step": 187154, "epoch": 1114} {"train_loss": -10.966400146484375, "global_step": 187155, "epoch": 1114} {"train_loss": -11.09583854675293, "global_step": 187156, "epoch": 1114} {"train_loss": -11.364469528198242, "global_step": 187157, "epoch": 1114} {"train_loss": -11.053679466247559, "global_step": 187158, "epoch": 1114} {"train_loss": -10.971212387084961, "global_step": 187159, "epoch": 1114} {"train_loss": -11.335223197937012, "global_step": 187160, "epoch": 1114} {"train_loss": -11.238548278808594, "global_step": 187161, "epoch": 1114} {"train_loss": -10.978093147277832, "global_step": 187162, "epoch": 1114} {"train_loss": -11.37192153930664, "global_step": 187163, "epoch": 1114} {"train_loss": -11.187219619750977, "global_step": 187164, "epoch": 1114} {"train_loss": -11.288657188415527, "global_step": 187165, "epoch": 1114} {"train_loss": -11.16805648803711, "global_step": 187166, "epoch": 1114} {"train_loss": -11.153694152832031, "global_step": 187167, "epoch": 1114} {"train_loss": -11.35000991821289, "global_step": 187168, "epoch": 1114} {"train_loss": -11.574910163879395, "global_step": 187169, "epoch": 1114} {"train_loss": -11.521617889404297, "global_step": 187170, "epoch": 1114} {"train_loss": -11.450639724731445, "global_step": 187171, "epoch": 1114} {"train_loss": -11.585729598999023, "global_step": 187172, "epoch": 1114} {"train_loss": -11.532989501953125, "global_step": 187173, "epoch": 1114} {"train_loss": -11.454366683959961, "global_step": 187174, "epoch": 1114} {"train_loss": -10.538141250610352, "global_step": 187175, "epoch": 1114} {"train_loss": -11.02023696899414, "global_step": 187176, "epoch": 1114} {"train_loss": -11.205196380615234, "global_step": 187177, "epoch": 1114} {"train_loss": -10.565176010131836, "global_step": 187178, "epoch": 1114} {"train_loss": -10.766515731811523, "global_step": 187179, "epoch": 1114} {"train_loss": -11.03966236114502, "global_step": 187180, "epoch": 1114} {"train_loss": -10.771743774414062, "global_step": 187181, "epoch": 1114} {"train_loss": -11.047866821289062, "global_step": 187182, "epoch": 1114} {"train_loss": -11.041964530944824, "global_step": 187183, "epoch": 1114} {"train_loss": -10.924599647521973, "global_step": 187184, "epoch": 1114} {"train_loss": -10.989036560058594, "global_step": 187185, "epoch": 1114} {"train_loss": -11.26746940612793, "global_step": 187186, "epoch": 1114} {"train_loss": -10.58755111694336, "global_step": 187187, "epoch": 1114} {"train_loss": -10.840214729309082, "global_step": 187188, "epoch": 1114} {"train_loss": -10.52114200592041, "global_step": 187189, "epoch": 1114} {"train_loss": -10.157350540161133, "global_step": 187190, "epoch": 1114} {"train_loss": -10.596534729003906, "global_step": 187191, "epoch": 1114} {"train_loss": -9.874021530151367, "global_step": 187192, "epoch": 1114} {"train_loss": -11.425814628601074, "global_step": 187193, "epoch": 1114} {"train_loss": -10.420610427856445, "global_step": 187194, "epoch": 1114} {"train_loss": -11.132345199584961, "global_step": 187195, "epoch": 1114} {"train_loss": -10.62016773223877, "global_step": 187196, "epoch": 1114} {"train_loss": -11.053396224975586, "global_step": 187197, "epoch": 1114} {"train_loss": -10.622621536254883, "global_step": 187198, "epoch": 1114} {"train_loss": -10.9934663772583, "global_step": 187199, "epoch": 1114} {"train_loss": -11.116291046142578, "global_step": 187200, "epoch": 1114} {"train_loss": -10.830196380615234, "global_step": 187201, "epoch": 1114} {"train_loss": -11.15041732788086, "global_step": 187202, "epoch": 1114} {"train_loss": -10.678304672241211, "global_step": 187203, "epoch": 1114} {"train_loss": -11.14703369140625, "global_step": 187204, "epoch": 1114} {"train_loss": -10.940451622009277, "global_step": 187205, "epoch": 1114} {"train_loss": -11.033367156982422, "global_step": 187206, "epoch": 1114} {"train_loss": -11.217203140258789, "global_step": 187207, "epoch": 1114} {"train_loss": -10.870138168334961, "global_step": 187208, "epoch": 1114} {"train_loss": -11.38429069519043, "global_step": 187209, "epoch": 1114} {"train_loss": -11.28990364074707, "global_step": 187210, "epoch": 1114} {"train_loss": -10.755755424499512, "global_step": 187211, "epoch": 1114} {"train_loss": -10.972691535949707, "global_step": 187212, "epoch": 1114} {"train_loss": -10.990752220153809, "global_step": 187213, "epoch": 1114} {"train_loss": -11.189922332763672, "global_step": 187214, "epoch": 1114} {"train_loss": -10.697805404663086, "global_step": 187215, "epoch": 1114} {"train_loss": -11.107158660888672, "global_step": 187216, "epoch": 1114} {"train_loss": -11.078325271606445, "global_step": 187217, "epoch": 1114} {"train_loss": -10.922783851623535, "global_step": 187218, "epoch": 1114} {"train_loss": -11.081695556640625, "global_step": 187219, "epoch": 1114} {"train_loss": -10.86703109741211, "global_step": 187220, "epoch": 1114} {"train_loss": -11.39128303527832, "global_step": 187221, "epoch": 1114} {"train_loss": -10.93974781036377, "global_step": 187222, "epoch": 1114} {"train_loss": -11.210136413574219, "global_step": 187223, "epoch": 1114} {"train_loss": -11.30650520324707, "global_step": 187224, "epoch": 1114} {"train_loss": -11.10992431640625, "global_step": 187225, "epoch": 1114} {"train_loss": -11.32478141784668, "global_step": 187226, "epoch": 1114} {"train_loss": -11.21143627166748, "global_step": 187227, "epoch": 1114} {"train_loss": -11.448728561401367, "global_step": 187228, "epoch": 1114} {"train_loss": -11.069182395935059, "global_step": 187229, "epoch": 1114} {"train_loss": -11.313272476196289, "global_step": 187230, "epoch": 1114} {"train_loss": -11.249814987182617, "global_step": 187231, "epoch": 1114} {"train_loss": -11.325874328613281, "global_step": 187232, "epoch": 1114} {"train_loss": -10.742422103881836, "global_step": 187233, "epoch": 1114} {"train_loss": -11.255290031433105, "global_step": 187234, "epoch": 1114} {"train_loss": -10.933147430419922, "global_step": 187235, "epoch": 1114} {"train_loss": -10.87741470336914, "global_step": 187236, "epoch": 1114} {"train_loss": -10.921965599060059, "global_step": 187237, "epoch": 1114} {"train_loss": -10.562728881835938, "global_step": 187238, "epoch": 1114} {"train_loss": -11.212221145629883, "global_step": 187239, "epoch": 1114} {"train_loss": -10.990589141845703, "global_step": 187240, "epoch": 1114} {"train_loss": -11.28544807434082, "global_step": 187241, "epoch": 1114} {"train_loss": -11.413545608520508, "global_step": 187242, "epoch": 1114} {"train_loss": -11.145492553710938, "global_step": 187243, "epoch": 1114} {"train_loss": -11.352742195129395, "global_step": 187244, "epoch": 1114} {"train_loss": -10.868301391601562, "global_step": 187245, "epoch": 1114} {"train_loss": -11.101360321044922, "global_step": 187246, "epoch": 1114} {"train_loss": -10.993030548095703, "global_step": 187247, "epoch": 1114} {"train_loss": -11.366837501525879, "global_step": 187248, "epoch": 1114} {"train_loss": -11.194962501525879, "global_step": 187249, "epoch": 1114} {"train_loss": -11.2335205078125, "global_step": 187250, "epoch": 1114} {"train_loss": -11.414011001586914, "global_step": 187251, "epoch": 1114} {"train_loss": -11.079048156738281, "global_step": 187252, "epoch": 1114} {"train_loss": -11.173789978027344, "global_step": 187253, "epoch": 1114} {"train_loss": -11.388046264648438, "global_step": 187254, "epoch": 1114} {"train_loss": -10.706101417541504, "global_step": 187255, "epoch": 1114} {"train_loss": -11.162333488464355, "global_step": 187256, "epoch": 1114} {"train_loss": -11.557482719421387, "global_step": 187257, "epoch": 1114} {"train_loss": -10.981817245483398, "global_step": 187258, "epoch": 1114} {"train_loss": -11.408204078674316, "global_step": 187259, "epoch": 1114} {"train_loss": -11.24063491821289, "global_step": 187260, "epoch": 1114} {"train_loss": -11.447364807128906, "global_step": 187261, "epoch": 1114} {"train_loss": -11.221710205078125, "global_step": 187262, "epoch": 1114} {"train_loss": -11.199554443359375, "global_step": 187263, "epoch": 1114} {"train_loss": -11.380434036254883, "global_step": 187264, "epoch": 1114} {"train_loss": -11.509794235229492, "global_step": 187265, "epoch": 1114} {"train_loss": -11.466789245605469, "global_step": 187266, "epoch": 1114} {"train_loss": -11.62492561340332, "global_step": 187267, "epoch": 1114} {"train_loss": -11.407552719116211, "global_step": 187268, "epoch": 1114} {"train_loss": -11.141441345214844, "global_step": 187269, "epoch": 1114} {"train_loss": -11.299910545349121, "global_step": 187270, "epoch": 1114} {"train_loss": -11.29854965209961, "global_step": 187271, "epoch": 1114} {"train_loss": -11.416254043579102, "global_step": 187272, "epoch": 1114} {"train_loss": -11.382436752319336, "global_step": 187273, "epoch": 1114} {"train_loss": -11.389547348022461, "global_step": 187274, "epoch": 1114} {"train_loss": -11.451443672180176, "global_step": 187275, "epoch": 1114} {"train_loss": -11.540891647338867, "global_step": 187276, "epoch": 1114} {"train_loss": -11.250279426574707, "global_step": 187277, "epoch": 1114} {"train_loss": -11.00790786743164, "global_step": 187278, "epoch": 1114} {"train_loss": -11.390596389770508, "global_step": 187279, "epoch": 1114} {"train_loss": -11.48688793182373, "global_step": 187280, "epoch": 1114} {"train_loss": -11.077013969421387, "global_step": 187281, "epoch": 1114} {"train_loss": -11.233257293701172, "global_step": 187282, "epoch": 1114} {"train_loss": -11.368856430053711, "global_step": 187283, "epoch": 1114} {"train_loss": -11.064910888671875, "global_step": 187284, "epoch": 1114} {"train_loss": -11.112403869628906, "global_step": 187285, "epoch": 1114} {"train_loss": -11.034168243408203, "global_step": 187286, "epoch": 1114} {"train_loss": -10.835708618164062, "global_step": 187287, "epoch": 1114} {"train_loss": -11.51938533782959, "global_step": 187288, "epoch": 1114} {"train_loss": -10.90226936340332, "global_step": 187289, "epoch": 1114} {"train_loss": -11.559648513793945, "global_step": 187290, "epoch": 1114} {"train_loss": -11.427568435668945, "global_step": 187291, "epoch": 1114} {"train_loss": -11.290109634399414, "global_step": 187292, "epoch": 1114} {"train_loss": -11.24460506439209, "global_step": 187293, "epoch": 1114} {"train_loss": -11.229131698608398, "global_step": 187294, "epoch": 1114} {"train_loss": -11.289423942565918, "global_step": 187295, "epoch": 1114} {"train_loss": -11.437095642089844, "global_step": 187296, "epoch": 1114} {"train_loss": -11.362455368041992, "global_step": 187297, "epoch": 1114} {"train_loss": -10.889341354370117, "global_step": 187298, "epoch": 1114} {"train_loss": -11.383259773254395, "global_step": 187299, "epoch": 1114} {"train_loss": -11.222265243530273, "global_step": 187300, "epoch": 1114} {"train_loss": -11.254974365234375, "global_step": 187301, "epoch": 1114} {"train_loss": -10.980611801147461, "global_step": 187302, "epoch": 1114} {"train_loss": -11.400778770446777, "global_step": 187303, "epoch": 1114} {"train_loss": -11.311113357543945, "global_step": 187304, "epoch": 1114} {"train_loss": -11.31724739074707, "global_step": 187305, "epoch": 1114} {"train_loss": -11.578231811523438, "global_step": 187306, "epoch": 1114} {"train_loss": -11.45655632019043, "global_step": 187307, "epoch": 1114} {"train_loss": -11.451879501342773, "global_step": 187308, "epoch": 1114} {"train_loss": -11.274153709411621, "global_step": 187309, "epoch": 1114} {"train_loss": -11.767236709594727, "global_step": 187310, "epoch": 1114} {"train_loss": -11.274712562561035, "global_step": 187311, "epoch": 1114} {"train_loss": -11.3497953414917, "global_step": 187312, "epoch": 1114} {"train_loss": -11.417248725891113, "global_step": 187313, "epoch": 1114} {"train_loss": -11.392369270324707, "global_step": 187314, "epoch": 1114} {"train_loss": -11.487173080444336, "global_step": 187315, "epoch": 1114} {"train_loss": -11.218290328979492, "global_step": 187316, "epoch": 1114} {"train_loss": -11.666704177856445, "global_step": 187317, "epoch": 1114} {"train_loss": -11.499372482299805, "global_step": 187318, "epoch": 1114} {"train_loss": -11.158576738266717, "global_step": 187319, "epoch": 1114, "val_loss": 247739.640625} {"train_loss": -11.682779312133789, "global_step": 187320, "epoch": 1115} {"train_loss": -11.091102600097656, "global_step": 187321, "epoch": 1115} {"train_loss": -11.523921966552734, "global_step": 187322, "epoch": 1115} {"train_loss": -11.210905075073242, "global_step": 187323, "epoch": 1115} {"train_loss": -11.17892074584961, "global_step": 187324, "epoch": 1115} {"train_loss": -10.981929779052734, "global_step": 187325, "epoch": 1115} {"train_loss": -10.635810852050781, "global_step": 187326, "epoch": 1115} {"train_loss": -10.549529075622559, "global_step": 187327, "epoch": 1115} {"train_loss": -10.752278327941895, "global_step": 187328, "epoch": 1115} {"train_loss": -9.346724510192871, "global_step": 187329, "epoch": 1115} {"train_loss": -11.10274600982666, "global_step": 187330, "epoch": 1115} {"train_loss": -9.791837692260742, "global_step": 187331, "epoch": 1115} {"train_loss": -10.3013916015625, "global_step": 187332, "epoch": 1115} {"train_loss": -9.723779678344727, "global_step": 187333, "epoch": 1115} {"train_loss": -9.696538925170898, "global_step": 187334, "epoch": 1115} {"train_loss": -10.001726150512695, "global_step": 187335, "epoch": 1115} {"train_loss": -9.81298542022705, "global_step": 187336, "epoch": 1115} {"train_loss": -9.603589057922363, "global_step": 187337, "epoch": 1115} {"train_loss": -9.146795272827148, "global_step": 187338, "epoch": 1115} {"train_loss": -10.323236465454102, "global_step": 187339, "epoch": 1115} {"train_loss": -10.337291717529297, "global_step": 187340, "epoch": 1115} {"train_loss": -10.099894523620605, "global_step": 187341, "epoch": 1115} {"train_loss": -10.081904411315918, "global_step": 187342, "epoch": 1115} {"train_loss": -9.56355094909668, "global_step": 187343, "epoch": 1115} {"train_loss": -10.592752456665039, "global_step": 187344, "epoch": 1115} {"train_loss": -10.603382110595703, "global_step": 187345, "epoch": 1115} {"train_loss": -10.102614402770996, "global_step": 187346, "epoch": 1115} {"train_loss": -10.51685905456543, "global_step": 187347, "epoch": 1115} {"train_loss": -10.478205680847168, "global_step": 187348, "epoch": 1115} {"train_loss": -10.623817443847656, "global_step": 187349, "epoch": 1115} {"train_loss": -10.722784042358398, "global_step": 187350, "epoch": 1115} {"train_loss": -10.963635444641113, "global_step": 187351, "epoch": 1115} {"train_loss": -10.485198974609375, "global_step": 187352, "epoch": 1115} {"train_loss": -11.145748138427734, "global_step": 187353, "epoch": 1115} {"train_loss": -10.599173545837402, "global_step": 187354, "epoch": 1115} {"train_loss": -11.00130558013916, "global_step": 187355, "epoch": 1115} {"train_loss": -10.67133617401123, "global_step": 187356, "epoch": 1115} {"train_loss": -10.490371704101562, "global_step": 187357, "epoch": 1115} {"train_loss": -10.986763000488281, "global_step": 187358, "epoch": 1115} {"train_loss": -10.5591459274292, "global_step": 187359, "epoch": 1115} {"train_loss": -10.98526382446289, "global_step": 187360, "epoch": 1115} {"train_loss": -10.657400131225586, "global_step": 187361, "epoch": 1115} {"train_loss": -10.92949390411377, "global_step": 187362, "epoch": 1115} {"train_loss": -10.994645118713379, "global_step": 187363, "epoch": 1115} {"train_loss": -11.090208053588867, "global_step": 187364, "epoch": 1115} {"train_loss": -11.097222328186035, "global_step": 187365, "epoch": 1115} {"train_loss": -10.952839851379395, "global_step": 187366, "epoch": 1115} {"train_loss": -11.029058456420898, "global_step": 187367, "epoch": 1115} {"train_loss": -10.74903678894043, "global_step": 187368, "epoch": 1115} {"train_loss": -11.270747184753418, "global_step": 187369, "epoch": 1115} {"train_loss": -10.913909912109375, "global_step": 187370, "epoch": 1115} {"train_loss": -11.306658744812012, "global_step": 187371, "epoch": 1115} {"train_loss": -11.112897872924805, "global_step": 187372, "epoch": 1115} {"train_loss": -11.089640617370605, "global_step": 187373, "epoch": 1115} {"train_loss": -11.18073844909668, "global_step": 187374, "epoch": 1115} {"train_loss": -11.051010131835938, "global_step": 187375, "epoch": 1115} {"train_loss": -11.224853515625, "global_step": 187376, "epoch": 1115} {"train_loss": -11.084955215454102, "global_step": 187377, "epoch": 1115} {"train_loss": -11.343341827392578, "global_step": 187378, "epoch": 1115} {"train_loss": -11.038177490234375, "global_step": 187379, "epoch": 1115} {"train_loss": -11.406259536743164, "global_step": 187380, "epoch": 1115} {"train_loss": -11.091347694396973, "global_step": 187381, "epoch": 1115} {"train_loss": -11.564441680908203, "global_step": 187382, "epoch": 1115} {"train_loss": -11.156366348266602, "global_step": 187383, "epoch": 1115} {"train_loss": -11.323927879333496, "global_step": 187384, "epoch": 1115} {"train_loss": -11.160232543945312, "global_step": 187385, "epoch": 1115} {"train_loss": -11.514457702636719, "global_step": 187386, "epoch": 1115} {"train_loss": -11.342533111572266, "global_step": 187387, "epoch": 1115} {"train_loss": -11.427123069763184, "global_step": 187388, "epoch": 1115} {"train_loss": -11.316460609436035, "global_step": 187389, "epoch": 1115} {"train_loss": -11.660097122192383, "global_step": 187390, "epoch": 1115} {"train_loss": -11.114202499389648, "global_step": 187391, "epoch": 1115} {"train_loss": -11.449470520019531, "global_step": 187392, "epoch": 1115} {"train_loss": -11.335165023803711, "global_step": 187393, "epoch": 1115} {"train_loss": -11.417915344238281, "global_step": 187394, "epoch": 1115} {"train_loss": -11.652135848999023, "global_step": 187395, "epoch": 1115} {"train_loss": -11.508056640625, "global_step": 187396, "epoch": 1115} {"train_loss": -11.405073165893555, "global_step": 187397, "epoch": 1115} {"train_loss": -11.568727493286133, "global_step": 187398, "epoch": 1115} {"train_loss": -11.414152145385742, "global_step": 187399, "epoch": 1115} {"train_loss": -11.517921447753906, "global_step": 187400, "epoch": 1115} {"train_loss": -11.182586669921875, "global_step": 187401, "epoch": 1115} {"train_loss": -11.456389427185059, "global_step": 187402, "epoch": 1115} {"train_loss": -11.456488609313965, "global_step": 187403, "epoch": 1115} {"train_loss": -11.62363338470459, "global_step": 187404, "epoch": 1115} {"train_loss": -11.704256057739258, "global_step": 187405, "epoch": 1115} {"train_loss": -11.5358247756958, "global_step": 187406, "epoch": 1115} {"train_loss": -11.65881061553955, "global_step": 187407, "epoch": 1115} {"train_loss": -11.437610626220703, "global_step": 187408, "epoch": 1115} {"train_loss": -11.682832717895508, "global_step": 187409, "epoch": 1115} {"train_loss": -11.497001647949219, "global_step": 187410, "epoch": 1115} {"train_loss": -11.441473007202148, "global_step": 187411, "epoch": 1115} {"train_loss": -11.353760719299316, "global_step": 187412, "epoch": 1115} {"train_loss": -11.58193588256836, "global_step": 187413, "epoch": 1115} {"train_loss": -11.405716896057129, "global_step": 187414, "epoch": 1115} {"train_loss": -11.031885147094727, "global_step": 187415, "epoch": 1115} {"train_loss": -11.195058822631836, "global_step": 187416, "epoch": 1115} {"train_loss": -10.882566452026367, "global_step": 187417, "epoch": 1115} {"train_loss": -11.469703674316406, "global_step": 187418, "epoch": 1115} {"train_loss": -11.167613983154297, "global_step": 187419, "epoch": 1115} {"train_loss": -11.130247116088867, "global_step": 187420, "epoch": 1115} {"train_loss": -11.612889289855957, "global_step": 187421, "epoch": 1115} {"train_loss": -10.851177215576172, "global_step": 187422, "epoch": 1115} {"train_loss": -11.41716480255127, "global_step": 187423, "epoch": 1115} {"train_loss": -11.540879249572754, "global_step": 187424, "epoch": 1115} {"train_loss": -10.664156913757324, "global_step": 187425, "epoch": 1115} {"train_loss": -11.319389343261719, "global_step": 187426, "epoch": 1115} {"train_loss": -10.937281608581543, "global_step": 187427, "epoch": 1115} {"train_loss": -10.79298210144043, "global_step": 187428, "epoch": 1115} {"train_loss": -11.09465503692627, "global_step": 187429, "epoch": 1115} {"train_loss": -11.092910766601562, "global_step": 187430, "epoch": 1115} {"train_loss": -10.61359977722168, "global_step": 187431, "epoch": 1115} {"train_loss": -11.401440620422363, "global_step": 187432, "epoch": 1115} {"train_loss": -10.804017066955566, "global_step": 187433, "epoch": 1115} {"train_loss": -11.099382400512695, "global_step": 187434, "epoch": 1115} {"train_loss": -10.899001121520996, "global_step": 187435, "epoch": 1115} {"train_loss": -11.122962951660156, "global_step": 187436, "epoch": 1115} {"train_loss": -11.008623123168945, "global_step": 187437, "epoch": 1115} {"train_loss": -10.680302619934082, "global_step": 187438, "epoch": 1115} {"train_loss": -10.895708084106445, "global_step": 187439, "epoch": 1115} {"train_loss": -10.224079132080078, "global_step": 187440, "epoch": 1115} {"train_loss": -10.919877052307129, "global_step": 187441, "epoch": 1115} {"train_loss": -10.500062942504883, "global_step": 187442, "epoch": 1115} {"train_loss": -10.203536987304688, "global_step": 187443, "epoch": 1115} {"train_loss": -10.55860424041748, "global_step": 187444, "epoch": 1115} {"train_loss": -10.993725776672363, "global_step": 187445, "epoch": 1115} {"train_loss": -11.018373489379883, "global_step": 187446, "epoch": 1115} {"train_loss": -11.153864860534668, "global_step": 187447, "epoch": 1115} {"train_loss": -10.7128267288208, "global_step": 187448, "epoch": 1115} {"train_loss": -11.185270309448242, "global_step": 187449, "epoch": 1115} {"train_loss": -11.16963005065918, "global_step": 187450, "epoch": 1115} {"train_loss": -10.462959289550781, "global_step": 187451, "epoch": 1115} {"train_loss": -11.347213745117188, "global_step": 187452, "epoch": 1115} {"train_loss": -10.741332054138184, "global_step": 187453, "epoch": 1115} {"train_loss": -11.225515365600586, "global_step": 187454, "epoch": 1115} {"train_loss": -10.957805633544922, "global_step": 187455, "epoch": 1115} {"train_loss": -11.201288223266602, "global_step": 187456, "epoch": 1115} {"train_loss": -11.208821296691895, "global_step": 187457, "epoch": 1115} {"train_loss": -11.272869110107422, "global_step": 187458, "epoch": 1115} {"train_loss": -11.36672592163086, "global_step": 187459, "epoch": 1115} {"train_loss": -11.317541122436523, "global_step": 187460, "epoch": 1115} {"train_loss": -11.475109100341797, "global_step": 187461, "epoch": 1115} {"train_loss": -11.184356689453125, "global_step": 187462, "epoch": 1115} {"train_loss": -11.300098419189453, "global_step": 187463, "epoch": 1115} {"train_loss": -11.107902526855469, "global_step": 187464, "epoch": 1115} {"train_loss": -11.321456909179688, "global_step": 187465, "epoch": 1115} {"train_loss": -11.187173843383789, "global_step": 187466, "epoch": 1115} {"train_loss": -11.338626861572266, "global_step": 187467, "epoch": 1115} {"train_loss": -11.390096664428711, "global_step": 187468, "epoch": 1115} {"train_loss": -11.258895874023438, "global_step": 187469, "epoch": 1115} {"train_loss": -11.338868141174316, "global_step": 187470, "epoch": 1115} {"train_loss": -11.093077659606934, "global_step": 187471, "epoch": 1115} {"train_loss": -11.339353561401367, "global_step": 187472, "epoch": 1115} {"train_loss": -11.145193099975586, "global_step": 187473, "epoch": 1115} {"train_loss": -11.107534408569336, "global_step": 187474, "epoch": 1115} {"train_loss": -11.464521408081055, "global_step": 187475, "epoch": 1115} {"train_loss": -10.938973426818848, "global_step": 187476, "epoch": 1115} {"train_loss": -11.219255447387695, "global_step": 187477, "epoch": 1115} {"train_loss": -10.99329662322998, "global_step": 187478, "epoch": 1115} {"train_loss": -10.426889419555664, "global_step": 187479, "epoch": 1115} {"train_loss": -10.738346099853516, "global_step": 187480, "epoch": 1115} {"train_loss": -9.576471328735352, "global_step": 187481, "epoch": 1115} {"train_loss": -10.614923477172852, "global_step": 187482, "epoch": 1115} {"train_loss": -9.256823539733887, "global_step": 187483, "epoch": 1115} {"train_loss": -10.359468460083008, "global_step": 187484, "epoch": 1115} {"train_loss": -8.126553535461426, "global_step": 187485, "epoch": 1115} {"train_loss": -9.22338581085205, "global_step": 187486, "epoch": 1115} {"train_loss": -10.930919380415054, "global_step": 187487, "epoch": 1115, "val_loss": 247270.6875, "train_action_mse_error": 1.1218814849853516} {"train_loss": -8.526504516601562, "global_step": 187488, "epoch": 1116} {"train_loss": -9.919344902038574, "global_step": 187489, "epoch": 1116} {"train_loss": -8.483466148376465, "global_step": 187490, "epoch": 1116} {"train_loss": -8.995054244995117, "global_step": 187491, "epoch": 1116} {"train_loss": -8.336709022521973, "global_step": 187492, "epoch": 1116} {"train_loss": -10.123918533325195, "global_step": 187493, "epoch": 1116} {"train_loss": -9.331035614013672, "global_step": 187494, "epoch": 1116} {"train_loss": -10.066269874572754, "global_step": 187495, "epoch": 1116} {"train_loss": -9.812828063964844, "global_step": 187496, "epoch": 1116} {"train_loss": -9.793119430541992, "global_step": 187497, "epoch": 1116} {"train_loss": -9.62398624420166, "global_step": 187498, "epoch": 1116} {"train_loss": -10.188041687011719, "global_step": 187499, "epoch": 1116} {"train_loss": -9.804630279541016, "global_step": 187500, "epoch": 1116} {"train_loss": -10.589958190917969, "global_step": 187501, "epoch": 1116} {"train_loss": -9.674281120300293, "global_step": 187502, "epoch": 1116} {"train_loss": -10.25473403930664, "global_step": 187503, "epoch": 1116} {"train_loss": -10.003021240234375, "global_step": 187504, "epoch": 1116} {"train_loss": -9.89183235168457, "global_step": 187505, "epoch": 1116} {"train_loss": -10.525667190551758, "global_step": 187506, "epoch": 1116} {"train_loss": -10.381232261657715, "global_step": 187507, "epoch": 1116} {"train_loss": -10.391300201416016, "global_step": 187508, "epoch": 1116} {"train_loss": -10.37249755859375, "global_step": 187509, "epoch": 1116} {"train_loss": -10.571133613586426, "global_step": 187510, "epoch": 1116} {"train_loss": -10.617866516113281, "global_step": 187511, "epoch": 1116} {"train_loss": -10.265016555786133, "global_step": 187512, "epoch": 1116} {"train_loss": -10.868151664733887, "global_step": 187513, "epoch": 1116} {"train_loss": -10.770313262939453, "global_step": 187514, "epoch": 1116} {"train_loss": -10.63438606262207, "global_step": 187515, "epoch": 1116} {"train_loss": -10.81696891784668, "global_step": 187516, "epoch": 1116} {"train_loss": -10.671932220458984, "global_step": 187517, "epoch": 1116} {"train_loss": -10.63713550567627, "global_step": 187518, "epoch": 1116} {"train_loss": -10.745842933654785, "global_step": 187519, "epoch": 1116} {"train_loss": -10.892871856689453, "global_step": 187520, "epoch": 1116} {"train_loss": -10.915397644042969, "global_step": 187521, "epoch": 1116} {"train_loss": -10.782264709472656, "global_step": 187522, "epoch": 1116} {"train_loss": -10.899784088134766, "global_step": 187523, "epoch": 1116} {"train_loss": -11.047259330749512, "global_step": 187524, "epoch": 1116} {"train_loss": -11.04498291015625, "global_step": 187525, "epoch": 1116} {"train_loss": -11.022134780883789, "global_step": 187526, "epoch": 1116} {"train_loss": -10.959495544433594, "global_step": 187527, "epoch": 1116} {"train_loss": -11.038905143737793, "global_step": 187528, "epoch": 1116} {"train_loss": -11.085647583007812, "global_step": 187529, "epoch": 1116} {"train_loss": -11.125402450561523, "global_step": 187530, "epoch": 1116} {"train_loss": -11.01561450958252, "global_step": 187531, "epoch": 1116} {"train_loss": -11.21152400970459, "global_step": 187532, "epoch": 1116} {"train_loss": -11.05171012878418, "global_step": 187533, "epoch": 1116} {"train_loss": -11.106178283691406, "global_step": 187534, "epoch": 1116} {"train_loss": -11.007658004760742, "global_step": 187535, "epoch": 1116} {"train_loss": -11.179847717285156, "global_step": 187536, "epoch": 1116} {"train_loss": -10.988113403320312, "global_step": 187537, "epoch": 1116} {"train_loss": -11.256475448608398, "global_step": 187538, "epoch": 1116} {"train_loss": -11.380749702453613, "global_step": 187539, "epoch": 1116} {"train_loss": -11.100029945373535, "global_step": 187540, "epoch": 1116} {"train_loss": -11.33906078338623, "global_step": 187541, "epoch": 1116} {"train_loss": -10.939348220825195, "global_step": 187542, "epoch": 1116} {"train_loss": -11.30058479309082, "global_step": 187543, "epoch": 1116} {"train_loss": -11.23820686340332, "global_step": 187544, "epoch": 1116} {"train_loss": -11.309555053710938, "global_step": 187545, "epoch": 1116} {"train_loss": -11.37387466430664, "global_step": 187546, "epoch": 1116} {"train_loss": -11.27595043182373, "global_step": 187547, "epoch": 1116} {"train_loss": -11.563019752502441, "global_step": 187548, "epoch": 1116} {"train_loss": -11.323616027832031, "global_step": 187549, "epoch": 1116} {"train_loss": -11.237258911132812, "global_step": 187550, "epoch": 1116} {"train_loss": -11.18665885925293, "global_step": 187551, "epoch": 1116} {"train_loss": -11.202025413513184, "global_step": 187552, "epoch": 1116} {"train_loss": -11.125107765197754, "global_step": 187553, "epoch": 1116} {"train_loss": -11.276548385620117, "global_step": 187554, "epoch": 1116} {"train_loss": -11.254334449768066, "global_step": 187555, "epoch": 1116} {"train_loss": -11.38534164428711, "global_step": 187556, "epoch": 1116} {"train_loss": -11.292932510375977, "global_step": 187557, "epoch": 1116} {"train_loss": -11.299964904785156, "global_step": 187558, "epoch": 1116} {"train_loss": -11.356149673461914, "global_step": 187559, "epoch": 1116} {"train_loss": -11.218961715698242, "global_step": 187560, "epoch": 1116} {"train_loss": -11.095037460327148, "global_step": 187561, "epoch": 1116} {"train_loss": -11.264389038085938, "global_step": 187562, "epoch": 1116} {"train_loss": -10.949668884277344, "global_step": 187563, "epoch": 1116} {"train_loss": -11.219402313232422, "global_step": 187564, "epoch": 1116} {"train_loss": -11.39488410949707, "global_step": 187565, "epoch": 1116} {"train_loss": -11.464664459228516, "global_step": 187566, "epoch": 1116} {"train_loss": -11.213592529296875, "global_step": 187567, "epoch": 1116} {"train_loss": -10.930732727050781, "global_step": 187568, "epoch": 1116} {"train_loss": -11.535003662109375, "global_step": 187569, "epoch": 1116} {"train_loss": -11.203542709350586, "global_step": 187570, "epoch": 1116} {"train_loss": -11.373540878295898, "global_step": 187571, "epoch": 1116} {"train_loss": -11.334716796875, "global_step": 187572, "epoch": 1116} {"train_loss": -11.415102005004883, "global_step": 187573, "epoch": 1116} {"train_loss": -11.434738159179688, "global_step": 187574, "epoch": 1116} {"train_loss": -11.383472442626953, "global_step": 187575, "epoch": 1116} {"train_loss": -11.50066089630127, "global_step": 187576, "epoch": 1116} {"train_loss": -11.49261474609375, "global_step": 187577, "epoch": 1116} {"train_loss": -11.227423667907715, "global_step": 187578, "epoch": 1116} {"train_loss": -11.253681182861328, "global_step": 187579, "epoch": 1116} {"train_loss": -11.529651641845703, "global_step": 187580, "epoch": 1116} {"train_loss": -11.581724166870117, "global_step": 187581, "epoch": 1116} {"train_loss": -11.647531509399414, "global_step": 187582, "epoch": 1116} {"train_loss": -11.38390064239502, "global_step": 187583, "epoch": 1116} {"train_loss": -11.413835525512695, "global_step": 187584, "epoch": 1116} {"train_loss": -11.368518829345703, "global_step": 187585, "epoch": 1116} {"train_loss": -11.263116836547852, "global_step": 187586, "epoch": 1116} {"train_loss": -11.224099159240723, "global_step": 187587, "epoch": 1116} {"train_loss": -11.486100196838379, "global_step": 187588, "epoch": 1116} {"train_loss": -10.601019859313965, "global_step": 187589, "epoch": 1116} {"train_loss": -10.368209838867188, "global_step": 187590, "epoch": 1116} {"train_loss": -11.558425903320312, "global_step": 187591, "epoch": 1116} {"train_loss": -10.191377639770508, "global_step": 187592, "epoch": 1116} {"train_loss": -10.634794235229492, "global_step": 187593, "epoch": 1116} {"train_loss": -10.4120512008667, "global_step": 187594, "epoch": 1116} {"train_loss": -8.946359634399414, "global_step": 187595, "epoch": 1116} {"train_loss": -11.266890525817871, "global_step": 187596, "epoch": 1116} {"train_loss": -9.19854736328125, "global_step": 187597, "epoch": 1116} {"train_loss": -10.744258880615234, "global_step": 187598, "epoch": 1116} {"train_loss": -9.928796768188477, "global_step": 187599, "epoch": 1116} {"train_loss": -9.46902084350586, "global_step": 187600, "epoch": 1116} {"train_loss": -10.664178848266602, "global_step": 187601, "epoch": 1116} {"train_loss": -9.1602201461792, "global_step": 187602, "epoch": 1116} {"train_loss": -10.73021125793457, "global_step": 187603, "epoch": 1116} {"train_loss": -9.78022575378418, "global_step": 187604, "epoch": 1116} {"train_loss": -10.857547760009766, "global_step": 187605, "epoch": 1116} {"train_loss": -9.955978393554688, "global_step": 187606, "epoch": 1116} {"train_loss": -10.43293571472168, "global_step": 187607, "epoch": 1116} {"train_loss": -10.647418022155762, "global_step": 187608, "epoch": 1116} {"train_loss": -10.650732040405273, "global_step": 187609, "epoch": 1116} {"train_loss": -10.585896492004395, "global_step": 187610, "epoch": 1116} {"train_loss": -10.753950119018555, "global_step": 187611, "epoch": 1116} {"train_loss": -10.590261459350586, "global_step": 187612, "epoch": 1116} {"train_loss": -10.381134033203125, "global_step": 187613, "epoch": 1116} {"train_loss": -11.070488929748535, "global_step": 187614, "epoch": 1116} {"train_loss": -10.543611526489258, "global_step": 187615, "epoch": 1116} {"train_loss": -10.841751098632812, "global_step": 187616, "epoch": 1116} {"train_loss": -10.642749786376953, "global_step": 187617, "epoch": 1116} {"train_loss": -10.819334983825684, "global_step": 187618, "epoch": 1116} {"train_loss": -10.98036003112793, "global_step": 187619, "epoch": 1116} {"train_loss": -10.800040245056152, "global_step": 187620, "epoch": 1116} {"train_loss": -11.089290618896484, "global_step": 187621, "epoch": 1116} {"train_loss": -10.841609954833984, "global_step": 187622, "epoch": 1116} {"train_loss": -11.000526428222656, "global_step": 187623, "epoch": 1116} {"train_loss": -10.783443450927734, "global_step": 187624, "epoch": 1116} {"train_loss": -10.864850044250488, "global_step": 187625, "epoch": 1116} {"train_loss": -10.838129043579102, "global_step": 187626, "epoch": 1116} {"train_loss": -11.066751480102539, "global_step": 187627, "epoch": 1116} {"train_loss": -11.136392593383789, "global_step": 187628, "epoch": 1116} {"train_loss": -10.870635032653809, "global_step": 187629, "epoch": 1116} {"train_loss": -10.796333312988281, "global_step": 187630, "epoch": 1116} {"train_loss": -11.028661727905273, "global_step": 187631, "epoch": 1116} {"train_loss": -10.916744232177734, "global_step": 187632, "epoch": 1116} {"train_loss": -11.260913848876953, "global_step": 187633, "epoch": 1116} {"train_loss": -10.884490013122559, "global_step": 187634, "epoch": 1116} {"train_loss": -11.140249252319336, "global_step": 187635, "epoch": 1116} {"train_loss": -10.95640754699707, "global_step": 187636, "epoch": 1116} {"train_loss": -11.200599670410156, "global_step": 187637, "epoch": 1116} {"train_loss": -10.99272632598877, "global_step": 187638, "epoch": 1116} {"train_loss": -11.257229804992676, "global_step": 187639, "epoch": 1116} {"train_loss": -11.156302452087402, "global_step": 187640, "epoch": 1116} {"train_loss": -11.177696228027344, "global_step": 187641, "epoch": 1116} {"train_loss": -11.310760498046875, "global_step": 187642, "epoch": 1116} {"train_loss": -10.849774360656738, "global_step": 187643, "epoch": 1116} {"train_loss": -11.071367263793945, "global_step": 187644, "epoch": 1116} {"train_loss": -10.950614929199219, "global_step": 187645, "epoch": 1116} {"train_loss": -11.394180297851562, "global_step": 187646, "epoch": 1116} {"train_loss": -11.271432876586914, "global_step": 187647, "epoch": 1116} {"train_loss": -11.141496658325195, "global_step": 187648, "epoch": 1116} {"train_loss": -11.110596656799316, "global_step": 187649, "epoch": 1116} {"train_loss": -11.052331924438477, "global_step": 187650, "epoch": 1116} {"train_loss": -11.296331405639648, "global_step": 187651, "epoch": 1116} {"train_loss": -11.239638328552246, "global_step": 187652, "epoch": 1116} {"train_loss": -11.387107849121094, "global_step": 187653, "epoch": 1116} {"train_loss": -11.230158805847168, "global_step": 187654, "epoch": 1116} {"train_loss": -10.827104534421649, "global_step": 187655, "epoch": 1116, "val_loss": 246227.984375} {"train_loss": -11.062736511230469, "global_step": 187656, "epoch": 1117} {"train_loss": -11.127683639526367, "global_step": 187657, "epoch": 1117} {"train_loss": -11.220770835876465, "global_step": 187658, "epoch": 1117} {"train_loss": -11.175802230834961, "global_step": 187659, "epoch": 1117} {"train_loss": -10.889060020446777, "global_step": 187660, "epoch": 1117} {"train_loss": -11.01526927947998, "global_step": 187661, "epoch": 1117} {"train_loss": -11.429742813110352, "global_step": 187662, "epoch": 1117} {"train_loss": -11.042034149169922, "global_step": 187663, "epoch": 1117} {"train_loss": -11.296834945678711, "global_step": 187664, "epoch": 1117} {"train_loss": -11.0475492477417, "global_step": 187665, "epoch": 1117} {"train_loss": -11.200258255004883, "global_step": 187666, "epoch": 1117} {"train_loss": -11.344844818115234, "global_step": 187667, "epoch": 1117} {"train_loss": -11.114013671875, "global_step": 187668, "epoch": 1117} {"train_loss": -11.414735794067383, "global_step": 187669, "epoch": 1117} {"train_loss": -11.101831436157227, "global_step": 187670, "epoch": 1117} {"train_loss": -10.956831932067871, "global_step": 187671, "epoch": 1117} {"train_loss": -11.251070022583008, "global_step": 187672, "epoch": 1117} {"train_loss": -11.384440422058105, "global_step": 187673, "epoch": 1117} {"train_loss": -11.135631561279297, "global_step": 187674, "epoch": 1117} {"train_loss": -11.155989646911621, "global_step": 187675, "epoch": 1117} {"train_loss": -10.641910552978516, "global_step": 187676, "epoch": 1117} {"train_loss": -11.497255325317383, "global_step": 187677, "epoch": 1117} {"train_loss": -10.588871002197266, "global_step": 187678, "epoch": 1117} {"train_loss": -10.936299324035645, "global_step": 187679, "epoch": 1117} {"train_loss": -10.749330520629883, "global_step": 187680, "epoch": 1117} {"train_loss": -10.428670883178711, "global_step": 187681, "epoch": 1117} {"train_loss": -9.957099914550781, "global_step": 187682, "epoch": 1117} {"train_loss": -10.469063758850098, "global_step": 187683, "epoch": 1117} {"train_loss": -11.286468505859375, "global_step": 187684, "epoch": 1117} {"train_loss": -10.211894035339355, "global_step": 187685, "epoch": 1117} {"train_loss": -11.071659088134766, "global_step": 187686, "epoch": 1117} {"train_loss": -11.116472244262695, "global_step": 187687, "epoch": 1117} {"train_loss": -10.81553840637207, "global_step": 187688, "epoch": 1117} {"train_loss": -11.18387222290039, "global_step": 187689, "epoch": 1117} {"train_loss": -10.771270751953125, "global_step": 187690, "epoch": 1117} {"train_loss": -10.873777389526367, "global_step": 187691, "epoch": 1117} {"train_loss": -11.00068473815918, "global_step": 187692, "epoch": 1117} {"train_loss": -10.670246124267578, "global_step": 187693, "epoch": 1117} {"train_loss": -10.89521598815918, "global_step": 187694, "epoch": 1117} {"train_loss": -11.108055114746094, "global_step": 187695, "epoch": 1117} {"train_loss": -10.982328414916992, "global_step": 187696, "epoch": 1117} {"train_loss": -10.749576568603516, "global_step": 187697, "epoch": 1117} {"train_loss": -10.927202224731445, "global_step": 187698, "epoch": 1117} {"train_loss": -11.037910461425781, "global_step": 187699, "epoch": 1117} {"train_loss": -10.567506790161133, "global_step": 187700, "epoch": 1117} {"train_loss": -11.202552795410156, "global_step": 187701, "epoch": 1117} {"train_loss": -11.043878555297852, "global_step": 187702, "epoch": 1117} {"train_loss": -11.03864860534668, "global_step": 187703, "epoch": 1117} {"train_loss": -10.834434509277344, "global_step": 187704, "epoch": 1117} {"train_loss": -11.09553337097168, "global_step": 187705, "epoch": 1117} {"train_loss": -11.248801231384277, "global_step": 187706, "epoch": 1117} {"train_loss": -11.180452346801758, "global_step": 187707, "epoch": 1117} {"train_loss": -11.073103904724121, "global_step": 187708, "epoch": 1117} {"train_loss": -11.14261245727539, "global_step": 187709, "epoch": 1117} {"train_loss": -11.181159019470215, "global_step": 187710, "epoch": 1117} {"train_loss": -11.099971771240234, "global_step": 187711, "epoch": 1117} {"train_loss": -11.234155654907227, "global_step": 187712, "epoch": 1117} {"train_loss": -10.712193489074707, "global_step": 187713, "epoch": 1117} {"train_loss": -11.3107328414917, "global_step": 187714, "epoch": 1117} {"train_loss": -11.101216316223145, "global_step": 187715, "epoch": 1117} {"train_loss": -10.997958183288574, "global_step": 187716, "epoch": 1117} {"train_loss": -10.942815780639648, "global_step": 187717, "epoch": 1117} {"train_loss": -11.10679817199707, "global_step": 187718, "epoch": 1117} {"train_loss": -11.107431411743164, "global_step": 187719, "epoch": 1117} {"train_loss": -11.27408218383789, "global_step": 187720, "epoch": 1117} {"train_loss": -11.096643447875977, "global_step": 187721, "epoch": 1117} {"train_loss": -11.108663558959961, "global_step": 187722, "epoch": 1117} {"train_loss": -11.176939964294434, "global_step": 187723, "epoch": 1117} {"train_loss": -11.120121002197266, "global_step": 187724, "epoch": 1117} {"train_loss": -11.351972579956055, "global_step": 187725, "epoch": 1117} {"train_loss": -11.172107696533203, "global_step": 187726, "epoch": 1117} {"train_loss": -11.163888931274414, "global_step": 187727, "epoch": 1117} {"train_loss": -11.463756561279297, "global_step": 187728, "epoch": 1117} {"train_loss": -11.442596435546875, "global_step": 187729, "epoch": 1117} {"train_loss": -11.519445419311523, "global_step": 187730, "epoch": 1117} {"train_loss": -11.61707878112793, "global_step": 187731, "epoch": 1117} {"train_loss": -11.444162368774414, "global_step": 187732, "epoch": 1117} {"train_loss": -11.572470664978027, "global_step": 187733, "epoch": 1117} {"train_loss": -11.432368278503418, "global_step": 187734, "epoch": 1117} {"train_loss": -11.62121295928955, "global_step": 187735, "epoch": 1117} {"train_loss": -11.413538932800293, "global_step": 187736, "epoch": 1117} {"train_loss": -11.625273704528809, "global_step": 187737, "epoch": 1117} {"train_loss": -11.765558242797852, "global_step": 187738, "epoch": 1117} {"train_loss": -11.462212562561035, "global_step": 187739, "epoch": 1117} {"train_loss": -11.564155578613281, "global_step": 187740, "epoch": 1117} {"train_loss": -11.472710609436035, "global_step": 187741, "epoch": 1117} {"train_loss": -11.512909889221191, "global_step": 187742, "epoch": 1117} {"train_loss": -11.560604095458984, "global_step": 187743, "epoch": 1117} {"train_loss": -11.435989379882812, "global_step": 187744, "epoch": 1117} {"train_loss": -11.593108177185059, "global_step": 187745, "epoch": 1117} {"train_loss": -11.43553638458252, "global_step": 187746, "epoch": 1117} {"train_loss": -11.40101432800293, "global_step": 187747, "epoch": 1117} {"train_loss": -11.528493881225586, "global_step": 187748, "epoch": 1117} {"train_loss": -11.418617248535156, "global_step": 187749, "epoch": 1117} {"train_loss": -11.680614471435547, "global_step": 187750, "epoch": 1117} {"train_loss": -11.554800987243652, "global_step": 187751, "epoch": 1117} {"train_loss": -11.28081226348877, "global_step": 187752, "epoch": 1117} {"train_loss": -11.632179260253906, "global_step": 187753, "epoch": 1117} {"train_loss": -11.504924774169922, "global_step": 187754, "epoch": 1117} {"train_loss": -11.328130722045898, "global_step": 187755, "epoch": 1117} {"train_loss": -11.245548248291016, "global_step": 187756, "epoch": 1117} {"train_loss": -11.362005233764648, "global_step": 187757, "epoch": 1117} {"train_loss": -11.397407531738281, "global_step": 187758, "epoch": 1117} {"train_loss": -11.24979019165039, "global_step": 187759, "epoch": 1117} {"train_loss": -11.513334274291992, "global_step": 187760, "epoch": 1117} {"train_loss": -11.558982849121094, "global_step": 187761, "epoch": 1117} {"train_loss": -11.676944732666016, "global_step": 187762, "epoch": 1117} {"train_loss": -11.541067123413086, "global_step": 187763, "epoch": 1117} {"train_loss": -11.370704650878906, "global_step": 187764, "epoch": 1117} {"train_loss": -11.045597076416016, "global_step": 187765, "epoch": 1117} {"train_loss": -11.641897201538086, "global_step": 187766, "epoch": 1117} {"train_loss": -11.520669937133789, "global_step": 187767, "epoch": 1117} {"train_loss": -11.323524475097656, "global_step": 187768, "epoch": 1117} {"train_loss": -11.320363998413086, "global_step": 187769, "epoch": 1117} {"train_loss": -11.72009563446045, "global_step": 187770, "epoch": 1117} {"train_loss": -11.356389045715332, "global_step": 187771, "epoch": 1117} {"train_loss": -11.34550952911377, "global_step": 187772, "epoch": 1117} {"train_loss": -11.329752922058105, "global_step": 187773, "epoch": 1117} {"train_loss": -11.390798568725586, "global_step": 187774, "epoch": 1117} {"train_loss": -10.80611801147461, "global_step": 187775, "epoch": 1117} {"train_loss": -11.621390342712402, "global_step": 187776, "epoch": 1117} {"train_loss": -10.810762405395508, "global_step": 187777, "epoch": 1117} {"train_loss": -11.547855377197266, "global_step": 187778, "epoch": 1117} {"train_loss": -11.135101318359375, "global_step": 187779, "epoch": 1117} {"train_loss": -11.061723709106445, "global_step": 187780, "epoch": 1117} {"train_loss": -10.951562881469727, "global_step": 187781, "epoch": 1117} {"train_loss": -11.388489723205566, "global_step": 187782, "epoch": 1117} {"train_loss": -10.769180297851562, "global_step": 187783, "epoch": 1117} {"train_loss": -11.303230285644531, "global_step": 187784, "epoch": 1117} {"train_loss": -10.67624568939209, "global_step": 187785, "epoch": 1117} {"train_loss": -10.833962440490723, "global_step": 187786, "epoch": 1117} {"train_loss": -11.121855735778809, "global_step": 187787, "epoch": 1117} {"train_loss": -11.36242961883545, "global_step": 187788, "epoch": 1117} {"train_loss": -11.299162864685059, "global_step": 187789, "epoch": 1117} {"train_loss": -11.162904739379883, "global_step": 187790, "epoch": 1117} {"train_loss": -11.22427749633789, "global_step": 187791, "epoch": 1117} {"train_loss": -11.086002349853516, "global_step": 187792, "epoch": 1117} {"train_loss": -11.291656494140625, "global_step": 187793, "epoch": 1117} {"train_loss": -11.419464111328125, "global_step": 187794, "epoch": 1117} {"train_loss": -10.958456039428711, "global_step": 187795, "epoch": 1117} {"train_loss": -11.336784362792969, "global_step": 187796, "epoch": 1117} {"train_loss": -11.189115524291992, "global_step": 187797, "epoch": 1117} {"train_loss": -11.083786010742188, "global_step": 187798, "epoch": 1117} {"train_loss": -10.881351470947266, "global_step": 187799, "epoch": 1117} {"train_loss": -11.439576148986816, "global_step": 187800, "epoch": 1117} {"train_loss": -11.600899696350098, "global_step": 187801, "epoch": 1117} {"train_loss": -10.893843650817871, "global_step": 187802, "epoch": 1117} {"train_loss": -11.232831001281738, "global_step": 187803, "epoch": 1117} {"train_loss": -11.404752731323242, "global_step": 187804, "epoch": 1117} {"train_loss": -11.37702751159668, "global_step": 187805, "epoch": 1117} {"train_loss": -10.995431900024414, "global_step": 187806, "epoch": 1117} {"train_loss": -11.124752044677734, "global_step": 187807, "epoch": 1117} {"train_loss": -11.002729415893555, "global_step": 187808, "epoch": 1117} {"train_loss": -11.142282485961914, "global_step": 187809, "epoch": 1117} {"train_loss": -11.19357681274414, "global_step": 187810, "epoch": 1117} {"train_loss": -10.603034019470215, "global_step": 187811, "epoch": 1117} {"train_loss": -11.081966400146484, "global_step": 187812, "epoch": 1117} {"train_loss": -11.082834243774414, "global_step": 187813, "epoch": 1117} {"train_loss": -10.875476837158203, "global_step": 187814, "epoch": 1117} {"train_loss": -10.888117790222168, "global_step": 187815, "epoch": 1117} {"train_loss": -11.028653144836426, "global_step": 187816, "epoch": 1117} {"train_loss": -11.196666717529297, "global_step": 187817, "epoch": 1117} {"train_loss": -11.002132415771484, "global_step": 187818, "epoch": 1117} {"train_loss": -11.178234100341797, "global_step": 187819, "epoch": 1117} {"train_loss": -10.65061092376709, "global_step": 187820, "epoch": 1117} {"train_loss": -11.165494918823242, "global_step": 187821, "epoch": 1117} {"train_loss": -10.757932662963867, "global_step": 187822, "epoch": 1117} {"train_loss": -11.17450441632952, "global_step": 187823, "epoch": 1117, "val_loss": 246478.9375} {"train_loss": -10.634613990783691, "global_step": 187824, "epoch": 1118} {"train_loss": -11.292436599731445, "global_step": 187825, "epoch": 1118} {"train_loss": -10.63919734954834, "global_step": 187826, "epoch": 1118} {"train_loss": -10.552373886108398, "global_step": 187827, "epoch": 1118} {"train_loss": -10.825325965881348, "global_step": 187828, "epoch": 1118} {"train_loss": -10.992597579956055, "global_step": 187829, "epoch": 1118} {"train_loss": -11.085932731628418, "global_step": 187830, "epoch": 1118} {"train_loss": -10.632018089294434, "global_step": 187831, "epoch": 1118} {"train_loss": -11.013334274291992, "global_step": 187832, "epoch": 1118} {"train_loss": -10.579635620117188, "global_step": 187833, "epoch": 1118} {"train_loss": -10.94923210144043, "global_step": 187834, "epoch": 1118} {"train_loss": -10.854405403137207, "global_step": 187835, "epoch": 1118} {"train_loss": -10.453875541687012, "global_step": 187836, "epoch": 1118} {"train_loss": -11.274845123291016, "global_step": 187837, "epoch": 1118} {"train_loss": -10.52271842956543, "global_step": 187838, "epoch": 1118} {"train_loss": -11.388177871704102, "global_step": 187839, "epoch": 1118} {"train_loss": -10.715452194213867, "global_step": 187840, "epoch": 1118} {"train_loss": -11.050124168395996, "global_step": 187841, "epoch": 1118} {"train_loss": -10.880298614501953, "global_step": 187842, "epoch": 1118} {"train_loss": -10.721662521362305, "global_step": 187843, "epoch": 1118} {"train_loss": -10.66018295288086, "global_step": 187844, "epoch": 1118} {"train_loss": -10.213659286499023, "global_step": 187845, "epoch": 1118} {"train_loss": -11.242888450622559, "global_step": 187846, "epoch": 1118} {"train_loss": -10.419788360595703, "global_step": 187847, "epoch": 1118} {"train_loss": -10.707239151000977, "global_step": 187848, "epoch": 1118} {"train_loss": -10.738957405090332, "global_step": 187849, "epoch": 1118} {"train_loss": -10.836563110351562, "global_step": 187850, "epoch": 1118} {"train_loss": -10.828121185302734, "global_step": 187851, "epoch": 1118} {"train_loss": -10.68268871307373, "global_step": 187852, "epoch": 1118} {"train_loss": -11.178101539611816, "global_step": 187853, "epoch": 1118} {"train_loss": -11.004480361938477, "global_step": 187854, "epoch": 1118} {"train_loss": -10.919492721557617, "global_step": 187855, "epoch": 1118} {"train_loss": -11.244888305664062, "global_step": 187856, "epoch": 1118} {"train_loss": -10.99637508392334, "global_step": 187857, "epoch": 1118} {"train_loss": -11.205873489379883, "global_step": 187858, "epoch": 1118} {"train_loss": -11.119597434997559, "global_step": 187859, "epoch": 1118} {"train_loss": -11.286046981811523, "global_step": 187860, "epoch": 1118} {"train_loss": -11.014427185058594, "global_step": 187861, "epoch": 1118} {"train_loss": -11.25732421875, "global_step": 187862, "epoch": 1118} {"train_loss": -11.209033966064453, "global_step": 187863, "epoch": 1118} {"train_loss": -10.826953887939453, "global_step": 187864, "epoch": 1118} {"train_loss": -11.402649879455566, "global_step": 187865, "epoch": 1118} {"train_loss": -11.038981437683105, "global_step": 187866, "epoch": 1118} {"train_loss": -11.268415451049805, "global_step": 187867, "epoch": 1118} {"train_loss": -11.182119369506836, "global_step": 187868, "epoch": 1118} {"train_loss": -11.130041122436523, "global_step": 187869, "epoch": 1118} {"train_loss": -11.153364181518555, "global_step": 187870, "epoch": 1118} {"train_loss": -11.178719520568848, "global_step": 187871, "epoch": 1118} {"train_loss": -10.994139671325684, "global_step": 187872, "epoch": 1118} {"train_loss": -11.371549606323242, "global_step": 187873, "epoch": 1118} {"train_loss": -10.91097354888916, "global_step": 187874, "epoch": 1118} {"train_loss": -11.467082977294922, "global_step": 187875, "epoch": 1118} {"train_loss": -11.237006187438965, "global_step": 187876, "epoch": 1118} {"train_loss": -11.468269348144531, "global_step": 187877, "epoch": 1118} {"train_loss": -11.281122207641602, "global_step": 187878, "epoch": 1118} {"train_loss": -11.172561645507812, "global_step": 187879, "epoch": 1118} {"train_loss": -11.380027770996094, "global_step": 187880, "epoch": 1118} {"train_loss": -11.537755966186523, "global_step": 187881, "epoch": 1118} {"train_loss": -11.401845932006836, "global_step": 187882, "epoch": 1118} {"train_loss": -11.57267951965332, "global_step": 187883, "epoch": 1118} {"train_loss": -11.426889419555664, "global_step": 187884, "epoch": 1118} {"train_loss": -11.61768913269043, "global_step": 187885, "epoch": 1118} {"train_loss": -11.235249519348145, "global_step": 187886, "epoch": 1118} {"train_loss": -11.548174858093262, "global_step": 187887, "epoch": 1118} {"train_loss": -11.370861053466797, "global_step": 187888, "epoch": 1118} {"train_loss": -11.474546432495117, "global_step": 187889, "epoch": 1118} {"train_loss": -11.716228485107422, "global_step": 187890, "epoch": 1118} {"train_loss": -11.518030166625977, "global_step": 187891, "epoch": 1118} {"train_loss": -11.591585159301758, "global_step": 187892, "epoch": 1118} {"train_loss": -11.589838027954102, "global_step": 187893, "epoch": 1118} {"train_loss": -11.659008026123047, "global_step": 187894, "epoch": 1118} {"train_loss": -11.755481719970703, "global_step": 187895, "epoch": 1118} {"train_loss": -11.386222839355469, "global_step": 187896, "epoch": 1118} {"train_loss": -11.602893829345703, "global_step": 187897, "epoch": 1118} {"train_loss": -11.595379829406738, "global_step": 187898, "epoch": 1118} {"train_loss": -11.505657196044922, "global_step": 187899, "epoch": 1118} {"train_loss": -11.583566665649414, "global_step": 187900, "epoch": 1118} {"train_loss": -11.492847442626953, "global_step": 187901, "epoch": 1118} {"train_loss": -11.383331298828125, "global_step": 187902, "epoch": 1118} {"train_loss": -11.67368221282959, "global_step": 187903, "epoch": 1118} {"train_loss": -11.52698040008545, "global_step": 187904, "epoch": 1118} {"train_loss": -11.200237274169922, "global_step": 187905, "epoch": 1118} {"train_loss": -11.500003814697266, "global_step": 187906, "epoch": 1118} {"train_loss": -11.134952545166016, "global_step": 187907, "epoch": 1118} {"train_loss": -11.736555099487305, "global_step": 187908, "epoch": 1118} {"train_loss": -10.91249942779541, "global_step": 187909, "epoch": 1118} {"train_loss": -11.450796127319336, "global_step": 187910, "epoch": 1118} {"train_loss": -11.134198188781738, "global_step": 187911, "epoch": 1118} {"train_loss": -11.605609893798828, "global_step": 187912, "epoch": 1118} {"train_loss": -11.05748176574707, "global_step": 187913, "epoch": 1118} {"train_loss": -11.313719749450684, "global_step": 187914, "epoch": 1118} {"train_loss": -11.285882949829102, "global_step": 187915, "epoch": 1118} {"train_loss": -11.342784881591797, "global_step": 187916, "epoch": 1118} {"train_loss": -11.360145568847656, "global_step": 187917, "epoch": 1118} {"train_loss": -10.832681655883789, "global_step": 187918, "epoch": 1118} {"train_loss": -11.736273765563965, "global_step": 187919, "epoch": 1118} {"train_loss": -11.07783031463623, "global_step": 187920, "epoch": 1118} {"train_loss": -11.480843544006348, "global_step": 187921, "epoch": 1118} {"train_loss": -10.823596954345703, "global_step": 187922, "epoch": 1118} {"train_loss": -11.067296981811523, "global_step": 187923, "epoch": 1118} {"train_loss": -11.267005920410156, "global_step": 187924, "epoch": 1118} {"train_loss": -10.950407981872559, "global_step": 187925, "epoch": 1118} {"train_loss": -10.886812210083008, "global_step": 187926, "epoch": 1118} {"train_loss": -10.374391555786133, "global_step": 187927, "epoch": 1118} {"train_loss": -11.197394371032715, "global_step": 187928, "epoch": 1118} {"train_loss": -10.919454574584961, "global_step": 187929, "epoch": 1118} {"train_loss": -11.049415588378906, "global_step": 187930, "epoch": 1118} {"train_loss": -10.880472183227539, "global_step": 187931, "epoch": 1118} {"train_loss": -10.772192001342773, "global_step": 187932, "epoch": 1118} {"train_loss": -11.035928726196289, "global_step": 187933, "epoch": 1118} {"train_loss": -11.130512237548828, "global_step": 187934, "epoch": 1118} {"train_loss": -10.62850570678711, "global_step": 187935, "epoch": 1118} {"train_loss": -11.377279281616211, "global_step": 187936, "epoch": 1118} {"train_loss": -10.304140090942383, "global_step": 187937, "epoch": 1118} {"train_loss": -10.366055488586426, "global_step": 187938, "epoch": 1118} {"train_loss": -10.981881141662598, "global_step": 187939, "epoch": 1118} {"train_loss": -10.697667121887207, "global_step": 187940, "epoch": 1118} {"train_loss": -10.579999923706055, "global_step": 187941, "epoch": 1118} {"train_loss": -11.33562183380127, "global_step": 187942, "epoch": 1118} {"train_loss": -10.820161819458008, "global_step": 187943, "epoch": 1118} {"train_loss": -10.97606086730957, "global_step": 187944, "epoch": 1118} {"train_loss": -10.886123657226562, "global_step": 187945, "epoch": 1118} {"train_loss": -10.925277709960938, "global_step": 187946, "epoch": 1118} {"train_loss": -10.934022903442383, "global_step": 187947, "epoch": 1118} {"train_loss": -11.12096118927002, "global_step": 187948, "epoch": 1118} {"train_loss": -11.20744800567627, "global_step": 187949, "epoch": 1118} {"train_loss": -11.058893203735352, "global_step": 187950, "epoch": 1118} {"train_loss": -11.103893280029297, "global_step": 187951, "epoch": 1118} {"train_loss": -11.009086608886719, "global_step": 187952, "epoch": 1118} {"train_loss": -11.334843635559082, "global_step": 187953, "epoch": 1118} {"train_loss": -10.954390525817871, "global_step": 187954, "epoch": 1118} {"train_loss": -11.233808517456055, "global_step": 187955, "epoch": 1118} {"train_loss": -11.26453971862793, "global_step": 187956, "epoch": 1118} {"train_loss": -11.088403701782227, "global_step": 187957, "epoch": 1118} {"train_loss": -11.274328231811523, "global_step": 187958, "epoch": 1118} {"train_loss": -11.480547904968262, "global_step": 187959, "epoch": 1118} {"train_loss": -10.875625610351562, "global_step": 187960, "epoch": 1118} {"train_loss": -11.526008605957031, "global_step": 187961, "epoch": 1118} {"train_loss": -10.778160095214844, "global_step": 187962, "epoch": 1118} {"train_loss": -11.233306884765625, "global_step": 187963, "epoch": 1118} {"train_loss": -11.241809844970703, "global_step": 187964, "epoch": 1118} {"train_loss": -11.243569374084473, "global_step": 187965, "epoch": 1118} {"train_loss": -10.994189262390137, "global_step": 187966, "epoch": 1118} {"train_loss": -11.140888214111328, "global_step": 187967, "epoch": 1118} {"train_loss": -10.600069999694824, "global_step": 187968, "epoch": 1118} {"train_loss": -10.785162925720215, "global_step": 187969, "epoch": 1118} {"train_loss": -11.183420181274414, "global_step": 187970, "epoch": 1118} {"train_loss": -10.79475212097168, "global_step": 187971, "epoch": 1118} {"train_loss": -11.321041107177734, "global_step": 187972, "epoch": 1118} {"train_loss": -10.783479690551758, "global_step": 187973, "epoch": 1118} {"train_loss": -11.437124252319336, "global_step": 187974, "epoch": 1118} {"train_loss": -11.26151180267334, "global_step": 187975, "epoch": 1118} {"train_loss": -11.126355171203613, "global_step": 187976, "epoch": 1118} {"train_loss": -10.793853759765625, "global_step": 187977, "epoch": 1118} {"train_loss": -10.786199569702148, "global_step": 187978, "epoch": 1118} {"train_loss": -10.459844589233398, "global_step": 187979, "epoch": 1118} {"train_loss": -10.696928024291992, "global_step": 187980, "epoch": 1118} {"train_loss": -11.007152557373047, "global_step": 187981, "epoch": 1118} {"train_loss": -10.477376937866211, "global_step": 187982, "epoch": 1118} {"train_loss": -10.978647232055664, "global_step": 187983, "epoch": 1118} {"train_loss": -10.90488052368164, "global_step": 187984, "epoch": 1118} {"train_loss": -9.885488510131836, "global_step": 187985, "epoch": 1118} {"train_loss": -10.74203109741211, "global_step": 187986, "epoch": 1118} {"train_loss": -10.451272964477539, "global_step": 187987, "epoch": 1118} {"train_loss": -11.216175079345703, "global_step": 187988, "epoch": 1118} {"train_loss": -10.890167236328125, "global_step": 187989, "epoch": 1118} {"train_loss": -10.751063346862793, "global_step": 187990, "epoch": 1118} {"train_loss": -11.083694060643515, "global_step": 187991, "epoch": 1118, "val_loss": 246828.859375} {"train_loss": -11.021903038024902, "global_step": 187992, "epoch": 1119} {"train_loss": -10.5079927444458, "global_step": 187993, "epoch": 1119} {"train_loss": -10.74569320678711, "global_step": 187994, "epoch": 1119} {"train_loss": -11.033185958862305, "global_step": 187995, "epoch": 1119} {"train_loss": -11.107417106628418, "global_step": 187996, "epoch": 1119} {"train_loss": -11.0740327835083, "global_step": 187997, "epoch": 1119} {"train_loss": -10.784019470214844, "global_step": 187998, "epoch": 1119} {"train_loss": -11.254595756530762, "global_step": 187999, "epoch": 1119} {"train_loss": -11.106386184692383, "global_step": 188000, "epoch": 1119} {"train_loss": -10.741329193115234, "global_step": 188001, "epoch": 1119} {"train_loss": -11.425910949707031, "global_step": 188002, "epoch": 1119} {"train_loss": -11.122051239013672, "global_step": 188003, "epoch": 1119} {"train_loss": -11.220067024230957, "global_step": 188004, "epoch": 1119} {"train_loss": -11.155733108520508, "global_step": 188005, "epoch": 1119} {"train_loss": -11.14018440246582, "global_step": 188006, "epoch": 1119} {"train_loss": -11.166000366210938, "global_step": 188007, "epoch": 1119} {"train_loss": -11.26323127746582, "global_step": 188008, "epoch": 1119} {"train_loss": -11.335911750793457, "global_step": 188009, "epoch": 1119} {"train_loss": -11.338235855102539, "global_step": 188010, "epoch": 1119} {"train_loss": -11.385189056396484, "global_step": 188011, "epoch": 1119} {"train_loss": -11.231473922729492, "global_step": 188012, "epoch": 1119} {"train_loss": -11.112238883972168, "global_step": 188013, "epoch": 1119} {"train_loss": -11.089141845703125, "global_step": 188014, "epoch": 1119} {"train_loss": -10.995183944702148, "global_step": 188015, "epoch": 1119} {"train_loss": -11.299921989440918, "global_step": 188016, "epoch": 1119} {"train_loss": -10.942193984985352, "global_step": 188017, "epoch": 1119} {"train_loss": -11.272379875183105, "global_step": 188018, "epoch": 1119} {"train_loss": -11.094404220581055, "global_step": 188019, "epoch": 1119} {"train_loss": -11.190240859985352, "global_step": 188020, "epoch": 1119} {"train_loss": -11.102981567382812, "global_step": 188021, "epoch": 1119} {"train_loss": -10.98750114440918, "global_step": 188022, "epoch": 1119} {"train_loss": -11.197999954223633, "global_step": 188023, "epoch": 1119} {"train_loss": -11.258392333984375, "global_step": 188024, "epoch": 1119} {"train_loss": -11.150724411010742, "global_step": 188025, "epoch": 1119} {"train_loss": -11.344208717346191, "global_step": 188026, "epoch": 1119} {"train_loss": -10.883956909179688, "global_step": 188027, "epoch": 1119} {"train_loss": -11.370016098022461, "global_step": 188028, "epoch": 1119} {"train_loss": -11.215386390686035, "global_step": 188029, "epoch": 1119} {"train_loss": -11.031808853149414, "global_step": 188030, "epoch": 1119} {"train_loss": -11.354446411132812, "global_step": 188031, "epoch": 1119} {"train_loss": -11.131427764892578, "global_step": 188032, "epoch": 1119} {"train_loss": -11.382993698120117, "global_step": 188033, "epoch": 1119} {"train_loss": -11.346955299377441, "global_step": 188034, "epoch": 1119} {"train_loss": -11.444341659545898, "global_step": 188035, "epoch": 1119} {"train_loss": -11.421928405761719, "global_step": 188036, "epoch": 1119} {"train_loss": -11.426502227783203, "global_step": 188037, "epoch": 1119} {"train_loss": -11.303573608398438, "global_step": 188038, "epoch": 1119} {"train_loss": -11.326976776123047, "global_step": 188039, "epoch": 1119} {"train_loss": -11.200085639953613, "global_step": 188040, "epoch": 1119} {"train_loss": -11.544164657592773, "global_step": 188041, "epoch": 1119} {"train_loss": -11.335044860839844, "global_step": 188042, "epoch": 1119} {"train_loss": -11.36230182647705, "global_step": 188043, "epoch": 1119} {"train_loss": -11.349384307861328, "global_step": 188044, "epoch": 1119} {"train_loss": -11.474813461303711, "global_step": 188045, "epoch": 1119} {"train_loss": -11.30045223236084, "global_step": 188046, "epoch": 1119} {"train_loss": -11.292495727539062, "global_step": 188047, "epoch": 1119} {"train_loss": -11.695744514465332, "global_step": 188048, "epoch": 1119} {"train_loss": -11.446456909179688, "global_step": 188049, "epoch": 1119} {"train_loss": -11.715527534484863, "global_step": 188050, "epoch": 1119} {"train_loss": -11.435684204101562, "global_step": 188051, "epoch": 1119} {"train_loss": -11.252384185791016, "global_step": 188052, "epoch": 1119} {"train_loss": -11.656940460205078, "global_step": 188053, "epoch": 1119} {"train_loss": -11.52252197265625, "global_step": 188054, "epoch": 1119} {"train_loss": -10.879497528076172, "global_step": 188055, "epoch": 1119} {"train_loss": -10.936861991882324, "global_step": 188056, "epoch": 1119} {"train_loss": -11.300256729125977, "global_step": 188057, "epoch": 1119} {"train_loss": -11.507904052734375, "global_step": 188058, "epoch": 1119} {"train_loss": -11.452868461608887, "global_step": 188059, "epoch": 1119} {"train_loss": -11.142655372619629, "global_step": 188060, "epoch": 1119} {"train_loss": -11.315191268920898, "global_step": 188061, "epoch": 1119} {"train_loss": -11.137442588806152, "global_step": 188062, "epoch": 1119} {"train_loss": -11.177814483642578, "global_step": 188063, "epoch": 1119} {"train_loss": -11.387099266052246, "global_step": 188064, "epoch": 1119} {"train_loss": -11.363035202026367, "global_step": 188065, "epoch": 1119} {"train_loss": -11.404370307922363, "global_step": 188066, "epoch": 1119} {"train_loss": -11.72635269165039, "global_step": 188067, "epoch": 1119} {"train_loss": -11.618337631225586, "global_step": 188068, "epoch": 1119} {"train_loss": -11.212430953979492, "global_step": 188069, "epoch": 1119} {"train_loss": -11.401779174804688, "global_step": 188070, "epoch": 1119} {"train_loss": -11.606538772583008, "global_step": 188071, "epoch": 1119} {"train_loss": -11.2051420211792, "global_step": 188072, "epoch": 1119} {"train_loss": -10.423820495605469, "global_step": 188073, "epoch": 1119} {"train_loss": -10.091275215148926, "global_step": 188074, "epoch": 1119} {"train_loss": -11.239703178405762, "global_step": 188075, "epoch": 1119} {"train_loss": -10.913065910339355, "global_step": 188076, "epoch": 1119} {"train_loss": -11.209217071533203, "global_step": 188077, "epoch": 1119} {"train_loss": -10.243788719177246, "global_step": 188078, "epoch": 1119} {"train_loss": -11.25822639465332, "global_step": 188079, "epoch": 1119} {"train_loss": -10.567499160766602, "global_step": 188080, "epoch": 1119} {"train_loss": -11.000677108764648, "global_step": 188081, "epoch": 1119} {"train_loss": -10.646612167358398, "global_step": 188082, "epoch": 1119} {"train_loss": -11.141572952270508, "global_step": 188083, "epoch": 1119} {"train_loss": -11.11330795288086, "global_step": 188084, "epoch": 1119} {"train_loss": -10.413263320922852, "global_step": 188085, "epoch": 1119} {"train_loss": -11.078662872314453, "global_step": 188086, "epoch": 1119} {"train_loss": -11.047966957092285, "global_step": 188087, "epoch": 1119} {"train_loss": -10.213640213012695, "global_step": 188088, "epoch": 1119} {"train_loss": -10.756053924560547, "global_step": 188089, "epoch": 1119} {"train_loss": -10.306154251098633, "global_step": 188090, "epoch": 1119} {"train_loss": -10.497166633605957, "global_step": 188091, "epoch": 1119} {"train_loss": -10.504337310791016, "global_step": 188092, "epoch": 1119} {"train_loss": -10.745870590209961, "global_step": 188093, "epoch": 1119} {"train_loss": -10.687932968139648, "global_step": 188094, "epoch": 1119} {"train_loss": -10.853738784790039, "global_step": 188095, "epoch": 1119} {"train_loss": -11.284097671508789, "global_step": 188096, "epoch": 1119} {"train_loss": -10.731152534484863, "global_step": 188097, "epoch": 1119} {"train_loss": -11.006311416625977, "global_step": 188098, "epoch": 1119} {"train_loss": -10.984633445739746, "global_step": 188099, "epoch": 1119} {"train_loss": -11.131226539611816, "global_step": 188100, "epoch": 1119} {"train_loss": -11.360601425170898, "global_step": 188101, "epoch": 1119} {"train_loss": -11.139686584472656, "global_step": 188102, "epoch": 1119} {"train_loss": -11.361157417297363, "global_step": 188103, "epoch": 1119} {"train_loss": -11.180575370788574, "global_step": 188104, "epoch": 1119} {"train_loss": -10.752836227416992, "global_step": 188105, "epoch": 1119} {"train_loss": -11.410711288452148, "global_step": 188106, "epoch": 1119} {"train_loss": -11.166223526000977, "global_step": 188107, "epoch": 1119} {"train_loss": -11.36883544921875, "global_step": 188108, "epoch": 1119} {"train_loss": -11.321044921875, "global_step": 188109, "epoch": 1119} {"train_loss": -11.391423225402832, "global_step": 188110, "epoch": 1119} {"train_loss": -11.084306716918945, "global_step": 188111, "epoch": 1119} {"train_loss": -11.22962760925293, "global_step": 188112, "epoch": 1119} {"train_loss": -11.454017639160156, "global_step": 188113, "epoch": 1119} {"train_loss": -11.45701789855957, "global_step": 188114, "epoch": 1119} {"train_loss": -11.462879180908203, "global_step": 188115, "epoch": 1119} {"train_loss": -11.353860855102539, "global_step": 188116, "epoch": 1119} {"train_loss": -11.432841300964355, "global_step": 188117, "epoch": 1119} {"train_loss": -11.438505172729492, "global_step": 188118, "epoch": 1119} {"train_loss": -11.541996955871582, "global_step": 188119, "epoch": 1119} {"train_loss": -11.446794509887695, "global_step": 188120, "epoch": 1119} {"train_loss": -11.560571670532227, "global_step": 188121, "epoch": 1119} {"train_loss": -11.358499526977539, "global_step": 188122, "epoch": 1119} {"train_loss": -11.780706405639648, "global_step": 188123, "epoch": 1119} {"train_loss": -11.283056259155273, "global_step": 188124, "epoch": 1119} {"train_loss": -11.61400032043457, "global_step": 188125, "epoch": 1119} {"train_loss": -11.469215393066406, "global_step": 188126, "epoch": 1119} {"train_loss": -11.628049850463867, "global_step": 188127, "epoch": 1119} {"train_loss": -11.58848762512207, "global_step": 188128, "epoch": 1119} {"train_loss": -11.507074356079102, "global_step": 188129, "epoch": 1119} {"train_loss": -11.446388244628906, "global_step": 188130, "epoch": 1119} {"train_loss": -11.507966995239258, "global_step": 188131, "epoch": 1119} {"train_loss": -11.404253959655762, "global_step": 188132, "epoch": 1119} {"train_loss": -11.642936706542969, "global_step": 188133, "epoch": 1119} {"train_loss": -11.35319709777832, "global_step": 188134, "epoch": 1119} {"train_loss": -11.553324699401855, "global_step": 188135, "epoch": 1119} {"train_loss": -11.430286407470703, "global_step": 188136, "epoch": 1119} {"train_loss": -11.19192886352539, "global_step": 188137, "epoch": 1119} {"train_loss": -11.381229400634766, "global_step": 188138, "epoch": 1119} {"train_loss": -11.260472297668457, "global_step": 188139, "epoch": 1119} {"train_loss": -11.097379684448242, "global_step": 188140, "epoch": 1119} {"train_loss": -11.265376091003418, "global_step": 188141, "epoch": 1119} {"train_loss": -11.2293062210083, "global_step": 188142, "epoch": 1119} {"train_loss": -10.651578903198242, "global_step": 188143, "epoch": 1119} {"train_loss": -10.977873802185059, "global_step": 188144, "epoch": 1119} {"train_loss": -10.71871566772461, "global_step": 188145, "epoch": 1119} {"train_loss": -10.734289169311523, "global_step": 188146, "epoch": 1119} {"train_loss": -10.945619583129883, "global_step": 188147, "epoch": 1119} {"train_loss": -11.245771408081055, "global_step": 188148, "epoch": 1119} {"train_loss": -10.632539749145508, "global_step": 188149, "epoch": 1119} {"train_loss": -11.321914672851562, "global_step": 188150, "epoch": 1119} {"train_loss": -10.830561637878418, "global_step": 188151, "epoch": 1119} {"train_loss": -11.305317878723145, "global_step": 188152, "epoch": 1119} {"train_loss": -10.828581809997559, "global_step": 188153, "epoch": 1119} {"train_loss": -11.078980445861816, "global_step": 188154, "epoch": 1119} {"train_loss": -11.490140914916992, "global_step": 188155, "epoch": 1119} {"train_loss": -11.032262802124023, "global_step": 188156, "epoch": 1119} {"train_loss": -11.151742935180664, "global_step": 188157, "epoch": 1119} {"train_loss": -11.470158576965332, "global_step": 188158, "epoch": 1119} {"train_loss": -11.185727232978458, "global_step": 188159, "epoch": 1119, "val_loss": 246619.203125} {"train_loss": -11.491769790649414, "global_step": 188160, "epoch": 1120} {"train_loss": -11.011877059936523, "global_step": 188161, "epoch": 1120} {"train_loss": -11.482555389404297, "global_step": 188162, "epoch": 1120} {"train_loss": -11.352056503295898, "global_step": 188163, "epoch": 1120} {"train_loss": -11.262245178222656, "global_step": 188164, "epoch": 1120} {"train_loss": -10.933615684509277, "global_step": 188165, "epoch": 1120} {"train_loss": -11.573951721191406, "global_step": 188166, "epoch": 1120} {"train_loss": -10.815869331359863, "global_step": 188167, "epoch": 1120} {"train_loss": -11.357488632202148, "global_step": 188168, "epoch": 1120} {"train_loss": -10.857381820678711, "global_step": 188169, "epoch": 1120} {"train_loss": -10.950298309326172, "global_step": 188170, "epoch": 1120} {"train_loss": -11.016579627990723, "global_step": 188171, "epoch": 1120} {"train_loss": -11.391000747680664, "global_step": 188172, "epoch": 1120} {"train_loss": -10.692092895507812, "global_step": 188173, "epoch": 1120} {"train_loss": -11.04244613647461, "global_step": 188174, "epoch": 1120} {"train_loss": -11.210378646850586, "global_step": 188175, "epoch": 1120} {"train_loss": -10.60529899597168, "global_step": 188176, "epoch": 1120} {"train_loss": -11.114923477172852, "global_step": 188177, "epoch": 1120} {"train_loss": -10.982975006103516, "global_step": 188178, "epoch": 1120} {"train_loss": -10.952707290649414, "global_step": 188179, "epoch": 1120} {"train_loss": -10.782981872558594, "global_step": 188180, "epoch": 1120} {"train_loss": -11.273170471191406, "global_step": 188181, "epoch": 1120} {"train_loss": -11.226434707641602, "global_step": 188182, "epoch": 1120} {"train_loss": -10.7862548828125, "global_step": 188183, "epoch": 1120} {"train_loss": -11.000877380371094, "global_step": 188184, "epoch": 1120} {"train_loss": -11.119397163391113, "global_step": 188185, "epoch": 1120} {"train_loss": -11.359289169311523, "global_step": 188186, "epoch": 1120} {"train_loss": -10.973546981811523, "global_step": 188187, "epoch": 1120} {"train_loss": -11.319742202758789, "global_step": 188188, "epoch": 1120} {"train_loss": -11.2003173828125, "global_step": 188189, "epoch": 1120} {"train_loss": -11.32409381866455, "global_step": 188190, "epoch": 1120} {"train_loss": -11.08364486694336, "global_step": 188191, "epoch": 1120} {"train_loss": -10.841743469238281, "global_step": 188192, "epoch": 1120} {"train_loss": -11.190984725952148, "global_step": 188193, "epoch": 1120} {"train_loss": -11.401728630065918, "global_step": 188194, "epoch": 1120} {"train_loss": -11.155118942260742, "global_step": 188195, "epoch": 1120} {"train_loss": -11.029281616210938, "global_step": 188196, "epoch": 1120} {"train_loss": -11.219228744506836, "global_step": 188197, "epoch": 1120} {"train_loss": -10.907011032104492, "global_step": 188198, "epoch": 1120} {"train_loss": -11.033804893493652, "global_step": 188199, "epoch": 1120} {"train_loss": -10.66931438446045, "global_step": 188200, "epoch": 1120} {"train_loss": -10.895339965820312, "global_step": 188201, "epoch": 1120} {"train_loss": -11.111590385437012, "global_step": 188202, "epoch": 1120} {"train_loss": -10.986688613891602, "global_step": 188203, "epoch": 1120} {"train_loss": -11.351892471313477, "global_step": 188204, "epoch": 1120} {"train_loss": -11.187009811401367, "global_step": 188205, "epoch": 1120} {"train_loss": -11.394989013671875, "global_step": 188206, "epoch": 1120} {"train_loss": -11.457579612731934, "global_step": 188207, "epoch": 1120} {"train_loss": -11.039998054504395, "global_step": 188208, "epoch": 1120} {"train_loss": -11.304837226867676, "global_step": 188209, "epoch": 1120} {"train_loss": -11.393467903137207, "global_step": 188210, "epoch": 1120} {"train_loss": -11.494319915771484, "global_step": 188211, "epoch": 1120} {"train_loss": -11.072736740112305, "global_step": 188212, "epoch": 1120} {"train_loss": -11.208663940429688, "global_step": 188213, "epoch": 1120} {"train_loss": -11.65809440612793, "global_step": 188214, "epoch": 1120} {"train_loss": -11.504117965698242, "global_step": 188215, "epoch": 1120} {"train_loss": -11.364587783813477, "global_step": 188216, "epoch": 1120} {"train_loss": -11.400969505310059, "global_step": 188217, "epoch": 1120} {"train_loss": -11.457849502563477, "global_step": 188218, "epoch": 1120} {"train_loss": -11.243768692016602, "global_step": 188219, "epoch": 1120} {"train_loss": -11.242522239685059, "global_step": 188220, "epoch": 1120} {"train_loss": -11.241401672363281, "global_step": 188221, "epoch": 1120} {"train_loss": -11.196425437927246, "global_step": 188222, "epoch": 1120} {"train_loss": -11.142168045043945, "global_step": 188223, "epoch": 1120} {"train_loss": -11.07677173614502, "global_step": 188224, "epoch": 1120} {"train_loss": -11.25070571899414, "global_step": 188225, "epoch": 1120} {"train_loss": -11.21771240234375, "global_step": 188226, "epoch": 1120} {"train_loss": -11.204801559448242, "global_step": 188227, "epoch": 1120} {"train_loss": -11.245439529418945, "global_step": 188228, "epoch": 1120} {"train_loss": -11.586390495300293, "global_step": 188229, "epoch": 1120} {"train_loss": -11.526790618896484, "global_step": 188230, "epoch": 1120} {"train_loss": -11.368514060974121, "global_step": 188231, "epoch": 1120} {"train_loss": -11.21331787109375, "global_step": 188232, "epoch": 1120} {"train_loss": -11.44582462310791, "global_step": 188233, "epoch": 1120} {"train_loss": -11.414306640625, "global_step": 188234, "epoch": 1120} {"train_loss": -10.927899360656738, "global_step": 188235, "epoch": 1120} {"train_loss": -10.996994018554688, "global_step": 188236, "epoch": 1120} {"train_loss": -11.429306030273438, "global_step": 188237, "epoch": 1120} {"train_loss": -11.412677764892578, "global_step": 188238, "epoch": 1120} {"train_loss": -11.155743598937988, "global_step": 188239, "epoch": 1120} {"train_loss": -11.328544616699219, "global_step": 188240, "epoch": 1120} {"train_loss": -11.219560623168945, "global_step": 188241, "epoch": 1120} {"train_loss": -11.25576400756836, "global_step": 188242, "epoch": 1120} {"train_loss": -11.47909927368164, "global_step": 188243, "epoch": 1120} {"train_loss": -11.264612197875977, "global_step": 188244, "epoch": 1120} {"train_loss": -11.45437240600586, "global_step": 188245, "epoch": 1120} {"train_loss": -11.427813529968262, "global_step": 188246, "epoch": 1120} {"train_loss": -11.462374687194824, "global_step": 188247, "epoch": 1120} {"train_loss": -11.184572219848633, "global_step": 188248, "epoch": 1120} {"train_loss": -11.465219497680664, "global_step": 188249, "epoch": 1120} {"train_loss": -11.487564086914062, "global_step": 188250, "epoch": 1120} {"train_loss": -11.742853164672852, "global_step": 188251, "epoch": 1120} {"train_loss": -11.507293701171875, "global_step": 188252, "epoch": 1120} {"train_loss": -11.425801277160645, "global_step": 188253, "epoch": 1120} {"train_loss": -11.345370292663574, "global_step": 188254, "epoch": 1120} {"train_loss": -11.733137130737305, "global_step": 188255, "epoch": 1120} {"train_loss": -11.415582656860352, "global_step": 188256, "epoch": 1120} {"train_loss": -11.458282470703125, "global_step": 188257, "epoch": 1120} {"train_loss": -11.640586853027344, "global_step": 188258, "epoch": 1120} {"train_loss": -11.593475341796875, "global_step": 188259, "epoch": 1120} {"train_loss": -11.455697059631348, "global_step": 188260, "epoch": 1120} {"train_loss": -11.489532470703125, "global_step": 188261, "epoch": 1120} {"train_loss": -11.14539909362793, "global_step": 188262, "epoch": 1120} {"train_loss": -11.586051940917969, "global_step": 188263, "epoch": 1120} {"train_loss": -11.523504257202148, "global_step": 188264, "epoch": 1120} {"train_loss": -11.212789535522461, "global_step": 188265, "epoch": 1120} {"train_loss": -10.241255760192871, "global_step": 188266, "epoch": 1120} {"train_loss": -11.529487609863281, "global_step": 188267, "epoch": 1120} {"train_loss": -10.70486068725586, "global_step": 188268, "epoch": 1120} {"train_loss": -9.680160522460938, "global_step": 188269, "epoch": 1120} {"train_loss": -11.436189651489258, "global_step": 188270, "epoch": 1120} {"train_loss": -10.010091781616211, "global_step": 188271, "epoch": 1120} {"train_loss": -9.470966339111328, "global_step": 188272, "epoch": 1120} {"train_loss": -10.791872024536133, "global_step": 188273, "epoch": 1120} {"train_loss": -9.652524948120117, "global_step": 188274, "epoch": 1120} {"train_loss": -11.118358612060547, "global_step": 188275, "epoch": 1120} {"train_loss": -10.296775817871094, "global_step": 188276, "epoch": 1120} {"train_loss": -10.888650894165039, "global_step": 188277, "epoch": 1120} {"train_loss": -9.81846809387207, "global_step": 188278, "epoch": 1120} {"train_loss": -10.179335594177246, "global_step": 188279, "epoch": 1120} {"train_loss": -9.861913681030273, "global_step": 188280, "epoch": 1120} {"train_loss": -10.511618614196777, "global_step": 188281, "epoch": 1120} {"train_loss": -10.405092239379883, "global_step": 188282, "epoch": 1120} {"train_loss": -10.070310592651367, "global_step": 188283, "epoch": 1120} {"train_loss": -10.599306106567383, "global_step": 188284, "epoch": 1120} {"train_loss": -10.454486846923828, "global_step": 188285, "epoch": 1120} {"train_loss": -10.13410758972168, "global_step": 188286, "epoch": 1120} {"train_loss": -10.690890312194824, "global_step": 188287, "epoch": 1120} {"train_loss": -10.017541885375977, "global_step": 188288, "epoch": 1120} {"train_loss": -10.623186111450195, "global_step": 188289, "epoch": 1120} {"train_loss": -10.367059707641602, "global_step": 188290, "epoch": 1120} {"train_loss": -11.106842041015625, "global_step": 188291, "epoch": 1120} {"train_loss": -10.73007583618164, "global_step": 188292, "epoch": 1120} {"train_loss": -11.292574882507324, "global_step": 188293, "epoch": 1120} {"train_loss": -10.822751998901367, "global_step": 188294, "epoch": 1120} {"train_loss": -10.879888534545898, "global_step": 188295, "epoch": 1120} {"train_loss": -10.66119384765625, "global_step": 188296, "epoch": 1120} {"train_loss": -11.311773300170898, "global_step": 188297, "epoch": 1120} {"train_loss": -10.995694160461426, "global_step": 188298, "epoch": 1120} {"train_loss": -10.874187469482422, "global_step": 188299, "epoch": 1120} {"train_loss": -11.150693893432617, "global_step": 188300, "epoch": 1120} {"train_loss": -11.179969787597656, "global_step": 188301, "epoch": 1120} {"train_loss": -11.319692611694336, "global_step": 188302, "epoch": 1120} {"train_loss": -11.06583309173584, "global_step": 188303, "epoch": 1120} {"train_loss": -11.295493125915527, "global_step": 188304, "epoch": 1120} {"train_loss": -11.103811264038086, "global_step": 188305, "epoch": 1120} {"train_loss": -11.147438049316406, "global_step": 188306, "epoch": 1120} {"train_loss": -11.298287391662598, "global_step": 188307, "epoch": 1120} {"train_loss": -11.282766342163086, "global_step": 188308, "epoch": 1120} {"train_loss": -11.310219764709473, "global_step": 188309, "epoch": 1120} {"train_loss": -11.232965469360352, "global_step": 188310, "epoch": 1120} {"train_loss": -11.135114669799805, "global_step": 188311, "epoch": 1120} {"train_loss": -11.342761039733887, "global_step": 188312, "epoch": 1120} {"train_loss": -11.373897552490234, "global_step": 188313, "epoch": 1120} {"train_loss": -11.261592864990234, "global_step": 188314, "epoch": 1120} {"train_loss": -11.677343368530273, "global_step": 188315, "epoch": 1120} {"train_loss": -11.187395095825195, "global_step": 188316, "epoch": 1120} {"train_loss": -11.359912872314453, "global_step": 188317, "epoch": 1120} {"train_loss": -11.303178787231445, "global_step": 188318, "epoch": 1120} {"train_loss": -11.532012939453125, "global_step": 188319, "epoch": 1120} {"train_loss": -11.184179306030273, "global_step": 188320, "epoch": 1120} {"train_loss": -11.102272033691406, "global_step": 188321, "epoch": 1120} {"train_loss": -11.091510772705078, "global_step": 188322, "epoch": 1120} {"train_loss": -10.874333381652832, "global_step": 188323, "epoch": 1120} {"train_loss": -11.514509201049805, "global_step": 188324, "epoch": 1120} {"train_loss": -11.070001602172852, "global_step": 188325, "epoch": 1120} {"train_loss": -11.381648063659668, "global_step": 188326, "epoch": 1120} {"train_loss": -11.100872948056175, "global_step": 188327, "epoch": 1120, "val_loss": 249573.40625, "train_action_mse_error": 0.3213185966014862} {"train_loss": -11.12179946899414, "global_step": 188328, "epoch": 1121} {"train_loss": -11.251090049743652, "global_step": 188329, "epoch": 1121} {"train_loss": -11.438507080078125, "global_step": 188330, "epoch": 1121} {"train_loss": -11.076672554016113, "global_step": 188331, "epoch": 1121} {"train_loss": -11.27268123626709, "global_step": 188332, "epoch": 1121} {"train_loss": -11.275335311889648, "global_step": 188333, "epoch": 1121} {"train_loss": -11.427371978759766, "global_step": 188334, "epoch": 1121} {"train_loss": -11.418619155883789, "global_step": 188335, "epoch": 1121} {"train_loss": -11.191429138183594, "global_step": 188336, "epoch": 1121} {"train_loss": -11.222599983215332, "global_step": 188337, "epoch": 1121} {"train_loss": -10.876830101013184, "global_step": 188338, "epoch": 1121} {"train_loss": -11.035754203796387, "global_step": 188339, "epoch": 1121} {"train_loss": -11.509502410888672, "global_step": 188340, "epoch": 1121} {"train_loss": -11.033366203308105, "global_step": 188341, "epoch": 1121} {"train_loss": -10.678306579589844, "global_step": 188342, "epoch": 1121} {"train_loss": -11.014098167419434, "global_step": 188343, "epoch": 1121} {"train_loss": -11.329696655273438, "global_step": 188344, "epoch": 1121} {"train_loss": -11.124589920043945, "global_step": 188345, "epoch": 1121} {"train_loss": -11.267753601074219, "global_step": 188346, "epoch": 1121} {"train_loss": -11.29623794555664, "global_step": 188347, "epoch": 1121} {"train_loss": -11.393150329589844, "global_step": 188348, "epoch": 1121} {"train_loss": -11.453278541564941, "global_step": 188349, "epoch": 1121} {"train_loss": -11.502936363220215, "global_step": 188350, "epoch": 1121} {"train_loss": -11.352721214294434, "global_step": 188351, "epoch": 1121} {"train_loss": -11.398920059204102, "global_step": 188352, "epoch": 1121} {"train_loss": -11.429018020629883, "global_step": 188353, "epoch": 1121} {"train_loss": -11.21252727508545, "global_step": 188354, "epoch": 1121} {"train_loss": -11.57070541381836, "global_step": 188355, "epoch": 1121} {"train_loss": -11.447595596313477, "global_step": 188356, "epoch": 1121} {"train_loss": -11.27914047241211, "global_step": 188357, "epoch": 1121} {"train_loss": -11.162097930908203, "global_step": 188358, "epoch": 1121} {"train_loss": -11.270027160644531, "global_step": 188359, "epoch": 1121} {"train_loss": -10.88230037689209, "global_step": 188360, "epoch": 1121} {"train_loss": -11.57386589050293, "global_step": 188361, "epoch": 1121} {"train_loss": -10.940234184265137, "global_step": 188362, "epoch": 1121} {"train_loss": -11.45418930053711, "global_step": 188363, "epoch": 1121} {"train_loss": -11.01030445098877, "global_step": 188364, "epoch": 1121} {"train_loss": -11.413215637207031, "global_step": 188365, "epoch": 1121} {"train_loss": -11.031105041503906, "global_step": 188366, "epoch": 1121} {"train_loss": -11.297033309936523, "global_step": 188367, "epoch": 1121} {"train_loss": -10.252805709838867, "global_step": 188368, "epoch": 1121} {"train_loss": -10.732222557067871, "global_step": 188369, "epoch": 1121} {"train_loss": -11.455565452575684, "global_step": 188370, "epoch": 1121} {"train_loss": -10.759869575500488, "global_step": 188371, "epoch": 1121} {"train_loss": -11.221709251403809, "global_step": 188372, "epoch": 1121} {"train_loss": -10.99206256866455, "global_step": 188373, "epoch": 1121} {"train_loss": -10.609638214111328, "global_step": 188374, "epoch": 1121} {"train_loss": -11.609674453735352, "global_step": 188375, "epoch": 1121} {"train_loss": -10.653521537780762, "global_step": 188376, "epoch": 1121} {"train_loss": -10.649736404418945, "global_step": 188377, "epoch": 1121} {"train_loss": -11.536081314086914, "global_step": 188378, "epoch": 1121} {"train_loss": -11.165684700012207, "global_step": 188379, "epoch": 1121} {"train_loss": -11.006199836730957, "global_step": 188380, "epoch": 1121} {"train_loss": -11.271811485290527, "global_step": 188381, "epoch": 1121} {"train_loss": -10.88435173034668, "global_step": 188382, "epoch": 1121} {"train_loss": -10.715254783630371, "global_step": 188383, "epoch": 1121} {"train_loss": -11.149248123168945, "global_step": 188384, "epoch": 1121} {"train_loss": -11.071477890014648, "global_step": 188385, "epoch": 1121} {"train_loss": -11.358307838439941, "global_step": 188386, "epoch": 1121} {"train_loss": -10.759857177734375, "global_step": 188387, "epoch": 1121} {"train_loss": -10.851727485656738, "global_step": 188388, "epoch": 1121} {"train_loss": -11.141759872436523, "global_step": 188389, "epoch": 1121} {"train_loss": -10.483484268188477, "global_step": 188390, "epoch": 1121} {"train_loss": -10.814997673034668, "global_step": 188391, "epoch": 1121} {"train_loss": -11.239415168762207, "global_step": 188392, "epoch": 1121} {"train_loss": -11.060195922851562, "global_step": 188393, "epoch": 1121} {"train_loss": -10.905468940734863, "global_step": 188394, "epoch": 1121} {"train_loss": -11.155132293701172, "global_step": 188395, "epoch": 1121} {"train_loss": -10.890777587890625, "global_step": 188396, "epoch": 1121} {"train_loss": -11.203448295593262, "global_step": 188397, "epoch": 1121} {"train_loss": -10.847768783569336, "global_step": 188398, "epoch": 1121} {"train_loss": -11.000905990600586, "global_step": 188399, "epoch": 1121} {"train_loss": -10.92460823059082, "global_step": 188400, "epoch": 1121} {"train_loss": -11.03248405456543, "global_step": 188401, "epoch": 1121} {"train_loss": -11.171040534973145, "global_step": 188402, "epoch": 1121} {"train_loss": -11.057077407836914, "global_step": 188403, "epoch": 1121} {"train_loss": -11.357608795166016, "global_step": 188404, "epoch": 1121} {"train_loss": -11.0130615234375, "global_step": 188405, "epoch": 1121} {"train_loss": -11.27750015258789, "global_step": 188406, "epoch": 1121} {"train_loss": -11.156402587890625, "global_step": 188407, "epoch": 1121} {"train_loss": -11.360827445983887, "global_step": 188408, "epoch": 1121} {"train_loss": -11.098140716552734, "global_step": 188409, "epoch": 1121} {"train_loss": -11.362370491027832, "global_step": 188410, "epoch": 1121} {"train_loss": -11.132133483886719, "global_step": 188411, "epoch": 1121} {"train_loss": -11.2250337600708, "global_step": 188412, "epoch": 1121} {"train_loss": -11.03773307800293, "global_step": 188413, "epoch": 1121} {"train_loss": -10.943115234375, "global_step": 188414, "epoch": 1121} {"train_loss": -11.5565185546875, "global_step": 188415, "epoch": 1121} {"train_loss": -11.47060775756836, "global_step": 188416, "epoch": 1121} {"train_loss": -11.377151489257812, "global_step": 188417, "epoch": 1121} {"train_loss": -11.461132049560547, "global_step": 188418, "epoch": 1121} {"train_loss": -11.376927375793457, "global_step": 188419, "epoch": 1121} {"train_loss": -11.528892517089844, "global_step": 188420, "epoch": 1121} {"train_loss": -11.359776496887207, "global_step": 188421, "epoch": 1121} {"train_loss": -11.265460014343262, "global_step": 188422, "epoch": 1121} {"train_loss": -11.485758781433105, "global_step": 188423, "epoch": 1121} {"train_loss": -11.603731155395508, "global_step": 188424, "epoch": 1121} {"train_loss": -11.491572380065918, "global_step": 188425, "epoch": 1121} {"train_loss": -11.433492660522461, "global_step": 188426, "epoch": 1121} {"train_loss": -11.441081047058105, "global_step": 188427, "epoch": 1121} {"train_loss": -11.355949401855469, "global_step": 188428, "epoch": 1121} {"train_loss": -11.173554420471191, "global_step": 188429, "epoch": 1121} {"train_loss": -11.283935546875, "global_step": 188430, "epoch": 1121} {"train_loss": -11.329330444335938, "global_step": 188431, "epoch": 1121} {"train_loss": -11.310977935791016, "global_step": 188432, "epoch": 1121} {"train_loss": -11.307119369506836, "global_step": 188433, "epoch": 1121} {"train_loss": -11.144248962402344, "global_step": 188434, "epoch": 1121} {"train_loss": -11.168676376342773, "global_step": 188435, "epoch": 1121} {"train_loss": -11.215787887573242, "global_step": 188436, "epoch": 1121} {"train_loss": -11.30670166015625, "global_step": 188437, "epoch": 1121} {"train_loss": -11.125028610229492, "global_step": 188438, "epoch": 1121} {"train_loss": -11.175861358642578, "global_step": 188439, "epoch": 1121} {"train_loss": -10.920583724975586, "global_step": 188440, "epoch": 1121} {"train_loss": -10.818219184875488, "global_step": 188441, "epoch": 1121} {"train_loss": -11.466952323913574, "global_step": 188442, "epoch": 1121} {"train_loss": -11.046409606933594, "global_step": 188443, "epoch": 1121} {"train_loss": -11.12984848022461, "global_step": 188444, "epoch": 1121} {"train_loss": -11.307943344116211, "global_step": 188445, "epoch": 1121} {"train_loss": -11.361090660095215, "global_step": 188446, "epoch": 1121} {"train_loss": -11.435903549194336, "global_step": 188447, "epoch": 1121} {"train_loss": -11.293318748474121, "global_step": 188448, "epoch": 1121} {"train_loss": -11.473105430603027, "global_step": 188449, "epoch": 1121} {"train_loss": -11.358657836914062, "global_step": 188450, "epoch": 1121} {"train_loss": -11.125388145446777, "global_step": 188451, "epoch": 1121} {"train_loss": -11.454809188842773, "global_step": 188452, "epoch": 1121} {"train_loss": -11.236076354980469, "global_step": 188453, "epoch": 1121} {"train_loss": -11.186436653137207, "global_step": 188454, "epoch": 1121} {"train_loss": -11.431232452392578, "global_step": 188455, "epoch": 1121} {"train_loss": -10.849279403686523, "global_step": 188456, "epoch": 1121} {"train_loss": -11.036760330200195, "global_step": 188457, "epoch": 1121} {"train_loss": -10.607181549072266, "global_step": 188458, "epoch": 1121} {"train_loss": -11.145223617553711, "global_step": 188459, "epoch": 1121} {"train_loss": -11.24789047241211, "global_step": 188460, "epoch": 1121} {"train_loss": -11.193506240844727, "global_step": 188461, "epoch": 1121} {"train_loss": -11.302215576171875, "global_step": 188462, "epoch": 1121} {"train_loss": -11.211808204650879, "global_step": 188463, "epoch": 1121} {"train_loss": -10.850255966186523, "global_step": 188464, "epoch": 1121} {"train_loss": -11.323518753051758, "global_step": 188465, "epoch": 1121} {"train_loss": -10.767863273620605, "global_step": 188466, "epoch": 1121} {"train_loss": -11.266327857971191, "global_step": 188467, "epoch": 1121} {"train_loss": -10.498156547546387, "global_step": 188468, "epoch": 1121} {"train_loss": -11.306024551391602, "global_step": 188469, "epoch": 1121} {"train_loss": -10.750051498413086, "global_step": 188470, "epoch": 1121} {"train_loss": -11.042512893676758, "global_step": 188471, "epoch": 1121} {"train_loss": -10.96037483215332, "global_step": 188472, "epoch": 1121} {"train_loss": -10.701401710510254, "global_step": 188473, "epoch": 1121} {"train_loss": -11.068929672241211, "global_step": 188474, "epoch": 1121} {"train_loss": -10.823203086853027, "global_step": 188475, "epoch": 1121} {"train_loss": -11.615424156188965, "global_step": 188476, "epoch": 1121} {"train_loss": -11.260223388671875, "global_step": 188477, "epoch": 1121} {"train_loss": -11.337776184082031, "global_step": 188478, "epoch": 1121} {"train_loss": -11.42198371887207, "global_step": 188479, "epoch": 1121} {"train_loss": -11.094075202941895, "global_step": 188480, "epoch": 1121} {"train_loss": -11.367171287536621, "global_step": 188481, "epoch": 1121} {"train_loss": -11.429145812988281, "global_step": 188482, "epoch": 1121} {"train_loss": -11.177343368530273, "global_step": 188483, "epoch": 1121} {"train_loss": -11.385462760925293, "global_step": 188484, "epoch": 1121} {"train_loss": -11.469891548156738, "global_step": 188485, "epoch": 1121} {"train_loss": -11.415733337402344, "global_step": 188486, "epoch": 1121} {"train_loss": -11.5370454788208, "global_step": 188487, "epoch": 1121} {"train_loss": -11.318940162658691, "global_step": 188488, "epoch": 1121} {"train_loss": -11.646673202514648, "global_step": 188489, "epoch": 1121} {"train_loss": -11.155206680297852, "global_step": 188490, "epoch": 1121} {"train_loss": -11.602577209472656, "global_step": 188491, "epoch": 1121} {"train_loss": -11.368062019348145, "global_step": 188492, "epoch": 1121} {"train_loss": -11.24649429321289, "global_step": 188493, "epoch": 1121} {"train_loss": -11.518352508544922, "global_step": 188494, "epoch": 1121} {"train_loss": -11.189924489884149, "global_step": 188495, "epoch": 1121, "val_loss": 247980.109375} {"train_loss": -11.422211647033691, "global_step": 188496, "epoch": 1122} {"train_loss": -11.475610733032227, "global_step": 188497, "epoch": 1122} {"train_loss": -11.333224296569824, "global_step": 188498, "epoch": 1122} {"train_loss": -11.2227783203125, "global_step": 188499, "epoch": 1122} {"train_loss": -11.510246276855469, "global_step": 188500, "epoch": 1122} {"train_loss": -11.412044525146484, "global_step": 188501, "epoch": 1122} {"train_loss": -11.3943510055542, "global_step": 188502, "epoch": 1122} {"train_loss": -11.70418930053711, "global_step": 188503, "epoch": 1122} {"train_loss": -11.466135025024414, "global_step": 188504, "epoch": 1122} {"train_loss": -11.543018341064453, "global_step": 188505, "epoch": 1122} {"train_loss": -11.62908935546875, "global_step": 188506, "epoch": 1122} {"train_loss": -11.36951732635498, "global_step": 188507, "epoch": 1122} {"train_loss": -11.671101570129395, "global_step": 188508, "epoch": 1122} {"train_loss": -11.55551815032959, "global_step": 188509, "epoch": 1122} {"train_loss": -11.250869750976562, "global_step": 188510, "epoch": 1122} {"train_loss": -11.645663261413574, "global_step": 188511, "epoch": 1122} {"train_loss": -11.470059394836426, "global_step": 188512, "epoch": 1122} {"train_loss": -10.879743576049805, "global_step": 188513, "epoch": 1122} {"train_loss": -11.270923614501953, "global_step": 188514, "epoch": 1122} {"train_loss": -11.562820434570312, "global_step": 188515, "epoch": 1122} {"train_loss": -11.165135383605957, "global_step": 188516, "epoch": 1122} {"train_loss": -11.024954795837402, "global_step": 188517, "epoch": 1122} {"train_loss": -10.83265495300293, "global_step": 188518, "epoch": 1122} {"train_loss": -11.378828048706055, "global_step": 188519, "epoch": 1122} {"train_loss": -10.742639541625977, "global_step": 188520, "epoch": 1122} {"train_loss": -11.112812042236328, "global_step": 188521, "epoch": 1122} {"train_loss": -10.386228561401367, "global_step": 188522, "epoch": 1122} {"train_loss": -9.913912773132324, "global_step": 188523, "epoch": 1122} {"train_loss": -9.888782501220703, "global_step": 188524, "epoch": 1122} {"train_loss": -9.875560760498047, "global_step": 188525, "epoch": 1122} {"train_loss": -9.729788780212402, "global_step": 188526, "epoch": 1122} {"train_loss": -10.043283462524414, "global_step": 188527, "epoch": 1122} {"train_loss": -9.929542541503906, "global_step": 188528, "epoch": 1122} {"train_loss": -10.007274627685547, "global_step": 188529, "epoch": 1122} {"train_loss": -10.330501556396484, "global_step": 188530, "epoch": 1122} {"train_loss": -9.163135528564453, "global_step": 188531, "epoch": 1122} {"train_loss": -10.835801124572754, "global_step": 188532, "epoch": 1122} {"train_loss": -9.552682876586914, "global_step": 188533, "epoch": 1122} {"train_loss": -10.104061126708984, "global_step": 188534, "epoch": 1122} {"train_loss": -10.138965606689453, "global_step": 188535, "epoch": 1122} {"train_loss": -9.966239929199219, "global_step": 188536, "epoch": 1122} {"train_loss": -9.300383567810059, "global_step": 188537, "epoch": 1122} {"train_loss": -10.2844877243042, "global_step": 188538, "epoch": 1122} {"train_loss": -9.808945655822754, "global_step": 188539, "epoch": 1122} {"train_loss": -10.417830467224121, "global_step": 188540, "epoch": 1122} {"train_loss": -10.734235763549805, "global_step": 188541, "epoch": 1122} {"train_loss": -10.41512680053711, "global_step": 188542, "epoch": 1122} {"train_loss": -10.10737419128418, "global_step": 188543, "epoch": 1122} {"train_loss": -10.521763801574707, "global_step": 188544, "epoch": 1122} {"train_loss": -9.891886711120605, "global_step": 188545, "epoch": 1122} {"train_loss": -10.82420539855957, "global_step": 188546, "epoch": 1122} {"train_loss": -10.159679412841797, "global_step": 188547, "epoch": 1122} {"train_loss": -10.742626190185547, "global_step": 188548, "epoch": 1122} {"train_loss": -10.567703247070312, "global_step": 188549, "epoch": 1122} {"train_loss": -10.760644912719727, "global_step": 188550, "epoch": 1122} {"train_loss": -10.548293113708496, "global_step": 188551, "epoch": 1122} {"train_loss": -10.3810453414917, "global_step": 188552, "epoch": 1122} {"train_loss": -10.963252067565918, "global_step": 188553, "epoch": 1122} {"train_loss": -10.672548294067383, "global_step": 188554, "epoch": 1122} {"train_loss": -9.86562442779541, "global_step": 188555, "epoch": 1122} {"train_loss": -10.752151489257812, "global_step": 188556, "epoch": 1122} {"train_loss": -10.77165412902832, "global_step": 188557, "epoch": 1122} {"train_loss": -10.710835456848145, "global_step": 188558, "epoch": 1122} {"train_loss": -10.865327835083008, "global_step": 188559, "epoch": 1122} {"train_loss": -11.136201858520508, "global_step": 188560, "epoch": 1122} {"train_loss": -10.633990287780762, "global_step": 188561, "epoch": 1122} {"train_loss": -10.954288482666016, "global_step": 188562, "epoch": 1122} {"train_loss": -10.84531021118164, "global_step": 188563, "epoch": 1122} {"train_loss": -10.945109367370605, "global_step": 188564, "epoch": 1122} {"train_loss": -11.173255920410156, "global_step": 188565, "epoch": 1122} {"train_loss": -10.948265075683594, "global_step": 188566, "epoch": 1122} {"train_loss": -10.964141845703125, "global_step": 188567, "epoch": 1122} {"train_loss": -10.97932243347168, "global_step": 188568, "epoch": 1122} {"train_loss": -10.904468536376953, "global_step": 188569, "epoch": 1122} {"train_loss": -10.909687042236328, "global_step": 188570, "epoch": 1122} {"train_loss": -11.129579544067383, "global_step": 188571, "epoch": 1122} {"train_loss": -11.041545867919922, "global_step": 188572, "epoch": 1122} {"train_loss": -11.275001525878906, "global_step": 188573, "epoch": 1122} {"train_loss": -10.999443054199219, "global_step": 188574, "epoch": 1122} {"train_loss": -11.091443061828613, "global_step": 188575, "epoch": 1122} {"train_loss": -11.122779846191406, "global_step": 188576, "epoch": 1122} {"train_loss": -11.218071937561035, "global_step": 188577, "epoch": 1122} {"train_loss": -11.319536209106445, "global_step": 188578, "epoch": 1122} {"train_loss": -11.133033752441406, "global_step": 188579, "epoch": 1122} {"train_loss": -11.138143539428711, "global_step": 188580, "epoch": 1122} {"train_loss": -11.184194564819336, "global_step": 188581, "epoch": 1122} {"train_loss": -11.439102172851562, "global_step": 188582, "epoch": 1122} {"train_loss": -11.052572250366211, "global_step": 188583, "epoch": 1122} {"train_loss": -11.41222858428955, "global_step": 188584, "epoch": 1122} {"train_loss": -11.295149803161621, "global_step": 188585, "epoch": 1122} {"train_loss": -11.136919021606445, "global_step": 188586, "epoch": 1122} {"train_loss": -11.499545097351074, "global_step": 188587, "epoch": 1122} {"train_loss": -11.690425872802734, "global_step": 188588, "epoch": 1122} {"train_loss": -11.254369735717773, "global_step": 188589, "epoch": 1122} {"train_loss": -11.141668319702148, "global_step": 188590, "epoch": 1122} {"train_loss": -11.249465942382812, "global_step": 188591, "epoch": 1122} {"train_loss": -11.35363483428955, "global_step": 188592, "epoch": 1122} {"train_loss": -11.347464561462402, "global_step": 188593, "epoch": 1122} {"train_loss": -11.423192024230957, "global_step": 188594, "epoch": 1122} {"train_loss": -11.242469787597656, "global_step": 188595, "epoch": 1122} {"train_loss": -11.610042572021484, "global_step": 188596, "epoch": 1122} {"train_loss": -11.455917358398438, "global_step": 188597, "epoch": 1122} {"train_loss": -11.296808242797852, "global_step": 188598, "epoch": 1122} {"train_loss": -11.467403411865234, "global_step": 188599, "epoch": 1122} {"train_loss": -11.43084716796875, "global_step": 188600, "epoch": 1122} {"train_loss": -11.448526382446289, "global_step": 188601, "epoch": 1122} {"train_loss": -11.4364652633667, "global_step": 188602, "epoch": 1122} {"train_loss": -11.486001014709473, "global_step": 188603, "epoch": 1122} {"train_loss": -11.39803695678711, "global_step": 188604, "epoch": 1122} {"train_loss": -11.628068923950195, "global_step": 188605, "epoch": 1122} {"train_loss": -11.636392593383789, "global_step": 188606, "epoch": 1122} {"train_loss": -11.591035842895508, "global_step": 188607, "epoch": 1122} {"train_loss": -11.449262619018555, "global_step": 188608, "epoch": 1122} {"train_loss": -11.501383781433105, "global_step": 188609, "epoch": 1122} {"train_loss": -11.44964599609375, "global_step": 188610, "epoch": 1122} {"train_loss": -11.570329666137695, "global_step": 188611, "epoch": 1122} {"train_loss": -11.709604263305664, "global_step": 188612, "epoch": 1122} {"train_loss": -11.349523544311523, "global_step": 188613, "epoch": 1122} {"train_loss": -11.459707260131836, "global_step": 188614, "epoch": 1122} {"train_loss": -11.417011260986328, "global_step": 188615, "epoch": 1122} {"train_loss": -10.867841720581055, "global_step": 188616, "epoch": 1122} {"train_loss": -11.316113471984863, "global_step": 188617, "epoch": 1122} {"train_loss": -11.405706405639648, "global_step": 188618, "epoch": 1122} {"train_loss": -10.75096321105957, "global_step": 188619, "epoch": 1122} {"train_loss": -10.863981246948242, "global_step": 188620, "epoch": 1122} {"train_loss": -11.334552764892578, "global_step": 188621, "epoch": 1122} {"train_loss": -11.011512756347656, "global_step": 188622, "epoch": 1122} {"train_loss": -11.402597427368164, "global_step": 188623, "epoch": 1122} {"train_loss": -11.387592315673828, "global_step": 188624, "epoch": 1122} {"train_loss": -11.321922302246094, "global_step": 188625, "epoch": 1122} {"train_loss": -11.207601547241211, "global_step": 188626, "epoch": 1122} {"train_loss": -11.493053436279297, "global_step": 188627, "epoch": 1122} {"train_loss": -10.948479652404785, "global_step": 188628, "epoch": 1122} {"train_loss": -11.485448837280273, "global_step": 188629, "epoch": 1122} {"train_loss": -11.58779525756836, "global_step": 188630, "epoch": 1122} {"train_loss": -11.422235488891602, "global_step": 188631, "epoch": 1122} {"train_loss": -11.26483154296875, "global_step": 188632, "epoch": 1122} {"train_loss": -11.583958625793457, "global_step": 188633, "epoch": 1122} {"train_loss": -11.56937026977539, "global_step": 188634, "epoch": 1122} {"train_loss": -11.405719757080078, "global_step": 188635, "epoch": 1122} {"train_loss": -11.63376235961914, "global_step": 188636, "epoch": 1122} {"train_loss": -11.361198425292969, "global_step": 188637, "epoch": 1122} {"train_loss": -11.722305297851562, "global_step": 188638, "epoch": 1122} {"train_loss": -11.662435531616211, "global_step": 188639, "epoch": 1122} {"train_loss": -11.528550148010254, "global_step": 188640, "epoch": 1122} {"train_loss": -11.648086547851562, "global_step": 188641, "epoch": 1122} {"train_loss": -11.551529884338379, "global_step": 188642, "epoch": 1122} {"train_loss": -11.251235961914062, "global_step": 188643, "epoch": 1122} {"train_loss": -11.44875431060791, "global_step": 188644, "epoch": 1122} {"train_loss": -11.861739158630371, "global_step": 188645, "epoch": 1122} {"train_loss": -11.683004379272461, "global_step": 188646, "epoch": 1122} {"train_loss": -11.597622871398926, "global_step": 188647, "epoch": 1122} {"train_loss": -11.529895782470703, "global_step": 188648, "epoch": 1122} {"train_loss": -11.550178527832031, "global_step": 188649, "epoch": 1122} {"train_loss": -11.378889083862305, "global_step": 188650, "epoch": 1122} {"train_loss": -11.516977310180664, "global_step": 188651, "epoch": 1122} {"train_loss": -11.44729995727539, "global_step": 188652, "epoch": 1122} {"train_loss": -11.44262981414795, "global_step": 188653, "epoch": 1122} {"train_loss": -11.179306030273438, "global_step": 188654, "epoch": 1122} {"train_loss": -11.21824836730957, "global_step": 188655, "epoch": 1122} {"train_loss": -11.49394416809082, "global_step": 188656, "epoch": 1122} {"train_loss": -11.295364379882812, "global_step": 188657, "epoch": 1122} {"train_loss": -11.009757995605469, "global_step": 188658, "epoch": 1122} {"train_loss": -10.707330703735352, "global_step": 188659, "epoch": 1122} {"train_loss": -10.491830825805664, "global_step": 188660, "epoch": 1122} {"train_loss": -11.112284660339355, "global_step": 188661, "epoch": 1122} {"train_loss": -10.464500427246094, "global_step": 188662, "epoch": 1122} {"train_loss": -11.067467258090065, "global_step": 188663, "epoch": 1122, "val_loss": 246390.5} {"train_loss": -9.735189437866211, "global_step": 188664, "epoch": 1123} {"train_loss": -10.405231475830078, "global_step": 188665, "epoch": 1123} {"train_loss": -10.651790618896484, "global_step": 188666, "epoch": 1123} {"train_loss": -10.756145477294922, "global_step": 188667, "epoch": 1123} {"train_loss": -9.762554168701172, "global_step": 188668, "epoch": 1123} {"train_loss": -10.711933135986328, "global_step": 188669, "epoch": 1123} {"train_loss": -10.59744644165039, "global_step": 188670, "epoch": 1123} {"train_loss": -10.086578369140625, "global_step": 188671, "epoch": 1123} {"train_loss": -10.820083618164062, "global_step": 188672, "epoch": 1123} {"train_loss": -9.541309356689453, "global_step": 188673, "epoch": 1123} {"train_loss": -10.902191162109375, "global_step": 188674, "epoch": 1123} {"train_loss": -9.780410766601562, "global_step": 188675, "epoch": 1123} {"train_loss": -10.902203559875488, "global_step": 188676, "epoch": 1123} {"train_loss": -10.382777214050293, "global_step": 188677, "epoch": 1123} {"train_loss": -11.260063171386719, "global_step": 188678, "epoch": 1123} {"train_loss": -10.084797859191895, "global_step": 188679, "epoch": 1123} {"train_loss": -10.339654922485352, "global_step": 188680, "epoch": 1123} {"train_loss": -10.39461898803711, "global_step": 188681, "epoch": 1123} {"train_loss": -9.313618659973145, "global_step": 188682, "epoch": 1123} {"train_loss": -10.965394973754883, "global_step": 188683, "epoch": 1123} {"train_loss": -9.758360862731934, "global_step": 188684, "epoch": 1123} {"train_loss": -10.897220611572266, "global_step": 188685, "epoch": 1123} {"train_loss": -10.534907341003418, "global_step": 188686, "epoch": 1123} {"train_loss": -10.526599884033203, "global_step": 188687, "epoch": 1123} {"train_loss": -10.7200288772583, "global_step": 188688, "epoch": 1123} {"train_loss": -10.595304489135742, "global_step": 188689, "epoch": 1123} {"train_loss": -10.926912307739258, "global_step": 188690, "epoch": 1123} {"train_loss": -10.780162811279297, "global_step": 188691, "epoch": 1123} {"train_loss": -10.878293991088867, "global_step": 188692, "epoch": 1123} {"train_loss": -10.891459465026855, "global_step": 188693, "epoch": 1123} {"train_loss": -10.989185333251953, "global_step": 188694, "epoch": 1123} {"train_loss": -10.67735481262207, "global_step": 188695, "epoch": 1123} {"train_loss": -11.366571426391602, "global_step": 188696, "epoch": 1123} {"train_loss": -10.87578010559082, "global_step": 188697, "epoch": 1123} {"train_loss": -11.251382827758789, "global_step": 188698, "epoch": 1123} {"train_loss": -11.301454544067383, "global_step": 188699, "epoch": 1123} {"train_loss": -10.94841480255127, "global_step": 188700, "epoch": 1123} {"train_loss": -10.947062492370605, "global_step": 188701, "epoch": 1123} {"train_loss": -10.879801750183105, "global_step": 188702, "epoch": 1123} {"train_loss": -10.9747896194458, "global_step": 188703, "epoch": 1123} {"train_loss": -11.174213409423828, "global_step": 188704, "epoch": 1123} {"train_loss": -11.35365104675293, "global_step": 188705, "epoch": 1123} {"train_loss": -11.082911491394043, "global_step": 188706, "epoch": 1123} {"train_loss": -11.14455795288086, "global_step": 188707, "epoch": 1123} {"train_loss": -11.441244125366211, "global_step": 188708, "epoch": 1123} {"train_loss": -11.03681755065918, "global_step": 188709, "epoch": 1123} {"train_loss": -11.43773365020752, "global_step": 188710, "epoch": 1123} {"train_loss": -11.282373428344727, "global_step": 188711, "epoch": 1123} {"train_loss": -11.21147346496582, "global_step": 188712, "epoch": 1123} {"train_loss": -11.324857711791992, "global_step": 188713, "epoch": 1123} {"train_loss": -11.225971221923828, "global_step": 188714, "epoch": 1123} {"train_loss": -11.354459762573242, "global_step": 188715, "epoch": 1123} {"train_loss": -11.48388671875, "global_step": 188716, "epoch": 1123} {"train_loss": -11.36025619506836, "global_step": 188717, "epoch": 1123} {"train_loss": -11.275577545166016, "global_step": 188718, "epoch": 1123} {"train_loss": -11.373003959655762, "global_step": 188719, "epoch": 1123} {"train_loss": -11.318387985229492, "global_step": 188720, "epoch": 1123} {"train_loss": -11.294175148010254, "global_step": 188721, "epoch": 1123} {"train_loss": -11.301538467407227, "global_step": 188722, "epoch": 1123} {"train_loss": -11.056896209716797, "global_step": 188723, "epoch": 1123} {"train_loss": -11.326566696166992, "global_step": 188724, "epoch": 1123} {"train_loss": -11.4689302444458, "global_step": 188725, "epoch": 1123} {"train_loss": -11.455829620361328, "global_step": 188726, "epoch": 1123} {"train_loss": -11.35230827331543, "global_step": 188727, "epoch": 1123} {"train_loss": -11.20491886138916, "global_step": 188728, "epoch": 1123} {"train_loss": -11.4839448928833, "global_step": 188729, "epoch": 1123} {"train_loss": -11.071796417236328, "global_step": 188730, "epoch": 1123} {"train_loss": -11.521055221557617, "global_step": 188731, "epoch": 1123} {"train_loss": -11.015718460083008, "global_step": 188732, "epoch": 1123} {"train_loss": -11.444499969482422, "global_step": 188733, "epoch": 1123} {"train_loss": -11.122117042541504, "global_step": 188734, "epoch": 1123} {"train_loss": -11.643365859985352, "global_step": 188735, "epoch": 1123} {"train_loss": -11.295658111572266, "global_step": 188736, "epoch": 1123} {"train_loss": -11.339338302612305, "global_step": 188737, "epoch": 1123} {"train_loss": -11.206409454345703, "global_step": 188738, "epoch": 1123} {"train_loss": -11.267133712768555, "global_step": 188739, "epoch": 1123} {"train_loss": -11.231344223022461, "global_step": 188740, "epoch": 1123} {"train_loss": -11.395662307739258, "global_step": 188741, "epoch": 1123} {"train_loss": -11.143523216247559, "global_step": 188742, "epoch": 1123} {"train_loss": -11.149824142456055, "global_step": 188743, "epoch": 1123} {"train_loss": -11.164957046508789, "global_step": 188744, "epoch": 1123} {"train_loss": -11.436450958251953, "global_step": 188745, "epoch": 1123} {"train_loss": -11.453597068786621, "global_step": 188746, "epoch": 1123} {"train_loss": -10.439657211303711, "global_step": 188747, "epoch": 1123} {"train_loss": -11.101726531982422, "global_step": 188748, "epoch": 1123} {"train_loss": -10.689611434936523, "global_step": 188749, "epoch": 1123} {"train_loss": -10.657194137573242, "global_step": 188750, "epoch": 1123} {"train_loss": -10.794075012207031, "global_step": 188751, "epoch": 1123} {"train_loss": -11.206859588623047, "global_step": 188752, "epoch": 1123} {"train_loss": -11.011093139648438, "global_step": 188753, "epoch": 1123} {"train_loss": -11.502803802490234, "global_step": 188754, "epoch": 1123} {"train_loss": -10.490466117858887, "global_step": 188755, "epoch": 1123} {"train_loss": -10.784563064575195, "global_step": 188756, "epoch": 1123} {"train_loss": -11.458125114440918, "global_step": 188757, "epoch": 1123} {"train_loss": -10.886452674865723, "global_step": 188758, "epoch": 1123} {"train_loss": -11.039125442504883, "global_step": 188759, "epoch": 1123} {"train_loss": -10.599830627441406, "global_step": 188760, "epoch": 1123} {"train_loss": -10.50767707824707, "global_step": 188761, "epoch": 1123} {"train_loss": -11.125665664672852, "global_step": 188762, "epoch": 1123} {"train_loss": -10.686308860778809, "global_step": 188763, "epoch": 1123} {"train_loss": -10.564102172851562, "global_step": 188764, "epoch": 1123} {"train_loss": -11.181964874267578, "global_step": 188765, "epoch": 1123} {"train_loss": -11.029535293579102, "global_step": 188766, "epoch": 1123} {"train_loss": -10.792854309082031, "global_step": 188767, "epoch": 1123} {"train_loss": -10.419130325317383, "global_step": 188768, "epoch": 1123} {"train_loss": -10.918174743652344, "global_step": 188769, "epoch": 1123} {"train_loss": -9.676702499389648, "global_step": 188770, "epoch": 1123} {"train_loss": -11.005037307739258, "global_step": 188771, "epoch": 1123} {"train_loss": -10.345785140991211, "global_step": 188772, "epoch": 1123} {"train_loss": -11.115171432495117, "global_step": 188773, "epoch": 1123} {"train_loss": -10.818317413330078, "global_step": 188774, "epoch": 1123} {"train_loss": -10.817306518554688, "global_step": 188775, "epoch": 1123} {"train_loss": -11.034869194030762, "global_step": 188776, "epoch": 1123} {"train_loss": -10.875192642211914, "global_step": 188777, "epoch": 1123} {"train_loss": -10.521829605102539, "global_step": 188778, "epoch": 1123} {"train_loss": -11.111689567565918, "global_step": 188779, "epoch": 1123} {"train_loss": -10.351778030395508, "global_step": 188780, "epoch": 1123} {"train_loss": -11.088546752929688, "global_step": 188781, "epoch": 1123} {"train_loss": -10.601054191589355, "global_step": 188782, "epoch": 1123} {"train_loss": -11.245566368103027, "global_step": 188783, "epoch": 1123} {"train_loss": -10.724544525146484, "global_step": 188784, "epoch": 1123} {"train_loss": -11.063480377197266, "global_step": 188785, "epoch": 1123} {"train_loss": -10.882816314697266, "global_step": 188786, "epoch": 1123} {"train_loss": -11.209224700927734, "global_step": 188787, "epoch": 1123} {"train_loss": -11.16126823425293, "global_step": 188788, "epoch": 1123} {"train_loss": -11.326828002929688, "global_step": 188789, "epoch": 1123} {"train_loss": -11.283729553222656, "global_step": 188790, "epoch": 1123} {"train_loss": -11.259103775024414, "global_step": 188791, "epoch": 1123} {"train_loss": -10.916106224060059, "global_step": 188792, "epoch": 1123} {"train_loss": -11.493539810180664, "global_step": 188793, "epoch": 1123} {"train_loss": -11.194976806640625, "global_step": 188794, "epoch": 1123} {"train_loss": -11.347917556762695, "global_step": 188795, "epoch": 1123} {"train_loss": -11.021875381469727, "global_step": 188796, "epoch": 1123} {"train_loss": -11.409074783325195, "global_step": 188797, "epoch": 1123} {"train_loss": -11.14913272857666, "global_step": 188798, "epoch": 1123} {"train_loss": -11.374019622802734, "global_step": 188799, "epoch": 1123} {"train_loss": -11.346307754516602, "global_step": 188800, "epoch": 1123} {"train_loss": -11.361221313476562, "global_step": 188801, "epoch": 1123} {"train_loss": -11.124683380126953, "global_step": 188802, "epoch": 1123} {"train_loss": -11.400784492492676, "global_step": 188803, "epoch": 1123} {"train_loss": -11.394072532653809, "global_step": 188804, "epoch": 1123} {"train_loss": -11.240827560424805, "global_step": 188805, "epoch": 1123} {"train_loss": -11.406355857849121, "global_step": 188806, "epoch": 1123} {"train_loss": -11.356385231018066, "global_step": 188807, "epoch": 1123} {"train_loss": -11.524435043334961, "global_step": 188808, "epoch": 1123} {"train_loss": -11.308399200439453, "global_step": 188809, "epoch": 1123} {"train_loss": -11.4127197265625, "global_step": 188810, "epoch": 1123} {"train_loss": -11.513250350952148, "global_step": 188811, "epoch": 1123} {"train_loss": -11.587432861328125, "global_step": 188812, "epoch": 1123} {"train_loss": -11.489953994750977, "global_step": 188813, "epoch": 1123} {"train_loss": -11.527063369750977, "global_step": 188814, "epoch": 1123} {"train_loss": -11.581354141235352, "global_step": 188815, "epoch": 1123} {"train_loss": -11.470549583435059, "global_step": 188816, "epoch": 1123} {"train_loss": -11.720195770263672, "global_step": 188817, "epoch": 1123} {"train_loss": -11.457429885864258, "global_step": 188818, "epoch": 1123} {"train_loss": -11.643108367919922, "global_step": 188819, "epoch": 1123} {"train_loss": -11.580268859863281, "global_step": 188820, "epoch": 1123} {"train_loss": -11.601055145263672, "global_step": 188821, "epoch": 1123} {"train_loss": -11.534244537353516, "global_step": 188822, "epoch": 1123} {"train_loss": -11.572589874267578, "global_step": 188823, "epoch": 1123} {"train_loss": -11.3537015914917, "global_step": 188824, "epoch": 1123} {"train_loss": -11.488163948059082, "global_step": 188825, "epoch": 1123} {"train_loss": -11.525894165039062, "global_step": 188826, "epoch": 1123} {"train_loss": -11.541946411132812, "global_step": 188827, "epoch": 1123} {"train_loss": -11.266091346740723, "global_step": 188828, "epoch": 1123} {"train_loss": -11.556236267089844, "global_step": 188829, "epoch": 1123} {"train_loss": -11.676124572753906, "global_step": 188830, "epoch": 1123} {"train_loss": -11.050183653831482, "global_step": 188831, "epoch": 1123, "val_loss": 245510.9375} {"train_loss": -11.34984016418457, "global_step": 188832, "epoch": 1124} {"train_loss": -11.397911071777344, "global_step": 188833, "epoch": 1124} {"train_loss": -11.400779724121094, "global_step": 188834, "epoch": 1124} {"train_loss": -11.44566535949707, "global_step": 188835, "epoch": 1124} {"train_loss": -11.472814559936523, "global_step": 188836, "epoch": 1124} {"train_loss": -11.532599449157715, "global_step": 188837, "epoch": 1124} {"train_loss": -11.366935729980469, "global_step": 188838, "epoch": 1124} {"train_loss": -11.578434944152832, "global_step": 188839, "epoch": 1124} {"train_loss": -11.571428298950195, "global_step": 188840, "epoch": 1124} {"train_loss": -11.552000045776367, "global_step": 188841, "epoch": 1124} {"train_loss": -11.305010795593262, "global_step": 188842, "epoch": 1124} {"train_loss": -11.167583465576172, "global_step": 188843, "epoch": 1124} {"train_loss": -11.338393211364746, "global_step": 188844, "epoch": 1124} {"train_loss": -11.268861770629883, "global_step": 188845, "epoch": 1124} {"train_loss": -11.10906982421875, "global_step": 188846, "epoch": 1124} {"train_loss": -11.341248512268066, "global_step": 188847, "epoch": 1124} {"train_loss": -11.320476531982422, "global_step": 188848, "epoch": 1124} {"train_loss": -11.548178672790527, "global_step": 188849, "epoch": 1124} {"train_loss": -11.00678539276123, "global_step": 188850, "epoch": 1124} {"train_loss": -11.346612930297852, "global_step": 188851, "epoch": 1124} {"train_loss": -11.15602970123291, "global_step": 188852, "epoch": 1124} {"train_loss": -11.476937294006348, "global_step": 188853, "epoch": 1124} {"train_loss": -10.999658584594727, "global_step": 188854, "epoch": 1124} {"train_loss": -11.528432846069336, "global_step": 188855, "epoch": 1124} {"train_loss": -10.814181327819824, "global_step": 188856, "epoch": 1124} {"train_loss": -11.24172592163086, "global_step": 188857, "epoch": 1124} {"train_loss": -11.450435638427734, "global_step": 188858, "epoch": 1124} {"train_loss": -10.994386672973633, "global_step": 188859, "epoch": 1124} {"train_loss": -10.473999977111816, "global_step": 188860, "epoch": 1124} {"train_loss": -11.169595718383789, "global_step": 188861, "epoch": 1124} {"train_loss": -10.746580123901367, "global_step": 188862, "epoch": 1124} {"train_loss": -11.074994087219238, "global_step": 188863, "epoch": 1124} {"train_loss": -11.17861270904541, "global_step": 188864, "epoch": 1124} {"train_loss": -10.86931037902832, "global_step": 188865, "epoch": 1124} {"train_loss": -11.025497436523438, "global_step": 188866, "epoch": 1124} {"train_loss": -11.457454681396484, "global_step": 188867, "epoch": 1124} {"train_loss": -11.153057098388672, "global_step": 188868, "epoch": 1124} {"train_loss": -11.200920104980469, "global_step": 188869, "epoch": 1124} {"train_loss": -11.521200180053711, "global_step": 188870, "epoch": 1124} {"train_loss": -11.074958801269531, "global_step": 188871, "epoch": 1124} {"train_loss": -11.1820068359375, "global_step": 188872, "epoch": 1124} {"train_loss": -11.300790786743164, "global_step": 188873, "epoch": 1124} {"train_loss": -11.232992172241211, "global_step": 188874, "epoch": 1124} {"train_loss": -11.189613342285156, "global_step": 188875, "epoch": 1124} {"train_loss": -11.360008239746094, "global_step": 188876, "epoch": 1124} {"train_loss": -11.29788589477539, "global_step": 188877, "epoch": 1124} {"train_loss": -11.229656219482422, "global_step": 188878, "epoch": 1124} {"train_loss": -11.298433303833008, "global_step": 188879, "epoch": 1124} {"train_loss": -11.020919799804688, "global_step": 188880, "epoch": 1124} {"train_loss": -11.081583023071289, "global_step": 188881, "epoch": 1124} {"train_loss": -10.828573226928711, "global_step": 188882, "epoch": 1124} {"train_loss": -11.24660873413086, "global_step": 188883, "epoch": 1124} {"train_loss": -11.294210433959961, "global_step": 188884, "epoch": 1124} {"train_loss": -11.40362548828125, "global_step": 188885, "epoch": 1124} {"train_loss": -10.796149253845215, "global_step": 188886, "epoch": 1124} {"train_loss": -11.177267074584961, "global_step": 188887, "epoch": 1124} {"train_loss": -11.083560943603516, "global_step": 188888, "epoch": 1124} {"train_loss": -10.80888843536377, "global_step": 188889, "epoch": 1124} {"train_loss": -11.249231338500977, "global_step": 188890, "epoch": 1124} {"train_loss": -10.196934700012207, "global_step": 188891, "epoch": 1124} {"train_loss": -10.836341857910156, "global_step": 188892, "epoch": 1124} {"train_loss": -11.266698837280273, "global_step": 188893, "epoch": 1124} {"train_loss": -10.58115291595459, "global_step": 188894, "epoch": 1124} {"train_loss": -10.712888717651367, "global_step": 188895, "epoch": 1124} {"train_loss": -9.78569507598877, "global_step": 188896, "epoch": 1124} {"train_loss": -10.236429214477539, "global_step": 188897, "epoch": 1124} {"train_loss": -9.347513198852539, "global_step": 188898, "epoch": 1124} {"train_loss": -11.047280311584473, "global_step": 188899, "epoch": 1124} {"train_loss": -9.905405044555664, "global_step": 188900, "epoch": 1124} {"train_loss": -10.404884338378906, "global_step": 188901, "epoch": 1124} {"train_loss": -10.359968185424805, "global_step": 188902, "epoch": 1124} {"train_loss": -10.850191116333008, "global_step": 188903, "epoch": 1124} {"train_loss": -9.974714279174805, "global_step": 188904, "epoch": 1124} {"train_loss": -10.498054504394531, "global_step": 188905, "epoch": 1124} {"train_loss": -10.175630569458008, "global_step": 188906, "epoch": 1124} {"train_loss": -11.168484687805176, "global_step": 188907, "epoch": 1124} {"train_loss": -9.982223510742188, "global_step": 188908, "epoch": 1124} {"train_loss": -11.06519603729248, "global_step": 188909, "epoch": 1124} {"train_loss": -10.31158447265625, "global_step": 188910, "epoch": 1124} {"train_loss": -10.662900924682617, "global_step": 188911, "epoch": 1124} {"train_loss": -10.800056457519531, "global_step": 188912, "epoch": 1124} {"train_loss": -10.70972728729248, "global_step": 188913, "epoch": 1124} {"train_loss": -10.869607925415039, "global_step": 188914, "epoch": 1124} {"train_loss": -10.169623374938965, "global_step": 188915, "epoch": 1124} {"train_loss": -10.976869583129883, "global_step": 188916, "epoch": 1124} {"train_loss": -10.349912643432617, "global_step": 188917, "epoch": 1124} {"train_loss": -11.313237190246582, "global_step": 188918, "epoch": 1124} {"train_loss": -10.555541038513184, "global_step": 188919, "epoch": 1124} {"train_loss": -10.728076934814453, "global_step": 188920, "epoch": 1124} {"train_loss": -10.699520111083984, "global_step": 188921, "epoch": 1124} {"train_loss": -10.519901275634766, "global_step": 188922, "epoch": 1124} {"train_loss": -11.192103385925293, "global_step": 188923, "epoch": 1124} {"train_loss": -10.732693672180176, "global_step": 188924, "epoch": 1124} {"train_loss": -11.230327606201172, "global_step": 188925, "epoch": 1124} {"train_loss": -11.045798301696777, "global_step": 188926, "epoch": 1124} {"train_loss": -11.221755981445312, "global_step": 188927, "epoch": 1124} {"train_loss": -11.05141830444336, "global_step": 188928, "epoch": 1124} {"train_loss": -11.093899726867676, "global_step": 188929, "epoch": 1124} {"train_loss": -11.155729293823242, "global_step": 188930, "epoch": 1124} {"train_loss": -10.956306457519531, "global_step": 188931, "epoch": 1124} {"train_loss": -11.17515754699707, "global_step": 188932, "epoch": 1124} {"train_loss": -11.190921783447266, "global_step": 188933, "epoch": 1124} {"train_loss": -11.113431930541992, "global_step": 188934, "epoch": 1124} {"train_loss": -11.127104759216309, "global_step": 188935, "epoch": 1124} {"train_loss": -10.861520767211914, "global_step": 188936, "epoch": 1124} {"train_loss": -11.310237884521484, "global_step": 188937, "epoch": 1124} {"train_loss": -11.10846996307373, "global_step": 188938, "epoch": 1124} {"train_loss": -11.308328628540039, "global_step": 188939, "epoch": 1124} {"train_loss": -11.311363220214844, "global_step": 188940, "epoch": 1124} {"train_loss": -11.173158645629883, "global_step": 188941, "epoch": 1124} {"train_loss": -11.111663818359375, "global_step": 188942, "epoch": 1124} {"train_loss": -11.351110458374023, "global_step": 188943, "epoch": 1124} {"train_loss": -11.376409530639648, "global_step": 188944, "epoch": 1124} {"train_loss": -11.559948921203613, "global_step": 188945, "epoch": 1124} {"train_loss": -11.426826477050781, "global_step": 188946, "epoch": 1124} {"train_loss": -11.36842155456543, "global_step": 188947, "epoch": 1124} {"train_loss": -11.54401969909668, "global_step": 188948, "epoch": 1124} {"train_loss": -11.380958557128906, "global_step": 188949, "epoch": 1124} {"train_loss": -11.535638809204102, "global_step": 188950, "epoch": 1124} {"train_loss": -11.472586631774902, "global_step": 188951, "epoch": 1124} {"train_loss": -11.388287544250488, "global_step": 188952, "epoch": 1124} {"train_loss": -11.329858779907227, "global_step": 188953, "epoch": 1124} {"train_loss": -11.579731941223145, "global_step": 188954, "epoch": 1124} {"train_loss": -11.588151931762695, "global_step": 188955, "epoch": 1124} {"train_loss": -11.593194961547852, "global_step": 188956, "epoch": 1124} {"train_loss": -11.548238754272461, "global_step": 188957, "epoch": 1124} {"train_loss": -11.427377700805664, "global_step": 188958, "epoch": 1124} {"train_loss": -11.641135215759277, "global_step": 188959, "epoch": 1124} {"train_loss": -11.274209022521973, "global_step": 188960, "epoch": 1124} {"train_loss": -11.283456802368164, "global_step": 188961, "epoch": 1124} {"train_loss": -11.289687156677246, "global_step": 188962, "epoch": 1124} {"train_loss": -11.134675025939941, "global_step": 188963, "epoch": 1124} {"train_loss": -11.293082237243652, "global_step": 188964, "epoch": 1124} {"train_loss": -10.896276473999023, "global_step": 188965, "epoch": 1124} {"train_loss": -11.602418899536133, "global_step": 188966, "epoch": 1124} {"train_loss": -11.186795234680176, "global_step": 188967, "epoch": 1124} {"train_loss": -10.523643493652344, "global_step": 188968, "epoch": 1124} {"train_loss": -10.272724151611328, "global_step": 188969, "epoch": 1124} {"train_loss": -11.325973510742188, "global_step": 188970, "epoch": 1124} {"train_loss": -10.143415451049805, "global_step": 188971, "epoch": 1124} {"train_loss": -11.598001480102539, "global_step": 188972, "epoch": 1124} {"train_loss": -10.559492111206055, "global_step": 188973, "epoch": 1124} {"train_loss": -10.592164993286133, "global_step": 188974, "epoch": 1124} {"train_loss": -10.995975494384766, "global_step": 188975, "epoch": 1124} {"train_loss": -10.556318283081055, "global_step": 188976, "epoch": 1124} {"train_loss": -10.605369567871094, "global_step": 188977, "epoch": 1124} {"train_loss": -11.044759750366211, "global_step": 188978, "epoch": 1124} {"train_loss": -10.200643539428711, "global_step": 188979, "epoch": 1124} {"train_loss": -10.736717224121094, "global_step": 188980, "epoch": 1124} {"train_loss": -10.354619979858398, "global_step": 188981, "epoch": 1124} {"train_loss": -10.023951530456543, "global_step": 188982, "epoch": 1124} {"train_loss": -10.476651191711426, "global_step": 188983, "epoch": 1124} {"train_loss": -9.115015029907227, "global_step": 188984, "epoch": 1124} {"train_loss": -8.664077758789062, "global_step": 188985, "epoch": 1124} {"train_loss": -9.92291259765625, "global_step": 188986, "epoch": 1124} {"train_loss": -10.05157470703125, "global_step": 188987, "epoch": 1124} {"train_loss": -8.807876586914062, "global_step": 188988, "epoch": 1124} {"train_loss": -10.408689498901367, "global_step": 188989, "epoch": 1124} {"train_loss": -9.973737716674805, "global_step": 188990, "epoch": 1124} {"train_loss": -9.95988655090332, "global_step": 188991, "epoch": 1124} {"train_loss": -10.130163192749023, "global_step": 188992, "epoch": 1124} {"train_loss": -9.667966842651367, "global_step": 188993, "epoch": 1124} {"train_loss": -8.73405647277832, "global_step": 188994, "epoch": 1124} {"train_loss": -8.282487869262695, "global_step": 188995, "epoch": 1124} {"train_loss": -10.519437789916992, "global_step": 188996, "epoch": 1124} {"train_loss": -9.709630966186523, "global_step": 188997, "epoch": 1124} {"train_loss": -8.896750450134277, "global_step": 188998, "epoch": 1124} {"train_loss": -10.889030195417858, "global_step": 188999, "epoch": 1124, "val_loss": 236164.53125} {"train_loss": -10.239779472351074, "global_step": 189000, "epoch": 1125} {"train_loss": -10.103166580200195, "global_step": 189001, "epoch": 1125} {"train_loss": -10.025809288024902, "global_step": 189002, "epoch": 1125} {"train_loss": -10.870431900024414, "global_step": 189003, "epoch": 1125} {"train_loss": -10.434282302856445, "global_step": 189004, "epoch": 1125} {"train_loss": -10.366887092590332, "global_step": 189005, "epoch": 1125} {"train_loss": -10.659143447875977, "global_step": 189006, "epoch": 1125} {"train_loss": -10.664514541625977, "global_step": 189007, "epoch": 1125} {"train_loss": -10.392216682434082, "global_step": 189008, "epoch": 1125} {"train_loss": -10.326276779174805, "global_step": 189009, "epoch": 1125} {"train_loss": -10.771169662475586, "global_step": 189010, "epoch": 1125} {"train_loss": -10.635004997253418, "global_step": 189011, "epoch": 1125} {"train_loss": -10.706378936767578, "global_step": 189012, "epoch": 1125} {"train_loss": -11.057902336120605, "global_step": 189013, "epoch": 1125} {"train_loss": -10.507834434509277, "global_step": 189014, "epoch": 1125} {"train_loss": -10.328434944152832, "global_step": 189015, "epoch": 1125} {"train_loss": -10.97452163696289, "global_step": 189016, "epoch": 1125} {"train_loss": -10.858104705810547, "global_step": 189017, "epoch": 1125} {"train_loss": -10.928693771362305, "global_step": 189018, "epoch": 1125} {"train_loss": -10.779932022094727, "global_step": 189019, "epoch": 1125} {"train_loss": -10.969499588012695, "global_step": 189020, "epoch": 1125} {"train_loss": -11.19001579284668, "global_step": 189021, "epoch": 1125} {"train_loss": -10.83875846862793, "global_step": 189022, "epoch": 1125} {"train_loss": -11.001541137695312, "global_step": 189023, "epoch": 1125} {"train_loss": -10.980676651000977, "global_step": 189024, "epoch": 1125} {"train_loss": -11.087076187133789, "global_step": 189025, "epoch": 1125} {"train_loss": -10.779821395874023, "global_step": 189026, "epoch": 1125} {"train_loss": -11.122617721557617, "global_step": 189027, "epoch": 1125} {"train_loss": -11.02896785736084, "global_step": 189028, "epoch": 1125} {"train_loss": -11.22356128692627, "global_step": 189029, "epoch": 1125} {"train_loss": -11.216474533081055, "global_step": 189030, "epoch": 1125} {"train_loss": -11.096725463867188, "global_step": 189031, "epoch": 1125} {"train_loss": -11.332412719726562, "global_step": 189032, "epoch": 1125} {"train_loss": -11.088777542114258, "global_step": 189033, "epoch": 1125} {"train_loss": -11.18662166595459, "global_step": 189034, "epoch": 1125} {"train_loss": -11.21766471862793, "global_step": 189035, "epoch": 1125} {"train_loss": -11.128353118896484, "global_step": 189036, "epoch": 1125} {"train_loss": -11.363863945007324, "global_step": 189037, "epoch": 1125} {"train_loss": -11.393068313598633, "global_step": 189038, "epoch": 1125} {"train_loss": -11.173850059509277, "global_step": 189039, "epoch": 1125} {"train_loss": -11.438394546508789, "global_step": 189040, "epoch": 1125} {"train_loss": -11.439995765686035, "global_step": 189041, "epoch": 1125} {"train_loss": -11.425976753234863, "global_step": 189042, "epoch": 1125} {"train_loss": -11.521025657653809, "global_step": 189043, "epoch": 1125} {"train_loss": -11.331602096557617, "global_step": 189044, "epoch": 1125} {"train_loss": -11.310869216918945, "global_step": 189045, "epoch": 1125} {"train_loss": -11.560440063476562, "global_step": 189046, "epoch": 1125} {"train_loss": -11.461316108703613, "global_step": 189047, "epoch": 1125} {"train_loss": -11.446085929870605, "global_step": 189048, "epoch": 1125} {"train_loss": -11.479555130004883, "global_step": 189049, "epoch": 1125} {"train_loss": -11.469758987426758, "global_step": 189050, "epoch": 1125} {"train_loss": -11.421536445617676, "global_step": 189051, "epoch": 1125} {"train_loss": -11.566255569458008, "global_step": 189052, "epoch": 1125} {"train_loss": -11.30706787109375, "global_step": 189053, "epoch": 1125} {"train_loss": -11.467479705810547, "global_step": 189054, "epoch": 1125} {"train_loss": -11.740367889404297, "global_step": 189055, "epoch": 1125} {"train_loss": -11.595178604125977, "global_step": 189056, "epoch": 1125} {"train_loss": -11.544746398925781, "global_step": 189057, "epoch": 1125} {"train_loss": -11.414721488952637, "global_step": 189058, "epoch": 1125} {"train_loss": -11.563032150268555, "global_step": 189059, "epoch": 1125} {"train_loss": -11.719846725463867, "global_step": 189060, "epoch": 1125} {"train_loss": -11.527976989746094, "global_step": 189061, "epoch": 1125} {"train_loss": -11.556621551513672, "global_step": 189062, "epoch": 1125} {"train_loss": -11.541418075561523, "global_step": 189063, "epoch": 1125} {"train_loss": -11.345155715942383, "global_step": 189064, "epoch": 1125} {"train_loss": -11.490008354187012, "global_step": 189065, "epoch": 1125} {"train_loss": -11.690410614013672, "global_step": 189066, "epoch": 1125} {"train_loss": -11.62031078338623, "global_step": 189067, "epoch": 1125} {"train_loss": -11.456531524658203, "global_step": 189068, "epoch": 1125} {"train_loss": -11.482160568237305, "global_step": 189069, "epoch": 1125} {"train_loss": -11.222677230834961, "global_step": 189070, "epoch": 1125} {"train_loss": -11.094768524169922, "global_step": 189071, "epoch": 1125} {"train_loss": -11.722366333007812, "global_step": 189072, "epoch": 1125} {"train_loss": -10.594165802001953, "global_step": 189073, "epoch": 1125} {"train_loss": -10.815618515014648, "global_step": 189074, "epoch": 1125} {"train_loss": -10.868223190307617, "global_step": 189075, "epoch": 1125} {"train_loss": -10.497123718261719, "global_step": 189076, "epoch": 1125} {"train_loss": -10.822053909301758, "global_step": 189077, "epoch": 1125} {"train_loss": -11.109975814819336, "global_step": 189078, "epoch": 1125} {"train_loss": -9.95816421508789, "global_step": 189079, "epoch": 1125} {"train_loss": -9.703386306762695, "global_step": 189080, "epoch": 1125} {"train_loss": -10.111624717712402, "global_step": 189081, "epoch": 1125} {"train_loss": -10.925252914428711, "global_step": 189082, "epoch": 1125} {"train_loss": -9.37578010559082, "global_step": 189083, "epoch": 1125} {"train_loss": -10.757513999938965, "global_step": 189084, "epoch": 1125} {"train_loss": -9.892745971679688, "global_step": 189085, "epoch": 1125} {"train_loss": -10.79029369354248, "global_step": 189086, "epoch": 1125} {"train_loss": -10.113264083862305, "global_step": 189087, "epoch": 1125} {"train_loss": -9.488377571105957, "global_step": 189088, "epoch": 1125} {"train_loss": -10.655508041381836, "global_step": 189089, "epoch": 1125} {"train_loss": -10.0035400390625, "global_step": 189090, "epoch": 1125} {"train_loss": -9.984403610229492, "global_step": 189091, "epoch": 1125} {"train_loss": -10.475540161132812, "global_step": 189092, "epoch": 1125} {"train_loss": -9.339197158813477, "global_step": 189093, "epoch": 1125} {"train_loss": -10.424360275268555, "global_step": 189094, "epoch": 1125} {"train_loss": -9.538789749145508, "global_step": 189095, "epoch": 1125} {"train_loss": -9.479133605957031, "global_step": 189096, "epoch": 1125} {"train_loss": -10.388571739196777, "global_step": 189097, "epoch": 1125} {"train_loss": -9.308775901794434, "global_step": 189098, "epoch": 1125} {"train_loss": -10.05497932434082, "global_step": 189099, "epoch": 1125} {"train_loss": -10.162708282470703, "global_step": 189100, "epoch": 1125} {"train_loss": -9.573472023010254, "global_step": 189101, "epoch": 1125} {"train_loss": -9.175948143005371, "global_step": 189102, "epoch": 1125} {"train_loss": -10.673288345336914, "global_step": 189103, "epoch": 1125} {"train_loss": -9.853796005249023, "global_step": 189104, "epoch": 1125} {"train_loss": -10.140026092529297, "global_step": 189105, "epoch": 1125} {"train_loss": -10.795295715332031, "global_step": 189106, "epoch": 1125} {"train_loss": -10.145999908447266, "global_step": 189107, "epoch": 1125} {"train_loss": -10.430685997009277, "global_step": 189108, "epoch": 1125} {"train_loss": -10.407249450683594, "global_step": 189109, "epoch": 1125} {"train_loss": -10.628708839416504, "global_step": 189110, "epoch": 1125} {"train_loss": -10.337199211120605, "global_step": 189111, "epoch": 1125} {"train_loss": -10.420783996582031, "global_step": 189112, "epoch": 1125} {"train_loss": -10.746978759765625, "global_step": 189113, "epoch": 1125} {"train_loss": -10.440916061401367, "global_step": 189114, "epoch": 1125} {"train_loss": -10.550422668457031, "global_step": 189115, "epoch": 1125} {"train_loss": -10.866196632385254, "global_step": 189116, "epoch": 1125} {"train_loss": -10.701491355895996, "global_step": 189117, "epoch": 1125} {"train_loss": -10.34715747833252, "global_step": 189118, "epoch": 1125} {"train_loss": -11.047611236572266, "global_step": 189119, "epoch": 1125} {"train_loss": -10.950713157653809, "global_step": 189120, "epoch": 1125} {"train_loss": -10.801921844482422, "global_step": 189121, "epoch": 1125} {"train_loss": -10.686788558959961, "global_step": 189122, "epoch": 1125} {"train_loss": -10.99848747253418, "global_step": 189123, "epoch": 1125} {"train_loss": -10.920403480529785, "global_step": 189124, "epoch": 1125} {"train_loss": -11.015426635742188, "global_step": 189125, "epoch": 1125} {"train_loss": -10.921266555786133, "global_step": 189126, "epoch": 1125} {"train_loss": -11.204267501831055, "global_step": 189127, "epoch": 1125} {"train_loss": -10.814949989318848, "global_step": 189128, "epoch": 1125} {"train_loss": -11.068857192993164, "global_step": 189129, "epoch": 1125} {"train_loss": -11.140806198120117, "global_step": 189130, "epoch": 1125} {"train_loss": -10.770038604736328, "global_step": 189131, "epoch": 1125} {"train_loss": -11.141014099121094, "global_step": 189132, "epoch": 1125} {"train_loss": -11.213264465332031, "global_step": 189133, "epoch": 1125} {"train_loss": -11.132576942443848, "global_step": 189134, "epoch": 1125} {"train_loss": -11.084821701049805, "global_step": 189135, "epoch": 1125} {"train_loss": -11.327564239501953, "global_step": 189136, "epoch": 1125} {"train_loss": -11.004631996154785, "global_step": 189137, "epoch": 1125} {"train_loss": -11.154376983642578, "global_step": 189138, "epoch": 1125} {"train_loss": -11.217506408691406, "global_step": 189139, "epoch": 1125} {"train_loss": -11.25013542175293, "global_step": 189140, "epoch": 1125} {"train_loss": -11.192307472229004, "global_step": 189141, "epoch": 1125} {"train_loss": -11.242140769958496, "global_step": 189142, "epoch": 1125} {"train_loss": -11.201184272766113, "global_step": 189143, "epoch": 1125} {"train_loss": -11.222537994384766, "global_step": 189144, "epoch": 1125} {"train_loss": -11.444380760192871, "global_step": 189145, "epoch": 1125} {"train_loss": -11.12382698059082, "global_step": 189146, "epoch": 1125} {"train_loss": -11.14605712890625, "global_step": 189147, "epoch": 1125} {"train_loss": -11.326156616210938, "global_step": 189148, "epoch": 1125} {"train_loss": -11.03316879272461, "global_step": 189149, "epoch": 1125} {"train_loss": -11.40339469909668, "global_step": 189150, "epoch": 1125} {"train_loss": -11.132413864135742, "global_step": 189151, "epoch": 1125} {"train_loss": -11.166171073913574, "global_step": 189152, "epoch": 1125} {"train_loss": -11.289704322814941, "global_step": 189153, "epoch": 1125} {"train_loss": -11.194486618041992, "global_step": 189154, "epoch": 1125} {"train_loss": -11.417808532714844, "global_step": 189155, "epoch": 1125} {"train_loss": -11.383479118347168, "global_step": 189156, "epoch": 1125} {"train_loss": -11.161053657531738, "global_step": 189157, "epoch": 1125} {"train_loss": -11.235857009887695, "global_step": 189158, "epoch": 1125} {"train_loss": -10.628824234008789, "global_step": 189159, "epoch": 1125} {"train_loss": -11.238754272460938, "global_step": 189160, "epoch": 1125} {"train_loss": -10.576606750488281, "global_step": 189161, "epoch": 1125} {"train_loss": -11.278249740600586, "global_step": 189162, "epoch": 1125} {"train_loss": -10.986061096191406, "global_step": 189163, "epoch": 1125} {"train_loss": -10.963827133178711, "global_step": 189164, "epoch": 1125} {"train_loss": -11.029739379882812, "global_step": 189165, "epoch": 1125} {"train_loss": -10.890819549560547, "global_step": 189166, "epoch": 1125} {"train_loss": -10.88572701386043, "global_step": 189167, "epoch": 1125, "val_loss": 243087.203125, "train_action_mse_error": 2.010226011276245} {"train_loss": -11.135480880737305, "global_step": 189168, "epoch": 1126} {"train_loss": -11.071300506591797, "global_step": 189169, "epoch": 1126} {"train_loss": -11.440559387207031, "global_step": 189170, "epoch": 1126} {"train_loss": -11.104904174804688, "global_step": 189171, "epoch": 1126} {"train_loss": -11.234725952148438, "global_step": 189172, "epoch": 1126} {"train_loss": -11.323861122131348, "global_step": 189173, "epoch": 1126} {"train_loss": -11.46107292175293, "global_step": 189174, "epoch": 1126} {"train_loss": -11.385700225830078, "global_step": 189175, "epoch": 1126} {"train_loss": -11.479244232177734, "global_step": 189176, "epoch": 1126} {"train_loss": -11.292752265930176, "global_step": 189177, "epoch": 1126} {"train_loss": -11.361169815063477, "global_step": 189178, "epoch": 1126} {"train_loss": -11.570566177368164, "global_step": 189179, "epoch": 1126} {"train_loss": -11.536151885986328, "global_step": 189180, "epoch": 1126} {"train_loss": -11.608470916748047, "global_step": 189181, "epoch": 1126} {"train_loss": -11.316291809082031, "global_step": 189182, "epoch": 1126} {"train_loss": -11.587278366088867, "global_step": 189183, "epoch": 1126} {"train_loss": -11.428910255432129, "global_step": 189184, "epoch": 1126} {"train_loss": -11.678731918334961, "global_step": 189185, "epoch": 1126} {"train_loss": -11.367242813110352, "global_step": 189186, "epoch": 1126} {"train_loss": -11.460834503173828, "global_step": 189187, "epoch": 1126} {"train_loss": -11.535144805908203, "global_step": 189188, "epoch": 1126} {"train_loss": -11.661086082458496, "global_step": 189189, "epoch": 1126} {"train_loss": -11.357076644897461, "global_step": 189190, "epoch": 1126} {"train_loss": -11.53718376159668, "global_step": 189191, "epoch": 1126} {"train_loss": -11.499317169189453, "global_step": 189192, "epoch": 1126} {"train_loss": -11.653894424438477, "global_step": 189193, "epoch": 1126} {"train_loss": -11.273941040039062, "global_step": 189194, "epoch": 1126} {"train_loss": -11.545284271240234, "global_step": 189195, "epoch": 1126} {"train_loss": -11.319221496582031, "global_step": 189196, "epoch": 1126} {"train_loss": -11.467273712158203, "global_step": 189197, "epoch": 1126} {"train_loss": -11.279776573181152, "global_step": 189198, "epoch": 1126} {"train_loss": -11.567222595214844, "global_step": 189199, "epoch": 1126} {"train_loss": -11.397903442382812, "global_step": 189200, "epoch": 1126} {"train_loss": -11.479275703430176, "global_step": 189201, "epoch": 1126} {"train_loss": -11.197537422180176, "global_step": 189202, "epoch": 1126} {"train_loss": -10.921440124511719, "global_step": 189203, "epoch": 1126} {"train_loss": -11.523643493652344, "global_step": 189204, "epoch": 1126} {"train_loss": -11.444765090942383, "global_step": 189205, "epoch": 1126} {"train_loss": -11.185998916625977, "global_step": 189206, "epoch": 1126} {"train_loss": -11.521818161010742, "global_step": 189207, "epoch": 1126} {"train_loss": -11.574016571044922, "global_step": 189208, "epoch": 1126} {"train_loss": -11.571792602539062, "global_step": 189209, "epoch": 1126} {"train_loss": -11.591140747070312, "global_step": 189210, "epoch": 1126} {"train_loss": -11.393255233764648, "global_step": 189211, "epoch": 1126} {"train_loss": -11.171356201171875, "global_step": 189212, "epoch": 1126} {"train_loss": -11.664229393005371, "global_step": 189213, "epoch": 1126} {"train_loss": -11.12067985534668, "global_step": 189214, "epoch": 1126} {"train_loss": -10.746895790100098, "global_step": 189215, "epoch": 1126} {"train_loss": -11.258224487304688, "global_step": 189216, "epoch": 1126} {"train_loss": -11.112726211547852, "global_step": 189217, "epoch": 1126} {"train_loss": -10.736127853393555, "global_step": 189218, "epoch": 1126} {"train_loss": -11.347457885742188, "global_step": 189219, "epoch": 1126} {"train_loss": -11.328573226928711, "global_step": 189220, "epoch": 1126} {"train_loss": -10.57082748413086, "global_step": 189221, "epoch": 1126} {"train_loss": -11.169235229492188, "global_step": 189222, "epoch": 1126} {"train_loss": -11.285161972045898, "global_step": 189223, "epoch": 1126} {"train_loss": -11.177237510681152, "global_step": 189224, "epoch": 1126} {"train_loss": -11.051136016845703, "global_step": 189225, "epoch": 1126} {"train_loss": -11.541715621948242, "global_step": 189226, "epoch": 1126} {"train_loss": -11.307247161865234, "global_step": 189227, "epoch": 1126} {"train_loss": -11.339153289794922, "global_step": 189228, "epoch": 1126} {"train_loss": -11.12374496459961, "global_step": 189229, "epoch": 1126} {"train_loss": -11.637269973754883, "global_step": 189230, "epoch": 1126} {"train_loss": -11.378473281860352, "global_step": 189231, "epoch": 1126} {"train_loss": -11.52102279663086, "global_step": 189232, "epoch": 1126} {"train_loss": -11.275768280029297, "global_step": 189233, "epoch": 1126} {"train_loss": -11.132329940795898, "global_step": 189234, "epoch": 1126} {"train_loss": -11.462313652038574, "global_step": 189235, "epoch": 1126} {"train_loss": -11.035611152648926, "global_step": 189236, "epoch": 1126} {"train_loss": -11.172149658203125, "global_step": 189237, "epoch": 1126} {"train_loss": -11.428996086120605, "global_step": 189238, "epoch": 1126} {"train_loss": -11.10675048828125, "global_step": 189239, "epoch": 1126} {"train_loss": -11.144731521606445, "global_step": 189240, "epoch": 1126} {"train_loss": -11.038393020629883, "global_step": 189241, "epoch": 1126} {"train_loss": -10.868697166442871, "global_step": 189242, "epoch": 1126} {"train_loss": -11.02859115600586, "global_step": 189243, "epoch": 1126} {"train_loss": -11.28341293334961, "global_step": 189244, "epoch": 1126} {"train_loss": -11.023591995239258, "global_step": 189245, "epoch": 1126} {"train_loss": -11.210156440734863, "global_step": 189246, "epoch": 1126} {"train_loss": -11.178778648376465, "global_step": 189247, "epoch": 1126} {"train_loss": -10.833894729614258, "global_step": 189248, "epoch": 1126} {"train_loss": -11.447100639343262, "global_step": 189249, "epoch": 1126} {"train_loss": -11.05959701538086, "global_step": 189250, "epoch": 1126} {"train_loss": -11.266901016235352, "global_step": 189251, "epoch": 1126} {"train_loss": -11.27725601196289, "global_step": 189252, "epoch": 1126} {"train_loss": -10.798322677612305, "global_step": 189253, "epoch": 1126} {"train_loss": -11.317802429199219, "global_step": 189254, "epoch": 1126} {"train_loss": -11.229866027832031, "global_step": 189255, "epoch": 1126} {"train_loss": -11.047130584716797, "global_step": 189256, "epoch": 1126} {"train_loss": -11.376005172729492, "global_step": 189257, "epoch": 1126} {"train_loss": -11.0216064453125, "global_step": 189258, "epoch": 1126} {"train_loss": -11.594206809997559, "global_step": 189259, "epoch": 1126} {"train_loss": -10.992443084716797, "global_step": 189260, "epoch": 1126} {"train_loss": -11.138386726379395, "global_step": 189261, "epoch": 1126} {"train_loss": -11.574169158935547, "global_step": 189262, "epoch": 1126} {"train_loss": -11.154091835021973, "global_step": 189263, "epoch": 1126} {"train_loss": -11.05792236328125, "global_step": 189264, "epoch": 1126} {"train_loss": -11.015912055969238, "global_step": 189265, "epoch": 1126} {"train_loss": -11.218208312988281, "global_step": 189266, "epoch": 1126} {"train_loss": -10.907211303710938, "global_step": 189267, "epoch": 1126} {"train_loss": -10.800048828125, "global_step": 189268, "epoch": 1126} {"train_loss": -11.333032608032227, "global_step": 189269, "epoch": 1126} {"train_loss": -10.8817138671875, "global_step": 189270, "epoch": 1126} {"train_loss": -11.010580062866211, "global_step": 189271, "epoch": 1126} {"train_loss": -11.085287094116211, "global_step": 189272, "epoch": 1126} {"train_loss": -11.117820739746094, "global_step": 189273, "epoch": 1126} {"train_loss": -11.18459701538086, "global_step": 189274, "epoch": 1126} {"train_loss": -10.8287353515625, "global_step": 189275, "epoch": 1126} {"train_loss": -11.136021614074707, "global_step": 189276, "epoch": 1126} {"train_loss": -10.979339599609375, "global_step": 189277, "epoch": 1126} {"train_loss": -11.40970230102539, "global_step": 189278, "epoch": 1126} {"train_loss": -10.681055068969727, "global_step": 189279, "epoch": 1126} {"train_loss": -11.430922508239746, "global_step": 189280, "epoch": 1126} {"train_loss": -11.134048461914062, "global_step": 189281, "epoch": 1126} {"train_loss": -11.092424392700195, "global_step": 189282, "epoch": 1126} {"train_loss": -11.145170211791992, "global_step": 189283, "epoch": 1126} {"train_loss": -10.824915885925293, "global_step": 189284, "epoch": 1126} {"train_loss": -11.320508003234863, "global_step": 189285, "epoch": 1126} {"train_loss": -11.004261016845703, "global_step": 189286, "epoch": 1126} {"train_loss": -11.125975608825684, "global_step": 189287, "epoch": 1126} {"train_loss": -11.069377899169922, "global_step": 189288, "epoch": 1126} {"train_loss": -11.585346221923828, "global_step": 189289, "epoch": 1126} {"train_loss": -10.757599830627441, "global_step": 189290, "epoch": 1126} {"train_loss": -11.129193305969238, "global_step": 189291, "epoch": 1126} {"train_loss": -10.71412467956543, "global_step": 189292, "epoch": 1126} {"train_loss": -10.576590538024902, "global_step": 189293, "epoch": 1126} {"train_loss": -10.770849227905273, "global_step": 189294, "epoch": 1126} {"train_loss": -10.797345161437988, "global_step": 189295, "epoch": 1126} {"train_loss": -10.792688369750977, "global_step": 189296, "epoch": 1126} {"train_loss": -10.65250301361084, "global_step": 189297, "epoch": 1126} {"train_loss": -11.003910064697266, "global_step": 189298, "epoch": 1126} {"train_loss": -10.64948844909668, "global_step": 189299, "epoch": 1126} {"train_loss": -11.156033515930176, "global_step": 189300, "epoch": 1126} {"train_loss": -10.813074111938477, "global_step": 189301, "epoch": 1126} {"train_loss": -10.972478866577148, "global_step": 189302, "epoch": 1126} {"train_loss": -10.762703895568848, "global_step": 189303, "epoch": 1126} {"train_loss": -10.568706512451172, "global_step": 189304, "epoch": 1126} {"train_loss": -10.856176376342773, "global_step": 189305, "epoch": 1126} {"train_loss": -10.544041633605957, "global_step": 189306, "epoch": 1126} {"train_loss": -10.692017555236816, "global_step": 189307, "epoch": 1126} {"train_loss": -11.166247367858887, "global_step": 189308, "epoch": 1126} {"train_loss": -10.687191009521484, "global_step": 189309, "epoch": 1126} {"train_loss": -11.203821182250977, "global_step": 189310, "epoch": 1126} {"train_loss": -10.987628936767578, "global_step": 189311, "epoch": 1126} {"train_loss": -11.206792831420898, "global_step": 189312, "epoch": 1126} {"train_loss": -10.816598892211914, "global_step": 189313, "epoch": 1126} {"train_loss": -11.075640678405762, "global_step": 189314, "epoch": 1126} {"train_loss": -11.401923179626465, "global_step": 189315, "epoch": 1126} {"train_loss": -11.050758361816406, "global_step": 189316, "epoch": 1126} {"train_loss": -11.167500495910645, "global_step": 189317, "epoch": 1126} {"train_loss": -11.198066711425781, "global_step": 189318, "epoch": 1126} {"train_loss": -11.251501083374023, "global_step": 189319, "epoch": 1126} {"train_loss": -11.338716506958008, "global_step": 189320, "epoch": 1126} {"train_loss": -11.184768676757812, "global_step": 189321, "epoch": 1126} {"train_loss": -11.187981605529785, "global_step": 189322, "epoch": 1126} {"train_loss": -11.235093116760254, "global_step": 189323, "epoch": 1126} {"train_loss": -11.219621658325195, "global_step": 189324, "epoch": 1126} {"train_loss": -11.112787246704102, "global_step": 189325, "epoch": 1126} {"train_loss": -11.07309627532959, "global_step": 189326, "epoch": 1126} {"train_loss": -11.182544708251953, "global_step": 189327, "epoch": 1126} {"train_loss": -11.524548530578613, "global_step": 189328, "epoch": 1126} {"train_loss": -10.78499984741211, "global_step": 189329, "epoch": 1126} {"train_loss": -10.926053047180176, "global_step": 189330, "epoch": 1126} {"train_loss": -10.970640182495117, "global_step": 189331, "epoch": 1126} {"train_loss": -10.927417755126953, "global_step": 189332, "epoch": 1126} {"train_loss": -11.000261306762695, "global_step": 189333, "epoch": 1126} {"train_loss": -11.145586013793945, "global_step": 189334, "epoch": 1126} {"train_loss": -11.180556768462772, "global_step": 189335, "epoch": 1126, "val_loss": 242415.53125} {"train_loss": -11.047884941101074, "global_step": 189336, "epoch": 1127} {"train_loss": -10.942028045654297, "global_step": 189337, "epoch": 1127} {"train_loss": -11.384449005126953, "global_step": 189338, "epoch": 1127} {"train_loss": -11.224720001220703, "global_step": 189339, "epoch": 1127} {"train_loss": -11.065098762512207, "global_step": 189340, "epoch": 1127} {"train_loss": -11.34898567199707, "global_step": 189341, "epoch": 1127} {"train_loss": -11.149978637695312, "global_step": 189342, "epoch": 1127} {"train_loss": -11.532089233398438, "global_step": 189343, "epoch": 1127} {"train_loss": -11.244361877441406, "global_step": 189344, "epoch": 1127} {"train_loss": -11.428979873657227, "global_step": 189345, "epoch": 1127} {"train_loss": -11.315749168395996, "global_step": 189346, "epoch": 1127} {"train_loss": -11.043861389160156, "global_step": 189347, "epoch": 1127} {"train_loss": -11.468402862548828, "global_step": 189348, "epoch": 1127} {"train_loss": -11.205693244934082, "global_step": 189349, "epoch": 1127} {"train_loss": -11.278995513916016, "global_step": 189350, "epoch": 1127} {"train_loss": -11.36652946472168, "global_step": 189351, "epoch": 1127} {"train_loss": -11.501202583312988, "global_step": 189352, "epoch": 1127} {"train_loss": -11.380115509033203, "global_step": 189353, "epoch": 1127} {"train_loss": -11.738143920898438, "global_step": 189354, "epoch": 1127} {"train_loss": -11.269329071044922, "global_step": 189355, "epoch": 1127} {"train_loss": -11.59454345703125, "global_step": 189356, "epoch": 1127} {"train_loss": -11.453882217407227, "global_step": 189357, "epoch": 1127} {"train_loss": -11.139476776123047, "global_step": 189358, "epoch": 1127} {"train_loss": -11.264470100402832, "global_step": 189359, "epoch": 1127} {"train_loss": -11.12879467010498, "global_step": 189360, "epoch": 1127} {"train_loss": -11.016301155090332, "global_step": 189361, "epoch": 1127} {"train_loss": -11.582452774047852, "global_step": 189362, "epoch": 1127} {"train_loss": -11.2223539352417, "global_step": 189363, "epoch": 1127} {"train_loss": -11.081235885620117, "global_step": 189364, "epoch": 1127} {"train_loss": -10.958409309387207, "global_step": 189365, "epoch": 1127} {"train_loss": -11.243257522583008, "global_step": 189366, "epoch": 1127} {"train_loss": -11.33013916015625, "global_step": 189367, "epoch": 1127} {"train_loss": -11.338472366333008, "global_step": 189368, "epoch": 1127} {"train_loss": -11.616188049316406, "global_step": 189369, "epoch": 1127} {"train_loss": -11.570566177368164, "global_step": 189370, "epoch": 1127} {"train_loss": -11.332487106323242, "global_step": 189371, "epoch": 1127} {"train_loss": -11.190884590148926, "global_step": 189372, "epoch": 1127} {"train_loss": -11.115056991577148, "global_step": 189373, "epoch": 1127} {"train_loss": -11.519145965576172, "global_step": 189374, "epoch": 1127} {"train_loss": -11.38762092590332, "global_step": 189375, "epoch": 1127} {"train_loss": -11.25187873840332, "global_step": 189376, "epoch": 1127} {"train_loss": -11.483259201049805, "global_step": 189377, "epoch": 1127} {"train_loss": -11.451272010803223, "global_step": 189378, "epoch": 1127} {"train_loss": -11.509326934814453, "global_step": 189379, "epoch": 1127} {"train_loss": -11.556844711303711, "global_step": 189380, "epoch": 1127} {"train_loss": -11.391283988952637, "global_step": 189381, "epoch": 1127} {"train_loss": -11.027111053466797, "global_step": 189382, "epoch": 1127} {"train_loss": -10.780141830444336, "global_step": 189383, "epoch": 1127} {"train_loss": -11.611347198486328, "global_step": 189384, "epoch": 1127} {"train_loss": -11.050552368164062, "global_step": 189385, "epoch": 1127} {"train_loss": -11.094732284545898, "global_step": 189386, "epoch": 1127} {"train_loss": -11.51813793182373, "global_step": 189387, "epoch": 1127} {"train_loss": -11.010658264160156, "global_step": 189388, "epoch": 1127} {"train_loss": -10.716972351074219, "global_step": 189389, "epoch": 1127} {"train_loss": -11.22543716430664, "global_step": 189390, "epoch": 1127} {"train_loss": -11.545585632324219, "global_step": 189391, "epoch": 1127} {"train_loss": -11.05421257019043, "global_step": 189392, "epoch": 1127} {"train_loss": -11.235250473022461, "global_step": 189393, "epoch": 1127} {"train_loss": -11.12166976928711, "global_step": 189394, "epoch": 1127} {"train_loss": -10.858512878417969, "global_step": 189395, "epoch": 1127} {"train_loss": -10.977952003479004, "global_step": 189396, "epoch": 1127} {"train_loss": -10.943938255310059, "global_step": 189397, "epoch": 1127} {"train_loss": -10.749897003173828, "global_step": 189398, "epoch": 1127} {"train_loss": -11.478937149047852, "global_step": 189399, "epoch": 1127} {"train_loss": -10.506380081176758, "global_step": 189400, "epoch": 1127} {"train_loss": -11.192554473876953, "global_step": 189401, "epoch": 1127} {"train_loss": -11.225809097290039, "global_step": 189402, "epoch": 1127} {"train_loss": -10.707208633422852, "global_step": 189403, "epoch": 1127} {"train_loss": -11.406668663024902, "global_step": 189404, "epoch": 1127} {"train_loss": -10.35079574584961, "global_step": 189405, "epoch": 1127} {"train_loss": -11.026764869689941, "global_step": 189406, "epoch": 1127} {"train_loss": -10.453279495239258, "global_step": 189407, "epoch": 1127} {"train_loss": -10.403464317321777, "global_step": 189408, "epoch": 1127} {"train_loss": -10.880561828613281, "global_step": 189409, "epoch": 1127} {"train_loss": -10.321660995483398, "global_step": 189410, "epoch": 1127} {"train_loss": -10.684440612792969, "global_step": 189411, "epoch": 1127} {"train_loss": -10.365303039550781, "global_step": 189412, "epoch": 1127} {"train_loss": -9.999845504760742, "global_step": 189413, "epoch": 1127} {"train_loss": -10.716653823852539, "global_step": 189414, "epoch": 1127} {"train_loss": -9.574895858764648, "global_step": 189415, "epoch": 1127} {"train_loss": -10.085319519042969, "global_step": 189416, "epoch": 1127} {"train_loss": -10.219157218933105, "global_step": 189417, "epoch": 1127} {"train_loss": -9.879544258117676, "global_step": 189418, "epoch": 1127} {"train_loss": -9.912996292114258, "global_step": 189419, "epoch": 1127} {"train_loss": -9.909850120544434, "global_step": 189420, "epoch": 1127} {"train_loss": -9.843045234680176, "global_step": 189421, "epoch": 1127} {"train_loss": -10.532964706420898, "global_step": 189422, "epoch": 1127} {"train_loss": -10.016159057617188, "global_step": 189423, "epoch": 1127} {"train_loss": -9.606136322021484, "global_step": 189424, "epoch": 1127} {"train_loss": -10.695390701293945, "global_step": 189425, "epoch": 1127} {"train_loss": -9.764431953430176, "global_step": 189426, "epoch": 1127} {"train_loss": -10.695514678955078, "global_step": 189427, "epoch": 1127} {"train_loss": -10.547293663024902, "global_step": 189428, "epoch": 1127} {"train_loss": -10.45159912109375, "global_step": 189429, "epoch": 1127} {"train_loss": -10.400785446166992, "global_step": 189430, "epoch": 1127} {"train_loss": -10.72464656829834, "global_step": 189431, "epoch": 1127} {"train_loss": -10.30539608001709, "global_step": 189432, "epoch": 1127} {"train_loss": -10.890054702758789, "global_step": 189433, "epoch": 1127} {"train_loss": -10.700033187866211, "global_step": 189434, "epoch": 1127} {"train_loss": -10.842622756958008, "global_step": 189435, "epoch": 1127} {"train_loss": -10.20892333984375, "global_step": 189436, "epoch": 1127} {"train_loss": -11.062070846557617, "global_step": 189437, "epoch": 1127} {"train_loss": -10.198322296142578, "global_step": 189438, "epoch": 1127} {"train_loss": -10.473819732666016, "global_step": 189439, "epoch": 1127} {"train_loss": -11.027814865112305, "global_step": 189440, "epoch": 1127} {"train_loss": -10.883904457092285, "global_step": 189441, "epoch": 1127} {"train_loss": -10.878103256225586, "global_step": 189442, "epoch": 1127} {"train_loss": -10.795022010803223, "global_step": 189443, "epoch": 1127} {"train_loss": -11.049541473388672, "global_step": 189444, "epoch": 1127} {"train_loss": -10.66464900970459, "global_step": 189445, "epoch": 1127} {"train_loss": -10.964038848876953, "global_step": 189446, "epoch": 1127} {"train_loss": -11.073463439941406, "global_step": 189447, "epoch": 1127} {"train_loss": -10.928421974182129, "global_step": 189448, "epoch": 1127} {"train_loss": -11.1657133102417, "global_step": 189449, "epoch": 1127} {"train_loss": -11.154319763183594, "global_step": 189450, "epoch": 1127} {"train_loss": -11.204047203063965, "global_step": 189451, "epoch": 1127} {"train_loss": -11.125953674316406, "global_step": 189452, "epoch": 1127} {"train_loss": -10.7532958984375, "global_step": 189453, "epoch": 1127} {"train_loss": -11.257148742675781, "global_step": 189454, "epoch": 1127} {"train_loss": -11.049317359924316, "global_step": 189455, "epoch": 1127} {"train_loss": -11.256988525390625, "global_step": 189456, "epoch": 1127} {"train_loss": -11.051814079284668, "global_step": 189457, "epoch": 1127} {"train_loss": -11.055280685424805, "global_step": 189458, "epoch": 1127} {"train_loss": -11.071730613708496, "global_step": 189459, "epoch": 1127} {"train_loss": -11.186309814453125, "global_step": 189460, "epoch": 1127} {"train_loss": -11.056541442871094, "global_step": 189461, "epoch": 1127} {"train_loss": -11.161397933959961, "global_step": 189462, "epoch": 1127} {"train_loss": -11.30716323852539, "global_step": 189463, "epoch": 1127} {"train_loss": -11.339788436889648, "global_step": 189464, "epoch": 1127} {"train_loss": -11.168073654174805, "global_step": 189465, "epoch": 1127} {"train_loss": -11.41594409942627, "global_step": 189466, "epoch": 1127} {"train_loss": -11.261043548583984, "global_step": 189467, "epoch": 1127} {"train_loss": -11.288910865783691, "global_step": 189468, "epoch": 1127} {"train_loss": -11.401948928833008, "global_step": 189469, "epoch": 1127} {"train_loss": -11.464393615722656, "global_step": 189470, "epoch": 1127} {"train_loss": -11.316192626953125, "global_step": 189471, "epoch": 1127} {"train_loss": -11.446428298950195, "global_step": 189472, "epoch": 1127} {"train_loss": -11.376980781555176, "global_step": 189473, "epoch": 1127} {"train_loss": -11.41808795928955, "global_step": 189474, "epoch": 1127} {"train_loss": -11.56728744506836, "global_step": 189475, "epoch": 1127} {"train_loss": -11.620109558105469, "global_step": 189476, "epoch": 1127} {"train_loss": -11.449617385864258, "global_step": 189477, "epoch": 1127} {"train_loss": -11.29759407043457, "global_step": 189478, "epoch": 1127} {"train_loss": -11.544536590576172, "global_step": 189479, "epoch": 1127} {"train_loss": -11.537424087524414, "global_step": 189480, "epoch": 1127} {"train_loss": -11.384042739868164, "global_step": 189481, "epoch": 1127} {"train_loss": -11.459001541137695, "global_step": 189482, "epoch": 1127} {"train_loss": -11.596196174621582, "global_step": 189483, "epoch": 1127} {"train_loss": -11.658761978149414, "global_step": 189484, "epoch": 1127} {"train_loss": -11.549942970275879, "global_step": 189485, "epoch": 1127} {"train_loss": -11.598194122314453, "global_step": 189486, "epoch": 1127} {"train_loss": -11.528544425964355, "global_step": 189487, "epoch": 1127} {"train_loss": -11.508625030517578, "global_step": 189488, "epoch": 1127} {"train_loss": -11.524131774902344, "global_step": 189489, "epoch": 1127} {"train_loss": -11.338861465454102, "global_step": 189490, "epoch": 1127} {"train_loss": -11.520824432373047, "global_step": 189491, "epoch": 1127} {"train_loss": -11.584351539611816, "global_step": 189492, "epoch": 1127} {"train_loss": -11.56505298614502, "global_step": 189493, "epoch": 1127} {"train_loss": -11.472814559936523, "global_step": 189494, "epoch": 1127} {"train_loss": -11.784039497375488, "global_step": 189495, "epoch": 1127} {"train_loss": -11.50947380065918, "global_step": 189496, "epoch": 1127} {"train_loss": -11.435779571533203, "global_step": 189497, "epoch": 1127} {"train_loss": -11.541597366333008, "global_step": 189498, "epoch": 1127} {"train_loss": -11.716106414794922, "global_step": 189499, "epoch": 1127} {"train_loss": -11.46052360534668, "global_step": 189500, "epoch": 1127} {"train_loss": -11.630908012390137, "global_step": 189501, "epoch": 1127} {"train_loss": -11.514209747314453, "global_step": 189502, "epoch": 1127} {"train_loss": -11.088080769493466, "global_step": 189503, "epoch": 1127, "val_loss": 248036.359375} {"train_loss": -11.631532669067383, "global_step": 189504, "epoch": 1128} {"train_loss": -11.468116760253906, "global_step": 189505, "epoch": 1128} {"train_loss": -11.599945068359375, "global_step": 189506, "epoch": 1128} {"train_loss": -11.247211456298828, "global_step": 189507, "epoch": 1128} {"train_loss": -11.598761558532715, "global_step": 189508, "epoch": 1128} {"train_loss": -11.289283752441406, "global_step": 189509, "epoch": 1128} {"train_loss": -11.46509075164795, "global_step": 189510, "epoch": 1128} {"train_loss": -11.18906307220459, "global_step": 189511, "epoch": 1128} {"train_loss": -11.17685317993164, "global_step": 189512, "epoch": 1128} {"train_loss": -10.983098030090332, "global_step": 189513, "epoch": 1128} {"train_loss": -10.948348999023438, "global_step": 189514, "epoch": 1128} {"train_loss": -10.469741821289062, "global_step": 189515, "epoch": 1128} {"train_loss": -10.77414321899414, "global_step": 189516, "epoch": 1128} {"train_loss": -9.980485916137695, "global_step": 189517, "epoch": 1128} {"train_loss": -10.758773803710938, "global_step": 189518, "epoch": 1128} {"train_loss": -10.867274284362793, "global_step": 189519, "epoch": 1128} {"train_loss": -9.828290939331055, "global_step": 189520, "epoch": 1128} {"train_loss": -9.98707389831543, "global_step": 189521, "epoch": 1128} {"train_loss": -11.091672897338867, "global_step": 189522, "epoch": 1128} {"train_loss": -10.446206092834473, "global_step": 189523, "epoch": 1128} {"train_loss": -10.968363761901855, "global_step": 189524, "epoch": 1128} {"train_loss": -10.659767150878906, "global_step": 189525, "epoch": 1128} {"train_loss": -11.340103149414062, "global_step": 189526, "epoch": 1128} {"train_loss": -10.985420227050781, "global_step": 189527, "epoch": 1128} {"train_loss": -10.012616157531738, "global_step": 189528, "epoch": 1128} {"train_loss": -10.880651473999023, "global_step": 189529, "epoch": 1128} {"train_loss": -10.390935897827148, "global_step": 189530, "epoch": 1128} {"train_loss": -9.943672180175781, "global_step": 189531, "epoch": 1128} {"train_loss": -10.714395523071289, "global_step": 189532, "epoch": 1128} {"train_loss": -9.934915542602539, "global_step": 189533, "epoch": 1128} {"train_loss": -10.096445083618164, "global_step": 189534, "epoch": 1128} {"train_loss": -9.566096305847168, "global_step": 189535, "epoch": 1128} {"train_loss": -10.145757675170898, "global_step": 189536, "epoch": 1128} {"train_loss": -10.447664260864258, "global_step": 189537, "epoch": 1128} {"train_loss": -10.180465698242188, "global_step": 189538, "epoch": 1128} {"train_loss": -10.139642715454102, "global_step": 189539, "epoch": 1128} {"train_loss": -10.734640121459961, "global_step": 189540, "epoch": 1128} {"train_loss": -10.086345672607422, "global_step": 189541, "epoch": 1128} {"train_loss": -11.13659954071045, "global_step": 189542, "epoch": 1128} {"train_loss": -10.25051212310791, "global_step": 189543, "epoch": 1128} {"train_loss": -10.635650634765625, "global_step": 189544, "epoch": 1128} {"train_loss": -11.086557388305664, "global_step": 189545, "epoch": 1128} {"train_loss": -10.466256141662598, "global_step": 189546, "epoch": 1128} {"train_loss": -10.987907409667969, "global_step": 189547, "epoch": 1128} {"train_loss": -10.444890975952148, "global_step": 189548, "epoch": 1128} {"train_loss": -11.066455841064453, "global_step": 189549, "epoch": 1128} {"train_loss": -10.644519805908203, "global_step": 189550, "epoch": 1128} {"train_loss": -11.183971405029297, "global_step": 189551, "epoch": 1128} {"train_loss": -10.944944381713867, "global_step": 189552, "epoch": 1128} {"train_loss": -10.972519874572754, "global_step": 189553, "epoch": 1128} {"train_loss": -10.979005813598633, "global_step": 189554, "epoch": 1128} {"train_loss": -10.884359359741211, "global_step": 189555, "epoch": 1128} {"train_loss": -11.15556526184082, "global_step": 189556, "epoch": 1128} {"train_loss": -11.08250617980957, "global_step": 189557, "epoch": 1128} {"train_loss": -11.085821151733398, "global_step": 189558, "epoch": 1128} {"train_loss": -11.176431655883789, "global_step": 189559, "epoch": 1128} {"train_loss": -11.150278091430664, "global_step": 189560, "epoch": 1128} {"train_loss": -10.945727348327637, "global_step": 189561, "epoch": 1128} {"train_loss": -11.26801586151123, "global_step": 189562, "epoch": 1128} {"train_loss": -11.040325164794922, "global_step": 189563, "epoch": 1128} {"train_loss": -11.19506549835205, "global_step": 189564, "epoch": 1128} {"train_loss": -11.195069313049316, "global_step": 189565, "epoch": 1128} {"train_loss": -11.190101623535156, "global_step": 189566, "epoch": 1128} {"train_loss": -11.343877792358398, "global_step": 189567, "epoch": 1128} {"train_loss": -11.297002792358398, "global_step": 189568, "epoch": 1128} {"train_loss": -11.281309127807617, "global_step": 189569, "epoch": 1128} {"train_loss": -11.193451881408691, "global_step": 189570, "epoch": 1128} {"train_loss": -11.334794998168945, "global_step": 189571, "epoch": 1128} {"train_loss": -11.191590309143066, "global_step": 189572, "epoch": 1128} {"train_loss": -11.477316856384277, "global_step": 189573, "epoch": 1128} {"train_loss": -11.304945945739746, "global_step": 189574, "epoch": 1128} {"train_loss": -11.494287490844727, "global_step": 189575, "epoch": 1128} {"train_loss": -11.380586624145508, "global_step": 189576, "epoch": 1128} {"train_loss": -11.524923324584961, "global_step": 189577, "epoch": 1128} {"train_loss": -11.156402587890625, "global_step": 189578, "epoch": 1128} {"train_loss": -11.316644668579102, "global_step": 189579, "epoch": 1128} {"train_loss": -11.156576156616211, "global_step": 189580, "epoch": 1128} {"train_loss": -11.504467010498047, "global_step": 189581, "epoch": 1128} {"train_loss": -11.25385856628418, "global_step": 189582, "epoch": 1128} {"train_loss": -11.405983924865723, "global_step": 189583, "epoch": 1128} {"train_loss": -11.412511825561523, "global_step": 189584, "epoch": 1128} {"train_loss": -11.628485679626465, "global_step": 189585, "epoch": 1128} {"train_loss": -11.460251808166504, "global_step": 189586, "epoch": 1128} {"train_loss": -11.509130477905273, "global_step": 189587, "epoch": 1128} {"train_loss": -11.544393539428711, "global_step": 189588, "epoch": 1128} {"train_loss": -11.448260307312012, "global_step": 189589, "epoch": 1128} {"train_loss": -11.551592826843262, "global_step": 189590, "epoch": 1128} {"train_loss": -11.355151176452637, "global_step": 189591, "epoch": 1128} {"train_loss": -11.539301872253418, "global_step": 189592, "epoch": 1128} {"train_loss": -11.574108123779297, "global_step": 189593, "epoch": 1128} {"train_loss": -11.525997161865234, "global_step": 189594, "epoch": 1128} {"train_loss": -11.501001358032227, "global_step": 189595, "epoch": 1128} {"train_loss": -11.51423454284668, "global_step": 189596, "epoch": 1128} {"train_loss": -11.478802680969238, "global_step": 189597, "epoch": 1128} {"train_loss": -11.664773941040039, "global_step": 189598, "epoch": 1128} {"train_loss": -11.597406387329102, "global_step": 189599, "epoch": 1128} {"train_loss": -11.566451072692871, "global_step": 189600, "epoch": 1128} {"train_loss": -11.490169525146484, "global_step": 189601, "epoch": 1128} {"train_loss": -11.377341270446777, "global_step": 189602, "epoch": 1128} {"train_loss": -11.683566093444824, "global_step": 189603, "epoch": 1128} {"train_loss": -11.517507553100586, "global_step": 189604, "epoch": 1128} {"train_loss": -11.559198379516602, "global_step": 189605, "epoch": 1128} {"train_loss": -11.507894515991211, "global_step": 189606, "epoch": 1128} {"train_loss": -11.729024887084961, "global_step": 189607, "epoch": 1128} {"train_loss": -11.599897384643555, "global_step": 189608, "epoch": 1128} {"train_loss": -11.716245651245117, "global_step": 189609, "epoch": 1128} {"train_loss": -11.683782577514648, "global_step": 189610, "epoch": 1128} {"train_loss": -11.677694320678711, "global_step": 189611, "epoch": 1128} {"train_loss": -11.514779090881348, "global_step": 189612, "epoch": 1128} {"train_loss": -11.494150161743164, "global_step": 189613, "epoch": 1128} {"train_loss": -11.588165283203125, "global_step": 189614, "epoch": 1128} {"train_loss": -11.124740600585938, "global_step": 189615, "epoch": 1128} {"train_loss": -11.302671432495117, "global_step": 189616, "epoch": 1128} {"train_loss": -11.479917526245117, "global_step": 189617, "epoch": 1128} {"train_loss": -10.368219375610352, "global_step": 189618, "epoch": 1128} {"train_loss": -10.861780166625977, "global_step": 189619, "epoch": 1128} {"train_loss": -10.843594551086426, "global_step": 189620, "epoch": 1128} {"train_loss": -10.614490509033203, "global_step": 189621, "epoch": 1128} {"train_loss": -10.500204086303711, "global_step": 189622, "epoch": 1128} {"train_loss": -10.149995803833008, "global_step": 189623, "epoch": 1128} {"train_loss": -8.073328018188477, "global_step": 189624, "epoch": 1128} {"train_loss": -10.649560928344727, "global_step": 189625, "epoch": 1128} {"train_loss": -6.092961311340332, "global_step": 189626, "epoch": 1128} {"train_loss": -10.040803909301758, "global_step": 189627, "epoch": 1128} {"train_loss": -8.3392333984375, "global_step": 189628, "epoch": 1128} {"train_loss": -10.412545204162598, "global_step": 189629, "epoch": 1128} {"train_loss": -7.919246196746826, "global_step": 189630, "epoch": 1128} {"train_loss": -10.550651550292969, "global_step": 189631, "epoch": 1128} {"train_loss": -8.783807754516602, "global_step": 189632, "epoch": 1128} {"train_loss": -9.965898513793945, "global_step": 189633, "epoch": 1128} {"train_loss": -9.294221878051758, "global_step": 189634, "epoch": 1128} {"train_loss": -10.023247718811035, "global_step": 189635, "epoch": 1128} {"train_loss": -10.564544677734375, "global_step": 189636, "epoch": 1128} {"train_loss": -9.511589050292969, "global_step": 189637, "epoch": 1128} {"train_loss": -10.855745315551758, "global_step": 189638, "epoch": 1128} {"train_loss": -8.996903419494629, "global_step": 189639, "epoch": 1128} {"train_loss": -10.712413787841797, "global_step": 189640, "epoch": 1128} {"train_loss": -9.819040298461914, "global_step": 189641, "epoch": 1128} {"train_loss": -10.958244323730469, "global_step": 189642, "epoch": 1128} {"train_loss": -10.454278945922852, "global_step": 189643, "epoch": 1128} {"train_loss": -10.541646957397461, "global_step": 189644, "epoch": 1128} {"train_loss": -10.730042457580566, "global_step": 189645, "epoch": 1128} {"train_loss": -10.52507495880127, "global_step": 189646, "epoch": 1128} {"train_loss": -10.901934623718262, "global_step": 189647, "epoch": 1128} {"train_loss": -11.126348495483398, "global_step": 189648, "epoch": 1128} {"train_loss": -10.874629974365234, "global_step": 189649, "epoch": 1128} {"train_loss": -10.800561904907227, "global_step": 189650, "epoch": 1128} {"train_loss": -11.011714935302734, "global_step": 189651, "epoch": 1128} {"train_loss": -10.851767539978027, "global_step": 189652, "epoch": 1128} {"train_loss": -10.933309555053711, "global_step": 189653, "epoch": 1128} {"train_loss": -10.8233060836792, "global_step": 189654, "epoch": 1128} {"train_loss": -10.645769119262695, "global_step": 189655, "epoch": 1128} {"train_loss": -11.205564498901367, "global_step": 189656, "epoch": 1128} {"train_loss": -10.798500061035156, "global_step": 189657, "epoch": 1128} {"train_loss": -10.894510269165039, "global_step": 189658, "epoch": 1128} {"train_loss": -11.012612342834473, "global_step": 189659, "epoch": 1128} {"train_loss": -10.98044204711914, "global_step": 189660, "epoch": 1128} {"train_loss": -11.078693389892578, "global_step": 189661, "epoch": 1128} {"train_loss": -11.17222785949707, "global_step": 189662, "epoch": 1128} {"train_loss": -11.08287239074707, "global_step": 189663, "epoch": 1128} {"train_loss": -11.216730117797852, "global_step": 189664, "epoch": 1128} {"train_loss": -10.972201347351074, "global_step": 189665, "epoch": 1128} {"train_loss": -11.05484390258789, "global_step": 189666, "epoch": 1128} {"train_loss": -11.042964935302734, "global_step": 189667, "epoch": 1128} {"train_loss": -11.08341121673584, "global_step": 189668, "epoch": 1128} {"train_loss": -11.096780776977539, "global_step": 189669, "epoch": 1128} {"train_loss": -11.141663551330566, "global_step": 189670, "epoch": 1128} {"train_loss": -10.874013733296167, "global_step": 189671, "epoch": 1128, "val_loss": 241408.796875} {"train_loss": -11.110005378723145, "global_step": 189672, "epoch": 1129} {"train_loss": -11.220643997192383, "global_step": 189673, "epoch": 1129} {"train_loss": -11.205171585083008, "global_step": 189674, "epoch": 1129} {"train_loss": -11.181198120117188, "global_step": 189675, "epoch": 1129} {"train_loss": -11.188471794128418, "global_step": 189676, "epoch": 1129} {"train_loss": -11.485548973083496, "global_step": 189677, "epoch": 1129} {"train_loss": -11.37961196899414, "global_step": 189678, "epoch": 1129} {"train_loss": -11.577615737915039, "global_step": 189679, "epoch": 1129} {"train_loss": -11.378922462463379, "global_step": 189680, "epoch": 1129} {"train_loss": -11.128074645996094, "global_step": 189681, "epoch": 1129} {"train_loss": -11.273918151855469, "global_step": 189682, "epoch": 1129} {"train_loss": -11.378063201904297, "global_step": 189683, "epoch": 1129} {"train_loss": -11.47849178314209, "global_step": 189684, "epoch": 1129} {"train_loss": -11.20787239074707, "global_step": 189685, "epoch": 1129} {"train_loss": -11.61687183380127, "global_step": 189686, "epoch": 1129} {"train_loss": -11.257159233093262, "global_step": 189687, "epoch": 1129} {"train_loss": -11.408733367919922, "global_step": 189688, "epoch": 1129} {"train_loss": -11.49969482421875, "global_step": 189689, "epoch": 1129} {"train_loss": -11.590591430664062, "global_step": 189690, "epoch": 1129} {"train_loss": -11.586843490600586, "global_step": 189691, "epoch": 1129} {"train_loss": -11.734359741210938, "global_step": 189692, "epoch": 1129} {"train_loss": -11.377595901489258, "global_step": 189693, "epoch": 1129} {"train_loss": -11.439395904541016, "global_step": 189694, "epoch": 1129} {"train_loss": -11.344796180725098, "global_step": 189695, "epoch": 1129} {"train_loss": -10.561561584472656, "global_step": 189696, "epoch": 1129} {"train_loss": -10.693136215209961, "global_step": 189697, "epoch": 1129} {"train_loss": -11.415771484375, "global_step": 189698, "epoch": 1129} {"train_loss": -9.858966827392578, "global_step": 189699, "epoch": 1129} {"train_loss": -10.851123809814453, "global_step": 189700, "epoch": 1129} {"train_loss": -10.814848899841309, "global_step": 189701, "epoch": 1129} {"train_loss": -9.897683143615723, "global_step": 189702, "epoch": 1129} {"train_loss": -11.604001998901367, "global_step": 189703, "epoch": 1129} {"train_loss": -10.935918807983398, "global_step": 189704, "epoch": 1129} {"train_loss": -10.639732360839844, "global_step": 189705, "epoch": 1129} {"train_loss": -11.243880271911621, "global_step": 189706, "epoch": 1129} {"train_loss": -10.747333526611328, "global_step": 189707, "epoch": 1129} {"train_loss": -10.990248680114746, "global_step": 189708, "epoch": 1129} {"train_loss": -11.16136360168457, "global_step": 189709, "epoch": 1129} {"train_loss": -10.286744117736816, "global_step": 189710, "epoch": 1129} {"train_loss": -11.456853866577148, "global_step": 189711, "epoch": 1129} {"train_loss": -10.724737167358398, "global_step": 189712, "epoch": 1129} {"train_loss": -10.86305046081543, "global_step": 189713, "epoch": 1129} {"train_loss": -11.078571319580078, "global_step": 189714, "epoch": 1129} {"train_loss": -10.19007682800293, "global_step": 189715, "epoch": 1129} {"train_loss": -11.099266052246094, "global_step": 189716, "epoch": 1129} {"train_loss": -9.638704299926758, "global_step": 189717, "epoch": 1129} {"train_loss": -11.309359550476074, "global_step": 189718, "epoch": 1129} {"train_loss": -9.936676025390625, "global_step": 189719, "epoch": 1129} {"train_loss": -10.831924438476562, "global_step": 189720, "epoch": 1129} {"train_loss": -10.258561134338379, "global_step": 189721, "epoch": 1129} {"train_loss": -10.623234748840332, "global_step": 189722, "epoch": 1129} {"train_loss": -10.513786315917969, "global_step": 189723, "epoch": 1129} {"train_loss": -9.95018196105957, "global_step": 189724, "epoch": 1129} {"train_loss": -11.209795951843262, "global_step": 189725, "epoch": 1129} {"train_loss": -10.693037033081055, "global_step": 189726, "epoch": 1129} {"train_loss": -11.149921417236328, "global_step": 189727, "epoch": 1129} {"train_loss": -11.0160551071167, "global_step": 189728, "epoch": 1129} {"train_loss": -11.117576599121094, "global_step": 189729, "epoch": 1129} {"train_loss": -11.175777435302734, "global_step": 189730, "epoch": 1129} {"train_loss": -11.30963134765625, "global_step": 189731, "epoch": 1129} {"train_loss": -11.117622375488281, "global_step": 189732, "epoch": 1129} {"train_loss": -11.31106948852539, "global_step": 189733, "epoch": 1129} {"train_loss": -11.155750274658203, "global_step": 189734, "epoch": 1129} {"train_loss": -10.944704055786133, "global_step": 189735, "epoch": 1129} {"train_loss": -11.48344898223877, "global_step": 189736, "epoch": 1129} {"train_loss": -10.989636421203613, "global_step": 189737, "epoch": 1129} {"train_loss": -11.096696853637695, "global_step": 189738, "epoch": 1129} {"train_loss": -11.335071563720703, "global_step": 189739, "epoch": 1129} {"train_loss": -11.213014602661133, "global_step": 189740, "epoch": 1129} {"train_loss": -11.084961891174316, "global_step": 189741, "epoch": 1129} {"train_loss": -11.213470458984375, "global_step": 189742, "epoch": 1129} {"train_loss": -11.3269681930542, "global_step": 189743, "epoch": 1129} {"train_loss": -11.275127410888672, "global_step": 189744, "epoch": 1129} {"train_loss": -11.09349250793457, "global_step": 189745, "epoch": 1129} {"train_loss": -11.030082702636719, "global_step": 189746, "epoch": 1129} {"train_loss": -10.904096603393555, "global_step": 189747, "epoch": 1129} {"train_loss": -11.554765701293945, "global_step": 189748, "epoch": 1129} {"train_loss": -11.170937538146973, "global_step": 189749, "epoch": 1129} {"train_loss": -11.222147941589355, "global_step": 189750, "epoch": 1129} {"train_loss": -10.88221263885498, "global_step": 189751, "epoch": 1129} {"train_loss": -11.321733474731445, "global_step": 189752, "epoch": 1129} {"train_loss": -11.030755996704102, "global_step": 189753, "epoch": 1129} {"train_loss": -11.332418441772461, "global_step": 189754, "epoch": 1129} {"train_loss": -10.900227546691895, "global_step": 189755, "epoch": 1129} {"train_loss": -11.470378875732422, "global_step": 189756, "epoch": 1129} {"train_loss": -10.957746505737305, "global_step": 189757, "epoch": 1129} {"train_loss": -11.217072486877441, "global_step": 189758, "epoch": 1129} {"train_loss": -11.18016242980957, "global_step": 189759, "epoch": 1129} {"train_loss": -11.172499656677246, "global_step": 189760, "epoch": 1129} {"train_loss": -11.139634132385254, "global_step": 189761, "epoch": 1129} {"train_loss": -11.257113456726074, "global_step": 189762, "epoch": 1129} {"train_loss": -11.219583511352539, "global_step": 189763, "epoch": 1129} {"train_loss": -10.996307373046875, "global_step": 189764, "epoch": 1129} {"train_loss": -11.321706771850586, "global_step": 189765, "epoch": 1129} {"train_loss": -11.077619552612305, "global_step": 189766, "epoch": 1129} {"train_loss": -11.370399475097656, "global_step": 189767, "epoch": 1129} {"train_loss": -10.923941612243652, "global_step": 189768, "epoch": 1129} {"train_loss": -10.9885835647583, "global_step": 189769, "epoch": 1129} {"train_loss": -10.619039535522461, "global_step": 189770, "epoch": 1129} {"train_loss": -10.810892105102539, "global_step": 189771, "epoch": 1129} {"train_loss": -10.532371520996094, "global_step": 189772, "epoch": 1129} {"train_loss": -10.682085037231445, "global_step": 189773, "epoch": 1129} {"train_loss": -10.874204635620117, "global_step": 189774, "epoch": 1129} {"train_loss": -10.174560546875, "global_step": 189775, "epoch": 1129} {"train_loss": -11.162702560424805, "global_step": 189776, "epoch": 1129} {"train_loss": -10.447818756103516, "global_step": 189777, "epoch": 1129} {"train_loss": -11.313591003417969, "global_step": 189778, "epoch": 1129} {"train_loss": -10.863081932067871, "global_step": 189779, "epoch": 1129} {"train_loss": -11.176534652709961, "global_step": 189780, "epoch": 1129} {"train_loss": -11.01211166381836, "global_step": 189781, "epoch": 1129} {"train_loss": -10.982063293457031, "global_step": 189782, "epoch": 1129} {"train_loss": -10.75567626953125, "global_step": 189783, "epoch": 1129} {"train_loss": -11.077716827392578, "global_step": 189784, "epoch": 1129} {"train_loss": -11.102866172790527, "global_step": 189785, "epoch": 1129} {"train_loss": -10.8355073928833, "global_step": 189786, "epoch": 1129} {"train_loss": -11.0858154296875, "global_step": 189787, "epoch": 1129} {"train_loss": -11.076019287109375, "global_step": 189788, "epoch": 1129} {"train_loss": -11.454713821411133, "global_step": 189789, "epoch": 1129} {"train_loss": -10.778619766235352, "global_step": 189790, "epoch": 1129} {"train_loss": -11.349578857421875, "global_step": 189791, "epoch": 1129} {"train_loss": -11.129640579223633, "global_step": 189792, "epoch": 1129} {"train_loss": -11.139871597290039, "global_step": 189793, "epoch": 1129} {"train_loss": -11.18655014038086, "global_step": 189794, "epoch": 1129} {"train_loss": -11.364114761352539, "global_step": 189795, "epoch": 1129} {"train_loss": -11.464009284973145, "global_step": 189796, "epoch": 1129} {"train_loss": -11.081113815307617, "global_step": 189797, "epoch": 1129} {"train_loss": -11.540395736694336, "global_step": 189798, "epoch": 1129} {"train_loss": -11.231447219848633, "global_step": 189799, "epoch": 1129} {"train_loss": -11.561910629272461, "global_step": 189800, "epoch": 1129} {"train_loss": -11.40715217590332, "global_step": 189801, "epoch": 1129} {"train_loss": -11.4324951171875, "global_step": 189802, "epoch": 1129} {"train_loss": -11.313739776611328, "global_step": 189803, "epoch": 1129} {"train_loss": -11.371053695678711, "global_step": 189804, "epoch": 1129} {"train_loss": -11.13223934173584, "global_step": 189805, "epoch": 1129} {"train_loss": -10.73713493347168, "global_step": 189806, "epoch": 1129} {"train_loss": -11.225818634033203, "global_step": 189807, "epoch": 1129} {"train_loss": -10.995718002319336, "global_step": 189808, "epoch": 1129} {"train_loss": -11.633264541625977, "global_step": 189809, "epoch": 1129} {"train_loss": -11.419185638427734, "global_step": 189810, "epoch": 1129} {"train_loss": -11.186705589294434, "global_step": 189811, "epoch": 1129} {"train_loss": -11.346973419189453, "global_step": 189812, "epoch": 1129} {"train_loss": -11.383272171020508, "global_step": 189813, "epoch": 1129} {"train_loss": -11.540592193603516, "global_step": 189814, "epoch": 1129} {"train_loss": -11.360950469970703, "global_step": 189815, "epoch": 1129} {"train_loss": -11.507364273071289, "global_step": 189816, "epoch": 1129} {"train_loss": -11.559762954711914, "global_step": 189817, "epoch": 1129} {"train_loss": -11.406339645385742, "global_step": 189818, "epoch": 1129} {"train_loss": -11.31338882446289, "global_step": 189819, "epoch": 1129} {"train_loss": -11.443029403686523, "global_step": 189820, "epoch": 1129} {"train_loss": -11.459864616394043, "global_step": 189821, "epoch": 1129} {"train_loss": -11.492988586425781, "global_step": 189822, "epoch": 1129} {"train_loss": -11.340582847595215, "global_step": 189823, "epoch": 1129} {"train_loss": -11.442554473876953, "global_step": 189824, "epoch": 1129} {"train_loss": -11.310844421386719, "global_step": 189825, "epoch": 1129} {"train_loss": -11.466131210327148, "global_step": 189826, "epoch": 1129} {"train_loss": -11.75525188446045, "global_step": 189827, "epoch": 1129} {"train_loss": -11.25385856628418, "global_step": 189828, "epoch": 1129} {"train_loss": -11.75056266784668, "global_step": 189829, "epoch": 1129} {"train_loss": -11.401719093322754, "global_step": 189830, "epoch": 1129} {"train_loss": -11.627388000488281, "global_step": 189831, "epoch": 1129} {"train_loss": -11.6062650680542, "global_step": 189832, "epoch": 1129} {"train_loss": -11.417688369750977, "global_step": 189833, "epoch": 1129} {"train_loss": -11.547246932983398, "global_step": 189834, "epoch": 1129} {"train_loss": -11.562671661376953, "global_step": 189835, "epoch": 1129} {"train_loss": -11.52273941040039, "global_step": 189836, "epoch": 1129} {"train_loss": -11.517704010009766, "global_step": 189837, "epoch": 1129} {"train_loss": -11.491449356079102, "global_step": 189838, "epoch": 1129} {"train_loss": -11.141970424425034, "global_step": 189839, "epoch": 1129, "val_loss": 245422.828125} {"train_loss": -11.471672058105469, "global_step": 189840, "epoch": 1130} {"train_loss": -11.553443908691406, "global_step": 189841, "epoch": 1130} {"train_loss": -11.23328971862793, "global_step": 189842, "epoch": 1130} {"train_loss": -11.4425630569458, "global_step": 189843, "epoch": 1130} {"train_loss": -11.246038436889648, "global_step": 189844, "epoch": 1130} {"train_loss": -11.47769546508789, "global_step": 189845, "epoch": 1130} {"train_loss": -9.94184398651123, "global_step": 189846, "epoch": 1130} {"train_loss": -11.34291934967041, "global_step": 189847, "epoch": 1130} {"train_loss": -10.61815071105957, "global_step": 189848, "epoch": 1130} {"train_loss": -10.947356224060059, "global_step": 189849, "epoch": 1130} {"train_loss": -10.428083419799805, "global_step": 189850, "epoch": 1130} {"train_loss": -11.493865966796875, "global_step": 189851, "epoch": 1130} {"train_loss": -11.03693962097168, "global_step": 189852, "epoch": 1130} {"train_loss": -10.188694953918457, "global_step": 189853, "epoch": 1130} {"train_loss": -10.86170768737793, "global_step": 189854, "epoch": 1130} {"train_loss": -11.173223495483398, "global_step": 189855, "epoch": 1130} {"train_loss": -11.036613464355469, "global_step": 189856, "epoch": 1130} {"train_loss": -11.258918762207031, "global_step": 189857, "epoch": 1130} {"train_loss": -10.949238777160645, "global_step": 189858, "epoch": 1130} {"train_loss": -11.329361915588379, "global_step": 189859, "epoch": 1130} {"train_loss": -11.097269058227539, "global_step": 189860, "epoch": 1130} {"train_loss": -10.776996612548828, "global_step": 189861, "epoch": 1130} {"train_loss": -11.665620803833008, "global_step": 189862, "epoch": 1130} {"train_loss": -11.082493782043457, "global_step": 189863, "epoch": 1130} {"train_loss": -11.407001495361328, "global_step": 189864, "epoch": 1130} {"train_loss": -11.301094055175781, "global_step": 189865, "epoch": 1130} {"train_loss": -10.959052085876465, "global_step": 189866, "epoch": 1130} {"train_loss": -11.28299331665039, "global_step": 189867, "epoch": 1130} {"train_loss": -11.408201217651367, "global_step": 189868, "epoch": 1130} {"train_loss": -10.91677188873291, "global_step": 189869, "epoch": 1130} {"train_loss": -11.512619018554688, "global_step": 189870, "epoch": 1130} {"train_loss": -10.122673034667969, "global_step": 189871, "epoch": 1130} {"train_loss": -10.140613555908203, "global_step": 189872, "epoch": 1130} {"train_loss": -11.011202812194824, "global_step": 189873, "epoch": 1130} {"train_loss": -9.569798469543457, "global_step": 189874, "epoch": 1130} {"train_loss": -10.799266815185547, "global_step": 189875, "epoch": 1130} {"train_loss": -10.550121307373047, "global_step": 189876, "epoch": 1130} {"train_loss": -10.686576843261719, "global_step": 189877, "epoch": 1130} {"train_loss": -10.551353454589844, "global_step": 189878, "epoch": 1130} {"train_loss": -10.874491691589355, "global_step": 189879, "epoch": 1130} {"train_loss": -10.622051239013672, "global_step": 189880, "epoch": 1130} {"train_loss": -10.691164016723633, "global_step": 189881, "epoch": 1130} {"train_loss": -10.9605712890625, "global_step": 189882, "epoch": 1130} {"train_loss": -11.035528182983398, "global_step": 189883, "epoch": 1130} {"train_loss": -11.288520812988281, "global_step": 189884, "epoch": 1130} {"train_loss": -11.016477584838867, "global_step": 189885, "epoch": 1130} {"train_loss": -11.143575668334961, "global_step": 189886, "epoch": 1130} {"train_loss": -10.65111255645752, "global_step": 189887, "epoch": 1130} {"train_loss": -11.091629028320312, "global_step": 189888, "epoch": 1130} {"train_loss": -10.920999526977539, "global_step": 189889, "epoch": 1130} {"train_loss": -11.278573989868164, "global_step": 189890, "epoch": 1130} {"train_loss": -10.93283748626709, "global_step": 189891, "epoch": 1130} {"train_loss": -11.175890922546387, "global_step": 189892, "epoch": 1130} {"train_loss": -11.269729614257812, "global_step": 189893, "epoch": 1130} {"train_loss": -11.277074813842773, "global_step": 189894, "epoch": 1130} {"train_loss": -11.054769515991211, "global_step": 189895, "epoch": 1130} {"train_loss": -11.249302864074707, "global_step": 189896, "epoch": 1130} {"train_loss": -10.644813537597656, "global_step": 189897, "epoch": 1130} {"train_loss": -11.026912689208984, "global_step": 189898, "epoch": 1130} {"train_loss": -10.979473114013672, "global_step": 189899, "epoch": 1130} {"train_loss": -10.718192100524902, "global_step": 189900, "epoch": 1130} {"train_loss": -11.018387794494629, "global_step": 189901, "epoch": 1130} {"train_loss": -10.891738891601562, "global_step": 189902, "epoch": 1130} {"train_loss": -11.319110870361328, "global_step": 189903, "epoch": 1130} {"train_loss": -11.011926651000977, "global_step": 189904, "epoch": 1130} {"train_loss": -11.144426345825195, "global_step": 189905, "epoch": 1130} {"train_loss": -10.732126235961914, "global_step": 189906, "epoch": 1130} {"train_loss": -10.733024597167969, "global_step": 189907, "epoch": 1130} {"train_loss": -10.88386344909668, "global_step": 189908, "epoch": 1130} {"train_loss": -10.936796188354492, "global_step": 189909, "epoch": 1130} {"train_loss": -11.056872367858887, "global_step": 189910, "epoch": 1130} {"train_loss": -10.60683822631836, "global_step": 189911, "epoch": 1130} {"train_loss": -11.05982780456543, "global_step": 189912, "epoch": 1130} {"train_loss": -10.504130363464355, "global_step": 189913, "epoch": 1130} {"train_loss": -9.491695404052734, "global_step": 189914, "epoch": 1130} {"train_loss": -10.201665878295898, "global_step": 189915, "epoch": 1130} {"train_loss": -10.478652000427246, "global_step": 189916, "epoch": 1130} {"train_loss": -10.838972091674805, "global_step": 189917, "epoch": 1130} {"train_loss": -11.117047309875488, "global_step": 189918, "epoch": 1130} {"train_loss": -10.623806953430176, "global_step": 189919, "epoch": 1130} {"train_loss": -11.01717472076416, "global_step": 189920, "epoch": 1130} {"train_loss": -10.765579223632812, "global_step": 189921, "epoch": 1130} {"train_loss": -11.1231689453125, "global_step": 189922, "epoch": 1130} {"train_loss": -10.830116271972656, "global_step": 189923, "epoch": 1130} {"train_loss": -10.829756736755371, "global_step": 189924, "epoch": 1130} {"train_loss": -11.080551147460938, "global_step": 189925, "epoch": 1130} {"train_loss": -11.317120552062988, "global_step": 189926, "epoch": 1130} {"train_loss": -10.65025806427002, "global_step": 189927, "epoch": 1130} {"train_loss": -11.315263748168945, "global_step": 189928, "epoch": 1130} {"train_loss": -10.912338256835938, "global_step": 189929, "epoch": 1130} {"train_loss": -11.298983573913574, "global_step": 189930, "epoch": 1130} {"train_loss": -11.156684875488281, "global_step": 189931, "epoch": 1130} {"train_loss": -11.218460083007812, "global_step": 189932, "epoch": 1130} {"train_loss": -11.148500442504883, "global_step": 189933, "epoch": 1130} {"train_loss": -11.518050193786621, "global_step": 189934, "epoch": 1130} {"train_loss": -10.973539352416992, "global_step": 189935, "epoch": 1130} {"train_loss": -11.037429809570312, "global_step": 189936, "epoch": 1130} {"train_loss": -11.04361343383789, "global_step": 189937, "epoch": 1130} {"train_loss": -11.297487258911133, "global_step": 189938, "epoch": 1130} {"train_loss": -11.130165100097656, "global_step": 189939, "epoch": 1130} {"train_loss": -11.47005558013916, "global_step": 189940, "epoch": 1130} {"train_loss": -11.375126838684082, "global_step": 189941, "epoch": 1130} {"train_loss": -11.294549942016602, "global_step": 189942, "epoch": 1130} {"train_loss": -11.259233474731445, "global_step": 189943, "epoch": 1130} {"train_loss": -11.273981094360352, "global_step": 189944, "epoch": 1130} {"train_loss": -10.96091079711914, "global_step": 189945, "epoch": 1130} {"train_loss": -11.3631591796875, "global_step": 189946, "epoch": 1130} {"train_loss": -11.119136810302734, "global_step": 189947, "epoch": 1130} {"train_loss": -11.404369354248047, "global_step": 189948, "epoch": 1130} {"train_loss": -10.940092086791992, "global_step": 189949, "epoch": 1130} {"train_loss": -11.50642204284668, "global_step": 189950, "epoch": 1130} {"train_loss": -11.273277282714844, "global_step": 189951, "epoch": 1130} {"train_loss": -11.482711791992188, "global_step": 189952, "epoch": 1130} {"train_loss": -11.205812454223633, "global_step": 189953, "epoch": 1130} {"train_loss": -11.540952682495117, "global_step": 189954, "epoch": 1130} {"train_loss": -11.346866607666016, "global_step": 189955, "epoch": 1130} {"train_loss": -11.401102066040039, "global_step": 189956, "epoch": 1130} {"train_loss": -11.350226402282715, "global_step": 189957, "epoch": 1130} {"train_loss": -11.444343566894531, "global_step": 189958, "epoch": 1130} {"train_loss": -11.315260887145996, "global_step": 189959, "epoch": 1130} {"train_loss": -11.532691955566406, "global_step": 189960, "epoch": 1130} {"train_loss": -11.505828857421875, "global_step": 189961, "epoch": 1130} {"train_loss": -11.247175216674805, "global_step": 189962, "epoch": 1130} {"train_loss": -11.574224472045898, "global_step": 189963, "epoch": 1130} {"train_loss": -11.370088577270508, "global_step": 189964, "epoch": 1130} {"train_loss": -11.135995864868164, "global_step": 189965, "epoch": 1130} {"train_loss": -11.416129112243652, "global_step": 189966, "epoch": 1130} {"train_loss": -11.524906158447266, "global_step": 189967, "epoch": 1130} {"train_loss": -11.427652359008789, "global_step": 189968, "epoch": 1130} {"train_loss": -11.385950088500977, "global_step": 189969, "epoch": 1130} {"train_loss": -11.454821586608887, "global_step": 189970, "epoch": 1130} {"train_loss": -11.302835464477539, "global_step": 189971, "epoch": 1130} {"train_loss": -11.60466194152832, "global_step": 189972, "epoch": 1130} {"train_loss": -11.564715385437012, "global_step": 189973, "epoch": 1130} {"train_loss": -11.562824249267578, "global_step": 189974, "epoch": 1130} {"train_loss": -11.693960189819336, "global_step": 189975, "epoch": 1130} {"train_loss": -11.684486389160156, "global_step": 189976, "epoch": 1130} {"train_loss": -11.40219497680664, "global_step": 189977, "epoch": 1130} {"train_loss": -11.469022750854492, "global_step": 189978, "epoch": 1130} {"train_loss": -11.470236778259277, "global_step": 189979, "epoch": 1130} {"train_loss": -11.62938117980957, "global_step": 189980, "epoch": 1130} {"train_loss": -11.535850524902344, "global_step": 189981, "epoch": 1130} {"train_loss": -11.094598770141602, "global_step": 189982, "epoch": 1130} {"train_loss": -11.223369598388672, "global_step": 189983, "epoch": 1130} {"train_loss": -11.556293487548828, "global_step": 189984, "epoch": 1130} {"train_loss": -11.389623641967773, "global_step": 189985, "epoch": 1130} {"train_loss": -11.262918472290039, "global_step": 189986, "epoch": 1130} {"train_loss": -11.336214065551758, "global_step": 189987, "epoch": 1130} {"train_loss": -11.13715934753418, "global_step": 189988, "epoch": 1130} {"train_loss": -10.927074432373047, "global_step": 189989, "epoch": 1130} {"train_loss": -10.913711547851562, "global_step": 189990, "epoch": 1130} {"train_loss": -11.308708190917969, "global_step": 189991, "epoch": 1130} {"train_loss": -11.44129753112793, "global_step": 189992, "epoch": 1130} {"train_loss": -11.306828498840332, "global_step": 189993, "epoch": 1130} {"train_loss": -11.361370086669922, "global_step": 189994, "epoch": 1130} {"train_loss": -10.127544403076172, "global_step": 189995, "epoch": 1130} {"train_loss": -10.208592414855957, "global_step": 189996, "epoch": 1130} {"train_loss": -11.161852836608887, "global_step": 189997, "epoch": 1130} {"train_loss": -10.962814331054688, "global_step": 189998, "epoch": 1130} {"train_loss": -10.33169937133789, "global_step": 189999, "epoch": 1130} {"train_loss": -11.401598930358887, "global_step": 190000, "epoch": 1130} {"train_loss": -10.217403411865234, "global_step": 190001, "epoch": 1130} {"train_loss": -11.378800392150879, "global_step": 190002, "epoch": 1130} {"train_loss": -10.453174591064453, "global_step": 190003, "epoch": 1130} {"train_loss": -11.199089050292969, "global_step": 190004, "epoch": 1130} {"train_loss": -11.157773971557617, "global_step": 190005, "epoch": 1130} {"train_loss": -10.888771057128906, "global_step": 190006, "epoch": 1130} {"train_loss": -11.082514234951564, "global_step": 190007, "epoch": 1130, "val_loss": 247187.71875, "train_action_mse_error": 1.0373347997665405} {"train_loss": -11.595438003540039, "global_step": 190008, "epoch": 1131} {"train_loss": -11.280864715576172, "global_step": 190009, "epoch": 1131} {"train_loss": -11.390356063842773, "global_step": 190010, "epoch": 1131} {"train_loss": -11.246907234191895, "global_step": 190011, "epoch": 1131} {"train_loss": -11.107501983642578, "global_step": 190012, "epoch": 1131} {"train_loss": -11.296525955200195, "global_step": 190013, "epoch": 1131} {"train_loss": -11.01500129699707, "global_step": 190014, "epoch": 1131} {"train_loss": -11.388616561889648, "global_step": 190015, "epoch": 1131} {"train_loss": -11.28391170501709, "global_step": 190016, "epoch": 1131} {"train_loss": -11.334156036376953, "global_step": 190017, "epoch": 1131} {"train_loss": -11.345349311828613, "global_step": 190018, "epoch": 1131} {"train_loss": -11.334342956542969, "global_step": 190019, "epoch": 1131} {"train_loss": -11.147916793823242, "global_step": 190020, "epoch": 1131} {"train_loss": -11.396404266357422, "global_step": 190021, "epoch": 1131} {"train_loss": -11.158156394958496, "global_step": 190022, "epoch": 1131} {"train_loss": -11.364374160766602, "global_step": 190023, "epoch": 1131} {"train_loss": -11.420763969421387, "global_step": 190024, "epoch": 1131} {"train_loss": -10.967659950256348, "global_step": 190025, "epoch": 1131} {"train_loss": -11.444076538085938, "global_step": 190026, "epoch": 1131} {"train_loss": -11.00226879119873, "global_step": 190027, "epoch": 1131} {"train_loss": -11.375581741333008, "global_step": 190028, "epoch": 1131} {"train_loss": -10.957779884338379, "global_step": 190029, "epoch": 1131} {"train_loss": -11.192930221557617, "global_step": 190030, "epoch": 1131} {"train_loss": -11.332605361938477, "global_step": 190031, "epoch": 1131} {"train_loss": -10.607824325561523, "global_step": 190032, "epoch": 1131} {"train_loss": -11.226478576660156, "global_step": 190033, "epoch": 1131} {"train_loss": -10.971393585205078, "global_step": 190034, "epoch": 1131} {"train_loss": -10.526566505432129, "global_step": 190035, "epoch": 1131} {"train_loss": -10.97775650024414, "global_step": 190036, "epoch": 1131} {"train_loss": -10.832195281982422, "global_step": 190037, "epoch": 1131} {"train_loss": -11.185586929321289, "global_step": 190038, "epoch": 1131} {"train_loss": -11.00587272644043, "global_step": 190039, "epoch": 1131} {"train_loss": -11.321303367614746, "global_step": 190040, "epoch": 1131} {"train_loss": -10.71218204498291, "global_step": 190041, "epoch": 1131} {"train_loss": -11.159472465515137, "global_step": 190042, "epoch": 1131} {"train_loss": -10.777896881103516, "global_step": 190043, "epoch": 1131} {"train_loss": -10.814724922180176, "global_step": 190044, "epoch": 1131} {"train_loss": -11.01365852355957, "global_step": 190045, "epoch": 1131} {"train_loss": -10.613940238952637, "global_step": 190046, "epoch": 1131} {"train_loss": -11.29377555847168, "global_step": 190047, "epoch": 1131} {"train_loss": -10.660585403442383, "global_step": 190048, "epoch": 1131} {"train_loss": -10.943878173828125, "global_step": 190049, "epoch": 1131} {"train_loss": -10.501516342163086, "global_step": 190050, "epoch": 1131} {"train_loss": -10.813716888427734, "global_step": 190051, "epoch": 1131} {"train_loss": -10.444930076599121, "global_step": 190052, "epoch": 1131} {"train_loss": -10.738911628723145, "global_step": 190053, "epoch": 1131} {"train_loss": -10.58205509185791, "global_step": 190054, "epoch": 1131} {"train_loss": -10.72615909576416, "global_step": 190055, "epoch": 1131} {"train_loss": -10.501849174499512, "global_step": 190056, "epoch": 1131} {"train_loss": -11.05540943145752, "global_step": 190057, "epoch": 1131} {"train_loss": -10.913511276245117, "global_step": 190058, "epoch": 1131} {"train_loss": -10.761221885681152, "global_step": 190059, "epoch": 1131} {"train_loss": -10.625530242919922, "global_step": 190060, "epoch": 1131} {"train_loss": -10.726871490478516, "global_step": 190061, "epoch": 1131} {"train_loss": -9.866201400756836, "global_step": 190062, "epoch": 1131} {"train_loss": -10.888158798217773, "global_step": 190063, "epoch": 1131} {"train_loss": -9.859756469726562, "global_step": 190064, "epoch": 1131} {"train_loss": -10.395896911621094, "global_step": 190065, "epoch": 1131} {"train_loss": -10.291915893554688, "global_step": 190066, "epoch": 1131} {"train_loss": -10.64954662322998, "global_step": 190067, "epoch": 1131} {"train_loss": -10.977581977844238, "global_step": 190068, "epoch": 1131} {"train_loss": -10.963973999023438, "global_step": 190069, "epoch": 1131} {"train_loss": -10.659235000610352, "global_step": 190070, "epoch": 1131} {"train_loss": -11.143051147460938, "global_step": 190071, "epoch": 1131} {"train_loss": -10.886510848999023, "global_step": 190072, "epoch": 1131} {"train_loss": -10.825722694396973, "global_step": 190073, "epoch": 1131} {"train_loss": -11.066180229187012, "global_step": 190074, "epoch": 1131} {"train_loss": -11.009417533874512, "global_step": 190075, "epoch": 1131} {"train_loss": -11.16970443725586, "global_step": 190076, "epoch": 1131} {"train_loss": -10.786144256591797, "global_step": 190077, "epoch": 1131} {"train_loss": -11.197476387023926, "global_step": 190078, "epoch": 1131} {"train_loss": -10.860651969909668, "global_step": 190079, "epoch": 1131} {"train_loss": -11.212488174438477, "global_step": 190080, "epoch": 1131} {"train_loss": -10.997528076171875, "global_step": 190081, "epoch": 1131} {"train_loss": -11.03386402130127, "global_step": 190082, "epoch": 1131} {"train_loss": -10.878623962402344, "global_step": 190083, "epoch": 1131} {"train_loss": -11.181703567504883, "global_step": 190084, "epoch": 1131} {"train_loss": -11.058640480041504, "global_step": 190085, "epoch": 1131} {"train_loss": -11.290261268615723, "global_step": 190086, "epoch": 1131} {"train_loss": -11.062993049621582, "global_step": 190087, "epoch": 1131} {"train_loss": -11.160603523254395, "global_step": 190088, "epoch": 1131} {"train_loss": -10.96065902709961, "global_step": 190089, "epoch": 1131} {"train_loss": -11.251035690307617, "global_step": 190090, "epoch": 1131} {"train_loss": -10.985254287719727, "global_step": 190091, "epoch": 1131} {"train_loss": -11.189984321594238, "global_step": 190092, "epoch": 1131} {"train_loss": -10.74418830871582, "global_step": 190093, "epoch": 1131} {"train_loss": -11.248200416564941, "global_step": 190094, "epoch": 1131} {"train_loss": -11.30369758605957, "global_step": 190095, "epoch": 1131} {"train_loss": -11.516729354858398, "global_step": 190096, "epoch": 1131} {"train_loss": -11.146913528442383, "global_step": 190097, "epoch": 1131} {"train_loss": -11.230005264282227, "global_step": 190098, "epoch": 1131} {"train_loss": -11.146747589111328, "global_step": 190099, "epoch": 1131} {"train_loss": -11.342693328857422, "global_step": 190100, "epoch": 1131} {"train_loss": -11.487707138061523, "global_step": 190101, "epoch": 1131} {"train_loss": -11.493453979492188, "global_step": 190102, "epoch": 1131} {"train_loss": -11.33750057220459, "global_step": 190103, "epoch": 1131} {"train_loss": -11.547708511352539, "global_step": 190104, "epoch": 1131} {"train_loss": -11.330816268920898, "global_step": 190105, "epoch": 1131} {"train_loss": -11.483957290649414, "global_step": 190106, "epoch": 1131} {"train_loss": -11.501092910766602, "global_step": 190107, "epoch": 1131} {"train_loss": -11.780200958251953, "global_step": 190108, "epoch": 1131} {"train_loss": -11.539668083190918, "global_step": 190109, "epoch": 1131} {"train_loss": -11.459861755371094, "global_step": 190110, "epoch": 1131} {"train_loss": -11.434099197387695, "global_step": 190111, "epoch": 1131} {"train_loss": -11.518194198608398, "global_step": 190112, "epoch": 1131} {"train_loss": -11.470678329467773, "global_step": 190113, "epoch": 1131} {"train_loss": -11.54000473022461, "global_step": 190114, "epoch": 1131} {"train_loss": -11.618087768554688, "global_step": 190115, "epoch": 1131} {"train_loss": -11.432600975036621, "global_step": 190116, "epoch": 1131} {"train_loss": -11.832460403442383, "global_step": 190117, "epoch": 1131} {"train_loss": -11.618217468261719, "global_step": 190118, "epoch": 1131} {"train_loss": -11.800019264221191, "global_step": 190119, "epoch": 1131} {"train_loss": -11.540862083435059, "global_step": 190120, "epoch": 1131} {"train_loss": -11.694968223571777, "global_step": 190121, "epoch": 1131} {"train_loss": -11.567044258117676, "global_step": 190122, "epoch": 1131} {"train_loss": -11.749807357788086, "global_step": 190123, "epoch": 1131} {"train_loss": -11.530054092407227, "global_step": 190124, "epoch": 1131} {"train_loss": -11.508234024047852, "global_step": 190125, "epoch": 1131} {"train_loss": -11.52306842803955, "global_step": 190126, "epoch": 1131} {"train_loss": -11.40353775024414, "global_step": 190127, "epoch": 1131} {"train_loss": -11.642398834228516, "global_step": 190128, "epoch": 1131} {"train_loss": -11.416975021362305, "global_step": 190129, "epoch": 1131} {"train_loss": -11.535848617553711, "global_step": 190130, "epoch": 1131} {"train_loss": -11.255632400512695, "global_step": 190131, "epoch": 1131} {"train_loss": -11.69973373413086, "global_step": 190132, "epoch": 1131} {"train_loss": -11.731485366821289, "global_step": 190133, "epoch": 1131} {"train_loss": -11.867040634155273, "global_step": 190134, "epoch": 1131} {"train_loss": -11.722494125366211, "global_step": 190135, "epoch": 1131} {"train_loss": -11.498353004455566, "global_step": 190136, "epoch": 1131} {"train_loss": -11.752683639526367, "global_step": 190137, "epoch": 1131} {"train_loss": -11.563041687011719, "global_step": 190138, "epoch": 1131} {"train_loss": -11.5675048828125, "global_step": 190139, "epoch": 1131} {"train_loss": -11.4347505569458, "global_step": 190140, "epoch": 1131} {"train_loss": -11.224809646606445, "global_step": 190141, "epoch": 1131} {"train_loss": -11.339394569396973, "global_step": 190142, "epoch": 1131} {"train_loss": -11.457762718200684, "global_step": 190143, "epoch": 1131} {"train_loss": -11.217377662658691, "global_step": 190144, "epoch": 1131} {"train_loss": -11.153042793273926, "global_step": 190145, "epoch": 1131} {"train_loss": -11.722816467285156, "global_step": 190146, "epoch": 1131} {"train_loss": -11.078248977661133, "global_step": 190147, "epoch": 1131} {"train_loss": -10.939340591430664, "global_step": 190148, "epoch": 1131} {"train_loss": -11.180788040161133, "global_step": 190149, "epoch": 1131} {"train_loss": -11.405949592590332, "global_step": 190150, "epoch": 1131} {"train_loss": -11.291293144226074, "global_step": 190151, "epoch": 1131} {"train_loss": -11.068347930908203, "global_step": 190152, "epoch": 1131} {"train_loss": -10.99439811706543, "global_step": 190153, "epoch": 1131} {"train_loss": -11.308544158935547, "global_step": 190154, "epoch": 1131} {"train_loss": -10.931050300598145, "global_step": 190155, "epoch": 1131} {"train_loss": -11.1978759765625, "global_step": 190156, "epoch": 1131} {"train_loss": -11.326498985290527, "global_step": 190157, "epoch": 1131} {"train_loss": -10.278691291809082, "global_step": 190158, "epoch": 1131} {"train_loss": -11.559799194335938, "global_step": 190159, "epoch": 1131} {"train_loss": -10.819867134094238, "global_step": 190160, "epoch": 1131} {"train_loss": -10.90578842163086, "global_step": 190161, "epoch": 1131} {"train_loss": -10.569355010986328, "global_step": 190162, "epoch": 1131} {"train_loss": -11.426555633544922, "global_step": 190163, "epoch": 1131} {"train_loss": -10.769392967224121, "global_step": 190164, "epoch": 1131} {"train_loss": -11.211708068847656, "global_step": 190165, "epoch": 1131} {"train_loss": -11.132164001464844, "global_step": 190166, "epoch": 1131} {"train_loss": -10.772745132446289, "global_step": 190167, "epoch": 1131} {"train_loss": -11.307403564453125, "global_step": 190168, "epoch": 1131} {"train_loss": -10.123387336730957, "global_step": 190169, "epoch": 1131} {"train_loss": -10.240266799926758, "global_step": 190170, "epoch": 1131} {"train_loss": -10.904394149780273, "global_step": 190171, "epoch": 1131} {"train_loss": -10.7142333984375, "global_step": 190172, "epoch": 1131} {"train_loss": -10.705242156982422, "global_step": 190173, "epoch": 1131} {"train_loss": -10.994470596313477, "global_step": 190174, "epoch": 1131} {"train_loss": -11.136638930865697, "global_step": 190175, "epoch": 1131, "val_loss": 248017.046875} {"train_loss": -9.998273849487305, "global_step": 190176, "epoch": 1132} {"train_loss": -9.909400939941406, "global_step": 190177, "epoch": 1132} {"train_loss": -10.687725067138672, "global_step": 190178, "epoch": 1132} {"train_loss": -10.523710250854492, "global_step": 190179, "epoch": 1132} {"train_loss": -10.770004272460938, "global_step": 190180, "epoch": 1132} {"train_loss": -10.872458457946777, "global_step": 190181, "epoch": 1132} {"train_loss": -10.971643447875977, "global_step": 190182, "epoch": 1132} {"train_loss": -10.646781921386719, "global_step": 190183, "epoch": 1132} {"train_loss": -11.011951446533203, "global_step": 190184, "epoch": 1132} {"train_loss": -10.293012619018555, "global_step": 190185, "epoch": 1132} {"train_loss": -10.922686576843262, "global_step": 190186, "epoch": 1132} {"train_loss": -10.34622859954834, "global_step": 190187, "epoch": 1132} {"train_loss": -10.471887588500977, "global_step": 190188, "epoch": 1132} {"train_loss": -9.811899185180664, "global_step": 190189, "epoch": 1132} {"train_loss": -10.923521995544434, "global_step": 190190, "epoch": 1132} {"train_loss": -9.8391752243042, "global_step": 190191, "epoch": 1132} {"train_loss": -10.179572105407715, "global_step": 190192, "epoch": 1132} {"train_loss": -9.804960250854492, "global_step": 190193, "epoch": 1132} {"train_loss": -10.66490364074707, "global_step": 190194, "epoch": 1132} {"train_loss": -10.038066864013672, "global_step": 190195, "epoch": 1132} {"train_loss": -10.749815940856934, "global_step": 190196, "epoch": 1132} {"train_loss": -10.432427406311035, "global_step": 190197, "epoch": 1132} {"train_loss": -10.750320434570312, "global_step": 190198, "epoch": 1132} {"train_loss": -10.895691871643066, "global_step": 190199, "epoch": 1132} {"train_loss": -10.887415885925293, "global_step": 190200, "epoch": 1132} {"train_loss": -10.918624877929688, "global_step": 190201, "epoch": 1132} {"train_loss": -10.627555847167969, "global_step": 190202, "epoch": 1132} {"train_loss": -11.100289344787598, "global_step": 190203, "epoch": 1132} {"train_loss": -11.094583511352539, "global_step": 190204, "epoch": 1132} {"train_loss": -10.913819313049316, "global_step": 190205, "epoch": 1132} {"train_loss": -11.319197654724121, "global_step": 190206, "epoch": 1132} {"train_loss": -11.028496742248535, "global_step": 190207, "epoch": 1132} {"train_loss": -11.06428050994873, "global_step": 190208, "epoch": 1132} {"train_loss": -11.232457160949707, "global_step": 190209, "epoch": 1132} {"train_loss": -11.185260772705078, "global_step": 190210, "epoch": 1132} {"train_loss": -11.22361946105957, "global_step": 190211, "epoch": 1132} {"train_loss": -11.252918243408203, "global_step": 190212, "epoch": 1132} {"train_loss": -11.301496505737305, "global_step": 190213, "epoch": 1132} {"train_loss": -11.312999725341797, "global_step": 190214, "epoch": 1132} {"train_loss": -11.373489379882812, "global_step": 190215, "epoch": 1132} {"train_loss": -11.314870834350586, "global_step": 190216, "epoch": 1132} {"train_loss": -11.20072078704834, "global_step": 190217, "epoch": 1132} {"train_loss": -11.308454513549805, "global_step": 190218, "epoch": 1132} {"train_loss": -11.36621379852295, "global_step": 190219, "epoch": 1132} {"train_loss": -11.250445365905762, "global_step": 190220, "epoch": 1132} {"train_loss": -11.378870964050293, "global_step": 190221, "epoch": 1132} {"train_loss": -11.241998672485352, "global_step": 190222, "epoch": 1132} {"train_loss": -11.424591064453125, "global_step": 190223, "epoch": 1132} {"train_loss": -11.475204467773438, "global_step": 190224, "epoch": 1132} {"train_loss": -11.487634658813477, "global_step": 190225, "epoch": 1132} {"train_loss": -11.545087814331055, "global_step": 190226, "epoch": 1132} {"train_loss": -11.554065704345703, "global_step": 190227, "epoch": 1132} {"train_loss": -11.425552368164062, "global_step": 190228, "epoch": 1132} {"train_loss": -11.480745315551758, "global_step": 190229, "epoch": 1132} {"train_loss": -11.407587051391602, "global_step": 190230, "epoch": 1132} {"train_loss": -11.522048950195312, "global_step": 190231, "epoch": 1132} {"train_loss": -11.404702186584473, "global_step": 190232, "epoch": 1132} {"train_loss": -11.540024757385254, "global_step": 190233, "epoch": 1132} {"train_loss": -11.337389945983887, "global_step": 190234, "epoch": 1132} {"train_loss": -11.511592864990234, "global_step": 190235, "epoch": 1132} {"train_loss": -11.40487289428711, "global_step": 190236, "epoch": 1132} {"train_loss": -11.545608520507812, "global_step": 190237, "epoch": 1132} {"train_loss": -11.700740814208984, "global_step": 190238, "epoch": 1132} {"train_loss": -11.587871551513672, "global_step": 190239, "epoch": 1132} {"train_loss": -11.663978576660156, "global_step": 190240, "epoch": 1132} {"train_loss": -11.308893203735352, "global_step": 190241, "epoch": 1132} {"train_loss": -11.447275161743164, "global_step": 190242, "epoch": 1132} {"train_loss": -11.526603698730469, "global_step": 190243, "epoch": 1132} {"train_loss": -11.680105209350586, "global_step": 190244, "epoch": 1132} {"train_loss": -11.55724811553955, "global_step": 190245, "epoch": 1132} {"train_loss": -11.668399810791016, "global_step": 190246, "epoch": 1132} {"train_loss": -11.494979858398438, "global_step": 190247, "epoch": 1132} {"train_loss": -11.667583465576172, "global_step": 190248, "epoch": 1132} {"train_loss": -11.613700866699219, "global_step": 190249, "epoch": 1132} {"train_loss": -11.579608917236328, "global_step": 190250, "epoch": 1132} {"train_loss": -11.619546890258789, "global_step": 190251, "epoch": 1132} {"train_loss": -11.881675720214844, "global_step": 190252, "epoch": 1132} {"train_loss": -11.708683013916016, "global_step": 190253, "epoch": 1132} {"train_loss": -11.76987075805664, "global_step": 190254, "epoch": 1132} {"train_loss": -11.550304412841797, "global_step": 190255, "epoch": 1132} {"train_loss": -11.843708992004395, "global_step": 190256, "epoch": 1132} {"train_loss": -11.606977462768555, "global_step": 190257, "epoch": 1132} {"train_loss": -11.31000804901123, "global_step": 190258, "epoch": 1132} {"train_loss": -11.2181396484375, "global_step": 190259, "epoch": 1132} {"train_loss": -11.395030975341797, "global_step": 190260, "epoch": 1132} {"train_loss": -11.562410354614258, "global_step": 190261, "epoch": 1132} {"train_loss": -11.4781494140625, "global_step": 190262, "epoch": 1132} {"train_loss": -11.426746368408203, "global_step": 190263, "epoch": 1132} {"train_loss": -11.25614070892334, "global_step": 190264, "epoch": 1132} {"train_loss": -11.591890335083008, "global_step": 190265, "epoch": 1132} {"train_loss": -11.219110488891602, "global_step": 190266, "epoch": 1132} {"train_loss": -11.61993408203125, "global_step": 190267, "epoch": 1132} {"train_loss": -11.404157638549805, "global_step": 190268, "epoch": 1132} {"train_loss": -11.109021186828613, "global_step": 190269, "epoch": 1132} {"train_loss": -10.36976432800293, "global_step": 190270, "epoch": 1132} {"train_loss": -11.41734790802002, "global_step": 190271, "epoch": 1132} {"train_loss": -10.752913475036621, "global_step": 190272, "epoch": 1132} {"train_loss": -8.7517671585083, "global_step": 190273, "epoch": 1132} {"train_loss": -10.626737594604492, "global_step": 190274, "epoch": 1132} {"train_loss": -10.804386138916016, "global_step": 190275, "epoch": 1132} {"train_loss": -10.75405502319336, "global_step": 190276, "epoch": 1132} {"train_loss": -10.401309967041016, "global_step": 190277, "epoch": 1132} {"train_loss": -10.98976993560791, "global_step": 190278, "epoch": 1132} {"train_loss": -10.324199676513672, "global_step": 190279, "epoch": 1132} {"train_loss": -11.125640869140625, "global_step": 190280, "epoch": 1132} {"train_loss": -10.952539443969727, "global_step": 190281, "epoch": 1132} {"train_loss": -10.603559494018555, "global_step": 190282, "epoch": 1132} {"train_loss": -10.053354263305664, "global_step": 190283, "epoch": 1132} {"train_loss": -10.823695182800293, "global_step": 190284, "epoch": 1132} {"train_loss": -10.10047721862793, "global_step": 190285, "epoch": 1132} {"train_loss": -10.076009750366211, "global_step": 190286, "epoch": 1132} {"train_loss": -10.545753479003906, "global_step": 190287, "epoch": 1132} {"train_loss": -10.221900939941406, "global_step": 190288, "epoch": 1132} {"train_loss": -10.094276428222656, "global_step": 190289, "epoch": 1132} {"train_loss": -10.645560264587402, "global_step": 190290, "epoch": 1132} {"train_loss": -10.64920425415039, "global_step": 190291, "epoch": 1132} {"train_loss": -10.48957633972168, "global_step": 190292, "epoch": 1132} {"train_loss": -10.481407165527344, "global_step": 190293, "epoch": 1132} {"train_loss": -11.062241554260254, "global_step": 190294, "epoch": 1132} {"train_loss": -10.501181602478027, "global_step": 190295, "epoch": 1132} {"train_loss": -10.65542984008789, "global_step": 190296, "epoch": 1132} {"train_loss": -10.684724807739258, "global_step": 190297, "epoch": 1132} {"train_loss": -10.739710807800293, "global_step": 190298, "epoch": 1132} {"train_loss": -10.484132766723633, "global_step": 190299, "epoch": 1132} {"train_loss": -11.011323928833008, "global_step": 190300, "epoch": 1132} {"train_loss": -10.642850875854492, "global_step": 190301, "epoch": 1132} {"train_loss": -11.022497177124023, "global_step": 190302, "epoch": 1132} {"train_loss": -10.698941230773926, "global_step": 190303, "epoch": 1132} {"train_loss": -10.797597885131836, "global_step": 190304, "epoch": 1132} {"train_loss": -10.92294692993164, "global_step": 190305, "epoch": 1132} {"train_loss": -10.92104434967041, "global_step": 190306, "epoch": 1132} {"train_loss": -10.783369064331055, "global_step": 190307, "epoch": 1132} {"train_loss": -11.160173416137695, "global_step": 190308, "epoch": 1132} {"train_loss": -10.930852890014648, "global_step": 190309, "epoch": 1132} {"train_loss": -10.859354019165039, "global_step": 190310, "epoch": 1132} {"train_loss": -11.10155963897705, "global_step": 190311, "epoch": 1132} {"train_loss": -11.182369232177734, "global_step": 190312, "epoch": 1132} {"train_loss": -10.967214584350586, "global_step": 190313, "epoch": 1132} {"train_loss": -11.062271118164062, "global_step": 190314, "epoch": 1132} {"train_loss": -10.987854957580566, "global_step": 190315, "epoch": 1132} {"train_loss": -11.2787446975708, "global_step": 190316, "epoch": 1132} {"train_loss": -11.08287525177002, "global_step": 190317, "epoch": 1132} {"train_loss": -11.033926963806152, "global_step": 190318, "epoch": 1132} {"train_loss": -11.357620239257812, "global_step": 190319, "epoch": 1132} {"train_loss": -11.330368041992188, "global_step": 190320, "epoch": 1132} {"train_loss": -11.190849304199219, "global_step": 190321, "epoch": 1132} {"train_loss": -11.155357360839844, "global_step": 190322, "epoch": 1132} {"train_loss": -11.266082763671875, "global_step": 190323, "epoch": 1132} {"train_loss": -11.525224685668945, "global_step": 190324, "epoch": 1132} {"train_loss": -11.277019500732422, "global_step": 190325, "epoch": 1132} {"train_loss": -11.43267822265625, "global_step": 190326, "epoch": 1132} {"train_loss": -11.44304370880127, "global_step": 190327, "epoch": 1132} {"train_loss": -11.331171989440918, "global_step": 190328, "epoch": 1132} {"train_loss": -11.47000503540039, "global_step": 190329, "epoch": 1132} {"train_loss": -11.518804550170898, "global_step": 190330, "epoch": 1132} {"train_loss": -11.577800750732422, "global_step": 190331, "epoch": 1132} {"train_loss": -11.490468978881836, "global_step": 190332, "epoch": 1132} {"train_loss": -11.444819450378418, "global_step": 190333, "epoch": 1132} {"train_loss": -11.45247745513916, "global_step": 190334, "epoch": 1132} {"train_loss": -11.596139907836914, "global_step": 190335, "epoch": 1132} {"train_loss": -11.665863037109375, "global_step": 190336, "epoch": 1132} {"train_loss": -11.58001708984375, "global_step": 190337, "epoch": 1132} {"train_loss": -11.728582382202148, "global_step": 190338, "epoch": 1132} {"train_loss": -11.752756118774414, "global_step": 190339, "epoch": 1132} {"train_loss": -11.608352661132812, "global_step": 190340, "epoch": 1132} {"train_loss": -11.464599609375, "global_step": 190341, "epoch": 1132} {"train_loss": -11.612541198730469, "global_step": 190342, "epoch": 1132} {"train_loss": -11.077219139961969, "global_step": 190343, "epoch": 1132, "val_loss": 249317.984375} {"train_loss": -11.614007949829102, "global_step": 190344, "epoch": 1133} {"train_loss": -11.721267700195312, "global_step": 190345, "epoch": 1133} {"train_loss": -11.747611045837402, "global_step": 190346, "epoch": 1133} {"train_loss": -11.709083557128906, "global_step": 190347, "epoch": 1133} {"train_loss": -11.697200775146484, "global_step": 190348, "epoch": 1133} {"train_loss": -11.824334144592285, "global_step": 190349, "epoch": 1133} {"train_loss": -11.785564422607422, "global_step": 190350, "epoch": 1133} {"train_loss": -11.693363189697266, "global_step": 190351, "epoch": 1133} {"train_loss": -11.741666793823242, "global_step": 190352, "epoch": 1133} {"train_loss": -11.762543678283691, "global_step": 190353, "epoch": 1133} {"train_loss": -11.653116226196289, "global_step": 190354, "epoch": 1133} {"train_loss": -11.833341598510742, "global_step": 190355, "epoch": 1133} {"train_loss": -11.652616500854492, "global_step": 190356, "epoch": 1133} {"train_loss": -11.893494606018066, "global_step": 190357, "epoch": 1133} {"train_loss": -11.758816719055176, "global_step": 190358, "epoch": 1133} {"train_loss": -11.42624568939209, "global_step": 190359, "epoch": 1133} {"train_loss": -10.727709770202637, "global_step": 190360, "epoch": 1133} {"train_loss": -10.270181655883789, "global_step": 190361, "epoch": 1133} {"train_loss": -11.377885818481445, "global_step": 190362, "epoch": 1133} {"train_loss": -11.322858810424805, "global_step": 190363, "epoch": 1133} {"train_loss": -10.534158706665039, "global_step": 190364, "epoch": 1133} {"train_loss": -11.491270065307617, "global_step": 190365, "epoch": 1133} {"train_loss": -11.491321563720703, "global_step": 190366, "epoch": 1133} {"train_loss": -10.391042709350586, "global_step": 190367, "epoch": 1133} {"train_loss": -11.263608932495117, "global_step": 190368, "epoch": 1133} {"train_loss": -11.39892578125, "global_step": 190369, "epoch": 1133} {"train_loss": -11.014392852783203, "global_step": 190370, "epoch": 1133} {"train_loss": -11.323326110839844, "global_step": 190371, "epoch": 1133} {"train_loss": -11.767746925354004, "global_step": 190372, "epoch": 1133} {"train_loss": -10.917387008666992, "global_step": 190373, "epoch": 1133} {"train_loss": -11.148271560668945, "global_step": 190374, "epoch": 1133} {"train_loss": -11.415447235107422, "global_step": 190375, "epoch": 1133} {"train_loss": -11.123199462890625, "global_step": 190376, "epoch": 1133} {"train_loss": -11.200855255126953, "global_step": 190377, "epoch": 1133} {"train_loss": -11.210476875305176, "global_step": 190378, "epoch": 1133} {"train_loss": -11.071776390075684, "global_step": 190379, "epoch": 1133} {"train_loss": -11.402506828308105, "global_step": 190380, "epoch": 1133} {"train_loss": -11.076395034790039, "global_step": 190381, "epoch": 1133} {"train_loss": -11.518665313720703, "global_step": 190382, "epoch": 1133} {"train_loss": -11.268415451049805, "global_step": 190383, "epoch": 1133} {"train_loss": -10.979065895080566, "global_step": 190384, "epoch": 1133} {"train_loss": -11.001588821411133, "global_step": 190385, "epoch": 1133} {"train_loss": -10.811948776245117, "global_step": 190386, "epoch": 1133} {"train_loss": -11.547805786132812, "global_step": 190387, "epoch": 1133} {"train_loss": -11.131379127502441, "global_step": 190388, "epoch": 1133} {"train_loss": -10.895301818847656, "global_step": 190389, "epoch": 1133} {"train_loss": -10.414554595947266, "global_step": 190390, "epoch": 1133} {"train_loss": -11.11971378326416, "global_step": 190391, "epoch": 1133} {"train_loss": -10.721319198608398, "global_step": 190392, "epoch": 1133} {"train_loss": -10.89708137512207, "global_step": 190393, "epoch": 1133} {"train_loss": -11.29920768737793, "global_step": 190394, "epoch": 1133} {"train_loss": -10.962761878967285, "global_step": 190395, "epoch": 1133} {"train_loss": -11.20763111114502, "global_step": 190396, "epoch": 1133} {"train_loss": -11.091503143310547, "global_step": 190397, "epoch": 1133} {"train_loss": -11.137717247009277, "global_step": 190398, "epoch": 1133} {"train_loss": -11.364503860473633, "global_step": 190399, "epoch": 1133} {"train_loss": -11.207430839538574, "global_step": 190400, "epoch": 1133} {"train_loss": -11.331006050109863, "global_step": 190401, "epoch": 1133} {"train_loss": -11.038772583007812, "global_step": 190402, "epoch": 1133} {"train_loss": -11.339168548583984, "global_step": 190403, "epoch": 1133} {"train_loss": -11.402397155761719, "global_step": 190404, "epoch": 1133} {"train_loss": -11.566264152526855, "global_step": 190405, "epoch": 1133} {"train_loss": -11.418642044067383, "global_step": 190406, "epoch": 1133} {"train_loss": -11.615429878234863, "global_step": 190407, "epoch": 1133} {"train_loss": -11.28734016418457, "global_step": 190408, "epoch": 1133} {"train_loss": -11.262845993041992, "global_step": 190409, "epoch": 1133} {"train_loss": -11.475626945495605, "global_step": 190410, "epoch": 1133} {"train_loss": -11.439738273620605, "global_step": 190411, "epoch": 1133} {"train_loss": -11.397216796875, "global_step": 190412, "epoch": 1133} {"train_loss": -11.304020881652832, "global_step": 190413, "epoch": 1133} {"train_loss": -11.5593900680542, "global_step": 190414, "epoch": 1133} {"train_loss": -11.419821739196777, "global_step": 190415, "epoch": 1133} {"train_loss": -11.0887451171875, "global_step": 190416, "epoch": 1133} {"train_loss": -11.396381378173828, "global_step": 190417, "epoch": 1133} {"train_loss": -11.182613372802734, "global_step": 190418, "epoch": 1133} {"train_loss": -10.529150009155273, "global_step": 190419, "epoch": 1133} {"train_loss": -11.385719299316406, "global_step": 190420, "epoch": 1133} {"train_loss": -10.943351745605469, "global_step": 190421, "epoch": 1133} {"train_loss": -10.978726387023926, "global_step": 190422, "epoch": 1133} {"train_loss": -11.125738143920898, "global_step": 190423, "epoch": 1133} {"train_loss": -10.344510078430176, "global_step": 190424, "epoch": 1133} {"train_loss": -9.248435020446777, "global_step": 190425, "epoch": 1133} {"train_loss": -11.224700927734375, "global_step": 190426, "epoch": 1133} {"train_loss": -9.662511825561523, "global_step": 190427, "epoch": 1133} {"train_loss": -10.125296592712402, "global_step": 190428, "epoch": 1133} {"train_loss": -10.609840393066406, "global_step": 190429, "epoch": 1133} {"train_loss": -10.045215606689453, "global_step": 190430, "epoch": 1133} {"train_loss": -9.647237777709961, "global_step": 190431, "epoch": 1133} {"train_loss": -9.644522666931152, "global_step": 190432, "epoch": 1133} {"train_loss": -10.257593154907227, "global_step": 190433, "epoch": 1133} {"train_loss": -10.46009635925293, "global_step": 190434, "epoch": 1133} {"train_loss": -10.10798454284668, "global_step": 190435, "epoch": 1133} {"train_loss": -10.010236740112305, "global_step": 190436, "epoch": 1133} {"train_loss": -10.877833366394043, "global_step": 190437, "epoch": 1133} {"train_loss": -9.346260070800781, "global_step": 190438, "epoch": 1133} {"train_loss": -10.94454574584961, "global_step": 190439, "epoch": 1133} {"train_loss": -10.047956466674805, "global_step": 190440, "epoch": 1133} {"train_loss": -10.689241409301758, "global_step": 190441, "epoch": 1133} {"train_loss": -10.776525497436523, "global_step": 190442, "epoch": 1133} {"train_loss": -10.298418045043945, "global_step": 190443, "epoch": 1133} {"train_loss": -10.78840160369873, "global_step": 190444, "epoch": 1133} {"train_loss": -11.028329849243164, "global_step": 190445, "epoch": 1133} {"train_loss": -10.350576400756836, "global_step": 190446, "epoch": 1133} {"train_loss": -11.143993377685547, "global_step": 190447, "epoch": 1133} {"train_loss": -10.367597579956055, "global_step": 190448, "epoch": 1133} {"train_loss": -10.977936744689941, "global_step": 190449, "epoch": 1133} {"train_loss": -10.429308891296387, "global_step": 190450, "epoch": 1133} {"train_loss": -10.945964813232422, "global_step": 190451, "epoch": 1133} {"train_loss": -10.196707725524902, "global_step": 190452, "epoch": 1133} {"train_loss": -10.788159370422363, "global_step": 190453, "epoch": 1133} {"train_loss": -10.301273345947266, "global_step": 190454, "epoch": 1133} {"train_loss": -11.16552734375, "global_step": 190455, "epoch": 1133} {"train_loss": -11.109870910644531, "global_step": 190456, "epoch": 1133} {"train_loss": -10.691797256469727, "global_step": 190457, "epoch": 1133} {"train_loss": -11.00474739074707, "global_step": 190458, "epoch": 1133} {"train_loss": -11.043031692504883, "global_step": 190459, "epoch": 1133} {"train_loss": -11.267546653747559, "global_step": 190460, "epoch": 1133} {"train_loss": -10.844222068786621, "global_step": 190461, "epoch": 1133} {"train_loss": -11.204365730285645, "global_step": 190462, "epoch": 1133} {"train_loss": -10.924829483032227, "global_step": 190463, "epoch": 1133} {"train_loss": -11.297615051269531, "global_step": 190464, "epoch": 1133} {"train_loss": -11.176675796508789, "global_step": 190465, "epoch": 1133} {"train_loss": -10.975390434265137, "global_step": 190466, "epoch": 1133} {"train_loss": -11.215805053710938, "global_step": 190467, "epoch": 1133} {"train_loss": -11.239921569824219, "global_step": 190468, "epoch": 1133} {"train_loss": -11.002918243408203, "global_step": 190469, "epoch": 1133} {"train_loss": -10.93187141418457, "global_step": 190470, "epoch": 1133} {"train_loss": -11.262081146240234, "global_step": 190471, "epoch": 1133} {"train_loss": -10.960794448852539, "global_step": 190472, "epoch": 1133} {"train_loss": -11.183740615844727, "global_step": 190473, "epoch": 1133} {"train_loss": -11.1251859664917, "global_step": 190474, "epoch": 1133} {"train_loss": -11.127941131591797, "global_step": 190475, "epoch": 1133} {"train_loss": -11.125692367553711, "global_step": 190476, "epoch": 1133} {"train_loss": -10.914308547973633, "global_step": 190477, "epoch": 1133} {"train_loss": -10.929677963256836, "global_step": 190478, "epoch": 1133} {"train_loss": -11.244373321533203, "global_step": 190479, "epoch": 1133} {"train_loss": -11.240604400634766, "global_step": 190480, "epoch": 1133} {"train_loss": -11.214094161987305, "global_step": 190481, "epoch": 1133} {"train_loss": -11.248271942138672, "global_step": 190482, "epoch": 1133} {"train_loss": -11.101862907409668, "global_step": 190483, "epoch": 1133} {"train_loss": -11.372350692749023, "global_step": 190484, "epoch": 1133} {"train_loss": -11.018946647644043, "global_step": 190485, "epoch": 1133} {"train_loss": -11.460489273071289, "global_step": 190486, "epoch": 1133} {"train_loss": -11.24659252166748, "global_step": 190487, "epoch": 1133} {"train_loss": -11.421087265014648, "global_step": 190488, "epoch": 1133} {"train_loss": -11.468215942382812, "global_step": 190489, "epoch": 1133} {"train_loss": -11.308343887329102, "global_step": 190490, "epoch": 1133} {"train_loss": -11.534090042114258, "global_step": 190491, "epoch": 1133} {"train_loss": -11.31660270690918, "global_step": 190492, "epoch": 1133} {"train_loss": -11.52634334564209, "global_step": 190493, "epoch": 1133} {"train_loss": -11.511486053466797, "global_step": 190494, "epoch": 1133} {"train_loss": -11.52752685546875, "global_step": 190495, "epoch": 1133} {"train_loss": -11.440643310546875, "global_step": 190496, "epoch": 1133} {"train_loss": -11.660381317138672, "global_step": 190497, "epoch": 1133} {"train_loss": -11.752277374267578, "global_step": 190498, "epoch": 1133} {"train_loss": -11.612384796142578, "global_step": 190499, "epoch": 1133} {"train_loss": -11.542596817016602, "global_step": 190500, "epoch": 1133} {"train_loss": -11.474666595458984, "global_step": 190501, "epoch": 1133} {"train_loss": -11.512414932250977, "global_step": 190502, "epoch": 1133} {"train_loss": -11.336892127990723, "global_step": 190503, "epoch": 1133} {"train_loss": -11.693252563476562, "global_step": 190504, "epoch": 1133} {"train_loss": -11.501628875732422, "global_step": 190505, "epoch": 1133} {"train_loss": -11.654701232910156, "global_step": 190506, "epoch": 1133} {"train_loss": -11.598119735717773, "global_step": 190507, "epoch": 1133} {"train_loss": -11.663642883300781, "global_step": 190508, "epoch": 1133} {"train_loss": -11.586298942565918, "global_step": 190509, "epoch": 1133} {"train_loss": -11.569402694702148, "global_step": 190510, "epoch": 1133} {"train_loss": -11.118511813027519, "global_step": 190511, "epoch": 1133, "val_loss": 249476.1875} {"train_loss": -11.531903266906738, "global_step": 190512, "epoch": 1134} {"train_loss": -11.702420234680176, "global_step": 190513, "epoch": 1134} {"train_loss": -11.628618240356445, "global_step": 190514, "epoch": 1134} {"train_loss": -11.361101150512695, "global_step": 190515, "epoch": 1134} {"train_loss": -10.992650985717773, "global_step": 190516, "epoch": 1134} {"train_loss": -11.263895034790039, "global_step": 190517, "epoch": 1134} {"train_loss": -11.493181228637695, "global_step": 190518, "epoch": 1134} {"train_loss": -11.611095428466797, "global_step": 190519, "epoch": 1134} {"train_loss": -11.286678314208984, "global_step": 190520, "epoch": 1134} {"train_loss": -11.202096939086914, "global_step": 190521, "epoch": 1134} {"train_loss": -10.495232582092285, "global_step": 190522, "epoch": 1134} {"train_loss": -10.910240173339844, "global_step": 190523, "epoch": 1134} {"train_loss": -11.238617897033691, "global_step": 190524, "epoch": 1134} {"train_loss": -10.573352813720703, "global_step": 190525, "epoch": 1134} {"train_loss": -10.443882942199707, "global_step": 190526, "epoch": 1134} {"train_loss": -11.040340423583984, "global_step": 190527, "epoch": 1134} {"train_loss": -10.847860336303711, "global_step": 190528, "epoch": 1134} {"train_loss": -9.6981201171875, "global_step": 190529, "epoch": 1134} {"train_loss": -11.025696754455566, "global_step": 190530, "epoch": 1134} {"train_loss": -11.174701690673828, "global_step": 190531, "epoch": 1134} {"train_loss": -10.80626392364502, "global_step": 190532, "epoch": 1134} {"train_loss": -10.584099769592285, "global_step": 190533, "epoch": 1134} {"train_loss": -11.059798240661621, "global_step": 190534, "epoch": 1134} {"train_loss": -10.915599822998047, "global_step": 190535, "epoch": 1134} {"train_loss": -11.335458755493164, "global_step": 190536, "epoch": 1134} {"train_loss": -11.11431884765625, "global_step": 190537, "epoch": 1134} {"train_loss": -11.119882583618164, "global_step": 190538, "epoch": 1134} {"train_loss": -11.130532264709473, "global_step": 190539, "epoch": 1134} {"train_loss": -11.28276252746582, "global_step": 190540, "epoch": 1134} {"train_loss": -11.113370895385742, "global_step": 190541, "epoch": 1134} {"train_loss": -11.408483505249023, "global_step": 190542, "epoch": 1134} {"train_loss": -11.239644050598145, "global_step": 190543, "epoch": 1134} {"train_loss": -11.435903549194336, "global_step": 190544, "epoch": 1134} {"train_loss": -11.040882110595703, "global_step": 190545, "epoch": 1134} {"train_loss": -11.098742485046387, "global_step": 190546, "epoch": 1134} {"train_loss": -11.101358413696289, "global_step": 190547, "epoch": 1134} {"train_loss": -10.986849784851074, "global_step": 190548, "epoch": 1134} {"train_loss": -11.430683135986328, "global_step": 190549, "epoch": 1134} {"train_loss": -11.322348594665527, "global_step": 190550, "epoch": 1134} {"train_loss": -11.123393058776855, "global_step": 190551, "epoch": 1134} {"train_loss": -10.732468605041504, "global_step": 190552, "epoch": 1134} {"train_loss": -11.361675262451172, "global_step": 190553, "epoch": 1134} {"train_loss": -11.054020881652832, "global_step": 190554, "epoch": 1134} {"train_loss": -10.623735427856445, "global_step": 190555, "epoch": 1134} {"train_loss": -11.43941593170166, "global_step": 190556, "epoch": 1134} {"train_loss": -10.650419235229492, "global_step": 190557, "epoch": 1134} {"train_loss": -11.318575859069824, "global_step": 190558, "epoch": 1134} {"train_loss": -10.7669677734375, "global_step": 190559, "epoch": 1134} {"train_loss": -11.213698387145996, "global_step": 190560, "epoch": 1134} {"train_loss": -11.123701095581055, "global_step": 190561, "epoch": 1134} {"train_loss": -10.893033981323242, "global_step": 190562, "epoch": 1134} {"train_loss": -10.995635986328125, "global_step": 190563, "epoch": 1134} {"train_loss": -10.89490032196045, "global_step": 190564, "epoch": 1134} {"train_loss": -11.289522171020508, "global_step": 190565, "epoch": 1134} {"train_loss": -10.845396041870117, "global_step": 190566, "epoch": 1134} {"train_loss": -11.186306953430176, "global_step": 190567, "epoch": 1134} {"train_loss": -11.062555313110352, "global_step": 190568, "epoch": 1134} {"train_loss": -11.288076400756836, "global_step": 190569, "epoch": 1134} {"train_loss": -11.048125267028809, "global_step": 190570, "epoch": 1134} {"train_loss": -11.205541610717773, "global_step": 190571, "epoch": 1134} {"train_loss": -11.37269401550293, "global_step": 190572, "epoch": 1134} {"train_loss": -11.015830039978027, "global_step": 190573, "epoch": 1134} {"train_loss": -11.033540725708008, "global_step": 190574, "epoch": 1134} {"train_loss": -11.237020492553711, "global_step": 190575, "epoch": 1134} {"train_loss": -11.376564025878906, "global_step": 190576, "epoch": 1134} {"train_loss": -11.211938858032227, "global_step": 190577, "epoch": 1134} {"train_loss": -11.313077926635742, "global_step": 190578, "epoch": 1134} {"train_loss": -11.314884185791016, "global_step": 190579, "epoch": 1134} {"train_loss": -11.405580520629883, "global_step": 190580, "epoch": 1134} {"train_loss": -11.707807540893555, "global_step": 190581, "epoch": 1134} {"train_loss": -11.335806846618652, "global_step": 190582, "epoch": 1134} {"train_loss": -11.481735229492188, "global_step": 190583, "epoch": 1134} {"train_loss": -11.262189865112305, "global_step": 190584, "epoch": 1134} {"train_loss": -11.46042251586914, "global_step": 190585, "epoch": 1134} {"train_loss": -11.32944107055664, "global_step": 190586, "epoch": 1134} {"train_loss": -11.375821113586426, "global_step": 190587, "epoch": 1134} {"train_loss": -11.206652641296387, "global_step": 190588, "epoch": 1134} {"train_loss": -11.482532501220703, "global_step": 190589, "epoch": 1134} {"train_loss": -11.57396411895752, "global_step": 190590, "epoch": 1134} {"train_loss": -11.524353981018066, "global_step": 190591, "epoch": 1134} {"train_loss": -11.469734191894531, "global_step": 190592, "epoch": 1134} {"train_loss": -11.444894790649414, "global_step": 190593, "epoch": 1134} {"train_loss": -11.570898056030273, "global_step": 190594, "epoch": 1134} {"train_loss": -11.359766960144043, "global_step": 190595, "epoch": 1134} {"train_loss": -11.753907203674316, "global_step": 190596, "epoch": 1134} {"train_loss": -11.410785675048828, "global_step": 190597, "epoch": 1134} {"train_loss": -11.555227279663086, "global_step": 190598, "epoch": 1134} {"train_loss": -11.7296724319458, "global_step": 190599, "epoch": 1134} {"train_loss": -11.501192092895508, "global_step": 190600, "epoch": 1134} {"train_loss": -11.245784759521484, "global_step": 190601, "epoch": 1134} {"train_loss": -11.348395347595215, "global_step": 190602, "epoch": 1134} {"train_loss": -11.380800247192383, "global_step": 190603, "epoch": 1134} {"train_loss": -11.489795684814453, "global_step": 190604, "epoch": 1134} {"train_loss": -10.993593215942383, "global_step": 190605, "epoch": 1134} {"train_loss": -11.565455436706543, "global_step": 190606, "epoch": 1134} {"train_loss": -10.933704376220703, "global_step": 190607, "epoch": 1134} {"train_loss": -10.856243133544922, "global_step": 190608, "epoch": 1134} {"train_loss": -11.488828659057617, "global_step": 190609, "epoch": 1134} {"train_loss": -11.222332954406738, "global_step": 190610, "epoch": 1134} {"train_loss": -11.130912780761719, "global_step": 190611, "epoch": 1134} {"train_loss": -11.521278381347656, "global_step": 190612, "epoch": 1134} {"train_loss": -11.743901252746582, "global_step": 190613, "epoch": 1134} {"train_loss": -11.480701446533203, "global_step": 190614, "epoch": 1134} {"train_loss": -11.184037208557129, "global_step": 190615, "epoch": 1134} {"train_loss": -11.422099113464355, "global_step": 190616, "epoch": 1134} {"train_loss": -11.574546813964844, "global_step": 190617, "epoch": 1134} {"train_loss": -11.597362518310547, "global_step": 190618, "epoch": 1134} {"train_loss": -11.480528831481934, "global_step": 190619, "epoch": 1134} {"train_loss": -11.594587326049805, "global_step": 190620, "epoch": 1134} {"train_loss": -11.642923355102539, "global_step": 190621, "epoch": 1134} {"train_loss": -11.490214347839355, "global_step": 190622, "epoch": 1134} {"train_loss": -11.300743103027344, "global_step": 190623, "epoch": 1134} {"train_loss": -11.249187469482422, "global_step": 190624, "epoch": 1134} {"train_loss": -11.448665618896484, "global_step": 190625, "epoch": 1134} {"train_loss": -11.508502960205078, "global_step": 190626, "epoch": 1134} {"train_loss": -11.102535247802734, "global_step": 190627, "epoch": 1134} {"train_loss": -11.518508911132812, "global_step": 190628, "epoch": 1134} {"train_loss": -11.515270233154297, "global_step": 190629, "epoch": 1134} {"train_loss": -11.373706817626953, "global_step": 190630, "epoch": 1134} {"train_loss": -11.296768188476562, "global_step": 190631, "epoch": 1134} {"train_loss": -11.19529914855957, "global_step": 190632, "epoch": 1134} {"train_loss": -11.075886726379395, "global_step": 190633, "epoch": 1134} {"train_loss": -11.068428039550781, "global_step": 190634, "epoch": 1134} {"train_loss": -11.438031196594238, "global_step": 190635, "epoch": 1134} {"train_loss": -11.201241493225098, "global_step": 190636, "epoch": 1134} {"train_loss": -11.107540130615234, "global_step": 190637, "epoch": 1134} {"train_loss": -10.776969909667969, "global_step": 190638, "epoch": 1134} {"train_loss": -11.46424388885498, "global_step": 190639, "epoch": 1134} {"train_loss": -10.995200157165527, "global_step": 190640, "epoch": 1134} {"train_loss": -10.60586929321289, "global_step": 190641, "epoch": 1134} {"train_loss": -11.017674446105957, "global_step": 190642, "epoch": 1134} {"train_loss": -11.504108428955078, "global_step": 190643, "epoch": 1134} {"train_loss": -11.232799530029297, "global_step": 190644, "epoch": 1134} {"train_loss": -10.613679885864258, "global_step": 190645, "epoch": 1134} {"train_loss": -10.990293502807617, "global_step": 190646, "epoch": 1134} {"train_loss": -11.540552139282227, "global_step": 190647, "epoch": 1134} {"train_loss": -10.728818893432617, "global_step": 190648, "epoch": 1134} {"train_loss": -10.943005561828613, "global_step": 190649, "epoch": 1134} {"train_loss": -11.393796920776367, "global_step": 190650, "epoch": 1134} {"train_loss": -10.531538963317871, "global_step": 190651, "epoch": 1134} {"train_loss": -11.102928161621094, "global_step": 190652, "epoch": 1134} {"train_loss": -10.184322357177734, "global_step": 190653, "epoch": 1134} {"train_loss": -11.39395523071289, "global_step": 190654, "epoch": 1134} {"train_loss": -10.578859329223633, "global_step": 190655, "epoch": 1134} {"train_loss": -11.376352310180664, "global_step": 190656, "epoch": 1134} {"train_loss": -11.425726890563965, "global_step": 190657, "epoch": 1134} {"train_loss": -10.867552757263184, "global_step": 190658, "epoch": 1134} {"train_loss": -11.240813255310059, "global_step": 190659, "epoch": 1134} {"train_loss": -10.912750244140625, "global_step": 190660, "epoch": 1134} {"train_loss": -11.21497917175293, "global_step": 190661, "epoch": 1134} {"train_loss": -11.242237091064453, "global_step": 190662, "epoch": 1134} {"train_loss": -11.127365112304688, "global_step": 190663, "epoch": 1134} {"train_loss": -11.47330093383789, "global_step": 190664, "epoch": 1134} {"train_loss": -11.365711212158203, "global_step": 190665, "epoch": 1134} {"train_loss": -11.473926544189453, "global_step": 190666, "epoch": 1134} {"train_loss": -11.433300018310547, "global_step": 190667, "epoch": 1134} {"train_loss": -11.388914108276367, "global_step": 190668, "epoch": 1134} {"train_loss": -11.086142539978027, "global_step": 190669, "epoch": 1134} {"train_loss": -11.243741035461426, "global_step": 190670, "epoch": 1134} {"train_loss": -10.709338188171387, "global_step": 190671, "epoch": 1134} {"train_loss": -11.37806510925293, "global_step": 190672, "epoch": 1134} {"train_loss": -11.032885551452637, "global_step": 190673, "epoch": 1134} {"train_loss": -11.392631530761719, "global_step": 190674, "epoch": 1134} {"train_loss": -11.076736450195312, "global_step": 190675, "epoch": 1134} {"train_loss": -11.40908145904541, "global_step": 190676, "epoch": 1134} {"train_loss": -11.243885040283203, "global_step": 190677, "epoch": 1134} {"train_loss": -11.274791717529297, "global_step": 190678, "epoch": 1134} {"train_loss": -11.207138237499056, "global_step": 190679, "epoch": 1134, "val_loss": 250480.453125} {"train_loss": -11.171785354614258, "global_step": 190680, "epoch": 1135} {"train_loss": -11.389023780822754, "global_step": 190681, "epoch": 1135} {"train_loss": -10.986234664916992, "global_step": 190682, "epoch": 1135} {"train_loss": -10.928417205810547, "global_step": 190683, "epoch": 1135} {"train_loss": -10.92244815826416, "global_step": 190684, "epoch": 1135} {"train_loss": -11.056122779846191, "global_step": 190685, "epoch": 1135} {"train_loss": -10.805191040039062, "global_step": 190686, "epoch": 1135} {"train_loss": -11.41588306427002, "global_step": 190687, "epoch": 1135} {"train_loss": -11.253396034240723, "global_step": 190688, "epoch": 1135} {"train_loss": -11.257580757141113, "global_step": 190689, "epoch": 1135} {"train_loss": -11.361769676208496, "global_step": 190690, "epoch": 1135} {"train_loss": -11.268226623535156, "global_step": 190691, "epoch": 1135} {"train_loss": -11.42849063873291, "global_step": 190692, "epoch": 1135} {"train_loss": -11.390501022338867, "global_step": 190693, "epoch": 1135} {"train_loss": -11.569812774658203, "global_step": 190694, "epoch": 1135} {"train_loss": -11.500711441040039, "global_step": 190695, "epoch": 1135} {"train_loss": -11.433164596557617, "global_step": 190696, "epoch": 1135} {"train_loss": -11.387507438659668, "global_step": 190697, "epoch": 1135} {"train_loss": -11.35795783996582, "global_step": 190698, "epoch": 1135} {"train_loss": -11.469205856323242, "global_step": 190699, "epoch": 1135} {"train_loss": -11.229985237121582, "global_step": 190700, "epoch": 1135} {"train_loss": -11.575759887695312, "global_step": 190701, "epoch": 1135} {"train_loss": -11.460436820983887, "global_step": 190702, "epoch": 1135} {"train_loss": -11.777442932128906, "global_step": 190703, "epoch": 1135} {"train_loss": -11.527030944824219, "global_step": 190704, "epoch": 1135} {"train_loss": -11.439191818237305, "global_step": 190705, "epoch": 1135} {"train_loss": -11.493976593017578, "global_step": 190706, "epoch": 1135} {"train_loss": -11.512409210205078, "global_step": 190707, "epoch": 1135} {"train_loss": -11.027948379516602, "global_step": 190708, "epoch": 1135} {"train_loss": -11.577288627624512, "global_step": 190709, "epoch": 1135} {"train_loss": -11.50786018371582, "global_step": 190710, "epoch": 1135} {"train_loss": -11.163390159606934, "global_step": 190711, "epoch": 1135} {"train_loss": -11.625656127929688, "global_step": 190712, "epoch": 1135} {"train_loss": -11.129926681518555, "global_step": 190713, "epoch": 1135} {"train_loss": -11.406608581542969, "global_step": 190714, "epoch": 1135} {"train_loss": -11.229633331298828, "global_step": 190715, "epoch": 1135} {"train_loss": -11.330942153930664, "global_step": 190716, "epoch": 1135} {"train_loss": -11.03283405303955, "global_step": 190717, "epoch": 1135} {"train_loss": -11.452993392944336, "global_step": 190718, "epoch": 1135} {"train_loss": -10.878490447998047, "global_step": 190719, "epoch": 1135} {"train_loss": -11.500924110412598, "global_step": 190720, "epoch": 1135} {"train_loss": -11.152884483337402, "global_step": 190721, "epoch": 1135} {"train_loss": -11.269052505493164, "global_step": 190722, "epoch": 1135} {"train_loss": -11.595799446105957, "global_step": 190723, "epoch": 1135} {"train_loss": -11.45279598236084, "global_step": 190724, "epoch": 1135} {"train_loss": -11.171602249145508, "global_step": 190725, "epoch": 1135} {"train_loss": -11.205869674682617, "global_step": 190726, "epoch": 1135} {"train_loss": -10.922258377075195, "global_step": 190727, "epoch": 1135} {"train_loss": -11.170022964477539, "global_step": 190728, "epoch": 1135} {"train_loss": -10.99980640411377, "global_step": 190729, "epoch": 1135} {"train_loss": -10.050813674926758, "global_step": 190730, "epoch": 1135} {"train_loss": -11.392118453979492, "global_step": 190731, "epoch": 1135} {"train_loss": -10.744410514831543, "global_step": 190732, "epoch": 1135} {"train_loss": -10.791065216064453, "global_step": 190733, "epoch": 1135} {"train_loss": -10.79788875579834, "global_step": 190734, "epoch": 1135} {"train_loss": -11.243900299072266, "global_step": 190735, "epoch": 1135} {"train_loss": -10.728113174438477, "global_step": 190736, "epoch": 1135} {"train_loss": -11.488043785095215, "global_step": 190737, "epoch": 1135} {"train_loss": -10.989850044250488, "global_step": 190738, "epoch": 1135} {"train_loss": -11.263223648071289, "global_step": 190739, "epoch": 1135} {"train_loss": -10.479681015014648, "global_step": 190740, "epoch": 1135} {"train_loss": -11.290886878967285, "global_step": 190741, "epoch": 1135} {"train_loss": -11.258056640625, "global_step": 190742, "epoch": 1135} {"train_loss": -11.004979133605957, "global_step": 190743, "epoch": 1135} {"train_loss": -11.028820037841797, "global_step": 190744, "epoch": 1135} {"train_loss": -11.13070297241211, "global_step": 190745, "epoch": 1135} {"train_loss": -10.909369468688965, "global_step": 190746, "epoch": 1135} {"train_loss": -10.996854782104492, "global_step": 190747, "epoch": 1135} {"train_loss": -11.050946235656738, "global_step": 190748, "epoch": 1135} {"train_loss": -10.803585052490234, "global_step": 190749, "epoch": 1135} {"train_loss": -10.788122177124023, "global_step": 190750, "epoch": 1135} {"train_loss": -11.011611938476562, "global_step": 190751, "epoch": 1135} {"train_loss": -11.486438751220703, "global_step": 190752, "epoch": 1135} {"train_loss": -11.105287551879883, "global_step": 190753, "epoch": 1135} {"train_loss": -11.16564655303955, "global_step": 190754, "epoch": 1135} {"train_loss": -10.85735034942627, "global_step": 190755, "epoch": 1135} {"train_loss": -10.996875762939453, "global_step": 190756, "epoch": 1135} {"train_loss": -10.430879592895508, "global_step": 190757, "epoch": 1135} {"train_loss": -10.632489204406738, "global_step": 190758, "epoch": 1135} {"train_loss": -9.460590362548828, "global_step": 190759, "epoch": 1135} {"train_loss": -9.968561172485352, "global_step": 190760, "epoch": 1135} {"train_loss": -9.17258071899414, "global_step": 190761, "epoch": 1135} {"train_loss": -10.630008697509766, "global_step": 190762, "epoch": 1135} {"train_loss": -10.282296180725098, "global_step": 190763, "epoch": 1135} {"train_loss": -10.633403778076172, "global_step": 190764, "epoch": 1135} {"train_loss": -10.99622631072998, "global_step": 190765, "epoch": 1135} {"train_loss": -10.567588806152344, "global_step": 190766, "epoch": 1135} {"train_loss": -11.032358169555664, "global_step": 190767, "epoch": 1135} {"train_loss": -10.569356918334961, "global_step": 190768, "epoch": 1135} {"train_loss": -10.703564643859863, "global_step": 190769, "epoch": 1135} {"train_loss": -10.080317497253418, "global_step": 190770, "epoch": 1135} {"train_loss": -10.809309959411621, "global_step": 190771, "epoch": 1135} {"train_loss": -10.952972412109375, "global_step": 190772, "epoch": 1135} {"train_loss": -11.067564010620117, "global_step": 190773, "epoch": 1135} {"train_loss": -10.457620620727539, "global_step": 190774, "epoch": 1135} {"train_loss": -11.041259765625, "global_step": 190775, "epoch": 1135} {"train_loss": -10.164320945739746, "global_step": 190776, "epoch": 1135} {"train_loss": -11.085921287536621, "global_step": 190777, "epoch": 1135} {"train_loss": -10.774089813232422, "global_step": 190778, "epoch": 1135} {"train_loss": -11.29255485534668, "global_step": 190779, "epoch": 1135} {"train_loss": -11.066862106323242, "global_step": 190780, "epoch": 1135} {"train_loss": -11.161145210266113, "global_step": 190781, "epoch": 1135} {"train_loss": -11.060829162597656, "global_step": 190782, "epoch": 1135} {"train_loss": -11.398355484008789, "global_step": 190783, "epoch": 1135} {"train_loss": -11.28814697265625, "global_step": 190784, "epoch": 1135} {"train_loss": -11.02249813079834, "global_step": 190785, "epoch": 1135} {"train_loss": -11.280740737915039, "global_step": 190786, "epoch": 1135} {"train_loss": -11.062568664550781, "global_step": 190787, "epoch": 1135} {"train_loss": -11.232544898986816, "global_step": 190788, "epoch": 1135} {"train_loss": -11.47407341003418, "global_step": 190789, "epoch": 1135} {"train_loss": -11.176133155822754, "global_step": 190790, "epoch": 1135} {"train_loss": -11.38643741607666, "global_step": 190791, "epoch": 1135} {"train_loss": -11.519254684448242, "global_step": 190792, "epoch": 1135} {"train_loss": -11.371329307556152, "global_step": 190793, "epoch": 1135} {"train_loss": -11.297184944152832, "global_step": 190794, "epoch": 1135} {"train_loss": -11.305231094360352, "global_step": 190795, "epoch": 1135} {"train_loss": -11.01885986328125, "global_step": 190796, "epoch": 1135} {"train_loss": -11.392230987548828, "global_step": 190797, "epoch": 1135} {"train_loss": -11.296350479125977, "global_step": 190798, "epoch": 1135} {"train_loss": -11.21943473815918, "global_step": 190799, "epoch": 1135} {"train_loss": -11.44623851776123, "global_step": 190800, "epoch": 1135} {"train_loss": -11.436619758605957, "global_step": 190801, "epoch": 1135} {"train_loss": -11.368102073669434, "global_step": 190802, "epoch": 1135} {"train_loss": -11.482993125915527, "global_step": 190803, "epoch": 1135} {"train_loss": -11.441884994506836, "global_step": 190804, "epoch": 1135} {"train_loss": -11.457270622253418, "global_step": 190805, "epoch": 1135} {"train_loss": -11.517948150634766, "global_step": 190806, "epoch": 1135} {"train_loss": -11.685282707214355, "global_step": 190807, "epoch": 1135} {"train_loss": -11.546548843383789, "global_step": 190808, "epoch": 1135} {"train_loss": -11.751102447509766, "global_step": 190809, "epoch": 1135} {"train_loss": -11.77818489074707, "global_step": 190810, "epoch": 1135} {"train_loss": -11.653727531433105, "global_step": 190811, "epoch": 1135} {"train_loss": -11.664609909057617, "global_step": 190812, "epoch": 1135} {"train_loss": -11.607270240783691, "global_step": 190813, "epoch": 1135} {"train_loss": -11.628327369689941, "global_step": 190814, "epoch": 1135} {"train_loss": -11.692090034484863, "global_step": 190815, "epoch": 1135} {"train_loss": -11.639202117919922, "global_step": 190816, "epoch": 1135} {"train_loss": -11.282037734985352, "global_step": 190817, "epoch": 1135} {"train_loss": -11.498226165771484, "global_step": 190818, "epoch": 1135} {"train_loss": -11.44679069519043, "global_step": 190819, "epoch": 1135} {"train_loss": -11.39661693572998, "global_step": 190820, "epoch": 1135} {"train_loss": -11.468971252441406, "global_step": 190821, "epoch": 1135} {"train_loss": -11.437396049499512, "global_step": 190822, "epoch": 1135} {"train_loss": -11.762727737426758, "global_step": 190823, "epoch": 1135} {"train_loss": -11.323518753051758, "global_step": 190824, "epoch": 1135} {"train_loss": -11.776390075683594, "global_step": 190825, "epoch": 1135} {"train_loss": -11.387473106384277, "global_step": 190826, "epoch": 1135} {"train_loss": -11.631828308105469, "global_step": 190827, "epoch": 1135} {"train_loss": -11.586965560913086, "global_step": 190828, "epoch": 1135} {"train_loss": -11.258245468139648, "global_step": 190829, "epoch": 1135} {"train_loss": -11.626338958740234, "global_step": 190830, "epoch": 1135} {"train_loss": -11.540725708007812, "global_step": 190831, "epoch": 1135} {"train_loss": -11.363889694213867, "global_step": 190832, "epoch": 1135} {"train_loss": -11.341365814208984, "global_step": 190833, "epoch": 1135} {"train_loss": -11.711339950561523, "global_step": 190834, "epoch": 1135} {"train_loss": -11.466081619262695, "global_step": 190835, "epoch": 1135} {"train_loss": -11.133350372314453, "global_step": 190836, "epoch": 1135} {"train_loss": -11.428321838378906, "global_step": 190837, "epoch": 1135} {"train_loss": -11.610284805297852, "global_step": 190838, "epoch": 1135} {"train_loss": -11.28310489654541, "global_step": 190839, "epoch": 1135} {"train_loss": -10.93368148803711, "global_step": 190840, "epoch": 1135} {"train_loss": -11.33774185180664, "global_step": 190841, "epoch": 1135} {"train_loss": -11.343118667602539, "global_step": 190842, "epoch": 1135} {"train_loss": -11.716109275817871, "global_step": 190843, "epoch": 1135} {"train_loss": -11.719326972961426, "global_step": 190844, "epoch": 1135} {"train_loss": -11.543453216552734, "global_step": 190845, "epoch": 1135} {"train_loss": -11.53158950805664, "global_step": 190846, "epoch": 1135} {"train_loss": -11.201979273841495, "global_step": 190847, "epoch": 1135, "val_loss": 248588.0, "train_action_mse_error": 0.475214421749115} {"train_loss": -11.633350372314453, "global_step": 190848, "epoch": 1136} {"train_loss": -11.736967086791992, "global_step": 190849, "epoch": 1136} {"train_loss": -11.477468490600586, "global_step": 190850, "epoch": 1136} {"train_loss": -11.353334426879883, "global_step": 190851, "epoch": 1136} {"train_loss": -11.505990982055664, "global_step": 190852, "epoch": 1136} {"train_loss": -11.536637306213379, "global_step": 190853, "epoch": 1136} {"train_loss": -11.744638442993164, "global_step": 190854, "epoch": 1136} {"train_loss": -11.490589141845703, "global_step": 190855, "epoch": 1136} {"train_loss": -11.529590606689453, "global_step": 190856, "epoch": 1136} {"train_loss": -11.486038208007812, "global_step": 190857, "epoch": 1136} {"train_loss": -11.36677360534668, "global_step": 190858, "epoch": 1136} {"train_loss": -10.948314666748047, "global_step": 190859, "epoch": 1136} {"train_loss": -10.797170639038086, "global_step": 190860, "epoch": 1136} {"train_loss": -11.453707695007324, "global_step": 190861, "epoch": 1136} {"train_loss": -11.551660537719727, "global_step": 190862, "epoch": 1136} {"train_loss": -11.015619277954102, "global_step": 190863, "epoch": 1136} {"train_loss": -10.883272171020508, "global_step": 190864, "epoch": 1136} {"train_loss": -10.489736557006836, "global_step": 190865, "epoch": 1136} {"train_loss": -11.198200225830078, "global_step": 190866, "epoch": 1136} {"train_loss": -10.340097427368164, "global_step": 190867, "epoch": 1136} {"train_loss": -10.429553985595703, "global_step": 190868, "epoch": 1136} {"train_loss": -10.381647109985352, "global_step": 190869, "epoch": 1136} {"train_loss": -8.556745529174805, "global_step": 190870, "epoch": 1136} {"train_loss": -10.097270965576172, "global_step": 190871, "epoch": 1136} {"train_loss": -8.127100944519043, "global_step": 190872, "epoch": 1136} {"train_loss": -8.303457260131836, "global_step": 190873, "epoch": 1136} {"train_loss": -9.477594375610352, "global_step": 190874, "epoch": 1136} {"train_loss": -9.318194389343262, "global_step": 190875, "epoch": 1136} {"train_loss": -9.83414077758789, "global_step": 190876, "epoch": 1136} {"train_loss": -9.870386123657227, "global_step": 190877, "epoch": 1136} {"train_loss": -9.931591033935547, "global_step": 190878, "epoch": 1136} {"train_loss": -9.90260124206543, "global_step": 190879, "epoch": 1136} {"train_loss": -10.142646789550781, "global_step": 190880, "epoch": 1136} {"train_loss": -10.59772777557373, "global_step": 190881, "epoch": 1136} {"train_loss": -10.309456825256348, "global_step": 190882, "epoch": 1136} {"train_loss": -10.54517936706543, "global_step": 190883, "epoch": 1136} {"train_loss": -10.305532455444336, "global_step": 190884, "epoch": 1136} {"train_loss": -10.490804672241211, "global_step": 190885, "epoch": 1136} {"train_loss": -10.507838249206543, "global_step": 190886, "epoch": 1136} {"train_loss": -10.433144569396973, "global_step": 190887, "epoch": 1136} {"train_loss": -10.95094108581543, "global_step": 190888, "epoch": 1136} {"train_loss": -10.411934852600098, "global_step": 190889, "epoch": 1136} {"train_loss": -10.902667045593262, "global_step": 190890, "epoch": 1136} {"train_loss": -10.445610046386719, "global_step": 190891, "epoch": 1136} {"train_loss": -10.64065170288086, "global_step": 190892, "epoch": 1136} {"train_loss": -10.795148849487305, "global_step": 190893, "epoch": 1136} {"train_loss": -10.888267517089844, "global_step": 190894, "epoch": 1136} {"train_loss": -10.618583679199219, "global_step": 190895, "epoch": 1136} {"train_loss": -11.096531867980957, "global_step": 190896, "epoch": 1136} {"train_loss": -10.916959762573242, "global_step": 190897, "epoch": 1136} {"train_loss": -10.798632621765137, "global_step": 190898, "epoch": 1136} {"train_loss": -10.783712387084961, "global_step": 190899, "epoch": 1136} {"train_loss": -10.725421905517578, "global_step": 190900, "epoch": 1136} {"train_loss": -10.70678424835205, "global_step": 190901, "epoch": 1136} {"train_loss": -11.050853729248047, "global_step": 190902, "epoch": 1136} {"train_loss": -10.985421180725098, "global_step": 190903, "epoch": 1136} {"train_loss": -10.87984561920166, "global_step": 190904, "epoch": 1136} {"train_loss": -11.105674743652344, "global_step": 190905, "epoch": 1136} {"train_loss": -11.091330528259277, "global_step": 190906, "epoch": 1136} {"train_loss": -10.977914810180664, "global_step": 190907, "epoch": 1136} {"train_loss": -11.307491302490234, "global_step": 190908, "epoch": 1136} {"train_loss": -11.212089538574219, "global_step": 190909, "epoch": 1136} {"train_loss": -11.314709663391113, "global_step": 190910, "epoch": 1136} {"train_loss": -11.063460350036621, "global_step": 190911, "epoch": 1136} {"train_loss": -11.075080871582031, "global_step": 190912, "epoch": 1136} {"train_loss": -11.206803321838379, "global_step": 190913, "epoch": 1136} {"train_loss": -11.126683235168457, "global_step": 190914, "epoch": 1136} {"train_loss": -11.265380859375, "global_step": 190915, "epoch": 1136} {"train_loss": -11.051900863647461, "global_step": 190916, "epoch": 1136} {"train_loss": -11.064696311950684, "global_step": 190917, "epoch": 1136} {"train_loss": -11.245018005371094, "global_step": 190918, "epoch": 1136} {"train_loss": -11.285276412963867, "global_step": 190919, "epoch": 1136} {"train_loss": -11.052312850952148, "global_step": 190920, "epoch": 1136} {"train_loss": -11.396480560302734, "global_step": 190921, "epoch": 1136} {"train_loss": -11.124372482299805, "global_step": 190922, "epoch": 1136} {"train_loss": -11.3370361328125, "global_step": 190923, "epoch": 1136} {"train_loss": -11.192252159118652, "global_step": 190924, "epoch": 1136} {"train_loss": -10.9839506149292, "global_step": 190925, "epoch": 1136} {"train_loss": -11.145782470703125, "global_step": 190926, "epoch": 1136} {"train_loss": -11.311777114868164, "global_step": 190927, "epoch": 1136} {"train_loss": -11.537421226501465, "global_step": 190928, "epoch": 1136} {"train_loss": -11.187236785888672, "global_step": 190929, "epoch": 1136} {"train_loss": -11.32303237915039, "global_step": 190930, "epoch": 1136} {"train_loss": -11.338702201843262, "global_step": 190931, "epoch": 1136} {"train_loss": -11.279072761535645, "global_step": 190932, "epoch": 1136} {"train_loss": -11.197134017944336, "global_step": 190933, "epoch": 1136} {"train_loss": -11.28131103515625, "global_step": 190934, "epoch": 1136} {"train_loss": -11.343368530273438, "global_step": 190935, "epoch": 1136} {"train_loss": -11.292143821716309, "global_step": 190936, "epoch": 1136} {"train_loss": -11.06936264038086, "global_step": 190937, "epoch": 1136} {"train_loss": -11.515125274658203, "global_step": 190938, "epoch": 1136} {"train_loss": -11.160198211669922, "global_step": 190939, "epoch": 1136} {"train_loss": -11.350589752197266, "global_step": 190940, "epoch": 1136} {"train_loss": -11.368467330932617, "global_step": 190941, "epoch": 1136} {"train_loss": -11.577703475952148, "global_step": 190942, "epoch": 1136} {"train_loss": -11.439838409423828, "global_step": 190943, "epoch": 1136} {"train_loss": -11.327796936035156, "global_step": 190944, "epoch": 1136} {"train_loss": -11.410212516784668, "global_step": 190945, "epoch": 1136} {"train_loss": -11.622686386108398, "global_step": 190946, "epoch": 1136} {"train_loss": -11.604898452758789, "global_step": 190947, "epoch": 1136} {"train_loss": -11.651329040527344, "global_step": 190948, "epoch": 1136} {"train_loss": -11.592241287231445, "global_step": 190949, "epoch": 1136} {"train_loss": -11.527434349060059, "global_step": 190950, "epoch": 1136} {"train_loss": -11.612752914428711, "global_step": 190951, "epoch": 1136} {"train_loss": -11.556062698364258, "global_step": 190952, "epoch": 1136} {"train_loss": -11.600894927978516, "global_step": 190953, "epoch": 1136} {"train_loss": -11.43774127960205, "global_step": 190954, "epoch": 1136} {"train_loss": -11.714117050170898, "global_step": 190955, "epoch": 1136} {"train_loss": -11.674149513244629, "global_step": 190956, "epoch": 1136} {"train_loss": -11.449264526367188, "global_step": 190957, "epoch": 1136} {"train_loss": -11.768142700195312, "global_step": 190958, "epoch": 1136} {"train_loss": -11.496399879455566, "global_step": 190959, "epoch": 1136} {"train_loss": -11.680145263671875, "global_step": 190960, "epoch": 1136} {"train_loss": -11.405572891235352, "global_step": 190961, "epoch": 1136} {"train_loss": -11.575518608093262, "global_step": 190962, "epoch": 1136} {"train_loss": -11.806621551513672, "global_step": 190963, "epoch": 1136} {"train_loss": -11.600669860839844, "global_step": 190964, "epoch": 1136} {"train_loss": -11.498485565185547, "global_step": 190965, "epoch": 1136} {"train_loss": -11.65152359008789, "global_step": 190966, "epoch": 1136} {"train_loss": -11.668148040771484, "global_step": 190967, "epoch": 1136} {"train_loss": -11.71829605102539, "global_step": 190968, "epoch": 1136} {"train_loss": -11.686055183410645, "global_step": 190969, "epoch": 1136} {"train_loss": -11.477457046508789, "global_step": 190970, "epoch": 1136} {"train_loss": -11.668495178222656, "global_step": 190971, "epoch": 1136} {"train_loss": -11.520198822021484, "global_step": 190972, "epoch": 1136} {"train_loss": -11.435426712036133, "global_step": 190973, "epoch": 1136} {"train_loss": -11.277830123901367, "global_step": 190974, "epoch": 1136} {"train_loss": -11.46683120727539, "global_step": 190975, "epoch": 1136} {"train_loss": -11.408297538757324, "global_step": 190976, "epoch": 1136} {"train_loss": -11.102832794189453, "global_step": 190977, "epoch": 1136} {"train_loss": -11.58646011352539, "global_step": 190978, "epoch": 1136} {"train_loss": -11.26754093170166, "global_step": 190979, "epoch": 1136} {"train_loss": -11.904778480529785, "global_step": 190980, "epoch": 1136} {"train_loss": -11.652685165405273, "global_step": 190981, "epoch": 1136} {"train_loss": -11.590703010559082, "global_step": 190982, "epoch": 1136} {"train_loss": -11.926576614379883, "global_step": 190983, "epoch": 1136} {"train_loss": -11.44652271270752, "global_step": 190984, "epoch": 1136} {"train_loss": -11.458292007446289, "global_step": 190985, "epoch": 1136} {"train_loss": -11.678561210632324, "global_step": 190986, "epoch": 1136} {"train_loss": -11.643640518188477, "global_step": 190987, "epoch": 1136} {"train_loss": -11.150306701660156, "global_step": 190988, "epoch": 1136} {"train_loss": -10.908172607421875, "global_step": 190989, "epoch": 1136} {"train_loss": -10.393197059631348, "global_step": 190990, "epoch": 1136} {"train_loss": -11.168041229248047, "global_step": 190991, "epoch": 1136} {"train_loss": -10.718379974365234, "global_step": 190992, "epoch": 1136} {"train_loss": -10.560420036315918, "global_step": 190993, "epoch": 1136} {"train_loss": -11.178112030029297, "global_step": 190994, "epoch": 1136} {"train_loss": -10.841928482055664, "global_step": 190995, "epoch": 1136} {"train_loss": -10.37529182434082, "global_step": 190996, "epoch": 1136} {"train_loss": -9.873607635498047, "global_step": 190997, "epoch": 1136} {"train_loss": -10.582479476928711, "global_step": 190998, "epoch": 1136} {"train_loss": -10.40797233581543, "global_step": 190999, "epoch": 1136} {"train_loss": -10.491229057312012, "global_step": 191000, "epoch": 1136} {"train_loss": -9.91641616821289, "global_step": 191001, "epoch": 1136} {"train_loss": -10.6881742477417, "global_step": 191002, "epoch": 1136} {"train_loss": -10.519121170043945, "global_step": 191003, "epoch": 1136} {"train_loss": -10.743963241577148, "global_step": 191004, "epoch": 1136} {"train_loss": -9.952609062194824, "global_step": 191005, "epoch": 1136} {"train_loss": -10.495083808898926, "global_step": 191006, "epoch": 1136} {"train_loss": -10.77511978149414, "global_step": 191007, "epoch": 1136} {"train_loss": -11.148682594299316, "global_step": 191008, "epoch": 1136} {"train_loss": -10.472869873046875, "global_step": 191009, "epoch": 1136} {"train_loss": -10.846399307250977, "global_step": 191010, "epoch": 1136} {"train_loss": -10.999011039733887, "global_step": 191011, "epoch": 1136} {"train_loss": -10.661691665649414, "global_step": 191012, "epoch": 1136} {"train_loss": -11.455501556396484, "global_step": 191013, "epoch": 1136} {"train_loss": -11.139626502990723, "global_step": 191014, "epoch": 1136} {"train_loss": -11.032172106561207, "global_step": 191015, "epoch": 1136, "val_loss": 244022.65625} {"train_loss": -10.664019584655762, "global_step": 191016, "epoch": 1137} {"train_loss": -11.254352569580078, "global_step": 191017, "epoch": 1137} {"train_loss": -10.467743873596191, "global_step": 191018, "epoch": 1137} {"train_loss": -11.030637741088867, "global_step": 191019, "epoch": 1137} {"train_loss": -10.868894577026367, "global_step": 191020, "epoch": 1137} {"train_loss": -10.915704727172852, "global_step": 191021, "epoch": 1137} {"train_loss": -10.842422485351562, "global_step": 191022, "epoch": 1137} {"train_loss": -11.038362503051758, "global_step": 191023, "epoch": 1137} {"train_loss": -10.6721830368042, "global_step": 191024, "epoch": 1137} {"train_loss": -11.205194473266602, "global_step": 191025, "epoch": 1137} {"train_loss": -10.855108261108398, "global_step": 191026, "epoch": 1137} {"train_loss": -10.944659233093262, "global_step": 191027, "epoch": 1137} {"train_loss": -10.828466415405273, "global_step": 191028, "epoch": 1137} {"train_loss": -11.069219589233398, "global_step": 191029, "epoch": 1137} {"train_loss": -10.571985244750977, "global_step": 191030, "epoch": 1137} {"train_loss": -11.099464416503906, "global_step": 191031, "epoch": 1137} {"train_loss": -10.785005569458008, "global_step": 191032, "epoch": 1137} {"train_loss": -10.972845077514648, "global_step": 191033, "epoch": 1137} {"train_loss": -10.439420700073242, "global_step": 191034, "epoch": 1137} {"train_loss": -10.712465286254883, "global_step": 191035, "epoch": 1137} {"train_loss": -10.73922061920166, "global_step": 191036, "epoch": 1137} {"train_loss": -11.326879501342773, "global_step": 191037, "epoch": 1137} {"train_loss": -10.582952499389648, "global_step": 191038, "epoch": 1137} {"train_loss": -11.287467956542969, "global_step": 191039, "epoch": 1137} {"train_loss": -10.827291488647461, "global_step": 191040, "epoch": 1137} {"train_loss": -11.039496421813965, "global_step": 191041, "epoch": 1137} {"train_loss": -11.3449125289917, "global_step": 191042, "epoch": 1137} {"train_loss": -11.111516952514648, "global_step": 191043, "epoch": 1137} {"train_loss": -11.290788650512695, "global_step": 191044, "epoch": 1137} {"train_loss": -11.232248306274414, "global_step": 191045, "epoch": 1137} {"train_loss": -11.015541076660156, "global_step": 191046, "epoch": 1137} {"train_loss": -11.362424850463867, "global_step": 191047, "epoch": 1137} {"train_loss": -11.170671463012695, "global_step": 191048, "epoch": 1137} {"train_loss": -11.274728775024414, "global_step": 191049, "epoch": 1137} {"train_loss": -11.256912231445312, "global_step": 191050, "epoch": 1137} {"train_loss": -11.414225578308105, "global_step": 191051, "epoch": 1137} {"train_loss": -11.435750007629395, "global_step": 191052, "epoch": 1137} {"train_loss": -11.55915641784668, "global_step": 191053, "epoch": 1137} {"train_loss": -11.510848999023438, "global_step": 191054, "epoch": 1137} {"train_loss": -11.321261405944824, "global_step": 191055, "epoch": 1137} {"train_loss": -11.10692310333252, "global_step": 191056, "epoch": 1137} {"train_loss": -11.235418319702148, "global_step": 191057, "epoch": 1137} {"train_loss": -11.14202880859375, "global_step": 191058, "epoch": 1137} {"train_loss": -11.341571807861328, "global_step": 191059, "epoch": 1137} {"train_loss": -11.180743217468262, "global_step": 191060, "epoch": 1137} {"train_loss": -11.14427375793457, "global_step": 191061, "epoch": 1137} {"train_loss": -11.317551612854004, "global_step": 191062, "epoch": 1137} {"train_loss": -11.279951095581055, "global_step": 191063, "epoch": 1137} {"train_loss": -11.23289680480957, "global_step": 191064, "epoch": 1137} {"train_loss": -11.380809783935547, "global_step": 191065, "epoch": 1137} {"train_loss": -10.997949600219727, "global_step": 191066, "epoch": 1137} {"train_loss": -11.19318962097168, "global_step": 191067, "epoch": 1137} {"train_loss": -10.817583084106445, "global_step": 191068, "epoch": 1137} {"train_loss": -11.00387191772461, "global_step": 191069, "epoch": 1137} {"train_loss": -10.739632606506348, "global_step": 191070, "epoch": 1137} {"train_loss": -11.230850219726562, "global_step": 191071, "epoch": 1137} {"train_loss": -11.043899536132812, "global_step": 191072, "epoch": 1137} {"train_loss": -11.029032707214355, "global_step": 191073, "epoch": 1137} {"train_loss": -10.898673057556152, "global_step": 191074, "epoch": 1137} {"train_loss": -10.758382797241211, "global_step": 191075, "epoch": 1137} {"train_loss": -10.384008407592773, "global_step": 191076, "epoch": 1137} {"train_loss": -10.449018478393555, "global_step": 191077, "epoch": 1137} {"train_loss": -9.86825180053711, "global_step": 191078, "epoch": 1137} {"train_loss": -11.071052551269531, "global_step": 191079, "epoch": 1137} {"train_loss": -10.36776351928711, "global_step": 191080, "epoch": 1137} {"train_loss": -10.909456253051758, "global_step": 191081, "epoch": 1137} {"train_loss": -10.600530624389648, "global_step": 191082, "epoch": 1137} {"train_loss": -9.805272102355957, "global_step": 191083, "epoch": 1137} {"train_loss": -10.735475540161133, "global_step": 191084, "epoch": 1137} {"train_loss": -10.447884559631348, "global_step": 191085, "epoch": 1137} {"train_loss": -10.755130767822266, "global_step": 191086, "epoch": 1137} {"train_loss": -10.514913558959961, "global_step": 191087, "epoch": 1137} {"train_loss": -10.207450866699219, "global_step": 191088, "epoch": 1137} {"train_loss": -10.334572792053223, "global_step": 191089, "epoch": 1137} {"train_loss": -10.693066596984863, "global_step": 191090, "epoch": 1137} {"train_loss": -10.604284286499023, "global_step": 191091, "epoch": 1137} {"train_loss": -10.781173706054688, "global_step": 191092, "epoch": 1137} {"train_loss": -11.038477897644043, "global_step": 191093, "epoch": 1137} {"train_loss": -10.414021492004395, "global_step": 191094, "epoch": 1137} {"train_loss": -11.039087295532227, "global_step": 191095, "epoch": 1137} {"train_loss": -10.829019546508789, "global_step": 191096, "epoch": 1137} {"train_loss": -10.605073928833008, "global_step": 191097, "epoch": 1137} {"train_loss": -10.946467399597168, "global_step": 191098, "epoch": 1137} {"train_loss": -11.132856369018555, "global_step": 191099, "epoch": 1137} {"train_loss": -10.60551643371582, "global_step": 191100, "epoch": 1137} {"train_loss": -11.292274475097656, "global_step": 191101, "epoch": 1137} {"train_loss": -10.749470710754395, "global_step": 191102, "epoch": 1137} {"train_loss": -11.121280670166016, "global_step": 191103, "epoch": 1137} {"train_loss": -10.691598892211914, "global_step": 191104, "epoch": 1137} {"train_loss": -11.124715805053711, "global_step": 191105, "epoch": 1137} {"train_loss": -10.553262710571289, "global_step": 191106, "epoch": 1137} {"train_loss": -11.100837707519531, "global_step": 191107, "epoch": 1137} {"train_loss": -10.878206253051758, "global_step": 191108, "epoch": 1137} {"train_loss": -11.092641830444336, "global_step": 191109, "epoch": 1137} {"train_loss": -11.26512336730957, "global_step": 191110, "epoch": 1137} {"train_loss": -11.031143188476562, "global_step": 191111, "epoch": 1137} {"train_loss": -11.052858352661133, "global_step": 191112, "epoch": 1137} {"train_loss": -11.148820877075195, "global_step": 191113, "epoch": 1137} {"train_loss": -11.186933517456055, "global_step": 191114, "epoch": 1137} {"train_loss": -11.162334442138672, "global_step": 191115, "epoch": 1137} {"train_loss": -11.195128440856934, "global_step": 191116, "epoch": 1137} {"train_loss": -11.414400100708008, "global_step": 191117, "epoch": 1137} {"train_loss": -11.217476844787598, "global_step": 191118, "epoch": 1137} {"train_loss": -11.071306228637695, "global_step": 191119, "epoch": 1137} {"train_loss": -11.212432861328125, "global_step": 191120, "epoch": 1137} {"train_loss": -11.296224594116211, "global_step": 191121, "epoch": 1137} {"train_loss": -11.332530975341797, "global_step": 191122, "epoch": 1137} {"train_loss": -11.137391090393066, "global_step": 191123, "epoch": 1137} {"train_loss": -11.335770606994629, "global_step": 191124, "epoch": 1137} {"train_loss": -11.199027061462402, "global_step": 191125, "epoch": 1137} {"train_loss": -11.507006645202637, "global_step": 191126, "epoch": 1137} {"train_loss": -11.580440521240234, "global_step": 191127, "epoch": 1137} {"train_loss": -11.65474796295166, "global_step": 191128, "epoch": 1137} {"train_loss": -11.613149642944336, "global_step": 191129, "epoch": 1137} {"train_loss": -11.456116676330566, "global_step": 191130, "epoch": 1137} {"train_loss": -11.569696426391602, "global_step": 191131, "epoch": 1137} {"train_loss": -11.562847137451172, "global_step": 191132, "epoch": 1137} {"train_loss": -11.640179634094238, "global_step": 191133, "epoch": 1137} {"train_loss": -11.537396430969238, "global_step": 191134, "epoch": 1137} {"train_loss": -11.419397354125977, "global_step": 191135, "epoch": 1137} {"train_loss": -11.500798225402832, "global_step": 191136, "epoch": 1137} {"train_loss": -11.347322463989258, "global_step": 191137, "epoch": 1137} {"train_loss": -11.50989055633545, "global_step": 191138, "epoch": 1137} {"train_loss": -11.809615135192871, "global_step": 191139, "epoch": 1137} {"train_loss": -11.436010360717773, "global_step": 191140, "epoch": 1137} {"train_loss": -11.80868148803711, "global_step": 191141, "epoch": 1137} {"train_loss": -11.642518997192383, "global_step": 191142, "epoch": 1137} {"train_loss": -11.620208740234375, "global_step": 191143, "epoch": 1137} {"train_loss": -11.631490707397461, "global_step": 191144, "epoch": 1137} {"train_loss": -11.656320571899414, "global_step": 191145, "epoch": 1137} {"train_loss": -11.437263488769531, "global_step": 191146, "epoch": 1137} {"train_loss": -11.532838821411133, "global_step": 191147, "epoch": 1137} {"train_loss": -11.534259796142578, "global_step": 191148, "epoch": 1137} {"train_loss": -11.475062370300293, "global_step": 191149, "epoch": 1137} {"train_loss": -11.13078498840332, "global_step": 191150, "epoch": 1137} {"train_loss": -11.27489948272705, "global_step": 191151, "epoch": 1137} {"train_loss": -11.653117179870605, "global_step": 191152, "epoch": 1137} {"train_loss": -11.568379402160645, "global_step": 191153, "epoch": 1137} {"train_loss": -11.632229804992676, "global_step": 191154, "epoch": 1137} {"train_loss": -11.579038619995117, "global_step": 191155, "epoch": 1137} {"train_loss": -11.411882400512695, "global_step": 191156, "epoch": 1137} {"train_loss": -11.866476058959961, "global_step": 191157, "epoch": 1137} {"train_loss": -11.617973327636719, "global_step": 191158, "epoch": 1137} {"train_loss": -11.568620681762695, "global_step": 191159, "epoch": 1137} {"train_loss": -11.548933982849121, "global_step": 191160, "epoch": 1137} {"train_loss": -11.680967330932617, "global_step": 191161, "epoch": 1137} {"train_loss": -11.558717727661133, "global_step": 191162, "epoch": 1137} {"train_loss": -11.38915729522705, "global_step": 191163, "epoch": 1137} {"train_loss": -11.551101684570312, "global_step": 191164, "epoch": 1137} {"train_loss": -11.352263450622559, "global_step": 191165, "epoch": 1137} {"train_loss": -11.424886703491211, "global_step": 191166, "epoch": 1137} {"train_loss": -11.595311164855957, "global_step": 191167, "epoch": 1137} {"train_loss": -11.831619262695312, "global_step": 191168, "epoch": 1137} {"train_loss": -10.698663711547852, "global_step": 191169, "epoch": 1137} {"train_loss": -11.424603462219238, "global_step": 191170, "epoch": 1137} {"train_loss": -11.582391738891602, "global_step": 191171, "epoch": 1137} {"train_loss": -11.136850357055664, "global_step": 191172, "epoch": 1137} {"train_loss": -10.464040756225586, "global_step": 191173, "epoch": 1137} {"train_loss": -11.220222473144531, "global_step": 191174, "epoch": 1137} {"train_loss": -10.02580451965332, "global_step": 191175, "epoch": 1137} {"train_loss": -9.326835632324219, "global_step": 191176, "epoch": 1137} {"train_loss": -9.92111587524414, "global_step": 191177, "epoch": 1137} {"train_loss": -11.165931701660156, "global_step": 191178, "epoch": 1137} {"train_loss": -10.198570251464844, "global_step": 191179, "epoch": 1137} {"train_loss": -9.878822326660156, "global_step": 191180, "epoch": 1137} {"train_loss": -10.494132995605469, "global_step": 191181, "epoch": 1137} {"train_loss": -11.045412063598633, "global_step": 191182, "epoch": 1137} {"train_loss": -11.090140876315889, "global_step": 191183, "epoch": 1137, "val_loss": 248092.953125} {"train_loss": -11.251655578613281, "global_step": 191184, "epoch": 1138} {"train_loss": -10.88051986694336, "global_step": 191185, "epoch": 1138} {"train_loss": -11.015331268310547, "global_step": 191186, "epoch": 1138} {"train_loss": -10.84904670715332, "global_step": 191187, "epoch": 1138} {"train_loss": -11.247269630432129, "global_step": 191188, "epoch": 1138} {"train_loss": -10.949793815612793, "global_step": 191189, "epoch": 1138} {"train_loss": -11.153188705444336, "global_step": 191190, "epoch": 1138} {"train_loss": -10.901262283325195, "global_step": 191191, "epoch": 1138} {"train_loss": -10.713111877441406, "global_step": 191192, "epoch": 1138} {"train_loss": -10.948663711547852, "global_step": 191193, "epoch": 1138} {"train_loss": -9.896391868591309, "global_step": 191194, "epoch": 1138} {"train_loss": -11.057217597961426, "global_step": 191195, "epoch": 1138} {"train_loss": -10.744266510009766, "global_step": 191196, "epoch": 1138} {"train_loss": -10.425407409667969, "global_step": 191197, "epoch": 1138} {"train_loss": -10.996465682983398, "global_step": 191198, "epoch": 1138} {"train_loss": -10.868012428283691, "global_step": 191199, "epoch": 1138} {"train_loss": -10.831755638122559, "global_step": 191200, "epoch": 1138} {"train_loss": -11.05392074584961, "global_step": 191201, "epoch": 1138} {"train_loss": -11.200034141540527, "global_step": 191202, "epoch": 1138} {"train_loss": -10.805242538452148, "global_step": 191203, "epoch": 1138} {"train_loss": -10.665508270263672, "global_step": 191204, "epoch": 1138} {"train_loss": -11.013075828552246, "global_step": 191205, "epoch": 1138} {"train_loss": -10.999966621398926, "global_step": 191206, "epoch": 1138} {"train_loss": -11.202518463134766, "global_step": 191207, "epoch": 1138} {"train_loss": -11.21906852722168, "global_step": 191208, "epoch": 1138} {"train_loss": -11.24810791015625, "global_step": 191209, "epoch": 1138} {"train_loss": -11.360557556152344, "global_step": 191210, "epoch": 1138} {"train_loss": -10.756298065185547, "global_step": 191211, "epoch": 1138} {"train_loss": -11.249902725219727, "global_step": 191212, "epoch": 1138} {"train_loss": -10.898008346557617, "global_step": 191213, "epoch": 1138} {"train_loss": -11.068042755126953, "global_step": 191214, "epoch": 1138} {"train_loss": -11.223806381225586, "global_step": 191215, "epoch": 1138} {"train_loss": -11.166498184204102, "global_step": 191216, "epoch": 1138} {"train_loss": -11.36385440826416, "global_step": 191217, "epoch": 1138} {"train_loss": -11.229925155639648, "global_step": 191218, "epoch": 1138} {"train_loss": -11.358634948730469, "global_step": 191219, "epoch": 1138} {"train_loss": -11.252086639404297, "global_step": 191220, "epoch": 1138} {"train_loss": -11.178611755371094, "global_step": 191221, "epoch": 1138} {"train_loss": -11.355183601379395, "global_step": 191222, "epoch": 1138} {"train_loss": -11.426552772521973, "global_step": 191223, "epoch": 1138} {"train_loss": -11.470510482788086, "global_step": 191224, "epoch": 1138} {"train_loss": -11.205201148986816, "global_step": 191225, "epoch": 1138} {"train_loss": -11.511505126953125, "global_step": 191226, "epoch": 1138} {"train_loss": -11.314605712890625, "global_step": 191227, "epoch": 1138} {"train_loss": -11.223588943481445, "global_step": 191228, "epoch": 1138} {"train_loss": -11.449094772338867, "global_step": 191229, "epoch": 1138} {"train_loss": -11.159003257751465, "global_step": 191230, "epoch": 1138} {"train_loss": -11.502495765686035, "global_step": 191231, "epoch": 1138} {"train_loss": -11.21892261505127, "global_step": 191232, "epoch": 1138} {"train_loss": -11.40145206451416, "global_step": 191233, "epoch": 1138} {"train_loss": -11.476040840148926, "global_step": 191234, "epoch": 1138} {"train_loss": -11.269832611083984, "global_step": 191235, "epoch": 1138} {"train_loss": -11.449686050415039, "global_step": 191236, "epoch": 1138} {"train_loss": -11.464499473571777, "global_step": 191237, "epoch": 1138} {"train_loss": -11.217885971069336, "global_step": 191238, "epoch": 1138} {"train_loss": -11.257893562316895, "global_step": 191239, "epoch": 1138} {"train_loss": -10.388519287109375, "global_step": 191240, "epoch": 1138} {"train_loss": -11.220605850219727, "global_step": 191241, "epoch": 1138} {"train_loss": -10.669651985168457, "global_step": 191242, "epoch": 1138} {"train_loss": -10.788850784301758, "global_step": 191243, "epoch": 1138} {"train_loss": -11.339868545532227, "global_step": 191244, "epoch": 1138} {"train_loss": -10.767769813537598, "global_step": 191245, "epoch": 1138} {"train_loss": -11.378124237060547, "global_step": 191246, "epoch": 1138} {"train_loss": -10.429855346679688, "global_step": 191247, "epoch": 1138} {"train_loss": -11.265209197998047, "global_step": 191248, "epoch": 1138} {"train_loss": -11.14802074432373, "global_step": 191249, "epoch": 1138} {"train_loss": -11.221015930175781, "global_step": 191250, "epoch": 1138} {"train_loss": -11.126116752624512, "global_step": 191251, "epoch": 1138} {"train_loss": -11.167489051818848, "global_step": 191252, "epoch": 1138} {"train_loss": -11.196898460388184, "global_step": 191253, "epoch": 1138} {"train_loss": -10.775470733642578, "global_step": 191254, "epoch": 1138} {"train_loss": -10.974516868591309, "global_step": 191255, "epoch": 1138} {"train_loss": -11.058589935302734, "global_step": 191256, "epoch": 1138} {"train_loss": -11.234715461730957, "global_step": 191257, "epoch": 1138} {"train_loss": -11.016794204711914, "global_step": 191258, "epoch": 1138} {"train_loss": -11.24785041809082, "global_step": 191259, "epoch": 1138} {"train_loss": -11.2734375, "global_step": 191260, "epoch": 1138} {"train_loss": -11.272767066955566, "global_step": 191261, "epoch": 1138} {"train_loss": -11.150349617004395, "global_step": 191262, "epoch": 1138} {"train_loss": -11.153830528259277, "global_step": 191263, "epoch": 1138} {"train_loss": -10.956938743591309, "global_step": 191264, "epoch": 1138} {"train_loss": -11.334182739257812, "global_step": 191265, "epoch": 1138} {"train_loss": -10.95447826385498, "global_step": 191266, "epoch": 1138} {"train_loss": -11.190423011779785, "global_step": 191267, "epoch": 1138} {"train_loss": -10.492013931274414, "global_step": 191268, "epoch": 1138} {"train_loss": -10.913846969604492, "global_step": 191269, "epoch": 1138} {"train_loss": -10.622303009033203, "global_step": 191270, "epoch": 1138} {"train_loss": -10.905963897705078, "global_step": 191271, "epoch": 1138} {"train_loss": -10.71267318725586, "global_step": 191272, "epoch": 1138} {"train_loss": -10.595569610595703, "global_step": 191273, "epoch": 1138} {"train_loss": -10.791379928588867, "global_step": 191274, "epoch": 1138} {"train_loss": -10.471490859985352, "global_step": 191275, "epoch": 1138} {"train_loss": -10.788082122802734, "global_step": 191276, "epoch": 1138} {"train_loss": -10.48342514038086, "global_step": 191277, "epoch": 1138} {"train_loss": -10.979408264160156, "global_step": 191278, "epoch": 1138} {"train_loss": -11.01443099975586, "global_step": 191279, "epoch": 1138} {"train_loss": -11.156256675720215, "global_step": 191280, "epoch": 1138} {"train_loss": -10.827339172363281, "global_step": 191281, "epoch": 1138} {"train_loss": -11.153358459472656, "global_step": 191282, "epoch": 1138} {"train_loss": -10.739513397216797, "global_step": 191283, "epoch": 1138} {"train_loss": -11.329240798950195, "global_step": 191284, "epoch": 1138} {"train_loss": -10.971168518066406, "global_step": 191285, "epoch": 1138} {"train_loss": -11.146759033203125, "global_step": 191286, "epoch": 1138} {"train_loss": -11.018571853637695, "global_step": 191287, "epoch": 1138} {"train_loss": -11.10435676574707, "global_step": 191288, "epoch": 1138} {"train_loss": -10.992008209228516, "global_step": 191289, "epoch": 1138} {"train_loss": -11.19312858581543, "global_step": 191290, "epoch": 1138} {"train_loss": -11.030061721801758, "global_step": 191291, "epoch": 1138} {"train_loss": -11.161516189575195, "global_step": 191292, "epoch": 1138} {"train_loss": -11.25155258178711, "global_step": 191293, "epoch": 1138} {"train_loss": -11.421379089355469, "global_step": 191294, "epoch": 1138} {"train_loss": -11.45217514038086, "global_step": 191295, "epoch": 1138} {"train_loss": -11.022176742553711, "global_step": 191296, "epoch": 1138} {"train_loss": -11.51882553100586, "global_step": 191297, "epoch": 1138} {"train_loss": -11.220640182495117, "global_step": 191298, "epoch": 1138} {"train_loss": -11.29006576538086, "global_step": 191299, "epoch": 1138} {"train_loss": -11.29231071472168, "global_step": 191300, "epoch": 1138} {"train_loss": -10.80994701385498, "global_step": 191301, "epoch": 1138} {"train_loss": -11.319318771362305, "global_step": 191302, "epoch": 1138} {"train_loss": -10.670598983764648, "global_step": 191303, "epoch": 1138} {"train_loss": -11.48362922668457, "global_step": 191304, "epoch": 1138} {"train_loss": -10.535364151000977, "global_step": 191305, "epoch": 1138} {"train_loss": -11.316963195800781, "global_step": 191306, "epoch": 1138} {"train_loss": -10.896775245666504, "global_step": 191307, "epoch": 1138} {"train_loss": -11.056983947753906, "global_step": 191308, "epoch": 1138} {"train_loss": -11.394027709960938, "global_step": 191309, "epoch": 1138} {"train_loss": -11.10287857055664, "global_step": 191310, "epoch": 1138} {"train_loss": -11.227432250976562, "global_step": 191311, "epoch": 1138} {"train_loss": -11.346626281738281, "global_step": 191312, "epoch": 1138} {"train_loss": -10.929957389831543, "global_step": 191313, "epoch": 1138} {"train_loss": -11.503864288330078, "global_step": 191314, "epoch": 1138} {"train_loss": -11.186264038085938, "global_step": 191315, "epoch": 1138} {"train_loss": -11.276988983154297, "global_step": 191316, "epoch": 1138} {"train_loss": -11.44387435913086, "global_step": 191317, "epoch": 1138} {"train_loss": -10.974142074584961, "global_step": 191318, "epoch": 1138} {"train_loss": -11.028804779052734, "global_step": 191319, "epoch": 1138} {"train_loss": -11.0394287109375, "global_step": 191320, "epoch": 1138} {"train_loss": -11.207986831665039, "global_step": 191321, "epoch": 1138} {"train_loss": -11.35109806060791, "global_step": 191322, "epoch": 1138} {"train_loss": -10.903338432312012, "global_step": 191323, "epoch": 1138} {"train_loss": -11.201042175292969, "global_step": 191324, "epoch": 1138} {"train_loss": -11.32360553741455, "global_step": 191325, "epoch": 1138} {"train_loss": -11.15224838256836, "global_step": 191326, "epoch": 1138} {"train_loss": -11.015697479248047, "global_step": 191327, "epoch": 1138} {"train_loss": -10.67365837097168, "global_step": 191328, "epoch": 1138} {"train_loss": -11.323355674743652, "global_step": 191329, "epoch": 1138} {"train_loss": -11.10784912109375, "global_step": 191330, "epoch": 1138} {"train_loss": -10.935696601867676, "global_step": 191331, "epoch": 1138} {"train_loss": -11.546928405761719, "global_step": 191332, "epoch": 1138} {"train_loss": -11.172475814819336, "global_step": 191333, "epoch": 1138} {"train_loss": -11.207427978515625, "global_step": 191334, "epoch": 1138} {"train_loss": -11.42111873626709, "global_step": 191335, "epoch": 1138} {"train_loss": -11.423986434936523, "global_step": 191336, "epoch": 1138} {"train_loss": -11.323095321655273, "global_step": 191337, "epoch": 1138} {"train_loss": -11.364362716674805, "global_step": 191338, "epoch": 1138} {"train_loss": -11.134202003479004, "global_step": 191339, "epoch": 1138} {"train_loss": -11.514122009277344, "global_step": 191340, "epoch": 1138} {"train_loss": -11.107551574707031, "global_step": 191341, "epoch": 1138} {"train_loss": -10.956080436706543, "global_step": 191342, "epoch": 1138} {"train_loss": -11.119367599487305, "global_step": 191343, "epoch": 1138} {"train_loss": -11.120745658874512, "global_step": 191344, "epoch": 1138} {"train_loss": -11.302947998046875, "global_step": 191345, "epoch": 1138} {"train_loss": -11.302343368530273, "global_step": 191346, "epoch": 1138} {"train_loss": -11.259111404418945, "global_step": 191347, "epoch": 1138} {"train_loss": -11.447010040283203, "global_step": 191348, "epoch": 1138} {"train_loss": -11.481973648071289, "global_step": 191349, "epoch": 1138} {"train_loss": -11.025120735168457, "global_step": 191350, "epoch": 1138} {"train_loss": -11.10496559597197, "global_step": 191351, "epoch": 1138, "val_loss": 248544.015625} {"train_loss": -11.200096130371094, "global_step": 191352, "epoch": 1139} {"train_loss": -10.735475540161133, "global_step": 191353, "epoch": 1139} {"train_loss": -10.99803352355957, "global_step": 191354, "epoch": 1139} {"train_loss": -10.764598846435547, "global_step": 191355, "epoch": 1139} {"train_loss": -10.822364807128906, "global_step": 191356, "epoch": 1139} {"train_loss": -11.134730339050293, "global_step": 191357, "epoch": 1139} {"train_loss": -11.371126174926758, "global_step": 191358, "epoch": 1139} {"train_loss": -10.845471382141113, "global_step": 191359, "epoch": 1139} {"train_loss": -11.115262985229492, "global_step": 191360, "epoch": 1139} {"train_loss": -11.382498741149902, "global_step": 191361, "epoch": 1139} {"train_loss": -11.038589477539062, "global_step": 191362, "epoch": 1139} {"train_loss": -11.372918128967285, "global_step": 191363, "epoch": 1139} {"train_loss": -11.427643775939941, "global_step": 191364, "epoch": 1139} {"train_loss": -11.542057991027832, "global_step": 191365, "epoch": 1139} {"train_loss": -11.408897399902344, "global_step": 191366, "epoch": 1139} {"train_loss": -11.497366905212402, "global_step": 191367, "epoch": 1139} {"train_loss": -11.235755920410156, "global_step": 191368, "epoch": 1139} {"train_loss": -11.359591484069824, "global_step": 191369, "epoch": 1139} {"train_loss": -11.128937721252441, "global_step": 191370, "epoch": 1139} {"train_loss": -11.38818645477295, "global_step": 191371, "epoch": 1139} {"train_loss": -11.255714416503906, "global_step": 191372, "epoch": 1139} {"train_loss": -11.239849090576172, "global_step": 191373, "epoch": 1139} {"train_loss": -11.157584190368652, "global_step": 191374, "epoch": 1139} {"train_loss": -11.264742851257324, "global_step": 191375, "epoch": 1139} {"train_loss": -11.22884750366211, "global_step": 191376, "epoch": 1139} {"train_loss": -11.061614036560059, "global_step": 191377, "epoch": 1139} {"train_loss": -11.156984329223633, "global_step": 191378, "epoch": 1139} {"train_loss": -11.393104553222656, "global_step": 191379, "epoch": 1139} {"train_loss": -11.474509239196777, "global_step": 191380, "epoch": 1139} {"train_loss": -11.099828720092773, "global_step": 191381, "epoch": 1139} {"train_loss": -11.253799438476562, "global_step": 191382, "epoch": 1139} {"train_loss": -11.493812561035156, "global_step": 191383, "epoch": 1139} {"train_loss": -11.498559951782227, "global_step": 191384, "epoch": 1139} {"train_loss": -11.590754508972168, "global_step": 191385, "epoch": 1139} {"train_loss": -11.578749656677246, "global_step": 191386, "epoch": 1139} {"train_loss": -11.41871166229248, "global_step": 191387, "epoch": 1139} {"train_loss": -11.191524505615234, "global_step": 191388, "epoch": 1139} {"train_loss": -11.19192886352539, "global_step": 191389, "epoch": 1139} {"train_loss": -11.461751937866211, "global_step": 191390, "epoch": 1139} {"train_loss": -11.490463256835938, "global_step": 191391, "epoch": 1139} {"train_loss": -11.499435424804688, "global_step": 191392, "epoch": 1139} {"train_loss": -11.411558151245117, "global_step": 191393, "epoch": 1139} {"train_loss": -11.519567489624023, "global_step": 191394, "epoch": 1139} {"train_loss": -11.458927154541016, "global_step": 191395, "epoch": 1139} {"train_loss": -11.691390991210938, "global_step": 191396, "epoch": 1139} {"train_loss": -11.560632705688477, "global_step": 191397, "epoch": 1139} {"train_loss": -11.445022583007812, "global_step": 191398, "epoch": 1139} {"train_loss": -11.224102020263672, "global_step": 191399, "epoch": 1139} {"train_loss": -11.19584846496582, "global_step": 191400, "epoch": 1139} {"train_loss": -10.97547435760498, "global_step": 191401, "epoch": 1139} {"train_loss": -11.374781608581543, "global_step": 191402, "epoch": 1139} {"train_loss": -11.130237579345703, "global_step": 191403, "epoch": 1139} {"train_loss": -11.0166597366333, "global_step": 191404, "epoch": 1139} {"train_loss": -10.561668395996094, "global_step": 191405, "epoch": 1139} {"train_loss": -11.454237937927246, "global_step": 191406, "epoch": 1139} {"train_loss": -10.624979019165039, "global_step": 191407, "epoch": 1139} {"train_loss": -10.517376899719238, "global_step": 191408, "epoch": 1139} {"train_loss": -10.957172393798828, "global_step": 191409, "epoch": 1139} {"train_loss": -11.344854354858398, "global_step": 191410, "epoch": 1139} {"train_loss": -11.310608863830566, "global_step": 191411, "epoch": 1139} {"train_loss": -11.450540542602539, "global_step": 191412, "epoch": 1139} {"train_loss": -11.235337257385254, "global_step": 191413, "epoch": 1139} {"train_loss": -10.83458137512207, "global_step": 191414, "epoch": 1139} {"train_loss": -11.308055877685547, "global_step": 191415, "epoch": 1139} {"train_loss": -11.139437675476074, "global_step": 191416, "epoch": 1139} {"train_loss": -11.578248977661133, "global_step": 191417, "epoch": 1139} {"train_loss": -11.585437774658203, "global_step": 191418, "epoch": 1139} {"train_loss": -10.952457427978516, "global_step": 191419, "epoch": 1139} {"train_loss": -10.963861465454102, "global_step": 191420, "epoch": 1139} {"train_loss": -11.43665885925293, "global_step": 191421, "epoch": 1139} {"train_loss": -11.266881942749023, "global_step": 191422, "epoch": 1139} {"train_loss": -10.918630599975586, "global_step": 191423, "epoch": 1139} {"train_loss": -11.449979782104492, "global_step": 191424, "epoch": 1139} {"train_loss": -11.479775428771973, "global_step": 191425, "epoch": 1139} {"train_loss": -11.283834457397461, "global_step": 191426, "epoch": 1139} {"train_loss": -11.114248275756836, "global_step": 191427, "epoch": 1139} {"train_loss": -11.423216819763184, "global_step": 191428, "epoch": 1139} {"train_loss": -11.165170669555664, "global_step": 191429, "epoch": 1139} {"train_loss": -10.860347747802734, "global_step": 191430, "epoch": 1139} {"train_loss": -11.41513442993164, "global_step": 191431, "epoch": 1139} {"train_loss": -10.919029235839844, "global_step": 191432, "epoch": 1139} {"train_loss": -11.126781463623047, "global_step": 191433, "epoch": 1139} {"train_loss": -11.312298774719238, "global_step": 191434, "epoch": 1139} {"train_loss": -9.779955863952637, "global_step": 191435, "epoch": 1139} {"train_loss": -11.273469924926758, "global_step": 191436, "epoch": 1139} {"train_loss": -10.401945114135742, "global_step": 191437, "epoch": 1139} {"train_loss": -10.177206039428711, "global_step": 191438, "epoch": 1139} {"train_loss": -10.810083389282227, "global_step": 191439, "epoch": 1139} {"train_loss": -10.340265274047852, "global_step": 191440, "epoch": 1139} {"train_loss": -11.189322471618652, "global_step": 191441, "epoch": 1139} {"train_loss": -10.178202629089355, "global_step": 191442, "epoch": 1139} {"train_loss": -11.137953758239746, "global_step": 191443, "epoch": 1139} {"train_loss": -10.703896522521973, "global_step": 191444, "epoch": 1139} {"train_loss": -11.22342300415039, "global_step": 191445, "epoch": 1139} {"train_loss": -11.062994003295898, "global_step": 191446, "epoch": 1139} {"train_loss": -10.978288650512695, "global_step": 191447, "epoch": 1139} {"train_loss": -11.247915267944336, "global_step": 191448, "epoch": 1139} {"train_loss": -10.979629516601562, "global_step": 191449, "epoch": 1139} {"train_loss": -11.119135856628418, "global_step": 191450, "epoch": 1139} {"train_loss": -11.10700798034668, "global_step": 191451, "epoch": 1139} {"train_loss": -11.314353942871094, "global_step": 191452, "epoch": 1139} {"train_loss": -11.162442207336426, "global_step": 191453, "epoch": 1139} {"train_loss": -11.210184097290039, "global_step": 191454, "epoch": 1139} {"train_loss": -11.42830753326416, "global_step": 191455, "epoch": 1139} {"train_loss": -10.920997619628906, "global_step": 191456, "epoch": 1139} {"train_loss": -11.443572044372559, "global_step": 191457, "epoch": 1139} {"train_loss": -10.875630378723145, "global_step": 191458, "epoch": 1139} {"train_loss": -11.34469985961914, "global_step": 191459, "epoch": 1139} {"train_loss": -11.014474868774414, "global_step": 191460, "epoch": 1139} {"train_loss": -10.958039283752441, "global_step": 191461, "epoch": 1139} {"train_loss": -11.356757164001465, "global_step": 191462, "epoch": 1139} {"train_loss": -10.862853050231934, "global_step": 191463, "epoch": 1139} {"train_loss": -11.255599975585938, "global_step": 191464, "epoch": 1139} {"train_loss": -11.04322624206543, "global_step": 191465, "epoch": 1139} {"train_loss": -11.377870559692383, "global_step": 191466, "epoch": 1139} {"train_loss": -10.827611923217773, "global_step": 191467, "epoch": 1139} {"train_loss": -11.16087818145752, "global_step": 191468, "epoch": 1139} {"train_loss": -11.022516250610352, "global_step": 191469, "epoch": 1139} {"train_loss": -11.015226364135742, "global_step": 191470, "epoch": 1139} {"train_loss": -11.370542526245117, "global_step": 191471, "epoch": 1139} {"train_loss": -11.36673355102539, "global_step": 191472, "epoch": 1139} {"train_loss": -11.436126708984375, "global_step": 191473, "epoch": 1139} {"train_loss": -11.566181182861328, "global_step": 191474, "epoch": 1139} {"train_loss": -11.46141529083252, "global_step": 191475, "epoch": 1139} {"train_loss": -11.193435668945312, "global_step": 191476, "epoch": 1139} {"train_loss": -11.610978126525879, "global_step": 191477, "epoch": 1139} {"train_loss": -11.300304412841797, "global_step": 191478, "epoch": 1139} {"train_loss": -11.528764724731445, "global_step": 191479, "epoch": 1139} {"train_loss": -11.417455673217773, "global_step": 191480, "epoch": 1139} {"train_loss": -11.29304313659668, "global_step": 191481, "epoch": 1139} {"train_loss": -11.54721450805664, "global_step": 191482, "epoch": 1139} {"train_loss": -11.339988708496094, "global_step": 191483, "epoch": 1139} {"train_loss": -11.661941528320312, "global_step": 191484, "epoch": 1139} {"train_loss": -11.010187149047852, "global_step": 191485, "epoch": 1139} {"train_loss": -11.227371215820312, "global_step": 191486, "epoch": 1139} {"train_loss": -11.184114456176758, "global_step": 191487, "epoch": 1139} {"train_loss": -11.470537185668945, "global_step": 191488, "epoch": 1139} {"train_loss": -11.243036270141602, "global_step": 191489, "epoch": 1139} {"train_loss": -11.426609992980957, "global_step": 191490, "epoch": 1139} {"train_loss": -11.621743202209473, "global_step": 191491, "epoch": 1139} {"train_loss": -11.442602157592773, "global_step": 191492, "epoch": 1139} {"train_loss": -11.536188125610352, "global_step": 191493, "epoch": 1139} {"train_loss": -11.344950675964355, "global_step": 191494, "epoch": 1139} {"train_loss": -11.386821746826172, "global_step": 191495, "epoch": 1139} {"train_loss": -11.3027982711792, "global_step": 191496, "epoch": 1139} {"train_loss": -11.784377098083496, "global_step": 191497, "epoch": 1139} {"train_loss": -11.376996994018555, "global_step": 191498, "epoch": 1139} {"train_loss": -11.54002571105957, "global_step": 191499, "epoch": 1139} {"train_loss": -11.56888484954834, "global_step": 191500, "epoch": 1139} {"train_loss": -11.553410530090332, "global_step": 191501, "epoch": 1139} {"train_loss": -11.440614700317383, "global_step": 191502, "epoch": 1139} {"train_loss": -11.350016593933105, "global_step": 191503, "epoch": 1139} {"train_loss": -11.486024856567383, "global_step": 191504, "epoch": 1139} {"train_loss": -11.22171401977539, "global_step": 191505, "epoch": 1139} {"train_loss": -11.046828269958496, "global_step": 191506, "epoch": 1139} {"train_loss": -11.465520858764648, "global_step": 191507, "epoch": 1139} {"train_loss": -11.43244743347168, "global_step": 191508, "epoch": 1139} {"train_loss": -11.180131912231445, "global_step": 191509, "epoch": 1139} {"train_loss": -11.288410186767578, "global_step": 191510, "epoch": 1139} {"train_loss": -11.243574142456055, "global_step": 191511, "epoch": 1139} {"train_loss": -11.068947792053223, "global_step": 191512, "epoch": 1139} {"train_loss": -10.801024436950684, "global_step": 191513, "epoch": 1139} {"train_loss": -11.289897918701172, "global_step": 191514, "epoch": 1139} {"train_loss": -10.122625350952148, "global_step": 191515, "epoch": 1139} {"train_loss": -10.213098526000977, "global_step": 191516, "epoch": 1139} {"train_loss": -11.234960556030273, "global_step": 191517, "epoch": 1139} {"train_loss": -9.915021896362305, "global_step": 191518, "epoch": 1139} {"train_loss": -11.197342651230949, "global_step": 191519, "epoch": 1139, "val_loss": 246874.609375} {"train_loss": -11.062771797180176, "global_step": 191520, "epoch": 1140} {"train_loss": -9.87706184387207, "global_step": 191521, "epoch": 1140} {"train_loss": -11.103559494018555, "global_step": 191522, "epoch": 1140} {"train_loss": -9.877025604248047, "global_step": 191523, "epoch": 1140} {"train_loss": -10.084221839904785, "global_step": 191524, "epoch": 1140} {"train_loss": -10.582695007324219, "global_step": 191525, "epoch": 1140} {"train_loss": -9.532861709594727, "global_step": 191526, "epoch": 1140} {"train_loss": -10.034680366516113, "global_step": 191527, "epoch": 1140} {"train_loss": -8.667991638183594, "global_step": 191528, "epoch": 1140} {"train_loss": -8.685632705688477, "global_step": 191529, "epoch": 1140} {"train_loss": -9.943412780761719, "global_step": 191530, "epoch": 1140} {"train_loss": -10.178077697753906, "global_step": 191531, "epoch": 1140} {"train_loss": -8.99608325958252, "global_step": 191532, "epoch": 1140} {"train_loss": -9.092763900756836, "global_step": 191533, "epoch": 1140} {"train_loss": -9.851476669311523, "global_step": 191534, "epoch": 1140} {"train_loss": -10.147146224975586, "global_step": 191535, "epoch": 1140} {"train_loss": -9.432011604309082, "global_step": 191536, "epoch": 1140} {"train_loss": -10.438525199890137, "global_step": 191537, "epoch": 1140} {"train_loss": -10.162982940673828, "global_step": 191538, "epoch": 1140} {"train_loss": -9.796998977661133, "global_step": 191539, "epoch": 1140} {"train_loss": -10.306062698364258, "global_step": 191540, "epoch": 1140} {"train_loss": -10.029853820800781, "global_step": 191541, "epoch": 1140} {"train_loss": -10.451881408691406, "global_step": 191542, "epoch": 1140} {"train_loss": -10.467161178588867, "global_step": 191543, "epoch": 1140} {"train_loss": -10.644567489624023, "global_step": 191544, "epoch": 1140} {"train_loss": -10.328313827514648, "global_step": 191545, "epoch": 1140} {"train_loss": -10.46800422668457, "global_step": 191546, "epoch": 1140} {"train_loss": -10.45229721069336, "global_step": 191547, "epoch": 1140} {"train_loss": -10.588211059570312, "global_step": 191548, "epoch": 1140} {"train_loss": -10.466630935668945, "global_step": 191549, "epoch": 1140} {"train_loss": -11.010974884033203, "global_step": 191550, "epoch": 1140} {"train_loss": -10.527246475219727, "global_step": 191551, "epoch": 1140} {"train_loss": -11.088966369628906, "global_step": 191552, "epoch": 1140} {"train_loss": -10.889077186584473, "global_step": 191553, "epoch": 1140} {"train_loss": -10.926547050476074, "global_step": 191554, "epoch": 1140} {"train_loss": -10.929195404052734, "global_step": 191555, "epoch": 1140} {"train_loss": -11.181852340698242, "global_step": 191556, "epoch": 1140} {"train_loss": -10.635200500488281, "global_step": 191557, "epoch": 1140} {"train_loss": -11.10546875, "global_step": 191558, "epoch": 1140} {"train_loss": -10.923205375671387, "global_step": 191559, "epoch": 1140} {"train_loss": -10.789413452148438, "global_step": 191560, "epoch": 1140} {"train_loss": -11.124916076660156, "global_step": 191561, "epoch": 1140} {"train_loss": -10.814994812011719, "global_step": 191562, "epoch": 1140} {"train_loss": -11.148018836975098, "global_step": 191563, "epoch": 1140} {"train_loss": -11.099381446838379, "global_step": 191564, "epoch": 1140} {"train_loss": -11.109455108642578, "global_step": 191565, "epoch": 1140} {"train_loss": -11.120603561401367, "global_step": 191566, "epoch": 1140} {"train_loss": -10.980791091918945, "global_step": 191567, "epoch": 1140} {"train_loss": -11.234355926513672, "global_step": 191568, "epoch": 1140} {"train_loss": -11.062873840332031, "global_step": 191569, "epoch": 1140} {"train_loss": -11.134964942932129, "global_step": 191570, "epoch": 1140} {"train_loss": -11.320852279663086, "global_step": 191571, "epoch": 1140} {"train_loss": -11.016986846923828, "global_step": 191572, "epoch": 1140} {"train_loss": -11.332521438598633, "global_step": 191573, "epoch": 1140} {"train_loss": -11.465471267700195, "global_step": 191574, "epoch": 1140} {"train_loss": -11.283711433410645, "global_step": 191575, "epoch": 1140} {"train_loss": -11.299181938171387, "global_step": 191576, "epoch": 1140} {"train_loss": -11.318713188171387, "global_step": 191577, "epoch": 1140} {"train_loss": -11.375965118408203, "global_step": 191578, "epoch": 1140} {"train_loss": -11.292377471923828, "global_step": 191579, "epoch": 1140} {"train_loss": -11.393614768981934, "global_step": 191580, "epoch": 1140} {"train_loss": -11.157787322998047, "global_step": 191581, "epoch": 1140} {"train_loss": -11.416618347167969, "global_step": 191582, "epoch": 1140} {"train_loss": -11.36184310913086, "global_step": 191583, "epoch": 1140} {"train_loss": -11.364904403686523, "global_step": 191584, "epoch": 1140} {"train_loss": -11.403192520141602, "global_step": 191585, "epoch": 1140} {"train_loss": -11.3609619140625, "global_step": 191586, "epoch": 1140} {"train_loss": -11.446393013000488, "global_step": 191587, "epoch": 1140} {"train_loss": -11.429788589477539, "global_step": 191588, "epoch": 1140} {"train_loss": -11.62480640411377, "global_step": 191589, "epoch": 1140} {"train_loss": -11.522653579711914, "global_step": 191590, "epoch": 1140} {"train_loss": -11.519868850708008, "global_step": 191591, "epoch": 1140} {"train_loss": -11.44097900390625, "global_step": 191592, "epoch": 1140} {"train_loss": -11.535215377807617, "global_step": 191593, "epoch": 1140} {"train_loss": -11.565813064575195, "global_step": 191594, "epoch": 1140} {"train_loss": -11.42431926727295, "global_step": 191595, "epoch": 1140} {"train_loss": -11.43842887878418, "global_step": 191596, "epoch": 1140} {"train_loss": -11.488393783569336, "global_step": 191597, "epoch": 1140} {"train_loss": -11.488238334655762, "global_step": 191598, "epoch": 1140} {"train_loss": -11.697940826416016, "global_step": 191599, "epoch": 1140} {"train_loss": -11.70761489868164, "global_step": 191600, "epoch": 1140} {"train_loss": -11.669942855834961, "global_step": 191601, "epoch": 1140} {"train_loss": -11.601573944091797, "global_step": 191602, "epoch": 1140} {"train_loss": -11.506650924682617, "global_step": 191603, "epoch": 1140} {"train_loss": -11.851882934570312, "global_step": 191604, "epoch": 1140} {"train_loss": -11.531488418579102, "global_step": 191605, "epoch": 1140} {"train_loss": -11.673553466796875, "global_step": 191606, "epoch": 1140} {"train_loss": -11.366511344909668, "global_step": 191607, "epoch": 1140} {"train_loss": -11.757999420166016, "global_step": 191608, "epoch": 1140} {"train_loss": -11.4825439453125, "global_step": 191609, "epoch": 1140} {"train_loss": -11.55996322631836, "global_step": 191610, "epoch": 1140} {"train_loss": -11.706032752990723, "global_step": 191611, "epoch": 1140} {"train_loss": -11.462510108947754, "global_step": 191612, "epoch": 1140} {"train_loss": -11.390421867370605, "global_step": 191613, "epoch": 1140} {"train_loss": -11.534587860107422, "global_step": 191614, "epoch": 1140} {"train_loss": -11.872310638427734, "global_step": 191615, "epoch": 1140} {"train_loss": -11.530183792114258, "global_step": 191616, "epoch": 1140} {"train_loss": -11.337166786193848, "global_step": 191617, "epoch": 1140} {"train_loss": -11.747310638427734, "global_step": 191618, "epoch": 1140} {"train_loss": -11.62994384765625, "global_step": 191619, "epoch": 1140} {"train_loss": -11.120177268981934, "global_step": 191620, "epoch": 1140} {"train_loss": -10.988666534423828, "global_step": 191621, "epoch": 1140} {"train_loss": -11.539920806884766, "global_step": 191622, "epoch": 1140} {"train_loss": -11.421156883239746, "global_step": 191623, "epoch": 1140} {"train_loss": -11.004119873046875, "global_step": 191624, "epoch": 1140} {"train_loss": -11.305758476257324, "global_step": 191625, "epoch": 1140} {"train_loss": -11.385530471801758, "global_step": 191626, "epoch": 1140} {"train_loss": -10.729787826538086, "global_step": 191627, "epoch": 1140} {"train_loss": -9.189338684082031, "global_step": 191628, "epoch": 1140} {"train_loss": -9.64480972290039, "global_step": 191629, "epoch": 1140} {"train_loss": -11.059797286987305, "global_step": 191630, "epoch": 1140} {"train_loss": -9.504670143127441, "global_step": 191631, "epoch": 1140} {"train_loss": -10.174212455749512, "global_step": 191632, "epoch": 1140} {"train_loss": -10.54753589630127, "global_step": 191633, "epoch": 1140} {"train_loss": -10.090041160583496, "global_step": 191634, "epoch": 1140} {"train_loss": -10.761789321899414, "global_step": 191635, "epoch": 1140} {"train_loss": -11.07801342010498, "global_step": 191636, "epoch": 1140} {"train_loss": -11.261916160583496, "global_step": 191637, "epoch": 1140} {"train_loss": -11.497712135314941, "global_step": 191638, "epoch": 1140} {"train_loss": -10.682329177856445, "global_step": 191639, "epoch": 1140} {"train_loss": -10.9412202835083, "global_step": 191640, "epoch": 1140} {"train_loss": -10.460077285766602, "global_step": 191641, "epoch": 1140} {"train_loss": -11.051746368408203, "global_step": 191642, "epoch": 1140} {"train_loss": -10.390276908874512, "global_step": 191643, "epoch": 1140} {"train_loss": -9.976097106933594, "global_step": 191644, "epoch": 1140} {"train_loss": -10.678030014038086, "global_step": 191645, "epoch": 1140} {"train_loss": -9.798079490661621, "global_step": 191646, "epoch": 1140} {"train_loss": -10.799098014831543, "global_step": 191647, "epoch": 1140} {"train_loss": -10.274618148803711, "global_step": 191648, "epoch": 1140} {"train_loss": -11.065279006958008, "global_step": 191649, "epoch": 1140} {"train_loss": -9.960429191589355, "global_step": 191650, "epoch": 1140} {"train_loss": -10.980894088745117, "global_step": 191651, "epoch": 1140} {"train_loss": -10.665094375610352, "global_step": 191652, "epoch": 1140} {"train_loss": -11.045103073120117, "global_step": 191653, "epoch": 1140} {"train_loss": -11.044553756713867, "global_step": 191654, "epoch": 1140} {"train_loss": -11.005533218383789, "global_step": 191655, "epoch": 1140} {"train_loss": -11.175312042236328, "global_step": 191656, "epoch": 1140} {"train_loss": -10.84253215789795, "global_step": 191657, "epoch": 1140} {"train_loss": -11.1140775680542, "global_step": 191658, "epoch": 1140} {"train_loss": -10.841888427734375, "global_step": 191659, "epoch": 1140} {"train_loss": -10.851543426513672, "global_step": 191660, "epoch": 1140} {"train_loss": -11.37878704071045, "global_step": 191661, "epoch": 1140} {"train_loss": -10.520173072814941, "global_step": 191662, "epoch": 1140} {"train_loss": -11.253449440002441, "global_step": 191663, "epoch": 1140} {"train_loss": -10.991918563842773, "global_step": 191664, "epoch": 1140} {"train_loss": -10.693879127502441, "global_step": 191665, "epoch": 1140} {"train_loss": -10.953123092651367, "global_step": 191666, "epoch": 1140} {"train_loss": -10.979490280151367, "global_step": 191667, "epoch": 1140} {"train_loss": -10.678743362426758, "global_step": 191668, "epoch": 1140} {"train_loss": -10.654258728027344, "global_step": 191669, "epoch": 1140} {"train_loss": -10.885255813598633, "global_step": 191670, "epoch": 1140} {"train_loss": -10.548524856567383, "global_step": 191671, "epoch": 1140} {"train_loss": -11.346091270446777, "global_step": 191672, "epoch": 1140} {"train_loss": -10.45318603515625, "global_step": 191673, "epoch": 1140} {"train_loss": -11.226204872131348, "global_step": 191674, "epoch": 1140} {"train_loss": -11.12695598602295, "global_step": 191675, "epoch": 1140} {"train_loss": -10.885963439941406, "global_step": 191676, "epoch": 1140} {"train_loss": -10.978925704956055, "global_step": 191677, "epoch": 1140} {"train_loss": -11.136985778808594, "global_step": 191678, "epoch": 1140} {"train_loss": -11.049190521240234, "global_step": 191679, "epoch": 1140} {"train_loss": -11.204340934753418, "global_step": 191680, "epoch": 1140} {"train_loss": -11.318540573120117, "global_step": 191681, "epoch": 1140} {"train_loss": -11.048043251037598, "global_step": 191682, "epoch": 1140} {"train_loss": -10.91196060180664, "global_step": 191683, "epoch": 1140} {"train_loss": -11.345015525817871, "global_step": 191684, "epoch": 1140} {"train_loss": -11.312899589538574, "global_step": 191685, "epoch": 1140} {"train_loss": -11.199518203735352, "global_step": 191686, "epoch": 1140} {"train_loss": -10.90810675848098, "global_step": 191687, "epoch": 1140, "val_loss": 242661.765625, "train_action_mse_error": 0.22100725769996643} {"train_loss": -11.428486824035645, "global_step": 191688, "epoch": 1141} {"train_loss": -11.10828685760498, "global_step": 191689, "epoch": 1141} {"train_loss": -11.470905303955078, "global_step": 191690, "epoch": 1141} {"train_loss": -10.95698070526123, "global_step": 191691, "epoch": 1141} {"train_loss": -11.178155899047852, "global_step": 191692, "epoch": 1141} {"train_loss": -11.051101684570312, "global_step": 191693, "epoch": 1141} {"train_loss": -11.436840057373047, "global_step": 191694, "epoch": 1141} {"train_loss": -11.315200805664062, "global_step": 191695, "epoch": 1141} {"train_loss": -11.384267807006836, "global_step": 191696, "epoch": 1141} {"train_loss": -11.52027702331543, "global_step": 191697, "epoch": 1141} {"train_loss": -11.159112930297852, "global_step": 191698, "epoch": 1141} {"train_loss": -11.526318550109863, "global_step": 191699, "epoch": 1141} {"train_loss": -11.466634750366211, "global_step": 191700, "epoch": 1141} {"train_loss": -11.474632263183594, "global_step": 191701, "epoch": 1141} {"train_loss": -11.463037490844727, "global_step": 191702, "epoch": 1141} {"train_loss": -11.327576637268066, "global_step": 191703, "epoch": 1141} {"train_loss": -11.39228343963623, "global_step": 191704, "epoch": 1141} {"train_loss": -11.569610595703125, "global_step": 191705, "epoch": 1141} {"train_loss": -11.761923789978027, "global_step": 191706, "epoch": 1141} {"train_loss": -11.541906356811523, "global_step": 191707, "epoch": 1141} {"train_loss": -11.554742813110352, "global_step": 191708, "epoch": 1141} {"train_loss": -11.47904109954834, "global_step": 191709, "epoch": 1141} {"train_loss": -11.606825828552246, "global_step": 191710, "epoch": 1141} {"train_loss": -11.390543937683105, "global_step": 191711, "epoch": 1141} {"train_loss": -11.596662521362305, "global_step": 191712, "epoch": 1141} {"train_loss": -11.60866641998291, "global_step": 191713, "epoch": 1141} {"train_loss": -11.540840148925781, "global_step": 191714, "epoch": 1141} {"train_loss": -11.656383514404297, "global_step": 191715, "epoch": 1141} {"train_loss": -11.461769104003906, "global_step": 191716, "epoch": 1141} {"train_loss": -11.174673080444336, "global_step": 191717, "epoch": 1141} {"train_loss": -11.448307037353516, "global_step": 191718, "epoch": 1141} {"train_loss": -11.653417587280273, "global_step": 191719, "epoch": 1141} {"train_loss": -11.527992248535156, "global_step": 191720, "epoch": 1141} {"train_loss": -11.647245407104492, "global_step": 191721, "epoch": 1141} {"train_loss": -11.689834594726562, "global_step": 191722, "epoch": 1141} {"train_loss": -11.738216400146484, "global_step": 191723, "epoch": 1141} {"train_loss": -11.654878616333008, "global_step": 191724, "epoch": 1141} {"train_loss": -11.558351516723633, "global_step": 191725, "epoch": 1141} {"train_loss": -11.652381896972656, "global_step": 191726, "epoch": 1141} {"train_loss": -11.772590637207031, "global_step": 191727, "epoch": 1141} {"train_loss": -11.647216796875, "global_step": 191728, "epoch": 1141} {"train_loss": -11.421460151672363, "global_step": 191729, "epoch": 1141} {"train_loss": -11.622339248657227, "global_step": 191730, "epoch": 1141} {"train_loss": -11.366147994995117, "global_step": 191731, "epoch": 1141} {"train_loss": -11.594725608825684, "global_step": 191732, "epoch": 1141} {"train_loss": -11.263633728027344, "global_step": 191733, "epoch": 1141} {"train_loss": -10.948919296264648, "global_step": 191734, "epoch": 1141} {"train_loss": -11.415050506591797, "global_step": 191735, "epoch": 1141} {"train_loss": -11.297699928283691, "global_step": 191736, "epoch": 1141} {"train_loss": -10.98825454711914, "global_step": 191737, "epoch": 1141} {"train_loss": -11.585403442382812, "global_step": 191738, "epoch": 1141} {"train_loss": -10.803885459899902, "global_step": 191739, "epoch": 1141} {"train_loss": -10.928050994873047, "global_step": 191740, "epoch": 1141} {"train_loss": -11.310033798217773, "global_step": 191741, "epoch": 1141} {"train_loss": -10.767253875732422, "global_step": 191742, "epoch": 1141} {"train_loss": -11.113579750061035, "global_step": 191743, "epoch": 1141} {"train_loss": -11.016202926635742, "global_step": 191744, "epoch": 1141} {"train_loss": -10.249950408935547, "global_step": 191745, "epoch": 1141} {"train_loss": -11.004167556762695, "global_step": 191746, "epoch": 1141} {"train_loss": -10.92552375793457, "global_step": 191747, "epoch": 1141} {"train_loss": -10.293532371520996, "global_step": 191748, "epoch": 1141} {"train_loss": -11.465084075927734, "global_step": 191749, "epoch": 1141} {"train_loss": -10.81007194519043, "global_step": 191750, "epoch": 1141} {"train_loss": -9.826898574829102, "global_step": 191751, "epoch": 1141} {"train_loss": -10.775283813476562, "global_step": 191752, "epoch": 1141} {"train_loss": -10.91340446472168, "global_step": 191753, "epoch": 1141} {"train_loss": -10.627599716186523, "global_step": 191754, "epoch": 1141} {"train_loss": -10.360342979431152, "global_step": 191755, "epoch": 1141} {"train_loss": -11.021263122558594, "global_step": 191756, "epoch": 1141} {"train_loss": -10.857215881347656, "global_step": 191757, "epoch": 1141} {"train_loss": -9.49113655090332, "global_step": 191758, "epoch": 1141} {"train_loss": -11.201116561889648, "global_step": 191759, "epoch": 1141} {"train_loss": -10.129722595214844, "global_step": 191760, "epoch": 1141} {"train_loss": -10.577775955200195, "global_step": 191761, "epoch": 1141} {"train_loss": -10.461483001708984, "global_step": 191762, "epoch": 1141} {"train_loss": -10.856316566467285, "global_step": 191763, "epoch": 1141} {"train_loss": -10.81300163269043, "global_step": 191764, "epoch": 1141} {"train_loss": -10.694703102111816, "global_step": 191765, "epoch": 1141} {"train_loss": -11.076711654663086, "global_step": 191766, "epoch": 1141} {"train_loss": -11.067108154296875, "global_step": 191767, "epoch": 1141} {"train_loss": -11.208213806152344, "global_step": 191768, "epoch": 1141} {"train_loss": -11.01612663269043, "global_step": 191769, "epoch": 1141} {"train_loss": -11.195211410522461, "global_step": 191770, "epoch": 1141} {"train_loss": -10.868727684020996, "global_step": 191771, "epoch": 1141} {"train_loss": -11.055577278137207, "global_step": 191772, "epoch": 1141} {"train_loss": -10.907186508178711, "global_step": 191773, "epoch": 1141} {"train_loss": -11.26382064819336, "global_step": 191774, "epoch": 1141} {"train_loss": -11.190536499023438, "global_step": 191775, "epoch": 1141} {"train_loss": -11.100366592407227, "global_step": 191776, "epoch": 1141} {"train_loss": -11.24893856048584, "global_step": 191777, "epoch": 1141} {"train_loss": -10.691011428833008, "global_step": 191778, "epoch": 1141} {"train_loss": -11.181137084960938, "global_step": 191779, "epoch": 1141} {"train_loss": -11.036026000976562, "global_step": 191780, "epoch": 1141} {"train_loss": -11.207765579223633, "global_step": 191781, "epoch": 1141} {"train_loss": -11.265190124511719, "global_step": 191782, "epoch": 1141} {"train_loss": -11.006669998168945, "global_step": 191783, "epoch": 1141} {"train_loss": -11.353082656860352, "global_step": 191784, "epoch": 1141} {"train_loss": -11.24179458618164, "global_step": 191785, "epoch": 1141} {"train_loss": -11.389076232910156, "global_step": 191786, "epoch": 1141} {"train_loss": -11.183441162109375, "global_step": 191787, "epoch": 1141} {"train_loss": -11.372325897216797, "global_step": 191788, "epoch": 1141} {"train_loss": -10.994451522827148, "global_step": 191789, "epoch": 1141} {"train_loss": -11.437459945678711, "global_step": 191790, "epoch": 1141} {"train_loss": -11.261009216308594, "global_step": 191791, "epoch": 1141} {"train_loss": -11.344930648803711, "global_step": 191792, "epoch": 1141} {"train_loss": -11.562461853027344, "global_step": 191793, "epoch": 1141} {"train_loss": -11.448503494262695, "global_step": 191794, "epoch": 1141} {"train_loss": -11.558874130249023, "global_step": 191795, "epoch": 1141} {"train_loss": -11.464982986450195, "global_step": 191796, "epoch": 1141} {"train_loss": -11.662854194641113, "global_step": 191797, "epoch": 1141} {"train_loss": -11.26272201538086, "global_step": 191798, "epoch": 1141} {"train_loss": -11.622171401977539, "global_step": 191799, "epoch": 1141} {"train_loss": -11.173054695129395, "global_step": 191800, "epoch": 1141} {"train_loss": -11.400527954101562, "global_step": 191801, "epoch": 1141} {"train_loss": -11.379173278808594, "global_step": 191802, "epoch": 1141} {"train_loss": -11.233833312988281, "global_step": 191803, "epoch": 1141} {"train_loss": -11.261716842651367, "global_step": 191804, "epoch": 1141} {"train_loss": -11.579121589660645, "global_step": 191805, "epoch": 1141} {"train_loss": -11.591075897216797, "global_step": 191806, "epoch": 1141} {"train_loss": -11.48045825958252, "global_step": 191807, "epoch": 1141} {"train_loss": -11.573551177978516, "global_step": 191808, "epoch": 1141} {"train_loss": -11.412698745727539, "global_step": 191809, "epoch": 1141} {"train_loss": -11.720813751220703, "global_step": 191810, "epoch": 1141} {"train_loss": -11.657905578613281, "global_step": 191811, "epoch": 1141} {"train_loss": -11.371337890625, "global_step": 191812, "epoch": 1141} {"train_loss": -11.606101989746094, "global_step": 191813, "epoch": 1141} {"train_loss": -11.71654987335205, "global_step": 191814, "epoch": 1141} {"train_loss": -11.446081161499023, "global_step": 191815, "epoch": 1141} {"train_loss": -11.525103569030762, "global_step": 191816, "epoch": 1141} {"train_loss": -11.560492515563965, "global_step": 191817, "epoch": 1141} {"train_loss": -10.782020568847656, "global_step": 191818, "epoch": 1141} {"train_loss": -11.138614654541016, "global_step": 191819, "epoch": 1141} {"train_loss": -11.188070297241211, "global_step": 191820, "epoch": 1141} {"train_loss": -10.712839126586914, "global_step": 191821, "epoch": 1141} {"train_loss": -11.323755264282227, "global_step": 191822, "epoch": 1141} {"train_loss": -11.30351448059082, "global_step": 191823, "epoch": 1141} {"train_loss": -11.240829467773438, "global_step": 191824, "epoch": 1141} {"train_loss": -11.366674423217773, "global_step": 191825, "epoch": 1141} {"train_loss": -11.281476974487305, "global_step": 191826, "epoch": 1141} {"train_loss": -11.480151176452637, "global_step": 191827, "epoch": 1141} {"train_loss": -11.262166023254395, "global_step": 191828, "epoch": 1141} {"train_loss": -11.258947372436523, "global_step": 191829, "epoch": 1141} {"train_loss": -11.489577293395996, "global_step": 191830, "epoch": 1141} {"train_loss": -11.578967094421387, "global_step": 191831, "epoch": 1141} {"train_loss": -11.469565391540527, "global_step": 191832, "epoch": 1141} {"train_loss": -11.35466194152832, "global_step": 191833, "epoch": 1141} {"train_loss": -11.392083168029785, "global_step": 191834, "epoch": 1141} {"train_loss": -11.412399291992188, "global_step": 191835, "epoch": 1141} {"train_loss": -11.574108123779297, "global_step": 191836, "epoch": 1141} {"train_loss": -11.663349151611328, "global_step": 191837, "epoch": 1141} {"train_loss": -11.667459487915039, "global_step": 191838, "epoch": 1141} {"train_loss": -11.216201782226562, "global_step": 191839, "epoch": 1141} {"train_loss": -11.299944877624512, "global_step": 191840, "epoch": 1141} {"train_loss": -11.549918174743652, "global_step": 191841, "epoch": 1141} {"train_loss": -10.562828063964844, "global_step": 191842, "epoch": 1141} {"train_loss": -11.187705993652344, "global_step": 191843, "epoch": 1141} {"train_loss": -10.809236526489258, "global_step": 191844, "epoch": 1141} {"train_loss": -11.399824142456055, "global_step": 191845, "epoch": 1141} {"train_loss": -11.336751937866211, "global_step": 191846, "epoch": 1141} {"train_loss": -11.19160270690918, "global_step": 191847, "epoch": 1141} {"train_loss": -11.023031234741211, "global_step": 191848, "epoch": 1141} {"train_loss": -10.964237213134766, "global_step": 191849, "epoch": 1141} {"train_loss": -10.698808670043945, "global_step": 191850, "epoch": 1141} {"train_loss": -11.029839515686035, "global_step": 191851, "epoch": 1141} {"train_loss": -9.571937561035156, "global_step": 191852, "epoch": 1141} {"train_loss": -11.365434646606445, "global_step": 191853, "epoch": 1141} {"train_loss": -10.03724479675293, "global_step": 191854, "epoch": 1141} {"train_loss": -11.223843875385466, "global_step": 191855, "epoch": 1141, "val_loss": 248979.828125} {"train_loss": -10.463038444519043, "global_step": 191856, "epoch": 1142} {"train_loss": -10.20671272277832, "global_step": 191857, "epoch": 1142} {"train_loss": -11.227217674255371, "global_step": 191858, "epoch": 1142} {"train_loss": -9.900809288024902, "global_step": 191859, "epoch": 1142} {"train_loss": -10.938918113708496, "global_step": 191860, "epoch": 1142} {"train_loss": -10.629722595214844, "global_step": 191861, "epoch": 1142} {"train_loss": -10.710319519042969, "global_step": 191862, "epoch": 1142} {"train_loss": -11.046875, "global_step": 191863, "epoch": 1142} {"train_loss": -10.011833190917969, "global_step": 191864, "epoch": 1142} {"train_loss": -10.149049758911133, "global_step": 191865, "epoch": 1142} {"train_loss": -10.869532585144043, "global_step": 191866, "epoch": 1142} {"train_loss": -10.52907943725586, "global_step": 191867, "epoch": 1142} {"train_loss": -10.790044784545898, "global_step": 191868, "epoch": 1142} {"train_loss": -10.452444076538086, "global_step": 191869, "epoch": 1142} {"train_loss": -10.456033706665039, "global_step": 191870, "epoch": 1142} {"train_loss": -10.908679008483887, "global_step": 191871, "epoch": 1142} {"train_loss": -10.397863388061523, "global_step": 191872, "epoch": 1142} {"train_loss": -10.742074966430664, "global_step": 191873, "epoch": 1142} {"train_loss": -10.501997947692871, "global_step": 191874, "epoch": 1142} {"train_loss": -10.560525894165039, "global_step": 191875, "epoch": 1142} {"train_loss": -10.845478057861328, "global_step": 191876, "epoch": 1142} {"train_loss": -9.98941707611084, "global_step": 191877, "epoch": 1142} {"train_loss": -10.19290828704834, "global_step": 191878, "epoch": 1142} {"train_loss": -10.668708801269531, "global_step": 191879, "epoch": 1142} {"train_loss": -10.079048156738281, "global_step": 191880, "epoch": 1142} {"train_loss": -9.391568183898926, "global_step": 191881, "epoch": 1142} {"train_loss": -10.922727584838867, "global_step": 191882, "epoch": 1142} {"train_loss": -9.156121253967285, "global_step": 191883, "epoch": 1142} {"train_loss": -10.199769973754883, "global_step": 191884, "epoch": 1142} {"train_loss": -10.502792358398438, "global_step": 191885, "epoch": 1142} {"train_loss": -10.462738037109375, "global_step": 191886, "epoch": 1142} {"train_loss": -10.489103317260742, "global_step": 191887, "epoch": 1142} {"train_loss": -10.577277183532715, "global_step": 191888, "epoch": 1142} {"train_loss": -11.076679229736328, "global_step": 191889, "epoch": 1142} {"train_loss": -10.657547950744629, "global_step": 191890, "epoch": 1142} {"train_loss": -10.637582778930664, "global_step": 191891, "epoch": 1142} {"train_loss": -10.60466194152832, "global_step": 191892, "epoch": 1142} {"train_loss": -10.637187957763672, "global_step": 191893, "epoch": 1142} {"train_loss": -10.735783576965332, "global_step": 191894, "epoch": 1142} {"train_loss": -11.217232704162598, "global_step": 191895, "epoch": 1142} {"train_loss": -10.91091537475586, "global_step": 191896, "epoch": 1142} {"train_loss": -10.919742584228516, "global_step": 191897, "epoch": 1142} {"train_loss": -11.089492797851562, "global_step": 191898, "epoch": 1142} {"train_loss": -11.14084243774414, "global_step": 191899, "epoch": 1142} {"train_loss": -11.091211318969727, "global_step": 191900, "epoch": 1142} {"train_loss": -11.093635559082031, "global_step": 191901, "epoch": 1142} {"train_loss": -11.388694763183594, "global_step": 191902, "epoch": 1142} {"train_loss": -11.286306381225586, "global_step": 191903, "epoch": 1142} {"train_loss": -11.209951400756836, "global_step": 191904, "epoch": 1142} {"train_loss": -10.917030334472656, "global_step": 191905, "epoch": 1142} {"train_loss": -11.141183853149414, "global_step": 191906, "epoch": 1142} {"train_loss": -11.333393096923828, "global_step": 191907, "epoch": 1142} {"train_loss": -11.174585342407227, "global_step": 191908, "epoch": 1142} {"train_loss": -11.168328285217285, "global_step": 191909, "epoch": 1142} {"train_loss": -11.438538551330566, "global_step": 191910, "epoch": 1142} {"train_loss": -11.275697708129883, "global_step": 191911, "epoch": 1142} {"train_loss": -11.167922973632812, "global_step": 191912, "epoch": 1142} {"train_loss": -11.465228080749512, "global_step": 191913, "epoch": 1142} {"train_loss": -11.429450988769531, "global_step": 191914, "epoch": 1142} {"train_loss": -11.476131439208984, "global_step": 191915, "epoch": 1142} {"train_loss": -11.426807403564453, "global_step": 191916, "epoch": 1142} {"train_loss": -11.391667366027832, "global_step": 191917, "epoch": 1142} {"train_loss": -11.524155616760254, "global_step": 191918, "epoch": 1142} {"train_loss": -11.386164665222168, "global_step": 191919, "epoch": 1142} {"train_loss": -11.530856132507324, "global_step": 191920, "epoch": 1142} {"train_loss": -11.448073387145996, "global_step": 191921, "epoch": 1142} {"train_loss": -11.435525894165039, "global_step": 191922, "epoch": 1142} {"train_loss": -11.339216232299805, "global_step": 191923, "epoch": 1142} {"train_loss": -11.487558364868164, "global_step": 191924, "epoch": 1142} {"train_loss": -11.506674766540527, "global_step": 191925, "epoch": 1142} {"train_loss": -11.517647743225098, "global_step": 191926, "epoch": 1142} {"train_loss": -11.489187240600586, "global_step": 191927, "epoch": 1142} {"train_loss": -11.315200805664062, "global_step": 191928, "epoch": 1142} {"train_loss": -11.351034164428711, "global_step": 191929, "epoch": 1142} {"train_loss": -11.402650833129883, "global_step": 191930, "epoch": 1142} {"train_loss": -11.237130165100098, "global_step": 191931, "epoch": 1142} {"train_loss": -11.361198425292969, "global_step": 191932, "epoch": 1142} {"train_loss": -11.233596801757812, "global_step": 191933, "epoch": 1142} {"train_loss": -11.528461456298828, "global_step": 191934, "epoch": 1142} {"train_loss": -11.435378074645996, "global_step": 191935, "epoch": 1142} {"train_loss": -10.976558685302734, "global_step": 191936, "epoch": 1142} {"train_loss": -10.997892379760742, "global_step": 191937, "epoch": 1142} {"train_loss": -11.798955917358398, "global_step": 191938, "epoch": 1142} {"train_loss": -11.589654922485352, "global_step": 191939, "epoch": 1142} {"train_loss": -11.122228622436523, "global_step": 191940, "epoch": 1142} {"train_loss": -11.092188835144043, "global_step": 191941, "epoch": 1142} {"train_loss": -11.620990753173828, "global_step": 191942, "epoch": 1142} {"train_loss": -11.314970016479492, "global_step": 191943, "epoch": 1142} {"train_loss": -11.39822769165039, "global_step": 191944, "epoch": 1142} {"train_loss": -11.52951717376709, "global_step": 191945, "epoch": 1142} {"train_loss": -11.478426933288574, "global_step": 191946, "epoch": 1142} {"train_loss": -11.322895050048828, "global_step": 191947, "epoch": 1142} {"train_loss": -11.737545013427734, "global_step": 191948, "epoch": 1142} {"train_loss": -11.277063369750977, "global_step": 191949, "epoch": 1142} {"train_loss": -11.398908615112305, "global_step": 191950, "epoch": 1142} {"train_loss": -11.69857406616211, "global_step": 191951, "epoch": 1142} {"train_loss": -11.745805740356445, "global_step": 191952, "epoch": 1142} {"train_loss": -11.162698745727539, "global_step": 191953, "epoch": 1142} {"train_loss": -11.16057014465332, "global_step": 191954, "epoch": 1142} {"train_loss": -11.406543731689453, "global_step": 191955, "epoch": 1142} {"train_loss": -11.532896041870117, "global_step": 191956, "epoch": 1142} {"train_loss": -11.562983512878418, "global_step": 191957, "epoch": 1142} {"train_loss": -11.648740768432617, "global_step": 191958, "epoch": 1142} {"train_loss": -11.253684997558594, "global_step": 191959, "epoch": 1142} {"train_loss": -11.312841415405273, "global_step": 191960, "epoch": 1142} {"train_loss": -11.458356857299805, "global_step": 191961, "epoch": 1142} {"train_loss": -11.385873794555664, "global_step": 191962, "epoch": 1142} {"train_loss": -11.555712699890137, "global_step": 191963, "epoch": 1142} {"train_loss": -11.375524520874023, "global_step": 191964, "epoch": 1142} {"train_loss": -11.401809692382812, "global_step": 191965, "epoch": 1142} {"train_loss": -10.972933769226074, "global_step": 191966, "epoch": 1142} {"train_loss": -11.361848831176758, "global_step": 191967, "epoch": 1142} {"train_loss": -10.106521606445312, "global_step": 191968, "epoch": 1142} {"train_loss": -9.37696361541748, "global_step": 191969, "epoch": 1142} {"train_loss": -9.235431671142578, "global_step": 191970, "epoch": 1142} {"train_loss": -10.72349739074707, "global_step": 191971, "epoch": 1142} {"train_loss": -10.117144584655762, "global_step": 191972, "epoch": 1142} {"train_loss": -9.306098937988281, "global_step": 191973, "epoch": 1142} {"train_loss": -9.611842155456543, "global_step": 191974, "epoch": 1142} {"train_loss": -10.01803207397461, "global_step": 191975, "epoch": 1142} {"train_loss": -11.137038230895996, "global_step": 191976, "epoch": 1142} {"train_loss": -10.48267650604248, "global_step": 191977, "epoch": 1142} {"train_loss": -10.18903923034668, "global_step": 191978, "epoch": 1142} {"train_loss": -9.692618370056152, "global_step": 191979, "epoch": 1142} {"train_loss": -9.444658279418945, "global_step": 191980, "epoch": 1142} {"train_loss": -10.16810417175293, "global_step": 191981, "epoch": 1142} {"train_loss": -9.973011016845703, "global_step": 191982, "epoch": 1142} {"train_loss": -9.667133331298828, "global_step": 191983, "epoch": 1142} {"train_loss": -10.478713989257812, "global_step": 191984, "epoch": 1142} {"train_loss": -9.443336486816406, "global_step": 191985, "epoch": 1142} {"train_loss": -9.541451454162598, "global_step": 191986, "epoch": 1142} {"train_loss": -10.240127563476562, "global_step": 191987, "epoch": 1142} {"train_loss": -10.215592384338379, "global_step": 191988, "epoch": 1142} {"train_loss": -10.120576858520508, "global_step": 191989, "epoch": 1142} {"train_loss": -10.068696975708008, "global_step": 191990, "epoch": 1142} {"train_loss": -10.884542465209961, "global_step": 191991, "epoch": 1142} {"train_loss": -9.68301010131836, "global_step": 191992, "epoch": 1142} {"train_loss": -10.472551345825195, "global_step": 191993, "epoch": 1142} {"train_loss": -9.714776039123535, "global_step": 191994, "epoch": 1142} {"train_loss": -10.510700225830078, "global_step": 191995, "epoch": 1142} {"train_loss": -9.588162422180176, "global_step": 191996, "epoch": 1142} {"train_loss": -10.627296447753906, "global_step": 191997, "epoch": 1142} {"train_loss": -10.425804138183594, "global_step": 191998, "epoch": 1142} {"train_loss": -9.64674186706543, "global_step": 191999, "epoch": 1142} {"train_loss": -10.431777954101562, "global_step": 192000, "epoch": 1142} {"train_loss": -10.309033393859863, "global_step": 192001, "epoch": 1142} {"train_loss": -10.334043502807617, "global_step": 192002, "epoch": 1142} {"train_loss": -10.372010231018066, "global_step": 192003, "epoch": 1142} {"train_loss": -10.492107391357422, "global_step": 192004, "epoch": 1142} {"train_loss": -10.731877326965332, "global_step": 192005, "epoch": 1142} {"train_loss": -10.56131649017334, "global_step": 192006, "epoch": 1142} {"train_loss": -10.632920265197754, "global_step": 192007, "epoch": 1142} {"train_loss": -11.148845672607422, "global_step": 192008, "epoch": 1142} {"train_loss": -10.826807975769043, "global_step": 192009, "epoch": 1142} {"train_loss": -10.797958374023438, "global_step": 192010, "epoch": 1142} {"train_loss": -10.819185256958008, "global_step": 192011, "epoch": 1142} {"train_loss": -10.894706726074219, "global_step": 192012, "epoch": 1142} {"train_loss": -10.744281768798828, "global_step": 192013, "epoch": 1142} {"train_loss": -10.903989791870117, "global_step": 192014, "epoch": 1142} {"train_loss": -11.060247421264648, "global_step": 192015, "epoch": 1142} {"train_loss": -10.80097770690918, "global_step": 192016, "epoch": 1142} {"train_loss": -11.088922500610352, "global_step": 192017, "epoch": 1142} {"train_loss": -11.149667739868164, "global_step": 192018, "epoch": 1142} {"train_loss": -11.090802192687988, "global_step": 192019, "epoch": 1142} {"train_loss": -10.94201946258545, "global_step": 192020, "epoch": 1142} {"train_loss": -10.924431800842285, "global_step": 192021, "epoch": 1142} {"train_loss": -11.30015754699707, "global_step": 192022, "epoch": 1142} {"train_loss": -10.82111876919156, "global_step": 192023, "epoch": 1142, "val_loss": 251304.265625} {"train_loss": -11.130145072937012, "global_step": 192024, "epoch": 1143} {"train_loss": -11.122774124145508, "global_step": 192025, "epoch": 1143} {"train_loss": -11.04078483581543, "global_step": 192026, "epoch": 1143} {"train_loss": -10.965310096740723, "global_step": 192027, "epoch": 1143} {"train_loss": -11.293402671813965, "global_step": 192028, "epoch": 1143} {"train_loss": -11.079240798950195, "global_step": 192029, "epoch": 1143} {"train_loss": -11.168306350708008, "global_step": 192030, "epoch": 1143} {"train_loss": -11.224523544311523, "global_step": 192031, "epoch": 1143} {"train_loss": -11.129590034484863, "global_step": 192032, "epoch": 1143} {"train_loss": -11.309099197387695, "global_step": 192033, "epoch": 1143} {"train_loss": -11.095743179321289, "global_step": 192034, "epoch": 1143} {"train_loss": -11.391056060791016, "global_step": 192035, "epoch": 1143} {"train_loss": -11.287102699279785, "global_step": 192036, "epoch": 1143} {"train_loss": -11.278236389160156, "global_step": 192037, "epoch": 1143} {"train_loss": -11.343545913696289, "global_step": 192038, "epoch": 1143} {"train_loss": -11.31248664855957, "global_step": 192039, "epoch": 1143} {"train_loss": -11.52708911895752, "global_step": 192040, "epoch": 1143} {"train_loss": -11.300812721252441, "global_step": 192041, "epoch": 1143} {"train_loss": -11.583124160766602, "global_step": 192042, "epoch": 1143} {"train_loss": -11.43505573272705, "global_step": 192043, "epoch": 1143} {"train_loss": -11.505550384521484, "global_step": 192044, "epoch": 1143} {"train_loss": -11.544118881225586, "global_step": 192045, "epoch": 1143} {"train_loss": -11.583070755004883, "global_step": 192046, "epoch": 1143} {"train_loss": -11.636964797973633, "global_step": 192047, "epoch": 1143} {"train_loss": -11.29928207397461, "global_step": 192048, "epoch": 1143} {"train_loss": -11.587345123291016, "global_step": 192049, "epoch": 1143} {"train_loss": -11.57895565032959, "global_step": 192050, "epoch": 1143} {"train_loss": -11.60840129852295, "global_step": 192051, "epoch": 1143} {"train_loss": -11.550114631652832, "global_step": 192052, "epoch": 1143} {"train_loss": -11.474266052246094, "global_step": 192053, "epoch": 1143} {"train_loss": -11.439645767211914, "global_step": 192054, "epoch": 1143} {"train_loss": -11.470379829406738, "global_step": 192055, "epoch": 1143} {"train_loss": -11.27142333984375, "global_step": 192056, "epoch": 1143} {"train_loss": -11.396650314331055, "global_step": 192057, "epoch": 1143} {"train_loss": -11.438421249389648, "global_step": 192058, "epoch": 1143} {"train_loss": -11.24884033203125, "global_step": 192059, "epoch": 1143} {"train_loss": -11.01057243347168, "global_step": 192060, "epoch": 1143} {"train_loss": -11.213319778442383, "global_step": 192061, "epoch": 1143} {"train_loss": -11.631763458251953, "global_step": 192062, "epoch": 1143} {"train_loss": -11.144432067871094, "global_step": 192063, "epoch": 1143} {"train_loss": -11.577269554138184, "global_step": 192064, "epoch": 1143} {"train_loss": -11.014900207519531, "global_step": 192065, "epoch": 1143} {"train_loss": -11.068663597106934, "global_step": 192066, "epoch": 1143} {"train_loss": -11.098381996154785, "global_step": 192067, "epoch": 1143} {"train_loss": -11.49435806274414, "global_step": 192068, "epoch": 1143} {"train_loss": -10.96727180480957, "global_step": 192069, "epoch": 1143} {"train_loss": -11.410144805908203, "global_step": 192070, "epoch": 1143} {"train_loss": -11.586525917053223, "global_step": 192071, "epoch": 1143} {"train_loss": -11.048004150390625, "global_step": 192072, "epoch": 1143} {"train_loss": -11.506175994873047, "global_step": 192073, "epoch": 1143} {"train_loss": -11.471564292907715, "global_step": 192074, "epoch": 1143} {"train_loss": -11.51603889465332, "global_step": 192075, "epoch": 1143} {"train_loss": -11.744017601013184, "global_step": 192076, "epoch": 1143} {"train_loss": -11.681267738342285, "global_step": 192077, "epoch": 1143} {"train_loss": -11.36577033996582, "global_step": 192078, "epoch": 1143} {"train_loss": -11.238910675048828, "global_step": 192079, "epoch": 1143} {"train_loss": -11.565099716186523, "global_step": 192080, "epoch": 1143} {"train_loss": -11.138669967651367, "global_step": 192081, "epoch": 1143} {"train_loss": -10.858938217163086, "global_step": 192082, "epoch": 1143} {"train_loss": -11.11944580078125, "global_step": 192083, "epoch": 1143} {"train_loss": -11.176050186157227, "global_step": 192084, "epoch": 1143} {"train_loss": -11.001965522766113, "global_step": 192085, "epoch": 1143} {"train_loss": -11.498125076293945, "global_step": 192086, "epoch": 1143} {"train_loss": -11.05472469329834, "global_step": 192087, "epoch": 1143} {"train_loss": -10.854120254516602, "global_step": 192088, "epoch": 1143} {"train_loss": -11.526169776916504, "global_step": 192089, "epoch": 1143} {"train_loss": -11.313458442687988, "global_step": 192090, "epoch": 1143} {"train_loss": -10.642303466796875, "global_step": 192091, "epoch": 1143} {"train_loss": -11.319321632385254, "global_step": 192092, "epoch": 1143} {"train_loss": -11.146388053894043, "global_step": 192093, "epoch": 1143} {"train_loss": -11.011003494262695, "global_step": 192094, "epoch": 1143} {"train_loss": -11.19963550567627, "global_step": 192095, "epoch": 1143} {"train_loss": -11.327396392822266, "global_step": 192096, "epoch": 1143} {"train_loss": -11.520998001098633, "global_step": 192097, "epoch": 1143} {"train_loss": -11.088623046875, "global_step": 192098, "epoch": 1143} {"train_loss": -11.329541206359863, "global_step": 192099, "epoch": 1143} {"train_loss": -11.299274444580078, "global_step": 192100, "epoch": 1143} {"train_loss": -11.197113990783691, "global_step": 192101, "epoch": 1143} {"train_loss": -10.829172134399414, "global_step": 192102, "epoch": 1143} {"train_loss": -10.945834159851074, "global_step": 192103, "epoch": 1143} {"train_loss": -10.90561580657959, "global_step": 192104, "epoch": 1143} {"train_loss": -11.349289894104004, "global_step": 192105, "epoch": 1143} {"train_loss": -11.143239974975586, "global_step": 192106, "epoch": 1143} {"train_loss": -11.273297309875488, "global_step": 192107, "epoch": 1143} {"train_loss": -11.348665237426758, "global_step": 192108, "epoch": 1143} {"train_loss": -10.748144149780273, "global_step": 192109, "epoch": 1143} {"train_loss": -11.176138877868652, "global_step": 192110, "epoch": 1143} {"train_loss": -11.296438217163086, "global_step": 192111, "epoch": 1143} {"train_loss": -10.926992416381836, "global_step": 192112, "epoch": 1143} {"train_loss": -11.259870529174805, "global_step": 192113, "epoch": 1143} {"train_loss": -11.196962356567383, "global_step": 192114, "epoch": 1143} {"train_loss": -10.870689392089844, "global_step": 192115, "epoch": 1143} {"train_loss": -11.237377166748047, "global_step": 192116, "epoch": 1143} {"train_loss": -10.604483604431152, "global_step": 192117, "epoch": 1143} {"train_loss": -10.534313201904297, "global_step": 192118, "epoch": 1143} {"train_loss": -10.978836059570312, "global_step": 192119, "epoch": 1143} {"train_loss": -10.833761215209961, "global_step": 192120, "epoch": 1143} {"train_loss": -11.432926177978516, "global_step": 192121, "epoch": 1143} {"train_loss": -10.249284744262695, "global_step": 192122, "epoch": 1143} {"train_loss": -10.840383529663086, "global_step": 192123, "epoch": 1143} {"train_loss": -11.12342357635498, "global_step": 192124, "epoch": 1143} {"train_loss": -10.151467323303223, "global_step": 192125, "epoch": 1143} {"train_loss": -11.209888458251953, "global_step": 192126, "epoch": 1143} {"train_loss": -11.060046195983887, "global_step": 192127, "epoch": 1143} {"train_loss": -11.132797241210938, "global_step": 192128, "epoch": 1143} {"train_loss": -11.326774597167969, "global_step": 192129, "epoch": 1143} {"train_loss": -10.337518692016602, "global_step": 192130, "epoch": 1143} {"train_loss": -10.954610824584961, "global_step": 192131, "epoch": 1143} {"train_loss": -10.90054702758789, "global_step": 192132, "epoch": 1143} {"train_loss": -11.168426513671875, "global_step": 192133, "epoch": 1143} {"train_loss": -10.93701171875, "global_step": 192134, "epoch": 1143} {"train_loss": -10.796875, "global_step": 192135, "epoch": 1143} {"train_loss": -10.943160057067871, "global_step": 192136, "epoch": 1143} {"train_loss": -10.819920539855957, "global_step": 192137, "epoch": 1143} {"train_loss": -10.58368968963623, "global_step": 192138, "epoch": 1143} {"train_loss": -11.028138160705566, "global_step": 192139, "epoch": 1143} {"train_loss": -10.749004364013672, "global_step": 192140, "epoch": 1143} {"train_loss": -11.095672607421875, "global_step": 192141, "epoch": 1143} {"train_loss": -10.942917823791504, "global_step": 192142, "epoch": 1143} {"train_loss": -11.056411743164062, "global_step": 192143, "epoch": 1143} {"train_loss": -11.382994651794434, "global_step": 192144, "epoch": 1143} {"train_loss": -11.033512115478516, "global_step": 192145, "epoch": 1143} {"train_loss": -11.457759857177734, "global_step": 192146, "epoch": 1143} {"train_loss": -11.186046600341797, "global_step": 192147, "epoch": 1143} {"train_loss": -11.054747581481934, "global_step": 192148, "epoch": 1143} {"train_loss": -11.101219177246094, "global_step": 192149, "epoch": 1143} {"train_loss": -11.289467811584473, "global_step": 192150, "epoch": 1143} {"train_loss": -11.220420837402344, "global_step": 192151, "epoch": 1143} {"train_loss": -11.370967864990234, "global_step": 192152, "epoch": 1143} {"train_loss": -10.929160118103027, "global_step": 192153, "epoch": 1143} {"train_loss": -10.952288627624512, "global_step": 192154, "epoch": 1143} {"train_loss": -11.541406631469727, "global_step": 192155, "epoch": 1143} {"train_loss": -10.426572799682617, "global_step": 192156, "epoch": 1143} {"train_loss": -11.153486251831055, "global_step": 192157, "epoch": 1143} {"train_loss": -11.15269660949707, "global_step": 192158, "epoch": 1143} {"train_loss": -11.35558032989502, "global_step": 192159, "epoch": 1143} {"train_loss": -11.400054931640625, "global_step": 192160, "epoch": 1143} {"train_loss": -11.418100357055664, "global_step": 192161, "epoch": 1143} {"train_loss": -11.136014938354492, "global_step": 192162, "epoch": 1143} {"train_loss": -11.5321626663208, "global_step": 192163, "epoch": 1143} {"train_loss": -11.248730659484863, "global_step": 192164, "epoch": 1143} {"train_loss": -11.330948829650879, "global_step": 192165, "epoch": 1143} {"train_loss": -11.280478477478027, "global_step": 192166, "epoch": 1143} {"train_loss": -11.368983268737793, "global_step": 192167, "epoch": 1143} {"train_loss": -11.184286117553711, "global_step": 192168, "epoch": 1143} {"train_loss": -11.399988174438477, "global_step": 192169, "epoch": 1143} {"train_loss": -11.291068077087402, "global_step": 192170, "epoch": 1143} {"train_loss": -11.328170776367188, "global_step": 192171, "epoch": 1143} {"train_loss": -11.511618614196777, "global_step": 192172, "epoch": 1143} {"train_loss": -11.013206481933594, "global_step": 192173, "epoch": 1143} {"train_loss": -11.495969772338867, "global_step": 192174, "epoch": 1143} {"train_loss": -10.990160942077637, "global_step": 192175, "epoch": 1143} {"train_loss": -11.226675033569336, "global_step": 192176, "epoch": 1143} {"train_loss": -10.944294929504395, "global_step": 192177, "epoch": 1143} {"train_loss": -11.465914726257324, "global_step": 192178, "epoch": 1143} {"train_loss": -11.333404541015625, "global_step": 192179, "epoch": 1143} {"train_loss": -11.456277847290039, "global_step": 192180, "epoch": 1143} {"train_loss": -11.33452033996582, "global_step": 192181, "epoch": 1143} {"train_loss": -11.415809631347656, "global_step": 192182, "epoch": 1143} {"train_loss": -11.535575866699219, "global_step": 192183, "epoch": 1143} {"train_loss": -11.22714900970459, "global_step": 192184, "epoch": 1143} {"train_loss": -11.509431838989258, "global_step": 192185, "epoch": 1143} {"train_loss": -11.441184997558594, "global_step": 192186, "epoch": 1143} {"train_loss": -11.361871719360352, "global_step": 192187, "epoch": 1143} {"train_loss": -11.531991958618164, "global_step": 192188, "epoch": 1143} {"train_loss": -11.423755645751953, "global_step": 192189, "epoch": 1143} {"train_loss": -11.203824996948242, "global_step": 192190, "epoch": 1143} {"train_loss": -11.210752021698724, "global_step": 192191, "epoch": 1143, "val_loss": 248731.890625} {"train_loss": -11.636497497558594, "global_step": 192192, "epoch": 1144} {"train_loss": -11.600584030151367, "global_step": 192193, "epoch": 1144} {"train_loss": -11.458281517028809, "global_step": 192194, "epoch": 1144} {"train_loss": -11.643836975097656, "global_step": 192195, "epoch": 1144} {"train_loss": -11.364950180053711, "global_step": 192196, "epoch": 1144} {"train_loss": -11.42801284790039, "global_step": 192197, "epoch": 1144} {"train_loss": -11.51248836517334, "global_step": 192198, "epoch": 1144} {"train_loss": -11.678988456726074, "global_step": 192199, "epoch": 1144} {"train_loss": -11.532219886779785, "global_step": 192200, "epoch": 1144} {"train_loss": -11.48205280303955, "global_step": 192201, "epoch": 1144} {"train_loss": -11.36019515991211, "global_step": 192202, "epoch": 1144} {"train_loss": -11.530635833740234, "global_step": 192203, "epoch": 1144} {"train_loss": -11.508340835571289, "global_step": 192204, "epoch": 1144} {"train_loss": -11.720513343811035, "global_step": 192205, "epoch": 1144} {"train_loss": -11.564899444580078, "global_step": 192206, "epoch": 1144} {"train_loss": -11.613321304321289, "global_step": 192207, "epoch": 1144} {"train_loss": -11.606465339660645, "global_step": 192208, "epoch": 1144} {"train_loss": -11.934001922607422, "global_step": 192209, "epoch": 1144} {"train_loss": -11.934748649597168, "global_step": 192210, "epoch": 1144} {"train_loss": -11.591797828674316, "global_step": 192211, "epoch": 1144} {"train_loss": -11.784612655639648, "global_step": 192212, "epoch": 1144} {"train_loss": -11.769681930541992, "global_step": 192213, "epoch": 1144} {"train_loss": -11.696962356567383, "global_step": 192214, "epoch": 1144} {"train_loss": -11.653352737426758, "global_step": 192215, "epoch": 1144} {"train_loss": -11.70988941192627, "global_step": 192216, "epoch": 1144} {"train_loss": -11.81466007232666, "global_step": 192217, "epoch": 1144} {"train_loss": -11.629585266113281, "global_step": 192218, "epoch": 1144} {"train_loss": -11.350187301635742, "global_step": 192219, "epoch": 1144} {"train_loss": -11.069461822509766, "global_step": 192220, "epoch": 1144} {"train_loss": -11.278586387634277, "global_step": 192221, "epoch": 1144} {"train_loss": -11.257959365844727, "global_step": 192222, "epoch": 1144} {"train_loss": -10.358247756958008, "global_step": 192223, "epoch": 1144} {"train_loss": -10.558320999145508, "global_step": 192224, "epoch": 1144} {"train_loss": -11.41425895690918, "global_step": 192225, "epoch": 1144} {"train_loss": -10.63086223602295, "global_step": 192226, "epoch": 1144} {"train_loss": -9.37845230102539, "global_step": 192227, "epoch": 1144} {"train_loss": -10.469911575317383, "global_step": 192228, "epoch": 1144} {"train_loss": -11.540834426879883, "global_step": 192229, "epoch": 1144} {"train_loss": -10.817072868347168, "global_step": 192230, "epoch": 1144} {"train_loss": -9.962892532348633, "global_step": 192231, "epoch": 1144} {"train_loss": -11.119134902954102, "global_step": 192232, "epoch": 1144} {"train_loss": -10.14415454864502, "global_step": 192233, "epoch": 1144} {"train_loss": -10.670321464538574, "global_step": 192234, "epoch": 1144} {"train_loss": -10.070287704467773, "global_step": 192235, "epoch": 1144} {"train_loss": -11.04238224029541, "global_step": 192236, "epoch": 1144} {"train_loss": -10.290229797363281, "global_step": 192237, "epoch": 1144} {"train_loss": -11.067060470581055, "global_step": 192238, "epoch": 1144} {"train_loss": -11.152397155761719, "global_step": 192239, "epoch": 1144} {"train_loss": -11.146778106689453, "global_step": 192240, "epoch": 1144} {"train_loss": -11.147784233093262, "global_step": 192241, "epoch": 1144} {"train_loss": -10.856794357299805, "global_step": 192242, "epoch": 1144} {"train_loss": -11.3237886428833, "global_step": 192243, "epoch": 1144} {"train_loss": -11.378902435302734, "global_step": 192244, "epoch": 1144} {"train_loss": -11.283824920654297, "global_step": 192245, "epoch": 1144} {"train_loss": -11.279431343078613, "global_step": 192246, "epoch": 1144} {"train_loss": -11.030624389648438, "global_step": 192247, "epoch": 1144} {"train_loss": -11.22429370880127, "global_step": 192248, "epoch": 1144} {"train_loss": -10.998929977416992, "global_step": 192249, "epoch": 1144} {"train_loss": -11.113443374633789, "global_step": 192250, "epoch": 1144} {"train_loss": -11.110639572143555, "global_step": 192251, "epoch": 1144} {"train_loss": -11.318655014038086, "global_step": 192252, "epoch": 1144} {"train_loss": -11.132959365844727, "global_step": 192253, "epoch": 1144} {"train_loss": -11.242748260498047, "global_step": 192254, "epoch": 1144} {"train_loss": -11.220335006713867, "global_step": 192255, "epoch": 1144} {"train_loss": -11.445502281188965, "global_step": 192256, "epoch": 1144} {"train_loss": -11.139830589294434, "global_step": 192257, "epoch": 1144} {"train_loss": -11.24106502532959, "global_step": 192258, "epoch": 1144} {"train_loss": -11.428313255310059, "global_step": 192259, "epoch": 1144} {"train_loss": -11.52066421508789, "global_step": 192260, "epoch": 1144} {"train_loss": -11.625014305114746, "global_step": 192261, "epoch": 1144} {"train_loss": -11.515457153320312, "global_step": 192262, "epoch": 1144} {"train_loss": -11.560503959655762, "global_step": 192263, "epoch": 1144} {"train_loss": -11.325206756591797, "global_step": 192264, "epoch": 1144} {"train_loss": -11.522302627563477, "global_step": 192265, "epoch": 1144} {"train_loss": -11.633155822753906, "global_step": 192266, "epoch": 1144} {"train_loss": -11.098997116088867, "global_step": 192267, "epoch": 1144} {"train_loss": -11.653419494628906, "global_step": 192268, "epoch": 1144} {"train_loss": -11.266923904418945, "global_step": 192269, "epoch": 1144} {"train_loss": -11.444415092468262, "global_step": 192270, "epoch": 1144} {"train_loss": -11.149385452270508, "global_step": 192271, "epoch": 1144} {"train_loss": -11.463979721069336, "global_step": 192272, "epoch": 1144} {"train_loss": -11.325356483459473, "global_step": 192273, "epoch": 1144} {"train_loss": -11.143795013427734, "global_step": 192274, "epoch": 1144} {"train_loss": -11.361228942871094, "global_step": 192275, "epoch": 1144} {"train_loss": -11.37409496307373, "global_step": 192276, "epoch": 1144} {"train_loss": -11.550621032714844, "global_step": 192277, "epoch": 1144} {"train_loss": -11.518510818481445, "global_step": 192278, "epoch": 1144} {"train_loss": -10.883152961730957, "global_step": 192279, "epoch": 1144} {"train_loss": -11.51225471496582, "global_step": 192280, "epoch": 1144} {"train_loss": -11.356301307678223, "global_step": 192281, "epoch": 1144} {"train_loss": -11.331689834594727, "global_step": 192282, "epoch": 1144} {"train_loss": -11.381675720214844, "global_step": 192283, "epoch": 1144} {"train_loss": -11.08835506439209, "global_step": 192284, "epoch": 1144} {"train_loss": -11.04035758972168, "global_step": 192285, "epoch": 1144} {"train_loss": -11.232275009155273, "global_step": 192286, "epoch": 1144} {"train_loss": -11.021116256713867, "global_step": 192287, "epoch": 1144} {"train_loss": -10.48178482055664, "global_step": 192288, "epoch": 1144} {"train_loss": -10.728256225585938, "global_step": 192289, "epoch": 1144} {"train_loss": -10.813281059265137, "global_step": 192290, "epoch": 1144} {"train_loss": -9.71563720703125, "global_step": 192291, "epoch": 1144} {"train_loss": -10.824329376220703, "global_step": 192292, "epoch": 1144} {"train_loss": -10.019501686096191, "global_step": 192293, "epoch": 1144} {"train_loss": -10.097282409667969, "global_step": 192294, "epoch": 1144} {"train_loss": -10.61961555480957, "global_step": 192295, "epoch": 1144} {"train_loss": -10.390154838562012, "global_step": 192296, "epoch": 1144} {"train_loss": -10.542245864868164, "global_step": 192297, "epoch": 1144} {"train_loss": -11.037544250488281, "global_step": 192298, "epoch": 1144} {"train_loss": -10.699712753295898, "global_step": 192299, "epoch": 1144} {"train_loss": -10.838214874267578, "global_step": 192300, "epoch": 1144} {"train_loss": -11.068512916564941, "global_step": 192301, "epoch": 1144} {"train_loss": -11.008801460266113, "global_step": 192302, "epoch": 1144} {"train_loss": -10.850592613220215, "global_step": 192303, "epoch": 1144} {"train_loss": -10.256105422973633, "global_step": 192304, "epoch": 1144} {"train_loss": -10.333844184875488, "global_step": 192305, "epoch": 1144} {"train_loss": -10.01672077178955, "global_step": 192306, "epoch": 1144} {"train_loss": -11.041406631469727, "global_step": 192307, "epoch": 1144} {"train_loss": -9.05777645111084, "global_step": 192308, "epoch": 1144} {"train_loss": -11.325937271118164, "global_step": 192309, "epoch": 1144} {"train_loss": -9.489154815673828, "global_step": 192310, "epoch": 1144} {"train_loss": -10.893781661987305, "global_step": 192311, "epoch": 1144} {"train_loss": -10.07328987121582, "global_step": 192312, "epoch": 1144} {"train_loss": -10.945588111877441, "global_step": 192313, "epoch": 1144} {"train_loss": -10.35335922241211, "global_step": 192314, "epoch": 1144} {"train_loss": -10.69412612915039, "global_step": 192315, "epoch": 1144} {"train_loss": -10.868036270141602, "global_step": 192316, "epoch": 1144} {"train_loss": -11.039112091064453, "global_step": 192317, "epoch": 1144} {"train_loss": -11.009345054626465, "global_step": 192318, "epoch": 1144} {"train_loss": -11.128836631774902, "global_step": 192319, "epoch": 1144} {"train_loss": -11.0938720703125, "global_step": 192320, "epoch": 1144} {"train_loss": -10.89798641204834, "global_step": 192321, "epoch": 1144} {"train_loss": -11.08519458770752, "global_step": 192322, "epoch": 1144} {"train_loss": -11.265188217163086, "global_step": 192323, "epoch": 1144} {"train_loss": -11.043779373168945, "global_step": 192324, "epoch": 1144} {"train_loss": -11.271479606628418, "global_step": 192325, "epoch": 1144} {"train_loss": -11.287553787231445, "global_step": 192326, "epoch": 1144} {"train_loss": -11.379610061645508, "global_step": 192327, "epoch": 1144} {"train_loss": -11.196521759033203, "global_step": 192328, "epoch": 1144} {"train_loss": -11.360879898071289, "global_step": 192329, "epoch": 1144} {"train_loss": -11.244673728942871, "global_step": 192330, "epoch": 1144} {"train_loss": -11.420782089233398, "global_step": 192331, "epoch": 1144} {"train_loss": -11.23617935180664, "global_step": 192332, "epoch": 1144} {"train_loss": -11.334318161010742, "global_step": 192333, "epoch": 1144} {"train_loss": -11.500097274780273, "global_step": 192334, "epoch": 1144} {"train_loss": -11.336506843566895, "global_step": 192335, "epoch": 1144} {"train_loss": -11.396522521972656, "global_step": 192336, "epoch": 1144} {"train_loss": -11.307884216308594, "global_step": 192337, "epoch": 1144} {"train_loss": -11.54845905303955, "global_step": 192338, "epoch": 1144} {"train_loss": -11.36526107788086, "global_step": 192339, "epoch": 1144} {"train_loss": -11.349613189697266, "global_step": 192340, "epoch": 1144} {"train_loss": -11.403854370117188, "global_step": 192341, "epoch": 1144} {"train_loss": -11.446550369262695, "global_step": 192342, "epoch": 1144} {"train_loss": -11.52013111114502, "global_step": 192343, "epoch": 1144} {"train_loss": -11.407140731811523, "global_step": 192344, "epoch": 1144} {"train_loss": -11.596705436706543, "global_step": 192345, "epoch": 1144} {"train_loss": -11.25617790222168, "global_step": 192346, "epoch": 1144} {"train_loss": -11.534929275512695, "global_step": 192347, "epoch": 1144} {"train_loss": -11.155454635620117, "global_step": 192348, "epoch": 1144} {"train_loss": -11.323158264160156, "global_step": 192349, "epoch": 1144} {"train_loss": -11.287395477294922, "global_step": 192350, "epoch": 1144} {"train_loss": -11.501274108886719, "global_step": 192351, "epoch": 1144} {"train_loss": -11.448290824890137, "global_step": 192352, "epoch": 1144} {"train_loss": -11.516756057739258, "global_step": 192353, "epoch": 1144} {"train_loss": -11.139081954956055, "global_step": 192354, "epoch": 1144} {"train_loss": -11.394828796386719, "global_step": 192355, "epoch": 1144} {"train_loss": -11.64708423614502, "global_step": 192356, "epoch": 1144} {"train_loss": -11.527993202209473, "global_step": 192357, "epoch": 1144} {"train_loss": -11.306743621826172, "global_step": 192358, "epoch": 1144} {"train_loss": -11.15155881927127, "global_step": 192359, "epoch": 1144, "val_loss": 252515.078125} {"train_loss": -11.560242652893066, "global_step": 192360, "epoch": 1145} {"train_loss": -11.394569396972656, "global_step": 192361, "epoch": 1145} {"train_loss": -11.369719505310059, "global_step": 192362, "epoch": 1145} {"train_loss": -11.551328659057617, "global_step": 192363, "epoch": 1145} {"train_loss": -11.34387493133545, "global_step": 192364, "epoch": 1145} {"train_loss": -11.250235557556152, "global_step": 192365, "epoch": 1145} {"train_loss": -11.370630264282227, "global_step": 192366, "epoch": 1145} {"train_loss": -11.204878807067871, "global_step": 192367, "epoch": 1145} {"train_loss": -10.75973892211914, "global_step": 192368, "epoch": 1145} {"train_loss": -9.990019798278809, "global_step": 192369, "epoch": 1145} {"train_loss": -10.677261352539062, "global_step": 192370, "epoch": 1145} {"train_loss": -10.971944808959961, "global_step": 192371, "epoch": 1145} {"train_loss": -10.153980255126953, "global_step": 192372, "epoch": 1145} {"train_loss": -10.435253143310547, "global_step": 192373, "epoch": 1145} {"train_loss": -10.914088249206543, "global_step": 192374, "epoch": 1145} {"train_loss": -10.392305374145508, "global_step": 192375, "epoch": 1145} {"train_loss": -10.843130111694336, "global_step": 192376, "epoch": 1145} {"train_loss": -11.26704216003418, "global_step": 192377, "epoch": 1145} {"train_loss": -10.77367877960205, "global_step": 192378, "epoch": 1145} {"train_loss": -10.94877815246582, "global_step": 192379, "epoch": 1145} {"train_loss": -11.537851333618164, "global_step": 192380, "epoch": 1145} {"train_loss": -11.425176620483398, "global_step": 192381, "epoch": 1145} {"train_loss": -10.7021484375, "global_step": 192382, "epoch": 1145} {"train_loss": -11.29111099243164, "global_step": 192383, "epoch": 1145} {"train_loss": -11.297782897949219, "global_step": 192384, "epoch": 1145} {"train_loss": -11.068103790283203, "global_step": 192385, "epoch": 1145} {"train_loss": -11.395023345947266, "global_step": 192386, "epoch": 1145} {"train_loss": -10.924227714538574, "global_step": 192387, "epoch": 1145} {"train_loss": -11.248556137084961, "global_step": 192388, "epoch": 1145} {"train_loss": -11.474313735961914, "global_step": 192389, "epoch": 1145} {"train_loss": -11.030508995056152, "global_step": 192390, "epoch": 1145} {"train_loss": -11.360109329223633, "global_step": 192391, "epoch": 1145} {"train_loss": -11.017906188964844, "global_step": 192392, "epoch": 1145} {"train_loss": -11.287817001342773, "global_step": 192393, "epoch": 1145} {"train_loss": -11.194517135620117, "global_step": 192394, "epoch": 1145} {"train_loss": -11.435776710510254, "global_step": 192395, "epoch": 1145} {"train_loss": -11.287328720092773, "global_step": 192396, "epoch": 1145} {"train_loss": -11.055717468261719, "global_step": 192397, "epoch": 1145} {"train_loss": -11.170496940612793, "global_step": 192398, "epoch": 1145} {"train_loss": -11.277328491210938, "global_step": 192399, "epoch": 1145} {"train_loss": -11.327787399291992, "global_step": 192400, "epoch": 1145} {"train_loss": -11.32694149017334, "global_step": 192401, "epoch": 1145} {"train_loss": -11.109770774841309, "global_step": 192402, "epoch": 1145} {"train_loss": -11.685111999511719, "global_step": 192403, "epoch": 1145} {"train_loss": -11.045982360839844, "global_step": 192404, "epoch": 1145} {"train_loss": -11.251770973205566, "global_step": 192405, "epoch": 1145} {"train_loss": -11.353548049926758, "global_step": 192406, "epoch": 1145} {"train_loss": -11.146134376525879, "global_step": 192407, "epoch": 1145} {"train_loss": -11.432382583618164, "global_step": 192408, "epoch": 1145} {"train_loss": -11.172622680664062, "global_step": 192409, "epoch": 1145} {"train_loss": -11.329460144042969, "global_step": 192410, "epoch": 1145} {"train_loss": -11.156490325927734, "global_step": 192411, "epoch": 1145} {"train_loss": -11.061529159545898, "global_step": 192412, "epoch": 1145} {"train_loss": -11.212661743164062, "global_step": 192413, "epoch": 1145} {"train_loss": -11.438676834106445, "global_step": 192414, "epoch": 1145} {"train_loss": -10.430455207824707, "global_step": 192415, "epoch": 1145} {"train_loss": -10.960238456726074, "global_step": 192416, "epoch": 1145} {"train_loss": -10.99730110168457, "global_step": 192417, "epoch": 1145} {"train_loss": -10.670829772949219, "global_step": 192418, "epoch": 1145} {"train_loss": -10.866140365600586, "global_step": 192419, "epoch": 1145} {"train_loss": -10.19206428527832, "global_step": 192420, "epoch": 1145} {"train_loss": -11.159577369689941, "global_step": 192421, "epoch": 1145} {"train_loss": -10.890411376953125, "global_step": 192422, "epoch": 1145} {"train_loss": -11.187198638916016, "global_step": 192423, "epoch": 1145} {"train_loss": -10.781723022460938, "global_step": 192424, "epoch": 1145} {"train_loss": -10.575915336608887, "global_step": 192425, "epoch": 1145} {"train_loss": -10.576576232910156, "global_step": 192426, "epoch": 1145} {"train_loss": -10.683899879455566, "global_step": 192427, "epoch": 1145} {"train_loss": -11.372005462646484, "global_step": 192428, "epoch": 1145} {"train_loss": -10.527831077575684, "global_step": 192429, "epoch": 1145} {"train_loss": -11.436208724975586, "global_step": 192430, "epoch": 1145} {"train_loss": -10.854482650756836, "global_step": 192431, "epoch": 1145} {"train_loss": -11.077611923217773, "global_step": 192432, "epoch": 1145} {"train_loss": -11.106986999511719, "global_step": 192433, "epoch": 1145} {"train_loss": -10.783376693725586, "global_step": 192434, "epoch": 1145} {"train_loss": -11.423820495605469, "global_step": 192435, "epoch": 1145} {"train_loss": -10.902511596679688, "global_step": 192436, "epoch": 1145} {"train_loss": -11.16215705871582, "global_step": 192437, "epoch": 1145} {"train_loss": -11.093672752380371, "global_step": 192438, "epoch": 1145} {"train_loss": -11.011281967163086, "global_step": 192439, "epoch": 1145} {"train_loss": -11.166019439697266, "global_step": 192440, "epoch": 1145} {"train_loss": -10.92875862121582, "global_step": 192441, "epoch": 1145} {"train_loss": -11.217571258544922, "global_step": 192442, "epoch": 1145} {"train_loss": -11.213849067687988, "global_step": 192443, "epoch": 1145} {"train_loss": -11.161639213562012, "global_step": 192444, "epoch": 1145} {"train_loss": -11.171651840209961, "global_step": 192445, "epoch": 1145} {"train_loss": -11.422666549682617, "global_step": 192446, "epoch": 1145} {"train_loss": -11.121025085449219, "global_step": 192447, "epoch": 1145} {"train_loss": -11.167238235473633, "global_step": 192448, "epoch": 1145} {"train_loss": -10.80091667175293, "global_step": 192449, "epoch": 1145} {"train_loss": -10.72108268737793, "global_step": 192450, "epoch": 1145} {"train_loss": -11.291694641113281, "global_step": 192451, "epoch": 1145} {"train_loss": -10.629345893859863, "global_step": 192452, "epoch": 1145} {"train_loss": -11.044073104858398, "global_step": 192453, "epoch": 1145} {"train_loss": -11.163761138916016, "global_step": 192454, "epoch": 1145} {"train_loss": -11.049924850463867, "global_step": 192455, "epoch": 1145} {"train_loss": -10.665371894836426, "global_step": 192456, "epoch": 1145} {"train_loss": -10.856391906738281, "global_step": 192457, "epoch": 1145} {"train_loss": -11.213239669799805, "global_step": 192458, "epoch": 1145} {"train_loss": -11.309879302978516, "global_step": 192459, "epoch": 1145} {"train_loss": -11.36363410949707, "global_step": 192460, "epoch": 1145} {"train_loss": -11.220117568969727, "global_step": 192461, "epoch": 1145} {"train_loss": -11.257009506225586, "global_step": 192462, "epoch": 1145} {"train_loss": -11.408771514892578, "global_step": 192463, "epoch": 1145} {"train_loss": -11.271963119506836, "global_step": 192464, "epoch": 1145} {"train_loss": -11.32231330871582, "global_step": 192465, "epoch": 1145} {"train_loss": -11.326216697692871, "global_step": 192466, "epoch": 1145} {"train_loss": -11.333276748657227, "global_step": 192467, "epoch": 1145} {"train_loss": -11.631889343261719, "global_step": 192468, "epoch": 1145} {"train_loss": -11.485709190368652, "global_step": 192469, "epoch": 1145} {"train_loss": -11.525211334228516, "global_step": 192470, "epoch": 1145} {"train_loss": -11.601187705993652, "global_step": 192471, "epoch": 1145} {"train_loss": -11.604496002197266, "global_step": 192472, "epoch": 1145} {"train_loss": -11.433080673217773, "global_step": 192473, "epoch": 1145} {"train_loss": -11.466243743896484, "global_step": 192474, "epoch": 1145} {"train_loss": -11.58057975769043, "global_step": 192475, "epoch": 1145} {"train_loss": -11.834648132324219, "global_step": 192476, "epoch": 1145} {"train_loss": -11.75337028503418, "global_step": 192477, "epoch": 1145} {"train_loss": -11.610276222229004, "global_step": 192478, "epoch": 1145} {"train_loss": -11.77227783203125, "global_step": 192479, "epoch": 1145} {"train_loss": -11.696422576904297, "global_step": 192480, "epoch": 1145} {"train_loss": -11.650466918945312, "global_step": 192481, "epoch": 1145} {"train_loss": -11.776521682739258, "global_step": 192482, "epoch": 1145} {"train_loss": -11.673057556152344, "global_step": 192483, "epoch": 1145} {"train_loss": -11.843050003051758, "global_step": 192484, "epoch": 1145} {"train_loss": -11.490894317626953, "global_step": 192485, "epoch": 1145} {"train_loss": -11.516364097595215, "global_step": 192486, "epoch": 1145} {"train_loss": -11.406196594238281, "global_step": 192487, "epoch": 1145} {"train_loss": -11.764646530151367, "global_step": 192488, "epoch": 1145} {"train_loss": -11.476957321166992, "global_step": 192489, "epoch": 1145} {"train_loss": -11.466588020324707, "global_step": 192490, "epoch": 1145} {"train_loss": -11.696023941040039, "global_step": 192491, "epoch": 1145} {"train_loss": -11.521373748779297, "global_step": 192492, "epoch": 1145} {"train_loss": -11.787912368774414, "global_step": 192493, "epoch": 1145} {"train_loss": -11.5858736038208, "global_step": 192494, "epoch": 1145} {"train_loss": -11.766518592834473, "global_step": 192495, "epoch": 1145} {"train_loss": -11.275066375732422, "global_step": 192496, "epoch": 1145} {"train_loss": -11.592206954956055, "global_step": 192497, "epoch": 1145} {"train_loss": -11.315887451171875, "global_step": 192498, "epoch": 1145} {"train_loss": -11.204309463500977, "global_step": 192499, "epoch": 1145} {"train_loss": -11.279694557189941, "global_step": 192500, "epoch": 1145} {"train_loss": -11.80877685546875, "global_step": 192501, "epoch": 1145} {"train_loss": -11.816917419433594, "global_step": 192502, "epoch": 1145} {"train_loss": -11.74326229095459, "global_step": 192503, "epoch": 1145} {"train_loss": -11.652971267700195, "global_step": 192504, "epoch": 1145} {"train_loss": -11.70779037475586, "global_step": 192505, "epoch": 1145} {"train_loss": -11.789151191711426, "global_step": 192506, "epoch": 1145} {"train_loss": -11.801794052124023, "global_step": 192507, "epoch": 1145} {"train_loss": -11.646865844726562, "global_step": 192508, "epoch": 1145} {"train_loss": -11.528675079345703, "global_step": 192509, "epoch": 1145} {"train_loss": -11.54246997833252, "global_step": 192510, "epoch": 1145} {"train_loss": -11.594482421875, "global_step": 192511, "epoch": 1145} {"train_loss": -11.467456817626953, "global_step": 192512, "epoch": 1145} {"train_loss": -11.78216552734375, "global_step": 192513, "epoch": 1145} {"train_loss": -11.689735412597656, "global_step": 192514, "epoch": 1145} {"train_loss": -11.492782592773438, "global_step": 192515, "epoch": 1145} {"train_loss": -11.267406463623047, "global_step": 192516, "epoch": 1145} {"train_loss": -11.505943298339844, "global_step": 192517, "epoch": 1145} {"train_loss": -11.620655059814453, "global_step": 192518, "epoch": 1145} {"train_loss": -11.616162300109863, "global_step": 192519, "epoch": 1145} {"train_loss": -11.59762191772461, "global_step": 192520, "epoch": 1145} {"train_loss": -11.238290786743164, "global_step": 192521, "epoch": 1145} {"train_loss": -10.967876434326172, "global_step": 192522, "epoch": 1145} {"train_loss": -11.517206192016602, "global_step": 192523, "epoch": 1145} {"train_loss": -11.499323844909668, "global_step": 192524, "epoch": 1145} {"train_loss": -11.408771514892578, "global_step": 192525, "epoch": 1145} {"train_loss": -11.151083946228027, "global_step": 192526, "epoch": 1145} {"train_loss": -11.257433482578822, "global_step": 192527, "epoch": 1145, "val_loss": 244648.8125, "train_action_mse_error": 4.728511810302734} {"train_loss": -11.139554977416992, "global_step": 192528, "epoch": 1146} {"train_loss": -11.499935150146484, "global_step": 192529, "epoch": 1146} {"train_loss": -11.733019828796387, "global_step": 192530, "epoch": 1146} {"train_loss": -11.299696922302246, "global_step": 192531, "epoch": 1146} {"train_loss": -10.774956703186035, "global_step": 192532, "epoch": 1146} {"train_loss": -11.26017951965332, "global_step": 192533, "epoch": 1146} {"train_loss": -11.673454284667969, "global_step": 192534, "epoch": 1146} {"train_loss": -11.411131858825684, "global_step": 192535, "epoch": 1146} {"train_loss": -11.017867088317871, "global_step": 192536, "epoch": 1146} {"train_loss": -10.579017639160156, "global_step": 192537, "epoch": 1146} {"train_loss": -10.821834564208984, "global_step": 192538, "epoch": 1146} {"train_loss": -10.591756820678711, "global_step": 192539, "epoch": 1146} {"train_loss": -10.81928539276123, "global_step": 192540, "epoch": 1146} {"train_loss": -10.344242095947266, "global_step": 192541, "epoch": 1146} {"train_loss": -10.073416709899902, "global_step": 192542, "epoch": 1146} {"train_loss": -10.864289283752441, "global_step": 192543, "epoch": 1146} {"train_loss": -9.42637825012207, "global_step": 192544, "epoch": 1146} {"train_loss": -10.72287368774414, "global_step": 192545, "epoch": 1146} {"train_loss": -9.468381881713867, "global_step": 192546, "epoch": 1146} {"train_loss": -9.90217399597168, "global_step": 192547, "epoch": 1146} {"train_loss": -9.579397201538086, "global_step": 192548, "epoch": 1146} {"train_loss": -9.559460639953613, "global_step": 192549, "epoch": 1146} {"train_loss": -9.068441390991211, "global_step": 192550, "epoch": 1146} {"train_loss": -8.565664291381836, "global_step": 192551, "epoch": 1146} {"train_loss": -7.456796169281006, "global_step": 192552, "epoch": 1146} {"train_loss": -9.66568374633789, "global_step": 192553, "epoch": 1146} {"train_loss": -9.048849105834961, "global_step": 192554, "epoch": 1146} {"train_loss": -9.336088180541992, "global_step": 192555, "epoch": 1146} {"train_loss": -10.175912857055664, "global_step": 192556, "epoch": 1146} {"train_loss": -10.550228118896484, "global_step": 192557, "epoch": 1146} {"train_loss": -9.60649585723877, "global_step": 192558, "epoch": 1146} {"train_loss": -11.065569877624512, "global_step": 192559, "epoch": 1146} {"train_loss": -10.233048439025879, "global_step": 192560, "epoch": 1146} {"train_loss": -10.50484561920166, "global_step": 192561, "epoch": 1146} {"train_loss": -10.670501708984375, "global_step": 192562, "epoch": 1146} {"train_loss": -10.511343002319336, "global_step": 192563, "epoch": 1146} {"train_loss": -10.189446449279785, "global_step": 192564, "epoch": 1146} {"train_loss": -11.019307136535645, "global_step": 192565, "epoch": 1146} {"train_loss": -10.465540885925293, "global_step": 192566, "epoch": 1146} {"train_loss": -10.900667190551758, "global_step": 192567, "epoch": 1146} {"train_loss": -10.848627090454102, "global_step": 192568, "epoch": 1146} {"train_loss": -10.616863250732422, "global_step": 192569, "epoch": 1146} {"train_loss": -10.6722412109375, "global_step": 192570, "epoch": 1146} {"train_loss": -10.900749206542969, "global_step": 192571, "epoch": 1146} {"train_loss": -10.578137397766113, "global_step": 192572, "epoch": 1146} {"train_loss": -10.695571899414062, "global_step": 192573, "epoch": 1146} {"train_loss": -10.750967025756836, "global_step": 192574, "epoch": 1146} {"train_loss": -11.012500762939453, "global_step": 192575, "epoch": 1146} {"train_loss": -10.876794815063477, "global_step": 192576, "epoch": 1146} {"train_loss": -10.997297286987305, "global_step": 192577, "epoch": 1146} {"train_loss": -11.006586074829102, "global_step": 192578, "epoch": 1146} {"train_loss": -10.98338794708252, "global_step": 192579, "epoch": 1146} {"train_loss": -11.050537109375, "global_step": 192580, "epoch": 1146} {"train_loss": -11.19409465789795, "global_step": 192581, "epoch": 1146} {"train_loss": -11.074512481689453, "global_step": 192582, "epoch": 1146} {"train_loss": -10.773168563842773, "global_step": 192583, "epoch": 1146} {"train_loss": -11.074278831481934, "global_step": 192584, "epoch": 1146} {"train_loss": -11.282917022705078, "global_step": 192585, "epoch": 1146} {"train_loss": -11.117886543273926, "global_step": 192586, "epoch": 1146} {"train_loss": -11.068575859069824, "global_step": 192587, "epoch": 1146} {"train_loss": -11.143455505371094, "global_step": 192588, "epoch": 1146} {"train_loss": -10.991605758666992, "global_step": 192589, "epoch": 1146} {"train_loss": -11.022645950317383, "global_step": 192590, "epoch": 1146} {"train_loss": -11.21490478515625, "global_step": 192591, "epoch": 1146} {"train_loss": -11.115739822387695, "global_step": 192592, "epoch": 1146} {"train_loss": -11.291955947875977, "global_step": 192593, "epoch": 1146} {"train_loss": -11.229414939880371, "global_step": 192594, "epoch": 1146} {"train_loss": -11.349745750427246, "global_step": 192595, "epoch": 1146} {"train_loss": -11.315838813781738, "global_step": 192596, "epoch": 1146} {"train_loss": -11.414798736572266, "global_step": 192597, "epoch": 1146} {"train_loss": -11.36568546295166, "global_step": 192598, "epoch": 1146} {"train_loss": -11.331151962280273, "global_step": 192599, "epoch": 1146} {"train_loss": -11.45765495300293, "global_step": 192600, "epoch": 1146} {"train_loss": -11.309700012207031, "global_step": 192601, "epoch": 1146} {"train_loss": -11.278462409973145, "global_step": 192602, "epoch": 1146} {"train_loss": -11.499829292297363, "global_step": 192603, "epoch": 1146} {"train_loss": -11.472747802734375, "global_step": 192604, "epoch": 1146} {"train_loss": -11.449346542358398, "global_step": 192605, "epoch": 1146} {"train_loss": -11.257781028747559, "global_step": 192606, "epoch": 1146} {"train_loss": -11.462966918945312, "global_step": 192607, "epoch": 1146} {"train_loss": -11.378195762634277, "global_step": 192608, "epoch": 1146} {"train_loss": -11.358055114746094, "global_step": 192609, "epoch": 1146} {"train_loss": -11.38157844543457, "global_step": 192610, "epoch": 1146} {"train_loss": -11.421443939208984, "global_step": 192611, "epoch": 1146} {"train_loss": -11.391298294067383, "global_step": 192612, "epoch": 1146} {"train_loss": -11.460350036621094, "global_step": 192613, "epoch": 1146} {"train_loss": -11.598344802856445, "global_step": 192614, "epoch": 1146} {"train_loss": -11.50528621673584, "global_step": 192615, "epoch": 1146} {"train_loss": -11.628350257873535, "global_step": 192616, "epoch": 1146} {"train_loss": -11.589521408081055, "global_step": 192617, "epoch": 1146} {"train_loss": -11.460992813110352, "global_step": 192618, "epoch": 1146} {"train_loss": -11.573629379272461, "global_step": 192619, "epoch": 1146} {"train_loss": -11.678285598754883, "global_step": 192620, "epoch": 1146} {"train_loss": -11.48532485961914, "global_step": 192621, "epoch": 1146} {"train_loss": -11.231181144714355, "global_step": 192622, "epoch": 1146} {"train_loss": -11.75334644317627, "global_step": 192623, "epoch": 1146} {"train_loss": -11.530563354492188, "global_step": 192624, "epoch": 1146} {"train_loss": -11.505927085876465, "global_step": 192625, "epoch": 1146} {"train_loss": -11.70394515991211, "global_step": 192626, "epoch": 1146} {"train_loss": -11.570586204528809, "global_step": 192627, "epoch": 1146} {"train_loss": -11.76419448852539, "global_step": 192628, "epoch": 1146} {"train_loss": -11.623640060424805, "global_step": 192629, "epoch": 1146} {"train_loss": -11.636408805847168, "global_step": 192630, "epoch": 1146} {"train_loss": -11.473409652709961, "global_step": 192631, "epoch": 1146} {"train_loss": -11.202627182006836, "global_step": 192632, "epoch": 1146} {"train_loss": -11.220382690429688, "global_step": 192633, "epoch": 1146} {"train_loss": -11.380385398864746, "global_step": 192634, "epoch": 1146} {"train_loss": -11.217796325683594, "global_step": 192635, "epoch": 1146} {"train_loss": -11.265535354614258, "global_step": 192636, "epoch": 1146} {"train_loss": -11.351828575134277, "global_step": 192637, "epoch": 1146} {"train_loss": -11.479085922241211, "global_step": 192638, "epoch": 1146} {"train_loss": -11.397367477416992, "global_step": 192639, "epoch": 1146} {"train_loss": -10.784040451049805, "global_step": 192640, "epoch": 1146} {"train_loss": -10.463212966918945, "global_step": 192641, "epoch": 1146} {"train_loss": -10.339822769165039, "global_step": 192642, "epoch": 1146} {"train_loss": -11.005796432495117, "global_step": 192643, "epoch": 1146} {"train_loss": -10.976861000061035, "global_step": 192644, "epoch": 1146} {"train_loss": -9.625128746032715, "global_step": 192645, "epoch": 1146} {"train_loss": -8.27340316772461, "global_step": 192646, "epoch": 1146} {"train_loss": -10.732405662536621, "global_step": 192647, "epoch": 1146} {"train_loss": -10.066189765930176, "global_step": 192648, "epoch": 1146} {"train_loss": -10.038454055786133, "global_step": 192649, "epoch": 1146} {"train_loss": -9.279147148132324, "global_step": 192650, "epoch": 1146} {"train_loss": -9.064899444580078, "global_step": 192651, "epoch": 1146} {"train_loss": -9.399569511413574, "global_step": 192652, "epoch": 1146} {"train_loss": -9.746208190917969, "global_step": 192653, "epoch": 1146} {"train_loss": -10.571171760559082, "global_step": 192654, "epoch": 1146} {"train_loss": -9.107356071472168, "global_step": 192655, "epoch": 1146} {"train_loss": -10.727094650268555, "global_step": 192656, "epoch": 1146} {"train_loss": -10.029672622680664, "global_step": 192657, "epoch": 1146} {"train_loss": -9.421321868896484, "global_step": 192658, "epoch": 1146} {"train_loss": -10.618038177490234, "global_step": 192659, "epoch": 1146} {"train_loss": -10.076571464538574, "global_step": 192660, "epoch": 1146} {"train_loss": -10.06509017944336, "global_step": 192661, "epoch": 1146} {"train_loss": -10.649484634399414, "global_step": 192662, "epoch": 1146} {"train_loss": -10.183049201965332, "global_step": 192663, "epoch": 1146} {"train_loss": -10.5491943359375, "global_step": 192664, "epoch": 1146} {"train_loss": -10.583181381225586, "global_step": 192665, "epoch": 1146} {"train_loss": -10.4345703125, "global_step": 192666, "epoch": 1146} {"train_loss": -10.233287811279297, "global_step": 192667, "epoch": 1146} {"train_loss": -10.473304748535156, "global_step": 192668, "epoch": 1146} {"train_loss": -9.822038650512695, "global_step": 192669, "epoch": 1146} {"train_loss": -10.480859756469727, "global_step": 192670, "epoch": 1146} {"train_loss": -9.66469669342041, "global_step": 192671, "epoch": 1146} {"train_loss": -10.744638442993164, "global_step": 192672, "epoch": 1146} {"train_loss": -10.204288482666016, "global_step": 192673, "epoch": 1146} {"train_loss": -10.366263389587402, "global_step": 192674, "epoch": 1146} {"train_loss": -10.76144790649414, "global_step": 192675, "epoch": 1146} {"train_loss": -10.74371337890625, "global_step": 192676, "epoch": 1146} {"train_loss": -10.632688522338867, "global_step": 192677, "epoch": 1146} {"train_loss": -10.918123245239258, "global_step": 192678, "epoch": 1146} {"train_loss": -10.694950103759766, "global_step": 192679, "epoch": 1146} {"train_loss": -10.764837265014648, "global_step": 192680, "epoch": 1146} {"train_loss": -10.914884567260742, "global_step": 192681, "epoch": 1146} {"train_loss": -11.072468757629395, "global_step": 192682, "epoch": 1146} {"train_loss": -10.821988105773926, "global_step": 192683, "epoch": 1146} {"train_loss": -10.881698608398438, "global_step": 192684, "epoch": 1146} {"train_loss": -11.092092514038086, "global_step": 192685, "epoch": 1146} {"train_loss": -10.847067832946777, "global_step": 192686, "epoch": 1146} {"train_loss": -10.909055709838867, "global_step": 192687, "epoch": 1146} {"train_loss": -11.02562141418457, "global_step": 192688, "epoch": 1146} {"train_loss": -11.139810562133789, "global_step": 192689, "epoch": 1146} {"train_loss": -11.085929870605469, "global_step": 192690, "epoch": 1146} {"train_loss": -11.009878158569336, "global_step": 192691, "epoch": 1146} {"train_loss": -11.203821182250977, "global_step": 192692, "epoch": 1146} {"train_loss": -11.220020294189453, "global_step": 192693, "epoch": 1146} {"train_loss": -11.329133033752441, "global_step": 192694, "epoch": 1146} {"train_loss": -10.775832213106609, "global_step": 192695, "epoch": 1146, "val_loss": 242400.5625} {"train_loss": -11.34361457824707, "global_step": 192696, "epoch": 1147} {"train_loss": -11.187417030334473, "global_step": 192697, "epoch": 1147} {"train_loss": -11.211210250854492, "global_step": 192698, "epoch": 1147} {"train_loss": -11.198063850402832, "global_step": 192699, "epoch": 1147} {"train_loss": -11.358783721923828, "global_step": 192700, "epoch": 1147} {"train_loss": -11.511735916137695, "global_step": 192701, "epoch": 1147} {"train_loss": -11.426223754882812, "global_step": 192702, "epoch": 1147} {"train_loss": -11.256192207336426, "global_step": 192703, "epoch": 1147} {"train_loss": -11.492218017578125, "global_step": 192704, "epoch": 1147} {"train_loss": -11.285539627075195, "global_step": 192705, "epoch": 1147} {"train_loss": -11.471702575683594, "global_step": 192706, "epoch": 1147} {"train_loss": -11.39981746673584, "global_step": 192707, "epoch": 1147} {"train_loss": -11.323007583618164, "global_step": 192708, "epoch": 1147} {"train_loss": -11.417144775390625, "global_step": 192709, "epoch": 1147} {"train_loss": -11.340433120727539, "global_step": 192710, "epoch": 1147} {"train_loss": -11.342491149902344, "global_step": 192711, "epoch": 1147} {"train_loss": -11.580141067504883, "global_step": 192712, "epoch": 1147} {"train_loss": -11.620525360107422, "global_step": 192713, "epoch": 1147} {"train_loss": -11.539224624633789, "global_step": 192714, "epoch": 1147} {"train_loss": -11.367976188659668, "global_step": 192715, "epoch": 1147} {"train_loss": -11.167423248291016, "global_step": 192716, "epoch": 1147} {"train_loss": -11.613907814025879, "global_step": 192717, "epoch": 1147} {"train_loss": -11.491365432739258, "global_step": 192718, "epoch": 1147} {"train_loss": -11.725335121154785, "global_step": 192719, "epoch": 1147} {"train_loss": -11.392106056213379, "global_step": 192720, "epoch": 1147} {"train_loss": -11.448202133178711, "global_step": 192721, "epoch": 1147} {"train_loss": -11.272645950317383, "global_step": 192722, "epoch": 1147} {"train_loss": -11.27358627319336, "global_step": 192723, "epoch": 1147} {"train_loss": -11.496382713317871, "global_step": 192724, "epoch": 1147} {"train_loss": -11.404172897338867, "global_step": 192725, "epoch": 1147} {"train_loss": -11.489059448242188, "global_step": 192726, "epoch": 1147} {"train_loss": -11.19926643371582, "global_step": 192727, "epoch": 1147} {"train_loss": -11.72653865814209, "global_step": 192728, "epoch": 1147} {"train_loss": -11.454566955566406, "global_step": 192729, "epoch": 1147} {"train_loss": -11.504758834838867, "global_step": 192730, "epoch": 1147} {"train_loss": -11.319253921508789, "global_step": 192731, "epoch": 1147} {"train_loss": -11.411870956420898, "global_step": 192732, "epoch": 1147} {"train_loss": -11.169210433959961, "global_step": 192733, "epoch": 1147} {"train_loss": -11.678279876708984, "global_step": 192734, "epoch": 1147} {"train_loss": -11.497946739196777, "global_step": 192735, "epoch": 1147} {"train_loss": -11.148321151733398, "global_step": 192736, "epoch": 1147} {"train_loss": -11.621545791625977, "global_step": 192737, "epoch": 1147} {"train_loss": -11.249295234680176, "global_step": 192738, "epoch": 1147} {"train_loss": -11.31115436553955, "global_step": 192739, "epoch": 1147} {"train_loss": -11.12898063659668, "global_step": 192740, "epoch": 1147} {"train_loss": -11.4542236328125, "global_step": 192741, "epoch": 1147} {"train_loss": -11.518295288085938, "global_step": 192742, "epoch": 1147} {"train_loss": -10.75998592376709, "global_step": 192743, "epoch": 1147} {"train_loss": -10.835741996765137, "global_step": 192744, "epoch": 1147} {"train_loss": -11.075416564941406, "global_step": 192745, "epoch": 1147} {"train_loss": -11.237066268920898, "global_step": 192746, "epoch": 1147} {"train_loss": -10.154617309570312, "global_step": 192747, "epoch": 1147} {"train_loss": -10.812477111816406, "global_step": 192748, "epoch": 1147} {"train_loss": -11.079744338989258, "global_step": 192749, "epoch": 1147} {"train_loss": -10.927850723266602, "global_step": 192750, "epoch": 1147} {"train_loss": -11.102300643920898, "global_step": 192751, "epoch": 1147} {"train_loss": -11.21098804473877, "global_step": 192752, "epoch": 1147} {"train_loss": -10.588666915893555, "global_step": 192753, "epoch": 1147} {"train_loss": -11.304292678833008, "global_step": 192754, "epoch": 1147} {"train_loss": -10.977724075317383, "global_step": 192755, "epoch": 1147} {"train_loss": -10.620322227478027, "global_step": 192756, "epoch": 1147} {"train_loss": -11.020623207092285, "global_step": 192757, "epoch": 1147} {"train_loss": -10.442718505859375, "global_step": 192758, "epoch": 1147} {"train_loss": -11.156197547912598, "global_step": 192759, "epoch": 1147} {"train_loss": -11.334246635437012, "global_step": 192760, "epoch": 1147} {"train_loss": -10.330913543701172, "global_step": 192761, "epoch": 1147} {"train_loss": -10.48226547241211, "global_step": 192762, "epoch": 1147} {"train_loss": -10.755516052246094, "global_step": 192763, "epoch": 1147} {"train_loss": -8.699810028076172, "global_step": 192764, "epoch": 1147} {"train_loss": -10.991331100463867, "global_step": 192765, "epoch": 1147} {"train_loss": -8.871145248413086, "global_step": 192766, "epoch": 1147} {"train_loss": -10.53177261352539, "global_step": 192767, "epoch": 1147} {"train_loss": -9.796931266784668, "global_step": 192768, "epoch": 1147} {"train_loss": -10.591463088989258, "global_step": 192769, "epoch": 1147} {"train_loss": -10.205352783203125, "global_step": 192770, "epoch": 1147} {"train_loss": -10.657936096191406, "global_step": 192771, "epoch": 1147} {"train_loss": -10.616669654846191, "global_step": 192772, "epoch": 1147} {"train_loss": -10.6483154296875, "global_step": 192773, "epoch": 1147} {"train_loss": -10.658466339111328, "global_step": 192774, "epoch": 1147} {"train_loss": -10.780301094055176, "global_step": 192775, "epoch": 1147} {"train_loss": -11.068225860595703, "global_step": 192776, "epoch": 1147} {"train_loss": -11.04642105102539, "global_step": 192777, "epoch": 1147} {"train_loss": -11.168392181396484, "global_step": 192778, "epoch": 1147} {"train_loss": -11.02845573425293, "global_step": 192779, "epoch": 1147} {"train_loss": -10.771920204162598, "global_step": 192780, "epoch": 1147} {"train_loss": -11.121752738952637, "global_step": 192781, "epoch": 1147} {"train_loss": -10.873191833496094, "global_step": 192782, "epoch": 1147} {"train_loss": -11.2109375, "global_step": 192783, "epoch": 1147} {"train_loss": -11.053281784057617, "global_step": 192784, "epoch": 1147} {"train_loss": -11.144994735717773, "global_step": 192785, "epoch": 1147} {"train_loss": -10.744278907775879, "global_step": 192786, "epoch": 1147} {"train_loss": -11.194130897521973, "global_step": 192787, "epoch": 1147} {"train_loss": -11.00541877746582, "global_step": 192788, "epoch": 1147} {"train_loss": -11.205211639404297, "global_step": 192789, "epoch": 1147} {"train_loss": -11.061887741088867, "global_step": 192790, "epoch": 1147} {"train_loss": -11.25433349609375, "global_step": 192791, "epoch": 1147} {"train_loss": -11.218990325927734, "global_step": 192792, "epoch": 1147} {"train_loss": -11.259127616882324, "global_step": 192793, "epoch": 1147} {"train_loss": -11.193127632141113, "global_step": 192794, "epoch": 1147} {"train_loss": -11.060232162475586, "global_step": 192795, "epoch": 1147} {"train_loss": -11.409318923950195, "global_step": 192796, "epoch": 1147} {"train_loss": -11.09755802154541, "global_step": 192797, "epoch": 1147} {"train_loss": -11.195086479187012, "global_step": 192798, "epoch": 1147} {"train_loss": -10.913322448730469, "global_step": 192799, "epoch": 1147} {"train_loss": -11.248150825500488, "global_step": 192800, "epoch": 1147} {"train_loss": -11.029573440551758, "global_step": 192801, "epoch": 1147} {"train_loss": -11.183660507202148, "global_step": 192802, "epoch": 1147} {"train_loss": -11.405661582946777, "global_step": 192803, "epoch": 1147} {"train_loss": -11.224583625793457, "global_step": 192804, "epoch": 1147} {"train_loss": -11.434867858886719, "global_step": 192805, "epoch": 1147} {"train_loss": -11.049253463745117, "global_step": 192806, "epoch": 1147} {"train_loss": -11.119538307189941, "global_step": 192807, "epoch": 1147} {"train_loss": -11.333938598632812, "global_step": 192808, "epoch": 1147} {"train_loss": -11.0737886428833, "global_step": 192809, "epoch": 1147} {"train_loss": -11.392763137817383, "global_step": 192810, "epoch": 1147} {"train_loss": -11.025226593017578, "global_step": 192811, "epoch": 1147} {"train_loss": -11.38370418548584, "global_step": 192812, "epoch": 1147} {"train_loss": -11.313657760620117, "global_step": 192813, "epoch": 1147} {"train_loss": -11.464353561401367, "global_step": 192814, "epoch": 1147} {"train_loss": -11.0679931640625, "global_step": 192815, "epoch": 1147} {"train_loss": -11.265363693237305, "global_step": 192816, "epoch": 1147} {"train_loss": -11.263092041015625, "global_step": 192817, "epoch": 1147} {"train_loss": -11.667806625366211, "global_step": 192818, "epoch": 1147} {"train_loss": -11.27904224395752, "global_step": 192819, "epoch": 1147} {"train_loss": -11.466590881347656, "global_step": 192820, "epoch": 1147} {"train_loss": -11.103364944458008, "global_step": 192821, "epoch": 1147} {"train_loss": -11.615452766418457, "global_step": 192822, "epoch": 1147} {"train_loss": -11.145417213439941, "global_step": 192823, "epoch": 1147} {"train_loss": -11.346693992614746, "global_step": 192824, "epoch": 1147} {"train_loss": -11.421896934509277, "global_step": 192825, "epoch": 1147} {"train_loss": -11.194307327270508, "global_step": 192826, "epoch": 1147} {"train_loss": -11.509623527526855, "global_step": 192827, "epoch": 1147} {"train_loss": -11.373786926269531, "global_step": 192828, "epoch": 1147} {"train_loss": -11.51258659362793, "global_step": 192829, "epoch": 1147} {"train_loss": -11.345928192138672, "global_step": 192830, "epoch": 1147} {"train_loss": -11.532278060913086, "global_step": 192831, "epoch": 1147} {"train_loss": -11.294198989868164, "global_step": 192832, "epoch": 1147} {"train_loss": -11.333237648010254, "global_step": 192833, "epoch": 1147} {"train_loss": -11.383561134338379, "global_step": 192834, "epoch": 1147} {"train_loss": -11.530946731567383, "global_step": 192835, "epoch": 1147} {"train_loss": -11.384392738342285, "global_step": 192836, "epoch": 1147} {"train_loss": -11.60872745513916, "global_step": 192837, "epoch": 1147} {"train_loss": -11.722984313964844, "global_step": 192838, "epoch": 1147} {"train_loss": -11.47046184539795, "global_step": 192839, "epoch": 1147} {"train_loss": -11.589162826538086, "global_step": 192840, "epoch": 1147} {"train_loss": -11.704790115356445, "global_step": 192841, "epoch": 1147} {"train_loss": -11.190669059753418, "global_step": 192842, "epoch": 1147} {"train_loss": -11.500444412231445, "global_step": 192843, "epoch": 1147} {"train_loss": -11.26925277709961, "global_step": 192844, "epoch": 1147} {"train_loss": -11.419060707092285, "global_step": 192845, "epoch": 1147} {"train_loss": -11.263526916503906, "global_step": 192846, "epoch": 1147} {"train_loss": -11.439090728759766, "global_step": 192847, "epoch": 1147} {"train_loss": -11.312931060791016, "global_step": 192848, "epoch": 1147} {"train_loss": -11.515077590942383, "global_step": 192849, "epoch": 1147} {"train_loss": -11.089344024658203, "global_step": 192850, "epoch": 1147} {"train_loss": -11.344696044921875, "global_step": 192851, "epoch": 1147} {"train_loss": -11.34929084777832, "global_step": 192852, "epoch": 1147} {"train_loss": -11.473322868347168, "global_step": 192853, "epoch": 1147} {"train_loss": -11.160371780395508, "global_step": 192854, "epoch": 1147} {"train_loss": -11.229910850524902, "global_step": 192855, "epoch": 1147} {"train_loss": -11.693878173828125, "global_step": 192856, "epoch": 1147} {"train_loss": -11.474985122680664, "global_step": 192857, "epoch": 1147} {"train_loss": -11.364398002624512, "global_step": 192858, "epoch": 1147} {"train_loss": -11.639303207397461, "global_step": 192859, "epoch": 1147} {"train_loss": -11.639657974243164, "global_step": 192860, "epoch": 1147} {"train_loss": -11.647130012512207, "global_step": 192861, "epoch": 1147} {"train_loss": -11.558655738830566, "global_step": 192862, "epoch": 1147} {"train_loss": -11.195331528073265, "global_step": 192863, "epoch": 1147, "val_loss": 248653.59375} {"train_loss": -11.436527252197266, "global_step": 192864, "epoch": 1148} {"train_loss": -9.8881196975708, "global_step": 192865, "epoch": 1148} {"train_loss": -10.080785751342773, "global_step": 192866, "epoch": 1148} {"train_loss": -11.41546630859375, "global_step": 192867, "epoch": 1148} {"train_loss": -10.081048965454102, "global_step": 192868, "epoch": 1148} {"train_loss": -10.285091400146484, "global_step": 192869, "epoch": 1148} {"train_loss": -11.339614868164062, "global_step": 192870, "epoch": 1148} {"train_loss": -10.80620002746582, "global_step": 192871, "epoch": 1148} {"train_loss": -11.063044548034668, "global_step": 192872, "epoch": 1148} {"train_loss": -10.806447982788086, "global_step": 192873, "epoch": 1148} {"train_loss": -11.142692565917969, "global_step": 192874, "epoch": 1148} {"train_loss": -11.531702995300293, "global_step": 192875, "epoch": 1148} {"train_loss": -10.684544563293457, "global_step": 192876, "epoch": 1148} {"train_loss": -11.352161407470703, "global_step": 192877, "epoch": 1148} {"train_loss": -11.121869087219238, "global_step": 192878, "epoch": 1148} {"train_loss": -11.352066040039062, "global_step": 192879, "epoch": 1148} {"train_loss": -11.03683853149414, "global_step": 192880, "epoch": 1148} {"train_loss": -11.109933853149414, "global_step": 192881, "epoch": 1148} {"train_loss": -11.190458297729492, "global_step": 192882, "epoch": 1148} {"train_loss": -11.521212577819824, "global_step": 192883, "epoch": 1148} {"train_loss": -11.10147476196289, "global_step": 192884, "epoch": 1148} {"train_loss": -11.306365966796875, "global_step": 192885, "epoch": 1148} {"train_loss": -11.503793716430664, "global_step": 192886, "epoch": 1148} {"train_loss": -11.488913536071777, "global_step": 192887, "epoch": 1148} {"train_loss": -11.436671257019043, "global_step": 192888, "epoch": 1148} {"train_loss": -11.180440902709961, "global_step": 192889, "epoch": 1148} {"train_loss": -11.516510009765625, "global_step": 192890, "epoch": 1148} {"train_loss": -11.202054023742676, "global_step": 192891, "epoch": 1148} {"train_loss": -11.331527709960938, "global_step": 192892, "epoch": 1148} {"train_loss": -11.320762634277344, "global_step": 192893, "epoch": 1148} {"train_loss": -11.378377914428711, "global_step": 192894, "epoch": 1148} {"train_loss": -11.580230712890625, "global_step": 192895, "epoch": 1148} {"train_loss": -10.598495483398438, "global_step": 192896, "epoch": 1148} {"train_loss": -11.028024673461914, "global_step": 192897, "epoch": 1148} {"train_loss": -11.051279067993164, "global_step": 192898, "epoch": 1148} {"train_loss": -10.906723022460938, "global_step": 192899, "epoch": 1148} {"train_loss": -10.5999116897583, "global_step": 192900, "epoch": 1148} {"train_loss": -11.223618507385254, "global_step": 192901, "epoch": 1148} {"train_loss": -10.950756072998047, "global_step": 192902, "epoch": 1148} {"train_loss": -11.227193832397461, "global_step": 192903, "epoch": 1148} {"train_loss": -10.665167808532715, "global_step": 192904, "epoch": 1148} {"train_loss": -10.633365631103516, "global_step": 192905, "epoch": 1148} {"train_loss": -11.242188453674316, "global_step": 192906, "epoch": 1148} {"train_loss": -10.738924026489258, "global_step": 192907, "epoch": 1148} {"train_loss": -10.926372528076172, "global_step": 192908, "epoch": 1148} {"train_loss": -11.254155158996582, "global_step": 192909, "epoch": 1148} {"train_loss": -10.74658203125, "global_step": 192910, "epoch": 1148} {"train_loss": -11.141733169555664, "global_step": 192911, "epoch": 1148} {"train_loss": -11.345934867858887, "global_step": 192912, "epoch": 1148} {"train_loss": -10.979106903076172, "global_step": 192913, "epoch": 1148} {"train_loss": -11.411956787109375, "global_step": 192914, "epoch": 1148} {"train_loss": -11.328852653503418, "global_step": 192915, "epoch": 1148} {"train_loss": -11.427057266235352, "global_step": 192916, "epoch": 1148} {"train_loss": -11.199954986572266, "global_step": 192917, "epoch": 1148} {"train_loss": -11.427804946899414, "global_step": 192918, "epoch": 1148} {"train_loss": -10.867124557495117, "global_step": 192919, "epoch": 1148} {"train_loss": -11.165782928466797, "global_step": 192920, "epoch": 1148} {"train_loss": -11.032833099365234, "global_step": 192921, "epoch": 1148} {"train_loss": -11.414443969726562, "global_step": 192922, "epoch": 1148} {"train_loss": -11.393704414367676, "global_step": 192923, "epoch": 1148} {"train_loss": -11.358047485351562, "global_step": 192924, "epoch": 1148} {"train_loss": -11.357536315917969, "global_step": 192925, "epoch": 1148} {"train_loss": -11.375833511352539, "global_step": 192926, "epoch": 1148} {"train_loss": -11.36861801147461, "global_step": 192927, "epoch": 1148} {"train_loss": -11.493789672851562, "global_step": 192928, "epoch": 1148} {"train_loss": -11.217615127563477, "global_step": 192929, "epoch": 1148} {"train_loss": -11.492974281311035, "global_step": 192930, "epoch": 1148} {"train_loss": -11.220704078674316, "global_step": 192931, "epoch": 1148} {"train_loss": -11.478873252868652, "global_step": 192932, "epoch": 1148} {"train_loss": -11.325775146484375, "global_step": 192933, "epoch": 1148} {"train_loss": -11.425140380859375, "global_step": 192934, "epoch": 1148} {"train_loss": -11.226099014282227, "global_step": 192935, "epoch": 1148} {"train_loss": -11.592775344848633, "global_step": 192936, "epoch": 1148} {"train_loss": -11.329049110412598, "global_step": 192937, "epoch": 1148} {"train_loss": -11.401191711425781, "global_step": 192938, "epoch": 1148} {"train_loss": -11.611733436584473, "global_step": 192939, "epoch": 1148} {"train_loss": -11.174829483032227, "global_step": 192940, "epoch": 1148} {"train_loss": -11.4302978515625, "global_step": 192941, "epoch": 1148} {"train_loss": -11.255629539489746, "global_step": 192942, "epoch": 1148} {"train_loss": -10.955723762512207, "global_step": 192943, "epoch": 1148} {"train_loss": -11.37997817993164, "global_step": 192944, "epoch": 1148} {"train_loss": -11.278339385986328, "global_step": 192945, "epoch": 1148} {"train_loss": -11.609644889831543, "global_step": 192946, "epoch": 1148} {"train_loss": -11.215248107910156, "global_step": 192947, "epoch": 1148} {"train_loss": -11.306509971618652, "global_step": 192948, "epoch": 1148} {"train_loss": -11.629800796508789, "global_step": 192949, "epoch": 1148} {"train_loss": -11.595008850097656, "global_step": 192950, "epoch": 1148} {"train_loss": -11.692835807800293, "global_step": 192951, "epoch": 1148} {"train_loss": -11.054126739501953, "global_step": 192952, "epoch": 1148} {"train_loss": -11.18777084350586, "global_step": 192953, "epoch": 1148} {"train_loss": -11.401158332824707, "global_step": 192954, "epoch": 1148} {"train_loss": -11.581462860107422, "global_step": 192955, "epoch": 1148} {"train_loss": -11.67629623413086, "global_step": 192956, "epoch": 1148} {"train_loss": -11.748210906982422, "global_step": 192957, "epoch": 1148} {"train_loss": -11.521209716796875, "global_step": 192958, "epoch": 1148} {"train_loss": -11.229767799377441, "global_step": 192959, "epoch": 1148} {"train_loss": -11.452022552490234, "global_step": 192960, "epoch": 1148} {"train_loss": -11.452523231506348, "global_step": 192961, "epoch": 1148} {"train_loss": -10.890043258666992, "global_step": 192962, "epoch": 1148} {"train_loss": -11.083839416503906, "global_step": 192963, "epoch": 1148} {"train_loss": -11.482673645019531, "global_step": 192964, "epoch": 1148} {"train_loss": -11.240948677062988, "global_step": 192965, "epoch": 1148} {"train_loss": -10.898258209228516, "global_step": 192966, "epoch": 1148} {"train_loss": -10.664216041564941, "global_step": 192967, "epoch": 1148} {"train_loss": -11.580323219299316, "global_step": 192968, "epoch": 1148} {"train_loss": -11.652250289916992, "global_step": 192969, "epoch": 1148} {"train_loss": -11.60971450805664, "global_step": 192970, "epoch": 1148} {"train_loss": -11.635209083557129, "global_step": 192971, "epoch": 1148} {"train_loss": -11.566495895385742, "global_step": 192972, "epoch": 1148} {"train_loss": -11.740568161010742, "global_step": 192973, "epoch": 1148} {"train_loss": -11.496406555175781, "global_step": 192974, "epoch": 1148} {"train_loss": -11.465877532958984, "global_step": 192975, "epoch": 1148} {"train_loss": -11.619099617004395, "global_step": 192976, "epoch": 1148} {"train_loss": -11.299005508422852, "global_step": 192977, "epoch": 1148} {"train_loss": -11.381532669067383, "global_step": 192978, "epoch": 1148} {"train_loss": -11.354438781738281, "global_step": 192979, "epoch": 1148} {"train_loss": -10.881643295288086, "global_step": 192980, "epoch": 1148} {"train_loss": -11.130487442016602, "global_step": 192981, "epoch": 1148} {"train_loss": -11.034664154052734, "global_step": 192982, "epoch": 1148} {"train_loss": -11.474800109863281, "global_step": 192983, "epoch": 1148} {"train_loss": -11.093732833862305, "global_step": 192984, "epoch": 1148} {"train_loss": -11.66067886352539, "global_step": 192985, "epoch": 1148} {"train_loss": -11.349015235900879, "global_step": 192986, "epoch": 1148} {"train_loss": -11.178654670715332, "global_step": 192987, "epoch": 1148} {"train_loss": -11.677606582641602, "global_step": 192988, "epoch": 1148} {"train_loss": -11.201574325561523, "global_step": 192989, "epoch": 1148} {"train_loss": -11.442211151123047, "global_step": 192990, "epoch": 1148} {"train_loss": -11.490189552307129, "global_step": 192991, "epoch": 1148} {"train_loss": -11.130867004394531, "global_step": 192992, "epoch": 1148} {"train_loss": -11.475303649902344, "global_step": 192993, "epoch": 1148} {"train_loss": -11.350297927856445, "global_step": 192994, "epoch": 1148} {"train_loss": -11.50326919555664, "global_step": 192995, "epoch": 1148} {"train_loss": -10.900703430175781, "global_step": 192996, "epoch": 1148} {"train_loss": -10.999836921691895, "global_step": 192997, "epoch": 1148} {"train_loss": -11.076339721679688, "global_step": 192998, "epoch": 1148} {"train_loss": -11.185968399047852, "global_step": 192999, "epoch": 1148} {"train_loss": -10.934186935424805, "global_step": 193000, "epoch": 1148} {"train_loss": -10.770637512207031, "global_step": 193001, "epoch": 1148} {"train_loss": -11.179888725280762, "global_step": 193002, "epoch": 1148} {"train_loss": -10.900890350341797, "global_step": 193003, "epoch": 1148} {"train_loss": -11.090380668640137, "global_step": 193004, "epoch": 1148} {"train_loss": -10.722391128540039, "global_step": 193005, "epoch": 1148} {"train_loss": -11.310508728027344, "global_step": 193006, "epoch": 1148} {"train_loss": -11.490854263305664, "global_step": 193007, "epoch": 1148} {"train_loss": -11.405586242675781, "global_step": 193008, "epoch": 1148} {"train_loss": -10.826428413391113, "global_step": 193009, "epoch": 1148} {"train_loss": -11.716825485229492, "global_step": 193010, "epoch": 1148} {"train_loss": -11.23166275024414, "global_step": 193011, "epoch": 1148} {"train_loss": -11.152114868164062, "global_step": 193012, "epoch": 1148} {"train_loss": -11.080459594726562, "global_step": 193013, "epoch": 1148} {"train_loss": -11.009040832519531, "global_step": 193014, "epoch": 1148} {"train_loss": -11.074430465698242, "global_step": 193015, "epoch": 1148} {"train_loss": -10.977359771728516, "global_step": 193016, "epoch": 1148} {"train_loss": -11.335524559020996, "global_step": 193017, "epoch": 1148} {"train_loss": -10.959077835083008, "global_step": 193018, "epoch": 1148} {"train_loss": -11.398187637329102, "global_step": 193019, "epoch": 1148} {"train_loss": -10.78797721862793, "global_step": 193020, "epoch": 1148} {"train_loss": -11.552362442016602, "global_step": 193021, "epoch": 1148} {"train_loss": -10.618224143981934, "global_step": 193022, "epoch": 1148} {"train_loss": -10.902831077575684, "global_step": 193023, "epoch": 1148} {"train_loss": -10.840137481689453, "global_step": 193024, "epoch": 1148} {"train_loss": -10.796836853027344, "global_step": 193025, "epoch": 1148} {"train_loss": -10.854844093322754, "global_step": 193026, "epoch": 1148} {"train_loss": -11.085601806640625, "global_step": 193027, "epoch": 1148} {"train_loss": -10.297728538513184, "global_step": 193028, "epoch": 1148} {"train_loss": -11.09503173828125, "global_step": 193029, "epoch": 1148} {"train_loss": -10.414838790893555, "global_step": 193030, "epoch": 1148} {"train_loss": -11.19429502033052, "global_step": 193031, "epoch": 1148, "val_loss": 250997.671875} {"train_loss": -11.457530975341797, "global_step": 193032, "epoch": 1149} {"train_loss": -10.52093505859375, "global_step": 193033, "epoch": 1149} {"train_loss": -10.575111389160156, "global_step": 193034, "epoch": 1149} {"train_loss": -10.860380172729492, "global_step": 193035, "epoch": 1149} {"train_loss": -10.189250946044922, "global_step": 193036, "epoch": 1149} {"train_loss": -11.028470993041992, "global_step": 193037, "epoch": 1149} {"train_loss": -10.377939224243164, "global_step": 193038, "epoch": 1149} {"train_loss": -11.07338809967041, "global_step": 193039, "epoch": 1149} {"train_loss": -10.664064407348633, "global_step": 193040, "epoch": 1149} {"train_loss": -10.84892749786377, "global_step": 193041, "epoch": 1149} {"train_loss": -11.125143051147461, "global_step": 193042, "epoch": 1149} {"train_loss": -10.88090705871582, "global_step": 193043, "epoch": 1149} {"train_loss": -10.856245040893555, "global_step": 193044, "epoch": 1149} {"train_loss": -10.637737274169922, "global_step": 193045, "epoch": 1149} {"train_loss": -11.190529823303223, "global_step": 193046, "epoch": 1149} {"train_loss": -10.931461334228516, "global_step": 193047, "epoch": 1149} {"train_loss": -11.345710754394531, "global_step": 193048, "epoch": 1149} {"train_loss": -10.66540813446045, "global_step": 193049, "epoch": 1149} {"train_loss": -11.235734939575195, "global_step": 193050, "epoch": 1149} {"train_loss": -11.0968017578125, "global_step": 193051, "epoch": 1149} {"train_loss": -11.013873100280762, "global_step": 193052, "epoch": 1149} {"train_loss": -10.990199089050293, "global_step": 193053, "epoch": 1149} {"train_loss": -11.00977897644043, "global_step": 193054, "epoch": 1149} {"train_loss": -11.267633438110352, "global_step": 193055, "epoch": 1149} {"train_loss": -11.325909614562988, "global_step": 193056, "epoch": 1149} {"train_loss": -11.252802848815918, "global_step": 193057, "epoch": 1149} {"train_loss": -11.595170021057129, "global_step": 193058, "epoch": 1149} {"train_loss": -11.147907257080078, "global_step": 193059, "epoch": 1149} {"train_loss": -11.443102836608887, "global_step": 193060, "epoch": 1149} {"train_loss": -11.1216402053833, "global_step": 193061, "epoch": 1149} {"train_loss": -11.153564453125, "global_step": 193062, "epoch": 1149} {"train_loss": -10.832404136657715, "global_step": 193063, "epoch": 1149} {"train_loss": -11.392500877380371, "global_step": 193064, "epoch": 1149} {"train_loss": -11.35055160522461, "global_step": 193065, "epoch": 1149} {"train_loss": -11.458803176879883, "global_step": 193066, "epoch": 1149} {"train_loss": -11.30734634399414, "global_step": 193067, "epoch": 1149} {"train_loss": -11.452933311462402, "global_step": 193068, "epoch": 1149} {"train_loss": -11.162353515625, "global_step": 193069, "epoch": 1149} {"train_loss": -11.266486167907715, "global_step": 193070, "epoch": 1149} {"train_loss": -11.339378356933594, "global_step": 193071, "epoch": 1149} {"train_loss": -11.193291664123535, "global_step": 193072, "epoch": 1149} {"train_loss": -11.410242080688477, "global_step": 193073, "epoch": 1149} {"train_loss": -11.307220458984375, "global_step": 193074, "epoch": 1149} {"train_loss": -11.343494415283203, "global_step": 193075, "epoch": 1149} {"train_loss": -11.244930267333984, "global_step": 193076, "epoch": 1149} {"train_loss": -11.430868148803711, "global_step": 193077, "epoch": 1149} {"train_loss": -11.356252670288086, "global_step": 193078, "epoch": 1149} {"train_loss": -11.562639236450195, "global_step": 193079, "epoch": 1149} {"train_loss": -11.743995666503906, "global_step": 193080, "epoch": 1149} {"train_loss": -11.461588859558105, "global_step": 193081, "epoch": 1149} {"train_loss": -11.232765197753906, "global_step": 193082, "epoch": 1149} {"train_loss": -11.399934768676758, "global_step": 193083, "epoch": 1149} {"train_loss": -11.742864608764648, "global_step": 193084, "epoch": 1149} {"train_loss": -11.64688491821289, "global_step": 193085, "epoch": 1149} {"train_loss": -11.261653900146484, "global_step": 193086, "epoch": 1149} {"train_loss": -11.65266227722168, "global_step": 193087, "epoch": 1149} {"train_loss": -11.560102462768555, "global_step": 193088, "epoch": 1149} {"train_loss": -11.6028470993042, "global_step": 193089, "epoch": 1149} {"train_loss": -11.741035461425781, "global_step": 193090, "epoch": 1149} {"train_loss": -11.589278221130371, "global_step": 193091, "epoch": 1149} {"train_loss": -11.626445770263672, "global_step": 193092, "epoch": 1149} {"train_loss": -11.472333908081055, "global_step": 193093, "epoch": 1149} {"train_loss": -11.780167579650879, "global_step": 193094, "epoch": 1149} {"train_loss": -11.522963523864746, "global_step": 193095, "epoch": 1149} {"train_loss": -11.530401229858398, "global_step": 193096, "epoch": 1149} {"train_loss": -11.651674270629883, "global_step": 193097, "epoch": 1149} {"train_loss": -11.333602905273438, "global_step": 193098, "epoch": 1149} {"train_loss": -11.650162696838379, "global_step": 193099, "epoch": 1149} {"train_loss": -11.070340156555176, "global_step": 193100, "epoch": 1149} {"train_loss": -10.994808197021484, "global_step": 193101, "epoch": 1149} {"train_loss": -11.352713584899902, "global_step": 193102, "epoch": 1149} {"train_loss": -11.690287590026855, "global_step": 193103, "epoch": 1149} {"train_loss": -11.265937805175781, "global_step": 193104, "epoch": 1149} {"train_loss": -11.623170852661133, "global_step": 193105, "epoch": 1149} {"train_loss": -11.865472793579102, "global_step": 193106, "epoch": 1149} {"train_loss": -11.616996765136719, "global_step": 193107, "epoch": 1149} {"train_loss": -11.560054779052734, "global_step": 193108, "epoch": 1149} {"train_loss": -11.732671737670898, "global_step": 193109, "epoch": 1149} {"train_loss": -11.536602020263672, "global_step": 193110, "epoch": 1149} {"train_loss": -11.819221496582031, "global_step": 193111, "epoch": 1149} {"train_loss": -11.539023399353027, "global_step": 193112, "epoch": 1149} {"train_loss": -11.564953804016113, "global_step": 193113, "epoch": 1149} {"train_loss": -11.988757133483887, "global_step": 193114, "epoch": 1149} {"train_loss": -11.722972869873047, "global_step": 193115, "epoch": 1149} {"train_loss": -11.716195106506348, "global_step": 193116, "epoch": 1149} {"train_loss": -11.519342422485352, "global_step": 193117, "epoch": 1149} {"train_loss": -11.820074081420898, "global_step": 193118, "epoch": 1149} {"train_loss": -10.915650367736816, "global_step": 193119, "epoch": 1149} {"train_loss": -11.622087478637695, "global_step": 193120, "epoch": 1149} {"train_loss": -11.615575790405273, "global_step": 193121, "epoch": 1149} {"train_loss": -11.440205574035645, "global_step": 193122, "epoch": 1149} {"train_loss": -10.843562126159668, "global_step": 193123, "epoch": 1149} {"train_loss": -10.422998428344727, "global_step": 193124, "epoch": 1149} {"train_loss": -10.545997619628906, "global_step": 193125, "epoch": 1149} {"train_loss": -10.747962951660156, "global_step": 193126, "epoch": 1149} {"train_loss": -10.80113697052002, "global_step": 193127, "epoch": 1149} {"train_loss": -10.611944198608398, "global_step": 193128, "epoch": 1149} {"train_loss": -10.092318534851074, "global_step": 193129, "epoch": 1149} {"train_loss": -10.354446411132812, "global_step": 193130, "epoch": 1149} {"train_loss": -11.327352523803711, "global_step": 193131, "epoch": 1149} {"train_loss": -10.279597282409668, "global_step": 193132, "epoch": 1149} {"train_loss": -11.199074745178223, "global_step": 193133, "epoch": 1149} {"train_loss": -10.0950927734375, "global_step": 193134, "epoch": 1149} {"train_loss": -11.325006484985352, "global_step": 193135, "epoch": 1149} {"train_loss": -10.116036415100098, "global_step": 193136, "epoch": 1149} {"train_loss": -11.066471099853516, "global_step": 193137, "epoch": 1149} {"train_loss": -10.526752471923828, "global_step": 193138, "epoch": 1149} {"train_loss": -9.717941284179688, "global_step": 193139, "epoch": 1149} {"train_loss": -11.069565773010254, "global_step": 193140, "epoch": 1149} {"train_loss": -10.212017059326172, "global_step": 193141, "epoch": 1149} {"train_loss": -10.616096496582031, "global_step": 193142, "epoch": 1149} {"train_loss": -10.749971389770508, "global_step": 193143, "epoch": 1149} {"train_loss": -9.811819076538086, "global_step": 193144, "epoch": 1149} {"train_loss": -11.453067779541016, "global_step": 193145, "epoch": 1149} {"train_loss": -9.10893440246582, "global_step": 193146, "epoch": 1149} {"train_loss": -11.018495559692383, "global_step": 193147, "epoch": 1149} {"train_loss": -10.06236457824707, "global_step": 193148, "epoch": 1149} {"train_loss": -10.52802562713623, "global_step": 193149, "epoch": 1149} {"train_loss": -10.72494125366211, "global_step": 193150, "epoch": 1149} {"train_loss": -10.359525680541992, "global_step": 193151, "epoch": 1149} {"train_loss": -10.79297924041748, "global_step": 193152, "epoch": 1149} {"train_loss": -10.498912811279297, "global_step": 193153, "epoch": 1149} {"train_loss": -10.855889320373535, "global_step": 193154, "epoch": 1149} {"train_loss": -10.837520599365234, "global_step": 193155, "epoch": 1149} {"train_loss": -10.771499633789062, "global_step": 193156, "epoch": 1149} {"train_loss": -10.85584831237793, "global_step": 193157, "epoch": 1149} {"train_loss": -10.868188858032227, "global_step": 193158, "epoch": 1149} {"train_loss": -11.222345352172852, "global_step": 193159, "epoch": 1149} {"train_loss": -10.603334426879883, "global_step": 193160, "epoch": 1149} {"train_loss": -11.275075912475586, "global_step": 193161, "epoch": 1149} {"train_loss": -10.697830200195312, "global_step": 193162, "epoch": 1149} {"train_loss": -11.133684158325195, "global_step": 193163, "epoch": 1149} {"train_loss": -11.03994083404541, "global_step": 193164, "epoch": 1149} {"train_loss": -11.113004684448242, "global_step": 193165, "epoch": 1149} {"train_loss": -11.00953483581543, "global_step": 193166, "epoch": 1149} {"train_loss": -11.330464363098145, "global_step": 193167, "epoch": 1149} {"train_loss": -10.98610782623291, "global_step": 193168, "epoch": 1149} {"train_loss": -11.042698860168457, "global_step": 193169, "epoch": 1149} {"train_loss": -11.194244384765625, "global_step": 193170, "epoch": 1149} {"train_loss": -10.760285377502441, "global_step": 193171, "epoch": 1149} {"train_loss": -11.050455093383789, "global_step": 193172, "epoch": 1149} {"train_loss": -11.031013488769531, "global_step": 193173, "epoch": 1149} {"train_loss": -11.306797981262207, "global_step": 193174, "epoch": 1149} {"train_loss": -10.95217227935791, "global_step": 193175, "epoch": 1149} {"train_loss": -11.377449035644531, "global_step": 193176, "epoch": 1149} {"train_loss": -11.287067413330078, "global_step": 193177, "epoch": 1149} {"train_loss": -11.16342544555664, "global_step": 193178, "epoch": 1149} {"train_loss": -11.327264785766602, "global_step": 193179, "epoch": 1149} {"train_loss": -11.403984069824219, "global_step": 193180, "epoch": 1149} {"train_loss": -11.4595308303833, "global_step": 193181, "epoch": 1149} {"train_loss": -11.40891170501709, "global_step": 193182, "epoch": 1149} {"train_loss": -11.407608032226562, "global_step": 193183, "epoch": 1149} {"train_loss": -11.53952407836914, "global_step": 193184, "epoch": 1149} {"train_loss": -11.248732566833496, "global_step": 193185, "epoch": 1149} {"train_loss": -11.535380363464355, "global_step": 193186, "epoch": 1149} {"train_loss": -11.558465003967285, "global_step": 193187, "epoch": 1149} {"train_loss": -11.595964431762695, "global_step": 193188, "epoch": 1149} {"train_loss": -11.510913848876953, "global_step": 193189, "epoch": 1149} {"train_loss": -11.555583953857422, "global_step": 193190, "epoch": 1149} {"train_loss": -11.489278793334961, "global_step": 193191, "epoch": 1149} {"train_loss": -11.726181030273438, "global_step": 193192, "epoch": 1149} {"train_loss": -11.57748031616211, "global_step": 193193, "epoch": 1149} {"train_loss": -11.653997421264648, "global_step": 193194, "epoch": 1149} {"train_loss": -11.554727554321289, "global_step": 193195, "epoch": 1149} {"train_loss": -11.477079391479492, "global_step": 193196, "epoch": 1149} {"train_loss": -11.774690628051758, "global_step": 193197, "epoch": 1149} {"train_loss": -11.622817039489746, "global_step": 193198, "epoch": 1149} {"train_loss": -11.161160645030794, "global_step": 193199, "epoch": 1149, "val_loss": 250799.125} {"train_loss": -11.67088794708252, "global_step": 193200, "epoch": 1150} {"train_loss": -11.403704643249512, "global_step": 193201, "epoch": 1150} {"train_loss": -11.761293411254883, "global_step": 193202, "epoch": 1150} {"train_loss": -11.560205459594727, "global_step": 193203, "epoch": 1150} {"train_loss": -11.757959365844727, "global_step": 193204, "epoch": 1150} {"train_loss": -11.577285766601562, "global_step": 193205, "epoch": 1150} {"train_loss": -11.614299774169922, "global_step": 193206, "epoch": 1150} {"train_loss": -11.651664733886719, "global_step": 193207, "epoch": 1150} {"train_loss": -11.828604698181152, "global_step": 193208, "epoch": 1150} {"train_loss": -11.665733337402344, "global_step": 193209, "epoch": 1150} {"train_loss": -11.835370063781738, "global_step": 193210, "epoch": 1150} {"train_loss": -11.825764656066895, "global_step": 193211, "epoch": 1150} {"train_loss": -11.394371032714844, "global_step": 193212, "epoch": 1150} {"train_loss": -11.615808486938477, "global_step": 193213, "epoch": 1150} {"train_loss": -11.72487735748291, "global_step": 193214, "epoch": 1150} {"train_loss": -11.569463729858398, "global_step": 193215, "epoch": 1150} {"train_loss": -11.828509330749512, "global_step": 193216, "epoch": 1150} {"train_loss": -11.928106307983398, "global_step": 193217, "epoch": 1150} {"train_loss": -11.632560729980469, "global_step": 193218, "epoch": 1150} {"train_loss": -11.444770812988281, "global_step": 193219, "epoch": 1150} {"train_loss": -11.672536849975586, "global_step": 193220, "epoch": 1150} {"train_loss": -11.788330078125, "global_step": 193221, "epoch": 1150} {"train_loss": -11.577014923095703, "global_step": 193222, "epoch": 1150} {"train_loss": -11.509278297424316, "global_step": 193223, "epoch": 1150} {"train_loss": -11.410700798034668, "global_step": 193224, "epoch": 1150} {"train_loss": -11.768683433532715, "global_step": 193225, "epoch": 1150} {"train_loss": -11.280238151550293, "global_step": 193226, "epoch": 1150} {"train_loss": -11.349458694458008, "global_step": 193227, "epoch": 1150} {"train_loss": -9.995631217956543, "global_step": 193228, "epoch": 1150} {"train_loss": -10.93376350402832, "global_step": 193229, "epoch": 1150} {"train_loss": -11.198257446289062, "global_step": 193230, "epoch": 1150} {"train_loss": -11.085274696350098, "global_step": 193231, "epoch": 1150} {"train_loss": -10.761138916015625, "global_step": 193232, "epoch": 1150} {"train_loss": -10.95190715789795, "global_step": 193233, "epoch": 1150} {"train_loss": -10.482015609741211, "global_step": 193234, "epoch": 1150} {"train_loss": -9.820937156677246, "global_step": 193235, "epoch": 1150} {"train_loss": -8.99285888671875, "global_step": 193236, "epoch": 1150} {"train_loss": -9.491836547851562, "global_step": 193237, "epoch": 1150} {"train_loss": -9.120884895324707, "global_step": 193238, "epoch": 1150} {"train_loss": -9.237678527832031, "global_step": 193239, "epoch": 1150} {"train_loss": -7.172821044921875, "global_step": 193240, "epoch": 1150} {"train_loss": -9.601348876953125, "global_step": 193241, "epoch": 1150} {"train_loss": -7.357924461364746, "global_step": 193242, "epoch": 1150} {"train_loss": -8.938358306884766, "global_step": 193243, "epoch": 1150} {"train_loss": -7.686656951904297, "global_step": 193244, "epoch": 1150} {"train_loss": -7.8180832862854, "global_step": 193245, "epoch": 1150} {"train_loss": -9.005838394165039, "global_step": 193246, "epoch": 1150} {"train_loss": -9.44650936126709, "global_step": 193247, "epoch": 1150} {"train_loss": -9.411073684692383, "global_step": 193248, "epoch": 1150} {"train_loss": -9.676156997680664, "global_step": 193249, "epoch": 1150} {"train_loss": -10.367307662963867, "global_step": 193250, "epoch": 1150} {"train_loss": -9.830179214477539, "global_step": 193251, "epoch": 1150} {"train_loss": -10.063125610351562, "global_step": 193252, "epoch": 1150} {"train_loss": -10.273451805114746, "global_step": 193253, "epoch": 1150} {"train_loss": -10.205659866333008, "global_step": 193254, "epoch": 1150} {"train_loss": -10.850179672241211, "global_step": 193255, "epoch": 1150} {"train_loss": -10.919017791748047, "global_step": 193256, "epoch": 1150} {"train_loss": -10.678048133850098, "global_step": 193257, "epoch": 1150} {"train_loss": -10.880317687988281, "global_step": 193258, "epoch": 1150} {"train_loss": -10.98643684387207, "global_step": 193259, "epoch": 1150} {"train_loss": -10.732564926147461, "global_step": 193260, "epoch": 1150} {"train_loss": -10.767720222473145, "global_step": 193261, "epoch": 1150} {"train_loss": -10.952286720275879, "global_step": 193262, "epoch": 1150} {"train_loss": -10.725341796875, "global_step": 193263, "epoch": 1150} {"train_loss": -10.715089797973633, "global_step": 193264, "epoch": 1150} {"train_loss": -10.972920417785645, "global_step": 193265, "epoch": 1150} {"train_loss": -10.766801834106445, "global_step": 193266, "epoch": 1150} {"train_loss": -10.77380657196045, "global_step": 193267, "epoch": 1150} {"train_loss": -11.124544143676758, "global_step": 193268, "epoch": 1150} {"train_loss": -11.000421524047852, "global_step": 193269, "epoch": 1150} {"train_loss": -11.046499252319336, "global_step": 193270, "epoch": 1150} {"train_loss": -10.972004890441895, "global_step": 193271, "epoch": 1150} {"train_loss": -10.985051155090332, "global_step": 193272, "epoch": 1150} {"train_loss": -10.834766387939453, "global_step": 193273, "epoch": 1150} {"train_loss": -11.026481628417969, "global_step": 193274, "epoch": 1150} {"train_loss": -10.98025894165039, "global_step": 193275, "epoch": 1150} {"train_loss": -11.019171714782715, "global_step": 193276, "epoch": 1150} {"train_loss": -10.950689315795898, "global_step": 193277, "epoch": 1150} {"train_loss": -11.121335983276367, "global_step": 193278, "epoch": 1150} {"train_loss": -11.318012237548828, "global_step": 193279, "epoch": 1150} {"train_loss": -11.289600372314453, "global_step": 193280, "epoch": 1150} {"train_loss": -11.127277374267578, "global_step": 193281, "epoch": 1150} {"train_loss": -11.394439697265625, "global_step": 193282, "epoch": 1150} {"train_loss": -11.263055801391602, "global_step": 193283, "epoch": 1150} {"train_loss": -11.447540283203125, "global_step": 193284, "epoch": 1150} {"train_loss": -11.380647659301758, "global_step": 193285, "epoch": 1150} {"train_loss": -11.214460372924805, "global_step": 193286, "epoch": 1150} {"train_loss": -11.38088321685791, "global_step": 193287, "epoch": 1150} {"train_loss": -11.362909317016602, "global_step": 193288, "epoch": 1150} {"train_loss": -11.457799911499023, "global_step": 193289, "epoch": 1150} {"train_loss": -11.310940742492676, "global_step": 193290, "epoch": 1150} {"train_loss": -11.489577293395996, "global_step": 193291, "epoch": 1150} {"train_loss": -11.30634593963623, "global_step": 193292, "epoch": 1150} {"train_loss": -11.402122497558594, "global_step": 193293, "epoch": 1150} {"train_loss": -11.467096328735352, "global_step": 193294, "epoch": 1150} {"train_loss": -11.656147956848145, "global_step": 193295, "epoch": 1150} {"train_loss": -11.376213073730469, "global_step": 193296, "epoch": 1150} {"train_loss": -11.397261619567871, "global_step": 193297, "epoch": 1150} {"train_loss": -11.367694854736328, "global_step": 193298, "epoch": 1150} {"train_loss": -11.392064094543457, "global_step": 193299, "epoch": 1150} {"train_loss": -11.664464950561523, "global_step": 193300, "epoch": 1150} {"train_loss": -11.357841491699219, "global_step": 193301, "epoch": 1150} {"train_loss": -11.527017593383789, "global_step": 193302, "epoch": 1150} {"train_loss": -11.575586318969727, "global_step": 193303, "epoch": 1150} {"train_loss": -11.604618072509766, "global_step": 193304, "epoch": 1150} {"train_loss": -11.720605850219727, "global_step": 193305, "epoch": 1150} {"train_loss": -11.339873313903809, "global_step": 193306, "epoch": 1150} {"train_loss": -11.706467628479004, "global_step": 193307, "epoch": 1150} {"train_loss": -11.676961898803711, "global_step": 193308, "epoch": 1150} {"train_loss": -11.604470252990723, "global_step": 193309, "epoch": 1150} {"train_loss": -11.801877975463867, "global_step": 193310, "epoch": 1150} {"train_loss": -11.514227867126465, "global_step": 193311, "epoch": 1150} {"train_loss": -11.799739837646484, "global_step": 193312, "epoch": 1150} {"train_loss": -11.660476684570312, "global_step": 193313, "epoch": 1150} {"train_loss": -11.797788619995117, "global_step": 193314, "epoch": 1150} {"train_loss": -11.73245620727539, "global_step": 193315, "epoch": 1150} {"train_loss": -11.588777542114258, "global_step": 193316, "epoch": 1150} {"train_loss": -11.636453628540039, "global_step": 193317, "epoch": 1150} {"train_loss": -11.70292854309082, "global_step": 193318, "epoch": 1150} {"train_loss": -11.671457290649414, "global_step": 193319, "epoch": 1150} {"train_loss": -11.625513076782227, "global_step": 193320, "epoch": 1150} {"train_loss": -11.606034278869629, "global_step": 193321, "epoch": 1150} {"train_loss": -11.622503280639648, "global_step": 193322, "epoch": 1150} {"train_loss": -11.970693588256836, "global_step": 193323, "epoch": 1150} {"train_loss": -11.894576072692871, "global_step": 193324, "epoch": 1150} {"train_loss": -11.659028053283691, "global_step": 193325, "epoch": 1150} {"train_loss": -11.48681640625, "global_step": 193326, "epoch": 1150} {"train_loss": -11.524486541748047, "global_step": 193327, "epoch": 1150} {"train_loss": -11.610471725463867, "global_step": 193328, "epoch": 1150} {"train_loss": -11.318929672241211, "global_step": 193329, "epoch": 1150} {"train_loss": -11.663532257080078, "global_step": 193330, "epoch": 1150} {"train_loss": -11.224918365478516, "global_step": 193331, "epoch": 1150} {"train_loss": -11.680562973022461, "global_step": 193332, "epoch": 1150} {"train_loss": -11.181047439575195, "global_step": 193333, "epoch": 1150} {"train_loss": -11.206907272338867, "global_step": 193334, "epoch": 1150} {"train_loss": -10.962532043457031, "global_step": 193335, "epoch": 1150} {"train_loss": -10.155313491821289, "global_step": 193336, "epoch": 1150} {"train_loss": -10.026498794555664, "global_step": 193337, "epoch": 1150} {"train_loss": -11.19930648803711, "global_step": 193338, "epoch": 1150} {"train_loss": -11.358695983886719, "global_step": 193339, "epoch": 1150} {"train_loss": -10.703092575073242, "global_step": 193340, "epoch": 1150} {"train_loss": -11.169897079467773, "global_step": 193341, "epoch": 1150} {"train_loss": -10.334976196289062, "global_step": 193342, "epoch": 1150} {"train_loss": -11.136577606201172, "global_step": 193343, "epoch": 1150} {"train_loss": -10.707807540893555, "global_step": 193344, "epoch": 1150} {"train_loss": -11.307449340820312, "global_step": 193345, "epoch": 1150} {"train_loss": -10.138164520263672, "global_step": 193346, "epoch": 1150} {"train_loss": -9.980140686035156, "global_step": 193347, "epoch": 1150} {"train_loss": -11.013787269592285, "global_step": 193348, "epoch": 1150} {"train_loss": -10.839245796203613, "global_step": 193349, "epoch": 1150} {"train_loss": -10.73906135559082, "global_step": 193350, "epoch": 1150} {"train_loss": -10.920231819152832, "global_step": 193351, "epoch": 1150} {"train_loss": -10.540781021118164, "global_step": 193352, "epoch": 1150} {"train_loss": -10.609371185302734, "global_step": 193353, "epoch": 1150} {"train_loss": -8.938314437866211, "global_step": 193354, "epoch": 1150} {"train_loss": -9.512263298034668, "global_step": 193355, "epoch": 1150} {"train_loss": -10.753972053527832, "global_step": 193356, "epoch": 1150} {"train_loss": -10.338994979858398, "global_step": 193357, "epoch": 1150} {"train_loss": -10.775383949279785, "global_step": 193358, "epoch": 1150} {"train_loss": -9.744173049926758, "global_step": 193359, "epoch": 1150} {"train_loss": -10.415319442749023, "global_step": 193360, "epoch": 1150} {"train_loss": -10.129199981689453, "global_step": 193361, "epoch": 1150} {"train_loss": -10.792941093444824, "global_step": 193362, "epoch": 1150} {"train_loss": -10.090141296386719, "global_step": 193363, "epoch": 1150} {"train_loss": -11.10608196258545, "global_step": 193364, "epoch": 1150} {"train_loss": -10.503771781921387, "global_step": 193365, "epoch": 1150} {"train_loss": -10.398475646972656, "global_step": 193366, "epoch": 1150} {"train_loss": -10.94780864318212, "global_step": 193367, "epoch": 1150, "train/sim_max_reward_0": 0.6949644214224812, "train/sim_max_reward_1": 0.9943296216561885, "train/sim_max_reward_2": 0.05378436117423788, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.5823399194466827, "test/sim_max_reward_4400000": 0.29974027361458155, "test/sim_max_reward_4400001": 0.5174574511534954, "test/sim_max_reward_4400002": 0.08330444015458723, "test/sim_max_reward_4400003": 0.9731275692212783, "test/sim_max_reward_4400004": 0.9094889610896633, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 0.38417073818628733, "test/sim_max_reward_4400007": 0.7099678647769759, "test/sim_max_reward_4400008": 0.6202001843205052, "test/sim_max_reward_4400009": 0.4794967092608056, "test/sim_max_reward_4400010": 0.9823023098807301, "test/sim_max_reward_4400011": 0.9150938309729586, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.9825965860519877, "test/sim_max_reward_4400014": 0.9613669547364628, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.960885567227389, "test/sim_max_reward_4400019": 0.5201315378681667, "test/sim_max_reward_4400020": 3.1776990466733094e-05, "test/sim_max_reward_4400021": 0.6361380596638594, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 1.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6021825165887201, "test/sim_max_reward_4400026": 0.060316548145981294, "test/sim_max_reward_4400027": 1.0, "test/sim_max_reward_4400028": 1.0, "test/sim_max_reward_4400029": 0.49183256390094987, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9747854692197482, "test/sim_max_reward_4400032": 0.1886389233279365, "test/sim_max_reward_4400033": 1.0, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.4892414984985966, "test/sim_max_reward_4400036": 0.37471955135051344, "test/sim_max_reward_4400037": 0.9252421378425252, "test/sim_max_reward_4400038": 0.3368286814919356, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.1810053768784295, "test/sim_max_reward_4400042": 0.02941963599060912, "test/sim_max_reward_4400043": 0.9913861687743682, "test/sim_max_reward_4400044": 0.8921852261015759, "test/sim_max_reward_4400045": 0.958465993097283, "test/sim_max_reward_4400046": 0.3079963635066071, "test/sim_max_reward_4400047": 0.9981732641670078, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.32675927642192304, "train/mean_score": 0.7209030539499318, "test/mean_score": 0.5914906179108858, "val_loss": 242257.578125, "train_action_mse_error": 0.6229404807090759} {"train_loss": -10.664186477661133, "global_step": 193368, "epoch": 1151} {"train_loss": -10.770502090454102, "global_step": 193369, "epoch": 1151} {"train_loss": -10.942585945129395, "global_step": 193370, "epoch": 1151} {"train_loss": -10.3662109375, "global_step": 193371, "epoch": 1151} {"train_loss": -10.946065902709961, "global_step": 193372, "epoch": 1151} {"train_loss": -10.812301635742188, "global_step": 193373, "epoch": 1151} {"train_loss": -10.650056838989258, "global_step": 193374, "epoch": 1151} {"train_loss": -11.089661598205566, "global_step": 193375, "epoch": 1151} {"train_loss": -11.077007293701172, "global_step": 193376, "epoch": 1151} {"train_loss": -10.988468170166016, "global_step": 193377, "epoch": 1151} {"train_loss": -11.332544326782227, "global_step": 193378, "epoch": 1151} {"train_loss": -11.091890335083008, "global_step": 193379, "epoch": 1151} {"train_loss": -11.077714920043945, "global_step": 193380, "epoch": 1151} {"train_loss": -11.306694030761719, "global_step": 193381, "epoch": 1151} {"train_loss": -11.075712203979492, "global_step": 193382, "epoch": 1151} {"train_loss": -11.015103340148926, "global_step": 193383, "epoch": 1151} {"train_loss": -11.167252540588379, "global_step": 193384, "epoch": 1151} {"train_loss": -11.288351058959961, "global_step": 193385, "epoch": 1151} {"train_loss": -11.1878662109375, "global_step": 193386, "epoch": 1151} {"train_loss": -11.381353378295898, "global_step": 193387, "epoch": 1151} {"train_loss": -11.107693672180176, "global_step": 193388, "epoch": 1151} {"train_loss": -11.485300064086914, "global_step": 193389, "epoch": 1151} {"train_loss": -11.368149757385254, "global_step": 193390, "epoch": 1151} {"train_loss": -11.210554122924805, "global_step": 193391, "epoch": 1151} {"train_loss": -11.392465591430664, "global_step": 193392, "epoch": 1151} {"train_loss": -11.493090629577637, "global_step": 193393, "epoch": 1151} {"train_loss": -11.440312385559082, "global_step": 193394, "epoch": 1151} {"train_loss": -11.448698043823242, "global_step": 193395, "epoch": 1151} {"train_loss": -11.500329971313477, "global_step": 193396, "epoch": 1151} {"train_loss": -11.292562484741211, "global_step": 193397, "epoch": 1151} {"train_loss": -11.394315719604492, "global_step": 193398, "epoch": 1151} {"train_loss": -11.572362899780273, "global_step": 193399, "epoch": 1151} {"train_loss": -10.99247932434082, "global_step": 193400, "epoch": 1151} {"train_loss": -11.61280632019043, "global_step": 193401, "epoch": 1151} {"train_loss": -11.442658424377441, "global_step": 193402, "epoch": 1151} {"train_loss": -11.478516578674316, "global_step": 193403, "epoch": 1151} {"train_loss": -11.29552936553955, "global_step": 193404, "epoch": 1151} {"train_loss": -11.502946853637695, "global_step": 193405, "epoch": 1151} {"train_loss": -11.561853408813477, "global_step": 193406, "epoch": 1151} {"train_loss": -11.381769180297852, "global_step": 193407, "epoch": 1151} {"train_loss": -11.552875518798828, "global_step": 193408, "epoch": 1151} {"train_loss": -11.624669075012207, "global_step": 193409, "epoch": 1151} {"train_loss": -11.763992309570312, "global_step": 193410, "epoch": 1151} {"train_loss": -11.674149513244629, "global_step": 193411, "epoch": 1151} {"train_loss": -11.549570083618164, "global_step": 193412, "epoch": 1151} {"train_loss": -11.784282684326172, "global_step": 193413, "epoch": 1151} {"train_loss": -11.613176345825195, "global_step": 193414, "epoch": 1151} {"train_loss": -11.716486930847168, "global_step": 193415, "epoch": 1151} {"train_loss": -11.74940299987793, "global_step": 193416, "epoch": 1151} {"train_loss": -11.80611801147461, "global_step": 193417, "epoch": 1151} {"train_loss": -11.718185424804688, "global_step": 193418, "epoch": 1151} {"train_loss": -11.717528343200684, "global_step": 193419, "epoch": 1151} {"train_loss": -11.794913291931152, "global_step": 193420, "epoch": 1151} {"train_loss": -11.728028297424316, "global_step": 193421, "epoch": 1151} {"train_loss": -11.593541145324707, "global_step": 193422, "epoch": 1151} {"train_loss": -11.7173433303833, "global_step": 193423, "epoch": 1151} {"train_loss": -11.771751403808594, "global_step": 193424, "epoch": 1151} {"train_loss": -11.639028549194336, "global_step": 193425, "epoch": 1151} {"train_loss": -11.737646102905273, "global_step": 193426, "epoch": 1151} {"train_loss": -11.809260368347168, "global_step": 193427, "epoch": 1151} {"train_loss": -11.69821548461914, "global_step": 193428, "epoch": 1151} {"train_loss": -11.812249183654785, "global_step": 193429, "epoch": 1151} {"train_loss": -11.270333290100098, "global_step": 193430, "epoch": 1151} {"train_loss": -11.549489974975586, "global_step": 193431, "epoch": 1151} {"train_loss": -11.45428466796875, "global_step": 193432, "epoch": 1151} {"train_loss": -11.48588752746582, "global_step": 193433, "epoch": 1151} {"train_loss": -11.269350051879883, "global_step": 193434, "epoch": 1151} {"train_loss": -11.200523376464844, "global_step": 193435, "epoch": 1151} {"train_loss": -11.19485855102539, "global_step": 193436, "epoch": 1151} {"train_loss": -11.130739212036133, "global_step": 193437, "epoch": 1151} {"train_loss": -11.772198677062988, "global_step": 193438, "epoch": 1151} {"train_loss": -10.968219757080078, "global_step": 193439, "epoch": 1151} {"train_loss": -11.620393753051758, "global_step": 193440, "epoch": 1151} {"train_loss": -11.276002883911133, "global_step": 193441, "epoch": 1151} {"train_loss": -11.082566261291504, "global_step": 193442, "epoch": 1151} {"train_loss": -10.654498100280762, "global_step": 193443, "epoch": 1151} {"train_loss": -10.738996505737305, "global_step": 193444, "epoch": 1151} {"train_loss": -10.604053497314453, "global_step": 193445, "epoch": 1151} {"train_loss": -11.129159927368164, "global_step": 193446, "epoch": 1151} {"train_loss": -11.123544692993164, "global_step": 193447, "epoch": 1151} {"train_loss": -10.790151596069336, "global_step": 193448, "epoch": 1151} {"train_loss": -10.31717300415039, "global_step": 193449, "epoch": 1151} {"train_loss": -10.145325660705566, "global_step": 193450, "epoch": 1151} {"train_loss": -10.053539276123047, "global_step": 193451, "epoch": 1151} {"train_loss": -10.913649559020996, "global_step": 193452, "epoch": 1151} {"train_loss": -10.874722480773926, "global_step": 193453, "epoch": 1151} {"train_loss": -10.691211700439453, "global_step": 193454, "epoch": 1151} {"train_loss": -10.684130668640137, "global_step": 193455, "epoch": 1151} {"train_loss": -10.906339645385742, "global_step": 193456, "epoch": 1151} {"train_loss": -10.558381080627441, "global_step": 193457, "epoch": 1151} {"train_loss": -11.32314682006836, "global_step": 193458, "epoch": 1151} {"train_loss": -9.784366607666016, "global_step": 193459, "epoch": 1151} {"train_loss": -10.740375518798828, "global_step": 193460, "epoch": 1151} {"train_loss": -10.333749771118164, "global_step": 193461, "epoch": 1151} {"train_loss": -10.860627174377441, "global_step": 193462, "epoch": 1151} {"train_loss": -10.047213554382324, "global_step": 193463, "epoch": 1151} {"train_loss": -10.333087921142578, "global_step": 193464, "epoch": 1151} {"train_loss": -10.637821197509766, "global_step": 193465, "epoch": 1151} {"train_loss": -10.279037475585938, "global_step": 193466, "epoch": 1151} {"train_loss": -10.941198348999023, "global_step": 193467, "epoch": 1151} {"train_loss": -10.948877334594727, "global_step": 193468, "epoch": 1151} {"train_loss": -10.710347175598145, "global_step": 193469, "epoch": 1151} {"train_loss": -10.496426582336426, "global_step": 193470, "epoch": 1151} {"train_loss": -10.140274047851562, "global_step": 193471, "epoch": 1151} {"train_loss": -10.540188789367676, "global_step": 193472, "epoch": 1151} {"train_loss": -10.822626113891602, "global_step": 193473, "epoch": 1151} {"train_loss": -10.555606842041016, "global_step": 193474, "epoch": 1151} {"train_loss": -10.795751571655273, "global_step": 193475, "epoch": 1151} {"train_loss": -10.930388450622559, "global_step": 193476, "epoch": 1151} {"train_loss": -11.069890975952148, "global_step": 193477, "epoch": 1151} {"train_loss": -10.904796600341797, "global_step": 193478, "epoch": 1151} {"train_loss": -10.826786041259766, "global_step": 193479, "epoch": 1151} {"train_loss": -10.891483306884766, "global_step": 193480, "epoch": 1151} {"train_loss": -11.067060470581055, "global_step": 193481, "epoch": 1151} {"train_loss": -11.208868026733398, "global_step": 193482, "epoch": 1151} {"train_loss": -11.121572494506836, "global_step": 193483, "epoch": 1151} {"train_loss": -11.105362892150879, "global_step": 193484, "epoch": 1151} {"train_loss": -11.172164916992188, "global_step": 193485, "epoch": 1151} {"train_loss": -11.097610473632812, "global_step": 193486, "epoch": 1151} {"train_loss": -11.30069637298584, "global_step": 193487, "epoch": 1151} {"train_loss": -11.12930965423584, "global_step": 193488, "epoch": 1151} {"train_loss": -11.136688232421875, "global_step": 193489, "epoch": 1151} {"train_loss": -11.252355575561523, "global_step": 193490, "epoch": 1151} {"train_loss": -11.303876876831055, "global_step": 193491, "epoch": 1151} {"train_loss": -11.13829517364502, "global_step": 193492, "epoch": 1151} {"train_loss": -11.283509254455566, "global_step": 193493, "epoch": 1151} {"train_loss": -11.361751556396484, "global_step": 193494, "epoch": 1151} {"train_loss": -11.177003860473633, "global_step": 193495, "epoch": 1151} {"train_loss": -11.083211898803711, "global_step": 193496, "epoch": 1151} {"train_loss": -11.293886184692383, "global_step": 193497, "epoch": 1151} {"train_loss": -11.202516555786133, "global_step": 193498, "epoch": 1151} {"train_loss": -11.255109786987305, "global_step": 193499, "epoch": 1151} {"train_loss": -11.31235408782959, "global_step": 193500, "epoch": 1151} {"train_loss": -11.292335510253906, "global_step": 193501, "epoch": 1151} {"train_loss": -11.260257720947266, "global_step": 193502, "epoch": 1151} {"train_loss": -11.307036399841309, "global_step": 193503, "epoch": 1151} {"train_loss": -11.173100471496582, "global_step": 193504, "epoch": 1151} {"train_loss": -11.521367073059082, "global_step": 193505, "epoch": 1151} {"train_loss": -11.335921287536621, "global_step": 193506, "epoch": 1151} {"train_loss": -11.277198791503906, "global_step": 193507, "epoch": 1151} {"train_loss": -11.40728759765625, "global_step": 193508, "epoch": 1151} {"train_loss": -11.360380172729492, "global_step": 193509, "epoch": 1151} {"train_loss": -11.25390338897705, "global_step": 193510, "epoch": 1151} {"train_loss": -11.316119194030762, "global_step": 193511, "epoch": 1151} {"train_loss": -11.396284103393555, "global_step": 193512, "epoch": 1151} {"train_loss": -11.641693115234375, "global_step": 193513, "epoch": 1151} {"train_loss": -11.618213653564453, "global_step": 193514, "epoch": 1151} {"train_loss": -11.435506820678711, "global_step": 193515, "epoch": 1151} {"train_loss": -11.480199813842773, "global_step": 193516, "epoch": 1151} {"train_loss": -11.61001968383789, "global_step": 193517, "epoch": 1151} {"train_loss": -11.599691390991211, "global_step": 193518, "epoch": 1151} {"train_loss": -11.788671493530273, "global_step": 193519, "epoch": 1151} {"train_loss": -11.504714965820312, "global_step": 193520, "epoch": 1151} {"train_loss": -11.641721725463867, "global_step": 193521, "epoch": 1151} {"train_loss": -11.525640487670898, "global_step": 193522, "epoch": 1151} {"train_loss": -11.719490051269531, "global_step": 193523, "epoch": 1151} {"train_loss": -11.535024642944336, "global_step": 193524, "epoch": 1151} {"train_loss": -11.65594482421875, "global_step": 193525, "epoch": 1151} {"train_loss": -11.528271675109863, "global_step": 193526, "epoch": 1151} {"train_loss": -11.738224029541016, "global_step": 193527, "epoch": 1151} {"train_loss": -11.440898895263672, "global_step": 193528, "epoch": 1151} {"train_loss": -11.80810546875, "global_step": 193529, "epoch": 1151} {"train_loss": -11.586599349975586, "global_step": 193530, "epoch": 1151} {"train_loss": -11.646474838256836, "global_step": 193531, "epoch": 1151} {"train_loss": -11.84715747833252, "global_step": 193532, "epoch": 1151} {"train_loss": -11.55087661743164, "global_step": 193533, "epoch": 1151} {"train_loss": -11.561874389648438, "global_step": 193534, "epoch": 1151} {"train_loss": -11.222445629891896, "global_step": 193535, "epoch": 1151, "val_loss": 245431.921875} {"train_loss": -11.47343635559082, "global_step": 193536, "epoch": 1152} {"train_loss": -11.876238822937012, "global_step": 193537, "epoch": 1152} {"train_loss": -11.726259231567383, "global_step": 193538, "epoch": 1152} {"train_loss": -11.625202178955078, "global_step": 193539, "epoch": 1152} {"train_loss": -11.834894180297852, "global_step": 193540, "epoch": 1152} {"train_loss": -11.574716567993164, "global_step": 193541, "epoch": 1152} {"train_loss": -11.730128288269043, "global_step": 193542, "epoch": 1152} {"train_loss": -11.532567024230957, "global_step": 193543, "epoch": 1152} {"train_loss": -11.81637954711914, "global_step": 193544, "epoch": 1152} {"train_loss": -11.782711029052734, "global_step": 193545, "epoch": 1152} {"train_loss": -11.895211219787598, "global_step": 193546, "epoch": 1152} {"train_loss": -11.688621520996094, "global_step": 193547, "epoch": 1152} {"train_loss": -11.524625778198242, "global_step": 193548, "epoch": 1152} {"train_loss": -11.593860626220703, "global_step": 193549, "epoch": 1152} {"train_loss": -11.830924987792969, "global_step": 193550, "epoch": 1152} {"train_loss": -11.414161682128906, "global_step": 193551, "epoch": 1152} {"train_loss": -11.606109619140625, "global_step": 193552, "epoch": 1152} {"train_loss": -11.217729568481445, "global_step": 193553, "epoch": 1152} {"train_loss": -10.8115234375, "global_step": 193554, "epoch": 1152} {"train_loss": -10.83152961730957, "global_step": 193555, "epoch": 1152} {"train_loss": -11.558162689208984, "global_step": 193556, "epoch": 1152} {"train_loss": -10.803009033203125, "global_step": 193557, "epoch": 1152} {"train_loss": -10.300010681152344, "global_step": 193558, "epoch": 1152} {"train_loss": -9.918502807617188, "global_step": 193559, "epoch": 1152} {"train_loss": -10.397283554077148, "global_step": 193560, "epoch": 1152} {"train_loss": -8.982348442077637, "global_step": 193561, "epoch": 1152} {"train_loss": -10.50781536102295, "global_step": 193562, "epoch": 1152} {"train_loss": -10.582036972045898, "global_step": 193563, "epoch": 1152} {"train_loss": -9.286113739013672, "global_step": 193564, "epoch": 1152} {"train_loss": -10.275657653808594, "global_step": 193565, "epoch": 1152} {"train_loss": -9.729205131530762, "global_step": 193566, "epoch": 1152} {"train_loss": -8.580282211303711, "global_step": 193567, "epoch": 1152} {"train_loss": -11.07702350616455, "global_step": 193568, "epoch": 1152} {"train_loss": -9.86131763458252, "global_step": 193569, "epoch": 1152} {"train_loss": -9.867106437683105, "global_step": 193570, "epoch": 1152} {"train_loss": -11.053361892700195, "global_step": 193571, "epoch": 1152} {"train_loss": -9.287578582763672, "global_step": 193572, "epoch": 1152} {"train_loss": -11.073745727539062, "global_step": 193573, "epoch": 1152} {"train_loss": -10.502481460571289, "global_step": 193574, "epoch": 1152} {"train_loss": -10.631909370422363, "global_step": 193575, "epoch": 1152} {"train_loss": -10.837550163269043, "global_step": 193576, "epoch": 1152} {"train_loss": -10.793685913085938, "global_step": 193577, "epoch": 1152} {"train_loss": -11.038762092590332, "global_step": 193578, "epoch": 1152} {"train_loss": -10.814868927001953, "global_step": 193579, "epoch": 1152} {"train_loss": -10.962526321411133, "global_step": 193580, "epoch": 1152} {"train_loss": -10.809587478637695, "global_step": 193581, "epoch": 1152} {"train_loss": -11.050274848937988, "global_step": 193582, "epoch": 1152} {"train_loss": -11.261150360107422, "global_step": 193583, "epoch": 1152} {"train_loss": -11.155174255371094, "global_step": 193584, "epoch": 1152} {"train_loss": -10.946735382080078, "global_step": 193585, "epoch": 1152} {"train_loss": -11.25343132019043, "global_step": 193586, "epoch": 1152} {"train_loss": -11.349617958068848, "global_step": 193587, "epoch": 1152} {"train_loss": -11.224145889282227, "global_step": 193588, "epoch": 1152} {"train_loss": -11.040359497070312, "global_step": 193589, "epoch": 1152} {"train_loss": -11.025543212890625, "global_step": 193590, "epoch": 1152} {"train_loss": -11.221510887145996, "global_step": 193591, "epoch": 1152} {"train_loss": -11.268423080444336, "global_step": 193592, "epoch": 1152} {"train_loss": -11.212596893310547, "global_step": 193593, "epoch": 1152} {"train_loss": -11.215319633483887, "global_step": 193594, "epoch": 1152} {"train_loss": -11.222728729248047, "global_step": 193595, "epoch": 1152} {"train_loss": -11.238582611083984, "global_step": 193596, "epoch": 1152} {"train_loss": -11.09749984741211, "global_step": 193597, "epoch": 1152} {"train_loss": -11.188631057739258, "global_step": 193598, "epoch": 1152} {"train_loss": -10.850625991821289, "global_step": 193599, "epoch": 1152} {"train_loss": -11.283868789672852, "global_step": 193600, "epoch": 1152} {"train_loss": -10.956796646118164, "global_step": 193601, "epoch": 1152} {"train_loss": -11.374307632446289, "global_step": 193602, "epoch": 1152} {"train_loss": -11.183053970336914, "global_step": 193603, "epoch": 1152} {"train_loss": -11.523954391479492, "global_step": 193604, "epoch": 1152} {"train_loss": -11.330307960510254, "global_step": 193605, "epoch": 1152} {"train_loss": -11.26998233795166, "global_step": 193606, "epoch": 1152} {"train_loss": -11.324117660522461, "global_step": 193607, "epoch": 1152} {"train_loss": -11.211013793945312, "global_step": 193608, "epoch": 1152} {"train_loss": -11.523244857788086, "global_step": 193609, "epoch": 1152} {"train_loss": -11.537859916687012, "global_step": 193610, "epoch": 1152} {"train_loss": -11.184138298034668, "global_step": 193611, "epoch": 1152} {"train_loss": -11.250102996826172, "global_step": 193612, "epoch": 1152} {"train_loss": -11.490365028381348, "global_step": 193613, "epoch": 1152} {"train_loss": -11.137121200561523, "global_step": 193614, "epoch": 1152} {"train_loss": -11.532478332519531, "global_step": 193615, "epoch": 1152} {"train_loss": -11.14762020111084, "global_step": 193616, "epoch": 1152} {"train_loss": -11.412493705749512, "global_step": 193617, "epoch": 1152} {"train_loss": -11.262636184692383, "global_step": 193618, "epoch": 1152} {"train_loss": -11.406831741333008, "global_step": 193619, "epoch": 1152} {"train_loss": -11.586392402648926, "global_step": 193620, "epoch": 1152} {"train_loss": -11.232500076293945, "global_step": 193621, "epoch": 1152} {"train_loss": -11.514932632446289, "global_step": 193622, "epoch": 1152} {"train_loss": -11.549025535583496, "global_step": 193623, "epoch": 1152} {"train_loss": -11.625715255737305, "global_step": 193624, "epoch": 1152} {"train_loss": -11.539443969726562, "global_step": 193625, "epoch": 1152} {"train_loss": -11.618806838989258, "global_step": 193626, "epoch": 1152} {"train_loss": -11.663714408874512, "global_step": 193627, "epoch": 1152} {"train_loss": -11.46790885925293, "global_step": 193628, "epoch": 1152} {"train_loss": -11.430854797363281, "global_step": 193629, "epoch": 1152} {"train_loss": -11.462119102478027, "global_step": 193630, "epoch": 1152} {"train_loss": -11.421530723571777, "global_step": 193631, "epoch": 1152} {"train_loss": -11.618461608886719, "global_step": 193632, "epoch": 1152} {"train_loss": -11.609180450439453, "global_step": 193633, "epoch": 1152} {"train_loss": -11.638557434082031, "global_step": 193634, "epoch": 1152} {"train_loss": -11.7027587890625, "global_step": 193635, "epoch": 1152} {"train_loss": -11.377960205078125, "global_step": 193636, "epoch": 1152} {"train_loss": -11.764751434326172, "global_step": 193637, "epoch": 1152} {"train_loss": -11.490439414978027, "global_step": 193638, "epoch": 1152} {"train_loss": -11.143377304077148, "global_step": 193639, "epoch": 1152} {"train_loss": -11.243343353271484, "global_step": 193640, "epoch": 1152} {"train_loss": -11.735379219055176, "global_step": 193641, "epoch": 1152} {"train_loss": -11.589054107666016, "global_step": 193642, "epoch": 1152} {"train_loss": -11.423345565795898, "global_step": 193643, "epoch": 1152} {"train_loss": -11.156023025512695, "global_step": 193644, "epoch": 1152} {"train_loss": -10.945878982543945, "global_step": 193645, "epoch": 1152} {"train_loss": -11.402387619018555, "global_step": 193646, "epoch": 1152} {"train_loss": -11.18966293334961, "global_step": 193647, "epoch": 1152} {"train_loss": -11.164073944091797, "global_step": 193648, "epoch": 1152} {"train_loss": -10.935388565063477, "global_step": 193649, "epoch": 1152} {"train_loss": -11.479402542114258, "global_step": 193650, "epoch": 1152} {"train_loss": -11.41528034210205, "global_step": 193651, "epoch": 1152} {"train_loss": -11.335007667541504, "global_step": 193652, "epoch": 1152} {"train_loss": -11.115442276000977, "global_step": 193653, "epoch": 1152} {"train_loss": -11.590250015258789, "global_step": 193654, "epoch": 1152} {"train_loss": -11.100895881652832, "global_step": 193655, "epoch": 1152} {"train_loss": -11.605510711669922, "global_step": 193656, "epoch": 1152} {"train_loss": -11.13453483581543, "global_step": 193657, "epoch": 1152} {"train_loss": -11.299407958984375, "global_step": 193658, "epoch": 1152} {"train_loss": -11.212419509887695, "global_step": 193659, "epoch": 1152} {"train_loss": -11.372885704040527, "global_step": 193660, "epoch": 1152} {"train_loss": -11.387274742126465, "global_step": 193661, "epoch": 1152} {"train_loss": -11.496724128723145, "global_step": 193662, "epoch": 1152} {"train_loss": -11.466355323791504, "global_step": 193663, "epoch": 1152} {"train_loss": -11.328590393066406, "global_step": 193664, "epoch": 1152} {"train_loss": -11.418886184692383, "global_step": 193665, "epoch": 1152} {"train_loss": -11.367496490478516, "global_step": 193666, "epoch": 1152} {"train_loss": -11.488571166992188, "global_step": 193667, "epoch": 1152} {"train_loss": -11.829217910766602, "global_step": 193668, "epoch": 1152} {"train_loss": -11.249360084533691, "global_step": 193669, "epoch": 1152} {"train_loss": -11.385992050170898, "global_step": 193670, "epoch": 1152} {"train_loss": -11.450517654418945, "global_step": 193671, "epoch": 1152} {"train_loss": -11.407898902893066, "global_step": 193672, "epoch": 1152} {"train_loss": -11.098932266235352, "global_step": 193673, "epoch": 1152} {"train_loss": -11.428555488586426, "global_step": 193674, "epoch": 1152} {"train_loss": -11.119684219360352, "global_step": 193675, "epoch": 1152} {"train_loss": -10.551656723022461, "global_step": 193676, "epoch": 1152} {"train_loss": -11.084744453430176, "global_step": 193677, "epoch": 1152} {"train_loss": -10.892413139343262, "global_step": 193678, "epoch": 1152} {"train_loss": -10.780954360961914, "global_step": 193679, "epoch": 1152} {"train_loss": -10.949077606201172, "global_step": 193680, "epoch": 1152} {"train_loss": -11.011983871459961, "global_step": 193681, "epoch": 1152} {"train_loss": -10.964818954467773, "global_step": 193682, "epoch": 1152} {"train_loss": -11.190361976623535, "global_step": 193683, "epoch": 1152} {"train_loss": -10.697925567626953, "global_step": 193684, "epoch": 1152} {"train_loss": -11.374383926391602, "global_step": 193685, "epoch": 1152} {"train_loss": -10.922603607177734, "global_step": 193686, "epoch": 1152} {"train_loss": -11.578956604003906, "global_step": 193687, "epoch": 1152} {"train_loss": -11.107500076293945, "global_step": 193688, "epoch": 1152} {"train_loss": -11.304365158081055, "global_step": 193689, "epoch": 1152} {"train_loss": -11.412790298461914, "global_step": 193690, "epoch": 1152} {"train_loss": -11.230862617492676, "global_step": 193691, "epoch": 1152} {"train_loss": -11.418030738830566, "global_step": 193692, "epoch": 1152} {"train_loss": -11.28851318359375, "global_step": 193693, "epoch": 1152} {"train_loss": -11.251415252685547, "global_step": 193694, "epoch": 1152} {"train_loss": -11.300355911254883, "global_step": 193695, "epoch": 1152} {"train_loss": -11.398239135742188, "global_step": 193696, "epoch": 1152} {"train_loss": -11.047127723693848, "global_step": 193697, "epoch": 1152} {"train_loss": -11.657928466796875, "global_step": 193698, "epoch": 1152} {"train_loss": -10.709297180175781, "global_step": 193699, "epoch": 1152} {"train_loss": -11.232430458068848, "global_step": 193700, "epoch": 1152} {"train_loss": -10.60891342163086, "global_step": 193701, "epoch": 1152} {"train_loss": -11.222631454467773, "global_step": 193702, "epoch": 1152} {"train_loss": -11.176786411376227, "global_step": 193703, "epoch": 1152, "val_loss": 248959.796875} {"train_loss": -11.261436462402344, "global_step": 193704, "epoch": 1153} {"train_loss": -10.563392639160156, "global_step": 193705, "epoch": 1153} {"train_loss": -10.656390190124512, "global_step": 193706, "epoch": 1153} {"train_loss": -10.921243667602539, "global_step": 193707, "epoch": 1153} {"train_loss": -10.982890129089355, "global_step": 193708, "epoch": 1153} {"train_loss": -10.963287353515625, "global_step": 193709, "epoch": 1153} {"train_loss": -11.088306427001953, "global_step": 193710, "epoch": 1153} {"train_loss": -11.062734603881836, "global_step": 193711, "epoch": 1153} {"train_loss": -11.083871841430664, "global_step": 193712, "epoch": 1153} {"train_loss": -10.806846618652344, "global_step": 193713, "epoch": 1153} {"train_loss": -11.23127555847168, "global_step": 193714, "epoch": 1153} {"train_loss": -10.838706970214844, "global_step": 193715, "epoch": 1153} {"train_loss": -11.239007949829102, "global_step": 193716, "epoch": 1153} {"train_loss": -10.88386344909668, "global_step": 193717, "epoch": 1153} {"train_loss": -11.432634353637695, "global_step": 193718, "epoch": 1153} {"train_loss": -11.017793655395508, "global_step": 193719, "epoch": 1153} {"train_loss": -11.0987548828125, "global_step": 193720, "epoch": 1153} {"train_loss": -11.367029190063477, "global_step": 193721, "epoch": 1153} {"train_loss": -11.189910888671875, "global_step": 193722, "epoch": 1153} {"train_loss": -11.583393096923828, "global_step": 193723, "epoch": 1153} {"train_loss": -11.325610160827637, "global_step": 193724, "epoch": 1153} {"train_loss": -11.576272964477539, "global_step": 193725, "epoch": 1153} {"train_loss": -11.248164176940918, "global_step": 193726, "epoch": 1153} {"train_loss": -11.38302230834961, "global_step": 193727, "epoch": 1153} {"train_loss": -11.52168083190918, "global_step": 193728, "epoch": 1153} {"train_loss": -11.237802505493164, "global_step": 193729, "epoch": 1153} {"train_loss": -11.579873085021973, "global_step": 193730, "epoch": 1153} {"train_loss": -11.384868621826172, "global_step": 193731, "epoch": 1153} {"train_loss": -11.317865371704102, "global_step": 193732, "epoch": 1153} {"train_loss": -11.396509170532227, "global_step": 193733, "epoch": 1153} {"train_loss": -11.442286491394043, "global_step": 193734, "epoch": 1153} {"train_loss": -11.058341979980469, "global_step": 193735, "epoch": 1153} {"train_loss": -11.59579086303711, "global_step": 193736, "epoch": 1153} {"train_loss": -11.293060302734375, "global_step": 193737, "epoch": 1153} {"train_loss": -11.284934997558594, "global_step": 193738, "epoch": 1153} {"train_loss": -11.090656280517578, "global_step": 193739, "epoch": 1153} {"train_loss": -11.148831367492676, "global_step": 193740, "epoch": 1153} {"train_loss": -11.159961700439453, "global_step": 193741, "epoch": 1153} {"train_loss": -10.927499771118164, "global_step": 193742, "epoch": 1153} {"train_loss": -11.323749542236328, "global_step": 193743, "epoch": 1153} {"train_loss": -11.2535982131958, "global_step": 193744, "epoch": 1153} {"train_loss": -11.185470581054688, "global_step": 193745, "epoch": 1153} {"train_loss": -11.079305648803711, "global_step": 193746, "epoch": 1153} {"train_loss": -11.228645324707031, "global_step": 193747, "epoch": 1153} {"train_loss": -11.110536575317383, "global_step": 193748, "epoch": 1153} {"train_loss": -11.013932228088379, "global_step": 193749, "epoch": 1153} {"train_loss": -11.58292007446289, "global_step": 193750, "epoch": 1153} {"train_loss": -10.446950912475586, "global_step": 193751, "epoch": 1153} {"train_loss": -10.75221061706543, "global_step": 193752, "epoch": 1153} {"train_loss": -10.958248138427734, "global_step": 193753, "epoch": 1153} {"train_loss": -11.000923156738281, "global_step": 193754, "epoch": 1153} {"train_loss": -11.002531051635742, "global_step": 193755, "epoch": 1153} {"train_loss": -10.888474464416504, "global_step": 193756, "epoch": 1153} {"train_loss": -10.790573120117188, "global_step": 193757, "epoch": 1153} {"train_loss": -11.171212196350098, "global_step": 193758, "epoch": 1153} {"train_loss": -10.61660099029541, "global_step": 193759, "epoch": 1153} {"train_loss": -10.928750991821289, "global_step": 193760, "epoch": 1153} {"train_loss": -11.11790657043457, "global_step": 193761, "epoch": 1153} {"train_loss": -10.351919174194336, "global_step": 193762, "epoch": 1153} {"train_loss": -11.307270050048828, "global_step": 193763, "epoch": 1153} {"train_loss": -10.585286140441895, "global_step": 193764, "epoch": 1153} {"train_loss": -11.16253662109375, "global_step": 193765, "epoch": 1153} {"train_loss": -11.015997886657715, "global_step": 193766, "epoch": 1153} {"train_loss": -11.11480712890625, "global_step": 193767, "epoch": 1153} {"train_loss": -10.767441749572754, "global_step": 193768, "epoch": 1153} {"train_loss": -10.964698791503906, "global_step": 193769, "epoch": 1153} {"train_loss": -10.88803482055664, "global_step": 193770, "epoch": 1153} {"train_loss": -10.939416885375977, "global_step": 193771, "epoch": 1153} {"train_loss": -10.809083938598633, "global_step": 193772, "epoch": 1153} {"train_loss": -10.933778762817383, "global_step": 193773, "epoch": 1153} {"train_loss": -10.927549362182617, "global_step": 193774, "epoch": 1153} {"train_loss": -11.142556190490723, "global_step": 193775, "epoch": 1153} {"train_loss": -10.83203125, "global_step": 193776, "epoch": 1153} {"train_loss": -10.965241432189941, "global_step": 193777, "epoch": 1153} {"train_loss": -11.359769821166992, "global_step": 193778, "epoch": 1153} {"train_loss": -10.880733489990234, "global_step": 193779, "epoch": 1153} {"train_loss": -11.32917594909668, "global_step": 193780, "epoch": 1153} {"train_loss": -11.06596565246582, "global_step": 193781, "epoch": 1153} {"train_loss": -11.195037841796875, "global_step": 193782, "epoch": 1153} {"train_loss": -11.210599899291992, "global_step": 193783, "epoch": 1153} {"train_loss": -11.351898193359375, "global_step": 193784, "epoch": 1153} {"train_loss": -11.232152938842773, "global_step": 193785, "epoch": 1153} {"train_loss": -11.233662605285645, "global_step": 193786, "epoch": 1153} {"train_loss": -11.245676040649414, "global_step": 193787, "epoch": 1153} {"train_loss": -11.196184158325195, "global_step": 193788, "epoch": 1153} {"train_loss": -11.45189380645752, "global_step": 193789, "epoch": 1153} {"train_loss": -11.17184829711914, "global_step": 193790, "epoch": 1153} {"train_loss": -11.388467788696289, "global_step": 193791, "epoch": 1153} {"train_loss": -11.278559684753418, "global_step": 193792, "epoch": 1153} {"train_loss": -11.373556137084961, "global_step": 193793, "epoch": 1153} {"train_loss": -11.425555229187012, "global_step": 193794, "epoch": 1153} {"train_loss": -11.437858581542969, "global_step": 193795, "epoch": 1153} {"train_loss": -11.531177520751953, "global_step": 193796, "epoch": 1153} {"train_loss": -11.277632713317871, "global_step": 193797, "epoch": 1153} {"train_loss": -11.536696434020996, "global_step": 193798, "epoch": 1153} {"train_loss": -11.607500076293945, "global_step": 193799, "epoch": 1153} {"train_loss": -11.666055679321289, "global_step": 193800, "epoch": 1153} {"train_loss": -11.679906845092773, "global_step": 193801, "epoch": 1153} {"train_loss": -11.492788314819336, "global_step": 193802, "epoch": 1153} {"train_loss": -11.681768417358398, "global_step": 193803, "epoch": 1153} {"train_loss": -11.668588638305664, "global_step": 193804, "epoch": 1153} {"train_loss": -11.7113037109375, "global_step": 193805, "epoch": 1153} {"train_loss": -11.785919189453125, "global_step": 193806, "epoch": 1153} {"train_loss": -11.788862228393555, "global_step": 193807, "epoch": 1153} {"train_loss": -11.228174209594727, "global_step": 193808, "epoch": 1153} {"train_loss": -11.419730186462402, "global_step": 193809, "epoch": 1153} {"train_loss": -11.668716430664062, "global_step": 193810, "epoch": 1153} {"train_loss": -11.530858993530273, "global_step": 193811, "epoch": 1153} {"train_loss": -11.743871688842773, "global_step": 193812, "epoch": 1153} {"train_loss": -11.82420539855957, "global_step": 193813, "epoch": 1153} {"train_loss": -11.778738021850586, "global_step": 193814, "epoch": 1153} {"train_loss": -11.474852561950684, "global_step": 193815, "epoch": 1153} {"train_loss": -11.980949401855469, "global_step": 193816, "epoch": 1153} {"train_loss": -11.630866050720215, "global_step": 193817, "epoch": 1153} {"train_loss": -11.82913589477539, "global_step": 193818, "epoch": 1153} {"train_loss": -11.65916633605957, "global_step": 193819, "epoch": 1153} {"train_loss": -11.85113525390625, "global_step": 193820, "epoch": 1153} {"train_loss": -11.677111625671387, "global_step": 193821, "epoch": 1153} {"train_loss": -11.618110656738281, "global_step": 193822, "epoch": 1153} {"train_loss": -11.514249801635742, "global_step": 193823, "epoch": 1153} {"train_loss": -11.659957885742188, "global_step": 193824, "epoch": 1153} {"train_loss": -11.690757751464844, "global_step": 193825, "epoch": 1153} {"train_loss": -11.815267562866211, "global_step": 193826, "epoch": 1153} {"train_loss": -11.88839340209961, "global_step": 193827, "epoch": 1153} {"train_loss": -11.850955963134766, "global_step": 193828, "epoch": 1153} {"train_loss": -11.789389610290527, "global_step": 193829, "epoch": 1153} {"train_loss": -11.733673095703125, "global_step": 193830, "epoch": 1153} {"train_loss": -11.635357856750488, "global_step": 193831, "epoch": 1153} {"train_loss": -11.183379173278809, "global_step": 193832, "epoch": 1153} {"train_loss": -11.602132797241211, "global_step": 193833, "epoch": 1153} {"train_loss": -11.521672248840332, "global_step": 193834, "epoch": 1153} {"train_loss": -10.906842231750488, "global_step": 193835, "epoch": 1153} {"train_loss": -10.335674285888672, "global_step": 193836, "epoch": 1153} {"train_loss": -11.759899139404297, "global_step": 193837, "epoch": 1153} {"train_loss": -10.473587989807129, "global_step": 193838, "epoch": 1153} {"train_loss": -9.513919830322266, "global_step": 193839, "epoch": 1153} {"train_loss": -10.003273010253906, "global_step": 193840, "epoch": 1153} {"train_loss": -11.18060302734375, "global_step": 193841, "epoch": 1153} {"train_loss": -10.161575317382812, "global_step": 193842, "epoch": 1153} {"train_loss": -9.294733047485352, "global_step": 193843, "epoch": 1153} {"train_loss": -10.912729263305664, "global_step": 193844, "epoch": 1153} {"train_loss": -10.919410705566406, "global_step": 193845, "epoch": 1153} {"train_loss": -11.27377700805664, "global_step": 193846, "epoch": 1153} {"train_loss": -11.203374862670898, "global_step": 193847, "epoch": 1153} {"train_loss": -11.349719047546387, "global_step": 193848, "epoch": 1153} {"train_loss": -10.317951202392578, "global_step": 193849, "epoch": 1153} {"train_loss": -11.218770980834961, "global_step": 193850, "epoch": 1153} {"train_loss": -10.854766845703125, "global_step": 193851, "epoch": 1153} {"train_loss": -11.338018417358398, "global_step": 193852, "epoch": 1153} {"train_loss": -11.22989273071289, "global_step": 193853, "epoch": 1153} {"train_loss": -11.116270065307617, "global_step": 193854, "epoch": 1153} {"train_loss": -11.226487159729004, "global_step": 193855, "epoch": 1153} {"train_loss": -11.27178955078125, "global_step": 193856, "epoch": 1153} {"train_loss": -11.276588439941406, "global_step": 193857, "epoch": 1153} {"train_loss": -10.86307430267334, "global_step": 193858, "epoch": 1153} {"train_loss": -11.161991119384766, "global_step": 193859, "epoch": 1153} {"train_loss": -10.845577239990234, "global_step": 193860, "epoch": 1153} {"train_loss": -11.150156021118164, "global_step": 193861, "epoch": 1153} {"train_loss": -11.22238826751709, "global_step": 193862, "epoch": 1153} {"train_loss": -11.030576705932617, "global_step": 193863, "epoch": 1153} {"train_loss": -11.380428314208984, "global_step": 193864, "epoch": 1153} {"train_loss": -10.965112686157227, "global_step": 193865, "epoch": 1153} {"train_loss": -10.831531524658203, "global_step": 193866, "epoch": 1153} {"train_loss": -10.837282180786133, "global_step": 193867, "epoch": 1153} {"train_loss": -10.469559669494629, "global_step": 193868, "epoch": 1153} {"train_loss": -10.920361518859863, "global_step": 193869, "epoch": 1153} {"train_loss": -10.833887100219727, "global_step": 193870, "epoch": 1153} {"train_loss": -11.193104068438211, "global_step": 193871, "epoch": 1153, "val_loss": 248748.90625} {"train_loss": -10.783004760742188, "global_step": 193872, "epoch": 1154} {"train_loss": -10.885078430175781, "global_step": 193873, "epoch": 1154} {"train_loss": -10.968204498291016, "global_step": 193874, "epoch": 1154} {"train_loss": -10.206842422485352, "global_step": 193875, "epoch": 1154} {"train_loss": -11.114582061767578, "global_step": 193876, "epoch": 1154} {"train_loss": -10.43648624420166, "global_step": 193877, "epoch": 1154} {"train_loss": -10.929004669189453, "global_step": 193878, "epoch": 1154} {"train_loss": -10.927383422851562, "global_step": 193879, "epoch": 1154} {"train_loss": -11.034082412719727, "global_step": 193880, "epoch": 1154} {"train_loss": -11.369138717651367, "global_step": 193881, "epoch": 1154} {"train_loss": -10.840883255004883, "global_step": 193882, "epoch": 1154} {"train_loss": -11.094480514526367, "global_step": 193883, "epoch": 1154} {"train_loss": -10.81619644165039, "global_step": 193884, "epoch": 1154} {"train_loss": -11.135398864746094, "global_step": 193885, "epoch": 1154} {"train_loss": -11.150859832763672, "global_step": 193886, "epoch": 1154} {"train_loss": -11.079948425292969, "global_step": 193887, "epoch": 1154} {"train_loss": -11.215533256530762, "global_step": 193888, "epoch": 1154} {"train_loss": -11.405912399291992, "global_step": 193889, "epoch": 1154} {"train_loss": -11.206138610839844, "global_step": 193890, "epoch": 1154} {"train_loss": -11.333841323852539, "global_step": 193891, "epoch": 1154} {"train_loss": -11.338130950927734, "global_step": 193892, "epoch": 1154} {"train_loss": -11.371828079223633, "global_step": 193893, "epoch": 1154} {"train_loss": -11.330012321472168, "global_step": 193894, "epoch": 1154} {"train_loss": -11.294883728027344, "global_step": 193895, "epoch": 1154} {"train_loss": -11.280004501342773, "global_step": 193896, "epoch": 1154} {"train_loss": -11.372749328613281, "global_step": 193897, "epoch": 1154} {"train_loss": -11.311325073242188, "global_step": 193898, "epoch": 1154} {"train_loss": -11.21159839630127, "global_step": 193899, "epoch": 1154} {"train_loss": -11.33824634552002, "global_step": 193900, "epoch": 1154} {"train_loss": -11.534381866455078, "global_step": 193901, "epoch": 1154} {"train_loss": -11.373624801635742, "global_step": 193902, "epoch": 1154} {"train_loss": -11.338714599609375, "global_step": 193903, "epoch": 1154} {"train_loss": -11.342373847961426, "global_step": 193904, "epoch": 1154} {"train_loss": -11.495765686035156, "global_step": 193905, "epoch": 1154} {"train_loss": -11.366649627685547, "global_step": 193906, "epoch": 1154} {"train_loss": -11.350985527038574, "global_step": 193907, "epoch": 1154} {"train_loss": -11.67711067199707, "global_step": 193908, "epoch": 1154} {"train_loss": -11.493371963500977, "global_step": 193909, "epoch": 1154} {"train_loss": -11.577199935913086, "global_step": 193910, "epoch": 1154} {"train_loss": -11.499530792236328, "global_step": 193911, "epoch": 1154} {"train_loss": -11.439573287963867, "global_step": 193912, "epoch": 1154} {"train_loss": -11.44509220123291, "global_step": 193913, "epoch": 1154} {"train_loss": -11.399477005004883, "global_step": 193914, "epoch": 1154} {"train_loss": -11.608616828918457, "global_step": 193915, "epoch": 1154} {"train_loss": -11.583076477050781, "global_step": 193916, "epoch": 1154} {"train_loss": -11.401285171508789, "global_step": 193917, "epoch": 1154} {"train_loss": -11.587546348571777, "global_step": 193918, "epoch": 1154} {"train_loss": -11.489578247070312, "global_step": 193919, "epoch": 1154} {"train_loss": -11.334580421447754, "global_step": 193920, "epoch": 1154} {"train_loss": -11.525853157043457, "global_step": 193921, "epoch": 1154} {"train_loss": -11.49462890625, "global_step": 193922, "epoch": 1154} {"train_loss": -11.490362167358398, "global_step": 193923, "epoch": 1154} {"train_loss": -11.609332084655762, "global_step": 193924, "epoch": 1154} {"train_loss": -11.053169250488281, "global_step": 193925, "epoch": 1154} {"train_loss": -11.575889587402344, "global_step": 193926, "epoch": 1154} {"train_loss": -11.238850593566895, "global_step": 193927, "epoch": 1154} {"train_loss": -11.398706436157227, "global_step": 193928, "epoch": 1154} {"train_loss": -11.60123062133789, "global_step": 193929, "epoch": 1154} {"train_loss": -11.559650421142578, "global_step": 193930, "epoch": 1154} {"train_loss": -11.143743515014648, "global_step": 193931, "epoch": 1154} {"train_loss": -11.818305015563965, "global_step": 193932, "epoch": 1154} {"train_loss": -11.212989807128906, "global_step": 193933, "epoch": 1154} {"train_loss": -11.6337890625, "global_step": 193934, "epoch": 1154} {"train_loss": -11.332423210144043, "global_step": 193935, "epoch": 1154} {"train_loss": -11.73605728149414, "global_step": 193936, "epoch": 1154} {"train_loss": -11.522697448730469, "global_step": 193937, "epoch": 1154} {"train_loss": -11.666448593139648, "global_step": 193938, "epoch": 1154} {"train_loss": -11.172882080078125, "global_step": 193939, "epoch": 1154} {"train_loss": -11.51925277709961, "global_step": 193940, "epoch": 1154} {"train_loss": -11.541980743408203, "global_step": 193941, "epoch": 1154} {"train_loss": -11.055522918701172, "global_step": 193942, "epoch": 1154} {"train_loss": -11.477178573608398, "global_step": 193943, "epoch": 1154} {"train_loss": -11.548271179199219, "global_step": 193944, "epoch": 1154} {"train_loss": -11.529243469238281, "global_step": 193945, "epoch": 1154} {"train_loss": -11.774356842041016, "global_step": 193946, "epoch": 1154} {"train_loss": -11.663188934326172, "global_step": 193947, "epoch": 1154} {"train_loss": -11.140667915344238, "global_step": 193948, "epoch": 1154} {"train_loss": -11.226777076721191, "global_step": 193949, "epoch": 1154} {"train_loss": -11.616291046142578, "global_step": 193950, "epoch": 1154} {"train_loss": -11.7376127243042, "global_step": 193951, "epoch": 1154} {"train_loss": -11.586963653564453, "global_step": 193952, "epoch": 1154} {"train_loss": -11.396069526672363, "global_step": 193953, "epoch": 1154} {"train_loss": -11.181947708129883, "global_step": 193954, "epoch": 1154} {"train_loss": -11.541117668151855, "global_step": 193955, "epoch": 1154} {"train_loss": -11.200201034545898, "global_step": 193956, "epoch": 1154} {"train_loss": -11.536079406738281, "global_step": 193957, "epoch": 1154} {"train_loss": -11.196062088012695, "global_step": 193958, "epoch": 1154} {"train_loss": -11.51546859741211, "global_step": 193959, "epoch": 1154} {"train_loss": -11.277762413024902, "global_step": 193960, "epoch": 1154} {"train_loss": -11.280889511108398, "global_step": 193961, "epoch": 1154} {"train_loss": -10.8578519821167, "global_step": 193962, "epoch": 1154} {"train_loss": -11.008539199829102, "global_step": 193963, "epoch": 1154} {"train_loss": -11.107017517089844, "global_step": 193964, "epoch": 1154} {"train_loss": -10.292016983032227, "global_step": 193965, "epoch": 1154} {"train_loss": -10.111848831176758, "global_step": 193966, "epoch": 1154} {"train_loss": -10.712444305419922, "global_step": 193967, "epoch": 1154} {"train_loss": -11.610284805297852, "global_step": 193968, "epoch": 1154} {"train_loss": -10.479782104492188, "global_step": 193969, "epoch": 1154} {"train_loss": -11.26617431640625, "global_step": 193970, "epoch": 1154} {"train_loss": -10.98388957977295, "global_step": 193971, "epoch": 1154} {"train_loss": -11.153095245361328, "global_step": 193972, "epoch": 1154} {"train_loss": -11.165929794311523, "global_step": 193973, "epoch": 1154} {"train_loss": -11.300199508666992, "global_step": 193974, "epoch": 1154} {"train_loss": -11.271360397338867, "global_step": 193975, "epoch": 1154} {"train_loss": -10.88633918762207, "global_step": 193976, "epoch": 1154} {"train_loss": -11.052019119262695, "global_step": 193977, "epoch": 1154} {"train_loss": -10.157024383544922, "global_step": 193978, "epoch": 1154} {"train_loss": -10.885000228881836, "global_step": 193979, "epoch": 1154} {"train_loss": -10.250143051147461, "global_step": 193980, "epoch": 1154} {"train_loss": -9.744915008544922, "global_step": 193981, "epoch": 1154} {"train_loss": -11.344535827636719, "global_step": 193982, "epoch": 1154} {"train_loss": -10.641960144042969, "global_step": 193983, "epoch": 1154} {"train_loss": -11.081398963928223, "global_step": 193984, "epoch": 1154} {"train_loss": -11.308321952819824, "global_step": 193985, "epoch": 1154} {"train_loss": -10.54472541809082, "global_step": 193986, "epoch": 1154} {"train_loss": -11.328055381774902, "global_step": 193987, "epoch": 1154} {"train_loss": -10.684045791625977, "global_step": 193988, "epoch": 1154} {"train_loss": -10.987327575683594, "global_step": 193989, "epoch": 1154} {"train_loss": -10.995809555053711, "global_step": 193990, "epoch": 1154} {"train_loss": -11.121179580688477, "global_step": 193991, "epoch": 1154} {"train_loss": -10.890237808227539, "global_step": 193992, "epoch": 1154} {"train_loss": -11.074238777160645, "global_step": 193993, "epoch": 1154} {"train_loss": -10.848339080810547, "global_step": 193994, "epoch": 1154} {"train_loss": -10.998880386352539, "global_step": 193995, "epoch": 1154} {"train_loss": -11.370262145996094, "global_step": 193996, "epoch": 1154} {"train_loss": -10.912291526794434, "global_step": 193997, "epoch": 1154} {"train_loss": -11.345911979675293, "global_step": 193998, "epoch": 1154} {"train_loss": -10.917425155639648, "global_step": 193999, "epoch": 1154} {"train_loss": -11.245063781738281, "global_step": 194000, "epoch": 1154} {"train_loss": -11.37171745300293, "global_step": 194001, "epoch": 1154} {"train_loss": -10.718463897705078, "global_step": 194002, "epoch": 1154} {"train_loss": -11.36607551574707, "global_step": 194003, "epoch": 1154} {"train_loss": -10.960872650146484, "global_step": 194004, "epoch": 1154} {"train_loss": -11.383712768554688, "global_step": 194005, "epoch": 1154} {"train_loss": -11.019241333007812, "global_step": 194006, "epoch": 1154} {"train_loss": -10.67574691772461, "global_step": 194007, "epoch": 1154} {"train_loss": -11.433679580688477, "global_step": 194008, "epoch": 1154} {"train_loss": -10.942419052124023, "global_step": 194009, "epoch": 1154} {"train_loss": -11.49983024597168, "global_step": 194010, "epoch": 1154} {"train_loss": -11.034404754638672, "global_step": 194011, "epoch": 1154} {"train_loss": -10.913763046264648, "global_step": 194012, "epoch": 1154} {"train_loss": -11.385211944580078, "global_step": 194013, "epoch": 1154} {"train_loss": -10.785079956054688, "global_step": 194014, "epoch": 1154} {"train_loss": -11.429777145385742, "global_step": 194015, "epoch": 1154} {"train_loss": -10.808540344238281, "global_step": 194016, "epoch": 1154} {"train_loss": -11.443346977233887, "global_step": 194017, "epoch": 1154} {"train_loss": -11.1102294921875, "global_step": 194018, "epoch": 1154} {"train_loss": -10.865808486938477, "global_step": 194019, "epoch": 1154} {"train_loss": -11.466391563415527, "global_step": 194020, "epoch": 1154} {"train_loss": -10.864938735961914, "global_step": 194021, "epoch": 1154} {"train_loss": -11.348472595214844, "global_step": 194022, "epoch": 1154} {"train_loss": -11.40216064453125, "global_step": 194023, "epoch": 1154} {"train_loss": -11.288070678710938, "global_step": 194024, "epoch": 1154} {"train_loss": -11.397607803344727, "global_step": 194025, "epoch": 1154} {"train_loss": -10.862478256225586, "global_step": 194026, "epoch": 1154} {"train_loss": -11.25018310546875, "global_step": 194027, "epoch": 1154} {"train_loss": -10.98973560333252, "global_step": 194028, "epoch": 1154} {"train_loss": -10.542928695678711, "global_step": 194029, "epoch": 1154} {"train_loss": -10.808804512023926, "global_step": 194030, "epoch": 1154} {"train_loss": -10.926765441894531, "global_step": 194031, "epoch": 1154} {"train_loss": -10.78502082824707, "global_step": 194032, "epoch": 1154} {"train_loss": -11.123851776123047, "global_step": 194033, "epoch": 1154} {"train_loss": -11.274223327636719, "global_step": 194034, "epoch": 1154} {"train_loss": -10.890416145324707, "global_step": 194035, "epoch": 1154} {"train_loss": -11.227312088012695, "global_step": 194036, "epoch": 1154} {"train_loss": -11.087943077087402, "global_step": 194037, "epoch": 1154} {"train_loss": -11.023605346679688, "global_step": 194038, "epoch": 1154} {"train_loss": -11.184851095789956, "global_step": 194039, "epoch": 1154, "val_loss": 249928.875} {"train_loss": -11.375310897827148, "global_step": 194040, "epoch": 1155} {"train_loss": -11.042165756225586, "global_step": 194041, "epoch": 1155} {"train_loss": -11.12846565246582, "global_step": 194042, "epoch": 1155} {"train_loss": -11.1150541305542, "global_step": 194043, "epoch": 1155} {"train_loss": -11.329124450683594, "global_step": 194044, "epoch": 1155} {"train_loss": -11.253421783447266, "global_step": 194045, "epoch": 1155} {"train_loss": -11.328197479248047, "global_step": 194046, "epoch": 1155} {"train_loss": -11.168069839477539, "global_step": 194047, "epoch": 1155} {"train_loss": -11.234609603881836, "global_step": 194048, "epoch": 1155} {"train_loss": -11.442320823669434, "global_step": 194049, "epoch": 1155} {"train_loss": -11.46452522277832, "global_step": 194050, "epoch": 1155} {"train_loss": -11.289810180664062, "global_step": 194051, "epoch": 1155} {"train_loss": -11.480751037597656, "global_step": 194052, "epoch": 1155} {"train_loss": -11.401792526245117, "global_step": 194053, "epoch": 1155} {"train_loss": -11.370445251464844, "global_step": 194054, "epoch": 1155} {"train_loss": -11.27273941040039, "global_step": 194055, "epoch": 1155} {"train_loss": -11.372536659240723, "global_step": 194056, "epoch": 1155} {"train_loss": -11.309219360351562, "global_step": 194057, "epoch": 1155} {"train_loss": -11.118810653686523, "global_step": 194058, "epoch": 1155} {"train_loss": -11.46061897277832, "global_step": 194059, "epoch": 1155} {"train_loss": -11.122014999389648, "global_step": 194060, "epoch": 1155} {"train_loss": -11.545156478881836, "global_step": 194061, "epoch": 1155} {"train_loss": -11.383630752563477, "global_step": 194062, "epoch": 1155} {"train_loss": -11.431960105895996, "global_step": 194063, "epoch": 1155} {"train_loss": -11.487890243530273, "global_step": 194064, "epoch": 1155} {"train_loss": -11.428808212280273, "global_step": 194065, "epoch": 1155} {"train_loss": -11.563011169433594, "global_step": 194066, "epoch": 1155} {"train_loss": -11.569284439086914, "global_step": 194067, "epoch": 1155} {"train_loss": -11.363058090209961, "global_step": 194068, "epoch": 1155} {"train_loss": -11.55079460144043, "global_step": 194069, "epoch": 1155} {"train_loss": -11.714685440063477, "global_step": 194070, "epoch": 1155} {"train_loss": -11.441726684570312, "global_step": 194071, "epoch": 1155} {"train_loss": -11.471762657165527, "global_step": 194072, "epoch": 1155} {"train_loss": -11.179426193237305, "global_step": 194073, "epoch": 1155} {"train_loss": -11.493739128112793, "global_step": 194074, "epoch": 1155} {"train_loss": -11.68134880065918, "global_step": 194075, "epoch": 1155} {"train_loss": -11.553160667419434, "global_step": 194076, "epoch": 1155} {"train_loss": -11.478468894958496, "global_step": 194077, "epoch": 1155} {"train_loss": -11.590757369995117, "global_step": 194078, "epoch": 1155} {"train_loss": -11.55826187133789, "global_step": 194079, "epoch": 1155} {"train_loss": -11.520051956176758, "global_step": 194080, "epoch": 1155} {"train_loss": -11.296777725219727, "global_step": 194081, "epoch": 1155} {"train_loss": -11.503524780273438, "global_step": 194082, "epoch": 1155} {"train_loss": -11.465438842773438, "global_step": 194083, "epoch": 1155} {"train_loss": -11.357588768005371, "global_step": 194084, "epoch": 1155} {"train_loss": -11.778852462768555, "global_step": 194085, "epoch": 1155} {"train_loss": -11.510972023010254, "global_step": 194086, "epoch": 1155} {"train_loss": -11.57316780090332, "global_step": 194087, "epoch": 1155} {"train_loss": -11.2178955078125, "global_step": 194088, "epoch": 1155} {"train_loss": -11.684911727905273, "global_step": 194089, "epoch": 1155} {"train_loss": -11.714422225952148, "global_step": 194090, "epoch": 1155} {"train_loss": -11.889264106750488, "global_step": 194091, "epoch": 1155} {"train_loss": -11.55318832397461, "global_step": 194092, "epoch": 1155} {"train_loss": -11.476421356201172, "global_step": 194093, "epoch": 1155} {"train_loss": -11.509775161743164, "global_step": 194094, "epoch": 1155} {"train_loss": -11.486719131469727, "global_step": 194095, "epoch": 1155} {"train_loss": -11.492673873901367, "global_step": 194096, "epoch": 1155} {"train_loss": -10.657384872436523, "global_step": 194097, "epoch": 1155} {"train_loss": -11.001487731933594, "global_step": 194098, "epoch": 1155} {"train_loss": -10.997180938720703, "global_step": 194099, "epoch": 1155} {"train_loss": -11.185163497924805, "global_step": 194100, "epoch": 1155} {"train_loss": -9.79926872253418, "global_step": 194101, "epoch": 1155} {"train_loss": -11.325241088867188, "global_step": 194102, "epoch": 1155} {"train_loss": -11.09036636352539, "global_step": 194103, "epoch": 1155} {"train_loss": -11.213298797607422, "global_step": 194104, "epoch": 1155} {"train_loss": -10.205178260803223, "global_step": 194105, "epoch": 1155} {"train_loss": -10.148429870605469, "global_step": 194106, "epoch": 1155} {"train_loss": -10.573646545410156, "global_step": 194107, "epoch": 1155} {"train_loss": -10.226044654846191, "global_step": 194108, "epoch": 1155} {"train_loss": -10.356689453125, "global_step": 194109, "epoch": 1155} {"train_loss": -10.200631141662598, "global_step": 194110, "epoch": 1155} {"train_loss": -9.944692611694336, "global_step": 194111, "epoch": 1155} {"train_loss": -11.177862167358398, "global_step": 194112, "epoch": 1155} {"train_loss": -10.132884979248047, "global_step": 194113, "epoch": 1155} {"train_loss": -11.200419425964355, "global_step": 194114, "epoch": 1155} {"train_loss": -10.457484245300293, "global_step": 194115, "epoch": 1155} {"train_loss": -11.37948989868164, "global_step": 194116, "epoch": 1155} {"train_loss": -10.484630584716797, "global_step": 194117, "epoch": 1155} {"train_loss": -11.4116849899292, "global_step": 194118, "epoch": 1155} {"train_loss": -10.564210891723633, "global_step": 194119, "epoch": 1155} {"train_loss": -10.799398422241211, "global_step": 194120, "epoch": 1155} {"train_loss": -11.113359451293945, "global_step": 194121, "epoch": 1155} {"train_loss": -10.602962493896484, "global_step": 194122, "epoch": 1155} {"train_loss": -10.541301727294922, "global_step": 194123, "epoch": 1155} {"train_loss": -11.150141716003418, "global_step": 194124, "epoch": 1155} {"train_loss": -10.835835456848145, "global_step": 194125, "epoch": 1155} {"train_loss": -11.09028434753418, "global_step": 194126, "epoch": 1155} {"train_loss": -10.897186279296875, "global_step": 194127, "epoch": 1155} {"train_loss": -10.889058113098145, "global_step": 194128, "epoch": 1155} {"train_loss": -10.516496658325195, "global_step": 194129, "epoch": 1155} {"train_loss": -11.179391860961914, "global_step": 194130, "epoch": 1155} {"train_loss": -10.775908470153809, "global_step": 194131, "epoch": 1155} {"train_loss": -10.959028244018555, "global_step": 194132, "epoch": 1155} {"train_loss": -11.46960735321045, "global_step": 194133, "epoch": 1155} {"train_loss": -10.957547187805176, "global_step": 194134, "epoch": 1155} {"train_loss": -11.149194717407227, "global_step": 194135, "epoch": 1155} {"train_loss": -11.431529998779297, "global_step": 194136, "epoch": 1155} {"train_loss": -11.286359786987305, "global_step": 194137, "epoch": 1155} {"train_loss": -11.21408462524414, "global_step": 194138, "epoch": 1155} {"train_loss": -11.312227249145508, "global_step": 194139, "epoch": 1155} {"train_loss": -11.192310333251953, "global_step": 194140, "epoch": 1155} {"train_loss": -10.905882835388184, "global_step": 194141, "epoch": 1155} {"train_loss": -11.46338176727295, "global_step": 194142, "epoch": 1155} {"train_loss": -10.734081268310547, "global_step": 194143, "epoch": 1155} {"train_loss": -11.191762924194336, "global_step": 194144, "epoch": 1155} {"train_loss": -11.181066513061523, "global_step": 194145, "epoch": 1155} {"train_loss": -11.294448852539062, "global_step": 194146, "epoch": 1155} {"train_loss": -11.083051681518555, "global_step": 194147, "epoch": 1155} {"train_loss": -11.358123779296875, "global_step": 194148, "epoch": 1155} {"train_loss": -11.118337631225586, "global_step": 194149, "epoch": 1155} {"train_loss": -11.386398315429688, "global_step": 194150, "epoch": 1155} {"train_loss": -11.441797256469727, "global_step": 194151, "epoch": 1155} {"train_loss": -11.143889427185059, "global_step": 194152, "epoch": 1155} {"train_loss": -11.374674797058105, "global_step": 194153, "epoch": 1155} {"train_loss": -11.108413696289062, "global_step": 194154, "epoch": 1155} {"train_loss": -11.351503372192383, "global_step": 194155, "epoch": 1155} {"train_loss": -11.342414855957031, "global_step": 194156, "epoch": 1155} {"train_loss": -11.418445587158203, "global_step": 194157, "epoch": 1155} {"train_loss": -11.463359832763672, "global_step": 194158, "epoch": 1155} {"train_loss": -11.585966110229492, "global_step": 194159, "epoch": 1155} {"train_loss": -11.119728088378906, "global_step": 194160, "epoch": 1155} {"train_loss": -11.454971313476562, "global_step": 194161, "epoch": 1155} {"train_loss": -11.25712776184082, "global_step": 194162, "epoch": 1155} {"train_loss": -11.23015308380127, "global_step": 194163, "epoch": 1155} {"train_loss": -11.233696937561035, "global_step": 194164, "epoch": 1155} {"train_loss": -11.279706001281738, "global_step": 194165, "epoch": 1155} {"train_loss": -11.036663055419922, "global_step": 194166, "epoch": 1155} {"train_loss": -11.5879487991333, "global_step": 194167, "epoch": 1155} {"train_loss": -11.002531051635742, "global_step": 194168, "epoch": 1155} {"train_loss": -11.216266632080078, "global_step": 194169, "epoch": 1155} {"train_loss": -11.037734031677246, "global_step": 194170, "epoch": 1155} {"train_loss": -11.294065475463867, "global_step": 194171, "epoch": 1155} {"train_loss": -10.65436840057373, "global_step": 194172, "epoch": 1155} {"train_loss": -11.223535537719727, "global_step": 194173, "epoch": 1155} {"train_loss": -11.174159049987793, "global_step": 194174, "epoch": 1155} {"train_loss": -10.822271347045898, "global_step": 194175, "epoch": 1155} {"train_loss": -11.421247482299805, "global_step": 194176, "epoch": 1155} {"train_loss": -11.116081237792969, "global_step": 194177, "epoch": 1155} {"train_loss": -10.87228012084961, "global_step": 194178, "epoch": 1155} {"train_loss": -11.377222061157227, "global_step": 194179, "epoch": 1155} {"train_loss": -11.210112571716309, "global_step": 194180, "epoch": 1155} {"train_loss": -11.10795783996582, "global_step": 194181, "epoch": 1155} {"train_loss": -11.636341094970703, "global_step": 194182, "epoch": 1155} {"train_loss": -11.137499809265137, "global_step": 194183, "epoch": 1155} {"train_loss": -11.514949798583984, "global_step": 194184, "epoch": 1155} {"train_loss": -11.366585731506348, "global_step": 194185, "epoch": 1155} {"train_loss": -11.158430099487305, "global_step": 194186, "epoch": 1155} {"train_loss": -11.321199417114258, "global_step": 194187, "epoch": 1155} {"train_loss": -11.16700553894043, "global_step": 194188, "epoch": 1155} {"train_loss": -11.097429275512695, "global_step": 194189, "epoch": 1155} {"train_loss": -11.439519882202148, "global_step": 194190, "epoch": 1155} {"train_loss": -11.3350830078125, "global_step": 194191, "epoch": 1155} {"train_loss": -11.116096496582031, "global_step": 194192, "epoch": 1155} {"train_loss": -11.253715515136719, "global_step": 194193, "epoch": 1155} {"train_loss": -11.198898315429688, "global_step": 194194, "epoch": 1155} {"train_loss": -10.918532371520996, "global_step": 194195, "epoch": 1155} {"train_loss": -11.316032409667969, "global_step": 194196, "epoch": 1155} {"train_loss": -11.219208717346191, "global_step": 194197, "epoch": 1155} {"train_loss": -11.475920677185059, "global_step": 194198, "epoch": 1155} {"train_loss": -11.473318099975586, "global_step": 194199, "epoch": 1155} {"train_loss": -11.319624900817871, "global_step": 194200, "epoch": 1155} {"train_loss": -11.227652549743652, "global_step": 194201, "epoch": 1155} {"train_loss": -11.245508193969727, "global_step": 194202, "epoch": 1155} {"train_loss": -10.722667694091797, "global_step": 194203, "epoch": 1155} {"train_loss": -11.500638008117676, "global_step": 194204, "epoch": 1155} {"train_loss": -11.155473709106445, "global_step": 194205, "epoch": 1155} {"train_loss": -10.978099822998047, "global_step": 194206, "epoch": 1155} {"train_loss": -11.1955593029658, "global_step": 194207, "epoch": 1155, "val_loss": 248038.109375, "train_action_mse_error": 1.359444499015808} {"train_loss": -11.490750312805176, "global_step": 194208, "epoch": 1156} {"train_loss": -11.115041732788086, "global_step": 194209, "epoch": 1156} {"train_loss": -11.25284194946289, "global_step": 194210, "epoch": 1156} {"train_loss": -11.189229965209961, "global_step": 194211, "epoch": 1156} {"train_loss": -11.084924697875977, "global_step": 194212, "epoch": 1156} {"train_loss": -11.54348373413086, "global_step": 194213, "epoch": 1156} {"train_loss": -11.209432601928711, "global_step": 194214, "epoch": 1156} {"train_loss": -10.382976531982422, "global_step": 194215, "epoch": 1156} {"train_loss": -11.590304374694824, "global_step": 194216, "epoch": 1156} {"train_loss": -11.275097846984863, "global_step": 194217, "epoch": 1156} {"train_loss": -10.977834701538086, "global_step": 194218, "epoch": 1156} {"train_loss": -11.347390174865723, "global_step": 194219, "epoch": 1156} {"train_loss": -10.297066688537598, "global_step": 194220, "epoch": 1156} {"train_loss": -11.049393653869629, "global_step": 194221, "epoch": 1156} {"train_loss": -11.26321792602539, "global_step": 194222, "epoch": 1156} {"train_loss": -11.171428680419922, "global_step": 194223, "epoch": 1156} {"train_loss": -11.668465614318848, "global_step": 194224, "epoch": 1156} {"train_loss": -11.34201431274414, "global_step": 194225, "epoch": 1156} {"train_loss": -11.607967376708984, "global_step": 194226, "epoch": 1156} {"train_loss": -11.408214569091797, "global_step": 194227, "epoch": 1156} {"train_loss": -11.283822059631348, "global_step": 194228, "epoch": 1156} {"train_loss": -11.328178405761719, "global_step": 194229, "epoch": 1156} {"train_loss": -11.011358261108398, "global_step": 194230, "epoch": 1156} {"train_loss": -11.447733879089355, "global_step": 194231, "epoch": 1156} {"train_loss": -11.374414443969727, "global_step": 194232, "epoch": 1156} {"train_loss": -11.681103706359863, "global_step": 194233, "epoch": 1156} {"train_loss": -11.554388046264648, "global_step": 194234, "epoch": 1156} {"train_loss": -11.219415664672852, "global_step": 194235, "epoch": 1156} {"train_loss": -11.398584365844727, "global_step": 194236, "epoch": 1156} {"train_loss": -11.086943626403809, "global_step": 194237, "epoch": 1156} {"train_loss": -11.15536117553711, "global_step": 194238, "epoch": 1156} {"train_loss": -11.607969284057617, "global_step": 194239, "epoch": 1156} {"train_loss": -11.440969467163086, "global_step": 194240, "epoch": 1156} {"train_loss": -11.523706436157227, "global_step": 194241, "epoch": 1156} {"train_loss": -11.366035461425781, "global_step": 194242, "epoch": 1156} {"train_loss": -11.35563850402832, "global_step": 194243, "epoch": 1156} {"train_loss": -11.660443305969238, "global_step": 194244, "epoch": 1156} {"train_loss": -11.34194564819336, "global_step": 194245, "epoch": 1156} {"train_loss": -11.59225845336914, "global_step": 194246, "epoch": 1156} {"train_loss": -11.49658203125, "global_step": 194247, "epoch": 1156} {"train_loss": -11.448542594909668, "global_step": 194248, "epoch": 1156} {"train_loss": -11.060582160949707, "global_step": 194249, "epoch": 1156} {"train_loss": -11.518996238708496, "global_step": 194250, "epoch": 1156} {"train_loss": -11.17470932006836, "global_step": 194251, "epoch": 1156} {"train_loss": -11.532210350036621, "global_step": 194252, "epoch": 1156} {"train_loss": -10.770824432373047, "global_step": 194253, "epoch": 1156} {"train_loss": -11.102468490600586, "global_step": 194254, "epoch": 1156} {"train_loss": -11.300498962402344, "global_step": 194255, "epoch": 1156} {"train_loss": -11.348386764526367, "global_step": 194256, "epoch": 1156} {"train_loss": -11.192169189453125, "global_step": 194257, "epoch": 1156} {"train_loss": -11.434097290039062, "global_step": 194258, "epoch": 1156} {"train_loss": -11.015888214111328, "global_step": 194259, "epoch": 1156} {"train_loss": -10.84821891784668, "global_step": 194260, "epoch": 1156} {"train_loss": -11.36752700805664, "global_step": 194261, "epoch": 1156} {"train_loss": -11.461118698120117, "global_step": 194262, "epoch": 1156} {"train_loss": -11.162589073181152, "global_step": 194263, "epoch": 1156} {"train_loss": -11.114034652709961, "global_step": 194264, "epoch": 1156} {"train_loss": -10.704751968383789, "global_step": 194265, "epoch": 1156} {"train_loss": -11.32520866394043, "global_step": 194266, "epoch": 1156} {"train_loss": -11.032718658447266, "global_step": 194267, "epoch": 1156} {"train_loss": -10.548111915588379, "global_step": 194268, "epoch": 1156} {"train_loss": -10.91280746459961, "global_step": 194269, "epoch": 1156} {"train_loss": -10.859033584594727, "global_step": 194270, "epoch": 1156} {"train_loss": -10.006922721862793, "global_step": 194271, "epoch": 1156} {"train_loss": -11.304328918457031, "global_step": 194272, "epoch": 1156} {"train_loss": -11.13871955871582, "global_step": 194273, "epoch": 1156} {"train_loss": -11.048761367797852, "global_step": 194274, "epoch": 1156} {"train_loss": -10.87391471862793, "global_step": 194275, "epoch": 1156} {"train_loss": -10.713948249816895, "global_step": 194276, "epoch": 1156} {"train_loss": -11.415160179138184, "global_step": 194277, "epoch": 1156} {"train_loss": -10.585495948791504, "global_step": 194278, "epoch": 1156} {"train_loss": -11.569877624511719, "global_step": 194279, "epoch": 1156} {"train_loss": -11.035606384277344, "global_step": 194280, "epoch": 1156} {"train_loss": -11.074498176574707, "global_step": 194281, "epoch": 1156} {"train_loss": -11.422830581665039, "global_step": 194282, "epoch": 1156} {"train_loss": -11.104482650756836, "global_step": 194283, "epoch": 1156} {"train_loss": -11.202035903930664, "global_step": 194284, "epoch": 1156} {"train_loss": -10.971271514892578, "global_step": 194285, "epoch": 1156} {"train_loss": -11.318817138671875, "global_step": 194286, "epoch": 1156} {"train_loss": -11.234758377075195, "global_step": 194287, "epoch": 1156} {"train_loss": -11.352056503295898, "global_step": 194288, "epoch": 1156} {"train_loss": -11.512775421142578, "global_step": 194289, "epoch": 1156} {"train_loss": -11.297157287597656, "global_step": 194290, "epoch": 1156} {"train_loss": -11.434672355651855, "global_step": 194291, "epoch": 1156} {"train_loss": -11.51858901977539, "global_step": 194292, "epoch": 1156} {"train_loss": -11.125407218933105, "global_step": 194293, "epoch": 1156} {"train_loss": -11.478387832641602, "global_step": 194294, "epoch": 1156} {"train_loss": -11.131772994995117, "global_step": 194295, "epoch": 1156} {"train_loss": -11.054758071899414, "global_step": 194296, "epoch": 1156} {"train_loss": -11.364065170288086, "global_step": 194297, "epoch": 1156} {"train_loss": -10.635098457336426, "global_step": 194298, "epoch": 1156} {"train_loss": -11.629983901977539, "global_step": 194299, "epoch": 1156} {"train_loss": -10.785487174987793, "global_step": 194300, "epoch": 1156} {"train_loss": -11.213404655456543, "global_step": 194301, "epoch": 1156} {"train_loss": -11.270563125610352, "global_step": 194302, "epoch": 1156} {"train_loss": -11.100848197937012, "global_step": 194303, "epoch": 1156} {"train_loss": -11.52951431274414, "global_step": 194304, "epoch": 1156} {"train_loss": -11.351527214050293, "global_step": 194305, "epoch": 1156} {"train_loss": -11.46700668334961, "global_step": 194306, "epoch": 1156} {"train_loss": -11.737588882446289, "global_step": 194307, "epoch": 1156} {"train_loss": -11.462921142578125, "global_step": 194308, "epoch": 1156} {"train_loss": -11.611016273498535, "global_step": 194309, "epoch": 1156} {"train_loss": -11.359479904174805, "global_step": 194310, "epoch": 1156} {"train_loss": -11.677987098693848, "global_step": 194311, "epoch": 1156} {"train_loss": -11.635763168334961, "global_step": 194312, "epoch": 1156} {"train_loss": -11.56576156616211, "global_step": 194313, "epoch": 1156} {"train_loss": -11.5645112991333, "global_step": 194314, "epoch": 1156} {"train_loss": -11.302799224853516, "global_step": 194315, "epoch": 1156} {"train_loss": -11.301998138427734, "global_step": 194316, "epoch": 1156} {"train_loss": -11.648736953735352, "global_step": 194317, "epoch": 1156} {"train_loss": -11.209677696228027, "global_step": 194318, "epoch": 1156} {"train_loss": -11.416292190551758, "global_step": 194319, "epoch": 1156} {"train_loss": -11.2634916305542, "global_step": 194320, "epoch": 1156} {"train_loss": -11.428962707519531, "global_step": 194321, "epoch": 1156} {"train_loss": -11.41541862487793, "global_step": 194322, "epoch": 1156} {"train_loss": -11.491994857788086, "global_step": 194323, "epoch": 1156} {"train_loss": -11.535696983337402, "global_step": 194324, "epoch": 1156} {"train_loss": -11.39143180847168, "global_step": 194325, "epoch": 1156} {"train_loss": -11.492279052734375, "global_step": 194326, "epoch": 1156} {"train_loss": -11.603031158447266, "global_step": 194327, "epoch": 1156} {"train_loss": -11.621869087219238, "global_step": 194328, "epoch": 1156} {"train_loss": -11.647688865661621, "global_step": 194329, "epoch": 1156} {"train_loss": -11.516119003295898, "global_step": 194330, "epoch": 1156} {"train_loss": -11.472705841064453, "global_step": 194331, "epoch": 1156} {"train_loss": -10.83969497680664, "global_step": 194332, "epoch": 1156} {"train_loss": -10.554899215698242, "global_step": 194333, "epoch": 1156} {"train_loss": -11.48373031616211, "global_step": 194334, "epoch": 1156} {"train_loss": -11.095297813415527, "global_step": 194335, "epoch": 1156} {"train_loss": -9.718774795532227, "global_step": 194336, "epoch": 1156} {"train_loss": -10.4439697265625, "global_step": 194337, "epoch": 1156} {"train_loss": -10.843891143798828, "global_step": 194338, "epoch": 1156} {"train_loss": -10.793966293334961, "global_step": 194339, "epoch": 1156} {"train_loss": -9.149858474731445, "global_step": 194340, "epoch": 1156} {"train_loss": -9.860979080200195, "global_step": 194341, "epoch": 1156} {"train_loss": -9.79964828491211, "global_step": 194342, "epoch": 1156} {"train_loss": -10.282636642456055, "global_step": 194343, "epoch": 1156} {"train_loss": -10.79557991027832, "global_step": 194344, "epoch": 1156} {"train_loss": -9.646099090576172, "global_step": 194345, "epoch": 1156} {"train_loss": -10.864931106567383, "global_step": 194346, "epoch": 1156} {"train_loss": -10.340707778930664, "global_step": 194347, "epoch": 1156} {"train_loss": -11.01685905456543, "global_step": 194348, "epoch": 1156} {"train_loss": -10.740987777709961, "global_step": 194349, "epoch": 1156} {"train_loss": -11.150039672851562, "global_step": 194350, "epoch": 1156} {"train_loss": -10.930540084838867, "global_step": 194351, "epoch": 1156} {"train_loss": -10.928360939025879, "global_step": 194352, "epoch": 1156} {"train_loss": -11.19620132446289, "global_step": 194353, "epoch": 1156} {"train_loss": -10.481884956359863, "global_step": 194354, "epoch": 1156} {"train_loss": -11.490720748901367, "global_step": 194355, "epoch": 1156} {"train_loss": -10.414548873901367, "global_step": 194356, "epoch": 1156} {"train_loss": -10.983116149902344, "global_step": 194357, "epoch": 1156} {"train_loss": -11.266046524047852, "global_step": 194358, "epoch": 1156} {"train_loss": -10.910375595092773, "global_step": 194359, "epoch": 1156} {"train_loss": -11.299135208129883, "global_step": 194360, "epoch": 1156} {"train_loss": -10.689533233642578, "global_step": 194361, "epoch": 1156} {"train_loss": -11.300031661987305, "global_step": 194362, "epoch": 1156} {"train_loss": -11.14034366607666, "global_step": 194363, "epoch": 1156} {"train_loss": -11.187398910522461, "global_step": 194364, "epoch": 1156} {"train_loss": -11.115227699279785, "global_step": 194365, "epoch": 1156} {"train_loss": -11.219808578491211, "global_step": 194366, "epoch": 1156} {"train_loss": -11.272719383239746, "global_step": 194367, "epoch": 1156} {"train_loss": -11.079841613769531, "global_step": 194368, "epoch": 1156} {"train_loss": -10.960592269897461, "global_step": 194369, "epoch": 1156} {"train_loss": -11.483291625976562, "global_step": 194370, "epoch": 1156} {"train_loss": -10.987853050231934, "global_step": 194371, "epoch": 1156} {"train_loss": -11.107444763183594, "global_step": 194372, "epoch": 1156} {"train_loss": -11.139167785644531, "global_step": 194373, "epoch": 1156} {"train_loss": -11.40517807006836, "global_step": 194374, "epoch": 1156} {"train_loss": -11.158582727114359, "global_step": 194375, "epoch": 1156, "val_loss": 247595.75} {"train_loss": -11.341826438903809, "global_step": 194376, "epoch": 1157} {"train_loss": -10.99315357208252, "global_step": 194377, "epoch": 1157} {"train_loss": -11.34433650970459, "global_step": 194378, "epoch": 1157} {"train_loss": -11.407573699951172, "global_step": 194379, "epoch": 1157} {"train_loss": -11.468513488769531, "global_step": 194380, "epoch": 1157} {"train_loss": -11.348262786865234, "global_step": 194381, "epoch": 1157} {"train_loss": -11.49196720123291, "global_step": 194382, "epoch": 1157} {"train_loss": -11.405630111694336, "global_step": 194383, "epoch": 1157} {"train_loss": -11.344930648803711, "global_step": 194384, "epoch": 1157} {"train_loss": -11.355745315551758, "global_step": 194385, "epoch": 1157} {"train_loss": -11.21088695526123, "global_step": 194386, "epoch": 1157} {"train_loss": -11.586824417114258, "global_step": 194387, "epoch": 1157} {"train_loss": -11.337196350097656, "global_step": 194388, "epoch": 1157} {"train_loss": -11.551055908203125, "global_step": 194389, "epoch": 1157} {"train_loss": -11.384788513183594, "global_step": 194390, "epoch": 1157} {"train_loss": -11.30251693725586, "global_step": 194391, "epoch": 1157} {"train_loss": -11.171293258666992, "global_step": 194392, "epoch": 1157} {"train_loss": -11.320877075195312, "global_step": 194393, "epoch": 1157} {"train_loss": -11.397493362426758, "global_step": 194394, "epoch": 1157} {"train_loss": -11.53103256225586, "global_step": 194395, "epoch": 1157} {"train_loss": -11.474729537963867, "global_step": 194396, "epoch": 1157} {"train_loss": -11.52248764038086, "global_step": 194397, "epoch": 1157} {"train_loss": -11.57973861694336, "global_step": 194398, "epoch": 1157} {"train_loss": -11.272695541381836, "global_step": 194399, "epoch": 1157} {"train_loss": -11.383052825927734, "global_step": 194400, "epoch": 1157} {"train_loss": -11.282703399658203, "global_step": 194401, "epoch": 1157} {"train_loss": -11.58540153503418, "global_step": 194402, "epoch": 1157} {"train_loss": -11.300621032714844, "global_step": 194403, "epoch": 1157} {"train_loss": -11.56551742553711, "global_step": 194404, "epoch": 1157} {"train_loss": -11.0755615234375, "global_step": 194405, "epoch": 1157} {"train_loss": -11.438112258911133, "global_step": 194406, "epoch": 1157} {"train_loss": -11.539865493774414, "global_step": 194407, "epoch": 1157} {"train_loss": -11.49734878540039, "global_step": 194408, "epoch": 1157} {"train_loss": -11.595512390136719, "global_step": 194409, "epoch": 1157} {"train_loss": -11.255376815795898, "global_step": 194410, "epoch": 1157} {"train_loss": -11.463552474975586, "global_step": 194411, "epoch": 1157} {"train_loss": -11.581127166748047, "global_step": 194412, "epoch": 1157} {"train_loss": -11.74295425415039, "global_step": 194413, "epoch": 1157} {"train_loss": -11.274442672729492, "global_step": 194414, "epoch": 1157} {"train_loss": -11.308124542236328, "global_step": 194415, "epoch": 1157} {"train_loss": -11.518918991088867, "global_step": 194416, "epoch": 1157} {"train_loss": -10.98800277709961, "global_step": 194417, "epoch": 1157} {"train_loss": -10.953778266906738, "global_step": 194418, "epoch": 1157} {"train_loss": -11.319911003112793, "global_step": 194419, "epoch": 1157} {"train_loss": -11.022254943847656, "global_step": 194420, "epoch": 1157} {"train_loss": -11.355770111083984, "global_step": 194421, "epoch": 1157} {"train_loss": -11.002182006835938, "global_step": 194422, "epoch": 1157} {"train_loss": -10.591538429260254, "global_step": 194423, "epoch": 1157} {"train_loss": -11.01675033569336, "global_step": 194424, "epoch": 1157} {"train_loss": -11.597799301147461, "global_step": 194425, "epoch": 1157} {"train_loss": -10.751585960388184, "global_step": 194426, "epoch": 1157} {"train_loss": -11.21511173248291, "global_step": 194427, "epoch": 1157} {"train_loss": -11.563957214355469, "global_step": 194428, "epoch": 1157} {"train_loss": -11.291969299316406, "global_step": 194429, "epoch": 1157} {"train_loss": -11.00554084777832, "global_step": 194430, "epoch": 1157} {"train_loss": -11.314067840576172, "global_step": 194431, "epoch": 1157} {"train_loss": -11.523401260375977, "global_step": 194432, "epoch": 1157} {"train_loss": -11.082341194152832, "global_step": 194433, "epoch": 1157} {"train_loss": -11.42999267578125, "global_step": 194434, "epoch": 1157} {"train_loss": -11.193283081054688, "global_step": 194435, "epoch": 1157} {"train_loss": -11.484621047973633, "global_step": 194436, "epoch": 1157} {"train_loss": -11.192058563232422, "global_step": 194437, "epoch": 1157} {"train_loss": -11.479389190673828, "global_step": 194438, "epoch": 1157} {"train_loss": -10.56383991241455, "global_step": 194439, "epoch": 1157} {"train_loss": -11.436777114868164, "global_step": 194440, "epoch": 1157} {"train_loss": -10.555179595947266, "global_step": 194441, "epoch": 1157} {"train_loss": -11.018962860107422, "global_step": 194442, "epoch": 1157} {"train_loss": -10.554566383361816, "global_step": 194443, "epoch": 1157} {"train_loss": -9.760724067687988, "global_step": 194444, "epoch": 1157} {"train_loss": -11.137252807617188, "global_step": 194445, "epoch": 1157} {"train_loss": -9.339384078979492, "global_step": 194446, "epoch": 1157} {"train_loss": -10.46098804473877, "global_step": 194447, "epoch": 1157} {"train_loss": -8.719149589538574, "global_step": 194448, "epoch": 1157} {"train_loss": -9.055585861206055, "global_step": 194449, "epoch": 1157} {"train_loss": -9.044361114501953, "global_step": 194450, "epoch": 1157} {"train_loss": -10.784051895141602, "global_step": 194451, "epoch": 1157} {"train_loss": -8.410876274108887, "global_step": 194452, "epoch": 1157} {"train_loss": -10.850252151489258, "global_step": 194453, "epoch": 1157} {"train_loss": -10.079731941223145, "global_step": 194454, "epoch": 1157} {"train_loss": -9.198294639587402, "global_step": 194455, "epoch": 1157} {"train_loss": -9.531482696533203, "global_step": 194456, "epoch": 1157} {"train_loss": -10.45850944519043, "global_step": 194457, "epoch": 1157} {"train_loss": -9.747068405151367, "global_step": 194458, "epoch": 1157} {"train_loss": -10.86020565032959, "global_step": 194459, "epoch": 1157} {"train_loss": -10.99311351776123, "global_step": 194460, "epoch": 1157} {"train_loss": -9.760223388671875, "global_step": 194461, "epoch": 1157} {"train_loss": -10.332778930664062, "global_step": 194462, "epoch": 1157} {"train_loss": -10.538052558898926, "global_step": 194463, "epoch": 1157} {"train_loss": -9.481704711914062, "global_step": 194464, "epoch": 1157} {"train_loss": -10.776066780090332, "global_step": 194465, "epoch": 1157} {"train_loss": -10.325506210327148, "global_step": 194466, "epoch": 1157} {"train_loss": -9.758872032165527, "global_step": 194467, "epoch": 1157} {"train_loss": -10.818695068359375, "global_step": 194468, "epoch": 1157} {"train_loss": -9.846973419189453, "global_step": 194469, "epoch": 1157} {"train_loss": -10.489377975463867, "global_step": 194470, "epoch": 1157} {"train_loss": -10.736814498901367, "global_step": 194471, "epoch": 1157} {"train_loss": -10.441827774047852, "global_step": 194472, "epoch": 1157} {"train_loss": -10.892878532409668, "global_step": 194473, "epoch": 1157} {"train_loss": -10.800294876098633, "global_step": 194474, "epoch": 1157} {"train_loss": -11.245909690856934, "global_step": 194475, "epoch": 1157} {"train_loss": -10.909576416015625, "global_step": 194476, "epoch": 1157} {"train_loss": -11.148996353149414, "global_step": 194477, "epoch": 1157} {"train_loss": -11.025093078613281, "global_step": 194478, "epoch": 1157} {"train_loss": -11.11884880065918, "global_step": 194479, "epoch": 1157} {"train_loss": -11.26431655883789, "global_step": 194480, "epoch": 1157} {"train_loss": -11.07768440246582, "global_step": 194481, "epoch": 1157} {"train_loss": -11.148844718933105, "global_step": 194482, "epoch": 1157} {"train_loss": -11.210968017578125, "global_step": 194483, "epoch": 1157} {"train_loss": -11.29996395111084, "global_step": 194484, "epoch": 1157} {"train_loss": -11.130175590515137, "global_step": 194485, "epoch": 1157} {"train_loss": -11.10809326171875, "global_step": 194486, "epoch": 1157} {"train_loss": -11.331357955932617, "global_step": 194487, "epoch": 1157} {"train_loss": -11.087059020996094, "global_step": 194488, "epoch": 1157} {"train_loss": -11.220518112182617, "global_step": 194489, "epoch": 1157} {"train_loss": -11.343985557556152, "global_step": 194490, "epoch": 1157} {"train_loss": -11.213841438293457, "global_step": 194491, "epoch": 1157} {"train_loss": -11.12729263305664, "global_step": 194492, "epoch": 1157} {"train_loss": -11.200139999389648, "global_step": 194493, "epoch": 1157} {"train_loss": -11.321533203125, "global_step": 194494, "epoch": 1157} {"train_loss": -10.989511489868164, "global_step": 194495, "epoch": 1157} {"train_loss": -11.153668403625488, "global_step": 194496, "epoch": 1157} {"train_loss": -11.10110092163086, "global_step": 194497, "epoch": 1157} {"train_loss": -11.37215805053711, "global_step": 194498, "epoch": 1157} {"train_loss": -11.238691329956055, "global_step": 194499, "epoch": 1157} {"train_loss": -11.287232398986816, "global_step": 194500, "epoch": 1157} {"train_loss": -11.274741172790527, "global_step": 194501, "epoch": 1157} {"train_loss": -11.461589813232422, "global_step": 194502, "epoch": 1157} {"train_loss": -11.545204162597656, "global_step": 194503, "epoch": 1157} {"train_loss": -11.367027282714844, "global_step": 194504, "epoch": 1157} {"train_loss": -11.422353744506836, "global_step": 194505, "epoch": 1157} {"train_loss": -11.631579399108887, "global_step": 194506, "epoch": 1157} {"train_loss": -11.417292594909668, "global_step": 194507, "epoch": 1157} {"train_loss": -11.43505859375, "global_step": 194508, "epoch": 1157} {"train_loss": -11.490478515625, "global_step": 194509, "epoch": 1157} {"train_loss": -11.407861709594727, "global_step": 194510, "epoch": 1157} {"train_loss": -11.32211685180664, "global_step": 194511, "epoch": 1157} {"train_loss": -11.531214714050293, "global_step": 194512, "epoch": 1157} {"train_loss": -11.382293701171875, "global_step": 194513, "epoch": 1157} {"train_loss": -11.568633079528809, "global_step": 194514, "epoch": 1157} {"train_loss": -11.602798461914062, "global_step": 194515, "epoch": 1157} {"train_loss": -11.281105041503906, "global_step": 194516, "epoch": 1157} {"train_loss": -11.422125816345215, "global_step": 194517, "epoch": 1157} {"train_loss": -11.648972511291504, "global_step": 194518, "epoch": 1157} {"train_loss": -11.730484008789062, "global_step": 194519, "epoch": 1157} {"train_loss": -11.59267807006836, "global_step": 194520, "epoch": 1157} {"train_loss": -11.44991683959961, "global_step": 194521, "epoch": 1157} {"train_loss": -11.674497604370117, "global_step": 194522, "epoch": 1157} {"train_loss": -11.72688102722168, "global_step": 194523, "epoch": 1157} {"train_loss": -11.653295516967773, "global_step": 194524, "epoch": 1157} {"train_loss": -11.808916091918945, "global_step": 194525, "epoch": 1157} {"train_loss": -11.670991897583008, "global_step": 194526, "epoch": 1157} {"train_loss": -11.572644233703613, "global_step": 194527, "epoch": 1157} {"train_loss": -11.674795150756836, "global_step": 194528, "epoch": 1157} {"train_loss": -11.688223838806152, "global_step": 194529, "epoch": 1157} {"train_loss": -11.197105407714844, "global_step": 194530, "epoch": 1157} {"train_loss": -11.613401412963867, "global_step": 194531, "epoch": 1157} {"train_loss": -11.619352340698242, "global_step": 194532, "epoch": 1157} {"train_loss": -11.384293556213379, "global_step": 194533, "epoch": 1157} {"train_loss": -11.508743286132812, "global_step": 194534, "epoch": 1157} {"train_loss": -11.105205535888672, "global_step": 194535, "epoch": 1157} {"train_loss": -11.029012680053711, "global_step": 194536, "epoch": 1157} {"train_loss": -11.494301795959473, "global_step": 194537, "epoch": 1157} {"train_loss": -11.476213455200195, "global_step": 194538, "epoch": 1157} {"train_loss": -11.431680679321289, "global_step": 194539, "epoch": 1157} {"train_loss": -11.61772632598877, "global_step": 194540, "epoch": 1157} {"train_loss": -11.498466491699219, "global_step": 194541, "epoch": 1157} {"train_loss": -11.582561492919922, "global_step": 194542, "epoch": 1157} {"train_loss": -11.113043103899274, "global_step": 194543, "epoch": 1157, "val_loss": 249488.453125} {"train_loss": -10.707763671875, "global_step": 194544, "epoch": 1158} {"train_loss": -11.131117820739746, "global_step": 194545, "epoch": 1158} {"train_loss": -11.54310417175293, "global_step": 194546, "epoch": 1158} {"train_loss": -10.999076843261719, "global_step": 194547, "epoch": 1158} {"train_loss": -11.657313346862793, "global_step": 194548, "epoch": 1158} {"train_loss": -11.256118774414062, "global_step": 194549, "epoch": 1158} {"train_loss": -11.226856231689453, "global_step": 194550, "epoch": 1158} {"train_loss": -11.762981414794922, "global_step": 194551, "epoch": 1158} {"train_loss": -10.881720542907715, "global_step": 194552, "epoch": 1158} {"train_loss": -10.80395793914795, "global_step": 194553, "epoch": 1158} {"train_loss": -11.352629661560059, "global_step": 194554, "epoch": 1158} {"train_loss": -10.542312622070312, "global_step": 194555, "epoch": 1158} {"train_loss": -10.549591064453125, "global_step": 194556, "epoch": 1158} {"train_loss": -11.242630004882812, "global_step": 194557, "epoch": 1158} {"train_loss": -10.427046775817871, "global_step": 194558, "epoch": 1158} {"train_loss": -10.263784408569336, "global_step": 194559, "epoch": 1158} {"train_loss": -10.962108612060547, "global_step": 194560, "epoch": 1158} {"train_loss": -10.0592041015625, "global_step": 194561, "epoch": 1158} {"train_loss": -11.103899955749512, "global_step": 194562, "epoch": 1158} {"train_loss": -10.993952751159668, "global_step": 194563, "epoch": 1158} {"train_loss": -10.682010650634766, "global_step": 194564, "epoch": 1158} {"train_loss": -11.415433883666992, "global_step": 194565, "epoch": 1158} {"train_loss": -11.162399291992188, "global_step": 194566, "epoch": 1158} {"train_loss": -11.452692031860352, "global_step": 194567, "epoch": 1158} {"train_loss": -11.285076141357422, "global_step": 194568, "epoch": 1158} {"train_loss": -11.474750518798828, "global_step": 194569, "epoch": 1158} {"train_loss": -11.361270904541016, "global_step": 194570, "epoch": 1158} {"train_loss": -11.598616600036621, "global_step": 194571, "epoch": 1158} {"train_loss": -11.406896591186523, "global_step": 194572, "epoch": 1158} {"train_loss": -11.43806266784668, "global_step": 194573, "epoch": 1158} {"train_loss": -11.488969802856445, "global_step": 194574, "epoch": 1158} {"train_loss": -11.396768569946289, "global_step": 194575, "epoch": 1158} {"train_loss": -11.31705093383789, "global_step": 194576, "epoch": 1158} {"train_loss": -11.232064247131348, "global_step": 194577, "epoch": 1158} {"train_loss": -11.466142654418945, "global_step": 194578, "epoch": 1158} {"train_loss": -11.194732666015625, "global_step": 194579, "epoch": 1158} {"train_loss": -11.319778442382812, "global_step": 194580, "epoch": 1158} {"train_loss": -11.281916618347168, "global_step": 194581, "epoch": 1158} {"train_loss": -11.3779296875, "global_step": 194582, "epoch": 1158} {"train_loss": -11.261253356933594, "global_step": 194583, "epoch": 1158} {"train_loss": -11.416998863220215, "global_step": 194584, "epoch": 1158} {"train_loss": -11.435726165771484, "global_step": 194585, "epoch": 1158} {"train_loss": -11.16904067993164, "global_step": 194586, "epoch": 1158} {"train_loss": -11.196786880493164, "global_step": 194587, "epoch": 1158} {"train_loss": -11.270637512207031, "global_step": 194588, "epoch": 1158} {"train_loss": -11.448657035827637, "global_step": 194589, "epoch": 1158} {"train_loss": -11.598989486694336, "global_step": 194590, "epoch": 1158} {"train_loss": -11.192169189453125, "global_step": 194591, "epoch": 1158} {"train_loss": -11.594326972961426, "global_step": 194592, "epoch": 1158} {"train_loss": -11.28908920288086, "global_step": 194593, "epoch": 1158} {"train_loss": -11.532854080200195, "global_step": 194594, "epoch": 1158} {"train_loss": -11.140698432922363, "global_step": 194595, "epoch": 1158} {"train_loss": -11.660545349121094, "global_step": 194596, "epoch": 1158} {"train_loss": -11.430765151977539, "global_step": 194597, "epoch": 1158} {"train_loss": -11.399696350097656, "global_step": 194598, "epoch": 1158} {"train_loss": -11.469565391540527, "global_step": 194599, "epoch": 1158} {"train_loss": -11.237515449523926, "global_step": 194600, "epoch": 1158} {"train_loss": -11.549449920654297, "global_step": 194601, "epoch": 1158} {"train_loss": -11.18689250946045, "global_step": 194602, "epoch": 1158} {"train_loss": -11.342844009399414, "global_step": 194603, "epoch": 1158} {"train_loss": -11.423775672912598, "global_step": 194604, "epoch": 1158} {"train_loss": -11.658681869506836, "global_step": 194605, "epoch": 1158} {"train_loss": -11.361688613891602, "global_step": 194606, "epoch": 1158} {"train_loss": -11.566022872924805, "global_step": 194607, "epoch": 1158} {"train_loss": -11.349687576293945, "global_step": 194608, "epoch": 1158} {"train_loss": -11.53093147277832, "global_step": 194609, "epoch": 1158} {"train_loss": -11.093709945678711, "global_step": 194610, "epoch": 1158} {"train_loss": -11.543972969055176, "global_step": 194611, "epoch": 1158} {"train_loss": -11.106578826904297, "global_step": 194612, "epoch": 1158} {"train_loss": -11.052656173706055, "global_step": 194613, "epoch": 1158} {"train_loss": -11.548836708068848, "global_step": 194614, "epoch": 1158} {"train_loss": -11.274377822875977, "global_step": 194615, "epoch": 1158} {"train_loss": -11.339885711669922, "global_step": 194616, "epoch": 1158} {"train_loss": -11.492223739624023, "global_step": 194617, "epoch": 1158} {"train_loss": -11.441274642944336, "global_step": 194618, "epoch": 1158} {"train_loss": -11.462617874145508, "global_step": 194619, "epoch": 1158} {"train_loss": -11.640706062316895, "global_step": 194620, "epoch": 1158} {"train_loss": -11.595247268676758, "global_step": 194621, "epoch": 1158} {"train_loss": -11.841846466064453, "global_step": 194622, "epoch": 1158} {"train_loss": -11.691261291503906, "global_step": 194623, "epoch": 1158} {"train_loss": -11.610578536987305, "global_step": 194624, "epoch": 1158} {"train_loss": -11.875823974609375, "global_step": 194625, "epoch": 1158} {"train_loss": -11.609853744506836, "global_step": 194626, "epoch": 1158} {"train_loss": -11.416574478149414, "global_step": 194627, "epoch": 1158} {"train_loss": -11.474180221557617, "global_step": 194628, "epoch": 1158} {"train_loss": -11.507296562194824, "global_step": 194629, "epoch": 1158} {"train_loss": -11.328429222106934, "global_step": 194630, "epoch": 1158} {"train_loss": -11.391173362731934, "global_step": 194631, "epoch": 1158} {"train_loss": -11.291803359985352, "global_step": 194632, "epoch": 1158} {"train_loss": -10.980576515197754, "global_step": 194633, "epoch": 1158} {"train_loss": -10.097187995910645, "global_step": 194634, "epoch": 1158} {"train_loss": -10.744305610656738, "global_step": 194635, "epoch": 1158} {"train_loss": -10.885354995727539, "global_step": 194636, "epoch": 1158} {"train_loss": -9.820028305053711, "global_step": 194637, "epoch": 1158} {"train_loss": -10.298765182495117, "global_step": 194638, "epoch": 1158} {"train_loss": -11.328256607055664, "global_step": 194639, "epoch": 1158} {"train_loss": -9.231054306030273, "global_step": 194640, "epoch": 1158} {"train_loss": -11.56600570678711, "global_step": 194641, "epoch": 1158} {"train_loss": -9.524850845336914, "global_step": 194642, "epoch": 1158} {"train_loss": -9.930274963378906, "global_step": 194643, "epoch": 1158} {"train_loss": -10.627202987670898, "global_step": 194644, "epoch": 1158} {"train_loss": -9.382259368896484, "global_step": 194645, "epoch": 1158} {"train_loss": -11.225791931152344, "global_step": 194646, "epoch": 1158} {"train_loss": -9.892308235168457, "global_step": 194647, "epoch": 1158} {"train_loss": -11.09438705444336, "global_step": 194648, "epoch": 1158} {"train_loss": -11.100110054016113, "global_step": 194649, "epoch": 1158} {"train_loss": -10.980606079101562, "global_step": 194650, "epoch": 1158} {"train_loss": -11.231061935424805, "global_step": 194651, "epoch": 1158} {"train_loss": -10.940254211425781, "global_step": 194652, "epoch": 1158} {"train_loss": -11.046749114990234, "global_step": 194653, "epoch": 1158} {"train_loss": -11.29445743560791, "global_step": 194654, "epoch": 1158} {"train_loss": -10.580228805541992, "global_step": 194655, "epoch": 1158} {"train_loss": -11.48538589477539, "global_step": 194656, "epoch": 1158} {"train_loss": -11.114114761352539, "global_step": 194657, "epoch": 1158} {"train_loss": -11.032278060913086, "global_step": 194658, "epoch": 1158} {"train_loss": -10.981555938720703, "global_step": 194659, "epoch": 1158} {"train_loss": -10.626394271850586, "global_step": 194660, "epoch": 1158} {"train_loss": -11.27208137512207, "global_step": 194661, "epoch": 1158} {"train_loss": -10.678086280822754, "global_step": 194662, "epoch": 1158} {"train_loss": -11.00190544128418, "global_step": 194663, "epoch": 1158} {"train_loss": -10.910127639770508, "global_step": 194664, "epoch": 1158} {"train_loss": -11.525704383850098, "global_step": 194665, "epoch": 1158} {"train_loss": -11.575014114379883, "global_step": 194666, "epoch": 1158} {"train_loss": -11.218948364257812, "global_step": 194667, "epoch": 1158} {"train_loss": -11.351163864135742, "global_step": 194668, "epoch": 1158} {"train_loss": -11.401259422302246, "global_step": 194669, "epoch": 1158} {"train_loss": -10.950300216674805, "global_step": 194670, "epoch": 1158} {"train_loss": -11.21770191192627, "global_step": 194671, "epoch": 1158} {"train_loss": -11.051406860351562, "global_step": 194672, "epoch": 1158} {"train_loss": -10.799603462219238, "global_step": 194673, "epoch": 1158} {"train_loss": -11.360177040100098, "global_step": 194674, "epoch": 1158} {"train_loss": -11.011430740356445, "global_step": 194675, "epoch": 1158} {"train_loss": -11.063835144042969, "global_step": 194676, "epoch": 1158} {"train_loss": -11.351036071777344, "global_step": 194677, "epoch": 1158} {"train_loss": -11.316566467285156, "global_step": 194678, "epoch": 1158} {"train_loss": -11.520215034484863, "global_step": 194679, "epoch": 1158} {"train_loss": -11.402569770812988, "global_step": 194680, "epoch": 1158} {"train_loss": -11.275365829467773, "global_step": 194681, "epoch": 1158} {"train_loss": -11.379937171936035, "global_step": 194682, "epoch": 1158} {"train_loss": -11.545416831970215, "global_step": 194683, "epoch": 1158} {"train_loss": -11.414596557617188, "global_step": 194684, "epoch": 1158} {"train_loss": -11.618714332580566, "global_step": 194685, "epoch": 1158} {"train_loss": -11.379491806030273, "global_step": 194686, "epoch": 1158} {"train_loss": -11.454154014587402, "global_step": 194687, "epoch": 1158} {"train_loss": -11.364737510681152, "global_step": 194688, "epoch": 1158} {"train_loss": -11.370489120483398, "global_step": 194689, "epoch": 1158} {"train_loss": -11.51695442199707, "global_step": 194690, "epoch": 1158} {"train_loss": -11.466054916381836, "global_step": 194691, "epoch": 1158} {"train_loss": -11.560606956481934, "global_step": 194692, "epoch": 1158} {"train_loss": -11.260699272155762, "global_step": 194693, "epoch": 1158} {"train_loss": -11.135276794433594, "global_step": 194694, "epoch": 1158} {"train_loss": -11.477764129638672, "global_step": 194695, "epoch": 1158} {"train_loss": -11.44861888885498, "global_step": 194696, "epoch": 1158} {"train_loss": -11.515837669372559, "global_step": 194697, "epoch": 1158} {"train_loss": -11.577817916870117, "global_step": 194698, "epoch": 1158} {"train_loss": -11.217653274536133, "global_step": 194699, "epoch": 1158} {"train_loss": -11.645642280578613, "global_step": 194700, "epoch": 1158} {"train_loss": -11.456418991088867, "global_step": 194701, "epoch": 1158} {"train_loss": -11.360856056213379, "global_step": 194702, "epoch": 1158} {"train_loss": -11.295755386352539, "global_step": 194703, "epoch": 1158} {"train_loss": -11.43481159210205, "global_step": 194704, "epoch": 1158} {"train_loss": -11.600616455078125, "global_step": 194705, "epoch": 1158} {"train_loss": -11.229971885681152, "global_step": 194706, "epoch": 1158} {"train_loss": -11.0654878616333, "global_step": 194707, "epoch": 1158} {"train_loss": -11.382445335388184, "global_step": 194708, "epoch": 1158} {"train_loss": -11.324661254882812, "global_step": 194709, "epoch": 1158} {"train_loss": -11.254109382629395, "global_step": 194710, "epoch": 1158} {"train_loss": -11.206448878560748, "global_step": 194711, "epoch": 1158, "val_loss": 248088.609375} {"train_loss": -11.36570930480957, "global_step": 194712, "epoch": 1159} {"train_loss": -11.266587257385254, "global_step": 194713, "epoch": 1159} {"train_loss": -11.377321243286133, "global_step": 194714, "epoch": 1159} {"train_loss": -11.385461807250977, "global_step": 194715, "epoch": 1159} {"train_loss": -11.443742752075195, "global_step": 194716, "epoch": 1159} {"train_loss": -11.756027221679688, "global_step": 194717, "epoch": 1159} {"train_loss": -11.439411163330078, "global_step": 194718, "epoch": 1159} {"train_loss": -11.389062881469727, "global_step": 194719, "epoch": 1159} {"train_loss": -11.52498722076416, "global_step": 194720, "epoch": 1159} {"train_loss": -11.724349021911621, "global_step": 194721, "epoch": 1159} {"train_loss": -11.58090591430664, "global_step": 194722, "epoch": 1159} {"train_loss": -11.29319953918457, "global_step": 194723, "epoch": 1159} {"train_loss": -11.615821838378906, "global_step": 194724, "epoch": 1159} {"train_loss": -11.245453834533691, "global_step": 194725, "epoch": 1159} {"train_loss": -11.3815336227417, "global_step": 194726, "epoch": 1159} {"train_loss": -11.331632614135742, "global_step": 194727, "epoch": 1159} {"train_loss": -11.460354804992676, "global_step": 194728, "epoch": 1159} {"train_loss": -11.379790306091309, "global_step": 194729, "epoch": 1159} {"train_loss": -11.488611221313477, "global_step": 194730, "epoch": 1159} {"train_loss": -11.368570327758789, "global_step": 194731, "epoch": 1159} {"train_loss": -11.51777458190918, "global_step": 194732, "epoch": 1159} {"train_loss": -11.640027046203613, "global_step": 194733, "epoch": 1159} {"train_loss": -11.567560195922852, "global_step": 194734, "epoch": 1159} {"train_loss": -11.458198547363281, "global_step": 194735, "epoch": 1159} {"train_loss": -11.370166778564453, "global_step": 194736, "epoch": 1159} {"train_loss": -11.480039596557617, "global_step": 194737, "epoch": 1159} {"train_loss": -11.040380477905273, "global_step": 194738, "epoch": 1159} {"train_loss": -11.12236213684082, "global_step": 194739, "epoch": 1159} {"train_loss": -10.338949203491211, "global_step": 194740, "epoch": 1159} {"train_loss": -10.443656921386719, "global_step": 194741, "epoch": 1159} {"train_loss": -10.926074981689453, "global_step": 194742, "epoch": 1159} {"train_loss": -11.442447662353516, "global_step": 194743, "epoch": 1159} {"train_loss": -10.413516998291016, "global_step": 194744, "epoch": 1159} {"train_loss": -10.291393280029297, "global_step": 194745, "epoch": 1159} {"train_loss": -11.261274337768555, "global_step": 194746, "epoch": 1159} {"train_loss": -10.48141860961914, "global_step": 194747, "epoch": 1159} {"train_loss": -11.277754783630371, "global_step": 194748, "epoch": 1159} {"train_loss": -10.382904052734375, "global_step": 194749, "epoch": 1159} {"train_loss": -10.879486083984375, "global_step": 194750, "epoch": 1159} {"train_loss": -10.88670539855957, "global_step": 194751, "epoch": 1159} {"train_loss": -10.659947395324707, "global_step": 194752, "epoch": 1159} {"train_loss": -10.94441032409668, "global_step": 194753, "epoch": 1159} {"train_loss": -10.933577537536621, "global_step": 194754, "epoch": 1159} {"train_loss": -11.089983940124512, "global_step": 194755, "epoch": 1159} {"train_loss": -10.500688552856445, "global_step": 194756, "epoch": 1159} {"train_loss": -10.491754531860352, "global_step": 194757, "epoch": 1159} {"train_loss": -10.77973461151123, "global_step": 194758, "epoch": 1159} {"train_loss": -10.874015808105469, "global_step": 194759, "epoch": 1159} {"train_loss": -11.166020393371582, "global_step": 194760, "epoch": 1159} {"train_loss": -11.09557056427002, "global_step": 194761, "epoch": 1159} {"train_loss": -11.236084938049316, "global_step": 194762, "epoch": 1159} {"train_loss": -10.991667747497559, "global_step": 194763, "epoch": 1159} {"train_loss": -11.225263595581055, "global_step": 194764, "epoch": 1159} {"train_loss": -11.314665794372559, "global_step": 194765, "epoch": 1159} {"train_loss": -11.32443618774414, "global_step": 194766, "epoch": 1159} {"train_loss": -11.140812873840332, "global_step": 194767, "epoch": 1159} {"train_loss": -10.918407440185547, "global_step": 194768, "epoch": 1159} {"train_loss": -11.229696273803711, "global_step": 194769, "epoch": 1159} {"train_loss": -11.380666732788086, "global_step": 194770, "epoch": 1159} {"train_loss": -11.196372985839844, "global_step": 194771, "epoch": 1159} {"train_loss": -11.386899948120117, "global_step": 194772, "epoch": 1159} {"train_loss": -10.156820297241211, "global_step": 194773, "epoch": 1159} {"train_loss": -11.082141876220703, "global_step": 194774, "epoch": 1159} {"train_loss": -11.104774475097656, "global_step": 194775, "epoch": 1159} {"train_loss": -10.449541091918945, "global_step": 194776, "epoch": 1159} {"train_loss": -11.477095603942871, "global_step": 194777, "epoch": 1159} {"train_loss": -10.517536163330078, "global_step": 194778, "epoch": 1159} {"train_loss": -11.379690170288086, "global_step": 194779, "epoch": 1159} {"train_loss": -11.328356742858887, "global_step": 194780, "epoch": 1159} {"train_loss": -11.295442581176758, "global_step": 194781, "epoch": 1159} {"train_loss": -11.487421035766602, "global_step": 194782, "epoch": 1159} {"train_loss": -11.032828330993652, "global_step": 194783, "epoch": 1159} {"train_loss": -11.441242218017578, "global_step": 194784, "epoch": 1159} {"train_loss": -11.333847999572754, "global_step": 194785, "epoch": 1159} {"train_loss": -11.220643997192383, "global_step": 194786, "epoch": 1159} {"train_loss": -11.437629699707031, "global_step": 194787, "epoch": 1159} {"train_loss": -11.395893096923828, "global_step": 194788, "epoch": 1159} {"train_loss": -11.371625900268555, "global_step": 194789, "epoch": 1159} {"train_loss": -11.400107383728027, "global_step": 194790, "epoch": 1159} {"train_loss": -11.38314437866211, "global_step": 194791, "epoch": 1159} {"train_loss": -11.175331115722656, "global_step": 194792, "epoch": 1159} {"train_loss": -11.172187805175781, "global_step": 194793, "epoch": 1159} {"train_loss": -10.614082336425781, "global_step": 194794, "epoch": 1159} {"train_loss": -10.382476806640625, "global_step": 194795, "epoch": 1159} {"train_loss": -11.128705024719238, "global_step": 194796, "epoch": 1159} {"train_loss": -9.996373176574707, "global_step": 194797, "epoch": 1159} {"train_loss": -11.281484603881836, "global_step": 194798, "epoch": 1159} {"train_loss": -10.786775588989258, "global_step": 194799, "epoch": 1159} {"train_loss": -11.108667373657227, "global_step": 194800, "epoch": 1159} {"train_loss": -10.916299819946289, "global_step": 194801, "epoch": 1159} {"train_loss": -11.170751571655273, "global_step": 194802, "epoch": 1159} {"train_loss": -11.102243423461914, "global_step": 194803, "epoch": 1159} {"train_loss": -10.94172477722168, "global_step": 194804, "epoch": 1159} {"train_loss": -11.148482322692871, "global_step": 194805, "epoch": 1159} {"train_loss": -11.226175308227539, "global_step": 194806, "epoch": 1159} {"train_loss": -11.263209342956543, "global_step": 194807, "epoch": 1159} {"train_loss": -11.278974533081055, "global_step": 194808, "epoch": 1159} {"train_loss": -11.255472183227539, "global_step": 194809, "epoch": 1159} {"train_loss": -11.259299278259277, "global_step": 194810, "epoch": 1159} {"train_loss": -11.35453987121582, "global_step": 194811, "epoch": 1159} {"train_loss": -11.02389907836914, "global_step": 194812, "epoch": 1159} {"train_loss": -11.5188627243042, "global_step": 194813, "epoch": 1159} {"train_loss": -11.066354751586914, "global_step": 194814, "epoch": 1159} {"train_loss": -11.499225616455078, "global_step": 194815, "epoch": 1159} {"train_loss": -10.882866859436035, "global_step": 194816, "epoch": 1159} {"train_loss": -11.302123069763184, "global_step": 194817, "epoch": 1159} {"train_loss": -11.047019958496094, "global_step": 194818, "epoch": 1159} {"train_loss": -11.114738464355469, "global_step": 194819, "epoch": 1159} {"train_loss": -11.473274230957031, "global_step": 194820, "epoch": 1159} {"train_loss": -10.925813674926758, "global_step": 194821, "epoch": 1159} {"train_loss": -11.480382919311523, "global_step": 194822, "epoch": 1159} {"train_loss": -10.921387672424316, "global_step": 194823, "epoch": 1159} {"train_loss": -11.347064018249512, "global_step": 194824, "epoch": 1159} {"train_loss": -11.12330150604248, "global_step": 194825, "epoch": 1159} {"train_loss": -11.363276481628418, "global_step": 194826, "epoch": 1159} {"train_loss": -11.03310775756836, "global_step": 194827, "epoch": 1159} {"train_loss": -11.438261032104492, "global_step": 194828, "epoch": 1159} {"train_loss": -11.311151504516602, "global_step": 194829, "epoch": 1159} {"train_loss": -11.585265159606934, "global_step": 194830, "epoch": 1159} {"train_loss": -11.218902587890625, "global_step": 194831, "epoch": 1159} {"train_loss": -11.40340805053711, "global_step": 194832, "epoch": 1159} {"train_loss": -11.514532089233398, "global_step": 194833, "epoch": 1159} {"train_loss": -11.387531280517578, "global_step": 194834, "epoch": 1159} {"train_loss": -11.412642478942871, "global_step": 194835, "epoch": 1159} {"train_loss": -11.272514343261719, "global_step": 194836, "epoch": 1159} {"train_loss": -11.521665573120117, "global_step": 194837, "epoch": 1159} {"train_loss": -11.288684844970703, "global_step": 194838, "epoch": 1159} {"train_loss": -11.464329719543457, "global_step": 194839, "epoch": 1159} {"train_loss": -11.433695793151855, "global_step": 194840, "epoch": 1159} {"train_loss": -11.644854545593262, "global_step": 194841, "epoch": 1159} {"train_loss": -11.422632217407227, "global_step": 194842, "epoch": 1159} {"train_loss": -11.408134460449219, "global_step": 194843, "epoch": 1159} {"train_loss": -11.230663299560547, "global_step": 194844, "epoch": 1159} {"train_loss": -11.421392440795898, "global_step": 194845, "epoch": 1159} {"train_loss": -11.023822784423828, "global_step": 194846, "epoch": 1159} {"train_loss": -11.500627517700195, "global_step": 194847, "epoch": 1159} {"train_loss": -11.486494064331055, "global_step": 194848, "epoch": 1159} {"train_loss": -11.181272506713867, "global_step": 194849, "epoch": 1159} {"train_loss": -11.623546600341797, "global_step": 194850, "epoch": 1159} {"train_loss": -11.14358139038086, "global_step": 194851, "epoch": 1159} {"train_loss": -11.193231582641602, "global_step": 194852, "epoch": 1159} {"train_loss": -11.379376411437988, "global_step": 194853, "epoch": 1159} {"train_loss": -11.323467254638672, "global_step": 194854, "epoch": 1159} {"train_loss": -11.148222923278809, "global_step": 194855, "epoch": 1159} {"train_loss": -11.419740676879883, "global_step": 194856, "epoch": 1159} {"train_loss": -11.102163314819336, "global_step": 194857, "epoch": 1159} {"train_loss": -11.405607223510742, "global_step": 194858, "epoch": 1159} {"train_loss": -11.560128211975098, "global_step": 194859, "epoch": 1159} {"train_loss": -11.137186050415039, "global_step": 194860, "epoch": 1159} {"train_loss": -11.43062686920166, "global_step": 194861, "epoch": 1159} {"train_loss": -11.66923713684082, "global_step": 194862, "epoch": 1159} {"train_loss": -11.362674713134766, "global_step": 194863, "epoch": 1159} {"train_loss": -11.528580665588379, "global_step": 194864, "epoch": 1159} {"train_loss": -11.137222290039062, "global_step": 194865, "epoch": 1159} {"train_loss": -11.384428977966309, "global_step": 194866, "epoch": 1159} {"train_loss": -11.336759567260742, "global_step": 194867, "epoch": 1159} {"train_loss": -11.204967498779297, "global_step": 194868, "epoch": 1159} {"train_loss": -11.18522834777832, "global_step": 194869, "epoch": 1159} {"train_loss": -11.527691841125488, "global_step": 194870, "epoch": 1159} {"train_loss": -11.567413330078125, "global_step": 194871, "epoch": 1159} {"train_loss": -11.278406143188477, "global_step": 194872, "epoch": 1159} {"train_loss": -11.440048217773438, "global_step": 194873, "epoch": 1159} {"train_loss": -11.051995277404785, "global_step": 194874, "epoch": 1159} {"train_loss": -11.422796249389648, "global_step": 194875, "epoch": 1159} {"train_loss": -11.26093864440918, "global_step": 194876, "epoch": 1159} {"train_loss": -11.358863830566406, "global_step": 194877, "epoch": 1159} {"train_loss": -10.930035591125488, "global_step": 194878, "epoch": 1159} {"train_loss": -11.209256728490194, "global_step": 194879, "epoch": 1159, "val_loss": 249792.78125} {"train_loss": -11.47653579711914, "global_step": 194880, "epoch": 1160} {"train_loss": -10.997159957885742, "global_step": 194881, "epoch": 1160} {"train_loss": -11.205095291137695, "global_step": 194882, "epoch": 1160} {"train_loss": -11.41028118133545, "global_step": 194883, "epoch": 1160} {"train_loss": -10.988174438476562, "global_step": 194884, "epoch": 1160} {"train_loss": -11.120128631591797, "global_step": 194885, "epoch": 1160} {"train_loss": -11.60410213470459, "global_step": 194886, "epoch": 1160} {"train_loss": -11.098760604858398, "global_step": 194887, "epoch": 1160} {"train_loss": -11.336710929870605, "global_step": 194888, "epoch": 1160} {"train_loss": -11.15910530090332, "global_step": 194889, "epoch": 1160} {"train_loss": -11.347455978393555, "global_step": 194890, "epoch": 1160} {"train_loss": -10.964471817016602, "global_step": 194891, "epoch": 1160} {"train_loss": -11.062220573425293, "global_step": 194892, "epoch": 1160} {"train_loss": -10.884956359863281, "global_step": 194893, "epoch": 1160} {"train_loss": -10.771749496459961, "global_step": 194894, "epoch": 1160} {"train_loss": -10.537412643432617, "global_step": 194895, "epoch": 1160} {"train_loss": -11.404952049255371, "global_step": 194896, "epoch": 1160} {"train_loss": -10.926979064941406, "global_step": 194897, "epoch": 1160} {"train_loss": -11.025408744812012, "global_step": 194898, "epoch": 1160} {"train_loss": -11.021102905273438, "global_step": 194899, "epoch": 1160} {"train_loss": -9.911386489868164, "global_step": 194900, "epoch": 1160} {"train_loss": -10.232146263122559, "global_step": 194901, "epoch": 1160} {"train_loss": -10.527865409851074, "global_step": 194902, "epoch": 1160} {"train_loss": -10.850425720214844, "global_step": 194903, "epoch": 1160} {"train_loss": -10.27087688446045, "global_step": 194904, "epoch": 1160} {"train_loss": -9.432950973510742, "global_step": 194905, "epoch": 1160} {"train_loss": -11.246465682983398, "global_step": 194906, "epoch": 1160} {"train_loss": -10.253725051879883, "global_step": 194907, "epoch": 1160} {"train_loss": -10.824522018432617, "global_step": 194908, "epoch": 1160} {"train_loss": -10.523908615112305, "global_step": 194909, "epoch": 1160} {"train_loss": -10.559271812438965, "global_step": 194910, "epoch": 1160} {"train_loss": -11.30681037902832, "global_step": 194911, "epoch": 1160} {"train_loss": -10.576128005981445, "global_step": 194912, "epoch": 1160} {"train_loss": -11.274829864501953, "global_step": 194913, "epoch": 1160} {"train_loss": -11.104141235351562, "global_step": 194914, "epoch": 1160} {"train_loss": -10.956220626831055, "global_step": 194915, "epoch": 1160} {"train_loss": -11.188180923461914, "global_step": 194916, "epoch": 1160} {"train_loss": -11.261293411254883, "global_step": 194917, "epoch": 1160} {"train_loss": -10.960065841674805, "global_step": 194918, "epoch": 1160} {"train_loss": -11.17495059967041, "global_step": 194919, "epoch": 1160} {"train_loss": -10.832335472106934, "global_step": 194920, "epoch": 1160} {"train_loss": -11.135026931762695, "global_step": 194921, "epoch": 1160} {"train_loss": -10.776147842407227, "global_step": 194922, "epoch": 1160} {"train_loss": -10.616731643676758, "global_step": 194923, "epoch": 1160} {"train_loss": -10.835609436035156, "global_step": 194924, "epoch": 1160} {"train_loss": -10.546791076660156, "global_step": 194925, "epoch": 1160} {"train_loss": -10.509300231933594, "global_step": 194926, "epoch": 1160} {"train_loss": -10.853414535522461, "global_step": 194927, "epoch": 1160} {"train_loss": -10.07007122039795, "global_step": 194928, "epoch": 1160} {"train_loss": -11.202741622924805, "global_step": 194929, "epoch": 1160} {"train_loss": -10.295560836791992, "global_step": 194930, "epoch": 1160} {"train_loss": -10.67216682434082, "global_step": 194931, "epoch": 1160} {"train_loss": -10.708043098449707, "global_step": 194932, "epoch": 1160} {"train_loss": -10.56144905090332, "global_step": 194933, "epoch": 1160} {"train_loss": -10.484615325927734, "global_step": 194934, "epoch": 1160} {"train_loss": -10.549763679504395, "global_step": 194935, "epoch": 1160} {"train_loss": -10.30366325378418, "global_step": 194936, "epoch": 1160} {"train_loss": -11.072728157043457, "global_step": 194937, "epoch": 1160} {"train_loss": -10.665284156799316, "global_step": 194938, "epoch": 1160} {"train_loss": -10.781352996826172, "global_step": 194939, "epoch": 1160} {"train_loss": -10.69120979309082, "global_step": 194940, "epoch": 1160} {"train_loss": -11.150487899780273, "global_step": 194941, "epoch": 1160} {"train_loss": -10.921321868896484, "global_step": 194942, "epoch": 1160} {"train_loss": -11.08417797088623, "global_step": 194943, "epoch": 1160} {"train_loss": -11.241514205932617, "global_step": 194944, "epoch": 1160} {"train_loss": -11.034521102905273, "global_step": 194945, "epoch": 1160} {"train_loss": -10.739931106567383, "global_step": 194946, "epoch": 1160} {"train_loss": -11.173863410949707, "global_step": 194947, "epoch": 1160} {"train_loss": -10.756921768188477, "global_step": 194948, "epoch": 1160} {"train_loss": -11.020101547241211, "global_step": 194949, "epoch": 1160} {"train_loss": -10.878616333007812, "global_step": 194950, "epoch": 1160} {"train_loss": -11.129327774047852, "global_step": 194951, "epoch": 1160} {"train_loss": -11.046152114868164, "global_step": 194952, "epoch": 1160} {"train_loss": -11.47404670715332, "global_step": 194953, "epoch": 1160} {"train_loss": -10.783491134643555, "global_step": 194954, "epoch": 1160} {"train_loss": -11.410359382629395, "global_step": 194955, "epoch": 1160} {"train_loss": -11.084843635559082, "global_step": 194956, "epoch": 1160} {"train_loss": -11.415326118469238, "global_step": 194957, "epoch": 1160} {"train_loss": -11.063131332397461, "global_step": 194958, "epoch": 1160} {"train_loss": -11.390798568725586, "global_step": 194959, "epoch": 1160} {"train_loss": -11.298736572265625, "global_step": 194960, "epoch": 1160} {"train_loss": -11.542120933532715, "global_step": 194961, "epoch": 1160} {"train_loss": -11.224650382995605, "global_step": 194962, "epoch": 1160} {"train_loss": -11.257955551147461, "global_step": 194963, "epoch": 1160} {"train_loss": -11.470995903015137, "global_step": 194964, "epoch": 1160} {"train_loss": -11.344416618347168, "global_step": 194965, "epoch": 1160} {"train_loss": -11.56198501586914, "global_step": 194966, "epoch": 1160} {"train_loss": -11.64417839050293, "global_step": 194967, "epoch": 1160} {"train_loss": -11.519904136657715, "global_step": 194968, "epoch": 1160} {"train_loss": -11.462714195251465, "global_step": 194969, "epoch": 1160} {"train_loss": -11.4840726852417, "global_step": 194970, "epoch": 1160} {"train_loss": -11.401392936706543, "global_step": 194971, "epoch": 1160} {"train_loss": -11.626668930053711, "global_step": 194972, "epoch": 1160} {"train_loss": -11.27699089050293, "global_step": 194973, "epoch": 1160} {"train_loss": -11.513673782348633, "global_step": 194974, "epoch": 1160} {"train_loss": -11.65161418914795, "global_step": 194975, "epoch": 1160} {"train_loss": -11.180842399597168, "global_step": 194976, "epoch": 1160} {"train_loss": -11.371458053588867, "global_step": 194977, "epoch": 1160} {"train_loss": -11.320188522338867, "global_step": 194978, "epoch": 1160} {"train_loss": -11.438909530639648, "global_step": 194979, "epoch": 1160} {"train_loss": -11.428757667541504, "global_step": 194980, "epoch": 1160} {"train_loss": -11.598602294921875, "global_step": 194981, "epoch": 1160} {"train_loss": -11.402427673339844, "global_step": 194982, "epoch": 1160} {"train_loss": -11.60927677154541, "global_step": 194983, "epoch": 1160} {"train_loss": -11.444700241088867, "global_step": 194984, "epoch": 1160} {"train_loss": -11.64833927154541, "global_step": 194985, "epoch": 1160} {"train_loss": -11.622760772705078, "global_step": 194986, "epoch": 1160} {"train_loss": -11.712848663330078, "global_step": 194987, "epoch": 1160} {"train_loss": -11.337027549743652, "global_step": 194988, "epoch": 1160} {"train_loss": -11.584854125976562, "global_step": 194989, "epoch": 1160} {"train_loss": -11.610501289367676, "global_step": 194990, "epoch": 1160} {"train_loss": -11.680413246154785, "global_step": 194991, "epoch": 1160} {"train_loss": -11.80245590209961, "global_step": 194992, "epoch": 1160} {"train_loss": -11.685857772827148, "global_step": 194993, "epoch": 1160} {"train_loss": -11.664883613586426, "global_step": 194994, "epoch": 1160} {"train_loss": -11.52845573425293, "global_step": 194995, "epoch": 1160} {"train_loss": -11.777985572814941, "global_step": 194996, "epoch": 1160} {"train_loss": -11.796053886413574, "global_step": 194997, "epoch": 1160} {"train_loss": -11.7349271774292, "global_step": 194998, "epoch": 1160} {"train_loss": -11.577951431274414, "global_step": 194999, "epoch": 1160} {"train_loss": -11.785503387451172, "global_step": 195000, "epoch": 1160} {"train_loss": -11.557788848876953, "global_step": 195001, "epoch": 1160} {"train_loss": -11.45888614654541, "global_step": 195002, "epoch": 1160} {"train_loss": -11.908693313598633, "global_step": 195003, "epoch": 1160} {"train_loss": -11.942648887634277, "global_step": 195004, "epoch": 1160} {"train_loss": -11.64248275756836, "global_step": 195005, "epoch": 1160} {"train_loss": -11.682775497436523, "global_step": 195006, "epoch": 1160} {"train_loss": -11.642340660095215, "global_step": 195007, "epoch": 1160} {"train_loss": -11.491964340209961, "global_step": 195008, "epoch": 1160} {"train_loss": -11.386442184448242, "global_step": 195009, "epoch": 1160} {"train_loss": -11.503096580505371, "global_step": 195010, "epoch": 1160} {"train_loss": -11.723952293395996, "global_step": 195011, "epoch": 1160} {"train_loss": -11.705974578857422, "global_step": 195012, "epoch": 1160} {"train_loss": -11.556279182434082, "global_step": 195013, "epoch": 1160} {"train_loss": -11.583720207214355, "global_step": 195014, "epoch": 1160} {"train_loss": -11.279659271240234, "global_step": 195015, "epoch": 1160} {"train_loss": -11.319478034973145, "global_step": 195016, "epoch": 1160} {"train_loss": -11.399871826171875, "global_step": 195017, "epoch": 1160} {"train_loss": -11.656946182250977, "global_step": 195018, "epoch": 1160} {"train_loss": -11.501143455505371, "global_step": 195019, "epoch": 1160} {"train_loss": -11.441047668457031, "global_step": 195020, "epoch": 1160} {"train_loss": -11.210302352905273, "global_step": 195021, "epoch": 1160} {"train_loss": -11.160689353942871, "global_step": 195022, "epoch": 1160} {"train_loss": -11.662346839904785, "global_step": 195023, "epoch": 1160} {"train_loss": -11.612879753112793, "global_step": 195024, "epoch": 1160} {"train_loss": -11.532598495483398, "global_step": 195025, "epoch": 1160} {"train_loss": -11.536062240600586, "global_step": 195026, "epoch": 1160} {"train_loss": -11.467703819274902, "global_step": 195027, "epoch": 1160} {"train_loss": -11.245889663696289, "global_step": 195028, "epoch": 1160} {"train_loss": -10.632287979125977, "global_step": 195029, "epoch": 1160} {"train_loss": -10.44807243347168, "global_step": 195030, "epoch": 1160} {"train_loss": -10.853469848632812, "global_step": 195031, "epoch": 1160} {"train_loss": -11.475754737854004, "global_step": 195032, "epoch": 1160} {"train_loss": -10.941761016845703, "global_step": 195033, "epoch": 1160} {"train_loss": -10.720479965209961, "global_step": 195034, "epoch": 1160} {"train_loss": -10.491214752197266, "global_step": 195035, "epoch": 1160} {"train_loss": -10.816822052001953, "global_step": 195036, "epoch": 1160} {"train_loss": -10.958053588867188, "global_step": 195037, "epoch": 1160} {"train_loss": -11.277429580688477, "global_step": 195038, "epoch": 1160} {"train_loss": -10.477816581726074, "global_step": 195039, "epoch": 1160} {"train_loss": -11.275976181030273, "global_step": 195040, "epoch": 1160} {"train_loss": -10.83137321472168, "global_step": 195041, "epoch": 1160} {"train_loss": -10.57666301727295, "global_step": 195042, "epoch": 1160} {"train_loss": -11.054132461547852, "global_step": 195043, "epoch": 1160} {"train_loss": -10.35410213470459, "global_step": 195044, "epoch": 1160} {"train_loss": -9.32734489440918, "global_step": 195045, "epoch": 1160} {"train_loss": -9.606361389160156, "global_step": 195046, "epoch": 1160} {"train_loss": -11.128387803123111, "global_step": 195047, "epoch": 1160, "val_loss": 246930.46875, "train_action_mse_error": 1.380563497543335} {"train_loss": -9.957566261291504, "global_step": 195048, "epoch": 1161} {"train_loss": -9.70390796661377, "global_step": 195049, "epoch": 1161} {"train_loss": -10.820066452026367, "global_step": 195050, "epoch": 1161} {"train_loss": -8.690223693847656, "global_step": 195051, "epoch": 1161} {"train_loss": -8.494739532470703, "global_step": 195052, "epoch": 1161} {"train_loss": -10.005569458007812, "global_step": 195053, "epoch": 1161} {"train_loss": -9.867752075195312, "global_step": 195054, "epoch": 1161} {"train_loss": -9.222323417663574, "global_step": 195055, "epoch": 1161} {"train_loss": -10.743426322937012, "global_step": 195056, "epoch": 1161} {"train_loss": -10.372648239135742, "global_step": 195057, "epoch": 1161} {"train_loss": -9.863819122314453, "global_step": 195058, "epoch": 1161} {"train_loss": -10.770167350769043, "global_step": 195059, "epoch": 1161} {"train_loss": -9.649478912353516, "global_step": 195060, "epoch": 1161} {"train_loss": -10.03976821899414, "global_step": 195061, "epoch": 1161} {"train_loss": -11.007675170898438, "global_step": 195062, "epoch": 1161} {"train_loss": -10.210969924926758, "global_step": 195063, "epoch": 1161} {"train_loss": -10.631731033325195, "global_step": 195064, "epoch": 1161} {"train_loss": -10.699127197265625, "global_step": 195065, "epoch": 1161} {"train_loss": -10.481678009033203, "global_step": 195066, "epoch": 1161} {"train_loss": -10.679755210876465, "global_step": 195067, "epoch": 1161} {"train_loss": -10.747306823730469, "global_step": 195068, "epoch": 1161} {"train_loss": -10.61306095123291, "global_step": 195069, "epoch": 1161} {"train_loss": -10.599288940429688, "global_step": 195070, "epoch": 1161} {"train_loss": -11.071715354919434, "global_step": 195071, "epoch": 1161} {"train_loss": -11.057331085205078, "global_step": 195072, "epoch": 1161} {"train_loss": -10.79172420501709, "global_step": 195073, "epoch": 1161} {"train_loss": -10.88636589050293, "global_step": 195074, "epoch": 1161} {"train_loss": -11.156303405761719, "global_step": 195075, "epoch": 1161} {"train_loss": -10.99377155303955, "global_step": 195076, "epoch": 1161} {"train_loss": -10.935443878173828, "global_step": 195077, "epoch": 1161} {"train_loss": -11.196197509765625, "global_step": 195078, "epoch": 1161} {"train_loss": -11.178670883178711, "global_step": 195079, "epoch": 1161} {"train_loss": -10.944414138793945, "global_step": 195080, "epoch": 1161} {"train_loss": -11.194278717041016, "global_step": 195081, "epoch": 1161} {"train_loss": -11.020169258117676, "global_step": 195082, "epoch": 1161} {"train_loss": -11.23233413696289, "global_step": 195083, "epoch": 1161} {"train_loss": -11.355324745178223, "global_step": 195084, "epoch": 1161} {"train_loss": -11.061052322387695, "global_step": 195085, "epoch": 1161} {"train_loss": -11.282825469970703, "global_step": 195086, "epoch": 1161} {"train_loss": -11.391114234924316, "global_step": 195087, "epoch": 1161} {"train_loss": -11.330720901489258, "global_step": 195088, "epoch": 1161} {"train_loss": -11.333043098449707, "global_step": 195089, "epoch": 1161} {"train_loss": -11.51596450805664, "global_step": 195090, "epoch": 1161} {"train_loss": -11.325874328613281, "global_step": 195091, "epoch": 1161} {"train_loss": -11.034479141235352, "global_step": 195092, "epoch": 1161} {"train_loss": -11.260912895202637, "global_step": 195093, "epoch": 1161} {"train_loss": -11.264670372009277, "global_step": 195094, "epoch": 1161} {"train_loss": -11.122450828552246, "global_step": 195095, "epoch": 1161} {"train_loss": -11.263408660888672, "global_step": 195096, "epoch": 1161} {"train_loss": -11.251916885375977, "global_step": 195097, "epoch": 1161} {"train_loss": -11.332496643066406, "global_step": 195098, "epoch": 1161} {"train_loss": -11.338663101196289, "global_step": 195099, "epoch": 1161} {"train_loss": -11.453102111816406, "global_step": 195100, "epoch": 1161} {"train_loss": -11.229915618896484, "global_step": 195101, "epoch": 1161} {"train_loss": -11.472347259521484, "global_step": 195102, "epoch": 1161} {"train_loss": -11.321730613708496, "global_step": 195103, "epoch": 1161} {"train_loss": -11.598663330078125, "global_step": 195104, "epoch": 1161} {"train_loss": -11.588593482971191, "global_step": 195105, "epoch": 1161} {"train_loss": -11.64835262298584, "global_step": 195106, "epoch": 1161} {"train_loss": -11.538984298706055, "global_step": 195107, "epoch": 1161} {"train_loss": -11.318750381469727, "global_step": 195108, "epoch": 1161} {"train_loss": -11.563329696655273, "global_step": 195109, "epoch": 1161} {"train_loss": -11.44726848602295, "global_step": 195110, "epoch": 1161} {"train_loss": -11.656189918518066, "global_step": 195111, "epoch": 1161} {"train_loss": -11.728601455688477, "global_step": 195112, "epoch": 1161} {"train_loss": -11.500246047973633, "global_step": 195113, "epoch": 1161} {"train_loss": -11.581856727600098, "global_step": 195114, "epoch": 1161} {"train_loss": -11.64687728881836, "global_step": 195115, "epoch": 1161} {"train_loss": -11.383708953857422, "global_step": 195116, "epoch": 1161} {"train_loss": -11.722419738769531, "global_step": 195117, "epoch": 1161} {"train_loss": -11.552436828613281, "global_step": 195118, "epoch": 1161} {"train_loss": -11.490131378173828, "global_step": 195119, "epoch": 1161} {"train_loss": -11.767197608947754, "global_step": 195120, "epoch": 1161} {"train_loss": -11.422637939453125, "global_step": 195121, "epoch": 1161} {"train_loss": -11.402034759521484, "global_step": 195122, "epoch": 1161} {"train_loss": -11.542475700378418, "global_step": 195123, "epoch": 1161} {"train_loss": -11.471826553344727, "global_step": 195124, "epoch": 1161} {"train_loss": -11.296446800231934, "global_step": 195125, "epoch": 1161} {"train_loss": -10.856305122375488, "global_step": 195126, "epoch": 1161} {"train_loss": -11.442707061767578, "global_step": 195127, "epoch": 1161} {"train_loss": -11.686405181884766, "global_step": 195128, "epoch": 1161} {"train_loss": -11.5586576461792, "global_step": 195129, "epoch": 1161} {"train_loss": -11.618919372558594, "global_step": 195130, "epoch": 1161} {"train_loss": -11.508450508117676, "global_step": 195131, "epoch": 1161} {"train_loss": -11.495535850524902, "global_step": 195132, "epoch": 1161} {"train_loss": -11.333620071411133, "global_step": 195133, "epoch": 1161} {"train_loss": -11.654964447021484, "global_step": 195134, "epoch": 1161} {"train_loss": -11.407500267028809, "global_step": 195135, "epoch": 1161} {"train_loss": -11.405500411987305, "global_step": 195136, "epoch": 1161} {"train_loss": -11.607511520385742, "global_step": 195137, "epoch": 1161} {"train_loss": -11.661643028259277, "global_step": 195138, "epoch": 1161} {"train_loss": -11.636236190795898, "global_step": 195139, "epoch": 1161} {"train_loss": -11.571307182312012, "global_step": 195140, "epoch": 1161} {"train_loss": -11.696842193603516, "global_step": 195141, "epoch": 1161} {"train_loss": -11.837145805358887, "global_step": 195142, "epoch": 1161} {"train_loss": -11.607925415039062, "global_step": 195143, "epoch": 1161} {"train_loss": -11.683747291564941, "global_step": 195144, "epoch": 1161} {"train_loss": -11.466087341308594, "global_step": 195145, "epoch": 1161} {"train_loss": -11.793829917907715, "global_step": 195146, "epoch": 1161} {"train_loss": -11.020417213439941, "global_step": 195147, "epoch": 1161} {"train_loss": -10.202312469482422, "global_step": 195148, "epoch": 1161} {"train_loss": -9.081348419189453, "global_step": 195149, "epoch": 1161} {"train_loss": -10.98962688446045, "global_step": 195150, "epoch": 1161} {"train_loss": -11.379611015319824, "global_step": 195151, "epoch": 1161} {"train_loss": -8.88205337524414, "global_step": 195152, "epoch": 1161} {"train_loss": -9.295330047607422, "global_step": 195153, "epoch": 1161} {"train_loss": -10.805013656616211, "global_step": 195154, "epoch": 1161} {"train_loss": -8.429327011108398, "global_step": 195155, "epoch": 1161} {"train_loss": -7.5302324295043945, "global_step": 195156, "epoch": 1161} {"train_loss": -9.56482982635498, "global_step": 195157, "epoch": 1161} {"train_loss": -8.182232856750488, "global_step": 195158, "epoch": 1161} {"train_loss": -6.27828311920166, "global_step": 195159, "epoch": 1161} {"train_loss": -5.766692161560059, "global_step": 195160, "epoch": 1161} {"train_loss": -7.259024620056152, "global_step": 195161, "epoch": 1161} {"train_loss": -7.683404922485352, "global_step": 195162, "epoch": 1161} {"train_loss": -7.794007301330566, "global_step": 195163, "epoch": 1161} {"train_loss": -8.09012222290039, "global_step": 195164, "epoch": 1161} {"train_loss": -9.201562881469727, "global_step": 195165, "epoch": 1161} {"train_loss": -9.020208358764648, "global_step": 195166, "epoch": 1161} {"train_loss": -10.03145980834961, "global_step": 195167, "epoch": 1161} {"train_loss": -9.334949493408203, "global_step": 195168, "epoch": 1161} {"train_loss": -9.710136413574219, "global_step": 195169, "epoch": 1161} {"train_loss": -9.895126342773438, "global_step": 195170, "epoch": 1161} {"train_loss": -10.0955171585083, "global_step": 195171, "epoch": 1161} {"train_loss": -10.18516731262207, "global_step": 195172, "epoch": 1161} {"train_loss": -9.780033111572266, "global_step": 195173, "epoch": 1161} {"train_loss": -10.239521026611328, "global_step": 195174, "epoch": 1161} {"train_loss": -9.59759521484375, "global_step": 195175, "epoch": 1161} {"train_loss": -10.106846809387207, "global_step": 195176, "epoch": 1161} {"train_loss": -10.894325256347656, "global_step": 195177, "epoch": 1161} {"train_loss": -10.159322738647461, "global_step": 195178, "epoch": 1161} {"train_loss": -10.647871017456055, "global_step": 195179, "epoch": 1161} {"train_loss": -10.410168647766113, "global_step": 195180, "epoch": 1161} {"train_loss": -10.54699993133545, "global_step": 195181, "epoch": 1161} {"train_loss": -10.948596954345703, "global_step": 195182, "epoch": 1161} {"train_loss": -10.633393287658691, "global_step": 195183, "epoch": 1161} {"train_loss": -10.67536735534668, "global_step": 195184, "epoch": 1161} {"train_loss": -10.8652925491333, "global_step": 195185, "epoch": 1161} {"train_loss": -10.763164520263672, "global_step": 195186, "epoch": 1161} {"train_loss": -10.875760078430176, "global_step": 195187, "epoch": 1161} {"train_loss": -11.050263404846191, "global_step": 195188, "epoch": 1161} {"train_loss": -10.92599868774414, "global_step": 195189, "epoch": 1161} {"train_loss": -10.8839111328125, "global_step": 195190, "epoch": 1161} {"train_loss": -11.107369422912598, "global_step": 195191, "epoch": 1161} {"train_loss": -10.77346134185791, "global_step": 195192, "epoch": 1161} {"train_loss": -11.135340690612793, "global_step": 195193, "epoch": 1161} {"train_loss": -10.970134735107422, "global_step": 195194, "epoch": 1161} {"train_loss": -10.870582580566406, "global_step": 195195, "epoch": 1161} {"train_loss": -11.353540420532227, "global_step": 195196, "epoch": 1161} {"train_loss": -11.058938980102539, "global_step": 195197, "epoch": 1161} {"train_loss": -10.919474601745605, "global_step": 195198, "epoch": 1161} {"train_loss": -11.215402603149414, "global_step": 195199, "epoch": 1161} {"train_loss": -10.971700668334961, "global_step": 195200, "epoch": 1161} {"train_loss": -11.102008819580078, "global_step": 195201, "epoch": 1161} {"train_loss": -11.289159774780273, "global_step": 195202, "epoch": 1161} {"train_loss": -11.176254272460938, "global_step": 195203, "epoch": 1161} {"train_loss": -11.11172103881836, "global_step": 195204, "epoch": 1161} {"train_loss": -11.29797649383545, "global_step": 195205, "epoch": 1161} {"train_loss": -11.048362731933594, "global_step": 195206, "epoch": 1161} {"train_loss": -11.294937133789062, "global_step": 195207, "epoch": 1161} {"train_loss": -11.340818405151367, "global_step": 195208, "epoch": 1161} {"train_loss": -11.26788330078125, "global_step": 195209, "epoch": 1161} {"train_loss": -11.407585144042969, "global_step": 195210, "epoch": 1161} {"train_loss": -11.20974349975586, "global_step": 195211, "epoch": 1161} {"train_loss": -11.41303825378418, "global_step": 195212, "epoch": 1161} {"train_loss": -11.312507629394531, "global_step": 195213, "epoch": 1161} {"train_loss": -11.488394737243652, "global_step": 195214, "epoch": 1161} {"train_loss": -10.744855318750654, "global_step": 195215, "epoch": 1161, "val_loss": 240320.359375} {"train_loss": -11.616854667663574, "global_step": 195216, "epoch": 1162} {"train_loss": -11.27481460571289, "global_step": 195217, "epoch": 1162} {"train_loss": -11.31854248046875, "global_step": 195218, "epoch": 1162} {"train_loss": -11.379172325134277, "global_step": 195219, "epoch": 1162} {"train_loss": -11.353958129882812, "global_step": 195220, "epoch": 1162} {"train_loss": -11.28011703491211, "global_step": 195221, "epoch": 1162} {"train_loss": -11.394468307495117, "global_step": 195222, "epoch": 1162} {"train_loss": -11.599833488464355, "global_step": 195223, "epoch": 1162} {"train_loss": -11.382765769958496, "global_step": 195224, "epoch": 1162} {"train_loss": -11.442874908447266, "global_step": 195225, "epoch": 1162} {"train_loss": -11.615047454833984, "global_step": 195226, "epoch": 1162} {"train_loss": -11.576906204223633, "global_step": 195227, "epoch": 1162} {"train_loss": -11.301257133483887, "global_step": 195228, "epoch": 1162} {"train_loss": -11.6497163772583, "global_step": 195229, "epoch": 1162} {"train_loss": -11.598987579345703, "global_step": 195230, "epoch": 1162} {"train_loss": -11.533794403076172, "global_step": 195231, "epoch": 1162} {"train_loss": -11.403494834899902, "global_step": 195232, "epoch": 1162} {"train_loss": -11.702576637268066, "global_step": 195233, "epoch": 1162} {"train_loss": -11.6627779006958, "global_step": 195234, "epoch": 1162} {"train_loss": -11.11113166809082, "global_step": 195235, "epoch": 1162} {"train_loss": -11.764778137207031, "global_step": 195236, "epoch": 1162} {"train_loss": -11.405328750610352, "global_step": 195237, "epoch": 1162} {"train_loss": -11.599108695983887, "global_step": 195238, "epoch": 1162} {"train_loss": -11.592706680297852, "global_step": 195239, "epoch": 1162} {"train_loss": -11.39554500579834, "global_step": 195240, "epoch": 1162} {"train_loss": -11.194570541381836, "global_step": 195241, "epoch": 1162} {"train_loss": -11.482357025146484, "global_step": 195242, "epoch": 1162} {"train_loss": -11.378303527832031, "global_step": 195243, "epoch": 1162} {"train_loss": -11.444904327392578, "global_step": 195244, "epoch": 1162} {"train_loss": -11.491070747375488, "global_step": 195245, "epoch": 1162} {"train_loss": -11.524833679199219, "global_step": 195246, "epoch": 1162} {"train_loss": -11.444129943847656, "global_step": 195247, "epoch": 1162} {"train_loss": -11.588603973388672, "global_step": 195248, "epoch": 1162} {"train_loss": -11.64328670501709, "global_step": 195249, "epoch": 1162} {"train_loss": -11.447343826293945, "global_step": 195250, "epoch": 1162} {"train_loss": -11.31392765045166, "global_step": 195251, "epoch": 1162} {"train_loss": -11.454526901245117, "global_step": 195252, "epoch": 1162} {"train_loss": -11.632024765014648, "global_step": 195253, "epoch": 1162} {"train_loss": -11.833267211914062, "global_step": 195254, "epoch": 1162} {"train_loss": -11.212556838989258, "global_step": 195255, "epoch": 1162} {"train_loss": -11.688884735107422, "global_step": 195256, "epoch": 1162} {"train_loss": -11.511407852172852, "global_step": 195257, "epoch": 1162} {"train_loss": -10.780202865600586, "global_step": 195258, "epoch": 1162} {"train_loss": -9.299304008483887, "global_step": 195259, "epoch": 1162} {"train_loss": -10.177144050598145, "global_step": 195260, "epoch": 1162} {"train_loss": -11.439568519592285, "global_step": 195261, "epoch": 1162} {"train_loss": -9.773446083068848, "global_step": 195262, "epoch": 1162} {"train_loss": -10.25572395324707, "global_step": 195263, "epoch": 1162} {"train_loss": -11.341028213500977, "global_step": 195264, "epoch": 1162} {"train_loss": -8.51982307434082, "global_step": 195265, "epoch": 1162} {"train_loss": -9.136406898498535, "global_step": 195266, "epoch": 1162} {"train_loss": -11.043312072753906, "global_step": 195267, "epoch": 1162} {"train_loss": -9.168719291687012, "global_step": 195268, "epoch": 1162} {"train_loss": -10.307997703552246, "global_step": 195269, "epoch": 1162} {"train_loss": -9.963748931884766, "global_step": 195270, "epoch": 1162} {"train_loss": -10.751571655273438, "global_step": 195271, "epoch": 1162} {"train_loss": -10.745006561279297, "global_step": 195272, "epoch": 1162} {"train_loss": -10.286413192749023, "global_step": 195273, "epoch": 1162} {"train_loss": -10.95936107635498, "global_step": 195274, "epoch": 1162} {"train_loss": -10.616470336914062, "global_step": 195275, "epoch": 1162} {"train_loss": -10.8687105178833, "global_step": 195276, "epoch": 1162} {"train_loss": -11.06330680847168, "global_step": 195277, "epoch": 1162} {"train_loss": -10.933270454406738, "global_step": 195278, "epoch": 1162} {"train_loss": -11.07828140258789, "global_step": 195279, "epoch": 1162} {"train_loss": -10.89925765991211, "global_step": 195280, "epoch": 1162} {"train_loss": -11.131141662597656, "global_step": 195281, "epoch": 1162} {"train_loss": -10.94865608215332, "global_step": 195282, "epoch": 1162} {"train_loss": -10.973189353942871, "global_step": 195283, "epoch": 1162} {"train_loss": -11.008810997009277, "global_step": 195284, "epoch": 1162} {"train_loss": -10.95169448852539, "global_step": 195285, "epoch": 1162} {"train_loss": -10.979005813598633, "global_step": 195286, "epoch": 1162} {"train_loss": -11.022674560546875, "global_step": 195287, "epoch": 1162} {"train_loss": -10.837348937988281, "global_step": 195288, "epoch": 1162} {"train_loss": -11.023460388183594, "global_step": 195289, "epoch": 1162} {"train_loss": -10.813751220703125, "global_step": 195290, "epoch": 1162} {"train_loss": -10.70322036743164, "global_step": 195291, "epoch": 1162} {"train_loss": -10.734724044799805, "global_step": 195292, "epoch": 1162} {"train_loss": -10.702337265014648, "global_step": 195293, "epoch": 1162} {"train_loss": -10.946407318115234, "global_step": 195294, "epoch": 1162} {"train_loss": -11.085009574890137, "global_step": 195295, "epoch": 1162} {"train_loss": -10.597488403320312, "global_step": 195296, "epoch": 1162} {"train_loss": -11.176109313964844, "global_step": 195297, "epoch": 1162} {"train_loss": -10.502922058105469, "global_step": 195298, "epoch": 1162} {"train_loss": -11.206649780273438, "global_step": 195299, "epoch": 1162} {"train_loss": -10.416860580444336, "global_step": 195300, "epoch": 1162} {"train_loss": -11.103224754333496, "global_step": 195301, "epoch": 1162} {"train_loss": -10.603246688842773, "global_step": 195302, "epoch": 1162} {"train_loss": -11.030593872070312, "global_step": 195303, "epoch": 1162} {"train_loss": -10.870895385742188, "global_step": 195304, "epoch": 1162} {"train_loss": -11.21211051940918, "global_step": 195305, "epoch": 1162} {"train_loss": -11.080541610717773, "global_step": 195306, "epoch": 1162} {"train_loss": -11.337968826293945, "global_step": 195307, "epoch": 1162} {"train_loss": -11.077618598937988, "global_step": 195308, "epoch": 1162} {"train_loss": -11.181018829345703, "global_step": 195309, "epoch": 1162} {"train_loss": -11.433121681213379, "global_step": 195310, "epoch": 1162} {"train_loss": -11.121116638183594, "global_step": 195311, "epoch": 1162} {"train_loss": -11.290290832519531, "global_step": 195312, "epoch": 1162} {"train_loss": -11.311483383178711, "global_step": 195313, "epoch": 1162} {"train_loss": -11.377427101135254, "global_step": 195314, "epoch": 1162} {"train_loss": -11.509759902954102, "global_step": 195315, "epoch": 1162} {"train_loss": -11.58030891418457, "global_step": 195316, "epoch": 1162} {"train_loss": -11.084159851074219, "global_step": 195317, "epoch": 1162} {"train_loss": -11.25883674621582, "global_step": 195318, "epoch": 1162} {"train_loss": -11.403152465820312, "global_step": 195319, "epoch": 1162} {"train_loss": -11.164843559265137, "global_step": 195320, "epoch": 1162} {"train_loss": -11.431502342224121, "global_step": 195321, "epoch": 1162} {"train_loss": -11.284404754638672, "global_step": 195322, "epoch": 1162} {"train_loss": -11.302845001220703, "global_step": 195323, "epoch": 1162} {"train_loss": -11.294301986694336, "global_step": 195324, "epoch": 1162} {"train_loss": -11.339354515075684, "global_step": 195325, "epoch": 1162} {"train_loss": -11.567712783813477, "global_step": 195326, "epoch": 1162} {"train_loss": -11.378935813903809, "global_step": 195327, "epoch": 1162} {"train_loss": -11.715086936950684, "global_step": 195328, "epoch": 1162} {"train_loss": -11.455039978027344, "global_step": 195329, "epoch": 1162} {"train_loss": -11.388367652893066, "global_step": 195330, "epoch": 1162} {"train_loss": -11.485578536987305, "global_step": 195331, "epoch": 1162} {"train_loss": -11.736425399780273, "global_step": 195332, "epoch": 1162} {"train_loss": -11.471637725830078, "global_step": 195333, "epoch": 1162} {"train_loss": -11.33598804473877, "global_step": 195334, "epoch": 1162} {"train_loss": -11.473199844360352, "global_step": 195335, "epoch": 1162} {"train_loss": -11.617414474487305, "global_step": 195336, "epoch": 1162} {"train_loss": -11.61160945892334, "global_step": 195337, "epoch": 1162} {"train_loss": -11.415295600891113, "global_step": 195338, "epoch": 1162} {"train_loss": -11.70037841796875, "global_step": 195339, "epoch": 1162} {"train_loss": -11.416788101196289, "global_step": 195340, "epoch": 1162} {"train_loss": -11.417877197265625, "global_step": 195341, "epoch": 1162} {"train_loss": -11.775662422180176, "global_step": 195342, "epoch": 1162} {"train_loss": -11.4229736328125, "global_step": 195343, "epoch": 1162} {"train_loss": -11.610517501831055, "global_step": 195344, "epoch": 1162} {"train_loss": -11.464710235595703, "global_step": 195345, "epoch": 1162} {"train_loss": -11.689266204833984, "global_step": 195346, "epoch": 1162} {"train_loss": -11.559389114379883, "global_step": 195347, "epoch": 1162} {"train_loss": -11.687832832336426, "global_step": 195348, "epoch": 1162} {"train_loss": -11.744958877563477, "global_step": 195349, "epoch": 1162} {"train_loss": -11.667142868041992, "global_step": 195350, "epoch": 1162} {"train_loss": -11.709236145019531, "global_step": 195351, "epoch": 1162} {"train_loss": -11.570724487304688, "global_step": 195352, "epoch": 1162} {"train_loss": -11.52159309387207, "global_step": 195353, "epoch": 1162} {"train_loss": -11.602584838867188, "global_step": 195354, "epoch": 1162} {"train_loss": -11.752228736877441, "global_step": 195355, "epoch": 1162} {"train_loss": -11.898534774780273, "global_step": 195356, "epoch": 1162} {"train_loss": -11.94636058807373, "global_step": 195357, "epoch": 1162} {"train_loss": -11.884377479553223, "global_step": 195358, "epoch": 1162} {"train_loss": -11.658761978149414, "global_step": 195359, "epoch": 1162} {"train_loss": -11.659433364868164, "global_step": 195360, "epoch": 1162} {"train_loss": -11.846494674682617, "global_step": 195361, "epoch": 1162} {"train_loss": -11.472457885742188, "global_step": 195362, "epoch": 1162} {"train_loss": -11.893795013427734, "global_step": 195363, "epoch": 1162} {"train_loss": -11.755895614624023, "global_step": 195364, "epoch": 1162} {"train_loss": -11.692609786987305, "global_step": 195365, "epoch": 1162} {"train_loss": -11.692228317260742, "global_step": 195366, "epoch": 1162} {"train_loss": -11.755865097045898, "global_step": 195367, "epoch": 1162} {"train_loss": -11.40927505493164, "global_step": 195368, "epoch": 1162} {"train_loss": -11.491598129272461, "global_step": 195369, "epoch": 1162} {"train_loss": -11.120838165283203, "global_step": 195370, "epoch": 1162} {"train_loss": -11.73203182220459, "global_step": 195371, "epoch": 1162} {"train_loss": -11.4830904006958, "global_step": 195372, "epoch": 1162} {"train_loss": -11.085431098937988, "global_step": 195373, "epoch": 1162} {"train_loss": -10.402462005615234, "global_step": 195374, "epoch": 1162} {"train_loss": -11.232685089111328, "global_step": 195375, "epoch": 1162} {"train_loss": -11.519168853759766, "global_step": 195376, "epoch": 1162} {"train_loss": -11.419672966003418, "global_step": 195377, "epoch": 1162} {"train_loss": -10.631388664245605, "global_step": 195378, "epoch": 1162} {"train_loss": -11.139884948730469, "global_step": 195379, "epoch": 1162} {"train_loss": -10.769726753234863, "global_step": 195380, "epoch": 1162} {"train_loss": -11.040499687194824, "global_step": 195381, "epoch": 1162} {"train_loss": -10.677448272705078, "global_step": 195382, "epoch": 1162} {"train_loss": -11.231026587032137, "global_step": 195383, "epoch": 1162, "val_loss": 247338.21875} {"train_loss": -10.906363487243652, "global_step": 195384, "epoch": 1163} {"train_loss": -11.042535781860352, "global_step": 195385, "epoch": 1163} {"train_loss": -10.396570205688477, "global_step": 195386, "epoch": 1163} {"train_loss": -11.171941757202148, "global_step": 195387, "epoch": 1163} {"train_loss": -9.93048095703125, "global_step": 195388, "epoch": 1163} {"train_loss": -9.44659423828125, "global_step": 195389, "epoch": 1163} {"train_loss": -10.696128845214844, "global_step": 195390, "epoch": 1163} {"train_loss": -9.301000595092773, "global_step": 195391, "epoch": 1163} {"train_loss": -8.81610107421875, "global_step": 195392, "epoch": 1163} {"train_loss": -9.985697746276855, "global_step": 195393, "epoch": 1163} {"train_loss": -10.647064208984375, "global_step": 195394, "epoch": 1163} {"train_loss": -9.78987979888916, "global_step": 195395, "epoch": 1163} {"train_loss": -10.832058906555176, "global_step": 195396, "epoch": 1163} {"train_loss": -9.351875305175781, "global_step": 195397, "epoch": 1163} {"train_loss": -9.978364944458008, "global_step": 195398, "epoch": 1163} {"train_loss": -9.754776000976562, "global_step": 195399, "epoch": 1163} {"train_loss": -9.92673110961914, "global_step": 195400, "epoch": 1163} {"train_loss": -9.2853422164917, "global_step": 195401, "epoch": 1163} {"train_loss": -9.660189628601074, "global_step": 195402, "epoch": 1163} {"train_loss": -10.506523132324219, "global_step": 195403, "epoch": 1163} {"train_loss": -10.145434379577637, "global_step": 195404, "epoch": 1163} {"train_loss": -10.04916763305664, "global_step": 195405, "epoch": 1163} {"train_loss": -10.449963569641113, "global_step": 195406, "epoch": 1163} {"train_loss": -10.379039764404297, "global_step": 195407, "epoch": 1163} {"train_loss": -10.767255783081055, "global_step": 195408, "epoch": 1163} {"train_loss": -10.830997467041016, "global_step": 195409, "epoch": 1163} {"train_loss": -10.849564552307129, "global_step": 195410, "epoch": 1163} {"train_loss": -11.101299285888672, "global_step": 195411, "epoch": 1163} {"train_loss": -10.95201301574707, "global_step": 195412, "epoch": 1163} {"train_loss": -10.85952377319336, "global_step": 195413, "epoch": 1163} {"train_loss": -10.876554489135742, "global_step": 195414, "epoch": 1163} {"train_loss": -11.135676383972168, "global_step": 195415, "epoch": 1163} {"train_loss": -10.605246543884277, "global_step": 195416, "epoch": 1163} {"train_loss": -10.836698532104492, "global_step": 195417, "epoch": 1163} {"train_loss": -10.878071784973145, "global_step": 195418, "epoch": 1163} {"train_loss": -10.831445693969727, "global_step": 195419, "epoch": 1163} {"train_loss": -10.962692260742188, "global_step": 195420, "epoch": 1163} {"train_loss": -10.917157173156738, "global_step": 195421, "epoch": 1163} {"train_loss": -10.831262588500977, "global_step": 195422, "epoch": 1163} {"train_loss": -10.806462287902832, "global_step": 195423, "epoch": 1163} {"train_loss": -10.9649076461792, "global_step": 195424, "epoch": 1163} {"train_loss": -11.166877746582031, "global_step": 195425, "epoch": 1163} {"train_loss": -11.178342819213867, "global_step": 195426, "epoch": 1163} {"train_loss": -10.935436248779297, "global_step": 195427, "epoch": 1163} {"train_loss": -11.131678581237793, "global_step": 195428, "epoch": 1163} {"train_loss": -11.150339126586914, "global_step": 195429, "epoch": 1163} {"train_loss": -11.20695972442627, "global_step": 195430, "epoch": 1163} {"train_loss": -11.024224281311035, "global_step": 195431, "epoch": 1163} {"train_loss": -11.134557723999023, "global_step": 195432, "epoch": 1163} {"train_loss": -10.837005615234375, "global_step": 195433, "epoch": 1163} {"train_loss": -11.090787887573242, "global_step": 195434, "epoch": 1163} {"train_loss": -11.169894218444824, "global_step": 195435, "epoch": 1163} {"train_loss": -11.024800300598145, "global_step": 195436, "epoch": 1163} {"train_loss": -11.340438842773438, "global_step": 195437, "epoch": 1163} {"train_loss": -10.954675674438477, "global_step": 195438, "epoch": 1163} {"train_loss": -11.277843475341797, "global_step": 195439, "epoch": 1163} {"train_loss": -11.095030784606934, "global_step": 195440, "epoch": 1163} {"train_loss": -11.179251670837402, "global_step": 195441, "epoch": 1163} {"train_loss": -11.293814659118652, "global_step": 195442, "epoch": 1163} {"train_loss": -11.260787963867188, "global_step": 195443, "epoch": 1163} {"train_loss": -11.025163650512695, "global_step": 195444, "epoch": 1163} {"train_loss": -11.011159896850586, "global_step": 195445, "epoch": 1163} {"train_loss": -11.438905715942383, "global_step": 195446, "epoch": 1163} {"train_loss": -11.261741638183594, "global_step": 195447, "epoch": 1163} {"train_loss": -11.340103149414062, "global_step": 195448, "epoch": 1163} {"train_loss": -11.36396312713623, "global_step": 195449, "epoch": 1163} {"train_loss": -11.201739311218262, "global_step": 195450, "epoch": 1163} {"train_loss": -11.482105255126953, "global_step": 195451, "epoch": 1163} {"train_loss": -11.445120811462402, "global_step": 195452, "epoch": 1163} {"train_loss": -11.158140182495117, "global_step": 195453, "epoch": 1163} {"train_loss": -11.187156677246094, "global_step": 195454, "epoch": 1163} {"train_loss": -11.26028823852539, "global_step": 195455, "epoch": 1163} {"train_loss": -10.850143432617188, "global_step": 195456, "epoch": 1163} {"train_loss": -11.268841743469238, "global_step": 195457, "epoch": 1163} {"train_loss": -10.841970443725586, "global_step": 195458, "epoch": 1163} {"train_loss": -11.277669906616211, "global_step": 195459, "epoch": 1163} {"train_loss": -11.023726463317871, "global_step": 195460, "epoch": 1163} {"train_loss": -11.13434886932373, "global_step": 195461, "epoch": 1163} {"train_loss": -10.935256958007812, "global_step": 195462, "epoch": 1163} {"train_loss": -11.32998275756836, "global_step": 195463, "epoch": 1163} {"train_loss": -10.520675659179688, "global_step": 195464, "epoch": 1163} {"train_loss": -11.393839836120605, "global_step": 195465, "epoch": 1163} {"train_loss": -10.639729499816895, "global_step": 195466, "epoch": 1163} {"train_loss": -11.218245506286621, "global_step": 195467, "epoch": 1163} {"train_loss": -11.034747123718262, "global_step": 195468, "epoch": 1163} {"train_loss": -11.326872825622559, "global_step": 195469, "epoch": 1163} {"train_loss": -10.771638870239258, "global_step": 195470, "epoch": 1163} {"train_loss": -11.628145217895508, "global_step": 195471, "epoch": 1163} {"train_loss": -10.866961479187012, "global_step": 195472, "epoch": 1163} {"train_loss": -11.386723518371582, "global_step": 195473, "epoch": 1163} {"train_loss": -10.629034042358398, "global_step": 195474, "epoch": 1163} {"train_loss": -11.291439056396484, "global_step": 195475, "epoch": 1163} {"train_loss": -10.922977447509766, "global_step": 195476, "epoch": 1163} {"train_loss": -11.485048294067383, "global_step": 195477, "epoch": 1163} {"train_loss": -11.032012939453125, "global_step": 195478, "epoch": 1163} {"train_loss": -11.582443237304688, "global_step": 195479, "epoch": 1163} {"train_loss": -11.357220649719238, "global_step": 195480, "epoch": 1163} {"train_loss": -11.463817596435547, "global_step": 195481, "epoch": 1163} {"train_loss": -11.458135604858398, "global_step": 195482, "epoch": 1163} {"train_loss": -11.452362060546875, "global_step": 195483, "epoch": 1163} {"train_loss": -11.769351959228516, "global_step": 195484, "epoch": 1163} {"train_loss": -11.624069213867188, "global_step": 195485, "epoch": 1163} {"train_loss": -11.534276962280273, "global_step": 195486, "epoch": 1163} {"train_loss": -11.722030639648438, "global_step": 195487, "epoch": 1163} {"train_loss": -11.45652961730957, "global_step": 195488, "epoch": 1163} {"train_loss": -11.700340270996094, "global_step": 195489, "epoch": 1163} {"train_loss": -11.742303848266602, "global_step": 195490, "epoch": 1163} {"train_loss": -11.525951385498047, "global_step": 195491, "epoch": 1163} {"train_loss": -11.676929473876953, "global_step": 195492, "epoch": 1163} {"train_loss": -11.568672180175781, "global_step": 195493, "epoch": 1163} {"train_loss": -11.557802200317383, "global_step": 195494, "epoch": 1163} {"train_loss": -11.743852615356445, "global_step": 195495, "epoch": 1163} {"train_loss": -11.342126846313477, "global_step": 195496, "epoch": 1163} {"train_loss": -11.86677360534668, "global_step": 195497, "epoch": 1163} {"train_loss": -11.397557258605957, "global_step": 195498, "epoch": 1163} {"train_loss": -11.170049667358398, "global_step": 195499, "epoch": 1163} {"train_loss": -11.53802490234375, "global_step": 195500, "epoch": 1163} {"train_loss": -11.605583190917969, "global_step": 195501, "epoch": 1163} {"train_loss": -11.524356842041016, "global_step": 195502, "epoch": 1163} {"train_loss": -11.31057357788086, "global_step": 195503, "epoch": 1163} {"train_loss": -11.51034927368164, "global_step": 195504, "epoch": 1163} {"train_loss": -11.74134349822998, "global_step": 195505, "epoch": 1163} {"train_loss": -11.604247093200684, "global_step": 195506, "epoch": 1163} {"train_loss": -11.74388313293457, "global_step": 195507, "epoch": 1163} {"train_loss": -11.624489784240723, "global_step": 195508, "epoch": 1163} {"train_loss": -11.717944145202637, "global_step": 195509, "epoch": 1163} {"train_loss": -11.728260040283203, "global_step": 195510, "epoch": 1163} {"train_loss": -11.483564376831055, "global_step": 195511, "epoch": 1163} {"train_loss": -11.662696838378906, "global_step": 195512, "epoch": 1163} {"train_loss": -11.159279823303223, "global_step": 195513, "epoch": 1163} {"train_loss": -11.41971492767334, "global_step": 195514, "epoch": 1163} {"train_loss": -11.463499069213867, "global_step": 195515, "epoch": 1163} {"train_loss": -11.676570892333984, "global_step": 195516, "epoch": 1163} {"train_loss": -11.762245178222656, "global_step": 195517, "epoch": 1163} {"train_loss": -11.66240406036377, "global_step": 195518, "epoch": 1163} {"train_loss": -11.705808639526367, "global_step": 195519, "epoch": 1163} {"train_loss": -11.675789833068848, "global_step": 195520, "epoch": 1163} {"train_loss": -11.622842788696289, "global_step": 195521, "epoch": 1163} {"train_loss": -11.59260082244873, "global_step": 195522, "epoch": 1163} {"train_loss": -10.682663917541504, "global_step": 195523, "epoch": 1163} {"train_loss": -10.976541519165039, "global_step": 195524, "epoch": 1163} {"train_loss": -11.714962005615234, "global_step": 195525, "epoch": 1163} {"train_loss": -10.813772201538086, "global_step": 195526, "epoch": 1163} {"train_loss": -10.040916442871094, "global_step": 195527, "epoch": 1163} {"train_loss": -10.99950122833252, "global_step": 195528, "epoch": 1163} {"train_loss": -10.974051475524902, "global_step": 195529, "epoch": 1163} {"train_loss": -10.714738845825195, "global_step": 195530, "epoch": 1163} {"train_loss": -9.799449920654297, "global_step": 195531, "epoch": 1163} {"train_loss": -10.999414443969727, "global_step": 195532, "epoch": 1163} {"train_loss": -10.672739028930664, "global_step": 195533, "epoch": 1163} {"train_loss": -10.471210479736328, "global_step": 195534, "epoch": 1163} {"train_loss": -11.232330322265625, "global_step": 195535, "epoch": 1163} {"train_loss": -10.703397750854492, "global_step": 195536, "epoch": 1163} {"train_loss": -10.648918151855469, "global_step": 195537, "epoch": 1163} {"train_loss": -11.013568878173828, "global_step": 195538, "epoch": 1163} {"train_loss": -10.76437759399414, "global_step": 195539, "epoch": 1163} {"train_loss": -11.179960250854492, "global_step": 195540, "epoch": 1163} {"train_loss": -11.274581909179688, "global_step": 195541, "epoch": 1163} {"train_loss": -11.00306224822998, "global_step": 195542, "epoch": 1163} {"train_loss": -11.395506858825684, "global_step": 195543, "epoch": 1163} {"train_loss": -10.597036361694336, "global_step": 195544, "epoch": 1163} {"train_loss": -10.4034423828125, "global_step": 195545, "epoch": 1163} {"train_loss": -11.113248825073242, "global_step": 195546, "epoch": 1163} {"train_loss": -10.41766357421875, "global_step": 195547, "epoch": 1163} {"train_loss": -11.256082534790039, "global_step": 195548, "epoch": 1163} {"train_loss": -10.217010498046875, "global_step": 195549, "epoch": 1163} {"train_loss": -10.718015670776367, "global_step": 195550, "epoch": 1163} {"train_loss": -11.022944881802513, "global_step": 195551, "epoch": 1163, "val_loss": 250070.578125} {"train_loss": -11.27713394165039, "global_step": 195552, "epoch": 1164} {"train_loss": -11.30744743347168, "global_step": 195553, "epoch": 1164} {"train_loss": -11.36298942565918, "global_step": 195554, "epoch": 1164} {"train_loss": -11.298951148986816, "global_step": 195555, "epoch": 1164} {"train_loss": -11.401387214660645, "global_step": 195556, "epoch": 1164} {"train_loss": -11.482943534851074, "global_step": 195557, "epoch": 1164} {"train_loss": -11.33144760131836, "global_step": 195558, "epoch": 1164} {"train_loss": -11.118387222290039, "global_step": 195559, "epoch": 1164} {"train_loss": -11.418073654174805, "global_step": 195560, "epoch": 1164} {"train_loss": -11.427783966064453, "global_step": 195561, "epoch": 1164} {"train_loss": -11.390837669372559, "global_step": 195562, "epoch": 1164} {"train_loss": -11.486883163452148, "global_step": 195563, "epoch": 1164} {"train_loss": -11.512066841125488, "global_step": 195564, "epoch": 1164} {"train_loss": -11.191408157348633, "global_step": 195565, "epoch": 1164} {"train_loss": -11.454143524169922, "global_step": 195566, "epoch": 1164} {"train_loss": -11.51300048828125, "global_step": 195567, "epoch": 1164} {"train_loss": -11.649259567260742, "global_step": 195568, "epoch": 1164} {"train_loss": -11.42075252532959, "global_step": 195569, "epoch": 1164} {"train_loss": -11.480031967163086, "global_step": 195570, "epoch": 1164} {"train_loss": -11.627485275268555, "global_step": 195571, "epoch": 1164} {"train_loss": -11.601163864135742, "global_step": 195572, "epoch": 1164} {"train_loss": -11.534326553344727, "global_step": 195573, "epoch": 1164} {"train_loss": -11.64967155456543, "global_step": 195574, "epoch": 1164} {"train_loss": -11.571882247924805, "global_step": 195575, "epoch": 1164} {"train_loss": -11.698080062866211, "global_step": 195576, "epoch": 1164} {"train_loss": -11.361343383789062, "global_step": 195577, "epoch": 1164} {"train_loss": -11.628684043884277, "global_step": 195578, "epoch": 1164} {"train_loss": -11.569205284118652, "global_step": 195579, "epoch": 1164} {"train_loss": -11.313627243041992, "global_step": 195580, "epoch": 1164} {"train_loss": -11.739459991455078, "global_step": 195581, "epoch": 1164} {"train_loss": -11.545964241027832, "global_step": 195582, "epoch": 1164} {"train_loss": -11.227872848510742, "global_step": 195583, "epoch": 1164} {"train_loss": -11.482792854309082, "global_step": 195584, "epoch": 1164} {"train_loss": -11.540023803710938, "global_step": 195585, "epoch": 1164} {"train_loss": -11.582746505737305, "global_step": 195586, "epoch": 1164} {"train_loss": -11.291261672973633, "global_step": 195587, "epoch": 1164} {"train_loss": -10.9652738571167, "global_step": 195588, "epoch": 1164} {"train_loss": -10.915260314941406, "global_step": 195589, "epoch": 1164} {"train_loss": -11.51043701171875, "global_step": 195590, "epoch": 1164} {"train_loss": -11.180354118347168, "global_step": 195591, "epoch": 1164} {"train_loss": -11.125763893127441, "global_step": 195592, "epoch": 1164} {"train_loss": -10.779036521911621, "global_step": 195593, "epoch": 1164} {"train_loss": -10.579458236694336, "global_step": 195594, "epoch": 1164} {"train_loss": -10.67466926574707, "global_step": 195595, "epoch": 1164} {"train_loss": -10.669900894165039, "global_step": 195596, "epoch": 1164} {"train_loss": -11.361936569213867, "global_step": 195597, "epoch": 1164} {"train_loss": -10.75619125366211, "global_step": 195598, "epoch": 1164} {"train_loss": -11.107349395751953, "global_step": 195599, "epoch": 1164} {"train_loss": -11.2933931350708, "global_step": 195600, "epoch": 1164} {"train_loss": -10.923003196716309, "global_step": 195601, "epoch": 1164} {"train_loss": -11.532916069030762, "global_step": 195602, "epoch": 1164} {"train_loss": -11.102701187133789, "global_step": 195603, "epoch": 1164} {"train_loss": -11.366418838500977, "global_step": 195604, "epoch": 1164} {"train_loss": -11.399080276489258, "global_step": 195605, "epoch": 1164} {"train_loss": -11.462923049926758, "global_step": 195606, "epoch": 1164} {"train_loss": -11.26577377319336, "global_step": 195607, "epoch": 1164} {"train_loss": -11.231292724609375, "global_step": 195608, "epoch": 1164} {"train_loss": -11.508768081665039, "global_step": 195609, "epoch": 1164} {"train_loss": -11.221067428588867, "global_step": 195610, "epoch": 1164} {"train_loss": -11.163437843322754, "global_step": 195611, "epoch": 1164} {"train_loss": -11.421964645385742, "global_step": 195612, "epoch": 1164} {"train_loss": -11.368185043334961, "global_step": 195613, "epoch": 1164} {"train_loss": -11.527207374572754, "global_step": 195614, "epoch": 1164} {"train_loss": -11.496935844421387, "global_step": 195615, "epoch": 1164} {"train_loss": -11.725531578063965, "global_step": 195616, "epoch": 1164} {"train_loss": -11.229142189025879, "global_step": 195617, "epoch": 1164} {"train_loss": -11.629728317260742, "global_step": 195618, "epoch": 1164} {"train_loss": -11.284026145935059, "global_step": 195619, "epoch": 1164} {"train_loss": -11.530607223510742, "global_step": 195620, "epoch": 1164} {"train_loss": -11.473406791687012, "global_step": 195621, "epoch": 1164} {"train_loss": -11.549986839294434, "global_step": 195622, "epoch": 1164} {"train_loss": -11.214703559875488, "global_step": 195623, "epoch": 1164} {"train_loss": -11.236674308776855, "global_step": 195624, "epoch": 1164} {"train_loss": -11.40376091003418, "global_step": 195625, "epoch": 1164} {"train_loss": -11.509410858154297, "global_step": 195626, "epoch": 1164} {"train_loss": -11.475290298461914, "global_step": 195627, "epoch": 1164} {"train_loss": -11.460366249084473, "global_step": 195628, "epoch": 1164} {"train_loss": -11.452223777770996, "global_step": 195629, "epoch": 1164} {"train_loss": -11.416193962097168, "global_step": 195630, "epoch": 1164} {"train_loss": -11.015419006347656, "global_step": 195631, "epoch": 1164} {"train_loss": -11.046648979187012, "global_step": 195632, "epoch": 1164} {"train_loss": -11.4804048538208, "global_step": 195633, "epoch": 1164} {"train_loss": -10.789265632629395, "global_step": 195634, "epoch": 1164} {"train_loss": -11.573502540588379, "global_step": 195635, "epoch": 1164} {"train_loss": -11.216124534606934, "global_step": 195636, "epoch": 1164} {"train_loss": -11.354269981384277, "global_step": 195637, "epoch": 1164} {"train_loss": -11.17547607421875, "global_step": 195638, "epoch": 1164} {"train_loss": -11.18075180053711, "global_step": 195639, "epoch": 1164} {"train_loss": -11.287714004516602, "global_step": 195640, "epoch": 1164} {"train_loss": -11.031295776367188, "global_step": 195641, "epoch": 1164} {"train_loss": -11.202515602111816, "global_step": 195642, "epoch": 1164} {"train_loss": -11.241046905517578, "global_step": 195643, "epoch": 1164} {"train_loss": -11.501397132873535, "global_step": 195644, "epoch": 1164} {"train_loss": -11.456365585327148, "global_step": 195645, "epoch": 1164} {"train_loss": -11.157829284667969, "global_step": 195646, "epoch": 1164} {"train_loss": -10.808892250061035, "global_step": 195647, "epoch": 1164} {"train_loss": -11.625568389892578, "global_step": 195648, "epoch": 1164} {"train_loss": -11.043827056884766, "global_step": 195649, "epoch": 1164} {"train_loss": -11.462453842163086, "global_step": 195650, "epoch": 1164} {"train_loss": -11.46468734741211, "global_step": 195651, "epoch": 1164} {"train_loss": -11.471181869506836, "global_step": 195652, "epoch": 1164} {"train_loss": -11.167732238769531, "global_step": 195653, "epoch": 1164} {"train_loss": -11.372373580932617, "global_step": 195654, "epoch": 1164} {"train_loss": -11.509970664978027, "global_step": 195655, "epoch": 1164} {"train_loss": -11.249139785766602, "global_step": 195656, "epoch": 1164} {"train_loss": -11.710565567016602, "global_step": 195657, "epoch": 1164} {"train_loss": -11.270572662353516, "global_step": 195658, "epoch": 1164} {"train_loss": -11.607664108276367, "global_step": 195659, "epoch": 1164} {"train_loss": -11.297252655029297, "global_step": 195660, "epoch": 1164} {"train_loss": -11.303833961486816, "global_step": 195661, "epoch": 1164} {"train_loss": -11.607784271240234, "global_step": 195662, "epoch": 1164} {"train_loss": -11.040545463562012, "global_step": 195663, "epoch": 1164} {"train_loss": -11.416839599609375, "global_step": 195664, "epoch": 1164} {"train_loss": -11.181866645812988, "global_step": 195665, "epoch": 1164} {"train_loss": -10.845120429992676, "global_step": 195666, "epoch": 1164} {"train_loss": -11.071868896484375, "global_step": 195667, "epoch": 1164} {"train_loss": -11.044403076171875, "global_step": 195668, "epoch": 1164} {"train_loss": -10.91447639465332, "global_step": 195669, "epoch": 1164} {"train_loss": -11.114219665527344, "global_step": 195670, "epoch": 1164} {"train_loss": -10.627676010131836, "global_step": 195671, "epoch": 1164} {"train_loss": -11.18118667602539, "global_step": 195672, "epoch": 1164} {"train_loss": -11.283014297485352, "global_step": 195673, "epoch": 1164} {"train_loss": -10.735448837280273, "global_step": 195674, "epoch": 1164} {"train_loss": -10.943889617919922, "global_step": 195675, "epoch": 1164} {"train_loss": -10.909539222717285, "global_step": 195676, "epoch": 1164} {"train_loss": -10.803404808044434, "global_step": 195677, "epoch": 1164} {"train_loss": -10.328336715698242, "global_step": 195678, "epoch": 1164} {"train_loss": -11.380568504333496, "global_step": 195679, "epoch": 1164} {"train_loss": -10.408258438110352, "global_step": 195680, "epoch": 1164} {"train_loss": -10.080453872680664, "global_step": 195681, "epoch": 1164} {"train_loss": -11.280644416809082, "global_step": 195682, "epoch": 1164} {"train_loss": -10.450033187866211, "global_step": 195683, "epoch": 1164} {"train_loss": -11.351485252380371, "global_step": 195684, "epoch": 1164} {"train_loss": -10.653666496276855, "global_step": 195685, "epoch": 1164} {"train_loss": -11.478801727294922, "global_step": 195686, "epoch": 1164} {"train_loss": -11.100052833557129, "global_step": 195687, "epoch": 1164} {"train_loss": -10.971724510192871, "global_step": 195688, "epoch": 1164} {"train_loss": -11.169181823730469, "global_step": 195689, "epoch": 1164} {"train_loss": -10.83541488647461, "global_step": 195690, "epoch": 1164} {"train_loss": -10.832291603088379, "global_step": 195691, "epoch": 1164} {"train_loss": -10.699457168579102, "global_step": 195692, "epoch": 1164} {"train_loss": -11.403209686279297, "global_step": 195693, "epoch": 1164} {"train_loss": -10.961633682250977, "global_step": 195694, "epoch": 1164} {"train_loss": -11.395743370056152, "global_step": 195695, "epoch": 1164} {"train_loss": -11.378713607788086, "global_step": 195696, "epoch": 1164} {"train_loss": -11.459781646728516, "global_step": 195697, "epoch": 1164} {"train_loss": -11.373971939086914, "global_step": 195698, "epoch": 1164} {"train_loss": -11.15895938873291, "global_step": 195699, "epoch": 1164} {"train_loss": -11.5663480758667, "global_step": 195700, "epoch": 1164} {"train_loss": -11.511619567871094, "global_step": 195701, "epoch": 1164} {"train_loss": -11.395328521728516, "global_step": 195702, "epoch": 1164} {"train_loss": -11.624326705932617, "global_step": 195703, "epoch": 1164} {"train_loss": -11.39633560180664, "global_step": 195704, "epoch": 1164} {"train_loss": -11.43008804321289, "global_step": 195705, "epoch": 1164} {"train_loss": -11.39942741394043, "global_step": 195706, "epoch": 1164} {"train_loss": -11.327306747436523, "global_step": 195707, "epoch": 1164} {"train_loss": -11.203861236572266, "global_step": 195708, "epoch": 1164} {"train_loss": -11.236276626586914, "global_step": 195709, "epoch": 1164} {"train_loss": -11.452613830566406, "global_step": 195710, "epoch": 1164} {"train_loss": -11.41817569732666, "global_step": 195711, "epoch": 1164} {"train_loss": -11.388348579406738, "global_step": 195712, "epoch": 1164} {"train_loss": -11.453957557678223, "global_step": 195713, "epoch": 1164} {"train_loss": -11.61149787902832, "global_step": 195714, "epoch": 1164} {"train_loss": -11.463768005371094, "global_step": 195715, "epoch": 1164} {"train_loss": -11.320781707763672, "global_step": 195716, "epoch": 1164} {"train_loss": -11.540958404541016, "global_step": 195717, "epoch": 1164} {"train_loss": -11.427384376525879, "global_step": 195718, "epoch": 1164} {"train_loss": -11.277679358209882, "global_step": 195719, "epoch": 1164, "val_loss": 248897.546875} {"train_loss": -11.805473327636719, "global_step": 195720, "epoch": 1165} {"train_loss": -11.145950317382812, "global_step": 195721, "epoch": 1165} {"train_loss": -11.710168838500977, "global_step": 195722, "epoch": 1165} {"train_loss": -11.422477722167969, "global_step": 195723, "epoch": 1165} {"train_loss": -11.762102127075195, "global_step": 195724, "epoch": 1165} {"train_loss": -11.018062591552734, "global_step": 195725, "epoch": 1165} {"train_loss": -11.48932933807373, "global_step": 195726, "epoch": 1165} {"train_loss": -11.024739265441895, "global_step": 195727, "epoch": 1165} {"train_loss": -11.15173625946045, "global_step": 195728, "epoch": 1165} {"train_loss": -11.462590217590332, "global_step": 195729, "epoch": 1165} {"train_loss": -11.258512496948242, "global_step": 195730, "epoch": 1165} {"train_loss": -11.695530891418457, "global_step": 195731, "epoch": 1165} {"train_loss": -11.401423454284668, "global_step": 195732, "epoch": 1165} {"train_loss": -11.705056190490723, "global_step": 195733, "epoch": 1165} {"train_loss": -11.564556121826172, "global_step": 195734, "epoch": 1165} {"train_loss": -11.64274787902832, "global_step": 195735, "epoch": 1165} {"train_loss": -11.49721908569336, "global_step": 195736, "epoch": 1165} {"train_loss": -11.195192337036133, "global_step": 195737, "epoch": 1165} {"train_loss": -11.580495834350586, "global_step": 195738, "epoch": 1165} {"train_loss": -11.171419143676758, "global_step": 195739, "epoch": 1165} {"train_loss": -11.099294662475586, "global_step": 195740, "epoch": 1165} {"train_loss": -11.054413795471191, "global_step": 195741, "epoch": 1165} {"train_loss": -11.11958122253418, "global_step": 195742, "epoch": 1165} {"train_loss": -10.991875648498535, "global_step": 195743, "epoch": 1165} {"train_loss": -11.237201690673828, "global_step": 195744, "epoch": 1165} {"train_loss": -11.300872802734375, "global_step": 195745, "epoch": 1165} {"train_loss": -11.234153747558594, "global_step": 195746, "epoch": 1165} {"train_loss": -11.458202362060547, "global_step": 195747, "epoch": 1165} {"train_loss": -11.291354179382324, "global_step": 195748, "epoch": 1165} {"train_loss": -11.116312980651855, "global_step": 195749, "epoch": 1165} {"train_loss": -11.542154312133789, "global_step": 195750, "epoch": 1165} {"train_loss": -11.242376327514648, "global_step": 195751, "epoch": 1165} {"train_loss": -11.724447250366211, "global_step": 195752, "epoch": 1165} {"train_loss": -11.465607643127441, "global_step": 195753, "epoch": 1165} {"train_loss": -11.4247407913208, "global_step": 195754, "epoch": 1165} {"train_loss": -11.570661544799805, "global_step": 195755, "epoch": 1165} {"train_loss": -11.36353874206543, "global_step": 195756, "epoch": 1165} {"train_loss": -10.92889404296875, "global_step": 195757, "epoch": 1165} {"train_loss": -11.111900329589844, "global_step": 195758, "epoch": 1165} {"train_loss": -10.948385238647461, "global_step": 195759, "epoch": 1165} {"train_loss": -11.043542861938477, "global_step": 195760, "epoch": 1165} {"train_loss": -11.362435340881348, "global_step": 195761, "epoch": 1165} {"train_loss": -10.771686553955078, "global_step": 195762, "epoch": 1165} {"train_loss": -11.187490463256836, "global_step": 195763, "epoch": 1165} {"train_loss": -11.488662719726562, "global_step": 195764, "epoch": 1165} {"train_loss": -11.252283096313477, "global_step": 195765, "epoch": 1165} {"train_loss": -11.083189010620117, "global_step": 195766, "epoch": 1165} {"train_loss": -11.367563247680664, "global_step": 195767, "epoch": 1165} {"train_loss": -10.967556953430176, "global_step": 195768, "epoch": 1165} {"train_loss": -11.641324996948242, "global_step": 195769, "epoch": 1165} {"train_loss": -11.2449951171875, "global_step": 195770, "epoch": 1165} {"train_loss": -11.255912780761719, "global_step": 195771, "epoch": 1165} {"train_loss": -11.065587043762207, "global_step": 195772, "epoch": 1165} {"train_loss": -11.476184844970703, "global_step": 195773, "epoch": 1165} {"train_loss": -10.806655883789062, "global_step": 195774, "epoch": 1165} {"train_loss": -11.04849624633789, "global_step": 195775, "epoch": 1165} {"train_loss": -10.949752807617188, "global_step": 195776, "epoch": 1165} {"train_loss": -10.661581039428711, "global_step": 195777, "epoch": 1165} {"train_loss": -10.927104949951172, "global_step": 195778, "epoch": 1165} {"train_loss": -11.142119407653809, "global_step": 195779, "epoch": 1165} {"train_loss": -10.76504898071289, "global_step": 195780, "epoch": 1165} {"train_loss": -11.393922805786133, "global_step": 195781, "epoch": 1165} {"train_loss": -11.300737380981445, "global_step": 195782, "epoch": 1165} {"train_loss": -11.306974411010742, "global_step": 195783, "epoch": 1165} {"train_loss": -11.34260082244873, "global_step": 195784, "epoch": 1165} {"train_loss": -11.26380443572998, "global_step": 195785, "epoch": 1165} {"train_loss": -11.535433769226074, "global_step": 195786, "epoch": 1165} {"train_loss": -11.008052825927734, "global_step": 195787, "epoch": 1165} {"train_loss": -11.20747184753418, "global_step": 195788, "epoch": 1165} {"train_loss": -11.5748291015625, "global_step": 195789, "epoch": 1165} {"train_loss": -11.095637321472168, "global_step": 195790, "epoch": 1165} {"train_loss": -11.306180953979492, "global_step": 195791, "epoch": 1165} {"train_loss": -11.091065406799316, "global_step": 195792, "epoch": 1165} {"train_loss": -10.807831764221191, "global_step": 195793, "epoch": 1165} {"train_loss": -11.295446395874023, "global_step": 195794, "epoch": 1165} {"train_loss": -11.076531410217285, "global_step": 195795, "epoch": 1165} {"train_loss": -11.16459846496582, "global_step": 195796, "epoch": 1165} {"train_loss": -11.191713333129883, "global_step": 195797, "epoch": 1165} {"train_loss": -11.177216529846191, "global_step": 195798, "epoch": 1165} {"train_loss": -11.615279197692871, "global_step": 195799, "epoch": 1165} {"train_loss": -11.061450958251953, "global_step": 195800, "epoch": 1165} {"train_loss": -11.49001693725586, "global_step": 195801, "epoch": 1165} {"train_loss": -11.350074768066406, "global_step": 195802, "epoch": 1165} {"train_loss": -11.255281448364258, "global_step": 195803, "epoch": 1165} {"train_loss": -11.378988265991211, "global_step": 195804, "epoch": 1165} {"train_loss": -11.22854232788086, "global_step": 195805, "epoch": 1165} {"train_loss": -11.200803756713867, "global_step": 195806, "epoch": 1165} {"train_loss": -11.294350624084473, "global_step": 195807, "epoch": 1165} {"train_loss": -11.259740829467773, "global_step": 195808, "epoch": 1165} {"train_loss": -11.276833534240723, "global_step": 195809, "epoch": 1165} {"train_loss": -11.07121467590332, "global_step": 195810, "epoch": 1165} {"train_loss": -11.510416030883789, "global_step": 195811, "epoch": 1165} {"train_loss": -11.255102157592773, "global_step": 195812, "epoch": 1165} {"train_loss": -11.52076530456543, "global_step": 195813, "epoch": 1165} {"train_loss": -11.500848770141602, "global_step": 195814, "epoch": 1165} {"train_loss": -10.943721771240234, "global_step": 195815, "epoch": 1165} {"train_loss": -11.261116981506348, "global_step": 195816, "epoch": 1165} {"train_loss": -11.440589904785156, "global_step": 195817, "epoch": 1165} {"train_loss": -11.536992073059082, "global_step": 195818, "epoch": 1165} {"train_loss": -11.726446151733398, "global_step": 195819, "epoch": 1165} {"train_loss": -11.408523559570312, "global_step": 195820, "epoch": 1165} {"train_loss": -11.444506645202637, "global_step": 195821, "epoch": 1165} {"train_loss": -11.203413009643555, "global_step": 195822, "epoch": 1165} {"train_loss": -10.944494247436523, "global_step": 195823, "epoch": 1165} {"train_loss": -11.331961631774902, "global_step": 195824, "epoch": 1165} {"train_loss": -10.888347625732422, "global_step": 195825, "epoch": 1165} {"train_loss": -11.43358325958252, "global_step": 195826, "epoch": 1165} {"train_loss": -11.434425354003906, "global_step": 195827, "epoch": 1165} {"train_loss": -11.238943099975586, "global_step": 195828, "epoch": 1165} {"train_loss": -11.497567176818848, "global_step": 195829, "epoch": 1165} {"train_loss": -11.271520614624023, "global_step": 195830, "epoch": 1165} {"train_loss": -11.118980407714844, "global_step": 195831, "epoch": 1165} {"train_loss": -11.336031913757324, "global_step": 195832, "epoch": 1165} {"train_loss": -11.3010835647583, "global_step": 195833, "epoch": 1165} {"train_loss": -11.410325050354004, "global_step": 195834, "epoch": 1165} {"train_loss": -11.351224899291992, "global_step": 195835, "epoch": 1165} {"train_loss": -11.47232723236084, "global_step": 195836, "epoch": 1165} {"train_loss": -11.346128463745117, "global_step": 195837, "epoch": 1165} {"train_loss": -11.269793510437012, "global_step": 195838, "epoch": 1165} {"train_loss": -11.33210563659668, "global_step": 195839, "epoch": 1165} {"train_loss": -11.266321182250977, "global_step": 195840, "epoch": 1165} {"train_loss": -11.720725059509277, "global_step": 195841, "epoch": 1165} {"train_loss": -11.281837463378906, "global_step": 195842, "epoch": 1165} {"train_loss": -11.53853988647461, "global_step": 195843, "epoch": 1165} {"train_loss": -11.168560981750488, "global_step": 195844, "epoch": 1165} {"train_loss": -11.228824615478516, "global_step": 195845, "epoch": 1165} {"train_loss": -11.266738891601562, "global_step": 195846, "epoch": 1165} {"train_loss": -11.252883911132812, "global_step": 195847, "epoch": 1165} {"train_loss": -11.364950180053711, "global_step": 195848, "epoch": 1165} {"train_loss": -11.443758010864258, "global_step": 195849, "epoch": 1165} {"train_loss": -11.698850631713867, "global_step": 195850, "epoch": 1165} {"train_loss": -11.200029373168945, "global_step": 195851, "epoch": 1165} {"train_loss": -11.199440956115723, "global_step": 195852, "epoch": 1165} {"train_loss": -11.815293312072754, "global_step": 195853, "epoch": 1165} {"train_loss": -11.465784072875977, "global_step": 195854, "epoch": 1165} {"train_loss": -11.294342994689941, "global_step": 195855, "epoch": 1165} {"train_loss": -11.423270225524902, "global_step": 195856, "epoch": 1165} {"train_loss": -10.976058959960938, "global_step": 195857, "epoch": 1165} {"train_loss": -10.724352836608887, "global_step": 195858, "epoch": 1165} {"train_loss": -11.447145462036133, "global_step": 195859, "epoch": 1165} {"train_loss": -11.06393051147461, "global_step": 195860, "epoch": 1165} {"train_loss": -11.131575584411621, "global_step": 195861, "epoch": 1165} {"train_loss": -11.360191345214844, "global_step": 195862, "epoch": 1165} {"train_loss": -11.21413516998291, "global_step": 195863, "epoch": 1165} {"train_loss": -11.484928131103516, "global_step": 195864, "epoch": 1165} {"train_loss": -11.476751327514648, "global_step": 195865, "epoch": 1165} {"train_loss": -11.5098237991333, "global_step": 195866, "epoch": 1165} {"train_loss": -11.485823631286621, "global_step": 195867, "epoch": 1165} {"train_loss": -11.525358200073242, "global_step": 195868, "epoch": 1165} {"train_loss": -11.351363182067871, "global_step": 195869, "epoch": 1165} {"train_loss": -11.349082946777344, "global_step": 195870, "epoch": 1165} {"train_loss": -11.729957580566406, "global_step": 195871, "epoch": 1165} {"train_loss": -11.39185905456543, "global_step": 195872, "epoch": 1165} {"train_loss": -11.622934341430664, "global_step": 195873, "epoch": 1165} {"train_loss": -11.542136192321777, "global_step": 195874, "epoch": 1165} {"train_loss": -11.574177742004395, "global_step": 195875, "epoch": 1165} {"train_loss": -11.339824676513672, "global_step": 195876, "epoch": 1165} {"train_loss": -11.431191444396973, "global_step": 195877, "epoch": 1165} {"train_loss": -11.214250564575195, "global_step": 195878, "epoch": 1165} {"train_loss": -11.451534271240234, "global_step": 195879, "epoch": 1165} {"train_loss": -11.03776741027832, "global_step": 195880, "epoch": 1165} {"train_loss": -11.667474746704102, "global_step": 195881, "epoch": 1165} {"train_loss": -11.177732467651367, "global_step": 195882, "epoch": 1165} {"train_loss": -11.373647689819336, "global_step": 195883, "epoch": 1165} {"train_loss": -11.094560623168945, "global_step": 195884, "epoch": 1165} {"train_loss": -11.10348129272461, "global_step": 195885, "epoch": 1165} {"train_loss": -11.14423942565918, "global_step": 195886, "epoch": 1165} {"train_loss": -11.30100477309454, "global_step": 195887, "epoch": 1165, "val_loss": 251741.328125, "train_action_mse_error": 1.6261377334594727} {"train_loss": -11.368322372436523, "global_step": 195888, "epoch": 1166} {"train_loss": -11.445280075073242, "global_step": 195889, "epoch": 1166} {"train_loss": -11.296478271484375, "global_step": 195890, "epoch": 1166} {"train_loss": -11.404928207397461, "global_step": 195891, "epoch": 1166} {"train_loss": -11.412837982177734, "global_step": 195892, "epoch": 1166} {"train_loss": -11.282222747802734, "global_step": 195893, "epoch": 1166} {"train_loss": -11.493940353393555, "global_step": 195894, "epoch": 1166} {"train_loss": -11.236230850219727, "global_step": 195895, "epoch": 1166} {"train_loss": -11.007888793945312, "global_step": 195896, "epoch": 1166} {"train_loss": -10.760772705078125, "global_step": 195897, "epoch": 1166} {"train_loss": -11.304908752441406, "global_step": 195898, "epoch": 1166} {"train_loss": -10.732234001159668, "global_step": 195899, "epoch": 1166} {"train_loss": -11.48498821258545, "global_step": 195900, "epoch": 1166} {"train_loss": -11.202790260314941, "global_step": 195901, "epoch": 1166} {"train_loss": -11.386411666870117, "global_step": 195902, "epoch": 1166} {"train_loss": -11.475025177001953, "global_step": 195903, "epoch": 1166} {"train_loss": -11.48315143585205, "global_step": 195904, "epoch": 1166} {"train_loss": -11.21652603149414, "global_step": 195905, "epoch": 1166} {"train_loss": -11.405736923217773, "global_step": 195906, "epoch": 1166} {"train_loss": -11.202589988708496, "global_step": 195907, "epoch": 1166} {"train_loss": -11.34070873260498, "global_step": 195908, "epoch": 1166} {"train_loss": -11.539444923400879, "global_step": 195909, "epoch": 1166} {"train_loss": -11.303699493408203, "global_step": 195910, "epoch": 1166} {"train_loss": -11.202442169189453, "global_step": 195911, "epoch": 1166} {"train_loss": -11.345708847045898, "global_step": 195912, "epoch": 1166} {"train_loss": -10.812976837158203, "global_step": 195913, "epoch": 1166} {"train_loss": -11.643115997314453, "global_step": 195914, "epoch": 1166} {"train_loss": -11.114033699035645, "global_step": 195915, "epoch": 1166} {"train_loss": -10.860759735107422, "global_step": 195916, "epoch": 1166} {"train_loss": -11.321785926818848, "global_step": 195917, "epoch": 1166} {"train_loss": -11.374847412109375, "global_step": 195918, "epoch": 1166} {"train_loss": -11.421368598937988, "global_step": 195919, "epoch": 1166} {"train_loss": -11.478355407714844, "global_step": 195920, "epoch": 1166} {"train_loss": -11.342412948608398, "global_step": 195921, "epoch": 1166} {"train_loss": -11.060470581054688, "global_step": 195922, "epoch": 1166} {"train_loss": -11.423395156860352, "global_step": 195923, "epoch": 1166} {"train_loss": -11.618946075439453, "global_step": 195924, "epoch": 1166} {"train_loss": -11.492237091064453, "global_step": 195925, "epoch": 1166} {"train_loss": -11.384814262390137, "global_step": 195926, "epoch": 1166} {"train_loss": -11.443338394165039, "global_step": 195927, "epoch": 1166} {"train_loss": -11.186617851257324, "global_step": 195928, "epoch": 1166} {"train_loss": -11.427285194396973, "global_step": 195929, "epoch": 1166} {"train_loss": -11.47170639038086, "global_step": 195930, "epoch": 1166} {"train_loss": -11.537324905395508, "global_step": 195931, "epoch": 1166} {"train_loss": -11.518567085266113, "global_step": 195932, "epoch": 1166} {"train_loss": -11.302265167236328, "global_step": 195933, "epoch": 1166} {"train_loss": -11.354625701904297, "global_step": 195934, "epoch": 1166} {"train_loss": -11.573152542114258, "global_step": 195935, "epoch": 1166} {"train_loss": -11.53813648223877, "global_step": 195936, "epoch": 1166} {"train_loss": -11.643016815185547, "global_step": 195937, "epoch": 1166} {"train_loss": -11.438833236694336, "global_step": 195938, "epoch": 1166} {"train_loss": -11.49150276184082, "global_step": 195939, "epoch": 1166} {"train_loss": -11.667137145996094, "global_step": 195940, "epoch": 1166} {"train_loss": -11.45961856842041, "global_step": 195941, "epoch": 1166} {"train_loss": -11.057817459106445, "global_step": 195942, "epoch": 1166} {"train_loss": -11.475772857666016, "global_step": 195943, "epoch": 1166} {"train_loss": -11.393867492675781, "global_step": 195944, "epoch": 1166} {"train_loss": -10.691184043884277, "global_step": 195945, "epoch": 1166} {"train_loss": -11.360898971557617, "global_step": 195946, "epoch": 1166} {"train_loss": -10.843213081359863, "global_step": 195947, "epoch": 1166} {"train_loss": -9.978939056396484, "global_step": 195948, "epoch": 1166} {"train_loss": -10.598432540893555, "global_step": 195949, "epoch": 1166} {"train_loss": -7.022607803344727, "global_step": 195950, "epoch": 1166} {"train_loss": -10.161394119262695, "global_step": 195951, "epoch": 1166} {"train_loss": -8.472618103027344, "global_step": 195952, "epoch": 1166} {"train_loss": -10.128145217895508, "global_step": 195953, "epoch": 1166} {"train_loss": -8.836044311523438, "global_step": 195954, "epoch": 1166} {"train_loss": -10.362606048583984, "global_step": 195955, "epoch": 1166} {"train_loss": -8.257983207702637, "global_step": 195956, "epoch": 1166} {"train_loss": -9.806758880615234, "global_step": 195957, "epoch": 1166} {"train_loss": -9.238114356994629, "global_step": 195958, "epoch": 1166} {"train_loss": -10.302017211914062, "global_step": 195959, "epoch": 1166} {"train_loss": -8.21010684967041, "global_step": 195960, "epoch": 1166} {"train_loss": -10.341939926147461, "global_step": 195961, "epoch": 1166} {"train_loss": -8.985154151916504, "global_step": 195962, "epoch": 1166} {"train_loss": -10.55083179473877, "global_step": 195963, "epoch": 1166} {"train_loss": -9.162418365478516, "global_step": 195964, "epoch": 1166} {"train_loss": -10.531759262084961, "global_step": 195965, "epoch": 1166} {"train_loss": -9.854968070983887, "global_step": 195966, "epoch": 1166} {"train_loss": -9.690661430358887, "global_step": 195967, "epoch": 1166} {"train_loss": -10.516904830932617, "global_step": 195968, "epoch": 1166} {"train_loss": -10.079763412475586, "global_step": 195969, "epoch": 1166} {"train_loss": -10.362283706665039, "global_step": 195970, "epoch": 1166} {"train_loss": -10.69123649597168, "global_step": 195971, "epoch": 1166} {"train_loss": -9.976653099060059, "global_step": 195972, "epoch": 1166} {"train_loss": -10.883692741394043, "global_step": 195973, "epoch": 1166} {"train_loss": -9.953988075256348, "global_step": 195974, "epoch": 1166} {"train_loss": -10.512481689453125, "global_step": 195975, "epoch": 1166} {"train_loss": -10.529123306274414, "global_step": 195976, "epoch": 1166} {"train_loss": -10.263262748718262, "global_step": 195977, "epoch": 1166} {"train_loss": -10.728653907775879, "global_step": 195978, "epoch": 1166} {"train_loss": -10.694741249084473, "global_step": 195979, "epoch": 1166} {"train_loss": -10.539640426635742, "global_step": 195980, "epoch": 1166} {"train_loss": -11.078914642333984, "global_step": 195981, "epoch": 1166} {"train_loss": -11.045578002929688, "global_step": 195982, "epoch": 1166} {"train_loss": -10.915804862976074, "global_step": 195983, "epoch": 1166} {"train_loss": -11.124054908752441, "global_step": 195984, "epoch": 1166} {"train_loss": -11.231803894042969, "global_step": 195985, "epoch": 1166} {"train_loss": -10.756000518798828, "global_step": 195986, "epoch": 1166} {"train_loss": -10.910139083862305, "global_step": 195987, "epoch": 1166} {"train_loss": -11.138664245605469, "global_step": 195988, "epoch": 1166} {"train_loss": -10.890381813049316, "global_step": 195989, "epoch": 1166} {"train_loss": -11.104727745056152, "global_step": 195990, "epoch": 1166} {"train_loss": -11.245227813720703, "global_step": 195991, "epoch": 1166} {"train_loss": -10.927978515625, "global_step": 195992, "epoch": 1166} {"train_loss": -11.00482177734375, "global_step": 195993, "epoch": 1166} {"train_loss": -10.925065994262695, "global_step": 195994, "epoch": 1166} {"train_loss": -10.976229667663574, "global_step": 195995, "epoch": 1166} {"train_loss": -11.198954582214355, "global_step": 195996, "epoch": 1166} {"train_loss": -11.137489318847656, "global_step": 195997, "epoch": 1166} {"train_loss": -10.909997940063477, "global_step": 195998, "epoch": 1166} {"train_loss": -11.271257400512695, "global_step": 195999, "epoch": 1166} {"train_loss": -11.150045394897461, "global_step": 196000, "epoch": 1166} {"train_loss": -10.98139762878418, "global_step": 196001, "epoch": 1166} {"train_loss": -11.367566108703613, "global_step": 196002, "epoch": 1166} {"train_loss": -11.135421752929688, "global_step": 196003, "epoch": 1166} {"train_loss": -11.058769226074219, "global_step": 196004, "epoch": 1166} {"train_loss": -11.37734603881836, "global_step": 196005, "epoch": 1166} {"train_loss": -11.257410049438477, "global_step": 196006, "epoch": 1166} {"train_loss": -11.301145553588867, "global_step": 196007, "epoch": 1166} {"train_loss": -11.1344633102417, "global_step": 196008, "epoch": 1166} {"train_loss": -11.39895248413086, "global_step": 196009, "epoch": 1166} {"train_loss": -11.333763122558594, "global_step": 196010, "epoch": 1166} {"train_loss": -11.484570503234863, "global_step": 196011, "epoch": 1166} {"train_loss": -11.445561408996582, "global_step": 196012, "epoch": 1166} {"train_loss": -11.523359298706055, "global_step": 196013, "epoch": 1166} {"train_loss": -11.471149444580078, "global_step": 196014, "epoch": 1166} {"train_loss": -11.42489242553711, "global_step": 196015, "epoch": 1166} {"train_loss": -11.510773658752441, "global_step": 196016, "epoch": 1166} {"train_loss": -11.226903915405273, "global_step": 196017, "epoch": 1166} {"train_loss": -11.548959732055664, "global_step": 196018, "epoch": 1166} {"train_loss": -11.563480377197266, "global_step": 196019, "epoch": 1166} {"train_loss": -11.449085235595703, "global_step": 196020, "epoch": 1166} {"train_loss": -11.662492752075195, "global_step": 196021, "epoch": 1166} {"train_loss": -11.551032066345215, "global_step": 196022, "epoch": 1166} {"train_loss": -11.742744445800781, "global_step": 196023, "epoch": 1166} {"train_loss": -11.764196395874023, "global_step": 196024, "epoch": 1166} {"train_loss": -11.576269149780273, "global_step": 196025, "epoch": 1166} {"train_loss": -11.539278984069824, "global_step": 196026, "epoch": 1166} {"train_loss": -11.610939025878906, "global_step": 196027, "epoch": 1166} {"train_loss": -11.612031936645508, "global_step": 196028, "epoch": 1166} {"train_loss": -11.640138626098633, "global_step": 196029, "epoch": 1166} {"train_loss": -11.614267349243164, "global_step": 196030, "epoch": 1166} {"train_loss": -11.615859985351562, "global_step": 196031, "epoch": 1166} {"train_loss": -11.596590042114258, "global_step": 196032, "epoch": 1166} {"train_loss": -11.638298034667969, "global_step": 196033, "epoch": 1166} {"train_loss": -11.705548286437988, "global_step": 196034, "epoch": 1166} {"train_loss": -11.675795555114746, "global_step": 196035, "epoch": 1166} {"train_loss": -11.639852523803711, "global_step": 196036, "epoch": 1166} {"train_loss": -11.67740249633789, "global_step": 196037, "epoch": 1166} {"train_loss": -11.643903732299805, "global_step": 196038, "epoch": 1166} {"train_loss": -11.679553031921387, "global_step": 196039, "epoch": 1166} {"train_loss": -11.462244033813477, "global_step": 196040, "epoch": 1166} {"train_loss": -11.680063247680664, "global_step": 196041, "epoch": 1166} {"train_loss": -11.524713516235352, "global_step": 196042, "epoch": 1166} {"train_loss": -11.709366798400879, "global_step": 196043, "epoch": 1166} {"train_loss": -11.479941368103027, "global_step": 196044, "epoch": 1166} {"train_loss": -11.608470916748047, "global_step": 196045, "epoch": 1166} {"train_loss": -11.641582489013672, "global_step": 196046, "epoch": 1166} {"train_loss": -11.507308959960938, "global_step": 196047, "epoch": 1166} {"train_loss": -11.588690757751465, "global_step": 196048, "epoch": 1166} {"train_loss": -11.310669898986816, "global_step": 196049, "epoch": 1166} {"train_loss": -11.15290641784668, "global_step": 196050, "epoch": 1166} {"train_loss": -11.140769958496094, "global_step": 196051, "epoch": 1166} {"train_loss": -11.05819320678711, "global_step": 196052, "epoch": 1166} {"train_loss": -11.480045318603516, "global_step": 196053, "epoch": 1166} {"train_loss": -11.16394329071045, "global_step": 196054, "epoch": 1166} {"train_loss": -11.059338115510487, "global_step": 196055, "epoch": 1166, "val_loss": 246932.203125} {"train_loss": -11.544937133789062, "global_step": 196056, "epoch": 1167} {"train_loss": -11.624935150146484, "global_step": 196057, "epoch": 1167} {"train_loss": -11.499996185302734, "global_step": 196058, "epoch": 1167} {"train_loss": -11.409770965576172, "global_step": 196059, "epoch": 1167} {"train_loss": -11.3863525390625, "global_step": 196060, "epoch": 1167} {"train_loss": -11.327818870544434, "global_step": 196061, "epoch": 1167} {"train_loss": -11.604625701904297, "global_step": 196062, "epoch": 1167} {"train_loss": -11.376352310180664, "global_step": 196063, "epoch": 1167} {"train_loss": -11.731117248535156, "global_step": 196064, "epoch": 1167} {"train_loss": -11.38731861114502, "global_step": 196065, "epoch": 1167} {"train_loss": -11.466386795043945, "global_step": 196066, "epoch": 1167} {"train_loss": -11.419950485229492, "global_step": 196067, "epoch": 1167} {"train_loss": -11.306514739990234, "global_step": 196068, "epoch": 1167} {"train_loss": -11.203313827514648, "global_step": 196069, "epoch": 1167} {"train_loss": -11.055375099182129, "global_step": 196070, "epoch": 1167} {"train_loss": -11.083969116210938, "global_step": 196071, "epoch": 1167} {"train_loss": -11.651824951171875, "global_step": 196072, "epoch": 1167} {"train_loss": -11.328630447387695, "global_step": 196073, "epoch": 1167} {"train_loss": -11.56800651550293, "global_step": 196074, "epoch": 1167} {"train_loss": -11.188875198364258, "global_step": 196075, "epoch": 1167} {"train_loss": -11.486505508422852, "global_step": 196076, "epoch": 1167} {"train_loss": -10.908149719238281, "global_step": 196077, "epoch": 1167} {"train_loss": -9.592151641845703, "global_step": 196078, "epoch": 1167} {"train_loss": -10.805183410644531, "global_step": 196079, "epoch": 1167} {"train_loss": -10.385156631469727, "global_step": 196080, "epoch": 1167} {"train_loss": -10.939444541931152, "global_step": 196081, "epoch": 1167} {"train_loss": -10.295660018920898, "global_step": 196082, "epoch": 1167} {"train_loss": -11.038427352905273, "global_step": 196083, "epoch": 1167} {"train_loss": -10.670957565307617, "global_step": 196084, "epoch": 1167} {"train_loss": -11.328907012939453, "global_step": 196085, "epoch": 1167} {"train_loss": -10.740264892578125, "global_step": 196086, "epoch": 1167} {"train_loss": -11.368406295776367, "global_step": 196087, "epoch": 1167} {"train_loss": -10.588151931762695, "global_step": 196088, "epoch": 1167} {"train_loss": -11.095952987670898, "global_step": 196089, "epoch": 1167} {"train_loss": -11.313108444213867, "global_step": 196090, "epoch": 1167} {"train_loss": -11.092119216918945, "global_step": 196091, "epoch": 1167} {"train_loss": -11.255531311035156, "global_step": 196092, "epoch": 1167} {"train_loss": -10.985361099243164, "global_step": 196093, "epoch": 1167} {"train_loss": -10.992076873779297, "global_step": 196094, "epoch": 1167} {"train_loss": -11.482048034667969, "global_step": 196095, "epoch": 1167} {"train_loss": -11.089923858642578, "global_step": 196096, "epoch": 1167} {"train_loss": -11.096728324890137, "global_step": 196097, "epoch": 1167} {"train_loss": -11.011167526245117, "global_step": 196098, "epoch": 1167} {"train_loss": -10.916500091552734, "global_step": 196099, "epoch": 1167} {"train_loss": -11.27414321899414, "global_step": 196100, "epoch": 1167} {"train_loss": -10.989849090576172, "global_step": 196101, "epoch": 1167} {"train_loss": -11.316027641296387, "global_step": 196102, "epoch": 1167} {"train_loss": -10.766054153442383, "global_step": 196103, "epoch": 1167} {"train_loss": -11.231409072875977, "global_step": 196104, "epoch": 1167} {"train_loss": -10.721359252929688, "global_step": 196105, "epoch": 1167} {"train_loss": -10.646591186523438, "global_step": 196106, "epoch": 1167} {"train_loss": -11.064580917358398, "global_step": 196107, "epoch": 1167} {"train_loss": -9.962713241577148, "global_step": 196108, "epoch": 1167} {"train_loss": -10.728850364685059, "global_step": 196109, "epoch": 1167} {"train_loss": -9.038908958435059, "global_step": 196110, "epoch": 1167} {"train_loss": -10.595335006713867, "global_step": 196111, "epoch": 1167} {"train_loss": -9.702325820922852, "global_step": 196112, "epoch": 1167} {"train_loss": -10.621761322021484, "global_step": 196113, "epoch": 1167} {"train_loss": -10.072098731994629, "global_step": 196114, "epoch": 1167} {"train_loss": -10.516698837280273, "global_step": 196115, "epoch": 1167} {"train_loss": -10.893562316894531, "global_step": 196116, "epoch": 1167} {"train_loss": -10.534093856811523, "global_step": 196117, "epoch": 1167} {"train_loss": -11.013446807861328, "global_step": 196118, "epoch": 1167} {"train_loss": -11.057258605957031, "global_step": 196119, "epoch": 1167} {"train_loss": -10.775739669799805, "global_step": 196120, "epoch": 1167} {"train_loss": -11.18494701385498, "global_step": 196121, "epoch": 1167} {"train_loss": -11.040489196777344, "global_step": 196122, "epoch": 1167} {"train_loss": -11.032135009765625, "global_step": 196123, "epoch": 1167} {"train_loss": -11.21499252319336, "global_step": 196124, "epoch": 1167} {"train_loss": -10.7473783493042, "global_step": 196125, "epoch": 1167} {"train_loss": -11.284249305725098, "global_step": 196126, "epoch": 1167} {"train_loss": -11.128137588500977, "global_step": 196127, "epoch": 1167} {"train_loss": -11.101171493530273, "global_step": 196128, "epoch": 1167} {"train_loss": -11.04726791381836, "global_step": 196129, "epoch": 1167} {"train_loss": -11.155287742614746, "global_step": 196130, "epoch": 1167} {"train_loss": -10.889739990234375, "global_step": 196131, "epoch": 1167} {"train_loss": -11.329556465148926, "global_step": 196132, "epoch": 1167} {"train_loss": -10.964944839477539, "global_step": 196133, "epoch": 1167} {"train_loss": -11.100648880004883, "global_step": 196134, "epoch": 1167} {"train_loss": -11.257537841796875, "global_step": 196135, "epoch": 1167} {"train_loss": -11.009599685668945, "global_step": 196136, "epoch": 1167} {"train_loss": -11.09202766418457, "global_step": 196137, "epoch": 1167} {"train_loss": -11.147018432617188, "global_step": 196138, "epoch": 1167} {"train_loss": -11.619667053222656, "global_step": 196139, "epoch": 1167} {"train_loss": -11.304391860961914, "global_step": 196140, "epoch": 1167} {"train_loss": -11.417756080627441, "global_step": 196141, "epoch": 1167} {"train_loss": -11.330641746520996, "global_step": 196142, "epoch": 1167} {"train_loss": -11.155674934387207, "global_step": 196143, "epoch": 1167} {"train_loss": -11.355003356933594, "global_step": 196144, "epoch": 1167} {"train_loss": -11.15298080444336, "global_step": 196145, "epoch": 1167} {"train_loss": -11.632352828979492, "global_step": 196146, "epoch": 1167} {"train_loss": -11.271838188171387, "global_step": 196147, "epoch": 1167} {"train_loss": -11.479406356811523, "global_step": 196148, "epoch": 1167} {"train_loss": -11.038424491882324, "global_step": 196149, "epoch": 1167} {"train_loss": -11.612853050231934, "global_step": 196150, "epoch": 1167} {"train_loss": -11.211520195007324, "global_step": 196151, "epoch": 1167} {"train_loss": -11.338966369628906, "global_step": 196152, "epoch": 1167} {"train_loss": -11.419039726257324, "global_step": 196153, "epoch": 1167} {"train_loss": -11.139702796936035, "global_step": 196154, "epoch": 1167} {"train_loss": -11.390583038330078, "global_step": 196155, "epoch": 1167} {"train_loss": -11.372943878173828, "global_step": 196156, "epoch": 1167} {"train_loss": -11.372695922851562, "global_step": 196157, "epoch": 1167} {"train_loss": -11.251493453979492, "global_step": 196158, "epoch": 1167} {"train_loss": -11.17420482635498, "global_step": 196159, "epoch": 1167} {"train_loss": -11.375734329223633, "global_step": 196160, "epoch": 1167} {"train_loss": -11.2666015625, "global_step": 196161, "epoch": 1167} {"train_loss": -11.15357780456543, "global_step": 196162, "epoch": 1167} {"train_loss": -11.189592361450195, "global_step": 196163, "epoch": 1167} {"train_loss": -11.143486022949219, "global_step": 196164, "epoch": 1167} {"train_loss": -11.000371932983398, "global_step": 196165, "epoch": 1167} {"train_loss": -11.209059715270996, "global_step": 196166, "epoch": 1167} {"train_loss": -11.454710006713867, "global_step": 196167, "epoch": 1167} {"train_loss": -11.019729614257812, "global_step": 196168, "epoch": 1167} {"train_loss": -11.430885314941406, "global_step": 196169, "epoch": 1167} {"train_loss": -11.420347213745117, "global_step": 196170, "epoch": 1167} {"train_loss": -11.342126846313477, "global_step": 196171, "epoch": 1167} {"train_loss": -11.46922492980957, "global_step": 196172, "epoch": 1167} {"train_loss": -11.437554359436035, "global_step": 196173, "epoch": 1167} {"train_loss": -11.611727714538574, "global_step": 196174, "epoch": 1167} {"train_loss": -11.711984634399414, "global_step": 196175, "epoch": 1167} {"train_loss": -11.266849517822266, "global_step": 196176, "epoch": 1167} {"train_loss": -11.665393829345703, "global_step": 196177, "epoch": 1167} {"train_loss": -11.634925842285156, "global_step": 196178, "epoch": 1167} {"train_loss": -11.546329498291016, "global_step": 196179, "epoch": 1167} {"train_loss": -11.696182250976562, "global_step": 196180, "epoch": 1167} {"train_loss": -11.780462265014648, "global_step": 196181, "epoch": 1167} {"train_loss": -11.567424774169922, "global_step": 196182, "epoch": 1167} {"train_loss": -11.450462341308594, "global_step": 196183, "epoch": 1167} {"train_loss": -11.627655982971191, "global_step": 196184, "epoch": 1167} {"train_loss": -11.551919937133789, "global_step": 196185, "epoch": 1167} {"train_loss": -11.478571891784668, "global_step": 196186, "epoch": 1167} {"train_loss": -11.704347610473633, "global_step": 196187, "epoch": 1167} {"train_loss": -10.968954086303711, "global_step": 196188, "epoch": 1167} {"train_loss": -11.252777099609375, "global_step": 196189, "epoch": 1167} {"train_loss": -11.612916946411133, "global_step": 196190, "epoch": 1167} {"train_loss": -11.340520858764648, "global_step": 196191, "epoch": 1167} {"train_loss": -11.58660888671875, "global_step": 196192, "epoch": 1167} {"train_loss": -11.711753845214844, "global_step": 196193, "epoch": 1167} {"train_loss": -11.659859657287598, "global_step": 196194, "epoch": 1167} {"train_loss": -11.590034484863281, "global_step": 196195, "epoch": 1167} {"train_loss": -11.806766510009766, "global_step": 196196, "epoch": 1167} {"train_loss": -11.498271942138672, "global_step": 196197, "epoch": 1167} {"train_loss": -11.655923843383789, "global_step": 196198, "epoch": 1167} {"train_loss": -11.668729782104492, "global_step": 196199, "epoch": 1167} {"train_loss": -11.620301246643066, "global_step": 196200, "epoch": 1167} {"train_loss": -11.486930847167969, "global_step": 196201, "epoch": 1167} {"train_loss": -11.303363800048828, "global_step": 196202, "epoch": 1167} {"train_loss": -11.824647903442383, "global_step": 196203, "epoch": 1167} {"train_loss": -11.243949890136719, "global_step": 196204, "epoch": 1167} {"train_loss": -10.780684471130371, "global_step": 196205, "epoch": 1167} {"train_loss": -11.228385925292969, "global_step": 196206, "epoch": 1167} {"train_loss": -11.760261535644531, "global_step": 196207, "epoch": 1167} {"train_loss": -11.24403190612793, "global_step": 196208, "epoch": 1167} {"train_loss": -11.31751537322998, "global_step": 196209, "epoch": 1167} {"train_loss": -11.804443359375, "global_step": 196210, "epoch": 1167} {"train_loss": -11.500293731689453, "global_step": 196211, "epoch": 1167} {"train_loss": -11.688032150268555, "global_step": 196212, "epoch": 1167} {"train_loss": -11.64211654663086, "global_step": 196213, "epoch": 1167} {"train_loss": -11.63961410522461, "global_step": 196214, "epoch": 1167} {"train_loss": -11.730633735656738, "global_step": 196215, "epoch": 1167} {"train_loss": -11.59232234954834, "global_step": 196216, "epoch": 1167} {"train_loss": -11.144994735717773, "global_step": 196217, "epoch": 1167} {"train_loss": -11.188531875610352, "global_step": 196218, "epoch": 1167} {"train_loss": -11.481046676635742, "global_step": 196219, "epoch": 1167} {"train_loss": -11.344587326049805, "global_step": 196220, "epoch": 1167} {"train_loss": -11.082592010498047, "global_step": 196221, "epoch": 1167} {"train_loss": -11.365421295166016, "global_step": 196222, "epoch": 1167} {"train_loss": -11.21935558886755, "global_step": 196223, "epoch": 1167, "val_loss": 250442.234375} {"train_loss": -10.641223907470703, "global_step": 196224, "epoch": 1168} {"train_loss": -11.373275756835938, "global_step": 196225, "epoch": 1168} {"train_loss": -11.29226303100586, "global_step": 196226, "epoch": 1168} {"train_loss": -10.857556343078613, "global_step": 196227, "epoch": 1168} {"train_loss": -11.134733200073242, "global_step": 196228, "epoch": 1168} {"train_loss": -11.406835556030273, "global_step": 196229, "epoch": 1168} {"train_loss": -10.931350708007812, "global_step": 196230, "epoch": 1168} {"train_loss": -11.289702415466309, "global_step": 196231, "epoch": 1168} {"train_loss": -10.423078536987305, "global_step": 196232, "epoch": 1168} {"train_loss": -11.331621170043945, "global_step": 196233, "epoch": 1168} {"train_loss": -11.321512222290039, "global_step": 196234, "epoch": 1168} {"train_loss": -10.615715026855469, "global_step": 196235, "epoch": 1168} {"train_loss": -11.079998016357422, "global_step": 196236, "epoch": 1168} {"train_loss": -11.154449462890625, "global_step": 196237, "epoch": 1168} {"train_loss": -11.364147186279297, "global_step": 196238, "epoch": 1168} {"train_loss": -11.053882598876953, "global_step": 196239, "epoch": 1168} {"train_loss": -10.437559127807617, "global_step": 196240, "epoch": 1168} {"train_loss": -11.261054992675781, "global_step": 196241, "epoch": 1168} {"train_loss": -10.779826164245605, "global_step": 196242, "epoch": 1168} {"train_loss": -10.756766319274902, "global_step": 196243, "epoch": 1168} {"train_loss": -11.203332901000977, "global_step": 196244, "epoch": 1168} {"train_loss": -9.504312515258789, "global_step": 196245, "epoch": 1168} {"train_loss": -10.609416961669922, "global_step": 196246, "epoch": 1168} {"train_loss": -10.438838958740234, "global_step": 196247, "epoch": 1168} {"train_loss": -9.110026359558105, "global_step": 196248, "epoch": 1168} {"train_loss": -11.365577697753906, "global_step": 196249, "epoch": 1168} {"train_loss": -10.288991928100586, "global_step": 196250, "epoch": 1168} {"train_loss": -10.845502853393555, "global_step": 196251, "epoch": 1168} {"train_loss": -9.810544967651367, "global_step": 196252, "epoch": 1168} {"train_loss": -11.183660507202148, "global_step": 196253, "epoch": 1168} {"train_loss": -9.882659912109375, "global_step": 196254, "epoch": 1168} {"train_loss": -11.263938903808594, "global_step": 196255, "epoch": 1168} {"train_loss": -10.081600189208984, "global_step": 196256, "epoch": 1168} {"train_loss": -10.979957580566406, "global_step": 196257, "epoch": 1168} {"train_loss": -10.932635307312012, "global_step": 196258, "epoch": 1168} {"train_loss": -11.250657081604004, "global_step": 196259, "epoch": 1168} {"train_loss": -10.995976448059082, "global_step": 196260, "epoch": 1168} {"train_loss": -11.441976547241211, "global_step": 196261, "epoch": 1168} {"train_loss": -11.13132381439209, "global_step": 196262, "epoch": 1168} {"train_loss": -11.237950325012207, "global_step": 196263, "epoch": 1168} {"train_loss": -11.03646183013916, "global_step": 196264, "epoch": 1168} {"train_loss": -11.286861419677734, "global_step": 196265, "epoch": 1168} {"train_loss": -11.426790237426758, "global_step": 196266, "epoch": 1168} {"train_loss": -11.403157234191895, "global_step": 196267, "epoch": 1168} {"train_loss": -11.338582992553711, "global_step": 196268, "epoch": 1168} {"train_loss": -11.515396118164062, "global_step": 196269, "epoch": 1168} {"train_loss": -11.1905517578125, "global_step": 196270, "epoch": 1168} {"train_loss": -11.426921844482422, "global_step": 196271, "epoch": 1168} {"train_loss": -11.398630142211914, "global_step": 196272, "epoch": 1168} {"train_loss": -11.48611068725586, "global_step": 196273, "epoch": 1168} {"train_loss": -11.309101104736328, "global_step": 196274, "epoch": 1168} {"train_loss": -11.461294174194336, "global_step": 196275, "epoch": 1168} {"train_loss": -11.363167762756348, "global_step": 196276, "epoch": 1168} {"train_loss": -11.294550895690918, "global_step": 196277, "epoch": 1168} {"train_loss": -11.2076997756958, "global_step": 196278, "epoch": 1168} {"train_loss": -11.429670333862305, "global_step": 196279, "epoch": 1168} {"train_loss": -10.936742782592773, "global_step": 196280, "epoch": 1168} {"train_loss": -11.453351974487305, "global_step": 196281, "epoch": 1168} {"train_loss": -10.863838195800781, "global_step": 196282, "epoch": 1168} {"train_loss": -11.45339584350586, "global_step": 196283, "epoch": 1168} {"train_loss": -11.083901405334473, "global_step": 196284, "epoch": 1168} {"train_loss": -11.154614448547363, "global_step": 196285, "epoch": 1168} {"train_loss": -11.194862365722656, "global_step": 196286, "epoch": 1168} {"train_loss": -10.448282241821289, "global_step": 196287, "epoch": 1168} {"train_loss": -11.610967636108398, "global_step": 196288, "epoch": 1168} {"train_loss": -10.908493041992188, "global_step": 196289, "epoch": 1168} {"train_loss": -11.495468139648438, "global_step": 196290, "epoch": 1168} {"train_loss": -11.39395523071289, "global_step": 196291, "epoch": 1168} {"train_loss": -11.212533950805664, "global_step": 196292, "epoch": 1168} {"train_loss": -11.723489761352539, "global_step": 196293, "epoch": 1168} {"train_loss": -11.193836212158203, "global_step": 196294, "epoch": 1168} {"train_loss": -11.331144332885742, "global_step": 196295, "epoch": 1168} {"train_loss": -11.625715255737305, "global_step": 196296, "epoch": 1168} {"train_loss": -11.316164016723633, "global_step": 196297, "epoch": 1168} {"train_loss": -11.496110916137695, "global_step": 196298, "epoch": 1168} {"train_loss": -11.088483810424805, "global_step": 196299, "epoch": 1168} {"train_loss": -11.047691345214844, "global_step": 196300, "epoch": 1168} {"train_loss": -11.235010147094727, "global_step": 196301, "epoch": 1168} {"train_loss": -10.81550407409668, "global_step": 196302, "epoch": 1168} {"train_loss": -11.506080627441406, "global_step": 196303, "epoch": 1168} {"train_loss": -10.85986042022705, "global_step": 196304, "epoch": 1168} {"train_loss": -11.38487434387207, "global_step": 196305, "epoch": 1168} {"train_loss": -11.096437454223633, "global_step": 196306, "epoch": 1168} {"train_loss": -11.318048477172852, "global_step": 196307, "epoch": 1168} {"train_loss": -10.992059707641602, "global_step": 196308, "epoch": 1168} {"train_loss": -11.454791069030762, "global_step": 196309, "epoch": 1168} {"train_loss": -11.323673248291016, "global_step": 196310, "epoch": 1168} {"train_loss": -11.43934440612793, "global_step": 196311, "epoch": 1168} {"train_loss": -11.097561836242676, "global_step": 196312, "epoch": 1168} {"train_loss": -11.180397033691406, "global_step": 196313, "epoch": 1168} {"train_loss": -11.554720878601074, "global_step": 196314, "epoch": 1168} {"train_loss": -11.10430908203125, "global_step": 196315, "epoch": 1168} {"train_loss": -11.50797176361084, "global_step": 196316, "epoch": 1168} {"train_loss": -11.283002853393555, "global_step": 196317, "epoch": 1168} {"train_loss": -11.599397659301758, "global_step": 196318, "epoch": 1168} {"train_loss": -11.320391654968262, "global_step": 196319, "epoch": 1168} {"train_loss": -11.463409423828125, "global_step": 196320, "epoch": 1168} {"train_loss": -11.707684516906738, "global_step": 196321, "epoch": 1168} {"train_loss": -11.446611404418945, "global_step": 196322, "epoch": 1168} {"train_loss": -11.42044448852539, "global_step": 196323, "epoch": 1168} {"train_loss": -11.570484161376953, "global_step": 196324, "epoch": 1168} {"train_loss": -11.730905532836914, "global_step": 196325, "epoch": 1168} {"train_loss": -11.588558197021484, "global_step": 196326, "epoch": 1168} {"train_loss": -11.48002815246582, "global_step": 196327, "epoch": 1168} {"train_loss": -11.616843223571777, "global_step": 196328, "epoch": 1168} {"train_loss": -11.729602813720703, "global_step": 196329, "epoch": 1168} {"train_loss": -11.755315780639648, "global_step": 196330, "epoch": 1168} {"train_loss": -11.797122955322266, "global_step": 196331, "epoch": 1168} {"train_loss": -11.629950523376465, "global_step": 196332, "epoch": 1168} {"train_loss": -11.838722229003906, "global_step": 196333, "epoch": 1168} {"train_loss": -11.8006591796875, "global_step": 196334, "epoch": 1168} {"train_loss": -11.67086124420166, "global_step": 196335, "epoch": 1168} {"train_loss": -11.621232986450195, "global_step": 196336, "epoch": 1168} {"train_loss": -11.554396629333496, "global_step": 196337, "epoch": 1168} {"train_loss": -11.754870414733887, "global_step": 196338, "epoch": 1168} {"train_loss": -11.587348937988281, "global_step": 196339, "epoch": 1168} {"train_loss": -11.801674842834473, "global_step": 196340, "epoch": 1168} {"train_loss": -11.654254913330078, "global_step": 196341, "epoch": 1168} {"train_loss": -11.770570755004883, "global_step": 196342, "epoch": 1168} {"train_loss": -11.479936599731445, "global_step": 196343, "epoch": 1168} {"train_loss": -11.595165252685547, "global_step": 196344, "epoch": 1168} {"train_loss": -11.57033634185791, "global_step": 196345, "epoch": 1168} {"train_loss": -10.95423698425293, "global_step": 196346, "epoch": 1168} {"train_loss": -11.062488555908203, "global_step": 196347, "epoch": 1168} {"train_loss": -11.179844856262207, "global_step": 196348, "epoch": 1168} {"train_loss": -11.105033874511719, "global_step": 196349, "epoch": 1168} {"train_loss": -11.212069511413574, "global_step": 196350, "epoch": 1168} {"train_loss": -10.137678146362305, "global_step": 196351, "epoch": 1168} {"train_loss": -9.46474838256836, "global_step": 196352, "epoch": 1168} {"train_loss": -11.091626167297363, "global_step": 196353, "epoch": 1168} {"train_loss": -10.3572359085083, "global_step": 196354, "epoch": 1168} {"train_loss": -10.273527145385742, "global_step": 196355, "epoch": 1168} {"train_loss": -11.284494400024414, "global_step": 196356, "epoch": 1168} {"train_loss": -9.437898635864258, "global_step": 196357, "epoch": 1168} {"train_loss": -11.157266616821289, "global_step": 196358, "epoch": 1168} {"train_loss": -10.296541213989258, "global_step": 196359, "epoch": 1168} {"train_loss": -9.890542984008789, "global_step": 196360, "epoch": 1168} {"train_loss": -10.909956932067871, "global_step": 196361, "epoch": 1168} {"train_loss": -9.490364074707031, "global_step": 196362, "epoch": 1168} {"train_loss": -10.652863502502441, "global_step": 196363, "epoch": 1168} {"train_loss": -10.354084014892578, "global_step": 196364, "epoch": 1168} {"train_loss": -10.920113563537598, "global_step": 196365, "epoch": 1168} {"train_loss": -9.61001205444336, "global_step": 196366, "epoch": 1168} {"train_loss": -10.917730331420898, "global_step": 196367, "epoch": 1168} {"train_loss": -9.751012802124023, "global_step": 196368, "epoch": 1168} {"train_loss": -10.687369346618652, "global_step": 196369, "epoch": 1168} {"train_loss": -10.591024398803711, "global_step": 196370, "epoch": 1168} {"train_loss": -11.020429611206055, "global_step": 196371, "epoch": 1168} {"train_loss": -10.866538047790527, "global_step": 196372, "epoch": 1168} {"train_loss": -10.660730361938477, "global_step": 196373, "epoch": 1168} {"train_loss": -11.067546844482422, "global_step": 196374, "epoch": 1168} {"train_loss": -11.064773559570312, "global_step": 196375, "epoch": 1168} {"train_loss": -10.739042282104492, "global_step": 196376, "epoch": 1168} {"train_loss": -10.960996627807617, "global_step": 196377, "epoch": 1168} {"train_loss": -10.453224182128906, "global_step": 196378, "epoch": 1168} {"train_loss": -11.081562042236328, "global_step": 196379, "epoch": 1168} {"train_loss": -11.016792297363281, "global_step": 196380, "epoch": 1168} {"train_loss": -10.48619270324707, "global_step": 196381, "epoch": 1168} {"train_loss": -11.30760669708252, "global_step": 196382, "epoch": 1168} {"train_loss": -10.823333740234375, "global_step": 196383, "epoch": 1168} {"train_loss": -10.654494285583496, "global_step": 196384, "epoch": 1168} {"train_loss": -10.904935836791992, "global_step": 196385, "epoch": 1168} {"train_loss": -10.869729042053223, "global_step": 196386, "epoch": 1168} {"train_loss": -11.03896713256836, "global_step": 196387, "epoch": 1168} {"train_loss": -11.144449234008789, "global_step": 196388, "epoch": 1168} {"train_loss": -10.77517318725586, "global_step": 196389, "epoch": 1168} {"train_loss": -11.10246753692627, "global_step": 196390, "epoch": 1168} {"train_loss": -11.072046512649173, "global_step": 196391, "epoch": 1168, "val_loss": 252344.0} {"train_loss": -10.874645233154297, "global_step": 196392, "epoch": 1169} {"train_loss": -11.408638954162598, "global_step": 196393, "epoch": 1169} {"train_loss": -11.217092514038086, "global_step": 196394, "epoch": 1169} {"train_loss": -11.340113639831543, "global_step": 196395, "epoch": 1169} {"train_loss": -11.333285331726074, "global_step": 196396, "epoch": 1169} {"train_loss": -11.095743179321289, "global_step": 196397, "epoch": 1169} {"train_loss": -11.290205955505371, "global_step": 196398, "epoch": 1169} {"train_loss": -11.384899139404297, "global_step": 196399, "epoch": 1169} {"train_loss": -11.405261039733887, "global_step": 196400, "epoch": 1169} {"train_loss": -11.45528793334961, "global_step": 196401, "epoch": 1169} {"train_loss": -11.297872543334961, "global_step": 196402, "epoch": 1169} {"train_loss": -11.558065414428711, "global_step": 196403, "epoch": 1169} {"train_loss": -11.58176326751709, "global_step": 196404, "epoch": 1169} {"train_loss": -11.497363090515137, "global_step": 196405, "epoch": 1169} {"train_loss": -11.433093070983887, "global_step": 196406, "epoch": 1169} {"train_loss": -11.459009170532227, "global_step": 196407, "epoch": 1169} {"train_loss": -11.421700477600098, "global_step": 196408, "epoch": 1169} {"train_loss": -11.549623489379883, "global_step": 196409, "epoch": 1169} {"train_loss": -11.289012908935547, "global_step": 196410, "epoch": 1169} {"train_loss": -11.63412094116211, "global_step": 196411, "epoch": 1169} {"train_loss": -11.755864143371582, "global_step": 196412, "epoch": 1169} {"train_loss": -11.54104232788086, "global_step": 196413, "epoch": 1169} {"train_loss": -11.4832124710083, "global_step": 196414, "epoch": 1169} {"train_loss": -11.546876907348633, "global_step": 196415, "epoch": 1169} {"train_loss": -11.746621131896973, "global_step": 196416, "epoch": 1169} {"train_loss": -11.507586479187012, "global_step": 196417, "epoch": 1169} {"train_loss": -11.82263469696045, "global_step": 196418, "epoch": 1169} {"train_loss": -11.586087226867676, "global_step": 196419, "epoch": 1169} {"train_loss": -11.455516815185547, "global_step": 196420, "epoch": 1169} {"train_loss": -11.697502136230469, "global_step": 196421, "epoch": 1169} {"train_loss": -11.649243354797363, "global_step": 196422, "epoch": 1169} {"train_loss": -11.743705749511719, "global_step": 196423, "epoch": 1169} {"train_loss": -11.7528715133667, "global_step": 196424, "epoch": 1169} {"train_loss": -11.831289291381836, "global_step": 196425, "epoch": 1169} {"train_loss": -11.548545837402344, "global_step": 196426, "epoch": 1169} {"train_loss": -11.74062442779541, "global_step": 196427, "epoch": 1169} {"train_loss": -11.834085464477539, "global_step": 196428, "epoch": 1169} {"train_loss": -11.691267967224121, "global_step": 196429, "epoch": 1169} {"train_loss": -11.615894317626953, "global_step": 196430, "epoch": 1169} {"train_loss": -11.787490844726562, "global_step": 196431, "epoch": 1169} {"train_loss": -11.687417984008789, "global_step": 196432, "epoch": 1169} {"train_loss": -11.711080551147461, "global_step": 196433, "epoch": 1169} {"train_loss": -11.460456848144531, "global_step": 196434, "epoch": 1169} {"train_loss": -11.286458969116211, "global_step": 196435, "epoch": 1169} {"train_loss": -11.836990356445312, "global_step": 196436, "epoch": 1169} {"train_loss": -11.683210372924805, "global_step": 196437, "epoch": 1169} {"train_loss": -11.814373016357422, "global_step": 196438, "epoch": 1169} {"train_loss": -11.767930030822754, "global_step": 196439, "epoch": 1169} {"train_loss": -11.66641902923584, "global_step": 196440, "epoch": 1169} {"train_loss": -11.274831771850586, "global_step": 196441, "epoch": 1169} {"train_loss": -11.224254608154297, "global_step": 196442, "epoch": 1169} {"train_loss": -11.69420051574707, "global_step": 196443, "epoch": 1169} {"train_loss": -11.391145706176758, "global_step": 196444, "epoch": 1169} {"train_loss": -11.764225006103516, "global_step": 196445, "epoch": 1169} {"train_loss": -11.535966873168945, "global_step": 196446, "epoch": 1169} {"train_loss": -11.404491424560547, "global_step": 196447, "epoch": 1169} {"train_loss": -11.335268020629883, "global_step": 196448, "epoch": 1169} {"train_loss": -11.370141983032227, "global_step": 196449, "epoch": 1169} {"train_loss": -10.904354095458984, "global_step": 196450, "epoch": 1169} {"train_loss": -11.361616134643555, "global_step": 196451, "epoch": 1169} {"train_loss": -11.65444564819336, "global_step": 196452, "epoch": 1169} {"train_loss": -11.426717758178711, "global_step": 196453, "epoch": 1169} {"train_loss": -11.659263610839844, "global_step": 196454, "epoch": 1169} {"train_loss": -11.833799362182617, "global_step": 196455, "epoch": 1169} {"train_loss": -11.2195463180542, "global_step": 196456, "epoch": 1169} {"train_loss": -11.108378410339355, "global_step": 196457, "epoch": 1169} {"train_loss": -10.898789405822754, "global_step": 196458, "epoch": 1169} {"train_loss": -11.319480895996094, "global_step": 196459, "epoch": 1169} {"train_loss": -11.284004211425781, "global_step": 196460, "epoch": 1169} {"train_loss": -11.065536499023438, "global_step": 196461, "epoch": 1169} {"train_loss": -11.092519760131836, "global_step": 196462, "epoch": 1169} {"train_loss": -11.084305763244629, "global_step": 196463, "epoch": 1169} {"train_loss": -10.774145126342773, "global_step": 196464, "epoch": 1169} {"train_loss": -11.53105354309082, "global_step": 196465, "epoch": 1169} {"train_loss": -10.012126922607422, "global_step": 196466, "epoch": 1169} {"train_loss": -10.475210189819336, "global_step": 196467, "epoch": 1169} {"train_loss": -11.347575187683105, "global_step": 196468, "epoch": 1169} {"train_loss": -11.196667671203613, "global_step": 196469, "epoch": 1169} {"train_loss": -10.577834129333496, "global_step": 196470, "epoch": 1169} {"train_loss": -11.454358100891113, "global_step": 196471, "epoch": 1169} {"train_loss": -10.945150375366211, "global_step": 196472, "epoch": 1169} {"train_loss": -10.452751159667969, "global_step": 196473, "epoch": 1169} {"train_loss": -10.944933891296387, "global_step": 196474, "epoch": 1169} {"train_loss": -11.24339485168457, "global_step": 196475, "epoch": 1169} {"train_loss": -11.295047760009766, "global_step": 196476, "epoch": 1169} {"train_loss": -11.06878662109375, "global_step": 196477, "epoch": 1169} {"train_loss": -11.295330047607422, "global_step": 196478, "epoch": 1169} {"train_loss": -11.329544067382812, "global_step": 196479, "epoch": 1169} {"train_loss": -11.302518844604492, "global_step": 196480, "epoch": 1169} {"train_loss": -11.386468887329102, "global_step": 196481, "epoch": 1169} {"train_loss": -11.560571670532227, "global_step": 196482, "epoch": 1169} {"train_loss": -11.258621215820312, "global_step": 196483, "epoch": 1169} {"train_loss": -11.363212585449219, "global_step": 196484, "epoch": 1169} {"train_loss": -11.354511260986328, "global_step": 196485, "epoch": 1169} {"train_loss": -11.288768768310547, "global_step": 196486, "epoch": 1169} {"train_loss": -11.28841781616211, "global_step": 196487, "epoch": 1169} {"train_loss": -11.350499153137207, "global_step": 196488, "epoch": 1169} {"train_loss": -11.376791000366211, "global_step": 196489, "epoch": 1169} {"train_loss": -11.437301635742188, "global_step": 196490, "epoch": 1169} {"train_loss": -11.494840621948242, "global_step": 196491, "epoch": 1169} {"train_loss": -11.570015907287598, "global_step": 196492, "epoch": 1169} {"train_loss": -11.585334777832031, "global_step": 196493, "epoch": 1169} {"train_loss": -11.27315902709961, "global_step": 196494, "epoch": 1169} {"train_loss": -11.643526077270508, "global_step": 196495, "epoch": 1169} {"train_loss": -11.188138961791992, "global_step": 196496, "epoch": 1169} {"train_loss": -11.486209869384766, "global_step": 196497, "epoch": 1169} {"train_loss": -11.261378288269043, "global_step": 196498, "epoch": 1169} {"train_loss": -11.356550216674805, "global_step": 196499, "epoch": 1169} {"train_loss": -11.666399002075195, "global_step": 196500, "epoch": 1169} {"train_loss": -11.448888778686523, "global_step": 196501, "epoch": 1169} {"train_loss": -11.59714126586914, "global_step": 196502, "epoch": 1169} {"train_loss": -11.55807876586914, "global_step": 196503, "epoch": 1169} {"train_loss": -11.516066551208496, "global_step": 196504, "epoch": 1169} {"train_loss": -11.523368835449219, "global_step": 196505, "epoch": 1169} {"train_loss": -11.247408866882324, "global_step": 196506, "epoch": 1169} {"train_loss": -11.522722244262695, "global_step": 196507, "epoch": 1169} {"train_loss": -11.651442527770996, "global_step": 196508, "epoch": 1169} {"train_loss": -11.344892501831055, "global_step": 196509, "epoch": 1169} {"train_loss": -11.218446731567383, "global_step": 196510, "epoch": 1169} {"train_loss": -11.272595405578613, "global_step": 196511, "epoch": 1169} {"train_loss": -11.41338062286377, "global_step": 196512, "epoch": 1169} {"train_loss": -11.521525382995605, "global_step": 196513, "epoch": 1169} {"train_loss": -11.604732513427734, "global_step": 196514, "epoch": 1169} {"train_loss": -11.538061141967773, "global_step": 196515, "epoch": 1169} {"train_loss": -11.352287292480469, "global_step": 196516, "epoch": 1169} {"train_loss": -11.679115295410156, "global_step": 196517, "epoch": 1169} {"train_loss": -11.51168441772461, "global_step": 196518, "epoch": 1169} {"train_loss": -11.301054000854492, "global_step": 196519, "epoch": 1169} {"train_loss": -11.6675443649292, "global_step": 196520, "epoch": 1169} {"train_loss": -11.220324516296387, "global_step": 196521, "epoch": 1169} {"train_loss": -11.188192367553711, "global_step": 196522, "epoch": 1169} {"train_loss": -11.23312759399414, "global_step": 196523, "epoch": 1169} {"train_loss": -11.504026412963867, "global_step": 196524, "epoch": 1169} {"train_loss": -11.224347114562988, "global_step": 196525, "epoch": 1169} {"train_loss": -11.177253723144531, "global_step": 196526, "epoch": 1169} {"train_loss": -11.249820709228516, "global_step": 196527, "epoch": 1169} {"train_loss": -11.18820571899414, "global_step": 196528, "epoch": 1169} {"train_loss": -11.289091110229492, "global_step": 196529, "epoch": 1169} {"train_loss": -11.130167007446289, "global_step": 196530, "epoch": 1169} {"train_loss": -11.486661911010742, "global_step": 196531, "epoch": 1169} {"train_loss": -11.50098991394043, "global_step": 196532, "epoch": 1169} {"train_loss": -11.262939453125, "global_step": 196533, "epoch": 1169} {"train_loss": -11.497058868408203, "global_step": 196534, "epoch": 1169} {"train_loss": -11.198373794555664, "global_step": 196535, "epoch": 1169} {"train_loss": -10.866134643554688, "global_step": 196536, "epoch": 1169} {"train_loss": -10.435327529907227, "global_step": 196537, "epoch": 1169} {"train_loss": -11.240882873535156, "global_step": 196538, "epoch": 1169} {"train_loss": -10.862695693969727, "global_step": 196539, "epoch": 1169} {"train_loss": -10.635186195373535, "global_step": 196540, "epoch": 1169} {"train_loss": -10.65301513671875, "global_step": 196541, "epoch": 1169} {"train_loss": -10.539538383483887, "global_step": 196542, "epoch": 1169} {"train_loss": -10.390716552734375, "global_step": 196543, "epoch": 1169} {"train_loss": -10.890684127807617, "global_step": 196544, "epoch": 1169} {"train_loss": -10.131003379821777, "global_step": 196545, "epoch": 1169} {"train_loss": -9.998958587646484, "global_step": 196546, "epoch": 1169} {"train_loss": -10.367589950561523, "global_step": 196547, "epoch": 1169} {"train_loss": -8.066670417785645, "global_step": 196548, "epoch": 1169} {"train_loss": -8.578454971313477, "global_step": 196549, "epoch": 1169} {"train_loss": -10.059900283813477, "global_step": 196550, "epoch": 1169} {"train_loss": -9.856475830078125, "global_step": 196551, "epoch": 1169} {"train_loss": -9.027030944824219, "global_step": 196552, "epoch": 1169} {"train_loss": -9.883193969726562, "global_step": 196553, "epoch": 1169} {"train_loss": -9.086187362670898, "global_step": 196554, "epoch": 1169} {"train_loss": -9.497215270996094, "global_step": 196555, "epoch": 1169} {"train_loss": -10.841434478759766, "global_step": 196556, "epoch": 1169} {"train_loss": -8.629020690917969, "global_step": 196557, "epoch": 1169} {"train_loss": -9.881072998046875, "global_step": 196558, "epoch": 1169} {"train_loss": -11.196557834034873, "global_step": 196559, "epoch": 1169, "val_loss": 240991.265625} {"train_loss": -9.02859878540039, "global_step": 196560, "epoch": 1170} {"train_loss": -9.501692771911621, "global_step": 196561, "epoch": 1170} {"train_loss": -9.841166496276855, "global_step": 196562, "epoch": 1170} {"train_loss": -9.596570014953613, "global_step": 196563, "epoch": 1170} {"train_loss": -8.978581428527832, "global_step": 196564, "epoch": 1170} {"train_loss": -10.292017936706543, "global_step": 196565, "epoch": 1170} {"train_loss": -9.354901313781738, "global_step": 196566, "epoch": 1170} {"train_loss": -9.620351791381836, "global_step": 196567, "epoch": 1170} {"train_loss": -10.425759315490723, "global_step": 196568, "epoch": 1170} {"train_loss": -9.797416687011719, "global_step": 196569, "epoch": 1170} {"train_loss": -9.533987998962402, "global_step": 196570, "epoch": 1170} {"train_loss": -10.175593376159668, "global_step": 196571, "epoch": 1170} {"train_loss": -10.558104515075684, "global_step": 196572, "epoch": 1170} {"train_loss": -10.096713066101074, "global_step": 196573, "epoch": 1170} {"train_loss": -10.18526840209961, "global_step": 196574, "epoch": 1170} {"train_loss": -10.787630081176758, "global_step": 196575, "epoch": 1170} {"train_loss": -10.401094436645508, "global_step": 196576, "epoch": 1170} {"train_loss": -10.076171875, "global_step": 196577, "epoch": 1170} {"train_loss": -10.490116119384766, "global_step": 196578, "epoch": 1170} {"train_loss": -10.500938415527344, "global_step": 196579, "epoch": 1170} {"train_loss": -10.09361457824707, "global_step": 196580, "epoch": 1170} {"train_loss": -10.563735008239746, "global_step": 196581, "epoch": 1170} {"train_loss": -10.778485298156738, "global_step": 196582, "epoch": 1170} {"train_loss": -10.603324890136719, "global_step": 196583, "epoch": 1170} {"train_loss": -10.881494522094727, "global_step": 196584, "epoch": 1170} {"train_loss": -10.615021705627441, "global_step": 196585, "epoch": 1170} {"train_loss": -10.569063186645508, "global_step": 196586, "epoch": 1170} {"train_loss": -10.708283424377441, "global_step": 196587, "epoch": 1170} {"train_loss": -10.964265823364258, "global_step": 196588, "epoch": 1170} {"train_loss": -10.959702491760254, "global_step": 196589, "epoch": 1170} {"train_loss": -11.008630752563477, "global_step": 196590, "epoch": 1170} {"train_loss": -10.720582962036133, "global_step": 196591, "epoch": 1170} {"train_loss": -10.723033905029297, "global_step": 196592, "epoch": 1170} {"train_loss": -11.003633499145508, "global_step": 196593, "epoch": 1170} {"train_loss": -10.734760284423828, "global_step": 196594, "epoch": 1170} {"train_loss": -11.152767181396484, "global_step": 196595, "epoch": 1170} {"train_loss": -11.00013256072998, "global_step": 196596, "epoch": 1170} {"train_loss": -11.09402847290039, "global_step": 196597, "epoch": 1170} {"train_loss": -11.20858383178711, "global_step": 196598, "epoch": 1170} {"train_loss": -10.925081253051758, "global_step": 196599, "epoch": 1170} {"train_loss": -11.152210235595703, "global_step": 196600, "epoch": 1170} {"train_loss": -11.153525352478027, "global_step": 196601, "epoch": 1170} {"train_loss": -11.034876823425293, "global_step": 196602, "epoch": 1170} {"train_loss": -11.219602584838867, "global_step": 196603, "epoch": 1170} {"train_loss": -11.130215644836426, "global_step": 196604, "epoch": 1170} {"train_loss": -11.175400733947754, "global_step": 196605, "epoch": 1170} {"train_loss": -11.23304557800293, "global_step": 196606, "epoch": 1170} {"train_loss": -11.354270935058594, "global_step": 196607, "epoch": 1170} {"train_loss": -11.264045715332031, "global_step": 196608, "epoch": 1170} {"train_loss": -11.19835090637207, "global_step": 196609, "epoch": 1170} {"train_loss": -11.343647003173828, "global_step": 196610, "epoch": 1170} {"train_loss": -11.161304473876953, "global_step": 196611, "epoch": 1170} {"train_loss": -11.249963760375977, "global_step": 196612, "epoch": 1170} {"train_loss": -11.363100051879883, "global_step": 196613, "epoch": 1170} {"train_loss": -11.360458374023438, "global_step": 196614, "epoch": 1170} {"train_loss": -11.321768760681152, "global_step": 196615, "epoch": 1170} {"train_loss": -11.323254585266113, "global_step": 196616, "epoch": 1170} {"train_loss": -11.323301315307617, "global_step": 196617, "epoch": 1170} {"train_loss": -11.384515762329102, "global_step": 196618, "epoch": 1170} {"train_loss": -11.523406982421875, "global_step": 196619, "epoch": 1170} {"train_loss": -11.426939964294434, "global_step": 196620, "epoch": 1170} {"train_loss": -11.663826942443848, "global_step": 196621, "epoch": 1170} {"train_loss": -11.420509338378906, "global_step": 196622, "epoch": 1170} {"train_loss": -11.53338623046875, "global_step": 196623, "epoch": 1170} {"train_loss": -11.544599533081055, "global_step": 196624, "epoch": 1170} {"train_loss": -11.620809555053711, "global_step": 196625, "epoch": 1170} {"train_loss": -11.614017486572266, "global_step": 196626, "epoch": 1170} {"train_loss": -11.74620246887207, "global_step": 196627, "epoch": 1170} {"train_loss": -11.553726196289062, "global_step": 196628, "epoch": 1170} {"train_loss": -11.389432907104492, "global_step": 196629, "epoch": 1170} {"train_loss": -11.508926391601562, "global_step": 196630, "epoch": 1170} {"train_loss": -11.369888305664062, "global_step": 196631, "epoch": 1170} {"train_loss": -11.64837646484375, "global_step": 196632, "epoch": 1170} {"train_loss": -11.622344970703125, "global_step": 196633, "epoch": 1170} {"train_loss": -11.544092178344727, "global_step": 196634, "epoch": 1170} {"train_loss": -11.77231502532959, "global_step": 196635, "epoch": 1170} {"train_loss": -11.554601669311523, "global_step": 196636, "epoch": 1170} {"train_loss": -11.745343208312988, "global_step": 196637, "epoch": 1170} {"train_loss": -11.564029693603516, "global_step": 196638, "epoch": 1170} {"train_loss": -11.732616424560547, "global_step": 196639, "epoch": 1170} {"train_loss": -11.797809600830078, "global_step": 196640, "epoch": 1170} {"train_loss": -11.576499938964844, "global_step": 196641, "epoch": 1170} {"train_loss": -11.828413009643555, "global_step": 196642, "epoch": 1170} {"train_loss": -11.830913543701172, "global_step": 196643, "epoch": 1170} {"train_loss": -11.51608657836914, "global_step": 196644, "epoch": 1170} {"train_loss": -11.721994400024414, "global_step": 196645, "epoch": 1170} {"train_loss": -11.822661399841309, "global_step": 196646, "epoch": 1170} {"train_loss": -11.779092788696289, "global_step": 196647, "epoch": 1170} {"train_loss": -11.698311805725098, "global_step": 196648, "epoch": 1170} {"train_loss": -11.480104446411133, "global_step": 196649, "epoch": 1170} {"train_loss": -11.684248924255371, "global_step": 196650, "epoch": 1170} {"train_loss": -11.426345825195312, "global_step": 196651, "epoch": 1170} {"train_loss": -11.31429672241211, "global_step": 196652, "epoch": 1170} {"train_loss": -10.558292388916016, "global_step": 196653, "epoch": 1170} {"train_loss": -11.306772232055664, "global_step": 196654, "epoch": 1170} {"train_loss": -10.9852876663208, "global_step": 196655, "epoch": 1170} {"train_loss": -9.138994216918945, "global_step": 196656, "epoch": 1170} {"train_loss": -10.088362693786621, "global_step": 196657, "epoch": 1170} {"train_loss": -8.142267227172852, "global_step": 196658, "epoch": 1170} {"train_loss": -8.855765342712402, "global_step": 196659, "epoch": 1170} {"train_loss": -9.863216400146484, "global_step": 196660, "epoch": 1170} {"train_loss": -9.526541709899902, "global_step": 196661, "epoch": 1170} {"train_loss": -8.096724510192871, "global_step": 196662, "epoch": 1170} {"train_loss": -10.558843612670898, "global_step": 196663, "epoch": 1170} {"train_loss": -10.589422225952148, "global_step": 196664, "epoch": 1170} {"train_loss": -9.86527156829834, "global_step": 196665, "epoch": 1170} {"train_loss": -10.69943618774414, "global_step": 196666, "epoch": 1170} {"train_loss": -10.353429794311523, "global_step": 196667, "epoch": 1170} {"train_loss": -10.655858993530273, "global_step": 196668, "epoch": 1170} {"train_loss": -9.403944969177246, "global_step": 196669, "epoch": 1170} {"train_loss": -9.71469497680664, "global_step": 196670, "epoch": 1170} {"train_loss": -10.215402603149414, "global_step": 196671, "epoch": 1170} {"train_loss": -10.030179977416992, "global_step": 196672, "epoch": 1170} {"train_loss": -10.438544273376465, "global_step": 196673, "epoch": 1170} {"train_loss": -10.475154876708984, "global_step": 196674, "epoch": 1170} {"train_loss": -10.186715126037598, "global_step": 196675, "epoch": 1170} {"train_loss": -10.979049682617188, "global_step": 196676, "epoch": 1170} {"train_loss": -10.379425048828125, "global_step": 196677, "epoch": 1170} {"train_loss": -10.384161949157715, "global_step": 196678, "epoch": 1170} {"train_loss": -11.025792121887207, "global_step": 196679, "epoch": 1170} {"train_loss": -10.88951301574707, "global_step": 196680, "epoch": 1170} {"train_loss": -10.546711921691895, "global_step": 196681, "epoch": 1170} {"train_loss": -10.839255332946777, "global_step": 196682, "epoch": 1170} {"train_loss": -10.274791717529297, "global_step": 196683, "epoch": 1170} {"train_loss": -10.769994735717773, "global_step": 196684, "epoch": 1170} {"train_loss": -10.56574821472168, "global_step": 196685, "epoch": 1170} {"train_loss": -10.652828216552734, "global_step": 196686, "epoch": 1170} {"train_loss": -10.923566818237305, "global_step": 196687, "epoch": 1170} {"train_loss": -10.720499038696289, "global_step": 196688, "epoch": 1170} {"train_loss": -10.43901252746582, "global_step": 196689, "epoch": 1170} {"train_loss": -11.002134323120117, "global_step": 196690, "epoch": 1170} {"train_loss": -11.051895141601562, "global_step": 196691, "epoch": 1170} {"train_loss": -10.787782669067383, "global_step": 196692, "epoch": 1170} {"train_loss": -11.03392219543457, "global_step": 196693, "epoch": 1170} {"train_loss": -11.044649124145508, "global_step": 196694, "epoch": 1170} {"train_loss": -10.808221817016602, "global_step": 196695, "epoch": 1170} {"train_loss": -11.098387718200684, "global_step": 196696, "epoch": 1170} {"train_loss": -11.058530807495117, "global_step": 196697, "epoch": 1170} {"train_loss": -10.917086601257324, "global_step": 196698, "epoch": 1170} {"train_loss": -10.941054344177246, "global_step": 196699, "epoch": 1170} {"train_loss": -11.044953346252441, "global_step": 196700, "epoch": 1170} {"train_loss": -10.96589183807373, "global_step": 196701, "epoch": 1170} {"train_loss": -11.24638557434082, "global_step": 196702, "epoch": 1170} {"train_loss": -11.206904411315918, "global_step": 196703, "epoch": 1170} {"train_loss": -11.101801872253418, "global_step": 196704, "epoch": 1170} {"train_loss": -11.235642433166504, "global_step": 196705, "epoch": 1170} {"train_loss": -11.186300277709961, "global_step": 196706, "epoch": 1170} {"train_loss": -11.339071273803711, "global_step": 196707, "epoch": 1170} {"train_loss": -11.056900024414062, "global_step": 196708, "epoch": 1170} {"train_loss": -11.191173553466797, "global_step": 196709, "epoch": 1170} {"train_loss": -11.364240646362305, "global_step": 196710, "epoch": 1170} {"train_loss": -11.394881248474121, "global_step": 196711, "epoch": 1170} {"train_loss": -11.434558868408203, "global_step": 196712, "epoch": 1170} {"train_loss": -11.628644943237305, "global_step": 196713, "epoch": 1170} {"train_loss": -11.371524810791016, "global_step": 196714, "epoch": 1170} {"train_loss": -11.513423919677734, "global_step": 196715, "epoch": 1170} {"train_loss": -11.429098129272461, "global_step": 196716, "epoch": 1170} {"train_loss": -11.527297019958496, "global_step": 196717, "epoch": 1170} {"train_loss": -11.517578125, "global_step": 196718, "epoch": 1170} {"train_loss": -11.362800598144531, "global_step": 196719, "epoch": 1170} {"train_loss": -11.23619270324707, "global_step": 196720, "epoch": 1170} {"train_loss": -11.69955825805664, "global_step": 196721, "epoch": 1170} {"train_loss": -11.607179641723633, "global_step": 196722, "epoch": 1170} {"train_loss": -11.743268013000488, "global_step": 196723, "epoch": 1170} {"train_loss": -11.45539665222168, "global_step": 196724, "epoch": 1170} {"train_loss": -11.387835502624512, "global_step": 196725, "epoch": 1170} {"train_loss": -11.680917739868164, "global_step": 196726, "epoch": 1170} {"train_loss": -10.900428681146531, "global_step": 196727, "epoch": 1170, "val_loss": 243274.40625, "train_action_mse_error": 0.3387419581413269} {"train_loss": -11.414383888244629, "global_step": 196728, "epoch": 1171} {"train_loss": -11.585612297058105, "global_step": 196729, "epoch": 1171} {"train_loss": -11.427719116210938, "global_step": 196730, "epoch": 1171} {"train_loss": -11.529918670654297, "global_step": 196731, "epoch": 1171} {"train_loss": -11.616013526916504, "global_step": 196732, "epoch": 1171} {"train_loss": -11.445693016052246, "global_step": 196733, "epoch": 1171} {"train_loss": -11.555221557617188, "global_step": 196734, "epoch": 1171} {"train_loss": -11.586481094360352, "global_step": 196735, "epoch": 1171} {"train_loss": -11.542839050292969, "global_step": 196736, "epoch": 1171} {"train_loss": -11.774225234985352, "global_step": 196737, "epoch": 1171} {"train_loss": -11.508359909057617, "global_step": 196738, "epoch": 1171} {"train_loss": -11.08255672454834, "global_step": 196739, "epoch": 1171} {"train_loss": -11.474053382873535, "global_step": 196740, "epoch": 1171} {"train_loss": -11.304871559143066, "global_step": 196741, "epoch": 1171} {"train_loss": -11.780349731445312, "global_step": 196742, "epoch": 1171} {"train_loss": -11.355152130126953, "global_step": 196743, "epoch": 1171} {"train_loss": -11.526269912719727, "global_step": 196744, "epoch": 1171} {"train_loss": -11.523141860961914, "global_step": 196745, "epoch": 1171} {"train_loss": -11.254552841186523, "global_step": 196746, "epoch": 1171} {"train_loss": -11.78419017791748, "global_step": 196747, "epoch": 1171} {"train_loss": -11.155982971191406, "global_step": 196748, "epoch": 1171} {"train_loss": -11.344823837280273, "global_step": 196749, "epoch": 1171} {"train_loss": -11.484025955200195, "global_step": 196750, "epoch": 1171} {"train_loss": -11.289135932922363, "global_step": 196751, "epoch": 1171} {"train_loss": -11.390748977661133, "global_step": 196752, "epoch": 1171} {"train_loss": -10.48918342590332, "global_step": 196753, "epoch": 1171} {"train_loss": -11.543039321899414, "global_step": 196754, "epoch": 1171} {"train_loss": -11.026546478271484, "global_step": 196755, "epoch": 1171} {"train_loss": -10.891525268554688, "global_step": 196756, "epoch": 1171} {"train_loss": -10.898101806640625, "global_step": 196757, "epoch": 1171} {"train_loss": -11.556659698486328, "global_step": 196758, "epoch": 1171} {"train_loss": -10.797672271728516, "global_step": 196759, "epoch": 1171} {"train_loss": -11.091127395629883, "global_step": 196760, "epoch": 1171} {"train_loss": -11.223989486694336, "global_step": 196761, "epoch": 1171} {"train_loss": -11.36672592163086, "global_step": 196762, "epoch": 1171} {"train_loss": -10.67434024810791, "global_step": 196763, "epoch": 1171} {"train_loss": -11.278764724731445, "global_step": 196764, "epoch": 1171} {"train_loss": -11.030586242675781, "global_step": 196765, "epoch": 1171} {"train_loss": -10.70383071899414, "global_step": 196766, "epoch": 1171} {"train_loss": -11.3604097366333, "global_step": 196767, "epoch": 1171} {"train_loss": -11.020088195800781, "global_step": 196768, "epoch": 1171} {"train_loss": -11.256202697753906, "global_step": 196769, "epoch": 1171} {"train_loss": -11.175846099853516, "global_step": 196770, "epoch": 1171} {"train_loss": -11.056309700012207, "global_step": 196771, "epoch": 1171} {"train_loss": -10.65906810760498, "global_step": 196772, "epoch": 1171} {"train_loss": -11.643312454223633, "global_step": 196773, "epoch": 1171} {"train_loss": -11.141890525817871, "global_step": 196774, "epoch": 1171} {"train_loss": -11.386146545410156, "global_step": 196775, "epoch": 1171} {"train_loss": -11.304215431213379, "global_step": 196776, "epoch": 1171} {"train_loss": -11.285894393920898, "global_step": 196777, "epoch": 1171} {"train_loss": -11.450323104858398, "global_step": 196778, "epoch": 1171} {"train_loss": -11.29040241241455, "global_step": 196779, "epoch": 1171} {"train_loss": -11.212233543395996, "global_step": 196780, "epoch": 1171} {"train_loss": -11.253904342651367, "global_step": 196781, "epoch": 1171} {"train_loss": -11.068599700927734, "global_step": 196782, "epoch": 1171} {"train_loss": -11.547657012939453, "global_step": 196783, "epoch": 1171} {"train_loss": -10.882646560668945, "global_step": 196784, "epoch": 1171} {"train_loss": -11.494243621826172, "global_step": 196785, "epoch": 1171} {"train_loss": -11.056957244873047, "global_step": 196786, "epoch": 1171} {"train_loss": -11.470184326171875, "global_step": 196787, "epoch": 1171} {"train_loss": -11.170470237731934, "global_step": 196788, "epoch": 1171} {"train_loss": -10.735357284545898, "global_step": 196789, "epoch": 1171} {"train_loss": -11.173857688903809, "global_step": 196790, "epoch": 1171} {"train_loss": -10.839174270629883, "global_step": 196791, "epoch": 1171} {"train_loss": -11.53183364868164, "global_step": 196792, "epoch": 1171} {"train_loss": -11.109029769897461, "global_step": 196793, "epoch": 1171} {"train_loss": -11.179898262023926, "global_step": 196794, "epoch": 1171} {"train_loss": -10.8956880569458, "global_step": 196795, "epoch": 1171} {"train_loss": -11.28614616394043, "global_step": 196796, "epoch": 1171} {"train_loss": -10.905956268310547, "global_step": 196797, "epoch": 1171} {"train_loss": -10.729981422424316, "global_step": 196798, "epoch": 1171} {"train_loss": -11.2432861328125, "global_step": 196799, "epoch": 1171} {"train_loss": -10.617483139038086, "global_step": 196800, "epoch": 1171} {"train_loss": -11.307628631591797, "global_step": 196801, "epoch": 1171} {"train_loss": -11.2127685546875, "global_step": 196802, "epoch": 1171} {"train_loss": -11.271501541137695, "global_step": 196803, "epoch": 1171} {"train_loss": -10.731871604919434, "global_step": 196804, "epoch": 1171} {"train_loss": -10.93022346496582, "global_step": 196805, "epoch": 1171} {"train_loss": -11.241819381713867, "global_step": 196806, "epoch": 1171} {"train_loss": -10.762308120727539, "global_step": 196807, "epoch": 1171} {"train_loss": -11.127922058105469, "global_step": 196808, "epoch": 1171} {"train_loss": -11.170356750488281, "global_step": 196809, "epoch": 1171} {"train_loss": -11.191267013549805, "global_step": 196810, "epoch": 1171} {"train_loss": -11.280929565429688, "global_step": 196811, "epoch": 1171} {"train_loss": -11.174216270446777, "global_step": 196812, "epoch": 1171} {"train_loss": -11.243836402893066, "global_step": 196813, "epoch": 1171} {"train_loss": -11.159921646118164, "global_step": 196814, "epoch": 1171} {"train_loss": -11.246188163757324, "global_step": 196815, "epoch": 1171} {"train_loss": -11.306673049926758, "global_step": 196816, "epoch": 1171} {"train_loss": -11.082130432128906, "global_step": 196817, "epoch": 1171} {"train_loss": -11.658485412597656, "global_step": 196818, "epoch": 1171} {"train_loss": -11.082968711853027, "global_step": 196819, "epoch": 1171} {"train_loss": -11.476710319519043, "global_step": 196820, "epoch": 1171} {"train_loss": -11.128232955932617, "global_step": 196821, "epoch": 1171} {"train_loss": -11.449600219726562, "global_step": 196822, "epoch": 1171} {"train_loss": -11.615367889404297, "global_step": 196823, "epoch": 1171} {"train_loss": -11.390213012695312, "global_step": 196824, "epoch": 1171} {"train_loss": -11.667393684387207, "global_step": 196825, "epoch": 1171} {"train_loss": -11.540327072143555, "global_step": 196826, "epoch": 1171} {"train_loss": -11.590973854064941, "global_step": 196827, "epoch": 1171} {"train_loss": -11.45266342163086, "global_step": 196828, "epoch": 1171} {"train_loss": -11.658705711364746, "global_step": 196829, "epoch": 1171} {"train_loss": -11.507637023925781, "global_step": 196830, "epoch": 1171} {"train_loss": -11.738039016723633, "global_step": 196831, "epoch": 1171} {"train_loss": -11.648168563842773, "global_step": 196832, "epoch": 1171} {"train_loss": -11.55905532836914, "global_step": 196833, "epoch": 1171} {"train_loss": -11.669290542602539, "global_step": 196834, "epoch": 1171} {"train_loss": -11.634626388549805, "global_step": 196835, "epoch": 1171} {"train_loss": -11.576666831970215, "global_step": 196836, "epoch": 1171} {"train_loss": -11.47628402709961, "global_step": 196837, "epoch": 1171} {"train_loss": -11.259965896606445, "global_step": 196838, "epoch": 1171} {"train_loss": -11.304701805114746, "global_step": 196839, "epoch": 1171} {"train_loss": -11.228021621704102, "global_step": 196840, "epoch": 1171} {"train_loss": -11.484853744506836, "global_step": 196841, "epoch": 1171} {"train_loss": -11.349092483520508, "global_step": 196842, "epoch": 1171} {"train_loss": -11.241869926452637, "global_step": 196843, "epoch": 1171} {"train_loss": -11.41843032836914, "global_step": 196844, "epoch": 1171} {"train_loss": -11.779777526855469, "global_step": 196845, "epoch": 1171} {"train_loss": -11.41723918914795, "global_step": 196846, "epoch": 1171} {"train_loss": -11.472298622131348, "global_step": 196847, "epoch": 1171} {"train_loss": -11.77084732055664, "global_step": 196848, "epoch": 1171} {"train_loss": -11.392452239990234, "global_step": 196849, "epoch": 1171} {"train_loss": -11.648900032043457, "global_step": 196850, "epoch": 1171} {"train_loss": -11.504974365234375, "global_step": 196851, "epoch": 1171} {"train_loss": -11.540960311889648, "global_step": 196852, "epoch": 1171} {"train_loss": -11.492120742797852, "global_step": 196853, "epoch": 1171} {"train_loss": -11.631040573120117, "global_step": 196854, "epoch": 1171} {"train_loss": -11.567405700683594, "global_step": 196855, "epoch": 1171} {"train_loss": -11.861618041992188, "global_step": 196856, "epoch": 1171} {"train_loss": -11.574356079101562, "global_step": 196857, "epoch": 1171} {"train_loss": -11.55278205871582, "global_step": 196858, "epoch": 1171} {"train_loss": -11.550987243652344, "global_step": 196859, "epoch": 1171} {"train_loss": -11.577659606933594, "global_step": 196860, "epoch": 1171} {"train_loss": -11.344449996948242, "global_step": 196861, "epoch": 1171} {"train_loss": -11.492449760437012, "global_step": 196862, "epoch": 1171} {"train_loss": -11.279535293579102, "global_step": 196863, "epoch": 1171} {"train_loss": -11.170284271240234, "global_step": 196864, "epoch": 1171} {"train_loss": -10.96647834777832, "global_step": 196865, "epoch": 1171} {"train_loss": -11.157777786254883, "global_step": 196866, "epoch": 1171} {"train_loss": -10.064993858337402, "global_step": 196867, "epoch": 1171} {"train_loss": -10.951641082763672, "global_step": 196868, "epoch": 1171} {"train_loss": -10.918651580810547, "global_step": 196869, "epoch": 1171} {"train_loss": -11.124326705932617, "global_step": 196870, "epoch": 1171} {"train_loss": -11.235419273376465, "global_step": 196871, "epoch": 1171} {"train_loss": -11.09748649597168, "global_step": 196872, "epoch": 1171} {"train_loss": -10.720413208007812, "global_step": 196873, "epoch": 1171} {"train_loss": -11.116443634033203, "global_step": 196874, "epoch": 1171} {"train_loss": -10.872135162353516, "global_step": 196875, "epoch": 1171} {"train_loss": -11.170000076293945, "global_step": 196876, "epoch": 1171} {"train_loss": -11.15716552734375, "global_step": 196877, "epoch": 1171} {"train_loss": -10.87431812286377, "global_step": 196878, "epoch": 1171} {"train_loss": -11.390630722045898, "global_step": 196879, "epoch": 1171} {"train_loss": -10.754599571228027, "global_step": 196880, "epoch": 1171} {"train_loss": -11.018770217895508, "global_step": 196881, "epoch": 1171} {"train_loss": -11.093658447265625, "global_step": 196882, "epoch": 1171} {"train_loss": -11.0438232421875, "global_step": 196883, "epoch": 1171} {"train_loss": -10.183205604553223, "global_step": 196884, "epoch": 1171} {"train_loss": -11.492765426635742, "global_step": 196885, "epoch": 1171} {"train_loss": -10.339042663574219, "global_step": 196886, "epoch": 1171} {"train_loss": -10.910196304321289, "global_step": 196887, "epoch": 1171} {"train_loss": -11.385784149169922, "global_step": 196888, "epoch": 1171} {"train_loss": -10.942986488342285, "global_step": 196889, "epoch": 1171} {"train_loss": -11.329183578491211, "global_step": 196890, "epoch": 1171} {"train_loss": -10.7733154296875, "global_step": 196891, "epoch": 1171} {"train_loss": -10.646622657775879, "global_step": 196892, "epoch": 1171} {"train_loss": -11.46115493774414, "global_step": 196893, "epoch": 1171} {"train_loss": -11.10073471069336, "global_step": 196894, "epoch": 1171} {"train_loss": -11.256157012212844, "global_step": 196895, "epoch": 1171, "val_loss": 250042.328125} {"train_loss": -10.83633041381836, "global_step": 196896, "epoch": 1172} {"train_loss": -10.92757511138916, "global_step": 196897, "epoch": 1172} {"train_loss": -10.970097541809082, "global_step": 196898, "epoch": 1172} {"train_loss": -11.020988464355469, "global_step": 196899, "epoch": 1172} {"train_loss": -11.166462898254395, "global_step": 196900, "epoch": 1172} {"train_loss": -10.910343170166016, "global_step": 196901, "epoch": 1172} {"train_loss": -10.806633949279785, "global_step": 196902, "epoch": 1172} {"train_loss": -10.753070831298828, "global_step": 196903, "epoch": 1172} {"train_loss": -10.689888000488281, "global_step": 196904, "epoch": 1172} {"train_loss": -11.102276802062988, "global_step": 196905, "epoch": 1172} {"train_loss": -10.44926929473877, "global_step": 196906, "epoch": 1172} {"train_loss": -11.150738716125488, "global_step": 196907, "epoch": 1172} {"train_loss": -10.784820556640625, "global_step": 196908, "epoch": 1172} {"train_loss": -10.929636001586914, "global_step": 196909, "epoch": 1172} {"train_loss": -10.834182739257812, "global_step": 196910, "epoch": 1172} {"train_loss": -10.740983963012695, "global_step": 196911, "epoch": 1172} {"train_loss": -11.099076271057129, "global_step": 196912, "epoch": 1172} {"train_loss": -11.000747680664062, "global_step": 196913, "epoch": 1172} {"train_loss": -10.852846145629883, "global_step": 196914, "epoch": 1172} {"train_loss": -11.08450698852539, "global_step": 196915, "epoch": 1172} {"train_loss": -10.88906478881836, "global_step": 196916, "epoch": 1172} {"train_loss": -10.99323844909668, "global_step": 196917, "epoch": 1172} {"train_loss": -11.085357666015625, "global_step": 196918, "epoch": 1172} {"train_loss": -11.032087326049805, "global_step": 196919, "epoch": 1172} {"train_loss": -11.188946723937988, "global_step": 196920, "epoch": 1172} {"train_loss": -11.297624588012695, "global_step": 196921, "epoch": 1172} {"train_loss": -11.111846923828125, "global_step": 196922, "epoch": 1172} {"train_loss": -11.138702392578125, "global_step": 196923, "epoch": 1172} {"train_loss": -11.251262664794922, "global_step": 196924, "epoch": 1172} {"train_loss": -11.304064750671387, "global_step": 196925, "epoch": 1172} {"train_loss": -11.353982925415039, "global_step": 196926, "epoch": 1172} {"train_loss": -11.19482421875, "global_step": 196927, "epoch": 1172} {"train_loss": -11.560937881469727, "global_step": 196928, "epoch": 1172} {"train_loss": -11.56273365020752, "global_step": 196929, "epoch": 1172} {"train_loss": -11.455833435058594, "global_step": 196930, "epoch": 1172} {"train_loss": -11.623867988586426, "global_step": 196931, "epoch": 1172} {"train_loss": -11.394622802734375, "global_step": 196932, "epoch": 1172} {"train_loss": -11.238350868225098, "global_step": 196933, "epoch": 1172} {"train_loss": -11.629623413085938, "global_step": 196934, "epoch": 1172} {"train_loss": -11.556375503540039, "global_step": 196935, "epoch": 1172} {"train_loss": -11.46473503112793, "global_step": 196936, "epoch": 1172} {"train_loss": -11.697821617126465, "global_step": 196937, "epoch": 1172} {"train_loss": -11.507198333740234, "global_step": 196938, "epoch": 1172} {"train_loss": -11.598987579345703, "global_step": 196939, "epoch": 1172} {"train_loss": -11.74029541015625, "global_step": 196940, "epoch": 1172} {"train_loss": -11.708148002624512, "global_step": 196941, "epoch": 1172} {"train_loss": -11.480140686035156, "global_step": 196942, "epoch": 1172} {"train_loss": -11.575889587402344, "global_step": 196943, "epoch": 1172} {"train_loss": -11.59542465209961, "global_step": 196944, "epoch": 1172} {"train_loss": -11.230024337768555, "global_step": 196945, "epoch": 1172} {"train_loss": -11.60818862915039, "global_step": 196946, "epoch": 1172} {"train_loss": -11.324302673339844, "global_step": 196947, "epoch": 1172} {"train_loss": -11.28721809387207, "global_step": 196948, "epoch": 1172} {"train_loss": -11.751654624938965, "global_step": 196949, "epoch": 1172} {"train_loss": -11.176034927368164, "global_step": 196950, "epoch": 1172} {"train_loss": -11.212810516357422, "global_step": 196951, "epoch": 1172} {"train_loss": -11.63338851928711, "global_step": 196952, "epoch": 1172} {"train_loss": -11.245477676391602, "global_step": 196953, "epoch": 1172} {"train_loss": -11.657991409301758, "global_step": 196954, "epoch": 1172} {"train_loss": -11.515320777893066, "global_step": 196955, "epoch": 1172} {"train_loss": -11.635451316833496, "global_step": 196956, "epoch": 1172} {"train_loss": -11.657560348510742, "global_step": 196957, "epoch": 1172} {"train_loss": -11.849747657775879, "global_step": 196958, "epoch": 1172} {"train_loss": -11.491046905517578, "global_step": 196959, "epoch": 1172} {"train_loss": -11.569084167480469, "global_step": 196960, "epoch": 1172} {"train_loss": -11.529470443725586, "global_step": 196961, "epoch": 1172} {"train_loss": -11.730920791625977, "global_step": 196962, "epoch": 1172} {"train_loss": -11.608525276184082, "global_step": 196963, "epoch": 1172} {"train_loss": -11.388885498046875, "global_step": 196964, "epoch": 1172} {"train_loss": -11.57158088684082, "global_step": 196965, "epoch": 1172} {"train_loss": -11.636289596557617, "global_step": 196966, "epoch": 1172} {"train_loss": -11.401352882385254, "global_step": 196967, "epoch": 1172} {"train_loss": -11.414799690246582, "global_step": 196968, "epoch": 1172} {"train_loss": -11.39866828918457, "global_step": 196969, "epoch": 1172} {"train_loss": -11.407405853271484, "global_step": 196970, "epoch": 1172} {"train_loss": -11.137592315673828, "global_step": 196971, "epoch": 1172} {"train_loss": -11.123013496398926, "global_step": 196972, "epoch": 1172} {"train_loss": -11.365070343017578, "global_step": 196973, "epoch": 1172} {"train_loss": -10.531095504760742, "global_step": 196974, "epoch": 1172} {"train_loss": -11.394754409790039, "global_step": 196975, "epoch": 1172} {"train_loss": -10.76860523223877, "global_step": 196976, "epoch": 1172} {"train_loss": -10.937854766845703, "global_step": 196977, "epoch": 1172} {"train_loss": -11.38408088684082, "global_step": 196978, "epoch": 1172} {"train_loss": -10.55343246459961, "global_step": 196979, "epoch": 1172} {"train_loss": -11.10584545135498, "global_step": 196980, "epoch": 1172} {"train_loss": -10.96040153503418, "global_step": 196981, "epoch": 1172} {"train_loss": -10.198297500610352, "global_step": 196982, "epoch": 1172} {"train_loss": -10.732707023620605, "global_step": 196983, "epoch": 1172} {"train_loss": -9.686359405517578, "global_step": 196984, "epoch": 1172} {"train_loss": -10.637259483337402, "global_step": 196985, "epoch": 1172} {"train_loss": -10.544801712036133, "global_step": 196986, "epoch": 1172} {"train_loss": -10.384631156921387, "global_step": 196987, "epoch": 1172} {"train_loss": -10.891267776489258, "global_step": 196988, "epoch": 1172} {"train_loss": -9.364461898803711, "global_step": 196989, "epoch": 1172} {"train_loss": -11.369571685791016, "global_step": 196990, "epoch": 1172} {"train_loss": -10.683622360229492, "global_step": 196991, "epoch": 1172} {"train_loss": -10.525522232055664, "global_step": 196992, "epoch": 1172} {"train_loss": -10.987493515014648, "global_step": 196993, "epoch": 1172} {"train_loss": -9.963168144226074, "global_step": 196994, "epoch": 1172} {"train_loss": -10.547811508178711, "global_step": 196995, "epoch": 1172} {"train_loss": -10.76146411895752, "global_step": 196996, "epoch": 1172} {"train_loss": -9.985404968261719, "global_step": 196997, "epoch": 1172} {"train_loss": -11.293139457702637, "global_step": 196998, "epoch": 1172} {"train_loss": -9.998146057128906, "global_step": 196999, "epoch": 1172} {"train_loss": -10.612350463867188, "global_step": 197000, "epoch": 1172} {"train_loss": -10.81306266784668, "global_step": 197001, "epoch": 1172} {"train_loss": -10.402270317077637, "global_step": 197002, "epoch": 1172} {"train_loss": -10.874290466308594, "global_step": 197003, "epoch": 1172} {"train_loss": -10.829022407531738, "global_step": 197004, "epoch": 1172} {"train_loss": -10.758819580078125, "global_step": 197005, "epoch": 1172} {"train_loss": -10.99677848815918, "global_step": 197006, "epoch": 1172} {"train_loss": -10.86086368560791, "global_step": 197007, "epoch": 1172} {"train_loss": -10.98659610748291, "global_step": 197008, "epoch": 1172} {"train_loss": -10.474451065063477, "global_step": 197009, "epoch": 1172} {"train_loss": -10.878377914428711, "global_step": 197010, "epoch": 1172} {"train_loss": -11.051126480102539, "global_step": 197011, "epoch": 1172} {"train_loss": -10.893840789794922, "global_step": 197012, "epoch": 1172} {"train_loss": -11.054487228393555, "global_step": 197013, "epoch": 1172} {"train_loss": -10.788947105407715, "global_step": 197014, "epoch": 1172} {"train_loss": -11.092081069946289, "global_step": 197015, "epoch": 1172} {"train_loss": -10.773072242736816, "global_step": 197016, "epoch": 1172} {"train_loss": -10.700984954833984, "global_step": 197017, "epoch": 1172} {"train_loss": -11.015237808227539, "global_step": 197018, "epoch": 1172} {"train_loss": -10.936334609985352, "global_step": 197019, "epoch": 1172} {"train_loss": -11.151721954345703, "global_step": 197020, "epoch": 1172} {"train_loss": -11.23439884185791, "global_step": 197021, "epoch": 1172} {"train_loss": -10.592254638671875, "global_step": 197022, "epoch": 1172} {"train_loss": -11.33828353881836, "global_step": 197023, "epoch": 1172} {"train_loss": -10.994324684143066, "global_step": 197024, "epoch": 1172} {"train_loss": -11.071693420410156, "global_step": 197025, "epoch": 1172} {"train_loss": -11.10426139831543, "global_step": 197026, "epoch": 1172} {"train_loss": -11.116482734680176, "global_step": 197027, "epoch": 1172} {"train_loss": -11.011390686035156, "global_step": 197028, "epoch": 1172} {"train_loss": -11.319833755493164, "global_step": 197029, "epoch": 1172} {"train_loss": -11.249372482299805, "global_step": 197030, "epoch": 1172} {"train_loss": -11.465970993041992, "global_step": 197031, "epoch": 1172} {"train_loss": -11.03994369506836, "global_step": 197032, "epoch": 1172} {"train_loss": -11.152950286865234, "global_step": 197033, "epoch": 1172} {"train_loss": -11.276142120361328, "global_step": 197034, "epoch": 1172} {"train_loss": -11.111763000488281, "global_step": 197035, "epoch": 1172} {"train_loss": -11.347087860107422, "global_step": 197036, "epoch": 1172} {"train_loss": -10.701469421386719, "global_step": 197037, "epoch": 1172} {"train_loss": -11.382772445678711, "global_step": 197038, "epoch": 1172} {"train_loss": -11.32909107208252, "global_step": 197039, "epoch": 1172} {"train_loss": -11.307193756103516, "global_step": 197040, "epoch": 1172} {"train_loss": -11.318343162536621, "global_step": 197041, "epoch": 1172} {"train_loss": -11.461065292358398, "global_step": 197042, "epoch": 1172} {"train_loss": -11.349985122680664, "global_step": 197043, "epoch": 1172} {"train_loss": -11.565625190734863, "global_step": 197044, "epoch": 1172} {"train_loss": -11.172394752502441, "global_step": 197045, "epoch": 1172} {"train_loss": -11.505375862121582, "global_step": 197046, "epoch": 1172} {"train_loss": -11.39736557006836, "global_step": 197047, "epoch": 1172} {"train_loss": -11.531938552856445, "global_step": 197048, "epoch": 1172} {"train_loss": -11.446228981018066, "global_step": 197049, "epoch": 1172} {"train_loss": -11.547496795654297, "global_step": 197050, "epoch": 1172} {"train_loss": -11.22599983215332, "global_step": 197051, "epoch": 1172} {"train_loss": -11.455509185791016, "global_step": 197052, "epoch": 1172} {"train_loss": -11.270620346069336, "global_step": 197053, "epoch": 1172} {"train_loss": -11.608954429626465, "global_step": 197054, "epoch": 1172} {"train_loss": -11.666057586669922, "global_step": 197055, "epoch": 1172} {"train_loss": -11.550787925720215, "global_step": 197056, "epoch": 1172} {"train_loss": -11.472883224487305, "global_step": 197057, "epoch": 1172} {"train_loss": -11.495707511901855, "global_step": 197058, "epoch": 1172} {"train_loss": -11.465462684631348, "global_step": 197059, "epoch": 1172} {"train_loss": -11.457233428955078, "global_step": 197060, "epoch": 1172} {"train_loss": -11.387405395507812, "global_step": 197061, "epoch": 1172} {"train_loss": -11.609057426452637, "global_step": 197062, "epoch": 1172} {"train_loss": -11.140252771831694, "global_step": 197063, "epoch": 1172, "val_loss": 252429.484375} {"train_loss": -11.533801078796387, "global_step": 197064, "epoch": 1173} {"train_loss": -11.405342102050781, "global_step": 197065, "epoch": 1173} {"train_loss": -11.66653060913086, "global_step": 197066, "epoch": 1173} {"train_loss": -11.654544830322266, "global_step": 197067, "epoch": 1173} {"train_loss": -11.481209754943848, "global_step": 197068, "epoch": 1173} {"train_loss": -11.584025382995605, "global_step": 197069, "epoch": 1173} {"train_loss": -11.321081161499023, "global_step": 197070, "epoch": 1173} {"train_loss": -11.360302925109863, "global_step": 197071, "epoch": 1173} {"train_loss": -11.607099533081055, "global_step": 197072, "epoch": 1173} {"train_loss": -11.265111923217773, "global_step": 197073, "epoch": 1173} {"train_loss": -11.711446762084961, "global_step": 197074, "epoch": 1173} {"train_loss": -11.252228736877441, "global_step": 197075, "epoch": 1173} {"train_loss": -11.503665924072266, "global_step": 197076, "epoch": 1173} {"train_loss": -11.437500953674316, "global_step": 197077, "epoch": 1173} {"train_loss": -11.297099113464355, "global_step": 197078, "epoch": 1173} {"train_loss": -11.569053649902344, "global_step": 197079, "epoch": 1173} {"train_loss": -11.456793785095215, "global_step": 197080, "epoch": 1173} {"train_loss": -11.485982894897461, "global_step": 197081, "epoch": 1173} {"train_loss": -11.305109024047852, "global_step": 197082, "epoch": 1173} {"train_loss": -11.492725372314453, "global_step": 197083, "epoch": 1173} {"train_loss": -11.288883209228516, "global_step": 197084, "epoch": 1173} {"train_loss": -11.847835540771484, "global_step": 197085, "epoch": 1173} {"train_loss": -11.352583885192871, "global_step": 197086, "epoch": 1173} {"train_loss": -11.514188766479492, "global_step": 197087, "epoch": 1173} {"train_loss": -11.580692291259766, "global_step": 197088, "epoch": 1173} {"train_loss": -11.049410820007324, "global_step": 197089, "epoch": 1173} {"train_loss": -11.334527969360352, "global_step": 197090, "epoch": 1173} {"train_loss": -11.671503067016602, "global_step": 197091, "epoch": 1173} {"train_loss": -11.258552551269531, "global_step": 197092, "epoch": 1173} {"train_loss": -11.909811019897461, "global_step": 197093, "epoch": 1173} {"train_loss": -11.62259578704834, "global_step": 197094, "epoch": 1173} {"train_loss": -11.59713077545166, "global_step": 197095, "epoch": 1173} {"train_loss": -11.664417266845703, "global_step": 197096, "epoch": 1173} {"train_loss": -11.37977409362793, "global_step": 197097, "epoch": 1173} {"train_loss": -11.487730026245117, "global_step": 197098, "epoch": 1173} {"train_loss": -11.59731674194336, "global_step": 197099, "epoch": 1173} {"train_loss": -11.429807662963867, "global_step": 197100, "epoch": 1173} {"train_loss": -11.164403915405273, "global_step": 197101, "epoch": 1173} {"train_loss": -11.792058944702148, "global_step": 197102, "epoch": 1173} {"train_loss": -11.034194946289062, "global_step": 197103, "epoch": 1173} {"train_loss": -10.205917358398438, "global_step": 197104, "epoch": 1173} {"train_loss": -10.982227325439453, "global_step": 197105, "epoch": 1173} {"train_loss": -10.762421607971191, "global_step": 197106, "epoch": 1173} {"train_loss": -11.496360778808594, "global_step": 197107, "epoch": 1173} {"train_loss": -11.49747085571289, "global_step": 197108, "epoch": 1173} {"train_loss": -11.124059677124023, "global_step": 197109, "epoch": 1173} {"train_loss": -11.285626411437988, "global_step": 197110, "epoch": 1173} {"train_loss": -11.249802589416504, "global_step": 197111, "epoch": 1173} {"train_loss": -11.50206184387207, "global_step": 197112, "epoch": 1173} {"train_loss": -11.017129898071289, "global_step": 197113, "epoch": 1173} {"train_loss": -10.97956371307373, "global_step": 197114, "epoch": 1173} {"train_loss": -11.485135078430176, "global_step": 197115, "epoch": 1173} {"train_loss": -11.24915885925293, "global_step": 197116, "epoch": 1173} {"train_loss": -11.221185684204102, "global_step": 197117, "epoch": 1173} {"train_loss": -11.427754402160645, "global_step": 197118, "epoch": 1173} {"train_loss": -11.258563995361328, "global_step": 197119, "epoch": 1173} {"train_loss": -11.207969665527344, "global_step": 197120, "epoch": 1173} {"train_loss": -11.450328826904297, "global_step": 197121, "epoch": 1173} {"train_loss": -11.386752128601074, "global_step": 197122, "epoch": 1173} {"train_loss": -11.459815979003906, "global_step": 197123, "epoch": 1173} {"train_loss": -11.442357063293457, "global_step": 197124, "epoch": 1173} {"train_loss": -11.311321258544922, "global_step": 197125, "epoch": 1173} {"train_loss": -10.953910827636719, "global_step": 197126, "epoch": 1173} {"train_loss": -11.573153495788574, "global_step": 197127, "epoch": 1173} {"train_loss": -11.196183204650879, "global_step": 197128, "epoch": 1173} {"train_loss": -11.161800384521484, "global_step": 197129, "epoch": 1173} {"train_loss": -11.218525886535645, "global_step": 197130, "epoch": 1173} {"train_loss": -11.64401912689209, "global_step": 197131, "epoch": 1173} {"train_loss": -11.558001518249512, "global_step": 197132, "epoch": 1173} {"train_loss": -11.609492301940918, "global_step": 197133, "epoch": 1173} {"train_loss": -11.796928405761719, "global_step": 197134, "epoch": 1173} {"train_loss": -11.545244216918945, "global_step": 197135, "epoch": 1173} {"train_loss": -11.699213981628418, "global_step": 197136, "epoch": 1173} {"train_loss": -11.141496658325195, "global_step": 197137, "epoch": 1173} {"train_loss": -11.62368392944336, "global_step": 197138, "epoch": 1173} {"train_loss": -11.682443618774414, "global_step": 197139, "epoch": 1173} {"train_loss": -11.50127124786377, "global_step": 197140, "epoch": 1173} {"train_loss": -11.624513626098633, "global_step": 197141, "epoch": 1173} {"train_loss": -11.475709915161133, "global_step": 197142, "epoch": 1173} {"train_loss": -11.418810844421387, "global_step": 197143, "epoch": 1173} {"train_loss": -11.603963851928711, "global_step": 197144, "epoch": 1173} {"train_loss": -11.033380508422852, "global_step": 197145, "epoch": 1173} {"train_loss": -11.01409912109375, "global_step": 197146, "epoch": 1173} {"train_loss": -11.145679473876953, "global_step": 197147, "epoch": 1173} {"train_loss": -11.370697021484375, "global_step": 197148, "epoch": 1173} {"train_loss": -11.433459281921387, "global_step": 197149, "epoch": 1173} {"train_loss": -11.242612838745117, "global_step": 197150, "epoch": 1173} {"train_loss": -11.639884948730469, "global_step": 197151, "epoch": 1173} {"train_loss": -11.305986404418945, "global_step": 197152, "epoch": 1173} {"train_loss": -10.868108749389648, "global_step": 197153, "epoch": 1173} {"train_loss": -11.544079780578613, "global_step": 197154, "epoch": 1173} {"train_loss": -10.817434310913086, "global_step": 197155, "epoch": 1173} {"train_loss": -11.449716567993164, "global_step": 197156, "epoch": 1173} {"train_loss": -10.62837028503418, "global_step": 197157, "epoch": 1173} {"train_loss": -11.475013732910156, "global_step": 197158, "epoch": 1173} {"train_loss": -11.037656784057617, "global_step": 197159, "epoch": 1173} {"train_loss": -10.800567626953125, "global_step": 197160, "epoch": 1173} {"train_loss": -11.63221549987793, "global_step": 197161, "epoch": 1173} {"train_loss": -10.559657096862793, "global_step": 197162, "epoch": 1173} {"train_loss": -10.864858627319336, "global_step": 197163, "epoch": 1173} {"train_loss": -10.733194351196289, "global_step": 197164, "epoch": 1173} {"train_loss": -9.487306594848633, "global_step": 197165, "epoch": 1173} {"train_loss": -10.417787551879883, "global_step": 197166, "epoch": 1173} {"train_loss": -8.84935188293457, "global_step": 197167, "epoch": 1173} {"train_loss": -9.894855499267578, "global_step": 197168, "epoch": 1173} {"train_loss": -9.312110900878906, "global_step": 197169, "epoch": 1173} {"train_loss": -10.681441307067871, "global_step": 197170, "epoch": 1173} {"train_loss": -9.94528865814209, "global_step": 197171, "epoch": 1173} {"train_loss": -10.03945541381836, "global_step": 197172, "epoch": 1173} {"train_loss": -10.744996070861816, "global_step": 197173, "epoch": 1173} {"train_loss": -11.126703262329102, "global_step": 197174, "epoch": 1173} {"train_loss": -11.00312614440918, "global_step": 197175, "epoch": 1173} {"train_loss": -11.282052993774414, "global_step": 197176, "epoch": 1173} {"train_loss": -11.272218704223633, "global_step": 197177, "epoch": 1173} {"train_loss": -11.054903030395508, "global_step": 197178, "epoch": 1173} {"train_loss": -11.426780700683594, "global_step": 197179, "epoch": 1173} {"train_loss": -11.248306274414062, "global_step": 197180, "epoch": 1173} {"train_loss": -11.27464771270752, "global_step": 197181, "epoch": 1173} {"train_loss": -11.412651062011719, "global_step": 197182, "epoch": 1173} {"train_loss": -11.314346313476562, "global_step": 197183, "epoch": 1173} {"train_loss": -11.126541137695312, "global_step": 197184, "epoch": 1173} {"train_loss": -11.223042488098145, "global_step": 197185, "epoch": 1173} {"train_loss": -11.426467895507812, "global_step": 197186, "epoch": 1173} {"train_loss": -11.353582382202148, "global_step": 197187, "epoch": 1173} {"train_loss": -11.27523422241211, "global_step": 197188, "epoch": 1173} {"train_loss": -11.748611450195312, "global_step": 197189, "epoch": 1173} {"train_loss": -11.2921142578125, "global_step": 197190, "epoch": 1173} {"train_loss": -11.23664665222168, "global_step": 197191, "epoch": 1173} {"train_loss": -11.515870094299316, "global_step": 197192, "epoch": 1173} {"train_loss": -11.586996078491211, "global_step": 197193, "epoch": 1173} {"train_loss": -11.746772766113281, "global_step": 197194, "epoch": 1173} {"train_loss": -11.577709197998047, "global_step": 197195, "epoch": 1173} {"train_loss": -11.578256607055664, "global_step": 197196, "epoch": 1173} {"train_loss": -11.529831886291504, "global_step": 197197, "epoch": 1173} {"train_loss": -11.592987060546875, "global_step": 197198, "epoch": 1173} {"train_loss": -11.654808044433594, "global_step": 197199, "epoch": 1173} {"train_loss": -11.516563415527344, "global_step": 197200, "epoch": 1173} {"train_loss": -11.379514694213867, "global_step": 197201, "epoch": 1173} {"train_loss": -11.538959503173828, "global_step": 197202, "epoch": 1173} {"train_loss": -11.665689468383789, "global_step": 197203, "epoch": 1173} {"train_loss": -11.702421188354492, "global_step": 197204, "epoch": 1173} {"train_loss": -11.558316230773926, "global_step": 197205, "epoch": 1173} {"train_loss": -11.417024612426758, "global_step": 197206, "epoch": 1173} {"train_loss": -11.548812866210938, "global_step": 197207, "epoch": 1173} {"train_loss": -10.938901901245117, "global_step": 197208, "epoch": 1173} {"train_loss": -11.189515113830566, "global_step": 197209, "epoch": 1173} {"train_loss": -11.633611679077148, "global_step": 197210, "epoch": 1173} {"train_loss": -11.143956184387207, "global_step": 197211, "epoch": 1173} {"train_loss": -11.456951141357422, "global_step": 197212, "epoch": 1173} {"train_loss": -10.94892692565918, "global_step": 197213, "epoch": 1173} {"train_loss": -11.327285766601562, "global_step": 197214, "epoch": 1173} {"train_loss": -11.631587982177734, "global_step": 197215, "epoch": 1173} {"train_loss": -11.252345085144043, "global_step": 197216, "epoch": 1173} {"train_loss": -11.508581161499023, "global_step": 197217, "epoch": 1173} {"train_loss": -11.65774917602539, "global_step": 197218, "epoch": 1173} {"train_loss": -11.490103721618652, "global_step": 197219, "epoch": 1173} {"train_loss": -11.75007438659668, "global_step": 197220, "epoch": 1173} {"train_loss": -11.548140525817871, "global_step": 197221, "epoch": 1173} {"train_loss": -11.505765914916992, "global_step": 197222, "epoch": 1173} {"train_loss": -11.714553833007812, "global_step": 197223, "epoch": 1173} {"train_loss": -11.55795955657959, "global_step": 197224, "epoch": 1173} {"train_loss": -11.586222648620605, "global_step": 197225, "epoch": 1173} {"train_loss": -11.70870590209961, "global_step": 197226, "epoch": 1173} {"train_loss": -11.452624320983887, "global_step": 197227, "epoch": 1173} {"train_loss": -11.641407012939453, "global_step": 197228, "epoch": 1173} {"train_loss": -11.450039863586426, "global_step": 197229, "epoch": 1173} {"train_loss": -11.401065826416016, "global_step": 197230, "epoch": 1173} {"train_loss": -11.301376178151084, "global_step": 197231, "epoch": 1173, "val_loss": 250318.96875} {"train_loss": -11.821763038635254, "global_step": 197232, "epoch": 1174} {"train_loss": -11.03303337097168, "global_step": 197233, "epoch": 1174} {"train_loss": -11.6563720703125, "global_step": 197234, "epoch": 1174} {"train_loss": -11.383094787597656, "global_step": 197235, "epoch": 1174} {"train_loss": -11.679740905761719, "global_step": 197236, "epoch": 1174} {"train_loss": -11.135139465332031, "global_step": 197237, "epoch": 1174} {"train_loss": -10.88166618347168, "global_step": 197238, "epoch": 1174} {"train_loss": -11.694258689880371, "global_step": 197239, "epoch": 1174} {"train_loss": -10.992101669311523, "global_step": 197240, "epoch": 1174} {"train_loss": -11.056605339050293, "global_step": 197241, "epoch": 1174} {"train_loss": -11.549116134643555, "global_step": 197242, "epoch": 1174} {"train_loss": -11.348382949829102, "global_step": 197243, "epoch": 1174} {"train_loss": -10.747390747070312, "global_step": 197244, "epoch": 1174} {"train_loss": -10.802549362182617, "global_step": 197245, "epoch": 1174} {"train_loss": -11.463781356811523, "global_step": 197246, "epoch": 1174} {"train_loss": -11.175857543945312, "global_step": 197247, "epoch": 1174} {"train_loss": -11.368340492248535, "global_step": 197248, "epoch": 1174} {"train_loss": -11.30129623413086, "global_step": 197249, "epoch": 1174} {"train_loss": -11.096834182739258, "global_step": 197250, "epoch": 1174} {"train_loss": -11.53355598449707, "global_step": 197251, "epoch": 1174} {"train_loss": -11.365766525268555, "global_step": 197252, "epoch": 1174} {"train_loss": -11.413040161132812, "global_step": 197253, "epoch": 1174} {"train_loss": -11.523128509521484, "global_step": 197254, "epoch": 1174} {"train_loss": -11.43064022064209, "global_step": 197255, "epoch": 1174} {"train_loss": -11.454536437988281, "global_step": 197256, "epoch": 1174} {"train_loss": -10.909465789794922, "global_step": 197257, "epoch": 1174} {"train_loss": -11.332096099853516, "global_step": 197258, "epoch": 1174} {"train_loss": -11.51154613494873, "global_step": 197259, "epoch": 1174} {"train_loss": -11.483642578125, "global_step": 197260, "epoch": 1174} {"train_loss": -11.085102081298828, "global_step": 197261, "epoch": 1174} {"train_loss": -11.093049049377441, "global_step": 197262, "epoch": 1174} {"train_loss": -10.559038162231445, "global_step": 197263, "epoch": 1174} {"train_loss": -11.036617279052734, "global_step": 197264, "epoch": 1174} {"train_loss": -10.982892990112305, "global_step": 197265, "epoch": 1174} {"train_loss": -11.153406143188477, "global_step": 197266, "epoch": 1174} {"train_loss": -10.371604919433594, "global_step": 197267, "epoch": 1174} {"train_loss": -11.489110946655273, "global_step": 197268, "epoch": 1174} {"train_loss": -10.479676246643066, "global_step": 197269, "epoch": 1174} {"train_loss": -11.335088729858398, "global_step": 197270, "epoch": 1174} {"train_loss": -10.682941436767578, "global_step": 197271, "epoch": 1174} {"train_loss": -11.07279109954834, "global_step": 197272, "epoch": 1174} {"train_loss": -11.081825256347656, "global_step": 197273, "epoch": 1174} {"train_loss": -11.219064712524414, "global_step": 197274, "epoch": 1174} {"train_loss": -11.160982131958008, "global_step": 197275, "epoch": 1174} {"train_loss": -10.883316040039062, "global_step": 197276, "epoch": 1174} {"train_loss": -11.462864875793457, "global_step": 197277, "epoch": 1174} {"train_loss": -11.052253723144531, "global_step": 197278, "epoch": 1174} {"train_loss": -11.488958358764648, "global_step": 197279, "epoch": 1174} {"train_loss": -11.534624099731445, "global_step": 197280, "epoch": 1174} {"train_loss": -10.974823951721191, "global_step": 197281, "epoch": 1174} {"train_loss": -11.562390327453613, "global_step": 197282, "epoch": 1174} {"train_loss": -10.845714569091797, "global_step": 197283, "epoch": 1174} {"train_loss": -11.274168968200684, "global_step": 197284, "epoch": 1174} {"train_loss": -10.896193504333496, "global_step": 197285, "epoch": 1174} {"train_loss": -11.243927001953125, "global_step": 197286, "epoch": 1174} {"train_loss": -10.934374809265137, "global_step": 197287, "epoch": 1174} {"train_loss": -11.321313858032227, "global_step": 197288, "epoch": 1174} {"train_loss": -11.177164077758789, "global_step": 197289, "epoch": 1174} {"train_loss": -10.686149597167969, "global_step": 197290, "epoch": 1174} {"train_loss": -11.382173538208008, "global_step": 197291, "epoch": 1174} {"train_loss": -10.83734130859375, "global_step": 197292, "epoch": 1174} {"train_loss": -10.839427947998047, "global_step": 197293, "epoch": 1174} {"train_loss": -11.093809127807617, "global_step": 197294, "epoch": 1174} {"train_loss": -10.662353515625, "global_step": 197295, "epoch": 1174} {"train_loss": -10.342470169067383, "global_step": 197296, "epoch": 1174} {"train_loss": -9.658149719238281, "global_step": 197297, "epoch": 1174} {"train_loss": -10.385892868041992, "global_step": 197298, "epoch": 1174} {"train_loss": -9.685134887695312, "global_step": 197299, "epoch": 1174} {"train_loss": -10.875441551208496, "global_step": 197300, "epoch": 1174} {"train_loss": -9.703646659851074, "global_step": 197301, "epoch": 1174} {"train_loss": -10.411066055297852, "global_step": 197302, "epoch": 1174} {"train_loss": -10.140901565551758, "global_step": 197303, "epoch": 1174} {"train_loss": -10.123933792114258, "global_step": 197304, "epoch": 1174} {"train_loss": -10.295160293579102, "global_step": 197305, "epoch": 1174} {"train_loss": -10.394075393676758, "global_step": 197306, "epoch": 1174} {"train_loss": -9.816080093383789, "global_step": 197307, "epoch": 1174} {"train_loss": -11.204275131225586, "global_step": 197308, "epoch": 1174} {"train_loss": -10.151458740234375, "global_step": 197309, "epoch": 1174} {"train_loss": -10.543764114379883, "global_step": 197310, "epoch": 1174} {"train_loss": -10.695208549499512, "global_step": 197311, "epoch": 1174} {"train_loss": -10.19288444519043, "global_step": 197312, "epoch": 1174} {"train_loss": -10.557497024536133, "global_step": 197313, "epoch": 1174} {"train_loss": -10.993218421936035, "global_step": 197314, "epoch": 1174} {"train_loss": -10.450423240661621, "global_step": 197315, "epoch": 1174} {"train_loss": -11.163764953613281, "global_step": 197316, "epoch": 1174} {"train_loss": -11.270788192749023, "global_step": 197317, "epoch": 1174} {"train_loss": -10.357453346252441, "global_step": 197318, "epoch": 1174} {"train_loss": -11.174171447753906, "global_step": 197319, "epoch": 1174} {"train_loss": -10.787700653076172, "global_step": 197320, "epoch": 1174} {"train_loss": -11.101128578186035, "global_step": 197321, "epoch": 1174} {"train_loss": -11.225173950195312, "global_step": 197322, "epoch": 1174} {"train_loss": -11.183238983154297, "global_step": 197323, "epoch": 1174} {"train_loss": -10.934693336486816, "global_step": 197324, "epoch": 1174} {"train_loss": -11.379632949829102, "global_step": 197325, "epoch": 1174} {"train_loss": -11.173377990722656, "global_step": 197326, "epoch": 1174} {"train_loss": -11.011772155761719, "global_step": 197327, "epoch": 1174} {"train_loss": -11.256767272949219, "global_step": 197328, "epoch": 1174} {"train_loss": -11.133626937866211, "global_step": 197329, "epoch": 1174} {"train_loss": -11.347013473510742, "global_step": 197330, "epoch": 1174} {"train_loss": -11.375029563903809, "global_step": 197331, "epoch": 1174} {"train_loss": -11.508935928344727, "global_step": 197332, "epoch": 1174} {"train_loss": -11.035531997680664, "global_step": 197333, "epoch": 1174} {"train_loss": -11.404834747314453, "global_step": 197334, "epoch": 1174} {"train_loss": -11.40095043182373, "global_step": 197335, "epoch": 1174} {"train_loss": -11.348735809326172, "global_step": 197336, "epoch": 1174} {"train_loss": -11.445305824279785, "global_step": 197337, "epoch": 1174} {"train_loss": -11.427656173706055, "global_step": 197338, "epoch": 1174} {"train_loss": -11.428238868713379, "global_step": 197339, "epoch": 1174} {"train_loss": -11.552019119262695, "global_step": 197340, "epoch": 1174} {"train_loss": -11.38001823425293, "global_step": 197341, "epoch": 1174} {"train_loss": -11.592094421386719, "global_step": 197342, "epoch": 1174} {"train_loss": -11.507946014404297, "global_step": 197343, "epoch": 1174} {"train_loss": -11.435685157775879, "global_step": 197344, "epoch": 1174} {"train_loss": -11.48672866821289, "global_step": 197345, "epoch": 1174} {"train_loss": -11.43758773803711, "global_step": 197346, "epoch": 1174} {"train_loss": -11.639713287353516, "global_step": 197347, "epoch": 1174} {"train_loss": -11.442183494567871, "global_step": 197348, "epoch": 1174} {"train_loss": -11.671722412109375, "global_step": 197349, "epoch": 1174} {"train_loss": -11.558237075805664, "global_step": 197350, "epoch": 1174} {"train_loss": -11.603516578674316, "global_step": 197351, "epoch": 1174} {"train_loss": -11.60642147064209, "global_step": 197352, "epoch": 1174} {"train_loss": -11.606637954711914, "global_step": 197353, "epoch": 1174} {"train_loss": -11.630875587463379, "global_step": 197354, "epoch": 1174} {"train_loss": -11.693254470825195, "global_step": 197355, "epoch": 1174} {"train_loss": -11.21193790435791, "global_step": 197356, "epoch": 1174} {"train_loss": -11.662022590637207, "global_step": 197357, "epoch": 1174} {"train_loss": -11.56079387664795, "global_step": 197358, "epoch": 1174} {"train_loss": -11.841961860656738, "global_step": 197359, "epoch": 1174} {"train_loss": -11.77767276763916, "global_step": 197360, "epoch": 1174} {"train_loss": -11.7403564453125, "global_step": 197361, "epoch": 1174} {"train_loss": -11.573760986328125, "global_step": 197362, "epoch": 1174} {"train_loss": -11.809388160705566, "global_step": 197363, "epoch": 1174} {"train_loss": -11.595093727111816, "global_step": 197364, "epoch": 1174} {"train_loss": -11.690732955932617, "global_step": 197365, "epoch": 1174} {"train_loss": -11.659573554992676, "global_step": 197366, "epoch": 1174} {"train_loss": -11.726127624511719, "global_step": 197367, "epoch": 1174} {"train_loss": -11.609808921813965, "global_step": 197368, "epoch": 1174} {"train_loss": -11.536808013916016, "global_step": 197369, "epoch": 1174} {"train_loss": -11.453868865966797, "global_step": 197370, "epoch": 1174} {"train_loss": -11.532929420471191, "global_step": 197371, "epoch": 1174} {"train_loss": -11.344256401062012, "global_step": 197372, "epoch": 1174} {"train_loss": -11.673095703125, "global_step": 197373, "epoch": 1174} {"train_loss": -11.911375045776367, "global_step": 197374, "epoch": 1174} {"train_loss": -11.772283554077148, "global_step": 197375, "epoch": 1174} {"train_loss": -11.241120338439941, "global_step": 197376, "epoch": 1174} {"train_loss": -11.767300605773926, "global_step": 197377, "epoch": 1174} {"train_loss": -11.599189758300781, "global_step": 197378, "epoch": 1174} {"train_loss": -12.003928184509277, "global_step": 197379, "epoch": 1174} {"train_loss": -11.195566177368164, "global_step": 197380, "epoch": 1174} {"train_loss": -10.919089317321777, "global_step": 197381, "epoch": 1174} {"train_loss": -10.5432767868042, "global_step": 197382, "epoch": 1174} {"train_loss": -10.791123390197754, "global_step": 197383, "epoch": 1174} {"train_loss": -11.076066970825195, "global_step": 197384, "epoch": 1174} {"train_loss": -10.97236442565918, "global_step": 197385, "epoch": 1174} {"train_loss": -10.984017372131348, "global_step": 197386, "epoch": 1174} {"train_loss": -11.031871795654297, "global_step": 197387, "epoch": 1174} {"train_loss": -10.838188171386719, "global_step": 197388, "epoch": 1174} {"train_loss": -11.021366119384766, "global_step": 197389, "epoch": 1174} {"train_loss": -11.299245834350586, "global_step": 197390, "epoch": 1174} {"train_loss": -11.27220344543457, "global_step": 197391, "epoch": 1174} {"train_loss": -11.607125282287598, "global_step": 197392, "epoch": 1174} {"train_loss": -11.218366622924805, "global_step": 197393, "epoch": 1174} {"train_loss": -11.124577522277832, "global_step": 197394, "epoch": 1174} {"train_loss": -10.56367015838623, "global_step": 197395, "epoch": 1174} {"train_loss": -10.774358749389648, "global_step": 197396, "epoch": 1174} {"train_loss": -11.153287887573242, "global_step": 197397, "epoch": 1174} {"train_loss": -10.476524353027344, "global_step": 197398, "epoch": 1174} {"train_loss": -11.153646190961203, "global_step": 197399, "epoch": 1174, "val_loss": 248959.140625} {"train_loss": -11.215253829956055, "global_step": 197400, "epoch": 1175} {"train_loss": -10.997358322143555, "global_step": 197401, "epoch": 1175} {"train_loss": -11.015155792236328, "global_step": 197402, "epoch": 1175} {"train_loss": -10.801309585571289, "global_step": 197403, "epoch": 1175} {"train_loss": -11.054839134216309, "global_step": 197404, "epoch": 1175} {"train_loss": -10.322072982788086, "global_step": 197405, "epoch": 1175} {"train_loss": -10.13232135772705, "global_step": 197406, "epoch": 1175} {"train_loss": -11.051416397094727, "global_step": 197407, "epoch": 1175} {"train_loss": -10.378799438476562, "global_step": 197408, "epoch": 1175} {"train_loss": -10.888334274291992, "global_step": 197409, "epoch": 1175} {"train_loss": -10.463205337524414, "global_step": 197410, "epoch": 1175} {"train_loss": -10.916269302368164, "global_step": 197411, "epoch": 1175} {"train_loss": -10.766721725463867, "global_step": 197412, "epoch": 1175} {"train_loss": -11.083636283874512, "global_step": 197413, "epoch": 1175} {"train_loss": -10.608505249023438, "global_step": 197414, "epoch": 1175} {"train_loss": -11.074060440063477, "global_step": 197415, "epoch": 1175} {"train_loss": -10.70339584350586, "global_step": 197416, "epoch": 1175} {"train_loss": -11.18571662902832, "global_step": 197417, "epoch": 1175} {"train_loss": -11.3213472366333, "global_step": 197418, "epoch": 1175} {"train_loss": -11.235172271728516, "global_step": 197419, "epoch": 1175} {"train_loss": -11.35546588897705, "global_step": 197420, "epoch": 1175} {"train_loss": -11.196954727172852, "global_step": 197421, "epoch": 1175} {"train_loss": -11.152114868164062, "global_step": 197422, "epoch": 1175} {"train_loss": -11.286287307739258, "global_step": 197423, "epoch": 1175} {"train_loss": -11.157790184020996, "global_step": 197424, "epoch": 1175} {"train_loss": -11.092506408691406, "global_step": 197425, "epoch": 1175} {"train_loss": -11.266010284423828, "global_step": 197426, "epoch": 1175} {"train_loss": -11.221710205078125, "global_step": 197427, "epoch": 1175} {"train_loss": -11.053831100463867, "global_step": 197428, "epoch": 1175} {"train_loss": -11.336047172546387, "global_step": 197429, "epoch": 1175} {"train_loss": -11.132854461669922, "global_step": 197430, "epoch": 1175} {"train_loss": -11.149001121520996, "global_step": 197431, "epoch": 1175} {"train_loss": -11.472140312194824, "global_step": 197432, "epoch": 1175} {"train_loss": -11.126055717468262, "global_step": 197433, "epoch": 1175} {"train_loss": -11.482297897338867, "global_step": 197434, "epoch": 1175} {"train_loss": -11.348844528198242, "global_step": 197435, "epoch": 1175} {"train_loss": -11.247770309448242, "global_step": 197436, "epoch": 1175} {"train_loss": -11.455836296081543, "global_step": 197437, "epoch": 1175} {"train_loss": -11.38204574584961, "global_step": 197438, "epoch": 1175} {"train_loss": -11.371786117553711, "global_step": 197439, "epoch": 1175} {"train_loss": -11.560750007629395, "global_step": 197440, "epoch": 1175} {"train_loss": -11.517440795898438, "global_step": 197441, "epoch": 1175} {"train_loss": -11.499167442321777, "global_step": 197442, "epoch": 1175} {"train_loss": -11.454179763793945, "global_step": 197443, "epoch": 1175} {"train_loss": -11.54217529296875, "global_step": 197444, "epoch": 1175} {"train_loss": -11.623992919921875, "global_step": 197445, "epoch": 1175} {"train_loss": -11.591279983520508, "global_step": 197446, "epoch": 1175} {"train_loss": -11.628589630126953, "global_step": 197447, "epoch": 1175} {"train_loss": -11.55474853515625, "global_step": 197448, "epoch": 1175} {"train_loss": -11.666886329650879, "global_step": 197449, "epoch": 1175} {"train_loss": -11.0599365234375, "global_step": 197450, "epoch": 1175} {"train_loss": -11.50015926361084, "global_step": 197451, "epoch": 1175} {"train_loss": -11.39858627319336, "global_step": 197452, "epoch": 1175} {"train_loss": -11.290721893310547, "global_step": 197453, "epoch": 1175} {"train_loss": -11.373093605041504, "global_step": 197454, "epoch": 1175} {"train_loss": -11.427106857299805, "global_step": 197455, "epoch": 1175} {"train_loss": -11.631294250488281, "global_step": 197456, "epoch": 1175} {"train_loss": -11.425125122070312, "global_step": 197457, "epoch": 1175} {"train_loss": -11.438821792602539, "global_step": 197458, "epoch": 1175} {"train_loss": -11.441431045532227, "global_step": 197459, "epoch": 1175} {"train_loss": -11.028647422790527, "global_step": 197460, "epoch": 1175} {"train_loss": -11.517450332641602, "global_step": 197461, "epoch": 1175} {"train_loss": -11.275985717773438, "global_step": 197462, "epoch": 1175} {"train_loss": -11.281391143798828, "global_step": 197463, "epoch": 1175} {"train_loss": -10.6832914352417, "global_step": 197464, "epoch": 1175} {"train_loss": -11.304532051086426, "global_step": 197465, "epoch": 1175} {"train_loss": -11.588071823120117, "global_step": 197466, "epoch": 1175} {"train_loss": -11.221293449401855, "global_step": 197467, "epoch": 1175} {"train_loss": -11.396997451782227, "global_step": 197468, "epoch": 1175} {"train_loss": -11.062166213989258, "global_step": 197469, "epoch": 1175} {"train_loss": -11.34179973602295, "global_step": 197470, "epoch": 1175} {"train_loss": -11.178038597106934, "global_step": 197471, "epoch": 1175} {"train_loss": -11.485427856445312, "global_step": 197472, "epoch": 1175} {"train_loss": -11.270331382751465, "global_step": 197473, "epoch": 1175} {"train_loss": -11.348320960998535, "global_step": 197474, "epoch": 1175} {"train_loss": -11.446199417114258, "global_step": 197475, "epoch": 1175} {"train_loss": -11.552888870239258, "global_step": 197476, "epoch": 1175} {"train_loss": -11.244599342346191, "global_step": 197477, "epoch": 1175} {"train_loss": -11.457324981689453, "global_step": 197478, "epoch": 1175} {"train_loss": -11.678512573242188, "global_step": 197479, "epoch": 1175} {"train_loss": -11.359816551208496, "global_step": 197480, "epoch": 1175} {"train_loss": -11.090819358825684, "global_step": 197481, "epoch": 1175} {"train_loss": -11.58865737915039, "global_step": 197482, "epoch": 1175} {"train_loss": -11.591541290283203, "global_step": 197483, "epoch": 1175} {"train_loss": -11.709009170532227, "global_step": 197484, "epoch": 1175} {"train_loss": -11.661918640136719, "global_step": 197485, "epoch": 1175} {"train_loss": -11.22933578491211, "global_step": 197486, "epoch": 1175} {"train_loss": -11.637139320373535, "global_step": 197487, "epoch": 1175} {"train_loss": -11.393974304199219, "global_step": 197488, "epoch": 1175} {"train_loss": -11.228093147277832, "global_step": 197489, "epoch": 1175} {"train_loss": -11.468990325927734, "global_step": 197490, "epoch": 1175} {"train_loss": -11.70331859588623, "global_step": 197491, "epoch": 1175} {"train_loss": -11.099343299865723, "global_step": 197492, "epoch": 1175} {"train_loss": -11.706901550292969, "global_step": 197493, "epoch": 1175} {"train_loss": -11.15102767944336, "global_step": 197494, "epoch": 1175} {"train_loss": -11.38272476196289, "global_step": 197495, "epoch": 1175} {"train_loss": -11.430685043334961, "global_step": 197496, "epoch": 1175} {"train_loss": -11.448066711425781, "global_step": 197497, "epoch": 1175} {"train_loss": -11.03296184539795, "global_step": 197498, "epoch": 1175} {"train_loss": -11.670750617980957, "global_step": 197499, "epoch": 1175} {"train_loss": -11.261651992797852, "global_step": 197500, "epoch": 1175} {"train_loss": -11.338581085205078, "global_step": 197501, "epoch": 1175} {"train_loss": -11.476003646850586, "global_step": 197502, "epoch": 1175} {"train_loss": -11.684160232543945, "global_step": 197503, "epoch": 1175} {"train_loss": -11.416969299316406, "global_step": 197504, "epoch": 1175} {"train_loss": -11.778902053833008, "global_step": 197505, "epoch": 1175} {"train_loss": -11.482563018798828, "global_step": 197506, "epoch": 1175} {"train_loss": -11.52924633026123, "global_step": 197507, "epoch": 1175} {"train_loss": -11.588528633117676, "global_step": 197508, "epoch": 1175} {"train_loss": -11.392858505249023, "global_step": 197509, "epoch": 1175} {"train_loss": -11.237863540649414, "global_step": 197510, "epoch": 1175} {"train_loss": -11.448530197143555, "global_step": 197511, "epoch": 1175} {"train_loss": -11.091732025146484, "global_step": 197512, "epoch": 1175} {"train_loss": -10.903125762939453, "global_step": 197513, "epoch": 1175} {"train_loss": -11.49123477935791, "global_step": 197514, "epoch": 1175} {"train_loss": -11.159296035766602, "global_step": 197515, "epoch": 1175} {"train_loss": -11.453436851501465, "global_step": 197516, "epoch": 1175} {"train_loss": -10.964920043945312, "global_step": 197517, "epoch": 1175} {"train_loss": -11.136761665344238, "global_step": 197518, "epoch": 1175} {"train_loss": -10.807493209838867, "global_step": 197519, "epoch": 1175} {"train_loss": -11.080894470214844, "global_step": 197520, "epoch": 1175} {"train_loss": -11.076526641845703, "global_step": 197521, "epoch": 1175} {"train_loss": -10.87535285949707, "global_step": 197522, "epoch": 1175} {"train_loss": -11.201292037963867, "global_step": 197523, "epoch": 1175} {"train_loss": -11.190688133239746, "global_step": 197524, "epoch": 1175} {"train_loss": -11.022451400756836, "global_step": 197525, "epoch": 1175} {"train_loss": -10.891389846801758, "global_step": 197526, "epoch": 1175} {"train_loss": -11.092726707458496, "global_step": 197527, "epoch": 1175} {"train_loss": -10.581164360046387, "global_step": 197528, "epoch": 1175} {"train_loss": -11.15015697479248, "global_step": 197529, "epoch": 1175} {"train_loss": -10.675935745239258, "global_step": 197530, "epoch": 1175} {"train_loss": -11.113203048706055, "global_step": 197531, "epoch": 1175} {"train_loss": -10.861285209655762, "global_step": 197532, "epoch": 1175} {"train_loss": -11.018407821655273, "global_step": 197533, "epoch": 1175} {"train_loss": -10.913511276245117, "global_step": 197534, "epoch": 1175} {"train_loss": -11.088068008422852, "global_step": 197535, "epoch": 1175} {"train_loss": -11.33333969116211, "global_step": 197536, "epoch": 1175} {"train_loss": -10.738618850708008, "global_step": 197537, "epoch": 1175} {"train_loss": -11.325490951538086, "global_step": 197538, "epoch": 1175} {"train_loss": -10.875875473022461, "global_step": 197539, "epoch": 1175} {"train_loss": -11.038680076599121, "global_step": 197540, "epoch": 1175} {"train_loss": -11.201570510864258, "global_step": 197541, "epoch": 1175} {"train_loss": -10.474309921264648, "global_step": 197542, "epoch": 1175} {"train_loss": -11.226715087890625, "global_step": 197543, "epoch": 1175} {"train_loss": -11.236645698547363, "global_step": 197544, "epoch": 1175} {"train_loss": -10.79426097869873, "global_step": 197545, "epoch": 1175} {"train_loss": -11.45376968383789, "global_step": 197546, "epoch": 1175} {"train_loss": -10.920581817626953, "global_step": 197547, "epoch": 1175} {"train_loss": -11.459379196166992, "global_step": 197548, "epoch": 1175} {"train_loss": -11.1240234375, "global_step": 197549, "epoch": 1175} {"train_loss": -11.24773120880127, "global_step": 197550, "epoch": 1175} {"train_loss": -11.481918334960938, "global_step": 197551, "epoch": 1175} {"train_loss": -11.45515251159668, "global_step": 197552, "epoch": 1175} {"train_loss": -11.437594413757324, "global_step": 197553, "epoch": 1175} {"train_loss": -11.417261123657227, "global_step": 197554, "epoch": 1175} {"train_loss": -11.430598258972168, "global_step": 197555, "epoch": 1175} {"train_loss": -11.334199905395508, "global_step": 197556, "epoch": 1175} {"train_loss": -11.40041732788086, "global_step": 197557, "epoch": 1175} {"train_loss": -11.214540481567383, "global_step": 197558, "epoch": 1175} {"train_loss": -11.244433403015137, "global_step": 197559, "epoch": 1175} {"train_loss": -11.54076099395752, "global_step": 197560, "epoch": 1175} {"train_loss": -11.47938346862793, "global_step": 197561, "epoch": 1175} {"train_loss": -10.954078674316406, "global_step": 197562, "epoch": 1175} {"train_loss": -11.353058815002441, "global_step": 197563, "epoch": 1175} {"train_loss": -11.34659194946289, "global_step": 197564, "epoch": 1175} {"train_loss": -11.47546672821045, "global_step": 197565, "epoch": 1175} {"train_loss": -11.266860961914062, "global_step": 197566, "epoch": 1175} {"train_loss": -11.246643151555743, "global_step": 197567, "epoch": 1175, "val_loss": 249483.484375, "train_action_mse_error": 1.1141252517700195} {"train_loss": -11.326309204101562, "global_step": 197568, "epoch": 1176} {"train_loss": -11.431355476379395, "global_step": 197569, "epoch": 1176} {"train_loss": -11.223438262939453, "global_step": 197570, "epoch": 1176} {"train_loss": -11.274356842041016, "global_step": 197571, "epoch": 1176} {"train_loss": -11.443602561950684, "global_step": 197572, "epoch": 1176} {"train_loss": -11.234345436096191, "global_step": 197573, "epoch": 1176} {"train_loss": -11.052263259887695, "global_step": 197574, "epoch": 1176} {"train_loss": -11.056655883789062, "global_step": 197575, "epoch": 1176} {"train_loss": -11.471551895141602, "global_step": 197576, "epoch": 1176} {"train_loss": -11.377695083618164, "global_step": 197577, "epoch": 1176} {"train_loss": -11.294044494628906, "global_step": 197578, "epoch": 1176} {"train_loss": -11.148229598999023, "global_step": 197579, "epoch": 1176} {"train_loss": -11.148416519165039, "global_step": 197580, "epoch": 1176} {"train_loss": -11.401227951049805, "global_step": 197581, "epoch": 1176} {"train_loss": -11.101151466369629, "global_step": 197582, "epoch": 1176} {"train_loss": -11.370903015136719, "global_step": 197583, "epoch": 1176} {"train_loss": -11.63869857788086, "global_step": 197584, "epoch": 1176} {"train_loss": -11.508535385131836, "global_step": 197585, "epoch": 1176} {"train_loss": -11.672225952148438, "global_step": 197586, "epoch": 1176} {"train_loss": -11.369195938110352, "global_step": 197587, "epoch": 1176} {"train_loss": -11.523880004882812, "global_step": 197588, "epoch": 1176} {"train_loss": -11.540626525878906, "global_step": 197589, "epoch": 1176} {"train_loss": -11.542278289794922, "global_step": 197590, "epoch": 1176} {"train_loss": -11.658227920532227, "global_step": 197591, "epoch": 1176} {"train_loss": -11.767911911010742, "global_step": 197592, "epoch": 1176} {"train_loss": -11.453174591064453, "global_step": 197593, "epoch": 1176} {"train_loss": -11.355681419372559, "global_step": 197594, "epoch": 1176} {"train_loss": -11.298969268798828, "global_step": 197595, "epoch": 1176} {"train_loss": -11.279413223266602, "global_step": 197596, "epoch": 1176} {"train_loss": -11.318038940429688, "global_step": 197597, "epoch": 1176} {"train_loss": -11.321304321289062, "global_step": 197598, "epoch": 1176} {"train_loss": -11.245885848999023, "global_step": 197599, "epoch": 1176} {"train_loss": -11.15553092956543, "global_step": 197600, "epoch": 1176} {"train_loss": -11.09228515625, "global_step": 197601, "epoch": 1176} {"train_loss": -11.72241497039795, "global_step": 197602, "epoch": 1176} {"train_loss": -10.205474853515625, "global_step": 197603, "epoch": 1176} {"train_loss": -10.778539657592773, "global_step": 197604, "epoch": 1176} {"train_loss": -11.373397827148438, "global_step": 197605, "epoch": 1176} {"train_loss": -11.000152587890625, "global_step": 197606, "epoch": 1176} {"train_loss": -11.395746231079102, "global_step": 197607, "epoch": 1176} {"train_loss": -11.168931007385254, "global_step": 197608, "epoch": 1176} {"train_loss": -11.122827529907227, "global_step": 197609, "epoch": 1176} {"train_loss": -11.335391998291016, "global_step": 197610, "epoch": 1176} {"train_loss": -11.31124496459961, "global_step": 197611, "epoch": 1176} {"train_loss": -10.861852645874023, "global_step": 197612, "epoch": 1176} {"train_loss": -11.071403503417969, "global_step": 197613, "epoch": 1176} {"train_loss": -11.374950408935547, "global_step": 197614, "epoch": 1176} {"train_loss": -11.330486297607422, "global_step": 197615, "epoch": 1176} {"train_loss": -11.331844329833984, "global_step": 197616, "epoch": 1176} {"train_loss": -11.394665718078613, "global_step": 197617, "epoch": 1176} {"train_loss": -11.381579399108887, "global_step": 197618, "epoch": 1176} {"train_loss": -11.428303718566895, "global_step": 197619, "epoch": 1176} {"train_loss": -11.450060844421387, "global_step": 197620, "epoch": 1176} {"train_loss": -10.937074661254883, "global_step": 197621, "epoch": 1176} {"train_loss": -10.881118774414062, "global_step": 197622, "epoch": 1176} {"train_loss": -11.6305513381958, "global_step": 197623, "epoch": 1176} {"train_loss": -10.978302955627441, "global_step": 197624, "epoch": 1176} {"train_loss": -11.70824909210205, "global_step": 197625, "epoch": 1176} {"train_loss": -11.04112720489502, "global_step": 197626, "epoch": 1176} {"train_loss": -11.344009399414062, "global_step": 197627, "epoch": 1176} {"train_loss": -11.590744018554688, "global_step": 197628, "epoch": 1176} {"train_loss": -11.059648513793945, "global_step": 197629, "epoch": 1176} {"train_loss": -11.69822883605957, "global_step": 197630, "epoch": 1176} {"train_loss": -11.292755126953125, "global_step": 197631, "epoch": 1176} {"train_loss": -11.392080307006836, "global_step": 197632, "epoch": 1176} {"train_loss": -11.37769889831543, "global_step": 197633, "epoch": 1176} {"train_loss": -11.495800971984863, "global_step": 197634, "epoch": 1176} {"train_loss": -11.308046340942383, "global_step": 197635, "epoch": 1176} {"train_loss": -11.338289260864258, "global_step": 197636, "epoch": 1176} {"train_loss": -11.505364418029785, "global_step": 197637, "epoch": 1176} {"train_loss": -10.907156944274902, "global_step": 197638, "epoch": 1176} {"train_loss": -11.227327346801758, "global_step": 197639, "epoch": 1176} {"train_loss": -11.379566192626953, "global_step": 197640, "epoch": 1176} {"train_loss": -10.744084358215332, "global_step": 197641, "epoch": 1176} {"train_loss": -11.564451217651367, "global_step": 197642, "epoch": 1176} {"train_loss": -11.108542442321777, "global_step": 197643, "epoch": 1176} {"train_loss": -10.77560043334961, "global_step": 197644, "epoch": 1176} {"train_loss": -11.442525863647461, "global_step": 197645, "epoch": 1176} {"train_loss": -10.948808670043945, "global_step": 197646, "epoch": 1176} {"train_loss": -11.381694793701172, "global_step": 197647, "epoch": 1176} {"train_loss": -11.468558311462402, "global_step": 197648, "epoch": 1176} {"train_loss": -11.32550048828125, "global_step": 197649, "epoch": 1176} {"train_loss": -11.516605377197266, "global_step": 197650, "epoch": 1176} {"train_loss": -11.187312126159668, "global_step": 197651, "epoch": 1176} {"train_loss": -11.304492950439453, "global_step": 197652, "epoch": 1176} {"train_loss": -11.490503311157227, "global_step": 197653, "epoch": 1176} {"train_loss": -11.164018630981445, "global_step": 197654, "epoch": 1176} {"train_loss": -11.403797149658203, "global_step": 197655, "epoch": 1176} {"train_loss": -11.422004699707031, "global_step": 197656, "epoch": 1176} {"train_loss": -11.732129096984863, "global_step": 197657, "epoch": 1176} {"train_loss": -11.267387390136719, "global_step": 197658, "epoch": 1176} {"train_loss": -11.580586433410645, "global_step": 197659, "epoch": 1176} {"train_loss": -11.30998706817627, "global_step": 197660, "epoch": 1176} {"train_loss": -11.497821807861328, "global_step": 197661, "epoch": 1176} {"train_loss": -11.394704818725586, "global_step": 197662, "epoch": 1176} {"train_loss": -11.557273864746094, "global_step": 197663, "epoch": 1176} {"train_loss": -11.674420356750488, "global_step": 197664, "epoch": 1176} {"train_loss": -11.3682861328125, "global_step": 197665, "epoch": 1176} {"train_loss": -11.399179458618164, "global_step": 197666, "epoch": 1176} {"train_loss": -11.58662223815918, "global_step": 197667, "epoch": 1176} {"train_loss": -11.743551254272461, "global_step": 197668, "epoch": 1176} {"train_loss": -11.375527381896973, "global_step": 197669, "epoch": 1176} {"train_loss": -11.340192794799805, "global_step": 197670, "epoch": 1176} {"train_loss": -11.715142250061035, "global_step": 197671, "epoch": 1176} {"train_loss": -11.548929214477539, "global_step": 197672, "epoch": 1176} {"train_loss": -11.557137489318848, "global_step": 197673, "epoch": 1176} {"train_loss": -11.20528793334961, "global_step": 197674, "epoch": 1176} {"train_loss": -11.336897850036621, "global_step": 197675, "epoch": 1176} {"train_loss": -11.72269058227539, "global_step": 197676, "epoch": 1176} {"train_loss": -11.186949729919434, "global_step": 197677, "epoch": 1176} {"train_loss": -11.180753707885742, "global_step": 197678, "epoch": 1176} {"train_loss": -11.434446334838867, "global_step": 197679, "epoch": 1176} {"train_loss": -11.354837417602539, "global_step": 197680, "epoch": 1176} {"train_loss": -11.500916481018066, "global_step": 197681, "epoch": 1176} {"train_loss": -11.528939247131348, "global_step": 197682, "epoch": 1176} {"train_loss": -11.276369094848633, "global_step": 197683, "epoch": 1176} {"train_loss": -11.285043716430664, "global_step": 197684, "epoch": 1176} {"train_loss": -11.176636695861816, "global_step": 197685, "epoch": 1176} {"train_loss": -11.431543350219727, "global_step": 197686, "epoch": 1176} {"train_loss": -11.449518203735352, "global_step": 197687, "epoch": 1176} {"train_loss": -11.252978324890137, "global_step": 197688, "epoch": 1176} {"train_loss": -11.421472549438477, "global_step": 197689, "epoch": 1176} {"train_loss": -11.680282592773438, "global_step": 197690, "epoch": 1176} {"train_loss": -11.60661506652832, "global_step": 197691, "epoch": 1176} {"train_loss": -11.092881202697754, "global_step": 197692, "epoch": 1176} {"train_loss": -11.551347732543945, "global_step": 197693, "epoch": 1176} {"train_loss": -11.532818794250488, "global_step": 197694, "epoch": 1176} {"train_loss": -10.862991333007812, "global_step": 197695, "epoch": 1176} {"train_loss": -10.749040603637695, "global_step": 197696, "epoch": 1176} {"train_loss": -11.72320556640625, "global_step": 197697, "epoch": 1176} {"train_loss": -11.490883827209473, "global_step": 197698, "epoch": 1176} {"train_loss": -11.365036010742188, "global_step": 197699, "epoch": 1176} {"train_loss": -11.622760772705078, "global_step": 197700, "epoch": 1176} {"train_loss": -11.695253372192383, "global_step": 197701, "epoch": 1176} {"train_loss": -11.53823184967041, "global_step": 197702, "epoch": 1176} {"train_loss": -11.773367881774902, "global_step": 197703, "epoch": 1176} {"train_loss": -11.531326293945312, "global_step": 197704, "epoch": 1176} {"train_loss": -11.311772346496582, "global_step": 197705, "epoch": 1176} {"train_loss": -11.667203903198242, "global_step": 197706, "epoch": 1176} {"train_loss": -11.490756034851074, "global_step": 197707, "epoch": 1176} {"train_loss": -11.83333969116211, "global_step": 197708, "epoch": 1176} {"train_loss": -11.72785758972168, "global_step": 197709, "epoch": 1176} {"train_loss": -11.547690391540527, "global_step": 197710, "epoch": 1176} {"train_loss": -11.851848602294922, "global_step": 197711, "epoch": 1176} {"train_loss": -11.90156364440918, "global_step": 197712, "epoch": 1176} {"train_loss": -11.539989471435547, "global_step": 197713, "epoch": 1176} {"train_loss": -11.009672164916992, "global_step": 197714, "epoch": 1176} {"train_loss": -11.563911437988281, "global_step": 197715, "epoch": 1176} {"train_loss": -10.649930953979492, "global_step": 197716, "epoch": 1176} {"train_loss": -10.50491714477539, "global_step": 197717, "epoch": 1176} {"train_loss": -10.910247802734375, "global_step": 197718, "epoch": 1176} {"train_loss": -9.702468872070312, "global_step": 197719, "epoch": 1176} {"train_loss": -11.148900985717773, "global_step": 197720, "epoch": 1176} {"train_loss": -10.305171966552734, "global_step": 197721, "epoch": 1176} {"train_loss": -10.143720626831055, "global_step": 197722, "epoch": 1176} {"train_loss": -10.307400703430176, "global_step": 197723, "epoch": 1176} {"train_loss": -10.46212387084961, "global_step": 197724, "epoch": 1176} {"train_loss": -9.978031158447266, "global_step": 197725, "epoch": 1176} {"train_loss": -10.498159408569336, "global_step": 197726, "epoch": 1176} {"train_loss": -9.997007369995117, "global_step": 197727, "epoch": 1176} {"train_loss": -9.6769380569458, "global_step": 197728, "epoch": 1176} {"train_loss": -9.54204273223877, "global_step": 197729, "epoch": 1176} {"train_loss": -10.479284286499023, "global_step": 197730, "epoch": 1176} {"train_loss": -9.877969741821289, "global_step": 197731, "epoch": 1176} {"train_loss": -10.674421310424805, "global_step": 197732, "epoch": 1176} {"train_loss": -9.35980224609375, "global_step": 197733, "epoch": 1176} {"train_loss": -10.144594192504883, "global_step": 197734, "epoch": 1176} {"train_loss": -11.225351117906117, "global_step": 197735, "epoch": 1176, "val_loss": 252885.265625} {"train_loss": -9.894027709960938, "global_step": 197736, "epoch": 1177} {"train_loss": -9.728401184082031, "global_step": 197737, "epoch": 1177} {"train_loss": -9.728660583496094, "global_step": 197738, "epoch": 1177} {"train_loss": -9.990625381469727, "global_step": 197739, "epoch": 1177} {"train_loss": -9.137283325195312, "global_step": 197740, "epoch": 1177} {"train_loss": -10.465229034423828, "global_step": 197741, "epoch": 1177} {"train_loss": -9.657352447509766, "global_step": 197742, "epoch": 1177} {"train_loss": -10.602550506591797, "global_step": 197743, "epoch": 1177} {"train_loss": -9.614460945129395, "global_step": 197744, "epoch": 1177} {"train_loss": -10.62681770324707, "global_step": 197745, "epoch": 1177} {"train_loss": -10.184800148010254, "global_step": 197746, "epoch": 1177} {"train_loss": -10.426841735839844, "global_step": 197747, "epoch": 1177} {"train_loss": -10.672273635864258, "global_step": 197748, "epoch": 1177} {"train_loss": -9.938655853271484, "global_step": 197749, "epoch": 1177} {"train_loss": -10.949871063232422, "global_step": 197750, "epoch": 1177} {"train_loss": -10.751164436340332, "global_step": 197751, "epoch": 1177} {"train_loss": -10.478344917297363, "global_step": 197752, "epoch": 1177} {"train_loss": -10.984759330749512, "global_step": 197753, "epoch": 1177} {"train_loss": -10.77880859375, "global_step": 197754, "epoch": 1177} {"train_loss": -10.581871032714844, "global_step": 197755, "epoch": 1177} {"train_loss": -11.029322624206543, "global_step": 197756, "epoch": 1177} {"train_loss": -10.520602226257324, "global_step": 197757, "epoch": 1177} {"train_loss": -10.974739074707031, "global_step": 197758, "epoch": 1177} {"train_loss": -10.946457862854004, "global_step": 197759, "epoch": 1177} {"train_loss": -10.692618370056152, "global_step": 197760, "epoch": 1177} {"train_loss": -11.01194953918457, "global_step": 197761, "epoch": 1177} {"train_loss": -10.962259292602539, "global_step": 197762, "epoch": 1177} {"train_loss": -10.764636993408203, "global_step": 197763, "epoch": 1177} {"train_loss": -11.23599624633789, "global_step": 197764, "epoch": 1177} {"train_loss": -10.825250625610352, "global_step": 197765, "epoch": 1177} {"train_loss": -11.02869987487793, "global_step": 197766, "epoch": 1177} {"train_loss": -11.045425415039062, "global_step": 197767, "epoch": 1177} {"train_loss": -11.082304000854492, "global_step": 197768, "epoch": 1177} {"train_loss": -11.113350868225098, "global_step": 197769, "epoch": 1177} {"train_loss": -11.193134307861328, "global_step": 197770, "epoch": 1177} {"train_loss": -11.207435607910156, "global_step": 197771, "epoch": 1177} {"train_loss": -11.322845458984375, "global_step": 197772, "epoch": 1177} {"train_loss": -11.044078826904297, "global_step": 197773, "epoch": 1177} {"train_loss": -11.087491035461426, "global_step": 197774, "epoch": 1177} {"train_loss": -11.281198501586914, "global_step": 197775, "epoch": 1177} {"train_loss": -11.178911209106445, "global_step": 197776, "epoch": 1177} {"train_loss": -11.343803405761719, "global_step": 197777, "epoch": 1177} {"train_loss": -10.962305068969727, "global_step": 197778, "epoch": 1177} {"train_loss": -11.140106201171875, "global_step": 197779, "epoch": 1177} {"train_loss": -11.283008575439453, "global_step": 197780, "epoch": 1177} {"train_loss": -11.455171585083008, "global_step": 197781, "epoch": 1177} {"train_loss": -11.403959274291992, "global_step": 197782, "epoch": 1177} {"train_loss": -11.398738861083984, "global_step": 197783, "epoch": 1177} {"train_loss": -11.354938507080078, "global_step": 197784, "epoch": 1177} {"train_loss": -11.252559661865234, "global_step": 197785, "epoch": 1177} {"train_loss": -11.390180587768555, "global_step": 197786, "epoch": 1177} {"train_loss": -11.437030792236328, "global_step": 197787, "epoch": 1177} {"train_loss": -11.437517166137695, "global_step": 197788, "epoch": 1177} {"train_loss": -11.47957706451416, "global_step": 197789, "epoch": 1177} {"train_loss": -11.430929183959961, "global_step": 197790, "epoch": 1177} {"train_loss": -11.56569766998291, "global_step": 197791, "epoch": 1177} {"train_loss": -11.688505172729492, "global_step": 197792, "epoch": 1177} {"train_loss": -11.629110336303711, "global_step": 197793, "epoch": 1177} {"train_loss": -11.54359245300293, "global_step": 197794, "epoch": 1177} {"train_loss": -11.664759635925293, "global_step": 197795, "epoch": 1177} {"train_loss": -11.333971977233887, "global_step": 197796, "epoch": 1177} {"train_loss": -11.562845230102539, "global_step": 197797, "epoch": 1177} {"train_loss": -11.483887672424316, "global_step": 197798, "epoch": 1177} {"train_loss": -11.35513687133789, "global_step": 197799, "epoch": 1177} {"train_loss": -11.450101852416992, "global_step": 197800, "epoch": 1177} {"train_loss": -11.77159595489502, "global_step": 197801, "epoch": 1177} {"train_loss": -11.38626480102539, "global_step": 197802, "epoch": 1177} {"train_loss": -11.54727554321289, "global_step": 197803, "epoch": 1177} {"train_loss": -11.802789688110352, "global_step": 197804, "epoch": 1177} {"train_loss": -11.685294151306152, "global_step": 197805, "epoch": 1177} {"train_loss": -11.755014419555664, "global_step": 197806, "epoch": 1177} {"train_loss": -11.604337692260742, "global_step": 197807, "epoch": 1177} {"train_loss": -11.674711227416992, "global_step": 197808, "epoch": 1177} {"train_loss": -11.620640754699707, "global_step": 197809, "epoch": 1177} {"train_loss": -11.700303077697754, "global_step": 197810, "epoch": 1177} {"train_loss": -11.80778980255127, "global_step": 197811, "epoch": 1177} {"train_loss": -11.803725242614746, "global_step": 197812, "epoch": 1177} {"train_loss": -11.980334281921387, "global_step": 197813, "epoch": 1177} {"train_loss": -11.740272521972656, "global_step": 197814, "epoch": 1177} {"train_loss": -11.846878051757812, "global_step": 197815, "epoch": 1177} {"train_loss": -11.854690551757812, "global_step": 197816, "epoch": 1177} {"train_loss": -11.744068145751953, "global_step": 197817, "epoch": 1177} {"train_loss": -11.745794296264648, "global_step": 197818, "epoch": 1177} {"train_loss": -11.88231086730957, "global_step": 197819, "epoch": 1177} {"train_loss": -11.847496032714844, "global_step": 197820, "epoch": 1177} {"train_loss": -11.879420280456543, "global_step": 197821, "epoch": 1177} {"train_loss": -11.70974063873291, "global_step": 197822, "epoch": 1177} {"train_loss": -11.729147911071777, "global_step": 197823, "epoch": 1177} {"train_loss": -11.133289337158203, "global_step": 197824, "epoch": 1177} {"train_loss": -11.19883918762207, "global_step": 197825, "epoch": 1177} {"train_loss": -11.600748062133789, "global_step": 197826, "epoch": 1177} {"train_loss": -11.689149856567383, "global_step": 197827, "epoch": 1177} {"train_loss": -10.98086166381836, "global_step": 197828, "epoch": 1177} {"train_loss": -10.025382995605469, "global_step": 197829, "epoch": 1177} {"train_loss": -9.521907806396484, "global_step": 197830, "epoch": 1177} {"train_loss": -11.488327026367188, "global_step": 197831, "epoch": 1177} {"train_loss": -9.613247871398926, "global_step": 197832, "epoch": 1177} {"train_loss": -8.133467674255371, "global_step": 197833, "epoch": 1177} {"train_loss": -8.410379409790039, "global_step": 197834, "epoch": 1177} {"train_loss": -9.919879913330078, "global_step": 197835, "epoch": 1177} {"train_loss": -9.897984504699707, "global_step": 197836, "epoch": 1177} {"train_loss": -9.528953552246094, "global_step": 197837, "epoch": 1177} {"train_loss": -11.076011657714844, "global_step": 197838, "epoch": 1177} {"train_loss": -9.926302909851074, "global_step": 197839, "epoch": 1177} {"train_loss": -10.623230934143066, "global_step": 197840, "epoch": 1177} {"train_loss": -9.127721786499023, "global_step": 197841, "epoch": 1177} {"train_loss": -9.702835083007812, "global_step": 197842, "epoch": 1177} {"train_loss": -10.552604675292969, "global_step": 197843, "epoch": 1177} {"train_loss": -8.960699081420898, "global_step": 197844, "epoch": 1177} {"train_loss": -10.01003646850586, "global_step": 197845, "epoch": 1177} {"train_loss": -10.063863754272461, "global_step": 197846, "epoch": 1177} {"train_loss": -10.465034484863281, "global_step": 197847, "epoch": 1177} {"train_loss": -10.466288566589355, "global_step": 197848, "epoch": 1177} {"train_loss": -10.48784065246582, "global_step": 197849, "epoch": 1177} {"train_loss": -10.518993377685547, "global_step": 197850, "epoch": 1177} {"train_loss": -10.824687957763672, "global_step": 197851, "epoch": 1177} {"train_loss": -10.923527717590332, "global_step": 197852, "epoch": 1177} {"train_loss": -10.910774230957031, "global_step": 197853, "epoch": 1177} {"train_loss": -11.15239143371582, "global_step": 197854, "epoch": 1177} {"train_loss": -10.868484497070312, "global_step": 197855, "epoch": 1177} {"train_loss": -11.065807342529297, "global_step": 197856, "epoch": 1177} {"train_loss": -10.938187599182129, "global_step": 197857, "epoch": 1177} {"train_loss": -10.498265266418457, "global_step": 197858, "epoch": 1177} {"train_loss": -10.792900085449219, "global_step": 197859, "epoch": 1177} {"train_loss": -11.09189224243164, "global_step": 197860, "epoch": 1177} {"train_loss": -10.779716491699219, "global_step": 197861, "epoch": 1177} {"train_loss": -11.112641334533691, "global_step": 197862, "epoch": 1177} {"train_loss": -10.98309326171875, "global_step": 197863, "epoch": 1177} {"train_loss": -11.1696138381958, "global_step": 197864, "epoch": 1177} {"train_loss": -11.162656784057617, "global_step": 197865, "epoch": 1177} {"train_loss": -10.67737102508545, "global_step": 197866, "epoch": 1177} {"train_loss": -11.095499038696289, "global_step": 197867, "epoch": 1177} {"train_loss": -11.074399948120117, "global_step": 197868, "epoch": 1177} {"train_loss": -11.160676002502441, "global_step": 197869, "epoch": 1177} {"train_loss": -11.464157104492188, "global_step": 197870, "epoch": 1177} {"train_loss": -11.044048309326172, "global_step": 197871, "epoch": 1177} {"train_loss": -11.217082977294922, "global_step": 197872, "epoch": 1177} {"train_loss": -11.106473922729492, "global_step": 197873, "epoch": 1177} {"train_loss": -11.321009635925293, "global_step": 197874, "epoch": 1177} {"train_loss": -11.13282585144043, "global_step": 197875, "epoch": 1177} {"train_loss": -11.322793960571289, "global_step": 197876, "epoch": 1177} {"train_loss": -11.206525802612305, "global_step": 197877, "epoch": 1177} {"train_loss": -11.231886863708496, "global_step": 197878, "epoch": 1177} {"train_loss": -11.129881858825684, "global_step": 197879, "epoch": 1177} {"train_loss": -11.349170684814453, "global_step": 197880, "epoch": 1177} {"train_loss": -11.307806015014648, "global_step": 197881, "epoch": 1177} {"train_loss": -11.277341842651367, "global_step": 197882, "epoch": 1177} {"train_loss": -11.433613777160645, "global_step": 197883, "epoch": 1177} {"train_loss": -11.374481201171875, "global_step": 197884, "epoch": 1177} {"train_loss": -11.306465148925781, "global_step": 197885, "epoch": 1177} {"train_loss": -11.573646545410156, "global_step": 197886, "epoch": 1177} {"train_loss": -11.295854568481445, "global_step": 197887, "epoch": 1177} {"train_loss": -11.439262390136719, "global_step": 197888, "epoch": 1177} {"train_loss": -11.243435859680176, "global_step": 197889, "epoch": 1177} {"train_loss": -11.405885696411133, "global_step": 197890, "epoch": 1177} {"train_loss": -11.509839057922363, "global_step": 197891, "epoch": 1177} {"train_loss": -11.525876998901367, "global_step": 197892, "epoch": 1177} {"train_loss": -11.198112487792969, "global_step": 197893, "epoch": 1177} {"train_loss": -11.455209732055664, "global_step": 197894, "epoch": 1177} {"train_loss": -11.50015926361084, "global_step": 197895, "epoch": 1177} {"train_loss": -11.302885055541992, "global_step": 197896, "epoch": 1177} {"train_loss": -11.728658676147461, "global_step": 197897, "epoch": 1177} {"train_loss": -11.342174530029297, "global_step": 197898, "epoch": 1177} {"train_loss": -11.487136840820312, "global_step": 197899, "epoch": 1177} {"train_loss": -11.479591369628906, "global_step": 197900, "epoch": 1177} {"train_loss": -11.458389282226562, "global_step": 197901, "epoch": 1177} {"train_loss": -11.591174125671387, "global_step": 197902, "epoch": 1177} {"train_loss": -11.014421201887584, "global_step": 197903, "epoch": 1177, "val_loss": 242885.453125} {"train_loss": -11.689886093139648, "global_step": 197904, "epoch": 1178} {"train_loss": -11.37576675415039, "global_step": 197905, "epoch": 1178} {"train_loss": -11.577701568603516, "global_step": 197906, "epoch": 1178} {"train_loss": -11.509777069091797, "global_step": 197907, "epoch": 1178} {"train_loss": -11.522542953491211, "global_step": 197908, "epoch": 1178} {"train_loss": -11.344016075134277, "global_step": 197909, "epoch": 1178} {"train_loss": -11.428058624267578, "global_step": 197910, "epoch": 1178} {"train_loss": -11.220541000366211, "global_step": 197911, "epoch": 1178} {"train_loss": -11.440357208251953, "global_step": 197912, "epoch": 1178} {"train_loss": -11.603506088256836, "global_step": 197913, "epoch": 1178} {"train_loss": -11.428054809570312, "global_step": 197914, "epoch": 1178} {"train_loss": -11.419051170349121, "global_step": 197915, "epoch": 1178} {"train_loss": -11.71114730834961, "global_step": 197916, "epoch": 1178} {"train_loss": -11.183489799499512, "global_step": 197917, "epoch": 1178} {"train_loss": -11.587615966796875, "global_step": 197918, "epoch": 1178} {"train_loss": -11.587020874023438, "global_step": 197919, "epoch": 1178} {"train_loss": -11.386826515197754, "global_step": 197920, "epoch": 1178} {"train_loss": -11.176986694335938, "global_step": 197921, "epoch": 1178} {"train_loss": -11.451748847961426, "global_step": 197922, "epoch": 1178} {"train_loss": -11.43760871887207, "global_step": 197923, "epoch": 1178} {"train_loss": -11.370616912841797, "global_step": 197924, "epoch": 1178} {"train_loss": -11.549819946289062, "global_step": 197925, "epoch": 1178} {"train_loss": -11.515060424804688, "global_step": 197926, "epoch": 1178} {"train_loss": -11.224550247192383, "global_step": 197927, "epoch": 1178} {"train_loss": -11.50851058959961, "global_step": 197928, "epoch": 1178} {"train_loss": -11.251049041748047, "global_step": 197929, "epoch": 1178} {"train_loss": -11.120626449584961, "global_step": 197930, "epoch": 1178} {"train_loss": -10.874543190002441, "global_step": 197931, "epoch": 1178} {"train_loss": -11.318036079406738, "global_step": 197932, "epoch": 1178} {"train_loss": -10.564640998840332, "global_step": 197933, "epoch": 1178} {"train_loss": -10.342869758605957, "global_step": 197934, "epoch": 1178} {"train_loss": -11.351563453674316, "global_step": 197935, "epoch": 1178} {"train_loss": -10.92772102355957, "global_step": 197936, "epoch": 1178} {"train_loss": -11.216636657714844, "global_step": 197937, "epoch": 1178} {"train_loss": -11.068017959594727, "global_step": 197938, "epoch": 1178} {"train_loss": -11.020137786865234, "global_step": 197939, "epoch": 1178} {"train_loss": -10.763525009155273, "global_step": 197940, "epoch": 1178} {"train_loss": -9.575037956237793, "global_step": 197941, "epoch": 1178} {"train_loss": -10.765824317932129, "global_step": 197942, "epoch": 1178} {"train_loss": -10.662445068359375, "global_step": 197943, "epoch": 1178} {"train_loss": -10.541460037231445, "global_step": 197944, "epoch": 1178} {"train_loss": -11.09523868560791, "global_step": 197945, "epoch": 1178} {"train_loss": -10.483359336853027, "global_step": 197946, "epoch": 1178} {"train_loss": -10.64584732055664, "global_step": 197947, "epoch": 1178} {"train_loss": -10.29545783996582, "global_step": 197948, "epoch": 1178} {"train_loss": -9.881294250488281, "global_step": 197949, "epoch": 1178} {"train_loss": -10.768720626831055, "global_step": 197950, "epoch": 1178} {"train_loss": -9.127580642700195, "global_step": 197951, "epoch": 1178} {"train_loss": -10.608728408813477, "global_step": 197952, "epoch": 1178} {"train_loss": -7.441680431365967, "global_step": 197953, "epoch": 1178} {"train_loss": -8.924564361572266, "global_step": 197954, "epoch": 1178} {"train_loss": -9.725729942321777, "global_step": 197955, "epoch": 1178} {"train_loss": -9.96399974822998, "global_step": 197956, "epoch": 1178} {"train_loss": -8.48478889465332, "global_step": 197957, "epoch": 1178} {"train_loss": -9.938322067260742, "global_step": 197958, "epoch": 1178} {"train_loss": -9.796409606933594, "global_step": 197959, "epoch": 1178} {"train_loss": -8.495809555053711, "global_step": 197960, "epoch": 1178} {"train_loss": -8.903644561767578, "global_step": 197961, "epoch": 1178} {"train_loss": -9.122072219848633, "global_step": 197962, "epoch": 1178} {"train_loss": -10.302824974060059, "global_step": 197963, "epoch": 1178} {"train_loss": -9.60843563079834, "global_step": 197964, "epoch": 1178} {"train_loss": -11.002294540405273, "global_step": 197965, "epoch": 1178} {"train_loss": -10.365689277648926, "global_step": 197966, "epoch": 1178} {"train_loss": -10.26737117767334, "global_step": 197967, "epoch": 1178} {"train_loss": -10.438760757446289, "global_step": 197968, "epoch": 1178} {"train_loss": -10.431997299194336, "global_step": 197969, "epoch": 1178} {"train_loss": -10.425949096679688, "global_step": 197970, "epoch": 1178} {"train_loss": -10.286476135253906, "global_step": 197971, "epoch": 1178} {"train_loss": -10.592752456665039, "global_step": 197972, "epoch": 1178} {"train_loss": -10.33340835571289, "global_step": 197973, "epoch": 1178} {"train_loss": -10.799087524414062, "global_step": 197974, "epoch": 1178} {"train_loss": -10.729999542236328, "global_step": 197975, "epoch": 1178} {"train_loss": -10.658951759338379, "global_step": 197976, "epoch": 1178} {"train_loss": -10.909976959228516, "global_step": 197977, "epoch": 1178} {"train_loss": -10.85717487335205, "global_step": 197978, "epoch": 1178} {"train_loss": -10.945049285888672, "global_step": 197979, "epoch": 1178} {"train_loss": -11.007434844970703, "global_step": 197980, "epoch": 1178} {"train_loss": -10.883769989013672, "global_step": 197981, "epoch": 1178} {"train_loss": -11.085196495056152, "global_step": 197982, "epoch": 1178} {"train_loss": -11.129603385925293, "global_step": 197983, "epoch": 1178} {"train_loss": -11.093679428100586, "global_step": 197984, "epoch": 1178} {"train_loss": -11.205671310424805, "global_step": 197985, "epoch": 1178} {"train_loss": -11.25218391418457, "global_step": 197986, "epoch": 1178} {"train_loss": -11.113658905029297, "global_step": 197987, "epoch": 1178} {"train_loss": -11.14596176147461, "global_step": 197988, "epoch": 1178} {"train_loss": -11.112717628479004, "global_step": 197989, "epoch": 1178} {"train_loss": -10.992173194885254, "global_step": 197990, "epoch": 1178} {"train_loss": -11.167774200439453, "global_step": 197991, "epoch": 1178} {"train_loss": -11.243879318237305, "global_step": 197992, "epoch": 1178} {"train_loss": -11.177895545959473, "global_step": 197993, "epoch": 1178} {"train_loss": -11.228536605834961, "global_step": 197994, "epoch": 1178} {"train_loss": -11.135095596313477, "global_step": 197995, "epoch": 1178} {"train_loss": -11.418493270874023, "global_step": 197996, "epoch": 1178} {"train_loss": -11.310396194458008, "global_step": 197997, "epoch": 1178} {"train_loss": -11.276802062988281, "global_step": 197998, "epoch": 1178} {"train_loss": -11.290824890136719, "global_step": 197999, "epoch": 1178} {"train_loss": -11.221113204956055, "global_step": 198000, "epoch": 1178} {"train_loss": -11.180747985839844, "global_step": 198001, "epoch": 1178} {"train_loss": -11.451387405395508, "global_step": 198002, "epoch": 1178} {"train_loss": -11.460978507995605, "global_step": 198003, "epoch": 1178} {"train_loss": -11.533914566040039, "global_step": 198004, "epoch": 1178} {"train_loss": -11.42674446105957, "global_step": 198005, "epoch": 1178} {"train_loss": -11.472274780273438, "global_step": 198006, "epoch": 1178} {"train_loss": -11.525995254516602, "global_step": 198007, "epoch": 1178} {"train_loss": -11.275888442993164, "global_step": 198008, "epoch": 1178} {"train_loss": -11.490236282348633, "global_step": 198009, "epoch": 1178} {"train_loss": -11.430288314819336, "global_step": 198010, "epoch": 1178} {"train_loss": -11.406654357910156, "global_step": 198011, "epoch": 1178} {"train_loss": -11.249382972717285, "global_step": 198012, "epoch": 1178} {"train_loss": -11.521592140197754, "global_step": 198013, "epoch": 1178} {"train_loss": -11.589740753173828, "global_step": 198014, "epoch": 1178} {"train_loss": -11.690266609191895, "global_step": 198015, "epoch": 1178} {"train_loss": -11.382293701171875, "global_step": 198016, "epoch": 1178} {"train_loss": -11.553460121154785, "global_step": 198017, "epoch": 1178} {"train_loss": -11.659833908081055, "global_step": 198018, "epoch": 1178} {"train_loss": -11.346765518188477, "global_step": 198019, "epoch": 1178} {"train_loss": -11.674886703491211, "global_step": 198020, "epoch": 1178} {"train_loss": -11.55063533782959, "global_step": 198021, "epoch": 1178} {"train_loss": -11.659618377685547, "global_step": 198022, "epoch": 1178} {"train_loss": -11.82619857788086, "global_step": 198023, "epoch": 1178} {"train_loss": -11.64178466796875, "global_step": 198024, "epoch": 1178} {"train_loss": -11.646227836608887, "global_step": 198025, "epoch": 1178} {"train_loss": -11.793182373046875, "global_step": 198026, "epoch": 1178} {"train_loss": -11.7440185546875, "global_step": 198027, "epoch": 1178} {"train_loss": -11.747416496276855, "global_step": 198028, "epoch": 1178} {"train_loss": -11.670856475830078, "global_step": 198029, "epoch": 1178} {"train_loss": -11.768322944641113, "global_step": 198030, "epoch": 1178} {"train_loss": -11.72247314453125, "global_step": 198031, "epoch": 1178} {"train_loss": -11.917091369628906, "global_step": 198032, "epoch": 1178} {"train_loss": -11.891255378723145, "global_step": 198033, "epoch": 1178} {"train_loss": -11.861392974853516, "global_step": 198034, "epoch": 1178} {"train_loss": -11.641225814819336, "global_step": 198035, "epoch": 1178} {"train_loss": -11.6251220703125, "global_step": 198036, "epoch": 1178} {"train_loss": -11.494561195373535, "global_step": 198037, "epoch": 1178} {"train_loss": -11.744651794433594, "global_step": 198038, "epoch": 1178} {"train_loss": -11.987313270568848, "global_step": 198039, "epoch": 1178} {"train_loss": -11.810667037963867, "global_step": 198040, "epoch": 1178} {"train_loss": -11.70345687866211, "global_step": 198041, "epoch": 1178} {"train_loss": -11.782442092895508, "global_step": 198042, "epoch": 1178} {"train_loss": -11.847960472106934, "global_step": 198043, "epoch": 1178} {"train_loss": -11.59813117980957, "global_step": 198044, "epoch": 1178} {"train_loss": -11.76436996459961, "global_step": 198045, "epoch": 1178} {"train_loss": -11.667327880859375, "global_step": 198046, "epoch": 1178} {"train_loss": -11.658581733703613, "global_step": 198047, "epoch": 1178} {"train_loss": -11.847001075744629, "global_step": 198048, "epoch": 1178} {"train_loss": -11.635833740234375, "global_step": 198049, "epoch": 1178} {"train_loss": -11.643710136413574, "global_step": 198050, "epoch": 1178} {"train_loss": -11.884904861450195, "global_step": 198051, "epoch": 1178} {"train_loss": -11.480425834655762, "global_step": 198052, "epoch": 1178} {"train_loss": -11.730670928955078, "global_step": 198053, "epoch": 1178} {"train_loss": -11.073347091674805, "global_step": 198054, "epoch": 1178} {"train_loss": -10.77000617980957, "global_step": 198055, "epoch": 1178} {"train_loss": -10.561543464660645, "global_step": 198056, "epoch": 1178} {"train_loss": -10.06495475769043, "global_step": 198057, "epoch": 1178} {"train_loss": -10.7080078125, "global_step": 198058, "epoch": 1178} {"train_loss": -9.158346176147461, "global_step": 198059, "epoch": 1178} {"train_loss": -8.04561710357666, "global_step": 198060, "epoch": 1178} {"train_loss": -9.024306297302246, "global_step": 198061, "epoch": 1178} {"train_loss": -7.775387287139893, "global_step": 198062, "epoch": 1178} {"train_loss": -9.946826934814453, "global_step": 198063, "epoch": 1178} {"train_loss": -9.009450912475586, "global_step": 198064, "epoch": 1178} {"train_loss": -9.209260940551758, "global_step": 198065, "epoch": 1178} {"train_loss": -9.797076225280762, "global_step": 198066, "epoch": 1178} {"train_loss": -8.78944206237793, "global_step": 198067, "epoch": 1178} {"train_loss": -9.668975830078125, "global_step": 198068, "epoch": 1178} {"train_loss": -10.247871398925781, "global_step": 198069, "epoch": 1178} {"train_loss": -9.509635925292969, "global_step": 198070, "epoch": 1178} {"train_loss": -10.930378034001304, "global_step": 198071, "epoch": 1178, "val_loss": 250678.484375} {"train_loss": -10.766294479370117, "global_step": 198072, "epoch": 1179} {"train_loss": -9.70650863647461, "global_step": 198073, "epoch": 1179} {"train_loss": -10.68844223022461, "global_step": 198074, "epoch": 1179} {"train_loss": -10.49118709564209, "global_step": 198075, "epoch": 1179} {"train_loss": -10.36715030670166, "global_step": 198076, "epoch": 1179} {"train_loss": -10.75782299041748, "global_step": 198077, "epoch": 1179} {"train_loss": -10.524515151977539, "global_step": 198078, "epoch": 1179} {"train_loss": -10.255962371826172, "global_step": 198079, "epoch": 1179} {"train_loss": -10.534168243408203, "global_step": 198080, "epoch": 1179} {"train_loss": -10.849800109863281, "global_step": 198081, "epoch": 1179} {"train_loss": -10.789643287658691, "global_step": 198082, "epoch": 1179} {"train_loss": -10.96861457824707, "global_step": 198083, "epoch": 1179} {"train_loss": -10.972134590148926, "global_step": 198084, "epoch": 1179} {"train_loss": -10.773876190185547, "global_step": 198085, "epoch": 1179} {"train_loss": -11.001262664794922, "global_step": 198086, "epoch": 1179} {"train_loss": -10.734421730041504, "global_step": 198087, "epoch": 1179} {"train_loss": -11.10784912109375, "global_step": 198088, "epoch": 1179} {"train_loss": -11.254762649536133, "global_step": 198089, "epoch": 1179} {"train_loss": -10.85978889465332, "global_step": 198090, "epoch": 1179} {"train_loss": -11.152214050292969, "global_step": 198091, "epoch": 1179} {"train_loss": -11.193822860717773, "global_step": 198092, "epoch": 1179} {"train_loss": -10.875916481018066, "global_step": 198093, "epoch": 1179} {"train_loss": -11.047351837158203, "global_step": 198094, "epoch": 1179} {"train_loss": -11.020902633666992, "global_step": 198095, "epoch": 1179} {"train_loss": -10.825494766235352, "global_step": 198096, "epoch": 1179} {"train_loss": -10.960636138916016, "global_step": 198097, "epoch": 1179} {"train_loss": -11.015193939208984, "global_step": 198098, "epoch": 1179} {"train_loss": -11.078230857849121, "global_step": 198099, "epoch": 1179} {"train_loss": -11.061502456665039, "global_step": 198100, "epoch": 1179} {"train_loss": -11.382627487182617, "global_step": 198101, "epoch": 1179} {"train_loss": -11.080791473388672, "global_step": 198102, "epoch": 1179} {"train_loss": -11.235380172729492, "global_step": 198103, "epoch": 1179} {"train_loss": -11.165952682495117, "global_step": 198104, "epoch": 1179} {"train_loss": -11.218090057373047, "global_step": 198105, "epoch": 1179} {"train_loss": -11.261863708496094, "global_step": 198106, "epoch": 1179} {"train_loss": -11.364603042602539, "global_step": 198107, "epoch": 1179} {"train_loss": -11.205886840820312, "global_step": 198108, "epoch": 1179} {"train_loss": -11.275903701782227, "global_step": 198109, "epoch": 1179} {"train_loss": -11.122976303100586, "global_step": 198110, "epoch": 1179} {"train_loss": -11.33041763305664, "global_step": 198111, "epoch": 1179} {"train_loss": -11.316118240356445, "global_step": 198112, "epoch": 1179} {"train_loss": -11.43360424041748, "global_step": 198113, "epoch": 1179} {"train_loss": -11.351251602172852, "global_step": 198114, "epoch": 1179} {"train_loss": -11.349857330322266, "global_step": 198115, "epoch": 1179} {"train_loss": -11.396018981933594, "global_step": 198116, "epoch": 1179} {"train_loss": -11.250120162963867, "global_step": 198117, "epoch": 1179} {"train_loss": -11.531173706054688, "global_step": 198118, "epoch": 1179} {"train_loss": -11.544557571411133, "global_step": 198119, "epoch": 1179} {"train_loss": -11.397643089294434, "global_step": 198120, "epoch": 1179} {"train_loss": -11.338812828063965, "global_step": 198121, "epoch": 1179} {"train_loss": -11.661518096923828, "global_step": 198122, "epoch": 1179} {"train_loss": -11.407417297363281, "global_step": 198123, "epoch": 1179} {"train_loss": -11.38565731048584, "global_step": 198124, "epoch": 1179} {"train_loss": -11.49575424194336, "global_step": 198125, "epoch": 1179} {"train_loss": -11.502141952514648, "global_step": 198126, "epoch": 1179} {"train_loss": -11.524702072143555, "global_step": 198127, "epoch": 1179} {"train_loss": -11.673298835754395, "global_step": 198128, "epoch": 1179} {"train_loss": -11.494131088256836, "global_step": 198129, "epoch": 1179} {"train_loss": -11.585216522216797, "global_step": 198130, "epoch": 1179} {"train_loss": -11.571540832519531, "global_step": 198131, "epoch": 1179} {"train_loss": -11.467140197753906, "global_step": 198132, "epoch": 1179} {"train_loss": -11.619988441467285, "global_step": 198133, "epoch": 1179} {"train_loss": -11.467042922973633, "global_step": 198134, "epoch": 1179} {"train_loss": -11.578272819519043, "global_step": 198135, "epoch": 1179} {"train_loss": -11.759979248046875, "global_step": 198136, "epoch": 1179} {"train_loss": -11.667524337768555, "global_step": 198137, "epoch": 1179} {"train_loss": -11.6249361038208, "global_step": 198138, "epoch": 1179} {"train_loss": -11.775519371032715, "global_step": 198139, "epoch": 1179} {"train_loss": -11.66289234161377, "global_step": 198140, "epoch": 1179} {"train_loss": -11.53738784790039, "global_step": 198141, "epoch": 1179} {"train_loss": -11.584331512451172, "global_step": 198142, "epoch": 1179} {"train_loss": -11.740554809570312, "global_step": 198143, "epoch": 1179} {"train_loss": -11.511625289916992, "global_step": 198144, "epoch": 1179} {"train_loss": -11.48045539855957, "global_step": 198145, "epoch": 1179} {"train_loss": -11.24688720703125, "global_step": 198146, "epoch": 1179} {"train_loss": -11.281314849853516, "global_step": 198147, "epoch": 1179} {"train_loss": -11.564386367797852, "global_step": 198148, "epoch": 1179} {"train_loss": -11.28774642944336, "global_step": 198149, "epoch": 1179} {"train_loss": -11.899909973144531, "global_step": 198150, "epoch": 1179} {"train_loss": -11.56435775756836, "global_step": 198151, "epoch": 1179} {"train_loss": -11.850099563598633, "global_step": 198152, "epoch": 1179} {"train_loss": -11.430293083190918, "global_step": 198153, "epoch": 1179} {"train_loss": -11.85509204864502, "global_step": 198154, "epoch": 1179} {"train_loss": -11.808867454528809, "global_step": 198155, "epoch": 1179} {"train_loss": -11.744043350219727, "global_step": 198156, "epoch": 1179} {"train_loss": -11.110736846923828, "global_step": 198157, "epoch": 1179} {"train_loss": -11.348936080932617, "global_step": 198158, "epoch": 1179} {"train_loss": -11.684854507446289, "global_step": 198159, "epoch": 1179} {"train_loss": -11.18266487121582, "global_step": 198160, "epoch": 1179} {"train_loss": -11.576128959655762, "global_step": 198161, "epoch": 1179} {"train_loss": -11.624761581420898, "global_step": 198162, "epoch": 1179} {"train_loss": -11.684253692626953, "global_step": 198163, "epoch": 1179} {"train_loss": -11.838322639465332, "global_step": 198164, "epoch": 1179} {"train_loss": -11.378938674926758, "global_step": 198165, "epoch": 1179} {"train_loss": -11.502187728881836, "global_step": 198166, "epoch": 1179} {"train_loss": -11.64279556274414, "global_step": 198167, "epoch": 1179} {"train_loss": -11.682364463806152, "global_step": 198168, "epoch": 1179} {"train_loss": -11.645879745483398, "global_step": 198169, "epoch": 1179} {"train_loss": -11.64073657989502, "global_step": 198170, "epoch": 1179} {"train_loss": -11.529138565063477, "global_step": 198171, "epoch": 1179} {"train_loss": -11.296016693115234, "global_step": 198172, "epoch": 1179} {"train_loss": -11.404420852661133, "global_step": 198173, "epoch": 1179} {"train_loss": -11.568138122558594, "global_step": 198174, "epoch": 1179} {"train_loss": -10.859321594238281, "global_step": 198175, "epoch": 1179} {"train_loss": -10.471774101257324, "global_step": 198176, "epoch": 1179} {"train_loss": -10.464685440063477, "global_step": 198177, "epoch": 1179} {"train_loss": -10.932665824890137, "global_step": 198178, "epoch": 1179} {"train_loss": -10.468914031982422, "global_step": 198179, "epoch": 1179} {"train_loss": -10.612034797668457, "global_step": 198180, "epoch": 1179} {"train_loss": -10.643841743469238, "global_step": 198181, "epoch": 1179} {"train_loss": -7.372736930847168, "global_step": 198182, "epoch": 1179} {"train_loss": -6.87812614440918, "global_step": 198183, "epoch": 1179} {"train_loss": -8.28363037109375, "global_step": 198184, "epoch": 1179} {"train_loss": -9.827856063842773, "global_step": 198185, "epoch": 1179} {"train_loss": -8.463974952697754, "global_step": 198186, "epoch": 1179} {"train_loss": -7.296204566955566, "global_step": 198187, "epoch": 1179} {"train_loss": -7.620820045471191, "global_step": 198188, "epoch": 1179} {"train_loss": -8.038812637329102, "global_step": 198189, "epoch": 1179} {"train_loss": -7.697256565093994, "global_step": 198190, "epoch": 1179} {"train_loss": -7.747469425201416, "global_step": 198191, "epoch": 1179} {"train_loss": -7.744406223297119, "global_step": 198192, "epoch": 1179} {"train_loss": -8.509928703308105, "global_step": 198193, "epoch": 1179} {"train_loss": -8.688071250915527, "global_step": 198194, "epoch": 1179} {"train_loss": -9.156717300415039, "global_step": 198195, "epoch": 1179} {"train_loss": -10.298104286193848, "global_step": 198196, "epoch": 1179} {"train_loss": -10.406543731689453, "global_step": 198197, "epoch": 1179} {"train_loss": -10.441280364990234, "global_step": 198198, "epoch": 1179} {"train_loss": -10.258337020874023, "global_step": 198199, "epoch": 1179} {"train_loss": -10.332626342773438, "global_step": 198200, "epoch": 1179} {"train_loss": -10.060176849365234, "global_step": 198201, "epoch": 1179} {"train_loss": -9.79847240447998, "global_step": 198202, "epoch": 1179} {"train_loss": -10.361329078674316, "global_step": 198203, "epoch": 1179} {"train_loss": -9.963661193847656, "global_step": 198204, "epoch": 1179} {"train_loss": -9.582204818725586, "global_step": 198205, "epoch": 1179} {"train_loss": -10.3746976852417, "global_step": 198206, "epoch": 1179} {"train_loss": -10.577834129333496, "global_step": 198207, "epoch": 1179} {"train_loss": -9.749213218688965, "global_step": 198208, "epoch": 1179} {"train_loss": -10.786298751831055, "global_step": 198209, "epoch": 1179} {"train_loss": -10.892001152038574, "global_step": 198210, "epoch": 1179} {"train_loss": -10.393641471862793, "global_step": 198211, "epoch": 1179} {"train_loss": -10.383208274841309, "global_step": 198212, "epoch": 1179} {"train_loss": -10.731391906738281, "global_step": 198213, "epoch": 1179} {"train_loss": -10.96225357055664, "global_step": 198214, "epoch": 1179} {"train_loss": -10.68454647064209, "global_step": 198215, "epoch": 1179} {"train_loss": -10.948836326599121, "global_step": 198216, "epoch": 1179} {"train_loss": -11.027070999145508, "global_step": 198217, "epoch": 1179} {"train_loss": -10.767827987670898, "global_step": 198218, "epoch": 1179} {"train_loss": -10.874849319458008, "global_step": 198219, "epoch": 1179} {"train_loss": -11.087149620056152, "global_step": 198220, "epoch": 1179} {"train_loss": -10.826441764831543, "global_step": 198221, "epoch": 1179} {"train_loss": -11.061532974243164, "global_step": 198222, "epoch": 1179} {"train_loss": -11.034200668334961, "global_step": 198223, "epoch": 1179} {"train_loss": -11.061370849609375, "global_step": 198224, "epoch": 1179} {"train_loss": -11.235755920410156, "global_step": 198225, "epoch": 1179} {"train_loss": -11.077215194702148, "global_step": 198226, "epoch": 1179} {"train_loss": -11.0466890335083, "global_step": 198227, "epoch": 1179} {"train_loss": -11.153491973876953, "global_step": 198228, "epoch": 1179} {"train_loss": -11.141571044921875, "global_step": 198229, "epoch": 1179} {"train_loss": -11.160806655883789, "global_step": 198230, "epoch": 1179} {"train_loss": -11.114278793334961, "global_step": 198231, "epoch": 1179} {"train_loss": -11.118303298950195, "global_step": 198232, "epoch": 1179} {"train_loss": -11.194108009338379, "global_step": 198233, "epoch": 1179} {"train_loss": -11.109173774719238, "global_step": 198234, "epoch": 1179} {"train_loss": -11.270209312438965, "global_step": 198235, "epoch": 1179} {"train_loss": -11.233780860900879, "global_step": 198236, "epoch": 1179} {"train_loss": -11.365360260009766, "global_step": 198237, "epoch": 1179} {"train_loss": -11.205953598022461, "global_step": 198238, "epoch": 1179} {"train_loss": -10.86248383919398, "global_step": 198239, "epoch": 1179, "val_loss": 237123.96875} {"train_loss": -11.2562894821167, "global_step": 198240, "epoch": 1180} {"train_loss": -11.14887809753418, "global_step": 198241, "epoch": 1180} {"train_loss": -11.37220573425293, "global_step": 198242, "epoch": 1180} {"train_loss": -11.365074157714844, "global_step": 198243, "epoch": 1180} {"train_loss": -11.217151641845703, "global_step": 198244, "epoch": 1180} {"train_loss": -11.36920166015625, "global_step": 198245, "epoch": 1180} {"train_loss": -11.475817680358887, "global_step": 198246, "epoch": 1180} {"train_loss": -11.493297576904297, "global_step": 198247, "epoch": 1180} {"train_loss": -11.259262084960938, "global_step": 198248, "epoch": 1180} {"train_loss": -11.471977233886719, "global_step": 198249, "epoch": 1180} {"train_loss": -11.368093490600586, "global_step": 198250, "epoch": 1180} {"train_loss": -11.320267677307129, "global_step": 198251, "epoch": 1180} {"train_loss": -11.378095626831055, "global_step": 198252, "epoch": 1180} {"train_loss": -11.695123672485352, "global_step": 198253, "epoch": 1180} {"train_loss": -11.454048156738281, "global_step": 198254, "epoch": 1180} {"train_loss": -11.27843189239502, "global_step": 198255, "epoch": 1180} {"train_loss": -11.713576316833496, "global_step": 198256, "epoch": 1180} {"train_loss": -11.509431838989258, "global_step": 198257, "epoch": 1180} {"train_loss": -11.549087524414062, "global_step": 198258, "epoch": 1180} {"train_loss": -11.716314315795898, "global_step": 198259, "epoch": 1180} {"train_loss": -11.681766510009766, "global_step": 198260, "epoch": 1180} {"train_loss": -11.464556694030762, "global_step": 198261, "epoch": 1180} {"train_loss": -11.45205020904541, "global_step": 198262, "epoch": 1180} {"train_loss": -11.594082832336426, "global_step": 198263, "epoch": 1180} {"train_loss": -10.689255714416504, "global_step": 198264, "epoch": 1180} {"train_loss": -10.889369010925293, "global_step": 198265, "epoch": 1180} {"train_loss": -11.78958797454834, "global_step": 198266, "epoch": 1180} {"train_loss": -10.967238426208496, "global_step": 198267, "epoch": 1180} {"train_loss": -10.857760429382324, "global_step": 198268, "epoch": 1180} {"train_loss": -11.332822799682617, "global_step": 198269, "epoch": 1180} {"train_loss": -11.57679271697998, "global_step": 198270, "epoch": 1180} {"train_loss": -11.192764282226562, "global_step": 198271, "epoch": 1180} {"train_loss": -11.07626724243164, "global_step": 198272, "epoch": 1180} {"train_loss": -11.369304656982422, "global_step": 198273, "epoch": 1180} {"train_loss": -11.390439987182617, "global_step": 198274, "epoch": 1180} {"train_loss": -11.276777267456055, "global_step": 198275, "epoch": 1180} {"train_loss": -11.420726776123047, "global_step": 198276, "epoch": 1180} {"train_loss": -10.501245498657227, "global_step": 198277, "epoch": 1180} {"train_loss": -10.512468338012695, "global_step": 198278, "epoch": 1180} {"train_loss": -10.392913818359375, "global_step": 198279, "epoch": 1180} {"train_loss": -11.679851531982422, "global_step": 198280, "epoch": 1180} {"train_loss": -10.296407699584961, "global_step": 198281, "epoch": 1180} {"train_loss": -10.346158981323242, "global_step": 198282, "epoch": 1180} {"train_loss": -11.211788177490234, "global_step": 198283, "epoch": 1180} {"train_loss": -10.520112991333008, "global_step": 198284, "epoch": 1180} {"train_loss": -10.683263778686523, "global_step": 198285, "epoch": 1180} {"train_loss": -11.397302627563477, "global_step": 198286, "epoch": 1180} {"train_loss": -10.986587524414062, "global_step": 198287, "epoch": 1180} {"train_loss": -10.93739128112793, "global_step": 198288, "epoch": 1180} {"train_loss": -11.235528945922852, "global_step": 198289, "epoch": 1180} {"train_loss": -10.818727493286133, "global_step": 198290, "epoch": 1180} {"train_loss": -11.434466361999512, "global_step": 198291, "epoch": 1180} {"train_loss": -11.289531707763672, "global_step": 198292, "epoch": 1180} {"train_loss": -11.464550018310547, "global_step": 198293, "epoch": 1180} {"train_loss": -11.136771202087402, "global_step": 198294, "epoch": 1180} {"train_loss": -11.33211898803711, "global_step": 198295, "epoch": 1180} {"train_loss": -11.268112182617188, "global_step": 198296, "epoch": 1180} {"train_loss": -11.179974555969238, "global_step": 198297, "epoch": 1180} {"train_loss": -11.282340049743652, "global_step": 198298, "epoch": 1180} {"train_loss": -11.019952774047852, "global_step": 198299, "epoch": 1180} {"train_loss": -11.076986312866211, "global_step": 198300, "epoch": 1180} {"train_loss": -11.027965545654297, "global_step": 198301, "epoch": 1180} {"train_loss": -10.643891334533691, "global_step": 198302, "epoch": 1180} {"train_loss": -11.419876098632812, "global_step": 198303, "epoch": 1180} {"train_loss": -11.314627647399902, "global_step": 198304, "epoch": 1180} {"train_loss": -11.143519401550293, "global_step": 198305, "epoch": 1180} {"train_loss": -11.264547348022461, "global_step": 198306, "epoch": 1180} {"train_loss": -11.33449649810791, "global_step": 198307, "epoch": 1180} {"train_loss": -11.205549240112305, "global_step": 198308, "epoch": 1180} {"train_loss": -10.996818542480469, "global_step": 198309, "epoch": 1180} {"train_loss": -11.459718704223633, "global_step": 198310, "epoch": 1180} {"train_loss": -11.052457809448242, "global_step": 198311, "epoch": 1180} {"train_loss": -11.457212448120117, "global_step": 198312, "epoch": 1180} {"train_loss": -11.14539909362793, "global_step": 198313, "epoch": 1180} {"train_loss": -11.159435272216797, "global_step": 198314, "epoch": 1180} {"train_loss": -11.591180801391602, "global_step": 198315, "epoch": 1180} {"train_loss": -11.469290733337402, "global_step": 198316, "epoch": 1180} {"train_loss": -11.439606666564941, "global_step": 198317, "epoch": 1180} {"train_loss": -11.243165969848633, "global_step": 198318, "epoch": 1180} {"train_loss": -11.207646369934082, "global_step": 198319, "epoch": 1180} {"train_loss": -11.411422729492188, "global_step": 198320, "epoch": 1180} {"train_loss": -11.246614456176758, "global_step": 198321, "epoch": 1180} {"train_loss": -10.947237014770508, "global_step": 198322, "epoch": 1180} {"train_loss": -11.41923713684082, "global_step": 198323, "epoch": 1180} {"train_loss": -11.285514831542969, "global_step": 198324, "epoch": 1180} {"train_loss": -10.594045639038086, "global_step": 198325, "epoch": 1180} {"train_loss": -11.172016143798828, "global_step": 198326, "epoch": 1180} {"train_loss": -11.092198371887207, "global_step": 198327, "epoch": 1180} {"train_loss": -10.121532440185547, "global_step": 198328, "epoch": 1180} {"train_loss": -11.474748611450195, "global_step": 198329, "epoch": 1180} {"train_loss": -10.59521484375, "global_step": 198330, "epoch": 1180} {"train_loss": -11.274213790893555, "global_step": 198331, "epoch": 1180} {"train_loss": -10.668169975280762, "global_step": 198332, "epoch": 1180} {"train_loss": -11.044316291809082, "global_step": 198333, "epoch": 1180} {"train_loss": -11.552694320678711, "global_step": 198334, "epoch": 1180} {"train_loss": -10.575836181640625, "global_step": 198335, "epoch": 1180} {"train_loss": -11.742440223693848, "global_step": 198336, "epoch": 1180} {"train_loss": -10.870424270629883, "global_step": 198337, "epoch": 1180} {"train_loss": -11.048798561096191, "global_step": 198338, "epoch": 1180} {"train_loss": -11.46325397491455, "global_step": 198339, "epoch": 1180} {"train_loss": -10.520536422729492, "global_step": 198340, "epoch": 1180} {"train_loss": -11.385969161987305, "global_step": 198341, "epoch": 1180} {"train_loss": -10.762674331665039, "global_step": 198342, "epoch": 1180} {"train_loss": -11.184598922729492, "global_step": 198343, "epoch": 1180} {"train_loss": -11.214494705200195, "global_step": 198344, "epoch": 1180} {"train_loss": -11.481572151184082, "global_step": 198345, "epoch": 1180} {"train_loss": -10.909717559814453, "global_step": 198346, "epoch": 1180} {"train_loss": -11.328058242797852, "global_step": 198347, "epoch": 1180} {"train_loss": -11.251306533813477, "global_step": 198348, "epoch": 1180} {"train_loss": -11.139596939086914, "global_step": 198349, "epoch": 1180} {"train_loss": -11.276567459106445, "global_step": 198350, "epoch": 1180} {"train_loss": -11.044387817382812, "global_step": 198351, "epoch": 1180} {"train_loss": -11.332662582397461, "global_step": 198352, "epoch": 1180} {"train_loss": -11.11468505859375, "global_step": 198353, "epoch": 1180} {"train_loss": -11.635063171386719, "global_step": 198354, "epoch": 1180} {"train_loss": -11.331212043762207, "global_step": 198355, "epoch": 1180} {"train_loss": -11.228649139404297, "global_step": 198356, "epoch": 1180} {"train_loss": -11.264016151428223, "global_step": 198357, "epoch": 1180} {"train_loss": -11.205150604248047, "global_step": 198358, "epoch": 1180} {"train_loss": -10.924565315246582, "global_step": 198359, "epoch": 1180} {"train_loss": -11.416223526000977, "global_step": 198360, "epoch": 1180} {"train_loss": -10.96536636352539, "global_step": 198361, "epoch": 1180} {"train_loss": -11.097757339477539, "global_step": 198362, "epoch": 1180} {"train_loss": -11.25471305847168, "global_step": 198363, "epoch": 1180} {"train_loss": -11.28839111328125, "global_step": 198364, "epoch": 1180} {"train_loss": -11.155953407287598, "global_step": 198365, "epoch": 1180} {"train_loss": -11.319464683532715, "global_step": 198366, "epoch": 1180} {"train_loss": -11.40687084197998, "global_step": 198367, "epoch": 1180} {"train_loss": -11.634851455688477, "global_step": 198368, "epoch": 1180} {"train_loss": -11.390022277832031, "global_step": 198369, "epoch": 1180} {"train_loss": -11.48338508605957, "global_step": 198370, "epoch": 1180} {"train_loss": -11.51866340637207, "global_step": 198371, "epoch": 1180} {"train_loss": -11.674318313598633, "global_step": 198372, "epoch": 1180} {"train_loss": -11.41508674621582, "global_step": 198373, "epoch": 1180} {"train_loss": -11.280068397521973, "global_step": 198374, "epoch": 1180} {"train_loss": -11.202913284301758, "global_step": 198375, "epoch": 1180} {"train_loss": -11.127513885498047, "global_step": 198376, "epoch": 1180} {"train_loss": -11.1840181350708, "global_step": 198377, "epoch": 1180} {"train_loss": -10.13672924041748, "global_step": 198378, "epoch": 1180} {"train_loss": -11.590872764587402, "global_step": 198379, "epoch": 1180} {"train_loss": -10.803093910217285, "global_step": 198380, "epoch": 1180} {"train_loss": -11.01099681854248, "global_step": 198381, "epoch": 1180} {"train_loss": -11.170294761657715, "global_step": 198382, "epoch": 1180} {"train_loss": -10.574475288391113, "global_step": 198383, "epoch": 1180} {"train_loss": -11.360828399658203, "global_step": 198384, "epoch": 1180} {"train_loss": -10.427790641784668, "global_step": 198385, "epoch": 1180} {"train_loss": -11.321171760559082, "global_step": 198386, "epoch": 1180} {"train_loss": -10.74032211303711, "global_step": 198387, "epoch": 1180} {"train_loss": -10.775306701660156, "global_step": 198388, "epoch": 1180} {"train_loss": -10.932561874389648, "global_step": 198389, "epoch": 1180} {"train_loss": -10.708515167236328, "global_step": 198390, "epoch": 1180} {"train_loss": -10.441062927246094, "global_step": 198391, "epoch": 1180} {"train_loss": -10.176962852478027, "global_step": 198392, "epoch": 1180} {"train_loss": -10.975290298461914, "global_step": 198393, "epoch": 1180} {"train_loss": -10.895358085632324, "global_step": 198394, "epoch": 1180} {"train_loss": -10.800731658935547, "global_step": 198395, "epoch": 1180} {"train_loss": -10.806280136108398, "global_step": 198396, "epoch": 1180} {"train_loss": -10.877687454223633, "global_step": 198397, "epoch": 1180} {"train_loss": -11.130905151367188, "global_step": 198398, "epoch": 1180} {"train_loss": -11.271564483642578, "global_step": 198399, "epoch": 1180} {"train_loss": -11.074480056762695, "global_step": 198400, "epoch": 1180} {"train_loss": -11.453227043151855, "global_step": 198401, "epoch": 1180} {"train_loss": -11.051273345947266, "global_step": 198402, "epoch": 1180} {"train_loss": -11.263435363769531, "global_step": 198403, "epoch": 1180} {"train_loss": -11.151296615600586, "global_step": 198404, "epoch": 1180} {"train_loss": -11.459808349609375, "global_step": 198405, "epoch": 1180} {"train_loss": -11.065832138061523, "global_step": 198406, "epoch": 1180} {"train_loss": -11.165991005443392, "global_step": 198407, "epoch": 1180, "val_loss": 239922.921875, "train_action_mse_error": 2.427210807800293} {"train_loss": -10.941699981689453, "global_step": 198408, "epoch": 1181} {"train_loss": -11.152322769165039, "global_step": 198409, "epoch": 1181} {"train_loss": -11.423819541931152, "global_step": 198410, "epoch": 1181} {"train_loss": -11.181947708129883, "global_step": 198411, "epoch": 1181} {"train_loss": -11.554585456848145, "global_step": 198412, "epoch": 1181} {"train_loss": -11.279747009277344, "global_step": 198413, "epoch": 1181} {"train_loss": -11.583412170410156, "global_step": 198414, "epoch": 1181} {"train_loss": -11.040348052978516, "global_step": 198415, "epoch": 1181} {"train_loss": -11.611024856567383, "global_step": 198416, "epoch": 1181} {"train_loss": -11.211525917053223, "global_step": 198417, "epoch": 1181} {"train_loss": -11.390584945678711, "global_step": 198418, "epoch": 1181} {"train_loss": -11.221603393554688, "global_step": 198419, "epoch": 1181} {"train_loss": -11.23729133605957, "global_step": 198420, "epoch": 1181} {"train_loss": -11.35926628112793, "global_step": 198421, "epoch": 1181} {"train_loss": -11.285985946655273, "global_step": 198422, "epoch": 1181} {"train_loss": -11.469043731689453, "global_step": 198423, "epoch": 1181} {"train_loss": -11.540102005004883, "global_step": 198424, "epoch": 1181} {"train_loss": -11.429524421691895, "global_step": 198425, "epoch": 1181} {"train_loss": -11.58020305633545, "global_step": 198426, "epoch": 1181} {"train_loss": -11.442211151123047, "global_step": 198427, "epoch": 1181} {"train_loss": -11.44337272644043, "global_step": 198428, "epoch": 1181} {"train_loss": -11.336389541625977, "global_step": 198429, "epoch": 1181} {"train_loss": -11.54734992980957, "global_step": 198430, "epoch": 1181} {"train_loss": -11.393064498901367, "global_step": 198431, "epoch": 1181} {"train_loss": -11.653177261352539, "global_step": 198432, "epoch": 1181} {"train_loss": -11.558880805969238, "global_step": 198433, "epoch": 1181} {"train_loss": -11.532377243041992, "global_step": 198434, "epoch": 1181} {"train_loss": -11.397255897521973, "global_step": 198435, "epoch": 1181} {"train_loss": -11.481155395507812, "global_step": 198436, "epoch": 1181} {"train_loss": -11.631586074829102, "global_step": 198437, "epoch": 1181} {"train_loss": -11.254598617553711, "global_step": 198438, "epoch": 1181} {"train_loss": -11.373248100280762, "global_step": 198439, "epoch": 1181} {"train_loss": -11.443708419799805, "global_step": 198440, "epoch": 1181} {"train_loss": -11.186185836791992, "global_step": 198441, "epoch": 1181} {"train_loss": -11.465503692626953, "global_step": 198442, "epoch": 1181} {"train_loss": -10.91024112701416, "global_step": 198443, "epoch": 1181} {"train_loss": -10.94573974609375, "global_step": 198444, "epoch": 1181} {"train_loss": -11.40057373046875, "global_step": 198445, "epoch": 1181} {"train_loss": -11.381657600402832, "global_step": 198446, "epoch": 1181} {"train_loss": -11.225048065185547, "global_step": 198447, "epoch": 1181} {"train_loss": -10.943216323852539, "global_step": 198448, "epoch": 1181} {"train_loss": -11.106328964233398, "global_step": 198449, "epoch": 1181} {"train_loss": -11.455909729003906, "global_step": 198450, "epoch": 1181} {"train_loss": -10.826122283935547, "global_step": 198451, "epoch": 1181} {"train_loss": -11.342523574829102, "global_step": 198452, "epoch": 1181} {"train_loss": -11.469051361083984, "global_step": 198453, "epoch": 1181} {"train_loss": -10.929628372192383, "global_step": 198454, "epoch": 1181} {"train_loss": -11.19883918762207, "global_step": 198455, "epoch": 1181} {"train_loss": -10.926979064941406, "global_step": 198456, "epoch": 1181} {"train_loss": -11.145057678222656, "global_step": 198457, "epoch": 1181} {"train_loss": -10.407279014587402, "global_step": 198458, "epoch": 1181} {"train_loss": -10.51405143737793, "global_step": 198459, "epoch": 1181} {"train_loss": -10.171984672546387, "global_step": 198460, "epoch": 1181} {"train_loss": -9.400479316711426, "global_step": 198461, "epoch": 1181} {"train_loss": -11.200141906738281, "global_step": 198462, "epoch": 1181} {"train_loss": -9.61387825012207, "global_step": 198463, "epoch": 1181} {"train_loss": -10.27508544921875, "global_step": 198464, "epoch": 1181} {"train_loss": -10.667227745056152, "global_step": 198465, "epoch": 1181} {"train_loss": -9.471357345581055, "global_step": 198466, "epoch": 1181} {"train_loss": -10.54008674621582, "global_step": 198467, "epoch": 1181} {"train_loss": -10.662832260131836, "global_step": 198468, "epoch": 1181} {"train_loss": -10.647478103637695, "global_step": 198469, "epoch": 1181} {"train_loss": -10.796380043029785, "global_step": 198470, "epoch": 1181} {"train_loss": -10.842998504638672, "global_step": 198471, "epoch": 1181} {"train_loss": -11.056742668151855, "global_step": 198472, "epoch": 1181} {"train_loss": -11.133634567260742, "global_step": 198473, "epoch": 1181} {"train_loss": -10.835553169250488, "global_step": 198474, "epoch": 1181} {"train_loss": -10.634720802307129, "global_step": 198475, "epoch": 1181} {"train_loss": -10.49472713470459, "global_step": 198476, "epoch": 1181} {"train_loss": -10.76169204711914, "global_step": 198477, "epoch": 1181} {"train_loss": -10.682214736938477, "global_step": 198478, "epoch": 1181} {"train_loss": -11.063692092895508, "global_step": 198479, "epoch": 1181} {"train_loss": -10.472383499145508, "global_step": 198480, "epoch": 1181} {"train_loss": -11.150954246520996, "global_step": 198481, "epoch": 1181} {"train_loss": -10.866280555725098, "global_step": 198482, "epoch": 1181} {"train_loss": -11.040821075439453, "global_step": 198483, "epoch": 1181} {"train_loss": -10.881488800048828, "global_step": 198484, "epoch": 1181} {"train_loss": -11.095666885375977, "global_step": 198485, "epoch": 1181} {"train_loss": -10.714693069458008, "global_step": 198486, "epoch": 1181} {"train_loss": -11.042734146118164, "global_step": 198487, "epoch": 1181} {"train_loss": -10.606589317321777, "global_step": 198488, "epoch": 1181} {"train_loss": -11.153752326965332, "global_step": 198489, "epoch": 1181} {"train_loss": -11.083511352539062, "global_step": 198490, "epoch": 1181} {"train_loss": -11.076858520507812, "global_step": 198491, "epoch": 1181} {"train_loss": -10.68850326538086, "global_step": 198492, "epoch": 1181} {"train_loss": -11.331643104553223, "global_step": 198493, "epoch": 1181} {"train_loss": -10.813547134399414, "global_step": 198494, "epoch": 1181} {"train_loss": -11.385848999023438, "global_step": 198495, "epoch": 1181} {"train_loss": -10.989701271057129, "global_step": 198496, "epoch": 1181} {"train_loss": -11.271347045898438, "global_step": 198497, "epoch": 1181} {"train_loss": -11.220932006835938, "global_step": 198498, "epoch": 1181} {"train_loss": -11.094985961914062, "global_step": 198499, "epoch": 1181} {"train_loss": -11.091826438903809, "global_step": 198500, "epoch": 1181} {"train_loss": -11.345402717590332, "global_step": 198501, "epoch": 1181} {"train_loss": -11.255212783813477, "global_step": 198502, "epoch": 1181} {"train_loss": -11.129016876220703, "global_step": 198503, "epoch": 1181} {"train_loss": -11.463546752929688, "global_step": 198504, "epoch": 1181} {"train_loss": -11.059176445007324, "global_step": 198505, "epoch": 1181} {"train_loss": -11.365497589111328, "global_step": 198506, "epoch": 1181} {"train_loss": -11.352058410644531, "global_step": 198507, "epoch": 1181} {"train_loss": -11.51007080078125, "global_step": 198508, "epoch": 1181} {"train_loss": -11.44327163696289, "global_step": 198509, "epoch": 1181} {"train_loss": -11.476019859313965, "global_step": 198510, "epoch": 1181} {"train_loss": -11.642675399780273, "global_step": 198511, "epoch": 1181} {"train_loss": -11.219043731689453, "global_step": 198512, "epoch": 1181} {"train_loss": -11.46013069152832, "global_step": 198513, "epoch": 1181} {"train_loss": -11.59223747253418, "global_step": 198514, "epoch": 1181} {"train_loss": -11.561487197875977, "global_step": 198515, "epoch": 1181} {"train_loss": -11.530595779418945, "global_step": 198516, "epoch": 1181} {"train_loss": -11.654335975646973, "global_step": 198517, "epoch": 1181} {"train_loss": -11.533031463623047, "global_step": 198518, "epoch": 1181} {"train_loss": -11.567522048950195, "global_step": 198519, "epoch": 1181} {"train_loss": -11.62905502319336, "global_step": 198520, "epoch": 1181} {"train_loss": -11.579202651977539, "global_step": 198521, "epoch": 1181} {"train_loss": -11.541807174682617, "global_step": 198522, "epoch": 1181} {"train_loss": -11.409130096435547, "global_step": 198523, "epoch": 1181} {"train_loss": -11.746200561523438, "global_step": 198524, "epoch": 1181} {"train_loss": -11.37448787689209, "global_step": 198525, "epoch": 1181} {"train_loss": -11.46056079864502, "global_step": 198526, "epoch": 1181} {"train_loss": -11.230720520019531, "global_step": 198527, "epoch": 1181} {"train_loss": -11.686853408813477, "global_step": 198528, "epoch": 1181} {"train_loss": -11.019170761108398, "global_step": 198529, "epoch": 1181} {"train_loss": -11.658533096313477, "global_step": 198530, "epoch": 1181} {"train_loss": -11.51038646697998, "global_step": 198531, "epoch": 1181} {"train_loss": -11.617505073547363, "global_step": 198532, "epoch": 1181} {"train_loss": -11.592012405395508, "global_step": 198533, "epoch": 1181} {"train_loss": -11.729131698608398, "global_step": 198534, "epoch": 1181} {"train_loss": -11.415445327758789, "global_step": 198535, "epoch": 1181} {"train_loss": -11.686025619506836, "global_step": 198536, "epoch": 1181} {"train_loss": -11.701970100402832, "global_step": 198537, "epoch": 1181} {"train_loss": -11.558595657348633, "global_step": 198538, "epoch": 1181} {"train_loss": -11.833406448364258, "global_step": 198539, "epoch": 1181} {"train_loss": -11.338544845581055, "global_step": 198540, "epoch": 1181} {"train_loss": -11.341100692749023, "global_step": 198541, "epoch": 1181} {"train_loss": -11.62765884399414, "global_step": 198542, "epoch": 1181} {"train_loss": -11.569355010986328, "global_step": 198543, "epoch": 1181} {"train_loss": -11.597410202026367, "global_step": 198544, "epoch": 1181} {"train_loss": -11.594837188720703, "global_step": 198545, "epoch": 1181} {"train_loss": -11.337898254394531, "global_step": 198546, "epoch": 1181} {"train_loss": -11.578153610229492, "global_step": 198547, "epoch": 1181} {"train_loss": -11.523916244506836, "global_step": 198548, "epoch": 1181} {"train_loss": -11.710599899291992, "global_step": 198549, "epoch": 1181} {"train_loss": -11.730066299438477, "global_step": 198550, "epoch": 1181} {"train_loss": -11.512836456298828, "global_step": 198551, "epoch": 1181} {"train_loss": -11.372520446777344, "global_step": 198552, "epoch": 1181} {"train_loss": -10.955044746398926, "global_step": 198553, "epoch": 1181} {"train_loss": -10.714744567871094, "global_step": 198554, "epoch": 1181} {"train_loss": -11.232011795043945, "global_step": 198555, "epoch": 1181} {"train_loss": -11.391006469726562, "global_step": 198556, "epoch": 1181} {"train_loss": -10.984728813171387, "global_step": 198557, "epoch": 1181} {"train_loss": -10.945199966430664, "global_step": 198558, "epoch": 1181} {"train_loss": -11.219886779785156, "global_step": 198559, "epoch": 1181} {"train_loss": -10.726758003234863, "global_step": 198560, "epoch": 1181} {"train_loss": -11.64707088470459, "global_step": 198561, "epoch": 1181} {"train_loss": -11.26085090637207, "global_step": 198562, "epoch": 1181} {"train_loss": -11.397656440734863, "global_step": 198563, "epoch": 1181} {"train_loss": -11.172616004943848, "global_step": 198564, "epoch": 1181} {"train_loss": -11.233488082885742, "global_step": 198565, "epoch": 1181} {"train_loss": -11.087667465209961, "global_step": 198566, "epoch": 1181} {"train_loss": -11.245281219482422, "global_step": 198567, "epoch": 1181} {"train_loss": -11.07321548461914, "global_step": 198568, "epoch": 1181} {"train_loss": -11.521315574645996, "global_step": 198569, "epoch": 1181} {"train_loss": -10.746490478515625, "global_step": 198570, "epoch": 1181} {"train_loss": -10.761578559875488, "global_step": 198571, "epoch": 1181} {"train_loss": -10.906280517578125, "global_step": 198572, "epoch": 1181} {"train_loss": -10.928244590759277, "global_step": 198573, "epoch": 1181} {"train_loss": -10.999139785766602, "global_step": 198574, "epoch": 1181} {"train_loss": -11.200280365489778, "global_step": 198575, "epoch": 1181, "val_loss": 243807.5} {"train_loss": -11.124467849731445, "global_step": 198576, "epoch": 1182} {"train_loss": -9.537020683288574, "global_step": 198577, "epoch": 1182} {"train_loss": -10.044000625610352, "global_step": 198578, "epoch": 1182} {"train_loss": -9.20543098449707, "global_step": 198579, "epoch": 1182} {"train_loss": -9.01490306854248, "global_step": 198580, "epoch": 1182} {"train_loss": -10.093525886535645, "global_step": 198581, "epoch": 1182} {"train_loss": -9.660523414611816, "global_step": 198582, "epoch": 1182} {"train_loss": -9.393918991088867, "global_step": 198583, "epoch": 1182} {"train_loss": -9.892864227294922, "global_step": 198584, "epoch": 1182} {"train_loss": -10.110671997070312, "global_step": 198585, "epoch": 1182} {"train_loss": -8.55582046508789, "global_step": 198586, "epoch": 1182} {"train_loss": -9.053627014160156, "global_step": 198587, "epoch": 1182} {"train_loss": -10.34931468963623, "global_step": 198588, "epoch": 1182} {"train_loss": -9.033926010131836, "global_step": 198589, "epoch": 1182} {"train_loss": -8.923765182495117, "global_step": 198590, "epoch": 1182} {"train_loss": -10.325008392333984, "global_step": 198591, "epoch": 1182} {"train_loss": -8.781721115112305, "global_step": 198592, "epoch": 1182} {"train_loss": -10.089896202087402, "global_step": 198593, "epoch": 1182} {"train_loss": -10.360925674438477, "global_step": 198594, "epoch": 1182} {"train_loss": -10.180951118469238, "global_step": 198595, "epoch": 1182} {"train_loss": -10.060609817504883, "global_step": 198596, "epoch": 1182} {"train_loss": -10.464363098144531, "global_step": 198597, "epoch": 1182} {"train_loss": -10.520780563354492, "global_step": 198598, "epoch": 1182} {"train_loss": -10.267176628112793, "global_step": 198599, "epoch": 1182} {"train_loss": -10.370746612548828, "global_step": 198600, "epoch": 1182} {"train_loss": -10.670894622802734, "global_step": 198601, "epoch": 1182} {"train_loss": -10.469756126403809, "global_step": 198602, "epoch": 1182} {"train_loss": -10.215736389160156, "global_step": 198603, "epoch": 1182} {"train_loss": -10.850772857666016, "global_step": 198604, "epoch": 1182} {"train_loss": -10.816420555114746, "global_step": 198605, "epoch": 1182} {"train_loss": -10.667400360107422, "global_step": 198606, "epoch": 1182} {"train_loss": -10.817752838134766, "global_step": 198607, "epoch": 1182} {"train_loss": -10.780492782592773, "global_step": 198608, "epoch": 1182} {"train_loss": -11.037460327148438, "global_step": 198609, "epoch": 1182} {"train_loss": -10.616602897644043, "global_step": 198610, "epoch": 1182} {"train_loss": -11.082700729370117, "global_step": 198611, "epoch": 1182} {"train_loss": -11.17028522491455, "global_step": 198612, "epoch": 1182} {"train_loss": -10.797176361083984, "global_step": 198613, "epoch": 1182} {"train_loss": -10.853904724121094, "global_step": 198614, "epoch": 1182} {"train_loss": -10.982128143310547, "global_step": 198615, "epoch": 1182} {"train_loss": -10.844078063964844, "global_step": 198616, "epoch": 1182} {"train_loss": -11.036133766174316, "global_step": 198617, "epoch": 1182} {"train_loss": -11.063467025756836, "global_step": 198618, "epoch": 1182} {"train_loss": -10.992873191833496, "global_step": 198619, "epoch": 1182} {"train_loss": -10.997459411621094, "global_step": 198620, "epoch": 1182} {"train_loss": -11.077460289001465, "global_step": 198621, "epoch": 1182} {"train_loss": -11.119828224182129, "global_step": 198622, "epoch": 1182} {"train_loss": -11.165833473205566, "global_step": 198623, "epoch": 1182} {"train_loss": -11.142353057861328, "global_step": 198624, "epoch": 1182} {"train_loss": -11.143865585327148, "global_step": 198625, "epoch": 1182} {"train_loss": -11.179146766662598, "global_step": 198626, "epoch": 1182} {"train_loss": -11.127096176147461, "global_step": 198627, "epoch": 1182} {"train_loss": -11.270811080932617, "global_step": 198628, "epoch": 1182} {"train_loss": -11.35990047454834, "global_step": 198629, "epoch": 1182} {"train_loss": -11.264442443847656, "global_step": 198630, "epoch": 1182} {"train_loss": -11.257165908813477, "global_step": 198631, "epoch": 1182} {"train_loss": -11.386277198791504, "global_step": 198632, "epoch": 1182} {"train_loss": -11.352630615234375, "global_step": 198633, "epoch": 1182} {"train_loss": -11.223485946655273, "global_step": 198634, "epoch": 1182} {"train_loss": -11.498218536376953, "global_step": 198635, "epoch": 1182} {"train_loss": -11.305732727050781, "global_step": 198636, "epoch": 1182} {"train_loss": -11.396520614624023, "global_step": 198637, "epoch": 1182} {"train_loss": -11.53261661529541, "global_step": 198638, "epoch": 1182} {"train_loss": -11.363643646240234, "global_step": 198639, "epoch": 1182} {"train_loss": -11.589839935302734, "global_step": 198640, "epoch": 1182} {"train_loss": -11.535869598388672, "global_step": 198641, "epoch": 1182} {"train_loss": -11.456730842590332, "global_step": 198642, "epoch": 1182} {"train_loss": -11.549918174743652, "global_step": 198643, "epoch": 1182} {"train_loss": -11.385841369628906, "global_step": 198644, "epoch": 1182} {"train_loss": -11.563690185546875, "global_step": 198645, "epoch": 1182} {"train_loss": -11.624139785766602, "global_step": 198646, "epoch": 1182} {"train_loss": -11.643753051757812, "global_step": 198647, "epoch": 1182} {"train_loss": -11.609729766845703, "global_step": 198648, "epoch": 1182} {"train_loss": -11.554088592529297, "global_step": 198649, "epoch": 1182} {"train_loss": -11.323200225830078, "global_step": 198650, "epoch": 1182} {"train_loss": -11.454278945922852, "global_step": 198651, "epoch": 1182} {"train_loss": -11.832757949829102, "global_step": 198652, "epoch": 1182} {"train_loss": -11.44676399230957, "global_step": 198653, "epoch": 1182} {"train_loss": -11.720046043395996, "global_step": 198654, "epoch": 1182} {"train_loss": -11.705830574035645, "global_step": 198655, "epoch": 1182} {"train_loss": -11.702080726623535, "global_step": 198656, "epoch": 1182} {"train_loss": -11.637752532958984, "global_step": 198657, "epoch": 1182} {"train_loss": -11.86028003692627, "global_step": 198658, "epoch": 1182} {"train_loss": -11.692010879516602, "global_step": 198659, "epoch": 1182} {"train_loss": -11.58041000366211, "global_step": 198660, "epoch": 1182} {"train_loss": -11.554983139038086, "global_step": 198661, "epoch": 1182} {"train_loss": -11.75365924835205, "global_step": 198662, "epoch": 1182} {"train_loss": -11.632613182067871, "global_step": 198663, "epoch": 1182} {"train_loss": -11.578252792358398, "global_step": 198664, "epoch": 1182} {"train_loss": -11.819404602050781, "global_step": 198665, "epoch": 1182} {"train_loss": -11.60706901550293, "global_step": 198666, "epoch": 1182} {"train_loss": -11.6184720993042, "global_step": 198667, "epoch": 1182} {"train_loss": -11.672863960266113, "global_step": 198668, "epoch": 1182} {"train_loss": -11.73585319519043, "global_step": 198669, "epoch": 1182} {"train_loss": -11.494019508361816, "global_step": 198670, "epoch": 1182} {"train_loss": -11.547603607177734, "global_step": 198671, "epoch": 1182} {"train_loss": -11.703514099121094, "global_step": 198672, "epoch": 1182} {"train_loss": -11.49947738647461, "global_step": 198673, "epoch": 1182} {"train_loss": -11.524406433105469, "global_step": 198674, "epoch": 1182} {"train_loss": -11.21933364868164, "global_step": 198675, "epoch": 1182} {"train_loss": -11.337165832519531, "global_step": 198676, "epoch": 1182} {"train_loss": -11.452540397644043, "global_step": 198677, "epoch": 1182} {"train_loss": -11.582273483276367, "global_step": 198678, "epoch": 1182} {"train_loss": -11.243646621704102, "global_step": 198679, "epoch": 1182} {"train_loss": -11.602180480957031, "global_step": 198680, "epoch": 1182} {"train_loss": -11.414920806884766, "global_step": 198681, "epoch": 1182} {"train_loss": -11.456363677978516, "global_step": 198682, "epoch": 1182} {"train_loss": -10.810464859008789, "global_step": 198683, "epoch": 1182} {"train_loss": -11.606949806213379, "global_step": 198684, "epoch": 1182} {"train_loss": -11.409876823425293, "global_step": 198685, "epoch": 1182} {"train_loss": -11.169023513793945, "global_step": 198686, "epoch": 1182} {"train_loss": -11.465690612792969, "global_step": 198687, "epoch": 1182} {"train_loss": -11.614197731018066, "global_step": 198688, "epoch": 1182} {"train_loss": -11.223735809326172, "global_step": 198689, "epoch": 1182} {"train_loss": -11.462745666503906, "global_step": 198690, "epoch": 1182} {"train_loss": -11.69858455657959, "global_step": 198691, "epoch": 1182} {"train_loss": -10.877408981323242, "global_step": 198692, "epoch": 1182} {"train_loss": -11.23200511932373, "global_step": 198693, "epoch": 1182} {"train_loss": -10.8132963180542, "global_step": 198694, "epoch": 1182} {"train_loss": -11.547134399414062, "global_step": 198695, "epoch": 1182} {"train_loss": -10.999724388122559, "global_step": 198696, "epoch": 1182} {"train_loss": -11.39344596862793, "global_step": 198697, "epoch": 1182} {"train_loss": -11.074493408203125, "global_step": 198698, "epoch": 1182} {"train_loss": -11.646795272827148, "global_step": 198699, "epoch": 1182} {"train_loss": -11.688013076782227, "global_step": 198700, "epoch": 1182} {"train_loss": -11.168654441833496, "global_step": 198701, "epoch": 1182} {"train_loss": -11.187246322631836, "global_step": 198702, "epoch": 1182} {"train_loss": -11.251313209533691, "global_step": 198703, "epoch": 1182} {"train_loss": -10.736541748046875, "global_step": 198704, "epoch": 1182} {"train_loss": -10.73343276977539, "global_step": 198705, "epoch": 1182} {"train_loss": -11.477010726928711, "global_step": 198706, "epoch": 1182} {"train_loss": -11.375642776489258, "global_step": 198707, "epoch": 1182} {"train_loss": -11.277637481689453, "global_step": 198708, "epoch": 1182} {"train_loss": -11.596624374389648, "global_step": 198709, "epoch": 1182} {"train_loss": -11.567545890808105, "global_step": 198710, "epoch": 1182} {"train_loss": -11.513237953186035, "global_step": 198711, "epoch": 1182} {"train_loss": -11.505508422851562, "global_step": 198712, "epoch": 1182} {"train_loss": -11.415745735168457, "global_step": 198713, "epoch": 1182} {"train_loss": -10.916379928588867, "global_step": 198714, "epoch": 1182} {"train_loss": -11.075516700744629, "global_step": 198715, "epoch": 1182} {"train_loss": -10.806208610534668, "global_step": 198716, "epoch": 1182} {"train_loss": -11.036394119262695, "global_step": 198717, "epoch": 1182} {"train_loss": -11.471959114074707, "global_step": 198718, "epoch": 1182} {"train_loss": -10.686665534973145, "global_step": 198719, "epoch": 1182} {"train_loss": -11.026347160339355, "global_step": 198720, "epoch": 1182} {"train_loss": -11.054845809936523, "global_step": 198721, "epoch": 1182} {"train_loss": -9.922697067260742, "global_step": 198722, "epoch": 1182} {"train_loss": -11.42471694946289, "global_step": 198723, "epoch": 1182} {"train_loss": -10.350744247436523, "global_step": 198724, "epoch": 1182} {"train_loss": -11.210695266723633, "global_step": 198725, "epoch": 1182} {"train_loss": -10.958404541015625, "global_step": 198726, "epoch": 1182} {"train_loss": -10.843775749206543, "global_step": 198727, "epoch": 1182} {"train_loss": -11.096246719360352, "global_step": 198728, "epoch": 1182} {"train_loss": -11.014429092407227, "global_step": 198729, "epoch": 1182} {"train_loss": -11.28238296508789, "global_step": 198730, "epoch": 1182} {"train_loss": -10.983181953430176, "global_step": 198731, "epoch": 1182} {"train_loss": -11.343547821044922, "global_step": 198732, "epoch": 1182} {"train_loss": -11.0240478515625, "global_step": 198733, "epoch": 1182} {"train_loss": -11.217608451843262, "global_step": 198734, "epoch": 1182} {"train_loss": -11.036680221557617, "global_step": 198735, "epoch": 1182} {"train_loss": -11.393360137939453, "global_step": 198736, "epoch": 1182} {"train_loss": -10.933693885803223, "global_step": 198737, "epoch": 1182} {"train_loss": -11.35720443725586, "global_step": 198738, "epoch": 1182} {"train_loss": -11.274429321289062, "global_step": 198739, "epoch": 1182} {"train_loss": -11.367351531982422, "global_step": 198740, "epoch": 1182} {"train_loss": -11.201915740966797, "global_step": 198741, "epoch": 1182} {"train_loss": -11.00051498413086, "global_step": 198742, "epoch": 1182} {"train_loss": -11.048387675058274, "global_step": 198743, "epoch": 1182, "val_loss": 249477.96875} {"train_loss": -10.8759126663208, "global_step": 198744, "epoch": 1183} {"train_loss": -11.272214889526367, "global_step": 198745, "epoch": 1183} {"train_loss": -11.375324249267578, "global_step": 198746, "epoch": 1183} {"train_loss": -10.604978561401367, "global_step": 198747, "epoch": 1183} {"train_loss": -11.316739082336426, "global_step": 198748, "epoch": 1183} {"train_loss": -11.116765975952148, "global_step": 198749, "epoch": 1183} {"train_loss": -10.886144638061523, "global_step": 198750, "epoch": 1183} {"train_loss": -11.379776954650879, "global_step": 198751, "epoch": 1183} {"train_loss": -11.281234741210938, "global_step": 198752, "epoch": 1183} {"train_loss": -11.162737846374512, "global_step": 198753, "epoch": 1183} {"train_loss": -11.281964302062988, "global_step": 198754, "epoch": 1183} {"train_loss": -11.160565376281738, "global_step": 198755, "epoch": 1183} {"train_loss": -11.062252044677734, "global_step": 198756, "epoch": 1183} {"train_loss": -11.188253402709961, "global_step": 198757, "epoch": 1183} {"train_loss": -10.957722663879395, "global_step": 198758, "epoch": 1183} {"train_loss": -10.669915199279785, "global_step": 198759, "epoch": 1183} {"train_loss": -10.711771965026855, "global_step": 198760, "epoch": 1183} {"train_loss": -10.42840576171875, "global_step": 198761, "epoch": 1183} {"train_loss": -11.239283561706543, "global_step": 198762, "epoch": 1183} {"train_loss": -10.500999450683594, "global_step": 198763, "epoch": 1183} {"train_loss": -11.294062614440918, "global_step": 198764, "epoch": 1183} {"train_loss": -10.78683853149414, "global_step": 198765, "epoch": 1183} {"train_loss": -11.083670616149902, "global_step": 198766, "epoch": 1183} {"train_loss": -10.949856758117676, "global_step": 198767, "epoch": 1183} {"train_loss": -10.365276336669922, "global_step": 198768, "epoch": 1183} {"train_loss": -11.32931900024414, "global_step": 198769, "epoch": 1183} {"train_loss": -10.615111351013184, "global_step": 198770, "epoch": 1183} {"train_loss": -11.354660034179688, "global_step": 198771, "epoch": 1183} {"train_loss": -10.891550064086914, "global_step": 198772, "epoch": 1183} {"train_loss": -11.020662307739258, "global_step": 198773, "epoch": 1183} {"train_loss": -11.077072143554688, "global_step": 198774, "epoch": 1183} {"train_loss": -11.029887199401855, "global_step": 198775, "epoch": 1183} {"train_loss": -11.102957725524902, "global_step": 198776, "epoch": 1183} {"train_loss": -11.212109565734863, "global_step": 198777, "epoch": 1183} {"train_loss": -10.99148178100586, "global_step": 198778, "epoch": 1183} {"train_loss": -10.725038528442383, "global_step": 198779, "epoch": 1183} {"train_loss": -11.111100196838379, "global_step": 198780, "epoch": 1183} {"train_loss": -11.034661293029785, "global_step": 198781, "epoch": 1183} {"train_loss": -10.967199325561523, "global_step": 198782, "epoch": 1183} {"train_loss": -11.103046417236328, "global_step": 198783, "epoch": 1183} {"train_loss": -10.643035888671875, "global_step": 198784, "epoch": 1183} {"train_loss": -11.300140380859375, "global_step": 198785, "epoch": 1183} {"train_loss": -11.197955131530762, "global_step": 198786, "epoch": 1183} {"train_loss": -11.145050048828125, "global_step": 198787, "epoch": 1183} {"train_loss": -11.498687744140625, "global_step": 198788, "epoch": 1183} {"train_loss": -11.276676177978516, "global_step": 198789, "epoch": 1183} {"train_loss": -11.357351303100586, "global_step": 198790, "epoch": 1183} {"train_loss": -11.47409439086914, "global_step": 198791, "epoch": 1183} {"train_loss": -11.394152641296387, "global_step": 198792, "epoch": 1183} {"train_loss": -11.50027084350586, "global_step": 198793, "epoch": 1183} {"train_loss": -11.527077674865723, "global_step": 198794, "epoch": 1183} {"train_loss": -11.598145484924316, "global_step": 198795, "epoch": 1183} {"train_loss": -11.418886184692383, "global_step": 198796, "epoch": 1183} {"train_loss": -11.534660339355469, "global_step": 198797, "epoch": 1183} {"train_loss": -11.282084465026855, "global_step": 198798, "epoch": 1183} {"train_loss": -11.41309928894043, "global_step": 198799, "epoch": 1183} {"train_loss": -11.515983581542969, "global_step": 198800, "epoch": 1183} {"train_loss": -11.514832496643066, "global_step": 198801, "epoch": 1183} {"train_loss": -11.401305198669434, "global_step": 198802, "epoch": 1183} {"train_loss": -11.775396347045898, "global_step": 198803, "epoch": 1183} {"train_loss": -11.435659408569336, "global_step": 198804, "epoch": 1183} {"train_loss": -11.585122108459473, "global_step": 198805, "epoch": 1183} {"train_loss": -11.632396697998047, "global_step": 198806, "epoch": 1183} {"train_loss": -11.492546081542969, "global_step": 198807, "epoch": 1183} {"train_loss": -11.46567153930664, "global_step": 198808, "epoch": 1183} {"train_loss": -11.571476936340332, "global_step": 198809, "epoch": 1183} {"train_loss": -11.678336143493652, "global_step": 198810, "epoch": 1183} {"train_loss": -11.800339698791504, "global_step": 198811, "epoch": 1183} {"train_loss": -11.398200035095215, "global_step": 198812, "epoch": 1183} {"train_loss": -11.685200691223145, "global_step": 198813, "epoch": 1183} {"train_loss": -11.424068450927734, "global_step": 198814, "epoch": 1183} {"train_loss": -11.538725852966309, "global_step": 198815, "epoch": 1183} {"train_loss": -11.410408973693848, "global_step": 198816, "epoch": 1183} {"train_loss": -11.644377708435059, "global_step": 198817, "epoch": 1183} {"train_loss": -11.34927749633789, "global_step": 198818, "epoch": 1183} {"train_loss": -11.675596237182617, "global_step": 198819, "epoch": 1183} {"train_loss": -11.349098205566406, "global_step": 198820, "epoch": 1183} {"train_loss": -11.363847732543945, "global_step": 198821, "epoch": 1183} {"train_loss": -11.552602767944336, "global_step": 198822, "epoch": 1183} {"train_loss": -11.351268768310547, "global_step": 198823, "epoch": 1183} {"train_loss": -11.286005973815918, "global_step": 198824, "epoch": 1183} {"train_loss": -11.756824493408203, "global_step": 198825, "epoch": 1183} {"train_loss": -11.340343475341797, "global_step": 198826, "epoch": 1183} {"train_loss": -11.636810302734375, "global_step": 198827, "epoch": 1183} {"train_loss": -11.511371612548828, "global_step": 198828, "epoch": 1183} {"train_loss": -11.626188278198242, "global_step": 198829, "epoch": 1183} {"train_loss": -11.422128677368164, "global_step": 198830, "epoch": 1183} {"train_loss": -11.587207794189453, "global_step": 198831, "epoch": 1183} {"train_loss": -11.318595886230469, "global_step": 198832, "epoch": 1183} {"train_loss": -11.54205322265625, "global_step": 198833, "epoch": 1183} {"train_loss": -10.9559326171875, "global_step": 198834, "epoch": 1183} {"train_loss": -11.534868240356445, "global_step": 198835, "epoch": 1183} {"train_loss": -11.578356742858887, "global_step": 198836, "epoch": 1183} {"train_loss": -11.609251976013184, "global_step": 198837, "epoch": 1183} {"train_loss": -11.465368270874023, "global_step": 198838, "epoch": 1183} {"train_loss": -11.441336631774902, "global_step": 198839, "epoch": 1183} {"train_loss": -11.633237838745117, "global_step": 198840, "epoch": 1183} {"train_loss": -11.338714599609375, "global_step": 198841, "epoch": 1183} {"train_loss": -11.194818496704102, "global_step": 198842, "epoch": 1183} {"train_loss": -11.599313735961914, "global_step": 198843, "epoch": 1183} {"train_loss": -11.53658676147461, "global_step": 198844, "epoch": 1183} {"train_loss": -11.052322387695312, "global_step": 198845, "epoch": 1183} {"train_loss": -11.62199592590332, "global_step": 198846, "epoch": 1183} {"train_loss": -11.484848976135254, "global_step": 198847, "epoch": 1183} {"train_loss": -11.216408729553223, "global_step": 198848, "epoch": 1183} {"train_loss": -11.195953369140625, "global_step": 198849, "epoch": 1183} {"train_loss": -11.428474426269531, "global_step": 198850, "epoch": 1183} {"train_loss": -10.42133903503418, "global_step": 198851, "epoch": 1183} {"train_loss": -11.09118938446045, "global_step": 198852, "epoch": 1183} {"train_loss": -11.196782112121582, "global_step": 198853, "epoch": 1183} {"train_loss": -10.30860710144043, "global_step": 198854, "epoch": 1183} {"train_loss": -10.699708938598633, "global_step": 198855, "epoch": 1183} {"train_loss": -11.646763801574707, "global_step": 198856, "epoch": 1183} {"train_loss": -11.064458847045898, "global_step": 198857, "epoch": 1183} {"train_loss": -10.741870880126953, "global_step": 198858, "epoch": 1183} {"train_loss": -11.141056060791016, "global_step": 198859, "epoch": 1183} {"train_loss": -10.978043556213379, "global_step": 198860, "epoch": 1183} {"train_loss": -11.335005760192871, "global_step": 198861, "epoch": 1183} {"train_loss": -11.512073516845703, "global_step": 198862, "epoch": 1183} {"train_loss": -10.914392471313477, "global_step": 198863, "epoch": 1183} {"train_loss": -11.09129524230957, "global_step": 198864, "epoch": 1183} {"train_loss": -11.515389442443848, "global_step": 198865, "epoch": 1183} {"train_loss": -11.238216400146484, "global_step": 198866, "epoch": 1183} {"train_loss": -11.439159393310547, "global_step": 198867, "epoch": 1183} {"train_loss": -11.407449722290039, "global_step": 198868, "epoch": 1183} {"train_loss": -11.44196891784668, "global_step": 198869, "epoch": 1183} {"train_loss": -11.66610050201416, "global_step": 198870, "epoch": 1183} {"train_loss": -11.469003677368164, "global_step": 198871, "epoch": 1183} {"train_loss": -11.378149032592773, "global_step": 198872, "epoch": 1183} {"train_loss": -11.447355270385742, "global_step": 198873, "epoch": 1183} {"train_loss": -11.524951934814453, "global_step": 198874, "epoch": 1183} {"train_loss": -11.590951919555664, "global_step": 198875, "epoch": 1183} {"train_loss": -11.441049575805664, "global_step": 198876, "epoch": 1183} {"train_loss": -11.390195846557617, "global_step": 198877, "epoch": 1183} {"train_loss": -11.152741432189941, "global_step": 198878, "epoch": 1183} {"train_loss": -11.298624038696289, "global_step": 198879, "epoch": 1183} {"train_loss": -11.41364860534668, "global_step": 198880, "epoch": 1183} {"train_loss": -11.481727600097656, "global_step": 198881, "epoch": 1183} {"train_loss": -11.444826126098633, "global_step": 198882, "epoch": 1183} {"train_loss": -11.601852416992188, "global_step": 198883, "epoch": 1183} {"train_loss": -10.84748363494873, "global_step": 198884, "epoch": 1183} {"train_loss": -10.929885864257812, "global_step": 198885, "epoch": 1183} {"train_loss": -11.15722370147705, "global_step": 198886, "epoch": 1183} {"train_loss": -10.921573638916016, "global_step": 198887, "epoch": 1183} {"train_loss": -11.390209197998047, "global_step": 198888, "epoch": 1183} {"train_loss": -10.577884674072266, "global_step": 198889, "epoch": 1183} {"train_loss": -11.700799942016602, "global_step": 198890, "epoch": 1183} {"train_loss": -10.785750389099121, "global_step": 198891, "epoch": 1183} {"train_loss": -11.289350509643555, "global_step": 198892, "epoch": 1183} {"train_loss": -11.13016128540039, "global_step": 198893, "epoch": 1183} {"train_loss": -11.293262481689453, "global_step": 198894, "epoch": 1183} {"train_loss": -11.082832336425781, "global_step": 198895, "epoch": 1183} {"train_loss": -11.531950950622559, "global_step": 198896, "epoch": 1183} {"train_loss": -10.929132461547852, "global_step": 198897, "epoch": 1183} {"train_loss": -11.237262725830078, "global_step": 198898, "epoch": 1183} {"train_loss": -11.214740753173828, "global_step": 198899, "epoch": 1183} {"train_loss": -11.260662078857422, "global_step": 198900, "epoch": 1183} {"train_loss": -11.423203468322754, "global_step": 198901, "epoch": 1183} {"train_loss": -11.4593505859375, "global_step": 198902, "epoch": 1183} {"train_loss": -11.553762435913086, "global_step": 198903, "epoch": 1183} {"train_loss": -11.154088020324707, "global_step": 198904, "epoch": 1183} {"train_loss": -11.126802444458008, "global_step": 198905, "epoch": 1183} {"train_loss": -11.387409210205078, "global_step": 198906, "epoch": 1183} {"train_loss": -10.359285354614258, "global_step": 198907, "epoch": 1183} {"train_loss": -11.484959602355957, "global_step": 198908, "epoch": 1183} {"train_loss": -11.137476921081543, "global_step": 198909, "epoch": 1183} {"train_loss": -10.856203079223633, "global_step": 198910, "epoch": 1183} {"train_loss": -11.259662923358736, "global_step": 198911, "epoch": 1183, "val_loss": 252660.984375} {"train_loss": -11.45377254486084, "global_step": 198912, "epoch": 1184} {"train_loss": -11.016901016235352, "global_step": 198913, "epoch": 1184} {"train_loss": -11.52255630493164, "global_step": 198914, "epoch": 1184} {"train_loss": -11.327823638916016, "global_step": 198915, "epoch": 1184} {"train_loss": -11.340069770812988, "global_step": 198916, "epoch": 1184} {"train_loss": -11.575105667114258, "global_step": 198917, "epoch": 1184} {"train_loss": -11.238753318786621, "global_step": 198918, "epoch": 1184} {"train_loss": -11.028242111206055, "global_step": 198919, "epoch": 1184} {"train_loss": -10.259561538696289, "global_step": 198920, "epoch": 1184} {"train_loss": -11.51036262512207, "global_step": 198921, "epoch": 1184} {"train_loss": -10.966974258422852, "global_step": 198922, "epoch": 1184} {"train_loss": -11.13302993774414, "global_step": 198923, "epoch": 1184} {"train_loss": -11.020156860351562, "global_step": 198924, "epoch": 1184} {"train_loss": -11.288207054138184, "global_step": 198925, "epoch": 1184} {"train_loss": -11.106965065002441, "global_step": 198926, "epoch": 1184} {"train_loss": -11.346979141235352, "global_step": 198927, "epoch": 1184} {"train_loss": -11.30764102935791, "global_step": 198928, "epoch": 1184} {"train_loss": -11.238470077514648, "global_step": 198929, "epoch": 1184} {"train_loss": -11.598281860351562, "global_step": 198930, "epoch": 1184} {"train_loss": -11.39676570892334, "global_step": 198931, "epoch": 1184} {"train_loss": -11.237808227539062, "global_step": 198932, "epoch": 1184} {"train_loss": -11.319808959960938, "global_step": 198933, "epoch": 1184} {"train_loss": -10.985836029052734, "global_step": 198934, "epoch": 1184} {"train_loss": -11.525484085083008, "global_step": 198935, "epoch": 1184} {"train_loss": -11.418769836425781, "global_step": 198936, "epoch": 1184} {"train_loss": -11.275116920471191, "global_step": 198937, "epoch": 1184} {"train_loss": -11.194500923156738, "global_step": 198938, "epoch": 1184} {"train_loss": -10.963348388671875, "global_step": 198939, "epoch": 1184} {"train_loss": -11.097113609313965, "global_step": 198940, "epoch": 1184} {"train_loss": -11.463021278381348, "global_step": 198941, "epoch": 1184} {"train_loss": -11.227782249450684, "global_step": 198942, "epoch": 1184} {"train_loss": -11.390792846679688, "global_step": 198943, "epoch": 1184} {"train_loss": -11.154767990112305, "global_step": 198944, "epoch": 1184} {"train_loss": -11.185378074645996, "global_step": 198945, "epoch": 1184} {"train_loss": -11.345062255859375, "global_step": 198946, "epoch": 1184} {"train_loss": -11.367393493652344, "global_step": 198947, "epoch": 1184} {"train_loss": -11.488449096679688, "global_step": 198948, "epoch": 1184} {"train_loss": -10.868484497070312, "global_step": 198949, "epoch": 1184} {"train_loss": -11.58635139465332, "global_step": 198950, "epoch": 1184} {"train_loss": -11.457307815551758, "global_step": 198951, "epoch": 1184} {"train_loss": -11.166024208068848, "global_step": 198952, "epoch": 1184} {"train_loss": -11.462217330932617, "global_step": 198953, "epoch": 1184} {"train_loss": -11.42017650604248, "global_step": 198954, "epoch": 1184} {"train_loss": -10.90989875793457, "global_step": 198955, "epoch": 1184} {"train_loss": -11.517595291137695, "global_step": 198956, "epoch": 1184} {"train_loss": -11.166913986206055, "global_step": 198957, "epoch": 1184} {"train_loss": -11.251956939697266, "global_step": 198958, "epoch": 1184} {"train_loss": -11.27511978149414, "global_step": 198959, "epoch": 1184} {"train_loss": -10.99189281463623, "global_step": 198960, "epoch": 1184} {"train_loss": -11.335658073425293, "global_step": 198961, "epoch": 1184} {"train_loss": -11.509506225585938, "global_step": 198962, "epoch": 1184} {"train_loss": -10.821067810058594, "global_step": 198963, "epoch": 1184} {"train_loss": -11.23832893371582, "global_step": 198964, "epoch": 1184} {"train_loss": -10.765388488769531, "global_step": 198965, "epoch": 1184} {"train_loss": -11.329132080078125, "global_step": 198966, "epoch": 1184} {"train_loss": -11.471427917480469, "global_step": 198967, "epoch": 1184} {"train_loss": -11.40925121307373, "global_step": 198968, "epoch": 1184} {"train_loss": -11.113746643066406, "global_step": 198969, "epoch": 1184} {"train_loss": -11.36924934387207, "global_step": 198970, "epoch": 1184} {"train_loss": -11.187461853027344, "global_step": 198971, "epoch": 1184} {"train_loss": -11.493183135986328, "global_step": 198972, "epoch": 1184} {"train_loss": -10.9194917678833, "global_step": 198973, "epoch": 1184} {"train_loss": -11.621780395507812, "global_step": 198974, "epoch": 1184} {"train_loss": -11.1492919921875, "global_step": 198975, "epoch": 1184} {"train_loss": -11.471800804138184, "global_step": 198976, "epoch": 1184} {"train_loss": -11.46783447265625, "global_step": 198977, "epoch": 1184} {"train_loss": -11.335150718688965, "global_step": 198978, "epoch": 1184} {"train_loss": -11.641218185424805, "global_step": 198979, "epoch": 1184} {"train_loss": -11.270127296447754, "global_step": 198980, "epoch": 1184} {"train_loss": -11.522933006286621, "global_step": 198981, "epoch": 1184} {"train_loss": -11.36479377746582, "global_step": 198982, "epoch": 1184} {"train_loss": -11.598877906799316, "global_step": 198983, "epoch": 1184} {"train_loss": -11.319808959960938, "global_step": 198984, "epoch": 1184} {"train_loss": -11.280205726623535, "global_step": 198985, "epoch": 1184} {"train_loss": -11.345849990844727, "global_step": 198986, "epoch": 1184} {"train_loss": -11.250597953796387, "global_step": 198987, "epoch": 1184} {"train_loss": -11.300192832946777, "global_step": 198988, "epoch": 1184} {"train_loss": -11.087448120117188, "global_step": 198989, "epoch": 1184} {"train_loss": -11.354665756225586, "global_step": 198990, "epoch": 1184} {"train_loss": -11.396642684936523, "global_step": 198991, "epoch": 1184} {"train_loss": -11.187365531921387, "global_step": 198992, "epoch": 1184} {"train_loss": -11.3215913772583, "global_step": 198993, "epoch": 1184} {"train_loss": -11.334169387817383, "global_step": 198994, "epoch": 1184} {"train_loss": -11.535877227783203, "global_step": 198995, "epoch": 1184} {"train_loss": -11.173320770263672, "global_step": 198996, "epoch": 1184} {"train_loss": -11.430354118347168, "global_step": 198997, "epoch": 1184} {"train_loss": -11.587272644042969, "global_step": 198998, "epoch": 1184} {"train_loss": -11.512910842895508, "global_step": 198999, "epoch": 1184} {"train_loss": -11.374950408935547, "global_step": 199000, "epoch": 1184} {"train_loss": -11.473380088806152, "global_step": 199001, "epoch": 1184} {"train_loss": -11.488546371459961, "global_step": 199002, "epoch": 1184} {"train_loss": -11.453466415405273, "global_step": 199003, "epoch": 1184} {"train_loss": -11.493795394897461, "global_step": 199004, "epoch": 1184} {"train_loss": -11.756521224975586, "global_step": 199005, "epoch": 1184} {"train_loss": -11.086804389953613, "global_step": 199006, "epoch": 1184} {"train_loss": -11.731687545776367, "global_step": 199007, "epoch": 1184} {"train_loss": -11.357063293457031, "global_step": 199008, "epoch": 1184} {"train_loss": -11.474268913269043, "global_step": 199009, "epoch": 1184} {"train_loss": -11.64144515991211, "global_step": 199010, "epoch": 1184} {"train_loss": -11.37324047088623, "global_step": 199011, "epoch": 1184} {"train_loss": -11.862580299377441, "global_step": 199012, "epoch": 1184} {"train_loss": -11.634400367736816, "global_step": 199013, "epoch": 1184} {"train_loss": -11.396930694580078, "global_step": 199014, "epoch": 1184} {"train_loss": -11.58619499206543, "global_step": 199015, "epoch": 1184} {"train_loss": -11.549633026123047, "global_step": 199016, "epoch": 1184} {"train_loss": -11.400333404541016, "global_step": 199017, "epoch": 1184} {"train_loss": -11.289987564086914, "global_step": 199018, "epoch": 1184} {"train_loss": -11.362619400024414, "global_step": 199019, "epoch": 1184} {"train_loss": -11.131746292114258, "global_step": 199020, "epoch": 1184} {"train_loss": -11.27131462097168, "global_step": 199021, "epoch": 1184} {"train_loss": -11.30932903289795, "global_step": 199022, "epoch": 1184} {"train_loss": -11.708431243896484, "global_step": 199023, "epoch": 1184} {"train_loss": -11.178436279296875, "global_step": 199024, "epoch": 1184} {"train_loss": -11.587306022644043, "global_step": 199025, "epoch": 1184} {"train_loss": -11.608997344970703, "global_step": 199026, "epoch": 1184} {"train_loss": -11.642049789428711, "global_step": 199027, "epoch": 1184} {"train_loss": -11.441819190979004, "global_step": 199028, "epoch": 1184} {"train_loss": -11.799232482910156, "global_step": 199029, "epoch": 1184} {"train_loss": -11.70313835144043, "global_step": 199030, "epoch": 1184} {"train_loss": -11.454608917236328, "global_step": 199031, "epoch": 1184} {"train_loss": -11.477550506591797, "global_step": 199032, "epoch": 1184} {"train_loss": -11.61385726928711, "global_step": 199033, "epoch": 1184} {"train_loss": -11.753456115722656, "global_step": 199034, "epoch": 1184} {"train_loss": -11.586280822753906, "global_step": 199035, "epoch": 1184} {"train_loss": -11.839155197143555, "global_step": 199036, "epoch": 1184} {"train_loss": -11.578878402709961, "global_step": 199037, "epoch": 1184} {"train_loss": -11.55988883972168, "global_step": 199038, "epoch": 1184} {"train_loss": -11.310893058776855, "global_step": 199039, "epoch": 1184} {"train_loss": -11.749516487121582, "global_step": 199040, "epoch": 1184} {"train_loss": -11.6072416305542, "global_step": 199041, "epoch": 1184} {"train_loss": -11.464489936828613, "global_step": 199042, "epoch": 1184} {"train_loss": -11.922561645507812, "global_step": 199043, "epoch": 1184} {"train_loss": -11.88808536529541, "global_step": 199044, "epoch": 1184} {"train_loss": -11.807132720947266, "global_step": 199045, "epoch": 1184} {"train_loss": -11.436161994934082, "global_step": 199046, "epoch": 1184} {"train_loss": -11.267679214477539, "global_step": 199047, "epoch": 1184} {"train_loss": -11.140459060668945, "global_step": 199048, "epoch": 1184} {"train_loss": -11.485055923461914, "global_step": 199049, "epoch": 1184} {"train_loss": -10.060712814331055, "global_step": 199050, "epoch": 1184} {"train_loss": -10.755587577819824, "global_step": 199051, "epoch": 1184} {"train_loss": -11.173870086669922, "global_step": 199052, "epoch": 1184} {"train_loss": -10.669445037841797, "global_step": 199053, "epoch": 1184} {"train_loss": -11.325939178466797, "global_step": 199054, "epoch": 1184} {"train_loss": -9.98945426940918, "global_step": 199055, "epoch": 1184} {"train_loss": -10.984512329101562, "global_step": 199056, "epoch": 1184} {"train_loss": -9.986217498779297, "global_step": 199057, "epoch": 1184} {"train_loss": -9.611613273620605, "global_step": 199058, "epoch": 1184} {"train_loss": -9.550179481506348, "global_step": 199059, "epoch": 1184} {"train_loss": -10.501391410827637, "global_step": 199060, "epoch": 1184} {"train_loss": -8.909233093261719, "global_step": 199061, "epoch": 1184} {"train_loss": -9.306585311889648, "global_step": 199062, "epoch": 1184} {"train_loss": -10.389192581176758, "global_step": 199063, "epoch": 1184} {"train_loss": -9.37208366394043, "global_step": 199064, "epoch": 1184} {"train_loss": -8.763040542602539, "global_step": 199065, "epoch": 1184} {"train_loss": -10.04999828338623, "global_step": 199066, "epoch": 1184} {"train_loss": -7.806133270263672, "global_step": 199067, "epoch": 1184} {"train_loss": -9.947587966918945, "global_step": 199068, "epoch": 1184} {"train_loss": -8.790268898010254, "global_step": 199069, "epoch": 1184} {"train_loss": -9.850785255432129, "global_step": 199070, "epoch": 1184} {"train_loss": -9.324051856994629, "global_step": 199071, "epoch": 1184} {"train_loss": -10.055930137634277, "global_step": 199072, "epoch": 1184} {"train_loss": -9.741172790527344, "global_step": 199073, "epoch": 1184} {"train_loss": -9.506650924682617, "global_step": 199074, "epoch": 1184} {"train_loss": -10.381156921386719, "global_step": 199075, "epoch": 1184} {"train_loss": -9.58366870880127, "global_step": 199076, "epoch": 1184} {"train_loss": -9.529243469238281, "global_step": 199077, "epoch": 1184} {"train_loss": -10.73460578918457, "global_step": 199078, "epoch": 1184} {"train_loss": -11.106575165476118, "global_step": 199079, "epoch": 1184, "val_loss": 251178.046875} {"train_loss": -10.206707000732422, "global_step": 199080, "epoch": 1185} {"train_loss": -10.5877685546875, "global_step": 199081, "epoch": 1185} {"train_loss": -10.702194213867188, "global_step": 199082, "epoch": 1185} {"train_loss": -10.92087173461914, "global_step": 199083, "epoch": 1185} {"train_loss": -10.425666809082031, "global_step": 199084, "epoch": 1185} {"train_loss": -10.643264770507812, "global_step": 199085, "epoch": 1185} {"train_loss": -10.962041854858398, "global_step": 199086, "epoch": 1185} {"train_loss": -10.603952407836914, "global_step": 199087, "epoch": 1185} {"train_loss": -10.577302932739258, "global_step": 199088, "epoch": 1185} {"train_loss": -10.730365753173828, "global_step": 199089, "epoch": 1185} {"train_loss": -10.754920959472656, "global_step": 199090, "epoch": 1185} {"train_loss": -10.601961135864258, "global_step": 199091, "epoch": 1185} {"train_loss": -10.812747955322266, "global_step": 199092, "epoch": 1185} {"train_loss": -10.48454761505127, "global_step": 199093, "epoch": 1185} {"train_loss": -10.641412734985352, "global_step": 199094, "epoch": 1185} {"train_loss": -10.63582706451416, "global_step": 199095, "epoch": 1185} {"train_loss": -10.952516555786133, "global_step": 199096, "epoch": 1185} {"train_loss": -10.732202529907227, "global_step": 199097, "epoch": 1185} {"train_loss": -10.753284454345703, "global_step": 199098, "epoch": 1185} {"train_loss": -10.627633094787598, "global_step": 199099, "epoch": 1185} {"train_loss": -11.121742248535156, "global_step": 199100, "epoch": 1185} {"train_loss": -10.865814208984375, "global_step": 199101, "epoch": 1185} {"train_loss": -11.150006294250488, "global_step": 199102, "epoch": 1185} {"train_loss": -11.088635444641113, "global_step": 199103, "epoch": 1185} {"train_loss": -11.004230499267578, "global_step": 199104, "epoch": 1185} {"train_loss": -10.846807479858398, "global_step": 199105, "epoch": 1185} {"train_loss": -10.99618148803711, "global_step": 199106, "epoch": 1185} {"train_loss": -11.110326766967773, "global_step": 199107, "epoch": 1185} {"train_loss": -11.216275215148926, "global_step": 199108, "epoch": 1185} {"train_loss": -11.010480880737305, "global_step": 199109, "epoch": 1185} {"train_loss": -11.160414695739746, "global_step": 199110, "epoch": 1185} {"train_loss": -11.326332092285156, "global_step": 199111, "epoch": 1185} {"train_loss": -11.199172973632812, "global_step": 199112, "epoch": 1185} {"train_loss": -11.319723129272461, "global_step": 199113, "epoch": 1185} {"train_loss": -11.13201904296875, "global_step": 199114, "epoch": 1185} {"train_loss": -11.443058013916016, "global_step": 199115, "epoch": 1185} {"train_loss": -11.329030990600586, "global_step": 199116, "epoch": 1185} {"train_loss": -11.309671401977539, "global_step": 199117, "epoch": 1185} {"train_loss": -11.451360702514648, "global_step": 199118, "epoch": 1185} {"train_loss": -11.333267211914062, "global_step": 199119, "epoch": 1185} {"train_loss": -11.22970962524414, "global_step": 199120, "epoch": 1185} {"train_loss": -11.41295051574707, "global_step": 199121, "epoch": 1185} {"train_loss": -11.352093696594238, "global_step": 199122, "epoch": 1185} {"train_loss": -11.270936965942383, "global_step": 199123, "epoch": 1185} {"train_loss": -11.55256462097168, "global_step": 199124, "epoch": 1185} {"train_loss": -11.47555923461914, "global_step": 199125, "epoch": 1185} {"train_loss": -11.446966171264648, "global_step": 199126, "epoch": 1185} {"train_loss": -11.391702651977539, "global_step": 199127, "epoch": 1185} {"train_loss": -11.293892860412598, "global_step": 199128, "epoch": 1185} {"train_loss": -11.641765594482422, "global_step": 199129, "epoch": 1185} {"train_loss": -11.404793739318848, "global_step": 199130, "epoch": 1185} {"train_loss": -11.407752990722656, "global_step": 199131, "epoch": 1185} {"train_loss": -11.413596153259277, "global_step": 199132, "epoch": 1185} {"train_loss": -11.653907775878906, "global_step": 199133, "epoch": 1185} {"train_loss": -11.446746826171875, "global_step": 199134, "epoch": 1185} {"train_loss": -11.548413276672363, "global_step": 199135, "epoch": 1185} {"train_loss": -11.355391502380371, "global_step": 199136, "epoch": 1185} {"train_loss": -11.38791275024414, "global_step": 199137, "epoch": 1185} {"train_loss": -11.533134460449219, "global_step": 199138, "epoch": 1185} {"train_loss": -11.483075141906738, "global_step": 199139, "epoch": 1185} {"train_loss": -11.67196273803711, "global_step": 199140, "epoch": 1185} {"train_loss": -11.396112442016602, "global_step": 199141, "epoch": 1185} {"train_loss": -11.319097518920898, "global_step": 199142, "epoch": 1185} {"train_loss": -11.579845428466797, "global_step": 199143, "epoch": 1185} {"train_loss": -11.644145011901855, "global_step": 199144, "epoch": 1185} {"train_loss": -11.467041015625, "global_step": 199145, "epoch": 1185} {"train_loss": -11.532629013061523, "global_step": 199146, "epoch": 1185} {"train_loss": -11.560670852661133, "global_step": 199147, "epoch": 1185} {"train_loss": -11.402385711669922, "global_step": 199148, "epoch": 1185} {"train_loss": -11.309687614440918, "global_step": 199149, "epoch": 1185} {"train_loss": -11.851283073425293, "global_step": 199150, "epoch": 1185} {"train_loss": -11.424339294433594, "global_step": 199151, "epoch": 1185} {"train_loss": -11.568033218383789, "global_step": 199152, "epoch": 1185} {"train_loss": -11.271343231201172, "global_step": 199153, "epoch": 1185} {"train_loss": -11.76207447052002, "global_step": 199154, "epoch": 1185} {"train_loss": -11.17598819732666, "global_step": 199155, "epoch": 1185} {"train_loss": -11.771430969238281, "global_step": 199156, "epoch": 1185} {"train_loss": -11.3671236038208, "global_step": 199157, "epoch": 1185} {"train_loss": -11.644462585449219, "global_step": 199158, "epoch": 1185} {"train_loss": -11.745157241821289, "global_step": 199159, "epoch": 1185} {"train_loss": -11.696720123291016, "global_step": 199160, "epoch": 1185} {"train_loss": -11.514119148254395, "global_step": 199161, "epoch": 1185} {"train_loss": -11.21259880065918, "global_step": 199162, "epoch": 1185} {"train_loss": -11.327105522155762, "global_step": 199163, "epoch": 1185} {"train_loss": -11.267293930053711, "global_step": 199164, "epoch": 1185} {"train_loss": -11.098254203796387, "global_step": 199165, "epoch": 1185} {"train_loss": -11.135965347290039, "global_step": 199166, "epoch": 1185} {"train_loss": -11.198762893676758, "global_step": 199167, "epoch": 1185} {"train_loss": -11.396949768066406, "global_step": 199168, "epoch": 1185} {"train_loss": -11.321703910827637, "global_step": 199169, "epoch": 1185} {"train_loss": -11.116432189941406, "global_step": 199170, "epoch": 1185} {"train_loss": -11.439029693603516, "global_step": 199171, "epoch": 1185} {"train_loss": -10.840860366821289, "global_step": 199172, "epoch": 1185} {"train_loss": -10.875468254089355, "global_step": 199173, "epoch": 1185} {"train_loss": -10.604499816894531, "global_step": 199174, "epoch": 1185} {"train_loss": -10.976552963256836, "global_step": 199175, "epoch": 1185} {"train_loss": -9.598685264587402, "global_step": 199176, "epoch": 1185} {"train_loss": -11.216144561767578, "global_step": 199177, "epoch": 1185} {"train_loss": -10.432439804077148, "global_step": 199178, "epoch": 1185} {"train_loss": -10.94137954711914, "global_step": 199179, "epoch": 1185} {"train_loss": -10.007516860961914, "global_step": 199180, "epoch": 1185} {"train_loss": -10.769468307495117, "global_step": 199181, "epoch": 1185} {"train_loss": -10.956986427307129, "global_step": 199182, "epoch": 1185} {"train_loss": -10.293678283691406, "global_step": 199183, "epoch": 1185} {"train_loss": -11.061062812805176, "global_step": 199184, "epoch": 1185} {"train_loss": -9.946538925170898, "global_step": 199185, "epoch": 1185} {"train_loss": -10.802096366882324, "global_step": 199186, "epoch": 1185} {"train_loss": -10.89030647277832, "global_step": 199187, "epoch": 1185} {"train_loss": -10.977993965148926, "global_step": 199188, "epoch": 1185} {"train_loss": -10.730147361755371, "global_step": 199189, "epoch": 1185} {"train_loss": -10.751365661621094, "global_step": 199190, "epoch": 1185} {"train_loss": -10.54271411895752, "global_step": 199191, "epoch": 1185} {"train_loss": -11.103796005249023, "global_step": 199192, "epoch": 1185} {"train_loss": -10.9243745803833, "global_step": 199193, "epoch": 1185} {"train_loss": -10.99752426147461, "global_step": 199194, "epoch": 1185} {"train_loss": -10.854944229125977, "global_step": 199195, "epoch": 1185} {"train_loss": -11.21323299407959, "global_step": 199196, "epoch": 1185} {"train_loss": -10.940412521362305, "global_step": 199197, "epoch": 1185} {"train_loss": -10.913551330566406, "global_step": 199198, "epoch": 1185} {"train_loss": -10.948598861694336, "global_step": 199199, "epoch": 1185} {"train_loss": -10.684056282043457, "global_step": 199200, "epoch": 1185} {"train_loss": -10.891005516052246, "global_step": 199201, "epoch": 1185} {"train_loss": -10.750555038452148, "global_step": 199202, "epoch": 1185} {"train_loss": -10.586978912353516, "global_step": 199203, "epoch": 1185} {"train_loss": -11.211869239807129, "global_step": 199204, "epoch": 1185} {"train_loss": -11.060859680175781, "global_step": 199205, "epoch": 1185} {"train_loss": -10.457775115966797, "global_step": 199206, "epoch": 1185} {"train_loss": -11.046886444091797, "global_step": 199207, "epoch": 1185} {"train_loss": -11.048360824584961, "global_step": 199208, "epoch": 1185} {"train_loss": -10.895380020141602, "global_step": 199209, "epoch": 1185} {"train_loss": -11.12112808227539, "global_step": 199210, "epoch": 1185} {"train_loss": -11.047510147094727, "global_step": 199211, "epoch": 1185} {"train_loss": -11.162932395935059, "global_step": 199212, "epoch": 1185} {"train_loss": -11.18494987487793, "global_step": 199213, "epoch": 1185} {"train_loss": -10.868398666381836, "global_step": 199214, "epoch": 1185} {"train_loss": -11.224542617797852, "global_step": 199215, "epoch": 1185} {"train_loss": -11.12034797668457, "global_step": 199216, "epoch": 1185} {"train_loss": -11.109721183776855, "global_step": 199217, "epoch": 1185} {"train_loss": -11.234945297241211, "global_step": 199218, "epoch": 1185} {"train_loss": -11.221951484680176, "global_step": 199219, "epoch": 1185} {"train_loss": -11.25400447845459, "global_step": 199220, "epoch": 1185} {"train_loss": -11.587698936462402, "global_step": 199221, "epoch": 1185} {"train_loss": -11.639541625976562, "global_step": 199222, "epoch": 1185} {"train_loss": -11.510210037231445, "global_step": 199223, "epoch": 1185} {"train_loss": -11.541540145874023, "global_step": 199224, "epoch": 1185} {"train_loss": -11.557933807373047, "global_step": 199225, "epoch": 1185} {"train_loss": -11.485395431518555, "global_step": 199226, "epoch": 1185} {"train_loss": -11.619220733642578, "global_step": 199227, "epoch": 1185} {"train_loss": -11.268522262573242, "global_step": 199228, "epoch": 1185} {"train_loss": -11.415740966796875, "global_step": 199229, "epoch": 1185} {"train_loss": -11.482560157775879, "global_step": 199230, "epoch": 1185} {"train_loss": -11.663297653198242, "global_step": 199231, "epoch": 1185} {"train_loss": -11.672962188720703, "global_step": 199232, "epoch": 1185} {"train_loss": -11.479133605957031, "global_step": 199233, "epoch": 1185} {"train_loss": -11.539190292358398, "global_step": 199234, "epoch": 1185} {"train_loss": -11.758996963500977, "global_step": 199235, "epoch": 1185} {"train_loss": -11.667425155639648, "global_step": 199236, "epoch": 1185} {"train_loss": -11.496850967407227, "global_step": 199237, "epoch": 1185} {"train_loss": -11.653031349182129, "global_step": 199238, "epoch": 1185} {"train_loss": -11.59634780883789, "global_step": 199239, "epoch": 1185} {"train_loss": -11.73534870147705, "global_step": 199240, "epoch": 1185} {"train_loss": -11.71068000793457, "global_step": 199241, "epoch": 1185} {"train_loss": -11.676610946655273, "global_step": 199242, "epoch": 1185} {"train_loss": -11.718962669372559, "global_step": 199243, "epoch": 1185} {"train_loss": -11.735916137695312, "global_step": 199244, "epoch": 1185} {"train_loss": -11.675333976745605, "global_step": 199245, "epoch": 1185} {"train_loss": -11.63787841796875, "global_step": 199246, "epoch": 1185} {"train_loss": -11.173841782978602, "global_step": 199247, "epoch": 1185, "val_loss": 252251.53125, "train_action_mse_error": 1.331978678703308} {"train_loss": -11.743794441223145, "global_step": 199248, "epoch": 1186} {"train_loss": -11.79684066772461, "global_step": 199249, "epoch": 1186} {"train_loss": -11.625875473022461, "global_step": 199250, "epoch": 1186} {"train_loss": -11.748376846313477, "global_step": 199251, "epoch": 1186} {"train_loss": -11.809983253479004, "global_step": 199252, "epoch": 1186} {"train_loss": -11.592086791992188, "global_step": 199253, "epoch": 1186} {"train_loss": -11.661189079284668, "global_step": 199254, "epoch": 1186} {"train_loss": -11.646186828613281, "global_step": 199255, "epoch": 1186} {"train_loss": -11.759252548217773, "global_step": 199256, "epoch": 1186} {"train_loss": -11.890054702758789, "global_step": 199257, "epoch": 1186} {"train_loss": -11.567939758300781, "global_step": 199258, "epoch": 1186} {"train_loss": -11.66794204711914, "global_step": 199259, "epoch": 1186} {"train_loss": -11.502423286437988, "global_step": 199260, "epoch": 1186} {"train_loss": -11.345561981201172, "global_step": 199261, "epoch": 1186} {"train_loss": -11.681700706481934, "global_step": 199262, "epoch": 1186} {"train_loss": -11.598690032958984, "global_step": 199263, "epoch": 1186} {"train_loss": -10.814996719360352, "global_step": 199264, "epoch": 1186} {"train_loss": -11.194920539855957, "global_step": 199265, "epoch": 1186} {"train_loss": -11.372576713562012, "global_step": 199266, "epoch": 1186} {"train_loss": -11.583098411560059, "global_step": 199267, "epoch": 1186} {"train_loss": -11.352823257446289, "global_step": 199268, "epoch": 1186} {"train_loss": -11.402003288269043, "global_step": 199269, "epoch": 1186} {"train_loss": -11.70009994506836, "global_step": 199270, "epoch": 1186} {"train_loss": -11.508567810058594, "global_step": 199271, "epoch": 1186} {"train_loss": -11.143084526062012, "global_step": 199272, "epoch": 1186} {"train_loss": -11.139198303222656, "global_step": 199273, "epoch": 1186} {"train_loss": -11.575301170349121, "global_step": 199274, "epoch": 1186} {"train_loss": -11.058547973632812, "global_step": 199275, "epoch": 1186} {"train_loss": -11.5517578125, "global_step": 199276, "epoch": 1186} {"train_loss": -11.298564910888672, "global_step": 199277, "epoch": 1186} {"train_loss": -11.365095138549805, "global_step": 199278, "epoch": 1186} {"train_loss": -11.171113014221191, "global_step": 199279, "epoch": 1186} {"train_loss": -11.010442733764648, "global_step": 199280, "epoch": 1186} {"train_loss": -9.808879852294922, "global_step": 199281, "epoch": 1186} {"train_loss": -10.294361114501953, "global_step": 199282, "epoch": 1186} {"train_loss": -9.96427059173584, "global_step": 199283, "epoch": 1186} {"train_loss": -9.281723022460938, "global_step": 199284, "epoch": 1186} {"train_loss": -9.41617202758789, "global_step": 199285, "epoch": 1186} {"train_loss": -9.945205688476562, "global_step": 199286, "epoch": 1186} {"train_loss": -8.415433883666992, "global_step": 199287, "epoch": 1186} {"train_loss": -10.66436767578125, "global_step": 199288, "epoch": 1186} {"train_loss": -9.2811279296875, "global_step": 199289, "epoch": 1186} {"train_loss": -10.755889892578125, "global_step": 199290, "epoch": 1186} {"train_loss": -9.125381469726562, "global_step": 199291, "epoch": 1186} {"train_loss": -10.663358688354492, "global_step": 199292, "epoch": 1186} {"train_loss": -10.54285717010498, "global_step": 199293, "epoch": 1186} {"train_loss": -10.42651081085205, "global_step": 199294, "epoch": 1186} {"train_loss": -11.019200325012207, "global_step": 199295, "epoch": 1186} {"train_loss": -9.93146800994873, "global_step": 199296, "epoch": 1186} {"train_loss": -10.96213150024414, "global_step": 199297, "epoch": 1186} {"train_loss": -10.085118293762207, "global_step": 199298, "epoch": 1186} {"train_loss": -10.415617942810059, "global_step": 199299, "epoch": 1186} {"train_loss": -10.834566116333008, "global_step": 199300, "epoch": 1186} {"train_loss": -10.291278839111328, "global_step": 199301, "epoch": 1186} {"train_loss": -10.399848937988281, "global_step": 199302, "epoch": 1186} {"train_loss": -10.70748233795166, "global_step": 199303, "epoch": 1186} {"train_loss": -10.472776412963867, "global_step": 199304, "epoch": 1186} {"train_loss": -11.190194129943848, "global_step": 199305, "epoch": 1186} {"train_loss": -10.876802444458008, "global_step": 199306, "epoch": 1186} {"train_loss": -10.79847526550293, "global_step": 199307, "epoch": 1186} {"train_loss": -10.945698738098145, "global_step": 199308, "epoch": 1186} {"train_loss": -11.170299530029297, "global_step": 199309, "epoch": 1186} {"train_loss": -10.846883773803711, "global_step": 199310, "epoch": 1186} {"train_loss": -11.342341423034668, "global_step": 199311, "epoch": 1186} {"train_loss": -10.768387794494629, "global_step": 199312, "epoch": 1186} {"train_loss": -11.09330940246582, "global_step": 199313, "epoch": 1186} {"train_loss": -11.100200653076172, "global_step": 199314, "epoch": 1186} {"train_loss": -11.165192604064941, "global_step": 199315, "epoch": 1186} {"train_loss": -11.274402618408203, "global_step": 199316, "epoch": 1186} {"train_loss": -10.795276641845703, "global_step": 199317, "epoch": 1186} {"train_loss": -11.423721313476562, "global_step": 199318, "epoch": 1186} {"train_loss": -11.21112060546875, "global_step": 199319, "epoch": 1186} {"train_loss": -11.241971969604492, "global_step": 199320, "epoch": 1186} {"train_loss": -11.099265098571777, "global_step": 199321, "epoch": 1186} {"train_loss": -11.243144989013672, "global_step": 199322, "epoch": 1186} {"train_loss": -11.25625228881836, "global_step": 199323, "epoch": 1186} {"train_loss": -10.945807456970215, "global_step": 199324, "epoch": 1186} {"train_loss": -11.244662284851074, "global_step": 199325, "epoch": 1186} {"train_loss": -10.712930679321289, "global_step": 199326, "epoch": 1186} {"train_loss": -11.254842758178711, "global_step": 199327, "epoch": 1186} {"train_loss": -10.778690338134766, "global_step": 199328, "epoch": 1186} {"train_loss": -11.401049613952637, "global_step": 199329, "epoch": 1186} {"train_loss": -10.942782402038574, "global_step": 199330, "epoch": 1186} {"train_loss": -11.408485412597656, "global_step": 199331, "epoch": 1186} {"train_loss": -11.320999145507812, "global_step": 199332, "epoch": 1186} {"train_loss": -11.17819595336914, "global_step": 199333, "epoch": 1186} {"train_loss": -11.215251922607422, "global_step": 199334, "epoch": 1186} {"train_loss": -11.334635734558105, "global_step": 199335, "epoch": 1186} {"train_loss": -11.26569938659668, "global_step": 199336, "epoch": 1186} {"train_loss": -10.331074714660645, "global_step": 199337, "epoch": 1186} {"train_loss": -11.221153259277344, "global_step": 199338, "epoch": 1186} {"train_loss": -10.581033706665039, "global_step": 199339, "epoch": 1186} {"train_loss": -11.117025375366211, "global_step": 199340, "epoch": 1186} {"train_loss": -10.74775505065918, "global_step": 199341, "epoch": 1186} {"train_loss": -11.221878051757812, "global_step": 199342, "epoch": 1186} {"train_loss": -10.816158294677734, "global_step": 199343, "epoch": 1186} {"train_loss": -11.068421363830566, "global_step": 199344, "epoch": 1186} {"train_loss": -10.970613479614258, "global_step": 199345, "epoch": 1186} {"train_loss": -11.418350219726562, "global_step": 199346, "epoch": 1186} {"train_loss": -11.216904640197754, "global_step": 199347, "epoch": 1186} {"train_loss": -11.197159767150879, "global_step": 199348, "epoch": 1186} {"train_loss": -11.334405899047852, "global_step": 199349, "epoch": 1186} {"train_loss": -10.936095237731934, "global_step": 199350, "epoch": 1186} {"train_loss": -11.45016098022461, "global_step": 199351, "epoch": 1186} {"train_loss": -11.039411544799805, "global_step": 199352, "epoch": 1186} {"train_loss": -11.449597358703613, "global_step": 199353, "epoch": 1186} {"train_loss": -11.28669548034668, "global_step": 199354, "epoch": 1186} {"train_loss": -11.178030967712402, "global_step": 199355, "epoch": 1186} {"train_loss": -11.241792678833008, "global_step": 199356, "epoch": 1186} {"train_loss": -11.15441608428955, "global_step": 199357, "epoch": 1186} {"train_loss": -11.004822731018066, "global_step": 199358, "epoch": 1186} {"train_loss": -11.266765594482422, "global_step": 199359, "epoch": 1186} {"train_loss": -11.340682029724121, "global_step": 199360, "epoch": 1186} {"train_loss": -11.232707023620605, "global_step": 199361, "epoch": 1186} {"train_loss": -11.496335983276367, "global_step": 199362, "epoch": 1186} {"train_loss": -11.45016098022461, "global_step": 199363, "epoch": 1186} {"train_loss": -11.28419303894043, "global_step": 199364, "epoch": 1186} {"train_loss": -11.60688591003418, "global_step": 199365, "epoch": 1186} {"train_loss": -11.579633712768555, "global_step": 199366, "epoch": 1186} {"train_loss": -11.301350593566895, "global_step": 199367, "epoch": 1186} {"train_loss": -11.406652450561523, "global_step": 199368, "epoch": 1186} {"train_loss": -11.528257369995117, "global_step": 199369, "epoch": 1186} {"train_loss": -11.564340591430664, "global_step": 199370, "epoch": 1186} {"train_loss": -11.193727493286133, "global_step": 199371, "epoch": 1186} {"train_loss": -11.507582664489746, "global_step": 199372, "epoch": 1186} {"train_loss": -11.246685981750488, "global_step": 199373, "epoch": 1186} {"train_loss": -11.421192169189453, "global_step": 199374, "epoch": 1186} {"train_loss": -11.663833618164062, "global_step": 199375, "epoch": 1186} {"train_loss": -11.513158798217773, "global_step": 199376, "epoch": 1186} {"train_loss": -11.644103050231934, "global_step": 199377, "epoch": 1186} {"train_loss": -11.46722412109375, "global_step": 199378, "epoch": 1186} {"train_loss": -11.521425247192383, "global_step": 199379, "epoch": 1186} {"train_loss": -11.527687072753906, "global_step": 199380, "epoch": 1186} {"train_loss": -11.440622329711914, "global_step": 199381, "epoch": 1186} {"train_loss": -11.552754402160645, "global_step": 199382, "epoch": 1186} {"train_loss": -11.177467346191406, "global_step": 199383, "epoch": 1186} {"train_loss": -11.491025924682617, "global_step": 199384, "epoch": 1186} {"train_loss": -11.42282485961914, "global_step": 199385, "epoch": 1186} {"train_loss": -11.252713203430176, "global_step": 199386, "epoch": 1186} {"train_loss": -11.526556968688965, "global_step": 199387, "epoch": 1186} {"train_loss": -11.437850952148438, "global_step": 199388, "epoch": 1186} {"train_loss": -11.55372142791748, "global_step": 199389, "epoch": 1186} {"train_loss": -11.174570083618164, "global_step": 199390, "epoch": 1186} {"train_loss": -11.551098823547363, "global_step": 199391, "epoch": 1186} {"train_loss": -11.077982902526855, "global_step": 199392, "epoch": 1186} {"train_loss": -11.469368934631348, "global_step": 199393, "epoch": 1186} {"train_loss": -10.862544059753418, "global_step": 199394, "epoch": 1186} {"train_loss": -11.575759887695312, "global_step": 199395, "epoch": 1186} {"train_loss": -11.368886947631836, "global_step": 199396, "epoch": 1186} {"train_loss": -11.778453826904297, "global_step": 199397, "epoch": 1186} {"train_loss": -11.097489356994629, "global_step": 199398, "epoch": 1186} {"train_loss": -11.473628997802734, "global_step": 199399, "epoch": 1186} {"train_loss": -11.54486083984375, "global_step": 199400, "epoch": 1186} {"train_loss": -11.636624336242676, "global_step": 199401, "epoch": 1186} {"train_loss": -11.63597583770752, "global_step": 199402, "epoch": 1186} {"train_loss": -11.44926643371582, "global_step": 199403, "epoch": 1186} {"train_loss": -11.135708808898926, "global_step": 199404, "epoch": 1186} {"train_loss": -11.773576736450195, "global_step": 199405, "epoch": 1186} {"train_loss": -11.05687427520752, "global_step": 199406, "epoch": 1186} {"train_loss": -11.266962051391602, "global_step": 199407, "epoch": 1186} {"train_loss": -11.562759399414062, "global_step": 199408, "epoch": 1186} {"train_loss": -11.792131423950195, "global_step": 199409, "epoch": 1186} {"train_loss": -11.481008529663086, "global_step": 199410, "epoch": 1186} {"train_loss": -11.713406562805176, "global_step": 199411, "epoch": 1186} {"train_loss": -11.36107349395752, "global_step": 199412, "epoch": 1186} {"train_loss": -11.364303588867188, "global_step": 199413, "epoch": 1186} {"train_loss": -11.681382179260254, "global_step": 199414, "epoch": 1186} {"train_loss": -11.157734269187564, "global_step": 199415, "epoch": 1186, "val_loss": 248905.09375} {"train_loss": -11.299099922180176, "global_step": 199416, "epoch": 1187} {"train_loss": -11.548112869262695, "global_step": 199417, "epoch": 1187} {"train_loss": -11.53281021118164, "global_step": 199418, "epoch": 1187} {"train_loss": -11.327001571655273, "global_step": 199419, "epoch": 1187} {"train_loss": -11.13275146484375, "global_step": 199420, "epoch": 1187} {"train_loss": -11.171825408935547, "global_step": 199421, "epoch": 1187} {"train_loss": -11.672439575195312, "global_step": 199422, "epoch": 1187} {"train_loss": -10.884268760681152, "global_step": 199423, "epoch": 1187} {"train_loss": -11.558892250061035, "global_step": 199424, "epoch": 1187} {"train_loss": -10.940998077392578, "global_step": 199425, "epoch": 1187} {"train_loss": -11.054330825805664, "global_step": 199426, "epoch": 1187} {"train_loss": -11.438151359558105, "global_step": 199427, "epoch": 1187} {"train_loss": -10.241196632385254, "global_step": 199428, "epoch": 1187} {"train_loss": -11.29212474822998, "global_step": 199429, "epoch": 1187} {"train_loss": -10.719829559326172, "global_step": 199430, "epoch": 1187} {"train_loss": -10.088817596435547, "global_step": 199431, "epoch": 1187} {"train_loss": -10.62547779083252, "global_step": 199432, "epoch": 1187} {"train_loss": -11.530881881713867, "global_step": 199433, "epoch": 1187} {"train_loss": -10.640225410461426, "global_step": 199434, "epoch": 1187} {"train_loss": -11.540903091430664, "global_step": 199435, "epoch": 1187} {"train_loss": -11.074380874633789, "global_step": 199436, "epoch": 1187} {"train_loss": -10.958395004272461, "global_step": 199437, "epoch": 1187} {"train_loss": -11.484297752380371, "global_step": 199438, "epoch": 1187} {"train_loss": -11.097516059875488, "global_step": 199439, "epoch": 1187} {"train_loss": -11.12147331237793, "global_step": 199440, "epoch": 1187} {"train_loss": -11.172410011291504, "global_step": 199441, "epoch": 1187} {"train_loss": -10.923569679260254, "global_step": 199442, "epoch": 1187} {"train_loss": -11.187492370605469, "global_step": 199443, "epoch": 1187} {"train_loss": -11.107776641845703, "global_step": 199444, "epoch": 1187} {"train_loss": -11.520605087280273, "global_step": 199445, "epoch": 1187} {"train_loss": -11.004199981689453, "global_step": 199446, "epoch": 1187} {"train_loss": -11.376914978027344, "global_step": 199447, "epoch": 1187} {"train_loss": -10.919654846191406, "global_step": 199448, "epoch": 1187} {"train_loss": -11.324195861816406, "global_step": 199449, "epoch": 1187} {"train_loss": -11.173966407775879, "global_step": 199450, "epoch": 1187} {"train_loss": -11.0546875, "global_step": 199451, "epoch": 1187} {"train_loss": -11.156709671020508, "global_step": 199452, "epoch": 1187} {"train_loss": -10.69721794128418, "global_step": 199453, "epoch": 1187} {"train_loss": -10.853155136108398, "global_step": 199454, "epoch": 1187} {"train_loss": -11.256376266479492, "global_step": 199455, "epoch": 1187} {"train_loss": -10.482131004333496, "global_step": 199456, "epoch": 1187} {"train_loss": -11.276775360107422, "global_step": 199457, "epoch": 1187} {"train_loss": -10.569290161132812, "global_step": 199458, "epoch": 1187} {"train_loss": -11.0458345413208, "global_step": 199459, "epoch": 1187} {"train_loss": -10.912288665771484, "global_step": 199460, "epoch": 1187} {"train_loss": -10.895242691040039, "global_step": 199461, "epoch": 1187} {"train_loss": -10.892147064208984, "global_step": 199462, "epoch": 1187} {"train_loss": -10.952204704284668, "global_step": 199463, "epoch": 1187} {"train_loss": -10.31521224975586, "global_step": 199464, "epoch": 1187} {"train_loss": -10.849815368652344, "global_step": 199465, "epoch": 1187} {"train_loss": -10.673996925354004, "global_step": 199466, "epoch": 1187} {"train_loss": -11.26760196685791, "global_step": 199467, "epoch": 1187} {"train_loss": -10.672616958618164, "global_step": 199468, "epoch": 1187} {"train_loss": -11.15903091430664, "global_step": 199469, "epoch": 1187} {"train_loss": -10.913690567016602, "global_step": 199470, "epoch": 1187} {"train_loss": -11.247161865234375, "global_step": 199471, "epoch": 1187} {"train_loss": -11.034051895141602, "global_step": 199472, "epoch": 1187} {"train_loss": -11.182487487792969, "global_step": 199473, "epoch": 1187} {"train_loss": -11.282346725463867, "global_step": 199474, "epoch": 1187} {"train_loss": -11.061853408813477, "global_step": 199475, "epoch": 1187} {"train_loss": -11.500481605529785, "global_step": 199476, "epoch": 1187} {"train_loss": -11.393594741821289, "global_step": 199477, "epoch": 1187} {"train_loss": -11.432491302490234, "global_step": 199478, "epoch": 1187} {"train_loss": -11.29868221282959, "global_step": 199479, "epoch": 1187} {"train_loss": -11.423298835754395, "global_step": 199480, "epoch": 1187} {"train_loss": -11.377752304077148, "global_step": 199481, "epoch": 1187} {"train_loss": -11.513103485107422, "global_step": 199482, "epoch": 1187} {"train_loss": -11.482497215270996, "global_step": 199483, "epoch": 1187} {"train_loss": -11.312285423278809, "global_step": 199484, "epoch": 1187} {"train_loss": -11.645102500915527, "global_step": 199485, "epoch": 1187} {"train_loss": -11.255611419677734, "global_step": 199486, "epoch": 1187} {"train_loss": -11.349082946777344, "global_step": 199487, "epoch": 1187} {"train_loss": -11.30154037475586, "global_step": 199488, "epoch": 1187} {"train_loss": -11.530014038085938, "global_step": 199489, "epoch": 1187} {"train_loss": -11.149171829223633, "global_step": 199490, "epoch": 1187} {"train_loss": -11.424981117248535, "global_step": 199491, "epoch": 1187} {"train_loss": -11.643270492553711, "global_step": 199492, "epoch": 1187} {"train_loss": -11.335509300231934, "global_step": 199493, "epoch": 1187} {"train_loss": -11.673877716064453, "global_step": 199494, "epoch": 1187} {"train_loss": -11.455228805541992, "global_step": 199495, "epoch": 1187} {"train_loss": -11.552831649780273, "global_step": 199496, "epoch": 1187} {"train_loss": -11.518512725830078, "global_step": 199497, "epoch": 1187} {"train_loss": -11.546497344970703, "global_step": 199498, "epoch": 1187} {"train_loss": -11.680242538452148, "global_step": 199499, "epoch": 1187} {"train_loss": -11.429802894592285, "global_step": 199500, "epoch": 1187} {"train_loss": -11.67603874206543, "global_step": 199501, "epoch": 1187} {"train_loss": -11.34707260131836, "global_step": 199502, "epoch": 1187} {"train_loss": -11.556556701660156, "global_step": 199503, "epoch": 1187} {"train_loss": -11.437043190002441, "global_step": 199504, "epoch": 1187} {"train_loss": -11.680964469909668, "global_step": 199505, "epoch": 1187} {"train_loss": -11.181695938110352, "global_step": 199506, "epoch": 1187} {"train_loss": -11.645612716674805, "global_step": 199507, "epoch": 1187} {"train_loss": -11.406119346618652, "global_step": 199508, "epoch": 1187} {"train_loss": -11.510380744934082, "global_step": 199509, "epoch": 1187} {"train_loss": -11.73390007019043, "global_step": 199510, "epoch": 1187} {"train_loss": -11.617459297180176, "global_step": 199511, "epoch": 1187} {"train_loss": -11.639427185058594, "global_step": 199512, "epoch": 1187} {"train_loss": -11.638050079345703, "global_step": 199513, "epoch": 1187} {"train_loss": -11.556072235107422, "global_step": 199514, "epoch": 1187} {"train_loss": -11.576071739196777, "global_step": 199515, "epoch": 1187} {"train_loss": -11.661684036254883, "global_step": 199516, "epoch": 1187} {"train_loss": -11.926880836486816, "global_step": 199517, "epoch": 1187} {"train_loss": -11.8834810256958, "global_step": 199518, "epoch": 1187} {"train_loss": -11.816583633422852, "global_step": 199519, "epoch": 1187} {"train_loss": -11.754617691040039, "global_step": 199520, "epoch": 1187} {"train_loss": -11.784305572509766, "global_step": 199521, "epoch": 1187} {"train_loss": -11.732404708862305, "global_step": 199522, "epoch": 1187} {"train_loss": -11.467781066894531, "global_step": 199523, "epoch": 1187} {"train_loss": -11.732905387878418, "global_step": 199524, "epoch": 1187} {"train_loss": -11.767630577087402, "global_step": 199525, "epoch": 1187} {"train_loss": -11.577423095703125, "global_step": 199526, "epoch": 1187} {"train_loss": -11.450275421142578, "global_step": 199527, "epoch": 1187} {"train_loss": -11.898181915283203, "global_step": 199528, "epoch": 1187} {"train_loss": -11.483657836914062, "global_step": 199529, "epoch": 1187} {"train_loss": -11.640151023864746, "global_step": 199530, "epoch": 1187} {"train_loss": -11.482587814331055, "global_step": 199531, "epoch": 1187} {"train_loss": -11.368860244750977, "global_step": 199532, "epoch": 1187} {"train_loss": -11.256675720214844, "global_step": 199533, "epoch": 1187} {"train_loss": -10.94500732421875, "global_step": 199534, "epoch": 1187} {"train_loss": -11.191581726074219, "global_step": 199535, "epoch": 1187} {"train_loss": -11.005450248718262, "global_step": 199536, "epoch": 1187} {"train_loss": -11.12320613861084, "global_step": 199537, "epoch": 1187} {"train_loss": -10.260318756103516, "global_step": 199538, "epoch": 1187} {"train_loss": -10.809244155883789, "global_step": 199539, "epoch": 1187} {"train_loss": -10.360750198364258, "global_step": 199540, "epoch": 1187} {"train_loss": -10.384342193603516, "global_step": 199541, "epoch": 1187} {"train_loss": -10.583151817321777, "global_step": 199542, "epoch": 1187} {"train_loss": -9.885139465332031, "global_step": 199543, "epoch": 1187} {"train_loss": -9.90987777709961, "global_step": 199544, "epoch": 1187} {"train_loss": -10.079790115356445, "global_step": 199545, "epoch": 1187} {"train_loss": -9.7691011428833, "global_step": 199546, "epoch": 1187} {"train_loss": -9.767963409423828, "global_step": 199547, "epoch": 1187} {"train_loss": -8.914201736450195, "global_step": 199548, "epoch": 1187} {"train_loss": -9.573116302490234, "global_step": 199549, "epoch": 1187} {"train_loss": -10.345952987670898, "global_step": 199550, "epoch": 1187} {"train_loss": -9.855121612548828, "global_step": 199551, "epoch": 1187} {"train_loss": -10.449352264404297, "global_step": 199552, "epoch": 1187} {"train_loss": -9.872718811035156, "global_step": 199553, "epoch": 1187} {"train_loss": -9.751012802124023, "global_step": 199554, "epoch": 1187} {"train_loss": -9.759729385375977, "global_step": 199555, "epoch": 1187} {"train_loss": -9.673831939697266, "global_step": 199556, "epoch": 1187} {"train_loss": -9.788919448852539, "global_step": 199557, "epoch": 1187} {"train_loss": -10.113561630249023, "global_step": 199558, "epoch": 1187} {"train_loss": -10.52843189239502, "global_step": 199559, "epoch": 1187} {"train_loss": -10.185575485229492, "global_step": 199560, "epoch": 1187} {"train_loss": -9.916627883911133, "global_step": 199561, "epoch": 1187} {"train_loss": -10.906750679016113, "global_step": 199562, "epoch": 1187} {"train_loss": -10.21660041809082, "global_step": 199563, "epoch": 1187} {"train_loss": -10.392566680908203, "global_step": 199564, "epoch": 1187} {"train_loss": -10.75229263305664, "global_step": 199565, "epoch": 1187} {"train_loss": -9.988142013549805, "global_step": 199566, "epoch": 1187} {"train_loss": -10.696943283081055, "global_step": 199567, "epoch": 1187} {"train_loss": -10.369919776916504, "global_step": 199568, "epoch": 1187} {"train_loss": -10.74355697631836, "global_step": 199569, "epoch": 1187} {"train_loss": -10.469345092773438, "global_step": 199570, "epoch": 1187} {"train_loss": -11.153611183166504, "global_step": 199571, "epoch": 1187} {"train_loss": -10.888272285461426, "global_step": 199572, "epoch": 1187} {"train_loss": -10.615738868713379, "global_step": 199573, "epoch": 1187} {"train_loss": -11.09390926361084, "global_step": 199574, "epoch": 1187} {"train_loss": -10.913156509399414, "global_step": 199575, "epoch": 1187} {"train_loss": -10.817270278930664, "global_step": 199576, "epoch": 1187} {"train_loss": -11.068707466125488, "global_step": 199577, "epoch": 1187} {"train_loss": -11.089641571044922, "global_step": 199578, "epoch": 1187} {"train_loss": -11.141654968261719, "global_step": 199579, "epoch": 1187} {"train_loss": -11.040169715881348, "global_step": 199580, "epoch": 1187} {"train_loss": -11.28981876373291, "global_step": 199581, "epoch": 1187} {"train_loss": -11.224210739135742, "global_step": 199582, "epoch": 1187} {"train_loss": -11.044474681218466, "global_step": 199583, "epoch": 1187, "val_loss": 248295.140625} {"train_loss": -11.01361083984375, "global_step": 199584, "epoch": 1188} {"train_loss": -11.350379943847656, "global_step": 199585, "epoch": 1188} {"train_loss": -11.202848434448242, "global_step": 199586, "epoch": 1188} {"train_loss": -11.333816528320312, "global_step": 199587, "epoch": 1188} {"train_loss": -11.119827270507812, "global_step": 199588, "epoch": 1188} {"train_loss": -11.393733978271484, "global_step": 199589, "epoch": 1188} {"train_loss": -11.260977745056152, "global_step": 199590, "epoch": 1188} {"train_loss": -11.063446998596191, "global_step": 199591, "epoch": 1188} {"train_loss": -11.252182960510254, "global_step": 199592, "epoch": 1188} {"train_loss": -11.193076133728027, "global_step": 199593, "epoch": 1188} {"train_loss": -11.329730987548828, "global_step": 199594, "epoch": 1188} {"train_loss": -11.292491912841797, "global_step": 199595, "epoch": 1188} {"train_loss": -11.266901016235352, "global_step": 199596, "epoch": 1188} {"train_loss": -11.384047508239746, "global_step": 199597, "epoch": 1188} {"train_loss": -11.437995910644531, "global_step": 199598, "epoch": 1188} {"train_loss": -11.289847373962402, "global_step": 199599, "epoch": 1188} {"train_loss": -11.359039306640625, "global_step": 199600, "epoch": 1188} {"train_loss": -11.283262252807617, "global_step": 199601, "epoch": 1188} {"train_loss": -11.439913749694824, "global_step": 199602, "epoch": 1188} {"train_loss": -11.300159454345703, "global_step": 199603, "epoch": 1188} {"train_loss": -11.640982627868652, "global_step": 199604, "epoch": 1188} {"train_loss": -11.549139022827148, "global_step": 199605, "epoch": 1188} {"train_loss": -11.415831565856934, "global_step": 199606, "epoch": 1188} {"train_loss": -11.555232048034668, "global_step": 199607, "epoch": 1188} {"train_loss": -11.652567863464355, "global_step": 199608, "epoch": 1188} {"train_loss": -11.33116626739502, "global_step": 199609, "epoch": 1188} {"train_loss": -11.475021362304688, "global_step": 199610, "epoch": 1188} {"train_loss": -11.661145210266113, "global_step": 199611, "epoch": 1188} {"train_loss": -11.584935188293457, "global_step": 199612, "epoch": 1188} {"train_loss": -11.358484268188477, "global_step": 199613, "epoch": 1188} {"train_loss": -11.529613494873047, "global_step": 199614, "epoch": 1188} {"train_loss": -11.583684921264648, "global_step": 199615, "epoch": 1188} {"train_loss": -11.4598388671875, "global_step": 199616, "epoch": 1188} {"train_loss": -11.699764251708984, "global_step": 199617, "epoch": 1188} {"train_loss": -11.42438793182373, "global_step": 199618, "epoch": 1188} {"train_loss": -11.45814037322998, "global_step": 199619, "epoch": 1188} {"train_loss": -11.72612190246582, "global_step": 199620, "epoch": 1188} {"train_loss": -11.659002304077148, "global_step": 199621, "epoch": 1188} {"train_loss": -11.834214210510254, "global_step": 199622, "epoch": 1188} {"train_loss": -11.63998794555664, "global_step": 199623, "epoch": 1188} {"train_loss": -11.586748123168945, "global_step": 199624, "epoch": 1188} {"train_loss": -11.635454177856445, "global_step": 199625, "epoch": 1188} {"train_loss": -11.768350601196289, "global_step": 199626, "epoch": 1188} {"train_loss": -11.407402038574219, "global_step": 199627, "epoch": 1188} {"train_loss": -11.6928129196167, "global_step": 199628, "epoch": 1188} {"train_loss": -11.562769889831543, "global_step": 199629, "epoch": 1188} {"train_loss": -11.797682762145996, "global_step": 199630, "epoch": 1188} {"train_loss": -11.580463409423828, "global_step": 199631, "epoch": 1188} {"train_loss": -11.647050857543945, "global_step": 199632, "epoch": 1188} {"train_loss": -11.780243873596191, "global_step": 199633, "epoch": 1188} {"train_loss": -11.45498275756836, "global_step": 199634, "epoch": 1188} {"train_loss": -11.527420997619629, "global_step": 199635, "epoch": 1188} {"train_loss": -11.393033981323242, "global_step": 199636, "epoch": 1188} {"train_loss": -11.368135452270508, "global_step": 199637, "epoch": 1188} {"train_loss": -11.693044662475586, "global_step": 199638, "epoch": 1188} {"train_loss": -11.597965240478516, "global_step": 199639, "epoch": 1188} {"train_loss": -11.462684631347656, "global_step": 199640, "epoch": 1188} {"train_loss": -11.500358581542969, "global_step": 199641, "epoch": 1188} {"train_loss": -11.188455581665039, "global_step": 199642, "epoch": 1188} {"train_loss": -11.07308578491211, "global_step": 199643, "epoch": 1188} {"train_loss": -11.030694007873535, "global_step": 199644, "epoch": 1188} {"train_loss": -11.009984970092773, "global_step": 199645, "epoch": 1188} {"train_loss": -11.859488487243652, "global_step": 199646, "epoch": 1188} {"train_loss": -11.138723373413086, "global_step": 199647, "epoch": 1188} {"train_loss": -11.389384269714355, "global_step": 199648, "epoch": 1188} {"train_loss": -11.292312622070312, "global_step": 199649, "epoch": 1188} {"train_loss": -11.339378356933594, "global_step": 199650, "epoch": 1188} {"train_loss": -10.530975341796875, "global_step": 199651, "epoch": 1188} {"train_loss": -10.615213394165039, "global_step": 199652, "epoch": 1188} {"train_loss": -11.176292419433594, "global_step": 199653, "epoch": 1188} {"train_loss": -9.90998649597168, "global_step": 199654, "epoch": 1188} {"train_loss": -9.970233917236328, "global_step": 199655, "epoch": 1188} {"train_loss": -11.054670333862305, "global_step": 199656, "epoch": 1188} {"train_loss": -10.647049903869629, "global_step": 199657, "epoch": 1188} {"train_loss": -10.572183609008789, "global_step": 199658, "epoch": 1188} {"train_loss": -11.208752632141113, "global_step": 199659, "epoch": 1188} {"train_loss": -11.063976287841797, "global_step": 199660, "epoch": 1188} {"train_loss": -11.11378288269043, "global_step": 199661, "epoch": 1188} {"train_loss": -11.461603164672852, "global_step": 199662, "epoch": 1188} {"train_loss": -10.804769515991211, "global_step": 199663, "epoch": 1188} {"train_loss": -11.104625701904297, "global_step": 199664, "epoch": 1188} {"train_loss": -11.00278377532959, "global_step": 199665, "epoch": 1188} {"train_loss": -11.303079605102539, "global_step": 199666, "epoch": 1188} {"train_loss": -10.94904899597168, "global_step": 199667, "epoch": 1188} {"train_loss": -10.985352516174316, "global_step": 199668, "epoch": 1188} {"train_loss": -11.341036796569824, "global_step": 199669, "epoch": 1188} {"train_loss": -11.055328369140625, "global_step": 199670, "epoch": 1188} {"train_loss": -10.921531677246094, "global_step": 199671, "epoch": 1188} {"train_loss": -11.325486183166504, "global_step": 199672, "epoch": 1188} {"train_loss": -11.104753494262695, "global_step": 199673, "epoch": 1188} {"train_loss": -11.305546760559082, "global_step": 199674, "epoch": 1188} {"train_loss": -11.364506721496582, "global_step": 199675, "epoch": 1188} {"train_loss": -11.0499849319458, "global_step": 199676, "epoch": 1188} {"train_loss": -11.431981086730957, "global_step": 199677, "epoch": 1188} {"train_loss": -11.220041275024414, "global_step": 199678, "epoch": 1188} {"train_loss": -11.337315559387207, "global_step": 199679, "epoch": 1188} {"train_loss": -11.51417350769043, "global_step": 199680, "epoch": 1188} {"train_loss": -11.158731460571289, "global_step": 199681, "epoch": 1188} {"train_loss": -11.289949417114258, "global_step": 199682, "epoch": 1188} {"train_loss": -11.357414245605469, "global_step": 199683, "epoch": 1188} {"train_loss": -11.347314834594727, "global_step": 199684, "epoch": 1188} {"train_loss": -11.280416488647461, "global_step": 199685, "epoch": 1188} {"train_loss": -11.293312072753906, "global_step": 199686, "epoch": 1188} {"train_loss": -11.464689254760742, "global_step": 199687, "epoch": 1188} {"train_loss": -11.623830795288086, "global_step": 199688, "epoch": 1188} {"train_loss": -11.421616554260254, "global_step": 199689, "epoch": 1188} {"train_loss": -11.596084594726562, "global_step": 199690, "epoch": 1188} {"train_loss": -11.523614883422852, "global_step": 199691, "epoch": 1188} {"train_loss": -11.564300537109375, "global_step": 199692, "epoch": 1188} {"train_loss": -11.314743995666504, "global_step": 199693, "epoch": 1188} {"train_loss": -11.54263973236084, "global_step": 199694, "epoch": 1188} {"train_loss": -11.521796226501465, "global_step": 199695, "epoch": 1188} {"train_loss": -11.463127136230469, "global_step": 199696, "epoch": 1188} {"train_loss": -11.409481048583984, "global_step": 199697, "epoch": 1188} {"train_loss": -11.391355514526367, "global_step": 199698, "epoch": 1188} {"train_loss": -11.835895538330078, "global_step": 199699, "epoch": 1188} {"train_loss": -11.394014358520508, "global_step": 199700, "epoch": 1188} {"train_loss": -11.445272445678711, "global_step": 199701, "epoch": 1188} {"train_loss": -11.65994644165039, "global_step": 199702, "epoch": 1188} {"train_loss": -11.156608581542969, "global_step": 199703, "epoch": 1188} {"train_loss": -10.84897232055664, "global_step": 199704, "epoch": 1188} {"train_loss": -11.534078598022461, "global_step": 199705, "epoch": 1188} {"train_loss": -11.089912414550781, "global_step": 199706, "epoch": 1188} {"train_loss": -11.519936561584473, "global_step": 199707, "epoch": 1188} {"train_loss": -11.705504417419434, "global_step": 199708, "epoch": 1188} {"train_loss": -11.607919692993164, "global_step": 199709, "epoch": 1188} {"train_loss": -11.474523544311523, "global_step": 199710, "epoch": 1188} {"train_loss": -11.542052268981934, "global_step": 199711, "epoch": 1188} {"train_loss": -11.477246284484863, "global_step": 199712, "epoch": 1188} {"train_loss": -11.551887512207031, "global_step": 199713, "epoch": 1188} {"train_loss": -11.630170822143555, "global_step": 199714, "epoch": 1188} {"train_loss": -11.329100608825684, "global_step": 199715, "epoch": 1188} {"train_loss": -11.496550559997559, "global_step": 199716, "epoch": 1188} {"train_loss": -10.853111267089844, "global_step": 199717, "epoch": 1188} {"train_loss": -10.944647789001465, "global_step": 199718, "epoch": 1188} {"train_loss": -11.122940063476562, "global_step": 199719, "epoch": 1188} {"train_loss": -11.129262924194336, "global_step": 199720, "epoch": 1188} {"train_loss": -10.500898361206055, "global_step": 199721, "epoch": 1188} {"train_loss": -11.448421478271484, "global_step": 199722, "epoch": 1188} {"train_loss": -11.375847816467285, "global_step": 199723, "epoch": 1188} {"train_loss": -10.901594161987305, "global_step": 199724, "epoch": 1188} {"train_loss": -11.223928451538086, "global_step": 199725, "epoch": 1188} {"train_loss": -11.534610748291016, "global_step": 199726, "epoch": 1188} {"train_loss": -10.916111946105957, "global_step": 199727, "epoch": 1188} {"train_loss": -11.139732360839844, "global_step": 199728, "epoch": 1188} {"train_loss": -10.681503295898438, "global_step": 199729, "epoch": 1188} {"train_loss": -11.265411376953125, "global_step": 199730, "epoch": 1188} {"train_loss": -11.158247947692871, "global_step": 199731, "epoch": 1188} {"train_loss": -10.837167739868164, "global_step": 199732, "epoch": 1188} {"train_loss": -11.287664413452148, "global_step": 199733, "epoch": 1188} {"train_loss": -10.496204376220703, "global_step": 199734, "epoch": 1188} {"train_loss": -11.0859956741333, "global_step": 199735, "epoch": 1188} {"train_loss": -11.220924377441406, "global_step": 199736, "epoch": 1188} {"train_loss": -10.514761924743652, "global_step": 199737, "epoch": 1188} {"train_loss": -11.470672607421875, "global_step": 199738, "epoch": 1188} {"train_loss": -10.992059707641602, "global_step": 199739, "epoch": 1188} {"train_loss": -10.995943069458008, "global_step": 199740, "epoch": 1188} {"train_loss": -11.326061248779297, "global_step": 199741, "epoch": 1188} {"train_loss": -11.03832721710205, "global_step": 199742, "epoch": 1188} {"train_loss": -11.470115661621094, "global_step": 199743, "epoch": 1188} {"train_loss": -11.253397941589355, "global_step": 199744, "epoch": 1188} {"train_loss": -11.41342544555664, "global_step": 199745, "epoch": 1188} {"train_loss": -11.658857345581055, "global_step": 199746, "epoch": 1188} {"train_loss": -11.263280868530273, "global_step": 199747, "epoch": 1188} {"train_loss": -11.35678482055664, "global_step": 199748, "epoch": 1188} {"train_loss": -11.465517044067383, "global_step": 199749, "epoch": 1188} {"train_loss": -11.462295532226562, "global_step": 199750, "epoch": 1188} {"train_loss": -11.305481133006868, "global_step": 199751, "epoch": 1188, "val_loss": 252448.8125} {"train_loss": -11.211151123046875, "global_step": 199752, "epoch": 1189} {"train_loss": -11.451982498168945, "global_step": 199753, "epoch": 1189} {"train_loss": -11.371868133544922, "global_step": 199754, "epoch": 1189} {"train_loss": -11.339189529418945, "global_step": 199755, "epoch": 1189} {"train_loss": -11.36914348602295, "global_step": 199756, "epoch": 1189} {"train_loss": -11.113353729248047, "global_step": 199757, "epoch": 1189} {"train_loss": -11.577611923217773, "global_step": 199758, "epoch": 1189} {"train_loss": -11.138964653015137, "global_step": 199759, "epoch": 1189} {"train_loss": -11.655370712280273, "global_step": 199760, "epoch": 1189} {"train_loss": -11.450567245483398, "global_step": 199761, "epoch": 1189} {"train_loss": -11.486223220825195, "global_step": 199762, "epoch": 1189} {"train_loss": -11.552886962890625, "global_step": 199763, "epoch": 1189} {"train_loss": -11.60722827911377, "global_step": 199764, "epoch": 1189} {"train_loss": -11.509724617004395, "global_step": 199765, "epoch": 1189} {"train_loss": -11.544891357421875, "global_step": 199766, "epoch": 1189} {"train_loss": -11.199234008789062, "global_step": 199767, "epoch": 1189} {"train_loss": -11.514753341674805, "global_step": 199768, "epoch": 1189} {"train_loss": -11.235771179199219, "global_step": 199769, "epoch": 1189} {"train_loss": -11.597370147705078, "global_step": 199770, "epoch": 1189} {"train_loss": -11.623416900634766, "global_step": 199771, "epoch": 1189} {"train_loss": -11.272978782653809, "global_step": 199772, "epoch": 1189} {"train_loss": -11.0531644821167, "global_step": 199773, "epoch": 1189} {"train_loss": -11.61271858215332, "global_step": 199774, "epoch": 1189} {"train_loss": -11.205252647399902, "global_step": 199775, "epoch": 1189} {"train_loss": -11.398409843444824, "global_step": 199776, "epoch": 1189} {"train_loss": -11.44539737701416, "global_step": 199777, "epoch": 1189} {"train_loss": -11.47357177734375, "global_step": 199778, "epoch": 1189} {"train_loss": -10.598587036132812, "global_step": 199779, "epoch": 1189} {"train_loss": -11.576740264892578, "global_step": 199780, "epoch": 1189} {"train_loss": -9.928064346313477, "global_step": 199781, "epoch": 1189} {"train_loss": -11.018298149108887, "global_step": 199782, "epoch": 1189} {"train_loss": -10.331604957580566, "global_step": 199783, "epoch": 1189} {"train_loss": -10.542596817016602, "global_step": 199784, "epoch": 1189} {"train_loss": -10.712400436401367, "global_step": 199785, "epoch": 1189} {"train_loss": -11.037582397460938, "global_step": 199786, "epoch": 1189} {"train_loss": -10.625880241394043, "global_step": 199787, "epoch": 1189} {"train_loss": -11.00625991821289, "global_step": 199788, "epoch": 1189} {"train_loss": -10.769344329833984, "global_step": 199789, "epoch": 1189} {"train_loss": -10.487722396850586, "global_step": 199790, "epoch": 1189} {"train_loss": -10.942861557006836, "global_step": 199791, "epoch": 1189} {"train_loss": -10.65744400024414, "global_step": 199792, "epoch": 1189} {"train_loss": -10.552417755126953, "global_step": 199793, "epoch": 1189} {"train_loss": -10.77379035949707, "global_step": 199794, "epoch": 1189} {"train_loss": -10.796576499938965, "global_step": 199795, "epoch": 1189} {"train_loss": -11.352676391601562, "global_step": 199796, "epoch": 1189} {"train_loss": -10.897079467773438, "global_step": 199797, "epoch": 1189} {"train_loss": -11.079425811767578, "global_step": 199798, "epoch": 1189} {"train_loss": -11.264226913452148, "global_step": 199799, "epoch": 1189} {"train_loss": -11.078577041625977, "global_step": 199800, "epoch": 1189} {"train_loss": -11.251625061035156, "global_step": 199801, "epoch": 1189} {"train_loss": -11.290966033935547, "global_step": 199802, "epoch": 1189} {"train_loss": -11.221923828125, "global_step": 199803, "epoch": 1189} {"train_loss": -10.781265258789062, "global_step": 199804, "epoch": 1189} {"train_loss": -11.106816291809082, "global_step": 199805, "epoch": 1189} {"train_loss": -10.83802318572998, "global_step": 199806, "epoch": 1189} {"train_loss": -10.976609230041504, "global_step": 199807, "epoch": 1189} {"train_loss": -10.603050231933594, "global_step": 199808, "epoch": 1189} {"train_loss": -11.225632667541504, "global_step": 199809, "epoch": 1189} {"train_loss": -10.627020835876465, "global_step": 199810, "epoch": 1189} {"train_loss": -11.310312271118164, "global_step": 199811, "epoch": 1189} {"train_loss": -11.10745620727539, "global_step": 199812, "epoch": 1189} {"train_loss": -11.135931968688965, "global_step": 199813, "epoch": 1189} {"train_loss": -11.186151504516602, "global_step": 199814, "epoch": 1189} {"train_loss": -11.237289428710938, "global_step": 199815, "epoch": 1189} {"train_loss": -11.202201843261719, "global_step": 199816, "epoch": 1189} {"train_loss": -11.334147453308105, "global_step": 199817, "epoch": 1189} {"train_loss": -11.444595336914062, "global_step": 199818, "epoch": 1189} {"train_loss": -11.536847114562988, "global_step": 199819, "epoch": 1189} {"train_loss": -11.330528259277344, "global_step": 199820, "epoch": 1189} {"train_loss": -11.610862731933594, "global_step": 199821, "epoch": 1189} {"train_loss": -11.3723726272583, "global_step": 199822, "epoch": 1189} {"train_loss": -11.440620422363281, "global_step": 199823, "epoch": 1189} {"train_loss": -11.611102104187012, "global_step": 199824, "epoch": 1189} {"train_loss": -11.262434005737305, "global_step": 199825, "epoch": 1189} {"train_loss": -11.424274444580078, "global_step": 199826, "epoch": 1189} {"train_loss": -11.371026992797852, "global_step": 199827, "epoch": 1189} {"train_loss": -11.356218338012695, "global_step": 199828, "epoch": 1189} {"train_loss": -11.401823043823242, "global_step": 199829, "epoch": 1189} {"train_loss": -11.62908935546875, "global_step": 199830, "epoch": 1189} {"train_loss": -11.770078659057617, "global_step": 199831, "epoch": 1189} {"train_loss": -11.584583282470703, "global_step": 199832, "epoch": 1189} {"train_loss": -11.675710678100586, "global_step": 199833, "epoch": 1189} {"train_loss": -11.724292755126953, "global_step": 199834, "epoch": 1189} {"train_loss": -11.47684097290039, "global_step": 199835, "epoch": 1189} {"train_loss": -11.54864501953125, "global_step": 199836, "epoch": 1189} {"train_loss": -11.752220153808594, "global_step": 199837, "epoch": 1189} {"train_loss": -11.771995544433594, "global_step": 199838, "epoch": 1189} {"train_loss": -11.510795593261719, "global_step": 199839, "epoch": 1189} {"train_loss": -11.79278564453125, "global_step": 199840, "epoch": 1189} {"train_loss": -11.63188362121582, "global_step": 199841, "epoch": 1189} {"train_loss": -11.811634063720703, "global_step": 199842, "epoch": 1189} {"train_loss": -11.656097412109375, "global_step": 199843, "epoch": 1189} {"train_loss": -11.730371475219727, "global_step": 199844, "epoch": 1189} {"train_loss": -11.82955265045166, "global_step": 199845, "epoch": 1189} {"train_loss": -11.656838417053223, "global_step": 199846, "epoch": 1189} {"train_loss": -11.576486587524414, "global_step": 199847, "epoch": 1189} {"train_loss": -11.873411178588867, "global_step": 199848, "epoch": 1189} {"train_loss": -11.56965446472168, "global_step": 199849, "epoch": 1189} {"train_loss": -11.65319538116455, "global_step": 199850, "epoch": 1189} {"train_loss": -11.858171463012695, "global_step": 199851, "epoch": 1189} {"train_loss": -11.656903266906738, "global_step": 199852, "epoch": 1189} {"train_loss": -11.813833236694336, "global_step": 199853, "epoch": 1189} {"train_loss": -11.65376091003418, "global_step": 199854, "epoch": 1189} {"train_loss": -11.865440368652344, "global_step": 199855, "epoch": 1189} {"train_loss": -11.78940200805664, "global_step": 199856, "epoch": 1189} {"train_loss": -11.834945678710938, "global_step": 199857, "epoch": 1189} {"train_loss": -11.70937728881836, "global_step": 199858, "epoch": 1189} {"train_loss": -11.598309516906738, "global_step": 199859, "epoch": 1189} {"train_loss": -11.669229507446289, "global_step": 199860, "epoch": 1189} {"train_loss": -11.535482406616211, "global_step": 199861, "epoch": 1189} {"train_loss": -11.922429084777832, "global_step": 199862, "epoch": 1189} {"train_loss": -11.288522720336914, "global_step": 199863, "epoch": 1189} {"train_loss": -11.332113265991211, "global_step": 199864, "epoch": 1189} {"train_loss": -11.688275337219238, "global_step": 199865, "epoch": 1189} {"train_loss": -10.902571678161621, "global_step": 199866, "epoch": 1189} {"train_loss": -10.199819564819336, "global_step": 199867, "epoch": 1189} {"train_loss": -10.69951057434082, "global_step": 199868, "epoch": 1189} {"train_loss": -10.97957992553711, "global_step": 199869, "epoch": 1189} {"train_loss": -10.803606033325195, "global_step": 199870, "epoch": 1189} {"train_loss": -11.010991096496582, "global_step": 199871, "epoch": 1189} {"train_loss": -10.626068115234375, "global_step": 199872, "epoch": 1189} {"train_loss": -10.18419361114502, "global_step": 199873, "epoch": 1189} {"train_loss": -11.494821548461914, "global_step": 199874, "epoch": 1189} {"train_loss": -10.505376815795898, "global_step": 199875, "epoch": 1189} {"train_loss": -10.814937591552734, "global_step": 199876, "epoch": 1189} {"train_loss": -10.788132667541504, "global_step": 199877, "epoch": 1189} {"train_loss": -11.207540512084961, "global_step": 199878, "epoch": 1189} {"train_loss": -10.923627853393555, "global_step": 199879, "epoch": 1189} {"train_loss": -10.914976119995117, "global_step": 199880, "epoch": 1189} {"train_loss": -10.977483749389648, "global_step": 199881, "epoch": 1189} {"train_loss": -10.320978164672852, "global_step": 199882, "epoch": 1189} {"train_loss": -11.353075981140137, "global_step": 199883, "epoch": 1189} {"train_loss": -11.018851280212402, "global_step": 199884, "epoch": 1189} {"train_loss": -11.283544540405273, "global_step": 199885, "epoch": 1189} {"train_loss": -11.13014030456543, "global_step": 199886, "epoch": 1189} {"train_loss": -11.147138595581055, "global_step": 199887, "epoch": 1189} {"train_loss": -11.249935150146484, "global_step": 199888, "epoch": 1189} {"train_loss": -11.736772537231445, "global_step": 199889, "epoch": 1189} {"train_loss": -11.331653594970703, "global_step": 199890, "epoch": 1189} {"train_loss": -11.116632461547852, "global_step": 199891, "epoch": 1189} {"train_loss": -11.0172119140625, "global_step": 199892, "epoch": 1189} {"train_loss": -11.102548599243164, "global_step": 199893, "epoch": 1189} {"train_loss": -11.080032348632812, "global_step": 199894, "epoch": 1189} {"train_loss": -11.633478164672852, "global_step": 199895, "epoch": 1189} {"train_loss": -11.578943252563477, "global_step": 199896, "epoch": 1189} {"train_loss": -11.52641773223877, "global_step": 199897, "epoch": 1189} {"train_loss": -11.466765403747559, "global_step": 199898, "epoch": 1189} {"train_loss": -11.428045272827148, "global_step": 199899, "epoch": 1189} {"train_loss": -11.276845932006836, "global_step": 199900, "epoch": 1189} {"train_loss": -11.477745056152344, "global_step": 199901, "epoch": 1189} {"train_loss": -11.473665237426758, "global_step": 199902, "epoch": 1189} {"train_loss": -11.066097259521484, "global_step": 199903, "epoch": 1189} {"train_loss": -11.301969528198242, "global_step": 199904, "epoch": 1189} {"train_loss": -10.687807083129883, "global_step": 199905, "epoch": 1189} {"train_loss": -11.288816452026367, "global_step": 199906, "epoch": 1189} {"train_loss": -11.153963088989258, "global_step": 199907, "epoch": 1189} {"train_loss": -10.99350357055664, "global_step": 199908, "epoch": 1189} {"train_loss": -11.387715339660645, "global_step": 199909, "epoch": 1189} {"train_loss": -11.237382888793945, "global_step": 199910, "epoch": 1189} {"train_loss": -11.161617279052734, "global_step": 199911, "epoch": 1189} {"train_loss": -11.438231468200684, "global_step": 199912, "epoch": 1189} {"train_loss": -11.14447021484375, "global_step": 199913, "epoch": 1189} {"train_loss": -11.454236030578613, "global_step": 199914, "epoch": 1189} {"train_loss": -11.385331153869629, "global_step": 199915, "epoch": 1189} {"train_loss": -11.520151138305664, "global_step": 199916, "epoch": 1189} {"train_loss": -11.544585227966309, "global_step": 199917, "epoch": 1189} {"train_loss": -11.681524276733398, "global_step": 199918, "epoch": 1189} {"train_loss": -11.27270918233054, "global_step": 199919, "epoch": 1189, "val_loss": 254451.34375} {"train_loss": -11.517662048339844, "global_step": 199920, "epoch": 1190} {"train_loss": -11.414690971374512, "global_step": 199921, "epoch": 1190} {"train_loss": -11.444398880004883, "global_step": 199922, "epoch": 1190} {"train_loss": -11.49781608581543, "global_step": 199923, "epoch": 1190} {"train_loss": -11.553996086120605, "global_step": 199924, "epoch": 1190} {"train_loss": -11.67713737487793, "global_step": 199925, "epoch": 1190} {"train_loss": -11.513601303100586, "global_step": 199926, "epoch": 1190} {"train_loss": -11.689409255981445, "global_step": 199927, "epoch": 1190} {"train_loss": -11.547369003295898, "global_step": 199928, "epoch": 1190} {"train_loss": -11.83646011352539, "global_step": 199929, "epoch": 1190} {"train_loss": -11.785255432128906, "global_step": 199930, "epoch": 1190} {"train_loss": -11.486185073852539, "global_step": 199931, "epoch": 1190} {"train_loss": -11.577582359313965, "global_step": 199932, "epoch": 1190} {"train_loss": -11.472434997558594, "global_step": 199933, "epoch": 1190} {"train_loss": -11.64651870727539, "global_step": 199934, "epoch": 1190} {"train_loss": -11.466052055358887, "global_step": 199935, "epoch": 1190} {"train_loss": -11.483650207519531, "global_step": 199936, "epoch": 1190} {"train_loss": -11.475471496582031, "global_step": 199937, "epoch": 1190} {"train_loss": -11.35943603515625, "global_step": 199938, "epoch": 1190} {"train_loss": -10.994949340820312, "global_step": 199939, "epoch": 1190} {"train_loss": -11.746179580688477, "global_step": 199940, "epoch": 1190} {"train_loss": -11.755547523498535, "global_step": 199941, "epoch": 1190} {"train_loss": -11.602508544921875, "global_step": 199942, "epoch": 1190} {"train_loss": -11.223986625671387, "global_step": 199943, "epoch": 1190} {"train_loss": -10.70679759979248, "global_step": 199944, "epoch": 1190} {"train_loss": -11.525064468383789, "global_step": 199945, "epoch": 1190} {"train_loss": -11.160299301147461, "global_step": 199946, "epoch": 1190} {"train_loss": -10.867181777954102, "global_step": 199947, "epoch": 1190} {"train_loss": -11.551862716674805, "global_step": 199948, "epoch": 1190} {"train_loss": -10.564884185791016, "global_step": 199949, "epoch": 1190} {"train_loss": -10.798757553100586, "global_step": 199950, "epoch": 1190} {"train_loss": -11.685791015625, "global_step": 199951, "epoch": 1190} {"train_loss": -11.390214920043945, "global_step": 199952, "epoch": 1190} {"train_loss": -11.108161926269531, "global_step": 199953, "epoch": 1190} {"train_loss": -11.416467666625977, "global_step": 199954, "epoch": 1190} {"train_loss": -11.454887390136719, "global_step": 199955, "epoch": 1190} {"train_loss": -10.879857063293457, "global_step": 199956, "epoch": 1190} {"train_loss": -11.381418228149414, "global_step": 199957, "epoch": 1190} {"train_loss": -11.101081848144531, "global_step": 199958, "epoch": 1190} {"train_loss": -11.089729309082031, "global_step": 199959, "epoch": 1190} {"train_loss": -10.582191467285156, "global_step": 199960, "epoch": 1190} {"train_loss": -11.242324829101562, "global_step": 199961, "epoch": 1190} {"train_loss": -11.023832321166992, "global_step": 199962, "epoch": 1190} {"train_loss": -9.959095001220703, "global_step": 199963, "epoch": 1190} {"train_loss": -10.477044105529785, "global_step": 199964, "epoch": 1190} {"train_loss": -10.258821487426758, "global_step": 199965, "epoch": 1190} {"train_loss": -10.246572494506836, "global_step": 199966, "epoch": 1190} {"train_loss": -8.361370086669922, "global_step": 199967, "epoch": 1190} {"train_loss": -10.34203815460205, "global_step": 199968, "epoch": 1190} {"train_loss": -10.096275329589844, "global_step": 199969, "epoch": 1190} {"train_loss": -9.19584846496582, "global_step": 199970, "epoch": 1190} {"train_loss": -9.98047924041748, "global_step": 199971, "epoch": 1190} {"train_loss": -10.144784927368164, "global_step": 199972, "epoch": 1190} {"train_loss": -10.286188125610352, "global_step": 199973, "epoch": 1190} {"train_loss": -10.458627700805664, "global_step": 199974, "epoch": 1190} {"train_loss": -11.002202987670898, "global_step": 199975, "epoch": 1190} {"train_loss": -10.142398834228516, "global_step": 199976, "epoch": 1190} {"train_loss": -11.084632873535156, "global_step": 199977, "epoch": 1190} {"train_loss": -10.321134567260742, "global_step": 199978, "epoch": 1190} {"train_loss": -10.68805980682373, "global_step": 199979, "epoch": 1190} {"train_loss": -10.780774116516113, "global_step": 199980, "epoch": 1190} {"train_loss": -10.906776428222656, "global_step": 199981, "epoch": 1190} {"train_loss": -11.184455871582031, "global_step": 199982, "epoch": 1190} {"train_loss": -10.965377807617188, "global_step": 199983, "epoch": 1190} {"train_loss": -11.037721633911133, "global_step": 199984, "epoch": 1190} {"train_loss": -11.26500129699707, "global_step": 199985, "epoch": 1190} {"train_loss": -10.66734790802002, "global_step": 199986, "epoch": 1190} {"train_loss": -11.09487533569336, "global_step": 199987, "epoch": 1190} {"train_loss": -10.808393478393555, "global_step": 199988, "epoch": 1190} {"train_loss": -11.017184257507324, "global_step": 199989, "epoch": 1190} {"train_loss": -11.053138732910156, "global_step": 199990, "epoch": 1190} {"train_loss": -10.760159492492676, "global_step": 199991, "epoch": 1190} {"train_loss": -10.448408126831055, "global_step": 199992, "epoch": 1190} {"train_loss": -10.50592041015625, "global_step": 199993, "epoch": 1190} {"train_loss": -10.746001243591309, "global_step": 199994, "epoch": 1190} {"train_loss": -10.581079483032227, "global_step": 199995, "epoch": 1190} {"train_loss": -10.912105560302734, "global_step": 199996, "epoch": 1190} {"train_loss": -10.180574417114258, "global_step": 199997, "epoch": 1190} {"train_loss": -11.362027168273926, "global_step": 199998, "epoch": 1190} {"train_loss": -10.16116714477539, "global_step": 199999, "epoch": 1190} {"train_loss": -11.241779327392578, "global_step": 200000, "epoch": 1190} {"train_loss": -10.63066291809082, "global_step": 200001, "epoch": 1190} {"train_loss": -11.03526782989502, "global_step": 200002, "epoch": 1190} {"train_loss": -10.777793884277344, "global_step": 200003, "epoch": 1190} {"train_loss": -10.934406280517578, "global_step": 200004, "epoch": 1190} {"train_loss": -10.977869033813477, "global_step": 200005, "epoch": 1190} {"train_loss": -10.95088005065918, "global_step": 200006, "epoch": 1190} {"train_loss": -10.994101524353027, "global_step": 200007, "epoch": 1190} {"train_loss": -10.84304141998291, "global_step": 200008, "epoch": 1190} {"train_loss": -10.862712860107422, "global_step": 200009, "epoch": 1190} {"train_loss": -10.9258451461792, "global_step": 200010, "epoch": 1190} {"train_loss": -11.2543363571167, "global_step": 200011, "epoch": 1190} {"train_loss": -11.054030418395996, "global_step": 200012, "epoch": 1190} {"train_loss": -11.397324562072754, "global_step": 200013, "epoch": 1190} {"train_loss": -11.071468353271484, "global_step": 200014, "epoch": 1190} {"train_loss": -11.17507266998291, "global_step": 200015, "epoch": 1190} {"train_loss": -11.216004371643066, "global_step": 200016, "epoch": 1190} {"train_loss": -11.198482513427734, "global_step": 200017, "epoch": 1190} {"train_loss": -11.386317253112793, "global_step": 200018, "epoch": 1190} {"train_loss": -11.256429672241211, "global_step": 200019, "epoch": 1190} {"train_loss": -11.561769485473633, "global_step": 200020, "epoch": 1190} {"train_loss": -11.407205581665039, "global_step": 200021, "epoch": 1190} {"train_loss": -11.02396011352539, "global_step": 200022, "epoch": 1190} {"train_loss": -11.060606002807617, "global_step": 200023, "epoch": 1190} {"train_loss": -11.331525802612305, "global_step": 200024, "epoch": 1190} {"train_loss": -11.391239166259766, "global_step": 200025, "epoch": 1190} {"train_loss": -11.257513046264648, "global_step": 200026, "epoch": 1190} {"train_loss": -11.242711067199707, "global_step": 200027, "epoch": 1190} {"train_loss": -11.554693222045898, "global_step": 200028, "epoch": 1190} {"train_loss": -11.256011962890625, "global_step": 200029, "epoch": 1190} {"train_loss": -11.194746971130371, "global_step": 200030, "epoch": 1190} {"train_loss": -11.350622177124023, "global_step": 200031, "epoch": 1190} {"train_loss": -11.426298141479492, "global_step": 200032, "epoch": 1190} {"train_loss": -11.633393287658691, "global_step": 200033, "epoch": 1190} {"train_loss": -11.470300674438477, "global_step": 200034, "epoch": 1190} {"train_loss": -11.608867645263672, "global_step": 200035, "epoch": 1190} {"train_loss": -11.419713973999023, "global_step": 200036, "epoch": 1190} {"train_loss": -11.540155410766602, "global_step": 200037, "epoch": 1190} {"train_loss": -11.504701614379883, "global_step": 200038, "epoch": 1190} {"train_loss": -11.457417488098145, "global_step": 200039, "epoch": 1190} {"train_loss": -11.371907234191895, "global_step": 200040, "epoch": 1190} {"train_loss": -11.600502014160156, "global_step": 200041, "epoch": 1190} {"train_loss": -11.482843399047852, "global_step": 200042, "epoch": 1190} {"train_loss": -11.33343505859375, "global_step": 200043, "epoch": 1190} {"train_loss": -11.49658203125, "global_step": 200044, "epoch": 1190} {"train_loss": -11.703154563903809, "global_step": 200045, "epoch": 1190} {"train_loss": -11.320913314819336, "global_step": 200046, "epoch": 1190} {"train_loss": -11.350541114807129, "global_step": 200047, "epoch": 1190} {"train_loss": -11.696325302124023, "global_step": 200048, "epoch": 1190} {"train_loss": -11.441275596618652, "global_step": 200049, "epoch": 1190} {"train_loss": -11.620368003845215, "global_step": 200050, "epoch": 1190} {"train_loss": -11.403432846069336, "global_step": 200051, "epoch": 1190} {"train_loss": -10.989859580993652, "global_step": 200052, "epoch": 1190} {"train_loss": -11.268341064453125, "global_step": 200053, "epoch": 1190} {"train_loss": -11.626934051513672, "global_step": 200054, "epoch": 1190} {"train_loss": -11.089829444885254, "global_step": 200055, "epoch": 1190} {"train_loss": -11.417753219604492, "global_step": 200056, "epoch": 1190} {"train_loss": -11.471393585205078, "global_step": 200057, "epoch": 1190} {"train_loss": -11.523198127746582, "global_step": 200058, "epoch": 1190} {"train_loss": -11.781743049621582, "global_step": 200059, "epoch": 1190} {"train_loss": -11.545677185058594, "global_step": 200060, "epoch": 1190} {"train_loss": -11.580326080322266, "global_step": 200061, "epoch": 1190} {"train_loss": -11.342790603637695, "global_step": 200062, "epoch": 1190} {"train_loss": -11.044900894165039, "global_step": 200063, "epoch": 1190} {"train_loss": -11.360816955566406, "global_step": 200064, "epoch": 1190} {"train_loss": -11.397747039794922, "global_step": 200065, "epoch": 1190} {"train_loss": -11.020856857299805, "global_step": 200066, "epoch": 1190} {"train_loss": -11.08119010925293, "global_step": 200067, "epoch": 1190} {"train_loss": -11.209542274475098, "global_step": 200068, "epoch": 1190} {"train_loss": -11.33299446105957, "global_step": 200069, "epoch": 1190} {"train_loss": -11.475166320800781, "global_step": 200070, "epoch": 1190} {"train_loss": -11.461638450622559, "global_step": 200071, "epoch": 1190} {"train_loss": -11.42561149597168, "global_step": 200072, "epoch": 1190} {"train_loss": -11.226907730102539, "global_step": 200073, "epoch": 1190} {"train_loss": -11.311128616333008, "global_step": 200074, "epoch": 1190} {"train_loss": -11.238555908203125, "global_step": 200075, "epoch": 1190} {"train_loss": -11.342012405395508, "global_step": 200076, "epoch": 1190} {"train_loss": -11.390491485595703, "global_step": 200077, "epoch": 1190} {"train_loss": -10.833074569702148, "global_step": 200078, "epoch": 1190} {"train_loss": -11.128373146057129, "global_step": 200079, "epoch": 1190} {"train_loss": -11.172456741333008, "global_step": 200080, "epoch": 1190} {"train_loss": -10.686925888061523, "global_step": 200081, "epoch": 1190} {"train_loss": -10.831555366516113, "global_step": 200082, "epoch": 1190} {"train_loss": -11.599676132202148, "global_step": 200083, "epoch": 1190} {"train_loss": -11.049003601074219, "global_step": 200084, "epoch": 1190} {"train_loss": -11.429248809814453, "global_step": 200085, "epoch": 1190} {"train_loss": -11.292281150817871, "global_step": 200086, "epoch": 1190} {"train_loss": -11.133064690090361, "global_step": 200087, "epoch": 1190, "val_loss": 245234.078125, "train_action_mse_error": 9.742082595825195} {"train_loss": -11.53278636932373, "global_step": 200088, "epoch": 1191} {"train_loss": -10.968965530395508, "global_step": 200089, "epoch": 1191} {"train_loss": -10.729645729064941, "global_step": 200090, "epoch": 1191} {"train_loss": -11.394891738891602, "global_step": 200091, "epoch": 1191} {"train_loss": -10.630287170410156, "global_step": 200092, "epoch": 1191} {"train_loss": -11.32698917388916, "global_step": 200093, "epoch": 1191} {"train_loss": -11.322614669799805, "global_step": 200094, "epoch": 1191} {"train_loss": -11.083481788635254, "global_step": 200095, "epoch": 1191} {"train_loss": -11.509634017944336, "global_step": 200096, "epoch": 1191} {"train_loss": -10.573420524597168, "global_step": 200097, "epoch": 1191} {"train_loss": -11.459915161132812, "global_step": 200098, "epoch": 1191} {"train_loss": -10.236907958984375, "global_step": 200099, "epoch": 1191} {"train_loss": -10.779044151306152, "global_step": 200100, "epoch": 1191} {"train_loss": -10.898513793945312, "global_step": 200101, "epoch": 1191} {"train_loss": -10.879840850830078, "global_step": 200102, "epoch": 1191} {"train_loss": -11.061979293823242, "global_step": 200103, "epoch": 1191} {"train_loss": -10.93474006652832, "global_step": 200104, "epoch": 1191} {"train_loss": -11.228968620300293, "global_step": 200105, "epoch": 1191} {"train_loss": -10.94540786743164, "global_step": 200106, "epoch": 1191} {"train_loss": -10.687938690185547, "global_step": 200107, "epoch": 1191} {"train_loss": -11.264028549194336, "global_step": 200108, "epoch": 1191} {"train_loss": -10.78818130493164, "global_step": 200109, "epoch": 1191} {"train_loss": -11.18909740447998, "global_step": 200110, "epoch": 1191} {"train_loss": -11.184003829956055, "global_step": 200111, "epoch": 1191} {"train_loss": -11.182785987854004, "global_step": 200112, "epoch": 1191} {"train_loss": -11.408924102783203, "global_step": 200113, "epoch": 1191} {"train_loss": -11.253751754760742, "global_step": 200114, "epoch": 1191} {"train_loss": -11.034011840820312, "global_step": 200115, "epoch": 1191} {"train_loss": -11.339516639709473, "global_step": 200116, "epoch": 1191} {"train_loss": -11.274696350097656, "global_step": 200117, "epoch": 1191} {"train_loss": -11.165903091430664, "global_step": 200118, "epoch": 1191} {"train_loss": -11.190210342407227, "global_step": 200119, "epoch": 1191} {"train_loss": -11.110296249389648, "global_step": 200120, "epoch": 1191} {"train_loss": -11.226284980773926, "global_step": 200121, "epoch": 1191} {"train_loss": -10.884507179260254, "global_step": 200122, "epoch": 1191} {"train_loss": -11.298866271972656, "global_step": 200123, "epoch": 1191} {"train_loss": -10.642288208007812, "global_step": 200124, "epoch": 1191} {"train_loss": -11.223430633544922, "global_step": 200125, "epoch": 1191} {"train_loss": -11.169054985046387, "global_step": 200126, "epoch": 1191} {"train_loss": -10.89794921875, "global_step": 200127, "epoch": 1191} {"train_loss": -11.066712379455566, "global_step": 200128, "epoch": 1191} {"train_loss": -11.158529281616211, "global_step": 200129, "epoch": 1191} {"train_loss": -11.426694869995117, "global_step": 200130, "epoch": 1191} {"train_loss": -11.236852645874023, "global_step": 200131, "epoch": 1191} {"train_loss": -11.07905387878418, "global_step": 200132, "epoch": 1191} {"train_loss": -11.50311279296875, "global_step": 200133, "epoch": 1191} {"train_loss": -11.23225212097168, "global_step": 200134, "epoch": 1191} {"train_loss": -11.571062088012695, "global_step": 200135, "epoch": 1191} {"train_loss": -11.093785285949707, "global_step": 200136, "epoch": 1191} {"train_loss": -11.161450386047363, "global_step": 200137, "epoch": 1191} {"train_loss": -11.310455322265625, "global_step": 200138, "epoch": 1191} {"train_loss": -11.262527465820312, "global_step": 200139, "epoch": 1191} {"train_loss": -11.398849487304688, "global_step": 200140, "epoch": 1191} {"train_loss": -11.14706802368164, "global_step": 200141, "epoch": 1191} {"train_loss": -11.738862037658691, "global_step": 200142, "epoch": 1191} {"train_loss": -11.345050811767578, "global_step": 200143, "epoch": 1191} {"train_loss": -11.471837997436523, "global_step": 200144, "epoch": 1191} {"train_loss": -11.780881881713867, "global_step": 200145, "epoch": 1191} {"train_loss": -11.410998344421387, "global_step": 200146, "epoch": 1191} {"train_loss": -11.569828987121582, "global_step": 200147, "epoch": 1191} {"train_loss": -11.463367462158203, "global_step": 200148, "epoch": 1191} {"train_loss": -11.661084175109863, "global_step": 200149, "epoch": 1191} {"train_loss": -11.69996452331543, "global_step": 200150, "epoch": 1191} {"train_loss": -11.444340705871582, "global_step": 200151, "epoch": 1191} {"train_loss": -11.471578598022461, "global_step": 200152, "epoch": 1191} {"train_loss": -11.707878112792969, "global_step": 200153, "epoch": 1191} {"train_loss": -11.640413284301758, "global_step": 200154, "epoch": 1191} {"train_loss": -11.52414321899414, "global_step": 200155, "epoch": 1191} {"train_loss": -11.719870567321777, "global_step": 200156, "epoch": 1191} {"train_loss": -11.419435501098633, "global_step": 200157, "epoch": 1191} {"train_loss": -11.735219955444336, "global_step": 200158, "epoch": 1191} {"train_loss": -11.294636726379395, "global_step": 200159, "epoch": 1191} {"train_loss": -11.645650863647461, "global_step": 200160, "epoch": 1191} {"train_loss": -11.67951774597168, "global_step": 200161, "epoch": 1191} {"train_loss": -11.651217460632324, "global_step": 200162, "epoch": 1191} {"train_loss": -11.654189109802246, "global_step": 200163, "epoch": 1191} {"train_loss": -11.76011848449707, "global_step": 200164, "epoch": 1191} {"train_loss": -11.832120895385742, "global_step": 200165, "epoch": 1191} {"train_loss": -11.57098388671875, "global_step": 200166, "epoch": 1191} {"train_loss": -11.825475692749023, "global_step": 200167, "epoch": 1191} {"train_loss": -11.767570495605469, "global_step": 200168, "epoch": 1191} {"train_loss": -11.581671714782715, "global_step": 200169, "epoch": 1191} {"train_loss": -11.87844181060791, "global_step": 200170, "epoch": 1191} {"train_loss": -11.83041000366211, "global_step": 200171, "epoch": 1191} {"train_loss": -11.987887382507324, "global_step": 200172, "epoch": 1191} {"train_loss": -11.654312133789062, "global_step": 200173, "epoch": 1191} {"train_loss": -11.791481018066406, "global_step": 200174, "epoch": 1191} {"train_loss": -11.851734161376953, "global_step": 200175, "epoch": 1191} {"train_loss": -11.80302619934082, "global_step": 200176, "epoch": 1191} {"train_loss": -11.864903450012207, "global_step": 200177, "epoch": 1191} {"train_loss": -11.704511642456055, "global_step": 200178, "epoch": 1191} {"train_loss": -11.907074928283691, "global_step": 200179, "epoch": 1191} {"train_loss": -11.837276458740234, "global_step": 200180, "epoch": 1191} {"train_loss": -11.979037284851074, "global_step": 200181, "epoch": 1191} {"train_loss": -11.901758193969727, "global_step": 200182, "epoch": 1191} {"train_loss": -11.802751541137695, "global_step": 200183, "epoch": 1191} {"train_loss": -11.76393985748291, "global_step": 200184, "epoch": 1191} {"train_loss": -11.62885856628418, "global_step": 200185, "epoch": 1191} {"train_loss": -11.47493839263916, "global_step": 200186, "epoch": 1191} {"train_loss": -11.402484893798828, "global_step": 200187, "epoch": 1191} {"train_loss": -11.168472290039062, "global_step": 200188, "epoch": 1191} {"train_loss": -11.499306678771973, "global_step": 200189, "epoch": 1191} {"train_loss": -10.868484497070312, "global_step": 200190, "epoch": 1191} {"train_loss": -10.222846031188965, "global_step": 200191, "epoch": 1191} {"train_loss": -10.494659423828125, "global_step": 200192, "epoch": 1191} {"train_loss": -10.705615043640137, "global_step": 200193, "epoch": 1191} {"train_loss": -10.193929672241211, "global_step": 200194, "epoch": 1191} {"train_loss": -9.693272590637207, "global_step": 200195, "epoch": 1191} {"train_loss": -10.37828254699707, "global_step": 200196, "epoch": 1191} {"train_loss": -10.258726119995117, "global_step": 200197, "epoch": 1191} {"train_loss": -10.003145217895508, "global_step": 200198, "epoch": 1191} {"train_loss": -10.302627563476562, "global_step": 200199, "epoch": 1191} {"train_loss": -8.91746711730957, "global_step": 200200, "epoch": 1191} {"train_loss": -10.470032691955566, "global_step": 200201, "epoch": 1191} {"train_loss": -10.325748443603516, "global_step": 200202, "epoch": 1191} {"train_loss": -9.797576904296875, "global_step": 200203, "epoch": 1191} {"train_loss": -11.09430980682373, "global_step": 200204, "epoch": 1191} {"train_loss": -8.370973587036133, "global_step": 200205, "epoch": 1191} {"train_loss": -10.391061782836914, "global_step": 200206, "epoch": 1191} {"train_loss": -9.870606422424316, "global_step": 200207, "epoch": 1191} {"train_loss": -9.98507308959961, "global_step": 200208, "epoch": 1191} {"train_loss": -11.30030632019043, "global_step": 200209, "epoch": 1191} {"train_loss": -9.930464744567871, "global_step": 200210, "epoch": 1191} {"train_loss": -11.096595764160156, "global_step": 200211, "epoch": 1191} {"train_loss": -10.898717880249023, "global_step": 200212, "epoch": 1191} {"train_loss": -10.692317962646484, "global_step": 200213, "epoch": 1191} {"train_loss": -10.833515167236328, "global_step": 200214, "epoch": 1191} {"train_loss": -10.790008544921875, "global_step": 200215, "epoch": 1191} {"train_loss": -11.072671890258789, "global_step": 200216, "epoch": 1191} {"train_loss": -10.754685401916504, "global_step": 200217, "epoch": 1191} {"train_loss": -11.197066307067871, "global_step": 200218, "epoch": 1191} {"train_loss": -10.977960586547852, "global_step": 200219, "epoch": 1191} {"train_loss": -11.091699600219727, "global_step": 200220, "epoch": 1191} {"train_loss": -11.229009628295898, "global_step": 200221, "epoch": 1191} {"train_loss": -10.991776466369629, "global_step": 200222, "epoch": 1191} {"train_loss": -11.015975952148438, "global_step": 200223, "epoch": 1191} {"train_loss": -11.318633079528809, "global_step": 200224, "epoch": 1191} {"train_loss": -11.480775833129883, "global_step": 200225, "epoch": 1191} {"train_loss": -10.99909496307373, "global_step": 200226, "epoch": 1191} {"train_loss": -11.160298347473145, "global_step": 200227, "epoch": 1191} {"train_loss": -11.389997482299805, "global_step": 200228, "epoch": 1191} {"train_loss": -11.29116439819336, "global_step": 200229, "epoch": 1191} {"train_loss": -11.28982162475586, "global_step": 200230, "epoch": 1191} {"train_loss": -11.282917022705078, "global_step": 200231, "epoch": 1191} {"train_loss": -11.238800048828125, "global_step": 200232, "epoch": 1191} {"train_loss": -11.182024955749512, "global_step": 200233, "epoch": 1191} {"train_loss": -11.268712043762207, "global_step": 200234, "epoch": 1191} {"train_loss": -11.602926254272461, "global_step": 200235, "epoch": 1191} {"train_loss": -11.524040222167969, "global_step": 200236, "epoch": 1191} {"train_loss": -11.297151565551758, "global_step": 200237, "epoch": 1191} {"train_loss": -11.205001831054688, "global_step": 200238, "epoch": 1191} {"train_loss": -11.358131408691406, "global_step": 200239, "epoch": 1191} {"train_loss": -11.486529350280762, "global_step": 200240, "epoch": 1191} {"train_loss": -11.285650253295898, "global_step": 200241, "epoch": 1191} {"train_loss": -11.388662338256836, "global_step": 200242, "epoch": 1191} {"train_loss": -11.391704559326172, "global_step": 200243, "epoch": 1191} {"train_loss": -11.665581703186035, "global_step": 200244, "epoch": 1191} {"train_loss": -11.595882415771484, "global_step": 200245, "epoch": 1191} {"train_loss": -11.457171440124512, "global_step": 200246, "epoch": 1191} {"train_loss": -11.378194808959961, "global_step": 200247, "epoch": 1191} {"train_loss": -11.344659805297852, "global_step": 200248, "epoch": 1191} {"train_loss": -11.702522277832031, "global_step": 200249, "epoch": 1191} {"train_loss": -11.432169914245605, "global_step": 200250, "epoch": 1191} {"train_loss": -11.30435562133789, "global_step": 200251, "epoch": 1191} {"train_loss": -11.515325546264648, "global_step": 200252, "epoch": 1191} {"train_loss": -11.54102897644043, "global_step": 200253, "epoch": 1191} {"train_loss": -11.455485343933105, "global_step": 200254, "epoch": 1191} {"train_loss": -11.195547995113191, "global_step": 200255, "epoch": 1191, "val_loss": 245604.90625} {"train_loss": -11.669781684875488, "global_step": 200256, "epoch": 1192} {"train_loss": -11.78076171875, "global_step": 200257, "epoch": 1192} {"train_loss": -11.667930603027344, "global_step": 200258, "epoch": 1192} {"train_loss": -11.67447280883789, "global_step": 200259, "epoch": 1192} {"train_loss": -11.585582733154297, "global_step": 200260, "epoch": 1192} {"train_loss": -11.602140426635742, "global_step": 200261, "epoch": 1192} {"train_loss": -11.792790412902832, "global_step": 200262, "epoch": 1192} {"train_loss": -11.548041343688965, "global_step": 200263, "epoch": 1192} {"train_loss": -11.715351104736328, "global_step": 200264, "epoch": 1192} {"train_loss": -11.814067840576172, "global_step": 200265, "epoch": 1192} {"train_loss": -11.343876838684082, "global_step": 200266, "epoch": 1192} {"train_loss": -11.645808219909668, "global_step": 200267, "epoch": 1192} {"train_loss": -11.616532325744629, "global_step": 200268, "epoch": 1192} {"train_loss": -11.831873893737793, "global_step": 200269, "epoch": 1192} {"train_loss": -11.456436157226562, "global_step": 200270, "epoch": 1192} {"train_loss": -11.552095413208008, "global_step": 200271, "epoch": 1192} {"train_loss": -11.653273582458496, "global_step": 200272, "epoch": 1192} {"train_loss": -11.045001983642578, "global_step": 200273, "epoch": 1192} {"train_loss": -11.475522994995117, "global_step": 200274, "epoch": 1192} {"train_loss": -11.356257438659668, "global_step": 200275, "epoch": 1192} {"train_loss": -11.778398513793945, "global_step": 200276, "epoch": 1192} {"train_loss": -11.64417552947998, "global_step": 200277, "epoch": 1192} {"train_loss": -11.175636291503906, "global_step": 200278, "epoch": 1192} {"train_loss": -11.309983253479004, "global_step": 200279, "epoch": 1192} {"train_loss": -11.718267440795898, "global_step": 200280, "epoch": 1192} {"train_loss": -11.171065330505371, "global_step": 200281, "epoch": 1192} {"train_loss": -11.390185356140137, "global_step": 200282, "epoch": 1192} {"train_loss": -11.545166015625, "global_step": 200283, "epoch": 1192} {"train_loss": -11.017419815063477, "global_step": 200284, "epoch": 1192} {"train_loss": -11.047294616699219, "global_step": 200285, "epoch": 1192} {"train_loss": -11.620916366577148, "global_step": 200286, "epoch": 1192} {"train_loss": -11.285274505615234, "global_step": 200287, "epoch": 1192} {"train_loss": -11.402510643005371, "global_step": 200288, "epoch": 1192} {"train_loss": -11.007364273071289, "global_step": 200289, "epoch": 1192} {"train_loss": -10.888153076171875, "global_step": 200290, "epoch": 1192} {"train_loss": -11.665092468261719, "global_step": 200291, "epoch": 1192} {"train_loss": -11.24439811706543, "global_step": 200292, "epoch": 1192} {"train_loss": -11.391857147216797, "global_step": 200293, "epoch": 1192} {"train_loss": -10.533655166625977, "global_step": 200294, "epoch": 1192} {"train_loss": -10.849944114685059, "global_step": 200295, "epoch": 1192} {"train_loss": -11.487610816955566, "global_step": 200296, "epoch": 1192} {"train_loss": -11.414392471313477, "global_step": 200297, "epoch": 1192} {"train_loss": -10.71601676940918, "global_step": 200298, "epoch": 1192} {"train_loss": -10.474876403808594, "global_step": 200299, "epoch": 1192} {"train_loss": -10.950984001159668, "global_step": 200300, "epoch": 1192} {"train_loss": -11.072726249694824, "global_step": 200301, "epoch": 1192} {"train_loss": -10.866307258605957, "global_step": 200302, "epoch": 1192} {"train_loss": -11.34208869934082, "global_step": 200303, "epoch": 1192} {"train_loss": -11.247011184692383, "global_step": 200304, "epoch": 1192} {"train_loss": -11.021095275878906, "global_step": 200305, "epoch": 1192} {"train_loss": -10.482025146484375, "global_step": 200306, "epoch": 1192} {"train_loss": -11.413477897644043, "global_step": 200307, "epoch": 1192} {"train_loss": -10.28749942779541, "global_step": 200308, "epoch": 1192} {"train_loss": -11.500713348388672, "global_step": 200309, "epoch": 1192} {"train_loss": -10.826730728149414, "global_step": 200310, "epoch": 1192} {"train_loss": -10.648558616638184, "global_step": 200311, "epoch": 1192} {"train_loss": -11.13418960571289, "global_step": 200312, "epoch": 1192} {"train_loss": -10.417802810668945, "global_step": 200313, "epoch": 1192} {"train_loss": -11.246231079101562, "global_step": 200314, "epoch": 1192} {"train_loss": -11.173503875732422, "global_step": 200315, "epoch": 1192} {"train_loss": -11.157454490661621, "global_step": 200316, "epoch": 1192} {"train_loss": -11.359431266784668, "global_step": 200317, "epoch": 1192} {"train_loss": -11.317319869995117, "global_step": 200318, "epoch": 1192} {"train_loss": -11.404378890991211, "global_step": 200319, "epoch": 1192} {"train_loss": -11.310640335083008, "global_step": 200320, "epoch": 1192} {"train_loss": -11.377525329589844, "global_step": 200321, "epoch": 1192} {"train_loss": -11.047128677368164, "global_step": 200322, "epoch": 1192} {"train_loss": -11.332923889160156, "global_step": 200323, "epoch": 1192} {"train_loss": -11.661433219909668, "global_step": 200324, "epoch": 1192} {"train_loss": -11.175043106079102, "global_step": 200325, "epoch": 1192} {"train_loss": -11.319780349731445, "global_step": 200326, "epoch": 1192} {"train_loss": -11.015395164489746, "global_step": 200327, "epoch": 1192} {"train_loss": -11.209515571594238, "global_step": 200328, "epoch": 1192} {"train_loss": -11.059206008911133, "global_step": 200329, "epoch": 1192} {"train_loss": -11.266624450683594, "global_step": 200330, "epoch": 1192} {"train_loss": -11.313539505004883, "global_step": 200331, "epoch": 1192} {"train_loss": -10.939699172973633, "global_step": 200332, "epoch": 1192} {"train_loss": -11.450739860534668, "global_step": 200333, "epoch": 1192} {"train_loss": -11.389409065246582, "global_step": 200334, "epoch": 1192} {"train_loss": -11.451841354370117, "global_step": 200335, "epoch": 1192} {"train_loss": -11.388537406921387, "global_step": 200336, "epoch": 1192} {"train_loss": -11.437298774719238, "global_step": 200337, "epoch": 1192} {"train_loss": -11.093321800231934, "global_step": 200338, "epoch": 1192} {"train_loss": -11.48105525970459, "global_step": 200339, "epoch": 1192} {"train_loss": -11.249777793884277, "global_step": 200340, "epoch": 1192} {"train_loss": -11.485108375549316, "global_step": 200341, "epoch": 1192} {"train_loss": -11.48002815246582, "global_step": 200342, "epoch": 1192} {"train_loss": -11.230656623840332, "global_step": 200343, "epoch": 1192} {"train_loss": -11.587160110473633, "global_step": 200344, "epoch": 1192} {"train_loss": -11.238737106323242, "global_step": 200345, "epoch": 1192} {"train_loss": -11.416202545166016, "global_step": 200346, "epoch": 1192} {"train_loss": -11.339557647705078, "global_step": 200347, "epoch": 1192} {"train_loss": -11.363025665283203, "global_step": 200348, "epoch": 1192} {"train_loss": -10.96511459350586, "global_step": 200349, "epoch": 1192} {"train_loss": -11.51966667175293, "global_step": 200350, "epoch": 1192} {"train_loss": -10.511271476745605, "global_step": 200351, "epoch": 1192} {"train_loss": -11.291682243347168, "global_step": 200352, "epoch": 1192} {"train_loss": -10.958690643310547, "global_step": 200353, "epoch": 1192} {"train_loss": -11.021604537963867, "global_step": 200354, "epoch": 1192} {"train_loss": -11.33114242553711, "global_step": 200355, "epoch": 1192} {"train_loss": -11.227350234985352, "global_step": 200356, "epoch": 1192} {"train_loss": -11.272381782531738, "global_step": 200357, "epoch": 1192} {"train_loss": -11.226114273071289, "global_step": 200358, "epoch": 1192} {"train_loss": -11.31629467010498, "global_step": 200359, "epoch": 1192} {"train_loss": -11.452385902404785, "global_step": 200360, "epoch": 1192} {"train_loss": -11.582727432250977, "global_step": 200361, "epoch": 1192} {"train_loss": -11.513326644897461, "global_step": 200362, "epoch": 1192} {"train_loss": -10.747883796691895, "global_step": 200363, "epoch": 1192} {"train_loss": -11.437871932983398, "global_step": 200364, "epoch": 1192} {"train_loss": -10.784111976623535, "global_step": 200365, "epoch": 1192} {"train_loss": -11.127604484558105, "global_step": 200366, "epoch": 1192} {"train_loss": -11.466115951538086, "global_step": 200367, "epoch": 1192} {"train_loss": -11.10464096069336, "global_step": 200368, "epoch": 1192} {"train_loss": -11.49483585357666, "global_step": 200369, "epoch": 1192} {"train_loss": -11.289148330688477, "global_step": 200370, "epoch": 1192} {"train_loss": -11.425821304321289, "global_step": 200371, "epoch": 1192} {"train_loss": -11.30185317993164, "global_step": 200372, "epoch": 1192} {"train_loss": -11.376444816589355, "global_step": 200373, "epoch": 1192} {"train_loss": -11.284271240234375, "global_step": 200374, "epoch": 1192} {"train_loss": -11.079161643981934, "global_step": 200375, "epoch": 1192} {"train_loss": -10.909468650817871, "global_step": 200376, "epoch": 1192} {"train_loss": -11.012212753295898, "global_step": 200377, "epoch": 1192} {"train_loss": -10.971173286437988, "global_step": 200378, "epoch": 1192} {"train_loss": -10.894902229309082, "global_step": 200379, "epoch": 1192} {"train_loss": -11.304957389831543, "global_step": 200380, "epoch": 1192} {"train_loss": -11.231433868408203, "global_step": 200381, "epoch": 1192} {"train_loss": -10.872112274169922, "global_step": 200382, "epoch": 1192} {"train_loss": -11.47208023071289, "global_step": 200383, "epoch": 1192} {"train_loss": -10.719184875488281, "global_step": 200384, "epoch": 1192} {"train_loss": -10.927478790283203, "global_step": 200385, "epoch": 1192} {"train_loss": -11.199857711791992, "global_step": 200386, "epoch": 1192} {"train_loss": -10.66533088684082, "global_step": 200387, "epoch": 1192} {"train_loss": -11.295429229736328, "global_step": 200388, "epoch": 1192} {"train_loss": -10.83834457397461, "global_step": 200389, "epoch": 1192} {"train_loss": -11.040695190429688, "global_step": 200390, "epoch": 1192} {"train_loss": -11.042379379272461, "global_step": 200391, "epoch": 1192} {"train_loss": -10.48114013671875, "global_step": 200392, "epoch": 1192} {"train_loss": -11.360910415649414, "global_step": 200393, "epoch": 1192} {"train_loss": -10.642906188964844, "global_step": 200394, "epoch": 1192} {"train_loss": -11.091869354248047, "global_step": 200395, "epoch": 1192} {"train_loss": -10.510174751281738, "global_step": 200396, "epoch": 1192} {"train_loss": -11.093111991882324, "global_step": 200397, "epoch": 1192} {"train_loss": -11.310003280639648, "global_step": 200398, "epoch": 1192} {"train_loss": -11.013004302978516, "global_step": 200399, "epoch": 1192} {"train_loss": -11.398313522338867, "global_step": 200400, "epoch": 1192} {"train_loss": -10.691773414611816, "global_step": 200401, "epoch": 1192} {"train_loss": -11.31448745727539, "global_step": 200402, "epoch": 1192} {"train_loss": -10.972601890563965, "global_step": 200403, "epoch": 1192} {"train_loss": -10.603063583374023, "global_step": 200404, "epoch": 1192} {"train_loss": -10.55319881439209, "global_step": 200405, "epoch": 1192} {"train_loss": -10.32033920288086, "global_step": 200406, "epoch": 1192} {"train_loss": -10.312385559082031, "global_step": 200407, "epoch": 1192} {"train_loss": -10.696474075317383, "global_step": 200408, "epoch": 1192} {"train_loss": -11.219671249389648, "global_step": 200409, "epoch": 1192} {"train_loss": -11.206268310546875, "global_step": 200410, "epoch": 1192} {"train_loss": -10.981884956359863, "global_step": 200411, "epoch": 1192} {"train_loss": -11.361847877502441, "global_step": 200412, "epoch": 1192} {"train_loss": -11.310096740722656, "global_step": 200413, "epoch": 1192} {"train_loss": -11.499549865722656, "global_step": 200414, "epoch": 1192} {"train_loss": -11.160673141479492, "global_step": 200415, "epoch": 1192} {"train_loss": -11.135828971862793, "global_step": 200416, "epoch": 1192} {"train_loss": -10.963071823120117, "global_step": 200417, "epoch": 1192} {"train_loss": -11.333415985107422, "global_step": 200418, "epoch": 1192} {"train_loss": -11.118236541748047, "global_step": 200419, "epoch": 1192} {"train_loss": -11.147439956665039, "global_step": 200420, "epoch": 1192} {"train_loss": -11.42031478881836, "global_step": 200421, "epoch": 1192} {"train_loss": -11.319686889648438, "global_step": 200422, "epoch": 1192} {"train_loss": -11.207167284829277, "global_step": 200423, "epoch": 1192, "val_loss": 251222.59375} {"train_loss": -11.403966903686523, "global_step": 200424, "epoch": 1193} {"train_loss": -11.590102195739746, "global_step": 200425, "epoch": 1193} {"train_loss": -11.268970489501953, "global_step": 200426, "epoch": 1193} {"train_loss": -11.235504150390625, "global_step": 200427, "epoch": 1193} {"train_loss": -11.43171501159668, "global_step": 200428, "epoch": 1193} {"train_loss": -11.427644729614258, "global_step": 200429, "epoch": 1193} {"train_loss": -11.267740249633789, "global_step": 200430, "epoch": 1193} {"train_loss": -11.668770790100098, "global_step": 200431, "epoch": 1193} {"train_loss": -11.046183586120605, "global_step": 200432, "epoch": 1193} {"train_loss": -11.718162536621094, "global_step": 200433, "epoch": 1193} {"train_loss": -11.377481460571289, "global_step": 200434, "epoch": 1193} {"train_loss": -11.485434532165527, "global_step": 200435, "epoch": 1193} {"train_loss": -11.382025718688965, "global_step": 200436, "epoch": 1193} {"train_loss": -11.233440399169922, "global_step": 200437, "epoch": 1193} {"train_loss": -11.557899475097656, "global_step": 200438, "epoch": 1193} {"train_loss": -11.308673858642578, "global_step": 200439, "epoch": 1193} {"train_loss": -11.576576232910156, "global_step": 200440, "epoch": 1193} {"train_loss": -11.348549842834473, "global_step": 200441, "epoch": 1193} {"train_loss": -11.465025901794434, "global_step": 200442, "epoch": 1193} {"train_loss": -11.689552307128906, "global_step": 200443, "epoch": 1193} {"train_loss": -11.582983016967773, "global_step": 200444, "epoch": 1193} {"train_loss": -11.531414031982422, "global_step": 200445, "epoch": 1193} {"train_loss": -11.42204475402832, "global_step": 200446, "epoch": 1193} {"train_loss": -11.578849792480469, "global_step": 200447, "epoch": 1193} {"train_loss": -11.47967529296875, "global_step": 200448, "epoch": 1193} {"train_loss": -11.37765121459961, "global_step": 200449, "epoch": 1193} {"train_loss": -11.473427772521973, "global_step": 200450, "epoch": 1193} {"train_loss": -11.386588096618652, "global_step": 200451, "epoch": 1193} {"train_loss": -11.39417839050293, "global_step": 200452, "epoch": 1193} {"train_loss": -11.52733039855957, "global_step": 200453, "epoch": 1193} {"train_loss": -11.334226608276367, "global_step": 200454, "epoch": 1193} {"train_loss": -11.732582092285156, "global_step": 200455, "epoch": 1193} {"train_loss": -11.448137283325195, "global_step": 200456, "epoch": 1193} {"train_loss": -11.275413513183594, "global_step": 200457, "epoch": 1193} {"train_loss": -11.564027786254883, "global_step": 200458, "epoch": 1193} {"train_loss": -11.490621566772461, "global_step": 200459, "epoch": 1193} {"train_loss": -11.278264999389648, "global_step": 200460, "epoch": 1193} {"train_loss": -11.53952407836914, "global_step": 200461, "epoch": 1193} {"train_loss": -11.436254501342773, "global_step": 200462, "epoch": 1193} {"train_loss": -11.128325462341309, "global_step": 200463, "epoch": 1193} {"train_loss": -11.045881271362305, "global_step": 200464, "epoch": 1193} {"train_loss": -11.256593704223633, "global_step": 200465, "epoch": 1193} {"train_loss": -10.693439483642578, "global_step": 200466, "epoch": 1193} {"train_loss": -11.679671287536621, "global_step": 200467, "epoch": 1193} {"train_loss": -11.396316528320312, "global_step": 200468, "epoch": 1193} {"train_loss": -11.244576454162598, "global_step": 200469, "epoch": 1193} {"train_loss": -11.271953582763672, "global_step": 200470, "epoch": 1193} {"train_loss": -11.124727249145508, "global_step": 200471, "epoch": 1193} {"train_loss": -11.595993041992188, "global_step": 200472, "epoch": 1193} {"train_loss": -11.37666130065918, "global_step": 200473, "epoch": 1193} {"train_loss": -11.487678527832031, "global_step": 200474, "epoch": 1193} {"train_loss": -11.372855186462402, "global_step": 200475, "epoch": 1193} {"train_loss": -11.437906265258789, "global_step": 200476, "epoch": 1193} {"train_loss": -11.707834243774414, "global_step": 200477, "epoch": 1193} {"train_loss": -11.570966720581055, "global_step": 200478, "epoch": 1193} {"train_loss": -11.515115737915039, "global_step": 200479, "epoch": 1193} {"train_loss": -11.312538146972656, "global_step": 200480, "epoch": 1193} {"train_loss": -11.737127304077148, "global_step": 200481, "epoch": 1193} {"train_loss": -11.734220504760742, "global_step": 200482, "epoch": 1193} {"train_loss": -11.417226791381836, "global_step": 200483, "epoch": 1193} {"train_loss": -11.695323944091797, "global_step": 200484, "epoch": 1193} {"train_loss": -11.697122573852539, "global_step": 200485, "epoch": 1193} {"train_loss": -11.619352340698242, "global_step": 200486, "epoch": 1193} {"train_loss": -11.542032241821289, "global_step": 200487, "epoch": 1193} {"train_loss": -11.932889938354492, "global_step": 200488, "epoch": 1193} {"train_loss": -11.453192710876465, "global_step": 200489, "epoch": 1193} {"train_loss": -11.276129722595215, "global_step": 200490, "epoch": 1193} {"train_loss": -11.35966682434082, "global_step": 200491, "epoch": 1193} {"train_loss": -11.631575584411621, "global_step": 200492, "epoch": 1193} {"train_loss": -11.583992004394531, "global_step": 200493, "epoch": 1193} {"train_loss": -11.720453262329102, "global_step": 200494, "epoch": 1193} {"train_loss": -11.371543884277344, "global_step": 200495, "epoch": 1193} {"train_loss": -11.487401962280273, "global_step": 200496, "epoch": 1193} {"train_loss": -11.355541229248047, "global_step": 200497, "epoch": 1193} {"train_loss": -11.606215476989746, "global_step": 200498, "epoch": 1193} {"train_loss": -11.75102424621582, "global_step": 200499, "epoch": 1193} {"train_loss": -11.74077033996582, "global_step": 200500, "epoch": 1193} {"train_loss": -11.561811447143555, "global_step": 200501, "epoch": 1193} {"train_loss": -11.041109085083008, "global_step": 200502, "epoch": 1193} {"train_loss": -11.334187507629395, "global_step": 200503, "epoch": 1193} {"train_loss": -11.91724967956543, "global_step": 200504, "epoch": 1193} {"train_loss": -11.67365837097168, "global_step": 200505, "epoch": 1193} {"train_loss": -11.696508407592773, "global_step": 200506, "epoch": 1193} {"train_loss": -11.293625831604004, "global_step": 200507, "epoch": 1193} {"train_loss": -11.699132919311523, "global_step": 200508, "epoch": 1193} {"train_loss": -11.734810829162598, "global_step": 200509, "epoch": 1193} {"train_loss": -11.91657829284668, "global_step": 200510, "epoch": 1193} {"train_loss": -11.63371753692627, "global_step": 200511, "epoch": 1193} {"train_loss": -11.47665786743164, "global_step": 200512, "epoch": 1193} {"train_loss": -11.627362251281738, "global_step": 200513, "epoch": 1193} {"train_loss": -11.626424789428711, "global_step": 200514, "epoch": 1193} {"train_loss": -11.700307846069336, "global_step": 200515, "epoch": 1193} {"train_loss": -11.182303428649902, "global_step": 200516, "epoch": 1193} {"train_loss": -10.854658126831055, "global_step": 200517, "epoch": 1193} {"train_loss": -10.748394012451172, "global_step": 200518, "epoch": 1193} {"train_loss": -10.857105255126953, "global_step": 200519, "epoch": 1193} {"train_loss": -11.37036418914795, "global_step": 200520, "epoch": 1193} {"train_loss": -10.699851989746094, "global_step": 200521, "epoch": 1193} {"train_loss": -8.916484832763672, "global_step": 200522, "epoch": 1193} {"train_loss": -9.911418914794922, "global_step": 200523, "epoch": 1193} {"train_loss": -10.390499114990234, "global_step": 200524, "epoch": 1193} {"train_loss": -9.381755828857422, "global_step": 200525, "epoch": 1193} {"train_loss": -11.176517486572266, "global_step": 200526, "epoch": 1193} {"train_loss": -10.038219451904297, "global_step": 200527, "epoch": 1193} {"train_loss": -9.563037872314453, "global_step": 200528, "epoch": 1193} {"train_loss": -10.585445404052734, "global_step": 200529, "epoch": 1193} {"train_loss": -9.442039489746094, "global_step": 200530, "epoch": 1193} {"train_loss": -10.70699691772461, "global_step": 200531, "epoch": 1193} {"train_loss": -9.548454284667969, "global_step": 200532, "epoch": 1193} {"train_loss": -9.272994995117188, "global_step": 200533, "epoch": 1193} {"train_loss": -9.916905403137207, "global_step": 200534, "epoch": 1193} {"train_loss": -9.173826217651367, "global_step": 200535, "epoch": 1193} {"train_loss": -9.680919647216797, "global_step": 200536, "epoch": 1193} {"train_loss": -10.260443687438965, "global_step": 200537, "epoch": 1193} {"train_loss": -10.258749008178711, "global_step": 200538, "epoch": 1193} {"train_loss": -10.457033157348633, "global_step": 200539, "epoch": 1193} {"train_loss": -10.934890747070312, "global_step": 200540, "epoch": 1193} {"train_loss": -10.24051284790039, "global_step": 200541, "epoch": 1193} {"train_loss": -10.678266525268555, "global_step": 200542, "epoch": 1193} {"train_loss": -10.123977661132812, "global_step": 200543, "epoch": 1193} {"train_loss": -10.539323806762695, "global_step": 200544, "epoch": 1193} {"train_loss": -10.877224922180176, "global_step": 200545, "epoch": 1193} {"train_loss": -10.345584869384766, "global_step": 200546, "epoch": 1193} {"train_loss": -10.663311004638672, "global_step": 200547, "epoch": 1193} {"train_loss": -10.687786102294922, "global_step": 200548, "epoch": 1193} {"train_loss": -11.001289367675781, "global_step": 200549, "epoch": 1193} {"train_loss": -10.892576217651367, "global_step": 200550, "epoch": 1193} {"train_loss": -11.190773010253906, "global_step": 200551, "epoch": 1193} {"train_loss": -10.585630416870117, "global_step": 200552, "epoch": 1193} {"train_loss": -10.594768524169922, "global_step": 200553, "epoch": 1193} {"train_loss": -10.975756645202637, "global_step": 200554, "epoch": 1193} {"train_loss": -10.814776420593262, "global_step": 200555, "epoch": 1193} {"train_loss": -10.864927291870117, "global_step": 200556, "epoch": 1193} {"train_loss": -11.149459838867188, "global_step": 200557, "epoch": 1193} {"train_loss": -10.819831848144531, "global_step": 200558, "epoch": 1193} {"train_loss": -11.156412124633789, "global_step": 200559, "epoch": 1193} {"train_loss": -10.985633850097656, "global_step": 200560, "epoch": 1193} {"train_loss": -11.368860244750977, "global_step": 200561, "epoch": 1193} {"train_loss": -10.696495056152344, "global_step": 200562, "epoch": 1193} {"train_loss": -11.393415451049805, "global_step": 200563, "epoch": 1193} {"train_loss": -11.141133308410645, "global_step": 200564, "epoch": 1193} {"train_loss": -11.393171310424805, "global_step": 200565, "epoch": 1193} {"train_loss": -11.240571975708008, "global_step": 200566, "epoch": 1193} {"train_loss": -11.187183380126953, "global_step": 200567, "epoch": 1193} {"train_loss": -11.067965507507324, "global_step": 200568, "epoch": 1193} {"train_loss": -11.284721374511719, "global_step": 200569, "epoch": 1193} {"train_loss": -11.126344680786133, "global_step": 200570, "epoch": 1193} {"train_loss": -11.160172462463379, "global_step": 200571, "epoch": 1193} {"train_loss": -11.254616737365723, "global_step": 200572, "epoch": 1193} {"train_loss": -11.306151390075684, "global_step": 200573, "epoch": 1193} {"train_loss": -11.420976638793945, "global_step": 200574, "epoch": 1193} {"train_loss": -11.126054763793945, "global_step": 200575, "epoch": 1193} {"train_loss": -11.464092254638672, "global_step": 200576, "epoch": 1193} {"train_loss": -11.229402542114258, "global_step": 200577, "epoch": 1193} {"train_loss": -11.263280868530273, "global_step": 200578, "epoch": 1193} {"train_loss": -11.294076919555664, "global_step": 200579, "epoch": 1193} {"train_loss": -11.436854362487793, "global_step": 200580, "epoch": 1193} {"train_loss": -11.508673667907715, "global_step": 200581, "epoch": 1193} {"train_loss": -11.56628704071045, "global_step": 200582, "epoch": 1193} {"train_loss": -11.394550323486328, "global_step": 200583, "epoch": 1193} {"train_loss": -11.388518333435059, "global_step": 200584, "epoch": 1193} {"train_loss": -11.569597244262695, "global_step": 200585, "epoch": 1193} {"train_loss": -11.468476295471191, "global_step": 200586, "epoch": 1193} {"train_loss": -11.463367462158203, "global_step": 200587, "epoch": 1193} {"train_loss": -11.480481147766113, "global_step": 200588, "epoch": 1193} {"train_loss": -11.523856163024902, "global_step": 200589, "epoch": 1193} {"train_loss": -11.521261215209961, "global_step": 200590, "epoch": 1193} {"train_loss": -11.176901374544416, "global_step": 200591, "epoch": 1193, "val_loss": 252249.6875} {"train_loss": -11.504343032836914, "global_step": 200592, "epoch": 1194} {"train_loss": -11.404781341552734, "global_step": 200593, "epoch": 1194} {"train_loss": -11.617258071899414, "global_step": 200594, "epoch": 1194} {"train_loss": -11.604473114013672, "global_step": 200595, "epoch": 1194} {"train_loss": -11.623306274414062, "global_step": 200596, "epoch": 1194} {"train_loss": -11.65719985961914, "global_step": 200597, "epoch": 1194} {"train_loss": -11.630939483642578, "global_step": 200598, "epoch": 1194} {"train_loss": -11.599224090576172, "global_step": 200599, "epoch": 1194} {"train_loss": -11.710298538208008, "global_step": 200600, "epoch": 1194} {"train_loss": -11.503799438476562, "global_step": 200601, "epoch": 1194} {"train_loss": -11.504911422729492, "global_step": 200602, "epoch": 1194} {"train_loss": -11.50450325012207, "global_step": 200603, "epoch": 1194} {"train_loss": -11.653680801391602, "global_step": 200604, "epoch": 1194} {"train_loss": -11.447561264038086, "global_step": 200605, "epoch": 1194} {"train_loss": -11.363536834716797, "global_step": 200606, "epoch": 1194} {"train_loss": -11.784629821777344, "global_step": 200607, "epoch": 1194} {"train_loss": -11.69456672668457, "global_step": 200608, "epoch": 1194} {"train_loss": -11.730178833007812, "global_step": 200609, "epoch": 1194} {"train_loss": -11.30579948425293, "global_step": 200610, "epoch": 1194} {"train_loss": -11.787260055541992, "global_step": 200611, "epoch": 1194} {"train_loss": -11.017786026000977, "global_step": 200612, "epoch": 1194} {"train_loss": -11.20665168762207, "global_step": 200613, "epoch": 1194} {"train_loss": -11.741181373596191, "global_step": 200614, "epoch": 1194} {"train_loss": -11.568954467773438, "global_step": 200615, "epoch": 1194} {"train_loss": -11.407560348510742, "global_step": 200616, "epoch": 1194} {"train_loss": -11.417197227478027, "global_step": 200617, "epoch": 1194} {"train_loss": -11.514031410217285, "global_step": 200618, "epoch": 1194} {"train_loss": -11.512632369995117, "global_step": 200619, "epoch": 1194} {"train_loss": -11.410497665405273, "global_step": 200620, "epoch": 1194} {"train_loss": -11.462854385375977, "global_step": 200621, "epoch": 1194} {"train_loss": -11.828570365905762, "global_step": 200622, "epoch": 1194} {"train_loss": -11.474153518676758, "global_step": 200623, "epoch": 1194} {"train_loss": -11.688583374023438, "global_step": 200624, "epoch": 1194} {"train_loss": -11.453598022460938, "global_step": 200625, "epoch": 1194} {"train_loss": -11.66046142578125, "global_step": 200626, "epoch": 1194} {"train_loss": -11.107863426208496, "global_step": 200627, "epoch": 1194} {"train_loss": -11.460244178771973, "global_step": 200628, "epoch": 1194} {"train_loss": -11.514969825744629, "global_step": 200629, "epoch": 1194} {"train_loss": -11.162839889526367, "global_step": 200630, "epoch": 1194} {"train_loss": -11.218893051147461, "global_step": 200631, "epoch": 1194} {"train_loss": -10.96513557434082, "global_step": 200632, "epoch": 1194} {"train_loss": -11.185546875, "global_step": 200633, "epoch": 1194} {"train_loss": -10.480437278747559, "global_step": 200634, "epoch": 1194} {"train_loss": -10.764669418334961, "global_step": 200635, "epoch": 1194} {"train_loss": -10.358743667602539, "global_step": 200636, "epoch": 1194} {"train_loss": -11.2535982131958, "global_step": 200637, "epoch": 1194} {"train_loss": -9.994274139404297, "global_step": 200638, "epoch": 1194} {"train_loss": -11.030706405639648, "global_step": 200639, "epoch": 1194} {"train_loss": -10.515646934509277, "global_step": 200640, "epoch": 1194} {"train_loss": -10.924333572387695, "global_step": 200641, "epoch": 1194} {"train_loss": -10.932509422302246, "global_step": 200642, "epoch": 1194} {"train_loss": -10.961261749267578, "global_step": 200643, "epoch": 1194} {"train_loss": -11.184870719909668, "global_step": 200644, "epoch": 1194} {"train_loss": -10.539501190185547, "global_step": 200645, "epoch": 1194} {"train_loss": -11.314842224121094, "global_step": 200646, "epoch": 1194} {"train_loss": -10.743041038513184, "global_step": 200647, "epoch": 1194} {"train_loss": -10.733412742614746, "global_step": 200648, "epoch": 1194} {"train_loss": -10.794788360595703, "global_step": 200649, "epoch": 1194} {"train_loss": -11.308675765991211, "global_step": 200650, "epoch": 1194} {"train_loss": -11.182807922363281, "global_step": 200651, "epoch": 1194} {"train_loss": -11.201231002807617, "global_step": 200652, "epoch": 1194} {"train_loss": -10.975330352783203, "global_step": 200653, "epoch": 1194} {"train_loss": -10.664772033691406, "global_step": 200654, "epoch": 1194} {"train_loss": -10.985295295715332, "global_step": 200655, "epoch": 1194} {"train_loss": -10.606868743896484, "global_step": 200656, "epoch": 1194} {"train_loss": -10.75282096862793, "global_step": 200657, "epoch": 1194} {"train_loss": -11.05561637878418, "global_step": 200658, "epoch": 1194} {"train_loss": -10.42795181274414, "global_step": 200659, "epoch": 1194} {"train_loss": -10.849349975585938, "global_step": 200660, "epoch": 1194} {"train_loss": -10.23007583618164, "global_step": 200661, "epoch": 1194} {"train_loss": -11.125726699829102, "global_step": 200662, "epoch": 1194} {"train_loss": -10.417394638061523, "global_step": 200663, "epoch": 1194} {"train_loss": -11.164731979370117, "global_step": 200664, "epoch": 1194} {"train_loss": -10.015228271484375, "global_step": 200665, "epoch": 1194} {"train_loss": -11.14162540435791, "global_step": 200666, "epoch": 1194} {"train_loss": -10.605060577392578, "global_step": 200667, "epoch": 1194} {"train_loss": -10.823734283447266, "global_step": 200668, "epoch": 1194} {"train_loss": -10.675012588500977, "global_step": 200669, "epoch": 1194} {"train_loss": -10.796524047851562, "global_step": 200670, "epoch": 1194} {"train_loss": -10.806442260742188, "global_step": 200671, "epoch": 1194} {"train_loss": -10.641266822814941, "global_step": 200672, "epoch": 1194} {"train_loss": -11.184144973754883, "global_step": 200673, "epoch": 1194} {"train_loss": -10.800468444824219, "global_step": 200674, "epoch": 1194} {"train_loss": -11.330069541931152, "global_step": 200675, "epoch": 1194} {"train_loss": -11.115270614624023, "global_step": 200676, "epoch": 1194} {"train_loss": -11.155336380004883, "global_step": 200677, "epoch": 1194} {"train_loss": -11.430512428283691, "global_step": 200678, "epoch": 1194} {"train_loss": -11.25243854522705, "global_step": 200679, "epoch": 1194} {"train_loss": -11.030234336853027, "global_step": 200680, "epoch": 1194} {"train_loss": -11.244626998901367, "global_step": 200681, "epoch": 1194} {"train_loss": -11.308919906616211, "global_step": 200682, "epoch": 1194} {"train_loss": -11.248214721679688, "global_step": 200683, "epoch": 1194} {"train_loss": -11.537206649780273, "global_step": 200684, "epoch": 1194} {"train_loss": -11.578961372375488, "global_step": 200685, "epoch": 1194} {"train_loss": -11.505807876586914, "global_step": 200686, "epoch": 1194} {"train_loss": -11.643336296081543, "global_step": 200687, "epoch": 1194} {"train_loss": -11.428569793701172, "global_step": 200688, "epoch": 1194} {"train_loss": -11.307182312011719, "global_step": 200689, "epoch": 1194} {"train_loss": -11.336651802062988, "global_step": 200690, "epoch": 1194} {"train_loss": -11.487380981445312, "global_step": 200691, "epoch": 1194} {"train_loss": -11.610252380371094, "global_step": 200692, "epoch": 1194} {"train_loss": -11.553112030029297, "global_step": 200693, "epoch": 1194} {"train_loss": -11.43445873260498, "global_step": 200694, "epoch": 1194} {"train_loss": -11.528877258300781, "global_step": 200695, "epoch": 1194} {"train_loss": -11.27574634552002, "global_step": 200696, "epoch": 1194} {"train_loss": -11.768774032592773, "global_step": 200697, "epoch": 1194} {"train_loss": -11.329585075378418, "global_step": 200698, "epoch": 1194} {"train_loss": -11.390578269958496, "global_step": 200699, "epoch": 1194} {"train_loss": -11.14803695678711, "global_step": 200700, "epoch": 1194} {"train_loss": -11.513870239257812, "global_step": 200701, "epoch": 1194} {"train_loss": -11.241817474365234, "global_step": 200702, "epoch": 1194} {"train_loss": -11.346074104309082, "global_step": 200703, "epoch": 1194} {"train_loss": -11.723888397216797, "global_step": 200704, "epoch": 1194} {"train_loss": -11.031265258789062, "global_step": 200705, "epoch": 1194} {"train_loss": -11.61421012878418, "global_step": 200706, "epoch": 1194} {"train_loss": -11.381561279296875, "global_step": 200707, "epoch": 1194} {"train_loss": -11.440744400024414, "global_step": 200708, "epoch": 1194} {"train_loss": -11.235026359558105, "global_step": 200709, "epoch": 1194} {"train_loss": -11.33718490600586, "global_step": 200710, "epoch": 1194} {"train_loss": -11.271682739257812, "global_step": 200711, "epoch": 1194} {"train_loss": -11.444868087768555, "global_step": 200712, "epoch": 1194} {"train_loss": -11.165416717529297, "global_step": 200713, "epoch": 1194} {"train_loss": -11.556818008422852, "global_step": 200714, "epoch": 1194} {"train_loss": -10.85947036743164, "global_step": 200715, "epoch": 1194} {"train_loss": -11.26321792602539, "global_step": 200716, "epoch": 1194} {"train_loss": -11.306695938110352, "global_step": 200717, "epoch": 1194} {"train_loss": -11.053274154663086, "global_step": 200718, "epoch": 1194} {"train_loss": -11.383649826049805, "global_step": 200719, "epoch": 1194} {"train_loss": -10.7640380859375, "global_step": 200720, "epoch": 1194} {"train_loss": -11.465225219726562, "global_step": 200721, "epoch": 1194} {"train_loss": -10.967529296875, "global_step": 200722, "epoch": 1194} {"train_loss": -10.747119903564453, "global_step": 200723, "epoch": 1194} {"train_loss": -11.437749862670898, "global_step": 200724, "epoch": 1194} {"train_loss": -11.022517204284668, "global_step": 200725, "epoch": 1194} {"train_loss": -11.329996109008789, "global_step": 200726, "epoch": 1194} {"train_loss": -10.740970611572266, "global_step": 200727, "epoch": 1194} {"train_loss": -11.170293807983398, "global_step": 200728, "epoch": 1194} {"train_loss": -10.810968399047852, "global_step": 200729, "epoch": 1194} {"train_loss": -11.282642364501953, "global_step": 200730, "epoch": 1194} {"train_loss": -10.937677383422852, "global_step": 200731, "epoch": 1194} {"train_loss": -11.478132247924805, "global_step": 200732, "epoch": 1194} {"train_loss": -11.076997756958008, "global_step": 200733, "epoch": 1194} {"train_loss": -11.219476699829102, "global_step": 200734, "epoch": 1194} {"train_loss": -11.470865249633789, "global_step": 200735, "epoch": 1194} {"train_loss": -11.17050552368164, "global_step": 200736, "epoch": 1194} {"train_loss": -11.230236053466797, "global_step": 200737, "epoch": 1194} {"train_loss": -10.899665832519531, "global_step": 200738, "epoch": 1194} {"train_loss": -11.380402565002441, "global_step": 200739, "epoch": 1194} {"train_loss": -10.807721138000488, "global_step": 200740, "epoch": 1194} {"train_loss": -11.443334579467773, "global_step": 200741, "epoch": 1194} {"train_loss": -11.19359016418457, "global_step": 200742, "epoch": 1194} {"train_loss": -11.603792190551758, "global_step": 200743, "epoch": 1194} {"train_loss": -11.2901611328125, "global_step": 200744, "epoch": 1194} {"train_loss": -11.392597198486328, "global_step": 200745, "epoch": 1194} {"train_loss": -11.490005493164062, "global_step": 200746, "epoch": 1194} {"train_loss": -11.540242195129395, "global_step": 200747, "epoch": 1194} {"train_loss": -11.401768684387207, "global_step": 200748, "epoch": 1194} {"train_loss": -11.391840934753418, "global_step": 200749, "epoch": 1194} {"train_loss": -11.592096328735352, "global_step": 200750, "epoch": 1194} {"train_loss": -11.760906219482422, "global_step": 200751, "epoch": 1194} {"train_loss": -11.63167953491211, "global_step": 200752, "epoch": 1194} {"train_loss": -11.512582778930664, "global_step": 200753, "epoch": 1194} {"train_loss": -11.540754318237305, "global_step": 200754, "epoch": 1194} {"train_loss": -11.66586685180664, "global_step": 200755, "epoch": 1194} {"train_loss": -11.622447967529297, "global_step": 200756, "epoch": 1194} {"train_loss": -11.677677154541016, "global_step": 200757, "epoch": 1194} {"train_loss": -11.691251754760742, "global_step": 200758, "epoch": 1194} {"train_loss": -11.24534169265202, "global_step": 200759, "epoch": 1194, "val_loss": 252705.140625} {"train_loss": -11.874639511108398, "global_step": 200760, "epoch": 1195} {"train_loss": -11.48504638671875, "global_step": 200761, "epoch": 1195} {"train_loss": -11.619278907775879, "global_step": 200762, "epoch": 1195} {"train_loss": -11.605218887329102, "global_step": 200763, "epoch": 1195} {"train_loss": -11.857499122619629, "global_step": 200764, "epoch": 1195} {"train_loss": -11.61705493927002, "global_step": 200765, "epoch": 1195} {"train_loss": -11.646299362182617, "global_step": 200766, "epoch": 1195} {"train_loss": -11.807342529296875, "global_step": 200767, "epoch": 1195} {"train_loss": -11.78073501586914, "global_step": 200768, "epoch": 1195} {"train_loss": -11.617717742919922, "global_step": 200769, "epoch": 1195} {"train_loss": -11.649659156799316, "global_step": 200770, "epoch": 1195} {"train_loss": -11.801593780517578, "global_step": 200771, "epoch": 1195} {"train_loss": -11.610809326171875, "global_step": 200772, "epoch": 1195} {"train_loss": -11.843626022338867, "global_step": 200773, "epoch": 1195} {"train_loss": -11.382570266723633, "global_step": 200774, "epoch": 1195} {"train_loss": -11.557611465454102, "global_step": 200775, "epoch": 1195} {"train_loss": -11.509096145629883, "global_step": 200776, "epoch": 1195} {"train_loss": -11.2711181640625, "global_step": 200777, "epoch": 1195} {"train_loss": -11.759090423583984, "global_step": 200778, "epoch": 1195} {"train_loss": -11.876134872436523, "global_step": 200779, "epoch": 1195} {"train_loss": -11.855535507202148, "global_step": 200780, "epoch": 1195} {"train_loss": -11.766403198242188, "global_step": 200781, "epoch": 1195} {"train_loss": -11.661418914794922, "global_step": 200782, "epoch": 1195} {"train_loss": -11.336563110351562, "global_step": 200783, "epoch": 1195} {"train_loss": -11.708759307861328, "global_step": 200784, "epoch": 1195} {"train_loss": -11.783246994018555, "global_step": 200785, "epoch": 1195} {"train_loss": -11.477289199829102, "global_step": 200786, "epoch": 1195} {"train_loss": -11.26296615600586, "global_step": 200787, "epoch": 1195} {"train_loss": -11.138692855834961, "global_step": 200788, "epoch": 1195} {"train_loss": -11.320243835449219, "global_step": 200789, "epoch": 1195} {"train_loss": -11.015620231628418, "global_step": 200790, "epoch": 1195} {"train_loss": -11.034514427185059, "global_step": 200791, "epoch": 1195} {"train_loss": -10.800121307373047, "global_step": 200792, "epoch": 1195} {"train_loss": -11.7960205078125, "global_step": 200793, "epoch": 1195} {"train_loss": -11.05309772491455, "global_step": 200794, "epoch": 1195} {"train_loss": -11.261479377746582, "global_step": 200795, "epoch": 1195} {"train_loss": -10.23088264465332, "global_step": 200796, "epoch": 1195} {"train_loss": -11.336934089660645, "global_step": 200797, "epoch": 1195} {"train_loss": -11.102943420410156, "global_step": 200798, "epoch": 1195} {"train_loss": -11.580416679382324, "global_step": 200799, "epoch": 1195} {"train_loss": -10.732040405273438, "global_step": 200800, "epoch": 1195} {"train_loss": -11.663734436035156, "global_step": 200801, "epoch": 1195} {"train_loss": -10.739340782165527, "global_step": 200802, "epoch": 1195} {"train_loss": -11.182669639587402, "global_step": 200803, "epoch": 1195} {"train_loss": -10.985003471374512, "global_step": 200804, "epoch": 1195} {"train_loss": -11.285158157348633, "global_step": 200805, "epoch": 1195} {"train_loss": -10.83535099029541, "global_step": 200806, "epoch": 1195} {"train_loss": -11.52679443359375, "global_step": 200807, "epoch": 1195} {"train_loss": -10.996611595153809, "global_step": 200808, "epoch": 1195} {"train_loss": -11.738737106323242, "global_step": 200809, "epoch": 1195} {"train_loss": -11.042673110961914, "global_step": 200810, "epoch": 1195} {"train_loss": -10.989152908325195, "global_step": 200811, "epoch": 1195} {"train_loss": -11.102596282958984, "global_step": 200812, "epoch": 1195} {"train_loss": -10.884843826293945, "global_step": 200813, "epoch": 1195} {"train_loss": -11.241673469543457, "global_step": 200814, "epoch": 1195} {"train_loss": -11.244991302490234, "global_step": 200815, "epoch": 1195} {"train_loss": -11.209112167358398, "global_step": 200816, "epoch": 1195} {"train_loss": -11.673635482788086, "global_step": 200817, "epoch": 1195} {"train_loss": -10.64406681060791, "global_step": 200818, "epoch": 1195} {"train_loss": -11.451556205749512, "global_step": 200819, "epoch": 1195} {"train_loss": -10.689151763916016, "global_step": 200820, "epoch": 1195} {"train_loss": -11.143930435180664, "global_step": 200821, "epoch": 1195} {"train_loss": -11.091245651245117, "global_step": 200822, "epoch": 1195} {"train_loss": -11.449091911315918, "global_step": 200823, "epoch": 1195} {"train_loss": -11.554710388183594, "global_step": 200824, "epoch": 1195} {"train_loss": -10.806817054748535, "global_step": 200825, "epoch": 1195} {"train_loss": -11.606722831726074, "global_step": 200826, "epoch": 1195} {"train_loss": -11.035572052001953, "global_step": 200827, "epoch": 1195} {"train_loss": -11.456958770751953, "global_step": 200828, "epoch": 1195} {"train_loss": -11.263659477233887, "global_step": 200829, "epoch": 1195} {"train_loss": -11.089296340942383, "global_step": 200830, "epoch": 1195} {"train_loss": -11.463813781738281, "global_step": 200831, "epoch": 1195} {"train_loss": -11.069242477416992, "global_step": 200832, "epoch": 1195} {"train_loss": -11.61368179321289, "global_step": 200833, "epoch": 1195} {"train_loss": -11.618795394897461, "global_step": 200834, "epoch": 1195} {"train_loss": -11.679100036621094, "global_step": 200835, "epoch": 1195} {"train_loss": -11.729870796203613, "global_step": 200836, "epoch": 1195} {"train_loss": -11.468338012695312, "global_step": 200837, "epoch": 1195} {"train_loss": -11.643342971801758, "global_step": 200838, "epoch": 1195} {"train_loss": -11.51446533203125, "global_step": 200839, "epoch": 1195} {"train_loss": -11.37428092956543, "global_step": 200840, "epoch": 1195} {"train_loss": -11.64849853515625, "global_step": 200841, "epoch": 1195} {"train_loss": -11.67153549194336, "global_step": 200842, "epoch": 1195} {"train_loss": -11.806307792663574, "global_step": 200843, "epoch": 1195} {"train_loss": -11.203559875488281, "global_step": 200844, "epoch": 1195} {"train_loss": -11.611820220947266, "global_step": 200845, "epoch": 1195} {"train_loss": -11.49217414855957, "global_step": 200846, "epoch": 1195} {"train_loss": -11.710753440856934, "global_step": 200847, "epoch": 1195} {"train_loss": -11.479284286499023, "global_step": 200848, "epoch": 1195} {"train_loss": -11.28455638885498, "global_step": 200849, "epoch": 1195} {"train_loss": -11.355060577392578, "global_step": 200850, "epoch": 1195} {"train_loss": -10.941265106201172, "global_step": 200851, "epoch": 1195} {"train_loss": -11.534981727600098, "global_step": 200852, "epoch": 1195} {"train_loss": -10.909319877624512, "global_step": 200853, "epoch": 1195} {"train_loss": -11.182806015014648, "global_step": 200854, "epoch": 1195} {"train_loss": -11.270280838012695, "global_step": 200855, "epoch": 1195} {"train_loss": -11.344240188598633, "global_step": 200856, "epoch": 1195} {"train_loss": -10.760551452636719, "global_step": 200857, "epoch": 1195} {"train_loss": -11.057830810546875, "global_step": 200858, "epoch": 1195} {"train_loss": -11.147762298583984, "global_step": 200859, "epoch": 1195} {"train_loss": -11.463922500610352, "global_step": 200860, "epoch": 1195} {"train_loss": -11.379246711730957, "global_step": 200861, "epoch": 1195} {"train_loss": -11.399862289428711, "global_step": 200862, "epoch": 1195} {"train_loss": -11.587553977966309, "global_step": 200863, "epoch": 1195} {"train_loss": -11.164080619812012, "global_step": 200864, "epoch": 1195} {"train_loss": -11.376164436340332, "global_step": 200865, "epoch": 1195} {"train_loss": -11.141754150390625, "global_step": 200866, "epoch": 1195} {"train_loss": -11.233406066894531, "global_step": 200867, "epoch": 1195} {"train_loss": -11.267248153686523, "global_step": 200868, "epoch": 1195} {"train_loss": -10.983713150024414, "global_step": 200869, "epoch": 1195} {"train_loss": -9.99306869506836, "global_step": 200870, "epoch": 1195} {"train_loss": -10.868377685546875, "global_step": 200871, "epoch": 1195} {"train_loss": -11.081077575683594, "global_step": 200872, "epoch": 1195} {"train_loss": -10.514756202697754, "global_step": 200873, "epoch": 1195} {"train_loss": -10.767980575561523, "global_step": 200874, "epoch": 1195} {"train_loss": -10.633938789367676, "global_step": 200875, "epoch": 1195} {"train_loss": -10.406777381896973, "global_step": 200876, "epoch": 1195} {"train_loss": -10.477449417114258, "global_step": 200877, "epoch": 1195} {"train_loss": -10.906339645385742, "global_step": 200878, "epoch": 1195} {"train_loss": -10.232237815856934, "global_step": 200879, "epoch": 1195} {"train_loss": -10.891831398010254, "global_step": 200880, "epoch": 1195} {"train_loss": -11.374410629272461, "global_step": 200881, "epoch": 1195} {"train_loss": -10.552875518798828, "global_step": 200882, "epoch": 1195} {"train_loss": -11.530111312866211, "global_step": 200883, "epoch": 1195} {"train_loss": -11.198136329650879, "global_step": 200884, "epoch": 1195} {"train_loss": -10.844181060791016, "global_step": 200885, "epoch": 1195} {"train_loss": -11.440033912658691, "global_step": 200886, "epoch": 1195} {"train_loss": -11.06008529663086, "global_step": 200887, "epoch": 1195} {"train_loss": -11.033166885375977, "global_step": 200888, "epoch": 1195} {"train_loss": -10.828475952148438, "global_step": 200889, "epoch": 1195} {"train_loss": -10.831050872802734, "global_step": 200890, "epoch": 1195} {"train_loss": -11.222843170166016, "global_step": 200891, "epoch": 1195} {"train_loss": -11.162212371826172, "global_step": 200892, "epoch": 1195} {"train_loss": -11.202360153198242, "global_step": 200893, "epoch": 1195} {"train_loss": -11.102418899536133, "global_step": 200894, "epoch": 1195} {"train_loss": -11.194355964660645, "global_step": 200895, "epoch": 1195} {"train_loss": -11.140291213989258, "global_step": 200896, "epoch": 1195} {"train_loss": -11.224824905395508, "global_step": 200897, "epoch": 1195} {"train_loss": -11.234066009521484, "global_step": 200898, "epoch": 1195} {"train_loss": -11.490571975708008, "global_step": 200899, "epoch": 1195} {"train_loss": -11.420917510986328, "global_step": 200900, "epoch": 1195} {"train_loss": -11.330809593200684, "global_step": 200901, "epoch": 1195} {"train_loss": -11.184654235839844, "global_step": 200902, "epoch": 1195} {"train_loss": -11.340591430664062, "global_step": 200903, "epoch": 1195} {"train_loss": -11.409004211425781, "global_step": 200904, "epoch": 1195} {"train_loss": -11.478705406188965, "global_step": 200905, "epoch": 1195} {"train_loss": -11.604045867919922, "global_step": 200906, "epoch": 1195} {"train_loss": -11.467639923095703, "global_step": 200907, "epoch": 1195} {"train_loss": -11.522418022155762, "global_step": 200908, "epoch": 1195} {"train_loss": -11.100654602050781, "global_step": 200909, "epoch": 1195} {"train_loss": -11.634456634521484, "global_step": 200910, "epoch": 1195} {"train_loss": -11.192214965820312, "global_step": 200911, "epoch": 1195} {"train_loss": -11.245080947875977, "global_step": 200912, "epoch": 1195} {"train_loss": -11.552909851074219, "global_step": 200913, "epoch": 1195} {"train_loss": -11.428401947021484, "global_step": 200914, "epoch": 1195} {"train_loss": -11.381994247436523, "global_step": 200915, "epoch": 1195} {"train_loss": -11.473955154418945, "global_step": 200916, "epoch": 1195} {"train_loss": -11.305917739868164, "global_step": 200917, "epoch": 1195} {"train_loss": -11.32032585144043, "global_step": 200918, "epoch": 1195} {"train_loss": -11.338064193725586, "global_step": 200919, "epoch": 1195} {"train_loss": -10.662128448486328, "global_step": 200920, "epoch": 1195} {"train_loss": -10.858047485351562, "global_step": 200921, "epoch": 1195} {"train_loss": -10.5618896484375, "global_step": 200922, "epoch": 1195} {"train_loss": -10.744327545166016, "global_step": 200923, "epoch": 1195} {"train_loss": -11.01981258392334, "global_step": 200924, "epoch": 1195} {"train_loss": -11.442551612854004, "global_step": 200925, "epoch": 1195} {"train_loss": -11.056838035583496, "global_step": 200926, "epoch": 1195} {"train_loss": -11.27045388448806, "global_step": 200927, "epoch": 1195, "val_loss": 252123.015625, "train_action_mse_error": 0.18945857882499695} {"train_loss": -11.135759353637695, "global_step": 200928, "epoch": 1196} {"train_loss": -10.999088287353516, "global_step": 200929, "epoch": 1196} {"train_loss": -11.426259994506836, "global_step": 200930, "epoch": 1196} {"train_loss": -10.46640396118164, "global_step": 200931, "epoch": 1196} {"train_loss": -11.394451141357422, "global_step": 200932, "epoch": 1196} {"train_loss": -10.957290649414062, "global_step": 200933, "epoch": 1196} {"train_loss": -11.12617015838623, "global_step": 200934, "epoch": 1196} {"train_loss": -11.449405670166016, "global_step": 200935, "epoch": 1196} {"train_loss": -11.041131019592285, "global_step": 200936, "epoch": 1196} {"train_loss": -11.34896183013916, "global_step": 200937, "epoch": 1196} {"train_loss": -11.381836891174316, "global_step": 200938, "epoch": 1196} {"train_loss": -11.137954711914062, "global_step": 200939, "epoch": 1196} {"train_loss": -11.565561294555664, "global_step": 200940, "epoch": 1196} {"train_loss": -11.30654525756836, "global_step": 200941, "epoch": 1196} {"train_loss": -10.981843948364258, "global_step": 200942, "epoch": 1196} {"train_loss": -11.668391227722168, "global_step": 200943, "epoch": 1196} {"train_loss": -11.200437545776367, "global_step": 200944, "epoch": 1196} {"train_loss": -11.365339279174805, "global_step": 200945, "epoch": 1196} {"train_loss": -11.445535659790039, "global_step": 200946, "epoch": 1196} {"train_loss": -11.253372192382812, "global_step": 200947, "epoch": 1196} {"train_loss": -11.668595314025879, "global_step": 200948, "epoch": 1196} {"train_loss": -11.26578140258789, "global_step": 200949, "epoch": 1196} {"train_loss": -11.544698715209961, "global_step": 200950, "epoch": 1196} {"train_loss": -11.576089859008789, "global_step": 200951, "epoch": 1196} {"train_loss": -11.353548049926758, "global_step": 200952, "epoch": 1196} {"train_loss": -11.514629364013672, "global_step": 200953, "epoch": 1196} {"train_loss": -11.53744125366211, "global_step": 200954, "epoch": 1196} {"train_loss": -11.598142623901367, "global_step": 200955, "epoch": 1196} {"train_loss": -11.570233345031738, "global_step": 200956, "epoch": 1196} {"train_loss": -11.629334449768066, "global_step": 200957, "epoch": 1196} {"train_loss": -11.520971298217773, "global_step": 200958, "epoch": 1196} {"train_loss": -11.429693222045898, "global_step": 200959, "epoch": 1196} {"train_loss": -11.308292388916016, "global_step": 200960, "epoch": 1196} {"train_loss": -11.64663314819336, "global_step": 200961, "epoch": 1196} {"train_loss": -11.14997673034668, "global_step": 200962, "epoch": 1196} {"train_loss": -11.81546401977539, "global_step": 200963, "epoch": 1196} {"train_loss": -11.255881309509277, "global_step": 200964, "epoch": 1196} {"train_loss": -11.692804336547852, "global_step": 200965, "epoch": 1196} {"train_loss": -11.521595001220703, "global_step": 200966, "epoch": 1196} {"train_loss": -11.580559730529785, "global_step": 200967, "epoch": 1196} {"train_loss": -11.596172332763672, "global_step": 200968, "epoch": 1196} {"train_loss": -11.686027526855469, "global_step": 200969, "epoch": 1196} {"train_loss": -11.325556755065918, "global_step": 200970, "epoch": 1196} {"train_loss": -11.835081100463867, "global_step": 200971, "epoch": 1196} {"train_loss": -11.083906173706055, "global_step": 200972, "epoch": 1196} {"train_loss": -10.82895278930664, "global_step": 200973, "epoch": 1196} {"train_loss": -11.763410568237305, "global_step": 200974, "epoch": 1196} {"train_loss": -10.315597534179688, "global_step": 200975, "epoch": 1196} {"train_loss": -10.783106803894043, "global_step": 200976, "epoch": 1196} {"train_loss": -11.30134105682373, "global_step": 200977, "epoch": 1196} {"train_loss": -11.063841819763184, "global_step": 200978, "epoch": 1196} {"train_loss": -11.30759048461914, "global_step": 200979, "epoch": 1196} {"train_loss": -11.280463218688965, "global_step": 200980, "epoch": 1196} {"train_loss": -10.76627254486084, "global_step": 200981, "epoch": 1196} {"train_loss": -11.136372566223145, "global_step": 200982, "epoch": 1196} {"train_loss": -11.529802322387695, "global_step": 200983, "epoch": 1196} {"train_loss": -10.900747299194336, "global_step": 200984, "epoch": 1196} {"train_loss": -11.291603088378906, "global_step": 200985, "epoch": 1196} {"train_loss": -11.229608535766602, "global_step": 200986, "epoch": 1196} {"train_loss": -11.246212005615234, "global_step": 200987, "epoch": 1196} {"train_loss": -11.302457809448242, "global_step": 200988, "epoch": 1196} {"train_loss": -11.427848815917969, "global_step": 200989, "epoch": 1196} {"train_loss": -11.055047988891602, "global_step": 200990, "epoch": 1196} {"train_loss": -11.344710350036621, "global_step": 200991, "epoch": 1196} {"train_loss": -11.211878776550293, "global_step": 200992, "epoch": 1196} {"train_loss": -11.569158554077148, "global_step": 200993, "epoch": 1196} {"train_loss": -11.22126579284668, "global_step": 200994, "epoch": 1196} {"train_loss": -11.422630310058594, "global_step": 200995, "epoch": 1196} {"train_loss": -11.099063873291016, "global_step": 200996, "epoch": 1196} {"train_loss": -11.84880542755127, "global_step": 200997, "epoch": 1196} {"train_loss": -11.417854309082031, "global_step": 200998, "epoch": 1196} {"train_loss": -11.42229175567627, "global_step": 200999, "epoch": 1196} {"train_loss": -11.538248062133789, "global_step": 201000, "epoch": 1196} {"train_loss": -11.479232788085938, "global_step": 201001, "epoch": 1196} {"train_loss": -11.604548454284668, "global_step": 201002, "epoch": 1196} {"train_loss": -11.294577598571777, "global_step": 201003, "epoch": 1196} {"train_loss": -11.217350006103516, "global_step": 201004, "epoch": 1196} {"train_loss": -11.525327682495117, "global_step": 201005, "epoch": 1196} {"train_loss": -11.081897735595703, "global_step": 201006, "epoch": 1196} {"train_loss": -11.04505729675293, "global_step": 201007, "epoch": 1196} {"train_loss": -11.421361923217773, "global_step": 201008, "epoch": 1196} {"train_loss": -11.685127258300781, "global_step": 201009, "epoch": 1196} {"train_loss": -11.609441757202148, "global_step": 201010, "epoch": 1196} {"train_loss": -11.299687385559082, "global_step": 201011, "epoch": 1196} {"train_loss": -11.67405891418457, "global_step": 201012, "epoch": 1196} {"train_loss": -11.14980697631836, "global_step": 201013, "epoch": 1196} {"train_loss": -11.615400314331055, "global_step": 201014, "epoch": 1196} {"train_loss": -11.208032608032227, "global_step": 201015, "epoch": 1196} {"train_loss": -11.26785659790039, "global_step": 201016, "epoch": 1196} {"train_loss": -11.214171409606934, "global_step": 201017, "epoch": 1196} {"train_loss": -11.125921249389648, "global_step": 201018, "epoch": 1196} {"train_loss": -11.431800842285156, "global_step": 201019, "epoch": 1196} {"train_loss": -10.994632720947266, "global_step": 201020, "epoch": 1196} {"train_loss": -10.797473907470703, "global_step": 201021, "epoch": 1196} {"train_loss": -10.669629096984863, "global_step": 201022, "epoch": 1196} {"train_loss": -10.888158798217773, "global_step": 201023, "epoch": 1196} {"train_loss": -10.544609069824219, "global_step": 201024, "epoch": 1196} {"train_loss": -10.74224853515625, "global_step": 201025, "epoch": 1196} {"train_loss": -10.566435813903809, "global_step": 201026, "epoch": 1196} {"train_loss": -10.701623916625977, "global_step": 201027, "epoch": 1196} {"train_loss": -10.349519729614258, "global_step": 201028, "epoch": 1196} {"train_loss": -10.67873764038086, "global_step": 201029, "epoch": 1196} {"train_loss": -10.608846664428711, "global_step": 201030, "epoch": 1196} {"train_loss": -10.97231388092041, "global_step": 201031, "epoch": 1196} {"train_loss": -10.996576309204102, "global_step": 201032, "epoch": 1196} {"train_loss": -9.750561714172363, "global_step": 201033, "epoch": 1196} {"train_loss": -11.44289779663086, "global_step": 201034, "epoch": 1196} {"train_loss": -10.944177627563477, "global_step": 201035, "epoch": 1196} {"train_loss": -10.639056205749512, "global_step": 201036, "epoch": 1196} {"train_loss": -11.345592498779297, "global_step": 201037, "epoch": 1196} {"train_loss": -10.148571014404297, "global_step": 201038, "epoch": 1196} {"train_loss": -11.111692428588867, "global_step": 201039, "epoch": 1196} {"train_loss": -11.1060152053833, "global_step": 201040, "epoch": 1196} {"train_loss": -10.606194496154785, "global_step": 201041, "epoch": 1196} {"train_loss": -11.352989196777344, "global_step": 201042, "epoch": 1196} {"train_loss": -10.938926696777344, "global_step": 201043, "epoch": 1196} {"train_loss": -10.886012077331543, "global_step": 201044, "epoch": 1196} {"train_loss": -11.316752433776855, "global_step": 201045, "epoch": 1196} {"train_loss": -10.790695190429688, "global_step": 201046, "epoch": 1196} {"train_loss": -10.956405639648438, "global_step": 201047, "epoch": 1196} {"train_loss": -11.11081600189209, "global_step": 201048, "epoch": 1196} {"train_loss": -10.984674453735352, "global_step": 201049, "epoch": 1196} {"train_loss": -11.15352725982666, "global_step": 201050, "epoch": 1196} {"train_loss": -11.359270095825195, "global_step": 201051, "epoch": 1196} {"train_loss": -11.198287963867188, "global_step": 201052, "epoch": 1196} {"train_loss": -11.3190336227417, "global_step": 201053, "epoch": 1196} {"train_loss": -11.323246002197266, "global_step": 201054, "epoch": 1196} {"train_loss": -11.389570236206055, "global_step": 201055, "epoch": 1196} {"train_loss": -11.477344512939453, "global_step": 201056, "epoch": 1196} {"train_loss": -11.487582206726074, "global_step": 201057, "epoch": 1196} {"train_loss": -11.378705024719238, "global_step": 201058, "epoch": 1196} {"train_loss": -11.285737991333008, "global_step": 201059, "epoch": 1196} {"train_loss": -11.553277015686035, "global_step": 201060, "epoch": 1196} {"train_loss": -11.301895141601562, "global_step": 201061, "epoch": 1196} {"train_loss": -11.334817886352539, "global_step": 201062, "epoch": 1196} {"train_loss": -11.486448287963867, "global_step": 201063, "epoch": 1196} {"train_loss": -10.631057739257812, "global_step": 201064, "epoch": 1196} {"train_loss": -11.167882919311523, "global_step": 201065, "epoch": 1196} {"train_loss": -11.427099227905273, "global_step": 201066, "epoch": 1196} {"train_loss": -11.044088363647461, "global_step": 201067, "epoch": 1196} {"train_loss": -11.607809066772461, "global_step": 201068, "epoch": 1196} {"train_loss": -11.191394805908203, "global_step": 201069, "epoch": 1196} {"train_loss": -10.942041397094727, "global_step": 201070, "epoch": 1196} {"train_loss": -11.327777862548828, "global_step": 201071, "epoch": 1196} {"train_loss": -11.27028751373291, "global_step": 201072, "epoch": 1196} {"train_loss": -11.385358810424805, "global_step": 201073, "epoch": 1196} {"train_loss": -11.595738410949707, "global_step": 201074, "epoch": 1196} {"train_loss": -11.592948913574219, "global_step": 201075, "epoch": 1196} {"train_loss": -11.37951374053955, "global_step": 201076, "epoch": 1196} {"train_loss": -11.760503768920898, "global_step": 201077, "epoch": 1196} {"train_loss": -11.512940406799316, "global_step": 201078, "epoch": 1196} {"train_loss": -11.6217622756958, "global_step": 201079, "epoch": 1196} {"train_loss": -11.696660995483398, "global_step": 201080, "epoch": 1196} {"train_loss": -11.348468780517578, "global_step": 201081, "epoch": 1196} {"train_loss": -11.836353302001953, "global_step": 201082, "epoch": 1196} {"train_loss": -11.557948112487793, "global_step": 201083, "epoch": 1196} {"train_loss": -11.561326026916504, "global_step": 201084, "epoch": 1196} {"train_loss": -11.597064018249512, "global_step": 201085, "epoch": 1196} {"train_loss": -11.61792278289795, "global_step": 201086, "epoch": 1196} {"train_loss": -11.265483856201172, "global_step": 201087, "epoch": 1196} {"train_loss": -11.454935073852539, "global_step": 201088, "epoch": 1196} {"train_loss": -10.906800270080566, "global_step": 201089, "epoch": 1196} {"train_loss": -9.3108491897583, "global_step": 201090, "epoch": 1196} {"train_loss": -11.679458618164062, "global_step": 201091, "epoch": 1196} {"train_loss": -9.334321975708008, "global_step": 201092, "epoch": 1196} {"train_loss": -10.222469329833984, "global_step": 201093, "epoch": 1196} {"train_loss": -11.18789005279541, "global_step": 201094, "epoch": 1196} {"train_loss": -11.221296639669509, "global_step": 201095, "epoch": 1196, "val_loss": 253056.546875} {"train_loss": -11.05740737915039, "global_step": 201096, "epoch": 1197} {"train_loss": -10.042121887207031, "global_step": 201097, "epoch": 1197} {"train_loss": -10.762496948242188, "global_step": 201098, "epoch": 1197} {"train_loss": -11.103044509887695, "global_step": 201099, "epoch": 1197} {"train_loss": -10.07693862915039, "global_step": 201100, "epoch": 1197} {"train_loss": -11.134712219238281, "global_step": 201101, "epoch": 1197} {"train_loss": -10.735509872436523, "global_step": 201102, "epoch": 1197} {"train_loss": -10.70941162109375, "global_step": 201103, "epoch": 1197} {"train_loss": -10.289467811584473, "global_step": 201104, "epoch": 1197} {"train_loss": -10.838249206542969, "global_step": 201105, "epoch": 1197} {"train_loss": -10.720012664794922, "global_step": 201106, "epoch": 1197} {"train_loss": -11.357297897338867, "global_step": 201107, "epoch": 1197} {"train_loss": -11.379880905151367, "global_step": 201108, "epoch": 1197} {"train_loss": -11.262566566467285, "global_step": 201109, "epoch": 1197} {"train_loss": -11.359784126281738, "global_step": 201110, "epoch": 1197} {"train_loss": -10.653535842895508, "global_step": 201111, "epoch": 1197} {"train_loss": -11.566751480102539, "global_step": 201112, "epoch": 1197} {"train_loss": -10.726394653320312, "global_step": 201113, "epoch": 1197} {"train_loss": -11.38058090209961, "global_step": 201114, "epoch": 1197} {"train_loss": -10.760408401489258, "global_step": 201115, "epoch": 1197} {"train_loss": -11.186574935913086, "global_step": 201116, "epoch": 1197} {"train_loss": -10.712172508239746, "global_step": 201117, "epoch": 1197} {"train_loss": -11.073996543884277, "global_step": 201118, "epoch": 1197} {"train_loss": -10.78419303894043, "global_step": 201119, "epoch": 1197} {"train_loss": -11.410172462463379, "global_step": 201120, "epoch": 1197} {"train_loss": -10.724164962768555, "global_step": 201121, "epoch": 1197} {"train_loss": -11.579792022705078, "global_step": 201122, "epoch": 1197} {"train_loss": -11.122878074645996, "global_step": 201123, "epoch": 1197} {"train_loss": -11.4856538772583, "global_step": 201124, "epoch": 1197} {"train_loss": -11.006575584411621, "global_step": 201125, "epoch": 1197} {"train_loss": -11.381793975830078, "global_step": 201126, "epoch": 1197} {"train_loss": -10.982769966125488, "global_step": 201127, "epoch": 1197} {"train_loss": -11.477453231811523, "global_step": 201128, "epoch": 1197} {"train_loss": -10.862403869628906, "global_step": 201129, "epoch": 1197} {"train_loss": -11.397826194763184, "global_step": 201130, "epoch": 1197} {"train_loss": -10.944757461547852, "global_step": 201131, "epoch": 1197} {"train_loss": -11.532114028930664, "global_step": 201132, "epoch": 1197} {"train_loss": -11.2288179397583, "global_step": 201133, "epoch": 1197} {"train_loss": -11.340792655944824, "global_step": 201134, "epoch": 1197} {"train_loss": -11.159830093383789, "global_step": 201135, "epoch": 1197} {"train_loss": -11.454708099365234, "global_step": 201136, "epoch": 1197} {"train_loss": -10.987102508544922, "global_step": 201137, "epoch": 1197} {"train_loss": -11.355399131774902, "global_step": 201138, "epoch": 1197} {"train_loss": -11.353902816772461, "global_step": 201139, "epoch": 1197} {"train_loss": -11.573031425476074, "global_step": 201140, "epoch": 1197} {"train_loss": -11.74262523651123, "global_step": 201141, "epoch": 1197} {"train_loss": -11.391511917114258, "global_step": 201142, "epoch": 1197} {"train_loss": -11.471649169921875, "global_step": 201143, "epoch": 1197} {"train_loss": -11.483406066894531, "global_step": 201144, "epoch": 1197} {"train_loss": -11.374305725097656, "global_step": 201145, "epoch": 1197} {"train_loss": -11.441969871520996, "global_step": 201146, "epoch": 1197} {"train_loss": -11.25755786895752, "global_step": 201147, "epoch": 1197} {"train_loss": -11.25472640991211, "global_step": 201148, "epoch": 1197} {"train_loss": -11.458456039428711, "global_step": 201149, "epoch": 1197} {"train_loss": -11.210027694702148, "global_step": 201150, "epoch": 1197} {"train_loss": -11.167818069458008, "global_step": 201151, "epoch": 1197} {"train_loss": -11.203280448913574, "global_step": 201152, "epoch": 1197} {"train_loss": -10.92418098449707, "global_step": 201153, "epoch": 1197} {"train_loss": -11.406049728393555, "global_step": 201154, "epoch": 1197} {"train_loss": -11.01749038696289, "global_step": 201155, "epoch": 1197} {"train_loss": -11.565164566040039, "global_step": 201156, "epoch": 1197} {"train_loss": -10.72463607788086, "global_step": 201157, "epoch": 1197} {"train_loss": -11.644277572631836, "global_step": 201158, "epoch": 1197} {"train_loss": -10.978599548339844, "global_step": 201159, "epoch": 1197} {"train_loss": -11.641106605529785, "global_step": 201160, "epoch": 1197} {"train_loss": -11.175064086914062, "global_step": 201161, "epoch": 1197} {"train_loss": -11.155714988708496, "global_step": 201162, "epoch": 1197} {"train_loss": -11.17387866973877, "global_step": 201163, "epoch": 1197} {"train_loss": -11.305437088012695, "global_step": 201164, "epoch": 1197} {"train_loss": -11.531888008117676, "global_step": 201165, "epoch": 1197} {"train_loss": -11.113716125488281, "global_step": 201166, "epoch": 1197} {"train_loss": -11.847424507141113, "global_step": 201167, "epoch": 1197} {"train_loss": -11.57529067993164, "global_step": 201168, "epoch": 1197} {"train_loss": -11.654708862304688, "global_step": 201169, "epoch": 1197} {"train_loss": -11.656363487243652, "global_step": 201170, "epoch": 1197} {"train_loss": -11.686790466308594, "global_step": 201171, "epoch": 1197} {"train_loss": -11.614591598510742, "global_step": 201172, "epoch": 1197} {"train_loss": -11.52769660949707, "global_step": 201173, "epoch": 1197} {"train_loss": -11.826047897338867, "global_step": 201174, "epoch": 1197} {"train_loss": -11.68716812133789, "global_step": 201175, "epoch": 1197} {"train_loss": -11.8701753616333, "global_step": 201176, "epoch": 1197} {"train_loss": -11.688356399536133, "global_step": 201177, "epoch": 1197} {"train_loss": -11.783732414245605, "global_step": 201178, "epoch": 1197} {"train_loss": -11.733325958251953, "global_step": 201179, "epoch": 1197} {"train_loss": -11.77737045288086, "global_step": 201180, "epoch": 1197} {"train_loss": -11.299224853515625, "global_step": 201181, "epoch": 1197} {"train_loss": -11.185576438903809, "global_step": 201182, "epoch": 1197} {"train_loss": -11.508095741271973, "global_step": 201183, "epoch": 1197} {"train_loss": -11.376473426818848, "global_step": 201184, "epoch": 1197} {"train_loss": -10.823881149291992, "global_step": 201185, "epoch": 1197} {"train_loss": -10.863436698913574, "global_step": 201186, "epoch": 1197} {"train_loss": -11.397604942321777, "global_step": 201187, "epoch": 1197} {"train_loss": -9.942704200744629, "global_step": 201188, "epoch": 1197} {"train_loss": -10.185718536376953, "global_step": 201189, "epoch": 1197} {"train_loss": -11.522674560546875, "global_step": 201190, "epoch": 1197} {"train_loss": -9.99022102355957, "global_step": 201191, "epoch": 1197} {"train_loss": -11.16810417175293, "global_step": 201192, "epoch": 1197} {"train_loss": -10.799032211303711, "global_step": 201193, "epoch": 1197} {"train_loss": -9.568513870239258, "global_step": 201194, "epoch": 1197} {"train_loss": -11.048208236694336, "global_step": 201195, "epoch": 1197} {"train_loss": -10.632715225219727, "global_step": 201196, "epoch": 1197} {"train_loss": -10.317293167114258, "global_step": 201197, "epoch": 1197} {"train_loss": -10.838801383972168, "global_step": 201198, "epoch": 1197} {"train_loss": -10.248556137084961, "global_step": 201199, "epoch": 1197} {"train_loss": -9.775903701782227, "global_step": 201200, "epoch": 1197} {"train_loss": -10.737306594848633, "global_step": 201201, "epoch": 1197} {"train_loss": -10.27340316772461, "global_step": 201202, "epoch": 1197} {"train_loss": -9.686110496520996, "global_step": 201203, "epoch": 1197} {"train_loss": -10.109334945678711, "global_step": 201204, "epoch": 1197} {"train_loss": -8.931615829467773, "global_step": 201205, "epoch": 1197} {"train_loss": -9.049206733703613, "global_step": 201206, "epoch": 1197} {"train_loss": -10.371471405029297, "global_step": 201207, "epoch": 1197} {"train_loss": -8.774543762207031, "global_step": 201208, "epoch": 1197} {"train_loss": -8.624998092651367, "global_step": 201209, "epoch": 1197} {"train_loss": -9.52933406829834, "global_step": 201210, "epoch": 1197} {"train_loss": -10.508649826049805, "global_step": 201211, "epoch": 1197} {"train_loss": -9.119407653808594, "global_step": 201212, "epoch": 1197} {"train_loss": -9.98728084564209, "global_step": 201213, "epoch": 1197} {"train_loss": -10.368593215942383, "global_step": 201214, "epoch": 1197} {"train_loss": -9.48768138885498, "global_step": 201215, "epoch": 1197} {"train_loss": -10.013650894165039, "global_step": 201216, "epoch": 1197} {"train_loss": -10.908224105834961, "global_step": 201217, "epoch": 1197} {"train_loss": -10.278684616088867, "global_step": 201218, "epoch": 1197} {"train_loss": -10.150662422180176, "global_step": 201219, "epoch": 1197} {"train_loss": -10.849422454833984, "global_step": 201220, "epoch": 1197} {"train_loss": -10.325618743896484, "global_step": 201221, "epoch": 1197} {"train_loss": -10.762579917907715, "global_step": 201222, "epoch": 1197} {"train_loss": -10.875114440917969, "global_step": 201223, "epoch": 1197} {"train_loss": -10.502824783325195, "global_step": 201224, "epoch": 1197} {"train_loss": -10.835498809814453, "global_step": 201225, "epoch": 1197} {"train_loss": -10.913721084594727, "global_step": 201226, "epoch": 1197} {"train_loss": -10.932890892028809, "global_step": 201227, "epoch": 1197} {"train_loss": -11.052997589111328, "global_step": 201228, "epoch": 1197} {"train_loss": -10.815814971923828, "global_step": 201229, "epoch": 1197} {"train_loss": -11.17618179321289, "global_step": 201230, "epoch": 1197} {"train_loss": -10.996017456054688, "global_step": 201231, "epoch": 1197} {"train_loss": -10.83906364440918, "global_step": 201232, "epoch": 1197} {"train_loss": -10.993875503540039, "global_step": 201233, "epoch": 1197} {"train_loss": -11.069181442260742, "global_step": 201234, "epoch": 1197} {"train_loss": -11.230566024780273, "global_step": 201235, "epoch": 1197} {"train_loss": -11.298162460327148, "global_step": 201236, "epoch": 1197} {"train_loss": -10.977712631225586, "global_step": 201237, "epoch": 1197} {"train_loss": -11.296316146850586, "global_step": 201238, "epoch": 1197} {"train_loss": -11.240303039550781, "global_step": 201239, "epoch": 1197} {"train_loss": -11.06510066986084, "global_step": 201240, "epoch": 1197} {"train_loss": -11.255237579345703, "global_step": 201241, "epoch": 1197} {"train_loss": -11.143895149230957, "global_step": 201242, "epoch": 1197} {"train_loss": -11.1951265335083, "global_step": 201243, "epoch": 1197} {"train_loss": -11.245318412780762, "global_step": 201244, "epoch": 1197} {"train_loss": -11.361309051513672, "global_step": 201245, "epoch": 1197} {"train_loss": -11.338071823120117, "global_step": 201246, "epoch": 1197} {"train_loss": -11.048683166503906, "global_step": 201247, "epoch": 1197} {"train_loss": -11.348962783813477, "global_step": 201248, "epoch": 1197} {"train_loss": -11.458364486694336, "global_step": 201249, "epoch": 1197} {"train_loss": -11.305647850036621, "global_step": 201250, "epoch": 1197} {"train_loss": -11.309423446655273, "global_step": 201251, "epoch": 1197} {"train_loss": -11.356559753417969, "global_step": 201252, "epoch": 1197} {"train_loss": -11.271764755249023, "global_step": 201253, "epoch": 1197} {"train_loss": -11.37398910522461, "global_step": 201254, "epoch": 1197} {"train_loss": -11.298730850219727, "global_step": 201255, "epoch": 1197} {"train_loss": -11.304401397705078, "global_step": 201256, "epoch": 1197} {"train_loss": -11.397218704223633, "global_step": 201257, "epoch": 1197} {"train_loss": -11.413049697875977, "global_step": 201258, "epoch": 1197} {"train_loss": -11.270942687988281, "global_step": 201259, "epoch": 1197} {"train_loss": -11.408803939819336, "global_step": 201260, "epoch": 1197} {"train_loss": -11.44744873046875, "global_step": 201261, "epoch": 1197} {"train_loss": -11.329806327819824, "global_step": 201262, "epoch": 1197} {"train_loss": -10.997896665618534, "global_step": 201263, "epoch": 1197, "val_loss": 249151.1875} {"train_loss": -11.422280311584473, "global_step": 201264, "epoch": 1198} {"train_loss": -11.51927375793457, "global_step": 201265, "epoch": 1198} {"train_loss": -11.231196403503418, "global_step": 201266, "epoch": 1198} {"train_loss": -11.22734260559082, "global_step": 201267, "epoch": 1198} {"train_loss": -11.251640319824219, "global_step": 201268, "epoch": 1198} {"train_loss": -11.53112506866455, "global_step": 201269, "epoch": 1198} {"train_loss": -10.990419387817383, "global_step": 201270, "epoch": 1198} {"train_loss": -11.39356803894043, "global_step": 201271, "epoch": 1198} {"train_loss": -11.39445686340332, "global_step": 201272, "epoch": 1198} {"train_loss": -11.388384819030762, "global_step": 201273, "epoch": 1198} {"train_loss": -11.627618789672852, "global_step": 201274, "epoch": 1198} {"train_loss": -11.156512260437012, "global_step": 201275, "epoch": 1198} {"train_loss": -11.34982681274414, "global_step": 201276, "epoch": 1198} {"train_loss": -11.349987030029297, "global_step": 201277, "epoch": 1198} {"train_loss": -11.224424362182617, "global_step": 201278, "epoch": 1198} {"train_loss": -11.592147827148438, "global_step": 201279, "epoch": 1198} {"train_loss": -11.403097152709961, "global_step": 201280, "epoch": 1198} {"train_loss": -11.633255004882812, "global_step": 201281, "epoch": 1198} {"train_loss": -11.64938735961914, "global_step": 201282, "epoch": 1198} {"train_loss": -11.689359664916992, "global_step": 201283, "epoch": 1198} {"train_loss": -11.552268028259277, "global_step": 201284, "epoch": 1198} {"train_loss": -11.38141918182373, "global_step": 201285, "epoch": 1198} {"train_loss": -11.729793548583984, "global_step": 201286, "epoch": 1198} {"train_loss": -11.531274795532227, "global_step": 201287, "epoch": 1198} {"train_loss": -11.60472297668457, "global_step": 201288, "epoch": 1198} {"train_loss": -11.745512962341309, "global_step": 201289, "epoch": 1198} {"train_loss": -11.748129844665527, "global_step": 201290, "epoch": 1198} {"train_loss": -11.53017807006836, "global_step": 201291, "epoch": 1198} {"train_loss": -11.57638931274414, "global_step": 201292, "epoch": 1198} {"train_loss": -11.692209243774414, "global_step": 201293, "epoch": 1198} {"train_loss": -11.78651237487793, "global_step": 201294, "epoch": 1198} {"train_loss": -11.492027282714844, "global_step": 201295, "epoch": 1198} {"train_loss": -11.359395027160645, "global_step": 201296, "epoch": 1198} {"train_loss": -11.544075012207031, "global_step": 201297, "epoch": 1198} {"train_loss": -11.712567329406738, "global_step": 201298, "epoch": 1198} {"train_loss": -11.653773307800293, "global_step": 201299, "epoch": 1198} {"train_loss": -11.659931182861328, "global_step": 201300, "epoch": 1198} {"train_loss": -11.77168083190918, "global_step": 201301, "epoch": 1198} {"train_loss": -11.553951263427734, "global_step": 201302, "epoch": 1198} {"train_loss": -11.793193817138672, "global_step": 201303, "epoch": 1198} {"train_loss": -11.836114883422852, "global_step": 201304, "epoch": 1198} {"train_loss": -11.752037048339844, "global_step": 201305, "epoch": 1198} {"train_loss": -11.7647123336792, "global_step": 201306, "epoch": 1198} {"train_loss": -11.452690124511719, "global_step": 201307, "epoch": 1198} {"train_loss": -11.758371353149414, "global_step": 201308, "epoch": 1198} {"train_loss": -11.56736946105957, "global_step": 201309, "epoch": 1198} {"train_loss": -11.495012283325195, "global_step": 201310, "epoch": 1198} {"train_loss": -11.644686698913574, "global_step": 201311, "epoch": 1198} {"train_loss": -11.474953651428223, "global_step": 201312, "epoch": 1198} {"train_loss": -11.004013061523438, "global_step": 201313, "epoch": 1198} {"train_loss": -11.371088027954102, "global_step": 201314, "epoch": 1198} {"train_loss": -10.226713180541992, "global_step": 201315, "epoch": 1198} {"train_loss": -11.112313270568848, "global_step": 201316, "epoch": 1198} {"train_loss": -11.461431503295898, "global_step": 201317, "epoch": 1198} {"train_loss": -10.452709197998047, "global_step": 201318, "epoch": 1198} {"train_loss": -10.484039306640625, "global_step": 201319, "epoch": 1198} {"train_loss": -10.493276596069336, "global_step": 201320, "epoch": 1198} {"train_loss": -10.24696159362793, "global_step": 201321, "epoch": 1198} {"train_loss": -10.92135238647461, "global_step": 201322, "epoch": 1198} {"train_loss": -9.8123779296875, "global_step": 201323, "epoch": 1198} {"train_loss": -10.715314865112305, "global_step": 201324, "epoch": 1198} {"train_loss": -10.04982852935791, "global_step": 201325, "epoch": 1198} {"train_loss": -9.711954116821289, "global_step": 201326, "epoch": 1198} {"train_loss": -11.083619117736816, "global_step": 201327, "epoch": 1198} {"train_loss": -8.723971366882324, "global_step": 201328, "epoch": 1198} {"train_loss": -10.588262557983398, "global_step": 201329, "epoch": 1198} {"train_loss": -10.328388214111328, "global_step": 201330, "epoch": 1198} {"train_loss": -9.907171249389648, "global_step": 201331, "epoch": 1198} {"train_loss": -10.696331024169922, "global_step": 201332, "epoch": 1198} {"train_loss": -9.39647388458252, "global_step": 201333, "epoch": 1198} {"train_loss": -10.445686340332031, "global_step": 201334, "epoch": 1198} {"train_loss": -10.23123836517334, "global_step": 201335, "epoch": 1198} {"train_loss": -10.142217636108398, "global_step": 201336, "epoch": 1198} {"train_loss": -10.553566932678223, "global_step": 201337, "epoch": 1198} {"train_loss": -10.348262786865234, "global_step": 201338, "epoch": 1198} {"train_loss": -10.373485565185547, "global_step": 201339, "epoch": 1198} {"train_loss": -10.800963401794434, "global_step": 201340, "epoch": 1198} {"train_loss": -10.600126266479492, "global_step": 201341, "epoch": 1198} {"train_loss": -10.504207611083984, "global_step": 201342, "epoch": 1198} {"train_loss": -10.826595306396484, "global_step": 201343, "epoch": 1198} {"train_loss": -9.985133171081543, "global_step": 201344, "epoch": 1198} {"train_loss": -10.775379180908203, "global_step": 201345, "epoch": 1198} {"train_loss": -10.286436080932617, "global_step": 201346, "epoch": 1198} {"train_loss": -10.880558967590332, "global_step": 201347, "epoch": 1198} {"train_loss": -10.452704429626465, "global_step": 201348, "epoch": 1198} {"train_loss": -10.591887474060059, "global_step": 201349, "epoch": 1198} {"train_loss": -10.689879417419434, "global_step": 201350, "epoch": 1198} {"train_loss": -10.773187637329102, "global_step": 201351, "epoch": 1198} {"train_loss": -10.980008125305176, "global_step": 201352, "epoch": 1198} {"train_loss": -10.666400909423828, "global_step": 201353, "epoch": 1198} {"train_loss": -10.986841201782227, "global_step": 201354, "epoch": 1198} {"train_loss": -10.678182601928711, "global_step": 201355, "epoch": 1198} {"train_loss": -10.981857299804688, "global_step": 201356, "epoch": 1198} {"train_loss": -11.067193984985352, "global_step": 201357, "epoch": 1198} {"train_loss": -11.064862251281738, "global_step": 201358, "epoch": 1198} {"train_loss": -11.0378999710083, "global_step": 201359, "epoch": 1198} {"train_loss": -10.840241432189941, "global_step": 201360, "epoch": 1198} {"train_loss": -10.871337890625, "global_step": 201361, "epoch": 1198} {"train_loss": -10.801453590393066, "global_step": 201362, "epoch": 1198} {"train_loss": -10.972190856933594, "global_step": 201363, "epoch": 1198} {"train_loss": -11.173271179199219, "global_step": 201364, "epoch": 1198} {"train_loss": -10.80858039855957, "global_step": 201365, "epoch": 1198} {"train_loss": -11.057003021240234, "global_step": 201366, "epoch": 1198} {"train_loss": -11.237961769104004, "global_step": 201367, "epoch": 1198} {"train_loss": -10.80917739868164, "global_step": 201368, "epoch": 1198} {"train_loss": -11.46545696258545, "global_step": 201369, "epoch": 1198} {"train_loss": -10.994112014770508, "global_step": 201370, "epoch": 1198} {"train_loss": -11.116470336914062, "global_step": 201371, "epoch": 1198} {"train_loss": -11.293861389160156, "global_step": 201372, "epoch": 1198} {"train_loss": -11.170409202575684, "global_step": 201373, "epoch": 1198} {"train_loss": -11.370293617248535, "global_step": 201374, "epoch": 1198} {"train_loss": -11.356553077697754, "global_step": 201375, "epoch": 1198} {"train_loss": -11.439621925354004, "global_step": 201376, "epoch": 1198} {"train_loss": -11.503486633300781, "global_step": 201377, "epoch": 1198} {"train_loss": -11.401012420654297, "global_step": 201378, "epoch": 1198} {"train_loss": -11.546422958374023, "global_step": 201379, "epoch": 1198} {"train_loss": -11.375754356384277, "global_step": 201380, "epoch": 1198} {"train_loss": -11.41474723815918, "global_step": 201381, "epoch": 1198} {"train_loss": -11.371236801147461, "global_step": 201382, "epoch": 1198} {"train_loss": -11.492574691772461, "global_step": 201383, "epoch": 1198} {"train_loss": -11.51772689819336, "global_step": 201384, "epoch": 1198} {"train_loss": -11.581951141357422, "global_step": 201385, "epoch": 1198} {"train_loss": -11.444316864013672, "global_step": 201386, "epoch": 1198} {"train_loss": -11.56428337097168, "global_step": 201387, "epoch": 1198} {"train_loss": -11.536863327026367, "global_step": 201388, "epoch": 1198} {"train_loss": -11.557514190673828, "global_step": 201389, "epoch": 1198} {"train_loss": -11.456908226013184, "global_step": 201390, "epoch": 1198} {"train_loss": -11.478653907775879, "global_step": 201391, "epoch": 1198} {"train_loss": -11.54081916809082, "global_step": 201392, "epoch": 1198} {"train_loss": -11.452911376953125, "global_step": 201393, "epoch": 1198} {"train_loss": -11.673574447631836, "global_step": 201394, "epoch": 1198} {"train_loss": -11.423494338989258, "global_step": 201395, "epoch": 1198} {"train_loss": -11.447680473327637, "global_step": 201396, "epoch": 1198} {"train_loss": -11.55188274383545, "global_step": 201397, "epoch": 1198} {"train_loss": -11.51096248626709, "global_step": 201398, "epoch": 1198} {"train_loss": -11.555098533630371, "global_step": 201399, "epoch": 1198} {"train_loss": -11.368982315063477, "global_step": 201400, "epoch": 1198} {"train_loss": -11.538248062133789, "global_step": 201401, "epoch": 1198} {"train_loss": -11.397284507751465, "global_step": 201402, "epoch": 1198} {"train_loss": -11.313283920288086, "global_step": 201403, "epoch": 1198} {"train_loss": -11.399574279785156, "global_step": 201404, "epoch": 1198} {"train_loss": -11.443947792053223, "global_step": 201405, "epoch": 1198} {"train_loss": -11.471001625061035, "global_step": 201406, "epoch": 1198} {"train_loss": -11.327912330627441, "global_step": 201407, "epoch": 1198} {"train_loss": -11.486105918884277, "global_step": 201408, "epoch": 1198} {"train_loss": -11.563902854919434, "global_step": 201409, "epoch": 1198} {"train_loss": -11.513716697692871, "global_step": 201410, "epoch": 1198} {"train_loss": -11.599161148071289, "global_step": 201411, "epoch": 1198} {"train_loss": -11.468711853027344, "global_step": 201412, "epoch": 1198} {"train_loss": -11.430278778076172, "global_step": 201413, "epoch": 1198} {"train_loss": -11.767374038696289, "global_step": 201414, "epoch": 1198} {"train_loss": -11.670991897583008, "global_step": 201415, "epoch": 1198} {"train_loss": -11.715624809265137, "global_step": 201416, "epoch": 1198} {"train_loss": -11.790176391601562, "global_step": 201417, "epoch": 1198} {"train_loss": -11.83358383178711, "global_step": 201418, "epoch": 1198} {"train_loss": -11.6436767578125, "global_step": 201419, "epoch": 1198} {"train_loss": -11.896223068237305, "global_step": 201420, "epoch": 1198} {"train_loss": -11.473503112792969, "global_step": 201421, "epoch": 1198} {"train_loss": -11.562271118164062, "global_step": 201422, "epoch": 1198} {"train_loss": -11.841798782348633, "global_step": 201423, "epoch": 1198} {"train_loss": -11.489906311035156, "global_step": 201424, "epoch": 1198} {"train_loss": -11.684894561767578, "global_step": 201425, "epoch": 1198} {"train_loss": -11.635100364685059, "global_step": 201426, "epoch": 1198} {"train_loss": -11.645509719848633, "global_step": 201427, "epoch": 1198} {"train_loss": -11.570552825927734, "global_step": 201428, "epoch": 1198} {"train_loss": -11.637663841247559, "global_step": 201429, "epoch": 1198} {"train_loss": -11.654397964477539, "global_step": 201430, "epoch": 1198} {"train_loss": -11.217245045162382, "global_step": 201431, "epoch": 1198, "val_loss": 253727.171875} {"train_loss": -11.504688262939453, "global_step": 201432, "epoch": 1199} {"train_loss": -11.525412559509277, "global_step": 201433, "epoch": 1199} {"train_loss": -11.639878273010254, "global_step": 201434, "epoch": 1199} {"train_loss": -11.683634757995605, "global_step": 201435, "epoch": 1199} {"train_loss": -11.678182601928711, "global_step": 201436, "epoch": 1199} {"train_loss": -11.870843887329102, "global_step": 201437, "epoch": 1199} {"train_loss": -11.807682037353516, "global_step": 201438, "epoch": 1199} {"train_loss": -11.983081817626953, "global_step": 201439, "epoch": 1199} {"train_loss": -11.814897537231445, "global_step": 201440, "epoch": 1199} {"train_loss": -11.949075698852539, "global_step": 201441, "epoch": 1199} {"train_loss": -11.657096862792969, "global_step": 201442, "epoch": 1199} {"train_loss": -11.531578063964844, "global_step": 201443, "epoch": 1199} {"train_loss": -11.776365280151367, "global_step": 201444, "epoch": 1199} {"train_loss": -11.483207702636719, "global_step": 201445, "epoch": 1199} {"train_loss": -11.627553939819336, "global_step": 201446, "epoch": 1199} {"train_loss": -11.930717468261719, "global_step": 201447, "epoch": 1199} {"train_loss": -11.641410827636719, "global_step": 201448, "epoch": 1199} {"train_loss": -11.625982284545898, "global_step": 201449, "epoch": 1199} {"train_loss": -11.356658935546875, "global_step": 201450, "epoch": 1199} {"train_loss": -11.403125762939453, "global_step": 201451, "epoch": 1199} {"train_loss": -10.848756790161133, "global_step": 201452, "epoch": 1199} {"train_loss": -11.332422256469727, "global_step": 201453, "epoch": 1199} {"train_loss": -10.988116264343262, "global_step": 201454, "epoch": 1199} {"train_loss": -11.89659309387207, "global_step": 201455, "epoch": 1199} {"train_loss": -11.294323921203613, "global_step": 201456, "epoch": 1199} {"train_loss": -11.558464050292969, "global_step": 201457, "epoch": 1199} {"train_loss": -11.389034271240234, "global_step": 201458, "epoch": 1199} {"train_loss": -11.44088363647461, "global_step": 201459, "epoch": 1199} {"train_loss": -11.290907859802246, "global_step": 201460, "epoch": 1199} {"train_loss": -11.414449691772461, "global_step": 201461, "epoch": 1199} {"train_loss": -10.984018325805664, "global_step": 201462, "epoch": 1199} {"train_loss": -11.808427810668945, "global_step": 201463, "epoch": 1199} {"train_loss": -10.311735153198242, "global_step": 201464, "epoch": 1199} {"train_loss": -10.55836296081543, "global_step": 201465, "epoch": 1199} {"train_loss": -10.797231674194336, "global_step": 201466, "epoch": 1199} {"train_loss": -9.502018928527832, "global_step": 201467, "epoch": 1199} {"train_loss": -10.729422569274902, "global_step": 201468, "epoch": 1199} {"train_loss": -10.761836051940918, "global_step": 201469, "epoch": 1199} {"train_loss": -8.664800643920898, "global_step": 201470, "epoch": 1199} {"train_loss": -10.675007820129395, "global_step": 201471, "epoch": 1199} {"train_loss": -8.761298179626465, "global_step": 201472, "epoch": 1199} {"train_loss": -10.854509353637695, "global_step": 201473, "epoch": 1199} {"train_loss": -10.235919952392578, "global_step": 201474, "epoch": 1199} {"train_loss": -9.838305473327637, "global_step": 201475, "epoch": 1199} {"train_loss": -11.447423934936523, "global_step": 201476, "epoch": 1199} {"train_loss": -10.843528747558594, "global_step": 201477, "epoch": 1199} {"train_loss": -10.323068618774414, "global_step": 201478, "epoch": 1199} {"train_loss": -9.996207237243652, "global_step": 201479, "epoch": 1199} {"train_loss": -11.046621322631836, "global_step": 201480, "epoch": 1199} {"train_loss": -10.357931137084961, "global_step": 201481, "epoch": 1199} {"train_loss": -11.109060287475586, "global_step": 201482, "epoch": 1199} {"train_loss": -10.399694442749023, "global_step": 201483, "epoch": 1199} {"train_loss": -11.066313743591309, "global_step": 201484, "epoch": 1199} {"train_loss": -10.714877128601074, "global_step": 201485, "epoch": 1199} {"train_loss": -11.193687438964844, "global_step": 201486, "epoch": 1199} {"train_loss": -10.630390167236328, "global_step": 201487, "epoch": 1199} {"train_loss": -11.222915649414062, "global_step": 201488, "epoch": 1199} {"train_loss": -10.794930458068848, "global_step": 201489, "epoch": 1199} {"train_loss": -11.033528327941895, "global_step": 201490, "epoch": 1199} {"train_loss": -11.127067565917969, "global_step": 201491, "epoch": 1199} {"train_loss": -10.940557479858398, "global_step": 201492, "epoch": 1199} {"train_loss": -10.990299224853516, "global_step": 201493, "epoch": 1199} {"train_loss": -11.303815841674805, "global_step": 201494, "epoch": 1199} {"train_loss": -11.139463424682617, "global_step": 201495, "epoch": 1199} {"train_loss": -11.143960952758789, "global_step": 201496, "epoch": 1199} {"train_loss": -11.034128189086914, "global_step": 201497, "epoch": 1199} {"train_loss": -11.129816055297852, "global_step": 201498, "epoch": 1199} {"train_loss": -11.370194435119629, "global_step": 201499, "epoch": 1199} {"train_loss": -11.013195037841797, "global_step": 201500, "epoch": 1199} {"train_loss": -11.081201553344727, "global_step": 201501, "epoch": 1199} {"train_loss": -11.314409255981445, "global_step": 201502, "epoch": 1199} {"train_loss": -11.281784057617188, "global_step": 201503, "epoch": 1199} {"train_loss": -11.034911155700684, "global_step": 201504, "epoch": 1199} {"train_loss": -11.170331001281738, "global_step": 201505, "epoch": 1199} {"train_loss": -11.273740768432617, "global_step": 201506, "epoch": 1199} {"train_loss": -11.051589965820312, "global_step": 201507, "epoch": 1199} {"train_loss": -11.108577728271484, "global_step": 201508, "epoch": 1199} {"train_loss": -10.968647003173828, "global_step": 201509, "epoch": 1199} {"train_loss": -11.045534133911133, "global_step": 201510, "epoch": 1199} {"train_loss": -11.0509672164917, "global_step": 201511, "epoch": 1199} {"train_loss": -11.309896469116211, "global_step": 201512, "epoch": 1199} {"train_loss": -10.74820327758789, "global_step": 201513, "epoch": 1199} {"train_loss": -11.299585342407227, "global_step": 201514, "epoch": 1199} {"train_loss": -11.17677116394043, "global_step": 201515, "epoch": 1199} {"train_loss": -11.27767562866211, "global_step": 201516, "epoch": 1199} {"train_loss": -11.200689315795898, "global_step": 201517, "epoch": 1199} {"train_loss": -11.228384017944336, "global_step": 201518, "epoch": 1199} {"train_loss": -11.16016960144043, "global_step": 201519, "epoch": 1199} {"train_loss": -11.320133209228516, "global_step": 201520, "epoch": 1199} {"train_loss": -10.977685928344727, "global_step": 201521, "epoch": 1199} {"train_loss": -11.506792068481445, "global_step": 201522, "epoch": 1199} {"train_loss": -11.336836814880371, "global_step": 201523, "epoch": 1199} {"train_loss": -11.20445442199707, "global_step": 201524, "epoch": 1199} {"train_loss": -11.34820556640625, "global_step": 201525, "epoch": 1199} {"train_loss": -11.231550216674805, "global_step": 201526, "epoch": 1199} {"train_loss": -11.502079963684082, "global_step": 201527, "epoch": 1199} {"train_loss": -11.2470703125, "global_step": 201528, "epoch": 1199} {"train_loss": -11.499699592590332, "global_step": 201529, "epoch": 1199} {"train_loss": -11.279108047485352, "global_step": 201530, "epoch": 1199} {"train_loss": -11.296215057373047, "global_step": 201531, "epoch": 1199} {"train_loss": -11.380900382995605, "global_step": 201532, "epoch": 1199} {"train_loss": -11.602060317993164, "global_step": 201533, "epoch": 1199} {"train_loss": -11.480029106140137, "global_step": 201534, "epoch": 1199} {"train_loss": -11.359530448913574, "global_step": 201535, "epoch": 1199} {"train_loss": -11.432426452636719, "global_step": 201536, "epoch": 1199} {"train_loss": -11.526334762573242, "global_step": 201537, "epoch": 1199} {"train_loss": -11.678810119628906, "global_step": 201538, "epoch": 1199} {"train_loss": -11.336126327514648, "global_step": 201539, "epoch": 1199} {"train_loss": -11.831888198852539, "global_step": 201540, "epoch": 1199} {"train_loss": -11.620124816894531, "global_step": 201541, "epoch": 1199} {"train_loss": -11.502464294433594, "global_step": 201542, "epoch": 1199} {"train_loss": -11.366296768188477, "global_step": 201543, "epoch": 1199} {"train_loss": -11.632242202758789, "global_step": 201544, "epoch": 1199} {"train_loss": -11.821494102478027, "global_step": 201545, "epoch": 1199} {"train_loss": -11.467220306396484, "global_step": 201546, "epoch": 1199} {"train_loss": -11.639698028564453, "global_step": 201547, "epoch": 1199} {"train_loss": -11.541898727416992, "global_step": 201548, "epoch": 1199} {"train_loss": -11.499160766601562, "global_step": 201549, "epoch": 1199} {"train_loss": -11.430012702941895, "global_step": 201550, "epoch": 1199} {"train_loss": -11.635787963867188, "global_step": 201551, "epoch": 1199} {"train_loss": -11.539569854736328, "global_step": 201552, "epoch": 1199} {"train_loss": -11.44627857208252, "global_step": 201553, "epoch": 1199} {"train_loss": -11.609916687011719, "global_step": 201554, "epoch": 1199} {"train_loss": -11.593086242675781, "global_step": 201555, "epoch": 1199} {"train_loss": -11.650142669677734, "global_step": 201556, "epoch": 1199} {"train_loss": -11.551578521728516, "global_step": 201557, "epoch": 1199} {"train_loss": -11.635009765625, "global_step": 201558, "epoch": 1199} {"train_loss": -11.743122100830078, "global_step": 201559, "epoch": 1199} {"train_loss": -11.821887969970703, "global_step": 201560, "epoch": 1199} {"train_loss": -11.593500137329102, "global_step": 201561, "epoch": 1199} {"train_loss": -11.597310066223145, "global_step": 201562, "epoch": 1199} {"train_loss": -11.212334632873535, "global_step": 201563, "epoch": 1199} {"train_loss": -11.325929641723633, "global_step": 201564, "epoch": 1199} {"train_loss": -11.055912017822266, "global_step": 201565, "epoch": 1199} {"train_loss": -11.124641418457031, "global_step": 201566, "epoch": 1199} {"train_loss": -11.018044471740723, "global_step": 201567, "epoch": 1199} {"train_loss": -11.461271286010742, "global_step": 201568, "epoch": 1199} {"train_loss": -11.682689666748047, "global_step": 201569, "epoch": 1199} {"train_loss": -11.503449440002441, "global_step": 201570, "epoch": 1199} {"train_loss": -11.657001495361328, "global_step": 201571, "epoch": 1199} {"train_loss": -11.670537948608398, "global_step": 201572, "epoch": 1199} {"train_loss": -11.656962394714355, "global_step": 201573, "epoch": 1199} {"train_loss": -11.692941665649414, "global_step": 201574, "epoch": 1199} {"train_loss": -11.635368347167969, "global_step": 201575, "epoch": 1199} {"train_loss": -11.902261734008789, "global_step": 201576, "epoch": 1199} {"train_loss": -11.707616806030273, "global_step": 201577, "epoch": 1199} {"train_loss": -11.752585411071777, "global_step": 201578, "epoch": 1199} {"train_loss": -11.818502426147461, "global_step": 201579, "epoch": 1199} {"train_loss": -11.775824546813965, "global_step": 201580, "epoch": 1199} {"train_loss": -11.656526565551758, "global_step": 201581, "epoch": 1199} {"train_loss": -11.542614936828613, "global_step": 201582, "epoch": 1199} {"train_loss": -11.461148262023926, "global_step": 201583, "epoch": 1199} {"train_loss": -11.513041496276855, "global_step": 201584, "epoch": 1199} {"train_loss": -10.902673721313477, "global_step": 201585, "epoch": 1199} {"train_loss": -11.639776229858398, "global_step": 201586, "epoch": 1199} {"train_loss": -11.764893531799316, "global_step": 201587, "epoch": 1199} {"train_loss": -11.414319038391113, "global_step": 201588, "epoch": 1199} {"train_loss": -10.859696388244629, "global_step": 201589, "epoch": 1199} {"train_loss": -11.567832946777344, "global_step": 201590, "epoch": 1199} {"train_loss": -11.21944808959961, "global_step": 201591, "epoch": 1199} {"train_loss": -11.068986892700195, "global_step": 201592, "epoch": 1199} {"train_loss": -10.361013412475586, "global_step": 201593, "epoch": 1199} {"train_loss": -11.067911148071289, "global_step": 201594, "epoch": 1199} {"train_loss": -11.53245735168457, "global_step": 201595, "epoch": 1199} {"train_loss": -11.481521606445312, "global_step": 201596, "epoch": 1199} {"train_loss": -10.812609672546387, "global_step": 201597, "epoch": 1199} {"train_loss": -11.15522575378418, "global_step": 201598, "epoch": 1199} {"train_loss": -11.263655946368264, "global_step": 201599, "epoch": 1199, "val_loss": 253256.03125} {"train_loss": -9.79471206665039, "global_step": 201600, "epoch": 1200} {"train_loss": -10.704672813415527, "global_step": 201601, "epoch": 1200} {"train_loss": -10.87966537475586, "global_step": 201602, "epoch": 1200} {"train_loss": -9.76471996307373, "global_step": 201603, "epoch": 1200} {"train_loss": -10.873800277709961, "global_step": 201604, "epoch": 1200} {"train_loss": -11.016301155090332, "global_step": 201605, "epoch": 1200} {"train_loss": -10.229928970336914, "global_step": 201606, "epoch": 1200} {"train_loss": -11.23155689239502, "global_step": 201607, "epoch": 1200} {"train_loss": -10.20486831665039, "global_step": 201608, "epoch": 1200} {"train_loss": -11.038820266723633, "global_step": 201609, "epoch": 1200} {"train_loss": -10.558375358581543, "global_step": 201610, "epoch": 1200} {"train_loss": -11.164600372314453, "global_step": 201611, "epoch": 1200} {"train_loss": -11.084507942199707, "global_step": 201612, "epoch": 1200} {"train_loss": -11.051753997802734, "global_step": 201613, "epoch": 1200} {"train_loss": -11.106742858886719, "global_step": 201614, "epoch": 1200} {"train_loss": -10.417203903198242, "global_step": 201615, "epoch": 1200} {"train_loss": -11.467093467712402, "global_step": 201616, "epoch": 1200} {"train_loss": -10.946535110473633, "global_step": 201617, "epoch": 1200} {"train_loss": -11.062298774719238, "global_step": 201618, "epoch": 1200} {"train_loss": -11.273892402648926, "global_step": 201619, "epoch": 1200} {"train_loss": -11.188714981079102, "global_step": 201620, "epoch": 1200} {"train_loss": -11.16831111907959, "global_step": 201621, "epoch": 1200} {"train_loss": -11.250801086425781, "global_step": 201622, "epoch": 1200} {"train_loss": -11.086474418640137, "global_step": 201623, "epoch": 1200} {"train_loss": -11.285823822021484, "global_step": 201624, "epoch": 1200} {"train_loss": -11.248945236206055, "global_step": 201625, "epoch": 1200} {"train_loss": -10.933517456054688, "global_step": 201626, "epoch": 1200} {"train_loss": -11.352132797241211, "global_step": 201627, "epoch": 1200} {"train_loss": -11.388856887817383, "global_step": 201628, "epoch": 1200} {"train_loss": -11.364849090576172, "global_step": 201629, "epoch": 1200} {"train_loss": -11.513411521911621, "global_step": 201630, "epoch": 1200} {"train_loss": -11.514154434204102, "global_step": 201631, "epoch": 1200} {"train_loss": -11.509328842163086, "global_step": 201632, "epoch": 1200} {"train_loss": -11.439918518066406, "global_step": 201633, "epoch": 1200} {"train_loss": -11.461334228515625, "global_step": 201634, "epoch": 1200} {"train_loss": -11.519583702087402, "global_step": 201635, "epoch": 1200} {"train_loss": -11.71186351776123, "global_step": 201636, "epoch": 1200} {"train_loss": -11.422754287719727, "global_step": 201637, "epoch": 1200} {"train_loss": -11.490076065063477, "global_step": 201638, "epoch": 1200} {"train_loss": -11.095996856689453, "global_step": 201639, "epoch": 1200} {"train_loss": -11.494162559509277, "global_step": 201640, "epoch": 1200} {"train_loss": -11.304182052612305, "global_step": 201641, "epoch": 1200} {"train_loss": -11.53724479675293, "global_step": 201642, "epoch": 1200} {"train_loss": -11.36998176574707, "global_step": 201643, "epoch": 1200} {"train_loss": -11.530097961425781, "global_step": 201644, "epoch": 1200} {"train_loss": -11.369242668151855, "global_step": 201645, "epoch": 1200} {"train_loss": -11.44161605834961, "global_step": 201646, "epoch": 1200} {"train_loss": -11.621017456054688, "global_step": 201647, "epoch": 1200} {"train_loss": -11.51876163482666, "global_step": 201648, "epoch": 1200} {"train_loss": -11.680198669433594, "global_step": 201649, "epoch": 1200} {"train_loss": -11.509211540222168, "global_step": 201650, "epoch": 1200} {"train_loss": -11.677591323852539, "global_step": 201651, "epoch": 1200} {"train_loss": -11.410906791687012, "global_step": 201652, "epoch": 1200} {"train_loss": -11.547032356262207, "global_step": 201653, "epoch": 1200} {"train_loss": -11.736114501953125, "global_step": 201654, "epoch": 1200} {"train_loss": -11.474228858947754, "global_step": 201655, "epoch": 1200} {"train_loss": -11.584545135498047, "global_step": 201656, "epoch": 1200} {"train_loss": -11.682357788085938, "global_step": 201657, "epoch": 1200} {"train_loss": -11.550809860229492, "global_step": 201658, "epoch": 1200} {"train_loss": -11.828269958496094, "global_step": 201659, "epoch": 1200} {"train_loss": -11.376115798950195, "global_step": 201660, "epoch": 1200} {"train_loss": -11.569635391235352, "global_step": 201661, "epoch": 1200} {"train_loss": -11.56256103515625, "global_step": 201662, "epoch": 1200} {"train_loss": -11.60925006866455, "global_step": 201663, "epoch": 1200} {"train_loss": -11.807376861572266, "global_step": 201664, "epoch": 1200} {"train_loss": -11.751712799072266, "global_step": 201665, "epoch": 1200} {"train_loss": -11.693534851074219, "global_step": 201666, "epoch": 1200} {"train_loss": -11.663761138916016, "global_step": 201667, "epoch": 1200} {"train_loss": -11.523415565490723, "global_step": 201668, "epoch": 1200} {"train_loss": -11.645691871643066, "global_step": 201669, "epoch": 1200} {"train_loss": -11.456827163696289, "global_step": 201670, "epoch": 1200} {"train_loss": -11.640335083007812, "global_step": 201671, "epoch": 1200} {"train_loss": -11.483205795288086, "global_step": 201672, "epoch": 1200} {"train_loss": -11.774161338806152, "global_step": 201673, "epoch": 1200} {"train_loss": -11.457332611083984, "global_step": 201674, "epoch": 1200} {"train_loss": -11.580718994140625, "global_step": 201675, "epoch": 1200} {"train_loss": -11.598859786987305, "global_step": 201676, "epoch": 1200} {"train_loss": -11.71343994140625, "global_step": 201677, "epoch": 1200} {"train_loss": -11.322229385375977, "global_step": 201678, "epoch": 1200} {"train_loss": -11.290583610534668, "global_step": 201679, "epoch": 1200} {"train_loss": -11.15170955657959, "global_step": 201680, "epoch": 1200} {"train_loss": -11.327083587646484, "global_step": 201681, "epoch": 1200} {"train_loss": -10.937664031982422, "global_step": 201682, "epoch": 1200} {"train_loss": -11.146689414978027, "global_step": 201683, "epoch": 1200} {"train_loss": -11.097875595092773, "global_step": 201684, "epoch": 1200} {"train_loss": -10.02180290222168, "global_step": 201685, "epoch": 1200} {"train_loss": -11.048221588134766, "global_step": 201686, "epoch": 1200} {"train_loss": -10.844779968261719, "global_step": 201687, "epoch": 1200} {"train_loss": -10.02981185913086, "global_step": 201688, "epoch": 1200} {"train_loss": -10.96336555480957, "global_step": 201689, "epoch": 1200} {"train_loss": -10.482965469360352, "global_step": 201690, "epoch": 1200} {"train_loss": -11.112442016601562, "global_step": 201691, "epoch": 1200} {"train_loss": -10.750106811523438, "global_step": 201692, "epoch": 1200} {"train_loss": -10.688541412353516, "global_step": 201693, "epoch": 1200} {"train_loss": -10.994810104370117, "global_step": 201694, "epoch": 1200} {"train_loss": -10.556394577026367, "global_step": 201695, "epoch": 1200} {"train_loss": -10.344058990478516, "global_step": 201696, "epoch": 1200} {"train_loss": -11.109050750732422, "global_step": 201697, "epoch": 1200} {"train_loss": -9.675985336303711, "global_step": 201698, "epoch": 1200} {"train_loss": -11.254606246948242, "global_step": 201699, "epoch": 1200} {"train_loss": -10.127727508544922, "global_step": 201700, "epoch": 1200} {"train_loss": -11.027666091918945, "global_step": 201701, "epoch": 1200} {"train_loss": -10.328180313110352, "global_step": 201702, "epoch": 1200} {"train_loss": -11.26472282409668, "global_step": 201703, "epoch": 1200} {"train_loss": -10.059076309204102, "global_step": 201704, "epoch": 1200} {"train_loss": -10.76612663269043, "global_step": 201705, "epoch": 1200} {"train_loss": -10.094663619995117, "global_step": 201706, "epoch": 1200} {"train_loss": -10.639352798461914, "global_step": 201707, "epoch": 1200} {"train_loss": -10.623666763305664, "global_step": 201708, "epoch": 1200} {"train_loss": -10.633262634277344, "global_step": 201709, "epoch": 1200} {"train_loss": -11.06743049621582, "global_step": 201710, "epoch": 1200} {"train_loss": -10.613718032836914, "global_step": 201711, "epoch": 1200} {"train_loss": -11.124234199523926, "global_step": 201712, "epoch": 1200} {"train_loss": -10.956807136535645, "global_step": 201713, "epoch": 1200} {"train_loss": -10.879298210144043, "global_step": 201714, "epoch": 1200} {"train_loss": -11.074251174926758, "global_step": 201715, "epoch": 1200} {"train_loss": -11.140454292297363, "global_step": 201716, "epoch": 1200} {"train_loss": -11.180866241455078, "global_step": 201717, "epoch": 1200} {"train_loss": -11.160555839538574, "global_step": 201718, "epoch": 1200} {"train_loss": -11.241087913513184, "global_step": 201719, "epoch": 1200} {"train_loss": -11.15855598449707, "global_step": 201720, "epoch": 1200} {"train_loss": -11.335689544677734, "global_step": 201721, "epoch": 1200} {"train_loss": -11.398276329040527, "global_step": 201722, "epoch": 1200} {"train_loss": -11.3338623046875, "global_step": 201723, "epoch": 1200} {"train_loss": -11.380046844482422, "global_step": 201724, "epoch": 1200} {"train_loss": -11.430702209472656, "global_step": 201725, "epoch": 1200} {"train_loss": -11.424259185791016, "global_step": 201726, "epoch": 1200} {"train_loss": -11.30764389038086, "global_step": 201727, "epoch": 1200} {"train_loss": -11.424592971801758, "global_step": 201728, "epoch": 1200} {"train_loss": -11.45444107055664, "global_step": 201729, "epoch": 1200} {"train_loss": -11.383916854858398, "global_step": 201730, "epoch": 1200} {"train_loss": -11.594815254211426, "global_step": 201731, "epoch": 1200} {"train_loss": -11.219493865966797, "global_step": 201732, "epoch": 1200} {"train_loss": -11.252351760864258, "global_step": 201733, "epoch": 1200} {"train_loss": -11.537630081176758, "global_step": 201734, "epoch": 1200} {"train_loss": -11.6257905960083, "global_step": 201735, "epoch": 1200} {"train_loss": -11.552501678466797, "global_step": 201736, "epoch": 1200} {"train_loss": -11.72743034362793, "global_step": 201737, "epoch": 1200} {"train_loss": -11.405678749084473, "global_step": 201738, "epoch": 1200} {"train_loss": -11.683900833129883, "global_step": 201739, "epoch": 1200} {"train_loss": -11.338309288024902, "global_step": 201740, "epoch": 1200} {"train_loss": -11.570067405700684, "global_step": 201741, "epoch": 1200} {"train_loss": -11.617708206176758, "global_step": 201742, "epoch": 1200} {"train_loss": -11.766935348510742, "global_step": 201743, "epoch": 1200} {"train_loss": -11.679625511169434, "global_step": 201744, "epoch": 1200} {"train_loss": -11.5447998046875, "global_step": 201745, "epoch": 1200} {"train_loss": -11.64066219329834, "global_step": 201746, "epoch": 1200} {"train_loss": -11.661705017089844, "global_step": 201747, "epoch": 1200} {"train_loss": -11.684931755065918, "global_step": 201748, "epoch": 1200} {"train_loss": -11.55784797668457, "global_step": 201749, "epoch": 1200} {"train_loss": -11.735285758972168, "global_step": 201750, "epoch": 1200} {"train_loss": -11.48312759399414, "global_step": 201751, "epoch": 1200} {"train_loss": -11.840085983276367, "global_step": 201752, "epoch": 1200} {"train_loss": -11.821507453918457, "global_step": 201753, "epoch": 1200} {"train_loss": -11.811670303344727, "global_step": 201754, "epoch": 1200} {"train_loss": -11.74666976928711, "global_step": 201755, "epoch": 1200} {"train_loss": -11.724702835083008, "global_step": 201756, "epoch": 1200} {"train_loss": -11.84532642364502, "global_step": 201757, "epoch": 1200} {"train_loss": -11.78636646270752, "global_step": 201758, "epoch": 1200} {"train_loss": -11.474555015563965, "global_step": 201759, "epoch": 1200} {"train_loss": -11.535002708435059, "global_step": 201760, "epoch": 1200} {"train_loss": -11.667917251586914, "global_step": 201761, "epoch": 1200} {"train_loss": -11.385448455810547, "global_step": 201762, "epoch": 1200} {"train_loss": -11.668015480041504, "global_step": 201763, "epoch": 1200} {"train_loss": -11.661214828491211, "global_step": 201764, "epoch": 1200} {"train_loss": -11.711074829101562, "global_step": 201765, "epoch": 1200} {"train_loss": -11.651594161987305, "global_step": 201766, "epoch": 1200} {"train_loss": -11.259951744760786, "global_step": 201767, "epoch": 1200, "train/sim_max_reward_0": 0.9629567694290374, "train/sim_max_reward_1": 0.9738595725731262, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.16546820706372606, "train/sim_max_reward_4": 0.9604723131170863, "train/sim_max_reward_5": 0.5539358324121834, "test/sim_max_reward_4400000": 0.3934504880154055, "test/sim_max_reward_4400001": 0.9781174223851627, "test/sim_max_reward_4400002": 0.9887395630862211, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.40683602962530063, "test/sim_max_reward_4400005": 0.8606578488451337, "test/sim_max_reward_4400006": 0.6347774439693976, "test/sim_max_reward_4400007": 0.43771254433263, "test/sim_max_reward_4400008": 0.6005357510632192, "test/sim_max_reward_4400009": 0.39041200249603986, "test/sim_max_reward_4400010": 0.9636137582512565, "test/sim_max_reward_4400011": 0.8682506673217307, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.8798243628894403, "test/sim_max_reward_4400014": 0.9906947291367098, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.366709822858876, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 0.40346067140165826, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.6051709690138487, "test/sim_max_reward_4400022": 0.9947618990542316, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.9693330872926486, "test/sim_max_reward_4400025": 0.5138179859960181, "test/sim_max_reward_4400026": 0.04514995103869517, "test/sim_max_reward_4400027": 1.0, "test/sim_max_reward_4400028": 0.6946155595080802, "test/sim_max_reward_4400029": 0.43857488211473594, "test/sim_max_reward_4400030": 0.9735699509546216, "test/sim_max_reward_4400031": 0.9887481475944254, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.4545028341045362, "test/sim_max_reward_4400034": 0.48257787432699073, "test/sim_max_reward_4400035": 0.2853917399459123, "test/sim_max_reward_4400036": 0.36658192267058587, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.9753249302264748, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9748475051882542, "test/sim_max_reward_4400042": 0.9640986946960534, "test/sim_max_reward_4400043": 0.9923108351042945, "test/sim_max_reward_4400044": 0.9356166489258405, "test/sim_max_reward_4400045": 0.5675719205557008, "test/sim_max_reward_4400046": 0.3036101496260848, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6027821157658598, "test/mean_score": 0.5938036203844508, "val_loss": 250883.03125, "train_action_mse_error": 0.22270339727401733} {"train_loss": -11.663249969482422, "global_step": 201768, "epoch": 1201} {"train_loss": -11.50166130065918, "global_step": 201769, "epoch": 1201} {"train_loss": -11.824441909790039, "global_step": 201770, "epoch": 1201} {"train_loss": -11.449430465698242, "global_step": 201771, "epoch": 1201} {"train_loss": -11.328391075134277, "global_step": 201772, "epoch": 1201} {"train_loss": -11.119214057922363, "global_step": 201773, "epoch": 1201} {"train_loss": -11.777799606323242, "global_step": 201774, "epoch": 1201} {"train_loss": -10.690122604370117, "global_step": 201775, "epoch": 1201} {"train_loss": -10.679777145385742, "global_step": 201776, "epoch": 1201} {"train_loss": -10.508222579956055, "global_step": 201777, "epoch": 1201} {"train_loss": -11.303812980651855, "global_step": 201778, "epoch": 1201} {"train_loss": -11.19473934173584, "global_step": 201779, "epoch": 1201} {"train_loss": -11.240665435791016, "global_step": 201780, "epoch": 1201} {"train_loss": -11.448650360107422, "global_step": 201781, "epoch": 1201} {"train_loss": -10.91816520690918, "global_step": 201782, "epoch": 1201} {"train_loss": -11.344375610351562, "global_step": 201783, "epoch": 1201} {"train_loss": -11.574460983276367, "global_step": 201784, "epoch": 1201} {"train_loss": -11.364940643310547, "global_step": 201785, "epoch": 1201} {"train_loss": -11.65648078918457, "global_step": 201786, "epoch": 1201} {"train_loss": -11.625420570373535, "global_step": 201787, "epoch": 1201} {"train_loss": -11.531072616577148, "global_step": 201788, "epoch": 1201} {"train_loss": -11.462618827819824, "global_step": 201789, "epoch": 1201} {"train_loss": -11.350446701049805, "global_step": 201790, "epoch": 1201} {"train_loss": -11.62069320678711, "global_step": 201791, "epoch": 1201} {"train_loss": -11.58552360534668, "global_step": 201792, "epoch": 1201} {"train_loss": -11.366750717163086, "global_step": 201793, "epoch": 1201} {"train_loss": -11.576353073120117, "global_step": 201794, "epoch": 1201} {"train_loss": -11.308414459228516, "global_step": 201795, "epoch": 1201} {"train_loss": -11.24913215637207, "global_step": 201796, "epoch": 1201} {"train_loss": -10.993830680847168, "global_step": 201797, "epoch": 1201} {"train_loss": -11.364742279052734, "global_step": 201798, "epoch": 1201} {"train_loss": -11.264909744262695, "global_step": 201799, "epoch": 1201} {"train_loss": -10.931290626525879, "global_step": 201800, "epoch": 1201} {"train_loss": -11.251367568969727, "global_step": 201801, "epoch": 1201} {"train_loss": -11.463472366333008, "global_step": 201802, "epoch": 1201} {"train_loss": -11.546516418457031, "global_step": 201803, "epoch": 1201} {"train_loss": -11.223753929138184, "global_step": 201804, "epoch": 1201} {"train_loss": -11.293177604675293, "global_step": 201805, "epoch": 1201} {"train_loss": -11.23970890045166, "global_step": 201806, "epoch": 1201} {"train_loss": -11.036882400512695, "global_step": 201807, "epoch": 1201} {"train_loss": -11.399086952209473, "global_step": 201808, "epoch": 1201} {"train_loss": -11.136713027954102, "global_step": 201809, "epoch": 1201} {"train_loss": -11.31768798828125, "global_step": 201810, "epoch": 1201} {"train_loss": -11.636920928955078, "global_step": 201811, "epoch": 1201} {"train_loss": -11.134244918823242, "global_step": 201812, "epoch": 1201} {"train_loss": -11.410162925720215, "global_step": 201813, "epoch": 1201} {"train_loss": -11.401137351989746, "global_step": 201814, "epoch": 1201} {"train_loss": -11.125059127807617, "global_step": 201815, "epoch": 1201} {"train_loss": -11.504680633544922, "global_step": 201816, "epoch": 1201} {"train_loss": -11.518035888671875, "global_step": 201817, "epoch": 1201} {"train_loss": -11.35936164855957, "global_step": 201818, "epoch": 1201} {"train_loss": -11.568035125732422, "global_step": 201819, "epoch": 1201} {"train_loss": -11.409684181213379, "global_step": 201820, "epoch": 1201} {"train_loss": -11.018003463745117, "global_step": 201821, "epoch": 1201} {"train_loss": -11.665233612060547, "global_step": 201822, "epoch": 1201} {"train_loss": -11.681028366088867, "global_step": 201823, "epoch": 1201} {"train_loss": -11.604272842407227, "global_step": 201824, "epoch": 1201} {"train_loss": -11.395820617675781, "global_step": 201825, "epoch": 1201} {"train_loss": -11.136709213256836, "global_step": 201826, "epoch": 1201} {"train_loss": -11.22455883026123, "global_step": 201827, "epoch": 1201} {"train_loss": -10.905686378479004, "global_step": 201828, "epoch": 1201} {"train_loss": -11.178812026977539, "global_step": 201829, "epoch": 1201} {"train_loss": -11.037678718566895, "global_step": 201830, "epoch": 1201} {"train_loss": -11.232746124267578, "global_step": 201831, "epoch": 1201} {"train_loss": -10.664192199707031, "global_step": 201832, "epoch": 1201} {"train_loss": -10.65347957611084, "global_step": 201833, "epoch": 1201} {"train_loss": -11.14630126953125, "global_step": 201834, "epoch": 1201} {"train_loss": -10.725701332092285, "global_step": 201835, "epoch": 1201} {"train_loss": -11.50248908996582, "global_step": 201836, "epoch": 1201} {"train_loss": -10.617148399353027, "global_step": 201837, "epoch": 1201} {"train_loss": -11.438387870788574, "global_step": 201838, "epoch": 1201} {"train_loss": -11.026468276977539, "global_step": 201839, "epoch": 1201} {"train_loss": -11.249610900878906, "global_step": 201840, "epoch": 1201} {"train_loss": -10.942109107971191, "global_step": 201841, "epoch": 1201} {"train_loss": -11.318239212036133, "global_step": 201842, "epoch": 1201} {"train_loss": -11.077658653259277, "global_step": 201843, "epoch": 1201} {"train_loss": -11.53363037109375, "global_step": 201844, "epoch": 1201} {"train_loss": -10.910295486450195, "global_step": 201845, "epoch": 1201} {"train_loss": -10.993377685546875, "global_step": 201846, "epoch": 1201} {"train_loss": -11.45930290222168, "global_step": 201847, "epoch": 1201} {"train_loss": -11.125604629516602, "global_step": 201848, "epoch": 1201} {"train_loss": -10.883587837219238, "global_step": 201849, "epoch": 1201} {"train_loss": -11.446507453918457, "global_step": 201850, "epoch": 1201} {"train_loss": -11.063488006591797, "global_step": 201851, "epoch": 1201} {"train_loss": -11.47836685180664, "global_step": 201852, "epoch": 1201} {"train_loss": -11.068902015686035, "global_step": 201853, "epoch": 1201} {"train_loss": -11.065362930297852, "global_step": 201854, "epoch": 1201} {"train_loss": -11.22372817993164, "global_step": 201855, "epoch": 1201} {"train_loss": -11.415735244750977, "global_step": 201856, "epoch": 1201} {"train_loss": -11.351516723632812, "global_step": 201857, "epoch": 1201} {"train_loss": -10.972278594970703, "global_step": 201858, "epoch": 1201} {"train_loss": -11.276117324829102, "global_step": 201859, "epoch": 1201} {"train_loss": -11.162869453430176, "global_step": 201860, "epoch": 1201} {"train_loss": -10.919574737548828, "global_step": 201861, "epoch": 1201} {"train_loss": -11.011472702026367, "global_step": 201862, "epoch": 1201} {"train_loss": -11.083017349243164, "global_step": 201863, "epoch": 1201} {"train_loss": -10.72024154663086, "global_step": 201864, "epoch": 1201} {"train_loss": -10.860944747924805, "global_step": 201865, "epoch": 1201} {"train_loss": -9.634330749511719, "global_step": 201866, "epoch": 1201} {"train_loss": -10.5491304397583, "global_step": 201867, "epoch": 1201} {"train_loss": -10.384737014770508, "global_step": 201868, "epoch": 1201} {"train_loss": -10.554034233093262, "global_step": 201869, "epoch": 1201} {"train_loss": -10.522249221801758, "global_step": 201870, "epoch": 1201} {"train_loss": -10.384580612182617, "global_step": 201871, "epoch": 1201} {"train_loss": -10.420656204223633, "global_step": 201872, "epoch": 1201} {"train_loss": -10.25439167022705, "global_step": 201873, "epoch": 1201} {"train_loss": -10.820663452148438, "global_step": 201874, "epoch": 1201} {"train_loss": -9.264215469360352, "global_step": 201875, "epoch": 1201} {"train_loss": -11.202677726745605, "global_step": 201876, "epoch": 1201} {"train_loss": -10.128485679626465, "global_step": 201877, "epoch": 1201} {"train_loss": -10.830209732055664, "global_step": 201878, "epoch": 1201} {"train_loss": -9.490850448608398, "global_step": 201879, "epoch": 1201} {"train_loss": -10.990898132324219, "global_step": 201880, "epoch": 1201} {"train_loss": -9.859399795532227, "global_step": 201881, "epoch": 1201} {"train_loss": -10.914155960083008, "global_step": 201882, "epoch": 1201} {"train_loss": -10.376276016235352, "global_step": 201883, "epoch": 1201} {"train_loss": -10.484703063964844, "global_step": 201884, "epoch": 1201} {"train_loss": -10.59503173828125, "global_step": 201885, "epoch": 1201} {"train_loss": -10.392597198486328, "global_step": 201886, "epoch": 1201} {"train_loss": -10.733650207519531, "global_step": 201887, "epoch": 1201} {"train_loss": -11.08162784576416, "global_step": 201888, "epoch": 1201} {"train_loss": -11.017361640930176, "global_step": 201889, "epoch": 1201} {"train_loss": -11.14965534210205, "global_step": 201890, "epoch": 1201} {"train_loss": -11.427248001098633, "global_step": 201891, "epoch": 1201} {"train_loss": -11.033595085144043, "global_step": 201892, "epoch": 1201} {"train_loss": -11.306294441223145, "global_step": 201893, "epoch": 1201} {"train_loss": -11.204214096069336, "global_step": 201894, "epoch": 1201} {"train_loss": -11.163601875305176, "global_step": 201895, "epoch": 1201} {"train_loss": -11.108827590942383, "global_step": 201896, "epoch": 1201} {"train_loss": -11.2552490234375, "global_step": 201897, "epoch": 1201} {"train_loss": -11.185264587402344, "global_step": 201898, "epoch": 1201} {"train_loss": -11.432829856872559, "global_step": 201899, "epoch": 1201} {"train_loss": -11.078431129455566, "global_step": 201900, "epoch": 1201} {"train_loss": -11.359742164611816, "global_step": 201901, "epoch": 1201} {"train_loss": -11.374889373779297, "global_step": 201902, "epoch": 1201} {"train_loss": -11.294429779052734, "global_step": 201903, "epoch": 1201} {"train_loss": -11.37356185913086, "global_step": 201904, "epoch": 1201} {"train_loss": -11.456377029418945, "global_step": 201905, "epoch": 1201} {"train_loss": -11.544167518615723, "global_step": 201906, "epoch": 1201} {"train_loss": -11.482664108276367, "global_step": 201907, "epoch": 1201} {"train_loss": -11.473555564880371, "global_step": 201908, "epoch": 1201} {"train_loss": -11.573463439941406, "global_step": 201909, "epoch": 1201} {"train_loss": -11.604080200195312, "global_step": 201910, "epoch": 1201} {"train_loss": -11.553933143615723, "global_step": 201911, "epoch": 1201} {"train_loss": -11.583198547363281, "global_step": 201912, "epoch": 1201} {"train_loss": -11.559160232543945, "global_step": 201913, "epoch": 1201} {"train_loss": -11.713359832763672, "global_step": 201914, "epoch": 1201} {"train_loss": -11.621635437011719, "global_step": 201915, "epoch": 1201} {"train_loss": -11.720283508300781, "global_step": 201916, "epoch": 1201} {"train_loss": -11.607048034667969, "global_step": 201917, "epoch": 1201} {"train_loss": -11.63170051574707, "global_step": 201918, "epoch": 1201} {"train_loss": -11.602640151977539, "global_step": 201919, "epoch": 1201} {"train_loss": -11.655280113220215, "global_step": 201920, "epoch": 1201} {"train_loss": -11.636987686157227, "global_step": 201921, "epoch": 1201} {"train_loss": -11.693527221679688, "global_step": 201922, "epoch": 1201} {"train_loss": -11.646425247192383, "global_step": 201923, "epoch": 1201} {"train_loss": -11.703153610229492, "global_step": 201924, "epoch": 1201} {"train_loss": -11.601884841918945, "global_step": 201925, "epoch": 1201} {"train_loss": -11.590222358703613, "global_step": 201926, "epoch": 1201} {"train_loss": -11.747359275817871, "global_step": 201927, "epoch": 1201} {"train_loss": -11.635889053344727, "global_step": 201928, "epoch": 1201} {"train_loss": -11.801424026489258, "global_step": 201929, "epoch": 1201} {"train_loss": -11.616076469421387, "global_step": 201930, "epoch": 1201} {"train_loss": -11.79765510559082, "global_step": 201931, "epoch": 1201} {"train_loss": -11.539407730102539, "global_step": 201932, "epoch": 1201} {"train_loss": -11.812530517578125, "global_step": 201933, "epoch": 1201} {"train_loss": -11.603958129882812, "global_step": 201934, "epoch": 1201} {"train_loss": -11.20401140054067, "global_step": 201935, "epoch": 1201, "val_loss": 255169.515625} {"train_loss": -11.598716735839844, "global_step": 201936, "epoch": 1202} {"train_loss": -11.163078308105469, "global_step": 201937, "epoch": 1202} {"train_loss": -11.501779556274414, "global_step": 201938, "epoch": 1202} {"train_loss": -11.721813201904297, "global_step": 201939, "epoch": 1202} {"train_loss": -11.175697326660156, "global_step": 201940, "epoch": 1202} {"train_loss": -11.628501892089844, "global_step": 201941, "epoch": 1202} {"train_loss": -11.540727615356445, "global_step": 201942, "epoch": 1202} {"train_loss": -11.439300537109375, "global_step": 201943, "epoch": 1202} {"train_loss": -11.690603256225586, "global_step": 201944, "epoch": 1202} {"train_loss": -11.405338287353516, "global_step": 201945, "epoch": 1202} {"train_loss": -11.708473205566406, "global_step": 201946, "epoch": 1202} {"train_loss": -11.239814758300781, "global_step": 201947, "epoch": 1202} {"train_loss": -11.4041109085083, "global_step": 201948, "epoch": 1202} {"train_loss": -11.694940567016602, "global_step": 201949, "epoch": 1202} {"train_loss": -11.21847915649414, "global_step": 201950, "epoch": 1202} {"train_loss": -11.68588638305664, "global_step": 201951, "epoch": 1202} {"train_loss": -11.611333847045898, "global_step": 201952, "epoch": 1202} {"train_loss": -11.476757049560547, "global_step": 201953, "epoch": 1202} {"train_loss": -11.687512397766113, "global_step": 201954, "epoch": 1202} {"train_loss": -11.378850936889648, "global_step": 201955, "epoch": 1202} {"train_loss": -11.437603950500488, "global_step": 201956, "epoch": 1202} {"train_loss": -11.885724067687988, "global_step": 201957, "epoch": 1202} {"train_loss": -11.55392074584961, "global_step": 201958, "epoch": 1202} {"train_loss": -11.854837417602539, "global_step": 201959, "epoch": 1202} {"train_loss": -11.818357467651367, "global_step": 201960, "epoch": 1202} {"train_loss": -11.728105545043945, "global_step": 201961, "epoch": 1202} {"train_loss": -11.592445373535156, "global_step": 201962, "epoch": 1202} {"train_loss": -11.486751556396484, "global_step": 201963, "epoch": 1202} {"train_loss": -11.372321128845215, "global_step": 201964, "epoch": 1202} {"train_loss": -11.468515396118164, "global_step": 201965, "epoch": 1202} {"train_loss": -11.161733627319336, "global_step": 201966, "epoch": 1202} {"train_loss": -11.606313705444336, "global_step": 201967, "epoch": 1202} {"train_loss": -11.442835807800293, "global_step": 201968, "epoch": 1202} {"train_loss": -11.643363952636719, "global_step": 201969, "epoch": 1202} {"train_loss": -11.453445434570312, "global_step": 201970, "epoch": 1202} {"train_loss": -11.605327606201172, "global_step": 201971, "epoch": 1202} {"train_loss": -11.046470642089844, "global_step": 201972, "epoch": 1202} {"train_loss": -11.4520845413208, "global_step": 201973, "epoch": 1202} {"train_loss": -11.176715850830078, "global_step": 201974, "epoch": 1202} {"train_loss": -11.393202781677246, "global_step": 201975, "epoch": 1202} {"train_loss": -11.41036605834961, "global_step": 201976, "epoch": 1202} {"train_loss": -11.333539962768555, "global_step": 201977, "epoch": 1202} {"train_loss": -10.852744102478027, "global_step": 201978, "epoch": 1202} {"train_loss": -10.453767776489258, "global_step": 201979, "epoch": 1202} {"train_loss": -8.329855918884277, "global_step": 201980, "epoch": 1202} {"train_loss": -11.3165283203125, "global_step": 201981, "epoch": 1202} {"train_loss": -10.315685272216797, "global_step": 201982, "epoch": 1202} {"train_loss": -9.842529296875, "global_step": 201983, "epoch": 1202} {"train_loss": -10.70423698425293, "global_step": 201984, "epoch": 1202} {"train_loss": -10.86538314819336, "global_step": 201985, "epoch": 1202} {"train_loss": -10.576144218444824, "global_step": 201986, "epoch": 1202} {"train_loss": -11.065696716308594, "global_step": 201987, "epoch": 1202} {"train_loss": -10.32444953918457, "global_step": 201988, "epoch": 1202} {"train_loss": -10.506674766540527, "global_step": 201989, "epoch": 1202} {"train_loss": -11.000332832336426, "global_step": 201990, "epoch": 1202} {"train_loss": -11.061027526855469, "global_step": 201991, "epoch": 1202} {"train_loss": -11.097662925720215, "global_step": 201992, "epoch": 1202} {"train_loss": -11.232608795166016, "global_step": 201993, "epoch": 1202} {"train_loss": -11.043720245361328, "global_step": 201994, "epoch": 1202} {"train_loss": -11.208828926086426, "global_step": 201995, "epoch": 1202} {"train_loss": -10.81740665435791, "global_step": 201996, "epoch": 1202} {"train_loss": -10.827966690063477, "global_step": 201997, "epoch": 1202} {"train_loss": -10.763121604919434, "global_step": 201998, "epoch": 1202} {"train_loss": -11.104182243347168, "global_step": 201999, "epoch": 1202} {"train_loss": -10.996354103088379, "global_step": 202000, "epoch": 1202} {"train_loss": -11.06238079071045, "global_step": 202001, "epoch": 1202} {"train_loss": -11.08603286743164, "global_step": 202002, "epoch": 1202} {"train_loss": -10.982942581176758, "global_step": 202003, "epoch": 1202} {"train_loss": -11.237160682678223, "global_step": 202004, "epoch": 1202} {"train_loss": -11.170894622802734, "global_step": 202005, "epoch": 1202} {"train_loss": -11.182656288146973, "global_step": 202006, "epoch": 1202} {"train_loss": -11.423410415649414, "global_step": 202007, "epoch": 1202} {"train_loss": -11.138259887695312, "global_step": 202008, "epoch": 1202} {"train_loss": -11.445037841796875, "global_step": 202009, "epoch": 1202} {"train_loss": -10.843286514282227, "global_step": 202010, "epoch": 1202} {"train_loss": -11.044021606445312, "global_step": 202011, "epoch": 1202} {"train_loss": -11.243396759033203, "global_step": 202012, "epoch": 1202} {"train_loss": -11.348158836364746, "global_step": 202013, "epoch": 1202} {"train_loss": -11.212628364562988, "global_step": 202014, "epoch": 1202} {"train_loss": -11.14863395690918, "global_step": 202015, "epoch": 1202} {"train_loss": -11.35713005065918, "global_step": 202016, "epoch": 1202} {"train_loss": -11.380510330200195, "global_step": 202017, "epoch": 1202} {"train_loss": -11.220459938049316, "global_step": 202018, "epoch": 1202} {"train_loss": -11.31434154510498, "global_step": 202019, "epoch": 1202} {"train_loss": -11.370779037475586, "global_step": 202020, "epoch": 1202} {"train_loss": -11.32299518585205, "global_step": 202021, "epoch": 1202} {"train_loss": -11.239038467407227, "global_step": 202022, "epoch": 1202} {"train_loss": -11.507341384887695, "global_step": 202023, "epoch": 1202} {"train_loss": -11.249849319458008, "global_step": 202024, "epoch": 1202} {"train_loss": -11.504144668579102, "global_step": 202025, "epoch": 1202} {"train_loss": -11.628192901611328, "global_step": 202026, "epoch": 1202} {"train_loss": -11.053187370300293, "global_step": 202027, "epoch": 1202} {"train_loss": -11.400434494018555, "global_step": 202028, "epoch": 1202} {"train_loss": -10.934268951416016, "global_step": 202029, "epoch": 1202} {"train_loss": -11.696250915527344, "global_step": 202030, "epoch": 1202} {"train_loss": -11.380613327026367, "global_step": 202031, "epoch": 1202} {"train_loss": -11.246545791625977, "global_step": 202032, "epoch": 1202} {"train_loss": -11.503475189208984, "global_step": 202033, "epoch": 1202} {"train_loss": -11.132711410522461, "global_step": 202034, "epoch": 1202} {"train_loss": -11.29140853881836, "global_step": 202035, "epoch": 1202} {"train_loss": -11.336699485778809, "global_step": 202036, "epoch": 1202} {"train_loss": -11.176976203918457, "global_step": 202037, "epoch": 1202} {"train_loss": -11.284601211547852, "global_step": 202038, "epoch": 1202} {"train_loss": -11.291557312011719, "global_step": 202039, "epoch": 1202} {"train_loss": -10.830667495727539, "global_step": 202040, "epoch": 1202} {"train_loss": -11.182976722717285, "global_step": 202041, "epoch": 1202} {"train_loss": -10.852287292480469, "global_step": 202042, "epoch": 1202} {"train_loss": -10.941402435302734, "global_step": 202043, "epoch": 1202} {"train_loss": -10.817502975463867, "global_step": 202044, "epoch": 1202} {"train_loss": -11.362634658813477, "global_step": 202045, "epoch": 1202} {"train_loss": -11.198516845703125, "global_step": 202046, "epoch": 1202} {"train_loss": -11.309901237487793, "global_step": 202047, "epoch": 1202} {"train_loss": -11.426712989807129, "global_step": 202048, "epoch": 1202} {"train_loss": -10.897867202758789, "global_step": 202049, "epoch": 1202} {"train_loss": -11.55266284942627, "global_step": 202050, "epoch": 1202} {"train_loss": -10.653199195861816, "global_step": 202051, "epoch": 1202} {"train_loss": -11.378192901611328, "global_step": 202052, "epoch": 1202} {"train_loss": -11.05575180053711, "global_step": 202053, "epoch": 1202} {"train_loss": -11.451892852783203, "global_step": 202054, "epoch": 1202} {"train_loss": -11.400444030761719, "global_step": 202055, "epoch": 1202} {"train_loss": -11.035661697387695, "global_step": 202056, "epoch": 1202} {"train_loss": -11.597723007202148, "global_step": 202057, "epoch": 1202} {"train_loss": -11.157957077026367, "global_step": 202058, "epoch": 1202} {"train_loss": -11.414871215820312, "global_step": 202059, "epoch": 1202} {"train_loss": -11.25189208984375, "global_step": 202060, "epoch": 1202} {"train_loss": -11.132293701171875, "global_step": 202061, "epoch": 1202} {"train_loss": -11.28146743774414, "global_step": 202062, "epoch": 1202} {"train_loss": -11.00667667388916, "global_step": 202063, "epoch": 1202} {"train_loss": -11.337194442749023, "global_step": 202064, "epoch": 1202} {"train_loss": -11.336112976074219, "global_step": 202065, "epoch": 1202} {"train_loss": -11.42003059387207, "global_step": 202066, "epoch": 1202} {"train_loss": -11.51858139038086, "global_step": 202067, "epoch": 1202} {"train_loss": -10.747035026550293, "global_step": 202068, "epoch": 1202} {"train_loss": -11.130043029785156, "global_step": 202069, "epoch": 1202} {"train_loss": -10.72010326385498, "global_step": 202070, "epoch": 1202} {"train_loss": -10.526403427124023, "global_step": 202071, "epoch": 1202} {"train_loss": -10.858217239379883, "global_step": 202072, "epoch": 1202} {"train_loss": -10.774657249450684, "global_step": 202073, "epoch": 1202} {"train_loss": -11.378706932067871, "global_step": 202074, "epoch": 1202} {"train_loss": -11.205192565917969, "global_step": 202075, "epoch": 1202} {"train_loss": -11.611072540283203, "global_step": 202076, "epoch": 1202} {"train_loss": -11.495609283447266, "global_step": 202077, "epoch": 1202} {"train_loss": -11.514965057373047, "global_step": 202078, "epoch": 1202} {"train_loss": -11.308390617370605, "global_step": 202079, "epoch": 1202} {"train_loss": -11.087218284606934, "global_step": 202080, "epoch": 1202} {"train_loss": -11.308096885681152, "global_step": 202081, "epoch": 1202} {"train_loss": -11.342769622802734, "global_step": 202082, "epoch": 1202} {"train_loss": -11.242940902709961, "global_step": 202083, "epoch": 1202} {"train_loss": -11.13702392578125, "global_step": 202084, "epoch": 1202} {"train_loss": -10.95267391204834, "global_step": 202085, "epoch": 1202} {"train_loss": -11.182076454162598, "global_step": 202086, "epoch": 1202} {"train_loss": -11.151078224182129, "global_step": 202087, "epoch": 1202} {"train_loss": -10.828872680664062, "global_step": 202088, "epoch": 1202} {"train_loss": -11.105633735656738, "global_step": 202089, "epoch": 1202} {"train_loss": -10.909589767456055, "global_step": 202090, "epoch": 1202} {"train_loss": -11.401853561401367, "global_step": 202091, "epoch": 1202} {"train_loss": -11.294519424438477, "global_step": 202092, "epoch": 1202} {"train_loss": -11.152294158935547, "global_step": 202093, "epoch": 1202} {"train_loss": -11.263294219970703, "global_step": 202094, "epoch": 1202} {"train_loss": -11.105058670043945, "global_step": 202095, "epoch": 1202} {"train_loss": -11.385403633117676, "global_step": 202096, "epoch": 1202} {"train_loss": -11.423080444335938, "global_step": 202097, "epoch": 1202} {"train_loss": -11.291062355041504, "global_step": 202098, "epoch": 1202} {"train_loss": -11.33716106414795, "global_step": 202099, "epoch": 1202} {"train_loss": -11.188583374023438, "global_step": 202100, "epoch": 1202} {"train_loss": -11.555702209472656, "global_step": 202101, "epoch": 1202} {"train_loss": -10.968852996826172, "global_step": 202102, "epoch": 1202} {"train_loss": -11.217404910496303, "global_step": 202103, "epoch": 1202, "val_loss": 247796.859375} {"train_loss": -11.491912841796875, "global_step": 202104, "epoch": 1203} {"train_loss": -11.324419021606445, "global_step": 202105, "epoch": 1203} {"train_loss": -11.333864212036133, "global_step": 202106, "epoch": 1203} {"train_loss": -11.361166000366211, "global_step": 202107, "epoch": 1203} {"train_loss": -11.27062702178955, "global_step": 202108, "epoch": 1203} {"train_loss": -11.3850736618042, "global_step": 202109, "epoch": 1203} {"train_loss": -11.618732452392578, "global_step": 202110, "epoch": 1203} {"train_loss": -11.324665069580078, "global_step": 202111, "epoch": 1203} {"train_loss": -11.417478561401367, "global_step": 202112, "epoch": 1203} {"train_loss": -11.333076477050781, "global_step": 202113, "epoch": 1203} {"train_loss": -10.993288040161133, "global_step": 202114, "epoch": 1203} {"train_loss": -10.985368728637695, "global_step": 202115, "epoch": 1203} {"train_loss": -11.195403099060059, "global_step": 202116, "epoch": 1203} {"train_loss": -10.775680541992188, "global_step": 202117, "epoch": 1203} {"train_loss": -11.202516555786133, "global_step": 202118, "epoch": 1203} {"train_loss": -11.435384750366211, "global_step": 202119, "epoch": 1203} {"train_loss": -11.400178909301758, "global_step": 202120, "epoch": 1203} {"train_loss": -11.42855453491211, "global_step": 202121, "epoch": 1203} {"train_loss": -11.323781967163086, "global_step": 202122, "epoch": 1203} {"train_loss": -10.97884464263916, "global_step": 202123, "epoch": 1203} {"train_loss": -11.64991283416748, "global_step": 202124, "epoch": 1203} {"train_loss": -10.973886489868164, "global_step": 202125, "epoch": 1203} {"train_loss": -11.314937591552734, "global_step": 202126, "epoch": 1203} {"train_loss": -11.483776092529297, "global_step": 202127, "epoch": 1203} {"train_loss": -11.635025024414062, "global_step": 202128, "epoch": 1203} {"train_loss": -11.307621955871582, "global_step": 202129, "epoch": 1203} {"train_loss": -11.052213668823242, "global_step": 202130, "epoch": 1203} {"train_loss": -11.58708381652832, "global_step": 202131, "epoch": 1203} {"train_loss": -11.284241676330566, "global_step": 202132, "epoch": 1203} {"train_loss": -11.608407974243164, "global_step": 202133, "epoch": 1203} {"train_loss": -11.578412055969238, "global_step": 202134, "epoch": 1203} {"train_loss": -11.279485702514648, "global_step": 202135, "epoch": 1203} {"train_loss": -11.37154769897461, "global_step": 202136, "epoch": 1203} {"train_loss": -11.352727890014648, "global_step": 202137, "epoch": 1203} {"train_loss": -11.628829956054688, "global_step": 202138, "epoch": 1203} {"train_loss": -11.54753589630127, "global_step": 202139, "epoch": 1203} {"train_loss": -11.418720245361328, "global_step": 202140, "epoch": 1203} {"train_loss": -11.545526504516602, "global_step": 202141, "epoch": 1203} {"train_loss": -11.510767936706543, "global_step": 202142, "epoch": 1203} {"train_loss": -11.640935897827148, "global_step": 202143, "epoch": 1203} {"train_loss": -11.745262145996094, "global_step": 202144, "epoch": 1203} {"train_loss": -11.343936920166016, "global_step": 202145, "epoch": 1203} {"train_loss": -11.580976486206055, "global_step": 202146, "epoch": 1203} {"train_loss": -11.515556335449219, "global_step": 202147, "epoch": 1203} {"train_loss": -11.588017463684082, "global_step": 202148, "epoch": 1203} {"train_loss": -11.689532279968262, "global_step": 202149, "epoch": 1203} {"train_loss": -11.35576057434082, "global_step": 202150, "epoch": 1203} {"train_loss": -11.575311660766602, "global_step": 202151, "epoch": 1203} {"train_loss": -11.458196640014648, "global_step": 202152, "epoch": 1203} {"train_loss": -11.58707332611084, "global_step": 202153, "epoch": 1203} {"train_loss": -11.425804138183594, "global_step": 202154, "epoch": 1203} {"train_loss": -11.487655639648438, "global_step": 202155, "epoch": 1203} {"train_loss": -11.454729080200195, "global_step": 202156, "epoch": 1203} {"train_loss": -11.154151916503906, "global_step": 202157, "epoch": 1203} {"train_loss": -11.133951187133789, "global_step": 202158, "epoch": 1203} {"train_loss": -10.80461311340332, "global_step": 202159, "epoch": 1203} {"train_loss": -11.146470069885254, "global_step": 202160, "epoch": 1203} {"train_loss": -11.480695724487305, "global_step": 202161, "epoch": 1203} {"train_loss": -11.155204772949219, "global_step": 202162, "epoch": 1203} {"train_loss": -11.8423490524292, "global_step": 202163, "epoch": 1203} {"train_loss": -10.56498908996582, "global_step": 202164, "epoch": 1203} {"train_loss": -11.157001495361328, "global_step": 202165, "epoch": 1203} {"train_loss": -11.3302001953125, "global_step": 202166, "epoch": 1203} {"train_loss": -11.33360481262207, "global_step": 202167, "epoch": 1203} {"train_loss": -11.385086059570312, "global_step": 202168, "epoch": 1203} {"train_loss": -11.322456359863281, "global_step": 202169, "epoch": 1203} {"train_loss": -11.217370986938477, "global_step": 202170, "epoch": 1203} {"train_loss": -11.269797325134277, "global_step": 202171, "epoch": 1203} {"train_loss": -11.106164932250977, "global_step": 202172, "epoch": 1203} {"train_loss": -11.06683349609375, "global_step": 202173, "epoch": 1203} {"train_loss": -11.494071006774902, "global_step": 202174, "epoch": 1203} {"train_loss": -11.229181289672852, "global_step": 202175, "epoch": 1203} {"train_loss": -11.506509780883789, "global_step": 202176, "epoch": 1203} {"train_loss": -11.28272533416748, "global_step": 202177, "epoch": 1203} {"train_loss": -11.475717544555664, "global_step": 202178, "epoch": 1203} {"train_loss": -11.281780242919922, "global_step": 202179, "epoch": 1203} {"train_loss": -11.272401809692383, "global_step": 202180, "epoch": 1203} {"train_loss": -11.339851379394531, "global_step": 202181, "epoch": 1203} {"train_loss": -10.942090034484863, "global_step": 202182, "epoch": 1203} {"train_loss": -11.015955924987793, "global_step": 202183, "epoch": 1203} {"train_loss": -11.139364242553711, "global_step": 202184, "epoch": 1203} {"train_loss": -11.127235412597656, "global_step": 202185, "epoch": 1203} {"train_loss": -11.486993789672852, "global_step": 202186, "epoch": 1203} {"train_loss": -11.057374954223633, "global_step": 202187, "epoch": 1203} {"train_loss": -11.12612247467041, "global_step": 202188, "epoch": 1203} {"train_loss": -10.966798782348633, "global_step": 202189, "epoch": 1203} {"train_loss": -11.528564453125, "global_step": 202190, "epoch": 1203} {"train_loss": -10.736001968383789, "global_step": 202191, "epoch": 1203} {"train_loss": -11.059000015258789, "global_step": 202192, "epoch": 1203} {"train_loss": -10.78072738647461, "global_step": 202193, "epoch": 1203} {"train_loss": -11.480377197265625, "global_step": 202194, "epoch": 1203} {"train_loss": -11.26205825805664, "global_step": 202195, "epoch": 1203} {"train_loss": -11.221502304077148, "global_step": 202196, "epoch": 1203} {"train_loss": -11.094808578491211, "global_step": 202197, "epoch": 1203} {"train_loss": -10.868480682373047, "global_step": 202198, "epoch": 1203} {"train_loss": -11.024864196777344, "global_step": 202199, "epoch": 1203} {"train_loss": -11.428235054016113, "global_step": 202200, "epoch": 1203} {"train_loss": -11.05284309387207, "global_step": 202201, "epoch": 1203} {"train_loss": -11.184893608093262, "global_step": 202202, "epoch": 1203} {"train_loss": -11.075836181640625, "global_step": 202203, "epoch": 1203} {"train_loss": -11.332048416137695, "global_step": 202204, "epoch": 1203} {"train_loss": -11.351378440856934, "global_step": 202205, "epoch": 1203} {"train_loss": -11.228923797607422, "global_step": 202206, "epoch": 1203} {"train_loss": -11.004179000854492, "global_step": 202207, "epoch": 1203} {"train_loss": -11.009727478027344, "global_step": 202208, "epoch": 1203} {"train_loss": -11.128564834594727, "global_step": 202209, "epoch": 1203} {"train_loss": -11.125370979309082, "global_step": 202210, "epoch": 1203} {"train_loss": -10.77811050415039, "global_step": 202211, "epoch": 1203} {"train_loss": -11.187193870544434, "global_step": 202212, "epoch": 1203} {"train_loss": -11.096725463867188, "global_step": 202213, "epoch": 1203} {"train_loss": -10.249695777893066, "global_step": 202214, "epoch": 1203} {"train_loss": -11.404573440551758, "global_step": 202215, "epoch": 1203} {"train_loss": -10.492782592773438, "global_step": 202216, "epoch": 1203} {"train_loss": -11.444324493408203, "global_step": 202217, "epoch": 1203} {"train_loss": -10.955331802368164, "global_step": 202218, "epoch": 1203} {"train_loss": -11.360821723937988, "global_step": 202219, "epoch": 1203} {"train_loss": -11.217096328735352, "global_step": 202220, "epoch": 1203} {"train_loss": -11.339340209960938, "global_step": 202221, "epoch": 1203} {"train_loss": -11.413631439208984, "global_step": 202222, "epoch": 1203} {"train_loss": -11.358907699584961, "global_step": 202223, "epoch": 1203} {"train_loss": -11.231786727905273, "global_step": 202224, "epoch": 1203} {"train_loss": -11.303770065307617, "global_step": 202225, "epoch": 1203} {"train_loss": -11.369405746459961, "global_step": 202226, "epoch": 1203} {"train_loss": -11.317068099975586, "global_step": 202227, "epoch": 1203} {"train_loss": -11.06067943572998, "global_step": 202228, "epoch": 1203} {"train_loss": -11.227067947387695, "global_step": 202229, "epoch": 1203} {"train_loss": -11.322053909301758, "global_step": 202230, "epoch": 1203} {"train_loss": -11.117178916931152, "global_step": 202231, "epoch": 1203} {"train_loss": -11.216087341308594, "global_step": 202232, "epoch": 1203} {"train_loss": -11.183673858642578, "global_step": 202233, "epoch": 1203} {"train_loss": -11.468850135803223, "global_step": 202234, "epoch": 1203} {"train_loss": -11.210843086242676, "global_step": 202235, "epoch": 1203} {"train_loss": -11.45790958404541, "global_step": 202236, "epoch": 1203} {"train_loss": -11.353927612304688, "global_step": 202237, "epoch": 1203} {"train_loss": -11.306140899658203, "global_step": 202238, "epoch": 1203} {"train_loss": -11.21201229095459, "global_step": 202239, "epoch": 1203} {"train_loss": -11.393472671508789, "global_step": 202240, "epoch": 1203} {"train_loss": -11.068554878234863, "global_step": 202241, "epoch": 1203} {"train_loss": -11.408227920532227, "global_step": 202242, "epoch": 1203} {"train_loss": -11.34335708618164, "global_step": 202243, "epoch": 1203} {"train_loss": -11.333491325378418, "global_step": 202244, "epoch": 1203} {"train_loss": -11.123891830444336, "global_step": 202245, "epoch": 1203} {"train_loss": -11.427618026733398, "global_step": 202246, "epoch": 1203} {"train_loss": -11.084635734558105, "global_step": 202247, "epoch": 1203} {"train_loss": -11.21242904663086, "global_step": 202248, "epoch": 1203} {"train_loss": -11.102283477783203, "global_step": 202249, "epoch": 1203} {"train_loss": -11.681434631347656, "global_step": 202250, "epoch": 1203} {"train_loss": -11.083252906799316, "global_step": 202251, "epoch": 1203} {"train_loss": -11.396578788757324, "global_step": 202252, "epoch": 1203} {"train_loss": -11.309906005859375, "global_step": 202253, "epoch": 1203} {"train_loss": -10.910293579101562, "global_step": 202254, "epoch": 1203} {"train_loss": -11.333717346191406, "global_step": 202255, "epoch": 1203} {"train_loss": -11.37348747253418, "global_step": 202256, "epoch": 1203} {"train_loss": -11.26077651977539, "global_step": 202257, "epoch": 1203} {"train_loss": -11.21574592590332, "global_step": 202258, "epoch": 1203} {"train_loss": -10.828449249267578, "global_step": 202259, "epoch": 1203} {"train_loss": -10.963912010192871, "global_step": 202260, "epoch": 1203} {"train_loss": -11.652942657470703, "global_step": 202261, "epoch": 1203} {"train_loss": -11.006495475769043, "global_step": 202262, "epoch": 1203} {"train_loss": -11.366257667541504, "global_step": 202263, "epoch": 1203} {"train_loss": -11.465314865112305, "global_step": 202264, "epoch": 1203} {"train_loss": -11.267237663269043, "global_step": 202265, "epoch": 1203} {"train_loss": -11.267963409423828, "global_step": 202266, "epoch": 1203} {"train_loss": -11.346631050109863, "global_step": 202267, "epoch": 1203} {"train_loss": -11.334667205810547, "global_step": 202268, "epoch": 1203} {"train_loss": -11.187111854553223, "global_step": 202269, "epoch": 1203} {"train_loss": -11.373807907104492, "global_step": 202270, "epoch": 1203} {"train_loss": -11.272915930975051, "global_step": 202271, "epoch": 1203, "val_loss": 246854.640625} {"train_loss": -11.492697715759277, "global_step": 202272, "epoch": 1204} {"train_loss": -11.534223556518555, "global_step": 202273, "epoch": 1204} {"train_loss": -11.217247009277344, "global_step": 202274, "epoch": 1204} {"train_loss": -11.461869239807129, "global_step": 202275, "epoch": 1204} {"train_loss": -11.278671264648438, "global_step": 202276, "epoch": 1204} {"train_loss": -11.215070724487305, "global_step": 202277, "epoch": 1204} {"train_loss": -10.66561508178711, "global_step": 202278, "epoch": 1204} {"train_loss": -11.458032608032227, "global_step": 202279, "epoch": 1204} {"train_loss": -10.790048599243164, "global_step": 202280, "epoch": 1204} {"train_loss": -10.873798370361328, "global_step": 202281, "epoch": 1204} {"train_loss": -11.098018646240234, "global_step": 202282, "epoch": 1204} {"train_loss": -11.277753829956055, "global_step": 202283, "epoch": 1204} {"train_loss": -10.953510284423828, "global_step": 202284, "epoch": 1204} {"train_loss": -11.343610763549805, "global_step": 202285, "epoch": 1204} {"train_loss": -11.037519454956055, "global_step": 202286, "epoch": 1204} {"train_loss": -11.104276657104492, "global_step": 202287, "epoch": 1204} {"train_loss": -11.325851440429688, "global_step": 202288, "epoch": 1204} {"train_loss": -10.812573432922363, "global_step": 202289, "epoch": 1204} {"train_loss": -11.312200546264648, "global_step": 202290, "epoch": 1204} {"train_loss": -10.88892936706543, "global_step": 202291, "epoch": 1204} {"train_loss": -11.379663467407227, "global_step": 202292, "epoch": 1204} {"train_loss": -10.517419815063477, "global_step": 202293, "epoch": 1204} {"train_loss": -11.101364135742188, "global_step": 202294, "epoch": 1204} {"train_loss": -10.871957778930664, "global_step": 202295, "epoch": 1204} {"train_loss": -10.887386322021484, "global_step": 202296, "epoch": 1204} {"train_loss": -11.209218978881836, "global_step": 202297, "epoch": 1204} {"train_loss": -10.062379837036133, "global_step": 202298, "epoch": 1204} {"train_loss": -9.942682266235352, "global_step": 202299, "epoch": 1204} {"train_loss": -9.892749786376953, "global_step": 202300, "epoch": 1204} {"train_loss": -9.427885055541992, "global_step": 202301, "epoch": 1204} {"train_loss": -9.462935447692871, "global_step": 202302, "epoch": 1204} {"train_loss": -9.276119232177734, "global_step": 202303, "epoch": 1204} {"train_loss": -11.156478881835938, "global_step": 202304, "epoch": 1204} {"train_loss": -9.154919624328613, "global_step": 202305, "epoch": 1204} {"train_loss": -8.13473129272461, "global_step": 202306, "epoch": 1204} {"train_loss": -9.343623161315918, "global_step": 202307, "epoch": 1204} {"train_loss": -9.705913543701172, "global_step": 202308, "epoch": 1204} {"train_loss": -10.721349716186523, "global_step": 202309, "epoch": 1204} {"train_loss": -8.671737670898438, "global_step": 202310, "epoch": 1204} {"train_loss": -8.439339637756348, "global_step": 202311, "epoch": 1204} {"train_loss": -10.94817066192627, "global_step": 202312, "epoch": 1204} {"train_loss": -9.213722229003906, "global_step": 202313, "epoch": 1204} {"train_loss": -9.80734634399414, "global_step": 202314, "epoch": 1204} {"train_loss": -9.061044692993164, "global_step": 202315, "epoch": 1204} {"train_loss": -9.558412551879883, "global_step": 202316, "epoch": 1204} {"train_loss": -9.791300773620605, "global_step": 202317, "epoch": 1204} {"train_loss": -9.173137664794922, "global_step": 202318, "epoch": 1204} {"train_loss": -10.483726501464844, "global_step": 202319, "epoch": 1204} {"train_loss": -9.364038467407227, "global_step": 202320, "epoch": 1204} {"train_loss": -9.233837127685547, "global_step": 202321, "epoch": 1204} {"train_loss": -10.581201553344727, "global_step": 202322, "epoch": 1204} {"train_loss": -9.62291431427002, "global_step": 202323, "epoch": 1204} {"train_loss": -10.335847854614258, "global_step": 202324, "epoch": 1204} {"train_loss": -10.385395050048828, "global_step": 202325, "epoch": 1204} {"train_loss": -10.142766952514648, "global_step": 202326, "epoch": 1204} {"train_loss": -10.320902824401855, "global_step": 202327, "epoch": 1204} {"train_loss": -10.490927696228027, "global_step": 202328, "epoch": 1204} {"train_loss": -10.602482795715332, "global_step": 202329, "epoch": 1204} {"train_loss": -10.77955436706543, "global_step": 202330, "epoch": 1204} {"train_loss": -10.863277435302734, "global_step": 202331, "epoch": 1204} {"train_loss": -10.401399612426758, "global_step": 202332, "epoch": 1204} {"train_loss": -10.982412338256836, "global_step": 202333, "epoch": 1204} {"train_loss": -11.200246810913086, "global_step": 202334, "epoch": 1204} {"train_loss": -10.846601486206055, "global_step": 202335, "epoch": 1204} {"train_loss": -10.80252456665039, "global_step": 202336, "epoch": 1204} {"train_loss": -10.977096557617188, "global_step": 202337, "epoch": 1204} {"train_loss": -11.166830062866211, "global_step": 202338, "epoch": 1204} {"train_loss": -11.044181823730469, "global_step": 202339, "epoch": 1204} {"train_loss": -11.119294166564941, "global_step": 202340, "epoch": 1204} {"train_loss": -10.975685119628906, "global_step": 202341, "epoch": 1204} {"train_loss": -11.133621215820312, "global_step": 202342, "epoch": 1204} {"train_loss": -11.071256637573242, "global_step": 202343, "epoch": 1204} {"train_loss": -11.265724182128906, "global_step": 202344, "epoch": 1204} {"train_loss": -11.068914413452148, "global_step": 202345, "epoch": 1204} {"train_loss": -11.180830001831055, "global_step": 202346, "epoch": 1204} {"train_loss": -11.010343551635742, "global_step": 202347, "epoch": 1204} {"train_loss": -11.218012809753418, "global_step": 202348, "epoch": 1204} {"train_loss": -11.340017318725586, "global_step": 202349, "epoch": 1204} {"train_loss": -11.199729919433594, "global_step": 202350, "epoch": 1204} {"train_loss": -11.112457275390625, "global_step": 202351, "epoch": 1204} {"train_loss": -11.20036506652832, "global_step": 202352, "epoch": 1204} {"train_loss": -11.297612190246582, "global_step": 202353, "epoch": 1204} {"train_loss": -11.249002456665039, "global_step": 202354, "epoch": 1204} {"train_loss": -11.132478713989258, "global_step": 202355, "epoch": 1204} {"train_loss": -11.218132019042969, "global_step": 202356, "epoch": 1204} {"train_loss": -11.264730453491211, "global_step": 202357, "epoch": 1204} {"train_loss": -11.431768417358398, "global_step": 202358, "epoch": 1204} {"train_loss": -11.274831771850586, "global_step": 202359, "epoch": 1204} {"train_loss": -11.372573852539062, "global_step": 202360, "epoch": 1204} {"train_loss": -11.572749137878418, "global_step": 202361, "epoch": 1204} {"train_loss": -11.370434761047363, "global_step": 202362, "epoch": 1204} {"train_loss": -11.498592376708984, "global_step": 202363, "epoch": 1204} {"train_loss": -11.585760116577148, "global_step": 202364, "epoch": 1204} {"train_loss": -11.353961944580078, "global_step": 202365, "epoch": 1204} {"train_loss": -11.549558639526367, "global_step": 202366, "epoch": 1204} {"train_loss": -11.550954818725586, "global_step": 202367, "epoch": 1204} {"train_loss": -11.456714630126953, "global_step": 202368, "epoch": 1204} {"train_loss": -11.428226470947266, "global_step": 202369, "epoch": 1204} {"train_loss": -11.58782958984375, "global_step": 202370, "epoch": 1204} {"train_loss": -11.6497802734375, "global_step": 202371, "epoch": 1204} {"train_loss": -11.6524076461792, "global_step": 202372, "epoch": 1204} {"train_loss": -11.737752914428711, "global_step": 202373, "epoch": 1204} {"train_loss": -11.61385726928711, "global_step": 202374, "epoch": 1204} {"train_loss": -11.528068542480469, "global_step": 202375, "epoch": 1204} {"train_loss": -11.343652725219727, "global_step": 202376, "epoch": 1204} {"train_loss": -11.637042045593262, "global_step": 202377, "epoch": 1204} {"train_loss": -11.705911636352539, "global_step": 202378, "epoch": 1204} {"train_loss": -11.626646041870117, "global_step": 202379, "epoch": 1204} {"train_loss": -11.658864974975586, "global_step": 202380, "epoch": 1204} {"train_loss": -11.59602165222168, "global_step": 202381, "epoch": 1204} {"train_loss": -11.492475509643555, "global_step": 202382, "epoch": 1204} {"train_loss": -11.673848152160645, "global_step": 202383, "epoch": 1204} {"train_loss": -11.702736854553223, "global_step": 202384, "epoch": 1204} {"train_loss": -11.652888298034668, "global_step": 202385, "epoch": 1204} {"train_loss": -11.800065040588379, "global_step": 202386, "epoch": 1204} {"train_loss": -11.68294906616211, "global_step": 202387, "epoch": 1204} {"train_loss": -11.747509002685547, "global_step": 202388, "epoch": 1204} {"train_loss": -11.789194107055664, "global_step": 202389, "epoch": 1204} {"train_loss": -11.797586441040039, "global_step": 202390, "epoch": 1204} {"train_loss": -11.677532196044922, "global_step": 202391, "epoch": 1204} {"train_loss": -11.980027198791504, "global_step": 202392, "epoch": 1204} {"train_loss": -11.726880073547363, "global_step": 202393, "epoch": 1204} {"train_loss": -11.816200256347656, "global_step": 202394, "epoch": 1204} {"train_loss": -11.680961608886719, "global_step": 202395, "epoch": 1204} {"train_loss": -11.847291946411133, "global_step": 202396, "epoch": 1204} {"train_loss": -11.81351089477539, "global_step": 202397, "epoch": 1204} {"train_loss": -11.691068649291992, "global_step": 202398, "epoch": 1204} {"train_loss": -11.493738174438477, "global_step": 202399, "epoch": 1204} {"train_loss": -11.62641716003418, "global_step": 202400, "epoch": 1204} {"train_loss": -11.852742195129395, "global_step": 202401, "epoch": 1204} {"train_loss": -11.69314956665039, "global_step": 202402, "epoch": 1204} {"train_loss": -11.735297203063965, "global_step": 202403, "epoch": 1204} {"train_loss": -11.385201454162598, "global_step": 202404, "epoch": 1204} {"train_loss": -11.549542427062988, "global_step": 202405, "epoch": 1204} {"train_loss": -11.667937278747559, "global_step": 202406, "epoch": 1204} {"train_loss": -11.85791301727295, "global_step": 202407, "epoch": 1204} {"train_loss": -11.490839958190918, "global_step": 202408, "epoch": 1204} {"train_loss": -11.401397705078125, "global_step": 202409, "epoch": 1204} {"train_loss": -11.034379005432129, "global_step": 202410, "epoch": 1204} {"train_loss": -10.117587089538574, "global_step": 202411, "epoch": 1204} {"train_loss": -11.186301231384277, "global_step": 202412, "epoch": 1204} {"train_loss": -11.447118759155273, "global_step": 202413, "epoch": 1204} {"train_loss": -11.323026657104492, "global_step": 202414, "epoch": 1204} {"train_loss": -10.103017807006836, "global_step": 202415, "epoch": 1204} {"train_loss": -10.403825759887695, "global_step": 202416, "epoch": 1204} {"train_loss": -11.362834930419922, "global_step": 202417, "epoch": 1204} {"train_loss": -10.421445846557617, "global_step": 202418, "epoch": 1204} {"train_loss": -9.851842880249023, "global_step": 202419, "epoch": 1204} {"train_loss": -11.280216217041016, "global_step": 202420, "epoch": 1204} {"train_loss": -11.217187881469727, "global_step": 202421, "epoch": 1204} {"train_loss": -10.619861602783203, "global_step": 202422, "epoch": 1204} {"train_loss": -11.2992525100708, "global_step": 202423, "epoch": 1204} {"train_loss": -9.950824737548828, "global_step": 202424, "epoch": 1204} {"train_loss": -10.207237243652344, "global_step": 202425, "epoch": 1204} {"train_loss": -11.069416999816895, "global_step": 202426, "epoch": 1204} {"train_loss": -8.846004486083984, "global_step": 202427, "epoch": 1204} {"train_loss": -10.613321304321289, "global_step": 202428, "epoch": 1204} {"train_loss": -10.239253044128418, "global_step": 202429, "epoch": 1204} {"train_loss": -9.894390106201172, "global_step": 202430, "epoch": 1204} {"train_loss": -10.894290924072266, "global_step": 202431, "epoch": 1204} {"train_loss": -10.191272735595703, "global_step": 202432, "epoch": 1204} {"train_loss": -10.98376178741455, "global_step": 202433, "epoch": 1204} {"train_loss": -9.799288749694824, "global_step": 202434, "epoch": 1204} {"train_loss": -10.851705551147461, "global_step": 202435, "epoch": 1204} {"train_loss": -10.415094375610352, "global_step": 202436, "epoch": 1204} {"train_loss": -11.048526763916016, "global_step": 202437, "epoch": 1204} {"train_loss": -10.774100303649902, "global_step": 202438, "epoch": 1204} {"train_loss": -10.918437747728257, "global_step": 202439, "epoch": 1204, "val_loss": 244150.25} {"train_loss": -11.224912643432617, "global_step": 202440, "epoch": 1205} {"train_loss": -10.933501243591309, "global_step": 202441, "epoch": 1205} {"train_loss": -11.22851276397705, "global_step": 202442, "epoch": 1205} {"train_loss": -11.109063148498535, "global_step": 202443, "epoch": 1205} {"train_loss": -11.157182693481445, "global_step": 202444, "epoch": 1205} {"train_loss": -11.290959358215332, "global_step": 202445, "epoch": 1205} {"train_loss": -11.255544662475586, "global_step": 202446, "epoch": 1205} {"train_loss": -11.065898895263672, "global_step": 202447, "epoch": 1205} {"train_loss": -10.887945175170898, "global_step": 202448, "epoch": 1205} {"train_loss": -11.115034103393555, "global_step": 202449, "epoch": 1205} {"train_loss": -11.323284149169922, "global_step": 202450, "epoch": 1205} {"train_loss": -11.397339820861816, "global_step": 202451, "epoch": 1205} {"train_loss": -11.192943572998047, "global_step": 202452, "epoch": 1205} {"train_loss": -11.082500457763672, "global_step": 202453, "epoch": 1205} {"train_loss": -11.078214645385742, "global_step": 202454, "epoch": 1205} {"train_loss": -11.137067794799805, "global_step": 202455, "epoch": 1205} {"train_loss": -11.3145170211792, "global_step": 202456, "epoch": 1205} {"train_loss": -11.473941802978516, "global_step": 202457, "epoch": 1205} {"train_loss": -10.926149368286133, "global_step": 202458, "epoch": 1205} {"train_loss": -11.469200134277344, "global_step": 202459, "epoch": 1205} {"train_loss": -11.16834831237793, "global_step": 202460, "epoch": 1205} {"train_loss": -11.529311180114746, "global_step": 202461, "epoch": 1205} {"train_loss": -11.28693962097168, "global_step": 202462, "epoch": 1205} {"train_loss": -11.161273956298828, "global_step": 202463, "epoch": 1205} {"train_loss": -11.372894287109375, "global_step": 202464, "epoch": 1205} {"train_loss": -11.424509048461914, "global_step": 202465, "epoch": 1205} {"train_loss": -11.40831184387207, "global_step": 202466, "epoch": 1205} {"train_loss": -11.243124008178711, "global_step": 202467, "epoch": 1205} {"train_loss": -11.200729370117188, "global_step": 202468, "epoch": 1205} {"train_loss": -11.463525772094727, "global_step": 202469, "epoch": 1205} {"train_loss": -11.48980712890625, "global_step": 202470, "epoch": 1205} {"train_loss": -11.435583114624023, "global_step": 202471, "epoch": 1205} {"train_loss": -11.558012008666992, "global_step": 202472, "epoch": 1205} {"train_loss": -11.585161209106445, "global_step": 202473, "epoch": 1205} {"train_loss": -11.383443832397461, "global_step": 202474, "epoch": 1205} {"train_loss": -11.448690414428711, "global_step": 202475, "epoch": 1205} {"train_loss": -11.403470993041992, "global_step": 202476, "epoch": 1205} {"train_loss": -11.53980827331543, "global_step": 202477, "epoch": 1205} {"train_loss": -11.418832778930664, "global_step": 202478, "epoch": 1205} {"train_loss": -11.561190605163574, "global_step": 202479, "epoch": 1205} {"train_loss": -11.509282112121582, "global_step": 202480, "epoch": 1205} {"train_loss": -11.57763957977295, "global_step": 202481, "epoch": 1205} {"train_loss": -11.272198677062988, "global_step": 202482, "epoch": 1205} {"train_loss": -11.425186157226562, "global_step": 202483, "epoch": 1205} {"train_loss": -11.570098876953125, "global_step": 202484, "epoch": 1205} {"train_loss": -11.477192878723145, "global_step": 202485, "epoch": 1205} {"train_loss": -11.63524055480957, "global_step": 202486, "epoch": 1205} {"train_loss": -11.689352989196777, "global_step": 202487, "epoch": 1205} {"train_loss": -11.718300819396973, "global_step": 202488, "epoch": 1205} {"train_loss": -11.672067642211914, "global_step": 202489, "epoch": 1205} {"train_loss": -11.726052284240723, "global_step": 202490, "epoch": 1205} {"train_loss": -11.512578964233398, "global_step": 202491, "epoch": 1205} {"train_loss": -11.74612045288086, "global_step": 202492, "epoch": 1205} {"train_loss": -11.748607635498047, "global_step": 202493, "epoch": 1205} {"train_loss": -11.584528923034668, "global_step": 202494, "epoch": 1205} {"train_loss": -11.435174942016602, "global_step": 202495, "epoch": 1205} {"train_loss": -11.80692195892334, "global_step": 202496, "epoch": 1205} {"train_loss": -11.616172790527344, "global_step": 202497, "epoch": 1205} {"train_loss": -11.588504791259766, "global_step": 202498, "epoch": 1205} {"train_loss": -11.649307250976562, "global_step": 202499, "epoch": 1205} {"train_loss": -11.689845085144043, "global_step": 202500, "epoch": 1205} {"train_loss": -11.534673690795898, "global_step": 202501, "epoch": 1205} {"train_loss": -11.860374450683594, "global_step": 202502, "epoch": 1205} {"train_loss": -11.761093139648438, "global_step": 202503, "epoch": 1205} {"train_loss": -11.48829460144043, "global_step": 202504, "epoch": 1205} {"train_loss": -11.662363052368164, "global_step": 202505, "epoch": 1205} {"train_loss": -11.758211135864258, "global_step": 202506, "epoch": 1205} {"train_loss": -11.748867988586426, "global_step": 202507, "epoch": 1205} {"train_loss": -11.285452842712402, "global_step": 202508, "epoch": 1205} {"train_loss": -11.899393081665039, "global_step": 202509, "epoch": 1205} {"train_loss": -11.331510543823242, "global_step": 202510, "epoch": 1205} {"train_loss": -11.037491798400879, "global_step": 202511, "epoch": 1205} {"train_loss": -11.293304443359375, "global_step": 202512, "epoch": 1205} {"train_loss": -11.127946853637695, "global_step": 202513, "epoch": 1205} {"train_loss": -11.645299911499023, "global_step": 202514, "epoch": 1205} {"train_loss": -10.678593635559082, "global_step": 202515, "epoch": 1205} {"train_loss": -9.88693618774414, "global_step": 202516, "epoch": 1205} {"train_loss": -10.612964630126953, "global_step": 202517, "epoch": 1205} {"train_loss": -11.388463020324707, "global_step": 202518, "epoch": 1205} {"train_loss": -9.638046264648438, "global_step": 202519, "epoch": 1205} {"train_loss": -10.18997573852539, "global_step": 202520, "epoch": 1205} {"train_loss": -10.781824111938477, "global_step": 202521, "epoch": 1205} {"train_loss": -8.906835556030273, "global_step": 202522, "epoch": 1205} {"train_loss": -11.06693172454834, "global_step": 202523, "epoch": 1205} {"train_loss": -10.759130477905273, "global_step": 202524, "epoch": 1205} {"train_loss": -11.24730110168457, "global_step": 202525, "epoch": 1205} {"train_loss": -10.725934982299805, "global_step": 202526, "epoch": 1205} {"train_loss": -11.466009140014648, "global_step": 202527, "epoch": 1205} {"train_loss": -10.964104652404785, "global_step": 202528, "epoch": 1205} {"train_loss": -11.134817123413086, "global_step": 202529, "epoch": 1205} {"train_loss": -11.073963165283203, "global_step": 202530, "epoch": 1205} {"train_loss": -10.604696273803711, "global_step": 202531, "epoch": 1205} {"train_loss": -11.138724327087402, "global_step": 202532, "epoch": 1205} {"train_loss": -10.879404067993164, "global_step": 202533, "epoch": 1205} {"train_loss": -11.481233596801758, "global_step": 202534, "epoch": 1205} {"train_loss": -11.072423934936523, "global_step": 202535, "epoch": 1205} {"train_loss": -11.002373695373535, "global_step": 202536, "epoch": 1205} {"train_loss": -11.251758575439453, "global_step": 202537, "epoch": 1205} {"train_loss": -10.822473526000977, "global_step": 202538, "epoch": 1205} {"train_loss": -11.290306091308594, "global_step": 202539, "epoch": 1205} {"train_loss": -10.717727661132812, "global_step": 202540, "epoch": 1205} {"train_loss": -11.455991744995117, "global_step": 202541, "epoch": 1205} {"train_loss": -10.168916702270508, "global_step": 202542, "epoch": 1205} {"train_loss": -11.08102035522461, "global_step": 202543, "epoch": 1205} {"train_loss": -10.570093154907227, "global_step": 202544, "epoch": 1205} {"train_loss": -10.789624214172363, "global_step": 202545, "epoch": 1205} {"train_loss": -10.045061111450195, "global_step": 202546, "epoch": 1205} {"train_loss": -10.442142486572266, "global_step": 202547, "epoch": 1205} {"train_loss": -10.357828140258789, "global_step": 202548, "epoch": 1205} {"train_loss": -10.045072555541992, "global_step": 202549, "epoch": 1205} {"train_loss": -10.376516342163086, "global_step": 202550, "epoch": 1205} {"train_loss": -11.183076858520508, "global_step": 202551, "epoch": 1205} {"train_loss": -10.504518508911133, "global_step": 202552, "epoch": 1205} {"train_loss": -10.789849281311035, "global_step": 202553, "epoch": 1205} {"train_loss": -10.991479873657227, "global_step": 202554, "epoch": 1205} {"train_loss": -10.84898567199707, "global_step": 202555, "epoch": 1205} {"train_loss": -11.321176528930664, "global_step": 202556, "epoch": 1205} {"train_loss": -10.83521556854248, "global_step": 202557, "epoch": 1205} {"train_loss": -10.746707916259766, "global_step": 202558, "epoch": 1205} {"train_loss": -11.115171432495117, "global_step": 202559, "epoch": 1205} {"train_loss": -10.920320510864258, "global_step": 202560, "epoch": 1205} {"train_loss": -11.188823699951172, "global_step": 202561, "epoch": 1205} {"train_loss": -10.862960815429688, "global_step": 202562, "epoch": 1205} {"train_loss": -11.02640438079834, "global_step": 202563, "epoch": 1205} {"train_loss": -11.486425399780273, "global_step": 202564, "epoch": 1205} {"train_loss": -11.106873512268066, "global_step": 202565, "epoch": 1205} {"train_loss": -11.052767753601074, "global_step": 202566, "epoch": 1205} {"train_loss": -11.306485176086426, "global_step": 202567, "epoch": 1205} {"train_loss": -11.344207763671875, "global_step": 202568, "epoch": 1205} {"train_loss": -11.209468841552734, "global_step": 202569, "epoch": 1205} {"train_loss": -11.411642074584961, "global_step": 202570, "epoch": 1205} {"train_loss": -11.303522109985352, "global_step": 202571, "epoch": 1205} {"train_loss": -11.40301513671875, "global_step": 202572, "epoch": 1205} {"train_loss": -11.32689094543457, "global_step": 202573, "epoch": 1205} {"train_loss": -11.413686752319336, "global_step": 202574, "epoch": 1205} {"train_loss": -11.457401275634766, "global_step": 202575, "epoch": 1205} {"train_loss": -11.472953796386719, "global_step": 202576, "epoch": 1205} {"train_loss": -11.30942153930664, "global_step": 202577, "epoch": 1205} {"train_loss": -11.606399536132812, "global_step": 202578, "epoch": 1205} {"train_loss": -11.443814277648926, "global_step": 202579, "epoch": 1205} {"train_loss": -11.503351211547852, "global_step": 202580, "epoch": 1205} {"train_loss": -11.516072273254395, "global_step": 202581, "epoch": 1205} {"train_loss": -11.640253067016602, "global_step": 202582, "epoch": 1205} {"train_loss": -11.472360610961914, "global_step": 202583, "epoch": 1205} {"train_loss": -11.482717514038086, "global_step": 202584, "epoch": 1205} {"train_loss": -11.619142532348633, "global_step": 202585, "epoch": 1205} {"train_loss": -11.407485008239746, "global_step": 202586, "epoch": 1205} {"train_loss": -11.58437728881836, "global_step": 202587, "epoch": 1205} {"train_loss": -11.536933898925781, "global_step": 202588, "epoch": 1205} {"train_loss": -11.418330192565918, "global_step": 202589, "epoch": 1205} {"train_loss": -11.469976425170898, "global_step": 202590, "epoch": 1205} {"train_loss": -11.305160522460938, "global_step": 202591, "epoch": 1205} {"train_loss": -11.415475845336914, "global_step": 202592, "epoch": 1205} {"train_loss": -11.274044036865234, "global_step": 202593, "epoch": 1205} {"train_loss": -11.30467414855957, "global_step": 202594, "epoch": 1205} {"train_loss": -10.361790657043457, "global_step": 202595, "epoch": 1205} {"train_loss": -11.220998764038086, "global_step": 202596, "epoch": 1205} {"train_loss": -11.046881675720215, "global_step": 202597, "epoch": 1205} {"train_loss": -10.987934112548828, "global_step": 202598, "epoch": 1205} {"train_loss": -11.073965072631836, "global_step": 202599, "epoch": 1205} {"train_loss": -10.984308242797852, "global_step": 202600, "epoch": 1205} {"train_loss": -11.499153137207031, "global_step": 202601, "epoch": 1205} {"train_loss": -10.8024263381958, "global_step": 202602, "epoch": 1205} {"train_loss": -11.448110580444336, "global_step": 202603, "epoch": 1205} {"train_loss": -10.81316089630127, "global_step": 202604, "epoch": 1205} {"train_loss": -11.300525665283203, "global_step": 202605, "epoch": 1205} {"train_loss": -10.861560821533203, "global_step": 202606, "epoch": 1205} {"train_loss": -11.204190316654387, "global_step": 202607, "epoch": 1205, "val_loss": 247607.5, "train_action_mse_error": 2.184370756149292} {"train_loss": -11.236234664916992, "global_step": 202608, "epoch": 1206} {"train_loss": -10.821038246154785, "global_step": 202609, "epoch": 1206} {"train_loss": -10.967375755310059, "global_step": 202610, "epoch": 1206} {"train_loss": -11.330646514892578, "global_step": 202611, "epoch": 1206} {"train_loss": -11.284134864807129, "global_step": 202612, "epoch": 1206} {"train_loss": -11.289621353149414, "global_step": 202613, "epoch": 1206} {"train_loss": -11.398113250732422, "global_step": 202614, "epoch": 1206} {"train_loss": -10.856468200683594, "global_step": 202615, "epoch": 1206} {"train_loss": -10.74698543548584, "global_step": 202616, "epoch": 1206} {"train_loss": -11.059488296508789, "global_step": 202617, "epoch": 1206} {"train_loss": -11.148859024047852, "global_step": 202618, "epoch": 1206} {"train_loss": -10.941469192504883, "global_step": 202619, "epoch": 1206} {"train_loss": -11.402868270874023, "global_step": 202620, "epoch": 1206} {"train_loss": -11.07132339477539, "global_step": 202621, "epoch": 1206} {"train_loss": -11.340238571166992, "global_step": 202622, "epoch": 1206} {"train_loss": -11.03144645690918, "global_step": 202623, "epoch": 1206} {"train_loss": -10.860921859741211, "global_step": 202624, "epoch": 1206} {"train_loss": -11.358352661132812, "global_step": 202625, "epoch": 1206} {"train_loss": -11.2577543258667, "global_step": 202626, "epoch": 1206} {"train_loss": -11.431011199951172, "global_step": 202627, "epoch": 1206} {"train_loss": -11.405933380126953, "global_step": 202628, "epoch": 1206} {"train_loss": -11.1359281539917, "global_step": 202629, "epoch": 1206} {"train_loss": -11.464337348937988, "global_step": 202630, "epoch": 1206} {"train_loss": -11.142982482910156, "global_step": 202631, "epoch": 1206} {"train_loss": -11.537942886352539, "global_step": 202632, "epoch": 1206} {"train_loss": -11.285178184509277, "global_step": 202633, "epoch": 1206} {"train_loss": -11.465425491333008, "global_step": 202634, "epoch": 1206} {"train_loss": -11.500190734863281, "global_step": 202635, "epoch": 1206} {"train_loss": -11.241253852844238, "global_step": 202636, "epoch": 1206} {"train_loss": -11.721410751342773, "global_step": 202637, "epoch": 1206} {"train_loss": -11.437355995178223, "global_step": 202638, "epoch": 1206} {"train_loss": -11.398401260375977, "global_step": 202639, "epoch": 1206} {"train_loss": -11.430803298950195, "global_step": 202640, "epoch": 1206} {"train_loss": -11.36246109008789, "global_step": 202641, "epoch": 1206} {"train_loss": -11.543328285217285, "global_step": 202642, "epoch": 1206} {"train_loss": -11.454575538635254, "global_step": 202643, "epoch": 1206} {"train_loss": -11.515323638916016, "global_step": 202644, "epoch": 1206} {"train_loss": -11.34521484375, "global_step": 202645, "epoch": 1206} {"train_loss": -11.432193756103516, "global_step": 202646, "epoch": 1206} {"train_loss": -11.442365646362305, "global_step": 202647, "epoch": 1206} {"train_loss": -11.338687896728516, "global_step": 202648, "epoch": 1206} {"train_loss": -11.170492172241211, "global_step": 202649, "epoch": 1206} {"train_loss": -11.43079948425293, "global_step": 202650, "epoch": 1206} {"train_loss": -11.22072982788086, "global_step": 202651, "epoch": 1206} {"train_loss": -11.556917190551758, "global_step": 202652, "epoch": 1206} {"train_loss": -11.355066299438477, "global_step": 202653, "epoch": 1206} {"train_loss": -11.594764709472656, "global_step": 202654, "epoch": 1206} {"train_loss": -11.234010696411133, "global_step": 202655, "epoch": 1206} {"train_loss": -11.65158748626709, "global_step": 202656, "epoch": 1206} {"train_loss": -11.117856979370117, "global_step": 202657, "epoch": 1206} {"train_loss": -11.390077590942383, "global_step": 202658, "epoch": 1206} {"train_loss": -11.012054443359375, "global_step": 202659, "epoch": 1206} {"train_loss": -11.373714447021484, "global_step": 202660, "epoch": 1206} {"train_loss": -11.168171882629395, "global_step": 202661, "epoch": 1206} {"train_loss": -10.404624938964844, "global_step": 202662, "epoch": 1206} {"train_loss": -11.37328815460205, "global_step": 202663, "epoch": 1206} {"train_loss": -10.814213752746582, "global_step": 202664, "epoch": 1206} {"train_loss": -11.056324005126953, "global_step": 202665, "epoch": 1206} {"train_loss": -11.214349746704102, "global_step": 202666, "epoch": 1206} {"train_loss": -10.816068649291992, "global_step": 202667, "epoch": 1206} {"train_loss": -10.929800987243652, "global_step": 202668, "epoch": 1206} {"train_loss": -10.656059265136719, "global_step": 202669, "epoch": 1206} {"train_loss": -10.455435752868652, "global_step": 202670, "epoch": 1206} {"train_loss": -10.797033309936523, "global_step": 202671, "epoch": 1206} {"train_loss": -10.504664421081543, "global_step": 202672, "epoch": 1206} {"train_loss": -10.949941635131836, "global_step": 202673, "epoch": 1206} {"train_loss": -10.777860641479492, "global_step": 202674, "epoch": 1206} {"train_loss": -10.691834449768066, "global_step": 202675, "epoch": 1206} {"train_loss": -10.34000015258789, "global_step": 202676, "epoch": 1206} {"train_loss": -10.227298736572266, "global_step": 202677, "epoch": 1206} {"train_loss": -10.84396743774414, "global_step": 202678, "epoch": 1206} {"train_loss": -10.618790626525879, "global_step": 202679, "epoch": 1206} {"train_loss": -10.629100799560547, "global_step": 202680, "epoch": 1206} {"train_loss": -10.830580711364746, "global_step": 202681, "epoch": 1206} {"train_loss": -11.126026153564453, "global_step": 202682, "epoch": 1206} {"train_loss": -10.951034545898438, "global_step": 202683, "epoch": 1206} {"train_loss": -10.96295166015625, "global_step": 202684, "epoch": 1206} {"train_loss": -10.414863586425781, "global_step": 202685, "epoch": 1206} {"train_loss": -11.02554702758789, "global_step": 202686, "epoch": 1206} {"train_loss": -10.909259796142578, "global_step": 202687, "epoch": 1206} {"train_loss": -10.990720748901367, "global_step": 202688, "epoch": 1206} {"train_loss": -10.935625076293945, "global_step": 202689, "epoch": 1206} {"train_loss": -10.932605743408203, "global_step": 202690, "epoch": 1206} {"train_loss": -10.634763717651367, "global_step": 202691, "epoch": 1206} {"train_loss": -11.045793533325195, "global_step": 202692, "epoch": 1206} {"train_loss": -11.018768310546875, "global_step": 202693, "epoch": 1206} {"train_loss": -11.265570640563965, "global_step": 202694, "epoch": 1206} {"train_loss": -11.205704689025879, "global_step": 202695, "epoch": 1206} {"train_loss": -11.389128684997559, "global_step": 202696, "epoch": 1206} {"train_loss": -11.324318885803223, "global_step": 202697, "epoch": 1206} {"train_loss": -11.40811824798584, "global_step": 202698, "epoch": 1206} {"train_loss": -11.446981430053711, "global_step": 202699, "epoch": 1206} {"train_loss": -11.233787536621094, "global_step": 202700, "epoch": 1206} {"train_loss": -11.584917068481445, "global_step": 202701, "epoch": 1206} {"train_loss": -11.129400253295898, "global_step": 202702, "epoch": 1206} {"train_loss": -11.47564697265625, "global_step": 202703, "epoch": 1206} {"train_loss": -11.569757461547852, "global_step": 202704, "epoch": 1206} {"train_loss": -11.667795181274414, "global_step": 202705, "epoch": 1206} {"train_loss": -11.107002258300781, "global_step": 202706, "epoch": 1206} {"train_loss": -11.40180778503418, "global_step": 202707, "epoch": 1206} {"train_loss": -11.339641571044922, "global_step": 202708, "epoch": 1206} {"train_loss": -11.300539016723633, "global_step": 202709, "epoch": 1206} {"train_loss": -11.536401748657227, "global_step": 202710, "epoch": 1206} {"train_loss": -11.275703430175781, "global_step": 202711, "epoch": 1206} {"train_loss": -11.310415267944336, "global_step": 202712, "epoch": 1206} {"train_loss": -11.50906753540039, "global_step": 202713, "epoch": 1206} {"train_loss": -11.437314987182617, "global_step": 202714, "epoch": 1206} {"train_loss": -11.53791618347168, "global_step": 202715, "epoch": 1206} {"train_loss": -11.254612922668457, "global_step": 202716, "epoch": 1206} {"train_loss": -11.427370071411133, "global_step": 202717, "epoch": 1206} {"train_loss": -11.106910705566406, "global_step": 202718, "epoch": 1206} {"train_loss": -11.388154983520508, "global_step": 202719, "epoch": 1206} {"train_loss": -11.239227294921875, "global_step": 202720, "epoch": 1206} {"train_loss": -11.381526947021484, "global_step": 202721, "epoch": 1206} {"train_loss": -11.340633392333984, "global_step": 202722, "epoch": 1206} {"train_loss": -11.317020416259766, "global_step": 202723, "epoch": 1206} {"train_loss": -11.356759071350098, "global_step": 202724, "epoch": 1206} {"train_loss": -11.339641571044922, "global_step": 202725, "epoch": 1206} {"train_loss": -11.54200553894043, "global_step": 202726, "epoch": 1206} {"train_loss": -11.530118942260742, "global_step": 202727, "epoch": 1206} {"train_loss": -10.998611450195312, "global_step": 202728, "epoch": 1206} {"train_loss": -11.806697845458984, "global_step": 202729, "epoch": 1206} {"train_loss": -11.208234786987305, "global_step": 202730, "epoch": 1206} {"train_loss": -11.316325187683105, "global_step": 202731, "epoch": 1206} {"train_loss": -11.638399124145508, "global_step": 202732, "epoch": 1206} {"train_loss": -10.896041870117188, "global_step": 202733, "epoch": 1206} {"train_loss": -11.320318222045898, "global_step": 202734, "epoch": 1206} {"train_loss": -11.424667358398438, "global_step": 202735, "epoch": 1206} {"train_loss": -11.233259201049805, "global_step": 202736, "epoch": 1206} {"train_loss": -11.711746215820312, "global_step": 202737, "epoch": 1206} {"train_loss": -11.330375671386719, "global_step": 202738, "epoch": 1206} {"train_loss": -11.349752426147461, "global_step": 202739, "epoch": 1206} {"train_loss": -11.190446853637695, "global_step": 202740, "epoch": 1206} {"train_loss": -11.46494197845459, "global_step": 202741, "epoch": 1206} {"train_loss": -11.14413833618164, "global_step": 202742, "epoch": 1206} {"train_loss": -11.323186874389648, "global_step": 202743, "epoch": 1206} {"train_loss": -11.21176528930664, "global_step": 202744, "epoch": 1206} {"train_loss": -11.146142959594727, "global_step": 202745, "epoch": 1206} {"train_loss": -11.408313751220703, "global_step": 202746, "epoch": 1206} {"train_loss": -11.356374740600586, "global_step": 202747, "epoch": 1206} {"train_loss": -11.701833724975586, "global_step": 202748, "epoch": 1206} {"train_loss": -11.175745010375977, "global_step": 202749, "epoch": 1206} {"train_loss": -11.242584228515625, "global_step": 202750, "epoch": 1206} {"train_loss": -11.394906044006348, "global_step": 202751, "epoch": 1206} {"train_loss": -11.29509162902832, "global_step": 202752, "epoch": 1206} {"train_loss": -11.320457458496094, "global_step": 202753, "epoch": 1206} {"train_loss": -11.714159965515137, "global_step": 202754, "epoch": 1206} {"train_loss": -11.25339126586914, "global_step": 202755, "epoch": 1206} {"train_loss": -11.698189735412598, "global_step": 202756, "epoch": 1206} {"train_loss": -11.480945587158203, "global_step": 202757, "epoch": 1206} {"train_loss": -11.701740264892578, "global_step": 202758, "epoch": 1206} {"train_loss": -11.512033462524414, "global_step": 202759, "epoch": 1206} {"train_loss": -11.27491569519043, "global_step": 202760, "epoch": 1206} {"train_loss": -11.619905471801758, "global_step": 202761, "epoch": 1206} {"train_loss": -11.1448974609375, "global_step": 202762, "epoch": 1206} {"train_loss": -11.304230690002441, "global_step": 202763, "epoch": 1206} {"train_loss": -11.280628204345703, "global_step": 202764, "epoch": 1206} {"train_loss": -11.567544937133789, "global_step": 202765, "epoch": 1206} {"train_loss": -11.475892066955566, "global_step": 202766, "epoch": 1206} {"train_loss": -11.383966445922852, "global_step": 202767, "epoch": 1206} {"train_loss": -11.55473518371582, "global_step": 202768, "epoch": 1206} {"train_loss": -11.577762603759766, "global_step": 202769, "epoch": 1206} {"train_loss": -11.565350532531738, "global_step": 202770, "epoch": 1206} {"train_loss": -11.497099876403809, "global_step": 202771, "epoch": 1206} {"train_loss": -11.470576286315918, "global_step": 202772, "epoch": 1206} {"train_loss": -11.40269660949707, "global_step": 202773, "epoch": 1206} {"train_loss": -11.395620346069336, "global_step": 202774, "epoch": 1206} {"train_loss": -11.237992411568051, "global_step": 202775, "epoch": 1206, "val_loss": 247830.578125} {"train_loss": -11.431849479675293, "global_step": 202776, "epoch": 1207} {"train_loss": -10.598329544067383, "global_step": 202777, "epoch": 1207} {"train_loss": -11.544425964355469, "global_step": 202778, "epoch": 1207} {"train_loss": -10.578315734863281, "global_step": 202779, "epoch": 1207} {"train_loss": -11.008435249328613, "global_step": 202780, "epoch": 1207} {"train_loss": -11.081220626831055, "global_step": 202781, "epoch": 1207} {"train_loss": -10.875840187072754, "global_step": 202782, "epoch": 1207} {"train_loss": -10.843367576599121, "global_step": 202783, "epoch": 1207} {"train_loss": -11.444160461425781, "global_step": 202784, "epoch": 1207} {"train_loss": -11.028593063354492, "global_step": 202785, "epoch": 1207} {"train_loss": -10.91657829284668, "global_step": 202786, "epoch": 1207} {"train_loss": -11.689952850341797, "global_step": 202787, "epoch": 1207} {"train_loss": -10.954387664794922, "global_step": 202788, "epoch": 1207} {"train_loss": -11.441818237304688, "global_step": 202789, "epoch": 1207} {"train_loss": -11.417863845825195, "global_step": 202790, "epoch": 1207} {"train_loss": -11.16707706451416, "global_step": 202791, "epoch": 1207} {"train_loss": -11.601741790771484, "global_step": 202792, "epoch": 1207} {"train_loss": -11.274429321289062, "global_step": 202793, "epoch": 1207} {"train_loss": -11.293163299560547, "global_step": 202794, "epoch": 1207} {"train_loss": -11.012162208557129, "global_step": 202795, "epoch": 1207} {"train_loss": -11.314861297607422, "global_step": 202796, "epoch": 1207} {"train_loss": -11.123876571655273, "global_step": 202797, "epoch": 1207} {"train_loss": -11.496322631835938, "global_step": 202798, "epoch": 1207} {"train_loss": -11.124579429626465, "global_step": 202799, "epoch": 1207} {"train_loss": -11.584980010986328, "global_step": 202800, "epoch": 1207} {"train_loss": -11.051154136657715, "global_step": 202801, "epoch": 1207} {"train_loss": -11.40172290802002, "global_step": 202802, "epoch": 1207} {"train_loss": -11.090656280517578, "global_step": 202803, "epoch": 1207} {"train_loss": -11.225257873535156, "global_step": 202804, "epoch": 1207} {"train_loss": -11.007625579833984, "global_step": 202805, "epoch": 1207} {"train_loss": -11.370616912841797, "global_step": 202806, "epoch": 1207} {"train_loss": -11.386553764343262, "global_step": 202807, "epoch": 1207} {"train_loss": -11.24434757232666, "global_step": 202808, "epoch": 1207} {"train_loss": -11.307417869567871, "global_step": 202809, "epoch": 1207} {"train_loss": -10.869100570678711, "global_step": 202810, "epoch": 1207} {"train_loss": -11.480523109436035, "global_step": 202811, "epoch": 1207} {"train_loss": -11.328401565551758, "global_step": 202812, "epoch": 1207} {"train_loss": -11.077421188354492, "global_step": 202813, "epoch": 1207} {"train_loss": -11.04494857788086, "global_step": 202814, "epoch": 1207} {"train_loss": -11.440078735351562, "global_step": 202815, "epoch": 1207} {"train_loss": -11.162263870239258, "global_step": 202816, "epoch": 1207} {"train_loss": -11.148214340209961, "global_step": 202817, "epoch": 1207} {"train_loss": -11.361385345458984, "global_step": 202818, "epoch": 1207} {"train_loss": -11.130073547363281, "global_step": 202819, "epoch": 1207} {"train_loss": -11.498027801513672, "global_step": 202820, "epoch": 1207} {"train_loss": -11.242548942565918, "global_step": 202821, "epoch": 1207} {"train_loss": -11.37871265411377, "global_step": 202822, "epoch": 1207} {"train_loss": -10.999011993408203, "global_step": 202823, "epoch": 1207} {"train_loss": -11.447379112243652, "global_step": 202824, "epoch": 1207} {"train_loss": -11.184978485107422, "global_step": 202825, "epoch": 1207} {"train_loss": -11.204944610595703, "global_step": 202826, "epoch": 1207} {"train_loss": -11.544149398803711, "global_step": 202827, "epoch": 1207} {"train_loss": -11.280073165893555, "global_step": 202828, "epoch": 1207} {"train_loss": -11.402931213378906, "global_step": 202829, "epoch": 1207} {"train_loss": -11.419891357421875, "global_step": 202830, "epoch": 1207} {"train_loss": -11.263072967529297, "global_step": 202831, "epoch": 1207} {"train_loss": -11.51513671875, "global_step": 202832, "epoch": 1207} {"train_loss": -11.298563003540039, "global_step": 202833, "epoch": 1207} {"train_loss": -11.616805076599121, "global_step": 202834, "epoch": 1207} {"train_loss": -11.558334350585938, "global_step": 202835, "epoch": 1207} {"train_loss": -11.525230407714844, "global_step": 202836, "epoch": 1207} {"train_loss": -11.518226623535156, "global_step": 202837, "epoch": 1207} {"train_loss": -11.462272644042969, "global_step": 202838, "epoch": 1207} {"train_loss": -11.386322021484375, "global_step": 202839, "epoch": 1207} {"train_loss": -11.51157283782959, "global_step": 202840, "epoch": 1207} {"train_loss": -11.472500801086426, "global_step": 202841, "epoch": 1207} {"train_loss": -11.360962867736816, "global_step": 202842, "epoch": 1207} {"train_loss": -11.358926773071289, "global_step": 202843, "epoch": 1207} {"train_loss": -11.418049812316895, "global_step": 202844, "epoch": 1207} {"train_loss": -11.313470840454102, "global_step": 202845, "epoch": 1207} {"train_loss": -11.38713550567627, "global_step": 202846, "epoch": 1207} {"train_loss": -11.845975875854492, "global_step": 202847, "epoch": 1207} {"train_loss": -11.405876159667969, "global_step": 202848, "epoch": 1207} {"train_loss": -11.517913818359375, "global_step": 202849, "epoch": 1207} {"train_loss": -11.766111373901367, "global_step": 202850, "epoch": 1207} {"train_loss": -11.687222480773926, "global_step": 202851, "epoch": 1207} {"train_loss": -11.763172149658203, "global_step": 202852, "epoch": 1207} {"train_loss": -11.444820404052734, "global_step": 202853, "epoch": 1207} {"train_loss": -11.36884880065918, "global_step": 202854, "epoch": 1207} {"train_loss": -11.629429817199707, "global_step": 202855, "epoch": 1207} {"train_loss": -11.690071105957031, "global_step": 202856, "epoch": 1207} {"train_loss": -11.605301856994629, "global_step": 202857, "epoch": 1207} {"train_loss": -11.774431228637695, "global_step": 202858, "epoch": 1207} {"train_loss": -11.48876953125, "global_step": 202859, "epoch": 1207} {"train_loss": -11.622997283935547, "global_step": 202860, "epoch": 1207} {"train_loss": -11.769149780273438, "global_step": 202861, "epoch": 1207} {"train_loss": -11.645772933959961, "global_step": 202862, "epoch": 1207} {"train_loss": -11.707647323608398, "global_step": 202863, "epoch": 1207} {"train_loss": -11.699213027954102, "global_step": 202864, "epoch": 1207} {"train_loss": -11.598966598510742, "global_step": 202865, "epoch": 1207} {"train_loss": -11.655499458312988, "global_step": 202866, "epoch": 1207} {"train_loss": -11.802526473999023, "global_step": 202867, "epoch": 1207} {"train_loss": -11.636236190795898, "global_step": 202868, "epoch": 1207} {"train_loss": -11.781989097595215, "global_step": 202869, "epoch": 1207} {"train_loss": -11.74402141571045, "global_step": 202870, "epoch": 1207} {"train_loss": -11.849414825439453, "global_step": 202871, "epoch": 1207} {"train_loss": -11.680669784545898, "global_step": 202872, "epoch": 1207} {"train_loss": -11.48369026184082, "global_step": 202873, "epoch": 1207} {"train_loss": -11.462697982788086, "global_step": 202874, "epoch": 1207} {"train_loss": -11.54299545288086, "global_step": 202875, "epoch": 1207} {"train_loss": -11.262504577636719, "global_step": 202876, "epoch": 1207} {"train_loss": -11.48029899597168, "global_step": 202877, "epoch": 1207} {"train_loss": -11.083318710327148, "global_step": 202878, "epoch": 1207} {"train_loss": -11.006692886352539, "global_step": 202879, "epoch": 1207} {"train_loss": -10.642916679382324, "global_step": 202880, "epoch": 1207} {"train_loss": -11.830862045288086, "global_step": 202881, "epoch": 1207} {"train_loss": -9.980697631835938, "global_step": 202882, "epoch": 1207} {"train_loss": -10.182511329650879, "global_step": 202883, "epoch": 1207} {"train_loss": -9.81096076965332, "global_step": 202884, "epoch": 1207} {"train_loss": -10.62944221496582, "global_step": 202885, "epoch": 1207} {"train_loss": -10.728034973144531, "global_step": 202886, "epoch": 1207} {"train_loss": -11.262592315673828, "global_step": 202887, "epoch": 1207} {"train_loss": -10.863729476928711, "global_step": 202888, "epoch": 1207} {"train_loss": -11.736503601074219, "global_step": 202889, "epoch": 1207} {"train_loss": -11.182962417602539, "global_step": 202890, "epoch": 1207} {"train_loss": -11.13867473602295, "global_step": 202891, "epoch": 1207} {"train_loss": -11.188915252685547, "global_step": 202892, "epoch": 1207} {"train_loss": -11.296005249023438, "global_step": 202893, "epoch": 1207} {"train_loss": -10.658285140991211, "global_step": 202894, "epoch": 1207} {"train_loss": -11.171134948730469, "global_step": 202895, "epoch": 1207} {"train_loss": -10.638385772705078, "global_step": 202896, "epoch": 1207} {"train_loss": -10.551464080810547, "global_step": 202897, "epoch": 1207} {"train_loss": -11.394222259521484, "global_step": 202898, "epoch": 1207} {"train_loss": -11.04791259765625, "global_step": 202899, "epoch": 1207} {"train_loss": -11.381682395935059, "global_step": 202900, "epoch": 1207} {"train_loss": -11.44471549987793, "global_step": 202901, "epoch": 1207} {"train_loss": -11.329843521118164, "global_step": 202902, "epoch": 1207} {"train_loss": -11.509319305419922, "global_step": 202903, "epoch": 1207} {"train_loss": -11.50730037689209, "global_step": 202904, "epoch": 1207} {"train_loss": -11.621448516845703, "global_step": 202905, "epoch": 1207} {"train_loss": -11.56552791595459, "global_step": 202906, "epoch": 1207} {"train_loss": -11.598381996154785, "global_step": 202907, "epoch": 1207} {"train_loss": -11.679664611816406, "global_step": 202908, "epoch": 1207} {"train_loss": -11.334022521972656, "global_step": 202909, "epoch": 1207} {"train_loss": -11.591854095458984, "global_step": 202910, "epoch": 1207} {"train_loss": -11.392374038696289, "global_step": 202911, "epoch": 1207} {"train_loss": -11.509727478027344, "global_step": 202912, "epoch": 1207} {"train_loss": -11.569887161254883, "global_step": 202913, "epoch": 1207} {"train_loss": -11.608631134033203, "global_step": 202914, "epoch": 1207} {"train_loss": -11.252237319946289, "global_step": 202915, "epoch": 1207} {"train_loss": -11.71377944946289, "global_step": 202916, "epoch": 1207} {"train_loss": -11.529535293579102, "global_step": 202917, "epoch": 1207} {"train_loss": -11.470843315124512, "global_step": 202918, "epoch": 1207} {"train_loss": -11.65638256072998, "global_step": 202919, "epoch": 1207} {"train_loss": -11.077234268188477, "global_step": 202920, "epoch": 1207} {"train_loss": -11.370182037353516, "global_step": 202921, "epoch": 1207} {"train_loss": -10.869601249694824, "global_step": 202922, "epoch": 1207} {"train_loss": -10.045504570007324, "global_step": 202923, "epoch": 1207} {"train_loss": -10.134181022644043, "global_step": 202924, "epoch": 1207} {"train_loss": -11.202409744262695, "global_step": 202925, "epoch": 1207} {"train_loss": -9.832082748413086, "global_step": 202926, "epoch": 1207} {"train_loss": -11.478799819946289, "global_step": 202927, "epoch": 1207} {"train_loss": -10.366255760192871, "global_step": 202928, "epoch": 1207} {"train_loss": -11.139015197753906, "global_step": 202929, "epoch": 1207} {"train_loss": -11.23406982421875, "global_step": 202930, "epoch": 1207} {"train_loss": -11.3860502243042, "global_step": 202931, "epoch": 1207} {"train_loss": -11.4585599899292, "global_step": 202932, "epoch": 1207} {"train_loss": -11.211745262145996, "global_step": 202933, "epoch": 1207} {"train_loss": -11.376802444458008, "global_step": 202934, "epoch": 1207} {"train_loss": -11.425586700439453, "global_step": 202935, "epoch": 1207} {"train_loss": -11.092111587524414, "global_step": 202936, "epoch": 1207} {"train_loss": -11.254300117492676, "global_step": 202937, "epoch": 1207} {"train_loss": -11.118715286254883, "global_step": 202938, "epoch": 1207} {"train_loss": -11.73551082611084, "global_step": 202939, "epoch": 1207} {"train_loss": -11.015380859375, "global_step": 202940, "epoch": 1207} {"train_loss": -11.16893482208252, "global_step": 202941, "epoch": 1207} {"train_loss": -11.392913818359375, "global_step": 202942, "epoch": 1207} {"train_loss": -11.289554238319397, "global_step": 202943, "epoch": 1207, "val_loss": 251160.828125} {"train_loss": -11.466135025024414, "global_step": 202944, "epoch": 1208} {"train_loss": -11.37631893157959, "global_step": 202945, "epoch": 1208} {"train_loss": -11.177169799804688, "global_step": 202946, "epoch": 1208} {"train_loss": -11.46422004699707, "global_step": 202947, "epoch": 1208} {"train_loss": -11.249099731445312, "global_step": 202948, "epoch": 1208} {"train_loss": -11.456852912902832, "global_step": 202949, "epoch": 1208} {"train_loss": -11.336122512817383, "global_step": 202950, "epoch": 1208} {"train_loss": -11.37394905090332, "global_step": 202951, "epoch": 1208} {"train_loss": -11.139244079589844, "global_step": 202952, "epoch": 1208} {"train_loss": -11.353353500366211, "global_step": 202953, "epoch": 1208} {"train_loss": -11.161184310913086, "global_step": 202954, "epoch": 1208} {"train_loss": -11.397733688354492, "global_step": 202955, "epoch": 1208} {"train_loss": -11.14425277709961, "global_step": 202956, "epoch": 1208} {"train_loss": -11.513517379760742, "global_step": 202957, "epoch": 1208} {"train_loss": -11.743267059326172, "global_step": 202958, "epoch": 1208} {"train_loss": -11.62844467163086, "global_step": 202959, "epoch": 1208} {"train_loss": -11.473793029785156, "global_step": 202960, "epoch": 1208} {"train_loss": -11.654476165771484, "global_step": 202961, "epoch": 1208} {"train_loss": -11.750158309936523, "global_step": 202962, "epoch": 1208} {"train_loss": -11.607585906982422, "global_step": 202963, "epoch": 1208} {"train_loss": -11.387187957763672, "global_step": 202964, "epoch": 1208} {"train_loss": -11.3954439163208, "global_step": 202965, "epoch": 1208} {"train_loss": -11.529303550720215, "global_step": 202966, "epoch": 1208} {"train_loss": -11.479249000549316, "global_step": 202967, "epoch": 1208} {"train_loss": -11.556439399719238, "global_step": 202968, "epoch": 1208} {"train_loss": -11.669647216796875, "global_step": 202969, "epoch": 1208} {"train_loss": -11.817526817321777, "global_step": 202970, "epoch": 1208} {"train_loss": -11.646698951721191, "global_step": 202971, "epoch": 1208} {"train_loss": -11.796565055847168, "global_step": 202972, "epoch": 1208} {"train_loss": -11.65918254852295, "global_step": 202973, "epoch": 1208} {"train_loss": -11.59016227722168, "global_step": 202974, "epoch": 1208} {"train_loss": -11.630867958068848, "global_step": 202975, "epoch": 1208} {"train_loss": -11.833110809326172, "global_step": 202976, "epoch": 1208} {"train_loss": -11.684322357177734, "global_step": 202977, "epoch": 1208} {"train_loss": -11.789190292358398, "global_step": 202978, "epoch": 1208} {"train_loss": -11.645267486572266, "global_step": 202979, "epoch": 1208} {"train_loss": -12.020580291748047, "global_step": 202980, "epoch": 1208} {"train_loss": -11.724257469177246, "global_step": 202981, "epoch": 1208} {"train_loss": -11.74476432800293, "global_step": 202982, "epoch": 1208} {"train_loss": -11.923846244812012, "global_step": 202983, "epoch": 1208} {"train_loss": -11.711197853088379, "global_step": 202984, "epoch": 1208} {"train_loss": -11.628402709960938, "global_step": 202985, "epoch": 1208} {"train_loss": -11.814569473266602, "global_step": 202986, "epoch": 1208} {"train_loss": -11.844436645507812, "global_step": 202987, "epoch": 1208} {"train_loss": -11.589262962341309, "global_step": 202988, "epoch": 1208} {"train_loss": -11.414093017578125, "global_step": 202989, "epoch": 1208} {"train_loss": -11.520809173583984, "global_step": 202990, "epoch": 1208} {"train_loss": -11.380470275878906, "global_step": 202991, "epoch": 1208} {"train_loss": -11.376751899719238, "global_step": 202992, "epoch": 1208} {"train_loss": -11.90069580078125, "global_step": 202993, "epoch": 1208} {"train_loss": -10.925569534301758, "global_step": 202994, "epoch": 1208} {"train_loss": -10.984857559204102, "global_step": 202995, "epoch": 1208} {"train_loss": -11.316113471984863, "global_step": 202996, "epoch": 1208} {"train_loss": -11.55893325805664, "global_step": 202997, "epoch": 1208} {"train_loss": -11.12077808380127, "global_step": 202998, "epoch": 1208} {"train_loss": -11.422469139099121, "global_step": 202999, "epoch": 1208} {"train_loss": -11.676656723022461, "global_step": 203000, "epoch": 1208} {"train_loss": -10.78537368774414, "global_step": 203001, "epoch": 1208} {"train_loss": -10.783496856689453, "global_step": 203002, "epoch": 1208} {"train_loss": -11.211596488952637, "global_step": 203003, "epoch": 1208} {"train_loss": -11.06554126739502, "global_step": 203004, "epoch": 1208} {"train_loss": -10.389078140258789, "global_step": 203005, "epoch": 1208} {"train_loss": -10.170984268188477, "global_step": 203006, "epoch": 1208} {"train_loss": -10.326364517211914, "global_step": 203007, "epoch": 1208} {"train_loss": -8.759820938110352, "global_step": 203008, "epoch": 1208} {"train_loss": -9.321407318115234, "global_step": 203009, "epoch": 1208} {"train_loss": -9.356969833374023, "global_step": 203010, "epoch": 1208} {"train_loss": -7.677952289581299, "global_step": 203011, "epoch": 1208} {"train_loss": -8.808944702148438, "global_step": 203012, "epoch": 1208} {"train_loss": -9.400071144104004, "global_step": 203013, "epoch": 1208} {"train_loss": -8.490882873535156, "global_step": 203014, "epoch": 1208} {"train_loss": -8.82278060913086, "global_step": 203015, "epoch": 1208} {"train_loss": -9.187994956970215, "global_step": 203016, "epoch": 1208} {"train_loss": -8.84325122833252, "global_step": 203017, "epoch": 1208} {"train_loss": -6.128934383392334, "global_step": 203018, "epoch": 1208} {"train_loss": -6.393570423126221, "global_step": 203019, "epoch": 1208} {"train_loss": -6.832113742828369, "global_step": 203020, "epoch": 1208} {"train_loss": -6.698488235473633, "global_step": 203021, "epoch": 1208} {"train_loss": -7.178323745727539, "global_step": 203022, "epoch": 1208} {"train_loss": -7.179538249969482, "global_step": 203023, "epoch": 1208} {"train_loss": -9.635866165161133, "global_step": 203024, "epoch": 1208} {"train_loss": -7.527735233306885, "global_step": 203025, "epoch": 1208} {"train_loss": -8.059197425842285, "global_step": 203026, "epoch": 1208} {"train_loss": -10.061807632446289, "global_step": 203027, "epoch": 1208} {"train_loss": -9.98034381866455, "global_step": 203028, "epoch": 1208} {"train_loss": -9.334537506103516, "global_step": 203029, "epoch": 1208} {"train_loss": -8.683886528015137, "global_step": 203030, "epoch": 1208} {"train_loss": -10.321502685546875, "global_step": 203031, "epoch": 1208} {"train_loss": -9.580774307250977, "global_step": 203032, "epoch": 1208} {"train_loss": -9.37623405456543, "global_step": 203033, "epoch": 1208} {"train_loss": -9.867769241333008, "global_step": 203034, "epoch": 1208} {"train_loss": -10.281301498413086, "global_step": 203035, "epoch": 1208} {"train_loss": -9.64475154876709, "global_step": 203036, "epoch": 1208} {"train_loss": -9.643928527832031, "global_step": 203037, "epoch": 1208} {"train_loss": -10.529012680053711, "global_step": 203038, "epoch": 1208} {"train_loss": -10.560276985168457, "global_step": 203039, "epoch": 1208} {"train_loss": -10.367437362670898, "global_step": 203040, "epoch": 1208} {"train_loss": -10.6966552734375, "global_step": 203041, "epoch": 1208} {"train_loss": -10.470802307128906, "global_step": 203042, "epoch": 1208} {"train_loss": -10.570932388305664, "global_step": 203043, "epoch": 1208} {"train_loss": -10.572639465332031, "global_step": 203044, "epoch": 1208} {"train_loss": -10.444555282592773, "global_step": 203045, "epoch": 1208} {"train_loss": -10.465083122253418, "global_step": 203046, "epoch": 1208} {"train_loss": -10.50900650024414, "global_step": 203047, "epoch": 1208} {"train_loss": -10.467168807983398, "global_step": 203048, "epoch": 1208} {"train_loss": -10.65860366821289, "global_step": 203049, "epoch": 1208} {"train_loss": -10.7415771484375, "global_step": 203050, "epoch": 1208} {"train_loss": -10.617467880249023, "global_step": 203051, "epoch": 1208} {"train_loss": -10.912671089172363, "global_step": 203052, "epoch": 1208} {"train_loss": -10.882978439331055, "global_step": 203053, "epoch": 1208} {"train_loss": -10.646369934082031, "global_step": 203054, "epoch": 1208} {"train_loss": -10.751420021057129, "global_step": 203055, "epoch": 1208} {"train_loss": -10.632986068725586, "global_step": 203056, "epoch": 1208} {"train_loss": -10.906698226928711, "global_step": 203057, "epoch": 1208} {"train_loss": -11.061756134033203, "global_step": 203058, "epoch": 1208} {"train_loss": -10.702817916870117, "global_step": 203059, "epoch": 1208} {"train_loss": -10.986560821533203, "global_step": 203060, "epoch": 1208} {"train_loss": -10.917454719543457, "global_step": 203061, "epoch": 1208} {"train_loss": -10.931184768676758, "global_step": 203062, "epoch": 1208} {"train_loss": -10.904667854309082, "global_step": 203063, "epoch": 1208} {"train_loss": -10.987957000732422, "global_step": 203064, "epoch": 1208} {"train_loss": -10.843996047973633, "global_step": 203065, "epoch": 1208} {"train_loss": -11.01636791229248, "global_step": 203066, "epoch": 1208} {"train_loss": -11.118704795837402, "global_step": 203067, "epoch": 1208} {"train_loss": -11.186493873596191, "global_step": 203068, "epoch": 1208} {"train_loss": -11.23221206665039, "global_step": 203069, "epoch": 1208} {"train_loss": -11.175447463989258, "global_step": 203070, "epoch": 1208} {"train_loss": -11.077942848205566, "global_step": 203071, "epoch": 1208} {"train_loss": -11.225250244140625, "global_step": 203072, "epoch": 1208} {"train_loss": -11.17424201965332, "global_step": 203073, "epoch": 1208} {"train_loss": -11.21098518371582, "global_step": 203074, "epoch": 1208} {"train_loss": -11.155094146728516, "global_step": 203075, "epoch": 1208} {"train_loss": -11.438100814819336, "global_step": 203076, "epoch": 1208} {"train_loss": -11.201982498168945, "global_step": 203077, "epoch": 1208} {"train_loss": -11.324639320373535, "global_step": 203078, "epoch": 1208} {"train_loss": -11.253369331359863, "global_step": 203079, "epoch": 1208} {"train_loss": -11.467825889587402, "global_step": 203080, "epoch": 1208} {"train_loss": -11.31045913696289, "global_step": 203081, "epoch": 1208} {"train_loss": -11.38105583190918, "global_step": 203082, "epoch": 1208} {"train_loss": -11.546314239501953, "global_step": 203083, "epoch": 1208} {"train_loss": -11.378058433532715, "global_step": 203084, "epoch": 1208} {"train_loss": -11.417316436767578, "global_step": 203085, "epoch": 1208} {"train_loss": -11.414859771728516, "global_step": 203086, "epoch": 1208} {"train_loss": -11.54110336303711, "global_step": 203087, "epoch": 1208} {"train_loss": -11.322263717651367, "global_step": 203088, "epoch": 1208} {"train_loss": -11.426778793334961, "global_step": 203089, "epoch": 1208} {"train_loss": -11.619836807250977, "global_step": 203090, "epoch": 1208} {"train_loss": -11.67419147491455, "global_step": 203091, "epoch": 1208} {"train_loss": -11.525346755981445, "global_step": 203092, "epoch": 1208} {"train_loss": -11.536235809326172, "global_step": 203093, "epoch": 1208} {"train_loss": -11.666057586669922, "global_step": 203094, "epoch": 1208} {"train_loss": -11.621050834655762, "global_step": 203095, "epoch": 1208} {"train_loss": -11.601051330566406, "global_step": 203096, "epoch": 1208} {"train_loss": -11.557042121887207, "global_step": 203097, "epoch": 1208} {"train_loss": -11.740924835205078, "global_step": 203098, "epoch": 1208} {"train_loss": -11.482358932495117, "global_step": 203099, "epoch": 1208} {"train_loss": -11.603707313537598, "global_step": 203100, "epoch": 1208} {"train_loss": -11.648189544677734, "global_step": 203101, "epoch": 1208} {"train_loss": -11.545528411865234, "global_step": 203102, "epoch": 1208} {"train_loss": -11.689728736877441, "global_step": 203103, "epoch": 1208} {"train_loss": -11.73338508605957, "global_step": 203104, "epoch": 1208} {"train_loss": -11.712472915649414, "global_step": 203105, "epoch": 1208} {"train_loss": -11.691186904907227, "global_step": 203106, "epoch": 1208} {"train_loss": -11.73779582977295, "global_step": 203107, "epoch": 1208} {"train_loss": -11.658775329589844, "global_step": 203108, "epoch": 1208} {"train_loss": -11.657435417175293, "global_step": 203109, "epoch": 1208} {"train_loss": -11.78770637512207, "global_step": 203110, "epoch": 1208} {"train_loss": -10.831624945004782, "global_step": 203111, "epoch": 1208, "val_loss": 243932.921875} {"train_loss": -11.677978515625, "global_step": 203112, "epoch": 1209} {"train_loss": -11.915098190307617, "global_step": 203113, "epoch": 1209} {"train_loss": -11.56161880493164, "global_step": 203114, "epoch": 1209} {"train_loss": -11.845075607299805, "global_step": 203115, "epoch": 1209} {"train_loss": -11.695650100708008, "global_step": 203116, "epoch": 1209} {"train_loss": -11.372407913208008, "global_step": 203117, "epoch": 1209} {"train_loss": -11.758949279785156, "global_step": 203118, "epoch": 1209} {"train_loss": -11.6405668258667, "global_step": 203119, "epoch": 1209} {"train_loss": -11.649185180664062, "global_step": 203120, "epoch": 1209} {"train_loss": -11.853315353393555, "global_step": 203121, "epoch": 1209} {"train_loss": -11.658910751342773, "global_step": 203122, "epoch": 1209} {"train_loss": -11.652765274047852, "global_step": 203123, "epoch": 1209} {"train_loss": -11.941171646118164, "global_step": 203124, "epoch": 1209} {"train_loss": -11.580572128295898, "global_step": 203125, "epoch": 1209} {"train_loss": -11.899537086486816, "global_step": 203126, "epoch": 1209} {"train_loss": -12.087808609008789, "global_step": 203127, "epoch": 1209} {"train_loss": -11.592094421386719, "global_step": 203128, "epoch": 1209} {"train_loss": -11.942444801330566, "global_step": 203129, "epoch": 1209} {"train_loss": -11.625579833984375, "global_step": 203130, "epoch": 1209} {"train_loss": -11.587957382202148, "global_step": 203131, "epoch": 1209} {"train_loss": -11.302227020263672, "global_step": 203132, "epoch": 1209} {"train_loss": -11.697759628295898, "global_step": 203133, "epoch": 1209} {"train_loss": -11.364377975463867, "global_step": 203134, "epoch": 1209} {"train_loss": -11.23924446105957, "global_step": 203135, "epoch": 1209} {"train_loss": -11.13569450378418, "global_step": 203136, "epoch": 1209} {"train_loss": -11.123851776123047, "global_step": 203137, "epoch": 1209} {"train_loss": -11.38161849975586, "global_step": 203138, "epoch": 1209} {"train_loss": -11.959333419799805, "global_step": 203139, "epoch": 1209} {"train_loss": -11.297439575195312, "global_step": 203140, "epoch": 1209} {"train_loss": -11.39615249633789, "global_step": 203141, "epoch": 1209} {"train_loss": -11.403961181640625, "global_step": 203142, "epoch": 1209} {"train_loss": -10.63665771484375, "global_step": 203143, "epoch": 1209} {"train_loss": -9.611817359924316, "global_step": 203144, "epoch": 1209} {"train_loss": -9.093174934387207, "global_step": 203145, "epoch": 1209} {"train_loss": -7.799533367156982, "global_step": 203146, "epoch": 1209} {"train_loss": -9.115835189819336, "global_step": 203147, "epoch": 1209} {"train_loss": -10.179887771606445, "global_step": 203148, "epoch": 1209} {"train_loss": -6.828861236572266, "global_step": 203149, "epoch": 1209} {"train_loss": -10.78770637512207, "global_step": 203150, "epoch": 1209} {"train_loss": -5.367175102233887, "global_step": 203151, "epoch": 1209} {"train_loss": -9.050922393798828, "global_step": 203152, "epoch": 1209} {"train_loss": -9.499696731567383, "global_step": 203153, "epoch": 1209} {"train_loss": -9.917488098144531, "global_step": 203154, "epoch": 1209} {"train_loss": -8.798030853271484, "global_step": 203155, "epoch": 1209} {"train_loss": -9.62664794921875, "global_step": 203156, "epoch": 1209} {"train_loss": -8.345029830932617, "global_step": 203157, "epoch": 1209} {"train_loss": -9.34621810913086, "global_step": 203158, "epoch": 1209} {"train_loss": -9.536539077758789, "global_step": 203159, "epoch": 1209} {"train_loss": -10.33500862121582, "global_step": 203160, "epoch": 1209} {"train_loss": -10.681976318359375, "global_step": 203161, "epoch": 1209} {"train_loss": -9.916003227233887, "global_step": 203162, "epoch": 1209} {"train_loss": -10.929332733154297, "global_step": 203163, "epoch": 1209} {"train_loss": -9.511978149414062, "global_step": 203164, "epoch": 1209} {"train_loss": -10.470232009887695, "global_step": 203165, "epoch": 1209} {"train_loss": -10.142534255981445, "global_step": 203166, "epoch": 1209} {"train_loss": -10.606880187988281, "global_step": 203167, "epoch": 1209} {"train_loss": -10.552740097045898, "global_step": 203168, "epoch": 1209} {"train_loss": -10.137929916381836, "global_step": 203169, "epoch": 1209} {"train_loss": -10.785700798034668, "global_step": 203170, "epoch": 1209} {"train_loss": -9.989044189453125, "global_step": 203171, "epoch": 1209} {"train_loss": -10.991029739379883, "global_step": 203172, "epoch": 1209} {"train_loss": -10.46449089050293, "global_step": 203173, "epoch": 1209} {"train_loss": -10.68904972076416, "global_step": 203174, "epoch": 1209} {"train_loss": -10.866362571716309, "global_step": 203175, "epoch": 1209} {"train_loss": -10.425885200500488, "global_step": 203176, "epoch": 1209} {"train_loss": -10.565420150756836, "global_step": 203177, "epoch": 1209} {"train_loss": -11.01516342163086, "global_step": 203178, "epoch": 1209} {"train_loss": -10.639054298400879, "global_step": 203179, "epoch": 1209} {"train_loss": -10.795004844665527, "global_step": 203180, "epoch": 1209} {"train_loss": -11.196690559387207, "global_step": 203181, "epoch": 1209} {"train_loss": -10.726444244384766, "global_step": 203182, "epoch": 1209} {"train_loss": -10.90609073638916, "global_step": 203183, "epoch": 1209} {"train_loss": -10.903334617614746, "global_step": 203184, "epoch": 1209} {"train_loss": -11.124964714050293, "global_step": 203185, "epoch": 1209} {"train_loss": -10.999330520629883, "global_step": 203186, "epoch": 1209} {"train_loss": -10.969313621520996, "global_step": 203187, "epoch": 1209} {"train_loss": -10.860660552978516, "global_step": 203188, "epoch": 1209} {"train_loss": -10.82437515258789, "global_step": 203189, "epoch": 1209} {"train_loss": -11.066965103149414, "global_step": 203190, "epoch": 1209} {"train_loss": -11.048337936401367, "global_step": 203191, "epoch": 1209} {"train_loss": -11.076789855957031, "global_step": 203192, "epoch": 1209} {"train_loss": -11.3167142868042, "global_step": 203193, "epoch": 1209} {"train_loss": -11.258220672607422, "global_step": 203194, "epoch": 1209} {"train_loss": -11.19474983215332, "global_step": 203195, "epoch": 1209} {"train_loss": -11.17819595336914, "global_step": 203196, "epoch": 1209} {"train_loss": -11.164421081542969, "global_step": 203197, "epoch": 1209} {"train_loss": -11.263235092163086, "global_step": 203198, "epoch": 1209} {"train_loss": -11.308956146240234, "global_step": 203199, "epoch": 1209} {"train_loss": -11.33086109161377, "global_step": 203200, "epoch": 1209} {"train_loss": -11.445730209350586, "global_step": 203201, "epoch": 1209} {"train_loss": -11.300259590148926, "global_step": 203202, "epoch": 1209} {"train_loss": -11.37033462524414, "global_step": 203203, "epoch": 1209} {"train_loss": -11.316143035888672, "global_step": 203204, "epoch": 1209} {"train_loss": -11.174482345581055, "global_step": 203205, "epoch": 1209} {"train_loss": -11.267848014831543, "global_step": 203206, "epoch": 1209} {"train_loss": -11.486885070800781, "global_step": 203207, "epoch": 1209} {"train_loss": -11.307144165039062, "global_step": 203208, "epoch": 1209} {"train_loss": -11.25796127319336, "global_step": 203209, "epoch": 1209} {"train_loss": -11.44504165649414, "global_step": 203210, "epoch": 1209} {"train_loss": -11.296768188476562, "global_step": 203211, "epoch": 1209} {"train_loss": -11.495353698730469, "global_step": 203212, "epoch": 1209} {"train_loss": -11.297187805175781, "global_step": 203213, "epoch": 1209} {"train_loss": -11.576183319091797, "global_step": 203214, "epoch": 1209} {"train_loss": -11.50526237487793, "global_step": 203215, "epoch": 1209} {"train_loss": -11.46828556060791, "global_step": 203216, "epoch": 1209} {"train_loss": -11.379156112670898, "global_step": 203217, "epoch": 1209} {"train_loss": -11.423714637756348, "global_step": 203218, "epoch": 1209} {"train_loss": -11.682804107666016, "global_step": 203219, "epoch": 1209} {"train_loss": -11.378993034362793, "global_step": 203220, "epoch": 1209} {"train_loss": -11.56743335723877, "global_step": 203221, "epoch": 1209} {"train_loss": -11.652795791625977, "global_step": 203222, "epoch": 1209} {"train_loss": -11.33497142791748, "global_step": 203223, "epoch": 1209} {"train_loss": -11.715761184692383, "global_step": 203224, "epoch": 1209} {"train_loss": -11.580961227416992, "global_step": 203225, "epoch": 1209} {"train_loss": -11.588695526123047, "global_step": 203226, "epoch": 1209} {"train_loss": -11.808857917785645, "global_step": 203227, "epoch": 1209} {"train_loss": -11.461462020874023, "global_step": 203228, "epoch": 1209} {"train_loss": -11.703774452209473, "global_step": 203229, "epoch": 1209} {"train_loss": -11.706642150878906, "global_step": 203230, "epoch": 1209} {"train_loss": -11.623819351196289, "global_step": 203231, "epoch": 1209} {"train_loss": -11.603479385375977, "global_step": 203232, "epoch": 1209} {"train_loss": -11.484792709350586, "global_step": 203233, "epoch": 1209} {"train_loss": -11.36359691619873, "global_step": 203234, "epoch": 1209} {"train_loss": -11.549774169921875, "global_step": 203235, "epoch": 1209} {"train_loss": -11.672403335571289, "global_step": 203236, "epoch": 1209} {"train_loss": -11.45943832397461, "global_step": 203237, "epoch": 1209} {"train_loss": -11.624872207641602, "global_step": 203238, "epoch": 1209} {"train_loss": -11.624645233154297, "global_step": 203239, "epoch": 1209} {"train_loss": -11.689419746398926, "global_step": 203240, "epoch": 1209} {"train_loss": -11.421239852905273, "global_step": 203241, "epoch": 1209} {"train_loss": -11.900055885314941, "global_step": 203242, "epoch": 1209} {"train_loss": -11.576912879943848, "global_step": 203243, "epoch": 1209} {"train_loss": -11.823966979980469, "global_step": 203244, "epoch": 1209} {"train_loss": -11.649764060974121, "global_step": 203245, "epoch": 1209} {"train_loss": -11.631535530090332, "global_step": 203246, "epoch": 1209} {"train_loss": -11.964689254760742, "global_step": 203247, "epoch": 1209} {"train_loss": -11.647920608520508, "global_step": 203248, "epoch": 1209} {"train_loss": -11.78148365020752, "global_step": 203249, "epoch": 1209} {"train_loss": -11.736059188842773, "global_step": 203250, "epoch": 1209} {"train_loss": -11.372919082641602, "global_step": 203251, "epoch": 1209} {"train_loss": -11.573840141296387, "global_step": 203252, "epoch": 1209} {"train_loss": -11.493236541748047, "global_step": 203253, "epoch": 1209} {"train_loss": -11.388314247131348, "global_step": 203254, "epoch": 1209} {"train_loss": -11.577688217163086, "global_step": 203255, "epoch": 1209} {"train_loss": -11.5006685256958, "global_step": 203256, "epoch": 1209} {"train_loss": -11.157258987426758, "global_step": 203257, "epoch": 1209} {"train_loss": -11.409348487854004, "global_step": 203258, "epoch": 1209} {"train_loss": -11.719034194946289, "global_step": 203259, "epoch": 1209} {"train_loss": -11.70376968383789, "global_step": 203260, "epoch": 1209} {"train_loss": -11.825360298156738, "global_step": 203261, "epoch": 1209} {"train_loss": -11.637596130371094, "global_step": 203262, "epoch": 1209} {"train_loss": -11.891226768493652, "global_step": 203263, "epoch": 1209} {"train_loss": -11.787349700927734, "global_step": 203264, "epoch": 1209} {"train_loss": -11.174542427062988, "global_step": 203265, "epoch": 1209} {"train_loss": -11.336806297302246, "global_step": 203266, "epoch": 1209} {"train_loss": -10.802488327026367, "global_step": 203267, "epoch": 1209} {"train_loss": -11.119942665100098, "global_step": 203268, "epoch": 1209} {"train_loss": -10.397195816040039, "global_step": 203269, "epoch": 1209} {"train_loss": -10.989303588867188, "global_step": 203270, "epoch": 1209} {"train_loss": -9.815242767333984, "global_step": 203271, "epoch": 1209} {"train_loss": -9.48415470123291, "global_step": 203272, "epoch": 1209} {"train_loss": -8.912238121032715, "global_step": 203273, "epoch": 1209} {"train_loss": -11.3973970413208, "global_step": 203274, "epoch": 1209} {"train_loss": -9.159122467041016, "global_step": 203275, "epoch": 1209} {"train_loss": -10.161916732788086, "global_step": 203276, "epoch": 1209} {"train_loss": -10.60095500946045, "global_step": 203277, "epoch": 1209} {"train_loss": -9.672846794128418, "global_step": 203278, "epoch": 1209} {"train_loss": -11.015673083918434, "global_step": 203279, "epoch": 1209, "val_loss": 248670.90625} {"train_loss": -9.99521255493164, "global_step": 203280, "epoch": 1210} {"train_loss": -11.219998359680176, "global_step": 203281, "epoch": 1210} {"train_loss": -10.443916320800781, "global_step": 203282, "epoch": 1210} {"train_loss": -11.041987419128418, "global_step": 203283, "epoch": 1210} {"train_loss": -10.188688278198242, "global_step": 203284, "epoch": 1210} {"train_loss": -10.384241104125977, "global_step": 203285, "epoch": 1210} {"train_loss": -9.993003845214844, "global_step": 203286, "epoch": 1210} {"train_loss": -10.441173553466797, "global_step": 203287, "epoch": 1210} {"train_loss": -9.926651954650879, "global_step": 203288, "epoch": 1210} {"train_loss": -10.419425964355469, "global_step": 203289, "epoch": 1210} {"train_loss": -10.083633422851562, "global_step": 203290, "epoch": 1210} {"train_loss": -10.012099266052246, "global_step": 203291, "epoch": 1210} {"train_loss": -10.026134490966797, "global_step": 203292, "epoch": 1210} {"train_loss": -9.616787910461426, "global_step": 203293, "epoch": 1210} {"train_loss": -9.030057907104492, "global_step": 203294, "epoch": 1210} {"train_loss": -10.881294250488281, "global_step": 203295, "epoch": 1210} {"train_loss": -10.39638900756836, "global_step": 203296, "epoch": 1210} {"train_loss": -10.285260200500488, "global_step": 203297, "epoch": 1210} {"train_loss": -10.812080383300781, "global_step": 203298, "epoch": 1210} {"train_loss": -10.511613845825195, "global_step": 203299, "epoch": 1210} {"train_loss": -10.437664985656738, "global_step": 203300, "epoch": 1210} {"train_loss": -10.497109413146973, "global_step": 203301, "epoch": 1210} {"train_loss": -10.756967544555664, "global_step": 203302, "epoch": 1210} {"train_loss": -10.606587409973145, "global_step": 203303, "epoch": 1210} {"train_loss": -10.840922355651855, "global_step": 203304, "epoch": 1210} {"train_loss": -11.005901336669922, "global_step": 203305, "epoch": 1210} {"train_loss": -10.541923522949219, "global_step": 203306, "epoch": 1210} {"train_loss": -11.129556655883789, "global_step": 203307, "epoch": 1210} {"train_loss": -10.9940824508667, "global_step": 203308, "epoch": 1210} {"train_loss": -10.861410140991211, "global_step": 203309, "epoch": 1210} {"train_loss": -11.142603874206543, "global_step": 203310, "epoch": 1210} {"train_loss": -10.887715339660645, "global_step": 203311, "epoch": 1210} {"train_loss": -11.18008804321289, "global_step": 203312, "epoch": 1210} {"train_loss": -10.902841567993164, "global_step": 203313, "epoch": 1210} {"train_loss": -11.094640731811523, "global_step": 203314, "epoch": 1210} {"train_loss": -11.005989074707031, "global_step": 203315, "epoch": 1210} {"train_loss": -10.843185424804688, "global_step": 203316, "epoch": 1210} {"train_loss": -11.17755126953125, "global_step": 203317, "epoch": 1210} {"train_loss": -11.037845611572266, "global_step": 203318, "epoch": 1210} {"train_loss": -11.15659236907959, "global_step": 203319, "epoch": 1210} {"train_loss": -11.276021003723145, "global_step": 203320, "epoch": 1210} {"train_loss": -11.093121528625488, "global_step": 203321, "epoch": 1210} {"train_loss": -11.287219047546387, "global_step": 203322, "epoch": 1210} {"train_loss": -11.322021484375, "global_step": 203323, "epoch": 1210} {"train_loss": -11.154844284057617, "global_step": 203324, "epoch": 1210} {"train_loss": -10.975545883178711, "global_step": 203325, "epoch": 1210} {"train_loss": -11.136905670166016, "global_step": 203326, "epoch": 1210} {"train_loss": -11.198890686035156, "global_step": 203327, "epoch": 1210} {"train_loss": -11.182538986206055, "global_step": 203328, "epoch": 1210} {"train_loss": -11.232450485229492, "global_step": 203329, "epoch": 1210} {"train_loss": -11.409337997436523, "global_step": 203330, "epoch": 1210} {"train_loss": -11.179994583129883, "global_step": 203331, "epoch": 1210} {"train_loss": -11.566144943237305, "global_step": 203332, "epoch": 1210} {"train_loss": -11.365509986877441, "global_step": 203333, "epoch": 1210} {"train_loss": -11.434146881103516, "global_step": 203334, "epoch": 1210} {"train_loss": -10.970423698425293, "global_step": 203335, "epoch": 1210} {"train_loss": -11.127431869506836, "global_step": 203336, "epoch": 1210} {"train_loss": -11.354572296142578, "global_step": 203337, "epoch": 1210} {"train_loss": -11.140047073364258, "global_step": 203338, "epoch": 1210} {"train_loss": -11.539360046386719, "global_step": 203339, "epoch": 1210} {"train_loss": -11.252388000488281, "global_step": 203340, "epoch": 1210} {"train_loss": -11.482610702514648, "global_step": 203341, "epoch": 1210} {"train_loss": -11.30595588684082, "global_step": 203342, "epoch": 1210} {"train_loss": -11.429059028625488, "global_step": 203343, "epoch": 1210} {"train_loss": -11.401422500610352, "global_step": 203344, "epoch": 1210} {"train_loss": -11.659055709838867, "global_step": 203345, "epoch": 1210} {"train_loss": -11.522943496704102, "global_step": 203346, "epoch": 1210} {"train_loss": -11.35494613647461, "global_step": 203347, "epoch": 1210} {"train_loss": -11.445333480834961, "global_step": 203348, "epoch": 1210} {"train_loss": -11.523534774780273, "global_step": 203349, "epoch": 1210} {"train_loss": -11.598546981811523, "global_step": 203350, "epoch": 1210} {"train_loss": -11.607247352600098, "global_step": 203351, "epoch": 1210} {"train_loss": -11.546817779541016, "global_step": 203352, "epoch": 1210} {"train_loss": -11.6433687210083, "global_step": 203353, "epoch": 1210} {"train_loss": -11.733877182006836, "global_step": 203354, "epoch": 1210} {"train_loss": -11.539358139038086, "global_step": 203355, "epoch": 1210} {"train_loss": -11.638012886047363, "global_step": 203356, "epoch": 1210} {"train_loss": -11.483293533325195, "global_step": 203357, "epoch": 1210} {"train_loss": -11.490829467773438, "global_step": 203358, "epoch": 1210} {"train_loss": -11.652914047241211, "global_step": 203359, "epoch": 1210} {"train_loss": -11.637842178344727, "global_step": 203360, "epoch": 1210} {"train_loss": -11.76832103729248, "global_step": 203361, "epoch": 1210} {"train_loss": -11.5773344039917, "global_step": 203362, "epoch": 1210} {"train_loss": -11.601919174194336, "global_step": 203363, "epoch": 1210} {"train_loss": -11.68034553527832, "global_step": 203364, "epoch": 1210} {"train_loss": -11.736030578613281, "global_step": 203365, "epoch": 1210} {"train_loss": -11.721415519714355, "global_step": 203366, "epoch": 1210} {"train_loss": -11.530211448669434, "global_step": 203367, "epoch": 1210} {"train_loss": -11.58389663696289, "global_step": 203368, "epoch": 1210} {"train_loss": -11.195963859558105, "global_step": 203369, "epoch": 1210} {"train_loss": -11.6876802444458, "global_step": 203370, "epoch": 1210} {"train_loss": -11.464776992797852, "global_step": 203371, "epoch": 1210} {"train_loss": -11.727165222167969, "global_step": 203372, "epoch": 1210} {"train_loss": -11.263983726501465, "global_step": 203373, "epoch": 1210} {"train_loss": -11.837149620056152, "global_step": 203374, "epoch": 1210} {"train_loss": -11.190559387207031, "global_step": 203375, "epoch": 1210} {"train_loss": -11.698755264282227, "global_step": 203376, "epoch": 1210} {"train_loss": -11.35110092163086, "global_step": 203377, "epoch": 1210} {"train_loss": -10.579387664794922, "global_step": 203378, "epoch": 1210} {"train_loss": -11.278322219848633, "global_step": 203379, "epoch": 1210} {"train_loss": -11.17924976348877, "global_step": 203380, "epoch": 1210} {"train_loss": -10.89254379272461, "global_step": 203381, "epoch": 1210} {"train_loss": -10.95180606842041, "global_step": 203382, "epoch": 1210} {"train_loss": -11.481931686401367, "global_step": 203383, "epoch": 1210} {"train_loss": -10.773712158203125, "global_step": 203384, "epoch": 1210} {"train_loss": -11.004411697387695, "global_step": 203385, "epoch": 1210} {"train_loss": -11.278606414794922, "global_step": 203386, "epoch": 1210} {"train_loss": -11.160780906677246, "global_step": 203387, "epoch": 1210} {"train_loss": -11.605077743530273, "global_step": 203388, "epoch": 1210} {"train_loss": -10.937773704528809, "global_step": 203389, "epoch": 1210} {"train_loss": -11.209776878356934, "global_step": 203390, "epoch": 1210} {"train_loss": -11.215622901916504, "global_step": 203391, "epoch": 1210} {"train_loss": -11.586357116699219, "global_step": 203392, "epoch": 1210} {"train_loss": -11.311676025390625, "global_step": 203393, "epoch": 1210} {"train_loss": -11.25831413269043, "global_step": 203394, "epoch": 1210} {"train_loss": -11.494634628295898, "global_step": 203395, "epoch": 1210} {"train_loss": -11.487919807434082, "global_step": 203396, "epoch": 1210} {"train_loss": -11.360872268676758, "global_step": 203397, "epoch": 1210} {"train_loss": -10.903823852539062, "global_step": 203398, "epoch": 1210} {"train_loss": -11.169602394104004, "global_step": 203399, "epoch": 1210} {"train_loss": -11.272003173828125, "global_step": 203400, "epoch": 1210} {"train_loss": -11.152034759521484, "global_step": 203401, "epoch": 1210} {"train_loss": -11.271812438964844, "global_step": 203402, "epoch": 1210} {"train_loss": -11.288959503173828, "global_step": 203403, "epoch": 1210} {"train_loss": -10.801851272583008, "global_step": 203404, "epoch": 1210} {"train_loss": -11.416967391967773, "global_step": 203405, "epoch": 1210} {"train_loss": -11.035969734191895, "global_step": 203406, "epoch": 1210} {"train_loss": -11.03268814086914, "global_step": 203407, "epoch": 1210} {"train_loss": -11.062664031982422, "global_step": 203408, "epoch": 1210} {"train_loss": -11.189489364624023, "global_step": 203409, "epoch": 1210} {"train_loss": -11.35151481628418, "global_step": 203410, "epoch": 1210} {"train_loss": -11.281188011169434, "global_step": 203411, "epoch": 1210} {"train_loss": -11.100366592407227, "global_step": 203412, "epoch": 1210} {"train_loss": -11.495817184448242, "global_step": 203413, "epoch": 1210} {"train_loss": -10.90066146850586, "global_step": 203414, "epoch": 1210} {"train_loss": -11.422502517700195, "global_step": 203415, "epoch": 1210} {"train_loss": -10.622577667236328, "global_step": 203416, "epoch": 1210} {"train_loss": -11.307772636413574, "global_step": 203417, "epoch": 1210} {"train_loss": -10.669733047485352, "global_step": 203418, "epoch": 1210} {"train_loss": -10.6478271484375, "global_step": 203419, "epoch": 1210} {"train_loss": -10.883058547973633, "global_step": 203420, "epoch": 1210} {"train_loss": -10.749358177185059, "global_step": 203421, "epoch": 1210} {"train_loss": -11.334985733032227, "global_step": 203422, "epoch": 1210} {"train_loss": -11.122795104980469, "global_step": 203423, "epoch": 1210} {"train_loss": -11.012338638305664, "global_step": 203424, "epoch": 1210} {"train_loss": -11.287697792053223, "global_step": 203425, "epoch": 1210} {"train_loss": -11.277458190917969, "global_step": 203426, "epoch": 1210} {"train_loss": -10.860593795776367, "global_step": 203427, "epoch": 1210} {"train_loss": -11.397305488586426, "global_step": 203428, "epoch": 1210} {"train_loss": -10.766107559204102, "global_step": 203429, "epoch": 1210} {"train_loss": -11.173851013183594, "global_step": 203430, "epoch": 1210} {"train_loss": -11.104528427124023, "global_step": 203431, "epoch": 1210} {"train_loss": -11.06713581085205, "global_step": 203432, "epoch": 1210} {"train_loss": -11.171989440917969, "global_step": 203433, "epoch": 1210} {"train_loss": -11.13636589050293, "global_step": 203434, "epoch": 1210} {"train_loss": -11.368587493896484, "global_step": 203435, "epoch": 1210} {"train_loss": -11.305597305297852, "global_step": 203436, "epoch": 1210} {"train_loss": -11.3967924118042, "global_step": 203437, "epoch": 1210} {"train_loss": -11.414545059204102, "global_step": 203438, "epoch": 1210} {"train_loss": -10.830738067626953, "global_step": 203439, "epoch": 1210} {"train_loss": -11.706798553466797, "global_step": 203440, "epoch": 1210} {"train_loss": -11.23556900024414, "global_step": 203441, "epoch": 1210} {"train_loss": -11.226163864135742, "global_step": 203442, "epoch": 1210} {"train_loss": -11.446581840515137, "global_step": 203443, "epoch": 1210} {"train_loss": -11.259868621826172, "global_step": 203444, "epoch": 1210} {"train_loss": -11.424076080322266, "global_step": 203445, "epoch": 1210} {"train_loss": -11.30636215209961, "global_step": 203446, "epoch": 1210} {"train_loss": -11.12923132237934, "global_step": 203447, "epoch": 1210, "val_loss": 253274.234375, "train_action_mse_error": 0.4765852689743042} {"train_loss": -11.32524299621582, "global_step": 203448, "epoch": 1211} {"train_loss": -11.27149772644043, "global_step": 203449, "epoch": 1211} {"train_loss": -11.341815948486328, "global_step": 203450, "epoch": 1211} {"train_loss": -11.214948654174805, "global_step": 203451, "epoch": 1211} {"train_loss": -11.518241882324219, "global_step": 203452, "epoch": 1211} {"train_loss": -11.272659301757812, "global_step": 203453, "epoch": 1211} {"train_loss": -11.516104698181152, "global_step": 203454, "epoch": 1211} {"train_loss": -11.36353874206543, "global_step": 203455, "epoch": 1211} {"train_loss": -11.260403633117676, "global_step": 203456, "epoch": 1211} {"train_loss": -11.52151107788086, "global_step": 203457, "epoch": 1211} {"train_loss": -11.519834518432617, "global_step": 203458, "epoch": 1211} {"train_loss": -11.734809875488281, "global_step": 203459, "epoch": 1211} {"train_loss": -11.574396133422852, "global_step": 203460, "epoch": 1211} {"train_loss": -11.549860954284668, "global_step": 203461, "epoch": 1211} {"train_loss": -11.52285099029541, "global_step": 203462, "epoch": 1211} {"train_loss": -11.820489883422852, "global_step": 203463, "epoch": 1211} {"train_loss": -11.470905303955078, "global_step": 203464, "epoch": 1211} {"train_loss": -11.800122261047363, "global_step": 203465, "epoch": 1211} {"train_loss": -11.836206436157227, "global_step": 203466, "epoch": 1211} {"train_loss": -11.714195251464844, "global_step": 203467, "epoch": 1211} {"train_loss": -11.816995620727539, "global_step": 203468, "epoch": 1211} {"train_loss": -11.632179260253906, "global_step": 203469, "epoch": 1211} {"train_loss": -11.49295711517334, "global_step": 203470, "epoch": 1211} {"train_loss": -11.796036720275879, "global_step": 203471, "epoch": 1211} {"train_loss": -11.694355010986328, "global_step": 203472, "epoch": 1211} {"train_loss": -11.435454368591309, "global_step": 203473, "epoch": 1211} {"train_loss": -11.813461303710938, "global_step": 203474, "epoch": 1211} {"train_loss": -11.237129211425781, "global_step": 203475, "epoch": 1211} {"train_loss": -11.177002906799316, "global_step": 203476, "epoch": 1211} {"train_loss": -11.808904647827148, "global_step": 203477, "epoch": 1211} {"train_loss": -10.929849624633789, "global_step": 203478, "epoch": 1211} {"train_loss": -11.116189956665039, "global_step": 203479, "epoch": 1211} {"train_loss": -11.392133712768555, "global_step": 203480, "epoch": 1211} {"train_loss": -10.960161209106445, "global_step": 203481, "epoch": 1211} {"train_loss": -10.854077339172363, "global_step": 203482, "epoch": 1211} {"train_loss": -11.76305866241455, "global_step": 203483, "epoch": 1211} {"train_loss": -10.895225524902344, "global_step": 203484, "epoch": 1211} {"train_loss": -11.642106056213379, "global_step": 203485, "epoch": 1211} {"train_loss": -11.245052337646484, "global_step": 203486, "epoch": 1211} {"train_loss": -11.489267349243164, "global_step": 203487, "epoch": 1211} {"train_loss": -11.231671333312988, "global_step": 203488, "epoch": 1211} {"train_loss": -11.622713088989258, "global_step": 203489, "epoch": 1211} {"train_loss": -11.030698776245117, "global_step": 203490, "epoch": 1211} {"train_loss": -11.523994445800781, "global_step": 203491, "epoch": 1211} {"train_loss": -11.537324905395508, "global_step": 203492, "epoch": 1211} {"train_loss": -11.13418960571289, "global_step": 203493, "epoch": 1211} {"train_loss": -11.427556991577148, "global_step": 203494, "epoch": 1211} {"train_loss": -11.569149017333984, "global_step": 203495, "epoch": 1211} {"train_loss": -11.206847190856934, "global_step": 203496, "epoch": 1211} {"train_loss": -11.376174926757812, "global_step": 203497, "epoch": 1211} {"train_loss": -10.658769607543945, "global_step": 203498, "epoch": 1211} {"train_loss": -10.786626815795898, "global_step": 203499, "epoch": 1211} {"train_loss": -11.85460090637207, "global_step": 203500, "epoch": 1211} {"train_loss": -11.332357406616211, "global_step": 203501, "epoch": 1211} {"train_loss": -11.47488021850586, "global_step": 203502, "epoch": 1211} {"train_loss": -11.562121391296387, "global_step": 203503, "epoch": 1211} {"train_loss": -11.652170181274414, "global_step": 203504, "epoch": 1211} {"train_loss": -11.83230972290039, "global_step": 203505, "epoch": 1211} {"train_loss": -11.805121421813965, "global_step": 203506, "epoch": 1211} {"train_loss": -11.922867774963379, "global_step": 203507, "epoch": 1211} {"train_loss": -11.906232833862305, "global_step": 203508, "epoch": 1211} {"train_loss": -11.857741355895996, "global_step": 203509, "epoch": 1211} {"train_loss": -11.74193000793457, "global_step": 203510, "epoch": 1211} {"train_loss": -11.292009353637695, "global_step": 203511, "epoch": 1211} {"train_loss": -11.41808795928955, "global_step": 203512, "epoch": 1211} {"train_loss": -11.11120891571045, "global_step": 203513, "epoch": 1211} {"train_loss": -11.660537719726562, "global_step": 203514, "epoch": 1211} {"train_loss": -11.51142406463623, "global_step": 203515, "epoch": 1211} {"train_loss": -11.620312690734863, "global_step": 203516, "epoch": 1211} {"train_loss": -11.589988708496094, "global_step": 203517, "epoch": 1211} {"train_loss": -11.699189186096191, "global_step": 203518, "epoch": 1211} {"train_loss": -11.460679054260254, "global_step": 203519, "epoch": 1211} {"train_loss": -11.458395957946777, "global_step": 203520, "epoch": 1211} {"train_loss": -11.62567138671875, "global_step": 203521, "epoch": 1211} {"train_loss": -11.85574722290039, "global_step": 203522, "epoch": 1211} {"train_loss": -11.559669494628906, "global_step": 203523, "epoch": 1211} {"train_loss": -11.973464012145996, "global_step": 203524, "epoch": 1211} {"train_loss": -11.262598037719727, "global_step": 203525, "epoch": 1211} {"train_loss": -11.500478744506836, "global_step": 203526, "epoch": 1211} {"train_loss": -11.535608291625977, "global_step": 203527, "epoch": 1211} {"train_loss": -11.750297546386719, "global_step": 203528, "epoch": 1211} {"train_loss": -11.406290054321289, "global_step": 203529, "epoch": 1211} {"train_loss": -10.733914375305176, "global_step": 203530, "epoch": 1211} {"train_loss": -11.12804126739502, "global_step": 203531, "epoch": 1211} {"train_loss": -11.12165641784668, "global_step": 203532, "epoch": 1211} {"train_loss": -11.307130813598633, "global_step": 203533, "epoch": 1211} {"train_loss": -11.636775970458984, "global_step": 203534, "epoch": 1211} {"train_loss": -11.362805366516113, "global_step": 203535, "epoch": 1211} {"train_loss": -11.563291549682617, "global_step": 203536, "epoch": 1211} {"train_loss": -11.220840454101562, "global_step": 203537, "epoch": 1211} {"train_loss": -11.44150161743164, "global_step": 203538, "epoch": 1211} {"train_loss": -11.206548690795898, "global_step": 203539, "epoch": 1211} {"train_loss": -11.608674049377441, "global_step": 203540, "epoch": 1211} {"train_loss": -11.167091369628906, "global_step": 203541, "epoch": 1211} {"train_loss": -11.732654571533203, "global_step": 203542, "epoch": 1211} {"train_loss": -11.645307540893555, "global_step": 203543, "epoch": 1211} {"train_loss": -11.647403717041016, "global_step": 203544, "epoch": 1211} {"train_loss": -11.17648983001709, "global_step": 203545, "epoch": 1211} {"train_loss": -11.694974899291992, "global_step": 203546, "epoch": 1211} {"train_loss": -11.346712112426758, "global_step": 203547, "epoch": 1211} {"train_loss": -11.368045806884766, "global_step": 203548, "epoch": 1211} {"train_loss": -11.420376777648926, "global_step": 203549, "epoch": 1211} {"train_loss": -11.3151273727417, "global_step": 203550, "epoch": 1211} {"train_loss": -11.027288436889648, "global_step": 203551, "epoch": 1211} {"train_loss": -11.426420211791992, "global_step": 203552, "epoch": 1211} {"train_loss": -10.929691314697266, "global_step": 203553, "epoch": 1211} {"train_loss": -10.839057922363281, "global_step": 203554, "epoch": 1211} {"train_loss": -11.575122833251953, "global_step": 203555, "epoch": 1211} {"train_loss": -10.861519813537598, "global_step": 203556, "epoch": 1211} {"train_loss": -11.294343948364258, "global_step": 203557, "epoch": 1211} {"train_loss": -11.279199600219727, "global_step": 203558, "epoch": 1211} {"train_loss": -10.89990234375, "global_step": 203559, "epoch": 1211} {"train_loss": -11.08536148071289, "global_step": 203560, "epoch": 1211} {"train_loss": -11.488852500915527, "global_step": 203561, "epoch": 1211} {"train_loss": -10.85615348815918, "global_step": 203562, "epoch": 1211} {"train_loss": -11.40896224975586, "global_step": 203563, "epoch": 1211} {"train_loss": -11.38486099243164, "global_step": 203564, "epoch": 1211} {"train_loss": -11.41909408569336, "global_step": 203565, "epoch": 1211} {"train_loss": -11.39016342163086, "global_step": 203566, "epoch": 1211} {"train_loss": -11.44261360168457, "global_step": 203567, "epoch": 1211} {"train_loss": -11.804803848266602, "global_step": 203568, "epoch": 1211} {"train_loss": -11.393230438232422, "global_step": 203569, "epoch": 1211} {"train_loss": -11.577034950256348, "global_step": 203570, "epoch": 1211} {"train_loss": -11.408600807189941, "global_step": 203571, "epoch": 1211} {"train_loss": -11.820594787597656, "global_step": 203572, "epoch": 1211} {"train_loss": -11.586324691772461, "global_step": 203573, "epoch": 1211} {"train_loss": -11.041306495666504, "global_step": 203574, "epoch": 1211} {"train_loss": -11.777308464050293, "global_step": 203575, "epoch": 1211} {"train_loss": -11.160882949829102, "global_step": 203576, "epoch": 1211} {"train_loss": -11.397818565368652, "global_step": 203577, "epoch": 1211} {"train_loss": -11.285953521728516, "global_step": 203578, "epoch": 1211} {"train_loss": -11.44644546508789, "global_step": 203579, "epoch": 1211} {"train_loss": -11.25547981262207, "global_step": 203580, "epoch": 1211} {"train_loss": -11.434988021850586, "global_step": 203581, "epoch": 1211} {"train_loss": -11.514803886413574, "global_step": 203582, "epoch": 1211} {"train_loss": -11.418922424316406, "global_step": 203583, "epoch": 1211} {"train_loss": -11.515584945678711, "global_step": 203584, "epoch": 1211} {"train_loss": -10.840279579162598, "global_step": 203585, "epoch": 1211} {"train_loss": -11.335517883300781, "global_step": 203586, "epoch": 1211} {"train_loss": -11.223488807678223, "global_step": 203587, "epoch": 1211} {"train_loss": -11.387835502624512, "global_step": 203588, "epoch": 1211} {"train_loss": -11.031486511230469, "global_step": 203589, "epoch": 1211} {"train_loss": -11.624029159545898, "global_step": 203590, "epoch": 1211} {"train_loss": -11.389240264892578, "global_step": 203591, "epoch": 1211} {"train_loss": -11.498849868774414, "global_step": 203592, "epoch": 1211} {"train_loss": -11.223387718200684, "global_step": 203593, "epoch": 1211} {"train_loss": -11.329740524291992, "global_step": 203594, "epoch": 1211} {"train_loss": -11.682252883911133, "global_step": 203595, "epoch": 1211} {"train_loss": -11.601868629455566, "global_step": 203596, "epoch": 1211} {"train_loss": -11.568668365478516, "global_step": 203597, "epoch": 1211} {"train_loss": -11.48509407043457, "global_step": 203598, "epoch": 1211} {"train_loss": -11.330690383911133, "global_step": 203599, "epoch": 1211} {"train_loss": -11.741256713867188, "global_step": 203600, "epoch": 1211} {"train_loss": -11.468122482299805, "global_step": 203601, "epoch": 1211} {"train_loss": -11.784761428833008, "global_step": 203602, "epoch": 1211} {"train_loss": -11.899003028869629, "global_step": 203603, "epoch": 1211} {"train_loss": -11.804489135742188, "global_step": 203604, "epoch": 1211} {"train_loss": -11.567704200744629, "global_step": 203605, "epoch": 1211} {"train_loss": -11.329673767089844, "global_step": 203606, "epoch": 1211} {"train_loss": -10.985162734985352, "global_step": 203607, "epoch": 1211} {"train_loss": -11.44296932220459, "global_step": 203608, "epoch": 1211} {"train_loss": -11.717310905456543, "global_step": 203609, "epoch": 1211} {"train_loss": -11.55136489868164, "global_step": 203610, "epoch": 1211} {"train_loss": -11.688189506530762, "global_step": 203611, "epoch": 1211} {"train_loss": -11.803983688354492, "global_step": 203612, "epoch": 1211} {"train_loss": -11.508726119995117, "global_step": 203613, "epoch": 1211} {"train_loss": -11.320331573486328, "global_step": 203614, "epoch": 1211} {"train_loss": -11.438078409149533, "global_step": 203615, "epoch": 1211, "val_loss": 254915.078125} {"train_loss": -11.655534744262695, "global_step": 203616, "epoch": 1212} {"train_loss": -11.590639114379883, "global_step": 203617, "epoch": 1212} {"train_loss": -11.366118431091309, "global_step": 203618, "epoch": 1212} {"train_loss": -11.745461463928223, "global_step": 203619, "epoch": 1212} {"train_loss": -11.26094913482666, "global_step": 203620, "epoch": 1212} {"train_loss": -10.886598587036133, "global_step": 203621, "epoch": 1212} {"train_loss": -10.725351333618164, "global_step": 203622, "epoch": 1212} {"train_loss": -11.413484573364258, "global_step": 203623, "epoch": 1212} {"train_loss": -9.854689598083496, "global_step": 203624, "epoch": 1212} {"train_loss": -11.452310562133789, "global_step": 203625, "epoch": 1212} {"train_loss": -10.535154342651367, "global_step": 203626, "epoch": 1212} {"train_loss": -11.078073501586914, "global_step": 203627, "epoch": 1212} {"train_loss": -10.624465942382812, "global_step": 203628, "epoch": 1212} {"train_loss": -10.919608116149902, "global_step": 203629, "epoch": 1212} {"train_loss": -9.743268966674805, "global_step": 203630, "epoch": 1212} {"train_loss": -10.328837394714355, "global_step": 203631, "epoch": 1212} {"train_loss": -10.548863410949707, "global_step": 203632, "epoch": 1212} {"train_loss": -10.49352741241455, "global_step": 203633, "epoch": 1212} {"train_loss": -9.566896438598633, "global_step": 203634, "epoch": 1212} {"train_loss": -10.849292755126953, "global_step": 203635, "epoch": 1212} {"train_loss": -9.600998878479004, "global_step": 203636, "epoch": 1212} {"train_loss": -10.985245704650879, "global_step": 203637, "epoch": 1212} {"train_loss": -10.332463264465332, "global_step": 203638, "epoch": 1212} {"train_loss": -10.387216567993164, "global_step": 203639, "epoch": 1212} {"train_loss": -10.22579288482666, "global_step": 203640, "epoch": 1212} {"train_loss": -10.574714660644531, "global_step": 203641, "epoch": 1212} {"train_loss": -10.28830337524414, "global_step": 203642, "epoch": 1212} {"train_loss": -10.150885581970215, "global_step": 203643, "epoch": 1212} {"train_loss": -10.823138236999512, "global_step": 203644, "epoch": 1212} {"train_loss": -10.145634651184082, "global_step": 203645, "epoch": 1212} {"train_loss": -11.036108016967773, "global_step": 203646, "epoch": 1212} {"train_loss": -10.31999397277832, "global_step": 203647, "epoch": 1212} {"train_loss": -11.028746604919434, "global_step": 203648, "epoch": 1212} {"train_loss": -10.308837890625, "global_step": 203649, "epoch": 1212} {"train_loss": -11.08260726928711, "global_step": 203650, "epoch": 1212} {"train_loss": -10.732381820678711, "global_step": 203651, "epoch": 1212} {"train_loss": -10.811945915222168, "global_step": 203652, "epoch": 1212} {"train_loss": -10.829938888549805, "global_step": 203653, "epoch": 1212} {"train_loss": -10.647029876708984, "global_step": 203654, "epoch": 1212} {"train_loss": -10.96119499206543, "global_step": 203655, "epoch": 1212} {"train_loss": -11.025045394897461, "global_step": 203656, "epoch": 1212} {"train_loss": -11.201456069946289, "global_step": 203657, "epoch": 1212} {"train_loss": -10.895459175109863, "global_step": 203658, "epoch": 1212} {"train_loss": -11.258659362792969, "global_step": 203659, "epoch": 1212} {"train_loss": -11.147916793823242, "global_step": 203660, "epoch": 1212} {"train_loss": -10.665142059326172, "global_step": 203661, "epoch": 1212} {"train_loss": -11.147729873657227, "global_step": 203662, "epoch": 1212} {"train_loss": -11.119400024414062, "global_step": 203663, "epoch": 1212} {"train_loss": -11.284872055053711, "global_step": 203664, "epoch": 1212} {"train_loss": -11.20477294921875, "global_step": 203665, "epoch": 1212} {"train_loss": -11.416799545288086, "global_step": 203666, "epoch": 1212} {"train_loss": -11.347806930541992, "global_step": 203667, "epoch": 1212} {"train_loss": -11.454116821289062, "global_step": 203668, "epoch": 1212} {"train_loss": -11.490047454833984, "global_step": 203669, "epoch": 1212} {"train_loss": -11.405938148498535, "global_step": 203670, "epoch": 1212} {"train_loss": -11.66276741027832, "global_step": 203671, "epoch": 1212} {"train_loss": -11.392532348632812, "global_step": 203672, "epoch": 1212} {"train_loss": -11.397032737731934, "global_step": 203673, "epoch": 1212} {"train_loss": -11.509966850280762, "global_step": 203674, "epoch": 1212} {"train_loss": -11.531272888183594, "global_step": 203675, "epoch": 1212} {"train_loss": -11.602635383605957, "global_step": 203676, "epoch": 1212} {"train_loss": -11.62118911743164, "global_step": 203677, "epoch": 1212} {"train_loss": -11.698118209838867, "global_step": 203678, "epoch": 1212} {"train_loss": -11.489792823791504, "global_step": 203679, "epoch": 1212} {"train_loss": -11.379241943359375, "global_step": 203680, "epoch": 1212} {"train_loss": -11.561269760131836, "global_step": 203681, "epoch": 1212} {"train_loss": -11.369208335876465, "global_step": 203682, "epoch": 1212} {"train_loss": -11.532709121704102, "global_step": 203683, "epoch": 1212} {"train_loss": -11.316802978515625, "global_step": 203684, "epoch": 1212} {"train_loss": -11.397311210632324, "global_step": 203685, "epoch": 1212} {"train_loss": -11.71434211730957, "global_step": 203686, "epoch": 1212} {"train_loss": -11.284513473510742, "global_step": 203687, "epoch": 1212} {"train_loss": -11.64697265625, "global_step": 203688, "epoch": 1212} {"train_loss": -11.358083724975586, "global_step": 203689, "epoch": 1212} {"train_loss": -11.003793716430664, "global_step": 203690, "epoch": 1212} {"train_loss": -11.442766189575195, "global_step": 203691, "epoch": 1212} {"train_loss": -11.485696792602539, "global_step": 203692, "epoch": 1212} {"train_loss": -11.22402572631836, "global_step": 203693, "epoch": 1212} {"train_loss": -11.510339736938477, "global_step": 203694, "epoch": 1212} {"train_loss": -11.365835189819336, "global_step": 203695, "epoch": 1212} {"train_loss": -11.809085845947266, "global_step": 203696, "epoch": 1212} {"train_loss": -11.306550979614258, "global_step": 203697, "epoch": 1212} {"train_loss": -11.644704818725586, "global_step": 203698, "epoch": 1212} {"train_loss": -11.720718383789062, "global_step": 203699, "epoch": 1212} {"train_loss": -11.251075744628906, "global_step": 203700, "epoch": 1212} {"train_loss": -11.394323348999023, "global_step": 203701, "epoch": 1212} {"train_loss": -11.730779647827148, "global_step": 203702, "epoch": 1212} {"train_loss": -11.584541320800781, "global_step": 203703, "epoch": 1212} {"train_loss": -11.647368431091309, "global_step": 203704, "epoch": 1212} {"train_loss": -11.549356460571289, "global_step": 203705, "epoch": 1212} {"train_loss": -11.748181343078613, "global_step": 203706, "epoch": 1212} {"train_loss": -11.524333953857422, "global_step": 203707, "epoch": 1212} {"train_loss": -11.260091781616211, "global_step": 203708, "epoch": 1212} {"train_loss": -11.69853401184082, "global_step": 203709, "epoch": 1212} {"train_loss": -10.856048583984375, "global_step": 203710, "epoch": 1212} {"train_loss": -10.852551460266113, "global_step": 203711, "epoch": 1212} {"train_loss": -11.517269134521484, "global_step": 203712, "epoch": 1212} {"train_loss": -11.092954635620117, "global_step": 203713, "epoch": 1212} {"train_loss": -10.971939086914062, "global_step": 203714, "epoch": 1212} {"train_loss": -11.179766654968262, "global_step": 203715, "epoch": 1212} {"train_loss": -11.21232795715332, "global_step": 203716, "epoch": 1212} {"train_loss": -10.050206184387207, "global_step": 203717, "epoch": 1212} {"train_loss": -11.220487594604492, "global_step": 203718, "epoch": 1212} {"train_loss": -10.887325286865234, "global_step": 203719, "epoch": 1212} {"train_loss": -10.66220474243164, "global_step": 203720, "epoch": 1212} {"train_loss": -10.449422836303711, "global_step": 203721, "epoch": 1212} {"train_loss": -11.1104736328125, "global_step": 203722, "epoch": 1212} {"train_loss": -10.754762649536133, "global_step": 203723, "epoch": 1212} {"train_loss": -11.11677074432373, "global_step": 203724, "epoch": 1212} {"train_loss": -9.85677719116211, "global_step": 203725, "epoch": 1212} {"train_loss": -11.106677055358887, "global_step": 203726, "epoch": 1212} {"train_loss": -10.145112991333008, "global_step": 203727, "epoch": 1212} {"train_loss": -11.110538482666016, "global_step": 203728, "epoch": 1212} {"train_loss": -10.72548770904541, "global_step": 203729, "epoch": 1212} {"train_loss": -10.899660110473633, "global_step": 203730, "epoch": 1212} {"train_loss": -11.404470443725586, "global_step": 203731, "epoch": 1212} {"train_loss": -10.897634506225586, "global_step": 203732, "epoch": 1212} {"train_loss": -11.248427391052246, "global_step": 203733, "epoch": 1212} {"train_loss": -11.252717018127441, "global_step": 203734, "epoch": 1212} {"train_loss": -11.363210678100586, "global_step": 203735, "epoch": 1212} {"train_loss": -11.191265106201172, "global_step": 203736, "epoch": 1212} {"train_loss": -11.351797103881836, "global_step": 203737, "epoch": 1212} {"train_loss": -11.223819732666016, "global_step": 203738, "epoch": 1212} {"train_loss": -11.243717193603516, "global_step": 203739, "epoch": 1212} {"train_loss": -11.7216796875, "global_step": 203740, "epoch": 1212} {"train_loss": -11.489765167236328, "global_step": 203741, "epoch": 1212} {"train_loss": -11.495340347290039, "global_step": 203742, "epoch": 1212} {"train_loss": -11.54560661315918, "global_step": 203743, "epoch": 1212} {"train_loss": -11.281455039978027, "global_step": 203744, "epoch": 1212} {"train_loss": -11.362266540527344, "global_step": 203745, "epoch": 1212} {"train_loss": -11.20207405090332, "global_step": 203746, "epoch": 1212} {"train_loss": -11.553813934326172, "global_step": 203747, "epoch": 1212} {"train_loss": -10.911693572998047, "global_step": 203748, "epoch": 1212} {"train_loss": -11.42874526977539, "global_step": 203749, "epoch": 1212} {"train_loss": -11.05598258972168, "global_step": 203750, "epoch": 1212} {"train_loss": -11.249181747436523, "global_step": 203751, "epoch": 1212} {"train_loss": -11.597553253173828, "global_step": 203752, "epoch": 1212} {"train_loss": -11.132343292236328, "global_step": 203753, "epoch": 1212} {"train_loss": -11.666213989257812, "global_step": 203754, "epoch": 1212} {"train_loss": -10.84203052520752, "global_step": 203755, "epoch": 1212} {"train_loss": -11.439226150512695, "global_step": 203756, "epoch": 1212} {"train_loss": -11.015289306640625, "global_step": 203757, "epoch": 1212} {"train_loss": -11.725677490234375, "global_step": 203758, "epoch": 1212} {"train_loss": -11.272621154785156, "global_step": 203759, "epoch": 1212} {"train_loss": -11.308804512023926, "global_step": 203760, "epoch": 1212} {"train_loss": -11.55333137512207, "global_step": 203761, "epoch": 1212} {"train_loss": -11.523093223571777, "global_step": 203762, "epoch": 1212} {"train_loss": -11.637630462646484, "global_step": 203763, "epoch": 1212} {"train_loss": -11.101194381713867, "global_step": 203764, "epoch": 1212} {"train_loss": -11.251520156860352, "global_step": 203765, "epoch": 1212} {"train_loss": -11.497282981872559, "global_step": 203766, "epoch": 1212} {"train_loss": -11.390546798706055, "global_step": 203767, "epoch": 1212} {"train_loss": -11.454445838928223, "global_step": 203768, "epoch": 1212} {"train_loss": -11.145727157592773, "global_step": 203769, "epoch": 1212} {"train_loss": -11.524026870727539, "global_step": 203770, "epoch": 1212} {"train_loss": -11.310775756835938, "global_step": 203771, "epoch": 1212} {"train_loss": -10.956066131591797, "global_step": 203772, "epoch": 1212} {"train_loss": -11.490121841430664, "global_step": 203773, "epoch": 1212} {"train_loss": -11.003323554992676, "global_step": 203774, "epoch": 1212} {"train_loss": -11.053121566772461, "global_step": 203775, "epoch": 1212} {"train_loss": -11.004914283752441, "global_step": 203776, "epoch": 1212} {"train_loss": -10.89167594909668, "global_step": 203777, "epoch": 1212} {"train_loss": -11.470653533935547, "global_step": 203778, "epoch": 1212} {"train_loss": -10.81668472290039, "global_step": 203779, "epoch": 1212} {"train_loss": -11.162568092346191, "global_step": 203780, "epoch": 1212} {"train_loss": -11.381179809570312, "global_step": 203781, "epoch": 1212} {"train_loss": -11.131282806396484, "global_step": 203782, "epoch": 1212} {"train_loss": -11.136244898750668, "global_step": 203783, "epoch": 1212, "val_loss": 255458.703125} {"train_loss": -11.161165237426758, "global_step": 203784, "epoch": 1213} {"train_loss": -11.51659870147705, "global_step": 203785, "epoch": 1213} {"train_loss": -11.022636413574219, "global_step": 203786, "epoch": 1213} {"train_loss": -11.141073226928711, "global_step": 203787, "epoch": 1213} {"train_loss": -11.279199600219727, "global_step": 203788, "epoch": 1213} {"train_loss": -10.813949584960938, "global_step": 203789, "epoch": 1213} {"train_loss": -10.860767364501953, "global_step": 203790, "epoch": 1213} {"train_loss": -11.118573188781738, "global_step": 203791, "epoch": 1213} {"train_loss": -10.713266372680664, "global_step": 203792, "epoch": 1213} {"train_loss": -11.138127326965332, "global_step": 203793, "epoch": 1213} {"train_loss": -10.715152740478516, "global_step": 203794, "epoch": 1213} {"train_loss": -11.289304733276367, "global_step": 203795, "epoch": 1213} {"train_loss": -11.39011001586914, "global_step": 203796, "epoch": 1213} {"train_loss": -11.24930191040039, "global_step": 203797, "epoch": 1213} {"train_loss": -11.443621635437012, "global_step": 203798, "epoch": 1213} {"train_loss": -11.245674133300781, "global_step": 203799, "epoch": 1213} {"train_loss": -11.717585563659668, "global_step": 203800, "epoch": 1213} {"train_loss": -11.235345840454102, "global_step": 203801, "epoch": 1213} {"train_loss": -11.263461112976074, "global_step": 203802, "epoch": 1213} {"train_loss": -11.38521671295166, "global_step": 203803, "epoch": 1213} {"train_loss": -11.250716209411621, "global_step": 203804, "epoch": 1213} {"train_loss": -11.347349166870117, "global_step": 203805, "epoch": 1213} {"train_loss": -11.313814163208008, "global_step": 203806, "epoch": 1213} {"train_loss": -11.524040222167969, "global_step": 203807, "epoch": 1213} {"train_loss": -11.604881286621094, "global_step": 203808, "epoch": 1213} {"train_loss": -11.304960250854492, "global_step": 203809, "epoch": 1213} {"train_loss": -11.758112907409668, "global_step": 203810, "epoch": 1213} {"train_loss": -11.341424942016602, "global_step": 203811, "epoch": 1213} {"train_loss": -11.318456649780273, "global_step": 203812, "epoch": 1213} {"train_loss": -11.555898666381836, "global_step": 203813, "epoch": 1213} {"train_loss": -11.223146438598633, "global_step": 203814, "epoch": 1213} {"train_loss": -11.5345458984375, "global_step": 203815, "epoch": 1213} {"train_loss": -11.582438468933105, "global_step": 203816, "epoch": 1213} {"train_loss": -11.741020202636719, "global_step": 203817, "epoch": 1213} {"train_loss": -11.702821731567383, "global_step": 203818, "epoch": 1213} {"train_loss": -11.651559829711914, "global_step": 203819, "epoch": 1213} {"train_loss": -11.602338790893555, "global_step": 203820, "epoch": 1213} {"train_loss": -11.572405815124512, "global_step": 203821, "epoch": 1213} {"train_loss": -11.675524711608887, "global_step": 203822, "epoch": 1213} {"train_loss": -11.766461372375488, "global_step": 203823, "epoch": 1213} {"train_loss": -11.772529602050781, "global_step": 203824, "epoch": 1213} {"train_loss": -11.435345649719238, "global_step": 203825, "epoch": 1213} {"train_loss": -11.652217864990234, "global_step": 203826, "epoch": 1213} {"train_loss": -11.344879150390625, "global_step": 203827, "epoch": 1213} {"train_loss": -11.83390998840332, "global_step": 203828, "epoch": 1213} {"train_loss": -11.518994331359863, "global_step": 203829, "epoch": 1213} {"train_loss": -11.902871131896973, "global_step": 203830, "epoch": 1213} {"train_loss": -11.438364028930664, "global_step": 203831, "epoch": 1213} {"train_loss": -11.90594482421875, "global_step": 203832, "epoch": 1213} {"train_loss": -11.761327743530273, "global_step": 203833, "epoch": 1213} {"train_loss": -11.864120483398438, "global_step": 203834, "epoch": 1213} {"train_loss": -11.81266975402832, "global_step": 203835, "epoch": 1213} {"train_loss": -11.56629753112793, "global_step": 203836, "epoch": 1213} {"train_loss": -11.352273941040039, "global_step": 203837, "epoch": 1213} {"train_loss": -11.734664916992188, "global_step": 203838, "epoch": 1213} {"train_loss": -11.504974365234375, "global_step": 203839, "epoch": 1213} {"train_loss": -11.617785453796387, "global_step": 203840, "epoch": 1213} {"train_loss": -11.778124809265137, "global_step": 203841, "epoch": 1213} {"train_loss": -11.40969181060791, "global_step": 203842, "epoch": 1213} {"train_loss": -11.417102813720703, "global_step": 203843, "epoch": 1213} {"train_loss": -11.453916549682617, "global_step": 203844, "epoch": 1213} {"train_loss": -11.394205093383789, "global_step": 203845, "epoch": 1213} {"train_loss": -11.591129302978516, "global_step": 203846, "epoch": 1213} {"train_loss": -11.504850387573242, "global_step": 203847, "epoch": 1213} {"train_loss": -11.338335990905762, "global_step": 203848, "epoch": 1213} {"train_loss": -11.33842658996582, "global_step": 203849, "epoch": 1213} {"train_loss": -11.839879989624023, "global_step": 203850, "epoch": 1213} {"train_loss": -11.116801261901855, "global_step": 203851, "epoch": 1213} {"train_loss": -11.429463386535645, "global_step": 203852, "epoch": 1213} {"train_loss": -11.401747703552246, "global_step": 203853, "epoch": 1213} {"train_loss": -11.637367248535156, "global_step": 203854, "epoch": 1213} {"train_loss": -11.226728439331055, "global_step": 203855, "epoch": 1213} {"train_loss": -11.252668380737305, "global_step": 203856, "epoch": 1213} {"train_loss": -11.380146026611328, "global_step": 203857, "epoch": 1213} {"train_loss": -11.71786880493164, "global_step": 203858, "epoch": 1213} {"train_loss": -11.363595008850098, "global_step": 203859, "epoch": 1213} {"train_loss": -11.334696769714355, "global_step": 203860, "epoch": 1213} {"train_loss": -10.924227714538574, "global_step": 203861, "epoch": 1213} {"train_loss": -11.582395553588867, "global_step": 203862, "epoch": 1213} {"train_loss": -11.26002025604248, "global_step": 203863, "epoch": 1213} {"train_loss": -11.233274459838867, "global_step": 203864, "epoch": 1213} {"train_loss": -10.711590766906738, "global_step": 203865, "epoch": 1213} {"train_loss": -11.6327543258667, "global_step": 203866, "epoch": 1213} {"train_loss": -10.664505004882812, "global_step": 203867, "epoch": 1213} {"train_loss": -11.015764236450195, "global_step": 203868, "epoch": 1213} {"train_loss": -11.534528732299805, "global_step": 203869, "epoch": 1213} {"train_loss": -11.266733169555664, "global_step": 203870, "epoch": 1213} {"train_loss": -11.125276565551758, "global_step": 203871, "epoch": 1213} {"train_loss": -11.351552963256836, "global_step": 203872, "epoch": 1213} {"train_loss": -11.058210372924805, "global_step": 203873, "epoch": 1213} {"train_loss": -10.525144577026367, "global_step": 203874, "epoch": 1213} {"train_loss": -11.905109405517578, "global_step": 203875, "epoch": 1213} {"train_loss": -9.932473182678223, "global_step": 203876, "epoch": 1213} {"train_loss": -10.059184074401855, "global_step": 203877, "epoch": 1213} {"train_loss": -11.227813720703125, "global_step": 203878, "epoch": 1213} {"train_loss": -8.693780899047852, "global_step": 203879, "epoch": 1213} {"train_loss": -10.558075904846191, "global_step": 203880, "epoch": 1213} {"train_loss": -10.492627143859863, "global_step": 203881, "epoch": 1213} {"train_loss": -10.915470123291016, "global_step": 203882, "epoch": 1213} {"train_loss": -11.224661827087402, "global_step": 203883, "epoch": 1213} {"train_loss": -10.671056747436523, "global_step": 203884, "epoch": 1213} {"train_loss": -10.630535125732422, "global_step": 203885, "epoch": 1213} {"train_loss": -11.439475059509277, "global_step": 203886, "epoch": 1213} {"train_loss": -10.772878646850586, "global_step": 203887, "epoch": 1213} {"train_loss": -11.275491714477539, "global_step": 203888, "epoch": 1213} {"train_loss": -10.400354385375977, "global_step": 203889, "epoch": 1213} {"train_loss": -11.19623851776123, "global_step": 203890, "epoch": 1213} {"train_loss": -10.759337425231934, "global_step": 203891, "epoch": 1213} {"train_loss": -10.989106178283691, "global_step": 203892, "epoch": 1213} {"train_loss": -10.892492294311523, "global_step": 203893, "epoch": 1213} {"train_loss": -11.305758476257324, "global_step": 203894, "epoch": 1213} {"train_loss": -10.97184944152832, "global_step": 203895, "epoch": 1213} {"train_loss": -11.050629615783691, "global_step": 203896, "epoch": 1213} {"train_loss": -11.135377883911133, "global_step": 203897, "epoch": 1213} {"train_loss": -11.31568717956543, "global_step": 203898, "epoch": 1213} {"train_loss": -10.82075023651123, "global_step": 203899, "epoch": 1213} {"train_loss": -11.278082847595215, "global_step": 203900, "epoch": 1213} {"train_loss": -11.389699935913086, "global_step": 203901, "epoch": 1213} {"train_loss": -11.223443984985352, "global_step": 203902, "epoch": 1213} {"train_loss": -11.190767288208008, "global_step": 203903, "epoch": 1213} {"train_loss": -11.340962409973145, "global_step": 203904, "epoch": 1213} {"train_loss": -11.352145195007324, "global_step": 203905, "epoch": 1213} {"train_loss": -11.388669967651367, "global_step": 203906, "epoch": 1213} {"train_loss": -11.513274192810059, "global_step": 203907, "epoch": 1213} {"train_loss": -11.574420928955078, "global_step": 203908, "epoch": 1213} {"train_loss": -11.387187957763672, "global_step": 203909, "epoch": 1213} {"train_loss": -11.551309585571289, "global_step": 203910, "epoch": 1213} {"train_loss": -11.375075340270996, "global_step": 203911, "epoch": 1213} {"train_loss": -11.419965744018555, "global_step": 203912, "epoch": 1213} {"train_loss": -11.479862213134766, "global_step": 203913, "epoch": 1213} {"train_loss": -11.303863525390625, "global_step": 203914, "epoch": 1213} {"train_loss": -11.447041511535645, "global_step": 203915, "epoch": 1213} {"train_loss": -11.183713912963867, "global_step": 203916, "epoch": 1213} {"train_loss": -11.4992036819458, "global_step": 203917, "epoch": 1213} {"train_loss": -11.332723617553711, "global_step": 203918, "epoch": 1213} {"train_loss": -11.55626392364502, "global_step": 203919, "epoch": 1213} {"train_loss": -11.387762069702148, "global_step": 203920, "epoch": 1213} {"train_loss": -11.139715194702148, "global_step": 203921, "epoch": 1213} {"train_loss": -11.528873443603516, "global_step": 203922, "epoch": 1213} {"train_loss": -11.60369873046875, "global_step": 203923, "epoch": 1213} {"train_loss": -11.507036209106445, "global_step": 203924, "epoch": 1213} {"train_loss": -11.801689147949219, "global_step": 203925, "epoch": 1213} {"train_loss": -11.687509536743164, "global_step": 203926, "epoch": 1213} {"train_loss": -11.691574096679688, "global_step": 203927, "epoch": 1213} {"train_loss": -11.65276050567627, "global_step": 203928, "epoch": 1213} {"train_loss": -11.732217788696289, "global_step": 203929, "epoch": 1213} {"train_loss": -11.625104904174805, "global_step": 203930, "epoch": 1213} {"train_loss": -11.71091079711914, "global_step": 203931, "epoch": 1213} {"train_loss": -11.670082092285156, "global_step": 203932, "epoch": 1213} {"train_loss": -11.680095672607422, "global_step": 203933, "epoch": 1213} {"train_loss": -11.374988555908203, "global_step": 203934, "epoch": 1213} {"train_loss": -11.558614730834961, "global_step": 203935, "epoch": 1213} {"train_loss": -11.709304809570312, "global_step": 203936, "epoch": 1213} {"train_loss": -11.544183731079102, "global_step": 203937, "epoch": 1213} {"train_loss": -11.404500961303711, "global_step": 203938, "epoch": 1213} {"train_loss": -11.551761627197266, "global_step": 203939, "epoch": 1213} {"train_loss": -11.52782917022705, "global_step": 203940, "epoch": 1213} {"train_loss": -11.582428932189941, "global_step": 203941, "epoch": 1213} {"train_loss": -11.52706527709961, "global_step": 203942, "epoch": 1213} {"train_loss": -11.435229301452637, "global_step": 203943, "epoch": 1213} {"train_loss": -11.189096450805664, "global_step": 203944, "epoch": 1213} {"train_loss": -10.66956901550293, "global_step": 203945, "epoch": 1213} {"train_loss": -11.304839134216309, "global_step": 203946, "epoch": 1213} {"train_loss": -11.627323150634766, "global_step": 203947, "epoch": 1213} {"train_loss": -10.878623008728027, "global_step": 203948, "epoch": 1213} {"train_loss": -11.631114959716797, "global_step": 203949, "epoch": 1213} {"train_loss": -11.414833068847656, "global_step": 203950, "epoch": 1213} {"train_loss": -11.328271178972154, "global_step": 203951, "epoch": 1213, "val_loss": 256480.375} {"train_loss": -11.866333961486816, "global_step": 203952, "epoch": 1214} {"train_loss": -11.530111312866211, "global_step": 203953, "epoch": 1214} {"train_loss": -11.511829376220703, "global_step": 203954, "epoch": 1214} {"train_loss": -11.539648056030273, "global_step": 203955, "epoch": 1214} {"train_loss": -11.532020568847656, "global_step": 203956, "epoch": 1214} {"train_loss": -11.692667007446289, "global_step": 203957, "epoch": 1214} {"train_loss": -11.588226318359375, "global_step": 203958, "epoch": 1214} {"train_loss": -11.480712890625, "global_step": 203959, "epoch": 1214} {"train_loss": -11.598234176635742, "global_step": 203960, "epoch": 1214} {"train_loss": -11.735992431640625, "global_step": 203961, "epoch": 1214} {"train_loss": -11.321008682250977, "global_step": 203962, "epoch": 1214} {"train_loss": -11.16744327545166, "global_step": 203963, "epoch": 1214} {"train_loss": -11.561784744262695, "global_step": 203964, "epoch": 1214} {"train_loss": -11.459957122802734, "global_step": 203965, "epoch": 1214} {"train_loss": -11.040769577026367, "global_step": 203966, "epoch": 1214} {"train_loss": -10.347583770751953, "global_step": 203967, "epoch": 1214} {"train_loss": -11.40302848815918, "global_step": 203968, "epoch": 1214} {"train_loss": -11.771162033081055, "global_step": 203969, "epoch": 1214} {"train_loss": -11.171058654785156, "global_step": 203970, "epoch": 1214} {"train_loss": -11.791675567626953, "global_step": 203971, "epoch": 1214} {"train_loss": -11.59069538116455, "global_step": 203972, "epoch": 1214} {"train_loss": -11.641932487487793, "global_step": 203973, "epoch": 1214} {"train_loss": -11.741072654724121, "global_step": 203974, "epoch": 1214} {"train_loss": -11.570562362670898, "global_step": 203975, "epoch": 1214} {"train_loss": -11.814346313476562, "global_step": 203976, "epoch": 1214} {"train_loss": -11.765819549560547, "global_step": 203977, "epoch": 1214} {"train_loss": -11.496092796325684, "global_step": 203978, "epoch": 1214} {"train_loss": -11.59677505493164, "global_step": 203979, "epoch": 1214} {"train_loss": -11.583137512207031, "global_step": 203980, "epoch": 1214} {"train_loss": -11.097114562988281, "global_step": 203981, "epoch": 1214} {"train_loss": -11.617319107055664, "global_step": 203982, "epoch": 1214} {"train_loss": -11.324491500854492, "global_step": 203983, "epoch": 1214} {"train_loss": -10.172481536865234, "global_step": 203984, "epoch": 1214} {"train_loss": -10.516046524047852, "global_step": 203985, "epoch": 1214} {"train_loss": -11.15958309173584, "global_step": 203986, "epoch": 1214} {"train_loss": -11.022891998291016, "global_step": 203987, "epoch": 1214} {"train_loss": -10.692537307739258, "global_step": 203988, "epoch": 1214} {"train_loss": -10.708935737609863, "global_step": 203989, "epoch": 1214} {"train_loss": -10.95954418182373, "global_step": 203990, "epoch": 1214} {"train_loss": -10.904155731201172, "global_step": 203991, "epoch": 1214} {"train_loss": -10.383331298828125, "global_step": 203992, "epoch": 1214} {"train_loss": -10.056336402893066, "global_step": 203993, "epoch": 1214} {"train_loss": -10.440303802490234, "global_step": 203994, "epoch": 1214} {"train_loss": -9.615690231323242, "global_step": 203995, "epoch": 1214} {"train_loss": -11.29238224029541, "global_step": 203996, "epoch": 1214} {"train_loss": -8.64775276184082, "global_step": 203997, "epoch": 1214} {"train_loss": -10.543135643005371, "global_step": 203998, "epoch": 1214} {"train_loss": -9.56544303894043, "global_step": 203999, "epoch": 1214} {"train_loss": -10.565800666809082, "global_step": 204000, "epoch": 1214} {"train_loss": -10.809133529663086, "global_step": 204001, "epoch": 1214} {"train_loss": -10.981477737426758, "global_step": 204002, "epoch": 1214} {"train_loss": -10.392755508422852, "global_step": 204003, "epoch": 1214} {"train_loss": -10.60863971710205, "global_step": 204004, "epoch": 1214} {"train_loss": -11.006250381469727, "global_step": 204005, "epoch": 1214} {"train_loss": -10.404644012451172, "global_step": 204006, "epoch": 1214} {"train_loss": -10.814128875732422, "global_step": 204007, "epoch": 1214} {"train_loss": -10.928119659423828, "global_step": 204008, "epoch": 1214} {"train_loss": -10.612778663635254, "global_step": 204009, "epoch": 1214} {"train_loss": -10.588984489440918, "global_step": 204010, "epoch": 1214} {"train_loss": -11.015812873840332, "global_step": 204011, "epoch": 1214} {"train_loss": -10.675256729125977, "global_step": 204012, "epoch": 1214} {"train_loss": -11.048429489135742, "global_step": 204013, "epoch": 1214} {"train_loss": -10.915742874145508, "global_step": 204014, "epoch": 1214} {"train_loss": -11.067037582397461, "global_step": 204015, "epoch": 1214} {"train_loss": -11.025291442871094, "global_step": 204016, "epoch": 1214} {"train_loss": -11.166966438293457, "global_step": 204017, "epoch": 1214} {"train_loss": -11.300338745117188, "global_step": 204018, "epoch": 1214} {"train_loss": -11.091180801391602, "global_step": 204019, "epoch": 1214} {"train_loss": -11.12533187866211, "global_step": 204020, "epoch": 1214} {"train_loss": -11.147095680236816, "global_step": 204021, "epoch": 1214} {"train_loss": -11.043794631958008, "global_step": 204022, "epoch": 1214} {"train_loss": -11.223977088928223, "global_step": 204023, "epoch": 1214} {"train_loss": -11.389278411865234, "global_step": 204024, "epoch": 1214} {"train_loss": -11.144122123718262, "global_step": 204025, "epoch": 1214} {"train_loss": -11.18589973449707, "global_step": 204026, "epoch": 1214} {"train_loss": -11.438554763793945, "global_step": 204027, "epoch": 1214} {"train_loss": -11.174385070800781, "global_step": 204028, "epoch": 1214} {"train_loss": -11.29327392578125, "global_step": 204029, "epoch": 1214} {"train_loss": -11.282175064086914, "global_step": 204030, "epoch": 1214} {"train_loss": -11.429169654846191, "global_step": 204031, "epoch": 1214} {"train_loss": -11.158514022827148, "global_step": 204032, "epoch": 1214} {"train_loss": -11.353679656982422, "global_step": 204033, "epoch": 1214} {"train_loss": -11.240074157714844, "global_step": 204034, "epoch": 1214} {"train_loss": -11.598583221435547, "global_step": 204035, "epoch": 1214} {"train_loss": -11.66616439819336, "global_step": 204036, "epoch": 1214} {"train_loss": -11.473798751831055, "global_step": 204037, "epoch": 1214} {"train_loss": -11.487042427062988, "global_step": 204038, "epoch": 1214} {"train_loss": -11.494306564331055, "global_step": 204039, "epoch": 1214} {"train_loss": -11.744000434875488, "global_step": 204040, "epoch": 1214} {"train_loss": -11.678804397583008, "global_step": 204041, "epoch": 1214} {"train_loss": -11.689445495605469, "global_step": 204042, "epoch": 1214} {"train_loss": -11.700435638427734, "global_step": 204043, "epoch": 1214} {"train_loss": -11.557727813720703, "global_step": 204044, "epoch": 1214} {"train_loss": -11.607694625854492, "global_step": 204045, "epoch": 1214} {"train_loss": -11.472506523132324, "global_step": 204046, "epoch": 1214} {"train_loss": -11.682905197143555, "global_step": 204047, "epoch": 1214} {"train_loss": -11.504271507263184, "global_step": 204048, "epoch": 1214} {"train_loss": -11.836730003356934, "global_step": 204049, "epoch": 1214} {"train_loss": -11.666339874267578, "global_step": 204050, "epoch": 1214} {"train_loss": -11.6807861328125, "global_step": 204051, "epoch": 1214} {"train_loss": -11.745668411254883, "global_step": 204052, "epoch": 1214} {"train_loss": -11.539851188659668, "global_step": 204053, "epoch": 1214} {"train_loss": -11.944147109985352, "global_step": 204054, "epoch": 1214} {"train_loss": -11.655773162841797, "global_step": 204055, "epoch": 1214} {"train_loss": -11.824867248535156, "global_step": 204056, "epoch": 1214} {"train_loss": -11.641082763671875, "global_step": 204057, "epoch": 1214} {"train_loss": -11.531380653381348, "global_step": 204058, "epoch": 1214} {"train_loss": -11.446897506713867, "global_step": 204059, "epoch": 1214} {"train_loss": -11.66145133972168, "global_step": 204060, "epoch": 1214} {"train_loss": -11.436405181884766, "global_step": 204061, "epoch": 1214} {"train_loss": -11.921741485595703, "global_step": 204062, "epoch": 1214} {"train_loss": -11.57275104522705, "global_step": 204063, "epoch": 1214} {"train_loss": -11.747526168823242, "global_step": 204064, "epoch": 1214} {"train_loss": -11.52584457397461, "global_step": 204065, "epoch": 1214} {"train_loss": -11.617388725280762, "global_step": 204066, "epoch": 1214} {"train_loss": -11.746395111083984, "global_step": 204067, "epoch": 1214} {"train_loss": -11.066795349121094, "global_step": 204068, "epoch": 1214} {"train_loss": -11.04134750366211, "global_step": 204069, "epoch": 1214} {"train_loss": -11.718692779541016, "global_step": 204070, "epoch": 1214} {"train_loss": -11.128564834594727, "global_step": 204071, "epoch": 1214} {"train_loss": -10.962150573730469, "global_step": 204072, "epoch": 1214} {"train_loss": -11.37224292755127, "global_step": 204073, "epoch": 1214} {"train_loss": -11.250057220458984, "global_step": 204074, "epoch": 1214} {"train_loss": -11.439420700073242, "global_step": 204075, "epoch": 1214} {"train_loss": -11.398979187011719, "global_step": 204076, "epoch": 1214} {"train_loss": -11.14499568939209, "global_step": 204077, "epoch": 1214} {"train_loss": -11.08835220336914, "global_step": 204078, "epoch": 1214} {"train_loss": -10.906393051147461, "global_step": 204079, "epoch": 1214} {"train_loss": -11.164291381835938, "global_step": 204080, "epoch": 1214} {"train_loss": -11.278680801391602, "global_step": 204081, "epoch": 1214} {"train_loss": -10.924028396606445, "global_step": 204082, "epoch": 1214} {"train_loss": -11.667644500732422, "global_step": 204083, "epoch": 1214} {"train_loss": -10.994403839111328, "global_step": 204084, "epoch": 1214} {"train_loss": -11.383186340332031, "global_step": 204085, "epoch": 1214} {"train_loss": -10.280893325805664, "global_step": 204086, "epoch": 1214} {"train_loss": -11.072175979614258, "global_step": 204087, "epoch": 1214} {"train_loss": -11.104049682617188, "global_step": 204088, "epoch": 1214} {"train_loss": -10.74937629699707, "global_step": 204089, "epoch": 1214} {"train_loss": -11.58649730682373, "global_step": 204090, "epoch": 1214} {"train_loss": -10.272095680236816, "global_step": 204091, "epoch": 1214} {"train_loss": -10.600656509399414, "global_step": 204092, "epoch": 1214} {"train_loss": -11.304102897644043, "global_step": 204093, "epoch": 1214} {"train_loss": -10.30379867553711, "global_step": 204094, "epoch": 1214} {"train_loss": -11.439001083374023, "global_step": 204095, "epoch": 1214} {"train_loss": -10.943053245544434, "global_step": 204096, "epoch": 1214} {"train_loss": -11.019281387329102, "global_step": 204097, "epoch": 1214} {"train_loss": -11.125551223754883, "global_step": 204098, "epoch": 1214} {"train_loss": -10.84534740447998, "global_step": 204099, "epoch": 1214} {"train_loss": -11.188902854919434, "global_step": 204100, "epoch": 1214} {"train_loss": -11.018304824829102, "global_step": 204101, "epoch": 1214} {"train_loss": -11.454263687133789, "global_step": 204102, "epoch": 1214} {"train_loss": -11.28672981262207, "global_step": 204103, "epoch": 1214} {"train_loss": -11.512290954589844, "global_step": 204104, "epoch": 1214} {"train_loss": -11.17351245880127, "global_step": 204105, "epoch": 1214} {"train_loss": -11.512526512145996, "global_step": 204106, "epoch": 1214} {"train_loss": -11.408830642700195, "global_step": 204107, "epoch": 1214} {"train_loss": -11.357601165771484, "global_step": 204108, "epoch": 1214} {"train_loss": -11.491521835327148, "global_step": 204109, "epoch": 1214} {"train_loss": -11.523666381835938, "global_step": 204110, "epoch": 1214} {"train_loss": -11.387908935546875, "global_step": 204111, "epoch": 1214} {"train_loss": -11.282500267028809, "global_step": 204112, "epoch": 1214} {"train_loss": -11.645000457763672, "global_step": 204113, "epoch": 1214} {"train_loss": -11.537406921386719, "global_step": 204114, "epoch": 1214} {"train_loss": -11.488504409790039, "global_step": 204115, "epoch": 1214} {"train_loss": -11.174510955810547, "global_step": 204116, "epoch": 1214} {"train_loss": -11.435770034790039, "global_step": 204117, "epoch": 1214} {"train_loss": -11.515829086303711, "global_step": 204118, "epoch": 1214} {"train_loss": -11.232315307571774, "global_step": 204119, "epoch": 1214, "val_loss": 253722.46875} {"train_loss": -11.272682189941406, "global_step": 204120, "epoch": 1215} {"train_loss": -11.300911903381348, "global_step": 204121, "epoch": 1215} {"train_loss": -11.22237777709961, "global_step": 204122, "epoch": 1215} {"train_loss": -11.367538452148438, "global_step": 204123, "epoch": 1215} {"train_loss": -11.450723648071289, "global_step": 204124, "epoch": 1215} {"train_loss": -11.214079856872559, "global_step": 204125, "epoch": 1215} {"train_loss": -11.459136009216309, "global_step": 204126, "epoch": 1215} {"train_loss": -11.319258689880371, "global_step": 204127, "epoch": 1215} {"train_loss": -11.606659889221191, "global_step": 204128, "epoch": 1215} {"train_loss": -10.741323471069336, "global_step": 204129, "epoch": 1215} {"train_loss": -11.485578536987305, "global_step": 204130, "epoch": 1215} {"train_loss": -11.190088272094727, "global_step": 204131, "epoch": 1215} {"train_loss": -11.308636665344238, "global_step": 204132, "epoch": 1215} {"train_loss": -11.491134643554688, "global_step": 204133, "epoch": 1215} {"train_loss": -11.110893249511719, "global_step": 204134, "epoch": 1215} {"train_loss": -11.420787811279297, "global_step": 204135, "epoch": 1215} {"train_loss": -11.152833938598633, "global_step": 204136, "epoch": 1215} {"train_loss": -11.435636520385742, "global_step": 204137, "epoch": 1215} {"train_loss": -11.237096786499023, "global_step": 204138, "epoch": 1215} {"train_loss": -11.33070182800293, "global_step": 204139, "epoch": 1215} {"train_loss": -11.461135864257812, "global_step": 204140, "epoch": 1215} {"train_loss": -11.358871459960938, "global_step": 204141, "epoch": 1215} {"train_loss": -11.408975601196289, "global_step": 204142, "epoch": 1215} {"train_loss": -11.033700942993164, "global_step": 204143, "epoch": 1215} {"train_loss": -11.593557357788086, "global_step": 204144, "epoch": 1215} {"train_loss": -11.35138988494873, "global_step": 204145, "epoch": 1215} {"train_loss": -11.487245559692383, "global_step": 204146, "epoch": 1215} {"train_loss": -11.21332836151123, "global_step": 204147, "epoch": 1215} {"train_loss": -11.023804664611816, "global_step": 204148, "epoch": 1215} {"train_loss": -11.272468566894531, "global_step": 204149, "epoch": 1215} {"train_loss": -10.834638595581055, "global_step": 204150, "epoch": 1215} {"train_loss": -11.365842819213867, "global_step": 204151, "epoch": 1215} {"train_loss": -10.90421199798584, "global_step": 204152, "epoch": 1215} {"train_loss": -11.338905334472656, "global_step": 204153, "epoch": 1215} {"train_loss": -11.150463104248047, "global_step": 204154, "epoch": 1215} {"train_loss": -11.388965606689453, "global_step": 204155, "epoch": 1215} {"train_loss": -11.413237571716309, "global_step": 204156, "epoch": 1215} {"train_loss": -11.001461029052734, "global_step": 204157, "epoch": 1215} {"train_loss": -11.319931030273438, "global_step": 204158, "epoch": 1215} {"train_loss": -11.393943786621094, "global_step": 204159, "epoch": 1215} {"train_loss": -11.55472183227539, "global_step": 204160, "epoch": 1215} {"train_loss": -11.296961784362793, "global_step": 204161, "epoch": 1215} {"train_loss": -11.709772109985352, "global_step": 204162, "epoch": 1215} {"train_loss": -11.589041709899902, "global_step": 204163, "epoch": 1215} {"train_loss": -11.588281631469727, "global_step": 204164, "epoch": 1215} {"train_loss": -11.587417602539062, "global_step": 204165, "epoch": 1215} {"train_loss": -11.178162574768066, "global_step": 204166, "epoch": 1215} {"train_loss": -11.732194900512695, "global_step": 204167, "epoch": 1215} {"train_loss": -11.11253547668457, "global_step": 204168, "epoch": 1215} {"train_loss": -11.505830764770508, "global_step": 204169, "epoch": 1215} {"train_loss": -10.579460144042969, "global_step": 204170, "epoch": 1215} {"train_loss": -10.817774772644043, "global_step": 204171, "epoch": 1215} {"train_loss": -10.830659866333008, "global_step": 204172, "epoch": 1215} {"train_loss": -10.996971130371094, "global_step": 204173, "epoch": 1215} {"train_loss": -10.576528549194336, "global_step": 204174, "epoch": 1215} {"train_loss": -11.426328659057617, "global_step": 204175, "epoch": 1215} {"train_loss": -10.655471801757812, "global_step": 204176, "epoch": 1215} {"train_loss": -11.252815246582031, "global_step": 204177, "epoch": 1215} {"train_loss": -10.902179718017578, "global_step": 204178, "epoch": 1215} {"train_loss": -11.219280242919922, "global_step": 204179, "epoch": 1215} {"train_loss": -11.273235321044922, "global_step": 204180, "epoch": 1215} {"train_loss": -11.016029357910156, "global_step": 204181, "epoch": 1215} {"train_loss": -11.645758628845215, "global_step": 204182, "epoch": 1215} {"train_loss": -10.926612854003906, "global_step": 204183, "epoch": 1215} {"train_loss": -11.505722045898438, "global_step": 204184, "epoch": 1215} {"train_loss": -11.455583572387695, "global_step": 204185, "epoch": 1215} {"train_loss": -11.538614273071289, "global_step": 204186, "epoch": 1215} {"train_loss": -11.557655334472656, "global_step": 204187, "epoch": 1215} {"train_loss": -11.462579727172852, "global_step": 204188, "epoch": 1215} {"train_loss": -11.679877281188965, "global_step": 204189, "epoch": 1215} {"train_loss": -11.178166389465332, "global_step": 204190, "epoch": 1215} {"train_loss": -11.48928451538086, "global_step": 204191, "epoch": 1215} {"train_loss": -11.308942794799805, "global_step": 204192, "epoch": 1215} {"train_loss": -11.114100456237793, "global_step": 204193, "epoch": 1215} {"train_loss": -11.618755340576172, "global_step": 204194, "epoch": 1215} {"train_loss": -11.071417808532715, "global_step": 204195, "epoch": 1215} {"train_loss": -11.056458473205566, "global_step": 204196, "epoch": 1215} {"train_loss": -11.44904899597168, "global_step": 204197, "epoch": 1215} {"train_loss": -10.479219436645508, "global_step": 204198, "epoch": 1215} {"train_loss": -11.776150703430176, "global_step": 204199, "epoch": 1215} {"train_loss": -11.093744277954102, "global_step": 204200, "epoch": 1215} {"train_loss": -11.376687049865723, "global_step": 204201, "epoch": 1215} {"train_loss": -11.201274871826172, "global_step": 204202, "epoch": 1215} {"train_loss": -10.953704833984375, "global_step": 204203, "epoch": 1215} {"train_loss": -11.767230987548828, "global_step": 204204, "epoch": 1215} {"train_loss": -11.095598220825195, "global_step": 204205, "epoch": 1215} {"train_loss": -11.425251007080078, "global_step": 204206, "epoch": 1215} {"train_loss": -11.392518997192383, "global_step": 204207, "epoch": 1215} {"train_loss": -11.033384323120117, "global_step": 204208, "epoch": 1215} {"train_loss": -11.618354797363281, "global_step": 204209, "epoch": 1215} {"train_loss": -11.27835464477539, "global_step": 204210, "epoch": 1215} {"train_loss": -11.431364059448242, "global_step": 204211, "epoch": 1215} {"train_loss": -11.201842308044434, "global_step": 204212, "epoch": 1215} {"train_loss": -11.462248802185059, "global_step": 204213, "epoch": 1215} {"train_loss": -11.36453628540039, "global_step": 204214, "epoch": 1215} {"train_loss": -11.592819213867188, "global_step": 204215, "epoch": 1215} {"train_loss": -11.292686462402344, "global_step": 204216, "epoch": 1215} {"train_loss": -11.146690368652344, "global_step": 204217, "epoch": 1215} {"train_loss": -11.533981323242188, "global_step": 204218, "epoch": 1215} {"train_loss": -11.060426712036133, "global_step": 204219, "epoch": 1215} {"train_loss": -11.304276466369629, "global_step": 204220, "epoch": 1215} {"train_loss": -11.33745002746582, "global_step": 204221, "epoch": 1215} {"train_loss": -11.521615982055664, "global_step": 204222, "epoch": 1215} {"train_loss": -11.266069412231445, "global_step": 204223, "epoch": 1215} {"train_loss": -11.545265197753906, "global_step": 204224, "epoch": 1215} {"train_loss": -11.295855522155762, "global_step": 204225, "epoch": 1215} {"train_loss": -11.339323043823242, "global_step": 204226, "epoch": 1215} {"train_loss": -11.502604484558105, "global_step": 204227, "epoch": 1215} {"train_loss": -10.963560104370117, "global_step": 204228, "epoch": 1215} {"train_loss": -11.287761688232422, "global_step": 204229, "epoch": 1215} {"train_loss": -11.519323348999023, "global_step": 204230, "epoch": 1215} {"train_loss": -11.378792762756348, "global_step": 204231, "epoch": 1215} {"train_loss": -11.12601375579834, "global_step": 204232, "epoch": 1215} {"train_loss": -11.150257110595703, "global_step": 204233, "epoch": 1215} {"train_loss": -11.025003433227539, "global_step": 204234, "epoch": 1215} {"train_loss": -11.553645133972168, "global_step": 204235, "epoch": 1215} {"train_loss": -11.666217803955078, "global_step": 204236, "epoch": 1215} {"train_loss": -11.394966125488281, "global_step": 204237, "epoch": 1215} {"train_loss": -11.363350868225098, "global_step": 204238, "epoch": 1215} {"train_loss": -11.273927688598633, "global_step": 204239, "epoch": 1215} {"train_loss": -11.464139938354492, "global_step": 204240, "epoch": 1215} {"train_loss": -11.578546524047852, "global_step": 204241, "epoch": 1215} {"train_loss": -11.706883430480957, "global_step": 204242, "epoch": 1215} {"train_loss": -11.859546661376953, "global_step": 204243, "epoch": 1215} {"train_loss": -11.758798599243164, "global_step": 204244, "epoch": 1215} {"train_loss": -11.648679733276367, "global_step": 204245, "epoch": 1215} {"train_loss": -11.681473731994629, "global_step": 204246, "epoch": 1215} {"train_loss": -11.464619636535645, "global_step": 204247, "epoch": 1215} {"train_loss": -11.51190185546875, "global_step": 204248, "epoch": 1215} {"train_loss": -11.415533065795898, "global_step": 204249, "epoch": 1215} {"train_loss": -11.573680877685547, "global_step": 204250, "epoch": 1215} {"train_loss": -11.410846710205078, "global_step": 204251, "epoch": 1215} {"train_loss": -11.391557693481445, "global_step": 204252, "epoch": 1215} {"train_loss": -11.424430847167969, "global_step": 204253, "epoch": 1215} {"train_loss": -11.875581741333008, "global_step": 204254, "epoch": 1215} {"train_loss": -11.58415412902832, "global_step": 204255, "epoch": 1215} {"train_loss": -11.508672714233398, "global_step": 204256, "epoch": 1215} {"train_loss": -11.453388214111328, "global_step": 204257, "epoch": 1215} {"train_loss": -11.54247760772705, "global_step": 204258, "epoch": 1215} {"train_loss": -11.443167686462402, "global_step": 204259, "epoch": 1215} {"train_loss": -11.605179786682129, "global_step": 204260, "epoch": 1215} {"train_loss": -11.495019912719727, "global_step": 204261, "epoch": 1215} {"train_loss": -11.620004653930664, "global_step": 204262, "epoch": 1215} {"train_loss": -11.669546127319336, "global_step": 204263, "epoch": 1215} {"train_loss": -11.433924674987793, "global_step": 204264, "epoch": 1215} {"train_loss": -11.271768569946289, "global_step": 204265, "epoch": 1215} {"train_loss": -11.512130737304688, "global_step": 204266, "epoch": 1215} {"train_loss": -11.363746643066406, "global_step": 204267, "epoch": 1215} {"train_loss": -11.17526626586914, "global_step": 204268, "epoch": 1215} {"train_loss": -11.625174522399902, "global_step": 204269, "epoch": 1215} {"train_loss": -11.75904369354248, "global_step": 204270, "epoch": 1215} {"train_loss": -11.35232925415039, "global_step": 204271, "epoch": 1215} {"train_loss": -11.37322998046875, "global_step": 204272, "epoch": 1215} {"train_loss": -11.834232330322266, "global_step": 204273, "epoch": 1215} {"train_loss": -11.490219116210938, "global_step": 204274, "epoch": 1215} {"train_loss": -11.484498977661133, "global_step": 204275, "epoch": 1215} {"train_loss": -11.719932556152344, "global_step": 204276, "epoch": 1215} {"train_loss": -11.421414375305176, "global_step": 204277, "epoch": 1215} {"train_loss": -11.676998138427734, "global_step": 204278, "epoch": 1215} {"train_loss": -11.742020606994629, "global_step": 204279, "epoch": 1215} {"train_loss": -11.620983123779297, "global_step": 204280, "epoch": 1215} {"train_loss": -11.887739181518555, "global_step": 204281, "epoch": 1215} {"train_loss": -11.708856582641602, "global_step": 204282, "epoch": 1215} {"train_loss": -11.66508960723877, "global_step": 204283, "epoch": 1215} {"train_loss": -11.664276123046875, "global_step": 204284, "epoch": 1215} {"train_loss": -11.644670486450195, "global_step": 204285, "epoch": 1215} {"train_loss": -11.555122375488281, "global_step": 204286, "epoch": 1215} {"train_loss": -11.371703374953498, "global_step": 204287, "epoch": 1215, "val_loss": 252181.171875, "train_action_mse_error": 5.220681667327881} {"train_loss": -9.345122337341309, "global_step": 204288, "epoch": 1216} {"train_loss": -10.817829132080078, "global_step": 204289, "epoch": 1216} {"train_loss": -11.5504732131958, "global_step": 204290, "epoch": 1216} {"train_loss": -9.45605754852295, "global_step": 204291, "epoch": 1216} {"train_loss": -11.398962020874023, "global_step": 204292, "epoch": 1216} {"train_loss": -10.019572257995605, "global_step": 204293, "epoch": 1216} {"train_loss": -8.321123123168945, "global_step": 204294, "epoch": 1216} {"train_loss": -8.969585418701172, "global_step": 204295, "epoch": 1216} {"train_loss": -10.314192771911621, "global_step": 204296, "epoch": 1216} {"train_loss": -9.834125518798828, "global_step": 204297, "epoch": 1216} {"train_loss": -8.1610107421875, "global_step": 204298, "epoch": 1216} {"train_loss": -10.760610580444336, "global_step": 204299, "epoch": 1216} {"train_loss": -7.088257789611816, "global_step": 204300, "epoch": 1216} {"train_loss": -8.337945938110352, "global_step": 204301, "epoch": 1216} {"train_loss": -8.817048072814941, "global_step": 204302, "epoch": 1216} {"train_loss": -8.720823287963867, "global_step": 204303, "epoch": 1216} {"train_loss": -10.005426406860352, "global_step": 204304, "epoch": 1216} {"train_loss": -8.23910140991211, "global_step": 204305, "epoch": 1216} {"train_loss": -9.629602432250977, "global_step": 204306, "epoch": 1216} {"train_loss": -8.898338317871094, "global_step": 204307, "epoch": 1216} {"train_loss": -10.884492874145508, "global_step": 204308, "epoch": 1216} {"train_loss": -9.408885955810547, "global_step": 204309, "epoch": 1216} {"train_loss": -10.524187088012695, "global_step": 204310, "epoch": 1216} {"train_loss": -9.612375259399414, "global_step": 204311, "epoch": 1216} {"train_loss": -9.617963790893555, "global_step": 204312, "epoch": 1216} {"train_loss": -10.4161376953125, "global_step": 204313, "epoch": 1216} {"train_loss": -8.938417434692383, "global_step": 204314, "epoch": 1216} {"train_loss": -10.886859893798828, "global_step": 204315, "epoch": 1216} {"train_loss": -8.36819839477539, "global_step": 204316, "epoch": 1216} {"train_loss": -9.422399520874023, "global_step": 204317, "epoch": 1216} {"train_loss": -10.397811889648438, "global_step": 204318, "epoch": 1216} {"train_loss": -9.799243927001953, "global_step": 204319, "epoch": 1216} {"train_loss": -10.78101921081543, "global_step": 204320, "epoch": 1216} {"train_loss": -10.281695365905762, "global_step": 204321, "epoch": 1216} {"train_loss": -10.280808448791504, "global_step": 204322, "epoch": 1216} {"train_loss": -10.907289505004883, "global_step": 204323, "epoch": 1216} {"train_loss": -10.469778060913086, "global_step": 204324, "epoch": 1216} {"train_loss": -10.742898941040039, "global_step": 204325, "epoch": 1216} {"train_loss": -11.122098922729492, "global_step": 204326, "epoch": 1216} {"train_loss": -10.811944007873535, "global_step": 204327, "epoch": 1216} {"train_loss": -10.4977388381958, "global_step": 204328, "epoch": 1216} {"train_loss": -11.046326637268066, "global_step": 204329, "epoch": 1216} {"train_loss": -10.614814758300781, "global_step": 204330, "epoch": 1216} {"train_loss": -10.784332275390625, "global_step": 204331, "epoch": 1216} {"train_loss": -11.127544403076172, "global_step": 204332, "epoch": 1216} {"train_loss": -10.870704650878906, "global_step": 204333, "epoch": 1216} {"train_loss": -10.845355033874512, "global_step": 204334, "epoch": 1216} {"train_loss": -11.233399391174316, "global_step": 204335, "epoch": 1216} {"train_loss": -10.932564735412598, "global_step": 204336, "epoch": 1216} {"train_loss": -10.970727920532227, "global_step": 204337, "epoch": 1216} {"train_loss": -11.068196296691895, "global_step": 204338, "epoch": 1216} {"train_loss": -10.930915832519531, "global_step": 204339, "epoch": 1216} {"train_loss": -11.137569427490234, "global_step": 204340, "epoch": 1216} {"train_loss": -11.159602165222168, "global_step": 204341, "epoch": 1216} {"train_loss": -11.122968673706055, "global_step": 204342, "epoch": 1216} {"train_loss": -11.191137313842773, "global_step": 204343, "epoch": 1216} {"train_loss": -11.371593475341797, "global_step": 204344, "epoch": 1216} {"train_loss": -11.237847328186035, "global_step": 204345, "epoch": 1216} {"train_loss": -11.336344718933105, "global_step": 204346, "epoch": 1216} {"train_loss": -11.298741340637207, "global_step": 204347, "epoch": 1216} {"train_loss": -11.138737678527832, "global_step": 204348, "epoch": 1216} {"train_loss": -11.4298677444458, "global_step": 204349, "epoch": 1216} {"train_loss": -11.283792495727539, "global_step": 204350, "epoch": 1216} {"train_loss": -11.373146057128906, "global_step": 204351, "epoch": 1216} {"train_loss": -11.300167083740234, "global_step": 204352, "epoch": 1216} {"train_loss": -11.379207611083984, "global_step": 204353, "epoch": 1216} {"train_loss": -11.29768180847168, "global_step": 204354, "epoch": 1216} {"train_loss": -11.28515625, "global_step": 204355, "epoch": 1216} {"train_loss": -11.574300765991211, "global_step": 204356, "epoch": 1216} {"train_loss": -11.426326751708984, "global_step": 204357, "epoch": 1216} {"train_loss": -11.410075187683105, "global_step": 204358, "epoch": 1216} {"train_loss": -11.343700408935547, "global_step": 204359, "epoch": 1216} {"train_loss": -11.457487106323242, "global_step": 204360, "epoch": 1216} {"train_loss": -11.578781127929688, "global_step": 204361, "epoch": 1216} {"train_loss": -11.566566467285156, "global_step": 204362, "epoch": 1216} {"train_loss": -11.544706344604492, "global_step": 204363, "epoch": 1216} {"train_loss": -11.746639251708984, "global_step": 204364, "epoch": 1216} {"train_loss": -11.457170486450195, "global_step": 204365, "epoch": 1216} {"train_loss": -11.63165283203125, "global_step": 204366, "epoch": 1216} {"train_loss": -11.481156349182129, "global_step": 204367, "epoch": 1216} {"train_loss": -11.59378719329834, "global_step": 204368, "epoch": 1216} {"train_loss": -11.621602058410645, "global_step": 204369, "epoch": 1216} {"train_loss": -11.47610092163086, "global_step": 204370, "epoch": 1216} {"train_loss": -11.677800178527832, "global_step": 204371, "epoch": 1216} {"train_loss": -11.469545364379883, "global_step": 204372, "epoch": 1216} {"train_loss": -11.727041244506836, "global_step": 204373, "epoch": 1216} {"train_loss": -11.742156982421875, "global_step": 204374, "epoch": 1216} {"train_loss": -11.647597312927246, "global_step": 204375, "epoch": 1216} {"train_loss": -11.559477806091309, "global_step": 204376, "epoch": 1216} {"train_loss": -11.606021881103516, "global_step": 204377, "epoch": 1216} {"train_loss": -11.713251113891602, "global_step": 204378, "epoch": 1216} {"train_loss": -11.613696098327637, "global_step": 204379, "epoch": 1216} {"train_loss": -11.548683166503906, "global_step": 204380, "epoch": 1216} {"train_loss": -11.693575859069824, "global_step": 204381, "epoch": 1216} {"train_loss": -11.5543851852417, "global_step": 204382, "epoch": 1216} {"train_loss": -11.504573822021484, "global_step": 204383, "epoch": 1216} {"train_loss": -11.777294158935547, "global_step": 204384, "epoch": 1216} {"train_loss": -11.754829406738281, "global_step": 204385, "epoch": 1216} {"train_loss": -11.755084991455078, "global_step": 204386, "epoch": 1216} {"train_loss": -11.879419326782227, "global_step": 204387, "epoch": 1216} {"train_loss": -11.762309074401855, "global_step": 204388, "epoch": 1216} {"train_loss": -11.551562309265137, "global_step": 204389, "epoch": 1216} {"train_loss": -11.772490501403809, "global_step": 204390, "epoch": 1216} {"train_loss": -11.824179649353027, "global_step": 204391, "epoch": 1216} {"train_loss": -11.912599563598633, "global_step": 204392, "epoch": 1216} {"train_loss": -11.902691841125488, "global_step": 204393, "epoch": 1216} {"train_loss": -11.988120079040527, "global_step": 204394, "epoch": 1216} {"train_loss": -11.480464935302734, "global_step": 204395, "epoch": 1216} {"train_loss": -11.513391494750977, "global_step": 204396, "epoch": 1216} {"train_loss": -11.022356986999512, "global_step": 204397, "epoch": 1216} {"train_loss": -11.377045631408691, "global_step": 204398, "epoch": 1216} {"train_loss": -11.688283920288086, "global_step": 204399, "epoch": 1216} {"train_loss": -10.030933380126953, "global_step": 204400, "epoch": 1216} {"train_loss": -6.332075119018555, "global_step": 204401, "epoch": 1216} {"train_loss": -10.368256568908691, "global_step": 204402, "epoch": 1216} {"train_loss": -8.369831085205078, "global_step": 204403, "epoch": 1216} {"train_loss": -10.335383415222168, "global_step": 204404, "epoch": 1216} {"train_loss": -9.672274589538574, "global_step": 204405, "epoch": 1216} {"train_loss": -10.710525512695312, "global_step": 204406, "epoch": 1216} {"train_loss": -9.306543350219727, "global_step": 204407, "epoch": 1216} {"train_loss": -9.894563674926758, "global_step": 204408, "epoch": 1216} {"train_loss": -9.675132751464844, "global_step": 204409, "epoch": 1216} {"train_loss": -9.829107284545898, "global_step": 204410, "epoch": 1216} {"train_loss": -10.07894229888916, "global_step": 204411, "epoch": 1216} {"train_loss": -10.487590789794922, "global_step": 204412, "epoch": 1216} {"train_loss": -9.558956146240234, "global_step": 204413, "epoch": 1216} {"train_loss": -10.526346206665039, "global_step": 204414, "epoch": 1216} {"train_loss": -10.216754913330078, "global_step": 204415, "epoch": 1216} {"train_loss": -10.396112442016602, "global_step": 204416, "epoch": 1216} {"train_loss": -10.944988250732422, "global_step": 204417, "epoch": 1216} {"train_loss": -10.760823249816895, "global_step": 204418, "epoch": 1216} {"train_loss": -10.67081356048584, "global_step": 204419, "epoch": 1216} {"train_loss": -11.084711074829102, "global_step": 204420, "epoch": 1216} {"train_loss": -10.926861763000488, "global_step": 204421, "epoch": 1216} {"train_loss": -10.656177520751953, "global_step": 204422, "epoch": 1216} {"train_loss": -11.080129623413086, "global_step": 204423, "epoch": 1216} {"train_loss": -10.806678771972656, "global_step": 204424, "epoch": 1216} {"train_loss": -10.993446350097656, "global_step": 204425, "epoch": 1216} {"train_loss": -10.863380432128906, "global_step": 204426, "epoch": 1216} {"train_loss": -10.980484962463379, "global_step": 204427, "epoch": 1216} {"train_loss": -11.046979904174805, "global_step": 204428, "epoch": 1216} {"train_loss": -10.864280700683594, "global_step": 204429, "epoch": 1216} {"train_loss": -11.30485725402832, "global_step": 204430, "epoch": 1216} {"train_loss": -10.867030143737793, "global_step": 204431, "epoch": 1216} {"train_loss": -10.984848022460938, "global_step": 204432, "epoch": 1216} {"train_loss": -10.971407890319824, "global_step": 204433, "epoch": 1216} {"train_loss": -11.154595375061035, "global_step": 204434, "epoch": 1216} {"train_loss": -11.031371116638184, "global_step": 204435, "epoch": 1216} {"train_loss": -11.111120223999023, "global_step": 204436, "epoch": 1216} {"train_loss": -11.144558906555176, "global_step": 204437, "epoch": 1216} {"train_loss": -11.375774383544922, "global_step": 204438, "epoch": 1216} {"train_loss": -11.052528381347656, "global_step": 204439, "epoch": 1216} {"train_loss": -11.193404197692871, "global_step": 204440, "epoch": 1216} {"train_loss": -11.142007827758789, "global_step": 204441, "epoch": 1216} {"train_loss": -10.990355491638184, "global_step": 204442, "epoch": 1216} {"train_loss": -11.253540992736816, "global_step": 204443, "epoch": 1216} {"train_loss": -11.211328506469727, "global_step": 204444, "epoch": 1216} {"train_loss": -11.100835800170898, "global_step": 204445, "epoch": 1216} {"train_loss": -11.350128173828125, "global_step": 204446, "epoch": 1216} {"train_loss": -11.183181762695312, "global_step": 204447, "epoch": 1216} {"train_loss": -11.362380981445312, "global_step": 204448, "epoch": 1216} {"train_loss": -11.28117561340332, "global_step": 204449, "epoch": 1216} {"train_loss": -10.990553855895996, "global_step": 204450, "epoch": 1216} {"train_loss": -11.28941535949707, "global_step": 204451, "epoch": 1216} {"train_loss": -11.316771507263184, "global_step": 204452, "epoch": 1216} {"train_loss": -11.373546600341797, "global_step": 204453, "epoch": 1216} {"train_loss": -11.386287689208984, "global_step": 204454, "epoch": 1216} {"train_loss": -10.789251526196798, "global_step": 204455, "epoch": 1216, "val_loss": 255841.421875} {"train_loss": -11.595257759094238, "global_step": 204456, "epoch": 1217} {"train_loss": -11.379026412963867, "global_step": 204457, "epoch": 1217} {"train_loss": -11.31959342956543, "global_step": 204458, "epoch": 1217} {"train_loss": -11.497669219970703, "global_step": 204459, "epoch": 1217} {"train_loss": -11.343910217285156, "global_step": 204460, "epoch": 1217} {"train_loss": -11.554073333740234, "global_step": 204461, "epoch": 1217} {"train_loss": -11.33791732788086, "global_step": 204462, "epoch": 1217} {"train_loss": -11.643404006958008, "global_step": 204463, "epoch": 1217} {"train_loss": -11.360807418823242, "global_step": 204464, "epoch": 1217} {"train_loss": -11.379638671875, "global_step": 204465, "epoch": 1217} {"train_loss": -11.333688735961914, "global_step": 204466, "epoch": 1217} {"train_loss": -11.516398429870605, "global_step": 204467, "epoch": 1217} {"train_loss": -11.433782577514648, "global_step": 204468, "epoch": 1217} {"train_loss": -11.522476196289062, "global_step": 204469, "epoch": 1217} {"train_loss": -11.46235179901123, "global_step": 204470, "epoch": 1217} {"train_loss": -11.385232925415039, "global_step": 204471, "epoch": 1217} {"train_loss": -11.186616897583008, "global_step": 204472, "epoch": 1217} {"train_loss": -11.53415298461914, "global_step": 204473, "epoch": 1217} {"train_loss": -11.593629837036133, "global_step": 204474, "epoch": 1217} {"train_loss": -11.396026611328125, "global_step": 204475, "epoch": 1217} {"train_loss": -11.487513542175293, "global_step": 204476, "epoch": 1217} {"train_loss": -11.613264083862305, "global_step": 204477, "epoch": 1217} {"train_loss": -11.83181095123291, "global_step": 204478, "epoch": 1217} {"train_loss": -11.790151596069336, "global_step": 204479, "epoch": 1217} {"train_loss": -11.552783966064453, "global_step": 204480, "epoch": 1217} {"train_loss": -11.603950500488281, "global_step": 204481, "epoch": 1217} {"train_loss": -11.632076263427734, "global_step": 204482, "epoch": 1217} {"train_loss": -11.517175674438477, "global_step": 204483, "epoch": 1217} {"train_loss": -11.84024429321289, "global_step": 204484, "epoch": 1217} {"train_loss": -11.485798835754395, "global_step": 204485, "epoch": 1217} {"train_loss": -11.678686141967773, "global_step": 204486, "epoch": 1217} {"train_loss": -11.4697265625, "global_step": 204487, "epoch": 1217} {"train_loss": -11.359243392944336, "global_step": 204488, "epoch": 1217} {"train_loss": -11.553485870361328, "global_step": 204489, "epoch": 1217} {"train_loss": -11.33883285522461, "global_step": 204490, "epoch": 1217} {"train_loss": -11.737232208251953, "global_step": 204491, "epoch": 1217} {"train_loss": -11.602360725402832, "global_step": 204492, "epoch": 1217} {"train_loss": -11.725247383117676, "global_step": 204493, "epoch": 1217} {"train_loss": -11.439777374267578, "global_step": 204494, "epoch": 1217} {"train_loss": -11.594528198242188, "global_step": 204495, "epoch": 1217} {"train_loss": -11.701096534729004, "global_step": 204496, "epoch": 1217} {"train_loss": -11.342658996582031, "global_step": 204497, "epoch": 1217} {"train_loss": -11.402498245239258, "global_step": 204498, "epoch": 1217} {"train_loss": -11.629485130310059, "global_step": 204499, "epoch": 1217} {"train_loss": -11.602633476257324, "global_step": 204500, "epoch": 1217} {"train_loss": -11.22606372833252, "global_step": 204501, "epoch": 1217} {"train_loss": -11.548439979553223, "global_step": 204502, "epoch": 1217} {"train_loss": -11.094810485839844, "global_step": 204503, "epoch": 1217} {"train_loss": -10.771618843078613, "global_step": 204504, "epoch": 1217} {"train_loss": -11.559968948364258, "global_step": 204505, "epoch": 1217} {"train_loss": -10.056821823120117, "global_step": 204506, "epoch": 1217} {"train_loss": -10.987537384033203, "global_step": 204507, "epoch": 1217} {"train_loss": -11.299304008483887, "global_step": 204508, "epoch": 1217} {"train_loss": -9.993366241455078, "global_step": 204509, "epoch": 1217} {"train_loss": -11.185422897338867, "global_step": 204510, "epoch": 1217} {"train_loss": -10.69923210144043, "global_step": 204511, "epoch": 1217} {"train_loss": -11.216948509216309, "global_step": 204512, "epoch": 1217} {"train_loss": -10.90127944946289, "global_step": 204513, "epoch": 1217} {"train_loss": -11.250930786132812, "global_step": 204514, "epoch": 1217} {"train_loss": -11.068350791931152, "global_step": 204515, "epoch": 1217} {"train_loss": -10.852657318115234, "global_step": 204516, "epoch": 1217} {"train_loss": -11.165685653686523, "global_step": 204517, "epoch": 1217} {"train_loss": -11.045476913452148, "global_step": 204518, "epoch": 1217} {"train_loss": -11.631645202636719, "global_step": 204519, "epoch": 1217} {"train_loss": -11.138503074645996, "global_step": 204520, "epoch": 1217} {"train_loss": -11.175069808959961, "global_step": 204521, "epoch": 1217} {"train_loss": -11.432533264160156, "global_step": 204522, "epoch": 1217} {"train_loss": -11.1659517288208, "global_step": 204523, "epoch": 1217} {"train_loss": -11.481486320495605, "global_step": 204524, "epoch": 1217} {"train_loss": -11.289031028747559, "global_step": 204525, "epoch": 1217} {"train_loss": -11.339478492736816, "global_step": 204526, "epoch": 1217} {"train_loss": -11.44267749786377, "global_step": 204527, "epoch": 1217} {"train_loss": -11.308710098266602, "global_step": 204528, "epoch": 1217} {"train_loss": -11.44689655303955, "global_step": 204529, "epoch": 1217} {"train_loss": -11.318439483642578, "global_step": 204530, "epoch": 1217} {"train_loss": -11.441705703735352, "global_step": 204531, "epoch": 1217} {"train_loss": -11.248002052307129, "global_step": 204532, "epoch": 1217} {"train_loss": -11.51091480255127, "global_step": 204533, "epoch": 1217} {"train_loss": -11.457515716552734, "global_step": 204534, "epoch": 1217} {"train_loss": -11.541793823242188, "global_step": 204535, "epoch": 1217} {"train_loss": -11.76862621307373, "global_step": 204536, "epoch": 1217} {"train_loss": -11.384980201721191, "global_step": 204537, "epoch": 1217} {"train_loss": -11.799545288085938, "global_step": 204538, "epoch": 1217} {"train_loss": -11.253861427307129, "global_step": 204539, "epoch": 1217} {"train_loss": -11.34182357788086, "global_step": 204540, "epoch": 1217} {"train_loss": -11.51643180847168, "global_step": 204541, "epoch": 1217} {"train_loss": -11.460478782653809, "global_step": 204542, "epoch": 1217} {"train_loss": -11.728263854980469, "global_step": 204543, "epoch": 1217} {"train_loss": -11.360882759094238, "global_step": 204544, "epoch": 1217} {"train_loss": -11.670225143432617, "global_step": 204545, "epoch": 1217} {"train_loss": -11.510242462158203, "global_step": 204546, "epoch": 1217} {"train_loss": -11.071695327758789, "global_step": 204547, "epoch": 1217} {"train_loss": -11.708802223205566, "global_step": 204548, "epoch": 1217} {"train_loss": -11.314798355102539, "global_step": 204549, "epoch": 1217} {"train_loss": -11.210884094238281, "global_step": 204550, "epoch": 1217} {"train_loss": -11.357301712036133, "global_step": 204551, "epoch": 1217} {"train_loss": -11.237443923950195, "global_step": 204552, "epoch": 1217} {"train_loss": -11.497612953186035, "global_step": 204553, "epoch": 1217} {"train_loss": -11.455096244812012, "global_step": 204554, "epoch": 1217} {"train_loss": -11.09292984008789, "global_step": 204555, "epoch": 1217} {"train_loss": -11.452136993408203, "global_step": 204556, "epoch": 1217} {"train_loss": -11.352533340454102, "global_step": 204557, "epoch": 1217} {"train_loss": -11.348152160644531, "global_step": 204558, "epoch": 1217} {"train_loss": -10.976027488708496, "global_step": 204559, "epoch": 1217} {"train_loss": -11.505670547485352, "global_step": 204560, "epoch": 1217} {"train_loss": -11.303105354309082, "global_step": 204561, "epoch": 1217} {"train_loss": -11.63705825805664, "global_step": 204562, "epoch": 1217} {"train_loss": -11.51922607421875, "global_step": 204563, "epoch": 1217} {"train_loss": -11.336920738220215, "global_step": 204564, "epoch": 1217} {"train_loss": -11.435447692871094, "global_step": 204565, "epoch": 1217} {"train_loss": -11.131978988647461, "global_step": 204566, "epoch": 1217} {"train_loss": -11.47853946685791, "global_step": 204567, "epoch": 1217} {"train_loss": -11.621322631835938, "global_step": 204568, "epoch": 1217} {"train_loss": -11.232141494750977, "global_step": 204569, "epoch": 1217} {"train_loss": -11.920984268188477, "global_step": 204570, "epoch": 1217} {"train_loss": -11.490259170532227, "global_step": 204571, "epoch": 1217} {"train_loss": -11.646882057189941, "global_step": 204572, "epoch": 1217} {"train_loss": -11.552608489990234, "global_step": 204573, "epoch": 1217} {"train_loss": -11.582599639892578, "global_step": 204574, "epoch": 1217} {"train_loss": -11.129644393920898, "global_step": 204575, "epoch": 1217} {"train_loss": -11.516037940979004, "global_step": 204576, "epoch": 1217} {"train_loss": -11.203014373779297, "global_step": 204577, "epoch": 1217} {"train_loss": -11.55054759979248, "global_step": 204578, "epoch": 1217} {"train_loss": -11.010300636291504, "global_step": 204579, "epoch": 1217} {"train_loss": -11.361812591552734, "global_step": 204580, "epoch": 1217} {"train_loss": -11.14399528503418, "global_step": 204581, "epoch": 1217} {"train_loss": -11.436728477478027, "global_step": 204582, "epoch": 1217} {"train_loss": -11.408565521240234, "global_step": 204583, "epoch": 1217} {"train_loss": -11.317024230957031, "global_step": 204584, "epoch": 1217} {"train_loss": -11.355646133422852, "global_step": 204585, "epoch": 1217} {"train_loss": -11.61385726928711, "global_step": 204586, "epoch": 1217} {"train_loss": -11.057914733886719, "global_step": 204587, "epoch": 1217} {"train_loss": -11.247854232788086, "global_step": 204588, "epoch": 1217} {"train_loss": -11.688726425170898, "global_step": 204589, "epoch": 1217} {"train_loss": -11.388870239257812, "global_step": 204590, "epoch": 1217} {"train_loss": -11.600493431091309, "global_step": 204591, "epoch": 1217} {"train_loss": -11.65047836303711, "global_step": 204592, "epoch": 1217} {"train_loss": -11.417627334594727, "global_step": 204593, "epoch": 1217} {"train_loss": -11.75468635559082, "global_step": 204594, "epoch": 1217} {"train_loss": -10.757585525512695, "global_step": 204595, "epoch": 1217} {"train_loss": -11.645978927612305, "global_step": 204596, "epoch": 1217} {"train_loss": -11.39173698425293, "global_step": 204597, "epoch": 1217} {"train_loss": -11.014931678771973, "global_step": 204598, "epoch": 1217} {"train_loss": -11.769176483154297, "global_step": 204599, "epoch": 1217} {"train_loss": -11.19784927368164, "global_step": 204600, "epoch": 1217} {"train_loss": -11.138213157653809, "global_step": 204601, "epoch": 1217} {"train_loss": -11.565351486206055, "global_step": 204602, "epoch": 1217} {"train_loss": -11.246833801269531, "global_step": 204603, "epoch": 1217} {"train_loss": -11.540395736694336, "global_step": 204604, "epoch": 1217} {"train_loss": -11.635726928710938, "global_step": 204605, "epoch": 1217} {"train_loss": -11.731295585632324, "global_step": 204606, "epoch": 1217} {"train_loss": -11.4354248046875, "global_step": 204607, "epoch": 1217} {"train_loss": -11.625288963317871, "global_step": 204608, "epoch": 1217} {"train_loss": -11.345534324645996, "global_step": 204609, "epoch": 1217} {"train_loss": -11.672978401184082, "global_step": 204610, "epoch": 1217} {"train_loss": -11.483194351196289, "global_step": 204611, "epoch": 1217} {"train_loss": -11.624187469482422, "global_step": 204612, "epoch": 1217} {"train_loss": -11.379450798034668, "global_step": 204613, "epoch": 1217} {"train_loss": -11.459978103637695, "global_step": 204614, "epoch": 1217} {"train_loss": -11.482280731201172, "global_step": 204615, "epoch": 1217} {"train_loss": -11.053033828735352, "global_step": 204616, "epoch": 1217} {"train_loss": -11.242074966430664, "global_step": 204617, "epoch": 1217} {"train_loss": -10.393476486206055, "global_step": 204618, "epoch": 1217} {"train_loss": -10.683470726013184, "global_step": 204619, "epoch": 1217} {"train_loss": -10.693571090698242, "global_step": 204620, "epoch": 1217} {"train_loss": -10.413818359375, "global_step": 204621, "epoch": 1217} {"train_loss": -10.80331039428711, "global_step": 204622, "epoch": 1217} {"train_loss": -11.369099798656645, "global_step": 204623, "epoch": 1217, "val_loss": 255147.90625} {"train_loss": -10.075225830078125, "global_step": 204624, "epoch": 1218} {"train_loss": -10.790064811706543, "global_step": 204625, "epoch": 1218} {"train_loss": -9.953563690185547, "global_step": 204626, "epoch": 1218} {"train_loss": -11.326071739196777, "global_step": 204627, "epoch": 1218} {"train_loss": -10.069583892822266, "global_step": 204628, "epoch": 1218} {"train_loss": -10.380480766296387, "global_step": 204629, "epoch": 1218} {"train_loss": -10.84449577331543, "global_step": 204630, "epoch": 1218} {"train_loss": -10.64541244506836, "global_step": 204631, "epoch": 1218} {"train_loss": -10.81879711151123, "global_step": 204632, "epoch": 1218} {"train_loss": -10.63879108428955, "global_step": 204633, "epoch": 1218} {"train_loss": -10.800491333007812, "global_step": 204634, "epoch": 1218} {"train_loss": -10.82821273803711, "global_step": 204635, "epoch": 1218} {"train_loss": -10.60000228881836, "global_step": 204636, "epoch": 1218} {"train_loss": -11.279775619506836, "global_step": 204637, "epoch": 1218} {"train_loss": -10.496528625488281, "global_step": 204638, "epoch": 1218} {"train_loss": -11.118888854980469, "global_step": 204639, "epoch": 1218} {"train_loss": -10.671635627746582, "global_step": 204640, "epoch": 1218} {"train_loss": -11.201143264770508, "global_step": 204641, "epoch": 1218} {"train_loss": -10.969663619995117, "global_step": 204642, "epoch": 1218} {"train_loss": -10.817962646484375, "global_step": 204643, "epoch": 1218} {"train_loss": -11.391002655029297, "global_step": 204644, "epoch": 1218} {"train_loss": -10.786829948425293, "global_step": 204645, "epoch": 1218} {"train_loss": -11.126355171203613, "global_step": 204646, "epoch": 1218} {"train_loss": -11.043314933776855, "global_step": 204647, "epoch": 1218} {"train_loss": -10.922235488891602, "global_step": 204648, "epoch": 1218} {"train_loss": -11.134475708007812, "global_step": 204649, "epoch": 1218} {"train_loss": -10.99552059173584, "global_step": 204650, "epoch": 1218} {"train_loss": -11.022754669189453, "global_step": 204651, "epoch": 1218} {"train_loss": -11.537927627563477, "global_step": 204652, "epoch": 1218} {"train_loss": -11.422872543334961, "global_step": 204653, "epoch": 1218} {"train_loss": -11.307775497436523, "global_step": 204654, "epoch": 1218} {"train_loss": -11.196653366088867, "global_step": 204655, "epoch": 1218} {"train_loss": -11.329938888549805, "global_step": 204656, "epoch": 1218} {"train_loss": -11.227339744567871, "global_step": 204657, "epoch": 1218} {"train_loss": -11.522811889648438, "global_step": 204658, "epoch": 1218} {"train_loss": -11.48613166809082, "global_step": 204659, "epoch": 1218} {"train_loss": -11.289334297180176, "global_step": 204660, "epoch": 1218} {"train_loss": -11.529817581176758, "global_step": 204661, "epoch": 1218} {"train_loss": -11.274898529052734, "global_step": 204662, "epoch": 1218} {"train_loss": -11.42708969116211, "global_step": 204663, "epoch": 1218} {"train_loss": -11.567867279052734, "global_step": 204664, "epoch": 1218} {"train_loss": -11.226566314697266, "global_step": 204665, "epoch": 1218} {"train_loss": -11.507360458374023, "global_step": 204666, "epoch": 1218} {"train_loss": -11.402009010314941, "global_step": 204667, "epoch": 1218} {"train_loss": -11.432397842407227, "global_step": 204668, "epoch": 1218} {"train_loss": -11.232303619384766, "global_step": 204669, "epoch": 1218} {"train_loss": -11.549829483032227, "global_step": 204670, "epoch": 1218} {"train_loss": -11.095897674560547, "global_step": 204671, "epoch": 1218} {"train_loss": -11.45371150970459, "global_step": 204672, "epoch": 1218} {"train_loss": -11.622051239013672, "global_step": 204673, "epoch": 1218} {"train_loss": -11.454036712646484, "global_step": 204674, "epoch": 1218} {"train_loss": -11.595744132995605, "global_step": 204675, "epoch": 1218} {"train_loss": -11.7444486618042, "global_step": 204676, "epoch": 1218} {"train_loss": -11.4581298828125, "global_step": 204677, "epoch": 1218} {"train_loss": -11.797607421875, "global_step": 204678, "epoch": 1218} {"train_loss": -11.366116523742676, "global_step": 204679, "epoch": 1218} {"train_loss": -11.678102493286133, "global_step": 204680, "epoch": 1218} {"train_loss": -11.496261596679688, "global_step": 204681, "epoch": 1218} {"train_loss": -11.34939193725586, "global_step": 204682, "epoch": 1218} {"train_loss": -11.608504295349121, "global_step": 204683, "epoch": 1218} {"train_loss": -11.638364791870117, "global_step": 204684, "epoch": 1218} {"train_loss": -11.706049919128418, "global_step": 204685, "epoch": 1218} {"train_loss": -11.655891418457031, "global_step": 204686, "epoch": 1218} {"train_loss": -11.79787540435791, "global_step": 204687, "epoch": 1218} {"train_loss": -11.672889709472656, "global_step": 204688, "epoch": 1218} {"train_loss": -11.769336700439453, "global_step": 204689, "epoch": 1218} {"train_loss": -11.753687858581543, "global_step": 204690, "epoch": 1218} {"train_loss": -11.942808151245117, "global_step": 204691, "epoch": 1218} {"train_loss": -11.587111473083496, "global_step": 204692, "epoch": 1218} {"train_loss": -11.732734680175781, "global_step": 204693, "epoch": 1218} {"train_loss": -11.788357734680176, "global_step": 204694, "epoch": 1218} {"train_loss": -11.742891311645508, "global_step": 204695, "epoch": 1218} {"train_loss": -11.714670181274414, "global_step": 204696, "epoch": 1218} {"train_loss": -11.655786514282227, "global_step": 204697, "epoch": 1218} {"train_loss": -11.430909156799316, "global_step": 204698, "epoch": 1218} {"train_loss": -11.30733585357666, "global_step": 204699, "epoch": 1218} {"train_loss": -11.56234073638916, "global_step": 204700, "epoch": 1218} {"train_loss": -11.865440368652344, "global_step": 204701, "epoch": 1218} {"train_loss": -11.42219066619873, "global_step": 204702, "epoch": 1218} {"train_loss": -11.91067886352539, "global_step": 204703, "epoch": 1218} {"train_loss": -11.211711883544922, "global_step": 204704, "epoch": 1218} {"train_loss": -11.720952987670898, "global_step": 204705, "epoch": 1218} {"train_loss": -11.550230979919434, "global_step": 204706, "epoch": 1218} {"train_loss": -11.668231964111328, "global_step": 204707, "epoch": 1218} {"train_loss": -11.3795804977417, "global_step": 204708, "epoch": 1218} {"train_loss": -11.457704544067383, "global_step": 204709, "epoch": 1218} {"train_loss": -11.842806816101074, "global_step": 204710, "epoch": 1218} {"train_loss": -11.661149978637695, "global_step": 204711, "epoch": 1218} {"train_loss": -11.268580436706543, "global_step": 204712, "epoch": 1218} {"train_loss": -11.481636047363281, "global_step": 204713, "epoch": 1218} {"train_loss": -11.518134117126465, "global_step": 204714, "epoch": 1218} {"train_loss": -11.710272789001465, "global_step": 204715, "epoch": 1218} {"train_loss": -11.167679786682129, "global_step": 204716, "epoch": 1218} {"train_loss": -11.592493057250977, "global_step": 204717, "epoch": 1218} {"train_loss": -11.500576972961426, "global_step": 204718, "epoch": 1218} {"train_loss": -11.609469413757324, "global_step": 204719, "epoch": 1218} {"train_loss": -11.407928466796875, "global_step": 204720, "epoch": 1218} {"train_loss": -11.515792846679688, "global_step": 204721, "epoch": 1218} {"train_loss": -11.606285095214844, "global_step": 204722, "epoch": 1218} {"train_loss": -11.390578269958496, "global_step": 204723, "epoch": 1218} {"train_loss": -11.535818099975586, "global_step": 204724, "epoch": 1218} {"train_loss": -11.64677619934082, "global_step": 204725, "epoch": 1218} {"train_loss": -11.855691909790039, "global_step": 204726, "epoch": 1218} {"train_loss": -11.679210662841797, "global_step": 204727, "epoch": 1218} {"train_loss": -11.516818046569824, "global_step": 204728, "epoch": 1218} {"train_loss": -11.627779006958008, "global_step": 204729, "epoch": 1218} {"train_loss": -11.398340225219727, "global_step": 204730, "epoch": 1218} {"train_loss": -11.456281661987305, "global_step": 204731, "epoch": 1218} {"train_loss": -11.558893203735352, "global_step": 204732, "epoch": 1218} {"train_loss": -11.548662185668945, "global_step": 204733, "epoch": 1218} {"train_loss": -11.38672161102295, "global_step": 204734, "epoch": 1218} {"train_loss": -11.428370475769043, "global_step": 204735, "epoch": 1218} {"train_loss": -11.490585327148438, "global_step": 204736, "epoch": 1218} {"train_loss": -11.590660095214844, "global_step": 204737, "epoch": 1218} {"train_loss": -11.664316177368164, "global_step": 204738, "epoch": 1218} {"train_loss": -11.439019203186035, "global_step": 204739, "epoch": 1218} {"train_loss": -11.178544044494629, "global_step": 204740, "epoch": 1218} {"train_loss": -11.017965316772461, "global_step": 204741, "epoch": 1218} {"train_loss": -10.483564376831055, "global_step": 204742, "epoch": 1218} {"train_loss": -11.381546020507812, "global_step": 204743, "epoch": 1218} {"train_loss": -10.713628768920898, "global_step": 204744, "epoch": 1218} {"train_loss": -11.104883193969727, "global_step": 204745, "epoch": 1218} {"train_loss": -10.825735092163086, "global_step": 204746, "epoch": 1218} {"train_loss": -10.223469734191895, "global_step": 204747, "epoch": 1218} {"train_loss": -9.880484580993652, "global_step": 204748, "epoch": 1218} {"train_loss": -10.291407585144043, "global_step": 204749, "epoch": 1218} {"train_loss": -9.706098556518555, "global_step": 204750, "epoch": 1218} {"train_loss": -10.668798446655273, "global_step": 204751, "epoch": 1218} {"train_loss": -10.989087104797363, "global_step": 204752, "epoch": 1218} {"train_loss": -10.013631820678711, "global_step": 204753, "epoch": 1218} {"train_loss": -11.318506240844727, "global_step": 204754, "epoch": 1218} {"train_loss": -10.296550750732422, "global_step": 204755, "epoch": 1218} {"train_loss": -11.119657516479492, "global_step": 204756, "epoch": 1218} {"train_loss": -10.595185279846191, "global_step": 204757, "epoch": 1218} {"train_loss": -10.009855270385742, "global_step": 204758, "epoch": 1218} {"train_loss": -11.023691177368164, "global_step": 204759, "epoch": 1218} {"train_loss": -10.034845352172852, "global_step": 204760, "epoch": 1218} {"train_loss": -10.87535285949707, "global_step": 204761, "epoch": 1218} {"train_loss": -10.216262817382812, "global_step": 204762, "epoch": 1218} {"train_loss": -10.690231323242188, "global_step": 204763, "epoch": 1218} {"train_loss": -10.47199821472168, "global_step": 204764, "epoch": 1218} {"train_loss": -10.21353816986084, "global_step": 204765, "epoch": 1218} {"train_loss": -10.739044189453125, "global_step": 204766, "epoch": 1218} {"train_loss": -10.359258651733398, "global_step": 204767, "epoch": 1218} {"train_loss": -10.84892463684082, "global_step": 204768, "epoch": 1218} {"train_loss": -10.26829719543457, "global_step": 204769, "epoch": 1218} {"train_loss": -10.400854110717773, "global_step": 204770, "epoch": 1218} {"train_loss": -10.318838119506836, "global_step": 204771, "epoch": 1218} {"train_loss": -10.606180191040039, "global_step": 204772, "epoch": 1218} {"train_loss": -10.544351577758789, "global_step": 204773, "epoch": 1218} {"train_loss": -11.069644927978516, "global_step": 204774, "epoch": 1218} {"train_loss": -10.439390182495117, "global_step": 204775, "epoch": 1218} {"train_loss": -10.274995803833008, "global_step": 204776, "epoch": 1218} {"train_loss": -10.48249626159668, "global_step": 204777, "epoch": 1218} {"train_loss": -10.635785102844238, "global_step": 204778, "epoch": 1218} {"train_loss": -10.741312026977539, "global_step": 204779, "epoch": 1218} {"train_loss": -10.640079498291016, "global_step": 204780, "epoch": 1218} {"train_loss": -10.68243408203125, "global_step": 204781, "epoch": 1218} {"train_loss": -10.596981048583984, "global_step": 204782, "epoch": 1218} {"train_loss": -11.252092361450195, "global_step": 204783, "epoch": 1218} {"train_loss": -10.508411407470703, "global_step": 204784, "epoch": 1218} {"train_loss": -11.082818984985352, "global_step": 204785, "epoch": 1218} {"train_loss": -10.870809555053711, "global_step": 204786, "epoch": 1218} {"train_loss": -10.838679313659668, "global_step": 204787, "epoch": 1218} {"train_loss": -10.920463562011719, "global_step": 204788, "epoch": 1218} {"train_loss": -11.18476676940918, "global_step": 204789, "epoch": 1218} {"train_loss": -10.951272964477539, "global_step": 204790, "epoch": 1218} {"train_loss": -11.136819646472023, "global_step": 204791, "epoch": 1218, "val_loss": 254118.390625} {"train_loss": -11.175372123718262, "global_step": 204792, "epoch": 1219} {"train_loss": -10.528280258178711, "global_step": 204793, "epoch": 1219} {"train_loss": -11.365556716918945, "global_step": 204794, "epoch": 1219} {"train_loss": -10.503952980041504, "global_step": 204795, "epoch": 1219} {"train_loss": -11.25717830657959, "global_step": 204796, "epoch": 1219} {"train_loss": -10.854246139526367, "global_step": 204797, "epoch": 1219} {"train_loss": -11.250577926635742, "global_step": 204798, "epoch": 1219} {"train_loss": -10.888836860656738, "global_step": 204799, "epoch": 1219} {"train_loss": -11.048919677734375, "global_step": 204800, "epoch": 1219} {"train_loss": -11.41702651977539, "global_step": 204801, "epoch": 1219} {"train_loss": -10.982001304626465, "global_step": 204802, "epoch": 1219} {"train_loss": -11.167400360107422, "global_step": 204803, "epoch": 1219} {"train_loss": -11.383895874023438, "global_step": 204804, "epoch": 1219} {"train_loss": -11.264391899108887, "global_step": 204805, "epoch": 1219} {"train_loss": -11.24370002746582, "global_step": 204806, "epoch": 1219} {"train_loss": -11.46243953704834, "global_step": 204807, "epoch": 1219} {"train_loss": -11.348822593688965, "global_step": 204808, "epoch": 1219} {"train_loss": -11.239482879638672, "global_step": 204809, "epoch": 1219} {"train_loss": -11.453327178955078, "global_step": 204810, "epoch": 1219} {"train_loss": -11.24726676940918, "global_step": 204811, "epoch": 1219} {"train_loss": -11.468729019165039, "global_step": 204812, "epoch": 1219} {"train_loss": -11.522954940795898, "global_step": 204813, "epoch": 1219} {"train_loss": -11.528923988342285, "global_step": 204814, "epoch": 1219} {"train_loss": -11.53119945526123, "global_step": 204815, "epoch": 1219} {"train_loss": -11.760519981384277, "global_step": 204816, "epoch": 1219} {"train_loss": -11.618045806884766, "global_step": 204817, "epoch": 1219} {"train_loss": -11.633291244506836, "global_step": 204818, "epoch": 1219} {"train_loss": -11.446432113647461, "global_step": 204819, "epoch": 1219} {"train_loss": -11.613191604614258, "global_step": 204820, "epoch": 1219} {"train_loss": -11.705826759338379, "global_step": 204821, "epoch": 1219} {"train_loss": -11.515827178955078, "global_step": 204822, "epoch": 1219} {"train_loss": -11.70461654663086, "global_step": 204823, "epoch": 1219} {"train_loss": -11.669981956481934, "global_step": 204824, "epoch": 1219} {"train_loss": -11.43549919128418, "global_step": 204825, "epoch": 1219} {"train_loss": -11.664253234863281, "global_step": 204826, "epoch": 1219} {"train_loss": -11.692286491394043, "global_step": 204827, "epoch": 1219} {"train_loss": -11.627212524414062, "global_step": 204828, "epoch": 1219} {"train_loss": -11.674644470214844, "global_step": 204829, "epoch": 1219} {"train_loss": -11.698831558227539, "global_step": 204830, "epoch": 1219} {"train_loss": -11.530795097351074, "global_step": 204831, "epoch": 1219} {"train_loss": -11.574041366577148, "global_step": 204832, "epoch": 1219} {"train_loss": -11.586444854736328, "global_step": 204833, "epoch": 1219} {"train_loss": -11.728118896484375, "global_step": 204834, "epoch": 1219} {"train_loss": -11.695255279541016, "global_step": 204835, "epoch": 1219} {"train_loss": -11.415462493896484, "global_step": 204836, "epoch": 1219} {"train_loss": -11.684860229492188, "global_step": 204837, "epoch": 1219} {"train_loss": -11.741752624511719, "global_step": 204838, "epoch": 1219} {"train_loss": -11.512454986572266, "global_step": 204839, "epoch": 1219} {"train_loss": -11.790901184082031, "global_step": 204840, "epoch": 1219} {"train_loss": -11.83145523071289, "global_step": 204841, "epoch": 1219} {"train_loss": -11.668224334716797, "global_step": 204842, "epoch": 1219} {"train_loss": -11.543481826782227, "global_step": 204843, "epoch": 1219} {"train_loss": -11.533014297485352, "global_step": 204844, "epoch": 1219} {"train_loss": -11.701725006103516, "global_step": 204845, "epoch": 1219} {"train_loss": -11.7705078125, "global_step": 204846, "epoch": 1219} {"train_loss": -11.952899932861328, "global_step": 204847, "epoch": 1219} {"train_loss": -11.920202255249023, "global_step": 204848, "epoch": 1219} {"train_loss": -11.839747428894043, "global_step": 204849, "epoch": 1219} {"train_loss": -11.781021118164062, "global_step": 204850, "epoch": 1219} {"train_loss": -11.913423538208008, "global_step": 204851, "epoch": 1219} {"train_loss": -11.779045104980469, "global_step": 204852, "epoch": 1219} {"train_loss": -11.989656448364258, "global_step": 204853, "epoch": 1219} {"train_loss": -11.78320598602295, "global_step": 204854, "epoch": 1219} {"train_loss": -11.755382537841797, "global_step": 204855, "epoch": 1219} {"train_loss": -11.785796165466309, "global_step": 204856, "epoch": 1219} {"train_loss": -11.932769775390625, "global_step": 204857, "epoch": 1219} {"train_loss": -11.630193710327148, "global_step": 204858, "epoch": 1219} {"train_loss": -11.801738739013672, "global_step": 204859, "epoch": 1219} {"train_loss": -11.623807907104492, "global_step": 204860, "epoch": 1219} {"train_loss": -11.212297439575195, "global_step": 204861, "epoch": 1219} {"train_loss": -11.300748825073242, "global_step": 204862, "epoch": 1219} {"train_loss": -11.510151863098145, "global_step": 204863, "epoch": 1219} {"train_loss": -11.660511016845703, "global_step": 204864, "epoch": 1219} {"train_loss": -11.806203842163086, "global_step": 204865, "epoch": 1219} {"train_loss": -11.564011573791504, "global_step": 204866, "epoch": 1219} {"train_loss": -11.801645278930664, "global_step": 204867, "epoch": 1219} {"train_loss": -11.453170776367188, "global_step": 204868, "epoch": 1219} {"train_loss": -11.162397384643555, "global_step": 204869, "epoch": 1219} {"train_loss": -11.25277042388916, "global_step": 204870, "epoch": 1219} {"train_loss": -11.799177169799805, "global_step": 204871, "epoch": 1219} {"train_loss": -11.976371765136719, "global_step": 204872, "epoch": 1219} {"train_loss": -11.594406127929688, "global_step": 204873, "epoch": 1219} {"train_loss": -11.572200775146484, "global_step": 204874, "epoch": 1219} {"train_loss": -10.865869522094727, "global_step": 204875, "epoch": 1219} {"train_loss": -11.413307189941406, "global_step": 204876, "epoch": 1219} {"train_loss": -11.469635009765625, "global_step": 204877, "epoch": 1219} {"train_loss": -11.385380744934082, "global_step": 204878, "epoch": 1219} {"train_loss": -11.545936584472656, "global_step": 204879, "epoch": 1219} {"train_loss": -11.303040504455566, "global_step": 204880, "epoch": 1219} {"train_loss": -11.697690963745117, "global_step": 204881, "epoch": 1219} {"train_loss": -11.464456558227539, "global_step": 204882, "epoch": 1219} {"train_loss": -11.533031463623047, "global_step": 204883, "epoch": 1219} {"train_loss": -11.428760528564453, "global_step": 204884, "epoch": 1219} {"train_loss": -11.152837753295898, "global_step": 204885, "epoch": 1219} {"train_loss": -11.680747985839844, "global_step": 204886, "epoch": 1219} {"train_loss": -11.287981033325195, "global_step": 204887, "epoch": 1219} {"train_loss": -11.511006355285645, "global_step": 204888, "epoch": 1219} {"train_loss": -11.205726623535156, "global_step": 204889, "epoch": 1219} {"train_loss": -11.339412689208984, "global_step": 204890, "epoch": 1219} {"train_loss": -11.216399192810059, "global_step": 204891, "epoch": 1219} {"train_loss": -10.981480598449707, "global_step": 204892, "epoch": 1219} {"train_loss": -11.411870956420898, "global_step": 204893, "epoch": 1219} {"train_loss": -10.670299530029297, "global_step": 204894, "epoch": 1219} {"train_loss": -10.785028457641602, "global_step": 204895, "epoch": 1219} {"train_loss": -10.935983657836914, "global_step": 204896, "epoch": 1219} {"train_loss": -11.030753135681152, "global_step": 204897, "epoch": 1219} {"train_loss": -11.014619827270508, "global_step": 204898, "epoch": 1219} {"train_loss": -10.529170036315918, "global_step": 204899, "epoch": 1219} {"train_loss": -10.264890670776367, "global_step": 204900, "epoch": 1219} {"train_loss": -9.449748992919922, "global_step": 204901, "epoch": 1219} {"train_loss": -9.420166015625, "global_step": 204902, "epoch": 1219} {"train_loss": -10.646339416503906, "global_step": 204903, "epoch": 1219} {"train_loss": -9.017412185668945, "global_step": 204904, "epoch": 1219} {"train_loss": -9.206757545471191, "global_step": 204905, "epoch": 1219} {"train_loss": -10.44516658782959, "global_step": 204906, "epoch": 1219} {"train_loss": -9.594118118286133, "global_step": 204907, "epoch": 1219} {"train_loss": -10.500261306762695, "global_step": 204908, "epoch": 1219} {"train_loss": -10.106636047363281, "global_step": 204909, "epoch": 1219} {"train_loss": -10.554628372192383, "global_step": 204910, "epoch": 1219} {"train_loss": -9.318887710571289, "global_step": 204911, "epoch": 1219} {"train_loss": -10.929943084716797, "global_step": 204912, "epoch": 1219} {"train_loss": -8.72134780883789, "global_step": 204913, "epoch": 1219} {"train_loss": -11.289546966552734, "global_step": 204914, "epoch": 1219} {"train_loss": -9.224201202392578, "global_step": 204915, "epoch": 1219} {"train_loss": -10.538533210754395, "global_step": 204916, "epoch": 1219} {"train_loss": -10.438398361206055, "global_step": 204917, "epoch": 1219} {"train_loss": -10.92357349395752, "global_step": 204918, "epoch": 1219} {"train_loss": -10.95355224609375, "global_step": 204919, "epoch": 1219} {"train_loss": -9.55077075958252, "global_step": 204920, "epoch": 1219} {"train_loss": -10.914573669433594, "global_step": 204921, "epoch": 1219} {"train_loss": -10.332038879394531, "global_step": 204922, "epoch": 1219} {"train_loss": -9.847391128540039, "global_step": 204923, "epoch": 1219} {"train_loss": -11.129212379455566, "global_step": 204924, "epoch": 1219} {"train_loss": -10.408498764038086, "global_step": 204925, "epoch": 1219} {"train_loss": -10.59377670288086, "global_step": 204926, "epoch": 1219} {"train_loss": -10.348816871643066, "global_step": 204927, "epoch": 1219} {"train_loss": -10.979686737060547, "global_step": 204928, "epoch": 1219} {"train_loss": -10.527636528015137, "global_step": 204929, "epoch": 1219} {"train_loss": -11.20565414428711, "global_step": 204930, "epoch": 1219} {"train_loss": -10.893121719360352, "global_step": 204931, "epoch": 1219} {"train_loss": -10.942992210388184, "global_step": 204932, "epoch": 1219} {"train_loss": -10.732294082641602, "global_step": 204933, "epoch": 1219} {"train_loss": -10.46977424621582, "global_step": 204934, "epoch": 1219} {"train_loss": -11.273284912109375, "global_step": 204935, "epoch": 1219} {"train_loss": -10.9083251953125, "global_step": 204936, "epoch": 1219} {"train_loss": -11.254283905029297, "global_step": 204937, "epoch": 1219} {"train_loss": -10.888179779052734, "global_step": 204938, "epoch": 1219} {"train_loss": -10.574695587158203, "global_step": 204939, "epoch": 1219} {"train_loss": -11.02371597290039, "global_step": 204940, "epoch": 1219} {"train_loss": -10.816265106201172, "global_step": 204941, "epoch": 1219} {"train_loss": -11.02078628540039, "global_step": 204942, "epoch": 1219} {"train_loss": -11.051511764526367, "global_step": 204943, "epoch": 1219} {"train_loss": -11.050887107849121, "global_step": 204944, "epoch": 1219} {"train_loss": -11.218826293945312, "global_step": 204945, "epoch": 1219} {"train_loss": -11.159473419189453, "global_step": 204946, "epoch": 1219} {"train_loss": -11.263291358947754, "global_step": 204947, "epoch": 1219} {"train_loss": -11.224411010742188, "global_step": 204948, "epoch": 1219} {"train_loss": -11.154314041137695, "global_step": 204949, "epoch": 1219} {"train_loss": -11.336629867553711, "global_step": 204950, "epoch": 1219} {"train_loss": -10.989352226257324, "global_step": 204951, "epoch": 1219} {"train_loss": -11.27411937713623, "global_step": 204952, "epoch": 1219} {"train_loss": -11.18562126159668, "global_step": 204953, "epoch": 1219} {"train_loss": -11.25810432434082, "global_step": 204954, "epoch": 1219} {"train_loss": -11.310588836669922, "global_step": 204955, "epoch": 1219} {"train_loss": -11.314051628112793, "global_step": 204956, "epoch": 1219} {"train_loss": -11.349071502685547, "global_step": 204957, "epoch": 1219} {"train_loss": -11.46137809753418, "global_step": 204958, "epoch": 1219} {"train_loss": -11.172384347234454, "global_step": 204959, "epoch": 1219, "val_loss": 247082.859375} {"train_loss": -11.447973251342773, "global_step": 204960, "epoch": 1220} {"train_loss": -11.500733375549316, "global_step": 204961, "epoch": 1220} {"train_loss": -11.411632537841797, "global_step": 204962, "epoch": 1220} {"train_loss": -11.482744216918945, "global_step": 204963, "epoch": 1220} {"train_loss": -11.334095001220703, "global_step": 204964, "epoch": 1220} {"train_loss": -11.478528022766113, "global_step": 204965, "epoch": 1220} {"train_loss": -11.433260917663574, "global_step": 204966, "epoch": 1220} {"train_loss": -11.50079345703125, "global_step": 204967, "epoch": 1220} {"train_loss": -11.555215835571289, "global_step": 204968, "epoch": 1220} {"train_loss": -11.178937911987305, "global_step": 204969, "epoch": 1220} {"train_loss": -11.426386833190918, "global_step": 204970, "epoch": 1220} {"train_loss": -11.259572982788086, "global_step": 204971, "epoch": 1220} {"train_loss": -11.141838073730469, "global_step": 204972, "epoch": 1220} {"train_loss": -11.455682754516602, "global_step": 204973, "epoch": 1220} {"train_loss": -11.142542839050293, "global_step": 204974, "epoch": 1220} {"train_loss": -11.589325904846191, "global_step": 204975, "epoch": 1220} {"train_loss": -11.486071586608887, "global_step": 204976, "epoch": 1220} {"train_loss": -11.622722625732422, "global_step": 204977, "epoch": 1220} {"train_loss": -11.419639587402344, "global_step": 204978, "epoch": 1220} {"train_loss": -11.602588653564453, "global_step": 204979, "epoch": 1220} {"train_loss": -11.56985092163086, "global_step": 204980, "epoch": 1220} {"train_loss": -11.323169708251953, "global_step": 204981, "epoch": 1220} {"train_loss": -11.665063858032227, "global_step": 204982, "epoch": 1220} {"train_loss": -11.626415252685547, "global_step": 204983, "epoch": 1220} {"train_loss": -11.651280403137207, "global_step": 204984, "epoch": 1220} {"train_loss": -11.647850036621094, "global_step": 204985, "epoch": 1220} {"train_loss": -11.672219276428223, "global_step": 204986, "epoch": 1220} {"train_loss": -11.753154754638672, "global_step": 204987, "epoch": 1220} {"train_loss": -11.596536636352539, "global_step": 204988, "epoch": 1220} {"train_loss": -11.60673713684082, "global_step": 204989, "epoch": 1220} {"train_loss": -11.750702857971191, "global_step": 204990, "epoch": 1220} {"train_loss": -11.778475761413574, "global_step": 204991, "epoch": 1220} {"train_loss": -11.772153854370117, "global_step": 204992, "epoch": 1220} {"train_loss": -11.624631881713867, "global_step": 204993, "epoch": 1220} {"train_loss": -11.55312442779541, "global_step": 204994, "epoch": 1220} {"train_loss": -11.518714904785156, "global_step": 204995, "epoch": 1220} {"train_loss": -11.697198867797852, "global_step": 204996, "epoch": 1220} {"train_loss": -11.74437141418457, "global_step": 204997, "epoch": 1220} {"train_loss": -11.813838958740234, "global_step": 204998, "epoch": 1220} {"train_loss": -11.674657821655273, "global_step": 204999, "epoch": 1220} {"train_loss": -11.891080856323242, "global_step": 205000, "epoch": 1220} {"train_loss": -11.856073379516602, "global_step": 205001, "epoch": 1220} {"train_loss": -12.002655982971191, "global_step": 205002, "epoch": 1220} {"train_loss": -11.748220443725586, "global_step": 205003, "epoch": 1220} {"train_loss": -11.703434944152832, "global_step": 205004, "epoch": 1220} {"train_loss": -11.825681686401367, "global_step": 205005, "epoch": 1220} {"train_loss": -11.731915473937988, "global_step": 205006, "epoch": 1220} {"train_loss": -11.878875732421875, "global_step": 205007, "epoch": 1220} {"train_loss": -11.799026489257812, "global_step": 205008, "epoch": 1220} {"train_loss": -11.972380638122559, "global_step": 205009, "epoch": 1220} {"train_loss": -11.625935554504395, "global_step": 205010, "epoch": 1220} {"train_loss": -12.062509536743164, "global_step": 205011, "epoch": 1220} {"train_loss": -11.872669219970703, "global_step": 205012, "epoch": 1220} {"train_loss": -11.71268081665039, "global_step": 205013, "epoch": 1220} {"train_loss": -11.343594551086426, "global_step": 205014, "epoch": 1220} {"train_loss": -11.281916618347168, "global_step": 205015, "epoch": 1220} {"train_loss": -11.028377532958984, "global_step": 205016, "epoch": 1220} {"train_loss": -11.66763687133789, "global_step": 205017, "epoch": 1220} {"train_loss": -11.063985824584961, "global_step": 205018, "epoch": 1220} {"train_loss": -10.726926803588867, "global_step": 205019, "epoch": 1220} {"train_loss": -9.8630952835083, "global_step": 205020, "epoch": 1220} {"train_loss": -9.81527328491211, "global_step": 205021, "epoch": 1220} {"train_loss": -9.954446792602539, "global_step": 205022, "epoch": 1220} {"train_loss": -8.505605697631836, "global_step": 205023, "epoch": 1220} {"train_loss": -9.931475639343262, "global_step": 205024, "epoch": 1220} {"train_loss": -11.103937149047852, "global_step": 205025, "epoch": 1220} {"train_loss": -8.232746124267578, "global_step": 205026, "epoch": 1220} {"train_loss": -10.05348014831543, "global_step": 205027, "epoch": 1220} {"train_loss": -8.10446548461914, "global_step": 205028, "epoch": 1220} {"train_loss": -9.580915451049805, "global_step": 205029, "epoch": 1220} {"train_loss": -7.786673545837402, "global_step": 205030, "epoch": 1220} {"train_loss": -9.460124969482422, "global_step": 205031, "epoch": 1220} {"train_loss": -8.037758827209473, "global_step": 205032, "epoch": 1220} {"train_loss": -10.253650665283203, "global_step": 205033, "epoch": 1220} {"train_loss": -9.259469985961914, "global_step": 205034, "epoch": 1220} {"train_loss": -11.044893264770508, "global_step": 205035, "epoch": 1220} {"train_loss": -8.87512493133545, "global_step": 205036, "epoch": 1220} {"train_loss": -10.020020484924316, "global_step": 205037, "epoch": 1220} {"train_loss": -9.932771682739258, "global_step": 205038, "epoch": 1220} {"train_loss": -9.549860000610352, "global_step": 205039, "epoch": 1220} {"train_loss": -9.789728164672852, "global_step": 205040, "epoch": 1220} {"train_loss": -10.429911613464355, "global_step": 205041, "epoch": 1220} {"train_loss": -9.929603576660156, "global_step": 205042, "epoch": 1220} {"train_loss": -10.400147438049316, "global_step": 205043, "epoch": 1220} {"train_loss": -10.448637962341309, "global_step": 205044, "epoch": 1220} {"train_loss": -10.608555793762207, "global_step": 205045, "epoch": 1220} {"train_loss": -10.46875, "global_step": 205046, "epoch": 1220} {"train_loss": -10.318039894104004, "global_step": 205047, "epoch": 1220} {"train_loss": -10.194690704345703, "global_step": 205048, "epoch": 1220} {"train_loss": -10.385416984558105, "global_step": 205049, "epoch": 1220} {"train_loss": -10.699848175048828, "global_step": 205050, "epoch": 1220} {"train_loss": -10.551679611206055, "global_step": 205051, "epoch": 1220} {"train_loss": -10.488183975219727, "global_step": 205052, "epoch": 1220} {"train_loss": -10.743645668029785, "global_step": 205053, "epoch": 1220} {"train_loss": -10.960943222045898, "global_step": 205054, "epoch": 1220} {"train_loss": -10.84922981262207, "global_step": 205055, "epoch": 1220} {"train_loss": -10.610689163208008, "global_step": 205056, "epoch": 1220} {"train_loss": -11.017416954040527, "global_step": 205057, "epoch": 1220} {"train_loss": -11.105432510375977, "global_step": 205058, "epoch": 1220} {"train_loss": -10.791534423828125, "global_step": 205059, "epoch": 1220} {"train_loss": -11.306099891662598, "global_step": 205060, "epoch": 1220} {"train_loss": -11.205498695373535, "global_step": 205061, "epoch": 1220} {"train_loss": -10.769309043884277, "global_step": 205062, "epoch": 1220} {"train_loss": -10.85875415802002, "global_step": 205063, "epoch": 1220} {"train_loss": -11.208157539367676, "global_step": 205064, "epoch": 1220} {"train_loss": -11.031015396118164, "global_step": 205065, "epoch": 1220} {"train_loss": -11.008014678955078, "global_step": 205066, "epoch": 1220} {"train_loss": -11.220192909240723, "global_step": 205067, "epoch": 1220} {"train_loss": -11.29039478302002, "global_step": 205068, "epoch": 1220} {"train_loss": -11.111734390258789, "global_step": 205069, "epoch": 1220} {"train_loss": -11.056926727294922, "global_step": 205070, "epoch": 1220} {"train_loss": -10.93372917175293, "global_step": 205071, "epoch": 1220} {"train_loss": -11.181535720825195, "global_step": 205072, "epoch": 1220} {"train_loss": -11.130634307861328, "global_step": 205073, "epoch": 1220} {"train_loss": -11.348150253295898, "global_step": 205074, "epoch": 1220} {"train_loss": -11.369561195373535, "global_step": 205075, "epoch": 1220} {"train_loss": -11.042031288146973, "global_step": 205076, "epoch": 1220} {"train_loss": -11.145041465759277, "global_step": 205077, "epoch": 1220} {"train_loss": -11.372726440429688, "global_step": 205078, "epoch": 1220} {"train_loss": -11.23337173461914, "global_step": 205079, "epoch": 1220} {"train_loss": -11.34614086151123, "global_step": 205080, "epoch": 1220} {"train_loss": -11.203512191772461, "global_step": 205081, "epoch": 1220} {"train_loss": -11.277416229248047, "global_step": 205082, "epoch": 1220} {"train_loss": -11.260869979858398, "global_step": 205083, "epoch": 1220} {"train_loss": -11.60635757446289, "global_step": 205084, "epoch": 1220} {"train_loss": -11.333148956298828, "global_step": 205085, "epoch": 1220} {"train_loss": -11.30704402923584, "global_step": 205086, "epoch": 1220} {"train_loss": -11.492609977722168, "global_step": 205087, "epoch": 1220} {"train_loss": -11.472359657287598, "global_step": 205088, "epoch": 1220} {"train_loss": -11.546843528747559, "global_step": 205089, "epoch": 1220} {"train_loss": -11.644269943237305, "global_step": 205090, "epoch": 1220} {"train_loss": -11.774208068847656, "global_step": 205091, "epoch": 1220} {"train_loss": -11.575538635253906, "global_step": 205092, "epoch": 1220} {"train_loss": -11.458377838134766, "global_step": 205093, "epoch": 1220} {"train_loss": -11.52595329284668, "global_step": 205094, "epoch": 1220} {"train_loss": -11.670747756958008, "global_step": 205095, "epoch": 1220} {"train_loss": -11.757027626037598, "global_step": 205096, "epoch": 1220} {"train_loss": -11.587970733642578, "global_step": 205097, "epoch": 1220} {"train_loss": -11.573159217834473, "global_step": 205098, "epoch": 1220} {"train_loss": -11.843634605407715, "global_step": 205099, "epoch": 1220} {"train_loss": -11.806242942810059, "global_step": 205100, "epoch": 1220} {"train_loss": -11.539164543151855, "global_step": 205101, "epoch": 1220} {"train_loss": -11.601237297058105, "global_step": 205102, "epoch": 1220} {"train_loss": -11.662572860717773, "global_step": 205103, "epoch": 1220} {"train_loss": -11.71939468383789, "global_step": 205104, "epoch": 1220} {"train_loss": -11.753148078918457, "global_step": 205105, "epoch": 1220} {"train_loss": -11.646516799926758, "global_step": 205106, "epoch": 1220} {"train_loss": -11.64027214050293, "global_step": 205107, "epoch": 1220} {"train_loss": -11.84200668334961, "global_step": 205108, "epoch": 1220} {"train_loss": -11.835420608520508, "global_step": 205109, "epoch": 1220} {"train_loss": -11.698196411132812, "global_step": 205110, "epoch": 1220} {"train_loss": -11.898720741271973, "global_step": 205111, "epoch": 1220} {"train_loss": -11.702896118164062, "global_step": 205112, "epoch": 1220} {"train_loss": -11.741275787353516, "global_step": 205113, "epoch": 1220} {"train_loss": -11.770831108093262, "global_step": 205114, "epoch": 1220} {"train_loss": -11.857568740844727, "global_step": 205115, "epoch": 1220} {"train_loss": -11.793136596679688, "global_step": 205116, "epoch": 1220} {"train_loss": -11.759620666503906, "global_step": 205117, "epoch": 1220} {"train_loss": -11.752959251403809, "global_step": 205118, "epoch": 1220} {"train_loss": -11.991628646850586, "global_step": 205119, "epoch": 1220} {"train_loss": -11.59543228149414, "global_step": 205120, "epoch": 1220} {"train_loss": -11.77509880065918, "global_step": 205121, "epoch": 1220} {"train_loss": -11.534607887268066, "global_step": 205122, "epoch": 1220} {"train_loss": -11.93935775756836, "global_step": 205123, "epoch": 1220} {"train_loss": -11.841913223266602, "global_step": 205124, "epoch": 1220} {"train_loss": -11.577816009521484, "global_step": 205125, "epoch": 1220} {"train_loss": -11.827901840209961, "global_step": 205126, "epoch": 1220} {"train_loss": -11.168890708968753, "global_step": 205127, "epoch": 1220, "val_loss": 251097.609375, "train_action_mse_error": 0.11166833341121674} {"train_loss": -11.403608322143555, "global_step": 205128, "epoch": 1221} {"train_loss": -11.668441772460938, "global_step": 205129, "epoch": 1221} {"train_loss": -12.036163330078125, "global_step": 205130, "epoch": 1221} {"train_loss": -11.36800765991211, "global_step": 205131, "epoch": 1221} {"train_loss": -10.506562232971191, "global_step": 205132, "epoch": 1221} {"train_loss": -10.404266357421875, "global_step": 205133, "epoch": 1221} {"train_loss": -10.786968231201172, "global_step": 205134, "epoch": 1221} {"train_loss": -11.05301284790039, "global_step": 205135, "epoch": 1221} {"train_loss": -8.641260147094727, "global_step": 205136, "epoch": 1221} {"train_loss": -8.928458213806152, "global_step": 205137, "epoch": 1221} {"train_loss": -9.305368423461914, "global_step": 205138, "epoch": 1221} {"train_loss": -9.134191513061523, "global_step": 205139, "epoch": 1221} {"train_loss": -8.889116287231445, "global_step": 205140, "epoch": 1221} {"train_loss": -8.876462936401367, "global_step": 205141, "epoch": 1221} {"train_loss": -10.683009147644043, "global_step": 205142, "epoch": 1221} {"train_loss": -9.123387336730957, "global_step": 205143, "epoch": 1221} {"train_loss": -9.167084693908691, "global_step": 205144, "epoch": 1221} {"train_loss": -9.804519653320312, "global_step": 205145, "epoch": 1221} {"train_loss": -9.768719673156738, "global_step": 205146, "epoch": 1221} {"train_loss": -9.88548755645752, "global_step": 205147, "epoch": 1221} {"train_loss": -9.909238815307617, "global_step": 205148, "epoch": 1221} {"train_loss": -10.18410873413086, "global_step": 205149, "epoch": 1221} {"train_loss": -9.020222663879395, "global_step": 205150, "epoch": 1221} {"train_loss": -9.990486145019531, "global_step": 205151, "epoch": 1221} {"train_loss": -9.133936882019043, "global_step": 205152, "epoch": 1221} {"train_loss": -9.736030578613281, "global_step": 205153, "epoch": 1221} {"train_loss": -8.346388816833496, "global_step": 205154, "epoch": 1221} {"train_loss": -10.087703704833984, "global_step": 205155, "epoch": 1221} {"train_loss": -9.46274185180664, "global_step": 205156, "epoch": 1221} {"train_loss": -9.568984031677246, "global_step": 205157, "epoch": 1221} {"train_loss": -10.186844825744629, "global_step": 205158, "epoch": 1221} {"train_loss": -9.918146133422852, "global_step": 205159, "epoch": 1221} {"train_loss": -10.250371932983398, "global_step": 205160, "epoch": 1221} {"train_loss": -10.03890609741211, "global_step": 205161, "epoch": 1221} {"train_loss": -10.43326187133789, "global_step": 205162, "epoch": 1221} {"train_loss": -9.682604789733887, "global_step": 205163, "epoch": 1221} {"train_loss": -10.874465942382812, "global_step": 205164, "epoch": 1221} {"train_loss": -10.57722282409668, "global_step": 205165, "epoch": 1221} {"train_loss": -10.434744834899902, "global_step": 205166, "epoch": 1221} {"train_loss": -10.934861183166504, "global_step": 205167, "epoch": 1221} {"train_loss": -10.508508682250977, "global_step": 205168, "epoch": 1221} {"train_loss": -10.61983871459961, "global_step": 205169, "epoch": 1221} {"train_loss": -10.841329574584961, "global_step": 205170, "epoch": 1221} {"train_loss": -10.919103622436523, "global_step": 205171, "epoch": 1221} {"train_loss": -11.007417678833008, "global_step": 205172, "epoch": 1221} {"train_loss": -11.038919448852539, "global_step": 205173, "epoch": 1221} {"train_loss": -10.96661376953125, "global_step": 205174, "epoch": 1221} {"train_loss": -11.185859680175781, "global_step": 205175, "epoch": 1221} {"train_loss": -11.049901008605957, "global_step": 205176, "epoch": 1221} {"train_loss": -10.842859268188477, "global_step": 205177, "epoch": 1221} {"train_loss": -11.29080581665039, "global_step": 205178, "epoch": 1221} {"train_loss": -10.913835525512695, "global_step": 205179, "epoch": 1221} {"train_loss": -11.15418529510498, "global_step": 205180, "epoch": 1221} {"train_loss": -11.179952621459961, "global_step": 205181, "epoch": 1221} {"train_loss": -11.207132339477539, "global_step": 205182, "epoch": 1221} {"train_loss": -11.335762023925781, "global_step": 205183, "epoch": 1221} {"train_loss": -11.154003143310547, "global_step": 205184, "epoch": 1221} {"train_loss": -11.30804443359375, "global_step": 205185, "epoch": 1221} {"train_loss": -11.279048919677734, "global_step": 205186, "epoch": 1221} {"train_loss": -11.171032905578613, "global_step": 205187, "epoch": 1221} {"train_loss": -11.27769660949707, "global_step": 205188, "epoch": 1221} {"train_loss": -11.395992279052734, "global_step": 205189, "epoch": 1221} {"train_loss": -11.3857421875, "global_step": 205190, "epoch": 1221} {"train_loss": -11.111364364624023, "global_step": 205191, "epoch": 1221} {"train_loss": -11.112292289733887, "global_step": 205192, "epoch": 1221} {"train_loss": -11.382984161376953, "global_step": 205193, "epoch": 1221} {"train_loss": -11.430380821228027, "global_step": 205194, "epoch": 1221} {"train_loss": -11.40161418914795, "global_step": 205195, "epoch": 1221} {"train_loss": -11.424957275390625, "global_step": 205196, "epoch": 1221} {"train_loss": -11.454792022705078, "global_step": 205197, "epoch": 1221} {"train_loss": -11.62775993347168, "global_step": 205198, "epoch": 1221} {"train_loss": -11.391383171081543, "global_step": 205199, "epoch": 1221} {"train_loss": -11.332382202148438, "global_step": 205200, "epoch": 1221} {"train_loss": -11.499812126159668, "global_step": 205201, "epoch": 1221} {"train_loss": -11.511483192443848, "global_step": 205202, "epoch": 1221} {"train_loss": -11.410022735595703, "global_step": 205203, "epoch": 1221} {"train_loss": -11.510711669921875, "global_step": 205204, "epoch": 1221} {"train_loss": -11.539745330810547, "global_step": 205205, "epoch": 1221} {"train_loss": -11.531923294067383, "global_step": 205206, "epoch": 1221} {"train_loss": -11.687826156616211, "global_step": 205207, "epoch": 1221} {"train_loss": -11.687570571899414, "global_step": 205208, "epoch": 1221} {"train_loss": -11.641398429870605, "global_step": 205209, "epoch": 1221} {"train_loss": -11.55210018157959, "global_step": 205210, "epoch": 1221} {"train_loss": -11.657551765441895, "global_step": 205211, "epoch": 1221} {"train_loss": -11.625890731811523, "global_step": 205212, "epoch": 1221} {"train_loss": -11.584802627563477, "global_step": 205213, "epoch": 1221} {"train_loss": -11.722208976745605, "global_step": 205214, "epoch": 1221} {"train_loss": -11.733646392822266, "global_step": 205215, "epoch": 1221} {"train_loss": -11.716928482055664, "global_step": 205216, "epoch": 1221} {"train_loss": -11.514612197875977, "global_step": 205217, "epoch": 1221} {"train_loss": -11.592193603515625, "global_step": 205218, "epoch": 1221} {"train_loss": -11.696824073791504, "global_step": 205219, "epoch": 1221} {"train_loss": -11.673135757446289, "global_step": 205220, "epoch": 1221} {"train_loss": -11.798212051391602, "global_step": 205221, "epoch": 1221} {"train_loss": -11.491397857666016, "global_step": 205222, "epoch": 1221} {"train_loss": -11.75576114654541, "global_step": 205223, "epoch": 1221} {"train_loss": -11.767097473144531, "global_step": 205224, "epoch": 1221} {"train_loss": -11.695854187011719, "global_step": 205225, "epoch": 1221} {"train_loss": -11.833606719970703, "global_step": 205226, "epoch": 1221} {"train_loss": -11.466968536376953, "global_step": 205227, "epoch": 1221} {"train_loss": -11.741610527038574, "global_step": 205228, "epoch": 1221} {"train_loss": -11.776413917541504, "global_step": 205229, "epoch": 1221} {"train_loss": -11.56889533996582, "global_step": 205230, "epoch": 1221} {"train_loss": -11.850240707397461, "global_step": 205231, "epoch": 1221} {"train_loss": -11.632776260375977, "global_step": 205232, "epoch": 1221} {"train_loss": -11.659523010253906, "global_step": 205233, "epoch": 1221} {"train_loss": -11.795241355895996, "global_step": 205234, "epoch": 1221} {"train_loss": -11.743185043334961, "global_step": 205235, "epoch": 1221} {"train_loss": -11.99237060546875, "global_step": 205236, "epoch": 1221} {"train_loss": -11.801408767700195, "global_step": 205237, "epoch": 1221} {"train_loss": -11.54551887512207, "global_step": 205238, "epoch": 1221} {"train_loss": -11.60125732421875, "global_step": 205239, "epoch": 1221} {"train_loss": -11.575482368469238, "global_step": 205240, "epoch": 1221} {"train_loss": -11.739455223083496, "global_step": 205241, "epoch": 1221} {"train_loss": -12.126668930053711, "global_step": 205242, "epoch": 1221} {"train_loss": -11.876251220703125, "global_step": 205243, "epoch": 1221} {"train_loss": -11.806198120117188, "global_step": 205244, "epoch": 1221} {"train_loss": -11.861024856567383, "global_step": 205245, "epoch": 1221} {"train_loss": -11.939760208129883, "global_step": 205246, "epoch": 1221} {"train_loss": -11.81132698059082, "global_step": 205247, "epoch": 1221} {"train_loss": -11.752788543701172, "global_step": 205248, "epoch": 1221} {"train_loss": -11.956194877624512, "global_step": 205249, "epoch": 1221} {"train_loss": -11.798123359680176, "global_step": 205250, "epoch": 1221} {"train_loss": -11.911332130432129, "global_step": 205251, "epoch": 1221} {"train_loss": -11.612022399902344, "global_step": 205252, "epoch": 1221} {"train_loss": -11.914044380187988, "global_step": 205253, "epoch": 1221} {"train_loss": -11.295433044433594, "global_step": 205254, "epoch": 1221} {"train_loss": -10.885602951049805, "global_step": 205255, "epoch": 1221} {"train_loss": -11.462335586547852, "global_step": 205256, "epoch": 1221} {"train_loss": -11.40119743347168, "global_step": 205257, "epoch": 1221} {"train_loss": -11.189325332641602, "global_step": 205258, "epoch": 1221} {"train_loss": -11.092718124389648, "global_step": 205259, "epoch": 1221} {"train_loss": -11.7562255859375, "global_step": 205260, "epoch": 1221} {"train_loss": -10.51333999633789, "global_step": 205261, "epoch": 1221} {"train_loss": -10.986227035522461, "global_step": 205262, "epoch": 1221} {"train_loss": -10.75611400604248, "global_step": 205263, "epoch": 1221} {"train_loss": -11.35457992553711, "global_step": 205264, "epoch": 1221} {"train_loss": -10.58005142211914, "global_step": 205265, "epoch": 1221} {"train_loss": -11.247709274291992, "global_step": 205266, "epoch": 1221} {"train_loss": -11.05712890625, "global_step": 205267, "epoch": 1221} {"train_loss": -11.16061782836914, "global_step": 205268, "epoch": 1221} {"train_loss": -11.214005470275879, "global_step": 205269, "epoch": 1221} {"train_loss": -11.538454055786133, "global_step": 205270, "epoch": 1221} {"train_loss": -10.784043312072754, "global_step": 205271, "epoch": 1221} {"train_loss": -10.677428245544434, "global_step": 205272, "epoch": 1221} {"train_loss": -10.713245391845703, "global_step": 205273, "epoch": 1221} {"train_loss": -10.981661796569824, "global_step": 205274, "epoch": 1221} {"train_loss": -10.880748748779297, "global_step": 205275, "epoch": 1221} {"train_loss": -10.592090606689453, "global_step": 205276, "epoch": 1221} {"train_loss": -9.463634490966797, "global_step": 205277, "epoch": 1221} {"train_loss": -10.56325912475586, "global_step": 205278, "epoch": 1221} {"train_loss": -9.119190216064453, "global_step": 205279, "epoch": 1221} {"train_loss": -9.344863891601562, "global_step": 205280, "epoch": 1221} {"train_loss": -9.60824966430664, "global_step": 205281, "epoch": 1221} {"train_loss": -8.929840087890625, "global_step": 205282, "epoch": 1221} {"train_loss": -7.024823188781738, "global_step": 205283, "epoch": 1221} {"train_loss": -8.520663261413574, "global_step": 205284, "epoch": 1221} {"train_loss": -8.951465606689453, "global_step": 205285, "epoch": 1221} {"train_loss": -9.6520414352417, "global_step": 205286, "epoch": 1221} {"train_loss": -8.873687744140625, "global_step": 205287, "epoch": 1221} {"train_loss": -9.533632278442383, "global_step": 205288, "epoch": 1221} {"train_loss": -9.622893333435059, "global_step": 205289, "epoch": 1221} {"train_loss": -10.829248428344727, "global_step": 205290, "epoch": 1221} {"train_loss": -10.157407760620117, "global_step": 205291, "epoch": 1221} {"train_loss": -11.006500244140625, "global_step": 205292, "epoch": 1221} {"train_loss": -10.64621353149414, "global_step": 205293, "epoch": 1221} {"train_loss": -10.52653980255127, "global_step": 205294, "epoch": 1221} {"train_loss": -10.87200525261107, "global_step": 205295, "epoch": 1221, "val_loss": 251418.90625} {"train_loss": -10.898418426513672, "global_step": 205296, "epoch": 1222} {"train_loss": -10.8466157913208, "global_step": 205297, "epoch": 1222} {"train_loss": -10.869403839111328, "global_step": 205298, "epoch": 1222} {"train_loss": -10.753934860229492, "global_step": 205299, "epoch": 1222} {"train_loss": -11.147320747375488, "global_step": 205300, "epoch": 1222} {"train_loss": -10.956782341003418, "global_step": 205301, "epoch": 1222} {"train_loss": -10.905415534973145, "global_step": 205302, "epoch": 1222} {"train_loss": -11.356681823730469, "global_step": 205303, "epoch": 1222} {"train_loss": -10.889094352722168, "global_step": 205304, "epoch": 1222} {"train_loss": -11.195270538330078, "global_step": 205305, "epoch": 1222} {"train_loss": -11.19234848022461, "global_step": 205306, "epoch": 1222} {"train_loss": -11.278345108032227, "global_step": 205307, "epoch": 1222} {"train_loss": -11.097993850708008, "global_step": 205308, "epoch": 1222} {"train_loss": -11.082376480102539, "global_step": 205309, "epoch": 1222} {"train_loss": -11.18161392211914, "global_step": 205310, "epoch": 1222} {"train_loss": -10.935721397399902, "global_step": 205311, "epoch": 1222} {"train_loss": -11.468518257141113, "global_step": 205312, "epoch": 1222} {"train_loss": -11.236410140991211, "global_step": 205313, "epoch": 1222} {"train_loss": -11.251331329345703, "global_step": 205314, "epoch": 1222} {"train_loss": -11.295045852661133, "global_step": 205315, "epoch": 1222} {"train_loss": -11.527408599853516, "global_step": 205316, "epoch": 1222} {"train_loss": -11.285579681396484, "global_step": 205317, "epoch": 1222} {"train_loss": -11.256437301635742, "global_step": 205318, "epoch": 1222} {"train_loss": -11.30504322052002, "global_step": 205319, "epoch": 1222} {"train_loss": -11.441349029541016, "global_step": 205320, "epoch": 1222} {"train_loss": -11.575462341308594, "global_step": 205321, "epoch": 1222} {"train_loss": -11.419540405273438, "global_step": 205322, "epoch": 1222} {"train_loss": -11.396295547485352, "global_step": 205323, "epoch": 1222} {"train_loss": -11.470732688903809, "global_step": 205324, "epoch": 1222} {"train_loss": -11.458972930908203, "global_step": 205325, "epoch": 1222} {"train_loss": -11.49044418334961, "global_step": 205326, "epoch": 1222} {"train_loss": -11.706345558166504, "global_step": 205327, "epoch": 1222} {"train_loss": -11.542484283447266, "global_step": 205328, "epoch": 1222} {"train_loss": -11.552803039550781, "global_step": 205329, "epoch": 1222} {"train_loss": -11.550908088684082, "global_step": 205330, "epoch": 1222} {"train_loss": -11.549478530883789, "global_step": 205331, "epoch": 1222} {"train_loss": -11.455303192138672, "global_step": 205332, "epoch": 1222} {"train_loss": -11.59543514251709, "global_step": 205333, "epoch": 1222} {"train_loss": -11.63822078704834, "global_step": 205334, "epoch": 1222} {"train_loss": -11.47941780090332, "global_step": 205335, "epoch": 1222} {"train_loss": -11.549979209899902, "global_step": 205336, "epoch": 1222} {"train_loss": -11.485441207885742, "global_step": 205337, "epoch": 1222} {"train_loss": -11.625907897949219, "global_step": 205338, "epoch": 1222} {"train_loss": -11.723459243774414, "global_step": 205339, "epoch": 1222} {"train_loss": -11.626860618591309, "global_step": 205340, "epoch": 1222} {"train_loss": -11.619668960571289, "global_step": 205341, "epoch": 1222} {"train_loss": -11.603668212890625, "global_step": 205342, "epoch": 1222} {"train_loss": -11.863216400146484, "global_step": 205343, "epoch": 1222} {"train_loss": -11.599369049072266, "global_step": 205344, "epoch": 1222} {"train_loss": -11.713970184326172, "global_step": 205345, "epoch": 1222} {"train_loss": -11.646910667419434, "global_step": 205346, "epoch": 1222} {"train_loss": -11.671588897705078, "global_step": 205347, "epoch": 1222} {"train_loss": -11.673213958740234, "global_step": 205348, "epoch": 1222} {"train_loss": -11.824060440063477, "global_step": 205349, "epoch": 1222} {"train_loss": -11.810372352600098, "global_step": 205350, "epoch": 1222} {"train_loss": -11.680828094482422, "global_step": 205351, "epoch": 1222} {"train_loss": -11.715185165405273, "global_step": 205352, "epoch": 1222} {"train_loss": -11.526081085205078, "global_step": 205353, "epoch": 1222} {"train_loss": -11.832590103149414, "global_step": 205354, "epoch": 1222} {"train_loss": -11.575532913208008, "global_step": 205355, "epoch": 1222} {"train_loss": -12.047737121582031, "global_step": 205356, "epoch": 1222} {"train_loss": -11.7344970703125, "global_step": 205357, "epoch": 1222} {"train_loss": -11.701986312866211, "global_step": 205358, "epoch": 1222} {"train_loss": -11.178812980651855, "global_step": 205359, "epoch": 1222} {"train_loss": -11.211008071899414, "global_step": 205360, "epoch": 1222} {"train_loss": -11.431098937988281, "global_step": 205361, "epoch": 1222} {"train_loss": -11.383964538574219, "global_step": 205362, "epoch": 1222} {"train_loss": -11.056325912475586, "global_step": 205363, "epoch": 1222} {"train_loss": -10.730857849121094, "global_step": 205364, "epoch": 1222} {"train_loss": -11.475857734680176, "global_step": 205365, "epoch": 1222} {"train_loss": -11.589000701904297, "global_step": 205366, "epoch": 1222} {"train_loss": -11.575323104858398, "global_step": 205367, "epoch": 1222} {"train_loss": -10.999093055725098, "global_step": 205368, "epoch": 1222} {"train_loss": -11.625041961669922, "global_step": 205369, "epoch": 1222} {"train_loss": -11.504960060119629, "global_step": 205370, "epoch": 1222} {"train_loss": -11.245113372802734, "global_step": 205371, "epoch": 1222} {"train_loss": -11.142282485961914, "global_step": 205372, "epoch": 1222} {"train_loss": -11.556260108947754, "global_step": 205373, "epoch": 1222} {"train_loss": -11.268388748168945, "global_step": 205374, "epoch": 1222} {"train_loss": -11.442281723022461, "global_step": 205375, "epoch": 1222} {"train_loss": -11.581226348876953, "global_step": 205376, "epoch": 1222} {"train_loss": -11.549539566040039, "global_step": 205377, "epoch": 1222} {"train_loss": -11.311614036560059, "global_step": 205378, "epoch": 1222} {"train_loss": -11.8511323928833, "global_step": 205379, "epoch": 1222} {"train_loss": -11.145923614501953, "global_step": 205380, "epoch": 1222} {"train_loss": -11.562525749206543, "global_step": 205381, "epoch": 1222} {"train_loss": -11.666058540344238, "global_step": 205382, "epoch": 1222} {"train_loss": -11.65301513671875, "global_step": 205383, "epoch": 1222} {"train_loss": -11.652498245239258, "global_step": 205384, "epoch": 1222} {"train_loss": -11.607928276062012, "global_step": 205385, "epoch": 1222} {"train_loss": -11.695030212402344, "global_step": 205386, "epoch": 1222} {"train_loss": -11.765524864196777, "global_step": 205387, "epoch": 1222} {"train_loss": -11.499397277832031, "global_step": 205388, "epoch": 1222} {"train_loss": -11.76252555847168, "global_step": 205389, "epoch": 1222} {"train_loss": -11.870646476745605, "global_step": 205390, "epoch": 1222} {"train_loss": -11.634090423583984, "global_step": 205391, "epoch": 1222} {"train_loss": -11.684576034545898, "global_step": 205392, "epoch": 1222} {"train_loss": -11.411558151245117, "global_step": 205393, "epoch": 1222} {"train_loss": -11.640559196472168, "global_step": 205394, "epoch": 1222} {"train_loss": -11.429376602172852, "global_step": 205395, "epoch": 1222} {"train_loss": -11.226882934570312, "global_step": 205396, "epoch": 1222} {"train_loss": -10.873550415039062, "global_step": 205397, "epoch": 1222} {"train_loss": -11.144414901733398, "global_step": 205398, "epoch": 1222} {"train_loss": -11.125524520874023, "global_step": 205399, "epoch": 1222} {"train_loss": -10.934349060058594, "global_step": 205400, "epoch": 1222} {"train_loss": -9.370750427246094, "global_step": 205401, "epoch": 1222} {"train_loss": -10.49593734741211, "global_step": 205402, "epoch": 1222} {"train_loss": -11.273857116699219, "global_step": 205403, "epoch": 1222} {"train_loss": -10.531346321105957, "global_step": 205404, "epoch": 1222} {"train_loss": -11.358355522155762, "global_step": 205405, "epoch": 1222} {"train_loss": -11.490741729736328, "global_step": 205406, "epoch": 1222} {"train_loss": -10.853734970092773, "global_step": 205407, "epoch": 1222} {"train_loss": -10.737278938293457, "global_step": 205408, "epoch": 1222} {"train_loss": -11.36524486541748, "global_step": 205409, "epoch": 1222} {"train_loss": -11.063785552978516, "global_step": 205410, "epoch": 1222} {"train_loss": -9.803735733032227, "global_step": 205411, "epoch": 1222} {"train_loss": -11.22459602355957, "global_step": 205412, "epoch": 1222} {"train_loss": -11.260623931884766, "global_step": 205413, "epoch": 1222} {"train_loss": -10.886770248413086, "global_step": 205414, "epoch": 1222} {"train_loss": -11.093108177185059, "global_step": 205415, "epoch": 1222} {"train_loss": -10.646522521972656, "global_step": 205416, "epoch": 1222} {"train_loss": -11.40701675415039, "global_step": 205417, "epoch": 1222} {"train_loss": -10.967894554138184, "global_step": 205418, "epoch": 1222} {"train_loss": -10.981216430664062, "global_step": 205419, "epoch": 1222} {"train_loss": -11.314199447631836, "global_step": 205420, "epoch": 1222} {"train_loss": -10.96147346496582, "global_step": 205421, "epoch": 1222} {"train_loss": -11.197542190551758, "global_step": 205422, "epoch": 1222} {"train_loss": -11.456905364990234, "global_step": 205423, "epoch": 1222} {"train_loss": -10.683841705322266, "global_step": 205424, "epoch": 1222} {"train_loss": -11.069112777709961, "global_step": 205425, "epoch": 1222} {"train_loss": -11.560322761535645, "global_step": 205426, "epoch": 1222} {"train_loss": -10.995767593383789, "global_step": 205427, "epoch": 1222} {"train_loss": -11.1712646484375, "global_step": 205428, "epoch": 1222} {"train_loss": -11.377645492553711, "global_step": 205429, "epoch": 1222} {"train_loss": -11.482671737670898, "global_step": 205430, "epoch": 1222} {"train_loss": -11.363737106323242, "global_step": 205431, "epoch": 1222} {"train_loss": -11.263514518737793, "global_step": 205432, "epoch": 1222} {"train_loss": -11.362859725952148, "global_step": 205433, "epoch": 1222} {"train_loss": -11.321786880493164, "global_step": 205434, "epoch": 1222} {"train_loss": -11.249908447265625, "global_step": 205435, "epoch": 1222} {"train_loss": -11.042150497436523, "global_step": 205436, "epoch": 1222} {"train_loss": -11.237344741821289, "global_step": 205437, "epoch": 1222} {"train_loss": -11.428123474121094, "global_step": 205438, "epoch": 1222} {"train_loss": -11.038177490234375, "global_step": 205439, "epoch": 1222} {"train_loss": -11.28921127319336, "global_step": 205440, "epoch": 1222} {"train_loss": -11.3110990524292, "global_step": 205441, "epoch": 1222} {"train_loss": -11.128695487976074, "global_step": 205442, "epoch": 1222} {"train_loss": -11.638960838317871, "global_step": 205443, "epoch": 1222} {"train_loss": -11.138923645019531, "global_step": 205444, "epoch": 1222} {"train_loss": -11.325239181518555, "global_step": 205445, "epoch": 1222} {"train_loss": -11.184713363647461, "global_step": 205446, "epoch": 1222} {"train_loss": -11.565506935119629, "global_step": 205447, "epoch": 1222} {"train_loss": -11.476594924926758, "global_step": 205448, "epoch": 1222} {"train_loss": -11.27928352355957, "global_step": 205449, "epoch": 1222} {"train_loss": -11.344520568847656, "global_step": 205450, "epoch": 1222} {"train_loss": -11.514387130737305, "global_step": 205451, "epoch": 1222} {"train_loss": -11.263341903686523, "global_step": 205452, "epoch": 1222} {"train_loss": -11.215343475341797, "global_step": 205453, "epoch": 1222} {"train_loss": -11.515271186828613, "global_step": 205454, "epoch": 1222} {"train_loss": -11.506818771362305, "global_step": 205455, "epoch": 1222} {"train_loss": -11.055647850036621, "global_step": 205456, "epoch": 1222} {"train_loss": -11.100576400756836, "global_step": 205457, "epoch": 1222} {"train_loss": -11.283001899719238, "global_step": 205458, "epoch": 1222} {"train_loss": -11.795476913452148, "global_step": 205459, "epoch": 1222} {"train_loss": -11.323898315429688, "global_step": 205460, "epoch": 1222} {"train_loss": -11.475257873535156, "global_step": 205461, "epoch": 1222} {"train_loss": -11.402742385864258, "global_step": 205462, "epoch": 1222} {"train_loss": -11.334021204993839, "global_step": 205463, "epoch": 1222, "val_loss": 254448.265625} {"train_loss": -11.580902099609375, "global_step": 205464, "epoch": 1223} {"train_loss": -11.420899391174316, "global_step": 205465, "epoch": 1223} {"train_loss": -11.542724609375, "global_step": 205466, "epoch": 1223} {"train_loss": -11.52148723602295, "global_step": 205467, "epoch": 1223} {"train_loss": -11.388175964355469, "global_step": 205468, "epoch": 1223} {"train_loss": -11.550984382629395, "global_step": 205469, "epoch": 1223} {"train_loss": -11.428047180175781, "global_step": 205470, "epoch": 1223} {"train_loss": -11.394805908203125, "global_step": 205471, "epoch": 1223} {"train_loss": -11.659252166748047, "global_step": 205472, "epoch": 1223} {"train_loss": -11.225289344787598, "global_step": 205473, "epoch": 1223} {"train_loss": -11.154315948486328, "global_step": 205474, "epoch": 1223} {"train_loss": -11.40793228149414, "global_step": 205475, "epoch": 1223} {"train_loss": -11.430089950561523, "global_step": 205476, "epoch": 1223} {"train_loss": -11.195963859558105, "global_step": 205477, "epoch": 1223} {"train_loss": -11.418210983276367, "global_step": 205478, "epoch": 1223} {"train_loss": -11.116118431091309, "global_step": 205479, "epoch": 1223} {"train_loss": -11.02429485321045, "global_step": 205480, "epoch": 1223} {"train_loss": -11.19378662109375, "global_step": 205481, "epoch": 1223} {"train_loss": -11.414722442626953, "global_step": 205482, "epoch": 1223} {"train_loss": -11.59124755859375, "global_step": 205483, "epoch": 1223} {"train_loss": -11.485794067382812, "global_step": 205484, "epoch": 1223} {"train_loss": -11.557308197021484, "global_step": 205485, "epoch": 1223} {"train_loss": -11.407158851623535, "global_step": 205486, "epoch": 1223} {"train_loss": -11.42524242401123, "global_step": 205487, "epoch": 1223} {"train_loss": -11.507390975952148, "global_step": 205488, "epoch": 1223} {"train_loss": -11.661197662353516, "global_step": 205489, "epoch": 1223} {"train_loss": -11.312911987304688, "global_step": 205490, "epoch": 1223} {"train_loss": -11.61586856842041, "global_step": 205491, "epoch": 1223} {"train_loss": -11.351387977600098, "global_step": 205492, "epoch": 1223} {"train_loss": -11.480022430419922, "global_step": 205493, "epoch": 1223} {"train_loss": -11.33319091796875, "global_step": 205494, "epoch": 1223} {"train_loss": -11.62440299987793, "global_step": 205495, "epoch": 1223} {"train_loss": -11.592597961425781, "global_step": 205496, "epoch": 1223} {"train_loss": -11.496455192565918, "global_step": 205497, "epoch": 1223} {"train_loss": -11.29488468170166, "global_step": 205498, "epoch": 1223} {"train_loss": -11.244991302490234, "global_step": 205499, "epoch": 1223} {"train_loss": -10.930217742919922, "global_step": 205500, "epoch": 1223} {"train_loss": -11.393068313598633, "global_step": 205501, "epoch": 1223} {"train_loss": -10.861396789550781, "global_step": 205502, "epoch": 1223} {"train_loss": -10.823598861694336, "global_step": 205503, "epoch": 1223} {"train_loss": -11.339761734008789, "global_step": 205504, "epoch": 1223} {"train_loss": -11.630236625671387, "global_step": 205505, "epoch": 1223} {"train_loss": -10.419410705566406, "global_step": 205506, "epoch": 1223} {"train_loss": -10.9827880859375, "global_step": 205507, "epoch": 1223} {"train_loss": -10.8382568359375, "global_step": 205508, "epoch": 1223} {"train_loss": -10.691902160644531, "global_step": 205509, "epoch": 1223} {"train_loss": -10.311574935913086, "global_step": 205510, "epoch": 1223} {"train_loss": -10.313907623291016, "global_step": 205511, "epoch": 1223} {"train_loss": -10.161064147949219, "global_step": 205512, "epoch": 1223} {"train_loss": -10.255943298339844, "global_step": 205513, "epoch": 1223} {"train_loss": -11.311023712158203, "global_step": 205514, "epoch": 1223} {"train_loss": -10.535017013549805, "global_step": 205515, "epoch": 1223} {"train_loss": -10.555097579956055, "global_step": 205516, "epoch": 1223} {"train_loss": -10.937149047851562, "global_step": 205517, "epoch": 1223} {"train_loss": -10.548482894897461, "global_step": 205518, "epoch": 1223} {"train_loss": -10.820152282714844, "global_step": 205519, "epoch": 1223} {"train_loss": -10.318451881408691, "global_step": 205520, "epoch": 1223} {"train_loss": -11.114585876464844, "global_step": 205521, "epoch": 1223} {"train_loss": -11.005345344543457, "global_step": 205522, "epoch": 1223} {"train_loss": -10.817770004272461, "global_step": 205523, "epoch": 1223} {"train_loss": -10.617999076843262, "global_step": 205524, "epoch": 1223} {"train_loss": -10.762372970581055, "global_step": 205525, "epoch": 1223} {"train_loss": -11.143777847290039, "global_step": 205526, "epoch": 1223} {"train_loss": -10.514668464660645, "global_step": 205527, "epoch": 1223} {"train_loss": -11.355188369750977, "global_step": 205528, "epoch": 1223} {"train_loss": -10.204090118408203, "global_step": 205529, "epoch": 1223} {"train_loss": -11.409385681152344, "global_step": 205530, "epoch": 1223} {"train_loss": -10.779862403869629, "global_step": 205531, "epoch": 1223} {"train_loss": -11.07131290435791, "global_step": 205532, "epoch": 1223} {"train_loss": -10.674675941467285, "global_step": 205533, "epoch": 1223} {"train_loss": -11.038320541381836, "global_step": 205534, "epoch": 1223} {"train_loss": -10.83619213104248, "global_step": 205535, "epoch": 1223} {"train_loss": -11.364561080932617, "global_step": 205536, "epoch": 1223} {"train_loss": -10.71493148803711, "global_step": 205537, "epoch": 1223} {"train_loss": -11.386917114257812, "global_step": 205538, "epoch": 1223} {"train_loss": -11.08596420288086, "global_step": 205539, "epoch": 1223} {"train_loss": -11.321191787719727, "global_step": 205540, "epoch": 1223} {"train_loss": -11.412555694580078, "global_step": 205541, "epoch": 1223} {"train_loss": -11.48769760131836, "global_step": 205542, "epoch": 1223} {"train_loss": -11.349842071533203, "global_step": 205543, "epoch": 1223} {"train_loss": -11.384748458862305, "global_step": 205544, "epoch": 1223} {"train_loss": -11.51278305053711, "global_step": 205545, "epoch": 1223} {"train_loss": -11.328653335571289, "global_step": 205546, "epoch": 1223} {"train_loss": -11.366374969482422, "global_step": 205547, "epoch": 1223} {"train_loss": -11.454326629638672, "global_step": 205548, "epoch": 1223} {"train_loss": -11.525947570800781, "global_step": 205549, "epoch": 1223} {"train_loss": -11.497445106506348, "global_step": 205550, "epoch": 1223} {"train_loss": -11.510790824890137, "global_step": 205551, "epoch": 1223} {"train_loss": -11.343893051147461, "global_step": 205552, "epoch": 1223} {"train_loss": -11.604571342468262, "global_step": 205553, "epoch": 1223} {"train_loss": -11.555863380432129, "global_step": 205554, "epoch": 1223} {"train_loss": -11.54941463470459, "global_step": 205555, "epoch": 1223} {"train_loss": -11.5260591506958, "global_step": 205556, "epoch": 1223} {"train_loss": -11.540022850036621, "global_step": 205557, "epoch": 1223} {"train_loss": -11.663649559020996, "global_step": 205558, "epoch": 1223} {"train_loss": -11.692451477050781, "global_step": 205559, "epoch": 1223} {"train_loss": -11.770193099975586, "global_step": 205560, "epoch": 1223} {"train_loss": -11.796932220458984, "global_step": 205561, "epoch": 1223} {"train_loss": -11.732706069946289, "global_step": 205562, "epoch": 1223} {"train_loss": -11.841409683227539, "global_step": 205563, "epoch": 1223} {"train_loss": -11.63416862487793, "global_step": 205564, "epoch": 1223} {"train_loss": -11.872901916503906, "global_step": 205565, "epoch": 1223} {"train_loss": -11.685474395751953, "global_step": 205566, "epoch": 1223} {"train_loss": -11.643865585327148, "global_step": 205567, "epoch": 1223} {"train_loss": -11.851114273071289, "global_step": 205568, "epoch": 1223} {"train_loss": -11.707620620727539, "global_step": 205569, "epoch": 1223} {"train_loss": -11.683244705200195, "global_step": 205570, "epoch": 1223} {"train_loss": -11.5047025680542, "global_step": 205571, "epoch": 1223} {"train_loss": -11.714030265808105, "global_step": 205572, "epoch": 1223} {"train_loss": -11.91429328918457, "global_step": 205573, "epoch": 1223} {"train_loss": -11.848963737487793, "global_step": 205574, "epoch": 1223} {"train_loss": -11.81546688079834, "global_step": 205575, "epoch": 1223} {"train_loss": -11.813948631286621, "global_step": 205576, "epoch": 1223} {"train_loss": -11.714138984680176, "global_step": 205577, "epoch": 1223} {"train_loss": -11.791607856750488, "global_step": 205578, "epoch": 1223} {"train_loss": -11.8411865234375, "global_step": 205579, "epoch": 1223} {"train_loss": -11.673089981079102, "global_step": 205580, "epoch": 1223} {"train_loss": -11.653905868530273, "global_step": 205581, "epoch": 1223} {"train_loss": -11.57897663116455, "global_step": 205582, "epoch": 1223} {"train_loss": -11.875557899475098, "global_step": 205583, "epoch": 1223} {"train_loss": -11.817447662353516, "global_step": 205584, "epoch": 1223} {"train_loss": -11.649250030517578, "global_step": 205585, "epoch": 1223} {"train_loss": -11.803913116455078, "global_step": 205586, "epoch": 1223} {"train_loss": -11.272018432617188, "global_step": 205587, "epoch": 1223} {"train_loss": -11.68798828125, "global_step": 205588, "epoch": 1223} {"train_loss": -11.744379043579102, "global_step": 205589, "epoch": 1223} {"train_loss": -11.569385528564453, "global_step": 205590, "epoch": 1223} {"train_loss": -11.276097297668457, "global_step": 205591, "epoch": 1223} {"train_loss": -11.597410202026367, "global_step": 205592, "epoch": 1223} {"train_loss": -11.731192588806152, "global_step": 205593, "epoch": 1223} {"train_loss": -11.380462646484375, "global_step": 205594, "epoch": 1223} {"train_loss": -11.312583923339844, "global_step": 205595, "epoch": 1223} {"train_loss": -11.594852447509766, "global_step": 205596, "epoch": 1223} {"train_loss": -11.439411163330078, "global_step": 205597, "epoch": 1223} {"train_loss": -11.477989196777344, "global_step": 205598, "epoch": 1223} {"train_loss": -11.667672157287598, "global_step": 205599, "epoch": 1223} {"train_loss": -11.480452537536621, "global_step": 205600, "epoch": 1223} {"train_loss": -11.406509399414062, "global_step": 205601, "epoch": 1223} {"train_loss": -11.576129913330078, "global_step": 205602, "epoch": 1223} {"train_loss": -11.523128509521484, "global_step": 205603, "epoch": 1223} {"train_loss": -11.75497817993164, "global_step": 205604, "epoch": 1223} {"train_loss": -11.41398811340332, "global_step": 205605, "epoch": 1223} {"train_loss": -11.840005874633789, "global_step": 205606, "epoch": 1223} {"train_loss": -11.2804536819458, "global_step": 205607, "epoch": 1223} {"train_loss": -11.679582595825195, "global_step": 205608, "epoch": 1223} {"train_loss": -11.463668823242188, "global_step": 205609, "epoch": 1223} {"train_loss": -11.602154731750488, "global_step": 205610, "epoch": 1223} {"train_loss": -11.377799987792969, "global_step": 205611, "epoch": 1223} {"train_loss": -10.928361892700195, "global_step": 205612, "epoch": 1223} {"train_loss": -10.786102294921875, "global_step": 205613, "epoch": 1223} {"train_loss": -11.411510467529297, "global_step": 205614, "epoch": 1223} {"train_loss": -11.596004486083984, "global_step": 205615, "epoch": 1223} {"train_loss": -10.40765380859375, "global_step": 205616, "epoch": 1223} {"train_loss": -10.691786766052246, "global_step": 205617, "epoch": 1223} {"train_loss": -11.528444290161133, "global_step": 205618, "epoch": 1223} {"train_loss": -11.047262191772461, "global_step": 205619, "epoch": 1223} {"train_loss": -11.087265968322754, "global_step": 205620, "epoch": 1223} {"train_loss": -10.767940521240234, "global_step": 205621, "epoch": 1223} {"train_loss": -11.18772029876709, "global_step": 205622, "epoch": 1223} {"train_loss": -10.36096477508545, "global_step": 205623, "epoch": 1223} {"train_loss": -11.607648849487305, "global_step": 205624, "epoch": 1223} {"train_loss": -10.627449989318848, "global_step": 205625, "epoch": 1223} {"train_loss": -10.738832473754883, "global_step": 205626, "epoch": 1223} {"train_loss": -11.315802574157715, "global_step": 205627, "epoch": 1223} {"train_loss": -11.017731666564941, "global_step": 205628, "epoch": 1223} {"train_loss": -11.477246284484863, "global_step": 205629, "epoch": 1223} {"train_loss": -11.089117050170898, "global_step": 205630, "epoch": 1223} {"train_loss": -11.315839466594515, "global_step": 205631, "epoch": 1223, "val_loss": 253723.40625} {"train_loss": -11.379837036132812, "global_step": 205632, "epoch": 1224} {"train_loss": -10.960391998291016, "global_step": 205633, "epoch": 1224} {"train_loss": -10.971315383911133, "global_step": 205634, "epoch": 1224} {"train_loss": -11.093185424804688, "global_step": 205635, "epoch": 1224} {"train_loss": -11.714372634887695, "global_step": 205636, "epoch": 1224} {"train_loss": -11.218900680541992, "global_step": 205637, "epoch": 1224} {"train_loss": -11.441475868225098, "global_step": 205638, "epoch": 1224} {"train_loss": -11.742274284362793, "global_step": 205639, "epoch": 1224} {"train_loss": -10.744918823242188, "global_step": 205640, "epoch": 1224} {"train_loss": -11.415346145629883, "global_step": 205641, "epoch": 1224} {"train_loss": -10.858945846557617, "global_step": 205642, "epoch": 1224} {"train_loss": -11.47269058227539, "global_step": 205643, "epoch": 1224} {"train_loss": -10.818693161010742, "global_step": 205644, "epoch": 1224} {"train_loss": -11.040517807006836, "global_step": 205645, "epoch": 1224} {"train_loss": -10.292303085327148, "global_step": 205646, "epoch": 1224} {"train_loss": -11.270881652832031, "global_step": 205647, "epoch": 1224} {"train_loss": -11.253240585327148, "global_step": 205648, "epoch": 1224} {"train_loss": -11.450885772705078, "global_step": 205649, "epoch": 1224} {"train_loss": -11.179718017578125, "global_step": 205650, "epoch": 1224} {"train_loss": -11.364408493041992, "global_step": 205651, "epoch": 1224} {"train_loss": -11.03541374206543, "global_step": 205652, "epoch": 1224} {"train_loss": -10.996393203735352, "global_step": 205653, "epoch": 1224} {"train_loss": -10.729092597961426, "global_step": 205654, "epoch": 1224} {"train_loss": -11.22724723815918, "global_step": 205655, "epoch": 1224} {"train_loss": -10.937365531921387, "global_step": 205656, "epoch": 1224} {"train_loss": -10.804204940795898, "global_step": 205657, "epoch": 1224} {"train_loss": -11.275638580322266, "global_step": 205658, "epoch": 1224} {"train_loss": -9.8947114944458, "global_step": 205659, "epoch": 1224} {"train_loss": -11.231523513793945, "global_step": 205660, "epoch": 1224} {"train_loss": -10.415989875793457, "global_step": 205661, "epoch": 1224} {"train_loss": -9.733245849609375, "global_step": 205662, "epoch": 1224} {"train_loss": -11.040130615234375, "global_step": 205663, "epoch": 1224} {"train_loss": -9.55734634399414, "global_step": 205664, "epoch": 1224} {"train_loss": -10.05230712890625, "global_step": 205665, "epoch": 1224} {"train_loss": -9.919489860534668, "global_step": 205666, "epoch": 1224} {"train_loss": -9.642534255981445, "global_step": 205667, "epoch": 1224} {"train_loss": -9.170236587524414, "global_step": 205668, "epoch": 1224} {"train_loss": -8.762084007263184, "global_step": 205669, "epoch": 1224} {"train_loss": -9.54326343536377, "global_step": 205670, "epoch": 1224} {"train_loss": -10.768964767456055, "global_step": 205671, "epoch": 1224} {"train_loss": -8.830278396606445, "global_step": 205672, "epoch": 1224} {"train_loss": -9.750865936279297, "global_step": 205673, "epoch": 1224} {"train_loss": -10.110363006591797, "global_step": 205674, "epoch": 1224} {"train_loss": -9.750039100646973, "global_step": 205675, "epoch": 1224} {"train_loss": -9.958159446716309, "global_step": 205676, "epoch": 1224} {"train_loss": -10.840782165527344, "global_step": 205677, "epoch": 1224} {"train_loss": -10.396658897399902, "global_step": 205678, "epoch": 1224} {"train_loss": -10.751825332641602, "global_step": 205679, "epoch": 1224} {"train_loss": -11.090079307556152, "global_step": 205680, "epoch": 1224} {"train_loss": -10.427860260009766, "global_step": 205681, "epoch": 1224} {"train_loss": -10.718924522399902, "global_step": 205682, "epoch": 1224} {"train_loss": -11.01107406616211, "global_step": 205683, "epoch": 1224} {"train_loss": -10.95743465423584, "global_step": 205684, "epoch": 1224} {"train_loss": -11.01911735534668, "global_step": 205685, "epoch": 1224} {"train_loss": -11.130154609680176, "global_step": 205686, "epoch": 1224} {"train_loss": -11.194648742675781, "global_step": 205687, "epoch": 1224} {"train_loss": -10.964824676513672, "global_step": 205688, "epoch": 1224} {"train_loss": -11.23971939086914, "global_step": 205689, "epoch": 1224} {"train_loss": -11.24142837524414, "global_step": 205690, "epoch": 1224} {"train_loss": -11.270126342773438, "global_step": 205691, "epoch": 1224} {"train_loss": -11.279548645019531, "global_step": 205692, "epoch": 1224} {"train_loss": -11.372856140136719, "global_step": 205693, "epoch": 1224} {"train_loss": -11.454156875610352, "global_step": 205694, "epoch": 1224} {"train_loss": -11.433807373046875, "global_step": 205695, "epoch": 1224} {"train_loss": -11.352048873901367, "global_step": 205696, "epoch": 1224} {"train_loss": -11.194324493408203, "global_step": 205697, "epoch": 1224} {"train_loss": -11.419733047485352, "global_step": 205698, "epoch": 1224} {"train_loss": -11.395076751708984, "global_step": 205699, "epoch": 1224} {"train_loss": -11.739542961120605, "global_step": 205700, "epoch": 1224} {"train_loss": -11.469858169555664, "global_step": 205701, "epoch": 1224} {"train_loss": -11.595115661621094, "global_step": 205702, "epoch": 1224} {"train_loss": -11.548429489135742, "global_step": 205703, "epoch": 1224} {"train_loss": -11.465448379516602, "global_step": 205704, "epoch": 1224} {"train_loss": -11.591205596923828, "global_step": 205705, "epoch": 1224} {"train_loss": -11.635509490966797, "global_step": 205706, "epoch": 1224} {"train_loss": -11.583280563354492, "global_step": 205707, "epoch": 1224} {"train_loss": -11.443904876708984, "global_step": 205708, "epoch": 1224} {"train_loss": -11.422901153564453, "global_step": 205709, "epoch": 1224} {"train_loss": -11.445319175720215, "global_step": 205710, "epoch": 1224} {"train_loss": -11.575974464416504, "global_step": 205711, "epoch": 1224} {"train_loss": -11.640058517456055, "global_step": 205712, "epoch": 1224} {"train_loss": -11.527555465698242, "global_step": 205713, "epoch": 1224} {"train_loss": -11.717462539672852, "global_step": 205714, "epoch": 1224} {"train_loss": -11.48482608795166, "global_step": 205715, "epoch": 1224} {"train_loss": -11.679059982299805, "global_step": 205716, "epoch": 1224} {"train_loss": -11.347068786621094, "global_step": 205717, "epoch": 1224} {"train_loss": -11.840798377990723, "global_step": 205718, "epoch": 1224} {"train_loss": -11.568717002868652, "global_step": 205719, "epoch": 1224} {"train_loss": -11.787148475646973, "global_step": 205720, "epoch": 1224} {"train_loss": -11.63311767578125, "global_step": 205721, "epoch": 1224} {"train_loss": -11.750032424926758, "global_step": 205722, "epoch": 1224} {"train_loss": -11.831073760986328, "global_step": 205723, "epoch": 1224} {"train_loss": -11.651083946228027, "global_step": 205724, "epoch": 1224} {"train_loss": -11.66312313079834, "global_step": 205725, "epoch": 1224} {"train_loss": -11.625578880310059, "global_step": 205726, "epoch": 1224} {"train_loss": -11.682844161987305, "global_step": 205727, "epoch": 1224} {"train_loss": -11.737491607666016, "global_step": 205728, "epoch": 1224} {"train_loss": -11.726456642150879, "global_step": 205729, "epoch": 1224} {"train_loss": -11.860692977905273, "global_step": 205730, "epoch": 1224} {"train_loss": -11.854857444763184, "global_step": 205731, "epoch": 1224} {"train_loss": -11.819936752319336, "global_step": 205732, "epoch": 1224} {"train_loss": -11.953497886657715, "global_step": 205733, "epoch": 1224} {"train_loss": -11.66811752319336, "global_step": 205734, "epoch": 1224} {"train_loss": -11.857612609863281, "global_step": 205735, "epoch": 1224} {"train_loss": -12.020302772521973, "global_step": 205736, "epoch": 1224} {"train_loss": -11.70765209197998, "global_step": 205737, "epoch": 1224} {"train_loss": -11.680314064025879, "global_step": 205738, "epoch": 1224} {"train_loss": -11.489459991455078, "global_step": 205739, "epoch": 1224} {"train_loss": -11.658186912536621, "global_step": 205740, "epoch": 1224} {"train_loss": -11.788740158081055, "global_step": 205741, "epoch": 1224} {"train_loss": -11.30122184753418, "global_step": 205742, "epoch": 1224} {"train_loss": -11.399553298950195, "global_step": 205743, "epoch": 1224} {"train_loss": -11.476734161376953, "global_step": 205744, "epoch": 1224} {"train_loss": -11.680716514587402, "global_step": 205745, "epoch": 1224} {"train_loss": -11.528459548950195, "global_step": 205746, "epoch": 1224} {"train_loss": -11.454504013061523, "global_step": 205747, "epoch": 1224} {"train_loss": -11.825614929199219, "global_step": 205748, "epoch": 1224} {"train_loss": -11.495941162109375, "global_step": 205749, "epoch": 1224} {"train_loss": -11.28652572631836, "global_step": 205750, "epoch": 1224} {"train_loss": -11.452022552490234, "global_step": 205751, "epoch": 1224} {"train_loss": -11.440875053405762, "global_step": 205752, "epoch": 1224} {"train_loss": -11.504770278930664, "global_step": 205753, "epoch": 1224} {"train_loss": -11.662286758422852, "global_step": 205754, "epoch": 1224} {"train_loss": -11.487890243530273, "global_step": 205755, "epoch": 1224} {"train_loss": -11.587491989135742, "global_step": 205756, "epoch": 1224} {"train_loss": -11.123567581176758, "global_step": 205757, "epoch": 1224} {"train_loss": -10.726011276245117, "global_step": 205758, "epoch": 1224} {"train_loss": -9.939584732055664, "global_step": 205759, "epoch": 1224} {"train_loss": -10.026897430419922, "global_step": 205760, "epoch": 1224} {"train_loss": -7.336045265197754, "global_step": 205761, "epoch": 1224} {"train_loss": -7.859932899475098, "global_step": 205762, "epoch": 1224} {"train_loss": -7.315402030944824, "global_step": 205763, "epoch": 1224} {"train_loss": -7.1001362800598145, "global_step": 205764, "epoch": 1224} {"train_loss": -8.548684120178223, "global_step": 205765, "epoch": 1224} {"train_loss": -9.19485855102539, "global_step": 205766, "epoch": 1224} {"train_loss": -8.865413665771484, "global_step": 205767, "epoch": 1224} {"train_loss": -8.820866584777832, "global_step": 205768, "epoch": 1224} {"train_loss": -8.610739707946777, "global_step": 205769, "epoch": 1224} {"train_loss": -10.342680931091309, "global_step": 205770, "epoch": 1224} {"train_loss": -9.054481506347656, "global_step": 205771, "epoch": 1224} {"train_loss": -10.517512321472168, "global_step": 205772, "epoch": 1224} {"train_loss": -9.328653335571289, "global_step": 205773, "epoch": 1224} {"train_loss": -10.587223052978516, "global_step": 205774, "epoch": 1224} {"train_loss": -9.204885482788086, "global_step": 205775, "epoch": 1224} {"train_loss": -10.280518531799316, "global_step": 205776, "epoch": 1224} {"train_loss": -10.019365310668945, "global_step": 205777, "epoch": 1224} {"train_loss": -10.75043773651123, "global_step": 205778, "epoch": 1224} {"train_loss": -10.393604278564453, "global_step": 205779, "epoch": 1224} {"train_loss": -10.517565727233887, "global_step": 205780, "epoch": 1224} {"train_loss": -10.436456680297852, "global_step": 205781, "epoch": 1224} {"train_loss": -11.001407623291016, "global_step": 205782, "epoch": 1224} {"train_loss": -10.980562210083008, "global_step": 205783, "epoch": 1224} {"train_loss": -10.675889015197754, "global_step": 205784, "epoch": 1224} {"train_loss": -10.622084617614746, "global_step": 205785, "epoch": 1224} {"train_loss": -10.747265815734863, "global_step": 205786, "epoch": 1224} {"train_loss": -11.07807731628418, "global_step": 205787, "epoch": 1224} {"train_loss": -10.947720527648926, "global_step": 205788, "epoch": 1224} {"train_loss": -11.135345458984375, "global_step": 205789, "epoch": 1224} {"train_loss": -11.125350952148438, "global_step": 205790, "epoch": 1224} {"train_loss": -10.974740028381348, "global_step": 205791, "epoch": 1224} {"train_loss": -11.214912414550781, "global_step": 205792, "epoch": 1224} {"train_loss": -11.077744483947754, "global_step": 205793, "epoch": 1224} {"train_loss": -11.060924530029297, "global_step": 205794, "epoch": 1224} {"train_loss": -11.18632984161377, "global_step": 205795, "epoch": 1224} {"train_loss": -11.304216384887695, "global_step": 205796, "epoch": 1224} {"train_loss": -11.033390998840332, "global_step": 205797, "epoch": 1224} {"train_loss": -11.071250915527344, "global_step": 205798, "epoch": 1224} {"train_loss": -10.901971570083074, "global_step": 205799, "epoch": 1224, "val_loss": 242968.609375} {"train_loss": -11.203351974487305, "global_step": 205800, "epoch": 1225} {"train_loss": -11.325429916381836, "global_step": 205801, "epoch": 1225} {"train_loss": -11.415550231933594, "global_step": 205802, "epoch": 1225} {"train_loss": -11.129950523376465, "global_step": 205803, "epoch": 1225} {"train_loss": -11.118114471435547, "global_step": 205804, "epoch": 1225} {"train_loss": -11.450847625732422, "global_step": 205805, "epoch": 1225} {"train_loss": -11.240735054016113, "global_step": 205806, "epoch": 1225} {"train_loss": -11.49424934387207, "global_step": 205807, "epoch": 1225} {"train_loss": -11.182737350463867, "global_step": 205808, "epoch": 1225} {"train_loss": -11.359098434448242, "global_step": 205809, "epoch": 1225} {"train_loss": -11.04681396484375, "global_step": 205810, "epoch": 1225} {"train_loss": -11.33243179321289, "global_step": 205811, "epoch": 1225} {"train_loss": -11.385927200317383, "global_step": 205812, "epoch": 1225} {"train_loss": -11.25139045715332, "global_step": 205813, "epoch": 1225} {"train_loss": -11.522716522216797, "global_step": 205814, "epoch": 1225} {"train_loss": -11.15147876739502, "global_step": 205815, "epoch": 1225} {"train_loss": -11.694875717163086, "global_step": 205816, "epoch": 1225} {"train_loss": -11.334476470947266, "global_step": 205817, "epoch": 1225} {"train_loss": -11.519156455993652, "global_step": 205818, "epoch": 1225} {"train_loss": -11.402535438537598, "global_step": 205819, "epoch": 1225} {"train_loss": -11.466928482055664, "global_step": 205820, "epoch": 1225} {"train_loss": -11.378216743469238, "global_step": 205821, "epoch": 1225} {"train_loss": -11.700642585754395, "global_step": 205822, "epoch": 1225} {"train_loss": -11.280287742614746, "global_step": 205823, "epoch": 1225} {"train_loss": -11.43661880493164, "global_step": 205824, "epoch": 1225} {"train_loss": -11.377875328063965, "global_step": 205825, "epoch": 1225} {"train_loss": -11.685734748840332, "global_step": 205826, "epoch": 1225} {"train_loss": -11.362420082092285, "global_step": 205827, "epoch": 1225} {"train_loss": -11.55366325378418, "global_step": 205828, "epoch": 1225} {"train_loss": -11.269327163696289, "global_step": 205829, "epoch": 1225} {"train_loss": -11.246245384216309, "global_step": 205830, "epoch": 1225} {"train_loss": -11.630777359008789, "global_step": 205831, "epoch": 1225} {"train_loss": -10.578277587890625, "global_step": 205832, "epoch": 1225} {"train_loss": -11.559874534606934, "global_step": 205833, "epoch": 1225} {"train_loss": -10.700069427490234, "global_step": 205834, "epoch": 1225} {"train_loss": -11.367259979248047, "global_step": 205835, "epoch": 1225} {"train_loss": -10.853652954101562, "global_step": 205836, "epoch": 1225} {"train_loss": -10.541126251220703, "global_step": 205837, "epoch": 1225} {"train_loss": -11.152629852294922, "global_step": 205838, "epoch": 1225} {"train_loss": -11.079190254211426, "global_step": 205839, "epoch": 1225} {"train_loss": -11.168351173400879, "global_step": 205840, "epoch": 1225} {"train_loss": -11.015769958496094, "global_step": 205841, "epoch": 1225} {"train_loss": -11.15626335144043, "global_step": 205842, "epoch": 1225} {"train_loss": -11.684748649597168, "global_step": 205843, "epoch": 1225} {"train_loss": -11.079190254211426, "global_step": 205844, "epoch": 1225} {"train_loss": -11.428033828735352, "global_step": 205845, "epoch": 1225} {"train_loss": -11.32175064086914, "global_step": 205846, "epoch": 1225} {"train_loss": -11.175127983093262, "global_step": 205847, "epoch": 1225} {"train_loss": -11.302094459533691, "global_step": 205848, "epoch": 1225} {"train_loss": -11.484268188476562, "global_step": 205849, "epoch": 1225} {"train_loss": -11.371237754821777, "global_step": 205850, "epoch": 1225} {"train_loss": -11.506217002868652, "global_step": 205851, "epoch": 1225} {"train_loss": -11.125434875488281, "global_step": 205852, "epoch": 1225} {"train_loss": -10.946322441101074, "global_step": 205853, "epoch": 1225} {"train_loss": -11.613052368164062, "global_step": 205854, "epoch": 1225} {"train_loss": -11.069068908691406, "global_step": 205855, "epoch": 1225} {"train_loss": -11.518861770629883, "global_step": 205856, "epoch": 1225} {"train_loss": -10.837571144104004, "global_step": 205857, "epoch": 1225} {"train_loss": -11.180767059326172, "global_step": 205858, "epoch": 1225} {"train_loss": -10.749431610107422, "global_step": 205859, "epoch": 1225} {"train_loss": -11.386554718017578, "global_step": 205860, "epoch": 1225} {"train_loss": -11.416049003601074, "global_step": 205861, "epoch": 1225} {"train_loss": -11.226967811584473, "global_step": 205862, "epoch": 1225} {"train_loss": -11.269129753112793, "global_step": 205863, "epoch": 1225} {"train_loss": -11.272686004638672, "global_step": 205864, "epoch": 1225} {"train_loss": -11.411678314208984, "global_step": 205865, "epoch": 1225} {"train_loss": -11.169269561767578, "global_step": 205866, "epoch": 1225} {"train_loss": -11.646781921386719, "global_step": 205867, "epoch": 1225} {"train_loss": -11.283931732177734, "global_step": 205868, "epoch": 1225} {"train_loss": -11.204105377197266, "global_step": 205869, "epoch": 1225} {"train_loss": -11.302270889282227, "global_step": 205870, "epoch": 1225} {"train_loss": -11.404426574707031, "global_step": 205871, "epoch": 1225} {"train_loss": -11.170848846435547, "global_step": 205872, "epoch": 1225} {"train_loss": -11.026567459106445, "global_step": 205873, "epoch": 1225} {"train_loss": -11.014904975891113, "global_step": 205874, "epoch": 1225} {"train_loss": -10.734182357788086, "global_step": 205875, "epoch": 1225} {"train_loss": -10.7329683303833, "global_step": 205876, "epoch": 1225} {"train_loss": -11.058704376220703, "global_step": 205877, "epoch": 1225} {"train_loss": -10.496766090393066, "global_step": 205878, "epoch": 1225} {"train_loss": -11.548298835754395, "global_step": 205879, "epoch": 1225} {"train_loss": -10.79801082611084, "global_step": 205880, "epoch": 1225} {"train_loss": -11.219771385192871, "global_step": 205881, "epoch": 1225} {"train_loss": -11.314689636230469, "global_step": 205882, "epoch": 1225} {"train_loss": -10.961438179016113, "global_step": 205883, "epoch": 1225} {"train_loss": -11.406742095947266, "global_step": 205884, "epoch": 1225} {"train_loss": -11.059741020202637, "global_step": 205885, "epoch": 1225} {"train_loss": -10.927611351013184, "global_step": 205886, "epoch": 1225} {"train_loss": -11.47093391418457, "global_step": 205887, "epoch": 1225} {"train_loss": -11.128792762756348, "global_step": 205888, "epoch": 1225} {"train_loss": -11.093778610229492, "global_step": 205889, "epoch": 1225} {"train_loss": -11.554946899414062, "global_step": 205890, "epoch": 1225} {"train_loss": -11.459989547729492, "global_step": 205891, "epoch": 1225} {"train_loss": -11.475659370422363, "global_step": 205892, "epoch": 1225} {"train_loss": -11.648128509521484, "global_step": 205893, "epoch": 1225} {"train_loss": -11.155657768249512, "global_step": 205894, "epoch": 1225} {"train_loss": -11.658114433288574, "global_step": 205895, "epoch": 1225} {"train_loss": -11.191977500915527, "global_step": 205896, "epoch": 1225} {"train_loss": -11.315378189086914, "global_step": 205897, "epoch": 1225} {"train_loss": -11.298460006713867, "global_step": 205898, "epoch": 1225} {"train_loss": -11.214752197265625, "global_step": 205899, "epoch": 1225} {"train_loss": -11.512185096740723, "global_step": 205900, "epoch": 1225} {"train_loss": -11.388362884521484, "global_step": 205901, "epoch": 1225} {"train_loss": -11.456080436706543, "global_step": 205902, "epoch": 1225} {"train_loss": -11.58297348022461, "global_step": 205903, "epoch": 1225} {"train_loss": -11.575048446655273, "global_step": 205904, "epoch": 1225} {"train_loss": -11.579416275024414, "global_step": 205905, "epoch": 1225} {"train_loss": -11.50063705444336, "global_step": 205906, "epoch": 1225} {"train_loss": -11.709918975830078, "global_step": 205907, "epoch": 1225} {"train_loss": -11.249452590942383, "global_step": 205908, "epoch": 1225} {"train_loss": -11.641922950744629, "global_step": 205909, "epoch": 1225} {"train_loss": -11.264389991760254, "global_step": 205910, "epoch": 1225} {"train_loss": -11.52981185913086, "global_step": 205911, "epoch": 1225} {"train_loss": -11.56749153137207, "global_step": 205912, "epoch": 1225} {"train_loss": -11.189985275268555, "global_step": 205913, "epoch": 1225} {"train_loss": -11.177103042602539, "global_step": 205914, "epoch": 1225} {"train_loss": -11.319609642028809, "global_step": 205915, "epoch": 1225} {"train_loss": -11.182424545288086, "global_step": 205916, "epoch": 1225} {"train_loss": -11.706302642822266, "global_step": 205917, "epoch": 1225} {"train_loss": -11.488142967224121, "global_step": 205918, "epoch": 1225} {"train_loss": -11.572433471679688, "global_step": 205919, "epoch": 1225} {"train_loss": -11.797906875610352, "global_step": 205920, "epoch": 1225} {"train_loss": -11.57508659362793, "global_step": 205921, "epoch": 1225} {"train_loss": -11.66794204711914, "global_step": 205922, "epoch": 1225} {"train_loss": -11.385010719299316, "global_step": 205923, "epoch": 1225} {"train_loss": -10.741519927978516, "global_step": 205924, "epoch": 1225} {"train_loss": -11.215988159179688, "global_step": 205925, "epoch": 1225} {"train_loss": -11.38216781616211, "global_step": 205926, "epoch": 1225} {"train_loss": -11.085318565368652, "global_step": 205927, "epoch": 1225} {"train_loss": -11.246644020080566, "global_step": 205928, "epoch": 1225} {"train_loss": -11.504964828491211, "global_step": 205929, "epoch": 1225} {"train_loss": -11.274103164672852, "global_step": 205930, "epoch": 1225} {"train_loss": -11.812226295471191, "global_step": 205931, "epoch": 1225} {"train_loss": -11.272509574890137, "global_step": 205932, "epoch": 1225} {"train_loss": -11.560290336608887, "global_step": 205933, "epoch": 1225} {"train_loss": -11.470592498779297, "global_step": 205934, "epoch": 1225} {"train_loss": -11.261364936828613, "global_step": 205935, "epoch": 1225} {"train_loss": -11.732370376586914, "global_step": 205936, "epoch": 1225} {"train_loss": -11.666385650634766, "global_step": 205937, "epoch": 1225} {"train_loss": -11.148286819458008, "global_step": 205938, "epoch": 1225} {"train_loss": -11.273811340332031, "global_step": 205939, "epoch": 1225} {"train_loss": -11.81604290008545, "global_step": 205940, "epoch": 1225} {"train_loss": -11.172500610351562, "global_step": 205941, "epoch": 1225} {"train_loss": -11.60525894165039, "global_step": 205942, "epoch": 1225} {"train_loss": -11.843616485595703, "global_step": 205943, "epoch": 1225} {"train_loss": -11.44307804107666, "global_step": 205944, "epoch": 1225} {"train_loss": -11.635710716247559, "global_step": 205945, "epoch": 1225} {"train_loss": -11.583361625671387, "global_step": 205946, "epoch": 1225} {"train_loss": -11.677080154418945, "global_step": 205947, "epoch": 1225} {"train_loss": -11.699407577514648, "global_step": 205948, "epoch": 1225} {"train_loss": -11.505017280578613, "global_step": 205949, "epoch": 1225} {"train_loss": -11.581491470336914, "global_step": 205950, "epoch": 1225} {"train_loss": -11.596458435058594, "global_step": 205951, "epoch": 1225} {"train_loss": -11.465963363647461, "global_step": 205952, "epoch": 1225} {"train_loss": -11.578836441040039, "global_step": 205953, "epoch": 1225} {"train_loss": -11.387479782104492, "global_step": 205954, "epoch": 1225} {"train_loss": -11.410173416137695, "global_step": 205955, "epoch": 1225} {"train_loss": -11.598428726196289, "global_step": 205956, "epoch": 1225} {"train_loss": -11.735780715942383, "global_step": 205957, "epoch": 1225} {"train_loss": -11.649662017822266, "global_step": 205958, "epoch": 1225} {"train_loss": -11.475793838500977, "global_step": 205959, "epoch": 1225} {"train_loss": -11.579583168029785, "global_step": 205960, "epoch": 1225} {"train_loss": -11.504731178283691, "global_step": 205961, "epoch": 1225} {"train_loss": -11.531139373779297, "global_step": 205962, "epoch": 1225} {"train_loss": -11.288639068603516, "global_step": 205963, "epoch": 1225} {"train_loss": -11.252052307128906, "global_step": 205964, "epoch": 1225} {"train_loss": -11.734073638916016, "global_step": 205965, "epoch": 1225} {"train_loss": -11.157567977905273, "global_step": 205966, "epoch": 1225} {"train_loss": -11.346937145505633, "global_step": 205967, "epoch": 1225, "val_loss": 248166.859375, "train_action_mse_error": 1.99882173538208} {"train_loss": -11.28637981414795, "global_step": 205968, "epoch": 1226} {"train_loss": -11.37259292602539, "global_step": 205969, "epoch": 1226} {"train_loss": -11.652182579040527, "global_step": 205970, "epoch": 1226} {"train_loss": -11.674695014953613, "global_step": 205971, "epoch": 1226} {"train_loss": -11.434054374694824, "global_step": 205972, "epoch": 1226} {"train_loss": -11.148307800292969, "global_step": 205973, "epoch": 1226} {"train_loss": -11.42724323272705, "global_step": 205974, "epoch": 1226} {"train_loss": -11.559650421142578, "global_step": 205975, "epoch": 1226} {"train_loss": -11.516886711120605, "global_step": 205976, "epoch": 1226} {"train_loss": -10.883685111999512, "global_step": 205977, "epoch": 1226} {"train_loss": -11.618788719177246, "global_step": 205978, "epoch": 1226} {"train_loss": -11.30579662322998, "global_step": 205979, "epoch": 1226} {"train_loss": -10.12670612335205, "global_step": 205980, "epoch": 1226} {"train_loss": -11.015851974487305, "global_step": 205981, "epoch": 1226} {"train_loss": -10.606718063354492, "global_step": 205982, "epoch": 1226} {"train_loss": -11.394804000854492, "global_step": 205983, "epoch": 1226} {"train_loss": -10.631790161132812, "global_step": 205984, "epoch": 1226} {"train_loss": -11.429431915283203, "global_step": 205985, "epoch": 1226} {"train_loss": -10.789506912231445, "global_step": 205986, "epoch": 1226} {"train_loss": -10.487065315246582, "global_step": 205987, "epoch": 1226} {"train_loss": -11.071460723876953, "global_step": 205988, "epoch": 1226} {"train_loss": -11.168645858764648, "global_step": 205989, "epoch": 1226} {"train_loss": -10.310548782348633, "global_step": 205990, "epoch": 1226} {"train_loss": -11.26690673828125, "global_step": 205991, "epoch": 1226} {"train_loss": -11.182392120361328, "global_step": 205992, "epoch": 1226} {"train_loss": -11.059234619140625, "global_step": 205993, "epoch": 1226} {"train_loss": -11.289846420288086, "global_step": 205994, "epoch": 1226} {"train_loss": -11.411859512329102, "global_step": 205995, "epoch": 1226} {"train_loss": -11.40245532989502, "global_step": 205996, "epoch": 1226} {"train_loss": -11.162403106689453, "global_step": 205997, "epoch": 1226} {"train_loss": -11.568812370300293, "global_step": 205998, "epoch": 1226} {"train_loss": -11.427814483642578, "global_step": 205999, "epoch": 1226} {"train_loss": -11.332919120788574, "global_step": 206000, "epoch": 1226} {"train_loss": -11.247159957885742, "global_step": 206001, "epoch": 1226} {"train_loss": -11.685588836669922, "global_step": 206002, "epoch": 1226} {"train_loss": -11.48503303527832, "global_step": 206003, "epoch": 1226} {"train_loss": -11.734424591064453, "global_step": 206004, "epoch": 1226} {"train_loss": -11.22064208984375, "global_step": 206005, "epoch": 1226} {"train_loss": -11.241451263427734, "global_step": 206006, "epoch": 1226} {"train_loss": -10.796468734741211, "global_step": 206007, "epoch": 1226} {"train_loss": -10.165639877319336, "global_step": 206008, "epoch": 1226} {"train_loss": -10.788138389587402, "global_step": 206009, "epoch": 1226} {"train_loss": -10.165708541870117, "global_step": 206010, "epoch": 1226} {"train_loss": -10.97629165649414, "global_step": 206011, "epoch": 1226} {"train_loss": -11.034765243530273, "global_step": 206012, "epoch": 1226} {"train_loss": -10.75704574584961, "global_step": 206013, "epoch": 1226} {"train_loss": -11.055602073669434, "global_step": 206014, "epoch": 1226} {"train_loss": -11.21603775024414, "global_step": 206015, "epoch": 1226} {"train_loss": -11.301264762878418, "global_step": 206016, "epoch": 1226} {"train_loss": -10.516865730285645, "global_step": 206017, "epoch": 1226} {"train_loss": -11.376693725585938, "global_step": 206018, "epoch": 1226} {"train_loss": -10.846925735473633, "global_step": 206019, "epoch": 1226} {"train_loss": -11.153585433959961, "global_step": 206020, "epoch": 1226} {"train_loss": -10.93857192993164, "global_step": 206021, "epoch": 1226} {"train_loss": -10.775450706481934, "global_step": 206022, "epoch": 1226} {"train_loss": -11.28909683227539, "global_step": 206023, "epoch": 1226} {"train_loss": -10.660831451416016, "global_step": 206024, "epoch": 1226} {"train_loss": -11.119989395141602, "global_step": 206025, "epoch": 1226} {"train_loss": -10.881843566894531, "global_step": 206026, "epoch": 1226} {"train_loss": -11.13914680480957, "global_step": 206027, "epoch": 1226} {"train_loss": -10.909233093261719, "global_step": 206028, "epoch": 1226} {"train_loss": -11.118069648742676, "global_step": 206029, "epoch": 1226} {"train_loss": -11.110875129699707, "global_step": 206030, "epoch": 1226} {"train_loss": -11.059286117553711, "global_step": 206031, "epoch": 1226} {"train_loss": -10.814571380615234, "global_step": 206032, "epoch": 1226} {"train_loss": -11.242042541503906, "global_step": 206033, "epoch": 1226} {"train_loss": -10.903020858764648, "global_step": 206034, "epoch": 1226} {"train_loss": -11.554697036743164, "global_step": 206035, "epoch": 1226} {"train_loss": -11.09178352355957, "global_step": 206036, "epoch": 1226} {"train_loss": -11.479606628417969, "global_step": 206037, "epoch": 1226} {"train_loss": -11.445867538452148, "global_step": 206038, "epoch": 1226} {"train_loss": -11.435785293579102, "global_step": 206039, "epoch": 1226} {"train_loss": -11.524707794189453, "global_step": 206040, "epoch": 1226} {"train_loss": -11.508983612060547, "global_step": 206041, "epoch": 1226} {"train_loss": -11.57303237915039, "global_step": 206042, "epoch": 1226} {"train_loss": -11.424070358276367, "global_step": 206043, "epoch": 1226} {"train_loss": -11.38084602355957, "global_step": 206044, "epoch": 1226} {"train_loss": -11.524120330810547, "global_step": 206045, "epoch": 1226} {"train_loss": -11.38292407989502, "global_step": 206046, "epoch": 1226} {"train_loss": -11.535042762756348, "global_step": 206047, "epoch": 1226} {"train_loss": -11.516138076782227, "global_step": 206048, "epoch": 1226} {"train_loss": -11.799528121948242, "global_step": 206049, "epoch": 1226} {"train_loss": -11.477130889892578, "global_step": 206050, "epoch": 1226} {"train_loss": -11.515325546264648, "global_step": 206051, "epoch": 1226} {"train_loss": -11.432424545288086, "global_step": 206052, "epoch": 1226} {"train_loss": -11.5483980178833, "global_step": 206053, "epoch": 1226} {"train_loss": -11.504043579101562, "global_step": 206054, "epoch": 1226} {"train_loss": -11.656503677368164, "global_step": 206055, "epoch": 1226} {"train_loss": -11.631902694702148, "global_step": 206056, "epoch": 1226} {"train_loss": -11.413975715637207, "global_step": 206057, "epoch": 1226} {"train_loss": -11.43599796295166, "global_step": 206058, "epoch": 1226} {"train_loss": -11.600675582885742, "global_step": 206059, "epoch": 1226} {"train_loss": -11.46190357208252, "global_step": 206060, "epoch": 1226} {"train_loss": -11.663454055786133, "global_step": 206061, "epoch": 1226} {"train_loss": -11.609195709228516, "global_step": 206062, "epoch": 1226} {"train_loss": -11.603279113769531, "global_step": 206063, "epoch": 1226} {"train_loss": -11.485393524169922, "global_step": 206064, "epoch": 1226} {"train_loss": -11.484146118164062, "global_step": 206065, "epoch": 1226} {"train_loss": -11.514756202697754, "global_step": 206066, "epoch": 1226} {"train_loss": -11.663880348205566, "global_step": 206067, "epoch": 1226} {"train_loss": -11.585258483886719, "global_step": 206068, "epoch": 1226} {"train_loss": -11.538482666015625, "global_step": 206069, "epoch": 1226} {"train_loss": -11.639427185058594, "global_step": 206070, "epoch": 1226} {"train_loss": -11.585261344909668, "global_step": 206071, "epoch": 1226} {"train_loss": -11.51956558227539, "global_step": 206072, "epoch": 1226} {"train_loss": -11.573415756225586, "global_step": 206073, "epoch": 1226} {"train_loss": -11.078678131103516, "global_step": 206074, "epoch": 1226} {"train_loss": -11.66883659362793, "global_step": 206075, "epoch": 1226} {"train_loss": -11.105878829956055, "global_step": 206076, "epoch": 1226} {"train_loss": -10.465303421020508, "global_step": 206077, "epoch": 1226} {"train_loss": -11.782087326049805, "global_step": 206078, "epoch": 1226} {"train_loss": -11.002593994140625, "global_step": 206079, "epoch": 1226} {"train_loss": -10.571748733520508, "global_step": 206080, "epoch": 1226} {"train_loss": -11.426597595214844, "global_step": 206081, "epoch": 1226} {"train_loss": -11.048202514648438, "global_step": 206082, "epoch": 1226} {"train_loss": -11.084875106811523, "global_step": 206083, "epoch": 1226} {"train_loss": -11.263198852539062, "global_step": 206084, "epoch": 1226} {"train_loss": -10.982303619384766, "global_step": 206085, "epoch": 1226} {"train_loss": -10.995887756347656, "global_step": 206086, "epoch": 1226} {"train_loss": -10.911842346191406, "global_step": 206087, "epoch": 1226} {"train_loss": -11.43432903289795, "global_step": 206088, "epoch": 1226} {"train_loss": -11.220658302307129, "global_step": 206089, "epoch": 1226} {"train_loss": -11.369651794433594, "global_step": 206090, "epoch": 1226} {"train_loss": -10.897991180419922, "global_step": 206091, "epoch": 1226} {"train_loss": -11.365522384643555, "global_step": 206092, "epoch": 1226} {"train_loss": -10.794622421264648, "global_step": 206093, "epoch": 1226} {"train_loss": -11.251376152038574, "global_step": 206094, "epoch": 1226} {"train_loss": -11.257817268371582, "global_step": 206095, "epoch": 1226} {"train_loss": -11.138009071350098, "global_step": 206096, "epoch": 1226} {"train_loss": -11.173463821411133, "global_step": 206097, "epoch": 1226} {"train_loss": -11.034976959228516, "global_step": 206098, "epoch": 1226} {"train_loss": -11.552301406860352, "global_step": 206099, "epoch": 1226} {"train_loss": -10.821183204650879, "global_step": 206100, "epoch": 1226} {"train_loss": -11.296748161315918, "global_step": 206101, "epoch": 1226} {"train_loss": -11.457138061523438, "global_step": 206102, "epoch": 1226} {"train_loss": -11.245955467224121, "global_step": 206103, "epoch": 1226} {"train_loss": -11.481073379516602, "global_step": 206104, "epoch": 1226} {"train_loss": -11.506828308105469, "global_step": 206105, "epoch": 1226} {"train_loss": -11.366037368774414, "global_step": 206106, "epoch": 1226} {"train_loss": -11.46110725402832, "global_step": 206107, "epoch": 1226} {"train_loss": -11.183744430541992, "global_step": 206108, "epoch": 1226} {"train_loss": -11.409831047058105, "global_step": 206109, "epoch": 1226} {"train_loss": -11.372398376464844, "global_step": 206110, "epoch": 1226} {"train_loss": -11.434266090393066, "global_step": 206111, "epoch": 1226} {"train_loss": -11.38919734954834, "global_step": 206112, "epoch": 1226} {"train_loss": -11.406335830688477, "global_step": 206113, "epoch": 1226} {"train_loss": -11.576395034790039, "global_step": 206114, "epoch": 1226} {"train_loss": -11.165834426879883, "global_step": 206115, "epoch": 1226} {"train_loss": -11.356481552124023, "global_step": 206116, "epoch": 1226} {"train_loss": -11.733012199401855, "global_step": 206117, "epoch": 1226} {"train_loss": -11.554676055908203, "global_step": 206118, "epoch": 1226} {"train_loss": -11.434503555297852, "global_step": 206119, "epoch": 1226} {"train_loss": -11.315866470336914, "global_step": 206120, "epoch": 1226} {"train_loss": -11.583332061767578, "global_step": 206121, "epoch": 1226} {"train_loss": -11.379929542541504, "global_step": 206122, "epoch": 1226} {"train_loss": -11.271587371826172, "global_step": 206123, "epoch": 1226} {"train_loss": -11.607643127441406, "global_step": 206124, "epoch": 1226} {"train_loss": -11.18893051147461, "global_step": 206125, "epoch": 1226} {"train_loss": -11.380863189697266, "global_step": 206126, "epoch": 1226} {"train_loss": -11.67270278930664, "global_step": 206127, "epoch": 1226} {"train_loss": -11.622133255004883, "global_step": 206128, "epoch": 1226} {"train_loss": -11.531949996948242, "global_step": 206129, "epoch": 1226} {"train_loss": -11.567739486694336, "global_step": 206130, "epoch": 1226} {"train_loss": -11.515565872192383, "global_step": 206131, "epoch": 1226} {"train_loss": -11.210071563720703, "global_step": 206132, "epoch": 1226} {"train_loss": -11.501380920410156, "global_step": 206133, "epoch": 1226} {"train_loss": -11.694149017333984, "global_step": 206134, "epoch": 1226} {"train_loss": -11.276566670054482, "global_step": 206135, "epoch": 1226, "val_loss": 250643.84375} {"train_loss": -11.587791442871094, "global_step": 206136, "epoch": 1227} {"train_loss": -11.436258316040039, "global_step": 206137, "epoch": 1227} {"train_loss": -11.567588806152344, "global_step": 206138, "epoch": 1227} {"train_loss": -11.21190071105957, "global_step": 206139, "epoch": 1227} {"train_loss": -11.417683601379395, "global_step": 206140, "epoch": 1227} {"train_loss": -11.720210075378418, "global_step": 206141, "epoch": 1227} {"train_loss": -11.234498977661133, "global_step": 206142, "epoch": 1227} {"train_loss": -11.591972351074219, "global_step": 206143, "epoch": 1227} {"train_loss": -11.295453071594238, "global_step": 206144, "epoch": 1227} {"train_loss": -11.045119285583496, "global_step": 206145, "epoch": 1227} {"train_loss": -11.658567428588867, "global_step": 206146, "epoch": 1227} {"train_loss": -10.76572036743164, "global_step": 206147, "epoch": 1227} {"train_loss": -11.538217544555664, "global_step": 206148, "epoch": 1227} {"train_loss": -10.820696830749512, "global_step": 206149, "epoch": 1227} {"train_loss": -11.534998893737793, "global_step": 206150, "epoch": 1227} {"train_loss": -11.003128051757812, "global_step": 206151, "epoch": 1227} {"train_loss": -11.084468841552734, "global_step": 206152, "epoch": 1227} {"train_loss": -10.891496658325195, "global_step": 206153, "epoch": 1227} {"train_loss": -11.486982345581055, "global_step": 206154, "epoch": 1227} {"train_loss": -10.804864883422852, "global_step": 206155, "epoch": 1227} {"train_loss": -11.379898071289062, "global_step": 206156, "epoch": 1227} {"train_loss": -11.198272705078125, "global_step": 206157, "epoch": 1227} {"train_loss": -11.239879608154297, "global_step": 206158, "epoch": 1227} {"train_loss": -11.22143840789795, "global_step": 206159, "epoch": 1227} {"train_loss": -10.041627883911133, "global_step": 206160, "epoch": 1227} {"train_loss": -11.131378173828125, "global_step": 206161, "epoch": 1227} {"train_loss": -10.80069351196289, "global_step": 206162, "epoch": 1227} {"train_loss": -10.438554763793945, "global_step": 206163, "epoch": 1227} {"train_loss": -11.220682144165039, "global_step": 206164, "epoch": 1227} {"train_loss": -11.169685363769531, "global_step": 206165, "epoch": 1227} {"train_loss": -10.796331405639648, "global_step": 206166, "epoch": 1227} {"train_loss": -11.043268203735352, "global_step": 206167, "epoch": 1227} {"train_loss": -10.027952194213867, "global_step": 206168, "epoch": 1227} {"train_loss": -11.145318984985352, "global_step": 206169, "epoch": 1227} {"train_loss": -11.265867233276367, "global_step": 206170, "epoch": 1227} {"train_loss": -10.889184951782227, "global_step": 206171, "epoch": 1227} {"train_loss": -11.292564392089844, "global_step": 206172, "epoch": 1227} {"train_loss": -10.842351913452148, "global_step": 206173, "epoch": 1227} {"train_loss": -10.734731674194336, "global_step": 206174, "epoch": 1227} {"train_loss": -11.044610023498535, "global_step": 206175, "epoch": 1227} {"train_loss": -10.609002113342285, "global_step": 206176, "epoch": 1227} {"train_loss": -11.369816780090332, "global_step": 206177, "epoch": 1227} {"train_loss": -10.560327529907227, "global_step": 206178, "epoch": 1227} {"train_loss": -11.251575469970703, "global_step": 206179, "epoch": 1227} {"train_loss": -11.11689567565918, "global_step": 206180, "epoch": 1227} {"train_loss": -11.308085441589355, "global_step": 206181, "epoch": 1227} {"train_loss": -10.822823524475098, "global_step": 206182, "epoch": 1227} {"train_loss": -11.173711776733398, "global_step": 206183, "epoch": 1227} {"train_loss": -10.851654052734375, "global_step": 206184, "epoch": 1227} {"train_loss": -11.445290565490723, "global_step": 206185, "epoch": 1227} {"train_loss": -10.727968215942383, "global_step": 206186, "epoch": 1227} {"train_loss": -11.145468711853027, "global_step": 206187, "epoch": 1227} {"train_loss": -10.603752136230469, "global_step": 206188, "epoch": 1227} {"train_loss": -11.098067283630371, "global_step": 206189, "epoch": 1227} {"train_loss": -10.972973823547363, "global_step": 206190, "epoch": 1227} {"train_loss": -10.889708518981934, "global_step": 206191, "epoch": 1227} {"train_loss": -11.286731719970703, "global_step": 206192, "epoch": 1227} {"train_loss": -11.411735534667969, "global_step": 206193, "epoch": 1227} {"train_loss": -11.056145668029785, "global_step": 206194, "epoch": 1227} {"train_loss": -11.395952224731445, "global_step": 206195, "epoch": 1227} {"train_loss": -11.043563842773438, "global_step": 206196, "epoch": 1227} {"train_loss": -11.243648529052734, "global_step": 206197, "epoch": 1227} {"train_loss": -11.033418655395508, "global_step": 206198, "epoch": 1227} {"train_loss": -10.72280216217041, "global_step": 206199, "epoch": 1227} {"train_loss": -11.149799346923828, "global_step": 206200, "epoch": 1227} {"train_loss": -11.233512878417969, "global_step": 206201, "epoch": 1227} {"train_loss": -11.18949031829834, "global_step": 206202, "epoch": 1227} {"train_loss": -11.19087028503418, "global_step": 206203, "epoch": 1227} {"train_loss": -11.492485046386719, "global_step": 206204, "epoch": 1227} {"train_loss": -11.181501388549805, "global_step": 206205, "epoch": 1227} {"train_loss": -11.217920303344727, "global_step": 206206, "epoch": 1227} {"train_loss": -11.2114839553833, "global_step": 206207, "epoch": 1227} {"train_loss": -11.475156784057617, "global_step": 206208, "epoch": 1227} {"train_loss": -11.211177825927734, "global_step": 206209, "epoch": 1227} {"train_loss": -11.381940841674805, "global_step": 206210, "epoch": 1227} {"train_loss": -11.479681968688965, "global_step": 206211, "epoch": 1227} {"train_loss": -11.28383731842041, "global_step": 206212, "epoch": 1227} {"train_loss": -11.54150390625, "global_step": 206213, "epoch": 1227} {"train_loss": -11.396062850952148, "global_step": 206214, "epoch": 1227} {"train_loss": -11.588114738464355, "global_step": 206215, "epoch": 1227} {"train_loss": -11.263994216918945, "global_step": 206216, "epoch": 1227} {"train_loss": -11.466987609863281, "global_step": 206217, "epoch": 1227} {"train_loss": -10.943506240844727, "global_step": 206218, "epoch": 1227} {"train_loss": -11.42835807800293, "global_step": 206219, "epoch": 1227} {"train_loss": -10.752273559570312, "global_step": 206220, "epoch": 1227} {"train_loss": -11.384695053100586, "global_step": 206221, "epoch": 1227} {"train_loss": -11.206483840942383, "global_step": 206222, "epoch": 1227} {"train_loss": -10.722944259643555, "global_step": 206223, "epoch": 1227} {"train_loss": -11.47795295715332, "global_step": 206224, "epoch": 1227} {"train_loss": -10.874601364135742, "global_step": 206225, "epoch": 1227} {"train_loss": -11.470987319946289, "global_step": 206226, "epoch": 1227} {"train_loss": -10.925827980041504, "global_step": 206227, "epoch": 1227} {"train_loss": -11.595024108886719, "global_step": 206228, "epoch": 1227} {"train_loss": -11.59805679321289, "global_step": 206229, "epoch": 1227} {"train_loss": -11.501941680908203, "global_step": 206230, "epoch": 1227} {"train_loss": -11.529563903808594, "global_step": 206231, "epoch": 1227} {"train_loss": -11.45138931274414, "global_step": 206232, "epoch": 1227} {"train_loss": -11.7147216796875, "global_step": 206233, "epoch": 1227} {"train_loss": -11.56920051574707, "global_step": 206234, "epoch": 1227} {"train_loss": -11.431703567504883, "global_step": 206235, "epoch": 1227} {"train_loss": -11.864500999450684, "global_step": 206236, "epoch": 1227} {"train_loss": -11.754911422729492, "global_step": 206237, "epoch": 1227} {"train_loss": -11.394588470458984, "global_step": 206238, "epoch": 1227} {"train_loss": -11.784895896911621, "global_step": 206239, "epoch": 1227} {"train_loss": -11.92686653137207, "global_step": 206240, "epoch": 1227} {"train_loss": -11.605506896972656, "global_step": 206241, "epoch": 1227} {"train_loss": -11.714941024780273, "global_step": 206242, "epoch": 1227} {"train_loss": -11.666688919067383, "global_step": 206243, "epoch": 1227} {"train_loss": -11.72756576538086, "global_step": 206244, "epoch": 1227} {"train_loss": -11.59681510925293, "global_step": 206245, "epoch": 1227} {"train_loss": -11.705756187438965, "global_step": 206246, "epoch": 1227} {"train_loss": -11.765841484069824, "global_step": 206247, "epoch": 1227} {"train_loss": -11.76352310180664, "global_step": 206248, "epoch": 1227} {"train_loss": -11.757156372070312, "global_step": 206249, "epoch": 1227} {"train_loss": -11.674881935119629, "global_step": 206250, "epoch": 1227} {"train_loss": -11.571916580200195, "global_step": 206251, "epoch": 1227} {"train_loss": -11.545366287231445, "global_step": 206252, "epoch": 1227} {"train_loss": -11.672725677490234, "global_step": 206253, "epoch": 1227} {"train_loss": -11.688701629638672, "global_step": 206254, "epoch": 1227} {"train_loss": -11.867019653320312, "global_step": 206255, "epoch": 1227} {"train_loss": -11.766195297241211, "global_step": 206256, "epoch": 1227} {"train_loss": -11.578170776367188, "global_step": 206257, "epoch": 1227} {"train_loss": -11.669225692749023, "global_step": 206258, "epoch": 1227} {"train_loss": -11.58864974975586, "global_step": 206259, "epoch": 1227} {"train_loss": -11.637569427490234, "global_step": 206260, "epoch": 1227} {"train_loss": -11.776199340820312, "global_step": 206261, "epoch": 1227} {"train_loss": -12.089985847473145, "global_step": 206262, "epoch": 1227} {"train_loss": -11.59786605834961, "global_step": 206263, "epoch": 1227} {"train_loss": -11.776287078857422, "global_step": 206264, "epoch": 1227} {"train_loss": -11.757763862609863, "global_step": 206265, "epoch": 1227} {"train_loss": -11.683761596679688, "global_step": 206266, "epoch": 1227} {"train_loss": -11.810523986816406, "global_step": 206267, "epoch": 1227} {"train_loss": -11.925549507141113, "global_step": 206268, "epoch": 1227} {"train_loss": -11.647262573242188, "global_step": 206269, "epoch": 1227} {"train_loss": -11.469923973083496, "global_step": 206270, "epoch": 1227} {"train_loss": -11.397560119628906, "global_step": 206271, "epoch": 1227} {"train_loss": -11.721055030822754, "global_step": 206272, "epoch": 1227} {"train_loss": -11.193765640258789, "global_step": 206273, "epoch": 1227} {"train_loss": -10.672134399414062, "global_step": 206274, "epoch": 1227} {"train_loss": -11.322388648986816, "global_step": 206275, "epoch": 1227} {"train_loss": -11.688767433166504, "global_step": 206276, "epoch": 1227} {"train_loss": -11.381338119506836, "global_step": 206277, "epoch": 1227} {"train_loss": -11.539796829223633, "global_step": 206278, "epoch": 1227} {"train_loss": -11.508455276489258, "global_step": 206279, "epoch": 1227} {"train_loss": -11.089130401611328, "global_step": 206280, "epoch": 1227} {"train_loss": -10.817994117736816, "global_step": 206281, "epoch": 1227} {"train_loss": -10.964617729187012, "global_step": 206282, "epoch": 1227} {"train_loss": -9.883910179138184, "global_step": 206283, "epoch": 1227} {"train_loss": -11.245641708374023, "global_step": 206284, "epoch": 1227} {"train_loss": -10.597652435302734, "global_step": 206285, "epoch": 1227} {"train_loss": -10.608338356018066, "global_step": 206286, "epoch": 1227} {"train_loss": -11.03614616394043, "global_step": 206287, "epoch": 1227} {"train_loss": -10.852470397949219, "global_step": 206288, "epoch": 1227} {"train_loss": -11.148674011230469, "global_step": 206289, "epoch": 1227} {"train_loss": -10.644346237182617, "global_step": 206290, "epoch": 1227} {"train_loss": -11.345664978027344, "global_step": 206291, "epoch": 1227} {"train_loss": -10.790586471557617, "global_step": 206292, "epoch": 1227} {"train_loss": -10.467373847961426, "global_step": 206293, "epoch": 1227} {"train_loss": -11.107487678527832, "global_step": 206294, "epoch": 1227} {"train_loss": -10.094247817993164, "global_step": 206295, "epoch": 1227} {"train_loss": -11.318340301513672, "global_step": 206296, "epoch": 1227} {"train_loss": -10.755731582641602, "global_step": 206297, "epoch": 1227} {"train_loss": -10.904650688171387, "global_step": 206298, "epoch": 1227} {"train_loss": -10.61695384979248, "global_step": 206299, "epoch": 1227} {"train_loss": -10.979692459106445, "global_step": 206300, "epoch": 1227} {"train_loss": -10.847335815429688, "global_step": 206301, "epoch": 1227} {"train_loss": -10.786324501037598, "global_step": 206302, "epoch": 1227} {"train_loss": -11.244119570368813, "global_step": 206303, "epoch": 1227, "val_loss": 254109.96875} {"train_loss": -10.735292434692383, "global_step": 206304, "epoch": 1228} {"train_loss": -10.46332836151123, "global_step": 206305, "epoch": 1228} {"train_loss": -11.290513038635254, "global_step": 206306, "epoch": 1228} {"train_loss": -10.753939628601074, "global_step": 206307, "epoch": 1228} {"train_loss": -10.989614486694336, "global_step": 206308, "epoch": 1228} {"train_loss": -11.065207481384277, "global_step": 206309, "epoch": 1228} {"train_loss": -10.365327835083008, "global_step": 206310, "epoch": 1228} {"train_loss": -10.974081039428711, "global_step": 206311, "epoch": 1228} {"train_loss": -10.764690399169922, "global_step": 206312, "epoch": 1228} {"train_loss": -11.341564178466797, "global_step": 206313, "epoch": 1228} {"train_loss": -10.891260147094727, "global_step": 206314, "epoch": 1228} {"train_loss": -11.057833671569824, "global_step": 206315, "epoch": 1228} {"train_loss": -10.764368057250977, "global_step": 206316, "epoch": 1228} {"train_loss": -11.219696998596191, "global_step": 206317, "epoch": 1228} {"train_loss": -9.820722579956055, "global_step": 206318, "epoch": 1228} {"train_loss": -11.40422534942627, "global_step": 206319, "epoch": 1228} {"train_loss": -10.535259246826172, "global_step": 206320, "epoch": 1228} {"train_loss": -11.229984283447266, "global_step": 206321, "epoch": 1228} {"train_loss": -10.733491897583008, "global_step": 206322, "epoch": 1228} {"train_loss": -10.886898040771484, "global_step": 206323, "epoch": 1228} {"train_loss": -10.622136116027832, "global_step": 206324, "epoch": 1228} {"train_loss": -10.139263153076172, "global_step": 206325, "epoch": 1228} {"train_loss": -10.209929466247559, "global_step": 206326, "epoch": 1228} {"train_loss": -10.659671783447266, "global_step": 206327, "epoch": 1228} {"train_loss": -10.834434509277344, "global_step": 206328, "epoch": 1228} {"train_loss": -11.007569313049316, "global_step": 206329, "epoch": 1228} {"train_loss": -10.932381629943848, "global_step": 206330, "epoch": 1228} {"train_loss": -10.938699722290039, "global_step": 206331, "epoch": 1228} {"train_loss": -11.312292098999023, "global_step": 206332, "epoch": 1228} {"train_loss": -10.634346008300781, "global_step": 206333, "epoch": 1228} {"train_loss": -10.751067161560059, "global_step": 206334, "epoch": 1228} {"train_loss": -11.462742805480957, "global_step": 206335, "epoch": 1228} {"train_loss": -10.626483917236328, "global_step": 206336, "epoch": 1228} {"train_loss": -11.400062561035156, "global_step": 206337, "epoch": 1228} {"train_loss": -10.938152313232422, "global_step": 206338, "epoch": 1228} {"train_loss": -11.068193435668945, "global_step": 206339, "epoch": 1228} {"train_loss": -11.283907890319824, "global_step": 206340, "epoch": 1228} {"train_loss": -11.074275016784668, "global_step": 206341, "epoch": 1228} {"train_loss": -11.027044296264648, "global_step": 206342, "epoch": 1228} {"train_loss": -11.481135368347168, "global_step": 206343, "epoch": 1228} {"train_loss": -11.2327880859375, "global_step": 206344, "epoch": 1228} {"train_loss": -10.982934951782227, "global_step": 206345, "epoch": 1228} {"train_loss": -11.391079902648926, "global_step": 206346, "epoch": 1228} {"train_loss": -11.29220962524414, "global_step": 206347, "epoch": 1228} {"train_loss": -11.209794044494629, "global_step": 206348, "epoch": 1228} {"train_loss": -11.451949119567871, "global_step": 206349, "epoch": 1228} {"train_loss": -11.270830154418945, "global_step": 206350, "epoch": 1228} {"train_loss": -11.339847564697266, "global_step": 206351, "epoch": 1228} {"train_loss": -11.423367500305176, "global_step": 206352, "epoch": 1228} {"train_loss": -11.596856117248535, "global_step": 206353, "epoch": 1228} {"train_loss": -11.565190315246582, "global_step": 206354, "epoch": 1228} {"train_loss": -11.554696083068848, "global_step": 206355, "epoch": 1228} {"train_loss": -11.628959655761719, "global_step": 206356, "epoch": 1228} {"train_loss": -11.611751556396484, "global_step": 206357, "epoch": 1228} {"train_loss": -11.468433380126953, "global_step": 206358, "epoch": 1228} {"train_loss": -11.591102600097656, "global_step": 206359, "epoch": 1228} {"train_loss": -11.346538543701172, "global_step": 206360, "epoch": 1228} {"train_loss": -11.497036933898926, "global_step": 206361, "epoch": 1228} {"train_loss": -11.45449447631836, "global_step": 206362, "epoch": 1228} {"train_loss": -11.523260116577148, "global_step": 206363, "epoch": 1228} {"train_loss": -11.66004753112793, "global_step": 206364, "epoch": 1228} {"train_loss": -11.363273620605469, "global_step": 206365, "epoch": 1228} {"train_loss": -11.6695556640625, "global_step": 206366, "epoch": 1228} {"train_loss": -11.54885482788086, "global_step": 206367, "epoch": 1228} {"train_loss": -11.719819068908691, "global_step": 206368, "epoch": 1228} {"train_loss": -11.660358428955078, "global_step": 206369, "epoch": 1228} {"train_loss": -11.729288101196289, "global_step": 206370, "epoch": 1228} {"train_loss": -11.683113098144531, "global_step": 206371, "epoch": 1228} {"train_loss": -11.777125358581543, "global_step": 206372, "epoch": 1228} {"train_loss": -11.748374938964844, "global_step": 206373, "epoch": 1228} {"train_loss": -11.75218391418457, "global_step": 206374, "epoch": 1228} {"train_loss": -11.688111305236816, "global_step": 206375, "epoch": 1228} {"train_loss": -11.901551246643066, "global_step": 206376, "epoch": 1228} {"train_loss": -11.727029800415039, "global_step": 206377, "epoch": 1228} {"train_loss": -11.646245956420898, "global_step": 206378, "epoch": 1228} {"train_loss": -11.826098442077637, "global_step": 206379, "epoch": 1228} {"train_loss": -11.722246170043945, "global_step": 206380, "epoch": 1228} {"train_loss": -11.860760688781738, "global_step": 206381, "epoch": 1228} {"train_loss": -11.813688278198242, "global_step": 206382, "epoch": 1228} {"train_loss": -11.969575881958008, "global_step": 206383, "epoch": 1228} {"train_loss": -11.95082950592041, "global_step": 206384, "epoch": 1228} {"train_loss": -11.901100158691406, "global_step": 206385, "epoch": 1228} {"train_loss": -11.81875228881836, "global_step": 206386, "epoch": 1228} {"train_loss": -11.79115104675293, "global_step": 206387, "epoch": 1228} {"train_loss": -11.96728801727295, "global_step": 206388, "epoch": 1228} {"train_loss": -11.741381645202637, "global_step": 206389, "epoch": 1228} {"train_loss": -11.974320411682129, "global_step": 206390, "epoch": 1228} {"train_loss": -11.718315124511719, "global_step": 206391, "epoch": 1228} {"train_loss": -11.254124641418457, "global_step": 206392, "epoch": 1228} {"train_loss": -11.465248107910156, "global_step": 206393, "epoch": 1228} {"train_loss": -11.581976890563965, "global_step": 206394, "epoch": 1228} {"train_loss": -11.47916030883789, "global_step": 206395, "epoch": 1228} {"train_loss": -11.58190631866455, "global_step": 206396, "epoch": 1228} {"train_loss": -11.725078582763672, "global_step": 206397, "epoch": 1228} {"train_loss": -11.646724700927734, "global_step": 206398, "epoch": 1228} {"train_loss": -12.001725196838379, "global_step": 206399, "epoch": 1228} {"train_loss": -10.857881546020508, "global_step": 206400, "epoch": 1228} {"train_loss": -10.581246376037598, "global_step": 206401, "epoch": 1228} {"train_loss": -10.206509590148926, "global_step": 206402, "epoch": 1228} {"train_loss": -11.076131820678711, "global_step": 206403, "epoch": 1228} {"train_loss": -10.36858081817627, "global_step": 206404, "epoch": 1228} {"train_loss": -9.733318328857422, "global_step": 206405, "epoch": 1228} {"train_loss": -10.441998481750488, "global_step": 206406, "epoch": 1228} {"train_loss": -11.046670913696289, "global_step": 206407, "epoch": 1228} {"train_loss": -11.247196197509766, "global_step": 206408, "epoch": 1228} {"train_loss": -11.426344871520996, "global_step": 206409, "epoch": 1228} {"train_loss": -11.150622367858887, "global_step": 206410, "epoch": 1228} {"train_loss": -11.377236366271973, "global_step": 206411, "epoch": 1228} {"train_loss": -11.754563331604004, "global_step": 206412, "epoch": 1228} {"train_loss": -11.30746078491211, "global_step": 206413, "epoch": 1228} {"train_loss": -11.395279884338379, "global_step": 206414, "epoch": 1228} {"train_loss": -11.483609199523926, "global_step": 206415, "epoch": 1228} {"train_loss": -11.70235538482666, "global_step": 206416, "epoch": 1228} {"train_loss": -11.571876525878906, "global_step": 206417, "epoch": 1228} {"train_loss": -11.400135040283203, "global_step": 206418, "epoch": 1228} {"train_loss": -11.639368057250977, "global_step": 206419, "epoch": 1228} {"train_loss": -11.805625915527344, "global_step": 206420, "epoch": 1228} {"train_loss": -11.593976974487305, "global_step": 206421, "epoch": 1228} {"train_loss": -11.577146530151367, "global_step": 206422, "epoch": 1228} {"train_loss": -11.410999298095703, "global_step": 206423, "epoch": 1228} {"train_loss": -11.733081817626953, "global_step": 206424, "epoch": 1228} {"train_loss": -11.461227416992188, "global_step": 206425, "epoch": 1228} {"train_loss": -11.503288269042969, "global_step": 206426, "epoch": 1228} {"train_loss": -11.036206245422363, "global_step": 206427, "epoch": 1228} {"train_loss": -11.452690124511719, "global_step": 206428, "epoch": 1228} {"train_loss": -11.665995597839355, "global_step": 206429, "epoch": 1228} {"train_loss": -11.654516220092773, "global_step": 206430, "epoch": 1228} {"train_loss": -11.65842056274414, "global_step": 206431, "epoch": 1228} {"train_loss": -11.400545120239258, "global_step": 206432, "epoch": 1228} {"train_loss": -11.522248268127441, "global_step": 206433, "epoch": 1228} {"train_loss": -11.654345512390137, "global_step": 206434, "epoch": 1228} {"train_loss": -11.308046340942383, "global_step": 206435, "epoch": 1228} {"train_loss": -11.493602752685547, "global_step": 206436, "epoch": 1228} {"train_loss": -11.169654846191406, "global_step": 206437, "epoch": 1228} {"train_loss": -11.242704391479492, "global_step": 206438, "epoch": 1228} {"train_loss": -11.545132637023926, "global_step": 206439, "epoch": 1228} {"train_loss": -11.230537414550781, "global_step": 206440, "epoch": 1228} {"train_loss": -11.260743141174316, "global_step": 206441, "epoch": 1228} {"train_loss": -10.833852767944336, "global_step": 206442, "epoch": 1228} {"train_loss": -10.349308013916016, "global_step": 206443, "epoch": 1228} {"train_loss": -11.44912338256836, "global_step": 206444, "epoch": 1228} {"train_loss": -10.176127433776855, "global_step": 206445, "epoch": 1228} {"train_loss": -11.236566543579102, "global_step": 206446, "epoch": 1228} {"train_loss": -10.838624000549316, "global_step": 206447, "epoch": 1228} {"train_loss": -11.37430191040039, "global_step": 206448, "epoch": 1228} {"train_loss": -10.597838401794434, "global_step": 206449, "epoch": 1228} {"train_loss": -10.911989212036133, "global_step": 206450, "epoch": 1228} {"train_loss": -11.030570030212402, "global_step": 206451, "epoch": 1228} {"train_loss": -11.048089981079102, "global_step": 206452, "epoch": 1228} {"train_loss": -11.060956001281738, "global_step": 206453, "epoch": 1228} {"train_loss": -11.365589141845703, "global_step": 206454, "epoch": 1228} {"train_loss": -10.606378555297852, "global_step": 206455, "epoch": 1228} {"train_loss": -11.424027442932129, "global_step": 206456, "epoch": 1228} {"train_loss": -10.855594635009766, "global_step": 206457, "epoch": 1228} {"train_loss": -11.40342903137207, "global_step": 206458, "epoch": 1228} {"train_loss": -11.07685375213623, "global_step": 206459, "epoch": 1228} {"train_loss": -11.208465576171875, "global_step": 206460, "epoch": 1228} {"train_loss": -11.277430534362793, "global_step": 206461, "epoch": 1228} {"train_loss": -11.401987075805664, "global_step": 206462, "epoch": 1228} {"train_loss": -11.37620735168457, "global_step": 206463, "epoch": 1228} {"train_loss": -11.071185111999512, "global_step": 206464, "epoch": 1228} {"train_loss": -11.455856323242188, "global_step": 206465, "epoch": 1228} {"train_loss": -11.519761085510254, "global_step": 206466, "epoch": 1228} {"train_loss": -11.272472381591797, "global_step": 206467, "epoch": 1228} {"train_loss": -11.527814865112305, "global_step": 206468, "epoch": 1228} {"train_loss": -11.189444541931152, "global_step": 206469, "epoch": 1228} {"train_loss": -11.599321365356445, "global_step": 206470, "epoch": 1228} {"train_loss": -11.271112056005569, "global_step": 206471, "epoch": 1228, "val_loss": 254446.96875} {"train_loss": -11.255017280578613, "global_step": 206472, "epoch": 1229} {"train_loss": -10.197598457336426, "global_step": 206473, "epoch": 1229} {"train_loss": -11.42149543762207, "global_step": 206474, "epoch": 1229} {"train_loss": -10.78400707244873, "global_step": 206475, "epoch": 1229} {"train_loss": -11.108973503112793, "global_step": 206476, "epoch": 1229} {"train_loss": -11.44327163696289, "global_step": 206477, "epoch": 1229} {"train_loss": -10.584550857543945, "global_step": 206478, "epoch": 1229} {"train_loss": -11.399876594543457, "global_step": 206479, "epoch": 1229} {"train_loss": -10.650407791137695, "global_step": 206480, "epoch": 1229} {"train_loss": -11.547126770019531, "global_step": 206481, "epoch": 1229} {"train_loss": -10.877220153808594, "global_step": 206482, "epoch": 1229} {"train_loss": -11.334685325622559, "global_step": 206483, "epoch": 1229} {"train_loss": -11.173942565917969, "global_step": 206484, "epoch": 1229} {"train_loss": -11.07083511352539, "global_step": 206485, "epoch": 1229} {"train_loss": -11.536190032958984, "global_step": 206486, "epoch": 1229} {"train_loss": -11.09945297241211, "global_step": 206487, "epoch": 1229} {"train_loss": -11.54024887084961, "global_step": 206488, "epoch": 1229} {"train_loss": -11.337422370910645, "global_step": 206489, "epoch": 1229} {"train_loss": -11.072977066040039, "global_step": 206490, "epoch": 1229} {"train_loss": -11.638439178466797, "global_step": 206491, "epoch": 1229} {"train_loss": -10.797182083129883, "global_step": 206492, "epoch": 1229} {"train_loss": -11.61085033416748, "global_step": 206493, "epoch": 1229} {"train_loss": -11.051656723022461, "global_step": 206494, "epoch": 1229} {"train_loss": -11.171686172485352, "global_step": 206495, "epoch": 1229} {"train_loss": -11.508307456970215, "global_step": 206496, "epoch": 1229} {"train_loss": -11.001895904541016, "global_step": 206497, "epoch": 1229} {"train_loss": -11.603063583374023, "global_step": 206498, "epoch": 1229} {"train_loss": -11.373933792114258, "global_step": 206499, "epoch": 1229} {"train_loss": -11.514189720153809, "global_step": 206500, "epoch": 1229} {"train_loss": -11.545236587524414, "global_step": 206501, "epoch": 1229} {"train_loss": -11.406582832336426, "global_step": 206502, "epoch": 1229} {"train_loss": -11.703832626342773, "global_step": 206503, "epoch": 1229} {"train_loss": -11.4807710647583, "global_step": 206504, "epoch": 1229} {"train_loss": -11.361902236938477, "global_step": 206505, "epoch": 1229} {"train_loss": -11.55168342590332, "global_step": 206506, "epoch": 1229} {"train_loss": -11.088157653808594, "global_step": 206507, "epoch": 1229} {"train_loss": -11.789261817932129, "global_step": 206508, "epoch": 1229} {"train_loss": -11.634016036987305, "global_step": 206509, "epoch": 1229} {"train_loss": -11.736600875854492, "global_step": 206510, "epoch": 1229} {"train_loss": -11.790050506591797, "global_step": 206511, "epoch": 1229} {"train_loss": -11.592325210571289, "global_step": 206512, "epoch": 1229} {"train_loss": -11.619773864746094, "global_step": 206513, "epoch": 1229} {"train_loss": -11.788058280944824, "global_step": 206514, "epoch": 1229} {"train_loss": -11.54203987121582, "global_step": 206515, "epoch": 1229} {"train_loss": -11.747427940368652, "global_step": 206516, "epoch": 1229} {"train_loss": -11.485076904296875, "global_step": 206517, "epoch": 1229} {"train_loss": -11.737812995910645, "global_step": 206518, "epoch": 1229} {"train_loss": -11.740800857543945, "global_step": 206519, "epoch": 1229} {"train_loss": -11.602765083312988, "global_step": 206520, "epoch": 1229} {"train_loss": -11.603275299072266, "global_step": 206521, "epoch": 1229} {"train_loss": -11.710122108459473, "global_step": 206522, "epoch": 1229} {"train_loss": -11.774791717529297, "global_step": 206523, "epoch": 1229} {"train_loss": -11.515071868896484, "global_step": 206524, "epoch": 1229} {"train_loss": -11.475704193115234, "global_step": 206525, "epoch": 1229} {"train_loss": -11.880402565002441, "global_step": 206526, "epoch": 1229} {"train_loss": -11.47076416015625, "global_step": 206527, "epoch": 1229} {"train_loss": -11.397987365722656, "global_step": 206528, "epoch": 1229} {"train_loss": -11.652610778808594, "global_step": 206529, "epoch": 1229} {"train_loss": -10.809539794921875, "global_step": 206530, "epoch": 1229} {"train_loss": -10.986188888549805, "global_step": 206531, "epoch": 1229} {"train_loss": -11.630834579467773, "global_step": 206532, "epoch": 1229} {"train_loss": -11.068674087524414, "global_step": 206533, "epoch": 1229} {"train_loss": -11.623212814331055, "global_step": 206534, "epoch": 1229} {"train_loss": -11.523466110229492, "global_step": 206535, "epoch": 1229} {"train_loss": -11.435547828674316, "global_step": 206536, "epoch": 1229} {"train_loss": -11.64926528930664, "global_step": 206537, "epoch": 1229} {"train_loss": -11.665897369384766, "global_step": 206538, "epoch": 1229} {"train_loss": -11.589309692382812, "global_step": 206539, "epoch": 1229} {"train_loss": -11.438544273376465, "global_step": 206540, "epoch": 1229} {"train_loss": -11.730348587036133, "global_step": 206541, "epoch": 1229} {"train_loss": -11.26807689666748, "global_step": 206542, "epoch": 1229} {"train_loss": -11.4718017578125, "global_step": 206543, "epoch": 1229} {"train_loss": -11.444330215454102, "global_step": 206544, "epoch": 1229} {"train_loss": -11.170453071594238, "global_step": 206545, "epoch": 1229} {"train_loss": -11.88589096069336, "global_step": 206546, "epoch": 1229} {"train_loss": -11.355756759643555, "global_step": 206547, "epoch": 1229} {"train_loss": -11.018516540527344, "global_step": 206548, "epoch": 1229} {"train_loss": -11.605981826782227, "global_step": 206549, "epoch": 1229} {"train_loss": -11.176356315612793, "global_step": 206550, "epoch": 1229} {"train_loss": -10.744465827941895, "global_step": 206551, "epoch": 1229} {"train_loss": -11.415050506591797, "global_step": 206552, "epoch": 1229} {"train_loss": -11.250137329101562, "global_step": 206553, "epoch": 1229} {"train_loss": -10.72021484375, "global_step": 206554, "epoch": 1229} {"train_loss": -9.618087768554688, "global_step": 206555, "epoch": 1229} {"train_loss": -11.16560173034668, "global_step": 206556, "epoch": 1229} {"train_loss": -10.894562721252441, "global_step": 206557, "epoch": 1229} {"train_loss": -10.221518516540527, "global_step": 206558, "epoch": 1229} {"train_loss": -11.631315231323242, "global_step": 206559, "epoch": 1229} {"train_loss": -10.35455322265625, "global_step": 206560, "epoch": 1229} {"train_loss": -10.892341613769531, "global_step": 206561, "epoch": 1229} {"train_loss": -11.194103240966797, "global_step": 206562, "epoch": 1229} {"train_loss": -11.160213470458984, "global_step": 206563, "epoch": 1229} {"train_loss": -11.106892585754395, "global_step": 206564, "epoch": 1229} {"train_loss": -10.986108779907227, "global_step": 206565, "epoch": 1229} {"train_loss": -11.02544116973877, "global_step": 206566, "epoch": 1229} {"train_loss": -11.0059814453125, "global_step": 206567, "epoch": 1229} {"train_loss": -11.299459457397461, "global_step": 206568, "epoch": 1229} {"train_loss": -11.288298606872559, "global_step": 206569, "epoch": 1229} {"train_loss": -11.635406494140625, "global_step": 206570, "epoch": 1229} {"train_loss": -11.333842277526855, "global_step": 206571, "epoch": 1229} {"train_loss": -11.770013809204102, "global_step": 206572, "epoch": 1229} {"train_loss": -11.353631973266602, "global_step": 206573, "epoch": 1229} {"train_loss": -11.36581802368164, "global_step": 206574, "epoch": 1229} {"train_loss": -11.016897201538086, "global_step": 206575, "epoch": 1229} {"train_loss": -11.283052444458008, "global_step": 206576, "epoch": 1229} {"train_loss": -11.272309303283691, "global_step": 206577, "epoch": 1229} {"train_loss": -10.824211120605469, "global_step": 206578, "epoch": 1229} {"train_loss": -10.95454216003418, "global_step": 206579, "epoch": 1229} {"train_loss": -11.050363540649414, "global_step": 206580, "epoch": 1229} {"train_loss": -11.166642189025879, "global_step": 206581, "epoch": 1229} {"train_loss": -11.013504981994629, "global_step": 206582, "epoch": 1229} {"train_loss": -10.856228828430176, "global_step": 206583, "epoch": 1229} {"train_loss": -11.212540626525879, "global_step": 206584, "epoch": 1229} {"train_loss": -10.346277236938477, "global_step": 206585, "epoch": 1229} {"train_loss": -11.30241584777832, "global_step": 206586, "epoch": 1229} {"train_loss": -10.641942977905273, "global_step": 206587, "epoch": 1229} {"train_loss": -11.266769409179688, "global_step": 206588, "epoch": 1229} {"train_loss": -10.674406051635742, "global_step": 206589, "epoch": 1229} {"train_loss": -10.99609661102295, "global_step": 206590, "epoch": 1229} {"train_loss": -10.905502319335938, "global_step": 206591, "epoch": 1229} {"train_loss": -10.421459197998047, "global_step": 206592, "epoch": 1229} {"train_loss": -11.030354499816895, "global_step": 206593, "epoch": 1229} {"train_loss": -10.278166770935059, "global_step": 206594, "epoch": 1229} {"train_loss": -11.253938674926758, "global_step": 206595, "epoch": 1229} {"train_loss": -10.352587699890137, "global_step": 206596, "epoch": 1229} {"train_loss": -11.042394638061523, "global_step": 206597, "epoch": 1229} {"train_loss": -10.694889068603516, "global_step": 206598, "epoch": 1229} {"train_loss": -11.121826171875, "global_step": 206599, "epoch": 1229} {"train_loss": -10.999197959899902, "global_step": 206600, "epoch": 1229} {"train_loss": -11.379803657531738, "global_step": 206601, "epoch": 1229} {"train_loss": -11.128791809082031, "global_step": 206602, "epoch": 1229} {"train_loss": -11.249419212341309, "global_step": 206603, "epoch": 1229} {"train_loss": -11.316608428955078, "global_step": 206604, "epoch": 1229} {"train_loss": -10.83120346069336, "global_step": 206605, "epoch": 1229} {"train_loss": -11.306644439697266, "global_step": 206606, "epoch": 1229} {"train_loss": -10.833364486694336, "global_step": 206607, "epoch": 1229} {"train_loss": -10.985099792480469, "global_step": 206608, "epoch": 1229} {"train_loss": -11.557159423828125, "global_step": 206609, "epoch": 1229} {"train_loss": -11.366809844970703, "global_step": 206610, "epoch": 1229} {"train_loss": -11.46310043334961, "global_step": 206611, "epoch": 1229} {"train_loss": -11.305234909057617, "global_step": 206612, "epoch": 1229} {"train_loss": -11.385305404663086, "global_step": 206613, "epoch": 1229} {"train_loss": -11.22785758972168, "global_step": 206614, "epoch": 1229} {"train_loss": -11.383614540100098, "global_step": 206615, "epoch": 1229} {"train_loss": -11.35460090637207, "global_step": 206616, "epoch": 1229} {"train_loss": -11.194070816040039, "global_step": 206617, "epoch": 1229} {"train_loss": -11.057199478149414, "global_step": 206618, "epoch": 1229} {"train_loss": -11.431828498840332, "global_step": 206619, "epoch": 1229} {"train_loss": -11.453949928283691, "global_step": 206620, "epoch": 1229} {"train_loss": -11.139212608337402, "global_step": 206621, "epoch": 1229} {"train_loss": -11.401376724243164, "global_step": 206622, "epoch": 1229} {"train_loss": -11.107681274414062, "global_step": 206623, "epoch": 1229} {"train_loss": -11.662253379821777, "global_step": 206624, "epoch": 1229} {"train_loss": -11.349679946899414, "global_step": 206625, "epoch": 1229} {"train_loss": -11.571966171264648, "global_step": 206626, "epoch": 1229} {"train_loss": -11.413015365600586, "global_step": 206627, "epoch": 1229} {"train_loss": -11.411718368530273, "global_step": 206628, "epoch": 1229} {"train_loss": -11.527048110961914, "global_step": 206629, "epoch": 1229} {"train_loss": -11.533480644226074, "global_step": 206630, "epoch": 1229} {"train_loss": -11.507795333862305, "global_step": 206631, "epoch": 1229} {"train_loss": -11.345274925231934, "global_step": 206632, "epoch": 1229} {"train_loss": -11.42111873626709, "global_step": 206633, "epoch": 1229} {"train_loss": -11.658540725708008, "global_step": 206634, "epoch": 1229} {"train_loss": -11.670530319213867, "global_step": 206635, "epoch": 1229} {"train_loss": -11.404485702514648, "global_step": 206636, "epoch": 1229} {"train_loss": -11.546557426452637, "global_step": 206637, "epoch": 1229} {"train_loss": -11.525915145874023, "global_step": 206638, "epoch": 1229} {"train_loss": -11.267788052558899, "global_step": 206639, "epoch": 1229, "val_loss": 256405.03125} {"train_loss": -11.46080207824707, "global_step": 206640, "epoch": 1230} {"train_loss": -11.565740585327148, "global_step": 206641, "epoch": 1230} {"train_loss": -11.163028717041016, "global_step": 206642, "epoch": 1230} {"train_loss": -11.71402359008789, "global_step": 206643, "epoch": 1230} {"train_loss": -11.334909439086914, "global_step": 206644, "epoch": 1230} {"train_loss": -11.463865280151367, "global_step": 206645, "epoch": 1230} {"train_loss": -11.569822311401367, "global_step": 206646, "epoch": 1230} {"train_loss": -11.100812911987305, "global_step": 206647, "epoch": 1230} {"train_loss": -11.427165031433105, "global_step": 206648, "epoch": 1230} {"train_loss": -11.27406120300293, "global_step": 206649, "epoch": 1230} {"train_loss": -11.10342025756836, "global_step": 206650, "epoch": 1230} {"train_loss": -11.270891189575195, "global_step": 206651, "epoch": 1230} {"train_loss": -11.327346801757812, "global_step": 206652, "epoch": 1230} {"train_loss": -11.037389755249023, "global_step": 206653, "epoch": 1230} {"train_loss": -11.525761604309082, "global_step": 206654, "epoch": 1230} {"train_loss": -11.347342491149902, "global_step": 206655, "epoch": 1230} {"train_loss": -11.474868774414062, "global_step": 206656, "epoch": 1230} {"train_loss": -11.296436309814453, "global_step": 206657, "epoch": 1230} {"train_loss": -11.27459716796875, "global_step": 206658, "epoch": 1230} {"train_loss": -11.548688888549805, "global_step": 206659, "epoch": 1230} {"train_loss": -11.399885177612305, "global_step": 206660, "epoch": 1230} {"train_loss": -11.616615295410156, "global_step": 206661, "epoch": 1230} {"train_loss": -11.463495254516602, "global_step": 206662, "epoch": 1230} {"train_loss": -10.990530014038086, "global_step": 206663, "epoch": 1230} {"train_loss": -11.711786270141602, "global_step": 206664, "epoch": 1230} {"train_loss": -11.073141098022461, "global_step": 206665, "epoch": 1230} {"train_loss": -11.096151351928711, "global_step": 206666, "epoch": 1230} {"train_loss": -11.566798210144043, "global_step": 206667, "epoch": 1230} {"train_loss": -11.035323143005371, "global_step": 206668, "epoch": 1230} {"train_loss": -10.936626434326172, "global_step": 206669, "epoch": 1230} {"train_loss": -11.688549041748047, "global_step": 206670, "epoch": 1230} {"train_loss": -11.00745964050293, "global_step": 206671, "epoch": 1230} {"train_loss": -11.709872245788574, "global_step": 206672, "epoch": 1230} {"train_loss": -11.097311973571777, "global_step": 206673, "epoch": 1230} {"train_loss": -11.41589641571045, "global_step": 206674, "epoch": 1230} {"train_loss": -11.386377334594727, "global_step": 206675, "epoch": 1230} {"train_loss": -11.546998977661133, "global_step": 206676, "epoch": 1230} {"train_loss": -11.057978630065918, "global_step": 206677, "epoch": 1230} {"train_loss": -11.451244354248047, "global_step": 206678, "epoch": 1230} {"train_loss": -10.633793830871582, "global_step": 206679, "epoch": 1230} {"train_loss": -11.330209732055664, "global_step": 206680, "epoch": 1230} {"train_loss": -10.877212524414062, "global_step": 206681, "epoch": 1230} {"train_loss": -11.62820816040039, "global_step": 206682, "epoch": 1230} {"train_loss": -10.326362609863281, "global_step": 206683, "epoch": 1230} {"train_loss": -11.465202331542969, "global_step": 206684, "epoch": 1230} {"train_loss": -11.425671577453613, "global_step": 206685, "epoch": 1230} {"train_loss": -11.128408432006836, "global_step": 206686, "epoch": 1230} {"train_loss": -11.3197603225708, "global_step": 206687, "epoch": 1230} {"train_loss": -10.790159225463867, "global_step": 206688, "epoch": 1230} {"train_loss": -11.241242408752441, "global_step": 206689, "epoch": 1230} {"train_loss": -10.87977409362793, "global_step": 206690, "epoch": 1230} {"train_loss": -11.301435470581055, "global_step": 206691, "epoch": 1230} {"train_loss": -10.804224014282227, "global_step": 206692, "epoch": 1230} {"train_loss": -10.554197311401367, "global_step": 206693, "epoch": 1230} {"train_loss": -11.205795288085938, "global_step": 206694, "epoch": 1230} {"train_loss": -11.111255645751953, "global_step": 206695, "epoch": 1230} {"train_loss": -10.705002784729004, "global_step": 206696, "epoch": 1230} {"train_loss": -11.326570510864258, "global_step": 206697, "epoch": 1230} {"train_loss": -10.78481388092041, "global_step": 206698, "epoch": 1230} {"train_loss": -10.995811462402344, "global_step": 206699, "epoch": 1230} {"train_loss": -11.100008010864258, "global_step": 206700, "epoch": 1230} {"train_loss": -10.287406921386719, "global_step": 206701, "epoch": 1230} {"train_loss": -11.371053695678711, "global_step": 206702, "epoch": 1230} {"train_loss": -10.625535011291504, "global_step": 206703, "epoch": 1230} {"train_loss": -10.99693489074707, "global_step": 206704, "epoch": 1230} {"train_loss": -10.884891510009766, "global_step": 206705, "epoch": 1230} {"train_loss": -10.474424362182617, "global_step": 206706, "epoch": 1230} {"train_loss": -11.490381240844727, "global_step": 206707, "epoch": 1230} {"train_loss": -10.887452125549316, "global_step": 206708, "epoch": 1230} {"train_loss": -11.239282608032227, "global_step": 206709, "epoch": 1230} {"train_loss": -10.997360229492188, "global_step": 206710, "epoch": 1230} {"train_loss": -11.32504653930664, "global_step": 206711, "epoch": 1230} {"train_loss": -10.776071548461914, "global_step": 206712, "epoch": 1230} {"train_loss": -11.545079231262207, "global_step": 206713, "epoch": 1230} {"train_loss": -11.131739616394043, "global_step": 206714, "epoch": 1230} {"train_loss": -11.262158393859863, "global_step": 206715, "epoch": 1230} {"train_loss": -11.322386741638184, "global_step": 206716, "epoch": 1230} {"train_loss": -11.304861068725586, "global_step": 206717, "epoch": 1230} {"train_loss": -11.369863510131836, "global_step": 206718, "epoch": 1230} {"train_loss": -11.215219497680664, "global_step": 206719, "epoch": 1230} {"train_loss": -11.500452995300293, "global_step": 206720, "epoch": 1230} {"train_loss": -11.289669036865234, "global_step": 206721, "epoch": 1230} {"train_loss": -11.142000198364258, "global_step": 206722, "epoch": 1230} {"train_loss": -11.40899658203125, "global_step": 206723, "epoch": 1230} {"train_loss": -11.095614433288574, "global_step": 206724, "epoch": 1230} {"train_loss": -11.446187973022461, "global_step": 206725, "epoch": 1230} {"train_loss": -11.48016357421875, "global_step": 206726, "epoch": 1230} {"train_loss": -11.478078842163086, "global_step": 206727, "epoch": 1230} {"train_loss": -11.341564178466797, "global_step": 206728, "epoch": 1230} {"train_loss": -11.300969123840332, "global_step": 206729, "epoch": 1230} {"train_loss": -11.463643074035645, "global_step": 206730, "epoch": 1230} {"train_loss": -11.184036254882812, "global_step": 206731, "epoch": 1230} {"train_loss": -11.316590309143066, "global_step": 206732, "epoch": 1230} {"train_loss": -11.246214866638184, "global_step": 206733, "epoch": 1230} {"train_loss": -11.24151611328125, "global_step": 206734, "epoch": 1230} {"train_loss": -11.373336791992188, "global_step": 206735, "epoch": 1230} {"train_loss": -11.629449844360352, "global_step": 206736, "epoch": 1230} {"train_loss": -11.360054016113281, "global_step": 206737, "epoch": 1230} {"train_loss": -11.604331970214844, "global_step": 206738, "epoch": 1230} {"train_loss": -11.45478630065918, "global_step": 206739, "epoch": 1230} {"train_loss": -11.5789155960083, "global_step": 206740, "epoch": 1230} {"train_loss": -11.452316284179688, "global_step": 206741, "epoch": 1230} {"train_loss": -11.340278625488281, "global_step": 206742, "epoch": 1230} {"train_loss": -11.597970962524414, "global_step": 206743, "epoch": 1230} {"train_loss": -11.136215209960938, "global_step": 206744, "epoch": 1230} {"train_loss": -11.267751693725586, "global_step": 206745, "epoch": 1230} {"train_loss": -11.199674606323242, "global_step": 206746, "epoch": 1230} {"train_loss": -11.45658016204834, "global_step": 206747, "epoch": 1230} {"train_loss": -11.193358421325684, "global_step": 206748, "epoch": 1230} {"train_loss": -11.511641502380371, "global_step": 206749, "epoch": 1230} {"train_loss": -11.015125274658203, "global_step": 206750, "epoch": 1230} {"train_loss": -11.491040229797363, "global_step": 206751, "epoch": 1230} {"train_loss": -11.302057266235352, "global_step": 206752, "epoch": 1230} {"train_loss": -11.439292907714844, "global_step": 206753, "epoch": 1230} {"train_loss": -11.340421676635742, "global_step": 206754, "epoch": 1230} {"train_loss": -11.507486343383789, "global_step": 206755, "epoch": 1230} {"train_loss": -11.33413314819336, "global_step": 206756, "epoch": 1230} {"train_loss": -11.147339820861816, "global_step": 206757, "epoch": 1230} {"train_loss": -11.525060653686523, "global_step": 206758, "epoch": 1230} {"train_loss": -11.283620834350586, "global_step": 206759, "epoch": 1230} {"train_loss": -11.471527099609375, "global_step": 206760, "epoch": 1230} {"train_loss": -10.899188995361328, "global_step": 206761, "epoch": 1230} {"train_loss": -11.478511810302734, "global_step": 206762, "epoch": 1230} {"train_loss": -11.052289962768555, "global_step": 206763, "epoch": 1230} {"train_loss": -10.772064208984375, "global_step": 206764, "epoch": 1230} {"train_loss": -11.589138984680176, "global_step": 206765, "epoch": 1230} {"train_loss": -10.611466407775879, "global_step": 206766, "epoch": 1230} {"train_loss": -11.398090362548828, "global_step": 206767, "epoch": 1230} {"train_loss": -11.10366153717041, "global_step": 206768, "epoch": 1230} {"train_loss": -11.351814270019531, "global_step": 206769, "epoch": 1230} {"train_loss": -11.105009078979492, "global_step": 206770, "epoch": 1230} {"train_loss": -11.432902336120605, "global_step": 206771, "epoch": 1230} {"train_loss": -11.329643249511719, "global_step": 206772, "epoch": 1230} {"train_loss": -11.126022338867188, "global_step": 206773, "epoch": 1230} {"train_loss": -11.547521591186523, "global_step": 206774, "epoch": 1230} {"train_loss": -11.151308059692383, "global_step": 206775, "epoch": 1230} {"train_loss": -11.547950744628906, "global_step": 206776, "epoch": 1230} {"train_loss": -11.144827842712402, "global_step": 206777, "epoch": 1230} {"train_loss": -10.993331909179688, "global_step": 206778, "epoch": 1230} {"train_loss": -11.339179992675781, "global_step": 206779, "epoch": 1230} {"train_loss": -10.999942779541016, "global_step": 206780, "epoch": 1230} {"train_loss": -11.457578659057617, "global_step": 206781, "epoch": 1230} {"train_loss": -11.807886123657227, "global_step": 206782, "epoch": 1230} {"train_loss": -11.50723648071289, "global_step": 206783, "epoch": 1230} {"train_loss": -11.695463180541992, "global_step": 206784, "epoch": 1230} {"train_loss": -11.447227478027344, "global_step": 206785, "epoch": 1230} {"train_loss": -11.627832412719727, "global_step": 206786, "epoch": 1230} {"train_loss": -11.941713333129883, "global_step": 206787, "epoch": 1230} {"train_loss": -11.403532981872559, "global_step": 206788, "epoch": 1230} {"train_loss": -11.69564151763916, "global_step": 206789, "epoch": 1230} {"train_loss": -11.643583297729492, "global_step": 206790, "epoch": 1230} {"train_loss": -11.88278865814209, "global_step": 206791, "epoch": 1230} {"train_loss": -11.246908187866211, "global_step": 206792, "epoch": 1230} {"train_loss": -11.630257606506348, "global_step": 206793, "epoch": 1230} {"train_loss": -11.376440048217773, "global_step": 206794, "epoch": 1230} {"train_loss": -11.711179733276367, "global_step": 206795, "epoch": 1230} {"train_loss": -11.521507263183594, "global_step": 206796, "epoch": 1230} {"train_loss": -11.728448867797852, "global_step": 206797, "epoch": 1230} {"train_loss": -11.57832145690918, "global_step": 206798, "epoch": 1230} {"train_loss": -11.418352127075195, "global_step": 206799, "epoch": 1230} {"train_loss": -11.392194747924805, "global_step": 206800, "epoch": 1230} {"train_loss": -11.7985258102417, "global_step": 206801, "epoch": 1230} {"train_loss": -11.189708709716797, "global_step": 206802, "epoch": 1230} {"train_loss": -11.519501686096191, "global_step": 206803, "epoch": 1230} {"train_loss": -11.751668930053711, "global_step": 206804, "epoch": 1230} {"train_loss": -11.715550422668457, "global_step": 206805, "epoch": 1230} {"train_loss": -11.255189895629883, "global_step": 206806, "epoch": 1230} {"train_loss": -11.30118829863412, "global_step": 206807, "epoch": 1230, "val_loss": 256692.328125, "train_action_mse_error": 1.5615283250808716} {"train_loss": -11.448461532592773, "global_step": 206808, "epoch": 1231} {"train_loss": -11.080328941345215, "global_step": 206809, "epoch": 1231} {"train_loss": -11.676094055175781, "global_step": 206810, "epoch": 1231} {"train_loss": -11.414956092834473, "global_step": 206811, "epoch": 1231} {"train_loss": -11.193769454956055, "global_step": 206812, "epoch": 1231} {"train_loss": -11.559415817260742, "global_step": 206813, "epoch": 1231} {"train_loss": -11.387998580932617, "global_step": 206814, "epoch": 1231} {"train_loss": -11.2852201461792, "global_step": 206815, "epoch": 1231} {"train_loss": -11.665419578552246, "global_step": 206816, "epoch": 1231} {"train_loss": -11.751840591430664, "global_step": 206817, "epoch": 1231} {"train_loss": -11.538148880004883, "global_step": 206818, "epoch": 1231} {"train_loss": -11.239505767822266, "global_step": 206819, "epoch": 1231} {"train_loss": -10.97206974029541, "global_step": 206820, "epoch": 1231} {"train_loss": -11.724903106689453, "global_step": 206821, "epoch": 1231} {"train_loss": -11.281051635742188, "global_step": 206822, "epoch": 1231} {"train_loss": -11.549298286437988, "global_step": 206823, "epoch": 1231} {"train_loss": -11.505186080932617, "global_step": 206824, "epoch": 1231} {"train_loss": -11.476042747497559, "global_step": 206825, "epoch": 1231} {"train_loss": -11.55725383758545, "global_step": 206826, "epoch": 1231} {"train_loss": -11.296393394470215, "global_step": 206827, "epoch": 1231} {"train_loss": -11.422772407531738, "global_step": 206828, "epoch": 1231} {"train_loss": -11.351739883422852, "global_step": 206829, "epoch": 1231} {"train_loss": -11.49754524230957, "global_step": 206830, "epoch": 1231} {"train_loss": -11.375505447387695, "global_step": 206831, "epoch": 1231} {"train_loss": -11.545114517211914, "global_step": 206832, "epoch": 1231} {"train_loss": -11.459589004516602, "global_step": 206833, "epoch": 1231} {"train_loss": -11.67579460144043, "global_step": 206834, "epoch": 1231} {"train_loss": -11.620185852050781, "global_step": 206835, "epoch": 1231} {"train_loss": -11.323457717895508, "global_step": 206836, "epoch": 1231} {"train_loss": -11.08157730102539, "global_step": 206837, "epoch": 1231} {"train_loss": -11.463302612304688, "global_step": 206838, "epoch": 1231} {"train_loss": -11.312555313110352, "global_step": 206839, "epoch": 1231} {"train_loss": -11.386006355285645, "global_step": 206840, "epoch": 1231} {"train_loss": -11.345148086547852, "global_step": 206841, "epoch": 1231} {"train_loss": -11.714593887329102, "global_step": 206842, "epoch": 1231} {"train_loss": -11.455827713012695, "global_step": 206843, "epoch": 1231} {"train_loss": -10.92203140258789, "global_step": 206844, "epoch": 1231} {"train_loss": -11.667994499206543, "global_step": 206845, "epoch": 1231} {"train_loss": -10.867837905883789, "global_step": 206846, "epoch": 1231} {"train_loss": -10.995081901550293, "global_step": 206847, "epoch": 1231} {"train_loss": -11.584161758422852, "global_step": 206848, "epoch": 1231} {"train_loss": -11.10770034790039, "global_step": 206849, "epoch": 1231} {"train_loss": -11.258792877197266, "global_step": 206850, "epoch": 1231} {"train_loss": -11.53484058380127, "global_step": 206851, "epoch": 1231} {"train_loss": -11.030786514282227, "global_step": 206852, "epoch": 1231} {"train_loss": -11.560558319091797, "global_step": 206853, "epoch": 1231} {"train_loss": -11.416265487670898, "global_step": 206854, "epoch": 1231} {"train_loss": -11.136040687561035, "global_step": 206855, "epoch": 1231} {"train_loss": -11.518885612487793, "global_step": 206856, "epoch": 1231} {"train_loss": -11.376636505126953, "global_step": 206857, "epoch": 1231} {"train_loss": -11.408418655395508, "global_step": 206858, "epoch": 1231} {"train_loss": -11.243965148925781, "global_step": 206859, "epoch": 1231} {"train_loss": -11.565997123718262, "global_step": 206860, "epoch": 1231} {"train_loss": -11.292928695678711, "global_step": 206861, "epoch": 1231} {"train_loss": -11.250009536743164, "global_step": 206862, "epoch": 1231} {"train_loss": -11.422138214111328, "global_step": 206863, "epoch": 1231} {"train_loss": -11.229806900024414, "global_step": 206864, "epoch": 1231} {"train_loss": -11.322103500366211, "global_step": 206865, "epoch": 1231} {"train_loss": -11.31036376953125, "global_step": 206866, "epoch": 1231} {"train_loss": -10.852072715759277, "global_step": 206867, "epoch": 1231} {"train_loss": -11.489261627197266, "global_step": 206868, "epoch": 1231} {"train_loss": -10.413492202758789, "global_step": 206869, "epoch": 1231} {"train_loss": -11.346426010131836, "global_step": 206870, "epoch": 1231} {"train_loss": -10.85745620727539, "global_step": 206871, "epoch": 1231} {"train_loss": -10.485816955566406, "global_step": 206872, "epoch": 1231} {"train_loss": -11.512075424194336, "global_step": 206873, "epoch": 1231} {"train_loss": -10.846687316894531, "global_step": 206874, "epoch": 1231} {"train_loss": -11.168160438537598, "global_step": 206875, "epoch": 1231} {"train_loss": -10.175127029418945, "global_step": 206876, "epoch": 1231} {"train_loss": -10.59840202331543, "global_step": 206877, "epoch": 1231} {"train_loss": -10.957080841064453, "global_step": 206878, "epoch": 1231} {"train_loss": -10.84576416015625, "global_step": 206879, "epoch": 1231} {"train_loss": -11.076549530029297, "global_step": 206880, "epoch": 1231} {"train_loss": -10.677743911743164, "global_step": 206881, "epoch": 1231} {"train_loss": -11.45192813873291, "global_step": 206882, "epoch": 1231} {"train_loss": -10.568431854248047, "global_step": 206883, "epoch": 1231} {"train_loss": -11.418745994567871, "global_step": 206884, "epoch": 1231} {"train_loss": -10.967195510864258, "global_step": 206885, "epoch": 1231} {"train_loss": -11.511372566223145, "global_step": 206886, "epoch": 1231} {"train_loss": -11.408735275268555, "global_step": 206887, "epoch": 1231} {"train_loss": -11.181314468383789, "global_step": 206888, "epoch": 1231} {"train_loss": -11.287588119506836, "global_step": 206889, "epoch": 1231} {"train_loss": -11.188901901245117, "global_step": 206890, "epoch": 1231} {"train_loss": -11.315607070922852, "global_step": 206891, "epoch": 1231} {"train_loss": -11.337631225585938, "global_step": 206892, "epoch": 1231} {"train_loss": -11.386007308959961, "global_step": 206893, "epoch": 1231} {"train_loss": -11.319812774658203, "global_step": 206894, "epoch": 1231} {"train_loss": -11.436822891235352, "global_step": 206895, "epoch": 1231} {"train_loss": -11.688596725463867, "global_step": 206896, "epoch": 1231} {"train_loss": -11.18050765991211, "global_step": 206897, "epoch": 1231} {"train_loss": -11.515619277954102, "global_step": 206898, "epoch": 1231} {"train_loss": -11.38204574584961, "global_step": 206899, "epoch": 1231} {"train_loss": -11.274821281433105, "global_step": 206900, "epoch": 1231} {"train_loss": -11.642833709716797, "global_step": 206901, "epoch": 1231} {"train_loss": -11.261543273925781, "global_step": 206902, "epoch": 1231} {"train_loss": -11.670717239379883, "global_step": 206903, "epoch": 1231} {"train_loss": -11.275162696838379, "global_step": 206904, "epoch": 1231} {"train_loss": -11.444509506225586, "global_step": 206905, "epoch": 1231} {"train_loss": -11.511493682861328, "global_step": 206906, "epoch": 1231} {"train_loss": -11.529374122619629, "global_step": 206907, "epoch": 1231} {"train_loss": -11.578042984008789, "global_step": 206908, "epoch": 1231} {"train_loss": -11.334766387939453, "global_step": 206909, "epoch": 1231} {"train_loss": -11.601484298706055, "global_step": 206910, "epoch": 1231} {"train_loss": -11.215766906738281, "global_step": 206911, "epoch": 1231} {"train_loss": -11.410589218139648, "global_step": 206912, "epoch": 1231} {"train_loss": -11.74505615234375, "global_step": 206913, "epoch": 1231} {"train_loss": -11.49256706237793, "global_step": 206914, "epoch": 1231} {"train_loss": -11.474641799926758, "global_step": 206915, "epoch": 1231} {"train_loss": -11.48607063293457, "global_step": 206916, "epoch": 1231} {"train_loss": -11.467626571655273, "global_step": 206917, "epoch": 1231} {"train_loss": -11.469828605651855, "global_step": 206918, "epoch": 1231} {"train_loss": -11.324562072753906, "global_step": 206919, "epoch": 1231} {"train_loss": -11.544149398803711, "global_step": 206920, "epoch": 1231} {"train_loss": -11.2517671585083, "global_step": 206921, "epoch": 1231} {"train_loss": -11.196301460266113, "global_step": 206922, "epoch": 1231} {"train_loss": -11.404556274414062, "global_step": 206923, "epoch": 1231} {"train_loss": -11.513524055480957, "global_step": 206924, "epoch": 1231} {"train_loss": -11.551815032958984, "global_step": 206925, "epoch": 1231} {"train_loss": -11.635909080505371, "global_step": 206926, "epoch": 1231} {"train_loss": -11.605344772338867, "global_step": 206927, "epoch": 1231} {"train_loss": -11.688493728637695, "global_step": 206928, "epoch": 1231} {"train_loss": -11.649751663208008, "global_step": 206929, "epoch": 1231} {"train_loss": -11.343128204345703, "global_step": 206930, "epoch": 1231} {"train_loss": -11.6434965133667, "global_step": 206931, "epoch": 1231} {"train_loss": -11.57499885559082, "global_step": 206932, "epoch": 1231} {"train_loss": -11.701078414916992, "global_step": 206933, "epoch": 1231} {"train_loss": -11.537004470825195, "global_step": 206934, "epoch": 1231} {"train_loss": -11.54556655883789, "global_step": 206935, "epoch": 1231} {"train_loss": -11.504886627197266, "global_step": 206936, "epoch": 1231} {"train_loss": -11.577877044677734, "global_step": 206937, "epoch": 1231} {"train_loss": -11.218025207519531, "global_step": 206938, "epoch": 1231} {"train_loss": -11.55746078491211, "global_step": 206939, "epoch": 1231} {"train_loss": -11.12074089050293, "global_step": 206940, "epoch": 1231} {"train_loss": -10.249761581420898, "global_step": 206941, "epoch": 1231} {"train_loss": -10.909910202026367, "global_step": 206942, "epoch": 1231} {"train_loss": -11.492011070251465, "global_step": 206943, "epoch": 1231} {"train_loss": -11.137223243713379, "global_step": 206944, "epoch": 1231} {"train_loss": -11.412476539611816, "global_step": 206945, "epoch": 1231} {"train_loss": -11.671682357788086, "global_step": 206946, "epoch": 1231} {"train_loss": -11.528002738952637, "global_step": 206947, "epoch": 1231} {"train_loss": -11.79364013671875, "global_step": 206948, "epoch": 1231} {"train_loss": -11.468038558959961, "global_step": 206949, "epoch": 1231} {"train_loss": -11.780437469482422, "global_step": 206950, "epoch": 1231} {"train_loss": -11.646827697753906, "global_step": 206951, "epoch": 1231} {"train_loss": -11.727425575256348, "global_step": 206952, "epoch": 1231} {"train_loss": -11.441699028015137, "global_step": 206953, "epoch": 1231} {"train_loss": -11.451337814331055, "global_step": 206954, "epoch": 1231} {"train_loss": -11.640012741088867, "global_step": 206955, "epoch": 1231} {"train_loss": -11.545591354370117, "global_step": 206956, "epoch": 1231} {"train_loss": -11.453802108764648, "global_step": 206957, "epoch": 1231} {"train_loss": -11.390867233276367, "global_step": 206958, "epoch": 1231} {"train_loss": -11.646267890930176, "global_step": 206959, "epoch": 1231} {"train_loss": -11.365945816040039, "global_step": 206960, "epoch": 1231} {"train_loss": -11.344694137573242, "global_step": 206961, "epoch": 1231} {"train_loss": -11.762524604797363, "global_step": 206962, "epoch": 1231} {"train_loss": -11.437173843383789, "global_step": 206963, "epoch": 1231} {"train_loss": -11.319046974182129, "global_step": 206964, "epoch": 1231} {"train_loss": -11.50430965423584, "global_step": 206965, "epoch": 1231} {"train_loss": -11.668517112731934, "global_step": 206966, "epoch": 1231} {"train_loss": -11.018218994140625, "global_step": 206967, "epoch": 1231} {"train_loss": -11.585521697998047, "global_step": 206968, "epoch": 1231} {"train_loss": -11.306741714477539, "global_step": 206969, "epoch": 1231} {"train_loss": -11.110217094421387, "global_step": 206970, "epoch": 1231} {"train_loss": -11.104036331176758, "global_step": 206971, "epoch": 1231} {"train_loss": -10.445657730102539, "global_step": 206972, "epoch": 1231} {"train_loss": -11.338916778564453, "global_step": 206973, "epoch": 1231} {"train_loss": -10.798830032348633, "global_step": 206974, "epoch": 1231} {"train_loss": -11.345956064405895, "global_step": 206975, "epoch": 1231, "val_loss": 255752.984375} {"train_loss": -10.666128158569336, "global_step": 206976, "epoch": 1232} {"train_loss": -11.482256889343262, "global_step": 206977, "epoch": 1232} {"train_loss": -10.420255661010742, "global_step": 206978, "epoch": 1232} {"train_loss": -11.27497673034668, "global_step": 206979, "epoch": 1232} {"train_loss": -10.602813720703125, "global_step": 206980, "epoch": 1232} {"train_loss": -11.079507827758789, "global_step": 206981, "epoch": 1232} {"train_loss": -10.628870010375977, "global_step": 206982, "epoch": 1232} {"train_loss": -10.904440879821777, "global_step": 206983, "epoch": 1232} {"train_loss": -10.96534538269043, "global_step": 206984, "epoch": 1232} {"train_loss": -10.465377807617188, "global_step": 206985, "epoch": 1232} {"train_loss": -11.412407875061035, "global_step": 206986, "epoch": 1232} {"train_loss": -10.049352645874023, "global_step": 206987, "epoch": 1232} {"train_loss": -11.01307487487793, "global_step": 206988, "epoch": 1232} {"train_loss": -11.256429672241211, "global_step": 206989, "epoch": 1232} {"train_loss": -10.745201110839844, "global_step": 206990, "epoch": 1232} {"train_loss": -11.242903709411621, "global_step": 206991, "epoch": 1232} {"train_loss": -11.2222261428833, "global_step": 206992, "epoch": 1232} {"train_loss": -10.447717666625977, "global_step": 206993, "epoch": 1232} {"train_loss": -11.33237361907959, "global_step": 206994, "epoch": 1232} {"train_loss": -10.820995330810547, "global_step": 206995, "epoch": 1232} {"train_loss": -11.081523895263672, "global_step": 206996, "epoch": 1232} {"train_loss": -11.192167282104492, "global_step": 206997, "epoch": 1232} {"train_loss": -10.99439811706543, "global_step": 206998, "epoch": 1232} {"train_loss": -11.016496658325195, "global_step": 206999, "epoch": 1232} {"train_loss": -11.377126693725586, "global_step": 207000, "epoch": 1232} {"train_loss": -11.117502212524414, "global_step": 207001, "epoch": 1232} {"train_loss": -11.291640281677246, "global_step": 207002, "epoch": 1232} {"train_loss": -11.180624961853027, "global_step": 207003, "epoch": 1232} {"train_loss": -11.095268249511719, "global_step": 207004, "epoch": 1232} {"train_loss": -11.276444435119629, "global_step": 207005, "epoch": 1232} {"train_loss": -11.312511444091797, "global_step": 207006, "epoch": 1232} {"train_loss": -11.064813613891602, "global_step": 207007, "epoch": 1232} {"train_loss": -11.383906364440918, "global_step": 207008, "epoch": 1232} {"train_loss": -11.173023223876953, "global_step": 207009, "epoch": 1232} {"train_loss": -11.212740898132324, "global_step": 207010, "epoch": 1232} {"train_loss": -11.451644897460938, "global_step": 207011, "epoch": 1232} {"train_loss": -11.363856315612793, "global_step": 207012, "epoch": 1232} {"train_loss": -11.542160034179688, "global_step": 207013, "epoch": 1232} {"train_loss": -11.322606086730957, "global_step": 207014, "epoch": 1232} {"train_loss": -11.13882827758789, "global_step": 207015, "epoch": 1232} {"train_loss": -11.30252456665039, "global_step": 207016, "epoch": 1232} {"train_loss": -11.480464935302734, "global_step": 207017, "epoch": 1232} {"train_loss": -11.11326789855957, "global_step": 207018, "epoch": 1232} {"train_loss": -11.396317481994629, "global_step": 207019, "epoch": 1232} {"train_loss": -11.484817504882812, "global_step": 207020, "epoch": 1232} {"train_loss": -11.567473411560059, "global_step": 207021, "epoch": 1232} {"train_loss": -11.171297073364258, "global_step": 207022, "epoch": 1232} {"train_loss": -11.440642356872559, "global_step": 207023, "epoch": 1232} {"train_loss": -11.096723556518555, "global_step": 207024, "epoch": 1232} {"train_loss": -11.651750564575195, "global_step": 207025, "epoch": 1232} {"train_loss": -11.11768627166748, "global_step": 207026, "epoch": 1232} {"train_loss": -11.591176986694336, "global_step": 207027, "epoch": 1232} {"train_loss": -11.524272918701172, "global_step": 207028, "epoch": 1232} {"train_loss": -11.331578254699707, "global_step": 207029, "epoch": 1232} {"train_loss": -11.758295059204102, "global_step": 207030, "epoch": 1232} {"train_loss": -11.436805725097656, "global_step": 207031, "epoch": 1232} {"train_loss": -11.734296798706055, "global_step": 207032, "epoch": 1232} {"train_loss": -11.738077163696289, "global_step": 207033, "epoch": 1232} {"train_loss": -11.630279541015625, "global_step": 207034, "epoch": 1232} {"train_loss": -11.475411415100098, "global_step": 207035, "epoch": 1232} {"train_loss": -11.665885925292969, "global_step": 207036, "epoch": 1232} {"train_loss": -11.710269927978516, "global_step": 207037, "epoch": 1232} {"train_loss": -11.320564270019531, "global_step": 207038, "epoch": 1232} {"train_loss": -11.749907493591309, "global_step": 207039, "epoch": 1232} {"train_loss": -11.333727836608887, "global_step": 207040, "epoch": 1232} {"train_loss": -11.360612869262695, "global_step": 207041, "epoch": 1232} {"train_loss": -11.475865364074707, "global_step": 207042, "epoch": 1232} {"train_loss": -11.785365104675293, "global_step": 207043, "epoch": 1232} {"train_loss": -11.526488304138184, "global_step": 207044, "epoch": 1232} {"train_loss": -11.420411109924316, "global_step": 207045, "epoch": 1232} {"train_loss": -11.413719177246094, "global_step": 207046, "epoch": 1232} {"train_loss": -11.367786407470703, "global_step": 207047, "epoch": 1232} {"train_loss": -11.587502479553223, "global_step": 207048, "epoch": 1232} {"train_loss": -11.228466033935547, "global_step": 207049, "epoch": 1232} {"train_loss": -11.219210624694824, "global_step": 207050, "epoch": 1232} {"train_loss": -11.866326332092285, "global_step": 207051, "epoch": 1232} {"train_loss": -11.31591510772705, "global_step": 207052, "epoch": 1232} {"train_loss": -11.48788833618164, "global_step": 207053, "epoch": 1232} {"train_loss": -11.187138557434082, "global_step": 207054, "epoch": 1232} {"train_loss": -11.199140548706055, "global_step": 207055, "epoch": 1232} {"train_loss": -11.51280403137207, "global_step": 207056, "epoch": 1232} {"train_loss": -11.078591346740723, "global_step": 207057, "epoch": 1232} {"train_loss": -11.030782699584961, "global_step": 207058, "epoch": 1232} {"train_loss": -11.269408226013184, "global_step": 207059, "epoch": 1232} {"train_loss": -11.558782577514648, "global_step": 207060, "epoch": 1232} {"train_loss": -11.536005020141602, "global_step": 207061, "epoch": 1232} {"train_loss": -10.864662170410156, "global_step": 207062, "epoch": 1232} {"train_loss": -10.950125694274902, "global_step": 207063, "epoch": 1232} {"train_loss": -11.697517395019531, "global_step": 207064, "epoch": 1232} {"train_loss": -11.042600631713867, "global_step": 207065, "epoch": 1232} {"train_loss": -10.82004165649414, "global_step": 207066, "epoch": 1232} {"train_loss": -11.368316650390625, "global_step": 207067, "epoch": 1232} {"train_loss": -11.619604110717773, "global_step": 207068, "epoch": 1232} {"train_loss": -11.553108215332031, "global_step": 207069, "epoch": 1232} {"train_loss": -11.437139511108398, "global_step": 207070, "epoch": 1232} {"train_loss": -11.569260597229004, "global_step": 207071, "epoch": 1232} {"train_loss": -11.576818466186523, "global_step": 207072, "epoch": 1232} {"train_loss": -11.145453453063965, "global_step": 207073, "epoch": 1232} {"train_loss": -11.35700798034668, "global_step": 207074, "epoch": 1232} {"train_loss": -11.466407775878906, "global_step": 207075, "epoch": 1232} {"train_loss": -10.981461524963379, "global_step": 207076, "epoch": 1232} {"train_loss": -10.648921966552734, "global_step": 207077, "epoch": 1232} {"train_loss": -10.828807830810547, "global_step": 207078, "epoch": 1232} {"train_loss": -10.64843463897705, "global_step": 207079, "epoch": 1232} {"train_loss": -10.725893020629883, "global_step": 207080, "epoch": 1232} {"train_loss": -11.121722221374512, "global_step": 207081, "epoch": 1232} {"train_loss": -10.433330535888672, "global_step": 207082, "epoch": 1232} {"train_loss": -11.530803680419922, "global_step": 207083, "epoch": 1232} {"train_loss": -10.179990768432617, "global_step": 207084, "epoch": 1232} {"train_loss": -11.226773262023926, "global_step": 207085, "epoch": 1232} {"train_loss": -10.440009117126465, "global_step": 207086, "epoch": 1232} {"train_loss": -10.86825180053711, "global_step": 207087, "epoch": 1232} {"train_loss": -11.013461112976074, "global_step": 207088, "epoch": 1232} {"train_loss": -10.956745147705078, "global_step": 207089, "epoch": 1232} {"train_loss": -10.789061546325684, "global_step": 207090, "epoch": 1232} {"train_loss": -11.09144115447998, "global_step": 207091, "epoch": 1232} {"train_loss": -11.051637649536133, "global_step": 207092, "epoch": 1232} {"train_loss": -10.901305198669434, "global_step": 207093, "epoch": 1232} {"train_loss": -10.903142929077148, "global_step": 207094, "epoch": 1232} {"train_loss": -10.382128715515137, "global_step": 207095, "epoch": 1232} {"train_loss": -11.170573234558105, "global_step": 207096, "epoch": 1232} {"train_loss": -10.559410095214844, "global_step": 207097, "epoch": 1232} {"train_loss": -10.968120574951172, "global_step": 207098, "epoch": 1232} {"train_loss": -11.23037338256836, "global_step": 207099, "epoch": 1232} {"train_loss": -10.93016529083252, "global_step": 207100, "epoch": 1232} {"train_loss": -11.351630210876465, "global_step": 207101, "epoch": 1232} {"train_loss": -11.402596473693848, "global_step": 207102, "epoch": 1232} {"train_loss": -11.068105697631836, "global_step": 207103, "epoch": 1232} {"train_loss": -11.233724594116211, "global_step": 207104, "epoch": 1232} {"train_loss": -11.574779510498047, "global_step": 207105, "epoch": 1232} {"train_loss": -11.317911148071289, "global_step": 207106, "epoch": 1232} {"train_loss": -11.540129661560059, "global_step": 207107, "epoch": 1232} {"train_loss": -11.532808303833008, "global_step": 207108, "epoch": 1232} {"train_loss": -11.296127319335938, "global_step": 207109, "epoch": 1232} {"train_loss": -11.561605453491211, "global_step": 207110, "epoch": 1232} {"train_loss": -11.525592803955078, "global_step": 207111, "epoch": 1232} {"train_loss": -11.724372863769531, "global_step": 207112, "epoch": 1232} {"train_loss": -11.395572662353516, "global_step": 207113, "epoch": 1232} {"train_loss": -11.770036697387695, "global_step": 207114, "epoch": 1232} {"train_loss": -11.521421432495117, "global_step": 207115, "epoch": 1232} {"train_loss": -11.346046447753906, "global_step": 207116, "epoch": 1232} {"train_loss": -11.640425682067871, "global_step": 207117, "epoch": 1232} {"train_loss": -11.624061584472656, "global_step": 207118, "epoch": 1232} {"train_loss": -11.610849380493164, "global_step": 207119, "epoch": 1232} {"train_loss": -11.534123420715332, "global_step": 207120, "epoch": 1232} {"train_loss": -11.644155502319336, "global_step": 207121, "epoch": 1232} {"train_loss": -11.644371032714844, "global_step": 207122, "epoch": 1232} {"train_loss": -11.619382858276367, "global_step": 207123, "epoch": 1232} {"train_loss": -11.470285415649414, "global_step": 207124, "epoch": 1232} {"train_loss": -11.74767017364502, "global_step": 207125, "epoch": 1232} {"train_loss": -11.388339042663574, "global_step": 207126, "epoch": 1232} {"train_loss": -11.659395217895508, "global_step": 207127, "epoch": 1232} {"train_loss": -11.707305908203125, "global_step": 207128, "epoch": 1232} {"train_loss": -11.880714416503906, "global_step": 207129, "epoch": 1232} {"train_loss": -11.76309871673584, "global_step": 207130, "epoch": 1232} {"train_loss": -11.854022979736328, "global_step": 207131, "epoch": 1232} {"train_loss": -11.916104316711426, "global_step": 207132, "epoch": 1232} {"train_loss": -11.69455337524414, "global_step": 207133, "epoch": 1232} {"train_loss": -11.745462417602539, "global_step": 207134, "epoch": 1232} {"train_loss": -11.85219669342041, "global_step": 207135, "epoch": 1232} {"train_loss": -11.85080623626709, "global_step": 207136, "epoch": 1232} {"train_loss": -11.827144622802734, "global_step": 207137, "epoch": 1232} {"train_loss": -11.759024620056152, "global_step": 207138, "epoch": 1232} {"train_loss": -11.868867874145508, "global_step": 207139, "epoch": 1232} {"train_loss": -11.530803680419922, "global_step": 207140, "epoch": 1232} {"train_loss": -11.808605194091797, "global_step": 207141, "epoch": 1232} {"train_loss": -11.674285888671875, "global_step": 207142, "epoch": 1232} {"train_loss": -11.298473051616124, "global_step": 207143, "epoch": 1232, "val_loss": 253691.484375} {"train_loss": -11.571151733398438, "global_step": 207144, "epoch": 1233} {"train_loss": -11.710569381713867, "global_step": 207145, "epoch": 1233} {"train_loss": -11.617182731628418, "global_step": 207146, "epoch": 1233} {"train_loss": -11.860407829284668, "global_step": 207147, "epoch": 1233} {"train_loss": -11.839917182922363, "global_step": 207148, "epoch": 1233} {"train_loss": -11.64364242553711, "global_step": 207149, "epoch": 1233} {"train_loss": -11.706997871398926, "global_step": 207150, "epoch": 1233} {"train_loss": -11.257009506225586, "global_step": 207151, "epoch": 1233} {"train_loss": -11.536238670349121, "global_step": 207152, "epoch": 1233} {"train_loss": -11.588712692260742, "global_step": 207153, "epoch": 1233} {"train_loss": -11.840953826904297, "global_step": 207154, "epoch": 1233} {"train_loss": -11.78577709197998, "global_step": 207155, "epoch": 1233} {"train_loss": -11.593012809753418, "global_step": 207156, "epoch": 1233} {"train_loss": -11.651617050170898, "global_step": 207157, "epoch": 1233} {"train_loss": -11.615480422973633, "global_step": 207158, "epoch": 1233} {"train_loss": -11.84714126586914, "global_step": 207159, "epoch": 1233} {"train_loss": -11.811546325683594, "global_step": 207160, "epoch": 1233} {"train_loss": -12.061407089233398, "global_step": 207161, "epoch": 1233} {"train_loss": -11.66740608215332, "global_step": 207162, "epoch": 1233} {"train_loss": -11.843633651733398, "global_step": 207163, "epoch": 1233} {"train_loss": -11.918893814086914, "global_step": 207164, "epoch": 1233} {"train_loss": -11.827003479003906, "global_step": 207165, "epoch": 1233} {"train_loss": -11.355464935302734, "global_step": 207166, "epoch": 1233} {"train_loss": -11.79489517211914, "global_step": 207167, "epoch": 1233} {"train_loss": -11.318426132202148, "global_step": 207168, "epoch": 1233} {"train_loss": -11.46723461151123, "global_step": 207169, "epoch": 1233} {"train_loss": -11.40293025970459, "global_step": 207170, "epoch": 1233} {"train_loss": -11.632166862487793, "global_step": 207171, "epoch": 1233} {"train_loss": -11.2894287109375, "global_step": 207172, "epoch": 1233} {"train_loss": -11.408641815185547, "global_step": 207173, "epoch": 1233} {"train_loss": -11.279619216918945, "global_step": 207174, "epoch": 1233} {"train_loss": -11.45906925201416, "global_step": 207175, "epoch": 1233} {"train_loss": -11.109993934631348, "global_step": 207176, "epoch": 1233} {"train_loss": -11.84565544128418, "global_step": 207177, "epoch": 1233} {"train_loss": -10.997858047485352, "global_step": 207178, "epoch": 1233} {"train_loss": -10.922981262207031, "global_step": 207179, "epoch": 1233} {"train_loss": -10.416976928710938, "global_step": 207180, "epoch": 1233} {"train_loss": -9.198685646057129, "global_step": 207181, "epoch": 1233} {"train_loss": -10.549830436706543, "global_step": 207182, "epoch": 1233} {"train_loss": -8.165088653564453, "global_step": 207183, "epoch": 1233} {"train_loss": -9.298728942871094, "global_step": 207184, "epoch": 1233} {"train_loss": -10.410078048706055, "global_step": 207185, "epoch": 1233} {"train_loss": -8.175569534301758, "global_step": 207186, "epoch": 1233} {"train_loss": -9.487149238586426, "global_step": 207187, "epoch": 1233} {"train_loss": -10.725515365600586, "global_step": 207188, "epoch": 1233} {"train_loss": -9.247152328491211, "global_step": 207189, "epoch": 1233} {"train_loss": -9.313521385192871, "global_step": 207190, "epoch": 1233} {"train_loss": -9.951360702514648, "global_step": 207191, "epoch": 1233} {"train_loss": -9.290688514709473, "global_step": 207192, "epoch": 1233} {"train_loss": -9.894424438476562, "global_step": 207193, "epoch": 1233} {"train_loss": -9.504610061645508, "global_step": 207194, "epoch": 1233} {"train_loss": -9.840570449829102, "global_step": 207195, "epoch": 1233} {"train_loss": -10.480978012084961, "global_step": 207196, "epoch": 1233} {"train_loss": -10.900991439819336, "global_step": 207197, "epoch": 1233} {"train_loss": -10.340310096740723, "global_step": 207198, "epoch": 1233} {"train_loss": -10.958502769470215, "global_step": 207199, "epoch": 1233} {"train_loss": -10.09866714477539, "global_step": 207200, "epoch": 1233} {"train_loss": -10.952230453491211, "global_step": 207201, "epoch": 1233} {"train_loss": -10.62087631225586, "global_step": 207202, "epoch": 1233} {"train_loss": -10.56425666809082, "global_step": 207203, "epoch": 1233} {"train_loss": -10.381525039672852, "global_step": 207204, "epoch": 1233} {"train_loss": -10.57532787322998, "global_step": 207205, "epoch": 1233} {"train_loss": -10.314051628112793, "global_step": 207206, "epoch": 1233} {"train_loss": -11.24365234375, "global_step": 207207, "epoch": 1233} {"train_loss": -10.68514633178711, "global_step": 207208, "epoch": 1233} {"train_loss": -10.656036376953125, "global_step": 207209, "epoch": 1233} {"train_loss": -10.85995101928711, "global_step": 207210, "epoch": 1233} {"train_loss": -10.344793319702148, "global_step": 207211, "epoch": 1233} {"train_loss": -11.033456802368164, "global_step": 207212, "epoch": 1233} {"train_loss": -11.024185180664062, "global_step": 207213, "epoch": 1233} {"train_loss": -10.634754180908203, "global_step": 207214, "epoch": 1233} {"train_loss": -11.031381607055664, "global_step": 207215, "epoch": 1233} {"train_loss": -10.96589469909668, "global_step": 207216, "epoch": 1233} {"train_loss": -10.818376541137695, "global_step": 207217, "epoch": 1233} {"train_loss": -11.127041816711426, "global_step": 207218, "epoch": 1233} {"train_loss": -11.12567138671875, "global_step": 207219, "epoch": 1233} {"train_loss": -10.888879776000977, "global_step": 207220, "epoch": 1233} {"train_loss": -11.090892791748047, "global_step": 207221, "epoch": 1233} {"train_loss": -11.330185890197754, "global_step": 207222, "epoch": 1233} {"train_loss": -11.020641326904297, "global_step": 207223, "epoch": 1233} {"train_loss": -11.162023544311523, "global_step": 207224, "epoch": 1233} {"train_loss": -11.265193939208984, "global_step": 207225, "epoch": 1233} {"train_loss": -11.117332458496094, "global_step": 207226, "epoch": 1233} {"train_loss": -11.192252159118652, "global_step": 207227, "epoch": 1233} {"train_loss": -11.446769714355469, "global_step": 207228, "epoch": 1233} {"train_loss": -11.324203491210938, "global_step": 207229, "epoch": 1233} {"train_loss": -11.335479736328125, "global_step": 207230, "epoch": 1233} {"train_loss": -11.288593292236328, "global_step": 207231, "epoch": 1233} {"train_loss": -11.321066856384277, "global_step": 207232, "epoch": 1233} {"train_loss": -11.261219024658203, "global_step": 207233, "epoch": 1233} {"train_loss": -11.241976737976074, "global_step": 207234, "epoch": 1233} {"train_loss": -11.357917785644531, "global_step": 207235, "epoch": 1233} {"train_loss": -11.057685852050781, "global_step": 207236, "epoch": 1233} {"train_loss": -11.468128204345703, "global_step": 207237, "epoch": 1233} {"train_loss": -11.320513725280762, "global_step": 207238, "epoch": 1233} {"train_loss": -11.334606170654297, "global_step": 207239, "epoch": 1233} {"train_loss": -11.308074951171875, "global_step": 207240, "epoch": 1233} {"train_loss": -11.187524795532227, "global_step": 207241, "epoch": 1233} {"train_loss": -11.293987274169922, "global_step": 207242, "epoch": 1233} {"train_loss": -11.246576309204102, "global_step": 207243, "epoch": 1233} {"train_loss": -11.20823860168457, "global_step": 207244, "epoch": 1233} {"train_loss": -11.389947891235352, "global_step": 207245, "epoch": 1233} {"train_loss": -11.396868705749512, "global_step": 207246, "epoch": 1233} {"train_loss": -11.282685279846191, "global_step": 207247, "epoch": 1233} {"train_loss": -11.554094314575195, "global_step": 207248, "epoch": 1233} {"train_loss": -11.318410873413086, "global_step": 207249, "epoch": 1233} {"train_loss": -11.182246208190918, "global_step": 207250, "epoch": 1233} {"train_loss": -11.477972984313965, "global_step": 207251, "epoch": 1233} {"train_loss": -11.481193542480469, "global_step": 207252, "epoch": 1233} {"train_loss": -11.424155235290527, "global_step": 207253, "epoch": 1233} {"train_loss": -11.39812183380127, "global_step": 207254, "epoch": 1233} {"train_loss": -11.603250503540039, "global_step": 207255, "epoch": 1233} {"train_loss": -11.619331359863281, "global_step": 207256, "epoch": 1233} {"train_loss": -11.299602508544922, "global_step": 207257, "epoch": 1233} {"train_loss": -11.291102409362793, "global_step": 207258, "epoch": 1233} {"train_loss": -11.598371505737305, "global_step": 207259, "epoch": 1233} {"train_loss": -11.58755874633789, "global_step": 207260, "epoch": 1233} {"train_loss": -11.594578742980957, "global_step": 207261, "epoch": 1233} {"train_loss": -11.456762313842773, "global_step": 207262, "epoch": 1233} {"train_loss": -11.700678825378418, "global_step": 207263, "epoch": 1233} {"train_loss": -11.477376937866211, "global_step": 207264, "epoch": 1233} {"train_loss": -11.623779296875, "global_step": 207265, "epoch": 1233} {"train_loss": -11.693543434143066, "global_step": 207266, "epoch": 1233} {"train_loss": -11.608206748962402, "global_step": 207267, "epoch": 1233} {"train_loss": -11.696989059448242, "global_step": 207268, "epoch": 1233} {"train_loss": -11.54751968383789, "global_step": 207269, "epoch": 1233} {"train_loss": -11.640300750732422, "global_step": 207270, "epoch": 1233} {"train_loss": -11.679756164550781, "global_step": 207271, "epoch": 1233} {"train_loss": -11.507933616638184, "global_step": 207272, "epoch": 1233} {"train_loss": -11.55239486694336, "global_step": 207273, "epoch": 1233} {"train_loss": -11.732667922973633, "global_step": 207274, "epoch": 1233} {"train_loss": -11.616094589233398, "global_step": 207275, "epoch": 1233} {"train_loss": -11.49193000793457, "global_step": 207276, "epoch": 1233} {"train_loss": -11.720436096191406, "global_step": 207277, "epoch": 1233} {"train_loss": -11.593867301940918, "global_step": 207278, "epoch": 1233} {"train_loss": -11.873485565185547, "global_step": 207279, "epoch": 1233} {"train_loss": -11.667142868041992, "global_step": 207280, "epoch": 1233} {"train_loss": -12.015481948852539, "global_step": 207281, "epoch": 1233} {"train_loss": -11.506467819213867, "global_step": 207282, "epoch": 1233} {"train_loss": -11.786092758178711, "global_step": 207283, "epoch": 1233} {"train_loss": -11.617379188537598, "global_step": 207284, "epoch": 1233} {"train_loss": -11.872940063476562, "global_step": 207285, "epoch": 1233} {"train_loss": -11.796367645263672, "global_step": 207286, "epoch": 1233} {"train_loss": -11.821822166442871, "global_step": 207287, "epoch": 1233} {"train_loss": -11.488405227661133, "global_step": 207288, "epoch": 1233} {"train_loss": -11.69520092010498, "global_step": 207289, "epoch": 1233} {"train_loss": -11.751992225646973, "global_step": 207290, "epoch": 1233} {"train_loss": -11.670880317687988, "global_step": 207291, "epoch": 1233} {"train_loss": -11.858804702758789, "global_step": 207292, "epoch": 1233} {"train_loss": -11.711284637451172, "global_step": 207293, "epoch": 1233} {"train_loss": -11.71307373046875, "global_step": 207294, "epoch": 1233} {"train_loss": -11.665613174438477, "global_step": 207295, "epoch": 1233} {"train_loss": -11.871112823486328, "global_step": 207296, "epoch": 1233} {"train_loss": -11.690760612487793, "global_step": 207297, "epoch": 1233} {"train_loss": -11.795884132385254, "global_step": 207298, "epoch": 1233} {"train_loss": -11.791136741638184, "global_step": 207299, "epoch": 1233} {"train_loss": -11.878517150878906, "global_step": 207300, "epoch": 1233} {"train_loss": -11.714997291564941, "global_step": 207301, "epoch": 1233} {"train_loss": -11.899850845336914, "global_step": 207302, "epoch": 1233} {"train_loss": -11.890303611755371, "global_step": 207303, "epoch": 1233} {"train_loss": -11.838715553283691, "global_step": 207304, "epoch": 1233} {"train_loss": -11.936376571655273, "global_step": 207305, "epoch": 1233} {"train_loss": -11.85507583618164, "global_step": 207306, "epoch": 1233} {"train_loss": -11.608205795288086, "global_step": 207307, "epoch": 1233} {"train_loss": -11.72071361541748, "global_step": 207308, "epoch": 1233} {"train_loss": -11.560247421264648, "global_step": 207309, "epoch": 1233} {"train_loss": -11.457906723022461, "global_step": 207310, "epoch": 1233} {"train_loss": -11.24195274852571, "global_step": 207311, "epoch": 1233, "val_loss": 251424.71875} {"train_loss": -11.432548522949219, "global_step": 207312, "epoch": 1234} {"train_loss": -11.712990760803223, "global_step": 207313, "epoch": 1234} {"train_loss": -11.22041130065918, "global_step": 207314, "epoch": 1234} {"train_loss": -11.446659088134766, "global_step": 207315, "epoch": 1234} {"train_loss": -11.409114837646484, "global_step": 207316, "epoch": 1234} {"train_loss": -11.468399047851562, "global_step": 207317, "epoch": 1234} {"train_loss": -11.161741256713867, "global_step": 207318, "epoch": 1234} {"train_loss": -11.639795303344727, "global_step": 207319, "epoch": 1234} {"train_loss": -11.657560348510742, "global_step": 207320, "epoch": 1234} {"train_loss": -11.578974723815918, "global_step": 207321, "epoch": 1234} {"train_loss": -11.453120231628418, "global_step": 207322, "epoch": 1234} {"train_loss": -11.277416229248047, "global_step": 207323, "epoch": 1234} {"train_loss": -11.416483879089355, "global_step": 207324, "epoch": 1234} {"train_loss": -11.75770378112793, "global_step": 207325, "epoch": 1234} {"train_loss": -11.52835464477539, "global_step": 207326, "epoch": 1234} {"train_loss": -11.80262565612793, "global_step": 207327, "epoch": 1234} {"train_loss": -11.570701599121094, "global_step": 207328, "epoch": 1234} {"train_loss": -11.636280059814453, "global_step": 207329, "epoch": 1234} {"train_loss": -11.518869400024414, "global_step": 207330, "epoch": 1234} {"train_loss": -11.418195724487305, "global_step": 207331, "epoch": 1234} {"train_loss": -11.16856861114502, "global_step": 207332, "epoch": 1234} {"train_loss": -11.715664863586426, "global_step": 207333, "epoch": 1234} {"train_loss": -11.529027938842773, "global_step": 207334, "epoch": 1234} {"train_loss": -11.436986923217773, "global_step": 207335, "epoch": 1234} {"train_loss": -11.135018348693848, "global_step": 207336, "epoch": 1234} {"train_loss": -11.515630722045898, "global_step": 207337, "epoch": 1234} {"train_loss": -11.065226554870605, "global_step": 207338, "epoch": 1234} {"train_loss": -11.588708877563477, "global_step": 207339, "epoch": 1234} {"train_loss": -11.110910415649414, "global_step": 207340, "epoch": 1234} {"train_loss": -11.028433799743652, "global_step": 207341, "epoch": 1234} {"train_loss": -10.640119552612305, "global_step": 207342, "epoch": 1234} {"train_loss": -11.292516708374023, "global_step": 207343, "epoch": 1234} {"train_loss": -9.810465812683105, "global_step": 207344, "epoch": 1234} {"train_loss": -11.721393585205078, "global_step": 207345, "epoch": 1234} {"train_loss": -10.242696762084961, "global_step": 207346, "epoch": 1234} {"train_loss": -10.280227661132812, "global_step": 207347, "epoch": 1234} {"train_loss": -10.037237167358398, "global_step": 207348, "epoch": 1234} {"train_loss": -11.029277801513672, "global_step": 207349, "epoch": 1234} {"train_loss": -9.634563446044922, "global_step": 207350, "epoch": 1234} {"train_loss": -10.80329704284668, "global_step": 207351, "epoch": 1234} {"train_loss": -10.564586639404297, "global_step": 207352, "epoch": 1234} {"train_loss": -10.320545196533203, "global_step": 207353, "epoch": 1234} {"train_loss": -11.171018600463867, "global_step": 207354, "epoch": 1234} {"train_loss": -10.100008010864258, "global_step": 207355, "epoch": 1234} {"train_loss": -11.333429336547852, "global_step": 207356, "epoch": 1234} {"train_loss": -10.301219940185547, "global_step": 207357, "epoch": 1234} {"train_loss": -9.874866485595703, "global_step": 207358, "epoch": 1234} {"train_loss": -10.946463584899902, "global_step": 207359, "epoch": 1234} {"train_loss": -9.927974700927734, "global_step": 207360, "epoch": 1234} {"train_loss": -10.522968292236328, "global_step": 207361, "epoch": 1234} {"train_loss": -9.778934478759766, "global_step": 207362, "epoch": 1234} {"train_loss": -10.866119384765625, "global_step": 207363, "epoch": 1234} {"train_loss": -9.438400268554688, "global_step": 207364, "epoch": 1234} {"train_loss": -11.29812240600586, "global_step": 207365, "epoch": 1234} {"train_loss": -10.289311408996582, "global_step": 207366, "epoch": 1234} {"train_loss": -10.832855224609375, "global_step": 207367, "epoch": 1234} {"train_loss": -9.980241775512695, "global_step": 207368, "epoch": 1234} {"train_loss": -10.625688552856445, "global_step": 207369, "epoch": 1234} {"train_loss": -10.494560241699219, "global_step": 207370, "epoch": 1234} {"train_loss": -11.168779373168945, "global_step": 207371, "epoch": 1234} {"train_loss": -10.49280834197998, "global_step": 207372, "epoch": 1234} {"train_loss": -10.628242492675781, "global_step": 207373, "epoch": 1234} {"train_loss": -11.036759376525879, "global_step": 207374, "epoch": 1234} {"train_loss": -10.680231094360352, "global_step": 207375, "epoch": 1234} {"train_loss": -10.969347953796387, "global_step": 207376, "epoch": 1234} {"train_loss": -10.911256790161133, "global_step": 207377, "epoch": 1234} {"train_loss": -11.229089736938477, "global_step": 207378, "epoch": 1234} {"train_loss": -11.196592330932617, "global_step": 207379, "epoch": 1234} {"train_loss": -10.98658561706543, "global_step": 207380, "epoch": 1234} {"train_loss": -11.175191879272461, "global_step": 207381, "epoch": 1234} {"train_loss": -10.992593765258789, "global_step": 207382, "epoch": 1234} {"train_loss": -11.128993034362793, "global_step": 207383, "epoch": 1234} {"train_loss": -11.319491386413574, "global_step": 207384, "epoch": 1234} {"train_loss": -11.04981517791748, "global_step": 207385, "epoch": 1234} {"train_loss": -11.112831115722656, "global_step": 207386, "epoch": 1234} {"train_loss": -11.473431587219238, "global_step": 207387, "epoch": 1234} {"train_loss": -11.154430389404297, "global_step": 207388, "epoch": 1234} {"train_loss": -11.250334739685059, "global_step": 207389, "epoch": 1234} {"train_loss": -11.239295959472656, "global_step": 207390, "epoch": 1234} {"train_loss": -11.237295150756836, "global_step": 207391, "epoch": 1234} {"train_loss": -11.01046371459961, "global_step": 207392, "epoch": 1234} {"train_loss": -10.922111511230469, "global_step": 207393, "epoch": 1234} {"train_loss": -11.022850036621094, "global_step": 207394, "epoch": 1234} {"train_loss": -11.122076034545898, "global_step": 207395, "epoch": 1234} {"train_loss": -11.025819778442383, "global_step": 207396, "epoch": 1234} {"train_loss": -11.14056396484375, "global_step": 207397, "epoch": 1234} {"train_loss": -11.234354019165039, "global_step": 207398, "epoch": 1234} {"train_loss": -11.327198028564453, "global_step": 207399, "epoch": 1234} {"train_loss": -11.053733825683594, "global_step": 207400, "epoch": 1234} {"train_loss": -11.391584396362305, "global_step": 207401, "epoch": 1234} {"train_loss": -11.45801830291748, "global_step": 207402, "epoch": 1234} {"train_loss": -11.367230415344238, "global_step": 207403, "epoch": 1234} {"train_loss": -11.57791805267334, "global_step": 207404, "epoch": 1234} {"train_loss": -11.384008407592773, "global_step": 207405, "epoch": 1234} {"train_loss": -11.340356826782227, "global_step": 207406, "epoch": 1234} {"train_loss": -11.75197696685791, "global_step": 207407, "epoch": 1234} {"train_loss": -11.567132949829102, "global_step": 207408, "epoch": 1234} {"train_loss": -11.384939193725586, "global_step": 207409, "epoch": 1234} {"train_loss": -11.616342544555664, "global_step": 207410, "epoch": 1234} {"train_loss": -11.468496322631836, "global_step": 207411, "epoch": 1234} {"train_loss": -11.563813209533691, "global_step": 207412, "epoch": 1234} {"train_loss": -11.465372085571289, "global_step": 207413, "epoch": 1234} {"train_loss": -11.545424461364746, "global_step": 207414, "epoch": 1234} {"train_loss": -11.463642120361328, "global_step": 207415, "epoch": 1234} {"train_loss": -11.660205841064453, "global_step": 207416, "epoch": 1234} {"train_loss": -11.729061126708984, "global_step": 207417, "epoch": 1234} {"train_loss": -11.521198272705078, "global_step": 207418, "epoch": 1234} {"train_loss": -11.780628204345703, "global_step": 207419, "epoch": 1234} {"train_loss": -11.757406234741211, "global_step": 207420, "epoch": 1234} {"train_loss": -11.786718368530273, "global_step": 207421, "epoch": 1234} {"train_loss": -11.847034454345703, "global_step": 207422, "epoch": 1234} {"train_loss": -11.663064002990723, "global_step": 207423, "epoch": 1234} {"train_loss": -11.412878036499023, "global_step": 207424, "epoch": 1234} {"train_loss": -11.767073631286621, "global_step": 207425, "epoch": 1234} {"train_loss": -11.517809867858887, "global_step": 207426, "epoch": 1234} {"train_loss": -11.683351516723633, "global_step": 207427, "epoch": 1234} {"train_loss": -11.641305923461914, "global_step": 207428, "epoch": 1234} {"train_loss": -11.447985649108887, "global_step": 207429, "epoch": 1234} {"train_loss": -11.897771835327148, "global_step": 207430, "epoch": 1234} {"train_loss": -11.151381492614746, "global_step": 207431, "epoch": 1234} {"train_loss": -11.3841552734375, "global_step": 207432, "epoch": 1234} {"train_loss": -11.679098129272461, "global_step": 207433, "epoch": 1234} {"train_loss": -11.285416603088379, "global_step": 207434, "epoch": 1234} {"train_loss": -11.381837844848633, "global_step": 207435, "epoch": 1234} {"train_loss": -11.729585647583008, "global_step": 207436, "epoch": 1234} {"train_loss": -11.41014575958252, "global_step": 207437, "epoch": 1234} {"train_loss": -11.382461547851562, "global_step": 207438, "epoch": 1234} {"train_loss": -11.42729377746582, "global_step": 207439, "epoch": 1234} {"train_loss": -10.879104614257812, "global_step": 207440, "epoch": 1234} {"train_loss": -11.533879280090332, "global_step": 207441, "epoch": 1234} {"train_loss": -11.480348587036133, "global_step": 207442, "epoch": 1234} {"train_loss": -10.907149314880371, "global_step": 207443, "epoch": 1234} {"train_loss": -10.987994194030762, "global_step": 207444, "epoch": 1234} {"train_loss": -11.161039352416992, "global_step": 207445, "epoch": 1234} {"train_loss": -9.796316146850586, "global_step": 207446, "epoch": 1234} {"train_loss": -10.277103424072266, "global_step": 207447, "epoch": 1234} {"train_loss": -8.438268661499023, "global_step": 207448, "epoch": 1234} {"train_loss": -10.823265075683594, "global_step": 207449, "epoch": 1234} {"train_loss": -11.12298583984375, "global_step": 207450, "epoch": 1234} {"train_loss": -10.59636402130127, "global_step": 207451, "epoch": 1234} {"train_loss": -10.982258796691895, "global_step": 207452, "epoch": 1234} {"train_loss": -10.02133560180664, "global_step": 207453, "epoch": 1234} {"train_loss": -11.115260124206543, "global_step": 207454, "epoch": 1234} {"train_loss": -10.591279983520508, "global_step": 207455, "epoch": 1234} {"train_loss": -11.049112319946289, "global_step": 207456, "epoch": 1234} {"train_loss": -10.800545692443848, "global_step": 207457, "epoch": 1234} {"train_loss": -10.742523193359375, "global_step": 207458, "epoch": 1234} {"train_loss": -10.781039237976074, "global_step": 207459, "epoch": 1234} {"train_loss": -10.602058410644531, "global_step": 207460, "epoch": 1234} {"train_loss": -10.660579681396484, "global_step": 207461, "epoch": 1234} {"train_loss": -11.165750503540039, "global_step": 207462, "epoch": 1234} {"train_loss": -10.30233383178711, "global_step": 207463, "epoch": 1234} {"train_loss": -11.313095092773438, "global_step": 207464, "epoch": 1234} {"train_loss": -10.845146179199219, "global_step": 207465, "epoch": 1234} {"train_loss": -10.550939559936523, "global_step": 207466, "epoch": 1234} {"train_loss": -11.236967086791992, "global_step": 207467, "epoch": 1234} {"train_loss": -10.683783531188965, "global_step": 207468, "epoch": 1234} {"train_loss": -11.150251388549805, "global_step": 207469, "epoch": 1234} {"train_loss": -11.291184425354004, "global_step": 207470, "epoch": 1234} {"train_loss": -11.393749237060547, "global_step": 207471, "epoch": 1234} {"train_loss": -11.010321617126465, "global_step": 207472, "epoch": 1234} {"train_loss": -11.385644912719727, "global_step": 207473, "epoch": 1234} {"train_loss": -11.19052505493164, "global_step": 207474, "epoch": 1234} {"train_loss": -11.355655670166016, "global_step": 207475, "epoch": 1234} {"train_loss": -11.178704261779785, "global_step": 207476, "epoch": 1234} {"train_loss": -11.400032043457031, "global_step": 207477, "epoch": 1234} {"train_loss": -11.21440601348877, "global_step": 207478, "epoch": 1234} {"train_loss": -11.10418613184066, "global_step": 207479, "epoch": 1234, "val_loss": 252345.484375} {"train_loss": -11.296972274780273, "global_step": 207480, "epoch": 1235} {"train_loss": -11.28350830078125, "global_step": 207481, "epoch": 1235} {"train_loss": -11.329967498779297, "global_step": 207482, "epoch": 1235} {"train_loss": -11.1888427734375, "global_step": 207483, "epoch": 1235} {"train_loss": -11.33365249633789, "global_step": 207484, "epoch": 1235} {"train_loss": -11.119377136230469, "global_step": 207485, "epoch": 1235} {"train_loss": -11.184614181518555, "global_step": 207486, "epoch": 1235} {"train_loss": -11.501070022583008, "global_step": 207487, "epoch": 1235} {"train_loss": -11.142117500305176, "global_step": 207488, "epoch": 1235} {"train_loss": -11.378273010253906, "global_step": 207489, "epoch": 1235} {"train_loss": -11.332498550415039, "global_step": 207490, "epoch": 1235} {"train_loss": -11.30894660949707, "global_step": 207491, "epoch": 1235} {"train_loss": -11.354920387268066, "global_step": 207492, "epoch": 1235} {"train_loss": -11.43467903137207, "global_step": 207493, "epoch": 1235} {"train_loss": -11.462627410888672, "global_step": 207494, "epoch": 1235} {"train_loss": -11.316179275512695, "global_step": 207495, "epoch": 1235} {"train_loss": -11.504209518432617, "global_step": 207496, "epoch": 1235} {"train_loss": -11.435436248779297, "global_step": 207497, "epoch": 1235} {"train_loss": -11.39879035949707, "global_step": 207498, "epoch": 1235} {"train_loss": -11.57703971862793, "global_step": 207499, "epoch": 1235} {"train_loss": -11.412412643432617, "global_step": 207500, "epoch": 1235} {"train_loss": -11.50158405303955, "global_step": 207501, "epoch": 1235} {"train_loss": -11.527933120727539, "global_step": 207502, "epoch": 1235} {"train_loss": -11.695499420166016, "global_step": 207503, "epoch": 1235} {"train_loss": -11.779417037963867, "global_step": 207504, "epoch": 1235} {"train_loss": -11.727265357971191, "global_step": 207505, "epoch": 1235} {"train_loss": -11.475720405578613, "global_step": 207506, "epoch": 1235} {"train_loss": -11.89334487915039, "global_step": 207507, "epoch": 1235} {"train_loss": -11.641456604003906, "global_step": 207508, "epoch": 1235} {"train_loss": -11.425816535949707, "global_step": 207509, "epoch": 1235} {"train_loss": -11.694173812866211, "global_step": 207510, "epoch": 1235} {"train_loss": -11.773452758789062, "global_step": 207511, "epoch": 1235} {"train_loss": -11.71879768371582, "global_step": 207512, "epoch": 1235} {"train_loss": -11.661712646484375, "global_step": 207513, "epoch": 1235} {"train_loss": -11.813164710998535, "global_step": 207514, "epoch": 1235} {"train_loss": -11.815702438354492, "global_step": 207515, "epoch": 1235} {"train_loss": -11.90255069732666, "global_step": 207516, "epoch": 1235} {"train_loss": -11.818218231201172, "global_step": 207517, "epoch": 1235} {"train_loss": -11.849761009216309, "global_step": 207518, "epoch": 1235} {"train_loss": -11.5712251663208, "global_step": 207519, "epoch": 1235} {"train_loss": -11.851826667785645, "global_step": 207520, "epoch": 1235} {"train_loss": -11.911041259765625, "global_step": 207521, "epoch": 1235} {"train_loss": -11.767148971557617, "global_step": 207522, "epoch": 1235} {"train_loss": -11.647465705871582, "global_step": 207523, "epoch": 1235} {"train_loss": -11.889719009399414, "global_step": 207524, "epoch": 1235} {"train_loss": -11.70004653930664, "global_step": 207525, "epoch": 1235} {"train_loss": -11.801782608032227, "global_step": 207526, "epoch": 1235} {"train_loss": -11.759472846984863, "global_step": 207527, "epoch": 1235} {"train_loss": -11.643288612365723, "global_step": 207528, "epoch": 1235} {"train_loss": -11.6995210647583, "global_step": 207529, "epoch": 1235} {"train_loss": -11.635635375976562, "global_step": 207530, "epoch": 1235} {"train_loss": -11.686239242553711, "global_step": 207531, "epoch": 1235} {"train_loss": -11.578167915344238, "global_step": 207532, "epoch": 1235} {"train_loss": -11.374404907226562, "global_step": 207533, "epoch": 1235} {"train_loss": -10.7874755859375, "global_step": 207534, "epoch": 1235} {"train_loss": -10.771299362182617, "global_step": 207535, "epoch": 1235} {"train_loss": -11.324119567871094, "global_step": 207536, "epoch": 1235} {"train_loss": -11.414505004882812, "global_step": 207537, "epoch": 1235} {"train_loss": -11.178407669067383, "global_step": 207538, "epoch": 1235} {"train_loss": -10.784954071044922, "global_step": 207539, "epoch": 1235} {"train_loss": -11.41150188446045, "global_step": 207540, "epoch": 1235} {"train_loss": -11.430997848510742, "global_step": 207541, "epoch": 1235} {"train_loss": -10.962203025817871, "global_step": 207542, "epoch": 1235} {"train_loss": -11.075751304626465, "global_step": 207543, "epoch": 1235} {"train_loss": -11.656587600708008, "global_step": 207544, "epoch": 1235} {"train_loss": -10.677180290222168, "global_step": 207545, "epoch": 1235} {"train_loss": -10.102272987365723, "global_step": 207546, "epoch": 1235} {"train_loss": -11.314743995666504, "global_step": 207547, "epoch": 1235} {"train_loss": -10.988659858703613, "global_step": 207548, "epoch": 1235} {"train_loss": -10.253180503845215, "global_step": 207549, "epoch": 1235} {"train_loss": -11.14307975769043, "global_step": 207550, "epoch": 1235} {"train_loss": -10.54541015625, "global_step": 207551, "epoch": 1235} {"train_loss": -10.62191390991211, "global_step": 207552, "epoch": 1235} {"train_loss": -10.90749740600586, "global_step": 207553, "epoch": 1235} {"train_loss": -10.773263931274414, "global_step": 207554, "epoch": 1235} {"train_loss": -11.117969512939453, "global_step": 207555, "epoch": 1235} {"train_loss": -11.077859878540039, "global_step": 207556, "epoch": 1235} {"train_loss": -11.20109748840332, "global_step": 207557, "epoch": 1235} {"train_loss": -10.745088577270508, "global_step": 207558, "epoch": 1235} {"train_loss": -11.153190612792969, "global_step": 207559, "epoch": 1235} {"train_loss": -11.304729461669922, "global_step": 207560, "epoch": 1235} {"train_loss": -11.170938491821289, "global_step": 207561, "epoch": 1235} {"train_loss": -10.821508407592773, "global_step": 207562, "epoch": 1235} {"train_loss": -11.562082290649414, "global_step": 207563, "epoch": 1235} {"train_loss": -10.704469680786133, "global_step": 207564, "epoch": 1235} {"train_loss": -11.188224792480469, "global_step": 207565, "epoch": 1235} {"train_loss": -10.74104118347168, "global_step": 207566, "epoch": 1235} {"train_loss": -10.563669204711914, "global_step": 207567, "epoch": 1235} {"train_loss": -10.911581039428711, "global_step": 207568, "epoch": 1235} {"train_loss": -10.721379280090332, "global_step": 207569, "epoch": 1235} {"train_loss": -10.969643592834473, "global_step": 207570, "epoch": 1235} {"train_loss": -11.112007141113281, "global_step": 207571, "epoch": 1235} {"train_loss": -11.285013198852539, "global_step": 207572, "epoch": 1235} {"train_loss": -11.459468841552734, "global_step": 207573, "epoch": 1235} {"train_loss": -11.33159065246582, "global_step": 207574, "epoch": 1235} {"train_loss": -11.548500061035156, "global_step": 207575, "epoch": 1235} {"train_loss": -11.137466430664062, "global_step": 207576, "epoch": 1235} {"train_loss": -11.546611785888672, "global_step": 207577, "epoch": 1235} {"train_loss": -11.529986381530762, "global_step": 207578, "epoch": 1235} {"train_loss": -11.123769760131836, "global_step": 207579, "epoch": 1235} {"train_loss": -11.308906555175781, "global_step": 207580, "epoch": 1235} {"train_loss": -11.158535957336426, "global_step": 207581, "epoch": 1235} {"train_loss": -11.550929069519043, "global_step": 207582, "epoch": 1235} {"train_loss": -11.32876968383789, "global_step": 207583, "epoch": 1235} {"train_loss": -11.04128360748291, "global_step": 207584, "epoch": 1235} {"train_loss": -11.398448944091797, "global_step": 207585, "epoch": 1235} {"train_loss": -11.076459884643555, "global_step": 207586, "epoch": 1235} {"train_loss": -11.508841514587402, "global_step": 207587, "epoch": 1235} {"train_loss": -11.442154884338379, "global_step": 207588, "epoch": 1235} {"train_loss": -11.630029678344727, "global_step": 207589, "epoch": 1235} {"train_loss": -11.339600563049316, "global_step": 207590, "epoch": 1235} {"train_loss": -11.497179985046387, "global_step": 207591, "epoch": 1235} {"train_loss": -11.304449081420898, "global_step": 207592, "epoch": 1235} {"train_loss": -11.547344207763672, "global_step": 207593, "epoch": 1235} {"train_loss": -11.647140502929688, "global_step": 207594, "epoch": 1235} {"train_loss": -11.154854774475098, "global_step": 207595, "epoch": 1235} {"train_loss": -11.699384689331055, "global_step": 207596, "epoch": 1235} {"train_loss": -11.573807716369629, "global_step": 207597, "epoch": 1235} {"train_loss": -11.525636672973633, "global_step": 207598, "epoch": 1235} {"train_loss": -11.808489799499512, "global_step": 207599, "epoch": 1235} {"train_loss": -11.535305976867676, "global_step": 207600, "epoch": 1235} {"train_loss": -11.763166427612305, "global_step": 207601, "epoch": 1235} {"train_loss": -11.281000137329102, "global_step": 207602, "epoch": 1235} {"train_loss": -11.174759864807129, "global_step": 207603, "epoch": 1235} {"train_loss": -11.433307647705078, "global_step": 207604, "epoch": 1235} {"train_loss": -11.295454978942871, "global_step": 207605, "epoch": 1235} {"train_loss": -11.711782455444336, "global_step": 207606, "epoch": 1235} {"train_loss": -11.612861633300781, "global_step": 207607, "epoch": 1235} {"train_loss": -11.467208862304688, "global_step": 207608, "epoch": 1235} {"train_loss": -11.655144691467285, "global_step": 207609, "epoch": 1235} {"train_loss": -11.38990592956543, "global_step": 207610, "epoch": 1235} {"train_loss": -11.419272422790527, "global_step": 207611, "epoch": 1235} {"train_loss": -11.4700927734375, "global_step": 207612, "epoch": 1235} {"train_loss": -11.490389823913574, "global_step": 207613, "epoch": 1235} {"train_loss": -11.653890609741211, "global_step": 207614, "epoch": 1235} {"train_loss": -11.568206787109375, "global_step": 207615, "epoch": 1235} {"train_loss": -11.642522811889648, "global_step": 207616, "epoch": 1235} {"train_loss": -11.519180297851562, "global_step": 207617, "epoch": 1235} {"train_loss": -11.766805648803711, "global_step": 207618, "epoch": 1235} {"train_loss": -11.570839881896973, "global_step": 207619, "epoch": 1235} {"train_loss": -11.432144165039062, "global_step": 207620, "epoch": 1235} {"train_loss": -11.470235824584961, "global_step": 207621, "epoch": 1235} {"train_loss": -11.458402633666992, "global_step": 207622, "epoch": 1235} {"train_loss": -11.859542846679688, "global_step": 207623, "epoch": 1235} {"train_loss": -11.61123275756836, "global_step": 207624, "epoch": 1235} {"train_loss": -11.635684967041016, "global_step": 207625, "epoch": 1235} {"train_loss": -11.61910629272461, "global_step": 207626, "epoch": 1235} {"train_loss": -11.835162162780762, "global_step": 207627, "epoch": 1235} {"train_loss": -11.768402099609375, "global_step": 207628, "epoch": 1235} {"train_loss": -11.566423416137695, "global_step": 207629, "epoch": 1235} {"train_loss": -11.276603698730469, "global_step": 207630, "epoch": 1235} {"train_loss": -11.829652786254883, "global_step": 207631, "epoch": 1235} {"train_loss": -11.715885162353516, "global_step": 207632, "epoch": 1235} {"train_loss": -11.700407028198242, "global_step": 207633, "epoch": 1235} {"train_loss": -11.24749755859375, "global_step": 207634, "epoch": 1235} {"train_loss": -11.555416107177734, "global_step": 207635, "epoch": 1235} {"train_loss": -11.670503616333008, "global_step": 207636, "epoch": 1235} {"train_loss": -10.968149185180664, "global_step": 207637, "epoch": 1235} {"train_loss": -11.087872505187988, "global_step": 207638, "epoch": 1235} {"train_loss": -11.59766960144043, "global_step": 207639, "epoch": 1235} {"train_loss": -11.602293968200684, "global_step": 207640, "epoch": 1235} {"train_loss": -11.222824096679688, "global_step": 207641, "epoch": 1235} {"train_loss": -11.431804656982422, "global_step": 207642, "epoch": 1235} {"train_loss": -10.835113525390625, "global_step": 207643, "epoch": 1235} {"train_loss": -11.62736701965332, "global_step": 207644, "epoch": 1235} {"train_loss": -11.580269813537598, "global_step": 207645, "epoch": 1235} {"train_loss": -11.620816230773926, "global_step": 207646, "epoch": 1235} {"train_loss": -11.392574327332634, "global_step": 207647, "epoch": 1235, "val_loss": 253437.921875, "train_action_mse_error": 1.6747188568115234} {"train_loss": -11.449077606201172, "global_step": 207648, "epoch": 1236} {"train_loss": -11.822883605957031, "global_step": 207649, "epoch": 1236} {"train_loss": -11.365147590637207, "global_step": 207650, "epoch": 1236} {"train_loss": -11.23704719543457, "global_step": 207651, "epoch": 1236} {"train_loss": -10.917354583740234, "global_step": 207652, "epoch": 1236} {"train_loss": -11.810013771057129, "global_step": 207653, "epoch": 1236} {"train_loss": -11.366998672485352, "global_step": 207654, "epoch": 1236} {"train_loss": -11.005691528320312, "global_step": 207655, "epoch": 1236} {"train_loss": -11.20983600616455, "global_step": 207656, "epoch": 1236} {"train_loss": -11.33009147644043, "global_step": 207657, "epoch": 1236} {"train_loss": -10.379180908203125, "global_step": 207658, "epoch": 1236} {"train_loss": -11.447893142700195, "global_step": 207659, "epoch": 1236} {"train_loss": -10.954215049743652, "global_step": 207660, "epoch": 1236} {"train_loss": -11.023849487304688, "global_step": 207661, "epoch": 1236} {"train_loss": -10.934243202209473, "global_step": 207662, "epoch": 1236} {"train_loss": -10.924398422241211, "global_step": 207663, "epoch": 1236} {"train_loss": -11.132257461547852, "global_step": 207664, "epoch": 1236} {"train_loss": -11.117979049682617, "global_step": 207665, "epoch": 1236} {"train_loss": -11.017901420593262, "global_step": 207666, "epoch": 1236} {"train_loss": -11.317680358886719, "global_step": 207667, "epoch": 1236} {"train_loss": -11.03630256652832, "global_step": 207668, "epoch": 1236} {"train_loss": -11.36830997467041, "global_step": 207669, "epoch": 1236} {"train_loss": -11.433244705200195, "global_step": 207670, "epoch": 1236} {"train_loss": -11.012195587158203, "global_step": 207671, "epoch": 1236} {"train_loss": -11.216022491455078, "global_step": 207672, "epoch": 1236} {"train_loss": -11.403848648071289, "global_step": 207673, "epoch": 1236} {"train_loss": -11.311882019042969, "global_step": 207674, "epoch": 1236} {"train_loss": -11.49521255493164, "global_step": 207675, "epoch": 1236} {"train_loss": -11.462998390197754, "global_step": 207676, "epoch": 1236} {"train_loss": -11.66327953338623, "global_step": 207677, "epoch": 1236} {"train_loss": -11.160496711730957, "global_step": 207678, "epoch": 1236} {"train_loss": -11.48642349243164, "global_step": 207679, "epoch": 1236} {"train_loss": -11.48502254486084, "global_step": 207680, "epoch": 1236} {"train_loss": -11.551939010620117, "global_step": 207681, "epoch": 1236} {"train_loss": -11.438024520874023, "global_step": 207682, "epoch": 1236} {"train_loss": -11.272638320922852, "global_step": 207683, "epoch": 1236} {"train_loss": -11.197246551513672, "global_step": 207684, "epoch": 1236} {"train_loss": -11.53371810913086, "global_step": 207685, "epoch": 1236} {"train_loss": -11.440056800842285, "global_step": 207686, "epoch": 1236} {"train_loss": -11.1510648727417, "global_step": 207687, "epoch": 1236} {"train_loss": -11.465985298156738, "global_step": 207688, "epoch": 1236} {"train_loss": -11.381512641906738, "global_step": 207689, "epoch": 1236} {"train_loss": -11.257862091064453, "global_step": 207690, "epoch": 1236} {"train_loss": -11.59027099609375, "global_step": 207691, "epoch": 1236} {"train_loss": -11.543362617492676, "global_step": 207692, "epoch": 1236} {"train_loss": -11.609784126281738, "global_step": 207693, "epoch": 1236} {"train_loss": -11.74346923828125, "global_step": 207694, "epoch": 1236} {"train_loss": -11.79806137084961, "global_step": 207695, "epoch": 1236} {"train_loss": -11.547209739685059, "global_step": 207696, "epoch": 1236} {"train_loss": -11.636638641357422, "global_step": 207697, "epoch": 1236} {"train_loss": -11.43010139465332, "global_step": 207698, "epoch": 1236} {"train_loss": -11.574808120727539, "global_step": 207699, "epoch": 1236} {"train_loss": -11.750703811645508, "global_step": 207700, "epoch": 1236} {"train_loss": -11.463501930236816, "global_step": 207701, "epoch": 1236} {"train_loss": -11.550895690917969, "global_step": 207702, "epoch": 1236} {"train_loss": -11.550517082214355, "global_step": 207703, "epoch": 1236} {"train_loss": -11.295072555541992, "global_step": 207704, "epoch": 1236} {"train_loss": -11.667486190795898, "global_step": 207705, "epoch": 1236} {"train_loss": -11.58542537689209, "global_step": 207706, "epoch": 1236} {"train_loss": -11.510128021240234, "global_step": 207707, "epoch": 1236} {"train_loss": -11.590967178344727, "global_step": 207708, "epoch": 1236} {"train_loss": -11.697874069213867, "global_step": 207709, "epoch": 1236} {"train_loss": -11.343387603759766, "global_step": 207710, "epoch": 1236} {"train_loss": -11.282722473144531, "global_step": 207711, "epoch": 1236} {"train_loss": -10.580031394958496, "global_step": 207712, "epoch": 1236} {"train_loss": -11.258018493652344, "global_step": 207713, "epoch": 1236} {"train_loss": -10.157503128051758, "global_step": 207714, "epoch": 1236} {"train_loss": -10.250200271606445, "global_step": 207715, "epoch": 1236} {"train_loss": -10.366931915283203, "global_step": 207716, "epoch": 1236} {"train_loss": -10.935644149780273, "global_step": 207717, "epoch": 1236} {"train_loss": -10.45573902130127, "global_step": 207718, "epoch": 1236} {"train_loss": -10.178720474243164, "global_step": 207719, "epoch": 1236} {"train_loss": -11.241870880126953, "global_step": 207720, "epoch": 1236} {"train_loss": -9.945608139038086, "global_step": 207721, "epoch": 1236} {"train_loss": -11.237159729003906, "global_step": 207722, "epoch": 1236} {"train_loss": -9.855672836303711, "global_step": 207723, "epoch": 1236} {"train_loss": -11.078951835632324, "global_step": 207724, "epoch": 1236} {"train_loss": -10.2780179977417, "global_step": 207725, "epoch": 1236} {"train_loss": -10.910009384155273, "global_step": 207726, "epoch": 1236} {"train_loss": -11.059203147888184, "global_step": 207727, "epoch": 1236} {"train_loss": -10.711509704589844, "global_step": 207728, "epoch": 1236} {"train_loss": -10.174654960632324, "global_step": 207729, "epoch": 1236} {"train_loss": -11.215703964233398, "global_step": 207730, "epoch": 1236} {"train_loss": -10.484689712524414, "global_step": 207731, "epoch": 1236} {"train_loss": -11.4893798828125, "global_step": 207732, "epoch": 1236} {"train_loss": -11.075660705566406, "global_step": 207733, "epoch": 1236} {"train_loss": -10.943878173828125, "global_step": 207734, "epoch": 1236} {"train_loss": -10.775592803955078, "global_step": 207735, "epoch": 1236} {"train_loss": -11.064120292663574, "global_step": 207736, "epoch": 1236} {"train_loss": -10.755863189697266, "global_step": 207737, "epoch": 1236} {"train_loss": -11.471768379211426, "global_step": 207738, "epoch": 1236} {"train_loss": -11.021835327148438, "global_step": 207739, "epoch": 1236} {"train_loss": -11.518845558166504, "global_step": 207740, "epoch": 1236} {"train_loss": -11.186576843261719, "global_step": 207741, "epoch": 1236} {"train_loss": -11.077729225158691, "global_step": 207742, "epoch": 1236} {"train_loss": -11.142491340637207, "global_step": 207743, "epoch": 1236} {"train_loss": -11.219523429870605, "global_step": 207744, "epoch": 1236} {"train_loss": -11.192192077636719, "global_step": 207745, "epoch": 1236} {"train_loss": -11.432489395141602, "global_step": 207746, "epoch": 1236} {"train_loss": -11.202454566955566, "global_step": 207747, "epoch": 1236} {"train_loss": -11.280476570129395, "global_step": 207748, "epoch": 1236} {"train_loss": -11.231525421142578, "global_step": 207749, "epoch": 1236} {"train_loss": -11.383283615112305, "global_step": 207750, "epoch": 1236} {"train_loss": -11.151315689086914, "global_step": 207751, "epoch": 1236} {"train_loss": -11.326937675476074, "global_step": 207752, "epoch": 1236} {"train_loss": -11.464780807495117, "global_step": 207753, "epoch": 1236} {"train_loss": -11.712597846984863, "global_step": 207754, "epoch": 1236} {"train_loss": -11.646551132202148, "global_step": 207755, "epoch": 1236} {"train_loss": -11.358467102050781, "global_step": 207756, "epoch": 1236} {"train_loss": -11.340006828308105, "global_step": 207757, "epoch": 1236} {"train_loss": -11.430710792541504, "global_step": 207758, "epoch": 1236} {"train_loss": -11.666313171386719, "global_step": 207759, "epoch": 1236} {"train_loss": -11.660581588745117, "global_step": 207760, "epoch": 1236} {"train_loss": -11.508968353271484, "global_step": 207761, "epoch": 1236} {"train_loss": -11.615781784057617, "global_step": 207762, "epoch": 1236} {"train_loss": -11.403848648071289, "global_step": 207763, "epoch": 1236} {"train_loss": -11.557849884033203, "global_step": 207764, "epoch": 1236} {"train_loss": -11.702628135681152, "global_step": 207765, "epoch": 1236} {"train_loss": -11.776365280151367, "global_step": 207766, "epoch": 1236} {"train_loss": -11.724015235900879, "global_step": 207767, "epoch": 1236} {"train_loss": -11.64395809173584, "global_step": 207768, "epoch": 1236} {"train_loss": -11.759013175964355, "global_step": 207769, "epoch": 1236} {"train_loss": -11.687423706054688, "global_step": 207770, "epoch": 1236} {"train_loss": -11.742542266845703, "global_step": 207771, "epoch": 1236} {"train_loss": -11.923476219177246, "global_step": 207772, "epoch": 1236} {"train_loss": -11.749387741088867, "global_step": 207773, "epoch": 1236} {"train_loss": -11.754592895507812, "global_step": 207774, "epoch": 1236} {"train_loss": -11.73906135559082, "global_step": 207775, "epoch": 1236} {"train_loss": -11.58985710144043, "global_step": 207776, "epoch": 1236} {"train_loss": -11.871330261230469, "global_step": 207777, "epoch": 1236} {"train_loss": -11.556657791137695, "global_step": 207778, "epoch": 1236} {"train_loss": -11.892232894897461, "global_step": 207779, "epoch": 1236} {"train_loss": -11.952898025512695, "global_step": 207780, "epoch": 1236} {"train_loss": -11.688987731933594, "global_step": 207781, "epoch": 1236} {"train_loss": -11.79904842376709, "global_step": 207782, "epoch": 1236} {"train_loss": -11.849706649780273, "global_step": 207783, "epoch": 1236} {"train_loss": -11.926687240600586, "global_step": 207784, "epoch": 1236} {"train_loss": -11.885980606079102, "global_step": 207785, "epoch": 1236} {"train_loss": -11.638728141784668, "global_step": 207786, "epoch": 1236} {"train_loss": -11.775853157043457, "global_step": 207787, "epoch": 1236} {"train_loss": -11.643754959106445, "global_step": 207788, "epoch": 1236} {"train_loss": -11.861764907836914, "global_step": 207789, "epoch": 1236} {"train_loss": -11.399917602539062, "global_step": 207790, "epoch": 1236} {"train_loss": -11.175125122070312, "global_step": 207791, "epoch": 1236} {"train_loss": -10.58560848236084, "global_step": 207792, "epoch": 1236} {"train_loss": -10.498878479003906, "global_step": 207793, "epoch": 1236} {"train_loss": -11.299065589904785, "global_step": 207794, "epoch": 1236} {"train_loss": -11.170025825500488, "global_step": 207795, "epoch": 1236} {"train_loss": -11.010092735290527, "global_step": 207796, "epoch": 1236} {"train_loss": -11.097921371459961, "global_step": 207797, "epoch": 1236} {"train_loss": -11.201099395751953, "global_step": 207798, "epoch": 1236} {"train_loss": -11.244050979614258, "global_step": 207799, "epoch": 1236} {"train_loss": -11.47176456451416, "global_step": 207800, "epoch": 1236} {"train_loss": -11.514019012451172, "global_step": 207801, "epoch": 1236} {"train_loss": -10.556891441345215, "global_step": 207802, "epoch": 1236} {"train_loss": -10.910845756530762, "global_step": 207803, "epoch": 1236} {"train_loss": -11.338212966918945, "global_step": 207804, "epoch": 1236} {"train_loss": -11.386245727539062, "global_step": 207805, "epoch": 1236} {"train_loss": -11.302074432373047, "global_step": 207806, "epoch": 1236} {"train_loss": -11.37301254272461, "global_step": 207807, "epoch": 1236} {"train_loss": -11.432552337646484, "global_step": 207808, "epoch": 1236} {"train_loss": -11.089096069335938, "global_step": 207809, "epoch": 1236} {"train_loss": -11.441814422607422, "global_step": 207810, "epoch": 1236} {"train_loss": -11.052207946777344, "global_step": 207811, "epoch": 1236} {"train_loss": -10.465333938598633, "global_step": 207812, "epoch": 1236} {"train_loss": -11.355293273925781, "global_step": 207813, "epoch": 1236} {"train_loss": -10.99539566040039, "global_step": 207814, "epoch": 1236} {"train_loss": -11.290955861409506, "global_step": 207815, "epoch": 1236, "val_loss": 256874.453125} {"train_loss": -11.262985229492188, "global_step": 207816, "epoch": 1237} {"train_loss": -11.2913818359375, "global_step": 207817, "epoch": 1237} {"train_loss": -11.328752517700195, "global_step": 207818, "epoch": 1237} {"train_loss": -11.232178688049316, "global_step": 207819, "epoch": 1237} {"train_loss": -11.314932823181152, "global_step": 207820, "epoch": 1237} {"train_loss": -11.138689994812012, "global_step": 207821, "epoch": 1237} {"train_loss": -11.209220886230469, "global_step": 207822, "epoch": 1237} {"train_loss": -11.488479614257812, "global_step": 207823, "epoch": 1237} {"train_loss": -11.432024002075195, "global_step": 207824, "epoch": 1237} {"train_loss": -11.315605163574219, "global_step": 207825, "epoch": 1237} {"train_loss": -11.482406616210938, "global_step": 207826, "epoch": 1237} {"train_loss": -11.175597190856934, "global_step": 207827, "epoch": 1237} {"train_loss": -11.488399505615234, "global_step": 207828, "epoch": 1237} {"train_loss": -11.185628890991211, "global_step": 207829, "epoch": 1237} {"train_loss": -11.319644927978516, "global_step": 207830, "epoch": 1237} {"train_loss": -10.808656692504883, "global_step": 207831, "epoch": 1237} {"train_loss": -10.37161636352539, "global_step": 207832, "epoch": 1237} {"train_loss": -11.387545585632324, "global_step": 207833, "epoch": 1237} {"train_loss": -10.470071792602539, "global_step": 207834, "epoch": 1237} {"train_loss": -11.272911071777344, "global_step": 207835, "epoch": 1237} {"train_loss": -10.64983081817627, "global_step": 207836, "epoch": 1237} {"train_loss": -11.082273483276367, "global_step": 207837, "epoch": 1237} {"train_loss": -11.274659156799316, "global_step": 207838, "epoch": 1237} {"train_loss": -10.47847843170166, "global_step": 207839, "epoch": 1237} {"train_loss": -11.286478042602539, "global_step": 207840, "epoch": 1237} {"train_loss": -11.023853302001953, "global_step": 207841, "epoch": 1237} {"train_loss": -11.251481056213379, "global_step": 207842, "epoch": 1237} {"train_loss": -10.393796920776367, "global_step": 207843, "epoch": 1237} {"train_loss": -11.224488258361816, "global_step": 207844, "epoch": 1237} {"train_loss": -10.90433406829834, "global_step": 207845, "epoch": 1237} {"train_loss": -11.25183391571045, "global_step": 207846, "epoch": 1237} {"train_loss": -10.870945930480957, "global_step": 207847, "epoch": 1237} {"train_loss": -10.75408935546875, "global_step": 207848, "epoch": 1237} {"train_loss": -11.131631851196289, "global_step": 207849, "epoch": 1237} {"train_loss": -10.165339469909668, "global_step": 207850, "epoch": 1237} {"train_loss": -11.056888580322266, "global_step": 207851, "epoch": 1237} {"train_loss": -10.554216384887695, "global_step": 207852, "epoch": 1237} {"train_loss": -11.007030487060547, "global_step": 207853, "epoch": 1237} {"train_loss": -10.638116836547852, "global_step": 207854, "epoch": 1237} {"train_loss": -11.25423526763916, "global_step": 207855, "epoch": 1237} {"train_loss": -10.995599746704102, "global_step": 207856, "epoch": 1237} {"train_loss": -11.302593231201172, "global_step": 207857, "epoch": 1237} {"train_loss": -11.332986831665039, "global_step": 207858, "epoch": 1237} {"train_loss": -11.222759246826172, "global_step": 207859, "epoch": 1237} {"train_loss": -11.39109992980957, "global_step": 207860, "epoch": 1237} {"train_loss": -11.18528938293457, "global_step": 207861, "epoch": 1237} {"train_loss": -11.218971252441406, "global_step": 207862, "epoch": 1237} {"train_loss": -11.298171043395996, "global_step": 207863, "epoch": 1237} {"train_loss": -11.406818389892578, "global_step": 207864, "epoch": 1237} {"train_loss": -11.461705207824707, "global_step": 207865, "epoch": 1237} {"train_loss": -11.215736389160156, "global_step": 207866, "epoch": 1237} {"train_loss": -11.346649169921875, "global_step": 207867, "epoch": 1237} {"train_loss": -11.02004623413086, "global_step": 207868, "epoch": 1237} {"train_loss": -11.085562705993652, "global_step": 207869, "epoch": 1237} {"train_loss": -11.448888778686523, "global_step": 207870, "epoch": 1237} {"train_loss": -11.407958984375, "global_step": 207871, "epoch": 1237} {"train_loss": -11.34168815612793, "global_step": 207872, "epoch": 1237} {"train_loss": -11.261893272399902, "global_step": 207873, "epoch": 1237} {"train_loss": -11.515336990356445, "global_step": 207874, "epoch": 1237} {"train_loss": -11.640789985656738, "global_step": 207875, "epoch": 1237} {"train_loss": -11.61561107635498, "global_step": 207876, "epoch": 1237} {"train_loss": -11.161515235900879, "global_step": 207877, "epoch": 1237} {"train_loss": -11.509519577026367, "global_step": 207878, "epoch": 1237} {"train_loss": -11.562005996704102, "global_step": 207879, "epoch": 1237} {"train_loss": -11.479682922363281, "global_step": 207880, "epoch": 1237} {"train_loss": -11.63949966430664, "global_step": 207881, "epoch": 1237} {"train_loss": -11.649864196777344, "global_step": 207882, "epoch": 1237} {"train_loss": -11.445058822631836, "global_step": 207883, "epoch": 1237} {"train_loss": -11.3807373046875, "global_step": 207884, "epoch": 1237} {"train_loss": -11.502033233642578, "global_step": 207885, "epoch": 1237} {"train_loss": -11.599408149719238, "global_step": 207886, "epoch": 1237} {"train_loss": -11.45966911315918, "global_step": 207887, "epoch": 1237} {"train_loss": -11.775310516357422, "global_step": 207888, "epoch": 1237} {"train_loss": -11.501180648803711, "global_step": 207889, "epoch": 1237} {"train_loss": -11.445260047912598, "global_step": 207890, "epoch": 1237} {"train_loss": -11.405889511108398, "global_step": 207891, "epoch": 1237} {"train_loss": -11.876890182495117, "global_step": 207892, "epoch": 1237} {"train_loss": -11.66514778137207, "global_step": 207893, "epoch": 1237} {"train_loss": -11.75776481628418, "global_step": 207894, "epoch": 1237} {"train_loss": -11.711068153381348, "global_step": 207895, "epoch": 1237} {"train_loss": -11.556964874267578, "global_step": 207896, "epoch": 1237} {"train_loss": -11.555803298950195, "global_step": 207897, "epoch": 1237} {"train_loss": -11.847491264343262, "global_step": 207898, "epoch": 1237} {"train_loss": -11.930663108825684, "global_step": 207899, "epoch": 1237} {"train_loss": -11.607139587402344, "global_step": 207900, "epoch": 1237} {"train_loss": -11.646307945251465, "global_step": 207901, "epoch": 1237} {"train_loss": -11.870107650756836, "global_step": 207902, "epoch": 1237} {"train_loss": -11.713401794433594, "global_step": 207903, "epoch": 1237} {"train_loss": -11.678695678710938, "global_step": 207904, "epoch": 1237} {"train_loss": -12.01304817199707, "global_step": 207905, "epoch": 1237} {"train_loss": -11.728404998779297, "global_step": 207906, "epoch": 1237} {"train_loss": -11.84807300567627, "global_step": 207907, "epoch": 1237} {"train_loss": -11.836946487426758, "global_step": 207908, "epoch": 1237} {"train_loss": -11.790088653564453, "global_step": 207909, "epoch": 1237} {"train_loss": -11.775535583496094, "global_step": 207910, "epoch": 1237} {"train_loss": -11.500348091125488, "global_step": 207911, "epoch": 1237} {"train_loss": -11.609192848205566, "global_step": 207912, "epoch": 1237} {"train_loss": -10.969661712646484, "global_step": 207913, "epoch": 1237} {"train_loss": -11.337923049926758, "global_step": 207914, "epoch": 1237} {"train_loss": -11.388093948364258, "global_step": 207915, "epoch": 1237} {"train_loss": -11.331533432006836, "global_step": 207916, "epoch": 1237} {"train_loss": -11.615537643432617, "global_step": 207917, "epoch": 1237} {"train_loss": -11.291011810302734, "global_step": 207918, "epoch": 1237} {"train_loss": -11.067269325256348, "global_step": 207919, "epoch": 1237} {"train_loss": -10.916593551635742, "global_step": 207920, "epoch": 1237} {"train_loss": -10.059967994689941, "global_step": 207921, "epoch": 1237} {"train_loss": -10.984601974487305, "global_step": 207922, "epoch": 1237} {"train_loss": -11.132547378540039, "global_step": 207923, "epoch": 1237} {"train_loss": -11.523046493530273, "global_step": 207924, "epoch": 1237} {"train_loss": -10.754926681518555, "global_step": 207925, "epoch": 1237} {"train_loss": -11.543726921081543, "global_step": 207926, "epoch": 1237} {"train_loss": -10.908872604370117, "global_step": 207927, "epoch": 1237} {"train_loss": -11.376766204833984, "global_step": 207928, "epoch": 1237} {"train_loss": -11.418370246887207, "global_step": 207929, "epoch": 1237} {"train_loss": -11.49052906036377, "global_step": 207930, "epoch": 1237} {"train_loss": -11.112665176391602, "global_step": 207931, "epoch": 1237} {"train_loss": -11.533533096313477, "global_step": 207932, "epoch": 1237} {"train_loss": -11.47839069366455, "global_step": 207933, "epoch": 1237} {"train_loss": -11.417322158813477, "global_step": 207934, "epoch": 1237} {"train_loss": -11.092350959777832, "global_step": 207935, "epoch": 1237} {"train_loss": -11.556852340698242, "global_step": 207936, "epoch": 1237} {"train_loss": -11.386245727539062, "global_step": 207937, "epoch": 1237} {"train_loss": -11.58607006072998, "global_step": 207938, "epoch": 1237} {"train_loss": -11.027520179748535, "global_step": 207939, "epoch": 1237} {"train_loss": -11.353689193725586, "global_step": 207940, "epoch": 1237} {"train_loss": -11.207525253295898, "global_step": 207941, "epoch": 1237} {"train_loss": -11.599308013916016, "global_step": 207942, "epoch": 1237} {"train_loss": -11.642805099487305, "global_step": 207943, "epoch": 1237} {"train_loss": -11.3993501663208, "global_step": 207944, "epoch": 1237} {"train_loss": -11.345024108886719, "global_step": 207945, "epoch": 1237} {"train_loss": -11.498056411743164, "global_step": 207946, "epoch": 1237} {"train_loss": -11.557178497314453, "global_step": 207947, "epoch": 1237} {"train_loss": -11.462384223937988, "global_step": 207948, "epoch": 1237} {"train_loss": -11.256972312927246, "global_step": 207949, "epoch": 1237} {"train_loss": -11.57565689086914, "global_step": 207950, "epoch": 1237} {"train_loss": -11.465776443481445, "global_step": 207951, "epoch": 1237} {"train_loss": -11.459519386291504, "global_step": 207952, "epoch": 1237} {"train_loss": -11.467903137207031, "global_step": 207953, "epoch": 1237} {"train_loss": -11.026415824890137, "global_step": 207954, "epoch": 1237} {"train_loss": -11.41047477722168, "global_step": 207955, "epoch": 1237} {"train_loss": -10.823291778564453, "global_step": 207956, "epoch": 1237} {"train_loss": -11.335329055786133, "global_step": 207957, "epoch": 1237} {"train_loss": -10.957560539245605, "global_step": 207958, "epoch": 1237} {"train_loss": -11.400425910949707, "global_step": 207959, "epoch": 1237} {"train_loss": -10.887619018554688, "global_step": 207960, "epoch": 1237} {"train_loss": -10.814271926879883, "global_step": 207961, "epoch": 1237} {"train_loss": -11.58261489868164, "global_step": 207962, "epoch": 1237} {"train_loss": -10.675533294677734, "global_step": 207963, "epoch": 1237} {"train_loss": -11.312765121459961, "global_step": 207964, "epoch": 1237} {"train_loss": -11.186528205871582, "global_step": 207965, "epoch": 1237} {"train_loss": -11.036909103393555, "global_step": 207966, "epoch": 1237} {"train_loss": -11.586929321289062, "global_step": 207967, "epoch": 1237} {"train_loss": -10.461240768432617, "global_step": 207968, "epoch": 1237} {"train_loss": -11.02667236328125, "global_step": 207969, "epoch": 1237} {"train_loss": -9.891923904418945, "global_step": 207970, "epoch": 1237} {"train_loss": -11.437131881713867, "global_step": 207971, "epoch": 1237} {"train_loss": -10.114011764526367, "global_step": 207972, "epoch": 1237} {"train_loss": -10.921638488769531, "global_step": 207973, "epoch": 1237} {"train_loss": -9.161684036254883, "global_step": 207974, "epoch": 1237} {"train_loss": -11.450531959533691, "global_step": 207975, "epoch": 1237} {"train_loss": -10.400518417358398, "global_step": 207976, "epoch": 1237} {"train_loss": -11.572590827941895, "global_step": 207977, "epoch": 1237} {"train_loss": -10.57819652557373, "global_step": 207978, "epoch": 1237} {"train_loss": -11.07498550415039, "global_step": 207979, "epoch": 1237} {"train_loss": -10.2512845993042, "global_step": 207980, "epoch": 1237} {"train_loss": -10.963284492492676, "global_step": 207981, "epoch": 1237} {"train_loss": -9.793761253356934, "global_step": 207982, "epoch": 1237} {"train_loss": -11.243096402713231, "global_step": 207983, "epoch": 1237, "val_loss": 255289.15625} {"train_loss": -10.481049537658691, "global_step": 207984, "epoch": 1238} {"train_loss": -10.667682647705078, "global_step": 207985, "epoch": 1238} {"train_loss": -10.744410514831543, "global_step": 207986, "epoch": 1238} {"train_loss": -10.671436309814453, "global_step": 207987, "epoch": 1238} {"train_loss": -10.896406173706055, "global_step": 207988, "epoch": 1238} {"train_loss": -10.87992000579834, "global_step": 207989, "epoch": 1238} {"train_loss": -10.989086151123047, "global_step": 207990, "epoch": 1238} {"train_loss": -10.610076904296875, "global_step": 207991, "epoch": 1238} {"train_loss": -11.326883316040039, "global_step": 207992, "epoch": 1238} {"train_loss": -10.658716201782227, "global_step": 207993, "epoch": 1238} {"train_loss": -10.912877082824707, "global_step": 207994, "epoch": 1238} {"train_loss": -10.823587417602539, "global_step": 207995, "epoch": 1238} {"train_loss": -10.689050674438477, "global_step": 207996, "epoch": 1238} {"train_loss": -11.385557174682617, "global_step": 207997, "epoch": 1238} {"train_loss": -11.019346237182617, "global_step": 207998, "epoch": 1238} {"train_loss": -11.256532669067383, "global_step": 207999, "epoch": 1238} {"train_loss": -10.882927894592285, "global_step": 208000, "epoch": 1238} {"train_loss": -11.065990447998047, "global_step": 208001, "epoch": 1238} {"train_loss": -11.103569984436035, "global_step": 208002, "epoch": 1238} {"train_loss": -11.133522033691406, "global_step": 208003, "epoch": 1238} {"train_loss": -11.395622253417969, "global_step": 208004, "epoch": 1238} {"train_loss": -11.247429847717285, "global_step": 208005, "epoch": 1238} {"train_loss": -11.0672607421875, "global_step": 208006, "epoch": 1238} {"train_loss": -11.19599723815918, "global_step": 208007, "epoch": 1238} {"train_loss": -11.169143676757812, "global_step": 208008, "epoch": 1238} {"train_loss": -10.681173324584961, "global_step": 208009, "epoch": 1238} {"train_loss": -11.196735382080078, "global_step": 208010, "epoch": 1238} {"train_loss": -10.797834396362305, "global_step": 208011, "epoch": 1238} {"train_loss": -10.88525104522705, "global_step": 208012, "epoch": 1238} {"train_loss": -11.287836074829102, "global_step": 208013, "epoch": 1238} {"train_loss": -11.053173065185547, "global_step": 208014, "epoch": 1238} {"train_loss": -11.320222854614258, "global_step": 208015, "epoch": 1238} {"train_loss": -11.090429306030273, "global_step": 208016, "epoch": 1238} {"train_loss": -11.446529388427734, "global_step": 208017, "epoch": 1238} {"train_loss": -11.455163955688477, "global_step": 208018, "epoch": 1238} {"train_loss": -11.422037124633789, "global_step": 208019, "epoch": 1238} {"train_loss": -11.452696800231934, "global_step": 208020, "epoch": 1238} {"train_loss": -11.282981872558594, "global_step": 208021, "epoch": 1238} {"train_loss": -11.474861145019531, "global_step": 208022, "epoch": 1238} {"train_loss": -11.420305252075195, "global_step": 208023, "epoch": 1238} {"train_loss": -11.210977554321289, "global_step": 208024, "epoch": 1238} {"train_loss": -11.514986991882324, "global_step": 208025, "epoch": 1238} {"train_loss": -11.397698402404785, "global_step": 208026, "epoch": 1238} {"train_loss": -11.61798095703125, "global_step": 208027, "epoch": 1238} {"train_loss": -11.47769832611084, "global_step": 208028, "epoch": 1238} {"train_loss": -11.45079231262207, "global_step": 208029, "epoch": 1238} {"train_loss": -11.417814254760742, "global_step": 208030, "epoch": 1238} {"train_loss": -11.426794052124023, "global_step": 208031, "epoch": 1238} {"train_loss": -11.49026870727539, "global_step": 208032, "epoch": 1238} {"train_loss": -11.471529006958008, "global_step": 208033, "epoch": 1238} {"train_loss": -11.459369659423828, "global_step": 208034, "epoch": 1238} {"train_loss": -11.427281379699707, "global_step": 208035, "epoch": 1238} {"train_loss": -11.424762725830078, "global_step": 208036, "epoch": 1238} {"train_loss": -11.241178512573242, "global_step": 208037, "epoch": 1238} {"train_loss": -11.759544372558594, "global_step": 208038, "epoch": 1238} {"train_loss": -11.48475456237793, "global_step": 208039, "epoch": 1238} {"train_loss": -11.818061828613281, "global_step": 208040, "epoch": 1238} {"train_loss": -11.536643981933594, "global_step": 208041, "epoch": 1238} {"train_loss": -11.578286170959473, "global_step": 208042, "epoch": 1238} {"train_loss": -11.494457244873047, "global_step": 208043, "epoch": 1238} {"train_loss": -11.689762115478516, "global_step": 208044, "epoch": 1238} {"train_loss": -11.722618103027344, "global_step": 208045, "epoch": 1238} {"train_loss": -11.513106346130371, "global_step": 208046, "epoch": 1238} {"train_loss": -11.705297470092773, "global_step": 208047, "epoch": 1238} {"train_loss": -11.826325416564941, "global_step": 208048, "epoch": 1238} {"train_loss": -11.574018478393555, "global_step": 208049, "epoch": 1238} {"train_loss": -11.681635856628418, "global_step": 208050, "epoch": 1238} {"train_loss": -11.792827606201172, "global_step": 208051, "epoch": 1238} {"train_loss": -11.846733093261719, "global_step": 208052, "epoch": 1238} {"train_loss": -11.801865577697754, "global_step": 208053, "epoch": 1238} {"train_loss": -11.825557708740234, "global_step": 208054, "epoch": 1238} {"train_loss": -11.79130744934082, "global_step": 208055, "epoch": 1238} {"train_loss": -11.806252479553223, "global_step": 208056, "epoch": 1238} {"train_loss": -11.844060897827148, "global_step": 208057, "epoch": 1238} {"train_loss": -11.678834915161133, "global_step": 208058, "epoch": 1238} {"train_loss": -11.49683952331543, "global_step": 208059, "epoch": 1238} {"train_loss": -11.42241382598877, "global_step": 208060, "epoch": 1238} {"train_loss": -11.614882469177246, "global_step": 208061, "epoch": 1238} {"train_loss": -11.229814529418945, "global_step": 208062, "epoch": 1238} {"train_loss": -11.579360961914062, "global_step": 208063, "epoch": 1238} {"train_loss": -11.583008766174316, "global_step": 208064, "epoch": 1238} {"train_loss": -11.451375961303711, "global_step": 208065, "epoch": 1238} {"train_loss": -11.322256088256836, "global_step": 208066, "epoch": 1238} {"train_loss": -11.626527786254883, "global_step": 208067, "epoch": 1238} {"train_loss": -10.794116973876953, "global_step": 208068, "epoch": 1238} {"train_loss": -10.950946807861328, "global_step": 208069, "epoch": 1238} {"train_loss": -11.696110725402832, "global_step": 208070, "epoch": 1238} {"train_loss": -10.358417510986328, "global_step": 208071, "epoch": 1238} {"train_loss": -10.061994552612305, "global_step": 208072, "epoch": 1238} {"train_loss": -11.483367919921875, "global_step": 208073, "epoch": 1238} {"train_loss": -9.522679328918457, "global_step": 208074, "epoch": 1238} {"train_loss": -10.859350204467773, "global_step": 208075, "epoch": 1238} {"train_loss": -11.403383255004883, "global_step": 208076, "epoch": 1238} {"train_loss": -10.380270004272461, "global_step": 208077, "epoch": 1238} {"train_loss": -10.954584121704102, "global_step": 208078, "epoch": 1238} {"train_loss": -11.701728820800781, "global_step": 208079, "epoch": 1238} {"train_loss": -11.13538932800293, "global_step": 208080, "epoch": 1238} {"train_loss": -11.632768630981445, "global_step": 208081, "epoch": 1238} {"train_loss": -11.709993362426758, "global_step": 208082, "epoch": 1238} {"train_loss": -11.381857872009277, "global_step": 208083, "epoch": 1238} {"train_loss": -11.458260536193848, "global_step": 208084, "epoch": 1238} {"train_loss": -11.587158203125, "global_step": 208085, "epoch": 1238} {"train_loss": -11.475379943847656, "global_step": 208086, "epoch": 1238} {"train_loss": -11.529912948608398, "global_step": 208087, "epoch": 1238} {"train_loss": -11.525114059448242, "global_step": 208088, "epoch": 1238} {"train_loss": -11.623043060302734, "global_step": 208089, "epoch": 1238} {"train_loss": -11.531418800354004, "global_step": 208090, "epoch": 1238} {"train_loss": -11.421392440795898, "global_step": 208091, "epoch": 1238} {"train_loss": -11.108131408691406, "global_step": 208092, "epoch": 1238} {"train_loss": -11.071407318115234, "global_step": 208093, "epoch": 1238} {"train_loss": -10.026105880737305, "global_step": 208094, "epoch": 1238} {"train_loss": -10.833253860473633, "global_step": 208095, "epoch": 1238} {"train_loss": -11.116146087646484, "global_step": 208096, "epoch": 1238} {"train_loss": -10.944766998291016, "global_step": 208097, "epoch": 1238} {"train_loss": -10.71318244934082, "global_step": 208098, "epoch": 1238} {"train_loss": -11.520856857299805, "global_step": 208099, "epoch": 1238} {"train_loss": -10.569670677185059, "global_step": 208100, "epoch": 1238} {"train_loss": -10.639566421508789, "global_step": 208101, "epoch": 1238} {"train_loss": -11.284090042114258, "global_step": 208102, "epoch": 1238} {"train_loss": -10.823368072509766, "global_step": 208103, "epoch": 1238} {"train_loss": -11.074378967285156, "global_step": 208104, "epoch": 1238} {"train_loss": -11.127933502197266, "global_step": 208105, "epoch": 1238} {"train_loss": -11.374156951904297, "global_step": 208106, "epoch": 1238} {"train_loss": -11.072861671447754, "global_step": 208107, "epoch": 1238} {"train_loss": -11.133588790893555, "global_step": 208108, "epoch": 1238} {"train_loss": -10.903623580932617, "global_step": 208109, "epoch": 1238} {"train_loss": -11.24554443359375, "global_step": 208110, "epoch": 1238} {"train_loss": -10.91259765625, "global_step": 208111, "epoch": 1238} {"train_loss": -11.174962997436523, "global_step": 208112, "epoch": 1238} {"train_loss": -10.767890930175781, "global_step": 208113, "epoch": 1238} {"train_loss": -11.215814590454102, "global_step": 208114, "epoch": 1238} {"train_loss": -11.212812423706055, "global_step": 208115, "epoch": 1238} {"train_loss": -10.825239181518555, "global_step": 208116, "epoch": 1238} {"train_loss": -11.028711318969727, "global_step": 208117, "epoch": 1238} {"train_loss": -10.626646041870117, "global_step": 208118, "epoch": 1238} {"train_loss": -11.093680381774902, "global_step": 208119, "epoch": 1238} {"train_loss": -10.406838417053223, "global_step": 208120, "epoch": 1238} {"train_loss": -11.571327209472656, "global_step": 208121, "epoch": 1238} {"train_loss": -10.765886306762695, "global_step": 208122, "epoch": 1238} {"train_loss": -11.242019653320312, "global_step": 208123, "epoch": 1238} {"train_loss": -10.652297019958496, "global_step": 208124, "epoch": 1238} {"train_loss": -11.300235748291016, "global_step": 208125, "epoch": 1238} {"train_loss": -11.137057304382324, "global_step": 208126, "epoch": 1238} {"train_loss": -11.341876029968262, "global_step": 208127, "epoch": 1238} {"train_loss": -11.566065788269043, "global_step": 208128, "epoch": 1238} {"train_loss": -11.444048881530762, "global_step": 208129, "epoch": 1238} {"train_loss": -11.379671096801758, "global_step": 208130, "epoch": 1238} {"train_loss": -11.559196472167969, "global_step": 208131, "epoch": 1238} {"train_loss": -11.23066520690918, "global_step": 208132, "epoch": 1238} {"train_loss": -11.322010040283203, "global_step": 208133, "epoch": 1238} {"train_loss": -11.22378921508789, "global_step": 208134, "epoch": 1238} {"train_loss": -11.283300399780273, "global_step": 208135, "epoch": 1238} {"train_loss": -11.343891143798828, "global_step": 208136, "epoch": 1238} {"train_loss": -11.373722076416016, "global_step": 208137, "epoch": 1238} {"train_loss": -11.173931121826172, "global_step": 208138, "epoch": 1238} {"train_loss": -11.530881881713867, "global_step": 208139, "epoch": 1238} {"train_loss": -11.03819751739502, "global_step": 208140, "epoch": 1238} {"train_loss": -11.378971099853516, "global_step": 208141, "epoch": 1238} {"train_loss": -11.37165641784668, "global_step": 208142, "epoch": 1238} {"train_loss": -11.248506546020508, "global_step": 208143, "epoch": 1238} {"train_loss": -11.314070701599121, "global_step": 208144, "epoch": 1238} {"train_loss": -11.43441104888916, "global_step": 208145, "epoch": 1238} {"train_loss": -11.251441955566406, "global_step": 208146, "epoch": 1238} {"train_loss": -11.545417785644531, "global_step": 208147, "epoch": 1238} {"train_loss": -11.11679458618164, "global_step": 208148, "epoch": 1238} {"train_loss": -11.480829238891602, "global_step": 208149, "epoch": 1238} {"train_loss": -11.035704612731934, "global_step": 208150, "epoch": 1238} {"train_loss": -11.23533809185028, "global_step": 208151, "epoch": 1238, "val_loss": 255473.546875} {"train_loss": -10.88143539428711, "global_step": 208152, "epoch": 1239} {"train_loss": -11.256059646606445, "global_step": 208153, "epoch": 1239} {"train_loss": -11.115012168884277, "global_step": 208154, "epoch": 1239} {"train_loss": -10.84974479675293, "global_step": 208155, "epoch": 1239} {"train_loss": -11.321361541748047, "global_step": 208156, "epoch": 1239} {"train_loss": -9.712654113769531, "global_step": 208157, "epoch": 1239} {"train_loss": -11.281652450561523, "global_step": 208158, "epoch": 1239} {"train_loss": -9.86480712890625, "global_step": 208159, "epoch": 1239} {"train_loss": -11.324272155761719, "global_step": 208160, "epoch": 1239} {"train_loss": -10.727575302124023, "global_step": 208161, "epoch": 1239} {"train_loss": -10.326067924499512, "global_step": 208162, "epoch": 1239} {"train_loss": -11.329744338989258, "global_step": 208163, "epoch": 1239} {"train_loss": -10.606656074523926, "global_step": 208164, "epoch": 1239} {"train_loss": -11.26937484741211, "global_step": 208165, "epoch": 1239} {"train_loss": -10.446197509765625, "global_step": 208166, "epoch": 1239} {"train_loss": -10.982051849365234, "global_step": 208167, "epoch": 1239} {"train_loss": -10.674789428710938, "global_step": 208168, "epoch": 1239} {"train_loss": -11.459052085876465, "global_step": 208169, "epoch": 1239} {"train_loss": -10.44900894165039, "global_step": 208170, "epoch": 1239} {"train_loss": -11.255656242370605, "global_step": 208171, "epoch": 1239} {"train_loss": -10.916812896728516, "global_step": 208172, "epoch": 1239} {"train_loss": -11.350120544433594, "global_step": 208173, "epoch": 1239} {"train_loss": -11.000970840454102, "global_step": 208174, "epoch": 1239} {"train_loss": -11.098949432373047, "global_step": 208175, "epoch": 1239} {"train_loss": -10.732967376708984, "global_step": 208176, "epoch": 1239} {"train_loss": -11.33558177947998, "global_step": 208177, "epoch": 1239} {"train_loss": -10.897339820861816, "global_step": 208178, "epoch": 1239} {"train_loss": -11.257891654968262, "global_step": 208179, "epoch": 1239} {"train_loss": -10.783661842346191, "global_step": 208180, "epoch": 1239} {"train_loss": -11.241055488586426, "global_step": 208181, "epoch": 1239} {"train_loss": -11.135502815246582, "global_step": 208182, "epoch": 1239} {"train_loss": -11.0533447265625, "global_step": 208183, "epoch": 1239} {"train_loss": -11.246943473815918, "global_step": 208184, "epoch": 1239} {"train_loss": -11.428183555603027, "global_step": 208185, "epoch": 1239} {"train_loss": -11.117815017700195, "global_step": 208186, "epoch": 1239} {"train_loss": -11.340776443481445, "global_step": 208187, "epoch": 1239} {"train_loss": -11.329035758972168, "global_step": 208188, "epoch": 1239} {"train_loss": -10.810568809509277, "global_step": 208189, "epoch": 1239} {"train_loss": -11.465965270996094, "global_step": 208190, "epoch": 1239} {"train_loss": -11.330574035644531, "global_step": 208191, "epoch": 1239} {"train_loss": -10.96983528137207, "global_step": 208192, "epoch": 1239} {"train_loss": -11.436424255371094, "global_step": 208193, "epoch": 1239} {"train_loss": -11.073907852172852, "global_step": 208194, "epoch": 1239} {"train_loss": -11.448296546936035, "global_step": 208195, "epoch": 1239} {"train_loss": -11.505202293395996, "global_step": 208196, "epoch": 1239} {"train_loss": -11.497248649597168, "global_step": 208197, "epoch": 1239} {"train_loss": -11.332611083984375, "global_step": 208198, "epoch": 1239} {"train_loss": -11.846454620361328, "global_step": 208199, "epoch": 1239} {"train_loss": -11.227476119995117, "global_step": 208200, "epoch": 1239} {"train_loss": -11.571446418762207, "global_step": 208201, "epoch": 1239} {"train_loss": -11.261560440063477, "global_step": 208202, "epoch": 1239} {"train_loss": -11.24382209777832, "global_step": 208203, "epoch": 1239} {"train_loss": -11.406106948852539, "global_step": 208204, "epoch": 1239} {"train_loss": -11.271451950073242, "global_step": 208205, "epoch": 1239} {"train_loss": -11.658340454101562, "global_step": 208206, "epoch": 1239} {"train_loss": -11.54227066040039, "global_step": 208207, "epoch": 1239} {"train_loss": -11.645049095153809, "global_step": 208208, "epoch": 1239} {"train_loss": -11.73604679107666, "global_step": 208209, "epoch": 1239} {"train_loss": -11.637197494506836, "global_step": 208210, "epoch": 1239} {"train_loss": -11.650690078735352, "global_step": 208211, "epoch": 1239} {"train_loss": -11.010947227478027, "global_step": 208212, "epoch": 1239} {"train_loss": -11.508119583129883, "global_step": 208213, "epoch": 1239} {"train_loss": -11.58117961883545, "global_step": 208214, "epoch": 1239} {"train_loss": -11.559486389160156, "global_step": 208215, "epoch": 1239} {"train_loss": -11.501300811767578, "global_step": 208216, "epoch": 1239} {"train_loss": -11.510503768920898, "global_step": 208217, "epoch": 1239} {"train_loss": -11.51276969909668, "global_step": 208218, "epoch": 1239} {"train_loss": -11.276487350463867, "global_step": 208219, "epoch": 1239} {"train_loss": -11.35507869720459, "global_step": 208220, "epoch": 1239} {"train_loss": -11.258565902709961, "global_step": 208221, "epoch": 1239} {"train_loss": -11.684366226196289, "global_step": 208222, "epoch": 1239} {"train_loss": -11.375322341918945, "global_step": 208223, "epoch": 1239} {"train_loss": -11.454374313354492, "global_step": 208224, "epoch": 1239} {"train_loss": -11.502866744995117, "global_step": 208225, "epoch": 1239} {"train_loss": -11.510906219482422, "global_step": 208226, "epoch": 1239} {"train_loss": -11.263055801391602, "global_step": 208227, "epoch": 1239} {"train_loss": -11.380054473876953, "global_step": 208228, "epoch": 1239} {"train_loss": -11.455057144165039, "global_step": 208229, "epoch": 1239} {"train_loss": -11.311805725097656, "global_step": 208230, "epoch": 1239} {"train_loss": -11.80058479309082, "global_step": 208231, "epoch": 1239} {"train_loss": -11.18178939819336, "global_step": 208232, "epoch": 1239} {"train_loss": -11.748185157775879, "global_step": 208233, "epoch": 1239} {"train_loss": -11.1809720993042, "global_step": 208234, "epoch": 1239} {"train_loss": -11.302812576293945, "global_step": 208235, "epoch": 1239} {"train_loss": -11.760271072387695, "global_step": 208236, "epoch": 1239} {"train_loss": -11.148378372192383, "global_step": 208237, "epoch": 1239} {"train_loss": -11.679641723632812, "global_step": 208238, "epoch": 1239} {"train_loss": -11.446995735168457, "global_step": 208239, "epoch": 1239} {"train_loss": -11.38467025756836, "global_step": 208240, "epoch": 1239} {"train_loss": -11.647249221801758, "global_step": 208241, "epoch": 1239} {"train_loss": -11.329456329345703, "global_step": 208242, "epoch": 1239} {"train_loss": -11.656042098999023, "global_step": 208243, "epoch": 1239} {"train_loss": -11.399898529052734, "global_step": 208244, "epoch": 1239} {"train_loss": -11.774158477783203, "global_step": 208245, "epoch": 1239} {"train_loss": -11.562601089477539, "global_step": 208246, "epoch": 1239} {"train_loss": -11.51335620880127, "global_step": 208247, "epoch": 1239} {"train_loss": -11.679573059082031, "global_step": 208248, "epoch": 1239} {"train_loss": -11.36985969543457, "global_step": 208249, "epoch": 1239} {"train_loss": -11.648421287536621, "global_step": 208250, "epoch": 1239} {"train_loss": -11.27085018157959, "global_step": 208251, "epoch": 1239} {"train_loss": -11.805339813232422, "global_step": 208252, "epoch": 1239} {"train_loss": -11.39813232421875, "global_step": 208253, "epoch": 1239} {"train_loss": -11.646535873413086, "global_step": 208254, "epoch": 1239} {"train_loss": -11.28104305267334, "global_step": 208255, "epoch": 1239} {"train_loss": -11.727983474731445, "global_step": 208256, "epoch": 1239} {"train_loss": -11.393471717834473, "global_step": 208257, "epoch": 1239} {"train_loss": -11.757425308227539, "global_step": 208258, "epoch": 1239} {"train_loss": -11.477201461791992, "global_step": 208259, "epoch": 1239} {"train_loss": -11.552654266357422, "global_step": 208260, "epoch": 1239} {"train_loss": -11.262859344482422, "global_step": 208261, "epoch": 1239} {"train_loss": -11.298103332519531, "global_step": 208262, "epoch": 1239} {"train_loss": -11.248672485351562, "global_step": 208263, "epoch": 1239} {"train_loss": -11.202293395996094, "global_step": 208264, "epoch": 1239} {"train_loss": -10.645625114440918, "global_step": 208265, "epoch": 1239} {"train_loss": -10.764129638671875, "global_step": 208266, "epoch": 1239} {"train_loss": -11.001184463500977, "global_step": 208267, "epoch": 1239} {"train_loss": -11.360641479492188, "global_step": 208268, "epoch": 1239} {"train_loss": -10.703115463256836, "global_step": 208269, "epoch": 1239} {"train_loss": -11.068331718444824, "global_step": 208270, "epoch": 1239} {"train_loss": -11.18523120880127, "global_step": 208271, "epoch": 1239} {"train_loss": -11.406845092773438, "global_step": 208272, "epoch": 1239} {"train_loss": -11.228221893310547, "global_step": 208273, "epoch": 1239} {"train_loss": -11.235547065734863, "global_step": 208274, "epoch": 1239} {"train_loss": -10.833498001098633, "global_step": 208275, "epoch": 1239} {"train_loss": -11.593820571899414, "global_step": 208276, "epoch": 1239} {"train_loss": -11.402560234069824, "global_step": 208277, "epoch": 1239} {"train_loss": -11.100994110107422, "global_step": 208278, "epoch": 1239} {"train_loss": -11.114099502563477, "global_step": 208279, "epoch": 1239} {"train_loss": -11.200183868408203, "global_step": 208280, "epoch": 1239} {"train_loss": -11.444059371948242, "global_step": 208281, "epoch": 1239} {"train_loss": -11.523858070373535, "global_step": 208282, "epoch": 1239} {"train_loss": -11.141717910766602, "global_step": 208283, "epoch": 1239} {"train_loss": -11.004495620727539, "global_step": 208284, "epoch": 1239} {"train_loss": -11.516626358032227, "global_step": 208285, "epoch": 1239} {"train_loss": -11.217775344848633, "global_step": 208286, "epoch": 1239} {"train_loss": -11.571310043334961, "global_step": 208287, "epoch": 1239} {"train_loss": -11.230634689331055, "global_step": 208288, "epoch": 1239} {"train_loss": -11.618721008300781, "global_step": 208289, "epoch": 1239} {"train_loss": -11.488117218017578, "global_step": 208290, "epoch": 1239} {"train_loss": -11.445981979370117, "global_step": 208291, "epoch": 1239} {"train_loss": -11.576240539550781, "global_step": 208292, "epoch": 1239} {"train_loss": -10.6289701461792, "global_step": 208293, "epoch": 1239} {"train_loss": -11.33244514465332, "global_step": 208294, "epoch": 1239} {"train_loss": -11.068693161010742, "global_step": 208295, "epoch": 1239} {"train_loss": -11.086807250976562, "global_step": 208296, "epoch": 1239} {"train_loss": -11.607528686523438, "global_step": 208297, "epoch": 1239} {"train_loss": -10.933887481689453, "global_step": 208298, "epoch": 1239} {"train_loss": -11.459400177001953, "global_step": 208299, "epoch": 1239} {"train_loss": -11.211194038391113, "global_step": 208300, "epoch": 1239} {"train_loss": -10.67637825012207, "global_step": 208301, "epoch": 1239} {"train_loss": -11.422306060791016, "global_step": 208302, "epoch": 1239} {"train_loss": -10.999180793762207, "global_step": 208303, "epoch": 1239} {"train_loss": -11.22549057006836, "global_step": 208304, "epoch": 1239} {"train_loss": -11.302884101867676, "global_step": 208305, "epoch": 1239} {"train_loss": -11.225391387939453, "global_step": 208306, "epoch": 1239} {"train_loss": -11.513650894165039, "global_step": 208307, "epoch": 1239} {"train_loss": -11.341552734375, "global_step": 208308, "epoch": 1239} {"train_loss": -11.547174453735352, "global_step": 208309, "epoch": 1239} {"train_loss": -11.484903335571289, "global_step": 208310, "epoch": 1239} {"train_loss": -11.631481170654297, "global_step": 208311, "epoch": 1239} {"train_loss": -11.841425895690918, "global_step": 208312, "epoch": 1239} {"train_loss": -11.83104133605957, "global_step": 208313, "epoch": 1239} {"train_loss": -11.675039291381836, "global_step": 208314, "epoch": 1239} {"train_loss": -11.732715606689453, "global_step": 208315, "epoch": 1239} {"train_loss": -11.568132400512695, "global_step": 208316, "epoch": 1239} {"train_loss": -11.260404586791992, "global_step": 208317, "epoch": 1239} {"train_loss": -11.311933517456055, "global_step": 208318, "epoch": 1239} {"train_loss": -11.292290812446957, "global_step": 208319, "epoch": 1239, "val_loss": 254976.03125} {"train_loss": -11.771234512329102, "global_step": 208320, "epoch": 1240} {"train_loss": -10.783729553222656, "global_step": 208321, "epoch": 1240} {"train_loss": -11.380620002746582, "global_step": 208322, "epoch": 1240} {"train_loss": -11.399681091308594, "global_step": 208323, "epoch": 1240} {"train_loss": -10.89158821105957, "global_step": 208324, "epoch": 1240} {"train_loss": -11.334474563598633, "global_step": 208325, "epoch": 1240} {"train_loss": -11.189377784729004, "global_step": 208326, "epoch": 1240} {"train_loss": -11.211441040039062, "global_step": 208327, "epoch": 1240} {"train_loss": -11.015382766723633, "global_step": 208328, "epoch": 1240} {"train_loss": -11.316259384155273, "global_step": 208329, "epoch": 1240} {"train_loss": -11.28732967376709, "global_step": 208330, "epoch": 1240} {"train_loss": -11.438759803771973, "global_step": 208331, "epoch": 1240} {"train_loss": -11.41382884979248, "global_step": 208332, "epoch": 1240} {"train_loss": -11.350616455078125, "global_step": 208333, "epoch": 1240} {"train_loss": -11.56825065612793, "global_step": 208334, "epoch": 1240} {"train_loss": -11.325334548950195, "global_step": 208335, "epoch": 1240} {"train_loss": -11.49288272857666, "global_step": 208336, "epoch": 1240} {"train_loss": -11.581859588623047, "global_step": 208337, "epoch": 1240} {"train_loss": -11.443883895874023, "global_step": 208338, "epoch": 1240} {"train_loss": -10.970864295959473, "global_step": 208339, "epoch": 1240} {"train_loss": -11.302252769470215, "global_step": 208340, "epoch": 1240} {"train_loss": -11.3095703125, "global_step": 208341, "epoch": 1240} {"train_loss": -11.735681533813477, "global_step": 208342, "epoch": 1240} {"train_loss": -10.98336410522461, "global_step": 208343, "epoch": 1240} {"train_loss": -11.693700790405273, "global_step": 208344, "epoch": 1240} {"train_loss": -11.433307647705078, "global_step": 208345, "epoch": 1240} {"train_loss": -11.554534912109375, "global_step": 208346, "epoch": 1240} {"train_loss": -11.562332153320312, "global_step": 208347, "epoch": 1240} {"train_loss": -11.328328132629395, "global_step": 208348, "epoch": 1240} {"train_loss": -11.661169052124023, "global_step": 208349, "epoch": 1240} {"train_loss": -11.29988956451416, "global_step": 208350, "epoch": 1240} {"train_loss": -11.426252365112305, "global_step": 208351, "epoch": 1240} {"train_loss": -11.356180191040039, "global_step": 208352, "epoch": 1240} {"train_loss": -11.468955993652344, "global_step": 208353, "epoch": 1240} {"train_loss": -11.495290756225586, "global_step": 208354, "epoch": 1240} {"train_loss": -11.734185218811035, "global_step": 208355, "epoch": 1240} {"train_loss": -11.498979568481445, "global_step": 208356, "epoch": 1240} {"train_loss": -11.622098922729492, "global_step": 208357, "epoch": 1240} {"train_loss": -11.477439880371094, "global_step": 208358, "epoch": 1240} {"train_loss": -11.849735260009766, "global_step": 208359, "epoch": 1240} {"train_loss": -11.35425090789795, "global_step": 208360, "epoch": 1240} {"train_loss": -11.316549301147461, "global_step": 208361, "epoch": 1240} {"train_loss": -11.658251762390137, "global_step": 208362, "epoch": 1240} {"train_loss": -11.220199584960938, "global_step": 208363, "epoch": 1240} {"train_loss": -11.759027481079102, "global_step": 208364, "epoch": 1240} {"train_loss": -11.363487243652344, "global_step": 208365, "epoch": 1240} {"train_loss": -11.564943313598633, "global_step": 208366, "epoch": 1240} {"train_loss": -11.581985473632812, "global_step": 208367, "epoch": 1240} {"train_loss": -11.48341178894043, "global_step": 208368, "epoch": 1240} {"train_loss": -11.217662811279297, "global_step": 208369, "epoch": 1240} {"train_loss": -11.026561737060547, "global_step": 208370, "epoch": 1240} {"train_loss": -11.527196884155273, "global_step": 208371, "epoch": 1240} {"train_loss": -11.398164749145508, "global_step": 208372, "epoch": 1240} {"train_loss": -11.099509239196777, "global_step": 208373, "epoch": 1240} {"train_loss": -11.571542739868164, "global_step": 208374, "epoch": 1240} {"train_loss": -10.422691345214844, "global_step": 208375, "epoch": 1240} {"train_loss": -10.28526496887207, "global_step": 208376, "epoch": 1240} {"train_loss": -11.248078346252441, "global_step": 208377, "epoch": 1240} {"train_loss": -10.84040641784668, "global_step": 208378, "epoch": 1240} {"train_loss": -10.429746627807617, "global_step": 208379, "epoch": 1240} {"train_loss": -10.407751083374023, "global_step": 208380, "epoch": 1240} {"train_loss": -9.98314094543457, "global_step": 208381, "epoch": 1240} {"train_loss": -10.25790786743164, "global_step": 208382, "epoch": 1240} {"train_loss": -10.00216293334961, "global_step": 208383, "epoch": 1240} {"train_loss": -11.097902297973633, "global_step": 208384, "epoch": 1240} {"train_loss": -8.470279693603516, "global_step": 208385, "epoch": 1240} {"train_loss": -11.310663223266602, "global_step": 208386, "epoch": 1240} {"train_loss": -9.085097312927246, "global_step": 208387, "epoch": 1240} {"train_loss": -11.266308784484863, "global_step": 208388, "epoch": 1240} {"train_loss": -10.951262474060059, "global_step": 208389, "epoch": 1240} {"train_loss": -10.829030990600586, "global_step": 208390, "epoch": 1240} {"train_loss": -10.93144416809082, "global_step": 208391, "epoch": 1240} {"train_loss": -11.034858703613281, "global_step": 208392, "epoch": 1240} {"train_loss": -10.634467124938965, "global_step": 208393, "epoch": 1240} {"train_loss": -11.31572437286377, "global_step": 208394, "epoch": 1240} {"train_loss": -10.71499252319336, "global_step": 208395, "epoch": 1240} {"train_loss": -10.937477111816406, "global_step": 208396, "epoch": 1240} {"train_loss": -10.884845733642578, "global_step": 208397, "epoch": 1240} {"train_loss": -11.112083435058594, "global_step": 208398, "epoch": 1240} {"train_loss": -10.74520206451416, "global_step": 208399, "epoch": 1240} {"train_loss": -10.600748062133789, "global_step": 208400, "epoch": 1240} {"train_loss": -11.166820526123047, "global_step": 208401, "epoch": 1240} {"train_loss": -9.878424644470215, "global_step": 208402, "epoch": 1240} {"train_loss": -11.32888126373291, "global_step": 208403, "epoch": 1240} {"train_loss": -10.602567672729492, "global_step": 208404, "epoch": 1240} {"train_loss": -11.218132019042969, "global_step": 208405, "epoch": 1240} {"train_loss": -10.98801040649414, "global_step": 208406, "epoch": 1240} {"train_loss": -10.980437278747559, "global_step": 208407, "epoch": 1240} {"train_loss": -11.179513931274414, "global_step": 208408, "epoch": 1240} {"train_loss": -10.994078636169434, "global_step": 208409, "epoch": 1240} {"train_loss": -11.347004890441895, "global_step": 208410, "epoch": 1240} {"train_loss": -10.872785568237305, "global_step": 208411, "epoch": 1240} {"train_loss": -11.249350547790527, "global_step": 208412, "epoch": 1240} {"train_loss": -10.948320388793945, "global_step": 208413, "epoch": 1240} {"train_loss": -11.225737571716309, "global_step": 208414, "epoch": 1240} {"train_loss": -11.574060440063477, "global_step": 208415, "epoch": 1240} {"train_loss": -11.170639038085938, "global_step": 208416, "epoch": 1240} {"train_loss": -11.429622650146484, "global_step": 208417, "epoch": 1240} {"train_loss": -11.474658966064453, "global_step": 208418, "epoch": 1240} {"train_loss": -11.515291213989258, "global_step": 208419, "epoch": 1240} {"train_loss": -11.539921760559082, "global_step": 208420, "epoch": 1240} {"train_loss": -11.493139266967773, "global_step": 208421, "epoch": 1240} {"train_loss": -11.416162490844727, "global_step": 208422, "epoch": 1240} {"train_loss": -11.599506378173828, "global_step": 208423, "epoch": 1240} {"train_loss": -11.554319381713867, "global_step": 208424, "epoch": 1240} {"train_loss": -11.456336975097656, "global_step": 208425, "epoch": 1240} {"train_loss": -11.598227500915527, "global_step": 208426, "epoch": 1240} {"train_loss": -11.760892868041992, "global_step": 208427, "epoch": 1240} {"train_loss": -11.73589038848877, "global_step": 208428, "epoch": 1240} {"train_loss": -11.599000930786133, "global_step": 208429, "epoch": 1240} {"train_loss": -11.574036598205566, "global_step": 208430, "epoch": 1240} {"train_loss": -11.690361976623535, "global_step": 208431, "epoch": 1240} {"train_loss": -11.714527130126953, "global_step": 208432, "epoch": 1240} {"train_loss": -11.734109878540039, "global_step": 208433, "epoch": 1240} {"train_loss": -11.683637619018555, "global_step": 208434, "epoch": 1240} {"train_loss": -11.562658309936523, "global_step": 208435, "epoch": 1240} {"train_loss": -11.66166877746582, "global_step": 208436, "epoch": 1240} {"train_loss": -11.566764831542969, "global_step": 208437, "epoch": 1240} {"train_loss": -11.793283462524414, "global_step": 208438, "epoch": 1240} {"train_loss": -11.566450119018555, "global_step": 208439, "epoch": 1240} {"train_loss": -11.645763397216797, "global_step": 208440, "epoch": 1240} {"train_loss": -11.780241012573242, "global_step": 208441, "epoch": 1240} {"train_loss": -11.767864227294922, "global_step": 208442, "epoch": 1240} {"train_loss": -11.631052017211914, "global_step": 208443, "epoch": 1240} {"train_loss": -11.800512313842773, "global_step": 208444, "epoch": 1240} {"train_loss": -11.86836051940918, "global_step": 208445, "epoch": 1240} {"train_loss": -11.662385940551758, "global_step": 208446, "epoch": 1240} {"train_loss": -11.557233810424805, "global_step": 208447, "epoch": 1240} {"train_loss": -11.918268203735352, "global_step": 208448, "epoch": 1240} {"train_loss": -11.370389938354492, "global_step": 208449, "epoch": 1240} {"train_loss": -11.613808631896973, "global_step": 208450, "epoch": 1240} {"train_loss": -11.8684720993042, "global_step": 208451, "epoch": 1240} {"train_loss": -11.23267936706543, "global_step": 208452, "epoch": 1240} {"train_loss": -10.089767456054688, "global_step": 208453, "epoch": 1240} {"train_loss": -10.888810157775879, "global_step": 208454, "epoch": 1240} {"train_loss": -11.63473129272461, "global_step": 208455, "epoch": 1240} {"train_loss": -11.113157272338867, "global_step": 208456, "epoch": 1240} {"train_loss": -10.462493896484375, "global_step": 208457, "epoch": 1240} {"train_loss": -11.716606140136719, "global_step": 208458, "epoch": 1240} {"train_loss": -10.428598403930664, "global_step": 208459, "epoch": 1240} {"train_loss": -10.011150360107422, "global_step": 208460, "epoch": 1240} {"train_loss": -10.431204795837402, "global_step": 208461, "epoch": 1240} {"train_loss": -11.419418334960938, "global_step": 208462, "epoch": 1240} {"train_loss": -11.05239200592041, "global_step": 208463, "epoch": 1240} {"train_loss": -11.421181678771973, "global_step": 208464, "epoch": 1240} {"train_loss": -11.462929725646973, "global_step": 208465, "epoch": 1240} {"train_loss": -10.85300350189209, "global_step": 208466, "epoch": 1240} {"train_loss": -11.019402503967285, "global_step": 208467, "epoch": 1240} {"train_loss": -11.072075843811035, "global_step": 208468, "epoch": 1240} {"train_loss": -11.60621452331543, "global_step": 208469, "epoch": 1240} {"train_loss": -10.788021087646484, "global_step": 208470, "epoch": 1240} {"train_loss": -11.260232925415039, "global_step": 208471, "epoch": 1240} {"train_loss": -10.956086158752441, "global_step": 208472, "epoch": 1240} {"train_loss": -11.224803924560547, "global_step": 208473, "epoch": 1240} {"train_loss": -11.004659652709961, "global_step": 208474, "epoch": 1240} {"train_loss": -11.152576446533203, "global_step": 208475, "epoch": 1240} {"train_loss": -11.105802536010742, "global_step": 208476, "epoch": 1240} {"train_loss": -11.409139633178711, "global_step": 208477, "epoch": 1240} {"train_loss": -11.280416488647461, "global_step": 208478, "epoch": 1240} {"train_loss": -11.262031555175781, "global_step": 208479, "epoch": 1240} {"train_loss": -11.31378173828125, "global_step": 208480, "epoch": 1240} {"train_loss": -11.605262756347656, "global_step": 208481, "epoch": 1240} {"train_loss": -11.255395889282227, "global_step": 208482, "epoch": 1240} {"train_loss": -11.467445373535156, "global_step": 208483, "epoch": 1240} {"train_loss": -11.398338317871094, "global_step": 208484, "epoch": 1240} {"train_loss": -11.787684440612793, "global_step": 208485, "epoch": 1240} {"train_loss": -11.160009384155273, "global_step": 208486, "epoch": 1240} {"train_loss": -11.235311054048085, "global_step": 208487, "epoch": 1240, "val_loss": 248498.515625, "train_action_mse_error": 0.6454320549964905} {"train_loss": -10.969873428344727, "global_step": 208488, "epoch": 1241} {"train_loss": -11.214702606201172, "global_step": 208489, "epoch": 1241} {"train_loss": -11.205679893493652, "global_step": 208490, "epoch": 1241} {"train_loss": -11.161056518554688, "global_step": 208491, "epoch": 1241} {"train_loss": -11.047386169433594, "global_step": 208492, "epoch": 1241} {"train_loss": -11.349004745483398, "global_step": 208493, "epoch": 1241} {"train_loss": -10.90267562866211, "global_step": 208494, "epoch": 1241} {"train_loss": -10.941965103149414, "global_step": 208495, "epoch": 1241} {"train_loss": -11.41845417022705, "global_step": 208496, "epoch": 1241} {"train_loss": -10.79273796081543, "global_step": 208497, "epoch": 1241} {"train_loss": -11.548599243164062, "global_step": 208498, "epoch": 1241} {"train_loss": -10.923376083374023, "global_step": 208499, "epoch": 1241} {"train_loss": -11.366268157958984, "global_step": 208500, "epoch": 1241} {"train_loss": -11.27568531036377, "global_step": 208501, "epoch": 1241} {"train_loss": -11.15049934387207, "global_step": 208502, "epoch": 1241} {"train_loss": -11.222835540771484, "global_step": 208503, "epoch": 1241} {"train_loss": -11.152738571166992, "global_step": 208504, "epoch": 1241} {"train_loss": -10.972454071044922, "global_step": 208505, "epoch": 1241} {"train_loss": -11.21429443359375, "global_step": 208506, "epoch": 1241} {"train_loss": -11.065760612487793, "global_step": 208507, "epoch": 1241} {"train_loss": -11.2878999710083, "global_step": 208508, "epoch": 1241} {"train_loss": -11.148670196533203, "global_step": 208509, "epoch": 1241} {"train_loss": -11.576583862304688, "global_step": 208510, "epoch": 1241} {"train_loss": -11.129207611083984, "global_step": 208511, "epoch": 1241} {"train_loss": -11.676542282104492, "global_step": 208512, "epoch": 1241} {"train_loss": -11.180459976196289, "global_step": 208513, "epoch": 1241} {"train_loss": -11.418214797973633, "global_step": 208514, "epoch": 1241} {"train_loss": -11.48727035522461, "global_step": 208515, "epoch": 1241} {"train_loss": -11.153665542602539, "global_step": 208516, "epoch": 1241} {"train_loss": -11.55052375793457, "global_step": 208517, "epoch": 1241} {"train_loss": -11.279269218444824, "global_step": 208518, "epoch": 1241} {"train_loss": -11.653814315795898, "global_step": 208519, "epoch": 1241} {"train_loss": -11.357942581176758, "global_step": 208520, "epoch": 1241} {"train_loss": -11.472935676574707, "global_step": 208521, "epoch": 1241} {"train_loss": -11.5633544921875, "global_step": 208522, "epoch": 1241} {"train_loss": -11.366888046264648, "global_step": 208523, "epoch": 1241} {"train_loss": -11.672100067138672, "global_step": 208524, "epoch": 1241} {"train_loss": -11.320551872253418, "global_step": 208525, "epoch": 1241} {"train_loss": -11.420567512512207, "global_step": 208526, "epoch": 1241} {"train_loss": -11.46884536743164, "global_step": 208527, "epoch": 1241} {"train_loss": -11.605278015136719, "global_step": 208528, "epoch": 1241} {"train_loss": -11.435117721557617, "global_step": 208529, "epoch": 1241} {"train_loss": -11.462312698364258, "global_step": 208530, "epoch": 1241} {"train_loss": -11.538089752197266, "global_step": 208531, "epoch": 1241} {"train_loss": -11.096577644348145, "global_step": 208532, "epoch": 1241} {"train_loss": -11.51222038269043, "global_step": 208533, "epoch": 1241} {"train_loss": -10.983015060424805, "global_step": 208534, "epoch": 1241} {"train_loss": -11.512182235717773, "global_step": 208535, "epoch": 1241} {"train_loss": -11.041802406311035, "global_step": 208536, "epoch": 1241} {"train_loss": -11.382061958312988, "global_step": 208537, "epoch": 1241} {"train_loss": -11.498723983764648, "global_step": 208538, "epoch": 1241} {"train_loss": -11.166297912597656, "global_step": 208539, "epoch": 1241} {"train_loss": -11.17947769165039, "global_step": 208540, "epoch": 1241} {"train_loss": -11.20370864868164, "global_step": 208541, "epoch": 1241} {"train_loss": -11.488773345947266, "global_step": 208542, "epoch": 1241} {"train_loss": -10.967170715332031, "global_step": 208543, "epoch": 1241} {"train_loss": -11.593830108642578, "global_step": 208544, "epoch": 1241} {"train_loss": -11.265548706054688, "global_step": 208545, "epoch": 1241} {"train_loss": -11.495767593383789, "global_step": 208546, "epoch": 1241} {"train_loss": -10.779457092285156, "global_step": 208547, "epoch": 1241} {"train_loss": -11.37595272064209, "global_step": 208548, "epoch": 1241} {"train_loss": -11.005413055419922, "global_step": 208549, "epoch": 1241} {"train_loss": -11.22951889038086, "global_step": 208550, "epoch": 1241} {"train_loss": -11.275672912597656, "global_step": 208551, "epoch": 1241} {"train_loss": -10.866874694824219, "global_step": 208552, "epoch": 1241} {"train_loss": -11.568452835083008, "global_step": 208553, "epoch": 1241} {"train_loss": -11.370529174804688, "global_step": 208554, "epoch": 1241} {"train_loss": -11.709707260131836, "global_step": 208555, "epoch": 1241} {"train_loss": -11.511510848999023, "global_step": 208556, "epoch": 1241} {"train_loss": -11.81434154510498, "global_step": 208557, "epoch": 1241} {"train_loss": -11.788776397705078, "global_step": 208558, "epoch": 1241} {"train_loss": -11.614253044128418, "global_step": 208559, "epoch": 1241} {"train_loss": -11.834981918334961, "global_step": 208560, "epoch": 1241} {"train_loss": -11.848718643188477, "global_step": 208561, "epoch": 1241} {"train_loss": -11.86376667022705, "global_step": 208562, "epoch": 1241} {"train_loss": -11.718240737915039, "global_step": 208563, "epoch": 1241} {"train_loss": -11.500604629516602, "global_step": 208564, "epoch": 1241} {"train_loss": -11.884421348571777, "global_step": 208565, "epoch": 1241} {"train_loss": -11.46641731262207, "global_step": 208566, "epoch": 1241} {"train_loss": -11.710824966430664, "global_step": 208567, "epoch": 1241} {"train_loss": -11.610481262207031, "global_step": 208568, "epoch": 1241} {"train_loss": -11.907035827636719, "global_step": 208569, "epoch": 1241} {"train_loss": -11.762250900268555, "global_step": 208570, "epoch": 1241} {"train_loss": -11.81329345703125, "global_step": 208571, "epoch": 1241} {"train_loss": -11.619964599609375, "global_step": 208572, "epoch": 1241} {"train_loss": -11.82199478149414, "global_step": 208573, "epoch": 1241} {"train_loss": -11.741543769836426, "global_step": 208574, "epoch": 1241} {"train_loss": -11.771657943725586, "global_step": 208575, "epoch": 1241} {"train_loss": -11.874592781066895, "global_step": 208576, "epoch": 1241} {"train_loss": -11.396596908569336, "global_step": 208577, "epoch": 1241} {"train_loss": -11.804330825805664, "global_step": 208578, "epoch": 1241} {"train_loss": -11.67348861694336, "global_step": 208579, "epoch": 1241} {"train_loss": -11.435669898986816, "global_step": 208580, "epoch": 1241} {"train_loss": -11.495508193969727, "global_step": 208581, "epoch": 1241} {"train_loss": -11.44582748413086, "global_step": 208582, "epoch": 1241} {"train_loss": -11.331645965576172, "global_step": 208583, "epoch": 1241} {"train_loss": -11.379706382751465, "global_step": 208584, "epoch": 1241} {"train_loss": -11.48309326171875, "global_step": 208585, "epoch": 1241} {"train_loss": -11.311263084411621, "global_step": 208586, "epoch": 1241} {"train_loss": -11.577447891235352, "global_step": 208587, "epoch": 1241} {"train_loss": -11.278715133666992, "global_step": 208588, "epoch": 1241} {"train_loss": -11.133888244628906, "global_step": 208589, "epoch": 1241} {"train_loss": -11.770155906677246, "global_step": 208590, "epoch": 1241} {"train_loss": -11.43061637878418, "global_step": 208591, "epoch": 1241} {"train_loss": -11.315774917602539, "global_step": 208592, "epoch": 1241} {"train_loss": -11.275494575500488, "global_step": 208593, "epoch": 1241} {"train_loss": -11.483634948730469, "global_step": 208594, "epoch": 1241} {"train_loss": -11.095787048339844, "global_step": 208595, "epoch": 1241} {"train_loss": -11.539730072021484, "global_step": 208596, "epoch": 1241} {"train_loss": -11.373254776000977, "global_step": 208597, "epoch": 1241} {"train_loss": -11.384441375732422, "global_step": 208598, "epoch": 1241} {"train_loss": -11.477699279785156, "global_step": 208599, "epoch": 1241} {"train_loss": -11.3167724609375, "global_step": 208600, "epoch": 1241} {"train_loss": -11.59032917022705, "global_step": 208601, "epoch": 1241} {"train_loss": -11.477134704589844, "global_step": 208602, "epoch": 1241} {"train_loss": -11.613248825073242, "global_step": 208603, "epoch": 1241} {"train_loss": -11.73509407043457, "global_step": 208604, "epoch": 1241} {"train_loss": -11.696093559265137, "global_step": 208605, "epoch": 1241} {"train_loss": -11.364068984985352, "global_step": 208606, "epoch": 1241} {"train_loss": -11.71883487701416, "global_step": 208607, "epoch": 1241} {"train_loss": -11.574167251586914, "global_step": 208608, "epoch": 1241} {"train_loss": -11.736795425415039, "global_step": 208609, "epoch": 1241} {"train_loss": -11.21563720703125, "global_step": 208610, "epoch": 1241} {"train_loss": -11.323241233825684, "global_step": 208611, "epoch": 1241} {"train_loss": -11.687612533569336, "global_step": 208612, "epoch": 1241} {"train_loss": -11.547738075256348, "global_step": 208613, "epoch": 1241} {"train_loss": -10.95747184753418, "global_step": 208614, "epoch": 1241} {"train_loss": -11.487154960632324, "global_step": 208615, "epoch": 1241} {"train_loss": -11.23072338104248, "global_step": 208616, "epoch": 1241} {"train_loss": -11.244091033935547, "global_step": 208617, "epoch": 1241} {"train_loss": -10.946237564086914, "global_step": 208618, "epoch": 1241} {"train_loss": -11.083399772644043, "global_step": 208619, "epoch": 1241} {"train_loss": -11.28664779663086, "global_step": 208620, "epoch": 1241} {"train_loss": -11.29948616027832, "global_step": 208621, "epoch": 1241} {"train_loss": -11.32349681854248, "global_step": 208622, "epoch": 1241} {"train_loss": -11.404479026794434, "global_step": 208623, "epoch": 1241} {"train_loss": -11.211477279663086, "global_step": 208624, "epoch": 1241} {"train_loss": -11.198022842407227, "global_step": 208625, "epoch": 1241} {"train_loss": -10.887367248535156, "global_step": 208626, "epoch": 1241} {"train_loss": -11.22134017944336, "global_step": 208627, "epoch": 1241} {"train_loss": -11.468549728393555, "global_step": 208628, "epoch": 1241} {"train_loss": -11.209268569946289, "global_step": 208629, "epoch": 1241} {"train_loss": -11.307815551757812, "global_step": 208630, "epoch": 1241} {"train_loss": -10.995405197143555, "global_step": 208631, "epoch": 1241} {"train_loss": -10.794775009155273, "global_step": 208632, "epoch": 1241} {"train_loss": -11.570072174072266, "global_step": 208633, "epoch": 1241} {"train_loss": -11.041810989379883, "global_step": 208634, "epoch": 1241} {"train_loss": -11.474359512329102, "global_step": 208635, "epoch": 1241} {"train_loss": -10.941791534423828, "global_step": 208636, "epoch": 1241} {"train_loss": -11.179624557495117, "global_step": 208637, "epoch": 1241} {"train_loss": -11.49093246459961, "global_step": 208638, "epoch": 1241} {"train_loss": -10.963579177856445, "global_step": 208639, "epoch": 1241} {"train_loss": -11.074006080627441, "global_step": 208640, "epoch": 1241} {"train_loss": -11.2326021194458, "global_step": 208641, "epoch": 1241} {"train_loss": -11.019097328186035, "global_step": 208642, "epoch": 1241} {"train_loss": -11.441869735717773, "global_step": 208643, "epoch": 1241} {"train_loss": -10.992899894714355, "global_step": 208644, "epoch": 1241} {"train_loss": -11.194467544555664, "global_step": 208645, "epoch": 1241} {"train_loss": -11.046613693237305, "global_step": 208646, "epoch": 1241} {"train_loss": -11.179789543151855, "global_step": 208647, "epoch": 1241} {"train_loss": -10.861153602600098, "global_step": 208648, "epoch": 1241} {"train_loss": -11.180368423461914, "global_step": 208649, "epoch": 1241} {"train_loss": -11.59344482421875, "global_step": 208650, "epoch": 1241} {"train_loss": -11.07281494140625, "global_step": 208651, "epoch": 1241} {"train_loss": -11.686895370483398, "global_step": 208652, "epoch": 1241} {"train_loss": -11.52334976196289, "global_step": 208653, "epoch": 1241} {"train_loss": -10.86374282836914, "global_step": 208654, "epoch": 1241} {"train_loss": -11.364105150813149, "global_step": 208655, "epoch": 1241, "val_loss": 257641.703125} {"train_loss": -10.785924911499023, "global_step": 208656, "epoch": 1242} {"train_loss": -11.008190155029297, "global_step": 208657, "epoch": 1242} {"train_loss": -11.507396697998047, "global_step": 208658, "epoch": 1242} {"train_loss": -11.126189231872559, "global_step": 208659, "epoch": 1242} {"train_loss": -11.496143341064453, "global_step": 208660, "epoch": 1242} {"train_loss": -11.501763343811035, "global_step": 208661, "epoch": 1242} {"train_loss": -11.172542572021484, "global_step": 208662, "epoch": 1242} {"train_loss": -10.989164352416992, "global_step": 208663, "epoch": 1242} {"train_loss": -11.307365417480469, "global_step": 208664, "epoch": 1242} {"train_loss": -11.619640350341797, "global_step": 208665, "epoch": 1242} {"train_loss": -11.2930326461792, "global_step": 208666, "epoch": 1242} {"train_loss": -11.665079116821289, "global_step": 208667, "epoch": 1242} {"train_loss": -11.244855880737305, "global_step": 208668, "epoch": 1242} {"train_loss": -11.54996109008789, "global_step": 208669, "epoch": 1242} {"train_loss": -11.23263168334961, "global_step": 208670, "epoch": 1242} {"train_loss": -11.719381332397461, "global_step": 208671, "epoch": 1242} {"train_loss": -10.59878921508789, "global_step": 208672, "epoch": 1242} {"train_loss": -11.805150985717773, "global_step": 208673, "epoch": 1242} {"train_loss": -10.814094543457031, "global_step": 208674, "epoch": 1242} {"train_loss": -10.687379837036133, "global_step": 208675, "epoch": 1242} {"train_loss": -11.446283340454102, "global_step": 208676, "epoch": 1242} {"train_loss": -10.544506072998047, "global_step": 208677, "epoch": 1242} {"train_loss": -11.243511199951172, "global_step": 208678, "epoch": 1242} {"train_loss": -11.101122856140137, "global_step": 208679, "epoch": 1242} {"train_loss": -10.781015396118164, "global_step": 208680, "epoch": 1242} {"train_loss": -11.358742713928223, "global_step": 208681, "epoch": 1242} {"train_loss": -10.640054702758789, "global_step": 208682, "epoch": 1242} {"train_loss": -11.20218276977539, "global_step": 208683, "epoch": 1242} {"train_loss": -11.021060943603516, "global_step": 208684, "epoch": 1242} {"train_loss": -11.209738731384277, "global_step": 208685, "epoch": 1242} {"train_loss": -11.287837028503418, "global_step": 208686, "epoch": 1242} {"train_loss": -10.955055236816406, "global_step": 208687, "epoch": 1242} {"train_loss": -11.448835372924805, "global_step": 208688, "epoch": 1242} {"train_loss": -10.20609188079834, "global_step": 208689, "epoch": 1242} {"train_loss": -11.604101181030273, "global_step": 208690, "epoch": 1242} {"train_loss": -10.380599021911621, "global_step": 208691, "epoch": 1242} {"train_loss": -9.74291706085205, "global_step": 208692, "epoch": 1242} {"train_loss": -10.680566787719727, "global_step": 208693, "epoch": 1242} {"train_loss": -9.759822845458984, "global_step": 208694, "epoch": 1242} {"train_loss": -10.890077590942383, "global_step": 208695, "epoch": 1242} {"train_loss": -9.169525146484375, "global_step": 208696, "epoch": 1242} {"train_loss": -11.087224960327148, "global_step": 208697, "epoch": 1242} {"train_loss": -9.094168663024902, "global_step": 208698, "epoch": 1242} {"train_loss": -10.524003982543945, "global_step": 208699, "epoch": 1242} {"train_loss": -9.826973915100098, "global_step": 208700, "epoch": 1242} {"train_loss": -10.039777755737305, "global_step": 208701, "epoch": 1242} {"train_loss": -9.536428451538086, "global_step": 208702, "epoch": 1242} {"train_loss": -9.213842391967773, "global_step": 208703, "epoch": 1242} {"train_loss": -10.382104873657227, "global_step": 208704, "epoch": 1242} {"train_loss": -8.80355453491211, "global_step": 208705, "epoch": 1242} {"train_loss": -10.709685325622559, "global_step": 208706, "epoch": 1242} {"train_loss": -9.175674438476562, "global_step": 208707, "epoch": 1242} {"train_loss": -10.33692741394043, "global_step": 208708, "epoch": 1242} {"train_loss": -9.649173736572266, "global_step": 208709, "epoch": 1242} {"train_loss": -10.200929641723633, "global_step": 208710, "epoch": 1242} {"train_loss": -10.631356239318848, "global_step": 208711, "epoch": 1242} {"train_loss": -9.975885391235352, "global_step": 208712, "epoch": 1242} {"train_loss": -10.562358856201172, "global_step": 208713, "epoch": 1242} {"train_loss": -10.908447265625, "global_step": 208714, "epoch": 1242} {"train_loss": -10.945916175842285, "global_step": 208715, "epoch": 1242} {"train_loss": -11.092121124267578, "global_step": 208716, "epoch": 1242} {"train_loss": -10.892593383789062, "global_step": 208717, "epoch": 1242} {"train_loss": -10.696516036987305, "global_step": 208718, "epoch": 1242} {"train_loss": -11.069047927856445, "global_step": 208719, "epoch": 1242} {"train_loss": -10.763794898986816, "global_step": 208720, "epoch": 1242} {"train_loss": -11.067479133605957, "global_step": 208721, "epoch": 1242} {"train_loss": -10.93433952331543, "global_step": 208722, "epoch": 1242} {"train_loss": -10.88913345336914, "global_step": 208723, "epoch": 1242} {"train_loss": -11.288936614990234, "global_step": 208724, "epoch": 1242} {"train_loss": -11.054414749145508, "global_step": 208725, "epoch": 1242} {"train_loss": -11.164539337158203, "global_step": 208726, "epoch": 1242} {"train_loss": -11.235736846923828, "global_step": 208727, "epoch": 1242} {"train_loss": -11.011934280395508, "global_step": 208728, "epoch": 1242} {"train_loss": -11.261199951171875, "global_step": 208729, "epoch": 1242} {"train_loss": -11.202804565429688, "global_step": 208730, "epoch": 1242} {"train_loss": -11.009742736816406, "global_step": 208731, "epoch": 1242} {"train_loss": -11.344087600708008, "global_step": 208732, "epoch": 1242} {"train_loss": -11.326809883117676, "global_step": 208733, "epoch": 1242} {"train_loss": -11.14250373840332, "global_step": 208734, "epoch": 1242} {"train_loss": -11.200855255126953, "global_step": 208735, "epoch": 1242} {"train_loss": -11.212888717651367, "global_step": 208736, "epoch": 1242} {"train_loss": -11.316788673400879, "global_step": 208737, "epoch": 1242} {"train_loss": -11.20329475402832, "global_step": 208738, "epoch": 1242} {"train_loss": -11.208821296691895, "global_step": 208739, "epoch": 1242} {"train_loss": -11.334562301635742, "global_step": 208740, "epoch": 1242} {"train_loss": -11.326037406921387, "global_step": 208741, "epoch": 1242} {"train_loss": -11.392633438110352, "global_step": 208742, "epoch": 1242} {"train_loss": -11.508601188659668, "global_step": 208743, "epoch": 1242} {"train_loss": -11.452560424804688, "global_step": 208744, "epoch": 1242} {"train_loss": -11.318726539611816, "global_step": 208745, "epoch": 1242} {"train_loss": -11.522978782653809, "global_step": 208746, "epoch": 1242} {"train_loss": -11.529212951660156, "global_step": 208747, "epoch": 1242} {"train_loss": -11.45213794708252, "global_step": 208748, "epoch": 1242} {"train_loss": -11.617780685424805, "global_step": 208749, "epoch": 1242} {"train_loss": -11.499421119689941, "global_step": 208750, "epoch": 1242} {"train_loss": -11.622743606567383, "global_step": 208751, "epoch": 1242} {"train_loss": -11.47943115234375, "global_step": 208752, "epoch": 1242} {"train_loss": -11.575557708740234, "global_step": 208753, "epoch": 1242} {"train_loss": -11.5619478225708, "global_step": 208754, "epoch": 1242} {"train_loss": -11.543619155883789, "global_step": 208755, "epoch": 1242} {"train_loss": -11.629158020019531, "global_step": 208756, "epoch": 1242} {"train_loss": -11.578311920166016, "global_step": 208757, "epoch": 1242} {"train_loss": -11.633052825927734, "global_step": 208758, "epoch": 1242} {"train_loss": -11.659582138061523, "global_step": 208759, "epoch": 1242} {"train_loss": -11.696260452270508, "global_step": 208760, "epoch": 1242} {"train_loss": -11.711565017700195, "global_step": 208761, "epoch": 1242} {"train_loss": -11.474422454833984, "global_step": 208762, "epoch": 1242} {"train_loss": -11.637908935546875, "global_step": 208763, "epoch": 1242} {"train_loss": -11.739408493041992, "global_step": 208764, "epoch": 1242} {"train_loss": -11.533906936645508, "global_step": 208765, "epoch": 1242} {"train_loss": -11.888312339782715, "global_step": 208766, "epoch": 1242} {"train_loss": -11.755733489990234, "global_step": 208767, "epoch": 1242} {"train_loss": -11.846579551696777, "global_step": 208768, "epoch": 1242} {"train_loss": -11.715336799621582, "global_step": 208769, "epoch": 1242} {"train_loss": -11.588522911071777, "global_step": 208770, "epoch": 1242} {"train_loss": -11.66193962097168, "global_step": 208771, "epoch": 1242} {"train_loss": -11.67566967010498, "global_step": 208772, "epoch": 1242} {"train_loss": -11.632650375366211, "global_step": 208773, "epoch": 1242} {"train_loss": -11.785767555236816, "global_step": 208774, "epoch": 1242} {"train_loss": -11.909866333007812, "global_step": 208775, "epoch": 1242} {"train_loss": -11.806278228759766, "global_step": 208776, "epoch": 1242} {"train_loss": -11.721626281738281, "global_step": 208777, "epoch": 1242} {"train_loss": -11.822956085205078, "global_step": 208778, "epoch": 1242} {"train_loss": -11.866514205932617, "global_step": 208779, "epoch": 1242} {"train_loss": -11.837827682495117, "global_step": 208780, "epoch": 1242} {"train_loss": -12.072999954223633, "global_step": 208781, "epoch": 1242} {"train_loss": -11.84014892578125, "global_step": 208782, "epoch": 1242} {"train_loss": -11.997686386108398, "global_step": 208783, "epoch": 1242} {"train_loss": -11.831665992736816, "global_step": 208784, "epoch": 1242} {"train_loss": -11.95758056640625, "global_step": 208785, "epoch": 1242} {"train_loss": -11.83071231842041, "global_step": 208786, "epoch": 1242} {"train_loss": -12.027637481689453, "global_step": 208787, "epoch": 1242} {"train_loss": -11.690428733825684, "global_step": 208788, "epoch": 1242} {"train_loss": -11.519012451171875, "global_step": 208789, "epoch": 1242} {"train_loss": -11.62547492980957, "global_step": 208790, "epoch": 1242} {"train_loss": -10.631913185119629, "global_step": 208791, "epoch": 1242} {"train_loss": -11.526976585388184, "global_step": 208792, "epoch": 1242} {"train_loss": -11.067594528198242, "global_step": 208793, "epoch": 1242} {"train_loss": -11.240163803100586, "global_step": 208794, "epoch": 1242} {"train_loss": -11.237785339355469, "global_step": 208795, "epoch": 1242} {"train_loss": -11.125308990478516, "global_step": 208796, "epoch": 1242} {"train_loss": -11.426036834716797, "global_step": 208797, "epoch": 1242} {"train_loss": -11.127500534057617, "global_step": 208798, "epoch": 1242} {"train_loss": -11.24006462097168, "global_step": 208799, "epoch": 1242} {"train_loss": -10.804084777832031, "global_step": 208800, "epoch": 1242} {"train_loss": -10.297935485839844, "global_step": 208801, "epoch": 1242} {"train_loss": -10.97651195526123, "global_step": 208802, "epoch": 1242} {"train_loss": -11.022171020507812, "global_step": 208803, "epoch": 1242} {"train_loss": -11.247421264648438, "global_step": 208804, "epoch": 1242} {"train_loss": -11.688803672790527, "global_step": 208805, "epoch": 1242} {"train_loss": -11.355661392211914, "global_step": 208806, "epoch": 1242} {"train_loss": -10.855672836303711, "global_step": 208807, "epoch": 1242} {"train_loss": -11.020023345947266, "global_step": 208808, "epoch": 1242} {"train_loss": -11.134510040283203, "global_step": 208809, "epoch": 1242} {"train_loss": -11.139301300048828, "global_step": 208810, "epoch": 1242} {"train_loss": -10.986478805541992, "global_step": 208811, "epoch": 1242} {"train_loss": -10.953348159790039, "global_step": 208812, "epoch": 1242} {"train_loss": -10.673900604248047, "global_step": 208813, "epoch": 1242} {"train_loss": -11.203227996826172, "global_step": 208814, "epoch": 1242} {"train_loss": -11.195552825927734, "global_step": 208815, "epoch": 1242} {"train_loss": -10.891653060913086, "global_step": 208816, "epoch": 1242} {"train_loss": -10.986309051513672, "global_step": 208817, "epoch": 1242} {"train_loss": -10.2611083984375, "global_step": 208818, "epoch": 1242} {"train_loss": -10.590883255004883, "global_step": 208819, "epoch": 1242} {"train_loss": -10.43820571899414, "global_step": 208820, "epoch": 1242} {"train_loss": -10.937233924865723, "global_step": 208821, "epoch": 1242} {"train_loss": -10.609025955200195, "global_step": 208822, "epoch": 1242} {"train_loss": -11.116087919189816, "global_step": 208823, "epoch": 1242, "val_loss": 256377.1875} {"train_loss": -10.24577808380127, "global_step": 208824, "epoch": 1243} {"train_loss": -10.797258377075195, "global_step": 208825, "epoch": 1243} {"train_loss": -9.397528648376465, "global_step": 208826, "epoch": 1243} {"train_loss": -11.05282211303711, "global_step": 208827, "epoch": 1243} {"train_loss": -10.517562866210938, "global_step": 208828, "epoch": 1243} {"train_loss": -10.52422046661377, "global_step": 208829, "epoch": 1243} {"train_loss": -10.222283363342285, "global_step": 208830, "epoch": 1243} {"train_loss": -10.49760627746582, "global_step": 208831, "epoch": 1243} {"train_loss": -9.857484817504883, "global_step": 208832, "epoch": 1243} {"train_loss": -11.180051803588867, "global_step": 208833, "epoch": 1243} {"train_loss": -10.287649154663086, "global_step": 208834, "epoch": 1243} {"train_loss": -10.382630348205566, "global_step": 208835, "epoch": 1243} {"train_loss": -11.215919494628906, "global_step": 208836, "epoch": 1243} {"train_loss": -10.481155395507812, "global_step": 208837, "epoch": 1243} {"train_loss": -11.213184356689453, "global_step": 208838, "epoch": 1243} {"train_loss": -10.305342674255371, "global_step": 208839, "epoch": 1243} {"train_loss": -10.188998222351074, "global_step": 208840, "epoch": 1243} {"train_loss": -10.900165557861328, "global_step": 208841, "epoch": 1243} {"train_loss": -10.578102111816406, "global_step": 208842, "epoch": 1243} {"train_loss": -10.477789878845215, "global_step": 208843, "epoch": 1243} {"train_loss": -11.022098541259766, "global_step": 208844, "epoch": 1243} {"train_loss": -10.941736221313477, "global_step": 208845, "epoch": 1243} {"train_loss": -10.753824234008789, "global_step": 208846, "epoch": 1243} {"train_loss": -10.948662757873535, "global_step": 208847, "epoch": 1243} {"train_loss": -10.840805053710938, "global_step": 208848, "epoch": 1243} {"train_loss": -10.511188507080078, "global_step": 208849, "epoch": 1243} {"train_loss": -11.263542175292969, "global_step": 208850, "epoch": 1243} {"train_loss": -10.85295295715332, "global_step": 208851, "epoch": 1243} {"train_loss": -10.88539981842041, "global_step": 208852, "epoch": 1243} {"train_loss": -10.900623321533203, "global_step": 208853, "epoch": 1243} {"train_loss": -11.114490509033203, "global_step": 208854, "epoch": 1243} {"train_loss": -10.656222343444824, "global_step": 208855, "epoch": 1243} {"train_loss": -10.792570114135742, "global_step": 208856, "epoch": 1243} {"train_loss": -11.331610679626465, "global_step": 208857, "epoch": 1243} {"train_loss": -10.936675071716309, "global_step": 208858, "epoch": 1243} {"train_loss": -10.983250617980957, "global_step": 208859, "epoch": 1243} {"train_loss": -11.38046646118164, "global_step": 208860, "epoch": 1243} {"train_loss": -11.210366249084473, "global_step": 208861, "epoch": 1243} {"train_loss": -10.981833457946777, "global_step": 208862, "epoch": 1243} {"train_loss": -11.419559478759766, "global_step": 208863, "epoch": 1243} {"train_loss": -11.331222534179688, "global_step": 208864, "epoch": 1243} {"train_loss": -11.325879096984863, "global_step": 208865, "epoch": 1243} {"train_loss": -11.445329666137695, "global_step": 208866, "epoch": 1243} {"train_loss": -11.344980239868164, "global_step": 208867, "epoch": 1243} {"train_loss": -11.31392765045166, "global_step": 208868, "epoch": 1243} {"train_loss": -11.31813907623291, "global_step": 208869, "epoch": 1243} {"train_loss": -11.436625480651855, "global_step": 208870, "epoch": 1243} {"train_loss": -11.347692489624023, "global_step": 208871, "epoch": 1243} {"train_loss": -11.434127807617188, "global_step": 208872, "epoch": 1243} {"train_loss": -11.462233543395996, "global_step": 208873, "epoch": 1243} {"train_loss": -11.39756965637207, "global_step": 208874, "epoch": 1243} {"train_loss": -11.518779754638672, "global_step": 208875, "epoch": 1243} {"train_loss": -11.594202041625977, "global_step": 208876, "epoch": 1243} {"train_loss": -11.471649169921875, "global_step": 208877, "epoch": 1243} {"train_loss": -11.469873428344727, "global_step": 208878, "epoch": 1243} {"train_loss": -11.695369720458984, "global_step": 208879, "epoch": 1243} {"train_loss": -11.824811935424805, "global_step": 208880, "epoch": 1243} {"train_loss": -11.576401710510254, "global_step": 208881, "epoch": 1243} {"train_loss": -11.818095207214355, "global_step": 208882, "epoch": 1243} {"train_loss": -11.768272399902344, "global_step": 208883, "epoch": 1243} {"train_loss": -11.736800193786621, "global_step": 208884, "epoch": 1243} {"train_loss": -11.552574157714844, "global_step": 208885, "epoch": 1243} {"train_loss": -11.786295890808105, "global_step": 208886, "epoch": 1243} {"train_loss": -11.772655487060547, "global_step": 208887, "epoch": 1243} {"train_loss": -11.873085021972656, "global_step": 208888, "epoch": 1243} {"train_loss": -11.815241813659668, "global_step": 208889, "epoch": 1243} {"train_loss": -11.880623817443848, "global_step": 208890, "epoch": 1243} {"train_loss": -11.822901725769043, "global_step": 208891, "epoch": 1243} {"train_loss": -11.889568328857422, "global_step": 208892, "epoch": 1243} {"train_loss": -11.748781204223633, "global_step": 208893, "epoch": 1243} {"train_loss": -11.822216033935547, "global_step": 208894, "epoch": 1243} {"train_loss": -11.871074676513672, "global_step": 208895, "epoch": 1243} {"train_loss": -11.890427589416504, "global_step": 208896, "epoch": 1243} {"train_loss": -11.853004455566406, "global_step": 208897, "epoch": 1243} {"train_loss": -11.911154747009277, "global_step": 208898, "epoch": 1243} {"train_loss": -11.827926635742188, "global_step": 208899, "epoch": 1243} {"train_loss": -12.027008056640625, "global_step": 208900, "epoch": 1243} {"train_loss": -11.926742553710938, "global_step": 208901, "epoch": 1243} {"train_loss": -11.914741516113281, "global_step": 208902, "epoch": 1243} {"train_loss": -11.800047874450684, "global_step": 208903, "epoch": 1243} {"train_loss": -11.80776596069336, "global_step": 208904, "epoch": 1243} {"train_loss": -11.98664665222168, "global_step": 208905, "epoch": 1243} {"train_loss": -11.756545066833496, "global_step": 208906, "epoch": 1243} {"train_loss": -11.904733657836914, "global_step": 208907, "epoch": 1243} {"train_loss": -11.70167350769043, "global_step": 208908, "epoch": 1243} {"train_loss": -11.863489151000977, "global_step": 208909, "epoch": 1243} {"train_loss": -11.545979499816895, "global_step": 208910, "epoch": 1243} {"train_loss": -11.553094863891602, "global_step": 208911, "epoch": 1243} {"train_loss": -11.660934448242188, "global_step": 208912, "epoch": 1243} {"train_loss": -11.37507438659668, "global_step": 208913, "epoch": 1243} {"train_loss": -11.123618125915527, "global_step": 208914, "epoch": 1243} {"train_loss": -11.262823104858398, "global_step": 208915, "epoch": 1243} {"train_loss": -11.450417518615723, "global_step": 208916, "epoch": 1243} {"train_loss": -10.639278411865234, "global_step": 208917, "epoch": 1243} {"train_loss": -9.879046440124512, "global_step": 208918, "epoch": 1243} {"train_loss": -10.235322952270508, "global_step": 208919, "epoch": 1243} {"train_loss": -10.522022247314453, "global_step": 208920, "epoch": 1243} {"train_loss": -10.214646339416504, "global_step": 208921, "epoch": 1243} {"train_loss": -10.347222328186035, "global_step": 208922, "epoch": 1243} {"train_loss": -8.845014572143555, "global_step": 208923, "epoch": 1243} {"train_loss": -10.835174560546875, "global_step": 208924, "epoch": 1243} {"train_loss": -9.167930603027344, "global_step": 208925, "epoch": 1243} {"train_loss": -10.40084171295166, "global_step": 208926, "epoch": 1243} {"train_loss": -9.754608154296875, "global_step": 208927, "epoch": 1243} {"train_loss": -7.7398905754089355, "global_step": 208928, "epoch": 1243} {"train_loss": -8.144815444946289, "global_step": 208929, "epoch": 1243} {"train_loss": -10.246912956237793, "global_step": 208930, "epoch": 1243} {"train_loss": -8.453733444213867, "global_step": 208931, "epoch": 1243} {"train_loss": -10.43478775024414, "global_step": 208932, "epoch": 1243} {"train_loss": -9.093050003051758, "global_step": 208933, "epoch": 1243} {"train_loss": -9.155719757080078, "global_step": 208934, "epoch": 1243} {"train_loss": -8.783747673034668, "global_step": 208935, "epoch": 1243} {"train_loss": -9.439020156860352, "global_step": 208936, "epoch": 1243} {"train_loss": -10.34776782989502, "global_step": 208937, "epoch": 1243} {"train_loss": -9.414847373962402, "global_step": 208938, "epoch": 1243} {"train_loss": -10.341211318969727, "global_step": 208939, "epoch": 1243} {"train_loss": -10.196893692016602, "global_step": 208940, "epoch": 1243} {"train_loss": -10.415090560913086, "global_step": 208941, "epoch": 1243} {"train_loss": -10.177912712097168, "global_step": 208942, "epoch": 1243} {"train_loss": -10.935951232910156, "global_step": 208943, "epoch": 1243} {"train_loss": -10.34226131439209, "global_step": 208944, "epoch": 1243} {"train_loss": -10.64009952545166, "global_step": 208945, "epoch": 1243} {"train_loss": -10.883281707763672, "global_step": 208946, "epoch": 1243} {"train_loss": -10.417454719543457, "global_step": 208947, "epoch": 1243} {"train_loss": -10.793771743774414, "global_step": 208948, "epoch": 1243} {"train_loss": -10.885869979858398, "global_step": 208949, "epoch": 1243} {"train_loss": -10.90622329711914, "global_step": 208950, "epoch": 1243} {"train_loss": -10.84567642211914, "global_step": 208951, "epoch": 1243} {"train_loss": -10.801992416381836, "global_step": 208952, "epoch": 1243} {"train_loss": -11.111040115356445, "global_step": 208953, "epoch": 1243} {"train_loss": -10.823200225830078, "global_step": 208954, "epoch": 1243} {"train_loss": -11.21712589263916, "global_step": 208955, "epoch": 1243} {"train_loss": -10.955282211303711, "global_step": 208956, "epoch": 1243} {"train_loss": -10.978437423706055, "global_step": 208957, "epoch": 1243} {"train_loss": -11.151578903198242, "global_step": 208958, "epoch": 1243} {"train_loss": -11.037177085876465, "global_step": 208959, "epoch": 1243} {"train_loss": -10.832664489746094, "global_step": 208960, "epoch": 1243} {"train_loss": -11.003433227539062, "global_step": 208961, "epoch": 1243} {"train_loss": -10.904488563537598, "global_step": 208962, "epoch": 1243} {"train_loss": -11.281116485595703, "global_step": 208963, "epoch": 1243} {"train_loss": -10.793119430541992, "global_step": 208964, "epoch": 1243} {"train_loss": -10.99135971069336, "global_step": 208965, "epoch": 1243} {"train_loss": -11.148646354675293, "global_step": 208966, "epoch": 1243} {"train_loss": -10.906972885131836, "global_step": 208967, "epoch": 1243} {"train_loss": -11.115751266479492, "global_step": 208968, "epoch": 1243} {"train_loss": -11.137971878051758, "global_step": 208969, "epoch": 1243} {"train_loss": -11.112451553344727, "global_step": 208970, "epoch": 1243} {"train_loss": -10.92345142364502, "global_step": 208971, "epoch": 1243} {"train_loss": -11.087202072143555, "global_step": 208972, "epoch": 1243} {"train_loss": -11.141960144042969, "global_step": 208973, "epoch": 1243} {"train_loss": -11.341100692749023, "global_step": 208974, "epoch": 1243} {"train_loss": -11.366355895996094, "global_step": 208975, "epoch": 1243} {"train_loss": -11.245935440063477, "global_step": 208976, "epoch": 1243} {"train_loss": -11.219409942626953, "global_step": 208977, "epoch": 1243} {"train_loss": -11.129812240600586, "global_step": 208978, "epoch": 1243} {"train_loss": -11.233346939086914, "global_step": 208979, "epoch": 1243} {"train_loss": -11.37766170501709, "global_step": 208980, "epoch": 1243} {"train_loss": -11.423038482666016, "global_step": 208981, "epoch": 1243} {"train_loss": -11.514472007751465, "global_step": 208982, "epoch": 1243} {"train_loss": -11.314906120300293, "global_step": 208983, "epoch": 1243} {"train_loss": -11.202591896057129, "global_step": 208984, "epoch": 1243} {"train_loss": -11.384037971496582, "global_step": 208985, "epoch": 1243} {"train_loss": -11.425898551940918, "global_step": 208986, "epoch": 1243} {"train_loss": -11.543791770935059, "global_step": 208987, "epoch": 1243} {"train_loss": -11.561721801757812, "global_step": 208988, "epoch": 1243} {"train_loss": -11.524534225463867, "global_step": 208989, "epoch": 1243} {"train_loss": -11.502604484558105, "global_step": 208990, "epoch": 1243} {"train_loss": -10.980839510758718, "global_step": 208991, "epoch": 1243, "val_loss": 252544.53125} {"train_loss": -11.600725173950195, "global_step": 208992, "epoch": 1244} {"train_loss": -11.511454582214355, "global_step": 208993, "epoch": 1244} {"train_loss": -11.43091869354248, "global_step": 208994, "epoch": 1244} {"train_loss": -11.595138549804688, "global_step": 208995, "epoch": 1244} {"train_loss": -11.659168243408203, "global_step": 208996, "epoch": 1244} {"train_loss": -11.692577362060547, "global_step": 208997, "epoch": 1244} {"train_loss": -11.646458625793457, "global_step": 208998, "epoch": 1244} {"train_loss": -11.745670318603516, "global_step": 208999, "epoch": 1244} {"train_loss": -11.60883903503418, "global_step": 209000, "epoch": 1244} {"train_loss": -11.677980422973633, "global_step": 209001, "epoch": 1244} {"train_loss": -11.623656272888184, "global_step": 209002, "epoch": 1244} {"train_loss": -11.470916748046875, "global_step": 209003, "epoch": 1244} {"train_loss": -11.667633056640625, "global_step": 209004, "epoch": 1244} {"train_loss": -11.586524963378906, "global_step": 209005, "epoch": 1244} {"train_loss": -11.59412956237793, "global_step": 209006, "epoch": 1244} {"train_loss": -11.813142776489258, "global_step": 209007, "epoch": 1244} {"train_loss": -11.52483081817627, "global_step": 209008, "epoch": 1244} {"train_loss": -11.559510231018066, "global_step": 209009, "epoch": 1244} {"train_loss": -11.727182388305664, "global_step": 209010, "epoch": 1244} {"train_loss": -11.79218864440918, "global_step": 209011, "epoch": 1244} {"train_loss": -11.76915454864502, "global_step": 209012, "epoch": 1244} {"train_loss": -11.637443542480469, "global_step": 209013, "epoch": 1244} {"train_loss": -11.681567192077637, "global_step": 209014, "epoch": 1244} {"train_loss": -11.848979949951172, "global_step": 209015, "epoch": 1244} {"train_loss": -11.704419136047363, "global_step": 209016, "epoch": 1244} {"train_loss": -11.429378509521484, "global_step": 209017, "epoch": 1244} {"train_loss": -11.821980476379395, "global_step": 209018, "epoch": 1244} {"train_loss": -11.78924560546875, "global_step": 209019, "epoch": 1244} {"train_loss": -11.584598541259766, "global_step": 209020, "epoch": 1244} {"train_loss": -11.570150375366211, "global_step": 209021, "epoch": 1244} {"train_loss": -11.592941284179688, "global_step": 209022, "epoch": 1244} {"train_loss": -11.734848022460938, "global_step": 209023, "epoch": 1244} {"train_loss": -11.37550163269043, "global_step": 209024, "epoch": 1244} {"train_loss": -11.578245162963867, "global_step": 209025, "epoch": 1244} {"train_loss": -11.528658866882324, "global_step": 209026, "epoch": 1244} {"train_loss": -11.47601318359375, "global_step": 209027, "epoch": 1244} {"train_loss": -11.45090103149414, "global_step": 209028, "epoch": 1244} {"train_loss": -11.70541763305664, "global_step": 209029, "epoch": 1244} {"train_loss": -11.601335525512695, "global_step": 209030, "epoch": 1244} {"train_loss": -11.76094913482666, "global_step": 209031, "epoch": 1244} {"train_loss": -11.761398315429688, "global_step": 209032, "epoch": 1244} {"train_loss": -11.904481887817383, "global_step": 209033, "epoch": 1244} {"train_loss": -11.532169342041016, "global_step": 209034, "epoch": 1244} {"train_loss": -11.776223182678223, "global_step": 209035, "epoch": 1244} {"train_loss": -11.373401641845703, "global_step": 209036, "epoch": 1244} {"train_loss": -11.024066925048828, "global_step": 209037, "epoch": 1244} {"train_loss": -11.48943042755127, "global_step": 209038, "epoch": 1244} {"train_loss": -12.10003662109375, "global_step": 209039, "epoch": 1244} {"train_loss": -11.671514511108398, "global_step": 209040, "epoch": 1244} {"train_loss": -11.438729286193848, "global_step": 209041, "epoch": 1244} {"train_loss": -11.25110912322998, "global_step": 209042, "epoch": 1244} {"train_loss": -11.646964073181152, "global_step": 209043, "epoch": 1244} {"train_loss": -11.354738235473633, "global_step": 209044, "epoch": 1244} {"train_loss": -11.520708084106445, "global_step": 209045, "epoch": 1244} {"train_loss": -11.491376876831055, "global_step": 209046, "epoch": 1244} {"train_loss": -12.030269622802734, "global_step": 209047, "epoch": 1244} {"train_loss": -11.323354721069336, "global_step": 209048, "epoch": 1244} {"train_loss": -11.312314987182617, "global_step": 209049, "epoch": 1244} {"train_loss": -11.545337677001953, "global_step": 209050, "epoch": 1244} {"train_loss": -10.756895065307617, "global_step": 209051, "epoch": 1244} {"train_loss": -11.39067268371582, "global_step": 209052, "epoch": 1244} {"train_loss": -11.494178771972656, "global_step": 209053, "epoch": 1244} {"train_loss": -11.24665355682373, "global_step": 209054, "epoch": 1244} {"train_loss": -11.311357498168945, "global_step": 209055, "epoch": 1244} {"train_loss": -10.89466381072998, "global_step": 209056, "epoch": 1244} {"train_loss": -11.604515075683594, "global_step": 209057, "epoch": 1244} {"train_loss": -10.927899360656738, "global_step": 209058, "epoch": 1244} {"train_loss": -11.320323944091797, "global_step": 209059, "epoch": 1244} {"train_loss": -11.40062427520752, "global_step": 209060, "epoch": 1244} {"train_loss": -11.544038772583008, "global_step": 209061, "epoch": 1244} {"train_loss": -11.36734390258789, "global_step": 209062, "epoch": 1244} {"train_loss": -11.490339279174805, "global_step": 209063, "epoch": 1244} {"train_loss": -11.50244140625, "global_step": 209064, "epoch": 1244} {"train_loss": -11.574972152709961, "global_step": 209065, "epoch": 1244} {"train_loss": -11.546651840209961, "global_step": 209066, "epoch": 1244} {"train_loss": -11.534012794494629, "global_step": 209067, "epoch": 1244} {"train_loss": -11.470507621765137, "global_step": 209068, "epoch": 1244} {"train_loss": -11.622270584106445, "global_step": 209069, "epoch": 1244} {"train_loss": -11.650627136230469, "global_step": 209070, "epoch": 1244} {"train_loss": -11.703405380249023, "global_step": 209071, "epoch": 1244} {"train_loss": -11.586447715759277, "global_step": 209072, "epoch": 1244} {"train_loss": -11.130006790161133, "global_step": 209073, "epoch": 1244} {"train_loss": -11.439485549926758, "global_step": 209074, "epoch": 1244} {"train_loss": -11.366486549377441, "global_step": 209075, "epoch": 1244} {"train_loss": -11.079294204711914, "global_step": 209076, "epoch": 1244} {"train_loss": -10.699422836303711, "global_step": 209077, "epoch": 1244} {"train_loss": -10.542750358581543, "global_step": 209078, "epoch": 1244} {"train_loss": -10.371399879455566, "global_step": 209079, "epoch": 1244} {"train_loss": -9.31166934967041, "global_step": 209080, "epoch": 1244} {"train_loss": -10.917306900024414, "global_step": 209081, "epoch": 1244} {"train_loss": -7.884840965270996, "global_step": 209082, "epoch": 1244} {"train_loss": -8.811286926269531, "global_step": 209083, "epoch": 1244} {"train_loss": -10.588979721069336, "global_step": 209084, "epoch": 1244} {"train_loss": -8.818846702575684, "global_step": 209085, "epoch": 1244} {"train_loss": -8.980633735656738, "global_step": 209086, "epoch": 1244} {"train_loss": -8.897211074829102, "global_step": 209087, "epoch": 1244} {"train_loss": -10.658181190490723, "global_step": 209088, "epoch": 1244} {"train_loss": -9.206357955932617, "global_step": 209089, "epoch": 1244} {"train_loss": -10.628765106201172, "global_step": 209090, "epoch": 1244} {"train_loss": -10.467870712280273, "global_step": 209091, "epoch": 1244} {"train_loss": -11.045613288879395, "global_step": 209092, "epoch": 1244} {"train_loss": -10.329498291015625, "global_step": 209093, "epoch": 1244} {"train_loss": -10.650115013122559, "global_step": 209094, "epoch": 1244} {"train_loss": -10.465628623962402, "global_step": 209095, "epoch": 1244} {"train_loss": -10.644977569580078, "global_step": 209096, "epoch": 1244} {"train_loss": -10.676334381103516, "global_step": 209097, "epoch": 1244} {"train_loss": -10.638947486877441, "global_step": 209098, "epoch": 1244} {"train_loss": -10.833613395690918, "global_step": 209099, "epoch": 1244} {"train_loss": -11.225805282592773, "global_step": 209100, "epoch": 1244} {"train_loss": -10.940252304077148, "global_step": 209101, "epoch": 1244} {"train_loss": -11.399487495422363, "global_step": 209102, "epoch": 1244} {"train_loss": -11.032454490661621, "global_step": 209103, "epoch": 1244} {"train_loss": -11.198345184326172, "global_step": 209104, "epoch": 1244} {"train_loss": -11.327829360961914, "global_step": 209105, "epoch": 1244} {"train_loss": -11.313722610473633, "global_step": 209106, "epoch": 1244} {"train_loss": -11.291852951049805, "global_step": 209107, "epoch": 1244} {"train_loss": -11.264281272888184, "global_step": 209108, "epoch": 1244} {"train_loss": -11.135187149047852, "global_step": 209109, "epoch": 1244} {"train_loss": -11.094215393066406, "global_step": 209110, "epoch": 1244} {"train_loss": -11.219627380371094, "global_step": 209111, "epoch": 1244} {"train_loss": -11.423730850219727, "global_step": 209112, "epoch": 1244} {"train_loss": -11.466927528381348, "global_step": 209113, "epoch": 1244} {"train_loss": -11.107234954833984, "global_step": 209114, "epoch": 1244} {"train_loss": -11.446769714355469, "global_step": 209115, "epoch": 1244} {"train_loss": -11.321111679077148, "global_step": 209116, "epoch": 1244} {"train_loss": -11.307272911071777, "global_step": 209117, "epoch": 1244} {"train_loss": -11.52086353302002, "global_step": 209118, "epoch": 1244} {"train_loss": -11.241196632385254, "global_step": 209119, "epoch": 1244} {"train_loss": -11.38192367553711, "global_step": 209120, "epoch": 1244} {"train_loss": -11.490074157714844, "global_step": 209121, "epoch": 1244} {"train_loss": -11.313472747802734, "global_step": 209122, "epoch": 1244} {"train_loss": -11.436826705932617, "global_step": 209123, "epoch": 1244} {"train_loss": -11.642908096313477, "global_step": 209124, "epoch": 1244} {"train_loss": -11.439290046691895, "global_step": 209125, "epoch": 1244} {"train_loss": -11.542043685913086, "global_step": 209126, "epoch": 1244} {"train_loss": -11.794553756713867, "global_step": 209127, "epoch": 1244} {"train_loss": -11.464730262756348, "global_step": 209128, "epoch": 1244} {"train_loss": -11.586999893188477, "global_step": 209129, "epoch": 1244} {"train_loss": -11.461397171020508, "global_step": 209130, "epoch": 1244} {"train_loss": -11.566822052001953, "global_step": 209131, "epoch": 1244} {"train_loss": -11.621326446533203, "global_step": 209132, "epoch": 1244} {"train_loss": -11.587257385253906, "global_step": 209133, "epoch": 1244} {"train_loss": -11.823144912719727, "global_step": 209134, "epoch": 1244} {"train_loss": -11.720584869384766, "global_step": 209135, "epoch": 1244} {"train_loss": -11.634361267089844, "global_step": 209136, "epoch": 1244} {"train_loss": -11.610172271728516, "global_step": 209137, "epoch": 1244} {"train_loss": -11.757209777832031, "global_step": 209138, "epoch": 1244} {"train_loss": -11.708776473999023, "global_step": 209139, "epoch": 1244} {"train_loss": -11.60370922088623, "global_step": 209140, "epoch": 1244} {"train_loss": -11.72364330291748, "global_step": 209141, "epoch": 1244} {"train_loss": -11.74148941040039, "global_step": 209142, "epoch": 1244} {"train_loss": -11.635330200195312, "global_step": 209143, "epoch": 1244} {"train_loss": -11.673440933227539, "global_step": 209144, "epoch": 1244} {"train_loss": -11.696718215942383, "global_step": 209145, "epoch": 1244} {"train_loss": -11.596433639526367, "global_step": 209146, "epoch": 1244} {"train_loss": -11.858007431030273, "global_step": 209147, "epoch": 1244} {"train_loss": -11.66191291809082, "global_step": 209148, "epoch": 1244} {"train_loss": -11.702447891235352, "global_step": 209149, "epoch": 1244} {"train_loss": -11.86164379119873, "global_step": 209150, "epoch": 1244} {"train_loss": -11.217483520507812, "global_step": 209151, "epoch": 1244} {"train_loss": -11.768108367919922, "global_step": 209152, "epoch": 1244} {"train_loss": -11.439720153808594, "global_step": 209153, "epoch": 1244} {"train_loss": -11.560128211975098, "global_step": 209154, "epoch": 1244} {"train_loss": -11.231731414794922, "global_step": 209155, "epoch": 1244} {"train_loss": -11.702814102172852, "global_step": 209156, "epoch": 1244} {"train_loss": -11.707818984985352, "global_step": 209157, "epoch": 1244} {"train_loss": -11.723447799682617, "global_step": 209158, "epoch": 1244} {"train_loss": -11.319702523095268, "global_step": 209159, "epoch": 1244, "val_loss": 251894.125} {"train_loss": -11.672616958618164, "global_step": 209160, "epoch": 1245} {"train_loss": -10.992806434631348, "global_step": 209161, "epoch": 1245} {"train_loss": -11.355470657348633, "global_step": 209162, "epoch": 1245} {"train_loss": -10.985918998718262, "global_step": 209163, "epoch": 1245} {"train_loss": -11.106536865234375, "global_step": 209164, "epoch": 1245} {"train_loss": -11.118507385253906, "global_step": 209165, "epoch": 1245} {"train_loss": -11.727767944335938, "global_step": 209166, "epoch": 1245} {"train_loss": -10.816096305847168, "global_step": 209167, "epoch": 1245} {"train_loss": -11.377870559692383, "global_step": 209168, "epoch": 1245} {"train_loss": -10.787020683288574, "global_step": 209169, "epoch": 1245} {"train_loss": -11.580181121826172, "global_step": 209170, "epoch": 1245} {"train_loss": -11.411134719848633, "global_step": 209171, "epoch": 1245} {"train_loss": -11.414815902709961, "global_step": 209172, "epoch": 1245} {"train_loss": -11.273880004882812, "global_step": 209173, "epoch": 1245} {"train_loss": -11.603859901428223, "global_step": 209174, "epoch": 1245} {"train_loss": -11.117023468017578, "global_step": 209175, "epoch": 1245} {"train_loss": -10.955171585083008, "global_step": 209176, "epoch": 1245} {"train_loss": -11.490877151489258, "global_step": 209177, "epoch": 1245} {"train_loss": -11.315314292907715, "global_step": 209178, "epoch": 1245} {"train_loss": -11.109784126281738, "global_step": 209179, "epoch": 1245} {"train_loss": -11.435468673706055, "global_step": 209180, "epoch": 1245} {"train_loss": -11.55258846282959, "global_step": 209181, "epoch": 1245} {"train_loss": -11.202594757080078, "global_step": 209182, "epoch": 1245} {"train_loss": -11.714875221252441, "global_step": 209183, "epoch": 1245} {"train_loss": -11.020221710205078, "global_step": 209184, "epoch": 1245} {"train_loss": -11.038103103637695, "global_step": 209185, "epoch": 1245} {"train_loss": -11.770471572875977, "global_step": 209186, "epoch": 1245} {"train_loss": -11.418745040893555, "global_step": 209187, "epoch": 1245} {"train_loss": -11.468833923339844, "global_step": 209188, "epoch": 1245} {"train_loss": -10.546493530273438, "global_step": 209189, "epoch": 1245} {"train_loss": -11.226667404174805, "global_step": 209190, "epoch": 1245} {"train_loss": -10.838900566101074, "global_step": 209191, "epoch": 1245} {"train_loss": -11.230422973632812, "global_step": 209192, "epoch": 1245} {"train_loss": -11.153520584106445, "global_step": 209193, "epoch": 1245} {"train_loss": -9.99088191986084, "global_step": 209194, "epoch": 1245} {"train_loss": -11.605347633361816, "global_step": 209195, "epoch": 1245} {"train_loss": -10.61054801940918, "global_step": 209196, "epoch": 1245} {"train_loss": -10.542357444763184, "global_step": 209197, "epoch": 1245} {"train_loss": -10.908565521240234, "global_step": 209198, "epoch": 1245} {"train_loss": -10.4920072555542, "global_step": 209199, "epoch": 1245} {"train_loss": -10.629890441894531, "global_step": 209200, "epoch": 1245} {"train_loss": -10.148529052734375, "global_step": 209201, "epoch": 1245} {"train_loss": -11.045249938964844, "global_step": 209202, "epoch": 1245} {"train_loss": -10.379072189331055, "global_step": 209203, "epoch": 1245} {"train_loss": -10.815990447998047, "global_step": 209204, "epoch": 1245} {"train_loss": -10.770751953125, "global_step": 209205, "epoch": 1245} {"train_loss": -10.428009033203125, "global_step": 209206, "epoch": 1245} {"train_loss": -11.087774276733398, "global_step": 209207, "epoch": 1245} {"train_loss": -10.269543647766113, "global_step": 209208, "epoch": 1245} {"train_loss": -10.711854934692383, "global_step": 209209, "epoch": 1245} {"train_loss": -10.62086009979248, "global_step": 209210, "epoch": 1245} {"train_loss": -11.035423278808594, "global_step": 209211, "epoch": 1245} {"train_loss": -10.445999145507812, "global_step": 209212, "epoch": 1245} {"train_loss": -11.141311645507812, "global_step": 209213, "epoch": 1245} {"train_loss": -10.266786575317383, "global_step": 209214, "epoch": 1245} {"train_loss": -11.252433776855469, "global_step": 209215, "epoch": 1245} {"train_loss": -9.925493240356445, "global_step": 209216, "epoch": 1245} {"train_loss": -11.161334037780762, "global_step": 209217, "epoch": 1245} {"train_loss": -9.855766296386719, "global_step": 209218, "epoch": 1245} {"train_loss": -11.630622863769531, "global_step": 209219, "epoch": 1245} {"train_loss": -10.918132781982422, "global_step": 209220, "epoch": 1245} {"train_loss": -11.230218887329102, "global_step": 209221, "epoch": 1245} {"train_loss": -11.113153457641602, "global_step": 209222, "epoch": 1245} {"train_loss": -10.903995513916016, "global_step": 209223, "epoch": 1245} {"train_loss": -11.267086029052734, "global_step": 209224, "epoch": 1245} {"train_loss": -11.10374641418457, "global_step": 209225, "epoch": 1245} {"train_loss": -11.03033447265625, "global_step": 209226, "epoch": 1245} {"train_loss": -11.382916450500488, "global_step": 209227, "epoch": 1245} {"train_loss": -11.042274475097656, "global_step": 209228, "epoch": 1245} {"train_loss": -10.7628755569458, "global_step": 209229, "epoch": 1245} {"train_loss": -11.433486938476562, "global_step": 209230, "epoch": 1245} {"train_loss": -10.779932022094727, "global_step": 209231, "epoch": 1245} {"train_loss": -11.414396286010742, "global_step": 209232, "epoch": 1245} {"train_loss": -11.324349403381348, "global_step": 209233, "epoch": 1245} {"train_loss": -11.287620544433594, "global_step": 209234, "epoch": 1245} {"train_loss": -11.375387191772461, "global_step": 209235, "epoch": 1245} {"train_loss": -11.310869216918945, "global_step": 209236, "epoch": 1245} {"train_loss": -11.389537811279297, "global_step": 209237, "epoch": 1245} {"train_loss": -11.531473159790039, "global_step": 209238, "epoch": 1245} {"train_loss": -11.472774505615234, "global_step": 209239, "epoch": 1245} {"train_loss": -11.518354415893555, "global_step": 209240, "epoch": 1245} {"train_loss": -11.571942329406738, "global_step": 209241, "epoch": 1245} {"train_loss": -11.45423698425293, "global_step": 209242, "epoch": 1245} {"train_loss": -11.546415328979492, "global_step": 209243, "epoch": 1245} {"train_loss": -11.681228637695312, "global_step": 209244, "epoch": 1245} {"train_loss": -11.626774787902832, "global_step": 209245, "epoch": 1245} {"train_loss": -11.430042266845703, "global_step": 209246, "epoch": 1245} {"train_loss": -11.588033676147461, "global_step": 209247, "epoch": 1245} {"train_loss": -11.383131980895996, "global_step": 209248, "epoch": 1245} {"train_loss": -11.419632911682129, "global_step": 209249, "epoch": 1245} {"train_loss": -11.585865020751953, "global_step": 209250, "epoch": 1245} {"train_loss": -11.600547790527344, "global_step": 209251, "epoch": 1245} {"train_loss": -11.603857040405273, "global_step": 209252, "epoch": 1245} {"train_loss": -11.645208358764648, "global_step": 209253, "epoch": 1245} {"train_loss": -11.530248641967773, "global_step": 209254, "epoch": 1245} {"train_loss": -11.831361770629883, "global_step": 209255, "epoch": 1245} {"train_loss": -11.602090835571289, "global_step": 209256, "epoch": 1245} {"train_loss": -11.780341148376465, "global_step": 209257, "epoch": 1245} {"train_loss": -11.395469665527344, "global_step": 209258, "epoch": 1245} {"train_loss": -11.682794570922852, "global_step": 209259, "epoch": 1245} {"train_loss": -11.856108665466309, "global_step": 209260, "epoch": 1245} {"train_loss": -11.773842811584473, "global_step": 209261, "epoch": 1245} {"train_loss": -11.668144226074219, "global_step": 209262, "epoch": 1245} {"train_loss": -11.867050170898438, "global_step": 209263, "epoch": 1245} {"train_loss": -11.480432510375977, "global_step": 209264, "epoch": 1245} {"train_loss": -11.792552947998047, "global_step": 209265, "epoch": 1245} {"train_loss": -11.512386322021484, "global_step": 209266, "epoch": 1245} {"train_loss": -11.422032356262207, "global_step": 209267, "epoch": 1245} {"train_loss": -11.433774948120117, "global_step": 209268, "epoch": 1245} {"train_loss": -11.947013854980469, "global_step": 209269, "epoch": 1245} {"train_loss": -11.27541732788086, "global_step": 209270, "epoch": 1245} {"train_loss": -11.341316223144531, "global_step": 209271, "epoch": 1245} {"train_loss": -11.689584732055664, "global_step": 209272, "epoch": 1245} {"train_loss": -11.234195709228516, "global_step": 209273, "epoch": 1245} {"train_loss": -11.799040794372559, "global_step": 209274, "epoch": 1245} {"train_loss": -11.215243339538574, "global_step": 209275, "epoch": 1245} {"train_loss": -11.487664222717285, "global_step": 209276, "epoch": 1245} {"train_loss": -11.520519256591797, "global_step": 209277, "epoch": 1245} {"train_loss": -11.708769798278809, "global_step": 209278, "epoch": 1245} {"train_loss": -11.493246078491211, "global_step": 209279, "epoch": 1245} {"train_loss": -11.676152229309082, "global_step": 209280, "epoch": 1245} {"train_loss": -11.459522247314453, "global_step": 209281, "epoch": 1245} {"train_loss": -10.840310096740723, "global_step": 209282, "epoch": 1245} {"train_loss": -11.407541275024414, "global_step": 209283, "epoch": 1245} {"train_loss": -10.560676574707031, "global_step": 209284, "epoch": 1245} {"train_loss": -9.45086669921875, "global_step": 209285, "epoch": 1245} {"train_loss": -9.02049446105957, "global_step": 209286, "epoch": 1245} {"train_loss": -10.888593673706055, "global_step": 209287, "epoch": 1245} {"train_loss": -9.655672073364258, "global_step": 209288, "epoch": 1245} {"train_loss": -10.165189743041992, "global_step": 209289, "epoch": 1245} {"train_loss": -9.490554809570312, "global_step": 209290, "epoch": 1245} {"train_loss": -9.359245300292969, "global_step": 209291, "epoch": 1245} {"train_loss": -9.45716381072998, "global_step": 209292, "epoch": 1245} {"train_loss": -10.046036720275879, "global_step": 209293, "epoch": 1245} {"train_loss": -10.219951629638672, "global_step": 209294, "epoch": 1245} {"train_loss": -10.093755722045898, "global_step": 209295, "epoch": 1245} {"train_loss": -10.3092041015625, "global_step": 209296, "epoch": 1245} {"train_loss": -9.900520324707031, "global_step": 209297, "epoch": 1245} {"train_loss": -11.045770645141602, "global_step": 209298, "epoch": 1245} {"train_loss": -10.93724250793457, "global_step": 209299, "epoch": 1245} {"train_loss": -10.87844181060791, "global_step": 209300, "epoch": 1245} {"train_loss": -11.264636039733887, "global_step": 209301, "epoch": 1245} {"train_loss": -10.691336631774902, "global_step": 209302, "epoch": 1245} {"train_loss": -11.182267189025879, "global_step": 209303, "epoch": 1245} {"train_loss": -10.878135681152344, "global_step": 209304, "epoch": 1245} {"train_loss": -10.910341262817383, "global_step": 209305, "epoch": 1245} {"train_loss": -11.011054039001465, "global_step": 209306, "epoch": 1245} {"train_loss": -10.936243057250977, "global_step": 209307, "epoch": 1245} {"train_loss": -11.094291687011719, "global_step": 209308, "epoch": 1245} {"train_loss": -11.112431526184082, "global_step": 209309, "epoch": 1245} {"train_loss": -11.214241981506348, "global_step": 209310, "epoch": 1245} {"train_loss": -11.132267951965332, "global_step": 209311, "epoch": 1245} {"train_loss": -11.010534286499023, "global_step": 209312, "epoch": 1245} {"train_loss": -11.047872543334961, "global_step": 209313, "epoch": 1245} {"train_loss": -11.240921020507812, "global_step": 209314, "epoch": 1245} {"train_loss": -11.082694053649902, "global_step": 209315, "epoch": 1245} {"train_loss": -11.246962547302246, "global_step": 209316, "epoch": 1245} {"train_loss": -11.243162155151367, "global_step": 209317, "epoch": 1245} {"train_loss": -11.188714981079102, "global_step": 209318, "epoch": 1245} {"train_loss": -11.233322143554688, "global_step": 209319, "epoch": 1245} {"train_loss": -11.235589981079102, "global_step": 209320, "epoch": 1245} {"train_loss": -11.298727989196777, "global_step": 209321, "epoch": 1245} {"train_loss": -11.445178985595703, "global_step": 209322, "epoch": 1245} {"train_loss": -11.274932861328125, "global_step": 209323, "epoch": 1245} {"train_loss": -11.22452163696289, "global_step": 209324, "epoch": 1245} {"train_loss": -11.288362503051758, "global_step": 209325, "epoch": 1245} {"train_loss": -11.698763847351074, "global_step": 209326, "epoch": 1245} {"train_loss": -11.107003558249701, "global_step": 209327, "epoch": 1245, "val_loss": 254353.515625, "train_action_mse_error": 1.463958740234375} {"train_loss": -11.447633743286133, "global_step": 209328, "epoch": 1246} {"train_loss": -11.25716781616211, "global_step": 209329, "epoch": 1246} {"train_loss": -11.09967041015625, "global_step": 209330, "epoch": 1246} {"train_loss": -11.558130264282227, "global_step": 209331, "epoch": 1246} {"train_loss": -11.29974365234375, "global_step": 209332, "epoch": 1246} {"train_loss": -11.538288116455078, "global_step": 209333, "epoch": 1246} {"train_loss": -11.676216125488281, "global_step": 209334, "epoch": 1246} {"train_loss": -11.409464836120605, "global_step": 209335, "epoch": 1246} {"train_loss": -11.499601364135742, "global_step": 209336, "epoch": 1246} {"train_loss": -11.2774658203125, "global_step": 209337, "epoch": 1246} {"train_loss": -11.665336608886719, "global_step": 209338, "epoch": 1246} {"train_loss": -11.5980224609375, "global_step": 209339, "epoch": 1246} {"train_loss": -11.428787231445312, "global_step": 209340, "epoch": 1246} {"train_loss": -11.805988311767578, "global_step": 209341, "epoch": 1246} {"train_loss": -11.469419479370117, "global_step": 209342, "epoch": 1246} {"train_loss": -11.634263038635254, "global_step": 209343, "epoch": 1246} {"train_loss": -11.759671211242676, "global_step": 209344, "epoch": 1246} {"train_loss": -11.656960487365723, "global_step": 209345, "epoch": 1246} {"train_loss": -11.66360855102539, "global_step": 209346, "epoch": 1246} {"train_loss": -11.495121002197266, "global_step": 209347, "epoch": 1246} {"train_loss": -11.707942962646484, "global_step": 209348, "epoch": 1246} {"train_loss": -11.634418487548828, "global_step": 209349, "epoch": 1246} {"train_loss": -11.793024063110352, "global_step": 209350, "epoch": 1246} {"train_loss": -11.662887573242188, "global_step": 209351, "epoch": 1246} {"train_loss": -11.51298713684082, "global_step": 209352, "epoch": 1246} {"train_loss": -11.72003173828125, "global_step": 209353, "epoch": 1246} {"train_loss": -11.63279914855957, "global_step": 209354, "epoch": 1246} {"train_loss": -11.626585960388184, "global_step": 209355, "epoch": 1246} {"train_loss": -11.82144832611084, "global_step": 209356, "epoch": 1246} {"train_loss": -11.394079208374023, "global_step": 209357, "epoch": 1246} {"train_loss": -11.677846908569336, "global_step": 209358, "epoch": 1246} {"train_loss": -11.592559814453125, "global_step": 209359, "epoch": 1246} {"train_loss": -11.405006408691406, "global_step": 209360, "epoch": 1246} {"train_loss": -11.602729797363281, "global_step": 209361, "epoch": 1246} {"train_loss": -11.247200965881348, "global_step": 209362, "epoch": 1246} {"train_loss": -11.68303108215332, "global_step": 209363, "epoch": 1246} {"train_loss": -11.414721488952637, "global_step": 209364, "epoch": 1246} {"train_loss": -10.275250434875488, "global_step": 209365, "epoch": 1246} {"train_loss": -11.368997573852539, "global_step": 209366, "epoch": 1246} {"train_loss": -11.316329956054688, "global_step": 209367, "epoch": 1246} {"train_loss": -10.756315231323242, "global_step": 209368, "epoch": 1246} {"train_loss": -10.686861991882324, "global_step": 209369, "epoch": 1246} {"train_loss": -11.00796890258789, "global_step": 209370, "epoch": 1246} {"train_loss": -10.908387184143066, "global_step": 209371, "epoch": 1246} {"train_loss": -10.740800857543945, "global_step": 209372, "epoch": 1246} {"train_loss": -11.265422821044922, "global_step": 209373, "epoch": 1246} {"train_loss": -10.782733917236328, "global_step": 209374, "epoch": 1246} {"train_loss": -10.88316822052002, "global_step": 209375, "epoch": 1246} {"train_loss": -10.396130561828613, "global_step": 209376, "epoch": 1246} {"train_loss": -9.588732719421387, "global_step": 209377, "epoch": 1246} {"train_loss": -10.27855110168457, "global_step": 209378, "epoch": 1246} {"train_loss": -11.140800476074219, "global_step": 209379, "epoch": 1246} {"train_loss": -9.37689208984375, "global_step": 209380, "epoch": 1246} {"train_loss": -10.948211669921875, "global_step": 209381, "epoch": 1246} {"train_loss": -10.08812141418457, "global_step": 209382, "epoch": 1246} {"train_loss": -10.567460060119629, "global_step": 209383, "epoch": 1246} {"train_loss": -10.918203353881836, "global_step": 209384, "epoch": 1246} {"train_loss": -10.564552307128906, "global_step": 209385, "epoch": 1246} {"train_loss": -10.970431327819824, "global_step": 209386, "epoch": 1246} {"train_loss": -11.092206001281738, "global_step": 209387, "epoch": 1246} {"train_loss": -10.276230812072754, "global_step": 209388, "epoch": 1246} {"train_loss": -11.048103332519531, "global_step": 209389, "epoch": 1246} {"train_loss": -10.873136520385742, "global_step": 209390, "epoch": 1246} {"train_loss": -10.979761123657227, "global_step": 209391, "epoch": 1246} {"train_loss": -11.27650260925293, "global_step": 209392, "epoch": 1246} {"train_loss": -11.19459056854248, "global_step": 209393, "epoch": 1246} {"train_loss": -11.076902389526367, "global_step": 209394, "epoch": 1246} {"train_loss": -11.262371063232422, "global_step": 209395, "epoch": 1246} {"train_loss": -11.147858619689941, "global_step": 209396, "epoch": 1246} {"train_loss": -11.354771614074707, "global_step": 209397, "epoch": 1246} {"train_loss": -11.074728965759277, "global_step": 209398, "epoch": 1246} {"train_loss": -11.386014938354492, "global_step": 209399, "epoch": 1246} {"train_loss": -11.07097339630127, "global_step": 209400, "epoch": 1246} {"train_loss": -11.512472152709961, "global_step": 209401, "epoch": 1246} {"train_loss": -11.194873809814453, "global_step": 209402, "epoch": 1246} {"train_loss": -11.349003791809082, "global_step": 209403, "epoch": 1246} {"train_loss": -11.078441619873047, "global_step": 209404, "epoch": 1246} {"train_loss": -11.301440238952637, "global_step": 209405, "epoch": 1246} {"train_loss": -10.947935104370117, "global_step": 209406, "epoch": 1246} {"train_loss": -11.330570220947266, "global_step": 209407, "epoch": 1246} {"train_loss": -10.716046333312988, "global_step": 209408, "epoch": 1246} {"train_loss": -11.607181549072266, "global_step": 209409, "epoch": 1246} {"train_loss": -11.110662460327148, "global_step": 209410, "epoch": 1246} {"train_loss": -11.15517520904541, "global_step": 209411, "epoch": 1246} {"train_loss": -11.376134872436523, "global_step": 209412, "epoch": 1246} {"train_loss": -11.079870223999023, "global_step": 209413, "epoch": 1246} {"train_loss": -11.227027893066406, "global_step": 209414, "epoch": 1246} {"train_loss": -11.2437162399292, "global_step": 209415, "epoch": 1246} {"train_loss": -11.49742317199707, "global_step": 209416, "epoch": 1246} {"train_loss": -10.991488456726074, "global_step": 209417, "epoch": 1246} {"train_loss": -11.422834396362305, "global_step": 209418, "epoch": 1246} {"train_loss": -11.062015533447266, "global_step": 209419, "epoch": 1246} {"train_loss": -11.094091415405273, "global_step": 209420, "epoch": 1246} {"train_loss": -11.24306869506836, "global_step": 209421, "epoch": 1246} {"train_loss": -11.23112678527832, "global_step": 209422, "epoch": 1246} {"train_loss": -11.604840278625488, "global_step": 209423, "epoch": 1246} {"train_loss": -11.425939559936523, "global_step": 209424, "epoch": 1246} {"train_loss": -11.626423835754395, "global_step": 209425, "epoch": 1246} {"train_loss": -11.264963150024414, "global_step": 209426, "epoch": 1246} {"train_loss": -11.52885627746582, "global_step": 209427, "epoch": 1246} {"train_loss": -11.57621955871582, "global_step": 209428, "epoch": 1246} {"train_loss": -11.380786895751953, "global_step": 209429, "epoch": 1246} {"train_loss": -11.594807624816895, "global_step": 209430, "epoch": 1246} {"train_loss": -11.358234405517578, "global_step": 209431, "epoch": 1246} {"train_loss": -11.74599838256836, "global_step": 209432, "epoch": 1246} {"train_loss": -11.47242546081543, "global_step": 209433, "epoch": 1246} {"train_loss": -11.466821670532227, "global_step": 209434, "epoch": 1246} {"train_loss": -11.791923522949219, "global_step": 209435, "epoch": 1246} {"train_loss": -11.436925888061523, "global_step": 209436, "epoch": 1246} {"train_loss": -11.827064514160156, "global_step": 209437, "epoch": 1246} {"train_loss": -11.903457641601562, "global_step": 209438, "epoch": 1246} {"train_loss": -11.690580368041992, "global_step": 209439, "epoch": 1246} {"train_loss": -11.81706714630127, "global_step": 209440, "epoch": 1246} {"train_loss": -11.582894325256348, "global_step": 209441, "epoch": 1246} {"train_loss": -11.784309387207031, "global_step": 209442, "epoch": 1246} {"train_loss": -11.545817375183105, "global_step": 209443, "epoch": 1246} {"train_loss": -11.699016571044922, "global_step": 209444, "epoch": 1246} {"train_loss": -11.51919174194336, "global_step": 209445, "epoch": 1246} {"train_loss": -11.386115074157715, "global_step": 209446, "epoch": 1246} {"train_loss": -11.708292007446289, "global_step": 209447, "epoch": 1246} {"train_loss": -11.666215896606445, "global_step": 209448, "epoch": 1246} {"train_loss": -11.507681846618652, "global_step": 209449, "epoch": 1246} {"train_loss": -11.831666946411133, "global_step": 209450, "epoch": 1246} {"train_loss": -11.81818962097168, "global_step": 209451, "epoch": 1246} {"train_loss": -11.834844589233398, "global_step": 209452, "epoch": 1246} {"train_loss": -11.714086532592773, "global_step": 209453, "epoch": 1246} {"train_loss": -11.785545349121094, "global_step": 209454, "epoch": 1246} {"train_loss": -11.623311996459961, "global_step": 209455, "epoch": 1246} {"train_loss": -11.57111644744873, "global_step": 209456, "epoch": 1246} {"train_loss": -11.19918155670166, "global_step": 209457, "epoch": 1246} {"train_loss": -11.696603775024414, "global_step": 209458, "epoch": 1246} {"train_loss": -11.332253456115723, "global_step": 209459, "epoch": 1246} {"train_loss": -11.225974082946777, "global_step": 209460, "epoch": 1246} {"train_loss": -11.601367950439453, "global_step": 209461, "epoch": 1246} {"train_loss": -11.85040283203125, "global_step": 209462, "epoch": 1246} {"train_loss": -11.306619644165039, "global_step": 209463, "epoch": 1246} {"train_loss": -11.576883316040039, "global_step": 209464, "epoch": 1246} {"train_loss": -11.776203155517578, "global_step": 209465, "epoch": 1246} {"train_loss": -11.531776428222656, "global_step": 209466, "epoch": 1246} {"train_loss": -11.474884033203125, "global_step": 209467, "epoch": 1246} {"train_loss": -10.661121368408203, "global_step": 209468, "epoch": 1246} {"train_loss": -9.724637031555176, "global_step": 209469, "epoch": 1246} {"train_loss": -11.333223342895508, "global_step": 209470, "epoch": 1246} {"train_loss": -10.966835975646973, "global_step": 209471, "epoch": 1246} {"train_loss": -10.433069229125977, "global_step": 209472, "epoch": 1246} {"train_loss": -10.996274948120117, "global_step": 209473, "epoch": 1246} {"train_loss": -10.826168060302734, "global_step": 209474, "epoch": 1246} {"train_loss": -10.443323135375977, "global_step": 209475, "epoch": 1246} {"train_loss": -11.336758613586426, "global_step": 209476, "epoch": 1246} {"train_loss": -10.912178039550781, "global_step": 209477, "epoch": 1246} {"train_loss": -11.295228958129883, "global_step": 209478, "epoch": 1246} {"train_loss": -11.404596328735352, "global_step": 209479, "epoch": 1246} {"train_loss": -11.327557563781738, "global_step": 209480, "epoch": 1246} {"train_loss": -11.239233016967773, "global_step": 209481, "epoch": 1246} {"train_loss": -11.322257041931152, "global_step": 209482, "epoch": 1246} {"train_loss": -10.806726455688477, "global_step": 209483, "epoch": 1246} {"train_loss": -11.558788299560547, "global_step": 209484, "epoch": 1246} {"train_loss": -11.343221664428711, "global_step": 209485, "epoch": 1246} {"train_loss": -10.928074836730957, "global_step": 209486, "epoch": 1246} {"train_loss": -11.526460647583008, "global_step": 209487, "epoch": 1246} {"train_loss": -11.166071891784668, "global_step": 209488, "epoch": 1246} {"train_loss": -11.170333862304688, "global_step": 209489, "epoch": 1246} {"train_loss": -11.565977096557617, "global_step": 209490, "epoch": 1246} {"train_loss": -10.535186767578125, "global_step": 209491, "epoch": 1246} {"train_loss": -11.319986343383789, "global_step": 209492, "epoch": 1246} {"train_loss": -11.301868438720703, "global_step": 209493, "epoch": 1246} {"train_loss": -11.113826751708984, "global_step": 209494, "epoch": 1246} {"train_loss": -11.284157730284191, "global_step": 209495, "epoch": 1246, "val_loss": 254474.609375} {"train_loss": -11.097166061401367, "global_step": 209496, "epoch": 1247} {"train_loss": -11.418196678161621, "global_step": 209497, "epoch": 1247} {"train_loss": -11.057616233825684, "global_step": 209498, "epoch": 1247} {"train_loss": -11.319086074829102, "global_step": 209499, "epoch": 1247} {"train_loss": -11.34799861907959, "global_step": 209500, "epoch": 1247} {"train_loss": -11.513246536254883, "global_step": 209501, "epoch": 1247} {"train_loss": -11.662002563476562, "global_step": 209502, "epoch": 1247} {"train_loss": -11.421639442443848, "global_step": 209503, "epoch": 1247} {"train_loss": -11.563501358032227, "global_step": 209504, "epoch": 1247} {"train_loss": -11.484867095947266, "global_step": 209505, "epoch": 1247} {"train_loss": -11.504768371582031, "global_step": 209506, "epoch": 1247} {"train_loss": -11.516716003417969, "global_step": 209507, "epoch": 1247} {"train_loss": -11.175046920776367, "global_step": 209508, "epoch": 1247} {"train_loss": -11.611244201660156, "global_step": 209509, "epoch": 1247} {"train_loss": -11.362693786621094, "global_step": 209510, "epoch": 1247} {"train_loss": -11.150724411010742, "global_step": 209511, "epoch": 1247} {"train_loss": -11.446533203125, "global_step": 209512, "epoch": 1247} {"train_loss": -11.436590194702148, "global_step": 209513, "epoch": 1247} {"train_loss": -11.638359069824219, "global_step": 209514, "epoch": 1247} {"train_loss": -11.210610389709473, "global_step": 209515, "epoch": 1247} {"train_loss": -11.810981750488281, "global_step": 209516, "epoch": 1247} {"train_loss": -11.619943618774414, "global_step": 209517, "epoch": 1247} {"train_loss": -11.484742164611816, "global_step": 209518, "epoch": 1247} {"train_loss": -11.657135963439941, "global_step": 209519, "epoch": 1247} {"train_loss": -11.213077545166016, "global_step": 209520, "epoch": 1247} {"train_loss": -11.854165077209473, "global_step": 209521, "epoch": 1247} {"train_loss": -11.2354097366333, "global_step": 209522, "epoch": 1247} {"train_loss": -11.602052688598633, "global_step": 209523, "epoch": 1247} {"train_loss": -11.669535636901855, "global_step": 209524, "epoch": 1247} {"train_loss": -11.654365539550781, "global_step": 209525, "epoch": 1247} {"train_loss": -11.372356414794922, "global_step": 209526, "epoch": 1247} {"train_loss": -11.598215103149414, "global_step": 209527, "epoch": 1247} {"train_loss": -11.418774604797363, "global_step": 209528, "epoch": 1247} {"train_loss": -11.59201431274414, "global_step": 209529, "epoch": 1247} {"train_loss": -11.575740814208984, "global_step": 209530, "epoch": 1247} {"train_loss": -11.350065231323242, "global_step": 209531, "epoch": 1247} {"train_loss": -11.501180648803711, "global_step": 209532, "epoch": 1247} {"train_loss": -11.360163688659668, "global_step": 209533, "epoch": 1247} {"train_loss": -11.510680198669434, "global_step": 209534, "epoch": 1247} {"train_loss": -11.352535247802734, "global_step": 209535, "epoch": 1247} {"train_loss": -11.762471199035645, "global_step": 209536, "epoch": 1247} {"train_loss": -11.393329620361328, "global_step": 209537, "epoch": 1247} {"train_loss": -11.466714859008789, "global_step": 209538, "epoch": 1247} {"train_loss": -11.91453742980957, "global_step": 209539, "epoch": 1247} {"train_loss": -11.217401504516602, "global_step": 209540, "epoch": 1247} {"train_loss": -11.758228302001953, "global_step": 209541, "epoch": 1247} {"train_loss": -11.511866569519043, "global_step": 209542, "epoch": 1247} {"train_loss": -11.479063034057617, "global_step": 209543, "epoch": 1247} {"train_loss": -11.64805793762207, "global_step": 209544, "epoch": 1247} {"train_loss": -11.331904411315918, "global_step": 209545, "epoch": 1247} {"train_loss": -11.739864349365234, "global_step": 209546, "epoch": 1247} {"train_loss": -11.649991989135742, "global_step": 209547, "epoch": 1247} {"train_loss": -11.336790084838867, "global_step": 209548, "epoch": 1247} {"train_loss": -11.607246398925781, "global_step": 209549, "epoch": 1247} {"train_loss": -11.143671989440918, "global_step": 209550, "epoch": 1247} {"train_loss": -11.17684555053711, "global_step": 209551, "epoch": 1247} {"train_loss": -11.500020980834961, "global_step": 209552, "epoch": 1247} {"train_loss": -10.995193481445312, "global_step": 209553, "epoch": 1247} {"train_loss": -11.599204063415527, "global_step": 209554, "epoch": 1247} {"train_loss": -11.511062622070312, "global_step": 209555, "epoch": 1247} {"train_loss": -11.611946105957031, "global_step": 209556, "epoch": 1247} {"train_loss": -11.163413047790527, "global_step": 209557, "epoch": 1247} {"train_loss": -11.50014877319336, "global_step": 209558, "epoch": 1247} {"train_loss": -11.086172103881836, "global_step": 209559, "epoch": 1247} {"train_loss": -11.365213394165039, "global_step": 209560, "epoch": 1247} {"train_loss": -11.630941390991211, "global_step": 209561, "epoch": 1247} {"train_loss": -11.23216438293457, "global_step": 209562, "epoch": 1247} {"train_loss": -11.340888977050781, "global_step": 209563, "epoch": 1247} {"train_loss": -10.954336166381836, "global_step": 209564, "epoch": 1247} {"train_loss": -11.308294296264648, "global_step": 209565, "epoch": 1247} {"train_loss": -11.235233306884766, "global_step": 209566, "epoch": 1247} {"train_loss": -11.406282424926758, "global_step": 209567, "epoch": 1247} {"train_loss": -10.964288711547852, "global_step": 209568, "epoch": 1247} {"train_loss": -11.545907974243164, "global_step": 209569, "epoch": 1247} {"train_loss": -11.147743225097656, "global_step": 209570, "epoch": 1247} {"train_loss": -11.709016799926758, "global_step": 209571, "epoch": 1247} {"train_loss": -11.493999481201172, "global_step": 209572, "epoch": 1247} {"train_loss": -11.154714584350586, "global_step": 209573, "epoch": 1247} {"train_loss": -11.52101993560791, "global_step": 209574, "epoch": 1247} {"train_loss": -11.347373962402344, "global_step": 209575, "epoch": 1247} {"train_loss": -11.3863525390625, "global_step": 209576, "epoch": 1247} {"train_loss": -11.789913177490234, "global_step": 209577, "epoch": 1247} {"train_loss": -11.787795066833496, "global_step": 209578, "epoch": 1247} {"train_loss": -11.790739059448242, "global_step": 209579, "epoch": 1247} {"train_loss": -11.691299438476562, "global_step": 209580, "epoch": 1247} {"train_loss": -11.71304702758789, "global_step": 209581, "epoch": 1247} {"train_loss": -11.802528381347656, "global_step": 209582, "epoch": 1247} {"train_loss": -11.521285057067871, "global_step": 209583, "epoch": 1247} {"train_loss": -11.778375625610352, "global_step": 209584, "epoch": 1247} {"train_loss": -11.745403289794922, "global_step": 209585, "epoch": 1247} {"train_loss": -11.741442680358887, "global_step": 209586, "epoch": 1247} {"train_loss": -11.878402709960938, "global_step": 209587, "epoch": 1247} {"train_loss": -11.684815406799316, "global_step": 209588, "epoch": 1247} {"train_loss": -11.758964538574219, "global_step": 209589, "epoch": 1247} {"train_loss": -11.921056747436523, "global_step": 209590, "epoch": 1247} {"train_loss": -11.841032028198242, "global_step": 209591, "epoch": 1247} {"train_loss": -11.755559921264648, "global_step": 209592, "epoch": 1247} {"train_loss": -11.877223014831543, "global_step": 209593, "epoch": 1247} {"train_loss": -11.488117218017578, "global_step": 209594, "epoch": 1247} {"train_loss": -11.181474685668945, "global_step": 209595, "epoch": 1247} {"train_loss": -11.354106903076172, "global_step": 209596, "epoch": 1247} {"train_loss": -11.652976036071777, "global_step": 209597, "epoch": 1247} {"train_loss": -10.551322937011719, "global_step": 209598, "epoch": 1247} {"train_loss": -11.263505935668945, "global_step": 209599, "epoch": 1247} {"train_loss": -11.797138214111328, "global_step": 209600, "epoch": 1247} {"train_loss": -11.642902374267578, "global_step": 209601, "epoch": 1247} {"train_loss": -11.418188095092773, "global_step": 209602, "epoch": 1247} {"train_loss": -11.858699798583984, "global_step": 209603, "epoch": 1247} {"train_loss": -11.386558532714844, "global_step": 209604, "epoch": 1247} {"train_loss": -10.858145713806152, "global_step": 209605, "epoch": 1247} {"train_loss": -11.20954704284668, "global_step": 209606, "epoch": 1247} {"train_loss": -11.724019050598145, "global_step": 209607, "epoch": 1247} {"train_loss": -11.509300231933594, "global_step": 209608, "epoch": 1247} {"train_loss": -11.652502059936523, "global_step": 209609, "epoch": 1247} {"train_loss": -11.47951602935791, "global_step": 209610, "epoch": 1247} {"train_loss": -11.656721115112305, "global_step": 209611, "epoch": 1247} {"train_loss": -11.023298263549805, "global_step": 209612, "epoch": 1247} {"train_loss": -11.651618957519531, "global_step": 209613, "epoch": 1247} {"train_loss": -11.092336654663086, "global_step": 209614, "epoch": 1247} {"train_loss": -10.691747665405273, "global_step": 209615, "epoch": 1247} {"train_loss": -11.16719913482666, "global_step": 209616, "epoch": 1247} {"train_loss": -10.931282043457031, "global_step": 209617, "epoch": 1247} {"train_loss": -10.648263931274414, "global_step": 209618, "epoch": 1247} {"train_loss": -11.138954162597656, "global_step": 209619, "epoch": 1247} {"train_loss": -10.647254943847656, "global_step": 209620, "epoch": 1247} {"train_loss": -11.366079330444336, "global_step": 209621, "epoch": 1247} {"train_loss": -11.02334976196289, "global_step": 209622, "epoch": 1247} {"train_loss": -11.477824211120605, "global_step": 209623, "epoch": 1247} {"train_loss": -10.737907409667969, "global_step": 209624, "epoch": 1247} {"train_loss": -11.492409706115723, "global_step": 209625, "epoch": 1247} {"train_loss": -10.97668170928955, "global_step": 209626, "epoch": 1247} {"train_loss": -11.665961265563965, "global_step": 209627, "epoch": 1247} {"train_loss": -11.045967102050781, "global_step": 209628, "epoch": 1247} {"train_loss": -11.078339576721191, "global_step": 209629, "epoch": 1247} {"train_loss": -11.192022323608398, "global_step": 209630, "epoch": 1247} {"train_loss": -11.485358238220215, "global_step": 209631, "epoch": 1247} {"train_loss": -11.034509658813477, "global_step": 209632, "epoch": 1247} {"train_loss": -10.979930877685547, "global_step": 209633, "epoch": 1247} {"train_loss": -11.200681686401367, "global_step": 209634, "epoch": 1247} {"train_loss": -11.395176887512207, "global_step": 209635, "epoch": 1247} {"train_loss": -11.591853141784668, "global_step": 209636, "epoch": 1247} {"train_loss": -11.14828109741211, "global_step": 209637, "epoch": 1247} {"train_loss": -11.739202499389648, "global_step": 209638, "epoch": 1247} {"train_loss": -11.364249229431152, "global_step": 209639, "epoch": 1247} {"train_loss": -11.205309867858887, "global_step": 209640, "epoch": 1247} {"train_loss": -11.620607376098633, "global_step": 209641, "epoch": 1247} {"train_loss": -11.212553024291992, "global_step": 209642, "epoch": 1247} {"train_loss": -11.671710014343262, "global_step": 209643, "epoch": 1247} {"train_loss": -11.599811553955078, "global_step": 209644, "epoch": 1247} {"train_loss": -11.49846076965332, "global_step": 209645, "epoch": 1247} {"train_loss": -11.230367660522461, "global_step": 209646, "epoch": 1247} {"train_loss": -11.682485580444336, "global_step": 209647, "epoch": 1247} {"train_loss": -11.554719924926758, "global_step": 209648, "epoch": 1247} {"train_loss": -11.708967208862305, "global_step": 209649, "epoch": 1247} {"train_loss": -11.61742877960205, "global_step": 209650, "epoch": 1247} {"train_loss": -11.659671783447266, "global_step": 209651, "epoch": 1247} {"train_loss": -11.87473201751709, "global_step": 209652, "epoch": 1247} {"train_loss": -11.685946464538574, "global_step": 209653, "epoch": 1247} {"train_loss": -11.618976593017578, "global_step": 209654, "epoch": 1247} {"train_loss": -11.439848899841309, "global_step": 209655, "epoch": 1247} {"train_loss": -11.674622535705566, "global_step": 209656, "epoch": 1247} {"train_loss": -11.64937973022461, "global_step": 209657, "epoch": 1247} {"train_loss": -11.686674118041992, "global_step": 209658, "epoch": 1247} {"train_loss": -11.361616134643555, "global_step": 209659, "epoch": 1247} {"train_loss": -11.543094635009766, "global_step": 209660, "epoch": 1247} {"train_loss": -11.453572273254395, "global_step": 209661, "epoch": 1247} {"train_loss": -11.533658027648926, "global_step": 209662, "epoch": 1247} {"train_loss": -11.443519825027103, "global_step": 209663, "epoch": 1247, "val_loss": 258007.375} {"train_loss": -11.868377685546875, "global_step": 209664, "epoch": 1248} {"train_loss": -11.486571311950684, "global_step": 209665, "epoch": 1248} {"train_loss": -11.190919876098633, "global_step": 209666, "epoch": 1248} {"train_loss": -11.05821418762207, "global_step": 209667, "epoch": 1248} {"train_loss": -11.417462348937988, "global_step": 209668, "epoch": 1248} {"train_loss": -9.761431694030762, "global_step": 209669, "epoch": 1248} {"train_loss": -11.144630432128906, "global_step": 209670, "epoch": 1248} {"train_loss": -11.601557731628418, "global_step": 209671, "epoch": 1248} {"train_loss": -11.125968933105469, "global_step": 209672, "epoch": 1248} {"train_loss": -11.544998168945312, "global_step": 209673, "epoch": 1248} {"train_loss": -11.205974578857422, "global_step": 209674, "epoch": 1248} {"train_loss": -10.988382339477539, "global_step": 209675, "epoch": 1248} {"train_loss": -11.577470779418945, "global_step": 209676, "epoch": 1248} {"train_loss": -11.526768684387207, "global_step": 209677, "epoch": 1248} {"train_loss": -11.210777282714844, "global_step": 209678, "epoch": 1248} {"train_loss": -11.364453315734863, "global_step": 209679, "epoch": 1248} {"train_loss": -11.522768020629883, "global_step": 209680, "epoch": 1248} {"train_loss": -11.373632431030273, "global_step": 209681, "epoch": 1248} {"train_loss": -11.442609786987305, "global_step": 209682, "epoch": 1248} {"train_loss": -11.70724868774414, "global_step": 209683, "epoch": 1248} {"train_loss": -10.898075103759766, "global_step": 209684, "epoch": 1248} {"train_loss": -11.081521034240723, "global_step": 209685, "epoch": 1248} {"train_loss": -11.312167167663574, "global_step": 209686, "epoch": 1248} {"train_loss": -11.301958084106445, "global_step": 209687, "epoch": 1248} {"train_loss": -11.250240325927734, "global_step": 209688, "epoch": 1248} {"train_loss": -11.272948265075684, "global_step": 209689, "epoch": 1248} {"train_loss": -11.525201797485352, "global_step": 209690, "epoch": 1248} {"train_loss": -10.809654235839844, "global_step": 209691, "epoch": 1248} {"train_loss": -11.357686996459961, "global_step": 209692, "epoch": 1248} {"train_loss": -11.300800323486328, "global_step": 209693, "epoch": 1248} {"train_loss": -10.882553100585938, "global_step": 209694, "epoch": 1248} {"train_loss": -11.543964385986328, "global_step": 209695, "epoch": 1248} {"train_loss": -11.212773323059082, "global_step": 209696, "epoch": 1248} {"train_loss": -11.059040069580078, "global_step": 209697, "epoch": 1248} {"train_loss": -11.707351684570312, "global_step": 209698, "epoch": 1248} {"train_loss": -11.24677848815918, "global_step": 209699, "epoch": 1248} {"train_loss": -11.667798042297363, "global_step": 209700, "epoch": 1248} {"train_loss": -11.28074836730957, "global_step": 209701, "epoch": 1248} {"train_loss": -11.47569465637207, "global_step": 209702, "epoch": 1248} {"train_loss": -11.53793716430664, "global_step": 209703, "epoch": 1248} {"train_loss": -11.4960298538208, "global_step": 209704, "epoch": 1248} {"train_loss": -11.590234756469727, "global_step": 209705, "epoch": 1248} {"train_loss": -11.433603286743164, "global_step": 209706, "epoch": 1248} {"train_loss": -11.35561752319336, "global_step": 209707, "epoch": 1248} {"train_loss": -10.949430465698242, "global_step": 209708, "epoch": 1248} {"train_loss": -11.776334762573242, "global_step": 209709, "epoch": 1248} {"train_loss": -10.958885192871094, "global_step": 209710, "epoch": 1248} {"train_loss": -11.46599006652832, "global_step": 209711, "epoch": 1248} {"train_loss": -11.378464698791504, "global_step": 209712, "epoch": 1248} {"train_loss": -11.184186935424805, "global_step": 209713, "epoch": 1248} {"train_loss": -11.54684066772461, "global_step": 209714, "epoch": 1248} {"train_loss": -11.330253601074219, "global_step": 209715, "epoch": 1248} {"train_loss": -11.764517784118652, "global_step": 209716, "epoch": 1248} {"train_loss": -11.565245628356934, "global_step": 209717, "epoch": 1248} {"train_loss": -11.446283340454102, "global_step": 209718, "epoch": 1248} {"train_loss": -11.672956466674805, "global_step": 209719, "epoch": 1248} {"train_loss": -11.345745086669922, "global_step": 209720, "epoch": 1248} {"train_loss": -11.706174850463867, "global_step": 209721, "epoch": 1248} {"train_loss": -11.441400527954102, "global_step": 209722, "epoch": 1248} {"train_loss": -11.782931327819824, "global_step": 209723, "epoch": 1248} {"train_loss": -11.322368621826172, "global_step": 209724, "epoch": 1248} {"train_loss": -11.239358901977539, "global_step": 209725, "epoch": 1248} {"train_loss": -11.538803100585938, "global_step": 209726, "epoch": 1248} {"train_loss": -11.335098266601562, "global_step": 209727, "epoch": 1248} {"train_loss": -11.286520957946777, "global_step": 209728, "epoch": 1248} {"train_loss": -11.310712814331055, "global_step": 209729, "epoch": 1248} {"train_loss": -11.321503639221191, "global_step": 209730, "epoch": 1248} {"train_loss": -11.407154083251953, "global_step": 209731, "epoch": 1248} {"train_loss": -10.763229370117188, "global_step": 209732, "epoch": 1248} {"train_loss": -11.004592895507812, "global_step": 209733, "epoch": 1248} {"train_loss": -11.292583465576172, "global_step": 209734, "epoch": 1248} {"train_loss": -10.741700172424316, "global_step": 209735, "epoch": 1248} {"train_loss": -11.076528549194336, "global_step": 209736, "epoch": 1248} {"train_loss": -11.394285202026367, "global_step": 209737, "epoch": 1248} {"train_loss": -11.15764045715332, "global_step": 209738, "epoch": 1248} {"train_loss": -11.662514686584473, "global_step": 209739, "epoch": 1248} {"train_loss": -11.32951545715332, "global_step": 209740, "epoch": 1248} {"train_loss": -11.46362590789795, "global_step": 209741, "epoch": 1248} {"train_loss": -11.470185279846191, "global_step": 209742, "epoch": 1248} {"train_loss": -11.295914649963379, "global_step": 209743, "epoch": 1248} {"train_loss": -11.384553909301758, "global_step": 209744, "epoch": 1248} {"train_loss": -11.477066040039062, "global_step": 209745, "epoch": 1248} {"train_loss": -11.519826889038086, "global_step": 209746, "epoch": 1248} {"train_loss": -11.312551498413086, "global_step": 209747, "epoch": 1248} {"train_loss": -11.748444557189941, "global_step": 209748, "epoch": 1248} {"train_loss": -11.483205795288086, "global_step": 209749, "epoch": 1248} {"train_loss": -11.31241226196289, "global_step": 209750, "epoch": 1248} {"train_loss": -11.814373016357422, "global_step": 209751, "epoch": 1248} {"train_loss": -11.522384643554688, "global_step": 209752, "epoch": 1248} {"train_loss": -11.59903335571289, "global_step": 209753, "epoch": 1248} {"train_loss": -11.248469352722168, "global_step": 209754, "epoch": 1248} {"train_loss": -11.464688301086426, "global_step": 209755, "epoch": 1248} {"train_loss": -11.494821548461914, "global_step": 209756, "epoch": 1248} {"train_loss": -11.30377197265625, "global_step": 209757, "epoch": 1248} {"train_loss": -11.204727172851562, "global_step": 209758, "epoch": 1248} {"train_loss": -11.523344039916992, "global_step": 209759, "epoch": 1248} {"train_loss": -11.141857147216797, "global_step": 209760, "epoch": 1248} {"train_loss": -11.132387161254883, "global_step": 209761, "epoch": 1248} {"train_loss": -11.444433212280273, "global_step": 209762, "epoch": 1248} {"train_loss": -11.498153686523438, "global_step": 209763, "epoch": 1248} {"train_loss": -11.677531242370605, "global_step": 209764, "epoch": 1248} {"train_loss": -11.663351058959961, "global_step": 209765, "epoch": 1248} {"train_loss": -11.605890274047852, "global_step": 209766, "epoch": 1248} {"train_loss": -11.592700958251953, "global_step": 209767, "epoch": 1248} {"train_loss": -11.727296829223633, "global_step": 209768, "epoch": 1248} {"train_loss": -11.834644317626953, "global_step": 209769, "epoch": 1248} {"train_loss": -11.401824951171875, "global_step": 209770, "epoch": 1248} {"train_loss": -11.656974792480469, "global_step": 209771, "epoch": 1248} {"train_loss": -11.59044075012207, "global_step": 209772, "epoch": 1248} {"train_loss": -11.510552406311035, "global_step": 209773, "epoch": 1248} {"train_loss": -11.809453964233398, "global_step": 209774, "epoch": 1248} {"train_loss": -11.850018501281738, "global_step": 209775, "epoch": 1248} {"train_loss": -11.296682357788086, "global_step": 209776, "epoch": 1248} {"train_loss": -11.643954277038574, "global_step": 209777, "epoch": 1248} {"train_loss": -11.815271377563477, "global_step": 209778, "epoch": 1248} {"train_loss": -11.510177612304688, "global_step": 209779, "epoch": 1248} {"train_loss": -11.654621124267578, "global_step": 209780, "epoch": 1248} {"train_loss": -11.264955520629883, "global_step": 209781, "epoch": 1248} {"train_loss": -11.362279891967773, "global_step": 209782, "epoch": 1248} {"train_loss": -11.395780563354492, "global_step": 209783, "epoch": 1248} {"train_loss": -11.629522323608398, "global_step": 209784, "epoch": 1248} {"train_loss": -10.875748634338379, "global_step": 209785, "epoch": 1248} {"train_loss": -10.473962783813477, "global_step": 209786, "epoch": 1248} {"train_loss": -11.553590774536133, "global_step": 209787, "epoch": 1248} {"train_loss": -10.23483943939209, "global_step": 209788, "epoch": 1248} {"train_loss": -10.726069450378418, "global_step": 209789, "epoch": 1248} {"train_loss": -10.867086410522461, "global_step": 209790, "epoch": 1248} {"train_loss": -10.289640426635742, "global_step": 209791, "epoch": 1248} {"train_loss": -11.495999336242676, "global_step": 209792, "epoch": 1248} {"train_loss": -11.191702842712402, "global_step": 209793, "epoch": 1248} {"train_loss": -11.174494743347168, "global_step": 209794, "epoch": 1248} {"train_loss": -11.713362693786621, "global_step": 209795, "epoch": 1248} {"train_loss": -11.368322372436523, "global_step": 209796, "epoch": 1248} {"train_loss": -11.65931510925293, "global_step": 209797, "epoch": 1248} {"train_loss": -11.262696266174316, "global_step": 209798, "epoch": 1248} {"train_loss": -11.15513801574707, "global_step": 209799, "epoch": 1248} {"train_loss": -11.552985191345215, "global_step": 209800, "epoch": 1248} {"train_loss": -11.393083572387695, "global_step": 209801, "epoch": 1248} {"train_loss": -11.239603996276855, "global_step": 209802, "epoch": 1248} {"train_loss": -11.30459213256836, "global_step": 209803, "epoch": 1248} {"train_loss": -11.107752799987793, "global_step": 209804, "epoch": 1248} {"train_loss": -10.608209609985352, "global_step": 209805, "epoch": 1248} {"train_loss": -11.1597900390625, "global_step": 209806, "epoch": 1248} {"train_loss": -10.861288070678711, "global_step": 209807, "epoch": 1248} {"train_loss": -10.511401176452637, "global_step": 209808, "epoch": 1248} {"train_loss": -11.099275588989258, "global_step": 209809, "epoch": 1248} {"train_loss": -10.518854141235352, "global_step": 209810, "epoch": 1248} {"train_loss": -10.608477592468262, "global_step": 209811, "epoch": 1248} {"train_loss": -10.092939376831055, "global_step": 209812, "epoch": 1248} {"train_loss": -10.95952033996582, "global_step": 209813, "epoch": 1248} {"train_loss": -10.176593780517578, "global_step": 209814, "epoch": 1248} {"train_loss": -11.25583553314209, "global_step": 209815, "epoch": 1248} {"train_loss": -10.141313552856445, "global_step": 209816, "epoch": 1248} {"train_loss": -10.700512886047363, "global_step": 209817, "epoch": 1248} {"train_loss": -10.736937522888184, "global_step": 209818, "epoch": 1248} {"train_loss": -11.296546936035156, "global_step": 209819, "epoch": 1248} {"train_loss": -10.674734115600586, "global_step": 209820, "epoch": 1248} {"train_loss": -11.212924003601074, "global_step": 209821, "epoch": 1248} {"train_loss": -11.058155059814453, "global_step": 209822, "epoch": 1248} {"train_loss": -10.329757690429688, "global_step": 209823, "epoch": 1248} {"train_loss": -10.758511543273926, "global_step": 209824, "epoch": 1248} {"train_loss": -10.418880462646484, "global_step": 209825, "epoch": 1248} {"train_loss": -10.612112045288086, "global_step": 209826, "epoch": 1248} {"train_loss": -10.584527969360352, "global_step": 209827, "epoch": 1248} {"train_loss": -11.183399200439453, "global_step": 209828, "epoch": 1248} {"train_loss": -9.970115661621094, "global_step": 209829, "epoch": 1248} {"train_loss": -11.079209327697754, "global_step": 209830, "epoch": 1248} {"train_loss": -11.254984617233276, "global_step": 209831, "epoch": 1248, "val_loss": 257545.953125} {"train_loss": -10.802400588989258, "global_step": 209832, "epoch": 1249} {"train_loss": -10.783613204956055, "global_step": 209833, "epoch": 1249} {"train_loss": -10.492137908935547, "global_step": 209834, "epoch": 1249} {"train_loss": -10.695261001586914, "global_step": 209835, "epoch": 1249} {"train_loss": -11.078703880310059, "global_step": 209836, "epoch": 1249} {"train_loss": -10.869205474853516, "global_step": 209837, "epoch": 1249} {"train_loss": -11.2012300491333, "global_step": 209838, "epoch": 1249} {"train_loss": -11.246576309204102, "global_step": 209839, "epoch": 1249} {"train_loss": -11.21005630493164, "global_step": 209840, "epoch": 1249} {"train_loss": -11.31400203704834, "global_step": 209841, "epoch": 1249} {"train_loss": -11.222329139709473, "global_step": 209842, "epoch": 1249} {"train_loss": -11.318367004394531, "global_step": 209843, "epoch": 1249} {"train_loss": -11.279972076416016, "global_step": 209844, "epoch": 1249} {"train_loss": -11.312515258789062, "global_step": 209845, "epoch": 1249} {"train_loss": -11.211265563964844, "global_step": 209846, "epoch": 1249} {"train_loss": -10.882905006408691, "global_step": 209847, "epoch": 1249} {"train_loss": -11.494935989379883, "global_step": 209848, "epoch": 1249} {"train_loss": -11.278316497802734, "global_step": 209849, "epoch": 1249} {"train_loss": -11.550966262817383, "global_step": 209850, "epoch": 1249} {"train_loss": -11.1906099319458, "global_step": 209851, "epoch": 1249} {"train_loss": -11.532108306884766, "global_step": 209852, "epoch": 1249} {"train_loss": -11.118460655212402, "global_step": 209853, "epoch": 1249} {"train_loss": -11.3183012008667, "global_step": 209854, "epoch": 1249} {"train_loss": -11.443602561950684, "global_step": 209855, "epoch": 1249} {"train_loss": -11.371683120727539, "global_step": 209856, "epoch": 1249} {"train_loss": -11.623476028442383, "global_step": 209857, "epoch": 1249} {"train_loss": -11.384153366088867, "global_step": 209858, "epoch": 1249} {"train_loss": -11.50352668762207, "global_step": 209859, "epoch": 1249} {"train_loss": -11.719696998596191, "global_step": 209860, "epoch": 1249} {"train_loss": -11.293253898620605, "global_step": 209861, "epoch": 1249} {"train_loss": -11.604372024536133, "global_step": 209862, "epoch": 1249} {"train_loss": -11.462419509887695, "global_step": 209863, "epoch": 1249} {"train_loss": -11.666925430297852, "global_step": 209864, "epoch": 1249} {"train_loss": -11.469732284545898, "global_step": 209865, "epoch": 1249} {"train_loss": -11.681248664855957, "global_step": 209866, "epoch": 1249} {"train_loss": -11.383249282836914, "global_step": 209867, "epoch": 1249} {"train_loss": -11.554037094116211, "global_step": 209868, "epoch": 1249} {"train_loss": -11.624724388122559, "global_step": 209869, "epoch": 1249} {"train_loss": -11.744823455810547, "global_step": 209870, "epoch": 1249} {"train_loss": -11.639911651611328, "global_step": 209871, "epoch": 1249} {"train_loss": -11.865848541259766, "global_step": 209872, "epoch": 1249} {"train_loss": -11.703352928161621, "global_step": 209873, "epoch": 1249} {"train_loss": -11.491273880004883, "global_step": 209874, "epoch": 1249} {"train_loss": -11.769634246826172, "global_step": 209875, "epoch": 1249} {"train_loss": -11.712250709533691, "global_step": 209876, "epoch": 1249} {"train_loss": -11.561161041259766, "global_step": 209877, "epoch": 1249} {"train_loss": -11.782721519470215, "global_step": 209878, "epoch": 1249} {"train_loss": -11.586286544799805, "global_step": 209879, "epoch": 1249} {"train_loss": -11.760093688964844, "global_step": 209880, "epoch": 1249} {"train_loss": -11.707828521728516, "global_step": 209881, "epoch": 1249} {"train_loss": -11.73256778717041, "global_step": 209882, "epoch": 1249} {"train_loss": -11.835773468017578, "global_step": 209883, "epoch": 1249} {"train_loss": -11.779415130615234, "global_step": 209884, "epoch": 1249} {"train_loss": -11.937573432922363, "global_step": 209885, "epoch": 1249} {"train_loss": -11.854483604431152, "global_step": 209886, "epoch": 1249} {"train_loss": -11.790260314941406, "global_step": 209887, "epoch": 1249} {"train_loss": -11.830676078796387, "global_step": 209888, "epoch": 1249} {"train_loss": -11.985488891601562, "global_step": 209889, "epoch": 1249} {"train_loss": -11.926658630371094, "global_step": 209890, "epoch": 1249} {"train_loss": -11.941954612731934, "global_step": 209891, "epoch": 1249} {"train_loss": -11.948508262634277, "global_step": 209892, "epoch": 1249} {"train_loss": -11.851408958435059, "global_step": 209893, "epoch": 1249} {"train_loss": -11.872679710388184, "global_step": 209894, "epoch": 1249} {"train_loss": -12.027082443237305, "global_step": 209895, "epoch": 1249} {"train_loss": -12.000396728515625, "global_step": 209896, "epoch": 1249} {"train_loss": -11.858275413513184, "global_step": 209897, "epoch": 1249} {"train_loss": -11.853809356689453, "global_step": 209898, "epoch": 1249} {"train_loss": -12.135319709777832, "global_step": 209899, "epoch": 1249} {"train_loss": -11.943513870239258, "global_step": 209900, "epoch": 1249} {"train_loss": -11.980549812316895, "global_step": 209901, "epoch": 1249} {"train_loss": -11.824005126953125, "global_step": 209902, "epoch": 1249} {"train_loss": -12.039653778076172, "global_step": 209903, "epoch": 1249} {"train_loss": -11.64521598815918, "global_step": 209904, "epoch": 1249} {"train_loss": -11.979312896728516, "global_step": 209905, "epoch": 1249} {"train_loss": -11.785430908203125, "global_step": 209906, "epoch": 1249} {"train_loss": -11.787302017211914, "global_step": 209907, "epoch": 1249} {"train_loss": -11.826427459716797, "global_step": 209908, "epoch": 1249} {"train_loss": -10.952960014343262, "global_step": 209909, "epoch": 1249} {"train_loss": -9.903229713439941, "global_step": 209910, "epoch": 1249} {"train_loss": -10.48885726928711, "global_step": 209911, "epoch": 1249} {"train_loss": -11.844347953796387, "global_step": 209912, "epoch": 1249} {"train_loss": -9.676609992980957, "global_step": 209913, "epoch": 1249} {"train_loss": -9.465682983398438, "global_step": 209914, "epoch": 1249} {"train_loss": -10.35959529876709, "global_step": 209915, "epoch": 1249} {"train_loss": -10.92600154876709, "global_step": 209916, "epoch": 1249} {"train_loss": -10.766830444335938, "global_step": 209917, "epoch": 1249} {"train_loss": -8.68299674987793, "global_step": 209918, "epoch": 1249} {"train_loss": -10.047344207763672, "global_step": 209919, "epoch": 1249} {"train_loss": -8.881111145019531, "global_step": 209920, "epoch": 1249} {"train_loss": -8.782529830932617, "global_step": 209921, "epoch": 1249} {"train_loss": -8.693925857543945, "global_step": 209922, "epoch": 1249} {"train_loss": -8.706690788269043, "global_step": 209923, "epoch": 1249} {"train_loss": -10.441995620727539, "global_step": 209924, "epoch": 1249} {"train_loss": -8.720855712890625, "global_step": 209925, "epoch": 1249} {"train_loss": -9.469130516052246, "global_step": 209926, "epoch": 1249} {"train_loss": -10.540584564208984, "global_step": 209927, "epoch": 1249} {"train_loss": -10.309609413146973, "global_step": 209928, "epoch": 1249} {"train_loss": -11.086423873901367, "global_step": 209929, "epoch": 1249} {"train_loss": -10.8572998046875, "global_step": 209930, "epoch": 1249} {"train_loss": -11.260168075561523, "global_step": 209931, "epoch": 1249} {"train_loss": -10.658647537231445, "global_step": 209932, "epoch": 1249} {"train_loss": -10.952577590942383, "global_step": 209933, "epoch": 1249} {"train_loss": -10.477577209472656, "global_step": 209934, "epoch": 1249} {"train_loss": -11.04347038269043, "global_step": 209935, "epoch": 1249} {"train_loss": -10.545146942138672, "global_step": 209936, "epoch": 1249} {"train_loss": -11.009805679321289, "global_step": 209937, "epoch": 1249} {"train_loss": -10.882338523864746, "global_step": 209938, "epoch": 1249} {"train_loss": -11.001507759094238, "global_step": 209939, "epoch": 1249} {"train_loss": -10.852693557739258, "global_step": 209940, "epoch": 1249} {"train_loss": -10.926891326904297, "global_step": 209941, "epoch": 1249} {"train_loss": -11.068878173828125, "global_step": 209942, "epoch": 1249} {"train_loss": -10.582275390625, "global_step": 209943, "epoch": 1249} {"train_loss": -10.829940795898438, "global_step": 209944, "epoch": 1249} {"train_loss": -10.708175659179688, "global_step": 209945, "epoch": 1249} {"train_loss": -11.36992359161377, "global_step": 209946, "epoch": 1249} {"train_loss": -11.028586387634277, "global_step": 209947, "epoch": 1249} {"train_loss": -10.950620651245117, "global_step": 209948, "epoch": 1249} {"train_loss": -10.816739082336426, "global_step": 209949, "epoch": 1249} {"train_loss": -11.080738067626953, "global_step": 209950, "epoch": 1249} {"train_loss": -11.233986854553223, "global_step": 209951, "epoch": 1249} {"train_loss": -11.090492248535156, "global_step": 209952, "epoch": 1249} {"train_loss": -11.478433609008789, "global_step": 209953, "epoch": 1249} {"train_loss": -11.112653732299805, "global_step": 209954, "epoch": 1249} {"train_loss": -11.478615760803223, "global_step": 209955, "epoch": 1249} {"train_loss": -11.078056335449219, "global_step": 209956, "epoch": 1249} {"train_loss": -11.12309455871582, "global_step": 209957, "epoch": 1249} {"train_loss": -10.987777709960938, "global_step": 209958, "epoch": 1249} {"train_loss": -11.506611824035645, "global_step": 209959, "epoch": 1249} {"train_loss": -10.98447036743164, "global_step": 209960, "epoch": 1249} {"train_loss": -11.357781410217285, "global_step": 209961, "epoch": 1249} {"train_loss": -11.504021644592285, "global_step": 209962, "epoch": 1249} {"train_loss": -11.22335433959961, "global_step": 209963, "epoch": 1249} {"train_loss": -11.213949203491211, "global_step": 209964, "epoch": 1249} {"train_loss": -11.205810546875, "global_step": 209965, "epoch": 1249} {"train_loss": -11.242605209350586, "global_step": 209966, "epoch": 1249} {"train_loss": -11.32491683959961, "global_step": 209967, "epoch": 1249} {"train_loss": -11.28022575378418, "global_step": 209968, "epoch": 1249} {"train_loss": -11.219491004943848, "global_step": 209969, "epoch": 1249} {"train_loss": -11.430586814880371, "global_step": 209970, "epoch": 1249} {"train_loss": -11.161218643188477, "global_step": 209971, "epoch": 1249} {"train_loss": -11.527740478515625, "global_step": 209972, "epoch": 1249} {"train_loss": -11.39696979522705, "global_step": 209973, "epoch": 1249} {"train_loss": -11.641911506652832, "global_step": 209974, "epoch": 1249} {"train_loss": -11.533040046691895, "global_step": 209975, "epoch": 1249} {"train_loss": -11.559297561645508, "global_step": 209976, "epoch": 1249} {"train_loss": -11.528482437133789, "global_step": 209977, "epoch": 1249} {"train_loss": -11.338983535766602, "global_step": 209978, "epoch": 1249} {"train_loss": -11.493403434753418, "global_step": 209979, "epoch": 1249} {"train_loss": -11.54378890991211, "global_step": 209980, "epoch": 1249} {"train_loss": -11.26338005065918, "global_step": 209981, "epoch": 1249} {"train_loss": -11.70130729675293, "global_step": 209982, "epoch": 1249} {"train_loss": -11.513395309448242, "global_step": 209983, "epoch": 1249} {"train_loss": -11.632923126220703, "global_step": 209984, "epoch": 1249} {"train_loss": -11.702427864074707, "global_step": 209985, "epoch": 1249} {"train_loss": -11.578393936157227, "global_step": 209986, "epoch": 1249} {"train_loss": -11.612712860107422, "global_step": 209987, "epoch": 1249} {"train_loss": -11.75550365447998, "global_step": 209988, "epoch": 1249} {"train_loss": -11.505162239074707, "global_step": 209989, "epoch": 1249} {"train_loss": -11.659996032714844, "global_step": 209990, "epoch": 1249} {"train_loss": -11.796110153198242, "global_step": 209991, "epoch": 1249} {"train_loss": -11.689962387084961, "global_step": 209992, "epoch": 1249} {"train_loss": -11.33898639678955, "global_step": 209993, "epoch": 1249} {"train_loss": -11.53817367553711, "global_step": 209994, "epoch": 1249} {"train_loss": -11.667806625366211, "global_step": 209995, "epoch": 1249} {"train_loss": -11.631355285644531, "global_step": 209996, "epoch": 1249} {"train_loss": -11.448159217834473, "global_step": 209997, "epoch": 1249} {"train_loss": -11.246344566345215, "global_step": 209998, "epoch": 1249} {"train_loss": -11.233608592124213, "global_step": 209999, "epoch": 1249, "val_loss": 245426.546875} {"train_loss": -11.22572135925293, "global_step": 210000, "epoch": 1250} {"train_loss": -11.264389038085938, "global_step": 210001, "epoch": 1250} {"train_loss": -11.419296264648438, "global_step": 210002, "epoch": 1250} {"train_loss": -11.373727798461914, "global_step": 210003, "epoch": 1250} {"train_loss": -11.220396995544434, "global_step": 210004, "epoch": 1250} {"train_loss": -11.720410346984863, "global_step": 210005, "epoch": 1250} {"train_loss": -11.28935432434082, "global_step": 210006, "epoch": 1250} {"train_loss": -11.648185729980469, "global_step": 210007, "epoch": 1250} {"train_loss": -11.067671775817871, "global_step": 210008, "epoch": 1250} {"train_loss": -11.345483779907227, "global_step": 210009, "epoch": 1250} {"train_loss": -11.600107192993164, "global_step": 210010, "epoch": 1250} {"train_loss": -11.485882759094238, "global_step": 210011, "epoch": 1250} {"train_loss": -11.27899169921875, "global_step": 210012, "epoch": 1250} {"train_loss": -11.483555793762207, "global_step": 210013, "epoch": 1250} {"train_loss": -11.181371688842773, "global_step": 210014, "epoch": 1250} {"train_loss": -11.619641304016113, "global_step": 210015, "epoch": 1250} {"train_loss": -11.065149307250977, "global_step": 210016, "epoch": 1250} {"train_loss": -10.865638732910156, "global_step": 210017, "epoch": 1250} {"train_loss": -11.655878067016602, "global_step": 210018, "epoch": 1250} {"train_loss": -10.482985496520996, "global_step": 210019, "epoch": 1250} {"train_loss": -10.981243133544922, "global_step": 210020, "epoch": 1250} {"train_loss": -11.59373664855957, "global_step": 210021, "epoch": 1250} {"train_loss": -10.315973281860352, "global_step": 210022, "epoch": 1250} {"train_loss": -11.667701721191406, "global_step": 210023, "epoch": 1250} {"train_loss": -10.897436141967773, "global_step": 210024, "epoch": 1250} {"train_loss": -10.974048614501953, "global_step": 210025, "epoch": 1250} {"train_loss": -11.179513931274414, "global_step": 210026, "epoch": 1250} {"train_loss": -11.243789672851562, "global_step": 210027, "epoch": 1250} {"train_loss": -11.611129760742188, "global_step": 210028, "epoch": 1250} {"train_loss": -11.240354537963867, "global_step": 210029, "epoch": 1250} {"train_loss": -11.33914566040039, "global_step": 210030, "epoch": 1250} {"train_loss": -11.199458122253418, "global_step": 210031, "epoch": 1250} {"train_loss": -11.254369735717773, "global_step": 210032, "epoch": 1250} {"train_loss": -11.589463233947754, "global_step": 210033, "epoch": 1250} {"train_loss": -10.820904731750488, "global_step": 210034, "epoch": 1250} {"train_loss": -11.652008056640625, "global_step": 210035, "epoch": 1250} {"train_loss": -11.370063781738281, "global_step": 210036, "epoch": 1250} {"train_loss": -11.312116622924805, "global_step": 210037, "epoch": 1250} {"train_loss": -11.373954772949219, "global_step": 210038, "epoch": 1250} {"train_loss": -11.425808906555176, "global_step": 210039, "epoch": 1250} {"train_loss": -11.437475204467773, "global_step": 210040, "epoch": 1250} {"train_loss": -11.413374900817871, "global_step": 210041, "epoch": 1250} {"train_loss": -11.610149383544922, "global_step": 210042, "epoch": 1250} {"train_loss": -11.609830856323242, "global_step": 210043, "epoch": 1250} {"train_loss": -11.442920684814453, "global_step": 210044, "epoch": 1250} {"train_loss": -11.573182106018066, "global_step": 210045, "epoch": 1250} {"train_loss": -11.03187370300293, "global_step": 210046, "epoch": 1250} {"train_loss": -11.406379699707031, "global_step": 210047, "epoch": 1250} {"train_loss": -11.431640625, "global_step": 210048, "epoch": 1250} {"train_loss": -11.341151237487793, "global_step": 210049, "epoch": 1250} {"train_loss": -11.579357147216797, "global_step": 210050, "epoch": 1250} {"train_loss": -11.61553955078125, "global_step": 210051, "epoch": 1250} {"train_loss": -11.674469947814941, "global_step": 210052, "epoch": 1250} {"train_loss": -11.670536994934082, "global_step": 210053, "epoch": 1250} {"train_loss": -11.516374588012695, "global_step": 210054, "epoch": 1250} {"train_loss": -11.754263877868652, "global_step": 210055, "epoch": 1250} {"train_loss": -11.622313499450684, "global_step": 210056, "epoch": 1250} {"train_loss": -11.642003059387207, "global_step": 210057, "epoch": 1250} {"train_loss": -11.761616706848145, "global_step": 210058, "epoch": 1250} {"train_loss": -11.29673957824707, "global_step": 210059, "epoch": 1250} {"train_loss": -11.547372817993164, "global_step": 210060, "epoch": 1250} {"train_loss": -11.311748504638672, "global_step": 210061, "epoch": 1250} {"train_loss": -11.737382888793945, "global_step": 210062, "epoch": 1250} {"train_loss": -11.679630279541016, "global_step": 210063, "epoch": 1250} {"train_loss": -11.623875617980957, "global_step": 210064, "epoch": 1250} {"train_loss": -11.588924407958984, "global_step": 210065, "epoch": 1250} {"train_loss": -11.449480056762695, "global_step": 210066, "epoch": 1250} {"train_loss": -11.47339916229248, "global_step": 210067, "epoch": 1250} {"train_loss": -11.644132614135742, "global_step": 210068, "epoch": 1250} {"train_loss": -11.627178192138672, "global_step": 210069, "epoch": 1250} {"train_loss": -11.316436767578125, "global_step": 210070, "epoch": 1250} {"train_loss": -11.505772590637207, "global_step": 210071, "epoch": 1250} {"train_loss": -11.433032989501953, "global_step": 210072, "epoch": 1250} {"train_loss": -11.571395874023438, "global_step": 210073, "epoch": 1250} {"train_loss": -11.577447891235352, "global_step": 210074, "epoch": 1250} {"train_loss": -11.710355758666992, "global_step": 210075, "epoch": 1250} {"train_loss": -11.399477005004883, "global_step": 210076, "epoch": 1250} {"train_loss": -11.383308410644531, "global_step": 210077, "epoch": 1250} {"train_loss": -11.607137680053711, "global_step": 210078, "epoch": 1250} {"train_loss": -11.46464729309082, "global_step": 210079, "epoch": 1250} {"train_loss": -11.240043640136719, "global_step": 210080, "epoch": 1250} {"train_loss": -11.165678024291992, "global_step": 210081, "epoch": 1250} {"train_loss": -11.590934753417969, "global_step": 210082, "epoch": 1250} {"train_loss": -11.455816268920898, "global_step": 210083, "epoch": 1250} {"train_loss": -11.473676681518555, "global_step": 210084, "epoch": 1250} {"train_loss": -11.285011291503906, "global_step": 210085, "epoch": 1250} {"train_loss": -11.821810722351074, "global_step": 210086, "epoch": 1250} {"train_loss": -11.680663108825684, "global_step": 210087, "epoch": 1250} {"train_loss": -11.465693473815918, "global_step": 210088, "epoch": 1250} {"train_loss": -10.936098098754883, "global_step": 210089, "epoch": 1250} {"train_loss": -11.645978927612305, "global_step": 210090, "epoch": 1250} {"train_loss": -11.56184196472168, "global_step": 210091, "epoch": 1250} {"train_loss": -11.035253524780273, "global_step": 210092, "epoch": 1250} {"train_loss": -10.691442489624023, "global_step": 210093, "epoch": 1250} {"train_loss": -11.604436874389648, "global_step": 210094, "epoch": 1250} {"train_loss": -10.399999618530273, "global_step": 210095, "epoch": 1250} {"train_loss": -11.492788314819336, "global_step": 210096, "epoch": 1250} {"train_loss": -10.984384536743164, "global_step": 210097, "epoch": 1250} {"train_loss": -11.67957878112793, "global_step": 210098, "epoch": 1250} {"train_loss": -10.60251235961914, "global_step": 210099, "epoch": 1250} {"train_loss": -11.628862380981445, "global_step": 210100, "epoch": 1250} {"train_loss": -10.86294937133789, "global_step": 210101, "epoch": 1250} {"train_loss": -11.427163124084473, "global_step": 210102, "epoch": 1250} {"train_loss": -11.413177490234375, "global_step": 210103, "epoch": 1250} {"train_loss": -11.266653060913086, "global_step": 210104, "epoch": 1250} {"train_loss": -11.346572875976562, "global_step": 210105, "epoch": 1250} {"train_loss": -11.167911529541016, "global_step": 210106, "epoch": 1250} {"train_loss": -11.236572265625, "global_step": 210107, "epoch": 1250} {"train_loss": -11.495643615722656, "global_step": 210108, "epoch": 1250} {"train_loss": -11.338157653808594, "global_step": 210109, "epoch": 1250} {"train_loss": -11.1957368850708, "global_step": 210110, "epoch": 1250} {"train_loss": -11.682771682739258, "global_step": 210111, "epoch": 1250} {"train_loss": -11.35586166381836, "global_step": 210112, "epoch": 1250} {"train_loss": -11.429302215576172, "global_step": 210113, "epoch": 1250} {"train_loss": -11.022571563720703, "global_step": 210114, "epoch": 1250} {"train_loss": -11.298593521118164, "global_step": 210115, "epoch": 1250} {"train_loss": -11.441755294799805, "global_step": 210116, "epoch": 1250} {"train_loss": -11.543893814086914, "global_step": 210117, "epoch": 1250} {"train_loss": -11.627333641052246, "global_step": 210118, "epoch": 1250} {"train_loss": -11.45318603515625, "global_step": 210119, "epoch": 1250} {"train_loss": -11.630879402160645, "global_step": 210120, "epoch": 1250} {"train_loss": -11.207934379577637, "global_step": 210121, "epoch": 1250} {"train_loss": -11.718648910522461, "global_step": 210122, "epoch": 1250} {"train_loss": -11.39468002319336, "global_step": 210123, "epoch": 1250} {"train_loss": -11.299699783325195, "global_step": 210124, "epoch": 1250} {"train_loss": -11.444486618041992, "global_step": 210125, "epoch": 1250} {"train_loss": -11.777139663696289, "global_step": 210126, "epoch": 1250} {"train_loss": -11.107718467712402, "global_step": 210127, "epoch": 1250} {"train_loss": -11.4610595703125, "global_step": 210128, "epoch": 1250} {"train_loss": -11.363798141479492, "global_step": 210129, "epoch": 1250} {"train_loss": -10.660863876342773, "global_step": 210130, "epoch": 1250} {"train_loss": -11.560190200805664, "global_step": 210131, "epoch": 1250} {"train_loss": -11.235596656799316, "global_step": 210132, "epoch": 1250} {"train_loss": -11.191242218017578, "global_step": 210133, "epoch": 1250} {"train_loss": -11.391183853149414, "global_step": 210134, "epoch": 1250} {"train_loss": -10.969905853271484, "global_step": 210135, "epoch": 1250} {"train_loss": -11.47402572631836, "global_step": 210136, "epoch": 1250} {"train_loss": -11.448604583740234, "global_step": 210137, "epoch": 1250} {"train_loss": -11.350234031677246, "global_step": 210138, "epoch": 1250} {"train_loss": -11.250685691833496, "global_step": 210139, "epoch": 1250} {"train_loss": -11.117012977600098, "global_step": 210140, "epoch": 1250} {"train_loss": -11.594535827636719, "global_step": 210141, "epoch": 1250} {"train_loss": -11.239654541015625, "global_step": 210142, "epoch": 1250} {"train_loss": -11.391036987304688, "global_step": 210143, "epoch": 1250} {"train_loss": -11.647553443908691, "global_step": 210144, "epoch": 1250} {"train_loss": -11.44371509552002, "global_step": 210145, "epoch": 1250} {"train_loss": -11.312219619750977, "global_step": 210146, "epoch": 1250} {"train_loss": -11.048442840576172, "global_step": 210147, "epoch": 1250} {"train_loss": -11.025338172912598, "global_step": 210148, "epoch": 1250} {"train_loss": -10.962620735168457, "global_step": 210149, "epoch": 1250} {"train_loss": -11.672052383422852, "global_step": 210150, "epoch": 1250} {"train_loss": -10.714164733886719, "global_step": 210151, "epoch": 1250} {"train_loss": -11.777119636535645, "global_step": 210152, "epoch": 1250} {"train_loss": -11.267646789550781, "global_step": 210153, "epoch": 1250} {"train_loss": -11.422992706298828, "global_step": 210154, "epoch": 1250} {"train_loss": -11.449224472045898, "global_step": 210155, "epoch": 1250} {"train_loss": -11.345098495483398, "global_step": 210156, "epoch": 1250} {"train_loss": -11.40863037109375, "global_step": 210157, "epoch": 1250} {"train_loss": -11.66036605834961, "global_step": 210158, "epoch": 1250} {"train_loss": -11.211982727050781, "global_step": 210159, "epoch": 1250} {"train_loss": -11.699231147766113, "global_step": 210160, "epoch": 1250} {"train_loss": -11.522762298583984, "global_step": 210161, "epoch": 1250} {"train_loss": -11.598255157470703, "global_step": 210162, "epoch": 1250} {"train_loss": -11.797064781188965, "global_step": 210163, "epoch": 1250} {"train_loss": -11.271697998046875, "global_step": 210164, "epoch": 1250} {"train_loss": -11.687419891357422, "global_step": 210165, "epoch": 1250} {"train_loss": -11.104902267456055, "global_step": 210166, "epoch": 1250} {"train_loss": -11.374701267197018, "global_step": 210167, "epoch": 1250, "train/sim_max_reward_0": 0.48219981031633735, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.2189088131509831, "train/sim_max_reward_4": 0.9715086748196998, "train/sim_max_reward_5": 0.5163773999908099, "test/sim_max_reward_4400000": 0.9789235580671442, "test/sim_max_reward_4400001": 0.4937222173533036, "test/sim_max_reward_4400002": 0.08669380918123287, "test/sim_max_reward_4400003": 0.21315202057311847, "test/sim_max_reward_4400004": 0.6707259259899057, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 0.9517677846277489, "test/sim_max_reward_4400007": 0.9064573591168525, "test/sim_max_reward_4400008": 0.5603436930512111, "test/sim_max_reward_4400009": 0.03261388436332741, "test/sim_max_reward_4400010": 0.29618167612677676, "test/sim_max_reward_4400011": 0.9625989106998881, "test/sim_max_reward_4400012": 0.9925690887679397, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 0.34997877805189, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9743588658213286, "test/sim_max_reward_4400019": 0.3905339750569811, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 1.0, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.155241860762951, "test/sim_max_reward_4400024": 0.2837665875210072, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.08062866049528278, "test/sim_max_reward_4400027": 1.0, "test/sim_max_reward_4400028": 0.684900355477435, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9290140437227676, "test/sim_max_reward_4400031": 0.5062632114634866, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9769857432288135, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.28448406874321924, "test/sim_max_reward_4400036": 0.9333181355492364, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.9443345711772373, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.1575736019947732, "test/sim_max_reward_4400042": 0.029305959137296198, "test/sim_max_reward_4400043": 0.9835892435728196, "test/sim_max_reward_4400044": 0.9892722647317552, "test/sim_max_reward_4400045": 0.5607983885627843, "test/sim_max_reward_4400046": 0.9814447025027406, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.5314991163796384, "test/mean_score": 0.5585487571551849, "val_loss": 250935.828125, "train_action_mse_error": 2.850752592086792} {"train_loss": -11.314881324768066, "global_step": 210168, "epoch": 1251} {"train_loss": -11.726512908935547, "global_step": 210169, "epoch": 1251} {"train_loss": -11.60407829284668, "global_step": 210170, "epoch": 1251} {"train_loss": -11.231616973876953, "global_step": 210171, "epoch": 1251} {"train_loss": -11.602914810180664, "global_step": 210172, "epoch": 1251} {"train_loss": -11.139934539794922, "global_step": 210173, "epoch": 1251} {"train_loss": -11.38715934753418, "global_step": 210174, "epoch": 1251} {"train_loss": -11.50520133972168, "global_step": 210175, "epoch": 1251} {"train_loss": -11.590023040771484, "global_step": 210176, "epoch": 1251} {"train_loss": -11.721455574035645, "global_step": 210177, "epoch": 1251} {"train_loss": -11.581245422363281, "global_step": 210178, "epoch": 1251} {"train_loss": -11.330278396606445, "global_step": 210179, "epoch": 1251} {"train_loss": -11.761616706848145, "global_step": 210180, "epoch": 1251} {"train_loss": -11.742391586303711, "global_step": 210181, "epoch": 1251} {"train_loss": -11.749452590942383, "global_step": 210182, "epoch": 1251} {"train_loss": -11.707176208496094, "global_step": 210183, "epoch": 1251} {"train_loss": -11.215914726257324, "global_step": 210184, "epoch": 1251} {"train_loss": -11.328324317932129, "global_step": 210185, "epoch": 1251} {"train_loss": -11.475278854370117, "global_step": 210186, "epoch": 1251} {"train_loss": -11.642026901245117, "global_step": 210187, "epoch": 1251} {"train_loss": -11.786714553833008, "global_step": 210188, "epoch": 1251} {"train_loss": -11.750083923339844, "global_step": 210189, "epoch": 1251} {"train_loss": -11.827181816101074, "global_step": 210190, "epoch": 1251} {"train_loss": -11.834242820739746, "global_step": 210191, "epoch": 1251} {"train_loss": -11.607101440429688, "global_step": 210192, "epoch": 1251} {"train_loss": -11.903082847595215, "global_step": 210193, "epoch": 1251} {"train_loss": -11.872701644897461, "global_step": 210194, "epoch": 1251} {"train_loss": -11.568756103515625, "global_step": 210195, "epoch": 1251} {"train_loss": -11.660567283630371, "global_step": 210196, "epoch": 1251} {"train_loss": -11.739450454711914, "global_step": 210197, "epoch": 1251} {"train_loss": -11.84836483001709, "global_step": 210198, "epoch": 1251} {"train_loss": -11.76340103149414, "global_step": 210199, "epoch": 1251} {"train_loss": -11.54388427734375, "global_step": 210200, "epoch": 1251} {"train_loss": -11.890915870666504, "global_step": 210201, "epoch": 1251} {"train_loss": -11.908174514770508, "global_step": 210202, "epoch": 1251} {"train_loss": -11.73601245880127, "global_step": 210203, "epoch": 1251} {"train_loss": -11.249507904052734, "global_step": 210204, "epoch": 1251} {"train_loss": -11.768403053283691, "global_step": 210205, "epoch": 1251} {"train_loss": -11.62444019317627, "global_step": 210206, "epoch": 1251} {"train_loss": -11.708751678466797, "global_step": 210207, "epoch": 1251} {"train_loss": -11.756584167480469, "global_step": 210208, "epoch": 1251} {"train_loss": -11.693573951721191, "global_step": 210209, "epoch": 1251} {"train_loss": -10.98758316040039, "global_step": 210210, "epoch": 1251} {"train_loss": -10.790340423583984, "global_step": 210211, "epoch": 1251} {"train_loss": -11.401582717895508, "global_step": 210212, "epoch": 1251} {"train_loss": -11.090118408203125, "global_step": 210213, "epoch": 1251} {"train_loss": -9.667871475219727, "global_step": 210214, "epoch": 1251} {"train_loss": -11.656484603881836, "global_step": 210215, "epoch": 1251} {"train_loss": -10.80362319946289, "global_step": 210216, "epoch": 1251} {"train_loss": -10.749349594116211, "global_step": 210217, "epoch": 1251} {"train_loss": -9.504520416259766, "global_step": 210218, "epoch": 1251} {"train_loss": -10.413334846496582, "global_step": 210219, "epoch": 1251} {"train_loss": -10.163968086242676, "global_step": 210220, "epoch": 1251} {"train_loss": -10.063729286193848, "global_step": 210221, "epoch": 1251} {"train_loss": -9.937206268310547, "global_step": 210222, "epoch": 1251} {"train_loss": -8.787796974182129, "global_step": 210223, "epoch": 1251} {"train_loss": -11.290273666381836, "global_step": 210224, "epoch": 1251} {"train_loss": -10.327617645263672, "global_step": 210225, "epoch": 1251} {"train_loss": -10.710226058959961, "global_step": 210226, "epoch": 1251} {"train_loss": -10.324257850646973, "global_step": 210227, "epoch": 1251} {"train_loss": -10.252500534057617, "global_step": 210228, "epoch": 1251} {"train_loss": -10.481708526611328, "global_step": 210229, "epoch": 1251} {"train_loss": -10.38692855834961, "global_step": 210230, "epoch": 1251} {"train_loss": -11.16157054901123, "global_step": 210231, "epoch": 1251} {"train_loss": -10.980424880981445, "global_step": 210232, "epoch": 1251} {"train_loss": -11.036636352539062, "global_step": 210233, "epoch": 1251} {"train_loss": -11.018821716308594, "global_step": 210234, "epoch": 1251} {"train_loss": -11.042479515075684, "global_step": 210235, "epoch": 1251} {"train_loss": -11.251934051513672, "global_step": 210236, "epoch": 1251} {"train_loss": -11.282233238220215, "global_step": 210237, "epoch": 1251} {"train_loss": -11.054986953735352, "global_step": 210238, "epoch": 1251} {"train_loss": -11.023760795593262, "global_step": 210239, "epoch": 1251} {"train_loss": -10.825237274169922, "global_step": 210240, "epoch": 1251} {"train_loss": -10.669015884399414, "global_step": 210241, "epoch": 1251} {"train_loss": -11.170297622680664, "global_step": 210242, "epoch": 1251} {"train_loss": -11.303537368774414, "global_step": 210243, "epoch": 1251} {"train_loss": -10.814311981201172, "global_step": 210244, "epoch": 1251} {"train_loss": -10.884515762329102, "global_step": 210245, "epoch": 1251} {"train_loss": -11.06550407409668, "global_step": 210246, "epoch": 1251} {"train_loss": -10.913873672485352, "global_step": 210247, "epoch": 1251} {"train_loss": -11.44477653503418, "global_step": 210248, "epoch": 1251} {"train_loss": -11.289911270141602, "global_step": 210249, "epoch": 1251} {"train_loss": -11.16026496887207, "global_step": 210250, "epoch": 1251} {"train_loss": -11.446989059448242, "global_step": 210251, "epoch": 1251} {"train_loss": -11.489176750183105, "global_step": 210252, "epoch": 1251} {"train_loss": -11.558697700500488, "global_step": 210253, "epoch": 1251} {"train_loss": -11.230127334594727, "global_step": 210254, "epoch": 1251} {"train_loss": -11.475696563720703, "global_step": 210255, "epoch": 1251} {"train_loss": -11.410646438598633, "global_step": 210256, "epoch": 1251} {"train_loss": -11.215946197509766, "global_step": 210257, "epoch": 1251} {"train_loss": -11.229514122009277, "global_step": 210258, "epoch": 1251} {"train_loss": -11.452585220336914, "global_step": 210259, "epoch": 1251} {"train_loss": -11.247537612915039, "global_step": 210260, "epoch": 1251} {"train_loss": -11.245408058166504, "global_step": 210261, "epoch": 1251} {"train_loss": -11.382566452026367, "global_step": 210262, "epoch": 1251} {"train_loss": -11.660652160644531, "global_step": 210263, "epoch": 1251} {"train_loss": -11.237460136413574, "global_step": 210264, "epoch": 1251} {"train_loss": -11.423518180847168, "global_step": 210265, "epoch": 1251} {"train_loss": -11.624399185180664, "global_step": 210266, "epoch": 1251} {"train_loss": -11.501934051513672, "global_step": 210267, "epoch": 1251} {"train_loss": -11.758689880371094, "global_step": 210268, "epoch": 1251} {"train_loss": -11.637628555297852, "global_step": 210269, "epoch": 1251} {"train_loss": -11.628368377685547, "global_step": 210270, "epoch": 1251} {"train_loss": -11.523212432861328, "global_step": 210271, "epoch": 1251} {"train_loss": -11.45850944519043, "global_step": 210272, "epoch": 1251} {"train_loss": -11.62547492980957, "global_step": 210273, "epoch": 1251} {"train_loss": -11.727666854858398, "global_step": 210274, "epoch": 1251} {"train_loss": -11.720765113830566, "global_step": 210275, "epoch": 1251} {"train_loss": -11.541069030761719, "global_step": 210276, "epoch": 1251} {"train_loss": -11.63790512084961, "global_step": 210277, "epoch": 1251} {"train_loss": -11.769256591796875, "global_step": 210278, "epoch": 1251} {"train_loss": -11.548201560974121, "global_step": 210279, "epoch": 1251} {"train_loss": -11.753644943237305, "global_step": 210280, "epoch": 1251} {"train_loss": -11.601301193237305, "global_step": 210281, "epoch": 1251} {"train_loss": -11.807584762573242, "global_step": 210282, "epoch": 1251} {"train_loss": -11.139081954956055, "global_step": 210283, "epoch": 1251} {"train_loss": -11.816741943359375, "global_step": 210284, "epoch": 1251} {"train_loss": -11.811917304992676, "global_step": 210285, "epoch": 1251} {"train_loss": -11.602874755859375, "global_step": 210286, "epoch": 1251} {"train_loss": -11.622794151306152, "global_step": 210287, "epoch": 1251} {"train_loss": -11.669538497924805, "global_step": 210288, "epoch": 1251} {"train_loss": -11.193248748779297, "global_step": 210289, "epoch": 1251} {"train_loss": -11.295610427856445, "global_step": 210290, "epoch": 1251} {"train_loss": -11.808553695678711, "global_step": 210291, "epoch": 1251} {"train_loss": -11.702848434448242, "global_step": 210292, "epoch": 1251} {"train_loss": -11.56758975982666, "global_step": 210293, "epoch": 1251} {"train_loss": -11.760062217712402, "global_step": 210294, "epoch": 1251} {"train_loss": -11.845279693603516, "global_step": 210295, "epoch": 1251} {"train_loss": -11.490621566772461, "global_step": 210296, "epoch": 1251} {"train_loss": -11.324125289916992, "global_step": 210297, "epoch": 1251} {"train_loss": -11.635369300842285, "global_step": 210298, "epoch": 1251} {"train_loss": -11.868412017822266, "global_step": 210299, "epoch": 1251} {"train_loss": -11.556434631347656, "global_step": 210300, "epoch": 1251} {"train_loss": -11.212326049804688, "global_step": 210301, "epoch": 1251} {"train_loss": -11.490938186645508, "global_step": 210302, "epoch": 1251} {"train_loss": -11.42784309387207, "global_step": 210303, "epoch": 1251} {"train_loss": -11.835966110229492, "global_step": 210304, "epoch": 1251} {"train_loss": -11.389997482299805, "global_step": 210305, "epoch": 1251} {"train_loss": -11.754876136779785, "global_step": 210306, "epoch": 1251} {"train_loss": -11.623350143432617, "global_step": 210307, "epoch": 1251} {"train_loss": -11.553838729858398, "global_step": 210308, "epoch": 1251} {"train_loss": -11.648283958435059, "global_step": 210309, "epoch": 1251} {"train_loss": -11.396957397460938, "global_step": 210310, "epoch": 1251} {"train_loss": -11.588678359985352, "global_step": 210311, "epoch": 1251} {"train_loss": -11.612900733947754, "global_step": 210312, "epoch": 1251} {"train_loss": -11.545995712280273, "global_step": 210313, "epoch": 1251} {"train_loss": -11.564315795898438, "global_step": 210314, "epoch": 1251} {"train_loss": -11.378856658935547, "global_step": 210315, "epoch": 1251} {"train_loss": -11.10677719116211, "global_step": 210316, "epoch": 1251} {"train_loss": -11.32078742980957, "global_step": 210317, "epoch": 1251} {"train_loss": -11.19277572631836, "global_step": 210318, "epoch": 1251} {"train_loss": -11.651165962219238, "global_step": 210319, "epoch": 1251} {"train_loss": -11.341992378234863, "global_step": 210320, "epoch": 1251} {"train_loss": -11.207220077514648, "global_step": 210321, "epoch": 1251} {"train_loss": -11.481620788574219, "global_step": 210322, "epoch": 1251} {"train_loss": -10.982540130615234, "global_step": 210323, "epoch": 1251} {"train_loss": -10.48106575012207, "global_step": 210324, "epoch": 1251} {"train_loss": -11.242683410644531, "global_step": 210325, "epoch": 1251} {"train_loss": -11.663127899169922, "global_step": 210326, "epoch": 1251} {"train_loss": -11.431550979614258, "global_step": 210327, "epoch": 1251} {"train_loss": -10.922603607177734, "global_step": 210328, "epoch": 1251} {"train_loss": -11.713644027709961, "global_step": 210329, "epoch": 1251} {"train_loss": -11.330248832702637, "global_step": 210330, "epoch": 1251} {"train_loss": -10.889179229736328, "global_step": 210331, "epoch": 1251} {"train_loss": -11.145898818969727, "global_step": 210332, "epoch": 1251} {"train_loss": -11.518299102783203, "global_step": 210333, "epoch": 1251} {"train_loss": -10.286785125732422, "global_step": 210334, "epoch": 1251} {"train_loss": -11.330571963673545, "global_step": 210335, "epoch": 1251, "val_loss": 251912.90625} {"train_loss": -11.698543548583984, "global_step": 210336, "epoch": 1252} {"train_loss": -10.519474029541016, "global_step": 210337, "epoch": 1252} {"train_loss": -10.926520347595215, "global_step": 210338, "epoch": 1252} {"train_loss": -11.008060455322266, "global_step": 210339, "epoch": 1252} {"train_loss": -10.069565773010254, "global_step": 210340, "epoch": 1252} {"train_loss": -10.893238067626953, "global_step": 210341, "epoch": 1252} {"train_loss": -10.653152465820312, "global_step": 210342, "epoch": 1252} {"train_loss": -10.311155319213867, "global_step": 210343, "epoch": 1252} {"train_loss": -10.915956497192383, "global_step": 210344, "epoch": 1252} {"train_loss": -10.692144393920898, "global_step": 210345, "epoch": 1252} {"train_loss": -10.090598106384277, "global_step": 210346, "epoch": 1252} {"train_loss": -10.914777755737305, "global_step": 210347, "epoch": 1252} {"train_loss": -9.51877498626709, "global_step": 210348, "epoch": 1252} {"train_loss": -10.361854553222656, "global_step": 210349, "epoch": 1252} {"train_loss": -10.621740341186523, "global_step": 210350, "epoch": 1252} {"train_loss": -9.296978950500488, "global_step": 210351, "epoch": 1252} {"train_loss": -10.714027404785156, "global_step": 210352, "epoch": 1252} {"train_loss": -8.40833854675293, "global_step": 210353, "epoch": 1252} {"train_loss": -9.218606948852539, "global_step": 210354, "epoch": 1252} {"train_loss": -9.807323455810547, "global_step": 210355, "epoch": 1252} {"train_loss": -10.635309219360352, "global_step": 210356, "epoch": 1252} {"train_loss": -10.022636413574219, "global_step": 210357, "epoch": 1252} {"train_loss": -11.059014320373535, "global_step": 210358, "epoch": 1252} {"train_loss": -10.152231216430664, "global_step": 210359, "epoch": 1252} {"train_loss": -11.43543529510498, "global_step": 210360, "epoch": 1252} {"train_loss": -10.461922645568848, "global_step": 210361, "epoch": 1252} {"train_loss": -11.048112869262695, "global_step": 210362, "epoch": 1252} {"train_loss": -10.798561096191406, "global_step": 210363, "epoch": 1252} {"train_loss": -10.730155944824219, "global_step": 210364, "epoch": 1252} {"train_loss": -11.135372161865234, "global_step": 210365, "epoch": 1252} {"train_loss": -10.866523742675781, "global_step": 210366, "epoch": 1252} {"train_loss": -11.144527435302734, "global_step": 210367, "epoch": 1252} {"train_loss": -11.038642883300781, "global_step": 210368, "epoch": 1252} {"train_loss": -11.230039596557617, "global_step": 210369, "epoch": 1252} {"train_loss": -11.27762222290039, "global_step": 210370, "epoch": 1252} {"train_loss": -11.165812492370605, "global_step": 210371, "epoch": 1252} {"train_loss": -11.274358749389648, "global_step": 210372, "epoch": 1252} {"train_loss": -11.236974716186523, "global_step": 210373, "epoch": 1252} {"train_loss": -11.123271942138672, "global_step": 210374, "epoch": 1252} {"train_loss": -11.461174964904785, "global_step": 210375, "epoch": 1252} {"train_loss": -10.990711212158203, "global_step": 210376, "epoch": 1252} {"train_loss": -11.301006317138672, "global_step": 210377, "epoch": 1252} {"train_loss": -11.26166820526123, "global_step": 210378, "epoch": 1252} {"train_loss": -11.416630744934082, "global_step": 210379, "epoch": 1252} {"train_loss": -10.98214054107666, "global_step": 210380, "epoch": 1252} {"train_loss": -11.11286735534668, "global_step": 210381, "epoch": 1252} {"train_loss": -11.222940444946289, "global_step": 210382, "epoch": 1252} {"train_loss": -11.27680492401123, "global_step": 210383, "epoch": 1252} {"train_loss": -11.017902374267578, "global_step": 210384, "epoch": 1252} {"train_loss": -11.337064743041992, "global_step": 210385, "epoch": 1252} {"train_loss": -11.392853736877441, "global_step": 210386, "epoch": 1252} {"train_loss": -11.399324417114258, "global_step": 210387, "epoch": 1252} {"train_loss": -11.465476989746094, "global_step": 210388, "epoch": 1252} {"train_loss": -11.295751571655273, "global_step": 210389, "epoch": 1252} {"train_loss": -11.509201049804688, "global_step": 210390, "epoch": 1252} {"train_loss": -11.263595581054688, "global_step": 210391, "epoch": 1252} {"train_loss": -11.463210105895996, "global_step": 210392, "epoch": 1252} {"train_loss": -11.594184875488281, "global_step": 210393, "epoch": 1252} {"train_loss": -11.284184455871582, "global_step": 210394, "epoch": 1252} {"train_loss": -11.568599700927734, "global_step": 210395, "epoch": 1252} {"train_loss": -11.665979385375977, "global_step": 210396, "epoch": 1252} {"train_loss": -11.535442352294922, "global_step": 210397, "epoch": 1252} {"train_loss": -11.57020378112793, "global_step": 210398, "epoch": 1252} {"train_loss": -11.654967308044434, "global_step": 210399, "epoch": 1252} {"train_loss": -11.599853515625, "global_step": 210400, "epoch": 1252} {"train_loss": -11.740318298339844, "global_step": 210401, "epoch": 1252} {"train_loss": -11.586653709411621, "global_step": 210402, "epoch": 1252} {"train_loss": -11.830068588256836, "global_step": 210403, "epoch": 1252} {"train_loss": -11.72828483581543, "global_step": 210404, "epoch": 1252} {"train_loss": -11.75718879699707, "global_step": 210405, "epoch": 1252} {"train_loss": -11.69505500793457, "global_step": 210406, "epoch": 1252} {"train_loss": -11.733234405517578, "global_step": 210407, "epoch": 1252} {"train_loss": -11.796743392944336, "global_step": 210408, "epoch": 1252} {"train_loss": -11.518043518066406, "global_step": 210409, "epoch": 1252} {"train_loss": -11.89111614227295, "global_step": 210410, "epoch": 1252} {"train_loss": -11.281036376953125, "global_step": 210411, "epoch": 1252} {"train_loss": -11.820213317871094, "global_step": 210412, "epoch": 1252} {"train_loss": -11.621103286743164, "global_step": 210413, "epoch": 1252} {"train_loss": -11.56280517578125, "global_step": 210414, "epoch": 1252} {"train_loss": -11.329800605773926, "global_step": 210415, "epoch": 1252} {"train_loss": -12.091878890991211, "global_step": 210416, "epoch": 1252} {"train_loss": -11.252565383911133, "global_step": 210417, "epoch": 1252} {"train_loss": -11.556285858154297, "global_step": 210418, "epoch": 1252} {"train_loss": -11.638699531555176, "global_step": 210419, "epoch": 1252} {"train_loss": -11.556879043579102, "global_step": 210420, "epoch": 1252} {"train_loss": -11.825462341308594, "global_step": 210421, "epoch": 1252} {"train_loss": -11.767415046691895, "global_step": 210422, "epoch": 1252} {"train_loss": -11.793338775634766, "global_step": 210423, "epoch": 1252} {"train_loss": -11.797877311706543, "global_step": 210424, "epoch": 1252} {"train_loss": -11.923870086669922, "global_step": 210425, "epoch": 1252} {"train_loss": -11.785219192504883, "global_step": 210426, "epoch": 1252} {"train_loss": -11.699029922485352, "global_step": 210427, "epoch": 1252} {"train_loss": -11.868241310119629, "global_step": 210428, "epoch": 1252} {"train_loss": -11.499591827392578, "global_step": 210429, "epoch": 1252} {"train_loss": -11.61709976196289, "global_step": 210430, "epoch": 1252} {"train_loss": -11.636333465576172, "global_step": 210431, "epoch": 1252} {"train_loss": -11.506519317626953, "global_step": 210432, "epoch": 1252} {"train_loss": -11.800055503845215, "global_step": 210433, "epoch": 1252} {"train_loss": -11.69721794128418, "global_step": 210434, "epoch": 1252} {"train_loss": -11.340801239013672, "global_step": 210435, "epoch": 1252} {"train_loss": -11.851774215698242, "global_step": 210436, "epoch": 1252} {"train_loss": -11.73967170715332, "global_step": 210437, "epoch": 1252} {"train_loss": -11.858175277709961, "global_step": 210438, "epoch": 1252} {"train_loss": -11.869993209838867, "global_step": 210439, "epoch": 1252} {"train_loss": -11.644521713256836, "global_step": 210440, "epoch": 1252} {"train_loss": -11.531309127807617, "global_step": 210441, "epoch": 1252} {"train_loss": -11.555521011352539, "global_step": 210442, "epoch": 1252} {"train_loss": -11.470269203186035, "global_step": 210443, "epoch": 1252} {"train_loss": -12.070194244384766, "global_step": 210444, "epoch": 1252} {"train_loss": -11.563325881958008, "global_step": 210445, "epoch": 1252} {"train_loss": -11.675582885742188, "global_step": 210446, "epoch": 1252} {"train_loss": -11.568892478942871, "global_step": 210447, "epoch": 1252} {"train_loss": -11.092965126037598, "global_step": 210448, "epoch": 1252} {"train_loss": -11.038573265075684, "global_step": 210449, "epoch": 1252} {"train_loss": -11.31809139251709, "global_step": 210450, "epoch": 1252} {"train_loss": -10.469938278198242, "global_step": 210451, "epoch": 1252} {"train_loss": -11.163899421691895, "global_step": 210452, "epoch": 1252} {"train_loss": -10.750041007995605, "global_step": 210453, "epoch": 1252} {"train_loss": -11.452764511108398, "global_step": 210454, "epoch": 1252} {"train_loss": -10.907970428466797, "global_step": 210455, "epoch": 1252} {"train_loss": -11.320873260498047, "global_step": 210456, "epoch": 1252} {"train_loss": -10.832368850708008, "global_step": 210457, "epoch": 1252} {"train_loss": -11.250168800354004, "global_step": 210458, "epoch": 1252} {"train_loss": -11.213174819946289, "global_step": 210459, "epoch": 1252} {"train_loss": -11.181916236877441, "global_step": 210460, "epoch": 1252} {"train_loss": -11.433669090270996, "global_step": 210461, "epoch": 1252} {"train_loss": -11.465097427368164, "global_step": 210462, "epoch": 1252} {"train_loss": -11.528230667114258, "global_step": 210463, "epoch": 1252} {"train_loss": -11.281253814697266, "global_step": 210464, "epoch": 1252} {"train_loss": -11.206866264343262, "global_step": 210465, "epoch": 1252} {"train_loss": -11.26881217956543, "global_step": 210466, "epoch": 1252} {"train_loss": -11.369012832641602, "global_step": 210467, "epoch": 1252} {"train_loss": -11.359725952148438, "global_step": 210468, "epoch": 1252} {"train_loss": -11.70096492767334, "global_step": 210469, "epoch": 1252} {"train_loss": -11.513995170593262, "global_step": 210470, "epoch": 1252} {"train_loss": -11.440986633300781, "global_step": 210471, "epoch": 1252} {"train_loss": -11.545647621154785, "global_step": 210472, "epoch": 1252} {"train_loss": -11.211684226989746, "global_step": 210473, "epoch": 1252} {"train_loss": -11.356338500976562, "global_step": 210474, "epoch": 1252} {"train_loss": -11.35019302368164, "global_step": 210475, "epoch": 1252} {"train_loss": -10.81930160522461, "global_step": 210476, "epoch": 1252} {"train_loss": -11.493473052978516, "global_step": 210477, "epoch": 1252} {"train_loss": -10.91534423828125, "global_step": 210478, "epoch": 1252} {"train_loss": -11.498479843139648, "global_step": 210479, "epoch": 1252} {"train_loss": -10.942867279052734, "global_step": 210480, "epoch": 1252} {"train_loss": -11.276800155639648, "global_step": 210481, "epoch": 1252} {"train_loss": -11.027862548828125, "global_step": 210482, "epoch": 1252} {"train_loss": -10.8958740234375, "global_step": 210483, "epoch": 1252} {"train_loss": -11.062474250793457, "global_step": 210484, "epoch": 1252} {"train_loss": -11.246349334716797, "global_step": 210485, "epoch": 1252} {"train_loss": -11.143787384033203, "global_step": 210486, "epoch": 1252} {"train_loss": -11.328444480895996, "global_step": 210487, "epoch": 1252} {"train_loss": -11.36393928527832, "global_step": 210488, "epoch": 1252} {"train_loss": -11.549858093261719, "global_step": 210489, "epoch": 1252} {"train_loss": -11.541200637817383, "global_step": 210490, "epoch": 1252} {"train_loss": -11.070033073425293, "global_step": 210491, "epoch": 1252} {"train_loss": -11.363592147827148, "global_step": 210492, "epoch": 1252} {"train_loss": -11.516945838928223, "global_step": 210493, "epoch": 1252} {"train_loss": -11.282398223876953, "global_step": 210494, "epoch": 1252} {"train_loss": -11.505200386047363, "global_step": 210495, "epoch": 1252} {"train_loss": -11.101066589355469, "global_step": 210496, "epoch": 1252} {"train_loss": -10.962278366088867, "global_step": 210497, "epoch": 1252} {"train_loss": -11.537443161010742, "global_step": 210498, "epoch": 1252} {"train_loss": -10.988600730895996, "global_step": 210499, "epoch": 1252} {"train_loss": -11.44262409210205, "global_step": 210500, "epoch": 1252} {"train_loss": -11.188372611999512, "global_step": 210501, "epoch": 1252} {"train_loss": -10.801066398620605, "global_step": 210502, "epoch": 1252} {"train_loss": -11.240293673106603, "global_step": 210503, "epoch": 1252, "val_loss": 258308.421875} {"train_loss": -9.501314163208008, "global_step": 210504, "epoch": 1253} {"train_loss": -10.731132507324219, "global_step": 210505, "epoch": 1253} {"train_loss": -9.144726753234863, "global_step": 210506, "epoch": 1253} {"train_loss": -10.42914867401123, "global_step": 210507, "epoch": 1253} {"train_loss": -10.297329902648926, "global_step": 210508, "epoch": 1253} {"train_loss": -10.168283462524414, "global_step": 210509, "epoch": 1253} {"train_loss": -10.98642635345459, "global_step": 210510, "epoch": 1253} {"train_loss": -9.792802810668945, "global_step": 210511, "epoch": 1253} {"train_loss": -9.96436882019043, "global_step": 210512, "epoch": 1253} {"train_loss": -10.107999801635742, "global_step": 210513, "epoch": 1253} {"train_loss": -9.356269836425781, "global_step": 210514, "epoch": 1253} {"train_loss": -10.800426483154297, "global_step": 210515, "epoch": 1253} {"train_loss": -9.965694427490234, "global_step": 210516, "epoch": 1253} {"train_loss": -10.268503189086914, "global_step": 210517, "epoch": 1253} {"train_loss": -10.912333488464355, "global_step": 210518, "epoch": 1253} {"train_loss": -10.617362976074219, "global_step": 210519, "epoch": 1253} {"train_loss": -10.230908393859863, "global_step": 210520, "epoch": 1253} {"train_loss": -11.386791229248047, "global_step": 210521, "epoch": 1253} {"train_loss": -9.704486846923828, "global_step": 210522, "epoch": 1253} {"train_loss": -10.168691635131836, "global_step": 210523, "epoch": 1253} {"train_loss": -10.997037887573242, "global_step": 210524, "epoch": 1253} {"train_loss": -10.64590835571289, "global_step": 210525, "epoch": 1253} {"train_loss": -10.473457336425781, "global_step": 210526, "epoch": 1253} {"train_loss": -10.739218711853027, "global_step": 210527, "epoch": 1253} {"train_loss": -10.93836784362793, "global_step": 210528, "epoch": 1253} {"train_loss": -10.832010269165039, "global_step": 210529, "epoch": 1253} {"train_loss": -11.08950424194336, "global_step": 210530, "epoch": 1253} {"train_loss": -10.506619453430176, "global_step": 210531, "epoch": 1253} {"train_loss": -10.799221992492676, "global_step": 210532, "epoch": 1253} {"train_loss": -10.876937866210938, "global_step": 210533, "epoch": 1253} {"train_loss": -10.9221830368042, "global_step": 210534, "epoch": 1253} {"train_loss": -10.928488731384277, "global_step": 210535, "epoch": 1253} {"train_loss": -10.692728042602539, "global_step": 210536, "epoch": 1253} {"train_loss": -10.9467134475708, "global_step": 210537, "epoch": 1253} {"train_loss": -10.887615203857422, "global_step": 210538, "epoch": 1253} {"train_loss": -11.027856826782227, "global_step": 210539, "epoch": 1253} {"train_loss": -11.177562713623047, "global_step": 210540, "epoch": 1253} {"train_loss": -10.971780776977539, "global_step": 210541, "epoch": 1253} {"train_loss": -11.209249496459961, "global_step": 210542, "epoch": 1253} {"train_loss": -10.626625061035156, "global_step": 210543, "epoch": 1253} {"train_loss": -11.362625122070312, "global_step": 210544, "epoch": 1253} {"train_loss": -10.928882598876953, "global_step": 210545, "epoch": 1253} {"train_loss": -11.141195297241211, "global_step": 210546, "epoch": 1253} {"train_loss": -10.839630126953125, "global_step": 210547, "epoch": 1253} {"train_loss": -11.403787612915039, "global_step": 210548, "epoch": 1253} {"train_loss": -11.212494850158691, "global_step": 210549, "epoch": 1253} {"train_loss": -11.551679611206055, "global_step": 210550, "epoch": 1253} {"train_loss": -10.834035873413086, "global_step": 210551, "epoch": 1253} {"train_loss": -11.548013687133789, "global_step": 210552, "epoch": 1253} {"train_loss": -10.859188079833984, "global_step": 210553, "epoch": 1253} {"train_loss": -11.514680862426758, "global_step": 210554, "epoch": 1253} {"train_loss": -11.120323181152344, "global_step": 210555, "epoch": 1253} {"train_loss": -11.403219223022461, "global_step": 210556, "epoch": 1253} {"train_loss": -11.18716812133789, "global_step": 210557, "epoch": 1253} {"train_loss": -11.223241806030273, "global_step": 210558, "epoch": 1253} {"train_loss": -11.354676246643066, "global_step": 210559, "epoch": 1253} {"train_loss": -11.250356674194336, "global_step": 210560, "epoch": 1253} {"train_loss": -11.528047561645508, "global_step": 210561, "epoch": 1253} {"train_loss": -11.60718822479248, "global_step": 210562, "epoch": 1253} {"train_loss": -11.376060485839844, "global_step": 210563, "epoch": 1253} {"train_loss": -11.64382266998291, "global_step": 210564, "epoch": 1253} {"train_loss": -11.468400955200195, "global_step": 210565, "epoch": 1253} {"train_loss": -11.437856674194336, "global_step": 210566, "epoch": 1253} {"train_loss": -11.602113723754883, "global_step": 210567, "epoch": 1253} {"train_loss": -11.339405059814453, "global_step": 210568, "epoch": 1253} {"train_loss": -11.502103805541992, "global_step": 210569, "epoch": 1253} {"train_loss": -11.62176513671875, "global_step": 210570, "epoch": 1253} {"train_loss": -11.512526512145996, "global_step": 210571, "epoch": 1253} {"train_loss": -11.726373672485352, "global_step": 210572, "epoch": 1253} {"train_loss": -11.698433876037598, "global_step": 210573, "epoch": 1253} {"train_loss": -11.59178638458252, "global_step": 210574, "epoch": 1253} {"train_loss": -11.508621215820312, "global_step": 210575, "epoch": 1253} {"train_loss": -11.831913948059082, "global_step": 210576, "epoch": 1253} {"train_loss": -11.61053466796875, "global_step": 210577, "epoch": 1253} {"train_loss": -11.54065990447998, "global_step": 210578, "epoch": 1253} {"train_loss": -11.429341316223145, "global_step": 210579, "epoch": 1253} {"train_loss": -11.716976165771484, "global_step": 210580, "epoch": 1253} {"train_loss": -11.585351943969727, "global_step": 210581, "epoch": 1253} {"train_loss": -11.557713508605957, "global_step": 210582, "epoch": 1253} {"train_loss": -11.977224349975586, "global_step": 210583, "epoch": 1253} {"train_loss": -11.557540893554688, "global_step": 210584, "epoch": 1253} {"train_loss": -11.748123168945312, "global_step": 210585, "epoch": 1253} {"train_loss": -11.551996231079102, "global_step": 210586, "epoch": 1253} {"train_loss": -11.723261833190918, "global_step": 210587, "epoch": 1253} {"train_loss": -11.56740665435791, "global_step": 210588, "epoch": 1253} {"train_loss": -11.545319557189941, "global_step": 210589, "epoch": 1253} {"train_loss": -11.729647636413574, "global_step": 210590, "epoch": 1253} {"train_loss": -11.747024536132812, "global_step": 210591, "epoch": 1253} {"train_loss": -11.510534286499023, "global_step": 210592, "epoch": 1253} {"train_loss": -11.481101989746094, "global_step": 210593, "epoch": 1253} {"train_loss": -11.735010147094727, "global_step": 210594, "epoch": 1253} {"train_loss": -11.641143798828125, "global_step": 210595, "epoch": 1253} {"train_loss": -11.266157150268555, "global_step": 210596, "epoch": 1253} {"train_loss": -11.858312606811523, "global_step": 210597, "epoch": 1253} {"train_loss": -11.260677337646484, "global_step": 210598, "epoch": 1253} {"train_loss": -11.822585105895996, "global_step": 210599, "epoch": 1253} {"train_loss": -11.53249740600586, "global_step": 210600, "epoch": 1253} {"train_loss": -11.95964527130127, "global_step": 210601, "epoch": 1253} {"train_loss": -11.711973190307617, "global_step": 210602, "epoch": 1253} {"train_loss": -11.948720932006836, "global_step": 210603, "epoch": 1253} {"train_loss": -11.480865478515625, "global_step": 210604, "epoch": 1253} {"train_loss": -11.825380325317383, "global_step": 210605, "epoch": 1253} {"train_loss": -11.646652221679688, "global_step": 210606, "epoch": 1253} {"train_loss": -11.612951278686523, "global_step": 210607, "epoch": 1253} {"train_loss": -11.783071517944336, "global_step": 210608, "epoch": 1253} {"train_loss": -11.918988227844238, "global_step": 210609, "epoch": 1253} {"train_loss": -11.494787216186523, "global_step": 210610, "epoch": 1253} {"train_loss": -11.76010513305664, "global_step": 210611, "epoch": 1253} {"train_loss": -11.807940483093262, "global_step": 210612, "epoch": 1253} {"train_loss": -11.740877151489258, "global_step": 210613, "epoch": 1253} {"train_loss": -11.72572135925293, "global_step": 210614, "epoch": 1253} {"train_loss": -11.55438232421875, "global_step": 210615, "epoch": 1253} {"train_loss": -11.033977508544922, "global_step": 210616, "epoch": 1253} {"train_loss": -12.022804260253906, "global_step": 210617, "epoch": 1253} {"train_loss": -11.403441429138184, "global_step": 210618, "epoch": 1253} {"train_loss": -10.86691951751709, "global_step": 210619, "epoch": 1253} {"train_loss": -10.727951049804688, "global_step": 210620, "epoch": 1253} {"train_loss": -11.672409057617188, "global_step": 210621, "epoch": 1253} {"train_loss": -11.578361511230469, "global_step": 210622, "epoch": 1253} {"train_loss": -11.671305656433105, "global_step": 210623, "epoch": 1253} {"train_loss": -11.629060745239258, "global_step": 210624, "epoch": 1253} {"train_loss": -11.379058837890625, "global_step": 210625, "epoch": 1253} {"train_loss": -11.551850318908691, "global_step": 210626, "epoch": 1253} {"train_loss": -11.461105346679688, "global_step": 210627, "epoch": 1253} {"train_loss": -11.755976676940918, "global_step": 210628, "epoch": 1253} {"train_loss": -10.825783729553223, "global_step": 210629, "epoch": 1253} {"train_loss": -10.179840087890625, "global_step": 210630, "epoch": 1253} {"train_loss": -11.33309555053711, "global_step": 210631, "epoch": 1253} {"train_loss": -11.555580139160156, "global_step": 210632, "epoch": 1253} {"train_loss": -10.680635452270508, "global_step": 210633, "epoch": 1253} {"train_loss": -11.09649658203125, "global_step": 210634, "epoch": 1253} {"train_loss": -11.35550308227539, "global_step": 210635, "epoch": 1253} {"train_loss": -10.98295783996582, "global_step": 210636, "epoch": 1253} {"train_loss": -11.155683517456055, "global_step": 210637, "epoch": 1253} {"train_loss": -11.342367172241211, "global_step": 210638, "epoch": 1253} {"train_loss": -10.84591293334961, "global_step": 210639, "epoch": 1253} {"train_loss": -11.402962684631348, "global_step": 210640, "epoch": 1253} {"train_loss": -11.138031005859375, "global_step": 210641, "epoch": 1253} {"train_loss": -10.967455863952637, "global_step": 210642, "epoch": 1253} {"train_loss": -11.920315742492676, "global_step": 210643, "epoch": 1253} {"train_loss": -11.542917251586914, "global_step": 210644, "epoch": 1253} {"train_loss": -11.439453125, "global_step": 210645, "epoch": 1253} {"train_loss": -11.473794937133789, "global_step": 210646, "epoch": 1253} {"train_loss": -11.39955997467041, "global_step": 210647, "epoch": 1253} {"train_loss": -11.574522018432617, "global_step": 210648, "epoch": 1253} {"train_loss": -11.746532440185547, "global_step": 210649, "epoch": 1253} {"train_loss": -11.412803649902344, "global_step": 210650, "epoch": 1253} {"train_loss": -11.563593864440918, "global_step": 210651, "epoch": 1253} {"train_loss": -11.654638290405273, "global_step": 210652, "epoch": 1253} {"train_loss": -11.29397964477539, "global_step": 210653, "epoch": 1253} {"train_loss": -11.595754623413086, "global_step": 210654, "epoch": 1253} {"train_loss": -11.551586151123047, "global_step": 210655, "epoch": 1253} {"train_loss": -11.658613204956055, "global_step": 210656, "epoch": 1253} {"train_loss": -11.094873428344727, "global_step": 210657, "epoch": 1253} {"train_loss": -11.553505897521973, "global_step": 210658, "epoch": 1253} {"train_loss": -11.495491981506348, "global_step": 210659, "epoch": 1253} {"train_loss": -11.127496719360352, "global_step": 210660, "epoch": 1253} {"train_loss": -11.753265380859375, "global_step": 210661, "epoch": 1253} {"train_loss": -10.955772399902344, "global_step": 210662, "epoch": 1253} {"train_loss": -11.361425399780273, "global_step": 210663, "epoch": 1253} {"train_loss": -11.376558303833008, "global_step": 210664, "epoch": 1253} {"train_loss": -11.211846351623535, "global_step": 210665, "epoch": 1253} {"train_loss": -11.05795669555664, "global_step": 210666, "epoch": 1253} {"train_loss": -11.509424209594727, "global_step": 210667, "epoch": 1253} {"train_loss": -11.251230239868164, "global_step": 210668, "epoch": 1253} {"train_loss": -10.479223251342773, "global_step": 210669, "epoch": 1253} {"train_loss": -10.598325729370117, "global_step": 210670, "epoch": 1253} {"train_loss": -11.220848566009884, "global_step": 210671, "epoch": 1253, "val_loss": 254903.203125} {"train_loss": -10.087820053100586, "global_step": 210672, "epoch": 1254} {"train_loss": -10.197067260742188, "global_step": 210673, "epoch": 1254} {"train_loss": -8.33415412902832, "global_step": 210674, "epoch": 1254} {"train_loss": -8.866918563842773, "global_step": 210675, "epoch": 1254} {"train_loss": -10.084702491760254, "global_step": 210676, "epoch": 1254} {"train_loss": -8.807616233825684, "global_step": 210677, "epoch": 1254} {"train_loss": -8.493598937988281, "global_step": 210678, "epoch": 1254} {"train_loss": -9.219863891601562, "global_step": 210679, "epoch": 1254} {"train_loss": -8.916353225708008, "global_step": 210680, "epoch": 1254} {"train_loss": -8.051175117492676, "global_step": 210681, "epoch": 1254} {"train_loss": -10.6002779006958, "global_step": 210682, "epoch": 1254} {"train_loss": -9.557960510253906, "global_step": 210683, "epoch": 1254} {"train_loss": -9.617450714111328, "global_step": 210684, "epoch": 1254} {"train_loss": -8.56512451171875, "global_step": 210685, "epoch": 1254} {"train_loss": -10.43695068359375, "global_step": 210686, "epoch": 1254} {"train_loss": -9.166545867919922, "global_step": 210687, "epoch": 1254} {"train_loss": -10.340739250183105, "global_step": 210688, "epoch": 1254} {"train_loss": -10.257609367370605, "global_step": 210689, "epoch": 1254} {"train_loss": -8.722113609313965, "global_step": 210690, "epoch": 1254} {"train_loss": -9.774946212768555, "global_step": 210691, "epoch": 1254} {"train_loss": -10.002837181091309, "global_step": 210692, "epoch": 1254} {"train_loss": -9.300963401794434, "global_step": 210693, "epoch": 1254} {"train_loss": -10.006254196166992, "global_step": 210694, "epoch": 1254} {"train_loss": -9.813665390014648, "global_step": 210695, "epoch": 1254} {"train_loss": -10.660421371459961, "global_step": 210696, "epoch": 1254} {"train_loss": -10.149164199829102, "global_step": 210697, "epoch": 1254} {"train_loss": -9.36941146850586, "global_step": 210698, "epoch": 1254} {"train_loss": -11.032661437988281, "global_step": 210699, "epoch": 1254} {"train_loss": -9.757909774780273, "global_step": 210700, "epoch": 1254} {"train_loss": -10.432132720947266, "global_step": 210701, "epoch": 1254} {"train_loss": -10.658226013183594, "global_step": 210702, "epoch": 1254} {"train_loss": -10.000395774841309, "global_step": 210703, "epoch": 1254} {"train_loss": -10.677913665771484, "global_step": 210704, "epoch": 1254} {"train_loss": -10.810600280761719, "global_step": 210705, "epoch": 1254} {"train_loss": -10.30862808227539, "global_step": 210706, "epoch": 1254} {"train_loss": -10.915006637573242, "global_step": 210707, "epoch": 1254} {"train_loss": -10.90659236907959, "global_step": 210708, "epoch": 1254} {"train_loss": -10.862955093383789, "global_step": 210709, "epoch": 1254} {"train_loss": -10.803731918334961, "global_step": 210710, "epoch": 1254} {"train_loss": -10.602760314941406, "global_step": 210711, "epoch": 1254} {"train_loss": -11.004355430603027, "global_step": 210712, "epoch": 1254} {"train_loss": -10.867284774780273, "global_step": 210713, "epoch": 1254} {"train_loss": -10.76220703125, "global_step": 210714, "epoch": 1254} {"train_loss": -11.218021392822266, "global_step": 210715, "epoch": 1254} {"train_loss": -10.989437103271484, "global_step": 210716, "epoch": 1254} {"train_loss": -10.981847763061523, "global_step": 210717, "epoch": 1254} {"train_loss": -11.25229549407959, "global_step": 210718, "epoch": 1254} {"train_loss": -10.789336204528809, "global_step": 210719, "epoch": 1254} {"train_loss": -11.199470520019531, "global_step": 210720, "epoch": 1254} {"train_loss": -11.202451705932617, "global_step": 210721, "epoch": 1254} {"train_loss": -11.053619384765625, "global_step": 210722, "epoch": 1254} {"train_loss": -11.32246208190918, "global_step": 210723, "epoch": 1254} {"train_loss": -11.00318717956543, "global_step": 210724, "epoch": 1254} {"train_loss": -11.229557991027832, "global_step": 210725, "epoch": 1254} {"train_loss": -11.28150749206543, "global_step": 210726, "epoch": 1254} {"train_loss": -11.248237609863281, "global_step": 210727, "epoch": 1254} {"train_loss": -11.310758590698242, "global_step": 210728, "epoch": 1254} {"train_loss": -11.15015983581543, "global_step": 210729, "epoch": 1254} {"train_loss": -11.381889343261719, "global_step": 210730, "epoch": 1254} {"train_loss": -11.51121711730957, "global_step": 210731, "epoch": 1254} {"train_loss": -11.342296600341797, "global_step": 210732, "epoch": 1254} {"train_loss": -11.327512741088867, "global_step": 210733, "epoch": 1254} {"train_loss": -11.539559364318848, "global_step": 210734, "epoch": 1254} {"train_loss": -11.460161209106445, "global_step": 210735, "epoch": 1254} {"train_loss": -11.410137176513672, "global_step": 210736, "epoch": 1254} {"train_loss": -11.375946044921875, "global_step": 210737, "epoch": 1254} {"train_loss": -11.29083251953125, "global_step": 210738, "epoch": 1254} {"train_loss": -11.500960350036621, "global_step": 210739, "epoch": 1254} {"train_loss": -11.614062309265137, "global_step": 210740, "epoch": 1254} {"train_loss": -11.387392044067383, "global_step": 210741, "epoch": 1254} {"train_loss": -11.465502738952637, "global_step": 210742, "epoch": 1254} {"train_loss": -11.600493431091309, "global_step": 210743, "epoch": 1254} {"train_loss": -11.567489624023438, "global_step": 210744, "epoch": 1254} {"train_loss": -11.616656303405762, "global_step": 210745, "epoch": 1254} {"train_loss": -11.510223388671875, "global_step": 210746, "epoch": 1254} {"train_loss": -11.577909469604492, "global_step": 210747, "epoch": 1254} {"train_loss": -11.678108215332031, "global_step": 210748, "epoch": 1254} {"train_loss": -11.575822830200195, "global_step": 210749, "epoch": 1254} {"train_loss": -11.501116752624512, "global_step": 210750, "epoch": 1254} {"train_loss": -11.693174362182617, "global_step": 210751, "epoch": 1254} {"train_loss": -11.762006759643555, "global_step": 210752, "epoch": 1254} {"train_loss": -11.78116226196289, "global_step": 210753, "epoch": 1254} {"train_loss": -11.521699905395508, "global_step": 210754, "epoch": 1254} {"train_loss": -11.755619049072266, "global_step": 210755, "epoch": 1254} {"train_loss": -11.641200065612793, "global_step": 210756, "epoch": 1254} {"train_loss": -11.934122085571289, "global_step": 210757, "epoch": 1254} {"train_loss": -11.554651260375977, "global_step": 210758, "epoch": 1254} {"train_loss": -11.870621681213379, "global_step": 210759, "epoch": 1254} {"train_loss": -11.845659255981445, "global_step": 210760, "epoch": 1254} {"train_loss": -11.578697204589844, "global_step": 210761, "epoch": 1254} {"train_loss": -11.76745319366455, "global_step": 210762, "epoch": 1254} {"train_loss": -11.876995086669922, "global_step": 210763, "epoch": 1254} {"train_loss": -11.742280960083008, "global_step": 210764, "epoch": 1254} {"train_loss": -11.901994705200195, "global_step": 210765, "epoch": 1254} {"train_loss": -11.82695484161377, "global_step": 210766, "epoch": 1254} {"train_loss": -11.794317245483398, "global_step": 210767, "epoch": 1254} {"train_loss": -11.897811889648438, "global_step": 210768, "epoch": 1254} {"train_loss": -11.997230529785156, "global_step": 210769, "epoch": 1254} {"train_loss": -11.801359176635742, "global_step": 210770, "epoch": 1254} {"train_loss": -11.784872055053711, "global_step": 210771, "epoch": 1254} {"train_loss": -11.984809875488281, "global_step": 210772, "epoch": 1254} {"train_loss": -11.776405334472656, "global_step": 210773, "epoch": 1254} {"train_loss": -11.903579711914062, "global_step": 210774, "epoch": 1254} {"train_loss": -11.603708267211914, "global_step": 210775, "epoch": 1254} {"train_loss": -11.966241836547852, "global_step": 210776, "epoch": 1254} {"train_loss": -12.032329559326172, "global_step": 210777, "epoch": 1254} {"train_loss": -11.895279884338379, "global_step": 210778, "epoch": 1254} {"train_loss": -12.099408149719238, "global_step": 210779, "epoch": 1254} {"train_loss": -12.066776275634766, "global_step": 210780, "epoch": 1254} {"train_loss": -12.198728561401367, "global_step": 210781, "epoch": 1254} {"train_loss": -12.109058380126953, "global_step": 210782, "epoch": 1254} {"train_loss": -11.885205268859863, "global_step": 210783, "epoch": 1254} {"train_loss": -12.052177429199219, "global_step": 210784, "epoch": 1254} {"train_loss": -12.059412002563477, "global_step": 210785, "epoch": 1254} {"train_loss": -11.787354469299316, "global_step": 210786, "epoch": 1254} {"train_loss": -12.003628730773926, "global_step": 210787, "epoch": 1254} {"train_loss": -11.804521560668945, "global_step": 210788, "epoch": 1254} {"train_loss": -11.893732070922852, "global_step": 210789, "epoch": 1254} {"train_loss": -11.67816162109375, "global_step": 210790, "epoch": 1254} {"train_loss": -11.346657752990723, "global_step": 210791, "epoch": 1254} {"train_loss": -11.189062118530273, "global_step": 210792, "epoch": 1254} {"train_loss": -11.627080917358398, "global_step": 210793, "epoch": 1254} {"train_loss": -10.735212326049805, "global_step": 210794, "epoch": 1254} {"train_loss": -11.548094749450684, "global_step": 210795, "epoch": 1254} {"train_loss": -11.660844802856445, "global_step": 210796, "epoch": 1254} {"train_loss": -11.21835994720459, "global_step": 210797, "epoch": 1254} {"train_loss": -10.604015350341797, "global_step": 210798, "epoch": 1254} {"train_loss": -11.560969352722168, "global_step": 210799, "epoch": 1254} {"train_loss": -11.316377639770508, "global_step": 210800, "epoch": 1254} {"train_loss": -10.957657814025879, "global_step": 210801, "epoch": 1254} {"train_loss": -11.154589653015137, "global_step": 210802, "epoch": 1254} {"train_loss": -11.016651153564453, "global_step": 210803, "epoch": 1254} {"train_loss": -11.382874488830566, "global_step": 210804, "epoch": 1254} {"train_loss": -11.017646789550781, "global_step": 210805, "epoch": 1254} {"train_loss": -11.355449676513672, "global_step": 210806, "epoch": 1254} {"train_loss": -11.147909164428711, "global_step": 210807, "epoch": 1254} {"train_loss": -11.235757827758789, "global_step": 210808, "epoch": 1254} {"train_loss": -10.055517196655273, "global_step": 210809, "epoch": 1254} {"train_loss": -10.638813018798828, "global_step": 210810, "epoch": 1254} {"train_loss": -10.499624252319336, "global_step": 210811, "epoch": 1254} {"train_loss": -10.262828826904297, "global_step": 210812, "epoch": 1254} {"train_loss": -10.783735275268555, "global_step": 210813, "epoch": 1254} {"train_loss": -10.570962905883789, "global_step": 210814, "epoch": 1254} {"train_loss": -10.492609024047852, "global_step": 210815, "epoch": 1254} {"train_loss": -10.858736038208008, "global_step": 210816, "epoch": 1254} {"train_loss": -9.724333763122559, "global_step": 210817, "epoch": 1254} {"train_loss": -10.78481674194336, "global_step": 210818, "epoch": 1254} {"train_loss": -9.914064407348633, "global_step": 210819, "epoch": 1254} {"train_loss": -10.89018440246582, "global_step": 210820, "epoch": 1254} {"train_loss": -10.44918155670166, "global_step": 210821, "epoch": 1254} {"train_loss": -10.779539108276367, "global_step": 210822, "epoch": 1254} {"train_loss": -11.11393928527832, "global_step": 210823, "epoch": 1254} {"train_loss": -11.092997550964355, "global_step": 210824, "epoch": 1254} {"train_loss": -10.980367660522461, "global_step": 210825, "epoch": 1254} {"train_loss": -10.671405792236328, "global_step": 210826, "epoch": 1254} {"train_loss": -11.154326438903809, "global_step": 210827, "epoch": 1254} {"train_loss": -10.537424087524414, "global_step": 210828, "epoch": 1254} {"train_loss": -10.530977249145508, "global_step": 210829, "epoch": 1254} {"train_loss": -9.964216232299805, "global_step": 210830, "epoch": 1254} {"train_loss": -10.673632621765137, "global_step": 210831, "epoch": 1254} {"train_loss": -10.115690231323242, "global_step": 210832, "epoch": 1254} {"train_loss": -11.064571380615234, "global_step": 210833, "epoch": 1254} {"train_loss": -10.330196380615234, "global_step": 210834, "epoch": 1254} {"train_loss": -11.415285110473633, "global_step": 210835, "epoch": 1254} {"train_loss": -10.462846755981445, "global_step": 210836, "epoch": 1254} {"train_loss": -11.024856567382812, "global_step": 210837, "epoch": 1254} {"train_loss": -11.183122634887695, "global_step": 210838, "epoch": 1254} {"train_loss": -10.966149318785895, "global_step": 210839, "epoch": 1254, "val_loss": 258459.90625} {"train_loss": -10.970951080322266, "global_step": 210840, "epoch": 1255} {"train_loss": -11.22920036315918, "global_step": 210841, "epoch": 1255} {"train_loss": -11.209583282470703, "global_step": 210842, "epoch": 1255} {"train_loss": -11.220512390136719, "global_step": 210843, "epoch": 1255} {"train_loss": -11.098250389099121, "global_step": 210844, "epoch": 1255} {"train_loss": -11.330047607421875, "global_step": 210845, "epoch": 1255} {"train_loss": -11.19544792175293, "global_step": 210846, "epoch": 1255} {"train_loss": -11.274282455444336, "global_step": 210847, "epoch": 1255} {"train_loss": -11.293691635131836, "global_step": 210848, "epoch": 1255} {"train_loss": -11.391866683959961, "global_step": 210849, "epoch": 1255} {"train_loss": -11.38470458984375, "global_step": 210850, "epoch": 1255} {"train_loss": -11.41944694519043, "global_step": 210851, "epoch": 1255} {"train_loss": -11.331520080566406, "global_step": 210852, "epoch": 1255} {"train_loss": -11.296688079833984, "global_step": 210853, "epoch": 1255} {"train_loss": -11.340731620788574, "global_step": 210854, "epoch": 1255} {"train_loss": -11.505939483642578, "global_step": 210855, "epoch": 1255} {"train_loss": -11.58137321472168, "global_step": 210856, "epoch": 1255} {"train_loss": -11.251814842224121, "global_step": 210857, "epoch": 1255} {"train_loss": -11.53738784790039, "global_step": 210858, "epoch": 1255} {"train_loss": -11.655707359313965, "global_step": 210859, "epoch": 1255} {"train_loss": -11.505962371826172, "global_step": 210860, "epoch": 1255} {"train_loss": -11.59263801574707, "global_step": 210861, "epoch": 1255} {"train_loss": -11.478959083557129, "global_step": 210862, "epoch": 1255} {"train_loss": -11.516496658325195, "global_step": 210863, "epoch": 1255} {"train_loss": -11.605979919433594, "global_step": 210864, "epoch": 1255} {"train_loss": -11.600523948669434, "global_step": 210865, "epoch": 1255} {"train_loss": -11.448169708251953, "global_step": 210866, "epoch": 1255} {"train_loss": -11.586559295654297, "global_step": 210867, "epoch": 1255} {"train_loss": -11.62173843383789, "global_step": 210868, "epoch": 1255} {"train_loss": -11.528146743774414, "global_step": 210869, "epoch": 1255} {"train_loss": -11.491846084594727, "global_step": 210870, "epoch": 1255} {"train_loss": -11.751178741455078, "global_step": 210871, "epoch": 1255} {"train_loss": -11.622962951660156, "global_step": 210872, "epoch": 1255} {"train_loss": -11.796317100524902, "global_step": 210873, "epoch": 1255} {"train_loss": -11.608171463012695, "global_step": 210874, "epoch": 1255} {"train_loss": -11.813671112060547, "global_step": 210875, "epoch": 1255} {"train_loss": -11.420841217041016, "global_step": 210876, "epoch": 1255} {"train_loss": -11.579975128173828, "global_step": 210877, "epoch": 1255} {"train_loss": -11.625139236450195, "global_step": 210878, "epoch": 1255} {"train_loss": -11.609016418457031, "global_step": 210879, "epoch": 1255} {"train_loss": -11.81186294555664, "global_step": 210880, "epoch": 1255} {"train_loss": -11.61661148071289, "global_step": 210881, "epoch": 1255} {"train_loss": -11.661137580871582, "global_step": 210882, "epoch": 1255} {"train_loss": -11.75705337524414, "global_step": 210883, "epoch": 1255} {"train_loss": -11.675749778747559, "global_step": 210884, "epoch": 1255} {"train_loss": -11.819978713989258, "global_step": 210885, "epoch": 1255} {"train_loss": -11.701488494873047, "global_step": 210886, "epoch": 1255} {"train_loss": -11.526241302490234, "global_step": 210887, "epoch": 1255} {"train_loss": -11.741022109985352, "global_step": 210888, "epoch": 1255} {"train_loss": -11.840635299682617, "global_step": 210889, "epoch": 1255} {"train_loss": -11.862043380737305, "global_step": 210890, "epoch": 1255} {"train_loss": -11.992173194885254, "global_step": 210891, "epoch": 1255} {"train_loss": -11.901979446411133, "global_step": 210892, "epoch": 1255} {"train_loss": -11.886496543884277, "global_step": 210893, "epoch": 1255} {"train_loss": -11.880539894104004, "global_step": 210894, "epoch": 1255} {"train_loss": -11.882123947143555, "global_step": 210895, "epoch": 1255} {"train_loss": -11.958709716796875, "global_step": 210896, "epoch": 1255} {"train_loss": -11.884683609008789, "global_step": 210897, "epoch": 1255} {"train_loss": -11.906333923339844, "global_step": 210898, "epoch": 1255} {"train_loss": -11.780230522155762, "global_step": 210899, "epoch": 1255} {"train_loss": -11.67814826965332, "global_step": 210900, "epoch": 1255} {"train_loss": -11.504613876342773, "global_step": 210901, "epoch": 1255} {"train_loss": -11.346616744995117, "global_step": 210902, "epoch": 1255} {"train_loss": -11.378474235534668, "global_step": 210903, "epoch": 1255} {"train_loss": -11.762859344482422, "global_step": 210904, "epoch": 1255} {"train_loss": -11.151664733886719, "global_step": 210905, "epoch": 1255} {"train_loss": -11.335397720336914, "global_step": 210906, "epoch": 1255} {"train_loss": -11.307241439819336, "global_step": 210907, "epoch": 1255} {"train_loss": -11.593799591064453, "global_step": 210908, "epoch": 1255} {"train_loss": -11.644311904907227, "global_step": 210909, "epoch": 1255} {"train_loss": -11.50292682647705, "global_step": 210910, "epoch": 1255} {"train_loss": -11.334978103637695, "global_step": 210911, "epoch": 1255} {"train_loss": -11.797185897827148, "global_step": 210912, "epoch": 1255} {"train_loss": -11.614997863769531, "global_step": 210913, "epoch": 1255} {"train_loss": -11.415264129638672, "global_step": 210914, "epoch": 1255} {"train_loss": -11.535636901855469, "global_step": 210915, "epoch": 1255} {"train_loss": -11.600725173950195, "global_step": 210916, "epoch": 1255} {"train_loss": -11.520343780517578, "global_step": 210917, "epoch": 1255} {"train_loss": -11.065982818603516, "global_step": 210918, "epoch": 1255} {"train_loss": -11.616962432861328, "global_step": 210919, "epoch": 1255} {"train_loss": -10.954429626464844, "global_step": 210920, "epoch": 1255} {"train_loss": -9.651507377624512, "global_step": 210921, "epoch": 1255} {"train_loss": -10.762676239013672, "global_step": 210922, "epoch": 1255} {"train_loss": -10.738460540771484, "global_step": 210923, "epoch": 1255} {"train_loss": -9.225606918334961, "global_step": 210924, "epoch": 1255} {"train_loss": -10.55221176147461, "global_step": 210925, "epoch": 1255} {"train_loss": -7.115772724151611, "global_step": 210926, "epoch": 1255} {"train_loss": -7.6582841873168945, "global_step": 210927, "epoch": 1255} {"train_loss": -8.498077392578125, "global_step": 210928, "epoch": 1255} {"train_loss": -5.7672882080078125, "global_step": 210929, "epoch": 1255} {"train_loss": -8.744315147399902, "global_step": 210930, "epoch": 1255} {"train_loss": -6.870879173278809, "global_step": 210931, "epoch": 1255} {"train_loss": -5.736624717712402, "global_step": 210932, "epoch": 1255} {"train_loss": -10.029630661010742, "global_step": 210933, "epoch": 1255} {"train_loss": -7.4856696128845215, "global_step": 210934, "epoch": 1255} {"train_loss": -6.569728851318359, "global_step": 210935, "epoch": 1255} {"train_loss": -9.492815017700195, "global_step": 210936, "epoch": 1255} {"train_loss": -9.2432861328125, "global_step": 210937, "epoch": 1255} {"train_loss": -8.420197486877441, "global_step": 210938, "epoch": 1255} {"train_loss": -9.780180931091309, "global_step": 210939, "epoch": 1255} {"train_loss": -8.940507888793945, "global_step": 210940, "epoch": 1255} {"train_loss": -9.27387809753418, "global_step": 210941, "epoch": 1255} {"train_loss": -9.896530151367188, "global_step": 210942, "epoch": 1255} {"train_loss": -7.7110514640808105, "global_step": 210943, "epoch": 1255} {"train_loss": -7.845341205596924, "global_step": 210944, "epoch": 1255} {"train_loss": -9.245049476623535, "global_step": 210945, "epoch": 1255} {"train_loss": -8.855499267578125, "global_step": 210946, "epoch": 1255} {"train_loss": -9.446030616760254, "global_step": 210947, "epoch": 1255} {"train_loss": -9.652162551879883, "global_step": 210948, "epoch": 1255} {"train_loss": -9.175199508666992, "global_step": 210949, "epoch": 1255} {"train_loss": -10.529165267944336, "global_step": 210950, "epoch": 1255} {"train_loss": -10.033315658569336, "global_step": 210951, "epoch": 1255} {"train_loss": -10.014816284179688, "global_step": 210952, "epoch": 1255} {"train_loss": -10.821674346923828, "global_step": 210953, "epoch": 1255} {"train_loss": -10.386444091796875, "global_step": 210954, "epoch": 1255} {"train_loss": -10.048436164855957, "global_step": 210955, "epoch": 1255} {"train_loss": -10.597930908203125, "global_step": 210956, "epoch": 1255} {"train_loss": -10.386452674865723, "global_step": 210957, "epoch": 1255} {"train_loss": -10.42965030670166, "global_step": 210958, "epoch": 1255} {"train_loss": -10.670197486877441, "global_step": 210959, "epoch": 1255} {"train_loss": -10.285697937011719, "global_step": 210960, "epoch": 1255} {"train_loss": -10.586063385009766, "global_step": 210961, "epoch": 1255} {"train_loss": -10.552589416503906, "global_step": 210962, "epoch": 1255} {"train_loss": -10.535911560058594, "global_step": 210963, "epoch": 1255} {"train_loss": -10.645283699035645, "global_step": 210964, "epoch": 1255} {"train_loss": -10.962556838989258, "global_step": 210965, "epoch": 1255} {"train_loss": -10.69565486907959, "global_step": 210966, "epoch": 1255} {"train_loss": -10.763298034667969, "global_step": 210967, "epoch": 1255} {"train_loss": -10.806157112121582, "global_step": 210968, "epoch": 1255} {"train_loss": -10.931241989135742, "global_step": 210969, "epoch": 1255} {"train_loss": -10.666349411010742, "global_step": 210970, "epoch": 1255} {"train_loss": -10.740233421325684, "global_step": 210971, "epoch": 1255} {"train_loss": -10.875431060791016, "global_step": 210972, "epoch": 1255} {"train_loss": -11.096334457397461, "global_step": 210973, "epoch": 1255} {"train_loss": -10.973257064819336, "global_step": 210974, "epoch": 1255} {"train_loss": -10.939496994018555, "global_step": 210975, "epoch": 1255} {"train_loss": -11.051637649536133, "global_step": 210976, "epoch": 1255} {"train_loss": -11.07372760772705, "global_step": 210977, "epoch": 1255} {"train_loss": -11.075078010559082, "global_step": 210978, "epoch": 1255} {"train_loss": -11.101018905639648, "global_step": 210979, "epoch": 1255} {"train_loss": -11.092342376708984, "global_step": 210980, "epoch": 1255} {"train_loss": -11.219115257263184, "global_step": 210981, "epoch": 1255} {"train_loss": -11.329402923583984, "global_step": 210982, "epoch": 1255} {"train_loss": -11.273365020751953, "global_step": 210983, "epoch": 1255} {"train_loss": -11.181604385375977, "global_step": 210984, "epoch": 1255} {"train_loss": -11.193190574645996, "global_step": 210985, "epoch": 1255} {"train_loss": -11.237873077392578, "global_step": 210986, "epoch": 1255} {"train_loss": -11.271982192993164, "global_step": 210987, "epoch": 1255} {"train_loss": -11.391199111938477, "global_step": 210988, "epoch": 1255} {"train_loss": -11.344048500061035, "global_step": 210989, "epoch": 1255} {"train_loss": -11.20681381225586, "global_step": 210990, "epoch": 1255} {"train_loss": -11.181196212768555, "global_step": 210991, "epoch": 1255} {"train_loss": -11.306443214416504, "global_step": 210992, "epoch": 1255} {"train_loss": -11.286532402038574, "global_step": 210993, "epoch": 1255} {"train_loss": -11.388880729675293, "global_step": 210994, "epoch": 1255} {"train_loss": -11.31979751586914, "global_step": 210995, "epoch": 1255} {"train_loss": -11.443812370300293, "global_step": 210996, "epoch": 1255} {"train_loss": -11.351670265197754, "global_step": 210997, "epoch": 1255} {"train_loss": -11.374438285827637, "global_step": 210998, "epoch": 1255} {"train_loss": -11.503751754760742, "global_step": 210999, "epoch": 1255} {"train_loss": -11.441553115844727, "global_step": 211000, "epoch": 1255} {"train_loss": -11.551216125488281, "global_step": 211001, "epoch": 1255} {"train_loss": -11.477083206176758, "global_step": 211002, "epoch": 1255} {"train_loss": -11.634546279907227, "global_step": 211003, "epoch": 1255} {"train_loss": -11.497810363769531, "global_step": 211004, "epoch": 1255} {"train_loss": -11.440582275390625, "global_step": 211005, "epoch": 1255} {"train_loss": -11.336971282958984, "global_step": 211006, "epoch": 1255} {"train_loss": -10.865702509880066, "global_step": 211007, "epoch": 1255, "val_loss": 243176.5, "train_action_mse_error": 1.8602410554885864} {"train_loss": -11.663028717041016, "global_step": 211008, "epoch": 1256} {"train_loss": -11.653360366821289, "global_step": 211009, "epoch": 1256} {"train_loss": -11.630026817321777, "global_step": 211010, "epoch": 1256} {"train_loss": -11.603631019592285, "global_step": 211011, "epoch": 1256} {"train_loss": -11.776835441589355, "global_step": 211012, "epoch": 1256} {"train_loss": -11.72409725189209, "global_step": 211013, "epoch": 1256} {"train_loss": -11.645581245422363, "global_step": 211014, "epoch": 1256} {"train_loss": -11.451238632202148, "global_step": 211015, "epoch": 1256} {"train_loss": -11.646171569824219, "global_step": 211016, "epoch": 1256} {"train_loss": -11.670793533325195, "global_step": 211017, "epoch": 1256} {"train_loss": -11.554139137268066, "global_step": 211018, "epoch": 1256} {"train_loss": -11.57442855834961, "global_step": 211019, "epoch": 1256} {"train_loss": -11.798816680908203, "global_step": 211020, "epoch": 1256} {"train_loss": -11.635986328125, "global_step": 211021, "epoch": 1256} {"train_loss": -11.634941101074219, "global_step": 211022, "epoch": 1256} {"train_loss": -12.03177547454834, "global_step": 211023, "epoch": 1256} {"train_loss": -11.777493476867676, "global_step": 211024, "epoch": 1256} {"train_loss": -11.73782730102539, "global_step": 211025, "epoch": 1256} {"train_loss": -11.744086265563965, "global_step": 211026, "epoch": 1256} {"train_loss": -11.491070747375488, "global_step": 211027, "epoch": 1256} {"train_loss": -11.806559562683105, "global_step": 211028, "epoch": 1256} {"train_loss": -11.612405776977539, "global_step": 211029, "epoch": 1256} {"train_loss": -11.76103401184082, "global_step": 211030, "epoch": 1256} {"train_loss": -11.737648963928223, "global_step": 211031, "epoch": 1256} {"train_loss": -11.564849853515625, "global_step": 211032, "epoch": 1256} {"train_loss": -11.355100631713867, "global_step": 211033, "epoch": 1256} {"train_loss": -11.863729476928711, "global_step": 211034, "epoch": 1256} {"train_loss": -11.679338455200195, "global_step": 211035, "epoch": 1256} {"train_loss": -11.70942497253418, "global_step": 211036, "epoch": 1256} {"train_loss": -11.64690113067627, "global_step": 211037, "epoch": 1256} {"train_loss": -11.920754432678223, "global_step": 211038, "epoch": 1256} {"train_loss": -11.798054695129395, "global_step": 211039, "epoch": 1256} {"train_loss": -11.338029861450195, "global_step": 211040, "epoch": 1256} {"train_loss": -12.023077011108398, "global_step": 211041, "epoch": 1256} {"train_loss": -11.398317337036133, "global_step": 211042, "epoch": 1256} {"train_loss": -10.993879318237305, "global_step": 211043, "epoch": 1256} {"train_loss": -10.152039527893066, "global_step": 211044, "epoch": 1256} {"train_loss": -11.465269088745117, "global_step": 211045, "epoch": 1256} {"train_loss": -10.341381072998047, "global_step": 211046, "epoch": 1256} {"train_loss": -11.198099136352539, "global_step": 211047, "epoch": 1256} {"train_loss": -10.476997375488281, "global_step": 211048, "epoch": 1256} {"train_loss": -10.684839248657227, "global_step": 211049, "epoch": 1256} {"train_loss": -10.818768501281738, "global_step": 211050, "epoch": 1256} {"train_loss": -10.577857971191406, "global_step": 211051, "epoch": 1256} {"train_loss": -10.689811706542969, "global_step": 211052, "epoch": 1256} {"train_loss": -10.030266761779785, "global_step": 211053, "epoch": 1256} {"train_loss": -11.463293075561523, "global_step": 211054, "epoch": 1256} {"train_loss": -9.854349136352539, "global_step": 211055, "epoch": 1256} {"train_loss": -11.106128692626953, "global_step": 211056, "epoch": 1256} {"train_loss": -10.427549362182617, "global_step": 211057, "epoch": 1256} {"train_loss": -10.000707626342773, "global_step": 211058, "epoch": 1256} {"train_loss": -10.928364753723145, "global_step": 211059, "epoch": 1256} {"train_loss": -10.070650100708008, "global_step": 211060, "epoch": 1256} {"train_loss": -9.755843162536621, "global_step": 211061, "epoch": 1256} {"train_loss": -9.503190994262695, "global_step": 211062, "epoch": 1256} {"train_loss": -9.41458511352539, "global_step": 211063, "epoch": 1256} {"train_loss": -10.24144172668457, "global_step": 211064, "epoch": 1256} {"train_loss": -10.310003280639648, "global_step": 211065, "epoch": 1256} {"train_loss": -9.228957176208496, "global_step": 211066, "epoch": 1256} {"train_loss": -10.846292495727539, "global_step": 211067, "epoch": 1256} {"train_loss": -10.91579818725586, "global_step": 211068, "epoch": 1256} {"train_loss": -10.378046035766602, "global_step": 211069, "epoch": 1256} {"train_loss": -10.81392765045166, "global_step": 211070, "epoch": 1256} {"train_loss": -10.846954345703125, "global_step": 211071, "epoch": 1256} {"train_loss": -10.548196792602539, "global_step": 211072, "epoch": 1256} {"train_loss": -11.291177749633789, "global_step": 211073, "epoch": 1256} {"train_loss": -10.00322151184082, "global_step": 211074, "epoch": 1256} {"train_loss": -11.235319137573242, "global_step": 211075, "epoch": 1256} {"train_loss": -11.0303955078125, "global_step": 211076, "epoch": 1256} {"train_loss": -10.745101928710938, "global_step": 211077, "epoch": 1256} {"train_loss": -11.045581817626953, "global_step": 211078, "epoch": 1256} {"train_loss": -10.901596069335938, "global_step": 211079, "epoch": 1256} {"train_loss": -10.421162605285645, "global_step": 211080, "epoch": 1256} {"train_loss": -11.400808334350586, "global_step": 211081, "epoch": 1256} {"train_loss": -10.675914764404297, "global_step": 211082, "epoch": 1256} {"train_loss": -10.756354331970215, "global_step": 211083, "epoch": 1256} {"train_loss": -11.132270812988281, "global_step": 211084, "epoch": 1256} {"train_loss": -10.782443046569824, "global_step": 211085, "epoch": 1256} {"train_loss": -10.692628860473633, "global_step": 211086, "epoch": 1256} {"train_loss": -11.00609016418457, "global_step": 211087, "epoch": 1256} {"train_loss": -10.94405460357666, "global_step": 211088, "epoch": 1256} {"train_loss": -10.678293228149414, "global_step": 211089, "epoch": 1256} {"train_loss": -11.13491439819336, "global_step": 211090, "epoch": 1256} {"train_loss": -11.26779556274414, "global_step": 211091, "epoch": 1256} {"train_loss": -10.868868827819824, "global_step": 211092, "epoch": 1256} {"train_loss": -10.856919288635254, "global_step": 211093, "epoch": 1256} {"train_loss": -11.097921371459961, "global_step": 211094, "epoch": 1256} {"train_loss": -10.924774169921875, "global_step": 211095, "epoch": 1256} {"train_loss": -10.884265899658203, "global_step": 211096, "epoch": 1256} {"train_loss": -11.048851013183594, "global_step": 211097, "epoch": 1256} {"train_loss": -10.857449531555176, "global_step": 211098, "epoch": 1256} {"train_loss": -11.188247680664062, "global_step": 211099, "epoch": 1256} {"train_loss": -10.982690811157227, "global_step": 211100, "epoch": 1256} {"train_loss": -11.21603775024414, "global_step": 211101, "epoch": 1256} {"train_loss": -11.176217079162598, "global_step": 211102, "epoch": 1256} {"train_loss": -11.402969360351562, "global_step": 211103, "epoch": 1256} {"train_loss": -11.417013168334961, "global_step": 211104, "epoch": 1256} {"train_loss": -11.347213745117188, "global_step": 211105, "epoch": 1256} {"train_loss": -11.487004280090332, "global_step": 211106, "epoch": 1256} {"train_loss": -11.34248161315918, "global_step": 211107, "epoch": 1256} {"train_loss": -11.371278762817383, "global_step": 211108, "epoch": 1256} {"train_loss": -11.403802871704102, "global_step": 211109, "epoch": 1256} {"train_loss": -11.544645309448242, "global_step": 211110, "epoch": 1256} {"train_loss": -11.386486053466797, "global_step": 211111, "epoch": 1256} {"train_loss": -11.406675338745117, "global_step": 211112, "epoch": 1256} {"train_loss": -11.571698188781738, "global_step": 211113, "epoch": 1256} {"train_loss": -11.510247230529785, "global_step": 211114, "epoch": 1256} {"train_loss": -11.281190872192383, "global_step": 211115, "epoch": 1256} {"train_loss": -11.363422393798828, "global_step": 211116, "epoch": 1256} {"train_loss": -11.126115798950195, "global_step": 211117, "epoch": 1256} {"train_loss": -11.590860366821289, "global_step": 211118, "epoch": 1256} {"train_loss": -11.579391479492188, "global_step": 211119, "epoch": 1256} {"train_loss": -11.439139366149902, "global_step": 211120, "epoch": 1256} {"train_loss": -11.728694915771484, "global_step": 211121, "epoch": 1256} {"train_loss": -11.08704948425293, "global_step": 211122, "epoch": 1256} {"train_loss": -11.662604331970215, "global_step": 211123, "epoch": 1256} {"train_loss": -11.43293571472168, "global_step": 211124, "epoch": 1256} {"train_loss": -11.702888488769531, "global_step": 211125, "epoch": 1256} {"train_loss": -11.620504379272461, "global_step": 211126, "epoch": 1256} {"train_loss": -11.684368133544922, "global_step": 211127, "epoch": 1256} {"train_loss": -11.607786178588867, "global_step": 211128, "epoch": 1256} {"train_loss": -11.519437789916992, "global_step": 211129, "epoch": 1256} {"train_loss": -11.68362808227539, "global_step": 211130, "epoch": 1256} {"train_loss": -11.680144309997559, "global_step": 211131, "epoch": 1256} {"train_loss": -11.57780647277832, "global_step": 211132, "epoch": 1256} {"train_loss": -11.321227073669434, "global_step": 211133, "epoch": 1256} {"train_loss": -11.65931510925293, "global_step": 211134, "epoch": 1256} {"train_loss": -11.62592887878418, "global_step": 211135, "epoch": 1256} {"train_loss": -11.847892761230469, "global_step": 211136, "epoch": 1256} {"train_loss": -11.664830207824707, "global_step": 211137, "epoch": 1256} {"train_loss": -11.7904691696167, "global_step": 211138, "epoch": 1256} {"train_loss": -11.912233352661133, "global_step": 211139, "epoch": 1256} {"train_loss": -11.738840103149414, "global_step": 211140, "epoch": 1256} {"train_loss": -11.681699752807617, "global_step": 211141, "epoch": 1256} {"train_loss": -11.773027420043945, "global_step": 211142, "epoch": 1256} {"train_loss": -11.921941757202148, "global_step": 211143, "epoch": 1256} {"train_loss": -11.881058692932129, "global_step": 211144, "epoch": 1256} {"train_loss": -11.589803695678711, "global_step": 211145, "epoch": 1256} {"train_loss": -11.736652374267578, "global_step": 211146, "epoch": 1256} {"train_loss": -11.876543045043945, "global_step": 211147, "epoch": 1256} {"train_loss": -11.664694786071777, "global_step": 211148, "epoch": 1256} {"train_loss": -11.465067863464355, "global_step": 211149, "epoch": 1256} {"train_loss": -11.876798629760742, "global_step": 211150, "epoch": 1256} {"train_loss": -11.14928150177002, "global_step": 211151, "epoch": 1256} {"train_loss": -11.382991790771484, "global_step": 211152, "epoch": 1256} {"train_loss": -11.720645904541016, "global_step": 211153, "epoch": 1256} {"train_loss": -11.751079559326172, "global_step": 211154, "epoch": 1256} {"train_loss": -11.357425689697266, "global_step": 211155, "epoch": 1256} {"train_loss": -11.697235107421875, "global_step": 211156, "epoch": 1256} {"train_loss": -11.682706832885742, "global_step": 211157, "epoch": 1256} {"train_loss": -11.667265892028809, "global_step": 211158, "epoch": 1256} {"train_loss": -11.950447082519531, "global_step": 211159, "epoch": 1256} {"train_loss": -11.581350326538086, "global_step": 211160, "epoch": 1256} {"train_loss": -11.598016738891602, "global_step": 211161, "epoch": 1256} {"train_loss": -10.991531372070312, "global_step": 211162, "epoch": 1256} {"train_loss": -11.765661239624023, "global_step": 211163, "epoch": 1256} {"train_loss": -11.615705490112305, "global_step": 211164, "epoch": 1256} {"train_loss": -11.660383224487305, "global_step": 211165, "epoch": 1256} {"train_loss": -10.970844268798828, "global_step": 211166, "epoch": 1256} {"train_loss": -11.01175308227539, "global_step": 211167, "epoch": 1256} {"train_loss": -10.837442398071289, "global_step": 211168, "epoch": 1256} {"train_loss": -11.518427848815918, "global_step": 211169, "epoch": 1256} {"train_loss": -10.853669166564941, "global_step": 211170, "epoch": 1256} {"train_loss": -11.332428932189941, "global_step": 211171, "epoch": 1256} {"train_loss": -11.208005905151367, "global_step": 211172, "epoch": 1256} {"train_loss": -10.874000549316406, "global_step": 211173, "epoch": 1256} {"train_loss": -10.718873977661133, "global_step": 211174, "epoch": 1256} {"train_loss": -11.252807055200849, "global_step": 211175, "epoch": 1256, "val_loss": 244813.265625} {"train_loss": -10.693642616271973, "global_step": 211176, "epoch": 1257} {"train_loss": -10.66242790222168, "global_step": 211177, "epoch": 1257} {"train_loss": -11.443159103393555, "global_step": 211178, "epoch": 1257} {"train_loss": -9.968766212463379, "global_step": 211179, "epoch": 1257} {"train_loss": -11.609792709350586, "global_step": 211180, "epoch": 1257} {"train_loss": -11.214189529418945, "global_step": 211181, "epoch": 1257} {"train_loss": -11.16497802734375, "global_step": 211182, "epoch": 1257} {"train_loss": -11.304981231689453, "global_step": 211183, "epoch": 1257} {"train_loss": -11.251686096191406, "global_step": 211184, "epoch": 1257} {"train_loss": -11.415971755981445, "global_step": 211185, "epoch": 1257} {"train_loss": -11.145428657531738, "global_step": 211186, "epoch": 1257} {"train_loss": -11.367263793945312, "global_step": 211187, "epoch": 1257} {"train_loss": -11.392812728881836, "global_step": 211188, "epoch": 1257} {"train_loss": -11.64192008972168, "global_step": 211189, "epoch": 1257} {"train_loss": -11.221040725708008, "global_step": 211190, "epoch": 1257} {"train_loss": -11.37527847290039, "global_step": 211191, "epoch": 1257} {"train_loss": -11.308523178100586, "global_step": 211192, "epoch": 1257} {"train_loss": -11.48837661743164, "global_step": 211193, "epoch": 1257} {"train_loss": -11.312246322631836, "global_step": 211194, "epoch": 1257} {"train_loss": -11.258034706115723, "global_step": 211195, "epoch": 1257} {"train_loss": -11.525959014892578, "global_step": 211196, "epoch": 1257} {"train_loss": -11.223222732543945, "global_step": 211197, "epoch": 1257} {"train_loss": -11.45377254486084, "global_step": 211198, "epoch": 1257} {"train_loss": -11.581905364990234, "global_step": 211199, "epoch": 1257} {"train_loss": -11.331106185913086, "global_step": 211200, "epoch": 1257} {"train_loss": -11.30885124206543, "global_step": 211201, "epoch": 1257} {"train_loss": -11.387918472290039, "global_step": 211202, "epoch": 1257} {"train_loss": -11.603835105895996, "global_step": 211203, "epoch": 1257} {"train_loss": -11.581729888916016, "global_step": 211204, "epoch": 1257} {"train_loss": -11.395650863647461, "global_step": 211205, "epoch": 1257} {"train_loss": -11.363139152526855, "global_step": 211206, "epoch": 1257} {"train_loss": -11.682235717773438, "global_step": 211207, "epoch": 1257} {"train_loss": -11.282241821289062, "global_step": 211208, "epoch": 1257} {"train_loss": -11.629582405090332, "global_step": 211209, "epoch": 1257} {"train_loss": -11.162012100219727, "global_step": 211210, "epoch": 1257} {"train_loss": -11.674461364746094, "global_step": 211211, "epoch": 1257} {"train_loss": -11.014310836791992, "global_step": 211212, "epoch": 1257} {"train_loss": -11.257890701293945, "global_step": 211213, "epoch": 1257} {"train_loss": -11.140771865844727, "global_step": 211214, "epoch": 1257} {"train_loss": -11.107887268066406, "global_step": 211215, "epoch": 1257} {"train_loss": -10.979552268981934, "global_step": 211216, "epoch": 1257} {"train_loss": -11.537897109985352, "global_step": 211217, "epoch": 1257} {"train_loss": -11.356658935546875, "global_step": 211218, "epoch": 1257} {"train_loss": -11.411928176879883, "global_step": 211219, "epoch": 1257} {"train_loss": -11.098516464233398, "global_step": 211220, "epoch": 1257} {"train_loss": -11.42245864868164, "global_step": 211221, "epoch": 1257} {"train_loss": -11.481973648071289, "global_step": 211222, "epoch": 1257} {"train_loss": -11.258119583129883, "global_step": 211223, "epoch": 1257} {"train_loss": -11.68187141418457, "global_step": 211224, "epoch": 1257} {"train_loss": -11.271092414855957, "global_step": 211225, "epoch": 1257} {"train_loss": -11.880324363708496, "global_step": 211226, "epoch": 1257} {"train_loss": -11.443534851074219, "global_step": 211227, "epoch": 1257} {"train_loss": -11.646300315856934, "global_step": 211228, "epoch": 1257} {"train_loss": -11.521767616271973, "global_step": 211229, "epoch": 1257} {"train_loss": -11.6958646774292, "global_step": 211230, "epoch": 1257} {"train_loss": -11.425027847290039, "global_step": 211231, "epoch": 1257} {"train_loss": -11.795422554016113, "global_step": 211232, "epoch": 1257} {"train_loss": -11.583477020263672, "global_step": 211233, "epoch": 1257} {"train_loss": -11.476682662963867, "global_step": 211234, "epoch": 1257} {"train_loss": -11.637829780578613, "global_step": 211235, "epoch": 1257} {"train_loss": -11.40353012084961, "global_step": 211236, "epoch": 1257} {"train_loss": -11.261733055114746, "global_step": 211237, "epoch": 1257} {"train_loss": -11.816068649291992, "global_step": 211238, "epoch": 1257} {"train_loss": -11.468535423278809, "global_step": 211239, "epoch": 1257} {"train_loss": -11.512808799743652, "global_step": 211240, "epoch": 1257} {"train_loss": -11.450479507446289, "global_step": 211241, "epoch": 1257} {"train_loss": -11.582554817199707, "global_step": 211242, "epoch": 1257} {"train_loss": -11.49937629699707, "global_step": 211243, "epoch": 1257} {"train_loss": -11.686077117919922, "global_step": 211244, "epoch": 1257} {"train_loss": -11.541329383850098, "global_step": 211245, "epoch": 1257} {"train_loss": -11.81710433959961, "global_step": 211246, "epoch": 1257} {"train_loss": -11.610987663269043, "global_step": 211247, "epoch": 1257} {"train_loss": -11.676872253417969, "global_step": 211248, "epoch": 1257} {"train_loss": -11.867512702941895, "global_step": 211249, "epoch": 1257} {"train_loss": -11.577176094055176, "global_step": 211250, "epoch": 1257} {"train_loss": -11.889644622802734, "global_step": 211251, "epoch": 1257} {"train_loss": -11.865521430969238, "global_step": 211252, "epoch": 1257} {"train_loss": -11.820295333862305, "global_step": 211253, "epoch": 1257} {"train_loss": -11.677151679992676, "global_step": 211254, "epoch": 1257} {"train_loss": -11.659124374389648, "global_step": 211255, "epoch": 1257} {"train_loss": -11.752805709838867, "global_step": 211256, "epoch": 1257} {"train_loss": -11.550283432006836, "global_step": 211257, "epoch": 1257} {"train_loss": -11.799910545349121, "global_step": 211258, "epoch": 1257} {"train_loss": -11.776666641235352, "global_step": 211259, "epoch": 1257} {"train_loss": -11.18419075012207, "global_step": 211260, "epoch": 1257} {"train_loss": -11.663748741149902, "global_step": 211261, "epoch": 1257} {"train_loss": -11.826740264892578, "global_step": 211262, "epoch": 1257} {"train_loss": -10.682682991027832, "global_step": 211263, "epoch": 1257} {"train_loss": -11.444297790527344, "global_step": 211264, "epoch": 1257} {"train_loss": -11.34048080444336, "global_step": 211265, "epoch": 1257} {"train_loss": -9.823171615600586, "global_step": 211266, "epoch": 1257} {"train_loss": -10.183368682861328, "global_step": 211267, "epoch": 1257} {"train_loss": -11.375205993652344, "global_step": 211268, "epoch": 1257} {"train_loss": -10.016217231750488, "global_step": 211269, "epoch": 1257} {"train_loss": -10.687450408935547, "global_step": 211270, "epoch": 1257} {"train_loss": -10.828264236450195, "global_step": 211271, "epoch": 1257} {"train_loss": -9.367950439453125, "global_step": 211272, "epoch": 1257} {"train_loss": -10.10753059387207, "global_step": 211273, "epoch": 1257} {"train_loss": -9.79195499420166, "global_step": 211274, "epoch": 1257} {"train_loss": -9.543011665344238, "global_step": 211275, "epoch": 1257} {"train_loss": -9.802959442138672, "global_step": 211276, "epoch": 1257} {"train_loss": -9.482254028320312, "global_step": 211277, "epoch": 1257} {"train_loss": -8.817262649536133, "global_step": 211278, "epoch": 1257} {"train_loss": -10.834274291992188, "global_step": 211279, "epoch": 1257} {"train_loss": -9.1439208984375, "global_step": 211280, "epoch": 1257} {"train_loss": -10.721518516540527, "global_step": 211281, "epoch": 1257} {"train_loss": -9.832318305969238, "global_step": 211282, "epoch": 1257} {"train_loss": -9.689056396484375, "global_step": 211283, "epoch": 1257} {"train_loss": -10.774137496948242, "global_step": 211284, "epoch": 1257} {"train_loss": -10.473758697509766, "global_step": 211285, "epoch": 1257} {"train_loss": -9.90887451171875, "global_step": 211286, "epoch": 1257} {"train_loss": -11.168556213378906, "global_step": 211287, "epoch": 1257} {"train_loss": -10.461307525634766, "global_step": 211288, "epoch": 1257} {"train_loss": -10.591967582702637, "global_step": 211289, "epoch": 1257} {"train_loss": -11.135946273803711, "global_step": 211290, "epoch": 1257} {"train_loss": -10.15036678314209, "global_step": 211291, "epoch": 1257} {"train_loss": -10.491567611694336, "global_step": 211292, "epoch": 1257} {"train_loss": -10.806865692138672, "global_step": 211293, "epoch": 1257} {"train_loss": -10.803047180175781, "global_step": 211294, "epoch": 1257} {"train_loss": -10.565520286560059, "global_step": 211295, "epoch": 1257} {"train_loss": -11.149444580078125, "global_step": 211296, "epoch": 1257} {"train_loss": -10.598123550415039, "global_step": 211297, "epoch": 1257} {"train_loss": -10.871519088745117, "global_step": 211298, "epoch": 1257} {"train_loss": -11.211963653564453, "global_step": 211299, "epoch": 1257} {"train_loss": -11.15528678894043, "global_step": 211300, "epoch": 1257} {"train_loss": -11.097111701965332, "global_step": 211301, "epoch": 1257} {"train_loss": -11.061849594116211, "global_step": 211302, "epoch": 1257} {"train_loss": -11.183759689331055, "global_step": 211303, "epoch": 1257} {"train_loss": -10.846590995788574, "global_step": 211304, "epoch": 1257} {"train_loss": -11.394076347351074, "global_step": 211305, "epoch": 1257} {"train_loss": -10.774011611938477, "global_step": 211306, "epoch": 1257} {"train_loss": -11.035699844360352, "global_step": 211307, "epoch": 1257} {"train_loss": -11.351788520812988, "global_step": 211308, "epoch": 1257} {"train_loss": -11.190692901611328, "global_step": 211309, "epoch": 1257} {"train_loss": -11.142216682434082, "global_step": 211310, "epoch": 1257} {"train_loss": -11.110746383666992, "global_step": 211311, "epoch": 1257} {"train_loss": -11.23313045501709, "global_step": 211312, "epoch": 1257} {"train_loss": -11.17480754852295, "global_step": 211313, "epoch": 1257} {"train_loss": -11.426368713378906, "global_step": 211314, "epoch": 1257} {"train_loss": -11.100786209106445, "global_step": 211315, "epoch": 1257} {"train_loss": -11.357731819152832, "global_step": 211316, "epoch": 1257} {"train_loss": -11.3508939743042, "global_step": 211317, "epoch": 1257} {"train_loss": -11.284929275512695, "global_step": 211318, "epoch": 1257} {"train_loss": -11.356315612792969, "global_step": 211319, "epoch": 1257} {"train_loss": -11.412309646606445, "global_step": 211320, "epoch": 1257} {"train_loss": -11.555925369262695, "global_step": 211321, "epoch": 1257} {"train_loss": -11.426552772521973, "global_step": 211322, "epoch": 1257} {"train_loss": -11.605927467346191, "global_step": 211323, "epoch": 1257} {"train_loss": -11.517404556274414, "global_step": 211324, "epoch": 1257} {"train_loss": -11.549810409545898, "global_step": 211325, "epoch": 1257} {"train_loss": -11.642822265625, "global_step": 211326, "epoch": 1257} {"train_loss": -11.501165390014648, "global_step": 211327, "epoch": 1257} {"train_loss": -11.553401947021484, "global_step": 211328, "epoch": 1257} {"train_loss": -11.279041290283203, "global_step": 211329, "epoch": 1257} {"train_loss": -11.3142671585083, "global_step": 211330, "epoch": 1257} {"train_loss": -11.539892196655273, "global_step": 211331, "epoch": 1257} {"train_loss": -11.71971321105957, "global_step": 211332, "epoch": 1257} {"train_loss": -11.313596725463867, "global_step": 211333, "epoch": 1257} {"train_loss": -11.499776840209961, "global_step": 211334, "epoch": 1257} {"train_loss": -11.569472312927246, "global_step": 211335, "epoch": 1257} {"train_loss": -11.662464141845703, "global_step": 211336, "epoch": 1257} {"train_loss": -11.53321361541748, "global_step": 211337, "epoch": 1257} {"train_loss": -11.587179183959961, "global_step": 211338, "epoch": 1257} {"train_loss": -11.829230308532715, "global_step": 211339, "epoch": 1257} {"train_loss": -11.750458717346191, "global_step": 211340, "epoch": 1257} {"train_loss": -11.631195068359375, "global_step": 211341, "epoch": 1257} {"train_loss": -11.88733959197998, "global_step": 211342, "epoch": 1257} {"train_loss": -11.199874253500075, "global_step": 211343, "epoch": 1257, "val_loss": 248548.078125} {"train_loss": -11.713197708129883, "global_step": 211344, "epoch": 1258} {"train_loss": -11.60306453704834, "global_step": 211345, "epoch": 1258} {"train_loss": -11.62934398651123, "global_step": 211346, "epoch": 1258} {"train_loss": -11.645807266235352, "global_step": 211347, "epoch": 1258} {"train_loss": -11.734515190124512, "global_step": 211348, "epoch": 1258} {"train_loss": -11.844080924987793, "global_step": 211349, "epoch": 1258} {"train_loss": -11.634286880493164, "global_step": 211350, "epoch": 1258} {"train_loss": -11.842951774597168, "global_step": 211351, "epoch": 1258} {"train_loss": -11.779802322387695, "global_step": 211352, "epoch": 1258} {"train_loss": -11.735347747802734, "global_step": 211353, "epoch": 1258} {"train_loss": -11.714225769042969, "global_step": 211354, "epoch": 1258} {"train_loss": -11.621219635009766, "global_step": 211355, "epoch": 1258} {"train_loss": -11.610199928283691, "global_step": 211356, "epoch": 1258} {"train_loss": -11.490142822265625, "global_step": 211357, "epoch": 1258} {"train_loss": -10.829658508300781, "global_step": 211358, "epoch": 1258} {"train_loss": -11.691444396972656, "global_step": 211359, "epoch": 1258} {"train_loss": -11.270483016967773, "global_step": 211360, "epoch": 1258} {"train_loss": -11.593523025512695, "global_step": 211361, "epoch": 1258} {"train_loss": -11.6043119430542, "global_step": 211362, "epoch": 1258} {"train_loss": -11.322257995605469, "global_step": 211363, "epoch": 1258} {"train_loss": -11.560223579406738, "global_step": 211364, "epoch": 1258} {"train_loss": -11.595914840698242, "global_step": 211365, "epoch": 1258} {"train_loss": -11.305025100708008, "global_step": 211366, "epoch": 1258} {"train_loss": -11.847986221313477, "global_step": 211367, "epoch": 1258} {"train_loss": -11.484414100646973, "global_step": 211368, "epoch": 1258} {"train_loss": -11.47906494140625, "global_step": 211369, "epoch": 1258} {"train_loss": -11.600924491882324, "global_step": 211370, "epoch": 1258} {"train_loss": -11.39816665649414, "global_step": 211371, "epoch": 1258} {"train_loss": -11.855405807495117, "global_step": 211372, "epoch": 1258} {"train_loss": -11.668203353881836, "global_step": 211373, "epoch": 1258} {"train_loss": -11.610584259033203, "global_step": 211374, "epoch": 1258} {"train_loss": -11.759492874145508, "global_step": 211375, "epoch": 1258} {"train_loss": -11.771320343017578, "global_step": 211376, "epoch": 1258} {"train_loss": -11.68752670288086, "global_step": 211377, "epoch": 1258} {"train_loss": -11.627069473266602, "global_step": 211378, "epoch": 1258} {"train_loss": -11.958141326904297, "global_step": 211379, "epoch": 1258} {"train_loss": -11.719407081604004, "global_step": 211380, "epoch": 1258} {"train_loss": -11.576601028442383, "global_step": 211381, "epoch": 1258} {"train_loss": -11.79429817199707, "global_step": 211382, "epoch": 1258} {"train_loss": -11.604098320007324, "global_step": 211383, "epoch": 1258} {"train_loss": -11.612566947937012, "global_step": 211384, "epoch": 1258} {"train_loss": -11.591933250427246, "global_step": 211385, "epoch": 1258} {"train_loss": -11.421443939208984, "global_step": 211386, "epoch": 1258} {"train_loss": -10.995664596557617, "global_step": 211387, "epoch": 1258} {"train_loss": -11.621946334838867, "global_step": 211388, "epoch": 1258} {"train_loss": -11.586462020874023, "global_step": 211389, "epoch": 1258} {"train_loss": -11.321456909179688, "global_step": 211390, "epoch": 1258} {"train_loss": -10.720724105834961, "global_step": 211391, "epoch": 1258} {"train_loss": -11.339677810668945, "global_step": 211392, "epoch": 1258} {"train_loss": -11.519410133361816, "global_step": 211393, "epoch": 1258} {"train_loss": -10.710906982421875, "global_step": 211394, "epoch": 1258} {"train_loss": -10.768129348754883, "global_step": 211395, "epoch": 1258} {"train_loss": -10.865028381347656, "global_step": 211396, "epoch": 1258} {"train_loss": -11.309592247009277, "global_step": 211397, "epoch": 1258} {"train_loss": -10.468088150024414, "global_step": 211398, "epoch": 1258} {"train_loss": -11.308464050292969, "global_step": 211399, "epoch": 1258} {"train_loss": -11.004076957702637, "global_step": 211400, "epoch": 1258} {"train_loss": -10.681273460388184, "global_step": 211401, "epoch": 1258} {"train_loss": -10.638873100280762, "global_step": 211402, "epoch": 1258} {"train_loss": -11.6371488571167, "global_step": 211403, "epoch": 1258} {"train_loss": -10.777027130126953, "global_step": 211404, "epoch": 1258} {"train_loss": -11.433000564575195, "global_step": 211405, "epoch": 1258} {"train_loss": -10.363962173461914, "global_step": 211406, "epoch": 1258} {"train_loss": -11.107549667358398, "global_step": 211407, "epoch": 1258} {"train_loss": -10.06540298461914, "global_step": 211408, "epoch": 1258} {"train_loss": -10.577982902526855, "global_step": 211409, "epoch": 1258} {"train_loss": -11.2882080078125, "global_step": 211410, "epoch": 1258} {"train_loss": -10.8767728805542, "global_step": 211411, "epoch": 1258} {"train_loss": -11.426212310791016, "global_step": 211412, "epoch": 1258} {"train_loss": -11.227655410766602, "global_step": 211413, "epoch": 1258} {"train_loss": -11.482102394104004, "global_step": 211414, "epoch": 1258} {"train_loss": -11.414633750915527, "global_step": 211415, "epoch": 1258} {"train_loss": -11.720939636230469, "global_step": 211416, "epoch": 1258} {"train_loss": -11.30647087097168, "global_step": 211417, "epoch": 1258} {"train_loss": -11.2970552444458, "global_step": 211418, "epoch": 1258} {"train_loss": -11.483373641967773, "global_step": 211419, "epoch": 1258} {"train_loss": -11.50317096710205, "global_step": 211420, "epoch": 1258} {"train_loss": -11.644304275512695, "global_step": 211421, "epoch": 1258} {"train_loss": -11.314873695373535, "global_step": 211422, "epoch": 1258} {"train_loss": -11.253500938415527, "global_step": 211423, "epoch": 1258} {"train_loss": -11.456588745117188, "global_step": 211424, "epoch": 1258} {"train_loss": -11.23792552947998, "global_step": 211425, "epoch": 1258} {"train_loss": -11.600403785705566, "global_step": 211426, "epoch": 1258} {"train_loss": -11.184946060180664, "global_step": 211427, "epoch": 1258} {"train_loss": -11.598047256469727, "global_step": 211428, "epoch": 1258} {"train_loss": -11.36345100402832, "global_step": 211429, "epoch": 1258} {"train_loss": -11.631397247314453, "global_step": 211430, "epoch": 1258} {"train_loss": -11.464889526367188, "global_step": 211431, "epoch": 1258} {"train_loss": -11.529570579528809, "global_step": 211432, "epoch": 1258} {"train_loss": -11.410418510437012, "global_step": 211433, "epoch": 1258} {"train_loss": -11.678060531616211, "global_step": 211434, "epoch": 1258} {"train_loss": -11.157455444335938, "global_step": 211435, "epoch": 1258} {"train_loss": -11.4373140335083, "global_step": 211436, "epoch": 1258} {"train_loss": -11.464925765991211, "global_step": 211437, "epoch": 1258} {"train_loss": -11.398523330688477, "global_step": 211438, "epoch": 1258} {"train_loss": -11.75207805633545, "global_step": 211439, "epoch": 1258} {"train_loss": -11.184794425964355, "global_step": 211440, "epoch": 1258} {"train_loss": -11.615745544433594, "global_step": 211441, "epoch": 1258} {"train_loss": -11.411008834838867, "global_step": 211442, "epoch": 1258} {"train_loss": -11.68581485748291, "global_step": 211443, "epoch": 1258} {"train_loss": -11.539377212524414, "global_step": 211444, "epoch": 1258} {"train_loss": -11.540084838867188, "global_step": 211445, "epoch": 1258} {"train_loss": -11.609283447265625, "global_step": 211446, "epoch": 1258} {"train_loss": -11.620872497558594, "global_step": 211447, "epoch": 1258} {"train_loss": -11.59228801727295, "global_step": 211448, "epoch": 1258} {"train_loss": -11.70273494720459, "global_step": 211449, "epoch": 1258} {"train_loss": -11.677188873291016, "global_step": 211450, "epoch": 1258} {"train_loss": -11.406638145446777, "global_step": 211451, "epoch": 1258} {"train_loss": -11.504849433898926, "global_step": 211452, "epoch": 1258} {"train_loss": -11.694002151489258, "global_step": 211453, "epoch": 1258} {"train_loss": -11.215139389038086, "global_step": 211454, "epoch": 1258} {"train_loss": -11.807048797607422, "global_step": 211455, "epoch": 1258} {"train_loss": -11.264493942260742, "global_step": 211456, "epoch": 1258} {"train_loss": -11.603341102600098, "global_step": 211457, "epoch": 1258} {"train_loss": -11.137723922729492, "global_step": 211458, "epoch": 1258} {"train_loss": -11.607131958007812, "global_step": 211459, "epoch": 1258} {"train_loss": -11.669153213500977, "global_step": 211460, "epoch": 1258} {"train_loss": -11.47403335571289, "global_step": 211461, "epoch": 1258} {"train_loss": -11.438682556152344, "global_step": 211462, "epoch": 1258} {"train_loss": -11.499959945678711, "global_step": 211463, "epoch": 1258} {"train_loss": -11.063538551330566, "global_step": 211464, "epoch": 1258} {"train_loss": -11.4736328125, "global_step": 211465, "epoch": 1258} {"train_loss": -10.851296424865723, "global_step": 211466, "epoch": 1258} {"train_loss": -11.170868873596191, "global_step": 211467, "epoch": 1258} {"train_loss": -10.692583084106445, "global_step": 211468, "epoch": 1258} {"train_loss": -11.072097778320312, "global_step": 211469, "epoch": 1258} {"train_loss": -11.322787284851074, "global_step": 211470, "epoch": 1258} {"train_loss": -11.437524795532227, "global_step": 211471, "epoch": 1258} {"train_loss": -11.338892936706543, "global_step": 211472, "epoch": 1258} {"train_loss": -11.395666122436523, "global_step": 211473, "epoch": 1258} {"train_loss": -11.26089859008789, "global_step": 211474, "epoch": 1258} {"train_loss": -11.581798553466797, "global_step": 211475, "epoch": 1258} {"train_loss": -11.405821800231934, "global_step": 211476, "epoch": 1258} {"train_loss": -11.440607070922852, "global_step": 211477, "epoch": 1258} {"train_loss": -11.473799705505371, "global_step": 211478, "epoch": 1258} {"train_loss": -11.526834487915039, "global_step": 211479, "epoch": 1258} {"train_loss": -11.448204040527344, "global_step": 211480, "epoch": 1258} {"train_loss": -11.415567398071289, "global_step": 211481, "epoch": 1258} {"train_loss": -11.177343368530273, "global_step": 211482, "epoch": 1258} {"train_loss": -11.288774490356445, "global_step": 211483, "epoch": 1258} {"train_loss": -10.689748764038086, "global_step": 211484, "epoch": 1258} {"train_loss": -10.916082382202148, "global_step": 211485, "epoch": 1258} {"train_loss": -11.039667129516602, "global_step": 211486, "epoch": 1258} {"train_loss": -10.701896667480469, "global_step": 211487, "epoch": 1258} {"train_loss": -11.638191223144531, "global_step": 211488, "epoch": 1258} {"train_loss": -10.305516242980957, "global_step": 211489, "epoch": 1258} {"train_loss": -10.717338562011719, "global_step": 211490, "epoch": 1258} {"train_loss": -11.232080459594727, "global_step": 211491, "epoch": 1258} {"train_loss": -9.864721298217773, "global_step": 211492, "epoch": 1258} {"train_loss": -11.132434844970703, "global_step": 211493, "epoch": 1258} {"train_loss": -10.88636589050293, "global_step": 211494, "epoch": 1258} {"train_loss": -10.788455963134766, "global_step": 211495, "epoch": 1258} {"train_loss": -11.194150924682617, "global_step": 211496, "epoch": 1258} {"train_loss": -11.426639556884766, "global_step": 211497, "epoch": 1258} {"train_loss": -10.891639709472656, "global_step": 211498, "epoch": 1258} {"train_loss": -11.437142372131348, "global_step": 211499, "epoch": 1258} {"train_loss": -10.565488815307617, "global_step": 211500, "epoch": 1258} {"train_loss": -10.589730262756348, "global_step": 211501, "epoch": 1258} {"train_loss": -11.018915176391602, "global_step": 211502, "epoch": 1258} {"train_loss": -10.774949073791504, "global_step": 211503, "epoch": 1258} {"train_loss": -11.291740417480469, "global_step": 211504, "epoch": 1258} {"train_loss": -11.005573272705078, "global_step": 211505, "epoch": 1258} {"train_loss": -10.66364860534668, "global_step": 211506, "epoch": 1258} {"train_loss": -11.523921966552734, "global_step": 211507, "epoch": 1258} {"train_loss": -11.256553649902344, "global_step": 211508, "epoch": 1258} {"train_loss": -11.267696380615234, "global_step": 211509, "epoch": 1258} {"train_loss": -11.360066413879395, "global_step": 211510, "epoch": 1258} {"train_loss": -11.33775922797975, "global_step": 211511, "epoch": 1258, "val_loss": 251862.296875} {"train_loss": -11.47962474822998, "global_step": 211512, "epoch": 1259} {"train_loss": -10.99195384979248, "global_step": 211513, "epoch": 1259} {"train_loss": -11.573797225952148, "global_step": 211514, "epoch": 1259} {"train_loss": -11.538558959960938, "global_step": 211515, "epoch": 1259} {"train_loss": -11.276449203491211, "global_step": 211516, "epoch": 1259} {"train_loss": -11.224742889404297, "global_step": 211517, "epoch": 1259} {"train_loss": -11.509376525878906, "global_step": 211518, "epoch": 1259} {"train_loss": -11.534236907958984, "global_step": 211519, "epoch": 1259} {"train_loss": -11.562904357910156, "global_step": 211520, "epoch": 1259} {"train_loss": -11.384601593017578, "global_step": 211521, "epoch": 1259} {"train_loss": -11.28376579284668, "global_step": 211522, "epoch": 1259} {"train_loss": -11.425039291381836, "global_step": 211523, "epoch": 1259} {"train_loss": -11.252819061279297, "global_step": 211524, "epoch": 1259} {"train_loss": -11.636302947998047, "global_step": 211525, "epoch": 1259} {"train_loss": -11.263605117797852, "global_step": 211526, "epoch": 1259} {"train_loss": -11.610124588012695, "global_step": 211527, "epoch": 1259} {"train_loss": -11.425700187683105, "global_step": 211528, "epoch": 1259} {"train_loss": -11.3672513961792, "global_step": 211529, "epoch": 1259} {"train_loss": -11.390124320983887, "global_step": 211530, "epoch": 1259} {"train_loss": -11.405292510986328, "global_step": 211531, "epoch": 1259} {"train_loss": -11.369441986083984, "global_step": 211532, "epoch": 1259} {"train_loss": -11.5320405960083, "global_step": 211533, "epoch": 1259} {"train_loss": -11.515691757202148, "global_step": 211534, "epoch": 1259} {"train_loss": -11.494211196899414, "global_step": 211535, "epoch": 1259} {"train_loss": -11.426962852478027, "global_step": 211536, "epoch": 1259} {"train_loss": -11.56960678100586, "global_step": 211537, "epoch": 1259} {"train_loss": -11.455795288085938, "global_step": 211538, "epoch": 1259} {"train_loss": -11.61865234375, "global_step": 211539, "epoch": 1259} {"train_loss": -11.514110565185547, "global_step": 211540, "epoch": 1259} {"train_loss": -11.60816764831543, "global_step": 211541, "epoch": 1259} {"train_loss": -11.450960159301758, "global_step": 211542, "epoch": 1259} {"train_loss": -11.660597801208496, "global_step": 211543, "epoch": 1259} {"train_loss": -11.413305282592773, "global_step": 211544, "epoch": 1259} {"train_loss": -11.651777267456055, "global_step": 211545, "epoch": 1259} {"train_loss": -11.738618850708008, "global_step": 211546, "epoch": 1259} {"train_loss": -11.510272979736328, "global_step": 211547, "epoch": 1259} {"train_loss": -11.8446626663208, "global_step": 211548, "epoch": 1259} {"train_loss": -11.767196655273438, "global_step": 211549, "epoch": 1259} {"train_loss": -11.52266788482666, "global_step": 211550, "epoch": 1259} {"train_loss": -11.877660751342773, "global_step": 211551, "epoch": 1259} {"train_loss": -11.962897300720215, "global_step": 211552, "epoch": 1259} {"train_loss": -11.869306564331055, "global_step": 211553, "epoch": 1259} {"train_loss": -11.747055053710938, "global_step": 211554, "epoch": 1259} {"train_loss": -11.770557403564453, "global_step": 211555, "epoch": 1259} {"train_loss": -11.709488868713379, "global_step": 211556, "epoch": 1259} {"train_loss": -11.757844924926758, "global_step": 211557, "epoch": 1259} {"train_loss": -11.834095001220703, "global_step": 211558, "epoch": 1259} {"train_loss": -11.96345329284668, "global_step": 211559, "epoch": 1259} {"train_loss": -11.806770324707031, "global_step": 211560, "epoch": 1259} {"train_loss": -11.738749504089355, "global_step": 211561, "epoch": 1259} {"train_loss": -11.891867637634277, "global_step": 211562, "epoch": 1259} {"train_loss": -11.840187072753906, "global_step": 211563, "epoch": 1259} {"train_loss": -11.913198471069336, "global_step": 211564, "epoch": 1259} {"train_loss": -11.783604621887207, "global_step": 211565, "epoch": 1259} {"train_loss": -11.852838516235352, "global_step": 211566, "epoch": 1259} {"train_loss": -11.73829174041748, "global_step": 211567, "epoch": 1259} {"train_loss": -12.01041030883789, "global_step": 211568, "epoch": 1259} {"train_loss": -11.75125503540039, "global_step": 211569, "epoch": 1259} {"train_loss": -11.28364372253418, "global_step": 211570, "epoch": 1259} {"train_loss": -11.281320571899414, "global_step": 211571, "epoch": 1259} {"train_loss": -11.799494743347168, "global_step": 211572, "epoch": 1259} {"train_loss": -11.72711181640625, "global_step": 211573, "epoch": 1259} {"train_loss": -11.852607727050781, "global_step": 211574, "epoch": 1259} {"train_loss": -11.849119186401367, "global_step": 211575, "epoch": 1259} {"train_loss": -11.983394622802734, "global_step": 211576, "epoch": 1259} {"train_loss": -11.744462966918945, "global_step": 211577, "epoch": 1259} {"train_loss": -11.70984172821045, "global_step": 211578, "epoch": 1259} {"train_loss": -11.88311767578125, "global_step": 211579, "epoch": 1259} {"train_loss": -11.813421249389648, "global_step": 211580, "epoch": 1259} {"train_loss": -11.903827667236328, "global_step": 211581, "epoch": 1259} {"train_loss": -11.736740112304688, "global_step": 211582, "epoch": 1259} {"train_loss": -11.478292465209961, "global_step": 211583, "epoch": 1259} {"train_loss": -11.334121704101562, "global_step": 211584, "epoch": 1259} {"train_loss": -11.247404098510742, "global_step": 211585, "epoch": 1259} {"train_loss": -11.176168441772461, "global_step": 211586, "epoch": 1259} {"train_loss": -11.167015075683594, "global_step": 211587, "epoch": 1259} {"train_loss": -10.568382263183594, "global_step": 211588, "epoch": 1259} {"train_loss": -11.094523429870605, "global_step": 211589, "epoch": 1259} {"train_loss": -11.140584945678711, "global_step": 211590, "epoch": 1259} {"train_loss": -10.773453712463379, "global_step": 211591, "epoch": 1259} {"train_loss": -10.71548843383789, "global_step": 211592, "epoch": 1259} {"train_loss": -10.084051132202148, "global_step": 211593, "epoch": 1259} {"train_loss": -10.272039413452148, "global_step": 211594, "epoch": 1259} {"train_loss": -10.768508911132812, "global_step": 211595, "epoch": 1259} {"train_loss": -10.797581672668457, "global_step": 211596, "epoch": 1259} {"train_loss": -11.286686897277832, "global_step": 211597, "epoch": 1259} {"train_loss": -10.853395462036133, "global_step": 211598, "epoch": 1259} {"train_loss": -11.314994812011719, "global_step": 211599, "epoch": 1259} {"train_loss": -11.067476272583008, "global_step": 211600, "epoch": 1259} {"train_loss": -10.762049674987793, "global_step": 211601, "epoch": 1259} {"train_loss": -9.94683837890625, "global_step": 211602, "epoch": 1259} {"train_loss": -10.664896011352539, "global_step": 211603, "epoch": 1259} {"train_loss": -10.481178283691406, "global_step": 211604, "epoch": 1259} {"train_loss": -10.35310173034668, "global_step": 211605, "epoch": 1259} {"train_loss": -9.699845314025879, "global_step": 211606, "epoch": 1259} {"train_loss": -11.041555404663086, "global_step": 211607, "epoch": 1259} {"train_loss": -9.11904525756836, "global_step": 211608, "epoch": 1259} {"train_loss": -9.848281860351562, "global_step": 211609, "epoch": 1259} {"train_loss": -9.621328353881836, "global_step": 211610, "epoch": 1259} {"train_loss": -8.89009952545166, "global_step": 211611, "epoch": 1259} {"train_loss": -8.549060821533203, "global_step": 211612, "epoch": 1259} {"train_loss": -9.710808753967285, "global_step": 211613, "epoch": 1259} {"train_loss": -7.443579196929932, "global_step": 211614, "epoch": 1259} {"train_loss": -8.26106071472168, "global_step": 211615, "epoch": 1259} {"train_loss": -10.0398530960083, "global_step": 211616, "epoch": 1259} {"train_loss": -8.150146484375, "global_step": 211617, "epoch": 1259} {"train_loss": -9.367179870605469, "global_step": 211618, "epoch": 1259} {"train_loss": -8.296333312988281, "global_step": 211619, "epoch": 1259} {"train_loss": -9.566587448120117, "global_step": 211620, "epoch": 1259} {"train_loss": -9.254290580749512, "global_step": 211621, "epoch": 1259} {"train_loss": -9.293249130249023, "global_step": 211622, "epoch": 1259} {"train_loss": -10.060338020324707, "global_step": 211623, "epoch": 1259} {"train_loss": -9.424333572387695, "global_step": 211624, "epoch": 1259} {"train_loss": -9.40040397644043, "global_step": 211625, "epoch": 1259} {"train_loss": -9.317828178405762, "global_step": 211626, "epoch": 1259} {"train_loss": -9.320302963256836, "global_step": 211627, "epoch": 1259} {"train_loss": -10.072510719299316, "global_step": 211628, "epoch": 1259} {"train_loss": -9.921560287475586, "global_step": 211629, "epoch": 1259} {"train_loss": -8.956092834472656, "global_step": 211630, "epoch": 1259} {"train_loss": -10.396677017211914, "global_step": 211631, "epoch": 1259} {"train_loss": -10.127849578857422, "global_step": 211632, "epoch": 1259} {"train_loss": -10.17022705078125, "global_step": 211633, "epoch": 1259} {"train_loss": -10.669023513793945, "global_step": 211634, "epoch": 1259} {"train_loss": -10.713812828063965, "global_step": 211635, "epoch": 1259} {"train_loss": -10.427556037902832, "global_step": 211636, "epoch": 1259} {"train_loss": -10.719658851623535, "global_step": 211637, "epoch": 1259} {"train_loss": -10.755380630493164, "global_step": 211638, "epoch": 1259} {"train_loss": -10.32448959350586, "global_step": 211639, "epoch": 1259} {"train_loss": -10.494800567626953, "global_step": 211640, "epoch": 1259} {"train_loss": -10.599597930908203, "global_step": 211641, "epoch": 1259} {"train_loss": -10.629947662353516, "global_step": 211642, "epoch": 1259} {"train_loss": -10.5771484375, "global_step": 211643, "epoch": 1259} {"train_loss": -10.653726577758789, "global_step": 211644, "epoch": 1259} {"train_loss": -10.601332664489746, "global_step": 211645, "epoch": 1259} {"train_loss": -11.062871932983398, "global_step": 211646, "epoch": 1259} {"train_loss": -10.768238067626953, "global_step": 211647, "epoch": 1259} {"train_loss": -10.730476379394531, "global_step": 211648, "epoch": 1259} {"train_loss": -10.872039794921875, "global_step": 211649, "epoch": 1259} {"train_loss": -10.971473693847656, "global_step": 211650, "epoch": 1259} {"train_loss": -10.657574653625488, "global_step": 211651, "epoch": 1259} {"train_loss": -10.96579647064209, "global_step": 211652, "epoch": 1259} {"train_loss": -11.009523391723633, "global_step": 211653, "epoch": 1259} {"train_loss": -10.911874771118164, "global_step": 211654, "epoch": 1259} {"train_loss": -11.10507583618164, "global_step": 211655, "epoch": 1259} {"train_loss": -10.90401840209961, "global_step": 211656, "epoch": 1259} {"train_loss": -11.094371795654297, "global_step": 211657, "epoch": 1259} {"train_loss": -11.244405746459961, "global_step": 211658, "epoch": 1259} {"train_loss": -11.144990921020508, "global_step": 211659, "epoch": 1259} {"train_loss": -11.258417129516602, "global_step": 211660, "epoch": 1259} {"train_loss": -11.077795028686523, "global_step": 211661, "epoch": 1259} {"train_loss": -11.224678039550781, "global_step": 211662, "epoch": 1259} {"train_loss": -11.150307655334473, "global_step": 211663, "epoch": 1259} {"train_loss": -11.167113304138184, "global_step": 211664, "epoch": 1259} {"train_loss": -10.942630767822266, "global_step": 211665, "epoch": 1259} {"train_loss": -11.379341125488281, "global_step": 211666, "epoch": 1259} {"train_loss": -11.13067626953125, "global_step": 211667, "epoch": 1259} {"train_loss": -11.120841979980469, "global_step": 211668, "epoch": 1259} {"train_loss": -11.310810089111328, "global_step": 211669, "epoch": 1259} {"train_loss": -11.337054252624512, "global_step": 211670, "epoch": 1259} {"train_loss": -11.336227416992188, "global_step": 211671, "epoch": 1259} {"train_loss": -11.337574005126953, "global_step": 211672, "epoch": 1259} {"train_loss": -11.333890914916992, "global_step": 211673, "epoch": 1259} {"train_loss": -11.538933753967285, "global_step": 211674, "epoch": 1259} {"train_loss": -11.437477111816406, "global_step": 211675, "epoch": 1259} {"train_loss": -11.431489944458008, "global_step": 211676, "epoch": 1259} {"train_loss": -11.352325439453125, "global_step": 211677, "epoch": 1259} {"train_loss": -11.408429145812988, "global_step": 211678, "epoch": 1259} {"train_loss": -10.976204034828005, "global_step": 211679, "epoch": 1259, "val_loss": 255945.390625} {"train_loss": -11.546367645263672, "global_step": 211680, "epoch": 1260} {"train_loss": -11.610123634338379, "global_step": 211681, "epoch": 1260} {"train_loss": -11.479331970214844, "global_step": 211682, "epoch": 1260} {"train_loss": -11.556729316711426, "global_step": 211683, "epoch": 1260} {"train_loss": -11.535987854003906, "global_step": 211684, "epoch": 1260} {"train_loss": -11.596525192260742, "global_step": 211685, "epoch": 1260} {"train_loss": -11.603622436523438, "global_step": 211686, "epoch": 1260} {"train_loss": -11.76356315612793, "global_step": 211687, "epoch": 1260} {"train_loss": -11.581884384155273, "global_step": 211688, "epoch": 1260} {"train_loss": -11.63770866394043, "global_step": 211689, "epoch": 1260} {"train_loss": -11.677560806274414, "global_step": 211690, "epoch": 1260} {"train_loss": -11.626907348632812, "global_step": 211691, "epoch": 1260} {"train_loss": -11.776957511901855, "global_step": 211692, "epoch": 1260} {"train_loss": -11.532964706420898, "global_step": 211693, "epoch": 1260} {"train_loss": -11.642789840698242, "global_step": 211694, "epoch": 1260} {"train_loss": -11.782644271850586, "global_step": 211695, "epoch": 1260} {"train_loss": -11.614818572998047, "global_step": 211696, "epoch": 1260} {"train_loss": -11.750356674194336, "global_step": 211697, "epoch": 1260} {"train_loss": -11.861236572265625, "global_step": 211698, "epoch": 1260} {"train_loss": -11.809803009033203, "global_step": 211699, "epoch": 1260} {"train_loss": -11.858236312866211, "global_step": 211700, "epoch": 1260} {"train_loss": -11.762043952941895, "global_step": 211701, "epoch": 1260} {"train_loss": -11.863410949707031, "global_step": 211702, "epoch": 1260} {"train_loss": -11.79998779296875, "global_step": 211703, "epoch": 1260} {"train_loss": -11.770635604858398, "global_step": 211704, "epoch": 1260} {"train_loss": -11.699670791625977, "global_step": 211705, "epoch": 1260} {"train_loss": -11.958866119384766, "global_step": 211706, "epoch": 1260} {"train_loss": -11.850945472717285, "global_step": 211707, "epoch": 1260} {"train_loss": -11.839624404907227, "global_step": 211708, "epoch": 1260} {"train_loss": -11.721710205078125, "global_step": 211709, "epoch": 1260} {"train_loss": -11.69268798828125, "global_step": 211710, "epoch": 1260} {"train_loss": -11.697072982788086, "global_step": 211711, "epoch": 1260} {"train_loss": -11.395519256591797, "global_step": 211712, "epoch": 1260} {"train_loss": -11.551204681396484, "global_step": 211713, "epoch": 1260} {"train_loss": -11.8158540725708, "global_step": 211714, "epoch": 1260} {"train_loss": -11.704442977905273, "global_step": 211715, "epoch": 1260} {"train_loss": -11.508905410766602, "global_step": 211716, "epoch": 1260} {"train_loss": -11.468701362609863, "global_step": 211717, "epoch": 1260} {"train_loss": -11.703683853149414, "global_step": 211718, "epoch": 1260} {"train_loss": -11.655793190002441, "global_step": 211719, "epoch": 1260} {"train_loss": -11.62846565246582, "global_step": 211720, "epoch": 1260} {"train_loss": -11.80576229095459, "global_step": 211721, "epoch": 1260} {"train_loss": -11.394430160522461, "global_step": 211722, "epoch": 1260} {"train_loss": -11.132072448730469, "global_step": 211723, "epoch": 1260} {"train_loss": -11.614561080932617, "global_step": 211724, "epoch": 1260} {"train_loss": -11.422901153564453, "global_step": 211725, "epoch": 1260} {"train_loss": -11.125377655029297, "global_step": 211726, "epoch": 1260} {"train_loss": -11.757240295410156, "global_step": 211727, "epoch": 1260} {"train_loss": -11.402456283569336, "global_step": 211728, "epoch": 1260} {"train_loss": -10.052509307861328, "global_step": 211729, "epoch": 1260} {"train_loss": -11.609336853027344, "global_step": 211730, "epoch": 1260} {"train_loss": -11.032722473144531, "global_step": 211731, "epoch": 1260} {"train_loss": -10.477100372314453, "global_step": 211732, "epoch": 1260} {"train_loss": -10.41718864440918, "global_step": 211733, "epoch": 1260} {"train_loss": -11.602752685546875, "global_step": 211734, "epoch": 1260} {"train_loss": -10.396807670593262, "global_step": 211735, "epoch": 1260} {"train_loss": -10.711023330688477, "global_step": 211736, "epoch": 1260} {"train_loss": -10.784285545349121, "global_step": 211737, "epoch": 1260} {"train_loss": -9.875665664672852, "global_step": 211738, "epoch": 1260} {"train_loss": -11.288217544555664, "global_step": 211739, "epoch": 1260} {"train_loss": -10.506120681762695, "global_step": 211740, "epoch": 1260} {"train_loss": -10.802583694458008, "global_step": 211741, "epoch": 1260} {"train_loss": -10.934952735900879, "global_step": 211742, "epoch": 1260} {"train_loss": -11.21650218963623, "global_step": 211743, "epoch": 1260} {"train_loss": -11.258932113647461, "global_step": 211744, "epoch": 1260} {"train_loss": -11.335488319396973, "global_step": 211745, "epoch": 1260} {"train_loss": -11.134907722473145, "global_step": 211746, "epoch": 1260} {"train_loss": -11.022912979125977, "global_step": 211747, "epoch": 1260} {"train_loss": -11.174139022827148, "global_step": 211748, "epoch": 1260} {"train_loss": -11.301210403442383, "global_step": 211749, "epoch": 1260} {"train_loss": -11.638128280639648, "global_step": 211750, "epoch": 1260} {"train_loss": -11.07472038269043, "global_step": 211751, "epoch": 1260} {"train_loss": -11.70093059539795, "global_step": 211752, "epoch": 1260} {"train_loss": -11.108030319213867, "global_step": 211753, "epoch": 1260} {"train_loss": -11.513997077941895, "global_step": 211754, "epoch": 1260} {"train_loss": -11.336885452270508, "global_step": 211755, "epoch": 1260} {"train_loss": -11.261394500732422, "global_step": 211756, "epoch": 1260} {"train_loss": -11.352624893188477, "global_step": 211757, "epoch": 1260} {"train_loss": -11.457897186279297, "global_step": 211758, "epoch": 1260} {"train_loss": -11.10654354095459, "global_step": 211759, "epoch": 1260} {"train_loss": -11.412332534790039, "global_step": 211760, "epoch": 1260} {"train_loss": -11.143928527832031, "global_step": 211761, "epoch": 1260} {"train_loss": -11.391080856323242, "global_step": 211762, "epoch": 1260} {"train_loss": -11.523455619812012, "global_step": 211763, "epoch": 1260} {"train_loss": -11.424224853515625, "global_step": 211764, "epoch": 1260} {"train_loss": -11.376134872436523, "global_step": 211765, "epoch": 1260} {"train_loss": -11.308050155639648, "global_step": 211766, "epoch": 1260} {"train_loss": -11.654193878173828, "global_step": 211767, "epoch": 1260} {"train_loss": -11.393726348876953, "global_step": 211768, "epoch": 1260} {"train_loss": -11.542859077453613, "global_step": 211769, "epoch": 1260} {"train_loss": -11.47729206085205, "global_step": 211770, "epoch": 1260} {"train_loss": -11.660123825073242, "global_step": 211771, "epoch": 1260} {"train_loss": -11.628070831298828, "global_step": 211772, "epoch": 1260} {"train_loss": -11.543949127197266, "global_step": 211773, "epoch": 1260} {"train_loss": -11.274492263793945, "global_step": 211774, "epoch": 1260} {"train_loss": -11.541215896606445, "global_step": 211775, "epoch": 1260} {"train_loss": -11.565813064575195, "global_step": 211776, "epoch": 1260} {"train_loss": -11.585580825805664, "global_step": 211777, "epoch": 1260} {"train_loss": -11.397126197814941, "global_step": 211778, "epoch": 1260} {"train_loss": -11.50656795501709, "global_step": 211779, "epoch": 1260} {"train_loss": -11.633848190307617, "global_step": 211780, "epoch": 1260} {"train_loss": -11.524027824401855, "global_step": 211781, "epoch": 1260} {"train_loss": -11.534189224243164, "global_step": 211782, "epoch": 1260} {"train_loss": -11.567841529846191, "global_step": 211783, "epoch": 1260} {"train_loss": -11.638093948364258, "global_step": 211784, "epoch": 1260} {"train_loss": -11.66395378112793, "global_step": 211785, "epoch": 1260} {"train_loss": -11.54909896850586, "global_step": 211786, "epoch": 1260} {"train_loss": -11.684492111206055, "global_step": 211787, "epoch": 1260} {"train_loss": -11.821512222290039, "global_step": 211788, "epoch": 1260} {"train_loss": -11.623571395874023, "global_step": 211789, "epoch": 1260} {"train_loss": -11.689558029174805, "global_step": 211790, "epoch": 1260} {"train_loss": -11.231319427490234, "global_step": 211791, "epoch": 1260} {"train_loss": -11.836620330810547, "global_step": 211792, "epoch": 1260} {"train_loss": -11.59218978881836, "global_step": 211793, "epoch": 1260} {"train_loss": -11.822787284851074, "global_step": 211794, "epoch": 1260} {"train_loss": -11.732223510742188, "global_step": 211795, "epoch": 1260} {"train_loss": -11.84964370727539, "global_step": 211796, "epoch": 1260} {"train_loss": -11.813627243041992, "global_step": 211797, "epoch": 1260} {"train_loss": -11.537603378295898, "global_step": 211798, "epoch": 1260} {"train_loss": -11.670093536376953, "global_step": 211799, "epoch": 1260} {"train_loss": -11.910358428955078, "global_step": 211800, "epoch": 1260} {"train_loss": -11.550592422485352, "global_step": 211801, "epoch": 1260} {"train_loss": -11.909732818603516, "global_step": 211802, "epoch": 1260} {"train_loss": -11.80006217956543, "global_step": 211803, "epoch": 1260} {"train_loss": -11.608095169067383, "global_step": 211804, "epoch": 1260} {"train_loss": -11.881599426269531, "global_step": 211805, "epoch": 1260} {"train_loss": -11.492110252380371, "global_step": 211806, "epoch": 1260} {"train_loss": -11.374065399169922, "global_step": 211807, "epoch": 1260} {"train_loss": -11.47036075592041, "global_step": 211808, "epoch": 1260} {"train_loss": -11.702263832092285, "global_step": 211809, "epoch": 1260} {"train_loss": -11.243467330932617, "global_step": 211810, "epoch": 1260} {"train_loss": -11.232478141784668, "global_step": 211811, "epoch": 1260} {"train_loss": -11.093942642211914, "global_step": 211812, "epoch": 1260} {"train_loss": -11.467010498046875, "global_step": 211813, "epoch": 1260} {"train_loss": -11.40530776977539, "global_step": 211814, "epoch": 1260} {"train_loss": -11.733448028564453, "global_step": 211815, "epoch": 1260} {"train_loss": -11.670686721801758, "global_step": 211816, "epoch": 1260} {"train_loss": -11.406213760375977, "global_step": 211817, "epoch": 1260} {"train_loss": -11.360276222229004, "global_step": 211818, "epoch": 1260} {"train_loss": -10.924694061279297, "global_step": 211819, "epoch": 1260} {"train_loss": -10.84402084350586, "global_step": 211820, "epoch": 1260} {"train_loss": -11.123588562011719, "global_step": 211821, "epoch": 1260} {"train_loss": -11.885947227478027, "global_step": 211822, "epoch": 1260} {"train_loss": -10.96226692199707, "global_step": 211823, "epoch": 1260} {"train_loss": -11.399015426635742, "global_step": 211824, "epoch": 1260} {"train_loss": -11.12828254699707, "global_step": 211825, "epoch": 1260} {"train_loss": -10.77357006072998, "global_step": 211826, "epoch": 1260} {"train_loss": -11.411598205566406, "global_step": 211827, "epoch": 1260} {"train_loss": -10.843132019042969, "global_step": 211828, "epoch": 1260} {"train_loss": -10.63085651397705, "global_step": 211829, "epoch": 1260} {"train_loss": -11.285677909851074, "global_step": 211830, "epoch": 1260} {"train_loss": -11.008018493652344, "global_step": 211831, "epoch": 1260} {"train_loss": -10.74074649810791, "global_step": 211832, "epoch": 1260} {"train_loss": -11.046857833862305, "global_step": 211833, "epoch": 1260} {"train_loss": -11.357272148132324, "global_step": 211834, "epoch": 1260} {"train_loss": -10.97566032409668, "global_step": 211835, "epoch": 1260} {"train_loss": -11.314204216003418, "global_step": 211836, "epoch": 1260} {"train_loss": -10.97071361541748, "global_step": 211837, "epoch": 1260} {"train_loss": -11.143446922302246, "global_step": 211838, "epoch": 1260} {"train_loss": -11.561054229736328, "global_step": 211839, "epoch": 1260} {"train_loss": -11.317672729492188, "global_step": 211840, "epoch": 1260} {"train_loss": -11.479154586791992, "global_step": 211841, "epoch": 1260} {"train_loss": -11.398637771606445, "global_step": 211842, "epoch": 1260} {"train_loss": -11.242897987365723, "global_step": 211843, "epoch": 1260} {"train_loss": -11.47231674194336, "global_step": 211844, "epoch": 1260} {"train_loss": -10.989635467529297, "global_step": 211845, "epoch": 1260} {"train_loss": -11.35871410369873, "global_step": 211846, "epoch": 1260} {"train_loss": -11.42046316464742, "global_step": 211847, "epoch": 1260, "val_loss": 258204.34375, "train_action_mse_error": 1.7616959810256958} {"train_loss": -11.343473434448242, "global_step": 211848, "epoch": 1261} {"train_loss": -11.20618724822998, "global_step": 211849, "epoch": 1261} {"train_loss": -11.530532836914062, "global_step": 211850, "epoch": 1261} {"train_loss": -11.269603729248047, "global_step": 211851, "epoch": 1261} {"train_loss": -11.377713203430176, "global_step": 211852, "epoch": 1261} {"train_loss": -11.492107391357422, "global_step": 211853, "epoch": 1261} {"train_loss": -11.25472354888916, "global_step": 211854, "epoch": 1261} {"train_loss": -11.415975570678711, "global_step": 211855, "epoch": 1261} {"train_loss": -11.374551773071289, "global_step": 211856, "epoch": 1261} {"train_loss": -11.541635513305664, "global_step": 211857, "epoch": 1261} {"train_loss": -11.212451934814453, "global_step": 211858, "epoch": 1261} {"train_loss": -11.423700332641602, "global_step": 211859, "epoch": 1261} {"train_loss": -11.50571060180664, "global_step": 211860, "epoch": 1261} {"train_loss": -11.731998443603516, "global_step": 211861, "epoch": 1261} {"train_loss": -11.577255249023438, "global_step": 211862, "epoch": 1261} {"train_loss": -11.590038299560547, "global_step": 211863, "epoch": 1261} {"train_loss": -11.600008010864258, "global_step": 211864, "epoch": 1261} {"train_loss": -11.542683601379395, "global_step": 211865, "epoch": 1261} {"train_loss": -11.710430145263672, "global_step": 211866, "epoch": 1261} {"train_loss": -11.536773681640625, "global_step": 211867, "epoch": 1261} {"train_loss": -11.572967529296875, "global_step": 211868, "epoch": 1261} {"train_loss": -11.345549583435059, "global_step": 211869, "epoch": 1261} {"train_loss": -11.639220237731934, "global_step": 211870, "epoch": 1261} {"train_loss": -11.777591705322266, "global_step": 211871, "epoch": 1261} {"train_loss": -11.50527572631836, "global_step": 211872, "epoch": 1261} {"train_loss": -11.735785484313965, "global_step": 211873, "epoch": 1261} {"train_loss": -11.930325508117676, "global_step": 211874, "epoch": 1261} {"train_loss": -11.372913360595703, "global_step": 211875, "epoch": 1261} {"train_loss": -11.503421783447266, "global_step": 211876, "epoch": 1261} {"train_loss": -11.548789024353027, "global_step": 211877, "epoch": 1261} {"train_loss": -11.319622039794922, "global_step": 211878, "epoch": 1261} {"train_loss": -11.476367950439453, "global_step": 211879, "epoch": 1261} {"train_loss": -11.426753044128418, "global_step": 211880, "epoch": 1261} {"train_loss": -11.716836929321289, "global_step": 211881, "epoch": 1261} {"train_loss": -11.50870418548584, "global_step": 211882, "epoch": 1261} {"train_loss": -11.805526733398438, "global_step": 211883, "epoch": 1261} {"train_loss": -11.25783920288086, "global_step": 211884, "epoch": 1261} {"train_loss": -11.19943618774414, "global_step": 211885, "epoch": 1261} {"train_loss": -11.365406036376953, "global_step": 211886, "epoch": 1261} {"train_loss": -11.167828559875488, "global_step": 211887, "epoch": 1261} {"train_loss": -10.558996200561523, "global_step": 211888, "epoch": 1261} {"train_loss": -10.797454833984375, "global_step": 211889, "epoch": 1261} {"train_loss": -11.434349060058594, "global_step": 211890, "epoch": 1261} {"train_loss": -10.52501106262207, "global_step": 211891, "epoch": 1261} {"train_loss": -11.634605407714844, "global_step": 211892, "epoch": 1261} {"train_loss": -10.120210647583008, "global_step": 211893, "epoch": 1261} {"train_loss": -10.667119979858398, "global_step": 211894, "epoch": 1261} {"train_loss": -11.604578018188477, "global_step": 211895, "epoch": 1261} {"train_loss": -11.019512176513672, "global_step": 211896, "epoch": 1261} {"train_loss": -11.51015853881836, "global_step": 211897, "epoch": 1261} {"train_loss": -11.202613830566406, "global_step": 211898, "epoch": 1261} {"train_loss": -11.30168342590332, "global_step": 211899, "epoch": 1261} {"train_loss": -11.656026840209961, "global_step": 211900, "epoch": 1261} {"train_loss": -11.540163040161133, "global_step": 211901, "epoch": 1261} {"train_loss": -11.340169906616211, "global_step": 211902, "epoch": 1261} {"train_loss": -11.561883926391602, "global_step": 211903, "epoch": 1261} {"train_loss": -11.669637680053711, "global_step": 211904, "epoch": 1261} {"train_loss": -11.382110595703125, "global_step": 211905, "epoch": 1261} {"train_loss": -11.716348648071289, "global_step": 211906, "epoch": 1261} {"train_loss": -11.72882080078125, "global_step": 211907, "epoch": 1261} {"train_loss": -11.52527904510498, "global_step": 211908, "epoch": 1261} {"train_loss": -11.666191101074219, "global_step": 211909, "epoch": 1261} {"train_loss": -11.676097869873047, "global_step": 211910, "epoch": 1261} {"train_loss": -11.648374557495117, "global_step": 211911, "epoch": 1261} {"train_loss": -11.59022045135498, "global_step": 211912, "epoch": 1261} {"train_loss": -11.949726104736328, "global_step": 211913, "epoch": 1261} {"train_loss": -11.69063949584961, "global_step": 211914, "epoch": 1261} {"train_loss": -11.748422622680664, "global_step": 211915, "epoch": 1261} {"train_loss": -11.676416397094727, "global_step": 211916, "epoch": 1261} {"train_loss": -11.928974151611328, "global_step": 211917, "epoch": 1261} {"train_loss": -11.667829513549805, "global_step": 211918, "epoch": 1261} {"train_loss": -11.731179237365723, "global_step": 211919, "epoch": 1261} {"train_loss": -11.817150115966797, "global_step": 211920, "epoch": 1261} {"train_loss": -11.8997802734375, "global_step": 211921, "epoch": 1261} {"train_loss": -11.612062454223633, "global_step": 211922, "epoch": 1261} {"train_loss": -11.778525352478027, "global_step": 211923, "epoch": 1261} {"train_loss": -11.84278678894043, "global_step": 211924, "epoch": 1261} {"train_loss": -11.768097877502441, "global_step": 211925, "epoch": 1261} {"train_loss": -11.647664070129395, "global_step": 211926, "epoch": 1261} {"train_loss": -11.732275009155273, "global_step": 211927, "epoch": 1261} {"train_loss": -11.591034889221191, "global_step": 211928, "epoch": 1261} {"train_loss": -11.853272438049316, "global_step": 211929, "epoch": 1261} {"train_loss": -11.723861694335938, "global_step": 211930, "epoch": 1261} {"train_loss": -11.667760848999023, "global_step": 211931, "epoch": 1261} {"train_loss": -11.834656715393066, "global_step": 211932, "epoch": 1261} {"train_loss": -11.765806198120117, "global_step": 211933, "epoch": 1261} {"train_loss": -11.427966117858887, "global_step": 211934, "epoch": 1261} {"train_loss": -11.11931324005127, "global_step": 211935, "epoch": 1261} {"train_loss": -11.7941312789917, "global_step": 211936, "epoch": 1261} {"train_loss": -11.793431282043457, "global_step": 211937, "epoch": 1261} {"train_loss": -11.360509872436523, "global_step": 211938, "epoch": 1261} {"train_loss": -11.708534240722656, "global_step": 211939, "epoch": 1261} {"train_loss": -11.62706184387207, "global_step": 211940, "epoch": 1261} {"train_loss": -11.266907691955566, "global_step": 211941, "epoch": 1261} {"train_loss": -11.49632453918457, "global_step": 211942, "epoch": 1261} {"train_loss": -11.416040420532227, "global_step": 211943, "epoch": 1261} {"train_loss": -11.284782409667969, "global_step": 211944, "epoch": 1261} {"train_loss": -11.781876564025879, "global_step": 211945, "epoch": 1261} {"train_loss": -11.362407684326172, "global_step": 211946, "epoch": 1261} {"train_loss": -11.049043655395508, "global_step": 211947, "epoch": 1261} {"train_loss": -10.5908203125, "global_step": 211948, "epoch": 1261} {"train_loss": -11.408767700195312, "global_step": 211949, "epoch": 1261} {"train_loss": -11.451045989990234, "global_step": 211950, "epoch": 1261} {"train_loss": -10.578729629516602, "global_step": 211951, "epoch": 1261} {"train_loss": -9.128231048583984, "global_step": 211952, "epoch": 1261} {"train_loss": -10.249998092651367, "global_step": 211953, "epoch": 1261} {"train_loss": -11.529964447021484, "global_step": 211954, "epoch": 1261} {"train_loss": -9.637776374816895, "global_step": 211955, "epoch": 1261} {"train_loss": -10.735292434692383, "global_step": 211956, "epoch": 1261} {"train_loss": -11.103199005126953, "global_step": 211957, "epoch": 1261} {"train_loss": -9.76905345916748, "global_step": 211958, "epoch": 1261} {"train_loss": -11.292515754699707, "global_step": 211959, "epoch": 1261} {"train_loss": -10.084188461303711, "global_step": 211960, "epoch": 1261} {"train_loss": -10.399017333984375, "global_step": 211961, "epoch": 1261} {"train_loss": -11.23495101928711, "global_step": 211962, "epoch": 1261} {"train_loss": -10.432867050170898, "global_step": 211963, "epoch": 1261} {"train_loss": -11.475820541381836, "global_step": 211964, "epoch": 1261} {"train_loss": -11.262491226196289, "global_step": 211965, "epoch": 1261} {"train_loss": -11.25576114654541, "global_step": 211966, "epoch": 1261} {"train_loss": -11.354190826416016, "global_step": 211967, "epoch": 1261} {"train_loss": -11.319494247436523, "global_step": 211968, "epoch": 1261} {"train_loss": -11.506799697875977, "global_step": 211969, "epoch": 1261} {"train_loss": -11.097466468811035, "global_step": 211970, "epoch": 1261} {"train_loss": -11.36571216583252, "global_step": 211971, "epoch": 1261} {"train_loss": -11.458456993103027, "global_step": 211972, "epoch": 1261} {"train_loss": -11.21567153930664, "global_step": 211973, "epoch": 1261} {"train_loss": -11.353147506713867, "global_step": 211974, "epoch": 1261} {"train_loss": -10.99074935913086, "global_step": 211975, "epoch": 1261} {"train_loss": -11.43906307220459, "global_step": 211976, "epoch": 1261} {"train_loss": -10.92308521270752, "global_step": 211977, "epoch": 1261} {"train_loss": -11.349105834960938, "global_step": 211978, "epoch": 1261} {"train_loss": -11.206600189208984, "global_step": 211979, "epoch": 1261} {"train_loss": -11.203154563903809, "global_step": 211980, "epoch": 1261} {"train_loss": -11.298176765441895, "global_step": 211981, "epoch": 1261} {"train_loss": -11.534674644470215, "global_step": 211982, "epoch": 1261} {"train_loss": -11.372660636901855, "global_step": 211983, "epoch": 1261} {"train_loss": -11.434995651245117, "global_step": 211984, "epoch": 1261} {"train_loss": -11.532303810119629, "global_step": 211985, "epoch": 1261} {"train_loss": -11.587843894958496, "global_step": 211986, "epoch": 1261} {"train_loss": -11.600422859191895, "global_step": 211987, "epoch": 1261} {"train_loss": -11.499897003173828, "global_step": 211988, "epoch": 1261} {"train_loss": -11.449974060058594, "global_step": 211989, "epoch": 1261} {"train_loss": -11.6480131149292, "global_step": 211990, "epoch": 1261} {"train_loss": -11.712039947509766, "global_step": 211991, "epoch": 1261} {"train_loss": -11.657350540161133, "global_step": 211992, "epoch": 1261} {"train_loss": -11.560205459594727, "global_step": 211993, "epoch": 1261} {"train_loss": -11.353347778320312, "global_step": 211994, "epoch": 1261} {"train_loss": -11.36861515045166, "global_step": 211995, "epoch": 1261} {"train_loss": -11.441984176635742, "global_step": 211996, "epoch": 1261} {"train_loss": -11.421083450317383, "global_step": 211997, "epoch": 1261} {"train_loss": -10.991687774658203, "global_step": 211998, "epoch": 1261} {"train_loss": -11.582466125488281, "global_step": 211999, "epoch": 1261} {"train_loss": -11.424938201904297, "global_step": 212000, "epoch": 1261} {"train_loss": -11.524412155151367, "global_step": 212001, "epoch": 1261} {"train_loss": -11.363370895385742, "global_step": 212002, "epoch": 1261} {"train_loss": -11.678929328918457, "global_step": 212003, "epoch": 1261} {"train_loss": -11.558475494384766, "global_step": 212004, "epoch": 1261} {"train_loss": -11.175621032714844, "global_step": 212005, "epoch": 1261} {"train_loss": -11.501648902893066, "global_step": 212006, "epoch": 1261} {"train_loss": -11.522810935974121, "global_step": 212007, "epoch": 1261} {"train_loss": -11.540122032165527, "global_step": 212008, "epoch": 1261} {"train_loss": -11.66373062133789, "global_step": 212009, "epoch": 1261} {"train_loss": -11.52192497253418, "global_step": 212010, "epoch": 1261} {"train_loss": -11.471236228942871, "global_step": 212011, "epoch": 1261} {"train_loss": -11.541594505310059, "global_step": 212012, "epoch": 1261} {"train_loss": -11.955414772033691, "global_step": 212013, "epoch": 1261} {"train_loss": -11.7919921875, "global_step": 212014, "epoch": 1261} {"train_loss": -11.393028389839898, "global_step": 212015, "epoch": 1261, "val_loss": 256144.875} {"train_loss": -11.284215927124023, "global_step": 212016, "epoch": 1262} {"train_loss": -11.519185066223145, "global_step": 212017, "epoch": 1262} {"train_loss": -11.285011291503906, "global_step": 212018, "epoch": 1262} {"train_loss": -10.713600158691406, "global_step": 212019, "epoch": 1262} {"train_loss": -10.960992813110352, "global_step": 212020, "epoch": 1262} {"train_loss": -11.243000984191895, "global_step": 212021, "epoch": 1262} {"train_loss": -10.640816688537598, "global_step": 212022, "epoch": 1262} {"train_loss": -10.734598159790039, "global_step": 212023, "epoch": 1262} {"train_loss": -10.790290832519531, "global_step": 212024, "epoch": 1262} {"train_loss": -10.892080307006836, "global_step": 212025, "epoch": 1262} {"train_loss": -11.600946426391602, "global_step": 212026, "epoch": 1262} {"train_loss": -10.583040237426758, "global_step": 212027, "epoch": 1262} {"train_loss": -11.412766456604004, "global_step": 212028, "epoch": 1262} {"train_loss": -10.406813621520996, "global_step": 212029, "epoch": 1262} {"train_loss": -11.230016708374023, "global_step": 212030, "epoch": 1262} {"train_loss": -10.674816131591797, "global_step": 212031, "epoch": 1262} {"train_loss": -10.769387245178223, "global_step": 212032, "epoch": 1262} {"train_loss": -11.305339813232422, "global_step": 212033, "epoch": 1262} {"train_loss": -10.975756645202637, "global_step": 212034, "epoch": 1262} {"train_loss": -11.428716659545898, "global_step": 212035, "epoch": 1262} {"train_loss": -10.776655197143555, "global_step": 212036, "epoch": 1262} {"train_loss": -11.1765775680542, "global_step": 212037, "epoch": 1262} {"train_loss": -10.384590148925781, "global_step": 212038, "epoch": 1262} {"train_loss": -11.093689918518066, "global_step": 212039, "epoch": 1262} {"train_loss": -10.918234825134277, "global_step": 212040, "epoch": 1262} {"train_loss": -11.195658683776855, "global_step": 212041, "epoch": 1262} {"train_loss": -11.013734817504883, "global_step": 212042, "epoch": 1262} {"train_loss": -11.045448303222656, "global_step": 212043, "epoch": 1262} {"train_loss": -11.396636962890625, "global_step": 212044, "epoch": 1262} {"train_loss": -11.181968688964844, "global_step": 212045, "epoch": 1262} {"train_loss": -11.416656494140625, "global_step": 212046, "epoch": 1262} {"train_loss": -11.580491065979004, "global_step": 212047, "epoch": 1262} {"train_loss": -11.378263473510742, "global_step": 212048, "epoch": 1262} {"train_loss": -11.592954635620117, "global_step": 212049, "epoch": 1262} {"train_loss": -11.472943305969238, "global_step": 212050, "epoch": 1262} {"train_loss": -11.675870895385742, "global_step": 212051, "epoch": 1262} {"train_loss": -11.254425048828125, "global_step": 212052, "epoch": 1262} {"train_loss": -11.623528480529785, "global_step": 212053, "epoch": 1262} {"train_loss": -11.24205207824707, "global_step": 212054, "epoch": 1262} {"train_loss": -11.483830451965332, "global_step": 212055, "epoch": 1262} {"train_loss": -11.152399063110352, "global_step": 212056, "epoch": 1262} {"train_loss": -11.620152473449707, "global_step": 212057, "epoch": 1262} {"train_loss": -11.642581939697266, "global_step": 212058, "epoch": 1262} {"train_loss": -11.626382827758789, "global_step": 212059, "epoch": 1262} {"train_loss": -11.806266784667969, "global_step": 212060, "epoch": 1262} {"train_loss": -11.500964164733887, "global_step": 212061, "epoch": 1262} {"train_loss": -11.712026596069336, "global_step": 212062, "epoch": 1262} {"train_loss": -11.523600578308105, "global_step": 212063, "epoch": 1262} {"train_loss": -11.435935974121094, "global_step": 212064, "epoch": 1262} {"train_loss": -11.54765510559082, "global_step": 212065, "epoch": 1262} {"train_loss": -11.660991668701172, "global_step": 212066, "epoch": 1262} {"train_loss": -11.419234275817871, "global_step": 212067, "epoch": 1262} {"train_loss": -11.695064544677734, "global_step": 212068, "epoch": 1262} {"train_loss": -11.302230834960938, "global_step": 212069, "epoch": 1262} {"train_loss": -11.746047973632812, "global_step": 212070, "epoch": 1262} {"train_loss": -11.316686630249023, "global_step": 212071, "epoch": 1262} {"train_loss": -11.601449966430664, "global_step": 212072, "epoch": 1262} {"train_loss": -11.385292053222656, "global_step": 212073, "epoch": 1262} {"train_loss": -11.338748931884766, "global_step": 212074, "epoch": 1262} {"train_loss": -11.621187210083008, "global_step": 212075, "epoch": 1262} {"train_loss": -11.18511962890625, "global_step": 212076, "epoch": 1262} {"train_loss": -11.515729904174805, "global_step": 212077, "epoch": 1262} {"train_loss": -11.296609878540039, "global_step": 212078, "epoch": 1262} {"train_loss": -11.577150344848633, "global_step": 212079, "epoch": 1262} {"train_loss": -11.144848823547363, "global_step": 212080, "epoch": 1262} {"train_loss": -11.688770294189453, "global_step": 212081, "epoch": 1262} {"train_loss": -11.233793258666992, "global_step": 212082, "epoch": 1262} {"train_loss": -11.736959457397461, "global_step": 212083, "epoch": 1262} {"train_loss": -11.329061508178711, "global_step": 212084, "epoch": 1262} {"train_loss": -11.733213424682617, "global_step": 212085, "epoch": 1262} {"train_loss": -11.437385559082031, "global_step": 212086, "epoch": 1262} {"train_loss": -11.548055648803711, "global_step": 212087, "epoch": 1262} {"train_loss": -11.489542007446289, "global_step": 212088, "epoch": 1262} {"train_loss": -11.603399276733398, "global_step": 212089, "epoch": 1262} {"train_loss": -11.163257598876953, "global_step": 212090, "epoch": 1262} {"train_loss": -11.566740989685059, "global_step": 212091, "epoch": 1262} {"train_loss": -11.37654972076416, "global_step": 212092, "epoch": 1262} {"train_loss": -11.76530647277832, "global_step": 212093, "epoch": 1262} {"train_loss": -11.264842987060547, "global_step": 212094, "epoch": 1262} {"train_loss": -11.719437599182129, "global_step": 212095, "epoch": 1262} {"train_loss": -10.69050407409668, "global_step": 212096, "epoch": 1262} {"train_loss": -11.719398498535156, "global_step": 212097, "epoch": 1262} {"train_loss": -10.785787582397461, "global_step": 212098, "epoch": 1262} {"train_loss": -11.506732940673828, "global_step": 212099, "epoch": 1262} {"train_loss": -10.81578254699707, "global_step": 212100, "epoch": 1262} {"train_loss": -11.549644470214844, "global_step": 212101, "epoch": 1262} {"train_loss": -10.321006774902344, "global_step": 212102, "epoch": 1262} {"train_loss": -11.038853645324707, "global_step": 212103, "epoch": 1262} {"train_loss": -9.421730041503906, "global_step": 212104, "epoch": 1262} {"train_loss": -10.68666934967041, "global_step": 212105, "epoch": 1262} {"train_loss": -10.112728118896484, "global_step": 212106, "epoch": 1262} {"train_loss": -9.545756340026855, "global_step": 212107, "epoch": 1262} {"train_loss": -10.413854598999023, "global_step": 212108, "epoch": 1262} {"train_loss": -8.453559875488281, "global_step": 212109, "epoch": 1262} {"train_loss": -9.254069328308105, "global_step": 212110, "epoch": 1262} {"train_loss": -9.964794158935547, "global_step": 212111, "epoch": 1262} {"train_loss": -9.865202903747559, "global_step": 212112, "epoch": 1262} {"train_loss": -9.245222091674805, "global_step": 212113, "epoch": 1262} {"train_loss": -11.106778144836426, "global_step": 212114, "epoch": 1262} {"train_loss": -10.060556411743164, "global_step": 212115, "epoch": 1262} {"train_loss": -10.863420486450195, "global_step": 212116, "epoch": 1262} {"train_loss": -9.660873413085938, "global_step": 212117, "epoch": 1262} {"train_loss": -10.675344467163086, "global_step": 212118, "epoch": 1262} {"train_loss": -10.084962844848633, "global_step": 212119, "epoch": 1262} {"train_loss": -11.084091186523438, "global_step": 212120, "epoch": 1262} {"train_loss": -10.787577629089355, "global_step": 212121, "epoch": 1262} {"train_loss": -11.136001586914062, "global_step": 212122, "epoch": 1262} {"train_loss": -10.933815002441406, "global_step": 212123, "epoch": 1262} {"train_loss": -10.544866561889648, "global_step": 212124, "epoch": 1262} {"train_loss": -11.213218688964844, "global_step": 212125, "epoch": 1262} {"train_loss": -11.043451309204102, "global_step": 212126, "epoch": 1262} {"train_loss": -11.206624031066895, "global_step": 212127, "epoch": 1262} {"train_loss": -11.202798843383789, "global_step": 212128, "epoch": 1262} {"train_loss": -11.270156860351562, "global_step": 212129, "epoch": 1262} {"train_loss": -11.13491439819336, "global_step": 212130, "epoch": 1262} {"train_loss": -11.097957611083984, "global_step": 212131, "epoch": 1262} {"train_loss": -11.145576477050781, "global_step": 212132, "epoch": 1262} {"train_loss": -11.244823455810547, "global_step": 212133, "epoch": 1262} {"train_loss": -11.006590843200684, "global_step": 212134, "epoch": 1262} {"train_loss": -11.257038116455078, "global_step": 212135, "epoch": 1262} {"train_loss": -11.186605453491211, "global_step": 212136, "epoch": 1262} {"train_loss": -11.514156341552734, "global_step": 212137, "epoch": 1262} {"train_loss": -11.40001392364502, "global_step": 212138, "epoch": 1262} {"train_loss": -11.392995834350586, "global_step": 212139, "epoch": 1262} {"train_loss": -11.43327522277832, "global_step": 212140, "epoch": 1262} {"train_loss": -11.236576080322266, "global_step": 212141, "epoch": 1262} {"train_loss": -11.473618507385254, "global_step": 212142, "epoch": 1262} {"train_loss": -11.340578079223633, "global_step": 212143, "epoch": 1262} {"train_loss": -11.431680679321289, "global_step": 212144, "epoch": 1262} {"train_loss": -11.299397468566895, "global_step": 212145, "epoch": 1262} {"train_loss": -11.364465713500977, "global_step": 212146, "epoch": 1262} {"train_loss": -11.353033065795898, "global_step": 212147, "epoch": 1262} {"train_loss": -11.196810722351074, "global_step": 212148, "epoch": 1262} {"train_loss": -11.561236381530762, "global_step": 212149, "epoch": 1262} {"train_loss": -11.347552299499512, "global_step": 212150, "epoch": 1262} {"train_loss": -11.675834655761719, "global_step": 212151, "epoch": 1262} {"train_loss": -11.52880859375, "global_step": 212152, "epoch": 1262} {"train_loss": -11.558279037475586, "global_step": 212153, "epoch": 1262} {"train_loss": -11.675345420837402, "global_step": 212154, "epoch": 1262} {"train_loss": -11.556205749511719, "global_step": 212155, "epoch": 1262} {"train_loss": -11.60273551940918, "global_step": 212156, "epoch": 1262} {"train_loss": -11.71479606628418, "global_step": 212157, "epoch": 1262} {"train_loss": -11.65906810760498, "global_step": 212158, "epoch": 1262} {"train_loss": -11.724414825439453, "global_step": 212159, "epoch": 1262} {"train_loss": -11.705717086791992, "global_step": 212160, "epoch": 1262} {"train_loss": -11.746988296508789, "global_step": 212161, "epoch": 1262} {"train_loss": -11.710488319396973, "global_step": 212162, "epoch": 1262} {"train_loss": -11.82386589050293, "global_step": 212163, "epoch": 1262} {"train_loss": -11.69678020477295, "global_step": 212164, "epoch": 1262} {"train_loss": -11.656539916992188, "global_step": 212165, "epoch": 1262} {"train_loss": -11.5681734085083, "global_step": 212166, "epoch": 1262} {"train_loss": -11.631380081176758, "global_step": 212167, "epoch": 1262} {"train_loss": -11.858346939086914, "global_step": 212168, "epoch": 1262} {"train_loss": -11.487873077392578, "global_step": 212169, "epoch": 1262} {"train_loss": -11.438928604125977, "global_step": 212170, "epoch": 1262} {"train_loss": -11.64539623260498, "global_step": 212171, "epoch": 1262} {"train_loss": -11.716175079345703, "global_step": 212172, "epoch": 1262} {"train_loss": -11.687031745910645, "global_step": 212173, "epoch": 1262} {"train_loss": -11.949899673461914, "global_step": 212174, "epoch": 1262} {"train_loss": -11.722139358520508, "global_step": 212175, "epoch": 1262} {"train_loss": -11.7656831741333, "global_step": 212176, "epoch": 1262} {"train_loss": -11.797587394714355, "global_step": 212177, "epoch": 1262} {"train_loss": -11.71127986907959, "global_step": 212178, "epoch": 1262} {"train_loss": -11.647331237792969, "global_step": 212179, "epoch": 1262} {"train_loss": -11.715679168701172, "global_step": 212180, "epoch": 1262} {"train_loss": -11.674560546875, "global_step": 212181, "epoch": 1262} {"train_loss": -11.683591842651367, "global_step": 212182, "epoch": 1262} {"train_loss": -11.22700902393886, "global_step": 212183, "epoch": 1262, "val_loss": 254146.546875} {"train_loss": -11.39346694946289, "global_step": 212184, "epoch": 1263} {"train_loss": -11.797611236572266, "global_step": 212185, "epoch": 1263} {"train_loss": -11.774271965026855, "global_step": 212186, "epoch": 1263} {"train_loss": -11.346368789672852, "global_step": 212187, "epoch": 1263} {"train_loss": -11.465994834899902, "global_step": 212188, "epoch": 1263} {"train_loss": -11.72554874420166, "global_step": 212189, "epoch": 1263} {"train_loss": -11.079608917236328, "global_step": 212190, "epoch": 1263} {"train_loss": -11.234369277954102, "global_step": 212191, "epoch": 1263} {"train_loss": -11.714122772216797, "global_step": 212192, "epoch": 1263} {"train_loss": -11.06197738647461, "global_step": 212193, "epoch": 1263} {"train_loss": -11.120447158813477, "global_step": 212194, "epoch": 1263} {"train_loss": -10.268817901611328, "global_step": 212195, "epoch": 1263} {"train_loss": -11.45355224609375, "global_step": 212196, "epoch": 1263} {"train_loss": -10.224226951599121, "global_step": 212197, "epoch": 1263} {"train_loss": -11.146728515625, "global_step": 212198, "epoch": 1263} {"train_loss": -10.462886810302734, "global_step": 212199, "epoch": 1263} {"train_loss": -11.756217956542969, "global_step": 212200, "epoch": 1263} {"train_loss": -10.557119369506836, "global_step": 212201, "epoch": 1263} {"train_loss": -11.139883041381836, "global_step": 212202, "epoch": 1263} {"train_loss": -10.557939529418945, "global_step": 212203, "epoch": 1263} {"train_loss": -9.086285591125488, "global_step": 212204, "epoch": 1263} {"train_loss": -11.125455856323242, "global_step": 212205, "epoch": 1263} {"train_loss": -8.311164855957031, "global_step": 212206, "epoch": 1263} {"train_loss": -11.508179664611816, "global_step": 212207, "epoch": 1263} {"train_loss": -8.730735778808594, "global_step": 212208, "epoch": 1263} {"train_loss": -11.092254638671875, "global_step": 212209, "epoch": 1263} {"train_loss": -9.500702857971191, "global_step": 212210, "epoch": 1263} {"train_loss": -10.730098724365234, "global_step": 212211, "epoch": 1263} {"train_loss": -10.94709587097168, "global_step": 212212, "epoch": 1263} {"train_loss": -10.942440032958984, "global_step": 212213, "epoch": 1263} {"train_loss": -10.79983901977539, "global_step": 212214, "epoch": 1263} {"train_loss": -10.474611282348633, "global_step": 212215, "epoch": 1263} {"train_loss": -10.992698669433594, "global_step": 212216, "epoch": 1263} {"train_loss": -10.784730911254883, "global_step": 212217, "epoch": 1263} {"train_loss": -11.257706642150879, "global_step": 212218, "epoch": 1263} {"train_loss": -10.931510925292969, "global_step": 212219, "epoch": 1263} {"train_loss": -11.602226257324219, "global_step": 212220, "epoch": 1263} {"train_loss": -11.038712501525879, "global_step": 212221, "epoch": 1263} {"train_loss": -11.504849433898926, "global_step": 212222, "epoch": 1263} {"train_loss": -11.129652976989746, "global_step": 212223, "epoch": 1263} {"train_loss": -11.46261978149414, "global_step": 212224, "epoch": 1263} {"train_loss": -11.222338676452637, "global_step": 212225, "epoch": 1263} {"train_loss": -11.447494506835938, "global_step": 212226, "epoch": 1263} {"train_loss": -11.460966110229492, "global_step": 212227, "epoch": 1263} {"train_loss": -11.446226119995117, "global_step": 212228, "epoch": 1263} {"train_loss": -11.52641487121582, "global_step": 212229, "epoch": 1263} {"train_loss": -11.213708877563477, "global_step": 212230, "epoch": 1263} {"train_loss": -11.593931198120117, "global_step": 212231, "epoch": 1263} {"train_loss": -11.35616683959961, "global_step": 212232, "epoch": 1263} {"train_loss": -11.608409881591797, "global_step": 212233, "epoch": 1263} {"train_loss": -11.378253936767578, "global_step": 212234, "epoch": 1263} {"train_loss": -11.454801559448242, "global_step": 212235, "epoch": 1263} {"train_loss": -11.471753120422363, "global_step": 212236, "epoch": 1263} {"train_loss": -11.551365852355957, "global_step": 212237, "epoch": 1263} {"train_loss": -11.565674781799316, "global_step": 212238, "epoch": 1263} {"train_loss": -11.733583450317383, "global_step": 212239, "epoch": 1263} {"train_loss": -11.6007080078125, "global_step": 212240, "epoch": 1263} {"train_loss": -11.651535987854004, "global_step": 212241, "epoch": 1263} {"train_loss": -11.659542083740234, "global_step": 212242, "epoch": 1263} {"train_loss": -11.559425354003906, "global_step": 212243, "epoch": 1263} {"train_loss": -11.749691009521484, "global_step": 212244, "epoch": 1263} {"train_loss": -11.605827331542969, "global_step": 212245, "epoch": 1263} {"train_loss": -11.764854431152344, "global_step": 212246, "epoch": 1263} {"train_loss": -11.673942565917969, "global_step": 212247, "epoch": 1263} {"train_loss": -11.645674705505371, "global_step": 212248, "epoch": 1263} {"train_loss": -11.731040954589844, "global_step": 212249, "epoch": 1263} {"train_loss": -11.859062194824219, "global_step": 212250, "epoch": 1263} {"train_loss": -11.842662811279297, "global_step": 212251, "epoch": 1263} {"train_loss": -11.66724681854248, "global_step": 212252, "epoch": 1263} {"train_loss": -11.770834922790527, "global_step": 212253, "epoch": 1263} {"train_loss": -11.790854454040527, "global_step": 212254, "epoch": 1263} {"train_loss": -11.899042129516602, "global_step": 212255, "epoch": 1263} {"train_loss": -11.883562088012695, "global_step": 212256, "epoch": 1263} {"train_loss": -11.861562728881836, "global_step": 212257, "epoch": 1263} {"train_loss": -11.762408256530762, "global_step": 212258, "epoch": 1263} {"train_loss": -11.698789596557617, "global_step": 212259, "epoch": 1263} {"train_loss": -11.855706214904785, "global_step": 212260, "epoch": 1263} {"train_loss": -11.924328804016113, "global_step": 212261, "epoch": 1263} {"train_loss": -11.799601554870605, "global_step": 212262, "epoch": 1263} {"train_loss": -11.833271026611328, "global_step": 212263, "epoch": 1263} {"train_loss": -11.453328132629395, "global_step": 212264, "epoch": 1263} {"train_loss": -11.738883972167969, "global_step": 212265, "epoch": 1263} {"train_loss": -11.478487968444824, "global_step": 212266, "epoch": 1263} {"train_loss": -11.693885803222656, "global_step": 212267, "epoch": 1263} {"train_loss": -11.557112693786621, "global_step": 212268, "epoch": 1263} {"train_loss": -11.694223403930664, "global_step": 212269, "epoch": 1263} {"train_loss": -11.387651443481445, "global_step": 212270, "epoch": 1263} {"train_loss": -11.760055541992188, "global_step": 212271, "epoch": 1263} {"train_loss": -11.823663711547852, "global_step": 212272, "epoch": 1263} {"train_loss": -11.447541236877441, "global_step": 212273, "epoch": 1263} {"train_loss": -11.723920822143555, "global_step": 212274, "epoch": 1263} {"train_loss": -11.438093185424805, "global_step": 212275, "epoch": 1263} {"train_loss": -11.806522369384766, "global_step": 212276, "epoch": 1263} {"train_loss": -11.628870010375977, "global_step": 212277, "epoch": 1263} {"train_loss": -11.503767013549805, "global_step": 212278, "epoch": 1263} {"train_loss": -11.43138313293457, "global_step": 212279, "epoch": 1263} {"train_loss": -11.840017318725586, "global_step": 212280, "epoch": 1263} {"train_loss": -11.684946060180664, "global_step": 212281, "epoch": 1263} {"train_loss": -11.473348617553711, "global_step": 212282, "epoch": 1263} {"train_loss": -11.457468032836914, "global_step": 212283, "epoch": 1263} {"train_loss": -11.819772720336914, "global_step": 212284, "epoch": 1263} {"train_loss": -11.351253509521484, "global_step": 212285, "epoch": 1263} {"train_loss": -11.56672191619873, "global_step": 212286, "epoch": 1263} {"train_loss": -11.656826972961426, "global_step": 212287, "epoch": 1263} {"train_loss": -11.611310005187988, "global_step": 212288, "epoch": 1263} {"train_loss": -11.48214054107666, "global_step": 212289, "epoch": 1263} {"train_loss": -11.693252563476562, "global_step": 212290, "epoch": 1263} {"train_loss": -11.908469200134277, "global_step": 212291, "epoch": 1263} {"train_loss": -11.618694305419922, "global_step": 212292, "epoch": 1263} {"train_loss": -11.05329418182373, "global_step": 212293, "epoch": 1263} {"train_loss": -11.336899757385254, "global_step": 212294, "epoch": 1263} {"train_loss": -11.786406517028809, "global_step": 212295, "epoch": 1263} {"train_loss": -11.362001419067383, "global_step": 212296, "epoch": 1263} {"train_loss": -10.314423561096191, "global_step": 212297, "epoch": 1263} {"train_loss": -11.274598121643066, "global_step": 212298, "epoch": 1263} {"train_loss": -11.856142044067383, "global_step": 212299, "epoch": 1263} {"train_loss": -11.499245643615723, "global_step": 212300, "epoch": 1263} {"train_loss": -11.523581504821777, "global_step": 212301, "epoch": 1263} {"train_loss": -10.982913970947266, "global_step": 212302, "epoch": 1263} {"train_loss": -11.063882827758789, "global_step": 212303, "epoch": 1263} {"train_loss": -10.96376895904541, "global_step": 212304, "epoch": 1263} {"train_loss": -10.727808952331543, "global_step": 212305, "epoch": 1263} {"train_loss": -10.743795394897461, "global_step": 212306, "epoch": 1263} {"train_loss": -11.623668670654297, "global_step": 212307, "epoch": 1263} {"train_loss": -10.518668174743652, "global_step": 212308, "epoch": 1263} {"train_loss": -11.615238189697266, "global_step": 212309, "epoch": 1263} {"train_loss": -10.55557632446289, "global_step": 212310, "epoch": 1263} {"train_loss": -11.312057495117188, "global_step": 212311, "epoch": 1263} {"train_loss": -10.86530876159668, "global_step": 212312, "epoch": 1263} {"train_loss": -11.67834758758545, "global_step": 212313, "epoch": 1263} {"train_loss": -11.205857276916504, "global_step": 212314, "epoch": 1263} {"train_loss": -11.275257110595703, "global_step": 212315, "epoch": 1263} {"train_loss": -11.352865219116211, "global_step": 212316, "epoch": 1263} {"train_loss": -11.46338176727295, "global_step": 212317, "epoch": 1263} {"train_loss": -11.169206619262695, "global_step": 212318, "epoch": 1263} {"train_loss": -10.905738830566406, "global_step": 212319, "epoch": 1263} {"train_loss": -11.36854076385498, "global_step": 212320, "epoch": 1263} {"train_loss": -10.93687629699707, "global_step": 212321, "epoch": 1263} {"train_loss": -11.44687271118164, "global_step": 212322, "epoch": 1263} {"train_loss": -10.844175338745117, "global_step": 212323, "epoch": 1263} {"train_loss": -11.59312629699707, "global_step": 212324, "epoch": 1263} {"train_loss": -11.225751876831055, "global_step": 212325, "epoch": 1263} {"train_loss": -11.31489086151123, "global_step": 212326, "epoch": 1263} {"train_loss": -10.928893089294434, "global_step": 212327, "epoch": 1263} {"train_loss": -10.640849113464355, "global_step": 212328, "epoch": 1263} {"train_loss": -10.973272323608398, "global_step": 212329, "epoch": 1263} {"train_loss": -11.147425651550293, "global_step": 212330, "epoch": 1263} {"train_loss": -10.849502563476562, "global_step": 212331, "epoch": 1263} {"train_loss": -11.122105598449707, "global_step": 212332, "epoch": 1263} {"train_loss": -11.58210563659668, "global_step": 212333, "epoch": 1263} {"train_loss": -10.992698669433594, "global_step": 212334, "epoch": 1263} {"train_loss": -11.426899909973145, "global_step": 212335, "epoch": 1263} {"train_loss": -11.040192604064941, "global_step": 212336, "epoch": 1263} {"train_loss": -11.04704475402832, "global_step": 212337, "epoch": 1263} {"train_loss": -11.502981185913086, "global_step": 212338, "epoch": 1263} {"train_loss": -11.380846977233887, "global_step": 212339, "epoch": 1263} {"train_loss": -11.46367073059082, "global_step": 212340, "epoch": 1263} {"train_loss": -11.50698184967041, "global_step": 212341, "epoch": 1263} {"train_loss": -11.378071784973145, "global_step": 212342, "epoch": 1263} {"train_loss": -11.366918563842773, "global_step": 212343, "epoch": 1263} {"train_loss": -11.280160903930664, "global_step": 212344, "epoch": 1263} {"train_loss": -10.990839958190918, "global_step": 212345, "epoch": 1263} {"train_loss": -11.666614532470703, "global_step": 212346, "epoch": 1263} {"train_loss": -10.483489036560059, "global_step": 212347, "epoch": 1263} {"train_loss": -11.692270278930664, "global_step": 212348, "epoch": 1263} {"train_loss": -11.194032669067383, "global_step": 212349, "epoch": 1263} {"train_loss": -11.126272201538086, "global_step": 212350, "epoch": 1263} {"train_loss": -11.303768316904703, "global_step": 212351, "epoch": 1263, "val_loss": 257332.78125} {"train_loss": -11.007932662963867, "global_step": 212352, "epoch": 1264} {"train_loss": -11.57804012298584, "global_step": 212353, "epoch": 1264} {"train_loss": -11.064987182617188, "global_step": 212354, "epoch": 1264} {"train_loss": -11.358072280883789, "global_step": 212355, "epoch": 1264} {"train_loss": -11.363719940185547, "global_step": 212356, "epoch": 1264} {"train_loss": -10.165151596069336, "global_step": 212357, "epoch": 1264} {"train_loss": -11.335201263427734, "global_step": 212358, "epoch": 1264} {"train_loss": -10.279184341430664, "global_step": 212359, "epoch": 1264} {"train_loss": -10.78532600402832, "global_step": 212360, "epoch": 1264} {"train_loss": -11.015985488891602, "global_step": 212361, "epoch": 1264} {"train_loss": -10.867986679077148, "global_step": 212362, "epoch": 1264} {"train_loss": -10.877216339111328, "global_step": 212363, "epoch": 1264} {"train_loss": -11.314752578735352, "global_step": 212364, "epoch": 1264} {"train_loss": -10.853123664855957, "global_step": 212365, "epoch": 1264} {"train_loss": -10.431777954101562, "global_step": 212366, "epoch": 1264} {"train_loss": -10.987957000732422, "global_step": 212367, "epoch": 1264} {"train_loss": -10.947508811950684, "global_step": 212368, "epoch": 1264} {"train_loss": -11.091288566589355, "global_step": 212369, "epoch": 1264} {"train_loss": -11.465429306030273, "global_step": 212370, "epoch": 1264} {"train_loss": -11.028829574584961, "global_step": 212371, "epoch": 1264} {"train_loss": -11.14411735534668, "global_step": 212372, "epoch": 1264} {"train_loss": -11.148698806762695, "global_step": 212373, "epoch": 1264} {"train_loss": -11.459421157836914, "global_step": 212374, "epoch": 1264} {"train_loss": -11.380756378173828, "global_step": 212375, "epoch": 1264} {"train_loss": -11.434666633605957, "global_step": 212376, "epoch": 1264} {"train_loss": -11.47635269165039, "global_step": 212377, "epoch": 1264} {"train_loss": -11.477396011352539, "global_step": 212378, "epoch": 1264} {"train_loss": -11.069992065429688, "global_step": 212379, "epoch": 1264} {"train_loss": -11.589693069458008, "global_step": 212380, "epoch": 1264} {"train_loss": -11.471282958984375, "global_step": 212381, "epoch": 1264} {"train_loss": -11.558488845825195, "global_step": 212382, "epoch": 1264} {"train_loss": -11.385421752929688, "global_step": 212383, "epoch": 1264} {"train_loss": -11.448698043823242, "global_step": 212384, "epoch": 1264} {"train_loss": -11.299736022949219, "global_step": 212385, "epoch": 1264} {"train_loss": -11.646509170532227, "global_step": 212386, "epoch": 1264} {"train_loss": -11.423294067382812, "global_step": 212387, "epoch": 1264} {"train_loss": -11.386432647705078, "global_step": 212388, "epoch": 1264} {"train_loss": -11.777422904968262, "global_step": 212389, "epoch": 1264} {"train_loss": -11.622063636779785, "global_step": 212390, "epoch": 1264} {"train_loss": -11.46257209777832, "global_step": 212391, "epoch": 1264} {"train_loss": -11.256275177001953, "global_step": 212392, "epoch": 1264} {"train_loss": -11.544635772705078, "global_step": 212393, "epoch": 1264} {"train_loss": -11.438383102416992, "global_step": 212394, "epoch": 1264} {"train_loss": -11.786455154418945, "global_step": 212395, "epoch": 1264} {"train_loss": -11.589882850646973, "global_step": 212396, "epoch": 1264} {"train_loss": -11.760473251342773, "global_step": 212397, "epoch": 1264} {"train_loss": -11.593901634216309, "global_step": 212398, "epoch": 1264} {"train_loss": -11.653436660766602, "global_step": 212399, "epoch": 1264} {"train_loss": -11.295340538024902, "global_step": 212400, "epoch": 1264} {"train_loss": -11.570502281188965, "global_step": 212401, "epoch": 1264} {"train_loss": -11.506146430969238, "global_step": 212402, "epoch": 1264} {"train_loss": -11.450779914855957, "global_step": 212403, "epoch": 1264} {"train_loss": -11.473308563232422, "global_step": 212404, "epoch": 1264} {"train_loss": -11.42646312713623, "global_step": 212405, "epoch": 1264} {"train_loss": -11.735965728759766, "global_step": 212406, "epoch": 1264} {"train_loss": -10.63001537322998, "global_step": 212407, "epoch": 1264} {"train_loss": -11.725371360778809, "global_step": 212408, "epoch": 1264} {"train_loss": -10.89982795715332, "global_step": 212409, "epoch": 1264} {"train_loss": -11.626971244812012, "global_step": 212410, "epoch": 1264} {"train_loss": -11.112831115722656, "global_step": 212411, "epoch": 1264} {"train_loss": -11.28957748413086, "global_step": 212412, "epoch": 1264} {"train_loss": -11.705222129821777, "global_step": 212413, "epoch": 1264} {"train_loss": -11.298664093017578, "global_step": 212414, "epoch": 1264} {"train_loss": -11.782605171203613, "global_step": 212415, "epoch": 1264} {"train_loss": -11.573057174682617, "global_step": 212416, "epoch": 1264} {"train_loss": -11.508857727050781, "global_step": 212417, "epoch": 1264} {"train_loss": -11.236515045166016, "global_step": 212418, "epoch": 1264} {"train_loss": -11.445128440856934, "global_step": 212419, "epoch": 1264} {"train_loss": -11.774194717407227, "global_step": 212420, "epoch": 1264} {"train_loss": -11.386964797973633, "global_step": 212421, "epoch": 1264} {"train_loss": -11.607372283935547, "global_step": 212422, "epoch": 1264} {"train_loss": -11.80677318572998, "global_step": 212423, "epoch": 1264} {"train_loss": -11.382198333740234, "global_step": 212424, "epoch": 1264} {"train_loss": -11.772205352783203, "global_step": 212425, "epoch": 1264} {"train_loss": -11.478795051574707, "global_step": 212426, "epoch": 1264} {"train_loss": -11.535167694091797, "global_step": 212427, "epoch": 1264} {"train_loss": -11.606330871582031, "global_step": 212428, "epoch": 1264} {"train_loss": -11.809392929077148, "global_step": 212429, "epoch": 1264} {"train_loss": -11.915823936462402, "global_step": 212430, "epoch": 1264} {"train_loss": -11.618358612060547, "global_step": 212431, "epoch": 1264} {"train_loss": -11.746345520019531, "global_step": 212432, "epoch": 1264} {"train_loss": -11.535045623779297, "global_step": 212433, "epoch": 1264} {"train_loss": -11.603151321411133, "global_step": 212434, "epoch": 1264} {"train_loss": -11.437799453735352, "global_step": 212435, "epoch": 1264} {"train_loss": -11.335383415222168, "global_step": 212436, "epoch": 1264} {"train_loss": -11.087566375732422, "global_step": 212437, "epoch": 1264} {"train_loss": -11.21334457397461, "global_step": 212438, "epoch": 1264} {"train_loss": -11.331905364990234, "global_step": 212439, "epoch": 1264} {"train_loss": -10.52970027923584, "global_step": 212440, "epoch": 1264} {"train_loss": -10.86716079711914, "global_step": 212441, "epoch": 1264} {"train_loss": -11.147647857666016, "global_step": 212442, "epoch": 1264} {"train_loss": -10.757741928100586, "global_step": 212443, "epoch": 1264} {"train_loss": -11.017492294311523, "global_step": 212444, "epoch": 1264} {"train_loss": -11.055277824401855, "global_step": 212445, "epoch": 1264} {"train_loss": -11.093742370605469, "global_step": 212446, "epoch": 1264} {"train_loss": -11.440062522888184, "global_step": 212447, "epoch": 1264} {"train_loss": -11.05460262298584, "global_step": 212448, "epoch": 1264} {"train_loss": -11.433016777038574, "global_step": 212449, "epoch": 1264} {"train_loss": -11.04220962524414, "global_step": 212450, "epoch": 1264} {"train_loss": -11.32700252532959, "global_step": 212451, "epoch": 1264} {"train_loss": -10.859867095947266, "global_step": 212452, "epoch": 1264} {"train_loss": -10.684894561767578, "global_step": 212453, "epoch": 1264} {"train_loss": -10.378416061401367, "global_step": 212454, "epoch": 1264} {"train_loss": -11.380976676940918, "global_step": 212455, "epoch": 1264} {"train_loss": -9.709158897399902, "global_step": 212456, "epoch": 1264} {"train_loss": -11.309842109680176, "global_step": 212457, "epoch": 1264} {"train_loss": -10.098995208740234, "global_step": 212458, "epoch": 1264} {"train_loss": -9.997344970703125, "global_step": 212459, "epoch": 1264} {"train_loss": -10.965520858764648, "global_step": 212460, "epoch": 1264} {"train_loss": -10.532918930053711, "global_step": 212461, "epoch": 1264} {"train_loss": -9.432107925415039, "global_step": 212462, "epoch": 1264} {"train_loss": -10.411590576171875, "global_step": 212463, "epoch": 1264} {"train_loss": -10.641596794128418, "global_step": 212464, "epoch": 1264} {"train_loss": -10.679527282714844, "global_step": 212465, "epoch": 1264} {"train_loss": -10.62777328491211, "global_step": 212466, "epoch": 1264} {"train_loss": -10.354703903198242, "global_step": 212467, "epoch": 1264} {"train_loss": -11.226625442504883, "global_step": 212468, "epoch": 1264} {"train_loss": -10.532434463500977, "global_step": 212469, "epoch": 1264} {"train_loss": -11.12984848022461, "global_step": 212470, "epoch": 1264} {"train_loss": -11.157491683959961, "global_step": 212471, "epoch": 1264} {"train_loss": -10.864131927490234, "global_step": 212472, "epoch": 1264} {"train_loss": -10.919991493225098, "global_step": 212473, "epoch": 1264} {"train_loss": -11.282611846923828, "global_step": 212474, "epoch": 1264} {"train_loss": -11.074780464172363, "global_step": 212475, "epoch": 1264} {"train_loss": -11.11707878112793, "global_step": 212476, "epoch": 1264} {"train_loss": -10.876729965209961, "global_step": 212477, "epoch": 1264} {"train_loss": -11.189172744750977, "global_step": 212478, "epoch": 1264} {"train_loss": -11.243839263916016, "global_step": 212479, "epoch": 1264} {"train_loss": -11.416388511657715, "global_step": 212480, "epoch": 1264} {"train_loss": -11.396020889282227, "global_step": 212481, "epoch": 1264} {"train_loss": -11.21375560760498, "global_step": 212482, "epoch": 1264} {"train_loss": -11.311716079711914, "global_step": 212483, "epoch": 1264} {"train_loss": -11.471338272094727, "global_step": 212484, "epoch": 1264} {"train_loss": -11.257868766784668, "global_step": 212485, "epoch": 1264} {"train_loss": -11.346397399902344, "global_step": 212486, "epoch": 1264} {"train_loss": -11.410200119018555, "global_step": 212487, "epoch": 1264} {"train_loss": -11.456666946411133, "global_step": 212488, "epoch": 1264} {"train_loss": -11.475845336914062, "global_step": 212489, "epoch": 1264} {"train_loss": -11.501642227172852, "global_step": 212490, "epoch": 1264} {"train_loss": -11.507227897644043, "global_step": 212491, "epoch": 1264} {"train_loss": -11.711616516113281, "global_step": 212492, "epoch": 1264} {"train_loss": -11.64305305480957, "global_step": 212493, "epoch": 1264} {"train_loss": -11.642574310302734, "global_step": 212494, "epoch": 1264} {"train_loss": -11.754232406616211, "global_step": 212495, "epoch": 1264} {"train_loss": -11.513439178466797, "global_step": 212496, "epoch": 1264} {"train_loss": -11.546422958374023, "global_step": 212497, "epoch": 1264} {"train_loss": -11.597066879272461, "global_step": 212498, "epoch": 1264} {"train_loss": -11.61024284362793, "global_step": 212499, "epoch": 1264} {"train_loss": -11.81030559539795, "global_step": 212500, "epoch": 1264} {"train_loss": -11.786081314086914, "global_step": 212501, "epoch": 1264} {"train_loss": -11.604188919067383, "global_step": 212502, "epoch": 1264} {"train_loss": -11.782751083374023, "global_step": 212503, "epoch": 1264} {"train_loss": -11.773347854614258, "global_step": 212504, "epoch": 1264} {"train_loss": -11.564047813415527, "global_step": 212505, "epoch": 1264} {"train_loss": -11.637639999389648, "global_step": 212506, "epoch": 1264} {"train_loss": -11.714508056640625, "global_step": 212507, "epoch": 1264} {"train_loss": -11.695632934570312, "global_step": 212508, "epoch": 1264} {"train_loss": -11.798803329467773, "global_step": 212509, "epoch": 1264} {"train_loss": -11.5287504196167, "global_step": 212510, "epoch": 1264} {"train_loss": -11.764955520629883, "global_step": 212511, "epoch": 1264} {"train_loss": -11.806230545043945, "global_step": 212512, "epoch": 1264} {"train_loss": -11.520190238952637, "global_step": 212513, "epoch": 1264} {"train_loss": -11.931451797485352, "global_step": 212514, "epoch": 1264} {"train_loss": -11.449840545654297, "global_step": 212515, "epoch": 1264} {"train_loss": -11.974164962768555, "global_step": 212516, "epoch": 1264} {"train_loss": -11.641304016113281, "global_step": 212517, "epoch": 1264} {"train_loss": -11.512567520141602, "global_step": 212518, "epoch": 1264} {"train_loss": -11.295184589567638, "global_step": 212519, "epoch": 1264, "val_loss": 256981.15625} {"train_loss": -11.556774139404297, "global_step": 212520, "epoch": 1265} {"train_loss": -11.372184753417969, "global_step": 212521, "epoch": 1265} {"train_loss": -11.032846450805664, "global_step": 212522, "epoch": 1265} {"train_loss": -10.34134578704834, "global_step": 212523, "epoch": 1265} {"train_loss": -11.537484169006348, "global_step": 212524, "epoch": 1265} {"train_loss": -10.401201248168945, "global_step": 212525, "epoch": 1265} {"train_loss": -11.127848625183105, "global_step": 212526, "epoch": 1265} {"train_loss": -10.51287841796875, "global_step": 212527, "epoch": 1265} {"train_loss": -10.855224609375, "global_step": 212528, "epoch": 1265} {"train_loss": -10.747882843017578, "global_step": 212529, "epoch": 1265} {"train_loss": -10.593456268310547, "global_step": 212530, "epoch": 1265} {"train_loss": -10.694294929504395, "global_step": 212531, "epoch": 1265} {"train_loss": -9.700075149536133, "global_step": 212532, "epoch": 1265} {"train_loss": -9.671796798706055, "global_step": 212533, "epoch": 1265} {"train_loss": -10.818510055541992, "global_step": 212534, "epoch": 1265} {"train_loss": -9.850212097167969, "global_step": 212535, "epoch": 1265} {"train_loss": -11.606057167053223, "global_step": 212536, "epoch": 1265} {"train_loss": -10.424735069274902, "global_step": 212537, "epoch": 1265} {"train_loss": -11.109779357910156, "global_step": 212538, "epoch": 1265} {"train_loss": -11.106622695922852, "global_step": 212539, "epoch": 1265} {"train_loss": -10.998034477233887, "global_step": 212540, "epoch": 1265} {"train_loss": -11.40237045288086, "global_step": 212541, "epoch": 1265} {"train_loss": -11.011737823486328, "global_step": 212542, "epoch": 1265} {"train_loss": -11.340668678283691, "global_step": 212543, "epoch": 1265} {"train_loss": -11.028045654296875, "global_step": 212544, "epoch": 1265} {"train_loss": -11.191496849060059, "global_step": 212545, "epoch": 1265} {"train_loss": -11.431546211242676, "global_step": 212546, "epoch": 1265} {"train_loss": -11.381512641906738, "global_step": 212547, "epoch": 1265} {"train_loss": -11.61532974243164, "global_step": 212548, "epoch": 1265} {"train_loss": -11.416227340698242, "global_step": 212549, "epoch": 1265} {"train_loss": -11.527460098266602, "global_step": 212550, "epoch": 1265} {"train_loss": -11.490548133850098, "global_step": 212551, "epoch": 1265} {"train_loss": -11.439231872558594, "global_step": 212552, "epoch": 1265} {"train_loss": -11.724021911621094, "global_step": 212553, "epoch": 1265} {"train_loss": -11.484291076660156, "global_step": 212554, "epoch": 1265} {"train_loss": -11.394678115844727, "global_step": 212555, "epoch": 1265} {"train_loss": -11.581708908081055, "global_step": 212556, "epoch": 1265} {"train_loss": -11.147834777832031, "global_step": 212557, "epoch": 1265} {"train_loss": -11.64718246459961, "global_step": 212558, "epoch": 1265} {"train_loss": -11.390214920043945, "global_step": 212559, "epoch": 1265} {"train_loss": -11.364225387573242, "global_step": 212560, "epoch": 1265} {"train_loss": -11.278339385986328, "global_step": 212561, "epoch": 1265} {"train_loss": -11.348012924194336, "global_step": 212562, "epoch": 1265} {"train_loss": -11.435757637023926, "global_step": 212563, "epoch": 1265} {"train_loss": -10.865827560424805, "global_step": 212564, "epoch": 1265} {"train_loss": -11.686628341674805, "global_step": 212565, "epoch": 1265} {"train_loss": -11.083711624145508, "global_step": 212566, "epoch": 1265} {"train_loss": -11.565138816833496, "global_step": 212567, "epoch": 1265} {"train_loss": -11.026046752929688, "global_step": 212568, "epoch": 1265} {"train_loss": -11.684991836547852, "global_step": 212569, "epoch": 1265} {"train_loss": -11.299280166625977, "global_step": 212570, "epoch": 1265} {"train_loss": -11.79510498046875, "global_step": 212571, "epoch": 1265} {"train_loss": -11.599752426147461, "global_step": 212572, "epoch": 1265} {"train_loss": -11.591196060180664, "global_step": 212573, "epoch": 1265} {"train_loss": -11.506736755371094, "global_step": 212574, "epoch": 1265} {"train_loss": -11.642189025878906, "global_step": 212575, "epoch": 1265} {"train_loss": -11.681768417358398, "global_step": 212576, "epoch": 1265} {"train_loss": -11.654574394226074, "global_step": 212577, "epoch": 1265} {"train_loss": -11.855295181274414, "global_step": 212578, "epoch": 1265} {"train_loss": -11.803237915039062, "global_step": 212579, "epoch": 1265} {"train_loss": -11.744540214538574, "global_step": 212580, "epoch": 1265} {"train_loss": -11.775016784667969, "global_step": 212581, "epoch": 1265} {"train_loss": -11.54531478881836, "global_step": 212582, "epoch": 1265} {"train_loss": -11.905656814575195, "global_step": 212583, "epoch": 1265} {"train_loss": -11.647157669067383, "global_step": 212584, "epoch": 1265} {"train_loss": -11.795133590698242, "global_step": 212585, "epoch": 1265} {"train_loss": -11.482065200805664, "global_step": 212586, "epoch": 1265} {"train_loss": -11.717247009277344, "global_step": 212587, "epoch": 1265} {"train_loss": -11.65865707397461, "global_step": 212588, "epoch": 1265} {"train_loss": -11.830158233642578, "global_step": 212589, "epoch": 1265} {"train_loss": -11.642791748046875, "global_step": 212590, "epoch": 1265} {"train_loss": -11.398406982421875, "global_step": 212591, "epoch": 1265} {"train_loss": -11.8287353515625, "global_step": 212592, "epoch": 1265} {"train_loss": -11.64552116394043, "global_step": 212593, "epoch": 1265} {"train_loss": -11.897403717041016, "global_step": 212594, "epoch": 1265} {"train_loss": -11.792171478271484, "global_step": 212595, "epoch": 1265} {"train_loss": -11.826913833618164, "global_step": 212596, "epoch": 1265} {"train_loss": -11.808170318603516, "global_step": 212597, "epoch": 1265} {"train_loss": -11.729473114013672, "global_step": 212598, "epoch": 1265} {"train_loss": -11.811662673950195, "global_step": 212599, "epoch": 1265} {"train_loss": -11.691827774047852, "global_step": 212600, "epoch": 1265} {"train_loss": -11.533544540405273, "global_step": 212601, "epoch": 1265} {"train_loss": -11.763655662536621, "global_step": 212602, "epoch": 1265} {"train_loss": -11.810226440429688, "global_step": 212603, "epoch": 1265} {"train_loss": -11.338274002075195, "global_step": 212604, "epoch": 1265} {"train_loss": -11.6263427734375, "global_step": 212605, "epoch": 1265} {"train_loss": -11.828641891479492, "global_step": 212606, "epoch": 1265} {"train_loss": -11.868919372558594, "global_step": 212607, "epoch": 1265} {"train_loss": -11.855703353881836, "global_step": 212608, "epoch": 1265} {"train_loss": -11.992738723754883, "global_step": 212609, "epoch": 1265} {"train_loss": -12.005770683288574, "global_step": 212610, "epoch": 1265} {"train_loss": -11.767651557922363, "global_step": 212611, "epoch": 1265} {"train_loss": -11.461108207702637, "global_step": 212612, "epoch": 1265} {"train_loss": -12.069733619689941, "global_step": 212613, "epoch": 1265} {"train_loss": -11.759732246398926, "global_step": 212614, "epoch": 1265} {"train_loss": -11.510549545288086, "global_step": 212615, "epoch": 1265} {"train_loss": -11.607210159301758, "global_step": 212616, "epoch": 1265} {"train_loss": -11.910367012023926, "global_step": 212617, "epoch": 1265} {"train_loss": -11.692750930786133, "global_step": 212618, "epoch": 1265} {"train_loss": -11.385936737060547, "global_step": 212619, "epoch": 1265} {"train_loss": -11.527850151062012, "global_step": 212620, "epoch": 1265} {"train_loss": -11.872068405151367, "global_step": 212621, "epoch": 1265} {"train_loss": -11.503791809082031, "global_step": 212622, "epoch": 1265} {"train_loss": -11.167869567871094, "global_step": 212623, "epoch": 1265} {"train_loss": -11.75113296508789, "global_step": 212624, "epoch": 1265} {"train_loss": -11.738912582397461, "global_step": 212625, "epoch": 1265} {"train_loss": -10.96255111694336, "global_step": 212626, "epoch": 1265} {"train_loss": -11.570611000061035, "global_step": 212627, "epoch": 1265} {"train_loss": -11.524897575378418, "global_step": 212628, "epoch": 1265} {"train_loss": -11.262380599975586, "global_step": 212629, "epoch": 1265} {"train_loss": -11.048208236694336, "global_step": 212630, "epoch": 1265} {"train_loss": -10.744586944580078, "global_step": 212631, "epoch": 1265} {"train_loss": -11.486120223999023, "global_step": 212632, "epoch": 1265} {"train_loss": -10.869796752929688, "global_step": 212633, "epoch": 1265} {"train_loss": -10.70449447631836, "global_step": 212634, "epoch": 1265} {"train_loss": -10.938285827636719, "global_step": 212635, "epoch": 1265} {"train_loss": -11.1053466796875, "global_step": 212636, "epoch": 1265} {"train_loss": -8.864910125732422, "global_step": 212637, "epoch": 1265} {"train_loss": -10.969602584838867, "global_step": 212638, "epoch": 1265} {"train_loss": -11.353084564208984, "global_step": 212639, "epoch": 1265} {"train_loss": -11.337346076965332, "global_step": 212640, "epoch": 1265} {"train_loss": -11.075721740722656, "global_step": 212641, "epoch": 1265} {"train_loss": -11.400209426879883, "global_step": 212642, "epoch": 1265} {"train_loss": -10.257238388061523, "global_step": 212643, "epoch": 1265} {"train_loss": -11.48243522644043, "global_step": 212644, "epoch": 1265} {"train_loss": -11.144072532653809, "global_step": 212645, "epoch": 1265} {"train_loss": -10.680744171142578, "global_step": 212646, "epoch": 1265} {"train_loss": -10.934457778930664, "global_step": 212647, "epoch": 1265} {"train_loss": -10.701926231384277, "global_step": 212648, "epoch": 1265} {"train_loss": -10.556407928466797, "global_step": 212649, "epoch": 1265} {"train_loss": -11.040175437927246, "global_step": 212650, "epoch": 1265} {"train_loss": -11.447896957397461, "global_step": 212651, "epoch": 1265} {"train_loss": -11.046258926391602, "global_step": 212652, "epoch": 1265} {"train_loss": -11.295492172241211, "global_step": 212653, "epoch": 1265} {"train_loss": -11.327771186828613, "global_step": 212654, "epoch": 1265} {"train_loss": -10.954041481018066, "global_step": 212655, "epoch": 1265} {"train_loss": -11.478006362915039, "global_step": 212656, "epoch": 1265} {"train_loss": -11.031360626220703, "global_step": 212657, "epoch": 1265} {"train_loss": -11.528173446655273, "global_step": 212658, "epoch": 1265} {"train_loss": -11.1353759765625, "global_step": 212659, "epoch": 1265} {"train_loss": -11.25859260559082, "global_step": 212660, "epoch": 1265} {"train_loss": -11.558876991271973, "global_step": 212661, "epoch": 1265} {"train_loss": -11.56026554107666, "global_step": 212662, "epoch": 1265} {"train_loss": -11.334263801574707, "global_step": 212663, "epoch": 1265} {"train_loss": -11.308441162109375, "global_step": 212664, "epoch": 1265} {"train_loss": -11.73454761505127, "global_step": 212665, "epoch": 1265} {"train_loss": -11.422216415405273, "global_step": 212666, "epoch": 1265} {"train_loss": -11.373624801635742, "global_step": 212667, "epoch": 1265} {"train_loss": -11.632423400878906, "global_step": 212668, "epoch": 1265} {"train_loss": -11.404111862182617, "global_step": 212669, "epoch": 1265} {"train_loss": -11.46766471862793, "global_step": 212670, "epoch": 1265} {"train_loss": -11.220863342285156, "global_step": 212671, "epoch": 1265} {"train_loss": -11.428319931030273, "global_step": 212672, "epoch": 1265} {"train_loss": -11.12799072265625, "global_step": 212673, "epoch": 1265} {"train_loss": -11.46825885772705, "global_step": 212674, "epoch": 1265} {"train_loss": -11.218832015991211, "global_step": 212675, "epoch": 1265} {"train_loss": -11.345634460449219, "global_step": 212676, "epoch": 1265} {"train_loss": -11.571396827697754, "global_step": 212677, "epoch": 1265} {"train_loss": -11.727717399597168, "global_step": 212678, "epoch": 1265} {"train_loss": -11.544061660766602, "global_step": 212679, "epoch": 1265} {"train_loss": -11.74717903137207, "global_step": 212680, "epoch": 1265} {"train_loss": -11.555831909179688, "global_step": 212681, "epoch": 1265} {"train_loss": -11.877969741821289, "global_step": 212682, "epoch": 1265} {"train_loss": -11.63750171661377, "global_step": 212683, "epoch": 1265} {"train_loss": -11.553857803344727, "global_step": 212684, "epoch": 1265} {"train_loss": -11.667621612548828, "global_step": 212685, "epoch": 1265} {"train_loss": -11.676496505737305, "global_step": 212686, "epoch": 1265} {"train_loss": -11.358584472111293, "global_step": 212687, "epoch": 1265, "val_loss": 258160.78125, "train_action_mse_error": 2.220606803894043} {"train_loss": -11.580598831176758, "global_step": 212688, "epoch": 1266} {"train_loss": -11.475000381469727, "global_step": 212689, "epoch": 1266} {"train_loss": -11.667323112487793, "global_step": 212690, "epoch": 1266} {"train_loss": -11.492644309997559, "global_step": 212691, "epoch": 1266} {"train_loss": -11.789752006530762, "global_step": 212692, "epoch": 1266} {"train_loss": -11.631389617919922, "global_step": 212693, "epoch": 1266} {"train_loss": -11.470942497253418, "global_step": 212694, "epoch": 1266} {"train_loss": -11.719941139221191, "global_step": 212695, "epoch": 1266} {"train_loss": -11.579313278198242, "global_step": 212696, "epoch": 1266} {"train_loss": -11.310956954956055, "global_step": 212697, "epoch": 1266} {"train_loss": -11.714404106140137, "global_step": 212698, "epoch": 1266} {"train_loss": -11.473941802978516, "global_step": 212699, "epoch": 1266} {"train_loss": -11.811192512512207, "global_step": 212700, "epoch": 1266} {"train_loss": -11.38564682006836, "global_step": 212701, "epoch": 1266} {"train_loss": -11.905967712402344, "global_step": 212702, "epoch": 1266} {"train_loss": -11.25853157043457, "global_step": 212703, "epoch": 1266} {"train_loss": -11.738365173339844, "global_step": 212704, "epoch": 1266} {"train_loss": -11.432004928588867, "global_step": 212705, "epoch": 1266} {"train_loss": -11.820396423339844, "global_step": 212706, "epoch": 1266} {"train_loss": -11.143348693847656, "global_step": 212707, "epoch": 1266} {"train_loss": -11.666234970092773, "global_step": 212708, "epoch": 1266} {"train_loss": -11.294204711914062, "global_step": 212709, "epoch": 1266} {"train_loss": -11.539058685302734, "global_step": 212710, "epoch": 1266} {"train_loss": -11.242365837097168, "global_step": 212711, "epoch": 1266} {"train_loss": -11.561970710754395, "global_step": 212712, "epoch": 1266} {"train_loss": -11.160499572753906, "global_step": 212713, "epoch": 1266} {"train_loss": -10.934256553649902, "global_step": 212714, "epoch": 1266} {"train_loss": -11.466261863708496, "global_step": 212715, "epoch": 1266} {"train_loss": -10.713584899902344, "global_step": 212716, "epoch": 1266} {"train_loss": -11.31527328491211, "global_step": 212717, "epoch": 1266} {"train_loss": -11.276939392089844, "global_step": 212718, "epoch": 1266} {"train_loss": -10.381514549255371, "global_step": 212719, "epoch": 1266} {"train_loss": -11.746261596679688, "global_step": 212720, "epoch": 1266} {"train_loss": -10.99290657043457, "global_step": 212721, "epoch": 1266} {"train_loss": -10.985820770263672, "global_step": 212722, "epoch": 1266} {"train_loss": -11.330708503723145, "global_step": 212723, "epoch": 1266} {"train_loss": -11.333236694335938, "global_step": 212724, "epoch": 1266} {"train_loss": -11.37828254699707, "global_step": 212725, "epoch": 1266} {"train_loss": -10.761899948120117, "global_step": 212726, "epoch": 1266} {"train_loss": -11.287378311157227, "global_step": 212727, "epoch": 1266} {"train_loss": -11.66002082824707, "global_step": 212728, "epoch": 1266} {"train_loss": -11.497359275817871, "global_step": 212729, "epoch": 1266} {"train_loss": -11.555362701416016, "global_step": 212730, "epoch": 1266} {"train_loss": -11.053401947021484, "global_step": 212731, "epoch": 1266} {"train_loss": -11.667377471923828, "global_step": 212732, "epoch": 1266} {"train_loss": -11.364950180053711, "global_step": 212733, "epoch": 1266} {"train_loss": -11.44832706451416, "global_step": 212734, "epoch": 1266} {"train_loss": -11.197707176208496, "global_step": 212735, "epoch": 1266} {"train_loss": -11.695210456848145, "global_step": 212736, "epoch": 1266} {"train_loss": -11.671978950500488, "global_step": 212737, "epoch": 1266} {"train_loss": -11.764599800109863, "global_step": 212738, "epoch": 1266} {"train_loss": -11.646202087402344, "global_step": 212739, "epoch": 1266} {"train_loss": -11.773757934570312, "global_step": 212740, "epoch": 1266} {"train_loss": -11.705924034118652, "global_step": 212741, "epoch": 1266} {"train_loss": -11.642157554626465, "global_step": 212742, "epoch": 1266} {"train_loss": -11.594858169555664, "global_step": 212743, "epoch": 1266} {"train_loss": -11.731024742126465, "global_step": 212744, "epoch": 1266} {"train_loss": -11.624359130859375, "global_step": 212745, "epoch": 1266} {"train_loss": -11.733348846435547, "global_step": 212746, "epoch": 1266} {"train_loss": -11.795381546020508, "global_step": 212747, "epoch": 1266} {"train_loss": -11.66489028930664, "global_step": 212748, "epoch": 1266} {"train_loss": -11.744080543518066, "global_step": 212749, "epoch": 1266} {"train_loss": -11.790009498596191, "global_step": 212750, "epoch": 1266} {"train_loss": -11.584444046020508, "global_step": 212751, "epoch": 1266} {"train_loss": -11.48375415802002, "global_step": 212752, "epoch": 1266} {"train_loss": -11.922005653381348, "global_step": 212753, "epoch": 1266} {"train_loss": -11.682373046875, "global_step": 212754, "epoch": 1266} {"train_loss": -11.636646270751953, "global_step": 212755, "epoch": 1266} {"train_loss": -11.33687973022461, "global_step": 212756, "epoch": 1266} {"train_loss": -11.31606388092041, "global_step": 212757, "epoch": 1266} {"train_loss": -11.370298385620117, "global_step": 212758, "epoch": 1266} {"train_loss": -11.33183479309082, "global_step": 212759, "epoch": 1266} {"train_loss": -11.370489120483398, "global_step": 212760, "epoch": 1266} {"train_loss": -11.858524322509766, "global_step": 212761, "epoch": 1266} {"train_loss": -11.060853958129883, "global_step": 212762, "epoch": 1266} {"train_loss": -11.2431058883667, "global_step": 212763, "epoch": 1266} {"train_loss": -11.706768035888672, "global_step": 212764, "epoch": 1266} {"train_loss": -11.65402603149414, "global_step": 212765, "epoch": 1266} {"train_loss": -11.827404975891113, "global_step": 212766, "epoch": 1266} {"train_loss": -11.603889465332031, "global_step": 212767, "epoch": 1266} {"train_loss": -11.449851989746094, "global_step": 212768, "epoch": 1266} {"train_loss": -11.959127426147461, "global_step": 212769, "epoch": 1266} {"train_loss": -11.498783111572266, "global_step": 212770, "epoch": 1266} {"train_loss": -11.679110527038574, "global_step": 212771, "epoch": 1266} {"train_loss": -11.804353713989258, "global_step": 212772, "epoch": 1266} {"train_loss": -11.661706924438477, "global_step": 212773, "epoch": 1266} {"train_loss": -11.718379974365234, "global_step": 212774, "epoch": 1266} {"train_loss": -11.584888458251953, "global_step": 212775, "epoch": 1266} {"train_loss": -11.27678394317627, "global_step": 212776, "epoch": 1266} {"train_loss": -10.45091724395752, "global_step": 212777, "epoch": 1266} {"train_loss": -11.433958053588867, "global_step": 212778, "epoch": 1266} {"train_loss": -10.639551162719727, "global_step": 212779, "epoch": 1266} {"train_loss": -10.654108047485352, "global_step": 212780, "epoch": 1266} {"train_loss": -11.038045883178711, "global_step": 212781, "epoch": 1266} {"train_loss": -10.673602104187012, "global_step": 212782, "epoch": 1266} {"train_loss": -10.546414375305176, "global_step": 212783, "epoch": 1266} {"train_loss": -10.772146224975586, "global_step": 212784, "epoch": 1266} {"train_loss": -11.005268096923828, "global_step": 212785, "epoch": 1266} {"train_loss": -10.231672286987305, "global_step": 212786, "epoch": 1266} {"train_loss": -10.714498519897461, "global_step": 212787, "epoch": 1266} {"train_loss": -11.34147834777832, "global_step": 212788, "epoch": 1266} {"train_loss": -10.340326309204102, "global_step": 212789, "epoch": 1266} {"train_loss": -11.360313415527344, "global_step": 212790, "epoch": 1266} {"train_loss": -10.274456024169922, "global_step": 212791, "epoch": 1266} {"train_loss": -11.113764762878418, "global_step": 212792, "epoch": 1266} {"train_loss": -10.913619041442871, "global_step": 212793, "epoch": 1266} {"train_loss": -11.393558502197266, "global_step": 212794, "epoch": 1266} {"train_loss": -11.137096405029297, "global_step": 212795, "epoch": 1266} {"train_loss": -11.077959060668945, "global_step": 212796, "epoch": 1266} {"train_loss": -11.394401550292969, "global_step": 212797, "epoch": 1266} {"train_loss": -11.249513626098633, "global_step": 212798, "epoch": 1266} {"train_loss": -11.427764892578125, "global_step": 212799, "epoch": 1266} {"train_loss": -11.038330078125, "global_step": 212800, "epoch": 1266} {"train_loss": -11.456897735595703, "global_step": 212801, "epoch": 1266} {"train_loss": -10.751904487609863, "global_step": 212802, "epoch": 1266} {"train_loss": -11.494792938232422, "global_step": 212803, "epoch": 1266} {"train_loss": -10.866960525512695, "global_step": 212804, "epoch": 1266} {"train_loss": -11.296144485473633, "global_step": 212805, "epoch": 1266} {"train_loss": -11.180740356445312, "global_step": 212806, "epoch": 1266} {"train_loss": -11.241012573242188, "global_step": 212807, "epoch": 1266} {"train_loss": -11.412515640258789, "global_step": 212808, "epoch": 1266} {"train_loss": -11.287705421447754, "global_step": 212809, "epoch": 1266} {"train_loss": -11.21750259399414, "global_step": 212810, "epoch": 1266} {"train_loss": -11.084986686706543, "global_step": 212811, "epoch": 1266} {"train_loss": -11.147294998168945, "global_step": 212812, "epoch": 1266} {"train_loss": -11.648475646972656, "global_step": 212813, "epoch": 1266} {"train_loss": -11.163177490234375, "global_step": 212814, "epoch": 1266} {"train_loss": -11.587066650390625, "global_step": 212815, "epoch": 1266} {"train_loss": -11.198286056518555, "global_step": 212816, "epoch": 1266} {"train_loss": -11.546941757202148, "global_step": 212817, "epoch": 1266} {"train_loss": -11.484466552734375, "global_step": 212818, "epoch": 1266} {"train_loss": -11.336238861083984, "global_step": 212819, "epoch": 1266} {"train_loss": -11.295333862304688, "global_step": 212820, "epoch": 1266} {"train_loss": -11.257150650024414, "global_step": 212821, "epoch": 1266} {"train_loss": -11.350019454956055, "global_step": 212822, "epoch": 1266} {"train_loss": -11.637145042419434, "global_step": 212823, "epoch": 1266} {"train_loss": -11.195638656616211, "global_step": 212824, "epoch": 1266} {"train_loss": -11.111217498779297, "global_step": 212825, "epoch": 1266} {"train_loss": -10.981711387634277, "global_step": 212826, "epoch": 1266} {"train_loss": -11.475567817687988, "global_step": 212827, "epoch": 1266} {"train_loss": -11.300788879394531, "global_step": 212828, "epoch": 1266} {"train_loss": -11.150233268737793, "global_step": 212829, "epoch": 1266} {"train_loss": -11.522671699523926, "global_step": 212830, "epoch": 1266} {"train_loss": -11.353585243225098, "global_step": 212831, "epoch": 1266} {"train_loss": -11.56125545501709, "global_step": 212832, "epoch": 1266} {"train_loss": -11.273322105407715, "global_step": 212833, "epoch": 1266} {"train_loss": -11.658153533935547, "global_step": 212834, "epoch": 1266} {"train_loss": -11.562539100646973, "global_step": 212835, "epoch": 1266} {"train_loss": -11.625326156616211, "global_step": 212836, "epoch": 1266} {"train_loss": -11.530455589294434, "global_step": 212837, "epoch": 1266} {"train_loss": -11.726666450500488, "global_step": 212838, "epoch": 1266} {"train_loss": -11.685388565063477, "global_step": 212839, "epoch": 1266} {"train_loss": -11.839038848876953, "global_step": 212840, "epoch": 1266} {"train_loss": -11.511323928833008, "global_step": 212841, "epoch": 1266} {"train_loss": -11.523771286010742, "global_step": 212842, "epoch": 1266} {"train_loss": -11.295587539672852, "global_step": 212843, "epoch": 1266} {"train_loss": -11.403358459472656, "global_step": 212844, "epoch": 1266} {"train_loss": -11.473102569580078, "global_step": 212845, "epoch": 1266} {"train_loss": -11.843328475952148, "global_step": 212846, "epoch": 1266} {"train_loss": -11.138277053833008, "global_step": 212847, "epoch": 1266} {"train_loss": -11.730539321899414, "global_step": 212848, "epoch": 1266} {"train_loss": -11.41810417175293, "global_step": 212849, "epoch": 1266} {"train_loss": -11.69978141784668, "global_step": 212850, "epoch": 1266} {"train_loss": -11.46987247467041, "global_step": 212851, "epoch": 1266} {"train_loss": -11.475954055786133, "global_step": 212852, "epoch": 1266} {"train_loss": -11.787795066833496, "global_step": 212853, "epoch": 1266} {"train_loss": -11.454179763793945, "global_step": 212854, "epoch": 1266} {"train_loss": -11.386157052857536, "global_step": 212855, "epoch": 1266, "val_loss": 257711.015625} {"train_loss": -11.720779418945312, "global_step": 212856, "epoch": 1267} {"train_loss": -11.707027435302734, "global_step": 212857, "epoch": 1267} {"train_loss": -11.701440811157227, "global_step": 212858, "epoch": 1267} {"train_loss": -11.421351432800293, "global_step": 212859, "epoch": 1267} {"train_loss": -11.701744079589844, "global_step": 212860, "epoch": 1267} {"train_loss": -11.64179801940918, "global_step": 212861, "epoch": 1267} {"train_loss": -11.828157424926758, "global_step": 212862, "epoch": 1267} {"train_loss": -11.826207160949707, "global_step": 212863, "epoch": 1267} {"train_loss": -11.68687915802002, "global_step": 212864, "epoch": 1267} {"train_loss": -11.819937705993652, "global_step": 212865, "epoch": 1267} {"train_loss": -11.457905769348145, "global_step": 212866, "epoch": 1267} {"train_loss": -11.425432205200195, "global_step": 212867, "epoch": 1267} {"train_loss": -12.041311264038086, "global_step": 212868, "epoch": 1267} {"train_loss": -11.60110855102539, "global_step": 212869, "epoch": 1267} {"train_loss": -11.595885276794434, "global_step": 212870, "epoch": 1267} {"train_loss": -11.621135711669922, "global_step": 212871, "epoch": 1267} {"train_loss": -12.043566703796387, "global_step": 212872, "epoch": 1267} {"train_loss": -11.88805866241455, "global_step": 212873, "epoch": 1267} {"train_loss": -11.636690139770508, "global_step": 212874, "epoch": 1267} {"train_loss": -11.834394454956055, "global_step": 212875, "epoch": 1267} {"train_loss": -11.822917938232422, "global_step": 212876, "epoch": 1267} {"train_loss": -11.810787200927734, "global_step": 212877, "epoch": 1267} {"train_loss": -11.837451934814453, "global_step": 212878, "epoch": 1267} {"train_loss": -12.037552833557129, "global_step": 212879, "epoch": 1267} {"train_loss": -11.987449645996094, "global_step": 212880, "epoch": 1267} {"train_loss": -11.99896240234375, "global_step": 212881, "epoch": 1267} {"train_loss": -11.914722442626953, "global_step": 212882, "epoch": 1267} {"train_loss": -11.86549186706543, "global_step": 212883, "epoch": 1267} {"train_loss": -12.020620346069336, "global_step": 212884, "epoch": 1267} {"train_loss": -11.87617015838623, "global_step": 212885, "epoch": 1267} {"train_loss": -11.86400032043457, "global_step": 212886, "epoch": 1267} {"train_loss": -11.94811725616455, "global_step": 212887, "epoch": 1267} {"train_loss": -12.038726806640625, "global_step": 212888, "epoch": 1267} {"train_loss": -11.875162124633789, "global_step": 212889, "epoch": 1267} {"train_loss": -11.864686012268066, "global_step": 212890, "epoch": 1267} {"train_loss": -11.84899616241455, "global_step": 212891, "epoch": 1267} {"train_loss": -11.657445907592773, "global_step": 212892, "epoch": 1267} {"train_loss": -11.785418510437012, "global_step": 212893, "epoch": 1267} {"train_loss": -11.892106056213379, "global_step": 212894, "epoch": 1267} {"train_loss": -11.714433670043945, "global_step": 212895, "epoch": 1267} {"train_loss": -11.684478759765625, "global_step": 212896, "epoch": 1267} {"train_loss": -11.994680404663086, "global_step": 212897, "epoch": 1267} {"train_loss": -11.917449951171875, "global_step": 212898, "epoch": 1267} {"train_loss": -11.702638626098633, "global_step": 212899, "epoch": 1267} {"train_loss": -11.008306503295898, "global_step": 212900, "epoch": 1267} {"train_loss": -10.997671127319336, "global_step": 212901, "epoch": 1267} {"train_loss": -11.234025001525879, "global_step": 212902, "epoch": 1267} {"train_loss": -10.579263687133789, "global_step": 212903, "epoch": 1267} {"train_loss": -11.438591003417969, "global_step": 212904, "epoch": 1267} {"train_loss": -9.166744232177734, "global_step": 212905, "epoch": 1267} {"train_loss": -9.675296783447266, "global_step": 212906, "epoch": 1267} {"train_loss": -10.568678855895996, "global_step": 212907, "epoch": 1267} {"train_loss": -7.0359296798706055, "global_step": 212908, "epoch": 1267} {"train_loss": -8.307241439819336, "global_step": 212909, "epoch": 1267} {"train_loss": -8.473697662353516, "global_step": 212910, "epoch": 1267} {"train_loss": -9.925827026367188, "global_step": 212911, "epoch": 1267} {"train_loss": -9.553295135498047, "global_step": 212912, "epoch": 1267} {"train_loss": -8.763704299926758, "global_step": 212913, "epoch": 1267} {"train_loss": -10.633176803588867, "global_step": 212914, "epoch": 1267} {"train_loss": -8.382865905761719, "global_step": 212915, "epoch": 1267} {"train_loss": -9.371163368225098, "global_step": 212916, "epoch": 1267} {"train_loss": -8.456879615783691, "global_step": 212917, "epoch": 1267} {"train_loss": -7.893566131591797, "global_step": 212918, "epoch": 1267} {"train_loss": -8.886967658996582, "global_step": 212919, "epoch": 1267} {"train_loss": -10.353893280029297, "global_step": 212920, "epoch": 1267} {"train_loss": -9.889753341674805, "global_step": 212921, "epoch": 1267} {"train_loss": -9.381416320800781, "global_step": 212922, "epoch": 1267} {"train_loss": -9.307060241699219, "global_step": 212923, "epoch": 1267} {"train_loss": -10.228713989257812, "global_step": 212924, "epoch": 1267} {"train_loss": -10.03897762298584, "global_step": 212925, "epoch": 1267} {"train_loss": -9.572479248046875, "global_step": 212926, "epoch": 1267} {"train_loss": -9.561094284057617, "global_step": 212927, "epoch": 1267} {"train_loss": -10.3746337890625, "global_step": 212928, "epoch": 1267} {"train_loss": -9.47493839263916, "global_step": 212929, "epoch": 1267} {"train_loss": -10.51598834991455, "global_step": 212930, "epoch": 1267} {"train_loss": -10.760414123535156, "global_step": 212931, "epoch": 1267} {"train_loss": -10.629085540771484, "global_step": 212932, "epoch": 1267} {"train_loss": -10.352947235107422, "global_step": 212933, "epoch": 1267} {"train_loss": -10.998448371887207, "global_step": 212934, "epoch": 1267} {"train_loss": -10.736963272094727, "global_step": 212935, "epoch": 1267} {"train_loss": -11.035650253295898, "global_step": 212936, "epoch": 1267} {"train_loss": -10.524872779846191, "global_step": 212937, "epoch": 1267} {"train_loss": -10.957082748413086, "global_step": 212938, "epoch": 1267} {"train_loss": -10.65170669555664, "global_step": 212939, "epoch": 1267} {"train_loss": -10.88128662109375, "global_step": 212940, "epoch": 1267} {"train_loss": -11.058549880981445, "global_step": 212941, "epoch": 1267} {"train_loss": -11.063386917114258, "global_step": 212942, "epoch": 1267} {"train_loss": -11.075567245483398, "global_step": 212943, "epoch": 1267} {"train_loss": -11.130365371704102, "global_step": 212944, "epoch": 1267} {"train_loss": -11.283672332763672, "global_step": 212945, "epoch": 1267} {"train_loss": -11.23371696472168, "global_step": 212946, "epoch": 1267} {"train_loss": -11.19394302368164, "global_step": 212947, "epoch": 1267} {"train_loss": -11.222114562988281, "global_step": 212948, "epoch": 1267} {"train_loss": -11.198785781860352, "global_step": 212949, "epoch": 1267} {"train_loss": -11.338790893554688, "global_step": 212950, "epoch": 1267} {"train_loss": -11.301321029663086, "global_step": 212951, "epoch": 1267} {"train_loss": -11.178586959838867, "global_step": 212952, "epoch": 1267} {"train_loss": -11.106348037719727, "global_step": 212953, "epoch": 1267} {"train_loss": -11.305253982543945, "global_step": 212954, "epoch": 1267} {"train_loss": -11.1026611328125, "global_step": 212955, "epoch": 1267} {"train_loss": -11.306251525878906, "global_step": 212956, "epoch": 1267} {"train_loss": -11.419242858886719, "global_step": 212957, "epoch": 1267} {"train_loss": -11.234336853027344, "global_step": 212958, "epoch": 1267} {"train_loss": -11.413446426391602, "global_step": 212959, "epoch": 1267} {"train_loss": -11.209359169006348, "global_step": 212960, "epoch": 1267} {"train_loss": -11.586410522460938, "global_step": 212961, "epoch": 1267} {"train_loss": -11.101839065551758, "global_step": 212962, "epoch": 1267} {"train_loss": -11.410058975219727, "global_step": 212963, "epoch": 1267} {"train_loss": -11.296279907226562, "global_step": 212964, "epoch": 1267} {"train_loss": -11.472476959228516, "global_step": 212965, "epoch": 1267} {"train_loss": -11.48440933227539, "global_step": 212966, "epoch": 1267} {"train_loss": -11.420327186584473, "global_step": 212967, "epoch": 1267} {"train_loss": -11.421300888061523, "global_step": 212968, "epoch": 1267} {"train_loss": -11.537168502807617, "global_step": 212969, "epoch": 1267} {"train_loss": -11.521450996398926, "global_step": 212970, "epoch": 1267} {"train_loss": -11.47857666015625, "global_step": 212971, "epoch": 1267} {"train_loss": -11.318117141723633, "global_step": 212972, "epoch": 1267} {"train_loss": -11.537269592285156, "global_step": 212973, "epoch": 1267} {"train_loss": -11.481791496276855, "global_step": 212974, "epoch": 1267} {"train_loss": -11.317033767700195, "global_step": 212975, "epoch": 1267} {"train_loss": -11.653935432434082, "global_step": 212976, "epoch": 1267} {"train_loss": -11.238314628601074, "global_step": 212977, "epoch": 1267} {"train_loss": -11.3887939453125, "global_step": 212978, "epoch": 1267} {"train_loss": -11.717706680297852, "global_step": 212979, "epoch": 1267} {"train_loss": -11.592336654663086, "global_step": 212980, "epoch": 1267} {"train_loss": -11.649312973022461, "global_step": 212981, "epoch": 1267} {"train_loss": -11.614810943603516, "global_step": 212982, "epoch": 1267} {"train_loss": -11.549520492553711, "global_step": 212983, "epoch": 1267} {"train_loss": -11.62509536743164, "global_step": 212984, "epoch": 1267} {"train_loss": -11.655654907226562, "global_step": 212985, "epoch": 1267} {"train_loss": -11.772597312927246, "global_step": 212986, "epoch": 1267} {"train_loss": -11.566577911376953, "global_step": 212987, "epoch": 1267} {"train_loss": -11.827794075012207, "global_step": 212988, "epoch": 1267} {"train_loss": -11.638222694396973, "global_step": 212989, "epoch": 1267} {"train_loss": -11.691753387451172, "global_step": 212990, "epoch": 1267} {"train_loss": -11.855880737304688, "global_step": 212991, "epoch": 1267} {"train_loss": -11.669374465942383, "global_step": 212992, "epoch": 1267} {"train_loss": -11.865047454833984, "global_step": 212993, "epoch": 1267} {"train_loss": -11.65384292602539, "global_step": 212994, "epoch": 1267} {"train_loss": -11.695754051208496, "global_step": 212995, "epoch": 1267} {"train_loss": -11.667211532592773, "global_step": 212996, "epoch": 1267} {"train_loss": -11.850763320922852, "global_step": 212997, "epoch": 1267} {"train_loss": -11.642082214355469, "global_step": 212998, "epoch": 1267} {"train_loss": -11.699755668640137, "global_step": 212999, "epoch": 1267} {"train_loss": -11.679302215576172, "global_step": 213000, "epoch": 1267} {"train_loss": -11.645833969116211, "global_step": 213001, "epoch": 1267} {"train_loss": -11.73747444152832, "global_step": 213002, "epoch": 1267} {"train_loss": -11.867938995361328, "global_step": 213003, "epoch": 1267} {"train_loss": -11.752325057983398, "global_step": 213004, "epoch": 1267} {"train_loss": -11.769475936889648, "global_step": 213005, "epoch": 1267} {"train_loss": -11.834816932678223, "global_step": 213006, "epoch": 1267} {"train_loss": -11.681986808776855, "global_step": 213007, "epoch": 1267} {"train_loss": -11.699102401733398, "global_step": 213008, "epoch": 1267} {"train_loss": -11.409421920776367, "global_step": 213009, "epoch": 1267} {"train_loss": -11.44316291809082, "global_step": 213010, "epoch": 1267} {"train_loss": -11.508962631225586, "global_step": 213011, "epoch": 1267} {"train_loss": -11.7923583984375, "global_step": 213012, "epoch": 1267} {"train_loss": -11.625036239624023, "global_step": 213013, "epoch": 1267} {"train_loss": -11.626531600952148, "global_step": 213014, "epoch": 1267} {"train_loss": -11.707225799560547, "global_step": 213015, "epoch": 1267} {"train_loss": -11.31679916381836, "global_step": 213016, "epoch": 1267} {"train_loss": -11.526006698608398, "global_step": 213017, "epoch": 1267} {"train_loss": -11.75637435913086, "global_step": 213018, "epoch": 1267} {"train_loss": -11.795554161071777, "global_step": 213019, "epoch": 1267} {"train_loss": -11.639165878295898, "global_step": 213020, "epoch": 1267} {"train_loss": -11.919008255004883, "global_step": 213021, "epoch": 1267} {"train_loss": -11.608224868774414, "global_step": 213022, "epoch": 1267} {"train_loss": -11.197684651329403, "global_step": 213023, "epoch": 1267, "val_loss": 257242.640625} {"train_loss": -11.983560562133789, "global_step": 213024, "epoch": 1268} {"train_loss": -11.686342239379883, "global_step": 213025, "epoch": 1268} {"train_loss": -11.82166576385498, "global_step": 213026, "epoch": 1268} {"train_loss": -11.551677703857422, "global_step": 213027, "epoch": 1268} {"train_loss": -11.643186569213867, "global_step": 213028, "epoch": 1268} {"train_loss": -11.65194320678711, "global_step": 213029, "epoch": 1268} {"train_loss": -11.640726089477539, "global_step": 213030, "epoch": 1268} {"train_loss": -11.831527709960938, "global_step": 213031, "epoch": 1268} {"train_loss": -11.329143524169922, "global_step": 213032, "epoch": 1268} {"train_loss": -11.482246398925781, "global_step": 213033, "epoch": 1268} {"train_loss": -11.619646072387695, "global_step": 213034, "epoch": 1268} {"train_loss": -11.873738288879395, "global_step": 213035, "epoch": 1268} {"train_loss": -11.673900604248047, "global_step": 213036, "epoch": 1268} {"train_loss": -11.250287055969238, "global_step": 213037, "epoch": 1268} {"train_loss": -11.235651016235352, "global_step": 213038, "epoch": 1268} {"train_loss": -11.535417556762695, "global_step": 213039, "epoch": 1268} {"train_loss": -11.281566619873047, "global_step": 213040, "epoch": 1268} {"train_loss": -11.711512565612793, "global_step": 213041, "epoch": 1268} {"train_loss": -11.344234466552734, "global_step": 213042, "epoch": 1268} {"train_loss": -11.360000610351562, "global_step": 213043, "epoch": 1268} {"train_loss": -11.547996520996094, "global_step": 213044, "epoch": 1268} {"train_loss": -10.608811378479004, "global_step": 213045, "epoch": 1268} {"train_loss": -10.207670211791992, "global_step": 213046, "epoch": 1268} {"train_loss": -10.303070068359375, "global_step": 213047, "epoch": 1268} {"train_loss": -9.335203170776367, "global_step": 213048, "epoch": 1268} {"train_loss": -10.605999946594238, "global_step": 213049, "epoch": 1268} {"train_loss": -10.56376838684082, "global_step": 213050, "epoch": 1268} {"train_loss": -10.23519515991211, "global_step": 213051, "epoch": 1268} {"train_loss": -11.301949501037598, "global_step": 213052, "epoch": 1268} {"train_loss": -10.163064002990723, "global_step": 213053, "epoch": 1268} {"train_loss": -11.200668334960938, "global_step": 213054, "epoch": 1268} {"train_loss": -11.027955055236816, "global_step": 213055, "epoch": 1268} {"train_loss": -11.244160652160645, "global_step": 213056, "epoch": 1268} {"train_loss": -10.758577346801758, "global_step": 213057, "epoch": 1268} {"train_loss": -10.814508438110352, "global_step": 213058, "epoch": 1268} {"train_loss": -10.690528869628906, "global_step": 213059, "epoch": 1268} {"train_loss": -10.71041488647461, "global_step": 213060, "epoch": 1268} {"train_loss": -11.31393051147461, "global_step": 213061, "epoch": 1268} {"train_loss": -11.298437118530273, "global_step": 213062, "epoch": 1268} {"train_loss": -11.39285659790039, "global_step": 213063, "epoch": 1268} {"train_loss": -11.373125076293945, "global_step": 213064, "epoch": 1268} {"train_loss": -11.611255645751953, "global_step": 213065, "epoch": 1268} {"train_loss": -11.349100112915039, "global_step": 213066, "epoch": 1268} {"train_loss": -11.358240127563477, "global_step": 213067, "epoch": 1268} {"train_loss": -11.672630310058594, "global_step": 213068, "epoch": 1268} {"train_loss": -11.120260238647461, "global_step": 213069, "epoch": 1268} {"train_loss": -11.659067153930664, "global_step": 213070, "epoch": 1268} {"train_loss": -11.543854713439941, "global_step": 213071, "epoch": 1268} {"train_loss": -11.67201042175293, "global_step": 213072, "epoch": 1268} {"train_loss": -11.206446647644043, "global_step": 213073, "epoch": 1268} {"train_loss": -11.435568809509277, "global_step": 213074, "epoch": 1268} {"train_loss": -11.365626335144043, "global_step": 213075, "epoch": 1268} {"train_loss": -11.603096008300781, "global_step": 213076, "epoch": 1268} {"train_loss": -11.480469703674316, "global_step": 213077, "epoch": 1268} {"train_loss": -11.464606285095215, "global_step": 213078, "epoch": 1268} {"train_loss": -11.776289939880371, "global_step": 213079, "epoch": 1268} {"train_loss": -11.606751441955566, "global_step": 213080, "epoch": 1268} {"train_loss": -11.43384838104248, "global_step": 213081, "epoch": 1268} {"train_loss": -11.408756256103516, "global_step": 213082, "epoch": 1268} {"train_loss": -11.572568893432617, "global_step": 213083, "epoch": 1268} {"train_loss": -11.21921443939209, "global_step": 213084, "epoch": 1268} {"train_loss": -11.588125228881836, "global_step": 213085, "epoch": 1268} {"train_loss": -11.710000991821289, "global_step": 213086, "epoch": 1268} {"train_loss": -11.377365112304688, "global_step": 213087, "epoch": 1268} {"train_loss": -11.667648315429688, "global_step": 213088, "epoch": 1268} {"train_loss": -11.50600814819336, "global_step": 213089, "epoch": 1268} {"train_loss": -11.959287643432617, "global_step": 213090, "epoch": 1268} {"train_loss": -11.487602233886719, "global_step": 213091, "epoch": 1268} {"train_loss": -11.60595703125, "global_step": 213092, "epoch": 1268} {"train_loss": -11.515409469604492, "global_step": 213093, "epoch": 1268} {"train_loss": -11.611396789550781, "global_step": 213094, "epoch": 1268} {"train_loss": -11.421159744262695, "global_step": 213095, "epoch": 1268} {"train_loss": -11.613330841064453, "global_step": 213096, "epoch": 1268} {"train_loss": -11.727080345153809, "global_step": 213097, "epoch": 1268} {"train_loss": -11.684799194335938, "global_step": 213098, "epoch": 1268} {"train_loss": -11.321556091308594, "global_step": 213099, "epoch": 1268} {"train_loss": -11.548723220825195, "global_step": 213100, "epoch": 1268} {"train_loss": -11.458292007446289, "global_step": 213101, "epoch": 1268} {"train_loss": -11.815731048583984, "global_step": 213102, "epoch": 1268} {"train_loss": -11.176924705505371, "global_step": 213103, "epoch": 1268} {"train_loss": -11.407889366149902, "global_step": 213104, "epoch": 1268} {"train_loss": -11.503714561462402, "global_step": 213105, "epoch": 1268} {"train_loss": -11.888330459594727, "global_step": 213106, "epoch": 1268} {"train_loss": -11.555685043334961, "global_step": 213107, "epoch": 1268} {"train_loss": -11.451053619384766, "global_step": 213108, "epoch": 1268} {"train_loss": -11.606040954589844, "global_step": 213109, "epoch": 1268} {"train_loss": -11.735387802124023, "global_step": 213110, "epoch": 1268} {"train_loss": -11.769107818603516, "global_step": 213111, "epoch": 1268} {"train_loss": -11.27630615234375, "global_step": 213112, "epoch": 1268} {"train_loss": -11.59737777709961, "global_step": 213113, "epoch": 1268} {"train_loss": -11.432209014892578, "global_step": 213114, "epoch": 1268} {"train_loss": -11.751298904418945, "global_step": 213115, "epoch": 1268} {"train_loss": -11.40900993347168, "global_step": 213116, "epoch": 1268} {"train_loss": -11.491211891174316, "global_step": 213117, "epoch": 1268} {"train_loss": -11.66151237487793, "global_step": 213118, "epoch": 1268} {"train_loss": -11.644818305969238, "global_step": 213119, "epoch": 1268} {"train_loss": -11.346945762634277, "global_step": 213120, "epoch": 1268} {"train_loss": -11.255314826965332, "global_step": 213121, "epoch": 1268} {"train_loss": -11.410856246948242, "global_step": 213122, "epoch": 1268} {"train_loss": -10.925716400146484, "global_step": 213123, "epoch": 1268} {"train_loss": -10.384908676147461, "global_step": 213124, "epoch": 1268} {"train_loss": -10.556052207946777, "global_step": 213125, "epoch": 1268} {"train_loss": -10.880717277526855, "global_step": 213126, "epoch": 1268} {"train_loss": -10.886602401733398, "global_step": 213127, "epoch": 1268} {"train_loss": -10.750940322875977, "global_step": 213128, "epoch": 1268} {"train_loss": -11.069660186767578, "global_step": 213129, "epoch": 1268} {"train_loss": -10.346539497375488, "global_step": 213130, "epoch": 1268} {"train_loss": -11.779109001159668, "global_step": 213131, "epoch": 1268} {"train_loss": -10.515918731689453, "global_step": 213132, "epoch": 1268} {"train_loss": -11.35925006866455, "global_step": 213133, "epoch": 1268} {"train_loss": -10.927732467651367, "global_step": 213134, "epoch": 1268} {"train_loss": -10.741302490234375, "global_step": 213135, "epoch": 1268} {"train_loss": -11.30345344543457, "global_step": 213136, "epoch": 1268} {"train_loss": -10.891460418701172, "global_step": 213137, "epoch": 1268} {"train_loss": -11.089118957519531, "global_step": 213138, "epoch": 1268} {"train_loss": -11.122170448303223, "global_step": 213139, "epoch": 1268} {"train_loss": -10.732996940612793, "global_step": 213140, "epoch": 1268} {"train_loss": -11.135072708129883, "global_step": 213141, "epoch": 1268} {"train_loss": -11.065406799316406, "global_step": 213142, "epoch": 1268} {"train_loss": -11.326459884643555, "global_step": 213143, "epoch": 1268} {"train_loss": -10.91629695892334, "global_step": 213144, "epoch": 1268} {"train_loss": -11.33172607421875, "global_step": 213145, "epoch": 1268} {"train_loss": -11.063796997070312, "global_step": 213146, "epoch": 1268} {"train_loss": -11.363561630249023, "global_step": 213147, "epoch": 1268} {"train_loss": -10.840024948120117, "global_step": 213148, "epoch": 1268} {"train_loss": -11.061389923095703, "global_step": 213149, "epoch": 1268} {"train_loss": -10.378390312194824, "global_step": 213150, "epoch": 1268} {"train_loss": -11.206453323364258, "global_step": 213151, "epoch": 1268} {"train_loss": -10.757135391235352, "global_step": 213152, "epoch": 1268} {"train_loss": -10.575458526611328, "global_step": 213153, "epoch": 1268} {"train_loss": -11.542997360229492, "global_step": 213154, "epoch": 1268} {"train_loss": -10.660634994506836, "global_step": 213155, "epoch": 1268} {"train_loss": -11.5084228515625, "global_step": 213156, "epoch": 1268} {"train_loss": -10.601842880249023, "global_step": 213157, "epoch": 1268} {"train_loss": -11.253931045532227, "global_step": 213158, "epoch": 1268} {"train_loss": -11.119749069213867, "global_step": 213159, "epoch": 1268} {"train_loss": -11.183736801147461, "global_step": 213160, "epoch": 1268} {"train_loss": -11.13728141784668, "global_step": 213161, "epoch": 1268} {"train_loss": -11.38647174835205, "global_step": 213162, "epoch": 1268} {"train_loss": -10.823625564575195, "global_step": 213163, "epoch": 1268} {"train_loss": -11.582758903503418, "global_step": 213164, "epoch": 1268} {"train_loss": -11.545600891113281, "global_step": 213165, "epoch": 1268} {"train_loss": -11.427423477172852, "global_step": 213166, "epoch": 1268} {"train_loss": -11.526191711425781, "global_step": 213167, "epoch": 1268} {"train_loss": -11.569843292236328, "global_step": 213168, "epoch": 1268} {"train_loss": -11.73838996887207, "global_step": 213169, "epoch": 1268} {"train_loss": -11.181568145751953, "global_step": 213170, "epoch": 1268} {"train_loss": -11.424829483032227, "global_step": 213171, "epoch": 1268} {"train_loss": -11.227564811706543, "global_step": 213172, "epoch": 1268} {"train_loss": -11.29991340637207, "global_step": 213173, "epoch": 1268} {"train_loss": -11.657978057861328, "global_step": 213174, "epoch": 1268} {"train_loss": -11.178285598754883, "global_step": 213175, "epoch": 1268} {"train_loss": -11.697625160217285, "global_step": 213176, "epoch": 1268} {"train_loss": -11.289471626281738, "global_step": 213177, "epoch": 1268} {"train_loss": -11.423575401306152, "global_step": 213178, "epoch": 1268} {"train_loss": -11.531155586242676, "global_step": 213179, "epoch": 1268} {"train_loss": -11.502227783203125, "global_step": 213180, "epoch": 1268} {"train_loss": -11.620872497558594, "global_step": 213181, "epoch": 1268} {"train_loss": -11.409156799316406, "global_step": 213182, "epoch": 1268} {"train_loss": -11.602068901062012, "global_step": 213183, "epoch": 1268} {"train_loss": -11.707231521606445, "global_step": 213184, "epoch": 1268} {"train_loss": -11.672321319580078, "global_step": 213185, "epoch": 1268} {"train_loss": -11.416993141174316, "global_step": 213186, "epoch": 1268} {"train_loss": -11.606084823608398, "global_step": 213187, "epoch": 1268} {"train_loss": -11.587353706359863, "global_step": 213188, "epoch": 1268} {"train_loss": -11.64445686340332, "global_step": 213189, "epoch": 1268} {"train_loss": -11.639423370361328, "global_step": 213190, "epoch": 1268} {"train_loss": -11.304780273210435, "global_step": 213191, "epoch": 1268, "val_loss": 257102.140625} {"train_loss": -11.753416061401367, "global_step": 213192, "epoch": 1269} {"train_loss": -11.475375175476074, "global_step": 213193, "epoch": 1269} {"train_loss": -11.749688148498535, "global_step": 213194, "epoch": 1269} {"train_loss": -11.729808807373047, "global_step": 213195, "epoch": 1269} {"train_loss": -11.365617752075195, "global_step": 213196, "epoch": 1269} {"train_loss": -11.554706573486328, "global_step": 213197, "epoch": 1269} {"train_loss": -11.80175495147705, "global_step": 213198, "epoch": 1269} {"train_loss": -11.468011856079102, "global_step": 213199, "epoch": 1269} {"train_loss": -11.649906158447266, "global_step": 213200, "epoch": 1269} {"train_loss": -10.986543655395508, "global_step": 213201, "epoch": 1269} {"train_loss": -10.759841918945312, "global_step": 213202, "epoch": 1269} {"train_loss": -11.365318298339844, "global_step": 213203, "epoch": 1269} {"train_loss": -11.29149055480957, "global_step": 213204, "epoch": 1269} {"train_loss": -10.248567581176758, "global_step": 213205, "epoch": 1269} {"train_loss": -11.30663776397705, "global_step": 213206, "epoch": 1269} {"train_loss": -10.565654754638672, "global_step": 213207, "epoch": 1269} {"train_loss": -10.090811729431152, "global_step": 213208, "epoch": 1269} {"train_loss": -10.214345932006836, "global_step": 213209, "epoch": 1269} {"train_loss": -9.81776237487793, "global_step": 213210, "epoch": 1269} {"train_loss": -10.58031177520752, "global_step": 213211, "epoch": 1269} {"train_loss": -9.535029411315918, "global_step": 213212, "epoch": 1269} {"train_loss": -11.33320140838623, "global_step": 213213, "epoch": 1269} {"train_loss": -9.663286209106445, "global_step": 213214, "epoch": 1269} {"train_loss": -10.961334228515625, "global_step": 213215, "epoch": 1269} {"train_loss": -10.848711013793945, "global_step": 213216, "epoch": 1269} {"train_loss": -10.205362319946289, "global_step": 213217, "epoch": 1269} {"train_loss": -10.841419219970703, "global_step": 213218, "epoch": 1269} {"train_loss": -9.582178115844727, "global_step": 213219, "epoch": 1269} {"train_loss": -11.019493103027344, "global_step": 213220, "epoch": 1269} {"train_loss": -10.149735450744629, "global_step": 213221, "epoch": 1269} {"train_loss": -11.26132583618164, "global_step": 213222, "epoch": 1269} {"train_loss": -10.122156143188477, "global_step": 213223, "epoch": 1269} {"train_loss": -11.02546501159668, "global_step": 213224, "epoch": 1269} {"train_loss": -10.030941009521484, "global_step": 213225, "epoch": 1269} {"train_loss": -11.236520767211914, "global_step": 213226, "epoch": 1269} {"train_loss": -10.54306697845459, "global_step": 213227, "epoch": 1269} {"train_loss": -11.104009628295898, "global_step": 213228, "epoch": 1269} {"train_loss": -10.792581558227539, "global_step": 213229, "epoch": 1269} {"train_loss": -11.09787368774414, "global_step": 213230, "epoch": 1269} {"train_loss": -10.758155822753906, "global_step": 213231, "epoch": 1269} {"train_loss": -11.044954299926758, "global_step": 213232, "epoch": 1269} {"train_loss": -11.517768859863281, "global_step": 213233, "epoch": 1269} {"train_loss": -10.958077430725098, "global_step": 213234, "epoch": 1269} {"train_loss": -11.345368385314941, "global_step": 213235, "epoch": 1269} {"train_loss": -11.444692611694336, "global_step": 213236, "epoch": 1269} {"train_loss": -11.190149307250977, "global_step": 213237, "epoch": 1269} {"train_loss": -11.301276206970215, "global_step": 213238, "epoch": 1269} {"train_loss": -11.427075386047363, "global_step": 213239, "epoch": 1269} {"train_loss": -11.416586875915527, "global_step": 213240, "epoch": 1269} {"train_loss": -11.138284683227539, "global_step": 213241, "epoch": 1269} {"train_loss": -11.56204605102539, "global_step": 213242, "epoch": 1269} {"train_loss": -11.489033699035645, "global_step": 213243, "epoch": 1269} {"train_loss": -11.679180145263672, "global_step": 213244, "epoch": 1269} {"train_loss": -11.522684097290039, "global_step": 213245, "epoch": 1269} {"train_loss": -11.627452850341797, "global_step": 213246, "epoch": 1269} {"train_loss": -11.632281303405762, "global_step": 213247, "epoch": 1269} {"train_loss": -11.693082809448242, "global_step": 213248, "epoch": 1269} {"train_loss": -11.761058807373047, "global_step": 213249, "epoch": 1269} {"train_loss": -11.461885452270508, "global_step": 213250, "epoch": 1269} {"train_loss": -11.67679214477539, "global_step": 213251, "epoch": 1269} {"train_loss": -11.629354476928711, "global_step": 213252, "epoch": 1269} {"train_loss": -11.725400924682617, "global_step": 213253, "epoch": 1269} {"train_loss": -11.668984413146973, "global_step": 213254, "epoch": 1269} {"train_loss": -11.64120864868164, "global_step": 213255, "epoch": 1269} {"train_loss": -11.679723739624023, "global_step": 213256, "epoch": 1269} {"train_loss": -11.976059913635254, "global_step": 213257, "epoch": 1269} {"train_loss": -11.713373184204102, "global_step": 213258, "epoch": 1269} {"train_loss": -11.713241577148438, "global_step": 213259, "epoch": 1269} {"train_loss": -11.764989852905273, "global_step": 213260, "epoch": 1269} {"train_loss": -11.824090003967285, "global_step": 213261, "epoch": 1269} {"train_loss": -11.866121292114258, "global_step": 213262, "epoch": 1269} {"train_loss": -11.689127922058105, "global_step": 213263, "epoch": 1269} {"train_loss": -11.838556289672852, "global_step": 213264, "epoch": 1269} {"train_loss": -11.822969436645508, "global_step": 213265, "epoch": 1269} {"train_loss": -11.700211524963379, "global_step": 213266, "epoch": 1269} {"train_loss": -11.618731498718262, "global_step": 213267, "epoch": 1269} {"train_loss": -11.951605796813965, "global_step": 213268, "epoch": 1269} {"train_loss": -11.578840255737305, "global_step": 213269, "epoch": 1269} {"train_loss": -11.973687171936035, "global_step": 213270, "epoch": 1269} {"train_loss": -11.479040145874023, "global_step": 213271, "epoch": 1269} {"train_loss": -11.914754867553711, "global_step": 213272, "epoch": 1269} {"train_loss": -11.714345932006836, "global_step": 213273, "epoch": 1269} {"train_loss": -11.606616973876953, "global_step": 213274, "epoch": 1269} {"train_loss": -11.656301498413086, "global_step": 213275, "epoch": 1269} {"train_loss": -11.955828666687012, "global_step": 213276, "epoch": 1269} {"train_loss": -11.587156295776367, "global_step": 213277, "epoch": 1269} {"train_loss": -12.065685272216797, "global_step": 213278, "epoch": 1269} {"train_loss": -11.644996643066406, "global_step": 213279, "epoch": 1269} {"train_loss": -11.626933097839355, "global_step": 213280, "epoch": 1269} {"train_loss": -11.86738395690918, "global_step": 213281, "epoch": 1269} {"train_loss": -11.832523345947266, "global_step": 213282, "epoch": 1269} {"train_loss": -12.021064758300781, "global_step": 213283, "epoch": 1269} {"train_loss": -11.788455963134766, "global_step": 213284, "epoch": 1269} {"train_loss": -11.68166732788086, "global_step": 213285, "epoch": 1269} {"train_loss": -11.616684913635254, "global_step": 213286, "epoch": 1269} {"train_loss": -11.838032722473145, "global_step": 213287, "epoch": 1269} {"train_loss": -11.962834358215332, "global_step": 213288, "epoch": 1269} {"train_loss": -11.716724395751953, "global_step": 213289, "epoch": 1269} {"train_loss": -11.838953971862793, "global_step": 213290, "epoch": 1269} {"train_loss": -11.945267677307129, "global_step": 213291, "epoch": 1269} {"train_loss": -11.73541259765625, "global_step": 213292, "epoch": 1269} {"train_loss": -11.64857292175293, "global_step": 213293, "epoch": 1269} {"train_loss": -11.921538352966309, "global_step": 213294, "epoch": 1269} {"train_loss": -11.590666770935059, "global_step": 213295, "epoch": 1269} {"train_loss": -11.479341506958008, "global_step": 213296, "epoch": 1269} {"train_loss": -11.565258026123047, "global_step": 213297, "epoch": 1269} {"train_loss": -11.562780380249023, "global_step": 213298, "epoch": 1269} {"train_loss": -11.698441505432129, "global_step": 213299, "epoch": 1269} {"train_loss": -10.482885360717773, "global_step": 213300, "epoch": 1269} {"train_loss": -10.55410385131836, "global_step": 213301, "epoch": 1269} {"train_loss": -11.339221954345703, "global_step": 213302, "epoch": 1269} {"train_loss": -11.324356079101562, "global_step": 213303, "epoch": 1269} {"train_loss": -9.410442352294922, "global_step": 213304, "epoch": 1269} {"train_loss": -10.716184616088867, "global_step": 213305, "epoch": 1269} {"train_loss": -10.094527244567871, "global_step": 213306, "epoch": 1269} {"train_loss": -8.399477005004883, "global_step": 213307, "epoch": 1269} {"train_loss": -9.488142967224121, "global_step": 213308, "epoch": 1269} {"train_loss": -10.107121467590332, "global_step": 213309, "epoch": 1269} {"train_loss": -9.921712875366211, "global_step": 213310, "epoch": 1269} {"train_loss": -10.071651458740234, "global_step": 213311, "epoch": 1269} {"train_loss": -10.808609962463379, "global_step": 213312, "epoch": 1269} {"train_loss": -10.369743347167969, "global_step": 213313, "epoch": 1269} {"train_loss": -10.620692253112793, "global_step": 213314, "epoch": 1269} {"train_loss": -10.708792686462402, "global_step": 213315, "epoch": 1269} {"train_loss": -10.765764236450195, "global_step": 213316, "epoch": 1269} {"train_loss": -9.876769065856934, "global_step": 213317, "epoch": 1269} {"train_loss": -11.223820686340332, "global_step": 213318, "epoch": 1269} {"train_loss": -9.845582962036133, "global_step": 213319, "epoch": 1269} {"train_loss": -10.614678382873535, "global_step": 213320, "epoch": 1269} {"train_loss": -10.949017524719238, "global_step": 213321, "epoch": 1269} {"train_loss": -9.879011154174805, "global_step": 213322, "epoch": 1269} {"train_loss": -10.94294548034668, "global_step": 213323, "epoch": 1269} {"train_loss": -10.284697532653809, "global_step": 213324, "epoch": 1269} {"train_loss": -9.921977996826172, "global_step": 213325, "epoch": 1269} {"train_loss": -11.339695930480957, "global_step": 213326, "epoch": 1269} {"train_loss": -9.604703903198242, "global_step": 213327, "epoch": 1269} {"train_loss": -11.142496109008789, "global_step": 213328, "epoch": 1269} {"train_loss": -10.475728988647461, "global_step": 213329, "epoch": 1269} {"train_loss": -9.955524444580078, "global_step": 213330, "epoch": 1269} {"train_loss": -10.6751070022583, "global_step": 213331, "epoch": 1269} {"train_loss": -10.193675994873047, "global_step": 213332, "epoch": 1269} {"train_loss": -9.807855606079102, "global_step": 213333, "epoch": 1269} {"train_loss": -11.298616409301758, "global_step": 213334, "epoch": 1269} {"train_loss": -10.28866958618164, "global_step": 213335, "epoch": 1269} {"train_loss": -10.58822250366211, "global_step": 213336, "epoch": 1269} {"train_loss": -11.117788314819336, "global_step": 213337, "epoch": 1269} {"train_loss": -10.304281234741211, "global_step": 213338, "epoch": 1269} {"train_loss": -11.21832275390625, "global_step": 213339, "epoch": 1269} {"train_loss": -10.993865966796875, "global_step": 213340, "epoch": 1269} {"train_loss": -11.075339317321777, "global_step": 213341, "epoch": 1269} {"train_loss": -11.023143768310547, "global_step": 213342, "epoch": 1269} {"train_loss": -11.146987915039062, "global_step": 213343, "epoch": 1269} {"train_loss": -11.010797500610352, "global_step": 213344, "epoch": 1269} {"train_loss": -11.152053833007812, "global_step": 213345, "epoch": 1269} {"train_loss": -11.274078369140625, "global_step": 213346, "epoch": 1269} {"train_loss": -11.209211349487305, "global_step": 213347, "epoch": 1269} {"train_loss": -11.336359024047852, "global_step": 213348, "epoch": 1269} {"train_loss": -11.242744445800781, "global_step": 213349, "epoch": 1269} {"train_loss": -11.013823509216309, "global_step": 213350, "epoch": 1269} {"train_loss": -11.286951065063477, "global_step": 213351, "epoch": 1269} {"train_loss": -11.23073673248291, "global_step": 213352, "epoch": 1269} {"train_loss": -11.412225723266602, "global_step": 213353, "epoch": 1269} {"train_loss": -11.395071029663086, "global_step": 213354, "epoch": 1269} {"train_loss": -11.432126998901367, "global_step": 213355, "epoch": 1269} {"train_loss": -11.405397415161133, "global_step": 213356, "epoch": 1269} {"train_loss": -11.602209091186523, "global_step": 213357, "epoch": 1269} {"train_loss": -11.32109260559082, "global_step": 213358, "epoch": 1269} {"train_loss": -11.121291824749537, "global_step": 213359, "epoch": 1269, "val_loss": 257052.125} {"train_loss": -11.474709510803223, "global_step": 213360, "epoch": 1270} {"train_loss": -11.339466094970703, "global_step": 213361, "epoch": 1270} {"train_loss": -11.48206901550293, "global_step": 213362, "epoch": 1270} {"train_loss": -11.555571556091309, "global_step": 213363, "epoch": 1270} {"train_loss": -11.527084350585938, "global_step": 213364, "epoch": 1270} {"train_loss": -11.654643058776855, "global_step": 213365, "epoch": 1270} {"train_loss": -11.541666984558105, "global_step": 213366, "epoch": 1270} {"train_loss": -11.702999114990234, "global_step": 213367, "epoch": 1270} {"train_loss": -11.567296981811523, "global_step": 213368, "epoch": 1270} {"train_loss": -11.58071517944336, "global_step": 213369, "epoch": 1270} {"train_loss": -11.344517707824707, "global_step": 213370, "epoch": 1270} {"train_loss": -11.662717819213867, "global_step": 213371, "epoch": 1270} {"train_loss": -11.487640380859375, "global_step": 213372, "epoch": 1270} {"train_loss": -11.623106956481934, "global_step": 213373, "epoch": 1270} {"train_loss": -11.649191856384277, "global_step": 213374, "epoch": 1270} {"train_loss": -11.777728080749512, "global_step": 213375, "epoch": 1270} {"train_loss": -11.753887176513672, "global_step": 213376, "epoch": 1270} {"train_loss": -11.712015151977539, "global_step": 213377, "epoch": 1270} {"train_loss": -11.57451343536377, "global_step": 213378, "epoch": 1270} {"train_loss": -11.76965618133545, "global_step": 213379, "epoch": 1270} {"train_loss": -11.712624549865723, "global_step": 213380, "epoch": 1270} {"train_loss": -11.837921142578125, "global_step": 213381, "epoch": 1270} {"train_loss": -11.584503173828125, "global_step": 213382, "epoch": 1270} {"train_loss": -11.802706718444824, "global_step": 213383, "epoch": 1270} {"train_loss": -11.656720161437988, "global_step": 213384, "epoch": 1270} {"train_loss": -11.827495574951172, "global_step": 213385, "epoch": 1270} {"train_loss": -11.795732498168945, "global_step": 213386, "epoch": 1270} {"train_loss": -11.723016738891602, "global_step": 213387, "epoch": 1270} {"train_loss": -11.781871795654297, "global_step": 213388, "epoch": 1270} {"train_loss": -11.66096019744873, "global_step": 213389, "epoch": 1270} {"train_loss": -11.597602844238281, "global_step": 213390, "epoch": 1270} {"train_loss": -11.980646133422852, "global_step": 213391, "epoch": 1270} {"train_loss": -11.701321601867676, "global_step": 213392, "epoch": 1270} {"train_loss": -11.922066688537598, "global_step": 213393, "epoch": 1270} {"train_loss": -11.473356246948242, "global_step": 213394, "epoch": 1270} {"train_loss": -12.027427673339844, "global_step": 213395, "epoch": 1270} {"train_loss": -11.747987747192383, "global_step": 213396, "epoch": 1270} {"train_loss": -12.046348571777344, "global_step": 213397, "epoch": 1270} {"train_loss": -11.744732856750488, "global_step": 213398, "epoch": 1270} {"train_loss": -11.761772155761719, "global_step": 213399, "epoch": 1270} {"train_loss": -11.674402236938477, "global_step": 213400, "epoch": 1270} {"train_loss": -11.74671745300293, "global_step": 213401, "epoch": 1270} {"train_loss": -11.552764892578125, "global_step": 213402, "epoch": 1270} {"train_loss": -11.815717697143555, "global_step": 213403, "epoch": 1270} {"train_loss": -11.546578407287598, "global_step": 213404, "epoch": 1270} {"train_loss": -10.837215423583984, "global_step": 213405, "epoch": 1270} {"train_loss": -10.585592269897461, "global_step": 213406, "epoch": 1270} {"train_loss": -11.320606231689453, "global_step": 213407, "epoch": 1270} {"train_loss": -11.582536697387695, "global_step": 213408, "epoch": 1270} {"train_loss": -11.609465599060059, "global_step": 213409, "epoch": 1270} {"train_loss": -11.110391616821289, "global_step": 213410, "epoch": 1270} {"train_loss": -11.659786224365234, "global_step": 213411, "epoch": 1270} {"train_loss": -11.501656532287598, "global_step": 213412, "epoch": 1270} {"train_loss": -11.772770881652832, "global_step": 213413, "epoch": 1270} {"train_loss": -10.887134552001953, "global_step": 213414, "epoch": 1270} {"train_loss": -11.445659637451172, "global_step": 213415, "epoch": 1270} {"train_loss": -11.635697364807129, "global_step": 213416, "epoch": 1270} {"train_loss": -11.155176162719727, "global_step": 213417, "epoch": 1270} {"train_loss": -11.800384521484375, "global_step": 213418, "epoch": 1270} {"train_loss": -11.483980178833008, "global_step": 213419, "epoch": 1270} {"train_loss": -10.876253128051758, "global_step": 213420, "epoch": 1270} {"train_loss": -11.521953582763672, "global_step": 213421, "epoch": 1270} {"train_loss": -11.400585174560547, "global_step": 213422, "epoch": 1270} {"train_loss": -11.317357063293457, "global_step": 213423, "epoch": 1270} {"train_loss": -11.873346328735352, "global_step": 213424, "epoch": 1270} {"train_loss": -11.294700622558594, "global_step": 213425, "epoch": 1270} {"train_loss": -11.477062225341797, "global_step": 213426, "epoch": 1270} {"train_loss": -11.041935920715332, "global_step": 213427, "epoch": 1270} {"train_loss": -11.041267395019531, "global_step": 213428, "epoch": 1270} {"train_loss": -11.145660400390625, "global_step": 213429, "epoch": 1270} {"train_loss": -11.852458953857422, "global_step": 213430, "epoch": 1270} {"train_loss": -10.93925952911377, "global_step": 213431, "epoch": 1270} {"train_loss": -11.512134552001953, "global_step": 213432, "epoch": 1270} {"train_loss": -10.860830307006836, "global_step": 213433, "epoch": 1270} {"train_loss": -11.293601989746094, "global_step": 213434, "epoch": 1270} {"train_loss": -11.379127502441406, "global_step": 213435, "epoch": 1270} {"train_loss": -11.541107177734375, "global_step": 213436, "epoch": 1270} {"train_loss": -11.415992736816406, "global_step": 213437, "epoch": 1270} {"train_loss": -11.62557315826416, "global_step": 213438, "epoch": 1270} {"train_loss": -11.161649703979492, "global_step": 213439, "epoch": 1270} {"train_loss": -11.654975891113281, "global_step": 213440, "epoch": 1270} {"train_loss": -11.347989082336426, "global_step": 213441, "epoch": 1270} {"train_loss": -11.746788024902344, "global_step": 213442, "epoch": 1270} {"train_loss": -11.215713500976562, "global_step": 213443, "epoch": 1270} {"train_loss": -11.740388870239258, "global_step": 213444, "epoch": 1270} {"train_loss": -11.509809494018555, "global_step": 213445, "epoch": 1270} {"train_loss": -11.13011646270752, "global_step": 213446, "epoch": 1270} {"train_loss": -11.467611312866211, "global_step": 213447, "epoch": 1270} {"train_loss": -11.530387878417969, "global_step": 213448, "epoch": 1270} {"train_loss": -11.239158630371094, "global_step": 213449, "epoch": 1270} {"train_loss": -11.331984519958496, "global_step": 213450, "epoch": 1270} {"train_loss": -11.464483261108398, "global_step": 213451, "epoch": 1270} {"train_loss": -11.41671085357666, "global_step": 213452, "epoch": 1270} {"train_loss": -11.475229263305664, "global_step": 213453, "epoch": 1270} {"train_loss": -11.221205711364746, "global_step": 213454, "epoch": 1270} {"train_loss": -11.22547435760498, "global_step": 213455, "epoch": 1270} {"train_loss": -11.353727340698242, "global_step": 213456, "epoch": 1270} {"train_loss": -11.26015853881836, "global_step": 213457, "epoch": 1270} {"train_loss": -10.860759735107422, "global_step": 213458, "epoch": 1270} {"train_loss": -11.64628791809082, "global_step": 213459, "epoch": 1270} {"train_loss": -10.39151668548584, "global_step": 213460, "epoch": 1270} {"train_loss": -11.173944473266602, "global_step": 213461, "epoch": 1270} {"train_loss": -11.05238151550293, "global_step": 213462, "epoch": 1270} {"train_loss": -10.403006553649902, "global_step": 213463, "epoch": 1270} {"train_loss": -11.613603591918945, "global_step": 213464, "epoch": 1270} {"train_loss": -10.25338363647461, "global_step": 213465, "epoch": 1270} {"train_loss": -11.030439376831055, "global_step": 213466, "epoch": 1270} {"train_loss": -11.259532928466797, "global_step": 213467, "epoch": 1270} {"train_loss": -11.180967330932617, "global_step": 213468, "epoch": 1270} {"train_loss": -11.398990631103516, "global_step": 213469, "epoch": 1270} {"train_loss": -11.099888801574707, "global_step": 213470, "epoch": 1270} {"train_loss": -11.421154022216797, "global_step": 213471, "epoch": 1270} {"train_loss": -11.117345809936523, "global_step": 213472, "epoch": 1270} {"train_loss": -11.048316955566406, "global_step": 213473, "epoch": 1270} {"train_loss": -11.178736686706543, "global_step": 213474, "epoch": 1270} {"train_loss": -11.241013526916504, "global_step": 213475, "epoch": 1270} {"train_loss": -11.328963279724121, "global_step": 213476, "epoch": 1270} {"train_loss": -10.968452453613281, "global_step": 213477, "epoch": 1270} {"train_loss": -11.380083084106445, "global_step": 213478, "epoch": 1270} {"train_loss": -11.329593658447266, "global_step": 213479, "epoch": 1270} {"train_loss": -11.30676555633545, "global_step": 213480, "epoch": 1270} {"train_loss": -11.618468284606934, "global_step": 213481, "epoch": 1270} {"train_loss": -11.339092254638672, "global_step": 213482, "epoch": 1270} {"train_loss": -11.500741958618164, "global_step": 213483, "epoch": 1270} {"train_loss": -11.480082511901855, "global_step": 213484, "epoch": 1270} {"train_loss": -11.643495559692383, "global_step": 213485, "epoch": 1270} {"train_loss": -11.421112060546875, "global_step": 213486, "epoch": 1270} {"train_loss": -11.392987251281738, "global_step": 213487, "epoch": 1270} {"train_loss": -11.688741683959961, "global_step": 213488, "epoch": 1270} {"train_loss": -11.752376556396484, "global_step": 213489, "epoch": 1270} {"train_loss": -11.698017120361328, "global_step": 213490, "epoch": 1270} {"train_loss": -11.393903732299805, "global_step": 213491, "epoch": 1270} {"train_loss": -11.777631759643555, "global_step": 213492, "epoch": 1270} {"train_loss": -11.269308090209961, "global_step": 213493, "epoch": 1270} {"train_loss": -11.797496795654297, "global_step": 213494, "epoch": 1270} {"train_loss": -11.620735168457031, "global_step": 213495, "epoch": 1270} {"train_loss": -11.690666198730469, "global_step": 213496, "epoch": 1270} {"train_loss": -11.630245208740234, "global_step": 213497, "epoch": 1270} {"train_loss": -11.465340614318848, "global_step": 213498, "epoch": 1270} {"train_loss": -11.475570678710938, "global_step": 213499, "epoch": 1270} {"train_loss": -11.65210247039795, "global_step": 213500, "epoch": 1270} {"train_loss": -11.797286987304688, "global_step": 213501, "epoch": 1270} {"train_loss": -11.733354568481445, "global_step": 213502, "epoch": 1270} {"train_loss": -11.62380599975586, "global_step": 213503, "epoch": 1270} {"train_loss": -11.856186866760254, "global_step": 213504, "epoch": 1270} {"train_loss": -11.571330070495605, "global_step": 213505, "epoch": 1270} {"train_loss": -11.41293716430664, "global_step": 213506, "epoch": 1270} {"train_loss": -11.633079528808594, "global_step": 213507, "epoch": 1270} {"train_loss": -11.25421142578125, "global_step": 213508, "epoch": 1270} {"train_loss": -11.719049453735352, "global_step": 213509, "epoch": 1270} {"train_loss": -11.793190002441406, "global_step": 213510, "epoch": 1270} {"train_loss": -11.614447593688965, "global_step": 213511, "epoch": 1270} {"train_loss": -11.976348876953125, "global_step": 213512, "epoch": 1270} {"train_loss": -11.515972137451172, "global_step": 213513, "epoch": 1270} {"train_loss": -11.689262390136719, "global_step": 213514, "epoch": 1270} {"train_loss": -11.381473541259766, "global_step": 213515, "epoch": 1270} {"train_loss": -11.185432434082031, "global_step": 213516, "epoch": 1270} {"train_loss": -11.045141220092773, "global_step": 213517, "epoch": 1270} {"train_loss": -11.56743049621582, "global_step": 213518, "epoch": 1270} {"train_loss": -10.004921913146973, "global_step": 213519, "epoch": 1270} {"train_loss": -11.571246147155762, "global_step": 213520, "epoch": 1270} {"train_loss": -9.992660522460938, "global_step": 213521, "epoch": 1270} {"train_loss": -9.68528938293457, "global_step": 213522, "epoch": 1270} {"train_loss": -11.14653491973877, "global_step": 213523, "epoch": 1270} {"train_loss": -10.103931427001953, "global_step": 213524, "epoch": 1270} {"train_loss": -11.415255546569824, "global_step": 213525, "epoch": 1270} {"train_loss": -10.36825180053711, "global_step": 213526, "epoch": 1270} {"train_loss": -11.422897685141791, "global_step": 213527, "epoch": 1270, "val_loss": 256518.640625, "train_action_mse_error": 0.5448205471038818} {"train_loss": -10.227727890014648, "global_step": 213528, "epoch": 1271} {"train_loss": -11.234607696533203, "global_step": 213529, "epoch": 1271} {"train_loss": -10.91313362121582, "global_step": 213530, "epoch": 1271} {"train_loss": -11.449953079223633, "global_step": 213531, "epoch": 1271} {"train_loss": -11.25648307800293, "global_step": 213532, "epoch": 1271} {"train_loss": -11.063811302185059, "global_step": 213533, "epoch": 1271} {"train_loss": -11.108100891113281, "global_step": 213534, "epoch": 1271} {"train_loss": -11.234033584594727, "global_step": 213535, "epoch": 1271} {"train_loss": -11.217130661010742, "global_step": 213536, "epoch": 1271} {"train_loss": -11.0538969039917, "global_step": 213537, "epoch": 1271} {"train_loss": -11.43557071685791, "global_step": 213538, "epoch": 1271} {"train_loss": -10.976306915283203, "global_step": 213539, "epoch": 1271} {"train_loss": -10.934212684631348, "global_step": 213540, "epoch": 1271} {"train_loss": -11.541620254516602, "global_step": 213541, "epoch": 1271} {"train_loss": -10.772424697875977, "global_step": 213542, "epoch": 1271} {"train_loss": -11.46026611328125, "global_step": 213543, "epoch": 1271} {"train_loss": -10.69756031036377, "global_step": 213544, "epoch": 1271} {"train_loss": -10.712990760803223, "global_step": 213545, "epoch": 1271} {"train_loss": -10.096357345581055, "global_step": 213546, "epoch": 1271} {"train_loss": -10.752297401428223, "global_step": 213547, "epoch": 1271} {"train_loss": -10.392776489257812, "global_step": 213548, "epoch": 1271} {"train_loss": -10.70573902130127, "global_step": 213549, "epoch": 1271} {"train_loss": -10.746474266052246, "global_step": 213550, "epoch": 1271} {"train_loss": -10.456645965576172, "global_step": 213551, "epoch": 1271} {"train_loss": -10.964948654174805, "global_step": 213552, "epoch": 1271} {"train_loss": -10.992279052734375, "global_step": 213553, "epoch": 1271} {"train_loss": -10.475848197937012, "global_step": 213554, "epoch": 1271} {"train_loss": -11.28571891784668, "global_step": 213555, "epoch": 1271} {"train_loss": -10.68825912475586, "global_step": 213556, "epoch": 1271} {"train_loss": -11.20371150970459, "global_step": 213557, "epoch": 1271} {"train_loss": -10.662391662597656, "global_step": 213558, "epoch": 1271} {"train_loss": -11.493249893188477, "global_step": 213559, "epoch": 1271} {"train_loss": -11.175721168518066, "global_step": 213560, "epoch": 1271} {"train_loss": -11.128114700317383, "global_step": 213561, "epoch": 1271} {"train_loss": -11.019149780273438, "global_step": 213562, "epoch": 1271} {"train_loss": -10.651822090148926, "global_step": 213563, "epoch": 1271} {"train_loss": -11.606012344360352, "global_step": 213564, "epoch": 1271} {"train_loss": -10.753069877624512, "global_step": 213565, "epoch": 1271} {"train_loss": -11.271696090698242, "global_step": 213566, "epoch": 1271} {"train_loss": -11.262340545654297, "global_step": 213567, "epoch": 1271} {"train_loss": -11.083094596862793, "global_step": 213568, "epoch": 1271} {"train_loss": -11.188858032226562, "global_step": 213569, "epoch": 1271} {"train_loss": -10.908575057983398, "global_step": 213570, "epoch": 1271} {"train_loss": -11.504379272460938, "global_step": 213571, "epoch": 1271} {"train_loss": -11.102287292480469, "global_step": 213572, "epoch": 1271} {"train_loss": -11.554235458374023, "global_step": 213573, "epoch": 1271} {"train_loss": -11.374149322509766, "global_step": 213574, "epoch": 1271} {"train_loss": -11.391995429992676, "global_step": 213575, "epoch": 1271} {"train_loss": -11.24215030670166, "global_step": 213576, "epoch": 1271} {"train_loss": -11.477643966674805, "global_step": 213577, "epoch": 1271} {"train_loss": -11.55133056640625, "global_step": 213578, "epoch": 1271} {"train_loss": -11.37485122680664, "global_step": 213579, "epoch": 1271} {"train_loss": -11.59444522857666, "global_step": 213580, "epoch": 1271} {"train_loss": -11.736042022705078, "global_step": 213581, "epoch": 1271} {"train_loss": -11.384305953979492, "global_step": 213582, "epoch": 1271} {"train_loss": -11.370079040527344, "global_step": 213583, "epoch": 1271} {"train_loss": -11.338346481323242, "global_step": 213584, "epoch": 1271} {"train_loss": -11.493011474609375, "global_step": 213585, "epoch": 1271} {"train_loss": -11.220268249511719, "global_step": 213586, "epoch": 1271} {"train_loss": -11.610115051269531, "global_step": 213587, "epoch": 1271} {"train_loss": -11.39146900177002, "global_step": 213588, "epoch": 1271} {"train_loss": -11.671257019042969, "global_step": 213589, "epoch": 1271} {"train_loss": -11.359095573425293, "global_step": 213590, "epoch": 1271} {"train_loss": -11.468826293945312, "global_step": 213591, "epoch": 1271} {"train_loss": -11.632325172424316, "global_step": 213592, "epoch": 1271} {"train_loss": -11.518755912780762, "global_step": 213593, "epoch": 1271} {"train_loss": -11.46619701385498, "global_step": 213594, "epoch": 1271} {"train_loss": -11.411928176879883, "global_step": 213595, "epoch": 1271} {"train_loss": -11.464117050170898, "global_step": 213596, "epoch": 1271} {"train_loss": -11.372842788696289, "global_step": 213597, "epoch": 1271} {"train_loss": -11.421220779418945, "global_step": 213598, "epoch": 1271} {"train_loss": -11.767278671264648, "global_step": 213599, "epoch": 1271} {"train_loss": -11.456350326538086, "global_step": 213600, "epoch": 1271} {"train_loss": -11.774231910705566, "global_step": 213601, "epoch": 1271} {"train_loss": -11.373836517333984, "global_step": 213602, "epoch": 1271} {"train_loss": -11.657523155212402, "global_step": 213603, "epoch": 1271} {"train_loss": -11.52081298828125, "global_step": 213604, "epoch": 1271} {"train_loss": -11.524009704589844, "global_step": 213605, "epoch": 1271} {"train_loss": -11.67951774597168, "global_step": 213606, "epoch": 1271} {"train_loss": -11.842601776123047, "global_step": 213607, "epoch": 1271} {"train_loss": -11.758172988891602, "global_step": 213608, "epoch": 1271} {"train_loss": -11.759125709533691, "global_step": 213609, "epoch": 1271} {"train_loss": -11.888975143432617, "global_step": 213610, "epoch": 1271} {"train_loss": -11.48495864868164, "global_step": 213611, "epoch": 1271} {"train_loss": -11.692702293395996, "global_step": 213612, "epoch": 1271} {"train_loss": -11.600543975830078, "global_step": 213613, "epoch": 1271} {"train_loss": -11.745012283325195, "global_step": 213614, "epoch": 1271} {"train_loss": -11.613475799560547, "global_step": 213615, "epoch": 1271} {"train_loss": -11.759491920471191, "global_step": 213616, "epoch": 1271} {"train_loss": -11.096809387207031, "global_step": 213617, "epoch": 1271} {"train_loss": -11.218080520629883, "global_step": 213618, "epoch": 1271} {"train_loss": -11.571858406066895, "global_step": 213619, "epoch": 1271} {"train_loss": -11.50140380859375, "global_step": 213620, "epoch": 1271} {"train_loss": -11.359893798828125, "global_step": 213621, "epoch": 1271} {"train_loss": -11.456245422363281, "global_step": 213622, "epoch": 1271} {"train_loss": -11.258691787719727, "global_step": 213623, "epoch": 1271} {"train_loss": -11.580138206481934, "global_step": 213624, "epoch": 1271} {"train_loss": -11.093705177307129, "global_step": 213625, "epoch": 1271} {"train_loss": -11.408591270446777, "global_step": 213626, "epoch": 1271} {"train_loss": -11.538275718688965, "global_step": 213627, "epoch": 1271} {"train_loss": -11.296552658081055, "global_step": 213628, "epoch": 1271} {"train_loss": -11.446112632751465, "global_step": 213629, "epoch": 1271} {"train_loss": -11.269728660583496, "global_step": 213630, "epoch": 1271} {"train_loss": -10.833574295043945, "global_step": 213631, "epoch": 1271} {"train_loss": -11.521655082702637, "global_step": 213632, "epoch": 1271} {"train_loss": -11.228507995605469, "global_step": 213633, "epoch": 1271} {"train_loss": -11.241247177124023, "global_step": 213634, "epoch": 1271} {"train_loss": -11.812854766845703, "global_step": 213635, "epoch": 1271} {"train_loss": -11.48060417175293, "global_step": 213636, "epoch": 1271} {"train_loss": -11.725722312927246, "global_step": 213637, "epoch": 1271} {"train_loss": -11.711606979370117, "global_step": 213638, "epoch": 1271} {"train_loss": -11.588582992553711, "global_step": 213639, "epoch": 1271} {"train_loss": -11.953825950622559, "global_step": 213640, "epoch": 1271} {"train_loss": -11.14826488494873, "global_step": 213641, "epoch": 1271} {"train_loss": -11.072929382324219, "global_step": 213642, "epoch": 1271} {"train_loss": -11.689861297607422, "global_step": 213643, "epoch": 1271} {"train_loss": -11.42919921875, "global_step": 213644, "epoch": 1271} {"train_loss": -11.772258758544922, "global_step": 213645, "epoch": 1271} {"train_loss": -11.50323486328125, "global_step": 213646, "epoch": 1271} {"train_loss": -11.467463493347168, "global_step": 213647, "epoch": 1271} {"train_loss": -11.888580322265625, "global_step": 213648, "epoch": 1271} {"train_loss": -11.403526306152344, "global_step": 213649, "epoch": 1271} {"train_loss": -11.423809051513672, "global_step": 213650, "epoch": 1271} {"train_loss": -11.489463806152344, "global_step": 213651, "epoch": 1271} {"train_loss": -11.767251014709473, "global_step": 213652, "epoch": 1271} {"train_loss": -11.311426162719727, "global_step": 213653, "epoch": 1271} {"train_loss": -11.692292213439941, "global_step": 213654, "epoch": 1271} {"train_loss": -11.607967376708984, "global_step": 213655, "epoch": 1271} {"train_loss": -11.510004997253418, "global_step": 213656, "epoch": 1271} {"train_loss": -11.866629600524902, "global_step": 213657, "epoch": 1271} {"train_loss": -11.720291137695312, "global_step": 213658, "epoch": 1271} {"train_loss": -11.726020812988281, "global_step": 213659, "epoch": 1271} {"train_loss": -11.799980163574219, "global_step": 213660, "epoch": 1271} {"train_loss": -11.623346328735352, "global_step": 213661, "epoch": 1271} {"train_loss": -11.742496490478516, "global_step": 213662, "epoch": 1271} {"train_loss": -11.97362232208252, "global_step": 213663, "epoch": 1271} {"train_loss": -11.75216293334961, "global_step": 213664, "epoch": 1271} {"train_loss": -11.641955375671387, "global_step": 213665, "epoch": 1271} {"train_loss": -11.87515926361084, "global_step": 213666, "epoch": 1271} {"train_loss": -11.596758842468262, "global_step": 213667, "epoch": 1271} {"train_loss": -11.880149841308594, "global_step": 213668, "epoch": 1271} {"train_loss": -11.75699234008789, "global_step": 213669, "epoch": 1271} {"train_loss": -11.623095512390137, "global_step": 213670, "epoch": 1271} {"train_loss": -11.517295837402344, "global_step": 213671, "epoch": 1271} {"train_loss": -11.589844703674316, "global_step": 213672, "epoch": 1271} {"train_loss": -11.827628135681152, "global_step": 213673, "epoch": 1271} {"train_loss": -11.819929122924805, "global_step": 213674, "epoch": 1271} {"train_loss": -11.832884788513184, "global_step": 213675, "epoch": 1271} {"train_loss": -11.820289611816406, "global_step": 213676, "epoch": 1271} {"train_loss": -11.683144569396973, "global_step": 213677, "epoch": 1271} {"train_loss": -11.870231628417969, "global_step": 213678, "epoch": 1271} {"train_loss": -11.63940715789795, "global_step": 213679, "epoch": 1271} {"train_loss": -11.891477584838867, "global_step": 213680, "epoch": 1271} {"train_loss": -11.782896041870117, "global_step": 213681, "epoch": 1271} {"train_loss": -11.935019493103027, "global_step": 213682, "epoch": 1271} {"train_loss": -11.239822387695312, "global_step": 213683, "epoch": 1271} {"train_loss": -11.289093971252441, "global_step": 213684, "epoch": 1271} {"train_loss": -11.763614654541016, "global_step": 213685, "epoch": 1271} {"train_loss": -11.490804672241211, "global_step": 213686, "epoch": 1271} {"train_loss": -11.416585922241211, "global_step": 213687, "epoch": 1271} {"train_loss": -11.275838851928711, "global_step": 213688, "epoch": 1271} {"train_loss": -11.565499305725098, "global_step": 213689, "epoch": 1271} {"train_loss": -11.271561622619629, "global_step": 213690, "epoch": 1271} {"train_loss": -11.434371948242188, "global_step": 213691, "epoch": 1271} {"train_loss": -11.574690818786621, "global_step": 213692, "epoch": 1271} {"train_loss": -11.006694793701172, "global_step": 213693, "epoch": 1271} {"train_loss": -11.418207168579102, "global_step": 213694, "epoch": 1271} {"train_loss": -11.40041096437545, "global_step": 213695, "epoch": 1271, "val_loss": 255246.484375} {"train_loss": -11.444067001342773, "global_step": 213696, "epoch": 1272} {"train_loss": -11.336546897888184, "global_step": 213697, "epoch": 1272} {"train_loss": -11.055204391479492, "global_step": 213698, "epoch": 1272} {"train_loss": -11.265869140625, "global_step": 213699, "epoch": 1272} {"train_loss": -10.759170532226562, "global_step": 213700, "epoch": 1272} {"train_loss": -11.490128517150879, "global_step": 213701, "epoch": 1272} {"train_loss": -10.748518943786621, "global_step": 213702, "epoch": 1272} {"train_loss": -11.252213478088379, "global_step": 213703, "epoch": 1272} {"train_loss": -10.806506156921387, "global_step": 213704, "epoch": 1272} {"train_loss": -11.165614128112793, "global_step": 213705, "epoch": 1272} {"train_loss": -11.21744155883789, "global_step": 213706, "epoch": 1272} {"train_loss": -11.61593246459961, "global_step": 213707, "epoch": 1272} {"train_loss": -11.086241722106934, "global_step": 213708, "epoch": 1272} {"train_loss": -11.778257369995117, "global_step": 213709, "epoch": 1272} {"train_loss": -10.774734497070312, "global_step": 213710, "epoch": 1272} {"train_loss": -11.639498710632324, "global_step": 213711, "epoch": 1272} {"train_loss": -10.543672561645508, "global_step": 213712, "epoch": 1272} {"train_loss": -10.806493759155273, "global_step": 213713, "epoch": 1272} {"train_loss": -11.21856689453125, "global_step": 213714, "epoch": 1272} {"train_loss": -11.037617683410645, "global_step": 213715, "epoch": 1272} {"train_loss": -10.380876541137695, "global_step": 213716, "epoch": 1272} {"train_loss": -11.346522331237793, "global_step": 213717, "epoch": 1272} {"train_loss": -10.87186050415039, "global_step": 213718, "epoch": 1272} {"train_loss": -10.33073902130127, "global_step": 213719, "epoch": 1272} {"train_loss": -10.963918685913086, "global_step": 213720, "epoch": 1272} {"train_loss": -10.585391998291016, "global_step": 213721, "epoch": 1272} {"train_loss": -10.42011833190918, "global_step": 213722, "epoch": 1272} {"train_loss": -10.526178359985352, "global_step": 213723, "epoch": 1272} {"train_loss": -10.89156436920166, "global_step": 213724, "epoch": 1272} {"train_loss": -10.792670249938965, "global_step": 213725, "epoch": 1272} {"train_loss": -11.133657455444336, "global_step": 213726, "epoch": 1272} {"train_loss": -10.90949821472168, "global_step": 213727, "epoch": 1272} {"train_loss": -11.187007904052734, "global_step": 213728, "epoch": 1272} {"train_loss": -11.034655570983887, "global_step": 213729, "epoch": 1272} {"train_loss": -11.070110321044922, "global_step": 213730, "epoch": 1272} {"train_loss": -11.352511405944824, "global_step": 213731, "epoch": 1272} {"train_loss": -10.891039848327637, "global_step": 213732, "epoch": 1272} {"train_loss": -11.405505180358887, "global_step": 213733, "epoch": 1272} {"train_loss": -11.26705265045166, "global_step": 213734, "epoch": 1272} {"train_loss": -11.364835739135742, "global_step": 213735, "epoch": 1272} {"train_loss": -11.390083312988281, "global_step": 213736, "epoch": 1272} {"train_loss": -11.4622220993042, "global_step": 213737, "epoch": 1272} {"train_loss": -11.463982582092285, "global_step": 213738, "epoch": 1272} {"train_loss": -11.353752136230469, "global_step": 213739, "epoch": 1272} {"train_loss": -11.164169311523438, "global_step": 213740, "epoch": 1272} {"train_loss": -11.721866607666016, "global_step": 213741, "epoch": 1272} {"train_loss": -11.26048469543457, "global_step": 213742, "epoch": 1272} {"train_loss": -11.444843292236328, "global_step": 213743, "epoch": 1272} {"train_loss": -11.481517791748047, "global_step": 213744, "epoch": 1272} {"train_loss": -11.456184387207031, "global_step": 213745, "epoch": 1272} {"train_loss": -11.44901180267334, "global_step": 213746, "epoch": 1272} {"train_loss": -11.416202545166016, "global_step": 213747, "epoch": 1272} {"train_loss": -11.341039657592773, "global_step": 213748, "epoch": 1272} {"train_loss": -11.596536636352539, "global_step": 213749, "epoch": 1272} {"train_loss": -11.586504936218262, "global_step": 213750, "epoch": 1272} {"train_loss": -11.70810317993164, "global_step": 213751, "epoch": 1272} {"train_loss": -11.530518531799316, "global_step": 213752, "epoch": 1272} {"train_loss": -11.846235275268555, "global_step": 213753, "epoch": 1272} {"train_loss": -11.467521667480469, "global_step": 213754, "epoch": 1272} {"train_loss": -11.544572830200195, "global_step": 213755, "epoch": 1272} {"train_loss": -11.52259349822998, "global_step": 213756, "epoch": 1272} {"train_loss": -11.752102851867676, "global_step": 213757, "epoch": 1272} {"train_loss": -11.776537895202637, "global_step": 213758, "epoch": 1272} {"train_loss": -11.717923164367676, "global_step": 213759, "epoch": 1272} {"train_loss": -11.777227401733398, "global_step": 213760, "epoch": 1272} {"train_loss": -11.59650707244873, "global_step": 213761, "epoch": 1272} {"train_loss": -11.729829788208008, "global_step": 213762, "epoch": 1272} {"train_loss": -11.549251556396484, "global_step": 213763, "epoch": 1272} {"train_loss": -11.718314170837402, "global_step": 213764, "epoch": 1272} {"train_loss": -11.671549797058105, "global_step": 213765, "epoch": 1272} {"train_loss": -11.772663116455078, "global_step": 213766, "epoch": 1272} {"train_loss": -11.741981506347656, "global_step": 213767, "epoch": 1272} {"train_loss": -11.877805709838867, "global_step": 213768, "epoch": 1272} {"train_loss": -11.708845138549805, "global_step": 213769, "epoch": 1272} {"train_loss": -11.908876419067383, "global_step": 213770, "epoch": 1272} {"train_loss": -11.593507766723633, "global_step": 213771, "epoch": 1272} {"train_loss": -12.006767272949219, "global_step": 213772, "epoch": 1272} {"train_loss": -11.90792465209961, "global_step": 213773, "epoch": 1272} {"train_loss": -11.846051216125488, "global_step": 213774, "epoch": 1272} {"train_loss": -11.997050285339355, "global_step": 213775, "epoch": 1272} {"train_loss": -11.838340759277344, "global_step": 213776, "epoch": 1272} {"train_loss": -11.755363464355469, "global_step": 213777, "epoch": 1272} {"train_loss": -11.930893898010254, "global_step": 213778, "epoch": 1272} {"train_loss": -11.558694839477539, "global_step": 213779, "epoch": 1272} {"train_loss": -11.712628364562988, "global_step": 213780, "epoch": 1272} {"train_loss": -11.898785591125488, "global_step": 213781, "epoch": 1272} {"train_loss": -11.807588577270508, "global_step": 213782, "epoch": 1272} {"train_loss": -11.697858810424805, "global_step": 213783, "epoch": 1272} {"train_loss": -11.902070045471191, "global_step": 213784, "epoch": 1272} {"train_loss": -11.689781188964844, "global_step": 213785, "epoch": 1272} {"train_loss": -11.018902778625488, "global_step": 213786, "epoch": 1272} {"train_loss": -11.495655059814453, "global_step": 213787, "epoch": 1272} {"train_loss": -11.768041610717773, "global_step": 213788, "epoch": 1272} {"train_loss": -10.465690612792969, "global_step": 213789, "epoch": 1272} {"train_loss": -10.559032440185547, "global_step": 213790, "epoch": 1272} {"train_loss": -11.720857620239258, "global_step": 213791, "epoch": 1272} {"train_loss": -11.296049118041992, "global_step": 213792, "epoch": 1272} {"train_loss": -10.648305892944336, "global_step": 213793, "epoch": 1272} {"train_loss": -10.560653686523438, "global_step": 213794, "epoch": 1272} {"train_loss": -11.729958534240723, "global_step": 213795, "epoch": 1272} {"train_loss": -11.020830154418945, "global_step": 213796, "epoch": 1272} {"train_loss": -10.951284408569336, "global_step": 213797, "epoch": 1272} {"train_loss": -10.698193550109863, "global_step": 213798, "epoch": 1272} {"train_loss": -10.65584945678711, "global_step": 213799, "epoch": 1272} {"train_loss": -10.694642066955566, "global_step": 213800, "epoch": 1272} {"train_loss": -10.357598304748535, "global_step": 213801, "epoch": 1272} {"train_loss": -10.175043106079102, "global_step": 213802, "epoch": 1272} {"train_loss": -10.094438552856445, "global_step": 213803, "epoch": 1272} {"train_loss": -9.996749877929688, "global_step": 213804, "epoch": 1272} {"train_loss": -10.317951202392578, "global_step": 213805, "epoch": 1272} {"train_loss": -9.947612762451172, "global_step": 213806, "epoch": 1272} {"train_loss": -8.911160469055176, "global_step": 213807, "epoch": 1272} {"train_loss": -9.30648136138916, "global_step": 213808, "epoch": 1272} {"train_loss": -11.016321182250977, "global_step": 213809, "epoch": 1272} {"train_loss": -9.790496826171875, "global_step": 213810, "epoch": 1272} {"train_loss": -9.855772018432617, "global_step": 213811, "epoch": 1272} {"train_loss": -10.707509994506836, "global_step": 213812, "epoch": 1272} {"train_loss": -9.159627914428711, "global_step": 213813, "epoch": 1272} {"train_loss": -10.772424697875977, "global_step": 213814, "epoch": 1272} {"train_loss": -10.001541137695312, "global_step": 213815, "epoch": 1272} {"train_loss": -10.046445846557617, "global_step": 213816, "epoch": 1272} {"train_loss": -10.945932388305664, "global_step": 213817, "epoch": 1272} {"train_loss": -10.044466018676758, "global_step": 213818, "epoch": 1272} {"train_loss": -10.530384063720703, "global_step": 213819, "epoch": 1272} {"train_loss": -10.949932098388672, "global_step": 213820, "epoch": 1272} {"train_loss": -10.299561500549316, "global_step": 213821, "epoch": 1272} {"train_loss": -10.618511199951172, "global_step": 213822, "epoch": 1272} {"train_loss": -10.525713920593262, "global_step": 213823, "epoch": 1272} {"train_loss": -10.484586715698242, "global_step": 213824, "epoch": 1272} {"train_loss": -10.898260116577148, "global_step": 213825, "epoch": 1272} {"train_loss": -10.612802505493164, "global_step": 213826, "epoch": 1272} {"train_loss": -11.252596855163574, "global_step": 213827, "epoch": 1272} {"train_loss": -10.55421257019043, "global_step": 213828, "epoch": 1272} {"train_loss": -10.8919677734375, "global_step": 213829, "epoch": 1272} {"train_loss": -10.864822387695312, "global_step": 213830, "epoch": 1272} {"train_loss": -11.203255653381348, "global_step": 213831, "epoch": 1272} {"train_loss": -10.76351547241211, "global_step": 213832, "epoch": 1272} {"train_loss": -10.807987213134766, "global_step": 213833, "epoch": 1272} {"train_loss": -11.103466033935547, "global_step": 213834, "epoch": 1272} {"train_loss": -10.475545883178711, "global_step": 213835, "epoch": 1272} {"train_loss": -11.051502227783203, "global_step": 213836, "epoch": 1272} {"train_loss": -10.290739059448242, "global_step": 213837, "epoch": 1272} {"train_loss": -11.100788116455078, "global_step": 213838, "epoch": 1272} {"train_loss": -10.2559232711792, "global_step": 213839, "epoch": 1272} {"train_loss": -10.516195297241211, "global_step": 213840, "epoch": 1272} {"train_loss": -11.045684814453125, "global_step": 213841, "epoch": 1272} {"train_loss": -10.258475303649902, "global_step": 213842, "epoch": 1272} {"train_loss": -11.218996047973633, "global_step": 213843, "epoch": 1272} {"train_loss": -9.975808143615723, "global_step": 213844, "epoch": 1272} {"train_loss": -11.132429122924805, "global_step": 213845, "epoch": 1272} {"train_loss": -10.827459335327148, "global_step": 213846, "epoch": 1272} {"train_loss": -10.644862174987793, "global_step": 213847, "epoch": 1272} {"train_loss": -11.069822311401367, "global_step": 213848, "epoch": 1272} {"train_loss": -10.764680862426758, "global_step": 213849, "epoch": 1272} {"train_loss": -11.179097175598145, "global_step": 213850, "epoch": 1272} {"train_loss": -10.84212875366211, "global_step": 213851, "epoch": 1272} {"train_loss": -11.120060920715332, "global_step": 213852, "epoch": 1272} {"train_loss": -11.137533187866211, "global_step": 213853, "epoch": 1272} {"train_loss": -11.173283576965332, "global_step": 213854, "epoch": 1272} {"train_loss": -11.185786247253418, "global_step": 213855, "epoch": 1272} {"train_loss": -11.089452743530273, "global_step": 213856, "epoch": 1272} {"train_loss": -11.187006950378418, "global_step": 213857, "epoch": 1272} {"train_loss": -11.23497200012207, "global_step": 213858, "epoch": 1272} {"train_loss": -11.110420227050781, "global_step": 213859, "epoch": 1272} {"train_loss": -11.50048828125, "global_step": 213860, "epoch": 1272} {"train_loss": -11.126840591430664, "global_step": 213861, "epoch": 1272} {"train_loss": -11.24988079071045, "global_step": 213862, "epoch": 1272} {"train_loss": -11.075365549042111, "global_step": 213863, "epoch": 1272, "val_loss": 256579.1875} {"train_loss": -11.244884490966797, "global_step": 213864, "epoch": 1273} {"train_loss": -11.489766120910645, "global_step": 213865, "epoch": 1273} {"train_loss": -11.433730125427246, "global_step": 213866, "epoch": 1273} {"train_loss": -11.428869247436523, "global_step": 213867, "epoch": 1273} {"train_loss": -11.658817291259766, "global_step": 213868, "epoch": 1273} {"train_loss": -11.554521560668945, "global_step": 213869, "epoch": 1273} {"train_loss": -11.695964813232422, "global_step": 213870, "epoch": 1273} {"train_loss": -11.565973281860352, "global_step": 213871, "epoch": 1273} {"train_loss": -11.537010192871094, "global_step": 213872, "epoch": 1273} {"train_loss": -11.659586906433105, "global_step": 213873, "epoch": 1273} {"train_loss": -11.57518482208252, "global_step": 213874, "epoch": 1273} {"train_loss": -11.667215347290039, "global_step": 213875, "epoch": 1273} {"train_loss": -11.628915786743164, "global_step": 213876, "epoch": 1273} {"train_loss": -11.622573852539062, "global_step": 213877, "epoch": 1273} {"train_loss": -11.760589599609375, "global_step": 213878, "epoch": 1273} {"train_loss": -11.866327285766602, "global_step": 213879, "epoch": 1273} {"train_loss": -11.580902099609375, "global_step": 213880, "epoch": 1273} {"train_loss": -11.641801834106445, "global_step": 213881, "epoch": 1273} {"train_loss": -11.911163330078125, "global_step": 213882, "epoch": 1273} {"train_loss": -11.608649253845215, "global_step": 213883, "epoch": 1273} {"train_loss": -11.867767333984375, "global_step": 213884, "epoch": 1273} {"train_loss": -11.733028411865234, "global_step": 213885, "epoch": 1273} {"train_loss": -11.887348175048828, "global_step": 213886, "epoch": 1273} {"train_loss": -11.799213409423828, "global_step": 213887, "epoch": 1273} {"train_loss": -11.671910285949707, "global_step": 213888, "epoch": 1273} {"train_loss": -11.858943939208984, "global_step": 213889, "epoch": 1273} {"train_loss": -11.897302627563477, "global_step": 213890, "epoch": 1273} {"train_loss": -11.805638313293457, "global_step": 213891, "epoch": 1273} {"train_loss": -11.918411254882812, "global_step": 213892, "epoch": 1273} {"train_loss": -11.75208854675293, "global_step": 213893, "epoch": 1273} {"train_loss": -11.859088897705078, "global_step": 213894, "epoch": 1273} {"train_loss": -11.972567558288574, "global_step": 213895, "epoch": 1273} {"train_loss": -11.956450462341309, "global_step": 213896, "epoch": 1273} {"train_loss": -12.015076637268066, "global_step": 213897, "epoch": 1273} {"train_loss": -12.036806106567383, "global_step": 213898, "epoch": 1273} {"train_loss": -11.95321273803711, "global_step": 213899, "epoch": 1273} {"train_loss": -11.949190139770508, "global_step": 213900, "epoch": 1273} {"train_loss": -11.93899917602539, "global_step": 213901, "epoch": 1273} {"train_loss": -11.742263793945312, "global_step": 213902, "epoch": 1273} {"train_loss": -11.96373462677002, "global_step": 213903, "epoch": 1273} {"train_loss": -12.228560447692871, "global_step": 213904, "epoch": 1273} {"train_loss": -12.019262313842773, "global_step": 213905, "epoch": 1273} {"train_loss": -11.887284278869629, "global_step": 213906, "epoch": 1273} {"train_loss": -12.046794891357422, "global_step": 213907, "epoch": 1273} {"train_loss": -12.110161781311035, "global_step": 213908, "epoch": 1273} {"train_loss": -11.608911514282227, "global_step": 213909, "epoch": 1273} {"train_loss": -11.820533752441406, "global_step": 213910, "epoch": 1273} {"train_loss": -12.021045684814453, "global_step": 213911, "epoch": 1273} {"train_loss": -11.954309463500977, "global_step": 213912, "epoch": 1273} {"train_loss": -11.878881454467773, "global_step": 213913, "epoch": 1273} {"train_loss": -11.582560539245605, "global_step": 213914, "epoch": 1273} {"train_loss": -11.848039627075195, "global_step": 213915, "epoch": 1273} {"train_loss": -11.911676406860352, "global_step": 213916, "epoch": 1273} {"train_loss": -11.928173065185547, "global_step": 213917, "epoch": 1273} {"train_loss": -11.871082305908203, "global_step": 213918, "epoch": 1273} {"train_loss": -11.714408874511719, "global_step": 213919, "epoch": 1273} {"train_loss": -11.705973625183105, "global_step": 213920, "epoch": 1273} {"train_loss": -11.945109367370605, "global_step": 213921, "epoch": 1273} {"train_loss": -11.88615894317627, "global_step": 213922, "epoch": 1273} {"train_loss": -11.562074661254883, "global_step": 213923, "epoch": 1273} {"train_loss": -11.133079528808594, "global_step": 213924, "epoch": 1273} {"train_loss": -11.454094886779785, "global_step": 213925, "epoch": 1273} {"train_loss": -11.44934368133545, "global_step": 213926, "epoch": 1273} {"train_loss": -10.636289596557617, "global_step": 213927, "epoch": 1273} {"train_loss": -10.185323715209961, "global_step": 213928, "epoch": 1273} {"train_loss": -11.554327011108398, "global_step": 213929, "epoch": 1273} {"train_loss": -10.85930061340332, "global_step": 213930, "epoch": 1273} {"train_loss": -10.574628829956055, "global_step": 213931, "epoch": 1273} {"train_loss": -11.357538223266602, "global_step": 213932, "epoch": 1273} {"train_loss": -11.001293182373047, "global_step": 213933, "epoch": 1273} {"train_loss": -9.721284866333008, "global_step": 213934, "epoch": 1273} {"train_loss": -10.689448356628418, "global_step": 213935, "epoch": 1273} {"train_loss": -9.864949226379395, "global_step": 213936, "epoch": 1273} {"train_loss": -9.614116668701172, "global_step": 213937, "epoch": 1273} {"train_loss": -9.865680694580078, "global_step": 213938, "epoch": 1273} {"train_loss": -10.062984466552734, "global_step": 213939, "epoch": 1273} {"train_loss": -9.92798137664795, "global_step": 213940, "epoch": 1273} {"train_loss": -10.57813835144043, "global_step": 213941, "epoch": 1273} {"train_loss": -9.710283279418945, "global_step": 213942, "epoch": 1273} {"train_loss": -9.917879104614258, "global_step": 213943, "epoch": 1273} {"train_loss": -9.925100326538086, "global_step": 213944, "epoch": 1273} {"train_loss": -9.4031343460083, "global_step": 213945, "epoch": 1273} {"train_loss": -10.329023361206055, "global_step": 213946, "epoch": 1273} {"train_loss": -10.39017105102539, "global_step": 213947, "epoch": 1273} {"train_loss": -10.12002182006836, "global_step": 213948, "epoch": 1273} {"train_loss": -10.799959182739258, "global_step": 213949, "epoch": 1273} {"train_loss": -10.559606552124023, "global_step": 213950, "epoch": 1273} {"train_loss": -10.583513259887695, "global_step": 213951, "epoch": 1273} {"train_loss": -10.815718650817871, "global_step": 213952, "epoch": 1273} {"train_loss": -10.646112442016602, "global_step": 213953, "epoch": 1273} {"train_loss": -10.758678436279297, "global_step": 213954, "epoch": 1273} {"train_loss": -11.00528335571289, "global_step": 213955, "epoch": 1273} {"train_loss": -11.187562942504883, "global_step": 213956, "epoch": 1273} {"train_loss": -11.33405876159668, "global_step": 213957, "epoch": 1273} {"train_loss": -11.05483341217041, "global_step": 213958, "epoch": 1273} {"train_loss": -11.254526138305664, "global_step": 213959, "epoch": 1273} {"train_loss": -11.10117244720459, "global_step": 213960, "epoch": 1273} {"train_loss": -10.819533348083496, "global_step": 213961, "epoch": 1273} {"train_loss": -11.237493515014648, "global_step": 213962, "epoch": 1273} {"train_loss": -11.172510147094727, "global_step": 213963, "epoch": 1273} {"train_loss": -11.141700744628906, "global_step": 213964, "epoch": 1273} {"train_loss": -11.258901596069336, "global_step": 213965, "epoch": 1273} {"train_loss": -11.310750961303711, "global_step": 213966, "epoch": 1273} {"train_loss": -11.28226375579834, "global_step": 213967, "epoch": 1273} {"train_loss": -11.42325210571289, "global_step": 213968, "epoch": 1273} {"train_loss": -11.281658172607422, "global_step": 213969, "epoch": 1273} {"train_loss": -11.30163288116455, "global_step": 213970, "epoch": 1273} {"train_loss": -11.361327171325684, "global_step": 213971, "epoch": 1273} {"train_loss": -11.468719482421875, "global_step": 213972, "epoch": 1273} {"train_loss": -11.415799140930176, "global_step": 213973, "epoch": 1273} {"train_loss": -11.407110214233398, "global_step": 213974, "epoch": 1273} {"train_loss": -11.215335845947266, "global_step": 213975, "epoch": 1273} {"train_loss": -11.457867622375488, "global_step": 213976, "epoch": 1273} {"train_loss": -11.246766090393066, "global_step": 213977, "epoch": 1273} {"train_loss": -11.400039672851562, "global_step": 213978, "epoch": 1273} {"train_loss": -11.40656852722168, "global_step": 213979, "epoch": 1273} {"train_loss": -11.60194206237793, "global_step": 213980, "epoch": 1273} {"train_loss": -11.514361381530762, "global_step": 213981, "epoch": 1273} {"train_loss": -11.382205963134766, "global_step": 213982, "epoch": 1273} {"train_loss": -11.373390197753906, "global_step": 213983, "epoch": 1273} {"train_loss": -11.568704605102539, "global_step": 213984, "epoch": 1273} {"train_loss": -11.392685890197754, "global_step": 213985, "epoch": 1273} {"train_loss": -11.692485809326172, "global_step": 213986, "epoch": 1273} {"train_loss": -11.610280990600586, "global_step": 213987, "epoch": 1273} {"train_loss": -11.640949249267578, "global_step": 213988, "epoch": 1273} {"train_loss": -11.622665405273438, "global_step": 213989, "epoch": 1273} {"train_loss": -11.500500679016113, "global_step": 213990, "epoch": 1273} {"train_loss": -11.500311851501465, "global_step": 213991, "epoch": 1273} {"train_loss": -11.633594512939453, "global_step": 213992, "epoch": 1273} {"train_loss": -11.491205215454102, "global_step": 213993, "epoch": 1273} {"train_loss": -11.639284133911133, "global_step": 213994, "epoch": 1273} {"train_loss": -11.52615737915039, "global_step": 213995, "epoch": 1273} {"train_loss": -11.781428337097168, "global_step": 213996, "epoch": 1273} {"train_loss": -11.699440002441406, "global_step": 213997, "epoch": 1273} {"train_loss": -11.559986114501953, "global_step": 213998, "epoch": 1273} {"train_loss": -11.843132019042969, "global_step": 213999, "epoch": 1273} {"train_loss": -11.539281845092773, "global_step": 214000, "epoch": 1273} {"train_loss": -11.742118835449219, "global_step": 214001, "epoch": 1273} {"train_loss": -11.645712852478027, "global_step": 214002, "epoch": 1273} {"train_loss": -11.808396339416504, "global_step": 214003, "epoch": 1273} {"train_loss": -11.73040771484375, "global_step": 214004, "epoch": 1273} {"train_loss": -11.870182991027832, "global_step": 214005, "epoch": 1273} {"train_loss": -11.854574203491211, "global_step": 214006, "epoch": 1273} {"train_loss": -11.925698280334473, "global_step": 214007, "epoch": 1273} {"train_loss": -11.870110511779785, "global_step": 214008, "epoch": 1273} {"train_loss": -11.887094497680664, "global_step": 214009, "epoch": 1273} {"train_loss": -11.559896469116211, "global_step": 214010, "epoch": 1273} {"train_loss": -11.934959411621094, "global_step": 214011, "epoch": 1273} {"train_loss": -11.769891738891602, "global_step": 214012, "epoch": 1273} {"train_loss": -11.732473373413086, "global_step": 214013, "epoch": 1273} {"train_loss": -11.691162109375, "global_step": 214014, "epoch": 1273} {"train_loss": -11.72379207611084, "global_step": 214015, "epoch": 1273} {"train_loss": -11.843881607055664, "global_step": 214016, "epoch": 1273} {"train_loss": -11.542179107666016, "global_step": 214017, "epoch": 1273} {"train_loss": -11.913040161132812, "global_step": 214018, "epoch": 1273} {"train_loss": -11.4263916015625, "global_step": 214019, "epoch": 1273} {"train_loss": -11.22474479675293, "global_step": 214020, "epoch": 1273} {"train_loss": -11.268314361572266, "global_step": 214021, "epoch": 1273} {"train_loss": -10.971884727478027, "global_step": 214022, "epoch": 1273} {"train_loss": -11.414712905883789, "global_step": 214023, "epoch": 1273} {"train_loss": -11.275498390197754, "global_step": 214024, "epoch": 1273} {"train_loss": -10.655860900878906, "global_step": 214025, "epoch": 1273} {"train_loss": -11.435218811035156, "global_step": 214026, "epoch": 1273} {"train_loss": -11.493867874145508, "global_step": 214027, "epoch": 1273} {"train_loss": -10.885956764221191, "global_step": 214028, "epoch": 1273} {"train_loss": -11.902783393859863, "global_step": 214029, "epoch": 1273} {"train_loss": -10.881776809692383, "global_step": 214030, "epoch": 1273} {"train_loss": -11.399231320335751, "global_step": 214031, "epoch": 1273, "val_loss": 255688.796875} {"train_loss": -11.308221817016602, "global_step": 214032, "epoch": 1274} {"train_loss": -11.758737564086914, "global_step": 214033, "epoch": 1274} {"train_loss": -11.300359725952148, "global_step": 214034, "epoch": 1274} {"train_loss": -11.613582611083984, "global_step": 214035, "epoch": 1274} {"train_loss": -11.759126663208008, "global_step": 214036, "epoch": 1274} {"train_loss": -11.702621459960938, "global_step": 214037, "epoch": 1274} {"train_loss": -11.530407905578613, "global_step": 214038, "epoch": 1274} {"train_loss": -11.92028522491455, "global_step": 214039, "epoch": 1274} {"train_loss": -11.65397834777832, "global_step": 214040, "epoch": 1274} {"train_loss": -11.343362808227539, "global_step": 214041, "epoch": 1274} {"train_loss": -11.786457061767578, "global_step": 214042, "epoch": 1274} {"train_loss": -11.783342361450195, "global_step": 214043, "epoch": 1274} {"train_loss": -11.815864562988281, "global_step": 214044, "epoch": 1274} {"train_loss": -11.821146965026855, "global_step": 214045, "epoch": 1274} {"train_loss": -11.845102310180664, "global_step": 214046, "epoch": 1274} {"train_loss": -11.822088241577148, "global_step": 214047, "epoch": 1274} {"train_loss": -11.810598373413086, "global_step": 214048, "epoch": 1274} {"train_loss": -11.687410354614258, "global_step": 214049, "epoch": 1274} {"train_loss": -11.539649963378906, "global_step": 214050, "epoch": 1274} {"train_loss": -11.774798393249512, "global_step": 214051, "epoch": 1274} {"train_loss": -11.387847900390625, "global_step": 214052, "epoch": 1274} {"train_loss": -11.555093765258789, "global_step": 214053, "epoch": 1274} {"train_loss": -11.557373046875, "global_step": 214054, "epoch": 1274} {"train_loss": -11.181967735290527, "global_step": 214055, "epoch": 1274} {"train_loss": -11.542515754699707, "global_step": 214056, "epoch": 1274} {"train_loss": -11.494779586791992, "global_step": 214057, "epoch": 1274} {"train_loss": -11.321390151977539, "global_step": 214058, "epoch": 1274} {"train_loss": -11.834857940673828, "global_step": 214059, "epoch": 1274} {"train_loss": -11.227005004882812, "global_step": 214060, "epoch": 1274} {"train_loss": -11.26701831817627, "global_step": 214061, "epoch": 1274} {"train_loss": -11.552319526672363, "global_step": 214062, "epoch": 1274} {"train_loss": -11.634608268737793, "global_step": 214063, "epoch": 1274} {"train_loss": -11.422645568847656, "global_step": 214064, "epoch": 1274} {"train_loss": -11.553439140319824, "global_step": 214065, "epoch": 1274} {"train_loss": -11.102533340454102, "global_step": 214066, "epoch": 1274} {"train_loss": -11.515478134155273, "global_step": 214067, "epoch": 1274} {"train_loss": -10.194134712219238, "global_step": 214068, "epoch": 1274} {"train_loss": -10.824901580810547, "global_step": 214069, "epoch": 1274} {"train_loss": -10.974032402038574, "global_step": 214070, "epoch": 1274} {"train_loss": -10.940563201904297, "global_step": 214071, "epoch": 1274} {"train_loss": -9.469522476196289, "global_step": 214072, "epoch": 1274} {"train_loss": -10.92315673828125, "global_step": 214073, "epoch": 1274} {"train_loss": -9.121379852294922, "global_step": 214074, "epoch": 1274} {"train_loss": -11.052184104919434, "global_step": 214075, "epoch": 1274} {"train_loss": -9.434581756591797, "global_step": 214076, "epoch": 1274} {"train_loss": -9.63734245300293, "global_step": 214077, "epoch": 1274} {"train_loss": -10.979475021362305, "global_step": 214078, "epoch": 1274} {"train_loss": -10.229608535766602, "global_step": 214079, "epoch": 1274} {"train_loss": -11.178481101989746, "global_step": 214080, "epoch": 1274} {"train_loss": -10.54117202758789, "global_step": 214081, "epoch": 1274} {"train_loss": -11.360126495361328, "global_step": 214082, "epoch": 1274} {"train_loss": -10.977409362792969, "global_step": 214083, "epoch": 1274} {"train_loss": -11.143228530883789, "global_step": 214084, "epoch": 1274} {"train_loss": -10.626002311706543, "global_step": 214085, "epoch": 1274} {"train_loss": -11.119353294372559, "global_step": 214086, "epoch": 1274} {"train_loss": -11.174727439880371, "global_step": 214087, "epoch": 1274} {"train_loss": -11.079607009887695, "global_step": 214088, "epoch": 1274} {"train_loss": -11.418305397033691, "global_step": 214089, "epoch": 1274} {"train_loss": -10.95486831665039, "global_step": 214090, "epoch": 1274} {"train_loss": -11.13243293762207, "global_step": 214091, "epoch": 1274} {"train_loss": -11.138507843017578, "global_step": 214092, "epoch": 1274} {"train_loss": -11.017818450927734, "global_step": 214093, "epoch": 1274} {"train_loss": -10.964877128601074, "global_step": 214094, "epoch": 1274} {"train_loss": -11.161142349243164, "global_step": 214095, "epoch": 1274} {"train_loss": -11.25448226928711, "global_step": 214096, "epoch": 1274} {"train_loss": -11.331686019897461, "global_step": 214097, "epoch": 1274} {"train_loss": -11.456787109375, "global_step": 214098, "epoch": 1274} {"train_loss": -11.633156776428223, "global_step": 214099, "epoch": 1274} {"train_loss": -11.37243938446045, "global_step": 214100, "epoch": 1274} {"train_loss": -11.581491470336914, "global_step": 214101, "epoch": 1274} {"train_loss": -11.576433181762695, "global_step": 214102, "epoch": 1274} {"train_loss": -11.416049003601074, "global_step": 214103, "epoch": 1274} {"train_loss": -11.526944160461426, "global_step": 214104, "epoch": 1274} {"train_loss": -11.6587495803833, "global_step": 214105, "epoch": 1274} {"train_loss": -11.332733154296875, "global_step": 214106, "epoch": 1274} {"train_loss": -11.52896785736084, "global_step": 214107, "epoch": 1274} {"train_loss": -11.570556640625, "global_step": 214108, "epoch": 1274} {"train_loss": -11.627762794494629, "global_step": 214109, "epoch": 1274} {"train_loss": -11.425541877746582, "global_step": 214110, "epoch": 1274} {"train_loss": -11.586748123168945, "global_step": 214111, "epoch": 1274} {"train_loss": -11.681283950805664, "global_step": 214112, "epoch": 1274} {"train_loss": -11.718616485595703, "global_step": 214113, "epoch": 1274} {"train_loss": -11.916024208068848, "global_step": 214114, "epoch": 1274} {"train_loss": -11.80678653717041, "global_step": 214115, "epoch": 1274} {"train_loss": -11.70022201538086, "global_step": 214116, "epoch": 1274} {"train_loss": -11.665519714355469, "global_step": 214117, "epoch": 1274} {"train_loss": -11.62847900390625, "global_step": 214118, "epoch": 1274} {"train_loss": -11.844243049621582, "global_step": 214119, "epoch": 1274} {"train_loss": -11.670854568481445, "global_step": 214120, "epoch": 1274} {"train_loss": -11.59973430633545, "global_step": 214121, "epoch": 1274} {"train_loss": -11.738815307617188, "global_step": 214122, "epoch": 1274} {"train_loss": -11.507869720458984, "global_step": 214123, "epoch": 1274} {"train_loss": -11.779836654663086, "global_step": 214124, "epoch": 1274} {"train_loss": -11.687723159790039, "global_step": 214125, "epoch": 1274} {"train_loss": -11.622797012329102, "global_step": 214126, "epoch": 1274} {"train_loss": -11.72714614868164, "global_step": 214127, "epoch": 1274} {"train_loss": -11.350824356079102, "global_step": 214128, "epoch": 1274} {"train_loss": -11.907369613647461, "global_step": 214129, "epoch": 1274} {"train_loss": -11.65185260772705, "global_step": 214130, "epoch": 1274} {"train_loss": -11.887956619262695, "global_step": 214131, "epoch": 1274} {"train_loss": -11.672639846801758, "global_step": 214132, "epoch": 1274} {"train_loss": -11.410243034362793, "global_step": 214133, "epoch": 1274} {"train_loss": -11.731218338012695, "global_step": 214134, "epoch": 1274} {"train_loss": -11.429300308227539, "global_step": 214135, "epoch": 1274} {"train_loss": -11.622734069824219, "global_step": 214136, "epoch": 1274} {"train_loss": -11.225425720214844, "global_step": 214137, "epoch": 1274} {"train_loss": -11.458269119262695, "global_step": 214138, "epoch": 1274} {"train_loss": -11.299728393554688, "global_step": 214139, "epoch": 1274} {"train_loss": -11.457277297973633, "global_step": 214140, "epoch": 1274} {"train_loss": -11.646329879760742, "global_step": 214141, "epoch": 1274} {"train_loss": -11.750997543334961, "global_step": 214142, "epoch": 1274} {"train_loss": -11.400264739990234, "global_step": 214143, "epoch": 1274} {"train_loss": -11.804264068603516, "global_step": 214144, "epoch": 1274} {"train_loss": -11.442752838134766, "global_step": 214145, "epoch": 1274} {"train_loss": -11.484722137451172, "global_step": 214146, "epoch": 1274} {"train_loss": -11.443135261535645, "global_step": 214147, "epoch": 1274} {"train_loss": -11.761844635009766, "global_step": 214148, "epoch": 1274} {"train_loss": -11.771783828735352, "global_step": 214149, "epoch": 1274} {"train_loss": -11.73944091796875, "global_step": 214150, "epoch": 1274} {"train_loss": -11.032955169677734, "global_step": 214151, "epoch": 1274} {"train_loss": -11.727324485778809, "global_step": 214152, "epoch": 1274} {"train_loss": -11.522180557250977, "global_step": 214153, "epoch": 1274} {"train_loss": -11.633544921875, "global_step": 214154, "epoch": 1274} {"train_loss": -11.398210525512695, "global_step": 214155, "epoch": 1274} {"train_loss": -11.845187187194824, "global_step": 214156, "epoch": 1274} {"train_loss": -11.436570167541504, "global_step": 214157, "epoch": 1274} {"train_loss": -11.464285850524902, "global_step": 214158, "epoch": 1274} {"train_loss": -11.56450366973877, "global_step": 214159, "epoch": 1274} {"train_loss": -11.697210311889648, "global_step": 214160, "epoch": 1274} {"train_loss": -11.284639358520508, "global_step": 214161, "epoch": 1274} {"train_loss": -10.523273468017578, "global_step": 214162, "epoch": 1274} {"train_loss": -10.9202880859375, "global_step": 214163, "epoch": 1274} {"train_loss": -11.571104049682617, "global_step": 214164, "epoch": 1274} {"train_loss": -11.672185897827148, "global_step": 214165, "epoch": 1274} {"train_loss": -11.656820297241211, "global_step": 214166, "epoch": 1274} {"train_loss": -11.65029525756836, "global_step": 214167, "epoch": 1274} {"train_loss": -11.34314250946045, "global_step": 214168, "epoch": 1274} {"train_loss": -11.351604461669922, "global_step": 214169, "epoch": 1274} {"train_loss": -11.674327850341797, "global_step": 214170, "epoch": 1274} {"train_loss": -11.419727325439453, "global_step": 214171, "epoch": 1274} {"train_loss": -10.656754493713379, "global_step": 214172, "epoch": 1274} {"train_loss": -10.747016906738281, "global_step": 214173, "epoch": 1274} {"train_loss": -11.696918487548828, "global_step": 214174, "epoch": 1274} {"train_loss": -11.015233993530273, "global_step": 214175, "epoch": 1274} {"train_loss": -11.276914596557617, "global_step": 214176, "epoch": 1274} {"train_loss": -11.56876277923584, "global_step": 214177, "epoch": 1274} {"train_loss": -11.282403945922852, "global_step": 214178, "epoch": 1274} {"train_loss": -11.41301441192627, "global_step": 214179, "epoch": 1274} {"train_loss": -11.19713020324707, "global_step": 214180, "epoch": 1274} {"train_loss": -11.27174186706543, "global_step": 214181, "epoch": 1274} {"train_loss": -11.771648406982422, "global_step": 214182, "epoch": 1274} {"train_loss": -11.342058181762695, "global_step": 214183, "epoch": 1274} {"train_loss": -11.77468490600586, "global_step": 214184, "epoch": 1274} {"train_loss": -11.257121086120605, "global_step": 214185, "epoch": 1274} {"train_loss": -11.492472648620605, "global_step": 214186, "epoch": 1274} {"train_loss": -11.391308784484863, "global_step": 214187, "epoch": 1274} {"train_loss": -10.455653190612793, "global_step": 214188, "epoch": 1274} {"train_loss": -11.790172576904297, "global_step": 214189, "epoch": 1274} {"train_loss": -11.009289741516113, "global_step": 214190, "epoch": 1274} {"train_loss": -10.956174850463867, "global_step": 214191, "epoch": 1274} {"train_loss": -11.670050621032715, "global_step": 214192, "epoch": 1274} {"train_loss": -11.123823165893555, "global_step": 214193, "epoch": 1274} {"train_loss": -11.351285934448242, "global_step": 214194, "epoch": 1274} {"train_loss": -10.571734428405762, "global_step": 214195, "epoch": 1274} {"train_loss": -11.317228317260742, "global_step": 214196, "epoch": 1274} {"train_loss": -11.394001007080078, "global_step": 214197, "epoch": 1274} {"train_loss": -11.045988082885742, "global_step": 214198, "epoch": 1274} {"train_loss": -11.37561932064238, "global_step": 214199, "epoch": 1274, "val_loss": 259420.4375} {"train_loss": -10.89363956451416, "global_step": 214200, "epoch": 1275} {"train_loss": -11.764324188232422, "global_step": 214201, "epoch": 1275} {"train_loss": -10.920625686645508, "global_step": 214202, "epoch": 1275} {"train_loss": -11.710786819458008, "global_step": 214203, "epoch": 1275} {"train_loss": -11.037313461303711, "global_step": 214204, "epoch": 1275} {"train_loss": -11.513784408569336, "global_step": 214205, "epoch": 1275} {"train_loss": -11.496175765991211, "global_step": 214206, "epoch": 1275} {"train_loss": -11.438159942626953, "global_step": 214207, "epoch": 1275} {"train_loss": -11.483784675598145, "global_step": 214208, "epoch": 1275} {"train_loss": -10.998406410217285, "global_step": 214209, "epoch": 1275} {"train_loss": -11.495445251464844, "global_step": 214210, "epoch": 1275} {"train_loss": -11.199419021606445, "global_step": 214211, "epoch": 1275} {"train_loss": -11.309287071228027, "global_step": 214212, "epoch": 1275} {"train_loss": -11.35251522064209, "global_step": 214213, "epoch": 1275} {"train_loss": -11.108396530151367, "global_step": 214214, "epoch": 1275} {"train_loss": -11.401708602905273, "global_step": 214215, "epoch": 1275} {"train_loss": -11.395475387573242, "global_step": 214216, "epoch": 1275} {"train_loss": -11.232437133789062, "global_step": 214217, "epoch": 1275} {"train_loss": -10.731815338134766, "global_step": 214218, "epoch": 1275} {"train_loss": -10.9256591796875, "global_step": 214219, "epoch": 1275} {"train_loss": -11.12814998626709, "global_step": 214220, "epoch": 1275} {"train_loss": -11.07016372680664, "global_step": 214221, "epoch": 1275} {"train_loss": -10.88579273223877, "global_step": 214222, "epoch": 1275} {"train_loss": -10.380104064941406, "global_step": 214223, "epoch": 1275} {"train_loss": -11.283090591430664, "global_step": 214224, "epoch": 1275} {"train_loss": -10.216486930847168, "global_step": 214225, "epoch": 1275} {"train_loss": -10.53317642211914, "global_step": 214226, "epoch": 1275} {"train_loss": -10.871541023254395, "global_step": 214227, "epoch": 1275} {"train_loss": -10.795941352844238, "global_step": 214228, "epoch": 1275} {"train_loss": -11.208740234375, "global_step": 214229, "epoch": 1275} {"train_loss": -10.687701225280762, "global_step": 214230, "epoch": 1275} {"train_loss": -10.556757926940918, "global_step": 214231, "epoch": 1275} {"train_loss": -10.952180862426758, "global_step": 214232, "epoch": 1275} {"train_loss": -11.189339637756348, "global_step": 214233, "epoch": 1275} {"train_loss": -10.334273338317871, "global_step": 214234, "epoch": 1275} {"train_loss": -10.807992935180664, "global_step": 214235, "epoch": 1275} {"train_loss": -10.752798080444336, "global_step": 214236, "epoch": 1275} {"train_loss": -10.917051315307617, "global_step": 214237, "epoch": 1275} {"train_loss": -10.757185935974121, "global_step": 214238, "epoch": 1275} {"train_loss": -10.705389022827148, "global_step": 214239, "epoch": 1275} {"train_loss": -11.108851432800293, "global_step": 214240, "epoch": 1275} {"train_loss": -10.864530563354492, "global_step": 214241, "epoch": 1275} {"train_loss": -10.688131332397461, "global_step": 214242, "epoch": 1275} {"train_loss": -11.401128768920898, "global_step": 214243, "epoch": 1275} {"train_loss": -10.518594741821289, "global_step": 214244, "epoch": 1275} {"train_loss": -11.098485946655273, "global_step": 214245, "epoch": 1275} {"train_loss": -11.085052490234375, "global_step": 214246, "epoch": 1275} {"train_loss": -10.88871955871582, "global_step": 214247, "epoch": 1275} {"train_loss": -11.524349212646484, "global_step": 214248, "epoch": 1275} {"train_loss": -11.279670715332031, "global_step": 214249, "epoch": 1275} {"train_loss": -10.736946105957031, "global_step": 214250, "epoch": 1275} {"train_loss": -11.258808135986328, "global_step": 214251, "epoch": 1275} {"train_loss": -10.899299621582031, "global_step": 214252, "epoch": 1275} {"train_loss": -11.100068092346191, "global_step": 214253, "epoch": 1275} {"train_loss": -11.318145751953125, "global_step": 214254, "epoch": 1275} {"train_loss": -10.936908721923828, "global_step": 214255, "epoch": 1275} {"train_loss": -11.054235458374023, "global_step": 214256, "epoch": 1275} {"train_loss": -11.016702651977539, "global_step": 214257, "epoch": 1275} {"train_loss": -11.07443618774414, "global_step": 214258, "epoch": 1275} {"train_loss": -11.245262145996094, "global_step": 214259, "epoch": 1275} {"train_loss": -11.196667671203613, "global_step": 214260, "epoch": 1275} {"train_loss": -11.373071670532227, "global_step": 214261, "epoch": 1275} {"train_loss": -11.252555847167969, "global_step": 214262, "epoch": 1275} {"train_loss": -11.46629524230957, "global_step": 214263, "epoch": 1275} {"train_loss": -11.395215034484863, "global_step": 214264, "epoch": 1275} {"train_loss": -11.5070219039917, "global_step": 214265, "epoch": 1275} {"train_loss": -11.518539428710938, "global_step": 214266, "epoch": 1275} {"train_loss": -11.53715705871582, "global_step": 214267, "epoch": 1275} {"train_loss": -11.32697868347168, "global_step": 214268, "epoch": 1275} {"train_loss": -11.530672073364258, "global_step": 214269, "epoch": 1275} {"train_loss": -11.59119987487793, "global_step": 214270, "epoch": 1275} {"train_loss": -11.537484169006348, "global_step": 214271, "epoch": 1275} {"train_loss": -11.700347900390625, "global_step": 214272, "epoch": 1275} {"train_loss": -11.655889511108398, "global_step": 214273, "epoch": 1275} {"train_loss": -11.464088439941406, "global_step": 214274, "epoch": 1275} {"train_loss": -11.658886909484863, "global_step": 214275, "epoch": 1275} {"train_loss": -11.713848114013672, "global_step": 214276, "epoch": 1275} {"train_loss": -11.702434539794922, "global_step": 214277, "epoch": 1275} {"train_loss": -11.597576141357422, "global_step": 214278, "epoch": 1275} {"train_loss": -11.616135597229004, "global_step": 214279, "epoch": 1275} {"train_loss": -11.594710350036621, "global_step": 214280, "epoch": 1275} {"train_loss": -11.693567276000977, "global_step": 214281, "epoch": 1275} {"train_loss": -11.369037628173828, "global_step": 214282, "epoch": 1275} {"train_loss": -11.787528991699219, "global_step": 214283, "epoch": 1275} {"train_loss": -11.560192108154297, "global_step": 214284, "epoch": 1275} {"train_loss": -11.767534255981445, "global_step": 214285, "epoch": 1275} {"train_loss": -11.6914644241333, "global_step": 214286, "epoch": 1275} {"train_loss": -11.575108528137207, "global_step": 214287, "epoch": 1275} {"train_loss": -11.851366996765137, "global_step": 214288, "epoch": 1275} {"train_loss": -11.500123977661133, "global_step": 214289, "epoch": 1275} {"train_loss": -11.850642204284668, "global_step": 214290, "epoch": 1275} {"train_loss": -11.660418510437012, "global_step": 214291, "epoch": 1275} {"train_loss": -11.748586654663086, "global_step": 214292, "epoch": 1275} {"train_loss": -11.687911033630371, "global_step": 214293, "epoch": 1275} {"train_loss": -11.714845657348633, "global_step": 214294, "epoch": 1275} {"train_loss": -11.732532501220703, "global_step": 214295, "epoch": 1275} {"train_loss": -11.457722663879395, "global_step": 214296, "epoch": 1275} {"train_loss": -11.873823165893555, "global_step": 214297, "epoch": 1275} {"train_loss": -11.598834037780762, "global_step": 214298, "epoch": 1275} {"train_loss": -11.443300247192383, "global_step": 214299, "epoch": 1275} {"train_loss": -11.912149429321289, "global_step": 214300, "epoch": 1275} {"train_loss": -11.303699493408203, "global_step": 214301, "epoch": 1275} {"train_loss": -11.708788871765137, "global_step": 214302, "epoch": 1275} {"train_loss": -11.673184394836426, "global_step": 214303, "epoch": 1275} {"train_loss": -11.236623764038086, "global_step": 214304, "epoch": 1275} {"train_loss": -11.844703674316406, "global_step": 214305, "epoch": 1275} {"train_loss": -11.512043952941895, "global_step": 214306, "epoch": 1275} {"train_loss": -11.200453758239746, "global_step": 214307, "epoch": 1275} {"train_loss": -11.536236763000488, "global_step": 214308, "epoch": 1275} {"train_loss": -11.625152587890625, "global_step": 214309, "epoch": 1275} {"train_loss": -11.095757484436035, "global_step": 214310, "epoch": 1275} {"train_loss": -11.412910461425781, "global_step": 214311, "epoch": 1275} {"train_loss": -11.449243545532227, "global_step": 214312, "epoch": 1275} {"train_loss": -11.271295547485352, "global_step": 214313, "epoch": 1275} {"train_loss": -12.038042068481445, "global_step": 214314, "epoch": 1275} {"train_loss": -11.779820442199707, "global_step": 214315, "epoch": 1275} {"train_loss": -11.421377182006836, "global_step": 214316, "epoch": 1275} {"train_loss": -11.75822639465332, "global_step": 214317, "epoch": 1275} {"train_loss": -11.492730140686035, "global_step": 214318, "epoch": 1275} {"train_loss": -11.145193099975586, "global_step": 214319, "epoch": 1275} {"train_loss": -11.485937118530273, "global_step": 214320, "epoch": 1275} {"train_loss": -10.832180976867676, "global_step": 214321, "epoch": 1275} {"train_loss": -11.18921184539795, "global_step": 214322, "epoch": 1275} {"train_loss": -11.383728981018066, "global_step": 214323, "epoch": 1275} {"train_loss": -11.243955612182617, "global_step": 214324, "epoch": 1275} {"train_loss": -11.204299926757812, "global_step": 214325, "epoch": 1275} {"train_loss": -10.989156723022461, "global_step": 214326, "epoch": 1275} {"train_loss": -10.99610710144043, "global_step": 214327, "epoch": 1275} {"train_loss": -11.45654010772705, "global_step": 214328, "epoch": 1275} {"train_loss": -10.589334487915039, "global_step": 214329, "epoch": 1275} {"train_loss": -11.545324325561523, "global_step": 214330, "epoch": 1275} {"train_loss": -11.075348854064941, "global_step": 214331, "epoch": 1275} {"train_loss": -11.707895278930664, "global_step": 214332, "epoch": 1275} {"train_loss": -11.27025318145752, "global_step": 214333, "epoch": 1275} {"train_loss": -11.233959197998047, "global_step": 214334, "epoch": 1275} {"train_loss": -11.252670288085938, "global_step": 214335, "epoch": 1275} {"train_loss": -11.366475105285645, "global_step": 214336, "epoch": 1275} {"train_loss": -11.03175163269043, "global_step": 214337, "epoch": 1275} {"train_loss": -11.642692565917969, "global_step": 214338, "epoch": 1275} {"train_loss": -11.30929183959961, "global_step": 214339, "epoch": 1275} {"train_loss": -11.277582168579102, "global_step": 214340, "epoch": 1275} {"train_loss": -11.394761085510254, "global_step": 214341, "epoch": 1275} {"train_loss": -11.535951614379883, "global_step": 214342, "epoch": 1275} {"train_loss": -11.830606460571289, "global_step": 214343, "epoch": 1275} {"train_loss": -11.492514610290527, "global_step": 214344, "epoch": 1275} {"train_loss": -11.658614158630371, "global_step": 214345, "epoch": 1275} {"train_loss": -11.471029281616211, "global_step": 214346, "epoch": 1275} {"train_loss": -11.296354293823242, "global_step": 214347, "epoch": 1275} {"train_loss": -11.86803913116455, "global_step": 214348, "epoch": 1275} {"train_loss": -11.313203811645508, "global_step": 214349, "epoch": 1275} {"train_loss": -11.543181419372559, "global_step": 214350, "epoch": 1275} {"train_loss": -11.577801704406738, "global_step": 214351, "epoch": 1275} {"train_loss": -11.740152359008789, "global_step": 214352, "epoch": 1275} {"train_loss": -11.466426849365234, "global_step": 214353, "epoch": 1275} {"train_loss": -11.884847640991211, "global_step": 214354, "epoch": 1275} {"train_loss": -11.561279296875, "global_step": 214355, "epoch": 1275} {"train_loss": -11.714524269104004, "global_step": 214356, "epoch": 1275} {"train_loss": -11.715865135192871, "global_step": 214357, "epoch": 1275} {"train_loss": -11.72187614440918, "global_step": 214358, "epoch": 1275} {"train_loss": -11.731785774230957, "global_step": 214359, "epoch": 1275} {"train_loss": -11.563228607177734, "global_step": 214360, "epoch": 1275} {"train_loss": -11.549264907836914, "global_step": 214361, "epoch": 1275} {"train_loss": -11.835634231567383, "global_step": 214362, "epoch": 1275} {"train_loss": -11.762027740478516, "global_step": 214363, "epoch": 1275} {"train_loss": -11.77613639831543, "global_step": 214364, "epoch": 1275} {"train_loss": -11.179282188415527, "global_step": 214365, "epoch": 1275} {"train_loss": -11.273698806762695, "global_step": 214366, "epoch": 1275} {"train_loss": -11.342633292788552, "global_step": 214367, "epoch": 1275, "val_loss": 257289.6875, "train_action_mse_error": 1.394766092300415} {"train_loss": -11.75660228729248, "global_step": 214368, "epoch": 1276} {"train_loss": -11.785534858703613, "global_step": 214369, "epoch": 1276} {"train_loss": -11.496954917907715, "global_step": 214370, "epoch": 1276} {"train_loss": -12.059288024902344, "global_step": 214371, "epoch": 1276} {"train_loss": -11.88629150390625, "global_step": 214372, "epoch": 1276} {"train_loss": -11.772937774658203, "global_step": 214373, "epoch": 1276} {"train_loss": -11.489151000976562, "global_step": 214374, "epoch": 1276} {"train_loss": -11.141371726989746, "global_step": 214375, "epoch": 1276} {"train_loss": -11.896062850952148, "global_step": 214376, "epoch": 1276} {"train_loss": -11.745927810668945, "global_step": 214377, "epoch": 1276} {"train_loss": -11.55412483215332, "global_step": 214378, "epoch": 1276} {"train_loss": -11.733078956604004, "global_step": 214379, "epoch": 1276} {"train_loss": -11.762861251831055, "global_step": 214380, "epoch": 1276} {"train_loss": -11.485243797302246, "global_step": 214381, "epoch": 1276} {"train_loss": -11.914299964904785, "global_step": 214382, "epoch": 1276} {"train_loss": -11.380260467529297, "global_step": 214383, "epoch": 1276} {"train_loss": -11.617713928222656, "global_step": 214384, "epoch": 1276} {"train_loss": -11.444875717163086, "global_step": 214385, "epoch": 1276} {"train_loss": -11.436724662780762, "global_step": 214386, "epoch": 1276} {"train_loss": -11.322771072387695, "global_step": 214387, "epoch": 1276} {"train_loss": -11.88276195526123, "global_step": 214388, "epoch": 1276} {"train_loss": -11.286209106445312, "global_step": 214389, "epoch": 1276} {"train_loss": -10.839855194091797, "global_step": 214390, "epoch": 1276} {"train_loss": -11.780160903930664, "global_step": 214391, "epoch": 1276} {"train_loss": -10.214679718017578, "global_step": 214392, "epoch": 1276} {"train_loss": -10.701961517333984, "global_step": 214393, "epoch": 1276} {"train_loss": -11.332134246826172, "global_step": 214394, "epoch": 1276} {"train_loss": -9.359217643737793, "global_step": 214395, "epoch": 1276} {"train_loss": -11.534832954406738, "global_step": 214396, "epoch": 1276} {"train_loss": -10.278611183166504, "global_step": 214397, "epoch": 1276} {"train_loss": -9.19982624053955, "global_step": 214398, "epoch": 1276} {"train_loss": -11.007479667663574, "global_step": 214399, "epoch": 1276} {"train_loss": -9.236127853393555, "global_step": 214400, "epoch": 1276} {"train_loss": -9.042608261108398, "global_step": 214401, "epoch": 1276} {"train_loss": -11.716069221496582, "global_step": 214402, "epoch": 1276} {"train_loss": -9.992256164550781, "global_step": 214403, "epoch": 1276} {"train_loss": -11.030539512634277, "global_step": 214404, "epoch": 1276} {"train_loss": -11.208714485168457, "global_step": 214405, "epoch": 1276} {"train_loss": -10.981611251831055, "global_step": 214406, "epoch": 1276} {"train_loss": -11.334013938903809, "global_step": 214407, "epoch": 1276} {"train_loss": -10.808187484741211, "global_step": 214408, "epoch": 1276} {"train_loss": -10.514825820922852, "global_step": 214409, "epoch": 1276} {"train_loss": -10.730472564697266, "global_step": 214410, "epoch": 1276} {"train_loss": -10.579462051391602, "global_step": 214411, "epoch": 1276} {"train_loss": -10.736824989318848, "global_step": 214412, "epoch": 1276} {"train_loss": -10.349763870239258, "global_step": 214413, "epoch": 1276} {"train_loss": -10.57374095916748, "global_step": 214414, "epoch": 1276} {"train_loss": -10.680074691772461, "global_step": 214415, "epoch": 1276} {"train_loss": -10.346521377563477, "global_step": 214416, "epoch": 1276} {"train_loss": -10.58264446258545, "global_step": 214417, "epoch": 1276} {"train_loss": -10.856521606445312, "global_step": 214418, "epoch": 1276} {"train_loss": -10.597172737121582, "global_step": 214419, "epoch": 1276} {"train_loss": -10.714345932006836, "global_step": 214420, "epoch": 1276} {"train_loss": -10.671416282653809, "global_step": 214421, "epoch": 1276} {"train_loss": -10.167866706848145, "global_step": 214422, "epoch": 1276} {"train_loss": -11.350265502929688, "global_step": 214423, "epoch": 1276} {"train_loss": -10.529810905456543, "global_step": 214424, "epoch": 1276} {"train_loss": -10.831787109375, "global_step": 214425, "epoch": 1276} {"train_loss": -10.467794418334961, "global_step": 214426, "epoch": 1276} {"train_loss": -10.470247268676758, "global_step": 214427, "epoch": 1276} {"train_loss": -10.384299278259277, "global_step": 214428, "epoch": 1276} {"train_loss": -10.50393295288086, "global_step": 214429, "epoch": 1276} {"train_loss": -10.803659439086914, "global_step": 214430, "epoch": 1276} {"train_loss": -10.162833213806152, "global_step": 214431, "epoch": 1276} {"train_loss": -10.099151611328125, "global_step": 214432, "epoch": 1276} {"train_loss": -11.042367935180664, "global_step": 214433, "epoch": 1276} {"train_loss": -10.478784561157227, "global_step": 214434, "epoch": 1276} {"train_loss": -10.634618759155273, "global_step": 214435, "epoch": 1276} {"train_loss": -10.802534103393555, "global_step": 214436, "epoch": 1276} {"train_loss": -11.054131507873535, "global_step": 214437, "epoch": 1276} {"train_loss": -11.04888916015625, "global_step": 214438, "epoch": 1276} {"train_loss": -10.971526145935059, "global_step": 214439, "epoch": 1276} {"train_loss": -11.320775032043457, "global_step": 214440, "epoch": 1276} {"train_loss": -11.236690521240234, "global_step": 214441, "epoch": 1276} {"train_loss": -11.066596984863281, "global_step": 214442, "epoch": 1276} {"train_loss": -11.29802417755127, "global_step": 214443, "epoch": 1276} {"train_loss": -11.108945846557617, "global_step": 214444, "epoch": 1276} {"train_loss": -11.301762580871582, "global_step": 214445, "epoch": 1276} {"train_loss": -11.295312881469727, "global_step": 214446, "epoch": 1276} {"train_loss": -11.369511604309082, "global_step": 214447, "epoch": 1276} {"train_loss": -11.259376525878906, "global_step": 214448, "epoch": 1276} {"train_loss": -11.314168930053711, "global_step": 214449, "epoch": 1276} {"train_loss": -11.418441772460938, "global_step": 214450, "epoch": 1276} {"train_loss": -11.267415046691895, "global_step": 214451, "epoch": 1276} {"train_loss": -11.35662841796875, "global_step": 214452, "epoch": 1276} {"train_loss": -11.495941162109375, "global_step": 214453, "epoch": 1276} {"train_loss": -11.425294876098633, "global_step": 214454, "epoch": 1276} {"train_loss": -11.580720901489258, "global_step": 214455, "epoch": 1276} {"train_loss": -11.394262313842773, "global_step": 214456, "epoch": 1276} {"train_loss": -11.500129699707031, "global_step": 214457, "epoch": 1276} {"train_loss": -11.592964172363281, "global_step": 214458, "epoch": 1276} {"train_loss": -11.491663932800293, "global_step": 214459, "epoch": 1276} {"train_loss": -11.686330795288086, "global_step": 214460, "epoch": 1276} {"train_loss": -11.60640811920166, "global_step": 214461, "epoch": 1276} {"train_loss": -11.57696533203125, "global_step": 214462, "epoch": 1276} {"train_loss": -11.622265815734863, "global_step": 214463, "epoch": 1276} {"train_loss": -11.537520408630371, "global_step": 214464, "epoch": 1276} {"train_loss": -11.606725692749023, "global_step": 214465, "epoch": 1276} {"train_loss": -11.359230041503906, "global_step": 214466, "epoch": 1276} {"train_loss": -11.694912910461426, "global_step": 214467, "epoch": 1276} {"train_loss": -11.678292274475098, "global_step": 214468, "epoch": 1276} {"train_loss": -11.675448417663574, "global_step": 214469, "epoch": 1276} {"train_loss": -11.545856475830078, "global_step": 214470, "epoch": 1276} {"train_loss": -11.556821823120117, "global_step": 214471, "epoch": 1276} {"train_loss": -11.669733047485352, "global_step": 214472, "epoch": 1276} {"train_loss": -11.509334564208984, "global_step": 214473, "epoch": 1276} {"train_loss": -11.687294006347656, "global_step": 214474, "epoch": 1276} {"train_loss": -11.77041244506836, "global_step": 214475, "epoch": 1276} {"train_loss": -11.78248119354248, "global_step": 214476, "epoch": 1276} {"train_loss": -11.717172622680664, "global_step": 214477, "epoch": 1276} {"train_loss": -11.8643217086792, "global_step": 214478, "epoch": 1276} {"train_loss": -11.563652038574219, "global_step": 214479, "epoch": 1276} {"train_loss": -11.688716888427734, "global_step": 214480, "epoch": 1276} {"train_loss": -11.784521102905273, "global_step": 214481, "epoch": 1276} {"train_loss": -11.465442657470703, "global_step": 214482, "epoch": 1276} {"train_loss": -11.845074653625488, "global_step": 214483, "epoch": 1276} {"train_loss": -11.429207801818848, "global_step": 214484, "epoch": 1276} {"train_loss": -11.502821922302246, "global_step": 214485, "epoch": 1276} {"train_loss": -11.841317176818848, "global_step": 214486, "epoch": 1276} {"train_loss": -11.867420196533203, "global_step": 214487, "epoch": 1276} {"train_loss": -11.768186569213867, "global_step": 214488, "epoch": 1276} {"train_loss": -11.654134750366211, "global_step": 214489, "epoch": 1276} {"train_loss": -11.512224197387695, "global_step": 214490, "epoch": 1276} {"train_loss": -11.62000846862793, "global_step": 214491, "epoch": 1276} {"train_loss": -11.620768547058105, "global_step": 214492, "epoch": 1276} {"train_loss": -11.721671104431152, "global_step": 214493, "epoch": 1276} {"train_loss": -11.650001525878906, "global_step": 214494, "epoch": 1276} {"train_loss": -11.948448181152344, "global_step": 214495, "epoch": 1276} {"train_loss": -11.593782424926758, "global_step": 214496, "epoch": 1276} {"train_loss": -11.866899490356445, "global_step": 214497, "epoch": 1276} {"train_loss": -11.889886856079102, "global_step": 214498, "epoch": 1276} {"train_loss": -11.653334617614746, "global_step": 214499, "epoch": 1276} {"train_loss": -11.72276496887207, "global_step": 214500, "epoch": 1276} {"train_loss": -11.954614639282227, "global_step": 214501, "epoch": 1276} {"train_loss": -11.264299392700195, "global_step": 214502, "epoch": 1276} {"train_loss": -10.404520034790039, "global_step": 214503, "epoch": 1276} {"train_loss": -11.491168022155762, "global_step": 214504, "epoch": 1276} {"train_loss": -10.928918838500977, "global_step": 214505, "epoch": 1276} {"train_loss": -11.3363037109375, "global_step": 214506, "epoch": 1276} {"train_loss": -10.393869400024414, "global_step": 214507, "epoch": 1276} {"train_loss": -10.447537422180176, "global_step": 214508, "epoch": 1276} {"train_loss": -10.109831809997559, "global_step": 214509, "epoch": 1276} {"train_loss": -10.68740463256836, "global_step": 214510, "epoch": 1276} {"train_loss": -10.34238052368164, "global_step": 214511, "epoch": 1276} {"train_loss": -10.629340171813965, "global_step": 214512, "epoch": 1276} {"train_loss": -10.824080467224121, "global_step": 214513, "epoch": 1276} {"train_loss": -11.583929061889648, "global_step": 214514, "epoch": 1276} {"train_loss": -10.407058715820312, "global_step": 214515, "epoch": 1276} {"train_loss": -11.235334396362305, "global_step": 214516, "epoch": 1276} {"train_loss": -10.870489120483398, "global_step": 214517, "epoch": 1276} {"train_loss": -10.875953674316406, "global_step": 214518, "epoch": 1276} {"train_loss": -10.229103088378906, "global_step": 214519, "epoch": 1276} {"train_loss": -11.048839569091797, "global_step": 214520, "epoch": 1276} {"train_loss": -8.815441131591797, "global_step": 214521, "epoch": 1276} {"train_loss": -9.577205657958984, "global_step": 214522, "epoch": 1276} {"train_loss": -10.782051086425781, "global_step": 214523, "epoch": 1276} {"train_loss": -9.620709419250488, "global_step": 214524, "epoch": 1276} {"train_loss": -10.307826042175293, "global_step": 214525, "epoch": 1276} {"train_loss": -10.668214797973633, "global_step": 214526, "epoch": 1276} {"train_loss": -10.422558784484863, "global_step": 214527, "epoch": 1276} {"train_loss": -11.239992141723633, "global_step": 214528, "epoch": 1276} {"train_loss": -10.467772483825684, "global_step": 214529, "epoch": 1276} {"train_loss": -10.789974212646484, "global_step": 214530, "epoch": 1276} {"train_loss": -10.455684661865234, "global_step": 214531, "epoch": 1276} {"train_loss": -10.885560035705566, "global_step": 214532, "epoch": 1276} {"train_loss": -10.36452865600586, "global_step": 214533, "epoch": 1276} {"train_loss": -10.694925308227539, "global_step": 214534, "epoch": 1276} {"train_loss": -11.10267328080677, "global_step": 214535, "epoch": 1276, "val_loss": 252153.859375} {"train_loss": -11.14999771118164, "global_step": 214536, "epoch": 1277} {"train_loss": -11.188941955566406, "global_step": 214537, "epoch": 1277} {"train_loss": -10.825418472290039, "global_step": 214538, "epoch": 1277} {"train_loss": -11.23130989074707, "global_step": 214539, "epoch": 1277} {"train_loss": -11.076985359191895, "global_step": 214540, "epoch": 1277} {"train_loss": -10.961057662963867, "global_step": 214541, "epoch": 1277} {"train_loss": -11.254812240600586, "global_step": 214542, "epoch": 1277} {"train_loss": -10.914302825927734, "global_step": 214543, "epoch": 1277} {"train_loss": -10.857401847839355, "global_step": 214544, "epoch": 1277} {"train_loss": -11.124994277954102, "global_step": 214545, "epoch": 1277} {"train_loss": -10.99138069152832, "global_step": 214546, "epoch": 1277} {"train_loss": -10.912297248840332, "global_step": 214547, "epoch": 1277} {"train_loss": -11.141310691833496, "global_step": 214548, "epoch": 1277} {"train_loss": -10.782382011413574, "global_step": 214549, "epoch": 1277} {"train_loss": -11.494117736816406, "global_step": 214550, "epoch": 1277} {"train_loss": -11.088019371032715, "global_step": 214551, "epoch": 1277} {"train_loss": -10.709750175476074, "global_step": 214552, "epoch": 1277} {"train_loss": -11.119261741638184, "global_step": 214553, "epoch": 1277} {"train_loss": -10.988243103027344, "global_step": 214554, "epoch": 1277} {"train_loss": -11.266011238098145, "global_step": 214555, "epoch": 1277} {"train_loss": -11.276988983154297, "global_step": 214556, "epoch": 1277} {"train_loss": -11.353012084960938, "global_step": 214557, "epoch": 1277} {"train_loss": -11.030473709106445, "global_step": 214558, "epoch": 1277} {"train_loss": -11.35236644744873, "global_step": 214559, "epoch": 1277} {"train_loss": -11.00680160522461, "global_step": 214560, "epoch": 1277} {"train_loss": -11.555734634399414, "global_step": 214561, "epoch": 1277} {"train_loss": -10.722967147827148, "global_step": 214562, "epoch": 1277} {"train_loss": -11.567205429077148, "global_step": 214563, "epoch": 1277} {"train_loss": -10.900074005126953, "global_step": 214564, "epoch": 1277} {"train_loss": -10.997190475463867, "global_step": 214565, "epoch": 1277} {"train_loss": -10.698709487915039, "global_step": 214566, "epoch": 1277} {"train_loss": -11.276190757751465, "global_step": 214567, "epoch": 1277} {"train_loss": -10.798242568969727, "global_step": 214568, "epoch": 1277} {"train_loss": -10.98520278930664, "global_step": 214569, "epoch": 1277} {"train_loss": -10.765947341918945, "global_step": 214570, "epoch": 1277} {"train_loss": -10.52128791809082, "global_step": 214571, "epoch": 1277} {"train_loss": -11.596345901489258, "global_step": 214572, "epoch": 1277} {"train_loss": -11.047709465026855, "global_step": 214573, "epoch": 1277} {"train_loss": -11.169916152954102, "global_step": 214574, "epoch": 1277} {"train_loss": -11.331121444702148, "global_step": 214575, "epoch": 1277} {"train_loss": -11.165487289428711, "global_step": 214576, "epoch": 1277} {"train_loss": -11.334308624267578, "global_step": 214577, "epoch": 1277} {"train_loss": -11.657367706298828, "global_step": 214578, "epoch": 1277} {"train_loss": -11.295249938964844, "global_step": 214579, "epoch": 1277} {"train_loss": -11.37955093383789, "global_step": 214580, "epoch": 1277} {"train_loss": -11.743165969848633, "global_step": 214581, "epoch": 1277} {"train_loss": -11.323712348937988, "global_step": 214582, "epoch": 1277} {"train_loss": -11.370769500732422, "global_step": 214583, "epoch": 1277} {"train_loss": -11.488728523254395, "global_step": 214584, "epoch": 1277} {"train_loss": -11.446085929870605, "global_step": 214585, "epoch": 1277} {"train_loss": -11.6939697265625, "global_step": 214586, "epoch": 1277} {"train_loss": -11.57003116607666, "global_step": 214587, "epoch": 1277} {"train_loss": -11.448522567749023, "global_step": 214588, "epoch": 1277} {"train_loss": -11.511592864990234, "global_step": 214589, "epoch": 1277} {"train_loss": -11.28103256225586, "global_step": 214590, "epoch": 1277} {"train_loss": -11.578874588012695, "global_step": 214591, "epoch": 1277} {"train_loss": -11.610157012939453, "global_step": 214592, "epoch": 1277} {"train_loss": -11.577503204345703, "global_step": 214593, "epoch": 1277} {"train_loss": -11.817069053649902, "global_step": 214594, "epoch": 1277} {"train_loss": -11.408653259277344, "global_step": 214595, "epoch": 1277} {"train_loss": -11.762054443359375, "global_step": 214596, "epoch": 1277} {"train_loss": -11.700631141662598, "global_step": 214597, "epoch": 1277} {"train_loss": -11.593727111816406, "global_step": 214598, "epoch": 1277} {"train_loss": -11.598109245300293, "global_step": 214599, "epoch": 1277} {"train_loss": -11.76435375213623, "global_step": 214600, "epoch": 1277} {"train_loss": -11.718782424926758, "global_step": 214601, "epoch": 1277} {"train_loss": -11.78182601928711, "global_step": 214602, "epoch": 1277} {"train_loss": -11.684219360351562, "global_step": 214603, "epoch": 1277} {"train_loss": -11.588441848754883, "global_step": 214604, "epoch": 1277} {"train_loss": -11.682154655456543, "global_step": 214605, "epoch": 1277} {"train_loss": -11.864011764526367, "global_step": 214606, "epoch": 1277} {"train_loss": -11.897564888000488, "global_step": 214607, "epoch": 1277} {"train_loss": -11.846601486206055, "global_step": 214608, "epoch": 1277} {"train_loss": -11.840624809265137, "global_step": 214609, "epoch": 1277} {"train_loss": -11.934127807617188, "global_step": 214610, "epoch": 1277} {"train_loss": -11.658679962158203, "global_step": 214611, "epoch": 1277} {"train_loss": -11.759535789489746, "global_step": 214612, "epoch": 1277} {"train_loss": -12.084089279174805, "global_step": 214613, "epoch": 1277} {"train_loss": -11.840177536010742, "global_step": 214614, "epoch": 1277} {"train_loss": -11.8482084274292, "global_step": 214615, "epoch": 1277} {"train_loss": -12.022468566894531, "global_step": 214616, "epoch": 1277} {"train_loss": -12.016721725463867, "global_step": 214617, "epoch": 1277} {"train_loss": -12.020246505737305, "global_step": 214618, "epoch": 1277} {"train_loss": -12.117656707763672, "global_step": 214619, "epoch": 1277} {"train_loss": -12.078414916992188, "global_step": 214620, "epoch": 1277} {"train_loss": -12.055438995361328, "global_step": 214621, "epoch": 1277} {"train_loss": -12.105260848999023, "global_step": 214622, "epoch": 1277} {"train_loss": -11.910452842712402, "global_step": 214623, "epoch": 1277} {"train_loss": -11.548877716064453, "global_step": 214624, "epoch": 1277} {"train_loss": -11.765348434448242, "global_step": 214625, "epoch": 1277} {"train_loss": -11.853716850280762, "global_step": 214626, "epoch": 1277} {"train_loss": -11.885873794555664, "global_step": 214627, "epoch": 1277} {"train_loss": -11.839727401733398, "global_step": 214628, "epoch": 1277} {"train_loss": -11.92777156829834, "global_step": 214629, "epoch": 1277} {"train_loss": -11.765247344970703, "global_step": 214630, "epoch": 1277} {"train_loss": -11.671642303466797, "global_step": 214631, "epoch": 1277} {"train_loss": -11.669075012207031, "global_step": 214632, "epoch": 1277} {"train_loss": -11.926567077636719, "global_step": 214633, "epoch": 1277} {"train_loss": -11.75852108001709, "global_step": 214634, "epoch": 1277} {"train_loss": -11.463869094848633, "global_step": 214635, "epoch": 1277} {"train_loss": -11.049227714538574, "global_step": 214636, "epoch": 1277} {"train_loss": -11.249409675598145, "global_step": 214637, "epoch": 1277} {"train_loss": -11.907715797424316, "global_step": 214638, "epoch": 1277} {"train_loss": -11.179132461547852, "global_step": 214639, "epoch": 1277} {"train_loss": -10.027353286743164, "global_step": 214640, "epoch": 1277} {"train_loss": -10.83041000366211, "global_step": 214641, "epoch": 1277} {"train_loss": -11.750795364379883, "global_step": 214642, "epoch": 1277} {"train_loss": -11.218446731567383, "global_step": 214643, "epoch": 1277} {"train_loss": -10.606447219848633, "global_step": 214644, "epoch": 1277} {"train_loss": -10.82557487487793, "global_step": 214645, "epoch": 1277} {"train_loss": -11.575088500976562, "global_step": 214646, "epoch": 1277} {"train_loss": -10.598016738891602, "global_step": 214647, "epoch": 1277} {"train_loss": -10.44008731842041, "global_step": 214648, "epoch": 1277} {"train_loss": -10.179708480834961, "global_step": 214649, "epoch": 1277} {"train_loss": -10.583318710327148, "global_step": 214650, "epoch": 1277} {"train_loss": -10.057329177856445, "global_step": 214651, "epoch": 1277} {"train_loss": -10.929475784301758, "global_step": 214652, "epoch": 1277} {"train_loss": -10.12072467803955, "global_step": 214653, "epoch": 1277} {"train_loss": -11.434957504272461, "global_step": 214654, "epoch": 1277} {"train_loss": -10.258417129516602, "global_step": 214655, "epoch": 1277} {"train_loss": -10.817816734313965, "global_step": 214656, "epoch": 1277} {"train_loss": -11.238590240478516, "global_step": 214657, "epoch": 1277} {"train_loss": -10.516918182373047, "global_step": 214658, "epoch": 1277} {"train_loss": -11.576099395751953, "global_step": 214659, "epoch": 1277} {"train_loss": -10.869644165039062, "global_step": 214660, "epoch": 1277} {"train_loss": -11.01117992401123, "global_step": 214661, "epoch": 1277} {"train_loss": -11.394404411315918, "global_step": 214662, "epoch": 1277} {"train_loss": -10.764284133911133, "global_step": 214663, "epoch": 1277} {"train_loss": -11.115421295166016, "global_step": 214664, "epoch": 1277} {"train_loss": -11.061416625976562, "global_step": 214665, "epoch": 1277} {"train_loss": -9.994268417358398, "global_step": 214666, "epoch": 1277} {"train_loss": -10.598855972290039, "global_step": 214667, "epoch": 1277} {"train_loss": -10.038825988769531, "global_step": 214668, "epoch": 1277} {"train_loss": -10.252467155456543, "global_step": 214669, "epoch": 1277} {"train_loss": -9.826693534851074, "global_step": 214670, "epoch": 1277} {"train_loss": -10.376169204711914, "global_step": 214671, "epoch": 1277} {"train_loss": -11.125635147094727, "global_step": 214672, "epoch": 1277} {"train_loss": -10.79338550567627, "global_step": 214673, "epoch": 1277} {"train_loss": -10.650962829589844, "global_step": 214674, "epoch": 1277} {"train_loss": -11.208520889282227, "global_step": 214675, "epoch": 1277} {"train_loss": -10.760714530944824, "global_step": 214676, "epoch": 1277} {"train_loss": -11.01508903503418, "global_step": 214677, "epoch": 1277} {"train_loss": -11.284905433654785, "global_step": 214678, "epoch": 1277} {"train_loss": -10.978755950927734, "global_step": 214679, "epoch": 1277} {"train_loss": -11.44217300415039, "global_step": 214680, "epoch": 1277} {"train_loss": -11.06209659576416, "global_step": 214681, "epoch": 1277} {"train_loss": -11.272006034851074, "global_step": 214682, "epoch": 1277} {"train_loss": -11.171712875366211, "global_step": 214683, "epoch": 1277} {"train_loss": -11.06386947631836, "global_step": 214684, "epoch": 1277} {"train_loss": -11.27900505065918, "global_step": 214685, "epoch": 1277} {"train_loss": -11.124969482421875, "global_step": 214686, "epoch": 1277} {"train_loss": -11.081083297729492, "global_step": 214687, "epoch": 1277} {"train_loss": -11.183982849121094, "global_step": 214688, "epoch": 1277} {"train_loss": -10.808492660522461, "global_step": 214689, "epoch": 1277} {"train_loss": -11.235760688781738, "global_step": 214690, "epoch": 1277} {"train_loss": -10.795387268066406, "global_step": 214691, "epoch": 1277} {"train_loss": -11.405064582824707, "global_step": 214692, "epoch": 1277} {"train_loss": -11.25029182434082, "global_step": 214693, "epoch": 1277} {"train_loss": -11.31917953491211, "global_step": 214694, "epoch": 1277} {"train_loss": -11.323297500610352, "global_step": 214695, "epoch": 1277} {"train_loss": -11.21100902557373, "global_step": 214696, "epoch": 1277} {"train_loss": -11.043280601501465, "global_step": 214697, "epoch": 1277} {"train_loss": -11.466608047485352, "global_step": 214698, "epoch": 1277} {"train_loss": -11.179126739501953, "global_step": 214699, "epoch": 1277} {"train_loss": -11.66214370727539, "global_step": 214700, "epoch": 1277} {"train_loss": -11.337928771972656, "global_step": 214701, "epoch": 1277} {"train_loss": -11.55061149597168, "global_step": 214702, "epoch": 1277} {"train_loss": -11.257972155298505, "global_step": 214703, "epoch": 1277, "val_loss": 258207.234375} {"train_loss": -11.520814895629883, "global_step": 214704, "epoch": 1278} {"train_loss": -11.442222595214844, "global_step": 214705, "epoch": 1278} {"train_loss": -11.455158233642578, "global_step": 214706, "epoch": 1278} {"train_loss": -11.433867454528809, "global_step": 214707, "epoch": 1278} {"train_loss": -11.435606002807617, "global_step": 214708, "epoch": 1278} {"train_loss": -11.54097843170166, "global_step": 214709, "epoch": 1278} {"train_loss": -11.465404510498047, "global_step": 214710, "epoch": 1278} {"train_loss": -11.544570922851562, "global_step": 214711, "epoch": 1278} {"train_loss": -11.373010635375977, "global_step": 214712, "epoch": 1278} {"train_loss": -11.788822174072266, "global_step": 214713, "epoch": 1278} {"train_loss": -11.49189281463623, "global_step": 214714, "epoch": 1278} {"train_loss": -11.552223205566406, "global_step": 214715, "epoch": 1278} {"train_loss": -11.482548713684082, "global_step": 214716, "epoch": 1278} {"train_loss": -11.616031646728516, "global_step": 214717, "epoch": 1278} {"train_loss": -11.667481422424316, "global_step": 214718, "epoch": 1278} {"train_loss": -11.431588172912598, "global_step": 214719, "epoch": 1278} {"train_loss": -11.520127296447754, "global_step": 214720, "epoch": 1278} {"train_loss": -11.229591369628906, "global_step": 214721, "epoch": 1278} {"train_loss": -11.65260124206543, "global_step": 214722, "epoch": 1278} {"train_loss": -11.520463943481445, "global_step": 214723, "epoch": 1278} {"train_loss": -11.536449432373047, "global_step": 214724, "epoch": 1278} {"train_loss": -11.738076210021973, "global_step": 214725, "epoch": 1278} {"train_loss": -11.556766510009766, "global_step": 214726, "epoch": 1278} {"train_loss": -11.663619995117188, "global_step": 214727, "epoch": 1278} {"train_loss": -11.728601455688477, "global_step": 214728, "epoch": 1278} {"train_loss": -11.807311058044434, "global_step": 214729, "epoch": 1278} {"train_loss": -11.643850326538086, "global_step": 214730, "epoch": 1278} {"train_loss": -11.67112922668457, "global_step": 214731, "epoch": 1278} {"train_loss": -11.45324993133545, "global_step": 214732, "epoch": 1278} {"train_loss": -11.59648323059082, "global_step": 214733, "epoch": 1278} {"train_loss": -11.453310012817383, "global_step": 214734, "epoch": 1278} {"train_loss": -11.694622039794922, "global_step": 214735, "epoch": 1278} {"train_loss": -11.682701110839844, "global_step": 214736, "epoch": 1278} {"train_loss": -11.419260025024414, "global_step": 214737, "epoch": 1278} {"train_loss": -11.794851303100586, "global_step": 214738, "epoch": 1278} {"train_loss": -11.47523307800293, "global_step": 214739, "epoch": 1278} {"train_loss": -11.701236724853516, "global_step": 214740, "epoch": 1278} {"train_loss": -11.717765808105469, "global_step": 214741, "epoch": 1278} {"train_loss": -11.706628799438477, "global_step": 214742, "epoch": 1278} {"train_loss": -12.004539489746094, "global_step": 214743, "epoch": 1278} {"train_loss": -11.856115341186523, "global_step": 214744, "epoch": 1278} {"train_loss": -11.813756942749023, "global_step": 214745, "epoch": 1278} {"train_loss": -11.861175537109375, "global_step": 214746, "epoch": 1278} {"train_loss": -11.944765090942383, "global_step": 214747, "epoch": 1278} {"train_loss": -11.843283653259277, "global_step": 214748, "epoch": 1278} {"train_loss": -11.889291763305664, "global_step": 214749, "epoch": 1278} {"train_loss": -11.847249984741211, "global_step": 214750, "epoch": 1278} {"train_loss": -11.912200927734375, "global_step": 214751, "epoch": 1278} {"train_loss": -11.955883979797363, "global_step": 214752, "epoch": 1278} {"train_loss": -11.760202407836914, "global_step": 214753, "epoch": 1278} {"train_loss": -11.809154510498047, "global_step": 214754, "epoch": 1278} {"train_loss": -11.947978019714355, "global_step": 214755, "epoch": 1278} {"train_loss": -11.77875804901123, "global_step": 214756, "epoch": 1278} {"train_loss": -11.748849868774414, "global_step": 214757, "epoch": 1278} {"train_loss": -11.299642562866211, "global_step": 214758, "epoch": 1278} {"train_loss": -11.772706985473633, "global_step": 214759, "epoch": 1278} {"train_loss": -11.870704650878906, "global_step": 214760, "epoch": 1278} {"train_loss": -11.625554084777832, "global_step": 214761, "epoch": 1278} {"train_loss": -11.891406059265137, "global_step": 214762, "epoch": 1278} {"train_loss": -11.916629791259766, "global_step": 214763, "epoch": 1278} {"train_loss": -11.774800300598145, "global_step": 214764, "epoch": 1278} {"train_loss": -11.716717720031738, "global_step": 214765, "epoch": 1278} {"train_loss": -11.64273452758789, "global_step": 214766, "epoch": 1278} {"train_loss": -12.032150268554688, "global_step": 214767, "epoch": 1278} {"train_loss": -11.912397384643555, "global_step": 214768, "epoch": 1278} {"train_loss": -11.692567825317383, "global_step": 214769, "epoch": 1278} {"train_loss": -12.017267227172852, "global_step": 214770, "epoch": 1278} {"train_loss": -11.840648651123047, "global_step": 214771, "epoch": 1278} {"train_loss": -12.058670043945312, "global_step": 214772, "epoch": 1278} {"train_loss": -11.977113723754883, "global_step": 214773, "epoch": 1278} {"train_loss": -11.76551628112793, "global_step": 214774, "epoch": 1278} {"train_loss": -11.969013214111328, "global_step": 214775, "epoch": 1278} {"train_loss": -12.031733512878418, "global_step": 214776, "epoch": 1278} {"train_loss": -12.018037796020508, "global_step": 214777, "epoch": 1278} {"train_loss": -11.985095977783203, "global_step": 214778, "epoch": 1278} {"train_loss": -11.526166915893555, "global_step": 214779, "epoch": 1278} {"train_loss": -11.5165376663208, "global_step": 214780, "epoch": 1278} {"train_loss": -11.14981460571289, "global_step": 214781, "epoch": 1278} {"train_loss": -11.533402442932129, "global_step": 214782, "epoch": 1278} {"train_loss": -10.694692611694336, "global_step": 214783, "epoch": 1278} {"train_loss": -10.06402587890625, "global_step": 214784, "epoch": 1278} {"train_loss": -9.09527587890625, "global_step": 214785, "epoch": 1278} {"train_loss": -11.022279739379883, "global_step": 214786, "epoch": 1278} {"train_loss": -8.524300575256348, "global_step": 214787, "epoch": 1278} {"train_loss": -9.122650146484375, "global_step": 214788, "epoch": 1278} {"train_loss": -10.988569259643555, "global_step": 214789, "epoch": 1278} {"train_loss": -8.30592155456543, "global_step": 214790, "epoch": 1278} {"train_loss": -10.737054824829102, "global_step": 214791, "epoch": 1278} {"train_loss": -8.617755889892578, "global_step": 214792, "epoch": 1278} {"train_loss": -10.999277114868164, "global_step": 214793, "epoch": 1278} {"train_loss": -9.397306442260742, "global_step": 214794, "epoch": 1278} {"train_loss": -11.076576232910156, "global_step": 214795, "epoch": 1278} {"train_loss": -10.146041870117188, "global_step": 214796, "epoch": 1278} {"train_loss": -9.419282913208008, "global_step": 214797, "epoch": 1278} {"train_loss": -11.11986255645752, "global_step": 214798, "epoch": 1278} {"train_loss": -9.953282356262207, "global_step": 214799, "epoch": 1278} {"train_loss": -10.958545684814453, "global_step": 214800, "epoch": 1278} {"train_loss": -10.308123588562012, "global_step": 214801, "epoch": 1278} {"train_loss": -11.07364559173584, "global_step": 214802, "epoch": 1278} {"train_loss": -10.498228073120117, "global_step": 214803, "epoch": 1278} {"train_loss": -10.824416160583496, "global_step": 214804, "epoch": 1278} {"train_loss": -10.558900833129883, "global_step": 214805, "epoch": 1278} {"train_loss": -10.969182014465332, "global_step": 214806, "epoch": 1278} {"train_loss": -11.064460754394531, "global_step": 214807, "epoch": 1278} {"train_loss": -10.888744354248047, "global_step": 214808, "epoch": 1278} {"train_loss": -11.138975143432617, "global_step": 214809, "epoch": 1278} {"train_loss": -11.18471908569336, "global_step": 214810, "epoch": 1278} {"train_loss": -11.351969718933105, "global_step": 214811, "epoch": 1278} {"train_loss": -11.15160083770752, "global_step": 214812, "epoch": 1278} {"train_loss": -11.45588493347168, "global_step": 214813, "epoch": 1278} {"train_loss": -11.076457977294922, "global_step": 214814, "epoch": 1278} {"train_loss": -10.896864891052246, "global_step": 214815, "epoch": 1278} {"train_loss": -11.377204895019531, "global_step": 214816, "epoch": 1278} {"train_loss": -11.461977005004883, "global_step": 214817, "epoch": 1278} {"train_loss": -11.48861312866211, "global_step": 214818, "epoch": 1278} {"train_loss": -11.091994285583496, "global_step": 214819, "epoch": 1278} {"train_loss": -11.561761856079102, "global_step": 214820, "epoch": 1278} {"train_loss": -11.205188751220703, "global_step": 214821, "epoch": 1278} {"train_loss": -11.279726028442383, "global_step": 214822, "epoch": 1278} {"train_loss": -11.347902297973633, "global_step": 214823, "epoch": 1278} {"train_loss": -11.363947868347168, "global_step": 214824, "epoch": 1278} {"train_loss": -11.49213981628418, "global_step": 214825, "epoch": 1278} {"train_loss": -11.600626945495605, "global_step": 214826, "epoch": 1278} {"train_loss": -11.419368743896484, "global_step": 214827, "epoch": 1278} {"train_loss": -11.330192565917969, "global_step": 214828, "epoch": 1278} {"train_loss": -11.464775085449219, "global_step": 214829, "epoch": 1278} {"train_loss": -11.591872215270996, "global_step": 214830, "epoch": 1278} {"train_loss": -11.55991268157959, "global_step": 214831, "epoch": 1278} {"train_loss": -11.508426666259766, "global_step": 214832, "epoch": 1278} {"train_loss": -11.46399211883545, "global_step": 214833, "epoch": 1278} {"train_loss": -11.702308654785156, "global_step": 214834, "epoch": 1278} {"train_loss": -11.626365661621094, "global_step": 214835, "epoch": 1278} {"train_loss": -11.545784950256348, "global_step": 214836, "epoch": 1278} {"train_loss": -11.493181228637695, "global_step": 214837, "epoch": 1278} {"train_loss": -11.52701473236084, "global_step": 214838, "epoch": 1278} {"train_loss": -11.621702194213867, "global_step": 214839, "epoch": 1278} {"train_loss": -11.657516479492188, "global_step": 214840, "epoch": 1278} {"train_loss": -11.464042663574219, "global_step": 214841, "epoch": 1278} {"train_loss": -11.63720703125, "global_step": 214842, "epoch": 1278} {"train_loss": -11.60943603515625, "global_step": 214843, "epoch": 1278} {"train_loss": -11.577031135559082, "global_step": 214844, "epoch": 1278} {"train_loss": -11.527277946472168, "global_step": 214845, "epoch": 1278} {"train_loss": -11.7244873046875, "global_step": 214846, "epoch": 1278} {"train_loss": -11.76253890991211, "global_step": 214847, "epoch": 1278} {"train_loss": -11.837240219116211, "global_step": 214848, "epoch": 1278} {"train_loss": -11.513898849487305, "global_step": 214849, "epoch": 1278} {"train_loss": -11.44984245300293, "global_step": 214850, "epoch": 1278} {"train_loss": -11.664064407348633, "global_step": 214851, "epoch": 1278} {"train_loss": -11.727657318115234, "global_step": 214852, "epoch": 1278} {"train_loss": -11.598697662353516, "global_step": 214853, "epoch": 1278} {"train_loss": -11.705825805664062, "global_step": 214854, "epoch": 1278} {"train_loss": -11.657820701599121, "global_step": 214855, "epoch": 1278} {"train_loss": -11.526296615600586, "global_step": 214856, "epoch": 1278} {"train_loss": -11.661676406860352, "global_step": 214857, "epoch": 1278} {"train_loss": -11.671555519104004, "global_step": 214858, "epoch": 1278} {"train_loss": -11.808616638183594, "global_step": 214859, "epoch": 1278} {"train_loss": -11.297575950622559, "global_step": 214860, "epoch": 1278} {"train_loss": -11.410311698913574, "global_step": 214861, "epoch": 1278} {"train_loss": -11.400552749633789, "global_step": 214862, "epoch": 1278} {"train_loss": -11.143609046936035, "global_step": 214863, "epoch": 1278} {"train_loss": -11.274187088012695, "global_step": 214864, "epoch": 1278} {"train_loss": -11.35207748413086, "global_step": 214865, "epoch": 1278} {"train_loss": -11.313294410705566, "global_step": 214866, "epoch": 1278} {"train_loss": -11.033791542053223, "global_step": 214867, "epoch": 1278} {"train_loss": -11.297493934631348, "global_step": 214868, "epoch": 1278} {"train_loss": -11.175240516662598, "global_step": 214869, "epoch": 1278} {"train_loss": -11.554770469665527, "global_step": 214870, "epoch": 1278} {"train_loss": -11.376542494410561, "global_step": 214871, "epoch": 1278, "val_loss": 255690.203125} {"train_loss": -10.554265975952148, "global_step": 214872, "epoch": 1279} {"train_loss": -10.834068298339844, "global_step": 214873, "epoch": 1279} {"train_loss": -11.542840957641602, "global_step": 214874, "epoch": 1279} {"train_loss": -10.872753143310547, "global_step": 214875, "epoch": 1279} {"train_loss": -11.703704833984375, "global_step": 214876, "epoch": 1279} {"train_loss": -11.12243938446045, "global_step": 214877, "epoch": 1279} {"train_loss": -11.08176040649414, "global_step": 214878, "epoch": 1279} {"train_loss": -11.381448745727539, "global_step": 214879, "epoch": 1279} {"train_loss": -10.417231559753418, "global_step": 214880, "epoch": 1279} {"train_loss": -11.458518981933594, "global_step": 214881, "epoch": 1279} {"train_loss": -10.26357650756836, "global_step": 214882, "epoch": 1279} {"train_loss": -10.972103118896484, "global_step": 214883, "epoch": 1279} {"train_loss": -10.456281661987305, "global_step": 214884, "epoch": 1279} {"train_loss": -10.668949127197266, "global_step": 214885, "epoch": 1279} {"train_loss": -11.062644004821777, "global_step": 214886, "epoch": 1279} {"train_loss": -10.806211471557617, "global_step": 214887, "epoch": 1279} {"train_loss": -11.348666191101074, "global_step": 214888, "epoch": 1279} {"train_loss": -11.004861831665039, "global_step": 214889, "epoch": 1279} {"train_loss": -11.464812278747559, "global_step": 214890, "epoch": 1279} {"train_loss": -11.076308250427246, "global_step": 214891, "epoch": 1279} {"train_loss": -11.542669296264648, "global_step": 214892, "epoch": 1279} {"train_loss": -10.964499473571777, "global_step": 214893, "epoch": 1279} {"train_loss": -11.239295959472656, "global_step": 214894, "epoch": 1279} {"train_loss": -10.680841445922852, "global_step": 214895, "epoch": 1279} {"train_loss": -11.12601089477539, "global_step": 214896, "epoch": 1279} {"train_loss": -10.521751403808594, "global_step": 214897, "epoch": 1279} {"train_loss": -11.093586921691895, "global_step": 214898, "epoch": 1279} {"train_loss": -10.892437934875488, "global_step": 214899, "epoch": 1279} {"train_loss": -11.12339973449707, "global_step": 214900, "epoch": 1279} {"train_loss": -10.774351119995117, "global_step": 214901, "epoch": 1279} {"train_loss": -11.197854995727539, "global_step": 214902, "epoch": 1279} {"train_loss": -10.51095962524414, "global_step": 214903, "epoch": 1279} {"train_loss": -11.098848342895508, "global_step": 214904, "epoch": 1279} {"train_loss": -10.733884811401367, "global_step": 214905, "epoch": 1279} {"train_loss": -11.136757850646973, "global_step": 214906, "epoch": 1279} {"train_loss": -11.15155029296875, "global_step": 214907, "epoch": 1279} {"train_loss": -11.367011070251465, "global_step": 214908, "epoch": 1279} {"train_loss": -10.862736701965332, "global_step": 214909, "epoch": 1279} {"train_loss": -10.899564743041992, "global_step": 214910, "epoch": 1279} {"train_loss": -11.369988441467285, "global_step": 214911, "epoch": 1279} {"train_loss": -10.994768142700195, "global_step": 214912, "epoch": 1279} {"train_loss": -11.281923294067383, "global_step": 214913, "epoch": 1279} {"train_loss": -11.319732666015625, "global_step": 214914, "epoch": 1279} {"train_loss": -11.509822845458984, "global_step": 214915, "epoch": 1279} {"train_loss": -11.482833862304688, "global_step": 214916, "epoch": 1279} {"train_loss": -11.538522720336914, "global_step": 214917, "epoch": 1279} {"train_loss": -11.61870288848877, "global_step": 214918, "epoch": 1279} {"train_loss": -11.430732727050781, "global_step": 214919, "epoch": 1279} {"train_loss": -11.570067405700684, "global_step": 214920, "epoch": 1279} {"train_loss": -11.519327163696289, "global_step": 214921, "epoch": 1279} {"train_loss": -11.685953140258789, "global_step": 214922, "epoch": 1279} {"train_loss": -11.821928024291992, "global_step": 214923, "epoch": 1279} {"train_loss": -11.49336051940918, "global_step": 214924, "epoch": 1279} {"train_loss": -11.50813102722168, "global_step": 214925, "epoch": 1279} {"train_loss": -11.611406326293945, "global_step": 214926, "epoch": 1279} {"train_loss": -11.437211036682129, "global_step": 214927, "epoch": 1279} {"train_loss": -11.559976577758789, "global_step": 214928, "epoch": 1279} {"train_loss": -11.618490219116211, "global_step": 214929, "epoch": 1279} {"train_loss": -11.705482482910156, "global_step": 214930, "epoch": 1279} {"train_loss": -11.441611289978027, "global_step": 214931, "epoch": 1279} {"train_loss": -11.685708045959473, "global_step": 214932, "epoch": 1279} {"train_loss": -11.406759262084961, "global_step": 214933, "epoch": 1279} {"train_loss": -11.708869934082031, "global_step": 214934, "epoch": 1279} {"train_loss": -11.309532165527344, "global_step": 214935, "epoch": 1279} {"train_loss": -11.550604820251465, "global_step": 214936, "epoch": 1279} {"train_loss": -10.986753463745117, "global_step": 214937, "epoch": 1279} {"train_loss": -11.43044376373291, "global_step": 214938, "epoch": 1279} {"train_loss": -11.465845108032227, "global_step": 214939, "epoch": 1279} {"train_loss": -11.483421325683594, "global_step": 214940, "epoch": 1279} {"train_loss": -11.240995407104492, "global_step": 214941, "epoch": 1279} {"train_loss": -11.596867561340332, "global_step": 214942, "epoch": 1279} {"train_loss": -11.138740539550781, "global_step": 214943, "epoch": 1279} {"train_loss": -11.6322660446167, "global_step": 214944, "epoch": 1279} {"train_loss": -10.551368713378906, "global_step": 214945, "epoch": 1279} {"train_loss": -11.463228225708008, "global_step": 214946, "epoch": 1279} {"train_loss": -10.745001792907715, "global_step": 214947, "epoch": 1279} {"train_loss": -11.584153175354004, "global_step": 214948, "epoch": 1279} {"train_loss": -11.603828430175781, "global_step": 214949, "epoch": 1279} {"train_loss": -11.406986236572266, "global_step": 214950, "epoch": 1279} {"train_loss": -11.519121170043945, "global_step": 214951, "epoch": 1279} {"train_loss": -11.083372116088867, "global_step": 214952, "epoch": 1279} {"train_loss": -11.395893096923828, "global_step": 214953, "epoch": 1279} {"train_loss": -11.554601669311523, "global_step": 214954, "epoch": 1279} {"train_loss": -11.123868942260742, "global_step": 214955, "epoch": 1279} {"train_loss": -11.686598777770996, "global_step": 214956, "epoch": 1279} {"train_loss": -10.919633865356445, "global_step": 214957, "epoch": 1279} {"train_loss": -11.326305389404297, "global_step": 214958, "epoch": 1279} {"train_loss": -11.206275939941406, "global_step": 214959, "epoch": 1279} {"train_loss": -11.36510181427002, "global_step": 214960, "epoch": 1279} {"train_loss": -11.001575469970703, "global_step": 214961, "epoch": 1279} {"train_loss": -10.50389575958252, "global_step": 214962, "epoch": 1279} {"train_loss": -11.537592887878418, "global_step": 214963, "epoch": 1279} {"train_loss": -10.382241249084473, "global_step": 214964, "epoch": 1279} {"train_loss": -11.510016441345215, "global_step": 214965, "epoch": 1279} {"train_loss": -10.673847198486328, "global_step": 214966, "epoch": 1279} {"train_loss": -10.822793006896973, "global_step": 214967, "epoch": 1279} {"train_loss": -10.70573616027832, "global_step": 214968, "epoch": 1279} {"train_loss": -10.078734397888184, "global_step": 214969, "epoch": 1279} {"train_loss": -11.048880577087402, "global_step": 214970, "epoch": 1279} {"train_loss": -10.701170921325684, "global_step": 214971, "epoch": 1279} {"train_loss": -10.753571510314941, "global_step": 214972, "epoch": 1279} {"train_loss": -10.98939037322998, "global_step": 214973, "epoch": 1279} {"train_loss": -11.230277061462402, "global_step": 214974, "epoch": 1279} {"train_loss": -10.84792423248291, "global_step": 214975, "epoch": 1279} {"train_loss": -11.432190895080566, "global_step": 214976, "epoch": 1279} {"train_loss": -10.890563011169434, "global_step": 214977, "epoch": 1279} {"train_loss": -11.45596981048584, "global_step": 214978, "epoch": 1279} {"train_loss": -11.390531539916992, "global_step": 214979, "epoch": 1279} {"train_loss": -11.321311950683594, "global_step": 214980, "epoch": 1279} {"train_loss": -11.500954627990723, "global_step": 214981, "epoch": 1279} {"train_loss": -11.071736335754395, "global_step": 214982, "epoch": 1279} {"train_loss": -11.544015884399414, "global_step": 214983, "epoch": 1279} {"train_loss": -11.565668106079102, "global_step": 214984, "epoch": 1279} {"train_loss": -11.36199951171875, "global_step": 214985, "epoch": 1279} {"train_loss": -11.764264106750488, "global_step": 214986, "epoch": 1279} {"train_loss": -11.241338729858398, "global_step": 214987, "epoch": 1279} {"train_loss": -11.479757308959961, "global_step": 214988, "epoch": 1279} {"train_loss": -11.64369010925293, "global_step": 214989, "epoch": 1279} {"train_loss": -11.429780006408691, "global_step": 214990, "epoch": 1279} {"train_loss": -11.625753402709961, "global_step": 214991, "epoch": 1279} {"train_loss": -11.469736099243164, "global_step": 214992, "epoch": 1279} {"train_loss": -11.646581649780273, "global_step": 214993, "epoch": 1279} {"train_loss": -11.645269393920898, "global_step": 214994, "epoch": 1279} {"train_loss": -11.615680694580078, "global_step": 214995, "epoch": 1279} {"train_loss": -11.499346733093262, "global_step": 214996, "epoch": 1279} {"train_loss": -11.531380653381348, "global_step": 214997, "epoch": 1279} {"train_loss": -11.839324951171875, "global_step": 214998, "epoch": 1279} {"train_loss": -11.667006492614746, "global_step": 214999, "epoch": 1279} {"train_loss": -11.759397506713867, "global_step": 215000, "epoch": 1279} {"train_loss": -11.546931266784668, "global_step": 215001, "epoch": 1279} {"train_loss": -11.776107788085938, "global_step": 215002, "epoch": 1279} {"train_loss": -11.604225158691406, "global_step": 215003, "epoch": 1279} {"train_loss": -11.929186820983887, "global_step": 215004, "epoch": 1279} {"train_loss": -11.69413948059082, "global_step": 215005, "epoch": 1279} {"train_loss": -11.444000244140625, "global_step": 215006, "epoch": 1279} {"train_loss": -11.923004150390625, "global_step": 215007, "epoch": 1279} {"train_loss": -11.686058044433594, "global_step": 215008, "epoch": 1279} {"train_loss": -11.635382652282715, "global_step": 215009, "epoch": 1279} {"train_loss": -11.49497127532959, "global_step": 215010, "epoch": 1279} {"train_loss": -11.598630905151367, "global_step": 215011, "epoch": 1279} {"train_loss": -11.951263427734375, "global_step": 215012, "epoch": 1279} {"train_loss": -11.735993385314941, "global_step": 215013, "epoch": 1279} {"train_loss": -12.000329971313477, "global_step": 215014, "epoch": 1279} {"train_loss": -11.831962585449219, "global_step": 215015, "epoch": 1279} {"train_loss": -11.738027572631836, "global_step": 215016, "epoch": 1279} {"train_loss": -11.629294395446777, "global_step": 215017, "epoch": 1279} {"train_loss": -11.642923355102539, "global_step": 215018, "epoch": 1279} {"train_loss": -12.014986991882324, "global_step": 215019, "epoch": 1279} {"train_loss": -11.772722244262695, "global_step": 215020, "epoch": 1279} {"train_loss": -12.020644187927246, "global_step": 215021, "epoch": 1279} {"train_loss": -11.654563903808594, "global_step": 215022, "epoch": 1279} {"train_loss": -11.981254577636719, "global_step": 215023, "epoch": 1279} {"train_loss": -11.79017162322998, "global_step": 215024, "epoch": 1279} {"train_loss": -11.657306671142578, "global_step": 215025, "epoch": 1279} {"train_loss": -11.956238746643066, "global_step": 215026, "epoch": 1279} {"train_loss": -11.67061710357666, "global_step": 215027, "epoch": 1279} {"train_loss": -11.72729778289795, "global_step": 215028, "epoch": 1279} {"train_loss": -11.646407127380371, "global_step": 215029, "epoch": 1279} {"train_loss": -11.679755210876465, "global_step": 215030, "epoch": 1279} {"train_loss": -11.627452850341797, "global_step": 215031, "epoch": 1279} {"train_loss": -11.885019302368164, "global_step": 215032, "epoch": 1279} {"train_loss": -11.734384536743164, "global_step": 215033, "epoch": 1279} {"train_loss": -11.517772674560547, "global_step": 215034, "epoch": 1279} {"train_loss": -11.222515106201172, "global_step": 215035, "epoch": 1279} {"train_loss": -10.998889923095703, "global_step": 215036, "epoch": 1279} {"train_loss": -11.6011962890625, "global_step": 215037, "epoch": 1279} {"train_loss": -11.663494110107422, "global_step": 215038, "epoch": 1279} {"train_loss": -11.347204066458202, "global_step": 215039, "epoch": 1279, "val_loss": 258318.921875} {"train_loss": -11.45713996887207, "global_step": 215040, "epoch": 1280} {"train_loss": -11.436479568481445, "global_step": 215041, "epoch": 1280} {"train_loss": -11.310884475708008, "global_step": 215042, "epoch": 1280} {"train_loss": -11.51192855834961, "global_step": 215043, "epoch": 1280} {"train_loss": -10.561494827270508, "global_step": 215044, "epoch": 1280} {"train_loss": -10.868531227111816, "global_step": 215045, "epoch": 1280} {"train_loss": -10.716035842895508, "global_step": 215046, "epoch": 1280} {"train_loss": -11.027095794677734, "global_step": 215047, "epoch": 1280} {"train_loss": -10.165594100952148, "global_step": 215048, "epoch": 1280} {"train_loss": -11.35687255859375, "global_step": 215049, "epoch": 1280} {"train_loss": -10.33426284790039, "global_step": 215050, "epoch": 1280} {"train_loss": -10.814457893371582, "global_step": 215051, "epoch": 1280} {"train_loss": -11.525952339172363, "global_step": 215052, "epoch": 1280} {"train_loss": -10.957205772399902, "global_step": 215053, "epoch": 1280} {"train_loss": -11.49935531616211, "global_step": 215054, "epoch": 1280} {"train_loss": -10.659786224365234, "global_step": 215055, "epoch": 1280} {"train_loss": -11.095943450927734, "global_step": 215056, "epoch": 1280} {"train_loss": -11.03018569946289, "global_step": 215057, "epoch": 1280} {"train_loss": -10.857891082763672, "global_step": 215058, "epoch": 1280} {"train_loss": -11.407613754272461, "global_step": 215059, "epoch": 1280} {"train_loss": -10.643081665039062, "global_step": 215060, "epoch": 1280} {"train_loss": -11.534296989440918, "global_step": 215061, "epoch": 1280} {"train_loss": -10.522806167602539, "global_step": 215062, "epoch": 1280} {"train_loss": -11.097381591796875, "global_step": 215063, "epoch": 1280} {"train_loss": -10.95391845703125, "global_step": 215064, "epoch": 1280} {"train_loss": -10.871382713317871, "global_step": 215065, "epoch": 1280} {"train_loss": -10.884061813354492, "global_step": 215066, "epoch": 1280} {"train_loss": -11.154062271118164, "global_step": 215067, "epoch": 1280} {"train_loss": -10.96542739868164, "global_step": 215068, "epoch": 1280} {"train_loss": -11.11171817779541, "global_step": 215069, "epoch": 1280} {"train_loss": -10.480374336242676, "global_step": 215070, "epoch": 1280} {"train_loss": -10.088526725769043, "global_step": 215071, "epoch": 1280} {"train_loss": -11.234094619750977, "global_step": 215072, "epoch": 1280} {"train_loss": -10.587569236755371, "global_step": 215073, "epoch": 1280} {"train_loss": -10.993270874023438, "global_step": 215074, "epoch": 1280} {"train_loss": -11.080946922302246, "global_step": 215075, "epoch": 1280} {"train_loss": -11.208285331726074, "global_step": 215076, "epoch": 1280} {"train_loss": -10.494998931884766, "global_step": 215077, "epoch": 1280} {"train_loss": -10.870993614196777, "global_step": 215078, "epoch": 1280} {"train_loss": -10.692617416381836, "global_step": 215079, "epoch": 1280} {"train_loss": -11.136085510253906, "global_step": 215080, "epoch": 1280} {"train_loss": -11.101997375488281, "global_step": 215081, "epoch": 1280} {"train_loss": -10.995901107788086, "global_step": 215082, "epoch": 1280} {"train_loss": -11.140105247497559, "global_step": 215083, "epoch": 1280} {"train_loss": -11.408563613891602, "global_step": 215084, "epoch": 1280} {"train_loss": -11.065858840942383, "global_step": 215085, "epoch": 1280} {"train_loss": -11.008728981018066, "global_step": 215086, "epoch": 1280} {"train_loss": -11.520732879638672, "global_step": 215087, "epoch": 1280} {"train_loss": -11.169160842895508, "global_step": 215088, "epoch": 1280} {"train_loss": -11.469959259033203, "global_step": 215089, "epoch": 1280} {"train_loss": -11.408512115478516, "global_step": 215090, "epoch": 1280} {"train_loss": -11.499847412109375, "global_step": 215091, "epoch": 1280} {"train_loss": -11.520166397094727, "global_step": 215092, "epoch": 1280} {"train_loss": -11.584142684936523, "global_step": 215093, "epoch": 1280} {"train_loss": -11.53710651397705, "global_step": 215094, "epoch": 1280} {"train_loss": -11.789955139160156, "global_step": 215095, "epoch": 1280} {"train_loss": -11.659211158752441, "global_step": 215096, "epoch": 1280} {"train_loss": -11.527892112731934, "global_step": 215097, "epoch": 1280} {"train_loss": -11.43791389465332, "global_step": 215098, "epoch": 1280} {"train_loss": -11.726134300231934, "global_step": 215099, "epoch": 1280} {"train_loss": -11.560990333557129, "global_step": 215100, "epoch": 1280} {"train_loss": -11.72217845916748, "global_step": 215101, "epoch": 1280} {"train_loss": -11.658660888671875, "global_step": 215102, "epoch": 1280} {"train_loss": -11.686209678649902, "global_step": 215103, "epoch": 1280} {"train_loss": -11.694034576416016, "global_step": 215104, "epoch": 1280} {"train_loss": -11.808303833007812, "global_step": 215105, "epoch": 1280} {"train_loss": -11.529474258422852, "global_step": 215106, "epoch": 1280} {"train_loss": -11.704517364501953, "global_step": 215107, "epoch": 1280} {"train_loss": -11.891258239746094, "global_step": 215108, "epoch": 1280} {"train_loss": -11.723508834838867, "global_step": 215109, "epoch": 1280} {"train_loss": -11.806035995483398, "global_step": 215110, "epoch": 1280} {"train_loss": -11.848514556884766, "global_step": 215111, "epoch": 1280} {"train_loss": -11.411941528320312, "global_step": 215112, "epoch": 1280} {"train_loss": -11.819520950317383, "global_step": 215113, "epoch": 1280} {"train_loss": -11.809395790100098, "global_step": 215114, "epoch": 1280} {"train_loss": -11.96440315246582, "global_step": 215115, "epoch": 1280} {"train_loss": -11.771377563476562, "global_step": 215116, "epoch": 1280} {"train_loss": -11.865663528442383, "global_step": 215117, "epoch": 1280} {"train_loss": -11.944610595703125, "global_step": 215118, "epoch": 1280} {"train_loss": -11.633610725402832, "global_step": 215119, "epoch": 1280} {"train_loss": -11.871444702148438, "global_step": 215120, "epoch": 1280} {"train_loss": -11.708688735961914, "global_step": 215121, "epoch": 1280} {"train_loss": -11.914606094360352, "global_step": 215122, "epoch": 1280} {"train_loss": -11.761606216430664, "global_step": 215123, "epoch": 1280} {"train_loss": -11.721145629882812, "global_step": 215124, "epoch": 1280} {"train_loss": -11.886411666870117, "global_step": 215125, "epoch": 1280} {"train_loss": -11.926142692565918, "global_step": 215126, "epoch": 1280} {"train_loss": -11.922304153442383, "global_step": 215127, "epoch": 1280} {"train_loss": -11.757223129272461, "global_step": 215128, "epoch": 1280} {"train_loss": -11.830904006958008, "global_step": 215129, "epoch": 1280} {"train_loss": -11.850336074829102, "global_step": 215130, "epoch": 1280} {"train_loss": -12.028814315795898, "global_step": 215131, "epoch": 1280} {"train_loss": -12.122966766357422, "global_step": 215132, "epoch": 1280} {"train_loss": -11.740762710571289, "global_step": 215133, "epoch": 1280} {"train_loss": -11.981781959533691, "global_step": 215134, "epoch": 1280} {"train_loss": -11.970359802246094, "global_step": 215135, "epoch": 1280} {"train_loss": -11.798908233642578, "global_step": 215136, "epoch": 1280} {"train_loss": -11.994590759277344, "global_step": 215137, "epoch": 1280} {"train_loss": -11.786131858825684, "global_step": 215138, "epoch": 1280} {"train_loss": -11.756195068359375, "global_step": 215139, "epoch": 1280} {"train_loss": -11.929973602294922, "global_step": 215140, "epoch": 1280} {"train_loss": -11.730756759643555, "global_step": 215141, "epoch": 1280} {"train_loss": -11.614465713500977, "global_step": 215142, "epoch": 1280} {"train_loss": -11.957834243774414, "global_step": 215143, "epoch": 1280} {"train_loss": -11.752847671508789, "global_step": 215144, "epoch": 1280} {"train_loss": -11.234739303588867, "global_step": 215145, "epoch": 1280} {"train_loss": -11.01309585571289, "global_step": 215146, "epoch": 1280} {"train_loss": -11.066646575927734, "global_step": 215147, "epoch": 1280} {"train_loss": -11.438222885131836, "global_step": 215148, "epoch": 1280} {"train_loss": -10.876795768737793, "global_step": 215149, "epoch": 1280} {"train_loss": -11.711177825927734, "global_step": 215150, "epoch": 1280} {"train_loss": -11.502424240112305, "global_step": 215151, "epoch": 1280} {"train_loss": -11.41575813293457, "global_step": 215152, "epoch": 1280} {"train_loss": -10.901044845581055, "global_step": 215153, "epoch": 1280} {"train_loss": -11.117900848388672, "global_step": 215154, "epoch": 1280} {"train_loss": -11.525304794311523, "global_step": 215155, "epoch": 1280} {"train_loss": -11.43448257446289, "global_step": 215156, "epoch": 1280} {"train_loss": -11.389291763305664, "global_step": 215157, "epoch": 1280} {"train_loss": -10.921442985534668, "global_step": 215158, "epoch": 1280} {"train_loss": -9.763496398925781, "global_step": 215159, "epoch": 1280} {"train_loss": -10.543789863586426, "global_step": 215160, "epoch": 1280} {"train_loss": -10.53559684753418, "global_step": 215161, "epoch": 1280} {"train_loss": -10.088321685791016, "global_step": 215162, "epoch": 1280} {"train_loss": -10.67374038696289, "global_step": 215163, "epoch": 1280} {"train_loss": -10.858652114868164, "global_step": 215164, "epoch": 1280} {"train_loss": -10.284181594848633, "global_step": 215165, "epoch": 1280} {"train_loss": -11.140575408935547, "global_step": 215166, "epoch": 1280} {"train_loss": -11.013760566711426, "global_step": 215167, "epoch": 1280} {"train_loss": -11.186563491821289, "global_step": 215168, "epoch": 1280} {"train_loss": -11.09754467010498, "global_step": 215169, "epoch": 1280} {"train_loss": -11.205497741699219, "global_step": 215170, "epoch": 1280} {"train_loss": -10.932062149047852, "global_step": 215171, "epoch": 1280} {"train_loss": -10.856633186340332, "global_step": 215172, "epoch": 1280} {"train_loss": -11.223764419555664, "global_step": 215173, "epoch": 1280} {"train_loss": -11.121328353881836, "global_step": 215174, "epoch": 1280} {"train_loss": -10.95913028717041, "global_step": 215175, "epoch": 1280} {"train_loss": -11.267118453979492, "global_step": 215176, "epoch": 1280} {"train_loss": -11.25051212310791, "global_step": 215177, "epoch": 1280} {"train_loss": -11.390274047851562, "global_step": 215178, "epoch": 1280} {"train_loss": -11.097370147705078, "global_step": 215179, "epoch": 1280} {"train_loss": -11.46653938293457, "global_step": 215180, "epoch": 1280} {"train_loss": -11.420600891113281, "global_step": 215181, "epoch": 1280} {"train_loss": -11.029940605163574, "global_step": 215182, "epoch": 1280} {"train_loss": -11.55175495147705, "global_step": 215183, "epoch": 1280} {"train_loss": -11.384918212890625, "global_step": 215184, "epoch": 1280} {"train_loss": -11.302549362182617, "global_step": 215185, "epoch": 1280} {"train_loss": -11.359463691711426, "global_step": 215186, "epoch": 1280} {"train_loss": -11.259712219238281, "global_step": 215187, "epoch": 1280} {"train_loss": -11.561120986938477, "global_step": 215188, "epoch": 1280} {"train_loss": -11.235428810119629, "global_step": 215189, "epoch": 1280} {"train_loss": -11.520423889160156, "global_step": 215190, "epoch": 1280} {"train_loss": -11.326141357421875, "global_step": 215191, "epoch": 1280} {"train_loss": -11.397298812866211, "global_step": 215192, "epoch": 1280} {"train_loss": -11.6649169921875, "global_step": 215193, "epoch": 1280} {"train_loss": -11.31621265411377, "global_step": 215194, "epoch": 1280} {"train_loss": -11.559283256530762, "global_step": 215195, "epoch": 1280} {"train_loss": -11.501519203186035, "global_step": 215196, "epoch": 1280} {"train_loss": -11.412971496582031, "global_step": 215197, "epoch": 1280} {"train_loss": -11.700366973876953, "global_step": 215198, "epoch": 1280} {"train_loss": -11.266057968139648, "global_step": 215199, "epoch": 1280} {"train_loss": -11.691088676452637, "global_step": 215200, "epoch": 1280} {"train_loss": -11.513372421264648, "global_step": 215201, "epoch": 1280} {"train_loss": -11.157258987426758, "global_step": 215202, "epoch": 1280} {"train_loss": -11.843920707702637, "global_step": 215203, "epoch": 1280} {"train_loss": -11.281455993652344, "global_step": 215204, "epoch": 1280} {"train_loss": -11.528489112854004, "global_step": 215205, "epoch": 1280} {"train_loss": -11.724954605102539, "global_step": 215206, "epoch": 1280} {"train_loss": -11.32982425462632, "global_step": 215207, "epoch": 1280, "val_loss": 256455.609375, "train_action_mse_error": 2.205852508544922} {"train_loss": -11.788373947143555, "global_step": 215208, "epoch": 1281} {"train_loss": -11.492179870605469, "global_step": 215209, "epoch": 1281} {"train_loss": -11.77020263671875, "global_step": 215210, "epoch": 1281} {"train_loss": -11.819347381591797, "global_step": 215211, "epoch": 1281} {"train_loss": -11.63654899597168, "global_step": 215212, "epoch": 1281} {"train_loss": -11.810796737670898, "global_step": 215213, "epoch": 1281} {"train_loss": -11.71368408203125, "global_step": 215214, "epoch": 1281} {"train_loss": -11.967784881591797, "global_step": 215215, "epoch": 1281} {"train_loss": -11.857397079467773, "global_step": 215216, "epoch": 1281} {"train_loss": -11.616411209106445, "global_step": 215217, "epoch": 1281} {"train_loss": -11.789047241210938, "global_step": 215218, "epoch": 1281} {"train_loss": -11.668481826782227, "global_step": 215219, "epoch": 1281} {"train_loss": -11.62277603149414, "global_step": 215220, "epoch": 1281} {"train_loss": -11.744038581848145, "global_step": 215221, "epoch": 1281} {"train_loss": -11.345120429992676, "global_step": 215222, "epoch": 1281} {"train_loss": -11.601713180541992, "global_step": 215223, "epoch": 1281} {"train_loss": -11.516246795654297, "global_step": 215224, "epoch": 1281} {"train_loss": -11.11928653717041, "global_step": 215225, "epoch": 1281} {"train_loss": -11.73110580444336, "global_step": 215226, "epoch": 1281} {"train_loss": -11.003676414489746, "global_step": 215227, "epoch": 1281} {"train_loss": -11.647655487060547, "global_step": 215228, "epoch": 1281} {"train_loss": -11.683588027954102, "global_step": 215229, "epoch": 1281} {"train_loss": -11.346715927124023, "global_step": 215230, "epoch": 1281} {"train_loss": -11.523432731628418, "global_step": 215231, "epoch": 1281} {"train_loss": -11.45041275024414, "global_step": 215232, "epoch": 1281} {"train_loss": -11.189594268798828, "global_step": 215233, "epoch": 1281} {"train_loss": -11.418119430541992, "global_step": 215234, "epoch": 1281} {"train_loss": -10.550432205200195, "global_step": 215235, "epoch": 1281} {"train_loss": -11.646202087402344, "global_step": 215236, "epoch": 1281} {"train_loss": -10.89755630493164, "global_step": 215237, "epoch": 1281} {"train_loss": -11.466300010681152, "global_step": 215238, "epoch": 1281} {"train_loss": -10.885175704956055, "global_step": 215239, "epoch": 1281} {"train_loss": -11.45505142211914, "global_step": 215240, "epoch": 1281} {"train_loss": -11.452585220336914, "global_step": 215241, "epoch": 1281} {"train_loss": -11.487220764160156, "global_step": 215242, "epoch": 1281} {"train_loss": -11.469352722167969, "global_step": 215243, "epoch": 1281} {"train_loss": -11.293689727783203, "global_step": 215244, "epoch": 1281} {"train_loss": -11.295183181762695, "global_step": 215245, "epoch": 1281} {"train_loss": -11.235048294067383, "global_step": 215246, "epoch": 1281} {"train_loss": -11.632285118103027, "global_step": 215247, "epoch": 1281} {"train_loss": -11.202103614807129, "global_step": 215248, "epoch": 1281} {"train_loss": -11.480320930480957, "global_step": 215249, "epoch": 1281} {"train_loss": -11.424190521240234, "global_step": 215250, "epoch": 1281} {"train_loss": -11.173391342163086, "global_step": 215251, "epoch": 1281} {"train_loss": -11.051825523376465, "global_step": 215252, "epoch": 1281} {"train_loss": -10.935672760009766, "global_step": 215253, "epoch": 1281} {"train_loss": -11.29946517944336, "global_step": 215254, "epoch": 1281} {"train_loss": -11.346193313598633, "global_step": 215255, "epoch": 1281} {"train_loss": -11.021427154541016, "global_step": 215256, "epoch": 1281} {"train_loss": -11.021795272827148, "global_step": 215257, "epoch": 1281} {"train_loss": -11.361215591430664, "global_step": 215258, "epoch": 1281} {"train_loss": -11.430462837219238, "global_step": 215259, "epoch": 1281} {"train_loss": -10.827295303344727, "global_step": 215260, "epoch": 1281} {"train_loss": -11.418033599853516, "global_step": 215261, "epoch": 1281} {"train_loss": -11.318315505981445, "global_step": 215262, "epoch": 1281} {"train_loss": -11.535188674926758, "global_step": 215263, "epoch": 1281} {"train_loss": -11.505081176757812, "global_step": 215264, "epoch": 1281} {"train_loss": -11.239425659179688, "global_step": 215265, "epoch": 1281} {"train_loss": -11.608598709106445, "global_step": 215266, "epoch": 1281} {"train_loss": -11.532188415527344, "global_step": 215267, "epoch": 1281} {"train_loss": -11.557229995727539, "global_step": 215268, "epoch": 1281} {"train_loss": -11.693459510803223, "global_step": 215269, "epoch": 1281} {"train_loss": -11.84918212890625, "global_step": 215270, "epoch": 1281} {"train_loss": -11.618959426879883, "global_step": 215271, "epoch": 1281} {"train_loss": -11.88684368133545, "global_step": 215272, "epoch": 1281} {"train_loss": -11.840536117553711, "global_step": 215273, "epoch": 1281} {"train_loss": -11.69229507446289, "global_step": 215274, "epoch": 1281} {"train_loss": -11.92364501953125, "global_step": 215275, "epoch": 1281} {"train_loss": -11.607038497924805, "global_step": 215276, "epoch": 1281} {"train_loss": -11.546487808227539, "global_step": 215277, "epoch": 1281} {"train_loss": -11.281753540039062, "global_step": 215278, "epoch": 1281} {"train_loss": -11.357278823852539, "global_step": 215279, "epoch": 1281} {"train_loss": -11.596181869506836, "global_step": 215280, "epoch": 1281} {"train_loss": -11.443262100219727, "global_step": 215281, "epoch": 1281} {"train_loss": -11.54003620147705, "global_step": 215282, "epoch": 1281} {"train_loss": -10.990087509155273, "global_step": 215283, "epoch": 1281} {"train_loss": -10.935697555541992, "global_step": 215284, "epoch": 1281} {"train_loss": -11.4785795211792, "global_step": 215285, "epoch": 1281} {"train_loss": -11.648971557617188, "global_step": 215286, "epoch": 1281} {"train_loss": -10.483072280883789, "global_step": 215287, "epoch": 1281} {"train_loss": -11.108630180358887, "global_step": 215288, "epoch": 1281} {"train_loss": -11.45409107208252, "global_step": 215289, "epoch": 1281} {"train_loss": -11.358055114746094, "global_step": 215290, "epoch": 1281} {"train_loss": -11.61465835571289, "global_step": 215291, "epoch": 1281} {"train_loss": -11.491992950439453, "global_step": 215292, "epoch": 1281} {"train_loss": -10.957438468933105, "global_step": 215293, "epoch": 1281} {"train_loss": -11.673357963562012, "global_step": 215294, "epoch": 1281} {"train_loss": -11.221044540405273, "global_step": 215295, "epoch": 1281} {"train_loss": -10.995050430297852, "global_step": 215296, "epoch": 1281} {"train_loss": -11.571222305297852, "global_step": 215297, "epoch": 1281} {"train_loss": -10.826491355895996, "global_step": 215298, "epoch": 1281} {"train_loss": -11.139875411987305, "global_step": 215299, "epoch": 1281} {"train_loss": -10.813925743103027, "global_step": 215300, "epoch": 1281} {"train_loss": -11.393514633178711, "global_step": 215301, "epoch": 1281} {"train_loss": -10.86440372467041, "global_step": 215302, "epoch": 1281} {"train_loss": -10.952112197875977, "global_step": 215303, "epoch": 1281} {"train_loss": -11.260608673095703, "global_step": 215304, "epoch": 1281} {"train_loss": -11.236005783081055, "global_step": 215305, "epoch": 1281} {"train_loss": -11.19655990600586, "global_step": 215306, "epoch": 1281} {"train_loss": -11.519343376159668, "global_step": 215307, "epoch": 1281} {"train_loss": -11.013082504272461, "global_step": 215308, "epoch": 1281} {"train_loss": -11.34253215789795, "global_step": 215309, "epoch": 1281} {"train_loss": -11.052334785461426, "global_step": 215310, "epoch": 1281} {"train_loss": -11.513181686401367, "global_step": 215311, "epoch": 1281} {"train_loss": -11.078140258789062, "global_step": 215312, "epoch": 1281} {"train_loss": -11.496301651000977, "global_step": 215313, "epoch": 1281} {"train_loss": -10.77457046508789, "global_step": 215314, "epoch": 1281} {"train_loss": -11.089300155639648, "global_step": 215315, "epoch": 1281} {"train_loss": -10.851751327514648, "global_step": 215316, "epoch": 1281} {"train_loss": -11.101605415344238, "global_step": 215317, "epoch": 1281} {"train_loss": -11.382954597473145, "global_step": 215318, "epoch": 1281} {"train_loss": -11.361444473266602, "global_step": 215319, "epoch": 1281} {"train_loss": -11.025552749633789, "global_step": 215320, "epoch": 1281} {"train_loss": -11.03373908996582, "global_step": 215321, "epoch": 1281} {"train_loss": -11.161273002624512, "global_step": 215322, "epoch": 1281} {"train_loss": -10.882688522338867, "global_step": 215323, "epoch": 1281} {"train_loss": -11.409943580627441, "global_step": 215324, "epoch": 1281} {"train_loss": -11.080121040344238, "global_step": 215325, "epoch": 1281} {"train_loss": -11.179588317871094, "global_step": 215326, "epoch": 1281} {"train_loss": -11.030567169189453, "global_step": 215327, "epoch": 1281} {"train_loss": -10.833984375, "global_step": 215328, "epoch": 1281} {"train_loss": -10.447805404663086, "global_step": 215329, "epoch": 1281} {"train_loss": -10.746562957763672, "global_step": 215330, "epoch": 1281} {"train_loss": -10.599205017089844, "global_step": 215331, "epoch": 1281} {"train_loss": -10.703126907348633, "global_step": 215332, "epoch": 1281} {"train_loss": -10.236431121826172, "global_step": 215333, "epoch": 1281} {"train_loss": -10.873295783996582, "global_step": 215334, "epoch": 1281} {"train_loss": -10.991912841796875, "global_step": 215335, "epoch": 1281} {"train_loss": -11.203607559204102, "global_step": 215336, "epoch": 1281} {"train_loss": -10.964215278625488, "global_step": 215337, "epoch": 1281} {"train_loss": -11.304498672485352, "global_step": 215338, "epoch": 1281} {"train_loss": -11.070881843566895, "global_step": 215339, "epoch": 1281} {"train_loss": -11.201470375061035, "global_step": 215340, "epoch": 1281} {"train_loss": -11.464529037475586, "global_step": 215341, "epoch": 1281} {"train_loss": -11.17071533203125, "global_step": 215342, "epoch": 1281} {"train_loss": -11.25627613067627, "global_step": 215343, "epoch": 1281} {"train_loss": -11.262166976928711, "global_step": 215344, "epoch": 1281} {"train_loss": -11.273411750793457, "global_step": 215345, "epoch": 1281} {"train_loss": -11.62456226348877, "global_step": 215346, "epoch": 1281} {"train_loss": -11.436592102050781, "global_step": 215347, "epoch": 1281} {"train_loss": -11.431991577148438, "global_step": 215348, "epoch": 1281} {"train_loss": -11.44368839263916, "global_step": 215349, "epoch": 1281} {"train_loss": -11.700063705444336, "global_step": 215350, "epoch": 1281} {"train_loss": -11.653436660766602, "global_step": 215351, "epoch": 1281} {"train_loss": -11.440853118896484, "global_step": 215352, "epoch": 1281} {"train_loss": -11.718170166015625, "global_step": 215353, "epoch": 1281} {"train_loss": -11.553339004516602, "global_step": 215354, "epoch": 1281} {"train_loss": -11.393230438232422, "global_step": 215355, "epoch": 1281} {"train_loss": -11.669845581054688, "global_step": 215356, "epoch": 1281} {"train_loss": -11.467426300048828, "global_step": 215357, "epoch": 1281} {"train_loss": -11.838910102844238, "global_step": 215358, "epoch": 1281} {"train_loss": -11.642122268676758, "global_step": 215359, "epoch": 1281} {"train_loss": -11.645392417907715, "global_step": 215360, "epoch": 1281} {"train_loss": -11.713434219360352, "global_step": 215361, "epoch": 1281} {"train_loss": -11.62721061706543, "global_step": 215362, "epoch": 1281} {"train_loss": -11.444393157958984, "global_step": 215363, "epoch": 1281} {"train_loss": -12.000091552734375, "global_step": 215364, "epoch": 1281} {"train_loss": -11.584619522094727, "global_step": 215365, "epoch": 1281} {"train_loss": -11.554265022277832, "global_step": 215366, "epoch": 1281} {"train_loss": -11.755424499511719, "global_step": 215367, "epoch": 1281} {"train_loss": -11.814943313598633, "global_step": 215368, "epoch": 1281} {"train_loss": -11.70949935913086, "global_step": 215369, "epoch": 1281} {"train_loss": -11.909536361694336, "global_step": 215370, "epoch": 1281} {"train_loss": -11.754008293151855, "global_step": 215371, "epoch": 1281} {"train_loss": -11.880292892456055, "global_step": 215372, "epoch": 1281} {"train_loss": -11.970624923706055, "global_step": 215373, "epoch": 1281} {"train_loss": -11.930994987487793, "global_step": 215374, "epoch": 1281} {"train_loss": -11.372914728664217, "global_step": 215375, "epoch": 1281, "val_loss": 258314.140625} {"train_loss": -11.717955589294434, "global_step": 215376, "epoch": 1282} {"train_loss": -11.67281436920166, "global_step": 215377, "epoch": 1282} {"train_loss": -11.840023040771484, "global_step": 215378, "epoch": 1282} {"train_loss": -11.748273849487305, "global_step": 215379, "epoch": 1282} {"train_loss": -11.760831832885742, "global_step": 215380, "epoch": 1282} {"train_loss": -11.84253215789795, "global_step": 215381, "epoch": 1282} {"train_loss": -11.732040405273438, "global_step": 215382, "epoch": 1282} {"train_loss": -11.742805480957031, "global_step": 215383, "epoch": 1282} {"train_loss": -11.727314949035645, "global_step": 215384, "epoch": 1282} {"train_loss": -11.482049942016602, "global_step": 215385, "epoch": 1282} {"train_loss": -12.00544548034668, "global_step": 215386, "epoch": 1282} {"train_loss": -11.829248428344727, "global_step": 215387, "epoch": 1282} {"train_loss": -11.780355453491211, "global_step": 215388, "epoch": 1282} {"train_loss": -11.712689399719238, "global_step": 215389, "epoch": 1282} {"train_loss": -11.629524230957031, "global_step": 215390, "epoch": 1282} {"train_loss": -11.487861633300781, "global_step": 215391, "epoch": 1282} {"train_loss": -11.323283195495605, "global_step": 215392, "epoch": 1282} {"train_loss": -11.272500038146973, "global_step": 215393, "epoch": 1282} {"train_loss": -11.322164535522461, "global_step": 215394, "epoch": 1282} {"train_loss": -10.917466163635254, "global_step": 215395, "epoch": 1282} {"train_loss": -11.54847240447998, "global_step": 215396, "epoch": 1282} {"train_loss": -10.78238296508789, "global_step": 215397, "epoch": 1282} {"train_loss": -11.62971305847168, "global_step": 215398, "epoch": 1282} {"train_loss": -11.390701293945312, "global_step": 215399, "epoch": 1282} {"train_loss": -11.28697395324707, "global_step": 215400, "epoch": 1282} {"train_loss": -11.50520133972168, "global_step": 215401, "epoch": 1282} {"train_loss": -11.120616912841797, "global_step": 215402, "epoch": 1282} {"train_loss": -11.662866592407227, "global_step": 215403, "epoch": 1282} {"train_loss": -10.555303573608398, "global_step": 215404, "epoch": 1282} {"train_loss": -11.6038818359375, "global_step": 215405, "epoch": 1282} {"train_loss": -10.849853515625, "global_step": 215406, "epoch": 1282} {"train_loss": -11.83370590209961, "global_step": 215407, "epoch": 1282} {"train_loss": -10.719411849975586, "global_step": 215408, "epoch": 1282} {"train_loss": -11.445110321044922, "global_step": 215409, "epoch": 1282} {"train_loss": -11.483109474182129, "global_step": 215410, "epoch": 1282} {"train_loss": -10.841771125793457, "global_step": 215411, "epoch": 1282} {"train_loss": -11.418831825256348, "global_step": 215412, "epoch": 1282} {"train_loss": -11.0963716506958, "global_step": 215413, "epoch": 1282} {"train_loss": -11.312990188598633, "global_step": 215414, "epoch": 1282} {"train_loss": -11.04610538482666, "global_step": 215415, "epoch": 1282} {"train_loss": -10.465958595275879, "global_step": 215416, "epoch": 1282} {"train_loss": -11.220450401306152, "global_step": 215417, "epoch": 1282} {"train_loss": -11.416908264160156, "global_step": 215418, "epoch": 1282} {"train_loss": -10.320930480957031, "global_step": 215419, "epoch": 1282} {"train_loss": -11.082380294799805, "global_step": 215420, "epoch": 1282} {"train_loss": -11.482093811035156, "global_step": 215421, "epoch": 1282} {"train_loss": -11.23963451385498, "global_step": 215422, "epoch": 1282} {"train_loss": -10.980596542358398, "global_step": 215423, "epoch": 1282} {"train_loss": -10.857339859008789, "global_step": 215424, "epoch": 1282} {"train_loss": -10.920822143554688, "global_step": 215425, "epoch": 1282} {"train_loss": -10.949676513671875, "global_step": 215426, "epoch": 1282} {"train_loss": -10.753035545349121, "global_step": 215427, "epoch": 1282} {"train_loss": -11.5598783493042, "global_step": 215428, "epoch": 1282} {"train_loss": -11.098424911499023, "global_step": 215429, "epoch": 1282} {"train_loss": -11.050922393798828, "global_step": 215430, "epoch": 1282} {"train_loss": -10.742168426513672, "global_step": 215431, "epoch": 1282} {"train_loss": -11.533005714416504, "global_step": 215432, "epoch": 1282} {"train_loss": -11.434900283813477, "global_step": 215433, "epoch": 1282} {"train_loss": -11.312334060668945, "global_step": 215434, "epoch": 1282} {"train_loss": -11.14183235168457, "global_step": 215435, "epoch": 1282} {"train_loss": -11.195996284484863, "global_step": 215436, "epoch": 1282} {"train_loss": -10.858125686645508, "global_step": 215437, "epoch": 1282} {"train_loss": -11.308256149291992, "global_step": 215438, "epoch": 1282} {"train_loss": -11.359169006347656, "global_step": 215439, "epoch": 1282} {"train_loss": -11.304673194885254, "global_step": 215440, "epoch": 1282} {"train_loss": -11.144420623779297, "global_step": 215441, "epoch": 1282} {"train_loss": -11.403493881225586, "global_step": 215442, "epoch": 1282} {"train_loss": -11.451849937438965, "global_step": 215443, "epoch": 1282} {"train_loss": -11.42259407043457, "global_step": 215444, "epoch": 1282} {"train_loss": -11.247560501098633, "global_step": 215445, "epoch": 1282} {"train_loss": -10.90072250366211, "global_step": 215446, "epoch": 1282} {"train_loss": -11.459077835083008, "global_step": 215447, "epoch": 1282} {"train_loss": -11.030220031738281, "global_step": 215448, "epoch": 1282} {"train_loss": -11.47822380065918, "global_step": 215449, "epoch": 1282} {"train_loss": -11.042543411254883, "global_step": 215450, "epoch": 1282} {"train_loss": -10.82662582397461, "global_step": 215451, "epoch": 1282} {"train_loss": -11.557451248168945, "global_step": 215452, "epoch": 1282} {"train_loss": -11.040057182312012, "global_step": 215453, "epoch": 1282} {"train_loss": -11.460976600646973, "global_step": 215454, "epoch": 1282} {"train_loss": -11.347028732299805, "global_step": 215455, "epoch": 1282} {"train_loss": -11.076169967651367, "global_step": 215456, "epoch": 1282} {"train_loss": -11.649431228637695, "global_step": 215457, "epoch": 1282} {"train_loss": -11.195699691772461, "global_step": 215458, "epoch": 1282} {"train_loss": -11.365060806274414, "global_step": 215459, "epoch": 1282} {"train_loss": -11.335058212280273, "global_step": 215460, "epoch": 1282} {"train_loss": -11.316329956054688, "global_step": 215461, "epoch": 1282} {"train_loss": -11.56883430480957, "global_step": 215462, "epoch": 1282} {"train_loss": -11.296126365661621, "global_step": 215463, "epoch": 1282} {"train_loss": -11.579341888427734, "global_step": 215464, "epoch": 1282} {"train_loss": -11.290064811706543, "global_step": 215465, "epoch": 1282} {"train_loss": -11.472471237182617, "global_step": 215466, "epoch": 1282} {"train_loss": -11.584826469421387, "global_step": 215467, "epoch": 1282} {"train_loss": -11.497488021850586, "global_step": 215468, "epoch": 1282} {"train_loss": -11.41430950164795, "global_step": 215469, "epoch": 1282} {"train_loss": -11.255996704101562, "global_step": 215470, "epoch": 1282} {"train_loss": -11.305120468139648, "global_step": 215471, "epoch": 1282} {"train_loss": -11.060811042785645, "global_step": 215472, "epoch": 1282} {"train_loss": -10.539640426635742, "global_step": 215473, "epoch": 1282} {"train_loss": -11.174121856689453, "global_step": 215474, "epoch": 1282} {"train_loss": -11.331403732299805, "global_step": 215475, "epoch": 1282} {"train_loss": -11.626148223876953, "global_step": 215476, "epoch": 1282} {"train_loss": -11.229511260986328, "global_step": 215477, "epoch": 1282} {"train_loss": -11.539535522460938, "global_step": 215478, "epoch": 1282} {"train_loss": -11.459721565246582, "global_step": 215479, "epoch": 1282} {"train_loss": -11.62150764465332, "global_step": 215480, "epoch": 1282} {"train_loss": -11.564506530761719, "global_step": 215481, "epoch": 1282} {"train_loss": -11.465456008911133, "global_step": 215482, "epoch": 1282} {"train_loss": -11.027103424072266, "global_step": 215483, "epoch": 1282} {"train_loss": -11.226219177246094, "global_step": 215484, "epoch": 1282} {"train_loss": -11.019166946411133, "global_step": 215485, "epoch": 1282} {"train_loss": -11.657269477844238, "global_step": 215486, "epoch": 1282} {"train_loss": -11.538885116577148, "global_step": 215487, "epoch": 1282} {"train_loss": -11.540492057800293, "global_step": 215488, "epoch": 1282} {"train_loss": -11.4161958694458, "global_step": 215489, "epoch": 1282} {"train_loss": -11.720136642456055, "global_step": 215490, "epoch": 1282} {"train_loss": -11.472240447998047, "global_step": 215491, "epoch": 1282} {"train_loss": -11.792545318603516, "global_step": 215492, "epoch": 1282} {"train_loss": -11.939724922180176, "global_step": 215493, "epoch": 1282} {"train_loss": -11.654546737670898, "global_step": 215494, "epoch": 1282} {"train_loss": -11.75490665435791, "global_step": 215495, "epoch": 1282} {"train_loss": -11.627948760986328, "global_step": 215496, "epoch": 1282} {"train_loss": -11.790830612182617, "global_step": 215497, "epoch": 1282} {"train_loss": -11.788674354553223, "global_step": 215498, "epoch": 1282} {"train_loss": -11.336432456970215, "global_step": 215499, "epoch": 1282} {"train_loss": -11.72110652923584, "global_step": 215500, "epoch": 1282} {"train_loss": -11.821405410766602, "global_step": 215501, "epoch": 1282} {"train_loss": -11.721464157104492, "global_step": 215502, "epoch": 1282} {"train_loss": -11.590034484863281, "global_step": 215503, "epoch": 1282} {"train_loss": -11.709426879882812, "global_step": 215504, "epoch": 1282} {"train_loss": -11.590323448181152, "global_step": 215505, "epoch": 1282} {"train_loss": -11.661169052124023, "global_step": 215506, "epoch": 1282} {"train_loss": -11.218502044677734, "global_step": 215507, "epoch": 1282} {"train_loss": -11.372294425964355, "global_step": 215508, "epoch": 1282} {"train_loss": -11.592523574829102, "global_step": 215509, "epoch": 1282} {"train_loss": -11.290205001831055, "global_step": 215510, "epoch": 1282} {"train_loss": -11.874640464782715, "global_step": 215511, "epoch": 1282} {"train_loss": -11.212234497070312, "global_step": 215512, "epoch": 1282} {"train_loss": -11.184396743774414, "global_step": 215513, "epoch": 1282} {"train_loss": -11.442386627197266, "global_step": 215514, "epoch": 1282} {"train_loss": -11.435523986816406, "global_step": 215515, "epoch": 1282} {"train_loss": -11.375041961669922, "global_step": 215516, "epoch": 1282} {"train_loss": -11.749980926513672, "global_step": 215517, "epoch": 1282} {"train_loss": -11.604997634887695, "global_step": 215518, "epoch": 1282} {"train_loss": -11.339926719665527, "global_step": 215519, "epoch": 1282} {"train_loss": -11.542169570922852, "global_step": 215520, "epoch": 1282} {"train_loss": -11.087782859802246, "global_step": 215521, "epoch": 1282} {"train_loss": -11.345813751220703, "global_step": 215522, "epoch": 1282} {"train_loss": -11.167179107666016, "global_step": 215523, "epoch": 1282} {"train_loss": -10.830382347106934, "global_step": 215524, "epoch": 1282} {"train_loss": -11.561715126037598, "global_step": 215525, "epoch": 1282} {"train_loss": -10.429765701293945, "global_step": 215526, "epoch": 1282} {"train_loss": -11.177314758300781, "global_step": 215527, "epoch": 1282} {"train_loss": -10.085428237915039, "global_step": 215528, "epoch": 1282} {"train_loss": -10.331217765808105, "global_step": 215529, "epoch": 1282} {"train_loss": -11.384284973144531, "global_step": 215530, "epoch": 1282} {"train_loss": -10.538490295410156, "global_step": 215531, "epoch": 1282} {"train_loss": -11.493183135986328, "global_step": 215532, "epoch": 1282} {"train_loss": -10.669998168945312, "global_step": 215533, "epoch": 1282} {"train_loss": -11.0382661819458, "global_step": 215534, "epoch": 1282} {"train_loss": -11.13232707977295, "global_step": 215535, "epoch": 1282} {"train_loss": -10.538719177246094, "global_step": 215536, "epoch": 1282} {"train_loss": -11.245506286621094, "global_step": 215537, "epoch": 1282} {"train_loss": -9.955145835876465, "global_step": 215538, "epoch": 1282} {"train_loss": -11.492136001586914, "global_step": 215539, "epoch": 1282} {"train_loss": -10.37985610961914, "global_step": 215540, "epoch": 1282} {"train_loss": -11.354955673217773, "global_step": 215541, "epoch": 1282} {"train_loss": -9.888362884521484, "global_step": 215542, "epoch": 1282} {"train_loss": -11.304091266223363, "global_step": 215543, "epoch": 1282, "val_loss": 256885.984375} {"train_loss": -10.711112976074219, "global_step": 215544, "epoch": 1283} {"train_loss": -10.927450180053711, "global_step": 215545, "epoch": 1283} {"train_loss": -10.970203399658203, "global_step": 215546, "epoch": 1283} {"train_loss": -10.953401565551758, "global_step": 215547, "epoch": 1283} {"train_loss": -10.983932495117188, "global_step": 215548, "epoch": 1283} {"train_loss": -11.303010940551758, "global_step": 215549, "epoch": 1283} {"train_loss": -11.323589324951172, "global_step": 215550, "epoch": 1283} {"train_loss": -11.192444801330566, "global_step": 215551, "epoch": 1283} {"train_loss": -11.299216270446777, "global_step": 215552, "epoch": 1283} {"train_loss": -11.395750045776367, "global_step": 215553, "epoch": 1283} {"train_loss": -11.441731452941895, "global_step": 215554, "epoch": 1283} {"train_loss": -11.378594398498535, "global_step": 215555, "epoch": 1283} {"train_loss": -11.51650619506836, "global_step": 215556, "epoch": 1283} {"train_loss": -11.429344177246094, "global_step": 215557, "epoch": 1283} {"train_loss": -11.494075775146484, "global_step": 215558, "epoch": 1283} {"train_loss": -11.453812599182129, "global_step": 215559, "epoch": 1283} {"train_loss": -11.514829635620117, "global_step": 215560, "epoch": 1283} {"train_loss": -11.51572036743164, "global_step": 215561, "epoch": 1283} {"train_loss": -11.47121524810791, "global_step": 215562, "epoch": 1283} {"train_loss": -11.632139205932617, "global_step": 215563, "epoch": 1283} {"train_loss": -11.383928298950195, "global_step": 215564, "epoch": 1283} {"train_loss": -11.473644256591797, "global_step": 215565, "epoch": 1283} {"train_loss": -11.417734146118164, "global_step": 215566, "epoch": 1283} {"train_loss": -11.424753189086914, "global_step": 215567, "epoch": 1283} {"train_loss": -11.680521011352539, "global_step": 215568, "epoch": 1283} {"train_loss": -11.350788116455078, "global_step": 215569, "epoch": 1283} {"train_loss": -11.487249374389648, "global_step": 215570, "epoch": 1283} {"train_loss": -11.252225875854492, "global_step": 215571, "epoch": 1283} {"train_loss": -11.782661437988281, "global_step": 215572, "epoch": 1283} {"train_loss": -11.089361190795898, "global_step": 215573, "epoch": 1283} {"train_loss": -11.50368881225586, "global_step": 215574, "epoch": 1283} {"train_loss": -11.419828414916992, "global_step": 215575, "epoch": 1283} {"train_loss": -11.491606712341309, "global_step": 215576, "epoch": 1283} {"train_loss": -11.368124008178711, "global_step": 215577, "epoch": 1283} {"train_loss": -11.52197265625, "global_step": 215578, "epoch": 1283} {"train_loss": -11.445356369018555, "global_step": 215579, "epoch": 1283} {"train_loss": -11.427087783813477, "global_step": 215580, "epoch": 1283} {"train_loss": -11.603006362915039, "global_step": 215581, "epoch": 1283} {"train_loss": -11.48393440246582, "global_step": 215582, "epoch": 1283} {"train_loss": -11.18649673461914, "global_step": 215583, "epoch": 1283} {"train_loss": -11.188837051391602, "global_step": 215584, "epoch": 1283} {"train_loss": -11.500162124633789, "global_step": 215585, "epoch": 1283} {"train_loss": -11.004005432128906, "global_step": 215586, "epoch": 1283} {"train_loss": -11.794593811035156, "global_step": 215587, "epoch": 1283} {"train_loss": -11.484701156616211, "global_step": 215588, "epoch": 1283} {"train_loss": -11.378658294677734, "global_step": 215589, "epoch": 1283} {"train_loss": -11.75282096862793, "global_step": 215590, "epoch": 1283} {"train_loss": -11.46046257019043, "global_step": 215591, "epoch": 1283} {"train_loss": -11.81734561920166, "global_step": 215592, "epoch": 1283} {"train_loss": -11.353487014770508, "global_step": 215593, "epoch": 1283} {"train_loss": -11.869343757629395, "global_step": 215594, "epoch": 1283} {"train_loss": -11.493350982666016, "global_step": 215595, "epoch": 1283} {"train_loss": -11.86575698852539, "global_step": 215596, "epoch": 1283} {"train_loss": -11.656723976135254, "global_step": 215597, "epoch": 1283} {"train_loss": -11.622756958007812, "global_step": 215598, "epoch": 1283} {"train_loss": -11.875303268432617, "global_step": 215599, "epoch": 1283} {"train_loss": -11.855274200439453, "global_step": 215600, "epoch": 1283} {"train_loss": -11.767455101013184, "global_step": 215601, "epoch": 1283} {"train_loss": -11.921655654907227, "global_step": 215602, "epoch": 1283} {"train_loss": -11.875921249389648, "global_step": 215603, "epoch": 1283} {"train_loss": -11.912726402282715, "global_step": 215604, "epoch": 1283} {"train_loss": -11.71930980682373, "global_step": 215605, "epoch": 1283} {"train_loss": -11.814918518066406, "global_step": 215606, "epoch": 1283} {"train_loss": -11.979366302490234, "global_step": 215607, "epoch": 1283} {"train_loss": -11.746082305908203, "global_step": 215608, "epoch": 1283} {"train_loss": -12.088974952697754, "global_step": 215609, "epoch": 1283} {"train_loss": -11.80112075805664, "global_step": 215610, "epoch": 1283} {"train_loss": -11.983622550964355, "global_step": 215611, "epoch": 1283} {"train_loss": -11.82492733001709, "global_step": 215612, "epoch": 1283} {"train_loss": -11.887432098388672, "global_step": 215613, "epoch": 1283} {"train_loss": -11.491674423217773, "global_step": 215614, "epoch": 1283} {"train_loss": -11.655506134033203, "global_step": 215615, "epoch": 1283} {"train_loss": -11.764369010925293, "global_step": 215616, "epoch": 1283} {"train_loss": -11.831661224365234, "global_step": 215617, "epoch": 1283} {"train_loss": -11.504742622375488, "global_step": 215618, "epoch": 1283} {"train_loss": -11.384698867797852, "global_step": 215619, "epoch": 1283} {"train_loss": -11.768949508666992, "global_step": 215620, "epoch": 1283} {"train_loss": -11.421483993530273, "global_step": 215621, "epoch": 1283} {"train_loss": -11.92056655883789, "global_step": 215622, "epoch": 1283} {"train_loss": -11.67962646484375, "global_step": 215623, "epoch": 1283} {"train_loss": -11.699771881103516, "global_step": 215624, "epoch": 1283} {"train_loss": -11.529138565063477, "global_step": 215625, "epoch": 1283} {"train_loss": -11.746532440185547, "global_step": 215626, "epoch": 1283} {"train_loss": -11.721267700195312, "global_step": 215627, "epoch": 1283} {"train_loss": -11.572321891784668, "global_step": 215628, "epoch": 1283} {"train_loss": -11.277299880981445, "global_step": 215629, "epoch": 1283} {"train_loss": -11.207725524902344, "global_step": 215630, "epoch": 1283} {"train_loss": -12.063257217407227, "global_step": 215631, "epoch": 1283} {"train_loss": -11.272047996520996, "global_step": 215632, "epoch": 1283} {"train_loss": -11.212276458740234, "global_step": 215633, "epoch": 1283} {"train_loss": -11.244302749633789, "global_step": 215634, "epoch": 1283} {"train_loss": -11.46274185180664, "global_step": 215635, "epoch": 1283} {"train_loss": -11.311884880065918, "global_step": 215636, "epoch": 1283} {"train_loss": -11.375741004943848, "global_step": 215637, "epoch": 1283} {"train_loss": -11.130037307739258, "global_step": 215638, "epoch": 1283} {"train_loss": -11.671189308166504, "global_step": 215639, "epoch": 1283} {"train_loss": -11.249476432800293, "global_step": 215640, "epoch": 1283} {"train_loss": -11.355891227722168, "global_step": 215641, "epoch": 1283} {"train_loss": -11.102649688720703, "global_step": 215642, "epoch": 1283} {"train_loss": -11.536808013916016, "global_step": 215643, "epoch": 1283} {"train_loss": -11.513440132141113, "global_step": 215644, "epoch": 1283} {"train_loss": -11.400705337524414, "global_step": 215645, "epoch": 1283} {"train_loss": -10.745606422424316, "global_step": 215646, "epoch": 1283} {"train_loss": -11.420564651489258, "global_step": 215647, "epoch": 1283} {"train_loss": -11.622649192810059, "global_step": 215648, "epoch": 1283} {"train_loss": -11.422425270080566, "global_step": 215649, "epoch": 1283} {"train_loss": -11.656746864318848, "global_step": 215650, "epoch": 1283} {"train_loss": -11.183843612670898, "global_step": 215651, "epoch": 1283} {"train_loss": -11.880548477172852, "global_step": 215652, "epoch": 1283} {"train_loss": -11.32342529296875, "global_step": 215653, "epoch": 1283} {"train_loss": -11.700830459594727, "global_step": 215654, "epoch": 1283} {"train_loss": -11.007709503173828, "global_step": 215655, "epoch": 1283} {"train_loss": -11.526504516601562, "global_step": 215656, "epoch": 1283} {"train_loss": -11.611385345458984, "global_step": 215657, "epoch": 1283} {"train_loss": -10.72685718536377, "global_step": 215658, "epoch": 1283} {"train_loss": -11.228973388671875, "global_step": 215659, "epoch": 1283} {"train_loss": -10.914179801940918, "global_step": 215660, "epoch": 1283} {"train_loss": -10.079808235168457, "global_step": 215661, "epoch": 1283} {"train_loss": -11.193353652954102, "global_step": 215662, "epoch": 1283} {"train_loss": -10.052902221679688, "global_step": 215663, "epoch": 1283} {"train_loss": -10.585750579833984, "global_step": 215664, "epoch": 1283} {"train_loss": -10.22817611694336, "global_step": 215665, "epoch": 1283} {"train_loss": -10.388557434082031, "global_step": 215666, "epoch": 1283} {"train_loss": -9.830521583557129, "global_step": 215667, "epoch": 1283} {"train_loss": -10.257795333862305, "global_step": 215668, "epoch": 1283} {"train_loss": -9.869043350219727, "global_step": 215669, "epoch": 1283} {"train_loss": -11.37990951538086, "global_step": 215670, "epoch": 1283} {"train_loss": -9.829099655151367, "global_step": 215671, "epoch": 1283} {"train_loss": -10.427511215209961, "global_step": 215672, "epoch": 1283} {"train_loss": -10.897336959838867, "global_step": 215673, "epoch": 1283} {"train_loss": -10.138819694519043, "global_step": 215674, "epoch": 1283} {"train_loss": -10.67603874206543, "global_step": 215675, "epoch": 1283} {"train_loss": -10.895755767822266, "global_step": 215676, "epoch": 1283} {"train_loss": -10.452618598937988, "global_step": 215677, "epoch": 1283} {"train_loss": -11.002693176269531, "global_step": 215678, "epoch": 1283} {"train_loss": -10.643661499023438, "global_step": 215679, "epoch": 1283} {"train_loss": -10.485437393188477, "global_step": 215680, "epoch": 1283} {"train_loss": -11.598967552185059, "global_step": 215681, "epoch": 1283} {"train_loss": -11.169572830200195, "global_step": 215682, "epoch": 1283} {"train_loss": -11.218881607055664, "global_step": 215683, "epoch": 1283} {"train_loss": -11.293319702148438, "global_step": 215684, "epoch": 1283} {"train_loss": -10.996681213378906, "global_step": 215685, "epoch": 1283} {"train_loss": -11.429569244384766, "global_step": 215686, "epoch": 1283} {"train_loss": -11.157303810119629, "global_step": 215687, "epoch": 1283} {"train_loss": -11.070707321166992, "global_step": 215688, "epoch": 1283} {"train_loss": -11.18331241607666, "global_step": 215689, "epoch": 1283} {"train_loss": -11.083162307739258, "global_step": 215690, "epoch": 1283} {"train_loss": -11.235313415527344, "global_step": 215691, "epoch": 1283} {"train_loss": -11.390280723571777, "global_step": 215692, "epoch": 1283} {"train_loss": -11.29758071899414, "global_step": 215693, "epoch": 1283} {"train_loss": -11.452699661254883, "global_step": 215694, "epoch": 1283} {"train_loss": -11.492050170898438, "global_step": 215695, "epoch": 1283} {"train_loss": -11.511370658874512, "global_step": 215696, "epoch": 1283} {"train_loss": -11.38453483581543, "global_step": 215697, "epoch": 1283} {"train_loss": -11.477510452270508, "global_step": 215698, "epoch": 1283} {"train_loss": -11.582468032836914, "global_step": 215699, "epoch": 1283} {"train_loss": -11.352900505065918, "global_step": 215700, "epoch": 1283} {"train_loss": -11.634339332580566, "global_step": 215701, "epoch": 1283} {"train_loss": -11.283632278442383, "global_step": 215702, "epoch": 1283} {"train_loss": -11.73775577545166, "global_step": 215703, "epoch": 1283} {"train_loss": -11.427724838256836, "global_step": 215704, "epoch": 1283} {"train_loss": -11.657929420471191, "global_step": 215705, "epoch": 1283} {"train_loss": -11.503715515136719, "global_step": 215706, "epoch": 1283} {"train_loss": -11.669876098632812, "global_step": 215707, "epoch": 1283} {"train_loss": -11.306034088134766, "global_step": 215708, "epoch": 1283} {"train_loss": -11.93112564086914, "global_step": 215709, "epoch": 1283} {"train_loss": -11.552865982055664, "global_step": 215710, "epoch": 1283} {"train_loss": -11.352307785125006, "global_step": 215711, "epoch": 1283, "val_loss": 254779.5625} {"train_loss": -11.572359085083008, "global_step": 215712, "epoch": 1284} {"train_loss": -11.631118774414062, "global_step": 215713, "epoch": 1284} {"train_loss": -11.148975372314453, "global_step": 215714, "epoch": 1284} {"train_loss": -11.614322662353516, "global_step": 215715, "epoch": 1284} {"train_loss": -11.173898696899414, "global_step": 215716, "epoch": 1284} {"train_loss": -11.223089218139648, "global_step": 215717, "epoch": 1284} {"train_loss": -11.480192184448242, "global_step": 215718, "epoch": 1284} {"train_loss": -11.420079231262207, "global_step": 215719, "epoch": 1284} {"train_loss": -11.430557250976562, "global_step": 215720, "epoch": 1284} {"train_loss": -11.602706909179688, "global_step": 215721, "epoch": 1284} {"train_loss": -11.418172836303711, "global_step": 215722, "epoch": 1284} {"train_loss": -11.635574340820312, "global_step": 215723, "epoch": 1284} {"train_loss": -11.336498260498047, "global_step": 215724, "epoch": 1284} {"train_loss": -11.741880416870117, "global_step": 215725, "epoch": 1284} {"train_loss": -11.508907318115234, "global_step": 215726, "epoch": 1284} {"train_loss": -11.555838584899902, "global_step": 215727, "epoch": 1284} {"train_loss": -11.856046676635742, "global_step": 215728, "epoch": 1284} {"train_loss": -11.390207290649414, "global_step": 215729, "epoch": 1284} {"train_loss": -11.807018280029297, "global_step": 215730, "epoch": 1284} {"train_loss": -11.372295379638672, "global_step": 215731, "epoch": 1284} {"train_loss": -11.496868133544922, "global_step": 215732, "epoch": 1284} {"train_loss": -11.830336570739746, "global_step": 215733, "epoch": 1284} {"train_loss": -11.441985130310059, "global_step": 215734, "epoch": 1284} {"train_loss": -11.40882682800293, "global_step": 215735, "epoch": 1284} {"train_loss": -11.512798309326172, "global_step": 215736, "epoch": 1284} {"train_loss": -10.337417602539062, "global_step": 215737, "epoch": 1284} {"train_loss": -10.80643081665039, "global_step": 215738, "epoch": 1284} {"train_loss": -11.8136568069458, "global_step": 215739, "epoch": 1284} {"train_loss": -10.540645599365234, "global_step": 215740, "epoch": 1284} {"train_loss": -11.473085403442383, "global_step": 215741, "epoch": 1284} {"train_loss": -11.180732727050781, "global_step": 215742, "epoch": 1284} {"train_loss": -11.33475112915039, "global_step": 215743, "epoch": 1284} {"train_loss": -11.396678924560547, "global_step": 215744, "epoch": 1284} {"train_loss": -11.246617317199707, "global_step": 215745, "epoch": 1284} {"train_loss": -10.897969245910645, "global_step": 215746, "epoch": 1284} {"train_loss": -11.008056640625, "global_step": 215747, "epoch": 1284} {"train_loss": -11.120670318603516, "global_step": 215748, "epoch": 1284} {"train_loss": -10.87116527557373, "global_step": 215749, "epoch": 1284} {"train_loss": -11.246540069580078, "global_step": 215750, "epoch": 1284} {"train_loss": -10.851404190063477, "global_step": 215751, "epoch": 1284} {"train_loss": -11.279804229736328, "global_step": 215752, "epoch": 1284} {"train_loss": -11.16346549987793, "global_step": 215753, "epoch": 1284} {"train_loss": -10.8170747756958, "global_step": 215754, "epoch": 1284} {"train_loss": -11.604414939880371, "global_step": 215755, "epoch": 1284} {"train_loss": -10.112749099731445, "global_step": 215756, "epoch": 1284} {"train_loss": -11.310538291931152, "global_step": 215757, "epoch": 1284} {"train_loss": -10.945634841918945, "global_step": 215758, "epoch": 1284} {"train_loss": -11.152791976928711, "global_step": 215759, "epoch": 1284} {"train_loss": -11.174456596374512, "global_step": 215760, "epoch": 1284} {"train_loss": -10.78001594543457, "global_step": 215761, "epoch": 1284} {"train_loss": -11.169153213500977, "global_step": 215762, "epoch": 1284} {"train_loss": -10.653605461120605, "global_step": 215763, "epoch": 1284} {"train_loss": -11.546920776367188, "global_step": 215764, "epoch": 1284} {"train_loss": -10.754984855651855, "global_step": 215765, "epoch": 1284} {"train_loss": -11.411210060119629, "global_step": 215766, "epoch": 1284} {"train_loss": -10.820182800292969, "global_step": 215767, "epoch": 1284} {"train_loss": -10.452820777893066, "global_step": 215768, "epoch": 1284} {"train_loss": -11.169512748718262, "global_step": 215769, "epoch": 1284} {"train_loss": -10.078934669494629, "global_step": 215770, "epoch": 1284} {"train_loss": -11.585905075073242, "global_step": 215771, "epoch": 1284} {"train_loss": -10.85873031616211, "global_step": 215772, "epoch": 1284} {"train_loss": -11.164752960205078, "global_step": 215773, "epoch": 1284} {"train_loss": -11.258794784545898, "global_step": 215774, "epoch": 1284} {"train_loss": -11.15156364440918, "global_step": 215775, "epoch": 1284} {"train_loss": -11.353860855102539, "global_step": 215776, "epoch": 1284} {"train_loss": -11.642510414123535, "global_step": 215777, "epoch": 1284} {"train_loss": -11.452455520629883, "global_step": 215778, "epoch": 1284} {"train_loss": -11.583330154418945, "global_step": 215779, "epoch": 1284} {"train_loss": -11.495993614196777, "global_step": 215780, "epoch": 1284} {"train_loss": -11.813234329223633, "global_step": 215781, "epoch": 1284} {"train_loss": -11.561258316040039, "global_step": 215782, "epoch": 1284} {"train_loss": -11.535133361816406, "global_step": 215783, "epoch": 1284} {"train_loss": -11.803595542907715, "global_step": 215784, "epoch": 1284} {"train_loss": -11.787285804748535, "global_step": 215785, "epoch": 1284} {"train_loss": -11.57596206665039, "global_step": 215786, "epoch": 1284} {"train_loss": -11.800979614257812, "global_step": 215787, "epoch": 1284} {"train_loss": -11.514644622802734, "global_step": 215788, "epoch": 1284} {"train_loss": -11.804290771484375, "global_step": 215789, "epoch": 1284} {"train_loss": -11.747048377990723, "global_step": 215790, "epoch": 1284} {"train_loss": -11.705461502075195, "global_step": 215791, "epoch": 1284} {"train_loss": -11.225767135620117, "global_step": 215792, "epoch": 1284} {"train_loss": -11.716403007507324, "global_step": 215793, "epoch": 1284} {"train_loss": -11.49979305267334, "global_step": 215794, "epoch": 1284} {"train_loss": -11.818788528442383, "global_step": 215795, "epoch": 1284} {"train_loss": -11.511639595031738, "global_step": 215796, "epoch": 1284} {"train_loss": -11.562719345092773, "global_step": 215797, "epoch": 1284} {"train_loss": -11.47758674621582, "global_step": 215798, "epoch": 1284} {"train_loss": -11.627847671508789, "global_step": 215799, "epoch": 1284} {"train_loss": -11.667558670043945, "global_step": 215800, "epoch": 1284} {"train_loss": -11.592159271240234, "global_step": 215801, "epoch": 1284} {"train_loss": -11.628745079040527, "global_step": 215802, "epoch": 1284} {"train_loss": -11.496113777160645, "global_step": 215803, "epoch": 1284} {"train_loss": -11.649740219116211, "global_step": 215804, "epoch": 1284} {"train_loss": -11.535013198852539, "global_step": 215805, "epoch": 1284} {"train_loss": -11.759846687316895, "global_step": 215806, "epoch": 1284} {"train_loss": -11.373739242553711, "global_step": 215807, "epoch": 1284} {"train_loss": -11.278099060058594, "global_step": 215808, "epoch": 1284} {"train_loss": -11.429325103759766, "global_step": 215809, "epoch": 1284} {"train_loss": -11.644340515136719, "global_step": 215810, "epoch": 1284} {"train_loss": -11.694632530212402, "global_step": 215811, "epoch": 1284} {"train_loss": -11.641458511352539, "global_step": 215812, "epoch": 1284} {"train_loss": -11.667684555053711, "global_step": 215813, "epoch": 1284} {"train_loss": -11.552820205688477, "global_step": 215814, "epoch": 1284} {"train_loss": -11.710092544555664, "global_step": 215815, "epoch": 1284} {"train_loss": -11.49148178100586, "global_step": 215816, "epoch": 1284} {"train_loss": -11.389721870422363, "global_step": 215817, "epoch": 1284} {"train_loss": -11.756288528442383, "global_step": 215818, "epoch": 1284} {"train_loss": -11.445194244384766, "global_step": 215819, "epoch": 1284} {"train_loss": -11.580466270446777, "global_step": 215820, "epoch": 1284} {"train_loss": -11.756998062133789, "global_step": 215821, "epoch": 1284} {"train_loss": -11.74404525756836, "global_step": 215822, "epoch": 1284} {"train_loss": -11.869536399841309, "global_step": 215823, "epoch": 1284} {"train_loss": -11.804518699645996, "global_step": 215824, "epoch": 1284} {"train_loss": -11.50199031829834, "global_step": 215825, "epoch": 1284} {"train_loss": -11.7020845413208, "global_step": 215826, "epoch": 1284} {"train_loss": -11.902270317077637, "global_step": 215827, "epoch": 1284} {"train_loss": -11.74886417388916, "global_step": 215828, "epoch": 1284} {"train_loss": -11.841594696044922, "global_step": 215829, "epoch": 1284} {"train_loss": -11.683744430541992, "global_step": 215830, "epoch": 1284} {"train_loss": -11.623845100402832, "global_step": 215831, "epoch": 1284} {"train_loss": -11.868112564086914, "global_step": 215832, "epoch": 1284} {"train_loss": -11.896344184875488, "global_step": 215833, "epoch": 1284} {"train_loss": -11.766874313354492, "global_step": 215834, "epoch": 1284} {"train_loss": -11.719398498535156, "global_step": 215835, "epoch": 1284} {"train_loss": -12.030874252319336, "global_step": 215836, "epoch": 1284} {"train_loss": -11.58462142944336, "global_step": 215837, "epoch": 1284} {"train_loss": -11.36441707611084, "global_step": 215838, "epoch": 1284} {"train_loss": -11.626619338989258, "global_step": 215839, "epoch": 1284} {"train_loss": -11.626898765563965, "global_step": 215840, "epoch": 1284} {"train_loss": -10.82597541809082, "global_step": 215841, "epoch": 1284} {"train_loss": -11.14862060546875, "global_step": 215842, "epoch": 1284} {"train_loss": -11.673067092895508, "global_step": 215843, "epoch": 1284} {"train_loss": -11.509408950805664, "global_step": 215844, "epoch": 1284} {"train_loss": -10.797651290893555, "global_step": 215845, "epoch": 1284} {"train_loss": -11.596990585327148, "global_step": 215846, "epoch": 1284} {"train_loss": -11.496335983276367, "global_step": 215847, "epoch": 1284} {"train_loss": -11.33468246459961, "global_step": 215848, "epoch": 1284} {"train_loss": -11.654772758483887, "global_step": 215849, "epoch": 1284} {"train_loss": -11.689767837524414, "global_step": 215850, "epoch": 1284} {"train_loss": -11.705294609069824, "global_step": 215851, "epoch": 1284} {"train_loss": -11.327330589294434, "global_step": 215852, "epoch": 1284} {"train_loss": -11.355123519897461, "global_step": 215853, "epoch": 1284} {"train_loss": -11.501367568969727, "global_step": 215854, "epoch": 1284} {"train_loss": -11.706779479980469, "global_step": 215855, "epoch": 1284} {"train_loss": -11.330135345458984, "global_step": 215856, "epoch": 1284} {"train_loss": -11.414579391479492, "global_step": 215857, "epoch": 1284} {"train_loss": -11.455810546875, "global_step": 215858, "epoch": 1284} {"train_loss": -11.319217681884766, "global_step": 215859, "epoch": 1284} {"train_loss": -11.802572250366211, "global_step": 215860, "epoch": 1284} {"train_loss": -11.470052719116211, "global_step": 215861, "epoch": 1284} {"train_loss": -11.145928382873535, "global_step": 215862, "epoch": 1284} {"train_loss": -11.514942169189453, "global_step": 215863, "epoch": 1284} {"train_loss": -11.442561149597168, "global_step": 215864, "epoch": 1284} {"train_loss": -10.845197677612305, "global_step": 215865, "epoch": 1284} {"train_loss": -11.220186233520508, "global_step": 215866, "epoch": 1284} {"train_loss": -11.27575969696045, "global_step": 215867, "epoch": 1284} {"train_loss": -11.032571792602539, "global_step": 215868, "epoch": 1284} {"train_loss": -11.789579391479492, "global_step": 215869, "epoch": 1284} {"train_loss": -11.27994155883789, "global_step": 215870, "epoch": 1284} {"train_loss": -11.24849796295166, "global_step": 215871, "epoch": 1284} {"train_loss": -11.14103889465332, "global_step": 215872, "epoch": 1284} {"train_loss": -11.350345611572266, "global_step": 215873, "epoch": 1284} {"train_loss": -10.80949592590332, "global_step": 215874, "epoch": 1284} {"train_loss": -11.147357940673828, "global_step": 215875, "epoch": 1284} {"train_loss": -10.76959228515625, "global_step": 215876, "epoch": 1284} {"train_loss": -10.708671569824219, "global_step": 215877, "epoch": 1284} {"train_loss": -11.006291389465332, "global_step": 215878, "epoch": 1284} {"train_loss": -11.400976186706906, "global_step": 215879, "epoch": 1284, "val_loss": 256235.90625} {"train_loss": -11.339202880859375, "global_step": 215880, "epoch": 1285} {"train_loss": -11.159133911132812, "global_step": 215881, "epoch": 1285} {"train_loss": -11.404788970947266, "global_step": 215882, "epoch": 1285} {"train_loss": -11.324057579040527, "global_step": 215883, "epoch": 1285} {"train_loss": -11.206838607788086, "global_step": 215884, "epoch": 1285} {"train_loss": -11.459824562072754, "global_step": 215885, "epoch": 1285} {"train_loss": -11.227182388305664, "global_step": 215886, "epoch": 1285} {"train_loss": -11.370847702026367, "global_step": 215887, "epoch": 1285} {"train_loss": -11.665390014648438, "global_step": 215888, "epoch": 1285} {"train_loss": -11.338449478149414, "global_step": 215889, "epoch": 1285} {"train_loss": -11.51748275756836, "global_step": 215890, "epoch": 1285} {"train_loss": -11.35816764831543, "global_step": 215891, "epoch": 1285} {"train_loss": -11.288167953491211, "global_step": 215892, "epoch": 1285} {"train_loss": -11.687666893005371, "global_step": 215893, "epoch": 1285} {"train_loss": -11.409147262573242, "global_step": 215894, "epoch": 1285} {"train_loss": -11.372152328491211, "global_step": 215895, "epoch": 1285} {"train_loss": -11.482036590576172, "global_step": 215896, "epoch": 1285} {"train_loss": -11.329345703125, "global_step": 215897, "epoch": 1285} {"train_loss": -10.713102340698242, "global_step": 215898, "epoch": 1285} {"train_loss": -11.430013656616211, "global_step": 215899, "epoch": 1285} {"train_loss": -10.905279159545898, "global_step": 215900, "epoch": 1285} {"train_loss": -10.948619842529297, "global_step": 215901, "epoch": 1285} {"train_loss": -10.947830200195312, "global_step": 215902, "epoch": 1285} {"train_loss": -10.374292373657227, "global_step": 215903, "epoch": 1285} {"train_loss": -11.519046783447266, "global_step": 215904, "epoch": 1285} {"train_loss": -10.284442901611328, "global_step": 215905, "epoch": 1285} {"train_loss": -11.617781639099121, "global_step": 215906, "epoch": 1285} {"train_loss": -10.524882316589355, "global_step": 215907, "epoch": 1285} {"train_loss": -11.421175003051758, "global_step": 215908, "epoch": 1285} {"train_loss": -11.013433456420898, "global_step": 215909, "epoch": 1285} {"train_loss": -11.097307205200195, "global_step": 215910, "epoch": 1285} {"train_loss": -11.307641983032227, "global_step": 215911, "epoch": 1285} {"train_loss": -10.817416191101074, "global_step": 215912, "epoch": 1285} {"train_loss": -11.59837532043457, "global_step": 215913, "epoch": 1285} {"train_loss": -11.438206672668457, "global_step": 215914, "epoch": 1285} {"train_loss": -11.296063423156738, "global_step": 215915, "epoch": 1285} {"train_loss": -11.314593315124512, "global_step": 215916, "epoch": 1285} {"train_loss": -11.45012092590332, "global_step": 215917, "epoch": 1285} {"train_loss": -11.152740478515625, "global_step": 215918, "epoch": 1285} {"train_loss": -11.300148010253906, "global_step": 215919, "epoch": 1285} {"train_loss": -11.35726547241211, "global_step": 215920, "epoch": 1285} {"train_loss": -11.146510124206543, "global_step": 215921, "epoch": 1285} {"train_loss": -11.13801097869873, "global_step": 215922, "epoch": 1285} {"train_loss": -11.326984405517578, "global_step": 215923, "epoch": 1285} {"train_loss": -11.036029815673828, "global_step": 215924, "epoch": 1285} {"train_loss": -11.482077598571777, "global_step": 215925, "epoch": 1285} {"train_loss": -11.265066146850586, "global_step": 215926, "epoch": 1285} {"train_loss": -11.311455726623535, "global_step": 215927, "epoch": 1285} {"train_loss": -11.325678825378418, "global_step": 215928, "epoch": 1285} {"train_loss": -11.353686332702637, "global_step": 215929, "epoch": 1285} {"train_loss": -11.10053825378418, "global_step": 215930, "epoch": 1285} {"train_loss": -11.71403694152832, "global_step": 215931, "epoch": 1285} {"train_loss": -10.799541473388672, "global_step": 215932, "epoch": 1285} {"train_loss": -11.451421737670898, "global_step": 215933, "epoch": 1285} {"train_loss": -11.314569473266602, "global_step": 215934, "epoch": 1285} {"train_loss": -11.18388557434082, "global_step": 215935, "epoch": 1285} {"train_loss": -11.52363109588623, "global_step": 215936, "epoch": 1285} {"train_loss": -10.966310501098633, "global_step": 215937, "epoch": 1285} {"train_loss": -11.471076965332031, "global_step": 215938, "epoch": 1285} {"train_loss": -11.329654693603516, "global_step": 215939, "epoch": 1285} {"train_loss": -11.187302589416504, "global_step": 215940, "epoch": 1285} {"train_loss": -11.449378967285156, "global_step": 215941, "epoch": 1285} {"train_loss": -11.334720611572266, "global_step": 215942, "epoch": 1285} {"train_loss": -11.232599258422852, "global_step": 215943, "epoch": 1285} {"train_loss": -11.521565437316895, "global_step": 215944, "epoch": 1285} {"train_loss": -11.585046768188477, "global_step": 215945, "epoch": 1285} {"train_loss": -11.512351989746094, "global_step": 215946, "epoch": 1285} {"train_loss": -11.585248947143555, "global_step": 215947, "epoch": 1285} {"train_loss": -11.292917251586914, "global_step": 215948, "epoch": 1285} {"train_loss": -11.332138061523438, "global_step": 215949, "epoch": 1285} {"train_loss": -11.356246948242188, "global_step": 215950, "epoch": 1285} {"train_loss": -11.629478454589844, "global_step": 215951, "epoch": 1285} {"train_loss": -11.517945289611816, "global_step": 215952, "epoch": 1285} {"train_loss": -11.670381546020508, "global_step": 215953, "epoch": 1285} {"train_loss": -11.051852226257324, "global_step": 215954, "epoch": 1285} {"train_loss": -11.700983047485352, "global_step": 215955, "epoch": 1285} {"train_loss": -11.305258750915527, "global_step": 215956, "epoch": 1285} {"train_loss": -11.616641998291016, "global_step": 215957, "epoch": 1285} {"train_loss": -11.406803131103516, "global_step": 215958, "epoch": 1285} {"train_loss": -11.392099380493164, "global_step": 215959, "epoch": 1285} {"train_loss": -11.529420852661133, "global_step": 215960, "epoch": 1285} {"train_loss": -11.301847457885742, "global_step": 215961, "epoch": 1285} {"train_loss": -11.504545211791992, "global_step": 215962, "epoch": 1285} {"train_loss": -11.457414627075195, "global_step": 215963, "epoch": 1285} {"train_loss": -11.122100830078125, "global_step": 215964, "epoch": 1285} {"train_loss": -11.247186660766602, "global_step": 215965, "epoch": 1285} {"train_loss": -11.082010269165039, "global_step": 215966, "epoch": 1285} {"train_loss": -11.443574905395508, "global_step": 215967, "epoch": 1285} {"train_loss": -10.875106811523438, "global_step": 215968, "epoch": 1285} {"train_loss": -11.128429412841797, "global_step": 215969, "epoch": 1285} {"train_loss": -11.107933044433594, "global_step": 215970, "epoch": 1285} {"train_loss": -10.666337013244629, "global_step": 215971, "epoch": 1285} {"train_loss": -10.794683456420898, "global_step": 215972, "epoch": 1285} {"train_loss": -11.29509162902832, "global_step": 215973, "epoch": 1285} {"train_loss": -11.013594627380371, "global_step": 215974, "epoch": 1285} {"train_loss": -11.438600540161133, "global_step": 215975, "epoch": 1285} {"train_loss": -10.999550819396973, "global_step": 215976, "epoch": 1285} {"train_loss": -11.303862571716309, "global_step": 215977, "epoch": 1285} {"train_loss": -11.32837963104248, "global_step": 215978, "epoch": 1285} {"train_loss": -11.566303253173828, "global_step": 215979, "epoch": 1285} {"train_loss": -11.251737594604492, "global_step": 215980, "epoch": 1285} {"train_loss": -11.273773193359375, "global_step": 215981, "epoch": 1285} {"train_loss": -11.233489036560059, "global_step": 215982, "epoch": 1285} {"train_loss": -11.422576904296875, "global_step": 215983, "epoch": 1285} {"train_loss": -11.217842102050781, "global_step": 215984, "epoch": 1285} {"train_loss": -11.349853515625, "global_step": 215985, "epoch": 1285} {"train_loss": -11.65960693359375, "global_step": 215986, "epoch": 1285} {"train_loss": -10.988828659057617, "global_step": 215987, "epoch": 1285} {"train_loss": -11.35329532623291, "global_step": 215988, "epoch": 1285} {"train_loss": -11.183188438415527, "global_step": 215989, "epoch": 1285} {"train_loss": -10.904070854187012, "global_step": 215990, "epoch": 1285} {"train_loss": -11.514665603637695, "global_step": 215991, "epoch": 1285} {"train_loss": -11.37745189666748, "global_step": 215992, "epoch": 1285} {"train_loss": -11.429830551147461, "global_step": 215993, "epoch": 1285} {"train_loss": -11.072575569152832, "global_step": 215994, "epoch": 1285} {"train_loss": -10.788537979125977, "global_step": 215995, "epoch": 1285} {"train_loss": -11.62540054321289, "global_step": 215996, "epoch": 1285} {"train_loss": -11.144464492797852, "global_step": 215997, "epoch": 1285} {"train_loss": -11.505340576171875, "global_step": 215998, "epoch": 1285} {"train_loss": -10.60299015045166, "global_step": 215999, "epoch": 1285} {"train_loss": -11.714010238647461, "global_step": 216000, "epoch": 1285} {"train_loss": -10.842863082885742, "global_step": 216001, "epoch": 1285} {"train_loss": -11.27595043182373, "global_step": 216002, "epoch": 1285} {"train_loss": -11.003883361816406, "global_step": 216003, "epoch": 1285} {"train_loss": -10.96982192993164, "global_step": 216004, "epoch": 1285} {"train_loss": -10.543661117553711, "global_step": 216005, "epoch": 1285} {"train_loss": -10.73781681060791, "global_step": 216006, "epoch": 1285} {"train_loss": -11.06869125366211, "global_step": 216007, "epoch": 1285} {"train_loss": -10.404922485351562, "global_step": 216008, "epoch": 1285} {"train_loss": -10.687806129455566, "global_step": 216009, "epoch": 1285} {"train_loss": -10.842231750488281, "global_step": 216010, "epoch": 1285} {"train_loss": -10.573089599609375, "global_step": 216011, "epoch": 1285} {"train_loss": -10.799640655517578, "global_step": 216012, "epoch": 1285} {"train_loss": -9.871575355529785, "global_step": 216013, "epoch": 1285} {"train_loss": -11.083715438842773, "global_step": 216014, "epoch": 1285} {"train_loss": -10.201087951660156, "global_step": 216015, "epoch": 1285} {"train_loss": -11.103317260742188, "global_step": 216016, "epoch": 1285} {"train_loss": -10.312304496765137, "global_step": 216017, "epoch": 1285} {"train_loss": -10.122114181518555, "global_step": 216018, "epoch": 1285} {"train_loss": -11.006237030029297, "global_step": 216019, "epoch": 1285} {"train_loss": -10.123698234558105, "global_step": 216020, "epoch": 1285} {"train_loss": -11.034799575805664, "global_step": 216021, "epoch": 1285} {"train_loss": -10.920791625976562, "global_step": 216022, "epoch": 1285} {"train_loss": -10.63857650756836, "global_step": 216023, "epoch": 1285} {"train_loss": -10.91562271118164, "global_step": 216024, "epoch": 1285} {"train_loss": -10.500984191894531, "global_step": 216025, "epoch": 1285} {"train_loss": -10.946088790893555, "global_step": 216026, "epoch": 1285} {"train_loss": -10.951109886169434, "global_step": 216027, "epoch": 1285} {"train_loss": -10.697315216064453, "global_step": 216028, "epoch": 1285} {"train_loss": -11.134247779846191, "global_step": 216029, "epoch": 1285} {"train_loss": -11.26405143737793, "global_step": 216030, "epoch": 1285} {"train_loss": -10.74186897277832, "global_step": 216031, "epoch": 1285} {"train_loss": -11.183561325073242, "global_step": 216032, "epoch": 1285} {"train_loss": -11.024445533752441, "global_step": 216033, "epoch": 1285} {"train_loss": -10.502294540405273, "global_step": 216034, "epoch": 1285} {"train_loss": -11.218952178955078, "global_step": 216035, "epoch": 1285} {"train_loss": -11.130597114562988, "global_step": 216036, "epoch": 1285} {"train_loss": -10.841489791870117, "global_step": 216037, "epoch": 1285} {"train_loss": -11.399520874023438, "global_step": 216038, "epoch": 1285} {"train_loss": -11.067033767700195, "global_step": 216039, "epoch": 1285} {"train_loss": -11.035665512084961, "global_step": 216040, "epoch": 1285} {"train_loss": -11.30363655090332, "global_step": 216041, "epoch": 1285} {"train_loss": -11.21662712097168, "global_step": 216042, "epoch": 1285} {"train_loss": -11.149945259094238, "global_step": 216043, "epoch": 1285} {"train_loss": -11.389188766479492, "global_step": 216044, "epoch": 1285} {"train_loss": -11.421621322631836, "global_step": 216045, "epoch": 1285} {"train_loss": -10.964282989501953, "global_step": 216046, "epoch": 1285} {"train_loss": -11.166581619353522, "global_step": 216047, "epoch": 1285, "val_loss": 257374.703125, "train_action_mse_error": 0.41463279724121094} {"train_loss": -11.560601234436035, "global_step": 216048, "epoch": 1286} {"train_loss": -11.099515914916992, "global_step": 216049, "epoch": 1286} {"train_loss": -11.499408721923828, "global_step": 216050, "epoch": 1286} {"train_loss": -11.579145431518555, "global_step": 216051, "epoch": 1286} {"train_loss": -11.161458015441895, "global_step": 216052, "epoch": 1286} {"train_loss": -11.424281120300293, "global_step": 216053, "epoch": 1286} {"train_loss": -11.49863052368164, "global_step": 216054, "epoch": 1286} {"train_loss": -11.710602760314941, "global_step": 216055, "epoch": 1286} {"train_loss": -11.498462677001953, "global_step": 216056, "epoch": 1286} {"train_loss": -11.548038482666016, "global_step": 216057, "epoch": 1286} {"train_loss": -11.623327255249023, "global_step": 216058, "epoch": 1286} {"train_loss": -11.583030700683594, "global_step": 216059, "epoch": 1286} {"train_loss": -11.738910675048828, "global_step": 216060, "epoch": 1286} {"train_loss": -11.641253471374512, "global_step": 216061, "epoch": 1286} {"train_loss": -11.636826515197754, "global_step": 216062, "epoch": 1286} {"train_loss": -11.76168441772461, "global_step": 216063, "epoch": 1286} {"train_loss": -11.722847938537598, "global_step": 216064, "epoch": 1286} {"train_loss": -11.679947853088379, "global_step": 216065, "epoch": 1286} {"train_loss": -11.678325653076172, "global_step": 216066, "epoch": 1286} {"train_loss": -11.64025592803955, "global_step": 216067, "epoch": 1286} {"train_loss": -11.688408851623535, "global_step": 216068, "epoch": 1286} {"train_loss": -11.630005836486816, "global_step": 216069, "epoch": 1286} {"train_loss": -11.825737953186035, "global_step": 216070, "epoch": 1286} {"train_loss": -11.314720153808594, "global_step": 216071, "epoch": 1286} {"train_loss": -11.756143569946289, "global_step": 216072, "epoch": 1286} {"train_loss": -11.581802368164062, "global_step": 216073, "epoch": 1286} {"train_loss": -11.887228965759277, "global_step": 216074, "epoch": 1286} {"train_loss": -11.699779510498047, "global_step": 216075, "epoch": 1286} {"train_loss": -11.75550651550293, "global_step": 216076, "epoch": 1286} {"train_loss": -11.965909957885742, "global_step": 216077, "epoch": 1286} {"train_loss": -11.632658004760742, "global_step": 216078, "epoch": 1286} {"train_loss": -11.768770217895508, "global_step": 216079, "epoch": 1286} {"train_loss": -11.481158256530762, "global_step": 216080, "epoch": 1286} {"train_loss": -11.721672058105469, "global_step": 216081, "epoch": 1286} {"train_loss": -11.835925102233887, "global_step": 216082, "epoch": 1286} {"train_loss": -11.863990783691406, "global_step": 216083, "epoch": 1286} {"train_loss": -12.005029678344727, "global_step": 216084, "epoch": 1286} {"train_loss": -11.689817428588867, "global_step": 216085, "epoch": 1286} {"train_loss": -11.483223915100098, "global_step": 216086, "epoch": 1286} {"train_loss": -11.535197257995605, "global_step": 216087, "epoch": 1286} {"train_loss": -11.804498672485352, "global_step": 216088, "epoch": 1286} {"train_loss": -11.908671379089355, "global_step": 216089, "epoch": 1286} {"train_loss": -11.657770156860352, "global_step": 216090, "epoch": 1286} {"train_loss": -11.83188247680664, "global_step": 216091, "epoch": 1286} {"train_loss": -11.570362091064453, "global_step": 216092, "epoch": 1286} {"train_loss": -12.118003845214844, "global_step": 216093, "epoch": 1286} {"train_loss": -11.535001754760742, "global_step": 216094, "epoch": 1286} {"train_loss": -11.895967483520508, "global_step": 216095, "epoch": 1286} {"train_loss": -11.852458000183105, "global_step": 216096, "epoch": 1286} {"train_loss": -11.625011444091797, "global_step": 216097, "epoch": 1286} {"train_loss": -11.844829559326172, "global_step": 216098, "epoch": 1286} {"train_loss": -11.755165100097656, "global_step": 216099, "epoch": 1286} {"train_loss": -12.093814849853516, "global_step": 216100, "epoch": 1286} {"train_loss": -11.721399307250977, "global_step": 216101, "epoch": 1286} {"train_loss": -11.763175010681152, "global_step": 216102, "epoch": 1286} {"train_loss": -11.835227966308594, "global_step": 216103, "epoch": 1286} {"train_loss": -11.717052459716797, "global_step": 216104, "epoch": 1286} {"train_loss": -11.911771774291992, "global_step": 216105, "epoch": 1286} {"train_loss": -11.726449966430664, "global_step": 216106, "epoch": 1286} {"train_loss": -11.696737289428711, "global_step": 216107, "epoch": 1286} {"train_loss": -11.560332298278809, "global_step": 216108, "epoch": 1286} {"train_loss": -11.772478103637695, "global_step": 216109, "epoch": 1286} {"train_loss": -11.694283485412598, "global_step": 216110, "epoch": 1286} {"train_loss": -12.030412673950195, "global_step": 216111, "epoch": 1286} {"train_loss": -11.51713752746582, "global_step": 216112, "epoch": 1286} {"train_loss": -11.321405410766602, "global_step": 216113, "epoch": 1286} {"train_loss": -11.166685104370117, "global_step": 216114, "epoch": 1286} {"train_loss": -11.266756057739258, "global_step": 216115, "epoch": 1286} {"train_loss": -11.329381942749023, "global_step": 216116, "epoch": 1286} {"train_loss": -11.292675018310547, "global_step": 216117, "epoch": 1286} {"train_loss": -11.40291976928711, "global_step": 216118, "epoch": 1286} {"train_loss": -11.741349220275879, "global_step": 216119, "epoch": 1286} {"train_loss": -11.445880889892578, "global_step": 216120, "epoch": 1286} {"train_loss": -11.413372993469238, "global_step": 216121, "epoch": 1286} {"train_loss": -11.446647644042969, "global_step": 216122, "epoch": 1286} {"train_loss": -11.708545684814453, "global_step": 216123, "epoch": 1286} {"train_loss": -10.853126525878906, "global_step": 216124, "epoch": 1286} {"train_loss": -11.387340545654297, "global_step": 216125, "epoch": 1286} {"train_loss": -10.917595863342285, "global_step": 216126, "epoch": 1286} {"train_loss": -11.10502815246582, "global_step": 216127, "epoch": 1286} {"train_loss": -10.88682746887207, "global_step": 216128, "epoch": 1286} {"train_loss": -9.196783065795898, "global_step": 216129, "epoch": 1286} {"train_loss": -11.25594711303711, "global_step": 216130, "epoch": 1286} {"train_loss": -10.42319107055664, "global_step": 216131, "epoch": 1286} {"train_loss": -10.986634254455566, "global_step": 216132, "epoch": 1286} {"train_loss": -11.153299331665039, "global_step": 216133, "epoch": 1286} {"train_loss": -10.376007080078125, "global_step": 216134, "epoch": 1286} {"train_loss": -10.480871200561523, "global_step": 216135, "epoch": 1286} {"train_loss": -10.641797065734863, "global_step": 216136, "epoch": 1286} {"train_loss": -10.049004554748535, "global_step": 216137, "epoch": 1286} {"train_loss": -10.856948852539062, "global_step": 216138, "epoch": 1286} {"train_loss": -10.345306396484375, "global_step": 216139, "epoch": 1286} {"train_loss": -11.137619018554688, "global_step": 216140, "epoch": 1286} {"train_loss": -10.975249290466309, "global_step": 216141, "epoch": 1286} {"train_loss": -11.154632568359375, "global_step": 216142, "epoch": 1286} {"train_loss": -11.764469146728516, "global_step": 216143, "epoch": 1286} {"train_loss": -10.986639022827148, "global_step": 216144, "epoch": 1286} {"train_loss": -10.801270484924316, "global_step": 216145, "epoch": 1286} {"train_loss": -10.700345993041992, "global_step": 216146, "epoch": 1286} {"train_loss": -10.716651916503906, "global_step": 216147, "epoch": 1286} {"train_loss": -10.820640563964844, "global_step": 216148, "epoch": 1286} {"train_loss": -11.10074520111084, "global_step": 216149, "epoch": 1286} {"train_loss": -11.015825271606445, "global_step": 216150, "epoch": 1286} {"train_loss": -11.13210678100586, "global_step": 216151, "epoch": 1286} {"train_loss": -11.15978717803955, "global_step": 216152, "epoch": 1286} {"train_loss": -11.292116165161133, "global_step": 216153, "epoch": 1286} {"train_loss": -11.264382362365723, "global_step": 216154, "epoch": 1286} {"train_loss": -11.226883888244629, "global_step": 216155, "epoch": 1286} {"train_loss": -11.294469833374023, "global_step": 216156, "epoch": 1286} {"train_loss": -11.178014755249023, "global_step": 216157, "epoch": 1286} {"train_loss": -11.221502304077148, "global_step": 216158, "epoch": 1286} {"train_loss": -11.028518676757812, "global_step": 216159, "epoch": 1286} {"train_loss": -11.421110153198242, "global_step": 216160, "epoch": 1286} {"train_loss": -11.156861305236816, "global_step": 216161, "epoch": 1286} {"train_loss": -11.16318416595459, "global_step": 216162, "epoch": 1286} {"train_loss": -11.380711555480957, "global_step": 216163, "epoch": 1286} {"train_loss": -11.09289836883545, "global_step": 216164, "epoch": 1286} {"train_loss": -11.165117263793945, "global_step": 216165, "epoch": 1286} {"train_loss": -11.301454544067383, "global_step": 216166, "epoch": 1286} {"train_loss": -11.285199165344238, "global_step": 216167, "epoch": 1286} {"train_loss": -11.548164367675781, "global_step": 216168, "epoch": 1286} {"train_loss": -11.334553718566895, "global_step": 216169, "epoch": 1286} {"train_loss": -11.16099739074707, "global_step": 216170, "epoch": 1286} {"train_loss": -11.268068313598633, "global_step": 216171, "epoch": 1286} {"train_loss": -11.223312377929688, "global_step": 216172, "epoch": 1286} {"train_loss": -11.501765251159668, "global_step": 216173, "epoch": 1286} {"train_loss": -11.318201065063477, "global_step": 216174, "epoch": 1286} {"train_loss": -11.090435028076172, "global_step": 216175, "epoch": 1286} {"train_loss": -11.271595001220703, "global_step": 216176, "epoch": 1286} {"train_loss": -11.419293403625488, "global_step": 216177, "epoch": 1286} {"train_loss": -11.538705825805664, "global_step": 216178, "epoch": 1286} {"train_loss": -11.540843963623047, "global_step": 216179, "epoch": 1286} {"train_loss": -11.376252174377441, "global_step": 216180, "epoch": 1286} {"train_loss": -11.70819091796875, "global_step": 216181, "epoch": 1286} {"train_loss": -11.500192642211914, "global_step": 216182, "epoch": 1286} {"train_loss": -11.588886260986328, "global_step": 216183, "epoch": 1286} {"train_loss": -11.703737258911133, "global_step": 216184, "epoch": 1286} {"train_loss": -11.710850715637207, "global_step": 216185, "epoch": 1286} {"train_loss": -11.598608016967773, "global_step": 216186, "epoch": 1286} {"train_loss": -11.408422470092773, "global_step": 216187, "epoch": 1286} {"train_loss": -11.7781982421875, "global_step": 216188, "epoch": 1286} {"train_loss": -11.52900218963623, "global_step": 216189, "epoch": 1286} {"train_loss": -11.62686538696289, "global_step": 216190, "epoch": 1286} {"train_loss": -11.618818283081055, "global_step": 216191, "epoch": 1286} {"train_loss": -11.51922607421875, "global_step": 216192, "epoch": 1286} {"train_loss": -11.790417671203613, "global_step": 216193, "epoch": 1286} {"train_loss": -11.495341300964355, "global_step": 216194, "epoch": 1286} {"train_loss": -11.821413040161133, "global_step": 216195, "epoch": 1286} {"train_loss": -11.783495903015137, "global_step": 216196, "epoch": 1286} {"train_loss": -11.899070739746094, "global_step": 216197, "epoch": 1286} {"train_loss": -11.70241928100586, "global_step": 216198, "epoch": 1286} {"train_loss": -11.896126747131348, "global_step": 216199, "epoch": 1286} {"train_loss": -11.741405487060547, "global_step": 216200, "epoch": 1286} {"train_loss": -12.059743881225586, "global_step": 216201, "epoch": 1286} {"train_loss": -11.905403137207031, "global_step": 216202, "epoch": 1286} {"train_loss": -11.731328964233398, "global_step": 216203, "epoch": 1286} {"train_loss": -11.817682266235352, "global_step": 216204, "epoch": 1286} {"train_loss": -11.84548568725586, "global_step": 216205, "epoch": 1286} {"train_loss": -11.96989631652832, "global_step": 216206, "epoch": 1286} {"train_loss": -11.792644500732422, "global_step": 216207, "epoch": 1286} {"train_loss": -11.563814163208008, "global_step": 216208, "epoch": 1286} {"train_loss": -12.021957397460938, "global_step": 216209, "epoch": 1286} {"train_loss": -11.651407241821289, "global_step": 216210, "epoch": 1286} {"train_loss": -11.450139999389648, "global_step": 216211, "epoch": 1286} {"train_loss": -11.90142822265625, "global_step": 216212, "epoch": 1286} {"train_loss": -11.618505477905273, "global_step": 216213, "epoch": 1286} {"train_loss": -11.550323486328125, "global_step": 216214, "epoch": 1286} {"train_loss": -11.46490504628136, "global_step": 216215, "epoch": 1286, "val_loss": 257039.53125} {"train_loss": -10.456055641174316, "global_step": 216216, "epoch": 1287} {"train_loss": -11.268316268920898, "global_step": 216217, "epoch": 1287} {"train_loss": -11.711416244506836, "global_step": 216218, "epoch": 1287} {"train_loss": -10.82550048828125, "global_step": 216219, "epoch": 1287} {"train_loss": -11.560465812683105, "global_step": 216220, "epoch": 1287} {"train_loss": -11.270755767822266, "global_step": 216221, "epoch": 1287} {"train_loss": -11.712076187133789, "global_step": 216222, "epoch": 1287} {"train_loss": -11.55435562133789, "global_step": 216223, "epoch": 1287} {"train_loss": -11.580507278442383, "global_step": 216224, "epoch": 1287} {"train_loss": -11.324909210205078, "global_step": 216225, "epoch": 1287} {"train_loss": -11.57935619354248, "global_step": 216226, "epoch": 1287} {"train_loss": -11.301536560058594, "global_step": 216227, "epoch": 1287} {"train_loss": -11.149517059326172, "global_step": 216228, "epoch": 1287} {"train_loss": -11.538213729858398, "global_step": 216229, "epoch": 1287} {"train_loss": -10.409969329833984, "global_step": 216230, "epoch": 1287} {"train_loss": -11.422931671142578, "global_step": 216231, "epoch": 1287} {"train_loss": -10.52933120727539, "global_step": 216232, "epoch": 1287} {"train_loss": -10.284189224243164, "global_step": 216233, "epoch": 1287} {"train_loss": -11.170987129211426, "global_step": 216234, "epoch": 1287} {"train_loss": -9.97802448272705, "global_step": 216235, "epoch": 1287} {"train_loss": -10.311929702758789, "global_step": 216236, "epoch": 1287} {"train_loss": -9.921622276306152, "global_step": 216237, "epoch": 1287} {"train_loss": -11.234158515930176, "global_step": 216238, "epoch": 1287} {"train_loss": -10.530017852783203, "global_step": 216239, "epoch": 1287} {"train_loss": -10.945745468139648, "global_step": 216240, "epoch": 1287} {"train_loss": -10.87972354888916, "global_step": 216241, "epoch": 1287} {"train_loss": -10.402837753295898, "global_step": 216242, "epoch": 1287} {"train_loss": -11.136724472045898, "global_step": 216243, "epoch": 1287} {"train_loss": -11.093358039855957, "global_step": 216244, "epoch": 1287} {"train_loss": -10.91408634185791, "global_step": 216245, "epoch": 1287} {"train_loss": -11.488950729370117, "global_step": 216246, "epoch": 1287} {"train_loss": -10.958580017089844, "global_step": 216247, "epoch": 1287} {"train_loss": -11.40257453918457, "global_step": 216248, "epoch": 1287} {"train_loss": -11.281949996948242, "global_step": 216249, "epoch": 1287} {"train_loss": -11.358563423156738, "global_step": 216250, "epoch": 1287} {"train_loss": -11.483296394348145, "global_step": 216251, "epoch": 1287} {"train_loss": -11.249228477478027, "global_step": 216252, "epoch": 1287} {"train_loss": -11.362863540649414, "global_step": 216253, "epoch": 1287} {"train_loss": -11.31264877319336, "global_step": 216254, "epoch": 1287} {"train_loss": -11.451946258544922, "global_step": 216255, "epoch": 1287} {"train_loss": -11.088014602661133, "global_step": 216256, "epoch": 1287} {"train_loss": -11.55069351196289, "global_step": 216257, "epoch": 1287} {"train_loss": -11.075300216674805, "global_step": 216258, "epoch": 1287} {"train_loss": -10.920600891113281, "global_step": 216259, "epoch": 1287} {"train_loss": -11.09243392944336, "global_step": 216260, "epoch": 1287} {"train_loss": -11.031990051269531, "global_step": 216261, "epoch": 1287} {"train_loss": -11.384488105773926, "global_step": 216262, "epoch": 1287} {"train_loss": -11.084678649902344, "global_step": 216263, "epoch": 1287} {"train_loss": -11.402120590209961, "global_step": 216264, "epoch": 1287} {"train_loss": -11.21281623840332, "global_step": 216265, "epoch": 1287} {"train_loss": -11.105060577392578, "global_step": 216266, "epoch": 1287} {"train_loss": -11.247663497924805, "global_step": 216267, "epoch": 1287} {"train_loss": -11.095251083374023, "global_step": 216268, "epoch": 1287} {"train_loss": -11.164417266845703, "global_step": 216269, "epoch": 1287} {"train_loss": -11.386133193969727, "global_step": 216270, "epoch": 1287} {"train_loss": -11.341075897216797, "global_step": 216271, "epoch": 1287} {"train_loss": -11.586315155029297, "global_step": 216272, "epoch": 1287} {"train_loss": -11.024547576904297, "global_step": 216273, "epoch": 1287} {"train_loss": -11.140032768249512, "global_step": 216274, "epoch": 1287} {"train_loss": -11.330318450927734, "global_step": 216275, "epoch": 1287} {"train_loss": -11.131067276000977, "global_step": 216276, "epoch": 1287} {"train_loss": -11.224018096923828, "global_step": 216277, "epoch": 1287} {"train_loss": -11.168034553527832, "global_step": 216278, "epoch": 1287} {"train_loss": -11.402215957641602, "global_step": 216279, "epoch": 1287} {"train_loss": -10.654136657714844, "global_step": 216280, "epoch": 1287} {"train_loss": -11.067821502685547, "global_step": 216281, "epoch": 1287} {"train_loss": -10.854022979736328, "global_step": 216282, "epoch": 1287} {"train_loss": -11.089034080505371, "global_step": 216283, "epoch": 1287} {"train_loss": -11.495079040527344, "global_step": 216284, "epoch": 1287} {"train_loss": -11.159507751464844, "global_step": 216285, "epoch": 1287} {"train_loss": -11.772256851196289, "global_step": 216286, "epoch": 1287} {"train_loss": -11.155684471130371, "global_step": 216287, "epoch": 1287} {"train_loss": -11.742169380187988, "global_step": 216288, "epoch": 1287} {"train_loss": -11.370187759399414, "global_step": 216289, "epoch": 1287} {"train_loss": -11.188907623291016, "global_step": 216290, "epoch": 1287} {"train_loss": -11.507360458374023, "global_step": 216291, "epoch": 1287} {"train_loss": -11.27369499206543, "global_step": 216292, "epoch": 1287} {"train_loss": -11.342294692993164, "global_step": 216293, "epoch": 1287} {"train_loss": -11.123873710632324, "global_step": 216294, "epoch": 1287} {"train_loss": -11.381043434143066, "global_step": 216295, "epoch": 1287} {"train_loss": -11.652708053588867, "global_step": 216296, "epoch": 1287} {"train_loss": -10.913191795349121, "global_step": 216297, "epoch": 1287} {"train_loss": -11.774590492248535, "global_step": 216298, "epoch": 1287} {"train_loss": -11.203624725341797, "global_step": 216299, "epoch": 1287} {"train_loss": -11.746566772460938, "global_step": 216300, "epoch": 1287} {"train_loss": -11.160734176635742, "global_step": 216301, "epoch": 1287} {"train_loss": -11.601380348205566, "global_step": 216302, "epoch": 1287} {"train_loss": -11.692421913146973, "global_step": 216303, "epoch": 1287} {"train_loss": -11.654788970947266, "global_step": 216304, "epoch": 1287} {"train_loss": -11.823579788208008, "global_step": 216305, "epoch": 1287} {"train_loss": -11.741168022155762, "global_step": 216306, "epoch": 1287} {"train_loss": -11.817953109741211, "global_step": 216307, "epoch": 1287} {"train_loss": -11.750150680541992, "global_step": 216308, "epoch": 1287} {"train_loss": -11.679702758789062, "global_step": 216309, "epoch": 1287} {"train_loss": -11.811493873596191, "global_step": 216310, "epoch": 1287} {"train_loss": -11.763456344604492, "global_step": 216311, "epoch": 1287} {"train_loss": -11.895830154418945, "global_step": 216312, "epoch": 1287} {"train_loss": -11.720560073852539, "global_step": 216313, "epoch": 1287} {"train_loss": -11.864206314086914, "global_step": 216314, "epoch": 1287} {"train_loss": -11.913765907287598, "global_step": 216315, "epoch": 1287} {"train_loss": -11.711633682250977, "global_step": 216316, "epoch": 1287} {"train_loss": -11.825401306152344, "global_step": 216317, "epoch": 1287} {"train_loss": -11.790633201599121, "global_step": 216318, "epoch": 1287} {"train_loss": -11.994340896606445, "global_step": 216319, "epoch": 1287} {"train_loss": -11.72285270690918, "global_step": 216320, "epoch": 1287} {"train_loss": -11.738429069519043, "global_step": 216321, "epoch": 1287} {"train_loss": -11.931215286254883, "global_step": 216322, "epoch": 1287} {"train_loss": -12.028815269470215, "global_step": 216323, "epoch": 1287} {"train_loss": -11.842781066894531, "global_step": 216324, "epoch": 1287} {"train_loss": -11.88474178314209, "global_step": 216325, "epoch": 1287} {"train_loss": -11.739468574523926, "global_step": 216326, "epoch": 1287} {"train_loss": -11.934980392456055, "global_step": 216327, "epoch": 1287} {"train_loss": -11.814493179321289, "global_step": 216328, "epoch": 1287} {"train_loss": -11.833356857299805, "global_step": 216329, "epoch": 1287} {"train_loss": -11.69639778137207, "global_step": 216330, "epoch": 1287} {"train_loss": -12.126368522644043, "global_step": 216331, "epoch": 1287} {"train_loss": -12.019804000854492, "global_step": 216332, "epoch": 1287} {"train_loss": -11.411380767822266, "global_step": 216333, "epoch": 1287} {"train_loss": -12.029727935791016, "global_step": 216334, "epoch": 1287} {"train_loss": -11.749542236328125, "global_step": 216335, "epoch": 1287} {"train_loss": -11.617057800292969, "global_step": 216336, "epoch": 1287} {"train_loss": -11.634817123413086, "global_step": 216337, "epoch": 1287} {"train_loss": -11.90618896484375, "global_step": 216338, "epoch": 1287} {"train_loss": -11.535392761230469, "global_step": 216339, "epoch": 1287} {"train_loss": -11.202119827270508, "global_step": 216340, "epoch": 1287} {"train_loss": -11.452402114868164, "global_step": 216341, "epoch": 1287} {"train_loss": -11.775442123413086, "global_step": 216342, "epoch": 1287} {"train_loss": -11.283415794372559, "global_step": 216343, "epoch": 1287} {"train_loss": -11.549683570861816, "global_step": 216344, "epoch": 1287} {"train_loss": -11.26498031616211, "global_step": 216345, "epoch": 1287} {"train_loss": -11.664117813110352, "global_step": 216346, "epoch": 1287} {"train_loss": -11.22331428527832, "global_step": 216347, "epoch": 1287} {"train_loss": -11.50766372680664, "global_step": 216348, "epoch": 1287} {"train_loss": -11.478596687316895, "global_step": 216349, "epoch": 1287} {"train_loss": -11.538629531860352, "global_step": 216350, "epoch": 1287} {"train_loss": -11.56818962097168, "global_step": 216351, "epoch": 1287} {"train_loss": -11.450545310974121, "global_step": 216352, "epoch": 1287} {"train_loss": -11.839637756347656, "global_step": 216353, "epoch": 1287} {"train_loss": -11.170573234558105, "global_step": 216354, "epoch": 1287} {"train_loss": -11.546646118164062, "global_step": 216355, "epoch": 1287} {"train_loss": -11.412541389465332, "global_step": 216356, "epoch": 1287} {"train_loss": -10.450907707214355, "global_step": 216357, "epoch": 1287} {"train_loss": -11.486824035644531, "global_step": 216358, "epoch": 1287} {"train_loss": -10.920820236206055, "global_step": 216359, "epoch": 1287} {"train_loss": -9.510392189025879, "global_step": 216360, "epoch": 1287} {"train_loss": -11.0028076171875, "global_step": 216361, "epoch": 1287} {"train_loss": -10.42339038848877, "global_step": 216362, "epoch": 1287} {"train_loss": -7.901497840881348, "global_step": 216363, "epoch": 1287} {"train_loss": -10.715789794921875, "global_step": 216364, "epoch": 1287} {"train_loss": -9.650712966918945, "global_step": 216365, "epoch": 1287} {"train_loss": -10.673534393310547, "global_step": 216366, "epoch": 1287} {"train_loss": -10.511573791503906, "global_step": 216367, "epoch": 1287} {"train_loss": -10.925153732299805, "global_step": 216368, "epoch": 1287} {"train_loss": -11.065762519836426, "global_step": 216369, "epoch": 1287} {"train_loss": -11.196023941040039, "global_step": 216370, "epoch": 1287} {"train_loss": -10.994479179382324, "global_step": 216371, "epoch": 1287} {"train_loss": -11.43203353881836, "global_step": 216372, "epoch": 1287} {"train_loss": -11.17150592803955, "global_step": 216373, "epoch": 1287} {"train_loss": -11.314491271972656, "global_step": 216374, "epoch": 1287} {"train_loss": -11.047100067138672, "global_step": 216375, "epoch": 1287} {"train_loss": -11.049094200134277, "global_step": 216376, "epoch": 1287} {"train_loss": -11.380450248718262, "global_step": 216377, "epoch": 1287} {"train_loss": -11.084797859191895, "global_step": 216378, "epoch": 1287} {"train_loss": -11.715316772460938, "global_step": 216379, "epoch": 1287} {"train_loss": -11.324970245361328, "global_step": 216380, "epoch": 1287} {"train_loss": -11.268171310424805, "global_step": 216381, "epoch": 1287} {"train_loss": -11.312313079833984, "global_step": 216382, "epoch": 1287} {"train_loss": -11.291330002603077, "global_step": 216383, "epoch": 1287, "val_loss": 255386.46875} {"train_loss": -11.339353561401367, "global_step": 216384, "epoch": 1288} {"train_loss": -11.317626953125, "global_step": 216385, "epoch": 1288} {"train_loss": -11.235239028930664, "global_step": 216386, "epoch": 1288} {"train_loss": -11.32065200805664, "global_step": 216387, "epoch": 1288} {"train_loss": -11.56021785736084, "global_step": 216388, "epoch": 1288} {"train_loss": -11.269140243530273, "global_step": 216389, "epoch": 1288} {"train_loss": -11.706704139709473, "global_step": 216390, "epoch": 1288} {"train_loss": -11.403566360473633, "global_step": 216391, "epoch": 1288} {"train_loss": -11.074358940124512, "global_step": 216392, "epoch": 1288} {"train_loss": -11.688394546508789, "global_step": 216393, "epoch": 1288} {"train_loss": -11.424846649169922, "global_step": 216394, "epoch": 1288} {"train_loss": -11.599023818969727, "global_step": 216395, "epoch": 1288} {"train_loss": -11.613369941711426, "global_step": 216396, "epoch": 1288} {"train_loss": -11.494356155395508, "global_step": 216397, "epoch": 1288} {"train_loss": -11.599139213562012, "global_step": 216398, "epoch": 1288} {"train_loss": -11.714975357055664, "global_step": 216399, "epoch": 1288} {"train_loss": -11.306880950927734, "global_step": 216400, "epoch": 1288} {"train_loss": -11.683323860168457, "global_step": 216401, "epoch": 1288} {"train_loss": -11.678054809570312, "global_step": 216402, "epoch": 1288} {"train_loss": -11.344112396240234, "global_step": 216403, "epoch": 1288} {"train_loss": -11.771951675415039, "global_step": 216404, "epoch": 1288} {"train_loss": -11.537240982055664, "global_step": 216405, "epoch": 1288} {"train_loss": -11.462767601013184, "global_step": 216406, "epoch": 1288} {"train_loss": -11.597408294677734, "global_step": 216407, "epoch": 1288} {"train_loss": -11.455677032470703, "global_step": 216408, "epoch": 1288} {"train_loss": -11.741069793701172, "global_step": 216409, "epoch": 1288} {"train_loss": -11.660483360290527, "global_step": 216410, "epoch": 1288} {"train_loss": -11.592445373535156, "global_step": 216411, "epoch": 1288} {"train_loss": -11.668078422546387, "global_step": 216412, "epoch": 1288} {"train_loss": -11.416032791137695, "global_step": 216413, "epoch": 1288} {"train_loss": -11.580938339233398, "global_step": 216414, "epoch": 1288} {"train_loss": -11.530549049377441, "global_step": 216415, "epoch": 1288} {"train_loss": -11.420236587524414, "global_step": 216416, "epoch": 1288} {"train_loss": -11.341626167297363, "global_step": 216417, "epoch": 1288} {"train_loss": -11.372639656066895, "global_step": 216418, "epoch": 1288} {"train_loss": -11.801980972290039, "global_step": 216419, "epoch": 1288} {"train_loss": -11.28813648223877, "global_step": 216420, "epoch": 1288} {"train_loss": -11.566652297973633, "global_step": 216421, "epoch": 1288} {"train_loss": -11.870515823364258, "global_step": 216422, "epoch": 1288} {"train_loss": -11.082472801208496, "global_step": 216423, "epoch": 1288} {"train_loss": -11.14179515838623, "global_step": 216424, "epoch": 1288} {"train_loss": -11.336694717407227, "global_step": 216425, "epoch": 1288} {"train_loss": -11.206376075744629, "global_step": 216426, "epoch": 1288} {"train_loss": -10.360247611999512, "global_step": 216427, "epoch": 1288} {"train_loss": -11.522196769714355, "global_step": 216428, "epoch": 1288} {"train_loss": -10.954545974731445, "global_step": 216429, "epoch": 1288} {"train_loss": -10.88232421875, "global_step": 216430, "epoch": 1288} {"train_loss": -11.598281860351562, "global_step": 216431, "epoch": 1288} {"train_loss": -10.742565155029297, "global_step": 216432, "epoch": 1288} {"train_loss": -10.680756568908691, "global_step": 216433, "epoch": 1288} {"train_loss": -11.410085678100586, "global_step": 216434, "epoch": 1288} {"train_loss": -9.968563079833984, "global_step": 216435, "epoch": 1288} {"train_loss": -11.574882507324219, "global_step": 216436, "epoch": 1288} {"train_loss": -10.475841522216797, "global_step": 216437, "epoch": 1288} {"train_loss": -10.766429901123047, "global_step": 216438, "epoch": 1288} {"train_loss": -11.276366233825684, "global_step": 216439, "epoch": 1288} {"train_loss": -10.595029830932617, "global_step": 216440, "epoch": 1288} {"train_loss": -11.711135864257812, "global_step": 216441, "epoch": 1288} {"train_loss": -10.511995315551758, "global_step": 216442, "epoch": 1288} {"train_loss": -11.372886657714844, "global_step": 216443, "epoch": 1288} {"train_loss": -10.689336776733398, "global_step": 216444, "epoch": 1288} {"train_loss": -11.092753410339355, "global_step": 216445, "epoch": 1288} {"train_loss": -11.260307312011719, "global_step": 216446, "epoch": 1288} {"train_loss": -10.39468002319336, "global_step": 216447, "epoch": 1288} {"train_loss": -11.480536460876465, "global_step": 216448, "epoch": 1288} {"train_loss": -10.636837005615234, "global_step": 216449, "epoch": 1288} {"train_loss": -11.035539627075195, "global_step": 216450, "epoch": 1288} {"train_loss": -11.112200736999512, "global_step": 216451, "epoch": 1288} {"train_loss": -10.426780700683594, "global_step": 216452, "epoch": 1288} {"train_loss": -11.543512344360352, "global_step": 216453, "epoch": 1288} {"train_loss": -10.564775466918945, "global_step": 216454, "epoch": 1288} {"train_loss": -11.027884483337402, "global_step": 216455, "epoch": 1288} {"train_loss": -11.402551651000977, "global_step": 216456, "epoch": 1288} {"train_loss": -11.061336517333984, "global_step": 216457, "epoch": 1288} {"train_loss": -11.280200004577637, "global_step": 216458, "epoch": 1288} {"train_loss": -11.261519432067871, "global_step": 216459, "epoch": 1288} {"train_loss": -10.914763450622559, "global_step": 216460, "epoch": 1288} {"train_loss": -11.332435607910156, "global_step": 216461, "epoch": 1288} {"train_loss": -11.036396026611328, "global_step": 216462, "epoch": 1288} {"train_loss": -10.760997772216797, "global_step": 216463, "epoch": 1288} {"train_loss": -10.82171630859375, "global_step": 216464, "epoch": 1288} {"train_loss": -10.542397499084473, "global_step": 216465, "epoch": 1288} {"train_loss": -11.063448905944824, "global_step": 216466, "epoch": 1288} {"train_loss": -11.407161712646484, "global_step": 216467, "epoch": 1288} {"train_loss": -10.856340408325195, "global_step": 216468, "epoch": 1288} {"train_loss": -10.820637702941895, "global_step": 216469, "epoch": 1288} {"train_loss": -11.072582244873047, "global_step": 216470, "epoch": 1288} {"train_loss": -10.840011596679688, "global_step": 216471, "epoch": 1288} {"train_loss": -11.335724830627441, "global_step": 216472, "epoch": 1288} {"train_loss": -10.758255004882812, "global_step": 216473, "epoch": 1288} {"train_loss": -11.345013618469238, "global_step": 216474, "epoch": 1288} {"train_loss": -10.685101509094238, "global_step": 216475, "epoch": 1288} {"train_loss": -11.075551986694336, "global_step": 216476, "epoch": 1288} {"train_loss": -10.714223861694336, "global_step": 216477, "epoch": 1288} {"train_loss": -11.07300853729248, "global_step": 216478, "epoch": 1288} {"train_loss": -10.941906929016113, "global_step": 216479, "epoch": 1288} {"train_loss": -11.33468246459961, "global_step": 216480, "epoch": 1288} {"train_loss": -11.362936019897461, "global_step": 216481, "epoch": 1288} {"train_loss": -11.355691909790039, "global_step": 216482, "epoch": 1288} {"train_loss": -11.398292541503906, "global_step": 216483, "epoch": 1288} {"train_loss": -11.408295631408691, "global_step": 216484, "epoch": 1288} {"train_loss": -11.418731689453125, "global_step": 216485, "epoch": 1288} {"train_loss": -11.455564498901367, "global_step": 216486, "epoch": 1288} {"train_loss": -11.08497428894043, "global_step": 216487, "epoch": 1288} {"train_loss": -11.247869491577148, "global_step": 216488, "epoch": 1288} {"train_loss": -11.465655326843262, "global_step": 216489, "epoch": 1288} {"train_loss": -11.396900177001953, "global_step": 216490, "epoch": 1288} {"train_loss": -11.485715866088867, "global_step": 216491, "epoch": 1288} {"train_loss": -11.248205184936523, "global_step": 216492, "epoch": 1288} {"train_loss": -11.65015983581543, "global_step": 216493, "epoch": 1288} {"train_loss": -11.238822937011719, "global_step": 216494, "epoch": 1288} {"train_loss": -11.661493301391602, "global_step": 216495, "epoch": 1288} {"train_loss": -11.243607521057129, "global_step": 216496, "epoch": 1288} {"train_loss": -11.543915748596191, "global_step": 216497, "epoch": 1288} {"train_loss": -11.322998046875, "global_step": 216498, "epoch": 1288} {"train_loss": -11.427726745605469, "global_step": 216499, "epoch": 1288} {"train_loss": -11.442460060119629, "global_step": 216500, "epoch": 1288} {"train_loss": -11.538796424865723, "global_step": 216501, "epoch": 1288} {"train_loss": -11.230195999145508, "global_step": 216502, "epoch": 1288} {"train_loss": -11.255085945129395, "global_step": 216503, "epoch": 1288} {"train_loss": -11.54118537902832, "global_step": 216504, "epoch": 1288} {"train_loss": -11.408085823059082, "global_step": 216505, "epoch": 1288} {"train_loss": -11.731407165527344, "global_step": 216506, "epoch": 1288} {"train_loss": -11.234493255615234, "global_step": 216507, "epoch": 1288} {"train_loss": -11.523545265197754, "global_step": 216508, "epoch": 1288} {"train_loss": -11.435152053833008, "global_step": 216509, "epoch": 1288} {"train_loss": -11.621989250183105, "global_step": 216510, "epoch": 1288} {"train_loss": -11.759567260742188, "global_step": 216511, "epoch": 1288} {"train_loss": -11.691864013671875, "global_step": 216512, "epoch": 1288} {"train_loss": -11.558204650878906, "global_step": 216513, "epoch": 1288} {"train_loss": -11.7581787109375, "global_step": 216514, "epoch": 1288} {"train_loss": -11.732027053833008, "global_step": 216515, "epoch": 1288} {"train_loss": -11.686100006103516, "global_step": 216516, "epoch": 1288} {"train_loss": -11.686755180358887, "global_step": 216517, "epoch": 1288} {"train_loss": -11.55459976196289, "global_step": 216518, "epoch": 1288} {"train_loss": -11.816949844360352, "global_step": 216519, "epoch": 1288} {"train_loss": -11.40230941772461, "global_step": 216520, "epoch": 1288} {"train_loss": -11.660348892211914, "global_step": 216521, "epoch": 1288} {"train_loss": -11.818634986877441, "global_step": 216522, "epoch": 1288} {"train_loss": -11.815710067749023, "global_step": 216523, "epoch": 1288} {"train_loss": -11.480318069458008, "global_step": 216524, "epoch": 1288} {"train_loss": -11.761038780212402, "global_step": 216525, "epoch": 1288} {"train_loss": -11.749865531921387, "global_step": 216526, "epoch": 1288} {"train_loss": -11.594949722290039, "global_step": 216527, "epoch": 1288} {"train_loss": -11.681903839111328, "global_step": 216528, "epoch": 1288} {"train_loss": -11.518784523010254, "global_step": 216529, "epoch": 1288} {"train_loss": -11.56080436706543, "global_step": 216530, "epoch": 1288} {"train_loss": -11.876655578613281, "global_step": 216531, "epoch": 1288} {"train_loss": -11.577909469604492, "global_step": 216532, "epoch": 1288} {"train_loss": -11.792760848999023, "global_step": 216533, "epoch": 1288} {"train_loss": -11.750700950622559, "global_step": 216534, "epoch": 1288} {"train_loss": -11.815855026245117, "global_step": 216535, "epoch": 1288} {"train_loss": -11.818872451782227, "global_step": 216536, "epoch": 1288} {"train_loss": -11.742630004882812, "global_step": 216537, "epoch": 1288} {"train_loss": -11.720349311828613, "global_step": 216538, "epoch": 1288} {"train_loss": -11.363006591796875, "global_step": 216539, "epoch": 1288} {"train_loss": -11.864625930786133, "global_step": 216540, "epoch": 1288} {"train_loss": -11.64873218536377, "global_step": 216541, "epoch": 1288} {"train_loss": -11.824560165405273, "global_step": 216542, "epoch": 1288} {"train_loss": -11.756263732910156, "global_step": 216543, "epoch": 1288} {"train_loss": -11.852344512939453, "global_step": 216544, "epoch": 1288} {"train_loss": -11.9071044921875, "global_step": 216545, "epoch": 1288} {"train_loss": -11.410429954528809, "global_step": 216546, "epoch": 1288} {"train_loss": -11.932503700256348, "global_step": 216547, "epoch": 1288} {"train_loss": -11.590666770935059, "global_step": 216548, "epoch": 1288} {"train_loss": -11.932653427124023, "global_step": 216549, "epoch": 1288} {"train_loss": -11.835188865661621, "global_step": 216550, "epoch": 1288} {"train_loss": -11.369424104690552, "global_step": 216551, "epoch": 1288, "val_loss": 257020.5} {"train_loss": -11.902753829956055, "global_step": 216552, "epoch": 1289} {"train_loss": -11.870124816894531, "global_step": 216553, "epoch": 1289} {"train_loss": -11.82659912109375, "global_step": 216554, "epoch": 1289} {"train_loss": -11.516949653625488, "global_step": 216555, "epoch": 1289} {"train_loss": -11.672195434570312, "global_step": 216556, "epoch": 1289} {"train_loss": -11.96535873413086, "global_step": 216557, "epoch": 1289} {"train_loss": -11.717857360839844, "global_step": 216558, "epoch": 1289} {"train_loss": -11.419853210449219, "global_step": 216559, "epoch": 1289} {"train_loss": -11.993378639221191, "global_step": 216560, "epoch": 1289} {"train_loss": -11.89964485168457, "global_step": 216561, "epoch": 1289} {"train_loss": -11.677139282226562, "global_step": 216562, "epoch": 1289} {"train_loss": -11.303524017333984, "global_step": 216563, "epoch": 1289} {"train_loss": -12.038812637329102, "global_step": 216564, "epoch": 1289} {"train_loss": -11.228693008422852, "global_step": 216565, "epoch": 1289} {"train_loss": -11.223550796508789, "global_step": 216566, "epoch": 1289} {"train_loss": -11.4847412109375, "global_step": 216567, "epoch": 1289} {"train_loss": -11.505642890930176, "global_step": 216568, "epoch": 1289} {"train_loss": -10.190507888793945, "global_step": 216569, "epoch": 1289} {"train_loss": -11.67522144317627, "global_step": 216570, "epoch": 1289} {"train_loss": -10.7610502243042, "global_step": 216571, "epoch": 1289} {"train_loss": -11.25432014465332, "global_step": 216572, "epoch": 1289} {"train_loss": -11.039856910705566, "global_step": 216573, "epoch": 1289} {"train_loss": -11.182188034057617, "global_step": 216574, "epoch": 1289} {"train_loss": -11.351980209350586, "global_step": 216575, "epoch": 1289} {"train_loss": -11.336006164550781, "global_step": 216576, "epoch": 1289} {"train_loss": -10.526752471923828, "global_step": 216577, "epoch": 1289} {"train_loss": -10.219404220581055, "global_step": 216578, "epoch": 1289} {"train_loss": -10.898749351501465, "global_step": 216579, "epoch": 1289} {"train_loss": -9.520931243896484, "global_step": 216580, "epoch": 1289} {"train_loss": -10.616948127746582, "global_step": 216581, "epoch": 1289} {"train_loss": -7.9964728355407715, "global_step": 216582, "epoch": 1289} {"train_loss": -10.451349258422852, "global_step": 216583, "epoch": 1289} {"train_loss": -8.464641571044922, "global_step": 216584, "epoch": 1289} {"train_loss": -9.928174018859863, "global_step": 216585, "epoch": 1289} {"train_loss": -8.706570625305176, "global_step": 216586, "epoch": 1289} {"train_loss": -10.237577438354492, "global_step": 216587, "epoch": 1289} {"train_loss": -9.807830810546875, "global_step": 216588, "epoch": 1289} {"train_loss": -9.627534866333008, "global_step": 216589, "epoch": 1289} {"train_loss": -9.873198509216309, "global_step": 216590, "epoch": 1289} {"train_loss": -9.072251319885254, "global_step": 216591, "epoch": 1289} {"train_loss": -10.54328441619873, "global_step": 216592, "epoch": 1289} {"train_loss": -9.744126319885254, "global_step": 216593, "epoch": 1289} {"train_loss": -10.405269622802734, "global_step": 216594, "epoch": 1289} {"train_loss": -9.661767959594727, "global_step": 216595, "epoch": 1289} {"train_loss": -10.144876480102539, "global_step": 216596, "epoch": 1289} {"train_loss": -10.0250244140625, "global_step": 216597, "epoch": 1289} {"train_loss": -10.598762512207031, "global_step": 216598, "epoch": 1289} {"train_loss": -10.08781623840332, "global_step": 216599, "epoch": 1289} {"train_loss": -10.247947692871094, "global_step": 216600, "epoch": 1289} {"train_loss": -10.360369682312012, "global_step": 216601, "epoch": 1289} {"train_loss": -10.763341903686523, "global_step": 216602, "epoch": 1289} {"train_loss": -10.573102951049805, "global_step": 216603, "epoch": 1289} {"train_loss": -10.47709846496582, "global_step": 216604, "epoch": 1289} {"train_loss": -10.884687423706055, "global_step": 216605, "epoch": 1289} {"train_loss": -10.629984855651855, "global_step": 216606, "epoch": 1289} {"train_loss": -11.008933067321777, "global_step": 216607, "epoch": 1289} {"train_loss": -10.761280059814453, "global_step": 216608, "epoch": 1289} {"train_loss": -11.180784225463867, "global_step": 216609, "epoch": 1289} {"train_loss": -10.543013572692871, "global_step": 216610, "epoch": 1289} {"train_loss": -10.962790489196777, "global_step": 216611, "epoch": 1289} {"train_loss": -10.933650970458984, "global_step": 216612, "epoch": 1289} {"train_loss": -10.857492446899414, "global_step": 216613, "epoch": 1289} {"train_loss": -11.094802856445312, "global_step": 216614, "epoch": 1289} {"train_loss": -10.793540954589844, "global_step": 216615, "epoch": 1289} {"train_loss": -11.109904289245605, "global_step": 216616, "epoch": 1289} {"train_loss": -11.051986694335938, "global_step": 216617, "epoch": 1289} {"train_loss": -11.113706588745117, "global_step": 216618, "epoch": 1289} {"train_loss": -10.996310234069824, "global_step": 216619, "epoch": 1289} {"train_loss": -11.231234550476074, "global_step": 216620, "epoch": 1289} {"train_loss": -11.143794059753418, "global_step": 216621, "epoch": 1289} {"train_loss": -10.994979858398438, "global_step": 216622, "epoch": 1289} {"train_loss": -11.18204402923584, "global_step": 216623, "epoch": 1289} {"train_loss": -11.08542251586914, "global_step": 216624, "epoch": 1289} {"train_loss": -11.519996643066406, "global_step": 216625, "epoch": 1289} {"train_loss": -11.338729858398438, "global_step": 216626, "epoch": 1289} {"train_loss": -11.238431930541992, "global_step": 216627, "epoch": 1289} {"train_loss": -11.355527877807617, "global_step": 216628, "epoch": 1289} {"train_loss": -11.467813491821289, "global_step": 216629, "epoch": 1289} {"train_loss": -11.311017990112305, "global_step": 216630, "epoch": 1289} {"train_loss": -11.356287002563477, "global_step": 216631, "epoch": 1289} {"train_loss": -11.494388580322266, "global_step": 216632, "epoch": 1289} {"train_loss": -11.440868377685547, "global_step": 216633, "epoch": 1289} {"train_loss": -11.24777889251709, "global_step": 216634, "epoch": 1289} {"train_loss": -11.37667465209961, "global_step": 216635, "epoch": 1289} {"train_loss": -11.529504776000977, "global_step": 216636, "epoch": 1289} {"train_loss": -11.497977256774902, "global_step": 216637, "epoch": 1289} {"train_loss": -11.614984512329102, "global_step": 216638, "epoch": 1289} {"train_loss": -11.688908576965332, "global_step": 216639, "epoch": 1289} {"train_loss": -11.605670928955078, "global_step": 216640, "epoch": 1289} {"train_loss": -11.519603729248047, "global_step": 216641, "epoch": 1289} {"train_loss": -11.584247589111328, "global_step": 216642, "epoch": 1289} {"train_loss": -11.743818283081055, "global_step": 216643, "epoch": 1289} {"train_loss": -11.593521118164062, "global_step": 216644, "epoch": 1289} {"train_loss": -11.641642570495605, "global_step": 216645, "epoch": 1289} {"train_loss": -11.600299835205078, "global_step": 216646, "epoch": 1289} {"train_loss": -11.723711013793945, "global_step": 216647, "epoch": 1289} {"train_loss": -11.649903297424316, "global_step": 216648, "epoch": 1289} {"train_loss": -11.491480827331543, "global_step": 216649, "epoch": 1289} {"train_loss": -11.639291763305664, "global_step": 216650, "epoch": 1289} {"train_loss": -11.680374145507812, "global_step": 216651, "epoch": 1289} {"train_loss": -11.504329681396484, "global_step": 216652, "epoch": 1289} {"train_loss": -11.515827178955078, "global_step": 216653, "epoch": 1289} {"train_loss": -11.605158805847168, "global_step": 216654, "epoch": 1289} {"train_loss": -11.732471466064453, "global_step": 216655, "epoch": 1289} {"train_loss": -11.690186500549316, "global_step": 216656, "epoch": 1289} {"train_loss": -11.694303512573242, "global_step": 216657, "epoch": 1289} {"train_loss": -11.585915565490723, "global_step": 216658, "epoch": 1289} {"train_loss": -11.515645027160645, "global_step": 216659, "epoch": 1289} {"train_loss": -11.706029891967773, "global_step": 216660, "epoch": 1289} {"train_loss": -11.468963623046875, "global_step": 216661, "epoch": 1289} {"train_loss": -11.554583549499512, "global_step": 216662, "epoch": 1289} {"train_loss": -11.771217346191406, "global_step": 216663, "epoch": 1289} {"train_loss": -11.55839729309082, "global_step": 216664, "epoch": 1289} {"train_loss": -11.76833724975586, "global_step": 216665, "epoch": 1289} {"train_loss": -11.64249038696289, "global_step": 216666, "epoch": 1289} {"train_loss": -11.837148666381836, "global_step": 216667, "epoch": 1289} {"train_loss": -11.381145477294922, "global_step": 216668, "epoch": 1289} {"train_loss": -11.378432273864746, "global_step": 216669, "epoch": 1289} {"train_loss": -11.782215118408203, "global_step": 216670, "epoch": 1289} {"train_loss": -11.42768669128418, "global_step": 216671, "epoch": 1289} {"train_loss": -11.845637321472168, "global_step": 216672, "epoch": 1289} {"train_loss": -11.795503616333008, "global_step": 216673, "epoch": 1289} {"train_loss": -11.72634506225586, "global_step": 216674, "epoch": 1289} {"train_loss": -11.879435539245605, "global_step": 216675, "epoch": 1289} {"train_loss": -11.664396286010742, "global_step": 216676, "epoch": 1289} {"train_loss": -11.88819694519043, "global_step": 216677, "epoch": 1289} {"train_loss": -11.723365783691406, "global_step": 216678, "epoch": 1289} {"train_loss": -11.45333194732666, "global_step": 216679, "epoch": 1289} {"train_loss": -11.898416519165039, "global_step": 216680, "epoch": 1289} {"train_loss": -11.744182586669922, "global_step": 216681, "epoch": 1289} {"train_loss": -11.842909812927246, "global_step": 216682, "epoch": 1289} {"train_loss": -11.831523895263672, "global_step": 216683, "epoch": 1289} {"train_loss": -11.751469612121582, "global_step": 216684, "epoch": 1289} {"train_loss": -11.896549224853516, "global_step": 216685, "epoch": 1289} {"train_loss": -11.747760772705078, "global_step": 216686, "epoch": 1289} {"train_loss": -11.563331604003906, "global_step": 216687, "epoch": 1289} {"train_loss": -11.98667049407959, "global_step": 216688, "epoch": 1289} {"train_loss": -11.551188468933105, "global_step": 216689, "epoch": 1289} {"train_loss": -11.938706398010254, "global_step": 216690, "epoch": 1289} {"train_loss": -11.727460861206055, "global_step": 216691, "epoch": 1289} {"train_loss": -11.948975563049316, "global_step": 216692, "epoch": 1289} {"train_loss": -11.945528030395508, "global_step": 216693, "epoch": 1289} {"train_loss": -11.783134460449219, "global_step": 216694, "epoch": 1289} {"train_loss": -11.906041145324707, "global_step": 216695, "epoch": 1289} {"train_loss": -11.60547924041748, "global_step": 216696, "epoch": 1289} {"train_loss": -11.23069953918457, "global_step": 216697, "epoch": 1289} {"train_loss": -11.682796478271484, "global_step": 216698, "epoch": 1289} {"train_loss": -11.318620681762695, "global_step": 216699, "epoch": 1289} {"train_loss": -11.03800106048584, "global_step": 216700, "epoch": 1289} {"train_loss": -11.770484924316406, "global_step": 216701, "epoch": 1289} {"train_loss": -11.603134155273438, "global_step": 216702, "epoch": 1289} {"train_loss": -11.259294509887695, "global_step": 216703, "epoch": 1289} {"train_loss": -11.276418685913086, "global_step": 216704, "epoch": 1289} {"train_loss": -12.004230499267578, "global_step": 216705, "epoch": 1289} {"train_loss": -11.667793273925781, "global_step": 216706, "epoch": 1289} {"train_loss": -11.518543243408203, "global_step": 216707, "epoch": 1289} {"train_loss": -11.444538116455078, "global_step": 216708, "epoch": 1289} {"train_loss": -11.539905548095703, "global_step": 216709, "epoch": 1289} {"train_loss": -11.349854469299316, "global_step": 216710, "epoch": 1289} {"train_loss": -11.374432563781738, "global_step": 216711, "epoch": 1289} {"train_loss": -11.785195350646973, "global_step": 216712, "epoch": 1289} {"train_loss": -11.492352485656738, "global_step": 216713, "epoch": 1289} {"train_loss": -10.771635055541992, "global_step": 216714, "epoch": 1289} {"train_loss": -10.619478225708008, "global_step": 216715, "epoch": 1289} {"train_loss": -11.580192565917969, "global_step": 216716, "epoch": 1289} {"train_loss": -9.76788330078125, "global_step": 216717, "epoch": 1289} {"train_loss": -10.300738334655762, "global_step": 216718, "epoch": 1289} {"train_loss": -11.205191234747568, "global_step": 216719, "epoch": 1289, "val_loss": 254956.65625} {"train_loss": -10.043190002441406, "global_step": 216720, "epoch": 1290} {"train_loss": -11.128347396850586, "global_step": 216721, "epoch": 1290} {"train_loss": -10.165253639221191, "global_step": 216722, "epoch": 1290} {"train_loss": -10.078505516052246, "global_step": 216723, "epoch": 1290} {"train_loss": -10.325847625732422, "global_step": 216724, "epoch": 1290} {"train_loss": -9.313224792480469, "global_step": 216725, "epoch": 1290} {"train_loss": -8.125500679016113, "global_step": 216726, "epoch": 1290} {"train_loss": -7.40606164932251, "global_step": 216727, "epoch": 1290} {"train_loss": -9.515091896057129, "global_step": 216728, "epoch": 1290} {"train_loss": -9.575855255126953, "global_step": 216729, "epoch": 1290} {"train_loss": -9.15813159942627, "global_step": 216730, "epoch": 1290} {"train_loss": -9.091156959533691, "global_step": 216731, "epoch": 1290} {"train_loss": -8.620241165161133, "global_step": 216732, "epoch": 1290} {"train_loss": -10.216923713684082, "global_step": 216733, "epoch": 1290} {"train_loss": -8.895496368408203, "global_step": 216734, "epoch": 1290} {"train_loss": -9.155284881591797, "global_step": 216735, "epoch": 1290} {"train_loss": -10.186471939086914, "global_step": 216736, "epoch": 1290} {"train_loss": -9.870051383972168, "global_step": 216737, "epoch": 1290} {"train_loss": -10.755919456481934, "global_step": 216738, "epoch": 1290} {"train_loss": -9.92381763458252, "global_step": 216739, "epoch": 1290} {"train_loss": -11.261167526245117, "global_step": 216740, "epoch": 1290} {"train_loss": -10.17109489440918, "global_step": 216741, "epoch": 1290} {"train_loss": -10.26458740234375, "global_step": 216742, "epoch": 1290} {"train_loss": -10.54330825805664, "global_step": 216743, "epoch": 1290} {"train_loss": -10.384096145629883, "global_step": 216744, "epoch": 1290} {"train_loss": -10.019893646240234, "global_step": 216745, "epoch": 1290} {"train_loss": -10.689599990844727, "global_step": 216746, "epoch": 1290} {"train_loss": -10.720489501953125, "global_step": 216747, "epoch": 1290} {"train_loss": -10.253812789916992, "global_step": 216748, "epoch": 1290} {"train_loss": -10.916964530944824, "global_step": 216749, "epoch": 1290} {"train_loss": -11.188858032226562, "global_step": 216750, "epoch": 1290} {"train_loss": -10.49513053894043, "global_step": 216751, "epoch": 1290} {"train_loss": -10.752607345581055, "global_step": 216752, "epoch": 1290} {"train_loss": -11.138863563537598, "global_step": 216753, "epoch": 1290} {"train_loss": -10.698070526123047, "global_step": 216754, "epoch": 1290} {"train_loss": -10.83428955078125, "global_step": 216755, "epoch": 1290} {"train_loss": -11.175949096679688, "global_step": 216756, "epoch": 1290} {"train_loss": -10.992243766784668, "global_step": 216757, "epoch": 1290} {"train_loss": -10.955134391784668, "global_step": 216758, "epoch": 1290} {"train_loss": -11.069815635681152, "global_step": 216759, "epoch": 1290} {"train_loss": -11.133506774902344, "global_step": 216760, "epoch": 1290} {"train_loss": -10.907270431518555, "global_step": 216761, "epoch": 1290} {"train_loss": -11.326245307922363, "global_step": 216762, "epoch": 1290} {"train_loss": -11.240899085998535, "global_step": 216763, "epoch": 1290} {"train_loss": -10.984474182128906, "global_step": 216764, "epoch": 1290} {"train_loss": -11.089505195617676, "global_step": 216765, "epoch": 1290} {"train_loss": -11.346473693847656, "global_step": 216766, "epoch": 1290} {"train_loss": -11.140392303466797, "global_step": 216767, "epoch": 1290} {"train_loss": -11.166559219360352, "global_step": 216768, "epoch": 1290} {"train_loss": -11.23758316040039, "global_step": 216769, "epoch": 1290} {"train_loss": -11.118722915649414, "global_step": 216770, "epoch": 1290} {"train_loss": -11.340514183044434, "global_step": 216771, "epoch": 1290} {"train_loss": -11.404542922973633, "global_step": 216772, "epoch": 1290} {"train_loss": -11.351360321044922, "global_step": 216773, "epoch": 1290} {"train_loss": -11.267666816711426, "global_step": 216774, "epoch": 1290} {"train_loss": -11.432535171508789, "global_step": 216775, "epoch": 1290} {"train_loss": -11.366533279418945, "global_step": 216776, "epoch": 1290} {"train_loss": -11.35362434387207, "global_step": 216777, "epoch": 1290} {"train_loss": -11.237468719482422, "global_step": 216778, "epoch": 1290} {"train_loss": -11.44660758972168, "global_step": 216779, "epoch": 1290} {"train_loss": -11.466249465942383, "global_step": 216780, "epoch": 1290} {"train_loss": -11.571956634521484, "global_step": 216781, "epoch": 1290} {"train_loss": -11.538795471191406, "global_step": 216782, "epoch": 1290} {"train_loss": -11.729045867919922, "global_step": 216783, "epoch": 1290} {"train_loss": -11.450447082519531, "global_step": 216784, "epoch": 1290} {"train_loss": -11.86923599243164, "global_step": 216785, "epoch": 1290} {"train_loss": -11.42078971862793, "global_step": 216786, "epoch": 1290} {"train_loss": -11.580276489257812, "global_step": 216787, "epoch": 1290} {"train_loss": -11.333988189697266, "global_step": 216788, "epoch": 1290} {"train_loss": -11.789205551147461, "global_step": 216789, "epoch": 1290} {"train_loss": -11.80196475982666, "global_step": 216790, "epoch": 1290} {"train_loss": -11.692985534667969, "global_step": 216791, "epoch": 1290} {"train_loss": -11.565618515014648, "global_step": 216792, "epoch": 1290} {"train_loss": -11.513668060302734, "global_step": 216793, "epoch": 1290} {"train_loss": -11.663883209228516, "global_step": 216794, "epoch": 1290} {"train_loss": -11.840274810791016, "global_step": 216795, "epoch": 1290} {"train_loss": -11.826139450073242, "global_step": 216796, "epoch": 1290} {"train_loss": -11.607900619506836, "global_step": 216797, "epoch": 1290} {"train_loss": -11.848907470703125, "global_step": 216798, "epoch": 1290} {"train_loss": -11.927334785461426, "global_step": 216799, "epoch": 1290} {"train_loss": -11.630678176879883, "global_step": 216800, "epoch": 1290} {"train_loss": -11.78795051574707, "global_step": 216801, "epoch": 1290} {"train_loss": -11.910012245178223, "global_step": 216802, "epoch": 1290} {"train_loss": -11.791488647460938, "global_step": 216803, "epoch": 1290} {"train_loss": -11.652517318725586, "global_step": 216804, "epoch": 1290} {"train_loss": -11.606635093688965, "global_step": 216805, "epoch": 1290} {"train_loss": -11.870939254760742, "global_step": 216806, "epoch": 1290} {"train_loss": -11.97854995727539, "global_step": 216807, "epoch": 1290} {"train_loss": -11.801993370056152, "global_step": 216808, "epoch": 1290} {"train_loss": -11.749610900878906, "global_step": 216809, "epoch": 1290} {"train_loss": -11.91728687286377, "global_step": 216810, "epoch": 1290} {"train_loss": -11.850099563598633, "global_step": 216811, "epoch": 1290} {"train_loss": -11.914158821105957, "global_step": 216812, "epoch": 1290} {"train_loss": -11.956552505493164, "global_step": 216813, "epoch": 1290} {"train_loss": -11.916152954101562, "global_step": 216814, "epoch": 1290} {"train_loss": -11.780069351196289, "global_step": 216815, "epoch": 1290} {"train_loss": -11.753108978271484, "global_step": 216816, "epoch": 1290} {"train_loss": -11.909120559692383, "global_step": 216817, "epoch": 1290} {"train_loss": -11.861164093017578, "global_step": 216818, "epoch": 1290} {"train_loss": -11.73411750793457, "global_step": 216819, "epoch": 1290} {"train_loss": -11.985517501831055, "global_step": 216820, "epoch": 1290} {"train_loss": -11.94325065612793, "global_step": 216821, "epoch": 1290} {"train_loss": -11.795433044433594, "global_step": 216822, "epoch": 1290} {"train_loss": -11.780437469482422, "global_step": 216823, "epoch": 1290} {"train_loss": -11.751035690307617, "global_step": 216824, "epoch": 1290} {"train_loss": -11.832006454467773, "global_step": 216825, "epoch": 1290} {"train_loss": -11.914319038391113, "global_step": 216826, "epoch": 1290} {"train_loss": -11.822166442871094, "global_step": 216827, "epoch": 1290} {"train_loss": -12.159219741821289, "global_step": 216828, "epoch": 1290} {"train_loss": -11.788025856018066, "global_step": 216829, "epoch": 1290} {"train_loss": -11.684966087341309, "global_step": 216830, "epoch": 1290} {"train_loss": -11.615434646606445, "global_step": 216831, "epoch": 1290} {"train_loss": -12.018444061279297, "global_step": 216832, "epoch": 1290} {"train_loss": -11.370906829833984, "global_step": 216833, "epoch": 1290} {"train_loss": -11.832834243774414, "global_step": 216834, "epoch": 1290} {"train_loss": -11.821325302124023, "global_step": 216835, "epoch": 1290} {"train_loss": -11.72172737121582, "global_step": 216836, "epoch": 1290} {"train_loss": -11.698429107666016, "global_step": 216837, "epoch": 1290} {"train_loss": -11.984710693359375, "global_step": 216838, "epoch": 1290} {"train_loss": -11.827728271484375, "global_step": 216839, "epoch": 1290} {"train_loss": -11.833905220031738, "global_step": 216840, "epoch": 1290} {"train_loss": -11.66853141784668, "global_step": 216841, "epoch": 1290} {"train_loss": -11.635176658630371, "global_step": 216842, "epoch": 1290} {"train_loss": -11.764347076416016, "global_step": 216843, "epoch": 1290} {"train_loss": -11.45357608795166, "global_step": 216844, "epoch": 1290} {"train_loss": -11.206804275512695, "global_step": 216845, "epoch": 1290} {"train_loss": -11.64886474609375, "global_step": 216846, "epoch": 1290} {"train_loss": -10.98225212097168, "global_step": 216847, "epoch": 1290} {"train_loss": -10.201071739196777, "global_step": 216848, "epoch": 1290} {"train_loss": -11.338214874267578, "global_step": 216849, "epoch": 1290} {"train_loss": -11.292823791503906, "global_step": 216850, "epoch": 1290} {"train_loss": -10.69787311553955, "global_step": 216851, "epoch": 1290} {"train_loss": -9.582039833068848, "global_step": 216852, "epoch": 1290} {"train_loss": -11.301952362060547, "global_step": 216853, "epoch": 1290} {"train_loss": -10.424459457397461, "global_step": 216854, "epoch": 1290} {"train_loss": -9.050424575805664, "global_step": 216855, "epoch": 1290} {"train_loss": -10.232089042663574, "global_step": 216856, "epoch": 1290} {"train_loss": -10.889856338500977, "global_step": 216857, "epoch": 1290} {"train_loss": -10.45529556274414, "global_step": 216858, "epoch": 1290} {"train_loss": -8.970653533935547, "global_step": 216859, "epoch": 1290} {"train_loss": -11.03466510772705, "global_step": 216860, "epoch": 1290} {"train_loss": -8.513683319091797, "global_step": 216861, "epoch": 1290} {"train_loss": -11.283702850341797, "global_step": 216862, "epoch": 1290} {"train_loss": -10.26199722290039, "global_step": 216863, "epoch": 1290} {"train_loss": -10.673980712890625, "global_step": 216864, "epoch": 1290} {"train_loss": -10.299574851989746, "global_step": 216865, "epoch": 1290} {"train_loss": -10.944007873535156, "global_step": 216866, "epoch": 1290} {"train_loss": -10.68143367767334, "global_step": 216867, "epoch": 1290} {"train_loss": -10.888915061950684, "global_step": 216868, "epoch": 1290} {"train_loss": -11.002266883850098, "global_step": 216869, "epoch": 1290} {"train_loss": -10.456472396850586, "global_step": 216870, "epoch": 1290} {"train_loss": -10.82931137084961, "global_step": 216871, "epoch": 1290} {"train_loss": -11.150226593017578, "global_step": 216872, "epoch": 1290} {"train_loss": -10.75137710571289, "global_step": 216873, "epoch": 1290} {"train_loss": -10.907630920410156, "global_step": 216874, "epoch": 1290} {"train_loss": -11.069186210632324, "global_step": 216875, "epoch": 1290} {"train_loss": -10.960079193115234, "global_step": 216876, "epoch": 1290} {"train_loss": -10.714273452758789, "global_step": 216877, "epoch": 1290} {"train_loss": -11.314800262451172, "global_step": 216878, "epoch": 1290} {"train_loss": -10.945318222045898, "global_step": 216879, "epoch": 1290} {"train_loss": -10.796568870544434, "global_step": 216880, "epoch": 1290} {"train_loss": -10.788908004760742, "global_step": 216881, "epoch": 1290} {"train_loss": -11.251741409301758, "global_step": 216882, "epoch": 1290} {"train_loss": -10.733460426330566, "global_step": 216883, "epoch": 1290} {"train_loss": -11.244077682495117, "global_step": 216884, "epoch": 1290} {"train_loss": -10.751565933227539, "global_step": 216885, "epoch": 1290} {"train_loss": -11.119163513183594, "global_step": 216886, "epoch": 1290} {"train_loss": -11.042511568182992, "global_step": 216887, "epoch": 1290, "val_loss": 253482.15625, "train_action_mse_error": 1.7837635278701782} {"train_loss": -10.89142894744873, "global_step": 216888, "epoch": 1291} {"train_loss": -10.967981338500977, "global_step": 216889, "epoch": 1291} {"train_loss": -10.971771240234375, "global_step": 216890, "epoch": 1291} {"train_loss": -11.268314361572266, "global_step": 216891, "epoch": 1291} {"train_loss": -10.946008682250977, "global_step": 216892, "epoch": 1291} {"train_loss": -10.868547439575195, "global_step": 216893, "epoch": 1291} {"train_loss": -10.535680770874023, "global_step": 216894, "epoch": 1291} {"train_loss": -11.079618453979492, "global_step": 216895, "epoch": 1291} {"train_loss": -10.795700073242188, "global_step": 216896, "epoch": 1291} {"train_loss": -10.870288848876953, "global_step": 216897, "epoch": 1291} {"train_loss": -11.204803466796875, "global_step": 216898, "epoch": 1291} {"train_loss": -11.001761436462402, "global_step": 216899, "epoch": 1291} {"train_loss": -11.4109525680542, "global_step": 216900, "epoch": 1291} {"train_loss": -11.191923141479492, "global_step": 216901, "epoch": 1291} {"train_loss": -11.203929901123047, "global_step": 216902, "epoch": 1291} {"train_loss": -11.373414993286133, "global_step": 216903, "epoch": 1291} {"train_loss": -11.3444185256958, "global_step": 216904, "epoch": 1291} {"train_loss": -11.14067268371582, "global_step": 216905, "epoch": 1291} {"train_loss": -11.448015213012695, "global_step": 216906, "epoch": 1291} {"train_loss": -11.318453788757324, "global_step": 216907, "epoch": 1291} {"train_loss": -11.362302780151367, "global_step": 216908, "epoch": 1291} {"train_loss": -11.310319900512695, "global_step": 216909, "epoch": 1291} {"train_loss": -11.40688419342041, "global_step": 216910, "epoch": 1291} {"train_loss": -11.600157737731934, "global_step": 216911, "epoch": 1291} {"train_loss": -11.3793363571167, "global_step": 216912, "epoch": 1291} {"train_loss": -11.517765045166016, "global_step": 216913, "epoch": 1291} {"train_loss": -11.654008865356445, "global_step": 216914, "epoch": 1291} {"train_loss": -11.22256088256836, "global_step": 216915, "epoch": 1291} {"train_loss": -11.440683364868164, "global_step": 216916, "epoch": 1291} {"train_loss": -11.47389030456543, "global_step": 216917, "epoch": 1291} {"train_loss": -11.573246002197266, "global_step": 216918, "epoch": 1291} {"train_loss": -11.392215728759766, "global_step": 216919, "epoch": 1291} {"train_loss": -11.623626708984375, "global_step": 216920, "epoch": 1291} {"train_loss": -11.527076721191406, "global_step": 216921, "epoch": 1291} {"train_loss": -11.524703979492188, "global_step": 216922, "epoch": 1291} {"train_loss": -11.661633491516113, "global_step": 216923, "epoch": 1291} {"train_loss": -11.482561111450195, "global_step": 216924, "epoch": 1291} {"train_loss": -11.528974533081055, "global_step": 216925, "epoch": 1291} {"train_loss": -11.613611221313477, "global_step": 216926, "epoch": 1291} {"train_loss": -11.771524429321289, "global_step": 216927, "epoch": 1291} {"train_loss": -11.772088050842285, "global_step": 216928, "epoch": 1291} {"train_loss": -11.661941528320312, "global_step": 216929, "epoch": 1291} {"train_loss": -11.510503768920898, "global_step": 216930, "epoch": 1291} {"train_loss": -11.822273254394531, "global_step": 216931, "epoch": 1291} {"train_loss": -11.773983001708984, "global_step": 216932, "epoch": 1291} {"train_loss": -11.699528694152832, "global_step": 216933, "epoch": 1291} {"train_loss": -11.798844337463379, "global_step": 216934, "epoch": 1291} {"train_loss": -11.91081428527832, "global_step": 216935, "epoch": 1291} {"train_loss": -11.73019027709961, "global_step": 216936, "epoch": 1291} {"train_loss": -11.9222993850708, "global_step": 216937, "epoch": 1291} {"train_loss": -11.718259811401367, "global_step": 216938, "epoch": 1291} {"train_loss": -11.749855041503906, "global_step": 216939, "epoch": 1291} {"train_loss": -11.916678428649902, "global_step": 216940, "epoch": 1291} {"train_loss": -11.928235054016113, "global_step": 216941, "epoch": 1291} {"train_loss": -11.707269668579102, "global_step": 216942, "epoch": 1291} {"train_loss": -11.871685028076172, "global_step": 216943, "epoch": 1291} {"train_loss": -11.889954566955566, "global_step": 216944, "epoch": 1291} {"train_loss": -11.869078636169434, "global_step": 216945, "epoch": 1291} {"train_loss": -11.854622840881348, "global_step": 216946, "epoch": 1291} {"train_loss": -11.932085037231445, "global_step": 216947, "epoch": 1291} {"train_loss": -11.92585563659668, "global_step": 216948, "epoch": 1291} {"train_loss": -11.952606201171875, "global_step": 216949, "epoch": 1291} {"train_loss": -11.877994537353516, "global_step": 216950, "epoch": 1291} {"train_loss": -11.902475357055664, "global_step": 216951, "epoch": 1291} {"train_loss": -11.82101058959961, "global_step": 216952, "epoch": 1291} {"train_loss": -11.9517822265625, "global_step": 216953, "epoch": 1291} {"train_loss": -12.019350051879883, "global_step": 216954, "epoch": 1291} {"train_loss": -11.774068832397461, "global_step": 216955, "epoch": 1291} {"train_loss": -11.665185928344727, "global_step": 216956, "epoch": 1291} {"train_loss": -11.839569091796875, "global_step": 216957, "epoch": 1291} {"train_loss": -11.902563095092773, "global_step": 216958, "epoch": 1291} {"train_loss": -11.5201997756958, "global_step": 216959, "epoch": 1291} {"train_loss": -11.263447761535645, "global_step": 216960, "epoch": 1291} {"train_loss": -11.127434730529785, "global_step": 216961, "epoch": 1291} {"train_loss": -11.744181632995605, "global_step": 216962, "epoch": 1291} {"train_loss": -10.970558166503906, "global_step": 216963, "epoch": 1291} {"train_loss": -10.765060424804688, "global_step": 216964, "epoch": 1291} {"train_loss": -11.73976993560791, "global_step": 216965, "epoch": 1291} {"train_loss": -11.310301780700684, "global_step": 216966, "epoch": 1291} {"train_loss": -11.171130180358887, "global_step": 216967, "epoch": 1291} {"train_loss": -10.493440628051758, "global_step": 216968, "epoch": 1291} {"train_loss": -11.496856689453125, "global_step": 216969, "epoch": 1291} {"train_loss": -11.311484336853027, "global_step": 216970, "epoch": 1291} {"train_loss": -11.335769653320312, "global_step": 216971, "epoch": 1291} {"train_loss": -10.894133567810059, "global_step": 216972, "epoch": 1291} {"train_loss": -11.3377685546875, "global_step": 216973, "epoch": 1291} {"train_loss": -11.594314575195312, "global_step": 216974, "epoch": 1291} {"train_loss": -11.191213607788086, "global_step": 216975, "epoch": 1291} {"train_loss": -11.211908340454102, "global_step": 216976, "epoch": 1291} {"train_loss": -11.556022644042969, "global_step": 216977, "epoch": 1291} {"train_loss": -11.592639923095703, "global_step": 216978, "epoch": 1291} {"train_loss": -10.687000274658203, "global_step": 216979, "epoch": 1291} {"train_loss": -11.717729568481445, "global_step": 216980, "epoch": 1291} {"train_loss": -11.647313117980957, "global_step": 216981, "epoch": 1291} {"train_loss": -11.622883796691895, "global_step": 216982, "epoch": 1291} {"train_loss": -11.309507369995117, "global_step": 216983, "epoch": 1291} {"train_loss": -11.950616836547852, "global_step": 216984, "epoch": 1291} {"train_loss": -11.514498710632324, "global_step": 216985, "epoch": 1291} {"train_loss": -11.915931701660156, "global_step": 216986, "epoch": 1291} {"train_loss": -11.232200622558594, "global_step": 216987, "epoch": 1291} {"train_loss": -11.628303527832031, "global_step": 216988, "epoch": 1291} {"train_loss": -11.378015518188477, "global_step": 216989, "epoch": 1291} {"train_loss": -11.525297164916992, "global_step": 216990, "epoch": 1291} {"train_loss": -11.436792373657227, "global_step": 216991, "epoch": 1291} {"train_loss": -11.435816764831543, "global_step": 216992, "epoch": 1291} {"train_loss": -11.215563774108887, "global_step": 216993, "epoch": 1291} {"train_loss": -11.664288520812988, "global_step": 216994, "epoch": 1291} {"train_loss": -10.776483535766602, "global_step": 216995, "epoch": 1291} {"train_loss": -11.936212539672852, "global_step": 216996, "epoch": 1291} {"train_loss": -11.287144660949707, "global_step": 216997, "epoch": 1291} {"train_loss": -11.50069808959961, "global_step": 216998, "epoch": 1291} {"train_loss": -11.27037239074707, "global_step": 216999, "epoch": 1291} {"train_loss": -11.361021041870117, "global_step": 217000, "epoch": 1291} {"train_loss": -11.44735336303711, "global_step": 217001, "epoch": 1291} {"train_loss": -11.598461151123047, "global_step": 217002, "epoch": 1291} {"train_loss": -11.543071746826172, "global_step": 217003, "epoch": 1291} {"train_loss": -11.293923377990723, "global_step": 217004, "epoch": 1291} {"train_loss": -11.18730640411377, "global_step": 217005, "epoch": 1291} {"train_loss": -11.090188026428223, "global_step": 217006, "epoch": 1291} {"train_loss": -11.231700897216797, "global_step": 217007, "epoch": 1291} {"train_loss": -9.738931655883789, "global_step": 217008, "epoch": 1291} {"train_loss": -11.237624168395996, "global_step": 217009, "epoch": 1291} {"train_loss": -10.534847259521484, "global_step": 217010, "epoch": 1291} {"train_loss": -11.250405311584473, "global_step": 217011, "epoch": 1291} {"train_loss": -11.418736457824707, "global_step": 217012, "epoch": 1291} {"train_loss": -10.667999267578125, "global_step": 217013, "epoch": 1291} {"train_loss": -11.629034042358398, "global_step": 217014, "epoch": 1291} {"train_loss": -10.697126388549805, "global_step": 217015, "epoch": 1291} {"train_loss": -11.393935203552246, "global_step": 217016, "epoch": 1291} {"train_loss": -10.950151443481445, "global_step": 217017, "epoch": 1291} {"train_loss": -11.608647346496582, "global_step": 217018, "epoch": 1291} {"train_loss": -11.717184066772461, "global_step": 217019, "epoch": 1291} {"train_loss": -11.208728790283203, "global_step": 217020, "epoch": 1291} {"train_loss": -11.598114013671875, "global_step": 217021, "epoch": 1291} {"train_loss": -11.50844955444336, "global_step": 217022, "epoch": 1291} {"train_loss": -11.420194625854492, "global_step": 217023, "epoch": 1291} {"train_loss": -11.199544906616211, "global_step": 217024, "epoch": 1291} {"train_loss": -11.496675491333008, "global_step": 217025, "epoch": 1291} {"train_loss": -11.409594535827637, "global_step": 217026, "epoch": 1291} {"train_loss": -11.599466323852539, "global_step": 217027, "epoch": 1291} {"train_loss": -11.700143814086914, "global_step": 217028, "epoch": 1291} {"train_loss": -11.164907455444336, "global_step": 217029, "epoch": 1291} {"train_loss": -11.57186222076416, "global_step": 217030, "epoch": 1291} {"train_loss": -11.45517349243164, "global_step": 217031, "epoch": 1291} {"train_loss": -11.401395797729492, "global_step": 217032, "epoch": 1291} {"train_loss": -11.169086456298828, "global_step": 217033, "epoch": 1291} {"train_loss": -11.61877727508545, "global_step": 217034, "epoch": 1291} {"train_loss": -11.364517211914062, "global_step": 217035, "epoch": 1291} {"train_loss": -11.500146865844727, "global_step": 217036, "epoch": 1291} {"train_loss": -11.122221946716309, "global_step": 217037, "epoch": 1291} {"train_loss": -11.430200576782227, "global_step": 217038, "epoch": 1291} {"train_loss": -11.515302658081055, "global_step": 217039, "epoch": 1291} {"train_loss": -10.936300277709961, "global_step": 217040, "epoch": 1291} {"train_loss": -11.046335220336914, "global_step": 217041, "epoch": 1291} {"train_loss": -11.508756637573242, "global_step": 217042, "epoch": 1291} {"train_loss": -11.351829528808594, "global_step": 217043, "epoch": 1291} {"train_loss": -11.737420082092285, "global_step": 217044, "epoch": 1291} {"train_loss": -11.48039722442627, "global_step": 217045, "epoch": 1291} {"train_loss": -11.542848587036133, "global_step": 217046, "epoch": 1291} {"train_loss": -11.644559860229492, "global_step": 217047, "epoch": 1291} {"train_loss": -11.587376594543457, "global_step": 217048, "epoch": 1291} {"train_loss": -11.571142196655273, "global_step": 217049, "epoch": 1291} {"train_loss": -11.444250106811523, "global_step": 217050, "epoch": 1291} {"train_loss": -12.086999893188477, "global_step": 217051, "epoch": 1291} {"train_loss": -11.5607271194458, "global_step": 217052, "epoch": 1291} {"train_loss": -11.742755889892578, "global_step": 217053, "epoch": 1291} {"train_loss": -11.425491333007812, "global_step": 217054, "epoch": 1291} {"train_loss": -11.437435524804252, "global_step": 217055, "epoch": 1291, "val_loss": 256090.125} {"train_loss": -11.269572257995605, "global_step": 217056, "epoch": 1292} {"train_loss": -11.621862411499023, "global_step": 217057, "epoch": 1292} {"train_loss": -11.850687026977539, "global_step": 217058, "epoch": 1292} {"train_loss": -11.629170417785645, "global_step": 217059, "epoch": 1292} {"train_loss": -11.908525466918945, "global_step": 217060, "epoch": 1292} {"train_loss": -11.633859634399414, "global_step": 217061, "epoch": 1292} {"train_loss": -11.759733200073242, "global_step": 217062, "epoch": 1292} {"train_loss": -11.76895523071289, "global_step": 217063, "epoch": 1292} {"train_loss": -11.642736434936523, "global_step": 217064, "epoch": 1292} {"train_loss": -11.618703842163086, "global_step": 217065, "epoch": 1292} {"train_loss": -11.678325653076172, "global_step": 217066, "epoch": 1292} {"train_loss": -11.095754623413086, "global_step": 217067, "epoch": 1292} {"train_loss": -11.432561874389648, "global_step": 217068, "epoch": 1292} {"train_loss": -11.662225723266602, "global_step": 217069, "epoch": 1292} {"train_loss": -11.729418754577637, "global_step": 217070, "epoch": 1292} {"train_loss": -11.46036434173584, "global_step": 217071, "epoch": 1292} {"train_loss": -11.786504745483398, "global_step": 217072, "epoch": 1292} {"train_loss": -11.557954788208008, "global_step": 217073, "epoch": 1292} {"train_loss": -11.61014175415039, "global_step": 217074, "epoch": 1292} {"train_loss": -11.799968719482422, "global_step": 217075, "epoch": 1292} {"train_loss": -11.835082054138184, "global_step": 217076, "epoch": 1292} {"train_loss": -11.331954956054688, "global_step": 217077, "epoch": 1292} {"train_loss": -11.93851089477539, "global_step": 217078, "epoch": 1292} {"train_loss": -11.776686668395996, "global_step": 217079, "epoch": 1292} {"train_loss": -11.975248336791992, "global_step": 217080, "epoch": 1292} {"train_loss": -11.880814552307129, "global_step": 217081, "epoch": 1292} {"train_loss": -12.029401779174805, "global_step": 217082, "epoch": 1292} {"train_loss": -11.774833679199219, "global_step": 217083, "epoch": 1292} {"train_loss": -11.618237495422363, "global_step": 217084, "epoch": 1292} {"train_loss": -11.73360824584961, "global_step": 217085, "epoch": 1292} {"train_loss": -11.682703018188477, "global_step": 217086, "epoch": 1292} {"train_loss": -11.925508499145508, "global_step": 217087, "epoch": 1292} {"train_loss": -11.658536911010742, "global_step": 217088, "epoch": 1292} {"train_loss": -11.423908233642578, "global_step": 217089, "epoch": 1292} {"train_loss": -11.688328742980957, "global_step": 217090, "epoch": 1292} {"train_loss": -11.768765449523926, "global_step": 217091, "epoch": 1292} {"train_loss": -11.261702537536621, "global_step": 217092, "epoch": 1292} {"train_loss": -11.945680618286133, "global_step": 217093, "epoch": 1292} {"train_loss": -11.466527938842773, "global_step": 217094, "epoch": 1292} {"train_loss": -11.875516891479492, "global_step": 217095, "epoch": 1292} {"train_loss": -11.790201187133789, "global_step": 217096, "epoch": 1292} {"train_loss": -11.553169250488281, "global_step": 217097, "epoch": 1292} {"train_loss": -11.403175354003906, "global_step": 217098, "epoch": 1292} {"train_loss": -11.514911651611328, "global_step": 217099, "epoch": 1292} {"train_loss": -11.863350868225098, "global_step": 217100, "epoch": 1292} {"train_loss": -12.004304885864258, "global_step": 217101, "epoch": 1292} {"train_loss": -11.684225082397461, "global_step": 217102, "epoch": 1292} {"train_loss": -11.733975410461426, "global_step": 217103, "epoch": 1292} {"train_loss": -11.869028091430664, "global_step": 217104, "epoch": 1292} {"train_loss": -11.37247371673584, "global_step": 217105, "epoch": 1292} {"train_loss": -11.256765365600586, "global_step": 217106, "epoch": 1292} {"train_loss": -11.619157791137695, "global_step": 217107, "epoch": 1292} {"train_loss": -11.239631652832031, "global_step": 217108, "epoch": 1292} {"train_loss": -11.611392974853516, "global_step": 217109, "epoch": 1292} {"train_loss": -11.268501281738281, "global_step": 217110, "epoch": 1292} {"train_loss": -10.89052963256836, "global_step": 217111, "epoch": 1292} {"train_loss": -11.40798282623291, "global_step": 217112, "epoch": 1292} {"train_loss": -10.392241477966309, "global_step": 217113, "epoch": 1292} {"train_loss": -10.718391418457031, "global_step": 217114, "epoch": 1292} {"train_loss": -10.891153335571289, "global_step": 217115, "epoch": 1292} {"train_loss": -11.091744422912598, "global_step": 217116, "epoch": 1292} {"train_loss": -10.71037769317627, "global_step": 217117, "epoch": 1292} {"train_loss": -11.824362754821777, "global_step": 217118, "epoch": 1292} {"train_loss": -10.66826343536377, "global_step": 217119, "epoch": 1292} {"train_loss": -11.128959655761719, "global_step": 217120, "epoch": 1292} {"train_loss": -11.046245574951172, "global_step": 217121, "epoch": 1292} {"train_loss": -10.8147611618042, "global_step": 217122, "epoch": 1292} {"train_loss": -11.72490119934082, "global_step": 217123, "epoch": 1292} {"train_loss": -10.984745979309082, "global_step": 217124, "epoch": 1292} {"train_loss": -11.110671997070312, "global_step": 217125, "epoch": 1292} {"train_loss": -11.640100479125977, "global_step": 217126, "epoch": 1292} {"train_loss": -11.231977462768555, "global_step": 217127, "epoch": 1292} {"train_loss": -11.153493881225586, "global_step": 217128, "epoch": 1292} {"train_loss": -11.26289176940918, "global_step": 217129, "epoch": 1292} {"train_loss": -11.003299713134766, "global_step": 217130, "epoch": 1292} {"train_loss": -11.571879386901855, "global_step": 217131, "epoch": 1292} {"train_loss": -11.01366901397705, "global_step": 217132, "epoch": 1292} {"train_loss": -11.074975967407227, "global_step": 217133, "epoch": 1292} {"train_loss": -11.253143310546875, "global_step": 217134, "epoch": 1292} {"train_loss": -10.149374008178711, "global_step": 217135, "epoch": 1292} {"train_loss": -11.684242248535156, "global_step": 217136, "epoch": 1292} {"train_loss": -11.304689407348633, "global_step": 217137, "epoch": 1292} {"train_loss": -11.70781135559082, "global_step": 217138, "epoch": 1292} {"train_loss": -11.09672737121582, "global_step": 217139, "epoch": 1292} {"train_loss": -11.209831237792969, "global_step": 217140, "epoch": 1292} {"train_loss": -11.547477722167969, "global_step": 217141, "epoch": 1292} {"train_loss": -10.921497344970703, "global_step": 217142, "epoch": 1292} {"train_loss": -11.207063674926758, "global_step": 217143, "epoch": 1292} {"train_loss": -10.627037048339844, "global_step": 217144, "epoch": 1292} {"train_loss": -10.388616561889648, "global_step": 217145, "epoch": 1292} {"train_loss": -11.387228012084961, "global_step": 217146, "epoch": 1292} {"train_loss": -10.48201847076416, "global_step": 217147, "epoch": 1292} {"train_loss": -11.413870811462402, "global_step": 217148, "epoch": 1292} {"train_loss": -10.759403228759766, "global_step": 217149, "epoch": 1292} {"train_loss": -10.864651679992676, "global_step": 217150, "epoch": 1292} {"train_loss": -11.000558853149414, "global_step": 217151, "epoch": 1292} {"train_loss": -10.99970817565918, "global_step": 217152, "epoch": 1292} {"train_loss": -11.491144180297852, "global_step": 217153, "epoch": 1292} {"train_loss": -10.449670791625977, "global_step": 217154, "epoch": 1292} {"train_loss": -11.307673454284668, "global_step": 217155, "epoch": 1292} {"train_loss": -10.935690879821777, "global_step": 217156, "epoch": 1292} {"train_loss": -10.986917495727539, "global_step": 217157, "epoch": 1292} {"train_loss": -11.33547592163086, "global_step": 217158, "epoch": 1292} {"train_loss": -11.448596954345703, "global_step": 217159, "epoch": 1292} {"train_loss": -11.475661277770996, "global_step": 217160, "epoch": 1292} {"train_loss": -11.56732177734375, "global_step": 217161, "epoch": 1292} {"train_loss": -11.339896202087402, "global_step": 217162, "epoch": 1292} {"train_loss": -11.645030975341797, "global_step": 217163, "epoch": 1292} {"train_loss": -11.446447372436523, "global_step": 217164, "epoch": 1292} {"train_loss": -11.53145980834961, "global_step": 217165, "epoch": 1292} {"train_loss": -11.342851638793945, "global_step": 217166, "epoch": 1292} {"train_loss": -11.588800430297852, "global_step": 217167, "epoch": 1292} {"train_loss": -11.450811386108398, "global_step": 217168, "epoch": 1292} {"train_loss": -11.755727767944336, "global_step": 217169, "epoch": 1292} {"train_loss": -11.481389999389648, "global_step": 217170, "epoch": 1292} {"train_loss": -11.475111961364746, "global_step": 217171, "epoch": 1292} {"train_loss": -11.599994659423828, "global_step": 217172, "epoch": 1292} {"train_loss": -11.41610336303711, "global_step": 217173, "epoch": 1292} {"train_loss": -11.68756103515625, "global_step": 217174, "epoch": 1292} {"train_loss": -11.675313949584961, "global_step": 217175, "epoch": 1292} {"train_loss": -11.509586334228516, "global_step": 217176, "epoch": 1292} {"train_loss": -11.683564186096191, "global_step": 217177, "epoch": 1292} {"train_loss": -11.29802131652832, "global_step": 217178, "epoch": 1292} {"train_loss": -11.694612503051758, "global_step": 217179, "epoch": 1292} {"train_loss": -11.861101150512695, "global_step": 217180, "epoch": 1292} {"train_loss": -11.803192138671875, "global_step": 217181, "epoch": 1292} {"train_loss": -11.818220138549805, "global_step": 217182, "epoch": 1292} {"train_loss": -11.722681045532227, "global_step": 217183, "epoch": 1292} {"train_loss": -11.457365989685059, "global_step": 217184, "epoch": 1292} {"train_loss": -11.886209487915039, "global_step": 217185, "epoch": 1292} {"train_loss": -11.578195571899414, "global_step": 217186, "epoch": 1292} {"train_loss": -11.848442077636719, "global_step": 217187, "epoch": 1292} {"train_loss": -11.741961479187012, "global_step": 217188, "epoch": 1292} {"train_loss": -11.607137680053711, "global_step": 217189, "epoch": 1292} {"train_loss": -11.943665504455566, "global_step": 217190, "epoch": 1292} {"train_loss": -11.64632797241211, "global_step": 217191, "epoch": 1292} {"train_loss": -11.953811645507812, "global_step": 217192, "epoch": 1292} {"train_loss": -11.630040168762207, "global_step": 217193, "epoch": 1292} {"train_loss": -11.745871543884277, "global_step": 217194, "epoch": 1292} {"train_loss": -11.708772659301758, "global_step": 217195, "epoch": 1292} {"train_loss": -11.901948928833008, "global_step": 217196, "epoch": 1292} {"train_loss": -11.846378326416016, "global_step": 217197, "epoch": 1292} {"train_loss": -11.825603485107422, "global_step": 217198, "epoch": 1292} {"train_loss": -11.806262969970703, "global_step": 217199, "epoch": 1292} {"train_loss": -11.728845596313477, "global_step": 217200, "epoch": 1292} {"train_loss": -11.59943962097168, "global_step": 217201, "epoch": 1292} {"train_loss": -11.709772109985352, "global_step": 217202, "epoch": 1292} {"train_loss": -11.638168334960938, "global_step": 217203, "epoch": 1292} {"train_loss": -11.730530738830566, "global_step": 217204, "epoch": 1292} {"train_loss": -11.766627311706543, "global_step": 217205, "epoch": 1292} {"train_loss": -11.189146995544434, "global_step": 217206, "epoch": 1292} {"train_loss": -11.607940673828125, "global_step": 217207, "epoch": 1292} {"train_loss": -11.933795928955078, "global_step": 217208, "epoch": 1292} {"train_loss": -11.216880798339844, "global_step": 217209, "epoch": 1292} {"train_loss": -12.033621788024902, "global_step": 217210, "epoch": 1292} {"train_loss": -11.387125968933105, "global_step": 217211, "epoch": 1292} {"train_loss": -11.596338272094727, "global_step": 217212, "epoch": 1292} {"train_loss": -11.84968376159668, "global_step": 217213, "epoch": 1292} {"train_loss": -11.602411270141602, "global_step": 217214, "epoch": 1292} {"train_loss": -11.68787956237793, "global_step": 217215, "epoch": 1292} {"train_loss": -11.640764236450195, "global_step": 217216, "epoch": 1292} {"train_loss": -11.878938674926758, "global_step": 217217, "epoch": 1292} {"train_loss": -11.503158569335938, "global_step": 217218, "epoch": 1292} {"train_loss": -11.732596397399902, "global_step": 217219, "epoch": 1292} {"train_loss": -11.29643726348877, "global_step": 217220, "epoch": 1292} {"train_loss": -11.130085945129395, "global_step": 217221, "epoch": 1292} {"train_loss": -11.211386680603027, "global_step": 217222, "epoch": 1292} {"train_loss": -11.4780402580897, "global_step": 217223, "epoch": 1292, "val_loss": 253947.078125} {"train_loss": -11.224475860595703, "global_step": 217224, "epoch": 1293} {"train_loss": -11.38392448425293, "global_step": 217225, "epoch": 1293} {"train_loss": -10.812447547912598, "global_step": 217226, "epoch": 1293} {"train_loss": -11.47494125366211, "global_step": 217227, "epoch": 1293} {"train_loss": -10.93124771118164, "global_step": 217228, "epoch": 1293} {"train_loss": -10.59269905090332, "global_step": 217229, "epoch": 1293} {"train_loss": -10.592754364013672, "global_step": 217230, "epoch": 1293} {"train_loss": -11.602493286132812, "global_step": 217231, "epoch": 1293} {"train_loss": -11.463676452636719, "global_step": 217232, "epoch": 1293} {"train_loss": -11.318262100219727, "global_step": 217233, "epoch": 1293} {"train_loss": -11.30328369140625, "global_step": 217234, "epoch": 1293} {"train_loss": -10.954115867614746, "global_step": 217235, "epoch": 1293} {"train_loss": -11.20828628540039, "global_step": 217236, "epoch": 1293} {"train_loss": -11.051283836364746, "global_step": 217237, "epoch": 1293} {"train_loss": -11.229574203491211, "global_step": 217238, "epoch": 1293} {"train_loss": -10.493865013122559, "global_step": 217239, "epoch": 1293} {"train_loss": -11.582021713256836, "global_step": 217240, "epoch": 1293} {"train_loss": -10.120172500610352, "global_step": 217241, "epoch": 1293} {"train_loss": -10.003881454467773, "global_step": 217242, "epoch": 1293} {"train_loss": -10.512561798095703, "global_step": 217243, "epoch": 1293} {"train_loss": -10.292409896850586, "global_step": 217244, "epoch": 1293} {"train_loss": -10.424022674560547, "global_step": 217245, "epoch": 1293} {"train_loss": -9.717227935791016, "global_step": 217246, "epoch": 1293} {"train_loss": -9.577866554260254, "global_step": 217247, "epoch": 1293} {"train_loss": -9.933164596557617, "global_step": 217248, "epoch": 1293} {"train_loss": -10.328266143798828, "global_step": 217249, "epoch": 1293} {"train_loss": -8.525671005249023, "global_step": 217250, "epoch": 1293} {"train_loss": -9.933414459228516, "global_step": 217251, "epoch": 1293} {"train_loss": -11.103920936584473, "global_step": 217252, "epoch": 1293} {"train_loss": -9.945152282714844, "global_step": 217253, "epoch": 1293} {"train_loss": -10.486543655395508, "global_step": 217254, "epoch": 1293} {"train_loss": -10.46004581451416, "global_step": 217255, "epoch": 1293} {"train_loss": -9.943887710571289, "global_step": 217256, "epoch": 1293} {"train_loss": -10.995854377746582, "global_step": 217257, "epoch": 1293} {"train_loss": -10.76116943359375, "global_step": 217258, "epoch": 1293} {"train_loss": -10.54006290435791, "global_step": 217259, "epoch": 1293} {"train_loss": -10.884902954101562, "global_step": 217260, "epoch": 1293} {"train_loss": -10.696444511413574, "global_step": 217261, "epoch": 1293} {"train_loss": -10.481982231140137, "global_step": 217262, "epoch": 1293} {"train_loss": -10.89422607421875, "global_step": 217263, "epoch": 1293} {"train_loss": -10.813725471496582, "global_step": 217264, "epoch": 1293} {"train_loss": -10.874343872070312, "global_step": 217265, "epoch": 1293} {"train_loss": -11.1920747756958, "global_step": 217266, "epoch": 1293} {"train_loss": -10.360889434814453, "global_step": 217267, "epoch": 1293} {"train_loss": -10.979470252990723, "global_step": 217268, "epoch": 1293} {"train_loss": -11.117843627929688, "global_step": 217269, "epoch": 1293} {"train_loss": -10.725292205810547, "global_step": 217270, "epoch": 1293} {"train_loss": -11.159412384033203, "global_step": 217271, "epoch": 1293} {"train_loss": -10.630315780639648, "global_step": 217272, "epoch": 1293} {"train_loss": -11.177947998046875, "global_step": 217273, "epoch": 1293} {"train_loss": -11.233774185180664, "global_step": 217274, "epoch": 1293} {"train_loss": -11.150891304016113, "global_step": 217275, "epoch": 1293} {"train_loss": -11.23705005645752, "global_step": 217276, "epoch": 1293} {"train_loss": -11.023641586303711, "global_step": 217277, "epoch": 1293} {"train_loss": -11.185731887817383, "global_step": 217278, "epoch": 1293} {"train_loss": -10.971044540405273, "global_step": 217279, "epoch": 1293} {"train_loss": -11.150491714477539, "global_step": 217280, "epoch": 1293} {"train_loss": -11.394906997680664, "global_step": 217281, "epoch": 1293} {"train_loss": -11.150324821472168, "global_step": 217282, "epoch": 1293} {"train_loss": -11.292210578918457, "global_step": 217283, "epoch": 1293} {"train_loss": -11.408343315124512, "global_step": 217284, "epoch": 1293} {"train_loss": -11.474430084228516, "global_step": 217285, "epoch": 1293} {"train_loss": -11.333999633789062, "global_step": 217286, "epoch": 1293} {"train_loss": -11.54315185546875, "global_step": 217287, "epoch": 1293} {"train_loss": -11.226227760314941, "global_step": 217288, "epoch": 1293} {"train_loss": -11.313362121582031, "global_step": 217289, "epoch": 1293} {"train_loss": -11.43792724609375, "global_step": 217290, "epoch": 1293} {"train_loss": -11.439048767089844, "global_step": 217291, "epoch": 1293} {"train_loss": -11.384809494018555, "global_step": 217292, "epoch": 1293} {"train_loss": -11.323149681091309, "global_step": 217293, "epoch": 1293} {"train_loss": -11.384822845458984, "global_step": 217294, "epoch": 1293} {"train_loss": -11.443710327148438, "global_step": 217295, "epoch": 1293} {"train_loss": -11.660046577453613, "global_step": 217296, "epoch": 1293} {"train_loss": -11.572736740112305, "global_step": 217297, "epoch": 1293} {"train_loss": -11.720596313476562, "global_step": 217298, "epoch": 1293} {"train_loss": -11.680624008178711, "global_step": 217299, "epoch": 1293} {"train_loss": -11.536201477050781, "global_step": 217300, "epoch": 1293} {"train_loss": -11.610241889953613, "global_step": 217301, "epoch": 1293} {"train_loss": -11.72180461883545, "global_step": 217302, "epoch": 1293} {"train_loss": -11.742727279663086, "global_step": 217303, "epoch": 1293} {"train_loss": -11.828439712524414, "global_step": 217304, "epoch": 1293} {"train_loss": -11.59410285949707, "global_step": 217305, "epoch": 1293} {"train_loss": -11.56855583190918, "global_step": 217306, "epoch": 1293} {"train_loss": -11.5412015914917, "global_step": 217307, "epoch": 1293} {"train_loss": -11.875858306884766, "global_step": 217308, "epoch": 1293} {"train_loss": -11.522773742675781, "global_step": 217309, "epoch": 1293} {"train_loss": -11.643662452697754, "global_step": 217310, "epoch": 1293} {"train_loss": -11.66766357421875, "global_step": 217311, "epoch": 1293} {"train_loss": -11.72801399230957, "global_step": 217312, "epoch": 1293} {"train_loss": -11.889120101928711, "global_step": 217313, "epoch": 1293} {"train_loss": -11.7196044921875, "global_step": 217314, "epoch": 1293} {"train_loss": -11.688350677490234, "global_step": 217315, "epoch": 1293} {"train_loss": -11.662105560302734, "global_step": 217316, "epoch": 1293} {"train_loss": -11.84089183807373, "global_step": 217317, "epoch": 1293} {"train_loss": -11.894380569458008, "global_step": 217318, "epoch": 1293} {"train_loss": -11.82088851928711, "global_step": 217319, "epoch": 1293} {"train_loss": -11.92350959777832, "global_step": 217320, "epoch": 1293} {"train_loss": -11.826825141906738, "global_step": 217321, "epoch": 1293} {"train_loss": -11.962800979614258, "global_step": 217322, "epoch": 1293} {"train_loss": -11.683349609375, "global_step": 217323, "epoch": 1293} {"train_loss": -11.91390609741211, "global_step": 217324, "epoch": 1293} {"train_loss": -11.763324737548828, "global_step": 217325, "epoch": 1293} {"train_loss": -11.67462158203125, "global_step": 217326, "epoch": 1293} {"train_loss": -11.825601577758789, "global_step": 217327, "epoch": 1293} {"train_loss": -11.875865936279297, "global_step": 217328, "epoch": 1293} {"train_loss": -11.562613487243652, "global_step": 217329, "epoch": 1293} {"train_loss": -11.317193031311035, "global_step": 217330, "epoch": 1293} {"train_loss": -11.460342407226562, "global_step": 217331, "epoch": 1293} {"train_loss": -11.275873184204102, "global_step": 217332, "epoch": 1293} {"train_loss": -10.99182415008545, "global_step": 217333, "epoch": 1293} {"train_loss": -11.283859252929688, "global_step": 217334, "epoch": 1293} {"train_loss": -12.004058837890625, "global_step": 217335, "epoch": 1293} {"train_loss": -10.773275375366211, "global_step": 217336, "epoch": 1293} {"train_loss": -10.354351043701172, "global_step": 217337, "epoch": 1293} {"train_loss": -11.314187049865723, "global_step": 217338, "epoch": 1293} {"train_loss": -11.133341789245605, "global_step": 217339, "epoch": 1293} {"train_loss": -10.651915550231934, "global_step": 217340, "epoch": 1293} {"train_loss": -11.564460754394531, "global_step": 217341, "epoch": 1293} {"train_loss": -10.670333862304688, "global_step": 217342, "epoch": 1293} {"train_loss": -10.823417663574219, "global_step": 217343, "epoch": 1293} {"train_loss": -10.275909423828125, "global_step": 217344, "epoch": 1293} {"train_loss": -10.948009490966797, "global_step": 217345, "epoch": 1293} {"train_loss": -10.671208381652832, "global_step": 217346, "epoch": 1293} {"train_loss": -10.423707962036133, "global_step": 217347, "epoch": 1293} {"train_loss": -10.873019218444824, "global_step": 217348, "epoch": 1293} {"train_loss": -10.49127197265625, "global_step": 217349, "epoch": 1293} {"train_loss": -11.173053741455078, "global_step": 217350, "epoch": 1293} {"train_loss": -10.591007232666016, "global_step": 217351, "epoch": 1293} {"train_loss": -10.822006225585938, "global_step": 217352, "epoch": 1293} {"train_loss": -11.12196159362793, "global_step": 217353, "epoch": 1293} {"train_loss": -10.374902725219727, "global_step": 217354, "epoch": 1293} {"train_loss": -11.229249954223633, "global_step": 217355, "epoch": 1293} {"train_loss": -10.97927474975586, "global_step": 217356, "epoch": 1293} {"train_loss": -11.260047912597656, "global_step": 217357, "epoch": 1293} {"train_loss": -10.5781888961792, "global_step": 217358, "epoch": 1293} {"train_loss": -11.331984519958496, "global_step": 217359, "epoch": 1293} {"train_loss": -10.859838485717773, "global_step": 217360, "epoch": 1293} {"train_loss": -11.563026428222656, "global_step": 217361, "epoch": 1293} {"train_loss": -10.99081039428711, "global_step": 217362, "epoch": 1293} {"train_loss": -11.426813125610352, "global_step": 217363, "epoch": 1293} {"train_loss": -10.853099822998047, "global_step": 217364, "epoch": 1293} {"train_loss": -11.252975463867188, "global_step": 217365, "epoch": 1293} {"train_loss": -11.091371536254883, "global_step": 217366, "epoch": 1293} {"train_loss": -11.035273551940918, "global_step": 217367, "epoch": 1293} {"train_loss": -10.803628921508789, "global_step": 217368, "epoch": 1293} {"train_loss": -11.275750160217285, "global_step": 217369, "epoch": 1293} {"train_loss": -11.15230941772461, "global_step": 217370, "epoch": 1293} {"train_loss": -11.027881622314453, "global_step": 217371, "epoch": 1293} {"train_loss": -11.602432250976562, "global_step": 217372, "epoch": 1293} {"train_loss": -11.277633666992188, "global_step": 217373, "epoch": 1293} {"train_loss": -11.337254524230957, "global_step": 217374, "epoch": 1293} {"train_loss": -11.415990829467773, "global_step": 217375, "epoch": 1293} {"train_loss": -11.265999794006348, "global_step": 217376, "epoch": 1293} {"train_loss": -11.477245330810547, "global_step": 217377, "epoch": 1293} {"train_loss": -11.432533264160156, "global_step": 217378, "epoch": 1293} {"train_loss": -11.191350936889648, "global_step": 217379, "epoch": 1293} {"train_loss": -11.553285598754883, "global_step": 217380, "epoch": 1293} {"train_loss": -11.411361694335938, "global_step": 217381, "epoch": 1293} {"train_loss": -11.28323745727539, "global_step": 217382, "epoch": 1293} {"train_loss": -11.57109546661377, "global_step": 217383, "epoch": 1293} {"train_loss": -11.313820838928223, "global_step": 217384, "epoch": 1293} {"train_loss": -11.39346694946289, "global_step": 217385, "epoch": 1293} {"train_loss": -11.407386779785156, "global_step": 217386, "epoch": 1293} {"train_loss": -11.18364143371582, "global_step": 217387, "epoch": 1293} {"train_loss": -11.420815467834473, "global_step": 217388, "epoch": 1293} {"train_loss": -11.230476379394531, "global_step": 217389, "epoch": 1293} {"train_loss": -11.512831687927246, "global_step": 217390, "epoch": 1293} {"train_loss": -11.139105728694371, "global_step": 217391, "epoch": 1293, "val_loss": 252957.578125} {"train_loss": -11.649532318115234, "global_step": 217392, "epoch": 1294} {"train_loss": -11.177776336669922, "global_step": 217393, "epoch": 1294} {"train_loss": -11.653705596923828, "global_step": 217394, "epoch": 1294} {"train_loss": -11.44442081451416, "global_step": 217395, "epoch": 1294} {"train_loss": -11.70590877532959, "global_step": 217396, "epoch": 1294} {"train_loss": -11.45305061340332, "global_step": 217397, "epoch": 1294} {"train_loss": -11.62222957611084, "global_step": 217398, "epoch": 1294} {"train_loss": -11.393027305603027, "global_step": 217399, "epoch": 1294} {"train_loss": -11.637809753417969, "global_step": 217400, "epoch": 1294} {"train_loss": -11.65277099609375, "global_step": 217401, "epoch": 1294} {"train_loss": -11.701234817504883, "global_step": 217402, "epoch": 1294} {"train_loss": -11.459005355834961, "global_step": 217403, "epoch": 1294} {"train_loss": -11.55810546875, "global_step": 217404, "epoch": 1294} {"train_loss": -11.706889152526855, "global_step": 217405, "epoch": 1294} {"train_loss": -11.632728576660156, "global_step": 217406, "epoch": 1294} {"train_loss": -11.795541763305664, "global_step": 217407, "epoch": 1294} {"train_loss": -11.743579864501953, "global_step": 217408, "epoch": 1294} {"train_loss": -11.673274040222168, "global_step": 217409, "epoch": 1294} {"train_loss": -11.98141098022461, "global_step": 217410, "epoch": 1294} {"train_loss": -11.725452423095703, "global_step": 217411, "epoch": 1294} {"train_loss": -11.603336334228516, "global_step": 217412, "epoch": 1294} {"train_loss": -11.69683837890625, "global_step": 217413, "epoch": 1294} {"train_loss": -11.905354499816895, "global_step": 217414, "epoch": 1294} {"train_loss": -11.702788352966309, "global_step": 217415, "epoch": 1294} {"train_loss": -11.493247032165527, "global_step": 217416, "epoch": 1294} {"train_loss": -11.697366714477539, "global_step": 217417, "epoch": 1294} {"train_loss": -11.68090534210205, "global_step": 217418, "epoch": 1294} {"train_loss": -11.430121421813965, "global_step": 217419, "epoch": 1294} {"train_loss": -11.7568941116333, "global_step": 217420, "epoch": 1294} {"train_loss": -11.66405963897705, "global_step": 217421, "epoch": 1294} {"train_loss": -11.634875297546387, "global_step": 217422, "epoch": 1294} {"train_loss": -11.554418563842773, "global_step": 217423, "epoch": 1294} {"train_loss": -11.676643371582031, "global_step": 217424, "epoch": 1294} {"train_loss": -11.509383201599121, "global_step": 217425, "epoch": 1294} {"train_loss": -11.692131042480469, "global_step": 217426, "epoch": 1294} {"train_loss": -11.672785758972168, "global_step": 217427, "epoch": 1294} {"train_loss": -11.922073364257812, "global_step": 217428, "epoch": 1294} {"train_loss": -11.52354621887207, "global_step": 217429, "epoch": 1294} {"train_loss": -11.753182411193848, "global_step": 217430, "epoch": 1294} {"train_loss": -11.420316696166992, "global_step": 217431, "epoch": 1294} {"train_loss": -11.958599090576172, "global_step": 217432, "epoch": 1294} {"train_loss": -11.694705963134766, "global_step": 217433, "epoch": 1294} {"train_loss": -11.94472885131836, "global_step": 217434, "epoch": 1294} {"train_loss": -11.8030424118042, "global_step": 217435, "epoch": 1294} {"train_loss": -11.829891204833984, "global_step": 217436, "epoch": 1294} {"train_loss": -11.491165161132812, "global_step": 217437, "epoch": 1294} {"train_loss": -11.548833847045898, "global_step": 217438, "epoch": 1294} {"train_loss": -11.621652603149414, "global_step": 217439, "epoch": 1294} {"train_loss": -11.038589477539062, "global_step": 217440, "epoch": 1294} {"train_loss": -11.555063247680664, "global_step": 217441, "epoch": 1294} {"train_loss": -12.114381790161133, "global_step": 217442, "epoch": 1294} {"train_loss": -11.529248237609863, "global_step": 217443, "epoch": 1294} {"train_loss": -11.217636108398438, "global_step": 217444, "epoch": 1294} {"train_loss": -11.790359497070312, "global_step": 217445, "epoch": 1294} {"train_loss": -11.511001586914062, "global_step": 217446, "epoch": 1294} {"train_loss": -10.749988555908203, "global_step": 217447, "epoch": 1294} {"train_loss": -11.152989387512207, "global_step": 217448, "epoch": 1294} {"train_loss": -11.814453125, "global_step": 217449, "epoch": 1294} {"train_loss": -11.587892532348633, "global_step": 217450, "epoch": 1294} {"train_loss": -11.308530807495117, "global_step": 217451, "epoch": 1294} {"train_loss": -11.858166694641113, "global_step": 217452, "epoch": 1294} {"train_loss": -11.921915054321289, "global_step": 217453, "epoch": 1294} {"train_loss": -11.891656875610352, "global_step": 217454, "epoch": 1294} {"train_loss": -11.608610153198242, "global_step": 217455, "epoch": 1294} {"train_loss": -11.820594787597656, "global_step": 217456, "epoch": 1294} {"train_loss": -11.721818923950195, "global_step": 217457, "epoch": 1294} {"train_loss": -11.899596214294434, "global_step": 217458, "epoch": 1294} {"train_loss": -11.3274564743042, "global_step": 217459, "epoch": 1294} {"train_loss": -11.270970344543457, "global_step": 217460, "epoch": 1294} {"train_loss": -12.04831314086914, "global_step": 217461, "epoch": 1294} {"train_loss": -11.702030181884766, "global_step": 217462, "epoch": 1294} {"train_loss": -11.731553077697754, "global_step": 217463, "epoch": 1294} {"train_loss": -11.768688201904297, "global_step": 217464, "epoch": 1294} {"train_loss": -11.630009651184082, "global_step": 217465, "epoch": 1294} {"train_loss": -11.647274017333984, "global_step": 217466, "epoch": 1294} {"train_loss": -11.79294204711914, "global_step": 217467, "epoch": 1294} {"train_loss": -11.38205337524414, "global_step": 217468, "epoch": 1294} {"train_loss": -11.50710678100586, "global_step": 217469, "epoch": 1294} {"train_loss": -11.662139892578125, "global_step": 217470, "epoch": 1294} {"train_loss": -11.428305625915527, "global_step": 217471, "epoch": 1294} {"train_loss": -11.499507904052734, "global_step": 217472, "epoch": 1294} {"train_loss": -11.58859920501709, "global_step": 217473, "epoch": 1294} {"train_loss": -11.681768417358398, "global_step": 217474, "epoch": 1294} {"train_loss": -11.477479934692383, "global_step": 217475, "epoch": 1294} {"train_loss": -11.858577728271484, "global_step": 217476, "epoch": 1294} {"train_loss": -11.522266387939453, "global_step": 217477, "epoch": 1294} {"train_loss": -11.467220306396484, "global_step": 217478, "epoch": 1294} {"train_loss": -11.193593978881836, "global_step": 217479, "epoch": 1294} {"train_loss": -11.301465034484863, "global_step": 217480, "epoch": 1294} {"train_loss": -11.295706748962402, "global_step": 217481, "epoch": 1294} {"train_loss": -11.189952850341797, "global_step": 217482, "epoch": 1294} {"train_loss": -10.694437026977539, "global_step": 217483, "epoch": 1294} {"train_loss": -11.197741508483887, "global_step": 217484, "epoch": 1294} {"train_loss": -10.66922664642334, "global_step": 217485, "epoch": 1294} {"train_loss": -8.8531494140625, "global_step": 217486, "epoch": 1294} {"train_loss": -9.05334186553955, "global_step": 217487, "epoch": 1294} {"train_loss": -10.441877365112305, "global_step": 217488, "epoch": 1294} {"train_loss": -7.468257427215576, "global_step": 217489, "epoch": 1294} {"train_loss": -7.976802349090576, "global_step": 217490, "epoch": 1294} {"train_loss": -9.844717025756836, "global_step": 217491, "epoch": 1294} {"train_loss": -7.68633508682251, "global_step": 217492, "epoch": 1294} {"train_loss": -9.323440551757812, "global_step": 217493, "epoch": 1294} {"train_loss": -9.074347496032715, "global_step": 217494, "epoch": 1294} {"train_loss": -10.25410270690918, "global_step": 217495, "epoch": 1294} {"train_loss": -9.585954666137695, "global_step": 217496, "epoch": 1294} {"train_loss": -10.072858810424805, "global_step": 217497, "epoch": 1294} {"train_loss": -10.223231315612793, "global_step": 217498, "epoch": 1294} {"train_loss": -10.7203369140625, "global_step": 217499, "epoch": 1294} {"train_loss": -10.467864990234375, "global_step": 217500, "epoch": 1294} {"train_loss": -10.504470825195312, "global_step": 217501, "epoch": 1294} {"train_loss": -10.696473121643066, "global_step": 217502, "epoch": 1294} {"train_loss": -10.789427757263184, "global_step": 217503, "epoch": 1294} {"train_loss": -11.096806526184082, "global_step": 217504, "epoch": 1294} {"train_loss": -10.865592956542969, "global_step": 217505, "epoch": 1294} {"train_loss": -10.622411727905273, "global_step": 217506, "epoch": 1294} {"train_loss": -10.881684303283691, "global_step": 217507, "epoch": 1294} {"train_loss": -11.12701416015625, "global_step": 217508, "epoch": 1294} {"train_loss": -10.933533668518066, "global_step": 217509, "epoch": 1294} {"train_loss": -10.934587478637695, "global_step": 217510, "epoch": 1294} {"train_loss": -11.019622802734375, "global_step": 217511, "epoch": 1294} {"train_loss": -10.784160614013672, "global_step": 217512, "epoch": 1294} {"train_loss": -11.329858779907227, "global_step": 217513, "epoch": 1294} {"train_loss": -11.394391059875488, "global_step": 217514, "epoch": 1294} {"train_loss": -11.129579544067383, "global_step": 217515, "epoch": 1294} {"train_loss": -11.155660629272461, "global_step": 217516, "epoch": 1294} {"train_loss": -11.21246337890625, "global_step": 217517, "epoch": 1294} {"train_loss": -11.463512420654297, "global_step": 217518, "epoch": 1294} {"train_loss": -10.862396240234375, "global_step": 217519, "epoch": 1294} {"train_loss": -11.404680252075195, "global_step": 217520, "epoch": 1294} {"train_loss": -11.371182441711426, "global_step": 217521, "epoch": 1294} {"train_loss": -11.199419021606445, "global_step": 217522, "epoch": 1294} {"train_loss": -11.324206352233887, "global_step": 217523, "epoch": 1294} {"train_loss": -11.576133728027344, "global_step": 217524, "epoch": 1294} {"train_loss": -11.37771987915039, "global_step": 217525, "epoch": 1294} {"train_loss": -11.079511642456055, "global_step": 217526, "epoch": 1294} {"train_loss": -11.476318359375, "global_step": 217527, "epoch": 1294} {"train_loss": -11.394068717956543, "global_step": 217528, "epoch": 1294} {"train_loss": -11.388729095458984, "global_step": 217529, "epoch": 1294} {"train_loss": -11.359344482421875, "global_step": 217530, "epoch": 1294} {"train_loss": -11.530364990234375, "global_step": 217531, "epoch": 1294} {"train_loss": -11.454387664794922, "global_step": 217532, "epoch": 1294} {"train_loss": -11.756711959838867, "global_step": 217533, "epoch": 1294} {"train_loss": -11.70763111114502, "global_step": 217534, "epoch": 1294} {"train_loss": -11.640883445739746, "global_step": 217535, "epoch": 1294} {"train_loss": -11.496686935424805, "global_step": 217536, "epoch": 1294} {"train_loss": -11.628061294555664, "global_step": 217537, "epoch": 1294} {"train_loss": -11.663057327270508, "global_step": 217538, "epoch": 1294} {"train_loss": -11.633800506591797, "global_step": 217539, "epoch": 1294} {"train_loss": -11.809176445007324, "global_step": 217540, "epoch": 1294} {"train_loss": -11.286714553833008, "global_step": 217541, "epoch": 1294} {"train_loss": -11.563677787780762, "global_step": 217542, "epoch": 1294} {"train_loss": -11.770336151123047, "global_step": 217543, "epoch": 1294} {"train_loss": -11.638738632202148, "global_step": 217544, "epoch": 1294} {"train_loss": -11.607784271240234, "global_step": 217545, "epoch": 1294} {"train_loss": -11.624969482421875, "global_step": 217546, "epoch": 1294} {"train_loss": -11.7791109085083, "global_step": 217547, "epoch": 1294} {"train_loss": -11.43936824798584, "global_step": 217548, "epoch": 1294} {"train_loss": -11.807479858398438, "global_step": 217549, "epoch": 1294} {"train_loss": -11.500779151916504, "global_step": 217550, "epoch": 1294} {"train_loss": -11.859493255615234, "global_step": 217551, "epoch": 1294} {"train_loss": -11.650917053222656, "global_step": 217552, "epoch": 1294} {"train_loss": -11.573846817016602, "global_step": 217553, "epoch": 1294} {"train_loss": -11.441396713256836, "global_step": 217554, "epoch": 1294} {"train_loss": -11.906355857849121, "global_step": 217555, "epoch": 1294} {"train_loss": -11.40655517578125, "global_step": 217556, "epoch": 1294} {"train_loss": -11.63327407836914, "global_step": 217557, "epoch": 1294} {"train_loss": -11.632139205932617, "global_step": 217558, "epoch": 1294} {"train_loss": -11.315709003380366, "global_step": 217559, "epoch": 1294, "val_loss": 249937.515625} {"train_loss": -11.796942710876465, "global_step": 217560, "epoch": 1295} {"train_loss": -11.643107414245605, "global_step": 217561, "epoch": 1295} {"train_loss": -11.791849136352539, "global_step": 217562, "epoch": 1295} {"train_loss": -12.020825386047363, "global_step": 217563, "epoch": 1295} {"train_loss": -11.85713005065918, "global_step": 217564, "epoch": 1295} {"train_loss": -11.956188201904297, "global_step": 217565, "epoch": 1295} {"train_loss": -11.914648056030273, "global_step": 217566, "epoch": 1295} {"train_loss": -11.802314758300781, "global_step": 217567, "epoch": 1295} {"train_loss": -11.471439361572266, "global_step": 217568, "epoch": 1295} {"train_loss": -11.661486625671387, "global_step": 217569, "epoch": 1295} {"train_loss": -11.685616493225098, "global_step": 217570, "epoch": 1295} {"train_loss": -11.875713348388672, "global_step": 217571, "epoch": 1295} {"train_loss": -11.728742599487305, "global_step": 217572, "epoch": 1295} {"train_loss": -11.861245155334473, "global_step": 217573, "epoch": 1295} {"train_loss": -12.04908275604248, "global_step": 217574, "epoch": 1295} {"train_loss": -11.511423110961914, "global_step": 217575, "epoch": 1295} {"train_loss": -11.573318481445312, "global_step": 217576, "epoch": 1295} {"train_loss": -11.470430374145508, "global_step": 217577, "epoch": 1295} {"train_loss": -11.606348991394043, "global_step": 217578, "epoch": 1295} {"train_loss": -11.358175277709961, "global_step": 217579, "epoch": 1295} {"train_loss": -10.980661392211914, "global_step": 217580, "epoch": 1295} {"train_loss": -10.80663776397705, "global_step": 217581, "epoch": 1295} {"train_loss": -11.015777587890625, "global_step": 217582, "epoch": 1295} {"train_loss": -11.138589859008789, "global_step": 217583, "epoch": 1295} {"train_loss": -8.26704216003418, "global_step": 217584, "epoch": 1295} {"train_loss": -9.55064868927002, "global_step": 217585, "epoch": 1295} {"train_loss": -10.502847671508789, "global_step": 217586, "epoch": 1295} {"train_loss": -7.678613662719727, "global_step": 217587, "epoch": 1295} {"train_loss": -7.874632835388184, "global_step": 217588, "epoch": 1295} {"train_loss": -9.424304962158203, "global_step": 217589, "epoch": 1295} {"train_loss": -9.096458435058594, "global_step": 217590, "epoch": 1295} {"train_loss": -8.839418411254883, "global_step": 217591, "epoch": 1295} {"train_loss": -10.199336051940918, "global_step": 217592, "epoch": 1295} {"train_loss": -9.199092864990234, "global_step": 217593, "epoch": 1295} {"train_loss": -9.926360130310059, "global_step": 217594, "epoch": 1295} {"train_loss": -10.420815467834473, "global_step": 217595, "epoch": 1295} {"train_loss": -9.386415481567383, "global_step": 217596, "epoch": 1295} {"train_loss": -11.030067443847656, "global_step": 217597, "epoch": 1295} {"train_loss": -9.442259788513184, "global_step": 217598, "epoch": 1295} {"train_loss": -10.818307876586914, "global_step": 217599, "epoch": 1295} {"train_loss": -10.199505805969238, "global_step": 217600, "epoch": 1295} {"train_loss": -10.743478775024414, "global_step": 217601, "epoch": 1295} {"train_loss": -10.917473793029785, "global_step": 217602, "epoch": 1295} {"train_loss": -10.689334869384766, "global_step": 217603, "epoch": 1295} {"train_loss": -10.914665222167969, "global_step": 217604, "epoch": 1295} {"train_loss": -11.141347885131836, "global_step": 217605, "epoch": 1295} {"train_loss": -11.118072509765625, "global_step": 217606, "epoch": 1295} {"train_loss": -10.870037078857422, "global_step": 217607, "epoch": 1295} {"train_loss": -11.268765449523926, "global_step": 217608, "epoch": 1295} {"train_loss": -11.084763526916504, "global_step": 217609, "epoch": 1295} {"train_loss": -11.48255443572998, "global_step": 217610, "epoch": 1295} {"train_loss": -11.301464080810547, "global_step": 217611, "epoch": 1295} {"train_loss": -11.359496116638184, "global_step": 217612, "epoch": 1295} {"train_loss": -11.314373016357422, "global_step": 217613, "epoch": 1295} {"train_loss": -11.192441940307617, "global_step": 217614, "epoch": 1295} {"train_loss": -11.426398277282715, "global_step": 217615, "epoch": 1295} {"train_loss": -11.371926307678223, "global_step": 217616, "epoch": 1295} {"train_loss": -11.452959060668945, "global_step": 217617, "epoch": 1295} {"train_loss": -11.535589218139648, "global_step": 217618, "epoch": 1295} {"train_loss": -11.385625839233398, "global_step": 217619, "epoch": 1295} {"train_loss": -11.214134216308594, "global_step": 217620, "epoch": 1295} {"train_loss": -11.31514835357666, "global_step": 217621, "epoch": 1295} {"train_loss": -11.363947868347168, "global_step": 217622, "epoch": 1295} {"train_loss": -11.249058723449707, "global_step": 217623, "epoch": 1295} {"train_loss": -11.645435333251953, "global_step": 217624, "epoch": 1295} {"train_loss": -10.895347595214844, "global_step": 217625, "epoch": 1295} {"train_loss": -11.44740104675293, "global_step": 217626, "epoch": 1295} {"train_loss": -11.023099899291992, "global_step": 217627, "epoch": 1295} {"train_loss": -11.39295768737793, "global_step": 217628, "epoch": 1295} {"train_loss": -11.479658126831055, "global_step": 217629, "epoch": 1295} {"train_loss": -10.966135025024414, "global_step": 217630, "epoch": 1295} {"train_loss": -11.421273231506348, "global_step": 217631, "epoch": 1295} {"train_loss": -11.554515838623047, "global_step": 217632, "epoch": 1295} {"train_loss": -11.56188678741455, "global_step": 217633, "epoch": 1295} {"train_loss": -11.57199478149414, "global_step": 217634, "epoch": 1295} {"train_loss": -11.506509780883789, "global_step": 217635, "epoch": 1295} {"train_loss": -11.452896118164062, "global_step": 217636, "epoch": 1295} {"train_loss": -11.675334930419922, "global_step": 217637, "epoch": 1295} {"train_loss": -11.488632202148438, "global_step": 217638, "epoch": 1295} {"train_loss": -11.708366394042969, "global_step": 217639, "epoch": 1295} {"train_loss": -11.62339973449707, "global_step": 217640, "epoch": 1295} {"train_loss": -11.628116607666016, "global_step": 217641, "epoch": 1295} {"train_loss": -11.51752758026123, "global_step": 217642, "epoch": 1295} {"train_loss": -11.779776573181152, "global_step": 217643, "epoch": 1295} {"train_loss": -11.492866516113281, "global_step": 217644, "epoch": 1295} {"train_loss": -11.797518730163574, "global_step": 217645, "epoch": 1295} {"train_loss": -11.664690017700195, "global_step": 217646, "epoch": 1295} {"train_loss": -11.778908729553223, "global_step": 217647, "epoch": 1295} {"train_loss": -11.841697692871094, "global_step": 217648, "epoch": 1295} {"train_loss": -11.730374336242676, "global_step": 217649, "epoch": 1295} {"train_loss": -11.494953155517578, "global_step": 217650, "epoch": 1295} {"train_loss": -11.662755966186523, "global_step": 217651, "epoch": 1295} {"train_loss": -11.751188278198242, "global_step": 217652, "epoch": 1295} {"train_loss": -11.671091079711914, "global_step": 217653, "epoch": 1295} {"train_loss": -11.605169296264648, "global_step": 217654, "epoch": 1295} {"train_loss": -11.73720645904541, "global_step": 217655, "epoch": 1295} {"train_loss": -11.712408065795898, "global_step": 217656, "epoch": 1295} {"train_loss": -11.725690841674805, "global_step": 217657, "epoch": 1295} {"train_loss": -11.588603019714355, "global_step": 217658, "epoch": 1295} {"train_loss": -11.86567497253418, "global_step": 217659, "epoch": 1295} {"train_loss": -11.738773345947266, "global_step": 217660, "epoch": 1295} {"train_loss": -11.653742790222168, "global_step": 217661, "epoch": 1295} {"train_loss": -11.940990447998047, "global_step": 217662, "epoch": 1295} {"train_loss": -11.645268440246582, "global_step": 217663, "epoch": 1295} {"train_loss": -11.773316383361816, "global_step": 217664, "epoch": 1295} {"train_loss": -11.687288284301758, "global_step": 217665, "epoch": 1295} {"train_loss": -11.713595390319824, "global_step": 217666, "epoch": 1295} {"train_loss": -11.94330883026123, "global_step": 217667, "epoch": 1295} {"train_loss": -11.55508041381836, "global_step": 217668, "epoch": 1295} {"train_loss": -11.847291946411133, "global_step": 217669, "epoch": 1295} {"train_loss": -11.742350578308105, "global_step": 217670, "epoch": 1295} {"train_loss": -12.024345397949219, "global_step": 217671, "epoch": 1295} {"train_loss": -11.85577392578125, "global_step": 217672, "epoch": 1295} {"train_loss": -11.89421272277832, "global_step": 217673, "epoch": 1295} {"train_loss": -11.380189895629883, "global_step": 217674, "epoch": 1295} {"train_loss": -11.924956321716309, "global_step": 217675, "epoch": 1295} {"train_loss": -11.687311172485352, "global_step": 217676, "epoch": 1295} {"train_loss": -11.478679656982422, "global_step": 217677, "epoch": 1295} {"train_loss": -11.719457626342773, "global_step": 217678, "epoch": 1295} {"train_loss": -11.861456871032715, "global_step": 217679, "epoch": 1295} {"train_loss": -11.28009033203125, "global_step": 217680, "epoch": 1295} {"train_loss": -11.788774490356445, "global_step": 217681, "epoch": 1295} {"train_loss": -11.327794075012207, "global_step": 217682, "epoch": 1295} {"train_loss": -11.472265243530273, "global_step": 217683, "epoch": 1295} {"train_loss": -11.477617263793945, "global_step": 217684, "epoch": 1295} {"train_loss": -11.374415397644043, "global_step": 217685, "epoch": 1295} {"train_loss": -10.158470153808594, "global_step": 217686, "epoch": 1295} {"train_loss": -11.800016403198242, "global_step": 217687, "epoch": 1295} {"train_loss": -10.710576057434082, "global_step": 217688, "epoch": 1295} {"train_loss": -10.863574981689453, "global_step": 217689, "epoch": 1295} {"train_loss": -11.146184921264648, "global_step": 217690, "epoch": 1295} {"train_loss": -11.07779312133789, "global_step": 217691, "epoch": 1295} {"train_loss": -10.856353759765625, "global_step": 217692, "epoch": 1295} {"train_loss": -11.488822937011719, "global_step": 217693, "epoch": 1295} {"train_loss": -10.857301712036133, "global_step": 217694, "epoch": 1295} {"train_loss": -11.50946044921875, "global_step": 217695, "epoch": 1295} {"train_loss": -11.032506942749023, "global_step": 217696, "epoch": 1295} {"train_loss": -10.98189926147461, "global_step": 217697, "epoch": 1295} {"train_loss": -11.181734085083008, "global_step": 217698, "epoch": 1295} {"train_loss": -11.162494659423828, "global_step": 217699, "epoch": 1295} {"train_loss": -11.04014778137207, "global_step": 217700, "epoch": 1295} {"train_loss": -11.661502838134766, "global_step": 217701, "epoch": 1295} {"train_loss": -11.439277648925781, "global_step": 217702, "epoch": 1295} {"train_loss": -11.722111701965332, "global_step": 217703, "epoch": 1295} {"train_loss": -11.232292175292969, "global_step": 217704, "epoch": 1295} {"train_loss": -11.487321853637695, "global_step": 217705, "epoch": 1295} {"train_loss": -11.590202331542969, "global_step": 217706, "epoch": 1295} {"train_loss": -11.295022964477539, "global_step": 217707, "epoch": 1295} {"train_loss": -11.469024658203125, "global_step": 217708, "epoch": 1295} {"train_loss": -11.31500244140625, "global_step": 217709, "epoch": 1295} {"train_loss": -11.319046020507812, "global_step": 217710, "epoch": 1295} {"train_loss": -11.344761848449707, "global_step": 217711, "epoch": 1295} {"train_loss": -11.70569896697998, "global_step": 217712, "epoch": 1295} {"train_loss": -11.273614883422852, "global_step": 217713, "epoch": 1295} {"train_loss": -11.709138870239258, "global_step": 217714, "epoch": 1295} {"train_loss": -11.531608581542969, "global_step": 217715, "epoch": 1295} {"train_loss": -11.787166595458984, "global_step": 217716, "epoch": 1295} {"train_loss": -11.521843910217285, "global_step": 217717, "epoch": 1295} {"train_loss": -11.580528259277344, "global_step": 217718, "epoch": 1295} {"train_loss": -11.338128089904785, "global_step": 217719, "epoch": 1295} {"train_loss": -11.73459243774414, "global_step": 217720, "epoch": 1295} {"train_loss": -11.590845108032227, "global_step": 217721, "epoch": 1295} {"train_loss": -11.562479972839355, "global_step": 217722, "epoch": 1295} {"train_loss": -11.632856369018555, "global_step": 217723, "epoch": 1295} {"train_loss": -11.446407318115234, "global_step": 217724, "epoch": 1295} {"train_loss": -12.06977653503418, "global_step": 217725, "epoch": 1295} {"train_loss": -11.462679862976074, "global_step": 217726, "epoch": 1295} {"train_loss": -11.283856675738381, "global_step": 217727, "epoch": 1295, "val_loss": 250406.671875, "train_action_mse_error": 1.424124002456665} {"train_loss": -11.37473201751709, "global_step": 217728, "epoch": 1296} {"train_loss": -11.700904846191406, "global_step": 217729, "epoch": 1296} {"train_loss": -11.448180198669434, "global_step": 217730, "epoch": 1296} {"train_loss": -11.360784530639648, "global_step": 217731, "epoch": 1296} {"train_loss": -11.537311553955078, "global_step": 217732, "epoch": 1296} {"train_loss": -11.24100112915039, "global_step": 217733, "epoch": 1296} {"train_loss": -11.807716369628906, "global_step": 217734, "epoch": 1296} {"train_loss": -11.314363479614258, "global_step": 217735, "epoch": 1296} {"train_loss": -11.521827697753906, "global_step": 217736, "epoch": 1296} {"train_loss": -11.602745056152344, "global_step": 217737, "epoch": 1296} {"train_loss": -11.819360733032227, "global_step": 217738, "epoch": 1296} {"train_loss": -11.98538589477539, "global_step": 217739, "epoch": 1296} {"train_loss": -11.689643859863281, "global_step": 217740, "epoch": 1296} {"train_loss": -11.894664764404297, "global_step": 217741, "epoch": 1296} {"train_loss": -11.637273788452148, "global_step": 217742, "epoch": 1296} {"train_loss": -12.009685516357422, "global_step": 217743, "epoch": 1296} {"train_loss": -11.72805118560791, "global_step": 217744, "epoch": 1296} {"train_loss": -11.704416275024414, "global_step": 217745, "epoch": 1296} {"train_loss": -11.795919418334961, "global_step": 217746, "epoch": 1296} {"train_loss": -11.74195671081543, "global_step": 217747, "epoch": 1296} {"train_loss": -11.745373725891113, "global_step": 217748, "epoch": 1296} {"train_loss": -11.862093925476074, "global_step": 217749, "epoch": 1296} {"train_loss": -12.059475898742676, "global_step": 217750, "epoch": 1296} {"train_loss": -11.522679328918457, "global_step": 217751, "epoch": 1296} {"train_loss": -11.858016967773438, "global_step": 217752, "epoch": 1296} {"train_loss": -11.77374267578125, "global_step": 217753, "epoch": 1296} {"train_loss": -11.641359329223633, "global_step": 217754, "epoch": 1296} {"train_loss": -12.058843612670898, "global_step": 217755, "epoch": 1296} {"train_loss": -11.819352149963379, "global_step": 217756, "epoch": 1296} {"train_loss": -11.861629486083984, "global_step": 217757, "epoch": 1296} {"train_loss": -12.062058448791504, "global_step": 217758, "epoch": 1296} {"train_loss": -11.7745943069458, "global_step": 217759, "epoch": 1296} {"train_loss": -11.945287704467773, "global_step": 217760, "epoch": 1296} {"train_loss": -11.998495101928711, "global_step": 217761, "epoch": 1296} {"train_loss": -11.928085327148438, "global_step": 217762, "epoch": 1296} {"train_loss": -11.763914108276367, "global_step": 217763, "epoch": 1296} {"train_loss": -11.931655883789062, "global_step": 217764, "epoch": 1296} {"train_loss": -12.016533851623535, "global_step": 217765, "epoch": 1296} {"train_loss": -11.737704277038574, "global_step": 217766, "epoch": 1296} {"train_loss": -11.357961654663086, "global_step": 217767, "epoch": 1296} {"train_loss": -10.441879272460938, "global_step": 217768, "epoch": 1296} {"train_loss": -11.225244522094727, "global_step": 217769, "epoch": 1296} {"train_loss": -11.046749114990234, "global_step": 217770, "epoch": 1296} {"train_loss": -9.902700424194336, "global_step": 217771, "epoch": 1296} {"train_loss": -9.823115348815918, "global_step": 217772, "epoch": 1296} {"train_loss": -11.506722450256348, "global_step": 217773, "epoch": 1296} {"train_loss": -7.776485443115234, "global_step": 217774, "epoch": 1296} {"train_loss": -10.887289047241211, "global_step": 217775, "epoch": 1296} {"train_loss": -10.799242973327637, "global_step": 217776, "epoch": 1296} {"train_loss": -9.023103713989258, "global_step": 217777, "epoch": 1296} {"train_loss": -10.295356750488281, "global_step": 217778, "epoch": 1296} {"train_loss": -7.291192531585693, "global_step": 217779, "epoch": 1296} {"train_loss": -7.4383955001831055, "global_step": 217780, "epoch": 1296} {"train_loss": -9.898059844970703, "global_step": 217781, "epoch": 1296} {"train_loss": -8.710641860961914, "global_step": 217782, "epoch": 1296} {"train_loss": -7.53643798828125, "global_step": 217783, "epoch": 1296} {"train_loss": -7.440853595733643, "global_step": 217784, "epoch": 1296} {"train_loss": -7.746965408325195, "global_step": 217785, "epoch": 1296} {"train_loss": -8.506630897521973, "global_step": 217786, "epoch": 1296} {"train_loss": -9.243568420410156, "global_step": 217787, "epoch": 1296} {"train_loss": -9.942328453063965, "global_step": 217788, "epoch": 1296} {"train_loss": -8.392244338989258, "global_step": 217789, "epoch": 1296} {"train_loss": -9.03679084777832, "global_step": 217790, "epoch": 1296} {"train_loss": -9.075357437133789, "global_step": 217791, "epoch": 1296} {"train_loss": -10.273845672607422, "global_step": 217792, "epoch": 1296} {"train_loss": -9.10240364074707, "global_step": 217793, "epoch": 1296} {"train_loss": -9.518247604370117, "global_step": 217794, "epoch": 1296} {"train_loss": -9.796476364135742, "global_step": 217795, "epoch": 1296} {"train_loss": -9.226083755493164, "global_step": 217796, "epoch": 1296} {"train_loss": -9.96812629699707, "global_step": 217797, "epoch": 1296} {"train_loss": -9.554584503173828, "global_step": 217798, "epoch": 1296} {"train_loss": -9.125197410583496, "global_step": 217799, "epoch": 1296} {"train_loss": -9.976221084594727, "global_step": 217800, "epoch": 1296} {"train_loss": -10.140475273132324, "global_step": 217801, "epoch": 1296} {"train_loss": -10.297964096069336, "global_step": 217802, "epoch": 1296} {"train_loss": -9.610635757446289, "global_step": 217803, "epoch": 1296} {"train_loss": -10.634037971496582, "global_step": 217804, "epoch": 1296} {"train_loss": -10.504161834716797, "global_step": 217805, "epoch": 1296} {"train_loss": -10.68493938446045, "global_step": 217806, "epoch": 1296} {"train_loss": -10.884273529052734, "global_step": 217807, "epoch": 1296} {"train_loss": -10.840496063232422, "global_step": 217808, "epoch": 1296} {"train_loss": -10.885255813598633, "global_step": 217809, "epoch": 1296} {"train_loss": -10.882711410522461, "global_step": 217810, "epoch": 1296} {"train_loss": -10.863879203796387, "global_step": 217811, "epoch": 1296} {"train_loss": -10.923563957214355, "global_step": 217812, "epoch": 1296} {"train_loss": -10.618600845336914, "global_step": 217813, "epoch": 1296} {"train_loss": -11.007153511047363, "global_step": 217814, "epoch": 1296} {"train_loss": -10.96401596069336, "global_step": 217815, "epoch": 1296} {"train_loss": -11.185432434082031, "global_step": 217816, "epoch": 1296} {"train_loss": -10.746566772460938, "global_step": 217817, "epoch": 1296} {"train_loss": -11.083440780639648, "global_step": 217818, "epoch": 1296} {"train_loss": -11.036742210388184, "global_step": 217819, "epoch": 1296} {"train_loss": -11.145302772521973, "global_step": 217820, "epoch": 1296} {"train_loss": -11.010862350463867, "global_step": 217821, "epoch": 1296} {"train_loss": -11.314382553100586, "global_step": 217822, "epoch": 1296} {"train_loss": -11.295381546020508, "global_step": 217823, "epoch": 1296} {"train_loss": -11.31800651550293, "global_step": 217824, "epoch": 1296} {"train_loss": -11.275398254394531, "global_step": 217825, "epoch": 1296} {"train_loss": -11.269291877746582, "global_step": 217826, "epoch": 1296} {"train_loss": -10.989034652709961, "global_step": 217827, "epoch": 1296} {"train_loss": -11.291282653808594, "global_step": 217828, "epoch": 1296} {"train_loss": -11.32650089263916, "global_step": 217829, "epoch": 1296} {"train_loss": -11.299225807189941, "global_step": 217830, "epoch": 1296} {"train_loss": -11.273447036743164, "global_step": 217831, "epoch": 1296} {"train_loss": -11.132318496704102, "global_step": 217832, "epoch": 1296} {"train_loss": -11.141962051391602, "global_step": 217833, "epoch": 1296} {"train_loss": -11.223062515258789, "global_step": 217834, "epoch": 1296} {"train_loss": -11.451515197753906, "global_step": 217835, "epoch": 1296} {"train_loss": -11.30078125, "global_step": 217836, "epoch": 1296} {"train_loss": -11.535646438598633, "global_step": 217837, "epoch": 1296} {"train_loss": -11.34319019317627, "global_step": 217838, "epoch": 1296} {"train_loss": -11.625307083129883, "global_step": 217839, "epoch": 1296} {"train_loss": -11.456570625305176, "global_step": 217840, "epoch": 1296} {"train_loss": -11.625713348388672, "global_step": 217841, "epoch": 1296} {"train_loss": -11.424169540405273, "global_step": 217842, "epoch": 1296} {"train_loss": -11.494083404541016, "global_step": 217843, "epoch": 1296} {"train_loss": -11.418350219726562, "global_step": 217844, "epoch": 1296} {"train_loss": -11.565354347229004, "global_step": 217845, "epoch": 1296} {"train_loss": -11.6575927734375, "global_step": 217846, "epoch": 1296} {"train_loss": -11.546186447143555, "global_step": 217847, "epoch": 1296} {"train_loss": -11.610437393188477, "global_step": 217848, "epoch": 1296} {"train_loss": -11.564023971557617, "global_step": 217849, "epoch": 1296} {"train_loss": -11.642289161682129, "global_step": 217850, "epoch": 1296} {"train_loss": -11.702348709106445, "global_step": 217851, "epoch": 1296} {"train_loss": -11.63968276977539, "global_step": 217852, "epoch": 1296} {"train_loss": -11.677342414855957, "global_step": 217853, "epoch": 1296} {"train_loss": -11.680031776428223, "global_step": 217854, "epoch": 1296} {"train_loss": -11.743940353393555, "global_step": 217855, "epoch": 1296} {"train_loss": -11.760774612426758, "global_step": 217856, "epoch": 1296} {"train_loss": -11.623283386230469, "global_step": 217857, "epoch": 1296} {"train_loss": -11.66211986541748, "global_step": 217858, "epoch": 1296} {"train_loss": -11.729933738708496, "global_step": 217859, "epoch": 1296} {"train_loss": -11.754947662353516, "global_step": 217860, "epoch": 1296} {"train_loss": -11.899955749511719, "global_step": 217861, "epoch": 1296} {"train_loss": -11.700550079345703, "global_step": 217862, "epoch": 1296} {"train_loss": -11.896880149841309, "global_step": 217863, "epoch": 1296} {"train_loss": -11.81153392791748, "global_step": 217864, "epoch": 1296} {"train_loss": -11.961689949035645, "global_step": 217865, "epoch": 1296} {"train_loss": -11.821810722351074, "global_step": 217866, "epoch": 1296} {"train_loss": -11.823264122009277, "global_step": 217867, "epoch": 1296} {"train_loss": -11.937406539916992, "global_step": 217868, "epoch": 1296} {"train_loss": -11.898606300354004, "global_step": 217869, "epoch": 1296} {"train_loss": -11.880166053771973, "global_step": 217870, "epoch": 1296} {"train_loss": -12.038837432861328, "global_step": 217871, "epoch": 1296} {"train_loss": -11.724618911743164, "global_step": 217872, "epoch": 1296} {"train_loss": -11.430868148803711, "global_step": 217873, "epoch": 1296} {"train_loss": -11.277314186096191, "global_step": 217874, "epoch": 1296} {"train_loss": -11.707352638244629, "global_step": 217875, "epoch": 1296} {"train_loss": -11.853711128234863, "global_step": 217876, "epoch": 1296} {"train_loss": -11.345137596130371, "global_step": 217877, "epoch": 1296} {"train_loss": -11.40015983581543, "global_step": 217878, "epoch": 1296} {"train_loss": -11.748015403747559, "global_step": 217879, "epoch": 1296} {"train_loss": -11.451881408691406, "global_step": 217880, "epoch": 1296} {"train_loss": -11.64031982421875, "global_step": 217881, "epoch": 1296} {"train_loss": -11.586626052856445, "global_step": 217882, "epoch": 1296} {"train_loss": -11.350692749023438, "global_step": 217883, "epoch": 1296} {"train_loss": -11.190973281860352, "global_step": 217884, "epoch": 1296} {"train_loss": -10.994980812072754, "global_step": 217885, "epoch": 1296} {"train_loss": -11.6399507522583, "global_step": 217886, "epoch": 1296} {"train_loss": -11.482683181762695, "global_step": 217887, "epoch": 1296} {"train_loss": -11.395874977111816, "global_step": 217888, "epoch": 1296} {"train_loss": -10.044377326965332, "global_step": 217889, "epoch": 1296} {"train_loss": -10.41714096069336, "global_step": 217890, "epoch": 1296} {"train_loss": -11.010884284973145, "global_step": 217891, "epoch": 1296} {"train_loss": -11.809272766113281, "global_step": 217892, "epoch": 1296} {"train_loss": -11.47542953491211, "global_step": 217893, "epoch": 1296} {"train_loss": -10.799979209899902, "global_step": 217894, "epoch": 1296} {"train_loss": -11.04173897561573, "global_step": 217895, "epoch": 1296, "val_loss": 250066.59375} {"train_loss": -11.007938385009766, "global_step": 217896, "epoch": 1297} {"train_loss": -10.813074111938477, "global_step": 217897, "epoch": 1297} {"train_loss": -10.83554458618164, "global_step": 217898, "epoch": 1297} {"train_loss": -9.556551933288574, "global_step": 217899, "epoch": 1297} {"train_loss": -10.291112899780273, "global_step": 217900, "epoch": 1297} {"train_loss": -8.84048843383789, "global_step": 217901, "epoch": 1297} {"train_loss": -10.800374031066895, "global_step": 217902, "epoch": 1297} {"train_loss": -9.69875717163086, "global_step": 217903, "epoch": 1297} {"train_loss": -9.734107971191406, "global_step": 217904, "epoch": 1297} {"train_loss": -8.143467903137207, "global_step": 217905, "epoch": 1297} {"train_loss": -10.518632888793945, "global_step": 217906, "epoch": 1297} {"train_loss": -9.519866943359375, "global_step": 217907, "epoch": 1297} {"train_loss": -10.349210739135742, "global_step": 217908, "epoch": 1297} {"train_loss": -10.827136039733887, "global_step": 217909, "epoch": 1297} {"train_loss": -10.118550300598145, "global_step": 217910, "epoch": 1297} {"train_loss": -11.043960571289062, "global_step": 217911, "epoch": 1297} {"train_loss": -10.389947891235352, "global_step": 217912, "epoch": 1297} {"train_loss": -10.230094909667969, "global_step": 217913, "epoch": 1297} {"train_loss": -9.603063583374023, "global_step": 217914, "epoch": 1297} {"train_loss": -9.989339828491211, "global_step": 217915, "epoch": 1297} {"train_loss": -10.08639907836914, "global_step": 217916, "epoch": 1297} {"train_loss": -9.984110832214355, "global_step": 217917, "epoch": 1297} {"train_loss": -10.168851852416992, "global_step": 217918, "epoch": 1297} {"train_loss": -10.640289306640625, "global_step": 217919, "epoch": 1297} {"train_loss": -9.471269607543945, "global_step": 217920, "epoch": 1297} {"train_loss": -11.290687561035156, "global_step": 217921, "epoch": 1297} {"train_loss": -10.411752700805664, "global_step": 217922, "epoch": 1297} {"train_loss": -11.249261856079102, "global_step": 217923, "epoch": 1297} {"train_loss": -10.98583698272705, "global_step": 217924, "epoch": 1297} {"train_loss": -10.901996612548828, "global_step": 217925, "epoch": 1297} {"train_loss": -11.005317687988281, "global_step": 217926, "epoch": 1297} {"train_loss": -10.935722351074219, "global_step": 217927, "epoch": 1297} {"train_loss": -11.230114936828613, "global_step": 217928, "epoch": 1297} {"train_loss": -11.179706573486328, "global_step": 217929, "epoch": 1297} {"train_loss": -11.377349853515625, "global_step": 217930, "epoch": 1297} {"train_loss": -11.34897232055664, "global_step": 217931, "epoch": 1297} {"train_loss": -11.296586990356445, "global_step": 217932, "epoch": 1297} {"train_loss": -11.335552215576172, "global_step": 217933, "epoch": 1297} {"train_loss": -11.235885620117188, "global_step": 217934, "epoch": 1297} {"train_loss": -11.294172286987305, "global_step": 217935, "epoch": 1297} {"train_loss": -11.365854263305664, "global_step": 217936, "epoch": 1297} {"train_loss": -11.489267349243164, "global_step": 217937, "epoch": 1297} {"train_loss": -11.300670623779297, "global_step": 217938, "epoch": 1297} {"train_loss": -11.246526718139648, "global_step": 217939, "epoch": 1297} {"train_loss": -11.26581859588623, "global_step": 217940, "epoch": 1297} {"train_loss": -11.556640625, "global_step": 217941, "epoch": 1297} {"train_loss": -11.446431159973145, "global_step": 217942, "epoch": 1297} {"train_loss": -11.498226165771484, "global_step": 217943, "epoch": 1297} {"train_loss": -11.70653247833252, "global_step": 217944, "epoch": 1297} {"train_loss": -11.553566932678223, "global_step": 217945, "epoch": 1297} {"train_loss": -11.49953556060791, "global_step": 217946, "epoch": 1297} {"train_loss": -11.686124801635742, "global_step": 217947, "epoch": 1297} {"train_loss": -11.736613273620605, "global_step": 217948, "epoch": 1297} {"train_loss": -11.531891822814941, "global_step": 217949, "epoch": 1297} {"train_loss": -11.506397247314453, "global_step": 217950, "epoch": 1297} {"train_loss": -11.428592681884766, "global_step": 217951, "epoch": 1297} {"train_loss": -11.566292762756348, "global_step": 217952, "epoch": 1297} {"train_loss": -11.74067211151123, "global_step": 217953, "epoch": 1297} {"train_loss": -11.585859298706055, "global_step": 217954, "epoch": 1297} {"train_loss": -11.706293106079102, "global_step": 217955, "epoch": 1297} {"train_loss": -11.684391021728516, "global_step": 217956, "epoch": 1297} {"train_loss": -11.52964973449707, "global_step": 217957, "epoch": 1297} {"train_loss": -11.82577896118164, "global_step": 217958, "epoch": 1297} {"train_loss": -11.650076866149902, "global_step": 217959, "epoch": 1297} {"train_loss": -11.827880859375, "global_step": 217960, "epoch": 1297} {"train_loss": -11.736156463623047, "global_step": 217961, "epoch": 1297} {"train_loss": -11.811698913574219, "global_step": 217962, "epoch": 1297} {"train_loss": -11.837202072143555, "global_step": 217963, "epoch": 1297} {"train_loss": -11.642083168029785, "global_step": 217964, "epoch": 1297} {"train_loss": -11.717305183410645, "global_step": 217965, "epoch": 1297} {"train_loss": -11.631351470947266, "global_step": 217966, "epoch": 1297} {"train_loss": -11.822103500366211, "global_step": 217967, "epoch": 1297} {"train_loss": -11.998401641845703, "global_step": 217968, "epoch": 1297} {"train_loss": -11.447242736816406, "global_step": 217969, "epoch": 1297} {"train_loss": -12.068446159362793, "global_step": 217970, "epoch": 1297} {"train_loss": -11.664510726928711, "global_step": 217971, "epoch": 1297} {"train_loss": -11.925390243530273, "global_step": 217972, "epoch": 1297} {"train_loss": -11.821874618530273, "global_step": 217973, "epoch": 1297} {"train_loss": -11.753144264221191, "global_step": 217974, "epoch": 1297} {"train_loss": -11.827327728271484, "global_step": 217975, "epoch": 1297} {"train_loss": -11.806548118591309, "global_step": 217976, "epoch": 1297} {"train_loss": -11.821914672851562, "global_step": 217977, "epoch": 1297} {"train_loss": -11.985067367553711, "global_step": 217978, "epoch": 1297} {"train_loss": -11.645598411560059, "global_step": 217979, "epoch": 1297} {"train_loss": -11.609073638916016, "global_step": 217980, "epoch": 1297} {"train_loss": -11.819674491882324, "global_step": 217981, "epoch": 1297} {"train_loss": -12.03028392791748, "global_step": 217982, "epoch": 1297} {"train_loss": -11.72985553741455, "global_step": 217983, "epoch": 1297} {"train_loss": -11.715371131896973, "global_step": 217984, "epoch": 1297} {"train_loss": -11.788434982299805, "global_step": 217985, "epoch": 1297} {"train_loss": -11.969615936279297, "global_step": 217986, "epoch": 1297} {"train_loss": -11.704229354858398, "global_step": 217987, "epoch": 1297} {"train_loss": -11.500975608825684, "global_step": 217988, "epoch": 1297} {"train_loss": -11.646917343139648, "global_step": 217989, "epoch": 1297} {"train_loss": -11.67204475402832, "global_step": 217990, "epoch": 1297} {"train_loss": -11.868461608886719, "global_step": 217991, "epoch": 1297} {"train_loss": -11.696304321289062, "global_step": 217992, "epoch": 1297} {"train_loss": -11.781201362609863, "global_step": 217993, "epoch": 1297} {"train_loss": -11.477798461914062, "global_step": 217994, "epoch": 1297} {"train_loss": -12.025328636169434, "global_step": 217995, "epoch": 1297} {"train_loss": -11.915000915527344, "global_step": 217996, "epoch": 1297} {"train_loss": -11.96226692199707, "global_step": 217997, "epoch": 1297} {"train_loss": -11.567438125610352, "global_step": 217998, "epoch": 1297} {"train_loss": -11.585182189941406, "global_step": 217999, "epoch": 1297} {"train_loss": -11.77145004272461, "global_step": 218000, "epoch": 1297} {"train_loss": -11.67210578918457, "global_step": 218001, "epoch": 1297} {"train_loss": -11.514920234680176, "global_step": 218002, "epoch": 1297} {"train_loss": -11.828125, "global_step": 218003, "epoch": 1297} {"train_loss": -11.621831893920898, "global_step": 218004, "epoch": 1297} {"train_loss": -11.553291320800781, "global_step": 218005, "epoch": 1297} {"train_loss": -11.062491416931152, "global_step": 218006, "epoch": 1297} {"train_loss": -11.871902465820312, "global_step": 218007, "epoch": 1297} {"train_loss": -10.787083625793457, "global_step": 218008, "epoch": 1297} {"train_loss": -10.940805435180664, "global_step": 218009, "epoch": 1297} {"train_loss": -10.480920791625977, "global_step": 218010, "epoch": 1297} {"train_loss": -11.334335327148438, "global_step": 218011, "epoch": 1297} {"train_loss": -11.139799118041992, "global_step": 218012, "epoch": 1297} {"train_loss": -11.07374382019043, "global_step": 218013, "epoch": 1297} {"train_loss": -11.2470121383667, "global_step": 218014, "epoch": 1297} {"train_loss": -11.627206802368164, "global_step": 218015, "epoch": 1297} {"train_loss": -11.222768783569336, "global_step": 218016, "epoch": 1297} {"train_loss": -11.166139602661133, "global_step": 218017, "epoch": 1297} {"train_loss": -11.461343765258789, "global_step": 218018, "epoch": 1297} {"train_loss": -11.587108612060547, "global_step": 218019, "epoch": 1297} {"train_loss": -11.667415618896484, "global_step": 218020, "epoch": 1297} {"train_loss": -11.258630752563477, "global_step": 218021, "epoch": 1297} {"train_loss": -11.459723472595215, "global_step": 218022, "epoch": 1297} {"train_loss": -11.204766273498535, "global_step": 218023, "epoch": 1297} {"train_loss": -11.406866073608398, "global_step": 218024, "epoch": 1297} {"train_loss": -11.408336639404297, "global_step": 218025, "epoch": 1297} {"train_loss": -11.60666275024414, "global_step": 218026, "epoch": 1297} {"train_loss": -11.75655460357666, "global_step": 218027, "epoch": 1297} {"train_loss": -11.497159957885742, "global_step": 218028, "epoch": 1297} {"train_loss": -11.700965881347656, "global_step": 218029, "epoch": 1297} {"train_loss": -11.547189712524414, "global_step": 218030, "epoch": 1297} {"train_loss": -11.616745948791504, "global_step": 218031, "epoch": 1297} {"train_loss": -11.7052001953125, "global_step": 218032, "epoch": 1297} {"train_loss": -11.300361633300781, "global_step": 218033, "epoch": 1297} {"train_loss": -11.568172454833984, "global_step": 218034, "epoch": 1297} {"train_loss": -11.779889106750488, "global_step": 218035, "epoch": 1297} {"train_loss": -11.830911636352539, "global_step": 218036, "epoch": 1297} {"train_loss": -11.494812965393066, "global_step": 218037, "epoch": 1297} {"train_loss": -11.59052562713623, "global_step": 218038, "epoch": 1297} {"train_loss": -11.825716972351074, "global_step": 218039, "epoch": 1297} {"train_loss": -11.406429290771484, "global_step": 218040, "epoch": 1297} {"train_loss": -11.609676361083984, "global_step": 218041, "epoch": 1297} {"train_loss": -11.68551254272461, "global_step": 218042, "epoch": 1297} {"train_loss": -11.401416778564453, "global_step": 218043, "epoch": 1297} {"train_loss": -11.950754165649414, "global_step": 218044, "epoch": 1297} {"train_loss": -11.580137252807617, "global_step": 218045, "epoch": 1297} {"train_loss": -11.682855606079102, "global_step": 218046, "epoch": 1297} {"train_loss": -11.98762321472168, "global_step": 218047, "epoch": 1297} {"train_loss": -11.792341232299805, "global_step": 218048, "epoch": 1297} {"train_loss": -11.364933967590332, "global_step": 218049, "epoch": 1297} {"train_loss": -11.789901733398438, "global_step": 218050, "epoch": 1297} {"train_loss": -11.313957214355469, "global_step": 218051, "epoch": 1297} {"train_loss": -11.143259048461914, "global_step": 218052, "epoch": 1297} {"train_loss": -11.427389144897461, "global_step": 218053, "epoch": 1297} {"train_loss": -11.304186820983887, "global_step": 218054, "epoch": 1297} {"train_loss": -11.605281829833984, "global_step": 218055, "epoch": 1297} {"train_loss": -11.561941146850586, "global_step": 218056, "epoch": 1297} {"train_loss": -11.66112995147705, "global_step": 218057, "epoch": 1297} {"train_loss": -11.644538879394531, "global_step": 218058, "epoch": 1297} {"train_loss": -11.296845436096191, "global_step": 218059, "epoch": 1297} {"train_loss": -11.36690902709961, "global_step": 218060, "epoch": 1297} {"train_loss": -11.552413940429688, "global_step": 218061, "epoch": 1297} {"train_loss": -11.582731246948242, "global_step": 218062, "epoch": 1297} {"train_loss": -11.327493713015603, "global_step": 218063, "epoch": 1297, "val_loss": 256957.59375} {"train_loss": -11.140803337097168, "global_step": 218064, "epoch": 1298} {"train_loss": -11.0113525390625, "global_step": 218065, "epoch": 1298} {"train_loss": -11.36506462097168, "global_step": 218066, "epoch": 1298} {"train_loss": -10.265265464782715, "global_step": 218067, "epoch": 1298} {"train_loss": -10.640701293945312, "global_step": 218068, "epoch": 1298} {"train_loss": -11.674652099609375, "global_step": 218069, "epoch": 1298} {"train_loss": -11.071402549743652, "global_step": 218070, "epoch": 1298} {"train_loss": -10.630067825317383, "global_step": 218071, "epoch": 1298} {"train_loss": -11.327695846557617, "global_step": 218072, "epoch": 1298} {"train_loss": -11.792827606201172, "global_step": 218073, "epoch": 1298} {"train_loss": -11.550970077514648, "global_step": 218074, "epoch": 1298} {"train_loss": -11.684561729431152, "global_step": 218075, "epoch": 1298} {"train_loss": -11.786787033081055, "global_step": 218076, "epoch": 1298} {"train_loss": -11.725942611694336, "global_step": 218077, "epoch": 1298} {"train_loss": -11.472270011901855, "global_step": 218078, "epoch": 1298} {"train_loss": -11.581404685974121, "global_step": 218079, "epoch": 1298} {"train_loss": -11.520608901977539, "global_step": 218080, "epoch": 1298} {"train_loss": -11.73228931427002, "global_step": 218081, "epoch": 1298} {"train_loss": -11.623428344726562, "global_step": 218082, "epoch": 1298} {"train_loss": -11.623016357421875, "global_step": 218083, "epoch": 1298} {"train_loss": -11.729907989501953, "global_step": 218084, "epoch": 1298} {"train_loss": -11.233799934387207, "global_step": 218085, "epoch": 1298} {"train_loss": -11.544694900512695, "global_step": 218086, "epoch": 1298} {"train_loss": -11.544790267944336, "global_step": 218087, "epoch": 1298} {"train_loss": -11.60599136352539, "global_step": 218088, "epoch": 1298} {"train_loss": -11.724388122558594, "global_step": 218089, "epoch": 1298} {"train_loss": -11.637094497680664, "global_step": 218090, "epoch": 1298} {"train_loss": -11.41086196899414, "global_step": 218091, "epoch": 1298} {"train_loss": -11.737305641174316, "global_step": 218092, "epoch": 1298} {"train_loss": -11.5185546875, "global_step": 218093, "epoch": 1298} {"train_loss": -11.819075584411621, "global_step": 218094, "epoch": 1298} {"train_loss": -11.635255813598633, "global_step": 218095, "epoch": 1298} {"train_loss": -11.393765449523926, "global_step": 218096, "epoch": 1298} {"train_loss": -11.65227222442627, "global_step": 218097, "epoch": 1298} {"train_loss": -11.918716430664062, "global_step": 218098, "epoch": 1298} {"train_loss": -11.746475219726562, "global_step": 218099, "epoch": 1298} {"train_loss": -11.589282035827637, "global_step": 218100, "epoch": 1298} {"train_loss": -11.770696640014648, "global_step": 218101, "epoch": 1298} {"train_loss": -11.55486011505127, "global_step": 218102, "epoch": 1298} {"train_loss": -11.45413589477539, "global_step": 218103, "epoch": 1298} {"train_loss": -11.19605827331543, "global_step": 218104, "epoch": 1298} {"train_loss": -11.530974388122559, "global_step": 218105, "epoch": 1298} {"train_loss": -10.668578147888184, "global_step": 218106, "epoch": 1298} {"train_loss": -11.635339736938477, "global_step": 218107, "epoch": 1298} {"train_loss": -11.474931716918945, "global_step": 218108, "epoch": 1298} {"train_loss": -11.140668869018555, "global_step": 218109, "epoch": 1298} {"train_loss": -11.488698959350586, "global_step": 218110, "epoch": 1298} {"train_loss": -11.851036071777344, "global_step": 218111, "epoch": 1298} {"train_loss": -11.87006664276123, "global_step": 218112, "epoch": 1298} {"train_loss": -11.79234504699707, "global_step": 218113, "epoch": 1298} {"train_loss": -11.664735794067383, "global_step": 218114, "epoch": 1298} {"train_loss": -11.852899551391602, "global_step": 218115, "epoch": 1298} {"train_loss": -11.51820182800293, "global_step": 218116, "epoch": 1298} {"train_loss": -11.118997573852539, "global_step": 218117, "epoch": 1298} {"train_loss": -11.491621017456055, "global_step": 218118, "epoch": 1298} {"train_loss": -10.820358276367188, "global_step": 218119, "epoch": 1298} {"train_loss": -9.826156616210938, "global_step": 218120, "epoch": 1298} {"train_loss": -11.531569480895996, "global_step": 218121, "epoch": 1298} {"train_loss": -11.172761917114258, "global_step": 218122, "epoch": 1298} {"train_loss": -10.664052963256836, "global_step": 218123, "epoch": 1298} {"train_loss": -11.497063636779785, "global_step": 218124, "epoch": 1298} {"train_loss": -9.780330657958984, "global_step": 218125, "epoch": 1298} {"train_loss": -11.617715835571289, "global_step": 218126, "epoch": 1298} {"train_loss": -10.066962242126465, "global_step": 218127, "epoch": 1298} {"train_loss": -10.912862777709961, "global_step": 218128, "epoch": 1298} {"train_loss": -10.613153457641602, "global_step": 218129, "epoch": 1298} {"train_loss": -10.96169376373291, "global_step": 218130, "epoch": 1298} {"train_loss": -11.213022232055664, "global_step": 218131, "epoch": 1298} {"train_loss": -10.846717834472656, "global_step": 218132, "epoch": 1298} {"train_loss": -11.32319450378418, "global_step": 218133, "epoch": 1298} {"train_loss": -10.414079666137695, "global_step": 218134, "epoch": 1298} {"train_loss": -11.227823257446289, "global_step": 218135, "epoch": 1298} {"train_loss": -11.132282257080078, "global_step": 218136, "epoch": 1298} {"train_loss": -11.487165451049805, "global_step": 218137, "epoch": 1298} {"train_loss": -11.229031562805176, "global_step": 218138, "epoch": 1298} {"train_loss": -11.331720352172852, "global_step": 218139, "epoch": 1298} {"train_loss": -11.382962226867676, "global_step": 218140, "epoch": 1298} {"train_loss": -11.517346382141113, "global_step": 218141, "epoch": 1298} {"train_loss": -11.293939590454102, "global_step": 218142, "epoch": 1298} {"train_loss": -11.532143592834473, "global_step": 218143, "epoch": 1298} {"train_loss": -11.405492782592773, "global_step": 218144, "epoch": 1298} {"train_loss": -11.610301971435547, "global_step": 218145, "epoch": 1298} {"train_loss": -11.527950286865234, "global_step": 218146, "epoch": 1298} {"train_loss": -11.442863464355469, "global_step": 218147, "epoch": 1298} {"train_loss": -11.375402450561523, "global_step": 218148, "epoch": 1298} {"train_loss": -11.47342300415039, "global_step": 218149, "epoch": 1298} {"train_loss": -11.790608406066895, "global_step": 218150, "epoch": 1298} {"train_loss": -11.250288009643555, "global_step": 218151, "epoch": 1298} {"train_loss": -11.744863510131836, "global_step": 218152, "epoch": 1298} {"train_loss": -11.64414119720459, "global_step": 218153, "epoch": 1298} {"train_loss": -11.64655590057373, "global_step": 218154, "epoch": 1298} {"train_loss": -11.539164543151855, "global_step": 218155, "epoch": 1298} {"train_loss": -11.254902839660645, "global_step": 218156, "epoch": 1298} {"train_loss": -11.698020935058594, "global_step": 218157, "epoch": 1298} {"train_loss": -11.546358108520508, "global_step": 218158, "epoch": 1298} {"train_loss": -11.286345481872559, "global_step": 218159, "epoch": 1298} {"train_loss": -11.698820114135742, "global_step": 218160, "epoch": 1298} {"train_loss": -11.392851829528809, "global_step": 218161, "epoch": 1298} {"train_loss": -11.57908821105957, "global_step": 218162, "epoch": 1298} {"train_loss": -11.659797668457031, "global_step": 218163, "epoch": 1298} {"train_loss": -11.396512985229492, "global_step": 218164, "epoch": 1298} {"train_loss": -11.501839637756348, "global_step": 218165, "epoch": 1298} {"train_loss": -11.200483322143555, "global_step": 218166, "epoch": 1298} {"train_loss": -10.880985260009766, "global_step": 218167, "epoch": 1298} {"train_loss": -11.135473251342773, "global_step": 218168, "epoch": 1298} {"train_loss": -11.719268798828125, "global_step": 218169, "epoch": 1298} {"train_loss": -11.41429328918457, "global_step": 218170, "epoch": 1298} {"train_loss": -11.923404693603516, "global_step": 218171, "epoch": 1298} {"train_loss": -11.557823181152344, "global_step": 218172, "epoch": 1298} {"train_loss": -11.459261894226074, "global_step": 218173, "epoch": 1298} {"train_loss": -11.72653579711914, "global_step": 218174, "epoch": 1298} {"train_loss": -11.594660758972168, "global_step": 218175, "epoch": 1298} {"train_loss": -11.484700202941895, "global_step": 218176, "epoch": 1298} {"train_loss": -11.649698257446289, "global_step": 218177, "epoch": 1298} {"train_loss": -11.046972274780273, "global_step": 218178, "epoch": 1298} {"train_loss": -11.567769050598145, "global_step": 218179, "epoch": 1298} {"train_loss": -10.677460670471191, "global_step": 218180, "epoch": 1298} {"train_loss": -10.66169548034668, "global_step": 218181, "epoch": 1298} {"train_loss": -10.854771614074707, "global_step": 218182, "epoch": 1298} {"train_loss": -10.670166015625, "global_step": 218183, "epoch": 1298} {"train_loss": -11.13211441040039, "global_step": 218184, "epoch": 1298} {"train_loss": -11.199692726135254, "global_step": 218185, "epoch": 1298} {"train_loss": -11.001006126403809, "global_step": 218186, "epoch": 1298} {"train_loss": -11.246753692626953, "global_step": 218187, "epoch": 1298} {"train_loss": -10.746874809265137, "global_step": 218188, "epoch": 1298} {"train_loss": -11.186460494995117, "global_step": 218189, "epoch": 1298} {"train_loss": -10.604220390319824, "global_step": 218190, "epoch": 1298} {"train_loss": -10.96786880493164, "global_step": 218191, "epoch": 1298} {"train_loss": -11.20444107055664, "global_step": 218192, "epoch": 1298} {"train_loss": -10.53757381439209, "global_step": 218193, "epoch": 1298} {"train_loss": -11.446266174316406, "global_step": 218194, "epoch": 1298} {"train_loss": -11.277113914489746, "global_step": 218195, "epoch": 1298} {"train_loss": -11.18000316619873, "global_step": 218196, "epoch": 1298} {"train_loss": -11.325004577636719, "global_step": 218197, "epoch": 1298} {"train_loss": -10.87363052368164, "global_step": 218198, "epoch": 1298} {"train_loss": -11.312920570373535, "global_step": 218199, "epoch": 1298} {"train_loss": -11.488289833068848, "global_step": 218200, "epoch": 1298} {"train_loss": -11.64687728881836, "global_step": 218201, "epoch": 1298} {"train_loss": -11.635248184204102, "global_step": 218202, "epoch": 1298} {"train_loss": -11.619560241699219, "global_step": 218203, "epoch": 1298} {"train_loss": -11.570594787597656, "global_step": 218204, "epoch": 1298} {"train_loss": -11.712930679321289, "global_step": 218205, "epoch": 1298} {"train_loss": -11.672080039978027, "global_step": 218206, "epoch": 1298} {"train_loss": -11.596920013427734, "global_step": 218207, "epoch": 1298} {"train_loss": -11.748488426208496, "global_step": 218208, "epoch": 1298} {"train_loss": -11.907328605651855, "global_step": 218209, "epoch": 1298} {"train_loss": -11.756586074829102, "global_step": 218210, "epoch": 1298} {"train_loss": -11.690238952636719, "global_step": 218211, "epoch": 1298} {"train_loss": -11.79820728302002, "global_step": 218212, "epoch": 1298} {"train_loss": -11.829363822937012, "global_step": 218213, "epoch": 1298} {"train_loss": -11.697032928466797, "global_step": 218214, "epoch": 1298} {"train_loss": -11.964912414550781, "global_step": 218215, "epoch": 1298} {"train_loss": -11.820406913757324, "global_step": 218216, "epoch": 1298} {"train_loss": -11.56654167175293, "global_step": 218217, "epoch": 1298} {"train_loss": -11.752840042114258, "global_step": 218218, "epoch": 1298} {"train_loss": -11.683025360107422, "global_step": 218219, "epoch": 1298} {"train_loss": -11.641136169433594, "global_step": 218220, "epoch": 1298} {"train_loss": -11.828798294067383, "global_step": 218221, "epoch": 1298} {"train_loss": -11.515909194946289, "global_step": 218222, "epoch": 1298} {"train_loss": -11.811479568481445, "global_step": 218223, "epoch": 1298} {"train_loss": -11.675893783569336, "global_step": 218224, "epoch": 1298} {"train_loss": -11.710098266601562, "global_step": 218225, "epoch": 1298} {"train_loss": -11.600549697875977, "global_step": 218226, "epoch": 1298} {"train_loss": -11.488922119140625, "global_step": 218227, "epoch": 1298} {"train_loss": -11.899423599243164, "global_step": 218228, "epoch": 1298} {"train_loss": -11.828760147094727, "global_step": 218229, "epoch": 1298} {"train_loss": -11.582887649536133, "global_step": 218230, "epoch": 1298} {"train_loss": -11.401621966134934, "global_step": 218231, "epoch": 1298, "val_loss": 258906.0625} {"train_loss": -11.094730377197266, "global_step": 218232, "epoch": 1299} {"train_loss": -11.467024803161621, "global_step": 218233, "epoch": 1299} {"train_loss": -12.062087059020996, "global_step": 218234, "epoch": 1299} {"train_loss": -11.428080558776855, "global_step": 218235, "epoch": 1299} {"train_loss": -11.725748062133789, "global_step": 218236, "epoch": 1299} {"train_loss": -11.782814979553223, "global_step": 218237, "epoch": 1299} {"train_loss": -11.847129821777344, "global_step": 218238, "epoch": 1299} {"train_loss": -11.643037796020508, "global_step": 218239, "epoch": 1299} {"train_loss": -11.97923755645752, "global_step": 218240, "epoch": 1299} {"train_loss": -12.010149002075195, "global_step": 218241, "epoch": 1299} {"train_loss": -11.598827362060547, "global_step": 218242, "epoch": 1299} {"train_loss": -11.708366394042969, "global_step": 218243, "epoch": 1299} {"train_loss": -11.924554824829102, "global_step": 218244, "epoch": 1299} {"train_loss": -11.704289436340332, "global_step": 218245, "epoch": 1299} {"train_loss": -11.877790451049805, "global_step": 218246, "epoch": 1299} {"train_loss": -12.06568717956543, "global_step": 218247, "epoch": 1299} {"train_loss": -11.828356742858887, "global_step": 218248, "epoch": 1299} {"train_loss": -11.91797924041748, "global_step": 218249, "epoch": 1299} {"train_loss": -11.982108116149902, "global_step": 218250, "epoch": 1299} {"train_loss": -12.019330978393555, "global_step": 218251, "epoch": 1299} {"train_loss": -12.010501861572266, "global_step": 218252, "epoch": 1299} {"train_loss": -11.802122116088867, "global_step": 218253, "epoch": 1299} {"train_loss": -11.823925971984863, "global_step": 218254, "epoch": 1299} {"train_loss": -11.90938663482666, "global_step": 218255, "epoch": 1299} {"train_loss": -11.708391189575195, "global_step": 218256, "epoch": 1299} {"train_loss": -12.052080154418945, "global_step": 218257, "epoch": 1299} {"train_loss": -11.884918212890625, "global_step": 218258, "epoch": 1299} {"train_loss": -12.074647903442383, "global_step": 218259, "epoch": 1299} {"train_loss": -11.96261978149414, "global_step": 218260, "epoch": 1299} {"train_loss": -12.133699417114258, "global_step": 218261, "epoch": 1299} {"train_loss": -11.915796279907227, "global_step": 218262, "epoch": 1299} {"train_loss": -12.147714614868164, "global_step": 218263, "epoch": 1299} {"train_loss": -11.860666275024414, "global_step": 218264, "epoch": 1299} {"train_loss": -11.632129669189453, "global_step": 218265, "epoch": 1299} {"train_loss": -11.916327476501465, "global_step": 218266, "epoch": 1299} {"train_loss": -11.8223295211792, "global_step": 218267, "epoch": 1299} {"train_loss": -11.694555282592773, "global_step": 218268, "epoch": 1299} {"train_loss": -11.335718154907227, "global_step": 218269, "epoch": 1299} {"train_loss": -11.280998229980469, "global_step": 218270, "epoch": 1299} {"train_loss": -11.451311111450195, "global_step": 218271, "epoch": 1299} {"train_loss": -11.950382232666016, "global_step": 218272, "epoch": 1299} {"train_loss": -11.84040355682373, "global_step": 218273, "epoch": 1299} {"train_loss": -11.738506317138672, "global_step": 218274, "epoch": 1299} {"train_loss": -11.885793685913086, "global_step": 218275, "epoch": 1299} {"train_loss": -11.825798034667969, "global_step": 218276, "epoch": 1299} {"train_loss": -12.1254243850708, "global_step": 218277, "epoch": 1299} {"train_loss": -11.580568313598633, "global_step": 218278, "epoch": 1299} {"train_loss": -11.436702728271484, "global_step": 218279, "epoch": 1299} {"train_loss": -11.194005966186523, "global_step": 218280, "epoch": 1299} {"train_loss": -11.742023468017578, "global_step": 218281, "epoch": 1299} {"train_loss": -11.59933853149414, "global_step": 218282, "epoch": 1299} {"train_loss": -11.3486967086792, "global_step": 218283, "epoch": 1299} {"train_loss": -11.407193183898926, "global_step": 218284, "epoch": 1299} {"train_loss": -10.87486457824707, "global_step": 218285, "epoch": 1299} {"train_loss": -10.454774856567383, "global_step": 218286, "epoch": 1299} {"train_loss": -11.325164794921875, "global_step": 218287, "epoch": 1299} {"train_loss": -11.584114074707031, "global_step": 218288, "epoch": 1299} {"train_loss": -10.704216003417969, "global_step": 218289, "epoch": 1299} {"train_loss": -9.076105117797852, "global_step": 218290, "epoch": 1299} {"train_loss": -11.08144474029541, "global_step": 218291, "epoch": 1299} {"train_loss": -9.561912536621094, "global_step": 218292, "epoch": 1299} {"train_loss": -10.00816535949707, "global_step": 218293, "epoch": 1299} {"train_loss": -11.060269355773926, "global_step": 218294, "epoch": 1299} {"train_loss": -10.431694984436035, "global_step": 218295, "epoch": 1299} {"train_loss": -11.295991897583008, "global_step": 218296, "epoch": 1299} {"train_loss": -10.661500930786133, "global_step": 218297, "epoch": 1299} {"train_loss": -10.60482406616211, "global_step": 218298, "epoch": 1299} {"train_loss": -11.11640739440918, "global_step": 218299, "epoch": 1299} {"train_loss": -9.845792770385742, "global_step": 218300, "epoch": 1299} {"train_loss": -11.64846420288086, "global_step": 218301, "epoch": 1299} {"train_loss": -9.648187637329102, "global_step": 218302, "epoch": 1299} {"train_loss": -11.432165145874023, "global_step": 218303, "epoch": 1299} {"train_loss": -10.145309448242188, "global_step": 218304, "epoch": 1299} {"train_loss": -11.372000694274902, "global_step": 218305, "epoch": 1299} {"train_loss": -11.313864707946777, "global_step": 218306, "epoch": 1299} {"train_loss": -11.518360137939453, "global_step": 218307, "epoch": 1299} {"train_loss": -11.147540092468262, "global_step": 218308, "epoch": 1299} {"train_loss": -11.407119750976562, "global_step": 218309, "epoch": 1299} {"train_loss": -11.28140640258789, "global_step": 218310, "epoch": 1299} {"train_loss": -11.696014404296875, "global_step": 218311, "epoch": 1299} {"train_loss": -11.417692184448242, "global_step": 218312, "epoch": 1299} {"train_loss": -11.594482421875, "global_step": 218313, "epoch": 1299} {"train_loss": -11.533065795898438, "global_step": 218314, "epoch": 1299} {"train_loss": -11.293996810913086, "global_step": 218315, "epoch": 1299} {"train_loss": -11.51026439666748, "global_step": 218316, "epoch": 1299} {"train_loss": -11.544447898864746, "global_step": 218317, "epoch": 1299} {"train_loss": -11.508121490478516, "global_step": 218318, "epoch": 1299} {"train_loss": -11.259109497070312, "global_step": 218319, "epoch": 1299} {"train_loss": -11.760200500488281, "global_step": 218320, "epoch": 1299} {"train_loss": -11.46806526184082, "global_step": 218321, "epoch": 1299} {"train_loss": -11.159421920776367, "global_step": 218322, "epoch": 1299} {"train_loss": -11.275347709655762, "global_step": 218323, "epoch": 1299} {"train_loss": -11.487510681152344, "global_step": 218324, "epoch": 1299} {"train_loss": -11.34274673461914, "global_step": 218325, "epoch": 1299} {"train_loss": -11.486103057861328, "global_step": 218326, "epoch": 1299} {"train_loss": -11.775894165039062, "global_step": 218327, "epoch": 1299} {"train_loss": -11.587125778198242, "global_step": 218328, "epoch": 1299} {"train_loss": -11.540765762329102, "global_step": 218329, "epoch": 1299} {"train_loss": -11.587102890014648, "global_step": 218330, "epoch": 1299} {"train_loss": -11.722784996032715, "global_step": 218331, "epoch": 1299} {"train_loss": -11.668378829956055, "global_step": 218332, "epoch": 1299} {"train_loss": -11.654308319091797, "global_step": 218333, "epoch": 1299} {"train_loss": -11.648277282714844, "global_step": 218334, "epoch": 1299} {"train_loss": -11.783699989318848, "global_step": 218335, "epoch": 1299} {"train_loss": -11.86966323852539, "global_step": 218336, "epoch": 1299} {"train_loss": -11.693970680236816, "global_step": 218337, "epoch": 1299} {"train_loss": -11.846260070800781, "global_step": 218338, "epoch": 1299} {"train_loss": -11.7763032913208, "global_step": 218339, "epoch": 1299} {"train_loss": -11.812200546264648, "global_step": 218340, "epoch": 1299} {"train_loss": -11.977057456970215, "global_step": 218341, "epoch": 1299} {"train_loss": -11.872560501098633, "global_step": 218342, "epoch": 1299} {"train_loss": -11.896167755126953, "global_step": 218343, "epoch": 1299} {"train_loss": -11.638671875, "global_step": 218344, "epoch": 1299} {"train_loss": -11.626167297363281, "global_step": 218345, "epoch": 1299} {"train_loss": -11.652713775634766, "global_step": 218346, "epoch": 1299} {"train_loss": -11.60378646850586, "global_step": 218347, "epoch": 1299} {"train_loss": -11.454151153564453, "global_step": 218348, "epoch": 1299} {"train_loss": -11.785737991333008, "global_step": 218349, "epoch": 1299} {"train_loss": -11.691350936889648, "global_step": 218350, "epoch": 1299} {"train_loss": -11.52453899383545, "global_step": 218351, "epoch": 1299} {"train_loss": -11.352262496948242, "global_step": 218352, "epoch": 1299} {"train_loss": -12.088248252868652, "global_step": 218353, "epoch": 1299} {"train_loss": -10.999391555786133, "global_step": 218354, "epoch": 1299} {"train_loss": -10.129669189453125, "global_step": 218355, "epoch": 1299} {"train_loss": -11.459410667419434, "global_step": 218356, "epoch": 1299} {"train_loss": -11.917740821838379, "global_step": 218357, "epoch": 1299} {"train_loss": -10.99185562133789, "global_step": 218358, "epoch": 1299} {"train_loss": -11.384557723999023, "global_step": 218359, "epoch": 1299} {"train_loss": -11.516408920288086, "global_step": 218360, "epoch": 1299} {"train_loss": -11.506257057189941, "global_step": 218361, "epoch": 1299} {"train_loss": -11.908337593078613, "global_step": 218362, "epoch": 1299} {"train_loss": -11.439974784851074, "global_step": 218363, "epoch": 1299} {"train_loss": -11.867615699768066, "global_step": 218364, "epoch": 1299} {"train_loss": -11.405227661132812, "global_step": 218365, "epoch": 1299} {"train_loss": -11.831214904785156, "global_step": 218366, "epoch": 1299} {"train_loss": -11.424674034118652, "global_step": 218367, "epoch": 1299} {"train_loss": -11.687925338745117, "global_step": 218368, "epoch": 1299} {"train_loss": -10.940808296203613, "global_step": 218369, "epoch": 1299} {"train_loss": -10.861003875732422, "global_step": 218370, "epoch": 1299} {"train_loss": -11.60251235961914, "global_step": 218371, "epoch": 1299} {"train_loss": -11.230302810668945, "global_step": 218372, "epoch": 1299} {"train_loss": -11.259302139282227, "global_step": 218373, "epoch": 1299} {"train_loss": -11.403772354125977, "global_step": 218374, "epoch": 1299} {"train_loss": -11.266897201538086, "global_step": 218375, "epoch": 1299} {"train_loss": -10.823101043701172, "global_step": 218376, "epoch": 1299} {"train_loss": -11.699446678161621, "global_step": 218377, "epoch": 1299} {"train_loss": -11.5305757522583, "global_step": 218378, "epoch": 1299} {"train_loss": -11.194099426269531, "global_step": 218379, "epoch": 1299} {"train_loss": -11.51494312286377, "global_step": 218380, "epoch": 1299} {"train_loss": -11.424543380737305, "global_step": 218381, "epoch": 1299} {"train_loss": -11.425620079040527, "global_step": 218382, "epoch": 1299} {"train_loss": -11.58736515045166, "global_step": 218383, "epoch": 1299} {"train_loss": -11.579751968383789, "global_step": 218384, "epoch": 1299} {"train_loss": -11.324538230895996, "global_step": 218385, "epoch": 1299} {"train_loss": -11.114458084106445, "global_step": 218386, "epoch": 1299} {"train_loss": -11.372892379760742, "global_step": 218387, "epoch": 1299} {"train_loss": -11.425209045410156, "global_step": 218388, "epoch": 1299} {"train_loss": -11.671236991882324, "global_step": 218389, "epoch": 1299} {"train_loss": -11.190988540649414, "global_step": 218390, "epoch": 1299} {"train_loss": -10.005504608154297, "global_step": 218391, "epoch": 1299} {"train_loss": -10.174224853515625, "global_step": 218392, "epoch": 1299} {"train_loss": -10.079999923706055, "global_step": 218393, "epoch": 1299} {"train_loss": -8.690428733825684, "global_step": 218394, "epoch": 1299} {"train_loss": -10.388910293579102, "global_step": 218395, "epoch": 1299} {"train_loss": -7.943887233734131, "global_step": 218396, "epoch": 1299} {"train_loss": -9.94221305847168, "global_step": 218397, "epoch": 1299} {"train_loss": -9.165277481079102, "global_step": 218398, "epoch": 1299} {"train_loss": -11.37342294341042, "global_step": 218399, "epoch": 1299, "val_loss": 259967.578125} {"train_loss": -9.561633110046387, "global_step": 218400, "epoch": 1300} {"train_loss": -8.183802604675293, "global_step": 218401, "epoch": 1300} {"train_loss": -8.952174186706543, "global_step": 218402, "epoch": 1300} {"train_loss": -9.714279174804688, "global_step": 218403, "epoch": 1300} {"train_loss": -10.028406143188477, "global_step": 218404, "epoch": 1300} {"train_loss": -10.142919540405273, "global_step": 218405, "epoch": 1300} {"train_loss": -10.259237289428711, "global_step": 218406, "epoch": 1300} {"train_loss": -9.727426528930664, "global_step": 218407, "epoch": 1300} {"train_loss": -10.268957138061523, "global_step": 218408, "epoch": 1300} {"train_loss": -10.195903778076172, "global_step": 218409, "epoch": 1300} {"train_loss": -10.622762680053711, "global_step": 218410, "epoch": 1300} {"train_loss": -11.036253929138184, "global_step": 218411, "epoch": 1300} {"train_loss": -10.436914443969727, "global_step": 218412, "epoch": 1300} {"train_loss": -11.043013572692871, "global_step": 218413, "epoch": 1300} {"train_loss": -10.8845796585083, "global_step": 218414, "epoch": 1300} {"train_loss": -10.554078102111816, "global_step": 218415, "epoch": 1300} {"train_loss": -11.224967956542969, "global_step": 218416, "epoch": 1300} {"train_loss": -10.891960144042969, "global_step": 218417, "epoch": 1300} {"train_loss": -10.687947273254395, "global_step": 218418, "epoch": 1300} {"train_loss": -11.09254264831543, "global_step": 218419, "epoch": 1300} {"train_loss": -10.926665306091309, "global_step": 218420, "epoch": 1300} {"train_loss": -11.049168586730957, "global_step": 218421, "epoch": 1300} {"train_loss": -10.852179527282715, "global_step": 218422, "epoch": 1300} {"train_loss": -11.168071746826172, "global_step": 218423, "epoch": 1300} {"train_loss": -10.683523178100586, "global_step": 218424, "epoch": 1300} {"train_loss": -11.134368896484375, "global_step": 218425, "epoch": 1300} {"train_loss": -11.030056953430176, "global_step": 218426, "epoch": 1300} {"train_loss": -10.588105201721191, "global_step": 218427, "epoch": 1300} {"train_loss": -11.090641021728516, "global_step": 218428, "epoch": 1300} {"train_loss": -11.224599838256836, "global_step": 218429, "epoch": 1300} {"train_loss": -11.101774215698242, "global_step": 218430, "epoch": 1300} {"train_loss": -11.013626098632812, "global_step": 218431, "epoch": 1300} {"train_loss": -10.890872955322266, "global_step": 218432, "epoch": 1300} {"train_loss": -11.294381141662598, "global_step": 218433, "epoch": 1300} {"train_loss": -11.192626953125, "global_step": 218434, "epoch": 1300} {"train_loss": -10.97065544128418, "global_step": 218435, "epoch": 1300} {"train_loss": -11.400629043579102, "global_step": 218436, "epoch": 1300} {"train_loss": -11.105855941772461, "global_step": 218437, "epoch": 1300} {"train_loss": -11.37682819366455, "global_step": 218438, "epoch": 1300} {"train_loss": -11.421918869018555, "global_step": 218439, "epoch": 1300} {"train_loss": -11.05489730834961, "global_step": 218440, "epoch": 1300} {"train_loss": -11.222441673278809, "global_step": 218441, "epoch": 1300} {"train_loss": -11.253243446350098, "global_step": 218442, "epoch": 1300} {"train_loss": -11.236101150512695, "global_step": 218443, "epoch": 1300} {"train_loss": -11.30343246459961, "global_step": 218444, "epoch": 1300} {"train_loss": -11.322428703308105, "global_step": 218445, "epoch": 1300} {"train_loss": -11.359429359436035, "global_step": 218446, "epoch": 1300} {"train_loss": -11.289892196655273, "global_step": 218447, "epoch": 1300} {"train_loss": -11.530277252197266, "global_step": 218448, "epoch": 1300} {"train_loss": -11.161794662475586, "global_step": 218449, "epoch": 1300} {"train_loss": -11.40730094909668, "global_step": 218450, "epoch": 1300} {"train_loss": -11.429750442504883, "global_step": 218451, "epoch": 1300} {"train_loss": -11.23164176940918, "global_step": 218452, "epoch": 1300} {"train_loss": -11.273015975952148, "global_step": 218453, "epoch": 1300} {"train_loss": -11.471246719360352, "global_step": 218454, "epoch": 1300} {"train_loss": -11.619731903076172, "global_step": 218455, "epoch": 1300} {"train_loss": -11.580513000488281, "global_step": 218456, "epoch": 1300} {"train_loss": -11.468585014343262, "global_step": 218457, "epoch": 1300} {"train_loss": -11.627959251403809, "global_step": 218458, "epoch": 1300} {"train_loss": -11.408111572265625, "global_step": 218459, "epoch": 1300} {"train_loss": -11.64354419708252, "global_step": 218460, "epoch": 1300} {"train_loss": -11.540544509887695, "global_step": 218461, "epoch": 1300} {"train_loss": -11.668933868408203, "global_step": 218462, "epoch": 1300} {"train_loss": -11.668168067932129, "global_step": 218463, "epoch": 1300} {"train_loss": -11.783367156982422, "global_step": 218464, "epoch": 1300} {"train_loss": -11.524127960205078, "global_step": 218465, "epoch": 1300} {"train_loss": -11.550021171569824, "global_step": 218466, "epoch": 1300} {"train_loss": -11.513506889343262, "global_step": 218467, "epoch": 1300} {"train_loss": -11.64261531829834, "global_step": 218468, "epoch": 1300} {"train_loss": -11.50413703918457, "global_step": 218469, "epoch": 1300} {"train_loss": -11.64377212524414, "global_step": 218470, "epoch": 1300} {"train_loss": -11.328269958496094, "global_step": 218471, "epoch": 1300} {"train_loss": -11.581605911254883, "global_step": 218472, "epoch": 1300} {"train_loss": -11.310867309570312, "global_step": 218473, "epoch": 1300} {"train_loss": -11.469905853271484, "global_step": 218474, "epoch": 1300} {"train_loss": -11.328144073486328, "global_step": 218475, "epoch": 1300} {"train_loss": -11.477806091308594, "global_step": 218476, "epoch": 1300} {"train_loss": -11.740312576293945, "global_step": 218477, "epoch": 1300} {"train_loss": -10.970353126525879, "global_step": 218478, "epoch": 1300} {"train_loss": -11.605725288391113, "global_step": 218479, "epoch": 1300} {"train_loss": -11.317938804626465, "global_step": 218480, "epoch": 1300} {"train_loss": -11.207460403442383, "global_step": 218481, "epoch": 1300} {"train_loss": -11.526190757751465, "global_step": 218482, "epoch": 1300} {"train_loss": -11.242012023925781, "global_step": 218483, "epoch": 1300} {"train_loss": -11.702683448791504, "global_step": 218484, "epoch": 1300} {"train_loss": -11.5054931640625, "global_step": 218485, "epoch": 1300} {"train_loss": -11.804244995117188, "global_step": 218486, "epoch": 1300} {"train_loss": -11.480449676513672, "global_step": 218487, "epoch": 1300} {"train_loss": -11.393447875976562, "global_step": 218488, "epoch": 1300} {"train_loss": -11.862573623657227, "global_step": 218489, "epoch": 1300} {"train_loss": -11.203985214233398, "global_step": 218490, "epoch": 1300} {"train_loss": -11.56745719909668, "global_step": 218491, "epoch": 1300} {"train_loss": -11.574552536010742, "global_step": 218492, "epoch": 1300} {"train_loss": -10.686378479003906, "global_step": 218493, "epoch": 1300} {"train_loss": -11.462139129638672, "global_step": 218494, "epoch": 1300} {"train_loss": -11.155085563659668, "global_step": 218495, "epoch": 1300} {"train_loss": -11.27161693572998, "global_step": 218496, "epoch": 1300} {"train_loss": -11.40334701538086, "global_step": 218497, "epoch": 1300} {"train_loss": -11.608213424682617, "global_step": 218498, "epoch": 1300} {"train_loss": -11.460611343383789, "global_step": 218499, "epoch": 1300} {"train_loss": -11.643508911132812, "global_step": 218500, "epoch": 1300} {"train_loss": -11.69670295715332, "global_step": 218501, "epoch": 1300} {"train_loss": -11.547892570495605, "global_step": 218502, "epoch": 1300} {"train_loss": -11.681143760681152, "global_step": 218503, "epoch": 1300} {"train_loss": -11.42880630493164, "global_step": 218504, "epoch": 1300} {"train_loss": -11.84347915649414, "global_step": 218505, "epoch": 1300} {"train_loss": -11.480727195739746, "global_step": 218506, "epoch": 1300} {"train_loss": -11.594413757324219, "global_step": 218507, "epoch": 1300} {"train_loss": -11.549352645874023, "global_step": 218508, "epoch": 1300} {"train_loss": -11.319720268249512, "global_step": 218509, "epoch": 1300} {"train_loss": -11.689167976379395, "global_step": 218510, "epoch": 1300} {"train_loss": -11.080936431884766, "global_step": 218511, "epoch": 1300} {"train_loss": -11.903984069824219, "global_step": 218512, "epoch": 1300} {"train_loss": -11.258190155029297, "global_step": 218513, "epoch": 1300} {"train_loss": -11.469358444213867, "global_step": 218514, "epoch": 1300} {"train_loss": -11.307634353637695, "global_step": 218515, "epoch": 1300} {"train_loss": -11.072809219360352, "global_step": 218516, "epoch": 1300} {"train_loss": -10.598285675048828, "global_step": 218517, "epoch": 1300} {"train_loss": -11.621238708496094, "global_step": 218518, "epoch": 1300} {"train_loss": -10.668102264404297, "global_step": 218519, "epoch": 1300} {"train_loss": -11.074871063232422, "global_step": 218520, "epoch": 1300} {"train_loss": -11.375351905822754, "global_step": 218521, "epoch": 1300} {"train_loss": -10.989571571350098, "global_step": 218522, "epoch": 1300} {"train_loss": -11.393182754516602, "global_step": 218523, "epoch": 1300} {"train_loss": -10.889659881591797, "global_step": 218524, "epoch": 1300} {"train_loss": -11.284537315368652, "global_step": 218525, "epoch": 1300} {"train_loss": -11.038681030273438, "global_step": 218526, "epoch": 1300} {"train_loss": -11.59607982635498, "global_step": 218527, "epoch": 1300} {"train_loss": -11.14564037322998, "global_step": 218528, "epoch": 1300} {"train_loss": -11.657787322998047, "global_step": 218529, "epoch": 1300} {"train_loss": -11.452993392944336, "global_step": 218530, "epoch": 1300} {"train_loss": -11.476097106933594, "global_step": 218531, "epoch": 1300} {"train_loss": -11.385799407958984, "global_step": 218532, "epoch": 1300} {"train_loss": -11.605018615722656, "global_step": 218533, "epoch": 1300} {"train_loss": -11.883566856384277, "global_step": 218534, "epoch": 1300} {"train_loss": -11.25520133972168, "global_step": 218535, "epoch": 1300} {"train_loss": -11.492636680603027, "global_step": 218536, "epoch": 1300} {"train_loss": -11.29472541809082, "global_step": 218537, "epoch": 1300} {"train_loss": -11.642824172973633, "global_step": 218538, "epoch": 1300} {"train_loss": -11.651163101196289, "global_step": 218539, "epoch": 1300} {"train_loss": -11.449052810668945, "global_step": 218540, "epoch": 1300} {"train_loss": -11.300890922546387, "global_step": 218541, "epoch": 1300} {"train_loss": -11.549808502197266, "global_step": 218542, "epoch": 1300} {"train_loss": -11.092691421508789, "global_step": 218543, "epoch": 1300} {"train_loss": -11.352210998535156, "global_step": 218544, "epoch": 1300} {"train_loss": -11.29484748840332, "global_step": 218545, "epoch": 1300} {"train_loss": -11.080280303955078, "global_step": 218546, "epoch": 1300} {"train_loss": -11.580511093139648, "global_step": 218547, "epoch": 1300} {"train_loss": -10.960548400878906, "global_step": 218548, "epoch": 1300} {"train_loss": -11.020419120788574, "global_step": 218549, "epoch": 1300} {"train_loss": -11.183235168457031, "global_step": 218550, "epoch": 1300} {"train_loss": -11.192533493041992, "global_step": 218551, "epoch": 1300} {"train_loss": -11.317903518676758, "global_step": 218552, "epoch": 1300} {"train_loss": -10.965533256530762, "global_step": 218553, "epoch": 1300} {"train_loss": -11.297582626342773, "global_step": 218554, "epoch": 1300} {"train_loss": -10.789530754089355, "global_step": 218555, "epoch": 1300} {"train_loss": -11.568355560302734, "global_step": 218556, "epoch": 1300} {"train_loss": -11.050018310546875, "global_step": 218557, "epoch": 1300} {"train_loss": -11.496971130371094, "global_step": 218558, "epoch": 1300} {"train_loss": -11.279481887817383, "global_step": 218559, "epoch": 1300} {"train_loss": -11.122020721435547, "global_step": 218560, "epoch": 1300} {"train_loss": -11.26463794708252, "global_step": 218561, "epoch": 1300} {"train_loss": -11.117744445800781, "global_step": 218562, "epoch": 1300} {"train_loss": -11.35825252532959, "global_step": 218563, "epoch": 1300} {"train_loss": -11.411078453063965, "global_step": 218564, "epoch": 1300} {"train_loss": -11.496010780334473, "global_step": 218565, "epoch": 1300} {"train_loss": -11.17238998413086, "global_step": 218566, "epoch": 1300} {"train_loss": -11.21590404851096, "global_step": 218567, "epoch": 1300, "train/sim_max_reward_0": 0.6937461595207023, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 6.556237081971408e-06, "train/sim_max_reward_3": 0.6421632788446466, "train/sim_max_reward_4": 0.05372351936867168, "train/sim_max_reward_5": 0.5377413934310721, "test/sim_max_reward_4400000": 0.9952157428530599, "test/sim_max_reward_4400001": 0.5286374510148746, "test/sim_max_reward_4400002": 0.06128797782423358, "test/sim_max_reward_4400003": 0.20856834103650862, "test/sim_max_reward_4400004": 0.46095586121268106, "test/sim_max_reward_4400005": 0.9153031980008646, "test/sim_max_reward_4400006": 0.8904473550433784, "test/sim_max_reward_4400007": 0.48802530368079877, "test/sim_max_reward_4400008": 0.5805807905227531, "test/sim_max_reward_4400009": 0.028056084893255426, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 0.9894633360495665, "test/sim_max_reward_4400013": 0.9617645963564861, "test/sim_max_reward_4400014": 0.971122821119265, "test/sim_max_reward_4400015": 0.9189080880380663, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9819261961840361, "test/sim_max_reward_4400019": 0.4264030596268733, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.9702785237814853, "test/sim_max_reward_4400022": 0.9688120777069005, "test/sim_max_reward_4400023": 0.13720733777010335, "test/sim_max_reward_4400024": 0.2969932807243459, "test/sim_max_reward_4400025": 0.658485560551477, "test/sim_max_reward_4400026": 0.08639877864622329, "test/sim_max_reward_4400027": 0.9864079875543297, "test/sim_max_reward_4400028": 1.0, "test/sim_max_reward_4400029": 0.5499298202190608, "test/sim_max_reward_4400030": 0.9697179650432873, "test/sim_max_reward_4400031": 0.9796547793120512, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.38355894791118855, "test/sim_max_reward_4400034": 0.9612717795240248, "test/sim_max_reward_4400035": 0.9612182325408658, "test/sim_max_reward_4400036": 0.3759027793596416, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.9725183231988491, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9525921894499834, "test/sim_max_reward_4400042": 0.026409268316691197, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.542880240849976, "test/sim_max_reward_4400045": 0.9523849562111911, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.8401594334599137, "train/mean_score": 0.4878968179003625, "test/mean_score": 0.6395889693117658, "val_loss": 259242.03125, "train_action_mse_error": 0.4423171281814575} {"train_loss": -11.211841583251953, "global_step": 218568, "epoch": 1301} {"train_loss": -11.553464889526367, "global_step": 218569, "epoch": 1301} {"train_loss": -11.185789108276367, "global_step": 218570, "epoch": 1301} {"train_loss": -11.44129467010498, "global_step": 218571, "epoch": 1301} {"train_loss": -11.461071968078613, "global_step": 218572, "epoch": 1301} {"train_loss": -11.749555587768555, "global_step": 218573, "epoch": 1301} {"train_loss": -11.664894104003906, "global_step": 218574, "epoch": 1301} {"train_loss": -11.606539726257324, "global_step": 218575, "epoch": 1301} {"train_loss": -11.356172561645508, "global_step": 218576, "epoch": 1301} {"train_loss": -11.699372291564941, "global_step": 218577, "epoch": 1301} {"train_loss": -11.711543083190918, "global_step": 218578, "epoch": 1301} {"train_loss": -11.633767127990723, "global_step": 218579, "epoch": 1301} {"train_loss": -11.633810043334961, "global_step": 218580, "epoch": 1301} {"train_loss": -11.778596878051758, "global_step": 218581, "epoch": 1301} {"train_loss": -11.805078506469727, "global_step": 218582, "epoch": 1301} {"train_loss": -11.555816650390625, "global_step": 218583, "epoch": 1301} {"train_loss": -11.728779792785645, "global_step": 218584, "epoch": 1301} {"train_loss": -11.653478622436523, "global_step": 218585, "epoch": 1301} {"train_loss": -11.545256614685059, "global_step": 218586, "epoch": 1301} {"train_loss": -11.62192440032959, "global_step": 218587, "epoch": 1301} {"train_loss": -11.364664077758789, "global_step": 218588, "epoch": 1301} {"train_loss": -11.675154685974121, "global_step": 218589, "epoch": 1301} {"train_loss": -11.591838836669922, "global_step": 218590, "epoch": 1301} {"train_loss": -11.814813613891602, "global_step": 218591, "epoch": 1301} {"train_loss": -11.634201049804688, "global_step": 218592, "epoch": 1301} {"train_loss": -11.60232162475586, "global_step": 218593, "epoch": 1301} {"train_loss": -11.67408275604248, "global_step": 218594, "epoch": 1301} {"train_loss": -11.612578392028809, "global_step": 218595, "epoch": 1301} {"train_loss": -11.601499557495117, "global_step": 218596, "epoch": 1301} {"train_loss": -11.683796882629395, "global_step": 218597, "epoch": 1301} {"train_loss": -11.26172161102295, "global_step": 218598, "epoch": 1301} {"train_loss": -11.832389831542969, "global_step": 218599, "epoch": 1301} {"train_loss": -11.500990867614746, "global_step": 218600, "epoch": 1301} {"train_loss": -11.61508560180664, "global_step": 218601, "epoch": 1301} {"train_loss": -11.964027404785156, "global_step": 218602, "epoch": 1301} {"train_loss": -11.337296485900879, "global_step": 218603, "epoch": 1301} {"train_loss": -11.656046867370605, "global_step": 218604, "epoch": 1301} {"train_loss": -11.590961456298828, "global_step": 218605, "epoch": 1301} {"train_loss": -11.454828262329102, "global_step": 218606, "epoch": 1301} {"train_loss": -11.256875991821289, "global_step": 218607, "epoch": 1301} {"train_loss": -11.561609268188477, "global_step": 218608, "epoch": 1301} {"train_loss": -11.459485054016113, "global_step": 218609, "epoch": 1301} {"train_loss": -11.03984260559082, "global_step": 218610, "epoch": 1301} {"train_loss": -11.546689987182617, "global_step": 218611, "epoch": 1301} {"train_loss": -11.502548217773438, "global_step": 218612, "epoch": 1301} {"train_loss": -11.245962142944336, "global_step": 218613, "epoch": 1301} {"train_loss": -11.289156913757324, "global_step": 218614, "epoch": 1301} {"train_loss": -11.270214080810547, "global_step": 218615, "epoch": 1301} {"train_loss": -11.547130584716797, "global_step": 218616, "epoch": 1301} {"train_loss": -10.464654922485352, "global_step": 218617, "epoch": 1301} {"train_loss": -11.681098937988281, "global_step": 218618, "epoch": 1301} {"train_loss": -11.268407821655273, "global_step": 218619, "epoch": 1301} {"train_loss": -11.515539169311523, "global_step": 218620, "epoch": 1301} {"train_loss": -11.545620918273926, "global_step": 218621, "epoch": 1301} {"train_loss": -11.2150297164917, "global_step": 218622, "epoch": 1301} {"train_loss": -11.688384056091309, "global_step": 218623, "epoch": 1301} {"train_loss": -11.541485786437988, "global_step": 218624, "epoch": 1301} {"train_loss": -11.932812690734863, "global_step": 218625, "epoch": 1301} {"train_loss": -11.495404243469238, "global_step": 218626, "epoch": 1301} {"train_loss": -11.630949974060059, "global_step": 218627, "epoch": 1301} {"train_loss": -11.951131820678711, "global_step": 218628, "epoch": 1301} {"train_loss": -11.62513256072998, "global_step": 218629, "epoch": 1301} {"train_loss": -11.566715240478516, "global_step": 218630, "epoch": 1301} {"train_loss": -11.589360237121582, "global_step": 218631, "epoch": 1301} {"train_loss": -11.60449504852295, "global_step": 218632, "epoch": 1301} {"train_loss": -11.842256546020508, "global_step": 218633, "epoch": 1301} {"train_loss": -11.161781311035156, "global_step": 218634, "epoch": 1301} {"train_loss": -11.86866569519043, "global_step": 218635, "epoch": 1301} {"train_loss": -11.459037780761719, "global_step": 218636, "epoch": 1301} {"train_loss": -11.667867660522461, "global_step": 218637, "epoch": 1301} {"train_loss": -11.314217567443848, "global_step": 218638, "epoch": 1301} {"train_loss": -11.764139175415039, "global_step": 218639, "epoch": 1301} {"train_loss": -11.22467041015625, "global_step": 218640, "epoch": 1301} {"train_loss": -11.391206741333008, "global_step": 218641, "epoch": 1301} {"train_loss": -11.560620307922363, "global_step": 218642, "epoch": 1301} {"train_loss": -11.116758346557617, "global_step": 218643, "epoch": 1301} {"train_loss": -11.372110366821289, "global_step": 218644, "epoch": 1301} {"train_loss": -11.27612590789795, "global_step": 218645, "epoch": 1301} {"train_loss": -11.372045516967773, "global_step": 218646, "epoch": 1301} {"train_loss": -10.77505874633789, "global_step": 218647, "epoch": 1301} {"train_loss": -11.775760650634766, "global_step": 218648, "epoch": 1301} {"train_loss": -10.687944412231445, "global_step": 218649, "epoch": 1301} {"train_loss": -10.805335998535156, "global_step": 218650, "epoch": 1301} {"train_loss": -10.648642539978027, "global_step": 218651, "epoch": 1301} {"train_loss": -11.441816329956055, "global_step": 218652, "epoch": 1301} {"train_loss": -10.654342651367188, "global_step": 218653, "epoch": 1301} {"train_loss": -10.346264839172363, "global_step": 218654, "epoch": 1301} {"train_loss": -11.030645370483398, "global_step": 218655, "epoch": 1301} {"train_loss": -10.227422714233398, "global_step": 218656, "epoch": 1301} {"train_loss": -11.162174224853516, "global_step": 218657, "epoch": 1301} {"train_loss": -10.307493209838867, "global_step": 218658, "epoch": 1301} {"train_loss": -10.333311080932617, "global_step": 218659, "epoch": 1301} {"train_loss": -10.150772094726562, "global_step": 218660, "epoch": 1301} {"train_loss": -11.182186126708984, "global_step": 218661, "epoch": 1301} {"train_loss": -10.183414459228516, "global_step": 218662, "epoch": 1301} {"train_loss": -11.120221138000488, "global_step": 218663, "epoch": 1301} {"train_loss": -10.868640899658203, "global_step": 218664, "epoch": 1301} {"train_loss": -11.056931495666504, "global_step": 218665, "epoch": 1301} {"train_loss": -10.947220802307129, "global_step": 218666, "epoch": 1301} {"train_loss": -10.867313385009766, "global_step": 218667, "epoch": 1301} {"train_loss": -11.148614883422852, "global_step": 218668, "epoch": 1301} {"train_loss": -11.069685935974121, "global_step": 218669, "epoch": 1301} {"train_loss": -11.369236946105957, "global_step": 218670, "epoch": 1301} {"train_loss": -11.167093276977539, "global_step": 218671, "epoch": 1301} {"train_loss": -11.318268775939941, "global_step": 218672, "epoch": 1301} {"train_loss": -11.55261516571045, "global_step": 218673, "epoch": 1301} {"train_loss": -11.51995849609375, "global_step": 218674, "epoch": 1301} {"train_loss": -11.544244766235352, "global_step": 218675, "epoch": 1301} {"train_loss": -11.524011611938477, "global_step": 218676, "epoch": 1301} {"train_loss": -11.783878326416016, "global_step": 218677, "epoch": 1301} {"train_loss": -11.66840648651123, "global_step": 218678, "epoch": 1301} {"train_loss": -11.59286117553711, "global_step": 218679, "epoch": 1301} {"train_loss": -11.725570678710938, "global_step": 218680, "epoch": 1301} {"train_loss": -11.618732452392578, "global_step": 218681, "epoch": 1301} {"train_loss": -11.763309478759766, "global_step": 218682, "epoch": 1301} {"train_loss": -11.652009963989258, "global_step": 218683, "epoch": 1301} {"train_loss": -11.867487907409668, "global_step": 218684, "epoch": 1301} {"train_loss": -11.819452285766602, "global_step": 218685, "epoch": 1301} {"train_loss": -11.713489532470703, "global_step": 218686, "epoch": 1301} {"train_loss": -11.912008285522461, "global_step": 218687, "epoch": 1301} {"train_loss": -11.628244400024414, "global_step": 218688, "epoch": 1301} {"train_loss": -11.837605476379395, "global_step": 218689, "epoch": 1301} {"train_loss": -11.612621307373047, "global_step": 218690, "epoch": 1301} {"train_loss": -11.711736679077148, "global_step": 218691, "epoch": 1301} {"train_loss": -11.742133140563965, "global_step": 218692, "epoch": 1301} {"train_loss": -11.64354419708252, "global_step": 218693, "epoch": 1301} {"train_loss": -11.853565216064453, "global_step": 218694, "epoch": 1301} {"train_loss": -11.612276077270508, "global_step": 218695, "epoch": 1301} {"train_loss": -11.8013277053833, "global_step": 218696, "epoch": 1301} {"train_loss": -11.787671089172363, "global_step": 218697, "epoch": 1301} {"train_loss": -11.627317428588867, "global_step": 218698, "epoch": 1301} {"train_loss": -12.014371871948242, "global_step": 218699, "epoch": 1301} {"train_loss": -11.776185989379883, "global_step": 218700, "epoch": 1301} {"train_loss": -11.935413360595703, "global_step": 218701, "epoch": 1301} {"train_loss": -11.871362686157227, "global_step": 218702, "epoch": 1301} {"train_loss": -11.871665954589844, "global_step": 218703, "epoch": 1301} {"train_loss": -11.76431655883789, "global_step": 218704, "epoch": 1301} {"train_loss": -11.902870178222656, "global_step": 218705, "epoch": 1301} {"train_loss": -11.731034278869629, "global_step": 218706, "epoch": 1301} {"train_loss": -11.850966453552246, "global_step": 218707, "epoch": 1301} {"train_loss": -12.088367462158203, "global_step": 218708, "epoch": 1301} {"train_loss": -12.020695686340332, "global_step": 218709, "epoch": 1301} {"train_loss": -11.804483413696289, "global_step": 218710, "epoch": 1301} {"train_loss": -12.00777530670166, "global_step": 218711, "epoch": 1301} {"train_loss": -11.87507438659668, "global_step": 218712, "epoch": 1301} {"train_loss": -11.739826202392578, "global_step": 218713, "epoch": 1301} {"train_loss": -12.012137413024902, "global_step": 218714, "epoch": 1301} {"train_loss": -11.78084945678711, "global_step": 218715, "epoch": 1301} {"train_loss": -11.31033706665039, "global_step": 218716, "epoch": 1301} {"train_loss": -11.771028518676758, "global_step": 218717, "epoch": 1301} {"train_loss": -11.994857788085938, "global_step": 218718, "epoch": 1301} {"train_loss": -11.75210952758789, "global_step": 218719, "epoch": 1301} {"train_loss": -11.7566556930542, "global_step": 218720, "epoch": 1301} {"train_loss": -11.869659423828125, "global_step": 218721, "epoch": 1301} {"train_loss": -11.906697273254395, "global_step": 218722, "epoch": 1301} {"train_loss": -11.674933433532715, "global_step": 218723, "epoch": 1301} {"train_loss": -11.283985137939453, "global_step": 218724, "epoch": 1301} {"train_loss": -11.659125328063965, "global_step": 218725, "epoch": 1301} {"train_loss": -12.040817260742188, "global_step": 218726, "epoch": 1301} {"train_loss": -11.474087715148926, "global_step": 218727, "epoch": 1301} {"train_loss": -11.430339813232422, "global_step": 218728, "epoch": 1301} {"train_loss": -11.637805938720703, "global_step": 218729, "epoch": 1301} {"train_loss": -11.867018699645996, "global_step": 218730, "epoch": 1301} {"train_loss": -11.537100791931152, "global_step": 218731, "epoch": 1301} {"train_loss": -10.67226791381836, "global_step": 218732, "epoch": 1301} {"train_loss": -10.385335922241211, "global_step": 218733, "epoch": 1301} {"train_loss": -11.986921310424805, "global_step": 218734, "epoch": 1301} {"train_loss": -11.488703926404318, "global_step": 218735, "epoch": 1301, "val_loss": 259390.03125} {"train_loss": -10.669235229492188, "global_step": 218736, "epoch": 1302} {"train_loss": -10.871033668518066, "global_step": 218737, "epoch": 1302} {"train_loss": -11.460036277770996, "global_step": 218738, "epoch": 1302} {"train_loss": -11.21346664428711, "global_step": 218739, "epoch": 1302} {"train_loss": -10.009567260742188, "global_step": 218740, "epoch": 1302} {"train_loss": -11.059348106384277, "global_step": 218741, "epoch": 1302} {"train_loss": -10.32787036895752, "global_step": 218742, "epoch": 1302} {"train_loss": -9.618124008178711, "global_step": 218743, "epoch": 1302} {"train_loss": -10.799007415771484, "global_step": 218744, "epoch": 1302} {"train_loss": -11.295332908630371, "global_step": 218745, "epoch": 1302} {"train_loss": -10.741069793701172, "global_step": 218746, "epoch": 1302} {"train_loss": -11.237273216247559, "global_step": 218747, "epoch": 1302} {"train_loss": -10.559396743774414, "global_step": 218748, "epoch": 1302} {"train_loss": -11.395877838134766, "global_step": 218749, "epoch": 1302} {"train_loss": -10.63563346862793, "global_step": 218750, "epoch": 1302} {"train_loss": -10.637550354003906, "global_step": 218751, "epoch": 1302} {"train_loss": -11.135995864868164, "global_step": 218752, "epoch": 1302} {"train_loss": -10.720947265625, "global_step": 218753, "epoch": 1302} {"train_loss": -10.978379249572754, "global_step": 218754, "epoch": 1302} {"train_loss": -10.355867385864258, "global_step": 218755, "epoch": 1302} {"train_loss": -10.551492691040039, "global_step": 218756, "epoch": 1302} {"train_loss": -10.959907531738281, "global_step": 218757, "epoch": 1302} {"train_loss": -10.723819732666016, "global_step": 218758, "epoch": 1302} {"train_loss": -11.25946044921875, "global_step": 218759, "epoch": 1302} {"train_loss": -10.864574432373047, "global_step": 218760, "epoch": 1302} {"train_loss": -11.232982635498047, "global_step": 218761, "epoch": 1302} {"train_loss": -11.348212242126465, "global_step": 218762, "epoch": 1302} {"train_loss": -11.039094924926758, "global_step": 218763, "epoch": 1302} {"train_loss": -11.278335571289062, "global_step": 218764, "epoch": 1302} {"train_loss": -11.460184097290039, "global_step": 218765, "epoch": 1302} {"train_loss": -11.099806785583496, "global_step": 218766, "epoch": 1302} {"train_loss": -11.416597366333008, "global_step": 218767, "epoch": 1302} {"train_loss": -10.927815437316895, "global_step": 218768, "epoch": 1302} {"train_loss": -11.198315620422363, "global_step": 218769, "epoch": 1302} {"train_loss": -11.111008644104004, "global_step": 218770, "epoch": 1302} {"train_loss": -11.254405975341797, "global_step": 218771, "epoch": 1302} {"train_loss": -11.4171142578125, "global_step": 218772, "epoch": 1302} {"train_loss": -11.279308319091797, "global_step": 218773, "epoch": 1302} {"train_loss": -10.875946044921875, "global_step": 218774, "epoch": 1302} {"train_loss": -11.328197479248047, "global_step": 218775, "epoch": 1302} {"train_loss": -10.51300048828125, "global_step": 218776, "epoch": 1302} {"train_loss": -11.406496047973633, "global_step": 218777, "epoch": 1302} {"train_loss": -10.140083312988281, "global_step": 218778, "epoch": 1302} {"train_loss": -10.98052978515625, "global_step": 218779, "epoch": 1302} {"train_loss": -11.31236457824707, "global_step": 218780, "epoch": 1302} {"train_loss": -10.687626838684082, "global_step": 218781, "epoch": 1302} {"train_loss": -11.073131561279297, "global_step": 218782, "epoch": 1302} {"train_loss": -10.316268920898438, "global_step": 218783, "epoch": 1302} {"train_loss": -11.382960319519043, "global_step": 218784, "epoch": 1302} {"train_loss": -10.620450973510742, "global_step": 218785, "epoch": 1302} {"train_loss": -10.607477188110352, "global_step": 218786, "epoch": 1302} {"train_loss": -11.357498168945312, "global_step": 218787, "epoch": 1302} {"train_loss": -10.65705680847168, "global_step": 218788, "epoch": 1302} {"train_loss": -10.951982498168945, "global_step": 218789, "epoch": 1302} {"train_loss": -11.018157958984375, "global_step": 218790, "epoch": 1302} {"train_loss": -10.462503433227539, "global_step": 218791, "epoch": 1302} {"train_loss": -11.073075294494629, "global_step": 218792, "epoch": 1302} {"train_loss": -10.838404655456543, "global_step": 218793, "epoch": 1302} {"train_loss": -10.818878173828125, "global_step": 218794, "epoch": 1302} {"train_loss": -11.307939529418945, "global_step": 218795, "epoch": 1302} {"train_loss": -10.93470573425293, "global_step": 218796, "epoch": 1302} {"train_loss": -11.381168365478516, "global_step": 218797, "epoch": 1302} {"train_loss": -10.831520080566406, "global_step": 218798, "epoch": 1302} {"train_loss": -10.543182373046875, "global_step": 218799, "epoch": 1302} {"train_loss": -11.139791488647461, "global_step": 218800, "epoch": 1302} {"train_loss": -11.120004653930664, "global_step": 218801, "epoch": 1302} {"train_loss": -10.785621643066406, "global_step": 218802, "epoch": 1302} {"train_loss": -11.39609146118164, "global_step": 218803, "epoch": 1302} {"train_loss": -10.750211715698242, "global_step": 218804, "epoch": 1302} {"train_loss": -11.332531929016113, "global_step": 218805, "epoch": 1302} {"train_loss": -11.235525131225586, "global_step": 218806, "epoch": 1302} {"train_loss": -11.36429214477539, "global_step": 218807, "epoch": 1302} {"train_loss": -11.271919250488281, "global_step": 218808, "epoch": 1302} {"train_loss": -11.283178329467773, "global_step": 218809, "epoch": 1302} {"train_loss": -11.348855972290039, "global_step": 218810, "epoch": 1302} {"train_loss": -11.414461135864258, "global_step": 218811, "epoch": 1302} {"train_loss": -11.645197868347168, "global_step": 218812, "epoch": 1302} {"train_loss": -11.657193183898926, "global_step": 218813, "epoch": 1302} {"train_loss": -11.656631469726562, "global_step": 218814, "epoch": 1302} {"train_loss": -11.596450805664062, "global_step": 218815, "epoch": 1302} {"train_loss": -11.712186813354492, "global_step": 218816, "epoch": 1302} {"train_loss": -11.56736946105957, "global_step": 218817, "epoch": 1302} {"train_loss": -11.68570613861084, "global_step": 218818, "epoch": 1302} {"train_loss": -11.632318496704102, "global_step": 218819, "epoch": 1302} {"train_loss": -11.641682624816895, "global_step": 218820, "epoch": 1302} {"train_loss": -11.894538879394531, "global_step": 218821, "epoch": 1302} {"train_loss": -11.87224006652832, "global_step": 218822, "epoch": 1302} {"train_loss": -11.907541275024414, "global_step": 218823, "epoch": 1302} {"train_loss": -11.850503921508789, "global_step": 218824, "epoch": 1302} {"train_loss": -11.824773788452148, "global_step": 218825, "epoch": 1302} {"train_loss": -11.728401184082031, "global_step": 218826, "epoch": 1302} {"train_loss": -11.9263916015625, "global_step": 218827, "epoch": 1302} {"train_loss": -11.700098037719727, "global_step": 218828, "epoch": 1302} {"train_loss": -11.911893844604492, "global_step": 218829, "epoch": 1302} {"train_loss": -11.730998992919922, "global_step": 218830, "epoch": 1302} {"train_loss": -11.909830093383789, "global_step": 218831, "epoch": 1302} {"train_loss": -11.752816200256348, "global_step": 218832, "epoch": 1302} {"train_loss": -11.81711196899414, "global_step": 218833, "epoch": 1302} {"train_loss": -11.800261497497559, "global_step": 218834, "epoch": 1302} {"train_loss": -11.692733764648438, "global_step": 218835, "epoch": 1302} {"train_loss": -11.717695236206055, "global_step": 218836, "epoch": 1302} {"train_loss": -11.656450271606445, "global_step": 218837, "epoch": 1302} {"train_loss": -11.811602592468262, "global_step": 218838, "epoch": 1302} {"train_loss": -11.78353500366211, "global_step": 218839, "epoch": 1302} {"train_loss": -11.840396881103516, "global_step": 218840, "epoch": 1302} {"train_loss": -11.850682258605957, "global_step": 218841, "epoch": 1302} {"train_loss": -11.264324188232422, "global_step": 218842, "epoch": 1302} {"train_loss": -11.739936828613281, "global_step": 218843, "epoch": 1302} {"train_loss": -11.84946060180664, "global_step": 218844, "epoch": 1302} {"train_loss": -11.926023483276367, "global_step": 218845, "epoch": 1302} {"train_loss": -11.791990280151367, "global_step": 218846, "epoch": 1302} {"train_loss": -11.798755645751953, "global_step": 218847, "epoch": 1302} {"train_loss": -11.839672088623047, "global_step": 218848, "epoch": 1302} {"train_loss": -11.652952194213867, "global_step": 218849, "epoch": 1302} {"train_loss": -11.489143371582031, "global_step": 218850, "epoch": 1302} {"train_loss": -11.672316551208496, "global_step": 218851, "epoch": 1302} {"train_loss": -11.200870513916016, "global_step": 218852, "epoch": 1302} {"train_loss": -11.340932846069336, "global_step": 218853, "epoch": 1302} {"train_loss": -11.774150848388672, "global_step": 218854, "epoch": 1302} {"train_loss": -10.470640182495117, "global_step": 218855, "epoch": 1302} {"train_loss": -11.028610229492188, "global_step": 218856, "epoch": 1302} {"train_loss": -11.752069473266602, "global_step": 218857, "epoch": 1302} {"train_loss": -10.327433586120605, "global_step": 218858, "epoch": 1302} {"train_loss": -11.380821228027344, "global_step": 218859, "epoch": 1302} {"train_loss": -9.955881118774414, "global_step": 218860, "epoch": 1302} {"train_loss": -9.992790222167969, "global_step": 218861, "epoch": 1302} {"train_loss": -10.514932632446289, "global_step": 218862, "epoch": 1302} {"train_loss": -10.90974235534668, "global_step": 218863, "epoch": 1302} {"train_loss": -10.493213653564453, "global_step": 218864, "epoch": 1302} {"train_loss": -10.976522445678711, "global_step": 218865, "epoch": 1302} {"train_loss": -11.109298706054688, "global_step": 218866, "epoch": 1302} {"train_loss": -10.5436372756958, "global_step": 218867, "epoch": 1302} {"train_loss": -11.584268569946289, "global_step": 218868, "epoch": 1302} {"train_loss": -10.790946960449219, "global_step": 218869, "epoch": 1302} {"train_loss": -10.971227645874023, "global_step": 218870, "epoch": 1302} {"train_loss": -10.880375862121582, "global_step": 218871, "epoch": 1302} {"train_loss": -10.895155906677246, "global_step": 218872, "epoch": 1302} {"train_loss": -11.260528564453125, "global_step": 218873, "epoch": 1302} {"train_loss": -10.991464614868164, "global_step": 218874, "epoch": 1302} {"train_loss": -11.462089538574219, "global_step": 218875, "epoch": 1302} {"train_loss": -11.195535659790039, "global_step": 218876, "epoch": 1302} {"train_loss": -11.319559097290039, "global_step": 218877, "epoch": 1302} {"train_loss": -11.51235580444336, "global_step": 218878, "epoch": 1302} {"train_loss": -11.464896202087402, "global_step": 218879, "epoch": 1302} {"train_loss": -11.597365379333496, "global_step": 218880, "epoch": 1302} {"train_loss": -10.797056198120117, "global_step": 218881, "epoch": 1302} {"train_loss": -11.429555892944336, "global_step": 218882, "epoch": 1302} {"train_loss": -11.124204635620117, "global_step": 218883, "epoch": 1302} {"train_loss": -11.592668533325195, "global_step": 218884, "epoch": 1302} {"train_loss": -11.715836524963379, "global_step": 218885, "epoch": 1302} {"train_loss": -11.569887161254883, "global_step": 218886, "epoch": 1302} {"train_loss": -11.713004112243652, "global_step": 218887, "epoch": 1302} {"train_loss": -11.523609161376953, "global_step": 218888, "epoch": 1302} {"train_loss": -11.698240280151367, "global_step": 218889, "epoch": 1302} {"train_loss": -11.49420166015625, "global_step": 218890, "epoch": 1302} {"train_loss": -11.7943115234375, "global_step": 218891, "epoch": 1302} {"train_loss": -11.535585403442383, "global_step": 218892, "epoch": 1302} {"train_loss": -11.652432441711426, "global_step": 218893, "epoch": 1302} {"train_loss": -11.591432571411133, "global_step": 218894, "epoch": 1302} {"train_loss": -11.735466003417969, "global_step": 218895, "epoch": 1302} {"train_loss": -11.84278392791748, "global_step": 218896, "epoch": 1302} {"train_loss": -11.630393981933594, "global_step": 218897, "epoch": 1302} {"train_loss": -11.480865478515625, "global_step": 218898, "epoch": 1302} {"train_loss": -11.558798789978027, "global_step": 218899, "epoch": 1302} {"train_loss": -11.419632911682129, "global_step": 218900, "epoch": 1302} {"train_loss": -11.710835456848145, "global_step": 218901, "epoch": 1302} {"train_loss": -11.416770935058594, "global_step": 218902, "epoch": 1302} {"train_loss": -11.24113743078141, "global_step": 218903, "epoch": 1302, "val_loss": 258494.875} {"train_loss": -11.664298057556152, "global_step": 218904, "epoch": 1303} {"train_loss": -10.381420135498047, "global_step": 218905, "epoch": 1303} {"train_loss": -11.67662525177002, "global_step": 218906, "epoch": 1303} {"train_loss": -10.439727783203125, "global_step": 218907, "epoch": 1303} {"train_loss": -11.512039184570312, "global_step": 218908, "epoch": 1303} {"train_loss": -10.721508026123047, "global_step": 218909, "epoch": 1303} {"train_loss": -11.478371620178223, "global_step": 218910, "epoch": 1303} {"train_loss": -10.96041488647461, "global_step": 218911, "epoch": 1303} {"train_loss": -10.988932609558105, "global_step": 218912, "epoch": 1303} {"train_loss": -11.596766471862793, "global_step": 218913, "epoch": 1303} {"train_loss": -10.7210693359375, "global_step": 218914, "epoch": 1303} {"train_loss": -11.729970932006836, "global_step": 218915, "epoch": 1303} {"train_loss": -10.90302848815918, "global_step": 218916, "epoch": 1303} {"train_loss": -11.545638084411621, "global_step": 218917, "epoch": 1303} {"train_loss": -10.90748405456543, "global_step": 218918, "epoch": 1303} {"train_loss": -11.495630264282227, "global_step": 218919, "epoch": 1303} {"train_loss": -11.112588882446289, "global_step": 218920, "epoch": 1303} {"train_loss": -11.500718116760254, "global_step": 218921, "epoch": 1303} {"train_loss": -10.78378963470459, "global_step": 218922, "epoch": 1303} {"train_loss": -11.160240173339844, "global_step": 218923, "epoch": 1303} {"train_loss": -10.515373229980469, "global_step": 218924, "epoch": 1303} {"train_loss": -11.343746185302734, "global_step": 218925, "epoch": 1303} {"train_loss": -10.723037719726562, "global_step": 218926, "epoch": 1303} {"train_loss": -11.156742095947266, "global_step": 218927, "epoch": 1303} {"train_loss": -11.275227546691895, "global_step": 218928, "epoch": 1303} {"train_loss": -10.784348487854004, "global_step": 218929, "epoch": 1303} {"train_loss": -11.551675796508789, "global_step": 218930, "epoch": 1303} {"train_loss": -10.91714859008789, "global_step": 218931, "epoch": 1303} {"train_loss": -11.23920726776123, "global_step": 218932, "epoch": 1303} {"train_loss": -11.24035358428955, "global_step": 218933, "epoch": 1303} {"train_loss": -10.943300247192383, "global_step": 218934, "epoch": 1303} {"train_loss": -11.53095531463623, "global_step": 218935, "epoch": 1303} {"train_loss": -10.785457611083984, "global_step": 218936, "epoch": 1303} {"train_loss": -10.919103622436523, "global_step": 218937, "epoch": 1303} {"train_loss": -11.642770767211914, "global_step": 218938, "epoch": 1303} {"train_loss": -10.969572067260742, "global_step": 218939, "epoch": 1303} {"train_loss": -11.58973503112793, "global_step": 218940, "epoch": 1303} {"train_loss": -11.419931411743164, "global_step": 218941, "epoch": 1303} {"train_loss": -11.194819450378418, "global_step": 218942, "epoch": 1303} {"train_loss": -11.794242858886719, "global_step": 218943, "epoch": 1303} {"train_loss": -11.249666213989258, "global_step": 218944, "epoch": 1303} {"train_loss": -11.458130836486816, "global_step": 218945, "epoch": 1303} {"train_loss": -11.61260986328125, "global_step": 218946, "epoch": 1303} {"train_loss": -11.406145095825195, "global_step": 218947, "epoch": 1303} {"train_loss": -11.485489845275879, "global_step": 218948, "epoch": 1303} {"train_loss": -11.67805290222168, "global_step": 218949, "epoch": 1303} {"train_loss": -11.442770957946777, "global_step": 218950, "epoch": 1303} {"train_loss": -11.561023712158203, "global_step": 218951, "epoch": 1303} {"train_loss": -11.573015213012695, "global_step": 218952, "epoch": 1303} {"train_loss": -11.62285041809082, "global_step": 218953, "epoch": 1303} {"train_loss": -11.67029857635498, "global_step": 218954, "epoch": 1303} {"train_loss": -11.654394149780273, "global_step": 218955, "epoch": 1303} {"train_loss": -11.343147277832031, "global_step": 218956, "epoch": 1303} {"train_loss": -11.67982292175293, "global_step": 218957, "epoch": 1303} {"train_loss": -11.462904930114746, "global_step": 218958, "epoch": 1303} {"train_loss": -11.335816383361816, "global_step": 218959, "epoch": 1303} {"train_loss": -11.21324348449707, "global_step": 218960, "epoch": 1303} {"train_loss": -11.485780715942383, "global_step": 218961, "epoch": 1303} {"train_loss": -11.509456634521484, "global_step": 218962, "epoch": 1303} {"train_loss": -11.53444766998291, "global_step": 218963, "epoch": 1303} {"train_loss": -11.675131797790527, "global_step": 218964, "epoch": 1303} {"train_loss": -11.617181777954102, "global_step": 218965, "epoch": 1303} {"train_loss": -11.725311279296875, "global_step": 218966, "epoch": 1303} {"train_loss": -11.613337516784668, "global_step": 218967, "epoch": 1303} {"train_loss": -11.81307315826416, "global_step": 218968, "epoch": 1303} {"train_loss": -11.664684295654297, "global_step": 218969, "epoch": 1303} {"train_loss": -11.782548904418945, "global_step": 218970, "epoch": 1303} {"train_loss": -11.656501770019531, "global_step": 218971, "epoch": 1303} {"train_loss": -11.79987621307373, "global_step": 218972, "epoch": 1303} {"train_loss": -11.711614608764648, "global_step": 218973, "epoch": 1303} {"train_loss": -11.885876655578613, "global_step": 218974, "epoch": 1303} {"train_loss": -11.888376235961914, "global_step": 218975, "epoch": 1303} {"train_loss": -11.700867652893066, "global_step": 218976, "epoch": 1303} {"train_loss": -11.845550537109375, "global_step": 218977, "epoch": 1303} {"train_loss": -11.695943832397461, "global_step": 218978, "epoch": 1303} {"train_loss": -11.558156967163086, "global_step": 218979, "epoch": 1303} {"train_loss": -11.661330223083496, "global_step": 218980, "epoch": 1303} {"train_loss": -11.477136611938477, "global_step": 218981, "epoch": 1303} {"train_loss": -11.863567352294922, "global_step": 218982, "epoch": 1303} {"train_loss": -11.705249786376953, "global_step": 218983, "epoch": 1303} {"train_loss": -11.671557426452637, "global_step": 218984, "epoch": 1303} {"train_loss": -11.710366249084473, "global_step": 218985, "epoch": 1303} {"train_loss": -11.847750663757324, "global_step": 218986, "epoch": 1303} {"train_loss": -11.70106315612793, "global_step": 218987, "epoch": 1303} {"train_loss": -11.560097694396973, "global_step": 218988, "epoch": 1303} {"train_loss": -11.764352798461914, "global_step": 218989, "epoch": 1303} {"train_loss": -11.455289840698242, "global_step": 218990, "epoch": 1303} {"train_loss": -10.93907356262207, "global_step": 218991, "epoch": 1303} {"train_loss": -11.556685447692871, "global_step": 218992, "epoch": 1303} {"train_loss": -11.327889442443848, "global_step": 218993, "epoch": 1303} {"train_loss": -11.326539993286133, "global_step": 218994, "epoch": 1303} {"train_loss": -11.630171775817871, "global_step": 218995, "epoch": 1303} {"train_loss": -11.494560241699219, "global_step": 218996, "epoch": 1303} {"train_loss": -11.782451629638672, "global_step": 218997, "epoch": 1303} {"train_loss": -11.344735145568848, "global_step": 218998, "epoch": 1303} {"train_loss": -11.515288352966309, "global_step": 218999, "epoch": 1303} {"train_loss": -11.814728736877441, "global_step": 219000, "epoch": 1303} {"train_loss": -11.939643859863281, "global_step": 219001, "epoch": 1303} {"train_loss": -11.89855670928955, "global_step": 219002, "epoch": 1303} {"train_loss": -11.680975914001465, "global_step": 219003, "epoch": 1303} {"train_loss": -11.853304862976074, "global_step": 219004, "epoch": 1303} {"train_loss": -11.808161735534668, "global_step": 219005, "epoch": 1303} {"train_loss": -11.707159042358398, "global_step": 219006, "epoch": 1303} {"train_loss": -11.529022216796875, "global_step": 219007, "epoch": 1303} {"train_loss": -11.931730270385742, "global_step": 219008, "epoch": 1303} {"train_loss": -11.854191780090332, "global_step": 219009, "epoch": 1303} {"train_loss": -11.647318840026855, "global_step": 219010, "epoch": 1303} {"train_loss": -11.853323936462402, "global_step": 219011, "epoch": 1303} {"train_loss": -11.670167922973633, "global_step": 219012, "epoch": 1303} {"train_loss": -11.75493049621582, "global_step": 219013, "epoch": 1303} {"train_loss": -11.936508178710938, "global_step": 219014, "epoch": 1303} {"train_loss": -11.169715881347656, "global_step": 219015, "epoch": 1303} {"train_loss": -11.770938873291016, "global_step": 219016, "epoch": 1303} {"train_loss": -11.415895462036133, "global_step": 219017, "epoch": 1303} {"train_loss": -11.899212837219238, "global_step": 219018, "epoch": 1303} {"train_loss": -11.171117782592773, "global_step": 219019, "epoch": 1303} {"train_loss": -11.65200424194336, "global_step": 219020, "epoch": 1303} {"train_loss": -11.538784980773926, "global_step": 219021, "epoch": 1303} {"train_loss": -11.563124656677246, "global_step": 219022, "epoch": 1303} {"train_loss": -11.4345703125, "global_step": 219023, "epoch": 1303} {"train_loss": -11.258645057678223, "global_step": 219024, "epoch": 1303} {"train_loss": -10.980245590209961, "global_step": 219025, "epoch": 1303} {"train_loss": -11.787909507751465, "global_step": 219026, "epoch": 1303} {"train_loss": -11.050810813903809, "global_step": 219027, "epoch": 1303} {"train_loss": -11.265436172485352, "global_step": 219028, "epoch": 1303} {"train_loss": -11.19715404510498, "global_step": 219029, "epoch": 1303} {"train_loss": -11.149080276489258, "global_step": 219030, "epoch": 1303} {"train_loss": -9.278022766113281, "global_step": 219031, "epoch": 1303} {"train_loss": -10.978899002075195, "global_step": 219032, "epoch": 1303} {"train_loss": -8.875381469726562, "global_step": 219033, "epoch": 1303} {"train_loss": -9.481504440307617, "global_step": 219034, "epoch": 1303} {"train_loss": -11.046035766601562, "global_step": 219035, "epoch": 1303} {"train_loss": -7.652793884277344, "global_step": 219036, "epoch": 1303} {"train_loss": -10.301877975463867, "global_step": 219037, "epoch": 1303} {"train_loss": -8.560306549072266, "global_step": 219038, "epoch": 1303} {"train_loss": -9.633890151977539, "global_step": 219039, "epoch": 1303} {"train_loss": -9.11375904083252, "global_step": 219040, "epoch": 1303} {"train_loss": -9.94325065612793, "global_step": 219041, "epoch": 1303} {"train_loss": -9.895037651062012, "global_step": 219042, "epoch": 1303} {"train_loss": -10.748289108276367, "global_step": 219043, "epoch": 1303} {"train_loss": -8.797728538513184, "global_step": 219044, "epoch": 1303} {"train_loss": -10.480491638183594, "global_step": 219045, "epoch": 1303} {"train_loss": -10.64889144897461, "global_step": 219046, "epoch": 1303} {"train_loss": -10.056780815124512, "global_step": 219047, "epoch": 1303} {"train_loss": -11.02322769165039, "global_step": 219048, "epoch": 1303} {"train_loss": -10.390024185180664, "global_step": 219049, "epoch": 1303} {"train_loss": -10.645512580871582, "global_step": 219050, "epoch": 1303} {"train_loss": -10.973597526550293, "global_step": 219051, "epoch": 1303} {"train_loss": -10.709526062011719, "global_step": 219052, "epoch": 1303} {"train_loss": -10.830412864685059, "global_step": 219053, "epoch": 1303} {"train_loss": -10.959543228149414, "global_step": 219054, "epoch": 1303} {"train_loss": -10.681182861328125, "global_step": 219055, "epoch": 1303} {"train_loss": -10.972905158996582, "global_step": 219056, "epoch": 1303} {"train_loss": -11.007040023803711, "global_step": 219057, "epoch": 1303} {"train_loss": -10.924551010131836, "global_step": 219058, "epoch": 1303} {"train_loss": -11.372485160827637, "global_step": 219059, "epoch": 1303} {"train_loss": -11.188811302185059, "global_step": 219060, "epoch": 1303} {"train_loss": -11.057458877563477, "global_step": 219061, "epoch": 1303} {"train_loss": -11.431425094604492, "global_step": 219062, "epoch": 1303} {"train_loss": -10.950403213500977, "global_step": 219063, "epoch": 1303} {"train_loss": -11.083956718444824, "global_step": 219064, "epoch": 1303} {"train_loss": -11.178824424743652, "global_step": 219065, "epoch": 1303} {"train_loss": -11.316448211669922, "global_step": 219066, "epoch": 1303} {"train_loss": -11.395475387573242, "global_step": 219067, "epoch": 1303} {"train_loss": -11.310264587402344, "global_step": 219068, "epoch": 1303} {"train_loss": -11.175018310546875, "global_step": 219069, "epoch": 1303} {"train_loss": -11.432981491088867, "global_step": 219070, "epoch": 1303} {"train_loss": -11.223228664625259, "global_step": 219071, "epoch": 1303, "val_loss": 261985.625} {"train_loss": -11.349945068359375, "global_step": 219072, "epoch": 1304} {"train_loss": -11.122223854064941, "global_step": 219073, "epoch": 1304} {"train_loss": -11.373597145080566, "global_step": 219074, "epoch": 1304} {"train_loss": -11.264410972595215, "global_step": 219075, "epoch": 1304} {"train_loss": -11.428704261779785, "global_step": 219076, "epoch": 1304} {"train_loss": -11.316070556640625, "global_step": 219077, "epoch": 1304} {"train_loss": -11.624811172485352, "global_step": 219078, "epoch": 1304} {"train_loss": -11.395109176635742, "global_step": 219079, "epoch": 1304} {"train_loss": -11.437003135681152, "global_step": 219080, "epoch": 1304} {"train_loss": -11.455175399780273, "global_step": 219081, "epoch": 1304} {"train_loss": -11.550498962402344, "global_step": 219082, "epoch": 1304} {"train_loss": -11.41996955871582, "global_step": 219083, "epoch": 1304} {"train_loss": -11.390792846679688, "global_step": 219084, "epoch": 1304} {"train_loss": -11.625457763671875, "global_step": 219085, "epoch": 1304} {"train_loss": -11.489839553833008, "global_step": 219086, "epoch": 1304} {"train_loss": -11.711678504943848, "global_step": 219087, "epoch": 1304} {"train_loss": -11.604198455810547, "global_step": 219088, "epoch": 1304} {"train_loss": -11.668770790100098, "global_step": 219089, "epoch": 1304} {"train_loss": -11.599113464355469, "global_step": 219090, "epoch": 1304} {"train_loss": -11.604413986206055, "global_step": 219091, "epoch": 1304} {"train_loss": -11.635412216186523, "global_step": 219092, "epoch": 1304} {"train_loss": -11.673239707946777, "global_step": 219093, "epoch": 1304} {"train_loss": -11.714451789855957, "global_step": 219094, "epoch": 1304} {"train_loss": -11.634004592895508, "global_step": 219095, "epoch": 1304} {"train_loss": -11.59040641784668, "global_step": 219096, "epoch": 1304} {"train_loss": -11.778614044189453, "global_step": 219097, "epoch": 1304} {"train_loss": -11.525331497192383, "global_step": 219098, "epoch": 1304} {"train_loss": -11.62922477722168, "global_step": 219099, "epoch": 1304} {"train_loss": -11.731582641601562, "global_step": 219100, "epoch": 1304} {"train_loss": -11.56342887878418, "global_step": 219101, "epoch": 1304} {"train_loss": -11.905515670776367, "global_step": 219102, "epoch": 1304} {"train_loss": -11.733396530151367, "global_step": 219103, "epoch": 1304} {"train_loss": -11.620431900024414, "global_step": 219104, "epoch": 1304} {"train_loss": -11.918069839477539, "global_step": 219105, "epoch": 1304} {"train_loss": -11.788517951965332, "global_step": 219106, "epoch": 1304} {"train_loss": -11.765907287597656, "global_step": 219107, "epoch": 1304} {"train_loss": -11.926691055297852, "global_step": 219108, "epoch": 1304} {"train_loss": -11.62387752532959, "global_step": 219109, "epoch": 1304} {"train_loss": -11.766563415527344, "global_step": 219110, "epoch": 1304} {"train_loss": -11.839426040649414, "global_step": 219111, "epoch": 1304} {"train_loss": -11.697616577148438, "global_step": 219112, "epoch": 1304} {"train_loss": -11.967809677124023, "global_step": 219113, "epoch": 1304} {"train_loss": -11.823159217834473, "global_step": 219114, "epoch": 1304} {"train_loss": -12.055830001831055, "global_step": 219115, "epoch": 1304} {"train_loss": -11.586305618286133, "global_step": 219116, "epoch": 1304} {"train_loss": -12.047361373901367, "global_step": 219117, "epoch": 1304} {"train_loss": -11.879810333251953, "global_step": 219118, "epoch": 1304} {"train_loss": -11.974849700927734, "global_step": 219119, "epoch": 1304} {"train_loss": -11.978558540344238, "global_step": 219120, "epoch": 1304} {"train_loss": -11.890291213989258, "global_step": 219121, "epoch": 1304} {"train_loss": -12.112289428710938, "global_step": 219122, "epoch": 1304} {"train_loss": -11.882230758666992, "global_step": 219123, "epoch": 1304} {"train_loss": -11.940479278564453, "global_step": 219124, "epoch": 1304} {"train_loss": -12.062966346740723, "global_step": 219125, "epoch": 1304} {"train_loss": -11.82199478149414, "global_step": 219126, "epoch": 1304} {"train_loss": -11.97663688659668, "global_step": 219127, "epoch": 1304} {"train_loss": -12.124504089355469, "global_step": 219128, "epoch": 1304} {"train_loss": -11.767541885375977, "global_step": 219129, "epoch": 1304} {"train_loss": -12.173762321472168, "global_step": 219130, "epoch": 1304} {"train_loss": -11.874632835388184, "global_step": 219131, "epoch": 1304} {"train_loss": -11.994625091552734, "global_step": 219132, "epoch": 1304} {"train_loss": -11.911230087280273, "global_step": 219133, "epoch": 1304} {"train_loss": -11.901273727416992, "global_step": 219134, "epoch": 1304} {"train_loss": -11.734945297241211, "global_step": 219135, "epoch": 1304} {"train_loss": -11.202269554138184, "global_step": 219136, "epoch": 1304} {"train_loss": -11.860342025756836, "global_step": 219137, "epoch": 1304} {"train_loss": -12.164339065551758, "global_step": 219138, "epoch": 1304} {"train_loss": -11.968788146972656, "global_step": 219139, "epoch": 1304} {"train_loss": -11.71566104888916, "global_step": 219140, "epoch": 1304} {"train_loss": -11.704500198364258, "global_step": 219141, "epoch": 1304} {"train_loss": -11.170879364013672, "global_step": 219142, "epoch": 1304} {"train_loss": -11.119329452514648, "global_step": 219143, "epoch": 1304} {"train_loss": -11.419092178344727, "global_step": 219144, "epoch": 1304} {"train_loss": -11.690765380859375, "global_step": 219145, "epoch": 1304} {"train_loss": -11.877532958984375, "global_step": 219146, "epoch": 1304} {"train_loss": -11.560783386230469, "global_step": 219147, "epoch": 1304} {"train_loss": -10.737460136413574, "global_step": 219148, "epoch": 1304} {"train_loss": -9.984655380249023, "global_step": 219149, "epoch": 1304} {"train_loss": -11.157270431518555, "global_step": 219150, "epoch": 1304} {"train_loss": -11.212190628051758, "global_step": 219151, "epoch": 1304} {"train_loss": -11.347082138061523, "global_step": 219152, "epoch": 1304} {"train_loss": -10.74647045135498, "global_step": 219153, "epoch": 1304} {"train_loss": -10.893128395080566, "global_step": 219154, "epoch": 1304} {"train_loss": -11.471587181091309, "global_step": 219155, "epoch": 1304} {"train_loss": -11.168584823608398, "global_step": 219156, "epoch": 1304} {"train_loss": -11.152091979980469, "global_step": 219157, "epoch": 1304} {"train_loss": -11.73103141784668, "global_step": 219158, "epoch": 1304} {"train_loss": -11.217100143432617, "global_step": 219159, "epoch": 1304} {"train_loss": -11.226465225219727, "global_step": 219160, "epoch": 1304} {"train_loss": -10.916370391845703, "global_step": 219161, "epoch": 1304} {"train_loss": -11.293075561523438, "global_step": 219162, "epoch": 1304} {"train_loss": -11.18292236328125, "global_step": 219163, "epoch": 1304} {"train_loss": -11.310314178466797, "global_step": 219164, "epoch": 1304} {"train_loss": -10.901031494140625, "global_step": 219165, "epoch": 1304} {"train_loss": -10.369640350341797, "global_step": 219166, "epoch": 1304} {"train_loss": -10.482854843139648, "global_step": 219167, "epoch": 1304} {"train_loss": -10.368727684020996, "global_step": 219168, "epoch": 1304} {"train_loss": -10.119924545288086, "global_step": 219169, "epoch": 1304} {"train_loss": -11.733960151672363, "global_step": 219170, "epoch": 1304} {"train_loss": -10.109668731689453, "global_step": 219171, "epoch": 1304} {"train_loss": -10.784571647644043, "global_step": 219172, "epoch": 1304} {"train_loss": -10.500410079956055, "global_step": 219173, "epoch": 1304} {"train_loss": -10.303640365600586, "global_step": 219174, "epoch": 1304} {"train_loss": -11.346153259277344, "global_step": 219175, "epoch": 1304} {"train_loss": -10.777864456176758, "global_step": 219176, "epoch": 1304} {"train_loss": -11.426122665405273, "global_step": 219177, "epoch": 1304} {"train_loss": -11.252935409545898, "global_step": 219178, "epoch": 1304} {"train_loss": -11.443755149841309, "global_step": 219179, "epoch": 1304} {"train_loss": -10.98211669921875, "global_step": 219180, "epoch": 1304} {"train_loss": -11.345321655273438, "global_step": 219181, "epoch": 1304} {"train_loss": -10.957947731018066, "global_step": 219182, "epoch": 1304} {"train_loss": -11.162976264953613, "global_step": 219183, "epoch": 1304} {"train_loss": -10.89306926727295, "global_step": 219184, "epoch": 1304} {"train_loss": -11.511086463928223, "global_step": 219185, "epoch": 1304} {"train_loss": -11.257288932800293, "global_step": 219186, "epoch": 1304} {"train_loss": -11.440727233886719, "global_step": 219187, "epoch": 1304} {"train_loss": -11.017372131347656, "global_step": 219188, "epoch": 1304} {"train_loss": -11.525793075561523, "global_step": 219189, "epoch": 1304} {"train_loss": -11.411656379699707, "global_step": 219190, "epoch": 1304} {"train_loss": -11.42397403717041, "global_step": 219191, "epoch": 1304} {"train_loss": -11.342535018920898, "global_step": 219192, "epoch": 1304} {"train_loss": -11.42475414276123, "global_step": 219193, "epoch": 1304} {"train_loss": -11.532644271850586, "global_step": 219194, "epoch": 1304} {"train_loss": -11.08575439453125, "global_step": 219195, "epoch": 1304} {"train_loss": -11.397122383117676, "global_step": 219196, "epoch": 1304} {"train_loss": -11.349679946899414, "global_step": 219197, "epoch": 1304} {"train_loss": -11.331523895263672, "global_step": 219198, "epoch": 1304} {"train_loss": -11.020633697509766, "global_step": 219199, "epoch": 1304} {"train_loss": -11.295279502868652, "global_step": 219200, "epoch": 1304} {"train_loss": -11.114782333374023, "global_step": 219201, "epoch": 1304} {"train_loss": -11.487545013427734, "global_step": 219202, "epoch": 1304} {"train_loss": -11.230551719665527, "global_step": 219203, "epoch": 1304} {"train_loss": -11.32474422454834, "global_step": 219204, "epoch": 1304} {"train_loss": -11.182926177978516, "global_step": 219205, "epoch": 1304} {"train_loss": -11.306354522705078, "global_step": 219206, "epoch": 1304} {"train_loss": -11.353447914123535, "global_step": 219207, "epoch": 1304} {"train_loss": -11.420584678649902, "global_step": 219208, "epoch": 1304} {"train_loss": -11.119796752929688, "global_step": 219209, "epoch": 1304} {"train_loss": -11.678177833557129, "global_step": 219210, "epoch": 1304} {"train_loss": -11.017074584960938, "global_step": 219211, "epoch": 1304} {"train_loss": -11.487554550170898, "global_step": 219212, "epoch": 1304} {"train_loss": -11.482736587524414, "global_step": 219213, "epoch": 1304} {"train_loss": -11.404253005981445, "global_step": 219214, "epoch": 1304} {"train_loss": -11.232513427734375, "global_step": 219215, "epoch": 1304} {"train_loss": -11.587944030761719, "global_step": 219216, "epoch": 1304} {"train_loss": -11.256633758544922, "global_step": 219217, "epoch": 1304} {"train_loss": -11.491517066955566, "global_step": 219218, "epoch": 1304} {"train_loss": -11.100347518920898, "global_step": 219219, "epoch": 1304} {"train_loss": -11.424982070922852, "global_step": 219220, "epoch": 1304} {"train_loss": -11.565451622009277, "global_step": 219221, "epoch": 1304} {"train_loss": -11.464884757995605, "global_step": 219222, "epoch": 1304} {"train_loss": -11.521587371826172, "global_step": 219223, "epoch": 1304} {"train_loss": -11.54170036315918, "global_step": 219224, "epoch": 1304} {"train_loss": -11.891388893127441, "global_step": 219225, "epoch": 1304} {"train_loss": -11.622648239135742, "global_step": 219226, "epoch": 1304} {"train_loss": -11.651106834411621, "global_step": 219227, "epoch": 1304} {"train_loss": -11.389619827270508, "global_step": 219228, "epoch": 1304} {"train_loss": -11.834413528442383, "global_step": 219229, "epoch": 1304} {"train_loss": -11.628840446472168, "global_step": 219230, "epoch": 1304} {"train_loss": -11.728408813476562, "global_step": 219231, "epoch": 1304} {"train_loss": -11.728748321533203, "global_step": 219232, "epoch": 1304} {"train_loss": -11.671960830688477, "global_step": 219233, "epoch": 1304} {"train_loss": -11.68639087677002, "global_step": 219234, "epoch": 1304} {"train_loss": -11.517087936401367, "global_step": 219235, "epoch": 1304} {"train_loss": -11.826814651489258, "global_step": 219236, "epoch": 1304} {"train_loss": -11.648696899414062, "global_step": 219237, "epoch": 1304} {"train_loss": -11.831635475158691, "global_step": 219238, "epoch": 1304} {"train_loss": -11.457434841564723, "global_step": 219239, "epoch": 1304, "val_loss": 259331.046875} {"train_loss": -11.870317459106445, "global_step": 219240, "epoch": 1305} {"train_loss": -11.781652450561523, "global_step": 219241, "epoch": 1305} {"train_loss": -11.68972396850586, "global_step": 219242, "epoch": 1305} {"train_loss": -11.818678855895996, "global_step": 219243, "epoch": 1305} {"train_loss": -11.618724822998047, "global_step": 219244, "epoch": 1305} {"train_loss": -11.83875846862793, "global_step": 219245, "epoch": 1305} {"train_loss": -11.598755836486816, "global_step": 219246, "epoch": 1305} {"train_loss": -11.288797378540039, "global_step": 219247, "epoch": 1305} {"train_loss": -11.501980781555176, "global_step": 219248, "epoch": 1305} {"train_loss": -11.77796459197998, "global_step": 219249, "epoch": 1305} {"train_loss": -11.371882438659668, "global_step": 219250, "epoch": 1305} {"train_loss": -12.003768920898438, "global_step": 219251, "epoch": 1305} {"train_loss": -11.23640251159668, "global_step": 219252, "epoch": 1305} {"train_loss": -10.282798767089844, "global_step": 219253, "epoch": 1305} {"train_loss": -11.492353439331055, "global_step": 219254, "epoch": 1305} {"train_loss": -11.109786033630371, "global_step": 219255, "epoch": 1305} {"train_loss": -9.18449878692627, "global_step": 219256, "epoch": 1305} {"train_loss": -10.943380355834961, "global_step": 219257, "epoch": 1305} {"train_loss": -10.089393615722656, "global_step": 219258, "epoch": 1305} {"train_loss": -8.762950897216797, "global_step": 219259, "epoch": 1305} {"train_loss": -11.478259086608887, "global_step": 219260, "epoch": 1305} {"train_loss": -8.535415649414062, "global_step": 219261, "epoch": 1305} {"train_loss": -10.241470336914062, "global_step": 219262, "epoch": 1305} {"train_loss": -9.253511428833008, "global_step": 219263, "epoch": 1305} {"train_loss": -10.477337837219238, "global_step": 219264, "epoch": 1305} {"train_loss": -9.990058898925781, "global_step": 219265, "epoch": 1305} {"train_loss": -10.822274208068848, "global_step": 219266, "epoch": 1305} {"train_loss": -10.23897933959961, "global_step": 219267, "epoch": 1305} {"train_loss": -11.20609188079834, "global_step": 219268, "epoch": 1305} {"train_loss": -10.311236381530762, "global_step": 219269, "epoch": 1305} {"train_loss": -11.279857635498047, "global_step": 219270, "epoch": 1305} {"train_loss": -10.404155731201172, "global_step": 219271, "epoch": 1305} {"train_loss": -10.799195289611816, "global_step": 219272, "epoch": 1305} {"train_loss": -10.807024955749512, "global_step": 219273, "epoch": 1305} {"train_loss": -10.939302444458008, "global_step": 219274, "epoch": 1305} {"train_loss": -10.43747329711914, "global_step": 219275, "epoch": 1305} {"train_loss": -11.046144485473633, "global_step": 219276, "epoch": 1305} {"train_loss": -10.762594223022461, "global_step": 219277, "epoch": 1305} {"train_loss": -11.114636421203613, "global_step": 219278, "epoch": 1305} {"train_loss": -11.079998970031738, "global_step": 219279, "epoch": 1305} {"train_loss": -11.219844818115234, "global_step": 219280, "epoch": 1305} {"train_loss": -11.334385871887207, "global_step": 219281, "epoch": 1305} {"train_loss": -11.05767822265625, "global_step": 219282, "epoch": 1305} {"train_loss": -11.171335220336914, "global_step": 219283, "epoch": 1305} {"train_loss": -11.279916763305664, "global_step": 219284, "epoch": 1305} {"train_loss": -11.130180358886719, "global_step": 219285, "epoch": 1305} {"train_loss": -11.308122634887695, "global_step": 219286, "epoch": 1305} {"train_loss": -11.552173614501953, "global_step": 219287, "epoch": 1305} {"train_loss": -11.272068977355957, "global_step": 219288, "epoch": 1305} {"train_loss": -11.34918212890625, "global_step": 219289, "epoch": 1305} {"train_loss": -11.270029067993164, "global_step": 219290, "epoch": 1305} {"train_loss": -11.308758735656738, "global_step": 219291, "epoch": 1305} {"train_loss": -11.567940711975098, "global_step": 219292, "epoch": 1305} {"train_loss": -11.619521141052246, "global_step": 219293, "epoch": 1305} {"train_loss": -11.054210662841797, "global_step": 219294, "epoch": 1305} {"train_loss": -11.403258323669434, "global_step": 219295, "epoch": 1305} {"train_loss": -11.320556640625, "global_step": 219296, "epoch": 1305} {"train_loss": -11.574729919433594, "global_step": 219297, "epoch": 1305} {"train_loss": -11.626551628112793, "global_step": 219298, "epoch": 1305} {"train_loss": -11.410284042358398, "global_step": 219299, "epoch": 1305} {"train_loss": -11.545296669006348, "global_step": 219300, "epoch": 1305} {"train_loss": -11.43562126159668, "global_step": 219301, "epoch": 1305} {"train_loss": -11.343399047851562, "global_step": 219302, "epoch": 1305} {"train_loss": -11.661443710327148, "global_step": 219303, "epoch": 1305} {"train_loss": -11.473398208618164, "global_step": 219304, "epoch": 1305} {"train_loss": -11.345442771911621, "global_step": 219305, "epoch": 1305} {"train_loss": -11.477191925048828, "global_step": 219306, "epoch": 1305} {"train_loss": -11.323347091674805, "global_step": 219307, "epoch": 1305} {"train_loss": -11.839804649353027, "global_step": 219308, "epoch": 1305} {"train_loss": -11.332571983337402, "global_step": 219309, "epoch": 1305} {"train_loss": -11.81973648071289, "global_step": 219310, "epoch": 1305} {"train_loss": -11.779243469238281, "global_step": 219311, "epoch": 1305} {"train_loss": -11.704913139343262, "global_step": 219312, "epoch": 1305} {"train_loss": -11.536624908447266, "global_step": 219313, "epoch": 1305} {"train_loss": -11.663542747497559, "global_step": 219314, "epoch": 1305} {"train_loss": -11.560569763183594, "global_step": 219315, "epoch": 1305} {"train_loss": -11.68879508972168, "global_step": 219316, "epoch": 1305} {"train_loss": -11.727415084838867, "global_step": 219317, "epoch": 1305} {"train_loss": -11.77186107635498, "global_step": 219318, "epoch": 1305} {"train_loss": -11.919435501098633, "global_step": 219319, "epoch": 1305} {"train_loss": -11.927248001098633, "global_step": 219320, "epoch": 1305} {"train_loss": -11.958026885986328, "global_step": 219321, "epoch": 1305} {"train_loss": -11.682592391967773, "global_step": 219322, "epoch": 1305} {"train_loss": -11.913580894470215, "global_step": 219323, "epoch": 1305} {"train_loss": -11.82087516784668, "global_step": 219324, "epoch": 1305} {"train_loss": -11.727378845214844, "global_step": 219325, "epoch": 1305} {"train_loss": -11.904359817504883, "global_step": 219326, "epoch": 1305} {"train_loss": -11.87777328491211, "global_step": 219327, "epoch": 1305} {"train_loss": -11.890789031982422, "global_step": 219328, "epoch": 1305} {"train_loss": -11.688568115234375, "global_step": 219329, "epoch": 1305} {"train_loss": -11.950058937072754, "global_step": 219330, "epoch": 1305} {"train_loss": -11.939196586608887, "global_step": 219331, "epoch": 1305} {"train_loss": -11.99339771270752, "global_step": 219332, "epoch": 1305} {"train_loss": -11.777565956115723, "global_step": 219333, "epoch": 1305} {"train_loss": -11.879172325134277, "global_step": 219334, "epoch": 1305} {"train_loss": -11.680503845214844, "global_step": 219335, "epoch": 1305} {"train_loss": -11.928976058959961, "global_step": 219336, "epoch": 1305} {"train_loss": -12.0408935546875, "global_step": 219337, "epoch": 1305} {"train_loss": -11.903800964355469, "global_step": 219338, "epoch": 1305} {"train_loss": -12.09838581085205, "global_step": 219339, "epoch": 1305} {"train_loss": -11.727706909179688, "global_step": 219340, "epoch": 1305} {"train_loss": -11.790521621704102, "global_step": 219341, "epoch": 1305} {"train_loss": -11.789724349975586, "global_step": 219342, "epoch": 1305} {"train_loss": -12.025087356567383, "global_step": 219343, "epoch": 1305} {"train_loss": -11.957860946655273, "global_step": 219344, "epoch": 1305} {"train_loss": -11.470121383666992, "global_step": 219345, "epoch": 1305} {"train_loss": -11.755914688110352, "global_step": 219346, "epoch": 1305} {"train_loss": -11.902454376220703, "global_step": 219347, "epoch": 1305} {"train_loss": -11.919393539428711, "global_step": 219348, "epoch": 1305} {"train_loss": -11.736587524414062, "global_step": 219349, "epoch": 1305} {"train_loss": -12.011037826538086, "global_step": 219350, "epoch": 1305} {"train_loss": -11.938255310058594, "global_step": 219351, "epoch": 1305} {"train_loss": -11.732087135314941, "global_step": 219352, "epoch": 1305} {"train_loss": -12.126611709594727, "global_step": 219353, "epoch": 1305} {"train_loss": -11.930500030517578, "global_step": 219354, "epoch": 1305} {"train_loss": -11.906222343444824, "global_step": 219355, "epoch": 1305} {"train_loss": -11.729597091674805, "global_step": 219356, "epoch": 1305} {"train_loss": -11.789374351501465, "global_step": 219357, "epoch": 1305} {"train_loss": -11.736021995544434, "global_step": 219358, "epoch": 1305} {"train_loss": -12.017642974853516, "global_step": 219359, "epoch": 1305} {"train_loss": -11.713315963745117, "global_step": 219360, "epoch": 1305} {"train_loss": -11.510162353515625, "global_step": 219361, "epoch": 1305} {"train_loss": -11.175593376159668, "global_step": 219362, "epoch": 1305} {"train_loss": -11.080212593078613, "global_step": 219363, "epoch": 1305} {"train_loss": -11.310856819152832, "global_step": 219364, "epoch": 1305} {"train_loss": -11.843782424926758, "global_step": 219365, "epoch": 1305} {"train_loss": -11.007601737976074, "global_step": 219366, "epoch": 1305} {"train_loss": -11.639476776123047, "global_step": 219367, "epoch": 1305} {"train_loss": -11.044633865356445, "global_step": 219368, "epoch": 1305} {"train_loss": -9.86946964263916, "global_step": 219369, "epoch": 1305} {"train_loss": -11.445174217224121, "global_step": 219370, "epoch": 1305} {"train_loss": -11.128310203552246, "global_step": 219371, "epoch": 1305} {"train_loss": -11.037617683410645, "global_step": 219372, "epoch": 1305} {"train_loss": -11.580680847167969, "global_step": 219373, "epoch": 1305} {"train_loss": -10.591334342956543, "global_step": 219374, "epoch": 1305} {"train_loss": -10.645174026489258, "global_step": 219375, "epoch": 1305} {"train_loss": -11.359243392944336, "global_step": 219376, "epoch": 1305} {"train_loss": -10.520124435424805, "global_step": 219377, "epoch": 1305} {"train_loss": -11.549216270446777, "global_step": 219378, "epoch": 1305} {"train_loss": -10.74752140045166, "global_step": 219379, "epoch": 1305} {"train_loss": -11.36916732788086, "global_step": 219380, "epoch": 1305} {"train_loss": -11.375555038452148, "global_step": 219381, "epoch": 1305} {"train_loss": -11.341890335083008, "global_step": 219382, "epoch": 1305} {"train_loss": -11.188565254211426, "global_step": 219383, "epoch": 1305} {"train_loss": -11.48682975769043, "global_step": 219384, "epoch": 1305} {"train_loss": -11.623421669006348, "global_step": 219385, "epoch": 1305} {"train_loss": -10.830554962158203, "global_step": 219386, "epoch": 1305} {"train_loss": -10.986721992492676, "global_step": 219387, "epoch": 1305} {"train_loss": -11.359601974487305, "global_step": 219388, "epoch": 1305} {"train_loss": -11.180706977844238, "global_step": 219389, "epoch": 1305} {"train_loss": -11.337739944458008, "global_step": 219390, "epoch": 1305} {"train_loss": -11.428974151611328, "global_step": 219391, "epoch": 1305} {"train_loss": -10.922859191894531, "global_step": 219392, "epoch": 1305} {"train_loss": -10.890464782714844, "global_step": 219393, "epoch": 1305} {"train_loss": -10.5546875, "global_step": 219394, "epoch": 1305} {"train_loss": -11.106304168701172, "global_step": 219395, "epoch": 1305} {"train_loss": -11.39940071105957, "global_step": 219396, "epoch": 1305} {"train_loss": -10.161138534545898, "global_step": 219397, "epoch": 1305} {"train_loss": -11.083316802978516, "global_step": 219398, "epoch": 1305} {"train_loss": -10.51655101776123, "global_step": 219399, "epoch": 1305} {"train_loss": -10.967456817626953, "global_step": 219400, "epoch": 1305} {"train_loss": -11.376106262207031, "global_step": 219401, "epoch": 1305} {"train_loss": -11.085805892944336, "global_step": 219402, "epoch": 1305} {"train_loss": -11.030416488647461, "global_step": 219403, "epoch": 1305} {"train_loss": -11.55535888671875, "global_step": 219404, "epoch": 1305} {"train_loss": -11.171841621398926, "global_step": 219405, "epoch": 1305} {"train_loss": -11.28727912902832, "global_step": 219406, "epoch": 1305} {"train_loss": -11.32180452914465, "global_step": 219407, "epoch": 1305, "val_loss": 262781.09375, "train_action_mse_error": 1.4788451194763184} {"train_loss": -11.474014282226562, "global_step": 219408, "epoch": 1306} {"train_loss": -11.18089485168457, "global_step": 219409, "epoch": 1306} {"train_loss": -11.579242706298828, "global_step": 219410, "epoch": 1306} {"train_loss": -10.949180603027344, "global_step": 219411, "epoch": 1306} {"train_loss": -11.258380889892578, "global_step": 219412, "epoch": 1306} {"train_loss": -11.001986503601074, "global_step": 219413, "epoch": 1306} {"train_loss": -11.05130672454834, "global_step": 219414, "epoch": 1306} {"train_loss": -11.156534194946289, "global_step": 219415, "epoch": 1306} {"train_loss": -11.136739730834961, "global_step": 219416, "epoch": 1306} {"train_loss": -11.275458335876465, "global_step": 219417, "epoch": 1306} {"train_loss": -10.877900123596191, "global_step": 219418, "epoch": 1306} {"train_loss": -11.13551139831543, "global_step": 219419, "epoch": 1306} {"train_loss": -10.792978286743164, "global_step": 219420, "epoch": 1306} {"train_loss": -11.335515022277832, "global_step": 219421, "epoch": 1306} {"train_loss": -10.84196662902832, "global_step": 219422, "epoch": 1306} {"train_loss": -11.342588424682617, "global_step": 219423, "epoch": 1306} {"train_loss": -11.056656837463379, "global_step": 219424, "epoch": 1306} {"train_loss": -11.048321723937988, "global_step": 219425, "epoch": 1306} {"train_loss": -11.319109916687012, "global_step": 219426, "epoch": 1306} {"train_loss": -10.637308120727539, "global_step": 219427, "epoch": 1306} {"train_loss": -11.267963409423828, "global_step": 219428, "epoch": 1306} {"train_loss": -10.648981094360352, "global_step": 219429, "epoch": 1306} {"train_loss": -11.134693145751953, "global_step": 219430, "epoch": 1306} {"train_loss": -11.222334861755371, "global_step": 219431, "epoch": 1306} {"train_loss": -11.420902252197266, "global_step": 219432, "epoch": 1306} {"train_loss": -11.207276344299316, "global_step": 219433, "epoch": 1306} {"train_loss": -11.675052642822266, "global_step": 219434, "epoch": 1306} {"train_loss": -11.209728240966797, "global_step": 219435, "epoch": 1306} {"train_loss": -11.644137382507324, "global_step": 219436, "epoch": 1306} {"train_loss": -11.102611541748047, "global_step": 219437, "epoch": 1306} {"train_loss": -11.51939582824707, "global_step": 219438, "epoch": 1306} {"train_loss": -11.34411907196045, "global_step": 219439, "epoch": 1306} {"train_loss": -11.62753677368164, "global_step": 219440, "epoch": 1306} {"train_loss": -11.340978622436523, "global_step": 219441, "epoch": 1306} {"train_loss": -11.430827140808105, "global_step": 219442, "epoch": 1306} {"train_loss": -11.56506061553955, "global_step": 219443, "epoch": 1306} {"train_loss": -11.57326889038086, "global_step": 219444, "epoch": 1306} {"train_loss": -11.566655158996582, "global_step": 219445, "epoch": 1306} {"train_loss": -11.388383865356445, "global_step": 219446, "epoch": 1306} {"train_loss": -11.79110336303711, "global_step": 219447, "epoch": 1306} {"train_loss": -11.434944152832031, "global_step": 219448, "epoch": 1306} {"train_loss": -11.735393524169922, "global_step": 219449, "epoch": 1306} {"train_loss": -11.483060836791992, "global_step": 219450, "epoch": 1306} {"train_loss": -11.904025077819824, "global_step": 219451, "epoch": 1306} {"train_loss": -11.545820236206055, "global_step": 219452, "epoch": 1306} {"train_loss": -11.480009078979492, "global_step": 219453, "epoch": 1306} {"train_loss": -11.800182342529297, "global_step": 219454, "epoch": 1306} {"train_loss": -11.539176940917969, "global_step": 219455, "epoch": 1306} {"train_loss": -11.523283958435059, "global_step": 219456, "epoch": 1306} {"train_loss": -11.571534156799316, "global_step": 219457, "epoch": 1306} {"train_loss": -11.819852828979492, "global_step": 219458, "epoch": 1306} {"train_loss": -11.326762199401855, "global_step": 219459, "epoch": 1306} {"train_loss": -11.832643508911133, "global_step": 219460, "epoch": 1306} {"train_loss": -11.52115249633789, "global_step": 219461, "epoch": 1306} {"train_loss": -11.600854873657227, "global_step": 219462, "epoch": 1306} {"train_loss": -11.42741870880127, "global_step": 219463, "epoch": 1306} {"train_loss": -11.547345161437988, "global_step": 219464, "epoch": 1306} {"train_loss": -11.89572525024414, "global_step": 219465, "epoch": 1306} {"train_loss": -11.6420316696167, "global_step": 219466, "epoch": 1306} {"train_loss": -11.626346588134766, "global_step": 219467, "epoch": 1306} {"train_loss": -11.875509262084961, "global_step": 219468, "epoch": 1306} {"train_loss": -11.795454025268555, "global_step": 219469, "epoch": 1306} {"train_loss": -11.995479583740234, "global_step": 219470, "epoch": 1306} {"train_loss": -11.49573040008545, "global_step": 219471, "epoch": 1306} {"train_loss": -11.937957763671875, "global_step": 219472, "epoch": 1306} {"train_loss": -11.490171432495117, "global_step": 219473, "epoch": 1306} {"train_loss": -11.578424453735352, "global_step": 219474, "epoch": 1306} {"train_loss": -11.819269180297852, "global_step": 219475, "epoch": 1306} {"train_loss": -11.16732406616211, "global_step": 219476, "epoch": 1306} {"train_loss": -11.442373275756836, "global_step": 219477, "epoch": 1306} {"train_loss": -11.749133110046387, "global_step": 219478, "epoch": 1306} {"train_loss": -11.543792724609375, "global_step": 219479, "epoch": 1306} {"train_loss": -11.938070297241211, "global_step": 219480, "epoch": 1306} {"train_loss": -11.228519439697266, "global_step": 219481, "epoch": 1306} {"train_loss": -11.89097785949707, "global_step": 219482, "epoch": 1306} {"train_loss": -11.503766059875488, "global_step": 219483, "epoch": 1306} {"train_loss": -11.412034034729004, "global_step": 219484, "epoch": 1306} {"train_loss": -11.630850791931152, "global_step": 219485, "epoch": 1306} {"train_loss": -10.977317810058594, "global_step": 219486, "epoch": 1306} {"train_loss": -11.783442497253418, "global_step": 219487, "epoch": 1306} {"train_loss": -11.276208877563477, "global_step": 219488, "epoch": 1306} {"train_loss": -11.261157035827637, "global_step": 219489, "epoch": 1306} {"train_loss": -11.454264640808105, "global_step": 219490, "epoch": 1306} {"train_loss": -11.63486099243164, "global_step": 219491, "epoch": 1306} {"train_loss": -11.212900161743164, "global_step": 219492, "epoch": 1306} {"train_loss": -10.76124382019043, "global_step": 219493, "epoch": 1306} {"train_loss": -11.291130065917969, "global_step": 219494, "epoch": 1306} {"train_loss": -10.047372817993164, "global_step": 219495, "epoch": 1306} {"train_loss": -11.438858985900879, "global_step": 219496, "epoch": 1306} {"train_loss": -10.421795845031738, "global_step": 219497, "epoch": 1306} {"train_loss": -10.733110427856445, "global_step": 219498, "epoch": 1306} {"train_loss": -10.278059959411621, "global_step": 219499, "epoch": 1306} {"train_loss": -9.99125862121582, "global_step": 219500, "epoch": 1306} {"train_loss": -11.22714900970459, "global_step": 219501, "epoch": 1306} {"train_loss": -8.963364601135254, "global_step": 219502, "epoch": 1306} {"train_loss": -11.165334701538086, "global_step": 219503, "epoch": 1306} {"train_loss": -10.105733871459961, "global_step": 219504, "epoch": 1306} {"train_loss": -10.06489372253418, "global_step": 219505, "epoch": 1306} {"train_loss": -11.522427558898926, "global_step": 219506, "epoch": 1306} {"train_loss": -10.454643249511719, "global_step": 219507, "epoch": 1306} {"train_loss": -10.868922233581543, "global_step": 219508, "epoch": 1306} {"train_loss": -11.482229232788086, "global_step": 219509, "epoch": 1306} {"train_loss": -10.55163860321045, "global_step": 219510, "epoch": 1306} {"train_loss": -11.21902084350586, "global_step": 219511, "epoch": 1306} {"train_loss": -10.985607147216797, "global_step": 219512, "epoch": 1306} {"train_loss": -10.94703197479248, "global_step": 219513, "epoch": 1306} {"train_loss": -11.797927856445312, "global_step": 219514, "epoch": 1306} {"train_loss": -10.930035591125488, "global_step": 219515, "epoch": 1306} {"train_loss": -11.303382873535156, "global_step": 219516, "epoch": 1306} {"train_loss": -11.198683738708496, "global_step": 219517, "epoch": 1306} {"train_loss": -11.051141738891602, "global_step": 219518, "epoch": 1306} {"train_loss": -11.590712547302246, "global_step": 219519, "epoch": 1306} {"train_loss": -10.963565826416016, "global_step": 219520, "epoch": 1306} {"train_loss": -11.460591316223145, "global_step": 219521, "epoch": 1306} {"train_loss": -11.380773544311523, "global_step": 219522, "epoch": 1306} {"train_loss": -11.532964706420898, "global_step": 219523, "epoch": 1306} {"train_loss": -11.358465194702148, "global_step": 219524, "epoch": 1306} {"train_loss": -11.470090866088867, "global_step": 219525, "epoch": 1306} {"train_loss": -11.69361400604248, "global_step": 219526, "epoch": 1306} {"train_loss": -11.235093116760254, "global_step": 219527, "epoch": 1306} {"train_loss": -11.438337326049805, "global_step": 219528, "epoch": 1306} {"train_loss": -11.551929473876953, "global_step": 219529, "epoch": 1306} {"train_loss": -11.69886302947998, "global_step": 219530, "epoch": 1306} {"train_loss": -11.541316986083984, "global_step": 219531, "epoch": 1306} {"train_loss": -11.65848159790039, "global_step": 219532, "epoch": 1306} {"train_loss": -11.681264877319336, "global_step": 219533, "epoch": 1306} {"train_loss": -11.612640380859375, "global_step": 219534, "epoch": 1306} {"train_loss": -11.747796058654785, "global_step": 219535, "epoch": 1306} {"train_loss": -11.651775360107422, "global_step": 219536, "epoch": 1306} {"train_loss": -11.703380584716797, "global_step": 219537, "epoch": 1306} {"train_loss": -11.68890380859375, "global_step": 219538, "epoch": 1306} {"train_loss": -11.765945434570312, "global_step": 219539, "epoch": 1306} {"train_loss": -11.834676742553711, "global_step": 219540, "epoch": 1306} {"train_loss": -11.80120849609375, "global_step": 219541, "epoch": 1306} {"train_loss": -11.830303192138672, "global_step": 219542, "epoch": 1306} {"train_loss": -11.783205032348633, "global_step": 219543, "epoch": 1306} {"train_loss": -11.87047004699707, "global_step": 219544, "epoch": 1306} {"train_loss": -11.565598487854004, "global_step": 219545, "epoch": 1306} {"train_loss": -11.9375638961792, "global_step": 219546, "epoch": 1306} {"train_loss": -11.564624786376953, "global_step": 219547, "epoch": 1306} {"train_loss": -11.823397636413574, "global_step": 219548, "epoch": 1306} {"train_loss": -12.013479232788086, "global_step": 219549, "epoch": 1306} {"train_loss": -11.911588668823242, "global_step": 219550, "epoch": 1306} {"train_loss": -11.980552673339844, "global_step": 219551, "epoch": 1306} {"train_loss": -12.043251037597656, "global_step": 219552, "epoch": 1306} {"train_loss": -11.930427551269531, "global_step": 219553, "epoch": 1306} {"train_loss": -11.802215576171875, "global_step": 219554, "epoch": 1306} {"train_loss": -11.684813499450684, "global_step": 219555, "epoch": 1306} {"train_loss": -11.900812149047852, "global_step": 219556, "epoch": 1306} {"train_loss": -11.647632598876953, "global_step": 219557, "epoch": 1306} {"train_loss": -11.513813018798828, "global_step": 219558, "epoch": 1306} {"train_loss": -11.535401344299316, "global_step": 219559, "epoch": 1306} {"train_loss": -11.556812286376953, "global_step": 219560, "epoch": 1306} {"train_loss": -11.445039749145508, "global_step": 219561, "epoch": 1306} {"train_loss": -11.509048461914062, "global_step": 219562, "epoch": 1306} {"train_loss": -11.579696655273438, "global_step": 219563, "epoch": 1306} {"train_loss": -11.526215553283691, "global_step": 219564, "epoch": 1306} {"train_loss": -11.262372970581055, "global_step": 219565, "epoch": 1306} {"train_loss": -11.269947052001953, "global_step": 219566, "epoch": 1306} {"train_loss": -11.527920722961426, "global_step": 219567, "epoch": 1306} {"train_loss": -11.414822578430176, "global_step": 219568, "epoch": 1306} {"train_loss": -11.414592742919922, "global_step": 219569, "epoch": 1306} {"train_loss": -11.35641860961914, "global_step": 219570, "epoch": 1306} {"train_loss": -11.754494667053223, "global_step": 219571, "epoch": 1306} {"train_loss": -11.353358268737793, "global_step": 219572, "epoch": 1306} {"train_loss": -10.713741302490234, "global_step": 219573, "epoch": 1306} {"train_loss": -11.70050048828125, "global_step": 219574, "epoch": 1306} {"train_loss": -11.383769398643857, "global_step": 219575, "epoch": 1306, "val_loss": 259581.609375} {"train_loss": -10.839937210083008, "global_step": 219576, "epoch": 1307} {"train_loss": -11.276597023010254, "global_step": 219577, "epoch": 1307} {"train_loss": -11.409311294555664, "global_step": 219578, "epoch": 1307} {"train_loss": -10.014518737792969, "global_step": 219579, "epoch": 1307} {"train_loss": -11.310707092285156, "global_step": 219580, "epoch": 1307} {"train_loss": -10.789363861083984, "global_step": 219581, "epoch": 1307} {"train_loss": -11.480936050415039, "global_step": 219582, "epoch": 1307} {"train_loss": -10.762384414672852, "global_step": 219583, "epoch": 1307} {"train_loss": -10.843137741088867, "global_step": 219584, "epoch": 1307} {"train_loss": -11.445013046264648, "global_step": 219585, "epoch": 1307} {"train_loss": -10.305425643920898, "global_step": 219586, "epoch": 1307} {"train_loss": -10.719093322753906, "global_step": 219587, "epoch": 1307} {"train_loss": -11.435006141662598, "global_step": 219588, "epoch": 1307} {"train_loss": -10.277002334594727, "global_step": 219589, "epoch": 1307} {"train_loss": -11.109992980957031, "global_step": 219590, "epoch": 1307} {"train_loss": -9.577747344970703, "global_step": 219591, "epoch": 1307} {"train_loss": -11.305956840515137, "global_step": 219592, "epoch": 1307} {"train_loss": -10.008505821228027, "global_step": 219593, "epoch": 1307} {"train_loss": -11.32950210571289, "global_step": 219594, "epoch": 1307} {"train_loss": -10.185977935791016, "global_step": 219595, "epoch": 1307} {"train_loss": -11.512823104858398, "global_step": 219596, "epoch": 1307} {"train_loss": -9.910411834716797, "global_step": 219597, "epoch": 1307} {"train_loss": -11.467035293579102, "global_step": 219598, "epoch": 1307} {"train_loss": -9.908397674560547, "global_step": 219599, "epoch": 1307} {"train_loss": -11.28314208984375, "global_step": 219600, "epoch": 1307} {"train_loss": -10.338480949401855, "global_step": 219601, "epoch": 1307} {"train_loss": -11.241142272949219, "global_step": 219602, "epoch": 1307} {"train_loss": -10.619011878967285, "global_step": 219603, "epoch": 1307} {"train_loss": -11.33155345916748, "global_step": 219604, "epoch": 1307} {"train_loss": -10.677734375, "global_step": 219605, "epoch": 1307} {"train_loss": -11.105401992797852, "global_step": 219606, "epoch": 1307} {"train_loss": -11.361038208007812, "global_step": 219607, "epoch": 1307} {"train_loss": -10.991769790649414, "global_step": 219608, "epoch": 1307} {"train_loss": -11.366876602172852, "global_step": 219609, "epoch": 1307} {"train_loss": -11.361289978027344, "global_step": 219610, "epoch": 1307} {"train_loss": -11.148691177368164, "global_step": 219611, "epoch": 1307} {"train_loss": -11.123016357421875, "global_step": 219612, "epoch": 1307} {"train_loss": -11.652286529541016, "global_step": 219613, "epoch": 1307} {"train_loss": -11.37432861328125, "global_step": 219614, "epoch": 1307} {"train_loss": -11.589767456054688, "global_step": 219615, "epoch": 1307} {"train_loss": -11.472607612609863, "global_step": 219616, "epoch": 1307} {"train_loss": -11.02474594116211, "global_step": 219617, "epoch": 1307} {"train_loss": -11.465961456298828, "global_step": 219618, "epoch": 1307} {"train_loss": -11.437058448791504, "global_step": 219619, "epoch": 1307} {"train_loss": -11.420467376708984, "global_step": 219620, "epoch": 1307} {"train_loss": -11.223726272583008, "global_step": 219621, "epoch": 1307} {"train_loss": -11.485128402709961, "global_step": 219622, "epoch": 1307} {"train_loss": -11.387472152709961, "global_step": 219623, "epoch": 1307} {"train_loss": -11.386072158813477, "global_step": 219624, "epoch": 1307} {"train_loss": -11.377413749694824, "global_step": 219625, "epoch": 1307} {"train_loss": -11.538628578186035, "global_step": 219626, "epoch": 1307} {"train_loss": -11.478250503540039, "global_step": 219627, "epoch": 1307} {"train_loss": -11.415066719055176, "global_step": 219628, "epoch": 1307} {"train_loss": -11.751709938049316, "global_step": 219629, "epoch": 1307} {"train_loss": -11.415101051330566, "global_step": 219630, "epoch": 1307} {"train_loss": -11.542595863342285, "global_step": 219631, "epoch": 1307} {"train_loss": -11.424674987792969, "global_step": 219632, "epoch": 1307} {"train_loss": -11.738180160522461, "global_step": 219633, "epoch": 1307} {"train_loss": -11.741116523742676, "global_step": 219634, "epoch": 1307} {"train_loss": -11.695030212402344, "global_step": 219635, "epoch": 1307} {"train_loss": -11.497533798217773, "global_step": 219636, "epoch": 1307} {"train_loss": -11.690956115722656, "global_step": 219637, "epoch": 1307} {"train_loss": -11.828346252441406, "global_step": 219638, "epoch": 1307} {"train_loss": -11.794206619262695, "global_step": 219639, "epoch": 1307} {"train_loss": -11.58333683013916, "global_step": 219640, "epoch": 1307} {"train_loss": -11.684845924377441, "global_step": 219641, "epoch": 1307} {"train_loss": -11.584284782409668, "global_step": 219642, "epoch": 1307} {"train_loss": -11.519969940185547, "global_step": 219643, "epoch": 1307} {"train_loss": -11.689031600952148, "global_step": 219644, "epoch": 1307} {"train_loss": -11.183290481567383, "global_step": 219645, "epoch": 1307} {"train_loss": -11.539542198181152, "global_step": 219646, "epoch": 1307} {"train_loss": -11.807783126831055, "global_step": 219647, "epoch": 1307} {"train_loss": -11.532496452331543, "global_step": 219648, "epoch": 1307} {"train_loss": -11.897951126098633, "global_step": 219649, "epoch": 1307} {"train_loss": -11.879918098449707, "global_step": 219650, "epoch": 1307} {"train_loss": -11.70998764038086, "global_step": 219651, "epoch": 1307} {"train_loss": -11.889896392822266, "global_step": 219652, "epoch": 1307} {"train_loss": -11.643848419189453, "global_step": 219653, "epoch": 1307} {"train_loss": -11.907032012939453, "global_step": 219654, "epoch": 1307} {"train_loss": -12.03317928314209, "global_step": 219655, "epoch": 1307} {"train_loss": -11.343999862670898, "global_step": 219656, "epoch": 1307} {"train_loss": -11.816673278808594, "global_step": 219657, "epoch": 1307} {"train_loss": -11.583582878112793, "global_step": 219658, "epoch": 1307} {"train_loss": -11.779096603393555, "global_step": 219659, "epoch": 1307} {"train_loss": -11.828519821166992, "global_step": 219660, "epoch": 1307} {"train_loss": -11.678442001342773, "global_step": 219661, "epoch": 1307} {"train_loss": -11.723426818847656, "global_step": 219662, "epoch": 1307} {"train_loss": -11.865242004394531, "global_step": 219663, "epoch": 1307} {"train_loss": -11.827150344848633, "global_step": 219664, "epoch": 1307} {"train_loss": -11.878594398498535, "global_step": 219665, "epoch": 1307} {"train_loss": -11.848652839660645, "global_step": 219666, "epoch": 1307} {"train_loss": -11.437711715698242, "global_step": 219667, "epoch": 1307} {"train_loss": -11.639120101928711, "global_step": 219668, "epoch": 1307} {"train_loss": -11.391602516174316, "global_step": 219669, "epoch": 1307} {"train_loss": -11.34251880645752, "global_step": 219670, "epoch": 1307} {"train_loss": -11.55015754699707, "global_step": 219671, "epoch": 1307} {"train_loss": -11.464679718017578, "global_step": 219672, "epoch": 1307} {"train_loss": -11.332087516784668, "global_step": 219673, "epoch": 1307} {"train_loss": -11.266366958618164, "global_step": 219674, "epoch": 1307} {"train_loss": -11.444063186645508, "global_step": 219675, "epoch": 1307} {"train_loss": -10.548985481262207, "global_step": 219676, "epoch": 1307} {"train_loss": -11.762929916381836, "global_step": 219677, "epoch": 1307} {"train_loss": -11.274152755737305, "global_step": 219678, "epoch": 1307} {"train_loss": -11.640666007995605, "global_step": 219679, "epoch": 1307} {"train_loss": -10.974763870239258, "global_step": 219680, "epoch": 1307} {"train_loss": -11.367413520812988, "global_step": 219681, "epoch": 1307} {"train_loss": -11.258281707763672, "global_step": 219682, "epoch": 1307} {"train_loss": -10.685997009277344, "global_step": 219683, "epoch": 1307} {"train_loss": -10.816032409667969, "global_step": 219684, "epoch": 1307} {"train_loss": -11.535529136657715, "global_step": 219685, "epoch": 1307} {"train_loss": -11.66323184967041, "global_step": 219686, "epoch": 1307} {"train_loss": -10.777904510498047, "global_step": 219687, "epoch": 1307} {"train_loss": -11.223155975341797, "global_step": 219688, "epoch": 1307} {"train_loss": -11.837451934814453, "global_step": 219689, "epoch": 1307} {"train_loss": -11.503152847290039, "global_step": 219690, "epoch": 1307} {"train_loss": -11.534311294555664, "global_step": 219691, "epoch": 1307} {"train_loss": -11.694329261779785, "global_step": 219692, "epoch": 1307} {"train_loss": -11.641783714294434, "global_step": 219693, "epoch": 1307} {"train_loss": -11.683320999145508, "global_step": 219694, "epoch": 1307} {"train_loss": -11.696691513061523, "global_step": 219695, "epoch": 1307} {"train_loss": -11.510486602783203, "global_step": 219696, "epoch": 1307} {"train_loss": -11.295637130737305, "global_step": 219697, "epoch": 1307} {"train_loss": -11.532312393188477, "global_step": 219698, "epoch": 1307} {"train_loss": -10.753631591796875, "global_step": 219699, "epoch": 1307} {"train_loss": -11.018146514892578, "global_step": 219700, "epoch": 1307} {"train_loss": -11.304194450378418, "global_step": 219701, "epoch": 1307} {"train_loss": -10.71133804321289, "global_step": 219702, "epoch": 1307} {"train_loss": -11.43624496459961, "global_step": 219703, "epoch": 1307} {"train_loss": -10.667497634887695, "global_step": 219704, "epoch": 1307} {"train_loss": -11.140377044677734, "global_step": 219705, "epoch": 1307} {"train_loss": -11.006341934204102, "global_step": 219706, "epoch": 1307} {"train_loss": -11.187627792358398, "global_step": 219707, "epoch": 1307} {"train_loss": -11.518692016601562, "global_step": 219708, "epoch": 1307} {"train_loss": -11.513944625854492, "global_step": 219709, "epoch": 1307} {"train_loss": -11.662714004516602, "global_step": 219710, "epoch": 1307} {"train_loss": -11.291759490966797, "global_step": 219711, "epoch": 1307} {"train_loss": -11.594314575195312, "global_step": 219712, "epoch": 1307} {"train_loss": -11.62220573425293, "global_step": 219713, "epoch": 1307} {"train_loss": -11.640249252319336, "global_step": 219714, "epoch": 1307} {"train_loss": -11.886521339416504, "global_step": 219715, "epoch": 1307} {"train_loss": -11.81924819946289, "global_step": 219716, "epoch": 1307} {"train_loss": -11.694931030273438, "global_step": 219717, "epoch": 1307} {"train_loss": -11.959325790405273, "global_step": 219718, "epoch": 1307} {"train_loss": -11.520280838012695, "global_step": 219719, "epoch": 1307} {"train_loss": -11.664926528930664, "global_step": 219720, "epoch": 1307} {"train_loss": -11.056217193603516, "global_step": 219721, "epoch": 1307} {"train_loss": -11.534906387329102, "global_step": 219722, "epoch": 1307} {"train_loss": -11.655144691467285, "global_step": 219723, "epoch": 1307} {"train_loss": -11.568472862243652, "global_step": 219724, "epoch": 1307} {"train_loss": -11.881401062011719, "global_step": 219725, "epoch": 1307} {"train_loss": -11.37569808959961, "global_step": 219726, "epoch": 1307} {"train_loss": -11.972156524658203, "global_step": 219727, "epoch": 1307} {"train_loss": -11.326546669006348, "global_step": 219728, "epoch": 1307} {"train_loss": -11.673809051513672, "global_step": 219729, "epoch": 1307} {"train_loss": -11.503917694091797, "global_step": 219730, "epoch": 1307} {"train_loss": -11.852968215942383, "global_step": 219731, "epoch": 1307} {"train_loss": -11.636411666870117, "global_step": 219732, "epoch": 1307} {"train_loss": -11.802084922790527, "global_step": 219733, "epoch": 1307} {"train_loss": -11.510923385620117, "global_step": 219734, "epoch": 1307} {"train_loss": -11.984203338623047, "global_step": 219735, "epoch": 1307} {"train_loss": -11.839032173156738, "global_step": 219736, "epoch": 1307} {"train_loss": -11.686958312988281, "global_step": 219737, "epoch": 1307} {"train_loss": -11.785940170288086, "global_step": 219738, "epoch": 1307} {"train_loss": -11.721078872680664, "global_step": 219739, "epoch": 1307} {"train_loss": -11.334732055664062, "global_step": 219740, "epoch": 1307} {"train_loss": -11.704233169555664, "global_step": 219741, "epoch": 1307} {"train_loss": -11.629716873168945, "global_step": 219742, "epoch": 1307} {"train_loss": -11.38694307349977, "global_step": 219743, "epoch": 1307, "val_loss": 259548.359375} {"train_loss": -11.43289566040039, "global_step": 219744, "epoch": 1308} {"train_loss": -11.93771743774414, "global_step": 219745, "epoch": 1308} {"train_loss": -11.419988632202148, "global_step": 219746, "epoch": 1308} {"train_loss": -11.590152740478516, "global_step": 219747, "epoch": 1308} {"train_loss": -11.74968147277832, "global_step": 219748, "epoch": 1308} {"train_loss": -11.544648170471191, "global_step": 219749, "epoch": 1308} {"train_loss": -11.308343887329102, "global_step": 219750, "epoch": 1308} {"train_loss": -11.660645484924316, "global_step": 219751, "epoch": 1308} {"train_loss": -11.7071533203125, "global_step": 219752, "epoch": 1308} {"train_loss": -11.86446762084961, "global_step": 219753, "epoch": 1308} {"train_loss": -11.948020935058594, "global_step": 219754, "epoch": 1308} {"train_loss": -11.93730354309082, "global_step": 219755, "epoch": 1308} {"train_loss": -11.64261245727539, "global_step": 219756, "epoch": 1308} {"train_loss": -11.740154266357422, "global_step": 219757, "epoch": 1308} {"train_loss": -11.798328399658203, "global_step": 219758, "epoch": 1308} {"train_loss": -11.699752807617188, "global_step": 219759, "epoch": 1308} {"train_loss": -11.679360389709473, "global_step": 219760, "epoch": 1308} {"train_loss": -11.892374038696289, "global_step": 219761, "epoch": 1308} {"train_loss": -11.778485298156738, "global_step": 219762, "epoch": 1308} {"train_loss": -11.81169605255127, "global_step": 219763, "epoch": 1308} {"train_loss": -11.903375625610352, "global_step": 219764, "epoch": 1308} {"train_loss": -11.76662826538086, "global_step": 219765, "epoch": 1308} {"train_loss": -11.243169784545898, "global_step": 219766, "epoch": 1308} {"train_loss": -11.518867492675781, "global_step": 219767, "epoch": 1308} {"train_loss": -12.097391128540039, "global_step": 219768, "epoch": 1308} {"train_loss": -11.884069442749023, "global_step": 219769, "epoch": 1308} {"train_loss": -11.456313133239746, "global_step": 219770, "epoch": 1308} {"train_loss": -11.848015785217285, "global_step": 219771, "epoch": 1308} {"train_loss": -11.524932861328125, "global_step": 219772, "epoch": 1308} {"train_loss": -11.820465087890625, "global_step": 219773, "epoch": 1308} {"train_loss": -11.66951847076416, "global_step": 219774, "epoch": 1308} {"train_loss": -11.676597595214844, "global_step": 219775, "epoch": 1308} {"train_loss": -11.704388618469238, "global_step": 219776, "epoch": 1308} {"train_loss": -11.54598331451416, "global_step": 219777, "epoch": 1308} {"train_loss": -11.854142189025879, "global_step": 219778, "epoch": 1308} {"train_loss": -11.35634994506836, "global_step": 219779, "epoch": 1308} {"train_loss": -11.017250061035156, "global_step": 219780, "epoch": 1308} {"train_loss": -11.205499649047852, "global_step": 219781, "epoch": 1308} {"train_loss": -11.383570671081543, "global_step": 219782, "epoch": 1308} {"train_loss": -11.641409873962402, "global_step": 219783, "epoch": 1308} {"train_loss": -11.765724182128906, "global_step": 219784, "epoch": 1308} {"train_loss": -11.175470352172852, "global_step": 219785, "epoch": 1308} {"train_loss": -11.807992935180664, "global_step": 219786, "epoch": 1308} {"train_loss": -11.264265060424805, "global_step": 219787, "epoch": 1308} {"train_loss": -9.804323196411133, "global_step": 219788, "epoch": 1308} {"train_loss": -11.317164421081543, "global_step": 219789, "epoch": 1308} {"train_loss": -10.838966369628906, "global_step": 219790, "epoch": 1308} {"train_loss": -10.288923263549805, "global_step": 219791, "epoch": 1308} {"train_loss": -10.484872817993164, "global_step": 219792, "epoch": 1308} {"train_loss": -10.26834487915039, "global_step": 219793, "epoch": 1308} {"train_loss": -8.619123458862305, "global_step": 219794, "epoch": 1308} {"train_loss": -10.182563781738281, "global_step": 219795, "epoch": 1308} {"train_loss": -8.64267349243164, "global_step": 219796, "epoch": 1308} {"train_loss": -10.099676132202148, "global_step": 219797, "epoch": 1308} {"train_loss": -8.262540817260742, "global_step": 219798, "epoch": 1308} {"train_loss": -8.534236907958984, "global_step": 219799, "epoch": 1308} {"train_loss": -8.205015182495117, "global_step": 219800, "epoch": 1308} {"train_loss": -9.370603561401367, "global_step": 219801, "epoch": 1308} {"train_loss": -10.365711212158203, "global_step": 219802, "epoch": 1308} {"train_loss": -9.462623596191406, "global_step": 219803, "epoch": 1308} {"train_loss": -10.42833137512207, "global_step": 219804, "epoch": 1308} {"train_loss": -9.417424201965332, "global_step": 219805, "epoch": 1308} {"train_loss": -9.770875930786133, "global_step": 219806, "epoch": 1308} {"train_loss": -10.380901336669922, "global_step": 219807, "epoch": 1308} {"train_loss": -8.995373725891113, "global_step": 219808, "epoch": 1308} {"train_loss": -10.795215606689453, "global_step": 219809, "epoch": 1308} {"train_loss": -9.496042251586914, "global_step": 219810, "epoch": 1308} {"train_loss": -10.561521530151367, "global_step": 219811, "epoch": 1308} {"train_loss": -10.534173011779785, "global_step": 219812, "epoch": 1308} {"train_loss": -10.33425521850586, "global_step": 219813, "epoch": 1308} {"train_loss": -10.73701000213623, "global_step": 219814, "epoch": 1308} {"train_loss": -10.467398643493652, "global_step": 219815, "epoch": 1308} {"train_loss": -11.088895797729492, "global_step": 219816, "epoch": 1308} {"train_loss": -10.878072738647461, "global_step": 219817, "epoch": 1308} {"train_loss": -10.803373336791992, "global_step": 219818, "epoch": 1308} {"train_loss": -11.006120681762695, "global_step": 219819, "epoch": 1308} {"train_loss": -11.043862342834473, "global_step": 219820, "epoch": 1308} {"train_loss": -11.049721717834473, "global_step": 219821, "epoch": 1308} {"train_loss": -11.109088897705078, "global_step": 219822, "epoch": 1308} {"train_loss": -11.299257278442383, "global_step": 219823, "epoch": 1308} {"train_loss": -10.944170951843262, "global_step": 219824, "epoch": 1308} {"train_loss": -11.297380447387695, "global_step": 219825, "epoch": 1308} {"train_loss": -11.07877254486084, "global_step": 219826, "epoch": 1308} {"train_loss": -11.252153396606445, "global_step": 219827, "epoch": 1308} {"train_loss": -11.350976943969727, "global_step": 219828, "epoch": 1308} {"train_loss": -11.116023063659668, "global_step": 219829, "epoch": 1308} {"train_loss": -11.188867568969727, "global_step": 219830, "epoch": 1308} {"train_loss": -11.271024703979492, "global_step": 219831, "epoch": 1308} {"train_loss": -11.140312194824219, "global_step": 219832, "epoch": 1308} {"train_loss": -11.366312026977539, "global_step": 219833, "epoch": 1308} {"train_loss": -11.272603034973145, "global_step": 219834, "epoch": 1308} {"train_loss": -11.268028259277344, "global_step": 219835, "epoch": 1308} {"train_loss": -11.392810821533203, "global_step": 219836, "epoch": 1308} {"train_loss": -11.244513511657715, "global_step": 219837, "epoch": 1308} {"train_loss": -11.242975234985352, "global_step": 219838, "epoch": 1308} {"train_loss": -11.545644760131836, "global_step": 219839, "epoch": 1308} {"train_loss": -11.410530090332031, "global_step": 219840, "epoch": 1308} {"train_loss": -11.50462818145752, "global_step": 219841, "epoch": 1308} {"train_loss": -11.517095565795898, "global_step": 219842, "epoch": 1308} {"train_loss": -11.566271781921387, "global_step": 219843, "epoch": 1308} {"train_loss": -11.62587833404541, "global_step": 219844, "epoch": 1308} {"train_loss": -11.70826530456543, "global_step": 219845, "epoch": 1308} {"train_loss": -11.448077201843262, "global_step": 219846, "epoch": 1308} {"train_loss": -11.651063919067383, "global_step": 219847, "epoch": 1308} {"train_loss": -11.707825660705566, "global_step": 219848, "epoch": 1308} {"train_loss": -11.508014678955078, "global_step": 219849, "epoch": 1308} {"train_loss": -11.824257850646973, "global_step": 219850, "epoch": 1308} {"train_loss": -11.456384658813477, "global_step": 219851, "epoch": 1308} {"train_loss": -11.723464965820312, "global_step": 219852, "epoch": 1308} {"train_loss": -11.650017738342285, "global_step": 219853, "epoch": 1308} {"train_loss": -11.412412643432617, "global_step": 219854, "epoch": 1308} {"train_loss": -11.566957473754883, "global_step": 219855, "epoch": 1308} {"train_loss": -11.764859199523926, "global_step": 219856, "epoch": 1308} {"train_loss": -11.703920364379883, "global_step": 219857, "epoch": 1308} {"train_loss": -11.81631851196289, "global_step": 219858, "epoch": 1308} {"train_loss": -11.731712341308594, "global_step": 219859, "epoch": 1308} {"train_loss": -11.66358757019043, "global_step": 219860, "epoch": 1308} {"train_loss": -11.872180938720703, "global_step": 219861, "epoch": 1308} {"train_loss": -11.897305488586426, "global_step": 219862, "epoch": 1308} {"train_loss": -11.867340087890625, "global_step": 219863, "epoch": 1308} {"train_loss": -11.908927917480469, "global_step": 219864, "epoch": 1308} {"train_loss": -11.841753959655762, "global_step": 219865, "epoch": 1308} {"train_loss": -12.028160095214844, "global_step": 219866, "epoch": 1308} {"train_loss": -11.830438613891602, "global_step": 219867, "epoch": 1308} {"train_loss": -11.886514663696289, "global_step": 219868, "epoch": 1308} {"train_loss": -11.882472038269043, "global_step": 219869, "epoch": 1308} {"train_loss": -11.749526977539062, "global_step": 219870, "epoch": 1308} {"train_loss": -11.767099380493164, "global_step": 219871, "epoch": 1308} {"train_loss": -11.908912658691406, "global_step": 219872, "epoch": 1308} {"train_loss": -11.830812454223633, "global_step": 219873, "epoch": 1308} {"train_loss": -11.794224739074707, "global_step": 219874, "epoch": 1308} {"train_loss": -11.975770950317383, "global_step": 219875, "epoch": 1308} {"train_loss": -11.681558609008789, "global_step": 219876, "epoch": 1308} {"train_loss": -11.921735763549805, "global_step": 219877, "epoch": 1308} {"train_loss": -11.910157203674316, "global_step": 219878, "epoch": 1308} {"train_loss": -11.529390335083008, "global_step": 219879, "epoch": 1308} {"train_loss": -11.881261825561523, "global_step": 219880, "epoch": 1308} {"train_loss": -11.891674995422363, "global_step": 219881, "epoch": 1308} {"train_loss": -11.457714080810547, "global_step": 219882, "epoch": 1308} {"train_loss": -11.357498168945312, "global_step": 219883, "epoch": 1308} {"train_loss": -11.880104064941406, "global_step": 219884, "epoch": 1308} {"train_loss": -11.206267356872559, "global_step": 219885, "epoch": 1308} {"train_loss": -11.740031242370605, "global_step": 219886, "epoch": 1308} {"train_loss": -11.43187427520752, "global_step": 219887, "epoch": 1308} {"train_loss": -11.231639862060547, "global_step": 219888, "epoch": 1308} {"train_loss": -11.117792129516602, "global_step": 219889, "epoch": 1308} {"train_loss": -10.748041152954102, "global_step": 219890, "epoch": 1308} {"train_loss": -9.13612174987793, "global_step": 219891, "epoch": 1308} {"train_loss": -10.145225524902344, "global_step": 219892, "epoch": 1308} {"train_loss": -11.180810928344727, "global_step": 219893, "epoch": 1308} {"train_loss": -7.249045372009277, "global_step": 219894, "epoch": 1308} {"train_loss": -11.040506362915039, "global_step": 219895, "epoch": 1308} {"train_loss": -7.645829200744629, "global_step": 219896, "epoch": 1308} {"train_loss": -7.392884731292725, "global_step": 219897, "epoch": 1308} {"train_loss": -8.987785339355469, "global_step": 219898, "epoch": 1308} {"train_loss": -8.834139823913574, "global_step": 219899, "epoch": 1308} {"train_loss": -9.55716323852539, "global_step": 219900, "epoch": 1308} {"train_loss": -7.835434913635254, "global_step": 219901, "epoch": 1308} {"train_loss": -7.173825740814209, "global_step": 219902, "epoch": 1308} {"train_loss": -7.661838531494141, "global_step": 219903, "epoch": 1308} {"train_loss": -8.923345565795898, "global_step": 219904, "epoch": 1308} {"train_loss": -8.722015380859375, "global_step": 219905, "epoch": 1308} {"train_loss": -9.089569091796875, "global_step": 219906, "epoch": 1308} {"train_loss": -8.190074920654297, "global_step": 219907, "epoch": 1308} {"train_loss": -9.175704956054688, "global_step": 219908, "epoch": 1308} {"train_loss": -8.857574462890625, "global_step": 219909, "epoch": 1308} {"train_loss": -10.379915237426758, "global_step": 219910, "epoch": 1308} {"train_loss": -10.944719053450084, "global_step": 219911, "epoch": 1308, "val_loss": 251818.8125} {"train_loss": -9.462061882019043, "global_step": 219912, "epoch": 1309} {"train_loss": -10.620317459106445, "global_step": 219913, "epoch": 1309} {"train_loss": -9.772090911865234, "global_step": 219914, "epoch": 1309} {"train_loss": -10.005544662475586, "global_step": 219915, "epoch": 1309} {"train_loss": -10.130123138427734, "global_step": 219916, "epoch": 1309} {"train_loss": -9.383878707885742, "global_step": 219917, "epoch": 1309} {"train_loss": -10.406311988830566, "global_step": 219918, "epoch": 1309} {"train_loss": -9.994400024414062, "global_step": 219919, "epoch": 1309} {"train_loss": -10.658949851989746, "global_step": 219920, "epoch": 1309} {"train_loss": -10.201433181762695, "global_step": 219921, "epoch": 1309} {"train_loss": -10.752115249633789, "global_step": 219922, "epoch": 1309} {"train_loss": -10.727174758911133, "global_step": 219923, "epoch": 1309} {"train_loss": -10.189037322998047, "global_step": 219924, "epoch": 1309} {"train_loss": -11.045764923095703, "global_step": 219925, "epoch": 1309} {"train_loss": -10.92488956451416, "global_step": 219926, "epoch": 1309} {"train_loss": -10.563457489013672, "global_step": 219927, "epoch": 1309} {"train_loss": -10.997591972351074, "global_step": 219928, "epoch": 1309} {"train_loss": -10.992669105529785, "global_step": 219929, "epoch": 1309} {"train_loss": -10.752664566040039, "global_step": 219930, "epoch": 1309} {"train_loss": -11.107965469360352, "global_step": 219931, "epoch": 1309} {"train_loss": -11.140941619873047, "global_step": 219932, "epoch": 1309} {"train_loss": -10.959181785583496, "global_step": 219933, "epoch": 1309} {"train_loss": -11.178749084472656, "global_step": 219934, "epoch": 1309} {"train_loss": -11.187128067016602, "global_step": 219935, "epoch": 1309} {"train_loss": -11.06800365447998, "global_step": 219936, "epoch": 1309} {"train_loss": -11.299415588378906, "global_step": 219937, "epoch": 1309} {"train_loss": -11.298161506652832, "global_step": 219938, "epoch": 1309} {"train_loss": -11.2400541305542, "global_step": 219939, "epoch": 1309} {"train_loss": -11.188592910766602, "global_step": 219940, "epoch": 1309} {"train_loss": -11.454280853271484, "global_step": 219941, "epoch": 1309} {"train_loss": -11.46108341217041, "global_step": 219942, "epoch": 1309} {"train_loss": -11.363077163696289, "global_step": 219943, "epoch": 1309} {"train_loss": -11.151605606079102, "global_step": 219944, "epoch": 1309} {"train_loss": -11.527032852172852, "global_step": 219945, "epoch": 1309} {"train_loss": -11.333255767822266, "global_step": 219946, "epoch": 1309} {"train_loss": -11.416044235229492, "global_step": 219947, "epoch": 1309} {"train_loss": -11.50262451171875, "global_step": 219948, "epoch": 1309} {"train_loss": -11.522284507751465, "global_step": 219949, "epoch": 1309} {"train_loss": -11.468719482421875, "global_step": 219950, "epoch": 1309} {"train_loss": -11.4471435546875, "global_step": 219951, "epoch": 1309} {"train_loss": -11.52166748046875, "global_step": 219952, "epoch": 1309} {"train_loss": -11.455634117126465, "global_step": 219953, "epoch": 1309} {"train_loss": -11.447996139526367, "global_step": 219954, "epoch": 1309} {"train_loss": -11.561193466186523, "global_step": 219955, "epoch": 1309} {"train_loss": -11.419820785522461, "global_step": 219956, "epoch": 1309} {"train_loss": -11.56906509399414, "global_step": 219957, "epoch": 1309} {"train_loss": -11.475778579711914, "global_step": 219958, "epoch": 1309} {"train_loss": -11.470601081848145, "global_step": 219959, "epoch": 1309} {"train_loss": -11.474903106689453, "global_step": 219960, "epoch": 1309} {"train_loss": -11.519993782043457, "global_step": 219961, "epoch": 1309} {"train_loss": -11.548385620117188, "global_step": 219962, "epoch": 1309} {"train_loss": -11.5726318359375, "global_step": 219963, "epoch": 1309} {"train_loss": -11.504837036132812, "global_step": 219964, "epoch": 1309} {"train_loss": -11.806455612182617, "global_step": 219965, "epoch": 1309} {"train_loss": -11.605356216430664, "global_step": 219966, "epoch": 1309} {"train_loss": -11.558988571166992, "global_step": 219967, "epoch": 1309} {"train_loss": -11.600576400756836, "global_step": 219968, "epoch": 1309} {"train_loss": -11.794870376586914, "global_step": 219969, "epoch": 1309} {"train_loss": -11.895807266235352, "global_step": 219970, "epoch": 1309} {"train_loss": -11.730266571044922, "global_step": 219971, "epoch": 1309} {"train_loss": -11.76860523223877, "global_step": 219972, "epoch": 1309} {"train_loss": -11.702293395996094, "global_step": 219973, "epoch": 1309} {"train_loss": -11.847248077392578, "global_step": 219974, "epoch": 1309} {"train_loss": -11.759697914123535, "global_step": 219975, "epoch": 1309} {"train_loss": -11.710942268371582, "global_step": 219976, "epoch": 1309} {"train_loss": -11.813436508178711, "global_step": 219977, "epoch": 1309} {"train_loss": -11.87274169921875, "global_step": 219978, "epoch": 1309} {"train_loss": -11.90338134765625, "global_step": 219979, "epoch": 1309} {"train_loss": -11.786905288696289, "global_step": 219980, "epoch": 1309} {"train_loss": -11.904820442199707, "global_step": 219981, "epoch": 1309} {"train_loss": -11.844953536987305, "global_step": 219982, "epoch": 1309} {"train_loss": -12.020509719848633, "global_step": 219983, "epoch": 1309} {"train_loss": -11.781576156616211, "global_step": 219984, "epoch": 1309} {"train_loss": -11.949416160583496, "global_step": 219985, "epoch": 1309} {"train_loss": -12.024434089660645, "global_step": 219986, "epoch": 1309} {"train_loss": -11.898646354675293, "global_step": 219987, "epoch": 1309} {"train_loss": -11.918288230895996, "global_step": 219988, "epoch": 1309} {"train_loss": -12.031265258789062, "global_step": 219989, "epoch": 1309} {"train_loss": -11.92119026184082, "global_step": 219990, "epoch": 1309} {"train_loss": -11.945143699645996, "global_step": 219991, "epoch": 1309} {"train_loss": -11.966312408447266, "global_step": 219992, "epoch": 1309} {"train_loss": -12.049158096313477, "global_step": 219993, "epoch": 1309} {"train_loss": -11.971231460571289, "global_step": 219994, "epoch": 1309} {"train_loss": -12.050889015197754, "global_step": 219995, "epoch": 1309} {"train_loss": -12.069367408752441, "global_step": 219996, "epoch": 1309} {"train_loss": -12.094752311706543, "global_step": 219997, "epoch": 1309} {"train_loss": -12.046380996704102, "global_step": 219998, "epoch": 1309} {"train_loss": -11.77543830871582, "global_step": 219999, "epoch": 1309} {"train_loss": -11.870943069458008, "global_step": 220000, "epoch": 1309} {"train_loss": -12.15146255493164, "global_step": 220001, "epoch": 1309} {"train_loss": -11.888016700744629, "global_step": 220002, "epoch": 1309} {"train_loss": -12.104552268981934, "global_step": 220003, "epoch": 1309} {"train_loss": -11.646018981933594, "global_step": 220004, "epoch": 1309} {"train_loss": -10.664135932922363, "global_step": 220005, "epoch": 1309} {"train_loss": -11.668673515319824, "global_step": 220006, "epoch": 1309} {"train_loss": -11.845542907714844, "global_step": 220007, "epoch": 1309} {"train_loss": -10.428655624389648, "global_step": 220008, "epoch": 1309} {"train_loss": -7.763442039489746, "global_step": 220009, "epoch": 1309} {"train_loss": -10.934808731079102, "global_step": 220010, "epoch": 1309} {"train_loss": -10.506461143493652, "global_step": 220011, "epoch": 1309} {"train_loss": -9.239654541015625, "global_step": 220012, "epoch": 1309} {"train_loss": -9.878204345703125, "global_step": 220013, "epoch": 1309} {"train_loss": -11.648393630981445, "global_step": 220014, "epoch": 1309} {"train_loss": -9.356025695800781, "global_step": 220015, "epoch": 1309} {"train_loss": -9.207907676696777, "global_step": 220016, "epoch": 1309} {"train_loss": -11.019328117370605, "global_step": 220017, "epoch": 1309} {"train_loss": -8.65622329711914, "global_step": 220018, "epoch": 1309} {"train_loss": -10.10667896270752, "global_step": 220019, "epoch": 1309} {"train_loss": -11.098443984985352, "global_step": 220020, "epoch": 1309} {"train_loss": -9.830848693847656, "global_step": 220021, "epoch": 1309} {"train_loss": -10.52676010131836, "global_step": 220022, "epoch": 1309} {"train_loss": -9.880178451538086, "global_step": 220023, "epoch": 1309} {"train_loss": -11.133596420288086, "global_step": 220024, "epoch": 1309} {"train_loss": -10.919076919555664, "global_step": 220025, "epoch": 1309} {"train_loss": -11.198160171508789, "global_step": 220026, "epoch": 1309} {"train_loss": -10.548508644104004, "global_step": 220027, "epoch": 1309} {"train_loss": -11.219456672668457, "global_step": 220028, "epoch": 1309} {"train_loss": -10.697004318237305, "global_step": 220029, "epoch": 1309} {"train_loss": -10.973769187927246, "global_step": 220030, "epoch": 1309} {"train_loss": -11.084970474243164, "global_step": 220031, "epoch": 1309} {"train_loss": -10.875625610351562, "global_step": 220032, "epoch": 1309} {"train_loss": -10.608640670776367, "global_step": 220033, "epoch": 1309} {"train_loss": -11.065648078918457, "global_step": 220034, "epoch": 1309} {"train_loss": -10.30180549621582, "global_step": 220035, "epoch": 1309} {"train_loss": -11.261531829833984, "global_step": 220036, "epoch": 1309} {"train_loss": -10.681178092956543, "global_step": 220037, "epoch": 1309} {"train_loss": -10.939494132995605, "global_step": 220038, "epoch": 1309} {"train_loss": -10.456592559814453, "global_step": 220039, "epoch": 1309} {"train_loss": -11.135628700256348, "global_step": 220040, "epoch": 1309} {"train_loss": -10.206439971923828, "global_step": 220041, "epoch": 1309} {"train_loss": -11.407838821411133, "global_step": 220042, "epoch": 1309} {"train_loss": -10.75306510925293, "global_step": 220043, "epoch": 1309} {"train_loss": -11.429563522338867, "global_step": 220044, "epoch": 1309} {"train_loss": -10.963859558105469, "global_step": 220045, "epoch": 1309} {"train_loss": -11.200050354003906, "global_step": 220046, "epoch": 1309} {"train_loss": -11.032318115234375, "global_step": 220047, "epoch": 1309} {"train_loss": -10.910024642944336, "global_step": 220048, "epoch": 1309} {"train_loss": -11.023760795593262, "global_step": 220049, "epoch": 1309} {"train_loss": -11.233606338500977, "global_step": 220050, "epoch": 1309} {"train_loss": -11.184103965759277, "global_step": 220051, "epoch": 1309} {"train_loss": -11.158650398254395, "global_step": 220052, "epoch": 1309} {"train_loss": -11.240884780883789, "global_step": 220053, "epoch": 1309} {"train_loss": -11.163293838500977, "global_step": 220054, "epoch": 1309} {"train_loss": -11.293750762939453, "global_step": 220055, "epoch": 1309} {"train_loss": -11.236662864685059, "global_step": 220056, "epoch": 1309} {"train_loss": -11.184342384338379, "global_step": 220057, "epoch": 1309} {"train_loss": -11.462308883666992, "global_step": 220058, "epoch": 1309} {"train_loss": -11.302422523498535, "global_step": 220059, "epoch": 1309} {"train_loss": -11.340728759765625, "global_step": 220060, "epoch": 1309} {"train_loss": -11.394163131713867, "global_step": 220061, "epoch": 1309} {"train_loss": -11.532666206359863, "global_step": 220062, "epoch": 1309} {"train_loss": -11.349035263061523, "global_step": 220063, "epoch": 1309} {"train_loss": -11.386726379394531, "global_step": 220064, "epoch": 1309} {"train_loss": -11.33163070678711, "global_step": 220065, "epoch": 1309} {"train_loss": -11.534893035888672, "global_step": 220066, "epoch": 1309} {"train_loss": -11.444190979003906, "global_step": 220067, "epoch": 1309} {"train_loss": -11.56919002532959, "global_step": 220068, "epoch": 1309} {"train_loss": -11.574797630310059, "global_step": 220069, "epoch": 1309} {"train_loss": -11.670036315917969, "global_step": 220070, "epoch": 1309} {"train_loss": -11.600957870483398, "global_step": 220071, "epoch": 1309} {"train_loss": -11.335931777954102, "global_step": 220072, "epoch": 1309} {"train_loss": -11.609085083007812, "global_step": 220073, "epoch": 1309} {"train_loss": -11.513906478881836, "global_step": 220074, "epoch": 1309} {"train_loss": -11.633066177368164, "global_step": 220075, "epoch": 1309} {"train_loss": -11.785211563110352, "global_step": 220076, "epoch": 1309} {"train_loss": -11.565570831298828, "global_step": 220077, "epoch": 1309} {"train_loss": -11.684965133666992, "global_step": 220078, "epoch": 1309} {"train_loss": -11.195860391571408, "global_step": 220079, "epoch": 1309, "val_loss": 256765.71875} {"train_loss": -11.425291061401367, "global_step": 220080, "epoch": 1310} {"train_loss": -11.960843086242676, "global_step": 220081, "epoch": 1310} {"train_loss": -11.82862663269043, "global_step": 220082, "epoch": 1310} {"train_loss": -11.835809707641602, "global_step": 220083, "epoch": 1310} {"train_loss": -11.462453842163086, "global_step": 220084, "epoch": 1310} {"train_loss": -11.804917335510254, "global_step": 220085, "epoch": 1310} {"train_loss": -11.498815536499023, "global_step": 220086, "epoch": 1310} {"train_loss": -11.845831871032715, "global_step": 220087, "epoch": 1310} {"train_loss": -11.912379264831543, "global_step": 220088, "epoch": 1310} {"train_loss": -11.675811767578125, "global_step": 220089, "epoch": 1310} {"train_loss": -11.890653610229492, "global_step": 220090, "epoch": 1310} {"train_loss": -11.557282447814941, "global_step": 220091, "epoch": 1310} {"train_loss": -11.875346183776855, "global_step": 220092, "epoch": 1310} {"train_loss": -11.782159805297852, "global_step": 220093, "epoch": 1310} {"train_loss": -11.755499839782715, "global_step": 220094, "epoch": 1310} {"train_loss": -11.928141593933105, "global_step": 220095, "epoch": 1310} {"train_loss": -11.693103790283203, "global_step": 220096, "epoch": 1310} {"train_loss": -11.935192108154297, "global_step": 220097, "epoch": 1310} {"train_loss": -11.97170639038086, "global_step": 220098, "epoch": 1310} {"train_loss": -12.051958084106445, "global_step": 220099, "epoch": 1310} {"train_loss": -11.916531562805176, "global_step": 220100, "epoch": 1310} {"train_loss": -12.094204902648926, "global_step": 220101, "epoch": 1310} {"train_loss": -11.927011489868164, "global_step": 220102, "epoch": 1310} {"train_loss": -11.959839820861816, "global_step": 220103, "epoch": 1310} {"train_loss": -11.628564834594727, "global_step": 220104, "epoch": 1310} {"train_loss": -11.77195930480957, "global_step": 220105, "epoch": 1310} {"train_loss": -11.867515563964844, "global_step": 220106, "epoch": 1310} {"train_loss": -11.779106140136719, "global_step": 220107, "epoch": 1310} {"train_loss": -11.99000358581543, "global_step": 220108, "epoch": 1310} {"train_loss": -11.820662498474121, "global_step": 220109, "epoch": 1310} {"train_loss": -12.015697479248047, "global_step": 220110, "epoch": 1310} {"train_loss": -11.789345741271973, "global_step": 220111, "epoch": 1310} {"train_loss": -11.938265800476074, "global_step": 220112, "epoch": 1310} {"train_loss": -11.513741493225098, "global_step": 220113, "epoch": 1310} {"train_loss": -11.516166687011719, "global_step": 220114, "epoch": 1310} {"train_loss": -11.661698341369629, "global_step": 220115, "epoch": 1310} {"train_loss": -11.179412841796875, "global_step": 220116, "epoch": 1310} {"train_loss": -11.458292007446289, "global_step": 220117, "epoch": 1310} {"train_loss": -11.574567794799805, "global_step": 220118, "epoch": 1310} {"train_loss": -11.323250770568848, "global_step": 220119, "epoch": 1310} {"train_loss": -11.023031234741211, "global_step": 220120, "epoch": 1310} {"train_loss": -11.471586227416992, "global_step": 220121, "epoch": 1310} {"train_loss": -11.701675415039062, "global_step": 220122, "epoch": 1310} {"train_loss": -11.320268630981445, "global_step": 220123, "epoch": 1310} {"train_loss": -11.04038143157959, "global_step": 220124, "epoch": 1310} {"train_loss": -11.74873161315918, "global_step": 220125, "epoch": 1310} {"train_loss": -11.390091896057129, "global_step": 220126, "epoch": 1310} {"train_loss": -11.796775817871094, "global_step": 220127, "epoch": 1310} {"train_loss": -11.867696762084961, "global_step": 220128, "epoch": 1310} {"train_loss": -11.9115629196167, "global_step": 220129, "epoch": 1310} {"train_loss": -11.469581604003906, "global_step": 220130, "epoch": 1310} {"train_loss": -11.785382270812988, "global_step": 220131, "epoch": 1310} {"train_loss": -11.697477340698242, "global_step": 220132, "epoch": 1310} {"train_loss": -11.71815013885498, "global_step": 220133, "epoch": 1310} {"train_loss": -11.767644882202148, "global_step": 220134, "epoch": 1310} {"train_loss": -11.436527252197266, "global_step": 220135, "epoch": 1310} {"train_loss": -11.46028995513916, "global_step": 220136, "epoch": 1310} {"train_loss": -11.825008392333984, "global_step": 220137, "epoch": 1310} {"train_loss": -11.549263000488281, "global_step": 220138, "epoch": 1310} {"train_loss": -11.662330627441406, "global_step": 220139, "epoch": 1310} {"train_loss": -11.395402908325195, "global_step": 220140, "epoch": 1310} {"train_loss": -11.710226058959961, "global_step": 220141, "epoch": 1310} {"train_loss": -11.89737319946289, "global_step": 220142, "epoch": 1310} {"train_loss": -11.730683326721191, "global_step": 220143, "epoch": 1310} {"train_loss": -11.834031105041504, "global_step": 220144, "epoch": 1310} {"train_loss": -11.8662691116333, "global_step": 220145, "epoch": 1310} {"train_loss": -11.827083587646484, "global_step": 220146, "epoch": 1310} {"train_loss": -11.555782318115234, "global_step": 220147, "epoch": 1310} {"train_loss": -11.760766983032227, "global_step": 220148, "epoch": 1310} {"train_loss": -11.156657218933105, "global_step": 220149, "epoch": 1310} {"train_loss": -11.88125228881836, "global_step": 220150, "epoch": 1310} {"train_loss": -11.463861465454102, "global_step": 220151, "epoch": 1310} {"train_loss": -10.484962463378906, "global_step": 220152, "epoch": 1310} {"train_loss": -9.061107635498047, "global_step": 220153, "epoch": 1310} {"train_loss": -10.02358627319336, "global_step": 220154, "epoch": 1310} {"train_loss": -10.196791648864746, "global_step": 220155, "epoch": 1310} {"train_loss": -8.448705673217773, "global_step": 220156, "epoch": 1310} {"train_loss": -10.113300323486328, "global_step": 220157, "epoch": 1310} {"train_loss": -9.398561477661133, "global_step": 220158, "epoch": 1310} {"train_loss": -11.056499481201172, "global_step": 220159, "epoch": 1310} {"train_loss": -10.767596244812012, "global_step": 220160, "epoch": 1310} {"train_loss": -10.877278327941895, "global_step": 220161, "epoch": 1310} {"train_loss": -11.162906646728516, "global_step": 220162, "epoch": 1310} {"train_loss": -10.372781753540039, "global_step": 220163, "epoch": 1310} {"train_loss": -11.533933639526367, "global_step": 220164, "epoch": 1310} {"train_loss": -10.752401351928711, "global_step": 220165, "epoch": 1310} {"train_loss": -10.765886306762695, "global_step": 220166, "epoch": 1310} {"train_loss": -11.213855743408203, "global_step": 220167, "epoch": 1310} {"train_loss": -11.025382995605469, "global_step": 220168, "epoch": 1310} {"train_loss": -11.243791580200195, "global_step": 220169, "epoch": 1310} {"train_loss": -11.055849075317383, "global_step": 220170, "epoch": 1310} {"train_loss": -11.55962085723877, "global_step": 220171, "epoch": 1310} {"train_loss": -11.050385475158691, "global_step": 220172, "epoch": 1310} {"train_loss": -11.713173866271973, "global_step": 220173, "epoch": 1310} {"train_loss": -11.162742614746094, "global_step": 220174, "epoch": 1310} {"train_loss": -11.36948013305664, "global_step": 220175, "epoch": 1310} {"train_loss": -11.09583854675293, "global_step": 220176, "epoch": 1310} {"train_loss": -11.23597526550293, "global_step": 220177, "epoch": 1310} {"train_loss": -11.20331859588623, "global_step": 220178, "epoch": 1310} {"train_loss": -11.238389015197754, "global_step": 220179, "epoch": 1310} {"train_loss": -11.056745529174805, "global_step": 220180, "epoch": 1310} {"train_loss": -11.232080459594727, "global_step": 220181, "epoch": 1310} {"train_loss": -11.044519424438477, "global_step": 220182, "epoch": 1310} {"train_loss": -11.232250213623047, "global_step": 220183, "epoch": 1310} {"train_loss": -11.098638534545898, "global_step": 220184, "epoch": 1310} {"train_loss": -11.34179401397705, "global_step": 220185, "epoch": 1310} {"train_loss": -11.171923637390137, "global_step": 220186, "epoch": 1310} {"train_loss": -11.336524963378906, "global_step": 220187, "epoch": 1310} {"train_loss": -11.20535659790039, "global_step": 220188, "epoch": 1310} {"train_loss": -11.218671798706055, "global_step": 220189, "epoch": 1310} {"train_loss": -11.234312057495117, "global_step": 220190, "epoch": 1310} {"train_loss": -11.24644947052002, "global_step": 220191, "epoch": 1310} {"train_loss": -11.493755340576172, "global_step": 220192, "epoch": 1310} {"train_loss": -11.340591430664062, "global_step": 220193, "epoch": 1310} {"train_loss": -11.606953620910645, "global_step": 220194, "epoch": 1310} {"train_loss": -11.45966911315918, "global_step": 220195, "epoch": 1310} {"train_loss": -11.561149597167969, "global_step": 220196, "epoch": 1310} {"train_loss": -11.286642074584961, "global_step": 220197, "epoch": 1310} {"train_loss": -11.301660537719727, "global_step": 220198, "epoch": 1310} {"train_loss": -10.847740173339844, "global_step": 220199, "epoch": 1310} {"train_loss": -11.041328430175781, "global_step": 220200, "epoch": 1310} {"train_loss": -10.976068496704102, "global_step": 220201, "epoch": 1310} {"train_loss": -11.496374130249023, "global_step": 220202, "epoch": 1310} {"train_loss": -10.884687423706055, "global_step": 220203, "epoch": 1310} {"train_loss": -11.380681991577148, "global_step": 220204, "epoch": 1310} {"train_loss": -11.147680282592773, "global_step": 220205, "epoch": 1310} {"train_loss": -11.727598190307617, "global_step": 220206, "epoch": 1310} {"train_loss": -11.407350540161133, "global_step": 220207, "epoch": 1310} {"train_loss": -11.609945297241211, "global_step": 220208, "epoch": 1310} {"train_loss": -11.659504890441895, "global_step": 220209, "epoch": 1310} {"train_loss": -11.548356056213379, "global_step": 220210, "epoch": 1310} {"train_loss": -11.53962230682373, "global_step": 220211, "epoch": 1310} {"train_loss": -11.588030815124512, "global_step": 220212, "epoch": 1310} {"train_loss": -11.300225257873535, "global_step": 220213, "epoch": 1310} {"train_loss": -11.755162239074707, "global_step": 220214, "epoch": 1310} {"train_loss": -11.235855102539062, "global_step": 220215, "epoch": 1310} {"train_loss": -11.449089050292969, "global_step": 220216, "epoch": 1310} {"train_loss": -11.583523750305176, "global_step": 220217, "epoch": 1310} {"train_loss": -11.30278205871582, "global_step": 220218, "epoch": 1310} {"train_loss": -11.535674095153809, "global_step": 220219, "epoch": 1310} {"train_loss": -11.503349304199219, "global_step": 220220, "epoch": 1310} {"train_loss": -11.058454513549805, "global_step": 220221, "epoch": 1310} {"train_loss": -11.757551193237305, "global_step": 220222, "epoch": 1310} {"train_loss": -11.286876678466797, "global_step": 220223, "epoch": 1310} {"train_loss": -11.638875961303711, "global_step": 220224, "epoch": 1310} {"train_loss": -11.496294021606445, "global_step": 220225, "epoch": 1310} {"train_loss": -11.630548477172852, "global_step": 220226, "epoch": 1310} {"train_loss": -11.69192886352539, "global_step": 220227, "epoch": 1310} {"train_loss": -11.584199905395508, "global_step": 220228, "epoch": 1310} {"train_loss": -11.779220581054688, "global_step": 220229, "epoch": 1310} {"train_loss": -11.761470794677734, "global_step": 220230, "epoch": 1310} {"train_loss": -11.672887802124023, "global_step": 220231, "epoch": 1310} {"train_loss": -11.514856338500977, "global_step": 220232, "epoch": 1310} {"train_loss": -11.67959976196289, "global_step": 220233, "epoch": 1310} {"train_loss": -11.869242668151855, "global_step": 220234, "epoch": 1310} {"train_loss": -11.784464836120605, "global_step": 220235, "epoch": 1310} {"train_loss": -11.74543285369873, "global_step": 220236, "epoch": 1310} {"train_loss": -11.571011543273926, "global_step": 220237, "epoch": 1310} {"train_loss": -11.812819480895996, "global_step": 220238, "epoch": 1310} {"train_loss": -11.821436882019043, "global_step": 220239, "epoch": 1310} {"train_loss": -11.52269172668457, "global_step": 220240, "epoch": 1310} {"train_loss": -11.931365966796875, "global_step": 220241, "epoch": 1310} {"train_loss": -11.80205249786377, "global_step": 220242, "epoch": 1310} {"train_loss": -11.501991271972656, "global_step": 220243, "epoch": 1310} {"train_loss": -11.638209342956543, "global_step": 220244, "epoch": 1310} {"train_loss": -11.784293174743652, "global_step": 220245, "epoch": 1310} {"train_loss": -11.74616813659668, "global_step": 220246, "epoch": 1310} {"train_loss": -11.44714363416036, "global_step": 220247, "epoch": 1310, "val_loss": 260787.40625, "train_action_mse_error": 2.212691068649292} {"train_loss": -11.799858093261719, "global_step": 220248, "epoch": 1311} {"train_loss": -11.584205627441406, "global_step": 220249, "epoch": 1311} {"train_loss": -11.648202896118164, "global_step": 220250, "epoch": 1311} {"train_loss": -11.441767692565918, "global_step": 220251, "epoch": 1311} {"train_loss": -11.093428611755371, "global_step": 220252, "epoch": 1311} {"train_loss": -11.565444946289062, "global_step": 220253, "epoch": 1311} {"train_loss": -11.754171371459961, "global_step": 220254, "epoch": 1311} {"train_loss": -10.573671340942383, "global_step": 220255, "epoch": 1311} {"train_loss": -10.93690299987793, "global_step": 220256, "epoch": 1311} {"train_loss": -11.534514427185059, "global_step": 220257, "epoch": 1311} {"train_loss": -11.539067268371582, "global_step": 220258, "epoch": 1311} {"train_loss": -11.123409271240234, "global_step": 220259, "epoch": 1311} {"train_loss": -11.852792739868164, "global_step": 220260, "epoch": 1311} {"train_loss": -11.322394371032715, "global_step": 220261, "epoch": 1311} {"train_loss": -10.710890769958496, "global_step": 220262, "epoch": 1311} {"train_loss": -11.538125991821289, "global_step": 220263, "epoch": 1311} {"train_loss": -11.662599563598633, "global_step": 220264, "epoch": 1311} {"train_loss": -9.928020477294922, "global_step": 220265, "epoch": 1311} {"train_loss": -11.39850902557373, "global_step": 220266, "epoch": 1311} {"train_loss": -11.70633316040039, "global_step": 220267, "epoch": 1311} {"train_loss": -10.946708679199219, "global_step": 220268, "epoch": 1311} {"train_loss": -11.50334644317627, "global_step": 220269, "epoch": 1311} {"train_loss": -11.898574829101562, "global_step": 220270, "epoch": 1311} {"train_loss": -11.200632095336914, "global_step": 220271, "epoch": 1311} {"train_loss": -11.67953872680664, "global_step": 220272, "epoch": 1311} {"train_loss": -11.495100021362305, "global_step": 220273, "epoch": 1311} {"train_loss": -11.64804458618164, "global_step": 220274, "epoch": 1311} {"train_loss": -11.77718734741211, "global_step": 220275, "epoch": 1311} {"train_loss": -11.262022972106934, "global_step": 220276, "epoch": 1311} {"train_loss": -11.732526779174805, "global_step": 220277, "epoch": 1311} {"train_loss": -11.52383804321289, "global_step": 220278, "epoch": 1311} {"train_loss": -11.366607666015625, "global_step": 220279, "epoch": 1311} {"train_loss": -11.70345687866211, "global_step": 220280, "epoch": 1311} {"train_loss": -11.743459701538086, "global_step": 220281, "epoch": 1311} {"train_loss": -11.191302299499512, "global_step": 220282, "epoch": 1311} {"train_loss": -11.860751152038574, "global_step": 220283, "epoch": 1311} {"train_loss": -11.519344329833984, "global_step": 220284, "epoch": 1311} {"train_loss": -11.516890525817871, "global_step": 220285, "epoch": 1311} {"train_loss": -11.76273250579834, "global_step": 220286, "epoch": 1311} {"train_loss": -11.610032081604004, "global_step": 220287, "epoch": 1311} {"train_loss": -11.666358947753906, "global_step": 220288, "epoch": 1311} {"train_loss": -11.847590446472168, "global_step": 220289, "epoch": 1311} {"train_loss": -11.647470474243164, "global_step": 220290, "epoch": 1311} {"train_loss": -11.875761032104492, "global_step": 220291, "epoch": 1311} {"train_loss": -11.708980560302734, "global_step": 220292, "epoch": 1311} {"train_loss": -11.862771987915039, "global_step": 220293, "epoch": 1311} {"train_loss": -11.909849166870117, "global_step": 220294, "epoch": 1311} {"train_loss": -11.911771774291992, "global_step": 220295, "epoch": 1311} {"train_loss": -11.820123672485352, "global_step": 220296, "epoch": 1311} {"train_loss": -11.71493148803711, "global_step": 220297, "epoch": 1311} {"train_loss": -11.76812744140625, "global_step": 220298, "epoch": 1311} {"train_loss": -11.882564544677734, "global_step": 220299, "epoch": 1311} {"train_loss": -12.020012855529785, "global_step": 220300, "epoch": 1311} {"train_loss": -11.85235595703125, "global_step": 220301, "epoch": 1311} {"train_loss": -11.909056663513184, "global_step": 220302, "epoch": 1311} {"train_loss": -11.807060241699219, "global_step": 220303, "epoch": 1311} {"train_loss": -12.185142517089844, "global_step": 220304, "epoch": 1311} {"train_loss": -11.791959762573242, "global_step": 220305, "epoch": 1311} {"train_loss": -11.765764236450195, "global_step": 220306, "epoch": 1311} {"train_loss": -11.668721199035645, "global_step": 220307, "epoch": 1311} {"train_loss": -11.55788803100586, "global_step": 220308, "epoch": 1311} {"train_loss": -11.600893020629883, "global_step": 220309, "epoch": 1311} {"train_loss": -11.894733428955078, "global_step": 220310, "epoch": 1311} {"train_loss": -11.292022705078125, "global_step": 220311, "epoch": 1311} {"train_loss": -11.659189224243164, "global_step": 220312, "epoch": 1311} {"train_loss": -11.961980819702148, "global_step": 220313, "epoch": 1311} {"train_loss": -10.968843460083008, "global_step": 220314, "epoch": 1311} {"train_loss": -11.195938110351562, "global_step": 220315, "epoch": 1311} {"train_loss": -11.382379531860352, "global_step": 220316, "epoch": 1311} {"train_loss": -10.232595443725586, "global_step": 220317, "epoch": 1311} {"train_loss": -9.701310157775879, "global_step": 220318, "epoch": 1311} {"train_loss": -10.69652271270752, "global_step": 220319, "epoch": 1311} {"train_loss": -11.297140121459961, "global_step": 220320, "epoch": 1311} {"train_loss": -11.401395797729492, "global_step": 220321, "epoch": 1311} {"train_loss": -10.161922454833984, "global_step": 220322, "epoch": 1311} {"train_loss": -11.67338752746582, "global_step": 220323, "epoch": 1311} {"train_loss": -11.229019165039062, "global_step": 220324, "epoch": 1311} {"train_loss": -11.300276756286621, "global_step": 220325, "epoch": 1311} {"train_loss": -11.420360565185547, "global_step": 220326, "epoch": 1311} {"train_loss": -10.597407341003418, "global_step": 220327, "epoch": 1311} {"train_loss": -11.583003044128418, "global_step": 220328, "epoch": 1311} {"train_loss": -11.26016616821289, "global_step": 220329, "epoch": 1311} {"train_loss": -11.285423278808594, "global_step": 220330, "epoch": 1311} {"train_loss": -11.598976135253906, "global_step": 220331, "epoch": 1311} {"train_loss": -11.096792221069336, "global_step": 220332, "epoch": 1311} {"train_loss": -11.508647918701172, "global_step": 220333, "epoch": 1311} {"train_loss": -11.493927955627441, "global_step": 220334, "epoch": 1311} {"train_loss": -11.177949905395508, "global_step": 220335, "epoch": 1311} {"train_loss": -11.28198528289795, "global_step": 220336, "epoch": 1311} {"train_loss": -11.36113452911377, "global_step": 220337, "epoch": 1311} {"train_loss": -11.35416030883789, "global_step": 220338, "epoch": 1311} {"train_loss": -11.843019485473633, "global_step": 220339, "epoch": 1311} {"train_loss": -11.427261352539062, "global_step": 220340, "epoch": 1311} {"train_loss": -11.585424423217773, "global_step": 220341, "epoch": 1311} {"train_loss": -11.557820320129395, "global_step": 220342, "epoch": 1311} {"train_loss": -11.555472373962402, "global_step": 220343, "epoch": 1311} {"train_loss": -11.551799774169922, "global_step": 220344, "epoch": 1311} {"train_loss": -11.727651596069336, "global_step": 220345, "epoch": 1311} {"train_loss": -11.151445388793945, "global_step": 220346, "epoch": 1311} {"train_loss": -11.402503967285156, "global_step": 220347, "epoch": 1311} {"train_loss": -11.088924407958984, "global_step": 220348, "epoch": 1311} {"train_loss": -11.696632385253906, "global_step": 220349, "epoch": 1311} {"train_loss": -11.422872543334961, "global_step": 220350, "epoch": 1311} {"train_loss": -11.618721008300781, "global_step": 220351, "epoch": 1311} {"train_loss": -11.313849449157715, "global_step": 220352, "epoch": 1311} {"train_loss": -11.62332534790039, "global_step": 220353, "epoch": 1311} {"train_loss": -11.617770195007324, "global_step": 220354, "epoch": 1311} {"train_loss": -11.557428359985352, "global_step": 220355, "epoch": 1311} {"train_loss": -11.469949722290039, "global_step": 220356, "epoch": 1311} {"train_loss": -11.762754440307617, "global_step": 220357, "epoch": 1311} {"train_loss": -11.357559204101562, "global_step": 220358, "epoch": 1311} {"train_loss": -11.62511920928955, "global_step": 220359, "epoch": 1311} {"train_loss": -11.852972030639648, "global_step": 220360, "epoch": 1311} {"train_loss": -11.304696083068848, "global_step": 220361, "epoch": 1311} {"train_loss": -11.646965026855469, "global_step": 220362, "epoch": 1311} {"train_loss": -11.348121643066406, "global_step": 220363, "epoch": 1311} {"train_loss": -11.636341094970703, "global_step": 220364, "epoch": 1311} {"train_loss": -11.16266918182373, "global_step": 220365, "epoch": 1311} {"train_loss": -11.287450790405273, "global_step": 220366, "epoch": 1311} {"train_loss": -11.180656433105469, "global_step": 220367, "epoch": 1311} {"train_loss": -11.300176620483398, "global_step": 220368, "epoch": 1311} {"train_loss": -11.730730056762695, "global_step": 220369, "epoch": 1311} {"train_loss": -11.317611694335938, "global_step": 220370, "epoch": 1311} {"train_loss": -11.587698936462402, "global_step": 220371, "epoch": 1311} {"train_loss": -11.416616439819336, "global_step": 220372, "epoch": 1311} {"train_loss": -11.491205215454102, "global_step": 220373, "epoch": 1311} {"train_loss": -11.417165756225586, "global_step": 220374, "epoch": 1311} {"train_loss": -11.117218017578125, "global_step": 220375, "epoch": 1311} {"train_loss": -11.323700904846191, "global_step": 220376, "epoch": 1311} {"train_loss": -10.844337463378906, "global_step": 220377, "epoch": 1311} {"train_loss": -11.313070297241211, "global_step": 220378, "epoch": 1311} {"train_loss": -10.790563583374023, "global_step": 220379, "epoch": 1311} {"train_loss": -11.265541076660156, "global_step": 220380, "epoch": 1311} {"train_loss": -10.733647346496582, "global_step": 220381, "epoch": 1311} {"train_loss": -10.92225170135498, "global_step": 220382, "epoch": 1311} {"train_loss": -10.82767105102539, "global_step": 220383, "epoch": 1311} {"train_loss": -11.173946380615234, "global_step": 220384, "epoch": 1311} {"train_loss": -10.079872131347656, "global_step": 220385, "epoch": 1311} {"train_loss": -11.324435234069824, "global_step": 220386, "epoch": 1311} {"train_loss": -10.043219566345215, "global_step": 220387, "epoch": 1311} {"train_loss": -11.208162307739258, "global_step": 220388, "epoch": 1311} {"train_loss": -10.313770294189453, "global_step": 220389, "epoch": 1311} {"train_loss": -11.20060920715332, "global_step": 220390, "epoch": 1311} {"train_loss": -11.499014854431152, "global_step": 220391, "epoch": 1311} {"train_loss": -10.967140197753906, "global_step": 220392, "epoch": 1311} {"train_loss": -10.95808219909668, "global_step": 220393, "epoch": 1311} {"train_loss": -11.270837783813477, "global_step": 220394, "epoch": 1311} {"train_loss": -9.922712326049805, "global_step": 220395, "epoch": 1311} {"train_loss": -10.9097318649292, "global_step": 220396, "epoch": 1311} {"train_loss": -10.38793659210205, "global_step": 220397, "epoch": 1311} {"train_loss": -10.317138671875, "global_step": 220398, "epoch": 1311} {"train_loss": -11.108152389526367, "global_step": 220399, "epoch": 1311} {"train_loss": -10.788461685180664, "global_step": 220400, "epoch": 1311} {"train_loss": -10.407610893249512, "global_step": 220401, "epoch": 1311} {"train_loss": -10.664304733276367, "global_step": 220402, "epoch": 1311} {"train_loss": -10.610931396484375, "global_step": 220403, "epoch": 1311} {"train_loss": -9.47651481628418, "global_step": 220404, "epoch": 1311} {"train_loss": -10.958158493041992, "global_step": 220405, "epoch": 1311} {"train_loss": -10.704343795776367, "global_step": 220406, "epoch": 1311} {"train_loss": -10.806532859802246, "global_step": 220407, "epoch": 1311} {"train_loss": -11.00695514678955, "global_step": 220408, "epoch": 1311} {"train_loss": -11.181103706359863, "global_step": 220409, "epoch": 1311} {"train_loss": -10.929338455200195, "global_step": 220410, "epoch": 1311} {"train_loss": -11.28239631652832, "global_step": 220411, "epoch": 1311} {"train_loss": -11.554073333740234, "global_step": 220412, "epoch": 1311} {"train_loss": -11.254695892333984, "global_step": 220413, "epoch": 1311} {"train_loss": -11.324254989624023, "global_step": 220414, "epoch": 1311} {"train_loss": -11.32349639847165, "global_step": 220415, "epoch": 1311, "val_loss": 259560.734375} {"train_loss": -11.339553833007812, "global_step": 220416, "epoch": 1312} {"train_loss": -11.540399551391602, "global_step": 220417, "epoch": 1312} {"train_loss": -11.411218643188477, "global_step": 220418, "epoch": 1312} {"train_loss": -11.624497413635254, "global_step": 220419, "epoch": 1312} {"train_loss": -11.589831352233887, "global_step": 220420, "epoch": 1312} {"train_loss": -11.731708526611328, "global_step": 220421, "epoch": 1312} {"train_loss": -11.470233917236328, "global_step": 220422, "epoch": 1312} {"train_loss": -11.473359107971191, "global_step": 220423, "epoch": 1312} {"train_loss": -11.643044471740723, "global_step": 220424, "epoch": 1312} {"train_loss": -11.696566581726074, "global_step": 220425, "epoch": 1312} {"train_loss": -11.570196151733398, "global_step": 220426, "epoch": 1312} {"train_loss": -11.73922348022461, "global_step": 220427, "epoch": 1312} {"train_loss": -11.699591636657715, "global_step": 220428, "epoch": 1312} {"train_loss": -11.590301513671875, "global_step": 220429, "epoch": 1312} {"train_loss": -11.835887908935547, "global_step": 220430, "epoch": 1312} {"train_loss": -11.700065612792969, "global_step": 220431, "epoch": 1312} {"train_loss": -11.63889217376709, "global_step": 220432, "epoch": 1312} {"train_loss": -11.859153747558594, "global_step": 220433, "epoch": 1312} {"train_loss": -11.7880859375, "global_step": 220434, "epoch": 1312} {"train_loss": -11.80009651184082, "global_step": 220435, "epoch": 1312} {"train_loss": -11.980307579040527, "global_step": 220436, "epoch": 1312} {"train_loss": -11.67470932006836, "global_step": 220437, "epoch": 1312} {"train_loss": -11.839799880981445, "global_step": 220438, "epoch": 1312} {"train_loss": -11.669506072998047, "global_step": 220439, "epoch": 1312} {"train_loss": -11.704917907714844, "global_step": 220440, "epoch": 1312} {"train_loss": -11.535591125488281, "global_step": 220441, "epoch": 1312} {"train_loss": -11.913766860961914, "global_step": 220442, "epoch": 1312} {"train_loss": -11.839499473571777, "global_step": 220443, "epoch": 1312} {"train_loss": -11.666051864624023, "global_step": 220444, "epoch": 1312} {"train_loss": -11.894317626953125, "global_step": 220445, "epoch": 1312} {"train_loss": -11.91932487487793, "global_step": 220446, "epoch": 1312} {"train_loss": -11.973061561584473, "global_step": 220447, "epoch": 1312} {"train_loss": -11.790590286254883, "global_step": 220448, "epoch": 1312} {"train_loss": -11.865427017211914, "global_step": 220449, "epoch": 1312} {"train_loss": -11.872323989868164, "global_step": 220450, "epoch": 1312} {"train_loss": -11.97714614868164, "global_step": 220451, "epoch": 1312} {"train_loss": -12.094457626342773, "global_step": 220452, "epoch": 1312} {"train_loss": -11.981755256652832, "global_step": 220453, "epoch": 1312} {"train_loss": -11.889501571655273, "global_step": 220454, "epoch": 1312} {"train_loss": -11.446624755859375, "global_step": 220455, "epoch": 1312} {"train_loss": -11.437649726867676, "global_step": 220456, "epoch": 1312} {"train_loss": -11.401178359985352, "global_step": 220457, "epoch": 1312} {"train_loss": -11.530177116394043, "global_step": 220458, "epoch": 1312} {"train_loss": -11.268132209777832, "global_step": 220459, "epoch": 1312} {"train_loss": -11.123624801635742, "global_step": 220460, "epoch": 1312} {"train_loss": -11.050434112548828, "global_step": 220461, "epoch": 1312} {"train_loss": -11.544198989868164, "global_step": 220462, "epoch": 1312} {"train_loss": -11.4703369140625, "global_step": 220463, "epoch": 1312} {"train_loss": -10.795476913452148, "global_step": 220464, "epoch": 1312} {"train_loss": -10.201068878173828, "global_step": 220465, "epoch": 1312} {"train_loss": -10.82505989074707, "global_step": 220466, "epoch": 1312} {"train_loss": -11.36601448059082, "global_step": 220467, "epoch": 1312} {"train_loss": -11.577909469604492, "global_step": 220468, "epoch": 1312} {"train_loss": -11.404605865478516, "global_step": 220469, "epoch": 1312} {"train_loss": -11.515588760375977, "global_step": 220470, "epoch": 1312} {"train_loss": -10.89657974243164, "global_step": 220471, "epoch": 1312} {"train_loss": -11.123316764831543, "global_step": 220472, "epoch": 1312} {"train_loss": -11.293249130249023, "global_step": 220473, "epoch": 1312} {"train_loss": -11.13896656036377, "global_step": 220474, "epoch": 1312} {"train_loss": -11.29019832611084, "global_step": 220475, "epoch": 1312} {"train_loss": -10.952655792236328, "global_step": 220476, "epoch": 1312} {"train_loss": -11.548727989196777, "global_step": 220477, "epoch": 1312} {"train_loss": -10.889413833618164, "global_step": 220478, "epoch": 1312} {"train_loss": -11.056564331054688, "global_step": 220479, "epoch": 1312} {"train_loss": -10.716694831848145, "global_step": 220480, "epoch": 1312} {"train_loss": -11.154924392700195, "global_step": 220481, "epoch": 1312} {"train_loss": -10.178627967834473, "global_step": 220482, "epoch": 1312} {"train_loss": -10.843008041381836, "global_step": 220483, "epoch": 1312} {"train_loss": -11.318499565124512, "global_step": 220484, "epoch": 1312} {"train_loss": -11.043107986450195, "global_step": 220485, "epoch": 1312} {"train_loss": -11.448941230773926, "global_step": 220486, "epoch": 1312} {"train_loss": -11.521736145019531, "global_step": 220487, "epoch": 1312} {"train_loss": -11.299241065979004, "global_step": 220488, "epoch": 1312} {"train_loss": -11.700971603393555, "global_step": 220489, "epoch": 1312} {"train_loss": -11.597553253173828, "global_step": 220490, "epoch": 1312} {"train_loss": -11.659076690673828, "global_step": 220491, "epoch": 1312} {"train_loss": -11.534990310668945, "global_step": 220492, "epoch": 1312} {"train_loss": -11.686651229858398, "global_step": 220493, "epoch": 1312} {"train_loss": -11.78585433959961, "global_step": 220494, "epoch": 1312} {"train_loss": -11.541015625, "global_step": 220495, "epoch": 1312} {"train_loss": -11.682775497436523, "global_step": 220496, "epoch": 1312} {"train_loss": -11.829486846923828, "global_step": 220497, "epoch": 1312} {"train_loss": -11.630008697509766, "global_step": 220498, "epoch": 1312} {"train_loss": -11.710947036743164, "global_step": 220499, "epoch": 1312} {"train_loss": -11.495294570922852, "global_step": 220500, "epoch": 1312} {"train_loss": -11.813800811767578, "global_step": 220501, "epoch": 1312} {"train_loss": -11.592045783996582, "global_step": 220502, "epoch": 1312} {"train_loss": -11.559911727905273, "global_step": 220503, "epoch": 1312} {"train_loss": -11.272937774658203, "global_step": 220504, "epoch": 1312} {"train_loss": -11.105525970458984, "global_step": 220505, "epoch": 1312} {"train_loss": -11.501411437988281, "global_step": 220506, "epoch": 1312} {"train_loss": -10.979046821594238, "global_step": 220507, "epoch": 1312} {"train_loss": -11.596282958984375, "global_step": 220508, "epoch": 1312} {"train_loss": -11.688966751098633, "global_step": 220509, "epoch": 1312} {"train_loss": -11.475943565368652, "global_step": 220510, "epoch": 1312} {"train_loss": -11.607383728027344, "global_step": 220511, "epoch": 1312} {"train_loss": -11.348068237304688, "global_step": 220512, "epoch": 1312} {"train_loss": -11.666648864746094, "global_step": 220513, "epoch": 1312} {"train_loss": -10.977683067321777, "global_step": 220514, "epoch": 1312} {"train_loss": -11.82540512084961, "global_step": 220515, "epoch": 1312} {"train_loss": -11.523195266723633, "global_step": 220516, "epoch": 1312} {"train_loss": -11.632463455200195, "global_step": 220517, "epoch": 1312} {"train_loss": -11.32878303527832, "global_step": 220518, "epoch": 1312} {"train_loss": -11.5292387008667, "global_step": 220519, "epoch": 1312} {"train_loss": -11.388736724853516, "global_step": 220520, "epoch": 1312} {"train_loss": -11.513561248779297, "global_step": 220521, "epoch": 1312} {"train_loss": -11.512665748596191, "global_step": 220522, "epoch": 1312} {"train_loss": -11.152036666870117, "global_step": 220523, "epoch": 1312} {"train_loss": -11.683899879455566, "global_step": 220524, "epoch": 1312} {"train_loss": -11.433537483215332, "global_step": 220525, "epoch": 1312} {"train_loss": -11.864034652709961, "global_step": 220526, "epoch": 1312} {"train_loss": -11.59494400024414, "global_step": 220527, "epoch": 1312} {"train_loss": -11.317217826843262, "global_step": 220528, "epoch": 1312} {"train_loss": -11.638940811157227, "global_step": 220529, "epoch": 1312} {"train_loss": -11.48834228515625, "global_step": 220530, "epoch": 1312} {"train_loss": -11.67053508758545, "global_step": 220531, "epoch": 1312} {"train_loss": -11.222563743591309, "global_step": 220532, "epoch": 1312} {"train_loss": -11.474587440490723, "global_step": 220533, "epoch": 1312} {"train_loss": -11.456186294555664, "global_step": 220534, "epoch": 1312} {"train_loss": -11.533491134643555, "global_step": 220535, "epoch": 1312} {"train_loss": -11.830013275146484, "global_step": 220536, "epoch": 1312} {"train_loss": -11.56340503692627, "global_step": 220537, "epoch": 1312} {"train_loss": -11.888813018798828, "global_step": 220538, "epoch": 1312} {"train_loss": -11.814516067504883, "global_step": 220539, "epoch": 1312} {"train_loss": -11.703805923461914, "global_step": 220540, "epoch": 1312} {"train_loss": -11.798981666564941, "global_step": 220541, "epoch": 1312} {"train_loss": -11.924958229064941, "global_step": 220542, "epoch": 1312} {"train_loss": -11.914009094238281, "global_step": 220543, "epoch": 1312} {"train_loss": -11.823999404907227, "global_step": 220544, "epoch": 1312} {"train_loss": -11.860004425048828, "global_step": 220545, "epoch": 1312} {"train_loss": -11.931636810302734, "global_step": 220546, "epoch": 1312} {"train_loss": -11.69369888305664, "global_step": 220547, "epoch": 1312} {"train_loss": -11.958351135253906, "global_step": 220548, "epoch": 1312} {"train_loss": -11.700326919555664, "global_step": 220549, "epoch": 1312} {"train_loss": -11.895719528198242, "global_step": 220550, "epoch": 1312} {"train_loss": -11.817134857177734, "global_step": 220551, "epoch": 1312} {"train_loss": -11.58087158203125, "global_step": 220552, "epoch": 1312} {"train_loss": -11.53828239440918, "global_step": 220553, "epoch": 1312} {"train_loss": -11.796211242675781, "global_step": 220554, "epoch": 1312} {"train_loss": -12.025461196899414, "global_step": 220555, "epoch": 1312} {"train_loss": -12.032927513122559, "global_step": 220556, "epoch": 1312} {"train_loss": -12.065674781799316, "global_step": 220557, "epoch": 1312} {"train_loss": -12.092214584350586, "global_step": 220558, "epoch": 1312} {"train_loss": -12.111316680908203, "global_step": 220559, "epoch": 1312} {"train_loss": -11.91054630279541, "global_step": 220560, "epoch": 1312} {"train_loss": -11.663825988769531, "global_step": 220561, "epoch": 1312} {"train_loss": -11.99535083770752, "global_step": 220562, "epoch": 1312} {"train_loss": -12.121206283569336, "global_step": 220563, "epoch": 1312} {"train_loss": -11.8894624710083, "global_step": 220564, "epoch": 1312} {"train_loss": -11.95897388458252, "global_step": 220565, "epoch": 1312} {"train_loss": -11.927051544189453, "global_step": 220566, "epoch": 1312} {"train_loss": -11.754461288452148, "global_step": 220567, "epoch": 1312} {"train_loss": -12.033032417297363, "global_step": 220568, "epoch": 1312} {"train_loss": -11.838688850402832, "global_step": 220569, "epoch": 1312} {"train_loss": -11.9478759765625, "global_step": 220570, "epoch": 1312} {"train_loss": -11.927181243896484, "global_step": 220571, "epoch": 1312} {"train_loss": -11.95019245147705, "global_step": 220572, "epoch": 1312} {"train_loss": -11.257719993591309, "global_step": 220573, "epoch": 1312} {"train_loss": -11.681825637817383, "global_step": 220574, "epoch": 1312} {"train_loss": -11.96640396118164, "global_step": 220575, "epoch": 1312} {"train_loss": -11.656760215759277, "global_step": 220576, "epoch": 1312} {"train_loss": -11.800490379333496, "global_step": 220577, "epoch": 1312} {"train_loss": -11.928138732910156, "global_step": 220578, "epoch": 1312} {"train_loss": -12.049161911010742, "global_step": 220579, "epoch": 1312} {"train_loss": -11.734384536743164, "global_step": 220580, "epoch": 1312} {"train_loss": -11.49169635772705, "global_step": 220581, "epoch": 1312} {"train_loss": -11.767301559448242, "global_step": 220582, "epoch": 1312} {"train_loss": -11.58511281581152, "global_step": 220583, "epoch": 1312, "val_loss": 262039.9375} {"train_loss": -10.883462905883789, "global_step": 220584, "epoch": 1313} {"train_loss": -10.06092357635498, "global_step": 220585, "epoch": 1313} {"train_loss": -11.37636947631836, "global_step": 220586, "epoch": 1313} {"train_loss": -9.268089294433594, "global_step": 220587, "epoch": 1313} {"train_loss": -10.928241729736328, "global_step": 220588, "epoch": 1313} {"train_loss": -9.784921646118164, "global_step": 220589, "epoch": 1313} {"train_loss": -10.032400131225586, "global_step": 220590, "epoch": 1313} {"train_loss": -11.221481323242188, "global_step": 220591, "epoch": 1313} {"train_loss": -10.512513160705566, "global_step": 220592, "epoch": 1313} {"train_loss": -10.634281158447266, "global_step": 220593, "epoch": 1313} {"train_loss": -11.08868408203125, "global_step": 220594, "epoch": 1313} {"train_loss": -11.222250938415527, "global_step": 220595, "epoch": 1313} {"train_loss": -11.359085083007812, "global_step": 220596, "epoch": 1313} {"train_loss": -10.630884170532227, "global_step": 220597, "epoch": 1313} {"train_loss": -10.692468643188477, "global_step": 220598, "epoch": 1313} {"train_loss": -9.950359344482422, "global_step": 220599, "epoch": 1313} {"train_loss": -11.08448600769043, "global_step": 220600, "epoch": 1313} {"train_loss": -9.900177955627441, "global_step": 220601, "epoch": 1313} {"train_loss": -10.731832504272461, "global_step": 220602, "epoch": 1313} {"train_loss": -10.273765563964844, "global_step": 220603, "epoch": 1313} {"train_loss": -9.912972450256348, "global_step": 220604, "epoch": 1313} {"train_loss": -11.482868194580078, "global_step": 220605, "epoch": 1313} {"train_loss": -9.956933975219727, "global_step": 220606, "epoch": 1313} {"train_loss": -11.10757827758789, "global_step": 220607, "epoch": 1313} {"train_loss": -10.413854598999023, "global_step": 220608, "epoch": 1313} {"train_loss": -11.031365394592285, "global_step": 220609, "epoch": 1313} {"train_loss": -10.258888244628906, "global_step": 220610, "epoch": 1313} {"train_loss": -10.704564094543457, "global_step": 220611, "epoch": 1313} {"train_loss": -10.474815368652344, "global_step": 220612, "epoch": 1313} {"train_loss": -10.710725784301758, "global_step": 220613, "epoch": 1313} {"train_loss": -11.137260437011719, "global_step": 220614, "epoch": 1313} {"train_loss": -10.734476089477539, "global_step": 220615, "epoch": 1313} {"train_loss": -11.394667625427246, "global_step": 220616, "epoch": 1313} {"train_loss": -11.168733596801758, "global_step": 220617, "epoch": 1313} {"train_loss": -11.270998001098633, "global_step": 220618, "epoch": 1313} {"train_loss": -11.289264678955078, "global_step": 220619, "epoch": 1313} {"train_loss": -11.31296157836914, "global_step": 220620, "epoch": 1313} {"train_loss": -11.467815399169922, "global_step": 220621, "epoch": 1313} {"train_loss": -11.11907958984375, "global_step": 220622, "epoch": 1313} {"train_loss": -11.027547836303711, "global_step": 220623, "epoch": 1313} {"train_loss": -11.47195816040039, "global_step": 220624, "epoch": 1313} {"train_loss": -11.164163589477539, "global_step": 220625, "epoch": 1313} {"train_loss": -11.383301734924316, "global_step": 220626, "epoch": 1313} {"train_loss": -11.188579559326172, "global_step": 220627, "epoch": 1313} {"train_loss": -11.593914985656738, "global_step": 220628, "epoch": 1313} {"train_loss": -11.294025421142578, "global_step": 220629, "epoch": 1313} {"train_loss": -11.299583435058594, "global_step": 220630, "epoch": 1313} {"train_loss": -11.534568786621094, "global_step": 220631, "epoch": 1313} {"train_loss": -11.334678649902344, "global_step": 220632, "epoch": 1313} {"train_loss": -11.52927017211914, "global_step": 220633, "epoch": 1313} {"train_loss": -11.296282768249512, "global_step": 220634, "epoch": 1313} {"train_loss": -11.314579963684082, "global_step": 220635, "epoch": 1313} {"train_loss": -11.167009353637695, "global_step": 220636, "epoch": 1313} {"train_loss": -11.691938400268555, "global_step": 220637, "epoch": 1313} {"train_loss": -11.86307144165039, "global_step": 220638, "epoch": 1313} {"train_loss": -11.430020332336426, "global_step": 220639, "epoch": 1313} {"train_loss": -11.787592887878418, "global_step": 220640, "epoch": 1313} {"train_loss": -11.438835144042969, "global_step": 220641, "epoch": 1313} {"train_loss": -11.632384300231934, "global_step": 220642, "epoch": 1313} {"train_loss": -11.572818756103516, "global_step": 220643, "epoch": 1313} {"train_loss": -11.480513572692871, "global_step": 220644, "epoch": 1313} {"train_loss": -11.637983322143555, "global_step": 220645, "epoch": 1313} {"train_loss": -11.682182312011719, "global_step": 220646, "epoch": 1313} {"train_loss": -11.480520248413086, "global_step": 220647, "epoch": 1313} {"train_loss": -11.593563079833984, "global_step": 220648, "epoch": 1313} {"train_loss": -11.625657081604004, "global_step": 220649, "epoch": 1313} {"train_loss": -11.550060272216797, "global_step": 220650, "epoch": 1313} {"train_loss": -11.653270721435547, "global_step": 220651, "epoch": 1313} {"train_loss": -11.872102737426758, "global_step": 220652, "epoch": 1313} {"train_loss": -11.682717323303223, "global_step": 220653, "epoch": 1313} {"train_loss": -11.861417770385742, "global_step": 220654, "epoch": 1313} {"train_loss": -11.536216735839844, "global_step": 220655, "epoch": 1313} {"train_loss": -11.770986557006836, "global_step": 220656, "epoch": 1313} {"train_loss": -11.742979049682617, "global_step": 220657, "epoch": 1313} {"train_loss": -11.554141998291016, "global_step": 220658, "epoch": 1313} {"train_loss": -11.728124618530273, "global_step": 220659, "epoch": 1313} {"train_loss": -11.876961708068848, "global_step": 220660, "epoch": 1313} {"train_loss": -11.830547332763672, "global_step": 220661, "epoch": 1313} {"train_loss": -11.934211730957031, "global_step": 220662, "epoch": 1313} {"train_loss": -11.821325302124023, "global_step": 220663, "epoch": 1313} {"train_loss": -11.744447708129883, "global_step": 220664, "epoch": 1313} {"train_loss": -11.87482738494873, "global_step": 220665, "epoch": 1313} {"train_loss": -11.777848243713379, "global_step": 220666, "epoch": 1313} {"train_loss": -11.926556587219238, "global_step": 220667, "epoch": 1313} {"train_loss": -11.80785846710205, "global_step": 220668, "epoch": 1313} {"train_loss": -11.778718948364258, "global_step": 220669, "epoch": 1313} {"train_loss": -12.044516563415527, "global_step": 220670, "epoch": 1313} {"train_loss": -12.039830207824707, "global_step": 220671, "epoch": 1313} {"train_loss": -11.940009117126465, "global_step": 220672, "epoch": 1313} {"train_loss": -11.880924224853516, "global_step": 220673, "epoch": 1313} {"train_loss": -11.652826309204102, "global_step": 220674, "epoch": 1313} {"train_loss": -11.936396598815918, "global_step": 220675, "epoch": 1313} {"train_loss": -11.984618186950684, "global_step": 220676, "epoch": 1313} {"train_loss": -11.88637638092041, "global_step": 220677, "epoch": 1313} {"train_loss": -11.78023910522461, "global_step": 220678, "epoch": 1313} {"train_loss": -11.719037055969238, "global_step": 220679, "epoch": 1313} {"train_loss": -11.883874893188477, "global_step": 220680, "epoch": 1313} {"train_loss": -11.656087875366211, "global_step": 220681, "epoch": 1313} {"train_loss": -11.96464729309082, "global_step": 220682, "epoch": 1313} {"train_loss": -11.80919075012207, "global_step": 220683, "epoch": 1313} {"train_loss": -11.441778182983398, "global_step": 220684, "epoch": 1313} {"train_loss": -11.829620361328125, "global_step": 220685, "epoch": 1313} {"train_loss": -11.525775909423828, "global_step": 220686, "epoch": 1313} {"train_loss": -11.452332496643066, "global_step": 220687, "epoch": 1313} {"train_loss": -10.556529998779297, "global_step": 220688, "epoch": 1313} {"train_loss": -11.35911750793457, "global_step": 220689, "epoch": 1313} {"train_loss": -10.563145637512207, "global_step": 220690, "epoch": 1313} {"train_loss": -11.119024276733398, "global_step": 220691, "epoch": 1313} {"train_loss": -10.627245903015137, "global_step": 220692, "epoch": 1313} {"train_loss": -11.34255313873291, "global_step": 220693, "epoch": 1313} {"train_loss": -8.514254570007324, "global_step": 220694, "epoch": 1313} {"train_loss": -11.251479148864746, "global_step": 220695, "epoch": 1313} {"train_loss": -9.364276885986328, "global_step": 220696, "epoch": 1313} {"train_loss": -10.895772933959961, "global_step": 220697, "epoch": 1313} {"train_loss": -10.074281692504883, "global_step": 220698, "epoch": 1313} {"train_loss": -10.063718795776367, "global_step": 220699, "epoch": 1313} {"train_loss": -10.703901290893555, "global_step": 220700, "epoch": 1313} {"train_loss": -10.23999309539795, "global_step": 220701, "epoch": 1313} {"train_loss": -11.32854175567627, "global_step": 220702, "epoch": 1313} {"train_loss": -9.44892692565918, "global_step": 220703, "epoch": 1313} {"train_loss": -11.49838638305664, "global_step": 220704, "epoch": 1313} {"train_loss": -9.861127853393555, "global_step": 220705, "epoch": 1313} {"train_loss": -10.701574325561523, "global_step": 220706, "epoch": 1313} {"train_loss": -11.137740135192871, "global_step": 220707, "epoch": 1313} {"train_loss": -10.698848724365234, "global_step": 220708, "epoch": 1313} {"train_loss": -11.375146865844727, "global_step": 220709, "epoch": 1313} {"train_loss": -11.104105949401855, "global_step": 220710, "epoch": 1313} {"train_loss": -11.283584594726562, "global_step": 220711, "epoch": 1313} {"train_loss": -11.535305976867676, "global_step": 220712, "epoch": 1313} {"train_loss": -10.986615180969238, "global_step": 220713, "epoch": 1313} {"train_loss": -11.91949462890625, "global_step": 220714, "epoch": 1313} {"train_loss": -11.435736656188965, "global_step": 220715, "epoch": 1313} {"train_loss": -11.583984375, "global_step": 220716, "epoch": 1313} {"train_loss": -11.578267097473145, "global_step": 220717, "epoch": 1313} {"train_loss": -11.167603492736816, "global_step": 220718, "epoch": 1313} {"train_loss": -11.637532234191895, "global_step": 220719, "epoch": 1313} {"train_loss": -11.659869194030762, "global_step": 220720, "epoch": 1313} {"train_loss": -11.602836608886719, "global_step": 220721, "epoch": 1313} {"train_loss": -11.623224258422852, "global_step": 220722, "epoch": 1313} {"train_loss": -11.705431938171387, "global_step": 220723, "epoch": 1313} {"train_loss": -11.597516059875488, "global_step": 220724, "epoch": 1313} {"train_loss": -11.850260734558105, "global_step": 220725, "epoch": 1313} {"train_loss": -11.286520004272461, "global_step": 220726, "epoch": 1313} {"train_loss": -11.629297256469727, "global_step": 220727, "epoch": 1313} {"train_loss": -11.630989074707031, "global_step": 220728, "epoch": 1313} {"train_loss": -11.871984481811523, "global_step": 220729, "epoch": 1313} {"train_loss": -11.528877258300781, "global_step": 220730, "epoch": 1313} {"train_loss": -11.351439476013184, "global_step": 220731, "epoch": 1313} {"train_loss": -11.796570777893066, "global_step": 220732, "epoch": 1313} {"train_loss": -11.548290252685547, "global_step": 220733, "epoch": 1313} {"train_loss": -11.763378143310547, "global_step": 220734, "epoch": 1313} {"train_loss": -11.927970886230469, "global_step": 220735, "epoch": 1313} {"train_loss": -11.653238296508789, "global_step": 220736, "epoch": 1313} {"train_loss": -11.80640983581543, "global_step": 220737, "epoch": 1313} {"train_loss": -12.094121932983398, "global_step": 220738, "epoch": 1313} {"train_loss": -11.820804595947266, "global_step": 220739, "epoch": 1313} {"train_loss": -11.967092514038086, "global_step": 220740, "epoch": 1313} {"train_loss": -11.760205268859863, "global_step": 220741, "epoch": 1313} {"train_loss": -11.70179271697998, "global_step": 220742, "epoch": 1313} {"train_loss": -11.939007759094238, "global_step": 220743, "epoch": 1313} {"train_loss": -11.654422760009766, "global_step": 220744, "epoch": 1313} {"train_loss": -11.958464622497559, "global_step": 220745, "epoch": 1313} {"train_loss": -11.883321762084961, "global_step": 220746, "epoch": 1313} {"train_loss": -11.652847290039062, "global_step": 220747, "epoch": 1313} {"train_loss": -11.971768379211426, "global_step": 220748, "epoch": 1313} {"train_loss": -11.83745002746582, "global_step": 220749, "epoch": 1313} {"train_loss": -11.46761703491211, "global_step": 220750, "epoch": 1313} {"train_loss": -11.298324062710716, "global_step": 220751, "epoch": 1313, "val_loss": 253208.359375} {"train_loss": -11.936639785766602, "global_step": 220752, "epoch": 1314} {"train_loss": -11.714893341064453, "global_step": 220753, "epoch": 1314} {"train_loss": -11.711285591125488, "global_step": 220754, "epoch": 1314} {"train_loss": -11.799846649169922, "global_step": 220755, "epoch": 1314} {"train_loss": -11.84054946899414, "global_step": 220756, "epoch": 1314} {"train_loss": -11.52406120300293, "global_step": 220757, "epoch": 1314} {"train_loss": -11.808141708374023, "global_step": 220758, "epoch": 1314} {"train_loss": -11.74156665802002, "global_step": 220759, "epoch": 1314} {"train_loss": -11.465434074401855, "global_step": 220760, "epoch": 1314} {"train_loss": -11.683992385864258, "global_step": 220761, "epoch": 1314} {"train_loss": -11.585674285888672, "global_step": 220762, "epoch": 1314} {"train_loss": -11.733550071716309, "global_step": 220763, "epoch": 1314} {"train_loss": -11.717994689941406, "global_step": 220764, "epoch": 1314} {"train_loss": -11.604156494140625, "global_step": 220765, "epoch": 1314} {"train_loss": -11.7633638381958, "global_step": 220766, "epoch": 1314} {"train_loss": -11.798742294311523, "global_step": 220767, "epoch": 1314} {"train_loss": -11.828563690185547, "global_step": 220768, "epoch": 1314} {"train_loss": -11.227896690368652, "global_step": 220769, "epoch": 1314} {"train_loss": -10.389474868774414, "global_step": 220770, "epoch": 1314} {"train_loss": -11.142889022827148, "global_step": 220771, "epoch": 1314} {"train_loss": -11.244598388671875, "global_step": 220772, "epoch": 1314} {"train_loss": -10.70890998840332, "global_step": 220773, "epoch": 1314} {"train_loss": -9.591726303100586, "global_step": 220774, "epoch": 1314} {"train_loss": -10.503962516784668, "global_step": 220775, "epoch": 1314} {"train_loss": -7.710878372192383, "global_step": 220776, "epoch": 1314} {"train_loss": -7.298584938049316, "global_step": 220777, "epoch": 1314} {"train_loss": -8.020221710205078, "global_step": 220778, "epoch": 1314} {"train_loss": -9.749985694885254, "global_step": 220779, "epoch": 1314} {"train_loss": -8.987812042236328, "global_step": 220780, "epoch": 1314} {"train_loss": -8.704395294189453, "global_step": 220781, "epoch": 1314} {"train_loss": -10.120153427124023, "global_step": 220782, "epoch": 1314} {"train_loss": -9.290473937988281, "global_step": 220783, "epoch": 1314} {"train_loss": -8.656476974487305, "global_step": 220784, "epoch": 1314} {"train_loss": -8.950803756713867, "global_step": 220785, "epoch": 1314} {"train_loss": -10.551971435546875, "global_step": 220786, "epoch": 1314} {"train_loss": -9.145223617553711, "global_step": 220787, "epoch": 1314} {"train_loss": -9.890328407287598, "global_step": 220788, "epoch": 1314} {"train_loss": -10.104639053344727, "global_step": 220789, "epoch": 1314} {"train_loss": -9.543538093566895, "global_step": 220790, "epoch": 1314} {"train_loss": -10.057945251464844, "global_step": 220791, "epoch": 1314} {"train_loss": -10.424224853515625, "global_step": 220792, "epoch": 1314} {"train_loss": -10.289901733398438, "global_step": 220793, "epoch": 1314} {"train_loss": -10.09383773803711, "global_step": 220794, "epoch": 1314} {"train_loss": -10.684109687805176, "global_step": 220795, "epoch": 1314} {"train_loss": -10.008691787719727, "global_step": 220796, "epoch": 1314} {"train_loss": -11.131380081176758, "global_step": 220797, "epoch": 1314} {"train_loss": -9.802504539489746, "global_step": 220798, "epoch": 1314} {"train_loss": -10.877660751342773, "global_step": 220799, "epoch": 1314} {"train_loss": -10.442739486694336, "global_step": 220800, "epoch": 1314} {"train_loss": -10.827116012573242, "global_step": 220801, "epoch": 1314} {"train_loss": -10.712624549865723, "global_step": 220802, "epoch": 1314} {"train_loss": -10.96860122680664, "global_step": 220803, "epoch": 1314} {"train_loss": -10.782720565795898, "global_step": 220804, "epoch": 1314} {"train_loss": -11.119283676147461, "global_step": 220805, "epoch": 1314} {"train_loss": -11.056879043579102, "global_step": 220806, "epoch": 1314} {"train_loss": -10.87112808227539, "global_step": 220807, "epoch": 1314} {"train_loss": -10.75936508178711, "global_step": 220808, "epoch": 1314} {"train_loss": -11.222268104553223, "global_step": 220809, "epoch": 1314} {"train_loss": -11.006059646606445, "global_step": 220810, "epoch": 1314} {"train_loss": -11.013975143432617, "global_step": 220811, "epoch": 1314} {"train_loss": -10.920093536376953, "global_step": 220812, "epoch": 1314} {"train_loss": -10.931541442871094, "global_step": 220813, "epoch": 1314} {"train_loss": -11.023792266845703, "global_step": 220814, "epoch": 1314} {"train_loss": -11.165732383728027, "global_step": 220815, "epoch": 1314} {"train_loss": -11.374146461486816, "global_step": 220816, "epoch": 1314} {"train_loss": -11.152229309082031, "global_step": 220817, "epoch": 1314} {"train_loss": -11.219882011413574, "global_step": 220818, "epoch": 1314} {"train_loss": -11.33074951171875, "global_step": 220819, "epoch": 1314} {"train_loss": -11.187145233154297, "global_step": 220820, "epoch": 1314} {"train_loss": -11.250520706176758, "global_step": 220821, "epoch": 1314} {"train_loss": -11.260647773742676, "global_step": 220822, "epoch": 1314} {"train_loss": -11.236808776855469, "global_step": 220823, "epoch": 1314} {"train_loss": -11.369203567504883, "global_step": 220824, "epoch": 1314} {"train_loss": -11.49090576171875, "global_step": 220825, "epoch": 1314} {"train_loss": -11.52650260925293, "global_step": 220826, "epoch": 1314} {"train_loss": -11.287556648254395, "global_step": 220827, "epoch": 1314} {"train_loss": -11.441831588745117, "global_step": 220828, "epoch": 1314} {"train_loss": -11.46035099029541, "global_step": 220829, "epoch": 1314} {"train_loss": -11.414339065551758, "global_step": 220830, "epoch": 1314} {"train_loss": -11.676376342773438, "global_step": 220831, "epoch": 1314} {"train_loss": -11.488956451416016, "global_step": 220832, "epoch": 1314} {"train_loss": -11.57169246673584, "global_step": 220833, "epoch": 1314} {"train_loss": -11.409597396850586, "global_step": 220834, "epoch": 1314} {"train_loss": -11.566418647766113, "global_step": 220835, "epoch": 1314} {"train_loss": -11.59097671508789, "global_step": 220836, "epoch": 1314} {"train_loss": -11.477304458618164, "global_step": 220837, "epoch": 1314} {"train_loss": -11.733604431152344, "global_step": 220838, "epoch": 1314} {"train_loss": -11.481520652770996, "global_step": 220839, "epoch": 1314} {"train_loss": -11.467117309570312, "global_step": 220840, "epoch": 1314} {"train_loss": -11.5086669921875, "global_step": 220841, "epoch": 1314} {"train_loss": -11.637300491333008, "global_step": 220842, "epoch": 1314} {"train_loss": -11.671321868896484, "global_step": 220843, "epoch": 1314} {"train_loss": -11.358854293823242, "global_step": 220844, "epoch": 1314} {"train_loss": -11.590144157409668, "global_step": 220845, "epoch": 1314} {"train_loss": -11.523824691772461, "global_step": 220846, "epoch": 1314} {"train_loss": -11.865287780761719, "global_step": 220847, "epoch": 1314} {"train_loss": -11.71235179901123, "global_step": 220848, "epoch": 1314} {"train_loss": -11.700883865356445, "global_step": 220849, "epoch": 1314} {"train_loss": -11.681675910949707, "global_step": 220850, "epoch": 1314} {"train_loss": -11.683112144470215, "global_step": 220851, "epoch": 1314} {"train_loss": -11.869956016540527, "global_step": 220852, "epoch": 1314} {"train_loss": -11.682172775268555, "global_step": 220853, "epoch": 1314} {"train_loss": -11.824223518371582, "global_step": 220854, "epoch": 1314} {"train_loss": -11.736141204833984, "global_step": 220855, "epoch": 1314} {"train_loss": -11.667985916137695, "global_step": 220856, "epoch": 1314} {"train_loss": -11.910829544067383, "global_step": 220857, "epoch": 1314} {"train_loss": -11.76558780670166, "global_step": 220858, "epoch": 1314} {"train_loss": -11.961801528930664, "global_step": 220859, "epoch": 1314} {"train_loss": -11.703939437866211, "global_step": 220860, "epoch": 1314} {"train_loss": -11.740015983581543, "global_step": 220861, "epoch": 1314} {"train_loss": -11.929901123046875, "global_step": 220862, "epoch": 1314} {"train_loss": -11.975550651550293, "global_step": 220863, "epoch": 1314} {"train_loss": -11.84822940826416, "global_step": 220864, "epoch": 1314} {"train_loss": -11.814271926879883, "global_step": 220865, "epoch": 1314} {"train_loss": -12.008994102478027, "global_step": 220866, "epoch": 1314} {"train_loss": -11.89613151550293, "global_step": 220867, "epoch": 1314} {"train_loss": -11.710164070129395, "global_step": 220868, "epoch": 1314} {"train_loss": -11.8982572555542, "global_step": 220869, "epoch": 1314} {"train_loss": -11.805977821350098, "global_step": 220870, "epoch": 1314} {"train_loss": -12.045808792114258, "global_step": 220871, "epoch": 1314} {"train_loss": -11.796289443969727, "global_step": 220872, "epoch": 1314} {"train_loss": -11.968887329101562, "global_step": 220873, "epoch": 1314} {"train_loss": -12.066629409790039, "global_step": 220874, "epoch": 1314} {"train_loss": -11.895383834838867, "global_step": 220875, "epoch": 1314} {"train_loss": -11.947711944580078, "global_step": 220876, "epoch": 1314} {"train_loss": -11.977157592773438, "global_step": 220877, "epoch": 1314} {"train_loss": -11.772397994995117, "global_step": 220878, "epoch": 1314} {"train_loss": -11.737051963806152, "global_step": 220879, "epoch": 1314} {"train_loss": -11.857659339904785, "global_step": 220880, "epoch": 1314} {"train_loss": -11.499403953552246, "global_step": 220881, "epoch": 1314} {"train_loss": -11.751338005065918, "global_step": 220882, "epoch": 1314} {"train_loss": -12.000591278076172, "global_step": 220883, "epoch": 1314} {"train_loss": -11.581714630126953, "global_step": 220884, "epoch": 1314} {"train_loss": -11.308015823364258, "global_step": 220885, "epoch": 1314} {"train_loss": -11.469152450561523, "global_step": 220886, "epoch": 1314} {"train_loss": -11.51363754272461, "global_step": 220887, "epoch": 1314} {"train_loss": -11.842887878417969, "global_step": 220888, "epoch": 1314} {"train_loss": -11.311161994934082, "global_step": 220889, "epoch": 1314} {"train_loss": -11.907926559448242, "global_step": 220890, "epoch": 1314} {"train_loss": -12.055747985839844, "global_step": 220891, "epoch": 1314} {"train_loss": -12.005720138549805, "global_step": 220892, "epoch": 1314} {"train_loss": -11.73946762084961, "global_step": 220893, "epoch": 1314} {"train_loss": -11.698028564453125, "global_step": 220894, "epoch": 1314} {"train_loss": -11.577778816223145, "global_step": 220895, "epoch": 1314} {"train_loss": -11.770162582397461, "global_step": 220896, "epoch": 1314} {"train_loss": -11.809968948364258, "global_step": 220897, "epoch": 1314} {"train_loss": -10.739501953125, "global_step": 220898, "epoch": 1314} {"train_loss": -9.919351577758789, "global_step": 220899, "epoch": 1314} {"train_loss": -11.767044067382812, "global_step": 220900, "epoch": 1314} {"train_loss": -11.706809043884277, "global_step": 220901, "epoch": 1314} {"train_loss": -10.909395217895508, "global_step": 220902, "epoch": 1314} {"train_loss": -11.161073684692383, "global_step": 220903, "epoch": 1314} {"train_loss": -11.937255859375, "global_step": 220904, "epoch": 1314} {"train_loss": -11.434671401977539, "global_step": 220905, "epoch": 1314} {"train_loss": -10.097524642944336, "global_step": 220906, "epoch": 1314} {"train_loss": -11.189205169677734, "global_step": 220907, "epoch": 1314} {"train_loss": -11.527730941772461, "global_step": 220908, "epoch": 1314} {"train_loss": -11.652467727661133, "global_step": 220909, "epoch": 1314} {"train_loss": -10.877355575561523, "global_step": 220910, "epoch": 1314} {"train_loss": -11.954569816589355, "global_step": 220911, "epoch": 1314} {"train_loss": -11.210119247436523, "global_step": 220912, "epoch": 1314} {"train_loss": -11.028377532958984, "global_step": 220913, "epoch": 1314} {"train_loss": -11.212318420410156, "global_step": 220914, "epoch": 1314} {"train_loss": -11.486952781677246, "global_step": 220915, "epoch": 1314} {"train_loss": -10.861194610595703, "global_step": 220916, "epoch": 1314} {"train_loss": -11.069952011108398, "global_step": 220917, "epoch": 1314} {"train_loss": -10.659096717834473, "global_step": 220918, "epoch": 1314} {"train_loss": -11.197426154499961, "global_step": 220919, "epoch": 1314, "val_loss": 259899.296875} {"train_loss": -10.202489852905273, "global_step": 220920, "epoch": 1315} {"train_loss": -11.223016738891602, "global_step": 220921, "epoch": 1315} {"train_loss": -9.317090034484863, "global_step": 220922, "epoch": 1315} {"train_loss": -11.243315696716309, "global_step": 220923, "epoch": 1315} {"train_loss": -9.224102973937988, "global_step": 220924, "epoch": 1315} {"train_loss": -10.838115692138672, "global_step": 220925, "epoch": 1315} {"train_loss": -10.482372283935547, "global_step": 220926, "epoch": 1315} {"train_loss": -10.263716697692871, "global_step": 220927, "epoch": 1315} {"train_loss": -10.372239112854004, "global_step": 220928, "epoch": 1315} {"train_loss": -10.549181938171387, "global_step": 220929, "epoch": 1315} {"train_loss": -9.897998809814453, "global_step": 220930, "epoch": 1315} {"train_loss": -11.260153770446777, "global_step": 220931, "epoch": 1315} {"train_loss": -10.352901458740234, "global_step": 220932, "epoch": 1315} {"train_loss": -11.330900192260742, "global_step": 220933, "epoch": 1315} {"train_loss": -11.062548637390137, "global_step": 220934, "epoch": 1315} {"train_loss": -11.285755157470703, "global_step": 220935, "epoch": 1315} {"train_loss": -11.044718742370605, "global_step": 220936, "epoch": 1315} {"train_loss": -10.62263011932373, "global_step": 220937, "epoch": 1315} {"train_loss": -11.144535064697266, "global_step": 220938, "epoch": 1315} {"train_loss": -11.337154388427734, "global_step": 220939, "epoch": 1315} {"train_loss": -10.488765716552734, "global_step": 220940, "epoch": 1315} {"train_loss": -10.884689331054688, "global_step": 220941, "epoch": 1315} {"train_loss": -11.030939102172852, "global_step": 220942, "epoch": 1315} {"train_loss": -11.076780319213867, "global_step": 220943, "epoch": 1315} {"train_loss": -11.410167694091797, "global_step": 220944, "epoch": 1315} {"train_loss": -10.996493339538574, "global_step": 220945, "epoch": 1315} {"train_loss": -11.452842712402344, "global_step": 220946, "epoch": 1315} {"train_loss": -11.058025360107422, "global_step": 220947, "epoch": 1315} {"train_loss": -11.349020004272461, "global_step": 220948, "epoch": 1315} {"train_loss": -11.36503791809082, "global_step": 220949, "epoch": 1315} {"train_loss": -10.987953186035156, "global_step": 220950, "epoch": 1315} {"train_loss": -11.569122314453125, "global_step": 220951, "epoch": 1315} {"train_loss": -10.97504997253418, "global_step": 220952, "epoch": 1315} {"train_loss": -11.518426895141602, "global_step": 220953, "epoch": 1315} {"train_loss": -11.504237174987793, "global_step": 220954, "epoch": 1315} {"train_loss": -11.334226608276367, "global_step": 220955, "epoch": 1315} {"train_loss": -11.663492202758789, "global_step": 220956, "epoch": 1315} {"train_loss": -11.28703784942627, "global_step": 220957, "epoch": 1315} {"train_loss": -11.485244750976562, "global_step": 220958, "epoch": 1315} {"train_loss": -11.103866577148438, "global_step": 220959, "epoch": 1315} {"train_loss": -11.275932312011719, "global_step": 220960, "epoch": 1315} {"train_loss": -11.09154987335205, "global_step": 220961, "epoch": 1315} {"train_loss": -11.407379150390625, "global_step": 220962, "epoch": 1315} {"train_loss": -11.49764633178711, "global_step": 220963, "epoch": 1315} {"train_loss": -11.424824714660645, "global_step": 220964, "epoch": 1315} {"train_loss": -11.47752571105957, "global_step": 220965, "epoch": 1315} {"train_loss": -11.084973335266113, "global_step": 220966, "epoch": 1315} {"train_loss": -11.080802917480469, "global_step": 220967, "epoch": 1315} {"train_loss": -10.47176742553711, "global_step": 220968, "epoch": 1315} {"train_loss": -10.856728553771973, "global_step": 220969, "epoch": 1315} {"train_loss": -11.058937072753906, "global_step": 220970, "epoch": 1315} {"train_loss": -10.088752746582031, "global_step": 220971, "epoch": 1315} {"train_loss": -11.183572769165039, "global_step": 220972, "epoch": 1315} {"train_loss": -10.47810173034668, "global_step": 220973, "epoch": 1315} {"train_loss": -10.550610542297363, "global_step": 220974, "epoch": 1315} {"train_loss": -10.846298217773438, "global_step": 220975, "epoch": 1315} {"train_loss": -10.688453674316406, "global_step": 220976, "epoch": 1315} {"train_loss": -10.748435974121094, "global_step": 220977, "epoch": 1315} {"train_loss": -10.742971420288086, "global_step": 220978, "epoch": 1315} {"train_loss": -10.759361267089844, "global_step": 220979, "epoch": 1315} {"train_loss": -11.257430076599121, "global_step": 220980, "epoch": 1315} {"train_loss": -11.173250198364258, "global_step": 220981, "epoch": 1315} {"train_loss": -11.335390090942383, "global_step": 220982, "epoch": 1315} {"train_loss": -11.174654960632324, "global_step": 220983, "epoch": 1315} {"train_loss": -11.110301971435547, "global_step": 220984, "epoch": 1315} {"train_loss": -11.31069564819336, "global_step": 220985, "epoch": 1315} {"train_loss": -11.093629837036133, "global_step": 220986, "epoch": 1315} {"train_loss": -11.674246788024902, "global_step": 220987, "epoch": 1315} {"train_loss": -11.124970436096191, "global_step": 220988, "epoch": 1315} {"train_loss": -11.313952445983887, "global_step": 220989, "epoch": 1315} {"train_loss": -11.429096221923828, "global_step": 220990, "epoch": 1315} {"train_loss": -11.170467376708984, "global_step": 220991, "epoch": 1315} {"train_loss": -11.454036712646484, "global_step": 220992, "epoch": 1315} {"train_loss": -11.509479522705078, "global_step": 220993, "epoch": 1315} {"train_loss": -11.289006233215332, "global_step": 220994, "epoch": 1315} {"train_loss": -11.487452507019043, "global_step": 220995, "epoch": 1315} {"train_loss": -11.549028396606445, "global_step": 220996, "epoch": 1315} {"train_loss": -11.065435409545898, "global_step": 220997, "epoch": 1315} {"train_loss": -11.652402877807617, "global_step": 220998, "epoch": 1315} {"train_loss": -11.596353530883789, "global_step": 220999, "epoch": 1315} {"train_loss": -11.61275863647461, "global_step": 221000, "epoch": 1315} {"train_loss": -11.512088775634766, "global_step": 221001, "epoch": 1315} {"train_loss": -11.409725189208984, "global_step": 221002, "epoch": 1315} {"train_loss": -11.660258293151855, "global_step": 221003, "epoch": 1315} {"train_loss": -11.57138729095459, "global_step": 221004, "epoch": 1315} {"train_loss": -11.455183982849121, "global_step": 221005, "epoch": 1315} {"train_loss": -11.81840991973877, "global_step": 221006, "epoch": 1315} {"train_loss": -11.6968355178833, "global_step": 221007, "epoch": 1315} {"train_loss": -11.783866882324219, "global_step": 221008, "epoch": 1315} {"train_loss": -11.606956481933594, "global_step": 221009, "epoch": 1315} {"train_loss": -11.74561882019043, "global_step": 221010, "epoch": 1315} {"train_loss": -11.838956832885742, "global_step": 221011, "epoch": 1315} {"train_loss": -11.485773086547852, "global_step": 221012, "epoch": 1315} {"train_loss": -11.925033569335938, "global_step": 221013, "epoch": 1315} {"train_loss": -11.809276580810547, "global_step": 221014, "epoch": 1315} {"train_loss": -11.648452758789062, "global_step": 221015, "epoch": 1315} {"train_loss": -12.023284912109375, "global_step": 221016, "epoch": 1315} {"train_loss": -11.805628776550293, "global_step": 221017, "epoch": 1315} {"train_loss": -11.910204887390137, "global_step": 221018, "epoch": 1315} {"train_loss": -11.933734893798828, "global_step": 221019, "epoch": 1315} {"train_loss": -11.954629898071289, "global_step": 221020, "epoch": 1315} {"train_loss": -11.868538856506348, "global_step": 221021, "epoch": 1315} {"train_loss": -11.915919303894043, "global_step": 221022, "epoch": 1315} {"train_loss": -11.856549263000488, "global_step": 221023, "epoch": 1315} {"train_loss": -11.967510223388672, "global_step": 221024, "epoch": 1315} {"train_loss": -12.023860931396484, "global_step": 221025, "epoch": 1315} {"train_loss": -11.953104019165039, "global_step": 221026, "epoch": 1315} {"train_loss": -11.876705169677734, "global_step": 221027, "epoch": 1315} {"train_loss": -11.894491195678711, "global_step": 221028, "epoch": 1315} {"train_loss": -11.951801300048828, "global_step": 221029, "epoch": 1315} {"train_loss": -11.776870727539062, "global_step": 221030, "epoch": 1315} {"train_loss": -11.912622451782227, "global_step": 221031, "epoch": 1315} {"train_loss": -12.064539909362793, "global_step": 221032, "epoch": 1315} {"train_loss": -11.836502075195312, "global_step": 221033, "epoch": 1315} {"train_loss": -12.141371726989746, "global_step": 221034, "epoch": 1315} {"train_loss": -11.829279899597168, "global_step": 221035, "epoch": 1315} {"train_loss": -11.662708282470703, "global_step": 221036, "epoch": 1315} {"train_loss": -11.870294570922852, "global_step": 221037, "epoch": 1315} {"train_loss": -11.83354377746582, "global_step": 221038, "epoch": 1315} {"train_loss": -11.810272216796875, "global_step": 221039, "epoch": 1315} {"train_loss": -11.692307472229004, "global_step": 221040, "epoch": 1315} {"train_loss": -11.499946594238281, "global_step": 221041, "epoch": 1315} {"train_loss": -11.05428695678711, "global_step": 221042, "epoch": 1315} {"train_loss": -12.005023956298828, "global_step": 221043, "epoch": 1315} {"train_loss": -11.421693801879883, "global_step": 221044, "epoch": 1315} {"train_loss": -11.986352920532227, "global_step": 221045, "epoch": 1315} {"train_loss": -11.452816009521484, "global_step": 221046, "epoch": 1315} {"train_loss": -11.462427139282227, "global_step": 221047, "epoch": 1315} {"train_loss": -11.667278289794922, "global_step": 221048, "epoch": 1315} {"train_loss": -10.953498840332031, "global_step": 221049, "epoch": 1315} {"train_loss": -10.507608413696289, "global_step": 221050, "epoch": 1315} {"train_loss": -11.586219787597656, "global_step": 221051, "epoch": 1315} {"train_loss": -11.05383586883545, "global_step": 221052, "epoch": 1315} {"train_loss": -11.5355224609375, "global_step": 221053, "epoch": 1315} {"train_loss": -11.625900268554688, "global_step": 221054, "epoch": 1315} {"train_loss": -11.291084289550781, "global_step": 221055, "epoch": 1315} {"train_loss": -10.786880493164062, "global_step": 221056, "epoch": 1315} {"train_loss": -9.726724624633789, "global_step": 221057, "epoch": 1315} {"train_loss": -11.114883422851562, "global_step": 221058, "epoch": 1315} {"train_loss": -8.534540176391602, "global_step": 221059, "epoch": 1315} {"train_loss": -9.804980278015137, "global_step": 221060, "epoch": 1315} {"train_loss": -10.73980712890625, "global_step": 221061, "epoch": 1315} {"train_loss": -9.768793106079102, "global_step": 221062, "epoch": 1315} {"train_loss": -10.067912101745605, "global_step": 221063, "epoch": 1315} {"train_loss": -11.405386924743652, "global_step": 221064, "epoch": 1315} {"train_loss": -10.178189277648926, "global_step": 221065, "epoch": 1315} {"train_loss": -11.085103988647461, "global_step": 221066, "epoch": 1315} {"train_loss": -9.673208236694336, "global_step": 221067, "epoch": 1315} {"train_loss": -10.176107406616211, "global_step": 221068, "epoch": 1315} {"train_loss": -10.892717361450195, "global_step": 221069, "epoch": 1315} {"train_loss": -9.294537544250488, "global_step": 221070, "epoch": 1315} {"train_loss": -11.006080627441406, "global_step": 221071, "epoch": 1315} {"train_loss": -10.36906623840332, "global_step": 221072, "epoch": 1315} {"train_loss": -11.228370666503906, "global_step": 221073, "epoch": 1315} {"train_loss": -10.282523155212402, "global_step": 221074, "epoch": 1315} {"train_loss": -11.013101577758789, "global_step": 221075, "epoch": 1315} {"train_loss": -10.014415740966797, "global_step": 221076, "epoch": 1315} {"train_loss": -11.059815406799316, "global_step": 221077, "epoch": 1315} {"train_loss": -10.313024520874023, "global_step": 221078, "epoch": 1315} {"train_loss": -10.878545761108398, "global_step": 221079, "epoch": 1315} {"train_loss": -10.384161949157715, "global_step": 221080, "epoch": 1315} {"train_loss": -11.253936767578125, "global_step": 221081, "epoch": 1315} {"train_loss": -10.499460220336914, "global_step": 221082, "epoch": 1315} {"train_loss": -11.169242858886719, "global_step": 221083, "epoch": 1315} {"train_loss": -10.521352767944336, "global_step": 221084, "epoch": 1315} {"train_loss": -11.290586471557617, "global_step": 221085, "epoch": 1315} {"train_loss": -10.953864097595215, "global_step": 221086, "epoch": 1315} {"train_loss": -11.159815004893712, "global_step": 221087, "epoch": 1315, "val_loss": 253532.359375, "train_action_mse_error": 0.35464954376220703} {"train_loss": -11.148287773132324, "global_step": 221088, "epoch": 1316} {"train_loss": -11.243293762207031, "global_step": 221089, "epoch": 1316} {"train_loss": -11.460149765014648, "global_step": 221090, "epoch": 1316} {"train_loss": -10.982063293457031, "global_step": 221091, "epoch": 1316} {"train_loss": -11.414238929748535, "global_step": 221092, "epoch": 1316} {"train_loss": -11.532175064086914, "global_step": 221093, "epoch": 1316} {"train_loss": -11.091135025024414, "global_step": 221094, "epoch": 1316} {"train_loss": -11.366233825683594, "global_step": 221095, "epoch": 1316} {"train_loss": -11.443981170654297, "global_step": 221096, "epoch": 1316} {"train_loss": -11.580154418945312, "global_step": 221097, "epoch": 1316} {"train_loss": -11.11335563659668, "global_step": 221098, "epoch": 1316} {"train_loss": -11.497302055358887, "global_step": 221099, "epoch": 1316} {"train_loss": -11.359663963317871, "global_step": 221100, "epoch": 1316} {"train_loss": -11.30972957611084, "global_step": 221101, "epoch": 1316} {"train_loss": -11.293340682983398, "global_step": 221102, "epoch": 1316} {"train_loss": -11.32470703125, "global_step": 221103, "epoch": 1316} {"train_loss": -11.508384704589844, "global_step": 221104, "epoch": 1316} {"train_loss": -11.55349349975586, "global_step": 221105, "epoch": 1316} {"train_loss": -11.268997192382812, "global_step": 221106, "epoch": 1316} {"train_loss": -11.662736892700195, "global_step": 221107, "epoch": 1316} {"train_loss": -11.378807067871094, "global_step": 221108, "epoch": 1316} {"train_loss": -11.501014709472656, "global_step": 221109, "epoch": 1316} {"train_loss": -11.595386505126953, "global_step": 221110, "epoch": 1316} {"train_loss": -11.341057777404785, "global_step": 221111, "epoch": 1316} {"train_loss": -11.633706092834473, "global_step": 221112, "epoch": 1316} {"train_loss": -11.637319564819336, "global_step": 221113, "epoch": 1316} {"train_loss": -11.532899856567383, "global_step": 221114, "epoch": 1316} {"train_loss": -11.535465240478516, "global_step": 221115, "epoch": 1316} {"train_loss": -11.798389434814453, "global_step": 221116, "epoch": 1316} {"train_loss": -11.475831985473633, "global_step": 221117, "epoch": 1316} {"train_loss": -11.632499694824219, "global_step": 221118, "epoch": 1316} {"train_loss": -11.730777740478516, "global_step": 221119, "epoch": 1316} {"train_loss": -11.621318817138672, "global_step": 221120, "epoch": 1316} {"train_loss": -11.58688735961914, "global_step": 221121, "epoch": 1316} {"train_loss": -11.85832405090332, "global_step": 221122, "epoch": 1316} {"train_loss": -11.735507011413574, "global_step": 221123, "epoch": 1316} {"train_loss": -11.682560920715332, "global_step": 221124, "epoch": 1316} {"train_loss": -11.623209953308105, "global_step": 221125, "epoch": 1316} {"train_loss": -11.71845531463623, "global_step": 221126, "epoch": 1316} {"train_loss": -11.819918632507324, "global_step": 221127, "epoch": 1316} {"train_loss": -11.770278930664062, "global_step": 221128, "epoch": 1316} {"train_loss": -11.608482360839844, "global_step": 221129, "epoch": 1316} {"train_loss": -11.767045974731445, "global_step": 221130, "epoch": 1316} {"train_loss": -11.874757766723633, "global_step": 221131, "epoch": 1316} {"train_loss": -11.879165649414062, "global_step": 221132, "epoch": 1316} {"train_loss": -11.86424446105957, "global_step": 221133, "epoch": 1316} {"train_loss": -11.945174217224121, "global_step": 221134, "epoch": 1316} {"train_loss": -11.87530517578125, "global_step": 221135, "epoch": 1316} {"train_loss": -11.780937194824219, "global_step": 221136, "epoch": 1316} {"train_loss": -12.105344772338867, "global_step": 221137, "epoch": 1316} {"train_loss": -11.950139045715332, "global_step": 221138, "epoch": 1316} {"train_loss": -11.615306854248047, "global_step": 221139, "epoch": 1316} {"train_loss": -12.060163497924805, "global_step": 221140, "epoch": 1316} {"train_loss": -11.857653617858887, "global_step": 221141, "epoch": 1316} {"train_loss": -11.85503101348877, "global_step": 221142, "epoch": 1316} {"train_loss": -11.835479736328125, "global_step": 221143, "epoch": 1316} {"train_loss": -11.962364196777344, "global_step": 221144, "epoch": 1316} {"train_loss": -11.95824146270752, "global_step": 221145, "epoch": 1316} {"train_loss": -11.67930793762207, "global_step": 221146, "epoch": 1316} {"train_loss": -11.899422645568848, "global_step": 221147, "epoch": 1316} {"train_loss": -11.768089294433594, "global_step": 221148, "epoch": 1316} {"train_loss": -11.945442199707031, "global_step": 221149, "epoch": 1316} {"train_loss": -11.84079360961914, "global_step": 221150, "epoch": 1316} {"train_loss": -11.955156326293945, "global_step": 221151, "epoch": 1316} {"train_loss": -11.998064041137695, "global_step": 221152, "epoch": 1316} {"train_loss": -12.22620964050293, "global_step": 221153, "epoch": 1316} {"train_loss": -11.680703163146973, "global_step": 221154, "epoch": 1316} {"train_loss": -11.992439270019531, "global_step": 221155, "epoch": 1316} {"train_loss": -11.913711547851562, "global_step": 221156, "epoch": 1316} {"train_loss": -11.73774242401123, "global_step": 221157, "epoch": 1316} {"train_loss": -11.833189964294434, "global_step": 221158, "epoch": 1316} {"train_loss": -11.851530075073242, "global_step": 221159, "epoch": 1316} {"train_loss": -11.75016975402832, "global_step": 221160, "epoch": 1316} {"train_loss": -11.560487747192383, "global_step": 221161, "epoch": 1316} {"train_loss": -12.075491905212402, "global_step": 221162, "epoch": 1316} {"train_loss": -11.669239044189453, "global_step": 221163, "epoch": 1316} {"train_loss": -11.385683059692383, "global_step": 221164, "epoch": 1316} {"train_loss": -11.080900192260742, "global_step": 221165, "epoch": 1316} {"train_loss": -11.574844360351562, "global_step": 221166, "epoch": 1316} {"train_loss": -11.866358757019043, "global_step": 221167, "epoch": 1316} {"train_loss": -11.164007186889648, "global_step": 221168, "epoch": 1316} {"train_loss": -8.589685440063477, "global_step": 221169, "epoch": 1316} {"train_loss": -9.584297180175781, "global_step": 221170, "epoch": 1316} {"train_loss": -10.849963188171387, "global_step": 221171, "epoch": 1316} {"train_loss": -8.367681503295898, "global_step": 221172, "epoch": 1316} {"train_loss": -10.70298957824707, "global_step": 221173, "epoch": 1316} {"train_loss": -10.208938598632812, "global_step": 221174, "epoch": 1316} {"train_loss": -8.354113578796387, "global_step": 221175, "epoch": 1316} {"train_loss": -8.17791748046875, "global_step": 221176, "epoch": 1316} {"train_loss": -9.988731384277344, "global_step": 221177, "epoch": 1316} {"train_loss": -9.768285751342773, "global_step": 221178, "epoch": 1316} {"train_loss": -9.758374214172363, "global_step": 221179, "epoch": 1316} {"train_loss": -10.407638549804688, "global_step": 221180, "epoch": 1316} {"train_loss": -9.851934432983398, "global_step": 221181, "epoch": 1316} {"train_loss": -10.280783653259277, "global_step": 221182, "epoch": 1316} {"train_loss": -9.905488014221191, "global_step": 221183, "epoch": 1316} {"train_loss": -10.297367095947266, "global_step": 221184, "epoch": 1316} {"train_loss": -9.381412506103516, "global_step": 221185, "epoch": 1316} {"train_loss": -10.131787300109863, "global_step": 221186, "epoch": 1316} {"train_loss": -9.264491081237793, "global_step": 221187, "epoch": 1316} {"train_loss": -10.218299865722656, "global_step": 221188, "epoch": 1316} {"train_loss": -9.871990203857422, "global_step": 221189, "epoch": 1316} {"train_loss": -9.70248031616211, "global_step": 221190, "epoch": 1316} {"train_loss": -10.675016403198242, "global_step": 221191, "epoch": 1316} {"train_loss": -10.892505645751953, "global_step": 221192, "epoch": 1316} {"train_loss": -10.207988739013672, "global_step": 221193, "epoch": 1316} {"train_loss": -10.39340877532959, "global_step": 221194, "epoch": 1316} {"train_loss": -10.695476531982422, "global_step": 221195, "epoch": 1316} {"train_loss": -9.292722702026367, "global_step": 221196, "epoch": 1316} {"train_loss": -11.134960174560547, "global_step": 221197, "epoch": 1316} {"train_loss": -10.472285270690918, "global_step": 221198, "epoch": 1316} {"train_loss": -10.145331382751465, "global_step": 221199, "epoch": 1316} {"train_loss": -10.446151733398438, "global_step": 221200, "epoch": 1316} {"train_loss": -10.937581062316895, "global_step": 221201, "epoch": 1316} {"train_loss": -9.888529777526855, "global_step": 221202, "epoch": 1316} {"train_loss": -10.716182708740234, "global_step": 221203, "epoch": 1316} {"train_loss": -10.607681274414062, "global_step": 221204, "epoch": 1316} {"train_loss": -10.537322998046875, "global_step": 221205, "epoch": 1316} {"train_loss": -10.578123092651367, "global_step": 221206, "epoch": 1316} {"train_loss": -11.15653133392334, "global_step": 221207, "epoch": 1316} {"train_loss": -10.870317459106445, "global_step": 221208, "epoch": 1316} {"train_loss": -10.481424331665039, "global_step": 221209, "epoch": 1316} {"train_loss": -10.905319213867188, "global_step": 221210, "epoch": 1316} {"train_loss": -11.138248443603516, "global_step": 221211, "epoch": 1316} {"train_loss": -10.371932029724121, "global_step": 221212, "epoch": 1316} {"train_loss": -10.944533348083496, "global_step": 221213, "epoch": 1316} {"train_loss": -10.901420593261719, "global_step": 221214, "epoch": 1316} {"train_loss": -10.72623062133789, "global_step": 221215, "epoch": 1316} {"train_loss": -11.043638229370117, "global_step": 221216, "epoch": 1316} {"train_loss": -11.140398025512695, "global_step": 221217, "epoch": 1316} {"train_loss": -11.032402038574219, "global_step": 221218, "epoch": 1316} {"train_loss": -11.038257598876953, "global_step": 221219, "epoch": 1316} {"train_loss": -11.135526657104492, "global_step": 221220, "epoch": 1316} {"train_loss": -11.102991104125977, "global_step": 221221, "epoch": 1316} {"train_loss": -11.16919994354248, "global_step": 221222, "epoch": 1316} {"train_loss": -11.139555931091309, "global_step": 221223, "epoch": 1316} {"train_loss": -10.945371627807617, "global_step": 221224, "epoch": 1316} {"train_loss": -11.342020988464355, "global_step": 221225, "epoch": 1316} {"train_loss": -11.306462287902832, "global_step": 221226, "epoch": 1316} {"train_loss": -11.292070388793945, "global_step": 221227, "epoch": 1316} {"train_loss": -11.242019653320312, "global_step": 221228, "epoch": 1316} {"train_loss": -11.522647857666016, "global_step": 221229, "epoch": 1316} {"train_loss": -11.442826271057129, "global_step": 221230, "epoch": 1316} {"train_loss": -11.303548812866211, "global_step": 221231, "epoch": 1316} {"train_loss": -11.514678001403809, "global_step": 221232, "epoch": 1316} {"train_loss": -11.212116241455078, "global_step": 221233, "epoch": 1316} {"train_loss": -11.347349166870117, "global_step": 221234, "epoch": 1316} {"train_loss": -11.363943099975586, "global_step": 221235, "epoch": 1316} {"train_loss": -11.387544631958008, "global_step": 221236, "epoch": 1316} {"train_loss": -11.524840354919434, "global_step": 221237, "epoch": 1316} {"train_loss": -11.37589168548584, "global_step": 221238, "epoch": 1316} {"train_loss": -11.515762329101562, "global_step": 221239, "epoch": 1316} {"train_loss": -11.42100715637207, "global_step": 221240, "epoch": 1316} {"train_loss": -11.404603958129883, "global_step": 221241, "epoch": 1316} {"train_loss": -11.474691390991211, "global_step": 221242, "epoch": 1316} {"train_loss": -11.527047157287598, "global_step": 221243, "epoch": 1316} {"train_loss": -11.735921859741211, "global_step": 221244, "epoch": 1316} {"train_loss": -11.653718948364258, "global_step": 221245, "epoch": 1316} {"train_loss": -11.600650787353516, "global_step": 221246, "epoch": 1316} {"train_loss": -11.452080726623535, "global_step": 221247, "epoch": 1316} {"train_loss": -11.528923034667969, "global_step": 221248, "epoch": 1316} {"train_loss": -11.719245910644531, "global_step": 221249, "epoch": 1316} {"train_loss": -11.829482078552246, "global_step": 221250, "epoch": 1316} {"train_loss": -11.80656623840332, "global_step": 221251, "epoch": 1316} {"train_loss": -11.707185745239258, "global_step": 221252, "epoch": 1316} {"train_loss": -11.703741073608398, "global_step": 221253, "epoch": 1316} {"train_loss": -11.911855697631836, "global_step": 221254, "epoch": 1316} {"train_loss": -11.184223214785257, "global_step": 221255, "epoch": 1316, "val_loss": 259146.015625} {"train_loss": -11.739889144897461, "global_step": 221256, "epoch": 1317} {"train_loss": -11.935400009155273, "global_step": 221257, "epoch": 1317} {"train_loss": -11.839982986450195, "global_step": 221258, "epoch": 1317} {"train_loss": -11.63295841217041, "global_step": 221259, "epoch": 1317} {"train_loss": -11.659457206726074, "global_step": 221260, "epoch": 1317} {"train_loss": -11.88412094116211, "global_step": 221261, "epoch": 1317} {"train_loss": -11.72852611541748, "global_step": 221262, "epoch": 1317} {"train_loss": -11.599298477172852, "global_step": 221263, "epoch": 1317} {"train_loss": -11.880859375, "global_step": 221264, "epoch": 1317} {"train_loss": -11.451879501342773, "global_step": 221265, "epoch": 1317} {"train_loss": -11.426498413085938, "global_step": 221266, "epoch": 1317} {"train_loss": -11.898117065429688, "global_step": 221267, "epoch": 1317} {"train_loss": -10.869162559509277, "global_step": 221268, "epoch": 1317} {"train_loss": -11.718770027160645, "global_step": 221269, "epoch": 1317} {"train_loss": -10.966667175292969, "global_step": 221270, "epoch": 1317} {"train_loss": -11.399089813232422, "global_step": 221271, "epoch": 1317} {"train_loss": -11.70692253112793, "global_step": 221272, "epoch": 1317} {"train_loss": -11.09206771850586, "global_step": 221273, "epoch": 1317} {"train_loss": -11.824459075927734, "global_step": 221274, "epoch": 1317} {"train_loss": -11.75676155090332, "global_step": 221275, "epoch": 1317} {"train_loss": -11.306406021118164, "global_step": 221276, "epoch": 1317} {"train_loss": -11.89274787902832, "global_step": 221277, "epoch": 1317} {"train_loss": -11.948070526123047, "global_step": 221278, "epoch": 1317} {"train_loss": -11.735541343688965, "global_step": 221279, "epoch": 1317} {"train_loss": -11.677059173583984, "global_step": 221280, "epoch": 1317} {"train_loss": -11.861593246459961, "global_step": 221281, "epoch": 1317} {"train_loss": -11.667835235595703, "global_step": 221282, "epoch": 1317} {"train_loss": -11.686140060424805, "global_step": 221283, "epoch": 1317} {"train_loss": -12.004830360412598, "global_step": 221284, "epoch": 1317} {"train_loss": -11.767281532287598, "global_step": 221285, "epoch": 1317} {"train_loss": -11.787076950073242, "global_step": 221286, "epoch": 1317} {"train_loss": -11.72119426727295, "global_step": 221287, "epoch": 1317} {"train_loss": -11.981460571289062, "global_step": 221288, "epoch": 1317} {"train_loss": -11.85354995727539, "global_step": 221289, "epoch": 1317} {"train_loss": -11.697280883789062, "global_step": 221290, "epoch": 1317} {"train_loss": -11.826824188232422, "global_step": 221291, "epoch": 1317} {"train_loss": -11.81804084777832, "global_step": 221292, "epoch": 1317} {"train_loss": -11.923260688781738, "global_step": 221293, "epoch": 1317} {"train_loss": -11.891742706298828, "global_step": 221294, "epoch": 1317} {"train_loss": -11.959223747253418, "global_step": 221295, "epoch": 1317} {"train_loss": -11.878076553344727, "global_step": 221296, "epoch": 1317} {"train_loss": -12.03426456451416, "global_step": 221297, "epoch": 1317} {"train_loss": -11.846841812133789, "global_step": 221298, "epoch": 1317} {"train_loss": -11.71579360961914, "global_step": 221299, "epoch": 1317} {"train_loss": -11.913492202758789, "global_step": 221300, "epoch": 1317} {"train_loss": -11.929194450378418, "global_step": 221301, "epoch": 1317} {"train_loss": -11.867877960205078, "global_step": 221302, "epoch": 1317} {"train_loss": -11.750248908996582, "global_step": 221303, "epoch": 1317} {"train_loss": -11.893094062805176, "global_step": 221304, "epoch": 1317} {"train_loss": -11.730990409851074, "global_step": 221305, "epoch": 1317} {"train_loss": -11.641427993774414, "global_step": 221306, "epoch": 1317} {"train_loss": -11.930503845214844, "global_step": 221307, "epoch": 1317} {"train_loss": -11.442116737365723, "global_step": 221308, "epoch": 1317} {"train_loss": -11.20527458190918, "global_step": 221309, "epoch": 1317} {"train_loss": -10.635293006896973, "global_step": 221310, "epoch": 1317} {"train_loss": -12.002342224121094, "global_step": 221311, "epoch": 1317} {"train_loss": -10.686507225036621, "global_step": 221312, "epoch": 1317} {"train_loss": -10.813864707946777, "global_step": 221313, "epoch": 1317} {"train_loss": -10.96487808227539, "global_step": 221314, "epoch": 1317} {"train_loss": -8.822951316833496, "global_step": 221315, "epoch": 1317} {"train_loss": -10.938409805297852, "global_step": 221316, "epoch": 1317} {"train_loss": -9.892934799194336, "global_step": 221317, "epoch": 1317} {"train_loss": -10.688558578491211, "global_step": 221318, "epoch": 1317} {"train_loss": -10.993097305297852, "global_step": 221319, "epoch": 1317} {"train_loss": -10.750110626220703, "global_step": 221320, "epoch": 1317} {"train_loss": -11.172029495239258, "global_step": 221321, "epoch": 1317} {"train_loss": -10.516521453857422, "global_step": 221322, "epoch": 1317} {"train_loss": -11.68061637878418, "global_step": 221323, "epoch": 1317} {"train_loss": -10.859869956970215, "global_step": 221324, "epoch": 1317} {"train_loss": -10.912437438964844, "global_step": 221325, "epoch": 1317} {"train_loss": -11.161245346069336, "global_step": 221326, "epoch": 1317} {"train_loss": -10.635868072509766, "global_step": 221327, "epoch": 1317} {"train_loss": -10.953184127807617, "global_step": 221328, "epoch": 1317} {"train_loss": -10.80217170715332, "global_step": 221329, "epoch": 1317} {"train_loss": -10.679186820983887, "global_step": 221330, "epoch": 1317} {"train_loss": -10.907526016235352, "global_step": 221331, "epoch": 1317} {"train_loss": -9.858534812927246, "global_step": 221332, "epoch": 1317} {"train_loss": -11.241044998168945, "global_step": 221333, "epoch": 1317} {"train_loss": -10.031991958618164, "global_step": 221334, "epoch": 1317} {"train_loss": -11.147624015808105, "global_step": 221335, "epoch": 1317} {"train_loss": -10.969979286193848, "global_step": 221336, "epoch": 1317} {"train_loss": -10.750507354736328, "global_step": 221337, "epoch": 1317} {"train_loss": -11.104558944702148, "global_step": 221338, "epoch": 1317} {"train_loss": -11.145599365234375, "global_step": 221339, "epoch": 1317} {"train_loss": -11.241581916809082, "global_step": 221340, "epoch": 1317} {"train_loss": -11.293401718139648, "global_step": 221341, "epoch": 1317} {"train_loss": -11.024066925048828, "global_step": 221342, "epoch": 1317} {"train_loss": -11.000160217285156, "global_step": 221343, "epoch": 1317} {"train_loss": -11.188484191894531, "global_step": 221344, "epoch": 1317} {"train_loss": -11.018473625183105, "global_step": 221345, "epoch": 1317} {"train_loss": -11.358180046081543, "global_step": 221346, "epoch": 1317} {"train_loss": -11.11764144897461, "global_step": 221347, "epoch": 1317} {"train_loss": -11.570121765136719, "global_step": 221348, "epoch": 1317} {"train_loss": -10.986815452575684, "global_step": 221349, "epoch": 1317} {"train_loss": -11.154258728027344, "global_step": 221350, "epoch": 1317} {"train_loss": -10.85273265838623, "global_step": 221351, "epoch": 1317} {"train_loss": -11.158112525939941, "global_step": 221352, "epoch": 1317} {"train_loss": -10.775375366210938, "global_step": 221353, "epoch": 1317} {"train_loss": -11.412436485290527, "global_step": 221354, "epoch": 1317} {"train_loss": -11.3602294921875, "global_step": 221355, "epoch": 1317} {"train_loss": -11.172471046447754, "global_step": 221356, "epoch": 1317} {"train_loss": -11.595792770385742, "global_step": 221357, "epoch": 1317} {"train_loss": -11.06047534942627, "global_step": 221358, "epoch": 1317} {"train_loss": -11.477814674377441, "global_step": 221359, "epoch": 1317} {"train_loss": -11.204527854919434, "global_step": 221360, "epoch": 1317} {"train_loss": -11.351463317871094, "global_step": 221361, "epoch": 1317} {"train_loss": -11.360042572021484, "global_step": 221362, "epoch": 1317} {"train_loss": -11.68138313293457, "global_step": 221363, "epoch": 1317} {"train_loss": -11.538959503173828, "global_step": 221364, "epoch": 1317} {"train_loss": -11.35444450378418, "global_step": 221365, "epoch": 1317} {"train_loss": -11.645447731018066, "global_step": 221366, "epoch": 1317} {"train_loss": -11.410460472106934, "global_step": 221367, "epoch": 1317} {"train_loss": -11.775757789611816, "global_step": 221368, "epoch": 1317} {"train_loss": -11.436748504638672, "global_step": 221369, "epoch": 1317} {"train_loss": -11.534436225891113, "global_step": 221370, "epoch": 1317} {"train_loss": -11.451061248779297, "global_step": 221371, "epoch": 1317} {"train_loss": -11.626077651977539, "global_step": 221372, "epoch": 1317} {"train_loss": -11.826908111572266, "global_step": 221373, "epoch": 1317} {"train_loss": -11.523364067077637, "global_step": 221374, "epoch": 1317} {"train_loss": -11.698053359985352, "global_step": 221375, "epoch": 1317} {"train_loss": -11.560005187988281, "global_step": 221376, "epoch": 1317} {"train_loss": -11.728642463684082, "global_step": 221377, "epoch": 1317} {"train_loss": -11.713149070739746, "global_step": 221378, "epoch": 1317} {"train_loss": -11.845376968383789, "global_step": 221379, "epoch": 1317} {"train_loss": -11.733102798461914, "global_step": 221380, "epoch": 1317} {"train_loss": -11.935181617736816, "global_step": 221381, "epoch": 1317} {"train_loss": -11.972469329833984, "global_step": 221382, "epoch": 1317} {"train_loss": -11.742837905883789, "global_step": 221383, "epoch": 1317} {"train_loss": -11.954452514648438, "global_step": 221384, "epoch": 1317} {"train_loss": -11.688644409179688, "global_step": 221385, "epoch": 1317} {"train_loss": -11.737152099609375, "global_step": 221386, "epoch": 1317} {"train_loss": -11.741199493408203, "global_step": 221387, "epoch": 1317} {"train_loss": -11.445920944213867, "global_step": 221388, "epoch": 1317} {"train_loss": -11.777275085449219, "global_step": 221389, "epoch": 1317} {"train_loss": -11.720641136169434, "global_step": 221390, "epoch": 1317} {"train_loss": -11.793193817138672, "global_step": 221391, "epoch": 1317} {"train_loss": -11.492897033691406, "global_step": 221392, "epoch": 1317} {"train_loss": -11.612836837768555, "global_step": 221393, "epoch": 1317} {"train_loss": -11.545580863952637, "global_step": 221394, "epoch": 1317} {"train_loss": -11.62038803100586, "global_step": 221395, "epoch": 1317} {"train_loss": -11.290487289428711, "global_step": 221396, "epoch": 1317} {"train_loss": -12.100147247314453, "global_step": 221397, "epoch": 1317} {"train_loss": -11.214849472045898, "global_step": 221398, "epoch": 1317} {"train_loss": -11.160855293273926, "global_step": 221399, "epoch": 1317} {"train_loss": -11.534045219421387, "global_step": 221400, "epoch": 1317} {"train_loss": -11.669357299804688, "global_step": 221401, "epoch": 1317} {"train_loss": -11.979355812072754, "global_step": 221402, "epoch": 1317} {"train_loss": -11.903942108154297, "global_step": 221403, "epoch": 1317} {"train_loss": -11.997415542602539, "global_step": 221404, "epoch": 1317} {"train_loss": -11.868864059448242, "global_step": 221405, "epoch": 1317} {"train_loss": -11.809894561767578, "global_step": 221406, "epoch": 1317} {"train_loss": -11.76463508605957, "global_step": 221407, "epoch": 1317} {"train_loss": -11.55931282043457, "global_step": 221408, "epoch": 1317} {"train_loss": -11.851770401000977, "global_step": 221409, "epoch": 1317} {"train_loss": -11.969728469848633, "global_step": 221410, "epoch": 1317} {"train_loss": -11.462118148803711, "global_step": 221411, "epoch": 1317} {"train_loss": -11.945170402526855, "global_step": 221412, "epoch": 1317} {"train_loss": -11.534093856811523, "global_step": 221413, "epoch": 1317} {"train_loss": -11.201437950134277, "global_step": 221414, "epoch": 1317} {"train_loss": -11.545969009399414, "global_step": 221415, "epoch": 1317} {"train_loss": -11.551656723022461, "global_step": 221416, "epoch": 1317} {"train_loss": -11.455434799194336, "global_step": 221417, "epoch": 1317} {"train_loss": -11.469890594482422, "global_step": 221418, "epoch": 1317} {"train_loss": -11.719131469726562, "global_step": 221419, "epoch": 1317} {"train_loss": -11.50571060180664, "global_step": 221420, "epoch": 1317} {"train_loss": -10.842905044555664, "global_step": 221421, "epoch": 1317} {"train_loss": -11.350997924804688, "global_step": 221422, "epoch": 1317} {"train_loss": -11.452840952646165, "global_step": 221423, "epoch": 1317, "val_loss": 257640.234375} {"train_loss": -10.293486595153809, "global_step": 221424, "epoch": 1318} {"train_loss": -10.881832122802734, "global_step": 221425, "epoch": 1318} {"train_loss": -11.199186325073242, "global_step": 221426, "epoch": 1318} {"train_loss": -10.247098922729492, "global_step": 221427, "epoch": 1318} {"train_loss": -9.75551986694336, "global_step": 221428, "epoch": 1318} {"train_loss": -10.660744667053223, "global_step": 221429, "epoch": 1318} {"train_loss": -11.414694786071777, "global_step": 221430, "epoch": 1318} {"train_loss": -10.33987045288086, "global_step": 221431, "epoch": 1318} {"train_loss": -10.849014282226562, "global_step": 221432, "epoch": 1318} {"train_loss": -11.499627113342285, "global_step": 221433, "epoch": 1318} {"train_loss": -10.691865921020508, "global_step": 221434, "epoch": 1318} {"train_loss": -11.078617095947266, "global_step": 221435, "epoch": 1318} {"train_loss": -11.380533218383789, "global_step": 221436, "epoch": 1318} {"train_loss": -10.975311279296875, "global_step": 221437, "epoch": 1318} {"train_loss": -11.651388168334961, "global_step": 221438, "epoch": 1318} {"train_loss": -11.035381317138672, "global_step": 221439, "epoch": 1318} {"train_loss": -11.150418281555176, "global_step": 221440, "epoch": 1318} {"train_loss": -11.1680269241333, "global_step": 221441, "epoch": 1318} {"train_loss": -11.438066482543945, "global_step": 221442, "epoch": 1318} {"train_loss": -11.472835540771484, "global_step": 221443, "epoch": 1318} {"train_loss": -11.298530578613281, "global_step": 221444, "epoch": 1318} {"train_loss": -11.518482208251953, "global_step": 221445, "epoch": 1318} {"train_loss": -11.450042724609375, "global_step": 221446, "epoch": 1318} {"train_loss": -11.219649314880371, "global_step": 221447, "epoch": 1318} {"train_loss": -11.12828254699707, "global_step": 221448, "epoch": 1318} {"train_loss": -10.284646987915039, "global_step": 221449, "epoch": 1318} {"train_loss": -10.802669525146484, "global_step": 221450, "epoch": 1318} {"train_loss": -9.732988357543945, "global_step": 221451, "epoch": 1318} {"train_loss": -9.611390113830566, "global_step": 221452, "epoch": 1318} {"train_loss": -10.792716026306152, "global_step": 221453, "epoch": 1318} {"train_loss": -9.755077362060547, "global_step": 221454, "epoch": 1318} {"train_loss": -9.490167617797852, "global_step": 221455, "epoch": 1318} {"train_loss": -10.760418891906738, "global_step": 221456, "epoch": 1318} {"train_loss": -8.333948135375977, "global_step": 221457, "epoch": 1318} {"train_loss": -9.19998550415039, "global_step": 221458, "epoch": 1318} {"train_loss": -9.765342712402344, "global_step": 221459, "epoch": 1318} {"train_loss": -9.16789436340332, "global_step": 221460, "epoch": 1318} {"train_loss": -10.123125076293945, "global_step": 221461, "epoch": 1318} {"train_loss": -11.168206214904785, "global_step": 221462, "epoch": 1318} {"train_loss": -9.810821533203125, "global_step": 221463, "epoch": 1318} {"train_loss": -10.940193176269531, "global_step": 221464, "epoch": 1318} {"train_loss": -10.644407272338867, "global_step": 221465, "epoch": 1318} {"train_loss": -10.998542785644531, "global_step": 221466, "epoch": 1318} {"train_loss": -11.010554313659668, "global_step": 221467, "epoch": 1318} {"train_loss": -10.958072662353516, "global_step": 221468, "epoch": 1318} {"train_loss": -10.429737091064453, "global_step": 221469, "epoch": 1318} {"train_loss": -11.232017517089844, "global_step": 221470, "epoch": 1318} {"train_loss": -10.754083633422852, "global_step": 221471, "epoch": 1318} {"train_loss": -11.373884201049805, "global_step": 221472, "epoch": 1318} {"train_loss": -11.15281867980957, "global_step": 221473, "epoch": 1318} {"train_loss": -11.025747299194336, "global_step": 221474, "epoch": 1318} {"train_loss": -11.06894302368164, "global_step": 221475, "epoch": 1318} {"train_loss": -11.345155715942383, "global_step": 221476, "epoch": 1318} {"train_loss": -11.047369956970215, "global_step": 221477, "epoch": 1318} {"train_loss": -11.324100494384766, "global_step": 221478, "epoch": 1318} {"train_loss": -11.042412757873535, "global_step": 221479, "epoch": 1318} {"train_loss": -11.500572204589844, "global_step": 221480, "epoch": 1318} {"train_loss": -11.139911651611328, "global_step": 221481, "epoch": 1318} {"train_loss": -11.417266845703125, "global_step": 221482, "epoch": 1318} {"train_loss": -10.9476318359375, "global_step": 221483, "epoch": 1318} {"train_loss": -11.415267944335938, "global_step": 221484, "epoch": 1318} {"train_loss": -11.03541374206543, "global_step": 221485, "epoch": 1318} {"train_loss": -11.52824592590332, "global_step": 221486, "epoch": 1318} {"train_loss": -11.446715354919434, "global_step": 221487, "epoch": 1318} {"train_loss": -11.404291152954102, "global_step": 221488, "epoch": 1318} {"train_loss": -11.52456283569336, "global_step": 221489, "epoch": 1318} {"train_loss": -11.52005386352539, "global_step": 221490, "epoch": 1318} {"train_loss": -11.290760040283203, "global_step": 221491, "epoch": 1318} {"train_loss": -11.515096664428711, "global_step": 221492, "epoch": 1318} {"train_loss": -11.655037879943848, "global_step": 221493, "epoch": 1318} {"train_loss": -11.462373733520508, "global_step": 221494, "epoch": 1318} {"train_loss": -11.416189193725586, "global_step": 221495, "epoch": 1318} {"train_loss": -11.486759185791016, "global_step": 221496, "epoch": 1318} {"train_loss": -11.652022361755371, "global_step": 221497, "epoch": 1318} {"train_loss": -11.709413528442383, "global_step": 221498, "epoch": 1318} {"train_loss": -11.611072540283203, "global_step": 221499, "epoch": 1318} {"train_loss": -11.520524978637695, "global_step": 221500, "epoch": 1318} {"train_loss": -11.707513809204102, "global_step": 221501, "epoch": 1318} {"train_loss": -11.731931686401367, "global_step": 221502, "epoch": 1318} {"train_loss": -11.710994720458984, "global_step": 221503, "epoch": 1318} {"train_loss": -11.86328125, "global_step": 221504, "epoch": 1318} {"train_loss": -11.83833122253418, "global_step": 221505, "epoch": 1318} {"train_loss": -11.668386459350586, "global_step": 221506, "epoch": 1318} {"train_loss": -11.876860618591309, "global_step": 221507, "epoch": 1318} {"train_loss": -11.745892524719238, "global_step": 221508, "epoch": 1318} {"train_loss": -11.852130889892578, "global_step": 221509, "epoch": 1318} {"train_loss": -11.780012130737305, "global_step": 221510, "epoch": 1318} {"train_loss": -11.871576309204102, "global_step": 221511, "epoch": 1318} {"train_loss": -11.82210636138916, "global_step": 221512, "epoch": 1318} {"train_loss": -11.925065994262695, "global_step": 221513, "epoch": 1318} {"train_loss": -11.917804718017578, "global_step": 221514, "epoch": 1318} {"train_loss": -11.839211463928223, "global_step": 221515, "epoch": 1318} {"train_loss": -11.847217559814453, "global_step": 221516, "epoch": 1318} {"train_loss": -11.906370162963867, "global_step": 221517, "epoch": 1318} {"train_loss": -11.775376319885254, "global_step": 221518, "epoch": 1318} {"train_loss": -11.785391807556152, "global_step": 221519, "epoch": 1318} {"train_loss": -11.843926429748535, "global_step": 221520, "epoch": 1318} {"train_loss": -11.810791015625, "global_step": 221521, "epoch": 1318} {"train_loss": -11.82801628112793, "global_step": 221522, "epoch": 1318} {"train_loss": -11.942753791809082, "global_step": 221523, "epoch": 1318} {"train_loss": -12.070971488952637, "global_step": 221524, "epoch": 1318} {"train_loss": -12.052421569824219, "global_step": 221525, "epoch": 1318} {"train_loss": -11.919575691223145, "global_step": 221526, "epoch": 1318} {"train_loss": -11.841741561889648, "global_step": 221527, "epoch": 1318} {"train_loss": -11.844010353088379, "global_step": 221528, "epoch": 1318} {"train_loss": -11.939665794372559, "global_step": 221529, "epoch": 1318} {"train_loss": -11.994209289550781, "global_step": 221530, "epoch": 1318} {"train_loss": -11.972999572753906, "global_step": 221531, "epoch": 1318} {"train_loss": -12.091217041015625, "global_step": 221532, "epoch": 1318} {"train_loss": -11.688749313354492, "global_step": 221533, "epoch": 1318} {"train_loss": -11.449630737304688, "global_step": 221534, "epoch": 1318} {"train_loss": -11.967004776000977, "global_step": 221535, "epoch": 1318} {"train_loss": -11.530715942382812, "global_step": 221536, "epoch": 1318} {"train_loss": -11.760705947875977, "global_step": 221537, "epoch": 1318} {"train_loss": -11.798578262329102, "global_step": 221538, "epoch": 1318} {"train_loss": -12.112348556518555, "global_step": 221539, "epoch": 1318} {"train_loss": -11.2976713180542, "global_step": 221540, "epoch": 1318} {"train_loss": -10.867576599121094, "global_step": 221541, "epoch": 1318} {"train_loss": -11.741069793701172, "global_step": 221542, "epoch": 1318} {"train_loss": -10.886005401611328, "global_step": 221543, "epoch": 1318} {"train_loss": -11.87264633178711, "global_step": 221544, "epoch": 1318} {"train_loss": -11.601550102233887, "global_step": 221545, "epoch": 1318} {"train_loss": -11.640887260437012, "global_step": 221546, "epoch": 1318} {"train_loss": -11.418926239013672, "global_step": 221547, "epoch": 1318} {"train_loss": -11.466976165771484, "global_step": 221548, "epoch": 1318} {"train_loss": -10.993013381958008, "global_step": 221549, "epoch": 1318} {"train_loss": -11.543295860290527, "global_step": 221550, "epoch": 1318} {"train_loss": -10.965766906738281, "global_step": 221551, "epoch": 1318} {"train_loss": -11.384824752807617, "global_step": 221552, "epoch": 1318} {"train_loss": -10.999216079711914, "global_step": 221553, "epoch": 1318} {"train_loss": -10.956746101379395, "global_step": 221554, "epoch": 1318} {"train_loss": -11.12331771850586, "global_step": 221555, "epoch": 1318} {"train_loss": -10.598155975341797, "global_step": 221556, "epoch": 1318} {"train_loss": -10.078283309936523, "global_step": 221557, "epoch": 1318} {"train_loss": -11.242636680603027, "global_step": 221558, "epoch": 1318} {"train_loss": -10.407065391540527, "global_step": 221559, "epoch": 1318} {"train_loss": -10.991668701171875, "global_step": 221560, "epoch": 1318} {"train_loss": -10.49163818359375, "global_step": 221561, "epoch": 1318} {"train_loss": -10.847221374511719, "global_step": 221562, "epoch": 1318} {"train_loss": -10.616981506347656, "global_step": 221563, "epoch": 1318} {"train_loss": -11.035163879394531, "global_step": 221564, "epoch": 1318} {"train_loss": -10.671585083007812, "global_step": 221565, "epoch": 1318} {"train_loss": -11.614509582519531, "global_step": 221566, "epoch": 1318} {"train_loss": -10.900449752807617, "global_step": 221567, "epoch": 1318} {"train_loss": -11.142068862915039, "global_step": 221568, "epoch": 1318} {"train_loss": -11.324166297912598, "global_step": 221569, "epoch": 1318} {"train_loss": -11.392227172851562, "global_step": 221570, "epoch": 1318} {"train_loss": -11.254913330078125, "global_step": 221571, "epoch": 1318} {"train_loss": -11.547219276428223, "global_step": 221572, "epoch": 1318} {"train_loss": -11.37132740020752, "global_step": 221573, "epoch": 1318} {"train_loss": -11.326701164245605, "global_step": 221574, "epoch": 1318} {"train_loss": -11.48440933227539, "global_step": 221575, "epoch": 1318} {"train_loss": -11.580060958862305, "global_step": 221576, "epoch": 1318} {"train_loss": -11.64970588684082, "global_step": 221577, "epoch": 1318} {"train_loss": -11.48606014251709, "global_step": 221578, "epoch": 1318} {"train_loss": -11.767843246459961, "global_step": 221579, "epoch": 1318} {"train_loss": -11.524581909179688, "global_step": 221580, "epoch": 1318} {"train_loss": -11.317859649658203, "global_step": 221581, "epoch": 1318} {"train_loss": -11.69338607788086, "global_step": 221582, "epoch": 1318} {"train_loss": -11.412178039550781, "global_step": 221583, "epoch": 1318} {"train_loss": -11.689553260803223, "global_step": 221584, "epoch": 1318} {"train_loss": -11.471763610839844, "global_step": 221585, "epoch": 1318} {"train_loss": -11.69215202331543, "global_step": 221586, "epoch": 1318} {"train_loss": -11.513175964355469, "global_step": 221587, "epoch": 1318} {"train_loss": -11.634087562561035, "global_step": 221588, "epoch": 1318} {"train_loss": -11.63815689086914, "global_step": 221589, "epoch": 1318} {"train_loss": -11.543539047241211, "global_step": 221590, "epoch": 1318} {"train_loss": -11.247697347686405, "global_step": 221591, "epoch": 1318, "val_loss": 261332.953125} {"train_loss": -11.66707706451416, "global_step": 221592, "epoch": 1319} {"train_loss": -11.787532806396484, "global_step": 221593, "epoch": 1319} {"train_loss": -11.892590522766113, "global_step": 221594, "epoch": 1319} {"train_loss": -11.618047714233398, "global_step": 221595, "epoch": 1319} {"train_loss": -11.842289924621582, "global_step": 221596, "epoch": 1319} {"train_loss": -11.510370254516602, "global_step": 221597, "epoch": 1319} {"train_loss": -11.806096076965332, "global_step": 221598, "epoch": 1319} {"train_loss": -11.960138320922852, "global_step": 221599, "epoch": 1319} {"train_loss": -11.852959632873535, "global_step": 221600, "epoch": 1319} {"train_loss": -11.894895553588867, "global_step": 221601, "epoch": 1319} {"train_loss": -11.785218238830566, "global_step": 221602, "epoch": 1319} {"train_loss": -11.81067180633545, "global_step": 221603, "epoch": 1319} {"train_loss": -11.753312110900879, "global_step": 221604, "epoch": 1319} {"train_loss": -11.99665641784668, "global_step": 221605, "epoch": 1319} {"train_loss": -11.817167282104492, "global_step": 221606, "epoch": 1319} {"train_loss": -11.632253646850586, "global_step": 221607, "epoch": 1319} {"train_loss": -11.686485290527344, "global_step": 221608, "epoch": 1319} {"train_loss": -11.925134658813477, "global_step": 221609, "epoch": 1319} {"train_loss": -11.880237579345703, "global_step": 221610, "epoch": 1319} {"train_loss": -12.029516220092773, "global_step": 221611, "epoch": 1319} {"train_loss": -11.80234146118164, "global_step": 221612, "epoch": 1319} {"train_loss": -11.798054695129395, "global_step": 221613, "epoch": 1319} {"train_loss": -11.857646942138672, "global_step": 221614, "epoch": 1319} {"train_loss": -11.880167007446289, "global_step": 221615, "epoch": 1319} {"train_loss": -11.958364486694336, "global_step": 221616, "epoch": 1319} {"train_loss": -11.836624145507812, "global_step": 221617, "epoch": 1319} {"train_loss": -11.619100570678711, "global_step": 221618, "epoch": 1319} {"train_loss": -11.811609268188477, "global_step": 221619, "epoch": 1319} {"train_loss": -11.540138244628906, "global_step": 221620, "epoch": 1319} {"train_loss": -11.80013656616211, "global_step": 221621, "epoch": 1319} {"train_loss": -11.839147567749023, "global_step": 221622, "epoch": 1319} {"train_loss": -11.52607536315918, "global_step": 221623, "epoch": 1319} {"train_loss": -11.581321716308594, "global_step": 221624, "epoch": 1319} {"train_loss": -11.86789608001709, "global_step": 221625, "epoch": 1319} {"train_loss": -11.440607070922852, "global_step": 221626, "epoch": 1319} {"train_loss": -11.1036376953125, "global_step": 221627, "epoch": 1319} {"train_loss": -10.697064399719238, "global_step": 221628, "epoch": 1319} {"train_loss": -11.187540054321289, "global_step": 221629, "epoch": 1319} {"train_loss": -11.020793914794922, "global_step": 221630, "epoch": 1319} {"train_loss": -10.829629898071289, "global_step": 221631, "epoch": 1319} {"train_loss": -9.406336784362793, "global_step": 221632, "epoch": 1319} {"train_loss": -10.680904388427734, "global_step": 221633, "epoch": 1319} {"train_loss": -10.555721282958984, "global_step": 221634, "epoch": 1319} {"train_loss": -9.774432182312012, "global_step": 221635, "epoch": 1319} {"train_loss": -10.834731101989746, "global_step": 221636, "epoch": 1319} {"train_loss": -10.686548233032227, "global_step": 221637, "epoch": 1319} {"train_loss": -9.758520126342773, "global_step": 221638, "epoch": 1319} {"train_loss": -10.945554733276367, "global_step": 221639, "epoch": 1319} {"train_loss": -9.583954811096191, "global_step": 221640, "epoch": 1319} {"train_loss": -10.952754020690918, "global_step": 221641, "epoch": 1319} {"train_loss": -9.359752655029297, "global_step": 221642, "epoch": 1319} {"train_loss": -10.830562591552734, "global_step": 221643, "epoch": 1319} {"train_loss": -10.413475036621094, "global_step": 221644, "epoch": 1319} {"train_loss": -9.954710960388184, "global_step": 221645, "epoch": 1319} {"train_loss": -11.290512084960938, "global_step": 221646, "epoch": 1319} {"train_loss": -10.214824676513672, "global_step": 221647, "epoch": 1319} {"train_loss": -11.302556991577148, "global_step": 221648, "epoch": 1319} {"train_loss": -10.539000511169434, "global_step": 221649, "epoch": 1319} {"train_loss": -11.005876541137695, "global_step": 221650, "epoch": 1319} {"train_loss": -10.657658576965332, "global_step": 221651, "epoch": 1319} {"train_loss": -10.963188171386719, "global_step": 221652, "epoch": 1319} {"train_loss": -11.208991050720215, "global_step": 221653, "epoch": 1319} {"train_loss": -10.744840621948242, "global_step": 221654, "epoch": 1319} {"train_loss": -11.506561279296875, "global_step": 221655, "epoch": 1319} {"train_loss": -11.023017883300781, "global_step": 221656, "epoch": 1319} {"train_loss": -11.359029769897461, "global_step": 221657, "epoch": 1319} {"train_loss": -11.353918075561523, "global_step": 221658, "epoch": 1319} {"train_loss": -11.027630805969238, "global_step": 221659, "epoch": 1319} {"train_loss": -11.356061935424805, "global_step": 221660, "epoch": 1319} {"train_loss": -11.21783447265625, "global_step": 221661, "epoch": 1319} {"train_loss": -11.366973876953125, "global_step": 221662, "epoch": 1319} {"train_loss": -11.359184265136719, "global_step": 221663, "epoch": 1319} {"train_loss": -11.247784614562988, "global_step": 221664, "epoch": 1319} {"train_loss": -11.089494705200195, "global_step": 221665, "epoch": 1319} {"train_loss": -11.304747581481934, "global_step": 221666, "epoch": 1319} {"train_loss": -11.526006698608398, "global_step": 221667, "epoch": 1319} {"train_loss": -11.16796875, "global_step": 221668, "epoch": 1319} {"train_loss": -11.438966751098633, "global_step": 221669, "epoch": 1319} {"train_loss": -11.239892959594727, "global_step": 221670, "epoch": 1319} {"train_loss": -11.25708293914795, "global_step": 221671, "epoch": 1319} {"train_loss": -11.251379013061523, "global_step": 221672, "epoch": 1319} {"train_loss": -11.401102066040039, "global_step": 221673, "epoch": 1319} {"train_loss": -11.460695266723633, "global_step": 221674, "epoch": 1319} {"train_loss": -11.238391876220703, "global_step": 221675, "epoch": 1319} {"train_loss": -11.559452056884766, "global_step": 221676, "epoch": 1319} {"train_loss": -11.571525573730469, "global_step": 221677, "epoch": 1319} {"train_loss": -11.262592315673828, "global_step": 221678, "epoch": 1319} {"train_loss": -11.614837646484375, "global_step": 221679, "epoch": 1319} {"train_loss": -11.627219200134277, "global_step": 221680, "epoch": 1319} {"train_loss": -11.463974952697754, "global_step": 221681, "epoch": 1319} {"train_loss": -11.3639497756958, "global_step": 221682, "epoch": 1319} {"train_loss": -11.544842720031738, "global_step": 221683, "epoch": 1319} {"train_loss": -11.688695907592773, "global_step": 221684, "epoch": 1319} {"train_loss": -11.36431884765625, "global_step": 221685, "epoch": 1319} {"train_loss": -11.577651023864746, "global_step": 221686, "epoch": 1319} {"train_loss": -11.47395133972168, "global_step": 221687, "epoch": 1319} {"train_loss": -11.801618576049805, "global_step": 221688, "epoch": 1319} {"train_loss": -11.784404754638672, "global_step": 221689, "epoch": 1319} {"train_loss": -11.774145126342773, "global_step": 221690, "epoch": 1319} {"train_loss": -11.585159301757812, "global_step": 221691, "epoch": 1319} {"train_loss": -11.732112884521484, "global_step": 221692, "epoch": 1319} {"train_loss": -11.847293853759766, "global_step": 221693, "epoch": 1319} {"train_loss": -11.688507080078125, "global_step": 221694, "epoch": 1319} {"train_loss": -12.010713577270508, "global_step": 221695, "epoch": 1319} {"train_loss": -11.640338897705078, "global_step": 221696, "epoch": 1319} {"train_loss": -11.753852844238281, "global_step": 221697, "epoch": 1319} {"train_loss": -11.596532821655273, "global_step": 221698, "epoch": 1319} {"train_loss": -11.679094314575195, "global_step": 221699, "epoch": 1319} {"train_loss": -11.892868041992188, "global_step": 221700, "epoch": 1319} {"train_loss": -11.829577445983887, "global_step": 221701, "epoch": 1319} {"train_loss": -11.670970916748047, "global_step": 221702, "epoch": 1319} {"train_loss": -11.95094108581543, "global_step": 221703, "epoch": 1319} {"train_loss": -11.265691757202148, "global_step": 221704, "epoch": 1319} {"train_loss": -11.798463821411133, "global_step": 221705, "epoch": 1319} {"train_loss": -11.485576629638672, "global_step": 221706, "epoch": 1319} {"train_loss": -11.383620262145996, "global_step": 221707, "epoch": 1319} {"train_loss": -11.885808944702148, "global_step": 221708, "epoch": 1319} {"train_loss": -11.715738296508789, "global_step": 221709, "epoch": 1319} {"train_loss": -11.431589126586914, "global_step": 221710, "epoch": 1319} {"train_loss": -11.672895431518555, "global_step": 221711, "epoch": 1319} {"train_loss": -11.69260311126709, "global_step": 221712, "epoch": 1319} {"train_loss": -11.925576210021973, "global_step": 221713, "epoch": 1319} {"train_loss": -11.85909652709961, "global_step": 221714, "epoch": 1319} {"train_loss": -11.37935733795166, "global_step": 221715, "epoch": 1319} {"train_loss": -11.648283004760742, "global_step": 221716, "epoch": 1319} {"train_loss": -12.050540924072266, "global_step": 221717, "epoch": 1319} {"train_loss": -11.123579978942871, "global_step": 221718, "epoch": 1319} {"train_loss": -11.295495986938477, "global_step": 221719, "epoch": 1319} {"train_loss": -11.672195434570312, "global_step": 221720, "epoch": 1319} {"train_loss": -11.811612129211426, "global_step": 221721, "epoch": 1319} {"train_loss": -11.622053146362305, "global_step": 221722, "epoch": 1319} {"train_loss": -11.706125259399414, "global_step": 221723, "epoch": 1319} {"train_loss": -11.701780319213867, "global_step": 221724, "epoch": 1319} {"train_loss": -11.784492492675781, "global_step": 221725, "epoch": 1319} {"train_loss": -11.445602416992188, "global_step": 221726, "epoch": 1319} {"train_loss": -11.69954776763916, "global_step": 221727, "epoch": 1319} {"train_loss": -11.379596710205078, "global_step": 221728, "epoch": 1319} {"train_loss": -11.480794906616211, "global_step": 221729, "epoch": 1319} {"train_loss": -11.3616304397583, "global_step": 221730, "epoch": 1319} {"train_loss": -11.592442512512207, "global_step": 221731, "epoch": 1319} {"train_loss": -11.192005157470703, "global_step": 221732, "epoch": 1319} {"train_loss": -11.598762512207031, "global_step": 221733, "epoch": 1319} {"train_loss": -10.961519241333008, "global_step": 221734, "epoch": 1319} {"train_loss": -11.294321060180664, "global_step": 221735, "epoch": 1319} {"train_loss": -11.20244026184082, "global_step": 221736, "epoch": 1319} {"train_loss": -11.41286849975586, "global_step": 221737, "epoch": 1319} {"train_loss": -11.291982650756836, "global_step": 221738, "epoch": 1319} {"train_loss": -11.349435806274414, "global_step": 221739, "epoch": 1319} {"train_loss": -11.31786060333252, "global_step": 221740, "epoch": 1319} {"train_loss": -11.57967758178711, "global_step": 221741, "epoch": 1319} {"train_loss": -11.305447578430176, "global_step": 221742, "epoch": 1319} {"train_loss": -11.305158615112305, "global_step": 221743, "epoch": 1319} {"train_loss": -11.610986709594727, "global_step": 221744, "epoch": 1319} {"train_loss": -11.291213989257812, "global_step": 221745, "epoch": 1319} {"train_loss": -11.743692398071289, "global_step": 221746, "epoch": 1319} {"train_loss": -11.474266052246094, "global_step": 221747, "epoch": 1319} {"train_loss": -11.153753280639648, "global_step": 221748, "epoch": 1319} {"train_loss": -11.416619300842285, "global_step": 221749, "epoch": 1319} {"train_loss": -11.460765838623047, "global_step": 221750, "epoch": 1319} {"train_loss": -10.138833999633789, "global_step": 221751, "epoch": 1319} {"train_loss": -11.722177505493164, "global_step": 221752, "epoch": 1319} {"train_loss": -11.152754783630371, "global_step": 221753, "epoch": 1319} {"train_loss": -11.001057624816895, "global_step": 221754, "epoch": 1319} {"train_loss": -11.401857376098633, "global_step": 221755, "epoch": 1319} {"train_loss": -11.691662788391113, "global_step": 221756, "epoch": 1319} {"train_loss": -10.965127944946289, "global_step": 221757, "epoch": 1319} {"train_loss": -11.716227531433105, "global_step": 221758, "epoch": 1319} {"train_loss": -11.393708915937514, "global_step": 221759, "epoch": 1319, "val_loss": 262374.5625} {"train_loss": -11.182666778564453, "global_step": 221760, "epoch": 1320} {"train_loss": -11.583503723144531, "global_step": 221761, "epoch": 1320} {"train_loss": -10.671354293823242, "global_step": 221762, "epoch": 1320} {"train_loss": -11.733333587646484, "global_step": 221763, "epoch": 1320} {"train_loss": -10.708816528320312, "global_step": 221764, "epoch": 1320} {"train_loss": -11.171051025390625, "global_step": 221765, "epoch": 1320} {"train_loss": -11.436138153076172, "global_step": 221766, "epoch": 1320} {"train_loss": -10.779303550720215, "global_step": 221767, "epoch": 1320} {"train_loss": -11.63894271850586, "global_step": 221768, "epoch": 1320} {"train_loss": -11.072002410888672, "global_step": 221769, "epoch": 1320} {"train_loss": -11.28095817565918, "global_step": 221770, "epoch": 1320} {"train_loss": -10.837570190429688, "global_step": 221771, "epoch": 1320} {"train_loss": -10.931867599487305, "global_step": 221772, "epoch": 1320} {"train_loss": -11.34981918334961, "global_step": 221773, "epoch": 1320} {"train_loss": -10.924857139587402, "global_step": 221774, "epoch": 1320} {"train_loss": -11.417718887329102, "global_step": 221775, "epoch": 1320} {"train_loss": -11.306659698486328, "global_step": 221776, "epoch": 1320} {"train_loss": -11.620868682861328, "global_step": 221777, "epoch": 1320} {"train_loss": -11.73507308959961, "global_step": 221778, "epoch": 1320} {"train_loss": -11.512361526489258, "global_step": 221779, "epoch": 1320} {"train_loss": -11.629164695739746, "global_step": 221780, "epoch": 1320} {"train_loss": -11.723404884338379, "global_step": 221781, "epoch": 1320} {"train_loss": -11.735307693481445, "global_step": 221782, "epoch": 1320} {"train_loss": -11.727956771850586, "global_step": 221783, "epoch": 1320} {"train_loss": -11.855621337890625, "global_step": 221784, "epoch": 1320} {"train_loss": -11.585379600524902, "global_step": 221785, "epoch": 1320} {"train_loss": -11.821438789367676, "global_step": 221786, "epoch": 1320} {"train_loss": -11.678483963012695, "global_step": 221787, "epoch": 1320} {"train_loss": -11.749788284301758, "global_step": 221788, "epoch": 1320} {"train_loss": -11.80049991607666, "global_step": 221789, "epoch": 1320} {"train_loss": -11.545449256896973, "global_step": 221790, "epoch": 1320} {"train_loss": -11.679457664489746, "global_step": 221791, "epoch": 1320} {"train_loss": -11.64923095703125, "global_step": 221792, "epoch": 1320} {"train_loss": -11.715362548828125, "global_step": 221793, "epoch": 1320} {"train_loss": -11.531521797180176, "global_step": 221794, "epoch": 1320} {"train_loss": -11.771369934082031, "global_step": 221795, "epoch": 1320} {"train_loss": -11.93967342376709, "global_step": 221796, "epoch": 1320} {"train_loss": -11.704080581665039, "global_step": 221797, "epoch": 1320} {"train_loss": -11.860624313354492, "global_step": 221798, "epoch": 1320} {"train_loss": -11.647234916687012, "global_step": 221799, "epoch": 1320} {"train_loss": -11.90296745300293, "global_step": 221800, "epoch": 1320} {"train_loss": -11.790322303771973, "global_step": 221801, "epoch": 1320} {"train_loss": -11.778573036193848, "global_step": 221802, "epoch": 1320} {"train_loss": -11.788278579711914, "global_step": 221803, "epoch": 1320} {"train_loss": -11.929155349731445, "global_step": 221804, "epoch": 1320} {"train_loss": -11.807955741882324, "global_step": 221805, "epoch": 1320} {"train_loss": -11.81627082824707, "global_step": 221806, "epoch": 1320} {"train_loss": -11.589505195617676, "global_step": 221807, "epoch": 1320} {"train_loss": -11.658583641052246, "global_step": 221808, "epoch": 1320} {"train_loss": -11.51389217376709, "global_step": 221809, "epoch": 1320} {"train_loss": -11.483113288879395, "global_step": 221810, "epoch": 1320} {"train_loss": -11.934305191040039, "global_step": 221811, "epoch": 1320} {"train_loss": -11.857622146606445, "global_step": 221812, "epoch": 1320} {"train_loss": -11.618141174316406, "global_step": 221813, "epoch": 1320} {"train_loss": -11.76229476928711, "global_step": 221814, "epoch": 1320} {"train_loss": -11.941352844238281, "global_step": 221815, "epoch": 1320} {"train_loss": -11.806622505187988, "global_step": 221816, "epoch": 1320} {"train_loss": -11.760823249816895, "global_step": 221817, "epoch": 1320} {"train_loss": -11.61115837097168, "global_step": 221818, "epoch": 1320} {"train_loss": -12.018875122070312, "global_step": 221819, "epoch": 1320} {"train_loss": -11.72842788696289, "global_step": 221820, "epoch": 1320} {"train_loss": -11.134028434753418, "global_step": 221821, "epoch": 1320} {"train_loss": -10.547127723693848, "global_step": 221822, "epoch": 1320} {"train_loss": -11.375865936279297, "global_step": 221823, "epoch": 1320} {"train_loss": -10.892271041870117, "global_step": 221824, "epoch": 1320} {"train_loss": -11.536884307861328, "global_step": 221825, "epoch": 1320} {"train_loss": -11.217121124267578, "global_step": 221826, "epoch": 1320} {"train_loss": -11.66325855255127, "global_step": 221827, "epoch": 1320} {"train_loss": -11.150489807128906, "global_step": 221828, "epoch": 1320} {"train_loss": -10.758769989013672, "global_step": 221829, "epoch": 1320} {"train_loss": -10.935439109802246, "global_step": 221830, "epoch": 1320} {"train_loss": -11.631900787353516, "global_step": 221831, "epoch": 1320} {"train_loss": -11.521574020385742, "global_step": 221832, "epoch": 1320} {"train_loss": -11.421306610107422, "global_step": 221833, "epoch": 1320} {"train_loss": -11.498933792114258, "global_step": 221834, "epoch": 1320} {"train_loss": -10.996109008789062, "global_step": 221835, "epoch": 1320} {"train_loss": -11.308504104614258, "global_step": 221836, "epoch": 1320} {"train_loss": -10.992659568786621, "global_step": 221837, "epoch": 1320} {"train_loss": -11.250446319580078, "global_step": 221838, "epoch": 1320} {"train_loss": -10.734621047973633, "global_step": 221839, "epoch": 1320} {"train_loss": -10.8333740234375, "global_step": 221840, "epoch": 1320} {"train_loss": -11.306329727172852, "global_step": 221841, "epoch": 1320} {"train_loss": -10.882081985473633, "global_step": 221842, "epoch": 1320} {"train_loss": -11.528268814086914, "global_step": 221843, "epoch": 1320} {"train_loss": -11.05558967590332, "global_step": 221844, "epoch": 1320} {"train_loss": -11.37681770324707, "global_step": 221845, "epoch": 1320} {"train_loss": -11.14289665222168, "global_step": 221846, "epoch": 1320} {"train_loss": -10.443178176879883, "global_step": 221847, "epoch": 1320} {"train_loss": -11.175432205200195, "global_step": 221848, "epoch": 1320} {"train_loss": -10.212961196899414, "global_step": 221849, "epoch": 1320} {"train_loss": -9.424213409423828, "global_step": 221850, "epoch": 1320} {"train_loss": -10.79653549194336, "global_step": 221851, "epoch": 1320} {"train_loss": -10.46237564086914, "global_step": 221852, "epoch": 1320} {"train_loss": -10.426164627075195, "global_step": 221853, "epoch": 1320} {"train_loss": -10.874337196350098, "global_step": 221854, "epoch": 1320} {"train_loss": -10.786649703979492, "global_step": 221855, "epoch": 1320} {"train_loss": -10.123576164245605, "global_step": 221856, "epoch": 1320} {"train_loss": -11.161050796508789, "global_step": 221857, "epoch": 1320} {"train_loss": -10.07534408569336, "global_step": 221858, "epoch": 1320} {"train_loss": -11.324701309204102, "global_step": 221859, "epoch": 1320} {"train_loss": -10.483808517456055, "global_step": 221860, "epoch": 1320} {"train_loss": -10.781250953674316, "global_step": 221861, "epoch": 1320} {"train_loss": -10.487855911254883, "global_step": 221862, "epoch": 1320} {"train_loss": -11.337931632995605, "global_step": 221863, "epoch": 1320} {"train_loss": -10.801079750061035, "global_step": 221864, "epoch": 1320} {"train_loss": -11.09140396118164, "global_step": 221865, "epoch": 1320} {"train_loss": -10.675970077514648, "global_step": 221866, "epoch": 1320} {"train_loss": -10.80124282836914, "global_step": 221867, "epoch": 1320} {"train_loss": -10.722650527954102, "global_step": 221868, "epoch": 1320} {"train_loss": -10.881551742553711, "global_step": 221869, "epoch": 1320} {"train_loss": -10.587883949279785, "global_step": 221870, "epoch": 1320} {"train_loss": -11.123342514038086, "global_step": 221871, "epoch": 1320} {"train_loss": -11.235787391662598, "global_step": 221872, "epoch": 1320} {"train_loss": -10.664859771728516, "global_step": 221873, "epoch": 1320} {"train_loss": -10.884305953979492, "global_step": 221874, "epoch": 1320} {"train_loss": -11.061603546142578, "global_step": 221875, "epoch": 1320} {"train_loss": -10.616968154907227, "global_step": 221876, "epoch": 1320} {"train_loss": -10.9779634475708, "global_step": 221877, "epoch": 1320} {"train_loss": -10.21027946472168, "global_step": 221878, "epoch": 1320} {"train_loss": -11.146970748901367, "global_step": 221879, "epoch": 1320} {"train_loss": -10.799842834472656, "global_step": 221880, "epoch": 1320} {"train_loss": -10.439679145812988, "global_step": 221881, "epoch": 1320} {"train_loss": -10.359489440917969, "global_step": 221882, "epoch": 1320} {"train_loss": -10.526719093322754, "global_step": 221883, "epoch": 1320} {"train_loss": -10.587836265563965, "global_step": 221884, "epoch": 1320} {"train_loss": -11.279146194458008, "global_step": 221885, "epoch": 1320} {"train_loss": -10.736143112182617, "global_step": 221886, "epoch": 1320} {"train_loss": -11.070838928222656, "global_step": 221887, "epoch": 1320} {"train_loss": -11.403703689575195, "global_step": 221888, "epoch": 1320} {"train_loss": -11.072860717773438, "global_step": 221889, "epoch": 1320} {"train_loss": -11.198959350585938, "global_step": 221890, "epoch": 1320} {"train_loss": -11.414572715759277, "global_step": 221891, "epoch": 1320} {"train_loss": -11.352514266967773, "global_step": 221892, "epoch": 1320} {"train_loss": -11.555716514587402, "global_step": 221893, "epoch": 1320} {"train_loss": -11.467351913452148, "global_step": 221894, "epoch": 1320} {"train_loss": -11.542551040649414, "global_step": 221895, "epoch": 1320} {"train_loss": -11.588310241699219, "global_step": 221896, "epoch": 1320} {"train_loss": -11.538629531860352, "global_step": 221897, "epoch": 1320} {"train_loss": -11.466093063354492, "global_step": 221898, "epoch": 1320} {"train_loss": -11.263099670410156, "global_step": 221899, "epoch": 1320} {"train_loss": -11.183237075805664, "global_step": 221900, "epoch": 1320} {"train_loss": -11.651398658752441, "global_step": 221901, "epoch": 1320} {"train_loss": -11.454412460327148, "global_step": 221902, "epoch": 1320} {"train_loss": -11.339639663696289, "global_step": 221903, "epoch": 1320} {"train_loss": -11.368075370788574, "global_step": 221904, "epoch": 1320} {"train_loss": -11.389455795288086, "global_step": 221905, "epoch": 1320} {"train_loss": -11.15369987487793, "global_step": 221906, "epoch": 1320} {"train_loss": -11.75507926940918, "global_step": 221907, "epoch": 1320} {"train_loss": -11.239330291748047, "global_step": 221908, "epoch": 1320} {"train_loss": -11.831913948059082, "global_step": 221909, "epoch": 1320} {"train_loss": -11.273321151733398, "global_step": 221910, "epoch": 1320} {"train_loss": -11.712204933166504, "global_step": 221911, "epoch": 1320} {"train_loss": -11.407292366027832, "global_step": 221912, "epoch": 1320} {"train_loss": -11.574735641479492, "global_step": 221913, "epoch": 1320} {"train_loss": -11.546660423278809, "global_step": 221914, "epoch": 1320} {"train_loss": -11.334415435791016, "global_step": 221915, "epoch": 1320} {"train_loss": -11.508398056030273, "global_step": 221916, "epoch": 1320} {"train_loss": -11.66994857788086, "global_step": 221917, "epoch": 1320} {"train_loss": -11.62389850616455, "global_step": 221918, "epoch": 1320} {"train_loss": -11.582834243774414, "global_step": 221919, "epoch": 1320} {"train_loss": -11.67793083190918, "global_step": 221920, "epoch": 1320} {"train_loss": -11.4724702835083, "global_step": 221921, "epoch": 1320} {"train_loss": -11.373634338378906, "global_step": 221922, "epoch": 1320} {"train_loss": -11.547140121459961, "global_step": 221923, "epoch": 1320} {"train_loss": -11.348047256469727, "global_step": 221924, "epoch": 1320} {"train_loss": -11.736478805541992, "global_step": 221925, "epoch": 1320} {"train_loss": -11.381603240966797, "global_step": 221926, "epoch": 1320} {"train_loss": -11.282652162370228, "global_step": 221927, "epoch": 1320, "val_loss": 262626.9375, "train_action_mse_error": 1.7213444709777832} {"train_loss": -11.749889373779297, "global_step": 221928, "epoch": 1321} {"train_loss": -11.489751815795898, "global_step": 221929, "epoch": 1321} {"train_loss": -11.751386642456055, "global_step": 221930, "epoch": 1321} {"train_loss": -11.531017303466797, "global_step": 221931, "epoch": 1321} {"train_loss": -11.733989715576172, "global_step": 221932, "epoch": 1321} {"train_loss": -11.577254295349121, "global_step": 221933, "epoch": 1321} {"train_loss": -11.618124008178711, "global_step": 221934, "epoch": 1321} {"train_loss": -11.568278312683105, "global_step": 221935, "epoch": 1321} {"train_loss": -11.719681739807129, "global_step": 221936, "epoch": 1321} {"train_loss": -11.85702896118164, "global_step": 221937, "epoch": 1321} {"train_loss": -11.775131225585938, "global_step": 221938, "epoch": 1321} {"train_loss": -11.971186637878418, "global_step": 221939, "epoch": 1321} {"train_loss": -11.790518760681152, "global_step": 221940, "epoch": 1321} {"train_loss": -12.048542022705078, "global_step": 221941, "epoch": 1321} {"train_loss": -11.719703674316406, "global_step": 221942, "epoch": 1321} {"train_loss": -11.850420951843262, "global_step": 221943, "epoch": 1321} {"train_loss": -11.590596199035645, "global_step": 221944, "epoch": 1321} {"train_loss": -11.69093132019043, "global_step": 221945, "epoch": 1321} {"train_loss": -11.722647666931152, "global_step": 221946, "epoch": 1321} {"train_loss": -11.713534355163574, "global_step": 221947, "epoch": 1321} {"train_loss": -11.664759635925293, "global_step": 221948, "epoch": 1321} {"train_loss": -11.917121887207031, "global_step": 221949, "epoch": 1321} {"train_loss": -11.781740188598633, "global_step": 221950, "epoch": 1321} {"train_loss": -11.966131210327148, "global_step": 221951, "epoch": 1321} {"train_loss": -11.664173126220703, "global_step": 221952, "epoch": 1321} {"train_loss": -11.89045238494873, "global_step": 221953, "epoch": 1321} {"train_loss": -11.95245361328125, "global_step": 221954, "epoch": 1321} {"train_loss": -11.860309600830078, "global_step": 221955, "epoch": 1321} {"train_loss": -11.890726089477539, "global_step": 221956, "epoch": 1321} {"train_loss": -12.075223922729492, "global_step": 221957, "epoch": 1321} {"train_loss": -11.694725036621094, "global_step": 221958, "epoch": 1321} {"train_loss": -11.872976303100586, "global_step": 221959, "epoch": 1321} {"train_loss": -11.96285629272461, "global_step": 221960, "epoch": 1321} {"train_loss": -11.792986869812012, "global_step": 221961, "epoch": 1321} {"train_loss": -12.12039852142334, "global_step": 221962, "epoch": 1321} {"train_loss": -11.989970207214355, "global_step": 221963, "epoch": 1321} {"train_loss": -11.973634719848633, "global_step": 221964, "epoch": 1321} {"train_loss": -12.12332534790039, "global_step": 221965, "epoch": 1321} {"train_loss": -11.718613624572754, "global_step": 221966, "epoch": 1321} {"train_loss": -11.747228622436523, "global_step": 221967, "epoch": 1321} {"train_loss": -12.119623184204102, "global_step": 221968, "epoch": 1321} {"train_loss": -11.909746170043945, "global_step": 221969, "epoch": 1321} {"train_loss": -11.393779754638672, "global_step": 221970, "epoch": 1321} {"train_loss": -11.788654327392578, "global_step": 221971, "epoch": 1321} {"train_loss": -11.974811553955078, "global_step": 221972, "epoch": 1321} {"train_loss": -11.22960090637207, "global_step": 221973, "epoch": 1321} {"train_loss": -11.290451049804688, "global_step": 221974, "epoch": 1321} {"train_loss": -12.025721549987793, "global_step": 221975, "epoch": 1321} {"train_loss": -11.735986709594727, "global_step": 221976, "epoch": 1321} {"train_loss": -11.648305892944336, "global_step": 221977, "epoch": 1321} {"train_loss": -11.036367416381836, "global_step": 221978, "epoch": 1321} {"train_loss": -10.255220413208008, "global_step": 221979, "epoch": 1321} {"train_loss": -11.787772178649902, "global_step": 221980, "epoch": 1321} {"train_loss": -11.292022705078125, "global_step": 221981, "epoch": 1321} {"train_loss": -9.559103965759277, "global_step": 221982, "epoch": 1321} {"train_loss": -11.470697402954102, "global_step": 221983, "epoch": 1321} {"train_loss": -10.634235382080078, "global_step": 221984, "epoch": 1321} {"train_loss": -10.628894805908203, "global_step": 221985, "epoch": 1321} {"train_loss": -11.591678619384766, "global_step": 221986, "epoch": 1321} {"train_loss": -10.039497375488281, "global_step": 221987, "epoch": 1321} {"train_loss": -10.974654197692871, "global_step": 221988, "epoch": 1321} {"train_loss": -10.913525581359863, "global_step": 221989, "epoch": 1321} {"train_loss": -11.28231430053711, "global_step": 221990, "epoch": 1321} {"train_loss": -11.049906730651855, "global_step": 221991, "epoch": 1321} {"train_loss": -10.941052436828613, "global_step": 221992, "epoch": 1321} {"train_loss": -11.545019149780273, "global_step": 221993, "epoch": 1321} {"train_loss": -11.176556587219238, "global_step": 221994, "epoch": 1321} {"train_loss": -11.241263389587402, "global_step": 221995, "epoch": 1321} {"train_loss": -11.425190925598145, "global_step": 221996, "epoch": 1321} {"train_loss": -11.375715255737305, "global_step": 221997, "epoch": 1321} {"train_loss": -11.379638671875, "global_step": 221998, "epoch": 1321} {"train_loss": -10.959423065185547, "global_step": 221999, "epoch": 1321} {"train_loss": -11.605016708374023, "global_step": 222000, "epoch": 1321} {"train_loss": -11.19692611694336, "global_step": 222001, "epoch": 1321} {"train_loss": -11.36443042755127, "global_step": 222002, "epoch": 1321} {"train_loss": -11.733055114746094, "global_step": 222003, "epoch": 1321} {"train_loss": -11.458178520202637, "global_step": 222004, "epoch": 1321} {"train_loss": -10.976898193359375, "global_step": 222005, "epoch": 1321} {"train_loss": -11.264694213867188, "global_step": 222006, "epoch": 1321} {"train_loss": -11.365373611450195, "global_step": 222007, "epoch": 1321} {"train_loss": -11.123054504394531, "global_step": 222008, "epoch": 1321} {"train_loss": -11.451717376708984, "global_step": 222009, "epoch": 1321} {"train_loss": -11.301437377929688, "global_step": 222010, "epoch": 1321} {"train_loss": -11.50864315032959, "global_step": 222011, "epoch": 1321} {"train_loss": -11.194540023803711, "global_step": 222012, "epoch": 1321} {"train_loss": -11.560235977172852, "global_step": 222013, "epoch": 1321} {"train_loss": -11.486695289611816, "global_step": 222014, "epoch": 1321} {"train_loss": -11.590968132019043, "global_step": 222015, "epoch": 1321} {"train_loss": -11.336185455322266, "global_step": 222016, "epoch": 1321} {"train_loss": -11.719976425170898, "global_step": 222017, "epoch": 1321} {"train_loss": -11.591684341430664, "global_step": 222018, "epoch": 1321} {"train_loss": -11.441981315612793, "global_step": 222019, "epoch": 1321} {"train_loss": -11.63817310333252, "global_step": 222020, "epoch": 1321} {"train_loss": -11.410701751708984, "global_step": 222021, "epoch": 1321} {"train_loss": -11.517159461975098, "global_step": 222022, "epoch": 1321} {"train_loss": -11.411078453063965, "global_step": 222023, "epoch": 1321} {"train_loss": -11.253036499023438, "global_step": 222024, "epoch": 1321} {"train_loss": -11.609138488769531, "global_step": 222025, "epoch": 1321} {"train_loss": -11.231674194335938, "global_step": 222026, "epoch": 1321} {"train_loss": -11.638280868530273, "global_step": 222027, "epoch": 1321} {"train_loss": -11.49131965637207, "global_step": 222028, "epoch": 1321} {"train_loss": -11.631912231445312, "global_step": 222029, "epoch": 1321} {"train_loss": -11.377364158630371, "global_step": 222030, "epoch": 1321} {"train_loss": -11.47597885131836, "global_step": 222031, "epoch": 1321} {"train_loss": -11.670365333557129, "global_step": 222032, "epoch": 1321} {"train_loss": -11.490985870361328, "global_step": 222033, "epoch": 1321} {"train_loss": -11.568317413330078, "global_step": 222034, "epoch": 1321} {"train_loss": -11.373078346252441, "global_step": 222035, "epoch": 1321} {"train_loss": -11.227893829345703, "global_step": 222036, "epoch": 1321} {"train_loss": -11.334962844848633, "global_step": 222037, "epoch": 1321} {"train_loss": -11.314783096313477, "global_step": 222038, "epoch": 1321} {"train_loss": -11.503958702087402, "global_step": 222039, "epoch": 1321} {"train_loss": -11.339407920837402, "global_step": 222040, "epoch": 1321} {"train_loss": -10.898237228393555, "global_step": 222041, "epoch": 1321} {"train_loss": -11.115699768066406, "global_step": 222042, "epoch": 1321} {"train_loss": -11.480076789855957, "global_step": 222043, "epoch": 1321} {"train_loss": -10.796677589416504, "global_step": 222044, "epoch": 1321} {"train_loss": -11.424524307250977, "global_step": 222045, "epoch": 1321} {"train_loss": -11.186198234558105, "global_step": 222046, "epoch": 1321} {"train_loss": -11.269495964050293, "global_step": 222047, "epoch": 1321} {"train_loss": -11.516339302062988, "global_step": 222048, "epoch": 1321} {"train_loss": -11.125479698181152, "global_step": 222049, "epoch": 1321} {"train_loss": -11.227886199951172, "global_step": 222050, "epoch": 1321} {"train_loss": -11.42945671081543, "global_step": 222051, "epoch": 1321} {"train_loss": -11.468761444091797, "global_step": 222052, "epoch": 1321} {"train_loss": -11.287671089172363, "global_step": 222053, "epoch": 1321} {"train_loss": -11.647199630737305, "global_step": 222054, "epoch": 1321} {"train_loss": -11.545554161071777, "global_step": 222055, "epoch": 1321} {"train_loss": -11.241172790527344, "global_step": 222056, "epoch": 1321} {"train_loss": -11.380046844482422, "global_step": 222057, "epoch": 1321} {"train_loss": -11.316608428955078, "global_step": 222058, "epoch": 1321} {"train_loss": -11.740886688232422, "global_step": 222059, "epoch": 1321} {"train_loss": -11.615367889404297, "global_step": 222060, "epoch": 1321} {"train_loss": -11.28918170928955, "global_step": 222061, "epoch": 1321} {"train_loss": -11.46455192565918, "global_step": 222062, "epoch": 1321} {"train_loss": -11.298115730285645, "global_step": 222063, "epoch": 1321} {"train_loss": -11.468975067138672, "global_step": 222064, "epoch": 1321} {"train_loss": -11.103254318237305, "global_step": 222065, "epoch": 1321} {"train_loss": -11.521204948425293, "global_step": 222066, "epoch": 1321} {"train_loss": -10.748786926269531, "global_step": 222067, "epoch": 1321} {"train_loss": -11.192180633544922, "global_step": 222068, "epoch": 1321} {"train_loss": -10.94892692565918, "global_step": 222069, "epoch": 1321} {"train_loss": -11.101119995117188, "global_step": 222070, "epoch": 1321} {"train_loss": -11.271258354187012, "global_step": 222071, "epoch": 1321} {"train_loss": -11.066225051879883, "global_step": 222072, "epoch": 1321} {"train_loss": -11.87513542175293, "global_step": 222073, "epoch": 1321} {"train_loss": -10.942215919494629, "global_step": 222074, "epoch": 1321} {"train_loss": -11.656961441040039, "global_step": 222075, "epoch": 1321} {"train_loss": -11.273208618164062, "global_step": 222076, "epoch": 1321} {"train_loss": -11.572026252746582, "global_step": 222077, "epoch": 1321} {"train_loss": -11.174201011657715, "global_step": 222078, "epoch": 1321} {"train_loss": -11.362833023071289, "global_step": 222079, "epoch": 1321} {"train_loss": -11.647967338562012, "global_step": 222080, "epoch": 1321} {"train_loss": -11.387353897094727, "global_step": 222081, "epoch": 1321} {"train_loss": -11.648874282836914, "global_step": 222082, "epoch": 1321} {"train_loss": -10.908363342285156, "global_step": 222083, "epoch": 1321} {"train_loss": -10.598179817199707, "global_step": 222084, "epoch": 1321} {"train_loss": -10.751378059387207, "global_step": 222085, "epoch": 1321} {"train_loss": -9.171375274658203, "global_step": 222086, "epoch": 1321} {"train_loss": -10.24901008605957, "global_step": 222087, "epoch": 1321} {"train_loss": -8.7200288772583, "global_step": 222088, "epoch": 1321} {"train_loss": -10.900489807128906, "global_step": 222089, "epoch": 1321} {"train_loss": -9.38320541381836, "global_step": 222090, "epoch": 1321} {"train_loss": -10.414746284484863, "global_step": 222091, "epoch": 1321} {"train_loss": -10.796443939208984, "global_step": 222092, "epoch": 1321} {"train_loss": -10.323281288146973, "global_step": 222093, "epoch": 1321} {"train_loss": -10.536870956420898, "global_step": 222094, "epoch": 1321} {"train_loss": -11.36671246801104, "global_step": 222095, "epoch": 1321, "val_loss": 260887.140625} {"train_loss": -10.441673278808594, "global_step": 222096, "epoch": 1322} {"train_loss": -9.616056442260742, "global_step": 222097, "epoch": 1322} {"train_loss": -10.424038887023926, "global_step": 222098, "epoch": 1322} {"train_loss": -10.325883865356445, "global_step": 222099, "epoch": 1322} {"train_loss": -10.310224533081055, "global_step": 222100, "epoch": 1322} {"train_loss": -10.234345436096191, "global_step": 222101, "epoch": 1322} {"train_loss": -11.000974655151367, "global_step": 222102, "epoch": 1322} {"train_loss": -10.428369522094727, "global_step": 222103, "epoch": 1322} {"train_loss": -10.912862777709961, "global_step": 222104, "epoch": 1322} {"train_loss": -11.16041088104248, "global_step": 222105, "epoch": 1322} {"train_loss": -10.971611022949219, "global_step": 222106, "epoch": 1322} {"train_loss": -11.22343635559082, "global_step": 222107, "epoch": 1322} {"train_loss": -11.183130264282227, "global_step": 222108, "epoch": 1322} {"train_loss": -11.49206829071045, "global_step": 222109, "epoch": 1322} {"train_loss": -11.076176643371582, "global_step": 222110, "epoch": 1322} {"train_loss": -11.15307331085205, "global_step": 222111, "epoch": 1322} {"train_loss": -11.435919761657715, "global_step": 222112, "epoch": 1322} {"train_loss": -11.564985275268555, "global_step": 222113, "epoch": 1322} {"train_loss": -11.450199127197266, "global_step": 222114, "epoch": 1322} {"train_loss": -11.52208137512207, "global_step": 222115, "epoch": 1322} {"train_loss": -11.460451126098633, "global_step": 222116, "epoch": 1322} {"train_loss": -11.417501449584961, "global_step": 222117, "epoch": 1322} {"train_loss": -11.522170066833496, "global_step": 222118, "epoch": 1322} {"train_loss": -11.6527099609375, "global_step": 222119, "epoch": 1322} {"train_loss": -11.467754364013672, "global_step": 222120, "epoch": 1322} {"train_loss": -11.686283111572266, "global_step": 222121, "epoch": 1322} {"train_loss": -11.620718955993652, "global_step": 222122, "epoch": 1322} {"train_loss": -11.608407974243164, "global_step": 222123, "epoch": 1322} {"train_loss": -11.584047317504883, "global_step": 222124, "epoch": 1322} {"train_loss": -11.749631881713867, "global_step": 222125, "epoch": 1322} {"train_loss": -11.53791618347168, "global_step": 222126, "epoch": 1322} {"train_loss": -11.577686309814453, "global_step": 222127, "epoch": 1322} {"train_loss": -11.37240219116211, "global_step": 222128, "epoch": 1322} {"train_loss": -11.656423568725586, "global_step": 222129, "epoch": 1322} {"train_loss": -11.319890975952148, "global_step": 222130, "epoch": 1322} {"train_loss": -11.699846267700195, "global_step": 222131, "epoch": 1322} {"train_loss": -11.749329566955566, "global_step": 222132, "epoch": 1322} {"train_loss": -11.57763671875, "global_step": 222133, "epoch": 1322} {"train_loss": -11.815013885498047, "global_step": 222134, "epoch": 1322} {"train_loss": -11.787518501281738, "global_step": 222135, "epoch": 1322} {"train_loss": -11.589874267578125, "global_step": 222136, "epoch": 1322} {"train_loss": -11.628177642822266, "global_step": 222137, "epoch": 1322} {"train_loss": -11.721076965332031, "global_step": 222138, "epoch": 1322} {"train_loss": -11.845497131347656, "global_step": 222139, "epoch": 1322} {"train_loss": -11.73135757446289, "global_step": 222140, "epoch": 1322} {"train_loss": -11.801740646362305, "global_step": 222141, "epoch": 1322} {"train_loss": -11.786502838134766, "global_step": 222142, "epoch": 1322} {"train_loss": -11.678135871887207, "global_step": 222143, "epoch": 1322} {"train_loss": -11.752016067504883, "global_step": 222144, "epoch": 1322} {"train_loss": -11.901420593261719, "global_step": 222145, "epoch": 1322} {"train_loss": -11.787940979003906, "global_step": 222146, "epoch": 1322} {"train_loss": -11.777654647827148, "global_step": 222147, "epoch": 1322} {"train_loss": -11.881546020507812, "global_step": 222148, "epoch": 1322} {"train_loss": -11.860381126403809, "global_step": 222149, "epoch": 1322} {"train_loss": -11.788850784301758, "global_step": 222150, "epoch": 1322} {"train_loss": -11.800511360168457, "global_step": 222151, "epoch": 1322} {"train_loss": -11.835737228393555, "global_step": 222152, "epoch": 1322} {"train_loss": -11.777654647827148, "global_step": 222153, "epoch": 1322} {"train_loss": -11.962688446044922, "global_step": 222154, "epoch": 1322} {"train_loss": -11.982608795166016, "global_step": 222155, "epoch": 1322} {"train_loss": -12.06328296661377, "global_step": 222156, "epoch": 1322} {"train_loss": -12.00349235534668, "global_step": 222157, "epoch": 1322} {"train_loss": -12.026674270629883, "global_step": 222158, "epoch": 1322} {"train_loss": -12.019655227661133, "global_step": 222159, "epoch": 1322} {"train_loss": -11.873472213745117, "global_step": 222160, "epoch": 1322} {"train_loss": -11.995399475097656, "global_step": 222161, "epoch": 1322} {"train_loss": -12.006132125854492, "global_step": 222162, "epoch": 1322} {"train_loss": -12.115035057067871, "global_step": 222163, "epoch": 1322} {"train_loss": -11.744093894958496, "global_step": 222164, "epoch": 1322} {"train_loss": -11.960467338562012, "global_step": 222165, "epoch": 1322} {"train_loss": -11.860549926757812, "global_step": 222166, "epoch": 1322} {"train_loss": -11.73564338684082, "global_step": 222167, "epoch": 1322} {"train_loss": -11.509510040283203, "global_step": 222168, "epoch": 1322} {"train_loss": -12.234031677246094, "global_step": 222169, "epoch": 1322} {"train_loss": -11.771577835083008, "global_step": 222170, "epoch": 1322} {"train_loss": -12.11716079711914, "global_step": 222171, "epoch": 1322} {"train_loss": -12.01962661743164, "global_step": 222172, "epoch": 1322} {"train_loss": -11.761148452758789, "global_step": 222173, "epoch": 1322} {"train_loss": -11.447463989257812, "global_step": 222174, "epoch": 1322} {"train_loss": -12.146632194519043, "global_step": 222175, "epoch": 1322} {"train_loss": -11.799559593200684, "global_step": 222176, "epoch": 1322} {"train_loss": -11.473339080810547, "global_step": 222177, "epoch": 1322} {"train_loss": -11.062894821166992, "global_step": 222178, "epoch": 1322} {"train_loss": -11.744470596313477, "global_step": 222179, "epoch": 1322} {"train_loss": -11.635364532470703, "global_step": 222180, "epoch": 1322} {"train_loss": -11.741966247558594, "global_step": 222181, "epoch": 1322} {"train_loss": -11.642112731933594, "global_step": 222182, "epoch": 1322} {"train_loss": -11.805593490600586, "global_step": 222183, "epoch": 1322} {"train_loss": -11.60875415802002, "global_step": 222184, "epoch": 1322} {"train_loss": -11.87484359741211, "global_step": 222185, "epoch": 1322} {"train_loss": -11.91446590423584, "global_step": 222186, "epoch": 1322} {"train_loss": -11.59384536743164, "global_step": 222187, "epoch": 1322} {"train_loss": -11.917647361755371, "global_step": 222188, "epoch": 1322} {"train_loss": -11.666194915771484, "global_step": 222189, "epoch": 1322} {"train_loss": -11.652975082397461, "global_step": 222190, "epoch": 1322} {"train_loss": -11.860876083374023, "global_step": 222191, "epoch": 1322} {"train_loss": -11.81389045715332, "global_step": 222192, "epoch": 1322} {"train_loss": -11.788034439086914, "global_step": 222193, "epoch": 1322} {"train_loss": -11.679009437561035, "global_step": 222194, "epoch": 1322} {"train_loss": -11.856969833374023, "global_step": 222195, "epoch": 1322} {"train_loss": -11.422672271728516, "global_step": 222196, "epoch": 1322} {"train_loss": -11.317148208618164, "global_step": 222197, "epoch": 1322} {"train_loss": -11.1113920211792, "global_step": 222198, "epoch": 1322} {"train_loss": -11.278138160705566, "global_step": 222199, "epoch": 1322} {"train_loss": -11.73177433013916, "global_step": 222200, "epoch": 1322} {"train_loss": -11.10228443145752, "global_step": 222201, "epoch": 1322} {"train_loss": -11.555195808410645, "global_step": 222202, "epoch": 1322} {"train_loss": -10.72490119934082, "global_step": 222203, "epoch": 1322} {"train_loss": -11.611726760864258, "global_step": 222204, "epoch": 1322} {"train_loss": -11.22105598449707, "global_step": 222205, "epoch": 1322} {"train_loss": -11.237646102905273, "global_step": 222206, "epoch": 1322} {"train_loss": -10.957752227783203, "global_step": 222207, "epoch": 1322} {"train_loss": -10.992120742797852, "global_step": 222208, "epoch": 1322} {"train_loss": -9.717133522033691, "global_step": 222209, "epoch": 1322} {"train_loss": -10.545147895812988, "global_step": 222210, "epoch": 1322} {"train_loss": -9.895015716552734, "global_step": 222211, "epoch": 1322} {"train_loss": -8.83806324005127, "global_step": 222212, "epoch": 1322} {"train_loss": -9.354811668395996, "global_step": 222213, "epoch": 1322} {"train_loss": -10.804439544677734, "global_step": 222214, "epoch": 1322} {"train_loss": -10.05819034576416, "global_step": 222215, "epoch": 1322} {"train_loss": -9.218570709228516, "global_step": 222216, "epoch": 1322} {"train_loss": -9.19019889831543, "global_step": 222217, "epoch": 1322} {"train_loss": -10.899250984191895, "global_step": 222218, "epoch": 1322} {"train_loss": -10.051240921020508, "global_step": 222219, "epoch": 1322} {"train_loss": -10.981857299804688, "global_step": 222220, "epoch": 1322} {"train_loss": -10.501946449279785, "global_step": 222221, "epoch": 1322} {"train_loss": -10.056568145751953, "global_step": 222222, "epoch": 1322} {"train_loss": -11.081720352172852, "global_step": 222223, "epoch": 1322} {"train_loss": -10.51207160949707, "global_step": 222224, "epoch": 1322} {"train_loss": -11.731158256530762, "global_step": 222225, "epoch": 1322} {"train_loss": -10.489688873291016, "global_step": 222226, "epoch": 1322} {"train_loss": -11.057744979858398, "global_step": 222227, "epoch": 1322} {"train_loss": -10.86284351348877, "global_step": 222228, "epoch": 1322} {"train_loss": -11.489008903503418, "global_step": 222229, "epoch": 1322} {"train_loss": -11.17452621459961, "global_step": 222230, "epoch": 1322} {"train_loss": -11.366300582885742, "global_step": 222231, "epoch": 1322} {"train_loss": -11.015528678894043, "global_step": 222232, "epoch": 1322} {"train_loss": -11.037817001342773, "global_step": 222233, "epoch": 1322} {"train_loss": -10.783475875854492, "global_step": 222234, "epoch": 1322} {"train_loss": -10.866177558898926, "global_step": 222235, "epoch": 1322} {"train_loss": -10.6734619140625, "global_step": 222236, "epoch": 1322} {"train_loss": -10.722722053527832, "global_step": 222237, "epoch": 1322} {"train_loss": -10.877543449401855, "global_step": 222238, "epoch": 1322} {"train_loss": -10.308866500854492, "global_step": 222239, "epoch": 1322} {"train_loss": -11.140205383300781, "global_step": 222240, "epoch": 1322} {"train_loss": -10.964561462402344, "global_step": 222241, "epoch": 1322} {"train_loss": -11.29283332824707, "global_step": 222242, "epoch": 1322} {"train_loss": -10.771261215209961, "global_step": 222243, "epoch": 1322} {"train_loss": -11.040261268615723, "global_step": 222244, "epoch": 1322} {"train_loss": -10.932934761047363, "global_step": 222245, "epoch": 1322} {"train_loss": -11.130468368530273, "global_step": 222246, "epoch": 1322} {"train_loss": -11.459678649902344, "global_step": 222247, "epoch": 1322} {"train_loss": -11.02182388305664, "global_step": 222248, "epoch": 1322} {"train_loss": -11.176280975341797, "global_step": 222249, "epoch": 1322} {"train_loss": -11.310909271240234, "global_step": 222250, "epoch": 1322} {"train_loss": -11.226798057556152, "global_step": 222251, "epoch": 1322} {"train_loss": -11.17658519744873, "global_step": 222252, "epoch": 1322} {"train_loss": -11.71026611328125, "global_step": 222253, "epoch": 1322} {"train_loss": -11.3402099609375, "global_step": 222254, "epoch": 1322} {"train_loss": -11.59766674041748, "global_step": 222255, "epoch": 1322} {"train_loss": -11.148542404174805, "global_step": 222256, "epoch": 1322} {"train_loss": -11.390582084655762, "global_step": 222257, "epoch": 1322} {"train_loss": -11.373191833496094, "global_step": 222258, "epoch": 1322} {"train_loss": -11.627151489257812, "global_step": 222259, "epoch": 1322} {"train_loss": -11.413399696350098, "global_step": 222260, "epoch": 1322} {"train_loss": -11.685335159301758, "global_step": 222261, "epoch": 1322} {"train_loss": -11.243131637573242, "global_step": 222262, "epoch": 1322} {"train_loss": -11.317635235332308, "global_step": 222263, "epoch": 1322, "val_loss": 257533.078125} {"train_loss": -11.357651710510254, "global_step": 222264, "epoch": 1323} {"train_loss": -10.996996879577637, "global_step": 222265, "epoch": 1323} {"train_loss": -11.171615600585938, "global_step": 222266, "epoch": 1323} {"train_loss": -11.185516357421875, "global_step": 222267, "epoch": 1323} {"train_loss": -11.41172981262207, "global_step": 222268, "epoch": 1323} {"train_loss": -11.078688621520996, "global_step": 222269, "epoch": 1323} {"train_loss": -11.528615951538086, "global_step": 222270, "epoch": 1323} {"train_loss": -11.372453689575195, "global_step": 222271, "epoch": 1323} {"train_loss": -11.37918472290039, "global_step": 222272, "epoch": 1323} {"train_loss": -11.521536827087402, "global_step": 222273, "epoch": 1323} {"train_loss": -11.483468055725098, "global_step": 222274, "epoch": 1323} {"train_loss": -11.424235343933105, "global_step": 222275, "epoch": 1323} {"train_loss": -11.759072303771973, "global_step": 222276, "epoch": 1323} {"train_loss": -11.691826820373535, "global_step": 222277, "epoch": 1323} {"train_loss": -11.461042404174805, "global_step": 222278, "epoch": 1323} {"train_loss": -11.304698944091797, "global_step": 222279, "epoch": 1323} {"train_loss": -11.412435531616211, "global_step": 222280, "epoch": 1323} {"train_loss": -11.45967960357666, "global_step": 222281, "epoch": 1323} {"train_loss": -11.447443962097168, "global_step": 222282, "epoch": 1323} {"train_loss": -11.590263366699219, "global_step": 222283, "epoch": 1323} {"train_loss": -11.473373413085938, "global_step": 222284, "epoch": 1323} {"train_loss": -11.700178146362305, "global_step": 222285, "epoch": 1323} {"train_loss": -11.702445030212402, "global_step": 222286, "epoch": 1323} {"train_loss": -11.51927375793457, "global_step": 222287, "epoch": 1323} {"train_loss": -11.335163116455078, "global_step": 222288, "epoch": 1323} {"train_loss": -11.39607048034668, "global_step": 222289, "epoch": 1323} {"train_loss": -11.666601181030273, "global_step": 222290, "epoch": 1323} {"train_loss": -11.482647895812988, "global_step": 222291, "epoch": 1323} {"train_loss": -11.69620418548584, "global_step": 222292, "epoch": 1323} {"train_loss": -11.42643928527832, "global_step": 222293, "epoch": 1323} {"train_loss": -11.746381759643555, "global_step": 222294, "epoch": 1323} {"train_loss": -11.367642402648926, "global_step": 222295, "epoch": 1323} {"train_loss": -11.796035766601562, "global_step": 222296, "epoch": 1323} {"train_loss": -11.785589218139648, "global_step": 222297, "epoch": 1323} {"train_loss": -11.724870681762695, "global_step": 222298, "epoch": 1323} {"train_loss": -11.784228324890137, "global_step": 222299, "epoch": 1323} {"train_loss": -11.647021293640137, "global_step": 222300, "epoch": 1323} {"train_loss": -11.743672370910645, "global_step": 222301, "epoch": 1323} {"train_loss": -11.988009452819824, "global_step": 222302, "epoch": 1323} {"train_loss": -11.926345825195312, "global_step": 222303, "epoch": 1323} {"train_loss": -11.920730590820312, "global_step": 222304, "epoch": 1323} {"train_loss": -11.901335716247559, "global_step": 222305, "epoch": 1323} {"train_loss": -12.051508903503418, "global_step": 222306, "epoch": 1323} {"train_loss": -11.876338958740234, "global_step": 222307, "epoch": 1323} {"train_loss": -11.70265007019043, "global_step": 222308, "epoch": 1323} {"train_loss": -11.769510269165039, "global_step": 222309, "epoch": 1323} {"train_loss": -11.854623794555664, "global_step": 222310, "epoch": 1323} {"train_loss": -11.740084648132324, "global_step": 222311, "epoch": 1323} {"train_loss": -11.706554412841797, "global_step": 222312, "epoch": 1323} {"train_loss": -11.853782653808594, "global_step": 222313, "epoch": 1323} {"train_loss": -11.653257369995117, "global_step": 222314, "epoch": 1323} {"train_loss": -11.84455394744873, "global_step": 222315, "epoch": 1323} {"train_loss": -11.981276512145996, "global_step": 222316, "epoch": 1323} {"train_loss": -12.113195419311523, "global_step": 222317, "epoch": 1323} {"train_loss": -11.995460510253906, "global_step": 222318, "epoch": 1323} {"train_loss": -12.184774398803711, "global_step": 222319, "epoch": 1323} {"train_loss": -11.944798469543457, "global_step": 222320, "epoch": 1323} {"train_loss": -12.000080108642578, "global_step": 222321, "epoch": 1323} {"train_loss": -11.981961250305176, "global_step": 222322, "epoch": 1323} {"train_loss": -12.017566680908203, "global_step": 222323, "epoch": 1323} {"train_loss": -11.98049259185791, "global_step": 222324, "epoch": 1323} {"train_loss": -12.218351364135742, "global_step": 222325, "epoch": 1323} {"train_loss": -11.954115867614746, "global_step": 222326, "epoch": 1323} {"train_loss": -11.93970775604248, "global_step": 222327, "epoch": 1323} {"train_loss": -11.96438217163086, "global_step": 222328, "epoch": 1323} {"train_loss": -12.082538604736328, "global_step": 222329, "epoch": 1323} {"train_loss": -12.019695281982422, "global_step": 222330, "epoch": 1323} {"train_loss": -11.72032356262207, "global_step": 222331, "epoch": 1323} {"train_loss": -11.535820007324219, "global_step": 222332, "epoch": 1323} {"train_loss": -11.894840240478516, "global_step": 222333, "epoch": 1323} {"train_loss": -11.784638404846191, "global_step": 222334, "epoch": 1323} {"train_loss": -11.34760856628418, "global_step": 222335, "epoch": 1323} {"train_loss": -11.96516227722168, "global_step": 222336, "epoch": 1323} {"train_loss": -11.818063735961914, "global_step": 222337, "epoch": 1323} {"train_loss": -11.718794822692871, "global_step": 222338, "epoch": 1323} {"train_loss": -11.930822372436523, "global_step": 222339, "epoch": 1323} {"train_loss": -11.604427337646484, "global_step": 222340, "epoch": 1323} {"train_loss": -11.641066551208496, "global_step": 222341, "epoch": 1323} {"train_loss": -11.672174453735352, "global_step": 222342, "epoch": 1323} {"train_loss": -11.499543190002441, "global_step": 222343, "epoch": 1323} {"train_loss": -10.544851303100586, "global_step": 222344, "epoch": 1323} {"train_loss": -11.130577087402344, "global_step": 222345, "epoch": 1323} {"train_loss": -11.802854537963867, "global_step": 222346, "epoch": 1323} {"train_loss": -10.324257850646973, "global_step": 222347, "epoch": 1323} {"train_loss": -10.747302055358887, "global_step": 222348, "epoch": 1323} {"train_loss": -11.33184814453125, "global_step": 222349, "epoch": 1323} {"train_loss": -8.5589599609375, "global_step": 222350, "epoch": 1323} {"train_loss": -9.682310104370117, "global_step": 222351, "epoch": 1323} {"train_loss": -11.097978591918945, "global_step": 222352, "epoch": 1323} {"train_loss": -9.795063972473145, "global_step": 222353, "epoch": 1323} {"train_loss": -11.581428527832031, "global_step": 222354, "epoch": 1323} {"train_loss": -9.983428955078125, "global_step": 222355, "epoch": 1323} {"train_loss": -10.640213966369629, "global_step": 222356, "epoch": 1323} {"train_loss": -11.168700218200684, "global_step": 222357, "epoch": 1323} {"train_loss": -10.525758743286133, "global_step": 222358, "epoch": 1323} {"train_loss": -11.074615478515625, "global_step": 222359, "epoch": 1323} {"train_loss": -10.99471378326416, "global_step": 222360, "epoch": 1323} {"train_loss": -11.12979507446289, "global_step": 222361, "epoch": 1323} {"train_loss": -10.985187530517578, "global_step": 222362, "epoch": 1323} {"train_loss": -9.956000328063965, "global_step": 222363, "epoch": 1323} {"train_loss": -10.72895622253418, "global_step": 222364, "epoch": 1323} {"train_loss": -10.105327606201172, "global_step": 222365, "epoch": 1323} {"train_loss": -9.788224220275879, "global_step": 222366, "epoch": 1323} {"train_loss": -10.827472686767578, "global_step": 222367, "epoch": 1323} {"train_loss": -10.547176361083984, "global_step": 222368, "epoch": 1323} {"train_loss": -10.805156707763672, "global_step": 222369, "epoch": 1323} {"train_loss": -10.469093322753906, "global_step": 222370, "epoch": 1323} {"train_loss": -9.979362487792969, "global_step": 222371, "epoch": 1323} {"train_loss": -10.910170555114746, "global_step": 222372, "epoch": 1323} {"train_loss": -10.44011116027832, "global_step": 222373, "epoch": 1323} {"train_loss": -10.89607048034668, "global_step": 222374, "epoch": 1323} {"train_loss": -10.724246978759766, "global_step": 222375, "epoch": 1323} {"train_loss": -11.144830703735352, "global_step": 222376, "epoch": 1323} {"train_loss": -10.821207046508789, "global_step": 222377, "epoch": 1323} {"train_loss": -10.779605865478516, "global_step": 222378, "epoch": 1323} {"train_loss": -10.807962417602539, "global_step": 222379, "epoch": 1323} {"train_loss": -10.353525161743164, "global_step": 222380, "epoch": 1323} {"train_loss": -11.16236400604248, "global_step": 222381, "epoch": 1323} {"train_loss": -10.402986526489258, "global_step": 222382, "epoch": 1323} {"train_loss": -10.657979965209961, "global_step": 222383, "epoch": 1323} {"train_loss": -10.687664985656738, "global_step": 222384, "epoch": 1323} {"train_loss": -10.287571907043457, "global_step": 222385, "epoch": 1323} {"train_loss": -10.906155586242676, "global_step": 222386, "epoch": 1323} {"train_loss": -10.28564453125, "global_step": 222387, "epoch": 1323} {"train_loss": -10.7786865234375, "global_step": 222388, "epoch": 1323} {"train_loss": -10.582188606262207, "global_step": 222389, "epoch": 1323} {"train_loss": -10.283452987670898, "global_step": 222390, "epoch": 1323} {"train_loss": -11.063328742980957, "global_step": 222391, "epoch": 1323} {"train_loss": -10.34847354888916, "global_step": 222392, "epoch": 1323} {"train_loss": -11.409053802490234, "global_step": 222393, "epoch": 1323} {"train_loss": -11.052633285522461, "global_step": 222394, "epoch": 1323} {"train_loss": -11.052328109741211, "global_step": 222395, "epoch": 1323} {"train_loss": -11.149089813232422, "global_step": 222396, "epoch": 1323} {"train_loss": -11.170040130615234, "global_step": 222397, "epoch": 1323} {"train_loss": -10.958786010742188, "global_step": 222398, "epoch": 1323} {"train_loss": -11.292789459228516, "global_step": 222399, "epoch": 1323} {"train_loss": -11.266233444213867, "global_step": 222400, "epoch": 1323} {"train_loss": -11.49806022644043, "global_step": 222401, "epoch": 1323} {"train_loss": -11.226715087890625, "global_step": 222402, "epoch": 1323} {"train_loss": -11.406330108642578, "global_step": 222403, "epoch": 1323} {"train_loss": -11.580535888671875, "global_step": 222404, "epoch": 1323} {"train_loss": -11.355806350708008, "global_step": 222405, "epoch": 1323} {"train_loss": -11.324787139892578, "global_step": 222406, "epoch": 1323} {"train_loss": -11.685165405273438, "global_step": 222407, "epoch": 1323} {"train_loss": -11.536697387695312, "global_step": 222408, "epoch": 1323} {"train_loss": -11.500889778137207, "global_step": 222409, "epoch": 1323} {"train_loss": -11.458427429199219, "global_step": 222410, "epoch": 1323} {"train_loss": -11.650918006896973, "global_step": 222411, "epoch": 1323} {"train_loss": -11.588910102844238, "global_step": 222412, "epoch": 1323} {"train_loss": -11.482076644897461, "global_step": 222413, "epoch": 1323} {"train_loss": -11.60112190246582, "global_step": 222414, "epoch": 1323} {"train_loss": -11.537426948547363, "global_step": 222415, "epoch": 1323} {"train_loss": -11.39871597290039, "global_step": 222416, "epoch": 1323} {"train_loss": -11.852468490600586, "global_step": 222417, "epoch": 1323} {"train_loss": -11.464122772216797, "global_step": 222418, "epoch": 1323} {"train_loss": -11.68655776977539, "global_step": 222419, "epoch": 1323} {"train_loss": -11.625712394714355, "global_step": 222420, "epoch": 1323} {"train_loss": -11.68735408782959, "global_step": 222421, "epoch": 1323} {"train_loss": -11.727485656738281, "global_step": 222422, "epoch": 1323} {"train_loss": -11.71692180633545, "global_step": 222423, "epoch": 1323} {"train_loss": -11.389881134033203, "global_step": 222424, "epoch": 1323} {"train_loss": -11.844367980957031, "global_step": 222425, "epoch": 1323} {"train_loss": -11.513792037963867, "global_step": 222426, "epoch": 1323} {"train_loss": -11.702681541442871, "global_step": 222427, "epoch": 1323} {"train_loss": -11.67631721496582, "global_step": 222428, "epoch": 1323} {"train_loss": -11.6959228515625, "global_step": 222429, "epoch": 1323} {"train_loss": -11.731207847595215, "global_step": 222430, "epoch": 1323} {"train_loss": -11.333585103352865, "global_step": 222431, "epoch": 1323, "val_loss": 259082.828125} {"train_loss": -11.820808410644531, "global_step": 222432, "epoch": 1324} {"train_loss": -11.785351753234863, "global_step": 222433, "epoch": 1324} {"train_loss": -11.655950546264648, "global_step": 222434, "epoch": 1324} {"train_loss": -11.688119888305664, "global_step": 222435, "epoch": 1324} {"train_loss": -11.589848518371582, "global_step": 222436, "epoch": 1324} {"train_loss": -11.980883598327637, "global_step": 222437, "epoch": 1324} {"train_loss": -11.545245170593262, "global_step": 222438, "epoch": 1324} {"train_loss": -11.874486923217773, "global_step": 222439, "epoch": 1324} {"train_loss": -11.601789474487305, "global_step": 222440, "epoch": 1324} {"train_loss": -11.857606887817383, "global_step": 222441, "epoch": 1324} {"train_loss": -11.749531745910645, "global_step": 222442, "epoch": 1324} {"train_loss": -11.644502639770508, "global_step": 222443, "epoch": 1324} {"train_loss": -11.791577339172363, "global_step": 222444, "epoch": 1324} {"train_loss": -11.707154273986816, "global_step": 222445, "epoch": 1324} {"train_loss": -11.685043334960938, "global_step": 222446, "epoch": 1324} {"train_loss": -11.893294334411621, "global_step": 222447, "epoch": 1324} {"train_loss": -11.725192070007324, "global_step": 222448, "epoch": 1324} {"train_loss": -11.711729049682617, "global_step": 222449, "epoch": 1324} {"train_loss": -11.796135902404785, "global_step": 222450, "epoch": 1324} {"train_loss": -11.187858581542969, "global_step": 222451, "epoch": 1324} {"train_loss": -11.904752731323242, "global_step": 222452, "epoch": 1324} {"train_loss": -11.568416595458984, "global_step": 222453, "epoch": 1324} {"train_loss": -11.543938636779785, "global_step": 222454, "epoch": 1324} {"train_loss": -11.947153091430664, "global_step": 222455, "epoch": 1324} {"train_loss": -11.326313018798828, "global_step": 222456, "epoch": 1324} {"train_loss": -10.070314407348633, "global_step": 222457, "epoch": 1324} {"train_loss": -11.456446647644043, "global_step": 222458, "epoch": 1324} {"train_loss": -11.27894401550293, "global_step": 222459, "epoch": 1324} {"train_loss": -10.683133125305176, "global_step": 222460, "epoch": 1324} {"train_loss": -11.98459243774414, "global_step": 222461, "epoch": 1324} {"train_loss": -11.088794708251953, "global_step": 222462, "epoch": 1324} {"train_loss": -11.281390190124512, "global_step": 222463, "epoch": 1324} {"train_loss": -11.693754196166992, "global_step": 222464, "epoch": 1324} {"train_loss": -11.1048002243042, "global_step": 222465, "epoch": 1324} {"train_loss": -11.880399703979492, "global_step": 222466, "epoch": 1324} {"train_loss": -11.728269577026367, "global_step": 222467, "epoch": 1324} {"train_loss": -11.925288200378418, "global_step": 222468, "epoch": 1324} {"train_loss": -11.495079040527344, "global_step": 222469, "epoch": 1324} {"train_loss": -11.588727951049805, "global_step": 222470, "epoch": 1324} {"train_loss": -11.486570358276367, "global_step": 222471, "epoch": 1324} {"train_loss": -10.768736839294434, "global_step": 222472, "epoch": 1324} {"train_loss": -11.511938095092773, "global_step": 222473, "epoch": 1324} {"train_loss": -10.608267784118652, "global_step": 222474, "epoch": 1324} {"train_loss": -11.448698997497559, "global_step": 222475, "epoch": 1324} {"train_loss": -11.266316413879395, "global_step": 222476, "epoch": 1324} {"train_loss": -11.081487655639648, "global_step": 222477, "epoch": 1324} {"train_loss": -11.710399627685547, "global_step": 222478, "epoch": 1324} {"train_loss": -11.12686538696289, "global_step": 222479, "epoch": 1324} {"train_loss": -11.301992416381836, "global_step": 222480, "epoch": 1324} {"train_loss": -11.366584777832031, "global_step": 222481, "epoch": 1324} {"train_loss": -10.962390899658203, "global_step": 222482, "epoch": 1324} {"train_loss": -11.474212646484375, "global_step": 222483, "epoch": 1324} {"train_loss": -10.907727241516113, "global_step": 222484, "epoch": 1324} {"train_loss": -11.023767471313477, "global_step": 222485, "epoch": 1324} {"train_loss": -10.8018798828125, "global_step": 222486, "epoch": 1324} {"train_loss": -10.966522216796875, "global_step": 222487, "epoch": 1324} {"train_loss": -10.889820098876953, "global_step": 222488, "epoch": 1324} {"train_loss": -9.789223670959473, "global_step": 222489, "epoch": 1324} {"train_loss": -11.174561500549316, "global_step": 222490, "epoch": 1324} {"train_loss": -10.06614875793457, "global_step": 222491, "epoch": 1324} {"train_loss": -11.027961730957031, "global_step": 222492, "epoch": 1324} {"train_loss": -10.539271354675293, "global_step": 222493, "epoch": 1324} {"train_loss": -10.559305191040039, "global_step": 222494, "epoch": 1324} {"train_loss": -10.413604736328125, "global_step": 222495, "epoch": 1324} {"train_loss": -11.269380569458008, "global_step": 222496, "epoch": 1324} {"train_loss": -10.856789588928223, "global_step": 222497, "epoch": 1324} {"train_loss": -10.743080139160156, "global_step": 222498, "epoch": 1324} {"train_loss": -11.331506729125977, "global_step": 222499, "epoch": 1324} {"train_loss": -11.16206169128418, "global_step": 222500, "epoch": 1324} {"train_loss": -11.269631385803223, "global_step": 222501, "epoch": 1324} {"train_loss": -11.312288284301758, "global_step": 222502, "epoch": 1324} {"train_loss": -11.442146301269531, "global_step": 222503, "epoch": 1324} {"train_loss": -11.132667541503906, "global_step": 222504, "epoch": 1324} {"train_loss": -11.342876434326172, "global_step": 222505, "epoch": 1324} {"train_loss": -11.017587661743164, "global_step": 222506, "epoch": 1324} {"train_loss": -11.535982131958008, "global_step": 222507, "epoch": 1324} {"train_loss": -10.347089767456055, "global_step": 222508, "epoch": 1324} {"train_loss": -11.359180450439453, "global_step": 222509, "epoch": 1324} {"train_loss": -10.538025856018066, "global_step": 222510, "epoch": 1324} {"train_loss": -11.325504302978516, "global_step": 222511, "epoch": 1324} {"train_loss": -10.768657684326172, "global_step": 222512, "epoch": 1324} {"train_loss": -11.280293464660645, "global_step": 222513, "epoch": 1324} {"train_loss": -11.267178535461426, "global_step": 222514, "epoch": 1324} {"train_loss": -11.46358871459961, "global_step": 222515, "epoch": 1324} {"train_loss": -11.110428810119629, "global_step": 222516, "epoch": 1324} {"train_loss": -11.290193557739258, "global_step": 222517, "epoch": 1324} {"train_loss": -11.262025833129883, "global_step": 222518, "epoch": 1324} {"train_loss": -11.251935958862305, "global_step": 222519, "epoch": 1324} {"train_loss": -11.523052215576172, "global_step": 222520, "epoch": 1324} {"train_loss": -10.799001693725586, "global_step": 222521, "epoch": 1324} {"train_loss": -11.371246337890625, "global_step": 222522, "epoch": 1324} {"train_loss": -11.106371879577637, "global_step": 222523, "epoch": 1324} {"train_loss": -11.468804359436035, "global_step": 222524, "epoch": 1324} {"train_loss": -10.907886505126953, "global_step": 222525, "epoch": 1324} {"train_loss": -11.641307830810547, "global_step": 222526, "epoch": 1324} {"train_loss": -11.15438461303711, "global_step": 222527, "epoch": 1324} {"train_loss": -11.469181060791016, "global_step": 222528, "epoch": 1324} {"train_loss": -11.426259994506836, "global_step": 222529, "epoch": 1324} {"train_loss": -11.703385353088379, "global_step": 222530, "epoch": 1324} {"train_loss": -11.622871398925781, "global_step": 222531, "epoch": 1324} {"train_loss": -11.691610336303711, "global_step": 222532, "epoch": 1324} {"train_loss": -11.68031120300293, "global_step": 222533, "epoch": 1324} {"train_loss": -11.54006576538086, "global_step": 222534, "epoch": 1324} {"train_loss": -11.752235412597656, "global_step": 222535, "epoch": 1324} {"train_loss": -11.624267578125, "global_step": 222536, "epoch": 1324} {"train_loss": -11.972267150878906, "global_step": 222537, "epoch": 1324} {"train_loss": -11.546821594238281, "global_step": 222538, "epoch": 1324} {"train_loss": -11.83757495880127, "global_step": 222539, "epoch": 1324} {"train_loss": -11.689672470092773, "global_step": 222540, "epoch": 1324} {"train_loss": -11.896602630615234, "global_step": 222541, "epoch": 1324} {"train_loss": -11.853134155273438, "global_step": 222542, "epoch": 1324} {"train_loss": -11.920795440673828, "global_step": 222543, "epoch": 1324} {"train_loss": -11.842286109924316, "global_step": 222544, "epoch": 1324} {"train_loss": -11.85090160369873, "global_step": 222545, "epoch": 1324} {"train_loss": -11.704322814941406, "global_step": 222546, "epoch": 1324} {"train_loss": -11.806482315063477, "global_step": 222547, "epoch": 1324} {"train_loss": -11.79349136352539, "global_step": 222548, "epoch": 1324} {"train_loss": -11.867841720581055, "global_step": 222549, "epoch": 1324} {"train_loss": -11.811423301696777, "global_step": 222550, "epoch": 1324} {"train_loss": -11.905014038085938, "global_step": 222551, "epoch": 1324} {"train_loss": -12.027891159057617, "global_step": 222552, "epoch": 1324} {"train_loss": -12.05355167388916, "global_step": 222553, "epoch": 1324} {"train_loss": -11.917900085449219, "global_step": 222554, "epoch": 1324} {"train_loss": -11.8008394241333, "global_step": 222555, "epoch": 1324} {"train_loss": -12.12980842590332, "global_step": 222556, "epoch": 1324} {"train_loss": -12.022721290588379, "global_step": 222557, "epoch": 1324} {"train_loss": -12.134515762329102, "global_step": 222558, "epoch": 1324} {"train_loss": -11.999945640563965, "global_step": 222559, "epoch": 1324} {"train_loss": -11.874670028686523, "global_step": 222560, "epoch": 1324} {"train_loss": -11.762803077697754, "global_step": 222561, "epoch": 1324} {"train_loss": -11.875802040100098, "global_step": 222562, "epoch": 1324} {"train_loss": -11.882522583007812, "global_step": 222563, "epoch": 1324} {"train_loss": -12.169700622558594, "global_step": 222564, "epoch": 1324} {"train_loss": -11.681557655334473, "global_step": 222565, "epoch": 1324} {"train_loss": -11.814047813415527, "global_step": 222566, "epoch": 1324} {"train_loss": -11.944467544555664, "global_step": 222567, "epoch": 1324} {"train_loss": -11.785530090332031, "global_step": 222568, "epoch": 1324} {"train_loss": -11.525755882263184, "global_step": 222569, "epoch": 1324} {"train_loss": -11.7081298828125, "global_step": 222570, "epoch": 1324} {"train_loss": -11.610156059265137, "global_step": 222571, "epoch": 1324} {"train_loss": -11.666034698486328, "global_step": 222572, "epoch": 1324} {"train_loss": -11.494827270507812, "global_step": 222573, "epoch": 1324} {"train_loss": -11.788792610168457, "global_step": 222574, "epoch": 1324} {"train_loss": -11.92108154296875, "global_step": 222575, "epoch": 1324} {"train_loss": -11.385534286499023, "global_step": 222576, "epoch": 1324} {"train_loss": -12.198661804199219, "global_step": 222577, "epoch": 1324} {"train_loss": -11.826186180114746, "global_step": 222578, "epoch": 1324} {"train_loss": -11.827571868896484, "global_step": 222579, "epoch": 1324} {"train_loss": -11.397876739501953, "global_step": 222580, "epoch": 1324} {"train_loss": -11.924356460571289, "global_step": 222581, "epoch": 1324} {"train_loss": -11.676614761352539, "global_step": 222582, "epoch": 1324} {"train_loss": -11.798578262329102, "global_step": 222583, "epoch": 1324} {"train_loss": -11.875137329101562, "global_step": 222584, "epoch": 1324} {"train_loss": -11.733858108520508, "global_step": 222585, "epoch": 1324} {"train_loss": -11.79313850402832, "global_step": 222586, "epoch": 1324} {"train_loss": -12.063480377197266, "global_step": 222587, "epoch": 1324} {"train_loss": -11.762328147888184, "global_step": 222588, "epoch": 1324} {"train_loss": -11.709674835205078, "global_step": 222589, "epoch": 1324} {"train_loss": -10.7947416305542, "global_step": 222590, "epoch": 1324} {"train_loss": -11.33279800415039, "global_step": 222591, "epoch": 1324} {"train_loss": -11.045279502868652, "global_step": 222592, "epoch": 1324} {"train_loss": -11.757406234741211, "global_step": 222593, "epoch": 1324} {"train_loss": -9.794929504394531, "global_step": 222594, "epoch": 1324} {"train_loss": -9.659463882446289, "global_step": 222595, "epoch": 1324} {"train_loss": -9.993892669677734, "global_step": 222596, "epoch": 1324} {"train_loss": -11.379589080810547, "global_step": 222597, "epoch": 1324} {"train_loss": -9.367157936096191, "global_step": 222598, "epoch": 1324} {"train_loss": -11.43400808175405, "global_step": 222599, "epoch": 1324, "val_loss": 260716.359375} {"train_loss": -10.306547164916992, "global_step": 222600, "epoch": 1325} {"train_loss": -10.484636306762695, "global_step": 222601, "epoch": 1325} {"train_loss": -10.895912170410156, "global_step": 222602, "epoch": 1325} {"train_loss": -10.114681243896484, "global_step": 222603, "epoch": 1325} {"train_loss": -11.010026931762695, "global_step": 222604, "epoch": 1325} {"train_loss": -9.69926643371582, "global_step": 222605, "epoch": 1325} {"train_loss": -10.410459518432617, "global_step": 222606, "epoch": 1325} {"train_loss": -11.296651840209961, "global_step": 222607, "epoch": 1325} {"train_loss": -10.56760025024414, "global_step": 222608, "epoch": 1325} {"train_loss": -11.443958282470703, "global_step": 222609, "epoch": 1325} {"train_loss": -10.882776260375977, "global_step": 222610, "epoch": 1325} {"train_loss": -11.318717002868652, "global_step": 222611, "epoch": 1325} {"train_loss": -11.301547050476074, "global_step": 222612, "epoch": 1325} {"train_loss": -11.235201835632324, "global_step": 222613, "epoch": 1325} {"train_loss": -11.381044387817383, "global_step": 222614, "epoch": 1325} {"train_loss": -11.617887496948242, "global_step": 222615, "epoch": 1325} {"train_loss": -11.356401443481445, "global_step": 222616, "epoch": 1325} {"train_loss": -11.536052703857422, "global_step": 222617, "epoch": 1325} {"train_loss": -11.510924339294434, "global_step": 222618, "epoch": 1325} {"train_loss": -11.459939956665039, "global_step": 222619, "epoch": 1325} {"train_loss": -11.495807647705078, "global_step": 222620, "epoch": 1325} {"train_loss": -11.582500457763672, "global_step": 222621, "epoch": 1325} {"train_loss": -11.454453468322754, "global_step": 222622, "epoch": 1325} {"train_loss": -11.586819648742676, "global_step": 222623, "epoch": 1325} {"train_loss": -11.4843111038208, "global_step": 222624, "epoch": 1325} {"train_loss": -11.690061569213867, "global_step": 222625, "epoch": 1325} {"train_loss": -11.715692520141602, "global_step": 222626, "epoch": 1325} {"train_loss": -11.523138999938965, "global_step": 222627, "epoch": 1325} {"train_loss": -11.750543594360352, "global_step": 222628, "epoch": 1325} {"train_loss": -11.406059265136719, "global_step": 222629, "epoch": 1325} {"train_loss": -11.89829158782959, "global_step": 222630, "epoch": 1325} {"train_loss": -11.521535873413086, "global_step": 222631, "epoch": 1325} {"train_loss": -11.969704627990723, "global_step": 222632, "epoch": 1325} {"train_loss": -11.68130111694336, "global_step": 222633, "epoch": 1325} {"train_loss": -11.811727523803711, "global_step": 222634, "epoch": 1325} {"train_loss": -11.809341430664062, "global_step": 222635, "epoch": 1325} {"train_loss": -11.774154663085938, "global_step": 222636, "epoch": 1325} {"train_loss": -11.678656578063965, "global_step": 222637, "epoch": 1325} {"train_loss": -11.658284187316895, "global_step": 222638, "epoch": 1325} {"train_loss": -11.594720840454102, "global_step": 222639, "epoch": 1325} {"train_loss": -11.758590698242188, "global_step": 222640, "epoch": 1325} {"train_loss": -11.820932388305664, "global_step": 222641, "epoch": 1325} {"train_loss": -11.713536262512207, "global_step": 222642, "epoch": 1325} {"train_loss": -11.708307266235352, "global_step": 222643, "epoch": 1325} {"train_loss": -11.36964225769043, "global_step": 222644, "epoch": 1325} {"train_loss": -11.935673713684082, "global_step": 222645, "epoch": 1325} {"train_loss": -11.267330169677734, "global_step": 222646, "epoch": 1325} {"train_loss": -11.702897071838379, "global_step": 222647, "epoch": 1325} {"train_loss": -11.453813552856445, "global_step": 222648, "epoch": 1325} {"train_loss": -11.491434097290039, "global_step": 222649, "epoch": 1325} {"train_loss": -11.654121398925781, "global_step": 222650, "epoch": 1325} {"train_loss": -11.63753604888916, "global_step": 222651, "epoch": 1325} {"train_loss": -12.11007022857666, "global_step": 222652, "epoch": 1325} {"train_loss": -11.476032257080078, "global_step": 222653, "epoch": 1325} {"train_loss": -11.723161697387695, "global_step": 222654, "epoch": 1325} {"train_loss": -11.858476638793945, "global_step": 222655, "epoch": 1325} {"train_loss": -11.902177810668945, "global_step": 222656, "epoch": 1325} {"train_loss": -11.924072265625, "global_step": 222657, "epoch": 1325} {"train_loss": -11.642118453979492, "global_step": 222658, "epoch": 1325} {"train_loss": -11.686380386352539, "global_step": 222659, "epoch": 1325} {"train_loss": -11.825315475463867, "global_step": 222660, "epoch": 1325} {"train_loss": -11.118017196655273, "global_step": 222661, "epoch": 1325} {"train_loss": -11.989251136779785, "global_step": 222662, "epoch": 1325} {"train_loss": -11.414519309997559, "global_step": 222663, "epoch": 1325} {"train_loss": -11.555805206298828, "global_step": 222664, "epoch": 1325} {"train_loss": -11.718253135681152, "global_step": 222665, "epoch": 1325} {"train_loss": -11.730985641479492, "global_step": 222666, "epoch": 1325} {"train_loss": -11.326743125915527, "global_step": 222667, "epoch": 1325} {"train_loss": -11.695929527282715, "global_step": 222668, "epoch": 1325} {"train_loss": -11.537784576416016, "global_step": 222669, "epoch": 1325} {"train_loss": -11.647408485412598, "global_step": 222670, "epoch": 1325} {"train_loss": -11.491743087768555, "global_step": 222671, "epoch": 1325} {"train_loss": -11.63218879699707, "global_step": 222672, "epoch": 1325} {"train_loss": -11.463298797607422, "global_step": 222673, "epoch": 1325} {"train_loss": -11.213109970092773, "global_step": 222674, "epoch": 1325} {"train_loss": -11.874932289123535, "global_step": 222675, "epoch": 1325} {"train_loss": -12.027749061584473, "global_step": 222676, "epoch": 1325} {"train_loss": -11.67780876159668, "global_step": 222677, "epoch": 1325} {"train_loss": -11.909140586853027, "global_step": 222678, "epoch": 1325} {"train_loss": -11.849111557006836, "global_step": 222679, "epoch": 1325} {"train_loss": -12.130836486816406, "global_step": 222680, "epoch": 1325} {"train_loss": -11.75006103515625, "global_step": 222681, "epoch": 1325} {"train_loss": -11.97348403930664, "global_step": 222682, "epoch": 1325} {"train_loss": -11.953006744384766, "global_step": 222683, "epoch": 1325} {"train_loss": -12.053132057189941, "global_step": 222684, "epoch": 1325} {"train_loss": -11.504161834716797, "global_step": 222685, "epoch": 1325} {"train_loss": -11.636877059936523, "global_step": 222686, "epoch": 1325} {"train_loss": -11.903507232666016, "global_step": 222687, "epoch": 1325} {"train_loss": -11.392528533935547, "global_step": 222688, "epoch": 1325} {"train_loss": -11.327043533325195, "global_step": 222689, "epoch": 1325} {"train_loss": -12.006308555603027, "global_step": 222690, "epoch": 1325} {"train_loss": -11.621883392333984, "global_step": 222691, "epoch": 1325} {"train_loss": -11.012836456298828, "global_step": 222692, "epoch": 1325} {"train_loss": -11.369239807128906, "global_step": 222693, "epoch": 1325} {"train_loss": -11.411375999450684, "global_step": 222694, "epoch": 1325} {"train_loss": -10.79680061340332, "global_step": 222695, "epoch": 1325} {"train_loss": -11.277541160583496, "global_step": 222696, "epoch": 1325} {"train_loss": -11.63351821899414, "global_step": 222697, "epoch": 1325} {"train_loss": -10.626946449279785, "global_step": 222698, "epoch": 1325} {"train_loss": -11.6181640625, "global_step": 222699, "epoch": 1325} {"train_loss": -11.629793167114258, "global_step": 222700, "epoch": 1325} {"train_loss": -11.010406494140625, "global_step": 222701, "epoch": 1325} {"train_loss": -11.663862228393555, "global_step": 222702, "epoch": 1325} {"train_loss": -11.702237129211426, "global_step": 222703, "epoch": 1325} {"train_loss": -11.303272247314453, "global_step": 222704, "epoch": 1325} {"train_loss": -11.43079662322998, "global_step": 222705, "epoch": 1325} {"train_loss": -11.283638000488281, "global_step": 222706, "epoch": 1325} {"train_loss": -11.149182319641113, "global_step": 222707, "epoch": 1325} {"train_loss": -11.216796875, "global_step": 222708, "epoch": 1325} {"train_loss": -10.994145393371582, "global_step": 222709, "epoch": 1325} {"train_loss": -11.367538452148438, "global_step": 222710, "epoch": 1325} {"train_loss": -10.82686996459961, "global_step": 222711, "epoch": 1325} {"train_loss": -10.639198303222656, "global_step": 222712, "epoch": 1325} {"train_loss": -11.182892799377441, "global_step": 222713, "epoch": 1325} {"train_loss": -10.204696655273438, "global_step": 222714, "epoch": 1325} {"train_loss": -11.458271026611328, "global_step": 222715, "epoch": 1325} {"train_loss": -10.770593643188477, "global_step": 222716, "epoch": 1325} {"train_loss": -10.945290565490723, "global_step": 222717, "epoch": 1325} {"train_loss": -11.483564376831055, "global_step": 222718, "epoch": 1325} {"train_loss": -10.987764358520508, "global_step": 222719, "epoch": 1325} {"train_loss": -11.558225631713867, "global_step": 222720, "epoch": 1325} {"train_loss": -11.566276550292969, "global_step": 222721, "epoch": 1325} {"train_loss": -11.459856033325195, "global_step": 222722, "epoch": 1325} {"train_loss": -11.772621154785156, "global_step": 222723, "epoch": 1325} {"train_loss": -11.261260986328125, "global_step": 222724, "epoch": 1325} {"train_loss": -11.692367553710938, "global_step": 222725, "epoch": 1325} {"train_loss": -11.389248847961426, "global_step": 222726, "epoch": 1325} {"train_loss": -11.499059677124023, "global_step": 222727, "epoch": 1325} {"train_loss": -11.867532730102539, "global_step": 222728, "epoch": 1325} {"train_loss": -11.159135818481445, "global_step": 222729, "epoch": 1325} {"train_loss": -11.600456237792969, "global_step": 222730, "epoch": 1325} {"train_loss": -11.416200637817383, "global_step": 222731, "epoch": 1325} {"train_loss": -11.510452270507812, "global_step": 222732, "epoch": 1325} {"train_loss": -11.474851608276367, "global_step": 222733, "epoch": 1325} {"train_loss": -11.295587539672852, "global_step": 222734, "epoch": 1325} {"train_loss": -11.06789779663086, "global_step": 222735, "epoch": 1325} {"train_loss": -11.521883964538574, "global_step": 222736, "epoch": 1325} {"train_loss": -11.167230606079102, "global_step": 222737, "epoch": 1325} {"train_loss": -11.913905143737793, "global_step": 222738, "epoch": 1325} {"train_loss": -10.836808204650879, "global_step": 222739, "epoch": 1325} {"train_loss": -12.009931564331055, "global_step": 222740, "epoch": 1325} {"train_loss": -11.441934585571289, "global_step": 222741, "epoch": 1325} {"train_loss": -11.269478797912598, "global_step": 222742, "epoch": 1325} {"train_loss": -11.085532188415527, "global_step": 222743, "epoch": 1325} {"train_loss": -11.513605117797852, "global_step": 222744, "epoch": 1325} {"train_loss": -11.384256362915039, "global_step": 222745, "epoch": 1325} {"train_loss": -11.139656066894531, "global_step": 222746, "epoch": 1325} {"train_loss": -11.426745414733887, "global_step": 222747, "epoch": 1325} {"train_loss": -11.495588302612305, "global_step": 222748, "epoch": 1325} {"train_loss": -11.812131881713867, "global_step": 222749, "epoch": 1325} {"train_loss": -11.503447532653809, "global_step": 222750, "epoch": 1325} {"train_loss": -11.523033142089844, "global_step": 222751, "epoch": 1325} {"train_loss": -11.666641235351562, "global_step": 222752, "epoch": 1325} {"train_loss": -11.81216812133789, "global_step": 222753, "epoch": 1325} {"train_loss": -11.406044006347656, "global_step": 222754, "epoch": 1325} {"train_loss": -11.500887870788574, "global_step": 222755, "epoch": 1325} {"train_loss": -11.858024597167969, "global_step": 222756, "epoch": 1325} {"train_loss": -11.461856842041016, "global_step": 222757, "epoch": 1325} {"train_loss": -11.89272689819336, "global_step": 222758, "epoch": 1325} {"train_loss": -11.657655715942383, "global_step": 222759, "epoch": 1325} {"train_loss": -11.435388565063477, "global_step": 222760, "epoch": 1325} {"train_loss": -10.940322875976562, "global_step": 222761, "epoch": 1325} {"train_loss": -11.607791900634766, "global_step": 222762, "epoch": 1325} {"train_loss": -11.12601089477539, "global_step": 222763, "epoch": 1325} {"train_loss": -11.48017692565918, "global_step": 222764, "epoch": 1325} {"train_loss": -10.698067665100098, "global_step": 222765, "epoch": 1325} {"train_loss": -11.443902969360352, "global_step": 222766, "epoch": 1325} {"train_loss": -11.450281682468596, "global_step": 222767, "epoch": 1325, "val_loss": 260148.59375, "train_action_mse_error": 3.590200185775757} {"train_loss": -11.472702026367188, "global_step": 222768, "epoch": 1326} {"train_loss": -11.019925117492676, "global_step": 222769, "epoch": 1326} {"train_loss": -11.556976318359375, "global_step": 222770, "epoch": 1326} {"train_loss": -11.191658973693848, "global_step": 222771, "epoch": 1326} {"train_loss": -11.613231658935547, "global_step": 222772, "epoch": 1326} {"train_loss": -11.164161682128906, "global_step": 222773, "epoch": 1326} {"train_loss": -11.715781211853027, "global_step": 222774, "epoch": 1326} {"train_loss": -11.474870681762695, "global_step": 222775, "epoch": 1326} {"train_loss": -11.779985427856445, "global_step": 222776, "epoch": 1326} {"train_loss": -11.522348403930664, "global_step": 222777, "epoch": 1326} {"train_loss": -11.47421646118164, "global_step": 222778, "epoch": 1326} {"train_loss": -10.915437698364258, "global_step": 222779, "epoch": 1326} {"train_loss": -11.40962028503418, "global_step": 222780, "epoch": 1326} {"train_loss": -11.807889938354492, "global_step": 222781, "epoch": 1326} {"train_loss": -11.24654483795166, "global_step": 222782, "epoch": 1326} {"train_loss": -11.70687484741211, "global_step": 222783, "epoch": 1326} {"train_loss": -10.623556137084961, "global_step": 222784, "epoch": 1326} {"train_loss": -11.522197723388672, "global_step": 222785, "epoch": 1326} {"train_loss": -11.396159172058105, "global_step": 222786, "epoch": 1326} {"train_loss": -10.946990966796875, "global_step": 222787, "epoch": 1326} {"train_loss": -11.202030181884766, "global_step": 222788, "epoch": 1326} {"train_loss": -11.272505760192871, "global_step": 222789, "epoch": 1326} {"train_loss": -11.374333381652832, "global_step": 222790, "epoch": 1326} {"train_loss": -11.34748363494873, "global_step": 222791, "epoch": 1326} {"train_loss": -11.470393180847168, "global_step": 222792, "epoch": 1326} {"train_loss": -11.125675201416016, "global_step": 222793, "epoch": 1326} {"train_loss": -11.51349925994873, "global_step": 222794, "epoch": 1326} {"train_loss": -11.468080520629883, "global_step": 222795, "epoch": 1326} {"train_loss": -11.527658462524414, "global_step": 222796, "epoch": 1326} {"train_loss": -11.357823371887207, "global_step": 222797, "epoch": 1326} {"train_loss": -11.480862617492676, "global_step": 222798, "epoch": 1326} {"train_loss": -11.207115173339844, "global_step": 222799, "epoch": 1326} {"train_loss": -11.246471405029297, "global_step": 222800, "epoch": 1326} {"train_loss": -11.168943405151367, "global_step": 222801, "epoch": 1326} {"train_loss": -11.280933380126953, "global_step": 222802, "epoch": 1326} {"train_loss": -10.999825477600098, "global_step": 222803, "epoch": 1326} {"train_loss": -11.349525451660156, "global_step": 222804, "epoch": 1326} {"train_loss": -10.814897537231445, "global_step": 222805, "epoch": 1326} {"train_loss": -11.421476364135742, "global_step": 222806, "epoch": 1326} {"train_loss": -11.118971824645996, "global_step": 222807, "epoch": 1326} {"train_loss": -10.933719635009766, "global_step": 222808, "epoch": 1326} {"train_loss": -11.504229545593262, "global_step": 222809, "epoch": 1326} {"train_loss": -11.27400016784668, "global_step": 222810, "epoch": 1326} {"train_loss": -10.957351684570312, "global_step": 222811, "epoch": 1326} {"train_loss": -11.363852500915527, "global_step": 222812, "epoch": 1326} {"train_loss": -11.172619819641113, "global_step": 222813, "epoch": 1326} {"train_loss": -11.365062713623047, "global_step": 222814, "epoch": 1326} {"train_loss": -11.422602653503418, "global_step": 222815, "epoch": 1326} {"train_loss": -11.347980499267578, "global_step": 222816, "epoch": 1326} {"train_loss": -11.41110610961914, "global_step": 222817, "epoch": 1326} {"train_loss": -11.303781509399414, "global_step": 222818, "epoch": 1326} {"train_loss": -11.652827262878418, "global_step": 222819, "epoch": 1326} {"train_loss": -11.603093147277832, "global_step": 222820, "epoch": 1326} {"train_loss": -11.72059440612793, "global_step": 222821, "epoch": 1326} {"train_loss": -11.598577499389648, "global_step": 222822, "epoch": 1326} {"train_loss": -11.601350784301758, "global_step": 222823, "epoch": 1326} {"train_loss": -11.50670051574707, "global_step": 222824, "epoch": 1326} {"train_loss": -11.58735466003418, "global_step": 222825, "epoch": 1326} {"train_loss": -11.719917297363281, "global_step": 222826, "epoch": 1326} {"train_loss": -11.495187759399414, "global_step": 222827, "epoch": 1326} {"train_loss": -11.597587585449219, "global_step": 222828, "epoch": 1326} {"train_loss": -11.364771842956543, "global_step": 222829, "epoch": 1326} {"train_loss": -11.369462966918945, "global_step": 222830, "epoch": 1326} {"train_loss": -11.856307983398438, "global_step": 222831, "epoch": 1326} {"train_loss": -11.330951690673828, "global_step": 222832, "epoch": 1326} {"train_loss": -11.50979232788086, "global_step": 222833, "epoch": 1326} {"train_loss": -11.750592231750488, "global_step": 222834, "epoch": 1326} {"train_loss": -11.48602294921875, "global_step": 222835, "epoch": 1326} {"train_loss": -11.65040111541748, "global_step": 222836, "epoch": 1326} {"train_loss": -11.791622161865234, "global_step": 222837, "epoch": 1326} {"train_loss": -11.653989791870117, "global_step": 222838, "epoch": 1326} {"train_loss": -11.925714492797852, "global_step": 222839, "epoch": 1326} {"train_loss": -11.676901817321777, "global_step": 222840, "epoch": 1326} {"train_loss": -11.545141220092773, "global_step": 222841, "epoch": 1326} {"train_loss": -11.660137176513672, "global_step": 222842, "epoch": 1326} {"train_loss": -11.78135871887207, "global_step": 222843, "epoch": 1326} {"train_loss": -11.689559936523438, "global_step": 222844, "epoch": 1326} {"train_loss": -11.839327812194824, "global_step": 222845, "epoch": 1326} {"train_loss": -11.645155906677246, "global_step": 222846, "epoch": 1326} {"train_loss": -11.874425888061523, "global_step": 222847, "epoch": 1326} {"train_loss": -11.840776443481445, "global_step": 222848, "epoch": 1326} {"train_loss": -11.790328979492188, "global_step": 222849, "epoch": 1326} {"train_loss": -11.5016508102417, "global_step": 222850, "epoch": 1326} {"train_loss": -11.618511199951172, "global_step": 222851, "epoch": 1326} {"train_loss": -11.557561874389648, "global_step": 222852, "epoch": 1326} {"train_loss": -11.743448257446289, "global_step": 222853, "epoch": 1326} {"train_loss": -11.800542831420898, "global_step": 222854, "epoch": 1326} {"train_loss": -11.830981254577637, "global_step": 222855, "epoch": 1326} {"train_loss": -11.744474411010742, "global_step": 222856, "epoch": 1326} {"train_loss": -12.03822135925293, "global_step": 222857, "epoch": 1326} {"train_loss": -11.948381423950195, "global_step": 222858, "epoch": 1326} {"train_loss": -11.862848281860352, "global_step": 222859, "epoch": 1326} {"train_loss": -11.897139549255371, "global_step": 222860, "epoch": 1326} {"train_loss": -11.913829803466797, "global_step": 222861, "epoch": 1326} {"train_loss": -11.92586612701416, "global_step": 222862, "epoch": 1326} {"train_loss": -12.141470909118652, "global_step": 222863, "epoch": 1326} {"train_loss": -11.841062545776367, "global_step": 222864, "epoch": 1326} {"train_loss": -11.837127685546875, "global_step": 222865, "epoch": 1326} {"train_loss": -12.005449295043945, "global_step": 222866, "epoch": 1326} {"train_loss": -11.664681434631348, "global_step": 222867, "epoch": 1326} {"train_loss": -11.95180892944336, "global_step": 222868, "epoch": 1326} {"train_loss": -11.96280574798584, "global_step": 222869, "epoch": 1326} {"train_loss": -11.812385559082031, "global_step": 222870, "epoch": 1326} {"train_loss": -11.982635498046875, "global_step": 222871, "epoch": 1326} {"train_loss": -12.013439178466797, "global_step": 222872, "epoch": 1326} {"train_loss": -12.163357734680176, "global_step": 222873, "epoch": 1326} {"train_loss": -12.184263229370117, "global_step": 222874, "epoch": 1326} {"train_loss": -12.084929466247559, "global_step": 222875, "epoch": 1326} {"train_loss": -11.924112319946289, "global_step": 222876, "epoch": 1326} {"train_loss": -12.109216690063477, "global_step": 222877, "epoch": 1326} {"train_loss": -12.156272888183594, "global_step": 222878, "epoch": 1326} {"train_loss": -11.995195388793945, "global_step": 222879, "epoch": 1326} {"train_loss": -11.916860580444336, "global_step": 222880, "epoch": 1326} {"train_loss": -12.061470985412598, "global_step": 222881, "epoch": 1326} {"train_loss": -11.9190034866333, "global_step": 222882, "epoch": 1326} {"train_loss": -11.945846557617188, "global_step": 222883, "epoch": 1326} {"train_loss": -11.732450485229492, "global_step": 222884, "epoch": 1326} {"train_loss": -11.528173446655273, "global_step": 222885, "epoch": 1326} {"train_loss": -11.336151123046875, "global_step": 222886, "epoch": 1326} {"train_loss": -11.934834480285645, "global_step": 222887, "epoch": 1326} {"train_loss": -11.878129959106445, "global_step": 222888, "epoch": 1326} {"train_loss": -9.559394836425781, "global_step": 222889, "epoch": 1326} {"train_loss": -9.57260513305664, "global_step": 222890, "epoch": 1326} {"train_loss": -10.408722877502441, "global_step": 222891, "epoch": 1326} {"train_loss": -11.084688186645508, "global_step": 222892, "epoch": 1326} {"train_loss": -8.854964256286621, "global_step": 222893, "epoch": 1326} {"train_loss": -10.334342002868652, "global_step": 222894, "epoch": 1326} {"train_loss": -7.93747091293335, "global_step": 222895, "epoch": 1326} {"train_loss": -7.107126712799072, "global_step": 222896, "epoch": 1326} {"train_loss": -7.573178768157959, "global_step": 222897, "epoch": 1326} {"train_loss": -8.380555152893066, "global_step": 222898, "epoch": 1326} {"train_loss": -8.80091667175293, "global_step": 222899, "epoch": 1326} {"train_loss": -8.406861305236816, "global_step": 222900, "epoch": 1326} {"train_loss": -8.639009475708008, "global_step": 222901, "epoch": 1326} {"train_loss": -8.835451126098633, "global_step": 222902, "epoch": 1326} {"train_loss": -9.853191375732422, "global_step": 222903, "epoch": 1326} {"train_loss": -9.39571762084961, "global_step": 222904, "epoch": 1326} {"train_loss": -10.90555191040039, "global_step": 222905, "epoch": 1326} {"train_loss": -10.461688995361328, "global_step": 222906, "epoch": 1326} {"train_loss": -10.018142700195312, "global_step": 222907, "epoch": 1326} {"train_loss": -10.283931732177734, "global_step": 222908, "epoch": 1326} {"train_loss": -10.017579078674316, "global_step": 222909, "epoch": 1326} {"train_loss": -9.879888534545898, "global_step": 222910, "epoch": 1326} {"train_loss": -10.119119644165039, "global_step": 222911, "epoch": 1326} {"train_loss": -10.756328582763672, "global_step": 222912, "epoch": 1326} {"train_loss": -10.010887145996094, "global_step": 222913, "epoch": 1326} {"train_loss": -10.506977081298828, "global_step": 222914, "epoch": 1326} {"train_loss": -10.381460189819336, "global_step": 222915, "epoch": 1326} {"train_loss": -10.506673812866211, "global_step": 222916, "epoch": 1326} {"train_loss": -10.600231170654297, "global_step": 222917, "epoch": 1326} {"train_loss": -9.873214721679688, "global_step": 222918, "epoch": 1326} {"train_loss": -10.41668701171875, "global_step": 222919, "epoch": 1326} {"train_loss": -10.794304847717285, "global_step": 222920, "epoch": 1326} {"train_loss": -10.733798027038574, "global_step": 222921, "epoch": 1326} {"train_loss": -11.054838180541992, "global_step": 222922, "epoch": 1326} {"train_loss": -10.626018524169922, "global_step": 222923, "epoch": 1326} {"train_loss": -11.282909393310547, "global_step": 222924, "epoch": 1326} {"train_loss": -10.784002304077148, "global_step": 222925, "epoch": 1326} {"train_loss": -11.010210037231445, "global_step": 222926, "epoch": 1326} {"train_loss": -11.237136840820312, "global_step": 222927, "epoch": 1326} {"train_loss": -10.769359588623047, "global_step": 222928, "epoch": 1326} {"train_loss": -11.005664825439453, "global_step": 222929, "epoch": 1326} {"train_loss": -11.411165237426758, "global_step": 222930, "epoch": 1326} {"train_loss": -10.7778902053833, "global_step": 222931, "epoch": 1326} {"train_loss": -11.274703979492188, "global_step": 222932, "epoch": 1326} {"train_loss": -11.17794418334961, "global_step": 222933, "epoch": 1326} {"train_loss": -11.079648971557617, "global_step": 222934, "epoch": 1326} {"train_loss": -11.176867045107342, "global_step": 222935, "epoch": 1326, "val_loss": 254235.65625} {"train_loss": -10.867444038391113, "global_step": 222936, "epoch": 1327} {"train_loss": -11.262163162231445, "global_step": 222937, "epoch": 1327} {"train_loss": -11.166072845458984, "global_step": 222938, "epoch": 1327} {"train_loss": -11.174196243286133, "global_step": 222939, "epoch": 1327} {"train_loss": -11.317338943481445, "global_step": 222940, "epoch": 1327} {"train_loss": -11.260199546813965, "global_step": 222941, "epoch": 1327} {"train_loss": -11.010501861572266, "global_step": 222942, "epoch": 1327} {"train_loss": -11.425182342529297, "global_step": 222943, "epoch": 1327} {"train_loss": -11.354621887207031, "global_step": 222944, "epoch": 1327} {"train_loss": -11.495309829711914, "global_step": 222945, "epoch": 1327} {"train_loss": -11.627412796020508, "global_step": 222946, "epoch": 1327} {"train_loss": -11.57077693939209, "global_step": 222947, "epoch": 1327} {"train_loss": -11.57244873046875, "global_step": 222948, "epoch": 1327} {"train_loss": -11.509044647216797, "global_step": 222949, "epoch": 1327} {"train_loss": -11.556831359863281, "global_step": 222950, "epoch": 1327} {"train_loss": -11.554689407348633, "global_step": 222951, "epoch": 1327} {"train_loss": -11.746988296508789, "global_step": 222952, "epoch": 1327} {"train_loss": -11.55447769165039, "global_step": 222953, "epoch": 1327} {"train_loss": -11.474859237670898, "global_step": 222954, "epoch": 1327} {"train_loss": -11.748359680175781, "global_step": 222955, "epoch": 1327} {"train_loss": -11.641093254089355, "global_step": 222956, "epoch": 1327} {"train_loss": -11.643927574157715, "global_step": 222957, "epoch": 1327} {"train_loss": -11.623283386230469, "global_step": 222958, "epoch": 1327} {"train_loss": -11.647481918334961, "global_step": 222959, "epoch": 1327} {"train_loss": -11.673951148986816, "global_step": 222960, "epoch": 1327} {"train_loss": -11.407261848449707, "global_step": 222961, "epoch": 1327} {"train_loss": -11.739959716796875, "global_step": 222962, "epoch": 1327} {"train_loss": -11.706871032714844, "global_step": 222963, "epoch": 1327} {"train_loss": -11.790576934814453, "global_step": 222964, "epoch": 1327} {"train_loss": -11.82816219329834, "global_step": 222965, "epoch": 1327} {"train_loss": -11.815308570861816, "global_step": 222966, "epoch": 1327} {"train_loss": -11.895268440246582, "global_step": 222967, "epoch": 1327} {"train_loss": -11.82748031616211, "global_step": 222968, "epoch": 1327} {"train_loss": -11.706274032592773, "global_step": 222969, "epoch": 1327} {"train_loss": -11.960250854492188, "global_step": 222970, "epoch": 1327} {"train_loss": -11.908641815185547, "global_step": 222971, "epoch": 1327} {"train_loss": -11.914749145507812, "global_step": 222972, "epoch": 1327} {"train_loss": -11.777946472167969, "global_step": 222973, "epoch": 1327} {"train_loss": -11.811847686767578, "global_step": 222974, "epoch": 1327} {"train_loss": -11.817394256591797, "global_step": 222975, "epoch": 1327} {"train_loss": -11.76893138885498, "global_step": 222976, "epoch": 1327} {"train_loss": -11.850988388061523, "global_step": 222977, "epoch": 1327} {"train_loss": -11.592416763305664, "global_step": 222978, "epoch": 1327} {"train_loss": -11.842743873596191, "global_step": 222979, "epoch": 1327} {"train_loss": -11.851341247558594, "global_step": 222980, "epoch": 1327} {"train_loss": -11.916354179382324, "global_step": 222981, "epoch": 1327} {"train_loss": -11.706131935119629, "global_step": 222982, "epoch": 1327} {"train_loss": -12.035834312438965, "global_step": 222983, "epoch": 1327} {"train_loss": -11.811903953552246, "global_step": 222984, "epoch": 1327} {"train_loss": -11.70236587524414, "global_step": 222985, "epoch": 1327} {"train_loss": -11.290929794311523, "global_step": 222986, "epoch": 1327} {"train_loss": -11.749856948852539, "global_step": 222987, "epoch": 1327} {"train_loss": -11.603649139404297, "global_step": 222988, "epoch": 1327} {"train_loss": -10.77595329284668, "global_step": 222989, "epoch": 1327} {"train_loss": -10.798791885375977, "global_step": 222990, "epoch": 1327} {"train_loss": -10.601314544677734, "global_step": 222991, "epoch": 1327} {"train_loss": -10.431961059570312, "global_step": 222992, "epoch": 1327} {"train_loss": -10.652286529541016, "global_step": 222993, "epoch": 1327} {"train_loss": -11.23970890045166, "global_step": 222994, "epoch": 1327} {"train_loss": -11.066758155822754, "global_step": 222995, "epoch": 1327} {"train_loss": -11.108993530273438, "global_step": 222996, "epoch": 1327} {"train_loss": -11.17594051361084, "global_step": 222997, "epoch": 1327} {"train_loss": -10.844762802124023, "global_step": 222998, "epoch": 1327} {"train_loss": -11.506876945495605, "global_step": 222999, "epoch": 1327} {"train_loss": -10.817424774169922, "global_step": 223000, "epoch": 1327} {"train_loss": -11.663125038146973, "global_step": 223001, "epoch": 1327} {"train_loss": -11.292693138122559, "global_step": 223002, "epoch": 1327} {"train_loss": -11.628198623657227, "global_step": 223003, "epoch": 1327} {"train_loss": -11.534740447998047, "global_step": 223004, "epoch": 1327} {"train_loss": -11.598335266113281, "global_step": 223005, "epoch": 1327} {"train_loss": -11.914274215698242, "global_step": 223006, "epoch": 1327} {"train_loss": -11.385275840759277, "global_step": 223007, "epoch": 1327} {"train_loss": -11.720846176147461, "global_step": 223008, "epoch": 1327} {"train_loss": -11.413703918457031, "global_step": 223009, "epoch": 1327} {"train_loss": -11.776029586791992, "global_step": 223010, "epoch": 1327} {"train_loss": -11.81578254699707, "global_step": 223011, "epoch": 1327} {"train_loss": -11.722225189208984, "global_step": 223012, "epoch": 1327} {"train_loss": -11.594427108764648, "global_step": 223013, "epoch": 1327} {"train_loss": -11.8401460647583, "global_step": 223014, "epoch": 1327} {"train_loss": -11.819263458251953, "global_step": 223015, "epoch": 1327} {"train_loss": -11.591066360473633, "global_step": 223016, "epoch": 1327} {"train_loss": -11.998119354248047, "global_step": 223017, "epoch": 1327} {"train_loss": -11.955510139465332, "global_step": 223018, "epoch": 1327} {"train_loss": -11.841768264770508, "global_step": 223019, "epoch": 1327} {"train_loss": -11.958084106445312, "global_step": 223020, "epoch": 1327} {"train_loss": -11.756657600402832, "global_step": 223021, "epoch": 1327} {"train_loss": -11.902643203735352, "global_step": 223022, "epoch": 1327} {"train_loss": -11.957475662231445, "global_step": 223023, "epoch": 1327} {"train_loss": -11.912817001342773, "global_step": 223024, "epoch": 1327} {"train_loss": -11.975769996643066, "global_step": 223025, "epoch": 1327} {"train_loss": -11.759832382202148, "global_step": 223026, "epoch": 1327} {"train_loss": -11.844886779785156, "global_step": 223027, "epoch": 1327} {"train_loss": -11.49659538269043, "global_step": 223028, "epoch": 1327} {"train_loss": -10.943506240844727, "global_step": 223029, "epoch": 1327} {"train_loss": -11.349403381347656, "global_step": 223030, "epoch": 1327} {"train_loss": -11.953256607055664, "global_step": 223031, "epoch": 1327} {"train_loss": -11.56130599975586, "global_step": 223032, "epoch": 1327} {"train_loss": -10.590773582458496, "global_step": 223033, "epoch": 1327} {"train_loss": -11.113414764404297, "global_step": 223034, "epoch": 1327} {"train_loss": -11.694961547851562, "global_step": 223035, "epoch": 1327} {"train_loss": -10.523414611816406, "global_step": 223036, "epoch": 1327} {"train_loss": -11.083690643310547, "global_step": 223037, "epoch": 1327} {"train_loss": -11.171283721923828, "global_step": 223038, "epoch": 1327} {"train_loss": -10.97545337677002, "global_step": 223039, "epoch": 1327} {"train_loss": -10.632410049438477, "global_step": 223040, "epoch": 1327} {"train_loss": -11.419240951538086, "global_step": 223041, "epoch": 1327} {"train_loss": -11.081130981445312, "global_step": 223042, "epoch": 1327} {"train_loss": -9.920190811157227, "global_step": 223043, "epoch": 1327} {"train_loss": -11.378646850585938, "global_step": 223044, "epoch": 1327} {"train_loss": -10.006680488586426, "global_step": 223045, "epoch": 1327} {"train_loss": -10.277433395385742, "global_step": 223046, "epoch": 1327} {"train_loss": -8.937175750732422, "global_step": 223047, "epoch": 1327} {"train_loss": -9.044288635253906, "global_step": 223048, "epoch": 1327} {"train_loss": -9.309571266174316, "global_step": 223049, "epoch": 1327} {"train_loss": -10.52009105682373, "global_step": 223050, "epoch": 1327} {"train_loss": -9.67837142944336, "global_step": 223051, "epoch": 1327} {"train_loss": -11.051665306091309, "global_step": 223052, "epoch": 1327} {"train_loss": -9.8107328414917, "global_step": 223053, "epoch": 1327} {"train_loss": -11.072161674499512, "global_step": 223054, "epoch": 1327} {"train_loss": -10.060086250305176, "global_step": 223055, "epoch": 1327} {"train_loss": -10.756237030029297, "global_step": 223056, "epoch": 1327} {"train_loss": -9.66283893585205, "global_step": 223057, "epoch": 1327} {"train_loss": -11.192300796508789, "global_step": 223058, "epoch": 1327} {"train_loss": -9.850931167602539, "global_step": 223059, "epoch": 1327} {"train_loss": -11.196371078491211, "global_step": 223060, "epoch": 1327} {"train_loss": -10.372579574584961, "global_step": 223061, "epoch": 1327} {"train_loss": -10.358181953430176, "global_step": 223062, "epoch": 1327} {"train_loss": -10.760053634643555, "global_step": 223063, "epoch": 1327} {"train_loss": -10.699203491210938, "global_step": 223064, "epoch": 1327} {"train_loss": -11.096635818481445, "global_step": 223065, "epoch": 1327} {"train_loss": -10.741104125976562, "global_step": 223066, "epoch": 1327} {"train_loss": -11.079168319702148, "global_step": 223067, "epoch": 1327} {"train_loss": -10.618451118469238, "global_step": 223068, "epoch": 1327} {"train_loss": -11.270689010620117, "global_step": 223069, "epoch": 1327} {"train_loss": -10.715335845947266, "global_step": 223070, "epoch": 1327} {"train_loss": -10.8936767578125, "global_step": 223071, "epoch": 1327} {"train_loss": -11.167720794677734, "global_step": 223072, "epoch": 1327} {"train_loss": -10.775138854980469, "global_step": 223073, "epoch": 1327} {"train_loss": -11.423337936401367, "global_step": 223074, "epoch": 1327} {"train_loss": -11.324437141418457, "global_step": 223075, "epoch": 1327} {"train_loss": -11.181009292602539, "global_step": 223076, "epoch": 1327} {"train_loss": -11.42595100402832, "global_step": 223077, "epoch": 1327} {"train_loss": -11.27719783782959, "global_step": 223078, "epoch": 1327} {"train_loss": -11.322881698608398, "global_step": 223079, "epoch": 1327} {"train_loss": -11.060702323913574, "global_step": 223080, "epoch": 1327} {"train_loss": -11.436800956726074, "global_step": 223081, "epoch": 1327} {"train_loss": -11.574089050292969, "global_step": 223082, "epoch": 1327} {"train_loss": -11.196510314941406, "global_step": 223083, "epoch": 1327} {"train_loss": -11.371529579162598, "global_step": 223084, "epoch": 1327} {"train_loss": -11.515206336975098, "global_step": 223085, "epoch": 1327} {"train_loss": -11.355915069580078, "global_step": 223086, "epoch": 1327} {"train_loss": -11.503944396972656, "global_step": 223087, "epoch": 1327} {"train_loss": -11.416723251342773, "global_step": 223088, "epoch": 1327} {"train_loss": -11.543384552001953, "global_step": 223089, "epoch": 1327} {"train_loss": -11.468295097351074, "global_step": 223090, "epoch": 1327} {"train_loss": -11.497352600097656, "global_step": 223091, "epoch": 1327} {"train_loss": -11.624433517456055, "global_step": 223092, "epoch": 1327} {"train_loss": -11.696898460388184, "global_step": 223093, "epoch": 1327} {"train_loss": -11.516685485839844, "global_step": 223094, "epoch": 1327} {"train_loss": -11.504892349243164, "global_step": 223095, "epoch": 1327} {"train_loss": -11.700675964355469, "global_step": 223096, "epoch": 1327} {"train_loss": -11.682822227478027, "global_step": 223097, "epoch": 1327} {"train_loss": -11.775199890136719, "global_step": 223098, "epoch": 1327} {"train_loss": -11.718917846679688, "global_step": 223099, "epoch": 1327} {"train_loss": -11.811211585998535, "global_step": 223100, "epoch": 1327} {"train_loss": -11.874147415161133, "global_step": 223101, "epoch": 1327} {"train_loss": -11.8760347366333, "global_step": 223102, "epoch": 1327} {"train_loss": -11.318481348809742, "global_step": 223103, "epoch": 1327, "val_loss": 262799.9375} {"train_loss": -11.785316467285156, "global_step": 223104, "epoch": 1328} {"train_loss": -11.965581893920898, "global_step": 223105, "epoch": 1328} {"train_loss": -11.919172286987305, "global_step": 223106, "epoch": 1328} {"train_loss": -11.777373313903809, "global_step": 223107, "epoch": 1328} {"train_loss": -11.970821380615234, "global_step": 223108, "epoch": 1328} {"train_loss": -11.956850051879883, "global_step": 223109, "epoch": 1328} {"train_loss": -11.747823715209961, "global_step": 223110, "epoch": 1328} {"train_loss": -11.861488342285156, "global_step": 223111, "epoch": 1328} {"train_loss": -11.936973571777344, "global_step": 223112, "epoch": 1328} {"train_loss": -11.86424732208252, "global_step": 223113, "epoch": 1328} {"train_loss": -11.921305656433105, "global_step": 223114, "epoch": 1328} {"train_loss": -12.033136367797852, "global_step": 223115, "epoch": 1328} {"train_loss": -12.135930061340332, "global_step": 223116, "epoch": 1328} {"train_loss": -12.081271171569824, "global_step": 223117, "epoch": 1328} {"train_loss": -11.94205379486084, "global_step": 223118, "epoch": 1328} {"train_loss": -11.839700698852539, "global_step": 223119, "epoch": 1328} {"train_loss": -12.029168128967285, "global_step": 223120, "epoch": 1328} {"train_loss": -11.909189224243164, "global_step": 223121, "epoch": 1328} {"train_loss": -12.034978866577148, "global_step": 223122, "epoch": 1328} {"train_loss": -12.017906188964844, "global_step": 223123, "epoch": 1328} {"train_loss": -12.153955459594727, "global_step": 223124, "epoch": 1328} {"train_loss": -12.078696250915527, "global_step": 223125, "epoch": 1328} {"train_loss": -12.063326835632324, "global_step": 223126, "epoch": 1328} {"train_loss": -11.878202438354492, "global_step": 223127, "epoch": 1328} {"train_loss": -11.903507232666016, "global_step": 223128, "epoch": 1328} {"train_loss": -11.799336433410645, "global_step": 223129, "epoch": 1328} {"train_loss": -12.017642974853516, "global_step": 223130, "epoch": 1328} {"train_loss": -11.971994400024414, "global_step": 223131, "epoch": 1328} {"train_loss": -11.827796936035156, "global_step": 223132, "epoch": 1328} {"train_loss": -11.97677230834961, "global_step": 223133, "epoch": 1328} {"train_loss": -11.529234886169434, "global_step": 223134, "epoch": 1328} {"train_loss": -11.927308082580566, "global_step": 223135, "epoch": 1328} {"train_loss": -11.844182014465332, "global_step": 223136, "epoch": 1328} {"train_loss": -11.745903015136719, "global_step": 223137, "epoch": 1328} {"train_loss": -11.932439804077148, "global_step": 223138, "epoch": 1328} {"train_loss": -12.223930358886719, "global_step": 223139, "epoch": 1328} {"train_loss": -12.04227066040039, "global_step": 223140, "epoch": 1328} {"train_loss": -11.911027908325195, "global_step": 223141, "epoch": 1328} {"train_loss": -11.98707389831543, "global_step": 223142, "epoch": 1328} {"train_loss": -11.864774703979492, "global_step": 223143, "epoch": 1328} {"train_loss": -11.820610046386719, "global_step": 223144, "epoch": 1328} {"train_loss": -11.635688781738281, "global_step": 223145, "epoch": 1328} {"train_loss": -11.206971168518066, "global_step": 223146, "epoch": 1328} {"train_loss": -11.875000953674316, "global_step": 223147, "epoch": 1328} {"train_loss": -11.842010498046875, "global_step": 223148, "epoch": 1328} {"train_loss": -11.710585594177246, "global_step": 223149, "epoch": 1328} {"train_loss": -10.637459754943848, "global_step": 223150, "epoch": 1328} {"train_loss": -11.813268661499023, "global_step": 223151, "epoch": 1328} {"train_loss": -10.047548294067383, "global_step": 223152, "epoch": 1328} {"train_loss": -11.474254608154297, "global_step": 223153, "epoch": 1328} {"train_loss": -10.147134780883789, "global_step": 223154, "epoch": 1328} {"train_loss": -12.026522636413574, "global_step": 223155, "epoch": 1328} {"train_loss": -10.711845397949219, "global_step": 223156, "epoch": 1328} {"train_loss": -11.664751052856445, "global_step": 223157, "epoch": 1328} {"train_loss": -10.74893569946289, "global_step": 223158, "epoch": 1328} {"train_loss": -11.529740333557129, "global_step": 223159, "epoch": 1328} {"train_loss": -11.283021926879883, "global_step": 223160, "epoch": 1328} {"train_loss": -11.543210983276367, "global_step": 223161, "epoch": 1328} {"train_loss": -10.326351165771484, "global_step": 223162, "epoch": 1328} {"train_loss": -10.861482620239258, "global_step": 223163, "epoch": 1328} {"train_loss": -10.945679664611816, "global_step": 223164, "epoch": 1328} {"train_loss": -10.672612190246582, "global_step": 223165, "epoch": 1328} {"train_loss": -10.31599235534668, "global_step": 223166, "epoch": 1328} {"train_loss": -9.81828498840332, "global_step": 223167, "epoch": 1328} {"train_loss": -10.092124938964844, "global_step": 223168, "epoch": 1328} {"train_loss": -10.50715160369873, "global_step": 223169, "epoch": 1328} {"train_loss": -9.747821807861328, "global_step": 223170, "epoch": 1328} {"train_loss": -9.25874137878418, "global_step": 223171, "epoch": 1328} {"train_loss": -10.255447387695312, "global_step": 223172, "epoch": 1328} {"train_loss": -9.782898902893066, "global_step": 223173, "epoch": 1328} {"train_loss": -10.355154037475586, "global_step": 223174, "epoch": 1328} {"train_loss": -9.183740615844727, "global_step": 223175, "epoch": 1328} {"train_loss": -10.967863082885742, "global_step": 223176, "epoch": 1328} {"train_loss": -8.485546112060547, "global_step": 223177, "epoch": 1328} {"train_loss": -10.984886169433594, "global_step": 223178, "epoch": 1328} {"train_loss": -9.348834037780762, "global_step": 223179, "epoch": 1328} {"train_loss": -10.005725860595703, "global_step": 223180, "epoch": 1328} {"train_loss": -10.285051345825195, "global_step": 223181, "epoch": 1328} {"train_loss": -10.199722290039062, "global_step": 223182, "epoch": 1328} {"train_loss": -9.970966339111328, "global_step": 223183, "epoch": 1328} {"train_loss": -10.704614639282227, "global_step": 223184, "epoch": 1328} {"train_loss": -10.363197326660156, "global_step": 223185, "epoch": 1328} {"train_loss": -10.217065811157227, "global_step": 223186, "epoch": 1328} {"train_loss": -10.903101921081543, "global_step": 223187, "epoch": 1328} {"train_loss": -10.272501945495605, "global_step": 223188, "epoch": 1328} {"train_loss": -10.06599235534668, "global_step": 223189, "epoch": 1328} {"train_loss": -10.775578498840332, "global_step": 223190, "epoch": 1328} {"train_loss": -10.623336791992188, "global_step": 223191, "epoch": 1328} {"train_loss": -10.337413787841797, "global_step": 223192, "epoch": 1328} {"train_loss": -10.510940551757812, "global_step": 223193, "epoch": 1328} {"train_loss": -10.989139556884766, "global_step": 223194, "epoch": 1328} {"train_loss": -9.618139266967773, "global_step": 223195, "epoch": 1328} {"train_loss": -10.076854705810547, "global_step": 223196, "epoch": 1328} {"train_loss": -10.895523071289062, "global_step": 223197, "epoch": 1328} {"train_loss": -10.203302383422852, "global_step": 223198, "epoch": 1328} {"train_loss": -10.23910140991211, "global_step": 223199, "epoch": 1328} {"train_loss": -10.878565788269043, "global_step": 223200, "epoch": 1328} {"train_loss": -10.813018798828125, "global_step": 223201, "epoch": 1328} {"train_loss": -10.0750093460083, "global_step": 223202, "epoch": 1328} {"train_loss": -10.901049613952637, "global_step": 223203, "epoch": 1328} {"train_loss": -11.339241027832031, "global_step": 223204, "epoch": 1328} {"train_loss": -10.696037292480469, "global_step": 223205, "epoch": 1328} {"train_loss": -10.987942695617676, "global_step": 223206, "epoch": 1328} {"train_loss": -11.274858474731445, "global_step": 223207, "epoch": 1328} {"train_loss": -11.015810012817383, "global_step": 223208, "epoch": 1328} {"train_loss": -11.061083793640137, "global_step": 223209, "epoch": 1328} {"train_loss": -11.206197738647461, "global_step": 223210, "epoch": 1328} {"train_loss": -11.124335289001465, "global_step": 223211, "epoch": 1328} {"train_loss": -11.09343433380127, "global_step": 223212, "epoch": 1328} {"train_loss": -11.1234769821167, "global_step": 223213, "epoch": 1328} {"train_loss": -11.299603462219238, "global_step": 223214, "epoch": 1328} {"train_loss": -11.259464263916016, "global_step": 223215, "epoch": 1328} {"train_loss": -11.033586502075195, "global_step": 223216, "epoch": 1328} {"train_loss": -11.259246826171875, "global_step": 223217, "epoch": 1328} {"train_loss": -11.17109203338623, "global_step": 223218, "epoch": 1328} {"train_loss": -11.330056190490723, "global_step": 223219, "epoch": 1328} {"train_loss": -11.064128875732422, "global_step": 223220, "epoch": 1328} {"train_loss": -11.451372146606445, "global_step": 223221, "epoch": 1328} {"train_loss": -11.339179992675781, "global_step": 223222, "epoch": 1328} {"train_loss": -11.059688568115234, "global_step": 223223, "epoch": 1328} {"train_loss": -11.376983642578125, "global_step": 223224, "epoch": 1328} {"train_loss": -11.526368141174316, "global_step": 223225, "epoch": 1328} {"train_loss": -11.335494041442871, "global_step": 223226, "epoch": 1328} {"train_loss": -11.39039421081543, "global_step": 223227, "epoch": 1328} {"train_loss": -11.511275291442871, "global_step": 223228, "epoch": 1328} {"train_loss": -11.38077449798584, "global_step": 223229, "epoch": 1328} {"train_loss": -11.46038818359375, "global_step": 223230, "epoch": 1328} {"train_loss": -11.482366561889648, "global_step": 223231, "epoch": 1328} {"train_loss": -11.384641647338867, "global_step": 223232, "epoch": 1328} {"train_loss": -11.349063873291016, "global_step": 223233, "epoch": 1328} {"train_loss": -11.555344581604004, "global_step": 223234, "epoch": 1328} {"train_loss": -11.727931022644043, "global_step": 223235, "epoch": 1328} {"train_loss": -11.396021842956543, "global_step": 223236, "epoch": 1328} {"train_loss": -11.628564834594727, "global_step": 223237, "epoch": 1328} {"train_loss": -11.619743347167969, "global_step": 223238, "epoch": 1328} {"train_loss": -11.613260269165039, "global_step": 223239, "epoch": 1328} {"train_loss": -11.719015121459961, "global_step": 223240, "epoch": 1328} {"train_loss": -11.63219928741455, "global_step": 223241, "epoch": 1328} {"train_loss": -11.774857521057129, "global_step": 223242, "epoch": 1328} {"train_loss": -11.402742385864258, "global_step": 223243, "epoch": 1328} {"train_loss": -11.59444808959961, "global_step": 223244, "epoch": 1328} {"train_loss": -11.716964721679688, "global_step": 223245, "epoch": 1328} {"train_loss": -11.613809585571289, "global_step": 223246, "epoch": 1328} {"train_loss": -11.774792671203613, "global_step": 223247, "epoch": 1328} {"train_loss": -11.728425979614258, "global_step": 223248, "epoch": 1328} {"train_loss": -11.870206832885742, "global_step": 223249, "epoch": 1328} {"train_loss": -11.764324188232422, "global_step": 223250, "epoch": 1328} {"train_loss": -11.782598495483398, "global_step": 223251, "epoch": 1328} {"train_loss": -11.669559478759766, "global_step": 223252, "epoch": 1328} {"train_loss": -11.873085021972656, "global_step": 223253, "epoch": 1328} {"train_loss": -11.796680450439453, "global_step": 223254, "epoch": 1328} {"train_loss": -11.786310195922852, "global_step": 223255, "epoch": 1328} {"train_loss": -11.781229019165039, "global_step": 223256, "epoch": 1328} {"train_loss": -11.757429122924805, "global_step": 223257, "epoch": 1328} {"train_loss": -11.900551795959473, "global_step": 223258, "epoch": 1328} {"train_loss": -11.791376113891602, "global_step": 223259, "epoch": 1328} {"train_loss": -11.923336029052734, "global_step": 223260, "epoch": 1328} {"train_loss": -11.817484855651855, "global_step": 223261, "epoch": 1328} {"train_loss": -11.972078323364258, "global_step": 223262, "epoch": 1328} {"train_loss": -11.982572555541992, "global_step": 223263, "epoch": 1328} {"train_loss": -12.079547882080078, "global_step": 223264, "epoch": 1328} {"train_loss": -12.031720161437988, "global_step": 223265, "epoch": 1328} {"train_loss": -12.077970504760742, "global_step": 223266, "epoch": 1328} {"train_loss": -11.852128982543945, "global_step": 223267, "epoch": 1328} {"train_loss": -11.884608268737793, "global_step": 223268, "epoch": 1328} {"train_loss": -11.798195838928223, "global_step": 223269, "epoch": 1328} {"train_loss": -12.053064346313477, "global_step": 223270, "epoch": 1328} {"train_loss": -11.295783888726007, "global_step": 223271, "epoch": 1328, "val_loss": 260956.359375} {"train_loss": -11.917585372924805, "global_step": 223272, "epoch": 1329} {"train_loss": -11.824125289916992, "global_step": 223273, "epoch": 1329} {"train_loss": -11.977090835571289, "global_step": 223274, "epoch": 1329} {"train_loss": -11.673345565795898, "global_step": 223275, "epoch": 1329} {"train_loss": -11.606170654296875, "global_step": 223276, "epoch": 1329} {"train_loss": -12.181161880493164, "global_step": 223277, "epoch": 1329} {"train_loss": -11.873906135559082, "global_step": 223278, "epoch": 1329} {"train_loss": -11.846574783325195, "global_step": 223279, "epoch": 1329} {"train_loss": -11.587028503417969, "global_step": 223280, "epoch": 1329} {"train_loss": -11.815495491027832, "global_step": 223281, "epoch": 1329} {"train_loss": -12.00017261505127, "global_step": 223282, "epoch": 1329} {"train_loss": -11.747928619384766, "global_step": 223283, "epoch": 1329} {"train_loss": -11.25904655456543, "global_step": 223284, "epoch": 1329} {"train_loss": -11.921674728393555, "global_step": 223285, "epoch": 1329} {"train_loss": -11.915699005126953, "global_step": 223286, "epoch": 1329} {"train_loss": -10.933784484863281, "global_step": 223287, "epoch": 1329} {"train_loss": -10.929975509643555, "global_step": 223288, "epoch": 1329} {"train_loss": -12.199308395385742, "global_step": 223289, "epoch": 1329} {"train_loss": -10.967046737670898, "global_step": 223290, "epoch": 1329} {"train_loss": -9.932413101196289, "global_step": 223291, "epoch": 1329} {"train_loss": -10.885156631469727, "global_step": 223292, "epoch": 1329} {"train_loss": -11.575600624084473, "global_step": 223293, "epoch": 1329} {"train_loss": -10.048553466796875, "global_step": 223294, "epoch": 1329} {"train_loss": -11.631282806396484, "global_step": 223295, "epoch": 1329} {"train_loss": -11.32624626159668, "global_step": 223296, "epoch": 1329} {"train_loss": -9.162346839904785, "global_step": 223297, "epoch": 1329} {"train_loss": -11.160451889038086, "global_step": 223298, "epoch": 1329} {"train_loss": -8.827526092529297, "global_step": 223299, "epoch": 1329} {"train_loss": -10.144161224365234, "global_step": 223300, "epoch": 1329} {"train_loss": -10.564626693725586, "global_step": 223301, "epoch": 1329} {"train_loss": -8.666508674621582, "global_step": 223302, "epoch": 1329} {"train_loss": -10.277284622192383, "global_step": 223303, "epoch": 1329} {"train_loss": -8.994855880737305, "global_step": 223304, "epoch": 1329} {"train_loss": -9.798105239868164, "global_step": 223305, "epoch": 1329} {"train_loss": -10.098971366882324, "global_step": 223306, "epoch": 1329} {"train_loss": -10.114360809326172, "global_step": 223307, "epoch": 1329} {"train_loss": -8.629871368408203, "global_step": 223308, "epoch": 1329} {"train_loss": -8.952319145202637, "global_step": 223309, "epoch": 1329} {"train_loss": -9.308727264404297, "global_step": 223310, "epoch": 1329} {"train_loss": -9.953862190246582, "global_step": 223311, "epoch": 1329} {"train_loss": -10.121603012084961, "global_step": 223312, "epoch": 1329} {"train_loss": -9.892156600952148, "global_step": 223313, "epoch": 1329} {"train_loss": -9.887643814086914, "global_step": 223314, "epoch": 1329} {"train_loss": -10.626907348632812, "global_step": 223315, "epoch": 1329} {"train_loss": -10.126697540283203, "global_step": 223316, "epoch": 1329} {"train_loss": -10.101426124572754, "global_step": 223317, "epoch": 1329} {"train_loss": -10.39050579071045, "global_step": 223318, "epoch": 1329} {"train_loss": -10.538564682006836, "global_step": 223319, "epoch": 1329} {"train_loss": -9.237541198730469, "global_step": 223320, "epoch": 1329} {"train_loss": -10.235574722290039, "global_step": 223321, "epoch": 1329} {"train_loss": -10.37153434753418, "global_step": 223322, "epoch": 1329} {"train_loss": -10.10440444946289, "global_step": 223323, "epoch": 1329} {"train_loss": -10.657746315002441, "global_step": 223324, "epoch": 1329} {"train_loss": -10.631223678588867, "global_step": 223325, "epoch": 1329} {"train_loss": -11.111900329589844, "global_step": 223326, "epoch": 1329} {"train_loss": -10.51354694366455, "global_step": 223327, "epoch": 1329} {"train_loss": -11.318587303161621, "global_step": 223328, "epoch": 1329} {"train_loss": -10.919475555419922, "global_step": 223329, "epoch": 1329} {"train_loss": -10.165544509887695, "global_step": 223330, "epoch": 1329} {"train_loss": -11.29008960723877, "global_step": 223331, "epoch": 1329} {"train_loss": -10.682699203491211, "global_step": 223332, "epoch": 1329} {"train_loss": -11.113794326782227, "global_step": 223333, "epoch": 1329} {"train_loss": -11.176443099975586, "global_step": 223334, "epoch": 1329} {"train_loss": -11.0343599319458, "global_step": 223335, "epoch": 1329} {"train_loss": -10.913524627685547, "global_step": 223336, "epoch": 1329} {"train_loss": -11.25525951385498, "global_step": 223337, "epoch": 1329} {"train_loss": -10.892312049865723, "global_step": 223338, "epoch": 1329} {"train_loss": -11.191876411437988, "global_step": 223339, "epoch": 1329} {"train_loss": -11.478771209716797, "global_step": 223340, "epoch": 1329} {"train_loss": -11.207540512084961, "global_step": 223341, "epoch": 1329} {"train_loss": -11.228403091430664, "global_step": 223342, "epoch": 1329} {"train_loss": -11.319005012512207, "global_step": 223343, "epoch": 1329} {"train_loss": -11.056721687316895, "global_step": 223344, "epoch": 1329} {"train_loss": -11.191991806030273, "global_step": 223345, "epoch": 1329} {"train_loss": -11.401100158691406, "global_step": 223346, "epoch": 1329} {"train_loss": -11.443470001220703, "global_step": 223347, "epoch": 1329} {"train_loss": -11.315535545349121, "global_step": 223348, "epoch": 1329} {"train_loss": -11.373669624328613, "global_step": 223349, "epoch": 1329} {"train_loss": -11.57589054107666, "global_step": 223350, "epoch": 1329} {"train_loss": -11.43160629272461, "global_step": 223351, "epoch": 1329} {"train_loss": -11.177482604980469, "global_step": 223352, "epoch": 1329} {"train_loss": -11.45840072631836, "global_step": 223353, "epoch": 1329} {"train_loss": -11.551198959350586, "global_step": 223354, "epoch": 1329} {"train_loss": -11.711605072021484, "global_step": 223355, "epoch": 1329} {"train_loss": -11.567790985107422, "global_step": 223356, "epoch": 1329} {"train_loss": -11.595579147338867, "global_step": 223357, "epoch": 1329} {"train_loss": -11.565597534179688, "global_step": 223358, "epoch": 1329} {"train_loss": -11.628591537475586, "global_step": 223359, "epoch": 1329} {"train_loss": -11.332221031188965, "global_step": 223360, "epoch": 1329} {"train_loss": -11.783140182495117, "global_step": 223361, "epoch": 1329} {"train_loss": -11.571584701538086, "global_step": 223362, "epoch": 1329} {"train_loss": -11.46697998046875, "global_step": 223363, "epoch": 1329} {"train_loss": -11.471181869506836, "global_step": 223364, "epoch": 1329} {"train_loss": -11.56794548034668, "global_step": 223365, "epoch": 1329} {"train_loss": -11.72414779663086, "global_step": 223366, "epoch": 1329} {"train_loss": -11.797286033630371, "global_step": 223367, "epoch": 1329} {"train_loss": -11.37894058227539, "global_step": 223368, "epoch": 1329} {"train_loss": -11.607691764831543, "global_step": 223369, "epoch": 1329} {"train_loss": -11.774782180786133, "global_step": 223370, "epoch": 1329} {"train_loss": -11.765525817871094, "global_step": 223371, "epoch": 1329} {"train_loss": -11.541548728942871, "global_step": 223372, "epoch": 1329} {"train_loss": -11.796297073364258, "global_step": 223373, "epoch": 1329} {"train_loss": -11.787420272827148, "global_step": 223374, "epoch": 1329} {"train_loss": -11.868038177490234, "global_step": 223375, "epoch": 1329} {"train_loss": -11.683380126953125, "global_step": 223376, "epoch": 1329} {"train_loss": -11.917184829711914, "global_step": 223377, "epoch": 1329} {"train_loss": -11.915485382080078, "global_step": 223378, "epoch": 1329} {"train_loss": -11.84500503540039, "global_step": 223379, "epoch": 1329} {"train_loss": -11.658421516418457, "global_step": 223380, "epoch": 1329} {"train_loss": -11.74261474609375, "global_step": 223381, "epoch": 1329} {"train_loss": -12.05681324005127, "global_step": 223382, "epoch": 1329} {"train_loss": -11.891210556030273, "global_step": 223383, "epoch": 1329} {"train_loss": -11.831731796264648, "global_step": 223384, "epoch": 1329} {"train_loss": -12.027973175048828, "global_step": 223385, "epoch": 1329} {"train_loss": -11.796211242675781, "global_step": 223386, "epoch": 1329} {"train_loss": -11.997444152832031, "global_step": 223387, "epoch": 1329} {"train_loss": -12.064596176147461, "global_step": 223388, "epoch": 1329} {"train_loss": -11.860252380371094, "global_step": 223389, "epoch": 1329} {"train_loss": -11.973124504089355, "global_step": 223390, "epoch": 1329} {"train_loss": -11.95290756225586, "global_step": 223391, "epoch": 1329} {"train_loss": -11.893486976623535, "global_step": 223392, "epoch": 1329} {"train_loss": -11.989167213439941, "global_step": 223393, "epoch": 1329} {"train_loss": -11.788609504699707, "global_step": 223394, "epoch": 1329} {"train_loss": -11.808635711669922, "global_step": 223395, "epoch": 1329} {"train_loss": -11.88473129272461, "global_step": 223396, "epoch": 1329} {"train_loss": -11.705353736877441, "global_step": 223397, "epoch": 1329} {"train_loss": -11.931573867797852, "global_step": 223398, "epoch": 1329} {"train_loss": -11.406791687011719, "global_step": 223399, "epoch": 1329} {"train_loss": -11.419754028320312, "global_step": 223400, "epoch": 1329} {"train_loss": -11.437734603881836, "global_step": 223401, "epoch": 1329} {"train_loss": -11.082460403442383, "global_step": 223402, "epoch": 1329} {"train_loss": -11.819321632385254, "global_step": 223403, "epoch": 1329} {"train_loss": -11.625941276550293, "global_step": 223404, "epoch": 1329} {"train_loss": -10.703653335571289, "global_step": 223405, "epoch": 1329} {"train_loss": -8.934650421142578, "global_step": 223406, "epoch": 1329} {"train_loss": -10.69015884399414, "global_step": 223407, "epoch": 1329} {"train_loss": -6.995487689971924, "global_step": 223408, "epoch": 1329} {"train_loss": -8.264760971069336, "global_step": 223409, "epoch": 1329} {"train_loss": -7.732226371765137, "global_step": 223410, "epoch": 1329} {"train_loss": -9.687323570251465, "global_step": 223411, "epoch": 1329} {"train_loss": -6.735396862030029, "global_step": 223412, "epoch": 1329} {"train_loss": -8.40516471862793, "global_step": 223413, "epoch": 1329} {"train_loss": -9.035240173339844, "global_step": 223414, "epoch": 1329} {"train_loss": -10.216019630432129, "global_step": 223415, "epoch": 1329} {"train_loss": -8.59621524810791, "global_step": 223416, "epoch": 1329} {"train_loss": -8.809127807617188, "global_step": 223417, "epoch": 1329} {"train_loss": -9.535577774047852, "global_step": 223418, "epoch": 1329} {"train_loss": -7.546210289001465, "global_step": 223419, "epoch": 1329} {"train_loss": -8.737701416015625, "global_step": 223420, "epoch": 1329} {"train_loss": -8.949894905090332, "global_step": 223421, "epoch": 1329} {"train_loss": -8.739972114562988, "global_step": 223422, "epoch": 1329} {"train_loss": -8.323409080505371, "global_step": 223423, "epoch": 1329} {"train_loss": -8.376755714416504, "global_step": 223424, "epoch": 1329} {"train_loss": -10.630044937133789, "global_step": 223425, "epoch": 1329} {"train_loss": -8.600151062011719, "global_step": 223426, "epoch": 1329} {"train_loss": -9.603399276733398, "global_step": 223427, "epoch": 1329} {"train_loss": -9.495473861694336, "global_step": 223428, "epoch": 1329} {"train_loss": -9.482545852661133, "global_step": 223429, "epoch": 1329} {"train_loss": -10.780296325683594, "global_step": 223430, "epoch": 1329} {"train_loss": -9.436083793640137, "global_step": 223431, "epoch": 1329} {"train_loss": -10.369335174560547, "global_step": 223432, "epoch": 1329} {"train_loss": -10.906787872314453, "global_step": 223433, "epoch": 1329} {"train_loss": -10.323668479919434, "global_step": 223434, "epoch": 1329} {"train_loss": -10.417101860046387, "global_step": 223435, "epoch": 1329} {"train_loss": -10.801216125488281, "global_step": 223436, "epoch": 1329} {"train_loss": -10.498334884643555, "global_step": 223437, "epoch": 1329} {"train_loss": -10.654684066772461, "global_step": 223438, "epoch": 1329} {"train_loss": -10.79261707124256, "global_step": 223439, "epoch": 1329, "val_loss": 247952.421875} {"train_loss": -10.811128616333008, "global_step": 223440, "epoch": 1330} {"train_loss": -10.955320358276367, "global_step": 223441, "epoch": 1330} {"train_loss": -10.981327056884766, "global_step": 223442, "epoch": 1330} {"train_loss": -10.945512771606445, "global_step": 223443, "epoch": 1330} {"train_loss": -11.147236824035645, "global_step": 223444, "epoch": 1330} {"train_loss": -11.069870948791504, "global_step": 223445, "epoch": 1330} {"train_loss": -11.022472381591797, "global_step": 223446, "epoch": 1330} {"train_loss": -11.192548751831055, "global_step": 223447, "epoch": 1330} {"train_loss": -11.087244987487793, "global_step": 223448, "epoch": 1330} {"train_loss": -10.961021423339844, "global_step": 223449, "epoch": 1330} {"train_loss": -11.377674102783203, "global_step": 223450, "epoch": 1330} {"train_loss": -11.154356956481934, "global_step": 223451, "epoch": 1330} {"train_loss": -11.293294906616211, "global_step": 223452, "epoch": 1330} {"train_loss": -11.089542388916016, "global_step": 223453, "epoch": 1330} {"train_loss": -11.324533462524414, "global_step": 223454, "epoch": 1330} {"train_loss": -11.197330474853516, "global_step": 223455, "epoch": 1330} {"train_loss": -11.105555534362793, "global_step": 223456, "epoch": 1330} {"train_loss": -11.192808151245117, "global_step": 223457, "epoch": 1330} {"train_loss": -11.330674171447754, "global_step": 223458, "epoch": 1330} {"train_loss": -11.168119430541992, "global_step": 223459, "epoch": 1330} {"train_loss": -11.222965240478516, "global_step": 223460, "epoch": 1330} {"train_loss": -11.054698944091797, "global_step": 223461, "epoch": 1330} {"train_loss": -11.427814483642578, "global_step": 223462, "epoch": 1330} {"train_loss": -11.492090225219727, "global_step": 223463, "epoch": 1330} {"train_loss": -11.342059135437012, "global_step": 223464, "epoch": 1330} {"train_loss": -11.480958938598633, "global_step": 223465, "epoch": 1330} {"train_loss": -11.29683780670166, "global_step": 223466, "epoch": 1330} {"train_loss": -11.575338363647461, "global_step": 223467, "epoch": 1330} {"train_loss": -11.458088874816895, "global_step": 223468, "epoch": 1330} {"train_loss": -11.380777359008789, "global_step": 223469, "epoch": 1330} {"train_loss": -11.467348098754883, "global_step": 223470, "epoch": 1330} {"train_loss": -11.492592811584473, "global_step": 223471, "epoch": 1330} {"train_loss": -11.52988052368164, "global_step": 223472, "epoch": 1330} {"train_loss": -11.355589866638184, "global_step": 223473, "epoch": 1330} {"train_loss": -11.570453643798828, "global_step": 223474, "epoch": 1330} {"train_loss": -11.571826934814453, "global_step": 223475, "epoch": 1330} {"train_loss": -11.64610481262207, "global_step": 223476, "epoch": 1330} {"train_loss": -11.614607810974121, "global_step": 223477, "epoch": 1330} {"train_loss": -11.33169937133789, "global_step": 223478, "epoch": 1330} {"train_loss": -11.72708511352539, "global_step": 223479, "epoch": 1330} {"train_loss": -11.547796249389648, "global_step": 223480, "epoch": 1330} {"train_loss": -11.553001403808594, "global_step": 223481, "epoch": 1330} {"train_loss": -11.758993148803711, "global_step": 223482, "epoch": 1330} {"train_loss": -11.54023551940918, "global_step": 223483, "epoch": 1330} {"train_loss": -11.59054946899414, "global_step": 223484, "epoch": 1330} {"train_loss": -11.62877082824707, "global_step": 223485, "epoch": 1330} {"train_loss": -11.573686599731445, "global_step": 223486, "epoch": 1330} {"train_loss": -11.709219932556152, "global_step": 223487, "epoch": 1330} {"train_loss": -11.369176864624023, "global_step": 223488, "epoch": 1330} {"train_loss": -11.682476997375488, "global_step": 223489, "epoch": 1330} {"train_loss": -11.763404846191406, "global_step": 223490, "epoch": 1330} {"train_loss": -11.52613639831543, "global_step": 223491, "epoch": 1330} {"train_loss": -11.582964897155762, "global_step": 223492, "epoch": 1330} {"train_loss": -11.652198791503906, "global_step": 223493, "epoch": 1330} {"train_loss": -11.367508888244629, "global_step": 223494, "epoch": 1330} {"train_loss": -11.494012832641602, "global_step": 223495, "epoch": 1330} {"train_loss": -11.460306167602539, "global_step": 223496, "epoch": 1330} {"train_loss": -11.670902252197266, "global_step": 223497, "epoch": 1330} {"train_loss": -11.368799209594727, "global_step": 223498, "epoch": 1330} {"train_loss": -11.58564281463623, "global_step": 223499, "epoch": 1330} {"train_loss": -11.612188339233398, "global_step": 223500, "epoch": 1330} {"train_loss": -11.649310111999512, "global_step": 223501, "epoch": 1330} {"train_loss": -11.46019172668457, "global_step": 223502, "epoch": 1330} {"train_loss": -11.565093994140625, "global_step": 223503, "epoch": 1330} {"train_loss": -11.645106315612793, "global_step": 223504, "epoch": 1330} {"train_loss": -11.64044189453125, "global_step": 223505, "epoch": 1330} {"train_loss": -11.559467315673828, "global_step": 223506, "epoch": 1330} {"train_loss": -11.698247909545898, "global_step": 223507, "epoch": 1330} {"train_loss": -11.700908660888672, "global_step": 223508, "epoch": 1330} {"train_loss": -11.664913177490234, "global_step": 223509, "epoch": 1330} {"train_loss": -11.543216705322266, "global_step": 223510, "epoch": 1330} {"train_loss": -11.331658363342285, "global_step": 223511, "epoch": 1330} {"train_loss": -11.348541259765625, "global_step": 223512, "epoch": 1330} {"train_loss": -11.702360153198242, "global_step": 223513, "epoch": 1330} {"train_loss": -11.537120819091797, "global_step": 223514, "epoch": 1330} {"train_loss": -11.75208568572998, "global_step": 223515, "epoch": 1330} {"train_loss": -11.563077926635742, "global_step": 223516, "epoch": 1330} {"train_loss": -11.874946594238281, "global_step": 223517, "epoch": 1330} {"train_loss": -11.61953067779541, "global_step": 223518, "epoch": 1330} {"train_loss": -11.484768867492676, "global_step": 223519, "epoch": 1330} {"train_loss": -11.476354598999023, "global_step": 223520, "epoch": 1330} {"train_loss": -11.595648765563965, "global_step": 223521, "epoch": 1330} {"train_loss": -11.112268447875977, "global_step": 223522, "epoch": 1330} {"train_loss": -11.940275192260742, "global_step": 223523, "epoch": 1330} {"train_loss": -11.270566940307617, "global_step": 223524, "epoch": 1330} {"train_loss": -11.412149429321289, "global_step": 223525, "epoch": 1330} {"train_loss": -11.788797378540039, "global_step": 223526, "epoch": 1330} {"train_loss": -11.393478393554688, "global_step": 223527, "epoch": 1330} {"train_loss": -11.746938705444336, "global_step": 223528, "epoch": 1330} {"train_loss": -11.50826358795166, "global_step": 223529, "epoch": 1330} {"train_loss": -11.546414375305176, "global_step": 223530, "epoch": 1330} {"train_loss": -11.871850967407227, "global_step": 223531, "epoch": 1330} {"train_loss": -11.444759368896484, "global_step": 223532, "epoch": 1330} {"train_loss": -11.643604278564453, "global_step": 223533, "epoch": 1330} {"train_loss": -11.981578826904297, "global_step": 223534, "epoch": 1330} {"train_loss": -11.69715690612793, "global_step": 223535, "epoch": 1330} {"train_loss": -11.631631851196289, "global_step": 223536, "epoch": 1330} {"train_loss": -11.760393142700195, "global_step": 223537, "epoch": 1330} {"train_loss": -11.689697265625, "global_step": 223538, "epoch": 1330} {"train_loss": -11.97601318359375, "global_step": 223539, "epoch": 1330} {"train_loss": -11.797011375427246, "global_step": 223540, "epoch": 1330} {"train_loss": -11.823819160461426, "global_step": 223541, "epoch": 1330} {"train_loss": -12.088194847106934, "global_step": 223542, "epoch": 1330} {"train_loss": -11.693610191345215, "global_step": 223543, "epoch": 1330} {"train_loss": -11.769720077514648, "global_step": 223544, "epoch": 1330} {"train_loss": -11.813880920410156, "global_step": 223545, "epoch": 1330} {"train_loss": -11.608102798461914, "global_step": 223546, "epoch": 1330} {"train_loss": -11.869819641113281, "global_step": 223547, "epoch": 1330} {"train_loss": -11.918961524963379, "global_step": 223548, "epoch": 1330} {"train_loss": -11.965538024902344, "global_step": 223549, "epoch": 1330} {"train_loss": -11.641090393066406, "global_step": 223550, "epoch": 1330} {"train_loss": -11.748323440551758, "global_step": 223551, "epoch": 1330} {"train_loss": -11.868894577026367, "global_step": 223552, "epoch": 1330} {"train_loss": -12.041166305541992, "global_step": 223553, "epoch": 1330} {"train_loss": -12.008713722229004, "global_step": 223554, "epoch": 1330} {"train_loss": -11.804657936096191, "global_step": 223555, "epoch": 1330} {"train_loss": -11.749102592468262, "global_step": 223556, "epoch": 1330} {"train_loss": -11.741016387939453, "global_step": 223557, "epoch": 1330} {"train_loss": -11.633146286010742, "global_step": 223558, "epoch": 1330} {"train_loss": -11.988704681396484, "global_step": 223559, "epoch": 1330} {"train_loss": -11.18242073059082, "global_step": 223560, "epoch": 1330} {"train_loss": -11.48989200592041, "global_step": 223561, "epoch": 1330} {"train_loss": -11.4935884475708, "global_step": 223562, "epoch": 1330} {"train_loss": -10.930755615234375, "global_step": 223563, "epoch": 1330} {"train_loss": -11.392285346984863, "global_step": 223564, "epoch": 1330} {"train_loss": -11.8623628616333, "global_step": 223565, "epoch": 1330} {"train_loss": -11.099660873413086, "global_step": 223566, "epoch": 1330} {"train_loss": -11.765409469604492, "global_step": 223567, "epoch": 1330} {"train_loss": -11.46561050415039, "global_step": 223568, "epoch": 1330} {"train_loss": -11.940092086791992, "global_step": 223569, "epoch": 1330} {"train_loss": -11.144472122192383, "global_step": 223570, "epoch": 1330} {"train_loss": -11.78671646118164, "global_step": 223571, "epoch": 1330} {"train_loss": -11.511433601379395, "global_step": 223572, "epoch": 1330} {"train_loss": -11.916364669799805, "global_step": 223573, "epoch": 1330} {"train_loss": -11.499563217163086, "global_step": 223574, "epoch": 1330} {"train_loss": -11.67156982421875, "global_step": 223575, "epoch": 1330} {"train_loss": -11.400808334350586, "global_step": 223576, "epoch": 1330} {"train_loss": -11.093900680541992, "global_step": 223577, "epoch": 1330} {"train_loss": -10.996173858642578, "global_step": 223578, "epoch": 1330} {"train_loss": -11.981657981872559, "global_step": 223579, "epoch": 1330} {"train_loss": -10.942455291748047, "global_step": 223580, "epoch": 1330} {"train_loss": -10.85927963256836, "global_step": 223581, "epoch": 1330} {"train_loss": -11.46499252319336, "global_step": 223582, "epoch": 1330} {"train_loss": -11.63321304321289, "global_step": 223583, "epoch": 1330} {"train_loss": -11.204373359680176, "global_step": 223584, "epoch": 1330} {"train_loss": -11.649626731872559, "global_step": 223585, "epoch": 1330} {"train_loss": -11.263996124267578, "global_step": 223586, "epoch": 1330} {"train_loss": -11.825700759887695, "global_step": 223587, "epoch": 1330} {"train_loss": -11.136882781982422, "global_step": 223588, "epoch": 1330} {"train_loss": -11.26533031463623, "global_step": 223589, "epoch": 1330} {"train_loss": -11.589426040649414, "global_step": 223590, "epoch": 1330} {"train_loss": -11.369144439697266, "global_step": 223591, "epoch": 1330} {"train_loss": -11.41633415222168, "global_step": 223592, "epoch": 1330} {"train_loss": -11.683298110961914, "global_step": 223593, "epoch": 1330} {"train_loss": -11.69723129272461, "global_step": 223594, "epoch": 1330} {"train_loss": -11.770179748535156, "global_step": 223595, "epoch": 1330} {"train_loss": -11.465085983276367, "global_step": 223596, "epoch": 1330} {"train_loss": -11.600000381469727, "global_step": 223597, "epoch": 1330} {"train_loss": -11.43941593170166, "global_step": 223598, "epoch": 1330} {"train_loss": -11.391704559326172, "global_step": 223599, "epoch": 1330} {"train_loss": -11.676299095153809, "global_step": 223600, "epoch": 1330} {"train_loss": -11.626220703125, "global_step": 223601, "epoch": 1330} {"train_loss": -11.584571838378906, "global_step": 223602, "epoch": 1330} {"train_loss": -11.90005111694336, "global_step": 223603, "epoch": 1330} {"train_loss": -11.706427574157715, "global_step": 223604, "epoch": 1330} {"train_loss": -11.630208015441895, "global_step": 223605, "epoch": 1330} {"train_loss": -11.750575065612793, "global_step": 223606, "epoch": 1330} {"train_loss": -11.520612921033587, "global_step": 223607, "epoch": 1330, "val_loss": 254458.5625, "train_action_mse_error": 5.237478256225586} {"train_loss": -10.693184852600098, "global_step": 223608, "epoch": 1331} {"train_loss": -11.84014892578125, "global_step": 223609, "epoch": 1331} {"train_loss": -10.730825424194336, "global_step": 223610, "epoch": 1331} {"train_loss": -11.234046936035156, "global_step": 223611, "epoch": 1331} {"train_loss": -11.641660690307617, "global_step": 223612, "epoch": 1331} {"train_loss": -10.767610549926758, "global_step": 223613, "epoch": 1331} {"train_loss": -11.78891372680664, "global_step": 223614, "epoch": 1331} {"train_loss": -11.454010963439941, "global_step": 223615, "epoch": 1331} {"train_loss": -11.267135620117188, "global_step": 223616, "epoch": 1331} {"train_loss": -11.909674644470215, "global_step": 223617, "epoch": 1331} {"train_loss": -11.353391647338867, "global_step": 223618, "epoch": 1331} {"train_loss": -11.483686447143555, "global_step": 223619, "epoch": 1331} {"train_loss": -11.656322479248047, "global_step": 223620, "epoch": 1331} {"train_loss": -10.76278305053711, "global_step": 223621, "epoch": 1331} {"train_loss": -11.887969970703125, "global_step": 223622, "epoch": 1331} {"train_loss": -10.905078887939453, "global_step": 223623, "epoch": 1331} {"train_loss": -10.850914001464844, "global_step": 223624, "epoch": 1331} {"train_loss": -11.410222053527832, "global_step": 223625, "epoch": 1331} {"train_loss": -10.185940742492676, "global_step": 223626, "epoch": 1331} {"train_loss": -11.719436645507812, "global_step": 223627, "epoch": 1331} {"train_loss": -11.28404712677002, "global_step": 223628, "epoch": 1331} {"train_loss": -10.720882415771484, "global_step": 223629, "epoch": 1331} {"train_loss": -11.344072341918945, "global_step": 223630, "epoch": 1331} {"train_loss": -10.581506729125977, "global_step": 223631, "epoch": 1331} {"train_loss": -11.458648681640625, "global_step": 223632, "epoch": 1331} {"train_loss": -9.795862197875977, "global_step": 223633, "epoch": 1331} {"train_loss": -11.68954086303711, "global_step": 223634, "epoch": 1331} {"train_loss": -9.965280532836914, "global_step": 223635, "epoch": 1331} {"train_loss": -10.805630683898926, "global_step": 223636, "epoch": 1331} {"train_loss": -11.296610832214355, "global_step": 223637, "epoch": 1331} {"train_loss": -10.897699356079102, "global_step": 223638, "epoch": 1331} {"train_loss": -11.011444091796875, "global_step": 223639, "epoch": 1331} {"train_loss": -10.937047958374023, "global_step": 223640, "epoch": 1331} {"train_loss": -11.043872833251953, "global_step": 223641, "epoch": 1331} {"train_loss": -10.979679107666016, "global_step": 223642, "epoch": 1331} {"train_loss": -11.175138473510742, "global_step": 223643, "epoch": 1331} {"train_loss": -10.961481094360352, "global_step": 223644, "epoch": 1331} {"train_loss": -11.185300827026367, "global_step": 223645, "epoch": 1331} {"train_loss": -10.869169235229492, "global_step": 223646, "epoch": 1331} {"train_loss": -11.06778621673584, "global_step": 223647, "epoch": 1331} {"train_loss": -11.004878997802734, "global_step": 223648, "epoch": 1331} {"train_loss": -11.224681854248047, "global_step": 223649, "epoch": 1331} {"train_loss": -11.576104164123535, "global_step": 223650, "epoch": 1331} {"train_loss": -10.874393463134766, "global_step": 223651, "epoch": 1331} {"train_loss": -11.505406379699707, "global_step": 223652, "epoch": 1331} {"train_loss": -10.949116706848145, "global_step": 223653, "epoch": 1331} {"train_loss": -11.456819534301758, "global_step": 223654, "epoch": 1331} {"train_loss": -10.907943725585938, "global_step": 223655, "epoch": 1331} {"train_loss": -11.105666160583496, "global_step": 223656, "epoch": 1331} {"train_loss": -11.173948287963867, "global_step": 223657, "epoch": 1331} {"train_loss": -11.546945571899414, "global_step": 223658, "epoch": 1331} {"train_loss": -10.998766899108887, "global_step": 223659, "epoch": 1331} {"train_loss": -11.560541152954102, "global_step": 223660, "epoch": 1331} {"train_loss": -11.281478881835938, "global_step": 223661, "epoch": 1331} {"train_loss": -11.30749225616455, "global_step": 223662, "epoch": 1331} {"train_loss": -11.184257507324219, "global_step": 223663, "epoch": 1331} {"train_loss": -11.586895942687988, "global_step": 223664, "epoch": 1331} {"train_loss": -11.052103042602539, "global_step": 223665, "epoch": 1331} {"train_loss": -11.584012031555176, "global_step": 223666, "epoch": 1331} {"train_loss": -11.405153274536133, "global_step": 223667, "epoch": 1331} {"train_loss": -11.302005767822266, "global_step": 223668, "epoch": 1331} {"train_loss": -11.303033828735352, "global_step": 223669, "epoch": 1331} {"train_loss": -11.778360366821289, "global_step": 223670, "epoch": 1331} {"train_loss": -11.22482681274414, "global_step": 223671, "epoch": 1331} {"train_loss": -11.560462951660156, "global_step": 223672, "epoch": 1331} {"train_loss": -11.349834442138672, "global_step": 223673, "epoch": 1331} {"train_loss": -11.600957870483398, "global_step": 223674, "epoch": 1331} {"train_loss": -11.475312232971191, "global_step": 223675, "epoch": 1331} {"train_loss": -11.70529556274414, "global_step": 223676, "epoch": 1331} {"train_loss": -11.433365821838379, "global_step": 223677, "epoch": 1331} {"train_loss": -11.803770065307617, "global_step": 223678, "epoch": 1331} {"train_loss": -11.6798677444458, "global_step": 223679, "epoch": 1331} {"train_loss": -11.763898849487305, "global_step": 223680, "epoch": 1331} {"train_loss": -11.708147048950195, "global_step": 223681, "epoch": 1331} {"train_loss": -11.618755340576172, "global_step": 223682, "epoch": 1331} {"train_loss": -11.66622543334961, "global_step": 223683, "epoch": 1331} {"train_loss": -11.749536514282227, "global_step": 223684, "epoch": 1331} {"train_loss": -11.705156326293945, "global_step": 223685, "epoch": 1331} {"train_loss": -11.815126419067383, "global_step": 223686, "epoch": 1331} {"train_loss": -11.801456451416016, "global_step": 223687, "epoch": 1331} {"train_loss": -11.81224536895752, "global_step": 223688, "epoch": 1331} {"train_loss": -11.797306060791016, "global_step": 223689, "epoch": 1331} {"train_loss": -11.671524047851562, "global_step": 223690, "epoch": 1331} {"train_loss": -11.84587287902832, "global_step": 223691, "epoch": 1331} {"train_loss": -11.91236686706543, "global_step": 223692, "epoch": 1331} {"train_loss": -11.554386138916016, "global_step": 223693, "epoch": 1331} {"train_loss": -11.866159439086914, "global_step": 223694, "epoch": 1331} {"train_loss": -11.801973342895508, "global_step": 223695, "epoch": 1331} {"train_loss": -12.094402313232422, "global_step": 223696, "epoch": 1331} {"train_loss": -11.866556167602539, "global_step": 223697, "epoch": 1331} {"train_loss": -11.825723648071289, "global_step": 223698, "epoch": 1331} {"train_loss": -11.863749504089355, "global_step": 223699, "epoch": 1331} {"train_loss": -11.75200080871582, "global_step": 223700, "epoch": 1331} {"train_loss": -11.892375946044922, "global_step": 223701, "epoch": 1331} {"train_loss": -11.913142204284668, "global_step": 223702, "epoch": 1331} {"train_loss": -11.95423698425293, "global_step": 223703, "epoch": 1331} {"train_loss": -11.76318359375, "global_step": 223704, "epoch": 1331} {"train_loss": -11.579083442687988, "global_step": 223705, "epoch": 1331} {"train_loss": -11.759114265441895, "global_step": 223706, "epoch": 1331} {"train_loss": -11.59615421295166, "global_step": 223707, "epoch": 1331} {"train_loss": -11.796648979187012, "global_step": 223708, "epoch": 1331} {"train_loss": -11.849189758300781, "global_step": 223709, "epoch": 1331} {"train_loss": -12.08167839050293, "global_step": 223710, "epoch": 1331} {"train_loss": -11.935850143432617, "global_step": 223711, "epoch": 1331} {"train_loss": -12.121862411499023, "global_step": 223712, "epoch": 1331} {"train_loss": -11.95541763305664, "global_step": 223713, "epoch": 1331} {"train_loss": -11.775711059570312, "global_step": 223714, "epoch": 1331} {"train_loss": -11.638303756713867, "global_step": 223715, "epoch": 1331} {"train_loss": -11.64371395111084, "global_step": 223716, "epoch": 1331} {"train_loss": -11.44149398803711, "global_step": 223717, "epoch": 1331} {"train_loss": -11.084224700927734, "global_step": 223718, "epoch": 1331} {"train_loss": -11.560970306396484, "global_step": 223719, "epoch": 1331} {"train_loss": -11.689750671386719, "global_step": 223720, "epoch": 1331} {"train_loss": -11.136558532714844, "global_step": 223721, "epoch": 1331} {"train_loss": -11.288654327392578, "global_step": 223722, "epoch": 1331} {"train_loss": -11.492450714111328, "global_step": 223723, "epoch": 1331} {"train_loss": -11.409516334533691, "global_step": 223724, "epoch": 1331} {"train_loss": -11.000969886779785, "global_step": 223725, "epoch": 1331} {"train_loss": -10.721702575683594, "global_step": 223726, "epoch": 1331} {"train_loss": -11.91236686706543, "global_step": 223727, "epoch": 1331} {"train_loss": -10.54102897644043, "global_step": 223728, "epoch": 1331} {"train_loss": -11.04840087890625, "global_step": 223729, "epoch": 1331} {"train_loss": -10.729412078857422, "global_step": 223730, "epoch": 1331} {"train_loss": -11.370607376098633, "global_step": 223731, "epoch": 1331} {"train_loss": -11.171760559082031, "global_step": 223732, "epoch": 1331} {"train_loss": -11.538599967956543, "global_step": 223733, "epoch": 1331} {"train_loss": -11.653108596801758, "global_step": 223734, "epoch": 1331} {"train_loss": -10.882336616516113, "global_step": 223735, "epoch": 1331} {"train_loss": -11.202049255371094, "global_step": 223736, "epoch": 1331} {"train_loss": -11.125846862792969, "global_step": 223737, "epoch": 1331} {"train_loss": -11.532549858093262, "global_step": 223738, "epoch": 1331} {"train_loss": -10.582392692565918, "global_step": 223739, "epoch": 1331} {"train_loss": -11.487524032592773, "global_step": 223740, "epoch": 1331} {"train_loss": -11.38996696472168, "global_step": 223741, "epoch": 1331} {"train_loss": -11.26533317565918, "global_step": 223742, "epoch": 1331} {"train_loss": -11.27506160736084, "global_step": 223743, "epoch": 1331} {"train_loss": -11.333881378173828, "global_step": 223744, "epoch": 1331} {"train_loss": -11.163724899291992, "global_step": 223745, "epoch": 1331} {"train_loss": -11.303211212158203, "global_step": 223746, "epoch": 1331} {"train_loss": -11.068792343139648, "global_step": 223747, "epoch": 1331} {"train_loss": -11.348143577575684, "global_step": 223748, "epoch": 1331} {"train_loss": -11.732810974121094, "global_step": 223749, "epoch": 1331} {"train_loss": -11.327892303466797, "global_step": 223750, "epoch": 1331} {"train_loss": -11.699883460998535, "global_step": 223751, "epoch": 1331} {"train_loss": -11.367504119873047, "global_step": 223752, "epoch": 1331} {"train_loss": -11.720541000366211, "global_step": 223753, "epoch": 1331} {"train_loss": -11.666028022766113, "global_step": 223754, "epoch": 1331} {"train_loss": -11.653822898864746, "global_step": 223755, "epoch": 1331} {"train_loss": -11.44898796081543, "global_step": 223756, "epoch": 1331} {"train_loss": -11.488237380981445, "global_step": 223757, "epoch": 1331} {"train_loss": -11.766739845275879, "global_step": 223758, "epoch": 1331} {"train_loss": -11.673189163208008, "global_step": 223759, "epoch": 1331} {"train_loss": -11.51736068725586, "global_step": 223760, "epoch": 1331} {"train_loss": -11.334686279296875, "global_step": 223761, "epoch": 1331} {"train_loss": -11.483538627624512, "global_step": 223762, "epoch": 1331} {"train_loss": -11.497593879699707, "global_step": 223763, "epoch": 1331} {"train_loss": -11.403928756713867, "global_step": 223764, "epoch": 1331} {"train_loss": -11.893686294555664, "global_step": 223765, "epoch": 1331} {"train_loss": -11.299007415771484, "global_step": 223766, "epoch": 1331} {"train_loss": -11.003602981567383, "global_step": 223767, "epoch": 1331} {"train_loss": -11.599205017089844, "global_step": 223768, "epoch": 1331} {"train_loss": -11.57565975189209, "global_step": 223769, "epoch": 1331} {"train_loss": -10.73482894897461, "global_step": 223770, "epoch": 1331} {"train_loss": -11.307327270507812, "global_step": 223771, "epoch": 1331} {"train_loss": -11.253379821777344, "global_step": 223772, "epoch": 1331} {"train_loss": -10.992246627807617, "global_step": 223773, "epoch": 1331} {"train_loss": -11.300278663635254, "global_step": 223774, "epoch": 1331} {"train_loss": -11.394094126565117, "global_step": 223775, "epoch": 1331, "val_loss": 256185.484375} {"train_loss": -11.129860877990723, "global_step": 223776, "epoch": 1332} {"train_loss": -11.469337463378906, "global_step": 223777, "epoch": 1332} {"train_loss": -11.90887451171875, "global_step": 223778, "epoch": 1332} {"train_loss": -11.441131591796875, "global_step": 223779, "epoch": 1332} {"train_loss": -11.91763687133789, "global_step": 223780, "epoch": 1332} {"train_loss": -11.396005630493164, "global_step": 223781, "epoch": 1332} {"train_loss": -11.385980606079102, "global_step": 223782, "epoch": 1332} {"train_loss": -11.400444030761719, "global_step": 223783, "epoch": 1332} {"train_loss": -11.597075462341309, "global_step": 223784, "epoch": 1332} {"train_loss": -11.617575645446777, "global_step": 223785, "epoch": 1332} {"train_loss": -11.415634155273438, "global_step": 223786, "epoch": 1332} {"train_loss": -11.912489891052246, "global_step": 223787, "epoch": 1332} {"train_loss": -11.427160263061523, "global_step": 223788, "epoch": 1332} {"train_loss": -11.745705604553223, "global_step": 223789, "epoch": 1332} {"train_loss": -11.39068603515625, "global_step": 223790, "epoch": 1332} {"train_loss": -11.78365421295166, "global_step": 223791, "epoch": 1332} {"train_loss": -11.789941787719727, "global_step": 223792, "epoch": 1332} {"train_loss": -11.910994529724121, "global_step": 223793, "epoch": 1332} {"train_loss": -11.814909934997559, "global_step": 223794, "epoch": 1332} {"train_loss": -11.661714553833008, "global_step": 223795, "epoch": 1332} {"train_loss": -11.657306671142578, "global_step": 223796, "epoch": 1332} {"train_loss": -11.746089935302734, "global_step": 223797, "epoch": 1332} {"train_loss": -12.033041000366211, "global_step": 223798, "epoch": 1332} {"train_loss": -11.553848266601562, "global_step": 223799, "epoch": 1332} {"train_loss": -11.7130126953125, "global_step": 223800, "epoch": 1332} {"train_loss": -12.06802749633789, "global_step": 223801, "epoch": 1332} {"train_loss": -11.897209167480469, "global_step": 223802, "epoch": 1332} {"train_loss": -11.92523193359375, "global_step": 223803, "epoch": 1332} {"train_loss": -11.915959358215332, "global_step": 223804, "epoch": 1332} {"train_loss": -11.826835632324219, "global_step": 223805, "epoch": 1332} {"train_loss": -12.08357048034668, "global_step": 223806, "epoch": 1332} {"train_loss": -11.902036666870117, "global_step": 223807, "epoch": 1332} {"train_loss": -11.697135925292969, "global_step": 223808, "epoch": 1332} {"train_loss": -12.164041519165039, "global_step": 223809, "epoch": 1332} {"train_loss": -11.50525188446045, "global_step": 223810, "epoch": 1332} {"train_loss": -11.833547592163086, "global_step": 223811, "epoch": 1332} {"train_loss": -11.840221405029297, "global_step": 223812, "epoch": 1332} {"train_loss": -11.818558692932129, "global_step": 223813, "epoch": 1332} {"train_loss": -11.80730152130127, "global_step": 223814, "epoch": 1332} {"train_loss": -11.914819717407227, "global_step": 223815, "epoch": 1332} {"train_loss": -11.705831527709961, "global_step": 223816, "epoch": 1332} {"train_loss": -11.81155776977539, "global_step": 223817, "epoch": 1332} {"train_loss": -11.878068923950195, "global_step": 223818, "epoch": 1332} {"train_loss": -12.042911529541016, "global_step": 223819, "epoch": 1332} {"train_loss": -11.910405158996582, "global_step": 223820, "epoch": 1332} {"train_loss": -12.008749008178711, "global_step": 223821, "epoch": 1332} {"train_loss": -12.030115127563477, "global_step": 223822, "epoch": 1332} {"train_loss": -11.859258651733398, "global_step": 223823, "epoch": 1332} {"train_loss": -11.570316314697266, "global_step": 223824, "epoch": 1332} {"train_loss": -11.937236785888672, "global_step": 223825, "epoch": 1332} {"train_loss": -11.916022300720215, "global_step": 223826, "epoch": 1332} {"train_loss": -11.564115524291992, "global_step": 223827, "epoch": 1332} {"train_loss": -11.629257202148438, "global_step": 223828, "epoch": 1332} {"train_loss": -12.00362491607666, "global_step": 223829, "epoch": 1332} {"train_loss": -11.576086044311523, "global_step": 223830, "epoch": 1332} {"train_loss": -11.434714317321777, "global_step": 223831, "epoch": 1332} {"train_loss": -11.661731719970703, "global_step": 223832, "epoch": 1332} {"train_loss": -11.272550582885742, "global_step": 223833, "epoch": 1332} {"train_loss": -10.501324653625488, "global_step": 223834, "epoch": 1332} {"train_loss": -11.164253234863281, "global_step": 223835, "epoch": 1332} {"train_loss": -11.274139404296875, "global_step": 223836, "epoch": 1332} {"train_loss": -11.568641662597656, "global_step": 223837, "epoch": 1332} {"train_loss": -10.989702224731445, "global_step": 223838, "epoch": 1332} {"train_loss": -11.141629219055176, "global_step": 223839, "epoch": 1332} {"train_loss": -11.507930755615234, "global_step": 223840, "epoch": 1332} {"train_loss": -11.52586841583252, "global_step": 223841, "epoch": 1332} {"train_loss": -11.443262100219727, "global_step": 223842, "epoch": 1332} {"train_loss": -11.522330284118652, "global_step": 223843, "epoch": 1332} {"train_loss": -11.71711254119873, "global_step": 223844, "epoch": 1332} {"train_loss": -11.860288619995117, "global_step": 223845, "epoch": 1332} {"train_loss": -11.59528923034668, "global_step": 223846, "epoch": 1332} {"train_loss": -11.723602294921875, "global_step": 223847, "epoch": 1332} {"train_loss": -11.337600708007812, "global_step": 223848, "epoch": 1332} {"train_loss": -11.161956787109375, "global_step": 223849, "epoch": 1332} {"train_loss": -11.578544616699219, "global_step": 223850, "epoch": 1332} {"train_loss": -11.070363998413086, "global_step": 223851, "epoch": 1332} {"train_loss": -11.161520004272461, "global_step": 223852, "epoch": 1332} {"train_loss": -11.552115440368652, "global_step": 223853, "epoch": 1332} {"train_loss": -10.705521583557129, "global_step": 223854, "epoch": 1332} {"train_loss": -10.53919792175293, "global_step": 223855, "epoch": 1332} {"train_loss": -11.37889289855957, "global_step": 223856, "epoch": 1332} {"train_loss": -11.469547271728516, "global_step": 223857, "epoch": 1332} {"train_loss": -10.267020225524902, "global_step": 223858, "epoch": 1332} {"train_loss": -11.878679275512695, "global_step": 223859, "epoch": 1332} {"train_loss": -10.953104972839355, "global_step": 223860, "epoch": 1332} {"train_loss": -11.311040878295898, "global_step": 223861, "epoch": 1332} {"train_loss": -11.664925575256348, "global_step": 223862, "epoch": 1332} {"train_loss": -11.573442459106445, "global_step": 223863, "epoch": 1332} {"train_loss": -11.397476196289062, "global_step": 223864, "epoch": 1332} {"train_loss": -11.731210708618164, "global_step": 223865, "epoch": 1332} {"train_loss": -11.365787506103516, "global_step": 223866, "epoch": 1332} {"train_loss": -10.694001197814941, "global_step": 223867, "epoch": 1332} {"train_loss": -10.961930274963379, "global_step": 223868, "epoch": 1332} {"train_loss": -10.68183708190918, "global_step": 223869, "epoch": 1332} {"train_loss": -10.770442962646484, "global_step": 223870, "epoch": 1332} {"train_loss": -11.281852722167969, "global_step": 223871, "epoch": 1332} {"train_loss": -10.169309616088867, "global_step": 223872, "epoch": 1332} {"train_loss": -11.630485534667969, "global_step": 223873, "epoch": 1332} {"train_loss": -11.326037406921387, "global_step": 223874, "epoch": 1332} {"train_loss": -11.162348747253418, "global_step": 223875, "epoch": 1332} {"train_loss": -10.913851737976074, "global_step": 223876, "epoch": 1332} {"train_loss": -11.499576568603516, "global_step": 223877, "epoch": 1332} {"train_loss": -11.359006881713867, "global_step": 223878, "epoch": 1332} {"train_loss": -11.289569854736328, "global_step": 223879, "epoch": 1332} {"train_loss": -10.51972484588623, "global_step": 223880, "epoch": 1332} {"train_loss": -10.777509689331055, "global_step": 223881, "epoch": 1332} {"train_loss": -11.058490753173828, "global_step": 223882, "epoch": 1332} {"train_loss": -10.973480224609375, "global_step": 223883, "epoch": 1332} {"train_loss": -11.139846801757812, "global_step": 223884, "epoch": 1332} {"train_loss": -11.035847663879395, "global_step": 223885, "epoch": 1332} {"train_loss": -11.13241958618164, "global_step": 223886, "epoch": 1332} {"train_loss": -11.541489601135254, "global_step": 223887, "epoch": 1332} {"train_loss": -11.086725234985352, "global_step": 223888, "epoch": 1332} {"train_loss": -11.308707237243652, "global_step": 223889, "epoch": 1332} {"train_loss": -10.840444564819336, "global_step": 223890, "epoch": 1332} {"train_loss": -11.334901809692383, "global_step": 223891, "epoch": 1332} {"train_loss": -11.306131362915039, "global_step": 223892, "epoch": 1332} {"train_loss": -11.423187255859375, "global_step": 223893, "epoch": 1332} {"train_loss": -11.579253196716309, "global_step": 223894, "epoch": 1332} {"train_loss": -11.453240394592285, "global_step": 223895, "epoch": 1332} {"train_loss": -11.31516170501709, "global_step": 223896, "epoch": 1332} {"train_loss": -11.111380577087402, "global_step": 223897, "epoch": 1332} {"train_loss": -11.425566673278809, "global_step": 223898, "epoch": 1332} {"train_loss": -11.183570861816406, "global_step": 223899, "epoch": 1332} {"train_loss": -11.24226188659668, "global_step": 223900, "epoch": 1332} {"train_loss": -11.832334518432617, "global_step": 223901, "epoch": 1332} {"train_loss": -11.039620399475098, "global_step": 223902, "epoch": 1332} {"train_loss": -11.25600814819336, "global_step": 223903, "epoch": 1332} {"train_loss": -10.94572639465332, "global_step": 223904, "epoch": 1332} {"train_loss": -11.375457763671875, "global_step": 223905, "epoch": 1332} {"train_loss": -11.538106918334961, "global_step": 223906, "epoch": 1332} {"train_loss": -11.00207805633545, "global_step": 223907, "epoch": 1332} {"train_loss": -11.681730270385742, "global_step": 223908, "epoch": 1332} {"train_loss": -10.486859321594238, "global_step": 223909, "epoch": 1332} {"train_loss": -11.544755935668945, "global_step": 223910, "epoch": 1332} {"train_loss": -10.748403549194336, "global_step": 223911, "epoch": 1332} {"train_loss": -10.947980880737305, "global_step": 223912, "epoch": 1332} {"train_loss": -11.268196105957031, "global_step": 223913, "epoch": 1332} {"train_loss": -11.306862831115723, "global_step": 223914, "epoch": 1332} {"train_loss": -11.057759284973145, "global_step": 223915, "epoch": 1332} {"train_loss": -10.884927749633789, "global_step": 223916, "epoch": 1332} {"train_loss": -11.273842811584473, "global_step": 223917, "epoch": 1332} {"train_loss": -10.609902381896973, "global_step": 223918, "epoch": 1332} {"train_loss": -11.475719451904297, "global_step": 223919, "epoch": 1332} {"train_loss": -10.621885299682617, "global_step": 223920, "epoch": 1332} {"train_loss": -11.559959411621094, "global_step": 223921, "epoch": 1332} {"train_loss": -11.257354736328125, "global_step": 223922, "epoch": 1332} {"train_loss": -11.121912002563477, "global_step": 223923, "epoch": 1332} {"train_loss": -11.420431137084961, "global_step": 223924, "epoch": 1332} {"train_loss": -11.197341918945312, "global_step": 223925, "epoch": 1332} {"train_loss": -11.455501556396484, "global_step": 223926, "epoch": 1332} {"train_loss": -11.285860061645508, "global_step": 223927, "epoch": 1332} {"train_loss": -11.33691692352295, "global_step": 223928, "epoch": 1332} {"train_loss": -11.492002487182617, "global_step": 223929, "epoch": 1332} {"train_loss": -11.445528984069824, "global_step": 223930, "epoch": 1332} {"train_loss": -11.604642868041992, "global_step": 223931, "epoch": 1332} {"train_loss": -11.656185150146484, "global_step": 223932, "epoch": 1332} {"train_loss": -11.577984809875488, "global_step": 223933, "epoch": 1332} {"train_loss": -11.712387084960938, "global_step": 223934, "epoch": 1332} {"train_loss": -11.326334953308105, "global_step": 223935, "epoch": 1332} {"train_loss": -11.638830184936523, "global_step": 223936, "epoch": 1332} {"train_loss": -11.36026382446289, "global_step": 223937, "epoch": 1332} {"train_loss": -11.807052612304688, "global_step": 223938, "epoch": 1332} {"train_loss": -11.491968154907227, "global_step": 223939, "epoch": 1332} {"train_loss": -11.503600120544434, "global_step": 223940, "epoch": 1332} {"train_loss": -11.706473350524902, "global_step": 223941, "epoch": 1332} {"train_loss": -11.293828964233398, "global_step": 223942, "epoch": 1332} {"train_loss": -11.429441383906774, "global_step": 223943, "epoch": 1332, "val_loss": 256651.765625} {"train_loss": -11.65303897857666, "global_step": 223944, "epoch": 1333} {"train_loss": -11.701775550842285, "global_step": 223945, "epoch": 1333} {"train_loss": -11.657861709594727, "global_step": 223946, "epoch": 1333} {"train_loss": -11.83675765991211, "global_step": 223947, "epoch": 1333} {"train_loss": -11.734567642211914, "global_step": 223948, "epoch": 1333} {"train_loss": -11.38606071472168, "global_step": 223949, "epoch": 1333} {"train_loss": -11.838238716125488, "global_step": 223950, "epoch": 1333} {"train_loss": -11.409340858459473, "global_step": 223951, "epoch": 1333} {"train_loss": -11.488628387451172, "global_step": 223952, "epoch": 1333} {"train_loss": -11.632808685302734, "global_step": 223953, "epoch": 1333} {"train_loss": -11.624082565307617, "global_step": 223954, "epoch": 1333} {"train_loss": -11.899087905883789, "global_step": 223955, "epoch": 1333} {"train_loss": -11.675106048583984, "global_step": 223956, "epoch": 1333} {"train_loss": -11.78806209564209, "global_step": 223957, "epoch": 1333} {"train_loss": -11.914854049682617, "global_step": 223958, "epoch": 1333} {"train_loss": -11.872446060180664, "global_step": 223959, "epoch": 1333} {"train_loss": -11.809377670288086, "global_step": 223960, "epoch": 1333} {"train_loss": -11.874358177185059, "global_step": 223961, "epoch": 1333} {"train_loss": -11.850601196289062, "global_step": 223962, "epoch": 1333} {"train_loss": -11.73453140258789, "global_step": 223963, "epoch": 1333} {"train_loss": -11.882087707519531, "global_step": 223964, "epoch": 1333} {"train_loss": -11.685819625854492, "global_step": 223965, "epoch": 1333} {"train_loss": -11.79720687866211, "global_step": 223966, "epoch": 1333} {"train_loss": -11.622978210449219, "global_step": 223967, "epoch": 1333} {"train_loss": -11.843643188476562, "global_step": 223968, "epoch": 1333} {"train_loss": -11.625545501708984, "global_step": 223969, "epoch": 1333} {"train_loss": -11.586372375488281, "global_step": 223970, "epoch": 1333} {"train_loss": -11.913106918334961, "global_step": 223971, "epoch": 1333} {"train_loss": -12.063255310058594, "global_step": 223972, "epoch": 1333} {"train_loss": -11.817928314208984, "global_step": 223973, "epoch": 1333} {"train_loss": -11.964344024658203, "global_step": 223974, "epoch": 1333} {"train_loss": -11.85863971710205, "global_step": 223975, "epoch": 1333} {"train_loss": -12.125679969787598, "global_step": 223976, "epoch": 1333} {"train_loss": -11.803606033325195, "global_step": 223977, "epoch": 1333} {"train_loss": -11.948424339294434, "global_step": 223978, "epoch": 1333} {"train_loss": -11.930937767028809, "global_step": 223979, "epoch": 1333} {"train_loss": -11.918207168579102, "global_step": 223980, "epoch": 1333} {"train_loss": -11.757530212402344, "global_step": 223981, "epoch": 1333} {"train_loss": -11.99361515045166, "global_step": 223982, "epoch": 1333} {"train_loss": -11.954095840454102, "global_step": 223983, "epoch": 1333} {"train_loss": -11.89573860168457, "global_step": 223984, "epoch": 1333} {"train_loss": -11.952169418334961, "global_step": 223985, "epoch": 1333} {"train_loss": -12.118785858154297, "global_step": 223986, "epoch": 1333} {"train_loss": -11.940533638000488, "global_step": 223987, "epoch": 1333} {"train_loss": -12.066915512084961, "global_step": 223988, "epoch": 1333} {"train_loss": -12.178339958190918, "global_step": 223989, "epoch": 1333} {"train_loss": -12.054205894470215, "global_step": 223990, "epoch": 1333} {"train_loss": -11.663668632507324, "global_step": 223991, "epoch": 1333} {"train_loss": -11.331095695495605, "global_step": 223992, "epoch": 1333} {"train_loss": -11.157119750976562, "global_step": 223993, "epoch": 1333} {"train_loss": -11.645275115966797, "global_step": 223994, "epoch": 1333} {"train_loss": -11.929414749145508, "global_step": 223995, "epoch": 1333} {"train_loss": -11.078361511230469, "global_step": 223996, "epoch": 1333} {"train_loss": -10.552599906921387, "global_step": 223997, "epoch": 1333} {"train_loss": -10.46512222290039, "global_step": 223998, "epoch": 1333} {"train_loss": -11.600638389587402, "global_step": 223999, "epoch": 1333} {"train_loss": -9.909055709838867, "global_step": 224000, "epoch": 1333} {"train_loss": -9.080089569091797, "global_step": 224001, "epoch": 1333} {"train_loss": -11.770605087280273, "global_step": 224002, "epoch": 1333} {"train_loss": -9.09207534790039, "global_step": 224003, "epoch": 1333} {"train_loss": -8.59027099609375, "global_step": 224004, "epoch": 1333} {"train_loss": -11.55339527130127, "global_step": 224005, "epoch": 1333} {"train_loss": -8.812252044677734, "global_step": 224006, "epoch": 1333} {"train_loss": -11.22747802734375, "global_step": 224007, "epoch": 1333} {"train_loss": -10.77818775177002, "global_step": 224008, "epoch": 1333} {"train_loss": -11.1292142868042, "global_step": 224009, "epoch": 1333} {"train_loss": -10.910690307617188, "global_step": 224010, "epoch": 1333} {"train_loss": -10.920585632324219, "global_step": 224011, "epoch": 1333} {"train_loss": -11.631696701049805, "global_step": 224012, "epoch": 1333} {"train_loss": -11.35831356048584, "global_step": 224013, "epoch": 1333} {"train_loss": -10.978376388549805, "global_step": 224014, "epoch": 1333} {"train_loss": -11.392938613891602, "global_step": 224015, "epoch": 1333} {"train_loss": -10.77902603149414, "global_step": 224016, "epoch": 1333} {"train_loss": -11.285829544067383, "global_step": 224017, "epoch": 1333} {"train_loss": -10.632442474365234, "global_step": 224018, "epoch": 1333} {"train_loss": -11.48592758178711, "global_step": 224019, "epoch": 1333} {"train_loss": -11.178709983825684, "global_step": 224020, "epoch": 1333} {"train_loss": -11.042884826660156, "global_step": 224021, "epoch": 1333} {"train_loss": -11.552624702453613, "global_step": 224022, "epoch": 1333} {"train_loss": -11.193126678466797, "global_step": 224023, "epoch": 1333} {"train_loss": -11.533550262451172, "global_step": 224024, "epoch": 1333} {"train_loss": -11.179023742675781, "global_step": 224025, "epoch": 1333} {"train_loss": -11.809911727905273, "global_step": 224026, "epoch": 1333} {"train_loss": -11.44873332977295, "global_step": 224027, "epoch": 1333} {"train_loss": -11.5234375, "global_step": 224028, "epoch": 1333} {"train_loss": -11.53443431854248, "global_step": 224029, "epoch": 1333} {"train_loss": -11.756242752075195, "global_step": 224030, "epoch": 1333} {"train_loss": -11.400934219360352, "global_step": 224031, "epoch": 1333} {"train_loss": -11.710750579833984, "global_step": 224032, "epoch": 1333} {"train_loss": -11.137372970581055, "global_step": 224033, "epoch": 1333} {"train_loss": -11.440131187438965, "global_step": 224034, "epoch": 1333} {"train_loss": -11.358247756958008, "global_step": 224035, "epoch": 1333} {"train_loss": -11.712387084960938, "global_step": 224036, "epoch": 1333} {"train_loss": -11.711236000061035, "global_step": 224037, "epoch": 1333} {"train_loss": -11.248393058776855, "global_step": 224038, "epoch": 1333} {"train_loss": -11.734193801879883, "global_step": 224039, "epoch": 1333} {"train_loss": -11.595717430114746, "global_step": 224040, "epoch": 1333} {"train_loss": -11.297033309936523, "global_step": 224041, "epoch": 1333} {"train_loss": -11.51832389831543, "global_step": 224042, "epoch": 1333} {"train_loss": -10.923868179321289, "global_step": 224043, "epoch": 1333} {"train_loss": -11.367118835449219, "global_step": 224044, "epoch": 1333} {"train_loss": -11.34873104095459, "global_step": 224045, "epoch": 1333} {"train_loss": -11.335740089416504, "global_step": 224046, "epoch": 1333} {"train_loss": -11.50854778289795, "global_step": 224047, "epoch": 1333} {"train_loss": -11.231500625610352, "global_step": 224048, "epoch": 1333} {"train_loss": -11.551162719726562, "global_step": 224049, "epoch": 1333} {"train_loss": -11.44897747039795, "global_step": 224050, "epoch": 1333} {"train_loss": -11.71964168548584, "global_step": 224051, "epoch": 1333} {"train_loss": -11.686559677124023, "global_step": 224052, "epoch": 1333} {"train_loss": -11.297714233398438, "global_step": 224053, "epoch": 1333} {"train_loss": -11.78377914428711, "global_step": 224054, "epoch": 1333} {"train_loss": -11.514752388000488, "global_step": 224055, "epoch": 1333} {"train_loss": -11.882133483886719, "global_step": 224056, "epoch": 1333} {"train_loss": -11.507881164550781, "global_step": 224057, "epoch": 1333} {"train_loss": -11.659313201904297, "global_step": 224058, "epoch": 1333} {"train_loss": -11.601404190063477, "global_step": 224059, "epoch": 1333} {"train_loss": -11.550826072692871, "global_step": 224060, "epoch": 1333} {"train_loss": -11.72203540802002, "global_step": 224061, "epoch": 1333} {"train_loss": -11.735313415527344, "global_step": 224062, "epoch": 1333} {"train_loss": -11.269536972045898, "global_step": 224063, "epoch": 1333} {"train_loss": -11.887137413024902, "global_step": 224064, "epoch": 1333} {"train_loss": -11.493650436401367, "global_step": 224065, "epoch": 1333} {"train_loss": -11.646408081054688, "global_step": 224066, "epoch": 1333} {"train_loss": -11.752110481262207, "global_step": 224067, "epoch": 1333} {"train_loss": -11.776556015014648, "global_step": 224068, "epoch": 1333} {"train_loss": -11.932857513427734, "global_step": 224069, "epoch": 1333} {"train_loss": -11.794509887695312, "global_step": 224070, "epoch": 1333} {"train_loss": -11.564796447753906, "global_step": 224071, "epoch": 1333} {"train_loss": -11.907763481140137, "global_step": 224072, "epoch": 1333} {"train_loss": -11.832719802856445, "global_step": 224073, "epoch": 1333} {"train_loss": -11.695199012756348, "global_step": 224074, "epoch": 1333} {"train_loss": -11.823275566101074, "global_step": 224075, "epoch": 1333} {"train_loss": -11.957544326782227, "global_step": 224076, "epoch": 1333} {"train_loss": -11.655080795288086, "global_step": 224077, "epoch": 1333} {"train_loss": -10.852838516235352, "global_step": 224078, "epoch": 1333} {"train_loss": -10.349874496459961, "global_step": 224079, "epoch": 1333} {"train_loss": -11.770275115966797, "global_step": 224080, "epoch": 1333} {"train_loss": -11.434189796447754, "global_step": 224081, "epoch": 1333} {"train_loss": -11.791936874389648, "global_step": 224082, "epoch": 1333} {"train_loss": -11.674298286437988, "global_step": 224083, "epoch": 1333} {"train_loss": -11.743093490600586, "global_step": 224084, "epoch": 1333} {"train_loss": -11.79699420928955, "global_step": 224085, "epoch": 1333} {"train_loss": -11.663592338562012, "global_step": 224086, "epoch": 1333} {"train_loss": -11.838017463684082, "global_step": 224087, "epoch": 1333} {"train_loss": -11.564953804016113, "global_step": 224088, "epoch": 1333} {"train_loss": -11.360814094543457, "global_step": 224089, "epoch": 1333} {"train_loss": -11.504995346069336, "global_step": 224090, "epoch": 1333} {"train_loss": -11.499451637268066, "global_step": 224091, "epoch": 1333} {"train_loss": -11.175695419311523, "global_step": 224092, "epoch": 1333} {"train_loss": -11.605365753173828, "global_step": 224093, "epoch": 1333} {"train_loss": -11.440027236938477, "global_step": 224094, "epoch": 1333} {"train_loss": -10.736885070800781, "global_step": 224095, "epoch": 1333} {"train_loss": -11.625314712524414, "global_step": 224096, "epoch": 1333} {"train_loss": -10.82595157623291, "global_step": 224097, "epoch": 1333} {"train_loss": -11.691003799438477, "global_step": 224098, "epoch": 1333} {"train_loss": -11.491401672363281, "global_step": 224099, "epoch": 1333} {"train_loss": -10.829123497009277, "global_step": 224100, "epoch": 1333} {"train_loss": -10.876114845275879, "global_step": 224101, "epoch": 1333} {"train_loss": -11.087355613708496, "global_step": 224102, "epoch": 1333} {"train_loss": -10.970247268676758, "global_step": 224103, "epoch": 1333} {"train_loss": -11.353198051452637, "global_step": 224104, "epoch": 1333} {"train_loss": -11.532905578613281, "global_step": 224105, "epoch": 1333} {"train_loss": -10.88106632232666, "global_step": 224106, "epoch": 1333} {"train_loss": -11.344350814819336, "global_step": 224107, "epoch": 1333} {"train_loss": -10.928558349609375, "global_step": 224108, "epoch": 1333} {"train_loss": -11.119789123535156, "global_step": 224109, "epoch": 1333} {"train_loss": -11.469132423400879, "global_step": 224110, "epoch": 1333} {"train_loss": -11.462092269034613, "global_step": 224111, "epoch": 1333, "val_loss": 258209.4375} {"train_loss": -11.221481323242188, "global_step": 224112, "epoch": 1334} {"train_loss": -11.686809539794922, "global_step": 224113, "epoch": 1334} {"train_loss": -11.36789608001709, "global_step": 224114, "epoch": 1334} {"train_loss": -11.363941192626953, "global_step": 224115, "epoch": 1334} {"train_loss": -11.09426498413086, "global_step": 224116, "epoch": 1334} {"train_loss": -11.032383918762207, "global_step": 224117, "epoch": 1334} {"train_loss": -11.13530158996582, "global_step": 224118, "epoch": 1334} {"train_loss": -10.69245719909668, "global_step": 224119, "epoch": 1334} {"train_loss": -11.473023414611816, "global_step": 224120, "epoch": 1334} {"train_loss": -10.849207878112793, "global_step": 224121, "epoch": 1334} {"train_loss": -11.368313789367676, "global_step": 224122, "epoch": 1334} {"train_loss": -11.388078689575195, "global_step": 224123, "epoch": 1334} {"train_loss": -11.5946044921875, "global_step": 224124, "epoch": 1334} {"train_loss": -11.657279014587402, "global_step": 224125, "epoch": 1334} {"train_loss": -11.13552474975586, "global_step": 224126, "epoch": 1334} {"train_loss": -11.818031311035156, "global_step": 224127, "epoch": 1334} {"train_loss": -11.620719909667969, "global_step": 224128, "epoch": 1334} {"train_loss": -11.653654098510742, "global_step": 224129, "epoch": 1334} {"train_loss": -11.580337524414062, "global_step": 224130, "epoch": 1334} {"train_loss": -11.411222457885742, "global_step": 224131, "epoch": 1334} {"train_loss": -11.545125007629395, "global_step": 224132, "epoch": 1334} {"train_loss": -11.407837867736816, "global_step": 224133, "epoch": 1334} {"train_loss": -11.505393028259277, "global_step": 224134, "epoch": 1334} {"train_loss": -11.703376770019531, "global_step": 224135, "epoch": 1334} {"train_loss": -11.502326011657715, "global_step": 224136, "epoch": 1334} {"train_loss": -11.478157043457031, "global_step": 224137, "epoch": 1334} {"train_loss": -11.63752555847168, "global_step": 224138, "epoch": 1334} {"train_loss": -11.206859588623047, "global_step": 224139, "epoch": 1334} {"train_loss": -11.638925552368164, "global_step": 224140, "epoch": 1334} {"train_loss": -11.65673828125, "global_step": 224141, "epoch": 1334} {"train_loss": -11.216143608093262, "global_step": 224142, "epoch": 1334} {"train_loss": -11.694643020629883, "global_step": 224143, "epoch": 1334} {"train_loss": -11.384623527526855, "global_step": 224144, "epoch": 1334} {"train_loss": -11.4622802734375, "global_step": 224145, "epoch": 1334} {"train_loss": -11.818859100341797, "global_step": 224146, "epoch": 1334} {"train_loss": -11.557236671447754, "global_step": 224147, "epoch": 1334} {"train_loss": -11.729765892028809, "global_step": 224148, "epoch": 1334} {"train_loss": -11.47686767578125, "global_step": 224149, "epoch": 1334} {"train_loss": -11.43857192993164, "global_step": 224150, "epoch": 1334} {"train_loss": -11.428668975830078, "global_step": 224151, "epoch": 1334} {"train_loss": -11.101177215576172, "global_step": 224152, "epoch": 1334} {"train_loss": -11.56365966796875, "global_step": 224153, "epoch": 1334} {"train_loss": -10.9214506149292, "global_step": 224154, "epoch": 1334} {"train_loss": -11.148734092712402, "global_step": 224155, "epoch": 1334} {"train_loss": -11.758047103881836, "global_step": 224156, "epoch": 1334} {"train_loss": -11.307167053222656, "global_step": 224157, "epoch": 1334} {"train_loss": -11.551563262939453, "global_step": 224158, "epoch": 1334} {"train_loss": -11.62305736541748, "global_step": 224159, "epoch": 1334} {"train_loss": -11.400093078613281, "global_step": 224160, "epoch": 1334} {"train_loss": -11.341547966003418, "global_step": 224161, "epoch": 1334} {"train_loss": -11.598224639892578, "global_step": 224162, "epoch": 1334} {"train_loss": -10.829879760742188, "global_step": 224163, "epoch": 1334} {"train_loss": -11.569912910461426, "global_step": 224164, "epoch": 1334} {"train_loss": -11.460007667541504, "global_step": 224165, "epoch": 1334} {"train_loss": -11.43891716003418, "global_step": 224166, "epoch": 1334} {"train_loss": -11.692798614501953, "global_step": 224167, "epoch": 1334} {"train_loss": -11.36567497253418, "global_step": 224168, "epoch": 1334} {"train_loss": -11.379850387573242, "global_step": 224169, "epoch": 1334} {"train_loss": -11.6443510055542, "global_step": 224170, "epoch": 1334} {"train_loss": -11.231319427490234, "global_step": 224171, "epoch": 1334} {"train_loss": -11.329288482666016, "global_step": 224172, "epoch": 1334} {"train_loss": -11.49420166015625, "global_step": 224173, "epoch": 1334} {"train_loss": -11.514249801635742, "global_step": 224174, "epoch": 1334} {"train_loss": -11.532331466674805, "global_step": 224175, "epoch": 1334} {"train_loss": -11.633277893066406, "global_step": 224176, "epoch": 1334} {"train_loss": -11.858366012573242, "global_step": 224177, "epoch": 1334} {"train_loss": -11.532896995544434, "global_step": 224178, "epoch": 1334} {"train_loss": -11.720674514770508, "global_step": 224179, "epoch": 1334} {"train_loss": -11.253033638000488, "global_step": 224180, "epoch": 1334} {"train_loss": -11.741050720214844, "global_step": 224181, "epoch": 1334} {"train_loss": -11.299663543701172, "global_step": 224182, "epoch": 1334} {"train_loss": -11.633005142211914, "global_step": 224183, "epoch": 1334} {"train_loss": -11.458427429199219, "global_step": 224184, "epoch": 1334} {"train_loss": -11.667621612548828, "global_step": 224185, "epoch": 1334} {"train_loss": -11.705511093139648, "global_step": 224186, "epoch": 1334} {"train_loss": -11.862188339233398, "global_step": 224187, "epoch": 1334} {"train_loss": -11.556560516357422, "global_step": 224188, "epoch": 1334} {"train_loss": -11.654844284057617, "global_step": 224189, "epoch": 1334} {"train_loss": -11.634122848510742, "global_step": 224190, "epoch": 1334} {"train_loss": -11.59439468383789, "global_step": 224191, "epoch": 1334} {"train_loss": -11.70879077911377, "global_step": 224192, "epoch": 1334} {"train_loss": -11.723966598510742, "global_step": 224193, "epoch": 1334} {"train_loss": -11.896305084228516, "global_step": 224194, "epoch": 1334} {"train_loss": -11.677042007446289, "global_step": 224195, "epoch": 1334} {"train_loss": -11.85763168334961, "global_step": 224196, "epoch": 1334} {"train_loss": -11.734844207763672, "global_step": 224197, "epoch": 1334} {"train_loss": -11.59848403930664, "global_step": 224198, "epoch": 1334} {"train_loss": -11.729278564453125, "global_step": 224199, "epoch": 1334} {"train_loss": -11.326786041259766, "global_step": 224200, "epoch": 1334} {"train_loss": -11.204587936401367, "global_step": 224201, "epoch": 1334} {"train_loss": -11.833149909973145, "global_step": 224202, "epoch": 1334} {"train_loss": -11.535955429077148, "global_step": 224203, "epoch": 1334} {"train_loss": -11.381603240966797, "global_step": 224204, "epoch": 1334} {"train_loss": -11.790677070617676, "global_step": 224205, "epoch": 1334} {"train_loss": -11.175775527954102, "global_step": 224206, "epoch": 1334} {"train_loss": -11.837019920349121, "global_step": 224207, "epoch": 1334} {"train_loss": -11.540903091430664, "global_step": 224208, "epoch": 1334} {"train_loss": -11.674481391906738, "global_step": 224209, "epoch": 1334} {"train_loss": -11.458250045776367, "global_step": 224210, "epoch": 1334} {"train_loss": -11.277900695800781, "global_step": 224211, "epoch": 1334} {"train_loss": -11.478862762451172, "global_step": 224212, "epoch": 1334} {"train_loss": -11.522406578063965, "global_step": 224213, "epoch": 1334} {"train_loss": -10.507063865661621, "global_step": 224214, "epoch": 1334} {"train_loss": -11.175453186035156, "global_step": 224215, "epoch": 1334} {"train_loss": -11.733442306518555, "global_step": 224216, "epoch": 1334} {"train_loss": -11.557273864746094, "global_step": 224217, "epoch": 1334} {"train_loss": -11.373333930969238, "global_step": 224218, "epoch": 1334} {"train_loss": -11.848897933959961, "global_step": 224219, "epoch": 1334} {"train_loss": -11.42481803894043, "global_step": 224220, "epoch": 1334} {"train_loss": -11.49919319152832, "global_step": 224221, "epoch": 1334} {"train_loss": -11.65336799621582, "global_step": 224222, "epoch": 1334} {"train_loss": -11.668816566467285, "global_step": 224223, "epoch": 1334} {"train_loss": -11.481346130371094, "global_step": 224224, "epoch": 1334} {"train_loss": -11.918904304504395, "global_step": 224225, "epoch": 1334} {"train_loss": -11.784040451049805, "global_step": 224226, "epoch": 1334} {"train_loss": -11.512189865112305, "global_step": 224227, "epoch": 1334} {"train_loss": -11.522425651550293, "global_step": 224228, "epoch": 1334} {"train_loss": -11.720661163330078, "global_step": 224229, "epoch": 1334} {"train_loss": -11.393138885498047, "global_step": 224230, "epoch": 1334} {"train_loss": -11.478723526000977, "global_step": 224231, "epoch": 1334} {"train_loss": -11.603621482849121, "global_step": 224232, "epoch": 1334} {"train_loss": -11.577797889709473, "global_step": 224233, "epoch": 1334} {"train_loss": -11.593276023864746, "global_step": 224234, "epoch": 1334} {"train_loss": -11.833797454833984, "global_step": 224235, "epoch": 1334} {"train_loss": -11.242953300476074, "global_step": 224236, "epoch": 1334} {"train_loss": -11.553050994873047, "global_step": 224237, "epoch": 1334} {"train_loss": -11.377035140991211, "global_step": 224238, "epoch": 1334} {"train_loss": -11.196680068969727, "global_step": 224239, "epoch": 1334} {"train_loss": -11.435346603393555, "global_step": 224240, "epoch": 1334} {"train_loss": -11.201905250549316, "global_step": 224241, "epoch": 1334} {"train_loss": -11.129180908203125, "global_step": 224242, "epoch": 1334} {"train_loss": -11.738992691040039, "global_step": 224243, "epoch": 1334} {"train_loss": -11.205636978149414, "global_step": 224244, "epoch": 1334} {"train_loss": -11.307793617248535, "global_step": 224245, "epoch": 1334} {"train_loss": -11.483125686645508, "global_step": 224246, "epoch": 1334} {"train_loss": -10.728271484375, "global_step": 224247, "epoch": 1334} {"train_loss": -11.634622573852539, "global_step": 224248, "epoch": 1334} {"train_loss": -10.11949348449707, "global_step": 224249, "epoch": 1334} {"train_loss": -11.089934349060059, "global_step": 224250, "epoch": 1334} {"train_loss": -11.705678939819336, "global_step": 224251, "epoch": 1334} {"train_loss": -10.844523429870605, "global_step": 224252, "epoch": 1334} {"train_loss": -11.697978973388672, "global_step": 224253, "epoch": 1334} {"train_loss": -11.094880104064941, "global_step": 224254, "epoch": 1334} {"train_loss": -11.662551879882812, "global_step": 224255, "epoch": 1334} {"train_loss": -11.335600852966309, "global_step": 224256, "epoch": 1334} {"train_loss": -11.529220581054688, "global_step": 224257, "epoch": 1334} {"train_loss": -11.814352035522461, "global_step": 224258, "epoch": 1334} {"train_loss": -11.609773635864258, "global_step": 224259, "epoch": 1334} {"train_loss": -11.78955078125, "global_step": 224260, "epoch": 1334} {"train_loss": -11.624593734741211, "global_step": 224261, "epoch": 1334} {"train_loss": -11.728330612182617, "global_step": 224262, "epoch": 1334} {"train_loss": -11.898061752319336, "global_step": 224263, "epoch": 1334} {"train_loss": -12.010223388671875, "global_step": 224264, "epoch": 1334} {"train_loss": -11.5576171875, "global_step": 224265, "epoch": 1334} {"train_loss": -11.914033889770508, "global_step": 224266, "epoch": 1334} {"train_loss": -11.931894302368164, "global_step": 224267, "epoch": 1334} {"train_loss": -11.537947654724121, "global_step": 224268, "epoch": 1334} {"train_loss": -11.84587287902832, "global_step": 224269, "epoch": 1334} {"train_loss": -11.651455879211426, "global_step": 224270, "epoch": 1334} {"train_loss": -11.847616195678711, "global_step": 224271, "epoch": 1334} {"train_loss": -11.750965118408203, "global_step": 224272, "epoch": 1334} {"train_loss": -11.883148193359375, "global_step": 224273, "epoch": 1334} {"train_loss": -12.00761604309082, "global_step": 224274, "epoch": 1334} {"train_loss": -12.019750595092773, "global_step": 224275, "epoch": 1334} {"train_loss": -12.037059783935547, "global_step": 224276, "epoch": 1334} {"train_loss": -11.814214706420898, "global_step": 224277, "epoch": 1334} {"train_loss": -11.932528495788574, "global_step": 224278, "epoch": 1334} {"train_loss": -11.515750288963318, "global_step": 224279, "epoch": 1334, "val_loss": 260044.328125} {"train_loss": -11.843771934509277, "global_step": 224280, "epoch": 1335} {"train_loss": -12.022955894470215, "global_step": 224281, "epoch": 1335} {"train_loss": -11.964385986328125, "global_step": 224282, "epoch": 1335} {"train_loss": -11.918173789978027, "global_step": 224283, "epoch": 1335} {"train_loss": -11.817598342895508, "global_step": 224284, "epoch": 1335} {"train_loss": -12.077885627746582, "global_step": 224285, "epoch": 1335} {"train_loss": -12.179882049560547, "global_step": 224286, "epoch": 1335} {"train_loss": -12.124608993530273, "global_step": 224287, "epoch": 1335} {"train_loss": -11.99785041809082, "global_step": 224288, "epoch": 1335} {"train_loss": -11.765058517456055, "global_step": 224289, "epoch": 1335} {"train_loss": -12.222028732299805, "global_step": 224290, "epoch": 1335} {"train_loss": -11.705440521240234, "global_step": 224291, "epoch": 1335} {"train_loss": -11.797979354858398, "global_step": 224292, "epoch": 1335} {"train_loss": -11.92082405090332, "global_step": 224293, "epoch": 1335} {"train_loss": -11.471774101257324, "global_step": 224294, "epoch": 1335} {"train_loss": -11.418841361999512, "global_step": 224295, "epoch": 1335} {"train_loss": -11.872349739074707, "global_step": 224296, "epoch": 1335} {"train_loss": -11.665811538696289, "global_step": 224297, "epoch": 1335} {"train_loss": -11.76553726196289, "global_step": 224298, "epoch": 1335} {"train_loss": -11.02517318725586, "global_step": 224299, "epoch": 1335} {"train_loss": -9.892520904541016, "global_step": 224300, "epoch": 1335} {"train_loss": -7.944123268127441, "global_step": 224301, "epoch": 1335} {"train_loss": -10.31718921661377, "global_step": 224302, "epoch": 1335} {"train_loss": -6.283694267272949, "global_step": 224303, "epoch": 1335} {"train_loss": -7.752941131591797, "global_step": 224304, "epoch": 1335} {"train_loss": -7.490570068359375, "global_step": 224305, "epoch": 1335} {"train_loss": -9.033382415771484, "global_step": 224306, "epoch": 1335} {"train_loss": -7.125831127166748, "global_step": 224307, "epoch": 1335} {"train_loss": -6.070713520050049, "global_step": 224308, "epoch": 1335} {"train_loss": -8.109443664550781, "global_step": 224309, "epoch": 1335} {"train_loss": -8.1896390914917, "global_step": 224310, "epoch": 1335} {"train_loss": -7.17933464050293, "global_step": 224311, "epoch": 1335} {"train_loss": -9.780075073242188, "global_step": 224312, "epoch": 1335} {"train_loss": -7.932981967926025, "global_step": 224313, "epoch": 1335} {"train_loss": -7.7806315422058105, "global_step": 224314, "epoch": 1335} {"train_loss": -9.576803207397461, "global_step": 224315, "epoch": 1335} {"train_loss": -9.178382873535156, "global_step": 224316, "epoch": 1335} {"train_loss": -9.928852081298828, "global_step": 224317, "epoch": 1335} {"train_loss": -9.249725341796875, "global_step": 224318, "epoch": 1335} {"train_loss": -10.167555809020996, "global_step": 224319, "epoch": 1335} {"train_loss": -9.796854019165039, "global_step": 224320, "epoch": 1335} {"train_loss": -9.393179893493652, "global_step": 224321, "epoch": 1335} {"train_loss": -10.388821601867676, "global_step": 224322, "epoch": 1335} {"train_loss": -9.44034481048584, "global_step": 224323, "epoch": 1335} {"train_loss": -10.740983009338379, "global_step": 224324, "epoch": 1335} {"train_loss": -10.041629791259766, "global_step": 224325, "epoch": 1335} {"train_loss": -10.749689102172852, "global_step": 224326, "epoch": 1335} {"train_loss": -10.756603240966797, "global_step": 224327, "epoch": 1335} {"train_loss": -10.025080680847168, "global_step": 224328, "epoch": 1335} {"train_loss": -10.655278205871582, "global_step": 224329, "epoch": 1335} {"train_loss": -10.525655746459961, "global_step": 224330, "epoch": 1335} {"train_loss": -11.035493850708008, "global_step": 224331, "epoch": 1335} {"train_loss": -10.919403076171875, "global_step": 224332, "epoch": 1335} {"train_loss": -10.383868217468262, "global_step": 224333, "epoch": 1335} {"train_loss": -11.077066421508789, "global_step": 224334, "epoch": 1335} {"train_loss": -10.941658020019531, "global_step": 224335, "epoch": 1335} {"train_loss": -10.893691062927246, "global_step": 224336, "epoch": 1335} {"train_loss": -11.023118019104004, "global_step": 224337, "epoch": 1335} {"train_loss": -10.938048362731934, "global_step": 224338, "epoch": 1335} {"train_loss": -11.108760833740234, "global_step": 224339, "epoch": 1335} {"train_loss": -11.147192001342773, "global_step": 224340, "epoch": 1335} {"train_loss": -10.899106979370117, "global_step": 224341, "epoch": 1335} {"train_loss": -10.958906173706055, "global_step": 224342, "epoch": 1335} {"train_loss": -11.023024559020996, "global_step": 224343, "epoch": 1335} {"train_loss": -11.337162017822266, "global_step": 224344, "epoch": 1335} {"train_loss": -11.266366958618164, "global_step": 224345, "epoch": 1335} {"train_loss": -11.194904327392578, "global_step": 224346, "epoch": 1335} {"train_loss": -11.1754732131958, "global_step": 224347, "epoch": 1335} {"train_loss": -11.412433624267578, "global_step": 224348, "epoch": 1335} {"train_loss": -11.242177963256836, "global_step": 224349, "epoch": 1335} {"train_loss": -11.435647964477539, "global_step": 224350, "epoch": 1335} {"train_loss": -11.317045211791992, "global_step": 224351, "epoch": 1335} {"train_loss": -11.397850036621094, "global_step": 224352, "epoch": 1335} {"train_loss": -11.343228340148926, "global_step": 224353, "epoch": 1335} {"train_loss": -11.198233604431152, "global_step": 224354, "epoch": 1335} {"train_loss": -11.452239036560059, "global_step": 224355, "epoch": 1335} {"train_loss": -11.451602935791016, "global_step": 224356, "epoch": 1335} {"train_loss": -11.531606674194336, "global_step": 224357, "epoch": 1335} {"train_loss": -11.428048133850098, "global_step": 224358, "epoch": 1335} {"train_loss": -11.494939804077148, "global_step": 224359, "epoch": 1335} {"train_loss": -11.541421890258789, "global_step": 224360, "epoch": 1335} {"train_loss": -11.623445510864258, "global_step": 224361, "epoch": 1335} {"train_loss": -11.557785034179688, "global_step": 224362, "epoch": 1335} {"train_loss": -11.683055877685547, "global_step": 224363, "epoch": 1335} {"train_loss": -11.636019706726074, "global_step": 224364, "epoch": 1335} {"train_loss": -11.770687103271484, "global_step": 224365, "epoch": 1335} {"train_loss": -11.517354965209961, "global_step": 224366, "epoch": 1335} {"train_loss": -11.66789436340332, "global_step": 224367, "epoch": 1335} {"train_loss": -11.687363624572754, "global_step": 224368, "epoch": 1335} {"train_loss": -11.53389835357666, "global_step": 224369, "epoch": 1335} {"train_loss": -11.843843460083008, "global_step": 224370, "epoch": 1335} {"train_loss": -11.801033020019531, "global_step": 224371, "epoch": 1335} {"train_loss": -11.561333656311035, "global_step": 224372, "epoch": 1335} {"train_loss": -11.930742263793945, "global_step": 224373, "epoch": 1335} {"train_loss": -11.652584075927734, "global_step": 224374, "epoch": 1335} {"train_loss": -11.820446968078613, "global_step": 224375, "epoch": 1335} {"train_loss": -11.543123245239258, "global_step": 224376, "epoch": 1335} {"train_loss": -11.928537368774414, "global_step": 224377, "epoch": 1335} {"train_loss": -11.896744728088379, "global_step": 224378, "epoch": 1335} {"train_loss": -11.689657211303711, "global_step": 224379, "epoch": 1335} {"train_loss": -11.849103927612305, "global_step": 224380, "epoch": 1335} {"train_loss": -11.806471824645996, "global_step": 224381, "epoch": 1335} {"train_loss": -11.841590881347656, "global_step": 224382, "epoch": 1335} {"train_loss": -11.943357467651367, "global_step": 224383, "epoch": 1335} {"train_loss": -11.935516357421875, "global_step": 224384, "epoch": 1335} {"train_loss": -11.815938949584961, "global_step": 224385, "epoch": 1335} {"train_loss": -12.118095397949219, "global_step": 224386, "epoch": 1335} {"train_loss": -11.96789264678955, "global_step": 224387, "epoch": 1335} {"train_loss": -12.054780960083008, "global_step": 224388, "epoch": 1335} {"train_loss": -11.813892364501953, "global_step": 224389, "epoch": 1335} {"train_loss": -11.838619232177734, "global_step": 224390, "epoch": 1335} {"train_loss": -11.847368240356445, "global_step": 224391, "epoch": 1335} {"train_loss": -11.909677505493164, "global_step": 224392, "epoch": 1335} {"train_loss": -11.89177417755127, "global_step": 224393, "epoch": 1335} {"train_loss": -11.866987228393555, "global_step": 224394, "epoch": 1335} {"train_loss": -11.860299110412598, "global_step": 224395, "epoch": 1335} {"train_loss": -11.777822494506836, "global_step": 224396, "epoch": 1335} {"train_loss": -12.067729949951172, "global_step": 224397, "epoch": 1335} {"train_loss": -11.634855270385742, "global_step": 224398, "epoch": 1335} {"train_loss": -12.09266471862793, "global_step": 224399, "epoch": 1335} {"train_loss": -11.907257080078125, "global_step": 224400, "epoch": 1335} {"train_loss": -12.179719924926758, "global_step": 224401, "epoch": 1335} {"train_loss": -11.864961624145508, "global_step": 224402, "epoch": 1335} {"train_loss": -11.722614288330078, "global_step": 224403, "epoch": 1335} {"train_loss": -11.750880241394043, "global_step": 224404, "epoch": 1335} {"train_loss": -11.791657447814941, "global_step": 224405, "epoch": 1335} {"train_loss": -12.07935905456543, "global_step": 224406, "epoch": 1335} {"train_loss": -11.982635498046875, "global_step": 224407, "epoch": 1335} {"train_loss": -11.55578899383545, "global_step": 224408, "epoch": 1335} {"train_loss": -11.36529541015625, "global_step": 224409, "epoch": 1335} {"train_loss": -11.857210159301758, "global_step": 224410, "epoch": 1335} {"train_loss": -11.78699016571045, "global_step": 224411, "epoch": 1335} {"train_loss": -11.53911304473877, "global_step": 224412, "epoch": 1335} {"train_loss": -11.395484924316406, "global_step": 224413, "epoch": 1335} {"train_loss": -11.34592056274414, "global_step": 224414, "epoch": 1335} {"train_loss": -11.668720245361328, "global_step": 224415, "epoch": 1335} {"train_loss": -12.025825500488281, "global_step": 224416, "epoch": 1335} {"train_loss": -11.985763549804688, "global_step": 224417, "epoch": 1335} {"train_loss": -11.692205429077148, "global_step": 224418, "epoch": 1335} {"train_loss": -11.443365097045898, "global_step": 224419, "epoch": 1335} {"train_loss": -10.479376792907715, "global_step": 224420, "epoch": 1335} {"train_loss": -10.495253562927246, "global_step": 224421, "epoch": 1335} {"train_loss": -11.736352920532227, "global_step": 224422, "epoch": 1335} {"train_loss": -11.880539894104004, "global_step": 224423, "epoch": 1335} {"train_loss": -10.972856521606445, "global_step": 224424, "epoch": 1335} {"train_loss": -11.304681777954102, "global_step": 224425, "epoch": 1335} {"train_loss": -11.85931396484375, "global_step": 224426, "epoch": 1335} {"train_loss": -11.43922233581543, "global_step": 224427, "epoch": 1335} {"train_loss": -11.57992172241211, "global_step": 224428, "epoch": 1335} {"train_loss": -11.588257789611816, "global_step": 224429, "epoch": 1335} {"train_loss": -11.780352592468262, "global_step": 224430, "epoch": 1335} {"train_loss": -11.605318069458008, "global_step": 224431, "epoch": 1335} {"train_loss": -11.516408920288086, "global_step": 224432, "epoch": 1335} {"train_loss": -11.963411331176758, "global_step": 224433, "epoch": 1335} {"train_loss": -11.600123405456543, "global_step": 224434, "epoch": 1335} {"train_loss": -11.802988052368164, "global_step": 224435, "epoch": 1335} {"train_loss": -11.909156799316406, "global_step": 224436, "epoch": 1335} {"train_loss": -11.724447250366211, "global_step": 224437, "epoch": 1335} {"train_loss": -11.297000885009766, "global_step": 224438, "epoch": 1335} {"train_loss": -11.841485023498535, "global_step": 224439, "epoch": 1335} {"train_loss": -11.416744232177734, "global_step": 224440, "epoch": 1335} {"train_loss": -10.13209342956543, "global_step": 224441, "epoch": 1335} {"train_loss": -10.348057746887207, "global_step": 224442, "epoch": 1335} {"train_loss": -11.178937911987305, "global_step": 224443, "epoch": 1335} {"train_loss": -10.864006996154785, "global_step": 224444, "epoch": 1335} {"train_loss": -10.027591705322266, "global_step": 224445, "epoch": 1335} {"train_loss": -10.820657730102539, "global_step": 224446, "epoch": 1335} {"train_loss": -11.096922272727603, "global_step": 224447, "epoch": 1335, "val_loss": 252021.5, "train_action_mse_error": 1.971353530883789} {"train_loss": -9.488245010375977, "global_step": 224448, "epoch": 1336} {"train_loss": -10.451506614685059, "global_step": 224449, "epoch": 1336} {"train_loss": -9.082708358764648, "global_step": 224450, "epoch": 1336} {"train_loss": -8.575088500976562, "global_step": 224451, "epoch": 1336} {"train_loss": -7.5699920654296875, "global_step": 224452, "epoch": 1336} {"train_loss": -8.703800201416016, "global_step": 224453, "epoch": 1336} {"train_loss": -9.395930290222168, "global_step": 224454, "epoch": 1336} {"train_loss": -9.790691375732422, "global_step": 224455, "epoch": 1336} {"train_loss": -9.244120597839355, "global_step": 224456, "epoch": 1336} {"train_loss": -9.111391067504883, "global_step": 224457, "epoch": 1336} {"train_loss": -9.73941707611084, "global_step": 224458, "epoch": 1336} {"train_loss": -9.7731294631958, "global_step": 224459, "epoch": 1336} {"train_loss": -9.661969184875488, "global_step": 224460, "epoch": 1336} {"train_loss": -10.089797973632812, "global_step": 224461, "epoch": 1336} {"train_loss": -10.040892601013184, "global_step": 224462, "epoch": 1336} {"train_loss": -10.310004234313965, "global_step": 224463, "epoch": 1336} {"train_loss": -10.329331398010254, "global_step": 224464, "epoch": 1336} {"train_loss": -9.918996810913086, "global_step": 224465, "epoch": 1336} {"train_loss": -10.475340843200684, "global_step": 224466, "epoch": 1336} {"train_loss": -11.109256744384766, "global_step": 224467, "epoch": 1336} {"train_loss": -10.427253723144531, "global_step": 224468, "epoch": 1336} {"train_loss": -10.786639213562012, "global_step": 224469, "epoch": 1336} {"train_loss": -10.841249465942383, "global_step": 224470, "epoch": 1336} {"train_loss": -10.555673599243164, "global_step": 224471, "epoch": 1336} {"train_loss": -10.998390197753906, "global_step": 224472, "epoch": 1336} {"train_loss": -11.379197120666504, "global_step": 224473, "epoch": 1336} {"train_loss": -10.956056594848633, "global_step": 224474, "epoch": 1336} {"train_loss": -10.98550796508789, "global_step": 224475, "epoch": 1336} {"train_loss": -11.265275955200195, "global_step": 224476, "epoch": 1336} {"train_loss": -11.161690711975098, "global_step": 224477, "epoch": 1336} {"train_loss": -10.934246063232422, "global_step": 224478, "epoch": 1336} {"train_loss": -11.17443561553955, "global_step": 224479, "epoch": 1336} {"train_loss": -11.217985153198242, "global_step": 224480, "epoch": 1336} {"train_loss": -11.125940322875977, "global_step": 224481, "epoch": 1336} {"train_loss": -11.183931350708008, "global_step": 224482, "epoch": 1336} {"train_loss": -10.962076187133789, "global_step": 224483, "epoch": 1336} {"train_loss": -11.133670806884766, "global_step": 224484, "epoch": 1336} {"train_loss": -11.14512825012207, "global_step": 224485, "epoch": 1336} {"train_loss": -11.375452995300293, "global_step": 224486, "epoch": 1336} {"train_loss": -11.004687309265137, "global_step": 224487, "epoch": 1336} {"train_loss": -11.130489349365234, "global_step": 224488, "epoch": 1336} {"train_loss": -11.107712745666504, "global_step": 224489, "epoch": 1336} {"train_loss": -11.191990852355957, "global_step": 224490, "epoch": 1336} {"train_loss": -11.344425201416016, "global_step": 224491, "epoch": 1336} {"train_loss": -11.117433547973633, "global_step": 224492, "epoch": 1336} {"train_loss": -11.299883842468262, "global_step": 224493, "epoch": 1336} {"train_loss": -11.248834609985352, "global_step": 224494, "epoch": 1336} {"train_loss": -11.46949577331543, "global_step": 224495, "epoch": 1336} {"train_loss": -11.346076011657715, "global_step": 224496, "epoch": 1336} {"train_loss": -11.447155952453613, "global_step": 224497, "epoch": 1336} {"train_loss": -11.484308242797852, "global_step": 224498, "epoch": 1336} {"train_loss": -11.390398025512695, "global_step": 224499, "epoch": 1336} {"train_loss": -11.390829086303711, "global_step": 224500, "epoch": 1336} {"train_loss": -11.592327117919922, "global_step": 224501, "epoch": 1336} {"train_loss": -11.478751182556152, "global_step": 224502, "epoch": 1336} {"train_loss": -11.644244194030762, "global_step": 224503, "epoch": 1336} {"train_loss": -11.492351531982422, "global_step": 224504, "epoch": 1336} {"train_loss": -11.784829139709473, "global_step": 224505, "epoch": 1336} {"train_loss": -11.549421310424805, "global_step": 224506, "epoch": 1336} {"train_loss": -11.628861427307129, "global_step": 224507, "epoch": 1336} {"train_loss": -11.8944091796875, "global_step": 224508, "epoch": 1336} {"train_loss": -11.770917892456055, "global_step": 224509, "epoch": 1336} {"train_loss": -11.79800796508789, "global_step": 224510, "epoch": 1336} {"train_loss": -11.654006958007812, "global_step": 224511, "epoch": 1336} {"train_loss": -11.700223922729492, "global_step": 224512, "epoch": 1336} {"train_loss": -11.707763671875, "global_step": 224513, "epoch": 1336} {"train_loss": -11.778928756713867, "global_step": 224514, "epoch": 1336} {"train_loss": -11.72960090637207, "global_step": 224515, "epoch": 1336} {"train_loss": -11.944840431213379, "global_step": 224516, "epoch": 1336} {"train_loss": -11.80400276184082, "global_step": 224517, "epoch": 1336} {"train_loss": -11.983346939086914, "global_step": 224518, "epoch": 1336} {"train_loss": -11.812788963317871, "global_step": 224519, "epoch": 1336} {"train_loss": -11.821372985839844, "global_step": 224520, "epoch": 1336} {"train_loss": -11.881380081176758, "global_step": 224521, "epoch": 1336} {"train_loss": -11.852737426757812, "global_step": 224522, "epoch": 1336} {"train_loss": -11.85418701171875, "global_step": 224523, "epoch": 1336} {"train_loss": -11.913313865661621, "global_step": 224524, "epoch": 1336} {"train_loss": -11.91545295715332, "global_step": 224525, "epoch": 1336} {"train_loss": -11.858988761901855, "global_step": 224526, "epoch": 1336} {"train_loss": -11.989173889160156, "global_step": 224527, "epoch": 1336} {"train_loss": -12.050384521484375, "global_step": 224528, "epoch": 1336} {"train_loss": -12.072300910949707, "global_step": 224529, "epoch": 1336} {"train_loss": -12.0402193069458, "global_step": 224530, "epoch": 1336} {"train_loss": -11.741044998168945, "global_step": 224531, "epoch": 1336} {"train_loss": -12.004647254943848, "global_step": 224532, "epoch": 1336} {"train_loss": -11.928739547729492, "global_step": 224533, "epoch": 1336} {"train_loss": -11.90491771697998, "global_step": 224534, "epoch": 1336} {"train_loss": -11.705704689025879, "global_step": 224535, "epoch": 1336} {"train_loss": -11.820005416870117, "global_step": 224536, "epoch": 1336} {"train_loss": -12.047950744628906, "global_step": 224537, "epoch": 1336} {"train_loss": -11.800544738769531, "global_step": 224538, "epoch": 1336} {"train_loss": -11.557130813598633, "global_step": 224539, "epoch": 1336} {"train_loss": -11.899765014648438, "global_step": 224540, "epoch": 1336} {"train_loss": -12.05084228515625, "global_step": 224541, "epoch": 1336} {"train_loss": -12.038467407226562, "global_step": 224542, "epoch": 1336} {"train_loss": -11.919892311096191, "global_step": 224543, "epoch": 1336} {"train_loss": -11.902581214904785, "global_step": 224544, "epoch": 1336} {"train_loss": -11.704065322875977, "global_step": 224545, "epoch": 1336} {"train_loss": -12.073694229125977, "global_step": 224546, "epoch": 1336} {"train_loss": -11.825157165527344, "global_step": 224547, "epoch": 1336} {"train_loss": -11.956416130065918, "global_step": 224548, "epoch": 1336} {"train_loss": -11.946928977966309, "global_step": 224549, "epoch": 1336} {"train_loss": -11.932928085327148, "global_step": 224550, "epoch": 1336} {"train_loss": -11.631721496582031, "global_step": 224551, "epoch": 1336} {"train_loss": -11.827291488647461, "global_step": 224552, "epoch": 1336} {"train_loss": -10.227193832397461, "global_step": 224553, "epoch": 1336} {"train_loss": -9.253656387329102, "global_step": 224554, "epoch": 1336} {"train_loss": -9.663497924804688, "global_step": 224555, "epoch": 1336} {"train_loss": -7.766528129577637, "global_step": 224556, "epoch": 1336} {"train_loss": -9.469594955444336, "global_step": 224557, "epoch": 1336} {"train_loss": -6.957131385803223, "global_step": 224558, "epoch": 1336} {"train_loss": -8.422761917114258, "global_step": 224559, "epoch": 1336} {"train_loss": -8.563485145568848, "global_step": 224560, "epoch": 1336} {"train_loss": -10.632020950317383, "global_step": 224561, "epoch": 1336} {"train_loss": -9.8876953125, "global_step": 224562, "epoch": 1336} {"train_loss": -8.651679992675781, "global_step": 224563, "epoch": 1336} {"train_loss": -8.330937385559082, "global_step": 224564, "epoch": 1336} {"train_loss": -7.514682769775391, "global_step": 224565, "epoch": 1336} {"train_loss": -9.857431411743164, "global_step": 224566, "epoch": 1336} {"train_loss": -9.310195922851562, "global_step": 224567, "epoch": 1336} {"train_loss": -9.832113265991211, "global_step": 224568, "epoch": 1336} {"train_loss": -10.311073303222656, "global_step": 224569, "epoch": 1336} {"train_loss": -9.682975769042969, "global_step": 224570, "epoch": 1336} {"train_loss": -9.507943153381348, "global_step": 224571, "epoch": 1336} {"train_loss": -10.28071403503418, "global_step": 224572, "epoch": 1336} {"train_loss": -9.35983657836914, "global_step": 224573, "epoch": 1336} {"train_loss": -9.673227310180664, "global_step": 224574, "epoch": 1336} {"train_loss": -10.665777206420898, "global_step": 224575, "epoch": 1336} {"train_loss": -9.607291221618652, "global_step": 224576, "epoch": 1336} {"train_loss": -9.765884399414062, "global_step": 224577, "epoch": 1336} {"train_loss": -10.651626586914062, "global_step": 224578, "epoch": 1336} {"train_loss": -10.541091918945312, "global_step": 224579, "epoch": 1336} {"train_loss": -10.151552200317383, "global_step": 224580, "epoch": 1336} {"train_loss": -10.85932445526123, "global_step": 224581, "epoch": 1336} {"train_loss": -10.308645248413086, "global_step": 224582, "epoch": 1336} {"train_loss": -10.292688369750977, "global_step": 224583, "epoch": 1336} {"train_loss": -10.459403991699219, "global_step": 224584, "epoch": 1336} {"train_loss": -11.330471992492676, "global_step": 224585, "epoch": 1336} {"train_loss": -10.758502960205078, "global_step": 224586, "epoch": 1336} {"train_loss": -11.243194580078125, "global_step": 224587, "epoch": 1336} {"train_loss": -11.215316772460938, "global_step": 224588, "epoch": 1336} {"train_loss": -11.19582462310791, "global_step": 224589, "epoch": 1336} {"train_loss": -11.35089111328125, "global_step": 224590, "epoch": 1336} {"train_loss": -11.170682907104492, "global_step": 224591, "epoch": 1336} {"train_loss": -11.309514999389648, "global_step": 224592, "epoch": 1336} {"train_loss": -11.50543212890625, "global_step": 224593, "epoch": 1336} {"train_loss": -11.30545425415039, "global_step": 224594, "epoch": 1336} {"train_loss": -11.39296817779541, "global_step": 224595, "epoch": 1336} {"train_loss": -11.237943649291992, "global_step": 224596, "epoch": 1336} {"train_loss": -11.671073913574219, "global_step": 224597, "epoch": 1336} {"train_loss": -11.366348266601562, "global_step": 224598, "epoch": 1336} {"train_loss": -11.565842628479004, "global_step": 224599, "epoch": 1336} {"train_loss": -11.29723834991455, "global_step": 224600, "epoch": 1336} {"train_loss": -11.543100357055664, "global_step": 224601, "epoch": 1336} {"train_loss": -11.315765380859375, "global_step": 224602, "epoch": 1336} {"train_loss": -11.509450912475586, "global_step": 224603, "epoch": 1336} {"train_loss": -11.417694091796875, "global_step": 224604, "epoch": 1336} {"train_loss": -11.616077423095703, "global_step": 224605, "epoch": 1336} {"train_loss": -11.474308967590332, "global_step": 224606, "epoch": 1336} {"train_loss": -11.718914031982422, "global_step": 224607, "epoch": 1336} {"train_loss": -11.603322982788086, "global_step": 224608, "epoch": 1336} {"train_loss": -11.725139617919922, "global_step": 224609, "epoch": 1336} {"train_loss": -11.712445259094238, "global_step": 224610, "epoch": 1336} {"train_loss": -11.433034896850586, "global_step": 224611, "epoch": 1336} {"train_loss": -11.56168270111084, "global_step": 224612, "epoch": 1336} {"train_loss": -11.703512191772461, "global_step": 224613, "epoch": 1336} {"train_loss": -11.698709487915039, "global_step": 224614, "epoch": 1336} {"train_loss": -10.932945075489226, "global_step": 224615, "epoch": 1336, "val_loss": 252004.078125} {"train_loss": -11.79745101928711, "global_step": 224616, "epoch": 1337} {"train_loss": -11.632137298583984, "global_step": 224617, "epoch": 1337} {"train_loss": -11.719388961791992, "global_step": 224618, "epoch": 1337} {"train_loss": -11.752191543579102, "global_step": 224619, "epoch": 1337} {"train_loss": -11.736557960510254, "global_step": 224620, "epoch": 1337} {"train_loss": -11.60037612915039, "global_step": 224621, "epoch": 1337} {"train_loss": -11.68191909790039, "global_step": 224622, "epoch": 1337} {"train_loss": -11.775789260864258, "global_step": 224623, "epoch": 1337} {"train_loss": -11.762786865234375, "global_step": 224624, "epoch": 1337} {"train_loss": -11.705339431762695, "global_step": 224625, "epoch": 1337} {"train_loss": -11.518486976623535, "global_step": 224626, "epoch": 1337} {"train_loss": -11.809043884277344, "global_step": 224627, "epoch": 1337} {"train_loss": -11.479992866516113, "global_step": 224628, "epoch": 1337} {"train_loss": -11.882760047912598, "global_step": 224629, "epoch": 1337} {"train_loss": -11.672331809997559, "global_step": 224630, "epoch": 1337} {"train_loss": -11.69015884399414, "global_step": 224631, "epoch": 1337} {"train_loss": -11.754756927490234, "global_step": 224632, "epoch": 1337} {"train_loss": -11.525983810424805, "global_step": 224633, "epoch": 1337} {"train_loss": -11.679343223571777, "global_step": 224634, "epoch": 1337} {"train_loss": -11.701555252075195, "global_step": 224635, "epoch": 1337} {"train_loss": -11.58869457244873, "global_step": 224636, "epoch": 1337} {"train_loss": -11.810495376586914, "global_step": 224637, "epoch": 1337} {"train_loss": -11.493261337280273, "global_step": 224638, "epoch": 1337} {"train_loss": -11.641916275024414, "global_step": 224639, "epoch": 1337} {"train_loss": -11.73481559753418, "global_step": 224640, "epoch": 1337} {"train_loss": -10.688643455505371, "global_step": 224641, "epoch": 1337} {"train_loss": -11.289495468139648, "global_step": 224642, "epoch": 1337} {"train_loss": -11.748090744018555, "global_step": 224643, "epoch": 1337} {"train_loss": -11.218692779541016, "global_step": 224644, "epoch": 1337} {"train_loss": -11.759140014648438, "global_step": 224645, "epoch": 1337} {"train_loss": -11.697277069091797, "global_step": 224646, "epoch": 1337} {"train_loss": -11.709403991699219, "global_step": 224647, "epoch": 1337} {"train_loss": -11.678491592407227, "global_step": 224648, "epoch": 1337} {"train_loss": -11.764703750610352, "global_step": 224649, "epoch": 1337} {"train_loss": -11.665060997009277, "global_step": 224650, "epoch": 1337} {"train_loss": -11.672501564025879, "global_step": 224651, "epoch": 1337} {"train_loss": -11.890281677246094, "global_step": 224652, "epoch": 1337} {"train_loss": -11.802469253540039, "global_step": 224653, "epoch": 1337} {"train_loss": -11.393051147460938, "global_step": 224654, "epoch": 1337} {"train_loss": -11.765409469604492, "global_step": 224655, "epoch": 1337} {"train_loss": -12.042923927307129, "global_step": 224656, "epoch": 1337} {"train_loss": -11.846147537231445, "global_step": 224657, "epoch": 1337} {"train_loss": -11.633005142211914, "global_step": 224658, "epoch": 1337} {"train_loss": -11.861051559448242, "global_step": 224659, "epoch": 1337} {"train_loss": -11.560726165771484, "global_step": 224660, "epoch": 1337} {"train_loss": -11.223185539245605, "global_step": 224661, "epoch": 1337} {"train_loss": -11.831159591674805, "global_step": 224662, "epoch": 1337} {"train_loss": -11.302732467651367, "global_step": 224663, "epoch": 1337} {"train_loss": -11.850953102111816, "global_step": 224664, "epoch": 1337} {"train_loss": -11.545815467834473, "global_step": 224665, "epoch": 1337} {"train_loss": -11.014652252197266, "global_step": 224666, "epoch": 1337} {"train_loss": -11.863638877868652, "global_step": 224667, "epoch": 1337} {"train_loss": -10.043343544006348, "global_step": 224668, "epoch": 1337} {"train_loss": -8.935977935791016, "global_step": 224669, "epoch": 1337} {"train_loss": -9.938850402832031, "global_step": 224670, "epoch": 1337} {"train_loss": -9.458332061767578, "global_step": 224671, "epoch": 1337} {"train_loss": -9.258358001708984, "global_step": 224672, "epoch": 1337} {"train_loss": -9.71743106842041, "global_step": 224673, "epoch": 1337} {"train_loss": -9.226814270019531, "global_step": 224674, "epoch": 1337} {"train_loss": -7.746030807495117, "global_step": 224675, "epoch": 1337} {"train_loss": -8.030637741088867, "global_step": 224676, "epoch": 1337} {"train_loss": -9.2703218460083, "global_step": 224677, "epoch": 1337} {"train_loss": -9.718229293823242, "global_step": 224678, "epoch": 1337} {"train_loss": -8.193506240844727, "global_step": 224679, "epoch": 1337} {"train_loss": -8.72297191619873, "global_step": 224680, "epoch": 1337} {"train_loss": -10.053918838500977, "global_step": 224681, "epoch": 1337} {"train_loss": -9.999053955078125, "global_step": 224682, "epoch": 1337} {"train_loss": -9.760490417480469, "global_step": 224683, "epoch": 1337} {"train_loss": -10.333353042602539, "global_step": 224684, "epoch": 1337} {"train_loss": -10.662787437438965, "global_step": 224685, "epoch": 1337} {"train_loss": -9.936568260192871, "global_step": 224686, "epoch": 1337} {"train_loss": -10.321003913879395, "global_step": 224687, "epoch": 1337} {"train_loss": -10.493974685668945, "global_step": 224688, "epoch": 1337} {"train_loss": -10.1839017868042, "global_step": 224689, "epoch": 1337} {"train_loss": -10.97964096069336, "global_step": 224690, "epoch": 1337} {"train_loss": -10.829816818237305, "global_step": 224691, "epoch": 1337} {"train_loss": -10.429669380187988, "global_step": 224692, "epoch": 1337} {"train_loss": -10.74577808380127, "global_step": 224693, "epoch": 1337} {"train_loss": -10.700580596923828, "global_step": 224694, "epoch": 1337} {"train_loss": -10.262388229370117, "global_step": 224695, "epoch": 1337} {"train_loss": -11.150070190429688, "global_step": 224696, "epoch": 1337} {"train_loss": -10.785138130187988, "global_step": 224697, "epoch": 1337} {"train_loss": -10.383359909057617, "global_step": 224698, "epoch": 1337} {"train_loss": -10.336002349853516, "global_step": 224699, "epoch": 1337} {"train_loss": -10.409555435180664, "global_step": 224700, "epoch": 1337} {"train_loss": -10.799960136413574, "global_step": 224701, "epoch": 1337} {"train_loss": -10.853034973144531, "global_step": 224702, "epoch": 1337} {"train_loss": -10.601478576660156, "global_step": 224703, "epoch": 1337} {"train_loss": -10.839550971984863, "global_step": 224704, "epoch": 1337} {"train_loss": -11.15777587890625, "global_step": 224705, "epoch": 1337} {"train_loss": -10.580497741699219, "global_step": 224706, "epoch": 1337} {"train_loss": -11.081814765930176, "global_step": 224707, "epoch": 1337} {"train_loss": -11.255335807800293, "global_step": 224708, "epoch": 1337} {"train_loss": -10.658994674682617, "global_step": 224709, "epoch": 1337} {"train_loss": -11.306623458862305, "global_step": 224710, "epoch": 1337} {"train_loss": -10.848264694213867, "global_step": 224711, "epoch": 1337} {"train_loss": -10.821189880371094, "global_step": 224712, "epoch": 1337} {"train_loss": -11.175655364990234, "global_step": 224713, "epoch": 1337} {"train_loss": -11.07952880859375, "global_step": 224714, "epoch": 1337} {"train_loss": -10.764240264892578, "global_step": 224715, "epoch": 1337} {"train_loss": -11.209962844848633, "global_step": 224716, "epoch": 1337} {"train_loss": -11.504773139953613, "global_step": 224717, "epoch": 1337} {"train_loss": -11.119871139526367, "global_step": 224718, "epoch": 1337} {"train_loss": -11.315603256225586, "global_step": 224719, "epoch": 1337} {"train_loss": -11.280332565307617, "global_step": 224720, "epoch": 1337} {"train_loss": -11.086591720581055, "global_step": 224721, "epoch": 1337} {"train_loss": -11.323522567749023, "global_step": 224722, "epoch": 1337} {"train_loss": -11.253129959106445, "global_step": 224723, "epoch": 1337} {"train_loss": -11.481163024902344, "global_step": 224724, "epoch": 1337} {"train_loss": -11.285557746887207, "global_step": 224725, "epoch": 1337} {"train_loss": -11.273637771606445, "global_step": 224726, "epoch": 1337} {"train_loss": -11.197257041931152, "global_step": 224727, "epoch": 1337} {"train_loss": -11.294620513916016, "global_step": 224728, "epoch": 1337} {"train_loss": -11.536730766296387, "global_step": 224729, "epoch": 1337} {"train_loss": -11.537363052368164, "global_step": 224730, "epoch": 1337} {"train_loss": -11.375221252441406, "global_step": 224731, "epoch": 1337} {"train_loss": -11.536593437194824, "global_step": 224732, "epoch": 1337} {"train_loss": -11.337080001831055, "global_step": 224733, "epoch": 1337} {"train_loss": -11.487858772277832, "global_step": 224734, "epoch": 1337} {"train_loss": -11.64205551147461, "global_step": 224735, "epoch": 1337} {"train_loss": -11.511873245239258, "global_step": 224736, "epoch": 1337} {"train_loss": -11.51666259765625, "global_step": 224737, "epoch": 1337} {"train_loss": -11.730228424072266, "global_step": 224738, "epoch": 1337} {"train_loss": -11.589637756347656, "global_step": 224739, "epoch": 1337} {"train_loss": -11.468238830566406, "global_step": 224740, "epoch": 1337} {"train_loss": -11.63405704498291, "global_step": 224741, "epoch": 1337} {"train_loss": -11.408307075500488, "global_step": 224742, "epoch": 1337} {"train_loss": -11.573943138122559, "global_step": 224743, "epoch": 1337} {"train_loss": -11.628087997436523, "global_step": 224744, "epoch": 1337} {"train_loss": -11.477615356445312, "global_step": 224745, "epoch": 1337} {"train_loss": -11.693513870239258, "global_step": 224746, "epoch": 1337} {"train_loss": -11.480182647705078, "global_step": 224747, "epoch": 1337} {"train_loss": -11.774219512939453, "global_step": 224748, "epoch": 1337} {"train_loss": -11.680883407592773, "global_step": 224749, "epoch": 1337} {"train_loss": -11.882659912109375, "global_step": 224750, "epoch": 1337} {"train_loss": -11.783069610595703, "global_step": 224751, "epoch": 1337} {"train_loss": -11.821091651916504, "global_step": 224752, "epoch": 1337} {"train_loss": -11.689611434936523, "global_step": 224753, "epoch": 1337} {"train_loss": -11.774629592895508, "global_step": 224754, "epoch": 1337} {"train_loss": -11.830341339111328, "global_step": 224755, "epoch": 1337} {"train_loss": -11.798980712890625, "global_step": 224756, "epoch": 1337} {"train_loss": -11.85794448852539, "global_step": 224757, "epoch": 1337} {"train_loss": -11.880319595336914, "global_step": 224758, "epoch": 1337} {"train_loss": -11.865777969360352, "global_step": 224759, "epoch": 1337} {"train_loss": -11.983213424682617, "global_step": 224760, "epoch": 1337} {"train_loss": -11.693316459655762, "global_step": 224761, "epoch": 1337} {"train_loss": -11.69011116027832, "global_step": 224762, "epoch": 1337} {"train_loss": -11.824823379516602, "global_step": 224763, "epoch": 1337} {"train_loss": -11.745311737060547, "global_step": 224764, "epoch": 1337} {"train_loss": -11.684907913208008, "global_step": 224765, "epoch": 1337} {"train_loss": -11.80179214477539, "global_step": 224766, "epoch": 1337} {"train_loss": -11.771858215332031, "global_step": 224767, "epoch": 1337} {"train_loss": -11.7728910446167, "global_step": 224768, "epoch": 1337} {"train_loss": -11.442146301269531, "global_step": 224769, "epoch": 1337} {"train_loss": -11.738523483276367, "global_step": 224770, "epoch": 1337} {"train_loss": -11.93189811706543, "global_step": 224771, "epoch": 1337} {"train_loss": -11.74266529083252, "global_step": 224772, "epoch": 1337} {"train_loss": -11.503854751586914, "global_step": 224773, "epoch": 1337} {"train_loss": -11.997123718261719, "global_step": 224774, "epoch": 1337} {"train_loss": -11.733528137207031, "global_step": 224775, "epoch": 1337} {"train_loss": -11.981990814208984, "global_step": 224776, "epoch": 1337} {"train_loss": -12.039667129516602, "global_step": 224777, "epoch": 1337} {"train_loss": -11.817815780639648, "global_step": 224778, "epoch": 1337} {"train_loss": -11.907848358154297, "global_step": 224779, "epoch": 1337} {"train_loss": -12.020743370056152, "global_step": 224780, "epoch": 1337} {"train_loss": -11.84649658203125, "global_step": 224781, "epoch": 1337} {"train_loss": -11.9149808883667, "global_step": 224782, "epoch": 1337} {"train_loss": -11.232297477268038, "global_step": 224783, "epoch": 1337, "val_loss": 259435.484375} {"train_loss": -11.748146057128906, "global_step": 224784, "epoch": 1338} {"train_loss": -10.994906425476074, "global_step": 224785, "epoch": 1338} {"train_loss": -11.168437004089355, "global_step": 224786, "epoch": 1338} {"train_loss": -11.82426643371582, "global_step": 224787, "epoch": 1338} {"train_loss": -11.559370994567871, "global_step": 224788, "epoch": 1338} {"train_loss": -11.280953407287598, "global_step": 224789, "epoch": 1338} {"train_loss": -11.837529182434082, "global_step": 224790, "epoch": 1338} {"train_loss": -11.532367706298828, "global_step": 224791, "epoch": 1338} {"train_loss": -11.136768341064453, "global_step": 224792, "epoch": 1338} {"train_loss": -11.548601150512695, "global_step": 224793, "epoch": 1338} {"train_loss": -11.788877487182617, "global_step": 224794, "epoch": 1338} {"train_loss": -11.563764572143555, "global_step": 224795, "epoch": 1338} {"train_loss": -11.633879661560059, "global_step": 224796, "epoch": 1338} {"train_loss": -11.369084358215332, "global_step": 224797, "epoch": 1338} {"train_loss": -11.852837562561035, "global_step": 224798, "epoch": 1338} {"train_loss": -11.0726318359375, "global_step": 224799, "epoch": 1338} {"train_loss": -11.951878547668457, "global_step": 224800, "epoch": 1338} {"train_loss": -11.013404846191406, "global_step": 224801, "epoch": 1338} {"train_loss": -11.370466232299805, "global_step": 224802, "epoch": 1338} {"train_loss": -11.187042236328125, "global_step": 224803, "epoch": 1338} {"train_loss": -11.479312896728516, "global_step": 224804, "epoch": 1338} {"train_loss": -11.395062446594238, "global_step": 224805, "epoch": 1338} {"train_loss": -11.487054824829102, "global_step": 224806, "epoch": 1338} {"train_loss": -11.129389762878418, "global_step": 224807, "epoch": 1338} {"train_loss": -11.210723876953125, "global_step": 224808, "epoch": 1338} {"train_loss": -11.815935134887695, "global_step": 224809, "epoch": 1338} {"train_loss": -11.405104637145996, "global_step": 224810, "epoch": 1338} {"train_loss": -11.039114952087402, "global_step": 224811, "epoch": 1338} {"train_loss": -11.408878326416016, "global_step": 224812, "epoch": 1338} {"train_loss": -11.51294231414795, "global_step": 224813, "epoch": 1338} {"train_loss": -11.11620807647705, "global_step": 224814, "epoch": 1338} {"train_loss": -11.292263984680176, "global_step": 224815, "epoch": 1338} {"train_loss": -11.797758102416992, "global_step": 224816, "epoch": 1338} {"train_loss": -11.086336135864258, "global_step": 224817, "epoch": 1338} {"train_loss": -11.292305946350098, "global_step": 224818, "epoch": 1338} {"train_loss": -11.494855880737305, "global_step": 224819, "epoch": 1338} {"train_loss": -11.363999366760254, "global_step": 224820, "epoch": 1338} {"train_loss": -11.807208061218262, "global_step": 224821, "epoch": 1338} {"train_loss": -11.597200393676758, "global_step": 224822, "epoch": 1338} {"train_loss": -11.487565994262695, "global_step": 224823, "epoch": 1338} {"train_loss": -11.512785911560059, "global_step": 224824, "epoch": 1338} {"train_loss": -11.428308486938477, "global_step": 224825, "epoch": 1338} {"train_loss": -11.340761184692383, "global_step": 224826, "epoch": 1338} {"train_loss": -11.29405403137207, "global_step": 224827, "epoch": 1338} {"train_loss": -11.323633193969727, "global_step": 224828, "epoch": 1338} {"train_loss": -11.094149589538574, "global_step": 224829, "epoch": 1338} {"train_loss": -11.882347106933594, "global_step": 224830, "epoch": 1338} {"train_loss": -11.269237518310547, "global_step": 224831, "epoch": 1338} {"train_loss": -11.481822967529297, "global_step": 224832, "epoch": 1338} {"train_loss": -11.364969253540039, "global_step": 224833, "epoch": 1338} {"train_loss": -11.700189590454102, "global_step": 224834, "epoch": 1338} {"train_loss": -11.399948120117188, "global_step": 224835, "epoch": 1338} {"train_loss": -11.250482559204102, "global_step": 224836, "epoch": 1338} {"train_loss": -11.349433898925781, "global_step": 224837, "epoch": 1338} {"train_loss": -11.678343772888184, "global_step": 224838, "epoch": 1338} {"train_loss": -11.084688186645508, "global_step": 224839, "epoch": 1338} {"train_loss": -11.807722091674805, "global_step": 224840, "epoch": 1338} {"train_loss": -11.129511833190918, "global_step": 224841, "epoch": 1338} {"train_loss": -10.935179710388184, "global_step": 224842, "epoch": 1338} {"train_loss": -11.71235466003418, "global_step": 224843, "epoch": 1338} {"train_loss": -11.12875747680664, "global_step": 224844, "epoch": 1338} {"train_loss": -11.400784492492676, "global_step": 224845, "epoch": 1338} {"train_loss": -11.351551055908203, "global_step": 224846, "epoch": 1338} {"train_loss": -11.139732360839844, "global_step": 224847, "epoch": 1338} {"train_loss": -11.124810218811035, "global_step": 224848, "epoch": 1338} {"train_loss": -11.299779891967773, "global_step": 224849, "epoch": 1338} {"train_loss": -11.174007415771484, "global_step": 224850, "epoch": 1338} {"train_loss": -11.249479293823242, "global_step": 224851, "epoch": 1338} {"train_loss": -11.366525650024414, "global_step": 224852, "epoch": 1338} {"train_loss": -11.777923583984375, "global_step": 224853, "epoch": 1338} {"train_loss": -11.56641960144043, "global_step": 224854, "epoch": 1338} {"train_loss": -11.691781997680664, "global_step": 224855, "epoch": 1338} {"train_loss": -11.389385223388672, "global_step": 224856, "epoch": 1338} {"train_loss": -11.676090240478516, "global_step": 224857, "epoch": 1338} {"train_loss": -11.963342666625977, "global_step": 224858, "epoch": 1338} {"train_loss": -11.580461502075195, "global_step": 224859, "epoch": 1338} {"train_loss": -11.860492706298828, "global_step": 224860, "epoch": 1338} {"train_loss": -11.508657455444336, "global_step": 224861, "epoch": 1338} {"train_loss": -11.815573692321777, "global_step": 224862, "epoch": 1338} {"train_loss": -11.818588256835938, "global_step": 224863, "epoch": 1338} {"train_loss": -11.71953296661377, "global_step": 224864, "epoch": 1338} {"train_loss": -11.966318130493164, "global_step": 224865, "epoch": 1338} {"train_loss": -11.697998046875, "global_step": 224866, "epoch": 1338} {"train_loss": -11.643026351928711, "global_step": 224867, "epoch": 1338} {"train_loss": -11.541330337524414, "global_step": 224868, "epoch": 1338} {"train_loss": -11.219919204711914, "global_step": 224869, "epoch": 1338} {"train_loss": -12.127187728881836, "global_step": 224870, "epoch": 1338} {"train_loss": -11.122720718383789, "global_step": 224871, "epoch": 1338} {"train_loss": -11.417743682861328, "global_step": 224872, "epoch": 1338} {"train_loss": -11.214824676513672, "global_step": 224873, "epoch": 1338} {"train_loss": -10.83218002319336, "global_step": 224874, "epoch": 1338} {"train_loss": -10.916411399841309, "global_step": 224875, "epoch": 1338} {"train_loss": -10.637603759765625, "global_step": 224876, "epoch": 1338} {"train_loss": -10.253958702087402, "global_step": 224877, "epoch": 1338} {"train_loss": -11.218217849731445, "global_step": 224878, "epoch": 1338} {"train_loss": -9.698264122009277, "global_step": 224879, "epoch": 1338} {"train_loss": -10.295839309692383, "global_step": 224880, "epoch": 1338} {"train_loss": -10.734844207763672, "global_step": 224881, "epoch": 1338} {"train_loss": -10.698694229125977, "global_step": 224882, "epoch": 1338} {"train_loss": -10.758448600769043, "global_step": 224883, "epoch": 1338} {"train_loss": -10.49378776550293, "global_step": 224884, "epoch": 1338} {"train_loss": -11.411651611328125, "global_step": 224885, "epoch": 1338} {"train_loss": -10.840544700622559, "global_step": 224886, "epoch": 1338} {"train_loss": -11.612520217895508, "global_step": 224887, "epoch": 1338} {"train_loss": -10.958934783935547, "global_step": 224888, "epoch": 1338} {"train_loss": -11.458891868591309, "global_step": 224889, "epoch": 1338} {"train_loss": -11.286944389343262, "global_step": 224890, "epoch": 1338} {"train_loss": -11.271092414855957, "global_step": 224891, "epoch": 1338} {"train_loss": -11.431245803833008, "global_step": 224892, "epoch": 1338} {"train_loss": -11.312365531921387, "global_step": 224893, "epoch": 1338} {"train_loss": -11.623542785644531, "global_step": 224894, "epoch": 1338} {"train_loss": -11.496828079223633, "global_step": 224895, "epoch": 1338} {"train_loss": -11.295317649841309, "global_step": 224896, "epoch": 1338} {"train_loss": -11.324742317199707, "global_step": 224897, "epoch": 1338} {"train_loss": -11.194856643676758, "global_step": 224898, "epoch": 1338} {"train_loss": -11.503828048706055, "global_step": 224899, "epoch": 1338} {"train_loss": -10.949070930480957, "global_step": 224900, "epoch": 1338} {"train_loss": -11.353377342224121, "global_step": 224901, "epoch": 1338} {"train_loss": -11.43036937713623, "global_step": 224902, "epoch": 1338} {"train_loss": -10.952733993530273, "global_step": 224903, "epoch": 1338} {"train_loss": -11.522361755371094, "global_step": 224904, "epoch": 1338} {"train_loss": -11.360798835754395, "global_step": 224905, "epoch": 1338} {"train_loss": -10.564208984375, "global_step": 224906, "epoch": 1338} {"train_loss": -11.166414260864258, "global_step": 224907, "epoch": 1338} {"train_loss": -10.381515502929688, "global_step": 224908, "epoch": 1338} {"train_loss": -11.480438232421875, "global_step": 224909, "epoch": 1338} {"train_loss": -10.412965774536133, "global_step": 224910, "epoch": 1338} {"train_loss": -11.629053115844727, "global_step": 224911, "epoch": 1338} {"train_loss": -10.289121627807617, "global_step": 224912, "epoch": 1338} {"train_loss": -11.47708797454834, "global_step": 224913, "epoch": 1338} {"train_loss": -10.930000305175781, "global_step": 224914, "epoch": 1338} {"train_loss": -11.021646499633789, "global_step": 224915, "epoch": 1338} {"train_loss": -11.1431884765625, "global_step": 224916, "epoch": 1338} {"train_loss": -11.391693115234375, "global_step": 224917, "epoch": 1338} {"train_loss": -11.093935012817383, "global_step": 224918, "epoch": 1338} {"train_loss": -11.224730491638184, "global_step": 224919, "epoch": 1338} {"train_loss": -11.33888053894043, "global_step": 224920, "epoch": 1338} {"train_loss": -11.053476333618164, "global_step": 224921, "epoch": 1338} {"train_loss": -11.63028335571289, "global_step": 224922, "epoch": 1338} {"train_loss": -11.11172103881836, "global_step": 224923, "epoch": 1338} {"train_loss": -11.463655471801758, "global_step": 224924, "epoch": 1338} {"train_loss": -11.645406723022461, "global_step": 224925, "epoch": 1338} {"train_loss": -11.371393203735352, "global_step": 224926, "epoch": 1338} {"train_loss": -11.536251068115234, "global_step": 224927, "epoch": 1338} {"train_loss": -11.577981948852539, "global_step": 224928, "epoch": 1338} {"train_loss": -11.480297088623047, "global_step": 224929, "epoch": 1338} {"train_loss": -11.653884887695312, "global_step": 224930, "epoch": 1338} {"train_loss": -11.369505882263184, "global_step": 224931, "epoch": 1338} {"train_loss": -11.565130233764648, "global_step": 224932, "epoch": 1338} {"train_loss": -11.625041961669922, "global_step": 224933, "epoch": 1338} {"train_loss": -11.305472373962402, "global_step": 224934, "epoch": 1338} {"train_loss": -11.742888450622559, "global_step": 224935, "epoch": 1338} {"train_loss": -11.752618789672852, "global_step": 224936, "epoch": 1338} {"train_loss": -11.536343574523926, "global_step": 224937, "epoch": 1338} {"train_loss": -11.551027297973633, "global_step": 224938, "epoch": 1338} {"train_loss": -11.716691970825195, "global_step": 224939, "epoch": 1338} {"train_loss": -11.416389465332031, "global_step": 224940, "epoch": 1338} {"train_loss": -11.752949714660645, "global_step": 224941, "epoch": 1338} {"train_loss": -11.659578323364258, "global_step": 224942, "epoch": 1338} {"train_loss": -12.035865783691406, "global_step": 224943, "epoch": 1338} {"train_loss": -11.706975936889648, "global_step": 224944, "epoch": 1338} {"train_loss": -11.822810173034668, "global_step": 224945, "epoch": 1338} {"train_loss": -11.846168518066406, "global_step": 224946, "epoch": 1338} {"train_loss": -11.594450950622559, "global_step": 224947, "epoch": 1338} {"train_loss": -11.619091033935547, "global_step": 224948, "epoch": 1338} {"train_loss": -11.634201049804688, "global_step": 224949, "epoch": 1338} {"train_loss": -12.044662475585938, "global_step": 224950, "epoch": 1338} {"train_loss": -11.372710636683873, "global_step": 224951, "epoch": 1338, "val_loss": 262505.8125} {"train_loss": -11.865791320800781, "global_step": 224952, "epoch": 1339} {"train_loss": -11.968103408813477, "global_step": 224953, "epoch": 1339} {"train_loss": -11.751728057861328, "global_step": 224954, "epoch": 1339} {"train_loss": -11.69930362701416, "global_step": 224955, "epoch": 1339} {"train_loss": -11.746500015258789, "global_step": 224956, "epoch": 1339} {"train_loss": -12.005990982055664, "global_step": 224957, "epoch": 1339} {"train_loss": -11.86490249633789, "global_step": 224958, "epoch": 1339} {"train_loss": -11.943995475769043, "global_step": 224959, "epoch": 1339} {"train_loss": -12.031511306762695, "global_step": 224960, "epoch": 1339} {"train_loss": -11.816916465759277, "global_step": 224961, "epoch": 1339} {"train_loss": -12.049850463867188, "global_step": 224962, "epoch": 1339} {"train_loss": -11.864616394042969, "global_step": 224963, "epoch": 1339} {"train_loss": -11.816125869750977, "global_step": 224964, "epoch": 1339} {"train_loss": -12.009482383728027, "global_step": 224965, "epoch": 1339} {"train_loss": -11.961590766906738, "global_step": 224966, "epoch": 1339} {"train_loss": -11.604745864868164, "global_step": 224967, "epoch": 1339} {"train_loss": -11.403060913085938, "global_step": 224968, "epoch": 1339} {"train_loss": -11.067743301391602, "global_step": 224969, "epoch": 1339} {"train_loss": -11.78841781616211, "global_step": 224970, "epoch": 1339} {"train_loss": -11.366423606872559, "global_step": 224971, "epoch": 1339} {"train_loss": -10.160533905029297, "global_step": 224972, "epoch": 1339} {"train_loss": -10.796470642089844, "global_step": 224973, "epoch": 1339} {"train_loss": -11.382869720458984, "global_step": 224974, "epoch": 1339} {"train_loss": -10.016185760498047, "global_step": 224975, "epoch": 1339} {"train_loss": -10.76642894744873, "global_step": 224976, "epoch": 1339} {"train_loss": -10.537092208862305, "global_step": 224977, "epoch": 1339} {"train_loss": -8.760513305664062, "global_step": 224978, "epoch": 1339} {"train_loss": -9.116742134094238, "global_step": 224979, "epoch": 1339} {"train_loss": -11.144976615905762, "global_step": 224980, "epoch": 1339} {"train_loss": -10.348123550415039, "global_step": 224981, "epoch": 1339} {"train_loss": -10.171579360961914, "global_step": 224982, "epoch": 1339} {"train_loss": -10.912649154663086, "global_step": 224983, "epoch": 1339} {"train_loss": -10.31772232055664, "global_step": 224984, "epoch": 1339} {"train_loss": -11.372672080993652, "global_step": 224985, "epoch": 1339} {"train_loss": -10.617276191711426, "global_step": 224986, "epoch": 1339} {"train_loss": -11.353141784667969, "global_step": 224987, "epoch": 1339} {"train_loss": -11.047187805175781, "global_step": 224988, "epoch": 1339} {"train_loss": -11.364266395568848, "global_step": 224989, "epoch": 1339} {"train_loss": -11.161445617675781, "global_step": 224990, "epoch": 1339} {"train_loss": -11.513218879699707, "global_step": 224991, "epoch": 1339} {"train_loss": -10.860288619995117, "global_step": 224992, "epoch": 1339} {"train_loss": -11.453943252563477, "global_step": 224993, "epoch": 1339} {"train_loss": -11.165701866149902, "global_step": 224994, "epoch": 1339} {"train_loss": -11.248319625854492, "global_step": 224995, "epoch": 1339} {"train_loss": -11.21900463104248, "global_step": 224996, "epoch": 1339} {"train_loss": -11.322051048278809, "global_step": 224997, "epoch": 1339} {"train_loss": -11.382065773010254, "global_step": 224998, "epoch": 1339} {"train_loss": -10.949668884277344, "global_step": 224999, "epoch": 1339} {"train_loss": -11.544851303100586, "global_step": 225000, "epoch": 1339} {"train_loss": -11.095142364501953, "global_step": 225001, "epoch": 1339} {"train_loss": -11.550315856933594, "global_step": 225002, "epoch": 1339} {"train_loss": -11.451950073242188, "global_step": 225003, "epoch": 1339} {"train_loss": -11.36100959777832, "global_step": 225004, "epoch": 1339} {"train_loss": -11.322246551513672, "global_step": 225005, "epoch": 1339} {"train_loss": -11.409854888916016, "global_step": 225006, "epoch": 1339} {"train_loss": -11.019062042236328, "global_step": 225007, "epoch": 1339} {"train_loss": -11.392091751098633, "global_step": 225008, "epoch": 1339} {"train_loss": -10.979448318481445, "global_step": 225009, "epoch": 1339} {"train_loss": -11.309882164001465, "global_step": 225010, "epoch": 1339} {"train_loss": -11.170258522033691, "global_step": 225011, "epoch": 1339} {"train_loss": -11.635618209838867, "global_step": 225012, "epoch": 1339} {"train_loss": -11.501514434814453, "global_step": 225013, "epoch": 1339} {"train_loss": -11.514164924621582, "global_step": 225014, "epoch": 1339} {"train_loss": -11.659880638122559, "global_step": 225015, "epoch": 1339} {"train_loss": -11.382193565368652, "global_step": 225016, "epoch": 1339} {"train_loss": -11.442398071289062, "global_step": 225017, "epoch": 1339} {"train_loss": -11.071136474609375, "global_step": 225018, "epoch": 1339} {"train_loss": -11.505853652954102, "global_step": 225019, "epoch": 1339} {"train_loss": -11.064592361450195, "global_step": 225020, "epoch": 1339} {"train_loss": -11.923397064208984, "global_step": 225021, "epoch": 1339} {"train_loss": -11.168646812438965, "global_step": 225022, "epoch": 1339} {"train_loss": -11.716818809509277, "global_step": 225023, "epoch": 1339} {"train_loss": -11.506720542907715, "global_step": 225024, "epoch": 1339} {"train_loss": -11.230879783630371, "global_step": 225025, "epoch": 1339} {"train_loss": -11.78269100189209, "global_step": 225026, "epoch": 1339} {"train_loss": -11.50876235961914, "global_step": 225027, "epoch": 1339} {"train_loss": -11.483034133911133, "global_step": 225028, "epoch": 1339} {"train_loss": -11.845478057861328, "global_step": 225029, "epoch": 1339} {"train_loss": -11.559986114501953, "global_step": 225030, "epoch": 1339} {"train_loss": -11.735001564025879, "global_step": 225031, "epoch": 1339} {"train_loss": -11.641087532043457, "global_step": 225032, "epoch": 1339} {"train_loss": -11.762889862060547, "global_step": 225033, "epoch": 1339} {"train_loss": -11.505159378051758, "global_step": 225034, "epoch": 1339} {"train_loss": -11.892898559570312, "global_step": 225035, "epoch": 1339} {"train_loss": -11.601593017578125, "global_step": 225036, "epoch": 1339} {"train_loss": -11.580169677734375, "global_step": 225037, "epoch": 1339} {"train_loss": -11.829635620117188, "global_step": 225038, "epoch": 1339} {"train_loss": -11.613525390625, "global_step": 225039, "epoch": 1339} {"train_loss": -11.98387336730957, "global_step": 225040, "epoch": 1339} {"train_loss": -11.59006404876709, "global_step": 225041, "epoch": 1339} {"train_loss": -11.722517013549805, "global_step": 225042, "epoch": 1339} {"train_loss": -11.871366500854492, "global_step": 225043, "epoch": 1339} {"train_loss": -11.482385635375977, "global_step": 225044, "epoch": 1339} {"train_loss": -11.920190811157227, "global_step": 225045, "epoch": 1339} {"train_loss": -11.393648147583008, "global_step": 225046, "epoch": 1339} {"train_loss": -11.807684898376465, "global_step": 225047, "epoch": 1339} {"train_loss": -11.665511131286621, "global_step": 225048, "epoch": 1339} {"train_loss": -11.9292573928833, "global_step": 225049, "epoch": 1339} {"train_loss": -12.072149276733398, "global_step": 225050, "epoch": 1339} {"train_loss": -11.778388977050781, "global_step": 225051, "epoch": 1339} {"train_loss": -12.064364433288574, "global_step": 225052, "epoch": 1339} {"train_loss": -11.957061767578125, "global_step": 225053, "epoch": 1339} {"train_loss": -11.871944427490234, "global_step": 225054, "epoch": 1339} {"train_loss": -11.924699783325195, "global_step": 225055, "epoch": 1339} {"train_loss": -11.836410522460938, "global_step": 225056, "epoch": 1339} {"train_loss": -11.838369369506836, "global_step": 225057, "epoch": 1339} {"train_loss": -11.878744125366211, "global_step": 225058, "epoch": 1339} {"train_loss": -11.92765998840332, "global_step": 225059, "epoch": 1339} {"train_loss": -11.698991775512695, "global_step": 225060, "epoch": 1339} {"train_loss": -11.939512252807617, "global_step": 225061, "epoch": 1339} {"train_loss": -11.749835968017578, "global_step": 225062, "epoch": 1339} {"train_loss": -11.957939147949219, "global_step": 225063, "epoch": 1339} {"train_loss": -11.780525207519531, "global_step": 225064, "epoch": 1339} {"train_loss": -11.944345474243164, "global_step": 225065, "epoch": 1339} {"train_loss": -11.69351863861084, "global_step": 225066, "epoch": 1339} {"train_loss": -11.374267578125, "global_step": 225067, "epoch": 1339} {"train_loss": -11.848308563232422, "global_step": 225068, "epoch": 1339} {"train_loss": -11.562405586242676, "global_step": 225069, "epoch": 1339} {"train_loss": -11.652549743652344, "global_step": 225070, "epoch": 1339} {"train_loss": -11.909479141235352, "global_step": 225071, "epoch": 1339} {"train_loss": -11.692031860351562, "global_step": 225072, "epoch": 1339} {"train_loss": -11.921335220336914, "global_step": 225073, "epoch": 1339} {"train_loss": -11.62138557434082, "global_step": 225074, "epoch": 1339} {"train_loss": -11.863588333129883, "global_step": 225075, "epoch": 1339} {"train_loss": -11.448456764221191, "global_step": 225076, "epoch": 1339} {"train_loss": -11.965989112854004, "global_step": 225077, "epoch": 1339} {"train_loss": -11.546234130859375, "global_step": 225078, "epoch": 1339} {"train_loss": -11.642255783081055, "global_step": 225079, "epoch": 1339} {"train_loss": -11.058341979980469, "global_step": 225080, "epoch": 1339} {"train_loss": -11.22729206085205, "global_step": 225081, "epoch": 1339} {"train_loss": -11.713525772094727, "global_step": 225082, "epoch": 1339} {"train_loss": -11.784360885620117, "global_step": 225083, "epoch": 1339} {"train_loss": -11.58453369140625, "global_step": 225084, "epoch": 1339} {"train_loss": -11.846970558166504, "global_step": 225085, "epoch": 1339} {"train_loss": -11.594704627990723, "global_step": 225086, "epoch": 1339} {"train_loss": -11.211788177490234, "global_step": 225087, "epoch": 1339} {"train_loss": -11.630970001220703, "global_step": 225088, "epoch": 1339} {"train_loss": -11.645071029663086, "global_step": 225089, "epoch": 1339} {"train_loss": -11.939112663269043, "global_step": 225090, "epoch": 1339} {"train_loss": -11.490310668945312, "global_step": 225091, "epoch": 1339} {"train_loss": -11.963826179504395, "global_step": 225092, "epoch": 1339} {"train_loss": -11.32659912109375, "global_step": 225093, "epoch": 1339} {"train_loss": -11.767338752746582, "global_step": 225094, "epoch": 1339} {"train_loss": -11.763572692871094, "global_step": 225095, "epoch": 1339} {"train_loss": -11.716302871704102, "global_step": 225096, "epoch": 1339} {"train_loss": -11.167234420776367, "global_step": 225097, "epoch": 1339} {"train_loss": -11.500675201416016, "global_step": 225098, "epoch": 1339} {"train_loss": -10.157878875732422, "global_step": 225099, "epoch": 1339} {"train_loss": -10.900182723999023, "global_step": 225100, "epoch": 1339} {"train_loss": -10.94259262084961, "global_step": 225101, "epoch": 1339} {"train_loss": -11.041994094848633, "global_step": 225102, "epoch": 1339} {"train_loss": -11.418688774108887, "global_step": 225103, "epoch": 1339} {"train_loss": -11.071673393249512, "global_step": 225104, "epoch": 1339} {"train_loss": -10.773275375366211, "global_step": 225105, "epoch": 1339} {"train_loss": -11.552398681640625, "global_step": 225106, "epoch": 1339} {"train_loss": -10.175738334655762, "global_step": 225107, "epoch": 1339} {"train_loss": -10.648448944091797, "global_step": 225108, "epoch": 1339} {"train_loss": -10.717162132263184, "global_step": 225109, "epoch": 1339} {"train_loss": -10.312640190124512, "global_step": 225110, "epoch": 1339} {"train_loss": -11.487845420837402, "global_step": 225111, "epoch": 1339} {"train_loss": -10.098628044128418, "global_step": 225112, "epoch": 1339} {"train_loss": -11.478231430053711, "global_step": 225113, "epoch": 1339} {"train_loss": -10.067840576171875, "global_step": 225114, "epoch": 1339} {"train_loss": -10.305746078491211, "global_step": 225115, "epoch": 1339} {"train_loss": -10.047672271728516, "global_step": 225116, "epoch": 1339} {"train_loss": -10.568347930908203, "global_step": 225117, "epoch": 1339} {"train_loss": -9.374786376953125, "global_step": 225118, "epoch": 1339} {"train_loss": -11.37617874713171, "global_step": 225119, "epoch": 1339, "val_loss": 261449.09375} {"train_loss": -10.33751392364502, "global_step": 225120, "epoch": 1340} {"train_loss": -11.03071403503418, "global_step": 225121, "epoch": 1340} {"train_loss": -10.662054061889648, "global_step": 225122, "epoch": 1340} {"train_loss": -10.109498977661133, "global_step": 225123, "epoch": 1340} {"train_loss": -10.747093200683594, "global_step": 225124, "epoch": 1340} {"train_loss": -10.361757278442383, "global_step": 225125, "epoch": 1340} {"train_loss": -11.339164733886719, "global_step": 225126, "epoch": 1340} {"train_loss": -10.548683166503906, "global_step": 225127, "epoch": 1340} {"train_loss": -11.240011215209961, "global_step": 225128, "epoch": 1340} {"train_loss": -10.920384407043457, "global_step": 225129, "epoch": 1340} {"train_loss": -11.196481704711914, "global_step": 225130, "epoch": 1340} {"train_loss": -11.524860382080078, "global_step": 225131, "epoch": 1340} {"train_loss": -11.33255386352539, "global_step": 225132, "epoch": 1340} {"train_loss": -11.292763710021973, "global_step": 225133, "epoch": 1340} {"train_loss": -11.59211540222168, "global_step": 225134, "epoch": 1340} {"train_loss": -11.32139778137207, "global_step": 225135, "epoch": 1340} {"train_loss": -11.315361022949219, "global_step": 225136, "epoch": 1340} {"train_loss": -11.266524314880371, "global_step": 225137, "epoch": 1340} {"train_loss": -11.21112060546875, "global_step": 225138, "epoch": 1340} {"train_loss": -11.485321044921875, "global_step": 225139, "epoch": 1340} {"train_loss": -11.723743438720703, "global_step": 225140, "epoch": 1340} {"train_loss": -11.219273567199707, "global_step": 225141, "epoch": 1340} {"train_loss": -11.466123580932617, "global_step": 225142, "epoch": 1340} {"train_loss": -11.45448112487793, "global_step": 225143, "epoch": 1340} {"train_loss": -11.424182891845703, "global_step": 225144, "epoch": 1340} {"train_loss": -11.627802848815918, "global_step": 225145, "epoch": 1340} {"train_loss": -11.616039276123047, "global_step": 225146, "epoch": 1340} {"train_loss": -11.551345825195312, "global_step": 225147, "epoch": 1340} {"train_loss": -11.741796493530273, "global_step": 225148, "epoch": 1340} {"train_loss": -11.515057563781738, "global_step": 225149, "epoch": 1340} {"train_loss": -11.716510772705078, "global_step": 225150, "epoch": 1340} {"train_loss": -11.675137519836426, "global_step": 225151, "epoch": 1340} {"train_loss": -11.74708080291748, "global_step": 225152, "epoch": 1340} {"train_loss": -11.867098808288574, "global_step": 225153, "epoch": 1340} {"train_loss": -11.661169052124023, "global_step": 225154, "epoch": 1340} {"train_loss": -11.842172622680664, "global_step": 225155, "epoch": 1340} {"train_loss": -11.654874801635742, "global_step": 225156, "epoch": 1340} {"train_loss": -11.769943237304688, "global_step": 225157, "epoch": 1340} {"train_loss": -11.928071975708008, "global_step": 225158, "epoch": 1340} {"train_loss": -11.846588134765625, "global_step": 225159, "epoch": 1340} {"train_loss": -11.688284873962402, "global_step": 225160, "epoch": 1340} {"train_loss": -11.932670593261719, "global_step": 225161, "epoch": 1340} {"train_loss": -11.919320106506348, "global_step": 225162, "epoch": 1340} {"train_loss": -11.8856201171875, "global_step": 225163, "epoch": 1340} {"train_loss": -11.841651916503906, "global_step": 225164, "epoch": 1340} {"train_loss": -11.936769485473633, "global_step": 225165, "epoch": 1340} {"train_loss": -11.920042037963867, "global_step": 225166, "epoch": 1340} {"train_loss": -11.922433853149414, "global_step": 225167, "epoch": 1340} {"train_loss": -11.701543807983398, "global_step": 225168, "epoch": 1340} {"train_loss": -11.90353012084961, "global_step": 225169, "epoch": 1340} {"train_loss": -12.112650871276855, "global_step": 225170, "epoch": 1340} {"train_loss": -11.849950790405273, "global_step": 225171, "epoch": 1340} {"train_loss": -11.881797790527344, "global_step": 225172, "epoch": 1340} {"train_loss": -12.04195785522461, "global_step": 225173, "epoch": 1340} {"train_loss": -11.872695922851562, "global_step": 225174, "epoch": 1340} {"train_loss": -12.122995376586914, "global_step": 225175, "epoch": 1340} {"train_loss": -12.029829025268555, "global_step": 225176, "epoch": 1340} {"train_loss": -11.826081275939941, "global_step": 225177, "epoch": 1340} {"train_loss": -11.953885078430176, "global_step": 225178, "epoch": 1340} {"train_loss": -11.840444564819336, "global_step": 225179, "epoch": 1340} {"train_loss": -11.613155364990234, "global_step": 225180, "epoch": 1340} {"train_loss": -11.117971420288086, "global_step": 225181, "epoch": 1340} {"train_loss": -11.130144119262695, "global_step": 225182, "epoch": 1340} {"train_loss": -10.591558456420898, "global_step": 225183, "epoch": 1340} {"train_loss": -11.457337379455566, "global_step": 225184, "epoch": 1340} {"train_loss": -9.687238693237305, "global_step": 225185, "epoch": 1340} {"train_loss": -11.468452453613281, "global_step": 225186, "epoch": 1340} {"train_loss": -10.419658660888672, "global_step": 225187, "epoch": 1340} {"train_loss": -11.092218399047852, "global_step": 225188, "epoch": 1340} {"train_loss": -11.871953964233398, "global_step": 225189, "epoch": 1340} {"train_loss": -11.199798583984375, "global_step": 225190, "epoch": 1340} {"train_loss": -11.34576416015625, "global_step": 225191, "epoch": 1340} {"train_loss": -11.316169738769531, "global_step": 225192, "epoch": 1340} {"train_loss": -11.120429992675781, "global_step": 225193, "epoch": 1340} {"train_loss": -10.799863815307617, "global_step": 225194, "epoch": 1340} {"train_loss": -11.398137092590332, "global_step": 225195, "epoch": 1340} {"train_loss": -11.00298023223877, "global_step": 225196, "epoch": 1340} {"train_loss": -11.428733825683594, "global_step": 225197, "epoch": 1340} {"train_loss": -10.665966033935547, "global_step": 225198, "epoch": 1340} {"train_loss": -11.41654109954834, "global_step": 225199, "epoch": 1340} {"train_loss": -11.196931838989258, "global_step": 225200, "epoch": 1340} {"train_loss": -10.833732604980469, "global_step": 225201, "epoch": 1340} {"train_loss": -11.290048599243164, "global_step": 225202, "epoch": 1340} {"train_loss": -10.763116836547852, "global_step": 225203, "epoch": 1340} {"train_loss": -11.266149520874023, "global_step": 225204, "epoch": 1340} {"train_loss": -10.773456573486328, "global_step": 225205, "epoch": 1340} {"train_loss": -11.566633224487305, "global_step": 225206, "epoch": 1340} {"train_loss": -10.971037864685059, "global_step": 225207, "epoch": 1340} {"train_loss": -11.443253517150879, "global_step": 225208, "epoch": 1340} {"train_loss": -11.2854585647583, "global_step": 225209, "epoch": 1340} {"train_loss": -11.670955657958984, "global_step": 225210, "epoch": 1340} {"train_loss": -11.684318542480469, "global_step": 225211, "epoch": 1340} {"train_loss": -11.355406761169434, "global_step": 225212, "epoch": 1340} {"train_loss": -11.707080841064453, "global_step": 225213, "epoch": 1340} {"train_loss": -11.207643508911133, "global_step": 225214, "epoch": 1340} {"train_loss": -11.395251274108887, "global_step": 225215, "epoch": 1340} {"train_loss": -11.36042594909668, "global_step": 225216, "epoch": 1340} {"train_loss": -11.580791473388672, "global_step": 225217, "epoch": 1340} {"train_loss": -11.047648429870605, "global_step": 225218, "epoch": 1340} {"train_loss": -11.34918212890625, "global_step": 225219, "epoch": 1340} {"train_loss": -11.345846176147461, "global_step": 225220, "epoch": 1340} {"train_loss": -11.705195426940918, "global_step": 225221, "epoch": 1340} {"train_loss": -11.274667739868164, "global_step": 225222, "epoch": 1340} {"train_loss": -11.57779598236084, "global_step": 225223, "epoch": 1340} {"train_loss": -11.479294776916504, "global_step": 225224, "epoch": 1340} {"train_loss": -11.196533203125, "global_step": 225225, "epoch": 1340} {"train_loss": -11.51645565032959, "global_step": 225226, "epoch": 1340} {"train_loss": -11.61372184753418, "global_step": 225227, "epoch": 1340} {"train_loss": -11.459446907043457, "global_step": 225228, "epoch": 1340} {"train_loss": -11.404688835144043, "global_step": 225229, "epoch": 1340} {"train_loss": -10.963998794555664, "global_step": 225230, "epoch": 1340} {"train_loss": -11.112895965576172, "global_step": 225231, "epoch": 1340} {"train_loss": -11.68900203704834, "global_step": 225232, "epoch": 1340} {"train_loss": -11.194870948791504, "global_step": 225233, "epoch": 1340} {"train_loss": -11.26551628112793, "global_step": 225234, "epoch": 1340} {"train_loss": -11.491430282592773, "global_step": 225235, "epoch": 1340} {"train_loss": -11.563811302185059, "global_step": 225236, "epoch": 1340} {"train_loss": -11.807015419006348, "global_step": 225237, "epoch": 1340} {"train_loss": -11.320335388183594, "global_step": 225238, "epoch": 1340} {"train_loss": -11.413244247436523, "global_step": 225239, "epoch": 1340} {"train_loss": -11.178716659545898, "global_step": 225240, "epoch": 1340} {"train_loss": -11.427164077758789, "global_step": 225241, "epoch": 1340} {"train_loss": -11.596656799316406, "global_step": 225242, "epoch": 1340} {"train_loss": -11.3846435546875, "global_step": 225243, "epoch": 1340} {"train_loss": -11.579852104187012, "global_step": 225244, "epoch": 1340} {"train_loss": -11.467535018920898, "global_step": 225245, "epoch": 1340} {"train_loss": -11.624011993408203, "global_step": 225246, "epoch": 1340} {"train_loss": -11.58873176574707, "global_step": 225247, "epoch": 1340} {"train_loss": -11.152962684631348, "global_step": 225248, "epoch": 1340} {"train_loss": -11.68548583984375, "global_step": 225249, "epoch": 1340} {"train_loss": -11.596177101135254, "global_step": 225250, "epoch": 1340} {"train_loss": -11.637894630432129, "global_step": 225251, "epoch": 1340} {"train_loss": -11.569486618041992, "global_step": 225252, "epoch": 1340} {"train_loss": -11.598255157470703, "global_step": 225253, "epoch": 1340} {"train_loss": -12.000448226928711, "global_step": 225254, "epoch": 1340} {"train_loss": -11.763006210327148, "global_step": 225255, "epoch": 1340} {"train_loss": -11.935914039611816, "global_step": 225256, "epoch": 1340} {"train_loss": -11.603464126586914, "global_step": 225257, "epoch": 1340} {"train_loss": -11.906972885131836, "global_step": 225258, "epoch": 1340} {"train_loss": -11.914799690246582, "global_step": 225259, "epoch": 1340} {"train_loss": -11.889094352722168, "global_step": 225260, "epoch": 1340} {"train_loss": -11.820169448852539, "global_step": 225261, "epoch": 1340} {"train_loss": -11.783435821533203, "global_step": 225262, "epoch": 1340} {"train_loss": -11.895742416381836, "global_step": 225263, "epoch": 1340} {"train_loss": -11.674816131591797, "global_step": 225264, "epoch": 1340} {"train_loss": -11.967293739318848, "global_step": 225265, "epoch": 1340} {"train_loss": -11.575765609741211, "global_step": 225266, "epoch": 1340} {"train_loss": -11.855700492858887, "global_step": 225267, "epoch": 1340} {"train_loss": -11.923224449157715, "global_step": 225268, "epoch": 1340} {"train_loss": -11.885210037231445, "global_step": 225269, "epoch": 1340} {"train_loss": -11.953567504882812, "global_step": 225270, "epoch": 1340} {"train_loss": -11.797191619873047, "global_step": 225271, "epoch": 1340} {"train_loss": -11.872916221618652, "global_step": 225272, "epoch": 1340} {"train_loss": -12.012674331665039, "global_step": 225273, "epoch": 1340} {"train_loss": -11.974780082702637, "global_step": 225274, "epoch": 1340} {"train_loss": -11.895195960998535, "global_step": 225275, "epoch": 1340} {"train_loss": -11.998473167419434, "global_step": 225276, "epoch": 1340} {"train_loss": -12.028626441955566, "global_step": 225277, "epoch": 1340} {"train_loss": -12.056699752807617, "global_step": 225278, "epoch": 1340} {"train_loss": -12.063169479370117, "global_step": 225279, "epoch": 1340} {"train_loss": -12.00293254852295, "global_step": 225280, "epoch": 1340} {"train_loss": -11.837810516357422, "global_step": 225281, "epoch": 1340} {"train_loss": -11.862835884094238, "global_step": 225282, "epoch": 1340} {"train_loss": -11.704712867736816, "global_step": 225283, "epoch": 1340} {"train_loss": -11.975188255310059, "global_step": 225284, "epoch": 1340} {"train_loss": -11.584104537963867, "global_step": 225285, "epoch": 1340} {"train_loss": -11.960492134094238, "global_step": 225286, "epoch": 1340} {"train_loss": -11.508440250442142, "global_step": 225287, "epoch": 1340, "val_loss": 261515.75, "train_action_mse_error": 1.4687283039093018} {"train_loss": -12.174718856811523, "global_step": 225288, "epoch": 1341} {"train_loss": -11.81595230102539, "global_step": 225289, "epoch": 1341} {"train_loss": -12.116523742675781, "global_step": 225290, "epoch": 1341} {"train_loss": -11.94281005859375, "global_step": 225291, "epoch": 1341} {"train_loss": -12.113426208496094, "global_step": 225292, "epoch": 1341} {"train_loss": -11.864742279052734, "global_step": 225293, "epoch": 1341} {"train_loss": -11.912939071655273, "global_step": 225294, "epoch": 1341} {"train_loss": -11.913568496704102, "global_step": 225295, "epoch": 1341} {"train_loss": -12.074456214904785, "global_step": 225296, "epoch": 1341} {"train_loss": -11.754971504211426, "global_step": 225297, "epoch": 1341} {"train_loss": -11.97412109375, "global_step": 225298, "epoch": 1341} {"train_loss": -11.344593048095703, "global_step": 225299, "epoch": 1341} {"train_loss": -11.770761489868164, "global_step": 225300, "epoch": 1341} {"train_loss": -11.44854736328125, "global_step": 225301, "epoch": 1341} {"train_loss": -11.681350708007812, "global_step": 225302, "epoch": 1341} {"train_loss": -11.626801490783691, "global_step": 225303, "epoch": 1341} {"train_loss": -11.682408332824707, "global_step": 225304, "epoch": 1341} {"train_loss": -11.061511993408203, "global_step": 225305, "epoch": 1341} {"train_loss": -10.988239288330078, "global_step": 225306, "epoch": 1341} {"train_loss": -10.556681632995605, "global_step": 225307, "epoch": 1341} {"train_loss": -11.619171142578125, "global_step": 225308, "epoch": 1341} {"train_loss": -8.819269180297852, "global_step": 225309, "epoch": 1341} {"train_loss": -10.442712783813477, "global_step": 225310, "epoch": 1341} {"train_loss": -9.424837112426758, "global_step": 225311, "epoch": 1341} {"train_loss": -8.926817893981934, "global_step": 225312, "epoch": 1341} {"train_loss": -8.515729904174805, "global_step": 225313, "epoch": 1341} {"train_loss": -10.232660293579102, "global_step": 225314, "epoch": 1341} {"train_loss": -10.843135833740234, "global_step": 225315, "epoch": 1341} {"train_loss": -10.065693855285645, "global_step": 225316, "epoch": 1341} {"train_loss": -10.187294006347656, "global_step": 225317, "epoch": 1341} {"train_loss": -11.070243835449219, "global_step": 225318, "epoch": 1341} {"train_loss": -10.627586364746094, "global_step": 225319, "epoch": 1341} {"train_loss": -10.796660423278809, "global_step": 225320, "epoch": 1341} {"train_loss": -11.135229110717773, "global_step": 225321, "epoch": 1341} {"train_loss": -10.633867263793945, "global_step": 225322, "epoch": 1341} {"train_loss": -11.526920318603516, "global_step": 225323, "epoch": 1341} {"train_loss": -11.380919456481934, "global_step": 225324, "epoch": 1341} {"train_loss": -11.449430465698242, "global_step": 225325, "epoch": 1341} {"train_loss": -11.380563735961914, "global_step": 225326, "epoch": 1341} {"train_loss": -11.179641723632812, "global_step": 225327, "epoch": 1341} {"train_loss": -11.497254371643066, "global_step": 225328, "epoch": 1341} {"train_loss": -11.290985107421875, "global_step": 225329, "epoch": 1341} {"train_loss": -11.420784950256348, "global_step": 225330, "epoch": 1341} {"train_loss": -11.039987564086914, "global_step": 225331, "epoch": 1341} {"train_loss": -11.525924682617188, "global_step": 225332, "epoch": 1341} {"train_loss": -11.045347213745117, "global_step": 225333, "epoch": 1341} {"train_loss": -10.919034957885742, "global_step": 225334, "epoch": 1341} {"train_loss": -11.360285758972168, "global_step": 225335, "epoch": 1341} {"train_loss": -10.924952507019043, "global_step": 225336, "epoch": 1341} {"train_loss": -11.53002643585205, "global_step": 225337, "epoch": 1341} {"train_loss": -11.365217208862305, "global_step": 225338, "epoch": 1341} {"train_loss": -11.341543197631836, "global_step": 225339, "epoch": 1341} {"train_loss": -11.60205078125, "global_step": 225340, "epoch": 1341} {"train_loss": -11.455074310302734, "global_step": 225341, "epoch": 1341} {"train_loss": -11.385902404785156, "global_step": 225342, "epoch": 1341} {"train_loss": -11.626626968383789, "global_step": 225343, "epoch": 1341} {"train_loss": -11.721644401550293, "global_step": 225344, "epoch": 1341} {"train_loss": -11.547221183776855, "global_step": 225345, "epoch": 1341} {"train_loss": -11.891357421875, "global_step": 225346, "epoch": 1341} {"train_loss": -11.441524505615234, "global_step": 225347, "epoch": 1341} {"train_loss": -11.619344711303711, "global_step": 225348, "epoch": 1341} {"train_loss": -11.40818977355957, "global_step": 225349, "epoch": 1341} {"train_loss": -11.513093948364258, "global_step": 225350, "epoch": 1341} {"train_loss": -11.448150634765625, "global_step": 225351, "epoch": 1341} {"train_loss": -11.613924026489258, "global_step": 225352, "epoch": 1341} {"train_loss": -11.487013816833496, "global_step": 225353, "epoch": 1341} {"train_loss": -11.568202018737793, "global_step": 225354, "epoch": 1341} {"train_loss": -11.58581829071045, "global_step": 225355, "epoch": 1341} {"train_loss": -11.813665390014648, "global_step": 225356, "epoch": 1341} {"train_loss": -11.308061599731445, "global_step": 225357, "epoch": 1341} {"train_loss": -11.535323143005371, "global_step": 225358, "epoch": 1341} {"train_loss": -11.073892593383789, "global_step": 225359, "epoch": 1341} {"train_loss": -11.60940170288086, "global_step": 225360, "epoch": 1341} {"train_loss": -11.01701545715332, "global_step": 225361, "epoch": 1341} {"train_loss": -11.186187744140625, "global_step": 225362, "epoch": 1341} {"train_loss": -11.410822868347168, "global_step": 225363, "epoch": 1341} {"train_loss": -11.413431167602539, "global_step": 225364, "epoch": 1341} {"train_loss": -11.116964340209961, "global_step": 225365, "epoch": 1341} {"train_loss": -11.788476943969727, "global_step": 225366, "epoch": 1341} {"train_loss": -11.029969215393066, "global_step": 225367, "epoch": 1341} {"train_loss": -11.514798164367676, "global_step": 225368, "epoch": 1341} {"train_loss": -11.597308158874512, "global_step": 225369, "epoch": 1341} {"train_loss": -11.47488784790039, "global_step": 225370, "epoch": 1341} {"train_loss": -11.747415542602539, "global_step": 225371, "epoch": 1341} {"train_loss": -11.331573486328125, "global_step": 225372, "epoch": 1341} {"train_loss": -11.760738372802734, "global_step": 225373, "epoch": 1341} {"train_loss": -11.323759078979492, "global_step": 225374, "epoch": 1341} {"train_loss": -11.492027282714844, "global_step": 225375, "epoch": 1341} {"train_loss": -11.44656753540039, "global_step": 225376, "epoch": 1341} {"train_loss": -11.619782447814941, "global_step": 225377, "epoch": 1341} {"train_loss": -10.81520938873291, "global_step": 225378, "epoch": 1341} {"train_loss": -11.299125671386719, "global_step": 225379, "epoch": 1341} {"train_loss": -11.665342330932617, "global_step": 225380, "epoch": 1341} {"train_loss": -11.052863121032715, "global_step": 225381, "epoch": 1341} {"train_loss": -11.423717498779297, "global_step": 225382, "epoch": 1341} {"train_loss": -11.551666259765625, "global_step": 225383, "epoch": 1341} {"train_loss": -11.046390533447266, "global_step": 225384, "epoch": 1341} {"train_loss": -11.918806076049805, "global_step": 225385, "epoch": 1341} {"train_loss": -11.321355819702148, "global_step": 225386, "epoch": 1341} {"train_loss": -11.185548782348633, "global_step": 225387, "epoch": 1341} {"train_loss": -11.683171272277832, "global_step": 225388, "epoch": 1341} {"train_loss": -11.29078483581543, "global_step": 225389, "epoch": 1341} {"train_loss": -11.416521072387695, "global_step": 225390, "epoch": 1341} {"train_loss": -11.78628158569336, "global_step": 225391, "epoch": 1341} {"train_loss": -11.859025001525879, "global_step": 225392, "epoch": 1341} {"train_loss": -11.825337409973145, "global_step": 225393, "epoch": 1341} {"train_loss": -11.315595626831055, "global_step": 225394, "epoch": 1341} {"train_loss": -11.485946655273438, "global_step": 225395, "epoch": 1341} {"train_loss": -11.881513595581055, "global_step": 225396, "epoch": 1341} {"train_loss": -11.19072151184082, "global_step": 225397, "epoch": 1341} {"train_loss": -11.712841033935547, "global_step": 225398, "epoch": 1341} {"train_loss": -11.033266067504883, "global_step": 225399, "epoch": 1341} {"train_loss": -11.394217491149902, "global_step": 225400, "epoch": 1341} {"train_loss": -11.255658149719238, "global_step": 225401, "epoch": 1341} {"train_loss": -11.722047805786133, "global_step": 225402, "epoch": 1341} {"train_loss": -11.30963134765625, "global_step": 225403, "epoch": 1341} {"train_loss": -11.826093673706055, "global_step": 225404, "epoch": 1341} {"train_loss": -11.43277359008789, "global_step": 225405, "epoch": 1341} {"train_loss": -11.419568061828613, "global_step": 225406, "epoch": 1341} {"train_loss": -11.630533218383789, "global_step": 225407, "epoch": 1341} {"train_loss": -11.642634391784668, "global_step": 225408, "epoch": 1341} {"train_loss": -11.960439682006836, "global_step": 225409, "epoch": 1341} {"train_loss": -11.396448135375977, "global_step": 225410, "epoch": 1341} {"train_loss": -11.417682647705078, "global_step": 225411, "epoch": 1341} {"train_loss": -11.829803466796875, "global_step": 225412, "epoch": 1341} {"train_loss": -11.653682708740234, "global_step": 225413, "epoch": 1341} {"train_loss": -11.608100891113281, "global_step": 225414, "epoch": 1341} {"train_loss": -11.814750671386719, "global_step": 225415, "epoch": 1341} {"train_loss": -11.797353744506836, "global_step": 225416, "epoch": 1341} {"train_loss": -11.500414848327637, "global_step": 225417, "epoch": 1341} {"train_loss": -11.748519897460938, "global_step": 225418, "epoch": 1341} {"train_loss": -11.499820709228516, "global_step": 225419, "epoch": 1341} {"train_loss": -11.863101959228516, "global_step": 225420, "epoch": 1341} {"train_loss": -11.7220458984375, "global_step": 225421, "epoch": 1341} {"train_loss": -11.491609573364258, "global_step": 225422, "epoch": 1341} {"train_loss": -11.643400192260742, "global_step": 225423, "epoch": 1341} {"train_loss": -11.771300315856934, "global_step": 225424, "epoch": 1341} {"train_loss": -11.492744445800781, "global_step": 225425, "epoch": 1341} {"train_loss": -11.685920715332031, "global_step": 225426, "epoch": 1341} {"train_loss": -11.702461242675781, "global_step": 225427, "epoch": 1341} {"train_loss": -11.588197708129883, "global_step": 225428, "epoch": 1341} {"train_loss": -12.030643463134766, "global_step": 225429, "epoch": 1341} {"train_loss": -11.853265762329102, "global_step": 225430, "epoch": 1341} {"train_loss": -11.844310760498047, "global_step": 225431, "epoch": 1341} {"train_loss": -11.859898567199707, "global_step": 225432, "epoch": 1341} {"train_loss": -12.006525993347168, "global_step": 225433, "epoch": 1341} {"train_loss": -11.642444610595703, "global_step": 225434, "epoch": 1341} {"train_loss": -11.70552921295166, "global_step": 225435, "epoch": 1341} {"train_loss": -11.603630065917969, "global_step": 225436, "epoch": 1341} {"train_loss": -11.867051124572754, "global_step": 225437, "epoch": 1341} {"train_loss": -11.656442642211914, "global_step": 225438, "epoch": 1341} {"train_loss": -11.665538787841797, "global_step": 225439, "epoch": 1341} {"train_loss": -12.020330429077148, "global_step": 225440, "epoch": 1341} {"train_loss": -11.213874816894531, "global_step": 225441, "epoch": 1341} {"train_loss": -12.203014373779297, "global_step": 225442, "epoch": 1341} {"train_loss": -11.418004989624023, "global_step": 225443, "epoch": 1341} {"train_loss": -11.763566970825195, "global_step": 225444, "epoch": 1341} {"train_loss": -11.822299003601074, "global_step": 225445, "epoch": 1341} {"train_loss": -11.71434211730957, "global_step": 225446, "epoch": 1341} {"train_loss": -11.922591209411621, "global_step": 225447, "epoch": 1341} {"train_loss": -11.951507568359375, "global_step": 225448, "epoch": 1341} {"train_loss": -11.823513984680176, "global_step": 225449, "epoch": 1341} {"train_loss": -11.795888900756836, "global_step": 225450, "epoch": 1341} {"train_loss": -11.84665298461914, "global_step": 225451, "epoch": 1341} {"train_loss": -11.44175910949707, "global_step": 225452, "epoch": 1341} {"train_loss": -11.757875442504883, "global_step": 225453, "epoch": 1341} {"train_loss": -12.087501525878906, "global_step": 225454, "epoch": 1341} {"train_loss": -11.443465454237801, "global_step": 225455, "epoch": 1341, "val_loss": 259582.578125} {"train_loss": -11.476436614990234, "global_step": 225456, "epoch": 1342} {"train_loss": -11.612305641174316, "global_step": 225457, "epoch": 1342} {"train_loss": -11.799487113952637, "global_step": 225458, "epoch": 1342} {"train_loss": -11.898554801940918, "global_step": 225459, "epoch": 1342} {"train_loss": -11.750720024108887, "global_step": 225460, "epoch": 1342} {"train_loss": -11.301332473754883, "global_step": 225461, "epoch": 1342} {"train_loss": -11.868717193603516, "global_step": 225462, "epoch": 1342} {"train_loss": -11.441198348999023, "global_step": 225463, "epoch": 1342} {"train_loss": -10.940458297729492, "global_step": 225464, "epoch": 1342} {"train_loss": -11.298230171203613, "global_step": 225465, "epoch": 1342} {"train_loss": -11.831085205078125, "global_step": 225466, "epoch": 1342} {"train_loss": -11.55026912689209, "global_step": 225467, "epoch": 1342} {"train_loss": -11.217666625976562, "global_step": 225468, "epoch": 1342} {"train_loss": -11.791638374328613, "global_step": 225469, "epoch": 1342} {"train_loss": -11.462032318115234, "global_step": 225470, "epoch": 1342} {"train_loss": -11.53898811340332, "global_step": 225471, "epoch": 1342} {"train_loss": -11.060209274291992, "global_step": 225472, "epoch": 1342} {"train_loss": -11.162559509277344, "global_step": 225473, "epoch": 1342} {"train_loss": -10.927221298217773, "global_step": 225474, "epoch": 1342} {"train_loss": -10.001983642578125, "global_step": 225475, "epoch": 1342} {"train_loss": -9.857608795166016, "global_step": 225476, "epoch": 1342} {"train_loss": -10.174243927001953, "global_step": 225477, "epoch": 1342} {"train_loss": -9.614273071289062, "global_step": 225478, "epoch": 1342} {"train_loss": -8.402552604675293, "global_step": 225479, "epoch": 1342} {"train_loss": -11.607614517211914, "global_step": 225480, "epoch": 1342} {"train_loss": -9.648913383483887, "global_step": 225481, "epoch": 1342} {"train_loss": -10.533243179321289, "global_step": 225482, "epoch": 1342} {"train_loss": -9.921099662780762, "global_step": 225483, "epoch": 1342} {"train_loss": -9.576315879821777, "global_step": 225484, "epoch": 1342} {"train_loss": -11.36764144897461, "global_step": 225485, "epoch": 1342} {"train_loss": -9.897570610046387, "global_step": 225486, "epoch": 1342} {"train_loss": -10.854461669921875, "global_step": 225487, "epoch": 1342} {"train_loss": -9.577756881713867, "global_step": 225488, "epoch": 1342} {"train_loss": -9.449113845825195, "global_step": 225489, "epoch": 1342} {"train_loss": -10.75003719329834, "global_step": 225490, "epoch": 1342} {"train_loss": -10.105575561523438, "global_step": 225491, "epoch": 1342} {"train_loss": -10.281560897827148, "global_step": 225492, "epoch": 1342} {"train_loss": -11.198965072631836, "global_step": 225493, "epoch": 1342} {"train_loss": -10.397315979003906, "global_step": 225494, "epoch": 1342} {"train_loss": -11.363574981689453, "global_step": 225495, "epoch": 1342} {"train_loss": -11.002275466918945, "global_step": 225496, "epoch": 1342} {"train_loss": -11.317815780639648, "global_step": 225497, "epoch": 1342} {"train_loss": -10.804882049560547, "global_step": 225498, "epoch": 1342} {"train_loss": -10.191181182861328, "global_step": 225499, "epoch": 1342} {"train_loss": -11.415544509887695, "global_step": 225500, "epoch": 1342} {"train_loss": -9.9833984375, "global_step": 225501, "epoch": 1342} {"train_loss": -11.519331932067871, "global_step": 225502, "epoch": 1342} {"train_loss": -10.930322647094727, "global_step": 225503, "epoch": 1342} {"train_loss": -11.299129486083984, "global_step": 225504, "epoch": 1342} {"train_loss": -10.514242172241211, "global_step": 225505, "epoch": 1342} {"train_loss": -11.486804008483887, "global_step": 225506, "epoch": 1342} {"train_loss": -10.90613079071045, "global_step": 225507, "epoch": 1342} {"train_loss": -11.444061279296875, "global_step": 225508, "epoch": 1342} {"train_loss": -10.955198287963867, "global_step": 225509, "epoch": 1342} {"train_loss": -11.351381301879883, "global_step": 225510, "epoch": 1342} {"train_loss": -11.002445220947266, "global_step": 225511, "epoch": 1342} {"train_loss": -11.480847358703613, "global_step": 225512, "epoch": 1342} {"train_loss": -11.539885520935059, "global_step": 225513, "epoch": 1342} {"train_loss": -11.612204551696777, "global_step": 225514, "epoch": 1342} {"train_loss": -11.351763725280762, "global_step": 225515, "epoch": 1342} {"train_loss": -11.407410621643066, "global_step": 225516, "epoch": 1342} {"train_loss": -11.46841812133789, "global_step": 225517, "epoch": 1342} {"train_loss": -11.234668731689453, "global_step": 225518, "epoch": 1342} {"train_loss": -11.315629959106445, "global_step": 225519, "epoch": 1342} {"train_loss": -11.647867202758789, "global_step": 225520, "epoch": 1342} {"train_loss": -11.359987258911133, "global_step": 225521, "epoch": 1342} {"train_loss": -11.460509300231934, "global_step": 225522, "epoch": 1342} {"train_loss": -11.641866683959961, "global_step": 225523, "epoch": 1342} {"train_loss": -11.427498817443848, "global_step": 225524, "epoch": 1342} {"train_loss": -11.49006462097168, "global_step": 225525, "epoch": 1342} {"train_loss": -11.70409107208252, "global_step": 225526, "epoch": 1342} {"train_loss": -11.52903938293457, "global_step": 225527, "epoch": 1342} {"train_loss": -11.393791198730469, "global_step": 225528, "epoch": 1342} {"train_loss": -11.536186218261719, "global_step": 225529, "epoch": 1342} {"train_loss": -11.497501373291016, "global_step": 225530, "epoch": 1342} {"train_loss": -11.71317195892334, "global_step": 225531, "epoch": 1342} {"train_loss": -11.471395492553711, "global_step": 225532, "epoch": 1342} {"train_loss": -11.527463912963867, "global_step": 225533, "epoch": 1342} {"train_loss": -11.609519958496094, "global_step": 225534, "epoch": 1342} {"train_loss": -11.834527969360352, "global_step": 225535, "epoch": 1342} {"train_loss": -11.27835750579834, "global_step": 225536, "epoch": 1342} {"train_loss": -11.816507339477539, "global_step": 225537, "epoch": 1342} {"train_loss": -11.429590225219727, "global_step": 225538, "epoch": 1342} {"train_loss": -11.458379745483398, "global_step": 225539, "epoch": 1342} {"train_loss": -11.660473823547363, "global_step": 225540, "epoch": 1342} {"train_loss": -11.533388137817383, "global_step": 225541, "epoch": 1342} {"train_loss": -11.838621139526367, "global_step": 225542, "epoch": 1342} {"train_loss": -11.48550796508789, "global_step": 225543, "epoch": 1342} {"train_loss": -11.656307220458984, "global_step": 225544, "epoch": 1342} {"train_loss": -11.594804763793945, "global_step": 225545, "epoch": 1342} {"train_loss": -11.772693634033203, "global_step": 225546, "epoch": 1342} {"train_loss": -11.525938034057617, "global_step": 225547, "epoch": 1342} {"train_loss": -11.671869277954102, "global_step": 225548, "epoch": 1342} {"train_loss": -11.752192497253418, "global_step": 225549, "epoch": 1342} {"train_loss": -11.620677947998047, "global_step": 225550, "epoch": 1342} {"train_loss": -11.59000301361084, "global_step": 225551, "epoch": 1342} {"train_loss": -11.591483116149902, "global_step": 225552, "epoch": 1342} {"train_loss": -11.498476028442383, "global_step": 225553, "epoch": 1342} {"train_loss": -11.618038177490234, "global_step": 225554, "epoch": 1342} {"train_loss": -11.504064559936523, "global_step": 225555, "epoch": 1342} {"train_loss": -11.546141624450684, "global_step": 225556, "epoch": 1342} {"train_loss": -11.663032531738281, "global_step": 225557, "epoch": 1342} {"train_loss": -11.569440841674805, "global_step": 225558, "epoch": 1342} {"train_loss": -11.387365341186523, "global_step": 225559, "epoch": 1342} {"train_loss": -11.715497016906738, "global_step": 225560, "epoch": 1342} {"train_loss": -11.570761680603027, "global_step": 225561, "epoch": 1342} {"train_loss": -11.537572860717773, "global_step": 225562, "epoch": 1342} {"train_loss": -11.961187362670898, "global_step": 225563, "epoch": 1342} {"train_loss": -11.607083320617676, "global_step": 225564, "epoch": 1342} {"train_loss": -11.750500679016113, "global_step": 225565, "epoch": 1342} {"train_loss": -11.61900520324707, "global_step": 225566, "epoch": 1342} {"train_loss": -11.43730354309082, "global_step": 225567, "epoch": 1342} {"train_loss": -11.753600120544434, "global_step": 225568, "epoch": 1342} {"train_loss": -11.551212310791016, "global_step": 225569, "epoch": 1342} {"train_loss": -11.374263763427734, "global_step": 225570, "epoch": 1342} {"train_loss": -12.154268264770508, "global_step": 225571, "epoch": 1342} {"train_loss": -11.290218353271484, "global_step": 225572, "epoch": 1342} {"train_loss": -11.414978981018066, "global_step": 225573, "epoch": 1342} {"train_loss": -11.407529830932617, "global_step": 225574, "epoch": 1342} {"train_loss": -11.103292465209961, "global_step": 225575, "epoch": 1342} {"train_loss": -11.750476837158203, "global_step": 225576, "epoch": 1342} {"train_loss": -11.377605438232422, "global_step": 225577, "epoch": 1342} {"train_loss": -11.65147590637207, "global_step": 225578, "epoch": 1342} {"train_loss": -11.578847885131836, "global_step": 225579, "epoch": 1342} {"train_loss": -11.770341873168945, "global_step": 225580, "epoch": 1342} {"train_loss": -11.599337577819824, "global_step": 225581, "epoch": 1342} {"train_loss": -11.57368278503418, "global_step": 225582, "epoch": 1342} {"train_loss": -11.078618049621582, "global_step": 225583, "epoch": 1342} {"train_loss": -11.425938606262207, "global_step": 225584, "epoch": 1342} {"train_loss": -11.250907897949219, "global_step": 225585, "epoch": 1342} {"train_loss": -10.364994049072266, "global_step": 225586, "epoch": 1342} {"train_loss": -11.521796226501465, "global_step": 225587, "epoch": 1342} {"train_loss": -10.790972709655762, "global_step": 225588, "epoch": 1342} {"train_loss": -10.428342819213867, "global_step": 225589, "epoch": 1342} {"train_loss": -11.305355072021484, "global_step": 225590, "epoch": 1342} {"train_loss": -11.149900436401367, "global_step": 225591, "epoch": 1342} {"train_loss": -11.024219512939453, "global_step": 225592, "epoch": 1342} {"train_loss": -10.86069393157959, "global_step": 225593, "epoch": 1342} {"train_loss": -11.050362586975098, "global_step": 225594, "epoch": 1342} {"train_loss": -10.842598915100098, "global_step": 225595, "epoch": 1342} {"train_loss": -11.184131622314453, "global_step": 225596, "epoch": 1342} {"train_loss": -11.56584358215332, "global_step": 225597, "epoch": 1342} {"train_loss": -11.357083320617676, "global_step": 225598, "epoch": 1342} {"train_loss": -10.78731918334961, "global_step": 225599, "epoch": 1342} {"train_loss": -11.546744346618652, "global_step": 225600, "epoch": 1342} {"train_loss": -10.78222942352295, "global_step": 225601, "epoch": 1342} {"train_loss": -11.62669849395752, "global_step": 225602, "epoch": 1342} {"train_loss": -11.060941696166992, "global_step": 225603, "epoch": 1342} {"train_loss": -11.737393379211426, "global_step": 225604, "epoch": 1342} {"train_loss": -11.34926986694336, "global_step": 225605, "epoch": 1342} {"train_loss": -11.17470932006836, "global_step": 225606, "epoch": 1342} {"train_loss": -11.513504981994629, "global_step": 225607, "epoch": 1342} {"train_loss": -11.113618850708008, "global_step": 225608, "epoch": 1342} {"train_loss": -11.605449676513672, "global_step": 225609, "epoch": 1342} {"train_loss": -11.087811470031738, "global_step": 225610, "epoch": 1342} {"train_loss": -11.573434829711914, "global_step": 225611, "epoch": 1342} {"train_loss": -11.068267822265625, "global_step": 225612, "epoch": 1342} {"train_loss": -11.545578002929688, "global_step": 225613, "epoch": 1342} {"train_loss": -11.395974159240723, "global_step": 225614, "epoch": 1342} {"train_loss": -11.607208251953125, "global_step": 225615, "epoch": 1342} {"train_loss": -10.986565589904785, "global_step": 225616, "epoch": 1342} {"train_loss": -11.550666809082031, "global_step": 225617, "epoch": 1342} {"train_loss": -11.031946182250977, "global_step": 225618, "epoch": 1342} {"train_loss": -11.163491249084473, "global_step": 225619, "epoch": 1342} {"train_loss": -11.182632446289062, "global_step": 225620, "epoch": 1342} {"train_loss": -11.222867965698242, "global_step": 225621, "epoch": 1342} {"train_loss": -11.388423919677734, "global_step": 225622, "epoch": 1342} {"train_loss": -11.242239844231378, "global_step": 225623, "epoch": 1342, "val_loss": 260237.71875} {"train_loss": -11.122831344604492, "global_step": 225624, "epoch": 1343} {"train_loss": -11.098335266113281, "global_step": 225625, "epoch": 1343} {"train_loss": -11.079170227050781, "global_step": 225626, "epoch": 1343} {"train_loss": -10.7742338180542, "global_step": 225627, "epoch": 1343} {"train_loss": -11.035749435424805, "global_step": 225628, "epoch": 1343} {"train_loss": -10.85322380065918, "global_step": 225629, "epoch": 1343} {"train_loss": -11.593328475952148, "global_step": 225630, "epoch": 1343} {"train_loss": -10.568193435668945, "global_step": 225631, "epoch": 1343} {"train_loss": -11.224994659423828, "global_step": 225632, "epoch": 1343} {"train_loss": -11.001764297485352, "global_step": 225633, "epoch": 1343} {"train_loss": -11.10373306274414, "global_step": 225634, "epoch": 1343} {"train_loss": -10.857078552246094, "global_step": 225635, "epoch": 1343} {"train_loss": -11.070497512817383, "global_step": 225636, "epoch": 1343} {"train_loss": -11.064866065979004, "global_step": 225637, "epoch": 1343} {"train_loss": -11.078105926513672, "global_step": 225638, "epoch": 1343} {"train_loss": -11.540467262268066, "global_step": 225639, "epoch": 1343} {"train_loss": -11.359601974487305, "global_step": 225640, "epoch": 1343} {"train_loss": -11.106507301330566, "global_step": 225641, "epoch": 1343} {"train_loss": -11.502031326293945, "global_step": 225642, "epoch": 1343} {"train_loss": -11.615742683410645, "global_step": 225643, "epoch": 1343} {"train_loss": -11.368772506713867, "global_step": 225644, "epoch": 1343} {"train_loss": -11.694711685180664, "global_step": 225645, "epoch": 1343} {"train_loss": -11.399550437927246, "global_step": 225646, "epoch": 1343} {"train_loss": -11.543695449829102, "global_step": 225647, "epoch": 1343} {"train_loss": -11.528139114379883, "global_step": 225648, "epoch": 1343} {"train_loss": -11.680846214294434, "global_step": 225649, "epoch": 1343} {"train_loss": -11.4473295211792, "global_step": 225650, "epoch": 1343} {"train_loss": -11.519495010375977, "global_step": 225651, "epoch": 1343} {"train_loss": -11.368698120117188, "global_step": 225652, "epoch": 1343} {"train_loss": -11.643543243408203, "global_step": 225653, "epoch": 1343} {"train_loss": -11.593339920043945, "global_step": 225654, "epoch": 1343} {"train_loss": -11.57005500793457, "global_step": 225655, "epoch": 1343} {"train_loss": -11.631744384765625, "global_step": 225656, "epoch": 1343} {"train_loss": -11.546989440917969, "global_step": 225657, "epoch": 1343} {"train_loss": -11.549243927001953, "global_step": 225658, "epoch": 1343} {"train_loss": -11.571192741394043, "global_step": 225659, "epoch": 1343} {"train_loss": -11.729242324829102, "global_step": 225660, "epoch": 1343} {"train_loss": -11.635093688964844, "global_step": 225661, "epoch": 1343} {"train_loss": -11.769067764282227, "global_step": 225662, "epoch": 1343} {"train_loss": -11.640043258666992, "global_step": 225663, "epoch": 1343} {"train_loss": -11.700424194335938, "global_step": 225664, "epoch": 1343} {"train_loss": -11.80667495727539, "global_step": 225665, "epoch": 1343} {"train_loss": -11.602903366088867, "global_step": 225666, "epoch": 1343} {"train_loss": -11.949562072753906, "global_step": 225667, "epoch": 1343} {"train_loss": -11.861822128295898, "global_step": 225668, "epoch": 1343} {"train_loss": -11.676227569580078, "global_step": 225669, "epoch": 1343} {"train_loss": -11.872051239013672, "global_step": 225670, "epoch": 1343} {"train_loss": -11.73382568359375, "global_step": 225671, "epoch": 1343} {"train_loss": -11.959169387817383, "global_step": 225672, "epoch": 1343} {"train_loss": -11.805375099182129, "global_step": 225673, "epoch": 1343} {"train_loss": -11.775148391723633, "global_step": 225674, "epoch": 1343} {"train_loss": -11.728745460510254, "global_step": 225675, "epoch": 1343} {"train_loss": -11.859634399414062, "global_step": 225676, "epoch": 1343} {"train_loss": -12.090947151184082, "global_step": 225677, "epoch": 1343} {"train_loss": -11.799352645874023, "global_step": 225678, "epoch": 1343} {"train_loss": -11.819469451904297, "global_step": 225679, "epoch": 1343} {"train_loss": -11.936384201049805, "global_step": 225680, "epoch": 1343} {"train_loss": -11.921918869018555, "global_step": 225681, "epoch": 1343} {"train_loss": -11.86678695678711, "global_step": 225682, "epoch": 1343} {"train_loss": -12.079009056091309, "global_step": 225683, "epoch": 1343} {"train_loss": -11.825146675109863, "global_step": 225684, "epoch": 1343} {"train_loss": -11.903358459472656, "global_step": 225685, "epoch": 1343} {"train_loss": -11.912153244018555, "global_step": 225686, "epoch": 1343} {"train_loss": -11.928701400756836, "global_step": 225687, "epoch": 1343} {"train_loss": -11.960208892822266, "global_step": 225688, "epoch": 1343} {"train_loss": -11.931427001953125, "global_step": 225689, "epoch": 1343} {"train_loss": -11.988239288330078, "global_step": 225690, "epoch": 1343} {"train_loss": -12.040245056152344, "global_step": 225691, "epoch": 1343} {"train_loss": -12.036033630371094, "global_step": 225692, "epoch": 1343} {"train_loss": -12.024582862854004, "global_step": 225693, "epoch": 1343} {"train_loss": -11.86967658996582, "global_step": 225694, "epoch": 1343} {"train_loss": -12.141263961791992, "global_step": 225695, "epoch": 1343} {"train_loss": -12.109560012817383, "global_step": 225696, "epoch": 1343} {"train_loss": -11.848834991455078, "global_step": 225697, "epoch": 1343} {"train_loss": -12.05718994140625, "global_step": 225698, "epoch": 1343} {"train_loss": -12.082073211669922, "global_step": 225699, "epoch": 1343} {"train_loss": -12.10844612121582, "global_step": 225700, "epoch": 1343} {"train_loss": -12.083900451660156, "global_step": 225701, "epoch": 1343} {"train_loss": -11.865309715270996, "global_step": 225702, "epoch": 1343} {"train_loss": -12.087013244628906, "global_step": 225703, "epoch": 1343} {"train_loss": -12.042909622192383, "global_step": 225704, "epoch": 1343} {"train_loss": -11.987945556640625, "global_step": 225705, "epoch": 1343} {"train_loss": -11.914223670959473, "global_step": 225706, "epoch": 1343} {"train_loss": -11.995539665222168, "global_step": 225707, "epoch": 1343} {"train_loss": -11.984742164611816, "global_step": 225708, "epoch": 1343} {"train_loss": -11.575292587280273, "global_step": 225709, "epoch": 1343} {"train_loss": -9.985965728759766, "global_step": 225710, "epoch": 1343} {"train_loss": -9.91053581237793, "global_step": 225711, "epoch": 1343} {"train_loss": -11.318719863891602, "global_step": 225712, "epoch": 1343} {"train_loss": -10.613069534301758, "global_step": 225713, "epoch": 1343} {"train_loss": -9.685633659362793, "global_step": 225714, "epoch": 1343} {"train_loss": -10.296682357788086, "global_step": 225715, "epoch": 1343} {"train_loss": -10.89509105682373, "global_step": 225716, "epoch": 1343} {"train_loss": -9.541580200195312, "global_step": 225717, "epoch": 1343} {"train_loss": -8.619403839111328, "global_step": 225718, "epoch": 1343} {"train_loss": -10.679271697998047, "global_step": 225719, "epoch": 1343} {"train_loss": -10.114486694335938, "global_step": 225720, "epoch": 1343} {"train_loss": -9.377714157104492, "global_step": 225721, "epoch": 1343} {"train_loss": -11.051860809326172, "global_step": 225722, "epoch": 1343} {"train_loss": -9.95944595336914, "global_step": 225723, "epoch": 1343} {"train_loss": -10.601909637451172, "global_step": 225724, "epoch": 1343} {"train_loss": -10.752752304077148, "global_step": 225725, "epoch": 1343} {"train_loss": -10.833398818969727, "global_step": 225726, "epoch": 1343} {"train_loss": -11.07689094543457, "global_step": 225727, "epoch": 1343} {"train_loss": -10.91650104522705, "global_step": 225728, "epoch": 1343} {"train_loss": -10.48205280303955, "global_step": 225729, "epoch": 1343} {"train_loss": -10.48443603515625, "global_step": 225730, "epoch": 1343} {"train_loss": -10.82358169555664, "global_step": 225731, "epoch": 1343} {"train_loss": -10.74226188659668, "global_step": 225732, "epoch": 1343} {"train_loss": -11.122702598571777, "global_step": 225733, "epoch": 1343} {"train_loss": -11.183675765991211, "global_step": 225734, "epoch": 1343} {"train_loss": -10.97045612335205, "global_step": 225735, "epoch": 1343} {"train_loss": -10.960424423217773, "global_step": 225736, "epoch": 1343} {"train_loss": -11.198917388916016, "global_step": 225737, "epoch": 1343} {"train_loss": -11.059137344360352, "global_step": 225738, "epoch": 1343} {"train_loss": -11.016183853149414, "global_step": 225739, "epoch": 1343} {"train_loss": -11.213348388671875, "global_step": 225740, "epoch": 1343} {"train_loss": -11.591287612915039, "global_step": 225741, "epoch": 1343} {"train_loss": -11.224440574645996, "global_step": 225742, "epoch": 1343} {"train_loss": -11.426621437072754, "global_step": 225743, "epoch": 1343} {"train_loss": -11.287639617919922, "global_step": 225744, "epoch": 1343} {"train_loss": -11.556299209594727, "global_step": 225745, "epoch": 1343} {"train_loss": -11.576814651489258, "global_step": 225746, "epoch": 1343} {"train_loss": -11.490602493286133, "global_step": 225747, "epoch": 1343} {"train_loss": -11.2870512008667, "global_step": 225748, "epoch": 1343} {"train_loss": -11.49760627746582, "global_step": 225749, "epoch": 1343} {"train_loss": -11.590112686157227, "global_step": 225750, "epoch": 1343} {"train_loss": -11.277284622192383, "global_step": 225751, "epoch": 1343} {"train_loss": -11.557374000549316, "global_step": 225752, "epoch": 1343} {"train_loss": -11.68053150177002, "global_step": 225753, "epoch": 1343} {"train_loss": -11.689252853393555, "global_step": 225754, "epoch": 1343} {"train_loss": -11.668846130371094, "global_step": 225755, "epoch": 1343} {"train_loss": -11.629804611206055, "global_step": 225756, "epoch": 1343} {"train_loss": -11.679108619689941, "global_step": 225757, "epoch": 1343} {"train_loss": -11.73466682434082, "global_step": 225758, "epoch": 1343} {"train_loss": -11.61268138885498, "global_step": 225759, "epoch": 1343} {"train_loss": -11.70849609375, "global_step": 225760, "epoch": 1343} {"train_loss": -11.618645668029785, "global_step": 225761, "epoch": 1343} {"train_loss": -11.716339111328125, "global_step": 225762, "epoch": 1343} {"train_loss": -11.611072540283203, "global_step": 225763, "epoch": 1343} {"train_loss": -11.85274887084961, "global_step": 225764, "epoch": 1343} {"train_loss": -11.576160430908203, "global_step": 225765, "epoch": 1343} {"train_loss": -11.541410446166992, "global_step": 225766, "epoch": 1343} {"train_loss": -11.719194412231445, "global_step": 225767, "epoch": 1343} {"train_loss": -11.764484405517578, "global_step": 225768, "epoch": 1343} {"train_loss": -11.939634323120117, "global_step": 225769, "epoch": 1343} {"train_loss": -11.676605224609375, "global_step": 225770, "epoch": 1343} {"train_loss": -11.654341697692871, "global_step": 225771, "epoch": 1343} {"train_loss": -11.793316841125488, "global_step": 225772, "epoch": 1343} {"train_loss": -11.655685424804688, "global_step": 225773, "epoch": 1343} {"train_loss": -11.816553115844727, "global_step": 225774, "epoch": 1343} {"train_loss": -11.96140193939209, "global_step": 225775, "epoch": 1343} {"train_loss": -11.86955451965332, "global_step": 225776, "epoch": 1343} {"train_loss": -12.1011962890625, "global_step": 225777, "epoch": 1343} {"train_loss": -11.906257629394531, "global_step": 225778, "epoch": 1343} {"train_loss": -12.01065444946289, "global_step": 225779, "epoch": 1343} {"train_loss": -11.710762977600098, "global_step": 225780, "epoch": 1343} {"train_loss": -11.945274353027344, "global_step": 225781, "epoch": 1343} {"train_loss": -12.073575973510742, "global_step": 225782, "epoch": 1343} {"train_loss": -12.090055465698242, "global_step": 225783, "epoch": 1343} {"train_loss": -11.981679916381836, "global_step": 225784, "epoch": 1343} {"train_loss": -12.295303344726562, "global_step": 225785, "epoch": 1343} {"train_loss": -12.169088363647461, "global_step": 225786, "epoch": 1343} {"train_loss": -11.85575008392334, "global_step": 225787, "epoch": 1343} {"train_loss": -11.90287971496582, "global_step": 225788, "epoch": 1343} {"train_loss": -11.948864936828613, "global_step": 225789, "epoch": 1343} {"train_loss": -12.17182731628418, "global_step": 225790, "epoch": 1343} {"train_loss": -11.47987403188433, "global_step": 225791, "epoch": 1343, "val_loss": 262464.0625} {"train_loss": -11.734556198120117, "global_step": 225792, "epoch": 1344} {"train_loss": -11.910350799560547, "global_step": 225793, "epoch": 1344} {"train_loss": -11.956222534179688, "global_step": 225794, "epoch": 1344} {"train_loss": -11.80340576171875, "global_step": 225795, "epoch": 1344} {"train_loss": -11.608363151550293, "global_step": 225796, "epoch": 1344} {"train_loss": -11.665388107299805, "global_step": 225797, "epoch": 1344} {"train_loss": -11.727245330810547, "global_step": 225798, "epoch": 1344} {"train_loss": -11.913125991821289, "global_step": 225799, "epoch": 1344} {"train_loss": -11.264749526977539, "global_step": 225800, "epoch": 1344} {"train_loss": -11.412653923034668, "global_step": 225801, "epoch": 1344} {"train_loss": -11.606273651123047, "global_step": 225802, "epoch": 1344} {"train_loss": -11.625866889953613, "global_step": 225803, "epoch": 1344} {"train_loss": -10.38170051574707, "global_step": 225804, "epoch": 1344} {"train_loss": -10.263923645019531, "global_step": 225805, "epoch": 1344} {"train_loss": -11.140791893005371, "global_step": 225806, "epoch": 1344} {"train_loss": -10.555190086364746, "global_step": 225807, "epoch": 1344} {"train_loss": -11.264527320861816, "global_step": 225808, "epoch": 1344} {"train_loss": -10.535387992858887, "global_step": 225809, "epoch": 1344} {"train_loss": -10.673982620239258, "global_step": 225810, "epoch": 1344} {"train_loss": -11.434661865234375, "global_step": 225811, "epoch": 1344} {"train_loss": -10.996206283569336, "global_step": 225812, "epoch": 1344} {"train_loss": -10.58448600769043, "global_step": 225813, "epoch": 1344} {"train_loss": -11.410537719726562, "global_step": 225814, "epoch": 1344} {"train_loss": -10.598373413085938, "global_step": 225815, "epoch": 1344} {"train_loss": -10.585163116455078, "global_step": 225816, "epoch": 1344} {"train_loss": -11.741147994995117, "global_step": 225817, "epoch": 1344} {"train_loss": -10.321075439453125, "global_step": 225818, "epoch": 1344} {"train_loss": -11.52964973449707, "global_step": 225819, "epoch": 1344} {"train_loss": -10.402145385742188, "global_step": 225820, "epoch": 1344} {"train_loss": -10.47886848449707, "global_step": 225821, "epoch": 1344} {"train_loss": -10.190059661865234, "global_step": 225822, "epoch": 1344} {"train_loss": -10.093204498291016, "global_step": 225823, "epoch": 1344} {"train_loss": -10.88127326965332, "global_step": 225824, "epoch": 1344} {"train_loss": -9.439455032348633, "global_step": 225825, "epoch": 1344} {"train_loss": -10.05112075805664, "global_step": 225826, "epoch": 1344} {"train_loss": -9.746374130249023, "global_step": 225827, "epoch": 1344} {"train_loss": -10.5245361328125, "global_step": 225828, "epoch": 1344} {"train_loss": -9.617498397827148, "global_step": 225829, "epoch": 1344} {"train_loss": -10.238506317138672, "global_step": 225830, "epoch": 1344} {"train_loss": -9.754294395446777, "global_step": 225831, "epoch": 1344} {"train_loss": -10.334115982055664, "global_step": 225832, "epoch": 1344} {"train_loss": -10.002225875854492, "global_step": 225833, "epoch": 1344} {"train_loss": -9.770662307739258, "global_step": 225834, "epoch": 1344} {"train_loss": -10.919668197631836, "global_step": 225835, "epoch": 1344} {"train_loss": -10.607451438903809, "global_step": 225836, "epoch": 1344} {"train_loss": -10.322408676147461, "global_step": 225837, "epoch": 1344} {"train_loss": -11.515458106994629, "global_step": 225838, "epoch": 1344} {"train_loss": -10.819589614868164, "global_step": 225839, "epoch": 1344} {"train_loss": -11.124853134155273, "global_step": 225840, "epoch": 1344} {"train_loss": -11.251556396484375, "global_step": 225841, "epoch": 1344} {"train_loss": -10.935548782348633, "global_step": 225842, "epoch": 1344} {"train_loss": -11.310783386230469, "global_step": 225843, "epoch": 1344} {"train_loss": -11.176817893981934, "global_step": 225844, "epoch": 1344} {"train_loss": -11.405652046203613, "global_step": 225845, "epoch": 1344} {"train_loss": -11.16286849975586, "global_step": 225846, "epoch": 1344} {"train_loss": -11.376520156860352, "global_step": 225847, "epoch": 1344} {"train_loss": -11.412505149841309, "global_step": 225848, "epoch": 1344} {"train_loss": -11.28640365600586, "global_step": 225849, "epoch": 1344} {"train_loss": -11.203229904174805, "global_step": 225850, "epoch": 1344} {"train_loss": -11.369207382202148, "global_step": 225851, "epoch": 1344} {"train_loss": -11.474836349487305, "global_step": 225852, "epoch": 1344} {"train_loss": -11.450241088867188, "global_step": 225853, "epoch": 1344} {"train_loss": -11.388486862182617, "global_step": 225854, "epoch": 1344} {"train_loss": -11.351768493652344, "global_step": 225855, "epoch": 1344} {"train_loss": -11.300867080688477, "global_step": 225856, "epoch": 1344} {"train_loss": -11.445720672607422, "global_step": 225857, "epoch": 1344} {"train_loss": -11.130806922912598, "global_step": 225858, "epoch": 1344} {"train_loss": -11.369888305664062, "global_step": 225859, "epoch": 1344} {"train_loss": -11.211280822753906, "global_step": 225860, "epoch": 1344} {"train_loss": -11.487396240234375, "global_step": 225861, "epoch": 1344} {"train_loss": -11.196776390075684, "global_step": 225862, "epoch": 1344} {"train_loss": -11.609628677368164, "global_step": 225863, "epoch": 1344} {"train_loss": -11.54238510131836, "global_step": 225864, "epoch": 1344} {"train_loss": -11.371779441833496, "global_step": 225865, "epoch": 1344} {"train_loss": -11.58029556274414, "global_step": 225866, "epoch": 1344} {"train_loss": -11.31614875793457, "global_step": 225867, "epoch": 1344} {"train_loss": -11.629230499267578, "global_step": 225868, "epoch": 1344} {"train_loss": -11.316509246826172, "global_step": 225869, "epoch": 1344} {"train_loss": -11.586036682128906, "global_step": 225870, "epoch": 1344} {"train_loss": -11.514341354370117, "global_step": 225871, "epoch": 1344} {"train_loss": -11.553788185119629, "global_step": 225872, "epoch": 1344} {"train_loss": -11.569011688232422, "global_step": 225873, "epoch": 1344} {"train_loss": -11.57640266418457, "global_step": 225874, "epoch": 1344} {"train_loss": -11.586772918701172, "global_step": 225875, "epoch": 1344} {"train_loss": -11.600713729858398, "global_step": 225876, "epoch": 1344} {"train_loss": -12.043034553527832, "global_step": 225877, "epoch": 1344} {"train_loss": -11.618114471435547, "global_step": 225878, "epoch": 1344} {"train_loss": -11.575794219970703, "global_step": 225879, "epoch": 1344} {"train_loss": -11.855772018432617, "global_step": 225880, "epoch": 1344} {"train_loss": -11.789470672607422, "global_step": 225881, "epoch": 1344} {"train_loss": -11.795351028442383, "global_step": 225882, "epoch": 1344} {"train_loss": -11.89750862121582, "global_step": 225883, "epoch": 1344} {"train_loss": -11.934198379516602, "global_step": 225884, "epoch": 1344} {"train_loss": -11.732706069946289, "global_step": 225885, "epoch": 1344} {"train_loss": -11.869379997253418, "global_step": 225886, "epoch": 1344} {"train_loss": -11.582891464233398, "global_step": 225887, "epoch": 1344} {"train_loss": -11.628226280212402, "global_step": 225888, "epoch": 1344} {"train_loss": -11.988338470458984, "global_step": 225889, "epoch": 1344} {"train_loss": -11.63421630859375, "global_step": 225890, "epoch": 1344} {"train_loss": -11.894832611083984, "global_step": 225891, "epoch": 1344} {"train_loss": -11.72474479675293, "global_step": 225892, "epoch": 1344} {"train_loss": -11.890033721923828, "global_step": 225893, "epoch": 1344} {"train_loss": -11.857831001281738, "global_step": 225894, "epoch": 1344} {"train_loss": -11.942105293273926, "global_step": 225895, "epoch": 1344} {"train_loss": -11.89025592803955, "global_step": 225896, "epoch": 1344} {"train_loss": -11.959403991699219, "global_step": 225897, "epoch": 1344} {"train_loss": -11.806608200073242, "global_step": 225898, "epoch": 1344} {"train_loss": -11.85335636138916, "global_step": 225899, "epoch": 1344} {"train_loss": -11.223494529724121, "global_step": 225900, "epoch": 1344} {"train_loss": -11.779611587524414, "global_step": 225901, "epoch": 1344} {"train_loss": -11.388469696044922, "global_step": 225902, "epoch": 1344} {"train_loss": -11.652495384216309, "global_step": 225903, "epoch": 1344} {"train_loss": -11.677457809448242, "global_step": 225904, "epoch": 1344} {"train_loss": -11.554615020751953, "global_step": 225905, "epoch": 1344} {"train_loss": -11.429962158203125, "global_step": 225906, "epoch": 1344} {"train_loss": -11.893434524536133, "global_step": 225907, "epoch": 1344} {"train_loss": -11.793854713439941, "global_step": 225908, "epoch": 1344} {"train_loss": -11.735198974609375, "global_step": 225909, "epoch": 1344} {"train_loss": -11.341202735900879, "global_step": 225910, "epoch": 1344} {"train_loss": -12.001718521118164, "global_step": 225911, "epoch": 1344} {"train_loss": -11.738853454589844, "global_step": 225912, "epoch": 1344} {"train_loss": -11.364752769470215, "global_step": 225913, "epoch": 1344} {"train_loss": -11.633502960205078, "global_step": 225914, "epoch": 1344} {"train_loss": -11.620018005371094, "global_step": 225915, "epoch": 1344} {"train_loss": -11.37636947631836, "global_step": 225916, "epoch": 1344} {"train_loss": -11.112730026245117, "global_step": 225917, "epoch": 1344} {"train_loss": -11.750267028808594, "global_step": 225918, "epoch": 1344} {"train_loss": -10.515950202941895, "global_step": 225919, "epoch": 1344} {"train_loss": -9.557955741882324, "global_step": 225920, "epoch": 1344} {"train_loss": -11.419246673583984, "global_step": 225921, "epoch": 1344} {"train_loss": -8.58945083618164, "global_step": 225922, "epoch": 1344} {"train_loss": -7.732630729675293, "global_step": 225923, "epoch": 1344} {"train_loss": -8.591297149658203, "global_step": 225924, "epoch": 1344} {"train_loss": -10.473945617675781, "global_step": 225925, "epoch": 1344} {"train_loss": -7.166544437408447, "global_step": 225926, "epoch": 1344} {"train_loss": -9.191730499267578, "global_step": 225927, "epoch": 1344} {"train_loss": -9.679359436035156, "global_step": 225928, "epoch": 1344} {"train_loss": -10.331929206848145, "global_step": 225929, "epoch": 1344} {"train_loss": -9.336633682250977, "global_step": 225930, "epoch": 1344} {"train_loss": -10.730195999145508, "global_step": 225931, "epoch": 1344} {"train_loss": -9.936772346496582, "global_step": 225932, "epoch": 1344} {"train_loss": -10.698005676269531, "global_step": 225933, "epoch": 1344} {"train_loss": -10.30815315246582, "global_step": 225934, "epoch": 1344} {"train_loss": -10.681888580322266, "global_step": 225935, "epoch": 1344} {"train_loss": -10.371676445007324, "global_step": 225936, "epoch": 1344} {"train_loss": -10.316606521606445, "global_step": 225937, "epoch": 1344} {"train_loss": -10.803176879882812, "global_step": 225938, "epoch": 1344} {"train_loss": -10.532073974609375, "global_step": 225939, "epoch": 1344} {"train_loss": -10.75239086151123, "global_step": 225940, "epoch": 1344} {"train_loss": -10.82837200164795, "global_step": 225941, "epoch": 1344} {"train_loss": -10.607667922973633, "global_step": 225942, "epoch": 1344} {"train_loss": -11.064924240112305, "global_step": 225943, "epoch": 1344} {"train_loss": -10.910154342651367, "global_step": 225944, "epoch": 1344} {"train_loss": -11.083284378051758, "global_step": 225945, "epoch": 1344} {"train_loss": -10.901144027709961, "global_step": 225946, "epoch": 1344} {"train_loss": -11.166961669921875, "global_step": 225947, "epoch": 1344} {"train_loss": -11.041458129882812, "global_step": 225948, "epoch": 1344} {"train_loss": -11.413837432861328, "global_step": 225949, "epoch": 1344} {"train_loss": -10.799384117126465, "global_step": 225950, "epoch": 1344} {"train_loss": -11.338397979736328, "global_step": 225951, "epoch": 1344} {"train_loss": -11.086999893188477, "global_step": 225952, "epoch": 1344} {"train_loss": -11.171480178833008, "global_step": 225953, "epoch": 1344} {"train_loss": -11.535957336425781, "global_step": 225954, "epoch": 1344} {"train_loss": -10.972320556640625, "global_step": 225955, "epoch": 1344} {"train_loss": -11.50352668762207, "global_step": 225956, "epoch": 1344} {"train_loss": -11.27640151977539, "global_step": 225957, "epoch": 1344} {"train_loss": -11.404895782470703, "global_step": 225958, "epoch": 1344} {"train_loss": -11.083758623827071, "global_step": 225959, "epoch": 1344, "val_loss": 253349.703125} {"train_loss": -11.5072660446167, "global_step": 225960, "epoch": 1345} {"train_loss": -11.251551628112793, "global_step": 225961, "epoch": 1345} {"train_loss": -11.197513580322266, "global_step": 225962, "epoch": 1345} {"train_loss": -11.343445777893066, "global_step": 225963, "epoch": 1345} {"train_loss": -11.383563995361328, "global_step": 225964, "epoch": 1345} {"train_loss": -11.703277587890625, "global_step": 225965, "epoch": 1345} {"train_loss": -11.190216064453125, "global_step": 225966, "epoch": 1345} {"train_loss": -11.565923690795898, "global_step": 225967, "epoch": 1345} {"train_loss": -11.327116012573242, "global_step": 225968, "epoch": 1345} {"train_loss": -11.66242790222168, "global_step": 225969, "epoch": 1345} {"train_loss": -11.360876083374023, "global_step": 225970, "epoch": 1345} {"train_loss": -11.657265663146973, "global_step": 225971, "epoch": 1345} {"train_loss": -11.400195121765137, "global_step": 225972, "epoch": 1345} {"train_loss": -11.377256393432617, "global_step": 225973, "epoch": 1345} {"train_loss": -11.546998977661133, "global_step": 225974, "epoch": 1345} {"train_loss": -11.430098533630371, "global_step": 225975, "epoch": 1345} {"train_loss": -11.451648712158203, "global_step": 225976, "epoch": 1345} {"train_loss": -11.357110023498535, "global_step": 225977, "epoch": 1345} {"train_loss": -11.546091079711914, "global_step": 225978, "epoch": 1345} {"train_loss": -11.28988265991211, "global_step": 225979, "epoch": 1345} {"train_loss": -11.630118370056152, "global_step": 225980, "epoch": 1345} {"train_loss": -10.992231369018555, "global_step": 225981, "epoch": 1345} {"train_loss": -11.568248748779297, "global_step": 225982, "epoch": 1345} {"train_loss": -11.198423385620117, "global_step": 225983, "epoch": 1345} {"train_loss": -11.59666633605957, "global_step": 225984, "epoch": 1345} {"train_loss": -11.234729766845703, "global_step": 225985, "epoch": 1345} {"train_loss": -11.606760025024414, "global_step": 225986, "epoch": 1345} {"train_loss": -10.885507583618164, "global_step": 225987, "epoch": 1345} {"train_loss": -11.528316497802734, "global_step": 225988, "epoch": 1345} {"train_loss": -11.041479110717773, "global_step": 225989, "epoch": 1345} {"train_loss": -11.665319442749023, "global_step": 225990, "epoch": 1345} {"train_loss": -11.364404678344727, "global_step": 225991, "epoch": 1345} {"train_loss": -11.421730041503906, "global_step": 225992, "epoch": 1345} {"train_loss": -11.212437629699707, "global_step": 225993, "epoch": 1345} {"train_loss": -11.243789672851562, "global_step": 225994, "epoch": 1345} {"train_loss": -11.185893058776855, "global_step": 225995, "epoch": 1345} {"train_loss": -11.889924049377441, "global_step": 225996, "epoch": 1345} {"train_loss": -11.14225959777832, "global_step": 225997, "epoch": 1345} {"train_loss": -11.774459838867188, "global_step": 225998, "epoch": 1345} {"train_loss": -11.614400863647461, "global_step": 225999, "epoch": 1345} {"train_loss": -11.640544891357422, "global_step": 226000, "epoch": 1345} {"train_loss": -11.855813980102539, "global_step": 226001, "epoch": 1345} {"train_loss": -11.851911544799805, "global_step": 226002, "epoch": 1345} {"train_loss": -11.786585807800293, "global_step": 226003, "epoch": 1345} {"train_loss": -11.484541893005371, "global_step": 226004, "epoch": 1345} {"train_loss": -11.647855758666992, "global_step": 226005, "epoch": 1345} {"train_loss": -11.774468421936035, "global_step": 226006, "epoch": 1345} {"train_loss": -11.769001007080078, "global_step": 226007, "epoch": 1345} {"train_loss": -12.00052547454834, "global_step": 226008, "epoch": 1345} {"train_loss": -11.6856689453125, "global_step": 226009, "epoch": 1345} {"train_loss": -12.067392349243164, "global_step": 226010, "epoch": 1345} {"train_loss": -11.720184326171875, "global_step": 226011, "epoch": 1345} {"train_loss": -11.850854873657227, "global_step": 226012, "epoch": 1345} {"train_loss": -11.750539779663086, "global_step": 226013, "epoch": 1345} {"train_loss": -11.876775741577148, "global_step": 226014, "epoch": 1345} {"train_loss": -11.697205543518066, "global_step": 226015, "epoch": 1345} {"train_loss": -11.837240219116211, "global_step": 226016, "epoch": 1345} {"train_loss": -11.837409973144531, "global_step": 226017, "epoch": 1345} {"train_loss": -11.982001304626465, "global_step": 226018, "epoch": 1345} {"train_loss": -11.90587043762207, "global_step": 226019, "epoch": 1345} {"train_loss": -11.718557357788086, "global_step": 226020, "epoch": 1345} {"train_loss": -11.991945266723633, "global_step": 226021, "epoch": 1345} {"train_loss": -11.929054260253906, "global_step": 226022, "epoch": 1345} {"train_loss": -11.542964935302734, "global_step": 226023, "epoch": 1345} {"train_loss": -12.153831481933594, "global_step": 226024, "epoch": 1345} {"train_loss": -11.95492935180664, "global_step": 226025, "epoch": 1345} {"train_loss": -11.575580596923828, "global_step": 226026, "epoch": 1345} {"train_loss": -11.515414237976074, "global_step": 226027, "epoch": 1345} {"train_loss": -11.824865341186523, "global_step": 226028, "epoch": 1345} {"train_loss": -11.902667999267578, "global_step": 226029, "epoch": 1345} {"train_loss": -11.537629127502441, "global_step": 226030, "epoch": 1345} {"train_loss": -11.637613296508789, "global_step": 226031, "epoch": 1345} {"train_loss": -11.900232315063477, "global_step": 226032, "epoch": 1345} {"train_loss": -11.952808380126953, "global_step": 226033, "epoch": 1345} {"train_loss": -11.888875961303711, "global_step": 226034, "epoch": 1345} {"train_loss": -11.68145751953125, "global_step": 226035, "epoch": 1345} {"train_loss": -11.490278244018555, "global_step": 226036, "epoch": 1345} {"train_loss": -11.405460357666016, "global_step": 226037, "epoch": 1345} {"train_loss": -11.619091033935547, "global_step": 226038, "epoch": 1345} {"train_loss": -11.327323913574219, "global_step": 226039, "epoch": 1345} {"train_loss": -11.766155242919922, "global_step": 226040, "epoch": 1345} {"train_loss": -11.214015007019043, "global_step": 226041, "epoch": 1345} {"train_loss": -10.975517272949219, "global_step": 226042, "epoch": 1345} {"train_loss": -11.6810884475708, "global_step": 226043, "epoch": 1345} {"train_loss": -11.181997299194336, "global_step": 226044, "epoch": 1345} {"train_loss": -11.414337158203125, "global_step": 226045, "epoch": 1345} {"train_loss": -11.17692756652832, "global_step": 226046, "epoch": 1345} {"train_loss": -11.386816024780273, "global_step": 226047, "epoch": 1345} {"train_loss": -10.84101676940918, "global_step": 226048, "epoch": 1345} {"train_loss": -10.984293937683105, "global_step": 226049, "epoch": 1345} {"train_loss": -9.038562774658203, "global_step": 226050, "epoch": 1345} {"train_loss": -11.505590438842773, "global_step": 226051, "epoch": 1345} {"train_loss": -9.901359558105469, "global_step": 226052, "epoch": 1345} {"train_loss": -11.187082290649414, "global_step": 226053, "epoch": 1345} {"train_loss": -10.41553020477295, "global_step": 226054, "epoch": 1345} {"train_loss": -10.874235153198242, "global_step": 226055, "epoch": 1345} {"train_loss": -10.018913269042969, "global_step": 226056, "epoch": 1345} {"train_loss": -10.476651191711426, "global_step": 226057, "epoch": 1345} {"train_loss": -10.659435272216797, "global_step": 226058, "epoch": 1345} {"train_loss": -10.335744857788086, "global_step": 226059, "epoch": 1345} {"train_loss": -11.749731063842773, "global_step": 226060, "epoch": 1345} {"train_loss": -10.271734237670898, "global_step": 226061, "epoch": 1345} {"train_loss": -11.548738479614258, "global_step": 226062, "epoch": 1345} {"train_loss": -10.999639511108398, "global_step": 226063, "epoch": 1345} {"train_loss": -10.83691692352295, "global_step": 226064, "epoch": 1345} {"train_loss": -11.431829452514648, "global_step": 226065, "epoch": 1345} {"train_loss": -10.261962890625, "global_step": 226066, "epoch": 1345} {"train_loss": -11.597430229187012, "global_step": 226067, "epoch": 1345} {"train_loss": -10.628986358642578, "global_step": 226068, "epoch": 1345} {"train_loss": -10.78752613067627, "global_step": 226069, "epoch": 1345} {"train_loss": -11.204813003540039, "global_step": 226070, "epoch": 1345} {"train_loss": -10.64334487915039, "global_step": 226071, "epoch": 1345} {"train_loss": -10.785642623901367, "global_step": 226072, "epoch": 1345} {"train_loss": -10.68604850769043, "global_step": 226073, "epoch": 1345} {"train_loss": -11.065679550170898, "global_step": 226074, "epoch": 1345} {"train_loss": -10.536107063293457, "global_step": 226075, "epoch": 1345} {"train_loss": -11.29051399230957, "global_step": 226076, "epoch": 1345} {"train_loss": -10.650100708007812, "global_step": 226077, "epoch": 1345} {"train_loss": -11.416149139404297, "global_step": 226078, "epoch": 1345} {"train_loss": -10.985742568969727, "global_step": 226079, "epoch": 1345} {"train_loss": -11.605018615722656, "global_step": 226080, "epoch": 1345} {"train_loss": -11.177207946777344, "global_step": 226081, "epoch": 1345} {"train_loss": -11.0260009765625, "global_step": 226082, "epoch": 1345} {"train_loss": -11.526283264160156, "global_step": 226083, "epoch": 1345} {"train_loss": -11.303104400634766, "global_step": 226084, "epoch": 1345} {"train_loss": -11.296897888183594, "global_step": 226085, "epoch": 1345} {"train_loss": -11.339312553405762, "global_step": 226086, "epoch": 1345} {"train_loss": -10.730997085571289, "global_step": 226087, "epoch": 1345} {"train_loss": -11.428899765014648, "global_step": 226088, "epoch": 1345} {"train_loss": -11.255853652954102, "global_step": 226089, "epoch": 1345} {"train_loss": -11.350822448730469, "global_step": 226090, "epoch": 1345} {"train_loss": -11.477368354797363, "global_step": 226091, "epoch": 1345} {"train_loss": -11.291772842407227, "global_step": 226092, "epoch": 1345} {"train_loss": -11.615646362304688, "global_step": 226093, "epoch": 1345} {"train_loss": -11.547011375427246, "global_step": 226094, "epoch": 1345} {"train_loss": -11.526150703430176, "global_step": 226095, "epoch": 1345} {"train_loss": -11.714061737060547, "global_step": 226096, "epoch": 1345} {"train_loss": -11.628564834594727, "global_step": 226097, "epoch": 1345} {"train_loss": -11.590261459350586, "global_step": 226098, "epoch": 1345} {"train_loss": -11.6148099899292, "global_step": 226099, "epoch": 1345} {"train_loss": -11.496258735656738, "global_step": 226100, "epoch": 1345} {"train_loss": -11.464305877685547, "global_step": 226101, "epoch": 1345} {"train_loss": -11.329496383666992, "global_step": 226102, "epoch": 1345} {"train_loss": -11.590768814086914, "global_step": 226103, "epoch": 1345} {"train_loss": -11.502388000488281, "global_step": 226104, "epoch": 1345} {"train_loss": -11.315757751464844, "global_step": 226105, "epoch": 1345} {"train_loss": -11.505231857299805, "global_step": 226106, "epoch": 1345} {"train_loss": -11.573427200317383, "global_step": 226107, "epoch": 1345} {"train_loss": -11.39793586730957, "global_step": 226108, "epoch": 1345} {"train_loss": -11.617321014404297, "global_step": 226109, "epoch": 1345} {"train_loss": -11.607139587402344, "global_step": 226110, "epoch": 1345} {"train_loss": -11.510738372802734, "global_step": 226111, "epoch": 1345} {"train_loss": -11.83977222442627, "global_step": 226112, "epoch": 1345} {"train_loss": -11.586809158325195, "global_step": 226113, "epoch": 1345} {"train_loss": -11.670838356018066, "global_step": 226114, "epoch": 1345} {"train_loss": -11.726325035095215, "global_step": 226115, "epoch": 1345} {"train_loss": -11.491178512573242, "global_step": 226116, "epoch": 1345} {"train_loss": -11.759843826293945, "global_step": 226117, "epoch": 1345} {"train_loss": -11.67653751373291, "global_step": 226118, "epoch": 1345} {"train_loss": -11.823724746704102, "global_step": 226119, "epoch": 1345} {"train_loss": -11.581266403198242, "global_step": 226120, "epoch": 1345} {"train_loss": -11.783945083618164, "global_step": 226121, "epoch": 1345} {"train_loss": -11.572233200073242, "global_step": 226122, "epoch": 1345} {"train_loss": -11.51893424987793, "global_step": 226123, "epoch": 1345} {"train_loss": -11.851612091064453, "global_step": 226124, "epoch": 1345} {"train_loss": -11.55056381225586, "global_step": 226125, "epoch": 1345} {"train_loss": -11.589414596557617, "global_step": 226126, "epoch": 1345} {"train_loss": -11.405091915811811, "global_step": 226127, "epoch": 1345, "val_loss": 255234.15625, "train_action_mse_error": 1.623509168624878} {"train_loss": -11.31079387664795, "global_step": 226128, "epoch": 1346} {"train_loss": -11.567082405090332, "global_step": 226129, "epoch": 1346} {"train_loss": -11.835304260253906, "global_step": 226130, "epoch": 1346} {"train_loss": -11.567266464233398, "global_step": 226131, "epoch": 1346} {"train_loss": -11.844038009643555, "global_step": 226132, "epoch": 1346} {"train_loss": -11.296749114990234, "global_step": 226133, "epoch": 1346} {"train_loss": -11.423544883728027, "global_step": 226134, "epoch": 1346} {"train_loss": -11.691825866699219, "global_step": 226135, "epoch": 1346} {"train_loss": -11.37544059753418, "global_step": 226136, "epoch": 1346} {"train_loss": -11.658329010009766, "global_step": 226137, "epoch": 1346} {"train_loss": -11.536892890930176, "global_step": 226138, "epoch": 1346} {"train_loss": -11.324592590332031, "global_step": 226139, "epoch": 1346} {"train_loss": -11.823261260986328, "global_step": 226140, "epoch": 1346} {"train_loss": -10.87510871887207, "global_step": 226141, "epoch": 1346} {"train_loss": -11.307056427001953, "global_step": 226142, "epoch": 1346} {"train_loss": -11.547013282775879, "global_step": 226143, "epoch": 1346} {"train_loss": -11.77286434173584, "global_step": 226144, "epoch": 1346} {"train_loss": -11.56802749633789, "global_step": 226145, "epoch": 1346} {"train_loss": -11.870559692382812, "global_step": 226146, "epoch": 1346} {"train_loss": -11.796775817871094, "global_step": 226147, "epoch": 1346} {"train_loss": -11.545923233032227, "global_step": 226148, "epoch": 1346} {"train_loss": -11.822107315063477, "global_step": 226149, "epoch": 1346} {"train_loss": -11.578435897827148, "global_step": 226150, "epoch": 1346} {"train_loss": -11.824433326721191, "global_step": 226151, "epoch": 1346} {"train_loss": -11.840670585632324, "global_step": 226152, "epoch": 1346} {"train_loss": -11.856246948242188, "global_step": 226153, "epoch": 1346} {"train_loss": -11.872060775756836, "global_step": 226154, "epoch": 1346} {"train_loss": -11.724172592163086, "global_step": 226155, "epoch": 1346} {"train_loss": -11.650836944580078, "global_step": 226156, "epoch": 1346} {"train_loss": -11.933496475219727, "global_step": 226157, "epoch": 1346} {"train_loss": -11.597555160522461, "global_step": 226158, "epoch": 1346} {"train_loss": -11.901585578918457, "global_step": 226159, "epoch": 1346} {"train_loss": -11.55341911315918, "global_step": 226160, "epoch": 1346} {"train_loss": -11.8271484375, "global_step": 226161, "epoch": 1346} {"train_loss": -11.887001037597656, "global_step": 226162, "epoch": 1346} {"train_loss": -11.85611343383789, "global_step": 226163, "epoch": 1346} {"train_loss": -11.502135276794434, "global_step": 226164, "epoch": 1346} {"train_loss": -11.82887077331543, "global_step": 226165, "epoch": 1346} {"train_loss": -11.61497974395752, "global_step": 226166, "epoch": 1346} {"train_loss": -11.61737060546875, "global_step": 226167, "epoch": 1346} {"train_loss": -11.86430835723877, "global_step": 226168, "epoch": 1346} {"train_loss": -11.895323753356934, "global_step": 226169, "epoch": 1346} {"train_loss": -12.087846755981445, "global_step": 226170, "epoch": 1346} {"train_loss": -11.749641418457031, "global_step": 226171, "epoch": 1346} {"train_loss": -12.177042961120605, "global_step": 226172, "epoch": 1346} {"train_loss": -12.011259078979492, "global_step": 226173, "epoch": 1346} {"train_loss": -11.991055488586426, "global_step": 226174, "epoch": 1346} {"train_loss": -11.867541313171387, "global_step": 226175, "epoch": 1346} {"train_loss": -12.013154983520508, "global_step": 226176, "epoch": 1346} {"train_loss": -12.157167434692383, "global_step": 226177, "epoch": 1346} {"train_loss": -11.701804161071777, "global_step": 226178, "epoch": 1346} {"train_loss": -11.212945938110352, "global_step": 226179, "epoch": 1346} {"train_loss": -11.626504898071289, "global_step": 226180, "epoch": 1346} {"train_loss": -11.769318580627441, "global_step": 226181, "epoch": 1346} {"train_loss": -11.704495429992676, "global_step": 226182, "epoch": 1346} {"train_loss": -11.931689262390137, "global_step": 226183, "epoch": 1346} {"train_loss": -11.939404487609863, "global_step": 226184, "epoch": 1346} {"train_loss": -11.916848182678223, "global_step": 226185, "epoch": 1346} {"train_loss": -11.965003967285156, "global_step": 226186, "epoch": 1346} {"train_loss": -11.925413131713867, "global_step": 226187, "epoch": 1346} {"train_loss": -11.75257682800293, "global_step": 226188, "epoch": 1346} {"train_loss": -11.779666900634766, "global_step": 226189, "epoch": 1346} {"train_loss": -11.770330429077148, "global_step": 226190, "epoch": 1346} {"train_loss": -11.875707626342773, "global_step": 226191, "epoch": 1346} {"train_loss": -11.302270889282227, "global_step": 226192, "epoch": 1346} {"train_loss": -11.469738960266113, "global_step": 226193, "epoch": 1346} {"train_loss": -11.471965789794922, "global_step": 226194, "epoch": 1346} {"train_loss": -11.346349716186523, "global_step": 226195, "epoch": 1346} {"train_loss": -11.187759399414062, "global_step": 226196, "epoch": 1346} {"train_loss": -11.31361198425293, "global_step": 226197, "epoch": 1346} {"train_loss": -11.098906517028809, "global_step": 226198, "epoch": 1346} {"train_loss": -10.648380279541016, "global_step": 226199, "epoch": 1346} {"train_loss": -11.039344787597656, "global_step": 226200, "epoch": 1346} {"train_loss": -11.098285675048828, "global_step": 226201, "epoch": 1346} {"train_loss": -11.08543586730957, "global_step": 226202, "epoch": 1346} {"train_loss": -10.84287166595459, "global_step": 226203, "epoch": 1346} {"train_loss": -10.327848434448242, "global_step": 226204, "epoch": 1346} {"train_loss": -10.992500305175781, "global_step": 226205, "epoch": 1346} {"train_loss": -11.234285354614258, "global_step": 226206, "epoch": 1346} {"train_loss": -10.511738777160645, "global_step": 226207, "epoch": 1346} {"train_loss": -10.516088485717773, "global_step": 226208, "epoch": 1346} {"train_loss": -11.45610237121582, "global_step": 226209, "epoch": 1346} {"train_loss": -10.929327011108398, "global_step": 226210, "epoch": 1346} {"train_loss": -10.842679977416992, "global_step": 226211, "epoch": 1346} {"train_loss": -11.001583099365234, "global_step": 226212, "epoch": 1346} {"train_loss": -10.847236633300781, "global_step": 226213, "epoch": 1346} {"train_loss": -10.91148853302002, "global_step": 226214, "epoch": 1346} {"train_loss": -11.2446870803833, "global_step": 226215, "epoch": 1346} {"train_loss": -11.100027084350586, "global_step": 226216, "epoch": 1346} {"train_loss": -11.307463645935059, "global_step": 226217, "epoch": 1346} {"train_loss": -10.776540756225586, "global_step": 226218, "epoch": 1346} {"train_loss": -10.963306427001953, "global_step": 226219, "epoch": 1346} {"train_loss": -11.343939781188965, "global_step": 226220, "epoch": 1346} {"train_loss": -9.899239540100098, "global_step": 226221, "epoch": 1346} {"train_loss": -11.176666259765625, "global_step": 226222, "epoch": 1346} {"train_loss": -10.275715827941895, "global_step": 226223, "epoch": 1346} {"train_loss": -10.697047233581543, "global_step": 226224, "epoch": 1346} {"train_loss": -11.308184623718262, "global_step": 226225, "epoch": 1346} {"train_loss": -10.368401527404785, "global_step": 226226, "epoch": 1346} {"train_loss": -11.457965850830078, "global_step": 226227, "epoch": 1346} {"train_loss": -10.786338806152344, "global_step": 226228, "epoch": 1346} {"train_loss": -11.667102813720703, "global_step": 226229, "epoch": 1346} {"train_loss": -11.767820358276367, "global_step": 226230, "epoch": 1346} {"train_loss": -11.247245788574219, "global_step": 226231, "epoch": 1346} {"train_loss": -11.368522644042969, "global_step": 226232, "epoch": 1346} {"train_loss": -11.299654006958008, "global_step": 226233, "epoch": 1346} {"train_loss": -11.380878448486328, "global_step": 226234, "epoch": 1346} {"train_loss": -11.262595176696777, "global_step": 226235, "epoch": 1346} {"train_loss": -11.386740684509277, "global_step": 226236, "epoch": 1346} {"train_loss": -11.436273574829102, "global_step": 226237, "epoch": 1346} {"train_loss": -11.258516311645508, "global_step": 226238, "epoch": 1346} {"train_loss": -11.509570121765137, "global_step": 226239, "epoch": 1346} {"train_loss": -11.08629035949707, "global_step": 226240, "epoch": 1346} {"train_loss": -10.834471702575684, "global_step": 226241, "epoch": 1346} {"train_loss": -11.253969192504883, "global_step": 226242, "epoch": 1346} {"train_loss": -11.194404602050781, "global_step": 226243, "epoch": 1346} {"train_loss": -11.187088012695312, "global_step": 226244, "epoch": 1346} {"train_loss": -11.035179138183594, "global_step": 226245, "epoch": 1346} {"train_loss": -11.182476043701172, "global_step": 226246, "epoch": 1346} {"train_loss": -11.014849662780762, "global_step": 226247, "epoch": 1346} {"train_loss": -10.967306137084961, "global_step": 226248, "epoch": 1346} {"train_loss": -11.365489959716797, "global_step": 226249, "epoch": 1346} {"train_loss": -11.164371490478516, "global_step": 226250, "epoch": 1346} {"train_loss": -11.309869766235352, "global_step": 226251, "epoch": 1346} {"train_loss": -10.88083267211914, "global_step": 226252, "epoch": 1346} {"train_loss": -11.074483871459961, "global_step": 226253, "epoch": 1346} {"train_loss": -11.321844100952148, "global_step": 226254, "epoch": 1346} {"train_loss": -11.081040382385254, "global_step": 226255, "epoch": 1346} {"train_loss": -11.616273880004883, "global_step": 226256, "epoch": 1346} {"train_loss": -11.592317581176758, "global_step": 226257, "epoch": 1346} {"train_loss": -11.677826881408691, "global_step": 226258, "epoch": 1346} {"train_loss": -11.402466773986816, "global_step": 226259, "epoch": 1346} {"train_loss": -11.815526962280273, "global_step": 226260, "epoch": 1346} {"train_loss": -11.396635055541992, "global_step": 226261, "epoch": 1346} {"train_loss": -11.78303337097168, "global_step": 226262, "epoch": 1346} {"train_loss": -11.600380897521973, "global_step": 226263, "epoch": 1346} {"train_loss": -11.597112655639648, "global_step": 226264, "epoch": 1346} {"train_loss": -11.49020767211914, "global_step": 226265, "epoch": 1346} {"train_loss": -11.643024444580078, "global_step": 226266, "epoch": 1346} {"train_loss": -11.492761611938477, "global_step": 226267, "epoch": 1346} {"train_loss": -11.547540664672852, "global_step": 226268, "epoch": 1346} {"train_loss": -11.302806854248047, "global_step": 226269, "epoch": 1346} {"train_loss": -11.43002986907959, "global_step": 226270, "epoch": 1346} {"train_loss": -11.580342292785645, "global_step": 226271, "epoch": 1346} {"train_loss": -11.376977920532227, "global_step": 226272, "epoch": 1346} {"train_loss": -11.824491500854492, "global_step": 226273, "epoch": 1346} {"train_loss": -11.604369163513184, "global_step": 226274, "epoch": 1346} {"train_loss": -11.492095947265625, "global_step": 226275, "epoch": 1346} {"train_loss": -11.835667610168457, "global_step": 226276, "epoch": 1346} {"train_loss": -11.742167472839355, "global_step": 226277, "epoch": 1346} {"train_loss": -11.725857734680176, "global_step": 226278, "epoch": 1346} {"train_loss": -11.44813060760498, "global_step": 226279, "epoch": 1346} {"train_loss": -11.766059875488281, "global_step": 226280, "epoch": 1346} {"train_loss": -11.711982727050781, "global_step": 226281, "epoch": 1346} {"train_loss": -11.663034439086914, "global_step": 226282, "epoch": 1346} {"train_loss": -11.836177825927734, "global_step": 226283, "epoch": 1346} {"train_loss": -11.867876052856445, "global_step": 226284, "epoch": 1346} {"train_loss": -11.946310043334961, "global_step": 226285, "epoch": 1346} {"train_loss": -11.731792449951172, "global_step": 226286, "epoch": 1346} {"train_loss": -11.653959274291992, "global_step": 226287, "epoch": 1346} {"train_loss": -11.927092552185059, "global_step": 226288, "epoch": 1346} {"train_loss": -11.772951126098633, "global_step": 226289, "epoch": 1346} {"train_loss": -11.757619857788086, "global_step": 226290, "epoch": 1346} {"train_loss": -11.831949234008789, "global_step": 226291, "epoch": 1346} {"train_loss": -11.74921989440918, "global_step": 226292, "epoch": 1346} {"train_loss": -11.626396179199219, "global_step": 226293, "epoch": 1346} {"train_loss": -11.661966323852539, "global_step": 226294, "epoch": 1346} {"train_loss": -11.46612951301393, "global_step": 226295, "epoch": 1346, "val_loss": 258609.96875} {"train_loss": -11.789962768554688, "global_step": 226296, "epoch": 1347} {"train_loss": -11.759973526000977, "global_step": 226297, "epoch": 1347} {"train_loss": -11.63707160949707, "global_step": 226298, "epoch": 1347} {"train_loss": -11.980607986450195, "global_step": 226299, "epoch": 1347} {"train_loss": -11.823904037475586, "global_step": 226300, "epoch": 1347} {"train_loss": -12.110092163085938, "global_step": 226301, "epoch": 1347} {"train_loss": -11.950401306152344, "global_step": 226302, "epoch": 1347} {"train_loss": -11.925049781799316, "global_step": 226303, "epoch": 1347} {"train_loss": -11.698525428771973, "global_step": 226304, "epoch": 1347} {"train_loss": -11.782194137573242, "global_step": 226305, "epoch": 1347} {"train_loss": -11.756613731384277, "global_step": 226306, "epoch": 1347} {"train_loss": -11.712165832519531, "global_step": 226307, "epoch": 1347} {"train_loss": -11.618778228759766, "global_step": 226308, "epoch": 1347} {"train_loss": -11.923676490783691, "global_step": 226309, "epoch": 1347} {"train_loss": -11.716808319091797, "global_step": 226310, "epoch": 1347} {"train_loss": -11.49024486541748, "global_step": 226311, "epoch": 1347} {"train_loss": -12.086409568786621, "global_step": 226312, "epoch": 1347} {"train_loss": -11.692864418029785, "global_step": 226313, "epoch": 1347} {"train_loss": -11.834844589233398, "global_step": 226314, "epoch": 1347} {"train_loss": -11.814371109008789, "global_step": 226315, "epoch": 1347} {"train_loss": -11.923609733581543, "global_step": 226316, "epoch": 1347} {"train_loss": -11.974803924560547, "global_step": 226317, "epoch": 1347} {"train_loss": -11.298089981079102, "global_step": 226318, "epoch": 1347} {"train_loss": -11.579658508300781, "global_step": 226319, "epoch": 1347} {"train_loss": -11.100648880004883, "global_step": 226320, "epoch": 1347} {"train_loss": -11.480036735534668, "global_step": 226321, "epoch": 1347} {"train_loss": -10.611292839050293, "global_step": 226322, "epoch": 1347} {"train_loss": -11.341151237487793, "global_step": 226323, "epoch": 1347} {"train_loss": -11.649323463439941, "global_step": 226324, "epoch": 1347} {"train_loss": -10.638920783996582, "global_step": 226325, "epoch": 1347} {"train_loss": -10.014404296875, "global_step": 226326, "epoch": 1347} {"train_loss": -11.011384963989258, "global_step": 226327, "epoch": 1347} {"train_loss": -10.529576301574707, "global_step": 226328, "epoch": 1347} {"train_loss": -10.444070816040039, "global_step": 226329, "epoch": 1347} {"train_loss": -10.702199935913086, "global_step": 226330, "epoch": 1347} {"train_loss": -11.069400787353516, "global_step": 226331, "epoch": 1347} {"train_loss": -10.460116386413574, "global_step": 226332, "epoch": 1347} {"train_loss": -10.678579330444336, "global_step": 226333, "epoch": 1347} {"train_loss": -9.868535995483398, "global_step": 226334, "epoch": 1347} {"train_loss": -10.377995491027832, "global_step": 226335, "epoch": 1347} {"train_loss": -10.545256614685059, "global_step": 226336, "epoch": 1347} {"train_loss": -10.580371856689453, "global_step": 226337, "epoch": 1347} {"train_loss": -11.425518989562988, "global_step": 226338, "epoch": 1347} {"train_loss": -11.005926132202148, "global_step": 226339, "epoch": 1347} {"train_loss": -10.90455436706543, "global_step": 226340, "epoch": 1347} {"train_loss": -11.481012344360352, "global_step": 226341, "epoch": 1347} {"train_loss": -10.455230712890625, "global_step": 226342, "epoch": 1347} {"train_loss": -11.372943878173828, "global_step": 226343, "epoch": 1347} {"train_loss": -10.694662094116211, "global_step": 226344, "epoch": 1347} {"train_loss": -11.51392936706543, "global_step": 226345, "epoch": 1347} {"train_loss": -10.804389953613281, "global_step": 226346, "epoch": 1347} {"train_loss": -11.033279418945312, "global_step": 226347, "epoch": 1347} {"train_loss": -11.364277839660645, "global_step": 226348, "epoch": 1347} {"train_loss": -10.931934356689453, "global_step": 226349, "epoch": 1347} {"train_loss": -11.01740837097168, "global_step": 226350, "epoch": 1347} {"train_loss": -11.519905090332031, "global_step": 226351, "epoch": 1347} {"train_loss": -10.894408226013184, "global_step": 226352, "epoch": 1347} {"train_loss": -11.345959663391113, "global_step": 226353, "epoch": 1347} {"train_loss": -10.990625381469727, "global_step": 226354, "epoch": 1347} {"train_loss": -11.549126625061035, "global_step": 226355, "epoch": 1347} {"train_loss": -11.401004791259766, "global_step": 226356, "epoch": 1347} {"train_loss": -11.144731521606445, "global_step": 226357, "epoch": 1347} {"train_loss": -11.488545417785645, "global_step": 226358, "epoch": 1347} {"train_loss": -11.656634330749512, "global_step": 226359, "epoch": 1347} {"train_loss": -11.436790466308594, "global_step": 226360, "epoch": 1347} {"train_loss": -11.61133098602295, "global_step": 226361, "epoch": 1347} {"train_loss": -11.527099609375, "global_step": 226362, "epoch": 1347} {"train_loss": -11.567060470581055, "global_step": 226363, "epoch": 1347} {"train_loss": -11.614330291748047, "global_step": 226364, "epoch": 1347} {"train_loss": -11.768001556396484, "global_step": 226365, "epoch": 1347} {"train_loss": -11.7243070602417, "global_step": 226366, "epoch": 1347} {"train_loss": -11.792754173278809, "global_step": 226367, "epoch": 1347} {"train_loss": -11.68667221069336, "global_step": 226368, "epoch": 1347} {"train_loss": -11.565450668334961, "global_step": 226369, "epoch": 1347} {"train_loss": -11.681644439697266, "global_step": 226370, "epoch": 1347} {"train_loss": -11.715469360351562, "global_step": 226371, "epoch": 1347} {"train_loss": -11.545679092407227, "global_step": 226372, "epoch": 1347} {"train_loss": -11.637885093688965, "global_step": 226373, "epoch": 1347} {"train_loss": -11.861791610717773, "global_step": 226374, "epoch": 1347} {"train_loss": -11.84199333190918, "global_step": 226375, "epoch": 1347} {"train_loss": -11.702394485473633, "global_step": 226376, "epoch": 1347} {"train_loss": -11.669625282287598, "global_step": 226377, "epoch": 1347} {"train_loss": -11.936271667480469, "global_step": 226378, "epoch": 1347} {"train_loss": -11.716775894165039, "global_step": 226379, "epoch": 1347} {"train_loss": -11.931182861328125, "global_step": 226380, "epoch": 1347} {"train_loss": -11.730298042297363, "global_step": 226381, "epoch": 1347} {"train_loss": -11.773927688598633, "global_step": 226382, "epoch": 1347} {"train_loss": -11.380084991455078, "global_step": 226383, "epoch": 1347} {"train_loss": -11.821314811706543, "global_step": 226384, "epoch": 1347} {"train_loss": -11.755352973937988, "global_step": 226385, "epoch": 1347} {"train_loss": -11.832457542419434, "global_step": 226386, "epoch": 1347} {"train_loss": -11.879192352294922, "global_step": 226387, "epoch": 1347} {"train_loss": -11.616863250732422, "global_step": 226388, "epoch": 1347} {"train_loss": -11.877706527709961, "global_step": 226389, "epoch": 1347} {"train_loss": -12.042657852172852, "global_step": 226390, "epoch": 1347} {"train_loss": -11.75627613067627, "global_step": 226391, "epoch": 1347} {"train_loss": -11.638973236083984, "global_step": 226392, "epoch": 1347} {"train_loss": -11.5819091796875, "global_step": 226393, "epoch": 1347} {"train_loss": -11.58538818359375, "global_step": 226394, "epoch": 1347} {"train_loss": -11.907898902893066, "global_step": 226395, "epoch": 1347} {"train_loss": -11.716046333312988, "global_step": 226396, "epoch": 1347} {"train_loss": -11.746161460876465, "global_step": 226397, "epoch": 1347} {"train_loss": -11.751049041748047, "global_step": 226398, "epoch": 1347} {"train_loss": -11.515531539916992, "global_step": 226399, "epoch": 1347} {"train_loss": -11.494003295898438, "global_step": 226400, "epoch": 1347} {"train_loss": -11.940648078918457, "global_step": 226401, "epoch": 1347} {"train_loss": -11.710033416748047, "global_step": 226402, "epoch": 1347} {"train_loss": -10.954489707946777, "global_step": 226403, "epoch": 1347} {"train_loss": -11.242300033569336, "global_step": 226404, "epoch": 1347} {"train_loss": -11.768030166625977, "global_step": 226405, "epoch": 1347} {"train_loss": -11.294472694396973, "global_step": 226406, "epoch": 1347} {"train_loss": -11.317001342773438, "global_step": 226407, "epoch": 1347} {"train_loss": -11.694141387939453, "global_step": 226408, "epoch": 1347} {"train_loss": -11.67715072631836, "global_step": 226409, "epoch": 1347} {"train_loss": -11.620231628417969, "global_step": 226410, "epoch": 1347} {"train_loss": -11.788204193115234, "global_step": 226411, "epoch": 1347} {"train_loss": -11.755413055419922, "global_step": 226412, "epoch": 1347} {"train_loss": -11.841920852661133, "global_step": 226413, "epoch": 1347} {"train_loss": -11.417621612548828, "global_step": 226414, "epoch": 1347} {"train_loss": -11.771905899047852, "global_step": 226415, "epoch": 1347} {"train_loss": -11.330306053161621, "global_step": 226416, "epoch": 1347} {"train_loss": -11.645326614379883, "global_step": 226417, "epoch": 1347} {"train_loss": -11.222969055175781, "global_step": 226418, "epoch": 1347} {"train_loss": -11.43359375, "global_step": 226419, "epoch": 1347} {"train_loss": -11.33049201965332, "global_step": 226420, "epoch": 1347} {"train_loss": -11.690828323364258, "global_step": 226421, "epoch": 1347} {"train_loss": -11.582711219787598, "global_step": 226422, "epoch": 1347} {"train_loss": -11.583955764770508, "global_step": 226423, "epoch": 1347} {"train_loss": -11.421438217163086, "global_step": 226424, "epoch": 1347} {"train_loss": -11.642658233642578, "global_step": 226425, "epoch": 1347} {"train_loss": -11.108919143676758, "global_step": 226426, "epoch": 1347} {"train_loss": -11.596845626831055, "global_step": 226427, "epoch": 1347} {"train_loss": -11.283187866210938, "global_step": 226428, "epoch": 1347} {"train_loss": -11.420574188232422, "global_step": 226429, "epoch": 1347} {"train_loss": -11.619970321655273, "global_step": 226430, "epoch": 1347} {"train_loss": -11.724798202514648, "global_step": 226431, "epoch": 1347} {"train_loss": -10.94639778137207, "global_step": 226432, "epoch": 1347} {"train_loss": -11.517411231994629, "global_step": 226433, "epoch": 1347} {"train_loss": -11.80245304107666, "global_step": 226434, "epoch": 1347} {"train_loss": -11.732576370239258, "global_step": 226435, "epoch": 1347} {"train_loss": -11.584724426269531, "global_step": 226436, "epoch": 1347} {"train_loss": -12.05504035949707, "global_step": 226437, "epoch": 1347} {"train_loss": -11.324539184570312, "global_step": 226438, "epoch": 1347} {"train_loss": -11.532449722290039, "global_step": 226439, "epoch": 1347} {"train_loss": -11.837600708007812, "global_step": 226440, "epoch": 1347} {"train_loss": -11.159977912902832, "global_step": 226441, "epoch": 1347} {"train_loss": -11.650288581848145, "global_step": 226442, "epoch": 1347} {"train_loss": -11.65611457824707, "global_step": 226443, "epoch": 1347} {"train_loss": -10.949471473693848, "global_step": 226444, "epoch": 1347} {"train_loss": -11.599874496459961, "global_step": 226445, "epoch": 1347} {"train_loss": -10.83887004852295, "global_step": 226446, "epoch": 1347} {"train_loss": -10.354543685913086, "global_step": 226447, "epoch": 1347} {"train_loss": -11.47763729095459, "global_step": 226448, "epoch": 1347} {"train_loss": -11.204054832458496, "global_step": 226449, "epoch": 1347} {"train_loss": -10.108592987060547, "global_step": 226450, "epoch": 1347} {"train_loss": -11.676981925964355, "global_step": 226451, "epoch": 1347} {"train_loss": -10.797101974487305, "global_step": 226452, "epoch": 1347} {"train_loss": -11.149659156799316, "global_step": 226453, "epoch": 1347} {"train_loss": -10.894491195678711, "global_step": 226454, "epoch": 1347} {"train_loss": -10.7394437789917, "global_step": 226455, "epoch": 1347} {"train_loss": -11.339193344116211, "global_step": 226456, "epoch": 1347} {"train_loss": -10.90839958190918, "global_step": 226457, "epoch": 1347} {"train_loss": -11.180231094360352, "global_step": 226458, "epoch": 1347} {"train_loss": -10.326350212097168, "global_step": 226459, "epoch": 1347} {"train_loss": -10.235377311706543, "global_step": 226460, "epoch": 1347} {"train_loss": -10.755556106567383, "global_step": 226461, "epoch": 1347} {"train_loss": -10.23714542388916, "global_step": 226462, "epoch": 1347} {"train_loss": -11.404442560105096, "global_step": 226463, "epoch": 1347, "val_loss": 262323.625} {"train_loss": -10.332856178283691, "global_step": 226464, "epoch": 1348} {"train_loss": -10.517302513122559, "global_step": 226465, "epoch": 1348} {"train_loss": -11.317281723022461, "global_step": 226466, "epoch": 1348} {"train_loss": -10.501694679260254, "global_step": 226467, "epoch": 1348} {"train_loss": -10.493987083435059, "global_step": 226468, "epoch": 1348} {"train_loss": -11.289749145507812, "global_step": 226469, "epoch": 1348} {"train_loss": -10.90967845916748, "global_step": 226470, "epoch": 1348} {"train_loss": -11.059136390686035, "global_step": 226471, "epoch": 1348} {"train_loss": -11.255193710327148, "global_step": 226472, "epoch": 1348} {"train_loss": -10.920866012573242, "global_step": 226473, "epoch": 1348} {"train_loss": -11.162818908691406, "global_step": 226474, "epoch": 1348} {"train_loss": -11.161752700805664, "global_step": 226475, "epoch": 1348} {"train_loss": -10.803873062133789, "global_step": 226476, "epoch": 1348} {"train_loss": -11.361507415771484, "global_step": 226477, "epoch": 1348} {"train_loss": -11.161907196044922, "global_step": 226478, "epoch": 1348} {"train_loss": -11.389598846435547, "global_step": 226479, "epoch": 1348} {"train_loss": -11.517692565917969, "global_step": 226480, "epoch": 1348} {"train_loss": -11.150245666503906, "global_step": 226481, "epoch": 1348} {"train_loss": -11.649405479431152, "global_step": 226482, "epoch": 1348} {"train_loss": -11.361913681030273, "global_step": 226483, "epoch": 1348} {"train_loss": -11.479528427124023, "global_step": 226484, "epoch": 1348} {"train_loss": -11.503645896911621, "global_step": 226485, "epoch": 1348} {"train_loss": -11.580934524536133, "global_step": 226486, "epoch": 1348} {"train_loss": -11.59153938293457, "global_step": 226487, "epoch": 1348} {"train_loss": -11.871118545532227, "global_step": 226488, "epoch": 1348} {"train_loss": -11.442869186401367, "global_step": 226489, "epoch": 1348} {"train_loss": -11.6348876953125, "global_step": 226490, "epoch": 1348} {"train_loss": -11.53573989868164, "global_step": 226491, "epoch": 1348} {"train_loss": -11.430559158325195, "global_step": 226492, "epoch": 1348} {"train_loss": -11.769203186035156, "global_step": 226493, "epoch": 1348} {"train_loss": -11.680084228515625, "global_step": 226494, "epoch": 1348} {"train_loss": -11.527700424194336, "global_step": 226495, "epoch": 1348} {"train_loss": -12.042030334472656, "global_step": 226496, "epoch": 1348} {"train_loss": -11.534839630126953, "global_step": 226497, "epoch": 1348} {"train_loss": -11.647449493408203, "global_step": 226498, "epoch": 1348} {"train_loss": -11.492786407470703, "global_step": 226499, "epoch": 1348} {"train_loss": -11.744139671325684, "global_step": 226500, "epoch": 1348} {"train_loss": -11.383710861206055, "global_step": 226501, "epoch": 1348} {"train_loss": -11.692037582397461, "global_step": 226502, "epoch": 1348} {"train_loss": -11.437007904052734, "global_step": 226503, "epoch": 1348} {"train_loss": -11.51649284362793, "global_step": 226504, "epoch": 1348} {"train_loss": -11.553668022155762, "global_step": 226505, "epoch": 1348} {"train_loss": -11.599640846252441, "global_step": 226506, "epoch": 1348} {"train_loss": -11.756943702697754, "global_step": 226507, "epoch": 1348} {"train_loss": -11.740560531616211, "global_step": 226508, "epoch": 1348} {"train_loss": -11.601480484008789, "global_step": 226509, "epoch": 1348} {"train_loss": -11.47886848449707, "global_step": 226510, "epoch": 1348} {"train_loss": -11.709310531616211, "global_step": 226511, "epoch": 1348} {"train_loss": -11.68753433227539, "global_step": 226512, "epoch": 1348} {"train_loss": -11.6906099319458, "global_step": 226513, "epoch": 1348} {"train_loss": -11.845613479614258, "global_step": 226514, "epoch": 1348} {"train_loss": -11.613546371459961, "global_step": 226515, "epoch": 1348} {"train_loss": -11.525944709777832, "global_step": 226516, "epoch": 1348} {"train_loss": -11.598993301391602, "global_step": 226517, "epoch": 1348} {"train_loss": -11.726698875427246, "global_step": 226518, "epoch": 1348} {"train_loss": -11.91019058227539, "global_step": 226519, "epoch": 1348} {"train_loss": -10.774787902832031, "global_step": 226520, "epoch": 1348} {"train_loss": -11.344049453735352, "global_step": 226521, "epoch": 1348} {"train_loss": -11.837846755981445, "global_step": 226522, "epoch": 1348} {"train_loss": -11.040592193603516, "global_step": 226523, "epoch": 1348} {"train_loss": -10.792457580566406, "global_step": 226524, "epoch": 1348} {"train_loss": -11.822198867797852, "global_step": 226525, "epoch": 1348} {"train_loss": -10.835253715515137, "global_step": 226526, "epoch": 1348} {"train_loss": -11.166264533996582, "global_step": 226527, "epoch": 1348} {"train_loss": -11.471384048461914, "global_step": 226528, "epoch": 1348} {"train_loss": -10.67301082611084, "global_step": 226529, "epoch": 1348} {"train_loss": -11.62887954711914, "global_step": 226530, "epoch": 1348} {"train_loss": -11.60690975189209, "global_step": 226531, "epoch": 1348} {"train_loss": -11.191787719726562, "global_step": 226532, "epoch": 1348} {"train_loss": -11.8631591796875, "global_step": 226533, "epoch": 1348} {"train_loss": -11.099365234375, "global_step": 226534, "epoch": 1348} {"train_loss": -11.335264205932617, "global_step": 226535, "epoch": 1348} {"train_loss": -11.142220497131348, "global_step": 226536, "epoch": 1348} {"train_loss": -11.74512767791748, "global_step": 226537, "epoch": 1348} {"train_loss": -11.464139938354492, "global_step": 226538, "epoch": 1348} {"train_loss": -11.365094184875488, "global_step": 226539, "epoch": 1348} {"train_loss": -11.458307266235352, "global_step": 226540, "epoch": 1348} {"train_loss": -11.214544296264648, "global_step": 226541, "epoch": 1348} {"train_loss": -11.397587776184082, "global_step": 226542, "epoch": 1348} {"train_loss": -11.584051132202148, "global_step": 226543, "epoch": 1348} {"train_loss": -11.718936920166016, "global_step": 226544, "epoch": 1348} {"train_loss": -11.433538436889648, "global_step": 226545, "epoch": 1348} {"train_loss": -11.994901657104492, "global_step": 226546, "epoch": 1348} {"train_loss": -11.621088027954102, "global_step": 226547, "epoch": 1348} {"train_loss": -11.974825859069824, "global_step": 226548, "epoch": 1348} {"train_loss": -11.837675094604492, "global_step": 226549, "epoch": 1348} {"train_loss": -11.820229530334473, "global_step": 226550, "epoch": 1348} {"train_loss": -11.766777038574219, "global_step": 226551, "epoch": 1348} {"train_loss": -11.785297393798828, "global_step": 226552, "epoch": 1348} {"train_loss": -11.959333419799805, "global_step": 226553, "epoch": 1348} {"train_loss": -11.588768005371094, "global_step": 226554, "epoch": 1348} {"train_loss": -11.482297897338867, "global_step": 226555, "epoch": 1348} {"train_loss": -12.008211135864258, "global_step": 226556, "epoch": 1348} {"train_loss": -11.294620513916016, "global_step": 226557, "epoch": 1348} {"train_loss": -11.651863098144531, "global_step": 226558, "epoch": 1348} {"train_loss": -11.415467262268066, "global_step": 226559, "epoch": 1348} {"train_loss": -11.957115173339844, "global_step": 226560, "epoch": 1348} {"train_loss": -11.475234031677246, "global_step": 226561, "epoch": 1348} {"train_loss": -11.605485916137695, "global_step": 226562, "epoch": 1348} {"train_loss": -11.403326988220215, "global_step": 226563, "epoch": 1348} {"train_loss": -11.636926651000977, "global_step": 226564, "epoch": 1348} {"train_loss": -11.936935424804688, "global_step": 226565, "epoch": 1348} {"train_loss": -11.059186935424805, "global_step": 226566, "epoch": 1348} {"train_loss": -11.27771282196045, "global_step": 226567, "epoch": 1348} {"train_loss": -11.305882453918457, "global_step": 226568, "epoch": 1348} {"train_loss": -10.726940155029297, "global_step": 226569, "epoch": 1348} {"train_loss": -11.298455238342285, "global_step": 226570, "epoch": 1348} {"train_loss": -11.4627046585083, "global_step": 226571, "epoch": 1348} {"train_loss": -10.660186767578125, "global_step": 226572, "epoch": 1348} {"train_loss": -11.398591995239258, "global_step": 226573, "epoch": 1348} {"train_loss": -11.240179061889648, "global_step": 226574, "epoch": 1348} {"train_loss": -11.338306427001953, "global_step": 226575, "epoch": 1348} {"train_loss": -11.216386795043945, "global_step": 226576, "epoch": 1348} {"train_loss": -11.512256622314453, "global_step": 226577, "epoch": 1348} {"train_loss": -11.182111740112305, "global_step": 226578, "epoch": 1348} {"train_loss": -11.294881820678711, "global_step": 226579, "epoch": 1348} {"train_loss": -11.102928161621094, "global_step": 226580, "epoch": 1348} {"train_loss": -10.99078369140625, "global_step": 226581, "epoch": 1348} {"train_loss": -10.6526460647583, "global_step": 226582, "epoch": 1348} {"train_loss": -11.600329399108887, "global_step": 226583, "epoch": 1348} {"train_loss": -11.233966827392578, "global_step": 226584, "epoch": 1348} {"train_loss": -11.28835391998291, "global_step": 226585, "epoch": 1348} {"train_loss": -11.026154518127441, "global_step": 226586, "epoch": 1348} {"train_loss": -11.06820011138916, "global_step": 226587, "epoch": 1348} {"train_loss": -11.243825912475586, "global_step": 226588, "epoch": 1348} {"train_loss": -10.915146827697754, "global_step": 226589, "epoch": 1348} {"train_loss": -11.17429256439209, "global_step": 226590, "epoch": 1348} {"train_loss": -11.329216957092285, "global_step": 226591, "epoch": 1348} {"train_loss": -10.517105102539062, "global_step": 226592, "epoch": 1348} {"train_loss": -10.598225593566895, "global_step": 226593, "epoch": 1348} {"train_loss": -11.069604873657227, "global_step": 226594, "epoch": 1348} {"train_loss": -10.658246994018555, "global_step": 226595, "epoch": 1348} {"train_loss": -11.214208602905273, "global_step": 226596, "epoch": 1348} {"train_loss": -10.710128784179688, "global_step": 226597, "epoch": 1348} {"train_loss": -10.991954803466797, "global_step": 226598, "epoch": 1348} {"train_loss": -11.356290817260742, "global_step": 226599, "epoch": 1348} {"train_loss": -10.850746154785156, "global_step": 226600, "epoch": 1348} {"train_loss": -11.19764518737793, "global_step": 226601, "epoch": 1348} {"train_loss": -11.32491397857666, "global_step": 226602, "epoch": 1348} {"train_loss": -10.039712905883789, "global_step": 226603, "epoch": 1348} {"train_loss": -11.435009002685547, "global_step": 226604, "epoch": 1348} {"train_loss": -10.86740493774414, "global_step": 226605, "epoch": 1348} {"train_loss": -11.116316795349121, "global_step": 226606, "epoch": 1348} {"train_loss": -11.08358383178711, "global_step": 226607, "epoch": 1348} {"train_loss": -10.953752517700195, "global_step": 226608, "epoch": 1348} {"train_loss": -11.296151161193848, "global_step": 226609, "epoch": 1348} {"train_loss": -11.356878280639648, "global_step": 226610, "epoch": 1348} {"train_loss": -11.489398002624512, "global_step": 226611, "epoch": 1348} {"train_loss": -11.096460342407227, "global_step": 226612, "epoch": 1348} {"train_loss": -11.507944107055664, "global_step": 226613, "epoch": 1348} {"train_loss": -11.195378303527832, "global_step": 226614, "epoch": 1348} {"train_loss": -11.395883560180664, "global_step": 226615, "epoch": 1348} {"train_loss": -11.761651992797852, "global_step": 226616, "epoch": 1348} {"train_loss": -11.356926918029785, "global_step": 226617, "epoch": 1348} {"train_loss": -11.611825942993164, "global_step": 226618, "epoch": 1348} {"train_loss": -11.6090726852417, "global_step": 226619, "epoch": 1348} {"train_loss": -11.389118194580078, "global_step": 226620, "epoch": 1348} {"train_loss": -11.478029251098633, "global_step": 226621, "epoch": 1348} {"train_loss": -11.70134162902832, "global_step": 226622, "epoch": 1348} {"train_loss": -11.45992374420166, "global_step": 226623, "epoch": 1348} {"train_loss": -11.755596160888672, "global_step": 226624, "epoch": 1348} {"train_loss": -11.912469863891602, "global_step": 226625, "epoch": 1348} {"train_loss": -11.633806228637695, "global_step": 226626, "epoch": 1348} {"train_loss": -11.87266731262207, "global_step": 226627, "epoch": 1348} {"train_loss": -11.911147117614746, "global_step": 226628, "epoch": 1348} {"train_loss": -11.662734031677246, "global_step": 226629, "epoch": 1348} {"train_loss": -11.90378475189209, "global_step": 226630, "epoch": 1348} {"train_loss": -11.380503098169962, "global_step": 226631, "epoch": 1348, "val_loss": 261441.34375} {"train_loss": -11.934246063232422, "global_step": 226632, "epoch": 1349} {"train_loss": -11.682554244995117, "global_step": 226633, "epoch": 1349} {"train_loss": -11.829208374023438, "global_step": 226634, "epoch": 1349} {"train_loss": -11.972907066345215, "global_step": 226635, "epoch": 1349} {"train_loss": -11.962051391601562, "global_step": 226636, "epoch": 1349} {"train_loss": -11.77126693725586, "global_step": 226637, "epoch": 1349} {"train_loss": -11.87901496887207, "global_step": 226638, "epoch": 1349} {"train_loss": -11.666540145874023, "global_step": 226639, "epoch": 1349} {"train_loss": -11.562000274658203, "global_step": 226640, "epoch": 1349} {"train_loss": -11.669792175292969, "global_step": 226641, "epoch": 1349} {"train_loss": -11.658624649047852, "global_step": 226642, "epoch": 1349} {"train_loss": -11.722570419311523, "global_step": 226643, "epoch": 1349} {"train_loss": -11.635217666625977, "global_step": 226644, "epoch": 1349} {"train_loss": -11.976728439331055, "global_step": 226645, "epoch": 1349} {"train_loss": -11.771217346191406, "global_step": 226646, "epoch": 1349} {"train_loss": -11.764609336853027, "global_step": 226647, "epoch": 1349} {"train_loss": -11.599635124206543, "global_step": 226648, "epoch": 1349} {"train_loss": -11.734753608703613, "global_step": 226649, "epoch": 1349} {"train_loss": -11.901250839233398, "global_step": 226650, "epoch": 1349} {"train_loss": -11.559167861938477, "global_step": 226651, "epoch": 1349} {"train_loss": -11.74974250793457, "global_step": 226652, "epoch": 1349} {"train_loss": -11.73770809173584, "global_step": 226653, "epoch": 1349} {"train_loss": -11.464727401733398, "global_step": 226654, "epoch": 1349} {"train_loss": -11.595535278320312, "global_step": 226655, "epoch": 1349} {"train_loss": -11.675272941589355, "global_step": 226656, "epoch": 1349} {"train_loss": -11.475316047668457, "global_step": 226657, "epoch": 1349} {"train_loss": -11.653053283691406, "global_step": 226658, "epoch": 1349} {"train_loss": -11.62672233581543, "global_step": 226659, "epoch": 1349} {"train_loss": -11.894084930419922, "global_step": 226660, "epoch": 1349} {"train_loss": -11.640490531921387, "global_step": 226661, "epoch": 1349} {"train_loss": -11.465323448181152, "global_step": 226662, "epoch": 1349} {"train_loss": -11.425808906555176, "global_step": 226663, "epoch": 1349} {"train_loss": -11.211833953857422, "global_step": 226664, "epoch": 1349} {"train_loss": -11.708771705627441, "global_step": 226665, "epoch": 1349} {"train_loss": -10.966014862060547, "global_step": 226666, "epoch": 1349} {"train_loss": -10.715639114379883, "global_step": 226667, "epoch": 1349} {"train_loss": -11.209005355834961, "global_step": 226668, "epoch": 1349} {"train_loss": -11.157167434692383, "global_step": 226669, "epoch": 1349} {"train_loss": -10.915149688720703, "global_step": 226670, "epoch": 1349} {"train_loss": -10.444437980651855, "global_step": 226671, "epoch": 1349} {"train_loss": -10.037261009216309, "global_step": 226672, "epoch": 1349} {"train_loss": -10.102559089660645, "global_step": 226673, "epoch": 1349} {"train_loss": -9.019061088562012, "global_step": 226674, "epoch": 1349} {"train_loss": -10.383519172668457, "global_step": 226675, "epoch": 1349} {"train_loss": -9.172369956970215, "global_step": 226676, "epoch": 1349} {"train_loss": -9.040918350219727, "global_step": 226677, "epoch": 1349} {"train_loss": -9.94045639038086, "global_step": 226678, "epoch": 1349} {"train_loss": -9.70130729675293, "global_step": 226679, "epoch": 1349} {"train_loss": -8.975337982177734, "global_step": 226680, "epoch": 1349} {"train_loss": -8.234915733337402, "global_step": 226681, "epoch": 1349} {"train_loss": -10.338701248168945, "global_step": 226682, "epoch": 1349} {"train_loss": -10.149250030517578, "global_step": 226683, "epoch": 1349} {"train_loss": -9.566900253295898, "global_step": 226684, "epoch": 1349} {"train_loss": -9.97783088684082, "global_step": 226685, "epoch": 1349} {"train_loss": -10.250127792358398, "global_step": 226686, "epoch": 1349} {"train_loss": -9.505085945129395, "global_step": 226687, "epoch": 1349} {"train_loss": -9.284183502197266, "global_step": 226688, "epoch": 1349} {"train_loss": -10.948469161987305, "global_step": 226689, "epoch": 1349} {"train_loss": -10.427433967590332, "global_step": 226690, "epoch": 1349} {"train_loss": -10.48863697052002, "global_step": 226691, "epoch": 1349} {"train_loss": -11.028146743774414, "global_step": 226692, "epoch": 1349} {"train_loss": -11.004424095153809, "global_step": 226693, "epoch": 1349} {"train_loss": -10.316854476928711, "global_step": 226694, "epoch": 1349} {"train_loss": -11.430312156677246, "global_step": 226695, "epoch": 1349} {"train_loss": -10.834915161132812, "global_step": 226696, "epoch": 1349} {"train_loss": -11.130645751953125, "global_step": 226697, "epoch": 1349} {"train_loss": -11.245514869689941, "global_step": 226698, "epoch": 1349} {"train_loss": -10.931549072265625, "global_step": 226699, "epoch": 1349} {"train_loss": -11.318350791931152, "global_step": 226700, "epoch": 1349} {"train_loss": -11.22637939453125, "global_step": 226701, "epoch": 1349} {"train_loss": -11.076651573181152, "global_step": 226702, "epoch": 1349} {"train_loss": -11.019020080566406, "global_step": 226703, "epoch": 1349} {"train_loss": -11.209802627563477, "global_step": 226704, "epoch": 1349} {"train_loss": -11.473146438598633, "global_step": 226705, "epoch": 1349} {"train_loss": -11.172372817993164, "global_step": 226706, "epoch": 1349} {"train_loss": -11.239402770996094, "global_step": 226707, "epoch": 1349} {"train_loss": -11.488574981689453, "global_step": 226708, "epoch": 1349} {"train_loss": -11.328755378723145, "global_step": 226709, "epoch": 1349} {"train_loss": -11.386284828186035, "global_step": 226710, "epoch": 1349} {"train_loss": -11.229647636413574, "global_step": 226711, "epoch": 1349} {"train_loss": -11.479619026184082, "global_step": 226712, "epoch": 1349} {"train_loss": -11.386590957641602, "global_step": 226713, "epoch": 1349} {"train_loss": -11.415205001831055, "global_step": 226714, "epoch": 1349} {"train_loss": -11.426534652709961, "global_step": 226715, "epoch": 1349} {"train_loss": -11.596644401550293, "global_step": 226716, "epoch": 1349} {"train_loss": -11.181684494018555, "global_step": 226717, "epoch": 1349} {"train_loss": -11.382429122924805, "global_step": 226718, "epoch": 1349} {"train_loss": -11.429434776306152, "global_step": 226719, "epoch": 1349} {"train_loss": -11.661264419555664, "global_step": 226720, "epoch": 1349} {"train_loss": -11.648078918457031, "global_step": 226721, "epoch": 1349} {"train_loss": -11.561361312866211, "global_step": 226722, "epoch": 1349} {"train_loss": -11.705537796020508, "global_step": 226723, "epoch": 1349} {"train_loss": -11.519063949584961, "global_step": 226724, "epoch": 1349} {"train_loss": -11.660947799682617, "global_step": 226725, "epoch": 1349} {"train_loss": -11.750304222106934, "global_step": 226726, "epoch": 1349} {"train_loss": -11.80583381652832, "global_step": 226727, "epoch": 1349} {"train_loss": -11.747332572937012, "global_step": 226728, "epoch": 1349} {"train_loss": -11.771970748901367, "global_step": 226729, "epoch": 1349} {"train_loss": -11.733416557312012, "global_step": 226730, "epoch": 1349} {"train_loss": -11.955513000488281, "global_step": 226731, "epoch": 1349} {"train_loss": -11.77611255645752, "global_step": 226732, "epoch": 1349} {"train_loss": -12.024673461914062, "global_step": 226733, "epoch": 1349} {"train_loss": -11.877100944519043, "global_step": 226734, "epoch": 1349} {"train_loss": -11.59628677368164, "global_step": 226735, "epoch": 1349} {"train_loss": -11.832189559936523, "global_step": 226736, "epoch": 1349} {"train_loss": -11.830163955688477, "global_step": 226737, "epoch": 1349} {"train_loss": -11.652711868286133, "global_step": 226738, "epoch": 1349} {"train_loss": -11.825291633605957, "global_step": 226739, "epoch": 1349} {"train_loss": -11.83442497253418, "global_step": 226740, "epoch": 1349} {"train_loss": -12.03028678894043, "global_step": 226741, "epoch": 1349} {"train_loss": -11.87349796295166, "global_step": 226742, "epoch": 1349} {"train_loss": -11.801016807556152, "global_step": 226743, "epoch": 1349} {"train_loss": -11.723825454711914, "global_step": 226744, "epoch": 1349} {"train_loss": -11.943201065063477, "global_step": 226745, "epoch": 1349} {"train_loss": -11.726404190063477, "global_step": 226746, "epoch": 1349} {"train_loss": -12.018835067749023, "global_step": 226747, "epoch": 1349} {"train_loss": -12.018095016479492, "global_step": 226748, "epoch": 1349} {"train_loss": -11.816650390625, "global_step": 226749, "epoch": 1349} {"train_loss": -11.922714233398438, "global_step": 226750, "epoch": 1349} {"train_loss": -12.123586654663086, "global_step": 226751, "epoch": 1349} {"train_loss": -11.556714057922363, "global_step": 226752, "epoch": 1349} {"train_loss": -11.407114028930664, "global_step": 226753, "epoch": 1349} {"train_loss": -11.755109786987305, "global_step": 226754, "epoch": 1349} {"train_loss": -11.689224243164062, "global_step": 226755, "epoch": 1349} {"train_loss": -10.358455657958984, "global_step": 226756, "epoch": 1349} {"train_loss": -11.272212028503418, "global_step": 226757, "epoch": 1349} {"train_loss": -11.668508529663086, "global_step": 226758, "epoch": 1349} {"train_loss": -11.285069465637207, "global_step": 226759, "epoch": 1349} {"train_loss": -11.03188705444336, "global_step": 226760, "epoch": 1349} {"train_loss": -11.24520492553711, "global_step": 226761, "epoch": 1349} {"train_loss": -11.833477973937988, "global_step": 226762, "epoch": 1349} {"train_loss": -11.495844841003418, "global_step": 226763, "epoch": 1349} {"train_loss": -11.533478736877441, "global_step": 226764, "epoch": 1349} {"train_loss": -11.592916488647461, "global_step": 226765, "epoch": 1349} {"train_loss": -11.856902122497559, "global_step": 226766, "epoch": 1349} {"train_loss": -11.811704635620117, "global_step": 226767, "epoch": 1349} {"train_loss": -11.69958782196045, "global_step": 226768, "epoch": 1349} {"train_loss": -11.786222457885742, "global_step": 226769, "epoch": 1349} {"train_loss": -11.457267761230469, "global_step": 226770, "epoch": 1349} {"train_loss": -12.002321243286133, "global_step": 226771, "epoch": 1349} {"train_loss": -11.683934211730957, "global_step": 226772, "epoch": 1349} {"train_loss": -10.677777290344238, "global_step": 226773, "epoch": 1349} {"train_loss": -10.818334579467773, "global_step": 226774, "epoch": 1349} {"train_loss": -11.307907104492188, "global_step": 226775, "epoch": 1349} {"train_loss": -10.705514907836914, "global_step": 226776, "epoch": 1349} {"train_loss": -10.565260887145996, "global_step": 226777, "epoch": 1349} {"train_loss": -11.445911407470703, "global_step": 226778, "epoch": 1349} {"train_loss": -9.905654907226562, "global_step": 226779, "epoch": 1349} {"train_loss": -11.009401321411133, "global_step": 226780, "epoch": 1349} {"train_loss": -11.029991149902344, "global_step": 226781, "epoch": 1349} {"train_loss": -10.326292991638184, "global_step": 226782, "epoch": 1349} {"train_loss": -11.384281158447266, "global_step": 226783, "epoch": 1349} {"train_loss": -11.096224784851074, "global_step": 226784, "epoch": 1349} {"train_loss": -11.075704574584961, "global_step": 226785, "epoch": 1349} {"train_loss": -11.760061264038086, "global_step": 226786, "epoch": 1349} {"train_loss": -11.147212982177734, "global_step": 226787, "epoch": 1349} {"train_loss": -11.643302917480469, "global_step": 226788, "epoch": 1349} {"train_loss": -11.143146514892578, "global_step": 226789, "epoch": 1349} {"train_loss": -11.041736602783203, "global_step": 226790, "epoch": 1349} {"train_loss": -11.872138977050781, "global_step": 226791, "epoch": 1349} {"train_loss": -10.811511993408203, "global_step": 226792, "epoch": 1349} {"train_loss": -11.72238540649414, "global_step": 226793, "epoch": 1349} {"train_loss": -11.357948303222656, "global_step": 226794, "epoch": 1349} {"train_loss": -11.096977233886719, "global_step": 226795, "epoch": 1349} {"train_loss": -11.539972305297852, "global_step": 226796, "epoch": 1349} {"train_loss": -11.586528778076172, "global_step": 226797, "epoch": 1349} {"train_loss": -11.601603507995605, "global_step": 226798, "epoch": 1349} {"train_loss": -11.273906707763672, "global_step": 226799, "epoch": 1349, "val_loss": 259980.265625} {"train_loss": -11.748677253723145, "global_step": 226800, "epoch": 1350} {"train_loss": -11.694831848144531, "global_step": 226801, "epoch": 1350} {"train_loss": -11.639822006225586, "global_step": 226802, "epoch": 1350} {"train_loss": -11.475318908691406, "global_step": 226803, "epoch": 1350} {"train_loss": -11.505985260009766, "global_step": 226804, "epoch": 1350} {"train_loss": -11.671375274658203, "global_step": 226805, "epoch": 1350} {"train_loss": -11.370121002197266, "global_step": 226806, "epoch": 1350} {"train_loss": -11.765085220336914, "global_step": 226807, "epoch": 1350} {"train_loss": -11.617403030395508, "global_step": 226808, "epoch": 1350} {"train_loss": -11.827594757080078, "global_step": 226809, "epoch": 1350} {"train_loss": -11.587240219116211, "global_step": 226810, "epoch": 1350} {"train_loss": -11.694873809814453, "global_step": 226811, "epoch": 1350} {"train_loss": -11.760296821594238, "global_step": 226812, "epoch": 1350} {"train_loss": -11.750519752502441, "global_step": 226813, "epoch": 1350} {"train_loss": -11.689151763916016, "global_step": 226814, "epoch": 1350} {"train_loss": -11.826658248901367, "global_step": 226815, "epoch": 1350} {"train_loss": -11.97256088256836, "global_step": 226816, "epoch": 1350} {"train_loss": -11.819677352905273, "global_step": 226817, "epoch": 1350} {"train_loss": -11.625463485717773, "global_step": 226818, "epoch": 1350} {"train_loss": -11.548125267028809, "global_step": 226819, "epoch": 1350} {"train_loss": -11.789948463439941, "global_step": 226820, "epoch": 1350} {"train_loss": -11.837847709655762, "global_step": 226821, "epoch": 1350} {"train_loss": -11.616243362426758, "global_step": 226822, "epoch": 1350} {"train_loss": -11.871915817260742, "global_step": 226823, "epoch": 1350} {"train_loss": -11.88929557800293, "global_step": 226824, "epoch": 1350} {"train_loss": -11.40943717956543, "global_step": 226825, "epoch": 1350} {"train_loss": -11.873162269592285, "global_step": 226826, "epoch": 1350} {"train_loss": -11.202628135681152, "global_step": 226827, "epoch": 1350} {"train_loss": -11.785022735595703, "global_step": 226828, "epoch": 1350} {"train_loss": -11.262287139892578, "global_step": 226829, "epoch": 1350} {"train_loss": -11.514639854431152, "global_step": 226830, "epoch": 1350} {"train_loss": -11.465767860412598, "global_step": 226831, "epoch": 1350} {"train_loss": -11.681796073913574, "global_step": 226832, "epoch": 1350} {"train_loss": -11.743727684020996, "global_step": 226833, "epoch": 1350} {"train_loss": -11.404895782470703, "global_step": 226834, "epoch": 1350} {"train_loss": -11.773195266723633, "global_step": 226835, "epoch": 1350} {"train_loss": -11.357600212097168, "global_step": 226836, "epoch": 1350} {"train_loss": -11.939203262329102, "global_step": 226837, "epoch": 1350} {"train_loss": -11.298667907714844, "global_step": 226838, "epoch": 1350} {"train_loss": -11.711098670959473, "global_step": 226839, "epoch": 1350} {"train_loss": -11.188819885253906, "global_step": 226840, "epoch": 1350} {"train_loss": -11.8775634765625, "global_step": 226841, "epoch": 1350} {"train_loss": -11.435589790344238, "global_step": 226842, "epoch": 1350} {"train_loss": -11.16044807434082, "global_step": 226843, "epoch": 1350} {"train_loss": -11.182154655456543, "global_step": 226844, "epoch": 1350} {"train_loss": -11.180868148803711, "global_step": 226845, "epoch": 1350} {"train_loss": -10.693033218383789, "global_step": 226846, "epoch": 1350} {"train_loss": -11.653647422790527, "global_step": 226847, "epoch": 1350} {"train_loss": -10.533334732055664, "global_step": 226848, "epoch": 1350} {"train_loss": -10.997618675231934, "global_step": 226849, "epoch": 1350} {"train_loss": -11.152408599853516, "global_step": 226850, "epoch": 1350} {"train_loss": -10.192079544067383, "global_step": 226851, "epoch": 1350} {"train_loss": -11.453275680541992, "global_step": 226852, "epoch": 1350} {"train_loss": -10.489225387573242, "global_step": 226853, "epoch": 1350} {"train_loss": -11.217100143432617, "global_step": 226854, "epoch": 1350} {"train_loss": -10.573845863342285, "global_step": 226855, "epoch": 1350} {"train_loss": -10.321151733398438, "global_step": 226856, "epoch": 1350} {"train_loss": -11.370318412780762, "global_step": 226857, "epoch": 1350} {"train_loss": -10.374101638793945, "global_step": 226858, "epoch": 1350} {"train_loss": -10.899410247802734, "global_step": 226859, "epoch": 1350} {"train_loss": -9.970947265625, "global_step": 226860, "epoch": 1350} {"train_loss": -11.499073028564453, "global_step": 226861, "epoch": 1350} {"train_loss": -10.889326095581055, "global_step": 226862, "epoch": 1350} {"train_loss": -10.870953559875488, "global_step": 226863, "epoch": 1350} {"train_loss": -10.694952964782715, "global_step": 226864, "epoch": 1350} {"train_loss": -11.640203475952148, "global_step": 226865, "epoch": 1350} {"train_loss": -10.58358383178711, "global_step": 226866, "epoch": 1350} {"train_loss": -11.83670425415039, "global_step": 226867, "epoch": 1350} {"train_loss": -10.979377746582031, "global_step": 226868, "epoch": 1350} {"train_loss": -11.491788864135742, "global_step": 226869, "epoch": 1350} {"train_loss": -11.17651653289795, "global_step": 226870, "epoch": 1350} {"train_loss": -11.257698059082031, "global_step": 226871, "epoch": 1350} {"train_loss": -11.337696075439453, "global_step": 226872, "epoch": 1350} {"train_loss": -10.867145538330078, "global_step": 226873, "epoch": 1350} {"train_loss": -11.439963340759277, "global_step": 226874, "epoch": 1350} {"train_loss": -11.231082916259766, "global_step": 226875, "epoch": 1350} {"train_loss": -11.295660018920898, "global_step": 226876, "epoch": 1350} {"train_loss": -11.396883010864258, "global_step": 226877, "epoch": 1350} {"train_loss": -11.037323951721191, "global_step": 226878, "epoch": 1350} {"train_loss": -11.383792877197266, "global_step": 226879, "epoch": 1350} {"train_loss": -11.17923355102539, "global_step": 226880, "epoch": 1350} {"train_loss": -11.390579223632812, "global_step": 226881, "epoch": 1350} {"train_loss": -11.330427169799805, "global_step": 226882, "epoch": 1350} {"train_loss": -11.660545349121094, "global_step": 226883, "epoch": 1350} {"train_loss": -11.332327842712402, "global_step": 226884, "epoch": 1350} {"train_loss": -11.36640739440918, "global_step": 226885, "epoch": 1350} {"train_loss": -11.756214141845703, "global_step": 226886, "epoch": 1350} {"train_loss": -11.262102127075195, "global_step": 226887, "epoch": 1350} {"train_loss": -11.496259689331055, "global_step": 226888, "epoch": 1350} {"train_loss": -11.057711601257324, "global_step": 226889, "epoch": 1350} {"train_loss": -11.312603950500488, "global_step": 226890, "epoch": 1350} {"train_loss": -11.132184982299805, "global_step": 226891, "epoch": 1350} {"train_loss": -10.951512336730957, "global_step": 226892, "epoch": 1350} {"train_loss": -11.76833724975586, "global_step": 226893, "epoch": 1350} {"train_loss": -11.267029762268066, "global_step": 226894, "epoch": 1350} {"train_loss": -11.496980667114258, "global_step": 226895, "epoch": 1350} {"train_loss": -11.441899299621582, "global_step": 226896, "epoch": 1350} {"train_loss": -11.035938262939453, "global_step": 226897, "epoch": 1350} {"train_loss": -11.420026779174805, "global_step": 226898, "epoch": 1350} {"train_loss": -10.93291187286377, "global_step": 226899, "epoch": 1350} {"train_loss": -11.221192359924316, "global_step": 226900, "epoch": 1350} {"train_loss": -10.69600772857666, "global_step": 226901, "epoch": 1350} {"train_loss": -11.216079711914062, "global_step": 226902, "epoch": 1350} {"train_loss": -10.5186185836792, "global_step": 226903, "epoch": 1350} {"train_loss": -10.651695251464844, "global_step": 226904, "epoch": 1350} {"train_loss": -11.060115814208984, "global_step": 226905, "epoch": 1350} {"train_loss": -10.941093444824219, "global_step": 226906, "epoch": 1350} {"train_loss": -11.307428359985352, "global_step": 226907, "epoch": 1350} {"train_loss": -11.093687057495117, "global_step": 226908, "epoch": 1350} {"train_loss": -11.194096565246582, "global_step": 226909, "epoch": 1350} {"train_loss": -11.201776504516602, "global_step": 226910, "epoch": 1350} {"train_loss": -11.470141410827637, "global_step": 226911, "epoch": 1350} {"train_loss": -10.903951644897461, "global_step": 226912, "epoch": 1350} {"train_loss": -11.475902557373047, "global_step": 226913, "epoch": 1350} {"train_loss": -11.282123565673828, "global_step": 226914, "epoch": 1350} {"train_loss": -11.43951416015625, "global_step": 226915, "epoch": 1350} {"train_loss": -11.4019775390625, "global_step": 226916, "epoch": 1350} {"train_loss": -11.45875358581543, "global_step": 226917, "epoch": 1350} {"train_loss": -11.18162727355957, "global_step": 226918, "epoch": 1350} {"train_loss": -11.484884262084961, "global_step": 226919, "epoch": 1350} {"train_loss": -10.949104309082031, "global_step": 226920, "epoch": 1350} {"train_loss": -11.4461030960083, "global_step": 226921, "epoch": 1350} {"train_loss": -11.337525367736816, "global_step": 226922, "epoch": 1350} {"train_loss": -11.071907043457031, "global_step": 226923, "epoch": 1350} {"train_loss": -11.600994110107422, "global_step": 226924, "epoch": 1350} {"train_loss": -11.094260215759277, "global_step": 226925, "epoch": 1350} {"train_loss": -11.439371109008789, "global_step": 226926, "epoch": 1350} {"train_loss": -11.260128021240234, "global_step": 226927, "epoch": 1350} {"train_loss": -11.422969818115234, "global_step": 226928, "epoch": 1350} {"train_loss": -11.204517364501953, "global_step": 226929, "epoch": 1350} {"train_loss": -11.43840217590332, "global_step": 226930, "epoch": 1350} {"train_loss": -11.097270965576172, "global_step": 226931, "epoch": 1350} {"train_loss": -11.521219253540039, "global_step": 226932, "epoch": 1350} {"train_loss": -11.007782936096191, "global_step": 226933, "epoch": 1350} {"train_loss": -11.502703666687012, "global_step": 226934, "epoch": 1350} {"train_loss": -10.695337295532227, "global_step": 226935, "epoch": 1350} {"train_loss": -11.59797477722168, "global_step": 226936, "epoch": 1350} {"train_loss": -11.437394142150879, "global_step": 226937, "epoch": 1350} {"train_loss": -10.872705459594727, "global_step": 226938, "epoch": 1350} {"train_loss": -10.878711700439453, "global_step": 226939, "epoch": 1350} {"train_loss": -11.080888748168945, "global_step": 226940, "epoch": 1350} {"train_loss": -10.836430549621582, "global_step": 226941, "epoch": 1350} {"train_loss": -11.531107902526855, "global_step": 226942, "epoch": 1350} {"train_loss": -10.880382537841797, "global_step": 226943, "epoch": 1350} {"train_loss": -11.698795318603516, "global_step": 226944, "epoch": 1350} {"train_loss": -11.088237762451172, "global_step": 226945, "epoch": 1350} {"train_loss": -11.783967971801758, "global_step": 226946, "epoch": 1350} {"train_loss": -11.203524589538574, "global_step": 226947, "epoch": 1350} {"train_loss": -11.571279525756836, "global_step": 226948, "epoch": 1350} {"train_loss": -11.530933380126953, "global_step": 226949, "epoch": 1350} {"train_loss": -11.405763626098633, "global_step": 226950, "epoch": 1350} {"train_loss": -11.150777816772461, "global_step": 226951, "epoch": 1350} {"train_loss": -11.72044563293457, "global_step": 226952, "epoch": 1350} {"train_loss": -11.250210762023926, "global_step": 226953, "epoch": 1350} {"train_loss": -11.609003067016602, "global_step": 226954, "epoch": 1350} {"train_loss": -11.430602073669434, "global_step": 226955, "epoch": 1350} {"train_loss": -11.591045379638672, "global_step": 226956, "epoch": 1350} {"train_loss": -11.385666847229004, "global_step": 226957, "epoch": 1350} {"train_loss": -11.420291900634766, "global_step": 226958, "epoch": 1350} {"train_loss": -11.330497741699219, "global_step": 226959, "epoch": 1350} {"train_loss": -11.217202186584473, "global_step": 226960, "epoch": 1350} {"train_loss": -11.432286262512207, "global_step": 226961, "epoch": 1350} {"train_loss": -11.421960830688477, "global_step": 226962, "epoch": 1350} {"train_loss": -11.531129837036133, "global_step": 226963, "epoch": 1350} {"train_loss": -11.463668823242188, "global_step": 226964, "epoch": 1350} {"train_loss": -11.360225677490234, "global_step": 226965, "epoch": 1350} {"train_loss": -11.939981460571289, "global_step": 226966, "epoch": 1350} {"train_loss": -11.326681091671897, "global_step": 226967, "epoch": 1350, "train/sim_max_reward_0": 0.5544849454847991, "train/sim_max_reward_1": 0.9408179469236942, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.9303104537709144, "train/sim_max_reward_5": 0.5153906289425118, "test/sim_max_reward_4400000": 0.9961547245891661, "test/sim_max_reward_4400001": 0.8079204936615464, "test/sim_max_reward_4400002": 0.13755320815086983, "test/sim_max_reward_4400003": 0.006941294541223048, "test/sim_max_reward_4400004": 0.9357692322744546, "test/sim_max_reward_4400005": 0.9450532096022277, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.5429275275179266, "test/sim_max_reward_4400008": 0.5783399751992923, "test/sim_max_reward_4400009": 0.03420018545296306, "test/sim_max_reward_4400010": 0.9850358042718844, "test/sim_max_reward_4400011": 0.964899697206528, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.9526971191534858, "test/sim_max_reward_4400014": 0.5569304119290374, "test/sim_max_reward_4400015": 0.24260846104680017, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.8654915928499095, "test/sim_max_reward_4400019": 0.3757030913168348, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.3020821751537066, "test/sim_max_reward_4400022": 0.9830340269569552, "test/sim_max_reward_4400023": 0.14011232053518935, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.5657036043459233, "test/sim_max_reward_4400026": 0.10331360378122788, "test/sim_max_reward_4400027": 0.979583487371008, "test/sim_max_reward_4400028": 0.6964400925570827, "test/sim_max_reward_4400029": 0.630980140957891, "test/sim_max_reward_4400030": 0.9832329974615366, "test/sim_max_reward_4400031": 0.6122696935732266, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.1397239407266126, "test/sim_max_reward_4400034": 0.9405839534093862, "test/sim_max_reward_4400035": 0.9623077072489048, "test/sim_max_reward_4400036": 0.3672560106520132, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.06087655724947307, "test/sim_max_reward_4400042": 0.9915685168399396, "test/sim_max_reward_4400043": 0.019521873285325217, "test/sim_max_reward_4400044": 0.6212148550779396, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6568339958536533, "test/mean_score": 0.5307576494203373, "val_loss": 260563.5, "train_action_mse_error": 2.8486618995666504} {"train_loss": -11.602396011352539, "global_step": 226968, "epoch": 1351} {"train_loss": -11.813669204711914, "global_step": 226969, "epoch": 1351} {"train_loss": -11.570549011230469, "global_step": 226970, "epoch": 1351} {"train_loss": -11.789504051208496, "global_step": 226971, "epoch": 1351} {"train_loss": -11.73880386352539, "global_step": 226972, "epoch": 1351} {"train_loss": -11.401243209838867, "global_step": 226973, "epoch": 1351} {"train_loss": -11.751075744628906, "global_step": 226974, "epoch": 1351} {"train_loss": -11.335943222045898, "global_step": 226975, "epoch": 1351} {"train_loss": -11.919102668762207, "global_step": 226976, "epoch": 1351} {"train_loss": -11.468158721923828, "global_step": 226977, "epoch": 1351} {"train_loss": -11.712532997131348, "global_step": 226978, "epoch": 1351} {"train_loss": -11.692032814025879, "global_step": 226979, "epoch": 1351} {"train_loss": -11.668047904968262, "global_step": 226980, "epoch": 1351} {"train_loss": -11.68675422668457, "global_step": 226981, "epoch": 1351} {"train_loss": -11.767203330993652, "global_step": 226982, "epoch": 1351} {"train_loss": -11.550308227539062, "global_step": 226983, "epoch": 1351} {"train_loss": -11.691173553466797, "global_step": 226984, "epoch": 1351} {"train_loss": -11.609611511230469, "global_step": 226985, "epoch": 1351} {"train_loss": -11.127863883972168, "global_step": 226986, "epoch": 1351} {"train_loss": -11.422393798828125, "global_step": 226987, "epoch": 1351} {"train_loss": -11.096612930297852, "global_step": 226988, "epoch": 1351} {"train_loss": -11.67016887664795, "global_step": 226989, "epoch": 1351} {"train_loss": -10.768013000488281, "global_step": 226990, "epoch": 1351} {"train_loss": -11.899441719055176, "global_step": 226991, "epoch": 1351} {"train_loss": -10.941747665405273, "global_step": 226992, "epoch": 1351} {"train_loss": -11.10764217376709, "global_step": 226993, "epoch": 1351} {"train_loss": -11.275336265563965, "global_step": 226994, "epoch": 1351} {"train_loss": -11.207967758178711, "global_step": 226995, "epoch": 1351} {"train_loss": -11.566667556762695, "global_step": 226996, "epoch": 1351} {"train_loss": -11.375457763671875, "global_step": 226997, "epoch": 1351} {"train_loss": -11.132328033447266, "global_step": 226998, "epoch": 1351} {"train_loss": -11.690305709838867, "global_step": 226999, "epoch": 1351} {"train_loss": -11.344063758850098, "global_step": 227000, "epoch": 1351} {"train_loss": -11.65407943725586, "global_step": 227001, "epoch": 1351} {"train_loss": -11.435552597045898, "global_step": 227002, "epoch": 1351} {"train_loss": -11.219186782836914, "global_step": 227003, "epoch": 1351} {"train_loss": -11.628976821899414, "global_step": 227004, "epoch": 1351} {"train_loss": -11.15599250793457, "global_step": 227005, "epoch": 1351} {"train_loss": -11.335346221923828, "global_step": 227006, "epoch": 1351} {"train_loss": -11.69906234741211, "global_step": 227007, "epoch": 1351} {"train_loss": -11.253803253173828, "global_step": 227008, "epoch": 1351} {"train_loss": -11.55746078491211, "global_step": 227009, "epoch": 1351} {"train_loss": -11.28953742980957, "global_step": 227010, "epoch": 1351} {"train_loss": -11.72209644317627, "global_step": 227011, "epoch": 1351} {"train_loss": -11.385284423828125, "global_step": 227012, "epoch": 1351} {"train_loss": -11.546083450317383, "global_step": 227013, "epoch": 1351} {"train_loss": -11.215972900390625, "global_step": 227014, "epoch": 1351} {"train_loss": -10.726987838745117, "global_step": 227015, "epoch": 1351} {"train_loss": -11.500330924987793, "global_step": 227016, "epoch": 1351} {"train_loss": -10.918539047241211, "global_step": 227017, "epoch": 1351} {"train_loss": -11.349711418151855, "global_step": 227018, "epoch": 1351} {"train_loss": -11.3885498046875, "global_step": 227019, "epoch": 1351} {"train_loss": -11.044282913208008, "global_step": 227020, "epoch": 1351} {"train_loss": -11.822402954101562, "global_step": 227021, "epoch": 1351} {"train_loss": -11.001455307006836, "global_step": 227022, "epoch": 1351} {"train_loss": -11.576959609985352, "global_step": 227023, "epoch": 1351} {"train_loss": -10.748795509338379, "global_step": 227024, "epoch": 1351} {"train_loss": -11.555353164672852, "global_step": 227025, "epoch": 1351} {"train_loss": -11.246713638305664, "global_step": 227026, "epoch": 1351} {"train_loss": -11.514512062072754, "global_step": 227027, "epoch": 1351} {"train_loss": -11.468814849853516, "global_step": 227028, "epoch": 1351} {"train_loss": -10.94128131866455, "global_step": 227029, "epoch": 1351} {"train_loss": -11.528621673583984, "global_step": 227030, "epoch": 1351} {"train_loss": -11.483536720275879, "global_step": 227031, "epoch": 1351} {"train_loss": -11.551753997802734, "global_step": 227032, "epoch": 1351} {"train_loss": -11.526374816894531, "global_step": 227033, "epoch": 1351} {"train_loss": -11.590450286865234, "global_step": 227034, "epoch": 1351} {"train_loss": -11.651069641113281, "global_step": 227035, "epoch": 1351} {"train_loss": -11.257972717285156, "global_step": 227036, "epoch": 1351} {"train_loss": -11.495027542114258, "global_step": 227037, "epoch": 1351} {"train_loss": -11.283769607543945, "global_step": 227038, "epoch": 1351} {"train_loss": -11.641401290893555, "global_step": 227039, "epoch": 1351} {"train_loss": -11.547966003417969, "global_step": 227040, "epoch": 1351} {"train_loss": -11.495662689208984, "global_step": 227041, "epoch": 1351} {"train_loss": -11.572105407714844, "global_step": 227042, "epoch": 1351} {"train_loss": -11.362175941467285, "global_step": 227043, "epoch": 1351} {"train_loss": -11.456866264343262, "global_step": 227044, "epoch": 1351} {"train_loss": -11.46992301940918, "global_step": 227045, "epoch": 1351} {"train_loss": -11.223015785217285, "global_step": 227046, "epoch": 1351} {"train_loss": -11.504228591918945, "global_step": 227047, "epoch": 1351} {"train_loss": -11.358843803405762, "global_step": 227048, "epoch": 1351} {"train_loss": -11.305150985717773, "global_step": 227049, "epoch": 1351} {"train_loss": -11.774698257446289, "global_step": 227050, "epoch": 1351} {"train_loss": -11.270763397216797, "global_step": 227051, "epoch": 1351} {"train_loss": -10.926931381225586, "global_step": 227052, "epoch": 1351} {"train_loss": -11.721439361572266, "global_step": 227053, "epoch": 1351} {"train_loss": -11.300239562988281, "global_step": 227054, "epoch": 1351} {"train_loss": -11.495118141174316, "global_step": 227055, "epoch": 1351} {"train_loss": -11.447294235229492, "global_step": 227056, "epoch": 1351} {"train_loss": -11.667608261108398, "global_step": 227057, "epoch": 1351} {"train_loss": -11.461642265319824, "global_step": 227058, "epoch": 1351} {"train_loss": -11.742769241333008, "global_step": 227059, "epoch": 1351} {"train_loss": -11.578060150146484, "global_step": 227060, "epoch": 1351} {"train_loss": -11.472417831420898, "global_step": 227061, "epoch": 1351} {"train_loss": -11.685659408569336, "global_step": 227062, "epoch": 1351} {"train_loss": -11.559938430786133, "global_step": 227063, "epoch": 1351} {"train_loss": -11.596771240234375, "global_step": 227064, "epoch": 1351} {"train_loss": -11.728364944458008, "global_step": 227065, "epoch": 1351} {"train_loss": -11.688091278076172, "global_step": 227066, "epoch": 1351} {"train_loss": -11.451263427734375, "global_step": 227067, "epoch": 1351} {"train_loss": -11.629061698913574, "global_step": 227068, "epoch": 1351} {"train_loss": -11.198402404785156, "global_step": 227069, "epoch": 1351} {"train_loss": -11.720048904418945, "global_step": 227070, "epoch": 1351} {"train_loss": -11.02345085144043, "global_step": 227071, "epoch": 1351} {"train_loss": -11.869888305664062, "global_step": 227072, "epoch": 1351} {"train_loss": -11.179056167602539, "global_step": 227073, "epoch": 1351} {"train_loss": -11.806390762329102, "global_step": 227074, "epoch": 1351} {"train_loss": -11.626262664794922, "global_step": 227075, "epoch": 1351} {"train_loss": -11.498866081237793, "global_step": 227076, "epoch": 1351} {"train_loss": -11.533658981323242, "global_step": 227077, "epoch": 1351} {"train_loss": -11.470826148986816, "global_step": 227078, "epoch": 1351} {"train_loss": -11.560256958007812, "global_step": 227079, "epoch": 1351} {"train_loss": -10.986272811889648, "global_step": 227080, "epoch": 1351} {"train_loss": -11.230865478515625, "global_step": 227081, "epoch": 1351} {"train_loss": -10.831110000610352, "global_step": 227082, "epoch": 1351} {"train_loss": -11.14759635925293, "global_step": 227083, "epoch": 1351} {"train_loss": -11.57626724243164, "global_step": 227084, "epoch": 1351} {"train_loss": -10.743134498596191, "global_step": 227085, "epoch": 1351} {"train_loss": -11.757052421569824, "global_step": 227086, "epoch": 1351} {"train_loss": -11.066363334655762, "global_step": 227087, "epoch": 1351} {"train_loss": -11.48681640625, "global_step": 227088, "epoch": 1351} {"train_loss": -11.147141456604004, "global_step": 227089, "epoch": 1351} {"train_loss": -11.260658264160156, "global_step": 227090, "epoch": 1351} {"train_loss": -11.752721786499023, "global_step": 227091, "epoch": 1351} {"train_loss": -10.819938659667969, "global_step": 227092, "epoch": 1351} {"train_loss": -11.772293090820312, "global_step": 227093, "epoch": 1351} {"train_loss": -11.207235336303711, "global_step": 227094, "epoch": 1351} {"train_loss": -11.686275482177734, "global_step": 227095, "epoch": 1351} {"train_loss": -11.63133430480957, "global_step": 227096, "epoch": 1351} {"train_loss": -11.053871154785156, "global_step": 227097, "epoch": 1351} {"train_loss": -11.194714546203613, "global_step": 227098, "epoch": 1351} {"train_loss": -11.17225456237793, "global_step": 227099, "epoch": 1351} {"train_loss": -11.55769157409668, "global_step": 227100, "epoch": 1351} {"train_loss": -10.965579986572266, "global_step": 227101, "epoch": 1351} {"train_loss": -11.241704940795898, "global_step": 227102, "epoch": 1351} {"train_loss": -11.003284454345703, "global_step": 227103, "epoch": 1351} {"train_loss": -11.55127239227295, "global_step": 227104, "epoch": 1351} {"train_loss": -11.341679573059082, "global_step": 227105, "epoch": 1351} {"train_loss": -11.745251655578613, "global_step": 227106, "epoch": 1351} {"train_loss": -11.468116760253906, "global_step": 227107, "epoch": 1351} {"train_loss": -11.662630081176758, "global_step": 227108, "epoch": 1351} {"train_loss": -11.625306129455566, "global_step": 227109, "epoch": 1351} {"train_loss": -11.802640914916992, "global_step": 227110, "epoch": 1351} {"train_loss": -11.537558555603027, "global_step": 227111, "epoch": 1351} {"train_loss": -11.686545372009277, "global_step": 227112, "epoch": 1351} {"train_loss": -11.614490509033203, "global_step": 227113, "epoch": 1351} {"train_loss": -11.611599922180176, "global_step": 227114, "epoch": 1351} {"train_loss": -11.64167594909668, "global_step": 227115, "epoch": 1351} {"train_loss": -11.472014427185059, "global_step": 227116, "epoch": 1351} {"train_loss": -11.815801620483398, "global_step": 227117, "epoch": 1351} {"train_loss": -11.453985214233398, "global_step": 227118, "epoch": 1351} {"train_loss": -11.835734367370605, "global_step": 227119, "epoch": 1351} {"train_loss": -11.506457328796387, "global_step": 227120, "epoch": 1351} {"train_loss": -11.863499641418457, "global_step": 227121, "epoch": 1351} {"train_loss": -11.75969123840332, "global_step": 227122, "epoch": 1351} {"train_loss": -11.533133506774902, "global_step": 227123, "epoch": 1351} {"train_loss": -11.948053359985352, "global_step": 227124, "epoch": 1351} {"train_loss": -11.807625770568848, "global_step": 227125, "epoch": 1351} {"train_loss": -11.620235443115234, "global_step": 227126, "epoch": 1351} {"train_loss": -11.372121810913086, "global_step": 227127, "epoch": 1351} {"train_loss": -11.540016174316406, "global_step": 227128, "epoch": 1351} {"train_loss": -11.652217864990234, "global_step": 227129, "epoch": 1351} {"train_loss": -11.458013534545898, "global_step": 227130, "epoch": 1351} {"train_loss": -11.731544494628906, "global_step": 227131, "epoch": 1351} {"train_loss": -11.221891403198242, "global_step": 227132, "epoch": 1351} {"train_loss": -11.425090789794922, "global_step": 227133, "epoch": 1351} {"train_loss": -11.88086223602295, "global_step": 227134, "epoch": 1351} {"train_loss": -11.45806976727077, "global_step": 227135, "epoch": 1351, "val_loss": 263599.75} {"train_loss": -11.043100357055664, "global_step": 227136, "epoch": 1352} {"train_loss": -11.54837417602539, "global_step": 227137, "epoch": 1352} {"train_loss": -11.21505355834961, "global_step": 227138, "epoch": 1352} {"train_loss": -11.456770896911621, "global_step": 227139, "epoch": 1352} {"train_loss": -11.394388198852539, "global_step": 227140, "epoch": 1352} {"train_loss": -11.570556640625, "global_step": 227141, "epoch": 1352} {"train_loss": -11.514566421508789, "global_step": 227142, "epoch": 1352} {"train_loss": -11.487889289855957, "global_step": 227143, "epoch": 1352} {"train_loss": -11.411762237548828, "global_step": 227144, "epoch": 1352} {"train_loss": -11.717842102050781, "global_step": 227145, "epoch": 1352} {"train_loss": -11.27093505859375, "global_step": 227146, "epoch": 1352} {"train_loss": -11.379447937011719, "global_step": 227147, "epoch": 1352} {"train_loss": -11.661687850952148, "global_step": 227148, "epoch": 1352} {"train_loss": -11.195487976074219, "global_step": 227149, "epoch": 1352} {"train_loss": -10.807295799255371, "global_step": 227150, "epoch": 1352} {"train_loss": -11.29594612121582, "global_step": 227151, "epoch": 1352} {"train_loss": -11.163514137268066, "global_step": 227152, "epoch": 1352} {"train_loss": -11.089637756347656, "global_step": 227153, "epoch": 1352} {"train_loss": -11.688328742980957, "global_step": 227154, "epoch": 1352} {"train_loss": -11.180767059326172, "global_step": 227155, "epoch": 1352} {"train_loss": -11.38405704498291, "global_step": 227156, "epoch": 1352} {"train_loss": -11.560888290405273, "global_step": 227157, "epoch": 1352} {"train_loss": -11.261539459228516, "global_step": 227158, "epoch": 1352} {"train_loss": -11.734987258911133, "global_step": 227159, "epoch": 1352} {"train_loss": -11.48416519165039, "global_step": 227160, "epoch": 1352} {"train_loss": -11.355430603027344, "global_step": 227161, "epoch": 1352} {"train_loss": -11.45539665222168, "global_step": 227162, "epoch": 1352} {"train_loss": -11.460229873657227, "global_step": 227163, "epoch": 1352} {"train_loss": -11.364324569702148, "global_step": 227164, "epoch": 1352} {"train_loss": -11.565347671508789, "global_step": 227165, "epoch": 1352} {"train_loss": -11.719671249389648, "global_step": 227166, "epoch": 1352} {"train_loss": -11.760814666748047, "global_step": 227167, "epoch": 1352} {"train_loss": -11.611039161682129, "global_step": 227168, "epoch": 1352} {"train_loss": -11.754975318908691, "global_step": 227169, "epoch": 1352} {"train_loss": -11.692343711853027, "global_step": 227170, "epoch": 1352} {"train_loss": -11.694952964782715, "global_step": 227171, "epoch": 1352} {"train_loss": -11.560657501220703, "global_step": 227172, "epoch": 1352} {"train_loss": -11.63937759399414, "global_step": 227173, "epoch": 1352} {"train_loss": -11.578714370727539, "global_step": 227174, "epoch": 1352} {"train_loss": -11.38172721862793, "global_step": 227175, "epoch": 1352} {"train_loss": -11.805785179138184, "global_step": 227176, "epoch": 1352} {"train_loss": -11.594589233398438, "global_step": 227177, "epoch": 1352} {"train_loss": -11.564291000366211, "global_step": 227178, "epoch": 1352} {"train_loss": -11.86369514465332, "global_step": 227179, "epoch": 1352} {"train_loss": -11.517654418945312, "global_step": 227180, "epoch": 1352} {"train_loss": -11.836896896362305, "global_step": 227181, "epoch": 1352} {"train_loss": -11.592809677124023, "global_step": 227182, "epoch": 1352} {"train_loss": -12.049731254577637, "global_step": 227183, "epoch": 1352} {"train_loss": -12.036247253417969, "global_step": 227184, "epoch": 1352} {"train_loss": -11.846353530883789, "global_step": 227185, "epoch": 1352} {"train_loss": -11.94058895111084, "global_step": 227186, "epoch": 1352} {"train_loss": -11.953411102294922, "global_step": 227187, "epoch": 1352} {"train_loss": -11.986045837402344, "global_step": 227188, "epoch": 1352} {"train_loss": -11.862707138061523, "global_step": 227189, "epoch": 1352} {"train_loss": -11.682987213134766, "global_step": 227190, "epoch": 1352} {"train_loss": -11.696269035339355, "global_step": 227191, "epoch": 1352} {"train_loss": -12.054922103881836, "global_step": 227192, "epoch": 1352} {"train_loss": -11.463105201721191, "global_step": 227193, "epoch": 1352} {"train_loss": -11.843999862670898, "global_step": 227194, "epoch": 1352} {"train_loss": -11.873159408569336, "global_step": 227195, "epoch": 1352} {"train_loss": -11.745675086975098, "global_step": 227196, "epoch": 1352} {"train_loss": -11.646137237548828, "global_step": 227197, "epoch": 1352} {"train_loss": -12.06214714050293, "global_step": 227198, "epoch": 1352} {"train_loss": -11.77099609375, "global_step": 227199, "epoch": 1352} {"train_loss": -11.706588745117188, "global_step": 227200, "epoch": 1352} {"train_loss": -11.472650527954102, "global_step": 227201, "epoch": 1352} {"train_loss": -11.706786155700684, "global_step": 227202, "epoch": 1352} {"train_loss": -10.788375854492188, "global_step": 227203, "epoch": 1352} {"train_loss": -10.890790939331055, "global_step": 227204, "epoch": 1352} {"train_loss": -11.498146057128906, "global_step": 227205, "epoch": 1352} {"train_loss": -11.041455268859863, "global_step": 227206, "epoch": 1352} {"train_loss": -11.111427307128906, "global_step": 227207, "epoch": 1352} {"train_loss": -11.48498821258545, "global_step": 227208, "epoch": 1352} {"train_loss": -8.218490600585938, "global_step": 227209, "epoch": 1352} {"train_loss": -11.096031188964844, "global_step": 227210, "epoch": 1352} {"train_loss": -8.630626678466797, "global_step": 227211, "epoch": 1352} {"train_loss": -9.206846237182617, "global_step": 227212, "epoch": 1352} {"train_loss": -9.73655891418457, "global_step": 227213, "epoch": 1352} {"train_loss": -10.328545570373535, "global_step": 227214, "epoch": 1352} {"train_loss": -11.250051498413086, "global_step": 227215, "epoch": 1352} {"train_loss": -10.326577186584473, "global_step": 227216, "epoch": 1352} {"train_loss": -11.413654327392578, "global_step": 227217, "epoch": 1352} {"train_loss": -10.559392929077148, "global_step": 227218, "epoch": 1352} {"train_loss": -10.808454513549805, "global_step": 227219, "epoch": 1352} {"train_loss": -10.901881217956543, "global_step": 227220, "epoch": 1352} {"train_loss": -11.302659034729004, "global_step": 227221, "epoch": 1352} {"train_loss": -10.758079528808594, "global_step": 227222, "epoch": 1352} {"train_loss": -11.214652061462402, "global_step": 227223, "epoch": 1352} {"train_loss": -11.338672637939453, "global_step": 227224, "epoch": 1352} {"train_loss": -11.394580841064453, "global_step": 227225, "epoch": 1352} {"train_loss": -11.013901710510254, "global_step": 227226, "epoch": 1352} {"train_loss": -11.548099517822266, "global_step": 227227, "epoch": 1352} {"train_loss": -11.262445449829102, "global_step": 227228, "epoch": 1352} {"train_loss": -11.458976745605469, "global_step": 227229, "epoch": 1352} {"train_loss": -11.341169357299805, "global_step": 227230, "epoch": 1352} {"train_loss": -11.55959701538086, "global_step": 227231, "epoch": 1352} {"train_loss": -11.718066215515137, "global_step": 227232, "epoch": 1352} {"train_loss": -11.473966598510742, "global_step": 227233, "epoch": 1352} {"train_loss": -11.680139541625977, "global_step": 227234, "epoch": 1352} {"train_loss": -11.571332931518555, "global_step": 227235, "epoch": 1352} {"train_loss": -11.620376586914062, "global_step": 227236, "epoch": 1352} {"train_loss": -11.465599060058594, "global_step": 227237, "epoch": 1352} {"train_loss": -11.781888961791992, "global_step": 227238, "epoch": 1352} {"train_loss": -11.645143508911133, "global_step": 227239, "epoch": 1352} {"train_loss": -11.629992485046387, "global_step": 227240, "epoch": 1352} {"train_loss": -11.881231307983398, "global_step": 227241, "epoch": 1352} {"train_loss": -11.591560363769531, "global_step": 227242, "epoch": 1352} {"train_loss": -11.729652404785156, "global_step": 227243, "epoch": 1352} {"train_loss": -11.717469215393066, "global_step": 227244, "epoch": 1352} {"train_loss": -11.784209251403809, "global_step": 227245, "epoch": 1352} {"train_loss": -11.875733375549316, "global_step": 227246, "epoch": 1352} {"train_loss": -11.606517791748047, "global_step": 227247, "epoch": 1352} {"train_loss": -11.860200881958008, "global_step": 227248, "epoch": 1352} {"train_loss": -11.799120903015137, "global_step": 227249, "epoch": 1352} {"train_loss": -11.709275245666504, "global_step": 227250, "epoch": 1352} {"train_loss": -11.704743385314941, "global_step": 227251, "epoch": 1352} {"train_loss": -11.762642860412598, "global_step": 227252, "epoch": 1352} {"train_loss": -11.698763847351074, "global_step": 227253, "epoch": 1352} {"train_loss": -11.727052688598633, "global_step": 227254, "epoch": 1352} {"train_loss": -11.442408561706543, "global_step": 227255, "epoch": 1352} {"train_loss": -11.660541534423828, "global_step": 227256, "epoch": 1352} {"train_loss": -11.320777893066406, "global_step": 227257, "epoch": 1352} {"train_loss": -11.849681854248047, "global_step": 227258, "epoch": 1352} {"train_loss": -11.67005443572998, "global_step": 227259, "epoch": 1352} {"train_loss": -11.731072425842285, "global_step": 227260, "epoch": 1352} {"train_loss": -11.92864990234375, "global_step": 227261, "epoch": 1352} {"train_loss": -11.629633903503418, "global_step": 227262, "epoch": 1352} {"train_loss": -11.655521392822266, "global_step": 227263, "epoch": 1352} {"train_loss": -11.728358268737793, "global_step": 227264, "epoch": 1352} {"train_loss": -11.309186935424805, "global_step": 227265, "epoch": 1352} {"train_loss": -11.574468612670898, "global_step": 227266, "epoch": 1352} {"train_loss": -11.777175903320312, "global_step": 227267, "epoch": 1352} {"train_loss": -11.496679306030273, "global_step": 227268, "epoch": 1352} {"train_loss": -11.83311653137207, "global_step": 227269, "epoch": 1352} {"train_loss": -11.762153625488281, "global_step": 227270, "epoch": 1352} {"train_loss": -11.7416353225708, "global_step": 227271, "epoch": 1352} {"train_loss": -11.693891525268555, "global_step": 227272, "epoch": 1352} {"train_loss": -11.841670989990234, "global_step": 227273, "epoch": 1352} {"train_loss": -12.028127670288086, "global_step": 227274, "epoch": 1352} {"train_loss": -11.486457824707031, "global_step": 227275, "epoch": 1352} {"train_loss": -11.749306678771973, "global_step": 227276, "epoch": 1352} {"train_loss": -11.78756332397461, "global_step": 227277, "epoch": 1352} {"train_loss": -11.548440933227539, "global_step": 227278, "epoch": 1352} {"train_loss": -11.704007148742676, "global_step": 227279, "epoch": 1352} {"train_loss": -11.394819259643555, "global_step": 227280, "epoch": 1352} {"train_loss": -11.362081527709961, "global_step": 227281, "epoch": 1352} {"train_loss": -11.592172622680664, "global_step": 227282, "epoch": 1352} {"train_loss": -11.536308288574219, "global_step": 227283, "epoch": 1352} {"train_loss": -11.774005889892578, "global_step": 227284, "epoch": 1352} {"train_loss": -11.177457809448242, "global_step": 227285, "epoch": 1352} {"train_loss": -12.042549133300781, "global_step": 227286, "epoch": 1352} {"train_loss": -11.101753234863281, "global_step": 227287, "epoch": 1352} {"train_loss": -10.954164505004883, "global_step": 227288, "epoch": 1352} {"train_loss": -11.897236824035645, "global_step": 227289, "epoch": 1352} {"train_loss": -11.61782455444336, "global_step": 227290, "epoch": 1352} {"train_loss": -11.421867370605469, "global_step": 227291, "epoch": 1352} {"train_loss": -11.854787826538086, "global_step": 227292, "epoch": 1352} {"train_loss": -11.776481628417969, "global_step": 227293, "epoch": 1352} {"train_loss": -11.827177047729492, "global_step": 227294, "epoch": 1352} {"train_loss": -12.05945873260498, "global_step": 227295, "epoch": 1352} {"train_loss": -11.805997848510742, "global_step": 227296, "epoch": 1352} {"train_loss": -11.931659698486328, "global_step": 227297, "epoch": 1352} {"train_loss": -11.7940673828125, "global_step": 227298, "epoch": 1352} {"train_loss": -11.904848098754883, "global_step": 227299, "epoch": 1352} {"train_loss": -11.62276554107666, "global_step": 227300, "epoch": 1352} {"train_loss": -11.700872421264648, "global_step": 227301, "epoch": 1352} {"train_loss": -11.646251678466797, "global_step": 227302, "epoch": 1352} {"train_loss": -11.48841210774013, "global_step": 227303, "epoch": 1352, "val_loss": 257635.03125} {"train_loss": -11.272174835205078, "global_step": 227304, "epoch": 1353} {"train_loss": -10.44990062713623, "global_step": 227305, "epoch": 1353} {"train_loss": -10.378442764282227, "global_step": 227306, "epoch": 1353} {"train_loss": -10.665014266967773, "global_step": 227307, "epoch": 1353} {"train_loss": -9.394048690795898, "global_step": 227308, "epoch": 1353} {"train_loss": -10.136911392211914, "global_step": 227309, "epoch": 1353} {"train_loss": -9.431093215942383, "global_step": 227310, "epoch": 1353} {"train_loss": -10.392107009887695, "global_step": 227311, "epoch": 1353} {"train_loss": -10.25535774230957, "global_step": 227312, "epoch": 1353} {"train_loss": -11.605935096740723, "global_step": 227313, "epoch": 1353} {"train_loss": -10.513862609863281, "global_step": 227314, "epoch": 1353} {"train_loss": -11.432077407836914, "global_step": 227315, "epoch": 1353} {"train_loss": -11.01240348815918, "global_step": 227316, "epoch": 1353} {"train_loss": -11.249961853027344, "global_step": 227317, "epoch": 1353} {"train_loss": -11.106545448303223, "global_step": 227318, "epoch": 1353} {"train_loss": -10.887040138244629, "global_step": 227319, "epoch": 1353} {"train_loss": -10.757068634033203, "global_step": 227320, "epoch": 1353} {"train_loss": -10.067975997924805, "global_step": 227321, "epoch": 1353} {"train_loss": -11.029152870178223, "global_step": 227322, "epoch": 1353} {"train_loss": -10.416458129882812, "global_step": 227323, "epoch": 1353} {"train_loss": -11.498807907104492, "global_step": 227324, "epoch": 1353} {"train_loss": -10.736236572265625, "global_step": 227325, "epoch": 1353} {"train_loss": -11.509892463684082, "global_step": 227326, "epoch": 1353} {"train_loss": -11.159996032714844, "global_step": 227327, "epoch": 1353} {"train_loss": -10.813191413879395, "global_step": 227328, "epoch": 1353} {"train_loss": -11.634708404541016, "global_step": 227329, "epoch": 1353} {"train_loss": -10.838990211486816, "global_step": 227330, "epoch": 1353} {"train_loss": -10.980331420898438, "global_step": 227331, "epoch": 1353} {"train_loss": -11.225912094116211, "global_step": 227332, "epoch": 1353} {"train_loss": -10.9093017578125, "global_step": 227333, "epoch": 1353} {"train_loss": -10.924201011657715, "global_step": 227334, "epoch": 1353} {"train_loss": -11.591201782226562, "global_step": 227335, "epoch": 1353} {"train_loss": -10.685376167297363, "global_step": 227336, "epoch": 1353} {"train_loss": -11.722509384155273, "global_step": 227337, "epoch": 1353} {"train_loss": -11.03752326965332, "global_step": 227338, "epoch": 1353} {"train_loss": -11.299474716186523, "global_step": 227339, "epoch": 1353} {"train_loss": -11.634381294250488, "global_step": 227340, "epoch": 1353} {"train_loss": -10.925743103027344, "global_step": 227341, "epoch": 1353} {"train_loss": -11.233067512512207, "global_step": 227342, "epoch": 1353} {"train_loss": -11.40190315246582, "global_step": 227343, "epoch": 1353} {"train_loss": -11.491697311401367, "global_step": 227344, "epoch": 1353} {"train_loss": -11.392114639282227, "global_step": 227345, "epoch": 1353} {"train_loss": -11.524826049804688, "global_step": 227346, "epoch": 1353} {"train_loss": -11.259307861328125, "global_step": 227347, "epoch": 1353} {"train_loss": -11.672258377075195, "global_step": 227348, "epoch": 1353} {"train_loss": -11.568929672241211, "global_step": 227349, "epoch": 1353} {"train_loss": -11.356462478637695, "global_step": 227350, "epoch": 1353} {"train_loss": -11.488136291503906, "global_step": 227351, "epoch": 1353} {"train_loss": -11.591930389404297, "global_step": 227352, "epoch": 1353} {"train_loss": -11.567766189575195, "global_step": 227353, "epoch": 1353} {"train_loss": -11.345125198364258, "global_step": 227354, "epoch": 1353} {"train_loss": -11.813532829284668, "global_step": 227355, "epoch": 1353} {"train_loss": -11.339212417602539, "global_step": 227356, "epoch": 1353} {"train_loss": -11.563405990600586, "global_step": 227357, "epoch": 1353} {"train_loss": -11.800661087036133, "global_step": 227358, "epoch": 1353} {"train_loss": -10.863876342773438, "global_step": 227359, "epoch": 1353} {"train_loss": -11.611042022705078, "global_step": 227360, "epoch": 1353} {"train_loss": -11.388444900512695, "global_step": 227361, "epoch": 1353} {"train_loss": -11.959315299987793, "global_step": 227362, "epoch": 1353} {"train_loss": -11.69239330291748, "global_step": 227363, "epoch": 1353} {"train_loss": -11.630834579467773, "global_step": 227364, "epoch": 1353} {"train_loss": -11.64113998413086, "global_step": 227365, "epoch": 1353} {"train_loss": -11.85879135131836, "global_step": 227366, "epoch": 1353} {"train_loss": -11.483785629272461, "global_step": 227367, "epoch": 1353} {"train_loss": -11.91067886352539, "global_step": 227368, "epoch": 1353} {"train_loss": -11.746620178222656, "global_step": 227369, "epoch": 1353} {"train_loss": -11.764835357666016, "global_step": 227370, "epoch": 1353} {"train_loss": -11.854473114013672, "global_step": 227371, "epoch": 1353} {"train_loss": -11.737058639526367, "global_step": 227372, "epoch": 1353} {"train_loss": -11.925862312316895, "global_step": 227373, "epoch": 1353} {"train_loss": -12.106674194335938, "global_step": 227374, "epoch": 1353} {"train_loss": -11.582263946533203, "global_step": 227375, "epoch": 1353} {"train_loss": -11.886873245239258, "global_step": 227376, "epoch": 1353} {"train_loss": -11.938714981079102, "global_step": 227377, "epoch": 1353} {"train_loss": -11.838323593139648, "global_step": 227378, "epoch": 1353} {"train_loss": -11.552545547485352, "global_step": 227379, "epoch": 1353} {"train_loss": -11.883528709411621, "global_step": 227380, "epoch": 1353} {"train_loss": -11.327795028686523, "global_step": 227381, "epoch": 1353} {"train_loss": -11.534677505493164, "global_step": 227382, "epoch": 1353} {"train_loss": -11.628175735473633, "global_step": 227383, "epoch": 1353} {"train_loss": -11.959461212158203, "global_step": 227384, "epoch": 1353} {"train_loss": -11.72066879272461, "global_step": 227385, "epoch": 1353} {"train_loss": -11.639586448669434, "global_step": 227386, "epoch": 1353} {"train_loss": -11.473393440246582, "global_step": 227387, "epoch": 1353} {"train_loss": -11.381915092468262, "global_step": 227388, "epoch": 1353} {"train_loss": -10.009605407714844, "global_step": 227389, "epoch": 1353} {"train_loss": -11.970837593078613, "global_step": 227390, "epoch": 1353} {"train_loss": -11.371587753295898, "global_step": 227391, "epoch": 1353} {"train_loss": -11.130167961120605, "global_step": 227392, "epoch": 1353} {"train_loss": -11.420867919921875, "global_step": 227393, "epoch": 1353} {"train_loss": -11.57685661315918, "global_step": 227394, "epoch": 1353} {"train_loss": -10.909063339233398, "global_step": 227395, "epoch": 1353} {"train_loss": -11.00554370880127, "global_step": 227396, "epoch": 1353} {"train_loss": -11.770915985107422, "global_step": 227397, "epoch": 1353} {"train_loss": -11.436504364013672, "global_step": 227398, "epoch": 1353} {"train_loss": -11.457406997680664, "global_step": 227399, "epoch": 1353} {"train_loss": -11.797479629516602, "global_step": 227400, "epoch": 1353} {"train_loss": -11.92929744720459, "global_step": 227401, "epoch": 1353} {"train_loss": -11.199485778808594, "global_step": 227402, "epoch": 1353} {"train_loss": -11.469161033630371, "global_step": 227403, "epoch": 1353} {"train_loss": -11.464203834533691, "global_step": 227404, "epoch": 1353} {"train_loss": -10.466151237487793, "global_step": 227405, "epoch": 1353} {"train_loss": -10.663522720336914, "global_step": 227406, "epoch": 1353} {"train_loss": -11.585773468017578, "global_step": 227407, "epoch": 1353} {"train_loss": -11.342288970947266, "global_step": 227408, "epoch": 1353} {"train_loss": -11.0858793258667, "global_step": 227409, "epoch": 1353} {"train_loss": -11.675121307373047, "global_step": 227410, "epoch": 1353} {"train_loss": -11.594417572021484, "global_step": 227411, "epoch": 1353} {"train_loss": -11.656435012817383, "global_step": 227412, "epoch": 1353} {"train_loss": -11.752422332763672, "global_step": 227413, "epoch": 1353} {"train_loss": -11.722539901733398, "global_step": 227414, "epoch": 1353} {"train_loss": -11.41324234008789, "global_step": 227415, "epoch": 1353} {"train_loss": -11.646964073181152, "global_step": 227416, "epoch": 1353} {"train_loss": -11.696845054626465, "global_step": 227417, "epoch": 1353} {"train_loss": -11.204017639160156, "global_step": 227418, "epoch": 1353} {"train_loss": -11.40652847290039, "global_step": 227419, "epoch": 1353} {"train_loss": -11.20556926727295, "global_step": 227420, "epoch": 1353} {"train_loss": -11.518211364746094, "global_step": 227421, "epoch": 1353} {"train_loss": -11.493343353271484, "global_step": 227422, "epoch": 1353} {"train_loss": -11.058176040649414, "global_step": 227423, "epoch": 1353} {"train_loss": -11.799836158752441, "global_step": 227424, "epoch": 1353} {"train_loss": -11.192573547363281, "global_step": 227425, "epoch": 1353} {"train_loss": -11.591386795043945, "global_step": 227426, "epoch": 1353} {"train_loss": -11.51724910736084, "global_step": 227427, "epoch": 1353} {"train_loss": -11.631046295166016, "global_step": 227428, "epoch": 1353} {"train_loss": -11.134033203125, "global_step": 227429, "epoch": 1353} {"train_loss": -11.933752059936523, "global_step": 227430, "epoch": 1353} {"train_loss": -11.33471965789795, "global_step": 227431, "epoch": 1353} {"train_loss": -11.268921852111816, "global_step": 227432, "epoch": 1353} {"train_loss": -11.639856338500977, "global_step": 227433, "epoch": 1353} {"train_loss": -10.06617546081543, "global_step": 227434, "epoch": 1353} {"train_loss": -12.011144638061523, "global_step": 227435, "epoch": 1353} {"train_loss": -10.4453763961792, "global_step": 227436, "epoch": 1353} {"train_loss": -11.105777740478516, "global_step": 227437, "epoch": 1353} {"train_loss": -11.296323776245117, "global_step": 227438, "epoch": 1353} {"train_loss": -10.188812255859375, "global_step": 227439, "epoch": 1353} {"train_loss": -11.389558792114258, "global_step": 227440, "epoch": 1353} {"train_loss": -10.963615417480469, "global_step": 227441, "epoch": 1353} {"train_loss": -11.076408386230469, "global_step": 227442, "epoch": 1353} {"train_loss": -10.848506927490234, "global_step": 227443, "epoch": 1353} {"train_loss": -10.354307174682617, "global_step": 227444, "epoch": 1353} {"train_loss": -10.92546272277832, "global_step": 227445, "epoch": 1353} {"train_loss": -11.479991912841797, "global_step": 227446, "epoch": 1353} {"train_loss": -10.630247116088867, "global_step": 227447, "epoch": 1353} {"train_loss": -11.451909065246582, "global_step": 227448, "epoch": 1353} {"train_loss": -10.649141311645508, "global_step": 227449, "epoch": 1353} {"train_loss": -11.034523010253906, "global_step": 227450, "epoch": 1353} {"train_loss": -10.471036911010742, "global_step": 227451, "epoch": 1353} {"train_loss": -11.055130958557129, "global_step": 227452, "epoch": 1353} {"train_loss": -11.092023849487305, "global_step": 227453, "epoch": 1353} {"train_loss": -10.845939636230469, "global_step": 227454, "epoch": 1353} {"train_loss": -11.362013816833496, "global_step": 227455, "epoch": 1353} {"train_loss": -10.8480806350708, "global_step": 227456, "epoch": 1353} {"train_loss": -11.333868980407715, "global_step": 227457, "epoch": 1353} {"train_loss": -11.248580932617188, "global_step": 227458, "epoch": 1353} {"train_loss": -10.737425804138184, "global_step": 227459, "epoch": 1353} {"train_loss": -11.462553977966309, "global_step": 227460, "epoch": 1353} {"train_loss": -11.562095642089844, "global_step": 227461, "epoch": 1353} {"train_loss": -11.220956802368164, "global_step": 227462, "epoch": 1353} {"train_loss": -11.265767097473145, "global_step": 227463, "epoch": 1353} {"train_loss": -11.60992431640625, "global_step": 227464, "epoch": 1353} {"train_loss": -11.6260404586792, "global_step": 227465, "epoch": 1353} {"train_loss": -11.334421157836914, "global_step": 227466, "epoch": 1353} {"train_loss": -11.32150936126709, "global_step": 227467, "epoch": 1353} {"train_loss": -11.27271556854248, "global_step": 227468, "epoch": 1353} {"train_loss": -11.716462135314941, "global_step": 227469, "epoch": 1353} {"train_loss": -11.554788589477539, "global_step": 227470, "epoch": 1353} {"train_loss": -11.279339705194745, "global_step": 227471, "epoch": 1353, "val_loss": 260795.03125} {"train_loss": -11.458154678344727, "global_step": 227472, "epoch": 1354} {"train_loss": -11.456228256225586, "global_step": 227473, "epoch": 1354} {"train_loss": -11.508508682250977, "global_step": 227474, "epoch": 1354} {"train_loss": -11.637404441833496, "global_step": 227475, "epoch": 1354} {"train_loss": -11.34733772277832, "global_step": 227476, "epoch": 1354} {"train_loss": -11.315367698669434, "global_step": 227477, "epoch": 1354} {"train_loss": -11.589014053344727, "global_step": 227478, "epoch": 1354} {"train_loss": -11.746382713317871, "global_step": 227479, "epoch": 1354} {"train_loss": -11.710518836975098, "global_step": 227480, "epoch": 1354} {"train_loss": -11.477852821350098, "global_step": 227481, "epoch": 1354} {"train_loss": -11.465071678161621, "global_step": 227482, "epoch": 1354} {"train_loss": -11.771648406982422, "global_step": 227483, "epoch": 1354} {"train_loss": -11.502250671386719, "global_step": 227484, "epoch": 1354} {"train_loss": -11.537359237670898, "global_step": 227485, "epoch": 1354} {"train_loss": -11.565945625305176, "global_step": 227486, "epoch": 1354} {"train_loss": -11.61227035522461, "global_step": 227487, "epoch": 1354} {"train_loss": -11.782744407653809, "global_step": 227488, "epoch": 1354} {"train_loss": -11.450578689575195, "global_step": 227489, "epoch": 1354} {"train_loss": -11.70138168334961, "global_step": 227490, "epoch": 1354} {"train_loss": -11.356708526611328, "global_step": 227491, "epoch": 1354} {"train_loss": -11.667437553405762, "global_step": 227492, "epoch": 1354} {"train_loss": -11.610916137695312, "global_step": 227493, "epoch": 1354} {"train_loss": -11.791864395141602, "global_step": 227494, "epoch": 1354} {"train_loss": -11.498855590820312, "global_step": 227495, "epoch": 1354} {"train_loss": -11.82550048828125, "global_step": 227496, "epoch": 1354} {"train_loss": -11.669961929321289, "global_step": 227497, "epoch": 1354} {"train_loss": -11.61282730102539, "global_step": 227498, "epoch": 1354} {"train_loss": -11.87435531616211, "global_step": 227499, "epoch": 1354} {"train_loss": -11.777555465698242, "global_step": 227500, "epoch": 1354} {"train_loss": -11.787788391113281, "global_step": 227501, "epoch": 1354} {"train_loss": -11.617668151855469, "global_step": 227502, "epoch": 1354} {"train_loss": -11.68851089477539, "global_step": 227503, "epoch": 1354} {"train_loss": -11.862319946289062, "global_step": 227504, "epoch": 1354} {"train_loss": -11.547933578491211, "global_step": 227505, "epoch": 1354} {"train_loss": -11.734552383422852, "global_step": 227506, "epoch": 1354} {"train_loss": -11.72998046875, "global_step": 227507, "epoch": 1354} {"train_loss": -11.698857307434082, "global_step": 227508, "epoch": 1354} {"train_loss": -11.842986106872559, "global_step": 227509, "epoch": 1354} {"train_loss": -11.783949851989746, "global_step": 227510, "epoch": 1354} {"train_loss": -11.865730285644531, "global_step": 227511, "epoch": 1354} {"train_loss": -11.630880355834961, "global_step": 227512, "epoch": 1354} {"train_loss": -11.855982780456543, "global_step": 227513, "epoch": 1354} {"train_loss": -11.666877746582031, "global_step": 227514, "epoch": 1354} {"train_loss": -11.906306266784668, "global_step": 227515, "epoch": 1354} {"train_loss": -11.469929695129395, "global_step": 227516, "epoch": 1354} {"train_loss": -11.987998008728027, "global_step": 227517, "epoch": 1354} {"train_loss": -11.782581329345703, "global_step": 227518, "epoch": 1354} {"train_loss": -11.77281379699707, "global_step": 227519, "epoch": 1354} {"train_loss": -12.07829761505127, "global_step": 227520, "epoch": 1354} {"train_loss": -11.79855728149414, "global_step": 227521, "epoch": 1354} {"train_loss": -11.884024620056152, "global_step": 227522, "epoch": 1354} {"train_loss": -11.704419136047363, "global_step": 227523, "epoch": 1354} {"train_loss": -12.16785717010498, "global_step": 227524, "epoch": 1354} {"train_loss": -12.109418869018555, "global_step": 227525, "epoch": 1354} {"train_loss": -12.096906661987305, "global_step": 227526, "epoch": 1354} {"train_loss": -11.830143928527832, "global_step": 227527, "epoch": 1354} {"train_loss": -11.97938346862793, "global_step": 227528, "epoch": 1354} {"train_loss": -12.069281578063965, "global_step": 227529, "epoch": 1354} {"train_loss": -11.896713256835938, "global_step": 227530, "epoch": 1354} {"train_loss": -11.871305465698242, "global_step": 227531, "epoch": 1354} {"train_loss": -12.151981353759766, "global_step": 227532, "epoch": 1354} {"train_loss": -11.909032821655273, "global_step": 227533, "epoch": 1354} {"train_loss": -12.079903602600098, "global_step": 227534, "epoch": 1354} {"train_loss": -11.842814445495605, "global_step": 227535, "epoch": 1354} {"train_loss": -12.021110534667969, "global_step": 227536, "epoch": 1354} {"train_loss": -11.730253219604492, "global_step": 227537, "epoch": 1354} {"train_loss": -12.039170265197754, "global_step": 227538, "epoch": 1354} {"train_loss": -11.727880477905273, "global_step": 227539, "epoch": 1354} {"train_loss": -11.87281322479248, "global_step": 227540, "epoch": 1354} {"train_loss": -11.648669242858887, "global_step": 227541, "epoch": 1354} {"train_loss": -11.178096771240234, "global_step": 227542, "epoch": 1354} {"train_loss": -11.361133575439453, "global_step": 227543, "epoch": 1354} {"train_loss": -11.505842208862305, "global_step": 227544, "epoch": 1354} {"train_loss": -11.73358154296875, "global_step": 227545, "epoch": 1354} {"train_loss": -10.794317245483398, "global_step": 227546, "epoch": 1354} {"train_loss": -9.903148651123047, "global_step": 227547, "epoch": 1354} {"train_loss": -10.037702560424805, "global_step": 227548, "epoch": 1354} {"train_loss": -10.991976737976074, "global_step": 227549, "epoch": 1354} {"train_loss": -11.608596801757812, "global_step": 227550, "epoch": 1354} {"train_loss": -11.38532543182373, "global_step": 227551, "epoch": 1354} {"train_loss": -10.121223449707031, "global_step": 227552, "epoch": 1354} {"train_loss": -11.16592025756836, "global_step": 227553, "epoch": 1354} {"train_loss": -11.525506973266602, "global_step": 227554, "epoch": 1354} {"train_loss": -10.571038246154785, "global_step": 227555, "epoch": 1354} {"train_loss": -11.742345809936523, "global_step": 227556, "epoch": 1354} {"train_loss": -11.058883666992188, "global_step": 227557, "epoch": 1354} {"train_loss": -11.141141891479492, "global_step": 227558, "epoch": 1354} {"train_loss": -11.644314765930176, "global_step": 227559, "epoch": 1354} {"train_loss": -11.44290542602539, "global_step": 227560, "epoch": 1354} {"train_loss": -11.79223918914795, "global_step": 227561, "epoch": 1354} {"train_loss": -11.598077774047852, "global_step": 227562, "epoch": 1354} {"train_loss": -11.698657035827637, "global_step": 227563, "epoch": 1354} {"train_loss": -11.645992279052734, "global_step": 227564, "epoch": 1354} {"train_loss": -11.676292419433594, "global_step": 227565, "epoch": 1354} {"train_loss": -11.911779403686523, "global_step": 227566, "epoch": 1354} {"train_loss": -11.251791000366211, "global_step": 227567, "epoch": 1354} {"train_loss": -11.647014617919922, "global_step": 227568, "epoch": 1354} {"train_loss": -11.169971466064453, "global_step": 227569, "epoch": 1354} {"train_loss": -11.518569946289062, "global_step": 227570, "epoch": 1354} {"train_loss": -11.173599243164062, "global_step": 227571, "epoch": 1354} {"train_loss": -11.068076133728027, "global_step": 227572, "epoch": 1354} {"train_loss": -10.928780555725098, "global_step": 227573, "epoch": 1354} {"train_loss": -10.602608680725098, "global_step": 227574, "epoch": 1354} {"train_loss": -11.313980102539062, "global_step": 227575, "epoch": 1354} {"train_loss": -10.402515411376953, "global_step": 227576, "epoch": 1354} {"train_loss": -11.724146842956543, "global_step": 227577, "epoch": 1354} {"train_loss": -10.886595726013184, "global_step": 227578, "epoch": 1354} {"train_loss": -11.281110763549805, "global_step": 227579, "epoch": 1354} {"train_loss": -11.289257049560547, "global_step": 227580, "epoch": 1354} {"train_loss": -10.214241027832031, "global_step": 227581, "epoch": 1354} {"train_loss": -11.326608657836914, "global_step": 227582, "epoch": 1354} {"train_loss": -10.483366012573242, "global_step": 227583, "epoch": 1354} {"train_loss": -11.058571815490723, "global_step": 227584, "epoch": 1354} {"train_loss": -11.182906150817871, "global_step": 227585, "epoch": 1354} {"train_loss": -11.179254531860352, "global_step": 227586, "epoch": 1354} {"train_loss": -11.074974060058594, "global_step": 227587, "epoch": 1354} {"train_loss": -11.16728401184082, "global_step": 227588, "epoch": 1354} {"train_loss": -11.342512130737305, "global_step": 227589, "epoch": 1354} {"train_loss": -11.02965259552002, "global_step": 227590, "epoch": 1354} {"train_loss": -11.279775619506836, "global_step": 227591, "epoch": 1354} {"train_loss": -11.475427627563477, "global_step": 227592, "epoch": 1354} {"train_loss": -11.255239486694336, "global_step": 227593, "epoch": 1354} {"train_loss": -11.481735229492188, "global_step": 227594, "epoch": 1354} {"train_loss": -11.354066848754883, "global_step": 227595, "epoch": 1354} {"train_loss": -11.814380645751953, "global_step": 227596, "epoch": 1354} {"train_loss": -11.161283493041992, "global_step": 227597, "epoch": 1354} {"train_loss": -11.67742919921875, "global_step": 227598, "epoch": 1354} {"train_loss": -11.31894302368164, "global_step": 227599, "epoch": 1354} {"train_loss": -11.740293502807617, "global_step": 227600, "epoch": 1354} {"train_loss": -11.356146812438965, "global_step": 227601, "epoch": 1354} {"train_loss": -11.482635498046875, "global_step": 227602, "epoch": 1354} {"train_loss": -11.580302238464355, "global_step": 227603, "epoch": 1354} {"train_loss": -11.371376037597656, "global_step": 227604, "epoch": 1354} {"train_loss": -11.512772560119629, "global_step": 227605, "epoch": 1354} {"train_loss": -11.27906608581543, "global_step": 227606, "epoch": 1354} {"train_loss": -11.450754165649414, "global_step": 227607, "epoch": 1354} {"train_loss": -11.541752815246582, "global_step": 227608, "epoch": 1354} {"train_loss": -11.578407287597656, "global_step": 227609, "epoch": 1354} {"train_loss": -11.602632522583008, "global_step": 227610, "epoch": 1354} {"train_loss": -11.111942291259766, "global_step": 227611, "epoch": 1354} {"train_loss": -11.745320320129395, "global_step": 227612, "epoch": 1354} {"train_loss": -11.383918762207031, "global_step": 227613, "epoch": 1354} {"train_loss": -11.74394702911377, "global_step": 227614, "epoch": 1354} {"train_loss": -11.453775405883789, "global_step": 227615, "epoch": 1354} {"train_loss": -11.517656326293945, "global_step": 227616, "epoch": 1354} {"train_loss": -11.538432121276855, "global_step": 227617, "epoch": 1354} {"train_loss": -11.688533782958984, "global_step": 227618, "epoch": 1354} {"train_loss": -11.760348320007324, "global_step": 227619, "epoch": 1354} {"train_loss": -11.900335311889648, "global_step": 227620, "epoch": 1354} {"train_loss": -11.83634090423584, "global_step": 227621, "epoch": 1354} {"train_loss": -11.785591125488281, "global_step": 227622, "epoch": 1354} {"train_loss": -11.815876007080078, "global_step": 227623, "epoch": 1354} {"train_loss": -11.835563659667969, "global_step": 227624, "epoch": 1354} {"train_loss": -11.675378799438477, "global_step": 227625, "epoch": 1354} {"train_loss": -11.865903854370117, "global_step": 227626, "epoch": 1354} {"train_loss": -11.70028305053711, "global_step": 227627, "epoch": 1354} {"train_loss": -11.66847038269043, "global_step": 227628, "epoch": 1354} {"train_loss": -11.652870178222656, "global_step": 227629, "epoch": 1354} {"train_loss": -11.659784317016602, "global_step": 227630, "epoch": 1354} {"train_loss": -11.729482650756836, "global_step": 227631, "epoch": 1354} {"train_loss": -11.412875175476074, "global_step": 227632, "epoch": 1354} {"train_loss": -11.70635986328125, "global_step": 227633, "epoch": 1354} {"train_loss": -11.77277946472168, "global_step": 227634, "epoch": 1354} {"train_loss": -11.518102645874023, "global_step": 227635, "epoch": 1354} {"train_loss": -11.829587936401367, "global_step": 227636, "epoch": 1354} {"train_loss": -11.388543128967285, "global_step": 227637, "epoch": 1354} {"train_loss": -11.660835266113281, "global_step": 227638, "epoch": 1354} {"train_loss": -11.530508240063986, "global_step": 227639, "epoch": 1354, "val_loss": 261962.25} {"train_loss": -11.018461227416992, "global_step": 227640, "epoch": 1355} {"train_loss": -10.24081039428711, "global_step": 227641, "epoch": 1355} {"train_loss": -11.391378402709961, "global_step": 227642, "epoch": 1355} {"train_loss": -11.407682418823242, "global_step": 227643, "epoch": 1355} {"train_loss": -10.892719268798828, "global_step": 227644, "epoch": 1355} {"train_loss": -11.833501815795898, "global_step": 227645, "epoch": 1355} {"train_loss": -11.621904373168945, "global_step": 227646, "epoch": 1355} {"train_loss": -11.684615135192871, "global_step": 227647, "epoch": 1355} {"train_loss": -11.800992965698242, "global_step": 227648, "epoch": 1355} {"train_loss": -11.81252670288086, "global_step": 227649, "epoch": 1355} {"train_loss": -11.634841918945312, "global_step": 227650, "epoch": 1355} {"train_loss": -11.609079360961914, "global_step": 227651, "epoch": 1355} {"train_loss": -11.950662612915039, "global_step": 227652, "epoch": 1355} {"train_loss": -11.784652709960938, "global_step": 227653, "epoch": 1355} {"train_loss": -11.999821662902832, "global_step": 227654, "epoch": 1355} {"train_loss": -11.899421691894531, "global_step": 227655, "epoch": 1355} {"train_loss": -11.972179412841797, "global_step": 227656, "epoch": 1355} {"train_loss": -11.759057998657227, "global_step": 227657, "epoch": 1355} {"train_loss": -11.953344345092773, "global_step": 227658, "epoch": 1355} {"train_loss": -11.763044357299805, "global_step": 227659, "epoch": 1355} {"train_loss": -11.89497184753418, "global_step": 227660, "epoch": 1355} {"train_loss": -11.982257843017578, "global_step": 227661, "epoch": 1355} {"train_loss": -11.908326148986816, "global_step": 227662, "epoch": 1355} {"train_loss": -12.12850570678711, "global_step": 227663, "epoch": 1355} {"train_loss": -12.002068519592285, "global_step": 227664, "epoch": 1355} {"train_loss": -11.992354393005371, "global_step": 227665, "epoch": 1355} {"train_loss": -12.022886276245117, "global_step": 227666, "epoch": 1355} {"train_loss": -11.802026748657227, "global_step": 227667, "epoch": 1355} {"train_loss": -12.001550674438477, "global_step": 227668, "epoch": 1355} {"train_loss": -11.744486808776855, "global_step": 227669, "epoch": 1355} {"train_loss": -11.918487548828125, "global_step": 227670, "epoch": 1355} {"train_loss": -11.952507019042969, "global_step": 227671, "epoch": 1355} {"train_loss": -11.609293937683105, "global_step": 227672, "epoch": 1355} {"train_loss": -11.982828140258789, "global_step": 227673, "epoch": 1355} {"train_loss": -11.665491104125977, "global_step": 227674, "epoch": 1355} {"train_loss": -12.18217658996582, "global_step": 227675, "epoch": 1355} {"train_loss": -11.849013328552246, "global_step": 227676, "epoch": 1355} {"train_loss": -12.280716896057129, "global_step": 227677, "epoch": 1355} {"train_loss": -11.762467384338379, "global_step": 227678, "epoch": 1355} {"train_loss": -11.923221588134766, "global_step": 227679, "epoch": 1355} {"train_loss": -11.887640953063965, "global_step": 227680, "epoch": 1355} {"train_loss": -12.149636268615723, "global_step": 227681, "epoch": 1355} {"train_loss": -11.909335136413574, "global_step": 227682, "epoch": 1355} {"train_loss": -11.988557815551758, "global_step": 227683, "epoch": 1355} {"train_loss": -11.821474075317383, "global_step": 227684, "epoch": 1355} {"train_loss": -11.836418151855469, "global_step": 227685, "epoch": 1355} {"train_loss": -11.870753288269043, "global_step": 227686, "epoch": 1355} {"train_loss": -11.628914833068848, "global_step": 227687, "epoch": 1355} {"train_loss": -11.073343276977539, "global_step": 227688, "epoch": 1355} {"train_loss": -10.955720901489258, "global_step": 227689, "epoch": 1355} {"train_loss": -11.297223091125488, "global_step": 227690, "epoch": 1355} {"train_loss": -11.407623291015625, "global_step": 227691, "epoch": 1355} {"train_loss": -11.37037467956543, "global_step": 227692, "epoch": 1355} {"train_loss": -11.057188034057617, "global_step": 227693, "epoch": 1355} {"train_loss": -11.335258483886719, "global_step": 227694, "epoch": 1355} {"train_loss": -11.569494247436523, "global_step": 227695, "epoch": 1355} {"train_loss": -11.275579452514648, "global_step": 227696, "epoch": 1355} {"train_loss": -9.933178901672363, "global_step": 227697, "epoch": 1355} {"train_loss": -10.936317443847656, "global_step": 227698, "epoch": 1355} {"train_loss": -10.614065170288086, "global_step": 227699, "epoch": 1355} {"train_loss": -10.32862663269043, "global_step": 227700, "epoch": 1355} {"train_loss": -10.094411849975586, "global_step": 227701, "epoch": 1355} {"train_loss": -11.450193405151367, "global_step": 227702, "epoch": 1355} {"train_loss": -8.274663925170898, "global_step": 227703, "epoch": 1355} {"train_loss": -10.850753784179688, "global_step": 227704, "epoch": 1355} {"train_loss": -9.021903038024902, "global_step": 227705, "epoch": 1355} {"train_loss": -8.753732681274414, "global_step": 227706, "epoch": 1355} {"train_loss": -10.996604919433594, "global_step": 227707, "epoch": 1355} {"train_loss": -9.549866676330566, "global_step": 227708, "epoch": 1355} {"train_loss": -10.784116744995117, "global_step": 227709, "epoch": 1355} {"train_loss": -10.013816833496094, "global_step": 227710, "epoch": 1355} {"train_loss": -10.169200897216797, "global_step": 227711, "epoch": 1355} {"train_loss": -10.126611709594727, "global_step": 227712, "epoch": 1355} {"train_loss": -10.814104080200195, "global_step": 227713, "epoch": 1355} {"train_loss": -9.666166305541992, "global_step": 227714, "epoch": 1355} {"train_loss": -11.402966499328613, "global_step": 227715, "epoch": 1355} {"train_loss": -10.52290153503418, "global_step": 227716, "epoch": 1355} {"train_loss": -10.57115364074707, "global_step": 227717, "epoch": 1355} {"train_loss": -11.384943008422852, "global_step": 227718, "epoch": 1355} {"train_loss": -10.848063468933105, "global_step": 227719, "epoch": 1355} {"train_loss": -11.193668365478516, "global_step": 227720, "epoch": 1355} {"train_loss": -11.119129180908203, "global_step": 227721, "epoch": 1355} {"train_loss": -11.575691223144531, "global_step": 227722, "epoch": 1355} {"train_loss": -11.332931518554688, "global_step": 227723, "epoch": 1355} {"train_loss": -11.600659370422363, "global_step": 227724, "epoch": 1355} {"train_loss": -11.131784439086914, "global_step": 227725, "epoch": 1355} {"train_loss": -11.489961624145508, "global_step": 227726, "epoch": 1355} {"train_loss": -11.229791641235352, "global_step": 227727, "epoch": 1355} {"train_loss": -11.57022476196289, "global_step": 227728, "epoch": 1355} {"train_loss": -11.377276420593262, "global_step": 227729, "epoch": 1355} {"train_loss": -11.141380310058594, "global_step": 227730, "epoch": 1355} {"train_loss": -11.39956283569336, "global_step": 227731, "epoch": 1355} {"train_loss": -11.586946487426758, "global_step": 227732, "epoch": 1355} {"train_loss": -11.51510238647461, "global_step": 227733, "epoch": 1355} {"train_loss": -11.79068374633789, "global_step": 227734, "epoch": 1355} {"train_loss": -11.522851943969727, "global_step": 227735, "epoch": 1355} {"train_loss": -11.704530715942383, "global_step": 227736, "epoch": 1355} {"train_loss": -11.613301277160645, "global_step": 227737, "epoch": 1355} {"train_loss": -11.596109390258789, "global_step": 227738, "epoch": 1355} {"train_loss": -11.636096954345703, "global_step": 227739, "epoch": 1355} {"train_loss": -11.725852966308594, "global_step": 227740, "epoch": 1355} {"train_loss": -11.719627380371094, "global_step": 227741, "epoch": 1355} {"train_loss": -11.487544059753418, "global_step": 227742, "epoch": 1355} {"train_loss": -11.389328956604004, "global_step": 227743, "epoch": 1355} {"train_loss": -11.558380126953125, "global_step": 227744, "epoch": 1355} {"train_loss": -11.643150329589844, "global_step": 227745, "epoch": 1355} {"train_loss": -11.655860900878906, "global_step": 227746, "epoch": 1355} {"train_loss": -11.526312828063965, "global_step": 227747, "epoch": 1355} {"train_loss": -11.460555076599121, "global_step": 227748, "epoch": 1355} {"train_loss": -11.683235168457031, "global_step": 227749, "epoch": 1355} {"train_loss": -11.284096717834473, "global_step": 227750, "epoch": 1355} {"train_loss": -11.614439010620117, "global_step": 227751, "epoch": 1355} {"train_loss": -11.456814765930176, "global_step": 227752, "epoch": 1355} {"train_loss": -11.8868408203125, "global_step": 227753, "epoch": 1355} {"train_loss": -11.59794807434082, "global_step": 227754, "epoch": 1355} {"train_loss": -11.697166442871094, "global_step": 227755, "epoch": 1355} {"train_loss": -11.731668472290039, "global_step": 227756, "epoch": 1355} {"train_loss": -11.691104888916016, "global_step": 227757, "epoch": 1355} {"train_loss": -11.551080703735352, "global_step": 227758, "epoch": 1355} {"train_loss": -11.432790756225586, "global_step": 227759, "epoch": 1355} {"train_loss": -11.812033653259277, "global_step": 227760, "epoch": 1355} {"train_loss": -11.742241859436035, "global_step": 227761, "epoch": 1355} {"train_loss": -11.893316268920898, "global_step": 227762, "epoch": 1355} {"train_loss": -11.954303741455078, "global_step": 227763, "epoch": 1355} {"train_loss": -11.820223808288574, "global_step": 227764, "epoch": 1355} {"train_loss": -11.854425430297852, "global_step": 227765, "epoch": 1355} {"train_loss": -11.872377395629883, "global_step": 227766, "epoch": 1355} {"train_loss": -12.044305801391602, "global_step": 227767, "epoch": 1355} {"train_loss": -12.01103401184082, "global_step": 227768, "epoch": 1355} {"train_loss": -11.73497486114502, "global_step": 227769, "epoch": 1355} {"train_loss": -11.895132064819336, "global_step": 227770, "epoch": 1355} {"train_loss": -11.892375946044922, "global_step": 227771, "epoch": 1355} {"train_loss": -12.082019805908203, "global_step": 227772, "epoch": 1355} {"train_loss": -11.98807144165039, "global_step": 227773, "epoch": 1355} {"train_loss": -11.691155433654785, "global_step": 227774, "epoch": 1355} {"train_loss": -11.875093460083008, "global_step": 227775, "epoch": 1355} {"train_loss": -11.94253158569336, "global_step": 227776, "epoch": 1355} {"train_loss": -11.995823860168457, "global_step": 227777, "epoch": 1355} {"train_loss": -11.917171478271484, "global_step": 227778, "epoch": 1355} {"train_loss": -12.028570175170898, "global_step": 227779, "epoch": 1355} {"train_loss": -12.13473129272461, "global_step": 227780, "epoch": 1355} {"train_loss": -11.948624610900879, "global_step": 227781, "epoch": 1355} {"train_loss": -12.233756065368652, "global_step": 227782, "epoch": 1355} {"train_loss": -11.64829158782959, "global_step": 227783, "epoch": 1355} {"train_loss": -11.888494491577148, "global_step": 227784, "epoch": 1355} {"train_loss": -11.751460075378418, "global_step": 227785, "epoch": 1355} {"train_loss": -12.013654708862305, "global_step": 227786, "epoch": 1355} {"train_loss": -11.91118049621582, "global_step": 227787, "epoch": 1355} {"train_loss": -12.171205520629883, "global_step": 227788, "epoch": 1355} {"train_loss": -11.827903747558594, "global_step": 227789, "epoch": 1355} {"train_loss": -12.05539321899414, "global_step": 227790, "epoch": 1355} {"train_loss": -11.832043647766113, "global_step": 227791, "epoch": 1355} {"train_loss": -11.713957786560059, "global_step": 227792, "epoch": 1355} {"train_loss": -12.095393180847168, "global_step": 227793, "epoch": 1355} {"train_loss": -12.063480377197266, "global_step": 227794, "epoch": 1355} {"train_loss": -12.137687683105469, "global_step": 227795, "epoch": 1355} {"train_loss": -11.845775604248047, "global_step": 227796, "epoch": 1355} {"train_loss": -11.825304985046387, "global_step": 227797, "epoch": 1355} {"train_loss": -12.174295425415039, "global_step": 227798, "epoch": 1355} {"train_loss": -11.854425430297852, "global_step": 227799, "epoch": 1355} {"train_loss": -11.945884704589844, "global_step": 227800, "epoch": 1355} {"train_loss": -12.04789924621582, "global_step": 227801, "epoch": 1355} {"train_loss": -11.92590618133545, "global_step": 227802, "epoch": 1355} {"train_loss": -11.998157501220703, "global_step": 227803, "epoch": 1355} {"train_loss": -11.979679107666016, "global_step": 227804, "epoch": 1355} {"train_loss": -11.994049072265625, "global_step": 227805, "epoch": 1355} {"train_loss": -11.789392471313477, "global_step": 227806, "epoch": 1355} {"train_loss": -11.534558035078502, "global_step": 227807, "epoch": 1355, "val_loss": 260431.640625, "train_action_mse_error": 1.7655725479125977} {"train_loss": -11.883697509765625, "global_step": 227808, "epoch": 1356} {"train_loss": -12.082107543945312, "global_step": 227809, "epoch": 1356} {"train_loss": -12.056300163269043, "global_step": 227810, "epoch": 1356} {"train_loss": -11.387613296508789, "global_step": 227811, "epoch": 1356} {"train_loss": -11.906783103942871, "global_step": 227812, "epoch": 1356} {"train_loss": -11.598735809326172, "global_step": 227813, "epoch": 1356} {"train_loss": -10.871847152709961, "global_step": 227814, "epoch": 1356} {"train_loss": -11.043111801147461, "global_step": 227815, "epoch": 1356} {"train_loss": -11.829723358154297, "global_step": 227816, "epoch": 1356} {"train_loss": -11.023894309997559, "global_step": 227817, "epoch": 1356} {"train_loss": -9.467362403869629, "global_step": 227818, "epoch": 1356} {"train_loss": -11.53667163848877, "global_step": 227819, "epoch": 1356} {"train_loss": -11.520371437072754, "global_step": 227820, "epoch": 1356} {"train_loss": -10.017295837402344, "global_step": 227821, "epoch": 1356} {"train_loss": -11.213295936584473, "global_step": 227822, "epoch": 1356} {"train_loss": -11.29550552368164, "global_step": 227823, "epoch": 1356} {"train_loss": -10.174429893493652, "global_step": 227824, "epoch": 1356} {"train_loss": -10.478187561035156, "global_step": 227825, "epoch": 1356} {"train_loss": -11.476642608642578, "global_step": 227826, "epoch": 1356} {"train_loss": -10.126307487487793, "global_step": 227827, "epoch": 1356} {"train_loss": -10.753353118896484, "global_step": 227828, "epoch": 1356} {"train_loss": -10.68862247467041, "global_step": 227829, "epoch": 1356} {"train_loss": -10.425249099731445, "global_step": 227830, "epoch": 1356} {"train_loss": -11.710763931274414, "global_step": 227831, "epoch": 1356} {"train_loss": -10.604852676391602, "global_step": 227832, "epoch": 1356} {"train_loss": -11.23335075378418, "global_step": 227833, "epoch": 1356} {"train_loss": -11.196163177490234, "global_step": 227834, "epoch": 1356} {"train_loss": -11.329153060913086, "global_step": 227835, "epoch": 1356} {"train_loss": -10.830589294433594, "global_step": 227836, "epoch": 1356} {"train_loss": -11.191984176635742, "global_step": 227837, "epoch": 1356} {"train_loss": -10.953775405883789, "global_step": 227838, "epoch": 1356} {"train_loss": -11.293477058410645, "global_step": 227839, "epoch": 1356} {"train_loss": -10.868064880371094, "global_step": 227840, "epoch": 1356} {"train_loss": -11.304872512817383, "global_step": 227841, "epoch": 1356} {"train_loss": -11.137594223022461, "global_step": 227842, "epoch": 1356} {"train_loss": -11.398085594177246, "global_step": 227843, "epoch": 1356} {"train_loss": -10.994673728942871, "global_step": 227844, "epoch": 1356} {"train_loss": -11.257735252380371, "global_step": 227845, "epoch": 1356} {"train_loss": -11.403539657592773, "global_step": 227846, "epoch": 1356} {"train_loss": -10.853302001953125, "global_step": 227847, "epoch": 1356} {"train_loss": -10.783567428588867, "global_step": 227848, "epoch": 1356} {"train_loss": -11.194936752319336, "global_step": 227849, "epoch": 1356} {"train_loss": -11.208621978759766, "global_step": 227850, "epoch": 1356} {"train_loss": -10.879671096801758, "global_step": 227851, "epoch": 1356} {"train_loss": -11.722118377685547, "global_step": 227852, "epoch": 1356} {"train_loss": -11.117624282836914, "global_step": 227853, "epoch": 1356} {"train_loss": -11.09569263458252, "global_step": 227854, "epoch": 1356} {"train_loss": -11.298019409179688, "global_step": 227855, "epoch": 1356} {"train_loss": -11.062644958496094, "global_step": 227856, "epoch": 1356} {"train_loss": -11.676076889038086, "global_step": 227857, "epoch": 1356} {"train_loss": -11.274452209472656, "global_step": 227858, "epoch": 1356} {"train_loss": -11.780900955200195, "global_step": 227859, "epoch": 1356} {"train_loss": -11.23123836517334, "global_step": 227860, "epoch": 1356} {"train_loss": -11.448147773742676, "global_step": 227861, "epoch": 1356} {"train_loss": -11.099918365478516, "global_step": 227862, "epoch": 1356} {"train_loss": -11.346476554870605, "global_step": 227863, "epoch": 1356} {"train_loss": -11.375327110290527, "global_step": 227864, "epoch": 1356} {"train_loss": -11.290618896484375, "global_step": 227865, "epoch": 1356} {"train_loss": -11.290271759033203, "global_step": 227866, "epoch": 1356} {"train_loss": -11.293779373168945, "global_step": 227867, "epoch": 1356} {"train_loss": -11.478715896606445, "global_step": 227868, "epoch": 1356} {"train_loss": -11.65313720703125, "global_step": 227869, "epoch": 1356} {"train_loss": -11.673639297485352, "global_step": 227870, "epoch": 1356} {"train_loss": -11.610296249389648, "global_step": 227871, "epoch": 1356} {"train_loss": -11.748086929321289, "global_step": 227872, "epoch": 1356} {"train_loss": -11.308563232421875, "global_step": 227873, "epoch": 1356} {"train_loss": -11.52553653717041, "global_step": 227874, "epoch": 1356} {"train_loss": -11.408859252929688, "global_step": 227875, "epoch": 1356} {"train_loss": -11.462616920471191, "global_step": 227876, "epoch": 1356} {"train_loss": -11.668839454650879, "global_step": 227877, "epoch": 1356} {"train_loss": -11.531436920166016, "global_step": 227878, "epoch": 1356} {"train_loss": -11.693464279174805, "global_step": 227879, "epoch": 1356} {"train_loss": -11.322423934936523, "global_step": 227880, "epoch": 1356} {"train_loss": -11.683649063110352, "global_step": 227881, "epoch": 1356} {"train_loss": -11.457342147827148, "global_step": 227882, "epoch": 1356} {"train_loss": -11.621018409729004, "global_step": 227883, "epoch": 1356} {"train_loss": -11.850971221923828, "global_step": 227884, "epoch": 1356} {"train_loss": -11.133207321166992, "global_step": 227885, "epoch": 1356} {"train_loss": -11.491264343261719, "global_step": 227886, "epoch": 1356} {"train_loss": -11.15896224975586, "global_step": 227887, "epoch": 1356} {"train_loss": -11.67397689819336, "global_step": 227888, "epoch": 1356} {"train_loss": -11.395252227783203, "global_step": 227889, "epoch": 1356} {"train_loss": -11.153844833374023, "global_step": 227890, "epoch": 1356} {"train_loss": -11.381669044494629, "global_step": 227891, "epoch": 1356} {"train_loss": -11.420036315917969, "global_step": 227892, "epoch": 1356} {"train_loss": -11.506509780883789, "global_step": 227893, "epoch": 1356} {"train_loss": -11.357952117919922, "global_step": 227894, "epoch": 1356} {"train_loss": -11.542344093322754, "global_step": 227895, "epoch": 1356} {"train_loss": -11.367996215820312, "global_step": 227896, "epoch": 1356} {"train_loss": -11.91882038116455, "global_step": 227897, "epoch": 1356} {"train_loss": -11.393993377685547, "global_step": 227898, "epoch": 1356} {"train_loss": -11.60712718963623, "global_step": 227899, "epoch": 1356} {"train_loss": -11.549028396606445, "global_step": 227900, "epoch": 1356} {"train_loss": -11.783393859863281, "global_step": 227901, "epoch": 1356} {"train_loss": -11.84859848022461, "global_step": 227902, "epoch": 1356} {"train_loss": -11.587940216064453, "global_step": 227903, "epoch": 1356} {"train_loss": -11.574773788452148, "global_step": 227904, "epoch": 1356} {"train_loss": -11.651451110839844, "global_step": 227905, "epoch": 1356} {"train_loss": -11.654541015625, "global_step": 227906, "epoch": 1356} {"train_loss": -12.00454330444336, "global_step": 227907, "epoch": 1356} {"train_loss": -11.504375457763672, "global_step": 227908, "epoch": 1356} {"train_loss": -11.678378105163574, "global_step": 227909, "epoch": 1356} {"train_loss": -11.684748649597168, "global_step": 227910, "epoch": 1356} {"train_loss": -11.564536094665527, "global_step": 227911, "epoch": 1356} {"train_loss": -11.829170227050781, "global_step": 227912, "epoch": 1356} {"train_loss": -11.50502872467041, "global_step": 227913, "epoch": 1356} {"train_loss": -11.795589447021484, "global_step": 227914, "epoch": 1356} {"train_loss": -11.564403533935547, "global_step": 227915, "epoch": 1356} {"train_loss": -11.573064804077148, "global_step": 227916, "epoch": 1356} {"train_loss": -11.656203269958496, "global_step": 227917, "epoch": 1356} {"train_loss": -11.87161636352539, "global_step": 227918, "epoch": 1356} {"train_loss": -11.837785720825195, "global_step": 227919, "epoch": 1356} {"train_loss": -11.779850006103516, "global_step": 227920, "epoch": 1356} {"train_loss": -11.312604904174805, "global_step": 227921, "epoch": 1356} {"train_loss": -11.60693359375, "global_step": 227922, "epoch": 1356} {"train_loss": -12.009162902832031, "global_step": 227923, "epoch": 1356} {"train_loss": -11.869162559509277, "global_step": 227924, "epoch": 1356} {"train_loss": -11.96347427368164, "global_step": 227925, "epoch": 1356} {"train_loss": -11.794818878173828, "global_step": 227926, "epoch": 1356} {"train_loss": -11.929502487182617, "global_step": 227927, "epoch": 1356} {"train_loss": -12.12861156463623, "global_step": 227928, "epoch": 1356} {"train_loss": -12.021781921386719, "global_step": 227929, "epoch": 1356} {"train_loss": -11.90993881225586, "global_step": 227930, "epoch": 1356} {"train_loss": -12.015335083007812, "global_step": 227931, "epoch": 1356} {"train_loss": -12.250685691833496, "global_step": 227932, "epoch": 1356} {"train_loss": -12.06796646118164, "global_step": 227933, "epoch": 1356} {"train_loss": -11.85519790649414, "global_step": 227934, "epoch": 1356} {"train_loss": -11.92381477355957, "global_step": 227935, "epoch": 1356} {"train_loss": -11.934276580810547, "global_step": 227936, "epoch": 1356} {"train_loss": -12.051321029663086, "global_step": 227937, "epoch": 1356} {"train_loss": -11.92487621307373, "global_step": 227938, "epoch": 1356} {"train_loss": -11.713003158569336, "global_step": 227939, "epoch": 1356} {"train_loss": -11.8500337600708, "global_step": 227940, "epoch": 1356} {"train_loss": -12.028999328613281, "global_step": 227941, "epoch": 1356} {"train_loss": -11.76840877532959, "global_step": 227942, "epoch": 1356} {"train_loss": -11.795185089111328, "global_step": 227943, "epoch": 1356} {"train_loss": -11.739481925964355, "global_step": 227944, "epoch": 1356} {"train_loss": -11.316218376159668, "global_step": 227945, "epoch": 1356} {"train_loss": -11.037431716918945, "global_step": 227946, "epoch": 1356} {"train_loss": -11.192737579345703, "global_step": 227947, "epoch": 1356} {"train_loss": -11.790471076965332, "global_step": 227948, "epoch": 1356} {"train_loss": -10.57861614227295, "global_step": 227949, "epoch": 1356} {"train_loss": -11.77955436706543, "global_step": 227950, "epoch": 1356} {"train_loss": -11.202131271362305, "global_step": 227951, "epoch": 1356} {"train_loss": -9.58502197265625, "global_step": 227952, "epoch": 1356} {"train_loss": -11.547111511230469, "global_step": 227953, "epoch": 1356} {"train_loss": -10.914791107177734, "global_step": 227954, "epoch": 1356} {"train_loss": -10.39659595489502, "global_step": 227955, "epoch": 1356} {"train_loss": -11.28363037109375, "global_step": 227956, "epoch": 1356} {"train_loss": -11.063940048217773, "global_step": 227957, "epoch": 1356} {"train_loss": -9.641014099121094, "global_step": 227958, "epoch": 1356} {"train_loss": -11.252219200134277, "global_step": 227959, "epoch": 1356} {"train_loss": -10.308208465576172, "global_step": 227960, "epoch": 1356} {"train_loss": -10.254409790039062, "global_step": 227961, "epoch": 1356} {"train_loss": -11.267485618591309, "global_step": 227962, "epoch": 1356} {"train_loss": -9.90321159362793, "global_step": 227963, "epoch": 1356} {"train_loss": -11.195366859436035, "global_step": 227964, "epoch": 1356} {"train_loss": -11.04964828491211, "global_step": 227965, "epoch": 1356} {"train_loss": -11.095069885253906, "global_step": 227966, "epoch": 1356} {"train_loss": -11.290679931640625, "global_step": 227967, "epoch": 1356} {"train_loss": -10.909406661987305, "global_step": 227968, "epoch": 1356} {"train_loss": -10.705114364624023, "global_step": 227969, "epoch": 1356} {"train_loss": -11.004941940307617, "global_step": 227970, "epoch": 1356} {"train_loss": -10.332236289978027, "global_step": 227971, "epoch": 1356} {"train_loss": -10.506762504577637, "global_step": 227972, "epoch": 1356} {"train_loss": -9.145965576171875, "global_step": 227973, "epoch": 1356} {"train_loss": -9.604248046875, "global_step": 227974, "epoch": 1356} {"train_loss": -11.320640683174133, "global_step": 227975, "epoch": 1356, "val_loss": 263212.03125} {"train_loss": -10.235211372375488, "global_step": 227976, "epoch": 1357} {"train_loss": -8.391263008117676, "global_step": 227977, "epoch": 1357} {"train_loss": -8.222332000732422, "global_step": 227978, "epoch": 1357} {"train_loss": -9.323575973510742, "global_step": 227979, "epoch": 1357} {"train_loss": -9.811742782592773, "global_step": 227980, "epoch": 1357} {"train_loss": -9.598053932189941, "global_step": 227981, "epoch": 1357} {"train_loss": -10.146928787231445, "global_step": 227982, "epoch": 1357} {"train_loss": -9.722261428833008, "global_step": 227983, "epoch": 1357} {"train_loss": -10.044294357299805, "global_step": 227984, "epoch": 1357} {"train_loss": -11.207395553588867, "global_step": 227985, "epoch": 1357} {"train_loss": -10.325967788696289, "global_step": 227986, "epoch": 1357} {"train_loss": -9.580924987792969, "global_step": 227987, "epoch": 1357} {"train_loss": -10.172689437866211, "global_step": 227988, "epoch": 1357} {"train_loss": -10.460922241210938, "global_step": 227989, "epoch": 1357} {"train_loss": -9.67473030090332, "global_step": 227990, "epoch": 1357} {"train_loss": -10.521475791931152, "global_step": 227991, "epoch": 1357} {"train_loss": -11.080456733703613, "global_step": 227992, "epoch": 1357} {"train_loss": -10.515613555908203, "global_step": 227993, "epoch": 1357} {"train_loss": -10.663540840148926, "global_step": 227994, "epoch": 1357} {"train_loss": -11.009923934936523, "global_step": 227995, "epoch": 1357} {"train_loss": -10.761553764343262, "global_step": 227996, "epoch": 1357} {"train_loss": -10.329825401306152, "global_step": 227997, "epoch": 1357} {"train_loss": -10.83202075958252, "global_step": 227998, "epoch": 1357} {"train_loss": -11.036745071411133, "global_step": 227999, "epoch": 1357} {"train_loss": -11.053923606872559, "global_step": 228000, "epoch": 1357} {"train_loss": -10.892009735107422, "global_step": 228001, "epoch": 1357} {"train_loss": -11.311981201171875, "global_step": 228002, "epoch": 1357} {"train_loss": -11.275936126708984, "global_step": 228003, "epoch": 1357} {"train_loss": -11.09205436706543, "global_step": 228004, "epoch": 1357} {"train_loss": -11.138148307800293, "global_step": 228005, "epoch": 1357} {"train_loss": -11.355634689331055, "global_step": 228006, "epoch": 1357} {"train_loss": -11.48210620880127, "global_step": 228007, "epoch": 1357} {"train_loss": -11.498320579528809, "global_step": 228008, "epoch": 1357} {"train_loss": -11.40005111694336, "global_step": 228009, "epoch": 1357} {"train_loss": -11.640698432922363, "global_step": 228010, "epoch": 1357} {"train_loss": -11.62033462524414, "global_step": 228011, "epoch": 1357} {"train_loss": -11.565862655639648, "global_step": 228012, "epoch": 1357} {"train_loss": -11.22817325592041, "global_step": 228013, "epoch": 1357} {"train_loss": -11.474371910095215, "global_step": 228014, "epoch": 1357} {"train_loss": -11.552552223205566, "global_step": 228015, "epoch": 1357} {"train_loss": -11.503681182861328, "global_step": 228016, "epoch": 1357} {"train_loss": -11.422548294067383, "global_step": 228017, "epoch": 1357} {"train_loss": -11.377055168151855, "global_step": 228018, "epoch": 1357} {"train_loss": -11.43494701385498, "global_step": 228019, "epoch": 1357} {"train_loss": -11.570792198181152, "global_step": 228020, "epoch": 1357} {"train_loss": -11.575878143310547, "global_step": 228021, "epoch": 1357} {"train_loss": -11.72875690460205, "global_step": 228022, "epoch": 1357} {"train_loss": -11.273860931396484, "global_step": 228023, "epoch": 1357} {"train_loss": -11.559223175048828, "global_step": 228024, "epoch": 1357} {"train_loss": -11.456750869750977, "global_step": 228025, "epoch": 1357} {"train_loss": -11.53693962097168, "global_step": 228026, "epoch": 1357} {"train_loss": -11.691417694091797, "global_step": 228027, "epoch": 1357} {"train_loss": -11.641326904296875, "global_step": 228028, "epoch": 1357} {"train_loss": -11.441184043884277, "global_step": 228029, "epoch": 1357} {"train_loss": -11.797686576843262, "global_step": 228030, "epoch": 1357} {"train_loss": -11.518787384033203, "global_step": 228031, "epoch": 1357} {"train_loss": -11.587020874023438, "global_step": 228032, "epoch": 1357} {"train_loss": -11.533631324768066, "global_step": 228033, "epoch": 1357} {"train_loss": -11.825841903686523, "global_step": 228034, "epoch": 1357} {"train_loss": -11.72562313079834, "global_step": 228035, "epoch": 1357} {"train_loss": -11.74262809753418, "global_step": 228036, "epoch": 1357} {"train_loss": -11.669979095458984, "global_step": 228037, "epoch": 1357} {"train_loss": -11.86651611328125, "global_step": 228038, "epoch": 1357} {"train_loss": -11.807205200195312, "global_step": 228039, "epoch": 1357} {"train_loss": -11.686077117919922, "global_step": 228040, "epoch": 1357} {"train_loss": -11.784017562866211, "global_step": 228041, "epoch": 1357} {"train_loss": -11.845170974731445, "global_step": 228042, "epoch": 1357} {"train_loss": -11.352983474731445, "global_step": 228043, "epoch": 1357} {"train_loss": -11.628376007080078, "global_step": 228044, "epoch": 1357} {"train_loss": -11.197043418884277, "global_step": 228045, "epoch": 1357} {"train_loss": -10.850621223449707, "global_step": 228046, "epoch": 1357} {"train_loss": -11.727059364318848, "global_step": 228047, "epoch": 1357} {"train_loss": -10.92324447631836, "global_step": 228048, "epoch": 1357} {"train_loss": -11.646061897277832, "global_step": 228049, "epoch": 1357} {"train_loss": -11.280119895935059, "global_step": 228050, "epoch": 1357} {"train_loss": -11.175763130187988, "global_step": 228051, "epoch": 1357} {"train_loss": -11.536702156066895, "global_step": 228052, "epoch": 1357} {"train_loss": -11.093544960021973, "global_step": 228053, "epoch": 1357} {"train_loss": -11.558859825134277, "global_step": 228054, "epoch": 1357} {"train_loss": -11.203914642333984, "global_step": 228055, "epoch": 1357} {"train_loss": -11.710111618041992, "global_step": 228056, "epoch": 1357} {"train_loss": -11.343454360961914, "global_step": 228057, "epoch": 1357} {"train_loss": -10.86958122253418, "global_step": 228058, "epoch": 1357} {"train_loss": -11.48417854309082, "global_step": 228059, "epoch": 1357} {"train_loss": -11.312698364257812, "global_step": 228060, "epoch": 1357} {"train_loss": -11.680794715881348, "global_step": 228061, "epoch": 1357} {"train_loss": -11.373462677001953, "global_step": 228062, "epoch": 1357} {"train_loss": -11.661166191101074, "global_step": 228063, "epoch": 1357} {"train_loss": -11.365201950073242, "global_step": 228064, "epoch": 1357} {"train_loss": -11.152939796447754, "global_step": 228065, "epoch": 1357} {"train_loss": -11.70965576171875, "global_step": 228066, "epoch": 1357} {"train_loss": -11.196210861206055, "global_step": 228067, "epoch": 1357} {"train_loss": -11.745437622070312, "global_step": 228068, "epoch": 1357} {"train_loss": -11.142473220825195, "global_step": 228069, "epoch": 1357} {"train_loss": -11.668237686157227, "global_step": 228070, "epoch": 1357} {"train_loss": -11.227682113647461, "global_step": 228071, "epoch": 1357} {"train_loss": -11.663265228271484, "global_step": 228072, "epoch": 1357} {"train_loss": -11.340998649597168, "global_step": 228073, "epoch": 1357} {"train_loss": -11.362319946289062, "global_step": 228074, "epoch": 1357} {"train_loss": -11.734895706176758, "global_step": 228075, "epoch": 1357} {"train_loss": -11.591337203979492, "global_step": 228076, "epoch": 1357} {"train_loss": -11.820910453796387, "global_step": 228077, "epoch": 1357} {"train_loss": -11.760796546936035, "global_step": 228078, "epoch": 1357} {"train_loss": -11.507311820983887, "global_step": 228079, "epoch": 1357} {"train_loss": -11.562711715698242, "global_step": 228080, "epoch": 1357} {"train_loss": -11.773735046386719, "global_step": 228081, "epoch": 1357} {"train_loss": -11.742084503173828, "global_step": 228082, "epoch": 1357} {"train_loss": -11.649490356445312, "global_step": 228083, "epoch": 1357} {"train_loss": -11.596935272216797, "global_step": 228084, "epoch": 1357} {"train_loss": -11.524711608886719, "global_step": 228085, "epoch": 1357} {"train_loss": -11.417274475097656, "global_step": 228086, "epoch": 1357} {"train_loss": -11.583709716796875, "global_step": 228087, "epoch": 1357} {"train_loss": -11.662883758544922, "global_step": 228088, "epoch": 1357} {"train_loss": -11.734136581420898, "global_step": 228089, "epoch": 1357} {"train_loss": -11.810535430908203, "global_step": 228090, "epoch": 1357} {"train_loss": -11.325960159301758, "global_step": 228091, "epoch": 1357} {"train_loss": -11.638741493225098, "global_step": 228092, "epoch": 1357} {"train_loss": -11.435014724731445, "global_step": 228093, "epoch": 1357} {"train_loss": -11.791847229003906, "global_step": 228094, "epoch": 1357} {"train_loss": -11.388588905334473, "global_step": 228095, "epoch": 1357} {"train_loss": -11.478403091430664, "global_step": 228096, "epoch": 1357} {"train_loss": -11.764495849609375, "global_step": 228097, "epoch": 1357} {"train_loss": -11.110442161560059, "global_step": 228098, "epoch": 1357} {"train_loss": -11.753366470336914, "global_step": 228099, "epoch": 1357} {"train_loss": -11.516216278076172, "global_step": 228100, "epoch": 1357} {"train_loss": -11.277284622192383, "global_step": 228101, "epoch": 1357} {"train_loss": -11.865306854248047, "global_step": 228102, "epoch": 1357} {"train_loss": -11.257375717163086, "global_step": 228103, "epoch": 1357} {"train_loss": -11.486116409301758, "global_step": 228104, "epoch": 1357} {"train_loss": -11.314971923828125, "global_step": 228105, "epoch": 1357} {"train_loss": -11.855348587036133, "global_step": 228106, "epoch": 1357} {"train_loss": -11.147542953491211, "global_step": 228107, "epoch": 1357} {"train_loss": -11.73044204711914, "global_step": 228108, "epoch": 1357} {"train_loss": -11.586050987243652, "global_step": 228109, "epoch": 1357} {"train_loss": -11.862297058105469, "global_step": 228110, "epoch": 1357} {"train_loss": -11.432476997375488, "global_step": 228111, "epoch": 1357} {"train_loss": -11.743169784545898, "global_step": 228112, "epoch": 1357} {"train_loss": -12.032922744750977, "global_step": 228113, "epoch": 1357} {"train_loss": -11.386383056640625, "global_step": 228114, "epoch": 1357} {"train_loss": -11.654632568359375, "global_step": 228115, "epoch": 1357} {"train_loss": -11.64858627319336, "global_step": 228116, "epoch": 1357} {"train_loss": -11.971805572509766, "global_step": 228117, "epoch": 1357} {"train_loss": -11.586761474609375, "global_step": 228118, "epoch": 1357} {"train_loss": -11.839856147766113, "global_step": 228119, "epoch": 1357} {"train_loss": -12.127754211425781, "global_step": 228120, "epoch": 1357} {"train_loss": -11.850980758666992, "global_step": 228121, "epoch": 1357} {"train_loss": -11.749702453613281, "global_step": 228122, "epoch": 1357} {"train_loss": -11.895909309387207, "global_step": 228123, "epoch": 1357} {"train_loss": -11.700082778930664, "global_step": 228124, "epoch": 1357} {"train_loss": -11.905660629272461, "global_step": 228125, "epoch": 1357} {"train_loss": -11.585105895996094, "global_step": 228126, "epoch": 1357} {"train_loss": -11.886899948120117, "global_step": 228127, "epoch": 1357} {"train_loss": -11.826922416687012, "global_step": 228128, "epoch": 1357} {"train_loss": -11.534473419189453, "global_step": 228129, "epoch": 1357} {"train_loss": -11.895759582519531, "global_step": 228130, "epoch": 1357} {"train_loss": -11.855642318725586, "global_step": 228131, "epoch": 1357} {"train_loss": -11.795122146606445, "global_step": 228132, "epoch": 1357} {"train_loss": -11.84526538848877, "global_step": 228133, "epoch": 1357} {"train_loss": -12.051433563232422, "global_step": 228134, "epoch": 1357} {"train_loss": -11.478921890258789, "global_step": 228135, "epoch": 1357} {"train_loss": -10.279972076416016, "global_step": 228136, "epoch": 1357} {"train_loss": -10.993337631225586, "global_step": 228137, "epoch": 1357} {"train_loss": -11.440656661987305, "global_step": 228138, "epoch": 1357} {"train_loss": -11.368839263916016, "global_step": 228139, "epoch": 1357} {"train_loss": -11.362144470214844, "global_step": 228140, "epoch": 1357} {"train_loss": -11.607495307922363, "global_step": 228141, "epoch": 1357} {"train_loss": -11.298924446105957, "global_step": 228142, "epoch": 1357} {"train_loss": -11.336506678944541, "global_step": 228143, "epoch": 1357, "val_loss": 264777.1875} {"train_loss": -11.513036727905273, "global_step": 228144, "epoch": 1358} {"train_loss": -11.61145305633545, "global_step": 228145, "epoch": 1358} {"train_loss": -11.947981834411621, "global_step": 228146, "epoch": 1358} {"train_loss": -11.520550727844238, "global_step": 228147, "epoch": 1358} {"train_loss": -11.88404655456543, "global_step": 228148, "epoch": 1358} {"train_loss": -11.812719345092773, "global_step": 228149, "epoch": 1358} {"train_loss": -11.908241271972656, "global_step": 228150, "epoch": 1358} {"train_loss": -11.644689559936523, "global_step": 228151, "epoch": 1358} {"train_loss": -11.822391510009766, "global_step": 228152, "epoch": 1358} {"train_loss": -11.599544525146484, "global_step": 228153, "epoch": 1358} {"train_loss": -11.654133796691895, "global_step": 228154, "epoch": 1358} {"train_loss": -11.930452346801758, "global_step": 228155, "epoch": 1358} {"train_loss": -11.815255165100098, "global_step": 228156, "epoch": 1358} {"train_loss": -11.826398849487305, "global_step": 228157, "epoch": 1358} {"train_loss": -11.997358322143555, "global_step": 228158, "epoch": 1358} {"train_loss": -11.663134574890137, "global_step": 228159, "epoch": 1358} {"train_loss": -11.750923156738281, "global_step": 228160, "epoch": 1358} {"train_loss": -11.581979751586914, "global_step": 228161, "epoch": 1358} {"train_loss": -11.720357894897461, "global_step": 228162, "epoch": 1358} {"train_loss": -12.062663078308105, "global_step": 228163, "epoch": 1358} {"train_loss": -11.869264602661133, "global_step": 228164, "epoch": 1358} {"train_loss": -11.936840057373047, "global_step": 228165, "epoch": 1358} {"train_loss": -12.062431335449219, "global_step": 228166, "epoch": 1358} {"train_loss": -12.008649826049805, "global_step": 228167, "epoch": 1358} {"train_loss": -11.998170852661133, "global_step": 228168, "epoch": 1358} {"train_loss": -11.909988403320312, "global_step": 228169, "epoch": 1358} {"train_loss": -11.944364547729492, "global_step": 228170, "epoch": 1358} {"train_loss": -11.995468139648438, "global_step": 228171, "epoch": 1358} {"train_loss": -11.838558197021484, "global_step": 228172, "epoch": 1358} {"train_loss": -11.727895736694336, "global_step": 228173, "epoch": 1358} {"train_loss": -11.838558197021484, "global_step": 228174, "epoch": 1358} {"train_loss": -11.945723533630371, "global_step": 228175, "epoch": 1358} {"train_loss": -11.868844985961914, "global_step": 228176, "epoch": 1358} {"train_loss": -11.87742805480957, "global_step": 228177, "epoch": 1358} {"train_loss": -11.728240013122559, "global_step": 228178, "epoch": 1358} {"train_loss": -11.347803115844727, "global_step": 228179, "epoch": 1358} {"train_loss": -10.675762176513672, "global_step": 228180, "epoch": 1358} {"train_loss": -11.290657997131348, "global_step": 228181, "epoch": 1358} {"train_loss": -10.756101608276367, "global_step": 228182, "epoch": 1358} {"train_loss": -10.348060607910156, "global_step": 228183, "epoch": 1358} {"train_loss": -11.534152030944824, "global_step": 228184, "epoch": 1358} {"train_loss": -11.184213638305664, "global_step": 228185, "epoch": 1358} {"train_loss": -11.101346969604492, "global_step": 228186, "epoch": 1358} {"train_loss": -11.32737922668457, "global_step": 228187, "epoch": 1358} {"train_loss": -11.547362327575684, "global_step": 228188, "epoch": 1358} {"train_loss": -11.430273056030273, "global_step": 228189, "epoch": 1358} {"train_loss": -11.649574279785156, "global_step": 228190, "epoch": 1358} {"train_loss": -11.285787582397461, "global_step": 228191, "epoch": 1358} {"train_loss": -10.838990211486816, "global_step": 228192, "epoch": 1358} {"train_loss": -11.560176849365234, "global_step": 228193, "epoch": 1358} {"train_loss": -11.152374267578125, "global_step": 228194, "epoch": 1358} {"train_loss": -10.847116470336914, "global_step": 228195, "epoch": 1358} {"train_loss": -11.574420928955078, "global_step": 228196, "epoch": 1358} {"train_loss": -11.160141944885254, "global_step": 228197, "epoch": 1358} {"train_loss": -11.250864028930664, "global_step": 228198, "epoch": 1358} {"train_loss": -11.898307800292969, "global_step": 228199, "epoch": 1358} {"train_loss": -11.050178527832031, "global_step": 228200, "epoch": 1358} {"train_loss": -11.598136901855469, "global_step": 228201, "epoch": 1358} {"train_loss": -11.469877243041992, "global_step": 228202, "epoch": 1358} {"train_loss": -11.24365520477295, "global_step": 228203, "epoch": 1358} {"train_loss": -11.835803985595703, "global_step": 228204, "epoch": 1358} {"train_loss": -10.665932655334473, "global_step": 228205, "epoch": 1358} {"train_loss": -11.22957992553711, "global_step": 228206, "epoch": 1358} {"train_loss": -11.571267127990723, "global_step": 228207, "epoch": 1358} {"train_loss": -11.695402145385742, "global_step": 228208, "epoch": 1358} {"train_loss": -11.765218734741211, "global_step": 228209, "epoch": 1358} {"train_loss": -11.249940872192383, "global_step": 228210, "epoch": 1358} {"train_loss": -11.485406875610352, "global_step": 228211, "epoch": 1358} {"train_loss": -11.697250366210938, "global_step": 228212, "epoch": 1358} {"train_loss": -11.526654243469238, "global_step": 228213, "epoch": 1358} {"train_loss": -11.558201789855957, "global_step": 228214, "epoch": 1358} {"train_loss": -11.778116226196289, "global_step": 228215, "epoch": 1358} {"train_loss": -11.556081771850586, "global_step": 228216, "epoch": 1358} {"train_loss": -11.656669616699219, "global_step": 228217, "epoch": 1358} {"train_loss": -11.831947326660156, "global_step": 228218, "epoch": 1358} {"train_loss": -11.643453598022461, "global_step": 228219, "epoch": 1358} {"train_loss": -11.578880310058594, "global_step": 228220, "epoch": 1358} {"train_loss": -11.884174346923828, "global_step": 228221, "epoch": 1358} {"train_loss": -11.721996307373047, "global_step": 228222, "epoch": 1358} {"train_loss": -11.844614028930664, "global_step": 228223, "epoch": 1358} {"train_loss": -11.218077659606934, "global_step": 228224, "epoch": 1358} {"train_loss": -11.814191818237305, "global_step": 228225, "epoch": 1358} {"train_loss": -11.924751281738281, "global_step": 228226, "epoch": 1358} {"train_loss": -11.743896484375, "global_step": 228227, "epoch": 1358} {"train_loss": -11.595035552978516, "global_step": 228228, "epoch": 1358} {"train_loss": -11.813758850097656, "global_step": 228229, "epoch": 1358} {"train_loss": -11.872119903564453, "global_step": 228230, "epoch": 1358} {"train_loss": -11.465616226196289, "global_step": 228231, "epoch": 1358} {"train_loss": -11.818239212036133, "global_step": 228232, "epoch": 1358} {"train_loss": -11.645940780639648, "global_step": 228233, "epoch": 1358} {"train_loss": -10.974802017211914, "global_step": 228234, "epoch": 1358} {"train_loss": -11.911619186401367, "global_step": 228235, "epoch": 1358} {"train_loss": -11.617693901062012, "global_step": 228236, "epoch": 1358} {"train_loss": -11.838722229003906, "global_step": 228237, "epoch": 1358} {"train_loss": -11.485595703125, "global_step": 228238, "epoch": 1358} {"train_loss": -11.162450790405273, "global_step": 228239, "epoch": 1358} {"train_loss": -11.31423282623291, "global_step": 228240, "epoch": 1358} {"train_loss": -11.301523208618164, "global_step": 228241, "epoch": 1358} {"train_loss": -10.552083969116211, "global_step": 228242, "epoch": 1358} {"train_loss": -11.564709663391113, "global_step": 228243, "epoch": 1358} {"train_loss": -11.205423355102539, "global_step": 228244, "epoch": 1358} {"train_loss": -10.514381408691406, "global_step": 228245, "epoch": 1358} {"train_loss": -10.896032333374023, "global_step": 228246, "epoch": 1358} {"train_loss": -10.28305721282959, "global_step": 228247, "epoch": 1358} {"train_loss": -10.992170333862305, "global_step": 228248, "epoch": 1358} {"train_loss": -10.82543659210205, "global_step": 228249, "epoch": 1358} {"train_loss": -10.173542976379395, "global_step": 228250, "epoch": 1358} {"train_loss": -9.842994689941406, "global_step": 228251, "epoch": 1358} {"train_loss": -10.966181755065918, "global_step": 228252, "epoch": 1358} {"train_loss": -10.03674602508545, "global_step": 228253, "epoch": 1358} {"train_loss": -10.566913604736328, "global_step": 228254, "epoch": 1358} {"train_loss": -10.491878509521484, "global_step": 228255, "epoch": 1358} {"train_loss": -10.655723571777344, "global_step": 228256, "epoch": 1358} {"train_loss": -10.15707778930664, "global_step": 228257, "epoch": 1358} {"train_loss": -10.865717887878418, "global_step": 228258, "epoch": 1358} {"train_loss": -10.834951400756836, "global_step": 228259, "epoch": 1358} {"train_loss": -11.084394454956055, "global_step": 228260, "epoch": 1358} {"train_loss": -10.957797050476074, "global_step": 228261, "epoch": 1358} {"train_loss": -10.219200134277344, "global_step": 228262, "epoch": 1358} {"train_loss": -10.347360610961914, "global_step": 228263, "epoch": 1358} {"train_loss": -10.564857482910156, "global_step": 228264, "epoch": 1358} {"train_loss": -9.25422477722168, "global_step": 228265, "epoch": 1358} {"train_loss": -10.797115325927734, "global_step": 228266, "epoch": 1358} {"train_loss": -9.914275169372559, "global_step": 228267, "epoch": 1358} {"train_loss": -10.630977630615234, "global_step": 228268, "epoch": 1358} {"train_loss": -10.281495094299316, "global_step": 228269, "epoch": 1358} {"train_loss": -11.006916046142578, "global_step": 228270, "epoch": 1358} {"train_loss": -10.477025985717773, "global_step": 228271, "epoch": 1358} {"train_loss": -10.931519508361816, "global_step": 228272, "epoch": 1358} {"train_loss": -11.062643051147461, "global_step": 228273, "epoch": 1358} {"train_loss": -11.226009368896484, "global_step": 228274, "epoch": 1358} {"train_loss": -11.01756477355957, "global_step": 228275, "epoch": 1358} {"train_loss": -11.34524154663086, "global_step": 228276, "epoch": 1358} {"train_loss": -10.853912353515625, "global_step": 228277, "epoch": 1358} {"train_loss": -11.25505256652832, "global_step": 228278, "epoch": 1358} {"train_loss": -10.986403465270996, "global_step": 228279, "epoch": 1358} {"train_loss": -11.311978340148926, "global_step": 228280, "epoch": 1358} {"train_loss": -10.839003562927246, "global_step": 228281, "epoch": 1358} {"train_loss": -11.218523025512695, "global_step": 228282, "epoch": 1358} {"train_loss": -10.875907897949219, "global_step": 228283, "epoch": 1358} {"train_loss": -11.166011810302734, "global_step": 228284, "epoch": 1358} {"train_loss": -10.908597946166992, "global_step": 228285, "epoch": 1358} {"train_loss": -10.454925537109375, "global_step": 228286, "epoch": 1358} {"train_loss": -11.411789894104004, "global_step": 228287, "epoch": 1358} {"train_loss": -10.626794815063477, "global_step": 228288, "epoch": 1358} {"train_loss": -11.213515281677246, "global_step": 228289, "epoch": 1358} {"train_loss": -11.352422714233398, "global_step": 228290, "epoch": 1358} {"train_loss": -11.391300201416016, "global_step": 228291, "epoch": 1358} {"train_loss": -11.069390296936035, "global_step": 228292, "epoch": 1358} {"train_loss": -11.552713394165039, "global_step": 228293, "epoch": 1358} {"train_loss": -10.907434463500977, "global_step": 228294, "epoch": 1358} {"train_loss": -11.52349853515625, "global_step": 228295, "epoch": 1358} {"train_loss": -11.220161437988281, "global_step": 228296, "epoch": 1358} {"train_loss": -11.248627662658691, "global_step": 228297, "epoch": 1358} {"train_loss": -11.167911529541016, "global_step": 228298, "epoch": 1358} {"train_loss": -11.118510246276855, "global_step": 228299, "epoch": 1358} {"train_loss": -11.35244369506836, "global_step": 228300, "epoch": 1358} {"train_loss": -11.060827255249023, "global_step": 228301, "epoch": 1358} {"train_loss": -11.486394882202148, "global_step": 228302, "epoch": 1358} {"train_loss": -10.989320755004883, "global_step": 228303, "epoch": 1358} {"train_loss": -11.67724895477295, "global_step": 228304, "epoch": 1358} {"train_loss": -11.565250396728516, "global_step": 228305, "epoch": 1358} {"train_loss": -11.551299095153809, "global_step": 228306, "epoch": 1358} {"train_loss": -11.716085433959961, "global_step": 228307, "epoch": 1358} {"train_loss": -11.528453826904297, "global_step": 228308, "epoch": 1358} {"train_loss": -11.49218463897705, "global_step": 228309, "epoch": 1358} {"train_loss": -11.687658309936523, "global_step": 228310, "epoch": 1358} {"train_loss": -11.31757626647041, "global_step": 228311, "epoch": 1358, "val_loss": 262410.8125} {"train_loss": -11.541769027709961, "global_step": 228312, "epoch": 1359} {"train_loss": -11.852534294128418, "global_step": 228313, "epoch": 1359} {"train_loss": -11.671867370605469, "global_step": 228314, "epoch": 1359} {"train_loss": -11.652586936950684, "global_step": 228315, "epoch": 1359} {"train_loss": -11.623860359191895, "global_step": 228316, "epoch": 1359} {"train_loss": -11.680964469909668, "global_step": 228317, "epoch": 1359} {"train_loss": -11.895666122436523, "global_step": 228318, "epoch": 1359} {"train_loss": -11.77747917175293, "global_step": 228319, "epoch": 1359} {"train_loss": -11.534510612487793, "global_step": 228320, "epoch": 1359} {"train_loss": -11.64761734008789, "global_step": 228321, "epoch": 1359} {"train_loss": -11.537463188171387, "global_step": 228322, "epoch": 1359} {"train_loss": -11.765562057495117, "global_step": 228323, "epoch": 1359} {"train_loss": -11.3502197265625, "global_step": 228324, "epoch": 1359} {"train_loss": -11.699703216552734, "global_step": 228325, "epoch": 1359} {"train_loss": -11.726304054260254, "global_step": 228326, "epoch": 1359} {"train_loss": -11.772565841674805, "global_step": 228327, "epoch": 1359} {"train_loss": -11.872167587280273, "global_step": 228328, "epoch": 1359} {"train_loss": -11.825322151184082, "global_step": 228329, "epoch": 1359} {"train_loss": -11.969217300415039, "global_step": 228330, "epoch": 1359} {"train_loss": -11.91191291809082, "global_step": 228331, "epoch": 1359} {"train_loss": -11.761610984802246, "global_step": 228332, "epoch": 1359} {"train_loss": -11.867325782775879, "global_step": 228333, "epoch": 1359} {"train_loss": -11.667896270751953, "global_step": 228334, "epoch": 1359} {"train_loss": -11.869714736938477, "global_step": 228335, "epoch": 1359} {"train_loss": -11.942694664001465, "global_step": 228336, "epoch": 1359} {"train_loss": -12.091471672058105, "global_step": 228337, "epoch": 1359} {"train_loss": -11.86391544342041, "global_step": 228338, "epoch": 1359} {"train_loss": -11.981947898864746, "global_step": 228339, "epoch": 1359} {"train_loss": -11.84332275390625, "global_step": 228340, "epoch": 1359} {"train_loss": -11.976133346557617, "global_step": 228341, "epoch": 1359} {"train_loss": -11.763812065124512, "global_step": 228342, "epoch": 1359} {"train_loss": -12.038154602050781, "global_step": 228343, "epoch": 1359} {"train_loss": -12.01617431640625, "global_step": 228344, "epoch": 1359} {"train_loss": -12.11140251159668, "global_step": 228345, "epoch": 1359} {"train_loss": -12.00212287902832, "global_step": 228346, "epoch": 1359} {"train_loss": -12.002601623535156, "global_step": 228347, "epoch": 1359} {"train_loss": -12.091649055480957, "global_step": 228348, "epoch": 1359} {"train_loss": -11.955921173095703, "global_step": 228349, "epoch": 1359} {"train_loss": -12.12969970703125, "global_step": 228350, "epoch": 1359} {"train_loss": -12.267916679382324, "global_step": 228351, "epoch": 1359} {"train_loss": -11.979902267456055, "global_step": 228352, "epoch": 1359} {"train_loss": -11.999977111816406, "global_step": 228353, "epoch": 1359} {"train_loss": -12.083184242248535, "global_step": 228354, "epoch": 1359} {"train_loss": -11.832605361938477, "global_step": 228355, "epoch": 1359} {"train_loss": -12.02486515045166, "global_step": 228356, "epoch": 1359} {"train_loss": -11.922630310058594, "global_step": 228357, "epoch": 1359} {"train_loss": -11.9235200881958, "global_step": 228358, "epoch": 1359} {"train_loss": -11.74555778503418, "global_step": 228359, "epoch": 1359} {"train_loss": -12.157119750976562, "global_step": 228360, "epoch": 1359} {"train_loss": -11.367545127868652, "global_step": 228361, "epoch": 1359} {"train_loss": -11.96141529083252, "global_step": 228362, "epoch": 1359} {"train_loss": -12.061307907104492, "global_step": 228363, "epoch": 1359} {"train_loss": -11.916166305541992, "global_step": 228364, "epoch": 1359} {"train_loss": -11.251800537109375, "global_step": 228365, "epoch": 1359} {"train_loss": -11.78439712524414, "global_step": 228366, "epoch": 1359} {"train_loss": -12.033720970153809, "global_step": 228367, "epoch": 1359} {"train_loss": -11.83195972442627, "global_step": 228368, "epoch": 1359} {"train_loss": -11.963785171508789, "global_step": 228369, "epoch": 1359} {"train_loss": -12.087760925292969, "global_step": 228370, "epoch": 1359} {"train_loss": -12.138115882873535, "global_step": 228371, "epoch": 1359} {"train_loss": -11.981101036071777, "global_step": 228372, "epoch": 1359} {"train_loss": -12.103318214416504, "global_step": 228373, "epoch": 1359} {"train_loss": -11.952814102172852, "global_step": 228374, "epoch": 1359} {"train_loss": -11.759397506713867, "global_step": 228375, "epoch": 1359} {"train_loss": -11.806668281555176, "global_step": 228376, "epoch": 1359} {"train_loss": -11.91981315612793, "global_step": 228377, "epoch": 1359} {"train_loss": -11.728723526000977, "global_step": 228378, "epoch": 1359} {"train_loss": -10.775066375732422, "global_step": 228379, "epoch": 1359} {"train_loss": -11.273578643798828, "global_step": 228380, "epoch": 1359} {"train_loss": -11.309289932250977, "global_step": 228381, "epoch": 1359} {"train_loss": -11.266204833984375, "global_step": 228382, "epoch": 1359} {"train_loss": -10.472789764404297, "global_step": 228383, "epoch": 1359} {"train_loss": -11.233386039733887, "global_step": 228384, "epoch": 1359} {"train_loss": -11.509788513183594, "global_step": 228385, "epoch": 1359} {"train_loss": -8.378934860229492, "global_step": 228386, "epoch": 1359} {"train_loss": -8.925313949584961, "global_step": 228387, "epoch": 1359} {"train_loss": -10.844252586364746, "global_step": 228388, "epoch": 1359} {"train_loss": -9.20957088470459, "global_step": 228389, "epoch": 1359} {"train_loss": -8.514419555664062, "global_step": 228390, "epoch": 1359} {"train_loss": -9.30343246459961, "global_step": 228391, "epoch": 1359} {"train_loss": -8.530261039733887, "global_step": 228392, "epoch": 1359} {"train_loss": -8.900616645812988, "global_step": 228393, "epoch": 1359} {"train_loss": -7.65423583984375, "global_step": 228394, "epoch": 1359} {"train_loss": -8.126270294189453, "global_step": 228395, "epoch": 1359} {"train_loss": -8.724270820617676, "global_step": 228396, "epoch": 1359} {"train_loss": -9.584199905395508, "global_step": 228397, "epoch": 1359} {"train_loss": -9.552335739135742, "global_step": 228398, "epoch": 1359} {"train_loss": -9.295851707458496, "global_step": 228399, "epoch": 1359} {"train_loss": -9.358793258666992, "global_step": 228400, "epoch": 1359} {"train_loss": -10.37617301940918, "global_step": 228401, "epoch": 1359} {"train_loss": -9.471843719482422, "global_step": 228402, "epoch": 1359} {"train_loss": -10.321565628051758, "global_step": 228403, "epoch": 1359} {"train_loss": -10.606729507446289, "global_step": 228404, "epoch": 1359} {"train_loss": -10.812906265258789, "global_step": 228405, "epoch": 1359} {"train_loss": -11.097864151000977, "global_step": 228406, "epoch": 1359} {"train_loss": -10.887073516845703, "global_step": 228407, "epoch": 1359} {"train_loss": -10.843668937683105, "global_step": 228408, "epoch": 1359} {"train_loss": -10.870284080505371, "global_step": 228409, "epoch": 1359} {"train_loss": -10.592597961425781, "global_step": 228410, "epoch": 1359} {"train_loss": -11.163702964782715, "global_step": 228411, "epoch": 1359} {"train_loss": -11.093425750732422, "global_step": 228412, "epoch": 1359} {"train_loss": -11.093484878540039, "global_step": 228413, "epoch": 1359} {"train_loss": -11.283945083618164, "global_step": 228414, "epoch": 1359} {"train_loss": -11.306238174438477, "global_step": 228415, "epoch": 1359} {"train_loss": -11.224604606628418, "global_step": 228416, "epoch": 1359} {"train_loss": -11.411256790161133, "global_step": 228417, "epoch": 1359} {"train_loss": -11.045671463012695, "global_step": 228418, "epoch": 1359} {"train_loss": -11.611730575561523, "global_step": 228419, "epoch": 1359} {"train_loss": -11.42715072631836, "global_step": 228420, "epoch": 1359} {"train_loss": -11.139259338378906, "global_step": 228421, "epoch": 1359} {"train_loss": -11.217378616333008, "global_step": 228422, "epoch": 1359} {"train_loss": -11.272721290588379, "global_step": 228423, "epoch": 1359} {"train_loss": -11.561500549316406, "global_step": 228424, "epoch": 1359} {"train_loss": -11.46731185913086, "global_step": 228425, "epoch": 1359} {"train_loss": -11.500176429748535, "global_step": 228426, "epoch": 1359} {"train_loss": -11.5498046875, "global_step": 228427, "epoch": 1359} {"train_loss": -11.693483352661133, "global_step": 228428, "epoch": 1359} {"train_loss": -11.55668830871582, "global_step": 228429, "epoch": 1359} {"train_loss": -11.7457275390625, "global_step": 228430, "epoch": 1359} {"train_loss": -11.660155296325684, "global_step": 228431, "epoch": 1359} {"train_loss": -11.745429992675781, "global_step": 228432, "epoch": 1359} {"train_loss": -11.60865592956543, "global_step": 228433, "epoch": 1359} {"train_loss": -11.804983139038086, "global_step": 228434, "epoch": 1359} {"train_loss": -11.522119522094727, "global_step": 228435, "epoch": 1359} {"train_loss": -11.777036666870117, "global_step": 228436, "epoch": 1359} {"train_loss": -11.590418815612793, "global_step": 228437, "epoch": 1359} {"train_loss": -11.688483238220215, "global_step": 228438, "epoch": 1359} {"train_loss": -11.622945785522461, "global_step": 228439, "epoch": 1359} {"train_loss": -11.765582084655762, "global_step": 228440, "epoch": 1359} {"train_loss": -11.808913230895996, "global_step": 228441, "epoch": 1359} {"train_loss": -11.703744888305664, "global_step": 228442, "epoch": 1359} {"train_loss": -11.890033721923828, "global_step": 228443, "epoch": 1359} {"train_loss": -11.750534057617188, "global_step": 228444, "epoch": 1359} {"train_loss": -11.994613647460938, "global_step": 228445, "epoch": 1359} {"train_loss": -11.892332077026367, "global_step": 228446, "epoch": 1359} {"train_loss": -11.861611366271973, "global_step": 228447, "epoch": 1359} {"train_loss": -11.76602554321289, "global_step": 228448, "epoch": 1359} {"train_loss": -11.758773803710938, "global_step": 228449, "epoch": 1359} {"train_loss": -12.016641616821289, "global_step": 228450, "epoch": 1359} {"train_loss": -11.879390716552734, "global_step": 228451, "epoch": 1359} {"train_loss": -11.95705509185791, "global_step": 228452, "epoch": 1359} {"train_loss": -11.720232009887695, "global_step": 228453, "epoch": 1359} {"train_loss": -11.993099212646484, "global_step": 228454, "epoch": 1359} {"train_loss": -11.812905311584473, "global_step": 228455, "epoch": 1359} {"train_loss": -11.862359046936035, "global_step": 228456, "epoch": 1359} {"train_loss": -11.946927070617676, "global_step": 228457, "epoch": 1359} {"train_loss": -11.80908489227295, "global_step": 228458, "epoch": 1359} {"train_loss": -12.022724151611328, "global_step": 228459, "epoch": 1359} {"train_loss": -11.999885559082031, "global_step": 228460, "epoch": 1359} {"train_loss": -12.031503677368164, "global_step": 228461, "epoch": 1359} {"train_loss": -11.931652069091797, "global_step": 228462, "epoch": 1359} {"train_loss": -11.961843490600586, "global_step": 228463, "epoch": 1359} {"train_loss": -11.815384864807129, "global_step": 228464, "epoch": 1359} {"train_loss": -11.755126953125, "global_step": 228465, "epoch": 1359} {"train_loss": -11.816469192504883, "global_step": 228466, "epoch": 1359} {"train_loss": -11.833944320678711, "global_step": 228467, "epoch": 1359} {"train_loss": -11.742301940917969, "global_step": 228468, "epoch": 1359} {"train_loss": -11.89780044555664, "global_step": 228469, "epoch": 1359} {"train_loss": -11.771206855773926, "global_step": 228470, "epoch": 1359} {"train_loss": -11.232329368591309, "global_step": 228471, "epoch": 1359} {"train_loss": -11.845624923706055, "global_step": 228472, "epoch": 1359} {"train_loss": -11.840699195861816, "global_step": 228473, "epoch": 1359} {"train_loss": -11.191237449645996, "global_step": 228474, "epoch": 1359} {"train_loss": -10.754254341125488, "global_step": 228475, "epoch": 1359} {"train_loss": -11.50027084350586, "global_step": 228476, "epoch": 1359} {"train_loss": -10.213685989379883, "global_step": 228477, "epoch": 1359} {"train_loss": -11.867021560668945, "global_step": 228478, "epoch": 1359} {"train_loss": -11.400197466214498, "global_step": 228479, "epoch": 1359, "val_loss": 258468.703125} {"train_loss": -11.25139331817627, "global_step": 228480, "epoch": 1360} {"train_loss": -11.641739845275879, "global_step": 228481, "epoch": 1360} {"train_loss": -11.617484092712402, "global_step": 228482, "epoch": 1360} {"train_loss": -11.412191390991211, "global_step": 228483, "epoch": 1360} {"train_loss": -11.911493301391602, "global_step": 228484, "epoch": 1360} {"train_loss": -11.8533935546875, "global_step": 228485, "epoch": 1360} {"train_loss": -11.351999282836914, "global_step": 228486, "epoch": 1360} {"train_loss": -11.66257095336914, "global_step": 228487, "epoch": 1360} {"train_loss": -11.459853172302246, "global_step": 228488, "epoch": 1360} {"train_loss": -11.81576919555664, "global_step": 228489, "epoch": 1360} {"train_loss": -11.963722229003906, "global_step": 228490, "epoch": 1360} {"train_loss": -11.605960845947266, "global_step": 228491, "epoch": 1360} {"train_loss": -11.753999710083008, "global_step": 228492, "epoch": 1360} {"train_loss": -11.431087493896484, "global_step": 228493, "epoch": 1360} {"train_loss": -12.112005233764648, "global_step": 228494, "epoch": 1360} {"train_loss": -11.681208610534668, "global_step": 228495, "epoch": 1360} {"train_loss": -11.664386749267578, "global_step": 228496, "epoch": 1360} {"train_loss": -11.76031494140625, "global_step": 228497, "epoch": 1360} {"train_loss": -11.793445587158203, "global_step": 228498, "epoch": 1360} {"train_loss": -11.116706848144531, "global_step": 228499, "epoch": 1360} {"train_loss": -11.384909629821777, "global_step": 228500, "epoch": 1360} {"train_loss": -11.567169189453125, "global_step": 228501, "epoch": 1360} {"train_loss": -10.934326171875, "global_step": 228502, "epoch": 1360} {"train_loss": -10.729752540588379, "global_step": 228503, "epoch": 1360} {"train_loss": -11.44221019744873, "global_step": 228504, "epoch": 1360} {"train_loss": -11.464434623718262, "global_step": 228505, "epoch": 1360} {"train_loss": -10.608175277709961, "global_step": 228506, "epoch": 1360} {"train_loss": -11.5526123046875, "global_step": 228507, "epoch": 1360} {"train_loss": -10.664972305297852, "global_step": 228508, "epoch": 1360} {"train_loss": -10.21171760559082, "global_step": 228509, "epoch": 1360} {"train_loss": -11.134502410888672, "global_step": 228510, "epoch": 1360} {"train_loss": -9.104070663452148, "global_step": 228511, "epoch": 1360} {"train_loss": -11.419114112854004, "global_step": 228512, "epoch": 1360} {"train_loss": -9.11679458618164, "global_step": 228513, "epoch": 1360} {"train_loss": -10.53042984008789, "global_step": 228514, "epoch": 1360} {"train_loss": -10.955890655517578, "global_step": 228515, "epoch": 1360} {"train_loss": -10.755518913269043, "global_step": 228516, "epoch": 1360} {"train_loss": -10.398321151733398, "global_step": 228517, "epoch": 1360} {"train_loss": -10.332247734069824, "global_step": 228518, "epoch": 1360} {"train_loss": -10.317638397216797, "global_step": 228519, "epoch": 1360} {"train_loss": -11.4116792678833, "global_step": 228520, "epoch": 1360} {"train_loss": -10.8798828125, "global_step": 228521, "epoch": 1360} {"train_loss": -11.176820755004883, "global_step": 228522, "epoch": 1360} {"train_loss": -11.319007873535156, "global_step": 228523, "epoch": 1360} {"train_loss": -10.803886413574219, "global_step": 228524, "epoch": 1360} {"train_loss": -11.150712966918945, "global_step": 228525, "epoch": 1360} {"train_loss": -10.302011489868164, "global_step": 228526, "epoch": 1360} {"train_loss": -11.44228744506836, "global_step": 228527, "epoch": 1360} {"train_loss": -11.495904922485352, "global_step": 228528, "epoch": 1360} {"train_loss": -10.952411651611328, "global_step": 228529, "epoch": 1360} {"train_loss": -11.30143928527832, "global_step": 228530, "epoch": 1360} {"train_loss": -11.396343231201172, "global_step": 228531, "epoch": 1360} {"train_loss": -11.623025894165039, "global_step": 228532, "epoch": 1360} {"train_loss": -11.044108390808105, "global_step": 228533, "epoch": 1360} {"train_loss": -11.573614120483398, "global_step": 228534, "epoch": 1360} {"train_loss": -11.09563159942627, "global_step": 228535, "epoch": 1360} {"train_loss": -11.542527198791504, "global_step": 228536, "epoch": 1360} {"train_loss": -11.506592750549316, "global_step": 228537, "epoch": 1360} {"train_loss": -11.359997749328613, "global_step": 228538, "epoch": 1360} {"train_loss": -11.20838737487793, "global_step": 228539, "epoch": 1360} {"train_loss": -11.51023006439209, "global_step": 228540, "epoch": 1360} {"train_loss": -11.67158317565918, "global_step": 228541, "epoch": 1360} {"train_loss": -11.390506744384766, "global_step": 228542, "epoch": 1360} {"train_loss": -11.462811470031738, "global_step": 228543, "epoch": 1360} {"train_loss": -11.659950256347656, "global_step": 228544, "epoch": 1360} {"train_loss": -11.439203262329102, "global_step": 228545, "epoch": 1360} {"train_loss": -11.678675651550293, "global_step": 228546, "epoch": 1360} {"train_loss": -11.250429153442383, "global_step": 228547, "epoch": 1360} {"train_loss": -11.432943344116211, "global_step": 228548, "epoch": 1360} {"train_loss": -11.392128944396973, "global_step": 228549, "epoch": 1360} {"train_loss": -11.571768760681152, "global_step": 228550, "epoch": 1360} {"train_loss": -11.771954536437988, "global_step": 228551, "epoch": 1360} {"train_loss": -11.30746078491211, "global_step": 228552, "epoch": 1360} {"train_loss": -11.679996490478516, "global_step": 228553, "epoch": 1360} {"train_loss": -11.51884937286377, "global_step": 228554, "epoch": 1360} {"train_loss": -11.433477401733398, "global_step": 228555, "epoch": 1360} {"train_loss": -11.824928283691406, "global_step": 228556, "epoch": 1360} {"train_loss": -11.337991714477539, "global_step": 228557, "epoch": 1360} {"train_loss": -11.794761657714844, "global_step": 228558, "epoch": 1360} {"train_loss": -11.8258056640625, "global_step": 228559, "epoch": 1360} {"train_loss": -11.660989761352539, "global_step": 228560, "epoch": 1360} {"train_loss": -11.570816993713379, "global_step": 228561, "epoch": 1360} {"train_loss": -11.73967170715332, "global_step": 228562, "epoch": 1360} {"train_loss": -11.47693920135498, "global_step": 228563, "epoch": 1360} {"train_loss": -11.847249984741211, "global_step": 228564, "epoch": 1360} {"train_loss": -12.001737594604492, "global_step": 228565, "epoch": 1360} {"train_loss": -11.974312782287598, "global_step": 228566, "epoch": 1360} {"train_loss": -11.893647193908691, "global_step": 228567, "epoch": 1360} {"train_loss": -11.957695007324219, "global_step": 228568, "epoch": 1360} {"train_loss": -12.10506534576416, "global_step": 228569, "epoch": 1360} {"train_loss": -12.034818649291992, "global_step": 228570, "epoch": 1360} {"train_loss": -11.736776351928711, "global_step": 228571, "epoch": 1360} {"train_loss": -11.873695373535156, "global_step": 228572, "epoch": 1360} {"train_loss": -11.866915702819824, "global_step": 228573, "epoch": 1360} {"train_loss": -12.16226577758789, "global_step": 228574, "epoch": 1360} {"train_loss": -12.03508186340332, "global_step": 228575, "epoch": 1360} {"train_loss": -11.80890941619873, "global_step": 228576, "epoch": 1360} {"train_loss": -11.95122241973877, "global_step": 228577, "epoch": 1360} {"train_loss": -12.1622314453125, "global_step": 228578, "epoch": 1360} {"train_loss": -12.095366477966309, "global_step": 228579, "epoch": 1360} {"train_loss": -11.709908485412598, "global_step": 228580, "epoch": 1360} {"train_loss": -11.83418083190918, "global_step": 228581, "epoch": 1360} {"train_loss": -12.006607055664062, "global_step": 228582, "epoch": 1360} {"train_loss": -11.494025230407715, "global_step": 228583, "epoch": 1360} {"train_loss": -12.05615520477295, "global_step": 228584, "epoch": 1360} {"train_loss": -11.825628280639648, "global_step": 228585, "epoch": 1360} {"train_loss": -11.324397087097168, "global_step": 228586, "epoch": 1360} {"train_loss": -11.569960594177246, "global_step": 228587, "epoch": 1360} {"train_loss": -11.918956756591797, "global_step": 228588, "epoch": 1360} {"train_loss": -11.5236234664917, "global_step": 228589, "epoch": 1360} {"train_loss": -11.964332580566406, "global_step": 228590, "epoch": 1360} {"train_loss": -11.80194091796875, "global_step": 228591, "epoch": 1360} {"train_loss": -11.359172821044922, "global_step": 228592, "epoch": 1360} {"train_loss": -11.58901596069336, "global_step": 228593, "epoch": 1360} {"train_loss": -11.93522834777832, "global_step": 228594, "epoch": 1360} {"train_loss": -11.317774772644043, "global_step": 228595, "epoch": 1360} {"train_loss": -10.34264087677002, "global_step": 228596, "epoch": 1360} {"train_loss": -10.512956619262695, "global_step": 228597, "epoch": 1360} {"train_loss": -11.302507400512695, "global_step": 228598, "epoch": 1360} {"train_loss": -10.656383514404297, "global_step": 228599, "epoch": 1360} {"train_loss": -10.511768341064453, "global_step": 228600, "epoch": 1360} {"train_loss": -11.801773071289062, "global_step": 228601, "epoch": 1360} {"train_loss": -10.913825988769531, "global_step": 228602, "epoch": 1360} {"train_loss": -11.22327709197998, "global_step": 228603, "epoch": 1360} {"train_loss": -11.409383773803711, "global_step": 228604, "epoch": 1360} {"train_loss": -10.8187894821167, "global_step": 228605, "epoch": 1360} {"train_loss": -11.391473770141602, "global_step": 228606, "epoch": 1360} {"train_loss": -10.796974182128906, "global_step": 228607, "epoch": 1360} {"train_loss": -10.86749267578125, "global_step": 228608, "epoch": 1360} {"train_loss": -10.133552551269531, "global_step": 228609, "epoch": 1360} {"train_loss": -9.995831489562988, "global_step": 228610, "epoch": 1360} {"train_loss": -11.045835494995117, "global_step": 228611, "epoch": 1360} {"train_loss": -9.923758506774902, "global_step": 228612, "epoch": 1360} {"train_loss": -9.329780578613281, "global_step": 228613, "epoch": 1360} {"train_loss": -9.982693672180176, "global_step": 228614, "epoch": 1360} {"train_loss": -10.575590133666992, "global_step": 228615, "epoch": 1360} {"train_loss": -9.740633010864258, "global_step": 228616, "epoch": 1360} {"train_loss": -10.395378112792969, "global_step": 228617, "epoch": 1360} {"train_loss": -10.254831314086914, "global_step": 228618, "epoch": 1360} {"train_loss": -10.909950256347656, "global_step": 228619, "epoch": 1360} {"train_loss": -10.310080528259277, "global_step": 228620, "epoch": 1360} {"train_loss": -10.551766395568848, "global_step": 228621, "epoch": 1360} {"train_loss": -10.964933395385742, "global_step": 228622, "epoch": 1360} {"train_loss": -10.792579650878906, "global_step": 228623, "epoch": 1360} {"train_loss": -10.464961051940918, "global_step": 228624, "epoch": 1360} {"train_loss": -11.127725601196289, "global_step": 228625, "epoch": 1360} {"train_loss": -10.65500259399414, "global_step": 228626, "epoch": 1360} {"train_loss": -11.281610488891602, "global_step": 228627, "epoch": 1360} {"train_loss": -10.845993995666504, "global_step": 228628, "epoch": 1360} {"train_loss": -10.628816604614258, "global_step": 228629, "epoch": 1360} {"train_loss": -11.083242416381836, "global_step": 228630, "epoch": 1360} {"train_loss": -10.907267570495605, "global_step": 228631, "epoch": 1360} {"train_loss": -11.152793884277344, "global_step": 228632, "epoch": 1360} {"train_loss": -10.935046195983887, "global_step": 228633, "epoch": 1360} {"train_loss": -11.298702239990234, "global_step": 228634, "epoch": 1360} {"train_loss": -11.330310821533203, "global_step": 228635, "epoch": 1360} {"train_loss": -11.36812686920166, "global_step": 228636, "epoch": 1360} {"train_loss": -11.272480964660645, "global_step": 228637, "epoch": 1360} {"train_loss": -11.060049057006836, "global_step": 228638, "epoch": 1360} {"train_loss": -11.27604866027832, "global_step": 228639, "epoch": 1360} {"train_loss": -11.357645988464355, "global_step": 228640, "epoch": 1360} {"train_loss": -11.362343788146973, "global_step": 228641, "epoch": 1360} {"train_loss": -11.598503112792969, "global_step": 228642, "epoch": 1360} {"train_loss": -11.26655387878418, "global_step": 228643, "epoch": 1360} {"train_loss": -11.381793975830078, "global_step": 228644, "epoch": 1360} {"train_loss": -11.217470169067383, "global_step": 228645, "epoch": 1360} {"train_loss": -11.517443656921387, "global_step": 228646, "epoch": 1360} {"train_loss": -11.270326171602521, "global_step": 228647, "epoch": 1360, "val_loss": 257735.828125, "train_action_mse_error": 1.6265233755111694} {"train_loss": -11.596085548400879, "global_step": 228648, "epoch": 1361} {"train_loss": -11.411206245422363, "global_step": 228649, "epoch": 1361} {"train_loss": -11.600007057189941, "global_step": 228650, "epoch": 1361} {"train_loss": -11.601394653320312, "global_step": 228651, "epoch": 1361} {"train_loss": -11.5606689453125, "global_step": 228652, "epoch": 1361} {"train_loss": -11.717185974121094, "global_step": 228653, "epoch": 1361} {"train_loss": -11.516387939453125, "global_step": 228654, "epoch": 1361} {"train_loss": -11.688169479370117, "global_step": 228655, "epoch": 1361} {"train_loss": -11.590970993041992, "global_step": 228656, "epoch": 1361} {"train_loss": -11.609264373779297, "global_step": 228657, "epoch": 1361} {"train_loss": -11.797527313232422, "global_step": 228658, "epoch": 1361} {"train_loss": -11.821791648864746, "global_step": 228659, "epoch": 1361} {"train_loss": -11.874037742614746, "global_step": 228660, "epoch": 1361} {"train_loss": -11.642385482788086, "global_step": 228661, "epoch": 1361} {"train_loss": -11.519342422485352, "global_step": 228662, "epoch": 1361} {"train_loss": -12.02237319946289, "global_step": 228663, "epoch": 1361} {"train_loss": -11.875085830688477, "global_step": 228664, "epoch": 1361} {"train_loss": -11.708894729614258, "global_step": 228665, "epoch": 1361} {"train_loss": -11.595874786376953, "global_step": 228666, "epoch": 1361} {"train_loss": -11.960189819335938, "global_step": 228667, "epoch": 1361} {"train_loss": -11.835139274597168, "global_step": 228668, "epoch": 1361} {"train_loss": -11.918127059936523, "global_step": 228669, "epoch": 1361} {"train_loss": -11.969084739685059, "global_step": 228670, "epoch": 1361} {"train_loss": -12.083799362182617, "global_step": 228671, "epoch": 1361} {"train_loss": -11.896167755126953, "global_step": 228672, "epoch": 1361} {"train_loss": -11.862956047058105, "global_step": 228673, "epoch": 1361} {"train_loss": -11.849897384643555, "global_step": 228674, "epoch": 1361} {"train_loss": -11.849170684814453, "global_step": 228675, "epoch": 1361} {"train_loss": -12.009540557861328, "global_step": 228676, "epoch": 1361} {"train_loss": -11.820893287658691, "global_step": 228677, "epoch": 1361} {"train_loss": -11.892355918884277, "global_step": 228678, "epoch": 1361} {"train_loss": -11.99376392364502, "global_step": 228679, "epoch": 1361} {"train_loss": -12.069818496704102, "global_step": 228680, "epoch": 1361} {"train_loss": -11.824423789978027, "global_step": 228681, "epoch": 1361} {"train_loss": -12.115312576293945, "global_step": 228682, "epoch": 1361} {"train_loss": -11.757482528686523, "global_step": 228683, "epoch": 1361} {"train_loss": -11.90796184539795, "global_step": 228684, "epoch": 1361} {"train_loss": -11.966633796691895, "global_step": 228685, "epoch": 1361} {"train_loss": -12.259515762329102, "global_step": 228686, "epoch": 1361} {"train_loss": -11.885942459106445, "global_step": 228687, "epoch": 1361} {"train_loss": -12.066205978393555, "global_step": 228688, "epoch": 1361} {"train_loss": -11.929869651794434, "global_step": 228689, "epoch": 1361} {"train_loss": -12.009794235229492, "global_step": 228690, "epoch": 1361} {"train_loss": -12.117875099182129, "global_step": 228691, "epoch": 1361} {"train_loss": -12.238832473754883, "global_step": 228692, "epoch": 1361} {"train_loss": -12.079174041748047, "global_step": 228693, "epoch": 1361} {"train_loss": -12.017870903015137, "global_step": 228694, "epoch": 1361} {"train_loss": -12.129700660705566, "global_step": 228695, "epoch": 1361} {"train_loss": -12.052112579345703, "global_step": 228696, "epoch": 1361} {"train_loss": -12.0271635055542, "global_step": 228697, "epoch": 1361} {"train_loss": -12.099088668823242, "global_step": 228698, "epoch": 1361} {"train_loss": -11.731181144714355, "global_step": 228699, "epoch": 1361} {"train_loss": -12.02203369140625, "global_step": 228700, "epoch": 1361} {"train_loss": -12.004802703857422, "global_step": 228701, "epoch": 1361} {"train_loss": -11.794490814208984, "global_step": 228702, "epoch": 1361} {"train_loss": -11.724093437194824, "global_step": 228703, "epoch": 1361} {"train_loss": -12.174742698669434, "global_step": 228704, "epoch": 1361} {"train_loss": -12.082088470458984, "global_step": 228705, "epoch": 1361} {"train_loss": -11.621749877929688, "global_step": 228706, "epoch": 1361} {"train_loss": -10.974120140075684, "global_step": 228707, "epoch": 1361} {"train_loss": -10.259851455688477, "global_step": 228708, "epoch": 1361} {"train_loss": -11.537208557128906, "global_step": 228709, "epoch": 1361} {"train_loss": -11.587390899658203, "global_step": 228710, "epoch": 1361} {"train_loss": -11.275323867797852, "global_step": 228711, "epoch": 1361} {"train_loss": -11.336240768432617, "global_step": 228712, "epoch": 1361} {"train_loss": -11.917646408081055, "global_step": 228713, "epoch": 1361} {"train_loss": -11.892179489135742, "global_step": 228714, "epoch": 1361} {"train_loss": -11.902046203613281, "global_step": 228715, "epoch": 1361} {"train_loss": -11.665742874145508, "global_step": 228716, "epoch": 1361} {"train_loss": -11.761333465576172, "global_step": 228717, "epoch": 1361} {"train_loss": -11.638599395751953, "global_step": 228718, "epoch": 1361} {"train_loss": -11.902589797973633, "global_step": 228719, "epoch": 1361} {"train_loss": -11.978554725646973, "global_step": 228720, "epoch": 1361} {"train_loss": -11.54710578918457, "global_step": 228721, "epoch": 1361} {"train_loss": -11.376012802124023, "global_step": 228722, "epoch": 1361} {"train_loss": -12.03281307220459, "global_step": 228723, "epoch": 1361} {"train_loss": -11.686732292175293, "global_step": 228724, "epoch": 1361} {"train_loss": -11.229551315307617, "global_step": 228725, "epoch": 1361} {"train_loss": -11.819286346435547, "global_step": 228726, "epoch": 1361} {"train_loss": -12.028894424438477, "global_step": 228727, "epoch": 1361} {"train_loss": -11.542557716369629, "global_step": 228728, "epoch": 1361} {"train_loss": -11.243570327758789, "global_step": 228729, "epoch": 1361} {"train_loss": -11.891109466552734, "global_step": 228730, "epoch": 1361} {"train_loss": -11.392723083496094, "global_step": 228731, "epoch": 1361} {"train_loss": -11.203645706176758, "global_step": 228732, "epoch": 1361} {"train_loss": -11.78067398071289, "global_step": 228733, "epoch": 1361} {"train_loss": -11.507099151611328, "global_step": 228734, "epoch": 1361} {"train_loss": -11.804338455200195, "global_step": 228735, "epoch": 1361} {"train_loss": -11.903104782104492, "global_step": 228736, "epoch": 1361} {"train_loss": -11.751922607421875, "global_step": 228737, "epoch": 1361} {"train_loss": -11.43653678894043, "global_step": 228738, "epoch": 1361} {"train_loss": -11.3248929977417, "global_step": 228739, "epoch": 1361} {"train_loss": -11.281087875366211, "global_step": 228740, "epoch": 1361} {"train_loss": -11.462244033813477, "global_step": 228741, "epoch": 1361} {"train_loss": -10.985466003417969, "global_step": 228742, "epoch": 1361} {"train_loss": -11.024197578430176, "global_step": 228743, "epoch": 1361} {"train_loss": -11.887035369873047, "global_step": 228744, "epoch": 1361} {"train_loss": -11.616830825805664, "global_step": 228745, "epoch": 1361} {"train_loss": -11.048017501831055, "global_step": 228746, "epoch": 1361} {"train_loss": -11.540727615356445, "global_step": 228747, "epoch": 1361} {"train_loss": -10.948549270629883, "global_step": 228748, "epoch": 1361} {"train_loss": -10.377835273742676, "global_step": 228749, "epoch": 1361} {"train_loss": -11.039962768554688, "global_step": 228750, "epoch": 1361} {"train_loss": -11.826507568359375, "global_step": 228751, "epoch": 1361} {"train_loss": -10.486515045166016, "global_step": 228752, "epoch": 1361} {"train_loss": -11.289247512817383, "global_step": 228753, "epoch": 1361} {"train_loss": -11.690715789794922, "global_step": 228754, "epoch": 1361} {"train_loss": -11.542509078979492, "global_step": 228755, "epoch": 1361} {"train_loss": -11.678610801696777, "global_step": 228756, "epoch": 1361} {"train_loss": -11.470361709594727, "global_step": 228757, "epoch": 1361} {"train_loss": -11.515644073486328, "global_step": 228758, "epoch": 1361} {"train_loss": -11.436040878295898, "global_step": 228759, "epoch": 1361} {"train_loss": -11.441823959350586, "global_step": 228760, "epoch": 1361} {"train_loss": -11.708932876586914, "global_step": 228761, "epoch": 1361} {"train_loss": -11.646614074707031, "global_step": 228762, "epoch": 1361} {"train_loss": -11.46558952331543, "global_step": 228763, "epoch": 1361} {"train_loss": -11.299520492553711, "global_step": 228764, "epoch": 1361} {"train_loss": -12.012434959411621, "global_step": 228765, "epoch": 1361} {"train_loss": -11.44387435913086, "global_step": 228766, "epoch": 1361} {"train_loss": -11.840226173400879, "global_step": 228767, "epoch": 1361} {"train_loss": -11.550948143005371, "global_step": 228768, "epoch": 1361} {"train_loss": -11.222018241882324, "global_step": 228769, "epoch": 1361} {"train_loss": -10.610689163208008, "global_step": 228770, "epoch": 1361} {"train_loss": -9.020698547363281, "global_step": 228771, "epoch": 1361} {"train_loss": -9.84504222869873, "global_step": 228772, "epoch": 1361} {"train_loss": -11.033451080322266, "global_step": 228773, "epoch": 1361} {"train_loss": -9.221832275390625, "global_step": 228774, "epoch": 1361} {"train_loss": -11.454358100891113, "global_step": 228775, "epoch": 1361} {"train_loss": -9.461421966552734, "global_step": 228776, "epoch": 1361} {"train_loss": -11.180330276489258, "global_step": 228777, "epoch": 1361} {"train_loss": -10.604165077209473, "global_step": 228778, "epoch": 1361} {"train_loss": -10.344781875610352, "global_step": 228779, "epoch": 1361} {"train_loss": -11.347234725952148, "global_step": 228780, "epoch": 1361} {"train_loss": -10.270648956298828, "global_step": 228781, "epoch": 1361} {"train_loss": -11.277069091796875, "global_step": 228782, "epoch": 1361} {"train_loss": -10.952282905578613, "global_step": 228783, "epoch": 1361} {"train_loss": -11.192846298217773, "global_step": 228784, "epoch": 1361} {"train_loss": -11.528244018554688, "global_step": 228785, "epoch": 1361} {"train_loss": -11.125659942626953, "global_step": 228786, "epoch": 1361} {"train_loss": -11.216083526611328, "global_step": 228787, "epoch": 1361} {"train_loss": -10.50477409362793, "global_step": 228788, "epoch": 1361} {"train_loss": -11.368362426757812, "global_step": 228789, "epoch": 1361} {"train_loss": -10.44627571105957, "global_step": 228790, "epoch": 1361} {"train_loss": -10.941803932189941, "global_step": 228791, "epoch": 1361} {"train_loss": -10.945884704589844, "global_step": 228792, "epoch": 1361} {"train_loss": -10.770617485046387, "global_step": 228793, "epoch": 1361} {"train_loss": -11.107318878173828, "global_step": 228794, "epoch": 1361} {"train_loss": -10.71334457397461, "global_step": 228795, "epoch": 1361} {"train_loss": -11.044517517089844, "global_step": 228796, "epoch": 1361} {"train_loss": -11.336450576782227, "global_step": 228797, "epoch": 1361} {"train_loss": -10.719125747680664, "global_step": 228798, "epoch": 1361} {"train_loss": -11.545381546020508, "global_step": 228799, "epoch": 1361} {"train_loss": -11.150208473205566, "global_step": 228800, "epoch": 1361} {"train_loss": -11.401707649230957, "global_step": 228801, "epoch": 1361} {"train_loss": -11.52676773071289, "global_step": 228802, "epoch": 1361} {"train_loss": -11.30297565460205, "global_step": 228803, "epoch": 1361} {"train_loss": -11.440479278564453, "global_step": 228804, "epoch": 1361} {"train_loss": -11.487895011901855, "global_step": 228805, "epoch": 1361} {"train_loss": -11.380311965942383, "global_step": 228806, "epoch": 1361} {"train_loss": -11.367698669433594, "global_step": 228807, "epoch": 1361} {"train_loss": -11.636038780212402, "global_step": 228808, "epoch": 1361} {"train_loss": -11.320544242858887, "global_step": 228809, "epoch": 1361} {"train_loss": -11.453694343566895, "global_step": 228810, "epoch": 1361} {"train_loss": -11.631760597229004, "global_step": 228811, "epoch": 1361} {"train_loss": -11.531549453735352, "global_step": 228812, "epoch": 1361} {"train_loss": -11.62443733215332, "global_step": 228813, "epoch": 1361} {"train_loss": -11.526676177978516, "global_step": 228814, "epoch": 1361} {"train_loss": -11.493029651187715, "global_step": 228815, "epoch": 1361, "val_loss": 260634.9375} {"train_loss": -11.420166969299316, "global_step": 228816, "epoch": 1362} {"train_loss": -11.406253814697266, "global_step": 228817, "epoch": 1362} {"train_loss": -11.553762435913086, "global_step": 228818, "epoch": 1362} {"train_loss": -11.747995376586914, "global_step": 228819, "epoch": 1362} {"train_loss": -11.613639831542969, "global_step": 228820, "epoch": 1362} {"train_loss": -11.704503059387207, "global_step": 228821, "epoch": 1362} {"train_loss": -11.491682052612305, "global_step": 228822, "epoch": 1362} {"train_loss": -11.71180248260498, "global_step": 228823, "epoch": 1362} {"train_loss": -11.794679641723633, "global_step": 228824, "epoch": 1362} {"train_loss": -11.624279022216797, "global_step": 228825, "epoch": 1362} {"train_loss": -11.729520797729492, "global_step": 228826, "epoch": 1362} {"train_loss": -11.509729385375977, "global_step": 228827, "epoch": 1362} {"train_loss": -11.605457305908203, "global_step": 228828, "epoch": 1362} {"train_loss": -11.809557914733887, "global_step": 228829, "epoch": 1362} {"train_loss": -11.571924209594727, "global_step": 228830, "epoch": 1362} {"train_loss": -11.671920776367188, "global_step": 228831, "epoch": 1362} {"train_loss": -11.476259231567383, "global_step": 228832, "epoch": 1362} {"train_loss": -11.649243354797363, "global_step": 228833, "epoch": 1362} {"train_loss": -11.758942604064941, "global_step": 228834, "epoch": 1362} {"train_loss": -11.754093170166016, "global_step": 228835, "epoch": 1362} {"train_loss": -11.647499084472656, "global_step": 228836, "epoch": 1362} {"train_loss": -11.502710342407227, "global_step": 228837, "epoch": 1362} {"train_loss": -11.589822769165039, "global_step": 228838, "epoch": 1362} {"train_loss": -11.705390930175781, "global_step": 228839, "epoch": 1362} {"train_loss": -11.75312614440918, "global_step": 228840, "epoch": 1362} {"train_loss": -11.606021881103516, "global_step": 228841, "epoch": 1362} {"train_loss": -11.411308288574219, "global_step": 228842, "epoch": 1362} {"train_loss": -11.621150970458984, "global_step": 228843, "epoch": 1362} {"train_loss": -11.505702018737793, "global_step": 228844, "epoch": 1362} {"train_loss": -12.049650192260742, "global_step": 228845, "epoch": 1362} {"train_loss": -11.56894302368164, "global_step": 228846, "epoch": 1362} {"train_loss": -11.778508186340332, "global_step": 228847, "epoch": 1362} {"train_loss": -11.459728240966797, "global_step": 228848, "epoch": 1362} {"train_loss": -11.663175582885742, "global_step": 228849, "epoch": 1362} {"train_loss": -11.722637176513672, "global_step": 228850, "epoch": 1362} {"train_loss": -11.697277069091797, "global_step": 228851, "epoch": 1362} {"train_loss": -11.926241874694824, "global_step": 228852, "epoch": 1362} {"train_loss": -11.91612720489502, "global_step": 228853, "epoch": 1362} {"train_loss": -11.913529396057129, "global_step": 228854, "epoch": 1362} {"train_loss": -11.880983352661133, "global_step": 228855, "epoch": 1362} {"train_loss": -11.831350326538086, "global_step": 228856, "epoch": 1362} {"train_loss": -11.875740051269531, "global_step": 228857, "epoch": 1362} {"train_loss": -11.698369026184082, "global_step": 228858, "epoch": 1362} {"train_loss": -11.886014938354492, "global_step": 228859, "epoch": 1362} {"train_loss": -11.982173919677734, "global_step": 228860, "epoch": 1362} {"train_loss": -11.87254810333252, "global_step": 228861, "epoch": 1362} {"train_loss": -11.839397430419922, "global_step": 228862, "epoch": 1362} {"train_loss": -12.024542808532715, "global_step": 228863, "epoch": 1362} {"train_loss": -11.199563980102539, "global_step": 228864, "epoch": 1362} {"train_loss": -11.606943130493164, "global_step": 228865, "epoch": 1362} {"train_loss": -11.76891803741455, "global_step": 228866, "epoch": 1362} {"train_loss": -11.784139633178711, "global_step": 228867, "epoch": 1362} {"train_loss": -11.815664291381836, "global_step": 228868, "epoch": 1362} {"train_loss": -12.041017532348633, "global_step": 228869, "epoch": 1362} {"train_loss": -11.723724365234375, "global_step": 228870, "epoch": 1362} {"train_loss": -11.685874938964844, "global_step": 228871, "epoch": 1362} {"train_loss": -11.446343421936035, "global_step": 228872, "epoch": 1362} {"train_loss": -11.508423805236816, "global_step": 228873, "epoch": 1362} {"train_loss": -10.681023597717285, "global_step": 228874, "epoch": 1362} {"train_loss": -11.010613441467285, "global_step": 228875, "epoch": 1362} {"train_loss": -11.632770538330078, "global_step": 228876, "epoch": 1362} {"train_loss": -11.84928035736084, "global_step": 228877, "epoch": 1362} {"train_loss": -11.688916206359863, "global_step": 228878, "epoch": 1362} {"train_loss": -11.057740211486816, "global_step": 228879, "epoch": 1362} {"train_loss": -11.84129524230957, "global_step": 228880, "epoch": 1362} {"train_loss": -11.174127578735352, "global_step": 228881, "epoch": 1362} {"train_loss": -11.42812728881836, "global_step": 228882, "epoch": 1362} {"train_loss": -11.398752212524414, "global_step": 228883, "epoch": 1362} {"train_loss": -10.644415855407715, "global_step": 228884, "epoch": 1362} {"train_loss": -11.659387588500977, "global_step": 228885, "epoch": 1362} {"train_loss": -10.8890380859375, "global_step": 228886, "epoch": 1362} {"train_loss": -11.290886878967285, "global_step": 228887, "epoch": 1362} {"train_loss": -11.159618377685547, "global_step": 228888, "epoch": 1362} {"train_loss": -11.681426048278809, "global_step": 228889, "epoch": 1362} {"train_loss": -10.956626892089844, "global_step": 228890, "epoch": 1362} {"train_loss": -11.566558837890625, "global_step": 228891, "epoch": 1362} {"train_loss": -10.469049453735352, "global_step": 228892, "epoch": 1362} {"train_loss": -11.2306547164917, "global_step": 228893, "epoch": 1362} {"train_loss": -11.252588272094727, "global_step": 228894, "epoch": 1362} {"train_loss": -11.540042877197266, "global_step": 228895, "epoch": 1362} {"train_loss": -11.756752014160156, "global_step": 228896, "epoch": 1362} {"train_loss": -11.556726455688477, "global_step": 228897, "epoch": 1362} {"train_loss": -11.886924743652344, "global_step": 228898, "epoch": 1362} {"train_loss": -11.54635238647461, "global_step": 228899, "epoch": 1362} {"train_loss": -11.745317459106445, "global_step": 228900, "epoch": 1362} {"train_loss": -11.762391090393066, "global_step": 228901, "epoch": 1362} {"train_loss": -11.547826766967773, "global_step": 228902, "epoch": 1362} {"train_loss": -11.367471694946289, "global_step": 228903, "epoch": 1362} {"train_loss": -11.687265396118164, "global_step": 228904, "epoch": 1362} {"train_loss": -11.424491882324219, "global_step": 228905, "epoch": 1362} {"train_loss": -11.397150993347168, "global_step": 228906, "epoch": 1362} {"train_loss": -11.549154281616211, "global_step": 228907, "epoch": 1362} {"train_loss": -11.238104820251465, "global_step": 228908, "epoch": 1362} {"train_loss": -11.333024024963379, "global_step": 228909, "epoch": 1362} {"train_loss": -11.388279914855957, "global_step": 228910, "epoch": 1362} {"train_loss": -11.296524047851562, "global_step": 228911, "epoch": 1362} {"train_loss": -11.437273025512695, "global_step": 228912, "epoch": 1362} {"train_loss": -11.587045669555664, "global_step": 228913, "epoch": 1362} {"train_loss": -10.387335777282715, "global_step": 228914, "epoch": 1362} {"train_loss": -11.42143440246582, "global_step": 228915, "epoch": 1362} {"train_loss": -11.081668853759766, "global_step": 228916, "epoch": 1362} {"train_loss": -11.169466018676758, "global_step": 228917, "epoch": 1362} {"train_loss": -11.682295799255371, "global_step": 228918, "epoch": 1362} {"train_loss": -10.772317886352539, "global_step": 228919, "epoch": 1362} {"train_loss": -11.66035270690918, "global_step": 228920, "epoch": 1362} {"train_loss": -11.141461372375488, "global_step": 228921, "epoch": 1362} {"train_loss": -11.576772689819336, "global_step": 228922, "epoch": 1362} {"train_loss": -10.934391021728516, "global_step": 228923, "epoch": 1362} {"train_loss": -10.643922805786133, "global_step": 228924, "epoch": 1362} {"train_loss": -11.390755653381348, "global_step": 228925, "epoch": 1362} {"train_loss": -10.972296714782715, "global_step": 228926, "epoch": 1362} {"train_loss": -11.423949241638184, "global_step": 228927, "epoch": 1362} {"train_loss": -11.304998397827148, "global_step": 228928, "epoch": 1362} {"train_loss": -11.11357307434082, "global_step": 228929, "epoch": 1362} {"train_loss": -11.469223022460938, "global_step": 228930, "epoch": 1362} {"train_loss": -10.539822578430176, "global_step": 228931, "epoch": 1362} {"train_loss": -11.234371185302734, "global_step": 228932, "epoch": 1362} {"train_loss": -11.22194766998291, "global_step": 228933, "epoch": 1362} {"train_loss": -10.520195007324219, "global_step": 228934, "epoch": 1362} {"train_loss": -11.676010131835938, "global_step": 228935, "epoch": 1362} {"train_loss": -10.8271484375, "global_step": 228936, "epoch": 1362} {"train_loss": -11.233449935913086, "global_step": 228937, "epoch": 1362} {"train_loss": -11.440749168395996, "global_step": 228938, "epoch": 1362} {"train_loss": -10.749645233154297, "global_step": 228939, "epoch": 1362} {"train_loss": -11.63548469543457, "global_step": 228940, "epoch": 1362} {"train_loss": -10.365123748779297, "global_step": 228941, "epoch": 1362} {"train_loss": -11.341757774353027, "global_step": 228942, "epoch": 1362} {"train_loss": -11.460426330566406, "global_step": 228943, "epoch": 1362} {"train_loss": -11.286011695861816, "global_step": 228944, "epoch": 1362} {"train_loss": -11.400117874145508, "global_step": 228945, "epoch": 1362} {"train_loss": -11.28431510925293, "global_step": 228946, "epoch": 1362} {"train_loss": -11.396785736083984, "global_step": 228947, "epoch": 1362} {"train_loss": -11.378490447998047, "global_step": 228948, "epoch": 1362} {"train_loss": -11.465110778808594, "global_step": 228949, "epoch": 1362} {"train_loss": -11.834967613220215, "global_step": 228950, "epoch": 1362} {"train_loss": -11.258549690246582, "global_step": 228951, "epoch": 1362} {"train_loss": -11.672887802124023, "global_step": 228952, "epoch": 1362} {"train_loss": -11.463590621948242, "global_step": 228953, "epoch": 1362} {"train_loss": -11.724884033203125, "global_step": 228954, "epoch": 1362} {"train_loss": -11.707756042480469, "global_step": 228955, "epoch": 1362} {"train_loss": -11.388677597045898, "global_step": 228956, "epoch": 1362} {"train_loss": -11.490097045898438, "global_step": 228957, "epoch": 1362} {"train_loss": -11.829452514648438, "global_step": 228958, "epoch": 1362} {"train_loss": -11.517528533935547, "global_step": 228959, "epoch": 1362} {"train_loss": -11.791088104248047, "global_step": 228960, "epoch": 1362} {"train_loss": -11.408124923706055, "global_step": 228961, "epoch": 1362} {"train_loss": -11.576086044311523, "global_step": 228962, "epoch": 1362} {"train_loss": -11.490567207336426, "global_step": 228963, "epoch": 1362} {"train_loss": -11.102436065673828, "global_step": 228964, "epoch": 1362} {"train_loss": -11.786808013916016, "global_step": 228965, "epoch": 1362} {"train_loss": -11.464611053466797, "global_step": 228966, "epoch": 1362} {"train_loss": -11.516271591186523, "global_step": 228967, "epoch": 1362} {"train_loss": -11.624815940856934, "global_step": 228968, "epoch": 1362} {"train_loss": -11.56313705444336, "global_step": 228969, "epoch": 1362} {"train_loss": -11.860576629638672, "global_step": 228970, "epoch": 1362} {"train_loss": -11.572366714477539, "global_step": 228971, "epoch": 1362} {"train_loss": -11.619215965270996, "global_step": 228972, "epoch": 1362} {"train_loss": -11.517692565917969, "global_step": 228973, "epoch": 1362} {"train_loss": -11.421038627624512, "global_step": 228974, "epoch": 1362} {"train_loss": -11.880668640136719, "global_step": 228975, "epoch": 1362} {"train_loss": -11.435001373291016, "global_step": 228976, "epoch": 1362} {"train_loss": -11.852724075317383, "global_step": 228977, "epoch": 1362} {"train_loss": -11.565225601196289, "global_step": 228978, "epoch": 1362} {"train_loss": -11.700908660888672, "global_step": 228979, "epoch": 1362} {"train_loss": -11.798351287841797, "global_step": 228980, "epoch": 1362} {"train_loss": -11.655023574829102, "global_step": 228981, "epoch": 1362} {"train_loss": -11.8369140625, "global_step": 228982, "epoch": 1362} {"train_loss": -11.491290120851426, "global_step": 228983, "epoch": 1362, "val_loss": 262789.625} {"train_loss": -11.66597843170166, "global_step": 228984, "epoch": 1363} {"train_loss": -11.506509780883789, "global_step": 228985, "epoch": 1363} {"train_loss": -11.451288223266602, "global_step": 228986, "epoch": 1363} {"train_loss": -11.561592102050781, "global_step": 228987, "epoch": 1363} {"train_loss": -11.84742546081543, "global_step": 228988, "epoch": 1363} {"train_loss": -11.778765678405762, "global_step": 228989, "epoch": 1363} {"train_loss": -11.975190162658691, "global_step": 228990, "epoch": 1363} {"train_loss": -11.739809036254883, "global_step": 228991, "epoch": 1363} {"train_loss": -11.87320327758789, "global_step": 228992, "epoch": 1363} {"train_loss": -11.563146591186523, "global_step": 228993, "epoch": 1363} {"train_loss": -11.821586608886719, "global_step": 228994, "epoch": 1363} {"train_loss": -11.430502891540527, "global_step": 228995, "epoch": 1363} {"train_loss": -11.818403244018555, "global_step": 228996, "epoch": 1363} {"train_loss": -11.555474281311035, "global_step": 228997, "epoch": 1363} {"train_loss": -11.723320960998535, "global_step": 228998, "epoch": 1363} {"train_loss": -11.259050369262695, "global_step": 228999, "epoch": 1363} {"train_loss": -11.851493835449219, "global_step": 229000, "epoch": 1363} {"train_loss": -11.632935523986816, "global_step": 229001, "epoch": 1363} {"train_loss": -11.843881607055664, "global_step": 229002, "epoch": 1363} {"train_loss": -11.240579605102539, "global_step": 229003, "epoch": 1363} {"train_loss": -10.95174789428711, "global_step": 229004, "epoch": 1363} {"train_loss": -11.22752857208252, "global_step": 229005, "epoch": 1363} {"train_loss": -11.168142318725586, "global_step": 229006, "epoch": 1363} {"train_loss": -10.155170440673828, "global_step": 229007, "epoch": 1363} {"train_loss": -11.750602722167969, "global_step": 229008, "epoch": 1363} {"train_loss": -11.443429946899414, "global_step": 229009, "epoch": 1363} {"train_loss": -10.859492301940918, "global_step": 229010, "epoch": 1363} {"train_loss": -11.776463508605957, "global_step": 229011, "epoch": 1363} {"train_loss": -11.016395568847656, "global_step": 229012, "epoch": 1363} {"train_loss": -11.80577278137207, "global_step": 229013, "epoch": 1363} {"train_loss": -10.992846488952637, "global_step": 229014, "epoch": 1363} {"train_loss": -10.877193450927734, "global_step": 229015, "epoch": 1363} {"train_loss": -11.349687576293945, "global_step": 229016, "epoch": 1363} {"train_loss": -11.609582901000977, "global_step": 229017, "epoch": 1363} {"train_loss": -11.322010040283203, "global_step": 229018, "epoch": 1363} {"train_loss": -11.479110717773438, "global_step": 229019, "epoch": 1363} {"train_loss": -11.589138984680176, "global_step": 229020, "epoch": 1363} {"train_loss": -11.756972312927246, "global_step": 229021, "epoch": 1363} {"train_loss": -11.289239883422852, "global_step": 229022, "epoch": 1363} {"train_loss": -11.54490852355957, "global_step": 229023, "epoch": 1363} {"train_loss": -11.658594131469727, "global_step": 229024, "epoch": 1363} {"train_loss": -11.501130104064941, "global_step": 229025, "epoch": 1363} {"train_loss": -11.068157196044922, "global_step": 229026, "epoch": 1363} {"train_loss": -11.63005256652832, "global_step": 229027, "epoch": 1363} {"train_loss": -11.58072566986084, "global_step": 229028, "epoch": 1363} {"train_loss": -11.401044845581055, "global_step": 229029, "epoch": 1363} {"train_loss": -11.698196411132812, "global_step": 229030, "epoch": 1363} {"train_loss": -11.622835159301758, "global_step": 229031, "epoch": 1363} {"train_loss": -11.694594383239746, "global_step": 229032, "epoch": 1363} {"train_loss": -11.525228500366211, "global_step": 229033, "epoch": 1363} {"train_loss": -11.513777732849121, "global_step": 229034, "epoch": 1363} {"train_loss": -11.444580078125, "global_step": 229035, "epoch": 1363} {"train_loss": -11.416085243225098, "global_step": 229036, "epoch": 1363} {"train_loss": -11.52609634399414, "global_step": 229037, "epoch": 1363} {"train_loss": -11.767692565917969, "global_step": 229038, "epoch": 1363} {"train_loss": -11.468290328979492, "global_step": 229039, "epoch": 1363} {"train_loss": -11.692138671875, "global_step": 229040, "epoch": 1363} {"train_loss": -11.618534088134766, "global_step": 229041, "epoch": 1363} {"train_loss": -11.343221664428711, "global_step": 229042, "epoch": 1363} {"train_loss": -10.970142364501953, "global_step": 229043, "epoch": 1363} {"train_loss": -11.596356391906738, "global_step": 229044, "epoch": 1363} {"train_loss": -11.266111373901367, "global_step": 229045, "epoch": 1363} {"train_loss": -11.643585205078125, "global_step": 229046, "epoch": 1363} {"train_loss": -11.404829025268555, "global_step": 229047, "epoch": 1363} {"train_loss": -11.725963592529297, "global_step": 229048, "epoch": 1363} {"train_loss": -11.861661911010742, "global_step": 229049, "epoch": 1363} {"train_loss": -11.696097373962402, "global_step": 229050, "epoch": 1363} {"train_loss": -11.74824333190918, "global_step": 229051, "epoch": 1363} {"train_loss": -11.711278915405273, "global_step": 229052, "epoch": 1363} {"train_loss": -11.70074462890625, "global_step": 229053, "epoch": 1363} {"train_loss": -11.696905136108398, "global_step": 229054, "epoch": 1363} {"train_loss": -11.864585876464844, "global_step": 229055, "epoch": 1363} {"train_loss": -11.93429183959961, "global_step": 229056, "epoch": 1363} {"train_loss": -11.381368637084961, "global_step": 229057, "epoch": 1363} {"train_loss": -11.725532531738281, "global_step": 229058, "epoch": 1363} {"train_loss": -11.321892738342285, "global_step": 229059, "epoch": 1363} {"train_loss": -11.624693870544434, "global_step": 229060, "epoch": 1363} {"train_loss": -11.512516975402832, "global_step": 229061, "epoch": 1363} {"train_loss": -11.705599784851074, "global_step": 229062, "epoch": 1363} {"train_loss": -11.63670825958252, "global_step": 229063, "epoch": 1363} {"train_loss": -11.468957901000977, "global_step": 229064, "epoch": 1363} {"train_loss": -11.532973289489746, "global_step": 229065, "epoch": 1363} {"train_loss": -11.764724731445312, "global_step": 229066, "epoch": 1363} {"train_loss": -11.745258331298828, "global_step": 229067, "epoch": 1363} {"train_loss": -11.555559158325195, "global_step": 229068, "epoch": 1363} {"train_loss": -11.91566276550293, "global_step": 229069, "epoch": 1363} {"train_loss": -11.687627792358398, "global_step": 229070, "epoch": 1363} {"train_loss": -11.845977783203125, "global_step": 229071, "epoch": 1363} {"train_loss": -11.691120147705078, "global_step": 229072, "epoch": 1363} {"train_loss": -11.785909652709961, "global_step": 229073, "epoch": 1363} {"train_loss": -12.000214576721191, "global_step": 229074, "epoch": 1363} {"train_loss": -11.587188720703125, "global_step": 229075, "epoch": 1363} {"train_loss": -11.849878311157227, "global_step": 229076, "epoch": 1363} {"train_loss": -11.971773147583008, "global_step": 229077, "epoch": 1363} {"train_loss": -11.99135971069336, "global_step": 229078, "epoch": 1363} {"train_loss": -11.884138107299805, "global_step": 229079, "epoch": 1363} {"train_loss": -11.710628509521484, "global_step": 229080, "epoch": 1363} {"train_loss": -11.780740737915039, "global_step": 229081, "epoch": 1363} {"train_loss": -11.926823616027832, "global_step": 229082, "epoch": 1363} {"train_loss": -11.663818359375, "global_step": 229083, "epoch": 1363} {"train_loss": -11.367663383483887, "global_step": 229084, "epoch": 1363} {"train_loss": -11.860486030578613, "global_step": 229085, "epoch": 1363} {"train_loss": -11.69214916229248, "global_step": 229086, "epoch": 1363} {"train_loss": -11.639810562133789, "global_step": 229087, "epoch": 1363} {"train_loss": -11.783772468566895, "global_step": 229088, "epoch": 1363} {"train_loss": -12.013201713562012, "global_step": 229089, "epoch": 1363} {"train_loss": -11.850882530212402, "global_step": 229090, "epoch": 1363} {"train_loss": -12.000187873840332, "global_step": 229091, "epoch": 1363} {"train_loss": -12.020931243896484, "global_step": 229092, "epoch": 1363} {"train_loss": -12.004788398742676, "global_step": 229093, "epoch": 1363} {"train_loss": -11.714814186096191, "global_step": 229094, "epoch": 1363} {"train_loss": -11.761116027832031, "global_step": 229095, "epoch": 1363} {"train_loss": -12.011981964111328, "global_step": 229096, "epoch": 1363} {"train_loss": -12.037919998168945, "global_step": 229097, "epoch": 1363} {"train_loss": -11.886802673339844, "global_step": 229098, "epoch": 1363} {"train_loss": -11.97433090209961, "global_step": 229099, "epoch": 1363} {"train_loss": -11.827280044555664, "global_step": 229100, "epoch": 1363} {"train_loss": -11.533470153808594, "global_step": 229101, "epoch": 1363} {"train_loss": -11.86771011352539, "global_step": 229102, "epoch": 1363} {"train_loss": -11.943580627441406, "global_step": 229103, "epoch": 1363} {"train_loss": -11.948257446289062, "global_step": 229104, "epoch": 1363} {"train_loss": -11.770821571350098, "global_step": 229105, "epoch": 1363} {"train_loss": -12.059328079223633, "global_step": 229106, "epoch": 1363} {"train_loss": -12.027359962463379, "global_step": 229107, "epoch": 1363} {"train_loss": -11.900262832641602, "global_step": 229108, "epoch": 1363} {"train_loss": -11.838712692260742, "global_step": 229109, "epoch": 1363} {"train_loss": -11.97640609741211, "global_step": 229110, "epoch": 1363} {"train_loss": -11.440235137939453, "global_step": 229111, "epoch": 1363} {"train_loss": -11.989045143127441, "global_step": 229112, "epoch": 1363} {"train_loss": -11.641144752502441, "global_step": 229113, "epoch": 1363} {"train_loss": -11.839487075805664, "global_step": 229114, "epoch": 1363} {"train_loss": -11.652643203735352, "global_step": 229115, "epoch": 1363} {"train_loss": -12.089973449707031, "global_step": 229116, "epoch": 1363} {"train_loss": -12.004461288452148, "global_step": 229117, "epoch": 1363} {"train_loss": -12.17152214050293, "global_step": 229118, "epoch": 1363} {"train_loss": -11.636871337890625, "global_step": 229119, "epoch": 1363} {"train_loss": -11.602840423583984, "global_step": 229120, "epoch": 1363} {"train_loss": -11.191353797912598, "global_step": 229121, "epoch": 1363} {"train_loss": -12.060968399047852, "global_step": 229122, "epoch": 1363} {"train_loss": -11.171562194824219, "global_step": 229123, "epoch": 1363} {"train_loss": -10.606673240661621, "global_step": 229124, "epoch": 1363} {"train_loss": -10.895465850830078, "global_step": 229125, "epoch": 1363} {"train_loss": -11.772664070129395, "global_step": 229126, "epoch": 1363} {"train_loss": -11.750085830688477, "global_step": 229127, "epoch": 1363} {"train_loss": -11.401079177856445, "global_step": 229128, "epoch": 1363} {"train_loss": -11.067025184631348, "global_step": 229129, "epoch": 1363} {"train_loss": -11.141042709350586, "global_step": 229130, "epoch": 1363} {"train_loss": -10.81890869140625, "global_step": 229131, "epoch": 1363} {"train_loss": -11.872964859008789, "global_step": 229132, "epoch": 1363} {"train_loss": -11.270952224731445, "global_step": 229133, "epoch": 1363} {"train_loss": -11.17941951751709, "global_step": 229134, "epoch": 1363} {"train_loss": -11.114944458007812, "global_step": 229135, "epoch": 1363} {"train_loss": -10.47836971282959, "global_step": 229136, "epoch": 1363} {"train_loss": -9.567140579223633, "global_step": 229137, "epoch": 1363} {"train_loss": -9.540252685546875, "global_step": 229138, "epoch": 1363} {"train_loss": -9.044578552246094, "global_step": 229139, "epoch": 1363} {"train_loss": -9.175520896911621, "global_step": 229140, "epoch": 1363} {"train_loss": -7.378236770629883, "global_step": 229141, "epoch": 1363} {"train_loss": -7.7907257080078125, "global_step": 229142, "epoch": 1363} {"train_loss": -8.784098625183105, "global_step": 229143, "epoch": 1363} {"train_loss": -8.795787811279297, "global_step": 229144, "epoch": 1363} {"train_loss": -9.009766578674316, "global_step": 229145, "epoch": 1363} {"train_loss": -7.441728591918945, "global_step": 229146, "epoch": 1363} {"train_loss": -8.240907669067383, "global_step": 229147, "epoch": 1363} {"train_loss": -8.739578247070312, "global_step": 229148, "epoch": 1363} {"train_loss": -10.592636108398438, "global_step": 229149, "epoch": 1363} {"train_loss": -8.615303993225098, "global_step": 229150, "epoch": 1363} {"train_loss": -11.36129263469151, "global_step": 229151, "epoch": 1363, "val_loss": 258565.453125} {"train_loss": -9.404504776000977, "global_step": 229152, "epoch": 1364} {"train_loss": -10.589797019958496, "global_step": 229153, "epoch": 1364} {"train_loss": -8.913436889648438, "global_step": 229154, "epoch": 1364} {"train_loss": -10.427862167358398, "global_step": 229155, "epoch": 1364} {"train_loss": -9.698883056640625, "global_step": 229156, "epoch": 1364} {"train_loss": -9.931684494018555, "global_step": 229157, "epoch": 1364} {"train_loss": -10.084766387939453, "global_step": 229158, "epoch": 1364} {"train_loss": -10.19569206237793, "global_step": 229159, "epoch": 1364} {"train_loss": -10.143331527709961, "global_step": 229160, "epoch": 1364} {"train_loss": -10.144683837890625, "global_step": 229161, "epoch": 1364} {"train_loss": -10.638388633728027, "global_step": 229162, "epoch": 1364} {"train_loss": -9.785152435302734, "global_step": 229163, "epoch": 1364} {"train_loss": -10.846511840820312, "global_step": 229164, "epoch": 1364} {"train_loss": -11.025182723999023, "global_step": 229165, "epoch": 1364} {"train_loss": -10.21636962890625, "global_step": 229166, "epoch": 1364} {"train_loss": -11.007080078125, "global_step": 229167, "epoch": 1364} {"train_loss": -10.595622062683105, "global_step": 229168, "epoch": 1364} {"train_loss": -10.739011764526367, "global_step": 229169, "epoch": 1364} {"train_loss": -11.026182174682617, "global_step": 229170, "epoch": 1364} {"train_loss": -10.56640338897705, "global_step": 229171, "epoch": 1364} {"train_loss": -10.824930191040039, "global_step": 229172, "epoch": 1364} {"train_loss": -11.021163940429688, "global_step": 229173, "epoch": 1364} {"train_loss": -10.917459487915039, "global_step": 229174, "epoch": 1364} {"train_loss": -11.099072456359863, "global_step": 229175, "epoch": 1364} {"train_loss": -11.262319564819336, "global_step": 229176, "epoch": 1364} {"train_loss": -11.220255851745605, "global_step": 229177, "epoch": 1364} {"train_loss": -11.366679191589355, "global_step": 229178, "epoch": 1364} {"train_loss": -11.181413650512695, "global_step": 229179, "epoch": 1364} {"train_loss": -11.2124662399292, "global_step": 229180, "epoch": 1364} {"train_loss": -11.431098937988281, "global_step": 229181, "epoch": 1364} {"train_loss": -10.989728927612305, "global_step": 229182, "epoch": 1364} {"train_loss": -11.518241882324219, "global_step": 229183, "epoch": 1364} {"train_loss": -11.39545726776123, "global_step": 229184, "epoch": 1364} {"train_loss": -11.400857925415039, "global_step": 229185, "epoch": 1364} {"train_loss": -11.222700119018555, "global_step": 229186, "epoch": 1364} {"train_loss": -11.192927360534668, "global_step": 229187, "epoch": 1364} {"train_loss": -11.453290939331055, "global_step": 229188, "epoch": 1364} {"train_loss": -11.225772857666016, "global_step": 229189, "epoch": 1364} {"train_loss": -11.41778564453125, "global_step": 229190, "epoch": 1364} {"train_loss": -11.359764099121094, "global_step": 229191, "epoch": 1364} {"train_loss": -11.601987838745117, "global_step": 229192, "epoch": 1364} {"train_loss": -11.513351440429688, "global_step": 229193, "epoch": 1364} {"train_loss": -11.597078323364258, "global_step": 229194, "epoch": 1364} {"train_loss": -11.360723495483398, "global_step": 229195, "epoch": 1364} {"train_loss": -11.669990539550781, "global_step": 229196, "epoch": 1364} {"train_loss": -11.605674743652344, "global_step": 229197, "epoch": 1364} {"train_loss": -11.422307968139648, "global_step": 229198, "epoch": 1364} {"train_loss": -11.626935005187988, "global_step": 229199, "epoch": 1364} {"train_loss": -11.394006729125977, "global_step": 229200, "epoch": 1364} {"train_loss": -11.602556228637695, "global_step": 229201, "epoch": 1364} {"train_loss": -11.588724136352539, "global_step": 229202, "epoch": 1364} {"train_loss": -11.868850708007812, "global_step": 229203, "epoch": 1364} {"train_loss": -11.629045486450195, "global_step": 229204, "epoch": 1364} {"train_loss": -11.765934944152832, "global_step": 229205, "epoch": 1364} {"train_loss": -11.664339065551758, "global_step": 229206, "epoch": 1364} {"train_loss": -11.649539947509766, "global_step": 229207, "epoch": 1364} {"train_loss": -11.58791732788086, "global_step": 229208, "epoch": 1364} {"train_loss": -11.742372512817383, "global_step": 229209, "epoch": 1364} {"train_loss": -11.825141906738281, "global_step": 229210, "epoch": 1364} {"train_loss": -11.799076080322266, "global_step": 229211, "epoch": 1364} {"train_loss": -11.815553665161133, "global_step": 229212, "epoch": 1364} {"train_loss": -11.83209228515625, "global_step": 229213, "epoch": 1364} {"train_loss": -11.715139389038086, "global_step": 229214, "epoch": 1364} {"train_loss": -11.802774429321289, "global_step": 229215, "epoch": 1364} {"train_loss": -11.808591842651367, "global_step": 229216, "epoch": 1364} {"train_loss": -11.7543306350708, "global_step": 229217, "epoch": 1364} {"train_loss": -11.962396621704102, "global_step": 229218, "epoch": 1364} {"train_loss": -11.784517288208008, "global_step": 229219, "epoch": 1364} {"train_loss": -11.792484283447266, "global_step": 229220, "epoch": 1364} {"train_loss": -11.736679077148438, "global_step": 229221, "epoch": 1364} {"train_loss": -11.770593643188477, "global_step": 229222, "epoch": 1364} {"train_loss": -11.711073875427246, "global_step": 229223, "epoch": 1364} {"train_loss": -11.894014358520508, "global_step": 229224, "epoch": 1364} {"train_loss": -11.871814727783203, "global_step": 229225, "epoch": 1364} {"train_loss": -11.900508880615234, "global_step": 229226, "epoch": 1364} {"train_loss": -11.724669456481934, "global_step": 229227, "epoch": 1364} {"train_loss": -12.058820724487305, "global_step": 229228, "epoch": 1364} {"train_loss": -11.82787799835205, "global_step": 229229, "epoch": 1364} {"train_loss": -11.776662826538086, "global_step": 229230, "epoch": 1364} {"train_loss": -12.045555114746094, "global_step": 229231, "epoch": 1364} {"train_loss": -11.843093872070312, "global_step": 229232, "epoch": 1364} {"train_loss": -11.790594100952148, "global_step": 229233, "epoch": 1364} {"train_loss": -11.950037002563477, "global_step": 229234, "epoch": 1364} {"train_loss": -11.765615463256836, "global_step": 229235, "epoch": 1364} {"train_loss": -12.215068817138672, "global_step": 229236, "epoch": 1364} {"train_loss": -12.036611557006836, "global_step": 229237, "epoch": 1364} {"train_loss": -12.004669189453125, "global_step": 229238, "epoch": 1364} {"train_loss": -11.87562370300293, "global_step": 229239, "epoch": 1364} {"train_loss": -12.16975212097168, "global_step": 229240, "epoch": 1364} {"train_loss": -12.008934020996094, "global_step": 229241, "epoch": 1364} {"train_loss": -11.975957870483398, "global_step": 229242, "epoch": 1364} {"train_loss": -11.986577987670898, "global_step": 229243, "epoch": 1364} {"train_loss": -12.192235946655273, "global_step": 229244, "epoch": 1364} {"train_loss": -11.889135360717773, "global_step": 229245, "epoch": 1364} {"train_loss": -11.968767166137695, "global_step": 229246, "epoch": 1364} {"train_loss": -11.968011856079102, "global_step": 229247, "epoch": 1364} {"train_loss": -11.976806640625, "global_step": 229248, "epoch": 1364} {"train_loss": -12.0187349319458, "global_step": 229249, "epoch": 1364} {"train_loss": -11.844165802001953, "global_step": 229250, "epoch": 1364} {"train_loss": -11.544220924377441, "global_step": 229251, "epoch": 1364} {"train_loss": -12.032092094421387, "global_step": 229252, "epoch": 1364} {"train_loss": -11.766112327575684, "global_step": 229253, "epoch": 1364} {"train_loss": -11.822585105895996, "global_step": 229254, "epoch": 1364} {"train_loss": -11.681427001953125, "global_step": 229255, "epoch": 1364} {"train_loss": -11.24418830871582, "global_step": 229256, "epoch": 1364} {"train_loss": -10.558897018432617, "global_step": 229257, "epoch": 1364} {"train_loss": -10.450468063354492, "global_step": 229258, "epoch": 1364} {"train_loss": -11.489486694335938, "global_step": 229259, "epoch": 1364} {"train_loss": -11.12189769744873, "global_step": 229260, "epoch": 1364} {"train_loss": -10.518745422363281, "global_step": 229261, "epoch": 1364} {"train_loss": -10.075884819030762, "global_step": 229262, "epoch": 1364} {"train_loss": -10.052582740783691, "global_step": 229263, "epoch": 1364} {"train_loss": -10.96022891998291, "global_step": 229264, "epoch": 1364} {"train_loss": -8.735902786254883, "global_step": 229265, "epoch": 1364} {"train_loss": -8.544408798217773, "global_step": 229266, "epoch": 1364} {"train_loss": -10.44304084777832, "global_step": 229267, "epoch": 1364} {"train_loss": -9.001599311828613, "global_step": 229268, "epoch": 1364} {"train_loss": -9.520434379577637, "global_step": 229269, "epoch": 1364} {"train_loss": -9.458667755126953, "global_step": 229270, "epoch": 1364} {"train_loss": -7.259634494781494, "global_step": 229271, "epoch": 1364} {"train_loss": -8.662322998046875, "global_step": 229272, "epoch": 1364} {"train_loss": -9.598039627075195, "global_step": 229273, "epoch": 1364} {"train_loss": -10.117088317871094, "global_step": 229274, "epoch": 1364} {"train_loss": -8.909984588623047, "global_step": 229275, "epoch": 1364} {"train_loss": -10.320765495300293, "global_step": 229276, "epoch": 1364} {"train_loss": -10.350797653198242, "global_step": 229277, "epoch": 1364} {"train_loss": -9.240545272827148, "global_step": 229278, "epoch": 1364} {"train_loss": -10.615615844726562, "global_step": 229279, "epoch": 1364} {"train_loss": -9.903922080993652, "global_step": 229280, "epoch": 1364} {"train_loss": -10.003154754638672, "global_step": 229281, "epoch": 1364} {"train_loss": -10.690140724182129, "global_step": 229282, "epoch": 1364} {"train_loss": -10.735692977905273, "global_step": 229283, "epoch": 1364} {"train_loss": -10.284770011901855, "global_step": 229284, "epoch": 1364} {"train_loss": -11.078386306762695, "global_step": 229285, "epoch": 1364} {"train_loss": -10.818410873413086, "global_step": 229286, "epoch": 1364} {"train_loss": -10.876557350158691, "global_step": 229287, "epoch": 1364} {"train_loss": -11.1407470703125, "global_step": 229288, "epoch": 1364} {"train_loss": -11.169761657714844, "global_step": 229289, "epoch": 1364} {"train_loss": -10.912896156311035, "global_step": 229290, "epoch": 1364} {"train_loss": -11.102117538452148, "global_step": 229291, "epoch": 1364} {"train_loss": -11.423250198364258, "global_step": 229292, "epoch": 1364} {"train_loss": -11.344093322753906, "global_step": 229293, "epoch": 1364} {"train_loss": -11.15922737121582, "global_step": 229294, "epoch": 1364} {"train_loss": -11.49161148071289, "global_step": 229295, "epoch": 1364} {"train_loss": -11.465633392333984, "global_step": 229296, "epoch": 1364} {"train_loss": -11.406961441040039, "global_step": 229297, "epoch": 1364} {"train_loss": -11.53382682800293, "global_step": 229298, "epoch": 1364} {"train_loss": -11.380542755126953, "global_step": 229299, "epoch": 1364} {"train_loss": -11.231407165527344, "global_step": 229300, "epoch": 1364} {"train_loss": -11.39975357055664, "global_step": 229301, "epoch": 1364} {"train_loss": -11.383027076721191, "global_step": 229302, "epoch": 1364} {"train_loss": -11.099430084228516, "global_step": 229303, "epoch": 1364} {"train_loss": -11.467187881469727, "global_step": 229304, "epoch": 1364} {"train_loss": -11.348344802856445, "global_step": 229305, "epoch": 1364} {"train_loss": -11.437936782836914, "global_step": 229306, "epoch": 1364} {"train_loss": -11.529947280883789, "global_step": 229307, "epoch": 1364} {"train_loss": -11.447101593017578, "global_step": 229308, "epoch": 1364} {"train_loss": -11.501441955566406, "global_step": 229309, "epoch": 1364} {"train_loss": -11.38679313659668, "global_step": 229310, "epoch": 1364} {"train_loss": -11.49142837524414, "global_step": 229311, "epoch": 1364} {"train_loss": -11.418550491333008, "global_step": 229312, "epoch": 1364} {"train_loss": -11.652342796325684, "global_step": 229313, "epoch": 1364} {"train_loss": -11.533958435058594, "global_step": 229314, "epoch": 1364} {"train_loss": -11.461999893188477, "global_step": 229315, "epoch": 1364} {"train_loss": -11.816692352294922, "global_step": 229316, "epoch": 1364} {"train_loss": -11.498628616333008, "global_step": 229317, "epoch": 1364} {"train_loss": -11.664897918701172, "global_step": 229318, "epoch": 1364} {"train_loss": -11.147461121990567, "global_step": 229319, "epoch": 1364, "val_loss": 251107.1875} {"train_loss": -11.560151100158691, "global_step": 229320, "epoch": 1365} {"train_loss": -11.513693809509277, "global_step": 229321, "epoch": 1365} {"train_loss": -11.306103706359863, "global_step": 229322, "epoch": 1365} {"train_loss": -11.535585403442383, "global_step": 229323, "epoch": 1365} {"train_loss": -11.63875961303711, "global_step": 229324, "epoch": 1365} {"train_loss": -11.36638355255127, "global_step": 229325, "epoch": 1365} {"train_loss": -11.379339218139648, "global_step": 229326, "epoch": 1365} {"train_loss": -11.731857299804688, "global_step": 229327, "epoch": 1365} {"train_loss": -11.296380043029785, "global_step": 229328, "epoch": 1365} {"train_loss": -11.73827075958252, "global_step": 229329, "epoch": 1365} {"train_loss": -11.527993202209473, "global_step": 229330, "epoch": 1365} {"train_loss": -11.807132720947266, "global_step": 229331, "epoch": 1365} {"train_loss": -11.256362915039062, "global_step": 229332, "epoch": 1365} {"train_loss": -11.376139640808105, "global_step": 229333, "epoch": 1365} {"train_loss": -11.81793212890625, "global_step": 229334, "epoch": 1365} {"train_loss": -11.784385681152344, "global_step": 229335, "epoch": 1365} {"train_loss": -11.661886215209961, "global_step": 229336, "epoch": 1365} {"train_loss": -11.81974983215332, "global_step": 229337, "epoch": 1365} {"train_loss": -11.482946395874023, "global_step": 229338, "epoch": 1365} {"train_loss": -11.38843059539795, "global_step": 229339, "epoch": 1365} {"train_loss": -11.85285758972168, "global_step": 229340, "epoch": 1365} {"train_loss": -11.73183822631836, "global_step": 229341, "epoch": 1365} {"train_loss": -11.691841125488281, "global_step": 229342, "epoch": 1365} {"train_loss": -11.746874809265137, "global_step": 229343, "epoch": 1365} {"train_loss": -11.687633514404297, "global_step": 229344, "epoch": 1365} {"train_loss": -11.670821189880371, "global_step": 229345, "epoch": 1365} {"train_loss": -11.871201515197754, "global_step": 229346, "epoch": 1365} {"train_loss": -11.532238006591797, "global_step": 229347, "epoch": 1365} {"train_loss": -11.589357376098633, "global_step": 229348, "epoch": 1365} {"train_loss": -11.746160507202148, "global_step": 229349, "epoch": 1365} {"train_loss": -11.733720779418945, "global_step": 229350, "epoch": 1365} {"train_loss": -11.748939514160156, "global_step": 229351, "epoch": 1365} {"train_loss": -11.74128532409668, "global_step": 229352, "epoch": 1365} {"train_loss": -11.713200569152832, "global_step": 229353, "epoch": 1365} {"train_loss": -12.029108047485352, "global_step": 229354, "epoch": 1365} {"train_loss": -11.844583511352539, "global_step": 229355, "epoch": 1365} {"train_loss": -11.578156471252441, "global_step": 229356, "epoch": 1365} {"train_loss": -11.819195747375488, "global_step": 229357, "epoch": 1365} {"train_loss": -11.678972244262695, "global_step": 229358, "epoch": 1365} {"train_loss": -11.858415603637695, "global_step": 229359, "epoch": 1365} {"train_loss": -11.654193878173828, "global_step": 229360, "epoch": 1365} {"train_loss": -11.540006637573242, "global_step": 229361, "epoch": 1365} {"train_loss": -11.389766693115234, "global_step": 229362, "epoch": 1365} {"train_loss": -12.03155517578125, "global_step": 229363, "epoch": 1365} {"train_loss": -11.344446182250977, "global_step": 229364, "epoch": 1365} {"train_loss": -11.465424537658691, "global_step": 229365, "epoch": 1365} {"train_loss": -11.31756591796875, "global_step": 229366, "epoch": 1365} {"train_loss": -10.699247360229492, "global_step": 229367, "epoch": 1365} {"train_loss": -10.462638854980469, "global_step": 229368, "epoch": 1365} {"train_loss": -11.421661376953125, "global_step": 229369, "epoch": 1365} {"train_loss": -10.425418853759766, "global_step": 229370, "epoch": 1365} {"train_loss": -10.730874061584473, "global_step": 229371, "epoch": 1365} {"train_loss": -11.032100677490234, "global_step": 229372, "epoch": 1365} {"train_loss": -11.146324157714844, "global_step": 229373, "epoch": 1365} {"train_loss": -11.292703628540039, "global_step": 229374, "epoch": 1365} {"train_loss": -11.09945011138916, "global_step": 229375, "epoch": 1365} {"train_loss": -11.403375625610352, "global_step": 229376, "epoch": 1365} {"train_loss": -11.776765823364258, "global_step": 229377, "epoch": 1365} {"train_loss": -11.266651153564453, "global_step": 229378, "epoch": 1365} {"train_loss": -11.55881404876709, "global_step": 229379, "epoch": 1365} {"train_loss": -11.41627311706543, "global_step": 229380, "epoch": 1365} {"train_loss": -11.414570808410645, "global_step": 229381, "epoch": 1365} {"train_loss": -11.664586067199707, "global_step": 229382, "epoch": 1365} {"train_loss": -11.122015953063965, "global_step": 229383, "epoch": 1365} {"train_loss": -11.603398323059082, "global_step": 229384, "epoch": 1365} {"train_loss": -11.439498901367188, "global_step": 229385, "epoch": 1365} {"train_loss": -11.69443130493164, "global_step": 229386, "epoch": 1365} {"train_loss": -11.38638687133789, "global_step": 229387, "epoch": 1365} {"train_loss": -11.237689971923828, "global_step": 229388, "epoch": 1365} {"train_loss": -11.443340301513672, "global_step": 229389, "epoch": 1365} {"train_loss": -11.13976001739502, "global_step": 229390, "epoch": 1365} {"train_loss": -11.738967895507812, "global_step": 229391, "epoch": 1365} {"train_loss": -11.46566390991211, "global_step": 229392, "epoch": 1365} {"train_loss": -11.158879280090332, "global_step": 229393, "epoch": 1365} {"train_loss": -11.491823196411133, "global_step": 229394, "epoch": 1365} {"train_loss": -11.453117370605469, "global_step": 229395, "epoch": 1365} {"train_loss": -11.646498680114746, "global_step": 229396, "epoch": 1365} {"train_loss": -11.70657730102539, "global_step": 229397, "epoch": 1365} {"train_loss": -11.617712020874023, "global_step": 229398, "epoch": 1365} {"train_loss": -11.625694274902344, "global_step": 229399, "epoch": 1365} {"train_loss": -11.491146087646484, "global_step": 229400, "epoch": 1365} {"train_loss": -11.591885566711426, "global_step": 229401, "epoch": 1365} {"train_loss": -11.176835060119629, "global_step": 229402, "epoch": 1365} {"train_loss": -11.991621017456055, "global_step": 229403, "epoch": 1365} {"train_loss": -11.736492156982422, "global_step": 229404, "epoch": 1365} {"train_loss": -11.648575782775879, "global_step": 229405, "epoch": 1365} {"train_loss": -11.637991905212402, "global_step": 229406, "epoch": 1365} {"train_loss": -11.378201484680176, "global_step": 229407, "epoch": 1365} {"train_loss": -11.66691780090332, "global_step": 229408, "epoch": 1365} {"train_loss": -11.070514678955078, "global_step": 229409, "epoch": 1365} {"train_loss": -11.734315872192383, "global_step": 229410, "epoch": 1365} {"train_loss": -11.02118968963623, "global_step": 229411, "epoch": 1365} {"train_loss": -11.539386749267578, "global_step": 229412, "epoch": 1365} {"train_loss": -11.092937469482422, "global_step": 229413, "epoch": 1365} {"train_loss": -11.180909156799316, "global_step": 229414, "epoch": 1365} {"train_loss": -10.633295059204102, "global_step": 229415, "epoch": 1365} {"train_loss": -11.739399909973145, "global_step": 229416, "epoch": 1365} {"train_loss": -11.05023193359375, "global_step": 229417, "epoch": 1365} {"train_loss": -11.707542419433594, "global_step": 229418, "epoch": 1365} {"train_loss": -11.007333755493164, "global_step": 229419, "epoch": 1365} {"train_loss": -11.467877388000488, "global_step": 229420, "epoch": 1365} {"train_loss": -11.320656776428223, "global_step": 229421, "epoch": 1365} {"train_loss": -11.301136016845703, "global_step": 229422, "epoch": 1365} {"train_loss": -11.547236442565918, "global_step": 229423, "epoch": 1365} {"train_loss": -11.40573501586914, "global_step": 229424, "epoch": 1365} {"train_loss": -11.277557373046875, "global_step": 229425, "epoch": 1365} {"train_loss": -11.752873420715332, "global_step": 229426, "epoch": 1365} {"train_loss": -10.961633682250977, "global_step": 229427, "epoch": 1365} {"train_loss": -11.672208786010742, "global_step": 229428, "epoch": 1365} {"train_loss": -10.844383239746094, "global_step": 229429, "epoch": 1365} {"train_loss": -11.291257858276367, "global_step": 229430, "epoch": 1365} {"train_loss": -10.60495376586914, "global_step": 229431, "epoch": 1365} {"train_loss": -11.021156311035156, "global_step": 229432, "epoch": 1365} {"train_loss": -10.460784912109375, "global_step": 229433, "epoch": 1365} {"train_loss": -10.960763931274414, "global_step": 229434, "epoch": 1365} {"train_loss": -11.283773422241211, "global_step": 229435, "epoch": 1365} {"train_loss": -11.055169105529785, "global_step": 229436, "epoch": 1365} {"train_loss": -11.12419319152832, "global_step": 229437, "epoch": 1365} {"train_loss": -11.441990852355957, "global_step": 229438, "epoch": 1365} {"train_loss": -11.108688354492188, "global_step": 229439, "epoch": 1365} {"train_loss": -11.477438926696777, "global_step": 229440, "epoch": 1365} {"train_loss": -11.722827911376953, "global_step": 229441, "epoch": 1365} {"train_loss": -11.363700866699219, "global_step": 229442, "epoch": 1365} {"train_loss": -11.564044952392578, "global_step": 229443, "epoch": 1365} {"train_loss": -11.770378112792969, "global_step": 229444, "epoch": 1365} {"train_loss": -11.329212188720703, "global_step": 229445, "epoch": 1365} {"train_loss": -11.745553970336914, "global_step": 229446, "epoch": 1365} {"train_loss": -11.581069946289062, "global_step": 229447, "epoch": 1365} {"train_loss": -11.683298110961914, "global_step": 229448, "epoch": 1365} {"train_loss": -11.716466903686523, "global_step": 229449, "epoch": 1365} {"train_loss": -11.710893630981445, "global_step": 229450, "epoch": 1365} {"train_loss": -11.603286743164062, "global_step": 229451, "epoch": 1365} {"train_loss": -11.455551147460938, "global_step": 229452, "epoch": 1365} {"train_loss": -11.276287078857422, "global_step": 229453, "epoch": 1365} {"train_loss": -11.559089660644531, "global_step": 229454, "epoch": 1365} {"train_loss": -11.391997337341309, "global_step": 229455, "epoch": 1365} {"train_loss": -11.434672355651855, "global_step": 229456, "epoch": 1365} {"train_loss": -11.893836975097656, "global_step": 229457, "epoch": 1365} {"train_loss": -11.416240692138672, "global_step": 229458, "epoch": 1365} {"train_loss": -11.693958282470703, "global_step": 229459, "epoch": 1365} {"train_loss": -11.69565200805664, "global_step": 229460, "epoch": 1365} {"train_loss": -11.570232391357422, "global_step": 229461, "epoch": 1365} {"train_loss": -11.542269706726074, "global_step": 229462, "epoch": 1365} {"train_loss": -11.442727088928223, "global_step": 229463, "epoch": 1365} {"train_loss": -11.631813049316406, "global_step": 229464, "epoch": 1365} {"train_loss": -11.513204574584961, "global_step": 229465, "epoch": 1365} {"train_loss": -11.512121200561523, "global_step": 229466, "epoch": 1365} {"train_loss": -11.42497730255127, "global_step": 229467, "epoch": 1365} {"train_loss": -11.140274047851562, "global_step": 229468, "epoch": 1365} {"train_loss": -11.644156455993652, "global_step": 229469, "epoch": 1365} {"train_loss": -11.517265319824219, "global_step": 229470, "epoch": 1365} {"train_loss": -11.743758201599121, "global_step": 229471, "epoch": 1365} {"train_loss": -11.555893898010254, "global_step": 229472, "epoch": 1365} {"train_loss": -11.617963790893555, "global_step": 229473, "epoch": 1365} {"train_loss": -11.225381851196289, "global_step": 229474, "epoch": 1365} {"train_loss": -11.666009902954102, "global_step": 229475, "epoch": 1365} {"train_loss": -11.206903457641602, "global_step": 229476, "epoch": 1365} {"train_loss": -11.583940505981445, "global_step": 229477, "epoch": 1365} {"train_loss": -11.618082046508789, "global_step": 229478, "epoch": 1365} {"train_loss": -11.060785293579102, "global_step": 229479, "epoch": 1365} {"train_loss": -11.578418731689453, "global_step": 229480, "epoch": 1365} {"train_loss": -11.09393310546875, "global_step": 229481, "epoch": 1365} {"train_loss": -10.777957916259766, "global_step": 229482, "epoch": 1365} {"train_loss": -10.733938217163086, "global_step": 229483, "epoch": 1365} {"train_loss": -11.210650444030762, "global_step": 229484, "epoch": 1365} {"train_loss": -10.567817687988281, "global_step": 229485, "epoch": 1365} {"train_loss": -11.020133018493652, "global_step": 229486, "epoch": 1365} {"train_loss": -11.436803925605048, "global_step": 229487, "epoch": 1365, "val_loss": 257341.546875, "train_action_mse_error": 1.6286520957946777} {"train_loss": -10.365357398986816, "global_step": 229488, "epoch": 1366} {"train_loss": -11.0502347946167, "global_step": 229489, "epoch": 1366} {"train_loss": -10.645794868469238, "global_step": 229490, "epoch": 1366} {"train_loss": -11.16504192352295, "global_step": 229491, "epoch": 1366} {"train_loss": -11.103008270263672, "global_step": 229492, "epoch": 1366} {"train_loss": -10.6936616897583, "global_step": 229493, "epoch": 1366} {"train_loss": -11.650023460388184, "global_step": 229494, "epoch": 1366} {"train_loss": -11.13618278503418, "global_step": 229495, "epoch": 1366} {"train_loss": -11.197463989257812, "global_step": 229496, "epoch": 1366} {"train_loss": -11.142240524291992, "global_step": 229497, "epoch": 1366} {"train_loss": -11.319021224975586, "global_step": 229498, "epoch": 1366} {"train_loss": -11.593659400939941, "global_step": 229499, "epoch": 1366} {"train_loss": -11.326250076293945, "global_step": 229500, "epoch": 1366} {"train_loss": -11.387331008911133, "global_step": 229501, "epoch": 1366} {"train_loss": -11.773765563964844, "global_step": 229502, "epoch": 1366} {"train_loss": -11.36098861694336, "global_step": 229503, "epoch": 1366} {"train_loss": -11.537538528442383, "global_step": 229504, "epoch": 1366} {"train_loss": -11.455890655517578, "global_step": 229505, "epoch": 1366} {"train_loss": -11.613338470458984, "global_step": 229506, "epoch": 1366} {"train_loss": -11.483028411865234, "global_step": 229507, "epoch": 1366} {"train_loss": -11.75273323059082, "global_step": 229508, "epoch": 1366} {"train_loss": -11.642755508422852, "global_step": 229509, "epoch": 1366} {"train_loss": -11.584556579589844, "global_step": 229510, "epoch": 1366} {"train_loss": -11.347187042236328, "global_step": 229511, "epoch": 1366} {"train_loss": -11.509744644165039, "global_step": 229512, "epoch": 1366} {"train_loss": -11.582468032836914, "global_step": 229513, "epoch": 1366} {"train_loss": -11.772378921508789, "global_step": 229514, "epoch": 1366} {"train_loss": -11.748939514160156, "global_step": 229515, "epoch": 1366} {"train_loss": -11.620150566101074, "global_step": 229516, "epoch": 1366} {"train_loss": -11.585296630859375, "global_step": 229517, "epoch": 1366} {"train_loss": -11.71733283996582, "global_step": 229518, "epoch": 1366} {"train_loss": -11.687332153320312, "global_step": 229519, "epoch": 1366} {"train_loss": -11.692205429077148, "global_step": 229520, "epoch": 1366} {"train_loss": -11.839761734008789, "global_step": 229521, "epoch": 1366} {"train_loss": -11.709007263183594, "global_step": 229522, "epoch": 1366} {"train_loss": -11.808767318725586, "global_step": 229523, "epoch": 1366} {"train_loss": -11.783119201660156, "global_step": 229524, "epoch": 1366} {"train_loss": -11.879858016967773, "global_step": 229525, "epoch": 1366} {"train_loss": -11.741893768310547, "global_step": 229526, "epoch": 1366} {"train_loss": -11.695905685424805, "global_step": 229527, "epoch": 1366} {"train_loss": -11.546507835388184, "global_step": 229528, "epoch": 1366} {"train_loss": -11.930398941040039, "global_step": 229529, "epoch": 1366} {"train_loss": -11.77413272857666, "global_step": 229530, "epoch": 1366} {"train_loss": -11.233864784240723, "global_step": 229531, "epoch": 1366} {"train_loss": -11.634044647216797, "global_step": 229532, "epoch": 1366} {"train_loss": -11.615274429321289, "global_step": 229533, "epoch": 1366} {"train_loss": -11.524833679199219, "global_step": 229534, "epoch": 1366} {"train_loss": -11.728950500488281, "global_step": 229535, "epoch": 1366} {"train_loss": -11.189605712890625, "global_step": 229536, "epoch": 1366} {"train_loss": -11.103347778320312, "global_step": 229537, "epoch": 1366} {"train_loss": -11.613122940063477, "global_step": 229538, "epoch": 1366} {"train_loss": -11.73737907409668, "global_step": 229539, "epoch": 1366} {"train_loss": -11.640945434570312, "global_step": 229540, "epoch": 1366} {"train_loss": -11.307014465332031, "global_step": 229541, "epoch": 1366} {"train_loss": -11.652496337890625, "global_step": 229542, "epoch": 1366} {"train_loss": -11.236946105957031, "global_step": 229543, "epoch": 1366} {"train_loss": -11.543354034423828, "global_step": 229544, "epoch": 1366} {"train_loss": -10.072610855102539, "global_step": 229545, "epoch": 1366} {"train_loss": -9.769754409790039, "global_step": 229546, "epoch": 1366} {"train_loss": -11.484451293945312, "global_step": 229547, "epoch": 1366} {"train_loss": -10.710527420043945, "global_step": 229548, "epoch": 1366} {"train_loss": -11.14535140991211, "global_step": 229549, "epoch": 1366} {"train_loss": -10.851348876953125, "global_step": 229550, "epoch": 1366} {"train_loss": -10.149749755859375, "global_step": 229551, "epoch": 1366} {"train_loss": -10.974129676818848, "global_step": 229552, "epoch": 1366} {"train_loss": -10.887782096862793, "global_step": 229553, "epoch": 1366} {"train_loss": -10.127696990966797, "global_step": 229554, "epoch": 1366} {"train_loss": -10.814401626586914, "global_step": 229555, "epoch": 1366} {"train_loss": -10.447985649108887, "global_step": 229556, "epoch": 1366} {"train_loss": -11.13025951385498, "global_step": 229557, "epoch": 1366} {"train_loss": -10.957916259765625, "global_step": 229558, "epoch": 1366} {"train_loss": -10.70015811920166, "global_step": 229559, "epoch": 1366} {"train_loss": -11.486065864562988, "global_step": 229560, "epoch": 1366} {"train_loss": -10.995083808898926, "global_step": 229561, "epoch": 1366} {"train_loss": -11.618593215942383, "global_step": 229562, "epoch": 1366} {"train_loss": -11.115581512451172, "global_step": 229563, "epoch": 1366} {"train_loss": -11.49418830871582, "global_step": 229564, "epoch": 1366} {"train_loss": -11.42670726776123, "global_step": 229565, "epoch": 1366} {"train_loss": -11.383718490600586, "global_step": 229566, "epoch": 1366} {"train_loss": -11.489053726196289, "global_step": 229567, "epoch": 1366} {"train_loss": -11.23806095123291, "global_step": 229568, "epoch": 1366} {"train_loss": -10.839128494262695, "global_step": 229569, "epoch": 1366} {"train_loss": -11.550939559936523, "global_step": 229570, "epoch": 1366} {"train_loss": -10.966367721557617, "global_step": 229571, "epoch": 1366} {"train_loss": -11.645336151123047, "global_step": 229572, "epoch": 1366} {"train_loss": -11.41882610321045, "global_step": 229573, "epoch": 1366} {"train_loss": -11.312204360961914, "global_step": 229574, "epoch": 1366} {"train_loss": -11.667863845825195, "global_step": 229575, "epoch": 1366} {"train_loss": -11.260115623474121, "global_step": 229576, "epoch": 1366} {"train_loss": -11.519233703613281, "global_step": 229577, "epoch": 1366} {"train_loss": -11.333913803100586, "global_step": 229578, "epoch": 1366} {"train_loss": -11.632326126098633, "global_step": 229579, "epoch": 1366} {"train_loss": -11.42458724975586, "global_step": 229580, "epoch": 1366} {"train_loss": -11.752302169799805, "global_step": 229581, "epoch": 1366} {"train_loss": -11.326775550842285, "global_step": 229582, "epoch": 1366} {"train_loss": -11.633138656616211, "global_step": 229583, "epoch": 1366} {"train_loss": -11.582250595092773, "global_step": 229584, "epoch": 1366} {"train_loss": -11.412370681762695, "global_step": 229585, "epoch": 1366} {"train_loss": -11.676732063293457, "global_step": 229586, "epoch": 1366} {"train_loss": -11.369617462158203, "global_step": 229587, "epoch": 1366} {"train_loss": -11.880754470825195, "global_step": 229588, "epoch": 1366} {"train_loss": -10.768630981445312, "global_step": 229589, "epoch": 1366} {"train_loss": -11.76618480682373, "global_step": 229590, "epoch": 1366} {"train_loss": -11.288076400756836, "global_step": 229591, "epoch": 1366} {"train_loss": -11.554271697998047, "global_step": 229592, "epoch": 1366} {"train_loss": -11.553603172302246, "global_step": 229593, "epoch": 1366} {"train_loss": -11.701898574829102, "global_step": 229594, "epoch": 1366} {"train_loss": -11.490935325622559, "global_step": 229595, "epoch": 1366} {"train_loss": -11.563201904296875, "global_step": 229596, "epoch": 1366} {"train_loss": -11.411182403564453, "global_step": 229597, "epoch": 1366} {"train_loss": -11.860570907592773, "global_step": 229598, "epoch": 1366} {"train_loss": -11.335920333862305, "global_step": 229599, "epoch": 1366} {"train_loss": -11.90907096862793, "global_step": 229600, "epoch": 1366} {"train_loss": -11.434069633483887, "global_step": 229601, "epoch": 1366} {"train_loss": -10.907278060913086, "global_step": 229602, "epoch": 1366} {"train_loss": -11.435894012451172, "global_step": 229603, "epoch": 1366} {"train_loss": -10.72294807434082, "global_step": 229604, "epoch": 1366} {"train_loss": -11.646743774414062, "global_step": 229605, "epoch": 1366} {"train_loss": -11.086758613586426, "global_step": 229606, "epoch": 1366} {"train_loss": -11.321901321411133, "global_step": 229607, "epoch": 1366} {"train_loss": -11.708841323852539, "global_step": 229608, "epoch": 1366} {"train_loss": -11.411665916442871, "global_step": 229609, "epoch": 1366} {"train_loss": -11.801824569702148, "global_step": 229610, "epoch": 1366} {"train_loss": -11.583475112915039, "global_step": 229611, "epoch": 1366} {"train_loss": -11.717598915100098, "global_step": 229612, "epoch": 1366} {"train_loss": -11.405706405639648, "global_step": 229613, "epoch": 1366} {"train_loss": -11.751033782958984, "global_step": 229614, "epoch": 1366} {"train_loss": -11.732046127319336, "global_step": 229615, "epoch": 1366} {"train_loss": -11.96628189086914, "global_step": 229616, "epoch": 1366} {"train_loss": -11.477387428283691, "global_step": 229617, "epoch": 1366} {"train_loss": -11.80568790435791, "global_step": 229618, "epoch": 1366} {"train_loss": -11.45155143737793, "global_step": 229619, "epoch": 1366} {"train_loss": -11.706039428710938, "global_step": 229620, "epoch": 1366} {"train_loss": -11.751623153686523, "global_step": 229621, "epoch": 1366} {"train_loss": -11.37874698638916, "global_step": 229622, "epoch": 1366} {"train_loss": -11.56943416595459, "global_step": 229623, "epoch": 1366} {"train_loss": -11.784587860107422, "global_step": 229624, "epoch": 1366} {"train_loss": -11.880887031555176, "global_step": 229625, "epoch": 1366} {"train_loss": -11.622312545776367, "global_step": 229626, "epoch": 1366} {"train_loss": -11.950662612915039, "global_step": 229627, "epoch": 1366} {"train_loss": -11.483194351196289, "global_step": 229628, "epoch": 1366} {"train_loss": -11.826284408569336, "global_step": 229629, "epoch": 1366} {"train_loss": -11.750994682312012, "global_step": 229630, "epoch": 1366} {"train_loss": -11.310510635375977, "global_step": 229631, "epoch": 1366} {"train_loss": -11.730400085449219, "global_step": 229632, "epoch": 1366} {"train_loss": -11.369592666625977, "global_step": 229633, "epoch": 1366} {"train_loss": -11.550978660583496, "global_step": 229634, "epoch": 1366} {"train_loss": -11.648492813110352, "global_step": 229635, "epoch": 1366} {"train_loss": -11.439176559448242, "global_step": 229636, "epoch": 1366} {"train_loss": -11.199771881103516, "global_step": 229637, "epoch": 1366} {"train_loss": -11.686227798461914, "global_step": 229638, "epoch": 1366} {"train_loss": -11.48727035522461, "global_step": 229639, "epoch": 1366} {"train_loss": -11.455924034118652, "global_step": 229640, "epoch": 1366} {"train_loss": -11.706892967224121, "global_step": 229641, "epoch": 1366} {"train_loss": -11.767800331115723, "global_step": 229642, "epoch": 1366} {"train_loss": -11.626684188842773, "global_step": 229643, "epoch": 1366} {"train_loss": -11.648998260498047, "global_step": 229644, "epoch": 1366} {"train_loss": -11.686470985412598, "global_step": 229645, "epoch": 1366} {"train_loss": -11.78339672088623, "global_step": 229646, "epoch": 1366} {"train_loss": -11.820375442504883, "global_step": 229647, "epoch": 1366} {"train_loss": -11.955755233764648, "global_step": 229648, "epoch": 1366} {"train_loss": -11.848313331604004, "global_step": 229649, "epoch": 1366} {"train_loss": -11.736150741577148, "global_step": 229650, "epoch": 1366} {"train_loss": -11.538243293762207, "global_step": 229651, "epoch": 1366} {"train_loss": -11.62191390991211, "global_step": 229652, "epoch": 1366} {"train_loss": -11.98774242401123, "global_step": 229653, "epoch": 1366} {"train_loss": -12.0298433303833, "global_step": 229654, "epoch": 1366} {"train_loss": -11.449380988166446, "global_step": 229655, "epoch": 1366, "val_loss": 260028.953125} {"train_loss": -11.46877670288086, "global_step": 229656, "epoch": 1367} {"train_loss": -11.558771133422852, "global_step": 229657, "epoch": 1367} {"train_loss": -11.257493019104004, "global_step": 229658, "epoch": 1367} {"train_loss": -11.76410961151123, "global_step": 229659, "epoch": 1367} {"train_loss": -11.027522087097168, "global_step": 229660, "epoch": 1367} {"train_loss": -8.946471214294434, "global_step": 229661, "epoch": 1367} {"train_loss": -11.459630012512207, "global_step": 229662, "epoch": 1367} {"train_loss": -11.1006441116333, "global_step": 229663, "epoch": 1367} {"train_loss": -10.067328453063965, "global_step": 229664, "epoch": 1367} {"train_loss": -10.068666458129883, "global_step": 229665, "epoch": 1367} {"train_loss": -11.565289497375488, "global_step": 229666, "epoch": 1367} {"train_loss": -9.79759407043457, "global_step": 229667, "epoch": 1367} {"train_loss": -10.782449722290039, "global_step": 229668, "epoch": 1367} {"train_loss": -10.211470603942871, "global_step": 229669, "epoch": 1367} {"train_loss": -10.306547164916992, "global_step": 229670, "epoch": 1367} {"train_loss": -11.108953475952148, "global_step": 229671, "epoch": 1367} {"train_loss": -10.343122482299805, "global_step": 229672, "epoch": 1367} {"train_loss": -10.810443878173828, "global_step": 229673, "epoch": 1367} {"train_loss": -11.211641311645508, "global_step": 229674, "epoch": 1367} {"train_loss": -11.207294464111328, "global_step": 229675, "epoch": 1367} {"train_loss": -10.484127044677734, "global_step": 229676, "epoch": 1367} {"train_loss": -11.2116060256958, "global_step": 229677, "epoch": 1367} {"train_loss": -11.135305404663086, "global_step": 229678, "epoch": 1367} {"train_loss": -10.963888168334961, "global_step": 229679, "epoch": 1367} {"train_loss": -11.160676956176758, "global_step": 229680, "epoch": 1367} {"train_loss": -10.552547454833984, "global_step": 229681, "epoch": 1367} {"train_loss": -11.093289375305176, "global_step": 229682, "epoch": 1367} {"train_loss": -10.77784538269043, "global_step": 229683, "epoch": 1367} {"train_loss": -11.263402938842773, "global_step": 229684, "epoch": 1367} {"train_loss": -11.168785095214844, "global_step": 229685, "epoch": 1367} {"train_loss": -11.493623733520508, "global_step": 229686, "epoch": 1367} {"train_loss": -11.578587532043457, "global_step": 229687, "epoch": 1367} {"train_loss": -11.287097930908203, "global_step": 229688, "epoch": 1367} {"train_loss": -11.3560209274292, "global_step": 229689, "epoch": 1367} {"train_loss": -11.634469985961914, "global_step": 229690, "epoch": 1367} {"train_loss": -11.59776782989502, "global_step": 229691, "epoch": 1367} {"train_loss": -11.751705169677734, "global_step": 229692, "epoch": 1367} {"train_loss": -11.263116836547852, "global_step": 229693, "epoch": 1367} {"train_loss": -11.574408531188965, "global_step": 229694, "epoch": 1367} {"train_loss": -11.529609680175781, "global_step": 229695, "epoch": 1367} {"train_loss": -11.528570175170898, "global_step": 229696, "epoch": 1367} {"train_loss": -11.299863815307617, "global_step": 229697, "epoch": 1367} {"train_loss": -11.569778442382812, "global_step": 229698, "epoch": 1367} {"train_loss": -11.419012069702148, "global_step": 229699, "epoch": 1367} {"train_loss": -11.62626838684082, "global_step": 229700, "epoch": 1367} {"train_loss": -11.697522163391113, "global_step": 229701, "epoch": 1367} {"train_loss": -11.636826515197754, "global_step": 229702, "epoch": 1367} {"train_loss": -11.682960510253906, "global_step": 229703, "epoch": 1367} {"train_loss": -11.659302711486816, "global_step": 229704, "epoch": 1367} {"train_loss": -11.680350303649902, "global_step": 229705, "epoch": 1367} {"train_loss": -11.858631134033203, "global_step": 229706, "epoch": 1367} {"train_loss": -11.549850463867188, "global_step": 229707, "epoch": 1367} {"train_loss": -11.751220703125, "global_step": 229708, "epoch": 1367} {"train_loss": -11.715492248535156, "global_step": 229709, "epoch": 1367} {"train_loss": -11.776525497436523, "global_step": 229710, "epoch": 1367} {"train_loss": -11.603340148925781, "global_step": 229711, "epoch": 1367} {"train_loss": -11.64036750793457, "global_step": 229712, "epoch": 1367} {"train_loss": -11.649319648742676, "global_step": 229713, "epoch": 1367} {"train_loss": -11.816812515258789, "global_step": 229714, "epoch": 1367} {"train_loss": -11.371335983276367, "global_step": 229715, "epoch": 1367} {"train_loss": -11.491087913513184, "global_step": 229716, "epoch": 1367} {"train_loss": -11.388416290283203, "global_step": 229717, "epoch": 1367} {"train_loss": -11.326889038085938, "global_step": 229718, "epoch": 1367} {"train_loss": -11.62077522277832, "global_step": 229719, "epoch": 1367} {"train_loss": -11.313407897949219, "global_step": 229720, "epoch": 1367} {"train_loss": -11.420053482055664, "global_step": 229721, "epoch": 1367} {"train_loss": -11.461397171020508, "global_step": 229722, "epoch": 1367} {"train_loss": -11.536077499389648, "global_step": 229723, "epoch": 1367} {"train_loss": -11.263496398925781, "global_step": 229724, "epoch": 1367} {"train_loss": -11.731464385986328, "global_step": 229725, "epoch": 1367} {"train_loss": -11.466384887695312, "global_step": 229726, "epoch": 1367} {"train_loss": -11.645551681518555, "global_step": 229727, "epoch": 1367} {"train_loss": -11.644923210144043, "global_step": 229728, "epoch": 1367} {"train_loss": -11.58726692199707, "global_step": 229729, "epoch": 1367} {"train_loss": -11.70902156829834, "global_step": 229730, "epoch": 1367} {"train_loss": -11.817243576049805, "global_step": 229731, "epoch": 1367} {"train_loss": -11.765326499938965, "global_step": 229732, "epoch": 1367} {"train_loss": -11.754447937011719, "global_step": 229733, "epoch": 1367} {"train_loss": -11.7299165725708, "global_step": 229734, "epoch": 1367} {"train_loss": -11.857507705688477, "global_step": 229735, "epoch": 1367} {"train_loss": -11.727781295776367, "global_step": 229736, "epoch": 1367} {"train_loss": -11.698509216308594, "global_step": 229737, "epoch": 1367} {"train_loss": -11.870950698852539, "global_step": 229738, "epoch": 1367} {"train_loss": -11.627059936523438, "global_step": 229739, "epoch": 1367} {"train_loss": -11.558932304382324, "global_step": 229740, "epoch": 1367} {"train_loss": -11.485095024108887, "global_step": 229741, "epoch": 1367} {"train_loss": -11.642690658569336, "global_step": 229742, "epoch": 1367} {"train_loss": -11.619495391845703, "global_step": 229743, "epoch": 1367} {"train_loss": -11.756258964538574, "global_step": 229744, "epoch": 1367} {"train_loss": -11.433588027954102, "global_step": 229745, "epoch": 1367} {"train_loss": -11.710577964782715, "global_step": 229746, "epoch": 1367} {"train_loss": -11.938923835754395, "global_step": 229747, "epoch": 1367} {"train_loss": -11.691862106323242, "global_step": 229748, "epoch": 1367} {"train_loss": -12.148141860961914, "global_step": 229749, "epoch": 1367} {"train_loss": -11.870058059692383, "global_step": 229750, "epoch": 1367} {"train_loss": -12.040369033813477, "global_step": 229751, "epoch": 1367} {"train_loss": -11.960939407348633, "global_step": 229752, "epoch": 1367} {"train_loss": -11.66159725189209, "global_step": 229753, "epoch": 1367} {"train_loss": -12.042272567749023, "global_step": 229754, "epoch": 1367} {"train_loss": -11.76854133605957, "global_step": 229755, "epoch": 1367} {"train_loss": -11.749452590942383, "global_step": 229756, "epoch": 1367} {"train_loss": -11.566076278686523, "global_step": 229757, "epoch": 1367} {"train_loss": -11.758285522460938, "global_step": 229758, "epoch": 1367} {"train_loss": -11.691816329956055, "global_step": 229759, "epoch": 1367} {"train_loss": -11.660446166992188, "global_step": 229760, "epoch": 1367} {"train_loss": -11.342910766601562, "global_step": 229761, "epoch": 1367} {"train_loss": -11.354681015014648, "global_step": 229762, "epoch": 1367} {"train_loss": -11.082230567932129, "global_step": 229763, "epoch": 1367} {"train_loss": -11.294013023376465, "global_step": 229764, "epoch": 1367} {"train_loss": -11.35104751586914, "global_step": 229765, "epoch": 1367} {"train_loss": -10.35024642944336, "global_step": 229766, "epoch": 1367} {"train_loss": -11.256086349487305, "global_step": 229767, "epoch": 1367} {"train_loss": -11.048422813415527, "global_step": 229768, "epoch": 1367} {"train_loss": -11.332159042358398, "global_step": 229769, "epoch": 1367} {"train_loss": -11.231542587280273, "global_step": 229770, "epoch": 1367} {"train_loss": -10.932497024536133, "global_step": 229771, "epoch": 1367} {"train_loss": -10.461609840393066, "global_step": 229772, "epoch": 1367} {"train_loss": -11.18328857421875, "global_step": 229773, "epoch": 1367} {"train_loss": -9.352851867675781, "global_step": 229774, "epoch": 1367} {"train_loss": -10.530863761901855, "global_step": 229775, "epoch": 1367} {"train_loss": -10.645421981811523, "global_step": 229776, "epoch": 1367} {"train_loss": -10.421342849731445, "global_step": 229777, "epoch": 1367} {"train_loss": -9.139348983764648, "global_step": 229778, "epoch": 1367} {"train_loss": -10.504873275756836, "global_step": 229779, "epoch": 1367} {"train_loss": -10.037870407104492, "global_step": 229780, "epoch": 1367} {"train_loss": -10.748558044433594, "global_step": 229781, "epoch": 1367} {"train_loss": -10.267387390136719, "global_step": 229782, "epoch": 1367} {"train_loss": -10.230900764465332, "global_step": 229783, "epoch": 1367} {"train_loss": -10.810402870178223, "global_step": 229784, "epoch": 1367} {"train_loss": -10.502745628356934, "global_step": 229785, "epoch": 1367} {"train_loss": -10.129037857055664, "global_step": 229786, "epoch": 1367} {"train_loss": -11.02985954284668, "global_step": 229787, "epoch": 1367} {"train_loss": -10.987321853637695, "global_step": 229788, "epoch": 1367} {"train_loss": -11.372305870056152, "global_step": 229789, "epoch": 1367} {"train_loss": -10.620567321777344, "global_step": 229790, "epoch": 1367} {"train_loss": -11.326634407043457, "global_step": 229791, "epoch": 1367} {"train_loss": -11.453108787536621, "global_step": 229792, "epoch": 1367} {"train_loss": -11.119144439697266, "global_step": 229793, "epoch": 1367} {"train_loss": -11.264669418334961, "global_step": 229794, "epoch": 1367} {"train_loss": -10.919122695922852, "global_step": 229795, "epoch": 1367} {"train_loss": -11.279150009155273, "global_step": 229796, "epoch": 1367} {"train_loss": -11.344091415405273, "global_step": 229797, "epoch": 1367} {"train_loss": -11.430071830749512, "global_step": 229798, "epoch": 1367} {"train_loss": -11.485138893127441, "global_step": 229799, "epoch": 1367} {"train_loss": -11.329828262329102, "global_step": 229800, "epoch": 1367} {"train_loss": -11.387819290161133, "global_step": 229801, "epoch": 1367} {"train_loss": -11.355077743530273, "global_step": 229802, "epoch": 1367} {"train_loss": -11.44537353515625, "global_step": 229803, "epoch": 1367} {"train_loss": -11.625448226928711, "global_step": 229804, "epoch": 1367} {"train_loss": -11.341211318969727, "global_step": 229805, "epoch": 1367} {"train_loss": -11.139019012451172, "global_step": 229806, "epoch": 1367} {"train_loss": -11.36083984375, "global_step": 229807, "epoch": 1367} {"train_loss": -11.707229614257812, "global_step": 229808, "epoch": 1367} {"train_loss": -11.515352249145508, "global_step": 229809, "epoch": 1367} {"train_loss": -11.667287826538086, "global_step": 229810, "epoch": 1367} {"train_loss": -11.735045433044434, "global_step": 229811, "epoch": 1367} {"train_loss": -11.483993530273438, "global_step": 229812, "epoch": 1367} {"train_loss": -11.46214485168457, "global_step": 229813, "epoch": 1367} {"train_loss": -11.505193710327148, "global_step": 229814, "epoch": 1367} {"train_loss": -11.528688430786133, "global_step": 229815, "epoch": 1367} {"train_loss": -11.79257583618164, "global_step": 229816, "epoch": 1367} {"train_loss": -11.330842018127441, "global_step": 229817, "epoch": 1367} {"train_loss": -11.534188270568848, "global_step": 229818, "epoch": 1367} {"train_loss": -11.156896591186523, "global_step": 229819, "epoch": 1367} {"train_loss": -11.660146713256836, "global_step": 229820, "epoch": 1367} {"train_loss": -11.252573013305664, "global_step": 229821, "epoch": 1367} {"train_loss": -11.79055404663086, "global_step": 229822, "epoch": 1367} {"train_loss": -11.291407732736497, "global_step": 229823, "epoch": 1367, "val_loss": 264082.90625} {"train_loss": -11.608342170715332, "global_step": 229824, "epoch": 1368} {"train_loss": -11.226945877075195, "global_step": 229825, "epoch": 1368} {"train_loss": -11.762296676635742, "global_step": 229826, "epoch": 1368} {"train_loss": -11.43753433227539, "global_step": 229827, "epoch": 1368} {"train_loss": -11.769102096557617, "global_step": 229828, "epoch": 1368} {"train_loss": -11.447063446044922, "global_step": 229829, "epoch": 1368} {"train_loss": -11.74062442779541, "global_step": 229830, "epoch": 1368} {"train_loss": -11.701671600341797, "global_step": 229831, "epoch": 1368} {"train_loss": -11.487607955932617, "global_step": 229832, "epoch": 1368} {"train_loss": -11.730609893798828, "global_step": 229833, "epoch": 1368} {"train_loss": -11.577184677124023, "global_step": 229834, "epoch": 1368} {"train_loss": -11.790048599243164, "global_step": 229835, "epoch": 1368} {"train_loss": -11.832115173339844, "global_step": 229836, "epoch": 1368} {"train_loss": -11.806808471679688, "global_step": 229837, "epoch": 1368} {"train_loss": -11.711748123168945, "global_step": 229838, "epoch": 1368} {"train_loss": -11.719301223754883, "global_step": 229839, "epoch": 1368} {"train_loss": -11.885486602783203, "global_step": 229840, "epoch": 1368} {"train_loss": -11.506057739257812, "global_step": 229841, "epoch": 1368} {"train_loss": -11.925056457519531, "global_step": 229842, "epoch": 1368} {"train_loss": -11.67059326171875, "global_step": 229843, "epoch": 1368} {"train_loss": -11.648611068725586, "global_step": 229844, "epoch": 1368} {"train_loss": -11.608768463134766, "global_step": 229845, "epoch": 1368} {"train_loss": -11.368060111999512, "global_step": 229846, "epoch": 1368} {"train_loss": -11.69787311553955, "global_step": 229847, "epoch": 1368} {"train_loss": -11.564533233642578, "global_step": 229848, "epoch": 1368} {"train_loss": -12.163241386413574, "global_step": 229849, "epoch": 1368} {"train_loss": -11.738237380981445, "global_step": 229850, "epoch": 1368} {"train_loss": -11.69442081451416, "global_step": 229851, "epoch": 1368} {"train_loss": -11.987046241760254, "global_step": 229852, "epoch": 1368} {"train_loss": -11.609415054321289, "global_step": 229853, "epoch": 1368} {"train_loss": -11.503433227539062, "global_step": 229854, "epoch": 1368} {"train_loss": -11.838077545166016, "global_step": 229855, "epoch": 1368} {"train_loss": -11.403738021850586, "global_step": 229856, "epoch": 1368} {"train_loss": -11.983789443969727, "global_step": 229857, "epoch": 1368} {"train_loss": -11.508203506469727, "global_step": 229858, "epoch": 1368} {"train_loss": -11.760229110717773, "global_step": 229859, "epoch": 1368} {"train_loss": -11.818227767944336, "global_step": 229860, "epoch": 1368} {"train_loss": -11.684530258178711, "global_step": 229861, "epoch": 1368} {"train_loss": -12.03186321258545, "global_step": 229862, "epoch": 1368} {"train_loss": -12.021117210388184, "global_step": 229863, "epoch": 1368} {"train_loss": -11.886543273925781, "global_step": 229864, "epoch": 1368} {"train_loss": -11.935361862182617, "global_step": 229865, "epoch": 1368} {"train_loss": -11.813495635986328, "global_step": 229866, "epoch": 1368} {"train_loss": -11.86021614074707, "global_step": 229867, "epoch": 1368} {"train_loss": -11.833642959594727, "global_step": 229868, "epoch": 1368} {"train_loss": -11.823132514953613, "global_step": 229869, "epoch": 1368} {"train_loss": -12.158113479614258, "global_step": 229870, "epoch": 1368} {"train_loss": -11.996631622314453, "global_step": 229871, "epoch": 1368} {"train_loss": -11.942302703857422, "global_step": 229872, "epoch": 1368} {"train_loss": -11.888628959655762, "global_step": 229873, "epoch": 1368} {"train_loss": -11.894119262695312, "global_step": 229874, "epoch": 1368} {"train_loss": -11.967256546020508, "global_step": 229875, "epoch": 1368} {"train_loss": -11.70561408996582, "global_step": 229876, "epoch": 1368} {"train_loss": -11.756592750549316, "global_step": 229877, "epoch": 1368} {"train_loss": -12.033552169799805, "global_step": 229878, "epoch": 1368} {"train_loss": -11.67945671081543, "global_step": 229879, "epoch": 1368} {"train_loss": -11.803519248962402, "global_step": 229880, "epoch": 1368} {"train_loss": -11.570205688476562, "global_step": 229881, "epoch": 1368} {"train_loss": -12.074812889099121, "global_step": 229882, "epoch": 1368} {"train_loss": -11.608771324157715, "global_step": 229883, "epoch": 1368} {"train_loss": -12.02883529663086, "global_step": 229884, "epoch": 1368} {"train_loss": -11.46249008178711, "global_step": 229885, "epoch": 1368} {"train_loss": -11.909360885620117, "global_step": 229886, "epoch": 1368} {"train_loss": -11.589930534362793, "global_step": 229887, "epoch": 1368} {"train_loss": -11.841903686523438, "global_step": 229888, "epoch": 1368} {"train_loss": -11.759944915771484, "global_step": 229889, "epoch": 1368} {"train_loss": -11.538227081298828, "global_step": 229890, "epoch": 1368} {"train_loss": -11.118064880371094, "global_step": 229891, "epoch": 1368} {"train_loss": -11.413771629333496, "global_step": 229892, "epoch": 1368} {"train_loss": -11.395062446594238, "global_step": 229893, "epoch": 1368} {"train_loss": -11.383085250854492, "global_step": 229894, "epoch": 1368} {"train_loss": -11.368745803833008, "global_step": 229895, "epoch": 1368} {"train_loss": -10.697429656982422, "global_step": 229896, "epoch": 1368} {"train_loss": -10.956222534179688, "global_step": 229897, "epoch": 1368} {"train_loss": -9.914289474487305, "global_step": 229898, "epoch": 1368} {"train_loss": -11.010720252990723, "global_step": 229899, "epoch": 1368} {"train_loss": -10.101724624633789, "global_step": 229900, "epoch": 1368} {"train_loss": -11.23465633392334, "global_step": 229901, "epoch": 1368} {"train_loss": -10.881196975708008, "global_step": 229902, "epoch": 1368} {"train_loss": -10.420854568481445, "global_step": 229903, "epoch": 1368} {"train_loss": -11.188802719116211, "global_step": 229904, "epoch": 1368} {"train_loss": -10.594161987304688, "global_step": 229905, "epoch": 1368} {"train_loss": -10.78860092163086, "global_step": 229906, "epoch": 1368} {"train_loss": -11.348630905151367, "global_step": 229907, "epoch": 1368} {"train_loss": -10.1928071975708, "global_step": 229908, "epoch": 1368} {"train_loss": -9.601701736450195, "global_step": 229909, "epoch": 1368} {"train_loss": -10.799413681030273, "global_step": 229910, "epoch": 1368} {"train_loss": -8.893571853637695, "global_step": 229911, "epoch": 1368} {"train_loss": -11.073151588439941, "global_step": 229912, "epoch": 1368} {"train_loss": -10.307357788085938, "global_step": 229913, "epoch": 1368} {"train_loss": -10.803243637084961, "global_step": 229914, "epoch": 1368} {"train_loss": -9.28870964050293, "global_step": 229915, "epoch": 1368} {"train_loss": -10.709613800048828, "global_step": 229916, "epoch": 1368} {"train_loss": -10.01571273803711, "global_step": 229917, "epoch": 1368} {"train_loss": -11.530863761901855, "global_step": 229918, "epoch": 1368} {"train_loss": -10.902107238769531, "global_step": 229919, "epoch": 1368} {"train_loss": -11.289379119873047, "global_step": 229920, "epoch": 1368} {"train_loss": -10.75853157043457, "global_step": 229921, "epoch": 1368} {"train_loss": -11.11522388458252, "global_step": 229922, "epoch": 1368} {"train_loss": -10.959903717041016, "global_step": 229923, "epoch": 1368} {"train_loss": -11.313043594360352, "global_step": 229924, "epoch": 1368} {"train_loss": -11.227178573608398, "global_step": 229925, "epoch": 1368} {"train_loss": -11.402132987976074, "global_step": 229926, "epoch": 1368} {"train_loss": -11.342401504516602, "global_step": 229927, "epoch": 1368} {"train_loss": -11.213287353515625, "global_step": 229928, "epoch": 1368} {"train_loss": -11.339225769042969, "global_step": 229929, "epoch": 1368} {"train_loss": -11.753395080566406, "global_step": 229930, "epoch": 1368} {"train_loss": -11.066350936889648, "global_step": 229931, "epoch": 1368} {"train_loss": -11.523481369018555, "global_step": 229932, "epoch": 1368} {"train_loss": -11.199110984802246, "global_step": 229933, "epoch": 1368} {"train_loss": -11.456733703613281, "global_step": 229934, "epoch": 1368} {"train_loss": -11.66923999786377, "global_step": 229935, "epoch": 1368} {"train_loss": -11.181924819946289, "global_step": 229936, "epoch": 1368} {"train_loss": -11.270377159118652, "global_step": 229937, "epoch": 1368} {"train_loss": -11.199129104614258, "global_step": 229938, "epoch": 1368} {"train_loss": -11.254693984985352, "global_step": 229939, "epoch": 1368} {"train_loss": -11.392189025878906, "global_step": 229940, "epoch": 1368} {"train_loss": -11.591852188110352, "global_step": 229941, "epoch": 1368} {"train_loss": -11.023344039916992, "global_step": 229942, "epoch": 1368} {"train_loss": -11.587409973144531, "global_step": 229943, "epoch": 1368} {"train_loss": -11.366501808166504, "global_step": 229944, "epoch": 1368} {"train_loss": -11.412384033203125, "global_step": 229945, "epoch": 1368} {"train_loss": -11.61967658996582, "global_step": 229946, "epoch": 1368} {"train_loss": -11.467121124267578, "global_step": 229947, "epoch": 1368} {"train_loss": -11.488443374633789, "global_step": 229948, "epoch": 1368} {"train_loss": -11.3868408203125, "global_step": 229949, "epoch": 1368} {"train_loss": -11.521017074584961, "global_step": 229950, "epoch": 1368} {"train_loss": -11.500696182250977, "global_step": 229951, "epoch": 1368} {"train_loss": -11.466773986816406, "global_step": 229952, "epoch": 1368} {"train_loss": -11.622865676879883, "global_step": 229953, "epoch": 1368} {"train_loss": -11.498283386230469, "global_step": 229954, "epoch": 1368} {"train_loss": -11.684957504272461, "global_step": 229955, "epoch": 1368} {"train_loss": -11.524019241333008, "global_step": 229956, "epoch": 1368} {"train_loss": -11.419161796569824, "global_step": 229957, "epoch": 1368} {"train_loss": -11.723575592041016, "global_step": 229958, "epoch": 1368} {"train_loss": -11.522890090942383, "global_step": 229959, "epoch": 1368} {"train_loss": -11.731855392456055, "global_step": 229960, "epoch": 1368} {"train_loss": -11.561492919921875, "global_step": 229961, "epoch": 1368} {"train_loss": -11.895171165466309, "global_step": 229962, "epoch": 1368} {"train_loss": -11.251140594482422, "global_step": 229963, "epoch": 1368} {"train_loss": -11.830852508544922, "global_step": 229964, "epoch": 1368} {"train_loss": -11.264652252197266, "global_step": 229965, "epoch": 1368} {"train_loss": -11.479883193969727, "global_step": 229966, "epoch": 1368} {"train_loss": -11.873061180114746, "global_step": 229967, "epoch": 1368} {"train_loss": -11.172929763793945, "global_step": 229968, "epoch": 1368} {"train_loss": -11.751370429992676, "global_step": 229969, "epoch": 1368} {"train_loss": -11.406707763671875, "global_step": 229970, "epoch": 1368} {"train_loss": -10.972755432128906, "global_step": 229971, "epoch": 1368} {"train_loss": -11.942238807678223, "global_step": 229972, "epoch": 1368} {"train_loss": -11.208124160766602, "global_step": 229973, "epoch": 1368} {"train_loss": -11.75865364074707, "global_step": 229974, "epoch": 1368} {"train_loss": -11.387649536132812, "global_step": 229975, "epoch": 1368} {"train_loss": -11.165160179138184, "global_step": 229976, "epoch": 1368} {"train_loss": -11.63364028930664, "global_step": 229977, "epoch": 1368} {"train_loss": -11.12429428100586, "global_step": 229978, "epoch": 1368} {"train_loss": -11.408952713012695, "global_step": 229979, "epoch": 1368} {"train_loss": -11.777464866638184, "global_step": 229980, "epoch": 1368} {"train_loss": -11.280538558959961, "global_step": 229981, "epoch": 1368} {"train_loss": -11.930463790893555, "global_step": 229982, "epoch": 1368} {"train_loss": -10.87845230102539, "global_step": 229983, "epoch": 1368} {"train_loss": -11.602411270141602, "global_step": 229984, "epoch": 1368} {"train_loss": -11.622831344604492, "global_step": 229985, "epoch": 1368} {"train_loss": -11.402399063110352, "global_step": 229986, "epoch": 1368} {"train_loss": -11.834779739379883, "global_step": 229987, "epoch": 1368} {"train_loss": -11.901662826538086, "global_step": 229988, "epoch": 1368} {"train_loss": -11.766979217529297, "global_step": 229989, "epoch": 1368} {"train_loss": -11.546319961547852, "global_step": 229990, "epoch": 1368} {"train_loss": -11.438530558631534, "global_step": 229991, "epoch": 1368, "val_loss": 263234.59375} {"train_loss": -11.700590133666992, "global_step": 229992, "epoch": 1369} {"train_loss": -11.414594650268555, "global_step": 229993, "epoch": 1369} {"train_loss": -11.850261688232422, "global_step": 229994, "epoch": 1369} {"train_loss": -11.319902420043945, "global_step": 229995, "epoch": 1369} {"train_loss": -11.670729637145996, "global_step": 229996, "epoch": 1369} {"train_loss": -11.770414352416992, "global_step": 229997, "epoch": 1369} {"train_loss": -11.471663475036621, "global_step": 229998, "epoch": 1369} {"train_loss": -11.64747428894043, "global_step": 229999, "epoch": 1369} {"train_loss": -11.784626007080078, "global_step": 230000, "epoch": 1369} {"train_loss": -11.380857467651367, "global_step": 230001, "epoch": 1369} {"train_loss": -11.579940795898438, "global_step": 230002, "epoch": 1369} {"train_loss": -10.996088027954102, "global_step": 230003, "epoch": 1369} {"train_loss": -11.856826782226562, "global_step": 230004, "epoch": 1369} {"train_loss": -11.402874946594238, "global_step": 230005, "epoch": 1369} {"train_loss": -10.882338523864746, "global_step": 230006, "epoch": 1369} {"train_loss": -11.556169509887695, "global_step": 230007, "epoch": 1369} {"train_loss": -11.563034057617188, "global_step": 230008, "epoch": 1369} {"train_loss": -11.881473541259766, "global_step": 230009, "epoch": 1369} {"train_loss": -11.795052528381348, "global_step": 230010, "epoch": 1369} {"train_loss": -11.340743064880371, "global_step": 230011, "epoch": 1369} {"train_loss": -11.530280113220215, "global_step": 230012, "epoch": 1369} {"train_loss": -11.968246459960938, "global_step": 230013, "epoch": 1369} {"train_loss": -11.370579719543457, "global_step": 230014, "epoch": 1369} {"train_loss": -11.943353652954102, "global_step": 230015, "epoch": 1369} {"train_loss": -11.594844818115234, "global_step": 230016, "epoch": 1369} {"train_loss": -11.821435928344727, "global_step": 230017, "epoch": 1369} {"train_loss": -11.75456714630127, "global_step": 230018, "epoch": 1369} {"train_loss": -11.65709400177002, "global_step": 230019, "epoch": 1369} {"train_loss": -11.99205493927002, "global_step": 230020, "epoch": 1369} {"train_loss": -11.627334594726562, "global_step": 230021, "epoch": 1369} {"train_loss": -12.042396545410156, "global_step": 230022, "epoch": 1369} {"train_loss": -11.772418975830078, "global_step": 230023, "epoch": 1369} {"train_loss": -11.907419204711914, "global_step": 230024, "epoch": 1369} {"train_loss": -12.019445419311523, "global_step": 230025, "epoch": 1369} {"train_loss": -11.703361511230469, "global_step": 230026, "epoch": 1369} {"train_loss": -11.755288124084473, "global_step": 230027, "epoch": 1369} {"train_loss": -12.049704551696777, "global_step": 230028, "epoch": 1369} {"train_loss": -11.840991973876953, "global_step": 230029, "epoch": 1369} {"train_loss": -11.94552993774414, "global_step": 230030, "epoch": 1369} {"train_loss": -11.672606468200684, "global_step": 230031, "epoch": 1369} {"train_loss": -11.950693130493164, "global_step": 230032, "epoch": 1369} {"train_loss": -11.890644073486328, "global_step": 230033, "epoch": 1369} {"train_loss": -11.763693809509277, "global_step": 230034, "epoch": 1369} {"train_loss": -12.031888961791992, "global_step": 230035, "epoch": 1369} {"train_loss": -11.822999954223633, "global_step": 230036, "epoch": 1369} {"train_loss": -12.010714530944824, "global_step": 230037, "epoch": 1369} {"train_loss": -11.917021751403809, "global_step": 230038, "epoch": 1369} {"train_loss": -11.916145324707031, "global_step": 230039, "epoch": 1369} {"train_loss": -12.003334045410156, "global_step": 230040, "epoch": 1369} {"train_loss": -11.67557430267334, "global_step": 230041, "epoch": 1369} {"train_loss": -12.052438735961914, "global_step": 230042, "epoch": 1369} {"train_loss": -11.70072078704834, "global_step": 230043, "epoch": 1369} {"train_loss": -11.917145729064941, "global_step": 230044, "epoch": 1369} {"train_loss": -11.498554229736328, "global_step": 230045, "epoch": 1369} {"train_loss": -11.881814956665039, "global_step": 230046, "epoch": 1369} {"train_loss": -11.16843318939209, "global_step": 230047, "epoch": 1369} {"train_loss": -11.547412872314453, "global_step": 230048, "epoch": 1369} {"train_loss": -11.864665985107422, "global_step": 230049, "epoch": 1369} {"train_loss": -11.62157154083252, "global_step": 230050, "epoch": 1369} {"train_loss": -11.631559371948242, "global_step": 230051, "epoch": 1369} {"train_loss": -11.751142501831055, "global_step": 230052, "epoch": 1369} {"train_loss": -11.006711959838867, "global_step": 230053, "epoch": 1369} {"train_loss": -11.021957397460938, "global_step": 230054, "epoch": 1369} {"train_loss": -11.510660171508789, "global_step": 230055, "epoch": 1369} {"train_loss": -11.180267333984375, "global_step": 230056, "epoch": 1369} {"train_loss": -10.189742088317871, "global_step": 230057, "epoch": 1369} {"train_loss": -11.054449081420898, "global_step": 230058, "epoch": 1369} {"train_loss": -9.698490142822266, "global_step": 230059, "epoch": 1369} {"train_loss": -10.31983757019043, "global_step": 230060, "epoch": 1369} {"train_loss": -10.720669746398926, "global_step": 230061, "epoch": 1369} {"train_loss": -9.979745864868164, "global_step": 230062, "epoch": 1369} {"train_loss": -9.12611198425293, "global_step": 230063, "epoch": 1369} {"train_loss": -10.152619361877441, "global_step": 230064, "epoch": 1369} {"train_loss": -10.243461608886719, "global_step": 230065, "epoch": 1369} {"train_loss": -10.659270286560059, "global_step": 230066, "epoch": 1369} {"train_loss": -9.037823677062988, "global_step": 230067, "epoch": 1369} {"train_loss": -10.854453086853027, "global_step": 230068, "epoch": 1369} {"train_loss": -9.614253997802734, "global_step": 230069, "epoch": 1369} {"train_loss": -10.960588455200195, "global_step": 230070, "epoch": 1369} {"train_loss": -10.903759956359863, "global_step": 230071, "epoch": 1369} {"train_loss": -10.335670471191406, "global_step": 230072, "epoch": 1369} {"train_loss": -11.234846115112305, "global_step": 230073, "epoch": 1369} {"train_loss": -9.135066986083984, "global_step": 230074, "epoch": 1369} {"train_loss": -10.546104431152344, "global_step": 230075, "epoch": 1369} {"train_loss": -10.81411361694336, "global_step": 230076, "epoch": 1369} {"train_loss": -10.210046768188477, "global_step": 230077, "epoch": 1369} {"train_loss": -10.97539234161377, "global_step": 230078, "epoch": 1369} {"train_loss": -9.825496673583984, "global_step": 230079, "epoch": 1369} {"train_loss": -10.768768310546875, "global_step": 230080, "epoch": 1369} {"train_loss": -10.927057266235352, "global_step": 230081, "epoch": 1369} {"train_loss": -10.882570266723633, "global_step": 230082, "epoch": 1369} {"train_loss": -11.16372013092041, "global_step": 230083, "epoch": 1369} {"train_loss": -11.07925796508789, "global_step": 230084, "epoch": 1369} {"train_loss": -10.85912799835205, "global_step": 230085, "epoch": 1369} {"train_loss": -11.019912719726562, "global_step": 230086, "epoch": 1369} {"train_loss": -11.203717231750488, "global_step": 230087, "epoch": 1369} {"train_loss": -11.066494941711426, "global_step": 230088, "epoch": 1369} {"train_loss": -11.28990364074707, "global_step": 230089, "epoch": 1369} {"train_loss": -11.143583297729492, "global_step": 230090, "epoch": 1369} {"train_loss": -11.228748321533203, "global_step": 230091, "epoch": 1369} {"train_loss": -11.21036148071289, "global_step": 230092, "epoch": 1369} {"train_loss": -11.111923217773438, "global_step": 230093, "epoch": 1369} {"train_loss": -11.276291847229004, "global_step": 230094, "epoch": 1369} {"train_loss": -11.259965896606445, "global_step": 230095, "epoch": 1369} {"train_loss": -11.211752891540527, "global_step": 230096, "epoch": 1369} {"train_loss": -11.403980255126953, "global_step": 230097, "epoch": 1369} {"train_loss": -11.382320404052734, "global_step": 230098, "epoch": 1369} {"train_loss": -11.142740249633789, "global_step": 230099, "epoch": 1369} {"train_loss": -10.966063499450684, "global_step": 230100, "epoch": 1369} {"train_loss": -11.023818969726562, "global_step": 230101, "epoch": 1369} {"train_loss": -11.502190589904785, "global_step": 230102, "epoch": 1369} {"train_loss": -10.989295959472656, "global_step": 230103, "epoch": 1369} {"train_loss": -11.520509719848633, "global_step": 230104, "epoch": 1369} {"train_loss": -11.308411598205566, "global_step": 230105, "epoch": 1369} {"train_loss": -11.173430442810059, "global_step": 230106, "epoch": 1369} {"train_loss": -11.466550827026367, "global_step": 230107, "epoch": 1369} {"train_loss": -11.38245964050293, "global_step": 230108, "epoch": 1369} {"train_loss": -11.537297248840332, "global_step": 230109, "epoch": 1369} {"train_loss": -11.168784141540527, "global_step": 230110, "epoch": 1369} {"train_loss": -11.61948299407959, "global_step": 230111, "epoch": 1369} {"train_loss": -11.461591720581055, "global_step": 230112, "epoch": 1369} {"train_loss": -11.602814674377441, "global_step": 230113, "epoch": 1369} {"train_loss": -11.587696075439453, "global_step": 230114, "epoch": 1369} {"train_loss": -11.205204010009766, "global_step": 230115, "epoch": 1369} {"train_loss": -11.628750801086426, "global_step": 230116, "epoch": 1369} {"train_loss": -11.687393188476562, "global_step": 230117, "epoch": 1369} {"train_loss": -11.573087692260742, "global_step": 230118, "epoch": 1369} {"train_loss": -11.520872116088867, "global_step": 230119, "epoch": 1369} {"train_loss": -11.490381240844727, "global_step": 230120, "epoch": 1369} {"train_loss": -11.445960998535156, "global_step": 230121, "epoch": 1369} {"train_loss": -11.865640640258789, "global_step": 230122, "epoch": 1369} {"train_loss": -11.423238754272461, "global_step": 230123, "epoch": 1369} {"train_loss": -11.750725746154785, "global_step": 230124, "epoch": 1369} {"train_loss": -11.772350311279297, "global_step": 230125, "epoch": 1369} {"train_loss": -11.736763000488281, "global_step": 230126, "epoch": 1369} {"train_loss": -11.839570045471191, "global_step": 230127, "epoch": 1369} {"train_loss": -11.862714767456055, "global_step": 230128, "epoch": 1369} {"train_loss": -11.577852249145508, "global_step": 230129, "epoch": 1369} {"train_loss": -11.890586853027344, "global_step": 230130, "epoch": 1369} {"train_loss": -11.895271301269531, "global_step": 230131, "epoch": 1369} {"train_loss": -11.64509391784668, "global_step": 230132, "epoch": 1369} {"train_loss": -11.793083190917969, "global_step": 230133, "epoch": 1369} {"train_loss": -11.90758228302002, "global_step": 230134, "epoch": 1369} {"train_loss": -11.63525390625, "global_step": 230135, "epoch": 1369} {"train_loss": -11.996654510498047, "global_step": 230136, "epoch": 1369} {"train_loss": -12.058792114257812, "global_step": 230137, "epoch": 1369} {"train_loss": -11.929750442504883, "global_step": 230138, "epoch": 1369} {"train_loss": -11.833450317382812, "global_step": 230139, "epoch": 1369} {"train_loss": -12.06196117401123, "global_step": 230140, "epoch": 1369} {"train_loss": -12.078261375427246, "global_step": 230141, "epoch": 1369} {"train_loss": -11.923151969909668, "global_step": 230142, "epoch": 1369} {"train_loss": -11.900064468383789, "global_step": 230143, "epoch": 1369} {"train_loss": -11.854302406311035, "global_step": 230144, "epoch": 1369} {"train_loss": -11.919960021972656, "global_step": 230145, "epoch": 1369} {"train_loss": -11.402084350585938, "global_step": 230146, "epoch": 1369} {"train_loss": -11.84393310546875, "global_step": 230147, "epoch": 1369} {"train_loss": -11.712596893310547, "global_step": 230148, "epoch": 1369} {"train_loss": -11.863609313964844, "global_step": 230149, "epoch": 1369} {"train_loss": -11.570333480834961, "global_step": 230150, "epoch": 1369} {"train_loss": -11.939691543579102, "global_step": 230151, "epoch": 1369} {"train_loss": -11.705443382263184, "global_step": 230152, "epoch": 1369} {"train_loss": -12.084880828857422, "global_step": 230153, "epoch": 1369} {"train_loss": -11.555891036987305, "global_step": 230154, "epoch": 1369} {"train_loss": -11.797294616699219, "global_step": 230155, "epoch": 1369} {"train_loss": -11.811131477355957, "global_step": 230156, "epoch": 1369} {"train_loss": -10.989431381225586, "global_step": 230157, "epoch": 1369} {"train_loss": -10.687054634094238, "global_step": 230158, "epoch": 1369} {"train_loss": -11.399550653639293, "global_step": 230159, "epoch": 1369, "val_loss": 258700.328125} {"train_loss": -11.313955307006836, "global_step": 230160, "epoch": 1370} {"train_loss": -12.010297775268555, "global_step": 230161, "epoch": 1370} {"train_loss": -11.73912239074707, "global_step": 230162, "epoch": 1370} {"train_loss": -11.639760971069336, "global_step": 230163, "epoch": 1370} {"train_loss": -11.59170150756836, "global_step": 230164, "epoch": 1370} {"train_loss": -11.96776294708252, "global_step": 230165, "epoch": 1370} {"train_loss": -11.60031509399414, "global_step": 230166, "epoch": 1370} {"train_loss": -11.506366729736328, "global_step": 230167, "epoch": 1370} {"train_loss": -11.827356338500977, "global_step": 230168, "epoch": 1370} {"train_loss": -10.241474151611328, "global_step": 230169, "epoch": 1370} {"train_loss": -9.488025665283203, "global_step": 230170, "epoch": 1370} {"train_loss": -11.409582138061523, "global_step": 230171, "epoch": 1370} {"train_loss": -9.73934555053711, "global_step": 230172, "epoch": 1370} {"train_loss": -10.358597755432129, "global_step": 230173, "epoch": 1370} {"train_loss": -6.989148139953613, "global_step": 230174, "epoch": 1370} {"train_loss": -8.643085479736328, "global_step": 230175, "epoch": 1370} {"train_loss": -9.60097599029541, "global_step": 230176, "epoch": 1370} {"train_loss": -10.232917785644531, "global_step": 230177, "epoch": 1370} {"train_loss": -7.651998043060303, "global_step": 230178, "epoch": 1370} {"train_loss": -8.823768615722656, "global_step": 230179, "epoch": 1370} {"train_loss": -9.5711088180542, "global_step": 230180, "epoch": 1370} {"train_loss": -9.773775100708008, "global_step": 230181, "epoch": 1370} {"train_loss": -9.424546241760254, "global_step": 230182, "epoch": 1370} {"train_loss": -8.706689834594727, "global_step": 230183, "epoch": 1370} {"train_loss": -9.733327865600586, "global_step": 230184, "epoch": 1370} {"train_loss": -9.676700592041016, "global_step": 230185, "epoch": 1370} {"train_loss": -9.602590560913086, "global_step": 230186, "epoch": 1370} {"train_loss": -9.310585021972656, "global_step": 230187, "epoch": 1370} {"train_loss": -10.342100143432617, "global_step": 230188, "epoch": 1370} {"train_loss": -9.540863990783691, "global_step": 230189, "epoch": 1370} {"train_loss": -10.027273178100586, "global_step": 230190, "epoch": 1370} {"train_loss": -10.441761016845703, "global_step": 230191, "epoch": 1370} {"train_loss": -9.358214378356934, "global_step": 230192, "epoch": 1370} {"train_loss": -11.249740600585938, "global_step": 230193, "epoch": 1370} {"train_loss": -9.707670211791992, "global_step": 230194, "epoch": 1370} {"train_loss": -10.813345909118652, "global_step": 230195, "epoch": 1370} {"train_loss": -10.624526977539062, "global_step": 230196, "epoch": 1370} {"train_loss": -10.450309753417969, "global_step": 230197, "epoch": 1370} {"train_loss": -10.845776557922363, "global_step": 230198, "epoch": 1370} {"train_loss": -10.874637603759766, "global_step": 230199, "epoch": 1370} {"train_loss": -11.05320930480957, "global_step": 230200, "epoch": 1370} {"train_loss": -10.654268264770508, "global_step": 230201, "epoch": 1370} {"train_loss": -10.75269889831543, "global_step": 230202, "epoch": 1370} {"train_loss": -11.185962677001953, "global_step": 230203, "epoch": 1370} {"train_loss": -10.911338806152344, "global_step": 230204, "epoch": 1370} {"train_loss": -11.242513656616211, "global_step": 230205, "epoch": 1370} {"train_loss": -11.147566795349121, "global_step": 230206, "epoch": 1370} {"train_loss": -11.313261032104492, "global_step": 230207, "epoch": 1370} {"train_loss": -10.855208396911621, "global_step": 230208, "epoch": 1370} {"train_loss": -11.292610168457031, "global_step": 230209, "epoch": 1370} {"train_loss": -11.084972381591797, "global_step": 230210, "epoch": 1370} {"train_loss": -11.117685317993164, "global_step": 230211, "epoch": 1370} {"train_loss": -11.543807029724121, "global_step": 230212, "epoch": 1370} {"train_loss": -11.078069686889648, "global_step": 230213, "epoch": 1370} {"train_loss": -11.374088287353516, "global_step": 230214, "epoch": 1370} {"train_loss": -11.416849136352539, "global_step": 230215, "epoch": 1370} {"train_loss": -11.354637145996094, "global_step": 230216, "epoch": 1370} {"train_loss": -11.263176918029785, "global_step": 230217, "epoch": 1370} {"train_loss": -11.119051933288574, "global_step": 230218, "epoch": 1370} {"train_loss": -11.460165023803711, "global_step": 230219, "epoch": 1370} {"train_loss": -11.412924766540527, "global_step": 230220, "epoch": 1370} {"train_loss": -11.236618041992188, "global_step": 230221, "epoch": 1370} {"train_loss": -11.722713470458984, "global_step": 230222, "epoch": 1370} {"train_loss": -11.139323234558105, "global_step": 230223, "epoch": 1370} {"train_loss": -11.352897644042969, "global_step": 230224, "epoch": 1370} {"train_loss": -11.378265380859375, "global_step": 230225, "epoch": 1370} {"train_loss": -11.474449157714844, "global_step": 230226, "epoch": 1370} {"train_loss": -11.528921127319336, "global_step": 230227, "epoch": 1370} {"train_loss": -11.470144271850586, "global_step": 230228, "epoch": 1370} {"train_loss": -11.527261734008789, "global_step": 230229, "epoch": 1370} {"train_loss": -11.506547927856445, "global_step": 230230, "epoch": 1370} {"train_loss": -11.570363998413086, "global_step": 230231, "epoch": 1370} {"train_loss": -11.651749610900879, "global_step": 230232, "epoch": 1370} {"train_loss": -11.778543472290039, "global_step": 230233, "epoch": 1370} {"train_loss": -11.506643295288086, "global_step": 230234, "epoch": 1370} {"train_loss": -11.463245391845703, "global_step": 230235, "epoch": 1370} {"train_loss": -11.689325332641602, "global_step": 230236, "epoch": 1370} {"train_loss": -11.390201568603516, "global_step": 230237, "epoch": 1370} {"train_loss": -11.621459007263184, "global_step": 230238, "epoch": 1370} {"train_loss": -11.721824645996094, "global_step": 230239, "epoch": 1370} {"train_loss": -11.870089530944824, "global_step": 230240, "epoch": 1370} {"train_loss": -11.693605422973633, "global_step": 230241, "epoch": 1370} {"train_loss": -11.777884483337402, "global_step": 230242, "epoch": 1370} {"train_loss": -11.795135498046875, "global_step": 230243, "epoch": 1370} {"train_loss": -11.839080810546875, "global_step": 230244, "epoch": 1370} {"train_loss": -11.883722305297852, "global_step": 230245, "epoch": 1370} {"train_loss": -11.773308753967285, "global_step": 230246, "epoch": 1370} {"train_loss": -11.671431541442871, "global_step": 230247, "epoch": 1370} {"train_loss": -11.814897537231445, "global_step": 230248, "epoch": 1370} {"train_loss": -11.53848934173584, "global_step": 230249, "epoch": 1370} {"train_loss": -11.747264862060547, "global_step": 230250, "epoch": 1370} {"train_loss": -11.814661026000977, "global_step": 230251, "epoch": 1370} {"train_loss": -11.885679244995117, "global_step": 230252, "epoch": 1370} {"train_loss": -11.800275802612305, "global_step": 230253, "epoch": 1370} {"train_loss": -11.563475608825684, "global_step": 230254, "epoch": 1370} {"train_loss": -11.669262886047363, "global_step": 230255, "epoch": 1370} {"train_loss": -11.958107948303223, "global_step": 230256, "epoch": 1370} {"train_loss": -11.802414894104004, "global_step": 230257, "epoch": 1370} {"train_loss": -11.893884658813477, "global_step": 230258, "epoch": 1370} {"train_loss": -11.911245346069336, "global_step": 230259, "epoch": 1370} {"train_loss": -11.847638130187988, "global_step": 230260, "epoch": 1370} {"train_loss": -11.943312644958496, "global_step": 230261, "epoch": 1370} {"train_loss": -11.781439781188965, "global_step": 230262, "epoch": 1370} {"train_loss": -11.99881362915039, "global_step": 230263, "epoch": 1370} {"train_loss": -12.034266471862793, "global_step": 230264, "epoch": 1370} {"train_loss": -11.964319229125977, "global_step": 230265, "epoch": 1370} {"train_loss": -11.946277618408203, "global_step": 230266, "epoch": 1370} {"train_loss": -12.112833023071289, "global_step": 230267, "epoch": 1370} {"train_loss": -12.142051696777344, "global_step": 230268, "epoch": 1370} {"train_loss": -11.798515319824219, "global_step": 230269, "epoch": 1370} {"train_loss": -12.117279052734375, "global_step": 230270, "epoch": 1370} {"train_loss": -12.07293701171875, "global_step": 230271, "epoch": 1370} {"train_loss": -11.892593383789062, "global_step": 230272, "epoch": 1370} {"train_loss": -12.118704795837402, "global_step": 230273, "epoch": 1370} {"train_loss": -12.153877258300781, "global_step": 230274, "epoch": 1370} {"train_loss": -11.958656311035156, "global_step": 230275, "epoch": 1370} {"train_loss": -11.915834426879883, "global_step": 230276, "epoch": 1370} {"train_loss": -12.043660163879395, "global_step": 230277, "epoch": 1370} {"train_loss": -12.191383361816406, "global_step": 230278, "epoch": 1370} {"train_loss": -11.920090675354004, "global_step": 230279, "epoch": 1370} {"train_loss": -12.077795028686523, "global_step": 230280, "epoch": 1370} {"train_loss": -11.968978881835938, "global_step": 230281, "epoch": 1370} {"train_loss": -11.765884399414062, "global_step": 230282, "epoch": 1370} {"train_loss": -11.818675994873047, "global_step": 230283, "epoch": 1370} {"train_loss": -11.468591690063477, "global_step": 230284, "epoch": 1370} {"train_loss": -11.570779800415039, "global_step": 230285, "epoch": 1370} {"train_loss": -11.525336265563965, "global_step": 230286, "epoch": 1370} {"train_loss": -11.39079475402832, "global_step": 230287, "epoch": 1370} {"train_loss": -11.497920989990234, "global_step": 230288, "epoch": 1370} {"train_loss": -11.065372467041016, "global_step": 230289, "epoch": 1370} {"train_loss": -11.255777359008789, "global_step": 230290, "epoch": 1370} {"train_loss": -11.015950202941895, "global_step": 230291, "epoch": 1370} {"train_loss": -10.301865577697754, "global_step": 230292, "epoch": 1370} {"train_loss": -11.109643936157227, "global_step": 230293, "epoch": 1370} {"train_loss": -11.217096328735352, "global_step": 230294, "epoch": 1370} {"train_loss": -11.42739200592041, "global_step": 230295, "epoch": 1370} {"train_loss": -10.86479377746582, "global_step": 230296, "epoch": 1370} {"train_loss": -9.9625883102417, "global_step": 230297, "epoch": 1370} {"train_loss": -11.617696762084961, "global_step": 230298, "epoch": 1370} {"train_loss": -9.744073867797852, "global_step": 230299, "epoch": 1370} {"train_loss": -9.917628288269043, "global_step": 230300, "epoch": 1370} {"train_loss": -11.394201278686523, "global_step": 230301, "epoch": 1370} {"train_loss": -10.221773147583008, "global_step": 230302, "epoch": 1370} {"train_loss": -11.29242992401123, "global_step": 230303, "epoch": 1370} {"train_loss": -10.827680587768555, "global_step": 230304, "epoch": 1370} {"train_loss": -10.297805786132812, "global_step": 230305, "epoch": 1370} {"train_loss": -9.888407707214355, "global_step": 230306, "epoch": 1370} {"train_loss": -11.130760192871094, "global_step": 230307, "epoch": 1370} {"train_loss": -9.491927146911621, "global_step": 230308, "epoch": 1370} {"train_loss": -11.081155776977539, "global_step": 230309, "epoch": 1370} {"train_loss": -10.427207946777344, "global_step": 230310, "epoch": 1370} {"train_loss": -10.48746109008789, "global_step": 230311, "epoch": 1370} {"train_loss": -10.455179214477539, "global_step": 230312, "epoch": 1370} {"train_loss": -10.95956802368164, "global_step": 230313, "epoch": 1370} {"train_loss": -9.924602508544922, "global_step": 230314, "epoch": 1370} {"train_loss": -11.310340881347656, "global_step": 230315, "epoch": 1370} {"train_loss": -10.707666397094727, "global_step": 230316, "epoch": 1370} {"train_loss": -10.744009017944336, "global_step": 230317, "epoch": 1370} {"train_loss": -10.710308074951172, "global_step": 230318, "epoch": 1370} {"train_loss": -10.863197326660156, "global_step": 230319, "epoch": 1370} {"train_loss": -10.198770523071289, "global_step": 230320, "epoch": 1370} {"train_loss": -10.892271995544434, "global_step": 230321, "epoch": 1370} {"train_loss": -10.707422256469727, "global_step": 230322, "epoch": 1370} {"train_loss": -10.719490051269531, "global_step": 230323, "epoch": 1370} {"train_loss": -10.294471740722656, "global_step": 230324, "epoch": 1370} {"train_loss": -10.198539733886719, "global_step": 230325, "epoch": 1370} {"train_loss": -10.151432991027832, "global_step": 230326, "epoch": 1370} {"train_loss": -11.063341722601937, "global_step": 230327, "epoch": 1370, "val_loss": 263687.6875, "train_action_mse_error": 1.8098130226135254} {"train_loss": -10.527941703796387, "global_step": 230328, "epoch": 1371} {"train_loss": -10.040911674499512, "global_step": 230329, "epoch": 1371} {"train_loss": -11.19350528717041, "global_step": 230330, "epoch": 1371} {"train_loss": -10.460407257080078, "global_step": 230331, "epoch": 1371} {"train_loss": -11.308944702148438, "global_step": 230332, "epoch": 1371} {"train_loss": -10.65312385559082, "global_step": 230333, "epoch": 1371} {"train_loss": -11.561676025390625, "global_step": 230334, "epoch": 1371} {"train_loss": -10.848127365112305, "global_step": 230335, "epoch": 1371} {"train_loss": -11.471888542175293, "global_step": 230336, "epoch": 1371} {"train_loss": -11.207443237304688, "global_step": 230337, "epoch": 1371} {"train_loss": -11.297691345214844, "global_step": 230338, "epoch": 1371} {"train_loss": -11.39504337310791, "global_step": 230339, "epoch": 1371} {"train_loss": -11.46087646484375, "global_step": 230340, "epoch": 1371} {"train_loss": -10.997535705566406, "global_step": 230341, "epoch": 1371} {"train_loss": -11.194990158081055, "global_step": 230342, "epoch": 1371} {"train_loss": -11.229583740234375, "global_step": 230343, "epoch": 1371} {"train_loss": -11.534521102905273, "global_step": 230344, "epoch": 1371} {"train_loss": -11.754085540771484, "global_step": 230345, "epoch": 1371} {"train_loss": -11.360239028930664, "global_step": 230346, "epoch": 1371} {"train_loss": -11.501544952392578, "global_step": 230347, "epoch": 1371} {"train_loss": -11.440203666687012, "global_step": 230348, "epoch": 1371} {"train_loss": -11.489764213562012, "global_step": 230349, "epoch": 1371} {"train_loss": -11.430410385131836, "global_step": 230350, "epoch": 1371} {"train_loss": -11.5030517578125, "global_step": 230351, "epoch": 1371} {"train_loss": -11.672477722167969, "global_step": 230352, "epoch": 1371} {"train_loss": -11.36739730834961, "global_step": 230353, "epoch": 1371} {"train_loss": -11.553958892822266, "global_step": 230354, "epoch": 1371} {"train_loss": -11.377558708190918, "global_step": 230355, "epoch": 1371} {"train_loss": -11.778974533081055, "global_step": 230356, "epoch": 1371} {"train_loss": -11.517294883728027, "global_step": 230357, "epoch": 1371} {"train_loss": -11.766407012939453, "global_step": 230358, "epoch": 1371} {"train_loss": -11.54339599609375, "global_step": 230359, "epoch": 1371} {"train_loss": -11.345298767089844, "global_step": 230360, "epoch": 1371} {"train_loss": -11.432528495788574, "global_step": 230361, "epoch": 1371} {"train_loss": -11.383428573608398, "global_step": 230362, "epoch": 1371} {"train_loss": -11.731855392456055, "global_step": 230363, "epoch": 1371} {"train_loss": -11.593360900878906, "global_step": 230364, "epoch": 1371} {"train_loss": -11.63877010345459, "global_step": 230365, "epoch": 1371} {"train_loss": -11.860107421875, "global_step": 230366, "epoch": 1371} {"train_loss": -11.874405860900879, "global_step": 230367, "epoch": 1371} {"train_loss": -11.928316116333008, "global_step": 230368, "epoch": 1371} {"train_loss": -11.610733985900879, "global_step": 230369, "epoch": 1371} {"train_loss": -11.836307525634766, "global_step": 230370, "epoch": 1371} {"train_loss": -11.82988452911377, "global_step": 230371, "epoch": 1371} {"train_loss": -11.623381614685059, "global_step": 230372, "epoch": 1371} {"train_loss": -11.887831687927246, "global_step": 230373, "epoch": 1371} {"train_loss": -11.66511344909668, "global_step": 230374, "epoch": 1371} {"train_loss": -11.863706588745117, "global_step": 230375, "epoch": 1371} {"train_loss": -11.537614822387695, "global_step": 230376, "epoch": 1371} {"train_loss": -11.760335922241211, "global_step": 230377, "epoch": 1371} {"train_loss": -11.724922180175781, "global_step": 230378, "epoch": 1371} {"train_loss": -11.698469161987305, "global_step": 230379, "epoch": 1371} {"train_loss": -11.494562149047852, "global_step": 230380, "epoch": 1371} {"train_loss": -11.63687515258789, "global_step": 230381, "epoch": 1371} {"train_loss": -11.543807983398438, "global_step": 230382, "epoch": 1371} {"train_loss": -11.554582595825195, "global_step": 230383, "epoch": 1371} {"train_loss": -11.813854217529297, "global_step": 230384, "epoch": 1371} {"train_loss": -11.644737243652344, "global_step": 230385, "epoch": 1371} {"train_loss": -11.67165756225586, "global_step": 230386, "epoch": 1371} {"train_loss": -11.729360580444336, "global_step": 230387, "epoch": 1371} {"train_loss": -11.672136306762695, "global_step": 230388, "epoch": 1371} {"train_loss": -11.985969543457031, "global_step": 230389, "epoch": 1371} {"train_loss": -11.312973022460938, "global_step": 230390, "epoch": 1371} {"train_loss": -11.77560043334961, "global_step": 230391, "epoch": 1371} {"train_loss": -11.585790634155273, "global_step": 230392, "epoch": 1371} {"train_loss": -11.309374809265137, "global_step": 230393, "epoch": 1371} {"train_loss": -11.928155899047852, "global_step": 230394, "epoch": 1371} {"train_loss": -11.175544738769531, "global_step": 230395, "epoch": 1371} {"train_loss": -11.706578254699707, "global_step": 230396, "epoch": 1371} {"train_loss": -11.870223999023438, "global_step": 230397, "epoch": 1371} {"train_loss": -11.355328559875488, "global_step": 230398, "epoch": 1371} {"train_loss": -12.072538375854492, "global_step": 230399, "epoch": 1371} {"train_loss": -11.35607624053955, "global_step": 230400, "epoch": 1371} {"train_loss": -11.372335433959961, "global_step": 230401, "epoch": 1371} {"train_loss": -12.032033920288086, "global_step": 230402, "epoch": 1371} {"train_loss": -10.879922866821289, "global_step": 230403, "epoch": 1371} {"train_loss": -11.773551940917969, "global_step": 230404, "epoch": 1371} {"train_loss": -11.526430130004883, "global_step": 230405, "epoch": 1371} {"train_loss": -11.161689758300781, "global_step": 230406, "epoch": 1371} {"train_loss": -11.99636173248291, "global_step": 230407, "epoch": 1371} {"train_loss": -11.54580307006836, "global_step": 230408, "epoch": 1371} {"train_loss": -12.011239051818848, "global_step": 230409, "epoch": 1371} {"train_loss": -11.367111206054688, "global_step": 230410, "epoch": 1371} {"train_loss": -11.77656364440918, "global_step": 230411, "epoch": 1371} {"train_loss": -11.864227294921875, "global_step": 230412, "epoch": 1371} {"train_loss": -11.660299301147461, "global_step": 230413, "epoch": 1371} {"train_loss": -11.975400924682617, "global_step": 230414, "epoch": 1371} {"train_loss": -11.929939270019531, "global_step": 230415, "epoch": 1371} {"train_loss": -11.890890121459961, "global_step": 230416, "epoch": 1371} {"train_loss": -12.031654357910156, "global_step": 230417, "epoch": 1371} {"train_loss": -11.999824523925781, "global_step": 230418, "epoch": 1371} {"train_loss": -11.947059631347656, "global_step": 230419, "epoch": 1371} {"train_loss": -11.996513366699219, "global_step": 230420, "epoch": 1371} {"train_loss": -11.887825012207031, "global_step": 230421, "epoch": 1371} {"train_loss": -11.958902359008789, "global_step": 230422, "epoch": 1371} {"train_loss": -11.917614936828613, "global_step": 230423, "epoch": 1371} {"train_loss": -11.916289329528809, "global_step": 230424, "epoch": 1371} {"train_loss": -11.676387786865234, "global_step": 230425, "epoch": 1371} {"train_loss": -11.606650352478027, "global_step": 230426, "epoch": 1371} {"train_loss": -11.729949951171875, "global_step": 230427, "epoch": 1371} {"train_loss": -11.8582763671875, "global_step": 230428, "epoch": 1371} {"train_loss": -11.47549819946289, "global_step": 230429, "epoch": 1371} {"train_loss": -11.175060272216797, "global_step": 230430, "epoch": 1371} {"train_loss": -11.40499210357666, "global_step": 230431, "epoch": 1371} {"train_loss": -11.623035430908203, "global_step": 230432, "epoch": 1371} {"train_loss": -11.117413520812988, "global_step": 230433, "epoch": 1371} {"train_loss": -11.637981414794922, "global_step": 230434, "epoch": 1371} {"train_loss": -10.913261413574219, "global_step": 230435, "epoch": 1371} {"train_loss": -11.395881652832031, "global_step": 230436, "epoch": 1371} {"train_loss": -11.10578727722168, "global_step": 230437, "epoch": 1371} {"train_loss": -10.852760314941406, "global_step": 230438, "epoch": 1371} {"train_loss": -11.025007247924805, "global_step": 230439, "epoch": 1371} {"train_loss": -10.95695686340332, "global_step": 230440, "epoch": 1371} {"train_loss": -11.178794860839844, "global_step": 230441, "epoch": 1371} {"train_loss": -10.658784866333008, "global_step": 230442, "epoch": 1371} {"train_loss": -11.857272148132324, "global_step": 230443, "epoch": 1371} {"train_loss": -10.813720703125, "global_step": 230444, "epoch": 1371} {"train_loss": -10.399225234985352, "global_step": 230445, "epoch": 1371} {"train_loss": -10.021940231323242, "global_step": 230446, "epoch": 1371} {"train_loss": -11.236335754394531, "global_step": 230447, "epoch": 1371} {"train_loss": -10.316987037658691, "global_step": 230448, "epoch": 1371} {"train_loss": -10.728233337402344, "global_step": 230449, "epoch": 1371} {"train_loss": -11.397773742675781, "global_step": 230450, "epoch": 1371} {"train_loss": -10.736061096191406, "global_step": 230451, "epoch": 1371} {"train_loss": -11.173361778259277, "global_step": 230452, "epoch": 1371} {"train_loss": -11.288223266601562, "global_step": 230453, "epoch": 1371} {"train_loss": -10.220602035522461, "global_step": 230454, "epoch": 1371} {"train_loss": -10.888444900512695, "global_step": 230455, "epoch": 1371} {"train_loss": -11.331649780273438, "global_step": 230456, "epoch": 1371} {"train_loss": -10.8389892578125, "global_step": 230457, "epoch": 1371} {"train_loss": -11.300873756408691, "global_step": 230458, "epoch": 1371} {"train_loss": -10.728124618530273, "global_step": 230459, "epoch": 1371} {"train_loss": -11.384727478027344, "global_step": 230460, "epoch": 1371} {"train_loss": -10.778254508972168, "global_step": 230461, "epoch": 1371} {"train_loss": -11.226418495178223, "global_step": 230462, "epoch": 1371} {"train_loss": -10.976139068603516, "global_step": 230463, "epoch": 1371} {"train_loss": -11.035009384155273, "global_step": 230464, "epoch": 1371} {"train_loss": -11.706063270568848, "global_step": 230465, "epoch": 1371} {"train_loss": -11.202411651611328, "global_step": 230466, "epoch": 1371} {"train_loss": -11.177547454833984, "global_step": 230467, "epoch": 1371} {"train_loss": -11.392685890197754, "global_step": 230468, "epoch": 1371} {"train_loss": -11.464311599731445, "global_step": 230469, "epoch": 1371} {"train_loss": -11.526444435119629, "global_step": 230470, "epoch": 1371} {"train_loss": -11.661623001098633, "global_step": 230471, "epoch": 1371} {"train_loss": -11.50520133972168, "global_step": 230472, "epoch": 1371} {"train_loss": -11.747188568115234, "global_step": 230473, "epoch": 1371} {"train_loss": -11.535297393798828, "global_step": 230474, "epoch": 1371} {"train_loss": -11.728080749511719, "global_step": 230475, "epoch": 1371} {"train_loss": -11.450746536254883, "global_step": 230476, "epoch": 1371} {"train_loss": -11.824902534484863, "global_step": 230477, "epoch": 1371} {"train_loss": -11.546134948730469, "global_step": 230478, "epoch": 1371} {"train_loss": -11.494199752807617, "global_step": 230479, "epoch": 1371} {"train_loss": -11.653081893920898, "global_step": 230480, "epoch": 1371} {"train_loss": -11.768448829650879, "global_step": 230481, "epoch": 1371} {"train_loss": -11.63367748260498, "global_step": 230482, "epoch": 1371} {"train_loss": -11.868745803833008, "global_step": 230483, "epoch": 1371} {"train_loss": -11.388328552246094, "global_step": 230484, "epoch": 1371} {"train_loss": -11.759455680847168, "global_step": 230485, "epoch": 1371} {"train_loss": -11.870352745056152, "global_step": 230486, "epoch": 1371} {"train_loss": -11.456039428710938, "global_step": 230487, "epoch": 1371} {"train_loss": -11.980669975280762, "global_step": 230488, "epoch": 1371} {"train_loss": -11.417734146118164, "global_step": 230489, "epoch": 1371} {"train_loss": -11.824272155761719, "global_step": 230490, "epoch": 1371} {"train_loss": -11.696557998657227, "global_step": 230491, "epoch": 1371} {"train_loss": -11.625042915344238, "global_step": 230492, "epoch": 1371} {"train_loss": -11.678116798400879, "global_step": 230493, "epoch": 1371} {"train_loss": -11.529980659484863, "global_step": 230494, "epoch": 1371} {"train_loss": -11.464216465041751, "global_step": 230495, "epoch": 1371, "val_loss": 261404.515625} {"train_loss": -11.388528823852539, "global_step": 230496, "epoch": 1372} {"train_loss": -11.835306167602539, "global_step": 230497, "epoch": 1372} {"train_loss": -11.433351516723633, "global_step": 230498, "epoch": 1372} {"train_loss": -11.66342830657959, "global_step": 230499, "epoch": 1372} {"train_loss": -11.55174446105957, "global_step": 230500, "epoch": 1372} {"train_loss": -11.391433715820312, "global_step": 230501, "epoch": 1372} {"train_loss": -11.438529968261719, "global_step": 230502, "epoch": 1372} {"train_loss": -11.179798126220703, "global_step": 230503, "epoch": 1372} {"train_loss": -11.829645156860352, "global_step": 230504, "epoch": 1372} {"train_loss": -11.437047004699707, "global_step": 230505, "epoch": 1372} {"train_loss": -10.97281265258789, "global_step": 230506, "epoch": 1372} {"train_loss": -11.45252513885498, "global_step": 230507, "epoch": 1372} {"train_loss": -11.075861930847168, "global_step": 230508, "epoch": 1372} {"train_loss": -10.920845985412598, "global_step": 230509, "epoch": 1372} {"train_loss": -11.906702041625977, "global_step": 230510, "epoch": 1372} {"train_loss": -10.819272994995117, "global_step": 230511, "epoch": 1372} {"train_loss": -11.777883529663086, "global_step": 230512, "epoch": 1372} {"train_loss": -11.647579193115234, "global_step": 230513, "epoch": 1372} {"train_loss": -11.703479766845703, "global_step": 230514, "epoch": 1372} {"train_loss": -10.852641105651855, "global_step": 230515, "epoch": 1372} {"train_loss": -11.507211685180664, "global_step": 230516, "epoch": 1372} {"train_loss": -11.284025192260742, "global_step": 230517, "epoch": 1372} {"train_loss": -11.739068984985352, "global_step": 230518, "epoch": 1372} {"train_loss": -11.01998519897461, "global_step": 230519, "epoch": 1372} {"train_loss": -11.357158660888672, "global_step": 230520, "epoch": 1372} {"train_loss": -11.009657859802246, "global_step": 230521, "epoch": 1372} {"train_loss": -11.629745483398438, "global_step": 230522, "epoch": 1372} {"train_loss": -10.67259407043457, "global_step": 230523, "epoch": 1372} {"train_loss": -11.301324844360352, "global_step": 230524, "epoch": 1372} {"train_loss": -10.772263526916504, "global_step": 230525, "epoch": 1372} {"train_loss": -11.237419128417969, "global_step": 230526, "epoch": 1372} {"train_loss": -10.853771209716797, "global_step": 230527, "epoch": 1372} {"train_loss": -10.843116760253906, "global_step": 230528, "epoch": 1372} {"train_loss": -9.70901870727539, "global_step": 230529, "epoch": 1372} {"train_loss": -11.00301742553711, "global_step": 230530, "epoch": 1372} {"train_loss": -8.844362258911133, "global_step": 230531, "epoch": 1372} {"train_loss": -10.261650085449219, "global_step": 230532, "epoch": 1372} {"train_loss": -9.253944396972656, "global_step": 230533, "epoch": 1372} {"train_loss": -10.692427635192871, "global_step": 230534, "epoch": 1372} {"train_loss": -11.220781326293945, "global_step": 230535, "epoch": 1372} {"train_loss": -11.163291931152344, "global_step": 230536, "epoch": 1372} {"train_loss": -11.046222686767578, "global_step": 230537, "epoch": 1372} {"train_loss": -11.388909339904785, "global_step": 230538, "epoch": 1372} {"train_loss": -11.126184463500977, "global_step": 230539, "epoch": 1372} {"train_loss": -11.253807067871094, "global_step": 230540, "epoch": 1372} {"train_loss": -11.131382942199707, "global_step": 230541, "epoch": 1372} {"train_loss": -11.301158905029297, "global_step": 230542, "epoch": 1372} {"train_loss": -11.304527282714844, "global_step": 230543, "epoch": 1372} {"train_loss": -10.668779373168945, "global_step": 230544, "epoch": 1372} {"train_loss": -11.392082214355469, "global_step": 230545, "epoch": 1372} {"train_loss": -11.152862548828125, "global_step": 230546, "epoch": 1372} {"train_loss": -11.511825561523438, "global_step": 230547, "epoch": 1372} {"train_loss": -11.471031188964844, "global_step": 230548, "epoch": 1372} {"train_loss": -11.270845413208008, "global_step": 230549, "epoch": 1372} {"train_loss": -11.721041679382324, "global_step": 230550, "epoch": 1372} {"train_loss": -11.34748649597168, "global_step": 230551, "epoch": 1372} {"train_loss": -11.689579963684082, "global_step": 230552, "epoch": 1372} {"train_loss": -11.465709686279297, "global_step": 230553, "epoch": 1372} {"train_loss": -11.701557159423828, "global_step": 230554, "epoch": 1372} {"train_loss": -11.439376831054688, "global_step": 230555, "epoch": 1372} {"train_loss": -11.596015930175781, "global_step": 230556, "epoch": 1372} {"train_loss": -11.680010795593262, "global_step": 230557, "epoch": 1372} {"train_loss": -11.753276824951172, "global_step": 230558, "epoch": 1372} {"train_loss": -11.716917037963867, "global_step": 230559, "epoch": 1372} {"train_loss": -11.761067390441895, "global_step": 230560, "epoch": 1372} {"train_loss": -11.783941268920898, "global_step": 230561, "epoch": 1372} {"train_loss": -11.651165008544922, "global_step": 230562, "epoch": 1372} {"train_loss": -11.765308380126953, "global_step": 230563, "epoch": 1372} {"train_loss": -11.654399871826172, "global_step": 230564, "epoch": 1372} {"train_loss": -11.692239761352539, "global_step": 230565, "epoch": 1372} {"train_loss": -11.694587707519531, "global_step": 230566, "epoch": 1372} {"train_loss": -11.4796781539917, "global_step": 230567, "epoch": 1372} {"train_loss": -11.709872245788574, "global_step": 230568, "epoch": 1372} {"train_loss": -11.265329360961914, "global_step": 230569, "epoch": 1372} {"train_loss": -11.736298561096191, "global_step": 230570, "epoch": 1372} {"train_loss": -11.624725341796875, "global_step": 230571, "epoch": 1372} {"train_loss": -11.603325843811035, "global_step": 230572, "epoch": 1372} {"train_loss": -11.836750030517578, "global_step": 230573, "epoch": 1372} {"train_loss": -11.419011116027832, "global_step": 230574, "epoch": 1372} {"train_loss": -11.744763374328613, "global_step": 230575, "epoch": 1372} {"train_loss": -11.511395454406738, "global_step": 230576, "epoch": 1372} {"train_loss": -11.52676010131836, "global_step": 230577, "epoch": 1372} {"train_loss": -11.601727485656738, "global_step": 230578, "epoch": 1372} {"train_loss": -11.398333549499512, "global_step": 230579, "epoch": 1372} {"train_loss": -11.64252758026123, "global_step": 230580, "epoch": 1372} {"train_loss": -11.253290176391602, "global_step": 230581, "epoch": 1372} {"train_loss": -11.725456237792969, "global_step": 230582, "epoch": 1372} {"train_loss": -11.231988906860352, "global_step": 230583, "epoch": 1372} {"train_loss": -11.851601600646973, "global_step": 230584, "epoch": 1372} {"train_loss": -11.48787784576416, "global_step": 230585, "epoch": 1372} {"train_loss": -11.765582084655762, "global_step": 230586, "epoch": 1372} {"train_loss": -11.51124382019043, "global_step": 230587, "epoch": 1372} {"train_loss": -11.289726257324219, "global_step": 230588, "epoch": 1372} {"train_loss": -11.762385368347168, "global_step": 230589, "epoch": 1372} {"train_loss": -11.39630126953125, "global_step": 230590, "epoch": 1372} {"train_loss": -11.55898666381836, "global_step": 230591, "epoch": 1372} {"train_loss": -11.639081954956055, "global_step": 230592, "epoch": 1372} {"train_loss": -11.440378189086914, "global_step": 230593, "epoch": 1372} {"train_loss": -10.986703872680664, "global_step": 230594, "epoch": 1372} {"train_loss": -11.804194450378418, "global_step": 230595, "epoch": 1372} {"train_loss": -11.245077133178711, "global_step": 230596, "epoch": 1372} {"train_loss": -11.866598129272461, "global_step": 230597, "epoch": 1372} {"train_loss": -11.246108055114746, "global_step": 230598, "epoch": 1372} {"train_loss": -11.576037406921387, "global_step": 230599, "epoch": 1372} {"train_loss": -11.562911987304688, "global_step": 230600, "epoch": 1372} {"train_loss": -11.850595474243164, "global_step": 230601, "epoch": 1372} {"train_loss": -11.409122467041016, "global_step": 230602, "epoch": 1372} {"train_loss": -11.95248031616211, "global_step": 230603, "epoch": 1372} {"train_loss": -11.518293380737305, "global_step": 230604, "epoch": 1372} {"train_loss": -11.91851806640625, "global_step": 230605, "epoch": 1372} {"train_loss": -11.680614471435547, "global_step": 230606, "epoch": 1372} {"train_loss": -12.011871337890625, "global_step": 230607, "epoch": 1372} {"train_loss": -11.590800285339355, "global_step": 230608, "epoch": 1372} {"train_loss": -11.78322982788086, "global_step": 230609, "epoch": 1372} {"train_loss": -11.964621543884277, "global_step": 230610, "epoch": 1372} {"train_loss": -11.82390022277832, "global_step": 230611, "epoch": 1372} {"train_loss": -11.984939575195312, "global_step": 230612, "epoch": 1372} {"train_loss": -11.748212814331055, "global_step": 230613, "epoch": 1372} {"train_loss": -11.802909851074219, "global_step": 230614, "epoch": 1372} {"train_loss": -11.818070411682129, "global_step": 230615, "epoch": 1372} {"train_loss": -11.443634033203125, "global_step": 230616, "epoch": 1372} {"train_loss": -11.724458694458008, "global_step": 230617, "epoch": 1372} {"train_loss": -11.897856712341309, "global_step": 230618, "epoch": 1372} {"train_loss": -11.898609161376953, "global_step": 230619, "epoch": 1372} {"train_loss": -11.721223831176758, "global_step": 230620, "epoch": 1372} {"train_loss": -11.689532279968262, "global_step": 230621, "epoch": 1372} {"train_loss": -11.897834777832031, "global_step": 230622, "epoch": 1372} {"train_loss": -11.965720176696777, "global_step": 230623, "epoch": 1372} {"train_loss": -11.697674751281738, "global_step": 230624, "epoch": 1372} {"train_loss": -11.939127922058105, "global_step": 230625, "epoch": 1372} {"train_loss": -11.772132873535156, "global_step": 230626, "epoch": 1372} {"train_loss": -11.789892196655273, "global_step": 230627, "epoch": 1372} {"train_loss": -11.466463088989258, "global_step": 230628, "epoch": 1372} {"train_loss": -11.913768768310547, "global_step": 230629, "epoch": 1372} {"train_loss": -10.747426986694336, "global_step": 230630, "epoch": 1372} {"train_loss": -11.82467269897461, "global_step": 230631, "epoch": 1372} {"train_loss": -11.814164161682129, "global_step": 230632, "epoch": 1372} {"train_loss": -11.57664966583252, "global_step": 230633, "epoch": 1372} {"train_loss": -11.499539375305176, "global_step": 230634, "epoch": 1372} {"train_loss": -11.157297134399414, "global_step": 230635, "epoch": 1372} {"train_loss": -11.094842910766602, "global_step": 230636, "epoch": 1372} {"train_loss": -11.448202133178711, "global_step": 230637, "epoch": 1372} {"train_loss": -11.416711807250977, "global_step": 230638, "epoch": 1372} {"train_loss": -9.93482494354248, "global_step": 230639, "epoch": 1372} {"train_loss": -11.727851867675781, "global_step": 230640, "epoch": 1372} {"train_loss": -11.131093978881836, "global_step": 230641, "epoch": 1372} {"train_loss": -10.30355453491211, "global_step": 230642, "epoch": 1372} {"train_loss": -11.148468017578125, "global_step": 230643, "epoch": 1372} {"train_loss": -11.612220764160156, "global_step": 230644, "epoch": 1372} {"train_loss": -11.09433650970459, "global_step": 230645, "epoch": 1372} {"train_loss": -11.20887279510498, "global_step": 230646, "epoch": 1372} {"train_loss": -11.854578018188477, "global_step": 230647, "epoch": 1372} {"train_loss": -11.336441040039062, "global_step": 230648, "epoch": 1372} {"train_loss": -11.708026885986328, "global_step": 230649, "epoch": 1372} {"train_loss": -10.556983947753906, "global_step": 230650, "epoch": 1372} {"train_loss": -11.477585792541504, "global_step": 230651, "epoch": 1372} {"train_loss": -11.09379768371582, "global_step": 230652, "epoch": 1372} {"train_loss": -11.323348999023438, "global_step": 230653, "epoch": 1372} {"train_loss": -10.158194541931152, "global_step": 230654, "epoch": 1372} {"train_loss": -10.94375228881836, "global_step": 230655, "epoch": 1372} {"train_loss": -10.393413543701172, "global_step": 230656, "epoch": 1372} {"train_loss": -10.377988815307617, "global_step": 230657, "epoch": 1372} {"train_loss": -10.562362670898438, "global_step": 230658, "epoch": 1372} {"train_loss": -9.952884674072266, "global_step": 230659, "epoch": 1372} {"train_loss": -11.562196731567383, "global_step": 230660, "epoch": 1372} {"train_loss": -10.520622253417969, "global_step": 230661, "epoch": 1372} {"train_loss": -11.222929000854492, "global_step": 230662, "epoch": 1372} {"train_loss": -11.371501411710467, "global_step": 230663, "epoch": 1372, "val_loss": 262826.625} {"train_loss": -10.93273639678955, "global_step": 230664, "epoch": 1373} {"train_loss": -10.861154556274414, "global_step": 230665, "epoch": 1373} {"train_loss": -10.679159164428711, "global_step": 230666, "epoch": 1373} {"train_loss": -11.134746551513672, "global_step": 230667, "epoch": 1373} {"train_loss": -10.235873222351074, "global_step": 230668, "epoch": 1373} {"train_loss": -11.02872085571289, "global_step": 230669, "epoch": 1373} {"train_loss": -11.178750038146973, "global_step": 230670, "epoch": 1373} {"train_loss": -10.960290908813477, "global_step": 230671, "epoch": 1373} {"train_loss": -11.12038803100586, "global_step": 230672, "epoch": 1373} {"train_loss": -11.43531608581543, "global_step": 230673, "epoch": 1373} {"train_loss": -10.949657440185547, "global_step": 230674, "epoch": 1373} {"train_loss": -11.593086242675781, "global_step": 230675, "epoch": 1373} {"train_loss": -11.068429946899414, "global_step": 230676, "epoch": 1373} {"train_loss": -11.272570610046387, "global_step": 230677, "epoch": 1373} {"train_loss": -11.449106216430664, "global_step": 230678, "epoch": 1373} {"train_loss": -11.41388988494873, "global_step": 230679, "epoch": 1373} {"train_loss": -11.017621994018555, "global_step": 230680, "epoch": 1373} {"train_loss": -11.507617950439453, "global_step": 230681, "epoch": 1373} {"train_loss": -11.056388854980469, "global_step": 230682, "epoch": 1373} {"train_loss": -11.738199234008789, "global_step": 230683, "epoch": 1373} {"train_loss": -11.480680465698242, "global_step": 230684, "epoch": 1373} {"train_loss": -11.519070625305176, "global_step": 230685, "epoch": 1373} {"train_loss": -11.216419219970703, "global_step": 230686, "epoch": 1373} {"train_loss": -11.526250839233398, "global_step": 230687, "epoch": 1373} {"train_loss": -11.248772621154785, "global_step": 230688, "epoch": 1373} {"train_loss": -11.660844802856445, "global_step": 230689, "epoch": 1373} {"train_loss": -11.469711303710938, "global_step": 230690, "epoch": 1373} {"train_loss": -11.800369262695312, "global_step": 230691, "epoch": 1373} {"train_loss": -11.455394744873047, "global_step": 230692, "epoch": 1373} {"train_loss": -11.66773796081543, "global_step": 230693, "epoch": 1373} {"train_loss": -11.157674789428711, "global_step": 230694, "epoch": 1373} {"train_loss": -11.53628158569336, "global_step": 230695, "epoch": 1373} {"train_loss": -11.228170394897461, "global_step": 230696, "epoch": 1373} {"train_loss": -11.55215835571289, "global_step": 230697, "epoch": 1373} {"train_loss": -11.433982849121094, "global_step": 230698, "epoch": 1373} {"train_loss": -11.875665664672852, "global_step": 230699, "epoch": 1373} {"train_loss": -11.556931495666504, "global_step": 230700, "epoch": 1373} {"train_loss": -11.558534622192383, "global_step": 230701, "epoch": 1373} {"train_loss": -11.71533203125, "global_step": 230702, "epoch": 1373} {"train_loss": -11.39572811126709, "global_step": 230703, "epoch": 1373} {"train_loss": -11.706666946411133, "global_step": 230704, "epoch": 1373} {"train_loss": -11.826995849609375, "global_step": 230705, "epoch": 1373} {"train_loss": -11.679109573364258, "global_step": 230706, "epoch": 1373} {"train_loss": -11.554192543029785, "global_step": 230707, "epoch": 1373} {"train_loss": -11.6257905960083, "global_step": 230708, "epoch": 1373} {"train_loss": -11.496191024780273, "global_step": 230709, "epoch": 1373} {"train_loss": -11.904708862304688, "global_step": 230710, "epoch": 1373} {"train_loss": -11.608329772949219, "global_step": 230711, "epoch": 1373} {"train_loss": -11.492403030395508, "global_step": 230712, "epoch": 1373} {"train_loss": -11.737942695617676, "global_step": 230713, "epoch": 1373} {"train_loss": -11.492491722106934, "global_step": 230714, "epoch": 1373} {"train_loss": -11.846456527709961, "global_step": 230715, "epoch": 1373} {"train_loss": -11.575041770935059, "global_step": 230716, "epoch": 1373} {"train_loss": -11.661676406860352, "global_step": 230717, "epoch": 1373} {"train_loss": -11.782134056091309, "global_step": 230718, "epoch": 1373} {"train_loss": -11.677380561828613, "global_step": 230719, "epoch": 1373} {"train_loss": -12.008647918701172, "global_step": 230720, "epoch": 1373} {"train_loss": -11.478911399841309, "global_step": 230721, "epoch": 1373} {"train_loss": -11.733694076538086, "global_step": 230722, "epoch": 1373} {"train_loss": -11.767569541931152, "global_step": 230723, "epoch": 1373} {"train_loss": -11.456744194030762, "global_step": 230724, "epoch": 1373} {"train_loss": -12.03254222869873, "global_step": 230725, "epoch": 1373} {"train_loss": -10.961834907531738, "global_step": 230726, "epoch": 1373} {"train_loss": -11.494756698608398, "global_step": 230727, "epoch": 1373} {"train_loss": -11.724102020263672, "global_step": 230728, "epoch": 1373} {"train_loss": -11.274328231811523, "global_step": 230729, "epoch": 1373} {"train_loss": -12.017538070678711, "global_step": 230730, "epoch": 1373} {"train_loss": -11.562313079833984, "global_step": 230731, "epoch": 1373} {"train_loss": -11.857890129089355, "global_step": 230732, "epoch": 1373} {"train_loss": -11.810646057128906, "global_step": 230733, "epoch": 1373} {"train_loss": -11.8638916015625, "global_step": 230734, "epoch": 1373} {"train_loss": -11.462117195129395, "global_step": 230735, "epoch": 1373} {"train_loss": -11.97185230255127, "global_step": 230736, "epoch": 1373} {"train_loss": -11.52949333190918, "global_step": 230737, "epoch": 1373} {"train_loss": -11.96422004699707, "global_step": 230738, "epoch": 1373} {"train_loss": -11.723617553710938, "global_step": 230739, "epoch": 1373} {"train_loss": -11.62557601928711, "global_step": 230740, "epoch": 1373} {"train_loss": -11.435367584228516, "global_step": 230741, "epoch": 1373} {"train_loss": -11.122437477111816, "global_step": 230742, "epoch": 1373} {"train_loss": -11.222009658813477, "global_step": 230743, "epoch": 1373} {"train_loss": -12.049205780029297, "global_step": 230744, "epoch": 1373} {"train_loss": -11.33215618133545, "global_step": 230745, "epoch": 1373} {"train_loss": -11.245429992675781, "global_step": 230746, "epoch": 1373} {"train_loss": -11.355167388916016, "global_step": 230747, "epoch": 1373} {"train_loss": -11.422000885009766, "global_step": 230748, "epoch": 1373} {"train_loss": -11.423604965209961, "global_step": 230749, "epoch": 1373} {"train_loss": -11.542346954345703, "global_step": 230750, "epoch": 1373} {"train_loss": -11.659501075744629, "global_step": 230751, "epoch": 1373} {"train_loss": -11.621185302734375, "global_step": 230752, "epoch": 1373} {"train_loss": -11.195446968078613, "global_step": 230753, "epoch": 1373} {"train_loss": -11.381958961486816, "global_step": 230754, "epoch": 1373} {"train_loss": -11.731830596923828, "global_step": 230755, "epoch": 1373} {"train_loss": -11.472118377685547, "global_step": 230756, "epoch": 1373} {"train_loss": -11.640022277832031, "global_step": 230757, "epoch": 1373} {"train_loss": -11.15572452545166, "global_step": 230758, "epoch": 1373} {"train_loss": -11.43549633026123, "global_step": 230759, "epoch": 1373} {"train_loss": -11.560698509216309, "global_step": 230760, "epoch": 1373} {"train_loss": -11.516254425048828, "global_step": 230761, "epoch": 1373} {"train_loss": -11.875401496887207, "global_step": 230762, "epoch": 1373} {"train_loss": -11.662242889404297, "global_step": 230763, "epoch": 1373} {"train_loss": -11.947561264038086, "global_step": 230764, "epoch": 1373} {"train_loss": -11.911256790161133, "global_step": 230765, "epoch": 1373} {"train_loss": -11.742142677307129, "global_step": 230766, "epoch": 1373} {"train_loss": -11.80936050415039, "global_step": 230767, "epoch": 1373} {"train_loss": -11.556718826293945, "global_step": 230768, "epoch": 1373} {"train_loss": -11.74106216430664, "global_step": 230769, "epoch": 1373} {"train_loss": -11.404890060424805, "global_step": 230770, "epoch": 1373} {"train_loss": -11.661178588867188, "global_step": 230771, "epoch": 1373} {"train_loss": -11.58669662475586, "global_step": 230772, "epoch": 1373} {"train_loss": -11.801620483398438, "global_step": 230773, "epoch": 1373} {"train_loss": -11.587735176086426, "global_step": 230774, "epoch": 1373} {"train_loss": -12.024139404296875, "global_step": 230775, "epoch": 1373} {"train_loss": -11.197736740112305, "global_step": 230776, "epoch": 1373} {"train_loss": -11.107799530029297, "global_step": 230777, "epoch": 1373} {"train_loss": -11.828084945678711, "global_step": 230778, "epoch": 1373} {"train_loss": -11.616161346435547, "global_step": 230779, "epoch": 1373} {"train_loss": -11.370909690856934, "global_step": 230780, "epoch": 1373} {"train_loss": -11.908842086791992, "global_step": 230781, "epoch": 1373} {"train_loss": -11.469724655151367, "global_step": 230782, "epoch": 1373} {"train_loss": -11.789213180541992, "global_step": 230783, "epoch": 1373} {"train_loss": -11.610580444335938, "global_step": 230784, "epoch": 1373} {"train_loss": -11.550132751464844, "global_step": 230785, "epoch": 1373} {"train_loss": -12.137504577636719, "global_step": 230786, "epoch": 1373} {"train_loss": -11.733331680297852, "global_step": 230787, "epoch": 1373} {"train_loss": -11.727591514587402, "global_step": 230788, "epoch": 1373} {"train_loss": -11.927106857299805, "global_step": 230789, "epoch": 1373} {"train_loss": -11.800943374633789, "global_step": 230790, "epoch": 1373} {"train_loss": -11.524310111999512, "global_step": 230791, "epoch": 1373} {"train_loss": -11.968839645385742, "global_step": 230792, "epoch": 1373} {"train_loss": -11.425727844238281, "global_step": 230793, "epoch": 1373} {"train_loss": -11.731407165527344, "global_step": 230794, "epoch": 1373} {"train_loss": -12.01409912109375, "global_step": 230795, "epoch": 1373} {"train_loss": -11.458178520202637, "global_step": 230796, "epoch": 1373} {"train_loss": -11.847309112548828, "global_step": 230797, "epoch": 1373} {"train_loss": -11.847736358642578, "global_step": 230798, "epoch": 1373} {"train_loss": -11.595352172851562, "global_step": 230799, "epoch": 1373} {"train_loss": -10.772221565246582, "global_step": 230800, "epoch": 1373} {"train_loss": -10.583608627319336, "global_step": 230801, "epoch": 1373} {"train_loss": -11.873817443847656, "global_step": 230802, "epoch": 1373} {"train_loss": -11.101548194885254, "global_step": 230803, "epoch": 1373} {"train_loss": -11.462275505065918, "global_step": 230804, "epoch": 1373} {"train_loss": -11.764833450317383, "global_step": 230805, "epoch": 1373} {"train_loss": -10.918231964111328, "global_step": 230806, "epoch": 1373} {"train_loss": -11.455016136169434, "global_step": 230807, "epoch": 1373} {"train_loss": -11.906539916992188, "global_step": 230808, "epoch": 1373} {"train_loss": -11.750828742980957, "global_step": 230809, "epoch": 1373} {"train_loss": -11.912689208984375, "global_step": 230810, "epoch": 1373} {"train_loss": -11.980951309204102, "global_step": 230811, "epoch": 1373} {"train_loss": -11.487751960754395, "global_step": 230812, "epoch": 1373} {"train_loss": -11.82937240600586, "global_step": 230813, "epoch": 1373} {"train_loss": -11.630454063415527, "global_step": 230814, "epoch": 1373} {"train_loss": -11.506085395812988, "global_step": 230815, "epoch": 1373} {"train_loss": -11.582655906677246, "global_step": 230816, "epoch": 1373} {"train_loss": -11.437122344970703, "global_step": 230817, "epoch": 1373} {"train_loss": -11.706380844116211, "global_step": 230818, "epoch": 1373} {"train_loss": -11.501224517822266, "global_step": 230819, "epoch": 1373} {"train_loss": -11.623677253723145, "global_step": 230820, "epoch": 1373} {"train_loss": -11.764406204223633, "global_step": 230821, "epoch": 1373} {"train_loss": -11.616579055786133, "global_step": 230822, "epoch": 1373} {"train_loss": -11.672138214111328, "global_step": 230823, "epoch": 1373} {"train_loss": -11.442338943481445, "global_step": 230824, "epoch": 1373} {"train_loss": -11.72813892364502, "global_step": 230825, "epoch": 1373} {"train_loss": -11.201332092285156, "global_step": 230826, "epoch": 1373} {"train_loss": -11.34497356414795, "global_step": 230827, "epoch": 1373} {"train_loss": -11.201639175415039, "global_step": 230828, "epoch": 1373} {"train_loss": -11.32962703704834, "global_step": 230829, "epoch": 1373} {"train_loss": -10.93675422668457, "global_step": 230830, "epoch": 1373} {"train_loss": -11.533501108487448, "global_step": 230831, "epoch": 1373, "val_loss": 265897.09375} {"train_loss": -10.815877914428711, "global_step": 230832, "epoch": 1374} {"train_loss": -11.49740219116211, "global_step": 230833, "epoch": 1374} {"train_loss": -11.083891868591309, "global_step": 230834, "epoch": 1374} {"train_loss": -11.596115112304688, "global_step": 230835, "epoch": 1374} {"train_loss": -10.881576538085938, "global_step": 230836, "epoch": 1374} {"train_loss": -11.534330368041992, "global_step": 230837, "epoch": 1374} {"train_loss": -10.872954368591309, "global_step": 230838, "epoch": 1374} {"train_loss": -10.953922271728516, "global_step": 230839, "epoch": 1374} {"train_loss": -11.256624221801758, "global_step": 230840, "epoch": 1374} {"train_loss": -11.749731063842773, "global_step": 230841, "epoch": 1374} {"train_loss": -11.099785804748535, "global_step": 230842, "epoch": 1374} {"train_loss": -11.724977493286133, "global_step": 230843, "epoch": 1374} {"train_loss": -11.411128997802734, "global_step": 230844, "epoch": 1374} {"train_loss": -10.920827865600586, "global_step": 230845, "epoch": 1374} {"train_loss": -11.851838111877441, "global_step": 230846, "epoch": 1374} {"train_loss": -11.342536926269531, "global_step": 230847, "epoch": 1374} {"train_loss": -11.458280563354492, "global_step": 230848, "epoch": 1374} {"train_loss": -11.697693824768066, "global_step": 230849, "epoch": 1374} {"train_loss": -11.599044799804688, "global_step": 230850, "epoch": 1374} {"train_loss": -11.752553939819336, "global_step": 230851, "epoch": 1374} {"train_loss": -11.62802505493164, "global_step": 230852, "epoch": 1374} {"train_loss": -11.518102645874023, "global_step": 230853, "epoch": 1374} {"train_loss": -11.457420349121094, "global_step": 230854, "epoch": 1374} {"train_loss": -11.19536304473877, "global_step": 230855, "epoch": 1374} {"train_loss": -11.88296127319336, "global_step": 230856, "epoch": 1374} {"train_loss": -11.592050552368164, "global_step": 230857, "epoch": 1374} {"train_loss": -11.604546546936035, "global_step": 230858, "epoch": 1374} {"train_loss": -11.698786735534668, "global_step": 230859, "epoch": 1374} {"train_loss": -11.809067726135254, "global_step": 230860, "epoch": 1374} {"train_loss": -11.790483474731445, "global_step": 230861, "epoch": 1374} {"train_loss": -11.701911926269531, "global_step": 230862, "epoch": 1374} {"train_loss": -11.833036422729492, "global_step": 230863, "epoch": 1374} {"train_loss": -11.54036808013916, "global_step": 230864, "epoch": 1374} {"train_loss": -11.613479614257812, "global_step": 230865, "epoch": 1374} {"train_loss": -11.51681900024414, "global_step": 230866, "epoch": 1374} {"train_loss": -11.522470474243164, "global_step": 230867, "epoch": 1374} {"train_loss": -11.40662956237793, "global_step": 230868, "epoch": 1374} {"train_loss": -11.462911605834961, "global_step": 230869, "epoch": 1374} {"train_loss": -10.31789779663086, "global_step": 230870, "epoch": 1374} {"train_loss": -10.990127563476562, "global_step": 230871, "epoch": 1374} {"train_loss": -10.717177391052246, "global_step": 230872, "epoch": 1374} {"train_loss": -11.178032875061035, "global_step": 230873, "epoch": 1374} {"train_loss": -11.096477508544922, "global_step": 230874, "epoch": 1374} {"train_loss": -11.069356918334961, "global_step": 230875, "epoch": 1374} {"train_loss": -11.250245094299316, "global_step": 230876, "epoch": 1374} {"train_loss": -11.242269515991211, "global_step": 230877, "epoch": 1374} {"train_loss": -10.448641777038574, "global_step": 230878, "epoch": 1374} {"train_loss": -11.429859161376953, "global_step": 230879, "epoch": 1374} {"train_loss": -10.50042724609375, "global_step": 230880, "epoch": 1374} {"train_loss": -10.915224075317383, "global_step": 230881, "epoch": 1374} {"train_loss": -9.634113311767578, "global_step": 230882, "epoch": 1374} {"train_loss": -11.117448806762695, "global_step": 230883, "epoch": 1374} {"train_loss": -10.452598571777344, "global_step": 230884, "epoch": 1374} {"train_loss": -10.77337646484375, "global_step": 230885, "epoch": 1374} {"train_loss": -9.278768539428711, "global_step": 230886, "epoch": 1374} {"train_loss": -11.273796081542969, "global_step": 230887, "epoch": 1374} {"train_loss": -9.048524856567383, "global_step": 230888, "epoch": 1374} {"train_loss": -11.41118335723877, "global_step": 230889, "epoch": 1374} {"train_loss": -9.365781784057617, "global_step": 230890, "epoch": 1374} {"train_loss": -9.390890121459961, "global_step": 230891, "epoch": 1374} {"train_loss": -10.899576187133789, "global_step": 230892, "epoch": 1374} {"train_loss": -10.728287696838379, "global_step": 230893, "epoch": 1374} {"train_loss": -10.071240425109863, "global_step": 230894, "epoch": 1374} {"train_loss": -11.10986042022705, "global_step": 230895, "epoch": 1374} {"train_loss": -10.711038589477539, "global_step": 230896, "epoch": 1374} {"train_loss": -10.36492919921875, "global_step": 230897, "epoch": 1374} {"train_loss": -11.044403076171875, "global_step": 230898, "epoch": 1374} {"train_loss": -10.900943756103516, "global_step": 230899, "epoch": 1374} {"train_loss": -10.57048225402832, "global_step": 230900, "epoch": 1374} {"train_loss": -11.169027328491211, "global_step": 230901, "epoch": 1374} {"train_loss": -11.287601470947266, "global_step": 230902, "epoch": 1374} {"train_loss": -10.937369346618652, "global_step": 230903, "epoch": 1374} {"train_loss": -11.373048782348633, "global_step": 230904, "epoch": 1374} {"train_loss": -11.448149681091309, "global_step": 230905, "epoch": 1374} {"train_loss": -10.9680757522583, "global_step": 230906, "epoch": 1374} {"train_loss": -11.380329132080078, "global_step": 230907, "epoch": 1374} {"train_loss": -11.540952682495117, "global_step": 230908, "epoch": 1374} {"train_loss": -11.204010009765625, "global_step": 230909, "epoch": 1374} {"train_loss": -11.450119018554688, "global_step": 230910, "epoch": 1374} {"train_loss": -11.355711936950684, "global_step": 230911, "epoch": 1374} {"train_loss": -11.398909568786621, "global_step": 230912, "epoch": 1374} {"train_loss": -11.415008544921875, "global_step": 230913, "epoch": 1374} {"train_loss": -11.564480781555176, "global_step": 230914, "epoch": 1374} {"train_loss": -11.607090950012207, "global_step": 230915, "epoch": 1374} {"train_loss": -11.532499313354492, "global_step": 230916, "epoch": 1374} {"train_loss": -11.621850967407227, "global_step": 230917, "epoch": 1374} {"train_loss": -11.530767440795898, "global_step": 230918, "epoch": 1374} {"train_loss": -11.64509391784668, "global_step": 230919, "epoch": 1374} {"train_loss": -11.726924896240234, "global_step": 230920, "epoch": 1374} {"train_loss": -11.570734024047852, "global_step": 230921, "epoch": 1374} {"train_loss": -11.648378372192383, "global_step": 230922, "epoch": 1374} {"train_loss": -11.689926147460938, "global_step": 230923, "epoch": 1374} {"train_loss": -11.66456413269043, "global_step": 230924, "epoch": 1374} {"train_loss": -11.745728492736816, "global_step": 230925, "epoch": 1374} {"train_loss": -11.690025329589844, "global_step": 230926, "epoch": 1374} {"train_loss": -11.509733200073242, "global_step": 230927, "epoch": 1374} {"train_loss": -11.87884521484375, "global_step": 230928, "epoch": 1374} {"train_loss": -11.60413646697998, "global_step": 230929, "epoch": 1374} {"train_loss": -11.746782302856445, "global_step": 230930, "epoch": 1374} {"train_loss": -11.70926570892334, "global_step": 230931, "epoch": 1374} {"train_loss": -11.598213195800781, "global_step": 230932, "epoch": 1374} {"train_loss": -11.664899826049805, "global_step": 230933, "epoch": 1374} {"train_loss": -11.783498764038086, "global_step": 230934, "epoch": 1374} {"train_loss": -11.713747024536133, "global_step": 230935, "epoch": 1374} {"train_loss": -11.80320930480957, "global_step": 230936, "epoch": 1374} {"train_loss": -11.814764022827148, "global_step": 230937, "epoch": 1374} {"train_loss": -11.893610000610352, "global_step": 230938, "epoch": 1374} {"train_loss": -11.85968017578125, "global_step": 230939, "epoch": 1374} {"train_loss": -11.765890121459961, "global_step": 230940, "epoch": 1374} {"train_loss": -11.993036270141602, "global_step": 230941, "epoch": 1374} {"train_loss": -12.086875915527344, "global_step": 230942, "epoch": 1374} {"train_loss": -11.983719825744629, "global_step": 230943, "epoch": 1374} {"train_loss": -11.653641700744629, "global_step": 230944, "epoch": 1374} {"train_loss": -11.913026809692383, "global_step": 230945, "epoch": 1374} {"train_loss": -12.04033088684082, "global_step": 230946, "epoch": 1374} {"train_loss": -11.734491348266602, "global_step": 230947, "epoch": 1374} {"train_loss": -12.012641906738281, "global_step": 230948, "epoch": 1374} {"train_loss": -11.968917846679688, "global_step": 230949, "epoch": 1374} {"train_loss": -12.011054992675781, "global_step": 230950, "epoch": 1374} {"train_loss": -11.97043514251709, "global_step": 230951, "epoch": 1374} {"train_loss": -11.93264389038086, "global_step": 230952, "epoch": 1374} {"train_loss": -11.938793182373047, "global_step": 230953, "epoch": 1374} {"train_loss": -11.98802375793457, "global_step": 230954, "epoch": 1374} {"train_loss": -12.0236177444458, "global_step": 230955, "epoch": 1374} {"train_loss": -11.974443435668945, "global_step": 230956, "epoch": 1374} {"train_loss": -12.051963806152344, "global_step": 230957, "epoch": 1374} {"train_loss": -12.036651611328125, "global_step": 230958, "epoch": 1374} {"train_loss": -12.106739044189453, "global_step": 230959, "epoch": 1374} {"train_loss": -11.976173400878906, "global_step": 230960, "epoch": 1374} {"train_loss": -11.812411308288574, "global_step": 230961, "epoch": 1374} {"train_loss": -11.890637397766113, "global_step": 230962, "epoch": 1374} {"train_loss": -11.783985137939453, "global_step": 230963, "epoch": 1374} {"train_loss": -12.008291244506836, "global_step": 230964, "epoch": 1374} {"train_loss": -11.811948776245117, "global_step": 230965, "epoch": 1374} {"train_loss": -11.744245529174805, "global_step": 230966, "epoch": 1374} {"train_loss": -12.180803298950195, "global_step": 230967, "epoch": 1374} {"train_loss": -11.95600700378418, "global_step": 230968, "epoch": 1374} {"train_loss": -11.614849090576172, "global_step": 230969, "epoch": 1374} {"train_loss": -11.811206817626953, "global_step": 230970, "epoch": 1374} {"train_loss": -11.993546485900879, "global_step": 230971, "epoch": 1374} {"train_loss": -12.025275230407715, "global_step": 230972, "epoch": 1374} {"train_loss": -12.141549110412598, "global_step": 230973, "epoch": 1374} {"train_loss": -12.056925773620605, "global_step": 230974, "epoch": 1374} {"train_loss": -11.715720176696777, "global_step": 230975, "epoch": 1374} {"train_loss": -12.113232612609863, "global_step": 230976, "epoch": 1374} {"train_loss": -11.694490432739258, "global_step": 230977, "epoch": 1374} {"train_loss": -11.832897186279297, "global_step": 230978, "epoch": 1374} {"train_loss": -10.445741653442383, "global_step": 230979, "epoch": 1374} {"train_loss": -12.091073989868164, "global_step": 230980, "epoch": 1374} {"train_loss": -11.269636154174805, "global_step": 230981, "epoch": 1374} {"train_loss": -11.658228874206543, "global_step": 230982, "epoch": 1374} {"train_loss": -11.33544921875, "global_step": 230983, "epoch": 1374} {"train_loss": -11.734972953796387, "global_step": 230984, "epoch": 1374} {"train_loss": -11.227568626403809, "global_step": 230985, "epoch": 1374} {"train_loss": -11.824723243713379, "global_step": 230986, "epoch": 1374} {"train_loss": -11.889925956726074, "global_step": 230987, "epoch": 1374} {"train_loss": -11.997117042541504, "global_step": 230988, "epoch": 1374} {"train_loss": -11.84521484375, "global_step": 230989, "epoch": 1374} {"train_loss": -11.812270164489746, "global_step": 230990, "epoch": 1374} {"train_loss": -11.643850326538086, "global_step": 230991, "epoch": 1374} {"train_loss": -12.128942489624023, "global_step": 230992, "epoch": 1374} {"train_loss": -11.877155303955078, "global_step": 230993, "epoch": 1374} {"train_loss": -11.654389381408691, "global_step": 230994, "epoch": 1374} {"train_loss": -11.868310928344727, "global_step": 230995, "epoch": 1374} {"train_loss": -11.936538696289062, "global_step": 230996, "epoch": 1374} {"train_loss": -12.105313301086426, "global_step": 230997, "epoch": 1374} {"train_loss": -11.749944686889648, "global_step": 230998, "epoch": 1374} {"train_loss": -11.469618178549267, "global_step": 230999, "epoch": 1374, "val_loss": 263628.90625} {"train_loss": -10.833030700683594, "global_step": 231000, "epoch": 1375} {"train_loss": -11.012840270996094, "global_step": 231001, "epoch": 1375} {"train_loss": -11.797868728637695, "global_step": 231002, "epoch": 1375} {"train_loss": -11.136638641357422, "global_step": 231003, "epoch": 1375} {"train_loss": -10.108251571655273, "global_step": 231004, "epoch": 1375} {"train_loss": -11.321971893310547, "global_step": 231005, "epoch": 1375} {"train_loss": -10.329696655273438, "global_step": 231006, "epoch": 1375} {"train_loss": -7.597770690917969, "global_step": 231007, "epoch": 1375} {"train_loss": -10.603997230529785, "global_step": 231008, "epoch": 1375} {"train_loss": -7.6722846031188965, "global_step": 231009, "epoch": 1375} {"train_loss": -10.399761199951172, "global_step": 231010, "epoch": 1375} {"train_loss": -8.641559600830078, "global_step": 231011, "epoch": 1375} {"train_loss": -9.984342575073242, "global_step": 231012, "epoch": 1375} {"train_loss": -9.078307151794434, "global_step": 231013, "epoch": 1375} {"train_loss": -10.643965721130371, "global_step": 231014, "epoch": 1375} {"train_loss": -10.232013702392578, "global_step": 231015, "epoch": 1375} {"train_loss": -10.220951080322266, "global_step": 231016, "epoch": 1375} {"train_loss": -10.389995574951172, "global_step": 231017, "epoch": 1375} {"train_loss": -10.593932151794434, "global_step": 231018, "epoch": 1375} {"train_loss": -10.055709838867188, "global_step": 231019, "epoch": 1375} {"train_loss": -10.48344898223877, "global_step": 231020, "epoch": 1375} {"train_loss": -11.245586395263672, "global_step": 231021, "epoch": 1375} {"train_loss": -10.695496559143066, "global_step": 231022, "epoch": 1375} {"train_loss": -11.372672080993652, "global_step": 231023, "epoch": 1375} {"train_loss": -10.686909675598145, "global_step": 231024, "epoch": 1375} {"train_loss": -11.444164276123047, "global_step": 231025, "epoch": 1375} {"train_loss": -11.04589557647705, "global_step": 231026, "epoch": 1375} {"train_loss": -11.268274307250977, "global_step": 231027, "epoch": 1375} {"train_loss": -10.883512496948242, "global_step": 231028, "epoch": 1375} {"train_loss": -11.253744125366211, "global_step": 231029, "epoch": 1375} {"train_loss": -10.839064598083496, "global_step": 231030, "epoch": 1375} {"train_loss": -11.37192153930664, "global_step": 231031, "epoch": 1375} {"train_loss": -11.369240760803223, "global_step": 231032, "epoch": 1375} {"train_loss": -11.345840454101562, "global_step": 231033, "epoch": 1375} {"train_loss": -11.258125305175781, "global_step": 231034, "epoch": 1375} {"train_loss": -11.184322357177734, "global_step": 231035, "epoch": 1375} {"train_loss": -11.080131530761719, "global_step": 231036, "epoch": 1375} {"train_loss": -11.529125213623047, "global_step": 231037, "epoch": 1375} {"train_loss": -11.097806930541992, "global_step": 231038, "epoch": 1375} {"train_loss": -11.521736145019531, "global_step": 231039, "epoch": 1375} {"train_loss": -11.280710220336914, "global_step": 231040, "epoch": 1375} {"train_loss": -11.058196067810059, "global_step": 231041, "epoch": 1375} {"train_loss": -11.201809883117676, "global_step": 231042, "epoch": 1375} {"train_loss": -11.439529418945312, "global_step": 231043, "epoch": 1375} {"train_loss": -11.432388305664062, "global_step": 231044, "epoch": 1375} {"train_loss": -11.378206253051758, "global_step": 231045, "epoch": 1375} {"train_loss": -11.160039901733398, "global_step": 231046, "epoch": 1375} {"train_loss": -11.431684494018555, "global_step": 231047, "epoch": 1375} {"train_loss": -11.602142333984375, "global_step": 231048, "epoch": 1375} {"train_loss": -11.540523529052734, "global_step": 231049, "epoch": 1375} {"train_loss": -11.847640991210938, "global_step": 231050, "epoch": 1375} {"train_loss": -11.39683723449707, "global_step": 231051, "epoch": 1375} {"train_loss": -11.653175354003906, "global_step": 231052, "epoch": 1375} {"train_loss": -11.678950309753418, "global_step": 231053, "epoch": 1375} {"train_loss": -11.8350248336792, "global_step": 231054, "epoch": 1375} {"train_loss": -11.670415878295898, "global_step": 231055, "epoch": 1375} {"train_loss": -11.60606575012207, "global_step": 231056, "epoch": 1375} {"train_loss": -11.637514114379883, "global_step": 231057, "epoch": 1375} {"train_loss": -11.759376525878906, "global_step": 231058, "epoch": 1375} {"train_loss": -11.555797576904297, "global_step": 231059, "epoch": 1375} {"train_loss": -11.794660568237305, "global_step": 231060, "epoch": 1375} {"train_loss": -11.6511869430542, "global_step": 231061, "epoch": 1375} {"train_loss": -11.838748931884766, "global_step": 231062, "epoch": 1375} {"train_loss": -11.573808670043945, "global_step": 231063, "epoch": 1375} {"train_loss": -11.585845947265625, "global_step": 231064, "epoch": 1375} {"train_loss": -11.697366714477539, "global_step": 231065, "epoch": 1375} {"train_loss": -11.724349975585938, "global_step": 231066, "epoch": 1375} {"train_loss": -11.515057563781738, "global_step": 231067, "epoch": 1375} {"train_loss": -11.797843933105469, "global_step": 231068, "epoch": 1375} {"train_loss": -11.614012718200684, "global_step": 231069, "epoch": 1375} {"train_loss": -11.457765579223633, "global_step": 231070, "epoch": 1375} {"train_loss": -11.673056602478027, "global_step": 231071, "epoch": 1375} {"train_loss": -11.599708557128906, "global_step": 231072, "epoch": 1375} {"train_loss": -11.974567413330078, "global_step": 231073, "epoch": 1375} {"train_loss": -11.867074966430664, "global_step": 231074, "epoch": 1375} {"train_loss": -11.804698944091797, "global_step": 231075, "epoch": 1375} {"train_loss": -11.812137603759766, "global_step": 231076, "epoch": 1375} {"train_loss": -12.005104064941406, "global_step": 231077, "epoch": 1375} {"train_loss": -11.976238250732422, "global_step": 231078, "epoch": 1375} {"train_loss": -11.697595596313477, "global_step": 231079, "epoch": 1375} {"train_loss": -11.981439590454102, "global_step": 231080, "epoch": 1375} {"train_loss": -11.90575122833252, "global_step": 231081, "epoch": 1375} {"train_loss": -11.864127159118652, "global_step": 231082, "epoch": 1375} {"train_loss": -11.927289962768555, "global_step": 231083, "epoch": 1375} {"train_loss": -11.878799438476562, "global_step": 231084, "epoch": 1375} {"train_loss": -11.723556518554688, "global_step": 231085, "epoch": 1375} {"train_loss": -11.704139709472656, "global_step": 231086, "epoch": 1375} {"train_loss": -11.712261199951172, "global_step": 231087, "epoch": 1375} {"train_loss": -11.598599433898926, "global_step": 231088, "epoch": 1375} {"train_loss": -11.768973350524902, "global_step": 231089, "epoch": 1375} {"train_loss": -11.475951194763184, "global_step": 231090, "epoch": 1375} {"train_loss": -11.935649871826172, "global_step": 231091, "epoch": 1375} {"train_loss": -11.753843307495117, "global_step": 231092, "epoch": 1375} {"train_loss": -11.87628173828125, "global_step": 231093, "epoch": 1375} {"train_loss": -12.006012916564941, "global_step": 231094, "epoch": 1375} {"train_loss": -11.490421295166016, "global_step": 231095, "epoch": 1375} {"train_loss": -11.698484420776367, "global_step": 231096, "epoch": 1375} {"train_loss": -11.612079620361328, "global_step": 231097, "epoch": 1375} {"train_loss": -11.996274948120117, "global_step": 231098, "epoch": 1375} {"train_loss": -11.838800430297852, "global_step": 231099, "epoch": 1375} {"train_loss": -11.955402374267578, "global_step": 231100, "epoch": 1375} {"train_loss": -11.867369651794434, "global_step": 231101, "epoch": 1375} {"train_loss": -11.62253189086914, "global_step": 231102, "epoch": 1375} {"train_loss": -11.997611999511719, "global_step": 231103, "epoch": 1375} {"train_loss": -11.384052276611328, "global_step": 231104, "epoch": 1375} {"train_loss": -11.502233505249023, "global_step": 231105, "epoch": 1375} {"train_loss": -11.507914543151855, "global_step": 231106, "epoch": 1375} {"train_loss": -11.748467445373535, "global_step": 231107, "epoch": 1375} {"train_loss": -11.29067325592041, "global_step": 231108, "epoch": 1375} {"train_loss": -11.308639526367188, "global_step": 231109, "epoch": 1375} {"train_loss": -11.581785202026367, "global_step": 231110, "epoch": 1375} {"train_loss": -10.696550369262695, "global_step": 231111, "epoch": 1375} {"train_loss": -11.135345458984375, "global_step": 231112, "epoch": 1375} {"train_loss": -11.558523178100586, "global_step": 231113, "epoch": 1375} {"train_loss": -11.670495986938477, "global_step": 231114, "epoch": 1375} {"train_loss": -11.365652084350586, "global_step": 231115, "epoch": 1375} {"train_loss": -11.601447105407715, "global_step": 231116, "epoch": 1375} {"train_loss": -11.95488166809082, "global_step": 231117, "epoch": 1375} {"train_loss": -11.52067756652832, "global_step": 231118, "epoch": 1375} {"train_loss": -11.761102676391602, "global_step": 231119, "epoch": 1375} {"train_loss": -11.816092491149902, "global_step": 231120, "epoch": 1375} {"train_loss": -11.90194320678711, "global_step": 231121, "epoch": 1375} {"train_loss": -11.74429702758789, "global_step": 231122, "epoch": 1375} {"train_loss": -11.436649322509766, "global_step": 231123, "epoch": 1375} {"train_loss": -11.972890853881836, "global_step": 231124, "epoch": 1375} {"train_loss": -11.588061332702637, "global_step": 231125, "epoch": 1375} {"train_loss": -11.882166862487793, "global_step": 231126, "epoch": 1375} {"train_loss": -11.283486366271973, "global_step": 231127, "epoch": 1375} {"train_loss": -11.76547622680664, "global_step": 231128, "epoch": 1375} {"train_loss": -11.449499130249023, "global_step": 231129, "epoch": 1375} {"train_loss": -10.921239852905273, "global_step": 231130, "epoch": 1375} {"train_loss": -10.516324996948242, "global_step": 231131, "epoch": 1375} {"train_loss": -11.590047836303711, "global_step": 231132, "epoch": 1375} {"train_loss": -10.954205513000488, "global_step": 231133, "epoch": 1375} {"train_loss": -10.54808235168457, "global_step": 231134, "epoch": 1375} {"train_loss": -11.159807205200195, "global_step": 231135, "epoch": 1375} {"train_loss": -10.888763427734375, "global_step": 231136, "epoch": 1375} {"train_loss": -9.690207481384277, "global_step": 231137, "epoch": 1375} {"train_loss": -11.011285781860352, "global_step": 231138, "epoch": 1375} {"train_loss": -6.970162868499756, "global_step": 231139, "epoch": 1375} {"train_loss": -6.781379699707031, "global_step": 231140, "epoch": 1375} {"train_loss": -7.1504974365234375, "global_step": 231141, "epoch": 1375} {"train_loss": -8.766545295715332, "global_step": 231142, "epoch": 1375} {"train_loss": -7.144918918609619, "global_step": 231143, "epoch": 1375} {"train_loss": -6.712763786315918, "global_step": 231144, "epoch": 1375} {"train_loss": -6.624015808105469, "global_step": 231145, "epoch": 1375} {"train_loss": -6.737968444824219, "global_step": 231146, "epoch": 1375} {"train_loss": -7.3682942390441895, "global_step": 231147, "epoch": 1375} {"train_loss": -7.949162483215332, "global_step": 231148, "epoch": 1375} {"train_loss": -7.304749488830566, "global_step": 231149, "epoch": 1375} {"train_loss": -7.573580741882324, "global_step": 231150, "epoch": 1375} {"train_loss": -8.641420364379883, "global_step": 231151, "epoch": 1375} {"train_loss": -7.976119041442871, "global_step": 231152, "epoch": 1375} {"train_loss": -8.119719505310059, "global_step": 231153, "epoch": 1375} {"train_loss": -9.523750305175781, "global_step": 231154, "epoch": 1375} {"train_loss": -9.01925277709961, "global_step": 231155, "epoch": 1375} {"train_loss": -9.027255058288574, "global_step": 231156, "epoch": 1375} {"train_loss": -9.864931106567383, "global_step": 231157, "epoch": 1375} {"train_loss": -10.396323204040527, "global_step": 231158, "epoch": 1375} {"train_loss": -10.60875129699707, "global_step": 231159, "epoch": 1375} {"train_loss": -10.751486778259277, "global_step": 231160, "epoch": 1375} {"train_loss": -10.702816009521484, "global_step": 231161, "epoch": 1375} {"train_loss": -10.327688217163086, "global_step": 231162, "epoch": 1375} {"train_loss": -10.274818420410156, "global_step": 231163, "epoch": 1375} {"train_loss": -10.572294235229492, "global_step": 231164, "epoch": 1375} {"train_loss": -10.61056900024414, "global_step": 231165, "epoch": 1375} {"train_loss": -10.917060852050781, "global_step": 231166, "epoch": 1375} {"train_loss": -10.872817533356804, "global_step": 231167, "epoch": 1375, "val_loss": 249478.28125, "train_action_mse_error": 3.4607462882995605} {"train_loss": -10.660735130310059, "global_step": 231168, "epoch": 1376} {"train_loss": -10.827325820922852, "global_step": 231169, "epoch": 1376} {"train_loss": -10.93699836730957, "global_step": 231170, "epoch": 1376} {"train_loss": -10.76011848449707, "global_step": 231171, "epoch": 1376} {"train_loss": -11.132440567016602, "global_step": 231172, "epoch": 1376} {"train_loss": -11.108955383300781, "global_step": 231173, "epoch": 1376} {"train_loss": -11.19791030883789, "global_step": 231174, "epoch": 1376} {"train_loss": -11.047605514526367, "global_step": 231175, "epoch": 1376} {"train_loss": -10.998023986816406, "global_step": 231176, "epoch": 1376} {"train_loss": -11.101068496704102, "global_step": 231177, "epoch": 1376} {"train_loss": -10.953458786010742, "global_step": 231178, "epoch": 1376} {"train_loss": -11.239389419555664, "global_step": 231179, "epoch": 1376} {"train_loss": -11.304659843444824, "global_step": 231180, "epoch": 1376} {"train_loss": -11.295331954956055, "global_step": 231181, "epoch": 1376} {"train_loss": -11.188982009887695, "global_step": 231182, "epoch": 1376} {"train_loss": -11.593531608581543, "global_step": 231183, "epoch": 1376} {"train_loss": -11.45283317565918, "global_step": 231184, "epoch": 1376} {"train_loss": -11.412344932556152, "global_step": 231185, "epoch": 1376} {"train_loss": -11.560245513916016, "global_step": 231186, "epoch": 1376} {"train_loss": -11.439628601074219, "global_step": 231187, "epoch": 1376} {"train_loss": -11.389131546020508, "global_step": 231188, "epoch": 1376} {"train_loss": -11.326339721679688, "global_step": 231189, "epoch": 1376} {"train_loss": -11.442137718200684, "global_step": 231190, "epoch": 1376} {"train_loss": -11.609992980957031, "global_step": 231191, "epoch": 1376} {"train_loss": -11.417258262634277, "global_step": 231192, "epoch": 1376} {"train_loss": -11.566790580749512, "global_step": 231193, "epoch": 1376} {"train_loss": -11.483733177185059, "global_step": 231194, "epoch": 1376} {"train_loss": -11.573789596557617, "global_step": 231195, "epoch": 1376} {"train_loss": -11.676445960998535, "global_step": 231196, "epoch": 1376} {"train_loss": -11.444698333740234, "global_step": 231197, "epoch": 1376} {"train_loss": -11.477684020996094, "global_step": 231198, "epoch": 1376} {"train_loss": -11.593924522399902, "global_step": 231199, "epoch": 1376} {"train_loss": -11.580057144165039, "global_step": 231200, "epoch": 1376} {"train_loss": -11.854650497436523, "global_step": 231201, "epoch": 1376} {"train_loss": -11.594446182250977, "global_step": 231202, "epoch": 1376} {"train_loss": -11.572226524353027, "global_step": 231203, "epoch": 1376} {"train_loss": -11.551732063293457, "global_step": 231204, "epoch": 1376} {"train_loss": -11.55181884765625, "global_step": 231205, "epoch": 1376} {"train_loss": -11.562583923339844, "global_step": 231206, "epoch": 1376} {"train_loss": -11.770962715148926, "global_step": 231207, "epoch": 1376} {"train_loss": -11.884770393371582, "global_step": 231208, "epoch": 1376} {"train_loss": -11.692676544189453, "global_step": 231209, "epoch": 1376} {"train_loss": -11.701055526733398, "global_step": 231210, "epoch": 1376} {"train_loss": -11.708342552185059, "global_step": 231211, "epoch": 1376} {"train_loss": -11.800174713134766, "global_step": 231212, "epoch": 1376} {"train_loss": -11.645172119140625, "global_step": 231213, "epoch": 1376} {"train_loss": -11.691095352172852, "global_step": 231214, "epoch": 1376} {"train_loss": -11.445844650268555, "global_step": 231215, "epoch": 1376} {"train_loss": -11.82412052154541, "global_step": 231216, "epoch": 1376} {"train_loss": -11.560548782348633, "global_step": 231217, "epoch": 1376} {"train_loss": -11.678211212158203, "global_step": 231218, "epoch": 1376} {"train_loss": -11.583749771118164, "global_step": 231219, "epoch": 1376} {"train_loss": -11.441102981567383, "global_step": 231220, "epoch": 1376} {"train_loss": -11.132469177246094, "global_step": 231221, "epoch": 1376} {"train_loss": -11.796384811401367, "global_step": 231222, "epoch": 1376} {"train_loss": -11.371984481811523, "global_step": 231223, "epoch": 1376} {"train_loss": -11.446730613708496, "global_step": 231224, "epoch": 1376} {"train_loss": -11.171910285949707, "global_step": 231225, "epoch": 1376} {"train_loss": -11.220205307006836, "global_step": 231226, "epoch": 1376} {"train_loss": -11.736800193786621, "global_step": 231227, "epoch": 1376} {"train_loss": -11.430614471435547, "global_step": 231228, "epoch": 1376} {"train_loss": -10.757013320922852, "global_step": 231229, "epoch": 1376} {"train_loss": -11.524894714355469, "global_step": 231230, "epoch": 1376} {"train_loss": -8.638397216796875, "global_step": 231231, "epoch": 1376} {"train_loss": -11.133516311645508, "global_step": 231232, "epoch": 1376} {"train_loss": -9.367143630981445, "global_step": 231233, "epoch": 1376} {"train_loss": -9.370826721191406, "global_step": 231234, "epoch": 1376} {"train_loss": -10.275077819824219, "global_step": 231235, "epoch": 1376} {"train_loss": -8.68652629852295, "global_step": 231236, "epoch": 1376} {"train_loss": -10.963396072387695, "global_step": 231237, "epoch": 1376} {"train_loss": -8.911911010742188, "global_step": 231238, "epoch": 1376} {"train_loss": -11.220405578613281, "global_step": 231239, "epoch": 1376} {"train_loss": -10.232015609741211, "global_step": 231240, "epoch": 1376} {"train_loss": -11.231367111206055, "global_step": 231241, "epoch": 1376} {"train_loss": -10.17457103729248, "global_step": 231242, "epoch": 1376} {"train_loss": -11.332746505737305, "global_step": 231243, "epoch": 1376} {"train_loss": -10.033818244934082, "global_step": 231244, "epoch": 1376} {"train_loss": -11.383331298828125, "global_step": 231245, "epoch": 1376} {"train_loss": -10.610773086547852, "global_step": 231246, "epoch": 1376} {"train_loss": -11.297040939331055, "global_step": 231247, "epoch": 1376} {"train_loss": -10.799776077270508, "global_step": 231248, "epoch": 1376} {"train_loss": -11.37626838684082, "global_step": 231249, "epoch": 1376} {"train_loss": -11.096025466918945, "global_step": 231250, "epoch": 1376} {"train_loss": -11.618598937988281, "global_step": 231251, "epoch": 1376} {"train_loss": -11.230241775512695, "global_step": 231252, "epoch": 1376} {"train_loss": -11.419983863830566, "global_step": 231253, "epoch": 1376} {"train_loss": -11.545226097106934, "global_step": 231254, "epoch": 1376} {"train_loss": -11.368693351745605, "global_step": 231255, "epoch": 1376} {"train_loss": -11.674125671386719, "global_step": 231256, "epoch": 1376} {"train_loss": -11.16281509399414, "global_step": 231257, "epoch": 1376} {"train_loss": -11.44709587097168, "global_step": 231258, "epoch": 1376} {"train_loss": -11.44472885131836, "global_step": 231259, "epoch": 1376} {"train_loss": -11.467987060546875, "global_step": 231260, "epoch": 1376} {"train_loss": -11.658645629882812, "global_step": 231261, "epoch": 1376} {"train_loss": -11.454217910766602, "global_step": 231262, "epoch": 1376} {"train_loss": -11.634961128234863, "global_step": 231263, "epoch": 1376} {"train_loss": -11.623431205749512, "global_step": 231264, "epoch": 1376} {"train_loss": -11.342291831970215, "global_step": 231265, "epoch": 1376} {"train_loss": -11.789562225341797, "global_step": 231266, "epoch": 1376} {"train_loss": -11.945465087890625, "global_step": 231267, "epoch": 1376} {"train_loss": -11.613605499267578, "global_step": 231268, "epoch": 1376} {"train_loss": -11.553539276123047, "global_step": 231269, "epoch": 1376} {"train_loss": -11.890009880065918, "global_step": 231270, "epoch": 1376} {"train_loss": -11.696922302246094, "global_step": 231271, "epoch": 1376} {"train_loss": -11.77366828918457, "global_step": 231272, "epoch": 1376} {"train_loss": -11.668535232543945, "global_step": 231273, "epoch": 1376} {"train_loss": -11.847990989685059, "global_step": 231274, "epoch": 1376} {"train_loss": -11.558550834655762, "global_step": 231275, "epoch": 1376} {"train_loss": -11.73610782623291, "global_step": 231276, "epoch": 1376} {"train_loss": -11.766145706176758, "global_step": 231277, "epoch": 1376} {"train_loss": -11.435689926147461, "global_step": 231278, "epoch": 1376} {"train_loss": -11.819311141967773, "global_step": 231279, "epoch": 1376} {"train_loss": -11.760932922363281, "global_step": 231280, "epoch": 1376} {"train_loss": -11.752137184143066, "global_step": 231281, "epoch": 1376} {"train_loss": -11.496480941772461, "global_step": 231282, "epoch": 1376} {"train_loss": -11.652740478515625, "global_step": 231283, "epoch": 1376} {"train_loss": -11.830143928527832, "global_step": 231284, "epoch": 1376} {"train_loss": -11.909191131591797, "global_step": 231285, "epoch": 1376} {"train_loss": -11.788424491882324, "global_step": 231286, "epoch": 1376} {"train_loss": -11.700695037841797, "global_step": 231287, "epoch": 1376} {"train_loss": -11.64598274230957, "global_step": 231288, "epoch": 1376} {"train_loss": -11.921972274780273, "global_step": 231289, "epoch": 1376} {"train_loss": -11.80693531036377, "global_step": 231290, "epoch": 1376} {"train_loss": -12.116207122802734, "global_step": 231291, "epoch": 1376} {"train_loss": -11.808853149414062, "global_step": 231292, "epoch": 1376} {"train_loss": -11.762081146240234, "global_step": 231293, "epoch": 1376} {"train_loss": -11.881481170654297, "global_step": 231294, "epoch": 1376} {"train_loss": -11.9520263671875, "global_step": 231295, "epoch": 1376} {"train_loss": -11.979951858520508, "global_step": 231296, "epoch": 1376} {"train_loss": -11.941902160644531, "global_step": 231297, "epoch": 1376} {"train_loss": -11.835905075073242, "global_step": 231298, "epoch": 1376} {"train_loss": -11.87928581237793, "global_step": 231299, "epoch": 1376} {"train_loss": -12.087875366210938, "global_step": 231300, "epoch": 1376} {"train_loss": -11.827777862548828, "global_step": 231301, "epoch": 1376} {"train_loss": -11.758627891540527, "global_step": 231302, "epoch": 1376} {"train_loss": -11.814470291137695, "global_step": 231303, "epoch": 1376} {"train_loss": -11.94272518157959, "global_step": 231304, "epoch": 1376} {"train_loss": -11.358967781066895, "global_step": 231305, "epoch": 1376} {"train_loss": -12.054176330566406, "global_step": 231306, "epoch": 1376} {"train_loss": -11.37427806854248, "global_step": 231307, "epoch": 1376} {"train_loss": -11.847139358520508, "global_step": 231308, "epoch": 1376} {"train_loss": -11.709590911865234, "global_step": 231309, "epoch": 1376} {"train_loss": -11.393877983093262, "global_step": 231310, "epoch": 1376} {"train_loss": -11.765188217163086, "global_step": 231311, "epoch": 1376} {"train_loss": -11.688118934631348, "global_step": 231312, "epoch": 1376} {"train_loss": -11.459610939025879, "global_step": 231313, "epoch": 1376} {"train_loss": -11.71738052368164, "global_step": 231314, "epoch": 1376} {"train_loss": -11.848578453063965, "global_step": 231315, "epoch": 1376} {"train_loss": -11.513045310974121, "global_step": 231316, "epoch": 1376} {"train_loss": -11.76297378540039, "global_step": 231317, "epoch": 1376} {"train_loss": -11.57846736907959, "global_step": 231318, "epoch": 1376} {"train_loss": -11.007950782775879, "global_step": 231319, "epoch": 1376} {"train_loss": -11.864419937133789, "global_step": 231320, "epoch": 1376} {"train_loss": -11.694260597229004, "global_step": 231321, "epoch": 1376} {"train_loss": -11.090822219848633, "global_step": 231322, "epoch": 1376} {"train_loss": -11.04778003692627, "global_step": 231323, "epoch": 1376} {"train_loss": -11.641338348388672, "global_step": 231324, "epoch": 1376} {"train_loss": -11.143281936645508, "global_step": 231325, "epoch": 1376} {"train_loss": -11.596464157104492, "global_step": 231326, "epoch": 1376} {"train_loss": -11.448139190673828, "global_step": 231327, "epoch": 1376} {"train_loss": -11.861323356628418, "global_step": 231328, "epoch": 1376} {"train_loss": -10.323423385620117, "global_step": 231329, "epoch": 1376} {"train_loss": -11.036233901977539, "global_step": 231330, "epoch": 1376} {"train_loss": -11.649014472961426, "global_step": 231331, "epoch": 1376} {"train_loss": -10.954462051391602, "global_step": 231332, "epoch": 1376} {"train_loss": -11.484106063842773, "global_step": 231333, "epoch": 1376} {"train_loss": -11.757955551147461, "global_step": 231334, "epoch": 1376} {"train_loss": -11.406988592374892, "global_step": 231335, "epoch": 1376, "val_loss": 257066.84375} {"train_loss": -11.415485382080078, "global_step": 231336, "epoch": 1377} {"train_loss": -11.249979019165039, "global_step": 231337, "epoch": 1377} {"train_loss": -10.899327278137207, "global_step": 231338, "epoch": 1377} {"train_loss": -11.237852096557617, "global_step": 231339, "epoch": 1377} {"train_loss": -11.467689514160156, "global_step": 231340, "epoch": 1377} {"train_loss": -11.549696922302246, "global_step": 231341, "epoch": 1377} {"train_loss": -11.601176261901855, "global_step": 231342, "epoch": 1377} {"train_loss": -11.541078567504883, "global_step": 231343, "epoch": 1377} {"train_loss": -11.350176811218262, "global_step": 231344, "epoch": 1377} {"train_loss": -11.096593856811523, "global_step": 231345, "epoch": 1377} {"train_loss": -11.106452941894531, "global_step": 231346, "epoch": 1377} {"train_loss": -11.466822624206543, "global_step": 231347, "epoch": 1377} {"train_loss": -11.49555778503418, "global_step": 231348, "epoch": 1377} {"train_loss": -11.25442123413086, "global_step": 231349, "epoch": 1377} {"train_loss": -11.550997734069824, "global_step": 231350, "epoch": 1377} {"train_loss": -11.367330551147461, "global_step": 231351, "epoch": 1377} {"train_loss": -11.300076484680176, "global_step": 231352, "epoch": 1377} {"train_loss": -11.617769241333008, "global_step": 231353, "epoch": 1377} {"train_loss": -11.179266929626465, "global_step": 231354, "epoch": 1377} {"train_loss": -11.889739990234375, "global_step": 231355, "epoch": 1377} {"train_loss": -11.5106201171875, "global_step": 231356, "epoch": 1377} {"train_loss": -11.666610717773438, "global_step": 231357, "epoch": 1377} {"train_loss": -11.247489929199219, "global_step": 231358, "epoch": 1377} {"train_loss": -11.418102264404297, "global_step": 231359, "epoch": 1377} {"train_loss": -11.281400680541992, "global_step": 231360, "epoch": 1377} {"train_loss": -11.397489547729492, "global_step": 231361, "epoch": 1377} {"train_loss": -11.789398193359375, "global_step": 231362, "epoch": 1377} {"train_loss": -11.103973388671875, "global_step": 231363, "epoch": 1377} {"train_loss": -11.573356628417969, "global_step": 231364, "epoch": 1377} {"train_loss": -11.544157028198242, "global_step": 231365, "epoch": 1377} {"train_loss": -11.298444747924805, "global_step": 231366, "epoch": 1377} {"train_loss": -11.620447158813477, "global_step": 231367, "epoch": 1377} {"train_loss": -11.084327697753906, "global_step": 231368, "epoch": 1377} {"train_loss": -11.506857872009277, "global_step": 231369, "epoch": 1377} {"train_loss": -10.398460388183594, "global_step": 231370, "epoch": 1377} {"train_loss": -11.313826560974121, "global_step": 231371, "epoch": 1377} {"train_loss": -11.309072494506836, "global_step": 231372, "epoch": 1377} {"train_loss": -10.886998176574707, "global_step": 231373, "epoch": 1377} {"train_loss": -10.858089447021484, "global_step": 231374, "epoch": 1377} {"train_loss": -11.425884246826172, "global_step": 231375, "epoch": 1377} {"train_loss": -11.235676765441895, "global_step": 231376, "epoch": 1377} {"train_loss": -11.213006973266602, "global_step": 231377, "epoch": 1377} {"train_loss": -11.601776123046875, "global_step": 231378, "epoch": 1377} {"train_loss": -10.862322807312012, "global_step": 231379, "epoch": 1377} {"train_loss": -11.704116821289062, "global_step": 231380, "epoch": 1377} {"train_loss": -11.335219383239746, "global_step": 231381, "epoch": 1377} {"train_loss": -11.299379348754883, "global_step": 231382, "epoch": 1377} {"train_loss": -11.344200134277344, "global_step": 231383, "epoch": 1377} {"train_loss": -11.20503044128418, "global_step": 231384, "epoch": 1377} {"train_loss": -10.972661972045898, "global_step": 231385, "epoch": 1377} {"train_loss": -11.380090713500977, "global_step": 231386, "epoch": 1377} {"train_loss": -10.5990571975708, "global_step": 231387, "epoch": 1377} {"train_loss": -11.486879348754883, "global_step": 231388, "epoch": 1377} {"train_loss": -11.202798843383789, "global_step": 231389, "epoch": 1377} {"train_loss": -11.044103622436523, "global_step": 231390, "epoch": 1377} {"train_loss": -11.26949405670166, "global_step": 231391, "epoch": 1377} {"train_loss": -10.386919021606445, "global_step": 231392, "epoch": 1377} {"train_loss": -11.263540267944336, "global_step": 231393, "epoch": 1377} {"train_loss": -10.967103958129883, "global_step": 231394, "epoch": 1377} {"train_loss": -10.731999397277832, "global_step": 231395, "epoch": 1377} {"train_loss": -11.8746976852417, "global_step": 231396, "epoch": 1377} {"train_loss": -10.765364646911621, "global_step": 231397, "epoch": 1377} {"train_loss": -11.729215621948242, "global_step": 231398, "epoch": 1377} {"train_loss": -11.231912612915039, "global_step": 231399, "epoch": 1377} {"train_loss": -11.512800216674805, "global_step": 231400, "epoch": 1377} {"train_loss": -11.064386367797852, "global_step": 231401, "epoch": 1377} {"train_loss": -11.306648254394531, "global_step": 231402, "epoch": 1377} {"train_loss": -11.290809631347656, "global_step": 231403, "epoch": 1377} {"train_loss": -11.524250030517578, "global_step": 231404, "epoch": 1377} {"train_loss": -11.655879020690918, "global_step": 231405, "epoch": 1377} {"train_loss": -11.536612510681152, "global_step": 231406, "epoch": 1377} {"train_loss": -11.726091384887695, "global_step": 231407, "epoch": 1377} {"train_loss": -11.403973579406738, "global_step": 231408, "epoch": 1377} {"train_loss": -11.681684494018555, "global_step": 231409, "epoch": 1377} {"train_loss": -11.817366600036621, "global_step": 231410, "epoch": 1377} {"train_loss": -11.743959426879883, "global_step": 231411, "epoch": 1377} {"train_loss": -11.800996780395508, "global_step": 231412, "epoch": 1377} {"train_loss": -11.724267959594727, "global_step": 231413, "epoch": 1377} {"train_loss": -11.652135848999023, "global_step": 231414, "epoch": 1377} {"train_loss": -11.894350051879883, "global_step": 231415, "epoch": 1377} {"train_loss": -11.779304504394531, "global_step": 231416, "epoch": 1377} {"train_loss": -11.80366325378418, "global_step": 231417, "epoch": 1377} {"train_loss": -11.659212112426758, "global_step": 231418, "epoch": 1377} {"train_loss": -11.853453636169434, "global_step": 231419, "epoch": 1377} {"train_loss": -11.893136024475098, "global_step": 231420, "epoch": 1377} {"train_loss": -11.847951889038086, "global_step": 231421, "epoch": 1377} {"train_loss": -11.772480010986328, "global_step": 231422, "epoch": 1377} {"train_loss": -11.759217262268066, "global_step": 231423, "epoch": 1377} {"train_loss": -11.850567817687988, "global_step": 231424, "epoch": 1377} {"train_loss": -11.744972229003906, "global_step": 231425, "epoch": 1377} {"train_loss": -12.097135543823242, "global_step": 231426, "epoch": 1377} {"train_loss": -11.858528137207031, "global_step": 231427, "epoch": 1377} {"train_loss": -11.895865440368652, "global_step": 231428, "epoch": 1377} {"train_loss": -11.858041763305664, "global_step": 231429, "epoch": 1377} {"train_loss": -11.880306243896484, "global_step": 231430, "epoch": 1377} {"train_loss": -11.865832328796387, "global_step": 231431, "epoch": 1377} {"train_loss": -12.033592224121094, "global_step": 231432, "epoch": 1377} {"train_loss": -11.997459411621094, "global_step": 231433, "epoch": 1377} {"train_loss": -11.813501358032227, "global_step": 231434, "epoch": 1377} {"train_loss": -11.810523986816406, "global_step": 231435, "epoch": 1377} {"train_loss": -11.894432067871094, "global_step": 231436, "epoch": 1377} {"train_loss": -11.476869583129883, "global_step": 231437, "epoch": 1377} {"train_loss": -11.962263107299805, "global_step": 231438, "epoch": 1377} {"train_loss": -11.573484420776367, "global_step": 231439, "epoch": 1377} {"train_loss": -11.812044143676758, "global_step": 231440, "epoch": 1377} {"train_loss": -11.814350128173828, "global_step": 231441, "epoch": 1377} {"train_loss": -11.928439140319824, "global_step": 231442, "epoch": 1377} {"train_loss": -11.956242561340332, "global_step": 231443, "epoch": 1377} {"train_loss": -11.887395858764648, "global_step": 231444, "epoch": 1377} {"train_loss": -11.816394805908203, "global_step": 231445, "epoch": 1377} {"train_loss": -11.749161720275879, "global_step": 231446, "epoch": 1377} {"train_loss": -11.7448148727417, "global_step": 231447, "epoch": 1377} {"train_loss": -12.045745849609375, "global_step": 231448, "epoch": 1377} {"train_loss": -11.719696044921875, "global_step": 231449, "epoch": 1377} {"train_loss": -11.677031517028809, "global_step": 231450, "epoch": 1377} {"train_loss": -12.12569808959961, "global_step": 231451, "epoch": 1377} {"train_loss": -11.826325416564941, "global_step": 231452, "epoch": 1377} {"train_loss": -11.513236999511719, "global_step": 231453, "epoch": 1377} {"train_loss": -11.812482833862305, "global_step": 231454, "epoch": 1377} {"train_loss": -11.794654846191406, "global_step": 231455, "epoch": 1377} {"train_loss": -11.34894847869873, "global_step": 231456, "epoch": 1377} {"train_loss": -11.823701858520508, "global_step": 231457, "epoch": 1377} {"train_loss": -11.8583345413208, "global_step": 231458, "epoch": 1377} {"train_loss": -11.702596664428711, "global_step": 231459, "epoch": 1377} {"train_loss": -11.21636962890625, "global_step": 231460, "epoch": 1377} {"train_loss": -11.115032196044922, "global_step": 231461, "epoch": 1377} {"train_loss": -11.53248119354248, "global_step": 231462, "epoch": 1377} {"train_loss": -11.378653526306152, "global_step": 231463, "epoch": 1377} {"train_loss": -10.70526123046875, "global_step": 231464, "epoch": 1377} {"train_loss": -11.81098747253418, "global_step": 231465, "epoch": 1377} {"train_loss": -11.223312377929688, "global_step": 231466, "epoch": 1377} {"train_loss": -11.066996574401855, "global_step": 231467, "epoch": 1377} {"train_loss": -11.099075317382812, "global_step": 231468, "epoch": 1377} {"train_loss": -11.552882194519043, "global_step": 231469, "epoch": 1377} {"train_loss": -10.778626441955566, "global_step": 231470, "epoch": 1377} {"train_loss": -11.138570785522461, "global_step": 231471, "epoch": 1377} {"train_loss": -11.77797794342041, "global_step": 231472, "epoch": 1377} {"train_loss": -10.846654891967773, "global_step": 231473, "epoch": 1377} {"train_loss": -11.17485237121582, "global_step": 231474, "epoch": 1377} {"train_loss": -11.478248596191406, "global_step": 231475, "epoch": 1377} {"train_loss": -11.534709930419922, "global_step": 231476, "epoch": 1377} {"train_loss": -11.042226791381836, "global_step": 231477, "epoch": 1377} {"train_loss": -11.200394630432129, "global_step": 231478, "epoch": 1377} {"train_loss": -11.461215019226074, "global_step": 231479, "epoch": 1377} {"train_loss": -11.538315773010254, "global_step": 231480, "epoch": 1377} {"train_loss": -11.358335494995117, "global_step": 231481, "epoch": 1377} {"train_loss": -11.2901029586792, "global_step": 231482, "epoch": 1377} {"train_loss": -11.502325057983398, "global_step": 231483, "epoch": 1377} {"train_loss": -11.41074275970459, "global_step": 231484, "epoch": 1377} {"train_loss": -11.398807525634766, "global_step": 231485, "epoch": 1377} {"train_loss": -11.328603744506836, "global_step": 231486, "epoch": 1377} {"train_loss": -10.693696975708008, "global_step": 231487, "epoch": 1377} {"train_loss": -11.437921524047852, "global_step": 231488, "epoch": 1377} {"train_loss": -11.582761764526367, "global_step": 231489, "epoch": 1377} {"train_loss": -11.392965316772461, "global_step": 231490, "epoch": 1377} {"train_loss": -11.449234008789062, "global_step": 231491, "epoch": 1377} {"train_loss": -11.171399116516113, "global_step": 231492, "epoch": 1377} {"train_loss": -11.144775390625, "global_step": 231493, "epoch": 1377} {"train_loss": -11.706621170043945, "global_step": 231494, "epoch": 1377} {"train_loss": -11.045578002929688, "global_step": 231495, "epoch": 1377} {"train_loss": -11.80653190612793, "global_step": 231496, "epoch": 1377} {"train_loss": -10.945855140686035, "global_step": 231497, "epoch": 1377} {"train_loss": -11.273368835449219, "global_step": 231498, "epoch": 1377} {"train_loss": -11.194986343383789, "global_step": 231499, "epoch": 1377} {"train_loss": -11.50655746459961, "global_step": 231500, "epoch": 1377} {"train_loss": -11.680591583251953, "global_step": 231501, "epoch": 1377} {"train_loss": -11.39015007019043, "global_step": 231502, "epoch": 1377} {"train_loss": -11.462463554881868, "global_step": 231503, "epoch": 1377, "val_loss": 265530.0625} {"train_loss": -11.328688621520996, "global_step": 231504, "epoch": 1378} {"train_loss": -10.935901641845703, "global_step": 231505, "epoch": 1378} {"train_loss": -11.267041206359863, "global_step": 231506, "epoch": 1378} {"train_loss": -11.520890235900879, "global_step": 231507, "epoch": 1378} {"train_loss": -11.58903980255127, "global_step": 231508, "epoch": 1378} {"train_loss": -11.537544250488281, "global_step": 231509, "epoch": 1378} {"train_loss": -11.223443984985352, "global_step": 231510, "epoch": 1378} {"train_loss": -11.634249687194824, "global_step": 231511, "epoch": 1378} {"train_loss": -11.405253410339355, "global_step": 231512, "epoch": 1378} {"train_loss": -11.540443420410156, "global_step": 231513, "epoch": 1378} {"train_loss": -11.553831100463867, "global_step": 231514, "epoch": 1378} {"train_loss": -11.362053871154785, "global_step": 231515, "epoch": 1378} {"train_loss": -11.692184448242188, "global_step": 231516, "epoch": 1378} {"train_loss": -11.594334602355957, "global_step": 231517, "epoch": 1378} {"train_loss": -11.62349796295166, "global_step": 231518, "epoch": 1378} {"train_loss": -11.19841194152832, "global_step": 231519, "epoch": 1378} {"train_loss": -11.529913902282715, "global_step": 231520, "epoch": 1378} {"train_loss": -11.72391128540039, "global_step": 231521, "epoch": 1378} {"train_loss": -11.93086051940918, "global_step": 231522, "epoch": 1378} {"train_loss": -11.58188533782959, "global_step": 231523, "epoch": 1378} {"train_loss": -11.994930267333984, "global_step": 231524, "epoch": 1378} {"train_loss": -11.581543922424316, "global_step": 231525, "epoch": 1378} {"train_loss": -11.669973373413086, "global_step": 231526, "epoch": 1378} {"train_loss": -11.139664649963379, "global_step": 231527, "epoch": 1378} {"train_loss": -11.712583541870117, "global_step": 231528, "epoch": 1378} {"train_loss": -11.642068862915039, "global_step": 231529, "epoch": 1378} {"train_loss": -11.262073516845703, "global_step": 231530, "epoch": 1378} {"train_loss": -11.68836784362793, "global_step": 231531, "epoch": 1378} {"train_loss": -11.712276458740234, "global_step": 231532, "epoch": 1378} {"train_loss": -11.440004348754883, "global_step": 231533, "epoch": 1378} {"train_loss": -11.723387718200684, "global_step": 231534, "epoch": 1378} {"train_loss": -11.463558197021484, "global_step": 231535, "epoch": 1378} {"train_loss": -11.543441772460938, "global_step": 231536, "epoch": 1378} {"train_loss": -11.447158813476562, "global_step": 231537, "epoch": 1378} {"train_loss": -10.918344497680664, "global_step": 231538, "epoch": 1378} {"train_loss": -10.808408737182617, "global_step": 231539, "epoch": 1378} {"train_loss": -11.88590145111084, "global_step": 231540, "epoch": 1378} {"train_loss": -10.917370796203613, "global_step": 231541, "epoch": 1378} {"train_loss": -11.230514526367188, "global_step": 231542, "epoch": 1378} {"train_loss": -10.407774925231934, "global_step": 231543, "epoch": 1378} {"train_loss": -11.34864616394043, "global_step": 231544, "epoch": 1378} {"train_loss": -10.89438247680664, "global_step": 231545, "epoch": 1378} {"train_loss": -11.403244018554688, "global_step": 231546, "epoch": 1378} {"train_loss": -11.27285385131836, "global_step": 231547, "epoch": 1378} {"train_loss": -11.592731475830078, "global_step": 231548, "epoch": 1378} {"train_loss": -10.878928184509277, "global_step": 231549, "epoch": 1378} {"train_loss": -10.311540603637695, "global_step": 231550, "epoch": 1378} {"train_loss": -11.109243392944336, "global_step": 231551, "epoch": 1378} {"train_loss": -10.839286804199219, "global_step": 231552, "epoch": 1378} {"train_loss": -10.666121482849121, "global_step": 231553, "epoch": 1378} {"train_loss": -10.315505981445312, "global_step": 231554, "epoch": 1378} {"train_loss": -11.089641571044922, "global_step": 231555, "epoch": 1378} {"train_loss": -10.640523910522461, "global_step": 231556, "epoch": 1378} {"train_loss": -10.721150398254395, "global_step": 231557, "epoch": 1378} {"train_loss": -10.793371200561523, "global_step": 231558, "epoch": 1378} {"train_loss": -10.510196685791016, "global_step": 231559, "epoch": 1378} {"train_loss": -9.961284637451172, "global_step": 231560, "epoch": 1378} {"train_loss": -11.12366008758545, "global_step": 231561, "epoch": 1378} {"train_loss": -10.724374771118164, "global_step": 231562, "epoch": 1378} {"train_loss": -10.876697540283203, "global_step": 231563, "epoch": 1378} {"train_loss": -11.076443672180176, "global_step": 231564, "epoch": 1378} {"train_loss": -10.986729621887207, "global_step": 231565, "epoch": 1378} {"train_loss": -10.939020156860352, "global_step": 231566, "epoch": 1378} {"train_loss": -11.148700714111328, "global_step": 231567, "epoch": 1378} {"train_loss": -11.33991527557373, "global_step": 231568, "epoch": 1378} {"train_loss": -11.34578800201416, "global_step": 231569, "epoch": 1378} {"train_loss": -11.613096237182617, "global_step": 231570, "epoch": 1378} {"train_loss": -11.095342636108398, "global_step": 231571, "epoch": 1378} {"train_loss": -11.761248588562012, "global_step": 231572, "epoch": 1378} {"train_loss": -11.153276443481445, "global_step": 231573, "epoch": 1378} {"train_loss": -11.480648040771484, "global_step": 231574, "epoch": 1378} {"train_loss": -11.593379974365234, "global_step": 231575, "epoch": 1378} {"train_loss": -11.268003463745117, "global_step": 231576, "epoch": 1378} {"train_loss": -11.409818649291992, "global_step": 231577, "epoch": 1378} {"train_loss": -11.708824157714844, "global_step": 231578, "epoch": 1378} {"train_loss": -11.414548873901367, "global_step": 231579, "epoch": 1378} {"train_loss": -11.628581047058105, "global_step": 231580, "epoch": 1378} {"train_loss": -11.679012298583984, "global_step": 231581, "epoch": 1378} {"train_loss": -11.3438138961792, "global_step": 231582, "epoch": 1378} {"train_loss": -11.487276077270508, "global_step": 231583, "epoch": 1378} {"train_loss": -11.437579154968262, "global_step": 231584, "epoch": 1378} {"train_loss": -11.525724411010742, "global_step": 231585, "epoch": 1378} {"train_loss": -11.677234649658203, "global_step": 231586, "epoch": 1378} {"train_loss": -11.530197143554688, "global_step": 231587, "epoch": 1378} {"train_loss": -11.626884460449219, "global_step": 231588, "epoch": 1378} {"train_loss": -11.89093017578125, "global_step": 231589, "epoch": 1378} {"train_loss": -11.739555358886719, "global_step": 231590, "epoch": 1378} {"train_loss": -11.606196403503418, "global_step": 231591, "epoch": 1378} {"train_loss": -12.066386222839355, "global_step": 231592, "epoch": 1378} {"train_loss": -11.75623607635498, "global_step": 231593, "epoch": 1378} {"train_loss": -11.760530471801758, "global_step": 231594, "epoch": 1378} {"train_loss": -11.891220092773438, "global_step": 231595, "epoch": 1378} {"train_loss": -11.930456161499023, "global_step": 231596, "epoch": 1378} {"train_loss": -11.821526527404785, "global_step": 231597, "epoch": 1378} {"train_loss": -12.048290252685547, "global_step": 231598, "epoch": 1378} {"train_loss": -11.733060836791992, "global_step": 231599, "epoch": 1378} {"train_loss": -11.885232925415039, "global_step": 231600, "epoch": 1378} {"train_loss": -11.913442611694336, "global_step": 231601, "epoch": 1378} {"train_loss": -11.808479309082031, "global_step": 231602, "epoch": 1378} {"train_loss": -11.8090181350708, "global_step": 231603, "epoch": 1378} {"train_loss": -11.763531684875488, "global_step": 231604, "epoch": 1378} {"train_loss": -11.846288681030273, "global_step": 231605, "epoch": 1378} {"train_loss": -12.056382179260254, "global_step": 231606, "epoch": 1378} {"train_loss": -11.865537643432617, "global_step": 231607, "epoch": 1378} {"train_loss": -12.08130168914795, "global_step": 231608, "epoch": 1378} {"train_loss": -11.848968505859375, "global_step": 231609, "epoch": 1378} {"train_loss": -11.870149612426758, "global_step": 231610, "epoch": 1378} {"train_loss": -12.030152320861816, "global_step": 231611, "epoch": 1378} {"train_loss": -12.01239013671875, "global_step": 231612, "epoch": 1378} {"train_loss": -11.818359375, "global_step": 231613, "epoch": 1378} {"train_loss": -11.814934730529785, "global_step": 231614, "epoch": 1378} {"train_loss": -11.847345352172852, "global_step": 231615, "epoch": 1378} {"train_loss": -11.920211791992188, "global_step": 231616, "epoch": 1378} {"train_loss": -11.99451732635498, "global_step": 231617, "epoch": 1378} {"train_loss": -11.79460334777832, "global_step": 231618, "epoch": 1378} {"train_loss": -11.923524856567383, "global_step": 231619, "epoch": 1378} {"train_loss": -11.960145950317383, "global_step": 231620, "epoch": 1378} {"train_loss": -12.235124588012695, "global_step": 231621, "epoch": 1378} {"train_loss": -11.944549560546875, "global_step": 231622, "epoch": 1378} {"train_loss": -11.674703598022461, "global_step": 231623, "epoch": 1378} {"train_loss": -11.608211517333984, "global_step": 231624, "epoch": 1378} {"train_loss": -11.867703437805176, "global_step": 231625, "epoch": 1378} {"train_loss": -11.986808776855469, "global_step": 231626, "epoch": 1378} {"train_loss": -11.616155624389648, "global_step": 231627, "epoch": 1378} {"train_loss": -11.59389877319336, "global_step": 231628, "epoch": 1378} {"train_loss": -11.786271095275879, "global_step": 231629, "epoch": 1378} {"train_loss": -11.468986511230469, "global_step": 231630, "epoch": 1378} {"train_loss": -10.825294494628906, "global_step": 231631, "epoch": 1378} {"train_loss": -10.924295425415039, "global_step": 231632, "epoch": 1378} {"train_loss": -11.38296127319336, "global_step": 231633, "epoch": 1378} {"train_loss": -10.580132484436035, "global_step": 231634, "epoch": 1378} {"train_loss": -11.751594543457031, "global_step": 231635, "epoch": 1378} {"train_loss": -11.21107292175293, "global_step": 231636, "epoch": 1378} {"train_loss": -11.652666091918945, "global_step": 231637, "epoch": 1378} {"train_loss": -11.47288703918457, "global_step": 231638, "epoch": 1378} {"train_loss": -11.630120277404785, "global_step": 231639, "epoch": 1378} {"train_loss": -11.322982788085938, "global_step": 231640, "epoch": 1378} {"train_loss": -11.501066207885742, "global_step": 231641, "epoch": 1378} {"train_loss": -11.371644973754883, "global_step": 231642, "epoch": 1378} {"train_loss": -11.762248992919922, "global_step": 231643, "epoch": 1378} {"train_loss": -11.549247741699219, "global_step": 231644, "epoch": 1378} {"train_loss": -11.794909477233887, "global_step": 231645, "epoch": 1378} {"train_loss": -11.652986526489258, "global_step": 231646, "epoch": 1378} {"train_loss": -11.558785438537598, "global_step": 231647, "epoch": 1378} {"train_loss": -11.776613235473633, "global_step": 231648, "epoch": 1378} {"train_loss": -11.44240665435791, "global_step": 231649, "epoch": 1378} {"train_loss": -10.956363677978516, "global_step": 231650, "epoch": 1378} {"train_loss": -11.473966598510742, "global_step": 231651, "epoch": 1378} {"train_loss": -11.442012786865234, "global_step": 231652, "epoch": 1378} {"train_loss": -10.773676872253418, "global_step": 231653, "epoch": 1378} {"train_loss": -11.200607299804688, "global_step": 231654, "epoch": 1378} {"train_loss": -11.167564392089844, "global_step": 231655, "epoch": 1378} {"train_loss": -10.80556869506836, "global_step": 231656, "epoch": 1378} {"train_loss": -11.439252853393555, "global_step": 231657, "epoch": 1378} {"train_loss": -10.851154327392578, "global_step": 231658, "epoch": 1378} {"train_loss": -11.760726928710938, "global_step": 231659, "epoch": 1378} {"train_loss": -10.666412353515625, "global_step": 231660, "epoch": 1378} {"train_loss": -11.576687812805176, "global_step": 231661, "epoch": 1378} {"train_loss": -10.75417709350586, "global_step": 231662, "epoch": 1378} {"train_loss": -10.8551607131958, "global_step": 231663, "epoch": 1378} {"train_loss": -10.89702320098877, "global_step": 231664, "epoch": 1378} {"train_loss": -11.276752471923828, "global_step": 231665, "epoch": 1378} {"train_loss": -11.020099639892578, "global_step": 231666, "epoch": 1378} {"train_loss": -11.39068603515625, "global_step": 231667, "epoch": 1378} {"train_loss": -10.806255340576172, "global_step": 231668, "epoch": 1378} {"train_loss": -11.367862701416016, "global_step": 231669, "epoch": 1378} {"train_loss": -11.376216888427734, "global_step": 231670, "epoch": 1378} {"train_loss": -11.431238089288984, "global_step": 231671, "epoch": 1378, "val_loss": 263587.0} {"train_loss": -11.553470611572266, "global_step": 231672, "epoch": 1379} {"train_loss": -10.73565673828125, "global_step": 231673, "epoch": 1379} {"train_loss": -11.507501602172852, "global_step": 231674, "epoch": 1379} {"train_loss": -10.186484336853027, "global_step": 231675, "epoch": 1379} {"train_loss": -11.467556953430176, "global_step": 231676, "epoch": 1379} {"train_loss": -10.709089279174805, "global_step": 231677, "epoch": 1379} {"train_loss": -11.127164840698242, "global_step": 231678, "epoch": 1379} {"train_loss": -10.659599304199219, "global_step": 231679, "epoch": 1379} {"train_loss": -10.744958877563477, "global_step": 231680, "epoch": 1379} {"train_loss": -10.531856536865234, "global_step": 231681, "epoch": 1379} {"train_loss": -11.105744361877441, "global_step": 231682, "epoch": 1379} {"train_loss": -11.308218955993652, "global_step": 231683, "epoch": 1379} {"train_loss": -11.363276481628418, "global_step": 231684, "epoch": 1379} {"train_loss": -11.523139953613281, "global_step": 231685, "epoch": 1379} {"train_loss": -10.88420295715332, "global_step": 231686, "epoch": 1379} {"train_loss": -11.632893562316895, "global_step": 231687, "epoch": 1379} {"train_loss": -11.221022605895996, "global_step": 231688, "epoch": 1379} {"train_loss": -11.445425987243652, "global_step": 231689, "epoch": 1379} {"train_loss": -11.501834869384766, "global_step": 231690, "epoch": 1379} {"train_loss": -10.958414077758789, "global_step": 231691, "epoch": 1379} {"train_loss": -11.566073417663574, "global_step": 231692, "epoch": 1379} {"train_loss": -11.001351356506348, "global_step": 231693, "epoch": 1379} {"train_loss": -11.55263900756836, "global_step": 231694, "epoch": 1379} {"train_loss": -11.320048332214355, "global_step": 231695, "epoch": 1379} {"train_loss": -11.56192398071289, "global_step": 231696, "epoch": 1379} {"train_loss": -11.174854278564453, "global_step": 231697, "epoch": 1379} {"train_loss": -11.576769828796387, "global_step": 231698, "epoch": 1379} {"train_loss": -11.173115730285645, "global_step": 231699, "epoch": 1379} {"train_loss": -11.536117553710938, "global_step": 231700, "epoch": 1379} {"train_loss": -11.67667007446289, "global_step": 231701, "epoch": 1379} {"train_loss": -11.714252471923828, "global_step": 231702, "epoch": 1379} {"train_loss": -11.54697036743164, "global_step": 231703, "epoch": 1379} {"train_loss": -11.82442855834961, "global_step": 231704, "epoch": 1379} {"train_loss": -11.478693008422852, "global_step": 231705, "epoch": 1379} {"train_loss": -11.748575210571289, "global_step": 231706, "epoch": 1379} {"train_loss": -11.61867904663086, "global_step": 231707, "epoch": 1379} {"train_loss": -11.594549179077148, "global_step": 231708, "epoch": 1379} {"train_loss": -11.693419456481934, "global_step": 231709, "epoch": 1379} {"train_loss": -11.698450088500977, "global_step": 231710, "epoch": 1379} {"train_loss": -11.883783340454102, "global_step": 231711, "epoch": 1379} {"train_loss": -11.749473571777344, "global_step": 231712, "epoch": 1379} {"train_loss": -11.773920059204102, "global_step": 231713, "epoch": 1379} {"train_loss": -11.847301483154297, "global_step": 231714, "epoch": 1379} {"train_loss": -11.902883529663086, "global_step": 231715, "epoch": 1379} {"train_loss": -11.99658203125, "global_step": 231716, "epoch": 1379} {"train_loss": -11.842672348022461, "global_step": 231717, "epoch": 1379} {"train_loss": -11.74399185180664, "global_step": 231718, "epoch": 1379} {"train_loss": -11.814937591552734, "global_step": 231719, "epoch": 1379} {"train_loss": -11.756462097167969, "global_step": 231720, "epoch": 1379} {"train_loss": -11.979061126708984, "global_step": 231721, "epoch": 1379} {"train_loss": -11.9237060546875, "global_step": 231722, "epoch": 1379} {"train_loss": -11.923452377319336, "global_step": 231723, "epoch": 1379} {"train_loss": -11.987247467041016, "global_step": 231724, "epoch": 1379} {"train_loss": -11.869217872619629, "global_step": 231725, "epoch": 1379} {"train_loss": -11.755973815917969, "global_step": 231726, "epoch": 1379} {"train_loss": -12.098968505859375, "global_step": 231727, "epoch": 1379} {"train_loss": -12.017196655273438, "global_step": 231728, "epoch": 1379} {"train_loss": -11.863065719604492, "global_step": 231729, "epoch": 1379} {"train_loss": -11.962775230407715, "global_step": 231730, "epoch": 1379} {"train_loss": -12.028295516967773, "global_step": 231731, "epoch": 1379} {"train_loss": -11.98998737335205, "global_step": 231732, "epoch": 1379} {"train_loss": -11.896295547485352, "global_step": 231733, "epoch": 1379} {"train_loss": -11.930380821228027, "global_step": 231734, "epoch": 1379} {"train_loss": -11.908625602722168, "global_step": 231735, "epoch": 1379} {"train_loss": -12.154298782348633, "global_step": 231736, "epoch": 1379} {"train_loss": -12.060809135437012, "global_step": 231737, "epoch": 1379} {"train_loss": -12.149227142333984, "global_step": 231738, "epoch": 1379} {"train_loss": -12.108400344848633, "global_step": 231739, "epoch": 1379} {"train_loss": -11.982717514038086, "global_step": 231740, "epoch": 1379} {"train_loss": -12.063647270202637, "global_step": 231741, "epoch": 1379} {"train_loss": -11.956766128540039, "global_step": 231742, "epoch": 1379} {"train_loss": -11.81352710723877, "global_step": 231743, "epoch": 1379} {"train_loss": -12.076961517333984, "global_step": 231744, "epoch": 1379} {"train_loss": -12.046920776367188, "global_step": 231745, "epoch": 1379} {"train_loss": -11.54974365234375, "global_step": 231746, "epoch": 1379} {"train_loss": -11.176669120788574, "global_step": 231747, "epoch": 1379} {"train_loss": -11.918072700500488, "global_step": 231748, "epoch": 1379} {"train_loss": -10.891363143920898, "global_step": 231749, "epoch": 1379} {"train_loss": -11.525087356567383, "global_step": 231750, "epoch": 1379} {"train_loss": -11.841522216796875, "global_step": 231751, "epoch": 1379} {"train_loss": -11.371978759765625, "global_step": 231752, "epoch": 1379} {"train_loss": -11.653215408325195, "global_step": 231753, "epoch": 1379} {"train_loss": -11.392953872680664, "global_step": 231754, "epoch": 1379} {"train_loss": -11.77742862701416, "global_step": 231755, "epoch": 1379} {"train_loss": -12.004060745239258, "global_step": 231756, "epoch": 1379} {"train_loss": -11.955933570861816, "global_step": 231757, "epoch": 1379} {"train_loss": -11.35651969909668, "global_step": 231758, "epoch": 1379} {"train_loss": -11.272850036621094, "global_step": 231759, "epoch": 1379} {"train_loss": -11.456275939941406, "global_step": 231760, "epoch": 1379} {"train_loss": -11.303176879882812, "global_step": 231761, "epoch": 1379} {"train_loss": -11.779117584228516, "global_step": 231762, "epoch": 1379} {"train_loss": -10.619060516357422, "global_step": 231763, "epoch": 1379} {"train_loss": -10.341693878173828, "global_step": 231764, "epoch": 1379} {"train_loss": -10.654476165771484, "global_step": 231765, "epoch": 1379} {"train_loss": -11.841021537780762, "global_step": 231766, "epoch": 1379} {"train_loss": -10.519472122192383, "global_step": 231767, "epoch": 1379} {"train_loss": -10.462714195251465, "global_step": 231768, "epoch": 1379} {"train_loss": -10.869280815124512, "global_step": 231769, "epoch": 1379} {"train_loss": -10.83362865447998, "global_step": 231770, "epoch": 1379} {"train_loss": -11.04366683959961, "global_step": 231771, "epoch": 1379} {"train_loss": -11.18567943572998, "global_step": 231772, "epoch": 1379} {"train_loss": -10.805231094360352, "global_step": 231773, "epoch": 1379} {"train_loss": -11.407596588134766, "global_step": 231774, "epoch": 1379} {"train_loss": -10.861019134521484, "global_step": 231775, "epoch": 1379} {"train_loss": -11.425531387329102, "global_step": 231776, "epoch": 1379} {"train_loss": -11.296862602233887, "global_step": 231777, "epoch": 1379} {"train_loss": -11.763050079345703, "global_step": 231778, "epoch": 1379} {"train_loss": -11.867526054382324, "global_step": 231779, "epoch": 1379} {"train_loss": -11.274171829223633, "global_step": 231780, "epoch": 1379} {"train_loss": -11.883088111877441, "global_step": 231781, "epoch": 1379} {"train_loss": -11.822393417358398, "global_step": 231782, "epoch": 1379} {"train_loss": -11.580293655395508, "global_step": 231783, "epoch": 1379} {"train_loss": -11.443710327148438, "global_step": 231784, "epoch": 1379} {"train_loss": -11.47408676147461, "global_step": 231785, "epoch": 1379} {"train_loss": -11.536029815673828, "global_step": 231786, "epoch": 1379} {"train_loss": -11.291431427001953, "global_step": 231787, "epoch": 1379} {"train_loss": -10.958453178405762, "global_step": 231788, "epoch": 1379} {"train_loss": -11.490469932556152, "global_step": 231789, "epoch": 1379} {"train_loss": -11.422285079956055, "global_step": 231790, "epoch": 1379} {"train_loss": -11.731409072875977, "global_step": 231791, "epoch": 1379} {"train_loss": -11.094618797302246, "global_step": 231792, "epoch": 1379} {"train_loss": -11.525445938110352, "global_step": 231793, "epoch": 1379} {"train_loss": -11.368170738220215, "global_step": 231794, "epoch": 1379} {"train_loss": -11.29969310760498, "global_step": 231795, "epoch": 1379} {"train_loss": -11.70220947265625, "global_step": 231796, "epoch": 1379} {"train_loss": -11.260808944702148, "global_step": 231797, "epoch": 1379} {"train_loss": -11.540227890014648, "global_step": 231798, "epoch": 1379} {"train_loss": -11.294536590576172, "global_step": 231799, "epoch": 1379} {"train_loss": -11.227872848510742, "global_step": 231800, "epoch": 1379} {"train_loss": -11.626754760742188, "global_step": 231801, "epoch": 1379} {"train_loss": -11.467123031616211, "global_step": 231802, "epoch": 1379} {"train_loss": -11.647604942321777, "global_step": 231803, "epoch": 1379} {"train_loss": -11.422832489013672, "global_step": 231804, "epoch": 1379} {"train_loss": -11.035015106201172, "global_step": 231805, "epoch": 1379} {"train_loss": -11.46220588684082, "global_step": 231806, "epoch": 1379} {"train_loss": -11.620689392089844, "global_step": 231807, "epoch": 1379} {"train_loss": -11.61206340789795, "global_step": 231808, "epoch": 1379} {"train_loss": -11.515426635742188, "global_step": 231809, "epoch": 1379} {"train_loss": -11.571473121643066, "global_step": 231810, "epoch": 1379} {"train_loss": -11.722366333007812, "global_step": 231811, "epoch": 1379} {"train_loss": -11.44240951538086, "global_step": 231812, "epoch": 1379} {"train_loss": -11.713520050048828, "global_step": 231813, "epoch": 1379} {"train_loss": -11.749853134155273, "global_step": 231814, "epoch": 1379} {"train_loss": -11.668540000915527, "global_step": 231815, "epoch": 1379} {"train_loss": -11.701030731201172, "global_step": 231816, "epoch": 1379} {"train_loss": -11.697763442993164, "global_step": 231817, "epoch": 1379} {"train_loss": -11.558069229125977, "global_step": 231818, "epoch": 1379} {"train_loss": -11.883176803588867, "global_step": 231819, "epoch": 1379} {"train_loss": -11.551260948181152, "global_step": 231820, "epoch": 1379} {"train_loss": -11.764485359191895, "global_step": 231821, "epoch": 1379} {"train_loss": -11.766679763793945, "global_step": 231822, "epoch": 1379} {"train_loss": -11.647748947143555, "global_step": 231823, "epoch": 1379} {"train_loss": -11.516868591308594, "global_step": 231824, "epoch": 1379} {"train_loss": -11.530328750610352, "global_step": 231825, "epoch": 1379} {"train_loss": -11.793869018554688, "global_step": 231826, "epoch": 1379} {"train_loss": -11.448323249816895, "global_step": 231827, "epoch": 1379} {"train_loss": -12.113426208496094, "global_step": 231828, "epoch": 1379} {"train_loss": -11.615558624267578, "global_step": 231829, "epoch": 1379} {"train_loss": -11.940881729125977, "global_step": 231830, "epoch": 1379} {"train_loss": -11.809566497802734, "global_step": 231831, "epoch": 1379} {"train_loss": -11.450843811035156, "global_step": 231832, "epoch": 1379} {"train_loss": -11.887702941894531, "global_step": 231833, "epoch": 1379} {"train_loss": -11.845805168151855, "global_step": 231834, "epoch": 1379} {"train_loss": -11.860790252685547, "global_step": 231835, "epoch": 1379} {"train_loss": -11.552149772644043, "global_step": 231836, "epoch": 1379} {"train_loss": -11.90451717376709, "global_step": 231837, "epoch": 1379} {"train_loss": -11.74281120300293, "global_step": 231838, "epoch": 1379} {"train_loss": -11.534658210618156, "global_step": 231839, "epoch": 1379, "val_loss": 263958.875} {"train_loss": -11.746854782104492, "global_step": 231840, "epoch": 1380} {"train_loss": -11.732431411743164, "global_step": 231841, "epoch": 1380} {"train_loss": -11.609375953674316, "global_step": 231842, "epoch": 1380} {"train_loss": -11.567574501037598, "global_step": 231843, "epoch": 1380} {"train_loss": -12.022441864013672, "global_step": 231844, "epoch": 1380} {"train_loss": -11.776376724243164, "global_step": 231845, "epoch": 1380} {"train_loss": -11.50655746459961, "global_step": 231846, "epoch": 1380} {"train_loss": -11.705568313598633, "global_step": 231847, "epoch": 1380} {"train_loss": -11.748111724853516, "global_step": 231848, "epoch": 1380} {"train_loss": -11.680025100708008, "global_step": 231849, "epoch": 1380} {"train_loss": -10.753751754760742, "global_step": 231850, "epoch": 1380} {"train_loss": -11.873296737670898, "global_step": 231851, "epoch": 1380} {"train_loss": -11.56408405303955, "global_step": 231852, "epoch": 1380} {"train_loss": -11.387273788452148, "global_step": 231853, "epoch": 1380} {"train_loss": -10.939825057983398, "global_step": 231854, "epoch": 1380} {"train_loss": -11.466449737548828, "global_step": 231855, "epoch": 1380} {"train_loss": -11.802437782287598, "global_step": 231856, "epoch": 1380} {"train_loss": -10.966550827026367, "global_step": 231857, "epoch": 1380} {"train_loss": -11.563403129577637, "global_step": 231858, "epoch": 1380} {"train_loss": -12.001307487487793, "global_step": 231859, "epoch": 1380} {"train_loss": -10.57119083404541, "global_step": 231860, "epoch": 1380} {"train_loss": -10.057655334472656, "global_step": 231861, "epoch": 1380} {"train_loss": -11.145153045654297, "global_step": 231862, "epoch": 1380} {"train_loss": -9.736078262329102, "global_step": 231863, "epoch": 1380} {"train_loss": -11.074067115783691, "global_step": 231864, "epoch": 1380} {"train_loss": -10.741997718811035, "global_step": 231865, "epoch": 1380} {"train_loss": -10.047687530517578, "global_step": 231866, "epoch": 1380} {"train_loss": -11.475896835327148, "global_step": 231867, "epoch": 1380} {"train_loss": -11.241436958312988, "global_step": 231868, "epoch": 1380} {"train_loss": -11.497737884521484, "global_step": 231869, "epoch": 1380} {"train_loss": -11.18930721282959, "global_step": 231870, "epoch": 1380} {"train_loss": -11.329297065734863, "global_step": 231871, "epoch": 1380} {"train_loss": -11.177423477172852, "global_step": 231872, "epoch": 1380} {"train_loss": -10.857271194458008, "global_step": 231873, "epoch": 1380} {"train_loss": -10.93790054321289, "global_step": 231874, "epoch": 1380} {"train_loss": -11.174222946166992, "global_step": 231875, "epoch": 1380} {"train_loss": -11.021106719970703, "global_step": 231876, "epoch": 1380} {"train_loss": -11.314568519592285, "global_step": 231877, "epoch": 1380} {"train_loss": -11.118074417114258, "global_step": 231878, "epoch": 1380} {"train_loss": -11.569091796875, "global_step": 231879, "epoch": 1380} {"train_loss": -11.05738639831543, "global_step": 231880, "epoch": 1380} {"train_loss": -10.873861312866211, "global_step": 231881, "epoch": 1380} {"train_loss": -11.20415210723877, "global_step": 231882, "epoch": 1380} {"train_loss": -11.217301368713379, "global_step": 231883, "epoch": 1380} {"train_loss": -10.845159530639648, "global_step": 231884, "epoch": 1380} {"train_loss": -10.985151290893555, "global_step": 231885, "epoch": 1380} {"train_loss": -10.806432723999023, "global_step": 231886, "epoch": 1380} {"train_loss": -11.066728591918945, "global_step": 231887, "epoch": 1380} {"train_loss": -10.711173057556152, "global_step": 231888, "epoch": 1380} {"train_loss": -10.857952117919922, "global_step": 231889, "epoch": 1380} {"train_loss": -10.632144927978516, "global_step": 231890, "epoch": 1380} {"train_loss": -10.660652160644531, "global_step": 231891, "epoch": 1380} {"train_loss": -11.137860298156738, "global_step": 231892, "epoch": 1380} {"train_loss": -10.389242172241211, "global_step": 231893, "epoch": 1380} {"train_loss": -11.772232055664062, "global_step": 231894, "epoch": 1380} {"train_loss": -10.59559154510498, "global_step": 231895, "epoch": 1380} {"train_loss": -11.230823516845703, "global_step": 231896, "epoch": 1380} {"train_loss": -11.038246154785156, "global_step": 231897, "epoch": 1380} {"train_loss": -11.284095764160156, "global_step": 231898, "epoch": 1380} {"train_loss": -10.938735961914062, "global_step": 231899, "epoch": 1380} {"train_loss": -11.351460456848145, "global_step": 231900, "epoch": 1380} {"train_loss": -11.25523853302002, "global_step": 231901, "epoch": 1380} {"train_loss": -11.668563842773438, "global_step": 231902, "epoch": 1380} {"train_loss": -11.076308250427246, "global_step": 231903, "epoch": 1380} {"train_loss": -11.484134674072266, "global_step": 231904, "epoch": 1380} {"train_loss": -11.216521263122559, "global_step": 231905, "epoch": 1380} {"train_loss": -11.195135116577148, "global_step": 231906, "epoch": 1380} {"train_loss": -11.572273254394531, "global_step": 231907, "epoch": 1380} {"train_loss": -11.277534484863281, "global_step": 231908, "epoch": 1380} {"train_loss": -11.417756080627441, "global_step": 231909, "epoch": 1380} {"train_loss": -11.187335968017578, "global_step": 231910, "epoch": 1380} {"train_loss": -11.462738990783691, "global_step": 231911, "epoch": 1380} {"train_loss": -11.473472595214844, "global_step": 231912, "epoch": 1380} {"train_loss": -11.699847221374512, "global_step": 231913, "epoch": 1380} {"train_loss": -11.459071159362793, "global_step": 231914, "epoch": 1380} {"train_loss": -11.68906307220459, "global_step": 231915, "epoch": 1380} {"train_loss": -11.291952133178711, "global_step": 231916, "epoch": 1380} {"train_loss": -11.530710220336914, "global_step": 231917, "epoch": 1380} {"train_loss": -11.483529090881348, "global_step": 231918, "epoch": 1380} {"train_loss": -11.379386901855469, "global_step": 231919, "epoch": 1380} {"train_loss": -11.269172668457031, "global_step": 231920, "epoch": 1380} {"train_loss": -11.427152633666992, "global_step": 231921, "epoch": 1380} {"train_loss": -11.573872566223145, "global_step": 231922, "epoch": 1380} {"train_loss": -11.611404418945312, "global_step": 231923, "epoch": 1380} {"train_loss": -11.63878059387207, "global_step": 231924, "epoch": 1380} {"train_loss": -11.661792755126953, "global_step": 231925, "epoch": 1380} {"train_loss": -11.395730972290039, "global_step": 231926, "epoch": 1380} {"train_loss": -11.580218315124512, "global_step": 231927, "epoch": 1380} {"train_loss": -11.574581146240234, "global_step": 231928, "epoch": 1380} {"train_loss": -11.632465362548828, "global_step": 231929, "epoch": 1380} {"train_loss": -11.85621452331543, "global_step": 231930, "epoch": 1380} {"train_loss": -11.707088470458984, "global_step": 231931, "epoch": 1380} {"train_loss": -11.813591003417969, "global_step": 231932, "epoch": 1380} {"train_loss": -11.731093406677246, "global_step": 231933, "epoch": 1380} {"train_loss": -11.816469192504883, "global_step": 231934, "epoch": 1380} {"train_loss": -11.724347114562988, "global_step": 231935, "epoch": 1380} {"train_loss": -11.750843048095703, "global_step": 231936, "epoch": 1380} {"train_loss": -11.787967681884766, "global_step": 231937, "epoch": 1380} {"train_loss": -11.797173500061035, "global_step": 231938, "epoch": 1380} {"train_loss": -11.879850387573242, "global_step": 231939, "epoch": 1380} {"train_loss": -11.917423248291016, "global_step": 231940, "epoch": 1380} {"train_loss": -11.815027236938477, "global_step": 231941, "epoch": 1380} {"train_loss": -11.749635696411133, "global_step": 231942, "epoch": 1380} {"train_loss": -11.818464279174805, "global_step": 231943, "epoch": 1380} {"train_loss": -11.833985328674316, "global_step": 231944, "epoch": 1380} {"train_loss": -11.821796417236328, "global_step": 231945, "epoch": 1380} {"train_loss": -11.70810604095459, "global_step": 231946, "epoch": 1380} {"train_loss": -11.795116424560547, "global_step": 231947, "epoch": 1380} {"train_loss": -11.937131881713867, "global_step": 231948, "epoch": 1380} {"train_loss": -11.763887405395508, "global_step": 231949, "epoch": 1380} {"train_loss": -11.957422256469727, "global_step": 231950, "epoch": 1380} {"train_loss": -12.038973808288574, "global_step": 231951, "epoch": 1380} {"train_loss": -11.825748443603516, "global_step": 231952, "epoch": 1380} {"train_loss": -11.892106056213379, "global_step": 231953, "epoch": 1380} {"train_loss": -12.09588623046875, "global_step": 231954, "epoch": 1380} {"train_loss": -12.067150115966797, "global_step": 231955, "epoch": 1380} {"train_loss": -11.776305198669434, "global_step": 231956, "epoch": 1380} {"train_loss": -12.013465881347656, "global_step": 231957, "epoch": 1380} {"train_loss": -11.838682174682617, "global_step": 231958, "epoch": 1380} {"train_loss": -11.811503410339355, "global_step": 231959, "epoch": 1380} {"train_loss": -11.71429443359375, "global_step": 231960, "epoch": 1380} {"train_loss": -11.886393547058105, "global_step": 231961, "epoch": 1380} {"train_loss": -11.646956443786621, "global_step": 231962, "epoch": 1380} {"train_loss": -11.79020881652832, "global_step": 231963, "epoch": 1380} {"train_loss": -11.91798210144043, "global_step": 231964, "epoch": 1380} {"train_loss": -12.1646146774292, "global_step": 231965, "epoch": 1380} {"train_loss": -11.794612884521484, "global_step": 231966, "epoch": 1380} {"train_loss": -11.668853759765625, "global_step": 231967, "epoch": 1380} {"train_loss": -11.86640739440918, "global_step": 231968, "epoch": 1380} {"train_loss": -11.890254974365234, "global_step": 231969, "epoch": 1380} {"train_loss": -11.432886123657227, "global_step": 231970, "epoch": 1380} {"train_loss": -11.73151969909668, "global_step": 231971, "epoch": 1380} {"train_loss": -11.829367637634277, "global_step": 231972, "epoch": 1380} {"train_loss": -11.426908493041992, "global_step": 231973, "epoch": 1380} {"train_loss": -11.337685585021973, "global_step": 231974, "epoch": 1380} {"train_loss": -11.822571754455566, "global_step": 231975, "epoch": 1380} {"train_loss": -11.945136070251465, "global_step": 231976, "epoch": 1380} {"train_loss": -11.956226348876953, "global_step": 231977, "epoch": 1380} {"train_loss": -11.887543678283691, "global_step": 231978, "epoch": 1380} {"train_loss": -11.5904541015625, "global_step": 231979, "epoch": 1380} {"train_loss": -11.81037712097168, "global_step": 231980, "epoch": 1380} {"train_loss": -11.814339637756348, "global_step": 231981, "epoch": 1380} {"train_loss": -11.207239151000977, "global_step": 231982, "epoch": 1380} {"train_loss": -11.312239646911621, "global_step": 231983, "epoch": 1380} {"train_loss": -11.276016235351562, "global_step": 231984, "epoch": 1380} {"train_loss": -11.36130142211914, "global_step": 231985, "epoch": 1380} {"train_loss": -10.00304126739502, "global_step": 231986, "epoch": 1380} {"train_loss": -11.581433296203613, "global_step": 231987, "epoch": 1380} {"train_loss": -10.49119758605957, "global_step": 231988, "epoch": 1380} {"train_loss": -11.510920524597168, "global_step": 231989, "epoch": 1380} {"train_loss": -10.746356964111328, "global_step": 231990, "epoch": 1380} {"train_loss": -10.989168167114258, "global_step": 231991, "epoch": 1380} {"train_loss": -9.87072467803955, "global_step": 231992, "epoch": 1380} {"train_loss": -10.72579288482666, "global_step": 231993, "epoch": 1380} {"train_loss": -11.353485107421875, "global_step": 231994, "epoch": 1380} {"train_loss": -11.008355140686035, "global_step": 231995, "epoch": 1380} {"train_loss": -11.569067001342773, "global_step": 231996, "epoch": 1380} {"train_loss": -10.745320320129395, "global_step": 231997, "epoch": 1380} {"train_loss": -11.37478256225586, "global_step": 231998, "epoch": 1380} {"train_loss": -10.44782829284668, "global_step": 231999, "epoch": 1380} {"train_loss": -11.270818710327148, "global_step": 232000, "epoch": 1380} {"train_loss": -11.359634399414062, "global_step": 232001, "epoch": 1380} {"train_loss": -11.154085159301758, "global_step": 232002, "epoch": 1380} {"train_loss": -10.858940124511719, "global_step": 232003, "epoch": 1380} {"train_loss": -11.091047286987305, "global_step": 232004, "epoch": 1380} {"train_loss": -11.425788879394531, "global_step": 232005, "epoch": 1380} {"train_loss": -10.955743789672852, "global_step": 232006, "epoch": 1380} {"train_loss": -11.395471975916909, "global_step": 232007, "epoch": 1380, "val_loss": 263540.0625, "train_action_mse_error": 1.73850679397583} {"train_loss": -10.79797077178955, "global_step": 232008, "epoch": 1381} {"train_loss": -11.114462852478027, "global_step": 232009, "epoch": 1381} {"train_loss": -10.592494010925293, "global_step": 232010, "epoch": 1381} {"train_loss": -10.426448822021484, "global_step": 232011, "epoch": 1381} {"train_loss": -10.403029441833496, "global_step": 232012, "epoch": 1381} {"train_loss": -10.142354965209961, "global_step": 232013, "epoch": 1381} {"train_loss": -10.95595932006836, "global_step": 232014, "epoch": 1381} {"train_loss": -9.71925163269043, "global_step": 232015, "epoch": 1381} {"train_loss": -10.892362594604492, "global_step": 232016, "epoch": 1381} {"train_loss": -10.291143417358398, "global_step": 232017, "epoch": 1381} {"train_loss": -11.129343032836914, "global_step": 232018, "epoch": 1381} {"train_loss": -10.453097343444824, "global_step": 232019, "epoch": 1381} {"train_loss": -11.096673965454102, "global_step": 232020, "epoch": 1381} {"train_loss": -10.826215744018555, "global_step": 232021, "epoch": 1381} {"train_loss": -11.247879028320312, "global_step": 232022, "epoch": 1381} {"train_loss": -11.094277381896973, "global_step": 232023, "epoch": 1381} {"train_loss": -11.168712615966797, "global_step": 232024, "epoch": 1381} {"train_loss": -10.494413375854492, "global_step": 232025, "epoch": 1381} {"train_loss": -11.405611038208008, "global_step": 232026, "epoch": 1381} {"train_loss": -10.685070037841797, "global_step": 232027, "epoch": 1381} {"train_loss": -10.915024757385254, "global_step": 232028, "epoch": 1381} {"train_loss": -11.17935562133789, "global_step": 232029, "epoch": 1381} {"train_loss": -11.283102035522461, "global_step": 232030, "epoch": 1381} {"train_loss": -11.522916793823242, "global_step": 232031, "epoch": 1381} {"train_loss": -11.122137069702148, "global_step": 232032, "epoch": 1381} {"train_loss": -11.486576080322266, "global_step": 232033, "epoch": 1381} {"train_loss": -11.431516647338867, "global_step": 232034, "epoch": 1381} {"train_loss": -11.517267227172852, "global_step": 232035, "epoch": 1381} {"train_loss": -11.468206405639648, "global_step": 232036, "epoch": 1381} {"train_loss": -11.410250663757324, "global_step": 232037, "epoch": 1381} {"train_loss": -11.533397674560547, "global_step": 232038, "epoch": 1381} {"train_loss": -11.794400215148926, "global_step": 232039, "epoch": 1381} {"train_loss": -11.546575546264648, "global_step": 232040, "epoch": 1381} {"train_loss": -11.649820327758789, "global_step": 232041, "epoch": 1381} {"train_loss": -11.373725891113281, "global_step": 232042, "epoch": 1381} {"train_loss": -11.673428535461426, "global_step": 232043, "epoch": 1381} {"train_loss": -11.625155448913574, "global_step": 232044, "epoch": 1381} {"train_loss": -11.73858642578125, "global_step": 232045, "epoch": 1381} {"train_loss": -11.54788589477539, "global_step": 232046, "epoch": 1381} {"train_loss": -11.744963645935059, "global_step": 232047, "epoch": 1381} {"train_loss": -11.783442497253418, "global_step": 232048, "epoch": 1381} {"train_loss": -11.84579086303711, "global_step": 232049, "epoch": 1381} {"train_loss": -11.675874710083008, "global_step": 232050, "epoch": 1381} {"train_loss": -11.798195838928223, "global_step": 232051, "epoch": 1381} {"train_loss": -11.787957191467285, "global_step": 232052, "epoch": 1381} {"train_loss": -11.881181716918945, "global_step": 232053, "epoch": 1381} {"train_loss": -11.702117919921875, "global_step": 232054, "epoch": 1381} {"train_loss": -11.56007194519043, "global_step": 232055, "epoch": 1381} {"train_loss": -11.665855407714844, "global_step": 232056, "epoch": 1381} {"train_loss": -11.849847793579102, "global_step": 232057, "epoch": 1381} {"train_loss": -11.87729263305664, "global_step": 232058, "epoch": 1381} {"train_loss": -11.819644927978516, "global_step": 232059, "epoch": 1381} {"train_loss": -11.93893051147461, "global_step": 232060, "epoch": 1381} {"train_loss": -12.024149894714355, "global_step": 232061, "epoch": 1381} {"train_loss": -11.911787986755371, "global_step": 232062, "epoch": 1381} {"train_loss": -11.861234664916992, "global_step": 232063, "epoch": 1381} {"train_loss": -11.935544967651367, "global_step": 232064, "epoch": 1381} {"train_loss": -12.121618270874023, "global_step": 232065, "epoch": 1381} {"train_loss": -12.111166954040527, "global_step": 232066, "epoch": 1381} {"train_loss": -11.900735855102539, "global_step": 232067, "epoch": 1381} {"train_loss": -12.137171745300293, "global_step": 232068, "epoch": 1381} {"train_loss": -12.085155487060547, "global_step": 232069, "epoch": 1381} {"train_loss": -11.870615005493164, "global_step": 232070, "epoch": 1381} {"train_loss": -11.944955825805664, "global_step": 232071, "epoch": 1381} {"train_loss": -11.918172836303711, "global_step": 232072, "epoch": 1381} {"train_loss": -12.0447998046875, "global_step": 232073, "epoch": 1381} {"train_loss": -12.082562446594238, "global_step": 232074, "epoch": 1381} {"train_loss": -11.984797477722168, "global_step": 232075, "epoch": 1381} {"train_loss": -12.065422058105469, "global_step": 232076, "epoch": 1381} {"train_loss": -11.676351547241211, "global_step": 232077, "epoch": 1381} {"train_loss": -11.931838989257812, "global_step": 232078, "epoch": 1381} {"train_loss": -11.938430786132812, "global_step": 232079, "epoch": 1381} {"train_loss": -11.534664154052734, "global_step": 232080, "epoch": 1381} {"train_loss": -12.166532516479492, "global_step": 232081, "epoch": 1381} {"train_loss": -11.784778594970703, "global_step": 232082, "epoch": 1381} {"train_loss": -11.943161964416504, "global_step": 232083, "epoch": 1381} {"train_loss": -11.874106407165527, "global_step": 232084, "epoch": 1381} {"train_loss": -11.534577369689941, "global_step": 232085, "epoch": 1381} {"train_loss": -11.63109016418457, "global_step": 232086, "epoch": 1381} {"train_loss": -12.025228500366211, "global_step": 232087, "epoch": 1381} {"train_loss": -11.764666557312012, "global_step": 232088, "epoch": 1381} {"train_loss": -11.565077781677246, "global_step": 232089, "epoch": 1381} {"train_loss": -11.348705291748047, "global_step": 232090, "epoch": 1381} {"train_loss": -11.904937744140625, "global_step": 232091, "epoch": 1381} {"train_loss": -11.558418273925781, "global_step": 232092, "epoch": 1381} {"train_loss": -11.579048156738281, "global_step": 232093, "epoch": 1381} {"train_loss": -11.680008888244629, "global_step": 232094, "epoch": 1381} {"train_loss": -11.871360778808594, "global_step": 232095, "epoch": 1381} {"train_loss": -11.522028923034668, "global_step": 232096, "epoch": 1381} {"train_loss": -11.929389953613281, "global_step": 232097, "epoch": 1381} {"train_loss": -11.6474609375, "global_step": 232098, "epoch": 1381} {"train_loss": -10.947586059570312, "global_step": 232099, "epoch": 1381} {"train_loss": -11.279938697814941, "global_step": 232100, "epoch": 1381} {"train_loss": -11.92046070098877, "global_step": 232101, "epoch": 1381} {"train_loss": -10.304559707641602, "global_step": 232102, "epoch": 1381} {"train_loss": -11.341119766235352, "global_step": 232103, "epoch": 1381} {"train_loss": -11.198272705078125, "global_step": 232104, "epoch": 1381} {"train_loss": -10.628646850585938, "global_step": 232105, "epoch": 1381} {"train_loss": -11.216361045837402, "global_step": 232106, "epoch": 1381} {"train_loss": -10.939615249633789, "global_step": 232107, "epoch": 1381} {"train_loss": -9.83180046081543, "global_step": 232108, "epoch": 1381} {"train_loss": -11.756851196289062, "global_step": 232109, "epoch": 1381} {"train_loss": -10.155900955200195, "global_step": 232110, "epoch": 1381} {"train_loss": -11.09836483001709, "global_step": 232111, "epoch": 1381} {"train_loss": -11.106472969055176, "global_step": 232112, "epoch": 1381} {"train_loss": -10.713232040405273, "global_step": 232113, "epoch": 1381} {"train_loss": -10.744431495666504, "global_step": 232114, "epoch": 1381} {"train_loss": -10.210460662841797, "global_step": 232115, "epoch": 1381} {"train_loss": -11.176811218261719, "global_step": 232116, "epoch": 1381} {"train_loss": -10.912252426147461, "global_step": 232117, "epoch": 1381} {"train_loss": -11.253288269042969, "global_step": 232118, "epoch": 1381} {"train_loss": -11.252138137817383, "global_step": 232119, "epoch": 1381} {"train_loss": -11.741205215454102, "global_step": 232120, "epoch": 1381} {"train_loss": -11.384711265563965, "global_step": 232121, "epoch": 1381} {"train_loss": -11.258216857910156, "global_step": 232122, "epoch": 1381} {"train_loss": -11.251421928405762, "global_step": 232123, "epoch": 1381} {"train_loss": -11.15485668182373, "global_step": 232124, "epoch": 1381} {"train_loss": -11.476318359375, "global_step": 232125, "epoch": 1381} {"train_loss": -11.513906478881836, "global_step": 232126, "epoch": 1381} {"train_loss": -11.1402587890625, "global_step": 232127, "epoch": 1381} {"train_loss": -11.615201950073242, "global_step": 232128, "epoch": 1381} {"train_loss": -11.211365699768066, "global_step": 232129, "epoch": 1381} {"train_loss": -11.21196174621582, "global_step": 232130, "epoch": 1381} {"train_loss": -11.718399047851562, "global_step": 232131, "epoch": 1381} {"train_loss": -11.077167510986328, "global_step": 232132, "epoch": 1381} {"train_loss": -11.517704010009766, "global_step": 232133, "epoch": 1381} {"train_loss": -11.030623435974121, "global_step": 232134, "epoch": 1381} {"train_loss": -11.485345840454102, "global_step": 232135, "epoch": 1381} {"train_loss": -11.369253158569336, "global_step": 232136, "epoch": 1381} {"train_loss": -11.48230266571045, "global_step": 232137, "epoch": 1381} {"train_loss": -11.58922290802002, "global_step": 232138, "epoch": 1381} {"train_loss": -11.768746376037598, "global_step": 232139, "epoch": 1381} {"train_loss": -11.731404304504395, "global_step": 232140, "epoch": 1381} {"train_loss": -11.669044494628906, "global_step": 232141, "epoch": 1381} {"train_loss": -11.64156436920166, "global_step": 232142, "epoch": 1381} {"train_loss": -11.704435348510742, "global_step": 232143, "epoch": 1381} {"train_loss": -11.742401123046875, "global_step": 232144, "epoch": 1381} {"train_loss": -11.652627944946289, "global_step": 232145, "epoch": 1381} {"train_loss": -11.64986801147461, "global_step": 232146, "epoch": 1381} {"train_loss": -11.619543075561523, "global_step": 232147, "epoch": 1381} {"train_loss": -11.778044700622559, "global_step": 232148, "epoch": 1381} {"train_loss": -11.595695495605469, "global_step": 232149, "epoch": 1381} {"train_loss": -11.869632720947266, "global_step": 232150, "epoch": 1381} {"train_loss": -11.695571899414062, "global_step": 232151, "epoch": 1381} {"train_loss": -11.947214126586914, "global_step": 232152, "epoch": 1381} {"train_loss": -11.670272827148438, "global_step": 232153, "epoch": 1381} {"train_loss": -11.668864250183105, "global_step": 232154, "epoch": 1381} {"train_loss": -11.971019744873047, "global_step": 232155, "epoch": 1381} {"train_loss": -11.68076229095459, "global_step": 232156, "epoch": 1381} {"train_loss": -11.848278045654297, "global_step": 232157, "epoch": 1381} {"train_loss": -11.763669967651367, "global_step": 232158, "epoch": 1381} {"train_loss": -11.84615421295166, "global_step": 232159, "epoch": 1381} {"train_loss": -11.812700271606445, "global_step": 232160, "epoch": 1381} {"train_loss": -12.030040740966797, "global_step": 232161, "epoch": 1381} {"train_loss": -11.889537811279297, "global_step": 232162, "epoch": 1381} {"train_loss": -12.033866882324219, "global_step": 232163, "epoch": 1381} {"train_loss": -11.522756576538086, "global_step": 232164, "epoch": 1381} {"train_loss": -11.96006965637207, "global_step": 232165, "epoch": 1381} {"train_loss": -11.945767402648926, "global_step": 232166, "epoch": 1381} {"train_loss": -11.998510360717773, "global_step": 232167, "epoch": 1381} {"train_loss": -12.072145462036133, "global_step": 232168, "epoch": 1381} {"train_loss": -11.953206062316895, "global_step": 232169, "epoch": 1381} {"train_loss": -12.036720275878906, "global_step": 232170, "epoch": 1381} {"train_loss": -12.021013259887695, "global_step": 232171, "epoch": 1381} {"train_loss": -11.779081344604492, "global_step": 232172, "epoch": 1381} {"train_loss": -11.700450897216797, "global_step": 232173, "epoch": 1381} {"train_loss": -11.702059745788574, "global_step": 232174, "epoch": 1381} {"train_loss": -11.496605384917487, "global_step": 232175, "epoch": 1381, "val_loss": 264334.09375} {"train_loss": -12.152839660644531, "global_step": 232176, "epoch": 1382} {"train_loss": -11.639161109924316, "global_step": 232177, "epoch": 1382} {"train_loss": -11.793880462646484, "global_step": 232178, "epoch": 1382} {"train_loss": -11.292646408081055, "global_step": 232179, "epoch": 1382} {"train_loss": -11.15152359008789, "global_step": 232180, "epoch": 1382} {"train_loss": -11.605249404907227, "global_step": 232181, "epoch": 1382} {"train_loss": -11.816750526428223, "global_step": 232182, "epoch": 1382} {"train_loss": -11.551214218139648, "global_step": 232183, "epoch": 1382} {"train_loss": -11.520219802856445, "global_step": 232184, "epoch": 1382} {"train_loss": -11.668216705322266, "global_step": 232185, "epoch": 1382} {"train_loss": -11.882867813110352, "global_step": 232186, "epoch": 1382} {"train_loss": -11.573184967041016, "global_step": 232187, "epoch": 1382} {"train_loss": -11.62592887878418, "global_step": 232188, "epoch": 1382} {"train_loss": -12.112356185913086, "global_step": 232189, "epoch": 1382} {"train_loss": -11.998746871948242, "global_step": 232190, "epoch": 1382} {"train_loss": -11.921436309814453, "global_step": 232191, "epoch": 1382} {"train_loss": -12.069252967834473, "global_step": 232192, "epoch": 1382} {"train_loss": -11.479198455810547, "global_step": 232193, "epoch": 1382} {"train_loss": -11.752098083496094, "global_step": 232194, "epoch": 1382} {"train_loss": -11.925064086914062, "global_step": 232195, "epoch": 1382} {"train_loss": -11.60842514038086, "global_step": 232196, "epoch": 1382} {"train_loss": -11.968860626220703, "global_step": 232197, "epoch": 1382} {"train_loss": -11.985088348388672, "global_step": 232198, "epoch": 1382} {"train_loss": -11.397348403930664, "global_step": 232199, "epoch": 1382} {"train_loss": -11.668296813964844, "global_step": 232200, "epoch": 1382} {"train_loss": -11.61780834197998, "global_step": 232201, "epoch": 1382} {"train_loss": -11.198881149291992, "global_step": 232202, "epoch": 1382} {"train_loss": -12.10287094116211, "global_step": 232203, "epoch": 1382} {"train_loss": -11.736701965332031, "global_step": 232204, "epoch": 1382} {"train_loss": -11.643259048461914, "global_step": 232205, "epoch": 1382} {"train_loss": -11.782022476196289, "global_step": 232206, "epoch": 1382} {"train_loss": -11.628787994384766, "global_step": 232207, "epoch": 1382} {"train_loss": -11.682048797607422, "global_step": 232208, "epoch": 1382} {"train_loss": -12.094188690185547, "global_step": 232209, "epoch": 1382} {"train_loss": -11.395270347595215, "global_step": 232210, "epoch": 1382} {"train_loss": -11.431489944458008, "global_step": 232211, "epoch": 1382} {"train_loss": -12.07312297821045, "global_step": 232212, "epoch": 1382} {"train_loss": -11.62997817993164, "global_step": 232213, "epoch": 1382} {"train_loss": -11.655807495117188, "global_step": 232214, "epoch": 1382} {"train_loss": -11.874492645263672, "global_step": 232215, "epoch": 1382} {"train_loss": -11.459671020507812, "global_step": 232216, "epoch": 1382} {"train_loss": -11.24728012084961, "global_step": 232217, "epoch": 1382} {"train_loss": -12.035551071166992, "global_step": 232218, "epoch": 1382} {"train_loss": -11.48932933807373, "global_step": 232219, "epoch": 1382} {"train_loss": -11.664009094238281, "global_step": 232220, "epoch": 1382} {"train_loss": -10.791582107543945, "global_step": 232221, "epoch": 1382} {"train_loss": -11.289979934692383, "global_step": 232222, "epoch": 1382} {"train_loss": -10.834196090698242, "global_step": 232223, "epoch": 1382} {"train_loss": -11.381024360656738, "global_step": 232224, "epoch": 1382} {"train_loss": -10.4617338180542, "global_step": 232225, "epoch": 1382} {"train_loss": -11.543426513671875, "global_step": 232226, "epoch": 1382} {"train_loss": -11.722256660461426, "global_step": 232227, "epoch": 1382} {"train_loss": -10.656089782714844, "global_step": 232228, "epoch": 1382} {"train_loss": -10.518158912658691, "global_step": 232229, "epoch": 1382} {"train_loss": -10.708322525024414, "global_step": 232230, "epoch": 1382} {"train_loss": -11.477996826171875, "global_step": 232231, "epoch": 1382} {"train_loss": -9.56379508972168, "global_step": 232232, "epoch": 1382} {"train_loss": -11.245113372802734, "global_step": 232233, "epoch": 1382} {"train_loss": -11.121907234191895, "global_step": 232234, "epoch": 1382} {"train_loss": -11.133563995361328, "global_step": 232235, "epoch": 1382} {"train_loss": -11.580557823181152, "global_step": 232236, "epoch": 1382} {"train_loss": -11.293067932128906, "global_step": 232237, "epoch": 1382} {"train_loss": -11.411019325256348, "global_step": 232238, "epoch": 1382} {"train_loss": -11.215973854064941, "global_step": 232239, "epoch": 1382} {"train_loss": -11.226608276367188, "global_step": 232240, "epoch": 1382} {"train_loss": -11.334019660949707, "global_step": 232241, "epoch": 1382} {"train_loss": -11.589463233947754, "global_step": 232242, "epoch": 1382} {"train_loss": -10.995634078979492, "global_step": 232243, "epoch": 1382} {"train_loss": -11.572625160217285, "global_step": 232244, "epoch": 1382} {"train_loss": -11.057262420654297, "global_step": 232245, "epoch": 1382} {"train_loss": -11.535032272338867, "global_step": 232246, "epoch": 1382} {"train_loss": -11.322364807128906, "global_step": 232247, "epoch": 1382} {"train_loss": -11.002921104431152, "global_step": 232248, "epoch": 1382} {"train_loss": -11.422259330749512, "global_step": 232249, "epoch": 1382} {"train_loss": -10.781831741333008, "global_step": 232250, "epoch": 1382} {"train_loss": -10.261184692382812, "global_step": 232251, "epoch": 1382} {"train_loss": -11.0037202835083, "global_step": 232252, "epoch": 1382} {"train_loss": -8.727052688598633, "global_step": 232253, "epoch": 1382} {"train_loss": -10.941837310791016, "global_step": 232254, "epoch": 1382} {"train_loss": -9.256128311157227, "global_step": 232255, "epoch": 1382} {"train_loss": -11.080745697021484, "global_step": 232256, "epoch": 1382} {"train_loss": -8.875903129577637, "global_step": 232257, "epoch": 1382} {"train_loss": -11.015496253967285, "global_step": 232258, "epoch": 1382} {"train_loss": -10.279353141784668, "global_step": 232259, "epoch": 1382} {"train_loss": -11.270380973815918, "global_step": 232260, "epoch": 1382} {"train_loss": -10.421202659606934, "global_step": 232261, "epoch": 1382} {"train_loss": -11.252532958984375, "global_step": 232262, "epoch": 1382} {"train_loss": -11.201777458190918, "global_step": 232263, "epoch": 1382} {"train_loss": -11.258398056030273, "global_step": 232264, "epoch": 1382} {"train_loss": -11.147331237792969, "global_step": 232265, "epoch": 1382} {"train_loss": -11.418933868408203, "global_step": 232266, "epoch": 1382} {"train_loss": -11.39082145690918, "global_step": 232267, "epoch": 1382} {"train_loss": -11.27700424194336, "global_step": 232268, "epoch": 1382} {"train_loss": -11.375045776367188, "global_step": 232269, "epoch": 1382} {"train_loss": -11.284889221191406, "global_step": 232270, "epoch": 1382} {"train_loss": -11.303860664367676, "global_step": 232271, "epoch": 1382} {"train_loss": -11.017041206359863, "global_step": 232272, "epoch": 1382} {"train_loss": -11.59996223449707, "global_step": 232273, "epoch": 1382} {"train_loss": -11.386519432067871, "global_step": 232274, "epoch": 1382} {"train_loss": -11.522872924804688, "global_step": 232275, "epoch": 1382} {"train_loss": -11.3141508102417, "global_step": 232276, "epoch": 1382} {"train_loss": -11.503859519958496, "global_step": 232277, "epoch": 1382} {"train_loss": -11.414889335632324, "global_step": 232278, "epoch": 1382} {"train_loss": -11.331897735595703, "global_step": 232279, "epoch": 1382} {"train_loss": -11.531286239624023, "global_step": 232280, "epoch": 1382} {"train_loss": -11.68576717376709, "global_step": 232281, "epoch": 1382} {"train_loss": -11.682992935180664, "global_step": 232282, "epoch": 1382} {"train_loss": -11.486246109008789, "global_step": 232283, "epoch": 1382} {"train_loss": -11.577823638916016, "global_step": 232284, "epoch": 1382} {"train_loss": -11.458205223083496, "global_step": 232285, "epoch": 1382} {"train_loss": -11.831989288330078, "global_step": 232286, "epoch": 1382} {"train_loss": -11.790733337402344, "global_step": 232287, "epoch": 1382} {"train_loss": -11.727612495422363, "global_step": 232288, "epoch": 1382} {"train_loss": -11.542383193969727, "global_step": 232289, "epoch": 1382} {"train_loss": -11.527034759521484, "global_step": 232290, "epoch": 1382} {"train_loss": -11.636067390441895, "global_step": 232291, "epoch": 1382} {"train_loss": -11.81248664855957, "global_step": 232292, "epoch": 1382} {"train_loss": -12.044474601745605, "global_step": 232293, "epoch": 1382} {"train_loss": -11.830469131469727, "global_step": 232294, "epoch": 1382} {"train_loss": -11.720197677612305, "global_step": 232295, "epoch": 1382} {"train_loss": -11.922607421875, "global_step": 232296, "epoch": 1382} {"train_loss": -11.856857299804688, "global_step": 232297, "epoch": 1382} {"train_loss": -11.939972877502441, "global_step": 232298, "epoch": 1382} {"train_loss": -11.828178405761719, "global_step": 232299, "epoch": 1382} {"train_loss": -12.001472473144531, "global_step": 232300, "epoch": 1382} {"train_loss": -11.86570930480957, "global_step": 232301, "epoch": 1382} {"train_loss": -11.999198913574219, "global_step": 232302, "epoch": 1382} {"train_loss": -12.085261344909668, "global_step": 232303, "epoch": 1382} {"train_loss": -12.111745834350586, "global_step": 232304, "epoch": 1382} {"train_loss": -11.936092376708984, "global_step": 232305, "epoch": 1382} {"train_loss": -12.013391494750977, "global_step": 232306, "epoch": 1382} {"train_loss": -11.94593620300293, "global_step": 232307, "epoch": 1382} {"train_loss": -11.85569953918457, "global_step": 232308, "epoch": 1382} {"train_loss": -11.805534362792969, "global_step": 232309, "epoch": 1382} {"train_loss": -11.77932357788086, "global_step": 232310, "epoch": 1382} {"train_loss": -11.515115737915039, "global_step": 232311, "epoch": 1382} {"train_loss": -11.731271743774414, "global_step": 232312, "epoch": 1382} {"train_loss": -11.904784202575684, "global_step": 232313, "epoch": 1382} {"train_loss": -11.781234741210938, "global_step": 232314, "epoch": 1382} {"train_loss": -11.763896942138672, "global_step": 232315, "epoch": 1382} {"train_loss": -12.022331237792969, "global_step": 232316, "epoch": 1382} {"train_loss": -11.830397605895996, "global_step": 232317, "epoch": 1382} {"train_loss": -11.947175979614258, "global_step": 232318, "epoch": 1382} {"train_loss": -11.936426162719727, "global_step": 232319, "epoch": 1382} {"train_loss": -11.919483184814453, "global_step": 232320, "epoch": 1382} {"train_loss": -11.785160064697266, "global_step": 232321, "epoch": 1382} {"train_loss": -12.157496452331543, "global_step": 232322, "epoch": 1382} {"train_loss": -11.899093627929688, "global_step": 232323, "epoch": 1382} {"train_loss": -11.797606468200684, "global_step": 232324, "epoch": 1382} {"train_loss": -11.92796802520752, "global_step": 232325, "epoch": 1382} {"train_loss": -11.839164733886719, "global_step": 232326, "epoch": 1382} {"train_loss": -11.747272491455078, "global_step": 232327, "epoch": 1382} {"train_loss": -11.723929405212402, "global_step": 232328, "epoch": 1382} {"train_loss": -12.018704414367676, "global_step": 232329, "epoch": 1382} {"train_loss": -10.58866024017334, "global_step": 232330, "epoch": 1382} {"train_loss": -11.53985595703125, "global_step": 232331, "epoch": 1382} {"train_loss": -11.844783782958984, "global_step": 232332, "epoch": 1382} {"train_loss": -11.304658889770508, "global_step": 232333, "epoch": 1382} {"train_loss": -11.62497329711914, "global_step": 232334, "epoch": 1382} {"train_loss": -11.699261665344238, "global_step": 232335, "epoch": 1382} {"train_loss": -12.140360832214355, "global_step": 232336, "epoch": 1382} {"train_loss": -11.749156951904297, "global_step": 232337, "epoch": 1382} {"train_loss": -11.709810256958008, "global_step": 232338, "epoch": 1382} {"train_loss": -11.85333251953125, "global_step": 232339, "epoch": 1382} {"train_loss": -11.66767692565918, "global_step": 232340, "epoch": 1382} {"train_loss": -11.767213821411133, "global_step": 232341, "epoch": 1382} {"train_loss": -11.553327560424805, "global_step": 232342, "epoch": 1382} {"train_loss": -11.493359066191173, "global_step": 232343, "epoch": 1382, "val_loss": 263358.09375} {"train_loss": -11.89181137084961, "global_step": 232344, "epoch": 1383} {"train_loss": -11.149892807006836, "global_step": 232345, "epoch": 1383} {"train_loss": -11.591468811035156, "global_step": 232346, "epoch": 1383} {"train_loss": -11.610701560974121, "global_step": 232347, "epoch": 1383} {"train_loss": -11.815608978271484, "global_step": 232348, "epoch": 1383} {"train_loss": -11.572824478149414, "global_step": 232349, "epoch": 1383} {"train_loss": -11.842424392700195, "global_step": 232350, "epoch": 1383} {"train_loss": -11.582637786865234, "global_step": 232351, "epoch": 1383} {"train_loss": -11.713695526123047, "global_step": 232352, "epoch": 1383} {"train_loss": -11.811379432678223, "global_step": 232353, "epoch": 1383} {"train_loss": -11.625730514526367, "global_step": 232354, "epoch": 1383} {"train_loss": -11.896242141723633, "global_step": 232355, "epoch": 1383} {"train_loss": -11.830244064331055, "global_step": 232356, "epoch": 1383} {"train_loss": -12.01844596862793, "global_step": 232357, "epoch": 1383} {"train_loss": -11.905333518981934, "global_step": 232358, "epoch": 1383} {"train_loss": -11.807801246643066, "global_step": 232359, "epoch": 1383} {"train_loss": -11.737398147583008, "global_step": 232360, "epoch": 1383} {"train_loss": -11.803380966186523, "global_step": 232361, "epoch": 1383} {"train_loss": -11.689459800720215, "global_step": 232362, "epoch": 1383} {"train_loss": -11.536155700683594, "global_step": 232363, "epoch": 1383} {"train_loss": -11.766408920288086, "global_step": 232364, "epoch": 1383} {"train_loss": -11.877823829650879, "global_step": 232365, "epoch": 1383} {"train_loss": -11.503419876098633, "global_step": 232366, "epoch": 1383} {"train_loss": -11.518320083618164, "global_step": 232367, "epoch": 1383} {"train_loss": -11.178315162658691, "global_step": 232368, "epoch": 1383} {"train_loss": -11.78326416015625, "global_step": 232369, "epoch": 1383} {"train_loss": -11.627126693725586, "global_step": 232370, "epoch": 1383} {"train_loss": -11.448105812072754, "global_step": 232371, "epoch": 1383} {"train_loss": -11.550521850585938, "global_step": 232372, "epoch": 1383} {"train_loss": -11.953380584716797, "global_step": 232373, "epoch": 1383} {"train_loss": -10.980681419372559, "global_step": 232374, "epoch": 1383} {"train_loss": -11.073429107666016, "global_step": 232375, "epoch": 1383} {"train_loss": -10.710220336914062, "global_step": 232376, "epoch": 1383} {"train_loss": -11.576026916503906, "global_step": 232377, "epoch": 1383} {"train_loss": -11.737350463867188, "global_step": 232378, "epoch": 1383} {"train_loss": -10.449596405029297, "global_step": 232379, "epoch": 1383} {"train_loss": -10.05262565612793, "global_step": 232380, "epoch": 1383} {"train_loss": -11.420284271240234, "global_step": 232381, "epoch": 1383} {"train_loss": -9.54826545715332, "global_step": 232382, "epoch": 1383} {"train_loss": -9.39001178741455, "global_step": 232383, "epoch": 1383} {"train_loss": -11.356868743896484, "global_step": 232384, "epoch": 1383} {"train_loss": -8.755693435668945, "global_step": 232385, "epoch": 1383} {"train_loss": -9.069938659667969, "global_step": 232386, "epoch": 1383} {"train_loss": -10.367321968078613, "global_step": 232387, "epoch": 1383} {"train_loss": -11.080738067626953, "global_step": 232388, "epoch": 1383} {"train_loss": -9.450949668884277, "global_step": 232389, "epoch": 1383} {"train_loss": -10.51820182800293, "global_step": 232390, "epoch": 1383} {"train_loss": -10.260221481323242, "global_step": 232391, "epoch": 1383} {"train_loss": -10.043153762817383, "global_step": 232392, "epoch": 1383} {"train_loss": -11.090776443481445, "global_step": 232393, "epoch": 1383} {"train_loss": -10.672677993774414, "global_step": 232394, "epoch": 1383} {"train_loss": -10.425548553466797, "global_step": 232395, "epoch": 1383} {"train_loss": -11.422674179077148, "global_step": 232396, "epoch": 1383} {"train_loss": -10.186298370361328, "global_step": 232397, "epoch": 1383} {"train_loss": -10.813441276550293, "global_step": 232398, "epoch": 1383} {"train_loss": -10.619248390197754, "global_step": 232399, "epoch": 1383} {"train_loss": -10.565727233886719, "global_step": 232400, "epoch": 1383} {"train_loss": -11.168070793151855, "global_step": 232401, "epoch": 1383} {"train_loss": -10.797971725463867, "global_step": 232402, "epoch": 1383} {"train_loss": -10.955509185791016, "global_step": 232403, "epoch": 1383} {"train_loss": -11.019502639770508, "global_step": 232404, "epoch": 1383} {"train_loss": -11.1104097366333, "global_step": 232405, "epoch": 1383} {"train_loss": -11.183853149414062, "global_step": 232406, "epoch": 1383} {"train_loss": -11.409873008728027, "global_step": 232407, "epoch": 1383} {"train_loss": -11.094884872436523, "global_step": 232408, "epoch": 1383} {"train_loss": -11.36530590057373, "global_step": 232409, "epoch": 1383} {"train_loss": -11.2720947265625, "global_step": 232410, "epoch": 1383} {"train_loss": -11.304445266723633, "global_step": 232411, "epoch": 1383} {"train_loss": -11.401171684265137, "global_step": 232412, "epoch": 1383} {"train_loss": -11.719364166259766, "global_step": 232413, "epoch": 1383} {"train_loss": -11.604532241821289, "global_step": 232414, "epoch": 1383} {"train_loss": -11.609251976013184, "global_step": 232415, "epoch": 1383} {"train_loss": -11.753973960876465, "global_step": 232416, "epoch": 1383} {"train_loss": -11.454883575439453, "global_step": 232417, "epoch": 1383} {"train_loss": -11.466269493103027, "global_step": 232418, "epoch": 1383} {"train_loss": -11.620304107666016, "global_step": 232419, "epoch": 1383} {"train_loss": -11.621691703796387, "global_step": 232420, "epoch": 1383} {"train_loss": -11.595890045166016, "global_step": 232421, "epoch": 1383} {"train_loss": -11.484234809875488, "global_step": 232422, "epoch": 1383} {"train_loss": -11.384742736816406, "global_step": 232423, "epoch": 1383} {"train_loss": -11.7154541015625, "global_step": 232424, "epoch": 1383} {"train_loss": -11.3133544921875, "global_step": 232425, "epoch": 1383} {"train_loss": -11.734590530395508, "global_step": 232426, "epoch": 1383} {"train_loss": -11.496678352355957, "global_step": 232427, "epoch": 1383} {"train_loss": -11.602693557739258, "global_step": 232428, "epoch": 1383} {"train_loss": -11.720344543457031, "global_step": 232429, "epoch": 1383} {"train_loss": -11.708341598510742, "global_step": 232430, "epoch": 1383} {"train_loss": -11.562646865844727, "global_step": 232431, "epoch": 1383} {"train_loss": -11.67088794708252, "global_step": 232432, "epoch": 1383} {"train_loss": -11.480608940124512, "global_step": 232433, "epoch": 1383} {"train_loss": -11.754203796386719, "global_step": 232434, "epoch": 1383} {"train_loss": -11.760605812072754, "global_step": 232435, "epoch": 1383} {"train_loss": -11.665637969970703, "global_step": 232436, "epoch": 1383} {"train_loss": -11.750199317932129, "global_step": 232437, "epoch": 1383} {"train_loss": -11.590959548950195, "global_step": 232438, "epoch": 1383} {"train_loss": -11.806072235107422, "global_step": 232439, "epoch": 1383} {"train_loss": -11.466774940490723, "global_step": 232440, "epoch": 1383} {"train_loss": -11.592897415161133, "global_step": 232441, "epoch": 1383} {"train_loss": -11.401191711425781, "global_step": 232442, "epoch": 1383} {"train_loss": -11.932083129882812, "global_step": 232443, "epoch": 1383} {"train_loss": -11.719058990478516, "global_step": 232444, "epoch": 1383} {"train_loss": -11.680669784545898, "global_step": 232445, "epoch": 1383} {"train_loss": -11.782577514648438, "global_step": 232446, "epoch": 1383} {"train_loss": -11.563852310180664, "global_step": 232447, "epoch": 1383} {"train_loss": -11.878992080688477, "global_step": 232448, "epoch": 1383} {"train_loss": -11.772468566894531, "global_step": 232449, "epoch": 1383} {"train_loss": -11.860974311828613, "global_step": 232450, "epoch": 1383} {"train_loss": -11.985894203186035, "global_step": 232451, "epoch": 1383} {"train_loss": -11.913620948791504, "global_step": 232452, "epoch": 1383} {"train_loss": -11.974372863769531, "global_step": 232453, "epoch": 1383} {"train_loss": -11.789873123168945, "global_step": 232454, "epoch": 1383} {"train_loss": -11.82151985168457, "global_step": 232455, "epoch": 1383} {"train_loss": -11.99843978881836, "global_step": 232456, "epoch": 1383} {"train_loss": -11.963785171508789, "global_step": 232457, "epoch": 1383} {"train_loss": -11.91671371459961, "global_step": 232458, "epoch": 1383} {"train_loss": -12.015983581542969, "global_step": 232459, "epoch": 1383} {"train_loss": -12.154617309570312, "global_step": 232460, "epoch": 1383} {"train_loss": -11.815180778503418, "global_step": 232461, "epoch": 1383} {"train_loss": -11.874849319458008, "global_step": 232462, "epoch": 1383} {"train_loss": -12.174932479858398, "global_step": 232463, "epoch": 1383} {"train_loss": -12.192035675048828, "global_step": 232464, "epoch": 1383} {"train_loss": -12.000802993774414, "global_step": 232465, "epoch": 1383} {"train_loss": -11.901558876037598, "global_step": 232466, "epoch": 1383} {"train_loss": -11.942699432373047, "global_step": 232467, "epoch": 1383} {"train_loss": -11.929523468017578, "global_step": 232468, "epoch": 1383} {"train_loss": -12.08929443359375, "global_step": 232469, "epoch": 1383} {"train_loss": -11.847671508789062, "global_step": 232470, "epoch": 1383} {"train_loss": -12.22509765625, "global_step": 232471, "epoch": 1383} {"train_loss": -11.906705856323242, "global_step": 232472, "epoch": 1383} {"train_loss": -12.257057189941406, "global_step": 232473, "epoch": 1383} {"train_loss": -11.95402717590332, "global_step": 232474, "epoch": 1383} {"train_loss": -12.304525375366211, "global_step": 232475, "epoch": 1383} {"train_loss": -11.881204605102539, "global_step": 232476, "epoch": 1383} {"train_loss": -11.936803817749023, "global_step": 232477, "epoch": 1383} {"train_loss": -11.951817512512207, "global_step": 232478, "epoch": 1383} {"train_loss": -11.625710487365723, "global_step": 232479, "epoch": 1383} {"train_loss": -11.698009490966797, "global_step": 232480, "epoch": 1383} {"train_loss": -11.575906753540039, "global_step": 232481, "epoch": 1383} {"train_loss": -11.571958541870117, "global_step": 232482, "epoch": 1383} {"train_loss": -11.865625381469727, "global_step": 232483, "epoch": 1383} {"train_loss": -11.765348434448242, "global_step": 232484, "epoch": 1383} {"train_loss": -11.814932823181152, "global_step": 232485, "epoch": 1383} {"train_loss": -11.795137405395508, "global_step": 232486, "epoch": 1383} {"train_loss": -11.860363006591797, "global_step": 232487, "epoch": 1383} {"train_loss": -11.801606178283691, "global_step": 232488, "epoch": 1383} {"train_loss": -12.212276458740234, "global_step": 232489, "epoch": 1383} {"train_loss": -11.915430068969727, "global_step": 232490, "epoch": 1383} {"train_loss": -11.6987886428833, "global_step": 232491, "epoch": 1383} {"train_loss": -12.075361251831055, "global_step": 232492, "epoch": 1383} {"train_loss": -11.754708290100098, "global_step": 232493, "epoch": 1383} {"train_loss": -11.261176109313965, "global_step": 232494, "epoch": 1383} {"train_loss": -11.270720481872559, "global_step": 232495, "epoch": 1383} {"train_loss": -11.711038589477539, "global_step": 232496, "epoch": 1383} {"train_loss": -11.57206916809082, "global_step": 232497, "epoch": 1383} {"train_loss": -11.51690673828125, "global_step": 232498, "epoch": 1383} {"train_loss": -10.858451843261719, "global_step": 232499, "epoch": 1383} {"train_loss": -11.406734466552734, "global_step": 232500, "epoch": 1383} {"train_loss": -11.741846084594727, "global_step": 232501, "epoch": 1383} {"train_loss": -11.305991172790527, "global_step": 232502, "epoch": 1383} {"train_loss": -11.375924110412598, "global_step": 232503, "epoch": 1383} {"train_loss": -11.318245887756348, "global_step": 232504, "epoch": 1383} {"train_loss": -11.326675415039062, "global_step": 232505, "epoch": 1383} {"train_loss": -11.498346328735352, "global_step": 232506, "epoch": 1383} {"train_loss": -11.086518287658691, "global_step": 232507, "epoch": 1383} {"train_loss": -11.4249849319458, "global_step": 232508, "epoch": 1383} {"train_loss": -11.501900672912598, "global_step": 232509, "epoch": 1383} {"train_loss": -11.166577339172363, "global_step": 232510, "epoch": 1383} {"train_loss": -11.47723765032632, "global_step": 232511, "epoch": 1383, "val_loss": 258668.078125} {"train_loss": -11.748687744140625, "global_step": 232512, "epoch": 1384} {"train_loss": -11.671286582946777, "global_step": 232513, "epoch": 1384} {"train_loss": -11.127503395080566, "global_step": 232514, "epoch": 1384} {"train_loss": -11.35537338256836, "global_step": 232515, "epoch": 1384} {"train_loss": -11.513635635375977, "global_step": 232516, "epoch": 1384} {"train_loss": -11.464859962463379, "global_step": 232517, "epoch": 1384} {"train_loss": -11.638833045959473, "global_step": 232518, "epoch": 1384} {"train_loss": -11.051507949829102, "global_step": 232519, "epoch": 1384} {"train_loss": -11.44433307647705, "global_step": 232520, "epoch": 1384} {"train_loss": -11.171197891235352, "global_step": 232521, "epoch": 1384} {"train_loss": -11.082025527954102, "global_step": 232522, "epoch": 1384} {"train_loss": -10.945585250854492, "global_step": 232523, "epoch": 1384} {"train_loss": -11.521150588989258, "global_step": 232524, "epoch": 1384} {"train_loss": -10.866601943969727, "global_step": 232525, "epoch": 1384} {"train_loss": -11.109243392944336, "global_step": 232526, "epoch": 1384} {"train_loss": -11.200355529785156, "global_step": 232527, "epoch": 1384} {"train_loss": -11.358478546142578, "global_step": 232528, "epoch": 1384} {"train_loss": -11.096574783325195, "global_step": 232529, "epoch": 1384} {"train_loss": -11.529321670532227, "global_step": 232530, "epoch": 1384} {"train_loss": -11.405659675598145, "global_step": 232531, "epoch": 1384} {"train_loss": -11.509231567382812, "global_step": 232532, "epoch": 1384} {"train_loss": -11.552034378051758, "global_step": 232533, "epoch": 1384} {"train_loss": -11.621896743774414, "global_step": 232534, "epoch": 1384} {"train_loss": -11.429679870605469, "global_step": 232535, "epoch": 1384} {"train_loss": -11.417991638183594, "global_step": 232536, "epoch": 1384} {"train_loss": -11.091728210449219, "global_step": 232537, "epoch": 1384} {"train_loss": -11.6527681350708, "global_step": 232538, "epoch": 1384} {"train_loss": -11.3178071975708, "global_step": 232539, "epoch": 1384} {"train_loss": -11.054880142211914, "global_step": 232540, "epoch": 1384} {"train_loss": -11.023740768432617, "global_step": 232541, "epoch": 1384} {"train_loss": -10.797883987426758, "global_step": 232542, "epoch": 1384} {"train_loss": -10.919392585754395, "global_step": 232543, "epoch": 1384} {"train_loss": -10.836803436279297, "global_step": 232544, "epoch": 1384} {"train_loss": -10.98037338256836, "global_step": 232545, "epoch": 1384} {"train_loss": -11.016034126281738, "global_step": 232546, "epoch": 1384} {"train_loss": -10.96603775024414, "global_step": 232547, "epoch": 1384} {"train_loss": -10.618827819824219, "global_step": 232548, "epoch": 1384} {"train_loss": -11.405145645141602, "global_step": 232549, "epoch": 1384} {"train_loss": -10.480180740356445, "global_step": 232550, "epoch": 1384} {"train_loss": -11.33419418334961, "global_step": 232551, "epoch": 1384} {"train_loss": -10.91581916809082, "global_step": 232552, "epoch": 1384} {"train_loss": -11.243867874145508, "global_step": 232553, "epoch": 1384} {"train_loss": -11.10174560546875, "global_step": 232554, "epoch": 1384} {"train_loss": -11.24439811706543, "global_step": 232555, "epoch": 1384} {"train_loss": -11.621770858764648, "global_step": 232556, "epoch": 1384} {"train_loss": -11.332086563110352, "global_step": 232557, "epoch": 1384} {"train_loss": -11.397550582885742, "global_step": 232558, "epoch": 1384} {"train_loss": -11.347816467285156, "global_step": 232559, "epoch": 1384} {"train_loss": -11.462651252746582, "global_step": 232560, "epoch": 1384} {"train_loss": -11.37096881866455, "global_step": 232561, "epoch": 1384} {"train_loss": -11.54496955871582, "global_step": 232562, "epoch": 1384} {"train_loss": -11.524187088012695, "global_step": 232563, "epoch": 1384} {"train_loss": -11.595962524414062, "global_step": 232564, "epoch": 1384} {"train_loss": -11.689285278320312, "global_step": 232565, "epoch": 1384} {"train_loss": -11.964250564575195, "global_step": 232566, "epoch": 1384} {"train_loss": -11.614221572875977, "global_step": 232567, "epoch": 1384} {"train_loss": -11.272844314575195, "global_step": 232568, "epoch": 1384} {"train_loss": -11.710002899169922, "global_step": 232569, "epoch": 1384} {"train_loss": -11.416818618774414, "global_step": 232570, "epoch": 1384} {"train_loss": -11.618423461914062, "global_step": 232571, "epoch": 1384} {"train_loss": -11.483195304870605, "global_step": 232572, "epoch": 1384} {"train_loss": -11.67324447631836, "global_step": 232573, "epoch": 1384} {"train_loss": -11.596614837646484, "global_step": 232574, "epoch": 1384} {"train_loss": -11.318106651306152, "global_step": 232575, "epoch": 1384} {"train_loss": -11.479278564453125, "global_step": 232576, "epoch": 1384} {"train_loss": -11.353629112243652, "global_step": 232577, "epoch": 1384} {"train_loss": -11.600276947021484, "global_step": 232578, "epoch": 1384} {"train_loss": -11.831114768981934, "global_step": 232579, "epoch": 1384} {"train_loss": -11.542041778564453, "global_step": 232580, "epoch": 1384} {"train_loss": -11.816194534301758, "global_step": 232581, "epoch": 1384} {"train_loss": -11.719705581665039, "global_step": 232582, "epoch": 1384} {"train_loss": -11.827619552612305, "global_step": 232583, "epoch": 1384} {"train_loss": -11.758049011230469, "global_step": 232584, "epoch": 1384} {"train_loss": -11.767483711242676, "global_step": 232585, "epoch": 1384} {"train_loss": -11.655587196350098, "global_step": 232586, "epoch": 1384} {"train_loss": -11.718328475952148, "global_step": 232587, "epoch": 1384} {"train_loss": -11.797662734985352, "global_step": 232588, "epoch": 1384} {"train_loss": -11.933521270751953, "global_step": 232589, "epoch": 1384} {"train_loss": -11.927583694458008, "global_step": 232590, "epoch": 1384} {"train_loss": -11.849632263183594, "global_step": 232591, "epoch": 1384} {"train_loss": -11.835880279541016, "global_step": 232592, "epoch": 1384} {"train_loss": -11.63009262084961, "global_step": 232593, "epoch": 1384} {"train_loss": -11.909128189086914, "global_step": 232594, "epoch": 1384} {"train_loss": -11.857902526855469, "global_step": 232595, "epoch": 1384} {"train_loss": -11.783615112304688, "global_step": 232596, "epoch": 1384} {"train_loss": -11.711896896362305, "global_step": 232597, "epoch": 1384} {"train_loss": -12.023256301879883, "global_step": 232598, "epoch": 1384} {"train_loss": -11.509441375732422, "global_step": 232599, "epoch": 1384} {"train_loss": -11.863584518432617, "global_step": 232600, "epoch": 1384} {"train_loss": -11.926939964294434, "global_step": 232601, "epoch": 1384} {"train_loss": -11.634819030761719, "global_step": 232602, "epoch": 1384} {"train_loss": -11.739920616149902, "global_step": 232603, "epoch": 1384} {"train_loss": -11.668262481689453, "global_step": 232604, "epoch": 1384} {"train_loss": -11.532981872558594, "global_step": 232605, "epoch": 1384} {"train_loss": -11.741037368774414, "global_step": 232606, "epoch": 1384} {"train_loss": -11.675118446350098, "global_step": 232607, "epoch": 1384} {"train_loss": -11.415514945983887, "global_step": 232608, "epoch": 1384} {"train_loss": -11.577783584594727, "global_step": 232609, "epoch": 1384} {"train_loss": -11.487825393676758, "global_step": 232610, "epoch": 1384} {"train_loss": -11.5885009765625, "global_step": 232611, "epoch": 1384} {"train_loss": -11.18984603881836, "global_step": 232612, "epoch": 1384} {"train_loss": -11.267951011657715, "global_step": 232613, "epoch": 1384} {"train_loss": -11.855905532836914, "global_step": 232614, "epoch": 1384} {"train_loss": -11.584037780761719, "global_step": 232615, "epoch": 1384} {"train_loss": -11.489486694335938, "global_step": 232616, "epoch": 1384} {"train_loss": -11.572168350219727, "global_step": 232617, "epoch": 1384} {"train_loss": -11.55746078491211, "global_step": 232618, "epoch": 1384} {"train_loss": -11.989973068237305, "global_step": 232619, "epoch": 1384} {"train_loss": -11.467081069946289, "global_step": 232620, "epoch": 1384} {"train_loss": -11.599298477172852, "global_step": 232621, "epoch": 1384} {"train_loss": -11.890619277954102, "global_step": 232622, "epoch": 1384} {"train_loss": -11.671443939208984, "global_step": 232623, "epoch": 1384} {"train_loss": -11.199283599853516, "global_step": 232624, "epoch": 1384} {"train_loss": -12.00377082824707, "global_step": 232625, "epoch": 1384} {"train_loss": -11.256627082824707, "global_step": 232626, "epoch": 1384} {"train_loss": -11.659232139587402, "global_step": 232627, "epoch": 1384} {"train_loss": -11.911136627197266, "global_step": 232628, "epoch": 1384} {"train_loss": -11.421005249023438, "global_step": 232629, "epoch": 1384} {"train_loss": -11.523141860961914, "global_step": 232630, "epoch": 1384} {"train_loss": -12.017051696777344, "global_step": 232631, "epoch": 1384} {"train_loss": -11.46049690246582, "global_step": 232632, "epoch": 1384} {"train_loss": -11.90202522277832, "global_step": 232633, "epoch": 1384} {"train_loss": -11.732244491577148, "global_step": 232634, "epoch": 1384} {"train_loss": -11.976000785827637, "global_step": 232635, "epoch": 1384} {"train_loss": -11.849567413330078, "global_step": 232636, "epoch": 1384} {"train_loss": -11.785730361938477, "global_step": 232637, "epoch": 1384} {"train_loss": -11.547870635986328, "global_step": 232638, "epoch": 1384} {"train_loss": -11.958551406860352, "global_step": 232639, "epoch": 1384} {"train_loss": -11.601633071899414, "global_step": 232640, "epoch": 1384} {"train_loss": -11.728313446044922, "global_step": 232641, "epoch": 1384} {"train_loss": -11.625690460205078, "global_step": 232642, "epoch": 1384} {"train_loss": -11.562482833862305, "global_step": 232643, "epoch": 1384} {"train_loss": -11.616983413696289, "global_step": 232644, "epoch": 1384} {"train_loss": -11.610487937927246, "global_step": 232645, "epoch": 1384} {"train_loss": -11.766376495361328, "global_step": 232646, "epoch": 1384} {"train_loss": -11.848608016967773, "global_step": 232647, "epoch": 1384} {"train_loss": -11.973413467407227, "global_step": 232648, "epoch": 1384} {"train_loss": -11.946999549865723, "global_step": 232649, "epoch": 1384} {"train_loss": -11.516996383666992, "global_step": 232650, "epoch": 1384} {"train_loss": -11.683664321899414, "global_step": 232651, "epoch": 1384} {"train_loss": -12.124231338500977, "global_step": 232652, "epoch": 1384} {"train_loss": -11.963627815246582, "global_step": 232653, "epoch": 1384} {"train_loss": -11.895848274230957, "global_step": 232654, "epoch": 1384} {"train_loss": -11.919818878173828, "global_step": 232655, "epoch": 1384} {"train_loss": -11.813215255737305, "global_step": 232656, "epoch": 1384} {"train_loss": -11.958429336547852, "global_step": 232657, "epoch": 1384} {"train_loss": -11.48232650756836, "global_step": 232658, "epoch": 1384} {"train_loss": -11.638803482055664, "global_step": 232659, "epoch": 1384} {"train_loss": -11.989072799682617, "global_step": 232660, "epoch": 1384} {"train_loss": -11.810985565185547, "global_step": 232661, "epoch": 1384} {"train_loss": -11.866765975952148, "global_step": 232662, "epoch": 1384} {"train_loss": -11.847990989685059, "global_step": 232663, "epoch": 1384} {"train_loss": -11.554219245910645, "global_step": 232664, "epoch": 1384} {"train_loss": -11.731679916381836, "global_step": 232665, "epoch": 1384} {"train_loss": -11.478950500488281, "global_step": 232666, "epoch": 1384} {"train_loss": -11.504060745239258, "global_step": 232667, "epoch": 1384} {"train_loss": -10.991968154907227, "global_step": 232668, "epoch": 1384} {"train_loss": -11.541933059692383, "global_step": 232669, "epoch": 1384} {"train_loss": -10.503838539123535, "global_step": 232670, "epoch": 1384} {"train_loss": -10.590179443359375, "global_step": 232671, "epoch": 1384} {"train_loss": -11.593740463256836, "global_step": 232672, "epoch": 1384} {"train_loss": -10.806659698486328, "global_step": 232673, "epoch": 1384} {"train_loss": -9.57229232788086, "global_step": 232674, "epoch": 1384} {"train_loss": -11.369327545166016, "global_step": 232675, "epoch": 1384} {"train_loss": -10.396172523498535, "global_step": 232676, "epoch": 1384} {"train_loss": -10.289969444274902, "global_step": 232677, "epoch": 1384} {"train_loss": -11.389862060546875, "global_step": 232678, "epoch": 1384} {"train_loss": -11.497549670083183, "global_step": 232679, "epoch": 1384, "val_loss": 262106.6875} {"train_loss": -11.501953125, "global_step": 232680, "epoch": 1385} {"train_loss": -10.432945251464844, "global_step": 232681, "epoch": 1385} {"train_loss": -11.429187774658203, "global_step": 232682, "epoch": 1385} {"train_loss": -10.66660213470459, "global_step": 232683, "epoch": 1385} {"train_loss": -11.770285606384277, "global_step": 232684, "epoch": 1385} {"train_loss": -11.19796371459961, "global_step": 232685, "epoch": 1385} {"train_loss": -11.531950950622559, "global_step": 232686, "epoch": 1385} {"train_loss": -11.041143417358398, "global_step": 232687, "epoch": 1385} {"train_loss": -11.155948638916016, "global_step": 232688, "epoch": 1385} {"train_loss": -11.594983100891113, "global_step": 232689, "epoch": 1385} {"train_loss": -11.276298522949219, "global_step": 232690, "epoch": 1385} {"train_loss": -11.025296211242676, "global_step": 232691, "epoch": 1385} {"train_loss": -11.195859909057617, "global_step": 232692, "epoch": 1385} {"train_loss": -11.497148513793945, "global_step": 232693, "epoch": 1385} {"train_loss": -11.645065307617188, "global_step": 232694, "epoch": 1385} {"train_loss": -11.201238632202148, "global_step": 232695, "epoch": 1385} {"train_loss": -11.255971908569336, "global_step": 232696, "epoch": 1385} {"train_loss": -11.556558609008789, "global_step": 232697, "epoch": 1385} {"train_loss": -11.370129585266113, "global_step": 232698, "epoch": 1385} {"train_loss": -11.530707359313965, "global_step": 232699, "epoch": 1385} {"train_loss": -11.092458724975586, "global_step": 232700, "epoch": 1385} {"train_loss": -11.613712310791016, "global_step": 232701, "epoch": 1385} {"train_loss": -11.284527778625488, "global_step": 232702, "epoch": 1385} {"train_loss": -11.490330696105957, "global_step": 232703, "epoch": 1385} {"train_loss": -11.75365924835205, "global_step": 232704, "epoch": 1385} {"train_loss": -11.48265552520752, "global_step": 232705, "epoch": 1385} {"train_loss": -11.56142807006836, "global_step": 232706, "epoch": 1385} {"train_loss": -11.253791809082031, "global_step": 232707, "epoch": 1385} {"train_loss": -11.48766803741455, "global_step": 232708, "epoch": 1385} {"train_loss": -11.434534072875977, "global_step": 232709, "epoch": 1385} {"train_loss": -11.651206016540527, "global_step": 232710, "epoch": 1385} {"train_loss": -11.84561824798584, "global_step": 232711, "epoch": 1385} {"train_loss": -11.919242858886719, "global_step": 232712, "epoch": 1385} {"train_loss": -11.672768592834473, "global_step": 232713, "epoch": 1385} {"train_loss": -11.557487487792969, "global_step": 232714, "epoch": 1385} {"train_loss": -11.723654747009277, "global_step": 232715, "epoch": 1385} {"train_loss": -11.723162651062012, "global_step": 232716, "epoch": 1385} {"train_loss": -11.682317733764648, "global_step": 232717, "epoch": 1385} {"train_loss": -11.595481872558594, "global_step": 232718, "epoch": 1385} {"train_loss": -11.830496788024902, "global_step": 232719, "epoch": 1385} {"train_loss": -11.708967208862305, "global_step": 232720, "epoch": 1385} {"train_loss": -11.790412902832031, "global_step": 232721, "epoch": 1385} {"train_loss": -11.888688087463379, "global_step": 232722, "epoch": 1385} {"train_loss": -11.766992568969727, "global_step": 232723, "epoch": 1385} {"train_loss": -11.660808563232422, "global_step": 232724, "epoch": 1385} {"train_loss": -12.025219917297363, "global_step": 232725, "epoch": 1385} {"train_loss": -11.61233139038086, "global_step": 232726, "epoch": 1385} {"train_loss": -11.821321487426758, "global_step": 232727, "epoch": 1385} {"train_loss": -12.00165843963623, "global_step": 232728, "epoch": 1385} {"train_loss": -11.818284034729004, "global_step": 232729, "epoch": 1385} {"train_loss": -11.780027389526367, "global_step": 232730, "epoch": 1385} {"train_loss": -11.907770156860352, "global_step": 232731, "epoch": 1385} {"train_loss": -11.89958381652832, "global_step": 232732, "epoch": 1385} {"train_loss": -11.679113388061523, "global_step": 232733, "epoch": 1385} {"train_loss": -11.769355773925781, "global_step": 232734, "epoch": 1385} {"train_loss": -11.6666898727417, "global_step": 232735, "epoch": 1385} {"train_loss": -11.867966651916504, "global_step": 232736, "epoch": 1385} {"train_loss": -11.690752983093262, "global_step": 232737, "epoch": 1385} {"train_loss": -11.650259971618652, "global_step": 232738, "epoch": 1385} {"train_loss": -11.849932670593262, "global_step": 232739, "epoch": 1385} {"train_loss": -11.866649627685547, "global_step": 232740, "epoch": 1385} {"train_loss": -11.714349746704102, "global_step": 232741, "epoch": 1385} {"train_loss": -11.86539077758789, "global_step": 232742, "epoch": 1385} {"train_loss": -11.666553497314453, "global_step": 232743, "epoch": 1385} {"train_loss": -11.437984466552734, "global_step": 232744, "epoch": 1385} {"train_loss": -12.017721176147461, "global_step": 232745, "epoch": 1385} {"train_loss": -11.615510940551758, "global_step": 232746, "epoch": 1385} {"train_loss": -11.957497596740723, "global_step": 232747, "epoch": 1385} {"train_loss": -11.935150146484375, "global_step": 232748, "epoch": 1385} {"train_loss": -12.02987289428711, "global_step": 232749, "epoch": 1385} {"train_loss": -11.864255905151367, "global_step": 232750, "epoch": 1385} {"train_loss": -12.039447784423828, "global_step": 232751, "epoch": 1385} {"train_loss": -11.850775718688965, "global_step": 232752, "epoch": 1385} {"train_loss": -11.703986167907715, "global_step": 232753, "epoch": 1385} {"train_loss": -11.54965591430664, "global_step": 232754, "epoch": 1385} {"train_loss": -11.85498046875, "global_step": 232755, "epoch": 1385} {"train_loss": -11.992015838623047, "global_step": 232756, "epoch": 1385} {"train_loss": -11.56418228149414, "global_step": 232757, "epoch": 1385} {"train_loss": -11.780108451843262, "global_step": 232758, "epoch": 1385} {"train_loss": -11.519169807434082, "global_step": 232759, "epoch": 1385} {"train_loss": -11.857398986816406, "global_step": 232760, "epoch": 1385} {"train_loss": -11.199788093566895, "global_step": 232761, "epoch": 1385} {"train_loss": -10.923665046691895, "global_step": 232762, "epoch": 1385} {"train_loss": -11.861886024475098, "global_step": 232763, "epoch": 1385} {"train_loss": -10.63054370880127, "global_step": 232764, "epoch": 1385} {"train_loss": -11.030652046203613, "global_step": 232765, "epoch": 1385} {"train_loss": -9.813339233398438, "global_step": 232766, "epoch": 1385} {"train_loss": -11.317895889282227, "global_step": 232767, "epoch": 1385} {"train_loss": -10.516702651977539, "global_step": 232768, "epoch": 1385} {"train_loss": -10.80539321899414, "global_step": 232769, "epoch": 1385} {"train_loss": -10.679817199707031, "global_step": 232770, "epoch": 1385} {"train_loss": -11.430421829223633, "global_step": 232771, "epoch": 1385} {"train_loss": -10.781109809875488, "global_step": 232772, "epoch": 1385} {"train_loss": -9.426294326782227, "global_step": 232773, "epoch": 1385} {"train_loss": -11.399429321289062, "global_step": 232774, "epoch": 1385} {"train_loss": -10.139742851257324, "global_step": 232775, "epoch": 1385} {"train_loss": -10.259238243103027, "global_step": 232776, "epoch": 1385} {"train_loss": -11.15791130065918, "global_step": 232777, "epoch": 1385} {"train_loss": -9.871728897094727, "global_step": 232778, "epoch": 1385} {"train_loss": -10.835792541503906, "global_step": 232779, "epoch": 1385} {"train_loss": -10.733991622924805, "global_step": 232780, "epoch": 1385} {"train_loss": -10.802846908569336, "global_step": 232781, "epoch": 1385} {"train_loss": -10.810144424438477, "global_step": 232782, "epoch": 1385} {"train_loss": -11.155357360839844, "global_step": 232783, "epoch": 1385} {"train_loss": -10.912208557128906, "global_step": 232784, "epoch": 1385} {"train_loss": -11.132696151733398, "global_step": 232785, "epoch": 1385} {"train_loss": -11.300045013427734, "global_step": 232786, "epoch": 1385} {"train_loss": -11.078956604003906, "global_step": 232787, "epoch": 1385} {"train_loss": -11.297836303710938, "global_step": 232788, "epoch": 1385} {"train_loss": -10.812500953674316, "global_step": 232789, "epoch": 1385} {"train_loss": -11.259765625, "global_step": 232790, "epoch": 1385} {"train_loss": -11.148755073547363, "global_step": 232791, "epoch": 1385} {"train_loss": -10.886326789855957, "global_step": 232792, "epoch": 1385} {"train_loss": -11.247200965881348, "global_step": 232793, "epoch": 1385} {"train_loss": -11.401867866516113, "global_step": 232794, "epoch": 1385} {"train_loss": -11.288192749023438, "global_step": 232795, "epoch": 1385} {"train_loss": -11.53003215789795, "global_step": 232796, "epoch": 1385} {"train_loss": -11.058454513549805, "global_step": 232797, "epoch": 1385} {"train_loss": -11.525754928588867, "global_step": 232798, "epoch": 1385} {"train_loss": -11.17266845703125, "global_step": 232799, "epoch": 1385} {"train_loss": -11.412897109985352, "global_step": 232800, "epoch": 1385} {"train_loss": -11.320856094360352, "global_step": 232801, "epoch": 1385} {"train_loss": -11.097996711730957, "global_step": 232802, "epoch": 1385} {"train_loss": -10.795010566711426, "global_step": 232803, "epoch": 1385} {"train_loss": -11.505973815917969, "global_step": 232804, "epoch": 1385} {"train_loss": -10.951314926147461, "global_step": 232805, "epoch": 1385} {"train_loss": -11.376033782958984, "global_step": 232806, "epoch": 1385} {"train_loss": -11.50786018371582, "global_step": 232807, "epoch": 1385} {"train_loss": -11.54121208190918, "global_step": 232808, "epoch": 1385} {"train_loss": -11.699480056762695, "global_step": 232809, "epoch": 1385} {"train_loss": -11.680952072143555, "global_step": 232810, "epoch": 1385} {"train_loss": -11.687328338623047, "global_step": 232811, "epoch": 1385} {"train_loss": -11.732087135314941, "global_step": 232812, "epoch": 1385} {"train_loss": -11.6453857421875, "global_step": 232813, "epoch": 1385} {"train_loss": -11.491883277893066, "global_step": 232814, "epoch": 1385} {"train_loss": -11.77427864074707, "global_step": 232815, "epoch": 1385} {"train_loss": -11.898652076721191, "global_step": 232816, "epoch": 1385} {"train_loss": -11.561885833740234, "global_step": 232817, "epoch": 1385} {"train_loss": -11.796548843383789, "global_step": 232818, "epoch": 1385} {"train_loss": -11.696979522705078, "global_step": 232819, "epoch": 1385} {"train_loss": -11.774324417114258, "global_step": 232820, "epoch": 1385} {"train_loss": -11.86252212524414, "global_step": 232821, "epoch": 1385} {"train_loss": -11.723209381103516, "global_step": 232822, "epoch": 1385} {"train_loss": -11.860757827758789, "global_step": 232823, "epoch": 1385} {"train_loss": -11.913373947143555, "global_step": 232824, "epoch": 1385} {"train_loss": -11.771793365478516, "global_step": 232825, "epoch": 1385} {"train_loss": -11.886821746826172, "global_step": 232826, "epoch": 1385} {"train_loss": -11.889700889587402, "global_step": 232827, "epoch": 1385} {"train_loss": -11.718854904174805, "global_step": 232828, "epoch": 1385} {"train_loss": -11.791799545288086, "global_step": 232829, "epoch": 1385} {"train_loss": -11.823685646057129, "global_step": 232830, "epoch": 1385} {"train_loss": -11.718692779541016, "global_step": 232831, "epoch": 1385} {"train_loss": -11.82436752319336, "global_step": 232832, "epoch": 1385} {"train_loss": -11.843353271484375, "global_step": 232833, "epoch": 1385} {"train_loss": -11.863672256469727, "global_step": 232834, "epoch": 1385} {"train_loss": -11.828067779541016, "global_step": 232835, "epoch": 1385} {"train_loss": -11.589502334594727, "global_step": 232836, "epoch": 1385} {"train_loss": -11.840082168579102, "global_step": 232837, "epoch": 1385} {"train_loss": -11.979284286499023, "global_step": 232838, "epoch": 1385} {"train_loss": -11.653571128845215, "global_step": 232839, "epoch": 1385} {"train_loss": -11.56577205657959, "global_step": 232840, "epoch": 1385} {"train_loss": -11.992103576660156, "global_step": 232841, "epoch": 1385} {"train_loss": -11.733848571777344, "global_step": 232842, "epoch": 1385} {"train_loss": -12.01048755645752, "global_step": 232843, "epoch": 1385} {"train_loss": -11.574016571044922, "global_step": 232844, "epoch": 1385} {"train_loss": -12.008464813232422, "global_step": 232845, "epoch": 1385} {"train_loss": -12.06698226928711, "global_step": 232846, "epoch": 1385} {"train_loss": -11.48246655577705, "global_step": 232847, "epoch": 1385, "val_loss": 263220.78125, "train_action_mse_error": 1.7894506454467773} {"train_loss": -11.842071533203125, "global_step": 232848, "epoch": 1386} {"train_loss": -12.051170349121094, "global_step": 232849, "epoch": 1386} {"train_loss": -12.143465042114258, "global_step": 232850, "epoch": 1386} {"train_loss": -12.105515480041504, "global_step": 232851, "epoch": 1386} {"train_loss": -12.00800895690918, "global_step": 232852, "epoch": 1386} {"train_loss": -12.100125312805176, "global_step": 232853, "epoch": 1386} {"train_loss": -11.993780136108398, "global_step": 232854, "epoch": 1386} {"train_loss": -12.147411346435547, "global_step": 232855, "epoch": 1386} {"train_loss": -11.874519348144531, "global_step": 232856, "epoch": 1386} {"train_loss": -12.008707046508789, "global_step": 232857, "epoch": 1386} {"train_loss": -11.895928382873535, "global_step": 232858, "epoch": 1386} {"train_loss": -11.843643188476562, "global_step": 232859, "epoch": 1386} {"train_loss": -11.841325759887695, "global_step": 232860, "epoch": 1386} {"train_loss": -11.219304084777832, "global_step": 232861, "epoch": 1386} {"train_loss": -10.396848678588867, "global_step": 232862, "epoch": 1386} {"train_loss": -11.084903717041016, "global_step": 232863, "epoch": 1386} {"train_loss": -11.685598373413086, "global_step": 232864, "epoch": 1386} {"train_loss": -10.018877983093262, "global_step": 232865, "epoch": 1386} {"train_loss": -10.224851608276367, "global_step": 232866, "epoch": 1386} {"train_loss": -11.074793815612793, "global_step": 232867, "epoch": 1386} {"train_loss": -10.681756973266602, "global_step": 232868, "epoch": 1386} {"train_loss": -10.542713165283203, "global_step": 232869, "epoch": 1386} {"train_loss": -11.170358657836914, "global_step": 232870, "epoch": 1386} {"train_loss": -9.949331283569336, "global_step": 232871, "epoch": 1386} {"train_loss": -11.30099105834961, "global_step": 232872, "epoch": 1386} {"train_loss": -10.016843795776367, "global_step": 232873, "epoch": 1386} {"train_loss": -7.422126770019531, "global_step": 232874, "epoch": 1386} {"train_loss": -9.174118041992188, "global_step": 232875, "epoch": 1386} {"train_loss": -10.450531005859375, "global_step": 232876, "epoch": 1386} {"train_loss": -8.661535263061523, "global_step": 232877, "epoch": 1386} {"train_loss": -8.869796752929688, "global_step": 232878, "epoch": 1386} {"train_loss": -7.170407295227051, "global_step": 232879, "epoch": 1386} {"train_loss": -8.173541069030762, "global_step": 232880, "epoch": 1386} {"train_loss": -8.454007148742676, "global_step": 232881, "epoch": 1386} {"train_loss": -8.925470352172852, "global_step": 232882, "epoch": 1386} {"train_loss": -9.342348098754883, "global_step": 232883, "epoch": 1386} {"train_loss": -9.202184677124023, "global_step": 232884, "epoch": 1386} {"train_loss": -8.055793762207031, "global_step": 232885, "epoch": 1386} {"train_loss": -9.638104438781738, "global_step": 232886, "epoch": 1386} {"train_loss": -10.808755874633789, "global_step": 232887, "epoch": 1386} {"train_loss": -9.392699241638184, "global_step": 232888, "epoch": 1386} {"train_loss": -10.958477020263672, "global_step": 232889, "epoch": 1386} {"train_loss": -10.359441757202148, "global_step": 232890, "epoch": 1386} {"train_loss": -10.344104766845703, "global_step": 232891, "epoch": 1386} {"train_loss": -10.882026672363281, "global_step": 232892, "epoch": 1386} {"train_loss": -11.205467224121094, "global_step": 232893, "epoch": 1386} {"train_loss": -10.829824447631836, "global_step": 232894, "epoch": 1386} {"train_loss": -11.293572425842285, "global_step": 232895, "epoch": 1386} {"train_loss": -11.058095932006836, "global_step": 232896, "epoch": 1386} {"train_loss": -11.47146224975586, "global_step": 232897, "epoch": 1386} {"train_loss": -11.21832275390625, "global_step": 232898, "epoch": 1386} {"train_loss": -11.328908920288086, "global_step": 232899, "epoch": 1386} {"train_loss": -11.153087615966797, "global_step": 232900, "epoch": 1386} {"train_loss": -11.356907844543457, "global_step": 232901, "epoch": 1386} {"train_loss": -11.063167572021484, "global_step": 232902, "epoch": 1386} {"train_loss": -11.205390930175781, "global_step": 232903, "epoch": 1386} {"train_loss": -11.352242469787598, "global_step": 232904, "epoch": 1386} {"train_loss": -11.127150535583496, "global_step": 232905, "epoch": 1386} {"train_loss": -11.676229476928711, "global_step": 232906, "epoch": 1386} {"train_loss": -11.03662109375, "global_step": 232907, "epoch": 1386} {"train_loss": -11.706001281738281, "global_step": 232908, "epoch": 1386} {"train_loss": -11.151117324829102, "global_step": 232909, "epoch": 1386} {"train_loss": -11.455591201782227, "global_step": 232910, "epoch": 1386} {"train_loss": -11.482125282287598, "global_step": 232911, "epoch": 1386} {"train_loss": -11.460926055908203, "global_step": 232912, "epoch": 1386} {"train_loss": -11.44963264465332, "global_step": 232913, "epoch": 1386} {"train_loss": -11.716055870056152, "global_step": 232914, "epoch": 1386} {"train_loss": -11.463926315307617, "global_step": 232915, "epoch": 1386} {"train_loss": -11.691633224487305, "global_step": 232916, "epoch": 1386} {"train_loss": -11.537325859069824, "global_step": 232917, "epoch": 1386} {"train_loss": -11.571894645690918, "global_step": 232918, "epoch": 1386} {"train_loss": -11.717737197875977, "global_step": 232919, "epoch": 1386} {"train_loss": -11.499410629272461, "global_step": 232920, "epoch": 1386} {"train_loss": -11.737119674682617, "global_step": 232921, "epoch": 1386} {"train_loss": -11.694108963012695, "global_step": 232922, "epoch": 1386} {"train_loss": -11.72903060913086, "global_step": 232923, "epoch": 1386} {"train_loss": -11.641857147216797, "global_step": 232924, "epoch": 1386} {"train_loss": -11.560873031616211, "global_step": 232925, "epoch": 1386} {"train_loss": -11.495027542114258, "global_step": 232926, "epoch": 1386} {"train_loss": -11.850379943847656, "global_step": 232927, "epoch": 1386} {"train_loss": -11.709762573242188, "global_step": 232928, "epoch": 1386} {"train_loss": -11.84146499633789, "global_step": 232929, "epoch": 1386} {"train_loss": -11.644170761108398, "global_step": 232930, "epoch": 1386} {"train_loss": -11.786823272705078, "global_step": 232931, "epoch": 1386} {"train_loss": -11.816888809204102, "global_step": 232932, "epoch": 1386} {"train_loss": -11.753595352172852, "global_step": 232933, "epoch": 1386} {"train_loss": -11.918813705444336, "global_step": 232934, "epoch": 1386} {"train_loss": -11.919331550598145, "global_step": 232935, "epoch": 1386} {"train_loss": -11.921418190002441, "global_step": 232936, "epoch": 1386} {"train_loss": -11.838092803955078, "global_step": 232937, "epoch": 1386} {"train_loss": -11.802270889282227, "global_step": 232938, "epoch": 1386} {"train_loss": -12.107272148132324, "global_step": 232939, "epoch": 1386} {"train_loss": -12.028526306152344, "global_step": 232940, "epoch": 1386} {"train_loss": -11.675743103027344, "global_step": 232941, "epoch": 1386} {"train_loss": -12.023538589477539, "global_step": 232942, "epoch": 1386} {"train_loss": -11.91794490814209, "global_step": 232943, "epoch": 1386} {"train_loss": -11.950456619262695, "global_step": 232944, "epoch": 1386} {"train_loss": -11.834162712097168, "global_step": 232945, "epoch": 1386} {"train_loss": -11.761406898498535, "global_step": 232946, "epoch": 1386} {"train_loss": -11.524486541748047, "global_step": 232947, "epoch": 1386} {"train_loss": -12.059515953063965, "global_step": 232948, "epoch": 1386} {"train_loss": -11.646231651306152, "global_step": 232949, "epoch": 1386} {"train_loss": -11.653388977050781, "global_step": 232950, "epoch": 1386} {"train_loss": -11.906229972839355, "global_step": 232951, "epoch": 1386} {"train_loss": -11.904480934143066, "global_step": 232952, "epoch": 1386} {"train_loss": -11.621891975402832, "global_step": 232953, "epoch": 1386} {"train_loss": -11.782857894897461, "global_step": 232954, "epoch": 1386} {"train_loss": -11.891031265258789, "global_step": 232955, "epoch": 1386} {"train_loss": -11.975170135498047, "global_step": 232956, "epoch": 1386} {"train_loss": -12.145879745483398, "global_step": 232957, "epoch": 1386} {"train_loss": -11.76643180847168, "global_step": 232958, "epoch": 1386} {"train_loss": -12.021219253540039, "global_step": 232959, "epoch": 1386} {"train_loss": -11.851106643676758, "global_step": 232960, "epoch": 1386} {"train_loss": -12.167067527770996, "global_step": 232961, "epoch": 1386} {"train_loss": -11.733020782470703, "global_step": 232962, "epoch": 1386} {"train_loss": -12.076140403747559, "global_step": 232963, "epoch": 1386} {"train_loss": -12.150694847106934, "global_step": 232964, "epoch": 1386} {"train_loss": -11.873248100280762, "global_step": 232965, "epoch": 1386} {"train_loss": -12.14986801147461, "global_step": 232966, "epoch": 1386} {"train_loss": -11.560747146606445, "global_step": 232967, "epoch": 1386} {"train_loss": -10.994935989379883, "global_step": 232968, "epoch": 1386} {"train_loss": -11.468486785888672, "global_step": 232969, "epoch": 1386} {"train_loss": -11.897858619689941, "global_step": 232970, "epoch": 1386} {"train_loss": -11.863374710083008, "global_step": 232971, "epoch": 1386} {"train_loss": -12.062460899353027, "global_step": 232972, "epoch": 1386} {"train_loss": -12.130697250366211, "global_step": 232973, "epoch": 1386} {"train_loss": -11.898551940917969, "global_step": 232974, "epoch": 1386} {"train_loss": -11.777690887451172, "global_step": 232975, "epoch": 1386} {"train_loss": -11.790316581726074, "global_step": 232976, "epoch": 1386} {"train_loss": -11.941322326660156, "global_step": 232977, "epoch": 1386} {"train_loss": -11.777721405029297, "global_step": 232978, "epoch": 1386} {"train_loss": -11.602426528930664, "global_step": 232979, "epoch": 1386} {"train_loss": -12.092933654785156, "global_step": 232980, "epoch": 1386} {"train_loss": -11.694517135620117, "global_step": 232981, "epoch": 1386} {"train_loss": -11.660639762878418, "global_step": 232982, "epoch": 1386} {"train_loss": -11.72891902923584, "global_step": 232983, "epoch": 1386} {"train_loss": -11.217288970947266, "global_step": 232984, "epoch": 1386} {"train_loss": -10.431708335876465, "global_step": 232985, "epoch": 1386} {"train_loss": -11.156786918640137, "global_step": 232986, "epoch": 1386} {"train_loss": -12.033905982971191, "global_step": 232987, "epoch": 1386} {"train_loss": -10.813533782958984, "global_step": 232988, "epoch": 1386} {"train_loss": -9.936861038208008, "global_step": 232989, "epoch": 1386} {"train_loss": -11.604336738586426, "global_step": 232990, "epoch": 1386} {"train_loss": -10.935970306396484, "global_step": 232991, "epoch": 1386} {"train_loss": -10.054330825805664, "global_step": 232992, "epoch": 1386} {"train_loss": -11.20154094696045, "global_step": 232993, "epoch": 1386} {"train_loss": -11.882583618164062, "global_step": 232994, "epoch": 1386} {"train_loss": -10.594547271728516, "global_step": 232995, "epoch": 1386} {"train_loss": -10.643305778503418, "global_step": 232996, "epoch": 1386} {"train_loss": -11.805076599121094, "global_step": 232997, "epoch": 1386} {"train_loss": -10.67903995513916, "global_step": 232998, "epoch": 1386} {"train_loss": -11.459001541137695, "global_step": 232999, "epoch": 1386} {"train_loss": -11.786839485168457, "global_step": 233000, "epoch": 1386} {"train_loss": -11.182605743408203, "global_step": 233001, "epoch": 1386} {"train_loss": -11.316047668457031, "global_step": 233002, "epoch": 1386} {"train_loss": -11.655322074890137, "global_step": 233003, "epoch": 1386} {"train_loss": -11.235485076904297, "global_step": 233004, "epoch": 1386} {"train_loss": -11.573075294494629, "global_step": 233005, "epoch": 1386} {"train_loss": -11.52910041809082, "global_step": 233006, "epoch": 1386} {"train_loss": -10.998504638671875, "global_step": 233007, "epoch": 1386} {"train_loss": -11.44919204711914, "global_step": 233008, "epoch": 1386} {"train_loss": -11.545438766479492, "global_step": 233009, "epoch": 1386} {"train_loss": -11.567562103271484, "global_step": 233010, "epoch": 1386} {"train_loss": -11.498897552490234, "global_step": 233011, "epoch": 1386} {"train_loss": -11.622490882873535, "global_step": 233012, "epoch": 1386} {"train_loss": -11.74603271484375, "global_step": 233013, "epoch": 1386} {"train_loss": -11.515436172485352, "global_step": 233014, "epoch": 1386} {"train_loss": -11.27884840965271, "global_step": 233015, "epoch": 1386, "val_loss": 263041.9375} {"train_loss": -11.459320068359375, "global_step": 233016, "epoch": 1387} {"train_loss": -11.803349494934082, "global_step": 233017, "epoch": 1387} {"train_loss": -11.476922035217285, "global_step": 233018, "epoch": 1387} {"train_loss": -11.633548736572266, "global_step": 233019, "epoch": 1387} {"train_loss": -11.829503059387207, "global_step": 233020, "epoch": 1387} {"train_loss": -11.832218170166016, "global_step": 233021, "epoch": 1387} {"train_loss": -11.965812683105469, "global_step": 233022, "epoch": 1387} {"train_loss": -11.900118827819824, "global_step": 233023, "epoch": 1387} {"train_loss": -11.851726531982422, "global_step": 233024, "epoch": 1387} {"train_loss": -11.786962509155273, "global_step": 233025, "epoch": 1387} {"train_loss": -11.697368621826172, "global_step": 233026, "epoch": 1387} {"train_loss": -11.789138793945312, "global_step": 233027, "epoch": 1387} {"train_loss": -11.736821174621582, "global_step": 233028, "epoch": 1387} {"train_loss": -11.757501602172852, "global_step": 233029, "epoch": 1387} {"train_loss": -11.763367652893066, "global_step": 233030, "epoch": 1387} {"train_loss": -11.844746589660645, "global_step": 233031, "epoch": 1387} {"train_loss": -11.703475952148438, "global_step": 233032, "epoch": 1387} {"train_loss": -11.998459815979004, "global_step": 233033, "epoch": 1387} {"train_loss": -11.646726608276367, "global_step": 233034, "epoch": 1387} {"train_loss": -11.809488296508789, "global_step": 233035, "epoch": 1387} {"train_loss": -11.628032684326172, "global_step": 233036, "epoch": 1387} {"train_loss": -11.41195297241211, "global_step": 233037, "epoch": 1387} {"train_loss": -11.657796859741211, "global_step": 233038, "epoch": 1387} {"train_loss": -11.626392364501953, "global_step": 233039, "epoch": 1387} {"train_loss": -11.271270751953125, "global_step": 233040, "epoch": 1387} {"train_loss": -11.939666748046875, "global_step": 233041, "epoch": 1387} {"train_loss": -11.424206733703613, "global_step": 233042, "epoch": 1387} {"train_loss": -11.78729248046875, "global_step": 233043, "epoch": 1387} {"train_loss": -11.534789085388184, "global_step": 233044, "epoch": 1387} {"train_loss": -11.181337356567383, "global_step": 233045, "epoch": 1387} {"train_loss": -11.767280578613281, "global_step": 233046, "epoch": 1387} {"train_loss": -11.626466751098633, "global_step": 233047, "epoch": 1387} {"train_loss": -11.645278930664062, "global_step": 233048, "epoch": 1387} {"train_loss": -11.77764892578125, "global_step": 233049, "epoch": 1387} {"train_loss": -11.45056438446045, "global_step": 233050, "epoch": 1387} {"train_loss": -11.787399291992188, "global_step": 233051, "epoch": 1387} {"train_loss": -11.62961483001709, "global_step": 233052, "epoch": 1387} {"train_loss": -12.050098419189453, "global_step": 233053, "epoch": 1387} {"train_loss": -11.703514099121094, "global_step": 233054, "epoch": 1387} {"train_loss": -11.878878593444824, "global_step": 233055, "epoch": 1387} {"train_loss": -11.812238693237305, "global_step": 233056, "epoch": 1387} {"train_loss": -11.86056900024414, "global_step": 233057, "epoch": 1387} {"train_loss": -11.843331336975098, "global_step": 233058, "epoch": 1387} {"train_loss": -11.608847618103027, "global_step": 233059, "epoch": 1387} {"train_loss": -11.445768356323242, "global_step": 233060, "epoch": 1387} {"train_loss": -11.777453422546387, "global_step": 233061, "epoch": 1387} {"train_loss": -11.649053573608398, "global_step": 233062, "epoch": 1387} {"train_loss": -11.87723445892334, "global_step": 233063, "epoch": 1387} {"train_loss": -11.467676162719727, "global_step": 233064, "epoch": 1387} {"train_loss": -11.601774215698242, "global_step": 233065, "epoch": 1387} {"train_loss": -11.570524215698242, "global_step": 233066, "epoch": 1387} {"train_loss": -11.348920822143555, "global_step": 233067, "epoch": 1387} {"train_loss": -11.862699508666992, "global_step": 233068, "epoch": 1387} {"train_loss": -11.325499534606934, "global_step": 233069, "epoch": 1387} {"train_loss": -10.7398042678833, "global_step": 233070, "epoch": 1387} {"train_loss": -11.394505500793457, "global_step": 233071, "epoch": 1387} {"train_loss": -10.259459495544434, "global_step": 233072, "epoch": 1387} {"train_loss": -11.156537055969238, "global_step": 233073, "epoch": 1387} {"train_loss": -10.682372093200684, "global_step": 233074, "epoch": 1387} {"train_loss": -10.733545303344727, "global_step": 233075, "epoch": 1387} {"train_loss": -10.222891807556152, "global_step": 233076, "epoch": 1387} {"train_loss": -9.405729293823242, "global_step": 233077, "epoch": 1387} {"train_loss": -10.594197273254395, "global_step": 233078, "epoch": 1387} {"train_loss": -9.164619445800781, "global_step": 233079, "epoch": 1387} {"train_loss": -10.399578094482422, "global_step": 233080, "epoch": 1387} {"train_loss": -9.187471389770508, "global_step": 233081, "epoch": 1387} {"train_loss": -10.707193374633789, "global_step": 233082, "epoch": 1387} {"train_loss": -10.060044288635254, "global_step": 233083, "epoch": 1387} {"train_loss": -10.397431373596191, "global_step": 233084, "epoch": 1387} {"train_loss": -10.737386703491211, "global_step": 233085, "epoch": 1387} {"train_loss": -10.997925758361816, "global_step": 233086, "epoch": 1387} {"train_loss": -10.18262767791748, "global_step": 233087, "epoch": 1387} {"train_loss": -11.283443450927734, "global_step": 233088, "epoch": 1387} {"train_loss": -10.495285987854004, "global_step": 233089, "epoch": 1387} {"train_loss": -11.319238662719727, "global_step": 233090, "epoch": 1387} {"train_loss": -10.402372360229492, "global_step": 233091, "epoch": 1387} {"train_loss": -11.053160667419434, "global_step": 233092, "epoch": 1387} {"train_loss": -10.64527702331543, "global_step": 233093, "epoch": 1387} {"train_loss": -10.829136848449707, "global_step": 233094, "epoch": 1387} {"train_loss": -10.927644729614258, "global_step": 233095, "epoch": 1387} {"train_loss": -11.486960411071777, "global_step": 233096, "epoch": 1387} {"train_loss": -11.126521110534668, "global_step": 233097, "epoch": 1387} {"train_loss": -11.381410598754883, "global_step": 233098, "epoch": 1387} {"train_loss": -11.126057624816895, "global_step": 233099, "epoch": 1387} {"train_loss": -10.902713775634766, "global_step": 233100, "epoch": 1387} {"train_loss": -11.376800537109375, "global_step": 233101, "epoch": 1387} {"train_loss": -10.888967514038086, "global_step": 233102, "epoch": 1387} {"train_loss": -11.4905366897583, "global_step": 233103, "epoch": 1387} {"train_loss": -11.101217269897461, "global_step": 233104, "epoch": 1387} {"train_loss": -11.335016250610352, "global_step": 233105, "epoch": 1387} {"train_loss": -11.144567489624023, "global_step": 233106, "epoch": 1387} {"train_loss": -11.604450225830078, "global_step": 233107, "epoch": 1387} {"train_loss": -11.325857162475586, "global_step": 233108, "epoch": 1387} {"train_loss": -11.286239624023438, "global_step": 233109, "epoch": 1387} {"train_loss": -11.716585159301758, "global_step": 233110, "epoch": 1387} {"train_loss": -11.356935501098633, "global_step": 233111, "epoch": 1387} {"train_loss": -11.736518859863281, "global_step": 233112, "epoch": 1387} {"train_loss": -11.764013290405273, "global_step": 233113, "epoch": 1387} {"train_loss": -11.691972732543945, "global_step": 233114, "epoch": 1387} {"train_loss": -11.904151916503906, "global_step": 233115, "epoch": 1387} {"train_loss": -11.499231338500977, "global_step": 233116, "epoch": 1387} {"train_loss": -11.470874786376953, "global_step": 233117, "epoch": 1387} {"train_loss": -11.417181015014648, "global_step": 233118, "epoch": 1387} {"train_loss": -11.753395080566406, "global_step": 233119, "epoch": 1387} {"train_loss": -11.752778053283691, "global_step": 233120, "epoch": 1387} {"train_loss": -11.734394073486328, "global_step": 233121, "epoch": 1387} {"train_loss": -11.452768325805664, "global_step": 233122, "epoch": 1387} {"train_loss": -11.734832763671875, "global_step": 233123, "epoch": 1387} {"train_loss": -11.926207542419434, "global_step": 233124, "epoch": 1387} {"train_loss": -11.70908260345459, "global_step": 233125, "epoch": 1387} {"train_loss": -11.66550064086914, "global_step": 233126, "epoch": 1387} {"train_loss": -11.674957275390625, "global_step": 233127, "epoch": 1387} {"train_loss": -11.609699249267578, "global_step": 233128, "epoch": 1387} {"train_loss": -11.63733196258545, "global_step": 233129, "epoch": 1387} {"train_loss": -11.866007804870605, "global_step": 233130, "epoch": 1387} {"train_loss": -11.687113761901855, "global_step": 233131, "epoch": 1387} {"train_loss": -11.854970932006836, "global_step": 233132, "epoch": 1387} {"train_loss": -11.768747329711914, "global_step": 233133, "epoch": 1387} {"train_loss": -11.858137130737305, "global_step": 233134, "epoch": 1387} {"train_loss": -11.715137481689453, "global_step": 233135, "epoch": 1387} {"train_loss": -11.756996154785156, "global_step": 233136, "epoch": 1387} {"train_loss": -11.685522079467773, "global_step": 233137, "epoch": 1387} {"train_loss": -11.96487045288086, "global_step": 233138, "epoch": 1387} {"train_loss": -11.656484603881836, "global_step": 233139, "epoch": 1387} {"train_loss": -11.772398948669434, "global_step": 233140, "epoch": 1387} {"train_loss": -11.654707908630371, "global_step": 233141, "epoch": 1387} {"train_loss": -11.771751403808594, "global_step": 233142, "epoch": 1387} {"train_loss": -11.672136306762695, "global_step": 233143, "epoch": 1387} {"train_loss": -12.010543823242188, "global_step": 233144, "epoch": 1387} {"train_loss": -11.961142539978027, "global_step": 233145, "epoch": 1387} {"train_loss": -11.794502258300781, "global_step": 233146, "epoch": 1387} {"train_loss": -11.54361343383789, "global_step": 233147, "epoch": 1387} {"train_loss": -11.881258964538574, "global_step": 233148, "epoch": 1387} {"train_loss": -12.049821853637695, "global_step": 233149, "epoch": 1387} {"train_loss": -11.446088790893555, "global_step": 233150, "epoch": 1387} {"train_loss": -11.677287101745605, "global_step": 233151, "epoch": 1387} {"train_loss": -11.743606567382812, "global_step": 233152, "epoch": 1387} {"train_loss": -11.806680679321289, "global_step": 233153, "epoch": 1387} {"train_loss": -11.881114959716797, "global_step": 233154, "epoch": 1387} {"train_loss": -11.74197769165039, "global_step": 233155, "epoch": 1387} {"train_loss": -11.981816291809082, "global_step": 233156, "epoch": 1387} {"train_loss": -11.58474063873291, "global_step": 233157, "epoch": 1387} {"train_loss": -10.921607971191406, "global_step": 233158, "epoch": 1387} {"train_loss": -10.356499671936035, "global_step": 233159, "epoch": 1387} {"train_loss": -11.04706859588623, "global_step": 233160, "epoch": 1387} {"train_loss": -11.73750114440918, "global_step": 233161, "epoch": 1387} {"train_loss": -11.186779022216797, "global_step": 233162, "epoch": 1387} {"train_loss": -11.208571434020996, "global_step": 233163, "epoch": 1387} {"train_loss": -11.707744598388672, "global_step": 233164, "epoch": 1387} {"train_loss": -11.016560554504395, "global_step": 233165, "epoch": 1387} {"train_loss": -11.682488441467285, "global_step": 233166, "epoch": 1387} {"train_loss": -11.716499328613281, "global_step": 233167, "epoch": 1387} {"train_loss": -11.494729995727539, "global_step": 233168, "epoch": 1387} {"train_loss": -11.886316299438477, "global_step": 233169, "epoch": 1387} {"train_loss": -11.192850112915039, "global_step": 233170, "epoch": 1387} {"train_loss": -11.748251914978027, "global_step": 233171, "epoch": 1387} {"train_loss": -11.472118377685547, "global_step": 233172, "epoch": 1387} {"train_loss": -11.848636627197266, "global_step": 233173, "epoch": 1387} {"train_loss": -11.292060852050781, "global_step": 233174, "epoch": 1387} {"train_loss": -11.727699279785156, "global_step": 233175, "epoch": 1387} {"train_loss": -11.451542854309082, "global_step": 233176, "epoch": 1387} {"train_loss": -11.752285957336426, "global_step": 233177, "epoch": 1387} {"train_loss": -11.667634963989258, "global_step": 233178, "epoch": 1387} {"train_loss": -11.590499877929688, "global_step": 233179, "epoch": 1387} {"train_loss": -10.992688179016113, "global_step": 233180, "epoch": 1387} {"train_loss": -11.28986930847168, "global_step": 233181, "epoch": 1387} {"train_loss": -11.661571502685547, "global_step": 233182, "epoch": 1387} {"train_loss": -11.445923419225783, "global_step": 233183, "epoch": 1387, "val_loss": 261610.9375} {"train_loss": -11.63865852355957, "global_step": 233184, "epoch": 1388} {"train_loss": -11.349154472351074, "global_step": 233185, "epoch": 1388} {"train_loss": -11.019453048706055, "global_step": 233186, "epoch": 1388} {"train_loss": -11.056366920471191, "global_step": 233187, "epoch": 1388} {"train_loss": -10.355400085449219, "global_step": 233188, "epoch": 1388} {"train_loss": -10.509980201721191, "global_step": 233189, "epoch": 1388} {"train_loss": -10.25501823425293, "global_step": 233190, "epoch": 1388} {"train_loss": -9.723587989807129, "global_step": 233191, "epoch": 1388} {"train_loss": -10.29609203338623, "global_step": 233192, "epoch": 1388} {"train_loss": -10.312576293945312, "global_step": 233193, "epoch": 1388} {"train_loss": -9.24740982055664, "global_step": 233194, "epoch": 1388} {"train_loss": -10.63222885131836, "global_step": 233195, "epoch": 1388} {"train_loss": -9.482488632202148, "global_step": 233196, "epoch": 1388} {"train_loss": -10.146842956542969, "global_step": 233197, "epoch": 1388} {"train_loss": -8.407304763793945, "global_step": 233198, "epoch": 1388} {"train_loss": -10.140581130981445, "global_step": 233199, "epoch": 1388} {"train_loss": -9.2801513671875, "global_step": 233200, "epoch": 1388} {"train_loss": -11.295218467712402, "global_step": 233201, "epoch": 1388} {"train_loss": -10.123103141784668, "global_step": 233202, "epoch": 1388} {"train_loss": -11.149717330932617, "global_step": 233203, "epoch": 1388} {"train_loss": -10.619203567504883, "global_step": 233204, "epoch": 1388} {"train_loss": -11.151229858398438, "global_step": 233205, "epoch": 1388} {"train_loss": -10.854001998901367, "global_step": 233206, "epoch": 1388} {"train_loss": -11.245590209960938, "global_step": 233207, "epoch": 1388} {"train_loss": -11.233358383178711, "global_step": 233208, "epoch": 1388} {"train_loss": -11.001640319824219, "global_step": 233209, "epoch": 1388} {"train_loss": -11.229423522949219, "global_step": 233210, "epoch": 1388} {"train_loss": -11.37173080444336, "global_step": 233211, "epoch": 1388} {"train_loss": -11.213089942932129, "global_step": 233212, "epoch": 1388} {"train_loss": -11.49817943572998, "global_step": 233213, "epoch": 1388} {"train_loss": -11.246399879455566, "global_step": 233214, "epoch": 1388} {"train_loss": -11.244565963745117, "global_step": 233215, "epoch": 1388} {"train_loss": -11.492555618286133, "global_step": 233216, "epoch": 1388} {"train_loss": -11.648929595947266, "global_step": 233217, "epoch": 1388} {"train_loss": -11.495780944824219, "global_step": 233218, "epoch": 1388} {"train_loss": -11.549818992614746, "global_step": 233219, "epoch": 1388} {"train_loss": -11.704891204833984, "global_step": 233220, "epoch": 1388} {"train_loss": -11.501855850219727, "global_step": 233221, "epoch": 1388} {"train_loss": -11.477346420288086, "global_step": 233222, "epoch": 1388} {"train_loss": -11.672091484069824, "global_step": 233223, "epoch": 1388} {"train_loss": -11.722424507141113, "global_step": 233224, "epoch": 1388} {"train_loss": -11.372459411621094, "global_step": 233225, "epoch": 1388} {"train_loss": -11.792301177978516, "global_step": 233226, "epoch": 1388} {"train_loss": -11.58148193359375, "global_step": 233227, "epoch": 1388} {"train_loss": -11.843866348266602, "global_step": 233228, "epoch": 1388} {"train_loss": -11.865422248840332, "global_step": 233229, "epoch": 1388} {"train_loss": -11.610196113586426, "global_step": 233230, "epoch": 1388} {"train_loss": -11.496749877929688, "global_step": 233231, "epoch": 1388} {"train_loss": -11.556707382202148, "global_step": 233232, "epoch": 1388} {"train_loss": -11.686656951904297, "global_step": 233233, "epoch": 1388} {"train_loss": -11.512116432189941, "global_step": 233234, "epoch": 1388} {"train_loss": -11.853219985961914, "global_step": 233235, "epoch": 1388} {"train_loss": -11.845794677734375, "global_step": 233236, "epoch": 1388} {"train_loss": -11.640447616577148, "global_step": 233237, "epoch": 1388} {"train_loss": -11.903488159179688, "global_step": 233238, "epoch": 1388} {"train_loss": -11.66650676727295, "global_step": 233239, "epoch": 1388} {"train_loss": -11.973479270935059, "global_step": 233240, "epoch": 1388} {"train_loss": -11.912971496582031, "global_step": 233241, "epoch": 1388} {"train_loss": -11.584769248962402, "global_step": 233242, "epoch": 1388} {"train_loss": -11.931602478027344, "global_step": 233243, "epoch": 1388} {"train_loss": -11.756956100463867, "global_step": 233244, "epoch": 1388} {"train_loss": -11.889945983886719, "global_step": 233245, "epoch": 1388} {"train_loss": -11.902888298034668, "global_step": 233246, "epoch": 1388} {"train_loss": -11.714615821838379, "global_step": 233247, "epoch": 1388} {"train_loss": -11.880043029785156, "global_step": 233248, "epoch": 1388} {"train_loss": -11.887212753295898, "global_step": 233249, "epoch": 1388} {"train_loss": -11.955388069152832, "global_step": 233250, "epoch": 1388} {"train_loss": -11.718344688415527, "global_step": 233251, "epoch": 1388} {"train_loss": -11.976484298706055, "global_step": 233252, "epoch": 1388} {"train_loss": -11.88235855102539, "global_step": 233253, "epoch": 1388} {"train_loss": -11.836528778076172, "global_step": 233254, "epoch": 1388} {"train_loss": -11.783912658691406, "global_step": 233255, "epoch": 1388} {"train_loss": -11.893531799316406, "global_step": 233256, "epoch": 1388} {"train_loss": -11.895380020141602, "global_step": 233257, "epoch": 1388} {"train_loss": -12.07071304321289, "global_step": 233258, "epoch": 1388} {"train_loss": -11.821922302246094, "global_step": 233259, "epoch": 1388} {"train_loss": -11.922113418579102, "global_step": 233260, "epoch": 1388} {"train_loss": -11.985478401184082, "global_step": 233261, "epoch": 1388} {"train_loss": -12.000292778015137, "global_step": 233262, "epoch": 1388} {"train_loss": -11.864070892333984, "global_step": 233263, "epoch": 1388} {"train_loss": -12.012760162353516, "global_step": 233264, "epoch": 1388} {"train_loss": -11.897686958312988, "global_step": 233265, "epoch": 1388} {"train_loss": -12.07712173461914, "global_step": 233266, "epoch": 1388} {"train_loss": -11.604520797729492, "global_step": 233267, "epoch": 1388} {"train_loss": -12.047832489013672, "global_step": 233268, "epoch": 1388} {"train_loss": -12.00638484954834, "global_step": 233269, "epoch": 1388} {"train_loss": -11.89213752746582, "global_step": 233270, "epoch": 1388} {"train_loss": -11.971811294555664, "global_step": 233271, "epoch": 1388} {"train_loss": -11.830718040466309, "global_step": 233272, "epoch": 1388} {"train_loss": -12.072807312011719, "global_step": 233273, "epoch": 1388} {"train_loss": -11.939057350158691, "global_step": 233274, "epoch": 1388} {"train_loss": -11.82738971710205, "global_step": 233275, "epoch": 1388} {"train_loss": -11.186832427978516, "global_step": 233276, "epoch": 1388} {"train_loss": -11.750019073486328, "global_step": 233277, "epoch": 1388} {"train_loss": -11.847945213317871, "global_step": 233278, "epoch": 1388} {"train_loss": -11.747138023376465, "global_step": 233279, "epoch": 1388} {"train_loss": -11.591063499450684, "global_step": 233280, "epoch": 1388} {"train_loss": -11.862220764160156, "global_step": 233281, "epoch": 1388} {"train_loss": -11.718193054199219, "global_step": 233282, "epoch": 1388} {"train_loss": -11.71504020690918, "global_step": 233283, "epoch": 1388} {"train_loss": -11.830196380615234, "global_step": 233284, "epoch": 1388} {"train_loss": -11.679546356201172, "global_step": 233285, "epoch": 1388} {"train_loss": -11.85762882232666, "global_step": 233286, "epoch": 1388} {"train_loss": -11.818499565124512, "global_step": 233287, "epoch": 1388} {"train_loss": -11.610873222351074, "global_step": 233288, "epoch": 1388} {"train_loss": -11.781466484069824, "global_step": 233289, "epoch": 1388} {"train_loss": -11.452278137207031, "global_step": 233290, "epoch": 1388} {"train_loss": -11.509610176086426, "global_step": 233291, "epoch": 1388} {"train_loss": -11.640135765075684, "global_step": 233292, "epoch": 1388} {"train_loss": -11.957937240600586, "global_step": 233293, "epoch": 1388} {"train_loss": -12.186500549316406, "global_step": 233294, "epoch": 1388} {"train_loss": -12.189992904663086, "global_step": 233295, "epoch": 1388} {"train_loss": -11.914660453796387, "global_step": 233296, "epoch": 1388} {"train_loss": -12.087217330932617, "global_step": 233297, "epoch": 1388} {"train_loss": -11.99011516571045, "global_step": 233298, "epoch": 1388} {"train_loss": -11.752317428588867, "global_step": 233299, "epoch": 1388} {"train_loss": -11.971965789794922, "global_step": 233300, "epoch": 1388} {"train_loss": -11.799650192260742, "global_step": 233301, "epoch": 1388} {"train_loss": -11.919967651367188, "global_step": 233302, "epoch": 1388} {"train_loss": -12.019771575927734, "global_step": 233303, "epoch": 1388} {"train_loss": -11.64760684967041, "global_step": 233304, "epoch": 1388} {"train_loss": -11.712066650390625, "global_step": 233305, "epoch": 1388} {"train_loss": -12.028871536254883, "global_step": 233306, "epoch": 1388} {"train_loss": -11.065726280212402, "global_step": 233307, "epoch": 1388} {"train_loss": -10.513710975646973, "global_step": 233308, "epoch": 1388} {"train_loss": -11.68978214263916, "global_step": 233309, "epoch": 1388} {"train_loss": -11.655906677246094, "global_step": 233310, "epoch": 1388} {"train_loss": -10.921262741088867, "global_step": 233311, "epoch": 1388} {"train_loss": -11.921319961547852, "global_step": 233312, "epoch": 1388} {"train_loss": -11.560819625854492, "global_step": 233313, "epoch": 1388} {"train_loss": -11.7741060256958, "global_step": 233314, "epoch": 1388} {"train_loss": -11.797866821289062, "global_step": 233315, "epoch": 1388} {"train_loss": -11.377618789672852, "global_step": 233316, "epoch": 1388} {"train_loss": -11.39031982421875, "global_step": 233317, "epoch": 1388} {"train_loss": -11.270296096801758, "global_step": 233318, "epoch": 1388} {"train_loss": -12.230817794799805, "global_step": 233319, "epoch": 1388} {"train_loss": -11.485102653503418, "global_step": 233320, "epoch": 1388} {"train_loss": -11.724858283996582, "global_step": 233321, "epoch": 1388} {"train_loss": -11.760845184326172, "global_step": 233322, "epoch": 1388} {"train_loss": -11.589784622192383, "global_step": 233323, "epoch": 1388} {"train_loss": -11.37065601348877, "global_step": 233324, "epoch": 1388} {"train_loss": -11.518738746643066, "global_step": 233325, "epoch": 1388} {"train_loss": -11.6263427734375, "global_step": 233326, "epoch": 1388} {"train_loss": -11.0545654296875, "global_step": 233327, "epoch": 1388} {"train_loss": -11.021321296691895, "global_step": 233328, "epoch": 1388} {"train_loss": -11.762225151062012, "global_step": 233329, "epoch": 1388} {"train_loss": -11.150611877441406, "global_step": 233330, "epoch": 1388} {"train_loss": -10.168885231018066, "global_step": 233331, "epoch": 1388} {"train_loss": -11.034793853759766, "global_step": 233332, "epoch": 1388} {"train_loss": -11.556192398071289, "global_step": 233333, "epoch": 1388} {"train_loss": -11.47055435180664, "global_step": 233334, "epoch": 1388} {"train_loss": -10.933162689208984, "global_step": 233335, "epoch": 1388} {"train_loss": -11.558910369873047, "global_step": 233336, "epoch": 1388} {"train_loss": -11.098849296569824, "global_step": 233337, "epoch": 1388} {"train_loss": -11.437030792236328, "global_step": 233338, "epoch": 1388} {"train_loss": -11.356552124023438, "global_step": 233339, "epoch": 1388} {"train_loss": -11.048689842224121, "global_step": 233340, "epoch": 1388} {"train_loss": -11.655832290649414, "global_step": 233341, "epoch": 1388} {"train_loss": -11.019994735717773, "global_step": 233342, "epoch": 1388} {"train_loss": -10.954345703125, "global_step": 233343, "epoch": 1388} {"train_loss": -11.669478416442871, "global_step": 233344, "epoch": 1388} {"train_loss": -11.118854522705078, "global_step": 233345, "epoch": 1388} {"train_loss": -11.647834777832031, "global_step": 233346, "epoch": 1388} {"train_loss": -11.30815601348877, "global_step": 233347, "epoch": 1388} {"train_loss": -11.357515335083008, "global_step": 233348, "epoch": 1388} {"train_loss": -11.589963912963867, "global_step": 233349, "epoch": 1388} {"train_loss": -10.622020721435547, "global_step": 233350, "epoch": 1388} {"train_loss": -11.460918812524705, "global_step": 233351, "epoch": 1388, "val_loss": 265103.3125} {"train_loss": -10.588345527648926, "global_step": 233352, "epoch": 1389} {"train_loss": -11.450112342834473, "global_step": 233353, "epoch": 1389} {"train_loss": -10.72551155090332, "global_step": 233354, "epoch": 1389} {"train_loss": -11.222145080566406, "global_step": 233355, "epoch": 1389} {"train_loss": -11.677555084228516, "global_step": 233356, "epoch": 1389} {"train_loss": -10.846927642822266, "global_step": 233357, "epoch": 1389} {"train_loss": -11.768152236938477, "global_step": 233358, "epoch": 1389} {"train_loss": -11.379251480102539, "global_step": 233359, "epoch": 1389} {"train_loss": -11.285161018371582, "global_step": 233360, "epoch": 1389} {"train_loss": -11.608463287353516, "global_step": 233361, "epoch": 1389} {"train_loss": -10.99726676940918, "global_step": 233362, "epoch": 1389} {"train_loss": -11.440759658813477, "global_step": 233363, "epoch": 1389} {"train_loss": -11.140130043029785, "global_step": 233364, "epoch": 1389} {"train_loss": -11.277081489562988, "global_step": 233365, "epoch": 1389} {"train_loss": -10.693580627441406, "global_step": 233366, "epoch": 1389} {"train_loss": -11.424301147460938, "global_step": 233367, "epoch": 1389} {"train_loss": -10.910179138183594, "global_step": 233368, "epoch": 1389} {"train_loss": -10.830886840820312, "global_step": 233369, "epoch": 1389} {"train_loss": -11.25970458984375, "global_step": 233370, "epoch": 1389} {"train_loss": -11.125707626342773, "global_step": 233371, "epoch": 1389} {"train_loss": -11.333911895751953, "global_step": 233372, "epoch": 1389} {"train_loss": -11.184287071228027, "global_step": 233373, "epoch": 1389} {"train_loss": -11.539424896240234, "global_step": 233374, "epoch": 1389} {"train_loss": -11.267669677734375, "global_step": 233375, "epoch": 1389} {"train_loss": -11.73296070098877, "global_step": 233376, "epoch": 1389} {"train_loss": -10.922059059143066, "global_step": 233377, "epoch": 1389} {"train_loss": -11.907179832458496, "global_step": 233378, "epoch": 1389} {"train_loss": -10.979656219482422, "global_step": 233379, "epoch": 1389} {"train_loss": -11.839990615844727, "global_step": 233380, "epoch": 1389} {"train_loss": -11.246525764465332, "global_step": 233381, "epoch": 1389} {"train_loss": -11.608689308166504, "global_step": 233382, "epoch": 1389} {"train_loss": -11.380256652832031, "global_step": 233383, "epoch": 1389} {"train_loss": -11.723864555358887, "global_step": 233384, "epoch": 1389} {"train_loss": -11.318603515625, "global_step": 233385, "epoch": 1389} {"train_loss": -11.58114242553711, "global_step": 233386, "epoch": 1389} {"train_loss": -11.680438041687012, "global_step": 233387, "epoch": 1389} {"train_loss": -11.853710174560547, "global_step": 233388, "epoch": 1389} {"train_loss": -11.485936164855957, "global_step": 233389, "epoch": 1389} {"train_loss": -11.64505672454834, "global_step": 233390, "epoch": 1389} {"train_loss": -11.733642578125, "global_step": 233391, "epoch": 1389} {"train_loss": -12.008113861083984, "global_step": 233392, "epoch": 1389} {"train_loss": -11.56110954284668, "global_step": 233393, "epoch": 1389} {"train_loss": -11.893357276916504, "global_step": 233394, "epoch": 1389} {"train_loss": -11.81195068359375, "global_step": 233395, "epoch": 1389} {"train_loss": -11.74277114868164, "global_step": 233396, "epoch": 1389} {"train_loss": -11.728425025939941, "global_step": 233397, "epoch": 1389} {"train_loss": -11.853702545166016, "global_step": 233398, "epoch": 1389} {"train_loss": -11.6614351272583, "global_step": 233399, "epoch": 1389} {"train_loss": -11.787103652954102, "global_step": 233400, "epoch": 1389} {"train_loss": -11.941442489624023, "global_step": 233401, "epoch": 1389} {"train_loss": -11.50649642944336, "global_step": 233402, "epoch": 1389} {"train_loss": -11.790363311767578, "global_step": 233403, "epoch": 1389} {"train_loss": -11.703174591064453, "global_step": 233404, "epoch": 1389} {"train_loss": -11.762245178222656, "global_step": 233405, "epoch": 1389} {"train_loss": -11.758994102478027, "global_step": 233406, "epoch": 1389} {"train_loss": -11.393389701843262, "global_step": 233407, "epoch": 1389} {"train_loss": -11.824066162109375, "global_step": 233408, "epoch": 1389} {"train_loss": -11.676562309265137, "global_step": 233409, "epoch": 1389} {"train_loss": -11.688695907592773, "global_step": 233410, "epoch": 1389} {"train_loss": -12.023566246032715, "global_step": 233411, "epoch": 1389} {"train_loss": -11.623798370361328, "global_step": 233412, "epoch": 1389} {"train_loss": -11.96639633178711, "global_step": 233413, "epoch": 1389} {"train_loss": -11.440261840820312, "global_step": 233414, "epoch": 1389} {"train_loss": -10.757606506347656, "global_step": 233415, "epoch": 1389} {"train_loss": -11.868766784667969, "global_step": 233416, "epoch": 1389} {"train_loss": -11.452627182006836, "global_step": 233417, "epoch": 1389} {"train_loss": -11.231404304504395, "global_step": 233418, "epoch": 1389} {"train_loss": -11.873478889465332, "global_step": 233419, "epoch": 1389} {"train_loss": -11.793684005737305, "global_step": 233420, "epoch": 1389} {"train_loss": -11.420594215393066, "global_step": 233421, "epoch": 1389} {"train_loss": -11.874727249145508, "global_step": 233422, "epoch": 1389} {"train_loss": -11.56641960144043, "global_step": 233423, "epoch": 1389} {"train_loss": -11.654229164123535, "global_step": 233424, "epoch": 1389} {"train_loss": -11.864372253417969, "global_step": 233425, "epoch": 1389} {"train_loss": -11.692314147949219, "global_step": 233426, "epoch": 1389} {"train_loss": -11.910531044006348, "global_step": 233427, "epoch": 1389} {"train_loss": -11.818704605102539, "global_step": 233428, "epoch": 1389} {"train_loss": -11.82193660736084, "global_step": 233429, "epoch": 1389} {"train_loss": -11.831988334655762, "global_step": 233430, "epoch": 1389} {"train_loss": -11.962303161621094, "global_step": 233431, "epoch": 1389} {"train_loss": -12.134271621704102, "global_step": 233432, "epoch": 1389} {"train_loss": -11.941547393798828, "global_step": 233433, "epoch": 1389} {"train_loss": -11.901359558105469, "global_step": 233434, "epoch": 1389} {"train_loss": -11.755669593811035, "global_step": 233435, "epoch": 1389} {"train_loss": -12.088808059692383, "global_step": 233436, "epoch": 1389} {"train_loss": -12.025094985961914, "global_step": 233437, "epoch": 1389} {"train_loss": -11.726524353027344, "global_step": 233438, "epoch": 1389} {"train_loss": -11.875556945800781, "global_step": 233439, "epoch": 1389} {"train_loss": -12.046111106872559, "global_step": 233440, "epoch": 1389} {"train_loss": -11.981081008911133, "global_step": 233441, "epoch": 1389} {"train_loss": -11.786870956420898, "global_step": 233442, "epoch": 1389} {"train_loss": -11.84467601776123, "global_step": 233443, "epoch": 1389} {"train_loss": -11.913281440734863, "global_step": 233444, "epoch": 1389} {"train_loss": -11.85057258605957, "global_step": 233445, "epoch": 1389} {"train_loss": -11.620800018310547, "global_step": 233446, "epoch": 1389} {"train_loss": -12.245121002197266, "global_step": 233447, "epoch": 1389} {"train_loss": -11.331172943115234, "global_step": 233448, "epoch": 1389} {"train_loss": -11.70712947845459, "global_step": 233449, "epoch": 1389} {"train_loss": -11.846653938293457, "global_step": 233450, "epoch": 1389} {"train_loss": -11.847942352294922, "global_step": 233451, "epoch": 1389} {"train_loss": -11.988179206848145, "global_step": 233452, "epoch": 1389} {"train_loss": -11.730157852172852, "global_step": 233453, "epoch": 1389} {"train_loss": -12.068750381469727, "global_step": 233454, "epoch": 1389} {"train_loss": -11.857820510864258, "global_step": 233455, "epoch": 1389} {"train_loss": -11.822341918945312, "global_step": 233456, "epoch": 1389} {"train_loss": -11.825048446655273, "global_step": 233457, "epoch": 1389} {"train_loss": -11.907054901123047, "global_step": 233458, "epoch": 1389} {"train_loss": -11.347461700439453, "global_step": 233459, "epoch": 1389} {"train_loss": -12.096923828125, "global_step": 233460, "epoch": 1389} {"train_loss": -11.412321090698242, "global_step": 233461, "epoch": 1389} {"train_loss": -10.78225326538086, "global_step": 233462, "epoch": 1389} {"train_loss": -11.452325820922852, "global_step": 233463, "epoch": 1389} {"train_loss": -11.9520263671875, "global_step": 233464, "epoch": 1389} {"train_loss": -11.497705459594727, "global_step": 233465, "epoch": 1389} {"train_loss": -11.442733764648438, "global_step": 233466, "epoch": 1389} {"train_loss": -11.517692565917969, "global_step": 233467, "epoch": 1389} {"train_loss": -10.787983894348145, "global_step": 233468, "epoch": 1389} {"train_loss": -11.157194137573242, "global_step": 233469, "epoch": 1389} {"train_loss": -11.855297088623047, "global_step": 233470, "epoch": 1389} {"train_loss": -11.261616706848145, "global_step": 233471, "epoch": 1389} {"train_loss": -11.239038467407227, "global_step": 233472, "epoch": 1389} {"train_loss": -12.046655654907227, "global_step": 233473, "epoch": 1389} {"train_loss": -11.446245193481445, "global_step": 233474, "epoch": 1389} {"train_loss": -10.669706344604492, "global_step": 233475, "epoch": 1389} {"train_loss": -11.473410606384277, "global_step": 233476, "epoch": 1389} {"train_loss": -11.348794937133789, "global_step": 233477, "epoch": 1389} {"train_loss": -11.184778213500977, "global_step": 233478, "epoch": 1389} {"train_loss": -11.313051223754883, "global_step": 233479, "epoch": 1389} {"train_loss": -11.258895874023438, "global_step": 233480, "epoch": 1389} {"train_loss": -11.46383285522461, "global_step": 233481, "epoch": 1389} {"train_loss": -11.527487754821777, "global_step": 233482, "epoch": 1389} {"train_loss": -11.807683944702148, "global_step": 233483, "epoch": 1389} {"train_loss": -11.715377807617188, "global_step": 233484, "epoch": 1389} {"train_loss": -11.114300727844238, "global_step": 233485, "epoch": 1389} {"train_loss": -11.589441299438477, "global_step": 233486, "epoch": 1389} {"train_loss": -11.229970932006836, "global_step": 233487, "epoch": 1389} {"train_loss": -11.276220321655273, "global_step": 233488, "epoch": 1389} {"train_loss": -11.638784408569336, "global_step": 233489, "epoch": 1389} {"train_loss": -11.690347671508789, "global_step": 233490, "epoch": 1389} {"train_loss": -11.35201644897461, "global_step": 233491, "epoch": 1389} {"train_loss": -10.693414688110352, "global_step": 233492, "epoch": 1389} {"train_loss": -10.914815902709961, "global_step": 233493, "epoch": 1389} {"train_loss": -11.364537239074707, "global_step": 233494, "epoch": 1389} {"train_loss": -10.002908706665039, "global_step": 233495, "epoch": 1389} {"train_loss": -11.738127708435059, "global_step": 233496, "epoch": 1389} {"train_loss": -10.857436180114746, "global_step": 233497, "epoch": 1389} {"train_loss": -11.031627655029297, "global_step": 233498, "epoch": 1389} {"train_loss": -11.716852188110352, "global_step": 233499, "epoch": 1389} {"train_loss": -11.292482376098633, "global_step": 233500, "epoch": 1389} {"train_loss": -11.529921531677246, "global_step": 233501, "epoch": 1389} {"train_loss": -11.232827186584473, "global_step": 233502, "epoch": 1389} {"train_loss": -11.474618911743164, "global_step": 233503, "epoch": 1389} {"train_loss": -11.511491775512695, "global_step": 233504, "epoch": 1389} {"train_loss": -11.175361633300781, "global_step": 233505, "epoch": 1389} {"train_loss": -11.231963157653809, "global_step": 233506, "epoch": 1389} {"train_loss": -11.522579193115234, "global_step": 233507, "epoch": 1389} {"train_loss": -11.325786590576172, "global_step": 233508, "epoch": 1389} {"train_loss": -11.36104965209961, "global_step": 233509, "epoch": 1389} {"train_loss": -11.593083381652832, "global_step": 233510, "epoch": 1389} {"train_loss": -11.573431015014648, "global_step": 233511, "epoch": 1389} {"train_loss": -11.220245361328125, "global_step": 233512, "epoch": 1389} {"train_loss": -11.130108833312988, "global_step": 233513, "epoch": 1389} {"train_loss": -11.082603454589844, "global_step": 233514, "epoch": 1389} {"train_loss": -11.713846206665039, "global_step": 233515, "epoch": 1389} {"train_loss": -11.157563209533691, "global_step": 233516, "epoch": 1389} {"train_loss": -11.63486385345459, "global_step": 233517, "epoch": 1389} {"train_loss": -11.551239013671875, "global_step": 233518, "epoch": 1389} {"train_loss": -11.522337209610711, "global_step": 233519, "epoch": 1389, "val_loss": 266464.125} {"train_loss": -11.649166107177734, "global_step": 233520, "epoch": 1390} {"train_loss": -11.619898796081543, "global_step": 233521, "epoch": 1390} {"train_loss": -12.110151290893555, "global_step": 233522, "epoch": 1390} {"train_loss": -11.34029769897461, "global_step": 233523, "epoch": 1390} {"train_loss": -11.640533447265625, "global_step": 233524, "epoch": 1390} {"train_loss": -11.776973724365234, "global_step": 233525, "epoch": 1390} {"train_loss": -11.803207397460938, "global_step": 233526, "epoch": 1390} {"train_loss": -11.780969619750977, "global_step": 233527, "epoch": 1390} {"train_loss": -11.384254455566406, "global_step": 233528, "epoch": 1390} {"train_loss": -12.00529956817627, "global_step": 233529, "epoch": 1390} {"train_loss": -11.690001487731934, "global_step": 233530, "epoch": 1390} {"train_loss": -11.902831077575684, "global_step": 233531, "epoch": 1390} {"train_loss": -11.726242065429688, "global_step": 233532, "epoch": 1390} {"train_loss": -11.889342308044434, "global_step": 233533, "epoch": 1390} {"train_loss": -11.855453491210938, "global_step": 233534, "epoch": 1390} {"train_loss": -12.00042724609375, "global_step": 233535, "epoch": 1390} {"train_loss": -11.868260383605957, "global_step": 233536, "epoch": 1390} {"train_loss": -11.506291389465332, "global_step": 233537, "epoch": 1390} {"train_loss": -11.970748901367188, "global_step": 233538, "epoch": 1390} {"train_loss": -11.976120948791504, "global_step": 233539, "epoch": 1390} {"train_loss": -11.937198638916016, "global_step": 233540, "epoch": 1390} {"train_loss": -12.093721389770508, "global_step": 233541, "epoch": 1390} {"train_loss": -11.969741821289062, "global_step": 233542, "epoch": 1390} {"train_loss": -11.647634506225586, "global_step": 233543, "epoch": 1390} {"train_loss": -11.733952522277832, "global_step": 233544, "epoch": 1390} {"train_loss": -11.776421546936035, "global_step": 233545, "epoch": 1390} {"train_loss": -11.97216510772705, "global_step": 233546, "epoch": 1390} {"train_loss": -11.83962631225586, "global_step": 233547, "epoch": 1390} {"train_loss": -11.728433609008789, "global_step": 233548, "epoch": 1390} {"train_loss": -11.750419616699219, "global_step": 233549, "epoch": 1390} {"train_loss": -10.52326488494873, "global_step": 233550, "epoch": 1390} {"train_loss": -11.599085807800293, "global_step": 233551, "epoch": 1390} {"train_loss": -11.776080131530762, "global_step": 233552, "epoch": 1390} {"train_loss": -11.10930061340332, "global_step": 233553, "epoch": 1390} {"train_loss": -11.626611709594727, "global_step": 233554, "epoch": 1390} {"train_loss": -11.57756233215332, "global_step": 233555, "epoch": 1390} {"train_loss": -11.018890380859375, "global_step": 233556, "epoch": 1390} {"train_loss": -11.469289779663086, "global_step": 233557, "epoch": 1390} {"train_loss": -11.589869499206543, "global_step": 233558, "epoch": 1390} {"train_loss": -11.733283042907715, "global_step": 233559, "epoch": 1390} {"train_loss": -11.354684829711914, "global_step": 233560, "epoch": 1390} {"train_loss": -11.632984161376953, "global_step": 233561, "epoch": 1390} {"train_loss": -11.725275039672852, "global_step": 233562, "epoch": 1390} {"train_loss": -11.577630043029785, "global_step": 233563, "epoch": 1390} {"train_loss": -11.572717666625977, "global_step": 233564, "epoch": 1390} {"train_loss": -11.871638298034668, "global_step": 233565, "epoch": 1390} {"train_loss": -11.664766311645508, "global_step": 233566, "epoch": 1390} {"train_loss": -11.963272094726562, "global_step": 233567, "epoch": 1390} {"train_loss": -11.9010009765625, "global_step": 233568, "epoch": 1390} {"train_loss": -11.804876327514648, "global_step": 233569, "epoch": 1390} {"train_loss": -12.03327465057373, "global_step": 233570, "epoch": 1390} {"train_loss": -12.057798385620117, "global_step": 233571, "epoch": 1390} {"train_loss": -11.933439254760742, "global_step": 233572, "epoch": 1390} {"train_loss": -11.709481239318848, "global_step": 233573, "epoch": 1390} {"train_loss": -11.930028915405273, "global_step": 233574, "epoch": 1390} {"train_loss": -11.844822883605957, "global_step": 233575, "epoch": 1390} {"train_loss": -11.647237777709961, "global_step": 233576, "epoch": 1390} {"train_loss": -11.450433731079102, "global_step": 233577, "epoch": 1390} {"train_loss": -11.547088623046875, "global_step": 233578, "epoch": 1390} {"train_loss": -10.834243774414062, "global_step": 233579, "epoch": 1390} {"train_loss": -11.680578231811523, "global_step": 233580, "epoch": 1390} {"train_loss": -11.005330085754395, "global_step": 233581, "epoch": 1390} {"train_loss": -11.077648162841797, "global_step": 233582, "epoch": 1390} {"train_loss": -10.518514633178711, "global_step": 233583, "epoch": 1390} {"train_loss": -11.470951080322266, "global_step": 233584, "epoch": 1390} {"train_loss": -10.03317642211914, "global_step": 233585, "epoch": 1390} {"train_loss": -11.027963638305664, "global_step": 233586, "epoch": 1390} {"train_loss": -9.864521026611328, "global_step": 233587, "epoch": 1390} {"train_loss": -10.126611709594727, "global_step": 233588, "epoch": 1390} {"train_loss": -10.518804550170898, "global_step": 233589, "epoch": 1390} {"train_loss": -9.631269454956055, "global_step": 233590, "epoch": 1390} {"train_loss": -9.904498100280762, "global_step": 233591, "epoch": 1390} {"train_loss": -10.351974487304688, "global_step": 233592, "epoch": 1390} {"train_loss": -10.967386245727539, "global_step": 233593, "epoch": 1390} {"train_loss": -10.731058120727539, "global_step": 233594, "epoch": 1390} {"train_loss": -10.633540153503418, "global_step": 233595, "epoch": 1390} {"train_loss": -10.846626281738281, "global_step": 233596, "epoch": 1390} {"train_loss": -10.810011863708496, "global_step": 233597, "epoch": 1390} {"train_loss": -10.566755294799805, "global_step": 233598, "epoch": 1390} {"train_loss": -11.452991485595703, "global_step": 233599, "epoch": 1390} {"train_loss": -10.417238235473633, "global_step": 233600, "epoch": 1390} {"train_loss": -10.50094985961914, "global_step": 233601, "epoch": 1390} {"train_loss": -11.212410926818848, "global_step": 233602, "epoch": 1390} {"train_loss": -9.63949966430664, "global_step": 233603, "epoch": 1390} {"train_loss": -10.952738761901855, "global_step": 233604, "epoch": 1390} {"train_loss": -9.885031700134277, "global_step": 233605, "epoch": 1390} {"train_loss": -10.714651107788086, "global_step": 233606, "epoch": 1390} {"train_loss": -10.99064826965332, "global_step": 233607, "epoch": 1390} {"train_loss": -10.809879302978516, "global_step": 233608, "epoch": 1390} {"train_loss": -11.006402969360352, "global_step": 233609, "epoch": 1390} {"train_loss": -11.187915802001953, "global_step": 233610, "epoch": 1390} {"train_loss": -10.848493576049805, "global_step": 233611, "epoch": 1390} {"train_loss": -11.187423706054688, "global_step": 233612, "epoch": 1390} {"train_loss": -11.232626914978027, "global_step": 233613, "epoch": 1390} {"train_loss": -11.135841369628906, "global_step": 233614, "epoch": 1390} {"train_loss": -11.109268188476562, "global_step": 233615, "epoch": 1390} {"train_loss": -11.359411239624023, "global_step": 233616, "epoch": 1390} {"train_loss": -11.296077728271484, "global_step": 233617, "epoch": 1390} {"train_loss": -10.946654319763184, "global_step": 233618, "epoch": 1390} {"train_loss": -11.327977180480957, "global_step": 233619, "epoch": 1390} {"train_loss": -11.230454444885254, "global_step": 233620, "epoch": 1390} {"train_loss": -11.330545425415039, "global_step": 233621, "epoch": 1390} {"train_loss": -11.504701614379883, "global_step": 233622, "epoch": 1390} {"train_loss": -11.588555335998535, "global_step": 233623, "epoch": 1390} {"train_loss": -11.706502914428711, "global_step": 233624, "epoch": 1390} {"train_loss": -11.382585525512695, "global_step": 233625, "epoch": 1390} {"train_loss": -11.632308959960938, "global_step": 233626, "epoch": 1390} {"train_loss": -11.804863929748535, "global_step": 233627, "epoch": 1390} {"train_loss": -11.495864868164062, "global_step": 233628, "epoch": 1390} {"train_loss": -11.691394805908203, "global_step": 233629, "epoch": 1390} {"train_loss": -11.519956588745117, "global_step": 233630, "epoch": 1390} {"train_loss": -11.613485336303711, "global_step": 233631, "epoch": 1390} {"train_loss": -11.643054008483887, "global_step": 233632, "epoch": 1390} {"train_loss": -11.905998229980469, "global_step": 233633, "epoch": 1390} {"train_loss": -11.764383316040039, "global_step": 233634, "epoch": 1390} {"train_loss": -11.747905731201172, "global_step": 233635, "epoch": 1390} {"train_loss": -11.831575393676758, "global_step": 233636, "epoch": 1390} {"train_loss": -11.625749588012695, "global_step": 233637, "epoch": 1390} {"train_loss": -11.704952239990234, "global_step": 233638, "epoch": 1390} {"train_loss": -11.684840202331543, "global_step": 233639, "epoch": 1390} {"train_loss": -11.874492645263672, "global_step": 233640, "epoch": 1390} {"train_loss": -11.88941764831543, "global_step": 233641, "epoch": 1390} {"train_loss": -11.84603500366211, "global_step": 233642, "epoch": 1390} {"train_loss": -11.888396263122559, "global_step": 233643, "epoch": 1390} {"train_loss": -11.935757637023926, "global_step": 233644, "epoch": 1390} {"train_loss": -11.872563362121582, "global_step": 233645, "epoch": 1390} {"train_loss": -12.053140640258789, "global_step": 233646, "epoch": 1390} {"train_loss": -11.897665977478027, "global_step": 233647, "epoch": 1390} {"train_loss": -11.918725967407227, "global_step": 233648, "epoch": 1390} {"train_loss": -11.712173461914062, "global_step": 233649, "epoch": 1390} {"train_loss": -11.97094440460205, "global_step": 233650, "epoch": 1390} {"train_loss": -11.787672996520996, "global_step": 233651, "epoch": 1390} {"train_loss": -11.783683776855469, "global_step": 233652, "epoch": 1390} {"train_loss": -12.02447509765625, "global_step": 233653, "epoch": 1390} {"train_loss": -12.037714004516602, "global_step": 233654, "epoch": 1390} {"train_loss": -12.210346221923828, "global_step": 233655, "epoch": 1390} {"train_loss": -12.070796012878418, "global_step": 233656, "epoch": 1390} {"train_loss": -11.783830642700195, "global_step": 233657, "epoch": 1390} {"train_loss": -12.099031448364258, "global_step": 233658, "epoch": 1390} {"train_loss": -11.887892723083496, "global_step": 233659, "epoch": 1390} {"train_loss": -12.219839096069336, "global_step": 233660, "epoch": 1390} {"train_loss": -12.019020080566406, "global_step": 233661, "epoch": 1390} {"train_loss": -12.06216812133789, "global_step": 233662, "epoch": 1390} {"train_loss": -12.148298263549805, "global_step": 233663, "epoch": 1390} {"train_loss": -12.080489158630371, "global_step": 233664, "epoch": 1390} {"train_loss": -12.126702308654785, "global_step": 233665, "epoch": 1390} {"train_loss": -12.076618194580078, "global_step": 233666, "epoch": 1390} {"train_loss": -12.151443481445312, "global_step": 233667, "epoch": 1390} {"train_loss": -11.929557800292969, "global_step": 233668, "epoch": 1390} {"train_loss": -11.628315925598145, "global_step": 233669, "epoch": 1390} {"train_loss": -12.083013534545898, "global_step": 233670, "epoch": 1390} {"train_loss": -12.144503593444824, "global_step": 233671, "epoch": 1390} {"train_loss": -11.97724723815918, "global_step": 233672, "epoch": 1390} {"train_loss": -11.830697059631348, "global_step": 233673, "epoch": 1390} {"train_loss": -12.11577033996582, "global_step": 233674, "epoch": 1390} {"train_loss": -11.359853744506836, "global_step": 233675, "epoch": 1390} {"train_loss": -11.524625778198242, "global_step": 233676, "epoch": 1390} {"train_loss": -11.509991645812988, "global_step": 233677, "epoch": 1390} {"train_loss": -11.764984130859375, "global_step": 233678, "epoch": 1390} {"train_loss": -10.569436073303223, "global_step": 233679, "epoch": 1390} {"train_loss": -8.993400573730469, "global_step": 233680, "epoch": 1390} {"train_loss": -9.737006187438965, "global_step": 233681, "epoch": 1390} {"train_loss": -11.208913803100586, "global_step": 233682, "epoch": 1390} {"train_loss": -10.067346572875977, "global_step": 233683, "epoch": 1390} {"train_loss": -10.978114128112793, "global_step": 233684, "epoch": 1390} {"train_loss": -10.699407577514648, "global_step": 233685, "epoch": 1390} {"train_loss": -11.750368118286133, "global_step": 233686, "epoch": 1390} {"train_loss": -11.459712789172219, "global_step": 233687, "epoch": 1390, "val_loss": 263197.125, "train_action_mse_error": 1.4919943809509277} {"train_loss": -10.738035202026367, "global_step": 233688, "epoch": 1391} {"train_loss": -11.557458877563477, "global_step": 233689, "epoch": 1391} {"train_loss": -9.966069221496582, "global_step": 233690, "epoch": 1391} {"train_loss": -11.609732627868652, "global_step": 233691, "epoch": 1391} {"train_loss": -10.249526977539062, "global_step": 233692, "epoch": 1391} {"train_loss": -11.494094848632812, "global_step": 233693, "epoch": 1391} {"train_loss": -10.927581787109375, "global_step": 233694, "epoch": 1391} {"train_loss": -11.346461296081543, "global_step": 233695, "epoch": 1391} {"train_loss": -10.915105819702148, "global_step": 233696, "epoch": 1391} {"train_loss": -10.707292556762695, "global_step": 233697, "epoch": 1391} {"train_loss": -11.414283752441406, "global_step": 233698, "epoch": 1391} {"train_loss": -10.767337799072266, "global_step": 233699, "epoch": 1391} {"train_loss": -11.513758659362793, "global_step": 233700, "epoch": 1391} {"train_loss": -11.293844223022461, "global_step": 233701, "epoch": 1391} {"train_loss": -11.532678604125977, "global_step": 233702, "epoch": 1391} {"train_loss": -11.201171875, "global_step": 233703, "epoch": 1391} {"train_loss": -11.392169952392578, "global_step": 233704, "epoch": 1391} {"train_loss": -11.57067584991455, "global_step": 233705, "epoch": 1391} {"train_loss": -11.14831256866455, "global_step": 233706, "epoch": 1391} {"train_loss": -11.774958610534668, "global_step": 233707, "epoch": 1391} {"train_loss": -11.195188522338867, "global_step": 233708, "epoch": 1391} {"train_loss": -11.663686752319336, "global_step": 233709, "epoch": 1391} {"train_loss": -11.654630661010742, "global_step": 233710, "epoch": 1391} {"train_loss": -11.791138648986816, "global_step": 233711, "epoch": 1391} {"train_loss": -11.698453903198242, "global_step": 233712, "epoch": 1391} {"train_loss": -11.636571884155273, "global_step": 233713, "epoch": 1391} {"train_loss": -11.904411315917969, "global_step": 233714, "epoch": 1391} {"train_loss": -11.35145092010498, "global_step": 233715, "epoch": 1391} {"train_loss": -11.868462562561035, "global_step": 233716, "epoch": 1391} {"train_loss": -11.37714672088623, "global_step": 233717, "epoch": 1391} {"train_loss": -11.88691234588623, "global_step": 233718, "epoch": 1391} {"train_loss": -11.952661514282227, "global_step": 233719, "epoch": 1391} {"train_loss": -11.573509216308594, "global_step": 233720, "epoch": 1391} {"train_loss": -11.787367820739746, "global_step": 233721, "epoch": 1391} {"train_loss": -11.419267654418945, "global_step": 233722, "epoch": 1391} {"train_loss": -11.951383590698242, "global_step": 233723, "epoch": 1391} {"train_loss": -11.523078918457031, "global_step": 233724, "epoch": 1391} {"train_loss": -11.982921600341797, "global_step": 233725, "epoch": 1391} {"train_loss": -11.637003898620605, "global_step": 233726, "epoch": 1391} {"train_loss": -11.422719955444336, "global_step": 233727, "epoch": 1391} {"train_loss": -11.782938003540039, "global_step": 233728, "epoch": 1391} {"train_loss": -10.936271667480469, "global_step": 233729, "epoch": 1391} {"train_loss": -11.937212944030762, "global_step": 233730, "epoch": 1391} {"train_loss": -11.07418441772461, "global_step": 233731, "epoch": 1391} {"train_loss": -11.267427444458008, "global_step": 233732, "epoch": 1391} {"train_loss": -11.232931137084961, "global_step": 233733, "epoch": 1391} {"train_loss": -10.049032211303711, "global_step": 233734, "epoch": 1391} {"train_loss": -11.618762969970703, "global_step": 233735, "epoch": 1391} {"train_loss": -10.393474578857422, "global_step": 233736, "epoch": 1391} {"train_loss": -11.292073249816895, "global_step": 233737, "epoch": 1391} {"train_loss": -10.822708129882812, "global_step": 233738, "epoch": 1391} {"train_loss": -11.118033409118652, "global_step": 233739, "epoch": 1391} {"train_loss": -11.143540382385254, "global_step": 233740, "epoch": 1391} {"train_loss": -10.726076126098633, "global_step": 233741, "epoch": 1391} {"train_loss": -11.520710945129395, "global_step": 233742, "epoch": 1391} {"train_loss": -11.37199592590332, "global_step": 233743, "epoch": 1391} {"train_loss": -11.690698623657227, "global_step": 233744, "epoch": 1391} {"train_loss": -11.154401779174805, "global_step": 233745, "epoch": 1391} {"train_loss": -11.378568649291992, "global_step": 233746, "epoch": 1391} {"train_loss": -11.382829666137695, "global_step": 233747, "epoch": 1391} {"train_loss": -11.552335739135742, "global_step": 233748, "epoch": 1391} {"train_loss": -11.11442756652832, "global_step": 233749, "epoch": 1391} {"train_loss": -11.750370979309082, "global_step": 233750, "epoch": 1391} {"train_loss": -11.038764953613281, "global_step": 233751, "epoch": 1391} {"train_loss": -11.729949951171875, "global_step": 233752, "epoch": 1391} {"train_loss": -11.443465232849121, "global_step": 233753, "epoch": 1391} {"train_loss": -11.707073211669922, "global_step": 233754, "epoch": 1391} {"train_loss": -11.4327392578125, "global_step": 233755, "epoch": 1391} {"train_loss": -11.670938491821289, "global_step": 233756, "epoch": 1391} {"train_loss": -11.53196907043457, "global_step": 233757, "epoch": 1391} {"train_loss": -11.60838508605957, "global_step": 233758, "epoch": 1391} {"train_loss": -11.66099739074707, "global_step": 233759, "epoch": 1391} {"train_loss": -11.59765625, "global_step": 233760, "epoch": 1391} {"train_loss": -11.40463924407959, "global_step": 233761, "epoch": 1391} {"train_loss": -11.530019760131836, "global_step": 233762, "epoch": 1391} {"train_loss": -10.897075653076172, "global_step": 233763, "epoch": 1391} {"train_loss": -11.832828521728516, "global_step": 233764, "epoch": 1391} {"train_loss": -11.367467880249023, "global_step": 233765, "epoch": 1391} {"train_loss": -11.685895919799805, "global_step": 233766, "epoch": 1391} {"train_loss": -11.658793449401855, "global_step": 233767, "epoch": 1391} {"train_loss": -11.363565444946289, "global_step": 233768, "epoch": 1391} {"train_loss": -11.765976905822754, "global_step": 233769, "epoch": 1391} {"train_loss": -11.715720176696777, "global_step": 233770, "epoch": 1391} {"train_loss": -11.85287094116211, "global_step": 233771, "epoch": 1391} {"train_loss": -11.632394790649414, "global_step": 233772, "epoch": 1391} {"train_loss": -11.756410598754883, "global_step": 233773, "epoch": 1391} {"train_loss": -11.779559135437012, "global_step": 233774, "epoch": 1391} {"train_loss": -11.673212051391602, "global_step": 233775, "epoch": 1391} {"train_loss": -11.887533187866211, "global_step": 233776, "epoch": 1391} {"train_loss": -11.684907913208008, "global_step": 233777, "epoch": 1391} {"train_loss": -11.82807445526123, "global_step": 233778, "epoch": 1391} {"train_loss": -11.958349227905273, "global_step": 233779, "epoch": 1391} {"train_loss": -11.454145431518555, "global_step": 233780, "epoch": 1391} {"train_loss": -11.848504066467285, "global_step": 233781, "epoch": 1391} {"train_loss": -11.778793334960938, "global_step": 233782, "epoch": 1391} {"train_loss": -11.946783065795898, "global_step": 233783, "epoch": 1391} {"train_loss": -11.956792831420898, "global_step": 233784, "epoch": 1391} {"train_loss": -11.849848747253418, "global_step": 233785, "epoch": 1391} {"train_loss": -11.9469575881958, "global_step": 233786, "epoch": 1391} {"train_loss": -11.879558563232422, "global_step": 233787, "epoch": 1391} {"train_loss": -11.892068862915039, "global_step": 233788, "epoch": 1391} {"train_loss": -11.993551254272461, "global_step": 233789, "epoch": 1391} {"train_loss": -11.844192504882812, "global_step": 233790, "epoch": 1391} {"train_loss": -11.925191879272461, "global_step": 233791, "epoch": 1391} {"train_loss": -12.168668746948242, "global_step": 233792, "epoch": 1391} {"train_loss": -11.855470657348633, "global_step": 233793, "epoch": 1391} {"train_loss": -11.7235689163208, "global_step": 233794, "epoch": 1391} {"train_loss": -11.964208602905273, "global_step": 233795, "epoch": 1391} {"train_loss": -11.88287353515625, "global_step": 233796, "epoch": 1391} {"train_loss": -11.72265338897705, "global_step": 233797, "epoch": 1391} {"train_loss": -11.843871116638184, "global_step": 233798, "epoch": 1391} {"train_loss": -11.844023704528809, "global_step": 233799, "epoch": 1391} {"train_loss": -11.89033317565918, "global_step": 233800, "epoch": 1391} {"train_loss": -11.809303283691406, "global_step": 233801, "epoch": 1391} {"train_loss": -12.065023422241211, "global_step": 233802, "epoch": 1391} {"train_loss": -11.68118667602539, "global_step": 233803, "epoch": 1391} {"train_loss": -12.068406105041504, "global_step": 233804, "epoch": 1391} {"train_loss": -11.971738815307617, "global_step": 233805, "epoch": 1391} {"train_loss": -11.746233940124512, "global_step": 233806, "epoch": 1391} {"train_loss": -11.417895317077637, "global_step": 233807, "epoch": 1391} {"train_loss": -11.552460670471191, "global_step": 233808, "epoch": 1391} {"train_loss": -11.7545166015625, "global_step": 233809, "epoch": 1391} {"train_loss": -11.520626068115234, "global_step": 233810, "epoch": 1391} {"train_loss": -12.013051986694336, "global_step": 233811, "epoch": 1391} {"train_loss": -12.116518020629883, "global_step": 233812, "epoch": 1391} {"train_loss": -11.671045303344727, "global_step": 233813, "epoch": 1391} {"train_loss": -11.819986343383789, "global_step": 233814, "epoch": 1391} {"train_loss": -11.869154930114746, "global_step": 233815, "epoch": 1391} {"train_loss": -11.629565238952637, "global_step": 233816, "epoch": 1391} {"train_loss": -11.548202514648438, "global_step": 233817, "epoch": 1391} {"train_loss": -12.05398178100586, "global_step": 233818, "epoch": 1391} {"train_loss": -11.891408920288086, "global_step": 233819, "epoch": 1391} {"train_loss": -11.814398765563965, "global_step": 233820, "epoch": 1391} {"train_loss": -11.77338981628418, "global_step": 233821, "epoch": 1391} {"train_loss": -12.230925559997559, "global_step": 233822, "epoch": 1391} {"train_loss": -11.513882637023926, "global_step": 233823, "epoch": 1391} {"train_loss": -10.563173294067383, "global_step": 233824, "epoch": 1391} {"train_loss": -11.209349632263184, "global_step": 233825, "epoch": 1391} {"train_loss": -11.858572006225586, "global_step": 233826, "epoch": 1391} {"train_loss": -9.53607177734375, "global_step": 233827, "epoch": 1391} {"train_loss": -9.960439682006836, "global_step": 233828, "epoch": 1391} {"train_loss": -10.999982833862305, "global_step": 233829, "epoch": 1391} {"train_loss": -9.374959945678711, "global_step": 233830, "epoch": 1391} {"train_loss": -10.01396369934082, "global_step": 233831, "epoch": 1391} {"train_loss": -8.888588905334473, "global_step": 233832, "epoch": 1391} {"train_loss": -9.496102333068848, "global_step": 233833, "epoch": 1391} {"train_loss": -10.053184509277344, "global_step": 233834, "epoch": 1391} {"train_loss": -10.593470573425293, "global_step": 233835, "epoch": 1391} {"train_loss": -10.459399223327637, "global_step": 233836, "epoch": 1391} {"train_loss": -10.146486282348633, "global_step": 233837, "epoch": 1391} {"train_loss": -10.714742660522461, "global_step": 233838, "epoch": 1391} {"train_loss": -10.80075740814209, "global_step": 233839, "epoch": 1391} {"train_loss": -10.541364669799805, "global_step": 233840, "epoch": 1391} {"train_loss": -9.534287452697754, "global_step": 233841, "epoch": 1391} {"train_loss": -10.924936294555664, "global_step": 233842, "epoch": 1391} {"train_loss": -9.618274688720703, "global_step": 233843, "epoch": 1391} {"train_loss": -11.26241683959961, "global_step": 233844, "epoch": 1391} {"train_loss": -9.976211547851562, "global_step": 233845, "epoch": 1391} {"train_loss": -10.79903793334961, "global_step": 233846, "epoch": 1391} {"train_loss": -9.800910949707031, "global_step": 233847, "epoch": 1391} {"train_loss": -10.46174144744873, "global_step": 233848, "epoch": 1391} {"train_loss": -10.623815536499023, "global_step": 233849, "epoch": 1391} {"train_loss": -10.579444885253906, "global_step": 233850, "epoch": 1391} {"train_loss": -9.932706832885742, "global_step": 233851, "epoch": 1391} {"train_loss": -9.814477920532227, "global_step": 233852, "epoch": 1391} {"train_loss": -10.911181449890137, "global_step": 233853, "epoch": 1391} {"train_loss": -9.995047569274902, "global_step": 233854, "epoch": 1391} {"train_loss": -11.324922453789483, "global_step": 233855, "epoch": 1391, "val_loss": 264366.1875} {"train_loss": -10.126047134399414, "global_step": 233856, "epoch": 1392} {"train_loss": -10.360734939575195, "global_step": 233857, "epoch": 1392} {"train_loss": -10.5230712890625, "global_step": 233858, "epoch": 1392} {"train_loss": -10.190518379211426, "global_step": 233859, "epoch": 1392} {"train_loss": -11.080862998962402, "global_step": 233860, "epoch": 1392} {"train_loss": -10.529485702514648, "global_step": 233861, "epoch": 1392} {"train_loss": -11.05571174621582, "global_step": 233862, "epoch": 1392} {"train_loss": -10.748638153076172, "global_step": 233863, "epoch": 1392} {"train_loss": -11.431427001953125, "global_step": 233864, "epoch": 1392} {"train_loss": -11.105535507202148, "global_step": 233865, "epoch": 1392} {"train_loss": -11.310396194458008, "global_step": 233866, "epoch": 1392} {"train_loss": -11.33626937866211, "global_step": 233867, "epoch": 1392} {"train_loss": -11.447927474975586, "global_step": 233868, "epoch": 1392} {"train_loss": -11.447113037109375, "global_step": 233869, "epoch": 1392} {"train_loss": -11.143413543701172, "global_step": 233870, "epoch": 1392} {"train_loss": -11.536962509155273, "global_step": 233871, "epoch": 1392} {"train_loss": -11.211263656616211, "global_step": 233872, "epoch": 1392} {"train_loss": -11.511419296264648, "global_step": 233873, "epoch": 1392} {"train_loss": -11.64279556274414, "global_step": 233874, "epoch": 1392} {"train_loss": -11.274423599243164, "global_step": 233875, "epoch": 1392} {"train_loss": -11.54705810546875, "global_step": 233876, "epoch": 1392} {"train_loss": -11.606266975402832, "global_step": 233877, "epoch": 1392} {"train_loss": -11.460257530212402, "global_step": 233878, "epoch": 1392} {"train_loss": -11.450276374816895, "global_step": 233879, "epoch": 1392} {"train_loss": -11.718619346618652, "global_step": 233880, "epoch": 1392} {"train_loss": -11.34119701385498, "global_step": 233881, "epoch": 1392} {"train_loss": -11.723183631896973, "global_step": 233882, "epoch": 1392} {"train_loss": -11.688392639160156, "global_step": 233883, "epoch": 1392} {"train_loss": -11.652992248535156, "global_step": 233884, "epoch": 1392} {"train_loss": -11.51123046875, "global_step": 233885, "epoch": 1392} {"train_loss": -11.83851432800293, "global_step": 233886, "epoch": 1392} {"train_loss": -11.158110618591309, "global_step": 233887, "epoch": 1392} {"train_loss": -11.626304626464844, "global_step": 233888, "epoch": 1392} {"train_loss": -11.486474990844727, "global_step": 233889, "epoch": 1392} {"train_loss": -11.497703552246094, "global_step": 233890, "epoch": 1392} {"train_loss": -11.616029739379883, "global_step": 233891, "epoch": 1392} {"train_loss": -11.497045516967773, "global_step": 233892, "epoch": 1392} {"train_loss": -11.389558792114258, "global_step": 233893, "epoch": 1392} {"train_loss": -11.722164154052734, "global_step": 233894, "epoch": 1392} {"train_loss": -11.349710464477539, "global_step": 233895, "epoch": 1392} {"train_loss": -11.924585342407227, "global_step": 233896, "epoch": 1392} {"train_loss": -11.694914817810059, "global_step": 233897, "epoch": 1392} {"train_loss": -11.531050682067871, "global_step": 233898, "epoch": 1392} {"train_loss": -11.716361999511719, "global_step": 233899, "epoch": 1392} {"train_loss": -11.672822952270508, "global_step": 233900, "epoch": 1392} {"train_loss": -11.69561767578125, "global_step": 233901, "epoch": 1392} {"train_loss": -11.718832015991211, "global_step": 233902, "epoch": 1392} {"train_loss": -11.482623100280762, "global_step": 233903, "epoch": 1392} {"train_loss": -11.837077140808105, "global_step": 233904, "epoch": 1392} {"train_loss": -11.645015716552734, "global_step": 233905, "epoch": 1392} {"train_loss": -11.46348762512207, "global_step": 233906, "epoch": 1392} {"train_loss": -11.8604154586792, "global_step": 233907, "epoch": 1392} {"train_loss": -11.686293601989746, "global_step": 233908, "epoch": 1392} {"train_loss": -11.865300178527832, "global_step": 233909, "epoch": 1392} {"train_loss": -11.594472885131836, "global_step": 233910, "epoch": 1392} {"train_loss": -11.95758056640625, "global_step": 233911, "epoch": 1392} {"train_loss": -11.820978164672852, "global_step": 233912, "epoch": 1392} {"train_loss": -11.999759674072266, "global_step": 233913, "epoch": 1392} {"train_loss": -12.04813003540039, "global_step": 233914, "epoch": 1392} {"train_loss": -11.884004592895508, "global_step": 233915, "epoch": 1392} {"train_loss": -11.945317268371582, "global_step": 233916, "epoch": 1392} {"train_loss": -12.183069229125977, "global_step": 233917, "epoch": 1392} {"train_loss": -11.984018325805664, "global_step": 233918, "epoch": 1392} {"train_loss": -12.014062881469727, "global_step": 233919, "epoch": 1392} {"train_loss": -12.0365629196167, "global_step": 233920, "epoch": 1392} {"train_loss": -12.01241683959961, "global_step": 233921, "epoch": 1392} {"train_loss": -12.22897720336914, "global_step": 233922, "epoch": 1392} {"train_loss": -12.12167739868164, "global_step": 233923, "epoch": 1392} {"train_loss": -12.074995994567871, "global_step": 233924, "epoch": 1392} {"train_loss": -11.986023902893066, "global_step": 233925, "epoch": 1392} {"train_loss": -12.123538970947266, "global_step": 233926, "epoch": 1392} {"train_loss": -12.102182388305664, "global_step": 233927, "epoch": 1392} {"train_loss": -11.906620025634766, "global_step": 233928, "epoch": 1392} {"train_loss": -12.055471420288086, "global_step": 233929, "epoch": 1392} {"train_loss": -12.181368827819824, "global_step": 233930, "epoch": 1392} {"train_loss": -11.865596771240234, "global_step": 233931, "epoch": 1392} {"train_loss": -12.133045196533203, "global_step": 233932, "epoch": 1392} {"train_loss": -11.736353874206543, "global_step": 233933, "epoch": 1392} {"train_loss": -11.79504108428955, "global_step": 233934, "epoch": 1392} {"train_loss": -12.175344467163086, "global_step": 233935, "epoch": 1392} {"train_loss": -12.018514633178711, "global_step": 233936, "epoch": 1392} {"train_loss": -12.027950286865234, "global_step": 233937, "epoch": 1392} {"train_loss": -11.930529594421387, "global_step": 233938, "epoch": 1392} {"train_loss": -12.104564666748047, "global_step": 233939, "epoch": 1392} {"train_loss": -12.199687957763672, "global_step": 233940, "epoch": 1392} {"train_loss": -11.854133605957031, "global_step": 233941, "epoch": 1392} {"train_loss": -12.221563339233398, "global_step": 233942, "epoch": 1392} {"train_loss": -11.987401962280273, "global_step": 233943, "epoch": 1392} {"train_loss": -11.601068496704102, "global_step": 233944, "epoch": 1392} {"train_loss": -11.852514266967773, "global_step": 233945, "epoch": 1392} {"train_loss": -11.857105255126953, "global_step": 233946, "epoch": 1392} {"train_loss": -11.759376525878906, "global_step": 233947, "epoch": 1392} {"train_loss": -11.74519157409668, "global_step": 233948, "epoch": 1392} {"train_loss": -11.847955703735352, "global_step": 233949, "epoch": 1392} {"train_loss": -11.609420776367188, "global_step": 233950, "epoch": 1392} {"train_loss": -10.709718704223633, "global_step": 233951, "epoch": 1392} {"train_loss": -10.959274291992188, "global_step": 233952, "epoch": 1392} {"train_loss": -11.611644744873047, "global_step": 233953, "epoch": 1392} {"train_loss": -11.071540832519531, "global_step": 233954, "epoch": 1392} {"train_loss": -10.263690948486328, "global_step": 233955, "epoch": 1392} {"train_loss": -10.713750839233398, "global_step": 233956, "epoch": 1392} {"train_loss": -10.804618835449219, "global_step": 233957, "epoch": 1392} {"train_loss": -11.199962615966797, "global_step": 233958, "epoch": 1392} {"train_loss": -8.893115997314453, "global_step": 233959, "epoch": 1392} {"train_loss": -9.446720123291016, "global_step": 233960, "epoch": 1392} {"train_loss": -9.560635566711426, "global_step": 233961, "epoch": 1392} {"train_loss": -9.745013236999512, "global_step": 233962, "epoch": 1392} {"train_loss": -9.218461990356445, "global_step": 233963, "epoch": 1392} {"train_loss": -11.104991912841797, "global_step": 233964, "epoch": 1392} {"train_loss": -10.481634140014648, "global_step": 233965, "epoch": 1392} {"train_loss": -11.295999526977539, "global_step": 233966, "epoch": 1392} {"train_loss": -10.244085311889648, "global_step": 233967, "epoch": 1392} {"train_loss": -10.719839096069336, "global_step": 233968, "epoch": 1392} {"train_loss": -11.133186340332031, "global_step": 233969, "epoch": 1392} {"train_loss": -10.500757217407227, "global_step": 233970, "epoch": 1392} {"train_loss": -11.686761856079102, "global_step": 233971, "epoch": 1392} {"train_loss": -10.301156997680664, "global_step": 233972, "epoch": 1392} {"train_loss": -11.12183952331543, "global_step": 233973, "epoch": 1392} {"train_loss": -11.35025405883789, "global_step": 233974, "epoch": 1392} {"train_loss": -10.68546199798584, "global_step": 233975, "epoch": 1392} {"train_loss": -11.19102668762207, "global_step": 233976, "epoch": 1392} {"train_loss": -10.448147773742676, "global_step": 233977, "epoch": 1392} {"train_loss": -11.189786911010742, "global_step": 233978, "epoch": 1392} {"train_loss": -10.705479621887207, "global_step": 233979, "epoch": 1392} {"train_loss": -10.51292610168457, "global_step": 233980, "epoch": 1392} {"train_loss": -11.250852584838867, "global_step": 233981, "epoch": 1392} {"train_loss": -10.471935272216797, "global_step": 233982, "epoch": 1392} {"train_loss": -11.058822631835938, "global_step": 233983, "epoch": 1392} {"train_loss": -10.720236778259277, "global_step": 233984, "epoch": 1392} {"train_loss": -10.655722618103027, "global_step": 233985, "epoch": 1392} {"train_loss": -11.194744110107422, "global_step": 233986, "epoch": 1392} {"train_loss": -10.524041175842285, "global_step": 233987, "epoch": 1392} {"train_loss": -11.15424919128418, "global_step": 233988, "epoch": 1392} {"train_loss": -11.037496566772461, "global_step": 233989, "epoch": 1392} {"train_loss": -10.789470672607422, "global_step": 233990, "epoch": 1392} {"train_loss": -11.385005950927734, "global_step": 233991, "epoch": 1392} {"train_loss": -10.560522079467773, "global_step": 233992, "epoch": 1392} {"train_loss": -11.132387161254883, "global_step": 233993, "epoch": 1392} {"train_loss": -11.110408782958984, "global_step": 233994, "epoch": 1392} {"train_loss": -11.220104217529297, "global_step": 233995, "epoch": 1392} {"train_loss": -11.425912857055664, "global_step": 233996, "epoch": 1392} {"train_loss": -11.468490600585938, "global_step": 233997, "epoch": 1392} {"train_loss": -11.323709487915039, "global_step": 233998, "epoch": 1392} {"train_loss": -11.535527229309082, "global_step": 233999, "epoch": 1392} {"train_loss": -11.364730834960938, "global_step": 234000, "epoch": 1392} {"train_loss": -11.516338348388672, "global_step": 234001, "epoch": 1392} {"train_loss": -11.003381729125977, "global_step": 234002, "epoch": 1392} {"train_loss": -11.328634262084961, "global_step": 234003, "epoch": 1392} {"train_loss": -11.097759246826172, "global_step": 234004, "epoch": 1392} {"train_loss": -11.4379301071167, "global_step": 234005, "epoch": 1392} {"train_loss": -10.986513137817383, "global_step": 234006, "epoch": 1392} {"train_loss": -11.4056396484375, "global_step": 234007, "epoch": 1392} {"train_loss": -11.623237609863281, "global_step": 234008, "epoch": 1392} {"train_loss": -11.129629135131836, "global_step": 234009, "epoch": 1392} {"train_loss": -11.664787292480469, "global_step": 234010, "epoch": 1392} {"train_loss": -11.512955665588379, "global_step": 234011, "epoch": 1392} {"train_loss": -11.577519416809082, "global_step": 234012, "epoch": 1392} {"train_loss": -11.508925437927246, "global_step": 234013, "epoch": 1392} {"train_loss": -11.623445510864258, "global_step": 234014, "epoch": 1392} {"train_loss": -11.388611793518066, "global_step": 234015, "epoch": 1392} {"train_loss": -11.584821701049805, "global_step": 234016, "epoch": 1392} {"train_loss": -11.607002258300781, "global_step": 234017, "epoch": 1392} {"train_loss": -11.586478233337402, "global_step": 234018, "epoch": 1392} {"train_loss": -11.740198135375977, "global_step": 234019, "epoch": 1392} {"train_loss": -11.604385375976562, "global_step": 234020, "epoch": 1392} {"train_loss": -11.597160339355469, "global_step": 234021, "epoch": 1392} {"train_loss": -11.886113166809082, "global_step": 234022, "epoch": 1392} {"train_loss": -11.372288777714683, "global_step": 234023, "epoch": 1392, "val_loss": 262740.53125} {"train_loss": -11.71263313293457, "global_step": 234024, "epoch": 1393} {"train_loss": -11.751350402832031, "global_step": 234025, "epoch": 1393} {"train_loss": -11.920412063598633, "global_step": 234026, "epoch": 1393} {"train_loss": -11.810782432556152, "global_step": 234027, "epoch": 1393} {"train_loss": -11.907076835632324, "global_step": 234028, "epoch": 1393} {"train_loss": -11.908930778503418, "global_step": 234029, "epoch": 1393} {"train_loss": -11.848078727722168, "global_step": 234030, "epoch": 1393} {"train_loss": -11.861140251159668, "global_step": 234031, "epoch": 1393} {"train_loss": -11.94899845123291, "global_step": 234032, "epoch": 1393} {"train_loss": -11.73245620727539, "global_step": 234033, "epoch": 1393} {"train_loss": -11.938217163085938, "global_step": 234034, "epoch": 1393} {"train_loss": -11.934192657470703, "global_step": 234035, "epoch": 1393} {"train_loss": -11.800480842590332, "global_step": 234036, "epoch": 1393} {"train_loss": -12.024702072143555, "global_step": 234037, "epoch": 1393} {"train_loss": -11.869010925292969, "global_step": 234038, "epoch": 1393} {"train_loss": -11.687165260314941, "global_step": 234039, "epoch": 1393} {"train_loss": -11.780569076538086, "global_step": 234040, "epoch": 1393} {"train_loss": -11.646461486816406, "global_step": 234041, "epoch": 1393} {"train_loss": -11.730867385864258, "global_step": 234042, "epoch": 1393} {"train_loss": -11.825850486755371, "global_step": 234043, "epoch": 1393} {"train_loss": -11.723733901977539, "global_step": 234044, "epoch": 1393} {"train_loss": -11.769968032836914, "global_step": 234045, "epoch": 1393} {"train_loss": -11.563777923583984, "global_step": 234046, "epoch": 1393} {"train_loss": -11.776201248168945, "global_step": 234047, "epoch": 1393} {"train_loss": -11.918639183044434, "global_step": 234048, "epoch": 1393} {"train_loss": -11.481419563293457, "global_step": 234049, "epoch": 1393} {"train_loss": -11.864075660705566, "global_step": 234050, "epoch": 1393} {"train_loss": -11.87399959564209, "global_step": 234051, "epoch": 1393} {"train_loss": -11.491064071655273, "global_step": 234052, "epoch": 1393} {"train_loss": -11.794103622436523, "global_step": 234053, "epoch": 1393} {"train_loss": -11.756175994873047, "global_step": 234054, "epoch": 1393} {"train_loss": -11.7024564743042, "global_step": 234055, "epoch": 1393} {"train_loss": -11.937529563903809, "global_step": 234056, "epoch": 1393} {"train_loss": -11.576744079589844, "global_step": 234057, "epoch": 1393} {"train_loss": -12.065986633300781, "global_step": 234058, "epoch": 1393} {"train_loss": -11.722593307495117, "global_step": 234059, "epoch": 1393} {"train_loss": -11.609163284301758, "global_step": 234060, "epoch": 1393} {"train_loss": -11.994781494140625, "global_step": 234061, "epoch": 1393} {"train_loss": -12.03287124633789, "global_step": 234062, "epoch": 1393} {"train_loss": -12.064933776855469, "global_step": 234063, "epoch": 1393} {"train_loss": -11.993402481079102, "global_step": 234064, "epoch": 1393} {"train_loss": -11.90864372253418, "global_step": 234065, "epoch": 1393} {"train_loss": -11.986326217651367, "global_step": 234066, "epoch": 1393} {"train_loss": -11.452152252197266, "global_step": 234067, "epoch": 1393} {"train_loss": -12.138336181640625, "global_step": 234068, "epoch": 1393} {"train_loss": -11.756990432739258, "global_step": 234069, "epoch": 1393} {"train_loss": -11.84023666381836, "global_step": 234070, "epoch": 1393} {"train_loss": -11.660806655883789, "global_step": 234071, "epoch": 1393} {"train_loss": -11.484908103942871, "global_step": 234072, "epoch": 1393} {"train_loss": -11.750911712646484, "global_step": 234073, "epoch": 1393} {"train_loss": -11.678939819335938, "global_step": 234074, "epoch": 1393} {"train_loss": -11.242055892944336, "global_step": 234075, "epoch": 1393} {"train_loss": -11.683547973632812, "global_step": 234076, "epoch": 1393} {"train_loss": -11.92114543914795, "global_step": 234077, "epoch": 1393} {"train_loss": -11.482294082641602, "global_step": 234078, "epoch": 1393} {"train_loss": -12.006479263305664, "global_step": 234079, "epoch": 1393} {"train_loss": -10.878822326660156, "global_step": 234080, "epoch": 1393} {"train_loss": -11.934823989868164, "global_step": 234081, "epoch": 1393} {"train_loss": -11.775458335876465, "global_step": 234082, "epoch": 1393} {"train_loss": -11.483643531799316, "global_step": 234083, "epoch": 1393} {"train_loss": -11.872954368591309, "global_step": 234084, "epoch": 1393} {"train_loss": -11.897756576538086, "global_step": 234085, "epoch": 1393} {"train_loss": -11.744132995605469, "global_step": 234086, "epoch": 1393} {"train_loss": -11.93307876586914, "global_step": 234087, "epoch": 1393} {"train_loss": -11.647480010986328, "global_step": 234088, "epoch": 1393} {"train_loss": -11.882244110107422, "global_step": 234089, "epoch": 1393} {"train_loss": -11.606425285339355, "global_step": 234090, "epoch": 1393} {"train_loss": -11.236196517944336, "global_step": 234091, "epoch": 1393} {"train_loss": -11.643693923950195, "global_step": 234092, "epoch": 1393} {"train_loss": -11.417058944702148, "global_step": 234093, "epoch": 1393} {"train_loss": -11.084126472473145, "global_step": 234094, "epoch": 1393} {"train_loss": -11.994577407836914, "global_step": 234095, "epoch": 1393} {"train_loss": -11.578723907470703, "global_step": 234096, "epoch": 1393} {"train_loss": -11.56939697265625, "global_step": 234097, "epoch": 1393} {"train_loss": -11.716554641723633, "global_step": 234098, "epoch": 1393} {"train_loss": -11.159357070922852, "global_step": 234099, "epoch": 1393} {"train_loss": -11.668583869934082, "global_step": 234100, "epoch": 1393} {"train_loss": -11.916454315185547, "global_step": 234101, "epoch": 1393} {"train_loss": -11.214313507080078, "global_step": 234102, "epoch": 1393} {"train_loss": -11.642942428588867, "global_step": 234103, "epoch": 1393} {"train_loss": -11.892755508422852, "global_step": 234104, "epoch": 1393} {"train_loss": -11.128494262695312, "global_step": 234105, "epoch": 1393} {"train_loss": -11.971001625061035, "global_step": 234106, "epoch": 1393} {"train_loss": -11.416230201721191, "global_step": 234107, "epoch": 1393} {"train_loss": -11.632255554199219, "global_step": 234108, "epoch": 1393} {"train_loss": -11.705079078674316, "global_step": 234109, "epoch": 1393} {"train_loss": -11.468927383422852, "global_step": 234110, "epoch": 1393} {"train_loss": -11.797656059265137, "global_step": 234111, "epoch": 1393} {"train_loss": -11.465770721435547, "global_step": 234112, "epoch": 1393} {"train_loss": -10.937747955322266, "global_step": 234113, "epoch": 1393} {"train_loss": -10.993335723876953, "global_step": 234114, "epoch": 1393} {"train_loss": -11.311141967773438, "global_step": 234115, "epoch": 1393} {"train_loss": -11.288061141967773, "global_step": 234116, "epoch": 1393} {"train_loss": -11.451117515563965, "global_step": 234117, "epoch": 1393} {"train_loss": -11.008687019348145, "global_step": 234118, "epoch": 1393} {"train_loss": -11.289108276367188, "global_step": 234119, "epoch": 1393} {"train_loss": -10.862585067749023, "global_step": 234120, "epoch": 1393} {"train_loss": -11.285406112670898, "global_step": 234121, "epoch": 1393} {"train_loss": -11.182811737060547, "global_step": 234122, "epoch": 1393} {"train_loss": -10.706232070922852, "global_step": 234123, "epoch": 1393} {"train_loss": -11.423870086669922, "global_step": 234124, "epoch": 1393} {"train_loss": -10.525217056274414, "global_step": 234125, "epoch": 1393} {"train_loss": -10.048606872558594, "global_step": 234126, "epoch": 1393} {"train_loss": -11.268770217895508, "global_step": 234127, "epoch": 1393} {"train_loss": -10.723262786865234, "global_step": 234128, "epoch": 1393} {"train_loss": -10.908256530761719, "global_step": 234129, "epoch": 1393} {"train_loss": -11.133049964904785, "global_step": 234130, "epoch": 1393} {"train_loss": -11.182476043701172, "global_step": 234131, "epoch": 1393} {"train_loss": -11.649219512939453, "global_step": 234132, "epoch": 1393} {"train_loss": -10.876903533935547, "global_step": 234133, "epoch": 1393} {"train_loss": -10.663376808166504, "global_step": 234134, "epoch": 1393} {"train_loss": -11.335675239562988, "global_step": 234135, "epoch": 1393} {"train_loss": -10.969547271728516, "global_step": 234136, "epoch": 1393} {"train_loss": -11.693148612976074, "global_step": 234137, "epoch": 1393} {"train_loss": -11.308809280395508, "global_step": 234138, "epoch": 1393} {"train_loss": -11.468549728393555, "global_step": 234139, "epoch": 1393} {"train_loss": -11.129197120666504, "global_step": 234140, "epoch": 1393} {"train_loss": -11.704364776611328, "global_step": 234141, "epoch": 1393} {"train_loss": -11.343761444091797, "global_step": 234142, "epoch": 1393} {"train_loss": -11.608911514282227, "global_step": 234143, "epoch": 1393} {"train_loss": -11.783509254455566, "global_step": 234144, "epoch": 1393} {"train_loss": -11.261743545532227, "global_step": 234145, "epoch": 1393} {"train_loss": -11.896422386169434, "global_step": 234146, "epoch": 1393} {"train_loss": -11.48041820526123, "global_step": 234147, "epoch": 1393} {"train_loss": -11.544816970825195, "global_step": 234148, "epoch": 1393} {"train_loss": -11.641912460327148, "global_step": 234149, "epoch": 1393} {"train_loss": -11.56761646270752, "global_step": 234150, "epoch": 1393} {"train_loss": -11.948851585388184, "global_step": 234151, "epoch": 1393} {"train_loss": -11.461021423339844, "global_step": 234152, "epoch": 1393} {"train_loss": -11.74311637878418, "global_step": 234153, "epoch": 1393} {"train_loss": -11.225693702697754, "global_step": 234154, "epoch": 1393} {"train_loss": -11.850732803344727, "global_step": 234155, "epoch": 1393} {"train_loss": -11.634220123291016, "global_step": 234156, "epoch": 1393} {"train_loss": -11.805058479309082, "global_step": 234157, "epoch": 1393} {"train_loss": -11.673075675964355, "global_step": 234158, "epoch": 1393} {"train_loss": -11.861043930053711, "global_step": 234159, "epoch": 1393} {"train_loss": -11.62016487121582, "global_step": 234160, "epoch": 1393} {"train_loss": -11.663309097290039, "global_step": 234161, "epoch": 1393} {"train_loss": -11.803033828735352, "global_step": 234162, "epoch": 1393} {"train_loss": -11.757774353027344, "global_step": 234163, "epoch": 1393} {"train_loss": -11.777950286865234, "global_step": 234164, "epoch": 1393} {"train_loss": -11.827184677124023, "global_step": 234165, "epoch": 1393} {"train_loss": -11.710619926452637, "global_step": 234166, "epoch": 1393} {"train_loss": -11.690735816955566, "global_step": 234167, "epoch": 1393} {"train_loss": -11.906590461730957, "global_step": 234168, "epoch": 1393} {"train_loss": -11.652819633483887, "global_step": 234169, "epoch": 1393} {"train_loss": -11.816503524780273, "global_step": 234170, "epoch": 1393} {"train_loss": -11.719261169433594, "global_step": 234171, "epoch": 1393} {"train_loss": -11.936285018920898, "global_step": 234172, "epoch": 1393} {"train_loss": -11.814788818359375, "global_step": 234173, "epoch": 1393} {"train_loss": -11.858909606933594, "global_step": 234174, "epoch": 1393} {"train_loss": -11.406346321105957, "global_step": 234175, "epoch": 1393} {"train_loss": -11.980305671691895, "global_step": 234176, "epoch": 1393} {"train_loss": -11.986383438110352, "global_step": 234177, "epoch": 1393} {"train_loss": -11.715173721313477, "global_step": 234178, "epoch": 1393} {"train_loss": -11.509044647216797, "global_step": 234179, "epoch": 1393} {"train_loss": -11.45977783203125, "global_step": 234180, "epoch": 1393} {"train_loss": -11.540975570678711, "global_step": 234181, "epoch": 1393} {"train_loss": -11.471187591552734, "global_step": 234182, "epoch": 1393} {"train_loss": -11.370022773742676, "global_step": 234183, "epoch": 1393} {"train_loss": -11.30328369140625, "global_step": 234184, "epoch": 1393} {"train_loss": -11.225383758544922, "global_step": 234185, "epoch": 1393} {"train_loss": -11.642940521240234, "global_step": 234186, "epoch": 1393} {"train_loss": -11.535369873046875, "global_step": 234187, "epoch": 1393} {"train_loss": -11.182244300842285, "global_step": 234188, "epoch": 1393} {"train_loss": -11.946256637573242, "global_step": 234189, "epoch": 1393} {"train_loss": -11.365432739257812, "global_step": 234190, "epoch": 1393} {"train_loss": -11.595153110367912, "global_step": 234191, "epoch": 1393, "val_loss": 263070.96875} {"train_loss": -11.846929550170898, "global_step": 234192, "epoch": 1394} {"train_loss": -11.583189964294434, "global_step": 234193, "epoch": 1394} {"train_loss": -11.8826904296875, "global_step": 234194, "epoch": 1394} {"train_loss": -11.728867530822754, "global_step": 234195, "epoch": 1394} {"train_loss": -11.759453773498535, "global_step": 234196, "epoch": 1394} {"train_loss": -11.67945671081543, "global_step": 234197, "epoch": 1394} {"train_loss": -11.883596420288086, "global_step": 234198, "epoch": 1394} {"train_loss": -11.948151588439941, "global_step": 234199, "epoch": 1394} {"train_loss": -11.836542129516602, "global_step": 234200, "epoch": 1394} {"train_loss": -11.883444786071777, "global_step": 234201, "epoch": 1394} {"train_loss": -11.482965469360352, "global_step": 234202, "epoch": 1394} {"train_loss": -11.568153381347656, "global_step": 234203, "epoch": 1394} {"train_loss": -11.921989440917969, "global_step": 234204, "epoch": 1394} {"train_loss": -11.75053882598877, "global_step": 234205, "epoch": 1394} {"train_loss": -11.547950744628906, "global_step": 234206, "epoch": 1394} {"train_loss": -11.828460693359375, "global_step": 234207, "epoch": 1394} {"train_loss": -11.838176727294922, "global_step": 234208, "epoch": 1394} {"train_loss": -11.60935115814209, "global_step": 234209, "epoch": 1394} {"train_loss": -11.809039115905762, "global_step": 234210, "epoch": 1394} {"train_loss": -11.10145378112793, "global_step": 234211, "epoch": 1394} {"train_loss": -11.716766357421875, "global_step": 234212, "epoch": 1394} {"train_loss": -12.027677536010742, "global_step": 234213, "epoch": 1394} {"train_loss": -11.512723922729492, "global_step": 234214, "epoch": 1394} {"train_loss": -11.083313941955566, "global_step": 234215, "epoch": 1394} {"train_loss": -11.562826156616211, "global_step": 234216, "epoch": 1394} {"train_loss": -11.629122734069824, "global_step": 234217, "epoch": 1394} {"train_loss": -11.191498756408691, "global_step": 234218, "epoch": 1394} {"train_loss": -11.774730682373047, "global_step": 234219, "epoch": 1394} {"train_loss": -11.821956634521484, "global_step": 234220, "epoch": 1394} {"train_loss": -11.306375503540039, "global_step": 234221, "epoch": 1394} {"train_loss": -11.485567092895508, "global_step": 234222, "epoch": 1394} {"train_loss": -11.864194869995117, "global_step": 234223, "epoch": 1394} {"train_loss": -11.598224639892578, "global_step": 234224, "epoch": 1394} {"train_loss": -11.66804313659668, "global_step": 234225, "epoch": 1394} {"train_loss": -11.902555465698242, "global_step": 234226, "epoch": 1394} {"train_loss": -11.98207950592041, "global_step": 234227, "epoch": 1394} {"train_loss": -11.404720306396484, "global_step": 234228, "epoch": 1394} {"train_loss": -11.784358024597168, "global_step": 234229, "epoch": 1394} {"train_loss": -11.785725593566895, "global_step": 234230, "epoch": 1394} {"train_loss": -12.023784637451172, "global_step": 234231, "epoch": 1394} {"train_loss": -11.776581764221191, "global_step": 234232, "epoch": 1394} {"train_loss": -11.764935493469238, "global_step": 234233, "epoch": 1394} {"train_loss": -11.810657501220703, "global_step": 234234, "epoch": 1394} {"train_loss": -11.893606185913086, "global_step": 234235, "epoch": 1394} {"train_loss": -12.203083038330078, "global_step": 234236, "epoch": 1394} {"train_loss": -11.673709869384766, "global_step": 234237, "epoch": 1394} {"train_loss": -11.397892951965332, "global_step": 234238, "epoch": 1394} {"train_loss": -11.536834716796875, "global_step": 234239, "epoch": 1394} {"train_loss": -11.705309867858887, "global_step": 234240, "epoch": 1394} {"train_loss": -11.226129531860352, "global_step": 234241, "epoch": 1394} {"train_loss": -11.332271575927734, "global_step": 234242, "epoch": 1394} {"train_loss": -11.372126579284668, "global_step": 234243, "epoch": 1394} {"train_loss": -10.910937309265137, "global_step": 234244, "epoch": 1394} {"train_loss": -10.582464218139648, "global_step": 234245, "epoch": 1394} {"train_loss": -11.927115440368652, "global_step": 234246, "epoch": 1394} {"train_loss": -10.532211303710938, "global_step": 234247, "epoch": 1394} {"train_loss": -11.848913192749023, "global_step": 234248, "epoch": 1394} {"train_loss": -11.111503601074219, "global_step": 234249, "epoch": 1394} {"train_loss": -11.398148536682129, "global_step": 234250, "epoch": 1394} {"train_loss": -11.374098777770996, "global_step": 234251, "epoch": 1394} {"train_loss": -10.96664047241211, "global_step": 234252, "epoch": 1394} {"train_loss": -10.9657564163208, "global_step": 234253, "epoch": 1394} {"train_loss": -10.937976837158203, "global_step": 234254, "epoch": 1394} {"train_loss": -10.416629791259766, "global_step": 234255, "epoch": 1394} {"train_loss": -10.702281951904297, "global_step": 234256, "epoch": 1394} {"train_loss": -10.526935577392578, "global_step": 234257, "epoch": 1394} {"train_loss": -9.641136169433594, "global_step": 234258, "epoch": 1394} {"train_loss": -11.170621871948242, "global_step": 234259, "epoch": 1394} {"train_loss": -10.518421173095703, "global_step": 234260, "epoch": 1394} {"train_loss": -10.467304229736328, "global_step": 234261, "epoch": 1394} {"train_loss": -10.881179809570312, "global_step": 234262, "epoch": 1394} {"train_loss": -10.791179656982422, "global_step": 234263, "epoch": 1394} {"train_loss": -11.587516784667969, "global_step": 234264, "epoch": 1394} {"train_loss": -11.224964141845703, "global_step": 234265, "epoch": 1394} {"train_loss": -11.343687057495117, "global_step": 234266, "epoch": 1394} {"train_loss": -11.364644050598145, "global_step": 234267, "epoch": 1394} {"train_loss": -11.21249008178711, "global_step": 234268, "epoch": 1394} {"train_loss": -11.536802291870117, "global_step": 234269, "epoch": 1394} {"train_loss": -11.696598052978516, "global_step": 234270, "epoch": 1394} {"train_loss": -11.59020709991455, "global_step": 234271, "epoch": 1394} {"train_loss": -11.739169120788574, "global_step": 234272, "epoch": 1394} {"train_loss": -11.864439010620117, "global_step": 234273, "epoch": 1394} {"train_loss": -11.636359214782715, "global_step": 234274, "epoch": 1394} {"train_loss": -11.83612060546875, "global_step": 234275, "epoch": 1394} {"train_loss": -11.658483505249023, "global_step": 234276, "epoch": 1394} {"train_loss": -11.950752258300781, "global_step": 234277, "epoch": 1394} {"train_loss": -11.710086822509766, "global_step": 234278, "epoch": 1394} {"train_loss": -11.86724853515625, "global_step": 234279, "epoch": 1394} {"train_loss": -11.870635986328125, "global_step": 234280, "epoch": 1394} {"train_loss": -11.69253158569336, "global_step": 234281, "epoch": 1394} {"train_loss": -11.818758964538574, "global_step": 234282, "epoch": 1394} {"train_loss": -11.744766235351562, "global_step": 234283, "epoch": 1394} {"train_loss": -11.703775405883789, "global_step": 234284, "epoch": 1394} {"train_loss": -11.715585708618164, "global_step": 234285, "epoch": 1394} {"train_loss": -11.862297058105469, "global_step": 234286, "epoch": 1394} {"train_loss": -11.25831413269043, "global_step": 234287, "epoch": 1394} {"train_loss": -11.983181953430176, "global_step": 234288, "epoch": 1394} {"train_loss": -11.65667724609375, "global_step": 234289, "epoch": 1394} {"train_loss": -11.603822708129883, "global_step": 234290, "epoch": 1394} {"train_loss": -11.712287902832031, "global_step": 234291, "epoch": 1394} {"train_loss": -11.492120742797852, "global_step": 234292, "epoch": 1394} {"train_loss": -11.706449508666992, "global_step": 234293, "epoch": 1394} {"train_loss": -11.732248306274414, "global_step": 234294, "epoch": 1394} {"train_loss": -10.49958610534668, "global_step": 234295, "epoch": 1394} {"train_loss": -11.583187103271484, "global_step": 234296, "epoch": 1394} {"train_loss": -11.540639877319336, "global_step": 234297, "epoch": 1394} {"train_loss": -10.6289701461792, "global_step": 234298, "epoch": 1394} {"train_loss": -11.740701675415039, "global_step": 234299, "epoch": 1394} {"train_loss": -10.826583862304688, "global_step": 234300, "epoch": 1394} {"train_loss": -9.880709648132324, "global_step": 234301, "epoch": 1394} {"train_loss": -11.606829643249512, "global_step": 234302, "epoch": 1394} {"train_loss": -10.234349250793457, "global_step": 234303, "epoch": 1394} {"train_loss": -11.253639221191406, "global_step": 234304, "epoch": 1394} {"train_loss": -10.949665069580078, "global_step": 234305, "epoch": 1394} {"train_loss": -10.664636611938477, "global_step": 234306, "epoch": 1394} {"train_loss": -10.87753677368164, "global_step": 234307, "epoch": 1394} {"train_loss": -9.307644844055176, "global_step": 234308, "epoch": 1394} {"train_loss": -9.949761390686035, "global_step": 234309, "epoch": 1394} {"train_loss": -11.029219627380371, "global_step": 234310, "epoch": 1394} {"train_loss": -10.152087211608887, "global_step": 234311, "epoch": 1394} {"train_loss": -10.598124504089355, "global_step": 234312, "epoch": 1394} {"train_loss": -11.031179428100586, "global_step": 234313, "epoch": 1394} {"train_loss": -10.127127647399902, "global_step": 234314, "epoch": 1394} {"train_loss": -10.859247207641602, "global_step": 234315, "epoch": 1394} {"train_loss": -9.47563362121582, "global_step": 234316, "epoch": 1394} {"train_loss": -10.551523208618164, "global_step": 234317, "epoch": 1394} {"train_loss": -9.605554580688477, "global_step": 234318, "epoch": 1394} {"train_loss": -10.635431289672852, "global_step": 234319, "epoch": 1394} {"train_loss": -9.837109565734863, "global_step": 234320, "epoch": 1394} {"train_loss": -10.917478561401367, "global_step": 234321, "epoch": 1394} {"train_loss": -10.929738998413086, "global_step": 234322, "epoch": 1394} {"train_loss": -10.755279541015625, "global_step": 234323, "epoch": 1394} {"train_loss": -11.34868049621582, "global_step": 234324, "epoch": 1394} {"train_loss": -10.499679565429688, "global_step": 234325, "epoch": 1394} {"train_loss": -10.858983993530273, "global_step": 234326, "epoch": 1394} {"train_loss": -10.967849731445312, "global_step": 234327, "epoch": 1394} {"train_loss": -10.742606163024902, "global_step": 234328, "epoch": 1394} {"train_loss": -10.746153831481934, "global_step": 234329, "epoch": 1394} {"train_loss": -11.101263999938965, "global_step": 234330, "epoch": 1394} {"train_loss": -11.237627983093262, "global_step": 234331, "epoch": 1394} {"train_loss": -10.947669982910156, "global_step": 234332, "epoch": 1394} {"train_loss": -11.192501068115234, "global_step": 234333, "epoch": 1394} {"train_loss": -10.897077560424805, "global_step": 234334, "epoch": 1394} {"train_loss": -11.500680923461914, "global_step": 234335, "epoch": 1394} {"train_loss": -11.133224487304688, "global_step": 234336, "epoch": 1394} {"train_loss": -11.66130542755127, "global_step": 234337, "epoch": 1394} {"train_loss": -10.702203750610352, "global_step": 234338, "epoch": 1394} {"train_loss": -11.073867797851562, "global_step": 234339, "epoch": 1394} {"train_loss": -11.026481628417969, "global_step": 234340, "epoch": 1394} {"train_loss": -11.019388198852539, "global_step": 234341, "epoch": 1394} {"train_loss": -11.297422409057617, "global_step": 234342, "epoch": 1394} {"train_loss": -11.149336814880371, "global_step": 234343, "epoch": 1394} {"train_loss": -11.517698287963867, "global_step": 234344, "epoch": 1394} {"train_loss": -11.157821655273438, "global_step": 234345, "epoch": 1394} {"train_loss": -11.642433166503906, "global_step": 234346, "epoch": 1394} {"train_loss": -11.537729263305664, "global_step": 234347, "epoch": 1394} {"train_loss": -11.117290496826172, "global_step": 234348, "epoch": 1394} {"train_loss": -11.670129776000977, "global_step": 234349, "epoch": 1394} {"train_loss": -11.448199272155762, "global_step": 234350, "epoch": 1394} {"train_loss": -11.5164213180542, "global_step": 234351, "epoch": 1394} {"train_loss": -11.289284706115723, "global_step": 234352, "epoch": 1394} {"train_loss": -11.496026992797852, "global_step": 234353, "epoch": 1394} {"train_loss": -11.359044075012207, "global_step": 234354, "epoch": 1394} {"train_loss": -11.444437980651855, "global_step": 234355, "epoch": 1394} {"train_loss": -11.709354400634766, "global_step": 234356, "epoch": 1394} {"train_loss": -11.341748237609863, "global_step": 234357, "epoch": 1394} {"train_loss": -11.645090103149414, "global_step": 234358, "epoch": 1394} {"train_loss": -11.304552606173925, "global_step": 234359, "epoch": 1394, "val_loss": 263385.28125} {"train_loss": -11.546289443969727, "global_step": 234360, "epoch": 1395} {"train_loss": -11.689781188964844, "global_step": 234361, "epoch": 1395} {"train_loss": -11.489442825317383, "global_step": 234362, "epoch": 1395} {"train_loss": -11.850428581237793, "global_step": 234363, "epoch": 1395} {"train_loss": -11.642614364624023, "global_step": 234364, "epoch": 1395} {"train_loss": -11.616543769836426, "global_step": 234365, "epoch": 1395} {"train_loss": -11.758010864257812, "global_step": 234366, "epoch": 1395} {"train_loss": -11.825372695922852, "global_step": 234367, "epoch": 1395} {"train_loss": -11.748403549194336, "global_step": 234368, "epoch": 1395} {"train_loss": -11.8472261428833, "global_step": 234369, "epoch": 1395} {"train_loss": -11.884428024291992, "global_step": 234370, "epoch": 1395} {"train_loss": -11.738120079040527, "global_step": 234371, "epoch": 1395} {"train_loss": -11.638837814331055, "global_step": 234372, "epoch": 1395} {"train_loss": -11.934493064880371, "global_step": 234373, "epoch": 1395} {"train_loss": -11.811517715454102, "global_step": 234374, "epoch": 1395} {"train_loss": -12.057133674621582, "global_step": 234375, "epoch": 1395} {"train_loss": -11.901420593261719, "global_step": 234376, "epoch": 1395} {"train_loss": -11.938011169433594, "global_step": 234377, "epoch": 1395} {"train_loss": -12.015203475952148, "global_step": 234378, "epoch": 1395} {"train_loss": -11.83544635772705, "global_step": 234379, "epoch": 1395} {"train_loss": -12.053671836853027, "global_step": 234380, "epoch": 1395} {"train_loss": -11.78567886352539, "global_step": 234381, "epoch": 1395} {"train_loss": -11.96104621887207, "global_step": 234382, "epoch": 1395} {"train_loss": -11.905738830566406, "global_step": 234383, "epoch": 1395} {"train_loss": -12.156139373779297, "global_step": 234384, "epoch": 1395} {"train_loss": -12.162166595458984, "global_step": 234385, "epoch": 1395} {"train_loss": -11.969635009765625, "global_step": 234386, "epoch": 1395} {"train_loss": -12.236103057861328, "global_step": 234387, "epoch": 1395} {"train_loss": -12.023218154907227, "global_step": 234388, "epoch": 1395} {"train_loss": -11.985392570495605, "global_step": 234389, "epoch": 1395} {"train_loss": -11.929051399230957, "global_step": 234390, "epoch": 1395} {"train_loss": -12.10299301147461, "global_step": 234391, "epoch": 1395} {"train_loss": -11.911165237426758, "global_step": 234392, "epoch": 1395} {"train_loss": -12.11792278289795, "global_step": 234393, "epoch": 1395} {"train_loss": -12.14203929901123, "global_step": 234394, "epoch": 1395} {"train_loss": -11.941997528076172, "global_step": 234395, "epoch": 1395} {"train_loss": -12.151876449584961, "global_step": 234396, "epoch": 1395} {"train_loss": -11.912029266357422, "global_step": 234397, "epoch": 1395} {"train_loss": -12.128780364990234, "global_step": 234398, "epoch": 1395} {"train_loss": -12.246519088745117, "global_step": 234399, "epoch": 1395} {"train_loss": -12.096637725830078, "global_step": 234400, "epoch": 1395} {"train_loss": -12.193358421325684, "global_step": 234401, "epoch": 1395} {"train_loss": -12.060490608215332, "global_step": 234402, "epoch": 1395} {"train_loss": -12.072383880615234, "global_step": 234403, "epoch": 1395} {"train_loss": -12.099645614624023, "global_step": 234404, "epoch": 1395} {"train_loss": -11.850038528442383, "global_step": 234405, "epoch": 1395} {"train_loss": -12.201778411865234, "global_step": 234406, "epoch": 1395} {"train_loss": -12.008073806762695, "global_step": 234407, "epoch": 1395} {"train_loss": -12.115425109863281, "global_step": 234408, "epoch": 1395} {"train_loss": -11.599632263183594, "global_step": 234409, "epoch": 1395} {"train_loss": -11.987653732299805, "global_step": 234410, "epoch": 1395} {"train_loss": -12.089590072631836, "global_step": 234411, "epoch": 1395} {"train_loss": -12.056824684143066, "global_step": 234412, "epoch": 1395} {"train_loss": -12.230403900146484, "global_step": 234413, "epoch": 1395} {"train_loss": -11.637510299682617, "global_step": 234414, "epoch": 1395} {"train_loss": -11.86440658569336, "global_step": 234415, "epoch": 1395} {"train_loss": -11.144872665405273, "global_step": 234416, "epoch": 1395} {"train_loss": -11.544286727905273, "global_step": 234417, "epoch": 1395} {"train_loss": -11.048759460449219, "global_step": 234418, "epoch": 1395} {"train_loss": -11.41158676147461, "global_step": 234419, "epoch": 1395} {"train_loss": -11.150611877441406, "global_step": 234420, "epoch": 1395} {"train_loss": -9.059983253479004, "global_step": 234421, "epoch": 1395} {"train_loss": -10.744148254394531, "global_step": 234422, "epoch": 1395} {"train_loss": -9.918210983276367, "global_step": 234423, "epoch": 1395} {"train_loss": -10.326628684997559, "global_step": 234424, "epoch": 1395} {"train_loss": -8.972167015075684, "global_step": 234425, "epoch": 1395} {"train_loss": -8.944297790527344, "global_step": 234426, "epoch": 1395} {"train_loss": -10.481017112731934, "global_step": 234427, "epoch": 1395} {"train_loss": -9.80174732208252, "global_step": 234428, "epoch": 1395} {"train_loss": -8.663040161132812, "global_step": 234429, "epoch": 1395} {"train_loss": -10.261585235595703, "global_step": 234430, "epoch": 1395} {"train_loss": -9.05948257446289, "global_step": 234431, "epoch": 1395} {"train_loss": -9.40689468383789, "global_step": 234432, "epoch": 1395} {"train_loss": -9.553049087524414, "global_step": 234433, "epoch": 1395} {"train_loss": -10.119148254394531, "global_step": 234434, "epoch": 1395} {"train_loss": -10.226133346557617, "global_step": 234435, "epoch": 1395} {"train_loss": -9.161678314208984, "global_step": 234436, "epoch": 1395} {"train_loss": -10.067357063293457, "global_step": 234437, "epoch": 1395} {"train_loss": -9.370015144348145, "global_step": 234438, "epoch": 1395} {"train_loss": -9.538288116455078, "global_step": 234439, "epoch": 1395} {"train_loss": -10.963457107543945, "global_step": 234440, "epoch": 1395} {"train_loss": -9.16163444519043, "global_step": 234441, "epoch": 1395} {"train_loss": -10.316225051879883, "global_step": 234442, "epoch": 1395} {"train_loss": -10.088186264038086, "global_step": 234443, "epoch": 1395} {"train_loss": -9.929346084594727, "global_step": 234444, "epoch": 1395} {"train_loss": -9.662704467773438, "global_step": 234445, "epoch": 1395} {"train_loss": -10.47553825378418, "global_step": 234446, "epoch": 1395} {"train_loss": -9.49260139465332, "global_step": 234447, "epoch": 1395} {"train_loss": -11.04600715637207, "global_step": 234448, "epoch": 1395} {"train_loss": -9.97800064086914, "global_step": 234449, "epoch": 1395} {"train_loss": -10.607246398925781, "global_step": 234450, "epoch": 1395} {"train_loss": -11.230347633361816, "global_step": 234451, "epoch": 1395} {"train_loss": -10.721063613891602, "global_step": 234452, "epoch": 1395} {"train_loss": -10.939117431640625, "global_step": 234453, "epoch": 1395} {"train_loss": -11.208335876464844, "global_step": 234454, "epoch": 1395} {"train_loss": -10.969643592834473, "global_step": 234455, "epoch": 1395} {"train_loss": -10.93205738067627, "global_step": 234456, "epoch": 1395} {"train_loss": -11.240933418273926, "global_step": 234457, "epoch": 1395} {"train_loss": -10.869941711425781, "global_step": 234458, "epoch": 1395} {"train_loss": -11.062952995300293, "global_step": 234459, "epoch": 1395} {"train_loss": -11.049368858337402, "global_step": 234460, "epoch": 1395} {"train_loss": -10.841912269592285, "global_step": 234461, "epoch": 1395} {"train_loss": -10.778814315795898, "global_step": 234462, "epoch": 1395} {"train_loss": -10.92644214630127, "global_step": 234463, "epoch": 1395} {"train_loss": -10.969247817993164, "global_step": 234464, "epoch": 1395} {"train_loss": -10.655123710632324, "global_step": 234465, "epoch": 1395} {"train_loss": -11.286580085754395, "global_step": 234466, "epoch": 1395} {"train_loss": -11.13334846496582, "global_step": 234467, "epoch": 1395} {"train_loss": -11.064006805419922, "global_step": 234468, "epoch": 1395} {"train_loss": -11.276034355163574, "global_step": 234469, "epoch": 1395} {"train_loss": -11.31852912902832, "global_step": 234470, "epoch": 1395} {"train_loss": -10.924993515014648, "global_step": 234471, "epoch": 1395} {"train_loss": -11.363285064697266, "global_step": 234472, "epoch": 1395} {"train_loss": -11.321695327758789, "global_step": 234473, "epoch": 1395} {"train_loss": -10.994230270385742, "global_step": 234474, "epoch": 1395} {"train_loss": -11.13143539428711, "global_step": 234475, "epoch": 1395} {"train_loss": -11.513211250305176, "global_step": 234476, "epoch": 1395} {"train_loss": -10.992365837097168, "global_step": 234477, "epoch": 1395} {"train_loss": -11.16423225402832, "global_step": 234478, "epoch": 1395} {"train_loss": -10.714887619018555, "global_step": 234479, "epoch": 1395} {"train_loss": -11.172800064086914, "global_step": 234480, "epoch": 1395} {"train_loss": -10.563423156738281, "global_step": 234481, "epoch": 1395} {"train_loss": -11.207682609558105, "global_step": 234482, "epoch": 1395} {"train_loss": -11.04343318939209, "global_step": 234483, "epoch": 1395} {"train_loss": -11.044364929199219, "global_step": 234484, "epoch": 1395} {"train_loss": -11.431676864624023, "global_step": 234485, "epoch": 1395} {"train_loss": -11.323776245117188, "global_step": 234486, "epoch": 1395} {"train_loss": -11.173629760742188, "global_step": 234487, "epoch": 1395} {"train_loss": -11.360532760620117, "global_step": 234488, "epoch": 1395} {"train_loss": -11.467284202575684, "global_step": 234489, "epoch": 1395} {"train_loss": -11.359506607055664, "global_step": 234490, "epoch": 1395} {"train_loss": -11.514122009277344, "global_step": 234491, "epoch": 1395} {"train_loss": -11.34343147277832, "global_step": 234492, "epoch": 1395} {"train_loss": -11.543264389038086, "global_step": 234493, "epoch": 1395} {"train_loss": -11.237869262695312, "global_step": 234494, "epoch": 1395} {"train_loss": -11.66288948059082, "global_step": 234495, "epoch": 1395} {"train_loss": -11.515926361083984, "global_step": 234496, "epoch": 1395} {"train_loss": -11.569828033447266, "global_step": 234497, "epoch": 1395} {"train_loss": -11.658774375915527, "global_step": 234498, "epoch": 1395} {"train_loss": -11.594921112060547, "global_step": 234499, "epoch": 1395} {"train_loss": -11.512167930603027, "global_step": 234500, "epoch": 1395} {"train_loss": -11.351405143737793, "global_step": 234501, "epoch": 1395} {"train_loss": -11.536094665527344, "global_step": 234502, "epoch": 1395} {"train_loss": -11.599029541015625, "global_step": 234503, "epoch": 1395} {"train_loss": -11.607333183288574, "global_step": 234504, "epoch": 1395} {"train_loss": -11.800992965698242, "global_step": 234505, "epoch": 1395} {"train_loss": -11.739802360534668, "global_step": 234506, "epoch": 1395} {"train_loss": -11.908130645751953, "global_step": 234507, "epoch": 1395} {"train_loss": -11.952393531799316, "global_step": 234508, "epoch": 1395} {"train_loss": -11.79547119140625, "global_step": 234509, "epoch": 1395} {"train_loss": -11.831415176391602, "global_step": 234510, "epoch": 1395} {"train_loss": -11.608133316040039, "global_step": 234511, "epoch": 1395} {"train_loss": -11.747530937194824, "global_step": 234512, "epoch": 1395} {"train_loss": -11.60619831085205, "global_step": 234513, "epoch": 1395} {"train_loss": -11.961777687072754, "global_step": 234514, "epoch": 1395} {"train_loss": -11.863985061645508, "global_step": 234515, "epoch": 1395} {"train_loss": -11.957905769348145, "global_step": 234516, "epoch": 1395} {"train_loss": -11.827688217163086, "global_step": 234517, "epoch": 1395} {"train_loss": -11.926542282104492, "global_step": 234518, "epoch": 1395} {"train_loss": -11.884526252746582, "global_step": 234519, "epoch": 1395} {"train_loss": -12.017817497253418, "global_step": 234520, "epoch": 1395} {"train_loss": -11.938173294067383, "global_step": 234521, "epoch": 1395} {"train_loss": -11.94955062866211, "global_step": 234522, "epoch": 1395} {"train_loss": -11.920544624328613, "global_step": 234523, "epoch": 1395} {"train_loss": -12.065784454345703, "global_step": 234524, "epoch": 1395} {"train_loss": -11.93222713470459, "global_step": 234525, "epoch": 1395} {"train_loss": -11.86506462097168, "global_step": 234526, "epoch": 1395} {"train_loss": -11.300099685078575, "global_step": 234527, "epoch": 1395, "val_loss": 262827.15625, "train_action_mse_error": 1.3964108228683472} {"train_loss": -12.085260391235352, "global_step": 234528, "epoch": 1396} {"train_loss": -12.089680671691895, "global_step": 234529, "epoch": 1396} {"train_loss": -11.928445816040039, "global_step": 234530, "epoch": 1396} {"train_loss": -12.056180953979492, "global_step": 234531, "epoch": 1396} {"train_loss": -12.108654022216797, "global_step": 234532, "epoch": 1396} {"train_loss": -12.171361923217773, "global_step": 234533, "epoch": 1396} {"train_loss": -12.285834312438965, "global_step": 234534, "epoch": 1396} {"train_loss": -12.147274017333984, "global_step": 234535, "epoch": 1396} {"train_loss": -12.081221580505371, "global_step": 234536, "epoch": 1396} {"train_loss": -11.926101684570312, "global_step": 234537, "epoch": 1396} {"train_loss": -11.958826065063477, "global_step": 234538, "epoch": 1396} {"train_loss": -12.017244338989258, "global_step": 234539, "epoch": 1396} {"train_loss": -11.662364959716797, "global_step": 234540, "epoch": 1396} {"train_loss": -11.7977933883667, "global_step": 234541, "epoch": 1396} {"train_loss": -11.794872283935547, "global_step": 234542, "epoch": 1396} {"train_loss": -11.594964981079102, "global_step": 234543, "epoch": 1396} {"train_loss": -11.711803436279297, "global_step": 234544, "epoch": 1396} {"train_loss": -12.081947326660156, "global_step": 234545, "epoch": 1396} {"train_loss": -11.804374694824219, "global_step": 234546, "epoch": 1396} {"train_loss": -11.896696090698242, "global_step": 234547, "epoch": 1396} {"train_loss": -11.891382217407227, "global_step": 234548, "epoch": 1396} {"train_loss": -11.698287963867188, "global_step": 234549, "epoch": 1396} {"train_loss": -11.858975410461426, "global_step": 234550, "epoch": 1396} {"train_loss": -11.445642471313477, "global_step": 234551, "epoch": 1396} {"train_loss": -11.321640014648438, "global_step": 234552, "epoch": 1396} {"train_loss": -11.15356159210205, "global_step": 234553, "epoch": 1396} {"train_loss": -11.222496032714844, "global_step": 234554, "epoch": 1396} {"train_loss": -9.660978317260742, "global_step": 234555, "epoch": 1396} {"train_loss": -10.591764450073242, "global_step": 234556, "epoch": 1396} {"train_loss": -11.089359283447266, "global_step": 234557, "epoch": 1396} {"train_loss": -9.163073539733887, "global_step": 234558, "epoch": 1396} {"train_loss": -10.256501197814941, "global_step": 234559, "epoch": 1396} {"train_loss": -10.887346267700195, "global_step": 234560, "epoch": 1396} {"train_loss": -10.823553085327148, "global_step": 234561, "epoch": 1396} {"train_loss": -10.512594223022461, "global_step": 234562, "epoch": 1396} {"train_loss": -11.370790481567383, "global_step": 234563, "epoch": 1396} {"train_loss": -11.430516242980957, "global_step": 234564, "epoch": 1396} {"train_loss": -10.785898208618164, "global_step": 234565, "epoch": 1396} {"train_loss": -10.680047035217285, "global_step": 234566, "epoch": 1396} {"train_loss": -8.858543395996094, "global_step": 234567, "epoch": 1396} {"train_loss": -9.134471893310547, "global_step": 234568, "epoch": 1396} {"train_loss": -9.379819869995117, "global_step": 234569, "epoch": 1396} {"train_loss": -11.077754974365234, "global_step": 234570, "epoch": 1396} {"train_loss": -9.813619613647461, "global_step": 234571, "epoch": 1396} {"train_loss": -10.520400047302246, "global_step": 234572, "epoch": 1396} {"train_loss": -10.199356079101562, "global_step": 234573, "epoch": 1396} {"train_loss": -10.685160636901855, "global_step": 234574, "epoch": 1396} {"train_loss": -10.86819839477539, "global_step": 234575, "epoch": 1396} {"train_loss": -10.52224349975586, "global_step": 234576, "epoch": 1396} {"train_loss": -10.351388931274414, "global_step": 234577, "epoch": 1396} {"train_loss": -11.08476448059082, "global_step": 234578, "epoch": 1396} {"train_loss": -10.301741600036621, "global_step": 234579, "epoch": 1396} {"train_loss": -11.294384002685547, "global_step": 234580, "epoch": 1396} {"train_loss": -11.348993301391602, "global_step": 234581, "epoch": 1396} {"train_loss": -11.106968879699707, "global_step": 234582, "epoch": 1396} {"train_loss": -11.490801811218262, "global_step": 234583, "epoch": 1396} {"train_loss": -11.39317512512207, "global_step": 234584, "epoch": 1396} {"train_loss": -11.175830841064453, "global_step": 234585, "epoch": 1396} {"train_loss": -11.390338897705078, "global_step": 234586, "epoch": 1396} {"train_loss": -11.11737060546875, "global_step": 234587, "epoch": 1396} {"train_loss": -10.873761177062988, "global_step": 234588, "epoch": 1396} {"train_loss": -11.306061744689941, "global_step": 234589, "epoch": 1396} {"train_loss": -11.206184387207031, "global_step": 234590, "epoch": 1396} {"train_loss": -11.309995651245117, "global_step": 234591, "epoch": 1396} {"train_loss": -11.337163925170898, "global_step": 234592, "epoch": 1396} {"train_loss": -11.461020469665527, "global_step": 234593, "epoch": 1396} {"train_loss": -11.365727424621582, "global_step": 234594, "epoch": 1396} {"train_loss": -11.39981460571289, "global_step": 234595, "epoch": 1396} {"train_loss": -11.42098617553711, "global_step": 234596, "epoch": 1396} {"train_loss": -11.174890518188477, "global_step": 234597, "epoch": 1396} {"train_loss": -11.75551986694336, "global_step": 234598, "epoch": 1396} {"train_loss": -11.246294021606445, "global_step": 234599, "epoch": 1396} {"train_loss": -11.492225646972656, "global_step": 234600, "epoch": 1396} {"train_loss": -11.654594421386719, "global_step": 234601, "epoch": 1396} {"train_loss": -11.528924942016602, "global_step": 234602, "epoch": 1396} {"train_loss": -11.769248008728027, "global_step": 234603, "epoch": 1396} {"train_loss": -11.664203643798828, "global_step": 234604, "epoch": 1396} {"train_loss": -11.6177339553833, "global_step": 234605, "epoch": 1396} {"train_loss": -11.737534523010254, "global_step": 234606, "epoch": 1396} {"train_loss": -11.7916841506958, "global_step": 234607, "epoch": 1396} {"train_loss": -11.759873390197754, "global_step": 234608, "epoch": 1396} {"train_loss": -11.88294792175293, "global_step": 234609, "epoch": 1396} {"train_loss": -11.90902328491211, "global_step": 234610, "epoch": 1396} {"train_loss": -11.69601821899414, "global_step": 234611, "epoch": 1396} {"train_loss": -11.765820503234863, "global_step": 234612, "epoch": 1396} {"train_loss": -11.728639602661133, "global_step": 234613, "epoch": 1396} {"train_loss": -11.727442741394043, "global_step": 234614, "epoch": 1396} {"train_loss": -11.719030380249023, "global_step": 234615, "epoch": 1396} {"train_loss": -11.900877952575684, "global_step": 234616, "epoch": 1396} {"train_loss": -11.800751686096191, "global_step": 234617, "epoch": 1396} {"train_loss": -11.851482391357422, "global_step": 234618, "epoch": 1396} {"train_loss": -11.74453353881836, "global_step": 234619, "epoch": 1396} {"train_loss": -11.665177345275879, "global_step": 234620, "epoch": 1396} {"train_loss": -11.950044631958008, "global_step": 234621, "epoch": 1396} {"train_loss": -11.856170654296875, "global_step": 234622, "epoch": 1396} {"train_loss": -11.717159271240234, "global_step": 234623, "epoch": 1396} {"train_loss": -11.733832359313965, "global_step": 234624, "epoch": 1396} {"train_loss": -11.617698669433594, "global_step": 234625, "epoch": 1396} {"train_loss": -11.936346054077148, "global_step": 234626, "epoch": 1396} {"train_loss": -11.574207305908203, "global_step": 234627, "epoch": 1396} {"train_loss": -11.824189186096191, "global_step": 234628, "epoch": 1396} {"train_loss": -11.529470443725586, "global_step": 234629, "epoch": 1396} {"train_loss": -11.780756950378418, "global_step": 234630, "epoch": 1396} {"train_loss": -11.739933013916016, "global_step": 234631, "epoch": 1396} {"train_loss": -11.530119895935059, "global_step": 234632, "epoch": 1396} {"train_loss": -12.055889129638672, "global_step": 234633, "epoch": 1396} {"train_loss": -11.706659317016602, "global_step": 234634, "epoch": 1396} {"train_loss": -11.776580810546875, "global_step": 234635, "epoch": 1396} {"train_loss": -11.929922103881836, "global_step": 234636, "epoch": 1396} {"train_loss": -11.925803184509277, "global_step": 234637, "epoch": 1396} {"train_loss": -11.808619499206543, "global_step": 234638, "epoch": 1396} {"train_loss": -11.833916664123535, "global_step": 234639, "epoch": 1396} {"train_loss": -11.612062454223633, "global_step": 234640, "epoch": 1396} {"train_loss": -12.189889907836914, "global_step": 234641, "epoch": 1396} {"train_loss": -11.808248519897461, "global_step": 234642, "epoch": 1396} {"train_loss": -11.740832328796387, "global_step": 234643, "epoch": 1396} {"train_loss": -12.041022300720215, "global_step": 234644, "epoch": 1396} {"train_loss": -11.990516662597656, "global_step": 234645, "epoch": 1396} {"train_loss": -11.990751266479492, "global_step": 234646, "epoch": 1396} {"train_loss": -11.846552848815918, "global_step": 234647, "epoch": 1396} {"train_loss": -12.049055099487305, "global_step": 234648, "epoch": 1396} {"train_loss": -11.564985275268555, "global_step": 234649, "epoch": 1396} {"train_loss": -11.99019718170166, "global_step": 234650, "epoch": 1396} {"train_loss": -11.417268753051758, "global_step": 234651, "epoch": 1396} {"train_loss": -11.75239372253418, "global_step": 234652, "epoch": 1396} {"train_loss": -11.461580276489258, "global_step": 234653, "epoch": 1396} {"train_loss": -11.597908020019531, "global_step": 234654, "epoch": 1396} {"train_loss": -10.855425834655762, "global_step": 234655, "epoch": 1396} {"train_loss": -11.02613639831543, "global_step": 234656, "epoch": 1396} {"train_loss": -11.481908798217773, "global_step": 234657, "epoch": 1396} {"train_loss": -11.56517219543457, "global_step": 234658, "epoch": 1396} {"train_loss": -11.448162078857422, "global_step": 234659, "epoch": 1396} {"train_loss": -11.844284057617188, "global_step": 234660, "epoch": 1396} {"train_loss": -11.742408752441406, "global_step": 234661, "epoch": 1396} {"train_loss": -11.7158784866333, "global_step": 234662, "epoch": 1396} {"train_loss": -11.736286163330078, "global_step": 234663, "epoch": 1396} {"train_loss": -11.858214378356934, "global_step": 234664, "epoch": 1396} {"train_loss": -11.63939094543457, "global_step": 234665, "epoch": 1396} {"train_loss": -11.735066413879395, "global_step": 234666, "epoch": 1396} {"train_loss": -11.807408332824707, "global_step": 234667, "epoch": 1396} {"train_loss": -11.603209495544434, "global_step": 234668, "epoch": 1396} {"train_loss": -11.928977012634277, "global_step": 234669, "epoch": 1396} {"train_loss": -11.500041961669922, "global_step": 234670, "epoch": 1396} {"train_loss": -11.173242568969727, "global_step": 234671, "epoch": 1396} {"train_loss": -11.629533767700195, "global_step": 234672, "epoch": 1396} {"train_loss": -11.642321586608887, "global_step": 234673, "epoch": 1396} {"train_loss": -11.440988540649414, "global_step": 234674, "epoch": 1396} {"train_loss": -11.44033145904541, "global_step": 234675, "epoch": 1396} {"train_loss": -12.025747299194336, "global_step": 234676, "epoch": 1396} {"train_loss": -11.238872528076172, "global_step": 234677, "epoch": 1396} {"train_loss": -11.163350105285645, "global_step": 234678, "epoch": 1396} {"train_loss": -11.926801681518555, "global_step": 234679, "epoch": 1396} {"train_loss": -11.31545352935791, "global_step": 234680, "epoch": 1396} {"train_loss": -11.717573165893555, "global_step": 234681, "epoch": 1396} {"train_loss": -11.688720703125, "global_step": 234682, "epoch": 1396} {"train_loss": -11.298796653747559, "global_step": 234683, "epoch": 1396} {"train_loss": -11.31485366821289, "global_step": 234684, "epoch": 1396} {"train_loss": -11.337850570678711, "global_step": 234685, "epoch": 1396} {"train_loss": -11.187350273132324, "global_step": 234686, "epoch": 1396} {"train_loss": -11.541645050048828, "global_step": 234687, "epoch": 1396} {"train_loss": -11.491472244262695, "global_step": 234688, "epoch": 1396} {"train_loss": -11.795489311218262, "global_step": 234689, "epoch": 1396} {"train_loss": -11.498159408569336, "global_step": 234690, "epoch": 1396} {"train_loss": -11.549072265625, "global_step": 234691, "epoch": 1396} {"train_loss": -11.517870903015137, "global_step": 234692, "epoch": 1396} {"train_loss": -11.442571640014648, "global_step": 234693, "epoch": 1396} {"train_loss": -11.451674461364746, "global_step": 234694, "epoch": 1396} {"train_loss": -11.467671871185303, "global_step": 234695, "epoch": 1396, "val_loss": 265364.15625} {"train_loss": -11.143991470336914, "global_step": 234696, "epoch": 1397} {"train_loss": -11.54555606842041, "global_step": 234697, "epoch": 1397} {"train_loss": -11.899068832397461, "global_step": 234698, "epoch": 1397} {"train_loss": -11.209884643554688, "global_step": 234699, "epoch": 1397} {"train_loss": -11.093306541442871, "global_step": 234700, "epoch": 1397} {"train_loss": -11.715860366821289, "global_step": 234701, "epoch": 1397} {"train_loss": -11.148397445678711, "global_step": 234702, "epoch": 1397} {"train_loss": -11.784172058105469, "global_step": 234703, "epoch": 1397} {"train_loss": -11.639272689819336, "global_step": 234704, "epoch": 1397} {"train_loss": -11.357544898986816, "global_step": 234705, "epoch": 1397} {"train_loss": -11.784536361694336, "global_step": 234706, "epoch": 1397} {"train_loss": -11.579065322875977, "global_step": 234707, "epoch": 1397} {"train_loss": -11.811456680297852, "global_step": 234708, "epoch": 1397} {"train_loss": -11.59774398803711, "global_step": 234709, "epoch": 1397} {"train_loss": -11.698036193847656, "global_step": 234710, "epoch": 1397} {"train_loss": -11.934974670410156, "global_step": 234711, "epoch": 1397} {"train_loss": -11.552242279052734, "global_step": 234712, "epoch": 1397} {"train_loss": -11.605745315551758, "global_step": 234713, "epoch": 1397} {"train_loss": -11.579366683959961, "global_step": 234714, "epoch": 1397} {"train_loss": -11.487445831298828, "global_step": 234715, "epoch": 1397} {"train_loss": -11.90123462677002, "global_step": 234716, "epoch": 1397} {"train_loss": -11.56734561920166, "global_step": 234717, "epoch": 1397} {"train_loss": -11.53441333770752, "global_step": 234718, "epoch": 1397} {"train_loss": -11.6428804397583, "global_step": 234719, "epoch": 1397} {"train_loss": -11.474509239196777, "global_step": 234720, "epoch": 1397} {"train_loss": -11.246826171875, "global_step": 234721, "epoch": 1397} {"train_loss": -11.931486129760742, "global_step": 234722, "epoch": 1397} {"train_loss": -11.323700904846191, "global_step": 234723, "epoch": 1397} {"train_loss": -11.589137077331543, "global_step": 234724, "epoch": 1397} {"train_loss": -11.314456939697266, "global_step": 234725, "epoch": 1397} {"train_loss": -11.719823837280273, "global_step": 234726, "epoch": 1397} {"train_loss": -11.169160842895508, "global_step": 234727, "epoch": 1397} {"train_loss": -11.5269775390625, "global_step": 234728, "epoch": 1397} {"train_loss": -12.035937309265137, "global_step": 234729, "epoch": 1397} {"train_loss": -11.607072830200195, "global_step": 234730, "epoch": 1397} {"train_loss": -12.080733299255371, "global_step": 234731, "epoch": 1397} {"train_loss": -12.077932357788086, "global_step": 234732, "epoch": 1397} {"train_loss": -11.59686279296875, "global_step": 234733, "epoch": 1397} {"train_loss": -11.650426864624023, "global_step": 234734, "epoch": 1397} {"train_loss": -11.705398559570312, "global_step": 234735, "epoch": 1397} {"train_loss": -11.672700881958008, "global_step": 234736, "epoch": 1397} {"train_loss": -11.675727844238281, "global_step": 234737, "epoch": 1397} {"train_loss": -11.63536262512207, "global_step": 234738, "epoch": 1397} {"train_loss": -11.80703353881836, "global_step": 234739, "epoch": 1397} {"train_loss": -11.756500244140625, "global_step": 234740, "epoch": 1397} {"train_loss": -11.258480072021484, "global_step": 234741, "epoch": 1397} {"train_loss": -11.895895004272461, "global_step": 234742, "epoch": 1397} {"train_loss": -11.425286293029785, "global_step": 234743, "epoch": 1397} {"train_loss": -11.6285400390625, "global_step": 234744, "epoch": 1397} {"train_loss": -11.869385719299316, "global_step": 234745, "epoch": 1397} {"train_loss": -11.656026840209961, "global_step": 234746, "epoch": 1397} {"train_loss": -12.057573318481445, "global_step": 234747, "epoch": 1397} {"train_loss": -11.66346549987793, "global_step": 234748, "epoch": 1397} {"train_loss": -11.795260429382324, "global_step": 234749, "epoch": 1397} {"train_loss": -11.61249828338623, "global_step": 234750, "epoch": 1397} {"train_loss": -12.222336769104004, "global_step": 234751, "epoch": 1397} {"train_loss": -11.736686706542969, "global_step": 234752, "epoch": 1397} {"train_loss": -12.126893997192383, "global_step": 234753, "epoch": 1397} {"train_loss": -11.750825881958008, "global_step": 234754, "epoch": 1397} {"train_loss": -12.040825843811035, "global_step": 234755, "epoch": 1397} {"train_loss": -11.964784622192383, "global_step": 234756, "epoch": 1397} {"train_loss": -11.663758277893066, "global_step": 234757, "epoch": 1397} {"train_loss": -11.891998291015625, "global_step": 234758, "epoch": 1397} {"train_loss": -11.808369636535645, "global_step": 234759, "epoch": 1397} {"train_loss": -12.143142700195312, "global_step": 234760, "epoch": 1397} {"train_loss": -11.821273803710938, "global_step": 234761, "epoch": 1397} {"train_loss": -11.570429801940918, "global_step": 234762, "epoch": 1397} {"train_loss": -11.838556289672852, "global_step": 234763, "epoch": 1397} {"train_loss": -11.89379596710205, "global_step": 234764, "epoch": 1397} {"train_loss": -11.302457809448242, "global_step": 234765, "epoch": 1397} {"train_loss": -9.768416404724121, "global_step": 234766, "epoch": 1397} {"train_loss": -11.361421585083008, "global_step": 234767, "epoch": 1397} {"train_loss": -11.384182929992676, "global_step": 234768, "epoch": 1397} {"train_loss": -10.553972244262695, "global_step": 234769, "epoch": 1397} {"train_loss": -11.695341110229492, "global_step": 234770, "epoch": 1397} {"train_loss": -11.383996963500977, "global_step": 234771, "epoch": 1397} {"train_loss": -10.926847457885742, "global_step": 234772, "epoch": 1397} {"train_loss": -11.205711364746094, "global_step": 234773, "epoch": 1397} {"train_loss": -11.694933891296387, "global_step": 234774, "epoch": 1397} {"train_loss": -10.4329833984375, "global_step": 234775, "epoch": 1397} {"train_loss": -10.442458152770996, "global_step": 234776, "epoch": 1397} {"train_loss": -11.466110229492188, "global_step": 234777, "epoch": 1397} {"train_loss": -10.794361114501953, "global_step": 234778, "epoch": 1397} {"train_loss": -11.035021781921387, "global_step": 234779, "epoch": 1397} {"train_loss": -11.495768547058105, "global_step": 234780, "epoch": 1397} {"train_loss": -11.201952934265137, "global_step": 234781, "epoch": 1397} {"train_loss": -10.955997467041016, "global_step": 234782, "epoch": 1397} {"train_loss": -11.801046371459961, "global_step": 234783, "epoch": 1397} {"train_loss": -11.235230445861816, "global_step": 234784, "epoch": 1397} {"train_loss": -11.54677677154541, "global_step": 234785, "epoch": 1397} {"train_loss": -11.409351348876953, "global_step": 234786, "epoch": 1397} {"train_loss": -11.708327293395996, "global_step": 234787, "epoch": 1397} {"train_loss": -11.61611270904541, "global_step": 234788, "epoch": 1397} {"train_loss": -11.744495391845703, "global_step": 234789, "epoch": 1397} {"train_loss": -11.319446563720703, "global_step": 234790, "epoch": 1397} {"train_loss": -11.504464149475098, "global_step": 234791, "epoch": 1397} {"train_loss": -11.658742904663086, "global_step": 234792, "epoch": 1397} {"train_loss": -11.616613388061523, "global_step": 234793, "epoch": 1397} {"train_loss": -11.675350189208984, "global_step": 234794, "epoch": 1397} {"train_loss": -11.64594554901123, "global_step": 234795, "epoch": 1397} {"train_loss": -11.692054748535156, "global_step": 234796, "epoch": 1397} {"train_loss": -11.425594329833984, "global_step": 234797, "epoch": 1397} {"train_loss": -11.78816032409668, "global_step": 234798, "epoch": 1397} {"train_loss": -11.722723007202148, "global_step": 234799, "epoch": 1397} {"train_loss": -11.786996841430664, "global_step": 234800, "epoch": 1397} {"train_loss": -11.721456527709961, "global_step": 234801, "epoch": 1397} {"train_loss": -11.833539962768555, "global_step": 234802, "epoch": 1397} {"train_loss": -11.761329650878906, "global_step": 234803, "epoch": 1397} {"train_loss": -11.906777381896973, "global_step": 234804, "epoch": 1397} {"train_loss": -11.812549591064453, "global_step": 234805, "epoch": 1397} {"train_loss": -11.567329406738281, "global_step": 234806, "epoch": 1397} {"train_loss": -11.383674621582031, "global_step": 234807, "epoch": 1397} {"train_loss": -11.6611328125, "global_step": 234808, "epoch": 1397} {"train_loss": -11.761344909667969, "global_step": 234809, "epoch": 1397} {"train_loss": -11.345010757446289, "global_step": 234810, "epoch": 1397} {"train_loss": -11.584518432617188, "global_step": 234811, "epoch": 1397} {"train_loss": -11.413124084472656, "global_step": 234812, "epoch": 1397} {"train_loss": -11.377145767211914, "global_step": 234813, "epoch": 1397} {"train_loss": -11.55647087097168, "global_step": 234814, "epoch": 1397} {"train_loss": -11.423742294311523, "global_step": 234815, "epoch": 1397} {"train_loss": -11.769655227661133, "global_step": 234816, "epoch": 1397} {"train_loss": -11.748878479003906, "global_step": 234817, "epoch": 1397} {"train_loss": -11.376752853393555, "global_step": 234818, "epoch": 1397} {"train_loss": -11.588521957397461, "global_step": 234819, "epoch": 1397} {"train_loss": -11.334786415100098, "global_step": 234820, "epoch": 1397} {"train_loss": -11.55563735961914, "global_step": 234821, "epoch": 1397} {"train_loss": -11.820189476013184, "global_step": 234822, "epoch": 1397} {"train_loss": -10.796034812927246, "global_step": 234823, "epoch": 1397} {"train_loss": -11.666963577270508, "global_step": 234824, "epoch": 1397} {"train_loss": -11.354391098022461, "global_step": 234825, "epoch": 1397} {"train_loss": -11.204827308654785, "global_step": 234826, "epoch": 1397} {"train_loss": -12.069347381591797, "global_step": 234827, "epoch": 1397} {"train_loss": -11.273518562316895, "global_step": 234828, "epoch": 1397} {"train_loss": -11.47529125213623, "global_step": 234829, "epoch": 1397} {"train_loss": -11.449597358703613, "global_step": 234830, "epoch": 1397} {"train_loss": -11.743538856506348, "global_step": 234831, "epoch": 1397} {"train_loss": -11.564099311828613, "global_step": 234832, "epoch": 1397} {"train_loss": -11.864259719848633, "global_step": 234833, "epoch": 1397} {"train_loss": -11.702741622924805, "global_step": 234834, "epoch": 1397} {"train_loss": -11.884860038757324, "global_step": 234835, "epoch": 1397} {"train_loss": -11.633384704589844, "global_step": 234836, "epoch": 1397} {"train_loss": -11.684691429138184, "global_step": 234837, "epoch": 1397} {"train_loss": -11.691917419433594, "global_step": 234838, "epoch": 1397} {"train_loss": -11.761679649353027, "global_step": 234839, "epoch": 1397} {"train_loss": -12.16081428527832, "global_step": 234840, "epoch": 1397} {"train_loss": -11.843236923217773, "global_step": 234841, "epoch": 1397} {"train_loss": -11.822776794433594, "global_step": 234842, "epoch": 1397} {"train_loss": -12.018118858337402, "global_step": 234843, "epoch": 1397} {"train_loss": -11.848299026489258, "global_step": 234844, "epoch": 1397} {"train_loss": -11.931465148925781, "global_step": 234845, "epoch": 1397} {"train_loss": -11.991060256958008, "global_step": 234846, "epoch": 1397} {"train_loss": -11.606040954589844, "global_step": 234847, "epoch": 1397} {"train_loss": -11.584123611450195, "global_step": 234848, "epoch": 1397} {"train_loss": -11.768484115600586, "global_step": 234849, "epoch": 1397} {"train_loss": -11.948747634887695, "global_step": 234850, "epoch": 1397} {"train_loss": -11.658907890319824, "global_step": 234851, "epoch": 1397} {"train_loss": -11.968029022216797, "global_step": 234852, "epoch": 1397} {"train_loss": -11.646862030029297, "global_step": 234853, "epoch": 1397} {"train_loss": -11.860954284667969, "global_step": 234854, "epoch": 1397} {"train_loss": -11.927577018737793, "global_step": 234855, "epoch": 1397} {"train_loss": -12.078323364257812, "global_step": 234856, "epoch": 1397} {"train_loss": -11.674101829528809, "global_step": 234857, "epoch": 1397} {"train_loss": -11.798733711242676, "global_step": 234858, "epoch": 1397} {"train_loss": -11.952428817749023, "global_step": 234859, "epoch": 1397} {"train_loss": -11.449868202209473, "global_step": 234860, "epoch": 1397} {"train_loss": -11.74998664855957, "global_step": 234861, "epoch": 1397} {"train_loss": -11.718717575073242, "global_step": 234862, "epoch": 1397} {"train_loss": -11.60103938693092, "global_step": 234863, "epoch": 1397, "val_loss": 264709.25} {"train_loss": -10.751607894897461, "global_step": 234864, "epoch": 1398} {"train_loss": -11.916492462158203, "global_step": 234865, "epoch": 1398} {"train_loss": -9.865412712097168, "global_step": 234866, "epoch": 1398} {"train_loss": -10.159538269042969, "global_step": 234867, "epoch": 1398} {"train_loss": -11.745141983032227, "global_step": 234868, "epoch": 1398} {"train_loss": -10.990694046020508, "global_step": 234869, "epoch": 1398} {"train_loss": -10.705747604370117, "global_step": 234870, "epoch": 1398} {"train_loss": -11.035945892333984, "global_step": 234871, "epoch": 1398} {"train_loss": -11.451751708984375, "global_step": 234872, "epoch": 1398} {"train_loss": -11.34416675567627, "global_step": 234873, "epoch": 1398} {"train_loss": -11.474010467529297, "global_step": 234874, "epoch": 1398} {"train_loss": -11.443440437316895, "global_step": 234875, "epoch": 1398} {"train_loss": -11.655925750732422, "global_step": 234876, "epoch": 1398} {"train_loss": -11.538958549499512, "global_step": 234877, "epoch": 1398} {"train_loss": -11.79991340637207, "global_step": 234878, "epoch": 1398} {"train_loss": -11.79780387878418, "global_step": 234879, "epoch": 1398} {"train_loss": -11.616127014160156, "global_step": 234880, "epoch": 1398} {"train_loss": -11.952028274536133, "global_step": 234881, "epoch": 1398} {"train_loss": -11.559856414794922, "global_step": 234882, "epoch": 1398} {"train_loss": -11.481344223022461, "global_step": 234883, "epoch": 1398} {"train_loss": -11.676697731018066, "global_step": 234884, "epoch": 1398} {"train_loss": -11.629607200622559, "global_step": 234885, "epoch": 1398} {"train_loss": -11.531756401062012, "global_step": 234886, "epoch": 1398} {"train_loss": -11.645959854125977, "global_step": 234887, "epoch": 1398} {"train_loss": -11.950071334838867, "global_step": 234888, "epoch": 1398} {"train_loss": -11.539253234863281, "global_step": 234889, "epoch": 1398} {"train_loss": -11.858806610107422, "global_step": 234890, "epoch": 1398} {"train_loss": -11.772178649902344, "global_step": 234891, "epoch": 1398} {"train_loss": -12.080266952514648, "global_step": 234892, "epoch": 1398} {"train_loss": -11.483491897583008, "global_step": 234893, "epoch": 1398} {"train_loss": -11.545588493347168, "global_step": 234894, "epoch": 1398} {"train_loss": -11.558239936828613, "global_step": 234895, "epoch": 1398} {"train_loss": -11.824644088745117, "global_step": 234896, "epoch": 1398} {"train_loss": -11.524279594421387, "global_step": 234897, "epoch": 1398} {"train_loss": -11.440775871276855, "global_step": 234898, "epoch": 1398} {"train_loss": -11.90707015991211, "global_step": 234899, "epoch": 1398} {"train_loss": -11.39439582824707, "global_step": 234900, "epoch": 1398} {"train_loss": -11.979877471923828, "global_step": 234901, "epoch": 1398} {"train_loss": -11.170270919799805, "global_step": 234902, "epoch": 1398} {"train_loss": -11.791980743408203, "global_step": 234903, "epoch": 1398} {"train_loss": -11.597068786621094, "global_step": 234904, "epoch": 1398} {"train_loss": -11.920048713684082, "global_step": 234905, "epoch": 1398} {"train_loss": -11.616573333740234, "global_step": 234906, "epoch": 1398} {"train_loss": -11.802428245544434, "global_step": 234907, "epoch": 1398} {"train_loss": -11.862171173095703, "global_step": 234908, "epoch": 1398} {"train_loss": -11.875980377197266, "global_step": 234909, "epoch": 1398} {"train_loss": -11.73547077178955, "global_step": 234910, "epoch": 1398} {"train_loss": -11.847023963928223, "global_step": 234911, "epoch": 1398} {"train_loss": -11.806814193725586, "global_step": 234912, "epoch": 1398} {"train_loss": -11.812362670898438, "global_step": 234913, "epoch": 1398} {"train_loss": -11.765361785888672, "global_step": 234914, "epoch": 1398} {"train_loss": -11.94732666015625, "global_step": 234915, "epoch": 1398} {"train_loss": -11.518716812133789, "global_step": 234916, "epoch": 1398} {"train_loss": -11.726763725280762, "global_step": 234917, "epoch": 1398} {"train_loss": -11.979379653930664, "global_step": 234918, "epoch": 1398} {"train_loss": -11.303825378417969, "global_step": 234919, "epoch": 1398} {"train_loss": -11.109611511230469, "global_step": 234920, "epoch": 1398} {"train_loss": -11.572332382202148, "global_step": 234921, "epoch": 1398} {"train_loss": -12.160245895385742, "global_step": 234922, "epoch": 1398} {"train_loss": -11.497919082641602, "global_step": 234923, "epoch": 1398} {"train_loss": -11.74215316772461, "global_step": 234924, "epoch": 1398} {"train_loss": -11.607467651367188, "global_step": 234925, "epoch": 1398} {"train_loss": -11.349550247192383, "global_step": 234926, "epoch": 1398} {"train_loss": -11.394655227661133, "global_step": 234927, "epoch": 1398} {"train_loss": -11.39913558959961, "global_step": 234928, "epoch": 1398} {"train_loss": -11.252997398376465, "global_step": 234929, "epoch": 1398} {"train_loss": -11.14570426940918, "global_step": 234930, "epoch": 1398} {"train_loss": -10.861286163330078, "global_step": 234931, "epoch": 1398} {"train_loss": -10.826061248779297, "global_step": 234932, "epoch": 1398} {"train_loss": -11.010187149047852, "global_step": 234933, "epoch": 1398} {"train_loss": -10.493332862854004, "global_step": 234934, "epoch": 1398} {"train_loss": -10.865668296813965, "global_step": 234935, "epoch": 1398} {"train_loss": -11.113088607788086, "global_step": 234936, "epoch": 1398} {"train_loss": -10.30696964263916, "global_step": 234937, "epoch": 1398} {"train_loss": -10.362425804138184, "global_step": 234938, "epoch": 1398} {"train_loss": -10.686935424804688, "global_step": 234939, "epoch": 1398} {"train_loss": -10.145779609680176, "global_step": 234940, "epoch": 1398} {"train_loss": -11.346879005432129, "global_step": 234941, "epoch": 1398} {"train_loss": -9.533124923706055, "global_step": 234942, "epoch": 1398} {"train_loss": -11.195930480957031, "global_step": 234943, "epoch": 1398} {"train_loss": -11.3474760055542, "global_step": 234944, "epoch": 1398} {"train_loss": -11.080011367797852, "global_step": 234945, "epoch": 1398} {"train_loss": -11.598116874694824, "global_step": 234946, "epoch": 1398} {"train_loss": -11.383761405944824, "global_step": 234947, "epoch": 1398} {"train_loss": -11.679239273071289, "global_step": 234948, "epoch": 1398} {"train_loss": -11.401168823242188, "global_step": 234949, "epoch": 1398} {"train_loss": -11.293533325195312, "global_step": 234950, "epoch": 1398} {"train_loss": -11.590932846069336, "global_step": 234951, "epoch": 1398} {"train_loss": -11.416194915771484, "global_step": 234952, "epoch": 1398} {"train_loss": -11.497623443603516, "global_step": 234953, "epoch": 1398} {"train_loss": -11.77053451538086, "global_step": 234954, "epoch": 1398} {"train_loss": -11.476678848266602, "global_step": 234955, "epoch": 1398} {"train_loss": -11.793951988220215, "global_step": 234956, "epoch": 1398} {"train_loss": -11.742525100708008, "global_step": 234957, "epoch": 1398} {"train_loss": -11.627039909362793, "global_step": 234958, "epoch": 1398} {"train_loss": -11.669178009033203, "global_step": 234959, "epoch": 1398} {"train_loss": -11.733607292175293, "global_step": 234960, "epoch": 1398} {"train_loss": -11.616255760192871, "global_step": 234961, "epoch": 1398} {"train_loss": -11.78396224975586, "global_step": 234962, "epoch": 1398} {"train_loss": -11.848346710205078, "global_step": 234963, "epoch": 1398} {"train_loss": -11.795309066772461, "global_step": 234964, "epoch": 1398} {"train_loss": -12.04466724395752, "global_step": 234965, "epoch": 1398} {"train_loss": -11.705632209777832, "global_step": 234966, "epoch": 1398} {"train_loss": -11.926198959350586, "global_step": 234967, "epoch": 1398} {"train_loss": -11.828622817993164, "global_step": 234968, "epoch": 1398} {"train_loss": -11.875536918640137, "global_step": 234969, "epoch": 1398} {"train_loss": -11.62977409362793, "global_step": 234970, "epoch": 1398} {"train_loss": -11.762316703796387, "global_step": 234971, "epoch": 1398} {"train_loss": -11.66450023651123, "global_step": 234972, "epoch": 1398} {"train_loss": -11.799724578857422, "global_step": 234973, "epoch": 1398} {"train_loss": -11.761760711669922, "global_step": 234974, "epoch": 1398} {"train_loss": -11.947040557861328, "global_step": 234975, "epoch": 1398} {"train_loss": -11.836090087890625, "global_step": 234976, "epoch": 1398} {"train_loss": -12.057974815368652, "global_step": 234977, "epoch": 1398} {"train_loss": -11.490873336791992, "global_step": 234978, "epoch": 1398} {"train_loss": -12.085382461547852, "global_step": 234979, "epoch": 1398} {"train_loss": -11.601235389709473, "global_step": 234980, "epoch": 1398} {"train_loss": -11.761109352111816, "global_step": 234981, "epoch": 1398} {"train_loss": -11.667118072509766, "global_step": 234982, "epoch": 1398} {"train_loss": -11.745436668395996, "global_step": 234983, "epoch": 1398} {"train_loss": -11.069757461547852, "global_step": 234984, "epoch": 1398} {"train_loss": -11.872259140014648, "global_step": 234985, "epoch": 1398} {"train_loss": -10.772984504699707, "global_step": 234986, "epoch": 1398} {"train_loss": -10.947698593139648, "global_step": 234987, "epoch": 1398} {"train_loss": -11.175257682800293, "global_step": 234988, "epoch": 1398} {"train_loss": -10.947122573852539, "global_step": 234989, "epoch": 1398} {"train_loss": -10.638629913330078, "global_step": 234990, "epoch": 1398} {"train_loss": -11.014961242675781, "global_step": 234991, "epoch": 1398} {"train_loss": -11.253288269042969, "global_step": 234992, "epoch": 1398} {"train_loss": -11.081003189086914, "global_step": 234993, "epoch": 1398} {"train_loss": -11.178573608398438, "global_step": 234994, "epoch": 1398} {"train_loss": -10.87570571899414, "global_step": 234995, "epoch": 1398} {"train_loss": -10.868614196777344, "global_step": 234996, "epoch": 1398} {"train_loss": -11.337982177734375, "global_step": 234997, "epoch": 1398} {"train_loss": -10.360091209411621, "global_step": 234998, "epoch": 1398} {"train_loss": -10.92846965789795, "global_step": 234999, "epoch": 1398} {"train_loss": -11.134756088256836, "global_step": 235000, "epoch": 1398} {"train_loss": -11.400829315185547, "global_step": 235001, "epoch": 1398} {"train_loss": -10.858510971069336, "global_step": 235002, "epoch": 1398} {"train_loss": -11.289710998535156, "global_step": 235003, "epoch": 1398} {"train_loss": -11.433988571166992, "global_step": 235004, "epoch": 1398} {"train_loss": -11.2479887008667, "global_step": 235005, "epoch": 1398} {"train_loss": -11.43431282043457, "global_step": 235006, "epoch": 1398} {"train_loss": -11.585970878601074, "global_step": 235007, "epoch": 1398} {"train_loss": -11.611474990844727, "global_step": 235008, "epoch": 1398} {"train_loss": -11.653127670288086, "global_step": 235009, "epoch": 1398} {"train_loss": -11.459549903869629, "global_step": 235010, "epoch": 1398} {"train_loss": -11.308631896972656, "global_step": 235011, "epoch": 1398} {"train_loss": -11.703899383544922, "global_step": 235012, "epoch": 1398} {"train_loss": -11.559616088867188, "global_step": 235013, "epoch": 1398} {"train_loss": -11.840747833251953, "global_step": 235014, "epoch": 1398} {"train_loss": -11.794084548950195, "global_step": 235015, "epoch": 1398} {"train_loss": -11.639822006225586, "global_step": 235016, "epoch": 1398} {"train_loss": -11.735297203063965, "global_step": 235017, "epoch": 1398} {"train_loss": -11.444613456726074, "global_step": 235018, "epoch": 1398} {"train_loss": -11.98634147644043, "global_step": 235019, "epoch": 1398} {"train_loss": -11.676513671875, "global_step": 235020, "epoch": 1398} {"train_loss": -11.773012161254883, "global_step": 235021, "epoch": 1398} {"train_loss": -11.58289909362793, "global_step": 235022, "epoch": 1398} {"train_loss": -11.979206085205078, "global_step": 235023, "epoch": 1398} {"train_loss": -11.77463150024414, "global_step": 235024, "epoch": 1398} {"train_loss": -11.86172103881836, "global_step": 235025, "epoch": 1398} {"train_loss": -11.842333793640137, "global_step": 235026, "epoch": 1398} {"train_loss": -11.681718826293945, "global_step": 235027, "epoch": 1398} {"train_loss": -11.732758522033691, "global_step": 235028, "epoch": 1398} {"train_loss": -11.802727699279785, "global_step": 235029, "epoch": 1398} {"train_loss": -12.037424087524414, "global_step": 235030, "epoch": 1398} {"train_loss": -11.475680254754566, "global_step": 235031, "epoch": 1398, "val_loss": 266447.8125} {"train_loss": -11.766883850097656, "global_step": 235032, "epoch": 1399} {"train_loss": -11.610849380493164, "global_step": 235033, "epoch": 1399} {"train_loss": -11.927816390991211, "global_step": 235034, "epoch": 1399} {"train_loss": -11.936995506286621, "global_step": 235035, "epoch": 1399} {"train_loss": -11.839815139770508, "global_step": 235036, "epoch": 1399} {"train_loss": -11.843355178833008, "global_step": 235037, "epoch": 1399} {"train_loss": -11.732807159423828, "global_step": 235038, "epoch": 1399} {"train_loss": -11.81470775604248, "global_step": 235039, "epoch": 1399} {"train_loss": -12.095939636230469, "global_step": 235040, "epoch": 1399} {"train_loss": -12.025739669799805, "global_step": 235041, "epoch": 1399} {"train_loss": -11.826491355895996, "global_step": 235042, "epoch": 1399} {"train_loss": -11.982007026672363, "global_step": 235043, "epoch": 1399} {"train_loss": -12.118019104003906, "global_step": 235044, "epoch": 1399} {"train_loss": -11.839191436767578, "global_step": 235045, "epoch": 1399} {"train_loss": -11.818303108215332, "global_step": 235046, "epoch": 1399} {"train_loss": -12.010427474975586, "global_step": 235047, "epoch": 1399} {"train_loss": -12.099288940429688, "global_step": 235048, "epoch": 1399} {"train_loss": -11.933670043945312, "global_step": 235049, "epoch": 1399} {"train_loss": -11.839303016662598, "global_step": 235050, "epoch": 1399} {"train_loss": -12.111050605773926, "global_step": 235051, "epoch": 1399} {"train_loss": -11.77061653137207, "global_step": 235052, "epoch": 1399} {"train_loss": -12.123881340026855, "global_step": 235053, "epoch": 1399} {"train_loss": -12.009729385375977, "global_step": 235054, "epoch": 1399} {"train_loss": -12.02192497253418, "global_step": 235055, "epoch": 1399} {"train_loss": -11.423406600952148, "global_step": 235056, "epoch": 1399} {"train_loss": -11.85369873046875, "global_step": 235057, "epoch": 1399} {"train_loss": -11.071695327758789, "global_step": 235058, "epoch": 1399} {"train_loss": -10.857322692871094, "global_step": 235059, "epoch": 1399} {"train_loss": -11.687788963317871, "global_step": 235060, "epoch": 1399} {"train_loss": -11.304032325744629, "global_step": 235061, "epoch": 1399} {"train_loss": -11.36507511138916, "global_step": 235062, "epoch": 1399} {"train_loss": -11.866606712341309, "global_step": 235063, "epoch": 1399} {"train_loss": -11.264148712158203, "global_step": 235064, "epoch": 1399} {"train_loss": -11.124164581298828, "global_step": 235065, "epoch": 1399} {"train_loss": -11.620559692382812, "global_step": 235066, "epoch": 1399} {"train_loss": -10.700000762939453, "global_step": 235067, "epoch": 1399} {"train_loss": -11.698795318603516, "global_step": 235068, "epoch": 1399} {"train_loss": -11.34062671661377, "global_step": 235069, "epoch": 1399} {"train_loss": -10.73223876953125, "global_step": 235070, "epoch": 1399} {"train_loss": -12.025078773498535, "global_step": 235071, "epoch": 1399} {"train_loss": -11.261308670043945, "global_step": 235072, "epoch": 1399} {"train_loss": -11.64294147491455, "global_step": 235073, "epoch": 1399} {"train_loss": -11.621641159057617, "global_step": 235074, "epoch": 1399} {"train_loss": -11.534622192382812, "global_step": 235075, "epoch": 1399} {"train_loss": -11.469255447387695, "global_step": 235076, "epoch": 1399} {"train_loss": -11.268527030944824, "global_step": 235077, "epoch": 1399} {"train_loss": -11.56827163696289, "global_step": 235078, "epoch": 1399} {"train_loss": -11.641536712646484, "global_step": 235079, "epoch": 1399} {"train_loss": -11.483856201171875, "global_step": 235080, "epoch": 1399} {"train_loss": -10.927217483520508, "global_step": 235081, "epoch": 1399} {"train_loss": -11.648568153381348, "global_step": 235082, "epoch": 1399} {"train_loss": -11.1249361038208, "global_step": 235083, "epoch": 1399} {"train_loss": -11.497573852539062, "global_step": 235084, "epoch": 1399} {"train_loss": -11.246231079101562, "global_step": 235085, "epoch": 1399} {"train_loss": -11.220544815063477, "global_step": 235086, "epoch": 1399} {"train_loss": -10.498022079467773, "global_step": 235087, "epoch": 1399} {"train_loss": -11.375336647033691, "global_step": 235088, "epoch": 1399} {"train_loss": -10.727079391479492, "global_step": 235089, "epoch": 1399} {"train_loss": -11.28636646270752, "global_step": 235090, "epoch": 1399} {"train_loss": -11.263740539550781, "global_step": 235091, "epoch": 1399} {"train_loss": -11.279836654663086, "global_step": 235092, "epoch": 1399} {"train_loss": -11.436494827270508, "global_step": 235093, "epoch": 1399} {"train_loss": -11.470012664794922, "global_step": 235094, "epoch": 1399} {"train_loss": -11.188879013061523, "global_step": 235095, "epoch": 1399} {"train_loss": -11.173738479614258, "global_step": 235096, "epoch": 1399} {"train_loss": -11.0599946975708, "global_step": 235097, "epoch": 1399} {"train_loss": -10.515714645385742, "global_step": 235098, "epoch": 1399} {"train_loss": -11.62921142578125, "global_step": 235099, "epoch": 1399} {"train_loss": -11.13753604888916, "global_step": 235100, "epoch": 1399} {"train_loss": -10.956770896911621, "global_step": 235101, "epoch": 1399} {"train_loss": -10.700492858886719, "global_step": 235102, "epoch": 1399} {"train_loss": -11.040701866149902, "global_step": 235103, "epoch": 1399} {"train_loss": -11.117488861083984, "global_step": 235104, "epoch": 1399} {"train_loss": -10.83248519897461, "global_step": 235105, "epoch": 1399} {"train_loss": -10.906621932983398, "global_step": 235106, "epoch": 1399} {"train_loss": -10.53978157043457, "global_step": 235107, "epoch": 1399} {"train_loss": -10.300496101379395, "global_step": 235108, "epoch": 1399} {"train_loss": -10.923120498657227, "global_step": 235109, "epoch": 1399} {"train_loss": -10.716468811035156, "global_step": 235110, "epoch": 1399} {"train_loss": -10.872597694396973, "global_step": 235111, "epoch": 1399} {"train_loss": -10.896432876586914, "global_step": 235112, "epoch": 1399} {"train_loss": -10.999931335449219, "global_step": 235113, "epoch": 1399} {"train_loss": -10.942398071289062, "global_step": 235114, "epoch": 1399} {"train_loss": -11.234498023986816, "global_step": 235115, "epoch": 1399} {"train_loss": -11.28877067565918, "global_step": 235116, "epoch": 1399} {"train_loss": -11.097702980041504, "global_step": 235117, "epoch": 1399} {"train_loss": -11.334274291992188, "global_step": 235118, "epoch": 1399} {"train_loss": -10.830940246582031, "global_step": 235119, "epoch": 1399} {"train_loss": -11.257760047912598, "global_step": 235120, "epoch": 1399} {"train_loss": -11.523828506469727, "global_step": 235121, "epoch": 1399} {"train_loss": -10.993921279907227, "global_step": 235122, "epoch": 1399} {"train_loss": -11.60144329071045, "global_step": 235123, "epoch": 1399} {"train_loss": -11.304595947265625, "global_step": 235124, "epoch": 1399} {"train_loss": -11.283897399902344, "global_step": 235125, "epoch": 1399} {"train_loss": -11.465062141418457, "global_step": 235126, "epoch": 1399} {"train_loss": -11.320816040039062, "global_step": 235127, "epoch": 1399} {"train_loss": -11.628114700317383, "global_step": 235128, "epoch": 1399} {"train_loss": -11.55793571472168, "global_step": 235129, "epoch": 1399} {"train_loss": -11.802654266357422, "global_step": 235130, "epoch": 1399} {"train_loss": -11.347599983215332, "global_step": 235131, "epoch": 1399} {"train_loss": -11.730743408203125, "global_step": 235132, "epoch": 1399} {"train_loss": -11.658262252807617, "global_step": 235133, "epoch": 1399} {"train_loss": -11.65101146697998, "global_step": 235134, "epoch": 1399} {"train_loss": -11.557703018188477, "global_step": 235135, "epoch": 1399} {"train_loss": -11.810214042663574, "global_step": 235136, "epoch": 1399} {"train_loss": -11.482641220092773, "global_step": 235137, "epoch": 1399} {"train_loss": -11.506412506103516, "global_step": 235138, "epoch": 1399} {"train_loss": -11.58938980102539, "global_step": 235139, "epoch": 1399} {"train_loss": -11.55451488494873, "global_step": 235140, "epoch": 1399} {"train_loss": -11.753413200378418, "global_step": 235141, "epoch": 1399} {"train_loss": -11.826187133789062, "global_step": 235142, "epoch": 1399} {"train_loss": -11.374939918518066, "global_step": 235143, "epoch": 1399} {"train_loss": -11.759572982788086, "global_step": 235144, "epoch": 1399} {"train_loss": -11.539719581604004, "global_step": 235145, "epoch": 1399} {"train_loss": -11.94631576538086, "global_step": 235146, "epoch": 1399} {"train_loss": -11.569365501403809, "global_step": 235147, "epoch": 1399} {"train_loss": -11.790853500366211, "global_step": 235148, "epoch": 1399} {"train_loss": -11.793588638305664, "global_step": 235149, "epoch": 1399} {"train_loss": -11.7340726852417, "global_step": 235150, "epoch": 1399} {"train_loss": -11.714004516601562, "global_step": 235151, "epoch": 1399} {"train_loss": -11.623332977294922, "global_step": 235152, "epoch": 1399} {"train_loss": -11.868032455444336, "global_step": 235153, "epoch": 1399} {"train_loss": -11.920232772827148, "global_step": 235154, "epoch": 1399} {"train_loss": -11.638897895812988, "global_step": 235155, "epoch": 1399} {"train_loss": -11.907470703125, "global_step": 235156, "epoch": 1399} {"train_loss": -11.8184814453125, "global_step": 235157, "epoch": 1399} {"train_loss": -11.519024848937988, "global_step": 235158, "epoch": 1399} {"train_loss": -11.54819107055664, "global_step": 235159, "epoch": 1399} {"train_loss": -11.594675064086914, "global_step": 235160, "epoch": 1399} {"train_loss": -11.686614990234375, "global_step": 235161, "epoch": 1399} {"train_loss": -11.779410362243652, "global_step": 235162, "epoch": 1399} {"train_loss": -11.827857971191406, "global_step": 235163, "epoch": 1399} {"train_loss": -11.857610702514648, "global_step": 235164, "epoch": 1399} {"train_loss": -11.432415008544922, "global_step": 235165, "epoch": 1399} {"train_loss": -11.569182395935059, "global_step": 235166, "epoch": 1399} {"train_loss": -11.343847274780273, "global_step": 235167, "epoch": 1399} {"train_loss": -11.75900650024414, "global_step": 235168, "epoch": 1399} {"train_loss": -11.637828826904297, "global_step": 235169, "epoch": 1399} {"train_loss": -11.72604751586914, "global_step": 235170, "epoch": 1399} {"train_loss": -12.0664644241333, "global_step": 235171, "epoch": 1399} {"train_loss": -11.63460636138916, "global_step": 235172, "epoch": 1399} {"train_loss": -11.69559097290039, "global_step": 235173, "epoch": 1399} {"train_loss": -11.959644317626953, "global_step": 235174, "epoch": 1399} {"train_loss": -11.535736083984375, "global_step": 235175, "epoch": 1399} {"train_loss": -11.556979179382324, "global_step": 235176, "epoch": 1399} {"train_loss": -11.83908748626709, "global_step": 235177, "epoch": 1399} {"train_loss": -11.871084213256836, "global_step": 235178, "epoch": 1399} {"train_loss": -11.670480728149414, "global_step": 235179, "epoch": 1399} {"train_loss": -11.8314208984375, "global_step": 235180, "epoch": 1399} {"train_loss": -11.547518730163574, "global_step": 235181, "epoch": 1399} {"train_loss": -11.770852088928223, "global_step": 235182, "epoch": 1399} {"train_loss": -11.771364212036133, "global_step": 235183, "epoch": 1399} {"train_loss": -11.801922798156738, "global_step": 235184, "epoch": 1399} {"train_loss": -11.374471664428711, "global_step": 235185, "epoch": 1399} {"train_loss": -11.518129348754883, "global_step": 235186, "epoch": 1399} {"train_loss": -11.691129684448242, "global_step": 235187, "epoch": 1399} {"train_loss": -11.17278003692627, "global_step": 235188, "epoch": 1399} {"train_loss": -11.781645774841309, "global_step": 235189, "epoch": 1399} {"train_loss": -11.648364067077637, "global_step": 235190, "epoch": 1399} {"train_loss": -11.430334091186523, "global_step": 235191, "epoch": 1399} {"train_loss": -11.657600402832031, "global_step": 235192, "epoch": 1399} {"train_loss": -11.757585525512695, "global_step": 235193, "epoch": 1399} {"train_loss": -11.763748168945312, "global_step": 235194, "epoch": 1399} {"train_loss": -11.311018943786621, "global_step": 235195, "epoch": 1399} {"train_loss": -11.59060001373291, "global_step": 235196, "epoch": 1399} {"train_loss": -11.626672744750977, "global_step": 235197, "epoch": 1399} {"train_loss": -11.413820266723633, "global_step": 235198, "epoch": 1399} {"train_loss": -11.504647249267215, "global_step": 235199, "epoch": 1399, "val_loss": 263047.96875} {"train_loss": -12.07149887084961, "global_step": 235200, "epoch": 1400} {"train_loss": -11.610330581665039, "global_step": 235201, "epoch": 1400} {"train_loss": -11.946861267089844, "global_step": 235202, "epoch": 1400} {"train_loss": -11.834728240966797, "global_step": 235203, "epoch": 1400} {"train_loss": -11.913984298706055, "global_step": 235204, "epoch": 1400} {"train_loss": -11.72810173034668, "global_step": 235205, "epoch": 1400} {"train_loss": -12.090045928955078, "global_step": 235206, "epoch": 1400} {"train_loss": -11.682842254638672, "global_step": 235207, "epoch": 1400} {"train_loss": -11.81889533996582, "global_step": 235208, "epoch": 1400} {"train_loss": -11.667530059814453, "global_step": 235209, "epoch": 1400} {"train_loss": -11.694917678833008, "global_step": 235210, "epoch": 1400} {"train_loss": -11.942209243774414, "global_step": 235211, "epoch": 1400} {"train_loss": -11.379682540893555, "global_step": 235212, "epoch": 1400} {"train_loss": -11.71290397644043, "global_step": 235213, "epoch": 1400} {"train_loss": -11.646980285644531, "global_step": 235214, "epoch": 1400} {"train_loss": -10.812287330627441, "global_step": 235215, "epoch": 1400} {"train_loss": -11.833337783813477, "global_step": 235216, "epoch": 1400} {"train_loss": -11.430137634277344, "global_step": 235217, "epoch": 1400} {"train_loss": -11.280801773071289, "global_step": 235218, "epoch": 1400} {"train_loss": -11.697782516479492, "global_step": 235219, "epoch": 1400} {"train_loss": -11.162816047668457, "global_step": 235220, "epoch": 1400} {"train_loss": -10.780083656311035, "global_step": 235221, "epoch": 1400} {"train_loss": -11.332180976867676, "global_step": 235222, "epoch": 1400} {"train_loss": -10.882055282592773, "global_step": 235223, "epoch": 1400} {"train_loss": -9.639856338500977, "global_step": 235224, "epoch": 1400} {"train_loss": -11.526875495910645, "global_step": 235225, "epoch": 1400} {"train_loss": -11.223785400390625, "global_step": 235226, "epoch": 1400} {"train_loss": -10.710813522338867, "global_step": 235227, "epoch": 1400} {"train_loss": -11.636590957641602, "global_step": 235228, "epoch": 1400} {"train_loss": -10.990533828735352, "global_step": 235229, "epoch": 1400} {"train_loss": -11.153219223022461, "global_step": 235230, "epoch": 1400} {"train_loss": -11.553781509399414, "global_step": 235231, "epoch": 1400} {"train_loss": -10.865827560424805, "global_step": 235232, "epoch": 1400} {"train_loss": -10.360142707824707, "global_step": 235233, "epoch": 1400} {"train_loss": -11.521270751953125, "global_step": 235234, "epoch": 1400} {"train_loss": -11.109349250793457, "global_step": 235235, "epoch": 1400} {"train_loss": -11.514595031738281, "global_step": 235236, "epoch": 1400} {"train_loss": -10.952282905578613, "global_step": 235237, "epoch": 1400} {"train_loss": -10.946538925170898, "global_step": 235238, "epoch": 1400} {"train_loss": -10.99200439453125, "global_step": 235239, "epoch": 1400} {"train_loss": -10.884370803833008, "global_step": 235240, "epoch": 1400} {"train_loss": -10.816567420959473, "global_step": 235241, "epoch": 1400} {"train_loss": -11.431955337524414, "global_step": 235242, "epoch": 1400} {"train_loss": -11.533345222473145, "global_step": 235243, "epoch": 1400} {"train_loss": -11.412463188171387, "global_step": 235244, "epoch": 1400} {"train_loss": -11.715734481811523, "global_step": 235245, "epoch": 1400} {"train_loss": -11.40150260925293, "global_step": 235246, "epoch": 1400} {"train_loss": -11.70853328704834, "global_step": 235247, "epoch": 1400} {"train_loss": -11.579378128051758, "global_step": 235248, "epoch": 1400} {"train_loss": -11.638086318969727, "global_step": 235249, "epoch": 1400} {"train_loss": -11.909231185913086, "global_step": 235250, "epoch": 1400} {"train_loss": -11.879117965698242, "global_step": 235251, "epoch": 1400} {"train_loss": -11.90218734741211, "global_step": 235252, "epoch": 1400} {"train_loss": -11.770061492919922, "global_step": 235253, "epoch": 1400} {"train_loss": -11.658332824707031, "global_step": 235254, "epoch": 1400} {"train_loss": -11.616020202636719, "global_step": 235255, "epoch": 1400} {"train_loss": -11.802156448364258, "global_step": 235256, "epoch": 1400} {"train_loss": -11.67617130279541, "global_step": 235257, "epoch": 1400} {"train_loss": -11.896158218383789, "global_step": 235258, "epoch": 1400} {"train_loss": -11.80786418914795, "global_step": 235259, "epoch": 1400} {"train_loss": -11.668011665344238, "global_step": 235260, "epoch": 1400} {"train_loss": -11.837234497070312, "global_step": 235261, "epoch": 1400} {"train_loss": -11.805850982666016, "global_step": 235262, "epoch": 1400} {"train_loss": -11.647315979003906, "global_step": 235263, "epoch": 1400} {"train_loss": -11.77143669128418, "global_step": 235264, "epoch": 1400} {"train_loss": -11.535270690917969, "global_step": 235265, "epoch": 1400} {"train_loss": -11.769593238830566, "global_step": 235266, "epoch": 1400} {"train_loss": -11.603212356567383, "global_step": 235267, "epoch": 1400} {"train_loss": -11.809259414672852, "global_step": 235268, "epoch": 1400} {"train_loss": -11.769370079040527, "global_step": 235269, "epoch": 1400} {"train_loss": -11.945629119873047, "global_step": 235270, "epoch": 1400} {"train_loss": -11.705609321594238, "global_step": 235271, "epoch": 1400} {"train_loss": -11.806398391723633, "global_step": 235272, "epoch": 1400} {"train_loss": -11.801130294799805, "global_step": 235273, "epoch": 1400} {"train_loss": -11.929941177368164, "global_step": 235274, "epoch": 1400} {"train_loss": -11.883013725280762, "global_step": 235275, "epoch": 1400} {"train_loss": -11.901228904724121, "global_step": 235276, "epoch": 1400} {"train_loss": -11.863801002502441, "global_step": 235277, "epoch": 1400} {"train_loss": -11.669092178344727, "global_step": 235278, "epoch": 1400} {"train_loss": -12.045064926147461, "global_step": 235279, "epoch": 1400} {"train_loss": -11.566460609436035, "global_step": 235280, "epoch": 1400} {"train_loss": -11.863391876220703, "global_step": 235281, "epoch": 1400} {"train_loss": -11.476433753967285, "global_step": 235282, "epoch": 1400} {"train_loss": -11.053335189819336, "global_step": 235283, "epoch": 1400} {"train_loss": -12.229290962219238, "global_step": 235284, "epoch": 1400} {"train_loss": -11.239370346069336, "global_step": 235285, "epoch": 1400} {"train_loss": -11.933577537536621, "global_step": 235286, "epoch": 1400} {"train_loss": -11.771444320678711, "global_step": 235287, "epoch": 1400} {"train_loss": -11.741843223571777, "global_step": 235288, "epoch": 1400} {"train_loss": -11.805707931518555, "global_step": 235289, "epoch": 1400} {"train_loss": -11.72901725769043, "global_step": 235290, "epoch": 1400} {"train_loss": -11.694450378417969, "global_step": 235291, "epoch": 1400} {"train_loss": -10.945454597473145, "global_step": 235292, "epoch": 1400} {"train_loss": -11.893107414245605, "global_step": 235293, "epoch": 1400} {"train_loss": -11.331670761108398, "global_step": 235294, "epoch": 1400} {"train_loss": -11.39764404296875, "global_step": 235295, "epoch": 1400} {"train_loss": -11.634820938110352, "global_step": 235296, "epoch": 1400} {"train_loss": -11.581537246704102, "global_step": 235297, "epoch": 1400} {"train_loss": -11.75152587890625, "global_step": 235298, "epoch": 1400} {"train_loss": -11.774693489074707, "global_step": 235299, "epoch": 1400} {"train_loss": -11.786052703857422, "global_step": 235300, "epoch": 1400} {"train_loss": -11.47100830078125, "global_step": 235301, "epoch": 1400} {"train_loss": -11.567842483520508, "global_step": 235302, "epoch": 1400} {"train_loss": -11.795225143432617, "global_step": 235303, "epoch": 1400} {"train_loss": -11.952798843383789, "global_step": 235304, "epoch": 1400} {"train_loss": -11.831056594848633, "global_step": 235305, "epoch": 1400} {"train_loss": -11.8007173538208, "global_step": 235306, "epoch": 1400} {"train_loss": -11.699394226074219, "global_step": 235307, "epoch": 1400} {"train_loss": -11.896671295166016, "global_step": 235308, "epoch": 1400} {"train_loss": -11.685734748840332, "global_step": 235309, "epoch": 1400} {"train_loss": -11.870706558227539, "global_step": 235310, "epoch": 1400} {"train_loss": -11.460142135620117, "global_step": 235311, "epoch": 1400} {"train_loss": -12.078213691711426, "global_step": 235312, "epoch": 1400} {"train_loss": -11.50326156616211, "global_step": 235313, "epoch": 1400} {"train_loss": -11.585630416870117, "global_step": 235314, "epoch": 1400} {"train_loss": -12.043989181518555, "global_step": 235315, "epoch": 1400} {"train_loss": -11.601655006408691, "global_step": 235316, "epoch": 1400} {"train_loss": -11.574353218078613, "global_step": 235317, "epoch": 1400} {"train_loss": -12.018219947814941, "global_step": 235318, "epoch": 1400} {"train_loss": -10.979104042053223, "global_step": 235319, "epoch": 1400} {"train_loss": -11.165998458862305, "global_step": 235320, "epoch": 1400} {"train_loss": -11.890152931213379, "global_step": 235321, "epoch": 1400} {"train_loss": -11.186202049255371, "global_step": 235322, "epoch": 1400} {"train_loss": -11.325431823730469, "global_step": 235323, "epoch": 1400} {"train_loss": -11.914737701416016, "global_step": 235324, "epoch": 1400} {"train_loss": -11.020413398742676, "global_step": 235325, "epoch": 1400} {"train_loss": -11.820569038391113, "global_step": 235326, "epoch": 1400} {"train_loss": -11.534965515136719, "global_step": 235327, "epoch": 1400} {"train_loss": -11.364097595214844, "global_step": 235328, "epoch": 1400} {"train_loss": -12.124598503112793, "global_step": 235329, "epoch": 1400} {"train_loss": -11.361420631408691, "global_step": 235330, "epoch": 1400} {"train_loss": -11.970298767089844, "global_step": 235331, "epoch": 1400} {"train_loss": -10.710686683654785, "global_step": 235332, "epoch": 1400} {"train_loss": -11.827875137329102, "global_step": 235333, "epoch": 1400} {"train_loss": -11.800238609313965, "global_step": 235334, "epoch": 1400} {"train_loss": -11.462700843811035, "global_step": 235335, "epoch": 1400} {"train_loss": -12.061423301696777, "global_step": 235336, "epoch": 1400} {"train_loss": -11.391464233398438, "global_step": 235337, "epoch": 1400} {"train_loss": -11.6819486618042, "global_step": 235338, "epoch": 1400} {"train_loss": -11.587481498718262, "global_step": 235339, "epoch": 1400} {"train_loss": -11.953786849975586, "global_step": 235340, "epoch": 1400} {"train_loss": -11.868363380432129, "global_step": 235341, "epoch": 1400} {"train_loss": -11.99245548248291, "global_step": 235342, "epoch": 1400} {"train_loss": -11.728545188903809, "global_step": 235343, "epoch": 1400} {"train_loss": -11.784477233886719, "global_step": 235344, "epoch": 1400} {"train_loss": -11.49930477142334, "global_step": 235345, "epoch": 1400} {"train_loss": -11.796307563781738, "global_step": 235346, "epoch": 1400} {"train_loss": -11.36307144165039, "global_step": 235347, "epoch": 1400} {"train_loss": -11.588150024414062, "global_step": 235348, "epoch": 1400} {"train_loss": -11.554803848266602, "global_step": 235349, "epoch": 1400} {"train_loss": -11.622446060180664, "global_step": 235350, "epoch": 1400} {"train_loss": -11.143519401550293, "global_step": 235351, "epoch": 1400} {"train_loss": -11.980056762695312, "global_step": 235352, "epoch": 1400} {"train_loss": -11.58764362335205, "global_step": 235353, "epoch": 1400} {"train_loss": -11.61915397644043, "global_step": 235354, "epoch": 1400} {"train_loss": -11.008092880249023, "global_step": 235355, "epoch": 1400} {"train_loss": -11.381571769714355, "global_step": 235356, "epoch": 1400} {"train_loss": -11.93979263305664, "global_step": 235357, "epoch": 1400} {"train_loss": -11.411752700805664, "global_step": 235358, "epoch": 1400} {"train_loss": -11.868009567260742, "global_step": 235359, "epoch": 1400} {"train_loss": -11.411079406738281, "global_step": 235360, "epoch": 1400} {"train_loss": -11.679819107055664, "global_step": 235361, "epoch": 1400} {"train_loss": -11.793758392333984, "global_step": 235362, "epoch": 1400} {"train_loss": -11.680482864379883, "global_step": 235363, "epoch": 1400} {"train_loss": -12.032873153686523, "global_step": 235364, "epoch": 1400} {"train_loss": -11.811967849731445, "global_step": 235365, "epoch": 1400} {"train_loss": -12.179336547851562, "global_step": 235366, "epoch": 1400} {"train_loss": -11.59055901709057, "global_step": 235367, "epoch": 1400, "train/sim_max_reward_0": 0.6517691344187034, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.9332210316228853, "train/sim_max_reward_4": 0.3221755139639959, "train/sim_max_reward_5": 0.6193146889730501, "test/sim_max_reward_4400000": 0.9895800706687784, "test/sim_max_reward_4400001": 0.3713728507428945, "test/sim_max_reward_4400002": 0.06053279421136337, "test/sim_max_reward_4400003": 0.4159142210344029, "test/sim_max_reward_4400004": 0.9813896041246929, "test/sim_max_reward_4400005": 0.9999452002199606, "test/sim_max_reward_4400006": 0.8538529650056115, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 0.5516238017508289, "test/sim_max_reward_4400009": 0.4291737291534544, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 0.3023622266950023, "test/sim_max_reward_4400012": 0.9570369781237128, "test/sim_max_reward_4400013": 0.8070834196022312, "test/sim_max_reward_4400014": 0.9812434874255845, "test/sim_max_reward_4400015": 0.4023655004566168, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9582657979284834, "test/sim_max_reward_4400019": 0.4588901178705478, "test/sim_max_reward_4400020": 0.40622807524828747, "test/sim_max_reward_4400021": 0.9630375851541083, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.9734055884428647, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6127609095945667, "test/sim_max_reward_4400026": 0.10714578425122946, "test/sim_max_reward_4400027": 0.3598927694284052, "test/sim_max_reward_4400028": 0.9856934024104497, "test/sim_max_reward_4400029": 0.42203577063562936, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9479554063057153, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.3685177125914646, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.9897728520682896, "test/sim_max_reward_4400036": 0.9802786560136991, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.9869651076479465, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9831173801609338, "test/sim_max_reward_4400042": 0.03655752284559263, "test/sim_max_reward_4400043": 0.030289334452675117, "test/sim_max_reward_4400044": 0.9708071536189481, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.3245455872374389, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.5877467281631058, "test/mean_score": 0.6213589201988811, "val_loss": 265746.09375, "train_action_mse_error": 1.3341885805130005} {"train_loss": -11.807928085327148, "global_step": 235368, "epoch": 1401} {"train_loss": -11.564398765563965, "global_step": 235369, "epoch": 1401} {"train_loss": -11.736747741699219, "global_step": 235370, "epoch": 1401} {"train_loss": -11.745458602905273, "global_step": 235371, "epoch": 1401} {"train_loss": -11.675925254821777, "global_step": 235372, "epoch": 1401} {"train_loss": -11.980388641357422, "global_step": 235373, "epoch": 1401} {"train_loss": -11.846916198730469, "global_step": 235374, "epoch": 1401} {"train_loss": -11.815443992614746, "global_step": 235375, "epoch": 1401} {"train_loss": -11.94266128540039, "global_step": 235376, "epoch": 1401} {"train_loss": -11.796049118041992, "global_step": 235377, "epoch": 1401} {"train_loss": -11.669118881225586, "global_step": 235378, "epoch": 1401} {"train_loss": -11.930511474609375, "global_step": 235379, "epoch": 1401} {"train_loss": -11.85394287109375, "global_step": 235380, "epoch": 1401} {"train_loss": -11.826777458190918, "global_step": 235381, "epoch": 1401} {"train_loss": -11.814043998718262, "global_step": 235382, "epoch": 1401} {"train_loss": -11.965540885925293, "global_step": 235383, "epoch": 1401} {"train_loss": -11.950891494750977, "global_step": 235384, "epoch": 1401} {"train_loss": -12.046710968017578, "global_step": 235385, "epoch": 1401} {"train_loss": -11.700152397155762, "global_step": 235386, "epoch": 1401} {"train_loss": -11.893545150756836, "global_step": 235387, "epoch": 1401} {"train_loss": -11.806063652038574, "global_step": 235388, "epoch": 1401} {"train_loss": -11.398178100585938, "global_step": 235389, "epoch": 1401} {"train_loss": -11.736455917358398, "global_step": 235390, "epoch": 1401} {"train_loss": -11.76880168914795, "global_step": 235391, "epoch": 1401} {"train_loss": -10.949606895446777, "global_step": 235392, "epoch": 1401} {"train_loss": -10.984580993652344, "global_step": 235393, "epoch": 1401} {"train_loss": -12.156368255615234, "global_step": 235394, "epoch": 1401} {"train_loss": -12.181486129760742, "global_step": 235395, "epoch": 1401} {"train_loss": -11.203630447387695, "global_step": 235396, "epoch": 1401} {"train_loss": -11.562177658081055, "global_step": 235397, "epoch": 1401} {"train_loss": -12.026707649230957, "global_step": 235398, "epoch": 1401} {"train_loss": -11.189596176147461, "global_step": 235399, "epoch": 1401} {"train_loss": -10.95602035522461, "global_step": 235400, "epoch": 1401} {"train_loss": -10.929847717285156, "global_step": 235401, "epoch": 1401} {"train_loss": -11.623825073242188, "global_step": 235402, "epoch": 1401} {"train_loss": -11.145066261291504, "global_step": 235403, "epoch": 1401} {"train_loss": -9.81161117553711, "global_step": 235404, "epoch": 1401} {"train_loss": -10.254181861877441, "global_step": 235405, "epoch": 1401} {"train_loss": -10.197216033935547, "global_step": 235406, "epoch": 1401} {"train_loss": -10.795110702514648, "global_step": 235407, "epoch": 1401} {"train_loss": -10.403502464294434, "global_step": 235408, "epoch": 1401} {"train_loss": -9.483068466186523, "global_step": 235409, "epoch": 1401} {"train_loss": -9.098840713500977, "global_step": 235410, "epoch": 1401} {"train_loss": -8.751039505004883, "global_step": 235411, "epoch": 1401} {"train_loss": -10.525399208068848, "global_step": 235412, "epoch": 1401} {"train_loss": -7.778883457183838, "global_step": 235413, "epoch": 1401} {"train_loss": -8.900629043579102, "global_step": 235414, "epoch": 1401} {"train_loss": -8.163192749023438, "global_step": 235415, "epoch": 1401} {"train_loss": -10.426275253295898, "global_step": 235416, "epoch": 1401} {"train_loss": -8.78924560546875, "global_step": 235417, "epoch": 1401} {"train_loss": -9.216538429260254, "global_step": 235418, "epoch": 1401} {"train_loss": -10.455549240112305, "global_step": 235419, "epoch": 1401} {"train_loss": -9.082844734191895, "global_step": 235420, "epoch": 1401} {"train_loss": -10.031296730041504, "global_step": 235421, "epoch": 1401} {"train_loss": -10.165903091430664, "global_step": 235422, "epoch": 1401} {"train_loss": -10.31011962890625, "global_step": 235423, "epoch": 1401} {"train_loss": -10.887798309326172, "global_step": 235424, "epoch": 1401} {"train_loss": -10.32018756866455, "global_step": 235425, "epoch": 1401} {"train_loss": -10.802186012268066, "global_step": 235426, "epoch": 1401} {"train_loss": -11.004402160644531, "global_step": 235427, "epoch": 1401} {"train_loss": -11.184531211853027, "global_step": 235428, "epoch": 1401} {"train_loss": -10.97642707824707, "global_step": 235429, "epoch": 1401} {"train_loss": -11.395502090454102, "global_step": 235430, "epoch": 1401} {"train_loss": -11.06181526184082, "global_step": 235431, "epoch": 1401} {"train_loss": -11.257797241210938, "global_step": 235432, "epoch": 1401} {"train_loss": -11.408534049987793, "global_step": 235433, "epoch": 1401} {"train_loss": -11.425314903259277, "global_step": 235434, "epoch": 1401} {"train_loss": -11.213325500488281, "global_step": 235435, "epoch": 1401} {"train_loss": -11.567813873291016, "global_step": 235436, "epoch": 1401} {"train_loss": -11.155061721801758, "global_step": 235437, "epoch": 1401} {"train_loss": -11.148491859436035, "global_step": 235438, "epoch": 1401} {"train_loss": -11.56734848022461, "global_step": 235439, "epoch": 1401} {"train_loss": -11.428484916687012, "global_step": 235440, "epoch": 1401} {"train_loss": -11.346750259399414, "global_step": 235441, "epoch": 1401} {"train_loss": -11.398902893066406, "global_step": 235442, "epoch": 1401} {"train_loss": -11.564864158630371, "global_step": 235443, "epoch": 1401} {"train_loss": -11.40009880065918, "global_step": 235444, "epoch": 1401} {"train_loss": -11.24801254272461, "global_step": 235445, "epoch": 1401} {"train_loss": -11.562676429748535, "global_step": 235446, "epoch": 1401} {"train_loss": -11.424705505371094, "global_step": 235447, "epoch": 1401} {"train_loss": -11.202789306640625, "global_step": 235448, "epoch": 1401} {"train_loss": -11.270458221435547, "global_step": 235449, "epoch": 1401} {"train_loss": -11.584613800048828, "global_step": 235450, "epoch": 1401} {"train_loss": -11.214876174926758, "global_step": 235451, "epoch": 1401} {"train_loss": -11.490152359008789, "global_step": 235452, "epoch": 1401} {"train_loss": -11.798290252685547, "global_step": 235453, "epoch": 1401} {"train_loss": -11.509546279907227, "global_step": 235454, "epoch": 1401} {"train_loss": -11.634992599487305, "global_step": 235455, "epoch": 1401} {"train_loss": -11.760851860046387, "global_step": 235456, "epoch": 1401} {"train_loss": -11.663898468017578, "global_step": 235457, "epoch": 1401} {"train_loss": -11.54395866394043, "global_step": 235458, "epoch": 1401} {"train_loss": -11.677803993225098, "global_step": 235459, "epoch": 1401} {"train_loss": -11.742656707763672, "global_step": 235460, "epoch": 1401} {"train_loss": -11.78811264038086, "global_step": 235461, "epoch": 1401} {"train_loss": -11.915692329406738, "global_step": 235462, "epoch": 1401} {"train_loss": -11.756195068359375, "global_step": 235463, "epoch": 1401} {"train_loss": -11.896963119506836, "global_step": 235464, "epoch": 1401} {"train_loss": -11.779172897338867, "global_step": 235465, "epoch": 1401} {"train_loss": -11.767990112304688, "global_step": 235466, "epoch": 1401} {"train_loss": -11.61322021484375, "global_step": 235467, "epoch": 1401} {"train_loss": -11.887517929077148, "global_step": 235468, "epoch": 1401} {"train_loss": -11.684585571289062, "global_step": 235469, "epoch": 1401} {"train_loss": -11.874408721923828, "global_step": 235470, "epoch": 1401} {"train_loss": -11.797903060913086, "global_step": 235471, "epoch": 1401} {"train_loss": -11.960155487060547, "global_step": 235472, "epoch": 1401} {"train_loss": -11.778249740600586, "global_step": 235473, "epoch": 1401} {"train_loss": -12.067752838134766, "global_step": 235474, "epoch": 1401} {"train_loss": -11.655888557434082, "global_step": 235475, "epoch": 1401} {"train_loss": -12.07902717590332, "global_step": 235476, "epoch": 1401} {"train_loss": -11.672293663024902, "global_step": 235477, "epoch": 1401} {"train_loss": -12.057910919189453, "global_step": 235478, "epoch": 1401} {"train_loss": -11.790945053100586, "global_step": 235479, "epoch": 1401} {"train_loss": -11.895035743713379, "global_step": 235480, "epoch": 1401} {"train_loss": -11.721761703491211, "global_step": 235481, "epoch": 1401} {"train_loss": -12.113786697387695, "global_step": 235482, "epoch": 1401} {"train_loss": -11.891664505004883, "global_step": 235483, "epoch": 1401} {"train_loss": -12.113574981689453, "global_step": 235484, "epoch": 1401} {"train_loss": -12.140302658081055, "global_step": 235485, "epoch": 1401} {"train_loss": -11.94191837310791, "global_step": 235486, "epoch": 1401} {"train_loss": -11.996504783630371, "global_step": 235487, "epoch": 1401} {"train_loss": -12.022785186767578, "global_step": 235488, "epoch": 1401} {"train_loss": -11.928669929504395, "global_step": 235489, "epoch": 1401} {"train_loss": -11.886640548706055, "global_step": 235490, "epoch": 1401} {"train_loss": -11.994579315185547, "global_step": 235491, "epoch": 1401} {"train_loss": -12.043254852294922, "global_step": 235492, "epoch": 1401} {"train_loss": -11.949783325195312, "global_step": 235493, "epoch": 1401} {"train_loss": -12.15461254119873, "global_step": 235494, "epoch": 1401} {"train_loss": -12.00436019897461, "global_step": 235495, "epoch": 1401} {"train_loss": -12.366365432739258, "global_step": 235496, "epoch": 1401} {"train_loss": -12.202507972717285, "global_step": 235497, "epoch": 1401} {"train_loss": -12.149279594421387, "global_step": 235498, "epoch": 1401} {"train_loss": -12.087043762207031, "global_step": 235499, "epoch": 1401} {"train_loss": -11.796733856201172, "global_step": 235500, "epoch": 1401} {"train_loss": -11.978890419006348, "global_step": 235501, "epoch": 1401} {"train_loss": -11.783068656921387, "global_step": 235502, "epoch": 1401} {"train_loss": -12.080305099487305, "global_step": 235503, "epoch": 1401} {"train_loss": -12.033788681030273, "global_step": 235504, "epoch": 1401} {"train_loss": -11.714600563049316, "global_step": 235505, "epoch": 1401} {"train_loss": -11.623326301574707, "global_step": 235506, "epoch": 1401} {"train_loss": -11.298595428466797, "global_step": 235507, "epoch": 1401} {"train_loss": -11.353046417236328, "global_step": 235508, "epoch": 1401} {"train_loss": -11.618118286132812, "global_step": 235509, "epoch": 1401} {"train_loss": -11.803569793701172, "global_step": 235510, "epoch": 1401} {"train_loss": -11.559242248535156, "global_step": 235511, "epoch": 1401} {"train_loss": -10.999868392944336, "global_step": 235512, "epoch": 1401} {"train_loss": -11.053911209106445, "global_step": 235513, "epoch": 1401} {"train_loss": -11.8494873046875, "global_step": 235514, "epoch": 1401} {"train_loss": -11.385324478149414, "global_step": 235515, "epoch": 1401} {"train_loss": -11.670182228088379, "global_step": 235516, "epoch": 1401} {"train_loss": -11.588377952575684, "global_step": 235517, "epoch": 1401} {"train_loss": -11.965032577514648, "global_step": 235518, "epoch": 1401} {"train_loss": -11.915838241577148, "global_step": 235519, "epoch": 1401} {"train_loss": -11.68319320678711, "global_step": 235520, "epoch": 1401} {"train_loss": -11.714410781860352, "global_step": 235521, "epoch": 1401} {"train_loss": -11.937780380249023, "global_step": 235522, "epoch": 1401} {"train_loss": -11.625972747802734, "global_step": 235523, "epoch": 1401} {"train_loss": -11.791954040527344, "global_step": 235524, "epoch": 1401} {"train_loss": -11.825197219848633, "global_step": 235525, "epoch": 1401} {"train_loss": -11.350773811340332, "global_step": 235526, "epoch": 1401} {"train_loss": -12.054384231567383, "global_step": 235527, "epoch": 1401} {"train_loss": -11.702810287475586, "global_step": 235528, "epoch": 1401} {"train_loss": -11.493128776550293, "global_step": 235529, "epoch": 1401} {"train_loss": -11.828269958496094, "global_step": 235530, "epoch": 1401} {"train_loss": -11.881830215454102, "global_step": 235531, "epoch": 1401} {"train_loss": -11.268445014953613, "global_step": 235532, "epoch": 1401} {"train_loss": -12.092765808105469, "global_step": 235533, "epoch": 1401} {"train_loss": -11.6784029006958, "global_step": 235534, "epoch": 1401} {"train_loss": -11.422067173889705, "global_step": 235535, "epoch": 1401, "val_loss": 265659.5} {"train_loss": -11.609979629516602, "global_step": 235536, "epoch": 1402} {"train_loss": -11.475263595581055, "global_step": 235537, "epoch": 1402} {"train_loss": -11.42010498046875, "global_step": 235538, "epoch": 1402} {"train_loss": -11.238418579101562, "global_step": 235539, "epoch": 1402} {"train_loss": -11.376301765441895, "global_step": 235540, "epoch": 1402} {"train_loss": -11.416852951049805, "global_step": 235541, "epoch": 1402} {"train_loss": -11.485218048095703, "global_step": 235542, "epoch": 1402} {"train_loss": -11.388195037841797, "global_step": 235543, "epoch": 1402} {"train_loss": -11.828539848327637, "global_step": 235544, "epoch": 1402} {"train_loss": -11.28692626953125, "global_step": 235545, "epoch": 1402} {"train_loss": -11.089923858642578, "global_step": 235546, "epoch": 1402} {"train_loss": -11.689054489135742, "global_step": 235547, "epoch": 1402} {"train_loss": -11.488195419311523, "global_step": 235548, "epoch": 1402} {"train_loss": -11.941305160522461, "global_step": 235549, "epoch": 1402} {"train_loss": -11.392919540405273, "global_step": 235550, "epoch": 1402} {"train_loss": -11.553579330444336, "global_step": 235551, "epoch": 1402} {"train_loss": -11.803520202636719, "global_step": 235552, "epoch": 1402} {"train_loss": -11.460614204406738, "global_step": 235553, "epoch": 1402} {"train_loss": -11.248973846435547, "global_step": 235554, "epoch": 1402} {"train_loss": -11.256183624267578, "global_step": 235555, "epoch": 1402} {"train_loss": -11.248186111450195, "global_step": 235556, "epoch": 1402} {"train_loss": -11.556018829345703, "global_step": 235557, "epoch": 1402} {"train_loss": -11.629351615905762, "global_step": 235558, "epoch": 1402} {"train_loss": -10.913461685180664, "global_step": 235559, "epoch": 1402} {"train_loss": -10.808547019958496, "global_step": 235560, "epoch": 1402} {"train_loss": -10.486865043640137, "global_step": 235561, "epoch": 1402} {"train_loss": -11.34132194519043, "global_step": 235562, "epoch": 1402} {"train_loss": -11.315574645996094, "global_step": 235563, "epoch": 1402} {"train_loss": -10.930315017700195, "global_step": 235564, "epoch": 1402} {"train_loss": -11.886552810668945, "global_step": 235565, "epoch": 1402} {"train_loss": -10.833076477050781, "global_step": 235566, "epoch": 1402} {"train_loss": -11.304021835327148, "global_step": 235567, "epoch": 1402} {"train_loss": -11.125970840454102, "global_step": 235568, "epoch": 1402} {"train_loss": -11.350452423095703, "global_step": 235569, "epoch": 1402} {"train_loss": -11.412064552307129, "global_step": 235570, "epoch": 1402} {"train_loss": -11.572415351867676, "global_step": 235571, "epoch": 1402} {"train_loss": -11.332707405090332, "global_step": 235572, "epoch": 1402} {"train_loss": -11.475924491882324, "global_step": 235573, "epoch": 1402} {"train_loss": -11.73083782196045, "global_step": 235574, "epoch": 1402} {"train_loss": -11.266550064086914, "global_step": 235575, "epoch": 1402} {"train_loss": -11.450664520263672, "global_step": 235576, "epoch": 1402} {"train_loss": -11.617171287536621, "global_step": 235577, "epoch": 1402} {"train_loss": -11.653263092041016, "global_step": 235578, "epoch": 1402} {"train_loss": -11.85232925415039, "global_step": 235579, "epoch": 1402} {"train_loss": -11.524053573608398, "global_step": 235580, "epoch": 1402} {"train_loss": -11.824370384216309, "global_step": 235581, "epoch": 1402} {"train_loss": -11.666943550109863, "global_step": 235582, "epoch": 1402} {"train_loss": -11.779781341552734, "global_step": 235583, "epoch": 1402} {"train_loss": -11.686424255371094, "global_step": 235584, "epoch": 1402} {"train_loss": -11.545445442199707, "global_step": 235585, "epoch": 1402} {"train_loss": -11.700643539428711, "global_step": 235586, "epoch": 1402} {"train_loss": -11.943220138549805, "global_step": 235587, "epoch": 1402} {"train_loss": -11.896873474121094, "global_step": 235588, "epoch": 1402} {"train_loss": -11.681072235107422, "global_step": 235589, "epoch": 1402} {"train_loss": -11.858501434326172, "global_step": 235590, "epoch": 1402} {"train_loss": -11.824518203735352, "global_step": 235591, "epoch": 1402} {"train_loss": -11.66114616394043, "global_step": 235592, "epoch": 1402} {"train_loss": -11.87665843963623, "global_step": 235593, "epoch": 1402} {"train_loss": -11.881546974182129, "global_step": 235594, "epoch": 1402} {"train_loss": -11.883487701416016, "global_step": 235595, "epoch": 1402} {"train_loss": -11.94871997833252, "global_step": 235596, "epoch": 1402} {"train_loss": -12.035872459411621, "global_step": 235597, "epoch": 1402} {"train_loss": -11.965028762817383, "global_step": 235598, "epoch": 1402} {"train_loss": -11.90041732788086, "global_step": 235599, "epoch": 1402} {"train_loss": -12.065939903259277, "global_step": 235600, "epoch": 1402} {"train_loss": -11.76524543762207, "global_step": 235601, "epoch": 1402} {"train_loss": -11.799073219299316, "global_step": 235602, "epoch": 1402} {"train_loss": -11.977010726928711, "global_step": 235603, "epoch": 1402} {"train_loss": -11.816648483276367, "global_step": 235604, "epoch": 1402} {"train_loss": -11.730218887329102, "global_step": 235605, "epoch": 1402} {"train_loss": -11.468390464782715, "global_step": 235606, "epoch": 1402} {"train_loss": -11.949708938598633, "global_step": 235607, "epoch": 1402} {"train_loss": -11.800531387329102, "global_step": 235608, "epoch": 1402} {"train_loss": -11.904291152954102, "global_step": 235609, "epoch": 1402} {"train_loss": -11.917695999145508, "global_step": 235610, "epoch": 1402} {"train_loss": -11.799798965454102, "global_step": 235611, "epoch": 1402} {"train_loss": -11.738967895507812, "global_step": 235612, "epoch": 1402} {"train_loss": -12.173456192016602, "global_step": 235613, "epoch": 1402} {"train_loss": -11.639944076538086, "global_step": 235614, "epoch": 1402} {"train_loss": -11.382064819335938, "global_step": 235615, "epoch": 1402} {"train_loss": -12.093114852905273, "global_step": 235616, "epoch": 1402} {"train_loss": -11.719280242919922, "global_step": 235617, "epoch": 1402} {"train_loss": -11.994495391845703, "global_step": 235618, "epoch": 1402} {"train_loss": -12.110393524169922, "global_step": 235619, "epoch": 1402} {"train_loss": -12.000555038452148, "global_step": 235620, "epoch": 1402} {"train_loss": -11.887079238891602, "global_step": 235621, "epoch": 1402} {"train_loss": -12.159419059753418, "global_step": 235622, "epoch": 1402} {"train_loss": -11.763148307800293, "global_step": 235623, "epoch": 1402} {"train_loss": -11.578447341918945, "global_step": 235624, "epoch": 1402} {"train_loss": -11.400068283081055, "global_step": 235625, "epoch": 1402} {"train_loss": -11.655256271362305, "global_step": 235626, "epoch": 1402} {"train_loss": -10.407833099365234, "global_step": 235627, "epoch": 1402} {"train_loss": -11.056376457214355, "global_step": 235628, "epoch": 1402} {"train_loss": -11.356485366821289, "global_step": 235629, "epoch": 1402} {"train_loss": -10.259720802307129, "global_step": 235630, "epoch": 1402} {"train_loss": -11.069564819335938, "global_step": 235631, "epoch": 1402} {"train_loss": -10.606218338012695, "global_step": 235632, "epoch": 1402} {"train_loss": -9.585071563720703, "global_step": 235633, "epoch": 1402} {"train_loss": -8.739068984985352, "global_step": 235634, "epoch": 1402} {"train_loss": -11.57175064086914, "global_step": 235635, "epoch": 1402} {"train_loss": -8.713050842285156, "global_step": 235636, "epoch": 1402} {"train_loss": -9.745499610900879, "global_step": 235637, "epoch": 1402} {"train_loss": -10.321113586425781, "global_step": 235638, "epoch": 1402} {"train_loss": -9.510085105895996, "global_step": 235639, "epoch": 1402} {"train_loss": -10.764143943786621, "global_step": 235640, "epoch": 1402} {"train_loss": -9.537910461425781, "global_step": 235641, "epoch": 1402} {"train_loss": -10.576377868652344, "global_step": 235642, "epoch": 1402} {"train_loss": -10.128279685974121, "global_step": 235643, "epoch": 1402} {"train_loss": -10.263851165771484, "global_step": 235644, "epoch": 1402} {"train_loss": -9.844383239746094, "global_step": 235645, "epoch": 1402} {"train_loss": -11.070341110229492, "global_step": 235646, "epoch": 1402} {"train_loss": -10.61328125, "global_step": 235647, "epoch": 1402} {"train_loss": -11.585707664489746, "global_step": 235648, "epoch": 1402} {"train_loss": -10.684279441833496, "global_step": 235649, "epoch": 1402} {"train_loss": -11.182215690612793, "global_step": 235650, "epoch": 1402} {"train_loss": -10.266648292541504, "global_step": 235651, "epoch": 1402} {"train_loss": -11.253889083862305, "global_step": 235652, "epoch": 1402} {"train_loss": -10.839067459106445, "global_step": 235653, "epoch": 1402} {"train_loss": -11.315382957458496, "global_step": 235654, "epoch": 1402} {"train_loss": -10.817895889282227, "global_step": 235655, "epoch": 1402} {"train_loss": -11.511272430419922, "global_step": 235656, "epoch": 1402} {"train_loss": -11.143269538879395, "global_step": 235657, "epoch": 1402} {"train_loss": -11.536054611206055, "global_step": 235658, "epoch": 1402} {"train_loss": -11.333907127380371, "global_step": 235659, "epoch": 1402} {"train_loss": -11.139063835144043, "global_step": 235660, "epoch": 1402} {"train_loss": -11.72553825378418, "global_step": 235661, "epoch": 1402} {"train_loss": -11.43496322631836, "global_step": 235662, "epoch": 1402} {"train_loss": -11.66087532043457, "global_step": 235663, "epoch": 1402} {"train_loss": -11.754144668579102, "global_step": 235664, "epoch": 1402} {"train_loss": -11.686738967895508, "global_step": 235665, "epoch": 1402} {"train_loss": -11.45940113067627, "global_step": 235666, "epoch": 1402} {"train_loss": -11.650078773498535, "global_step": 235667, "epoch": 1402} {"train_loss": -11.754222869873047, "global_step": 235668, "epoch": 1402} {"train_loss": -11.348280906677246, "global_step": 235669, "epoch": 1402} {"train_loss": -11.620986938476562, "global_step": 235670, "epoch": 1402} {"train_loss": -11.35205364227295, "global_step": 235671, "epoch": 1402} {"train_loss": -11.536591529846191, "global_step": 235672, "epoch": 1402} {"train_loss": -11.611200332641602, "global_step": 235673, "epoch": 1402} {"train_loss": -11.641456604003906, "global_step": 235674, "epoch": 1402} {"train_loss": -11.532428741455078, "global_step": 235675, "epoch": 1402} {"train_loss": -11.702589988708496, "global_step": 235676, "epoch": 1402} {"train_loss": -11.672443389892578, "global_step": 235677, "epoch": 1402} {"train_loss": -11.659832000732422, "global_step": 235678, "epoch": 1402} {"train_loss": -11.955612182617188, "global_step": 235679, "epoch": 1402} {"train_loss": -11.553022384643555, "global_step": 235680, "epoch": 1402} {"train_loss": -11.582244873046875, "global_step": 235681, "epoch": 1402} {"train_loss": -11.605981826782227, "global_step": 235682, "epoch": 1402} {"train_loss": -11.731281280517578, "global_step": 235683, "epoch": 1402} {"train_loss": -11.801198959350586, "global_step": 235684, "epoch": 1402} {"train_loss": -11.857194900512695, "global_step": 235685, "epoch": 1402} {"train_loss": -11.73945140838623, "global_step": 235686, "epoch": 1402} {"train_loss": -11.935649871826172, "global_step": 235687, "epoch": 1402} {"train_loss": -11.810818672180176, "global_step": 235688, "epoch": 1402} {"train_loss": -11.92006778717041, "global_step": 235689, "epoch": 1402} {"train_loss": -11.867250442504883, "global_step": 235690, "epoch": 1402} {"train_loss": -11.90031623840332, "global_step": 235691, "epoch": 1402} {"train_loss": -11.809514999389648, "global_step": 235692, "epoch": 1402} {"train_loss": -11.933061599731445, "global_step": 235693, "epoch": 1402} {"train_loss": -12.12541389465332, "global_step": 235694, "epoch": 1402} {"train_loss": -11.95728874206543, "global_step": 235695, "epoch": 1402} {"train_loss": -11.648191452026367, "global_step": 235696, "epoch": 1402} {"train_loss": -11.867243766784668, "global_step": 235697, "epoch": 1402} {"train_loss": -11.731157302856445, "global_step": 235698, "epoch": 1402} {"train_loss": -12.004165649414062, "global_step": 235699, "epoch": 1402} {"train_loss": -11.80670166015625, "global_step": 235700, "epoch": 1402} {"train_loss": -12.044482231140137, "global_step": 235701, "epoch": 1402} {"train_loss": -11.814943313598633, "global_step": 235702, "epoch": 1402} {"train_loss": -11.44029616741907, "global_step": 235703, "epoch": 1402, "val_loss": 256481.953125} {"train_loss": -11.948345184326172, "global_step": 235704, "epoch": 1403} {"train_loss": -11.940784454345703, "global_step": 235705, "epoch": 1403} {"train_loss": -11.9328031539917, "global_step": 235706, "epoch": 1403} {"train_loss": -11.823942184448242, "global_step": 235707, "epoch": 1403} {"train_loss": -11.856415748596191, "global_step": 235708, "epoch": 1403} {"train_loss": -12.05712890625, "global_step": 235709, "epoch": 1403} {"train_loss": -11.814166069030762, "global_step": 235710, "epoch": 1403} {"train_loss": -11.988092422485352, "global_step": 235711, "epoch": 1403} {"train_loss": -11.915077209472656, "global_step": 235712, "epoch": 1403} {"train_loss": -11.89190673828125, "global_step": 235713, "epoch": 1403} {"train_loss": -11.551133155822754, "global_step": 235714, "epoch": 1403} {"train_loss": -11.816314697265625, "global_step": 235715, "epoch": 1403} {"train_loss": -12.05347728729248, "global_step": 235716, "epoch": 1403} {"train_loss": -11.81251335144043, "global_step": 235717, "epoch": 1403} {"train_loss": -11.355914115905762, "global_step": 235718, "epoch": 1403} {"train_loss": -11.73489761352539, "global_step": 235719, "epoch": 1403} {"train_loss": -11.984763145446777, "global_step": 235720, "epoch": 1403} {"train_loss": -11.799290657043457, "global_step": 235721, "epoch": 1403} {"train_loss": -11.270570755004883, "global_step": 235722, "epoch": 1403} {"train_loss": -10.236879348754883, "global_step": 235723, "epoch": 1403} {"train_loss": -10.943155288696289, "global_step": 235724, "epoch": 1403} {"train_loss": -11.765447616577148, "global_step": 235725, "epoch": 1403} {"train_loss": -11.64677619934082, "global_step": 235726, "epoch": 1403} {"train_loss": -9.61309814453125, "global_step": 235727, "epoch": 1403} {"train_loss": -10.359628677368164, "global_step": 235728, "epoch": 1403} {"train_loss": -11.901327133178711, "global_step": 235729, "epoch": 1403} {"train_loss": -9.656463623046875, "global_step": 235730, "epoch": 1403} {"train_loss": -11.025517463684082, "global_step": 235731, "epoch": 1403} {"train_loss": -11.040288925170898, "global_step": 235732, "epoch": 1403} {"train_loss": -11.002904891967773, "global_step": 235733, "epoch": 1403} {"train_loss": -10.586264610290527, "global_step": 235734, "epoch": 1403} {"train_loss": -10.9691162109375, "global_step": 235735, "epoch": 1403} {"train_loss": -10.995147705078125, "global_step": 235736, "epoch": 1403} {"train_loss": -11.192024230957031, "global_step": 235737, "epoch": 1403} {"train_loss": -11.028505325317383, "global_step": 235738, "epoch": 1403} {"train_loss": -11.512650489807129, "global_step": 235739, "epoch": 1403} {"train_loss": -10.761153221130371, "global_step": 235740, "epoch": 1403} {"train_loss": -11.588438034057617, "global_step": 235741, "epoch": 1403} {"train_loss": -11.04065990447998, "global_step": 235742, "epoch": 1403} {"train_loss": -11.740984916687012, "global_step": 235743, "epoch": 1403} {"train_loss": -10.544022560119629, "global_step": 235744, "epoch": 1403} {"train_loss": -11.478191375732422, "global_step": 235745, "epoch": 1403} {"train_loss": -11.41209602355957, "global_step": 235746, "epoch": 1403} {"train_loss": -11.401355743408203, "global_step": 235747, "epoch": 1403} {"train_loss": -11.341893196105957, "global_step": 235748, "epoch": 1403} {"train_loss": -10.960296630859375, "global_step": 235749, "epoch": 1403} {"train_loss": -11.529336929321289, "global_step": 235750, "epoch": 1403} {"train_loss": -11.302165031433105, "global_step": 235751, "epoch": 1403} {"train_loss": -11.70409107208252, "global_step": 235752, "epoch": 1403} {"train_loss": -11.14142894744873, "global_step": 235753, "epoch": 1403} {"train_loss": -11.350933074951172, "global_step": 235754, "epoch": 1403} {"train_loss": -11.939188003540039, "global_step": 235755, "epoch": 1403} {"train_loss": -11.253329277038574, "global_step": 235756, "epoch": 1403} {"train_loss": -11.187034606933594, "global_step": 235757, "epoch": 1403} {"train_loss": -11.28657341003418, "global_step": 235758, "epoch": 1403} {"train_loss": -10.444629669189453, "global_step": 235759, "epoch": 1403} {"train_loss": -11.83156967163086, "global_step": 235760, "epoch": 1403} {"train_loss": -11.2380952835083, "global_step": 235761, "epoch": 1403} {"train_loss": -11.181535720825195, "global_step": 235762, "epoch": 1403} {"train_loss": -11.227018356323242, "global_step": 235763, "epoch": 1403} {"train_loss": -11.077461242675781, "global_step": 235764, "epoch": 1403} {"train_loss": -11.869287490844727, "global_step": 235765, "epoch": 1403} {"train_loss": -11.049112319946289, "global_step": 235766, "epoch": 1403} {"train_loss": -11.418129920959473, "global_step": 235767, "epoch": 1403} {"train_loss": -11.114273071289062, "global_step": 235768, "epoch": 1403} {"train_loss": -11.857892990112305, "global_step": 235769, "epoch": 1403} {"train_loss": -10.947060585021973, "global_step": 235770, "epoch": 1403} {"train_loss": -11.640109062194824, "global_step": 235771, "epoch": 1403} {"train_loss": -11.411869049072266, "global_step": 235772, "epoch": 1403} {"train_loss": -11.745467185974121, "global_step": 235773, "epoch": 1403} {"train_loss": -10.925931930541992, "global_step": 235774, "epoch": 1403} {"train_loss": -11.410290718078613, "global_step": 235775, "epoch": 1403} {"train_loss": -11.294631958007812, "global_step": 235776, "epoch": 1403} {"train_loss": -11.189298629760742, "global_step": 235777, "epoch": 1403} {"train_loss": -11.699691772460938, "global_step": 235778, "epoch": 1403} {"train_loss": -11.590309143066406, "global_step": 235779, "epoch": 1403} {"train_loss": -11.758160591125488, "global_step": 235780, "epoch": 1403} {"train_loss": -11.867645263671875, "global_step": 235781, "epoch": 1403} {"train_loss": -11.627151489257812, "global_step": 235782, "epoch": 1403} {"train_loss": -11.730955123901367, "global_step": 235783, "epoch": 1403} {"train_loss": -11.784524917602539, "global_step": 235784, "epoch": 1403} {"train_loss": -11.881080627441406, "global_step": 235785, "epoch": 1403} {"train_loss": -11.826690673828125, "global_step": 235786, "epoch": 1403} {"train_loss": -11.596708297729492, "global_step": 235787, "epoch": 1403} {"train_loss": -11.882576942443848, "global_step": 235788, "epoch": 1403} {"train_loss": -11.79348373413086, "global_step": 235789, "epoch": 1403} {"train_loss": -11.638480186462402, "global_step": 235790, "epoch": 1403} {"train_loss": -12.074557304382324, "global_step": 235791, "epoch": 1403} {"train_loss": -11.600447654724121, "global_step": 235792, "epoch": 1403} {"train_loss": -11.753396987915039, "global_step": 235793, "epoch": 1403} {"train_loss": -11.680357933044434, "global_step": 235794, "epoch": 1403} {"train_loss": -11.743276596069336, "global_step": 235795, "epoch": 1403} {"train_loss": -11.848831176757812, "global_step": 235796, "epoch": 1403} {"train_loss": -12.048929214477539, "global_step": 235797, "epoch": 1403} {"train_loss": -12.070722579956055, "global_step": 235798, "epoch": 1403} {"train_loss": -11.98904800415039, "global_step": 235799, "epoch": 1403} {"train_loss": -12.010629653930664, "global_step": 235800, "epoch": 1403} {"train_loss": -11.969858169555664, "global_step": 235801, "epoch": 1403} {"train_loss": -12.114795684814453, "global_step": 235802, "epoch": 1403} {"train_loss": -12.1339111328125, "global_step": 235803, "epoch": 1403} {"train_loss": -12.176648139953613, "global_step": 235804, "epoch": 1403} {"train_loss": -12.130945205688477, "global_step": 235805, "epoch": 1403} {"train_loss": -12.090167045593262, "global_step": 235806, "epoch": 1403} {"train_loss": -12.11351490020752, "global_step": 235807, "epoch": 1403} {"train_loss": -12.072366714477539, "global_step": 235808, "epoch": 1403} {"train_loss": -12.082381248474121, "global_step": 235809, "epoch": 1403} {"train_loss": -12.059999465942383, "global_step": 235810, "epoch": 1403} {"train_loss": -11.786029815673828, "global_step": 235811, "epoch": 1403} {"train_loss": -12.11427116394043, "global_step": 235812, "epoch": 1403} {"train_loss": -12.115274429321289, "global_step": 235813, "epoch": 1403} {"train_loss": -12.06289005279541, "global_step": 235814, "epoch": 1403} {"train_loss": -12.128867149353027, "global_step": 235815, "epoch": 1403} {"train_loss": -12.0430908203125, "global_step": 235816, "epoch": 1403} {"train_loss": -12.015108108520508, "global_step": 235817, "epoch": 1403} {"train_loss": -12.008214950561523, "global_step": 235818, "epoch": 1403} {"train_loss": -11.933195114135742, "global_step": 235819, "epoch": 1403} {"train_loss": -12.058631896972656, "global_step": 235820, "epoch": 1403} {"train_loss": -12.159099578857422, "global_step": 235821, "epoch": 1403} {"train_loss": -11.85322380065918, "global_step": 235822, "epoch": 1403} {"train_loss": -11.861297607421875, "global_step": 235823, "epoch": 1403} {"train_loss": -12.076870918273926, "global_step": 235824, "epoch": 1403} {"train_loss": -11.915399551391602, "global_step": 235825, "epoch": 1403} {"train_loss": -11.745378494262695, "global_step": 235826, "epoch": 1403} {"train_loss": -12.123571395874023, "global_step": 235827, "epoch": 1403} {"train_loss": -12.006056785583496, "global_step": 235828, "epoch": 1403} {"train_loss": -11.972024917602539, "global_step": 235829, "epoch": 1403} {"train_loss": -12.099867820739746, "global_step": 235830, "epoch": 1403} {"train_loss": -12.190982818603516, "global_step": 235831, "epoch": 1403} {"train_loss": -11.474746704101562, "global_step": 235832, "epoch": 1403} {"train_loss": -11.53872299194336, "global_step": 235833, "epoch": 1403} {"train_loss": -9.970364570617676, "global_step": 235834, "epoch": 1403} {"train_loss": -9.514665603637695, "global_step": 235835, "epoch": 1403} {"train_loss": -10.14171028137207, "global_step": 235836, "epoch": 1403} {"train_loss": -11.398519515991211, "global_step": 235837, "epoch": 1403} {"train_loss": -10.344036102294922, "global_step": 235838, "epoch": 1403} {"train_loss": -10.385252952575684, "global_step": 235839, "epoch": 1403} {"train_loss": -11.465531349182129, "global_step": 235840, "epoch": 1403} {"train_loss": -11.021065711975098, "global_step": 235841, "epoch": 1403} {"train_loss": -11.178716659545898, "global_step": 235842, "epoch": 1403} {"train_loss": -10.762677192687988, "global_step": 235843, "epoch": 1403} {"train_loss": -11.109475135803223, "global_step": 235844, "epoch": 1403} {"train_loss": -9.600788116455078, "global_step": 235845, "epoch": 1403} {"train_loss": -10.12397575378418, "global_step": 235846, "epoch": 1403} {"train_loss": -10.383033752441406, "global_step": 235847, "epoch": 1403} {"train_loss": -8.927356719970703, "global_step": 235848, "epoch": 1403} {"train_loss": -8.658404350280762, "global_step": 235849, "epoch": 1403} {"train_loss": -9.15799331665039, "global_step": 235850, "epoch": 1403} {"train_loss": -10.265867233276367, "global_step": 235851, "epoch": 1403} {"train_loss": -8.701168060302734, "global_step": 235852, "epoch": 1403} {"train_loss": -9.793778419494629, "global_step": 235853, "epoch": 1403} {"train_loss": -9.511442184448242, "global_step": 235854, "epoch": 1403} {"train_loss": -10.317251205444336, "global_step": 235855, "epoch": 1403} {"train_loss": -10.269140243530273, "global_step": 235856, "epoch": 1403} {"train_loss": -10.289480209350586, "global_step": 235857, "epoch": 1403} {"train_loss": -11.123917579650879, "global_step": 235858, "epoch": 1403} {"train_loss": -10.287439346313477, "global_step": 235859, "epoch": 1403} {"train_loss": -11.07738208770752, "global_step": 235860, "epoch": 1403} {"train_loss": -10.839693069458008, "global_step": 235861, "epoch": 1403} {"train_loss": -11.154891967773438, "global_step": 235862, "epoch": 1403} {"train_loss": -10.952061653137207, "global_step": 235863, "epoch": 1403} {"train_loss": -11.372862815856934, "global_step": 235864, "epoch": 1403} {"train_loss": -11.357917785644531, "global_step": 235865, "epoch": 1403} {"train_loss": -11.300509452819824, "global_step": 235866, "epoch": 1403} {"train_loss": -11.269122123718262, "global_step": 235867, "epoch": 1403} {"train_loss": -11.033541679382324, "global_step": 235868, "epoch": 1403} {"train_loss": -11.286598205566406, "global_step": 235869, "epoch": 1403} {"train_loss": -11.196333885192871, "global_step": 235870, "epoch": 1403} {"train_loss": -11.348750988642374, "global_step": 235871, "epoch": 1403, "val_loss": 264114.71875} {"train_loss": -11.489002227783203, "global_step": 235872, "epoch": 1404} {"train_loss": -11.510353088378906, "global_step": 235873, "epoch": 1404} {"train_loss": -11.309369087219238, "global_step": 235874, "epoch": 1404} {"train_loss": -11.448433876037598, "global_step": 235875, "epoch": 1404} {"train_loss": -11.390243530273438, "global_step": 235876, "epoch": 1404} {"train_loss": -11.636922836303711, "global_step": 235877, "epoch": 1404} {"train_loss": -11.501110076904297, "global_step": 235878, "epoch": 1404} {"train_loss": -11.566567420959473, "global_step": 235879, "epoch": 1404} {"train_loss": -11.510825157165527, "global_step": 235880, "epoch": 1404} {"train_loss": -11.73420524597168, "global_step": 235881, "epoch": 1404} {"train_loss": -11.58294677734375, "global_step": 235882, "epoch": 1404} {"train_loss": -11.492149353027344, "global_step": 235883, "epoch": 1404} {"train_loss": -11.697835922241211, "global_step": 235884, "epoch": 1404} {"train_loss": -11.428875923156738, "global_step": 235885, "epoch": 1404} {"train_loss": -11.693670272827148, "global_step": 235886, "epoch": 1404} {"train_loss": -11.706777572631836, "global_step": 235887, "epoch": 1404} {"train_loss": -11.464818000793457, "global_step": 235888, "epoch": 1404} {"train_loss": -11.534975051879883, "global_step": 235889, "epoch": 1404} {"train_loss": -11.705977439880371, "global_step": 235890, "epoch": 1404} {"train_loss": -11.771405220031738, "global_step": 235891, "epoch": 1404} {"train_loss": -11.791236877441406, "global_step": 235892, "epoch": 1404} {"train_loss": -11.473690032958984, "global_step": 235893, "epoch": 1404} {"train_loss": -11.777137756347656, "global_step": 235894, "epoch": 1404} {"train_loss": -11.620058059692383, "global_step": 235895, "epoch": 1404} {"train_loss": -11.760269165039062, "global_step": 235896, "epoch": 1404} {"train_loss": -11.761757850646973, "global_step": 235897, "epoch": 1404} {"train_loss": -11.951027870178223, "global_step": 235898, "epoch": 1404} {"train_loss": -11.860552787780762, "global_step": 235899, "epoch": 1404} {"train_loss": -11.901721000671387, "global_step": 235900, "epoch": 1404} {"train_loss": -11.823671340942383, "global_step": 235901, "epoch": 1404} {"train_loss": -11.936739921569824, "global_step": 235902, "epoch": 1404} {"train_loss": -11.909980773925781, "global_step": 235903, "epoch": 1404} {"train_loss": -11.869489669799805, "global_step": 235904, "epoch": 1404} {"train_loss": -11.819421768188477, "global_step": 235905, "epoch": 1404} {"train_loss": -12.028347969055176, "global_step": 235906, "epoch": 1404} {"train_loss": -12.022012710571289, "global_step": 235907, "epoch": 1404} {"train_loss": -12.043257713317871, "global_step": 235908, "epoch": 1404} {"train_loss": -12.127037048339844, "global_step": 235909, "epoch": 1404} {"train_loss": -12.00275993347168, "global_step": 235910, "epoch": 1404} {"train_loss": -11.93574047088623, "global_step": 235911, "epoch": 1404} {"train_loss": -12.065296173095703, "global_step": 235912, "epoch": 1404} {"train_loss": -12.026300430297852, "global_step": 235913, "epoch": 1404} {"train_loss": -12.184629440307617, "global_step": 235914, "epoch": 1404} {"train_loss": -11.943424224853516, "global_step": 235915, "epoch": 1404} {"train_loss": -12.072221755981445, "global_step": 235916, "epoch": 1404} {"train_loss": -11.960851669311523, "global_step": 235917, "epoch": 1404} {"train_loss": -12.163383483886719, "global_step": 235918, "epoch": 1404} {"train_loss": -12.15505313873291, "global_step": 235919, "epoch": 1404} {"train_loss": -11.994657516479492, "global_step": 235920, "epoch": 1404} {"train_loss": -12.082164764404297, "global_step": 235921, "epoch": 1404} {"train_loss": -11.774099349975586, "global_step": 235922, "epoch": 1404} {"train_loss": -12.103958129882812, "global_step": 235923, "epoch": 1404} {"train_loss": -12.15086555480957, "global_step": 235924, "epoch": 1404} {"train_loss": -11.737174034118652, "global_step": 235925, "epoch": 1404} {"train_loss": -11.858596801757812, "global_step": 235926, "epoch": 1404} {"train_loss": -12.175374984741211, "global_step": 235927, "epoch": 1404} {"train_loss": -11.781661987304688, "global_step": 235928, "epoch": 1404} {"train_loss": -12.067901611328125, "global_step": 235929, "epoch": 1404} {"train_loss": -12.23161506652832, "global_step": 235930, "epoch": 1404} {"train_loss": -11.956113815307617, "global_step": 235931, "epoch": 1404} {"train_loss": -12.18453598022461, "global_step": 235932, "epoch": 1404} {"train_loss": -12.289098739624023, "global_step": 235933, "epoch": 1404} {"train_loss": -11.68701171875, "global_step": 235934, "epoch": 1404} {"train_loss": -11.943292617797852, "global_step": 235935, "epoch": 1404} {"train_loss": -12.107513427734375, "global_step": 235936, "epoch": 1404} {"train_loss": -11.841334342956543, "global_step": 235937, "epoch": 1404} {"train_loss": -11.701875686645508, "global_step": 235938, "epoch": 1404} {"train_loss": -12.149620056152344, "global_step": 235939, "epoch": 1404} {"train_loss": -12.139802932739258, "global_step": 235940, "epoch": 1404} {"train_loss": -12.011300086975098, "global_step": 235941, "epoch": 1404} {"train_loss": -11.798704147338867, "global_step": 235942, "epoch": 1404} {"train_loss": -12.006972312927246, "global_step": 235943, "epoch": 1404} {"train_loss": -11.905752182006836, "global_step": 235944, "epoch": 1404} {"train_loss": -11.983484268188477, "global_step": 235945, "epoch": 1404} {"train_loss": -11.980506896972656, "global_step": 235946, "epoch": 1404} {"train_loss": -12.044425010681152, "global_step": 235947, "epoch": 1404} {"train_loss": -12.122871398925781, "global_step": 235948, "epoch": 1404} {"train_loss": -11.928974151611328, "global_step": 235949, "epoch": 1404} {"train_loss": -11.93735408782959, "global_step": 235950, "epoch": 1404} {"train_loss": -11.951252937316895, "global_step": 235951, "epoch": 1404} {"train_loss": -12.214153289794922, "global_step": 235952, "epoch": 1404} {"train_loss": -12.032835006713867, "global_step": 235953, "epoch": 1404} {"train_loss": -11.88313102722168, "global_step": 235954, "epoch": 1404} {"train_loss": -12.041399002075195, "global_step": 235955, "epoch": 1404} {"train_loss": -11.783658027648926, "global_step": 235956, "epoch": 1404} {"train_loss": -11.754717826843262, "global_step": 235957, "epoch": 1404} {"train_loss": -11.924739837646484, "global_step": 235958, "epoch": 1404} {"train_loss": -11.983561515808105, "global_step": 235959, "epoch": 1404} {"train_loss": -11.988839149475098, "global_step": 235960, "epoch": 1404} {"train_loss": -10.664192199707031, "global_step": 235961, "epoch": 1404} {"train_loss": -11.222667694091797, "global_step": 235962, "epoch": 1404} {"train_loss": -11.497907638549805, "global_step": 235963, "epoch": 1404} {"train_loss": -11.993231773376465, "global_step": 235964, "epoch": 1404} {"train_loss": -10.871971130371094, "global_step": 235965, "epoch": 1404} {"train_loss": -10.42713737487793, "global_step": 235966, "epoch": 1404} {"train_loss": -9.996919631958008, "global_step": 235967, "epoch": 1404} {"train_loss": -11.701370239257812, "global_step": 235968, "epoch": 1404} {"train_loss": -11.043895721435547, "global_step": 235969, "epoch": 1404} {"train_loss": -9.996648788452148, "global_step": 235970, "epoch": 1404} {"train_loss": -9.441779136657715, "global_step": 235971, "epoch": 1404} {"train_loss": -10.322559356689453, "global_step": 235972, "epoch": 1404} {"train_loss": -9.680632591247559, "global_step": 235973, "epoch": 1404} {"train_loss": -10.70419979095459, "global_step": 235974, "epoch": 1404} {"train_loss": -10.5825834274292, "global_step": 235975, "epoch": 1404} {"train_loss": -10.715319633483887, "global_step": 235976, "epoch": 1404} {"train_loss": -10.444724082946777, "global_step": 235977, "epoch": 1404} {"train_loss": -10.096002578735352, "global_step": 235978, "epoch": 1404} {"train_loss": -10.170438766479492, "global_step": 235979, "epoch": 1404} {"train_loss": -11.46091079711914, "global_step": 235980, "epoch": 1404} {"train_loss": -9.796613693237305, "global_step": 235981, "epoch": 1404} {"train_loss": -10.89741325378418, "global_step": 235982, "epoch": 1404} {"train_loss": -9.735937118530273, "global_step": 235983, "epoch": 1404} {"train_loss": -10.856261253356934, "global_step": 235984, "epoch": 1404} {"train_loss": -10.805509567260742, "global_step": 235985, "epoch": 1404} {"train_loss": -10.739620208740234, "global_step": 235986, "epoch": 1404} {"train_loss": -10.59977912902832, "global_step": 235987, "epoch": 1404} {"train_loss": -10.926629066467285, "global_step": 235988, "epoch": 1404} {"train_loss": -10.58907413482666, "global_step": 235989, "epoch": 1404} {"train_loss": -10.746075630187988, "global_step": 235990, "epoch": 1404} {"train_loss": -11.53392219543457, "global_step": 235991, "epoch": 1404} {"train_loss": -11.160652160644531, "global_step": 235992, "epoch": 1404} {"train_loss": -11.222013473510742, "global_step": 235993, "epoch": 1404} {"train_loss": -11.148406982421875, "global_step": 235994, "epoch": 1404} {"train_loss": -11.201079368591309, "global_step": 235995, "epoch": 1404} {"train_loss": -11.276039123535156, "global_step": 235996, "epoch": 1404} {"train_loss": -11.09111213684082, "global_step": 235997, "epoch": 1404} {"train_loss": -11.328685760498047, "global_step": 235998, "epoch": 1404} {"train_loss": -11.25979995727539, "global_step": 235999, "epoch": 1404} {"train_loss": -10.995157241821289, "global_step": 236000, "epoch": 1404} {"train_loss": -11.120769500732422, "global_step": 236001, "epoch": 1404} {"train_loss": -11.572919845581055, "global_step": 236002, "epoch": 1404} {"train_loss": -11.460983276367188, "global_step": 236003, "epoch": 1404} {"train_loss": -11.685375213623047, "global_step": 236004, "epoch": 1404} {"train_loss": -11.540216445922852, "global_step": 236005, "epoch": 1404} {"train_loss": -11.523455619812012, "global_step": 236006, "epoch": 1404} {"train_loss": -11.402957916259766, "global_step": 236007, "epoch": 1404} {"train_loss": -11.804546356201172, "global_step": 236008, "epoch": 1404} {"train_loss": -11.690839767456055, "global_step": 236009, "epoch": 1404} {"train_loss": -11.373303413391113, "global_step": 236010, "epoch": 1404} {"train_loss": -11.568517684936523, "global_step": 236011, "epoch": 1404} {"train_loss": -11.643014907836914, "global_step": 236012, "epoch": 1404} {"train_loss": -11.72785758972168, "global_step": 236013, "epoch": 1404} {"train_loss": -11.684494018554688, "global_step": 236014, "epoch": 1404} {"train_loss": -11.590420722961426, "global_step": 236015, "epoch": 1404} {"train_loss": -11.615507125854492, "global_step": 236016, "epoch": 1404} {"train_loss": -11.659093856811523, "global_step": 236017, "epoch": 1404} {"train_loss": -11.759166717529297, "global_step": 236018, "epoch": 1404} {"train_loss": -11.57131576538086, "global_step": 236019, "epoch": 1404} {"train_loss": -11.585464477539062, "global_step": 236020, "epoch": 1404} {"train_loss": -11.182804107666016, "global_step": 236021, "epoch": 1404} {"train_loss": -11.632181167602539, "global_step": 236022, "epoch": 1404} {"train_loss": -11.112591743469238, "global_step": 236023, "epoch": 1404} {"train_loss": -11.677408218383789, "global_step": 236024, "epoch": 1404} {"train_loss": -11.192516326904297, "global_step": 236025, "epoch": 1404} {"train_loss": -11.75190544128418, "global_step": 236026, "epoch": 1404} {"train_loss": -11.398601531982422, "global_step": 236027, "epoch": 1404} {"train_loss": -11.806087493896484, "global_step": 236028, "epoch": 1404} {"train_loss": -11.395339965820312, "global_step": 236029, "epoch": 1404} {"train_loss": -11.78156852722168, "global_step": 236030, "epoch": 1404} {"train_loss": -11.512214660644531, "global_step": 236031, "epoch": 1404} {"train_loss": -11.717472076416016, "global_step": 236032, "epoch": 1404} {"train_loss": -11.848587036132812, "global_step": 236033, "epoch": 1404} {"train_loss": -11.811338424682617, "global_step": 236034, "epoch": 1404} {"train_loss": -11.82650375366211, "global_step": 236035, "epoch": 1404} {"train_loss": -11.884641647338867, "global_step": 236036, "epoch": 1404} {"train_loss": -11.77432632446289, "global_step": 236037, "epoch": 1404} {"train_loss": -11.975494384765625, "global_step": 236038, "epoch": 1404} {"train_loss": -11.548008833612714, "global_step": 236039, "epoch": 1404, "val_loss": 266585.03125} {"train_loss": -11.971855163574219, "global_step": 236040, "epoch": 1405} {"train_loss": -11.780618667602539, "global_step": 236041, "epoch": 1405} {"train_loss": -11.920100212097168, "global_step": 236042, "epoch": 1405} {"train_loss": -11.858070373535156, "global_step": 236043, "epoch": 1405} {"train_loss": -11.871453285217285, "global_step": 236044, "epoch": 1405} {"train_loss": -11.609972953796387, "global_step": 236045, "epoch": 1405} {"train_loss": -12.032644271850586, "global_step": 236046, "epoch": 1405} {"train_loss": -11.863037109375, "global_step": 236047, "epoch": 1405} {"train_loss": -11.961334228515625, "global_step": 236048, "epoch": 1405} {"train_loss": -11.942394256591797, "global_step": 236049, "epoch": 1405} {"train_loss": -11.598194122314453, "global_step": 236050, "epoch": 1405} {"train_loss": -11.968009948730469, "global_step": 236051, "epoch": 1405} {"train_loss": -11.811717987060547, "global_step": 236052, "epoch": 1405} {"train_loss": -11.678269386291504, "global_step": 236053, "epoch": 1405} {"train_loss": -11.851492881774902, "global_step": 236054, "epoch": 1405} {"train_loss": -11.727764129638672, "global_step": 236055, "epoch": 1405} {"train_loss": -11.880985260009766, "global_step": 236056, "epoch": 1405} {"train_loss": -11.465255737304688, "global_step": 236057, "epoch": 1405} {"train_loss": -11.680549621582031, "global_step": 236058, "epoch": 1405} {"train_loss": -11.799932479858398, "global_step": 236059, "epoch": 1405} {"train_loss": -11.61619758605957, "global_step": 236060, "epoch": 1405} {"train_loss": -11.723118782043457, "global_step": 236061, "epoch": 1405} {"train_loss": -11.794347763061523, "global_step": 236062, "epoch": 1405} {"train_loss": -11.606039047241211, "global_step": 236063, "epoch": 1405} {"train_loss": -12.071361541748047, "global_step": 236064, "epoch": 1405} {"train_loss": -11.47739028930664, "global_step": 236065, "epoch": 1405} {"train_loss": -11.673734664916992, "global_step": 236066, "epoch": 1405} {"train_loss": -12.028268814086914, "global_step": 236067, "epoch": 1405} {"train_loss": -11.694917678833008, "global_step": 236068, "epoch": 1405} {"train_loss": -11.715303421020508, "global_step": 236069, "epoch": 1405} {"train_loss": -11.74105453491211, "global_step": 236070, "epoch": 1405} {"train_loss": -11.334705352783203, "global_step": 236071, "epoch": 1405} {"train_loss": -11.855742454528809, "global_step": 236072, "epoch": 1405} {"train_loss": -11.341949462890625, "global_step": 236073, "epoch": 1405} {"train_loss": -11.729904174804688, "global_step": 236074, "epoch": 1405} {"train_loss": -11.641725540161133, "global_step": 236075, "epoch": 1405} {"train_loss": -11.83006763458252, "global_step": 236076, "epoch": 1405} {"train_loss": -11.82689380645752, "global_step": 236077, "epoch": 1405} {"train_loss": -11.972931861877441, "global_step": 236078, "epoch": 1405} {"train_loss": -11.942134857177734, "global_step": 236079, "epoch": 1405} {"train_loss": -11.62449836730957, "global_step": 236080, "epoch": 1405} {"train_loss": -12.096342086791992, "global_step": 236081, "epoch": 1405} {"train_loss": -12.128791809082031, "global_step": 236082, "epoch": 1405} {"train_loss": -12.037883758544922, "global_step": 236083, "epoch": 1405} {"train_loss": -11.881892204284668, "global_step": 236084, "epoch": 1405} {"train_loss": -12.125579833984375, "global_step": 236085, "epoch": 1405} {"train_loss": -11.790241241455078, "global_step": 236086, "epoch": 1405} {"train_loss": -11.729887008666992, "global_step": 236087, "epoch": 1405} {"train_loss": -11.878565788269043, "global_step": 236088, "epoch": 1405} {"train_loss": -11.77149772644043, "global_step": 236089, "epoch": 1405} {"train_loss": -11.933158874511719, "global_step": 236090, "epoch": 1405} {"train_loss": -11.746374130249023, "global_step": 236091, "epoch": 1405} {"train_loss": -11.979862213134766, "global_step": 236092, "epoch": 1405} {"train_loss": -11.809076309204102, "global_step": 236093, "epoch": 1405} {"train_loss": -11.894359588623047, "global_step": 236094, "epoch": 1405} {"train_loss": -11.620525360107422, "global_step": 236095, "epoch": 1405} {"train_loss": -11.82305908203125, "global_step": 236096, "epoch": 1405} {"train_loss": -11.91111946105957, "global_step": 236097, "epoch": 1405} {"train_loss": -11.987371444702148, "global_step": 236098, "epoch": 1405} {"train_loss": -11.371235847473145, "global_step": 236099, "epoch": 1405} {"train_loss": -11.667217254638672, "global_step": 236100, "epoch": 1405} {"train_loss": -12.039420127868652, "global_step": 236101, "epoch": 1405} {"train_loss": -11.433805465698242, "global_step": 236102, "epoch": 1405} {"train_loss": -11.40223503112793, "global_step": 236103, "epoch": 1405} {"train_loss": -11.948221206665039, "global_step": 236104, "epoch": 1405} {"train_loss": -11.926130294799805, "global_step": 236105, "epoch": 1405} {"train_loss": -11.736319541931152, "global_step": 236106, "epoch": 1405} {"train_loss": -11.867244720458984, "global_step": 236107, "epoch": 1405} {"train_loss": -11.591947555541992, "global_step": 236108, "epoch": 1405} {"train_loss": -11.75589370727539, "global_step": 236109, "epoch": 1405} {"train_loss": -10.36907958984375, "global_step": 236110, "epoch": 1405} {"train_loss": -11.781264305114746, "global_step": 236111, "epoch": 1405} {"train_loss": -10.274685859680176, "global_step": 236112, "epoch": 1405} {"train_loss": -11.57655143737793, "global_step": 236113, "epoch": 1405} {"train_loss": -10.476964950561523, "global_step": 236114, "epoch": 1405} {"train_loss": -11.13302993774414, "global_step": 236115, "epoch": 1405} {"train_loss": -10.088580131530762, "global_step": 236116, "epoch": 1405} {"train_loss": -11.052037239074707, "global_step": 236117, "epoch": 1405} {"train_loss": -11.114835739135742, "global_step": 236118, "epoch": 1405} {"train_loss": -10.084207534790039, "global_step": 236119, "epoch": 1405} {"train_loss": -11.219355583190918, "global_step": 236120, "epoch": 1405} {"train_loss": -10.82083511352539, "global_step": 236121, "epoch": 1405} {"train_loss": -10.87385368347168, "global_step": 236122, "epoch": 1405} {"train_loss": -10.648483276367188, "global_step": 236123, "epoch": 1405} {"train_loss": -10.376750946044922, "global_step": 236124, "epoch": 1405} {"train_loss": -10.513406753540039, "global_step": 236125, "epoch": 1405} {"train_loss": -10.009614944458008, "global_step": 236126, "epoch": 1405} {"train_loss": -10.902525901794434, "global_step": 236127, "epoch": 1405} {"train_loss": -10.529318809509277, "global_step": 236128, "epoch": 1405} {"train_loss": -10.287735939025879, "global_step": 236129, "epoch": 1405} {"train_loss": -11.608161926269531, "global_step": 236130, "epoch": 1405} {"train_loss": -10.238382339477539, "global_step": 236131, "epoch": 1405} {"train_loss": -11.037249565124512, "global_step": 236132, "epoch": 1405} {"train_loss": -10.832276344299316, "global_step": 236133, "epoch": 1405} {"train_loss": -10.329292297363281, "global_step": 236134, "epoch": 1405} {"train_loss": -10.844623565673828, "global_step": 236135, "epoch": 1405} {"train_loss": -10.293182373046875, "global_step": 236136, "epoch": 1405} {"train_loss": -11.612759590148926, "global_step": 236137, "epoch": 1405} {"train_loss": -10.12491226196289, "global_step": 236138, "epoch": 1405} {"train_loss": -11.559288024902344, "global_step": 236139, "epoch": 1405} {"train_loss": -10.86953067779541, "global_step": 236140, "epoch": 1405} {"train_loss": -10.843133926391602, "global_step": 236141, "epoch": 1405} {"train_loss": -11.363729476928711, "global_step": 236142, "epoch": 1405} {"train_loss": -11.459157943725586, "global_step": 236143, "epoch": 1405} {"train_loss": -10.777458190917969, "global_step": 236144, "epoch": 1405} {"train_loss": -11.296847343444824, "global_step": 236145, "epoch": 1405} {"train_loss": -10.73336410522461, "global_step": 236146, "epoch": 1405} {"train_loss": -10.61337947845459, "global_step": 236147, "epoch": 1405} {"train_loss": -10.843360900878906, "global_step": 236148, "epoch": 1405} {"train_loss": -11.03143310546875, "global_step": 236149, "epoch": 1405} {"train_loss": -10.766021728515625, "global_step": 236150, "epoch": 1405} {"train_loss": -11.131243705749512, "global_step": 236151, "epoch": 1405} {"train_loss": -10.652917861938477, "global_step": 236152, "epoch": 1405} {"train_loss": -11.025055885314941, "global_step": 236153, "epoch": 1405} {"train_loss": -11.208849906921387, "global_step": 236154, "epoch": 1405} {"train_loss": -11.367461204528809, "global_step": 236155, "epoch": 1405} {"train_loss": -11.269441604614258, "global_step": 236156, "epoch": 1405} {"train_loss": -11.05255126953125, "global_step": 236157, "epoch": 1405} {"train_loss": -11.557697296142578, "global_step": 236158, "epoch": 1405} {"train_loss": -11.014019012451172, "global_step": 236159, "epoch": 1405} {"train_loss": -11.43218994140625, "global_step": 236160, "epoch": 1405} {"train_loss": -11.477121353149414, "global_step": 236161, "epoch": 1405} {"train_loss": -11.35425090789795, "global_step": 236162, "epoch": 1405} {"train_loss": -11.578542709350586, "global_step": 236163, "epoch": 1405} {"train_loss": -11.390129089355469, "global_step": 236164, "epoch": 1405} {"train_loss": -11.549373626708984, "global_step": 236165, "epoch": 1405} {"train_loss": -11.544628143310547, "global_step": 236166, "epoch": 1405} {"train_loss": -11.553165435791016, "global_step": 236167, "epoch": 1405} {"train_loss": -11.314720153808594, "global_step": 236168, "epoch": 1405} {"train_loss": -11.724250793457031, "global_step": 236169, "epoch": 1405} {"train_loss": -11.555374145507812, "global_step": 236170, "epoch": 1405} {"train_loss": -11.90626335144043, "global_step": 236171, "epoch": 1405} {"train_loss": -11.76807975769043, "global_step": 236172, "epoch": 1405} {"train_loss": -11.739084243774414, "global_step": 236173, "epoch": 1405} {"train_loss": -11.514423370361328, "global_step": 236174, "epoch": 1405} {"train_loss": -11.725627899169922, "global_step": 236175, "epoch": 1405} {"train_loss": -11.706311225891113, "global_step": 236176, "epoch": 1405} {"train_loss": -11.554133415222168, "global_step": 236177, "epoch": 1405} {"train_loss": -11.849940299987793, "global_step": 236178, "epoch": 1405} {"train_loss": -11.847018241882324, "global_step": 236179, "epoch": 1405} {"train_loss": -11.854775428771973, "global_step": 236180, "epoch": 1405} {"train_loss": -11.856473922729492, "global_step": 236181, "epoch": 1405} {"train_loss": -11.781923294067383, "global_step": 236182, "epoch": 1405} {"train_loss": -11.879300117492676, "global_step": 236183, "epoch": 1405} {"train_loss": -11.679520606994629, "global_step": 236184, "epoch": 1405} {"train_loss": -11.810516357421875, "global_step": 236185, "epoch": 1405} {"train_loss": -11.862333297729492, "global_step": 236186, "epoch": 1405} {"train_loss": -11.865358352661133, "global_step": 236187, "epoch": 1405} {"train_loss": -11.910614013671875, "global_step": 236188, "epoch": 1405} {"train_loss": -11.900009155273438, "global_step": 236189, "epoch": 1405} {"train_loss": -11.951969146728516, "global_step": 236190, "epoch": 1405} {"train_loss": -12.004100799560547, "global_step": 236191, "epoch": 1405} {"train_loss": -11.867393493652344, "global_step": 236192, "epoch": 1405} {"train_loss": -12.05646800994873, "global_step": 236193, "epoch": 1405} {"train_loss": -12.040483474731445, "global_step": 236194, "epoch": 1405} {"train_loss": -11.931391716003418, "global_step": 236195, "epoch": 1405} {"train_loss": -12.135311126708984, "global_step": 236196, "epoch": 1405} {"train_loss": -11.78645133972168, "global_step": 236197, "epoch": 1405} {"train_loss": -12.029609680175781, "global_step": 236198, "epoch": 1405} {"train_loss": -11.927583694458008, "global_step": 236199, "epoch": 1405} {"train_loss": -11.928348541259766, "global_step": 236200, "epoch": 1405} {"train_loss": -12.016554832458496, "global_step": 236201, "epoch": 1405} {"train_loss": -12.019176483154297, "global_step": 236202, "epoch": 1405} {"train_loss": -11.938697814941406, "global_step": 236203, "epoch": 1405} {"train_loss": -12.067785263061523, "global_step": 236204, "epoch": 1405} {"train_loss": -12.045089721679688, "global_step": 236205, "epoch": 1405} {"train_loss": -11.784636497497559, "global_step": 236206, "epoch": 1405} {"train_loss": -11.518790574300857, "global_step": 236207, "epoch": 1405, "val_loss": 261643.359375, "train_action_mse_error": 1.6699854135513306} {"train_loss": -12.231635093688965, "global_step": 236208, "epoch": 1406} {"train_loss": -11.780184745788574, "global_step": 236209, "epoch": 1406} {"train_loss": -12.10978889465332, "global_step": 236210, "epoch": 1406} {"train_loss": -12.119680404663086, "global_step": 236211, "epoch": 1406} {"train_loss": -11.953397750854492, "global_step": 236212, "epoch": 1406} {"train_loss": -11.941328048706055, "global_step": 236213, "epoch": 1406} {"train_loss": -12.169865608215332, "global_step": 236214, "epoch": 1406} {"train_loss": -11.748462677001953, "global_step": 236215, "epoch": 1406} {"train_loss": -11.838518142700195, "global_step": 236216, "epoch": 1406} {"train_loss": -11.100873947143555, "global_step": 236217, "epoch": 1406} {"train_loss": -10.886489868164062, "global_step": 236218, "epoch": 1406} {"train_loss": -10.433538436889648, "global_step": 236219, "epoch": 1406} {"train_loss": -11.814574241638184, "global_step": 236220, "epoch": 1406} {"train_loss": -10.394340515136719, "global_step": 236221, "epoch": 1406} {"train_loss": -11.652741432189941, "global_step": 236222, "epoch": 1406} {"train_loss": -11.27484130859375, "global_step": 236223, "epoch": 1406} {"train_loss": -10.865479469299316, "global_step": 236224, "epoch": 1406} {"train_loss": -9.763408660888672, "global_step": 236225, "epoch": 1406} {"train_loss": -8.81190013885498, "global_step": 236226, "epoch": 1406} {"train_loss": -11.021078109741211, "global_step": 236227, "epoch": 1406} {"train_loss": -9.323612213134766, "global_step": 236228, "epoch": 1406} {"train_loss": -8.238005638122559, "global_step": 236229, "epoch": 1406} {"train_loss": -10.458040237426758, "global_step": 236230, "epoch": 1406} {"train_loss": -9.735090255737305, "global_step": 236231, "epoch": 1406} {"train_loss": -9.39797592163086, "global_step": 236232, "epoch": 1406} {"train_loss": -9.981544494628906, "global_step": 236233, "epoch": 1406} {"train_loss": -10.395936965942383, "global_step": 236234, "epoch": 1406} {"train_loss": -9.905627250671387, "global_step": 236235, "epoch": 1406} {"train_loss": -11.16757583618164, "global_step": 236236, "epoch": 1406} {"train_loss": -10.350837707519531, "global_step": 236237, "epoch": 1406} {"train_loss": -10.573148727416992, "global_step": 236238, "epoch": 1406} {"train_loss": -10.570158004760742, "global_step": 236239, "epoch": 1406} {"train_loss": -10.068788528442383, "global_step": 236240, "epoch": 1406} {"train_loss": -10.79649543762207, "global_step": 236241, "epoch": 1406} {"train_loss": -10.911277770996094, "global_step": 236242, "epoch": 1406} {"train_loss": -10.609055519104004, "global_step": 236243, "epoch": 1406} {"train_loss": -11.20311450958252, "global_step": 236244, "epoch": 1406} {"train_loss": -10.628804206848145, "global_step": 236245, "epoch": 1406} {"train_loss": -9.91819953918457, "global_step": 236246, "epoch": 1406} {"train_loss": -11.128636360168457, "global_step": 236247, "epoch": 1406} {"train_loss": -11.23103141784668, "global_step": 236248, "epoch": 1406} {"train_loss": -10.676933288574219, "global_step": 236249, "epoch": 1406} {"train_loss": -11.285037994384766, "global_step": 236250, "epoch": 1406} {"train_loss": -11.03462028503418, "global_step": 236251, "epoch": 1406} {"train_loss": -11.003151893615723, "global_step": 236252, "epoch": 1406} {"train_loss": -11.035871505737305, "global_step": 236253, "epoch": 1406} {"train_loss": -10.860379219055176, "global_step": 236254, "epoch": 1406} {"train_loss": -10.891297340393066, "global_step": 236255, "epoch": 1406} {"train_loss": -11.251197814941406, "global_step": 236256, "epoch": 1406} {"train_loss": -10.50823974609375, "global_step": 236257, "epoch": 1406} {"train_loss": -11.421337127685547, "global_step": 236258, "epoch": 1406} {"train_loss": -11.173463821411133, "global_step": 236259, "epoch": 1406} {"train_loss": -11.201833724975586, "global_step": 236260, "epoch": 1406} {"train_loss": -11.456294059753418, "global_step": 236261, "epoch": 1406} {"train_loss": -10.958635330200195, "global_step": 236262, "epoch": 1406} {"train_loss": -11.431680679321289, "global_step": 236263, "epoch": 1406} {"train_loss": -11.427417755126953, "global_step": 236264, "epoch": 1406} {"train_loss": -11.547979354858398, "global_step": 236265, "epoch": 1406} {"train_loss": -11.34323787689209, "global_step": 236266, "epoch": 1406} {"train_loss": -11.46893310546875, "global_step": 236267, "epoch": 1406} {"train_loss": -11.160149574279785, "global_step": 236268, "epoch": 1406} {"train_loss": -11.627010345458984, "global_step": 236269, "epoch": 1406} {"train_loss": -11.591500282287598, "global_step": 236270, "epoch": 1406} {"train_loss": -11.609514236450195, "global_step": 236271, "epoch": 1406} {"train_loss": -11.731618881225586, "global_step": 236272, "epoch": 1406} {"train_loss": -11.833515167236328, "global_step": 236273, "epoch": 1406} {"train_loss": -11.473434448242188, "global_step": 236274, "epoch": 1406} {"train_loss": -11.750509262084961, "global_step": 236275, "epoch": 1406} {"train_loss": -11.50887680053711, "global_step": 236276, "epoch": 1406} {"train_loss": -11.709449768066406, "global_step": 236277, "epoch": 1406} {"train_loss": -11.726420402526855, "global_step": 236278, "epoch": 1406} {"train_loss": -11.700458526611328, "global_step": 236279, "epoch": 1406} {"train_loss": -11.632696151733398, "global_step": 236280, "epoch": 1406} {"train_loss": -11.722994804382324, "global_step": 236281, "epoch": 1406} {"train_loss": -11.266934394836426, "global_step": 236282, "epoch": 1406} {"train_loss": -11.955305099487305, "global_step": 236283, "epoch": 1406} {"train_loss": -11.768243789672852, "global_step": 236284, "epoch": 1406} {"train_loss": -11.65379524230957, "global_step": 236285, "epoch": 1406} {"train_loss": -11.674341201782227, "global_step": 236286, "epoch": 1406} {"train_loss": -11.703475952148438, "global_step": 236287, "epoch": 1406} {"train_loss": -11.797357559204102, "global_step": 236288, "epoch": 1406} {"train_loss": -11.979304313659668, "global_step": 236289, "epoch": 1406} {"train_loss": -11.76357650756836, "global_step": 236290, "epoch": 1406} {"train_loss": -11.848212242126465, "global_step": 236291, "epoch": 1406} {"train_loss": -11.743117332458496, "global_step": 236292, "epoch": 1406} {"train_loss": -11.892691612243652, "global_step": 236293, "epoch": 1406} {"train_loss": -11.759016036987305, "global_step": 236294, "epoch": 1406} {"train_loss": -11.955928802490234, "global_step": 236295, "epoch": 1406} {"train_loss": -11.817850112915039, "global_step": 236296, "epoch": 1406} {"train_loss": -12.101290702819824, "global_step": 236297, "epoch": 1406} {"train_loss": -11.942554473876953, "global_step": 236298, "epoch": 1406} {"train_loss": -12.081245422363281, "global_step": 236299, "epoch": 1406} {"train_loss": -11.897814750671387, "global_step": 236300, "epoch": 1406} {"train_loss": -12.002439498901367, "global_step": 236301, "epoch": 1406} {"train_loss": -11.621262550354004, "global_step": 236302, "epoch": 1406} {"train_loss": -11.823633193969727, "global_step": 236303, "epoch": 1406} {"train_loss": -11.889373779296875, "global_step": 236304, "epoch": 1406} {"train_loss": -11.975918769836426, "global_step": 236305, "epoch": 1406} {"train_loss": -11.887372970581055, "global_step": 236306, "epoch": 1406} {"train_loss": -11.961555480957031, "global_step": 236307, "epoch": 1406} {"train_loss": -11.967864036560059, "global_step": 236308, "epoch": 1406} {"train_loss": -11.705829620361328, "global_step": 236309, "epoch": 1406} {"train_loss": -11.855582237243652, "global_step": 236310, "epoch": 1406} {"train_loss": -11.897851943969727, "global_step": 236311, "epoch": 1406} {"train_loss": -11.664750099182129, "global_step": 236312, "epoch": 1406} {"train_loss": -12.000728607177734, "global_step": 236313, "epoch": 1406} {"train_loss": -11.945853233337402, "global_step": 236314, "epoch": 1406} {"train_loss": -12.000865936279297, "global_step": 236315, "epoch": 1406} {"train_loss": -12.017330169677734, "global_step": 236316, "epoch": 1406} {"train_loss": -11.275843620300293, "global_step": 236317, "epoch": 1406} {"train_loss": -11.655805587768555, "global_step": 236318, "epoch": 1406} {"train_loss": -11.602499008178711, "global_step": 236319, "epoch": 1406} {"train_loss": -11.869983673095703, "global_step": 236320, "epoch": 1406} {"train_loss": -11.382515907287598, "global_step": 236321, "epoch": 1406} {"train_loss": -10.885978698730469, "global_step": 236322, "epoch": 1406} {"train_loss": -12.004301071166992, "global_step": 236323, "epoch": 1406} {"train_loss": -11.032215118408203, "global_step": 236324, "epoch": 1406} {"train_loss": -11.74081039428711, "global_step": 236325, "epoch": 1406} {"train_loss": -11.54277515411377, "global_step": 236326, "epoch": 1406} {"train_loss": -11.362237930297852, "global_step": 236327, "epoch": 1406} {"train_loss": -10.408366203308105, "global_step": 236328, "epoch": 1406} {"train_loss": -11.463325500488281, "global_step": 236329, "epoch": 1406} {"train_loss": -10.96611213684082, "global_step": 236330, "epoch": 1406} {"train_loss": -8.744964599609375, "global_step": 236331, "epoch": 1406} {"train_loss": -9.008932113647461, "global_step": 236332, "epoch": 1406} {"train_loss": -9.714494705200195, "global_step": 236333, "epoch": 1406} {"train_loss": -10.702560424804688, "global_step": 236334, "epoch": 1406} {"train_loss": -10.67441177368164, "global_step": 236335, "epoch": 1406} {"train_loss": -9.706073760986328, "global_step": 236336, "epoch": 1406} {"train_loss": -11.167205810546875, "global_step": 236337, "epoch": 1406} {"train_loss": -10.795948028564453, "global_step": 236338, "epoch": 1406} {"train_loss": -11.453512191772461, "global_step": 236339, "epoch": 1406} {"train_loss": -10.972587585449219, "global_step": 236340, "epoch": 1406} {"train_loss": -10.264789581298828, "global_step": 236341, "epoch": 1406} {"train_loss": -11.739974975585938, "global_step": 236342, "epoch": 1406} {"train_loss": -10.76637077331543, "global_step": 236343, "epoch": 1406} {"train_loss": -10.987784385681152, "global_step": 236344, "epoch": 1406} {"train_loss": -11.323616027832031, "global_step": 236345, "epoch": 1406} {"train_loss": -11.289007186889648, "global_step": 236346, "epoch": 1406} {"train_loss": -11.308451652526855, "global_step": 236347, "epoch": 1406} {"train_loss": -11.509211540222168, "global_step": 236348, "epoch": 1406} {"train_loss": -11.5565767288208, "global_step": 236349, "epoch": 1406} {"train_loss": -11.501425743103027, "global_step": 236350, "epoch": 1406} {"train_loss": -11.271986961364746, "global_step": 236351, "epoch": 1406} {"train_loss": -11.72768783569336, "global_step": 236352, "epoch": 1406} {"train_loss": -11.47878360748291, "global_step": 236353, "epoch": 1406} {"train_loss": -11.579681396484375, "global_step": 236354, "epoch": 1406} {"train_loss": -11.74150276184082, "global_step": 236355, "epoch": 1406} {"train_loss": -11.580013275146484, "global_step": 236356, "epoch": 1406} {"train_loss": -11.806476593017578, "global_step": 236357, "epoch": 1406} {"train_loss": -11.409467697143555, "global_step": 236358, "epoch": 1406} {"train_loss": -11.55310344696045, "global_step": 236359, "epoch": 1406} {"train_loss": -11.627669334411621, "global_step": 236360, "epoch": 1406} {"train_loss": -11.745655059814453, "global_step": 236361, "epoch": 1406} {"train_loss": -11.81817626953125, "global_step": 236362, "epoch": 1406} {"train_loss": -11.752413749694824, "global_step": 236363, "epoch": 1406} {"train_loss": -11.524712562561035, "global_step": 236364, "epoch": 1406} {"train_loss": -11.509504318237305, "global_step": 236365, "epoch": 1406} {"train_loss": -11.749527931213379, "global_step": 236366, "epoch": 1406} {"train_loss": -11.659560203552246, "global_step": 236367, "epoch": 1406} {"train_loss": -11.522851943969727, "global_step": 236368, "epoch": 1406} {"train_loss": -11.751188278198242, "global_step": 236369, "epoch": 1406} {"train_loss": -11.636480331420898, "global_step": 236370, "epoch": 1406} {"train_loss": -11.690263748168945, "global_step": 236371, "epoch": 1406} {"train_loss": -11.488587379455566, "global_step": 236372, "epoch": 1406} {"train_loss": -11.611593246459961, "global_step": 236373, "epoch": 1406} {"train_loss": -11.790313720703125, "global_step": 236374, "epoch": 1406} {"train_loss": -11.293418276877631, "global_step": 236375, "epoch": 1406, "val_loss": 259046.1875} {"train_loss": -11.74968433380127, "global_step": 236376, "epoch": 1407} {"train_loss": -11.541099548339844, "global_step": 236377, "epoch": 1407} {"train_loss": -11.581461906433105, "global_step": 236378, "epoch": 1407} {"train_loss": -11.186949729919434, "global_step": 236379, "epoch": 1407} {"train_loss": -11.818731307983398, "global_step": 236380, "epoch": 1407} {"train_loss": -11.411149024963379, "global_step": 236381, "epoch": 1407} {"train_loss": -11.605405807495117, "global_step": 236382, "epoch": 1407} {"train_loss": -11.628013610839844, "global_step": 236383, "epoch": 1407} {"train_loss": -11.716361999511719, "global_step": 236384, "epoch": 1407} {"train_loss": -11.030241012573242, "global_step": 236385, "epoch": 1407} {"train_loss": -11.480231285095215, "global_step": 236386, "epoch": 1407} {"train_loss": -11.497323036193848, "global_step": 236387, "epoch": 1407} {"train_loss": -11.548477172851562, "global_step": 236388, "epoch": 1407} {"train_loss": -11.925106048583984, "global_step": 236389, "epoch": 1407} {"train_loss": -11.548309326171875, "global_step": 236390, "epoch": 1407} {"train_loss": -11.469657897949219, "global_step": 236391, "epoch": 1407} {"train_loss": -11.488487243652344, "global_step": 236392, "epoch": 1407} {"train_loss": -11.642599105834961, "global_step": 236393, "epoch": 1407} {"train_loss": -11.37472915649414, "global_step": 236394, "epoch": 1407} {"train_loss": -11.217771530151367, "global_step": 236395, "epoch": 1407} {"train_loss": -11.347692489624023, "global_step": 236396, "epoch": 1407} {"train_loss": -11.439070701599121, "global_step": 236397, "epoch": 1407} {"train_loss": -11.76952075958252, "global_step": 236398, "epoch": 1407} {"train_loss": -11.702235221862793, "global_step": 236399, "epoch": 1407} {"train_loss": -11.800400733947754, "global_step": 236400, "epoch": 1407} {"train_loss": -11.647293090820312, "global_step": 236401, "epoch": 1407} {"train_loss": -11.84228801727295, "global_step": 236402, "epoch": 1407} {"train_loss": -11.27361011505127, "global_step": 236403, "epoch": 1407} {"train_loss": -11.961124420166016, "global_step": 236404, "epoch": 1407} {"train_loss": -11.860142707824707, "global_step": 236405, "epoch": 1407} {"train_loss": -11.86636734008789, "global_step": 236406, "epoch": 1407} {"train_loss": -11.833664894104004, "global_step": 236407, "epoch": 1407} {"train_loss": -11.849813461303711, "global_step": 236408, "epoch": 1407} {"train_loss": -12.029874801635742, "global_step": 236409, "epoch": 1407} {"train_loss": -11.897369384765625, "global_step": 236410, "epoch": 1407} {"train_loss": -11.958358764648438, "global_step": 236411, "epoch": 1407} {"train_loss": -11.754250526428223, "global_step": 236412, "epoch": 1407} {"train_loss": -11.95334243774414, "global_step": 236413, "epoch": 1407} {"train_loss": -11.85010814666748, "global_step": 236414, "epoch": 1407} {"train_loss": -12.121182441711426, "global_step": 236415, "epoch": 1407} {"train_loss": -12.028067588806152, "global_step": 236416, "epoch": 1407} {"train_loss": -11.908126831054688, "global_step": 236417, "epoch": 1407} {"train_loss": -12.146076202392578, "global_step": 236418, "epoch": 1407} {"train_loss": -11.887216567993164, "global_step": 236419, "epoch": 1407} {"train_loss": -11.942081451416016, "global_step": 236420, "epoch": 1407} {"train_loss": -12.101269721984863, "global_step": 236421, "epoch": 1407} {"train_loss": -11.941688537597656, "global_step": 236422, "epoch": 1407} {"train_loss": -11.71080207824707, "global_step": 236423, "epoch": 1407} {"train_loss": -11.9420166015625, "global_step": 236424, "epoch": 1407} {"train_loss": -11.743762969970703, "global_step": 236425, "epoch": 1407} {"train_loss": -11.50505542755127, "global_step": 236426, "epoch": 1407} {"train_loss": -11.51418685913086, "global_step": 236427, "epoch": 1407} {"train_loss": -11.691690444946289, "global_step": 236428, "epoch": 1407} {"train_loss": -11.392833709716797, "global_step": 236429, "epoch": 1407} {"train_loss": -11.163818359375, "global_step": 236430, "epoch": 1407} {"train_loss": -11.671468734741211, "global_step": 236431, "epoch": 1407} {"train_loss": -11.196853637695312, "global_step": 236432, "epoch": 1407} {"train_loss": -12.090575218200684, "global_step": 236433, "epoch": 1407} {"train_loss": -11.601139068603516, "global_step": 236434, "epoch": 1407} {"train_loss": -11.766860961914062, "global_step": 236435, "epoch": 1407} {"train_loss": -11.695584297180176, "global_step": 236436, "epoch": 1407} {"train_loss": -12.029645919799805, "global_step": 236437, "epoch": 1407} {"train_loss": -11.923519134521484, "global_step": 236438, "epoch": 1407} {"train_loss": -11.62935733795166, "global_step": 236439, "epoch": 1407} {"train_loss": -11.872302055358887, "global_step": 236440, "epoch": 1407} {"train_loss": -11.467949867248535, "global_step": 236441, "epoch": 1407} {"train_loss": -11.927427291870117, "global_step": 236442, "epoch": 1407} {"train_loss": -11.408626556396484, "global_step": 236443, "epoch": 1407} {"train_loss": -11.437749862670898, "global_step": 236444, "epoch": 1407} {"train_loss": -10.301194190979004, "global_step": 236445, "epoch": 1407} {"train_loss": -10.592287063598633, "global_step": 236446, "epoch": 1407} {"train_loss": -11.56245231628418, "global_step": 236447, "epoch": 1407} {"train_loss": -11.621915817260742, "global_step": 236448, "epoch": 1407} {"train_loss": -10.827107429504395, "global_step": 236449, "epoch": 1407} {"train_loss": -11.479551315307617, "global_step": 236450, "epoch": 1407} {"train_loss": -11.81145191192627, "global_step": 236451, "epoch": 1407} {"train_loss": -10.961671829223633, "global_step": 236452, "epoch": 1407} {"train_loss": -10.474821090698242, "global_step": 236453, "epoch": 1407} {"train_loss": -11.506081581115723, "global_step": 236454, "epoch": 1407} {"train_loss": -9.87253475189209, "global_step": 236455, "epoch": 1407} {"train_loss": -11.282414436340332, "global_step": 236456, "epoch": 1407} {"train_loss": -9.07905101776123, "global_step": 236457, "epoch": 1407} {"train_loss": -10.98404598236084, "global_step": 236458, "epoch": 1407} {"train_loss": -11.175433158874512, "global_step": 236459, "epoch": 1407} {"train_loss": -10.433807373046875, "global_step": 236460, "epoch": 1407} {"train_loss": -11.15646743774414, "global_step": 236461, "epoch": 1407} {"train_loss": -9.90269947052002, "global_step": 236462, "epoch": 1407} {"train_loss": -10.873065948486328, "global_step": 236463, "epoch": 1407} {"train_loss": -10.120293617248535, "global_step": 236464, "epoch": 1407} {"train_loss": -10.625965118408203, "global_step": 236465, "epoch": 1407} {"train_loss": -11.354754447937012, "global_step": 236466, "epoch": 1407} {"train_loss": -10.741714477539062, "global_step": 236467, "epoch": 1407} {"train_loss": -11.683744430541992, "global_step": 236468, "epoch": 1407} {"train_loss": -10.882980346679688, "global_step": 236469, "epoch": 1407} {"train_loss": -11.35149097442627, "global_step": 236470, "epoch": 1407} {"train_loss": -11.299970626831055, "global_step": 236471, "epoch": 1407} {"train_loss": -11.420354843139648, "global_step": 236472, "epoch": 1407} {"train_loss": -11.295818328857422, "global_step": 236473, "epoch": 1407} {"train_loss": -11.381464958190918, "global_step": 236474, "epoch": 1407} {"train_loss": -11.449920654296875, "global_step": 236475, "epoch": 1407} {"train_loss": -11.363059997558594, "global_step": 236476, "epoch": 1407} {"train_loss": -11.555779457092285, "global_step": 236477, "epoch": 1407} {"train_loss": -11.438197135925293, "global_step": 236478, "epoch": 1407} {"train_loss": -11.086804389953613, "global_step": 236479, "epoch": 1407} {"train_loss": -11.188213348388672, "global_step": 236480, "epoch": 1407} {"train_loss": -11.418771743774414, "global_step": 236481, "epoch": 1407} {"train_loss": -10.660574913024902, "global_step": 236482, "epoch": 1407} {"train_loss": -11.276169776916504, "global_step": 236483, "epoch": 1407} {"train_loss": -11.041614532470703, "global_step": 236484, "epoch": 1407} {"train_loss": -10.83327865600586, "global_step": 236485, "epoch": 1407} {"train_loss": -11.02650260925293, "global_step": 236486, "epoch": 1407} {"train_loss": -11.05944538116455, "global_step": 236487, "epoch": 1407} {"train_loss": -11.037922859191895, "global_step": 236488, "epoch": 1407} {"train_loss": -10.914661407470703, "global_step": 236489, "epoch": 1407} {"train_loss": -11.719958305358887, "global_step": 236490, "epoch": 1407} {"train_loss": -11.231515884399414, "global_step": 236491, "epoch": 1407} {"train_loss": -11.364181518554688, "global_step": 236492, "epoch": 1407} {"train_loss": -11.26693344116211, "global_step": 236493, "epoch": 1407} {"train_loss": -11.468437194824219, "global_step": 236494, "epoch": 1407} {"train_loss": -11.284025192260742, "global_step": 236495, "epoch": 1407} {"train_loss": -11.539003372192383, "global_step": 236496, "epoch": 1407} {"train_loss": -11.514752388000488, "global_step": 236497, "epoch": 1407} {"train_loss": -11.8546781539917, "global_step": 236498, "epoch": 1407} {"train_loss": -11.471084594726562, "global_step": 236499, "epoch": 1407} {"train_loss": -11.776111602783203, "global_step": 236500, "epoch": 1407} {"train_loss": -11.419855117797852, "global_step": 236501, "epoch": 1407} {"train_loss": -11.883044242858887, "global_step": 236502, "epoch": 1407} {"train_loss": -11.537025451660156, "global_step": 236503, "epoch": 1407} {"train_loss": -11.83728313446045, "global_step": 236504, "epoch": 1407} {"train_loss": -11.682770729064941, "global_step": 236505, "epoch": 1407} {"train_loss": -11.912077903747559, "global_step": 236506, "epoch": 1407} {"train_loss": -11.88379192352295, "global_step": 236507, "epoch": 1407} {"train_loss": -11.8560791015625, "global_step": 236508, "epoch": 1407} {"train_loss": -11.796797752380371, "global_step": 236509, "epoch": 1407} {"train_loss": -11.795904159545898, "global_step": 236510, "epoch": 1407} {"train_loss": -11.729394912719727, "global_step": 236511, "epoch": 1407} {"train_loss": -11.69991683959961, "global_step": 236512, "epoch": 1407} {"train_loss": -11.85400676727295, "global_step": 236513, "epoch": 1407} {"train_loss": -11.760651588439941, "global_step": 236514, "epoch": 1407} {"train_loss": -11.897903442382812, "global_step": 236515, "epoch": 1407} {"train_loss": -11.845355987548828, "global_step": 236516, "epoch": 1407} {"train_loss": -11.696067810058594, "global_step": 236517, "epoch": 1407} {"train_loss": -11.734416961669922, "global_step": 236518, "epoch": 1407} {"train_loss": -11.80384635925293, "global_step": 236519, "epoch": 1407} {"train_loss": -11.842195510864258, "global_step": 236520, "epoch": 1407} {"train_loss": -11.644536972045898, "global_step": 236521, "epoch": 1407} {"train_loss": -11.82758903503418, "global_step": 236522, "epoch": 1407} {"train_loss": -11.624946594238281, "global_step": 236523, "epoch": 1407} {"train_loss": -11.90477466583252, "global_step": 236524, "epoch": 1407} {"train_loss": -11.784736633300781, "global_step": 236525, "epoch": 1407} {"train_loss": -11.74029541015625, "global_step": 236526, "epoch": 1407} {"train_loss": -11.852121353149414, "global_step": 236527, "epoch": 1407} {"train_loss": -11.796703338623047, "global_step": 236528, "epoch": 1407} {"train_loss": -11.776151657104492, "global_step": 236529, "epoch": 1407} {"train_loss": -11.592856407165527, "global_step": 236530, "epoch": 1407} {"train_loss": -11.911748886108398, "global_step": 236531, "epoch": 1407} {"train_loss": -11.650160789489746, "global_step": 236532, "epoch": 1407} {"train_loss": -12.014503479003906, "global_step": 236533, "epoch": 1407} {"train_loss": -11.97269058227539, "global_step": 236534, "epoch": 1407} {"train_loss": -11.584036827087402, "global_step": 236535, "epoch": 1407} {"train_loss": -11.73377513885498, "global_step": 236536, "epoch": 1407} {"train_loss": -11.989448547363281, "global_step": 236537, "epoch": 1407} {"train_loss": -11.465612411499023, "global_step": 236538, "epoch": 1407} {"train_loss": -11.68846321105957, "global_step": 236539, "epoch": 1407} {"train_loss": -11.475181579589844, "global_step": 236540, "epoch": 1407} {"train_loss": -12.060586929321289, "global_step": 236541, "epoch": 1407} {"train_loss": -11.89474105834961, "global_step": 236542, "epoch": 1407} {"train_loss": -11.515641547384716, "global_step": 236543, "epoch": 1407, "val_loss": 257398.25} {"train_loss": -11.84298038482666, "global_step": 236544, "epoch": 1408} {"train_loss": -11.744214057922363, "global_step": 236545, "epoch": 1408} {"train_loss": -11.862846374511719, "global_step": 236546, "epoch": 1408} {"train_loss": -11.892565727233887, "global_step": 236547, "epoch": 1408} {"train_loss": -11.761754989624023, "global_step": 236548, "epoch": 1408} {"train_loss": -11.959589958190918, "global_step": 236549, "epoch": 1408} {"train_loss": -11.455921173095703, "global_step": 236550, "epoch": 1408} {"train_loss": -11.697749137878418, "global_step": 236551, "epoch": 1408} {"train_loss": -12.09819221496582, "global_step": 236552, "epoch": 1408} {"train_loss": -11.962903022766113, "global_step": 236553, "epoch": 1408} {"train_loss": -11.868167877197266, "global_step": 236554, "epoch": 1408} {"train_loss": -11.515098571777344, "global_step": 236555, "epoch": 1408} {"train_loss": -11.836252212524414, "global_step": 236556, "epoch": 1408} {"train_loss": -12.024259567260742, "global_step": 236557, "epoch": 1408} {"train_loss": -11.90460205078125, "global_step": 236558, "epoch": 1408} {"train_loss": -11.67506217956543, "global_step": 236559, "epoch": 1408} {"train_loss": -12.041879653930664, "global_step": 236560, "epoch": 1408} {"train_loss": -11.50562572479248, "global_step": 236561, "epoch": 1408} {"train_loss": -11.027170181274414, "global_step": 236562, "epoch": 1408} {"train_loss": -11.90699577331543, "global_step": 236563, "epoch": 1408} {"train_loss": -11.55750560760498, "global_step": 236564, "epoch": 1408} {"train_loss": -11.827935218811035, "global_step": 236565, "epoch": 1408} {"train_loss": -10.94247817993164, "global_step": 236566, "epoch": 1408} {"train_loss": -11.00461196899414, "global_step": 236567, "epoch": 1408} {"train_loss": -11.847480773925781, "global_step": 236568, "epoch": 1408} {"train_loss": -10.61485767364502, "global_step": 236569, "epoch": 1408} {"train_loss": -11.009506225585938, "global_step": 236570, "epoch": 1408} {"train_loss": -11.753175735473633, "global_step": 236571, "epoch": 1408} {"train_loss": -10.832659721374512, "global_step": 236572, "epoch": 1408} {"train_loss": -11.894981384277344, "global_step": 236573, "epoch": 1408} {"train_loss": -11.174644470214844, "global_step": 236574, "epoch": 1408} {"train_loss": -10.957795143127441, "global_step": 236575, "epoch": 1408} {"train_loss": -11.461931228637695, "global_step": 236576, "epoch": 1408} {"train_loss": -11.074127197265625, "global_step": 236577, "epoch": 1408} {"train_loss": -11.50411319732666, "global_step": 236578, "epoch": 1408} {"train_loss": -11.05415153503418, "global_step": 236579, "epoch": 1408} {"train_loss": -11.388994216918945, "global_step": 236580, "epoch": 1408} {"train_loss": -11.151971817016602, "global_step": 236581, "epoch": 1408} {"train_loss": -11.172708511352539, "global_step": 236582, "epoch": 1408} {"train_loss": -11.563985824584961, "global_step": 236583, "epoch": 1408} {"train_loss": -10.836054801940918, "global_step": 236584, "epoch": 1408} {"train_loss": -11.810349464416504, "global_step": 236585, "epoch": 1408} {"train_loss": -11.289993286132812, "global_step": 236586, "epoch": 1408} {"train_loss": -11.35999870300293, "global_step": 236587, "epoch": 1408} {"train_loss": -11.548593521118164, "global_step": 236588, "epoch": 1408} {"train_loss": -11.434999465942383, "global_step": 236589, "epoch": 1408} {"train_loss": -11.546188354492188, "global_step": 236590, "epoch": 1408} {"train_loss": -11.308353424072266, "global_step": 236591, "epoch": 1408} {"train_loss": -11.656478881835938, "global_step": 236592, "epoch": 1408} {"train_loss": -11.585006713867188, "global_step": 236593, "epoch": 1408} {"train_loss": -11.682223320007324, "global_step": 236594, "epoch": 1408} {"train_loss": -11.623889923095703, "global_step": 236595, "epoch": 1408} {"train_loss": -11.748870849609375, "global_step": 236596, "epoch": 1408} {"train_loss": -11.90412712097168, "global_step": 236597, "epoch": 1408} {"train_loss": -11.718242645263672, "global_step": 236598, "epoch": 1408} {"train_loss": -11.669210433959961, "global_step": 236599, "epoch": 1408} {"train_loss": -11.425731658935547, "global_step": 236600, "epoch": 1408} {"train_loss": -11.813319206237793, "global_step": 236601, "epoch": 1408} {"train_loss": -11.732583999633789, "global_step": 236602, "epoch": 1408} {"train_loss": -11.7039794921875, "global_step": 236603, "epoch": 1408} {"train_loss": -11.87857437133789, "global_step": 236604, "epoch": 1408} {"train_loss": -11.743403434753418, "global_step": 236605, "epoch": 1408} {"train_loss": -11.656852722167969, "global_step": 236606, "epoch": 1408} {"train_loss": -11.716190338134766, "global_step": 236607, "epoch": 1408} {"train_loss": -11.685096740722656, "global_step": 236608, "epoch": 1408} {"train_loss": -11.735101699829102, "global_step": 236609, "epoch": 1408} {"train_loss": -11.896773338317871, "global_step": 236610, "epoch": 1408} {"train_loss": -11.838197708129883, "global_step": 236611, "epoch": 1408} {"train_loss": -11.631298065185547, "global_step": 236612, "epoch": 1408} {"train_loss": -12.071308135986328, "global_step": 236613, "epoch": 1408} {"train_loss": -11.669755935668945, "global_step": 236614, "epoch": 1408} {"train_loss": -11.72459602355957, "global_step": 236615, "epoch": 1408} {"train_loss": -12.031937599182129, "global_step": 236616, "epoch": 1408} {"train_loss": -11.799830436706543, "global_step": 236617, "epoch": 1408} {"train_loss": -11.736971855163574, "global_step": 236618, "epoch": 1408} {"train_loss": -12.15559196472168, "global_step": 236619, "epoch": 1408} {"train_loss": -11.840784072875977, "global_step": 236620, "epoch": 1408} {"train_loss": -11.648758888244629, "global_step": 236621, "epoch": 1408} {"train_loss": -11.836462020874023, "global_step": 236622, "epoch": 1408} {"train_loss": -12.01806354522705, "global_step": 236623, "epoch": 1408} {"train_loss": -11.828929901123047, "global_step": 236624, "epoch": 1408} {"train_loss": -11.915973663330078, "global_step": 236625, "epoch": 1408} {"train_loss": -12.020586967468262, "global_step": 236626, "epoch": 1408} {"train_loss": -11.426501274108887, "global_step": 236627, "epoch": 1408} {"train_loss": -11.95632266998291, "global_step": 236628, "epoch": 1408} {"train_loss": -12.147478103637695, "global_step": 236629, "epoch": 1408} {"train_loss": -11.939314842224121, "global_step": 236630, "epoch": 1408} {"train_loss": -11.935567855834961, "global_step": 236631, "epoch": 1408} {"train_loss": -12.036458015441895, "global_step": 236632, "epoch": 1408} {"train_loss": -11.880536079406738, "global_step": 236633, "epoch": 1408} {"train_loss": -12.191638946533203, "global_step": 236634, "epoch": 1408} {"train_loss": -11.784137725830078, "global_step": 236635, "epoch": 1408} {"train_loss": -11.972814559936523, "global_step": 236636, "epoch": 1408} {"train_loss": -11.878463745117188, "global_step": 236637, "epoch": 1408} {"train_loss": -11.723873138427734, "global_step": 236638, "epoch": 1408} {"train_loss": -11.699213027954102, "global_step": 236639, "epoch": 1408} {"train_loss": -11.847097396850586, "global_step": 236640, "epoch": 1408} {"train_loss": -11.692209243774414, "global_step": 236641, "epoch": 1408} {"train_loss": -11.424201965332031, "global_step": 236642, "epoch": 1408} {"train_loss": -11.302620887756348, "global_step": 236643, "epoch": 1408} {"train_loss": -11.19741153717041, "global_step": 236644, "epoch": 1408} {"train_loss": -12.187272071838379, "global_step": 236645, "epoch": 1408} {"train_loss": -11.992173194885254, "global_step": 236646, "epoch": 1408} {"train_loss": -11.587691307067871, "global_step": 236647, "epoch": 1408} {"train_loss": -11.215396881103516, "global_step": 236648, "epoch": 1408} {"train_loss": -11.756357192993164, "global_step": 236649, "epoch": 1408} {"train_loss": -11.8695707321167, "global_step": 236650, "epoch": 1408} {"train_loss": -11.177865982055664, "global_step": 236651, "epoch": 1408} {"train_loss": -10.92036247253418, "global_step": 236652, "epoch": 1408} {"train_loss": -11.083871841430664, "global_step": 236653, "epoch": 1408} {"train_loss": -11.911983489990234, "global_step": 236654, "epoch": 1408} {"train_loss": -11.791454315185547, "global_step": 236655, "epoch": 1408} {"train_loss": -12.219019889831543, "global_step": 236656, "epoch": 1408} {"train_loss": -11.41788387298584, "global_step": 236657, "epoch": 1408} {"train_loss": -11.890144348144531, "global_step": 236658, "epoch": 1408} {"train_loss": -11.737855911254883, "global_step": 236659, "epoch": 1408} {"train_loss": -11.791796684265137, "global_step": 236660, "epoch": 1408} {"train_loss": -11.673208236694336, "global_step": 236661, "epoch": 1408} {"train_loss": -11.420818328857422, "global_step": 236662, "epoch": 1408} {"train_loss": -11.506301879882812, "global_step": 236663, "epoch": 1408} {"train_loss": -11.525394439697266, "global_step": 236664, "epoch": 1408} {"train_loss": -10.953653335571289, "global_step": 236665, "epoch": 1408} {"train_loss": -11.376230239868164, "global_step": 236666, "epoch": 1408} {"train_loss": -11.542160034179688, "global_step": 236667, "epoch": 1408} {"train_loss": -10.488147735595703, "global_step": 236668, "epoch": 1408} {"train_loss": -9.768674850463867, "global_step": 236669, "epoch": 1408} {"train_loss": -10.63632869720459, "global_step": 236670, "epoch": 1408} {"train_loss": -9.040623664855957, "global_step": 236671, "epoch": 1408} {"train_loss": -8.711029052734375, "global_step": 236672, "epoch": 1408} {"train_loss": -10.625638008117676, "global_step": 236673, "epoch": 1408} {"train_loss": -8.610881805419922, "global_step": 236674, "epoch": 1408} {"train_loss": -8.649999618530273, "global_step": 236675, "epoch": 1408} {"train_loss": -10.234956741333008, "global_step": 236676, "epoch": 1408} {"train_loss": -8.037242889404297, "global_step": 236677, "epoch": 1408} {"train_loss": -8.327655792236328, "global_step": 236678, "epoch": 1408} {"train_loss": -8.582143783569336, "global_step": 236679, "epoch": 1408} {"train_loss": -10.313533782958984, "global_step": 236680, "epoch": 1408} {"train_loss": -8.604248046875, "global_step": 236681, "epoch": 1408} {"train_loss": -8.993746757507324, "global_step": 236682, "epoch": 1408} {"train_loss": -10.725296020507812, "global_step": 236683, "epoch": 1408} {"train_loss": -9.606186866760254, "global_step": 236684, "epoch": 1408} {"train_loss": -10.130498886108398, "global_step": 236685, "epoch": 1408} {"train_loss": -8.79089069366455, "global_step": 236686, "epoch": 1408} {"train_loss": -10.774431228637695, "global_step": 236687, "epoch": 1408} {"train_loss": -10.151723861694336, "global_step": 236688, "epoch": 1408} {"train_loss": -9.238981246948242, "global_step": 236689, "epoch": 1408} {"train_loss": -10.570378303527832, "global_step": 236690, "epoch": 1408} {"train_loss": -9.972155570983887, "global_step": 236691, "epoch": 1408} {"train_loss": -10.670768737792969, "global_step": 236692, "epoch": 1408} {"train_loss": -10.727970123291016, "global_step": 236693, "epoch": 1408} {"train_loss": -10.76559829711914, "global_step": 236694, "epoch": 1408} {"train_loss": -10.52810001373291, "global_step": 236695, "epoch": 1408} {"train_loss": -11.091382026672363, "global_step": 236696, "epoch": 1408} {"train_loss": -10.866402626037598, "global_step": 236697, "epoch": 1408} {"train_loss": -10.97091007232666, "global_step": 236698, "epoch": 1408} {"train_loss": -11.069613456726074, "global_step": 236699, "epoch": 1408} {"train_loss": -11.212268829345703, "global_step": 236700, "epoch": 1408} {"train_loss": -10.952140808105469, "global_step": 236701, "epoch": 1408} {"train_loss": -11.286796569824219, "global_step": 236702, "epoch": 1408} {"train_loss": -10.96328353881836, "global_step": 236703, "epoch": 1408} {"train_loss": -10.83661937713623, "global_step": 236704, "epoch": 1408} {"train_loss": -11.258527755737305, "global_step": 236705, "epoch": 1408} {"train_loss": -11.095480918884277, "global_step": 236706, "epoch": 1408} {"train_loss": -10.983722686767578, "global_step": 236707, "epoch": 1408} {"train_loss": -10.991769790649414, "global_step": 236708, "epoch": 1408} {"train_loss": -11.244390487670898, "global_step": 236709, "epoch": 1408} {"train_loss": -11.17985725402832, "global_step": 236710, "epoch": 1408} {"train_loss": -11.267976653008233, "global_step": 236711, "epoch": 1408, "val_loss": 252409.8125} {"train_loss": -11.409360885620117, "global_step": 236712, "epoch": 1409} {"train_loss": -11.354100227355957, "global_step": 236713, "epoch": 1409} {"train_loss": -11.365945816040039, "global_step": 236714, "epoch": 1409} {"train_loss": -11.332200050354004, "global_step": 236715, "epoch": 1409} {"train_loss": -11.44304084777832, "global_step": 236716, "epoch": 1409} {"train_loss": -11.166011810302734, "global_step": 236717, "epoch": 1409} {"train_loss": -11.469703674316406, "global_step": 236718, "epoch": 1409} {"train_loss": -11.519613265991211, "global_step": 236719, "epoch": 1409} {"train_loss": -11.463981628417969, "global_step": 236720, "epoch": 1409} {"train_loss": -11.363452911376953, "global_step": 236721, "epoch": 1409} {"train_loss": -11.594379425048828, "global_step": 236722, "epoch": 1409} {"train_loss": -11.625226974487305, "global_step": 236723, "epoch": 1409} {"train_loss": -11.415843963623047, "global_step": 236724, "epoch": 1409} {"train_loss": -11.52283763885498, "global_step": 236725, "epoch": 1409} {"train_loss": -11.549135208129883, "global_step": 236726, "epoch": 1409} {"train_loss": -11.379840850830078, "global_step": 236727, "epoch": 1409} {"train_loss": -11.711191177368164, "global_step": 236728, "epoch": 1409} {"train_loss": -11.508163452148438, "global_step": 236729, "epoch": 1409} {"train_loss": -11.592429161071777, "global_step": 236730, "epoch": 1409} {"train_loss": -11.72525405883789, "global_step": 236731, "epoch": 1409} {"train_loss": -11.759411811828613, "global_step": 236732, "epoch": 1409} {"train_loss": -11.597906112670898, "global_step": 236733, "epoch": 1409} {"train_loss": -11.608133316040039, "global_step": 236734, "epoch": 1409} {"train_loss": -11.720121383666992, "global_step": 236735, "epoch": 1409} {"train_loss": -11.595276832580566, "global_step": 236736, "epoch": 1409} {"train_loss": -11.59175968170166, "global_step": 236737, "epoch": 1409} {"train_loss": -11.860198974609375, "global_step": 236738, "epoch": 1409} {"train_loss": -11.612131118774414, "global_step": 236739, "epoch": 1409} {"train_loss": -11.708513259887695, "global_step": 236740, "epoch": 1409} {"train_loss": -11.655271530151367, "global_step": 236741, "epoch": 1409} {"train_loss": -11.621481895446777, "global_step": 236742, "epoch": 1409} {"train_loss": -11.555559158325195, "global_step": 236743, "epoch": 1409} {"train_loss": -11.87939167022705, "global_step": 236744, "epoch": 1409} {"train_loss": -11.762282371520996, "global_step": 236745, "epoch": 1409} {"train_loss": -11.74086856842041, "global_step": 236746, "epoch": 1409} {"train_loss": -11.783166885375977, "global_step": 236747, "epoch": 1409} {"train_loss": -11.8063325881958, "global_step": 236748, "epoch": 1409} {"train_loss": -11.991583824157715, "global_step": 236749, "epoch": 1409} {"train_loss": -11.891348838806152, "global_step": 236750, "epoch": 1409} {"train_loss": -11.869348526000977, "global_step": 236751, "epoch": 1409} {"train_loss": -11.86626148223877, "global_step": 236752, "epoch": 1409} {"train_loss": -11.922637939453125, "global_step": 236753, "epoch": 1409} {"train_loss": -11.871708869934082, "global_step": 236754, "epoch": 1409} {"train_loss": -11.72761344909668, "global_step": 236755, "epoch": 1409} {"train_loss": -11.849259376525879, "global_step": 236756, "epoch": 1409} {"train_loss": -11.92070484161377, "global_step": 236757, "epoch": 1409} {"train_loss": -12.051913261413574, "global_step": 236758, "epoch": 1409} {"train_loss": -11.837949752807617, "global_step": 236759, "epoch": 1409} {"train_loss": -11.930294036865234, "global_step": 236760, "epoch": 1409} {"train_loss": -11.786087036132812, "global_step": 236761, "epoch": 1409} {"train_loss": -11.679668426513672, "global_step": 236762, "epoch": 1409} {"train_loss": -12.141761779785156, "global_step": 236763, "epoch": 1409} {"train_loss": -11.839120864868164, "global_step": 236764, "epoch": 1409} {"train_loss": -11.767699241638184, "global_step": 236765, "epoch": 1409} {"train_loss": -11.645082473754883, "global_step": 236766, "epoch": 1409} {"train_loss": -11.5840425491333, "global_step": 236767, "epoch": 1409} {"train_loss": -11.726911544799805, "global_step": 236768, "epoch": 1409} {"train_loss": -11.843271255493164, "global_step": 236769, "epoch": 1409} {"train_loss": -11.248600006103516, "global_step": 236770, "epoch": 1409} {"train_loss": -11.641845703125, "global_step": 236771, "epoch": 1409} {"train_loss": -12.01331901550293, "global_step": 236772, "epoch": 1409} {"train_loss": -11.821076393127441, "global_step": 236773, "epoch": 1409} {"train_loss": -11.954000473022461, "global_step": 236774, "epoch": 1409} {"train_loss": -11.856115341186523, "global_step": 236775, "epoch": 1409} {"train_loss": -11.83661937713623, "global_step": 236776, "epoch": 1409} {"train_loss": -11.633110046386719, "global_step": 236777, "epoch": 1409} {"train_loss": -11.95775032043457, "global_step": 236778, "epoch": 1409} {"train_loss": -11.714340209960938, "global_step": 236779, "epoch": 1409} {"train_loss": -11.919503211975098, "global_step": 236780, "epoch": 1409} {"train_loss": -11.823959350585938, "global_step": 236781, "epoch": 1409} {"train_loss": -11.847857475280762, "global_step": 236782, "epoch": 1409} {"train_loss": -11.829938888549805, "global_step": 236783, "epoch": 1409} {"train_loss": -11.822547912597656, "global_step": 236784, "epoch": 1409} {"train_loss": -11.632019996643066, "global_step": 236785, "epoch": 1409} {"train_loss": -11.878744125366211, "global_step": 236786, "epoch": 1409} {"train_loss": -11.371203422546387, "global_step": 236787, "epoch": 1409} {"train_loss": -11.401836395263672, "global_step": 236788, "epoch": 1409} {"train_loss": -11.035358428955078, "global_step": 236789, "epoch": 1409} {"train_loss": -11.710841178894043, "global_step": 236790, "epoch": 1409} {"train_loss": -11.51950740814209, "global_step": 236791, "epoch": 1409} {"train_loss": -11.555281639099121, "global_step": 236792, "epoch": 1409} {"train_loss": -11.870414733886719, "global_step": 236793, "epoch": 1409} {"train_loss": -11.57894515991211, "global_step": 236794, "epoch": 1409} {"train_loss": -11.991171836853027, "global_step": 236795, "epoch": 1409} {"train_loss": -11.486101150512695, "global_step": 236796, "epoch": 1409} {"train_loss": -11.803092956542969, "global_step": 236797, "epoch": 1409} {"train_loss": -11.667396545410156, "global_step": 236798, "epoch": 1409} {"train_loss": -11.322586059570312, "global_step": 236799, "epoch": 1409} {"train_loss": -11.059831619262695, "global_step": 236800, "epoch": 1409} {"train_loss": -11.409367561340332, "global_step": 236801, "epoch": 1409} {"train_loss": -11.334442138671875, "global_step": 236802, "epoch": 1409} {"train_loss": -10.7958345413208, "global_step": 236803, "epoch": 1409} {"train_loss": -11.338306427001953, "global_step": 236804, "epoch": 1409} {"train_loss": -10.601058959960938, "global_step": 236805, "epoch": 1409} {"train_loss": -11.33542251586914, "global_step": 236806, "epoch": 1409} {"train_loss": -10.487922668457031, "global_step": 236807, "epoch": 1409} {"train_loss": -11.441490173339844, "global_step": 236808, "epoch": 1409} {"train_loss": -10.611549377441406, "global_step": 236809, "epoch": 1409} {"train_loss": -11.135801315307617, "global_step": 236810, "epoch": 1409} {"train_loss": -10.37378978729248, "global_step": 236811, "epoch": 1409} {"train_loss": -10.866028785705566, "global_step": 236812, "epoch": 1409} {"train_loss": -10.218862533569336, "global_step": 236813, "epoch": 1409} {"train_loss": -11.128583908081055, "global_step": 236814, "epoch": 1409} {"train_loss": -10.314976692199707, "global_step": 236815, "epoch": 1409} {"train_loss": -10.798714637756348, "global_step": 236816, "epoch": 1409} {"train_loss": -11.091405868530273, "global_step": 236817, "epoch": 1409} {"train_loss": -9.888777732849121, "global_step": 236818, "epoch": 1409} {"train_loss": -11.430099487304688, "global_step": 236819, "epoch": 1409} {"train_loss": -10.096057891845703, "global_step": 236820, "epoch": 1409} {"train_loss": -10.275102615356445, "global_step": 236821, "epoch": 1409} {"train_loss": -10.808229446411133, "global_step": 236822, "epoch": 1409} {"train_loss": -10.586124420166016, "global_step": 236823, "epoch": 1409} {"train_loss": -10.429174423217773, "global_step": 236824, "epoch": 1409} {"train_loss": -10.6676025390625, "global_step": 236825, "epoch": 1409} {"train_loss": -9.78176212310791, "global_step": 236826, "epoch": 1409} {"train_loss": -10.501398086547852, "global_step": 236827, "epoch": 1409} {"train_loss": -10.743666648864746, "global_step": 236828, "epoch": 1409} {"train_loss": -10.509468078613281, "global_step": 236829, "epoch": 1409} {"train_loss": -10.682265281677246, "global_step": 236830, "epoch": 1409} {"train_loss": -10.270486831665039, "global_step": 236831, "epoch": 1409} {"train_loss": -10.957621574401855, "global_step": 236832, "epoch": 1409} {"train_loss": -10.812942504882812, "global_step": 236833, "epoch": 1409} {"train_loss": -10.4630765914917, "global_step": 236834, "epoch": 1409} {"train_loss": -11.48025894165039, "global_step": 236835, "epoch": 1409} {"train_loss": -10.638813018798828, "global_step": 236836, "epoch": 1409} {"train_loss": -11.30954647064209, "global_step": 236837, "epoch": 1409} {"train_loss": -11.238670349121094, "global_step": 236838, "epoch": 1409} {"train_loss": -10.725032806396484, "global_step": 236839, "epoch": 1409} {"train_loss": -11.463231086730957, "global_step": 236840, "epoch": 1409} {"train_loss": -10.794581413269043, "global_step": 236841, "epoch": 1409} {"train_loss": -11.374709129333496, "global_step": 236842, "epoch": 1409} {"train_loss": -11.290437698364258, "global_step": 236843, "epoch": 1409} {"train_loss": -11.327728271484375, "global_step": 236844, "epoch": 1409} {"train_loss": -11.292678833007812, "global_step": 236845, "epoch": 1409} {"train_loss": -11.264939308166504, "global_step": 236846, "epoch": 1409} {"train_loss": -11.296075820922852, "global_step": 236847, "epoch": 1409} {"train_loss": -11.340766906738281, "global_step": 236848, "epoch": 1409} {"train_loss": -11.30035400390625, "global_step": 236849, "epoch": 1409} {"train_loss": -11.445051193237305, "global_step": 236850, "epoch": 1409} {"train_loss": -11.286712646484375, "global_step": 236851, "epoch": 1409} {"train_loss": -11.305532455444336, "global_step": 236852, "epoch": 1409} {"train_loss": -11.415787696838379, "global_step": 236853, "epoch": 1409} {"train_loss": -11.151449203491211, "global_step": 236854, "epoch": 1409} {"train_loss": -11.579845428466797, "global_step": 236855, "epoch": 1409} {"train_loss": -11.092389106750488, "global_step": 236856, "epoch": 1409} {"train_loss": -11.550825119018555, "global_step": 236857, "epoch": 1409} {"train_loss": -11.229586601257324, "global_step": 236858, "epoch": 1409} {"train_loss": -11.438892364501953, "global_step": 236859, "epoch": 1409} {"train_loss": -11.303707122802734, "global_step": 236860, "epoch": 1409} {"train_loss": -11.683666229248047, "global_step": 236861, "epoch": 1409} {"train_loss": -11.212125778198242, "global_step": 236862, "epoch": 1409} {"train_loss": -11.476556777954102, "global_step": 236863, "epoch": 1409} {"train_loss": -11.572572708129883, "global_step": 236864, "epoch": 1409} {"train_loss": -11.712236404418945, "global_step": 236865, "epoch": 1409} {"train_loss": -11.414310455322266, "global_step": 236866, "epoch": 1409} {"train_loss": -11.683830261230469, "global_step": 236867, "epoch": 1409} {"train_loss": -11.707906723022461, "global_step": 236868, "epoch": 1409} {"train_loss": -11.484209060668945, "global_step": 236869, "epoch": 1409} {"train_loss": -11.648412704467773, "global_step": 236870, "epoch": 1409} {"train_loss": -11.393449783325195, "global_step": 236871, "epoch": 1409} {"train_loss": -11.802043914794922, "global_step": 236872, "epoch": 1409} {"train_loss": -11.69320297241211, "global_step": 236873, "epoch": 1409} {"train_loss": -11.740201950073242, "global_step": 236874, "epoch": 1409} {"train_loss": -11.877485275268555, "global_step": 236875, "epoch": 1409} {"train_loss": -11.846531867980957, "global_step": 236876, "epoch": 1409} {"train_loss": -11.812723159790039, "global_step": 236877, "epoch": 1409} {"train_loss": -11.75533676147461, "global_step": 236878, "epoch": 1409} {"train_loss": -11.413087969734555, "global_step": 236879, "epoch": 1409, "val_loss": 265201.0625} {"train_loss": -11.717733383178711, "global_step": 236880, "epoch": 1410} {"train_loss": -11.798486709594727, "global_step": 236881, "epoch": 1410} {"train_loss": -11.857133865356445, "global_step": 236882, "epoch": 1410} {"train_loss": -11.840795516967773, "global_step": 236883, "epoch": 1410} {"train_loss": -11.642623901367188, "global_step": 236884, "epoch": 1410} {"train_loss": -11.876096725463867, "global_step": 236885, "epoch": 1410} {"train_loss": -11.719650268554688, "global_step": 236886, "epoch": 1410} {"train_loss": -11.877382278442383, "global_step": 236887, "epoch": 1410} {"train_loss": -11.889348983764648, "global_step": 236888, "epoch": 1410} {"train_loss": -11.742955207824707, "global_step": 236889, "epoch": 1410} {"train_loss": -11.98680305480957, "global_step": 236890, "epoch": 1410} {"train_loss": -11.789766311645508, "global_step": 236891, "epoch": 1410} {"train_loss": -12.01962661743164, "global_step": 236892, "epoch": 1410} {"train_loss": -11.840614318847656, "global_step": 236893, "epoch": 1410} {"train_loss": -11.919795989990234, "global_step": 236894, "epoch": 1410} {"train_loss": -11.985466003417969, "global_step": 236895, "epoch": 1410} {"train_loss": -12.054183006286621, "global_step": 236896, "epoch": 1410} {"train_loss": -12.01943588256836, "global_step": 236897, "epoch": 1410} {"train_loss": -11.73015022277832, "global_step": 236898, "epoch": 1410} {"train_loss": -12.023111343383789, "global_step": 236899, "epoch": 1410} {"train_loss": -11.78913688659668, "global_step": 236900, "epoch": 1410} {"train_loss": -11.925224304199219, "global_step": 236901, "epoch": 1410} {"train_loss": -11.934717178344727, "global_step": 236902, "epoch": 1410} {"train_loss": -12.123555183410645, "global_step": 236903, "epoch": 1410} {"train_loss": -12.10036849975586, "global_step": 236904, "epoch": 1410} {"train_loss": -11.776422500610352, "global_step": 236905, "epoch": 1410} {"train_loss": -11.915107727050781, "global_step": 236906, "epoch": 1410} {"train_loss": -11.601096153259277, "global_step": 236907, "epoch": 1410} {"train_loss": -11.640522003173828, "global_step": 236908, "epoch": 1410} {"train_loss": -11.658857345581055, "global_step": 236909, "epoch": 1410} {"train_loss": -11.190564155578613, "global_step": 236910, "epoch": 1410} {"train_loss": -11.61974048614502, "global_step": 236911, "epoch": 1410} {"train_loss": -11.660900115966797, "global_step": 236912, "epoch": 1410} {"train_loss": -11.653675079345703, "global_step": 236913, "epoch": 1410} {"train_loss": -11.807687759399414, "global_step": 236914, "epoch": 1410} {"train_loss": -11.942037582397461, "global_step": 236915, "epoch": 1410} {"train_loss": -11.806085586547852, "global_step": 236916, "epoch": 1410} {"train_loss": -12.0894775390625, "global_step": 236917, "epoch": 1410} {"train_loss": -11.93250846862793, "global_step": 236918, "epoch": 1410} {"train_loss": -11.736795425415039, "global_step": 236919, "epoch": 1410} {"train_loss": -11.613384246826172, "global_step": 236920, "epoch": 1410} {"train_loss": -11.680675506591797, "global_step": 236921, "epoch": 1410} {"train_loss": -11.825124740600586, "global_step": 236922, "epoch": 1410} {"train_loss": -11.959354400634766, "global_step": 236923, "epoch": 1410} {"train_loss": -11.88620376586914, "global_step": 236924, "epoch": 1410} {"train_loss": -11.945547103881836, "global_step": 236925, "epoch": 1410} {"train_loss": -11.886835098266602, "global_step": 236926, "epoch": 1410} {"train_loss": -12.071101188659668, "global_step": 236927, "epoch": 1410} {"train_loss": -12.070919036865234, "global_step": 236928, "epoch": 1410} {"train_loss": -11.847977638244629, "global_step": 236929, "epoch": 1410} {"train_loss": -11.855292320251465, "global_step": 236930, "epoch": 1410} {"train_loss": -11.978033065795898, "global_step": 236931, "epoch": 1410} {"train_loss": -12.042919158935547, "global_step": 236932, "epoch": 1410} {"train_loss": -11.77931022644043, "global_step": 236933, "epoch": 1410} {"train_loss": -11.886329650878906, "global_step": 236934, "epoch": 1410} {"train_loss": -11.097763061523438, "global_step": 236935, "epoch": 1410} {"train_loss": -11.73604965209961, "global_step": 236936, "epoch": 1410} {"train_loss": -11.715105056762695, "global_step": 236937, "epoch": 1410} {"train_loss": -11.625836372375488, "global_step": 236938, "epoch": 1410} {"train_loss": -11.919676780700684, "global_step": 236939, "epoch": 1410} {"train_loss": -11.963436126708984, "global_step": 236940, "epoch": 1410} {"train_loss": -11.66731071472168, "global_step": 236941, "epoch": 1410} {"train_loss": -11.630062103271484, "global_step": 236942, "epoch": 1410} {"train_loss": -12.104928970336914, "global_step": 236943, "epoch": 1410} {"train_loss": -11.972814559936523, "global_step": 236944, "epoch": 1410} {"train_loss": -11.613259315490723, "global_step": 236945, "epoch": 1410} {"train_loss": -11.4396333694458, "global_step": 236946, "epoch": 1410} {"train_loss": -11.422576904296875, "global_step": 236947, "epoch": 1410} {"train_loss": -11.748201370239258, "global_step": 236948, "epoch": 1410} {"train_loss": -11.623125076293945, "global_step": 236949, "epoch": 1410} {"train_loss": -11.796062469482422, "global_step": 236950, "epoch": 1410} {"train_loss": -11.418415069580078, "global_step": 236951, "epoch": 1410} {"train_loss": -11.757214546203613, "global_step": 236952, "epoch": 1410} {"train_loss": -11.675918579101562, "global_step": 236953, "epoch": 1410} {"train_loss": -11.261443138122559, "global_step": 236954, "epoch": 1410} {"train_loss": -11.08740234375, "global_step": 236955, "epoch": 1410} {"train_loss": -11.451886177062988, "global_step": 236956, "epoch": 1410} {"train_loss": -11.906707763671875, "global_step": 236957, "epoch": 1410} {"train_loss": -11.107398986816406, "global_step": 236958, "epoch": 1410} {"train_loss": -11.271160125732422, "global_step": 236959, "epoch": 1410} {"train_loss": -11.466375350952148, "global_step": 236960, "epoch": 1410} {"train_loss": -11.974345207214355, "global_step": 236961, "epoch": 1410} {"train_loss": -11.233379364013672, "global_step": 236962, "epoch": 1410} {"train_loss": -11.902023315429688, "global_step": 236963, "epoch": 1410} {"train_loss": -11.317182540893555, "global_step": 236964, "epoch": 1410} {"train_loss": -10.8795166015625, "global_step": 236965, "epoch": 1410} {"train_loss": -10.587523460388184, "global_step": 236966, "epoch": 1410} {"train_loss": -11.87473201751709, "global_step": 236967, "epoch": 1410} {"train_loss": -11.575052261352539, "global_step": 236968, "epoch": 1410} {"train_loss": -11.236589431762695, "global_step": 236969, "epoch": 1410} {"train_loss": -11.587322235107422, "global_step": 236970, "epoch": 1410} {"train_loss": -11.325027465820312, "global_step": 236971, "epoch": 1410} {"train_loss": -11.606184005737305, "global_step": 236972, "epoch": 1410} {"train_loss": -11.462679862976074, "global_step": 236973, "epoch": 1410} {"train_loss": -11.645356178283691, "global_step": 236974, "epoch": 1410} {"train_loss": -11.497501373291016, "global_step": 236975, "epoch": 1410} {"train_loss": -11.659540176391602, "global_step": 236976, "epoch": 1410} {"train_loss": -11.525106430053711, "global_step": 236977, "epoch": 1410} {"train_loss": -11.40490436553955, "global_step": 236978, "epoch": 1410} {"train_loss": -11.622248649597168, "global_step": 236979, "epoch": 1410} {"train_loss": -11.362667083740234, "global_step": 236980, "epoch": 1410} {"train_loss": -11.437786102294922, "global_step": 236981, "epoch": 1410} {"train_loss": -11.56051254272461, "global_step": 236982, "epoch": 1410} {"train_loss": -11.71483039855957, "global_step": 236983, "epoch": 1410} {"train_loss": -11.084741592407227, "global_step": 236984, "epoch": 1410} {"train_loss": -11.672136306762695, "global_step": 236985, "epoch": 1410} {"train_loss": -11.372442245483398, "global_step": 236986, "epoch": 1410} {"train_loss": -11.628671646118164, "global_step": 236987, "epoch": 1410} {"train_loss": -10.838735580444336, "global_step": 236988, "epoch": 1410} {"train_loss": -11.12309741973877, "global_step": 236989, "epoch": 1410} {"train_loss": -11.191816329956055, "global_step": 236990, "epoch": 1410} {"train_loss": -10.837501525878906, "global_step": 236991, "epoch": 1410} {"train_loss": -11.078319549560547, "global_step": 236992, "epoch": 1410} {"train_loss": -10.963996887207031, "global_step": 236993, "epoch": 1410} {"train_loss": -11.480298042297363, "global_step": 236994, "epoch": 1410} {"train_loss": -10.802030563354492, "global_step": 236995, "epoch": 1410} {"train_loss": -11.498828887939453, "global_step": 236996, "epoch": 1410} {"train_loss": -11.160734176635742, "global_step": 236997, "epoch": 1410} {"train_loss": -11.47566032409668, "global_step": 236998, "epoch": 1410} {"train_loss": -10.980596542358398, "global_step": 236999, "epoch": 1410} {"train_loss": -11.194063186645508, "global_step": 237000, "epoch": 1410} {"train_loss": -11.654729843139648, "global_step": 237001, "epoch": 1410} {"train_loss": -11.056280136108398, "global_step": 237002, "epoch": 1410} {"train_loss": -11.223369598388672, "global_step": 237003, "epoch": 1410} {"train_loss": -11.058156967163086, "global_step": 237004, "epoch": 1410} {"train_loss": -11.228226661682129, "global_step": 237005, "epoch": 1410} {"train_loss": -11.313461303710938, "global_step": 237006, "epoch": 1410} {"train_loss": -11.134772300720215, "global_step": 237007, "epoch": 1410} {"train_loss": -11.350570678710938, "global_step": 237008, "epoch": 1410} {"train_loss": -11.517900466918945, "global_step": 237009, "epoch": 1410} {"train_loss": -11.218039512634277, "global_step": 237010, "epoch": 1410} {"train_loss": -10.880664825439453, "global_step": 237011, "epoch": 1410} {"train_loss": -11.519265174865723, "global_step": 237012, "epoch": 1410} {"train_loss": -10.570857048034668, "global_step": 237013, "epoch": 1410} {"train_loss": -11.075878143310547, "global_step": 237014, "epoch": 1410} {"train_loss": -10.769222259521484, "global_step": 237015, "epoch": 1410} {"train_loss": -11.184017181396484, "global_step": 237016, "epoch": 1410} {"train_loss": -11.25832748413086, "global_step": 237017, "epoch": 1410} {"train_loss": -10.721291542053223, "global_step": 237018, "epoch": 1410} {"train_loss": -11.466315269470215, "global_step": 237019, "epoch": 1410} {"train_loss": -11.39776611328125, "global_step": 237020, "epoch": 1410} {"train_loss": -11.35070514678955, "global_step": 237021, "epoch": 1410} {"train_loss": -11.458598136901855, "global_step": 237022, "epoch": 1410} {"train_loss": -11.750123023986816, "global_step": 237023, "epoch": 1410} {"train_loss": -11.324078559875488, "global_step": 237024, "epoch": 1410} {"train_loss": -11.693547248840332, "global_step": 237025, "epoch": 1410} {"train_loss": -11.57630443572998, "global_step": 237026, "epoch": 1410} {"train_loss": -11.555002212524414, "global_step": 237027, "epoch": 1410} {"train_loss": -11.66992473602295, "global_step": 237028, "epoch": 1410} {"train_loss": -11.558732032775879, "global_step": 237029, "epoch": 1410} {"train_loss": -11.711742401123047, "global_step": 237030, "epoch": 1410} {"train_loss": -11.457168579101562, "global_step": 237031, "epoch": 1410} {"train_loss": -11.888265609741211, "global_step": 237032, "epoch": 1410} {"train_loss": -11.769433975219727, "global_step": 237033, "epoch": 1410} {"train_loss": -11.779208183288574, "global_step": 237034, "epoch": 1410} {"train_loss": -11.656607627868652, "global_step": 237035, "epoch": 1410} {"train_loss": -11.745264053344727, "global_step": 237036, "epoch": 1410} {"train_loss": -11.797926902770996, "global_step": 237037, "epoch": 1410} {"train_loss": -11.755599975585938, "global_step": 237038, "epoch": 1410} {"train_loss": -11.61775016784668, "global_step": 237039, "epoch": 1410} {"train_loss": -11.75234603881836, "global_step": 237040, "epoch": 1410} {"train_loss": -11.47048568725586, "global_step": 237041, "epoch": 1410} {"train_loss": -11.96933364868164, "global_step": 237042, "epoch": 1410} {"train_loss": -11.719376564025879, "global_step": 237043, "epoch": 1410} {"train_loss": -11.763256072998047, "global_step": 237044, "epoch": 1410} {"train_loss": -12.012726783752441, "global_step": 237045, "epoch": 1410} {"train_loss": -11.797550201416016, "global_step": 237046, "epoch": 1410} {"train_loss": -11.587343352181572, "global_step": 237047, "epoch": 1410, "val_loss": 265724.90625, "train_action_mse_error": 1.3199297189712524} {"train_loss": -11.494569778442383, "global_step": 237048, "epoch": 1411} {"train_loss": -11.861245155334473, "global_step": 237049, "epoch": 1411} {"train_loss": -12.015419006347656, "global_step": 237050, "epoch": 1411} {"train_loss": -12.072221755981445, "global_step": 237051, "epoch": 1411} {"train_loss": -11.775365829467773, "global_step": 237052, "epoch": 1411} {"train_loss": -11.963290214538574, "global_step": 237053, "epoch": 1411} {"train_loss": -11.873144149780273, "global_step": 237054, "epoch": 1411} {"train_loss": -11.76369857788086, "global_step": 237055, "epoch": 1411} {"train_loss": -12.124069213867188, "global_step": 237056, "epoch": 1411} {"train_loss": -11.525226593017578, "global_step": 237057, "epoch": 1411} {"train_loss": -11.99139404296875, "global_step": 237058, "epoch": 1411} {"train_loss": -11.978521347045898, "global_step": 237059, "epoch": 1411} {"train_loss": -11.667234420776367, "global_step": 237060, "epoch": 1411} {"train_loss": -11.762939453125, "global_step": 237061, "epoch": 1411} {"train_loss": -12.040196418762207, "global_step": 237062, "epoch": 1411} {"train_loss": -12.009936332702637, "global_step": 237063, "epoch": 1411} {"train_loss": -12.069397926330566, "global_step": 237064, "epoch": 1411} {"train_loss": -12.051580429077148, "global_step": 237065, "epoch": 1411} {"train_loss": -11.78790283203125, "global_step": 237066, "epoch": 1411} {"train_loss": -11.853498458862305, "global_step": 237067, "epoch": 1411} {"train_loss": -12.008091926574707, "global_step": 237068, "epoch": 1411} {"train_loss": -11.967267990112305, "global_step": 237069, "epoch": 1411} {"train_loss": -11.641401290893555, "global_step": 237070, "epoch": 1411} {"train_loss": -11.356151580810547, "global_step": 237071, "epoch": 1411} {"train_loss": -11.687475204467773, "global_step": 237072, "epoch": 1411} {"train_loss": -11.136636734008789, "global_step": 237073, "epoch": 1411} {"train_loss": -11.316831588745117, "global_step": 237074, "epoch": 1411} {"train_loss": -11.788708686828613, "global_step": 237075, "epoch": 1411} {"train_loss": -10.96702766418457, "global_step": 237076, "epoch": 1411} {"train_loss": -11.150177001953125, "global_step": 237077, "epoch": 1411} {"train_loss": -11.384926795959473, "global_step": 237078, "epoch": 1411} {"train_loss": -11.681400299072266, "global_step": 237079, "epoch": 1411} {"train_loss": -10.890792846679688, "global_step": 237080, "epoch": 1411} {"train_loss": -10.619340896606445, "global_step": 237081, "epoch": 1411} {"train_loss": -11.517921447753906, "global_step": 237082, "epoch": 1411} {"train_loss": -11.793513298034668, "global_step": 237083, "epoch": 1411} {"train_loss": -10.513814926147461, "global_step": 237084, "epoch": 1411} {"train_loss": -9.429311752319336, "global_step": 237085, "epoch": 1411} {"train_loss": -11.430194854736328, "global_step": 237086, "epoch": 1411} {"train_loss": -10.584766387939453, "global_step": 237087, "epoch": 1411} {"train_loss": -11.325408935546875, "global_step": 237088, "epoch": 1411} {"train_loss": -10.350101470947266, "global_step": 237089, "epoch": 1411} {"train_loss": -11.543319702148438, "global_step": 237090, "epoch": 1411} {"train_loss": -11.311800003051758, "global_step": 237091, "epoch": 1411} {"train_loss": -11.179732322692871, "global_step": 237092, "epoch": 1411} {"train_loss": -11.366275787353516, "global_step": 237093, "epoch": 1411} {"train_loss": -11.52134895324707, "global_step": 237094, "epoch": 1411} {"train_loss": -11.476988792419434, "global_step": 237095, "epoch": 1411} {"train_loss": -11.125007629394531, "global_step": 237096, "epoch": 1411} {"train_loss": -11.534034729003906, "global_step": 237097, "epoch": 1411} {"train_loss": -11.231328964233398, "global_step": 237098, "epoch": 1411} {"train_loss": -11.72273063659668, "global_step": 237099, "epoch": 1411} {"train_loss": -11.01919937133789, "global_step": 237100, "epoch": 1411} {"train_loss": -11.820124626159668, "global_step": 237101, "epoch": 1411} {"train_loss": -10.653158187866211, "global_step": 237102, "epoch": 1411} {"train_loss": -10.549418449401855, "global_step": 237103, "epoch": 1411} {"train_loss": -10.724601745605469, "global_step": 237104, "epoch": 1411} {"train_loss": -10.842331886291504, "global_step": 237105, "epoch": 1411} {"train_loss": -10.069665908813477, "global_step": 237106, "epoch": 1411} {"train_loss": -10.798089981079102, "global_step": 237107, "epoch": 1411} {"train_loss": -10.516141891479492, "global_step": 237108, "epoch": 1411} {"train_loss": -10.493633270263672, "global_step": 237109, "epoch": 1411} {"train_loss": -9.922167778015137, "global_step": 237110, "epoch": 1411} {"train_loss": -10.466672897338867, "global_step": 237111, "epoch": 1411} {"train_loss": -9.470640182495117, "global_step": 237112, "epoch": 1411} {"train_loss": -11.512350082397461, "global_step": 237113, "epoch": 1411} {"train_loss": -9.869606018066406, "global_step": 237114, "epoch": 1411} {"train_loss": -11.39553451538086, "global_step": 237115, "epoch": 1411} {"train_loss": -10.605195999145508, "global_step": 237116, "epoch": 1411} {"train_loss": -10.763956069946289, "global_step": 237117, "epoch": 1411} {"train_loss": -11.154720306396484, "global_step": 237118, "epoch": 1411} {"train_loss": -11.089628219604492, "global_step": 237119, "epoch": 1411} {"train_loss": -10.74903392791748, "global_step": 237120, "epoch": 1411} {"train_loss": -11.416873931884766, "global_step": 237121, "epoch": 1411} {"train_loss": -10.973146438598633, "global_step": 237122, "epoch": 1411} {"train_loss": -11.466170310974121, "global_step": 237123, "epoch": 1411} {"train_loss": -11.239904403686523, "global_step": 237124, "epoch": 1411} {"train_loss": -11.112112045288086, "global_step": 237125, "epoch": 1411} {"train_loss": -10.804344177246094, "global_step": 237126, "epoch": 1411} {"train_loss": -11.268617630004883, "global_step": 237127, "epoch": 1411} {"train_loss": -11.416143417358398, "global_step": 237128, "epoch": 1411} {"train_loss": -11.086464881896973, "global_step": 237129, "epoch": 1411} {"train_loss": -11.411805152893066, "global_step": 237130, "epoch": 1411} {"train_loss": -11.624929428100586, "global_step": 237131, "epoch": 1411} {"train_loss": -11.212911605834961, "global_step": 237132, "epoch": 1411} {"train_loss": -11.582464218139648, "global_step": 237133, "epoch": 1411} {"train_loss": -11.465917587280273, "global_step": 237134, "epoch": 1411} {"train_loss": -11.445756912231445, "global_step": 237135, "epoch": 1411} {"train_loss": -11.367914199829102, "global_step": 237136, "epoch": 1411} {"train_loss": -11.734113693237305, "global_step": 237137, "epoch": 1411} {"train_loss": -11.728670120239258, "global_step": 237138, "epoch": 1411} {"train_loss": -11.49759292602539, "global_step": 237139, "epoch": 1411} {"train_loss": -11.625081062316895, "global_step": 237140, "epoch": 1411} {"train_loss": -11.546560287475586, "global_step": 237141, "epoch": 1411} {"train_loss": -11.521282196044922, "global_step": 237142, "epoch": 1411} {"train_loss": -11.379886627197266, "global_step": 237143, "epoch": 1411} {"train_loss": -11.714106559753418, "global_step": 237144, "epoch": 1411} {"train_loss": -11.672266006469727, "global_step": 237145, "epoch": 1411} {"train_loss": -11.648866653442383, "global_step": 237146, "epoch": 1411} {"train_loss": -11.64065933227539, "global_step": 237147, "epoch": 1411} {"train_loss": -11.52109146118164, "global_step": 237148, "epoch": 1411} {"train_loss": -11.772085189819336, "global_step": 237149, "epoch": 1411} {"train_loss": -11.760622024536133, "global_step": 237150, "epoch": 1411} {"train_loss": -11.675066947937012, "global_step": 237151, "epoch": 1411} {"train_loss": -11.501041412353516, "global_step": 237152, "epoch": 1411} {"train_loss": -11.639921188354492, "global_step": 237153, "epoch": 1411} {"train_loss": -11.71190357208252, "global_step": 237154, "epoch": 1411} {"train_loss": -11.584085464477539, "global_step": 237155, "epoch": 1411} {"train_loss": -11.730145454406738, "global_step": 237156, "epoch": 1411} {"train_loss": -11.485273361206055, "global_step": 237157, "epoch": 1411} {"train_loss": -11.707656860351562, "global_step": 237158, "epoch": 1411} {"train_loss": -11.715353012084961, "global_step": 237159, "epoch": 1411} {"train_loss": -11.501605987548828, "global_step": 237160, "epoch": 1411} {"train_loss": -11.852124214172363, "global_step": 237161, "epoch": 1411} {"train_loss": -11.335579872131348, "global_step": 237162, "epoch": 1411} {"train_loss": -11.580061912536621, "global_step": 237163, "epoch": 1411} {"train_loss": -11.542413711547852, "global_step": 237164, "epoch": 1411} {"train_loss": -11.603803634643555, "global_step": 237165, "epoch": 1411} {"train_loss": -11.689384460449219, "global_step": 237166, "epoch": 1411} {"train_loss": -11.289874076843262, "global_step": 237167, "epoch": 1411} {"train_loss": -11.478588104248047, "global_step": 237168, "epoch": 1411} {"train_loss": -11.650815963745117, "global_step": 237169, "epoch": 1411} {"train_loss": -11.532196044921875, "global_step": 237170, "epoch": 1411} {"train_loss": -11.897137641906738, "global_step": 237171, "epoch": 1411} {"train_loss": -11.822486877441406, "global_step": 237172, "epoch": 1411} {"train_loss": -11.750507354736328, "global_step": 237173, "epoch": 1411} {"train_loss": -11.825652122497559, "global_step": 237174, "epoch": 1411} {"train_loss": -11.330221176147461, "global_step": 237175, "epoch": 1411} {"train_loss": -11.711021423339844, "global_step": 237176, "epoch": 1411} {"train_loss": -11.709714889526367, "global_step": 237177, "epoch": 1411} {"train_loss": -11.380072593688965, "global_step": 237178, "epoch": 1411} {"train_loss": -11.719337463378906, "global_step": 237179, "epoch": 1411} {"train_loss": -11.835348129272461, "global_step": 237180, "epoch": 1411} {"train_loss": -11.805769920349121, "global_step": 237181, "epoch": 1411} {"train_loss": -11.914170265197754, "global_step": 237182, "epoch": 1411} {"train_loss": -11.843400955200195, "global_step": 237183, "epoch": 1411} {"train_loss": -12.140100479125977, "global_step": 237184, "epoch": 1411} {"train_loss": -12.067848205566406, "global_step": 237185, "epoch": 1411} {"train_loss": -12.080865859985352, "global_step": 237186, "epoch": 1411} {"train_loss": -12.005179405212402, "global_step": 237187, "epoch": 1411} {"train_loss": -12.117799758911133, "global_step": 237188, "epoch": 1411} {"train_loss": -11.718169212341309, "global_step": 237189, "epoch": 1411} {"train_loss": -11.755359649658203, "global_step": 237190, "epoch": 1411} {"train_loss": -11.955240249633789, "global_step": 237191, "epoch": 1411} {"train_loss": -11.898250579833984, "global_step": 237192, "epoch": 1411} {"train_loss": -11.806960105895996, "global_step": 237193, "epoch": 1411} {"train_loss": -11.931408882141113, "global_step": 237194, "epoch": 1411} {"train_loss": -11.816370010375977, "global_step": 237195, "epoch": 1411} {"train_loss": -11.646734237670898, "global_step": 237196, "epoch": 1411} {"train_loss": -12.002546310424805, "global_step": 237197, "epoch": 1411} {"train_loss": -11.658028602600098, "global_step": 237198, "epoch": 1411} {"train_loss": -11.590522766113281, "global_step": 237199, "epoch": 1411} {"train_loss": -11.742259979248047, "global_step": 237200, "epoch": 1411} {"train_loss": -11.521418571472168, "global_step": 237201, "epoch": 1411} {"train_loss": -11.971199035644531, "global_step": 237202, "epoch": 1411} {"train_loss": -11.923845291137695, "global_step": 237203, "epoch": 1411} {"train_loss": -11.152243614196777, "global_step": 237204, "epoch": 1411} {"train_loss": -11.62257194519043, "global_step": 237205, "epoch": 1411} {"train_loss": -11.63054084777832, "global_step": 237206, "epoch": 1411} {"train_loss": -11.364683151245117, "global_step": 237207, "epoch": 1411} {"train_loss": -11.71016788482666, "global_step": 237208, "epoch": 1411} {"train_loss": -11.558029174804688, "global_step": 237209, "epoch": 1411} {"train_loss": -12.011128425598145, "global_step": 237210, "epoch": 1411} {"train_loss": -11.537616729736328, "global_step": 237211, "epoch": 1411} {"train_loss": -11.916553497314453, "global_step": 237212, "epoch": 1411} {"train_loss": -11.6900053024292, "global_step": 237213, "epoch": 1411} {"train_loss": -11.291556358337402, "global_step": 237214, "epoch": 1411} {"train_loss": -11.46851806981223, "global_step": 237215, "epoch": 1411, "val_loss": 265014.71875} {"train_loss": -10.331195831298828, "global_step": 237216, "epoch": 1412} {"train_loss": -10.701202392578125, "global_step": 237217, "epoch": 1412} {"train_loss": -11.639324188232422, "global_step": 237218, "epoch": 1412} {"train_loss": -10.362486839294434, "global_step": 237219, "epoch": 1412} {"train_loss": -7.875759601593018, "global_step": 237220, "epoch": 1412} {"train_loss": -9.005216598510742, "global_step": 237221, "epoch": 1412} {"train_loss": -10.56689453125, "global_step": 237222, "epoch": 1412} {"train_loss": -9.837899208068848, "global_step": 237223, "epoch": 1412} {"train_loss": -9.626094818115234, "global_step": 237224, "epoch": 1412} {"train_loss": -9.754768371582031, "global_step": 237225, "epoch": 1412} {"train_loss": -9.80058479309082, "global_step": 237226, "epoch": 1412} {"train_loss": -10.79833984375, "global_step": 237227, "epoch": 1412} {"train_loss": -9.889266014099121, "global_step": 237228, "epoch": 1412} {"train_loss": -9.843667030334473, "global_step": 237229, "epoch": 1412} {"train_loss": -10.817516326904297, "global_step": 237230, "epoch": 1412} {"train_loss": -10.120052337646484, "global_step": 237231, "epoch": 1412} {"train_loss": -10.216440200805664, "global_step": 237232, "epoch": 1412} {"train_loss": -9.773740768432617, "global_step": 237233, "epoch": 1412} {"train_loss": -10.041285514831543, "global_step": 237234, "epoch": 1412} {"train_loss": -10.315351486206055, "global_step": 237235, "epoch": 1412} {"train_loss": -9.92265510559082, "global_step": 237236, "epoch": 1412} {"train_loss": -10.13524341583252, "global_step": 237237, "epoch": 1412} {"train_loss": -11.115509033203125, "global_step": 237238, "epoch": 1412} {"train_loss": -9.882431983947754, "global_step": 237239, "epoch": 1412} {"train_loss": -11.049016952514648, "global_step": 237240, "epoch": 1412} {"train_loss": -11.083784103393555, "global_step": 237241, "epoch": 1412} {"train_loss": -11.157344818115234, "global_step": 237242, "epoch": 1412} {"train_loss": -11.27471923828125, "global_step": 237243, "epoch": 1412} {"train_loss": -11.053061485290527, "global_step": 237244, "epoch": 1412} {"train_loss": -11.002517700195312, "global_step": 237245, "epoch": 1412} {"train_loss": -11.482599258422852, "global_step": 237246, "epoch": 1412} {"train_loss": -11.252397537231445, "global_step": 237247, "epoch": 1412} {"train_loss": -11.140115737915039, "global_step": 237248, "epoch": 1412} {"train_loss": -11.303020477294922, "global_step": 237249, "epoch": 1412} {"train_loss": -11.541986465454102, "global_step": 237250, "epoch": 1412} {"train_loss": -11.391373634338379, "global_step": 237251, "epoch": 1412} {"train_loss": -11.507296562194824, "global_step": 237252, "epoch": 1412} {"train_loss": -11.52432632446289, "global_step": 237253, "epoch": 1412} {"train_loss": -11.55374526977539, "global_step": 237254, "epoch": 1412} {"train_loss": -11.763147354125977, "global_step": 237255, "epoch": 1412} {"train_loss": -11.475445747375488, "global_step": 237256, "epoch": 1412} {"train_loss": -11.718103408813477, "global_step": 237257, "epoch": 1412} {"train_loss": -11.501084327697754, "global_step": 237258, "epoch": 1412} {"train_loss": -11.496042251586914, "global_step": 237259, "epoch": 1412} {"train_loss": -11.61964225769043, "global_step": 237260, "epoch": 1412} {"train_loss": -11.583625793457031, "global_step": 237261, "epoch": 1412} {"train_loss": -11.569292068481445, "global_step": 237262, "epoch": 1412} {"train_loss": -11.708797454833984, "global_step": 237263, "epoch": 1412} {"train_loss": -11.644160270690918, "global_step": 237264, "epoch": 1412} {"train_loss": -11.623958587646484, "global_step": 237265, "epoch": 1412} {"train_loss": -11.552261352539062, "global_step": 237266, "epoch": 1412} {"train_loss": -11.331673622131348, "global_step": 237267, "epoch": 1412} {"train_loss": -11.72319221496582, "global_step": 237268, "epoch": 1412} {"train_loss": -11.93606948852539, "global_step": 237269, "epoch": 1412} {"train_loss": -11.850476264953613, "global_step": 237270, "epoch": 1412} {"train_loss": -11.566959381103516, "global_step": 237271, "epoch": 1412} {"train_loss": -11.718595504760742, "global_step": 237272, "epoch": 1412} {"train_loss": -11.793428421020508, "global_step": 237273, "epoch": 1412} {"train_loss": -11.924459457397461, "global_step": 237274, "epoch": 1412} {"train_loss": -11.946032524108887, "global_step": 237275, "epoch": 1412} {"train_loss": -11.921745300292969, "global_step": 237276, "epoch": 1412} {"train_loss": -11.777721405029297, "global_step": 237277, "epoch": 1412} {"train_loss": -11.892965316772461, "global_step": 237278, "epoch": 1412} {"train_loss": -12.04666519165039, "global_step": 237279, "epoch": 1412} {"train_loss": -11.798171997070312, "global_step": 237280, "epoch": 1412} {"train_loss": -12.016759872436523, "global_step": 237281, "epoch": 1412} {"train_loss": -12.073354721069336, "global_step": 237282, "epoch": 1412} {"train_loss": -11.882000923156738, "global_step": 237283, "epoch": 1412} {"train_loss": -11.93316650390625, "global_step": 237284, "epoch": 1412} {"train_loss": -11.907339096069336, "global_step": 237285, "epoch": 1412} {"train_loss": -12.169760704040527, "global_step": 237286, "epoch": 1412} {"train_loss": -12.054969787597656, "global_step": 237287, "epoch": 1412} {"train_loss": -12.077689170837402, "global_step": 237288, "epoch": 1412} {"train_loss": -12.072690963745117, "global_step": 237289, "epoch": 1412} {"train_loss": -12.121776580810547, "global_step": 237290, "epoch": 1412} {"train_loss": -11.976751327514648, "global_step": 237291, "epoch": 1412} {"train_loss": -11.938935279846191, "global_step": 237292, "epoch": 1412} {"train_loss": -11.930418014526367, "global_step": 237293, "epoch": 1412} {"train_loss": -12.107035636901855, "global_step": 237294, "epoch": 1412} {"train_loss": -12.075069427490234, "global_step": 237295, "epoch": 1412} {"train_loss": -12.04068374633789, "global_step": 237296, "epoch": 1412} {"train_loss": -12.129305839538574, "global_step": 237297, "epoch": 1412} {"train_loss": -12.031549453735352, "global_step": 237298, "epoch": 1412} {"train_loss": -12.060567855834961, "global_step": 237299, "epoch": 1412} {"train_loss": -12.036312103271484, "global_step": 237300, "epoch": 1412} {"train_loss": -12.09310245513916, "global_step": 237301, "epoch": 1412} {"train_loss": -12.18088436126709, "global_step": 237302, "epoch": 1412} {"train_loss": -12.223067283630371, "global_step": 237303, "epoch": 1412} {"train_loss": -12.110075950622559, "global_step": 237304, "epoch": 1412} {"train_loss": -11.979940414428711, "global_step": 237305, "epoch": 1412} {"train_loss": -12.145549774169922, "global_step": 237306, "epoch": 1412} {"train_loss": -11.985343933105469, "global_step": 237307, "epoch": 1412} {"train_loss": -12.06984806060791, "global_step": 237308, "epoch": 1412} {"train_loss": -11.990751266479492, "global_step": 237309, "epoch": 1412} {"train_loss": -12.024433135986328, "global_step": 237310, "epoch": 1412} {"train_loss": -12.14848518371582, "global_step": 237311, "epoch": 1412} {"train_loss": -11.960342407226562, "global_step": 237312, "epoch": 1412} {"train_loss": -11.815200805664062, "global_step": 237313, "epoch": 1412} {"train_loss": -12.020137786865234, "global_step": 237314, "epoch": 1412} {"train_loss": -12.253657341003418, "global_step": 237315, "epoch": 1412} {"train_loss": -12.190435409545898, "global_step": 237316, "epoch": 1412} {"train_loss": -11.957380294799805, "global_step": 237317, "epoch": 1412} {"train_loss": -11.754940032958984, "global_step": 237318, "epoch": 1412} {"train_loss": -11.893310546875, "global_step": 237319, "epoch": 1412} {"train_loss": -11.677041053771973, "global_step": 237320, "epoch": 1412} {"train_loss": -11.872854232788086, "global_step": 237321, "epoch": 1412} {"train_loss": -11.555866241455078, "global_step": 237322, "epoch": 1412} {"train_loss": -10.725343704223633, "global_step": 237323, "epoch": 1412} {"train_loss": -10.644596099853516, "global_step": 237324, "epoch": 1412} {"train_loss": -11.858036041259766, "global_step": 237325, "epoch": 1412} {"train_loss": -11.494630813598633, "global_step": 237326, "epoch": 1412} {"train_loss": -11.095057487487793, "global_step": 237327, "epoch": 1412} {"train_loss": -11.689640998840332, "global_step": 237328, "epoch": 1412} {"train_loss": -11.690675735473633, "global_step": 237329, "epoch": 1412} {"train_loss": -11.00174331665039, "global_step": 237330, "epoch": 1412} {"train_loss": -11.194697380065918, "global_step": 237331, "epoch": 1412} {"train_loss": -11.090202331542969, "global_step": 237332, "epoch": 1412} {"train_loss": -11.52491569519043, "global_step": 237333, "epoch": 1412} {"train_loss": -11.079071998596191, "global_step": 237334, "epoch": 1412} {"train_loss": -10.686988830566406, "global_step": 237335, "epoch": 1412} {"train_loss": -10.976032257080078, "global_step": 237336, "epoch": 1412} {"train_loss": -11.829030990600586, "global_step": 237337, "epoch": 1412} {"train_loss": -10.806900024414062, "global_step": 237338, "epoch": 1412} {"train_loss": -11.439361572265625, "global_step": 237339, "epoch": 1412} {"train_loss": -11.22705078125, "global_step": 237340, "epoch": 1412} {"train_loss": -11.365632057189941, "global_step": 237341, "epoch": 1412} {"train_loss": -11.147379875183105, "global_step": 237342, "epoch": 1412} {"train_loss": -11.83657455444336, "global_step": 237343, "epoch": 1412} {"train_loss": -11.52208137512207, "global_step": 237344, "epoch": 1412} {"train_loss": -11.403481483459473, "global_step": 237345, "epoch": 1412} {"train_loss": -11.846563339233398, "global_step": 237346, "epoch": 1412} {"train_loss": -11.047757148742676, "global_step": 237347, "epoch": 1412} {"train_loss": -11.078262329101562, "global_step": 237348, "epoch": 1412} {"train_loss": -11.737104415893555, "global_step": 237349, "epoch": 1412} {"train_loss": -11.335180282592773, "global_step": 237350, "epoch": 1412} {"train_loss": -10.499807357788086, "global_step": 237351, "epoch": 1412} {"train_loss": -11.544746398925781, "global_step": 237352, "epoch": 1412} {"train_loss": -11.0503568649292, "global_step": 237353, "epoch": 1412} {"train_loss": -10.657880783081055, "global_step": 237354, "epoch": 1412} {"train_loss": -11.622833251953125, "global_step": 237355, "epoch": 1412} {"train_loss": -9.875643730163574, "global_step": 237356, "epoch": 1412} {"train_loss": -11.232924461364746, "global_step": 237357, "epoch": 1412} {"train_loss": -11.114323616027832, "global_step": 237358, "epoch": 1412} {"train_loss": -10.744586944580078, "global_step": 237359, "epoch": 1412} {"train_loss": -11.622091293334961, "global_step": 237360, "epoch": 1412} {"train_loss": -11.301825523376465, "global_step": 237361, "epoch": 1412} {"train_loss": -11.191412925720215, "global_step": 237362, "epoch": 1412} {"train_loss": -11.438183784484863, "global_step": 237363, "epoch": 1412} {"train_loss": -10.799537658691406, "global_step": 237364, "epoch": 1412} {"train_loss": -11.589664459228516, "global_step": 237365, "epoch": 1412} {"train_loss": -11.119537353515625, "global_step": 237366, "epoch": 1412} {"train_loss": -11.411657333374023, "global_step": 237367, "epoch": 1412} {"train_loss": -11.138252258300781, "global_step": 237368, "epoch": 1412} {"train_loss": -11.064699172973633, "global_step": 237369, "epoch": 1412} {"train_loss": -11.45369815826416, "global_step": 237370, "epoch": 1412} {"train_loss": -10.849660873413086, "global_step": 237371, "epoch": 1412} {"train_loss": -11.547813415527344, "global_step": 237372, "epoch": 1412} {"train_loss": -10.48171329498291, "global_step": 237373, "epoch": 1412} {"train_loss": -11.5167236328125, "global_step": 237374, "epoch": 1412} {"train_loss": -10.723346710205078, "global_step": 237375, "epoch": 1412} {"train_loss": -11.101211547851562, "global_step": 237376, "epoch": 1412} {"train_loss": -10.6953706741333, "global_step": 237377, "epoch": 1412} {"train_loss": -11.15081787109375, "global_step": 237378, "epoch": 1412} {"train_loss": -10.97134017944336, "global_step": 237379, "epoch": 1412} {"train_loss": -11.074356079101562, "global_step": 237380, "epoch": 1412} {"train_loss": -11.055915832519531, "global_step": 237381, "epoch": 1412} {"train_loss": -11.375189781188965, "global_step": 237382, "epoch": 1412} {"train_loss": -11.33100160814467, "global_step": 237383, "epoch": 1412, "val_loss": 264671.53125} {"train_loss": -11.652008056640625, "global_step": 237384, "epoch": 1413} {"train_loss": -11.405638694763184, "global_step": 237385, "epoch": 1413} {"train_loss": -11.266317367553711, "global_step": 237386, "epoch": 1413} {"train_loss": -11.543798446655273, "global_step": 237387, "epoch": 1413} {"train_loss": -11.18233871459961, "global_step": 237388, "epoch": 1413} {"train_loss": -11.403083801269531, "global_step": 237389, "epoch": 1413} {"train_loss": -11.129003524780273, "global_step": 237390, "epoch": 1413} {"train_loss": -11.65993881225586, "global_step": 237391, "epoch": 1413} {"train_loss": -11.387100219726562, "global_step": 237392, "epoch": 1413} {"train_loss": -11.457775115966797, "global_step": 237393, "epoch": 1413} {"train_loss": -11.695785522460938, "global_step": 237394, "epoch": 1413} {"train_loss": -11.518228530883789, "global_step": 237395, "epoch": 1413} {"train_loss": -11.718902587890625, "global_step": 237396, "epoch": 1413} {"train_loss": -11.406404495239258, "global_step": 237397, "epoch": 1413} {"train_loss": -11.397195816040039, "global_step": 237398, "epoch": 1413} {"train_loss": -11.508885383605957, "global_step": 237399, "epoch": 1413} {"train_loss": -11.626115798950195, "global_step": 237400, "epoch": 1413} {"train_loss": -11.734956741333008, "global_step": 237401, "epoch": 1413} {"train_loss": -11.528984069824219, "global_step": 237402, "epoch": 1413} {"train_loss": -11.75792407989502, "global_step": 237403, "epoch": 1413} {"train_loss": -11.419787406921387, "global_step": 237404, "epoch": 1413} {"train_loss": -11.876408576965332, "global_step": 237405, "epoch": 1413} {"train_loss": -11.870063781738281, "global_step": 237406, "epoch": 1413} {"train_loss": -11.777108192443848, "global_step": 237407, "epoch": 1413} {"train_loss": -11.760125160217285, "global_step": 237408, "epoch": 1413} {"train_loss": -11.949365615844727, "global_step": 237409, "epoch": 1413} {"train_loss": -11.924118995666504, "global_step": 237410, "epoch": 1413} {"train_loss": -11.835260391235352, "global_step": 237411, "epoch": 1413} {"train_loss": -11.90108871459961, "global_step": 237412, "epoch": 1413} {"train_loss": -11.959836959838867, "global_step": 237413, "epoch": 1413} {"train_loss": -11.821155548095703, "global_step": 237414, "epoch": 1413} {"train_loss": -11.925139427185059, "global_step": 237415, "epoch": 1413} {"train_loss": -11.832869529724121, "global_step": 237416, "epoch": 1413} {"train_loss": -11.847726821899414, "global_step": 237417, "epoch": 1413} {"train_loss": -12.017919540405273, "global_step": 237418, "epoch": 1413} {"train_loss": -11.766477584838867, "global_step": 237419, "epoch": 1413} {"train_loss": -12.021233558654785, "global_step": 237420, "epoch": 1413} {"train_loss": -11.738937377929688, "global_step": 237421, "epoch": 1413} {"train_loss": -11.61889934539795, "global_step": 237422, "epoch": 1413} {"train_loss": -11.944114685058594, "global_step": 237423, "epoch": 1413} {"train_loss": -11.825422286987305, "global_step": 237424, "epoch": 1413} {"train_loss": -12.013240814208984, "global_step": 237425, "epoch": 1413} {"train_loss": -11.926498413085938, "global_step": 237426, "epoch": 1413} {"train_loss": -11.948570251464844, "global_step": 237427, "epoch": 1413} {"train_loss": -12.025883674621582, "global_step": 237428, "epoch": 1413} {"train_loss": -12.003057479858398, "global_step": 237429, "epoch": 1413} {"train_loss": -11.884407043457031, "global_step": 237430, "epoch": 1413} {"train_loss": -12.11512279510498, "global_step": 237431, "epoch": 1413} {"train_loss": -11.877716064453125, "global_step": 237432, "epoch": 1413} {"train_loss": -11.895855903625488, "global_step": 237433, "epoch": 1413} {"train_loss": -11.949304580688477, "global_step": 237434, "epoch": 1413} {"train_loss": -12.000791549682617, "global_step": 237435, "epoch": 1413} {"train_loss": -12.104616165161133, "global_step": 237436, "epoch": 1413} {"train_loss": -11.99919605255127, "global_step": 237437, "epoch": 1413} {"train_loss": -12.129636764526367, "global_step": 237438, "epoch": 1413} {"train_loss": -12.197286605834961, "global_step": 237439, "epoch": 1413} {"train_loss": -11.998335838317871, "global_step": 237440, "epoch": 1413} {"train_loss": -12.084272384643555, "global_step": 237441, "epoch": 1413} {"train_loss": -11.841520309448242, "global_step": 237442, "epoch": 1413} {"train_loss": -11.838769912719727, "global_step": 237443, "epoch": 1413} {"train_loss": -11.836443901062012, "global_step": 237444, "epoch": 1413} {"train_loss": -12.218269348144531, "global_step": 237445, "epoch": 1413} {"train_loss": -11.621472358703613, "global_step": 237446, "epoch": 1413} {"train_loss": -11.73460578918457, "global_step": 237447, "epoch": 1413} {"train_loss": -12.015390396118164, "global_step": 237448, "epoch": 1413} {"train_loss": -11.721426010131836, "global_step": 237449, "epoch": 1413} {"train_loss": -11.883886337280273, "global_step": 237450, "epoch": 1413} {"train_loss": -11.948443412780762, "global_step": 237451, "epoch": 1413} {"train_loss": -11.807053565979004, "global_step": 237452, "epoch": 1413} {"train_loss": -11.899085998535156, "global_step": 237453, "epoch": 1413} {"train_loss": -12.120058059692383, "global_step": 237454, "epoch": 1413} {"train_loss": -11.877420425415039, "global_step": 237455, "epoch": 1413} {"train_loss": -11.774640083312988, "global_step": 237456, "epoch": 1413} {"train_loss": -11.869529724121094, "global_step": 237457, "epoch": 1413} {"train_loss": -11.948022842407227, "global_step": 237458, "epoch": 1413} {"train_loss": -11.676570892333984, "global_step": 237459, "epoch": 1413} {"train_loss": -11.687557220458984, "global_step": 237460, "epoch": 1413} {"train_loss": -11.788089752197266, "global_step": 237461, "epoch": 1413} {"train_loss": -11.912795066833496, "global_step": 237462, "epoch": 1413} {"train_loss": -11.659737586975098, "global_step": 237463, "epoch": 1413} {"train_loss": -11.869094848632812, "global_step": 237464, "epoch": 1413} {"train_loss": -11.894495010375977, "global_step": 237465, "epoch": 1413} {"train_loss": -11.803682327270508, "global_step": 237466, "epoch": 1413} {"train_loss": -11.963123321533203, "global_step": 237467, "epoch": 1413} {"train_loss": -11.603469848632812, "global_step": 237468, "epoch": 1413} {"train_loss": -11.99842643737793, "global_step": 237469, "epoch": 1413} {"train_loss": -11.78683090209961, "global_step": 237470, "epoch": 1413} {"train_loss": -11.622884750366211, "global_step": 237471, "epoch": 1413} {"train_loss": -11.742643356323242, "global_step": 237472, "epoch": 1413} {"train_loss": -11.406984329223633, "global_step": 237473, "epoch": 1413} {"train_loss": -11.348484992980957, "global_step": 237474, "epoch": 1413} {"train_loss": -11.679553031921387, "global_step": 237475, "epoch": 1413} {"train_loss": -11.768571853637695, "global_step": 237476, "epoch": 1413} {"train_loss": -11.588512420654297, "global_step": 237477, "epoch": 1413} {"train_loss": -11.588937759399414, "global_step": 237478, "epoch": 1413} {"train_loss": -11.841440200805664, "global_step": 237479, "epoch": 1413} {"train_loss": -11.483187675476074, "global_step": 237480, "epoch": 1413} {"train_loss": -11.205978393554688, "global_step": 237481, "epoch": 1413} {"train_loss": -11.194249153137207, "global_step": 237482, "epoch": 1413} {"train_loss": -10.700736999511719, "global_step": 237483, "epoch": 1413} {"train_loss": -10.836404800415039, "global_step": 237484, "epoch": 1413} {"train_loss": -11.2317476272583, "global_step": 237485, "epoch": 1413} {"train_loss": -11.248315811157227, "global_step": 237486, "epoch": 1413} {"train_loss": -9.353811264038086, "global_step": 237487, "epoch": 1413} {"train_loss": -10.567548751831055, "global_step": 237488, "epoch": 1413} {"train_loss": -8.09052562713623, "global_step": 237489, "epoch": 1413} {"train_loss": -7.240233421325684, "global_step": 237490, "epoch": 1413} {"train_loss": -6.4442925453186035, "global_step": 237491, "epoch": 1413} {"train_loss": -8.974621772766113, "global_step": 237492, "epoch": 1413} {"train_loss": -9.548303604125977, "global_step": 237493, "epoch": 1413} {"train_loss": -9.298291206359863, "global_step": 237494, "epoch": 1413} {"train_loss": -9.473838806152344, "global_step": 237495, "epoch": 1413} {"train_loss": -9.922958374023438, "global_step": 237496, "epoch": 1413} {"train_loss": -9.192737579345703, "global_step": 237497, "epoch": 1413} {"train_loss": -10.086188316345215, "global_step": 237498, "epoch": 1413} {"train_loss": -10.856550216674805, "global_step": 237499, "epoch": 1413} {"train_loss": -9.346145629882812, "global_step": 237500, "epoch": 1413} {"train_loss": -10.9691801071167, "global_step": 237501, "epoch": 1413} {"train_loss": -10.641536712646484, "global_step": 237502, "epoch": 1413} {"train_loss": -10.66763973236084, "global_step": 237503, "epoch": 1413} {"train_loss": -10.993273735046387, "global_step": 237504, "epoch": 1413} {"train_loss": -10.224588394165039, "global_step": 237505, "epoch": 1413} {"train_loss": -10.65240478515625, "global_step": 237506, "epoch": 1413} {"train_loss": -11.089680671691895, "global_step": 237507, "epoch": 1413} {"train_loss": -10.832022666931152, "global_step": 237508, "epoch": 1413} {"train_loss": -10.956942558288574, "global_step": 237509, "epoch": 1413} {"train_loss": -10.486611366271973, "global_step": 237510, "epoch": 1413} {"train_loss": -10.924501419067383, "global_step": 237511, "epoch": 1413} {"train_loss": -10.873147964477539, "global_step": 237512, "epoch": 1413} {"train_loss": -11.30897331237793, "global_step": 237513, "epoch": 1413} {"train_loss": -11.13597297668457, "global_step": 237514, "epoch": 1413} {"train_loss": -11.236217498779297, "global_step": 237515, "epoch": 1413} {"train_loss": -10.963571548461914, "global_step": 237516, "epoch": 1413} {"train_loss": -11.165279388427734, "global_step": 237517, "epoch": 1413} {"train_loss": -11.216925621032715, "global_step": 237518, "epoch": 1413} {"train_loss": -11.123701095581055, "global_step": 237519, "epoch": 1413} {"train_loss": -10.777437210083008, "global_step": 237520, "epoch": 1413} {"train_loss": -11.185884475708008, "global_step": 237521, "epoch": 1413} {"train_loss": -10.938594818115234, "global_step": 237522, "epoch": 1413} {"train_loss": -11.493486404418945, "global_step": 237523, "epoch": 1413} {"train_loss": -11.055272102355957, "global_step": 237524, "epoch": 1413} {"train_loss": -11.194122314453125, "global_step": 237525, "epoch": 1413} {"train_loss": -11.14228630065918, "global_step": 237526, "epoch": 1413} {"train_loss": -10.658507347106934, "global_step": 237527, "epoch": 1413} {"train_loss": -11.506121635437012, "global_step": 237528, "epoch": 1413} {"train_loss": -11.2371826171875, "global_step": 237529, "epoch": 1413} {"train_loss": -11.465628623962402, "global_step": 237530, "epoch": 1413} {"train_loss": -11.373468399047852, "global_step": 237531, "epoch": 1413} {"train_loss": -11.297500610351562, "global_step": 237532, "epoch": 1413} {"train_loss": -11.342561721801758, "global_step": 237533, "epoch": 1413} {"train_loss": -11.585853576660156, "global_step": 237534, "epoch": 1413} {"train_loss": -10.991582870483398, "global_step": 237535, "epoch": 1413} {"train_loss": -11.602863311767578, "global_step": 237536, "epoch": 1413} {"train_loss": -10.929944038391113, "global_step": 237537, "epoch": 1413} {"train_loss": -11.451934814453125, "global_step": 237538, "epoch": 1413} {"train_loss": -11.181303024291992, "global_step": 237539, "epoch": 1413} {"train_loss": -11.457481384277344, "global_step": 237540, "epoch": 1413} {"train_loss": -11.587388038635254, "global_step": 237541, "epoch": 1413} {"train_loss": -11.224624633789062, "global_step": 237542, "epoch": 1413} {"train_loss": -11.589521408081055, "global_step": 237543, "epoch": 1413} {"train_loss": -11.37934398651123, "global_step": 237544, "epoch": 1413} {"train_loss": -11.338600158691406, "global_step": 237545, "epoch": 1413} {"train_loss": -11.497377395629883, "global_step": 237546, "epoch": 1413} {"train_loss": -11.452211380004883, "global_step": 237547, "epoch": 1413} {"train_loss": -11.373705863952637, "global_step": 237548, "epoch": 1413} {"train_loss": -11.357100486755371, "global_step": 237549, "epoch": 1413} {"train_loss": -11.12789535522461, "global_step": 237550, "epoch": 1413} {"train_loss": -11.345092151846204, "global_step": 237551, "epoch": 1413, "val_loss": 256982.921875} {"train_loss": -11.368555068969727, "global_step": 237552, "epoch": 1414} {"train_loss": -11.42230224609375, "global_step": 237553, "epoch": 1414} {"train_loss": -11.634912490844727, "global_step": 237554, "epoch": 1414} {"train_loss": -11.341525077819824, "global_step": 237555, "epoch": 1414} {"train_loss": -11.507526397705078, "global_step": 237556, "epoch": 1414} {"train_loss": -11.677314758300781, "global_step": 237557, "epoch": 1414} {"train_loss": -11.949823379516602, "global_step": 237558, "epoch": 1414} {"train_loss": -11.641936302185059, "global_step": 237559, "epoch": 1414} {"train_loss": -11.895718574523926, "global_step": 237560, "epoch": 1414} {"train_loss": -11.68373966217041, "global_step": 237561, "epoch": 1414} {"train_loss": -11.578845977783203, "global_step": 237562, "epoch": 1414} {"train_loss": -11.959955215454102, "global_step": 237563, "epoch": 1414} {"train_loss": -11.635274887084961, "global_step": 237564, "epoch": 1414} {"train_loss": -11.856945037841797, "global_step": 237565, "epoch": 1414} {"train_loss": -11.639890670776367, "global_step": 237566, "epoch": 1414} {"train_loss": -11.80687427520752, "global_step": 237567, "epoch": 1414} {"train_loss": -11.514890670776367, "global_step": 237568, "epoch": 1414} {"train_loss": -11.742100715637207, "global_step": 237569, "epoch": 1414} {"train_loss": -11.809257507324219, "global_step": 237570, "epoch": 1414} {"train_loss": -11.665631294250488, "global_step": 237571, "epoch": 1414} {"train_loss": -11.71609115600586, "global_step": 237572, "epoch": 1414} {"train_loss": -11.6716890335083, "global_step": 237573, "epoch": 1414} {"train_loss": -11.392498016357422, "global_step": 237574, "epoch": 1414} {"train_loss": -10.668646812438965, "global_step": 237575, "epoch": 1414} {"train_loss": -11.59153938293457, "global_step": 237576, "epoch": 1414} {"train_loss": -11.067681312561035, "global_step": 237577, "epoch": 1414} {"train_loss": -11.60239028930664, "global_step": 237578, "epoch": 1414} {"train_loss": -11.424223899841309, "global_step": 237579, "epoch": 1414} {"train_loss": -11.2449951171875, "global_step": 237580, "epoch": 1414} {"train_loss": -11.670904159545898, "global_step": 237581, "epoch": 1414} {"train_loss": -11.253856658935547, "global_step": 237582, "epoch": 1414} {"train_loss": -11.384523391723633, "global_step": 237583, "epoch": 1414} {"train_loss": -10.950439453125, "global_step": 237584, "epoch": 1414} {"train_loss": -11.396465301513672, "global_step": 237585, "epoch": 1414} {"train_loss": -11.588154792785645, "global_step": 237586, "epoch": 1414} {"train_loss": -11.556108474731445, "global_step": 237587, "epoch": 1414} {"train_loss": -11.521456718444824, "global_step": 237588, "epoch": 1414} {"train_loss": -11.332527160644531, "global_step": 237589, "epoch": 1414} {"train_loss": -11.69498062133789, "global_step": 237590, "epoch": 1414} {"train_loss": -11.563582420349121, "global_step": 237591, "epoch": 1414} {"train_loss": -11.84083080291748, "global_step": 237592, "epoch": 1414} {"train_loss": -11.823251724243164, "global_step": 237593, "epoch": 1414} {"train_loss": -11.880643844604492, "global_step": 237594, "epoch": 1414} {"train_loss": -11.95987606048584, "global_step": 237595, "epoch": 1414} {"train_loss": -11.945392608642578, "global_step": 237596, "epoch": 1414} {"train_loss": -11.86172103881836, "global_step": 237597, "epoch": 1414} {"train_loss": -11.86166000366211, "global_step": 237598, "epoch": 1414} {"train_loss": -11.957633972167969, "global_step": 237599, "epoch": 1414} {"train_loss": -11.90505599975586, "global_step": 237600, "epoch": 1414} {"train_loss": -11.53506851196289, "global_step": 237601, "epoch": 1414} {"train_loss": -11.932018280029297, "global_step": 237602, "epoch": 1414} {"train_loss": -11.281586647033691, "global_step": 237603, "epoch": 1414} {"train_loss": -11.579888343811035, "global_step": 237604, "epoch": 1414} {"train_loss": -11.509721755981445, "global_step": 237605, "epoch": 1414} {"train_loss": -11.96078872680664, "global_step": 237606, "epoch": 1414} {"train_loss": -11.355990409851074, "global_step": 237607, "epoch": 1414} {"train_loss": -11.950364112854004, "global_step": 237608, "epoch": 1414} {"train_loss": -11.293744087219238, "global_step": 237609, "epoch": 1414} {"train_loss": -11.085153579711914, "global_step": 237610, "epoch": 1414} {"train_loss": -11.282732009887695, "global_step": 237611, "epoch": 1414} {"train_loss": -10.939363479614258, "global_step": 237612, "epoch": 1414} {"train_loss": -11.842655181884766, "global_step": 237613, "epoch": 1414} {"train_loss": -11.186992645263672, "global_step": 237614, "epoch": 1414} {"train_loss": -11.837811470031738, "global_step": 237615, "epoch": 1414} {"train_loss": -11.65340805053711, "global_step": 237616, "epoch": 1414} {"train_loss": -11.677709579467773, "global_step": 237617, "epoch": 1414} {"train_loss": -11.679640769958496, "global_step": 237618, "epoch": 1414} {"train_loss": -11.367525100708008, "global_step": 237619, "epoch": 1414} {"train_loss": -11.622718811035156, "global_step": 237620, "epoch": 1414} {"train_loss": -11.28603458404541, "global_step": 237621, "epoch": 1414} {"train_loss": -11.431008338928223, "global_step": 237622, "epoch": 1414} {"train_loss": -11.851055145263672, "global_step": 237623, "epoch": 1414} {"train_loss": -11.690645217895508, "global_step": 237624, "epoch": 1414} {"train_loss": -11.941025733947754, "global_step": 237625, "epoch": 1414} {"train_loss": -11.403450965881348, "global_step": 237626, "epoch": 1414} {"train_loss": -11.603123664855957, "global_step": 237627, "epoch": 1414} {"train_loss": -11.822622299194336, "global_step": 237628, "epoch": 1414} {"train_loss": -11.369950294494629, "global_step": 237629, "epoch": 1414} {"train_loss": -11.577554702758789, "global_step": 237630, "epoch": 1414} {"train_loss": -11.793580055236816, "global_step": 237631, "epoch": 1414} {"train_loss": -11.696039199829102, "global_step": 237632, "epoch": 1414} {"train_loss": -11.520970344543457, "global_step": 237633, "epoch": 1414} {"train_loss": -12.078184127807617, "global_step": 237634, "epoch": 1414} {"train_loss": -11.622411727905273, "global_step": 237635, "epoch": 1414} {"train_loss": -11.53952407836914, "global_step": 237636, "epoch": 1414} {"train_loss": -11.867959022521973, "global_step": 237637, "epoch": 1414} {"train_loss": -11.708157539367676, "global_step": 237638, "epoch": 1414} {"train_loss": -11.935074806213379, "global_step": 237639, "epoch": 1414} {"train_loss": -11.750951766967773, "global_step": 237640, "epoch": 1414} {"train_loss": -11.592981338500977, "global_step": 237641, "epoch": 1414} {"train_loss": -11.788900375366211, "global_step": 237642, "epoch": 1414} {"train_loss": -11.951909065246582, "global_step": 237643, "epoch": 1414} {"train_loss": -11.687901496887207, "global_step": 237644, "epoch": 1414} {"train_loss": -11.954055786132812, "global_step": 237645, "epoch": 1414} {"train_loss": -11.937699317932129, "global_step": 237646, "epoch": 1414} {"train_loss": -11.847336769104004, "global_step": 237647, "epoch": 1414} {"train_loss": -11.768863677978516, "global_step": 237648, "epoch": 1414} {"train_loss": -11.712394714355469, "global_step": 237649, "epoch": 1414} {"train_loss": -12.15919303894043, "global_step": 237650, "epoch": 1414} {"train_loss": -11.90408992767334, "global_step": 237651, "epoch": 1414} {"train_loss": -11.627401351928711, "global_step": 237652, "epoch": 1414} {"train_loss": -11.474464416503906, "global_step": 237653, "epoch": 1414} {"train_loss": -11.993858337402344, "global_step": 237654, "epoch": 1414} {"train_loss": -11.719754219055176, "global_step": 237655, "epoch": 1414} {"train_loss": -12.011406898498535, "global_step": 237656, "epoch": 1414} {"train_loss": -11.683805465698242, "global_step": 237657, "epoch": 1414} {"train_loss": -12.126983642578125, "global_step": 237658, "epoch": 1414} {"train_loss": -11.311723709106445, "global_step": 237659, "epoch": 1414} {"train_loss": -11.634939193725586, "global_step": 237660, "epoch": 1414} {"train_loss": -11.88075065612793, "global_step": 237661, "epoch": 1414} {"train_loss": -11.927558898925781, "global_step": 237662, "epoch": 1414} {"train_loss": -11.202871322631836, "global_step": 237663, "epoch": 1414} {"train_loss": -11.584894180297852, "global_step": 237664, "epoch": 1414} {"train_loss": -11.743152618408203, "global_step": 237665, "epoch": 1414} {"train_loss": -11.727439880371094, "global_step": 237666, "epoch": 1414} {"train_loss": -11.655637741088867, "global_step": 237667, "epoch": 1414} {"train_loss": -11.913151741027832, "global_step": 237668, "epoch": 1414} {"train_loss": -10.98702335357666, "global_step": 237669, "epoch": 1414} {"train_loss": -11.793536186218262, "global_step": 237670, "epoch": 1414} {"train_loss": -11.756092071533203, "global_step": 237671, "epoch": 1414} {"train_loss": -11.579387664794922, "global_step": 237672, "epoch": 1414} {"train_loss": -11.728902816772461, "global_step": 237673, "epoch": 1414} {"train_loss": -11.464048385620117, "global_step": 237674, "epoch": 1414} {"train_loss": -11.757792472839355, "global_step": 237675, "epoch": 1414} {"train_loss": -11.37534236907959, "global_step": 237676, "epoch": 1414} {"train_loss": -11.185009956359863, "global_step": 237677, "epoch": 1414} {"train_loss": -11.486316680908203, "global_step": 237678, "epoch": 1414} {"train_loss": -10.950187683105469, "global_step": 237679, "epoch": 1414} {"train_loss": -9.668119430541992, "global_step": 237680, "epoch": 1414} {"train_loss": -11.226478576660156, "global_step": 237681, "epoch": 1414} {"train_loss": -10.104907989501953, "global_step": 237682, "epoch": 1414} {"train_loss": -10.592758178710938, "global_step": 237683, "epoch": 1414} {"train_loss": -11.288063049316406, "global_step": 237684, "epoch": 1414} {"train_loss": -11.038745880126953, "global_step": 237685, "epoch": 1414} {"train_loss": -10.375743865966797, "global_step": 237686, "epoch": 1414} {"train_loss": -11.608762741088867, "global_step": 237687, "epoch": 1414} {"train_loss": -9.888605117797852, "global_step": 237688, "epoch": 1414} {"train_loss": -11.349308013916016, "global_step": 237689, "epoch": 1414} {"train_loss": -10.774410247802734, "global_step": 237690, "epoch": 1414} {"train_loss": -10.887012481689453, "global_step": 237691, "epoch": 1414} {"train_loss": -11.081080436706543, "global_step": 237692, "epoch": 1414} {"train_loss": -11.332978248596191, "global_step": 237693, "epoch": 1414} {"train_loss": -11.87179183959961, "global_step": 237694, "epoch": 1414} {"train_loss": -11.638973236083984, "global_step": 237695, "epoch": 1414} {"train_loss": -11.849525451660156, "global_step": 237696, "epoch": 1414} {"train_loss": -11.594512939453125, "global_step": 237697, "epoch": 1414} {"train_loss": -11.411199569702148, "global_step": 237698, "epoch": 1414} {"train_loss": -11.63875675201416, "global_step": 237699, "epoch": 1414} {"train_loss": -11.682740211486816, "global_step": 237700, "epoch": 1414} {"train_loss": -11.517928123474121, "global_step": 237701, "epoch": 1414} {"train_loss": -11.668082237243652, "global_step": 237702, "epoch": 1414} {"train_loss": -11.612814903259277, "global_step": 237703, "epoch": 1414} {"train_loss": -11.482381820678711, "global_step": 237704, "epoch": 1414} {"train_loss": -11.570158958435059, "global_step": 237705, "epoch": 1414} {"train_loss": -11.67175579071045, "global_step": 237706, "epoch": 1414} {"train_loss": -11.893178939819336, "global_step": 237707, "epoch": 1414} {"train_loss": -11.706162452697754, "global_step": 237708, "epoch": 1414} {"train_loss": -11.863964080810547, "global_step": 237709, "epoch": 1414} {"train_loss": -11.867055892944336, "global_step": 237710, "epoch": 1414} {"train_loss": -11.880415916442871, "global_step": 237711, "epoch": 1414} {"train_loss": -11.812591552734375, "global_step": 237712, "epoch": 1414} {"train_loss": -11.746284484863281, "global_step": 237713, "epoch": 1414} {"train_loss": -11.929393768310547, "global_step": 237714, "epoch": 1414} {"train_loss": -11.747936248779297, "global_step": 237715, "epoch": 1414} {"train_loss": -11.760055541992188, "global_step": 237716, "epoch": 1414} {"train_loss": -11.689401626586914, "global_step": 237717, "epoch": 1414} {"train_loss": -11.814088821411133, "global_step": 237718, "epoch": 1414} {"train_loss": -11.572508687064762, "global_step": 237719, "epoch": 1414, "val_loss": 264790.375} {"train_loss": -11.684524536132812, "global_step": 237720, "epoch": 1415} {"train_loss": -11.996721267700195, "global_step": 237721, "epoch": 1415} {"train_loss": -11.926937103271484, "global_step": 237722, "epoch": 1415} {"train_loss": -11.872983932495117, "global_step": 237723, "epoch": 1415} {"train_loss": -11.72011947631836, "global_step": 237724, "epoch": 1415} {"train_loss": -12.06609058380127, "global_step": 237725, "epoch": 1415} {"train_loss": -12.069499969482422, "global_step": 237726, "epoch": 1415} {"train_loss": -11.899246215820312, "global_step": 237727, "epoch": 1415} {"train_loss": -11.892032623291016, "global_step": 237728, "epoch": 1415} {"train_loss": -11.925392150878906, "global_step": 237729, "epoch": 1415} {"train_loss": -11.707877159118652, "global_step": 237730, "epoch": 1415} {"train_loss": -12.179468154907227, "global_step": 237731, "epoch": 1415} {"train_loss": -11.921229362487793, "global_step": 237732, "epoch": 1415} {"train_loss": -11.945005416870117, "global_step": 237733, "epoch": 1415} {"train_loss": -12.053621292114258, "global_step": 237734, "epoch": 1415} {"train_loss": -12.064981460571289, "global_step": 237735, "epoch": 1415} {"train_loss": -11.928987503051758, "global_step": 237736, "epoch": 1415} {"train_loss": -12.121440887451172, "global_step": 237737, "epoch": 1415} {"train_loss": -12.154397964477539, "global_step": 237738, "epoch": 1415} {"train_loss": -12.007492065429688, "global_step": 237739, "epoch": 1415} {"train_loss": -12.090490341186523, "global_step": 237740, "epoch": 1415} {"train_loss": -11.995479583740234, "global_step": 237741, "epoch": 1415} {"train_loss": -12.166156768798828, "global_step": 237742, "epoch": 1415} {"train_loss": -11.866904258728027, "global_step": 237743, "epoch": 1415} {"train_loss": -12.133064270019531, "global_step": 237744, "epoch": 1415} {"train_loss": -12.054056167602539, "global_step": 237745, "epoch": 1415} {"train_loss": -12.060813903808594, "global_step": 237746, "epoch": 1415} {"train_loss": -12.047323226928711, "global_step": 237747, "epoch": 1415} {"train_loss": -12.057022094726562, "global_step": 237748, "epoch": 1415} {"train_loss": -12.08052921295166, "global_step": 237749, "epoch": 1415} {"train_loss": -12.169486999511719, "global_step": 237750, "epoch": 1415} {"train_loss": -12.049699783325195, "global_step": 237751, "epoch": 1415} {"train_loss": -11.903495788574219, "global_step": 237752, "epoch": 1415} {"train_loss": -12.027877807617188, "global_step": 237753, "epoch": 1415} {"train_loss": -12.038460731506348, "global_step": 237754, "epoch": 1415} {"train_loss": -12.169227600097656, "global_step": 237755, "epoch": 1415} {"train_loss": -12.022595405578613, "global_step": 237756, "epoch": 1415} {"train_loss": -11.985782623291016, "global_step": 237757, "epoch": 1415} {"train_loss": -11.613506317138672, "global_step": 237758, "epoch": 1415} {"train_loss": -11.887755393981934, "global_step": 237759, "epoch": 1415} {"train_loss": -11.69660758972168, "global_step": 237760, "epoch": 1415} {"train_loss": -11.667264938354492, "global_step": 237761, "epoch": 1415} {"train_loss": -11.716763496398926, "global_step": 237762, "epoch": 1415} {"train_loss": -11.435977935791016, "global_step": 237763, "epoch": 1415} {"train_loss": -11.550100326538086, "global_step": 237764, "epoch": 1415} {"train_loss": -12.016895294189453, "global_step": 237765, "epoch": 1415} {"train_loss": -10.926956176757812, "global_step": 237766, "epoch": 1415} {"train_loss": -10.890704154968262, "global_step": 237767, "epoch": 1415} {"train_loss": -11.332612991333008, "global_step": 237768, "epoch": 1415} {"train_loss": -11.245079040527344, "global_step": 237769, "epoch": 1415} {"train_loss": -11.93800163269043, "global_step": 237770, "epoch": 1415} {"train_loss": -11.140876770019531, "global_step": 237771, "epoch": 1415} {"train_loss": -11.122062683105469, "global_step": 237772, "epoch": 1415} {"train_loss": -11.134235382080078, "global_step": 237773, "epoch": 1415} {"train_loss": -11.543558120727539, "global_step": 237774, "epoch": 1415} {"train_loss": -11.371709823608398, "global_step": 237775, "epoch": 1415} {"train_loss": -9.723033905029297, "global_step": 237776, "epoch": 1415} {"train_loss": -10.65616226196289, "global_step": 237777, "epoch": 1415} {"train_loss": -11.068984031677246, "global_step": 237778, "epoch": 1415} {"train_loss": -9.79849910736084, "global_step": 237779, "epoch": 1415} {"train_loss": -10.589052200317383, "global_step": 237780, "epoch": 1415} {"train_loss": -10.176389694213867, "global_step": 237781, "epoch": 1415} {"train_loss": -10.512911796569824, "global_step": 237782, "epoch": 1415} {"train_loss": -11.043500900268555, "global_step": 237783, "epoch": 1415} {"train_loss": -10.069005966186523, "global_step": 237784, "epoch": 1415} {"train_loss": -9.959892272949219, "global_step": 237785, "epoch": 1415} {"train_loss": -9.500345230102539, "global_step": 237786, "epoch": 1415} {"train_loss": -10.586368560791016, "global_step": 237787, "epoch": 1415} {"train_loss": -9.069732666015625, "global_step": 237788, "epoch": 1415} {"train_loss": -8.309783935546875, "global_step": 237789, "epoch": 1415} {"train_loss": -10.244342803955078, "global_step": 237790, "epoch": 1415} {"train_loss": -8.278522491455078, "global_step": 237791, "epoch": 1415} {"train_loss": -8.819067001342773, "global_step": 237792, "epoch": 1415} {"train_loss": -9.040665626525879, "global_step": 237793, "epoch": 1415} {"train_loss": -9.16209602355957, "global_step": 237794, "epoch": 1415} {"train_loss": -8.976849555969238, "global_step": 237795, "epoch": 1415} {"train_loss": -10.41530990600586, "global_step": 237796, "epoch": 1415} {"train_loss": -9.336467742919922, "global_step": 237797, "epoch": 1415} {"train_loss": -10.512413024902344, "global_step": 237798, "epoch": 1415} {"train_loss": -9.577016830444336, "global_step": 237799, "epoch": 1415} {"train_loss": -11.142570495605469, "global_step": 237800, "epoch": 1415} {"train_loss": -10.500347137451172, "global_step": 237801, "epoch": 1415} {"train_loss": -11.135786056518555, "global_step": 237802, "epoch": 1415} {"train_loss": -10.531177520751953, "global_step": 237803, "epoch": 1415} {"train_loss": -11.058252334594727, "global_step": 237804, "epoch": 1415} {"train_loss": -10.59948444366455, "global_step": 237805, "epoch": 1415} {"train_loss": -10.884602546691895, "global_step": 237806, "epoch": 1415} {"train_loss": -10.533451080322266, "global_step": 237807, "epoch": 1415} {"train_loss": -11.205777168273926, "global_step": 237808, "epoch": 1415} {"train_loss": -10.86801815032959, "global_step": 237809, "epoch": 1415} {"train_loss": -11.032194137573242, "global_step": 237810, "epoch": 1415} {"train_loss": -11.201061248779297, "global_step": 237811, "epoch": 1415} {"train_loss": -10.782402038574219, "global_step": 237812, "epoch": 1415} {"train_loss": -10.827971458435059, "global_step": 237813, "epoch": 1415} {"train_loss": -11.194866180419922, "global_step": 237814, "epoch": 1415} {"train_loss": -10.862051963806152, "global_step": 237815, "epoch": 1415} {"train_loss": -10.65013313293457, "global_step": 237816, "epoch": 1415} {"train_loss": -11.45165729522705, "global_step": 237817, "epoch": 1415} {"train_loss": -10.577770233154297, "global_step": 237818, "epoch": 1415} {"train_loss": -11.248737335205078, "global_step": 237819, "epoch": 1415} {"train_loss": -11.144590377807617, "global_step": 237820, "epoch": 1415} {"train_loss": -11.219099044799805, "global_step": 237821, "epoch": 1415} {"train_loss": -11.33795166015625, "global_step": 237822, "epoch": 1415} {"train_loss": -11.388631820678711, "global_step": 237823, "epoch": 1415} {"train_loss": -11.392522811889648, "global_step": 237824, "epoch": 1415} {"train_loss": -11.348037719726562, "global_step": 237825, "epoch": 1415} {"train_loss": -11.500777244567871, "global_step": 237826, "epoch": 1415} {"train_loss": -11.53559684753418, "global_step": 237827, "epoch": 1415} {"train_loss": -11.30668830871582, "global_step": 237828, "epoch": 1415} {"train_loss": -11.504176139831543, "global_step": 237829, "epoch": 1415} {"train_loss": -11.567642211914062, "global_step": 237830, "epoch": 1415} {"train_loss": -11.414887428283691, "global_step": 237831, "epoch": 1415} {"train_loss": -11.496845245361328, "global_step": 237832, "epoch": 1415} {"train_loss": -11.616924285888672, "global_step": 237833, "epoch": 1415} {"train_loss": -11.410810470581055, "global_step": 237834, "epoch": 1415} {"train_loss": -11.371618270874023, "global_step": 237835, "epoch": 1415} {"train_loss": -11.574207305908203, "global_step": 237836, "epoch": 1415} {"train_loss": -11.672774314880371, "global_step": 237837, "epoch": 1415} {"train_loss": -11.582928657531738, "global_step": 237838, "epoch": 1415} {"train_loss": -11.851566314697266, "global_step": 237839, "epoch": 1415} {"train_loss": -11.527130126953125, "global_step": 237840, "epoch": 1415} {"train_loss": -11.685770034790039, "global_step": 237841, "epoch": 1415} {"train_loss": -11.673042297363281, "global_step": 237842, "epoch": 1415} {"train_loss": -11.627519607543945, "global_step": 237843, "epoch": 1415} {"train_loss": -11.58681869506836, "global_step": 237844, "epoch": 1415} {"train_loss": -11.753232955932617, "global_step": 237845, "epoch": 1415} {"train_loss": -11.769433975219727, "global_step": 237846, "epoch": 1415} {"train_loss": -11.768535614013672, "global_step": 237847, "epoch": 1415} {"train_loss": -11.624224662780762, "global_step": 237848, "epoch": 1415} {"train_loss": -11.506099700927734, "global_step": 237849, "epoch": 1415} {"train_loss": -11.83692455291748, "global_step": 237850, "epoch": 1415} {"train_loss": -11.804912567138672, "global_step": 237851, "epoch": 1415} {"train_loss": -11.674541473388672, "global_step": 237852, "epoch": 1415} {"train_loss": -11.79731273651123, "global_step": 237853, "epoch": 1415} {"train_loss": -11.525047302246094, "global_step": 237854, "epoch": 1415} {"train_loss": -11.86536979675293, "global_step": 237855, "epoch": 1415} {"train_loss": -11.739180564880371, "global_step": 237856, "epoch": 1415} {"train_loss": -11.699907302856445, "global_step": 237857, "epoch": 1415} {"train_loss": -11.943704605102539, "global_step": 237858, "epoch": 1415} {"train_loss": -11.895709991455078, "global_step": 237859, "epoch": 1415} {"train_loss": -12.039909362792969, "global_step": 237860, "epoch": 1415} {"train_loss": -11.798273086547852, "global_step": 237861, "epoch": 1415} {"train_loss": -12.06519889831543, "global_step": 237862, "epoch": 1415} {"train_loss": -11.943859100341797, "global_step": 237863, "epoch": 1415} {"train_loss": -11.99612045288086, "global_step": 237864, "epoch": 1415} {"train_loss": -11.95187759399414, "global_step": 237865, "epoch": 1415} {"train_loss": -12.057778358459473, "global_step": 237866, "epoch": 1415} {"train_loss": -11.928624153137207, "global_step": 237867, "epoch": 1415} {"train_loss": -11.890405654907227, "global_step": 237868, "epoch": 1415} {"train_loss": -11.860624313354492, "global_step": 237869, "epoch": 1415} {"train_loss": -11.760978698730469, "global_step": 237870, "epoch": 1415} {"train_loss": -11.852180480957031, "global_step": 237871, "epoch": 1415} {"train_loss": -11.894125938415527, "global_step": 237872, "epoch": 1415} {"train_loss": -12.047786712646484, "global_step": 237873, "epoch": 1415} {"train_loss": -12.063023567199707, "global_step": 237874, "epoch": 1415} {"train_loss": -11.905778884887695, "global_step": 237875, "epoch": 1415} {"train_loss": -11.787094116210938, "global_step": 237876, "epoch": 1415} {"train_loss": -11.880495071411133, "global_step": 237877, "epoch": 1415} {"train_loss": -11.586776733398438, "global_step": 237878, "epoch": 1415} {"train_loss": -11.558544158935547, "global_step": 237879, "epoch": 1415} {"train_loss": -11.857951164245605, "global_step": 237880, "epoch": 1415} {"train_loss": -11.370950698852539, "global_step": 237881, "epoch": 1415} {"train_loss": -11.174073219299316, "global_step": 237882, "epoch": 1415} {"train_loss": -11.935949325561523, "global_step": 237883, "epoch": 1415} {"train_loss": -11.358270645141602, "global_step": 237884, "epoch": 1415} {"train_loss": -11.434378623962402, "global_step": 237885, "epoch": 1415} {"train_loss": -11.768379211425781, "global_step": 237886, "epoch": 1415} {"train_loss": -11.367190281550089, "global_step": 237887, "epoch": 1415, "val_loss": 262586.375, "train_action_mse_error": 1.4180101156234741} {"train_loss": -11.73546028137207, "global_step": 237888, "epoch": 1416} {"train_loss": -10.841384887695312, "global_step": 237889, "epoch": 1416} {"train_loss": -11.350312232971191, "global_step": 237890, "epoch": 1416} {"train_loss": -11.641380310058594, "global_step": 237891, "epoch": 1416} {"train_loss": -10.078516006469727, "global_step": 237892, "epoch": 1416} {"train_loss": -11.891141891479492, "global_step": 237893, "epoch": 1416} {"train_loss": -11.160745620727539, "global_step": 237894, "epoch": 1416} {"train_loss": -10.402321815490723, "global_step": 237895, "epoch": 1416} {"train_loss": -11.403434753417969, "global_step": 237896, "epoch": 1416} {"train_loss": -11.16026782989502, "global_step": 237897, "epoch": 1416} {"train_loss": -11.522446632385254, "global_step": 237898, "epoch": 1416} {"train_loss": -10.853191375732422, "global_step": 237899, "epoch": 1416} {"train_loss": -9.932796478271484, "global_step": 237900, "epoch": 1416} {"train_loss": -11.557900428771973, "global_step": 237901, "epoch": 1416} {"train_loss": -10.79711627960205, "global_step": 237902, "epoch": 1416} {"train_loss": -9.955955505371094, "global_step": 237903, "epoch": 1416} {"train_loss": -10.40412425994873, "global_step": 237904, "epoch": 1416} {"train_loss": -8.213678359985352, "global_step": 237905, "epoch": 1416} {"train_loss": -9.117042541503906, "global_step": 237906, "epoch": 1416} {"train_loss": -9.970847129821777, "global_step": 237907, "epoch": 1416} {"train_loss": -10.089041709899902, "global_step": 237908, "epoch": 1416} {"train_loss": -9.664796829223633, "global_step": 237909, "epoch": 1416} {"train_loss": -10.32534122467041, "global_step": 237910, "epoch": 1416} {"train_loss": -9.10423469543457, "global_step": 237911, "epoch": 1416} {"train_loss": -11.273626327514648, "global_step": 237912, "epoch": 1416} {"train_loss": -9.652509689331055, "global_step": 237913, "epoch": 1416} {"train_loss": -10.934462547302246, "global_step": 237914, "epoch": 1416} {"train_loss": -11.123207092285156, "global_step": 237915, "epoch": 1416} {"train_loss": -10.658695220947266, "global_step": 237916, "epoch": 1416} {"train_loss": -11.339969635009766, "global_step": 237917, "epoch": 1416} {"train_loss": -11.365918159484863, "global_step": 237918, "epoch": 1416} {"train_loss": -11.368644714355469, "global_step": 237919, "epoch": 1416} {"train_loss": -11.671834945678711, "global_step": 237920, "epoch": 1416} {"train_loss": -11.231874465942383, "global_step": 237921, "epoch": 1416} {"train_loss": -11.325773239135742, "global_step": 237922, "epoch": 1416} {"train_loss": -11.684049606323242, "global_step": 237923, "epoch": 1416} {"train_loss": -11.225055694580078, "global_step": 237924, "epoch": 1416} {"train_loss": -11.746843338012695, "global_step": 237925, "epoch": 1416} {"train_loss": -11.537341117858887, "global_step": 237926, "epoch": 1416} {"train_loss": -11.436958312988281, "global_step": 237927, "epoch": 1416} {"train_loss": -11.586830139160156, "global_step": 237928, "epoch": 1416} {"train_loss": -11.826162338256836, "global_step": 237929, "epoch": 1416} {"train_loss": -11.513151168823242, "global_step": 237930, "epoch": 1416} {"train_loss": -11.77833080291748, "global_step": 237931, "epoch": 1416} {"train_loss": -11.475543022155762, "global_step": 237932, "epoch": 1416} {"train_loss": -11.713360786437988, "global_step": 237933, "epoch": 1416} {"train_loss": -11.640785217285156, "global_step": 237934, "epoch": 1416} {"train_loss": -11.58030891418457, "global_step": 237935, "epoch": 1416} {"train_loss": -11.589608192443848, "global_step": 237936, "epoch": 1416} {"train_loss": -11.645308494567871, "global_step": 237937, "epoch": 1416} {"train_loss": -11.183595657348633, "global_step": 237938, "epoch": 1416} {"train_loss": -11.741390228271484, "global_step": 237939, "epoch": 1416} {"train_loss": -11.741408348083496, "global_step": 237940, "epoch": 1416} {"train_loss": -11.588642120361328, "global_step": 237941, "epoch": 1416} {"train_loss": -11.744626998901367, "global_step": 237942, "epoch": 1416} {"train_loss": -11.686727523803711, "global_step": 237943, "epoch": 1416} {"train_loss": -11.692322731018066, "global_step": 237944, "epoch": 1416} {"train_loss": -11.622522354125977, "global_step": 237945, "epoch": 1416} {"train_loss": -11.706331253051758, "global_step": 237946, "epoch": 1416} {"train_loss": -11.914569854736328, "global_step": 237947, "epoch": 1416} {"train_loss": -11.524636268615723, "global_step": 237948, "epoch": 1416} {"train_loss": -11.782133102416992, "global_step": 237949, "epoch": 1416} {"train_loss": -11.811833381652832, "global_step": 237950, "epoch": 1416} {"train_loss": -11.865642547607422, "global_step": 237951, "epoch": 1416} {"train_loss": -11.618524551391602, "global_step": 237952, "epoch": 1416} {"train_loss": -11.72848892211914, "global_step": 237953, "epoch": 1416} {"train_loss": -11.569283485412598, "global_step": 237954, "epoch": 1416} {"train_loss": -11.637470245361328, "global_step": 237955, "epoch": 1416} {"train_loss": -11.407363891601562, "global_step": 237956, "epoch": 1416} {"train_loss": -11.652449607849121, "global_step": 237957, "epoch": 1416} {"train_loss": -11.328285217285156, "global_step": 237958, "epoch": 1416} {"train_loss": -11.64806842803955, "global_step": 237959, "epoch": 1416} {"train_loss": -11.343986511230469, "global_step": 237960, "epoch": 1416} {"train_loss": -11.638971328735352, "global_step": 237961, "epoch": 1416} {"train_loss": -11.024604797363281, "global_step": 237962, "epoch": 1416} {"train_loss": -11.798273086547852, "global_step": 237963, "epoch": 1416} {"train_loss": -11.022509574890137, "global_step": 237964, "epoch": 1416} {"train_loss": -11.404510498046875, "global_step": 237965, "epoch": 1416} {"train_loss": -11.601778030395508, "global_step": 237966, "epoch": 1416} {"train_loss": -11.636306762695312, "global_step": 237967, "epoch": 1416} {"train_loss": -11.443450927734375, "global_step": 237968, "epoch": 1416} {"train_loss": -11.218639373779297, "global_step": 237969, "epoch": 1416} {"train_loss": -11.558894157409668, "global_step": 237970, "epoch": 1416} {"train_loss": -11.710430145263672, "global_step": 237971, "epoch": 1416} {"train_loss": -11.414056777954102, "global_step": 237972, "epoch": 1416} {"train_loss": -11.346845626831055, "global_step": 237973, "epoch": 1416} {"train_loss": -11.622247695922852, "global_step": 237974, "epoch": 1416} {"train_loss": -11.1112060546875, "global_step": 237975, "epoch": 1416} {"train_loss": -11.452014923095703, "global_step": 237976, "epoch": 1416} {"train_loss": -10.803503036499023, "global_step": 237977, "epoch": 1416} {"train_loss": -11.673778533935547, "global_step": 237978, "epoch": 1416} {"train_loss": -11.004030227661133, "global_step": 237979, "epoch": 1416} {"train_loss": -11.341043472290039, "global_step": 237980, "epoch": 1416} {"train_loss": -11.319989204406738, "global_step": 237981, "epoch": 1416} {"train_loss": -11.616392135620117, "global_step": 237982, "epoch": 1416} {"train_loss": -11.136427879333496, "global_step": 237983, "epoch": 1416} {"train_loss": -11.358123779296875, "global_step": 237984, "epoch": 1416} {"train_loss": -11.178064346313477, "global_step": 237985, "epoch": 1416} {"train_loss": -10.584466934204102, "global_step": 237986, "epoch": 1416} {"train_loss": -11.84134578704834, "global_step": 237987, "epoch": 1416} {"train_loss": -10.72287368774414, "global_step": 237988, "epoch": 1416} {"train_loss": -11.728114128112793, "global_step": 237989, "epoch": 1416} {"train_loss": -11.193397521972656, "global_step": 237990, "epoch": 1416} {"train_loss": -11.270414352416992, "global_step": 237991, "epoch": 1416} {"train_loss": -11.917863845825195, "global_step": 237992, "epoch": 1416} {"train_loss": -11.63908863067627, "global_step": 237993, "epoch": 1416} {"train_loss": -11.795793533325195, "global_step": 237994, "epoch": 1416} {"train_loss": -11.550779342651367, "global_step": 237995, "epoch": 1416} {"train_loss": -11.942961692810059, "global_step": 237996, "epoch": 1416} {"train_loss": -11.513951301574707, "global_step": 237997, "epoch": 1416} {"train_loss": -11.81399154663086, "global_step": 237998, "epoch": 1416} {"train_loss": -11.75533676147461, "global_step": 237999, "epoch": 1416} {"train_loss": -11.997514724731445, "global_step": 238000, "epoch": 1416} {"train_loss": -11.565974235534668, "global_step": 238001, "epoch": 1416} {"train_loss": -12.001384735107422, "global_step": 238002, "epoch": 1416} {"train_loss": -11.340937614440918, "global_step": 238003, "epoch": 1416} {"train_loss": -11.94664478302002, "global_step": 238004, "epoch": 1416} {"train_loss": -11.59118938446045, "global_step": 238005, "epoch": 1416} {"train_loss": -11.795160293579102, "global_step": 238006, "epoch": 1416} {"train_loss": -11.993903160095215, "global_step": 238007, "epoch": 1416} {"train_loss": -11.730547904968262, "global_step": 238008, "epoch": 1416} {"train_loss": -11.548175811767578, "global_step": 238009, "epoch": 1416} {"train_loss": -11.648681640625, "global_step": 238010, "epoch": 1416} {"train_loss": -11.395527839660645, "global_step": 238011, "epoch": 1416} {"train_loss": -12.058111190795898, "global_step": 238012, "epoch": 1416} {"train_loss": -11.468511581420898, "global_step": 238013, "epoch": 1416} {"train_loss": -12.154216766357422, "global_step": 238014, "epoch": 1416} {"train_loss": -11.356147766113281, "global_step": 238015, "epoch": 1416} {"train_loss": -11.666990280151367, "global_step": 238016, "epoch": 1416} {"train_loss": -11.316675186157227, "global_step": 238017, "epoch": 1416} {"train_loss": -11.716259002685547, "global_step": 238018, "epoch": 1416} {"train_loss": -11.617183685302734, "global_step": 238019, "epoch": 1416} {"train_loss": -11.985633850097656, "global_step": 238020, "epoch": 1416} {"train_loss": -11.178804397583008, "global_step": 238021, "epoch": 1416} {"train_loss": -11.838221549987793, "global_step": 238022, "epoch": 1416} {"train_loss": -11.482023239135742, "global_step": 238023, "epoch": 1416} {"train_loss": -11.820381164550781, "global_step": 238024, "epoch": 1416} {"train_loss": -11.53248405456543, "global_step": 238025, "epoch": 1416} {"train_loss": -11.247655868530273, "global_step": 238026, "epoch": 1416} {"train_loss": -11.619132041931152, "global_step": 238027, "epoch": 1416} {"train_loss": -11.7616548538208, "global_step": 238028, "epoch": 1416} {"train_loss": -11.771556854248047, "global_step": 238029, "epoch": 1416} {"train_loss": -10.964767456054688, "global_step": 238030, "epoch": 1416} {"train_loss": -11.571266174316406, "global_step": 238031, "epoch": 1416} {"train_loss": -12.04483413696289, "global_step": 238032, "epoch": 1416} {"train_loss": -11.171121597290039, "global_step": 238033, "epoch": 1416} {"train_loss": -11.379457473754883, "global_step": 238034, "epoch": 1416} {"train_loss": -11.579009056091309, "global_step": 238035, "epoch": 1416} {"train_loss": -11.218015670776367, "global_step": 238036, "epoch": 1416} {"train_loss": -11.688448905944824, "global_step": 238037, "epoch": 1416} {"train_loss": -11.78272533416748, "global_step": 238038, "epoch": 1416} {"train_loss": -11.663161277770996, "global_step": 238039, "epoch": 1416} {"train_loss": -11.916852951049805, "global_step": 238040, "epoch": 1416} {"train_loss": -11.724021911621094, "global_step": 238041, "epoch": 1416} {"train_loss": -10.921746253967285, "global_step": 238042, "epoch": 1416} {"train_loss": -11.302088737487793, "global_step": 238043, "epoch": 1416} {"train_loss": -11.701761245727539, "global_step": 238044, "epoch": 1416} {"train_loss": -11.560918807983398, "global_step": 238045, "epoch": 1416} {"train_loss": -11.785979270935059, "global_step": 238046, "epoch": 1416} {"train_loss": -11.637060165405273, "global_step": 238047, "epoch": 1416} {"train_loss": -11.944557189941406, "global_step": 238048, "epoch": 1416} {"train_loss": -11.506645202636719, "global_step": 238049, "epoch": 1416} {"train_loss": -11.852476119995117, "global_step": 238050, "epoch": 1416} {"train_loss": -11.42971420288086, "global_step": 238051, "epoch": 1416} {"train_loss": -11.658935546875, "global_step": 238052, "epoch": 1416} {"train_loss": -11.812850952148438, "global_step": 238053, "epoch": 1416} {"train_loss": -11.317776679992676, "global_step": 238054, "epoch": 1416} {"train_loss": -11.383908504531497, "global_step": 238055, "epoch": 1416, "val_loss": 265036.28125} {"train_loss": -11.675064086914062, "global_step": 238056, "epoch": 1417} {"train_loss": -11.748936653137207, "global_step": 238057, "epoch": 1417} {"train_loss": -11.810046195983887, "global_step": 238058, "epoch": 1417} {"train_loss": -11.730961799621582, "global_step": 238059, "epoch": 1417} {"train_loss": -11.855411529541016, "global_step": 238060, "epoch": 1417} {"train_loss": -11.614877700805664, "global_step": 238061, "epoch": 1417} {"train_loss": -11.726896286010742, "global_step": 238062, "epoch": 1417} {"train_loss": -11.380614280700684, "global_step": 238063, "epoch": 1417} {"train_loss": -11.688228607177734, "global_step": 238064, "epoch": 1417} {"train_loss": -11.559770584106445, "global_step": 238065, "epoch": 1417} {"train_loss": -11.86402702331543, "global_step": 238066, "epoch": 1417} {"train_loss": -11.396448135375977, "global_step": 238067, "epoch": 1417} {"train_loss": -11.674882888793945, "global_step": 238068, "epoch": 1417} {"train_loss": -11.8328857421875, "global_step": 238069, "epoch": 1417} {"train_loss": -11.350116729736328, "global_step": 238070, "epoch": 1417} {"train_loss": -11.884432792663574, "global_step": 238071, "epoch": 1417} {"train_loss": -11.053361892700195, "global_step": 238072, "epoch": 1417} {"train_loss": -11.370018005371094, "global_step": 238073, "epoch": 1417} {"train_loss": -11.470596313476562, "global_step": 238074, "epoch": 1417} {"train_loss": -11.835055351257324, "global_step": 238075, "epoch": 1417} {"train_loss": -11.44862174987793, "global_step": 238076, "epoch": 1417} {"train_loss": -11.618688583374023, "global_step": 238077, "epoch": 1417} {"train_loss": -11.210506439208984, "global_step": 238078, "epoch": 1417} {"train_loss": -11.803821563720703, "global_step": 238079, "epoch": 1417} {"train_loss": -11.61977767944336, "global_step": 238080, "epoch": 1417} {"train_loss": -11.542011260986328, "global_step": 238081, "epoch": 1417} {"train_loss": -11.405954360961914, "global_step": 238082, "epoch": 1417} {"train_loss": -11.781164169311523, "global_step": 238083, "epoch": 1417} {"train_loss": -11.403398513793945, "global_step": 238084, "epoch": 1417} {"train_loss": -11.78577995300293, "global_step": 238085, "epoch": 1417} {"train_loss": -11.394733428955078, "global_step": 238086, "epoch": 1417} {"train_loss": -11.296651840209961, "global_step": 238087, "epoch": 1417} {"train_loss": -11.561227798461914, "global_step": 238088, "epoch": 1417} {"train_loss": -11.342066764831543, "global_step": 238089, "epoch": 1417} {"train_loss": -11.675447463989258, "global_step": 238090, "epoch": 1417} {"train_loss": -11.626551628112793, "global_step": 238091, "epoch": 1417} {"train_loss": -11.899799346923828, "global_step": 238092, "epoch": 1417} {"train_loss": -11.701250076293945, "global_step": 238093, "epoch": 1417} {"train_loss": -11.566934585571289, "global_step": 238094, "epoch": 1417} {"train_loss": -11.628068923950195, "global_step": 238095, "epoch": 1417} {"train_loss": -11.824678421020508, "global_step": 238096, "epoch": 1417} {"train_loss": -11.42007064819336, "global_step": 238097, "epoch": 1417} {"train_loss": -11.600555419921875, "global_step": 238098, "epoch": 1417} {"train_loss": -11.657090187072754, "global_step": 238099, "epoch": 1417} {"train_loss": -10.679208755493164, "global_step": 238100, "epoch": 1417} {"train_loss": -11.95885944366455, "global_step": 238101, "epoch": 1417} {"train_loss": -10.935644149780273, "global_step": 238102, "epoch": 1417} {"train_loss": -11.929435729980469, "global_step": 238103, "epoch": 1417} {"train_loss": -11.621264457702637, "global_step": 238104, "epoch": 1417} {"train_loss": -11.851203918457031, "global_step": 238105, "epoch": 1417} {"train_loss": -11.842870712280273, "global_step": 238106, "epoch": 1417} {"train_loss": -11.686993598937988, "global_step": 238107, "epoch": 1417} {"train_loss": -11.853407859802246, "global_step": 238108, "epoch": 1417} {"train_loss": -11.496725082397461, "global_step": 238109, "epoch": 1417} {"train_loss": -11.651877403259277, "global_step": 238110, "epoch": 1417} {"train_loss": -11.984844207763672, "global_step": 238111, "epoch": 1417} {"train_loss": -11.43014907836914, "global_step": 238112, "epoch": 1417} {"train_loss": -11.958049774169922, "global_step": 238113, "epoch": 1417} {"train_loss": -11.523173332214355, "global_step": 238114, "epoch": 1417} {"train_loss": -11.677369117736816, "global_step": 238115, "epoch": 1417} {"train_loss": -11.787025451660156, "global_step": 238116, "epoch": 1417} {"train_loss": -11.688992500305176, "global_step": 238117, "epoch": 1417} {"train_loss": -11.711247444152832, "global_step": 238118, "epoch": 1417} {"train_loss": -11.305279731750488, "global_step": 238119, "epoch": 1417} {"train_loss": -11.669775009155273, "global_step": 238120, "epoch": 1417} {"train_loss": -11.517139434814453, "global_step": 238121, "epoch": 1417} {"train_loss": -11.538942337036133, "global_step": 238122, "epoch": 1417} {"train_loss": -11.563332557678223, "global_step": 238123, "epoch": 1417} {"train_loss": -11.329824447631836, "global_step": 238124, "epoch": 1417} {"train_loss": -11.361626625061035, "global_step": 238125, "epoch": 1417} {"train_loss": -11.764139175415039, "global_step": 238126, "epoch": 1417} {"train_loss": -11.645173072814941, "global_step": 238127, "epoch": 1417} {"train_loss": -11.250444412231445, "global_step": 238128, "epoch": 1417} {"train_loss": -11.874629974365234, "global_step": 238129, "epoch": 1417} {"train_loss": -11.49262809753418, "global_step": 238130, "epoch": 1417} {"train_loss": -11.633800506591797, "global_step": 238131, "epoch": 1417} {"train_loss": -11.567682266235352, "global_step": 238132, "epoch": 1417} {"train_loss": -11.618085861206055, "global_step": 238133, "epoch": 1417} {"train_loss": -11.587451934814453, "global_step": 238134, "epoch": 1417} {"train_loss": -11.394804000854492, "global_step": 238135, "epoch": 1417} {"train_loss": -11.79327392578125, "global_step": 238136, "epoch": 1417} {"train_loss": -11.416343688964844, "global_step": 238137, "epoch": 1417} {"train_loss": -11.545130729675293, "global_step": 238138, "epoch": 1417} {"train_loss": -11.380529403686523, "global_step": 238139, "epoch": 1417} {"train_loss": -11.745816230773926, "global_step": 238140, "epoch": 1417} {"train_loss": -11.842100143432617, "global_step": 238141, "epoch": 1417} {"train_loss": -11.475418090820312, "global_step": 238142, "epoch": 1417} {"train_loss": -11.994550704956055, "global_step": 238143, "epoch": 1417} {"train_loss": -11.790651321411133, "global_step": 238144, "epoch": 1417} {"train_loss": -11.956511497497559, "global_step": 238145, "epoch": 1417} {"train_loss": -11.79239559173584, "global_step": 238146, "epoch": 1417} {"train_loss": -11.744808197021484, "global_step": 238147, "epoch": 1417} {"train_loss": -11.894857406616211, "global_step": 238148, "epoch": 1417} {"train_loss": -12.090888977050781, "global_step": 238149, "epoch": 1417} {"train_loss": -11.857410430908203, "global_step": 238150, "epoch": 1417} {"train_loss": -11.829802513122559, "global_step": 238151, "epoch": 1417} {"train_loss": -11.573989868164062, "global_step": 238152, "epoch": 1417} {"train_loss": -11.63264274597168, "global_step": 238153, "epoch": 1417} {"train_loss": -11.97526741027832, "global_step": 238154, "epoch": 1417} {"train_loss": -11.744586944580078, "global_step": 238155, "epoch": 1417} {"train_loss": -11.698312759399414, "global_step": 238156, "epoch": 1417} {"train_loss": -12.078876495361328, "global_step": 238157, "epoch": 1417} {"train_loss": -11.726613998413086, "global_step": 238158, "epoch": 1417} {"train_loss": -11.883991241455078, "global_step": 238159, "epoch": 1417} {"train_loss": -11.921625137329102, "global_step": 238160, "epoch": 1417} {"train_loss": -11.960222244262695, "global_step": 238161, "epoch": 1417} {"train_loss": -11.83445930480957, "global_step": 238162, "epoch": 1417} {"train_loss": -11.635631561279297, "global_step": 238163, "epoch": 1417} {"train_loss": -11.969823837280273, "global_step": 238164, "epoch": 1417} {"train_loss": -11.838272094726562, "global_step": 238165, "epoch": 1417} {"train_loss": -11.758359909057617, "global_step": 238166, "epoch": 1417} {"train_loss": -11.59675121307373, "global_step": 238167, "epoch": 1417} {"train_loss": -12.017955780029297, "global_step": 238168, "epoch": 1417} {"train_loss": -11.390545845031738, "global_step": 238169, "epoch": 1417} {"train_loss": -11.84425163269043, "global_step": 238170, "epoch": 1417} {"train_loss": -11.609023094177246, "global_step": 238171, "epoch": 1417} {"train_loss": -10.527458190917969, "global_step": 238172, "epoch": 1417} {"train_loss": -11.089401245117188, "global_step": 238173, "epoch": 1417} {"train_loss": -11.453680038452148, "global_step": 238174, "epoch": 1417} {"train_loss": -11.251663208007812, "global_step": 238175, "epoch": 1417} {"train_loss": -10.874922752380371, "global_step": 238176, "epoch": 1417} {"train_loss": -10.721290588378906, "global_step": 238177, "epoch": 1417} {"train_loss": -10.580718994140625, "global_step": 238178, "epoch": 1417} {"train_loss": -11.482135772705078, "global_step": 238179, "epoch": 1417} {"train_loss": -10.926253318786621, "global_step": 238180, "epoch": 1417} {"train_loss": -10.32352066040039, "global_step": 238181, "epoch": 1417} {"train_loss": -11.639649391174316, "global_step": 238182, "epoch": 1417} {"train_loss": -10.361352920532227, "global_step": 238183, "epoch": 1417} {"train_loss": -11.720775604248047, "global_step": 238184, "epoch": 1417} {"train_loss": -10.729061126708984, "global_step": 238185, "epoch": 1417} {"train_loss": -11.401910781860352, "global_step": 238186, "epoch": 1417} {"train_loss": -11.213907241821289, "global_step": 238187, "epoch": 1417} {"train_loss": -10.199821472167969, "global_step": 238188, "epoch": 1417} {"train_loss": -11.459087371826172, "global_step": 238189, "epoch": 1417} {"train_loss": -11.128255844116211, "global_step": 238190, "epoch": 1417} {"train_loss": -11.398341178894043, "global_step": 238191, "epoch": 1417} {"train_loss": -11.447154998779297, "global_step": 238192, "epoch": 1417} {"train_loss": -11.517868041992188, "global_step": 238193, "epoch": 1417} {"train_loss": -11.708552360534668, "global_step": 238194, "epoch": 1417} {"train_loss": -11.52238655090332, "global_step": 238195, "epoch": 1417} {"train_loss": -11.771875381469727, "global_step": 238196, "epoch": 1417} {"train_loss": -11.705795288085938, "global_step": 238197, "epoch": 1417} {"train_loss": -11.789277076721191, "global_step": 238198, "epoch": 1417} {"train_loss": -11.505867958068848, "global_step": 238199, "epoch": 1417} {"train_loss": -11.434165000915527, "global_step": 238200, "epoch": 1417} {"train_loss": -11.63984489440918, "global_step": 238201, "epoch": 1417} {"train_loss": -11.720972061157227, "global_step": 238202, "epoch": 1417} {"train_loss": -11.46782112121582, "global_step": 238203, "epoch": 1417} {"train_loss": -11.685694694519043, "global_step": 238204, "epoch": 1417} {"train_loss": -11.199516296386719, "global_step": 238205, "epoch": 1417} {"train_loss": -11.523088455200195, "global_step": 238206, "epoch": 1417} {"train_loss": -11.418113708496094, "global_step": 238207, "epoch": 1417} {"train_loss": -11.810242652893066, "global_step": 238208, "epoch": 1417} {"train_loss": -11.52222728729248, "global_step": 238209, "epoch": 1417} {"train_loss": -11.763486862182617, "global_step": 238210, "epoch": 1417} {"train_loss": -11.808215141296387, "global_step": 238211, "epoch": 1417} {"train_loss": -11.635207176208496, "global_step": 238212, "epoch": 1417} {"train_loss": -11.513089179992676, "global_step": 238213, "epoch": 1417} {"train_loss": -11.61718463897705, "global_step": 238214, "epoch": 1417} {"train_loss": -11.642908096313477, "global_step": 238215, "epoch": 1417} {"train_loss": -11.333309173583984, "global_step": 238216, "epoch": 1417} {"train_loss": -11.80322265625, "global_step": 238217, "epoch": 1417} {"train_loss": -11.631454467773438, "global_step": 238218, "epoch": 1417} {"train_loss": -11.614705085754395, "global_step": 238219, "epoch": 1417} {"train_loss": -11.561555862426758, "global_step": 238220, "epoch": 1417} {"train_loss": -11.531394958496094, "global_step": 238221, "epoch": 1417} {"train_loss": -11.790023803710938, "global_step": 238222, "epoch": 1417} {"train_loss": -11.567264795303345, "global_step": 238223, "epoch": 1417, "val_loss": 267322.53125} {"train_loss": -11.534049987792969, "global_step": 238224, "epoch": 1418} {"train_loss": -11.535362243652344, "global_step": 238225, "epoch": 1418} {"train_loss": -11.706049919128418, "global_step": 238226, "epoch": 1418} {"train_loss": -11.404236793518066, "global_step": 238227, "epoch": 1418} {"train_loss": -11.774995803833008, "global_step": 238228, "epoch": 1418} {"train_loss": -11.600910186767578, "global_step": 238229, "epoch": 1418} {"train_loss": -11.566122055053711, "global_step": 238230, "epoch": 1418} {"train_loss": -11.762130737304688, "global_step": 238231, "epoch": 1418} {"train_loss": -11.938760757446289, "global_step": 238232, "epoch": 1418} {"train_loss": -11.424541473388672, "global_step": 238233, "epoch": 1418} {"train_loss": -11.937370300292969, "global_step": 238234, "epoch": 1418} {"train_loss": -11.72038459777832, "global_step": 238235, "epoch": 1418} {"train_loss": -11.839896202087402, "global_step": 238236, "epoch": 1418} {"train_loss": -11.754531860351562, "global_step": 238237, "epoch": 1418} {"train_loss": -11.637186050415039, "global_step": 238238, "epoch": 1418} {"train_loss": -12.054959297180176, "global_step": 238239, "epoch": 1418} {"train_loss": -11.724555969238281, "global_step": 238240, "epoch": 1418} {"train_loss": -12.039688110351562, "global_step": 238241, "epoch": 1418} {"train_loss": -11.902044296264648, "global_step": 238242, "epoch": 1418} {"train_loss": -11.956636428833008, "global_step": 238243, "epoch": 1418} {"train_loss": -12.180160522460938, "global_step": 238244, "epoch": 1418} {"train_loss": -11.837705612182617, "global_step": 238245, "epoch": 1418} {"train_loss": -11.975099563598633, "global_step": 238246, "epoch": 1418} {"train_loss": -11.958982467651367, "global_step": 238247, "epoch": 1418} {"train_loss": -12.089153289794922, "global_step": 238248, "epoch": 1418} {"train_loss": -11.915127754211426, "global_step": 238249, "epoch": 1418} {"train_loss": -11.824552536010742, "global_step": 238250, "epoch": 1418} {"train_loss": -11.82194709777832, "global_step": 238251, "epoch": 1418} {"train_loss": -12.1390380859375, "global_step": 238252, "epoch": 1418} {"train_loss": -12.109517097473145, "global_step": 238253, "epoch": 1418} {"train_loss": -11.796591758728027, "global_step": 238254, "epoch": 1418} {"train_loss": -11.966217041015625, "global_step": 238255, "epoch": 1418} {"train_loss": -11.964347839355469, "global_step": 238256, "epoch": 1418} {"train_loss": -11.981358528137207, "global_step": 238257, "epoch": 1418} {"train_loss": -11.740039825439453, "global_step": 238258, "epoch": 1418} {"train_loss": -12.011859893798828, "global_step": 238259, "epoch": 1418} {"train_loss": -11.867536544799805, "global_step": 238260, "epoch": 1418} {"train_loss": -11.846719741821289, "global_step": 238261, "epoch": 1418} {"train_loss": -12.116613388061523, "global_step": 238262, "epoch": 1418} {"train_loss": -11.588214874267578, "global_step": 238263, "epoch": 1418} {"train_loss": -11.859044075012207, "global_step": 238264, "epoch": 1418} {"train_loss": -11.555036544799805, "global_step": 238265, "epoch": 1418} {"train_loss": -11.904569625854492, "global_step": 238266, "epoch": 1418} {"train_loss": -12.137361526489258, "global_step": 238267, "epoch": 1418} {"train_loss": -11.782360076904297, "global_step": 238268, "epoch": 1418} {"train_loss": -11.589689254760742, "global_step": 238269, "epoch": 1418} {"train_loss": -12.14082145690918, "global_step": 238270, "epoch": 1418} {"train_loss": -12.214441299438477, "global_step": 238271, "epoch": 1418} {"train_loss": -11.922733306884766, "global_step": 238272, "epoch": 1418} {"train_loss": -11.950288772583008, "global_step": 238273, "epoch": 1418} {"train_loss": -11.986205101013184, "global_step": 238274, "epoch": 1418} {"train_loss": -12.165735244750977, "global_step": 238275, "epoch": 1418} {"train_loss": -11.825153350830078, "global_step": 238276, "epoch": 1418} {"train_loss": -11.877908706665039, "global_step": 238277, "epoch": 1418} {"train_loss": -12.079133987426758, "global_step": 238278, "epoch": 1418} {"train_loss": -11.955130577087402, "global_step": 238279, "epoch": 1418} {"train_loss": -12.118322372436523, "global_step": 238280, "epoch": 1418} {"train_loss": -12.084117889404297, "global_step": 238281, "epoch": 1418} {"train_loss": -11.873380661010742, "global_step": 238282, "epoch": 1418} {"train_loss": -11.784812927246094, "global_step": 238283, "epoch": 1418} {"train_loss": -11.50030517578125, "global_step": 238284, "epoch": 1418} {"train_loss": -10.440938949584961, "global_step": 238285, "epoch": 1418} {"train_loss": -11.136001586914062, "global_step": 238286, "epoch": 1418} {"train_loss": -11.936727523803711, "global_step": 238287, "epoch": 1418} {"train_loss": -10.408310890197754, "global_step": 238288, "epoch": 1418} {"train_loss": -10.926677703857422, "global_step": 238289, "epoch": 1418} {"train_loss": -11.977882385253906, "global_step": 238290, "epoch": 1418} {"train_loss": -11.012375831604004, "global_step": 238291, "epoch": 1418} {"train_loss": -9.280237197875977, "global_step": 238292, "epoch": 1418} {"train_loss": -10.777826309204102, "global_step": 238293, "epoch": 1418} {"train_loss": -7.645327091217041, "global_step": 238294, "epoch": 1418} {"train_loss": -10.508367538452148, "global_step": 238295, "epoch": 1418} {"train_loss": -8.454136848449707, "global_step": 238296, "epoch": 1418} {"train_loss": -8.446842193603516, "global_step": 238297, "epoch": 1418} {"train_loss": -8.735660552978516, "global_step": 238298, "epoch": 1418} {"train_loss": -11.28503704071045, "global_step": 238299, "epoch": 1418} {"train_loss": -9.47165584564209, "global_step": 238300, "epoch": 1418} {"train_loss": -10.58159065246582, "global_step": 238301, "epoch": 1418} {"train_loss": -9.953164100646973, "global_step": 238302, "epoch": 1418} {"train_loss": -9.95098876953125, "global_step": 238303, "epoch": 1418} {"train_loss": -10.613451957702637, "global_step": 238304, "epoch": 1418} {"train_loss": -9.863471984863281, "global_step": 238305, "epoch": 1418} {"train_loss": -10.917136192321777, "global_step": 238306, "epoch": 1418} {"train_loss": -9.922880172729492, "global_step": 238307, "epoch": 1418} {"train_loss": -10.125985145568848, "global_step": 238308, "epoch": 1418} {"train_loss": -11.210404396057129, "global_step": 238309, "epoch": 1418} {"train_loss": -9.906865119934082, "global_step": 238310, "epoch": 1418} {"train_loss": -9.516565322875977, "global_step": 238311, "epoch": 1418} {"train_loss": -11.499773979187012, "global_step": 238312, "epoch": 1418} {"train_loss": -9.92492389678955, "global_step": 238313, "epoch": 1418} {"train_loss": -11.009477615356445, "global_step": 238314, "epoch": 1418} {"train_loss": -10.791059494018555, "global_step": 238315, "epoch": 1418} {"train_loss": -10.922689437866211, "global_step": 238316, "epoch": 1418} {"train_loss": -10.997669219970703, "global_step": 238317, "epoch": 1418} {"train_loss": -11.465518951416016, "global_step": 238318, "epoch": 1418} {"train_loss": -10.94711685180664, "global_step": 238319, "epoch": 1418} {"train_loss": -11.650728225708008, "global_step": 238320, "epoch": 1418} {"train_loss": -11.166218757629395, "global_step": 238321, "epoch": 1418} {"train_loss": -11.250605583190918, "global_step": 238322, "epoch": 1418} {"train_loss": -11.003535270690918, "global_step": 238323, "epoch": 1418} {"train_loss": -11.320262908935547, "global_step": 238324, "epoch": 1418} {"train_loss": -10.481945037841797, "global_step": 238325, "epoch": 1418} {"train_loss": -11.332670211791992, "global_step": 238326, "epoch": 1418} {"train_loss": -11.001184463500977, "global_step": 238327, "epoch": 1418} {"train_loss": -11.369516372680664, "global_step": 238328, "epoch": 1418} {"train_loss": -11.431589126586914, "global_step": 238329, "epoch": 1418} {"train_loss": -11.343279838562012, "global_step": 238330, "epoch": 1418} {"train_loss": -11.56509017944336, "global_step": 238331, "epoch": 1418} {"train_loss": -11.653017044067383, "global_step": 238332, "epoch": 1418} {"train_loss": -11.24006462097168, "global_step": 238333, "epoch": 1418} {"train_loss": -11.492317199707031, "global_step": 238334, "epoch": 1418} {"train_loss": -11.593826293945312, "global_step": 238335, "epoch": 1418} {"train_loss": -11.417280197143555, "global_step": 238336, "epoch": 1418} {"train_loss": -11.603551864624023, "global_step": 238337, "epoch": 1418} {"train_loss": -11.746734619140625, "global_step": 238338, "epoch": 1418} {"train_loss": -11.585968017578125, "global_step": 238339, "epoch": 1418} {"train_loss": -11.845553398132324, "global_step": 238340, "epoch": 1418} {"train_loss": -11.829483032226562, "global_step": 238341, "epoch": 1418} {"train_loss": -11.61229133605957, "global_step": 238342, "epoch": 1418} {"train_loss": -11.564065933227539, "global_step": 238343, "epoch": 1418} {"train_loss": -11.634414672851562, "global_step": 238344, "epoch": 1418} {"train_loss": -11.710740089416504, "global_step": 238345, "epoch": 1418} {"train_loss": -11.663677215576172, "global_step": 238346, "epoch": 1418} {"train_loss": -11.807151794433594, "global_step": 238347, "epoch": 1418} {"train_loss": -11.818217277526855, "global_step": 238348, "epoch": 1418} {"train_loss": -11.885557174682617, "global_step": 238349, "epoch": 1418} {"train_loss": -11.806652069091797, "global_step": 238350, "epoch": 1418} {"train_loss": -11.758508682250977, "global_step": 238351, "epoch": 1418} {"train_loss": -11.77137279510498, "global_step": 238352, "epoch": 1418} {"train_loss": -11.91185188293457, "global_step": 238353, "epoch": 1418} {"train_loss": -11.868478775024414, "global_step": 238354, "epoch": 1418} {"train_loss": -11.8600492477417, "global_step": 238355, "epoch": 1418} {"train_loss": -12.153282165527344, "global_step": 238356, "epoch": 1418} {"train_loss": -11.73830795288086, "global_step": 238357, "epoch": 1418} {"train_loss": -11.964311599731445, "global_step": 238358, "epoch": 1418} {"train_loss": -11.763866424560547, "global_step": 238359, "epoch": 1418} {"train_loss": -11.843746185302734, "global_step": 238360, "epoch": 1418} {"train_loss": -11.811737060546875, "global_step": 238361, "epoch": 1418} {"train_loss": -12.113004684448242, "global_step": 238362, "epoch": 1418} {"train_loss": -12.082748413085938, "global_step": 238363, "epoch": 1418} {"train_loss": -12.045829772949219, "global_step": 238364, "epoch": 1418} {"train_loss": -12.130151748657227, "global_step": 238365, "epoch": 1418} {"train_loss": -12.127837181091309, "global_step": 238366, "epoch": 1418} {"train_loss": -11.92406177520752, "global_step": 238367, "epoch": 1418} {"train_loss": -12.024654388427734, "global_step": 238368, "epoch": 1418} {"train_loss": -12.076800346374512, "global_step": 238369, "epoch": 1418} {"train_loss": -12.095924377441406, "global_step": 238370, "epoch": 1418} {"train_loss": -11.90831470489502, "global_step": 238371, "epoch": 1418} {"train_loss": -11.968090057373047, "global_step": 238372, "epoch": 1418} {"train_loss": -11.699678421020508, "global_step": 238373, "epoch": 1418} {"train_loss": -11.647232055664062, "global_step": 238374, "epoch": 1418} {"train_loss": -11.964820861816406, "global_step": 238375, "epoch": 1418} {"train_loss": -12.015227317810059, "global_step": 238376, "epoch": 1418} {"train_loss": -11.654547691345215, "global_step": 238377, "epoch": 1418} {"train_loss": -11.126079559326172, "global_step": 238378, "epoch": 1418} {"train_loss": -10.853778839111328, "global_step": 238379, "epoch": 1418} {"train_loss": -11.345549583435059, "global_step": 238380, "epoch": 1418} {"train_loss": -11.322456359863281, "global_step": 238381, "epoch": 1418} {"train_loss": -11.7955961227417, "global_step": 238382, "epoch": 1418} {"train_loss": -11.585871696472168, "global_step": 238383, "epoch": 1418} {"train_loss": -11.789762496948242, "global_step": 238384, "epoch": 1418} {"train_loss": -11.731956481933594, "global_step": 238385, "epoch": 1418} {"train_loss": -11.567296981811523, "global_step": 238386, "epoch": 1418} {"train_loss": -11.043140411376953, "global_step": 238387, "epoch": 1418} {"train_loss": -10.839988708496094, "global_step": 238388, "epoch": 1418} {"train_loss": -11.332598686218262, "global_step": 238389, "epoch": 1418} {"train_loss": -11.144826889038086, "global_step": 238390, "epoch": 1418} {"train_loss": -11.44864476010913, "global_step": 238391, "epoch": 1418, "val_loss": 266536.4375} {"train_loss": -11.434253692626953, "global_step": 238392, "epoch": 1419} {"train_loss": -11.700855255126953, "global_step": 238393, "epoch": 1419} {"train_loss": -11.859054565429688, "global_step": 238394, "epoch": 1419} {"train_loss": -10.656357765197754, "global_step": 238395, "epoch": 1419} {"train_loss": -11.47038459777832, "global_step": 238396, "epoch": 1419} {"train_loss": -11.898541450500488, "global_step": 238397, "epoch": 1419} {"train_loss": -11.274383544921875, "global_step": 238398, "epoch": 1419} {"train_loss": -11.300666809082031, "global_step": 238399, "epoch": 1419} {"train_loss": -11.545683860778809, "global_step": 238400, "epoch": 1419} {"train_loss": -11.175483703613281, "global_step": 238401, "epoch": 1419} {"train_loss": -10.818343162536621, "global_step": 238402, "epoch": 1419} {"train_loss": -11.865623474121094, "global_step": 238403, "epoch": 1419} {"train_loss": -9.609428405761719, "global_step": 238404, "epoch": 1419} {"train_loss": -10.715263366699219, "global_step": 238405, "epoch": 1419} {"train_loss": -11.322768211364746, "global_step": 238406, "epoch": 1419} {"train_loss": -9.925302505493164, "global_step": 238407, "epoch": 1419} {"train_loss": -11.715676307678223, "global_step": 238408, "epoch": 1419} {"train_loss": -10.202777862548828, "global_step": 238409, "epoch": 1419} {"train_loss": -11.04863166809082, "global_step": 238410, "epoch": 1419} {"train_loss": -11.103425979614258, "global_step": 238411, "epoch": 1419} {"train_loss": -10.675983428955078, "global_step": 238412, "epoch": 1419} {"train_loss": -11.577491760253906, "global_step": 238413, "epoch": 1419} {"train_loss": -10.821128845214844, "global_step": 238414, "epoch": 1419} {"train_loss": -11.13096809387207, "global_step": 238415, "epoch": 1419} {"train_loss": -11.27252197265625, "global_step": 238416, "epoch": 1419} {"train_loss": -11.545310974121094, "global_step": 238417, "epoch": 1419} {"train_loss": -11.721040725708008, "global_step": 238418, "epoch": 1419} {"train_loss": -11.373886108398438, "global_step": 238419, "epoch": 1419} {"train_loss": -11.626609802246094, "global_step": 238420, "epoch": 1419} {"train_loss": -11.376557350158691, "global_step": 238421, "epoch": 1419} {"train_loss": -11.714859008789062, "global_step": 238422, "epoch": 1419} {"train_loss": -11.646260261535645, "global_step": 238423, "epoch": 1419} {"train_loss": -11.395126342773438, "global_step": 238424, "epoch": 1419} {"train_loss": -11.812646865844727, "global_step": 238425, "epoch": 1419} {"train_loss": -11.881376266479492, "global_step": 238426, "epoch": 1419} {"train_loss": -11.763980865478516, "global_step": 238427, "epoch": 1419} {"train_loss": -11.560487747192383, "global_step": 238428, "epoch": 1419} {"train_loss": -11.630546569824219, "global_step": 238429, "epoch": 1419} {"train_loss": -11.530134201049805, "global_step": 238430, "epoch": 1419} {"train_loss": -11.815345764160156, "global_step": 238431, "epoch": 1419} {"train_loss": -11.49056339263916, "global_step": 238432, "epoch": 1419} {"train_loss": -11.848651885986328, "global_step": 238433, "epoch": 1419} {"train_loss": -11.46318244934082, "global_step": 238434, "epoch": 1419} {"train_loss": -11.838163375854492, "global_step": 238435, "epoch": 1419} {"train_loss": -11.514055252075195, "global_step": 238436, "epoch": 1419} {"train_loss": -11.655943870544434, "global_step": 238437, "epoch": 1419} {"train_loss": -11.484220504760742, "global_step": 238438, "epoch": 1419} {"train_loss": -11.771751403808594, "global_step": 238439, "epoch": 1419} {"train_loss": -11.545120239257812, "global_step": 238440, "epoch": 1419} {"train_loss": -11.87614631652832, "global_step": 238441, "epoch": 1419} {"train_loss": -11.699838638305664, "global_step": 238442, "epoch": 1419} {"train_loss": -11.794960975646973, "global_step": 238443, "epoch": 1419} {"train_loss": -11.87787914276123, "global_step": 238444, "epoch": 1419} {"train_loss": -11.726469993591309, "global_step": 238445, "epoch": 1419} {"train_loss": -11.949600219726562, "global_step": 238446, "epoch": 1419} {"train_loss": -11.238176345825195, "global_step": 238447, "epoch": 1419} {"train_loss": -11.924927711486816, "global_step": 238448, "epoch": 1419} {"train_loss": -11.541844367980957, "global_step": 238449, "epoch": 1419} {"train_loss": -11.882450103759766, "global_step": 238450, "epoch": 1419} {"train_loss": -11.66453742980957, "global_step": 238451, "epoch": 1419} {"train_loss": -11.47649097442627, "global_step": 238452, "epoch": 1419} {"train_loss": -11.541768074035645, "global_step": 238453, "epoch": 1419} {"train_loss": -11.713296890258789, "global_step": 238454, "epoch": 1419} {"train_loss": -11.952688217163086, "global_step": 238455, "epoch": 1419} {"train_loss": -11.809826850891113, "global_step": 238456, "epoch": 1419} {"train_loss": -11.806666374206543, "global_step": 238457, "epoch": 1419} {"train_loss": -11.680893898010254, "global_step": 238458, "epoch": 1419} {"train_loss": -12.017263412475586, "global_step": 238459, "epoch": 1419} {"train_loss": -11.434659004211426, "global_step": 238460, "epoch": 1419} {"train_loss": -12.069243431091309, "global_step": 238461, "epoch": 1419} {"train_loss": -11.863110542297363, "global_step": 238462, "epoch": 1419} {"train_loss": -11.672151565551758, "global_step": 238463, "epoch": 1419} {"train_loss": -11.959552764892578, "global_step": 238464, "epoch": 1419} {"train_loss": -11.516271591186523, "global_step": 238465, "epoch": 1419} {"train_loss": -11.720479965209961, "global_step": 238466, "epoch": 1419} {"train_loss": -11.763962745666504, "global_step": 238467, "epoch": 1419} {"train_loss": -11.971747398376465, "global_step": 238468, "epoch": 1419} {"train_loss": -11.624332427978516, "global_step": 238469, "epoch": 1419} {"train_loss": -11.75534439086914, "global_step": 238470, "epoch": 1419} {"train_loss": -11.997751235961914, "global_step": 238471, "epoch": 1419} {"train_loss": -11.829566955566406, "global_step": 238472, "epoch": 1419} {"train_loss": -11.657058715820312, "global_step": 238473, "epoch": 1419} {"train_loss": -11.860042572021484, "global_step": 238474, "epoch": 1419} {"train_loss": -11.858070373535156, "global_step": 238475, "epoch": 1419} {"train_loss": -11.448017120361328, "global_step": 238476, "epoch": 1419} {"train_loss": -11.72381591796875, "global_step": 238477, "epoch": 1419} {"train_loss": -11.986445426940918, "global_step": 238478, "epoch": 1419} {"train_loss": -11.7849760055542, "global_step": 238479, "epoch": 1419} {"train_loss": -11.857440948486328, "global_step": 238480, "epoch": 1419} {"train_loss": -11.62777042388916, "global_step": 238481, "epoch": 1419} {"train_loss": -11.95474910736084, "global_step": 238482, "epoch": 1419} {"train_loss": -11.63798713684082, "global_step": 238483, "epoch": 1419} {"train_loss": -11.968896865844727, "global_step": 238484, "epoch": 1419} {"train_loss": -11.61418342590332, "global_step": 238485, "epoch": 1419} {"train_loss": -11.856966018676758, "global_step": 238486, "epoch": 1419} {"train_loss": -11.724029541015625, "global_step": 238487, "epoch": 1419} {"train_loss": -11.954593658447266, "global_step": 238488, "epoch": 1419} {"train_loss": -11.805193901062012, "global_step": 238489, "epoch": 1419} {"train_loss": -11.994823455810547, "global_step": 238490, "epoch": 1419} {"train_loss": -11.94980239868164, "global_step": 238491, "epoch": 1419} {"train_loss": -11.938202857971191, "global_step": 238492, "epoch": 1419} {"train_loss": -11.981548309326172, "global_step": 238493, "epoch": 1419} {"train_loss": -12.207816123962402, "global_step": 238494, "epoch": 1419} {"train_loss": -12.079898834228516, "global_step": 238495, "epoch": 1419} {"train_loss": -11.855766296386719, "global_step": 238496, "epoch": 1419} {"train_loss": -11.897053718566895, "global_step": 238497, "epoch": 1419} {"train_loss": -12.000046730041504, "global_step": 238498, "epoch": 1419} {"train_loss": -12.184944152832031, "global_step": 238499, "epoch": 1419} {"train_loss": -12.110689163208008, "global_step": 238500, "epoch": 1419} {"train_loss": -11.620887756347656, "global_step": 238501, "epoch": 1419} {"train_loss": -11.453319549560547, "global_step": 238502, "epoch": 1419} {"train_loss": -11.83935546875, "global_step": 238503, "epoch": 1419} {"train_loss": -11.833244323730469, "global_step": 238504, "epoch": 1419} {"train_loss": -11.59067153930664, "global_step": 238505, "epoch": 1419} {"train_loss": -10.800468444824219, "global_step": 238506, "epoch": 1419} {"train_loss": -12.112153053283691, "global_step": 238507, "epoch": 1419} {"train_loss": -11.213375091552734, "global_step": 238508, "epoch": 1419} {"train_loss": -10.994176864624023, "global_step": 238509, "epoch": 1419} {"train_loss": -11.333768844604492, "global_step": 238510, "epoch": 1419} {"train_loss": -11.104087829589844, "global_step": 238511, "epoch": 1419} {"train_loss": -10.667576789855957, "global_step": 238512, "epoch": 1419} {"train_loss": -9.824374198913574, "global_step": 238513, "epoch": 1419} {"train_loss": -11.157803535461426, "global_step": 238514, "epoch": 1419} {"train_loss": -11.032809257507324, "global_step": 238515, "epoch": 1419} {"train_loss": -9.330276489257812, "global_step": 238516, "epoch": 1419} {"train_loss": -11.789612770080566, "global_step": 238517, "epoch": 1419} {"train_loss": -9.961490631103516, "global_step": 238518, "epoch": 1419} {"train_loss": -9.487820625305176, "global_step": 238519, "epoch": 1419} {"train_loss": -11.759763717651367, "global_step": 238520, "epoch": 1419} {"train_loss": -9.999719619750977, "global_step": 238521, "epoch": 1419} {"train_loss": -11.512275695800781, "global_step": 238522, "epoch": 1419} {"train_loss": -11.516106605529785, "global_step": 238523, "epoch": 1419} {"train_loss": -10.963312149047852, "global_step": 238524, "epoch": 1419} {"train_loss": -11.84654426574707, "global_step": 238525, "epoch": 1419} {"train_loss": -11.121427536010742, "global_step": 238526, "epoch": 1419} {"train_loss": -11.582294464111328, "global_step": 238527, "epoch": 1419} {"train_loss": -11.711029052734375, "global_step": 238528, "epoch": 1419} {"train_loss": -11.727670669555664, "global_step": 238529, "epoch": 1419} {"train_loss": -11.403599739074707, "global_step": 238530, "epoch": 1419} {"train_loss": -11.795707702636719, "global_step": 238531, "epoch": 1419} {"train_loss": -11.535297393798828, "global_step": 238532, "epoch": 1419} {"train_loss": -11.682844161987305, "global_step": 238533, "epoch": 1419} {"train_loss": -12.091512680053711, "global_step": 238534, "epoch": 1419} {"train_loss": -11.678083419799805, "global_step": 238535, "epoch": 1419} {"train_loss": -11.926726341247559, "global_step": 238536, "epoch": 1419} {"train_loss": -11.582572937011719, "global_step": 238537, "epoch": 1419} {"train_loss": -11.912864685058594, "global_step": 238538, "epoch": 1419} {"train_loss": -11.684181213378906, "global_step": 238539, "epoch": 1419} {"train_loss": -12.064600944519043, "global_step": 238540, "epoch": 1419} {"train_loss": -11.846244812011719, "global_step": 238541, "epoch": 1419} {"train_loss": -11.977457046508789, "global_step": 238542, "epoch": 1419} {"train_loss": -11.746322631835938, "global_step": 238543, "epoch": 1419} {"train_loss": -11.85239315032959, "global_step": 238544, "epoch": 1419} {"train_loss": -12.00422477722168, "global_step": 238545, "epoch": 1419} {"train_loss": -11.8945951461792, "global_step": 238546, "epoch": 1419} {"train_loss": -11.947336196899414, "global_step": 238547, "epoch": 1419} {"train_loss": -11.73513412475586, "global_step": 238548, "epoch": 1419} {"train_loss": -11.969343185424805, "global_step": 238549, "epoch": 1419} {"train_loss": -11.786909103393555, "global_step": 238550, "epoch": 1419} {"train_loss": -12.069133758544922, "global_step": 238551, "epoch": 1419} {"train_loss": -11.67384147644043, "global_step": 238552, "epoch": 1419} {"train_loss": -11.959662437438965, "global_step": 238553, "epoch": 1419} {"train_loss": -11.872936248779297, "global_step": 238554, "epoch": 1419} {"train_loss": -11.740939140319824, "global_step": 238555, "epoch": 1419} {"train_loss": -11.974594116210938, "global_step": 238556, "epoch": 1419} {"train_loss": -11.896156311035156, "global_step": 238557, "epoch": 1419} {"train_loss": -11.80767822265625, "global_step": 238558, "epoch": 1419} {"train_loss": -11.569526876722064, "global_step": 238559, "epoch": 1419, "val_loss": 264305.3125} {"train_loss": -11.745136260986328, "global_step": 238560, "epoch": 1420} {"train_loss": -11.9705810546875, "global_step": 238561, "epoch": 1420} {"train_loss": -11.907486915588379, "global_step": 238562, "epoch": 1420} {"train_loss": -11.863371849060059, "global_step": 238563, "epoch": 1420} {"train_loss": -11.954780578613281, "global_step": 238564, "epoch": 1420} {"train_loss": -11.966388702392578, "global_step": 238565, "epoch": 1420} {"train_loss": -11.799631118774414, "global_step": 238566, "epoch": 1420} {"train_loss": -11.673629760742188, "global_step": 238567, "epoch": 1420} {"train_loss": -11.87259292602539, "global_step": 238568, "epoch": 1420} {"train_loss": -11.807733535766602, "global_step": 238569, "epoch": 1420} {"train_loss": -11.519465446472168, "global_step": 238570, "epoch": 1420} {"train_loss": -11.865314483642578, "global_step": 238571, "epoch": 1420} {"train_loss": -11.781649589538574, "global_step": 238572, "epoch": 1420} {"train_loss": -12.077177047729492, "global_step": 238573, "epoch": 1420} {"train_loss": -12.108865737915039, "global_step": 238574, "epoch": 1420} {"train_loss": -11.72574520111084, "global_step": 238575, "epoch": 1420} {"train_loss": -11.318578720092773, "global_step": 238576, "epoch": 1420} {"train_loss": -11.476981163024902, "global_step": 238577, "epoch": 1420} {"train_loss": -11.097695350646973, "global_step": 238578, "epoch": 1420} {"train_loss": -10.976460456848145, "global_step": 238579, "epoch": 1420} {"train_loss": -11.895365715026855, "global_step": 238580, "epoch": 1420} {"train_loss": -11.66916275024414, "global_step": 238581, "epoch": 1420} {"train_loss": -11.628439903259277, "global_step": 238582, "epoch": 1420} {"train_loss": -11.66269588470459, "global_step": 238583, "epoch": 1420} {"train_loss": -11.439464569091797, "global_step": 238584, "epoch": 1420} {"train_loss": -11.354945182800293, "global_step": 238585, "epoch": 1420} {"train_loss": -11.632118225097656, "global_step": 238586, "epoch": 1420} {"train_loss": -10.961958885192871, "global_step": 238587, "epoch": 1420} {"train_loss": -11.935844421386719, "global_step": 238588, "epoch": 1420} {"train_loss": -11.372709274291992, "global_step": 238589, "epoch": 1420} {"train_loss": -10.809768676757812, "global_step": 238590, "epoch": 1420} {"train_loss": -10.889351844787598, "global_step": 238591, "epoch": 1420} {"train_loss": -11.885555267333984, "global_step": 238592, "epoch": 1420} {"train_loss": -10.777667999267578, "global_step": 238593, "epoch": 1420} {"train_loss": -10.608448028564453, "global_step": 238594, "epoch": 1420} {"train_loss": -11.589162826538086, "global_step": 238595, "epoch": 1420} {"train_loss": -11.29426383972168, "global_step": 238596, "epoch": 1420} {"train_loss": -11.024605751037598, "global_step": 238597, "epoch": 1420} {"train_loss": -11.666217803955078, "global_step": 238598, "epoch": 1420} {"train_loss": -11.184953689575195, "global_step": 238599, "epoch": 1420} {"train_loss": -11.257791519165039, "global_step": 238600, "epoch": 1420} {"train_loss": -11.6576566696167, "global_step": 238601, "epoch": 1420} {"train_loss": -11.398460388183594, "global_step": 238602, "epoch": 1420} {"train_loss": -11.44903564453125, "global_step": 238603, "epoch": 1420} {"train_loss": -11.406847953796387, "global_step": 238604, "epoch": 1420} {"train_loss": -11.830575942993164, "global_step": 238605, "epoch": 1420} {"train_loss": -11.367258071899414, "global_step": 238606, "epoch": 1420} {"train_loss": -11.94766616821289, "global_step": 238607, "epoch": 1420} {"train_loss": -11.799884796142578, "global_step": 238608, "epoch": 1420} {"train_loss": -11.552793502807617, "global_step": 238609, "epoch": 1420} {"train_loss": -11.32778549194336, "global_step": 238610, "epoch": 1420} {"train_loss": -11.56977653503418, "global_step": 238611, "epoch": 1420} {"train_loss": -11.856056213378906, "global_step": 238612, "epoch": 1420} {"train_loss": -11.51468276977539, "global_step": 238613, "epoch": 1420} {"train_loss": -11.612984657287598, "global_step": 238614, "epoch": 1420} {"train_loss": -11.195021629333496, "global_step": 238615, "epoch": 1420} {"train_loss": -11.863737106323242, "global_step": 238616, "epoch": 1420} {"train_loss": -11.596851348876953, "global_step": 238617, "epoch": 1420} {"train_loss": -11.862890243530273, "global_step": 238618, "epoch": 1420} {"train_loss": -11.871960639953613, "global_step": 238619, "epoch": 1420} {"train_loss": -11.53696060180664, "global_step": 238620, "epoch": 1420} {"train_loss": -12.027101516723633, "global_step": 238621, "epoch": 1420} {"train_loss": -11.669418334960938, "global_step": 238622, "epoch": 1420} {"train_loss": -11.799891471862793, "global_step": 238623, "epoch": 1420} {"train_loss": -11.602190971374512, "global_step": 238624, "epoch": 1420} {"train_loss": -11.573841094970703, "global_step": 238625, "epoch": 1420} {"train_loss": -12.105462074279785, "global_step": 238626, "epoch": 1420} {"train_loss": -11.37500286102295, "global_step": 238627, "epoch": 1420} {"train_loss": -11.971442222595215, "global_step": 238628, "epoch": 1420} {"train_loss": -11.640661239624023, "global_step": 238629, "epoch": 1420} {"train_loss": -11.873546600341797, "global_step": 238630, "epoch": 1420} {"train_loss": -11.28122615814209, "global_step": 238631, "epoch": 1420} {"train_loss": -12.045169830322266, "global_step": 238632, "epoch": 1420} {"train_loss": -11.688170433044434, "global_step": 238633, "epoch": 1420} {"train_loss": -11.642265319824219, "global_step": 238634, "epoch": 1420} {"train_loss": -11.491765022277832, "global_step": 238635, "epoch": 1420} {"train_loss": -11.204584121704102, "global_step": 238636, "epoch": 1420} {"train_loss": -11.771806716918945, "global_step": 238637, "epoch": 1420} {"train_loss": -11.732072830200195, "global_step": 238638, "epoch": 1420} {"train_loss": -11.989187240600586, "global_step": 238639, "epoch": 1420} {"train_loss": -11.804535865783691, "global_step": 238640, "epoch": 1420} {"train_loss": -11.66187858581543, "global_step": 238641, "epoch": 1420} {"train_loss": -11.980009078979492, "global_step": 238642, "epoch": 1420} {"train_loss": -11.591400146484375, "global_step": 238643, "epoch": 1420} {"train_loss": -11.973841667175293, "global_step": 238644, "epoch": 1420} {"train_loss": -11.59231185913086, "global_step": 238645, "epoch": 1420} {"train_loss": -11.115922927856445, "global_step": 238646, "epoch": 1420} {"train_loss": -11.124414443969727, "global_step": 238647, "epoch": 1420} {"train_loss": -11.248022079467773, "global_step": 238648, "epoch": 1420} {"train_loss": -10.81393051147461, "global_step": 238649, "epoch": 1420} {"train_loss": -11.986225128173828, "global_step": 238650, "epoch": 1420} {"train_loss": -11.278162956237793, "global_step": 238651, "epoch": 1420} {"train_loss": -11.916431427001953, "global_step": 238652, "epoch": 1420} {"train_loss": -11.798060417175293, "global_step": 238653, "epoch": 1420} {"train_loss": -11.638496398925781, "global_step": 238654, "epoch": 1420} {"train_loss": -11.503408432006836, "global_step": 238655, "epoch": 1420} {"train_loss": -11.399903297424316, "global_step": 238656, "epoch": 1420} {"train_loss": -10.42082405090332, "global_step": 238657, "epoch": 1420} {"train_loss": -11.905405044555664, "global_step": 238658, "epoch": 1420} {"train_loss": -11.188392639160156, "global_step": 238659, "epoch": 1420} {"train_loss": -11.55355167388916, "global_step": 238660, "epoch": 1420} {"train_loss": -10.959264755249023, "global_step": 238661, "epoch": 1420} {"train_loss": -11.360567092895508, "global_step": 238662, "epoch": 1420} {"train_loss": -11.357955932617188, "global_step": 238663, "epoch": 1420} {"train_loss": -11.245430946350098, "global_step": 238664, "epoch": 1420} {"train_loss": -11.505020141601562, "global_step": 238665, "epoch": 1420} {"train_loss": -11.237579345703125, "global_step": 238666, "epoch": 1420} {"train_loss": -11.643539428710938, "global_step": 238667, "epoch": 1420} {"train_loss": -11.231039047241211, "global_step": 238668, "epoch": 1420} {"train_loss": -11.686331748962402, "global_step": 238669, "epoch": 1420} {"train_loss": -11.44538402557373, "global_step": 238670, "epoch": 1420} {"train_loss": -11.355111122131348, "global_step": 238671, "epoch": 1420} {"train_loss": -11.21476936340332, "global_step": 238672, "epoch": 1420} {"train_loss": -11.244941711425781, "global_step": 238673, "epoch": 1420} {"train_loss": -11.604004859924316, "global_step": 238674, "epoch": 1420} {"train_loss": -11.222099304199219, "global_step": 238675, "epoch": 1420} {"train_loss": -11.228524208068848, "global_step": 238676, "epoch": 1420} {"train_loss": -11.420005798339844, "global_step": 238677, "epoch": 1420} {"train_loss": -11.2919282913208, "global_step": 238678, "epoch": 1420} {"train_loss": -11.632620811462402, "global_step": 238679, "epoch": 1420} {"train_loss": -11.363886833190918, "global_step": 238680, "epoch": 1420} {"train_loss": -10.581403732299805, "global_step": 238681, "epoch": 1420} {"train_loss": -10.65392017364502, "global_step": 238682, "epoch": 1420} {"train_loss": -10.70448112487793, "global_step": 238683, "epoch": 1420} {"train_loss": -10.640917778015137, "global_step": 238684, "epoch": 1420} {"train_loss": -10.899744987487793, "global_step": 238685, "epoch": 1420} {"train_loss": -10.639514923095703, "global_step": 238686, "epoch": 1420} {"train_loss": -11.124876022338867, "global_step": 238687, "epoch": 1420} {"train_loss": -10.525933265686035, "global_step": 238688, "epoch": 1420} {"train_loss": -9.871980667114258, "global_step": 238689, "epoch": 1420} {"train_loss": -11.293882369995117, "global_step": 238690, "epoch": 1420} {"train_loss": -10.767593383789062, "global_step": 238691, "epoch": 1420} {"train_loss": -11.21325397491455, "global_step": 238692, "epoch": 1420} {"train_loss": -11.098140716552734, "global_step": 238693, "epoch": 1420} {"train_loss": -11.31690502166748, "global_step": 238694, "epoch": 1420} {"train_loss": -11.333080291748047, "global_step": 238695, "epoch": 1420} {"train_loss": -11.282670021057129, "global_step": 238696, "epoch": 1420} {"train_loss": -11.396675109863281, "global_step": 238697, "epoch": 1420} {"train_loss": -10.832109451293945, "global_step": 238698, "epoch": 1420} {"train_loss": -11.493608474731445, "global_step": 238699, "epoch": 1420} {"train_loss": -11.335927963256836, "global_step": 238700, "epoch": 1420} {"train_loss": -11.6375732421875, "global_step": 238701, "epoch": 1420} {"train_loss": -11.61316204071045, "global_step": 238702, "epoch": 1420} {"train_loss": -11.545066833496094, "global_step": 238703, "epoch": 1420} {"train_loss": -11.639760971069336, "global_step": 238704, "epoch": 1420} {"train_loss": -11.639091491699219, "global_step": 238705, "epoch": 1420} {"train_loss": -11.635976791381836, "global_step": 238706, "epoch": 1420} {"train_loss": -11.717306137084961, "global_step": 238707, "epoch": 1420} {"train_loss": -11.878870010375977, "global_step": 238708, "epoch": 1420} {"train_loss": -11.686171531677246, "global_step": 238709, "epoch": 1420} {"train_loss": -11.745832443237305, "global_step": 238710, "epoch": 1420} {"train_loss": -11.88309097290039, "global_step": 238711, "epoch": 1420} {"train_loss": -11.97801685333252, "global_step": 238712, "epoch": 1420} {"train_loss": -11.86475944519043, "global_step": 238713, "epoch": 1420} {"train_loss": -12.018397331237793, "global_step": 238714, "epoch": 1420} {"train_loss": -11.882862091064453, "global_step": 238715, "epoch": 1420} {"train_loss": -12.011987686157227, "global_step": 238716, "epoch": 1420} {"train_loss": -11.61741828918457, "global_step": 238717, "epoch": 1420} {"train_loss": -12.143502235412598, "global_step": 238718, "epoch": 1420} {"train_loss": -12.021672248840332, "global_step": 238719, "epoch": 1420} {"train_loss": -11.865180969238281, "global_step": 238720, "epoch": 1420} {"train_loss": -11.873915672302246, "global_step": 238721, "epoch": 1420} {"train_loss": -11.971077919006348, "global_step": 238722, "epoch": 1420} {"train_loss": -11.9510498046875, "global_step": 238723, "epoch": 1420} {"train_loss": -11.90909481048584, "global_step": 238724, "epoch": 1420} {"train_loss": -11.92603874206543, "global_step": 238725, "epoch": 1420} {"train_loss": -12.163067817687988, "global_step": 238726, "epoch": 1420} {"train_loss": -11.519790547234672, "global_step": 238727, "epoch": 1420, "val_loss": 268058.3125, "train_action_mse_error": 1.3536357879638672} {"train_loss": -12.119396209716797, "global_step": 238728, "epoch": 1421} {"train_loss": -12.086529731750488, "global_step": 238729, "epoch": 1421} {"train_loss": -11.969295501708984, "global_step": 238730, "epoch": 1421} {"train_loss": -12.249309539794922, "global_step": 238731, "epoch": 1421} {"train_loss": -12.111090660095215, "global_step": 238732, "epoch": 1421} {"train_loss": -11.964125633239746, "global_step": 238733, "epoch": 1421} {"train_loss": -12.105045318603516, "global_step": 238734, "epoch": 1421} {"train_loss": -12.076723098754883, "global_step": 238735, "epoch": 1421} {"train_loss": -12.283286094665527, "global_step": 238736, "epoch": 1421} {"train_loss": -12.130453109741211, "global_step": 238737, "epoch": 1421} {"train_loss": -12.187943458557129, "global_step": 238738, "epoch": 1421} {"train_loss": -12.000207901000977, "global_step": 238739, "epoch": 1421} {"train_loss": -12.17340087890625, "global_step": 238740, "epoch": 1421} {"train_loss": -12.119569778442383, "global_step": 238741, "epoch": 1421} {"train_loss": -12.296882629394531, "global_step": 238742, "epoch": 1421} {"train_loss": -12.096925735473633, "global_step": 238743, "epoch": 1421} {"train_loss": -12.030946731567383, "global_step": 238744, "epoch": 1421} {"train_loss": -12.219451904296875, "global_step": 238745, "epoch": 1421} {"train_loss": -12.507345199584961, "global_step": 238746, "epoch": 1421} {"train_loss": -12.379571914672852, "global_step": 238747, "epoch": 1421} {"train_loss": -12.162734985351562, "global_step": 238748, "epoch": 1421} {"train_loss": -12.380804061889648, "global_step": 238749, "epoch": 1421} {"train_loss": -11.987497329711914, "global_step": 238750, "epoch": 1421} {"train_loss": -11.228999137878418, "global_step": 238751, "epoch": 1421} {"train_loss": -11.152782440185547, "global_step": 238752, "epoch": 1421} {"train_loss": -11.927656173706055, "global_step": 238753, "epoch": 1421} {"train_loss": -11.543279647827148, "global_step": 238754, "epoch": 1421} {"train_loss": -11.212728500366211, "global_step": 238755, "epoch": 1421} {"train_loss": -11.178630828857422, "global_step": 238756, "epoch": 1421} {"train_loss": -11.876144409179688, "global_step": 238757, "epoch": 1421} {"train_loss": -11.57815170288086, "global_step": 238758, "epoch": 1421} {"train_loss": -11.143030166625977, "global_step": 238759, "epoch": 1421} {"train_loss": -10.59921932220459, "global_step": 238760, "epoch": 1421} {"train_loss": -9.63027572631836, "global_step": 238761, "epoch": 1421} {"train_loss": -10.34016227722168, "global_step": 238762, "epoch": 1421} {"train_loss": -9.751588821411133, "global_step": 238763, "epoch": 1421} {"train_loss": -9.483461380004883, "global_step": 238764, "epoch": 1421} {"train_loss": -7.98485803604126, "global_step": 238765, "epoch": 1421} {"train_loss": -10.075967788696289, "global_step": 238766, "epoch": 1421} {"train_loss": -9.785715103149414, "global_step": 238767, "epoch": 1421} {"train_loss": -9.802556037902832, "global_step": 238768, "epoch": 1421} {"train_loss": -9.907637596130371, "global_step": 238769, "epoch": 1421} {"train_loss": -10.10273551940918, "global_step": 238770, "epoch": 1421} {"train_loss": -10.4216890335083, "global_step": 238771, "epoch": 1421} {"train_loss": -10.098774909973145, "global_step": 238772, "epoch": 1421} {"train_loss": -10.246293067932129, "global_step": 238773, "epoch": 1421} {"train_loss": -8.894693374633789, "global_step": 238774, "epoch": 1421} {"train_loss": -10.380878448486328, "global_step": 238775, "epoch": 1421} {"train_loss": -10.566452026367188, "global_step": 238776, "epoch": 1421} {"train_loss": -9.83018684387207, "global_step": 238777, "epoch": 1421} {"train_loss": -11.140249252319336, "global_step": 238778, "epoch": 1421} {"train_loss": -10.64380931854248, "global_step": 238779, "epoch": 1421} {"train_loss": -11.211740493774414, "global_step": 238780, "epoch": 1421} {"train_loss": -11.02047061920166, "global_step": 238781, "epoch": 1421} {"train_loss": -10.543807029724121, "global_step": 238782, "epoch": 1421} {"train_loss": -10.301335334777832, "global_step": 238783, "epoch": 1421} {"train_loss": -10.753826141357422, "global_step": 238784, "epoch": 1421} {"train_loss": -10.571460723876953, "global_step": 238785, "epoch": 1421} {"train_loss": -10.099798202514648, "global_step": 238786, "epoch": 1421} {"train_loss": -10.829354286193848, "global_step": 238787, "epoch": 1421} {"train_loss": -10.677781105041504, "global_step": 238788, "epoch": 1421} {"train_loss": -11.376998901367188, "global_step": 238789, "epoch": 1421} {"train_loss": -10.426130294799805, "global_step": 238790, "epoch": 1421} {"train_loss": -11.136680603027344, "global_step": 238791, "epoch": 1421} {"train_loss": -11.014375686645508, "global_step": 238792, "epoch": 1421} {"train_loss": -10.901205062866211, "global_step": 238793, "epoch": 1421} {"train_loss": -11.45885181427002, "global_step": 238794, "epoch": 1421} {"train_loss": -10.994322776794434, "global_step": 238795, "epoch": 1421} {"train_loss": -11.384778022766113, "global_step": 238796, "epoch": 1421} {"train_loss": -11.081428527832031, "global_step": 238797, "epoch": 1421} {"train_loss": -11.338727951049805, "global_step": 238798, "epoch": 1421} {"train_loss": -10.875751495361328, "global_step": 238799, "epoch": 1421} {"train_loss": -11.560235977172852, "global_step": 238800, "epoch": 1421} {"train_loss": -10.718852043151855, "global_step": 238801, "epoch": 1421} {"train_loss": -11.519990921020508, "global_step": 238802, "epoch": 1421} {"train_loss": -11.258822441101074, "global_step": 238803, "epoch": 1421} {"train_loss": -11.233678817749023, "global_step": 238804, "epoch": 1421} {"train_loss": -11.120111465454102, "global_step": 238805, "epoch": 1421} {"train_loss": -11.508052825927734, "global_step": 238806, "epoch": 1421} {"train_loss": -11.356124877929688, "global_step": 238807, "epoch": 1421} {"train_loss": -11.600285530090332, "global_step": 238808, "epoch": 1421} {"train_loss": -11.361410140991211, "global_step": 238809, "epoch": 1421} {"train_loss": -11.505975723266602, "global_step": 238810, "epoch": 1421} {"train_loss": -11.379043579101562, "global_step": 238811, "epoch": 1421} {"train_loss": -11.524309158325195, "global_step": 238812, "epoch": 1421} {"train_loss": -11.594169616699219, "global_step": 238813, "epoch": 1421} {"train_loss": -11.341175079345703, "global_step": 238814, "epoch": 1421} {"train_loss": -11.694904327392578, "global_step": 238815, "epoch": 1421} {"train_loss": -11.71554183959961, "global_step": 238816, "epoch": 1421} {"train_loss": -11.495389938354492, "global_step": 238817, "epoch": 1421} {"train_loss": -11.606192588806152, "global_step": 238818, "epoch": 1421} {"train_loss": -11.233352661132812, "global_step": 238819, "epoch": 1421} {"train_loss": -11.57650375366211, "global_step": 238820, "epoch": 1421} {"train_loss": -11.734225273132324, "global_step": 238821, "epoch": 1421} {"train_loss": -11.739442825317383, "global_step": 238822, "epoch": 1421} {"train_loss": -11.820755004882812, "global_step": 238823, "epoch": 1421} {"train_loss": -11.951801300048828, "global_step": 238824, "epoch": 1421} {"train_loss": -11.84939956665039, "global_step": 238825, "epoch": 1421} {"train_loss": -11.839855194091797, "global_step": 238826, "epoch": 1421} {"train_loss": -11.64473819732666, "global_step": 238827, "epoch": 1421} {"train_loss": -11.87213134765625, "global_step": 238828, "epoch": 1421} {"train_loss": -11.746284484863281, "global_step": 238829, "epoch": 1421} {"train_loss": -11.716276168823242, "global_step": 238830, "epoch": 1421} {"train_loss": -11.933130264282227, "global_step": 238831, "epoch": 1421} {"train_loss": -11.924846649169922, "global_step": 238832, "epoch": 1421} {"train_loss": -12.121652603149414, "global_step": 238833, "epoch": 1421} {"train_loss": -11.646565437316895, "global_step": 238834, "epoch": 1421} {"train_loss": -11.840509414672852, "global_step": 238835, "epoch": 1421} {"train_loss": -11.924121856689453, "global_step": 238836, "epoch": 1421} {"train_loss": -12.029302597045898, "global_step": 238837, "epoch": 1421} {"train_loss": -12.074991226196289, "global_step": 238838, "epoch": 1421} {"train_loss": -11.99278450012207, "global_step": 238839, "epoch": 1421} {"train_loss": -11.940319061279297, "global_step": 238840, "epoch": 1421} {"train_loss": -12.050667762756348, "global_step": 238841, "epoch": 1421} {"train_loss": -11.976911544799805, "global_step": 238842, "epoch": 1421} {"train_loss": -12.039231300354004, "global_step": 238843, "epoch": 1421} {"train_loss": -12.009722709655762, "global_step": 238844, "epoch": 1421} {"train_loss": -12.049949645996094, "global_step": 238845, "epoch": 1421} {"train_loss": -12.050868034362793, "global_step": 238846, "epoch": 1421} {"train_loss": -12.064316749572754, "global_step": 238847, "epoch": 1421} {"train_loss": -12.04256820678711, "global_step": 238848, "epoch": 1421} {"train_loss": -12.077601432800293, "global_step": 238849, "epoch": 1421} {"train_loss": -11.831609725952148, "global_step": 238850, "epoch": 1421} {"train_loss": -11.92306900024414, "global_step": 238851, "epoch": 1421} {"train_loss": -11.772229194641113, "global_step": 238852, "epoch": 1421} {"train_loss": -12.212909698486328, "global_step": 238853, "epoch": 1421} {"train_loss": -12.100932121276855, "global_step": 238854, "epoch": 1421} {"train_loss": -12.164968490600586, "global_step": 238855, "epoch": 1421} {"train_loss": -12.100910186767578, "global_step": 238856, "epoch": 1421} {"train_loss": -11.96614933013916, "global_step": 238857, "epoch": 1421} {"train_loss": -12.185522079467773, "global_step": 238858, "epoch": 1421} {"train_loss": -12.000041961669922, "global_step": 238859, "epoch": 1421} {"train_loss": -12.119667053222656, "global_step": 238860, "epoch": 1421} {"train_loss": -12.145858764648438, "global_step": 238861, "epoch": 1421} {"train_loss": -12.12125015258789, "global_step": 238862, "epoch": 1421} {"train_loss": -12.243491172790527, "global_step": 238863, "epoch": 1421} {"train_loss": -12.155135154724121, "global_step": 238864, "epoch": 1421} {"train_loss": -12.150060653686523, "global_step": 238865, "epoch": 1421} {"train_loss": -12.071123123168945, "global_step": 238866, "epoch": 1421} {"train_loss": -12.08576774597168, "global_step": 238867, "epoch": 1421} {"train_loss": -12.178869247436523, "global_step": 238868, "epoch": 1421} {"train_loss": -12.083761215209961, "global_step": 238869, "epoch": 1421} {"train_loss": -12.245748519897461, "global_step": 238870, "epoch": 1421} {"train_loss": -12.113997459411621, "global_step": 238871, "epoch": 1421} {"train_loss": -12.22189712524414, "global_step": 238872, "epoch": 1421} {"train_loss": -12.14600658416748, "global_step": 238873, "epoch": 1421} {"train_loss": -11.979019165039062, "global_step": 238874, "epoch": 1421} {"train_loss": -11.8173828125, "global_step": 238875, "epoch": 1421} {"train_loss": -12.181236267089844, "global_step": 238876, "epoch": 1421} {"train_loss": -12.247570037841797, "global_step": 238877, "epoch": 1421} {"train_loss": -11.924614906311035, "global_step": 238878, "epoch": 1421} {"train_loss": -11.540239334106445, "global_step": 238879, "epoch": 1421} {"train_loss": -12.174148559570312, "global_step": 238880, "epoch": 1421} {"train_loss": -11.382518768310547, "global_step": 238881, "epoch": 1421} {"train_loss": -12.077409744262695, "global_step": 238882, "epoch": 1421} {"train_loss": -11.971435546875, "global_step": 238883, "epoch": 1421} {"train_loss": -11.583470344543457, "global_step": 238884, "epoch": 1421} {"train_loss": -11.269744873046875, "global_step": 238885, "epoch": 1421} {"train_loss": -11.522819519042969, "global_step": 238886, "epoch": 1421} {"train_loss": -10.965052604675293, "global_step": 238887, "epoch": 1421} {"train_loss": -9.77427864074707, "global_step": 238888, "epoch": 1421} {"train_loss": -10.750213623046875, "global_step": 238889, "epoch": 1421} {"train_loss": -10.228734970092773, "global_step": 238890, "epoch": 1421} {"train_loss": -9.79244613647461, "global_step": 238891, "epoch": 1421} {"train_loss": -10.20370864868164, "global_step": 238892, "epoch": 1421} {"train_loss": -10.411624908447266, "global_step": 238893, "epoch": 1421} {"train_loss": -8.229673385620117, "global_step": 238894, "epoch": 1421} {"train_loss": -11.417643737225305, "global_step": 238895, "epoch": 1421, "val_loss": 264819.875} {"train_loss": -10.069133758544922, "global_step": 238896, "epoch": 1422} {"train_loss": -10.359980583190918, "global_step": 238897, "epoch": 1422} {"train_loss": -9.368192672729492, "global_step": 238898, "epoch": 1422} {"train_loss": -11.420671463012695, "global_step": 238899, "epoch": 1422} {"train_loss": -10.173910140991211, "global_step": 238900, "epoch": 1422} {"train_loss": -11.02491283416748, "global_step": 238901, "epoch": 1422} {"train_loss": -10.384086608886719, "global_step": 238902, "epoch": 1422} {"train_loss": -10.779106140136719, "global_step": 238903, "epoch": 1422} {"train_loss": -11.01974868774414, "global_step": 238904, "epoch": 1422} {"train_loss": -9.799280166625977, "global_step": 238905, "epoch": 1422} {"train_loss": -11.105566024780273, "global_step": 238906, "epoch": 1422} {"train_loss": -10.533330917358398, "global_step": 238907, "epoch": 1422} {"train_loss": -10.923606872558594, "global_step": 238908, "epoch": 1422} {"train_loss": -11.252527236938477, "global_step": 238909, "epoch": 1422} {"train_loss": -10.254733085632324, "global_step": 238910, "epoch": 1422} {"train_loss": -11.523345947265625, "global_step": 238911, "epoch": 1422} {"train_loss": -10.714399337768555, "global_step": 238912, "epoch": 1422} {"train_loss": -11.362890243530273, "global_step": 238913, "epoch": 1422} {"train_loss": -11.047334671020508, "global_step": 238914, "epoch": 1422} {"train_loss": -11.28447151184082, "global_step": 238915, "epoch": 1422} {"train_loss": -11.430201530456543, "global_step": 238916, "epoch": 1422} {"train_loss": -11.622299194335938, "global_step": 238917, "epoch": 1422} {"train_loss": -11.303522109985352, "global_step": 238918, "epoch": 1422} {"train_loss": -11.312843322753906, "global_step": 238919, "epoch": 1422} {"train_loss": -11.191410064697266, "global_step": 238920, "epoch": 1422} {"train_loss": -11.363426208496094, "global_step": 238921, "epoch": 1422} {"train_loss": -11.288578033447266, "global_step": 238922, "epoch": 1422} {"train_loss": -11.322357177734375, "global_step": 238923, "epoch": 1422} {"train_loss": -11.209487915039062, "global_step": 238924, "epoch": 1422} {"train_loss": -11.296926498413086, "global_step": 238925, "epoch": 1422} {"train_loss": -11.200691223144531, "global_step": 238926, "epoch": 1422} {"train_loss": -11.279850006103516, "global_step": 238927, "epoch": 1422} {"train_loss": -11.81481647491455, "global_step": 238928, "epoch": 1422} {"train_loss": -11.412714004516602, "global_step": 238929, "epoch": 1422} {"train_loss": -11.558916091918945, "global_step": 238930, "epoch": 1422} {"train_loss": -11.431437492370605, "global_step": 238931, "epoch": 1422} {"train_loss": -11.511112213134766, "global_step": 238932, "epoch": 1422} {"train_loss": -11.271408081054688, "global_step": 238933, "epoch": 1422} {"train_loss": -11.676776885986328, "global_step": 238934, "epoch": 1422} {"train_loss": -11.605698585510254, "global_step": 238935, "epoch": 1422} {"train_loss": -11.438919067382812, "global_step": 238936, "epoch": 1422} {"train_loss": -11.816091537475586, "global_step": 238937, "epoch": 1422} {"train_loss": -11.460577964782715, "global_step": 238938, "epoch": 1422} {"train_loss": -11.553483963012695, "global_step": 238939, "epoch": 1422} {"train_loss": -11.711614608764648, "global_step": 238940, "epoch": 1422} {"train_loss": -11.6456298828125, "global_step": 238941, "epoch": 1422} {"train_loss": -11.53638744354248, "global_step": 238942, "epoch": 1422} {"train_loss": -11.683795928955078, "global_step": 238943, "epoch": 1422} {"train_loss": -11.436053276062012, "global_step": 238944, "epoch": 1422} {"train_loss": -11.758991241455078, "global_step": 238945, "epoch": 1422} {"train_loss": -11.415766716003418, "global_step": 238946, "epoch": 1422} {"train_loss": -11.900195121765137, "global_step": 238947, "epoch": 1422} {"train_loss": -11.666869163513184, "global_step": 238948, "epoch": 1422} {"train_loss": -11.66362476348877, "global_step": 238949, "epoch": 1422} {"train_loss": -11.531597137451172, "global_step": 238950, "epoch": 1422} {"train_loss": -11.544565200805664, "global_step": 238951, "epoch": 1422} {"train_loss": -11.800676345825195, "global_step": 238952, "epoch": 1422} {"train_loss": -11.760948181152344, "global_step": 238953, "epoch": 1422} {"train_loss": -11.667346954345703, "global_step": 238954, "epoch": 1422} {"train_loss": -11.368631362915039, "global_step": 238955, "epoch": 1422} {"train_loss": -11.937767028808594, "global_step": 238956, "epoch": 1422} {"train_loss": -11.574850082397461, "global_step": 238957, "epoch": 1422} {"train_loss": -11.948259353637695, "global_step": 238958, "epoch": 1422} {"train_loss": -11.81343936920166, "global_step": 238959, "epoch": 1422} {"train_loss": -11.578880310058594, "global_step": 238960, "epoch": 1422} {"train_loss": -11.972664833068848, "global_step": 238961, "epoch": 1422} {"train_loss": -11.346454620361328, "global_step": 238962, "epoch": 1422} {"train_loss": -11.694329261779785, "global_step": 238963, "epoch": 1422} {"train_loss": -11.725208282470703, "global_step": 238964, "epoch": 1422} {"train_loss": -11.747042655944824, "global_step": 238965, "epoch": 1422} {"train_loss": -11.695514678955078, "global_step": 238966, "epoch": 1422} {"train_loss": -11.489967346191406, "global_step": 238967, "epoch": 1422} {"train_loss": -11.693563461303711, "global_step": 238968, "epoch": 1422} {"train_loss": -11.680047988891602, "global_step": 238969, "epoch": 1422} {"train_loss": -11.772082328796387, "global_step": 238970, "epoch": 1422} {"train_loss": -11.77530288696289, "global_step": 238971, "epoch": 1422} {"train_loss": -12.07192611694336, "global_step": 238972, "epoch": 1422} {"train_loss": -11.773628234863281, "global_step": 238973, "epoch": 1422} {"train_loss": -11.950971603393555, "global_step": 238974, "epoch": 1422} {"train_loss": -11.541013717651367, "global_step": 238975, "epoch": 1422} {"train_loss": -11.867776870727539, "global_step": 238976, "epoch": 1422} {"train_loss": -11.941607475280762, "global_step": 238977, "epoch": 1422} {"train_loss": -12.03885269165039, "global_step": 238978, "epoch": 1422} {"train_loss": -11.872978210449219, "global_step": 238979, "epoch": 1422} {"train_loss": -11.74020004272461, "global_step": 238980, "epoch": 1422} {"train_loss": -11.73655891418457, "global_step": 238981, "epoch": 1422} {"train_loss": -11.604254722595215, "global_step": 238982, "epoch": 1422} {"train_loss": -11.865923881530762, "global_step": 238983, "epoch": 1422} {"train_loss": -11.684150695800781, "global_step": 238984, "epoch": 1422} {"train_loss": -11.845404624938965, "global_step": 238985, "epoch": 1422} {"train_loss": -11.91722297668457, "global_step": 238986, "epoch": 1422} {"train_loss": -11.563349723815918, "global_step": 238987, "epoch": 1422} {"train_loss": -11.620598793029785, "global_step": 238988, "epoch": 1422} {"train_loss": -11.888578414916992, "global_step": 238989, "epoch": 1422} {"train_loss": -11.154096603393555, "global_step": 238990, "epoch": 1422} {"train_loss": -11.119239807128906, "global_step": 238991, "epoch": 1422} {"train_loss": -11.916498184204102, "global_step": 238992, "epoch": 1422} {"train_loss": -10.253290176391602, "global_step": 238993, "epoch": 1422} {"train_loss": -10.12678337097168, "global_step": 238994, "epoch": 1422} {"train_loss": -10.994418144226074, "global_step": 238995, "epoch": 1422} {"train_loss": -11.429319381713867, "global_step": 238996, "epoch": 1422} {"train_loss": -11.194457054138184, "global_step": 238997, "epoch": 1422} {"train_loss": -10.841794967651367, "global_step": 238998, "epoch": 1422} {"train_loss": -11.022972106933594, "global_step": 238999, "epoch": 1422} {"train_loss": -10.675674438476562, "global_step": 239000, "epoch": 1422} {"train_loss": -11.375703811645508, "global_step": 239001, "epoch": 1422} {"train_loss": -9.42770004272461, "global_step": 239002, "epoch": 1422} {"train_loss": -10.866898536682129, "global_step": 239003, "epoch": 1422} {"train_loss": -10.568994522094727, "global_step": 239004, "epoch": 1422} {"train_loss": -10.07795238494873, "global_step": 239005, "epoch": 1422} {"train_loss": -11.64870834350586, "global_step": 239006, "epoch": 1422} {"train_loss": -10.083881378173828, "global_step": 239007, "epoch": 1422} {"train_loss": -11.411172866821289, "global_step": 239008, "epoch": 1422} {"train_loss": -9.861602783203125, "global_step": 239009, "epoch": 1422} {"train_loss": -11.550830841064453, "global_step": 239010, "epoch": 1422} {"train_loss": -9.739980697631836, "global_step": 239011, "epoch": 1422} {"train_loss": -11.044445037841797, "global_step": 239012, "epoch": 1422} {"train_loss": -9.634725570678711, "global_step": 239013, "epoch": 1422} {"train_loss": -10.943199157714844, "global_step": 239014, "epoch": 1422} {"train_loss": -9.182432174682617, "global_step": 239015, "epoch": 1422} {"train_loss": -10.710321426391602, "global_step": 239016, "epoch": 1422} {"train_loss": -10.703108787536621, "global_step": 239017, "epoch": 1422} {"train_loss": -10.852630615234375, "global_step": 239018, "epoch": 1422} {"train_loss": -10.683673858642578, "global_step": 239019, "epoch": 1422} {"train_loss": -11.0329008102417, "global_step": 239020, "epoch": 1422} {"train_loss": -10.717647552490234, "global_step": 239021, "epoch": 1422} {"train_loss": -11.136469841003418, "global_step": 239022, "epoch": 1422} {"train_loss": -11.566046714782715, "global_step": 239023, "epoch": 1422} {"train_loss": -11.151378631591797, "global_step": 239024, "epoch": 1422} {"train_loss": -11.26388168334961, "global_step": 239025, "epoch": 1422} {"train_loss": -11.347700119018555, "global_step": 239026, "epoch": 1422} {"train_loss": -11.398394584655762, "global_step": 239027, "epoch": 1422} {"train_loss": -11.197330474853516, "global_step": 239028, "epoch": 1422} {"train_loss": -11.638350486755371, "global_step": 239029, "epoch": 1422} {"train_loss": -11.360532760620117, "global_step": 239030, "epoch": 1422} {"train_loss": -11.372830390930176, "global_step": 239031, "epoch": 1422} {"train_loss": -11.409928321838379, "global_step": 239032, "epoch": 1422} {"train_loss": -11.070199012756348, "global_step": 239033, "epoch": 1422} {"train_loss": -11.17879867553711, "global_step": 239034, "epoch": 1422} {"train_loss": -11.505790710449219, "global_step": 239035, "epoch": 1422} {"train_loss": -11.55780029296875, "global_step": 239036, "epoch": 1422} {"train_loss": -11.704792022705078, "global_step": 239037, "epoch": 1422} {"train_loss": -11.313301086425781, "global_step": 239038, "epoch": 1422} {"train_loss": -11.49859619140625, "global_step": 239039, "epoch": 1422} {"train_loss": -11.598808288574219, "global_step": 239040, "epoch": 1422} {"train_loss": -11.555583953857422, "global_step": 239041, "epoch": 1422} {"train_loss": -11.617593765258789, "global_step": 239042, "epoch": 1422} {"train_loss": -11.838939666748047, "global_step": 239043, "epoch": 1422} {"train_loss": -11.536357879638672, "global_step": 239044, "epoch": 1422} {"train_loss": -11.893026351928711, "global_step": 239045, "epoch": 1422} {"train_loss": -11.879331588745117, "global_step": 239046, "epoch": 1422} {"train_loss": -11.848360061645508, "global_step": 239047, "epoch": 1422} {"train_loss": -11.834949493408203, "global_step": 239048, "epoch": 1422} {"train_loss": -11.877354621887207, "global_step": 239049, "epoch": 1422} {"train_loss": -11.727798461914062, "global_step": 239050, "epoch": 1422} {"train_loss": -11.579805374145508, "global_step": 239051, "epoch": 1422} {"train_loss": -11.876190185546875, "global_step": 239052, "epoch": 1422} {"train_loss": -11.8023099899292, "global_step": 239053, "epoch": 1422} {"train_loss": -12.015514373779297, "global_step": 239054, "epoch": 1422} {"train_loss": -11.746312141418457, "global_step": 239055, "epoch": 1422} {"train_loss": -11.845184326171875, "global_step": 239056, "epoch": 1422} {"train_loss": -11.867342948913574, "global_step": 239057, "epoch": 1422} {"train_loss": -11.756647109985352, "global_step": 239058, "epoch": 1422} {"train_loss": -11.730718612670898, "global_step": 239059, "epoch": 1422} {"train_loss": -11.970503807067871, "global_step": 239060, "epoch": 1422} {"train_loss": -11.866271018981934, "global_step": 239061, "epoch": 1422} {"train_loss": -11.98569107055664, "global_step": 239062, "epoch": 1422} {"train_loss": -11.343259720575242, "global_step": 239063, "epoch": 1422, "val_loss": 256699.3125} {"train_loss": -12.055914878845215, "global_step": 239064, "epoch": 1423} {"train_loss": -12.047422409057617, "global_step": 239065, "epoch": 1423} {"train_loss": -11.839117050170898, "global_step": 239066, "epoch": 1423} {"train_loss": -12.153646469116211, "global_step": 239067, "epoch": 1423} {"train_loss": -11.94044303894043, "global_step": 239068, "epoch": 1423} {"train_loss": -11.77107048034668, "global_step": 239069, "epoch": 1423} {"train_loss": -12.116386413574219, "global_step": 239070, "epoch": 1423} {"train_loss": -11.722067832946777, "global_step": 239071, "epoch": 1423} {"train_loss": -11.646536827087402, "global_step": 239072, "epoch": 1423} {"train_loss": -11.994089126586914, "global_step": 239073, "epoch": 1423} {"train_loss": -11.632757186889648, "global_step": 239074, "epoch": 1423} {"train_loss": -12.006136894226074, "global_step": 239075, "epoch": 1423} {"train_loss": -11.982519149780273, "global_step": 239076, "epoch": 1423} {"train_loss": -11.745895385742188, "global_step": 239077, "epoch": 1423} {"train_loss": -11.898063659667969, "global_step": 239078, "epoch": 1423} {"train_loss": -11.844746589660645, "global_step": 239079, "epoch": 1423} {"train_loss": -11.911684036254883, "global_step": 239080, "epoch": 1423} {"train_loss": -12.104532241821289, "global_step": 239081, "epoch": 1423} {"train_loss": -11.461734771728516, "global_step": 239082, "epoch": 1423} {"train_loss": -11.614633560180664, "global_step": 239083, "epoch": 1423} {"train_loss": -12.174092292785645, "global_step": 239084, "epoch": 1423} {"train_loss": -11.720295906066895, "global_step": 239085, "epoch": 1423} {"train_loss": -11.88060188293457, "global_step": 239086, "epoch": 1423} {"train_loss": -12.088921546936035, "global_step": 239087, "epoch": 1423} {"train_loss": -11.98230266571045, "global_step": 239088, "epoch": 1423} {"train_loss": -11.887789726257324, "global_step": 239089, "epoch": 1423} {"train_loss": -11.98611068725586, "global_step": 239090, "epoch": 1423} {"train_loss": -11.87990665435791, "global_step": 239091, "epoch": 1423} {"train_loss": -11.880402565002441, "global_step": 239092, "epoch": 1423} {"train_loss": -12.000823974609375, "global_step": 239093, "epoch": 1423} {"train_loss": -11.799952507019043, "global_step": 239094, "epoch": 1423} {"train_loss": -12.179216384887695, "global_step": 239095, "epoch": 1423} {"train_loss": -11.84024429321289, "global_step": 239096, "epoch": 1423} {"train_loss": -11.654229164123535, "global_step": 239097, "epoch": 1423} {"train_loss": -11.377128601074219, "global_step": 239098, "epoch": 1423} {"train_loss": -12.108609199523926, "global_step": 239099, "epoch": 1423} {"train_loss": -11.589160919189453, "global_step": 239100, "epoch": 1423} {"train_loss": -11.024869918823242, "global_step": 239101, "epoch": 1423} {"train_loss": -11.655561447143555, "global_step": 239102, "epoch": 1423} {"train_loss": -11.696220397949219, "global_step": 239103, "epoch": 1423} {"train_loss": -11.281859397888184, "global_step": 239104, "epoch": 1423} {"train_loss": -11.507835388183594, "global_step": 239105, "epoch": 1423} {"train_loss": -11.408016204833984, "global_step": 239106, "epoch": 1423} {"train_loss": -10.989742279052734, "global_step": 239107, "epoch": 1423} {"train_loss": -11.397782325744629, "global_step": 239108, "epoch": 1423} {"train_loss": -11.387432098388672, "global_step": 239109, "epoch": 1423} {"train_loss": -11.63290023803711, "global_step": 239110, "epoch": 1423} {"train_loss": -11.553667068481445, "global_step": 239111, "epoch": 1423} {"train_loss": -11.723116874694824, "global_step": 239112, "epoch": 1423} {"train_loss": -11.31700325012207, "global_step": 239113, "epoch": 1423} {"train_loss": -11.287797927856445, "global_step": 239114, "epoch": 1423} {"train_loss": -11.820622444152832, "global_step": 239115, "epoch": 1423} {"train_loss": -11.771879196166992, "global_step": 239116, "epoch": 1423} {"train_loss": -11.56048583984375, "global_step": 239117, "epoch": 1423} {"train_loss": -11.34667682647705, "global_step": 239118, "epoch": 1423} {"train_loss": -11.516935348510742, "global_step": 239119, "epoch": 1423} {"train_loss": -11.454243659973145, "global_step": 239120, "epoch": 1423} {"train_loss": -11.82973861694336, "global_step": 239121, "epoch": 1423} {"train_loss": -11.625473976135254, "global_step": 239122, "epoch": 1423} {"train_loss": -11.266226768493652, "global_step": 239123, "epoch": 1423} {"train_loss": -11.322362899780273, "global_step": 239124, "epoch": 1423} {"train_loss": -11.408178329467773, "global_step": 239125, "epoch": 1423} {"train_loss": -11.797035217285156, "global_step": 239126, "epoch": 1423} {"train_loss": -11.710420608520508, "global_step": 239127, "epoch": 1423} {"train_loss": -11.738245010375977, "global_step": 239128, "epoch": 1423} {"train_loss": -11.286819458007812, "global_step": 239129, "epoch": 1423} {"train_loss": -11.93261432647705, "global_step": 239130, "epoch": 1423} {"train_loss": -11.484046936035156, "global_step": 239131, "epoch": 1423} {"train_loss": -11.768007278442383, "global_step": 239132, "epoch": 1423} {"train_loss": -11.580955505371094, "global_step": 239133, "epoch": 1423} {"train_loss": -11.833549499511719, "global_step": 239134, "epoch": 1423} {"train_loss": -12.000616073608398, "global_step": 239135, "epoch": 1423} {"train_loss": -11.720216751098633, "global_step": 239136, "epoch": 1423} {"train_loss": -11.204865455627441, "global_step": 239137, "epoch": 1423} {"train_loss": -11.625317573547363, "global_step": 239138, "epoch": 1423} {"train_loss": -11.199750900268555, "global_step": 239139, "epoch": 1423} {"train_loss": -11.134936332702637, "global_step": 239140, "epoch": 1423} {"train_loss": -11.569823265075684, "global_step": 239141, "epoch": 1423} {"train_loss": -11.37073040008545, "global_step": 239142, "epoch": 1423} {"train_loss": -10.953781127929688, "global_step": 239143, "epoch": 1423} {"train_loss": -11.38535213470459, "global_step": 239144, "epoch": 1423} {"train_loss": -11.53637409210205, "global_step": 239145, "epoch": 1423} {"train_loss": -11.852191925048828, "global_step": 239146, "epoch": 1423} {"train_loss": -11.793516159057617, "global_step": 239147, "epoch": 1423} {"train_loss": -11.858169555664062, "global_step": 239148, "epoch": 1423} {"train_loss": -11.595144271850586, "global_step": 239149, "epoch": 1423} {"train_loss": -11.71402359008789, "global_step": 239150, "epoch": 1423} {"train_loss": -11.625677108764648, "global_step": 239151, "epoch": 1423} {"train_loss": -12.013040542602539, "global_step": 239152, "epoch": 1423} {"train_loss": -11.767000198364258, "global_step": 239153, "epoch": 1423} {"train_loss": -11.564556121826172, "global_step": 239154, "epoch": 1423} {"train_loss": -11.943166732788086, "global_step": 239155, "epoch": 1423} {"train_loss": -11.857653617858887, "global_step": 239156, "epoch": 1423} {"train_loss": -11.686164855957031, "global_step": 239157, "epoch": 1423} {"train_loss": -11.377685546875, "global_step": 239158, "epoch": 1423} {"train_loss": -11.431440353393555, "global_step": 239159, "epoch": 1423} {"train_loss": -11.280437469482422, "global_step": 239160, "epoch": 1423} {"train_loss": -11.652912139892578, "global_step": 239161, "epoch": 1423} {"train_loss": -10.784326553344727, "global_step": 239162, "epoch": 1423} {"train_loss": -10.501441955566406, "global_step": 239163, "epoch": 1423} {"train_loss": -11.363819122314453, "global_step": 239164, "epoch": 1423} {"train_loss": -9.898560523986816, "global_step": 239165, "epoch": 1423} {"train_loss": -9.379680633544922, "global_step": 239166, "epoch": 1423} {"train_loss": -11.248258590698242, "global_step": 239167, "epoch": 1423} {"train_loss": -10.059319496154785, "global_step": 239168, "epoch": 1423} {"train_loss": -11.593181610107422, "global_step": 239169, "epoch": 1423} {"train_loss": -10.88969612121582, "global_step": 239170, "epoch": 1423} {"train_loss": -11.33712387084961, "global_step": 239171, "epoch": 1423} {"train_loss": -10.778164863586426, "global_step": 239172, "epoch": 1423} {"train_loss": -10.5700044631958, "global_step": 239173, "epoch": 1423} {"train_loss": -11.27210807800293, "global_step": 239174, "epoch": 1423} {"train_loss": -11.2011137008667, "global_step": 239175, "epoch": 1423} {"train_loss": -11.738005638122559, "global_step": 239176, "epoch": 1423} {"train_loss": -10.912792205810547, "global_step": 239177, "epoch": 1423} {"train_loss": -11.447269439697266, "global_step": 239178, "epoch": 1423} {"train_loss": -11.362953186035156, "global_step": 239179, "epoch": 1423} {"train_loss": -11.736571311950684, "global_step": 239180, "epoch": 1423} {"train_loss": -11.48159408569336, "global_step": 239181, "epoch": 1423} {"train_loss": -11.633227348327637, "global_step": 239182, "epoch": 1423} {"train_loss": -11.531530380249023, "global_step": 239183, "epoch": 1423} {"train_loss": -11.543638229370117, "global_step": 239184, "epoch": 1423} {"train_loss": -11.672435760498047, "global_step": 239185, "epoch": 1423} {"train_loss": -11.348583221435547, "global_step": 239186, "epoch": 1423} {"train_loss": -11.537555694580078, "global_step": 239187, "epoch": 1423} {"train_loss": -11.124101638793945, "global_step": 239188, "epoch": 1423} {"train_loss": -11.625646591186523, "global_step": 239189, "epoch": 1423} {"train_loss": -11.357181549072266, "global_step": 239190, "epoch": 1423} {"train_loss": -11.483223915100098, "global_step": 239191, "epoch": 1423} {"train_loss": -11.273405075073242, "global_step": 239192, "epoch": 1423} {"train_loss": -11.743446350097656, "global_step": 239193, "epoch": 1423} {"train_loss": -11.362630844116211, "global_step": 239194, "epoch": 1423} {"train_loss": -11.576445579528809, "global_step": 239195, "epoch": 1423} {"train_loss": -11.609817504882812, "global_step": 239196, "epoch": 1423} {"train_loss": -11.459613800048828, "global_step": 239197, "epoch": 1423} {"train_loss": -11.83436393737793, "global_step": 239198, "epoch": 1423} {"train_loss": -11.917744636535645, "global_step": 239199, "epoch": 1423} {"train_loss": -11.808023452758789, "global_step": 239200, "epoch": 1423} {"train_loss": -11.648109436035156, "global_step": 239201, "epoch": 1423} {"train_loss": -11.805809020996094, "global_step": 239202, "epoch": 1423} {"train_loss": -11.883340835571289, "global_step": 239203, "epoch": 1423} {"train_loss": -11.874336242675781, "global_step": 239204, "epoch": 1423} {"train_loss": -11.702603340148926, "global_step": 239205, "epoch": 1423} {"train_loss": -12.081441879272461, "global_step": 239206, "epoch": 1423} {"train_loss": -11.674835205078125, "global_step": 239207, "epoch": 1423} {"train_loss": -12.030000686645508, "global_step": 239208, "epoch": 1423} {"train_loss": -11.683334350585938, "global_step": 239209, "epoch": 1423} {"train_loss": -11.949222564697266, "global_step": 239210, "epoch": 1423} {"train_loss": -12.012580871582031, "global_step": 239211, "epoch": 1423} {"train_loss": -11.950254440307617, "global_step": 239212, "epoch": 1423} {"train_loss": -11.981634140014648, "global_step": 239213, "epoch": 1423} {"train_loss": -11.897151947021484, "global_step": 239214, "epoch": 1423} {"train_loss": -11.81037425994873, "global_step": 239215, "epoch": 1423} {"train_loss": -11.98630428314209, "global_step": 239216, "epoch": 1423} {"train_loss": -11.514474868774414, "global_step": 239217, "epoch": 1423} {"train_loss": -11.665586471557617, "global_step": 239218, "epoch": 1423} {"train_loss": -11.835277557373047, "global_step": 239219, "epoch": 1423} {"train_loss": -11.760337829589844, "global_step": 239220, "epoch": 1423} {"train_loss": -11.866459846496582, "global_step": 239221, "epoch": 1423} {"train_loss": -11.99785041809082, "global_step": 239222, "epoch": 1423} {"train_loss": -11.956304550170898, "global_step": 239223, "epoch": 1423} {"train_loss": -11.896052360534668, "global_step": 239224, "epoch": 1423} {"train_loss": -11.803659439086914, "global_step": 239225, "epoch": 1423} {"train_loss": -12.137134552001953, "global_step": 239226, "epoch": 1423} {"train_loss": -11.749122619628906, "global_step": 239227, "epoch": 1423} {"train_loss": -11.970136642456055, "global_step": 239228, "epoch": 1423} {"train_loss": -11.929149627685547, "global_step": 239229, "epoch": 1423} {"train_loss": -11.448259353637695, "global_step": 239230, "epoch": 1423} {"train_loss": -11.610918203989664, "global_step": 239231, "epoch": 1423, "val_loss": 258621.5} {"train_loss": -12.193073272705078, "global_step": 239232, "epoch": 1424} {"train_loss": -11.741668701171875, "global_step": 239233, "epoch": 1424} {"train_loss": -12.036703109741211, "global_step": 239234, "epoch": 1424} {"train_loss": -12.111998558044434, "global_step": 239235, "epoch": 1424} {"train_loss": -11.754584312438965, "global_step": 239236, "epoch": 1424} {"train_loss": -12.142399787902832, "global_step": 239237, "epoch": 1424} {"train_loss": -11.739391326904297, "global_step": 239238, "epoch": 1424} {"train_loss": -11.113515853881836, "global_step": 239239, "epoch": 1424} {"train_loss": -12.007097244262695, "global_step": 239240, "epoch": 1424} {"train_loss": -11.807588577270508, "global_step": 239241, "epoch": 1424} {"train_loss": -11.16165542602539, "global_step": 239242, "epoch": 1424} {"train_loss": -11.691247940063477, "global_step": 239243, "epoch": 1424} {"train_loss": -11.758169174194336, "global_step": 239244, "epoch": 1424} {"train_loss": -10.511112213134766, "global_step": 239245, "epoch": 1424} {"train_loss": -11.328014373779297, "global_step": 239246, "epoch": 1424} {"train_loss": -11.81010627746582, "global_step": 239247, "epoch": 1424} {"train_loss": -11.413152694702148, "global_step": 239248, "epoch": 1424} {"train_loss": -10.344650268554688, "global_step": 239249, "epoch": 1424} {"train_loss": -11.64642333984375, "global_step": 239250, "epoch": 1424} {"train_loss": -9.925482749938965, "global_step": 239251, "epoch": 1424} {"train_loss": -9.367546081542969, "global_step": 239252, "epoch": 1424} {"train_loss": -8.777128219604492, "global_step": 239253, "epoch": 1424} {"train_loss": -10.657666206359863, "global_step": 239254, "epoch": 1424} {"train_loss": -10.050710678100586, "global_step": 239255, "epoch": 1424} {"train_loss": -10.198448181152344, "global_step": 239256, "epoch": 1424} {"train_loss": -9.974321365356445, "global_step": 239257, "epoch": 1424} {"train_loss": -10.076713562011719, "global_step": 239258, "epoch": 1424} {"train_loss": -10.099306106567383, "global_step": 239259, "epoch": 1424} {"train_loss": -10.809106826782227, "global_step": 239260, "epoch": 1424} {"train_loss": -10.043954849243164, "global_step": 239261, "epoch": 1424} {"train_loss": -10.18211555480957, "global_step": 239262, "epoch": 1424} {"train_loss": -10.100831985473633, "global_step": 239263, "epoch": 1424} {"train_loss": -9.202415466308594, "global_step": 239264, "epoch": 1424} {"train_loss": -9.783830642700195, "global_step": 239265, "epoch": 1424} {"train_loss": -9.143623352050781, "global_step": 239266, "epoch": 1424} {"train_loss": -9.703702926635742, "global_step": 239267, "epoch": 1424} {"train_loss": -10.011528968811035, "global_step": 239268, "epoch": 1424} {"train_loss": -9.557872772216797, "global_step": 239269, "epoch": 1424} {"train_loss": -9.781824111938477, "global_step": 239270, "epoch": 1424} {"train_loss": -10.768991470336914, "global_step": 239271, "epoch": 1424} {"train_loss": -9.156530380249023, "global_step": 239272, "epoch": 1424} {"train_loss": -10.680767059326172, "global_step": 239273, "epoch": 1424} {"train_loss": -10.204483032226562, "global_step": 239274, "epoch": 1424} {"train_loss": -10.3326997756958, "global_step": 239275, "epoch": 1424} {"train_loss": -9.813922882080078, "global_step": 239276, "epoch": 1424} {"train_loss": -11.159870147705078, "global_step": 239277, "epoch": 1424} {"train_loss": -10.031230926513672, "global_step": 239278, "epoch": 1424} {"train_loss": -10.291669845581055, "global_step": 239279, "epoch": 1424} {"train_loss": -10.621612548828125, "global_step": 239280, "epoch": 1424} {"train_loss": -10.751182556152344, "global_step": 239281, "epoch": 1424} {"train_loss": -9.996010780334473, "global_step": 239282, "epoch": 1424} {"train_loss": -11.036080360412598, "global_step": 239283, "epoch": 1424} {"train_loss": -11.002384185791016, "global_step": 239284, "epoch": 1424} {"train_loss": -9.701745986938477, "global_step": 239285, "epoch": 1424} {"train_loss": -10.560892105102539, "global_step": 239286, "epoch": 1424} {"train_loss": -10.978143692016602, "global_step": 239287, "epoch": 1424} {"train_loss": -10.581853866577148, "global_step": 239288, "epoch": 1424} {"train_loss": -10.33815860748291, "global_step": 239289, "epoch": 1424} {"train_loss": -10.412033081054688, "global_step": 239290, "epoch": 1424} {"train_loss": -10.996036529541016, "global_step": 239291, "epoch": 1424} {"train_loss": -10.410751342773438, "global_step": 239292, "epoch": 1424} {"train_loss": -10.776628494262695, "global_step": 239293, "epoch": 1424} {"train_loss": -11.420822143554688, "global_step": 239294, "epoch": 1424} {"train_loss": -10.8084077835083, "global_step": 239295, "epoch": 1424} {"train_loss": -10.774271011352539, "global_step": 239296, "epoch": 1424} {"train_loss": -11.18117618560791, "global_step": 239297, "epoch": 1424} {"train_loss": -10.93170166015625, "global_step": 239298, "epoch": 1424} {"train_loss": -11.445119857788086, "global_step": 239299, "epoch": 1424} {"train_loss": -11.214786529541016, "global_step": 239300, "epoch": 1424} {"train_loss": -11.01806640625, "global_step": 239301, "epoch": 1424} {"train_loss": -11.43582534790039, "global_step": 239302, "epoch": 1424} {"train_loss": -11.342656135559082, "global_step": 239303, "epoch": 1424} {"train_loss": -11.421234130859375, "global_step": 239304, "epoch": 1424} {"train_loss": -11.257843017578125, "global_step": 239305, "epoch": 1424} {"train_loss": -11.263557434082031, "global_step": 239306, "epoch": 1424} {"train_loss": -11.388326644897461, "global_step": 239307, "epoch": 1424} {"train_loss": -11.298720359802246, "global_step": 239308, "epoch": 1424} {"train_loss": -11.312800407409668, "global_step": 239309, "epoch": 1424} {"train_loss": -11.191253662109375, "global_step": 239310, "epoch": 1424} {"train_loss": -11.468667984008789, "global_step": 239311, "epoch": 1424} {"train_loss": -11.569442749023438, "global_step": 239312, "epoch": 1424} {"train_loss": -11.537507057189941, "global_step": 239313, "epoch": 1424} {"train_loss": -11.424118041992188, "global_step": 239314, "epoch": 1424} {"train_loss": -11.364139556884766, "global_step": 239315, "epoch": 1424} {"train_loss": -11.649195671081543, "global_step": 239316, "epoch": 1424} {"train_loss": -11.51102066040039, "global_step": 239317, "epoch": 1424} {"train_loss": -11.488618850708008, "global_step": 239318, "epoch": 1424} {"train_loss": -11.665532112121582, "global_step": 239319, "epoch": 1424} {"train_loss": -11.638646125793457, "global_step": 239320, "epoch": 1424} {"train_loss": -11.444440841674805, "global_step": 239321, "epoch": 1424} {"train_loss": -11.48206901550293, "global_step": 239322, "epoch": 1424} {"train_loss": -11.668859481811523, "global_step": 239323, "epoch": 1424} {"train_loss": -11.635640144348145, "global_step": 239324, "epoch": 1424} {"train_loss": -11.561019897460938, "global_step": 239325, "epoch": 1424} {"train_loss": -11.629792213439941, "global_step": 239326, "epoch": 1424} {"train_loss": -11.81140422821045, "global_step": 239327, "epoch": 1424} {"train_loss": -11.717727661132812, "global_step": 239328, "epoch": 1424} {"train_loss": -11.724214553833008, "global_step": 239329, "epoch": 1424} {"train_loss": -11.648056030273438, "global_step": 239330, "epoch": 1424} {"train_loss": -11.748393058776855, "global_step": 239331, "epoch": 1424} {"train_loss": -11.59708023071289, "global_step": 239332, "epoch": 1424} {"train_loss": -11.830611228942871, "global_step": 239333, "epoch": 1424} {"train_loss": -11.902128219604492, "global_step": 239334, "epoch": 1424} {"train_loss": -11.958319664001465, "global_step": 239335, "epoch": 1424} {"train_loss": -11.91366195678711, "global_step": 239336, "epoch": 1424} {"train_loss": -11.862960815429688, "global_step": 239337, "epoch": 1424} {"train_loss": -11.848465919494629, "global_step": 239338, "epoch": 1424} {"train_loss": -11.751394271850586, "global_step": 239339, "epoch": 1424} {"train_loss": -11.93404769897461, "global_step": 239340, "epoch": 1424} {"train_loss": -11.917020797729492, "global_step": 239341, "epoch": 1424} {"train_loss": -11.822284698486328, "global_step": 239342, "epoch": 1424} {"train_loss": -11.960037231445312, "global_step": 239343, "epoch": 1424} {"train_loss": -11.867695808410645, "global_step": 239344, "epoch": 1424} {"train_loss": -11.9171142578125, "global_step": 239345, "epoch": 1424} {"train_loss": -11.933916091918945, "global_step": 239346, "epoch": 1424} {"train_loss": -12.060935020446777, "global_step": 239347, "epoch": 1424} {"train_loss": -12.0359525680542, "global_step": 239348, "epoch": 1424} {"train_loss": -11.971382141113281, "global_step": 239349, "epoch": 1424} {"train_loss": -12.132303237915039, "global_step": 239350, "epoch": 1424} {"train_loss": -11.950181007385254, "global_step": 239351, "epoch": 1424} {"train_loss": -12.068001747131348, "global_step": 239352, "epoch": 1424} {"train_loss": -11.939704895019531, "global_step": 239353, "epoch": 1424} {"train_loss": -11.963199615478516, "global_step": 239354, "epoch": 1424} {"train_loss": -12.099574089050293, "global_step": 239355, "epoch": 1424} {"train_loss": -11.975611686706543, "global_step": 239356, "epoch": 1424} {"train_loss": -12.027399063110352, "global_step": 239357, "epoch": 1424} {"train_loss": -12.156333923339844, "global_step": 239358, "epoch": 1424} {"train_loss": -11.886173248291016, "global_step": 239359, "epoch": 1424} {"train_loss": -11.985427856445312, "global_step": 239360, "epoch": 1424} {"train_loss": -11.759401321411133, "global_step": 239361, "epoch": 1424} {"train_loss": -12.229755401611328, "global_step": 239362, "epoch": 1424} {"train_loss": -12.024425506591797, "global_step": 239363, "epoch": 1424} {"train_loss": -12.017654418945312, "global_step": 239364, "epoch": 1424} {"train_loss": -12.073247909545898, "global_step": 239365, "epoch": 1424} {"train_loss": -11.850652694702148, "global_step": 239366, "epoch": 1424} {"train_loss": -12.040029525756836, "global_step": 239367, "epoch": 1424} {"train_loss": -11.893016815185547, "global_step": 239368, "epoch": 1424} {"train_loss": -12.03908920288086, "global_step": 239369, "epoch": 1424} {"train_loss": -12.00638484954834, "global_step": 239370, "epoch": 1424} {"train_loss": -11.941766738891602, "global_step": 239371, "epoch": 1424} {"train_loss": -11.959118843078613, "global_step": 239372, "epoch": 1424} {"train_loss": -11.97835922241211, "global_step": 239373, "epoch": 1424} {"train_loss": -11.727604866027832, "global_step": 239374, "epoch": 1424} {"train_loss": -12.081071853637695, "global_step": 239375, "epoch": 1424} {"train_loss": -11.946311950683594, "global_step": 239376, "epoch": 1424} {"train_loss": -12.057376861572266, "global_step": 239377, "epoch": 1424} {"train_loss": -11.999658584594727, "global_step": 239378, "epoch": 1424} {"train_loss": -12.172578811645508, "global_step": 239379, "epoch": 1424} {"train_loss": -12.331789016723633, "global_step": 239380, "epoch": 1424} {"train_loss": -12.31939697265625, "global_step": 239381, "epoch": 1424} {"train_loss": -12.025729179382324, "global_step": 239382, "epoch": 1424} {"train_loss": -12.145033836364746, "global_step": 239383, "epoch": 1424} {"train_loss": -12.30438232421875, "global_step": 239384, "epoch": 1424} {"train_loss": -12.038222312927246, "global_step": 239385, "epoch": 1424} {"train_loss": -11.76659107208252, "global_step": 239386, "epoch": 1424} {"train_loss": -11.683722496032715, "global_step": 239387, "epoch": 1424} {"train_loss": -12.2675142288208, "global_step": 239388, "epoch": 1424} {"train_loss": -11.737189292907715, "global_step": 239389, "epoch": 1424} {"train_loss": -10.93195915222168, "global_step": 239390, "epoch": 1424} {"train_loss": -9.918179512023926, "global_step": 239391, "epoch": 1424} {"train_loss": -10.626044273376465, "global_step": 239392, "epoch": 1424} {"train_loss": -11.724739074707031, "global_step": 239393, "epoch": 1424} {"train_loss": -11.951982498168945, "global_step": 239394, "epoch": 1424} {"train_loss": -10.781156539916992, "global_step": 239395, "epoch": 1424} {"train_loss": -10.977439880371094, "global_step": 239396, "epoch": 1424} {"train_loss": -11.678323745727539, "global_step": 239397, "epoch": 1424} {"train_loss": -10.314737319946289, "global_step": 239398, "epoch": 1424} {"train_loss": -11.284172058105469, "global_step": 239399, "epoch": 1424, "val_loss": 260948.28125} {"train_loss": -11.34593391418457, "global_step": 239400, "epoch": 1425} {"train_loss": -11.070858001708984, "global_step": 239401, "epoch": 1425} {"train_loss": -10.727081298828125, "global_step": 239402, "epoch": 1425} {"train_loss": -10.732417106628418, "global_step": 239403, "epoch": 1425} {"train_loss": -11.571737289428711, "global_step": 239404, "epoch": 1425} {"train_loss": -10.694942474365234, "global_step": 239405, "epoch": 1425} {"train_loss": -11.28498363494873, "global_step": 239406, "epoch": 1425} {"train_loss": -11.348370552062988, "global_step": 239407, "epoch": 1425} {"train_loss": -11.278799057006836, "global_step": 239408, "epoch": 1425} {"train_loss": -11.867813110351562, "global_step": 239409, "epoch": 1425} {"train_loss": -10.468415260314941, "global_step": 239410, "epoch": 1425} {"train_loss": -10.046356201171875, "global_step": 239411, "epoch": 1425} {"train_loss": -11.294418334960938, "global_step": 239412, "epoch": 1425} {"train_loss": -9.691466331481934, "global_step": 239413, "epoch": 1425} {"train_loss": -8.700567245483398, "global_step": 239414, "epoch": 1425} {"train_loss": -9.292854309082031, "global_step": 239415, "epoch": 1425} {"train_loss": -10.39068603515625, "global_step": 239416, "epoch": 1425} {"train_loss": -9.444024085998535, "global_step": 239417, "epoch": 1425} {"train_loss": -9.229517936706543, "global_step": 239418, "epoch": 1425} {"train_loss": -10.876596450805664, "global_step": 239419, "epoch": 1425} {"train_loss": -10.692438125610352, "global_step": 239420, "epoch": 1425} {"train_loss": -9.789239883422852, "global_step": 239421, "epoch": 1425} {"train_loss": -10.725906372070312, "global_step": 239422, "epoch": 1425} {"train_loss": -10.874914169311523, "global_step": 239423, "epoch": 1425} {"train_loss": -10.011213302612305, "global_step": 239424, "epoch": 1425} {"train_loss": -10.949193954467773, "global_step": 239425, "epoch": 1425} {"train_loss": -10.452038764953613, "global_step": 239426, "epoch": 1425} {"train_loss": -10.610760688781738, "global_step": 239427, "epoch": 1425} {"train_loss": -10.710744857788086, "global_step": 239428, "epoch": 1425} {"train_loss": -10.23503589630127, "global_step": 239429, "epoch": 1425} {"train_loss": -11.298025131225586, "global_step": 239430, "epoch": 1425} {"train_loss": -10.895549774169922, "global_step": 239431, "epoch": 1425} {"train_loss": -11.100266456604004, "global_step": 239432, "epoch": 1425} {"train_loss": -11.211857795715332, "global_step": 239433, "epoch": 1425} {"train_loss": -10.904115676879883, "global_step": 239434, "epoch": 1425} {"train_loss": -11.341565132141113, "global_step": 239435, "epoch": 1425} {"train_loss": -11.027437210083008, "global_step": 239436, "epoch": 1425} {"train_loss": -11.106438636779785, "global_step": 239437, "epoch": 1425} {"train_loss": -11.472329139709473, "global_step": 239438, "epoch": 1425} {"train_loss": -10.809891700744629, "global_step": 239439, "epoch": 1425} {"train_loss": -11.322547912597656, "global_step": 239440, "epoch": 1425} {"train_loss": -11.342912673950195, "global_step": 239441, "epoch": 1425} {"train_loss": -11.129913330078125, "global_step": 239442, "epoch": 1425} {"train_loss": -11.469819068908691, "global_step": 239443, "epoch": 1425} {"train_loss": -11.423456192016602, "global_step": 239444, "epoch": 1425} {"train_loss": -11.081960678100586, "global_step": 239445, "epoch": 1425} {"train_loss": -11.553544998168945, "global_step": 239446, "epoch": 1425} {"train_loss": -11.275588989257812, "global_step": 239447, "epoch": 1425} {"train_loss": -11.427322387695312, "global_step": 239448, "epoch": 1425} {"train_loss": -11.653717041015625, "global_step": 239449, "epoch": 1425} {"train_loss": -11.488090515136719, "global_step": 239450, "epoch": 1425} {"train_loss": -11.673009872436523, "global_step": 239451, "epoch": 1425} {"train_loss": -11.682830810546875, "global_step": 239452, "epoch": 1425} {"train_loss": -11.341489791870117, "global_step": 239453, "epoch": 1425} {"train_loss": -11.504107475280762, "global_step": 239454, "epoch": 1425} {"train_loss": -11.569811820983887, "global_step": 239455, "epoch": 1425} {"train_loss": -11.607719421386719, "global_step": 239456, "epoch": 1425} {"train_loss": -11.87043571472168, "global_step": 239457, "epoch": 1425} {"train_loss": -11.886190414428711, "global_step": 239458, "epoch": 1425} {"train_loss": -11.371482849121094, "global_step": 239459, "epoch": 1425} {"train_loss": -11.387741088867188, "global_step": 239460, "epoch": 1425} {"train_loss": -11.448090553283691, "global_step": 239461, "epoch": 1425} {"train_loss": -11.455962181091309, "global_step": 239462, "epoch": 1425} {"train_loss": -11.469930648803711, "global_step": 239463, "epoch": 1425} {"train_loss": -11.472400665283203, "global_step": 239464, "epoch": 1425} {"train_loss": -11.899686813354492, "global_step": 239465, "epoch": 1425} {"train_loss": -11.364093780517578, "global_step": 239466, "epoch": 1425} {"train_loss": -11.927789688110352, "global_step": 239467, "epoch": 1425} {"train_loss": -11.413263320922852, "global_step": 239468, "epoch": 1425} {"train_loss": -11.766639709472656, "global_step": 239469, "epoch": 1425} {"train_loss": -11.041391372680664, "global_step": 239470, "epoch": 1425} {"train_loss": -11.803984642028809, "global_step": 239471, "epoch": 1425} {"train_loss": -11.542913436889648, "global_step": 239472, "epoch": 1425} {"train_loss": -11.555170059204102, "global_step": 239473, "epoch": 1425} {"train_loss": -11.678058624267578, "global_step": 239474, "epoch": 1425} {"train_loss": -11.554298400878906, "global_step": 239475, "epoch": 1425} {"train_loss": -11.692258834838867, "global_step": 239476, "epoch": 1425} {"train_loss": -11.659343719482422, "global_step": 239477, "epoch": 1425} {"train_loss": -11.464710235595703, "global_step": 239478, "epoch": 1425} {"train_loss": -11.535173416137695, "global_step": 239479, "epoch": 1425} {"train_loss": -11.687484741210938, "global_step": 239480, "epoch": 1425} {"train_loss": -11.703147888183594, "global_step": 239481, "epoch": 1425} {"train_loss": -11.573424339294434, "global_step": 239482, "epoch": 1425} {"train_loss": -11.80710220336914, "global_step": 239483, "epoch": 1425} {"train_loss": -11.65523624420166, "global_step": 239484, "epoch": 1425} {"train_loss": -11.73039436340332, "global_step": 239485, "epoch": 1425} {"train_loss": -11.943033218383789, "global_step": 239486, "epoch": 1425} {"train_loss": -11.806007385253906, "global_step": 239487, "epoch": 1425} {"train_loss": -11.965885162353516, "global_step": 239488, "epoch": 1425} {"train_loss": -11.985359191894531, "global_step": 239489, "epoch": 1425} {"train_loss": -12.051156044006348, "global_step": 239490, "epoch": 1425} {"train_loss": -11.772829055786133, "global_step": 239491, "epoch": 1425} {"train_loss": -12.0678071975708, "global_step": 239492, "epoch": 1425} {"train_loss": -11.496554374694824, "global_step": 239493, "epoch": 1425} {"train_loss": -11.910447120666504, "global_step": 239494, "epoch": 1425} {"train_loss": -11.6820707321167, "global_step": 239495, "epoch": 1425} {"train_loss": -11.853260040283203, "global_step": 239496, "epoch": 1425} {"train_loss": -11.81939697265625, "global_step": 239497, "epoch": 1425} {"train_loss": -12.0276517868042, "global_step": 239498, "epoch": 1425} {"train_loss": -11.697399139404297, "global_step": 239499, "epoch": 1425} {"train_loss": -11.913236618041992, "global_step": 239500, "epoch": 1425} {"train_loss": -12.136245727539062, "global_step": 239501, "epoch": 1425} {"train_loss": -11.783875465393066, "global_step": 239502, "epoch": 1425} {"train_loss": -12.225448608398438, "global_step": 239503, "epoch": 1425} {"train_loss": -11.834457397460938, "global_step": 239504, "epoch": 1425} {"train_loss": -12.171957969665527, "global_step": 239505, "epoch": 1425} {"train_loss": -12.03026008605957, "global_step": 239506, "epoch": 1425} {"train_loss": -11.775673866271973, "global_step": 239507, "epoch": 1425} {"train_loss": -11.83678913116455, "global_step": 239508, "epoch": 1425} {"train_loss": -11.905885696411133, "global_step": 239509, "epoch": 1425} {"train_loss": -12.019210815429688, "global_step": 239510, "epoch": 1425} {"train_loss": -11.978303909301758, "global_step": 239511, "epoch": 1425} {"train_loss": -12.158618927001953, "global_step": 239512, "epoch": 1425} {"train_loss": -12.019017219543457, "global_step": 239513, "epoch": 1425} {"train_loss": -12.25918197631836, "global_step": 239514, "epoch": 1425} {"train_loss": -12.046028137207031, "global_step": 239515, "epoch": 1425} {"train_loss": -12.029489517211914, "global_step": 239516, "epoch": 1425} {"train_loss": -11.961297988891602, "global_step": 239517, "epoch": 1425} {"train_loss": -11.93167495727539, "global_step": 239518, "epoch": 1425} {"train_loss": -12.051483154296875, "global_step": 239519, "epoch": 1425} {"train_loss": -12.1145601272583, "global_step": 239520, "epoch": 1425} {"train_loss": -12.081432342529297, "global_step": 239521, "epoch": 1425} {"train_loss": -12.081016540527344, "global_step": 239522, "epoch": 1425} {"train_loss": -11.87198257446289, "global_step": 239523, "epoch": 1425} {"train_loss": -11.631831169128418, "global_step": 239524, "epoch": 1425} {"train_loss": -11.75008773803711, "global_step": 239525, "epoch": 1425} {"train_loss": -11.806700706481934, "global_step": 239526, "epoch": 1425} {"train_loss": -11.914676666259766, "global_step": 239527, "epoch": 1425} {"train_loss": -11.887660026550293, "global_step": 239528, "epoch": 1425} {"train_loss": -11.846532821655273, "global_step": 239529, "epoch": 1425} {"train_loss": -11.309849739074707, "global_step": 239530, "epoch": 1425} {"train_loss": -12.031047821044922, "global_step": 239531, "epoch": 1425} {"train_loss": -11.662544250488281, "global_step": 239532, "epoch": 1425} {"train_loss": -11.191191673278809, "global_step": 239533, "epoch": 1425} {"train_loss": -10.901300430297852, "global_step": 239534, "epoch": 1425} {"train_loss": -11.397871017456055, "global_step": 239535, "epoch": 1425} {"train_loss": -9.04880142211914, "global_step": 239536, "epoch": 1425} {"train_loss": -10.308110237121582, "global_step": 239537, "epoch": 1425} {"train_loss": -10.906535148620605, "global_step": 239538, "epoch": 1425} {"train_loss": -8.790242195129395, "global_step": 239539, "epoch": 1425} {"train_loss": -10.799009323120117, "global_step": 239540, "epoch": 1425} {"train_loss": -9.45479965209961, "global_step": 239541, "epoch": 1425} {"train_loss": -10.097768783569336, "global_step": 239542, "epoch": 1425} {"train_loss": -9.733978271484375, "global_step": 239543, "epoch": 1425} {"train_loss": -10.141803741455078, "global_step": 239544, "epoch": 1425} {"train_loss": -9.123763084411621, "global_step": 239545, "epoch": 1425} {"train_loss": -9.564281463623047, "global_step": 239546, "epoch": 1425} {"train_loss": -9.173491477966309, "global_step": 239547, "epoch": 1425} {"train_loss": -9.594870567321777, "global_step": 239548, "epoch": 1425} {"train_loss": -7.824219703674316, "global_step": 239549, "epoch": 1425} {"train_loss": -8.187053680419922, "global_step": 239550, "epoch": 1425} {"train_loss": -8.845901489257812, "global_step": 239551, "epoch": 1425} {"train_loss": -6.892897605895996, "global_step": 239552, "epoch": 1425} {"train_loss": -7.261188983917236, "global_step": 239553, "epoch": 1425} {"train_loss": -7.84735107421875, "global_step": 239554, "epoch": 1425} {"train_loss": -8.748302459716797, "global_step": 239555, "epoch": 1425} {"train_loss": -6.79017448425293, "global_step": 239556, "epoch": 1425} {"train_loss": -7.40177583694458, "global_step": 239557, "epoch": 1425} {"train_loss": -9.339197158813477, "global_step": 239558, "epoch": 1425} {"train_loss": -7.489452362060547, "global_step": 239559, "epoch": 1425} {"train_loss": -8.48910903930664, "global_step": 239560, "epoch": 1425} {"train_loss": -10.68658447265625, "global_step": 239561, "epoch": 1425} {"train_loss": -9.167951583862305, "global_step": 239562, "epoch": 1425} {"train_loss": -9.08287239074707, "global_step": 239563, "epoch": 1425} {"train_loss": -10.224528312683105, "global_step": 239564, "epoch": 1425} {"train_loss": -9.75100040435791, "global_step": 239565, "epoch": 1425} {"train_loss": -9.654333114624023, "global_step": 239566, "epoch": 1425} {"train_loss": -10.967437658991132, "global_step": 239567, "epoch": 1425, "val_loss": 262270.375, "train_action_mse_error": 10.4635009765625} {"train_loss": -9.886120796203613, "global_step": 239568, "epoch": 1426} {"train_loss": -9.99083137512207, "global_step": 239569, "epoch": 1426} {"train_loss": -10.189266204833984, "global_step": 239570, "epoch": 1426} {"train_loss": -9.830941200256348, "global_step": 239571, "epoch": 1426} {"train_loss": -10.265188217163086, "global_step": 239572, "epoch": 1426} {"train_loss": -11.004072189331055, "global_step": 239573, "epoch": 1426} {"train_loss": -10.068548202514648, "global_step": 239574, "epoch": 1426} {"train_loss": -10.252326965332031, "global_step": 239575, "epoch": 1426} {"train_loss": -10.77409553527832, "global_step": 239576, "epoch": 1426} {"train_loss": -10.188102722167969, "global_step": 239577, "epoch": 1426} {"train_loss": -10.419856071472168, "global_step": 239578, "epoch": 1426} {"train_loss": -10.88553237915039, "global_step": 239579, "epoch": 1426} {"train_loss": -10.261404037475586, "global_step": 239580, "epoch": 1426} {"train_loss": -10.838166236877441, "global_step": 239581, "epoch": 1426} {"train_loss": -10.873476028442383, "global_step": 239582, "epoch": 1426} {"train_loss": -10.287881851196289, "global_step": 239583, "epoch": 1426} {"train_loss": -10.05913257598877, "global_step": 239584, "epoch": 1426} {"train_loss": -11.24036979675293, "global_step": 239585, "epoch": 1426} {"train_loss": -10.622637748718262, "global_step": 239586, "epoch": 1426} {"train_loss": -10.01315975189209, "global_step": 239587, "epoch": 1426} {"train_loss": -10.6478271484375, "global_step": 239588, "epoch": 1426} {"train_loss": -11.077590942382812, "global_step": 239589, "epoch": 1426} {"train_loss": -10.601005554199219, "global_step": 239590, "epoch": 1426} {"train_loss": -10.548067092895508, "global_step": 239591, "epoch": 1426} {"train_loss": -10.960125923156738, "global_step": 239592, "epoch": 1426} {"train_loss": -10.707481384277344, "global_step": 239593, "epoch": 1426} {"train_loss": -11.057283401489258, "global_step": 239594, "epoch": 1426} {"train_loss": -11.259039878845215, "global_step": 239595, "epoch": 1426} {"train_loss": -10.77841567993164, "global_step": 239596, "epoch": 1426} {"train_loss": -10.849663734436035, "global_step": 239597, "epoch": 1426} {"train_loss": -11.20916748046875, "global_step": 239598, "epoch": 1426} {"train_loss": -11.374719619750977, "global_step": 239599, "epoch": 1426} {"train_loss": -11.140812873840332, "global_step": 239600, "epoch": 1426} {"train_loss": -11.10421371459961, "global_step": 239601, "epoch": 1426} {"train_loss": -11.265058517456055, "global_step": 239602, "epoch": 1426} {"train_loss": -11.276641845703125, "global_step": 239603, "epoch": 1426} {"train_loss": -11.245367050170898, "global_step": 239604, "epoch": 1426} {"train_loss": -11.269309043884277, "global_step": 239605, "epoch": 1426} {"train_loss": -11.23193645477295, "global_step": 239606, "epoch": 1426} {"train_loss": -11.342832565307617, "global_step": 239607, "epoch": 1426} {"train_loss": -11.424591064453125, "global_step": 239608, "epoch": 1426} {"train_loss": -11.507461547851562, "global_step": 239609, "epoch": 1426} {"train_loss": -11.373615264892578, "global_step": 239610, "epoch": 1426} {"train_loss": -11.415034294128418, "global_step": 239611, "epoch": 1426} {"train_loss": -11.256641387939453, "global_step": 239612, "epoch": 1426} {"train_loss": -11.392711639404297, "global_step": 239613, "epoch": 1426} {"train_loss": -11.383391380310059, "global_step": 239614, "epoch": 1426} {"train_loss": -11.545156478881836, "global_step": 239615, "epoch": 1426} {"train_loss": -11.413214683532715, "global_step": 239616, "epoch": 1426} {"train_loss": -11.63087272644043, "global_step": 239617, "epoch": 1426} {"train_loss": -11.461570739746094, "global_step": 239618, "epoch": 1426} {"train_loss": -11.504631042480469, "global_step": 239619, "epoch": 1426} {"train_loss": -11.535208702087402, "global_step": 239620, "epoch": 1426} {"train_loss": -11.567883491516113, "global_step": 239621, "epoch": 1426} {"train_loss": -11.565666198730469, "global_step": 239622, "epoch": 1426} {"train_loss": -11.607168197631836, "global_step": 239623, "epoch": 1426} {"train_loss": -11.677189826965332, "global_step": 239624, "epoch": 1426} {"train_loss": -11.485061645507812, "global_step": 239625, "epoch": 1426} {"train_loss": -11.468981742858887, "global_step": 239626, "epoch": 1426} {"train_loss": -11.446290969848633, "global_step": 239627, "epoch": 1426} {"train_loss": -11.631650924682617, "global_step": 239628, "epoch": 1426} {"train_loss": -11.62255573272705, "global_step": 239629, "epoch": 1426} {"train_loss": -11.795116424560547, "global_step": 239630, "epoch": 1426} {"train_loss": -11.502586364746094, "global_step": 239631, "epoch": 1426} {"train_loss": -11.727121353149414, "global_step": 239632, "epoch": 1426} {"train_loss": -11.839805603027344, "global_step": 239633, "epoch": 1426} {"train_loss": -11.72435188293457, "global_step": 239634, "epoch": 1426} {"train_loss": -11.825927734375, "global_step": 239635, "epoch": 1426} {"train_loss": -11.795217514038086, "global_step": 239636, "epoch": 1426} {"train_loss": -11.651689529418945, "global_step": 239637, "epoch": 1426} {"train_loss": -11.560951232910156, "global_step": 239638, "epoch": 1426} {"train_loss": -11.830636978149414, "global_step": 239639, "epoch": 1426} {"train_loss": -11.533123016357422, "global_step": 239640, "epoch": 1426} {"train_loss": -11.80986213684082, "global_step": 239641, "epoch": 1426} {"train_loss": -11.804374694824219, "global_step": 239642, "epoch": 1426} {"train_loss": -11.913278579711914, "global_step": 239643, "epoch": 1426} {"train_loss": -11.865385055541992, "global_step": 239644, "epoch": 1426} {"train_loss": -11.800650596618652, "global_step": 239645, "epoch": 1426} {"train_loss": -11.703458786010742, "global_step": 239646, "epoch": 1426} {"train_loss": -12.009373664855957, "global_step": 239647, "epoch": 1426} {"train_loss": -12.02016544342041, "global_step": 239648, "epoch": 1426} {"train_loss": -11.871381759643555, "global_step": 239649, "epoch": 1426} {"train_loss": -11.729776382446289, "global_step": 239650, "epoch": 1426} {"train_loss": -11.668275833129883, "global_step": 239651, "epoch": 1426} {"train_loss": -11.88933277130127, "global_step": 239652, "epoch": 1426} {"train_loss": -11.901402473449707, "global_step": 239653, "epoch": 1426} {"train_loss": -11.853554725646973, "global_step": 239654, "epoch": 1426} {"train_loss": -11.996682167053223, "global_step": 239655, "epoch": 1426} {"train_loss": -11.324037551879883, "global_step": 239656, "epoch": 1426} {"train_loss": -11.807732582092285, "global_step": 239657, "epoch": 1426} {"train_loss": -11.820592880249023, "global_step": 239658, "epoch": 1426} {"train_loss": -11.894946098327637, "global_step": 239659, "epoch": 1426} {"train_loss": -11.71500015258789, "global_step": 239660, "epoch": 1426} {"train_loss": -10.99340534210205, "global_step": 239661, "epoch": 1426} {"train_loss": -10.97632884979248, "global_step": 239662, "epoch": 1426} {"train_loss": -11.869926452636719, "global_step": 239663, "epoch": 1426} {"train_loss": -10.871330261230469, "global_step": 239664, "epoch": 1426} {"train_loss": -10.366863250732422, "global_step": 239665, "epoch": 1426} {"train_loss": -11.051844596862793, "global_step": 239666, "epoch": 1426} {"train_loss": -11.467737197875977, "global_step": 239667, "epoch": 1426} {"train_loss": -10.518068313598633, "global_step": 239668, "epoch": 1426} {"train_loss": -10.587970733642578, "global_step": 239669, "epoch": 1426} {"train_loss": -11.275650024414062, "global_step": 239670, "epoch": 1426} {"train_loss": -10.880094528198242, "global_step": 239671, "epoch": 1426} {"train_loss": -10.467040061950684, "global_step": 239672, "epoch": 1426} {"train_loss": -11.731427192687988, "global_step": 239673, "epoch": 1426} {"train_loss": -11.514628410339355, "global_step": 239674, "epoch": 1426} {"train_loss": -11.578542709350586, "global_step": 239675, "epoch": 1426} {"train_loss": -11.808534622192383, "global_step": 239676, "epoch": 1426} {"train_loss": -11.351548194885254, "global_step": 239677, "epoch": 1426} {"train_loss": -10.648359298706055, "global_step": 239678, "epoch": 1426} {"train_loss": -11.716952323913574, "global_step": 239679, "epoch": 1426} {"train_loss": -10.968586921691895, "global_step": 239680, "epoch": 1426} {"train_loss": -11.128430366516113, "global_step": 239681, "epoch": 1426} {"train_loss": -11.500925064086914, "global_step": 239682, "epoch": 1426} {"train_loss": -10.775656700134277, "global_step": 239683, "epoch": 1426} {"train_loss": -11.597835540771484, "global_step": 239684, "epoch": 1426} {"train_loss": -11.183258056640625, "global_step": 239685, "epoch": 1426} {"train_loss": -10.61104965209961, "global_step": 239686, "epoch": 1426} {"train_loss": -11.65258502960205, "global_step": 239687, "epoch": 1426} {"train_loss": -11.506474494934082, "global_step": 239688, "epoch": 1426} {"train_loss": -11.01595687866211, "global_step": 239689, "epoch": 1426} {"train_loss": -11.34117317199707, "global_step": 239690, "epoch": 1426} {"train_loss": -11.488687515258789, "global_step": 239691, "epoch": 1426} {"train_loss": -11.552925109863281, "global_step": 239692, "epoch": 1426} {"train_loss": -11.501079559326172, "global_step": 239693, "epoch": 1426} {"train_loss": -11.425893783569336, "global_step": 239694, "epoch": 1426} {"train_loss": -11.546334266662598, "global_step": 239695, "epoch": 1426} {"train_loss": -11.183813095092773, "global_step": 239696, "epoch": 1426} {"train_loss": -11.209711074829102, "global_step": 239697, "epoch": 1426} {"train_loss": -11.849056243896484, "global_step": 239698, "epoch": 1426} {"train_loss": -11.601064682006836, "global_step": 239699, "epoch": 1426} {"train_loss": -11.490501403808594, "global_step": 239700, "epoch": 1426} {"train_loss": -11.540397644042969, "global_step": 239701, "epoch": 1426} {"train_loss": -11.501882553100586, "global_step": 239702, "epoch": 1426} {"train_loss": -11.901718139648438, "global_step": 239703, "epoch": 1426} {"train_loss": -11.371971130371094, "global_step": 239704, "epoch": 1426} {"train_loss": -11.878927230834961, "global_step": 239705, "epoch": 1426} {"train_loss": -11.643762588500977, "global_step": 239706, "epoch": 1426} {"train_loss": -11.79483413696289, "global_step": 239707, "epoch": 1426} {"train_loss": -11.754032135009766, "global_step": 239708, "epoch": 1426} {"train_loss": -11.801030158996582, "global_step": 239709, "epoch": 1426} {"train_loss": -11.821914672851562, "global_step": 239710, "epoch": 1426} {"train_loss": -11.532144546508789, "global_step": 239711, "epoch": 1426} {"train_loss": -11.788057327270508, "global_step": 239712, "epoch": 1426} {"train_loss": -11.501696586608887, "global_step": 239713, "epoch": 1426} {"train_loss": -11.841909408569336, "global_step": 239714, "epoch": 1426} {"train_loss": -11.745656967163086, "global_step": 239715, "epoch": 1426} {"train_loss": -11.887545585632324, "global_step": 239716, "epoch": 1426} {"train_loss": -11.544905662536621, "global_step": 239717, "epoch": 1426} {"train_loss": -11.839519500732422, "global_step": 239718, "epoch": 1426} {"train_loss": -11.40587043762207, "global_step": 239719, "epoch": 1426} {"train_loss": -12.01275634765625, "global_step": 239720, "epoch": 1426} {"train_loss": -11.50275993347168, "global_step": 239721, "epoch": 1426} {"train_loss": -11.867875099182129, "global_step": 239722, "epoch": 1426} {"train_loss": -11.52287483215332, "global_step": 239723, "epoch": 1426} {"train_loss": -11.577199935913086, "global_step": 239724, "epoch": 1426} {"train_loss": -11.98354434967041, "global_step": 239725, "epoch": 1426} {"train_loss": -11.36823844909668, "global_step": 239726, "epoch": 1426} {"train_loss": -11.691730499267578, "global_step": 239727, "epoch": 1426} {"train_loss": -11.704341888427734, "global_step": 239728, "epoch": 1426} {"train_loss": -11.957810401916504, "global_step": 239729, "epoch": 1426} {"train_loss": -11.97224235534668, "global_step": 239730, "epoch": 1426} {"train_loss": -11.97029972076416, "global_step": 239731, "epoch": 1426} {"train_loss": -11.87542724609375, "global_step": 239732, "epoch": 1426} {"train_loss": -11.467571258544922, "global_step": 239733, "epoch": 1426} {"train_loss": -11.761731147766113, "global_step": 239734, "epoch": 1426} {"train_loss": -11.349644893691654, "global_step": 239735, "epoch": 1426, "val_loss": 265650.6875} {"train_loss": -11.980693817138672, "global_step": 239736, "epoch": 1427} {"train_loss": -11.698646545410156, "global_step": 239737, "epoch": 1427} {"train_loss": -12.144893646240234, "global_step": 239738, "epoch": 1427} {"train_loss": -11.636211395263672, "global_step": 239739, "epoch": 1427} {"train_loss": -11.895808219909668, "global_step": 239740, "epoch": 1427} {"train_loss": -11.570770263671875, "global_step": 239741, "epoch": 1427} {"train_loss": -11.848532676696777, "global_step": 239742, "epoch": 1427} {"train_loss": -11.542800903320312, "global_step": 239743, "epoch": 1427} {"train_loss": -11.878812789916992, "global_step": 239744, "epoch": 1427} {"train_loss": -11.389469146728516, "global_step": 239745, "epoch": 1427} {"train_loss": -11.441155433654785, "global_step": 239746, "epoch": 1427} {"train_loss": -11.149009704589844, "global_step": 239747, "epoch": 1427} {"train_loss": -12.091559410095215, "global_step": 239748, "epoch": 1427} {"train_loss": -11.192093849182129, "global_step": 239749, "epoch": 1427} {"train_loss": -11.4270658493042, "global_step": 239750, "epoch": 1427} {"train_loss": -11.541969299316406, "global_step": 239751, "epoch": 1427} {"train_loss": -11.032958984375, "global_step": 239752, "epoch": 1427} {"train_loss": -10.28298282623291, "global_step": 239753, "epoch": 1427} {"train_loss": -11.61411190032959, "global_step": 239754, "epoch": 1427} {"train_loss": -9.506163597106934, "global_step": 239755, "epoch": 1427} {"train_loss": -10.721263885498047, "global_step": 239756, "epoch": 1427} {"train_loss": -11.530770301818848, "global_step": 239757, "epoch": 1427} {"train_loss": -10.504593849182129, "global_step": 239758, "epoch": 1427} {"train_loss": -11.66862964630127, "global_step": 239759, "epoch": 1427} {"train_loss": -10.77273941040039, "global_step": 239760, "epoch": 1427} {"train_loss": -11.400651931762695, "global_step": 239761, "epoch": 1427} {"train_loss": -11.154231071472168, "global_step": 239762, "epoch": 1427} {"train_loss": -11.489062309265137, "global_step": 239763, "epoch": 1427} {"train_loss": -11.12185287475586, "global_step": 239764, "epoch": 1427} {"train_loss": -11.497663497924805, "global_step": 239765, "epoch": 1427} {"train_loss": -11.150153160095215, "global_step": 239766, "epoch": 1427} {"train_loss": -11.130563735961914, "global_step": 239767, "epoch": 1427} {"train_loss": -11.14267349243164, "global_step": 239768, "epoch": 1427} {"train_loss": -11.100491523742676, "global_step": 239769, "epoch": 1427} {"train_loss": -10.87507438659668, "global_step": 239770, "epoch": 1427} {"train_loss": -11.197388648986816, "global_step": 239771, "epoch": 1427} {"train_loss": -10.572820663452148, "global_step": 239772, "epoch": 1427} {"train_loss": -11.384521484375, "global_step": 239773, "epoch": 1427} {"train_loss": -11.126510620117188, "global_step": 239774, "epoch": 1427} {"train_loss": -11.649580001831055, "global_step": 239775, "epoch": 1427} {"train_loss": -11.32769775390625, "global_step": 239776, "epoch": 1427} {"train_loss": -11.486959457397461, "global_step": 239777, "epoch": 1427} {"train_loss": -11.376448631286621, "global_step": 239778, "epoch": 1427} {"train_loss": -11.23318099975586, "global_step": 239779, "epoch": 1427} {"train_loss": -11.544143676757812, "global_step": 239780, "epoch": 1427} {"train_loss": -11.134190559387207, "global_step": 239781, "epoch": 1427} {"train_loss": -10.758709907531738, "global_step": 239782, "epoch": 1427} {"train_loss": -11.79039192199707, "global_step": 239783, "epoch": 1427} {"train_loss": -11.054930686950684, "global_step": 239784, "epoch": 1427} {"train_loss": -11.53156566619873, "global_step": 239785, "epoch": 1427} {"train_loss": -11.400860786437988, "global_step": 239786, "epoch": 1427} {"train_loss": -11.26455307006836, "global_step": 239787, "epoch": 1427} {"train_loss": -10.837265014648438, "global_step": 239788, "epoch": 1427} {"train_loss": -11.566712379455566, "global_step": 239789, "epoch": 1427} {"train_loss": -11.773309707641602, "global_step": 239790, "epoch": 1427} {"train_loss": -11.337934494018555, "global_step": 239791, "epoch": 1427} {"train_loss": -11.53439712524414, "global_step": 239792, "epoch": 1427} {"train_loss": -11.700392723083496, "global_step": 239793, "epoch": 1427} {"train_loss": -11.487665176391602, "global_step": 239794, "epoch": 1427} {"train_loss": -11.731074333190918, "global_step": 239795, "epoch": 1427} {"train_loss": -11.5651273727417, "global_step": 239796, "epoch": 1427} {"train_loss": -11.575847625732422, "global_step": 239797, "epoch": 1427} {"train_loss": -11.918169021606445, "global_step": 239798, "epoch": 1427} {"train_loss": -11.177507400512695, "global_step": 239799, "epoch": 1427} {"train_loss": -11.839101791381836, "global_step": 239800, "epoch": 1427} {"train_loss": -11.5512113571167, "global_step": 239801, "epoch": 1427} {"train_loss": -11.347434043884277, "global_step": 239802, "epoch": 1427} {"train_loss": -11.937214851379395, "global_step": 239803, "epoch": 1427} {"train_loss": -11.099370956420898, "global_step": 239804, "epoch": 1427} {"train_loss": -11.707794189453125, "global_step": 239805, "epoch": 1427} {"train_loss": -11.348575592041016, "global_step": 239806, "epoch": 1427} {"train_loss": -11.424250602722168, "global_step": 239807, "epoch": 1427} {"train_loss": -11.808767318725586, "global_step": 239808, "epoch": 1427} {"train_loss": -11.174636840820312, "global_step": 239809, "epoch": 1427} {"train_loss": -11.803108215332031, "global_step": 239810, "epoch": 1427} {"train_loss": -11.45009708404541, "global_step": 239811, "epoch": 1427} {"train_loss": -11.720226287841797, "global_step": 239812, "epoch": 1427} {"train_loss": -11.491827011108398, "global_step": 239813, "epoch": 1427} {"train_loss": -11.804943084716797, "global_step": 239814, "epoch": 1427} {"train_loss": -11.959624290466309, "global_step": 239815, "epoch": 1427} {"train_loss": -11.74340534210205, "global_step": 239816, "epoch": 1427} {"train_loss": -11.76053237915039, "global_step": 239817, "epoch": 1427} {"train_loss": -11.743114471435547, "global_step": 239818, "epoch": 1427} {"train_loss": -11.651273727416992, "global_step": 239819, "epoch": 1427} {"train_loss": -11.838518142700195, "global_step": 239820, "epoch": 1427} {"train_loss": -11.932609558105469, "global_step": 239821, "epoch": 1427} {"train_loss": -11.790084838867188, "global_step": 239822, "epoch": 1427} {"train_loss": -11.926139831542969, "global_step": 239823, "epoch": 1427} {"train_loss": -11.82293701171875, "global_step": 239824, "epoch": 1427} {"train_loss": -11.87215805053711, "global_step": 239825, "epoch": 1427} {"train_loss": -12.018556594848633, "global_step": 239826, "epoch": 1427} {"train_loss": -11.901758193969727, "global_step": 239827, "epoch": 1427} {"train_loss": -11.883975982666016, "global_step": 239828, "epoch": 1427} {"train_loss": -11.869321823120117, "global_step": 239829, "epoch": 1427} {"train_loss": -11.900735855102539, "global_step": 239830, "epoch": 1427} {"train_loss": -12.103191375732422, "global_step": 239831, "epoch": 1427} {"train_loss": -11.865852355957031, "global_step": 239832, "epoch": 1427} {"train_loss": -11.797246932983398, "global_step": 239833, "epoch": 1427} {"train_loss": -12.075281143188477, "global_step": 239834, "epoch": 1427} {"train_loss": -12.057525634765625, "global_step": 239835, "epoch": 1427} {"train_loss": -12.040811538696289, "global_step": 239836, "epoch": 1427} {"train_loss": -11.796723365783691, "global_step": 239837, "epoch": 1427} {"train_loss": -12.077557563781738, "global_step": 239838, "epoch": 1427} {"train_loss": -12.041027069091797, "global_step": 239839, "epoch": 1427} {"train_loss": -11.915761947631836, "global_step": 239840, "epoch": 1427} {"train_loss": -12.094931602478027, "global_step": 239841, "epoch": 1427} {"train_loss": -11.971153259277344, "global_step": 239842, "epoch": 1427} {"train_loss": -11.971435546875, "global_step": 239843, "epoch": 1427} {"train_loss": -11.880395889282227, "global_step": 239844, "epoch": 1427} {"train_loss": -12.088484764099121, "global_step": 239845, "epoch": 1427} {"train_loss": -11.999567031860352, "global_step": 239846, "epoch": 1427} {"train_loss": -11.835089683532715, "global_step": 239847, "epoch": 1427} {"train_loss": -11.766225814819336, "global_step": 239848, "epoch": 1427} {"train_loss": -12.028493881225586, "global_step": 239849, "epoch": 1427} {"train_loss": -11.845514297485352, "global_step": 239850, "epoch": 1427} {"train_loss": -11.915950775146484, "global_step": 239851, "epoch": 1427} {"train_loss": -11.486867904663086, "global_step": 239852, "epoch": 1427} {"train_loss": -12.033665657043457, "global_step": 239853, "epoch": 1427} {"train_loss": -11.95026683807373, "global_step": 239854, "epoch": 1427} {"train_loss": -11.685880661010742, "global_step": 239855, "epoch": 1427} {"train_loss": -11.23035717010498, "global_step": 239856, "epoch": 1427} {"train_loss": -11.753019332885742, "global_step": 239857, "epoch": 1427} {"train_loss": -11.852921485900879, "global_step": 239858, "epoch": 1427} {"train_loss": -11.416812896728516, "global_step": 239859, "epoch": 1427} {"train_loss": -11.534515380859375, "global_step": 239860, "epoch": 1427} {"train_loss": -11.77786922454834, "global_step": 239861, "epoch": 1427} {"train_loss": -11.62763500213623, "global_step": 239862, "epoch": 1427} {"train_loss": -11.193010330200195, "global_step": 239863, "epoch": 1427} {"train_loss": -11.1544828414917, "global_step": 239864, "epoch": 1427} {"train_loss": -11.697622299194336, "global_step": 239865, "epoch": 1427} {"train_loss": -11.340240478515625, "global_step": 239866, "epoch": 1427} {"train_loss": -11.734892845153809, "global_step": 239867, "epoch": 1427} {"train_loss": -11.469167709350586, "global_step": 239868, "epoch": 1427} {"train_loss": -11.318617820739746, "global_step": 239869, "epoch": 1427} {"train_loss": -11.51115608215332, "global_step": 239870, "epoch": 1427} {"train_loss": -11.723809242248535, "global_step": 239871, "epoch": 1427} {"train_loss": -11.384042739868164, "global_step": 239872, "epoch": 1427} {"train_loss": -11.741157531738281, "global_step": 239873, "epoch": 1427} {"train_loss": -10.752591133117676, "global_step": 239874, "epoch": 1427} {"train_loss": -10.490177154541016, "global_step": 239875, "epoch": 1427} {"train_loss": -11.522846221923828, "global_step": 239876, "epoch": 1427} {"train_loss": -10.696928024291992, "global_step": 239877, "epoch": 1427} {"train_loss": -10.716547012329102, "global_step": 239878, "epoch": 1427} {"train_loss": -11.34931468963623, "global_step": 239879, "epoch": 1427} {"train_loss": -10.220203399658203, "global_step": 239880, "epoch": 1427} {"train_loss": -10.915477752685547, "global_step": 239881, "epoch": 1427} {"train_loss": -10.460433959960938, "global_step": 239882, "epoch": 1427} {"train_loss": -10.604498863220215, "global_step": 239883, "epoch": 1427} {"train_loss": -10.54475212097168, "global_step": 239884, "epoch": 1427} {"train_loss": -10.832387924194336, "global_step": 239885, "epoch": 1427} {"train_loss": -11.359098434448242, "global_step": 239886, "epoch": 1427} {"train_loss": -10.904085159301758, "global_step": 239887, "epoch": 1427} {"train_loss": -11.308958053588867, "global_step": 239888, "epoch": 1427} {"train_loss": -11.041759490966797, "global_step": 239889, "epoch": 1427} {"train_loss": -11.017374038696289, "global_step": 239890, "epoch": 1427} {"train_loss": -11.36294937133789, "global_step": 239891, "epoch": 1427} {"train_loss": -11.040586471557617, "global_step": 239892, "epoch": 1427} {"train_loss": -11.441062927246094, "global_step": 239893, "epoch": 1427} {"train_loss": -11.626368522644043, "global_step": 239894, "epoch": 1427} {"train_loss": -11.272764205932617, "global_step": 239895, "epoch": 1427} {"train_loss": -11.241066932678223, "global_step": 239896, "epoch": 1427} {"train_loss": -11.416488647460938, "global_step": 239897, "epoch": 1427} {"train_loss": -11.057548522949219, "global_step": 239898, "epoch": 1427} {"train_loss": -11.20671272277832, "global_step": 239899, "epoch": 1427} {"train_loss": -11.323317527770996, "global_step": 239900, "epoch": 1427} {"train_loss": -11.288670539855957, "global_step": 239901, "epoch": 1427} {"train_loss": -11.300729751586914, "global_step": 239902, "epoch": 1427} {"train_loss": -11.46424933274587, "global_step": 239903, "epoch": 1427, "val_loss": 265525.40625} {"train_loss": -11.395151138305664, "global_step": 239904, "epoch": 1428} {"train_loss": -10.806943893432617, "global_step": 239905, "epoch": 1428} {"train_loss": -11.37833023071289, "global_step": 239906, "epoch": 1428} {"train_loss": -11.182621955871582, "global_step": 239907, "epoch": 1428} {"train_loss": -11.374394416809082, "global_step": 239908, "epoch": 1428} {"train_loss": -11.365930557250977, "global_step": 239909, "epoch": 1428} {"train_loss": -11.827260971069336, "global_step": 239910, "epoch": 1428} {"train_loss": -11.289233207702637, "global_step": 239911, "epoch": 1428} {"train_loss": -11.613761901855469, "global_step": 239912, "epoch": 1428} {"train_loss": -11.461724281311035, "global_step": 239913, "epoch": 1428} {"train_loss": -11.387426376342773, "global_step": 239914, "epoch": 1428} {"train_loss": -11.495177268981934, "global_step": 239915, "epoch": 1428} {"train_loss": -11.800230026245117, "global_step": 239916, "epoch": 1428} {"train_loss": -11.384370803833008, "global_step": 239917, "epoch": 1428} {"train_loss": -11.617486953735352, "global_step": 239918, "epoch": 1428} {"train_loss": -11.305614471435547, "global_step": 239919, "epoch": 1428} {"train_loss": -11.82181167602539, "global_step": 239920, "epoch": 1428} {"train_loss": -11.707611083984375, "global_step": 239921, "epoch": 1428} {"train_loss": -11.641658782958984, "global_step": 239922, "epoch": 1428} {"train_loss": -11.6566743850708, "global_step": 239923, "epoch": 1428} {"train_loss": -11.772187232971191, "global_step": 239924, "epoch": 1428} {"train_loss": -11.285809516906738, "global_step": 239925, "epoch": 1428} {"train_loss": -11.10378360748291, "global_step": 239926, "epoch": 1428} {"train_loss": -11.216089248657227, "global_step": 239927, "epoch": 1428} {"train_loss": -11.176687240600586, "global_step": 239928, "epoch": 1428} {"train_loss": -11.468400955200195, "global_step": 239929, "epoch": 1428} {"train_loss": -11.612404823303223, "global_step": 239930, "epoch": 1428} {"train_loss": -11.525215148925781, "global_step": 239931, "epoch": 1428} {"train_loss": -11.550780296325684, "global_step": 239932, "epoch": 1428} {"train_loss": -11.413610458374023, "global_step": 239933, "epoch": 1428} {"train_loss": -11.454630851745605, "global_step": 239934, "epoch": 1428} {"train_loss": -11.55423355102539, "global_step": 239935, "epoch": 1428} {"train_loss": -11.281237602233887, "global_step": 239936, "epoch": 1428} {"train_loss": -11.561997413635254, "global_step": 239937, "epoch": 1428} {"train_loss": -11.270593643188477, "global_step": 239938, "epoch": 1428} {"train_loss": -11.299463272094727, "global_step": 239939, "epoch": 1428} {"train_loss": -11.244985580444336, "global_step": 239940, "epoch": 1428} {"train_loss": -10.921762466430664, "global_step": 239941, "epoch": 1428} {"train_loss": -11.570720672607422, "global_step": 239942, "epoch": 1428} {"train_loss": -11.368532180786133, "global_step": 239943, "epoch": 1428} {"train_loss": -11.380992889404297, "global_step": 239944, "epoch": 1428} {"train_loss": -11.415603637695312, "global_step": 239945, "epoch": 1428} {"train_loss": -11.297714233398438, "global_step": 239946, "epoch": 1428} {"train_loss": -11.484928131103516, "global_step": 239947, "epoch": 1428} {"train_loss": -11.171943664550781, "global_step": 239948, "epoch": 1428} {"train_loss": -11.805381774902344, "global_step": 239949, "epoch": 1428} {"train_loss": -11.436372756958008, "global_step": 239950, "epoch": 1428} {"train_loss": -11.817963600158691, "global_step": 239951, "epoch": 1428} {"train_loss": -11.208539962768555, "global_step": 239952, "epoch": 1428} {"train_loss": -11.711366653442383, "global_step": 239953, "epoch": 1428} {"train_loss": -11.52172565460205, "global_step": 239954, "epoch": 1428} {"train_loss": -11.467935562133789, "global_step": 239955, "epoch": 1428} {"train_loss": -11.600983619689941, "global_step": 239956, "epoch": 1428} {"train_loss": -11.45900821685791, "global_step": 239957, "epoch": 1428} {"train_loss": -12.125897407531738, "global_step": 239958, "epoch": 1428} {"train_loss": -11.649580001831055, "global_step": 239959, "epoch": 1428} {"train_loss": -11.667928695678711, "global_step": 239960, "epoch": 1428} {"train_loss": -11.714887619018555, "global_step": 239961, "epoch": 1428} {"train_loss": -11.656615257263184, "global_step": 239962, "epoch": 1428} {"train_loss": -11.84591293334961, "global_step": 239963, "epoch": 1428} {"train_loss": -11.68851375579834, "global_step": 239964, "epoch": 1428} {"train_loss": -11.746662139892578, "global_step": 239965, "epoch": 1428} {"train_loss": -11.54189682006836, "global_step": 239966, "epoch": 1428} {"train_loss": -11.634513854980469, "global_step": 239967, "epoch": 1428} {"train_loss": -11.892471313476562, "global_step": 239968, "epoch": 1428} {"train_loss": -11.709371566772461, "global_step": 239969, "epoch": 1428} {"train_loss": -11.582305908203125, "global_step": 239970, "epoch": 1428} {"train_loss": -11.741726875305176, "global_step": 239971, "epoch": 1428} {"train_loss": -11.726571083068848, "global_step": 239972, "epoch": 1428} {"train_loss": -11.668293952941895, "global_step": 239973, "epoch": 1428} {"train_loss": -11.678905487060547, "global_step": 239974, "epoch": 1428} {"train_loss": -11.523052215576172, "global_step": 239975, "epoch": 1428} {"train_loss": -11.850954055786133, "global_step": 239976, "epoch": 1428} {"train_loss": -11.465993881225586, "global_step": 239977, "epoch": 1428} {"train_loss": -11.777257919311523, "global_step": 239978, "epoch": 1428} {"train_loss": -11.683490753173828, "global_step": 239979, "epoch": 1428} {"train_loss": -11.772336959838867, "global_step": 239980, "epoch": 1428} {"train_loss": -11.80610179901123, "global_step": 239981, "epoch": 1428} {"train_loss": -11.655426025390625, "global_step": 239982, "epoch": 1428} {"train_loss": -11.812088966369629, "global_step": 239983, "epoch": 1428} {"train_loss": -11.866883277893066, "global_step": 239984, "epoch": 1428} {"train_loss": -11.752969741821289, "global_step": 239985, "epoch": 1428} {"train_loss": -12.066984176635742, "global_step": 239986, "epoch": 1428} {"train_loss": -11.785818099975586, "global_step": 239987, "epoch": 1428} {"train_loss": -12.153353691101074, "global_step": 239988, "epoch": 1428} {"train_loss": -11.889135360717773, "global_step": 239989, "epoch": 1428} {"train_loss": -12.10715103149414, "global_step": 239990, "epoch": 1428} {"train_loss": -12.030303955078125, "global_step": 239991, "epoch": 1428} {"train_loss": -12.035083770751953, "global_step": 239992, "epoch": 1428} {"train_loss": -12.117554664611816, "global_step": 239993, "epoch": 1428} {"train_loss": -12.23047161102295, "global_step": 239994, "epoch": 1428} {"train_loss": -11.987810134887695, "global_step": 239995, "epoch": 1428} {"train_loss": -12.177566528320312, "global_step": 239996, "epoch": 1428} {"train_loss": -12.039403915405273, "global_step": 239997, "epoch": 1428} {"train_loss": -12.137773513793945, "global_step": 239998, "epoch": 1428} {"train_loss": -11.99648666381836, "global_step": 239999, "epoch": 1428} {"train_loss": -12.075939178466797, "global_step": 240000, "epoch": 1428} {"train_loss": -11.974945068359375, "global_step": 240001, "epoch": 1428} {"train_loss": -12.214285850524902, "global_step": 240002, "epoch": 1428} {"train_loss": -11.817299842834473, "global_step": 240003, "epoch": 1428} {"train_loss": -11.94411563873291, "global_step": 240004, "epoch": 1428} {"train_loss": -11.795587539672852, "global_step": 240005, "epoch": 1428} {"train_loss": -11.976913452148438, "global_step": 240006, "epoch": 1428} {"train_loss": -12.146684646606445, "global_step": 240007, "epoch": 1428} {"train_loss": -12.331132888793945, "global_step": 240008, "epoch": 1428} {"train_loss": -12.093019485473633, "global_step": 240009, "epoch": 1428} {"train_loss": -12.162620544433594, "global_step": 240010, "epoch": 1428} {"train_loss": -12.088354110717773, "global_step": 240011, "epoch": 1428} {"train_loss": -11.994561195373535, "global_step": 240012, "epoch": 1428} {"train_loss": -12.044498443603516, "global_step": 240013, "epoch": 1428} {"train_loss": -11.755794525146484, "global_step": 240014, "epoch": 1428} {"train_loss": -11.928363800048828, "global_step": 240015, "epoch": 1428} {"train_loss": -11.801619529724121, "global_step": 240016, "epoch": 1428} {"train_loss": -11.5293607711792, "global_step": 240017, "epoch": 1428} {"train_loss": -11.515918731689453, "global_step": 240018, "epoch": 1428} {"train_loss": -11.608783721923828, "global_step": 240019, "epoch": 1428} {"train_loss": -11.507088661193848, "global_step": 240020, "epoch": 1428} {"train_loss": -11.270709991455078, "global_step": 240021, "epoch": 1428} {"train_loss": -10.839963912963867, "global_step": 240022, "epoch": 1428} {"train_loss": -11.188255310058594, "global_step": 240023, "epoch": 1428} {"train_loss": -10.838610649108887, "global_step": 240024, "epoch": 1428} {"train_loss": -11.557785034179688, "global_step": 240025, "epoch": 1428} {"train_loss": -11.279117584228516, "global_step": 240026, "epoch": 1428} {"train_loss": -11.494403839111328, "global_step": 240027, "epoch": 1428} {"train_loss": -10.610610961914062, "global_step": 240028, "epoch": 1428} {"train_loss": -11.101804733276367, "global_step": 240029, "epoch": 1428} {"train_loss": -10.814655303955078, "global_step": 240030, "epoch": 1428} {"train_loss": -10.970548629760742, "global_step": 240031, "epoch": 1428} {"train_loss": -11.240206718444824, "global_step": 240032, "epoch": 1428} {"train_loss": -10.635525703430176, "global_step": 240033, "epoch": 1428} {"train_loss": -10.444266319274902, "global_step": 240034, "epoch": 1428} {"train_loss": -11.365263938903809, "global_step": 240035, "epoch": 1428} {"train_loss": -10.05837631225586, "global_step": 240036, "epoch": 1428} {"train_loss": -10.08145523071289, "global_step": 240037, "epoch": 1428} {"train_loss": -10.68071174621582, "global_step": 240038, "epoch": 1428} {"train_loss": -11.257732391357422, "global_step": 240039, "epoch": 1428} {"train_loss": -10.790386199951172, "global_step": 240040, "epoch": 1428} {"train_loss": -10.930801391601562, "global_step": 240041, "epoch": 1428} {"train_loss": -10.803715705871582, "global_step": 240042, "epoch": 1428} {"train_loss": -10.591482162475586, "global_step": 240043, "epoch": 1428} {"train_loss": -10.939210891723633, "global_step": 240044, "epoch": 1428} {"train_loss": -10.42092227935791, "global_step": 240045, "epoch": 1428} {"train_loss": -11.51936149597168, "global_step": 240046, "epoch": 1428} {"train_loss": -10.106905937194824, "global_step": 240047, "epoch": 1428} {"train_loss": -11.566301345825195, "global_step": 240048, "epoch": 1428} {"train_loss": -10.919356346130371, "global_step": 240049, "epoch": 1428} {"train_loss": -11.188791275024414, "global_step": 240050, "epoch": 1428} {"train_loss": -11.5101900100708, "global_step": 240051, "epoch": 1428} {"train_loss": -11.005200386047363, "global_step": 240052, "epoch": 1428} {"train_loss": -11.8848237991333, "global_step": 240053, "epoch": 1428} {"train_loss": -11.308284759521484, "global_step": 240054, "epoch": 1428} {"train_loss": -11.348409652709961, "global_step": 240055, "epoch": 1428} {"train_loss": -11.45425796508789, "global_step": 240056, "epoch": 1428} {"train_loss": -11.679136276245117, "global_step": 240057, "epoch": 1428} {"train_loss": -11.638789176940918, "global_step": 240058, "epoch": 1428} {"train_loss": -11.690998077392578, "global_step": 240059, "epoch": 1428} {"train_loss": -11.419679641723633, "global_step": 240060, "epoch": 1428} {"train_loss": -11.75245475769043, "global_step": 240061, "epoch": 1428} {"train_loss": -11.852001190185547, "global_step": 240062, "epoch": 1428} {"train_loss": -11.680925369262695, "global_step": 240063, "epoch": 1428} {"train_loss": -11.934646606445312, "global_step": 240064, "epoch": 1428} {"train_loss": -11.592001914978027, "global_step": 240065, "epoch": 1428} {"train_loss": -11.866100311279297, "global_step": 240066, "epoch": 1428} {"train_loss": -11.60032844543457, "global_step": 240067, "epoch": 1428} {"train_loss": -11.819536209106445, "global_step": 240068, "epoch": 1428} {"train_loss": -11.879377365112305, "global_step": 240069, "epoch": 1428} {"train_loss": -11.713339805603027, "global_step": 240070, "epoch": 1428} {"train_loss": -11.530722135589237, "global_step": 240071, "epoch": 1428, "val_loss": 268379.9375} {"train_loss": -11.635213851928711, "global_step": 240072, "epoch": 1429} {"train_loss": -12.033354759216309, "global_step": 240073, "epoch": 1429} {"train_loss": -11.730396270751953, "global_step": 240074, "epoch": 1429} {"train_loss": -12.090898513793945, "global_step": 240075, "epoch": 1429} {"train_loss": -12.006989479064941, "global_step": 240076, "epoch": 1429} {"train_loss": -11.465472221374512, "global_step": 240077, "epoch": 1429} {"train_loss": -12.065642356872559, "global_step": 240078, "epoch": 1429} {"train_loss": -12.0233793258667, "global_step": 240079, "epoch": 1429} {"train_loss": -11.591764450073242, "global_step": 240080, "epoch": 1429} {"train_loss": -12.084602355957031, "global_step": 240081, "epoch": 1429} {"train_loss": -11.928281784057617, "global_step": 240082, "epoch": 1429} {"train_loss": -11.98105525970459, "global_step": 240083, "epoch": 1429} {"train_loss": -11.869115829467773, "global_step": 240084, "epoch": 1429} {"train_loss": -11.912749290466309, "global_step": 240085, "epoch": 1429} {"train_loss": -12.112465858459473, "global_step": 240086, "epoch": 1429} {"train_loss": -11.78111743927002, "global_step": 240087, "epoch": 1429} {"train_loss": -12.016703605651855, "global_step": 240088, "epoch": 1429} {"train_loss": -12.08165454864502, "global_step": 240089, "epoch": 1429} {"train_loss": -11.92397689819336, "global_step": 240090, "epoch": 1429} {"train_loss": -11.996431350708008, "global_step": 240091, "epoch": 1429} {"train_loss": -11.96782112121582, "global_step": 240092, "epoch": 1429} {"train_loss": -12.059277534484863, "global_step": 240093, "epoch": 1429} {"train_loss": -11.977019309997559, "global_step": 240094, "epoch": 1429} {"train_loss": -11.935420989990234, "global_step": 240095, "epoch": 1429} {"train_loss": -11.9415283203125, "global_step": 240096, "epoch": 1429} {"train_loss": -12.045248031616211, "global_step": 240097, "epoch": 1429} {"train_loss": -12.002729415893555, "global_step": 240098, "epoch": 1429} {"train_loss": -11.961174011230469, "global_step": 240099, "epoch": 1429} {"train_loss": -11.86170768737793, "global_step": 240100, "epoch": 1429} {"train_loss": -11.458574295043945, "global_step": 240101, "epoch": 1429} {"train_loss": -12.032463073730469, "global_step": 240102, "epoch": 1429} {"train_loss": -11.716135025024414, "global_step": 240103, "epoch": 1429} {"train_loss": -11.558907508850098, "global_step": 240104, "epoch": 1429} {"train_loss": -11.996397018432617, "global_step": 240105, "epoch": 1429} {"train_loss": -11.669921875, "global_step": 240106, "epoch": 1429} {"train_loss": -10.428815841674805, "global_step": 240107, "epoch": 1429} {"train_loss": -11.252969741821289, "global_step": 240108, "epoch": 1429} {"train_loss": -11.040980339050293, "global_step": 240109, "epoch": 1429} {"train_loss": -11.784283638000488, "global_step": 240110, "epoch": 1429} {"train_loss": -10.850152969360352, "global_step": 240111, "epoch": 1429} {"train_loss": -11.854341506958008, "global_step": 240112, "epoch": 1429} {"train_loss": -11.287009239196777, "global_step": 240113, "epoch": 1429} {"train_loss": -11.904362678527832, "global_step": 240114, "epoch": 1429} {"train_loss": -10.68946361541748, "global_step": 240115, "epoch": 1429} {"train_loss": -11.920208930969238, "global_step": 240116, "epoch": 1429} {"train_loss": -10.712631225585938, "global_step": 240117, "epoch": 1429} {"train_loss": -9.749665260314941, "global_step": 240118, "epoch": 1429} {"train_loss": -11.509549140930176, "global_step": 240119, "epoch": 1429} {"train_loss": -10.755935668945312, "global_step": 240120, "epoch": 1429} {"train_loss": -10.365218162536621, "global_step": 240121, "epoch": 1429} {"train_loss": -11.82198429107666, "global_step": 240122, "epoch": 1429} {"train_loss": -11.178298950195312, "global_step": 240123, "epoch": 1429} {"train_loss": -10.278444290161133, "global_step": 240124, "epoch": 1429} {"train_loss": -10.636985778808594, "global_step": 240125, "epoch": 1429} {"train_loss": -9.487791061401367, "global_step": 240126, "epoch": 1429} {"train_loss": -10.761412620544434, "global_step": 240127, "epoch": 1429} {"train_loss": -9.111884117126465, "global_step": 240128, "epoch": 1429} {"train_loss": -11.288908004760742, "global_step": 240129, "epoch": 1429} {"train_loss": -10.192303657531738, "global_step": 240130, "epoch": 1429} {"train_loss": -11.838481903076172, "global_step": 240131, "epoch": 1429} {"train_loss": -10.353906631469727, "global_step": 240132, "epoch": 1429} {"train_loss": -11.729726791381836, "global_step": 240133, "epoch": 1429} {"train_loss": -10.681503295898438, "global_step": 240134, "epoch": 1429} {"train_loss": -11.315620422363281, "global_step": 240135, "epoch": 1429} {"train_loss": -10.854766845703125, "global_step": 240136, "epoch": 1429} {"train_loss": -11.482942581176758, "global_step": 240137, "epoch": 1429} {"train_loss": -10.489253997802734, "global_step": 240138, "epoch": 1429} {"train_loss": -11.835844039916992, "global_step": 240139, "epoch": 1429} {"train_loss": -10.39461612701416, "global_step": 240140, "epoch": 1429} {"train_loss": -11.546205520629883, "global_step": 240141, "epoch": 1429} {"train_loss": -11.18172836303711, "global_step": 240142, "epoch": 1429} {"train_loss": -10.794251441955566, "global_step": 240143, "epoch": 1429} {"train_loss": -11.336509704589844, "global_step": 240144, "epoch": 1429} {"train_loss": -10.806879043579102, "global_step": 240145, "epoch": 1429} {"train_loss": -10.665643692016602, "global_step": 240146, "epoch": 1429} {"train_loss": -11.216639518737793, "global_step": 240147, "epoch": 1429} {"train_loss": -10.726861953735352, "global_step": 240148, "epoch": 1429} {"train_loss": -11.64079475402832, "global_step": 240149, "epoch": 1429} {"train_loss": -11.151151657104492, "global_step": 240150, "epoch": 1429} {"train_loss": -10.529223442077637, "global_step": 240151, "epoch": 1429} {"train_loss": -11.825740814208984, "global_step": 240152, "epoch": 1429} {"train_loss": -10.56801986694336, "global_step": 240153, "epoch": 1429} {"train_loss": -11.244224548339844, "global_step": 240154, "epoch": 1429} {"train_loss": -10.939931869506836, "global_step": 240155, "epoch": 1429} {"train_loss": -10.771492004394531, "global_step": 240156, "epoch": 1429} {"train_loss": -11.262920379638672, "global_step": 240157, "epoch": 1429} {"train_loss": -11.255121231079102, "global_step": 240158, "epoch": 1429} {"train_loss": -11.332779884338379, "global_step": 240159, "epoch": 1429} {"train_loss": -11.221293449401855, "global_step": 240160, "epoch": 1429} {"train_loss": -11.317436218261719, "global_step": 240161, "epoch": 1429} {"train_loss": -11.718595504760742, "global_step": 240162, "epoch": 1429} {"train_loss": -11.501708030700684, "global_step": 240163, "epoch": 1429} {"train_loss": -11.394009590148926, "global_step": 240164, "epoch": 1429} {"train_loss": -11.703472137451172, "global_step": 240165, "epoch": 1429} {"train_loss": -11.595952987670898, "global_step": 240166, "epoch": 1429} {"train_loss": -11.690757751464844, "global_step": 240167, "epoch": 1429} {"train_loss": -11.862173080444336, "global_step": 240168, "epoch": 1429} {"train_loss": -11.660578727722168, "global_step": 240169, "epoch": 1429} {"train_loss": -11.687646865844727, "global_step": 240170, "epoch": 1429} {"train_loss": -11.892595291137695, "global_step": 240171, "epoch": 1429} {"train_loss": -11.858652114868164, "global_step": 240172, "epoch": 1429} {"train_loss": -11.561635971069336, "global_step": 240173, "epoch": 1429} {"train_loss": -12.047830581665039, "global_step": 240174, "epoch": 1429} {"train_loss": -11.627945899963379, "global_step": 240175, "epoch": 1429} {"train_loss": -11.96373176574707, "global_step": 240176, "epoch": 1429} {"train_loss": -11.60982894897461, "global_step": 240177, "epoch": 1429} {"train_loss": -11.781156539916992, "global_step": 240178, "epoch": 1429} {"train_loss": -11.519488334655762, "global_step": 240179, "epoch": 1429} {"train_loss": -11.587812423706055, "global_step": 240180, "epoch": 1429} {"train_loss": -11.665267944335938, "global_step": 240181, "epoch": 1429} {"train_loss": -11.387770652770996, "global_step": 240182, "epoch": 1429} {"train_loss": -11.687999725341797, "global_step": 240183, "epoch": 1429} {"train_loss": -11.657861709594727, "global_step": 240184, "epoch": 1429} {"train_loss": -11.629447937011719, "global_step": 240185, "epoch": 1429} {"train_loss": -11.582921028137207, "global_step": 240186, "epoch": 1429} {"train_loss": -11.79979419708252, "global_step": 240187, "epoch": 1429} {"train_loss": -11.730935096740723, "global_step": 240188, "epoch": 1429} {"train_loss": -11.822404861450195, "global_step": 240189, "epoch": 1429} {"train_loss": -11.64468765258789, "global_step": 240190, "epoch": 1429} {"train_loss": -11.617162704467773, "global_step": 240191, "epoch": 1429} {"train_loss": -11.535609245300293, "global_step": 240192, "epoch": 1429} {"train_loss": -11.979472160339355, "global_step": 240193, "epoch": 1429} {"train_loss": -11.15099811553955, "global_step": 240194, "epoch": 1429} {"train_loss": -11.57172679901123, "global_step": 240195, "epoch": 1429} {"train_loss": -11.149391174316406, "global_step": 240196, "epoch": 1429} {"train_loss": -11.958449363708496, "global_step": 240197, "epoch": 1429} {"train_loss": -11.541818618774414, "global_step": 240198, "epoch": 1429} {"train_loss": -12.142648696899414, "global_step": 240199, "epoch": 1429} {"train_loss": -11.872239112854004, "global_step": 240200, "epoch": 1429} {"train_loss": -11.863739967346191, "global_step": 240201, "epoch": 1429} {"train_loss": -11.463446617126465, "global_step": 240202, "epoch": 1429} {"train_loss": -11.819071769714355, "global_step": 240203, "epoch": 1429} {"train_loss": -11.826539993286133, "global_step": 240204, "epoch": 1429} {"train_loss": -11.728599548339844, "global_step": 240205, "epoch": 1429} {"train_loss": -11.869709968566895, "global_step": 240206, "epoch": 1429} {"train_loss": -11.971214294433594, "global_step": 240207, "epoch": 1429} {"train_loss": -11.584692001342773, "global_step": 240208, "epoch": 1429} {"train_loss": -11.675443649291992, "global_step": 240209, "epoch": 1429} {"train_loss": -11.65764045715332, "global_step": 240210, "epoch": 1429} {"train_loss": -11.330106735229492, "global_step": 240211, "epoch": 1429} {"train_loss": -11.330994606018066, "global_step": 240212, "epoch": 1429} {"train_loss": -11.258644104003906, "global_step": 240213, "epoch": 1429} {"train_loss": -11.281108856201172, "global_step": 240214, "epoch": 1429} {"train_loss": -11.665140151977539, "global_step": 240215, "epoch": 1429} {"train_loss": -11.238999366760254, "global_step": 240216, "epoch": 1429} {"train_loss": -11.463417053222656, "global_step": 240217, "epoch": 1429} {"train_loss": -11.424891471862793, "global_step": 240218, "epoch": 1429} {"train_loss": -11.49091911315918, "global_step": 240219, "epoch": 1429} {"train_loss": -11.046363830566406, "global_step": 240220, "epoch": 1429} {"train_loss": -11.660510063171387, "global_step": 240221, "epoch": 1429} {"train_loss": -11.432432174682617, "global_step": 240222, "epoch": 1429} {"train_loss": -11.629817962646484, "global_step": 240223, "epoch": 1429} {"train_loss": -11.43496322631836, "global_step": 240224, "epoch": 1429} {"train_loss": -11.57156753540039, "global_step": 240225, "epoch": 1429} {"train_loss": -11.352630615234375, "global_step": 240226, "epoch": 1429} {"train_loss": -11.688089370727539, "global_step": 240227, "epoch": 1429} {"train_loss": -11.479950904846191, "global_step": 240228, "epoch": 1429} {"train_loss": -11.64944839477539, "global_step": 240229, "epoch": 1429} {"train_loss": -10.848876953125, "global_step": 240230, "epoch": 1429} {"train_loss": -11.47076416015625, "global_step": 240231, "epoch": 1429} {"train_loss": -11.2062406539917, "global_step": 240232, "epoch": 1429} {"train_loss": -11.385723114013672, "global_step": 240233, "epoch": 1429} {"train_loss": -10.342269897460938, "global_step": 240234, "epoch": 1429} {"train_loss": -11.035688400268555, "global_step": 240235, "epoch": 1429} {"train_loss": -10.605642318725586, "global_step": 240236, "epoch": 1429} {"train_loss": -9.92103099822998, "global_step": 240237, "epoch": 1429} {"train_loss": -10.468940734863281, "global_step": 240238, "epoch": 1429} {"train_loss": -11.430078444026766, "global_step": 240239, "epoch": 1429, "val_loss": 267848.3125} {"train_loss": -9.802133560180664, "global_step": 240240, "epoch": 1430} {"train_loss": -10.81171703338623, "global_step": 240241, "epoch": 1430} {"train_loss": -10.670340538024902, "global_step": 240242, "epoch": 1430} {"train_loss": -10.677677154541016, "global_step": 240243, "epoch": 1430} {"train_loss": -11.076089859008789, "global_step": 240244, "epoch": 1430} {"train_loss": -10.467784881591797, "global_step": 240245, "epoch": 1430} {"train_loss": -11.37669849395752, "global_step": 240246, "epoch": 1430} {"train_loss": -10.76164436340332, "global_step": 240247, "epoch": 1430} {"train_loss": -11.418185234069824, "global_step": 240248, "epoch": 1430} {"train_loss": -10.448535919189453, "global_step": 240249, "epoch": 1430} {"train_loss": -11.376591682434082, "global_step": 240250, "epoch": 1430} {"train_loss": -11.434416770935059, "global_step": 240251, "epoch": 1430} {"train_loss": -11.379364013671875, "global_step": 240252, "epoch": 1430} {"train_loss": -11.749244689941406, "global_step": 240253, "epoch": 1430} {"train_loss": -11.251524925231934, "global_step": 240254, "epoch": 1430} {"train_loss": -11.58126449584961, "global_step": 240255, "epoch": 1430} {"train_loss": -11.135074615478516, "global_step": 240256, "epoch": 1430} {"train_loss": -11.467301368713379, "global_step": 240257, "epoch": 1430} {"train_loss": -11.502510070800781, "global_step": 240258, "epoch": 1430} {"train_loss": -11.379310607910156, "global_step": 240259, "epoch": 1430} {"train_loss": -11.518227577209473, "global_step": 240260, "epoch": 1430} {"train_loss": -11.483175277709961, "global_step": 240261, "epoch": 1430} {"train_loss": -11.215042114257812, "global_step": 240262, "epoch": 1430} {"train_loss": -11.47378921508789, "global_step": 240263, "epoch": 1430} {"train_loss": -11.600187301635742, "global_step": 240264, "epoch": 1430} {"train_loss": -11.760847091674805, "global_step": 240265, "epoch": 1430} {"train_loss": -11.633689880371094, "global_step": 240266, "epoch": 1430} {"train_loss": -11.409982681274414, "global_step": 240267, "epoch": 1430} {"train_loss": -11.826444625854492, "global_step": 240268, "epoch": 1430} {"train_loss": -11.5615234375, "global_step": 240269, "epoch": 1430} {"train_loss": -11.894638061523438, "global_step": 240270, "epoch": 1430} {"train_loss": -11.698210716247559, "global_step": 240271, "epoch": 1430} {"train_loss": -11.627105712890625, "global_step": 240272, "epoch": 1430} {"train_loss": -11.81891918182373, "global_step": 240273, "epoch": 1430} {"train_loss": -11.62295150756836, "global_step": 240274, "epoch": 1430} {"train_loss": -11.6229887008667, "global_step": 240275, "epoch": 1430} {"train_loss": -11.843236923217773, "global_step": 240276, "epoch": 1430} {"train_loss": -11.790735244750977, "global_step": 240277, "epoch": 1430} {"train_loss": -11.815893173217773, "global_step": 240278, "epoch": 1430} {"train_loss": -11.872284889221191, "global_step": 240279, "epoch": 1430} {"train_loss": -11.847184181213379, "global_step": 240280, "epoch": 1430} {"train_loss": -11.904340744018555, "global_step": 240281, "epoch": 1430} {"train_loss": -11.842827796936035, "global_step": 240282, "epoch": 1430} {"train_loss": -11.714092254638672, "global_step": 240283, "epoch": 1430} {"train_loss": -11.965921401977539, "global_step": 240284, "epoch": 1430} {"train_loss": -12.005598068237305, "global_step": 240285, "epoch": 1430} {"train_loss": -11.904653549194336, "global_step": 240286, "epoch": 1430} {"train_loss": -11.886333465576172, "global_step": 240287, "epoch": 1430} {"train_loss": -12.029346466064453, "global_step": 240288, "epoch": 1430} {"train_loss": -11.973274230957031, "global_step": 240289, "epoch": 1430} {"train_loss": -12.066591262817383, "global_step": 240290, "epoch": 1430} {"train_loss": -11.942203521728516, "global_step": 240291, "epoch": 1430} {"train_loss": -12.048600196838379, "global_step": 240292, "epoch": 1430} {"train_loss": -11.715353012084961, "global_step": 240293, "epoch": 1430} {"train_loss": -11.93000602722168, "global_step": 240294, "epoch": 1430} {"train_loss": -11.944822311401367, "global_step": 240295, "epoch": 1430} {"train_loss": -12.063389778137207, "global_step": 240296, "epoch": 1430} {"train_loss": -11.895719528198242, "global_step": 240297, "epoch": 1430} {"train_loss": -12.048540115356445, "global_step": 240298, "epoch": 1430} {"train_loss": -12.133245468139648, "global_step": 240299, "epoch": 1430} {"train_loss": -11.909536361694336, "global_step": 240300, "epoch": 1430} {"train_loss": -12.047933578491211, "global_step": 240301, "epoch": 1430} {"train_loss": -12.013124465942383, "global_step": 240302, "epoch": 1430} {"train_loss": -12.207507133483887, "global_step": 240303, "epoch": 1430} {"train_loss": -11.922222137451172, "global_step": 240304, "epoch": 1430} {"train_loss": -12.120330810546875, "global_step": 240305, "epoch": 1430} {"train_loss": -12.13821792602539, "global_step": 240306, "epoch": 1430} {"train_loss": -12.19162368774414, "global_step": 240307, "epoch": 1430} {"train_loss": -12.117480278015137, "global_step": 240308, "epoch": 1430} {"train_loss": -11.933298110961914, "global_step": 240309, "epoch": 1430} {"train_loss": -12.243962287902832, "global_step": 240310, "epoch": 1430} {"train_loss": -12.17611312866211, "global_step": 240311, "epoch": 1430} {"train_loss": -12.251267433166504, "global_step": 240312, "epoch": 1430} {"train_loss": -12.187387466430664, "global_step": 240313, "epoch": 1430} {"train_loss": -12.267014503479004, "global_step": 240314, "epoch": 1430} {"train_loss": -12.192411422729492, "global_step": 240315, "epoch": 1430} {"train_loss": -12.111778259277344, "global_step": 240316, "epoch": 1430} {"train_loss": -11.96407699584961, "global_step": 240317, "epoch": 1430} {"train_loss": -12.17757797241211, "global_step": 240318, "epoch": 1430} {"train_loss": -12.049735069274902, "global_step": 240319, "epoch": 1430} {"train_loss": -11.936716079711914, "global_step": 240320, "epoch": 1430} {"train_loss": -12.154075622558594, "global_step": 240321, "epoch": 1430} {"train_loss": -12.141478538513184, "global_step": 240322, "epoch": 1430} {"train_loss": -12.2156982421875, "global_step": 240323, "epoch": 1430} {"train_loss": -12.052117347717285, "global_step": 240324, "epoch": 1430} {"train_loss": -12.424338340759277, "global_step": 240325, "epoch": 1430} {"train_loss": -12.1353120803833, "global_step": 240326, "epoch": 1430} {"train_loss": -11.796049118041992, "global_step": 240327, "epoch": 1430} {"train_loss": -11.577380180358887, "global_step": 240328, "epoch": 1430} {"train_loss": -10.943412780761719, "global_step": 240329, "epoch": 1430} {"train_loss": -10.545454978942871, "global_step": 240330, "epoch": 1430} {"train_loss": -10.213217735290527, "global_step": 240331, "epoch": 1430} {"train_loss": -11.498064041137695, "global_step": 240332, "epoch": 1430} {"train_loss": -10.724149703979492, "global_step": 240333, "epoch": 1430} {"train_loss": -9.361869812011719, "global_step": 240334, "epoch": 1430} {"train_loss": -11.646110534667969, "global_step": 240335, "epoch": 1430} {"train_loss": -11.53072738647461, "global_step": 240336, "epoch": 1430} {"train_loss": -10.454879760742188, "global_step": 240337, "epoch": 1430} {"train_loss": -9.948168754577637, "global_step": 240338, "epoch": 1430} {"train_loss": -11.517999649047852, "global_step": 240339, "epoch": 1430} {"train_loss": -9.61849594116211, "global_step": 240340, "epoch": 1430} {"train_loss": -11.327038764953613, "global_step": 240341, "epoch": 1430} {"train_loss": -9.23604965209961, "global_step": 240342, "epoch": 1430} {"train_loss": -11.10210132598877, "global_step": 240343, "epoch": 1430} {"train_loss": -8.317495346069336, "global_step": 240344, "epoch": 1430} {"train_loss": -10.968477249145508, "global_step": 240345, "epoch": 1430} {"train_loss": -10.931062698364258, "global_step": 240346, "epoch": 1430} {"train_loss": -10.260086059570312, "global_step": 240347, "epoch": 1430} {"train_loss": -10.058853149414062, "global_step": 240348, "epoch": 1430} {"train_loss": -9.570611000061035, "global_step": 240349, "epoch": 1430} {"train_loss": -8.426300048828125, "global_step": 240350, "epoch": 1430} {"train_loss": -8.72477912902832, "global_step": 240351, "epoch": 1430} {"train_loss": -9.686995506286621, "global_step": 240352, "epoch": 1430} {"train_loss": -9.535993576049805, "global_step": 240353, "epoch": 1430} {"train_loss": -9.115488052368164, "global_step": 240354, "epoch": 1430} {"train_loss": -9.061006546020508, "global_step": 240355, "epoch": 1430} {"train_loss": -8.794615745544434, "global_step": 240356, "epoch": 1430} {"train_loss": -10.142559051513672, "global_step": 240357, "epoch": 1430} {"train_loss": -9.243041038513184, "global_step": 240358, "epoch": 1430} {"train_loss": -10.575033187866211, "global_step": 240359, "epoch": 1430} {"train_loss": -10.272958755493164, "global_step": 240360, "epoch": 1430} {"train_loss": -9.049579620361328, "global_step": 240361, "epoch": 1430} {"train_loss": -10.405509948730469, "global_step": 240362, "epoch": 1430} {"train_loss": -9.854835510253906, "global_step": 240363, "epoch": 1430} {"train_loss": -10.77010726928711, "global_step": 240364, "epoch": 1430} {"train_loss": -10.141388893127441, "global_step": 240365, "epoch": 1430} {"train_loss": -10.33707332611084, "global_step": 240366, "epoch": 1430} {"train_loss": -10.716777801513672, "global_step": 240367, "epoch": 1430} {"train_loss": -10.890542984008789, "global_step": 240368, "epoch": 1430} {"train_loss": -10.838747024536133, "global_step": 240369, "epoch": 1430} {"train_loss": -10.991070747375488, "global_step": 240370, "epoch": 1430} {"train_loss": -10.697820663452148, "global_step": 240371, "epoch": 1430} {"train_loss": -10.989022254943848, "global_step": 240372, "epoch": 1430} {"train_loss": -10.850671768188477, "global_step": 240373, "epoch": 1430} {"train_loss": -11.081119537353516, "global_step": 240374, "epoch": 1430} {"train_loss": -10.801887512207031, "global_step": 240375, "epoch": 1430} {"train_loss": -10.562810897827148, "global_step": 240376, "epoch": 1430} {"train_loss": -10.990063667297363, "global_step": 240377, "epoch": 1430} {"train_loss": -10.936511039733887, "global_step": 240378, "epoch": 1430} {"train_loss": -11.192438125610352, "global_step": 240379, "epoch": 1430} {"train_loss": -10.923469543457031, "global_step": 240380, "epoch": 1430} {"train_loss": -11.166210174560547, "global_step": 240381, "epoch": 1430} {"train_loss": -11.19568920135498, "global_step": 240382, "epoch": 1430} {"train_loss": -11.034586906433105, "global_step": 240383, "epoch": 1430} {"train_loss": -11.1700439453125, "global_step": 240384, "epoch": 1430} {"train_loss": -11.059776306152344, "global_step": 240385, "epoch": 1430} {"train_loss": -11.134764671325684, "global_step": 240386, "epoch": 1430} {"train_loss": -11.237232208251953, "global_step": 240387, "epoch": 1430} {"train_loss": -11.243515014648438, "global_step": 240388, "epoch": 1430} {"train_loss": -11.261913299560547, "global_step": 240389, "epoch": 1430} {"train_loss": -11.308158874511719, "global_step": 240390, "epoch": 1430} {"train_loss": -11.393393516540527, "global_step": 240391, "epoch": 1430} {"train_loss": -11.408662796020508, "global_step": 240392, "epoch": 1430} {"train_loss": -11.538237571716309, "global_step": 240393, "epoch": 1430} {"train_loss": -11.45635986328125, "global_step": 240394, "epoch": 1430} {"train_loss": -11.625665664672852, "global_step": 240395, "epoch": 1430} {"train_loss": -11.615065574645996, "global_step": 240396, "epoch": 1430} {"train_loss": -11.728979110717773, "global_step": 240397, "epoch": 1430} {"train_loss": -11.545952796936035, "global_step": 240398, "epoch": 1430} {"train_loss": -11.360124588012695, "global_step": 240399, "epoch": 1430} {"train_loss": -11.622812271118164, "global_step": 240400, "epoch": 1430} {"train_loss": -11.592317581176758, "global_step": 240401, "epoch": 1430} {"train_loss": -11.602211952209473, "global_step": 240402, "epoch": 1430} {"train_loss": -11.644613265991211, "global_step": 240403, "epoch": 1430} {"train_loss": -11.66296672821045, "global_step": 240404, "epoch": 1430} {"train_loss": -11.820402145385742, "global_step": 240405, "epoch": 1430} {"train_loss": -11.696711540222168, "global_step": 240406, "epoch": 1430} {"train_loss": -11.247851229849315, "global_step": 240407, "epoch": 1430, "val_loss": 257066.0625, "train_action_mse_error": 1.1251025199890137} {"train_loss": -11.572674751281738, "global_step": 240408, "epoch": 1431} {"train_loss": -11.727344512939453, "global_step": 240409, "epoch": 1431} {"train_loss": -11.532482147216797, "global_step": 240410, "epoch": 1431} {"train_loss": -11.593732833862305, "global_step": 240411, "epoch": 1431} {"train_loss": -11.805252075195312, "global_step": 240412, "epoch": 1431} {"train_loss": -11.502870559692383, "global_step": 240413, "epoch": 1431} {"train_loss": -12.019947052001953, "global_step": 240414, "epoch": 1431} {"train_loss": -11.84533405303955, "global_step": 240415, "epoch": 1431} {"train_loss": -11.844767570495605, "global_step": 240416, "epoch": 1431} {"train_loss": -11.768356323242188, "global_step": 240417, "epoch": 1431} {"train_loss": -11.631244659423828, "global_step": 240418, "epoch": 1431} {"train_loss": -11.63168716430664, "global_step": 240419, "epoch": 1431} {"train_loss": -11.515398025512695, "global_step": 240420, "epoch": 1431} {"train_loss": -12.0194730758667, "global_step": 240421, "epoch": 1431} {"train_loss": -11.675336837768555, "global_step": 240422, "epoch": 1431} {"train_loss": -11.890565872192383, "global_step": 240423, "epoch": 1431} {"train_loss": -11.746960639953613, "global_step": 240424, "epoch": 1431} {"train_loss": -11.884679794311523, "global_step": 240425, "epoch": 1431} {"train_loss": -11.818002700805664, "global_step": 240426, "epoch": 1431} {"train_loss": -11.722488403320312, "global_step": 240427, "epoch": 1431} {"train_loss": -12.020430564880371, "global_step": 240428, "epoch": 1431} {"train_loss": -11.966887474060059, "global_step": 240429, "epoch": 1431} {"train_loss": -11.861010551452637, "global_step": 240430, "epoch": 1431} {"train_loss": -12.033549308776855, "global_step": 240431, "epoch": 1431} {"train_loss": -11.772440910339355, "global_step": 240432, "epoch": 1431} {"train_loss": -11.858540534973145, "global_step": 240433, "epoch": 1431} {"train_loss": -11.988594055175781, "global_step": 240434, "epoch": 1431} {"train_loss": -12.14763069152832, "global_step": 240435, "epoch": 1431} {"train_loss": -11.93971061706543, "global_step": 240436, "epoch": 1431} {"train_loss": -12.141976356506348, "global_step": 240437, "epoch": 1431} {"train_loss": -12.003524780273438, "global_step": 240438, "epoch": 1431} {"train_loss": -11.97321605682373, "global_step": 240439, "epoch": 1431} {"train_loss": -12.094354629516602, "global_step": 240440, "epoch": 1431} {"train_loss": -11.917169570922852, "global_step": 240441, "epoch": 1431} {"train_loss": -12.003233909606934, "global_step": 240442, "epoch": 1431} {"train_loss": -11.995994567871094, "global_step": 240443, "epoch": 1431} {"train_loss": -11.962607383728027, "global_step": 240444, "epoch": 1431} {"train_loss": -11.944656372070312, "global_step": 240445, "epoch": 1431} {"train_loss": -11.944765090942383, "global_step": 240446, "epoch": 1431} {"train_loss": -11.903080940246582, "global_step": 240447, "epoch": 1431} {"train_loss": -12.102988243103027, "global_step": 240448, "epoch": 1431} {"train_loss": -12.211294174194336, "global_step": 240449, "epoch": 1431} {"train_loss": -11.947790145874023, "global_step": 240450, "epoch": 1431} {"train_loss": -12.094286918640137, "global_step": 240451, "epoch": 1431} {"train_loss": -11.697900772094727, "global_step": 240452, "epoch": 1431} {"train_loss": -12.278963088989258, "global_step": 240453, "epoch": 1431} {"train_loss": -11.854354858398438, "global_step": 240454, "epoch": 1431} {"train_loss": -11.956643104553223, "global_step": 240455, "epoch": 1431} {"train_loss": -11.907106399536133, "global_step": 240456, "epoch": 1431} {"train_loss": -11.78720474243164, "global_step": 240457, "epoch": 1431} {"train_loss": -11.78342342376709, "global_step": 240458, "epoch": 1431} {"train_loss": -12.172721862792969, "global_step": 240459, "epoch": 1431} {"train_loss": -11.662084579467773, "global_step": 240460, "epoch": 1431} {"train_loss": -11.452569961547852, "global_step": 240461, "epoch": 1431} {"train_loss": -11.99787712097168, "global_step": 240462, "epoch": 1431} {"train_loss": -11.99996280670166, "global_step": 240463, "epoch": 1431} {"train_loss": -11.753190994262695, "global_step": 240464, "epoch": 1431} {"train_loss": -11.630309104919434, "global_step": 240465, "epoch": 1431} {"train_loss": -11.900726318359375, "global_step": 240466, "epoch": 1431} {"train_loss": -11.734776496887207, "global_step": 240467, "epoch": 1431} {"train_loss": -11.996950149536133, "global_step": 240468, "epoch": 1431} {"train_loss": -11.848320960998535, "global_step": 240469, "epoch": 1431} {"train_loss": -12.18635368347168, "global_step": 240470, "epoch": 1431} {"train_loss": -11.97462272644043, "global_step": 240471, "epoch": 1431} {"train_loss": -12.123614311218262, "global_step": 240472, "epoch": 1431} {"train_loss": -11.946308135986328, "global_step": 240473, "epoch": 1431} {"train_loss": -11.696111679077148, "global_step": 240474, "epoch": 1431} {"train_loss": -11.475593566894531, "global_step": 240475, "epoch": 1431} {"train_loss": -11.944709777832031, "global_step": 240476, "epoch": 1431} {"train_loss": -12.084939956665039, "global_step": 240477, "epoch": 1431} {"train_loss": -11.26230239868164, "global_step": 240478, "epoch": 1431} {"train_loss": -10.694984436035156, "global_step": 240479, "epoch": 1431} {"train_loss": -10.94576644897461, "global_step": 240480, "epoch": 1431} {"train_loss": -11.863431930541992, "global_step": 240481, "epoch": 1431} {"train_loss": -10.160074234008789, "global_step": 240482, "epoch": 1431} {"train_loss": -10.241451263427734, "global_step": 240483, "epoch": 1431} {"train_loss": -11.93025016784668, "global_step": 240484, "epoch": 1431} {"train_loss": -11.52628231048584, "global_step": 240485, "epoch": 1431} {"train_loss": -11.67770004272461, "global_step": 240486, "epoch": 1431} {"train_loss": -11.915931701660156, "global_step": 240487, "epoch": 1431} {"train_loss": -11.598880767822266, "global_step": 240488, "epoch": 1431} {"train_loss": -11.536018371582031, "global_step": 240489, "epoch": 1431} {"train_loss": -11.89971923828125, "global_step": 240490, "epoch": 1431} {"train_loss": -11.245426177978516, "global_step": 240491, "epoch": 1431} {"train_loss": -11.669078826904297, "global_step": 240492, "epoch": 1431} {"train_loss": -12.04494857788086, "global_step": 240493, "epoch": 1431} {"train_loss": -11.859880447387695, "global_step": 240494, "epoch": 1431} {"train_loss": -11.916139602661133, "global_step": 240495, "epoch": 1431} {"train_loss": -11.62501049041748, "global_step": 240496, "epoch": 1431} {"train_loss": -12.062226295471191, "global_step": 240497, "epoch": 1431} {"train_loss": -11.817086219787598, "global_step": 240498, "epoch": 1431} {"train_loss": -11.72381591796875, "global_step": 240499, "epoch": 1431} {"train_loss": -11.817453384399414, "global_step": 240500, "epoch": 1431} {"train_loss": -11.616170883178711, "global_step": 240501, "epoch": 1431} {"train_loss": -11.921035766601562, "global_step": 240502, "epoch": 1431} {"train_loss": -12.06842041015625, "global_step": 240503, "epoch": 1431} {"train_loss": -11.706501960754395, "global_step": 240504, "epoch": 1431} {"train_loss": -11.921786308288574, "global_step": 240505, "epoch": 1431} {"train_loss": -11.688968658447266, "global_step": 240506, "epoch": 1431} {"train_loss": -11.556257247924805, "global_step": 240507, "epoch": 1431} {"train_loss": -11.853145599365234, "global_step": 240508, "epoch": 1431} {"train_loss": -11.709257125854492, "global_step": 240509, "epoch": 1431} {"train_loss": -11.919524192810059, "global_step": 240510, "epoch": 1431} {"train_loss": -11.349222183227539, "global_step": 240511, "epoch": 1431} {"train_loss": -11.626838684082031, "global_step": 240512, "epoch": 1431} {"train_loss": -11.704261779785156, "global_step": 240513, "epoch": 1431} {"train_loss": -11.468578338623047, "global_step": 240514, "epoch": 1431} {"train_loss": -11.724430084228516, "global_step": 240515, "epoch": 1431} {"train_loss": -11.796340942382812, "global_step": 240516, "epoch": 1431} {"train_loss": -11.642313957214355, "global_step": 240517, "epoch": 1431} {"train_loss": -11.985725402832031, "global_step": 240518, "epoch": 1431} {"train_loss": -11.748309135437012, "global_step": 240519, "epoch": 1431} {"train_loss": -11.709534645080566, "global_step": 240520, "epoch": 1431} {"train_loss": -11.717296600341797, "global_step": 240521, "epoch": 1431} {"train_loss": -11.35927963256836, "global_step": 240522, "epoch": 1431} {"train_loss": -11.31775951385498, "global_step": 240523, "epoch": 1431} {"train_loss": -11.41917610168457, "global_step": 240524, "epoch": 1431} {"train_loss": -11.829517364501953, "global_step": 240525, "epoch": 1431} {"train_loss": -11.136398315429688, "global_step": 240526, "epoch": 1431} {"train_loss": -11.781805038452148, "global_step": 240527, "epoch": 1431} {"train_loss": -11.342110633850098, "global_step": 240528, "epoch": 1431} {"train_loss": -11.797914505004883, "global_step": 240529, "epoch": 1431} {"train_loss": -11.24945068359375, "global_step": 240530, "epoch": 1431} {"train_loss": -11.783585548400879, "global_step": 240531, "epoch": 1431} {"train_loss": -11.89169692993164, "global_step": 240532, "epoch": 1431} {"train_loss": -11.503227233886719, "global_step": 240533, "epoch": 1431} {"train_loss": -11.5946044921875, "global_step": 240534, "epoch": 1431} {"train_loss": -11.643383026123047, "global_step": 240535, "epoch": 1431} {"train_loss": -11.838180541992188, "global_step": 240536, "epoch": 1431} {"train_loss": -11.291011810302734, "global_step": 240537, "epoch": 1431} {"train_loss": -11.758060455322266, "global_step": 240538, "epoch": 1431} {"train_loss": -11.721149444580078, "global_step": 240539, "epoch": 1431} {"train_loss": -11.179447174072266, "global_step": 240540, "epoch": 1431} {"train_loss": -10.968037605285645, "global_step": 240541, "epoch": 1431} {"train_loss": -11.5215425491333, "global_step": 240542, "epoch": 1431} {"train_loss": -11.730018615722656, "global_step": 240543, "epoch": 1431} {"train_loss": -11.122213363647461, "global_step": 240544, "epoch": 1431} {"train_loss": -10.868247032165527, "global_step": 240545, "epoch": 1431} {"train_loss": -10.098470687866211, "global_step": 240546, "epoch": 1431} {"train_loss": -10.574501991271973, "global_step": 240547, "epoch": 1431} {"train_loss": -8.456321716308594, "global_step": 240548, "epoch": 1431} {"train_loss": -9.506831169128418, "global_step": 240549, "epoch": 1431} {"train_loss": -11.197853088378906, "global_step": 240550, "epoch": 1431} {"train_loss": -9.629646301269531, "global_step": 240551, "epoch": 1431} {"train_loss": -9.214040756225586, "global_step": 240552, "epoch": 1431} {"train_loss": -10.708701133728027, "global_step": 240553, "epoch": 1431} {"train_loss": -8.994521141052246, "global_step": 240554, "epoch": 1431} {"train_loss": -9.50082015991211, "global_step": 240555, "epoch": 1431} {"train_loss": -10.714200973510742, "global_step": 240556, "epoch": 1431} {"train_loss": -8.51196002960205, "global_step": 240557, "epoch": 1431} {"train_loss": -10.659770965576172, "global_step": 240558, "epoch": 1431} {"train_loss": -10.55929946899414, "global_step": 240559, "epoch": 1431} {"train_loss": -10.034242630004883, "global_step": 240560, "epoch": 1431} {"train_loss": -10.670509338378906, "global_step": 240561, "epoch": 1431} {"train_loss": -10.724600791931152, "global_step": 240562, "epoch": 1431} {"train_loss": -9.824366569519043, "global_step": 240563, "epoch": 1431} {"train_loss": -11.231218338012695, "global_step": 240564, "epoch": 1431} {"train_loss": -9.43305778503418, "global_step": 240565, "epoch": 1431} {"train_loss": -11.38734245300293, "global_step": 240566, "epoch": 1431} {"train_loss": -10.832645416259766, "global_step": 240567, "epoch": 1431} {"train_loss": -11.124313354492188, "global_step": 240568, "epoch": 1431} {"train_loss": -10.9779052734375, "global_step": 240569, "epoch": 1431} {"train_loss": -11.071258544921875, "global_step": 240570, "epoch": 1431} {"train_loss": -11.447196960449219, "global_step": 240571, "epoch": 1431} {"train_loss": -11.526037216186523, "global_step": 240572, "epoch": 1431} {"train_loss": -11.14698314666748, "global_step": 240573, "epoch": 1431} {"train_loss": -11.424943923950195, "global_step": 240574, "epoch": 1431} {"train_loss": -11.494539624168759, "global_step": 240575, "epoch": 1431, "val_loss": 255331.703125} {"train_loss": -11.400410652160645, "global_step": 240576, "epoch": 1432} {"train_loss": -11.485275268554688, "global_step": 240577, "epoch": 1432} {"train_loss": -11.45303726196289, "global_step": 240578, "epoch": 1432} {"train_loss": -11.41415023803711, "global_step": 240579, "epoch": 1432} {"train_loss": -11.531776428222656, "global_step": 240580, "epoch": 1432} {"train_loss": -11.65021800994873, "global_step": 240581, "epoch": 1432} {"train_loss": -11.444822311401367, "global_step": 240582, "epoch": 1432} {"train_loss": -11.452065467834473, "global_step": 240583, "epoch": 1432} {"train_loss": -11.609258651733398, "global_step": 240584, "epoch": 1432} {"train_loss": -11.463037490844727, "global_step": 240585, "epoch": 1432} {"train_loss": -11.531486511230469, "global_step": 240586, "epoch": 1432} {"train_loss": -11.45417594909668, "global_step": 240587, "epoch": 1432} {"train_loss": -11.691255569458008, "global_step": 240588, "epoch": 1432} {"train_loss": -11.610282897949219, "global_step": 240589, "epoch": 1432} {"train_loss": -11.738471984863281, "global_step": 240590, "epoch": 1432} {"train_loss": -11.742016792297363, "global_step": 240591, "epoch": 1432} {"train_loss": -11.946060180664062, "global_step": 240592, "epoch": 1432} {"train_loss": -11.751784324645996, "global_step": 240593, "epoch": 1432} {"train_loss": -11.481202125549316, "global_step": 240594, "epoch": 1432} {"train_loss": -11.716864585876465, "global_step": 240595, "epoch": 1432} {"train_loss": -11.723161697387695, "global_step": 240596, "epoch": 1432} {"train_loss": -11.672508239746094, "global_step": 240597, "epoch": 1432} {"train_loss": -11.999666213989258, "global_step": 240598, "epoch": 1432} {"train_loss": -11.891798973083496, "global_step": 240599, "epoch": 1432} {"train_loss": -11.65180778503418, "global_step": 240600, "epoch": 1432} {"train_loss": -11.798049926757812, "global_step": 240601, "epoch": 1432} {"train_loss": -11.653620719909668, "global_step": 240602, "epoch": 1432} {"train_loss": -11.801990509033203, "global_step": 240603, "epoch": 1432} {"train_loss": -11.902143478393555, "global_step": 240604, "epoch": 1432} {"train_loss": -11.740983963012695, "global_step": 240605, "epoch": 1432} {"train_loss": -11.828527450561523, "global_step": 240606, "epoch": 1432} {"train_loss": -11.917685508728027, "global_step": 240607, "epoch": 1432} {"train_loss": -11.790994644165039, "global_step": 240608, "epoch": 1432} {"train_loss": -11.984358787536621, "global_step": 240609, "epoch": 1432} {"train_loss": -11.823745727539062, "global_step": 240610, "epoch": 1432} {"train_loss": -11.680886268615723, "global_step": 240611, "epoch": 1432} {"train_loss": -11.936138153076172, "global_step": 240612, "epoch": 1432} {"train_loss": -11.849624633789062, "global_step": 240613, "epoch": 1432} {"train_loss": -11.912558555603027, "global_step": 240614, "epoch": 1432} {"train_loss": -11.932132720947266, "global_step": 240615, "epoch": 1432} {"train_loss": -11.976675033569336, "global_step": 240616, "epoch": 1432} {"train_loss": -11.886327743530273, "global_step": 240617, "epoch": 1432} {"train_loss": -11.426115036010742, "global_step": 240618, "epoch": 1432} {"train_loss": -11.764592170715332, "global_step": 240619, "epoch": 1432} {"train_loss": -11.834373474121094, "global_step": 240620, "epoch": 1432} {"train_loss": -11.427865028381348, "global_step": 240621, "epoch": 1432} {"train_loss": -11.779972076416016, "global_step": 240622, "epoch": 1432} {"train_loss": -11.631780624389648, "global_step": 240623, "epoch": 1432} {"train_loss": -11.585594177246094, "global_step": 240624, "epoch": 1432} {"train_loss": -11.713624000549316, "global_step": 240625, "epoch": 1432} {"train_loss": -11.447378158569336, "global_step": 240626, "epoch": 1432} {"train_loss": -11.856332778930664, "global_step": 240627, "epoch": 1432} {"train_loss": -10.733854293823242, "global_step": 240628, "epoch": 1432} {"train_loss": -11.473902702331543, "global_step": 240629, "epoch": 1432} {"train_loss": -11.187084197998047, "global_step": 240630, "epoch": 1432} {"train_loss": -11.018058776855469, "global_step": 240631, "epoch": 1432} {"train_loss": -11.309499740600586, "global_step": 240632, "epoch": 1432} {"train_loss": -11.207108497619629, "global_step": 240633, "epoch": 1432} {"train_loss": -10.665240287780762, "global_step": 240634, "epoch": 1432} {"train_loss": -11.34238052368164, "global_step": 240635, "epoch": 1432} {"train_loss": -10.423465728759766, "global_step": 240636, "epoch": 1432} {"train_loss": -9.792762756347656, "global_step": 240637, "epoch": 1432} {"train_loss": -11.847909927368164, "global_step": 240638, "epoch": 1432} {"train_loss": -10.563003540039062, "global_step": 240639, "epoch": 1432} {"train_loss": -10.937169075012207, "global_step": 240640, "epoch": 1432} {"train_loss": -11.210803985595703, "global_step": 240641, "epoch": 1432} {"train_loss": -10.63602352142334, "global_step": 240642, "epoch": 1432} {"train_loss": -10.748785018920898, "global_step": 240643, "epoch": 1432} {"train_loss": -10.76724624633789, "global_step": 240644, "epoch": 1432} {"train_loss": -11.239297866821289, "global_step": 240645, "epoch": 1432} {"train_loss": -9.795572280883789, "global_step": 240646, "epoch": 1432} {"train_loss": -9.433645248413086, "global_step": 240647, "epoch": 1432} {"train_loss": -10.062599182128906, "global_step": 240648, "epoch": 1432} {"train_loss": -10.364553451538086, "global_step": 240649, "epoch": 1432} {"train_loss": -10.618474960327148, "global_step": 240650, "epoch": 1432} {"train_loss": -9.753576278686523, "global_step": 240651, "epoch": 1432} {"train_loss": -10.006065368652344, "global_step": 240652, "epoch": 1432} {"train_loss": -10.767823219299316, "global_step": 240653, "epoch": 1432} {"train_loss": -9.238753318786621, "global_step": 240654, "epoch": 1432} {"train_loss": -10.40066146850586, "global_step": 240655, "epoch": 1432} {"train_loss": -11.451995849609375, "global_step": 240656, "epoch": 1432} {"train_loss": -10.12677001953125, "global_step": 240657, "epoch": 1432} {"train_loss": -10.649141311645508, "global_step": 240658, "epoch": 1432} {"train_loss": -10.831802368164062, "global_step": 240659, "epoch": 1432} {"train_loss": -10.17203140258789, "global_step": 240660, "epoch": 1432} {"train_loss": -10.605754852294922, "global_step": 240661, "epoch": 1432} {"train_loss": -11.465816497802734, "global_step": 240662, "epoch": 1432} {"train_loss": -10.200019836425781, "global_step": 240663, "epoch": 1432} {"train_loss": -11.149789810180664, "global_step": 240664, "epoch": 1432} {"train_loss": -10.923555374145508, "global_step": 240665, "epoch": 1432} {"train_loss": -10.788140296936035, "global_step": 240666, "epoch": 1432} {"train_loss": -10.860358238220215, "global_step": 240667, "epoch": 1432} {"train_loss": -11.43986701965332, "global_step": 240668, "epoch": 1432} {"train_loss": -10.483264923095703, "global_step": 240669, "epoch": 1432} {"train_loss": -11.352489471435547, "global_step": 240670, "epoch": 1432} {"train_loss": -11.240911483764648, "global_step": 240671, "epoch": 1432} {"train_loss": -11.228832244873047, "global_step": 240672, "epoch": 1432} {"train_loss": -11.445596694946289, "global_step": 240673, "epoch": 1432} {"train_loss": -11.432357788085938, "global_step": 240674, "epoch": 1432} {"train_loss": -11.22287368774414, "global_step": 240675, "epoch": 1432} {"train_loss": -11.086246490478516, "global_step": 240676, "epoch": 1432} {"train_loss": -11.56527042388916, "global_step": 240677, "epoch": 1432} {"train_loss": -11.15464973449707, "global_step": 240678, "epoch": 1432} {"train_loss": -11.2601900100708, "global_step": 240679, "epoch": 1432} {"train_loss": -11.614533424377441, "global_step": 240680, "epoch": 1432} {"train_loss": -11.555591583251953, "global_step": 240681, "epoch": 1432} {"train_loss": -11.292242050170898, "global_step": 240682, "epoch": 1432} {"train_loss": -11.51373291015625, "global_step": 240683, "epoch": 1432} {"train_loss": -11.472620010375977, "global_step": 240684, "epoch": 1432} {"train_loss": -11.412246704101562, "global_step": 240685, "epoch": 1432} {"train_loss": -11.479867935180664, "global_step": 240686, "epoch": 1432} {"train_loss": -11.40785026550293, "global_step": 240687, "epoch": 1432} {"train_loss": -11.567888259887695, "global_step": 240688, "epoch": 1432} {"train_loss": -11.534857749938965, "global_step": 240689, "epoch": 1432} {"train_loss": -11.79052448272705, "global_step": 240690, "epoch": 1432} {"train_loss": -11.53847599029541, "global_step": 240691, "epoch": 1432} {"train_loss": -11.66960334777832, "global_step": 240692, "epoch": 1432} {"train_loss": -11.662376403808594, "global_step": 240693, "epoch": 1432} {"train_loss": -11.733641624450684, "global_step": 240694, "epoch": 1432} {"train_loss": -11.747451782226562, "global_step": 240695, "epoch": 1432} {"train_loss": -11.58035945892334, "global_step": 240696, "epoch": 1432} {"train_loss": -11.586641311645508, "global_step": 240697, "epoch": 1432} {"train_loss": -11.574657440185547, "global_step": 240698, "epoch": 1432} {"train_loss": -11.728776931762695, "global_step": 240699, "epoch": 1432} {"train_loss": -11.865967750549316, "global_step": 240700, "epoch": 1432} {"train_loss": -11.590248107910156, "global_step": 240701, "epoch": 1432} {"train_loss": -11.929747581481934, "global_step": 240702, "epoch": 1432} {"train_loss": -11.741302490234375, "global_step": 240703, "epoch": 1432} {"train_loss": -11.71538257598877, "global_step": 240704, "epoch": 1432} {"train_loss": -11.915270805358887, "global_step": 240705, "epoch": 1432} {"train_loss": -11.913871765136719, "global_step": 240706, "epoch": 1432} {"train_loss": -11.830842971801758, "global_step": 240707, "epoch": 1432} {"train_loss": -11.995025634765625, "global_step": 240708, "epoch": 1432} {"train_loss": -11.777886390686035, "global_step": 240709, "epoch": 1432} {"train_loss": -11.955229759216309, "global_step": 240710, "epoch": 1432} {"train_loss": -11.936834335327148, "global_step": 240711, "epoch": 1432} {"train_loss": -11.845953941345215, "global_step": 240712, "epoch": 1432} {"train_loss": -12.010002136230469, "global_step": 240713, "epoch": 1432} {"train_loss": -12.122598648071289, "global_step": 240714, "epoch": 1432} {"train_loss": -12.103788375854492, "global_step": 240715, "epoch": 1432} {"train_loss": -12.105682373046875, "global_step": 240716, "epoch": 1432} {"train_loss": -11.999810218811035, "global_step": 240717, "epoch": 1432} {"train_loss": -11.936155319213867, "global_step": 240718, "epoch": 1432} {"train_loss": -11.968713760375977, "global_step": 240719, "epoch": 1432} {"train_loss": -11.929813385009766, "global_step": 240720, "epoch": 1432} {"train_loss": -11.964235305786133, "global_step": 240721, "epoch": 1432} {"train_loss": -11.97642707824707, "global_step": 240722, "epoch": 1432} {"train_loss": -11.990544319152832, "global_step": 240723, "epoch": 1432} {"train_loss": -11.916544914245605, "global_step": 240724, "epoch": 1432} {"train_loss": -11.827834129333496, "global_step": 240725, "epoch": 1432} {"train_loss": -12.139363288879395, "global_step": 240726, "epoch": 1432} {"train_loss": -12.12353229522705, "global_step": 240727, "epoch": 1432} {"train_loss": -12.050128936767578, "global_step": 240728, "epoch": 1432} {"train_loss": -12.183877944946289, "global_step": 240729, "epoch": 1432} {"train_loss": -11.96912956237793, "global_step": 240730, "epoch": 1432} {"train_loss": -12.158138275146484, "global_step": 240731, "epoch": 1432} {"train_loss": -11.933754920959473, "global_step": 240732, "epoch": 1432} {"train_loss": -11.96223258972168, "global_step": 240733, "epoch": 1432} {"train_loss": -12.175477981567383, "global_step": 240734, "epoch": 1432} {"train_loss": -11.501533508300781, "global_step": 240735, "epoch": 1432} {"train_loss": -10.999744415283203, "global_step": 240736, "epoch": 1432} {"train_loss": -11.140998840332031, "global_step": 240737, "epoch": 1432} {"train_loss": -11.952924728393555, "global_step": 240738, "epoch": 1432} {"train_loss": -11.845690727233887, "global_step": 240739, "epoch": 1432} {"train_loss": -11.954071044921875, "global_step": 240740, "epoch": 1432} {"train_loss": -12.086520195007324, "global_step": 240741, "epoch": 1432} {"train_loss": -12.227740287780762, "global_step": 240742, "epoch": 1432} {"train_loss": -11.462447717076255, "global_step": 240743, "epoch": 1432, "val_loss": 262028.90625} {"train_loss": -11.754035949707031, "global_step": 240744, "epoch": 1433} {"train_loss": -11.962411880493164, "global_step": 240745, "epoch": 1433} {"train_loss": -12.10275650024414, "global_step": 240746, "epoch": 1433} {"train_loss": -11.854667663574219, "global_step": 240747, "epoch": 1433} {"train_loss": -11.809682846069336, "global_step": 240748, "epoch": 1433} {"train_loss": -12.101929664611816, "global_step": 240749, "epoch": 1433} {"train_loss": -10.726550102233887, "global_step": 240750, "epoch": 1433} {"train_loss": -11.993383407592773, "global_step": 240751, "epoch": 1433} {"train_loss": -12.014636993408203, "global_step": 240752, "epoch": 1433} {"train_loss": -11.592010498046875, "global_step": 240753, "epoch": 1433} {"train_loss": -11.564270973205566, "global_step": 240754, "epoch": 1433} {"train_loss": -11.57989501953125, "global_step": 240755, "epoch": 1433} {"train_loss": -11.85699462890625, "global_step": 240756, "epoch": 1433} {"train_loss": -11.523828506469727, "global_step": 240757, "epoch": 1433} {"train_loss": -12.193031311035156, "global_step": 240758, "epoch": 1433} {"train_loss": -11.461847305297852, "global_step": 240759, "epoch": 1433} {"train_loss": -11.397784233093262, "global_step": 240760, "epoch": 1433} {"train_loss": -11.75444221496582, "global_step": 240761, "epoch": 1433} {"train_loss": -11.890443801879883, "global_step": 240762, "epoch": 1433} {"train_loss": -11.75837230682373, "global_step": 240763, "epoch": 1433} {"train_loss": -11.709209442138672, "global_step": 240764, "epoch": 1433} {"train_loss": -11.405715942382812, "global_step": 240765, "epoch": 1433} {"train_loss": -11.481843948364258, "global_step": 240766, "epoch": 1433} {"train_loss": -11.713957786560059, "global_step": 240767, "epoch": 1433} {"train_loss": -11.661417007446289, "global_step": 240768, "epoch": 1433} {"train_loss": -11.232390403747559, "global_step": 240769, "epoch": 1433} {"train_loss": -11.930404663085938, "global_step": 240770, "epoch": 1433} {"train_loss": -11.27473258972168, "global_step": 240771, "epoch": 1433} {"train_loss": -11.320554733276367, "global_step": 240772, "epoch": 1433} {"train_loss": -11.144646644592285, "global_step": 240773, "epoch": 1433} {"train_loss": -11.89475154876709, "global_step": 240774, "epoch": 1433} {"train_loss": -11.382481575012207, "global_step": 240775, "epoch": 1433} {"train_loss": -11.752503395080566, "global_step": 240776, "epoch": 1433} {"train_loss": -11.462868690490723, "global_step": 240777, "epoch": 1433} {"train_loss": -11.553923606872559, "global_step": 240778, "epoch": 1433} {"train_loss": -11.899089813232422, "global_step": 240779, "epoch": 1433} {"train_loss": -11.593841552734375, "global_step": 240780, "epoch": 1433} {"train_loss": -11.658689498901367, "global_step": 240781, "epoch": 1433} {"train_loss": -11.828964233398438, "global_step": 240782, "epoch": 1433} {"train_loss": -11.879332542419434, "global_step": 240783, "epoch": 1433} {"train_loss": -11.639982223510742, "global_step": 240784, "epoch": 1433} {"train_loss": -12.016777038574219, "global_step": 240785, "epoch": 1433} {"train_loss": -11.586437225341797, "global_step": 240786, "epoch": 1433} {"train_loss": -11.994356155395508, "global_step": 240787, "epoch": 1433} {"train_loss": -11.498746871948242, "global_step": 240788, "epoch": 1433} {"train_loss": -11.893463134765625, "global_step": 240789, "epoch": 1433} {"train_loss": -11.610583305358887, "global_step": 240790, "epoch": 1433} {"train_loss": -12.070842742919922, "global_step": 240791, "epoch": 1433} {"train_loss": -11.818846702575684, "global_step": 240792, "epoch": 1433} {"train_loss": -11.843515396118164, "global_step": 240793, "epoch": 1433} {"train_loss": -11.975656509399414, "global_step": 240794, "epoch": 1433} {"train_loss": -11.973440170288086, "global_step": 240795, "epoch": 1433} {"train_loss": -11.762016296386719, "global_step": 240796, "epoch": 1433} {"train_loss": -11.850528717041016, "global_step": 240797, "epoch": 1433} {"train_loss": -11.99638557434082, "global_step": 240798, "epoch": 1433} {"train_loss": -11.838359832763672, "global_step": 240799, "epoch": 1433} {"train_loss": -11.838289260864258, "global_step": 240800, "epoch": 1433} {"train_loss": -11.528985023498535, "global_step": 240801, "epoch": 1433} {"train_loss": -11.976213455200195, "global_step": 240802, "epoch": 1433} {"train_loss": -11.77886962890625, "global_step": 240803, "epoch": 1433} {"train_loss": -12.093639373779297, "global_step": 240804, "epoch": 1433} {"train_loss": -11.817899703979492, "global_step": 240805, "epoch": 1433} {"train_loss": -11.624107360839844, "global_step": 240806, "epoch": 1433} {"train_loss": -11.839696884155273, "global_step": 240807, "epoch": 1433} {"train_loss": -12.133970260620117, "global_step": 240808, "epoch": 1433} {"train_loss": -12.068647384643555, "global_step": 240809, "epoch": 1433} {"train_loss": -11.957763671875, "global_step": 240810, "epoch": 1433} {"train_loss": -11.881662368774414, "global_step": 240811, "epoch": 1433} {"train_loss": -11.877805709838867, "global_step": 240812, "epoch": 1433} {"train_loss": -12.062076568603516, "global_step": 240813, "epoch": 1433} {"train_loss": -12.110305786132812, "global_step": 240814, "epoch": 1433} {"train_loss": -12.036386489868164, "global_step": 240815, "epoch": 1433} {"train_loss": -12.10599422454834, "global_step": 240816, "epoch": 1433} {"train_loss": -11.754440307617188, "global_step": 240817, "epoch": 1433} {"train_loss": -11.969532012939453, "global_step": 240818, "epoch": 1433} {"train_loss": -12.116007804870605, "global_step": 240819, "epoch": 1433} {"train_loss": -11.91678237915039, "global_step": 240820, "epoch": 1433} {"train_loss": -11.673282623291016, "global_step": 240821, "epoch": 1433} {"train_loss": -12.19329833984375, "global_step": 240822, "epoch": 1433} {"train_loss": -11.856536865234375, "global_step": 240823, "epoch": 1433} {"train_loss": -11.833334922790527, "global_step": 240824, "epoch": 1433} {"train_loss": -11.882816314697266, "global_step": 240825, "epoch": 1433} {"train_loss": -11.848339080810547, "global_step": 240826, "epoch": 1433} {"train_loss": -12.051332473754883, "global_step": 240827, "epoch": 1433} {"train_loss": -11.735555648803711, "global_step": 240828, "epoch": 1433} {"train_loss": -11.758965492248535, "global_step": 240829, "epoch": 1433} {"train_loss": -11.708403587341309, "global_step": 240830, "epoch": 1433} {"train_loss": -11.425909042358398, "global_step": 240831, "epoch": 1433} {"train_loss": -11.445518493652344, "global_step": 240832, "epoch": 1433} {"train_loss": -11.440702438354492, "global_step": 240833, "epoch": 1433} {"train_loss": -11.343521118164062, "global_step": 240834, "epoch": 1433} {"train_loss": -10.41547679901123, "global_step": 240835, "epoch": 1433} {"train_loss": -10.301297187805176, "global_step": 240836, "epoch": 1433} {"train_loss": -11.774185180664062, "global_step": 240837, "epoch": 1433} {"train_loss": -10.44614028930664, "global_step": 240838, "epoch": 1433} {"train_loss": -9.982416152954102, "global_step": 240839, "epoch": 1433} {"train_loss": -11.183349609375, "global_step": 240840, "epoch": 1433} {"train_loss": -9.817286491394043, "global_step": 240841, "epoch": 1433} {"train_loss": -10.999732971191406, "global_step": 240842, "epoch": 1433} {"train_loss": -11.089300155639648, "global_step": 240843, "epoch": 1433} {"train_loss": -10.582924842834473, "global_step": 240844, "epoch": 1433} {"train_loss": -10.246435165405273, "global_step": 240845, "epoch": 1433} {"train_loss": -11.128402709960938, "global_step": 240846, "epoch": 1433} {"train_loss": -10.880159378051758, "global_step": 240847, "epoch": 1433} {"train_loss": -9.721752166748047, "global_step": 240848, "epoch": 1433} {"train_loss": -11.407792091369629, "global_step": 240849, "epoch": 1433} {"train_loss": -10.039862632751465, "global_step": 240850, "epoch": 1433} {"train_loss": -10.707538604736328, "global_step": 240851, "epoch": 1433} {"train_loss": -10.248199462890625, "global_step": 240852, "epoch": 1433} {"train_loss": -10.119524002075195, "global_step": 240853, "epoch": 1433} {"train_loss": -10.486374855041504, "global_step": 240854, "epoch": 1433} {"train_loss": -10.290761947631836, "global_step": 240855, "epoch": 1433} {"train_loss": -10.930342674255371, "global_step": 240856, "epoch": 1433} {"train_loss": -10.872102737426758, "global_step": 240857, "epoch": 1433} {"train_loss": -10.487966537475586, "global_step": 240858, "epoch": 1433} {"train_loss": -11.200340270996094, "global_step": 240859, "epoch": 1433} {"train_loss": -10.99978256225586, "global_step": 240860, "epoch": 1433} {"train_loss": -10.756062507629395, "global_step": 240861, "epoch": 1433} {"train_loss": -10.604904174804688, "global_step": 240862, "epoch": 1433} {"train_loss": -11.48122501373291, "global_step": 240863, "epoch": 1433} {"train_loss": -10.387794494628906, "global_step": 240864, "epoch": 1433} {"train_loss": -10.836479187011719, "global_step": 240865, "epoch": 1433} {"train_loss": -10.92018985748291, "global_step": 240866, "epoch": 1433} {"train_loss": -10.495809555053711, "global_step": 240867, "epoch": 1433} {"train_loss": -11.19676685333252, "global_step": 240868, "epoch": 1433} {"train_loss": -10.562272071838379, "global_step": 240869, "epoch": 1433} {"train_loss": -10.976030349731445, "global_step": 240870, "epoch": 1433} {"train_loss": -11.031195640563965, "global_step": 240871, "epoch": 1433} {"train_loss": -11.121526718139648, "global_step": 240872, "epoch": 1433} {"train_loss": -11.16284465789795, "global_step": 240873, "epoch": 1433} {"train_loss": -11.354994773864746, "global_step": 240874, "epoch": 1433} {"train_loss": -11.456094741821289, "global_step": 240875, "epoch": 1433} {"train_loss": -11.077853202819824, "global_step": 240876, "epoch": 1433} {"train_loss": -11.304121017456055, "global_step": 240877, "epoch": 1433} {"train_loss": -11.517288208007812, "global_step": 240878, "epoch": 1433} {"train_loss": -11.354043960571289, "global_step": 240879, "epoch": 1433} {"train_loss": -11.4928617477417, "global_step": 240880, "epoch": 1433} {"train_loss": -11.598501205444336, "global_step": 240881, "epoch": 1433} {"train_loss": -11.37571907043457, "global_step": 240882, "epoch": 1433} {"train_loss": -11.554865837097168, "global_step": 240883, "epoch": 1433} {"train_loss": -11.496638298034668, "global_step": 240884, "epoch": 1433} {"train_loss": -11.30126667022705, "global_step": 240885, "epoch": 1433} {"train_loss": -11.96312141418457, "global_step": 240886, "epoch": 1433} {"train_loss": -11.547944068908691, "global_step": 240887, "epoch": 1433} {"train_loss": -11.678301811218262, "global_step": 240888, "epoch": 1433} {"train_loss": -11.595109939575195, "global_step": 240889, "epoch": 1433} {"train_loss": -11.647741317749023, "global_step": 240890, "epoch": 1433} {"train_loss": -11.772153854370117, "global_step": 240891, "epoch": 1433} {"train_loss": -11.664702415466309, "global_step": 240892, "epoch": 1433} {"train_loss": -11.636007308959961, "global_step": 240893, "epoch": 1433} {"train_loss": -11.626635551452637, "global_step": 240894, "epoch": 1433} {"train_loss": -11.920576095581055, "global_step": 240895, "epoch": 1433} {"train_loss": -11.738702774047852, "global_step": 240896, "epoch": 1433} {"train_loss": -11.894163131713867, "global_step": 240897, "epoch": 1433} {"train_loss": -11.91762924194336, "global_step": 240898, "epoch": 1433} {"train_loss": -11.914709091186523, "global_step": 240899, "epoch": 1433} {"train_loss": -11.992559432983398, "global_step": 240900, "epoch": 1433} {"train_loss": -11.85904598236084, "global_step": 240901, "epoch": 1433} {"train_loss": -11.903404235839844, "global_step": 240902, "epoch": 1433} {"train_loss": -12.0030517578125, "global_step": 240903, "epoch": 1433} {"train_loss": -12.107629776000977, "global_step": 240904, "epoch": 1433} {"train_loss": -11.760346412658691, "global_step": 240905, "epoch": 1433} {"train_loss": -12.014541625976562, "global_step": 240906, "epoch": 1433} {"train_loss": -11.959918975830078, "global_step": 240907, "epoch": 1433} {"train_loss": -11.722580909729004, "global_step": 240908, "epoch": 1433} {"train_loss": -12.0128812789917, "global_step": 240909, "epoch": 1433} {"train_loss": -11.71951961517334, "global_step": 240910, "epoch": 1433} {"train_loss": -11.505640268325806, "global_step": 240911, "epoch": 1433, "val_loss": 265632.375} {"train_loss": -11.721597671508789, "global_step": 240912, "epoch": 1434} {"train_loss": -11.745896339416504, "global_step": 240913, "epoch": 1434} {"train_loss": -10.973901748657227, "global_step": 240914, "epoch": 1434} {"train_loss": -11.798545837402344, "global_step": 240915, "epoch": 1434} {"train_loss": -11.28807258605957, "global_step": 240916, "epoch": 1434} {"train_loss": -11.288930892944336, "global_step": 240917, "epoch": 1434} {"train_loss": -11.541441917419434, "global_step": 240918, "epoch": 1434} {"train_loss": -11.407827377319336, "global_step": 240919, "epoch": 1434} {"train_loss": -11.570192337036133, "global_step": 240920, "epoch": 1434} {"train_loss": -11.706335067749023, "global_step": 240921, "epoch": 1434} {"train_loss": -11.629897117614746, "global_step": 240922, "epoch": 1434} {"train_loss": -11.220451354980469, "global_step": 240923, "epoch": 1434} {"train_loss": -11.526540756225586, "global_step": 240924, "epoch": 1434} {"train_loss": -11.601926803588867, "global_step": 240925, "epoch": 1434} {"train_loss": -11.408666610717773, "global_step": 240926, "epoch": 1434} {"train_loss": -12.14558219909668, "global_step": 240927, "epoch": 1434} {"train_loss": -11.48570442199707, "global_step": 240928, "epoch": 1434} {"train_loss": -11.791275024414062, "global_step": 240929, "epoch": 1434} {"train_loss": -11.650362968444824, "global_step": 240930, "epoch": 1434} {"train_loss": -11.476789474487305, "global_step": 240931, "epoch": 1434} {"train_loss": -11.927034378051758, "global_step": 240932, "epoch": 1434} {"train_loss": -11.425505638122559, "global_step": 240933, "epoch": 1434} {"train_loss": -11.854133605957031, "global_step": 240934, "epoch": 1434} {"train_loss": -11.697522163391113, "global_step": 240935, "epoch": 1434} {"train_loss": -11.357128143310547, "global_step": 240936, "epoch": 1434} {"train_loss": -12.0595703125, "global_step": 240937, "epoch": 1434} {"train_loss": -11.590946197509766, "global_step": 240938, "epoch": 1434} {"train_loss": -12.001482963562012, "global_step": 240939, "epoch": 1434} {"train_loss": -11.619818687438965, "global_step": 240940, "epoch": 1434} {"train_loss": -11.995177268981934, "global_step": 240941, "epoch": 1434} {"train_loss": -11.933116912841797, "global_step": 240942, "epoch": 1434} {"train_loss": -11.932515144348145, "global_step": 240943, "epoch": 1434} {"train_loss": -11.841815948486328, "global_step": 240944, "epoch": 1434} {"train_loss": -11.818805694580078, "global_step": 240945, "epoch": 1434} {"train_loss": -11.860063552856445, "global_step": 240946, "epoch": 1434} {"train_loss": -11.833951950073242, "global_step": 240947, "epoch": 1434} {"train_loss": -11.99059772491455, "global_step": 240948, "epoch": 1434} {"train_loss": -12.109945297241211, "global_step": 240949, "epoch": 1434} {"train_loss": -11.921957015991211, "global_step": 240950, "epoch": 1434} {"train_loss": -11.951091766357422, "global_step": 240951, "epoch": 1434} {"train_loss": -12.254322052001953, "global_step": 240952, "epoch": 1434} {"train_loss": -11.861871719360352, "global_step": 240953, "epoch": 1434} {"train_loss": -11.963099479675293, "global_step": 240954, "epoch": 1434} {"train_loss": -11.946906089782715, "global_step": 240955, "epoch": 1434} {"train_loss": -12.229828834533691, "global_step": 240956, "epoch": 1434} {"train_loss": -11.953540802001953, "global_step": 240957, "epoch": 1434} {"train_loss": -12.178033828735352, "global_step": 240958, "epoch": 1434} {"train_loss": -11.873078346252441, "global_step": 240959, "epoch": 1434} {"train_loss": -12.051376342773438, "global_step": 240960, "epoch": 1434} {"train_loss": -11.617576599121094, "global_step": 240961, "epoch": 1434} {"train_loss": -11.588024139404297, "global_step": 240962, "epoch": 1434} {"train_loss": -12.22370433807373, "global_step": 240963, "epoch": 1434} {"train_loss": -11.79996109008789, "global_step": 240964, "epoch": 1434} {"train_loss": -11.945487976074219, "global_step": 240965, "epoch": 1434} {"train_loss": -11.962323188781738, "global_step": 240966, "epoch": 1434} {"train_loss": -12.256780624389648, "global_step": 240967, "epoch": 1434} {"train_loss": -11.952611923217773, "global_step": 240968, "epoch": 1434} {"train_loss": -12.048384666442871, "global_step": 240969, "epoch": 1434} {"train_loss": -12.063810348510742, "global_step": 240970, "epoch": 1434} {"train_loss": -11.968084335327148, "global_step": 240971, "epoch": 1434} {"train_loss": -11.638870239257812, "global_step": 240972, "epoch": 1434} {"train_loss": -10.837992668151855, "global_step": 240973, "epoch": 1434} {"train_loss": -10.160888671875, "global_step": 240974, "epoch": 1434} {"train_loss": -11.43618392944336, "global_step": 240975, "epoch": 1434} {"train_loss": -9.092511177062988, "global_step": 240976, "epoch": 1434} {"train_loss": -10.56197738647461, "global_step": 240977, "epoch": 1434} {"train_loss": -9.36098861694336, "global_step": 240978, "epoch": 1434} {"train_loss": -10.75645637512207, "global_step": 240979, "epoch": 1434} {"train_loss": -9.694438934326172, "global_step": 240980, "epoch": 1434} {"train_loss": -9.45001220703125, "global_step": 240981, "epoch": 1434} {"train_loss": -7.343527317047119, "global_step": 240982, "epoch": 1434} {"train_loss": -10.424776077270508, "global_step": 240983, "epoch": 1434} {"train_loss": -7.441623687744141, "global_step": 240984, "epoch": 1434} {"train_loss": -8.82711410522461, "global_step": 240985, "epoch": 1434} {"train_loss": -7.086453914642334, "global_step": 240986, "epoch": 1434} {"train_loss": -6.408469200134277, "global_step": 240987, "epoch": 1434} {"train_loss": -6.996981620788574, "global_step": 240988, "epoch": 1434} {"train_loss": -6.846572399139404, "global_step": 240989, "epoch": 1434} {"train_loss": -8.349574089050293, "global_step": 240990, "epoch": 1434} {"train_loss": -8.331413269042969, "global_step": 240991, "epoch": 1434} {"train_loss": -8.855644226074219, "global_step": 240992, "epoch": 1434} {"train_loss": -8.381416320800781, "global_step": 240993, "epoch": 1434} {"train_loss": -8.606283187866211, "global_step": 240994, "epoch": 1434} {"train_loss": -8.209271430969238, "global_step": 240995, "epoch": 1434} {"train_loss": -8.38972282409668, "global_step": 240996, "epoch": 1434} {"train_loss": -9.39923095703125, "global_step": 240997, "epoch": 1434} {"train_loss": -8.871403694152832, "global_step": 240998, "epoch": 1434} {"train_loss": -10.455336570739746, "global_step": 240999, "epoch": 1434} {"train_loss": -10.401348114013672, "global_step": 241000, "epoch": 1434} {"train_loss": -9.46800422668457, "global_step": 241001, "epoch": 1434} {"train_loss": -9.52116584777832, "global_step": 241002, "epoch": 1434} {"train_loss": -10.558391571044922, "global_step": 241003, "epoch": 1434} {"train_loss": -9.342567443847656, "global_step": 241004, "epoch": 1434} {"train_loss": -9.380241394042969, "global_step": 241005, "epoch": 1434} {"train_loss": -10.719825744628906, "global_step": 241006, "epoch": 1434} {"train_loss": -10.540020942687988, "global_step": 241007, "epoch": 1434} {"train_loss": -9.967219352722168, "global_step": 241008, "epoch": 1434} {"train_loss": -9.884422302246094, "global_step": 241009, "epoch": 1434} {"train_loss": -10.470767974853516, "global_step": 241010, "epoch": 1434} {"train_loss": -10.465648651123047, "global_step": 241011, "epoch": 1434} {"train_loss": -10.098384857177734, "global_step": 241012, "epoch": 1434} {"train_loss": -10.707649230957031, "global_step": 241013, "epoch": 1434} {"train_loss": -10.868795394897461, "global_step": 241014, "epoch": 1434} {"train_loss": -11.041572570800781, "global_step": 241015, "epoch": 1434} {"train_loss": -10.517101287841797, "global_step": 241016, "epoch": 1434} {"train_loss": -11.1259126663208, "global_step": 241017, "epoch": 1434} {"train_loss": -11.210479736328125, "global_step": 241018, "epoch": 1434} {"train_loss": -11.098470687866211, "global_step": 241019, "epoch": 1434} {"train_loss": -11.013976097106934, "global_step": 241020, "epoch": 1434} {"train_loss": -11.23260498046875, "global_step": 241021, "epoch": 1434} {"train_loss": -11.061570167541504, "global_step": 241022, "epoch": 1434} {"train_loss": -11.149286270141602, "global_step": 241023, "epoch": 1434} {"train_loss": -11.189302444458008, "global_step": 241024, "epoch": 1434} {"train_loss": -11.221479415893555, "global_step": 241025, "epoch": 1434} {"train_loss": -11.313255310058594, "global_step": 241026, "epoch": 1434} {"train_loss": -11.171355247497559, "global_step": 241027, "epoch": 1434} {"train_loss": -11.111501693725586, "global_step": 241028, "epoch": 1434} {"train_loss": -11.178874969482422, "global_step": 241029, "epoch": 1434} {"train_loss": -11.29263687133789, "global_step": 241030, "epoch": 1434} {"train_loss": -11.437440872192383, "global_step": 241031, "epoch": 1434} {"train_loss": -11.492795944213867, "global_step": 241032, "epoch": 1434} {"train_loss": -11.503552436828613, "global_step": 241033, "epoch": 1434} {"train_loss": -11.320135116577148, "global_step": 241034, "epoch": 1434} {"train_loss": -11.367815017700195, "global_step": 241035, "epoch": 1434} {"train_loss": -11.461075782775879, "global_step": 241036, "epoch": 1434} {"train_loss": -11.478494644165039, "global_step": 241037, "epoch": 1434} {"train_loss": -11.558221817016602, "global_step": 241038, "epoch": 1434} {"train_loss": -11.555475234985352, "global_step": 241039, "epoch": 1434} {"train_loss": -11.562820434570312, "global_step": 241040, "epoch": 1434} {"train_loss": -11.70669174194336, "global_step": 241041, "epoch": 1434} {"train_loss": -11.45643424987793, "global_step": 241042, "epoch": 1434} {"train_loss": -11.534446716308594, "global_step": 241043, "epoch": 1434} {"train_loss": -11.539427757263184, "global_step": 241044, "epoch": 1434} {"train_loss": -11.620994567871094, "global_step": 241045, "epoch": 1434} {"train_loss": -11.539215087890625, "global_step": 241046, "epoch": 1434} {"train_loss": -11.68676471710205, "global_step": 241047, "epoch": 1434} {"train_loss": -11.570659637451172, "global_step": 241048, "epoch": 1434} {"train_loss": -11.609806060791016, "global_step": 241049, "epoch": 1434} {"train_loss": -11.736953735351562, "global_step": 241050, "epoch": 1434} {"train_loss": -11.806816101074219, "global_step": 241051, "epoch": 1434} {"train_loss": -11.816450119018555, "global_step": 241052, "epoch": 1434} {"train_loss": -11.719079971313477, "global_step": 241053, "epoch": 1434} {"train_loss": -11.639486312866211, "global_step": 241054, "epoch": 1434} {"train_loss": -11.841911315917969, "global_step": 241055, "epoch": 1434} {"train_loss": -11.782466888427734, "global_step": 241056, "epoch": 1434} {"train_loss": -11.773441314697266, "global_step": 241057, "epoch": 1434} {"train_loss": -11.798309326171875, "global_step": 241058, "epoch": 1434} {"train_loss": -11.864265441894531, "global_step": 241059, "epoch": 1434} {"train_loss": -11.83385181427002, "global_step": 241060, "epoch": 1434} {"train_loss": -11.716716766357422, "global_step": 241061, "epoch": 1434} {"train_loss": -11.980685234069824, "global_step": 241062, "epoch": 1434} {"train_loss": -11.927328109741211, "global_step": 241063, "epoch": 1434} {"train_loss": -12.121857643127441, "global_step": 241064, "epoch": 1434} {"train_loss": -12.051763534545898, "global_step": 241065, "epoch": 1434} {"train_loss": -11.78530502319336, "global_step": 241066, "epoch": 1434} {"train_loss": -12.043088912963867, "global_step": 241067, "epoch": 1434} {"train_loss": -11.880510330200195, "global_step": 241068, "epoch": 1434} {"train_loss": -11.93532943725586, "global_step": 241069, "epoch": 1434} {"train_loss": -12.027667999267578, "global_step": 241070, "epoch": 1434} {"train_loss": -11.979976654052734, "global_step": 241071, "epoch": 1434} {"train_loss": -12.064213752746582, "global_step": 241072, "epoch": 1434} {"train_loss": -12.018003463745117, "global_step": 241073, "epoch": 1434} {"train_loss": -12.126514434814453, "global_step": 241074, "epoch": 1434} {"train_loss": -12.033266067504883, "global_step": 241075, "epoch": 1434} {"train_loss": -12.04218864440918, "global_step": 241076, "epoch": 1434} {"train_loss": -12.07914924621582, "global_step": 241077, "epoch": 1434} {"train_loss": -12.035821914672852, "global_step": 241078, "epoch": 1434} {"train_loss": -11.109976390997568, "global_step": 241079, "epoch": 1434, "val_loss": 265008.875} {"train_loss": -11.944056510925293, "global_step": 241080, "epoch": 1435} {"train_loss": -11.98143482208252, "global_step": 241081, "epoch": 1435} {"train_loss": -12.317220687866211, "global_step": 241082, "epoch": 1435} {"train_loss": -11.927335739135742, "global_step": 241083, "epoch": 1435} {"train_loss": -12.166133880615234, "global_step": 241084, "epoch": 1435} {"train_loss": -12.136598587036133, "global_step": 241085, "epoch": 1435} {"train_loss": -12.075864791870117, "global_step": 241086, "epoch": 1435} {"train_loss": -12.04417610168457, "global_step": 241087, "epoch": 1435} {"train_loss": -12.06436538696289, "global_step": 241088, "epoch": 1435} {"train_loss": -12.051738739013672, "global_step": 241089, "epoch": 1435} {"train_loss": -11.89971923828125, "global_step": 241090, "epoch": 1435} {"train_loss": -12.149099349975586, "global_step": 241091, "epoch": 1435} {"train_loss": -12.036697387695312, "global_step": 241092, "epoch": 1435} {"train_loss": -12.046914100646973, "global_step": 241093, "epoch": 1435} {"train_loss": -11.856561660766602, "global_step": 241094, "epoch": 1435} {"train_loss": -12.109613418579102, "global_step": 241095, "epoch": 1435} {"train_loss": -11.965838432312012, "global_step": 241096, "epoch": 1435} {"train_loss": -12.035743713378906, "global_step": 241097, "epoch": 1435} {"train_loss": -11.850244522094727, "global_step": 241098, "epoch": 1435} {"train_loss": -11.476531028747559, "global_step": 241099, "epoch": 1435} {"train_loss": -11.701484680175781, "global_step": 241100, "epoch": 1435} {"train_loss": -11.86839485168457, "global_step": 241101, "epoch": 1435} {"train_loss": -11.013751983642578, "global_step": 241102, "epoch": 1435} {"train_loss": -10.326607704162598, "global_step": 241103, "epoch": 1435} {"train_loss": -11.34378433227539, "global_step": 241104, "epoch": 1435} {"train_loss": -11.61191177368164, "global_step": 241105, "epoch": 1435} {"train_loss": -11.95679759979248, "global_step": 241106, "epoch": 1435} {"train_loss": -10.611095428466797, "global_step": 241107, "epoch": 1435} {"train_loss": -11.863500595092773, "global_step": 241108, "epoch": 1435} {"train_loss": -9.683834075927734, "global_step": 241109, "epoch": 1435} {"train_loss": -11.512310028076172, "global_step": 241110, "epoch": 1435} {"train_loss": -10.026034355163574, "global_step": 241111, "epoch": 1435} {"train_loss": -11.226241111755371, "global_step": 241112, "epoch": 1435} {"train_loss": -10.396063804626465, "global_step": 241113, "epoch": 1435} {"train_loss": -10.816313743591309, "global_step": 241114, "epoch": 1435} {"train_loss": -9.478429794311523, "global_step": 241115, "epoch": 1435} {"train_loss": -9.49969482421875, "global_step": 241116, "epoch": 1435} {"train_loss": -9.991358757019043, "global_step": 241117, "epoch": 1435} {"train_loss": -9.681854248046875, "global_step": 241118, "epoch": 1435} {"train_loss": -9.550016403198242, "global_step": 241119, "epoch": 1435} {"train_loss": -8.253423690795898, "global_step": 241120, "epoch": 1435} {"train_loss": -9.189334869384766, "global_step": 241121, "epoch": 1435} {"train_loss": -10.634228706359863, "global_step": 241122, "epoch": 1435} {"train_loss": -9.475362777709961, "global_step": 241123, "epoch": 1435} {"train_loss": -10.56615924835205, "global_step": 241124, "epoch": 1435} {"train_loss": -9.843589782714844, "global_step": 241125, "epoch": 1435} {"train_loss": -10.07377815246582, "global_step": 241126, "epoch": 1435} {"train_loss": -10.545831680297852, "global_step": 241127, "epoch": 1435} {"train_loss": -9.522168159484863, "global_step": 241128, "epoch": 1435} {"train_loss": -10.350900650024414, "global_step": 241129, "epoch": 1435} {"train_loss": -10.762996673583984, "global_step": 241130, "epoch": 1435} {"train_loss": -10.687108039855957, "global_step": 241131, "epoch": 1435} {"train_loss": -9.582155227661133, "global_step": 241132, "epoch": 1435} {"train_loss": -10.626569747924805, "global_step": 241133, "epoch": 1435} {"train_loss": -10.501060485839844, "global_step": 241134, "epoch": 1435} {"train_loss": -11.039200782775879, "global_step": 241135, "epoch": 1435} {"train_loss": -10.95277214050293, "global_step": 241136, "epoch": 1435} {"train_loss": -11.337060928344727, "global_step": 241137, "epoch": 1435} {"train_loss": -10.835342407226562, "global_step": 241138, "epoch": 1435} {"train_loss": -11.191849708557129, "global_step": 241139, "epoch": 1435} {"train_loss": -11.155624389648438, "global_step": 241140, "epoch": 1435} {"train_loss": -11.529908180236816, "global_step": 241141, "epoch": 1435} {"train_loss": -11.167708396911621, "global_step": 241142, "epoch": 1435} {"train_loss": -11.349929809570312, "global_step": 241143, "epoch": 1435} {"train_loss": -11.446911811828613, "global_step": 241144, "epoch": 1435} {"train_loss": -11.493664741516113, "global_step": 241145, "epoch": 1435} {"train_loss": -11.476539611816406, "global_step": 241146, "epoch": 1435} {"train_loss": -11.36020278930664, "global_step": 241147, "epoch": 1435} {"train_loss": -10.883052825927734, "global_step": 241148, "epoch": 1435} {"train_loss": -11.360908508300781, "global_step": 241149, "epoch": 1435} {"train_loss": -11.081313133239746, "global_step": 241150, "epoch": 1435} {"train_loss": -11.416227340698242, "global_step": 241151, "epoch": 1435} {"train_loss": -11.601579666137695, "global_step": 241152, "epoch": 1435} {"train_loss": -11.364459991455078, "global_step": 241153, "epoch": 1435} {"train_loss": -11.651844024658203, "global_step": 241154, "epoch": 1435} {"train_loss": -11.510830879211426, "global_step": 241155, "epoch": 1435} {"train_loss": -11.503202438354492, "global_step": 241156, "epoch": 1435} {"train_loss": -11.470555305480957, "global_step": 241157, "epoch": 1435} {"train_loss": -11.4590425491333, "global_step": 241158, "epoch": 1435} {"train_loss": -11.305631637573242, "global_step": 241159, "epoch": 1435} {"train_loss": -11.491945266723633, "global_step": 241160, "epoch": 1435} {"train_loss": -11.570207595825195, "global_step": 241161, "epoch": 1435} {"train_loss": -11.64015007019043, "global_step": 241162, "epoch": 1435} {"train_loss": -11.425291061401367, "global_step": 241163, "epoch": 1435} {"train_loss": -11.416905403137207, "global_step": 241164, "epoch": 1435} {"train_loss": -11.813455581665039, "global_step": 241165, "epoch": 1435} {"train_loss": -11.361112594604492, "global_step": 241166, "epoch": 1435} {"train_loss": -11.969564437866211, "global_step": 241167, "epoch": 1435} {"train_loss": -11.394845962524414, "global_step": 241168, "epoch": 1435} {"train_loss": -11.446826934814453, "global_step": 241169, "epoch": 1435} {"train_loss": -11.62005615234375, "global_step": 241170, "epoch": 1435} {"train_loss": -11.559356689453125, "global_step": 241171, "epoch": 1435} {"train_loss": -11.608942985534668, "global_step": 241172, "epoch": 1435} {"train_loss": -11.832220077514648, "global_step": 241173, "epoch": 1435} {"train_loss": -11.591766357421875, "global_step": 241174, "epoch": 1435} {"train_loss": -11.702583312988281, "global_step": 241175, "epoch": 1435} {"train_loss": -11.569757461547852, "global_step": 241176, "epoch": 1435} {"train_loss": -11.57791805267334, "global_step": 241177, "epoch": 1435} {"train_loss": -11.792013168334961, "global_step": 241178, "epoch": 1435} {"train_loss": -11.716459274291992, "global_step": 241179, "epoch": 1435} {"train_loss": -11.763589859008789, "global_step": 241180, "epoch": 1435} {"train_loss": -11.793768882751465, "global_step": 241181, "epoch": 1435} {"train_loss": -11.897562026977539, "global_step": 241182, "epoch": 1435} {"train_loss": -11.979827880859375, "global_step": 241183, "epoch": 1435} {"train_loss": -11.802177429199219, "global_step": 241184, "epoch": 1435} {"train_loss": -11.491901397705078, "global_step": 241185, "epoch": 1435} {"train_loss": -11.881657600402832, "global_step": 241186, "epoch": 1435} {"train_loss": -11.86570930480957, "global_step": 241187, "epoch": 1435} {"train_loss": -11.654720306396484, "global_step": 241188, "epoch": 1435} {"train_loss": -12.031786918640137, "global_step": 241189, "epoch": 1435} {"train_loss": -11.684194564819336, "global_step": 241190, "epoch": 1435} {"train_loss": -11.956137657165527, "global_step": 241191, "epoch": 1435} {"train_loss": -11.83476448059082, "global_step": 241192, "epoch": 1435} {"train_loss": -11.673480987548828, "global_step": 241193, "epoch": 1435} {"train_loss": -11.932380676269531, "global_step": 241194, "epoch": 1435} {"train_loss": -11.449968338012695, "global_step": 241195, "epoch": 1435} {"train_loss": -11.886868476867676, "global_step": 241196, "epoch": 1435} {"train_loss": -11.688193321228027, "global_step": 241197, "epoch": 1435} {"train_loss": -11.892618179321289, "global_step": 241198, "epoch": 1435} {"train_loss": -11.48211669921875, "global_step": 241199, "epoch": 1435} {"train_loss": -11.705461502075195, "global_step": 241200, "epoch": 1435} {"train_loss": -11.778534889221191, "global_step": 241201, "epoch": 1435} {"train_loss": -11.277113914489746, "global_step": 241202, "epoch": 1435} {"train_loss": -11.941950798034668, "global_step": 241203, "epoch": 1435} {"train_loss": -11.59365463256836, "global_step": 241204, "epoch": 1435} {"train_loss": -11.934104919433594, "global_step": 241205, "epoch": 1435} {"train_loss": -11.75663948059082, "global_step": 241206, "epoch": 1435} {"train_loss": -11.724319458007812, "global_step": 241207, "epoch": 1435} {"train_loss": -12.080554962158203, "global_step": 241208, "epoch": 1435} {"train_loss": -11.886512756347656, "global_step": 241209, "epoch": 1435} {"train_loss": -11.857091903686523, "global_step": 241210, "epoch": 1435} {"train_loss": -11.837759017944336, "global_step": 241211, "epoch": 1435} {"train_loss": -12.058257102966309, "global_step": 241212, "epoch": 1435} {"train_loss": -12.051309585571289, "global_step": 241213, "epoch": 1435} {"train_loss": -12.072986602783203, "global_step": 241214, "epoch": 1435} {"train_loss": -12.118072509765625, "global_step": 241215, "epoch": 1435} {"train_loss": -11.991565704345703, "global_step": 241216, "epoch": 1435} {"train_loss": -11.897550582885742, "global_step": 241217, "epoch": 1435} {"train_loss": -12.176088333129883, "global_step": 241218, "epoch": 1435} {"train_loss": -11.87331771850586, "global_step": 241219, "epoch": 1435} {"train_loss": -11.595911979675293, "global_step": 241220, "epoch": 1435} {"train_loss": -11.647406578063965, "global_step": 241221, "epoch": 1435} {"train_loss": -11.960002899169922, "global_step": 241222, "epoch": 1435} {"train_loss": -11.333015441894531, "global_step": 241223, "epoch": 1435} {"train_loss": -11.882081985473633, "global_step": 241224, "epoch": 1435} {"train_loss": -11.643702507019043, "global_step": 241225, "epoch": 1435} {"train_loss": -10.953132629394531, "global_step": 241226, "epoch": 1435} {"train_loss": -10.656225204467773, "global_step": 241227, "epoch": 1435} {"train_loss": -11.18614387512207, "global_step": 241228, "epoch": 1435} {"train_loss": -10.60226058959961, "global_step": 241229, "epoch": 1435} {"train_loss": -9.371208190917969, "global_step": 241230, "epoch": 1435} {"train_loss": -11.299964904785156, "global_step": 241231, "epoch": 1435} {"train_loss": -9.864418029785156, "global_step": 241232, "epoch": 1435} {"train_loss": -9.618160247802734, "global_step": 241233, "epoch": 1435} {"train_loss": -10.753969192504883, "global_step": 241234, "epoch": 1435} {"train_loss": -8.972007751464844, "global_step": 241235, "epoch": 1435} {"train_loss": -9.12234115600586, "global_step": 241236, "epoch": 1435} {"train_loss": -10.37427043914795, "global_step": 241237, "epoch": 1435} {"train_loss": -10.330437660217285, "global_step": 241238, "epoch": 1435} {"train_loss": -9.451261520385742, "global_step": 241239, "epoch": 1435} {"train_loss": -8.721389770507812, "global_step": 241240, "epoch": 1435} {"train_loss": -9.42237663269043, "global_step": 241241, "epoch": 1435} {"train_loss": -9.909589767456055, "global_step": 241242, "epoch": 1435} {"train_loss": -10.961776733398438, "global_step": 241243, "epoch": 1435} {"train_loss": -9.461238861083984, "global_step": 241244, "epoch": 1435} {"train_loss": -11.096994400024414, "global_step": 241245, "epoch": 1435} {"train_loss": -10.359208106994629, "global_step": 241246, "epoch": 1435} {"train_loss": -11.228947310220628, "global_step": 241247, "epoch": 1435, "val_loss": 262138.015625, "train_action_mse_error": 1.6720085144042969} {"train_loss": -11.042410850524902, "global_step": 241248, "epoch": 1436} {"train_loss": -9.983036041259766, "global_step": 241249, "epoch": 1436} {"train_loss": -11.0581693649292, "global_step": 241250, "epoch": 1436} {"train_loss": -10.580598831176758, "global_step": 241251, "epoch": 1436} {"train_loss": -9.925291061401367, "global_step": 241252, "epoch": 1436} {"train_loss": -11.309355735778809, "global_step": 241253, "epoch": 1436} {"train_loss": -9.85788345336914, "global_step": 241254, "epoch": 1436} {"train_loss": -11.303834915161133, "global_step": 241255, "epoch": 1436} {"train_loss": -11.073867797851562, "global_step": 241256, "epoch": 1436} {"train_loss": -11.233895301818848, "global_step": 241257, "epoch": 1436} {"train_loss": -11.363340377807617, "global_step": 241258, "epoch": 1436} {"train_loss": -11.100347518920898, "global_step": 241259, "epoch": 1436} {"train_loss": -11.05354118347168, "global_step": 241260, "epoch": 1436} {"train_loss": -11.54557991027832, "global_step": 241261, "epoch": 1436} {"train_loss": -10.796317100524902, "global_step": 241262, "epoch": 1436} {"train_loss": -11.595382690429688, "global_step": 241263, "epoch": 1436} {"train_loss": -11.384061813354492, "global_step": 241264, "epoch": 1436} {"train_loss": -11.525567054748535, "global_step": 241265, "epoch": 1436} {"train_loss": -11.59245491027832, "global_step": 241266, "epoch": 1436} {"train_loss": -11.477529525756836, "global_step": 241267, "epoch": 1436} {"train_loss": -11.347597122192383, "global_step": 241268, "epoch": 1436} {"train_loss": -11.37639331817627, "global_step": 241269, "epoch": 1436} {"train_loss": -11.370437622070312, "global_step": 241270, "epoch": 1436} {"train_loss": -11.765262603759766, "global_step": 241271, "epoch": 1436} {"train_loss": -11.557096481323242, "global_step": 241272, "epoch": 1436} {"train_loss": -11.637849807739258, "global_step": 241273, "epoch": 1436} {"train_loss": -11.675140380859375, "global_step": 241274, "epoch": 1436} {"train_loss": -11.65149974822998, "global_step": 241275, "epoch": 1436} {"train_loss": -11.783693313598633, "global_step": 241276, "epoch": 1436} {"train_loss": -11.884058952331543, "global_step": 241277, "epoch": 1436} {"train_loss": -11.88151741027832, "global_step": 241278, "epoch": 1436} {"train_loss": -11.808744430541992, "global_step": 241279, "epoch": 1436} {"train_loss": -11.778071403503418, "global_step": 241280, "epoch": 1436} {"train_loss": -11.692604064941406, "global_step": 241281, "epoch": 1436} {"train_loss": -11.875874519348145, "global_step": 241282, "epoch": 1436} {"train_loss": -11.638833999633789, "global_step": 241283, "epoch": 1436} {"train_loss": -11.759522438049316, "global_step": 241284, "epoch": 1436} {"train_loss": -11.513425827026367, "global_step": 241285, "epoch": 1436} {"train_loss": -11.840971946716309, "global_step": 241286, "epoch": 1436} {"train_loss": -11.57722282409668, "global_step": 241287, "epoch": 1436} {"train_loss": -11.97445297241211, "global_step": 241288, "epoch": 1436} {"train_loss": -11.922918319702148, "global_step": 241289, "epoch": 1436} {"train_loss": -11.993566513061523, "global_step": 241290, "epoch": 1436} {"train_loss": -11.930413246154785, "global_step": 241291, "epoch": 1436} {"train_loss": -11.941267013549805, "global_step": 241292, "epoch": 1436} {"train_loss": -11.764461517333984, "global_step": 241293, "epoch": 1436} {"train_loss": -11.978151321411133, "global_step": 241294, "epoch": 1436} {"train_loss": -11.98349666595459, "global_step": 241295, "epoch": 1436} {"train_loss": -12.041421890258789, "global_step": 241296, "epoch": 1436} {"train_loss": -12.027321815490723, "global_step": 241297, "epoch": 1436} {"train_loss": -12.03976058959961, "global_step": 241298, "epoch": 1436} {"train_loss": -11.993942260742188, "global_step": 241299, "epoch": 1436} {"train_loss": -11.950814247131348, "global_step": 241300, "epoch": 1436} {"train_loss": -11.837373733520508, "global_step": 241301, "epoch": 1436} {"train_loss": -11.656269073486328, "global_step": 241302, "epoch": 1436} {"train_loss": -11.978489875793457, "global_step": 241303, "epoch": 1436} {"train_loss": -11.828975677490234, "global_step": 241304, "epoch": 1436} {"train_loss": -11.638481140136719, "global_step": 241305, "epoch": 1436} {"train_loss": -11.830916404724121, "global_step": 241306, "epoch": 1436} {"train_loss": -11.936210632324219, "global_step": 241307, "epoch": 1436} {"train_loss": -12.033145904541016, "global_step": 241308, "epoch": 1436} {"train_loss": -11.92044448852539, "global_step": 241309, "epoch": 1436} {"train_loss": -11.872925758361816, "global_step": 241310, "epoch": 1436} {"train_loss": -11.897912979125977, "global_step": 241311, "epoch": 1436} {"train_loss": -12.080926895141602, "global_step": 241312, "epoch": 1436} {"train_loss": -11.757790565490723, "global_step": 241313, "epoch": 1436} {"train_loss": -12.226856231689453, "global_step": 241314, "epoch": 1436} {"train_loss": -12.04208755493164, "global_step": 241315, "epoch": 1436} {"train_loss": -11.980277061462402, "global_step": 241316, "epoch": 1436} {"train_loss": -11.984895706176758, "global_step": 241317, "epoch": 1436} {"train_loss": -12.00299072265625, "global_step": 241318, "epoch": 1436} {"train_loss": -12.076913833618164, "global_step": 241319, "epoch": 1436} {"train_loss": -11.929722785949707, "global_step": 241320, "epoch": 1436} {"train_loss": -12.020851135253906, "global_step": 241321, "epoch": 1436} {"train_loss": -11.775875091552734, "global_step": 241322, "epoch": 1436} {"train_loss": -11.820087432861328, "global_step": 241323, "epoch": 1436} {"train_loss": -11.913554191589355, "global_step": 241324, "epoch": 1436} {"train_loss": -11.959871292114258, "global_step": 241325, "epoch": 1436} {"train_loss": -12.123083114624023, "global_step": 241326, "epoch": 1436} {"train_loss": -11.87222671508789, "global_step": 241327, "epoch": 1436} {"train_loss": -11.806352615356445, "global_step": 241328, "epoch": 1436} {"train_loss": -11.658414840698242, "global_step": 241329, "epoch": 1436} {"train_loss": -11.666071891784668, "global_step": 241330, "epoch": 1436} {"train_loss": -11.770949363708496, "global_step": 241331, "epoch": 1436} {"train_loss": -11.820856094360352, "global_step": 241332, "epoch": 1436} {"train_loss": -11.871953964233398, "global_step": 241333, "epoch": 1436} {"train_loss": -11.166923522949219, "global_step": 241334, "epoch": 1436} {"train_loss": -11.622398376464844, "global_step": 241335, "epoch": 1436} {"train_loss": -11.846663475036621, "global_step": 241336, "epoch": 1436} {"train_loss": -12.09560775756836, "global_step": 241337, "epoch": 1436} {"train_loss": -11.613473892211914, "global_step": 241338, "epoch": 1436} {"train_loss": -11.616053581237793, "global_step": 241339, "epoch": 1436} {"train_loss": -11.668455123901367, "global_step": 241340, "epoch": 1436} {"train_loss": -12.471168518066406, "global_step": 241341, "epoch": 1436} {"train_loss": -11.444060325622559, "global_step": 241342, "epoch": 1436} {"train_loss": -11.618363380432129, "global_step": 241343, "epoch": 1436} {"train_loss": -11.39236831665039, "global_step": 241344, "epoch": 1436} {"train_loss": -11.469133377075195, "global_step": 241345, "epoch": 1436} {"train_loss": -12.024012565612793, "global_step": 241346, "epoch": 1436} {"train_loss": -11.8990478515625, "global_step": 241347, "epoch": 1436} {"train_loss": -11.794994354248047, "global_step": 241348, "epoch": 1436} {"train_loss": -11.922296524047852, "global_step": 241349, "epoch": 1436} {"train_loss": -11.886724472045898, "global_step": 241350, "epoch": 1436} {"train_loss": -11.124974250793457, "global_step": 241351, "epoch": 1436} {"train_loss": -11.902441024780273, "global_step": 241352, "epoch": 1436} {"train_loss": -12.074254989624023, "global_step": 241353, "epoch": 1436} {"train_loss": -11.84019660949707, "global_step": 241354, "epoch": 1436} {"train_loss": -11.924549102783203, "global_step": 241355, "epoch": 1436} {"train_loss": -11.98948860168457, "global_step": 241356, "epoch": 1436} {"train_loss": -12.006009101867676, "global_step": 241357, "epoch": 1436} {"train_loss": -11.812885284423828, "global_step": 241358, "epoch": 1436} {"train_loss": -11.94262981414795, "global_step": 241359, "epoch": 1436} {"train_loss": -11.911836624145508, "global_step": 241360, "epoch": 1436} {"train_loss": -12.125249862670898, "global_step": 241361, "epoch": 1436} {"train_loss": -11.978093147277832, "global_step": 241362, "epoch": 1436} {"train_loss": -12.050759315490723, "global_step": 241363, "epoch": 1436} {"train_loss": -11.896256446838379, "global_step": 241364, "epoch": 1436} {"train_loss": -12.07406234741211, "global_step": 241365, "epoch": 1436} {"train_loss": -11.572334289550781, "global_step": 241366, "epoch": 1436} {"train_loss": -12.193267822265625, "global_step": 241367, "epoch": 1436} {"train_loss": -11.527510643005371, "global_step": 241368, "epoch": 1436} {"train_loss": -11.677663803100586, "global_step": 241369, "epoch": 1436} {"train_loss": -11.818838119506836, "global_step": 241370, "epoch": 1436} {"train_loss": -11.828055381774902, "global_step": 241371, "epoch": 1436} {"train_loss": -12.196022987365723, "global_step": 241372, "epoch": 1436} {"train_loss": -11.62403678894043, "global_step": 241373, "epoch": 1436} {"train_loss": -11.91038990020752, "global_step": 241374, "epoch": 1436} {"train_loss": -11.985865592956543, "global_step": 241375, "epoch": 1436} {"train_loss": -12.031009674072266, "global_step": 241376, "epoch": 1436} {"train_loss": -11.874149322509766, "global_step": 241377, "epoch": 1436} {"train_loss": -11.906012535095215, "global_step": 241378, "epoch": 1436} {"train_loss": -11.957390785217285, "global_step": 241379, "epoch": 1436} {"train_loss": -11.987390518188477, "global_step": 241380, "epoch": 1436} {"train_loss": -11.85546875, "global_step": 241381, "epoch": 1436} {"train_loss": -11.319451332092285, "global_step": 241382, "epoch": 1436} {"train_loss": -11.746931076049805, "global_step": 241383, "epoch": 1436} {"train_loss": -11.352788925170898, "global_step": 241384, "epoch": 1436} {"train_loss": -11.37495231628418, "global_step": 241385, "epoch": 1436} {"train_loss": -11.960826873779297, "global_step": 241386, "epoch": 1436} {"train_loss": -10.846183776855469, "global_step": 241387, "epoch": 1436} {"train_loss": -11.761674880981445, "global_step": 241388, "epoch": 1436} {"train_loss": -10.166804313659668, "global_step": 241389, "epoch": 1436} {"train_loss": -11.967691421508789, "global_step": 241390, "epoch": 1436} {"train_loss": -11.04317855834961, "global_step": 241391, "epoch": 1436} {"train_loss": -11.272384643554688, "global_step": 241392, "epoch": 1436} {"train_loss": -10.359679222106934, "global_step": 241393, "epoch": 1436} {"train_loss": -10.801915168762207, "global_step": 241394, "epoch": 1436} {"train_loss": -11.393205642700195, "global_step": 241395, "epoch": 1436} {"train_loss": -9.603311538696289, "global_step": 241396, "epoch": 1436} {"train_loss": -10.746100425720215, "global_step": 241397, "epoch": 1436} {"train_loss": -10.349946975708008, "global_step": 241398, "epoch": 1436} {"train_loss": -9.526185989379883, "global_step": 241399, "epoch": 1436} {"train_loss": -11.392561912536621, "global_step": 241400, "epoch": 1436} {"train_loss": -9.465896606445312, "global_step": 241401, "epoch": 1436} {"train_loss": -11.072805404663086, "global_step": 241402, "epoch": 1436} {"train_loss": -10.300782203674316, "global_step": 241403, "epoch": 1436} {"train_loss": -10.630727767944336, "global_step": 241404, "epoch": 1436} {"train_loss": -10.614052772521973, "global_step": 241405, "epoch": 1436} {"train_loss": -9.713674545288086, "global_step": 241406, "epoch": 1436} {"train_loss": -11.226638793945312, "global_step": 241407, "epoch": 1436} {"train_loss": -9.81157112121582, "global_step": 241408, "epoch": 1436} {"train_loss": -11.06930923461914, "global_step": 241409, "epoch": 1436} {"train_loss": -10.111772537231445, "global_step": 241410, "epoch": 1436} {"train_loss": -10.94312572479248, "global_step": 241411, "epoch": 1436} {"train_loss": -10.418760299682617, "global_step": 241412, "epoch": 1436} {"train_loss": -10.192910194396973, "global_step": 241413, "epoch": 1436} {"train_loss": -10.700593948364258, "global_step": 241414, "epoch": 1436} {"train_loss": -11.52355988820394, "global_step": 241415, "epoch": 1436, "val_loss": 261592.859375} {"train_loss": -10.54810905456543, "global_step": 241416, "epoch": 1437} {"train_loss": -10.354330062866211, "global_step": 241417, "epoch": 1437} {"train_loss": -11.229392051696777, "global_step": 241418, "epoch": 1437} {"train_loss": -10.63290023803711, "global_step": 241419, "epoch": 1437} {"train_loss": -11.029062271118164, "global_step": 241420, "epoch": 1437} {"train_loss": -10.777016639709473, "global_step": 241421, "epoch": 1437} {"train_loss": -10.755844116210938, "global_step": 241422, "epoch": 1437} {"train_loss": -11.057343482971191, "global_step": 241423, "epoch": 1437} {"train_loss": -10.630073547363281, "global_step": 241424, "epoch": 1437} {"train_loss": -11.158414840698242, "global_step": 241425, "epoch": 1437} {"train_loss": -10.712060928344727, "global_step": 241426, "epoch": 1437} {"train_loss": -10.794468879699707, "global_step": 241427, "epoch": 1437} {"train_loss": -10.84410572052002, "global_step": 241428, "epoch": 1437} {"train_loss": -10.962397575378418, "global_step": 241429, "epoch": 1437} {"train_loss": -10.752355575561523, "global_step": 241430, "epoch": 1437} {"train_loss": -10.941118240356445, "global_step": 241431, "epoch": 1437} {"train_loss": -11.073676109313965, "global_step": 241432, "epoch": 1437} {"train_loss": -10.950395584106445, "global_step": 241433, "epoch": 1437} {"train_loss": -11.37942886352539, "global_step": 241434, "epoch": 1437} {"train_loss": -11.180339813232422, "global_step": 241435, "epoch": 1437} {"train_loss": -11.418611526489258, "global_step": 241436, "epoch": 1437} {"train_loss": -11.352860450744629, "global_step": 241437, "epoch": 1437} {"train_loss": -11.611298561096191, "global_step": 241438, "epoch": 1437} {"train_loss": -11.537253379821777, "global_step": 241439, "epoch": 1437} {"train_loss": -11.337747573852539, "global_step": 241440, "epoch": 1437} {"train_loss": -11.51231575012207, "global_step": 241441, "epoch": 1437} {"train_loss": -11.599149703979492, "global_step": 241442, "epoch": 1437} {"train_loss": -11.266298294067383, "global_step": 241443, "epoch": 1437} {"train_loss": -11.508979797363281, "global_step": 241444, "epoch": 1437} {"train_loss": -11.516027450561523, "global_step": 241445, "epoch": 1437} {"train_loss": -11.646432876586914, "global_step": 241446, "epoch": 1437} {"train_loss": -11.631587982177734, "global_step": 241447, "epoch": 1437} {"train_loss": -11.584833145141602, "global_step": 241448, "epoch": 1437} {"train_loss": -11.382682800292969, "global_step": 241449, "epoch": 1437} {"train_loss": -11.61141586303711, "global_step": 241450, "epoch": 1437} {"train_loss": -11.577187538146973, "global_step": 241451, "epoch": 1437} {"train_loss": -11.359031677246094, "global_step": 241452, "epoch": 1437} {"train_loss": -11.863887786865234, "global_step": 241453, "epoch": 1437} {"train_loss": -11.708393096923828, "global_step": 241454, "epoch": 1437} {"train_loss": -11.678203582763672, "global_step": 241455, "epoch": 1437} {"train_loss": -11.760376930236816, "global_step": 241456, "epoch": 1437} {"train_loss": -11.732616424560547, "global_step": 241457, "epoch": 1437} {"train_loss": -11.525273323059082, "global_step": 241458, "epoch": 1437} {"train_loss": -11.834643363952637, "global_step": 241459, "epoch": 1437} {"train_loss": -11.6134614944458, "global_step": 241460, "epoch": 1437} {"train_loss": -11.843079566955566, "global_step": 241461, "epoch": 1437} {"train_loss": -11.566577911376953, "global_step": 241462, "epoch": 1437} {"train_loss": -11.649438858032227, "global_step": 241463, "epoch": 1437} {"train_loss": -11.635436058044434, "global_step": 241464, "epoch": 1437} {"train_loss": -11.56160831451416, "global_step": 241465, "epoch": 1437} {"train_loss": -11.418069839477539, "global_step": 241466, "epoch": 1437} {"train_loss": -11.975369453430176, "global_step": 241467, "epoch": 1437} {"train_loss": -11.61434555053711, "global_step": 241468, "epoch": 1437} {"train_loss": -11.418556213378906, "global_step": 241469, "epoch": 1437} {"train_loss": -11.814847946166992, "global_step": 241470, "epoch": 1437} {"train_loss": -11.436864852905273, "global_step": 241471, "epoch": 1437} {"train_loss": -11.99330997467041, "global_step": 241472, "epoch": 1437} {"train_loss": -11.668153762817383, "global_step": 241473, "epoch": 1437} {"train_loss": -11.802383422851562, "global_step": 241474, "epoch": 1437} {"train_loss": -11.824190139770508, "global_step": 241475, "epoch": 1437} {"train_loss": -11.859709739685059, "global_step": 241476, "epoch": 1437} {"train_loss": -11.709589958190918, "global_step": 241477, "epoch": 1437} {"train_loss": -11.722253799438477, "global_step": 241478, "epoch": 1437} {"train_loss": -11.928516387939453, "global_step": 241479, "epoch": 1437} {"train_loss": -11.859383583068848, "global_step": 241480, "epoch": 1437} {"train_loss": -11.911602020263672, "global_step": 241481, "epoch": 1437} {"train_loss": -11.714338302612305, "global_step": 241482, "epoch": 1437} {"train_loss": -11.925071716308594, "global_step": 241483, "epoch": 1437} {"train_loss": -12.06246566772461, "global_step": 241484, "epoch": 1437} {"train_loss": -12.18425178527832, "global_step": 241485, "epoch": 1437} {"train_loss": -11.970375061035156, "global_step": 241486, "epoch": 1437} {"train_loss": -12.149730682373047, "global_step": 241487, "epoch": 1437} {"train_loss": -11.865570068359375, "global_step": 241488, "epoch": 1437} {"train_loss": -12.190078735351562, "global_step": 241489, "epoch": 1437} {"train_loss": -12.10698413848877, "global_step": 241490, "epoch": 1437} {"train_loss": -12.079681396484375, "global_step": 241491, "epoch": 1437} {"train_loss": -11.972261428833008, "global_step": 241492, "epoch": 1437} {"train_loss": -12.112871170043945, "global_step": 241493, "epoch": 1437} {"train_loss": -12.057838439941406, "global_step": 241494, "epoch": 1437} {"train_loss": -12.038740158081055, "global_step": 241495, "epoch": 1437} {"train_loss": -11.983444213867188, "global_step": 241496, "epoch": 1437} {"train_loss": -11.852110862731934, "global_step": 241497, "epoch": 1437} {"train_loss": -11.840291976928711, "global_step": 241498, "epoch": 1437} {"train_loss": -11.95019817352295, "global_step": 241499, "epoch": 1437} {"train_loss": -12.10433292388916, "global_step": 241500, "epoch": 1437} {"train_loss": -11.675755500793457, "global_step": 241501, "epoch": 1437} {"train_loss": -11.708610534667969, "global_step": 241502, "epoch": 1437} {"train_loss": -11.865510940551758, "global_step": 241503, "epoch": 1437} {"train_loss": -11.88015365600586, "global_step": 241504, "epoch": 1437} {"train_loss": -11.425701141357422, "global_step": 241505, "epoch": 1437} {"train_loss": -11.827657699584961, "global_step": 241506, "epoch": 1437} {"train_loss": -11.73465347290039, "global_step": 241507, "epoch": 1437} {"train_loss": -11.880777359008789, "global_step": 241508, "epoch": 1437} {"train_loss": -11.821298599243164, "global_step": 241509, "epoch": 1437} {"train_loss": -12.20073127746582, "global_step": 241510, "epoch": 1437} {"train_loss": -11.760210037231445, "global_step": 241511, "epoch": 1437} {"train_loss": -12.019041061401367, "global_step": 241512, "epoch": 1437} {"train_loss": -12.019976615905762, "global_step": 241513, "epoch": 1437} {"train_loss": -12.053070068359375, "global_step": 241514, "epoch": 1437} {"train_loss": -11.58915901184082, "global_step": 241515, "epoch": 1437} {"train_loss": -11.237213134765625, "global_step": 241516, "epoch": 1437} {"train_loss": -10.825128555297852, "global_step": 241517, "epoch": 1437} {"train_loss": -11.878419876098633, "global_step": 241518, "epoch": 1437} {"train_loss": -11.547908782958984, "global_step": 241519, "epoch": 1437} {"train_loss": -11.382911682128906, "global_step": 241520, "epoch": 1437} {"train_loss": -12.107494354248047, "global_step": 241521, "epoch": 1437} {"train_loss": -11.58248519897461, "global_step": 241522, "epoch": 1437} {"train_loss": -10.72918701171875, "global_step": 241523, "epoch": 1437} {"train_loss": -11.590012550354004, "global_step": 241524, "epoch": 1437} {"train_loss": -11.293909072875977, "global_step": 241525, "epoch": 1437} {"train_loss": -10.6326322555542, "global_step": 241526, "epoch": 1437} {"train_loss": -11.854643821716309, "global_step": 241527, "epoch": 1437} {"train_loss": -10.862457275390625, "global_step": 241528, "epoch": 1437} {"train_loss": -11.060403823852539, "global_step": 241529, "epoch": 1437} {"train_loss": -11.14388370513916, "global_step": 241530, "epoch": 1437} {"train_loss": -10.707468032836914, "global_step": 241531, "epoch": 1437} {"train_loss": -11.079137802124023, "global_step": 241532, "epoch": 1437} {"train_loss": -11.344539642333984, "global_step": 241533, "epoch": 1437} {"train_loss": -11.432962417602539, "global_step": 241534, "epoch": 1437} {"train_loss": -11.612319946289062, "global_step": 241535, "epoch": 1437} {"train_loss": -11.471627235412598, "global_step": 241536, "epoch": 1437} {"train_loss": -11.299308776855469, "global_step": 241537, "epoch": 1437} {"train_loss": -11.414730072021484, "global_step": 241538, "epoch": 1437} {"train_loss": -11.648390769958496, "global_step": 241539, "epoch": 1437} {"train_loss": -12.033000946044922, "global_step": 241540, "epoch": 1437} {"train_loss": -11.747997283935547, "global_step": 241541, "epoch": 1437} {"train_loss": -12.068378448486328, "global_step": 241542, "epoch": 1437} {"train_loss": -11.79720687866211, "global_step": 241543, "epoch": 1437} {"train_loss": -11.89821720123291, "global_step": 241544, "epoch": 1437} {"train_loss": -11.871426582336426, "global_step": 241545, "epoch": 1437} {"train_loss": -11.889307022094727, "global_step": 241546, "epoch": 1437} {"train_loss": -11.852997779846191, "global_step": 241547, "epoch": 1437} {"train_loss": -11.841001510620117, "global_step": 241548, "epoch": 1437} {"train_loss": -11.480875968933105, "global_step": 241549, "epoch": 1437} {"train_loss": -11.690847396850586, "global_step": 241550, "epoch": 1437} {"train_loss": -11.862293243408203, "global_step": 241551, "epoch": 1437} {"train_loss": -11.619421005249023, "global_step": 241552, "epoch": 1437} {"train_loss": -11.5756254196167, "global_step": 241553, "epoch": 1437} {"train_loss": -11.274065971374512, "global_step": 241554, "epoch": 1437} {"train_loss": -11.855522155761719, "global_step": 241555, "epoch": 1437} {"train_loss": -11.447243690490723, "global_step": 241556, "epoch": 1437} {"train_loss": -11.449819564819336, "global_step": 241557, "epoch": 1437} {"train_loss": -11.692691802978516, "global_step": 241558, "epoch": 1437} {"train_loss": -11.329593658447266, "global_step": 241559, "epoch": 1437} {"train_loss": -11.686851501464844, "global_step": 241560, "epoch": 1437} {"train_loss": -11.74873161315918, "global_step": 241561, "epoch": 1437} {"train_loss": -11.672340393066406, "global_step": 241562, "epoch": 1437} {"train_loss": -11.518675804138184, "global_step": 241563, "epoch": 1437} {"train_loss": -11.729792594909668, "global_step": 241564, "epoch": 1437} {"train_loss": -11.838857650756836, "global_step": 241565, "epoch": 1437} {"train_loss": -11.335034370422363, "global_step": 241566, "epoch": 1437} {"train_loss": -11.311300277709961, "global_step": 241567, "epoch": 1437} {"train_loss": -11.578025817871094, "global_step": 241568, "epoch": 1437} {"train_loss": -10.93604850769043, "global_step": 241569, "epoch": 1437} {"train_loss": -11.829666137695312, "global_step": 241570, "epoch": 1437} {"train_loss": -10.96720027923584, "global_step": 241571, "epoch": 1437} {"train_loss": -11.342729568481445, "global_step": 241572, "epoch": 1437} {"train_loss": -11.236350059509277, "global_step": 241573, "epoch": 1437} {"train_loss": -12.047155380249023, "global_step": 241574, "epoch": 1437} {"train_loss": -11.596034049987793, "global_step": 241575, "epoch": 1437} {"train_loss": -11.64726448059082, "global_step": 241576, "epoch": 1437} {"train_loss": -11.479516983032227, "global_step": 241577, "epoch": 1437} {"train_loss": -11.427603721618652, "global_step": 241578, "epoch": 1437} {"train_loss": -11.697587966918945, "global_step": 241579, "epoch": 1437} {"train_loss": -11.302310943603516, "global_step": 241580, "epoch": 1437} {"train_loss": -11.686931610107422, "global_step": 241581, "epoch": 1437} {"train_loss": -11.705755233764648, "global_step": 241582, "epoch": 1437} {"train_loss": -11.555908038502647, "global_step": 241583, "epoch": 1437, "val_loss": 264528.65625} {"train_loss": -11.38351058959961, "global_step": 241584, "epoch": 1438} {"train_loss": -10.339937210083008, "global_step": 241585, "epoch": 1438} {"train_loss": -10.444086074829102, "global_step": 241586, "epoch": 1438} {"train_loss": -11.600672721862793, "global_step": 241587, "epoch": 1438} {"train_loss": -11.152989387512207, "global_step": 241588, "epoch": 1438} {"train_loss": -11.712469100952148, "global_step": 241589, "epoch": 1438} {"train_loss": -11.11551570892334, "global_step": 241590, "epoch": 1438} {"train_loss": -11.826437950134277, "global_step": 241591, "epoch": 1438} {"train_loss": -11.512727737426758, "global_step": 241592, "epoch": 1438} {"train_loss": -11.900313377380371, "global_step": 241593, "epoch": 1438} {"train_loss": -11.44890308380127, "global_step": 241594, "epoch": 1438} {"train_loss": -11.821329116821289, "global_step": 241595, "epoch": 1438} {"train_loss": -11.421873092651367, "global_step": 241596, "epoch": 1438} {"train_loss": -11.683460235595703, "global_step": 241597, "epoch": 1438} {"train_loss": -11.511999130249023, "global_step": 241598, "epoch": 1438} {"train_loss": -11.96712875366211, "global_step": 241599, "epoch": 1438} {"train_loss": -11.425801277160645, "global_step": 241600, "epoch": 1438} {"train_loss": -11.579318046569824, "global_step": 241601, "epoch": 1438} {"train_loss": -11.878055572509766, "global_step": 241602, "epoch": 1438} {"train_loss": -11.46888256072998, "global_step": 241603, "epoch": 1438} {"train_loss": -11.747352600097656, "global_step": 241604, "epoch": 1438} {"train_loss": -11.498076438903809, "global_step": 241605, "epoch": 1438} {"train_loss": -11.639263153076172, "global_step": 241606, "epoch": 1438} {"train_loss": -11.65695571899414, "global_step": 241607, "epoch": 1438} {"train_loss": -11.40822696685791, "global_step": 241608, "epoch": 1438} {"train_loss": -11.845748901367188, "global_step": 241609, "epoch": 1438} {"train_loss": -11.275838851928711, "global_step": 241610, "epoch": 1438} {"train_loss": -11.378093719482422, "global_step": 241611, "epoch": 1438} {"train_loss": -11.35358715057373, "global_step": 241612, "epoch": 1438} {"train_loss": -11.470741271972656, "global_step": 241613, "epoch": 1438} {"train_loss": -11.482277870178223, "global_step": 241614, "epoch": 1438} {"train_loss": -11.689701080322266, "global_step": 241615, "epoch": 1438} {"train_loss": -11.561107635498047, "global_step": 241616, "epoch": 1438} {"train_loss": -11.617663383483887, "global_step": 241617, "epoch": 1438} {"train_loss": -11.576845169067383, "global_step": 241618, "epoch": 1438} {"train_loss": -11.342798233032227, "global_step": 241619, "epoch": 1438} {"train_loss": -11.251956939697266, "global_step": 241620, "epoch": 1438} {"train_loss": -11.349143028259277, "global_step": 241621, "epoch": 1438} {"train_loss": -11.46896743774414, "global_step": 241622, "epoch": 1438} {"train_loss": -11.55172348022461, "global_step": 241623, "epoch": 1438} {"train_loss": -11.533198356628418, "global_step": 241624, "epoch": 1438} {"train_loss": -11.594032287597656, "global_step": 241625, "epoch": 1438} {"train_loss": -11.307979583740234, "global_step": 241626, "epoch": 1438} {"train_loss": -11.690507888793945, "global_step": 241627, "epoch": 1438} {"train_loss": -10.669986724853516, "global_step": 241628, "epoch": 1438} {"train_loss": -11.854955673217773, "global_step": 241629, "epoch": 1438} {"train_loss": -10.789743423461914, "global_step": 241630, "epoch": 1438} {"train_loss": -11.063469886779785, "global_step": 241631, "epoch": 1438} {"train_loss": -11.303596496582031, "global_step": 241632, "epoch": 1438} {"train_loss": -10.308401107788086, "global_step": 241633, "epoch": 1438} {"train_loss": -11.806936264038086, "global_step": 241634, "epoch": 1438} {"train_loss": -10.21115779876709, "global_step": 241635, "epoch": 1438} {"train_loss": -11.656319618225098, "global_step": 241636, "epoch": 1438} {"train_loss": -11.074953079223633, "global_step": 241637, "epoch": 1438} {"train_loss": -11.635575294494629, "global_step": 241638, "epoch": 1438} {"train_loss": -10.999483108520508, "global_step": 241639, "epoch": 1438} {"train_loss": -10.69759464263916, "global_step": 241640, "epoch": 1438} {"train_loss": -11.600733757019043, "global_step": 241641, "epoch": 1438} {"train_loss": -10.377857208251953, "global_step": 241642, "epoch": 1438} {"train_loss": -11.206775665283203, "global_step": 241643, "epoch": 1438} {"train_loss": -11.207300186157227, "global_step": 241644, "epoch": 1438} {"train_loss": -11.073431015014648, "global_step": 241645, "epoch": 1438} {"train_loss": -10.771382331848145, "global_step": 241646, "epoch": 1438} {"train_loss": -10.5317964553833, "global_step": 241647, "epoch": 1438} {"train_loss": -11.45796012878418, "global_step": 241648, "epoch": 1438} {"train_loss": -10.72763442993164, "global_step": 241649, "epoch": 1438} {"train_loss": -11.565500259399414, "global_step": 241650, "epoch": 1438} {"train_loss": -11.078147888183594, "global_step": 241651, "epoch": 1438} {"train_loss": -11.524030685424805, "global_step": 241652, "epoch": 1438} {"train_loss": -11.330896377563477, "global_step": 241653, "epoch": 1438} {"train_loss": -11.230936050415039, "global_step": 241654, "epoch": 1438} {"train_loss": -11.247074127197266, "global_step": 241655, "epoch": 1438} {"train_loss": -11.273529052734375, "global_step": 241656, "epoch": 1438} {"train_loss": -11.208290100097656, "global_step": 241657, "epoch": 1438} {"train_loss": -11.267942428588867, "global_step": 241658, "epoch": 1438} {"train_loss": -11.522928237915039, "global_step": 241659, "epoch": 1438} {"train_loss": -11.117541313171387, "global_step": 241660, "epoch": 1438} {"train_loss": -11.714574813842773, "global_step": 241661, "epoch": 1438} {"train_loss": -11.294485092163086, "global_step": 241662, "epoch": 1438} {"train_loss": -11.480619430541992, "global_step": 241663, "epoch": 1438} {"train_loss": -10.963214874267578, "global_step": 241664, "epoch": 1438} {"train_loss": -11.710189819335938, "global_step": 241665, "epoch": 1438} {"train_loss": -10.784826278686523, "global_step": 241666, "epoch": 1438} {"train_loss": -11.795217514038086, "global_step": 241667, "epoch": 1438} {"train_loss": -11.14168643951416, "global_step": 241668, "epoch": 1438} {"train_loss": -11.862104415893555, "global_step": 241669, "epoch": 1438} {"train_loss": -11.344171524047852, "global_step": 241670, "epoch": 1438} {"train_loss": -11.621875762939453, "global_step": 241671, "epoch": 1438} {"train_loss": -11.40390396118164, "global_step": 241672, "epoch": 1438} {"train_loss": -11.292034149169922, "global_step": 241673, "epoch": 1438} {"train_loss": -11.475862503051758, "global_step": 241674, "epoch": 1438} {"train_loss": -11.640823364257812, "global_step": 241675, "epoch": 1438} {"train_loss": -11.691184997558594, "global_step": 241676, "epoch": 1438} {"train_loss": -11.372749328613281, "global_step": 241677, "epoch": 1438} {"train_loss": -11.767879486083984, "global_step": 241678, "epoch": 1438} {"train_loss": -11.574944496154785, "global_step": 241679, "epoch": 1438} {"train_loss": -11.801424026489258, "global_step": 241680, "epoch": 1438} {"train_loss": -11.700149536132812, "global_step": 241681, "epoch": 1438} {"train_loss": -11.61372184753418, "global_step": 241682, "epoch": 1438} {"train_loss": -11.697366714477539, "global_step": 241683, "epoch": 1438} {"train_loss": -11.860176086425781, "global_step": 241684, "epoch": 1438} {"train_loss": -11.876874923706055, "global_step": 241685, "epoch": 1438} {"train_loss": -11.746368408203125, "global_step": 241686, "epoch": 1438} {"train_loss": -11.72298812866211, "global_step": 241687, "epoch": 1438} {"train_loss": -11.822941780090332, "global_step": 241688, "epoch": 1438} {"train_loss": -11.818727493286133, "global_step": 241689, "epoch": 1438} {"train_loss": -11.638886451721191, "global_step": 241690, "epoch": 1438} {"train_loss": -11.842827796936035, "global_step": 241691, "epoch": 1438} {"train_loss": -11.640302658081055, "global_step": 241692, "epoch": 1438} {"train_loss": -12.089529037475586, "global_step": 241693, "epoch": 1438} {"train_loss": -11.904093742370605, "global_step": 241694, "epoch": 1438} {"train_loss": -11.913819313049316, "global_step": 241695, "epoch": 1438} {"train_loss": -11.785392761230469, "global_step": 241696, "epoch": 1438} {"train_loss": -11.768939971923828, "global_step": 241697, "epoch": 1438} {"train_loss": -11.839412689208984, "global_step": 241698, "epoch": 1438} {"train_loss": -11.92967414855957, "global_step": 241699, "epoch": 1438} {"train_loss": -11.730461120605469, "global_step": 241700, "epoch": 1438} {"train_loss": -11.788444519042969, "global_step": 241701, "epoch": 1438} {"train_loss": -11.908562660217285, "global_step": 241702, "epoch": 1438} {"train_loss": -11.999551773071289, "global_step": 241703, "epoch": 1438} {"train_loss": -12.13077449798584, "global_step": 241704, "epoch": 1438} {"train_loss": -12.001766204833984, "global_step": 241705, "epoch": 1438} {"train_loss": -12.16323471069336, "global_step": 241706, "epoch": 1438} {"train_loss": -12.022709846496582, "global_step": 241707, "epoch": 1438} {"train_loss": -11.946928024291992, "global_step": 241708, "epoch": 1438} {"train_loss": -12.143448829650879, "global_step": 241709, "epoch": 1438} {"train_loss": -11.766814231872559, "global_step": 241710, "epoch": 1438} {"train_loss": -12.27775764465332, "global_step": 241711, "epoch": 1438} {"train_loss": -11.790464401245117, "global_step": 241712, "epoch": 1438} {"train_loss": -11.853853225708008, "global_step": 241713, "epoch": 1438} {"train_loss": -11.835176467895508, "global_step": 241714, "epoch": 1438} {"train_loss": -11.611852645874023, "global_step": 241715, "epoch": 1438} {"train_loss": -11.53948974609375, "global_step": 241716, "epoch": 1438} {"train_loss": -11.749948501586914, "global_step": 241717, "epoch": 1438} {"train_loss": -11.527050018310547, "global_step": 241718, "epoch": 1438} {"train_loss": -11.653765678405762, "global_step": 241719, "epoch": 1438} {"train_loss": -11.897176742553711, "global_step": 241720, "epoch": 1438} {"train_loss": -11.463955879211426, "global_step": 241721, "epoch": 1438} {"train_loss": -11.21285629272461, "global_step": 241722, "epoch": 1438} {"train_loss": -11.11597728729248, "global_step": 241723, "epoch": 1438} {"train_loss": -11.807347297668457, "global_step": 241724, "epoch": 1438} {"train_loss": -10.644765853881836, "global_step": 241725, "epoch": 1438} {"train_loss": -11.729947090148926, "global_step": 241726, "epoch": 1438} {"train_loss": -10.968670845031738, "global_step": 241727, "epoch": 1438} {"train_loss": -11.12504768371582, "global_step": 241728, "epoch": 1438} {"train_loss": -11.668381690979004, "global_step": 241729, "epoch": 1438} {"train_loss": -10.738565444946289, "global_step": 241730, "epoch": 1438} {"train_loss": -11.693717956542969, "global_step": 241731, "epoch": 1438} {"train_loss": -10.13072681427002, "global_step": 241732, "epoch": 1438} {"train_loss": -11.871665954589844, "global_step": 241733, "epoch": 1438} {"train_loss": -10.927288055419922, "global_step": 241734, "epoch": 1438} {"train_loss": -11.250480651855469, "global_step": 241735, "epoch": 1438} {"train_loss": -11.02468490600586, "global_step": 241736, "epoch": 1438} {"train_loss": -11.225923538208008, "global_step": 241737, "epoch": 1438} {"train_loss": -10.36722183227539, "global_step": 241738, "epoch": 1438} {"train_loss": -10.782495498657227, "global_step": 241739, "epoch": 1438} {"train_loss": -11.519638061523438, "global_step": 241740, "epoch": 1438} {"train_loss": -11.170844078063965, "global_step": 241741, "epoch": 1438} {"train_loss": -11.362776756286621, "global_step": 241742, "epoch": 1438} {"train_loss": -11.1431884765625, "global_step": 241743, "epoch": 1438} {"train_loss": -10.755362510681152, "global_step": 241744, "epoch": 1438} {"train_loss": -11.473546028137207, "global_step": 241745, "epoch": 1438} {"train_loss": -10.57308578491211, "global_step": 241746, "epoch": 1438} {"train_loss": -11.70468521118164, "global_step": 241747, "epoch": 1438} {"train_loss": -10.78552532196045, "global_step": 241748, "epoch": 1438} {"train_loss": -10.662670135498047, "global_step": 241749, "epoch": 1438} {"train_loss": -11.901801109313965, "global_step": 241750, "epoch": 1438} {"train_loss": -11.436968650136675, "global_step": 241751, "epoch": 1438, "val_loss": 266248.78125} {"train_loss": -11.92410945892334, "global_step": 241752, "epoch": 1439} {"train_loss": -11.079888343811035, "global_step": 241753, "epoch": 1439} {"train_loss": -11.51215648651123, "global_step": 241754, "epoch": 1439} {"train_loss": -11.492626190185547, "global_step": 241755, "epoch": 1439} {"train_loss": -10.881366729736328, "global_step": 241756, "epoch": 1439} {"train_loss": -11.464845657348633, "global_step": 241757, "epoch": 1439} {"train_loss": -10.403339385986328, "global_step": 241758, "epoch": 1439} {"train_loss": -11.580432891845703, "global_step": 241759, "epoch": 1439} {"train_loss": -10.588227272033691, "global_step": 241760, "epoch": 1439} {"train_loss": -11.156417846679688, "global_step": 241761, "epoch": 1439} {"train_loss": -10.759485244750977, "global_step": 241762, "epoch": 1439} {"train_loss": -10.561079978942871, "global_step": 241763, "epoch": 1439} {"train_loss": -11.191742897033691, "global_step": 241764, "epoch": 1439} {"train_loss": -10.443023681640625, "global_step": 241765, "epoch": 1439} {"train_loss": -11.240503311157227, "global_step": 241766, "epoch": 1439} {"train_loss": -10.075613021850586, "global_step": 241767, "epoch": 1439} {"train_loss": -10.59135627746582, "global_step": 241768, "epoch": 1439} {"train_loss": -11.094194412231445, "global_step": 241769, "epoch": 1439} {"train_loss": -10.460920333862305, "global_step": 241770, "epoch": 1439} {"train_loss": -11.253189086914062, "global_step": 241771, "epoch": 1439} {"train_loss": -10.947708129882812, "global_step": 241772, "epoch": 1439} {"train_loss": -11.166461944580078, "global_step": 241773, "epoch": 1439} {"train_loss": -10.980178833007812, "global_step": 241774, "epoch": 1439} {"train_loss": -11.46809196472168, "global_step": 241775, "epoch": 1439} {"train_loss": -10.975421905517578, "global_step": 241776, "epoch": 1439} {"train_loss": -11.543902397155762, "global_step": 241777, "epoch": 1439} {"train_loss": -11.39280891418457, "global_step": 241778, "epoch": 1439} {"train_loss": -11.423730850219727, "global_step": 241779, "epoch": 1439} {"train_loss": -11.176976203918457, "global_step": 241780, "epoch": 1439} {"train_loss": -11.645347595214844, "global_step": 241781, "epoch": 1439} {"train_loss": -11.07223129272461, "global_step": 241782, "epoch": 1439} {"train_loss": -11.37619400024414, "global_step": 241783, "epoch": 1439} {"train_loss": -10.933778762817383, "global_step": 241784, "epoch": 1439} {"train_loss": -11.40591812133789, "global_step": 241785, "epoch": 1439} {"train_loss": -11.274673461914062, "global_step": 241786, "epoch": 1439} {"train_loss": -11.448575019836426, "global_step": 241787, "epoch": 1439} {"train_loss": -11.264163970947266, "global_step": 241788, "epoch": 1439} {"train_loss": -11.746034622192383, "global_step": 241789, "epoch": 1439} {"train_loss": -11.52387809753418, "global_step": 241790, "epoch": 1439} {"train_loss": -11.577043533325195, "global_step": 241791, "epoch": 1439} {"train_loss": -11.618839263916016, "global_step": 241792, "epoch": 1439} {"train_loss": -11.578344345092773, "global_step": 241793, "epoch": 1439} {"train_loss": -11.8265962600708, "global_step": 241794, "epoch": 1439} {"train_loss": -11.609779357910156, "global_step": 241795, "epoch": 1439} {"train_loss": -11.585103988647461, "global_step": 241796, "epoch": 1439} {"train_loss": -11.816299438476562, "global_step": 241797, "epoch": 1439} {"train_loss": -11.575418472290039, "global_step": 241798, "epoch": 1439} {"train_loss": -11.817176818847656, "global_step": 241799, "epoch": 1439} {"train_loss": -11.691723823547363, "global_step": 241800, "epoch": 1439} {"train_loss": -11.8617525100708, "global_step": 241801, "epoch": 1439} {"train_loss": -11.806497573852539, "global_step": 241802, "epoch": 1439} {"train_loss": -11.788704872131348, "global_step": 241803, "epoch": 1439} {"train_loss": -11.792402267456055, "global_step": 241804, "epoch": 1439} {"train_loss": -11.771525382995605, "global_step": 241805, "epoch": 1439} {"train_loss": -11.655190467834473, "global_step": 241806, "epoch": 1439} {"train_loss": -11.862337112426758, "global_step": 241807, "epoch": 1439} {"train_loss": -12.027467727661133, "global_step": 241808, "epoch": 1439} {"train_loss": -11.802416801452637, "global_step": 241809, "epoch": 1439} {"train_loss": -12.049074172973633, "global_step": 241810, "epoch": 1439} {"train_loss": -11.942753791809082, "global_step": 241811, "epoch": 1439} {"train_loss": -12.103004455566406, "global_step": 241812, "epoch": 1439} {"train_loss": -12.051862716674805, "global_step": 241813, "epoch": 1439} {"train_loss": -11.790164947509766, "global_step": 241814, "epoch": 1439} {"train_loss": -12.077190399169922, "global_step": 241815, "epoch": 1439} {"train_loss": -12.122285842895508, "global_step": 241816, "epoch": 1439} {"train_loss": -12.200161933898926, "global_step": 241817, "epoch": 1439} {"train_loss": -11.906792640686035, "global_step": 241818, "epoch": 1439} {"train_loss": -12.024308204650879, "global_step": 241819, "epoch": 1439} {"train_loss": -12.199398040771484, "global_step": 241820, "epoch": 1439} {"train_loss": -12.157794952392578, "global_step": 241821, "epoch": 1439} {"train_loss": -12.069869041442871, "global_step": 241822, "epoch": 1439} {"train_loss": -12.135669708251953, "global_step": 241823, "epoch": 1439} {"train_loss": -12.146234512329102, "global_step": 241824, "epoch": 1439} {"train_loss": -12.071163177490234, "global_step": 241825, "epoch": 1439} {"train_loss": -12.110179901123047, "global_step": 241826, "epoch": 1439} {"train_loss": -12.189697265625, "global_step": 241827, "epoch": 1439} {"train_loss": -11.907415390014648, "global_step": 241828, "epoch": 1439} {"train_loss": -12.162935256958008, "global_step": 241829, "epoch": 1439} {"train_loss": -12.110782623291016, "global_step": 241830, "epoch": 1439} {"train_loss": -12.248701095581055, "global_step": 241831, "epoch": 1439} {"train_loss": -11.997540473937988, "global_step": 241832, "epoch": 1439} {"train_loss": -12.133623123168945, "global_step": 241833, "epoch": 1439} {"train_loss": -12.155987739562988, "global_step": 241834, "epoch": 1439} {"train_loss": -12.05824089050293, "global_step": 241835, "epoch": 1439} {"train_loss": -12.315774917602539, "global_step": 241836, "epoch": 1439} {"train_loss": -12.182350158691406, "global_step": 241837, "epoch": 1439} {"train_loss": -12.411670684814453, "global_step": 241838, "epoch": 1439} {"train_loss": -12.165998458862305, "global_step": 241839, "epoch": 1439} {"train_loss": -12.316372871398926, "global_step": 241840, "epoch": 1439} {"train_loss": -11.933258056640625, "global_step": 241841, "epoch": 1439} {"train_loss": -12.113271713256836, "global_step": 241842, "epoch": 1439} {"train_loss": -12.182998657226562, "global_step": 241843, "epoch": 1439} {"train_loss": -12.124385833740234, "global_step": 241844, "epoch": 1439} {"train_loss": -12.064750671386719, "global_step": 241845, "epoch": 1439} {"train_loss": -12.236431121826172, "global_step": 241846, "epoch": 1439} {"train_loss": -12.057912826538086, "global_step": 241847, "epoch": 1439} {"train_loss": -11.920204162597656, "global_step": 241848, "epoch": 1439} {"train_loss": -11.988231658935547, "global_step": 241849, "epoch": 1439} {"train_loss": -10.938225746154785, "global_step": 241850, "epoch": 1439} {"train_loss": -10.398462295532227, "global_step": 241851, "epoch": 1439} {"train_loss": -11.643369674682617, "global_step": 241852, "epoch": 1439} {"train_loss": -11.828946113586426, "global_step": 241853, "epoch": 1439} {"train_loss": -12.03813362121582, "global_step": 241854, "epoch": 1439} {"train_loss": -11.976287841796875, "global_step": 241855, "epoch": 1439} {"train_loss": -11.087613105773926, "global_step": 241856, "epoch": 1439} {"train_loss": -12.048925399780273, "global_step": 241857, "epoch": 1439} {"train_loss": -11.618612289428711, "global_step": 241858, "epoch": 1439} {"train_loss": -11.700849533081055, "global_step": 241859, "epoch": 1439} {"train_loss": -12.023365020751953, "global_step": 241860, "epoch": 1439} {"train_loss": -11.261655807495117, "global_step": 241861, "epoch": 1439} {"train_loss": -11.88945484161377, "global_step": 241862, "epoch": 1439} {"train_loss": -10.576329231262207, "global_step": 241863, "epoch": 1439} {"train_loss": -11.174806594848633, "global_step": 241864, "epoch": 1439} {"train_loss": -11.191758155822754, "global_step": 241865, "epoch": 1439} {"train_loss": -10.941791534423828, "global_step": 241866, "epoch": 1439} {"train_loss": -8.533249855041504, "global_step": 241867, "epoch": 1439} {"train_loss": -9.306974411010742, "global_step": 241868, "epoch": 1439} {"train_loss": -8.583782196044922, "global_step": 241869, "epoch": 1439} {"train_loss": -9.2870512008667, "global_step": 241870, "epoch": 1439} {"train_loss": -8.490350723266602, "global_step": 241871, "epoch": 1439} {"train_loss": -8.102516174316406, "global_step": 241872, "epoch": 1439} {"train_loss": -8.10041618347168, "global_step": 241873, "epoch": 1439} {"train_loss": -9.719328880310059, "global_step": 241874, "epoch": 1439} {"train_loss": -9.192239761352539, "global_step": 241875, "epoch": 1439} {"train_loss": -8.1900634765625, "global_step": 241876, "epoch": 1439} {"train_loss": -9.263185501098633, "global_step": 241877, "epoch": 1439} {"train_loss": -9.73794174194336, "global_step": 241878, "epoch": 1439} {"train_loss": -10.473753929138184, "global_step": 241879, "epoch": 1439} {"train_loss": -10.20267391204834, "global_step": 241880, "epoch": 1439} {"train_loss": -10.644913673400879, "global_step": 241881, "epoch": 1439} {"train_loss": -10.338016510009766, "global_step": 241882, "epoch": 1439} {"train_loss": -10.558675765991211, "global_step": 241883, "epoch": 1439} {"train_loss": -10.633913040161133, "global_step": 241884, "epoch": 1439} {"train_loss": -9.68636703491211, "global_step": 241885, "epoch": 1439} {"train_loss": -10.995121002197266, "global_step": 241886, "epoch": 1439} {"train_loss": -9.374876976013184, "global_step": 241887, "epoch": 1439} {"train_loss": -10.793302536010742, "global_step": 241888, "epoch": 1439} {"train_loss": -9.111861228942871, "global_step": 241889, "epoch": 1439} {"train_loss": -10.330894470214844, "global_step": 241890, "epoch": 1439} {"train_loss": -9.379438400268555, "global_step": 241891, "epoch": 1439} {"train_loss": -10.537471771240234, "global_step": 241892, "epoch": 1439} {"train_loss": -9.3531494140625, "global_step": 241893, "epoch": 1439} {"train_loss": -10.35887336730957, "global_step": 241894, "epoch": 1439} {"train_loss": -9.94317626953125, "global_step": 241895, "epoch": 1439} {"train_loss": -11.125320434570312, "global_step": 241896, "epoch": 1439} {"train_loss": -10.728991508483887, "global_step": 241897, "epoch": 1439} {"train_loss": -10.7422513961792, "global_step": 241898, "epoch": 1439} {"train_loss": -11.029415130615234, "global_step": 241899, "epoch": 1439} {"train_loss": -10.653807640075684, "global_step": 241900, "epoch": 1439} {"train_loss": -11.473621368408203, "global_step": 241901, "epoch": 1439} {"train_loss": -11.18958568572998, "global_step": 241902, "epoch": 1439} {"train_loss": -11.138011932373047, "global_step": 241903, "epoch": 1439} {"train_loss": -11.185911178588867, "global_step": 241904, "epoch": 1439} {"train_loss": -10.941851615905762, "global_step": 241905, "epoch": 1439} {"train_loss": -11.236891746520996, "global_step": 241906, "epoch": 1439} {"train_loss": -10.991073608398438, "global_step": 241907, "epoch": 1439} {"train_loss": -11.155805587768555, "global_step": 241908, "epoch": 1439} {"train_loss": -11.193371772766113, "global_step": 241909, "epoch": 1439} {"train_loss": -11.542924880981445, "global_step": 241910, "epoch": 1439} {"train_loss": -11.541375160217285, "global_step": 241911, "epoch": 1439} {"train_loss": -11.46940803527832, "global_step": 241912, "epoch": 1439} {"train_loss": -11.429770469665527, "global_step": 241913, "epoch": 1439} {"train_loss": -11.521585464477539, "global_step": 241914, "epoch": 1439} {"train_loss": -11.605180740356445, "global_step": 241915, "epoch": 1439} {"train_loss": -11.523366928100586, "global_step": 241916, "epoch": 1439} {"train_loss": -11.394210815429688, "global_step": 241917, "epoch": 1439} {"train_loss": -11.299650192260742, "global_step": 241918, "epoch": 1439} {"train_loss": -11.220140190351577, "global_step": 241919, "epoch": 1439, "val_loss": 260714.203125} {"train_loss": -11.721488952636719, "global_step": 241920, "epoch": 1440} {"train_loss": -11.626472473144531, "global_step": 241921, "epoch": 1440} {"train_loss": -11.377693176269531, "global_step": 241922, "epoch": 1440} {"train_loss": -11.6134672164917, "global_step": 241923, "epoch": 1440} {"train_loss": -11.677305221557617, "global_step": 241924, "epoch": 1440} {"train_loss": -11.775254249572754, "global_step": 241925, "epoch": 1440} {"train_loss": -11.604486465454102, "global_step": 241926, "epoch": 1440} {"train_loss": -11.711359977722168, "global_step": 241927, "epoch": 1440} {"train_loss": -11.466907501220703, "global_step": 241928, "epoch": 1440} {"train_loss": -11.874526977539062, "global_step": 241929, "epoch": 1440} {"train_loss": -11.646894454956055, "global_step": 241930, "epoch": 1440} {"train_loss": -11.699203491210938, "global_step": 241931, "epoch": 1440} {"train_loss": -10.949941635131836, "global_step": 241932, "epoch": 1440} {"train_loss": -11.752277374267578, "global_step": 241933, "epoch": 1440} {"train_loss": -11.936856269836426, "global_step": 241934, "epoch": 1440} {"train_loss": -11.656477928161621, "global_step": 241935, "epoch": 1440} {"train_loss": -11.586971282958984, "global_step": 241936, "epoch": 1440} {"train_loss": -11.610223770141602, "global_step": 241937, "epoch": 1440} {"train_loss": -11.90414810180664, "global_step": 241938, "epoch": 1440} {"train_loss": -11.604280471801758, "global_step": 241939, "epoch": 1440} {"train_loss": -11.786433219909668, "global_step": 241940, "epoch": 1440} {"train_loss": -11.768207550048828, "global_step": 241941, "epoch": 1440} {"train_loss": -11.681318283081055, "global_step": 241942, "epoch": 1440} {"train_loss": -11.820228576660156, "global_step": 241943, "epoch": 1440} {"train_loss": -11.762138366699219, "global_step": 241944, "epoch": 1440} {"train_loss": -11.879104614257812, "global_step": 241945, "epoch": 1440} {"train_loss": -11.68144702911377, "global_step": 241946, "epoch": 1440} {"train_loss": -11.753748893737793, "global_step": 241947, "epoch": 1440} {"train_loss": -11.431939125061035, "global_step": 241948, "epoch": 1440} {"train_loss": -11.89586067199707, "global_step": 241949, "epoch": 1440} {"train_loss": -11.604808807373047, "global_step": 241950, "epoch": 1440} {"train_loss": -11.667231559753418, "global_step": 241951, "epoch": 1440} {"train_loss": -11.843219757080078, "global_step": 241952, "epoch": 1440} {"train_loss": -12.02214241027832, "global_step": 241953, "epoch": 1440} {"train_loss": -11.962949752807617, "global_step": 241954, "epoch": 1440} {"train_loss": -11.867120742797852, "global_step": 241955, "epoch": 1440} {"train_loss": -12.011863708496094, "global_step": 241956, "epoch": 1440} {"train_loss": -11.784403800964355, "global_step": 241957, "epoch": 1440} {"train_loss": -11.867574691772461, "global_step": 241958, "epoch": 1440} {"train_loss": -11.714338302612305, "global_step": 241959, "epoch": 1440} {"train_loss": -11.74488639831543, "global_step": 241960, "epoch": 1440} {"train_loss": -11.396312713623047, "global_step": 241961, "epoch": 1440} {"train_loss": -11.964118957519531, "global_step": 241962, "epoch": 1440} {"train_loss": -11.34492015838623, "global_step": 241963, "epoch": 1440} {"train_loss": -11.637710571289062, "global_step": 241964, "epoch": 1440} {"train_loss": -11.558347702026367, "global_step": 241965, "epoch": 1440} {"train_loss": -11.585251808166504, "global_step": 241966, "epoch": 1440} {"train_loss": -11.503235816955566, "global_step": 241967, "epoch": 1440} {"train_loss": -11.980070114135742, "global_step": 241968, "epoch": 1440} {"train_loss": -11.765437126159668, "global_step": 241969, "epoch": 1440} {"train_loss": -11.865534782409668, "global_step": 241970, "epoch": 1440} {"train_loss": -11.927772521972656, "global_step": 241971, "epoch": 1440} {"train_loss": -11.180074691772461, "global_step": 241972, "epoch": 1440} {"train_loss": -12.065513610839844, "global_step": 241973, "epoch": 1440} {"train_loss": -11.056863784790039, "global_step": 241974, "epoch": 1440} {"train_loss": -11.65304946899414, "global_step": 241975, "epoch": 1440} {"train_loss": -11.287046432495117, "global_step": 241976, "epoch": 1440} {"train_loss": -11.623987197875977, "global_step": 241977, "epoch": 1440} {"train_loss": -11.689264297485352, "global_step": 241978, "epoch": 1440} {"train_loss": -11.557281494140625, "global_step": 241979, "epoch": 1440} {"train_loss": -11.758916854858398, "global_step": 241980, "epoch": 1440} {"train_loss": -11.44048023223877, "global_step": 241981, "epoch": 1440} {"train_loss": -12.183442115783691, "global_step": 241982, "epoch": 1440} {"train_loss": -11.6151123046875, "global_step": 241983, "epoch": 1440} {"train_loss": -11.904626846313477, "global_step": 241984, "epoch": 1440} {"train_loss": -11.681900024414062, "global_step": 241985, "epoch": 1440} {"train_loss": -11.985906600952148, "global_step": 241986, "epoch": 1440} {"train_loss": -11.473230361938477, "global_step": 241987, "epoch": 1440} {"train_loss": -11.878230094909668, "global_step": 241988, "epoch": 1440} {"train_loss": -11.713216781616211, "global_step": 241989, "epoch": 1440} {"train_loss": -10.932723999023438, "global_step": 241990, "epoch": 1440} {"train_loss": -11.55792236328125, "global_step": 241991, "epoch": 1440} {"train_loss": -11.542078971862793, "global_step": 241992, "epoch": 1440} {"train_loss": -11.046905517578125, "global_step": 241993, "epoch": 1440} {"train_loss": -11.308465957641602, "global_step": 241994, "epoch": 1440} {"train_loss": -12.008997917175293, "global_step": 241995, "epoch": 1440} {"train_loss": -11.557052612304688, "global_step": 241996, "epoch": 1440} {"train_loss": -11.850786209106445, "global_step": 241997, "epoch": 1440} {"train_loss": -11.650703430175781, "global_step": 241998, "epoch": 1440} {"train_loss": -11.406018257141113, "global_step": 241999, "epoch": 1440} {"train_loss": -11.721014022827148, "global_step": 242000, "epoch": 1440} {"train_loss": -11.842896461486816, "global_step": 242001, "epoch": 1440} {"train_loss": -11.6524658203125, "global_step": 242002, "epoch": 1440} {"train_loss": -11.431549072265625, "global_step": 242003, "epoch": 1440} {"train_loss": -11.775527954101562, "global_step": 242004, "epoch": 1440} {"train_loss": -11.508781433105469, "global_step": 242005, "epoch": 1440} {"train_loss": -11.72518539428711, "global_step": 242006, "epoch": 1440} {"train_loss": -11.851448059082031, "global_step": 242007, "epoch": 1440} {"train_loss": -11.345794677734375, "global_step": 242008, "epoch": 1440} {"train_loss": -11.608981132507324, "global_step": 242009, "epoch": 1440} {"train_loss": -11.371959686279297, "global_step": 242010, "epoch": 1440} {"train_loss": -11.6878080368042, "global_step": 242011, "epoch": 1440} {"train_loss": -11.516270637512207, "global_step": 242012, "epoch": 1440} {"train_loss": -10.445385932922363, "global_step": 242013, "epoch": 1440} {"train_loss": -10.896562576293945, "global_step": 242014, "epoch": 1440} {"train_loss": -10.841850280761719, "global_step": 242015, "epoch": 1440} {"train_loss": -11.484025955200195, "global_step": 242016, "epoch": 1440} {"train_loss": -10.588440895080566, "global_step": 242017, "epoch": 1440} {"train_loss": -11.107987403869629, "global_step": 242018, "epoch": 1440} {"train_loss": -11.592260360717773, "global_step": 242019, "epoch": 1440} {"train_loss": -11.222556114196777, "global_step": 242020, "epoch": 1440} {"train_loss": -11.02592945098877, "global_step": 242021, "epoch": 1440} {"train_loss": -11.213218688964844, "global_step": 242022, "epoch": 1440} {"train_loss": -10.528190612792969, "global_step": 242023, "epoch": 1440} {"train_loss": -11.322256088256836, "global_step": 242024, "epoch": 1440} {"train_loss": -10.647855758666992, "global_step": 242025, "epoch": 1440} {"train_loss": -11.443620681762695, "global_step": 242026, "epoch": 1440} {"train_loss": -10.85380744934082, "global_step": 242027, "epoch": 1440} {"train_loss": -10.901939392089844, "global_step": 242028, "epoch": 1440} {"train_loss": -11.067813873291016, "global_step": 242029, "epoch": 1440} {"train_loss": -10.934351921081543, "global_step": 242030, "epoch": 1440} {"train_loss": -11.488022804260254, "global_step": 242031, "epoch": 1440} {"train_loss": -10.747398376464844, "global_step": 242032, "epoch": 1440} {"train_loss": -11.33140754699707, "global_step": 242033, "epoch": 1440} {"train_loss": -11.102540969848633, "global_step": 242034, "epoch": 1440} {"train_loss": -10.949511528015137, "global_step": 242035, "epoch": 1440} {"train_loss": -11.126415252685547, "global_step": 242036, "epoch": 1440} {"train_loss": -11.095979690551758, "global_step": 242037, "epoch": 1440} {"train_loss": -11.518025398254395, "global_step": 242038, "epoch": 1440} {"train_loss": -11.132882118225098, "global_step": 242039, "epoch": 1440} {"train_loss": -11.71595573425293, "global_step": 242040, "epoch": 1440} {"train_loss": -11.272063255310059, "global_step": 242041, "epoch": 1440} {"train_loss": -11.291895866394043, "global_step": 242042, "epoch": 1440} {"train_loss": -11.68399715423584, "global_step": 242043, "epoch": 1440} {"train_loss": -11.289146423339844, "global_step": 242044, "epoch": 1440} {"train_loss": -11.64507007598877, "global_step": 242045, "epoch": 1440} {"train_loss": -11.161619186401367, "global_step": 242046, "epoch": 1440} {"train_loss": -11.71742057800293, "global_step": 242047, "epoch": 1440} {"train_loss": -11.787660598754883, "global_step": 242048, "epoch": 1440} {"train_loss": -11.871944427490234, "global_step": 242049, "epoch": 1440} {"train_loss": -11.819686889648438, "global_step": 242050, "epoch": 1440} {"train_loss": -11.494364738464355, "global_step": 242051, "epoch": 1440} {"train_loss": -11.639717102050781, "global_step": 242052, "epoch": 1440} {"train_loss": -11.983516693115234, "global_step": 242053, "epoch": 1440} {"train_loss": -11.546555519104004, "global_step": 242054, "epoch": 1440} {"train_loss": -11.813238143920898, "global_step": 242055, "epoch": 1440} {"train_loss": -11.615946769714355, "global_step": 242056, "epoch": 1440} {"train_loss": -11.797555923461914, "global_step": 242057, "epoch": 1440} {"train_loss": -11.837376594543457, "global_step": 242058, "epoch": 1440} {"train_loss": -11.779261589050293, "global_step": 242059, "epoch": 1440} {"train_loss": -11.903401374816895, "global_step": 242060, "epoch": 1440} {"train_loss": -11.84970474243164, "global_step": 242061, "epoch": 1440} {"train_loss": -11.85899543762207, "global_step": 242062, "epoch": 1440} {"train_loss": -11.897750854492188, "global_step": 242063, "epoch": 1440} {"train_loss": -12.003538131713867, "global_step": 242064, "epoch": 1440} {"train_loss": -11.990501403808594, "global_step": 242065, "epoch": 1440} {"train_loss": -11.602333068847656, "global_step": 242066, "epoch": 1440} {"train_loss": -11.645965576171875, "global_step": 242067, "epoch": 1440} {"train_loss": -11.936403274536133, "global_step": 242068, "epoch": 1440} {"train_loss": -11.588088989257812, "global_step": 242069, "epoch": 1440} {"train_loss": -11.728435516357422, "global_step": 242070, "epoch": 1440} {"train_loss": -11.993160247802734, "global_step": 242071, "epoch": 1440} {"train_loss": -11.58398151397705, "global_step": 242072, "epoch": 1440} {"train_loss": -12.108558654785156, "global_step": 242073, "epoch": 1440} {"train_loss": -11.381721496582031, "global_step": 242074, "epoch": 1440} {"train_loss": -12.146352767944336, "global_step": 242075, "epoch": 1440} {"train_loss": -11.621187210083008, "global_step": 242076, "epoch": 1440} {"train_loss": -11.953560829162598, "global_step": 242077, "epoch": 1440} {"train_loss": -11.740886688232422, "global_step": 242078, "epoch": 1440} {"train_loss": -11.41203498840332, "global_step": 242079, "epoch": 1440} {"train_loss": -11.712462425231934, "global_step": 242080, "epoch": 1440} {"train_loss": -11.606992721557617, "global_step": 242081, "epoch": 1440} {"train_loss": -11.834598541259766, "global_step": 242082, "epoch": 1440} {"train_loss": -12.047697067260742, "global_step": 242083, "epoch": 1440} {"train_loss": -11.864563941955566, "global_step": 242084, "epoch": 1440} {"train_loss": -11.98202896118164, "global_step": 242085, "epoch": 1440} {"train_loss": -12.005525588989258, "global_step": 242086, "epoch": 1440} {"train_loss": -11.587838785988945, "global_step": 242087, "epoch": 1440, "val_loss": 260786.25, "train_action_mse_error": 2.0373988151550293} {"train_loss": -11.935193061828613, "global_step": 242088, "epoch": 1441} {"train_loss": -12.05370807647705, "global_step": 242089, "epoch": 1441} {"train_loss": -12.110432624816895, "global_step": 242090, "epoch": 1441} {"train_loss": -12.013014793395996, "global_step": 242091, "epoch": 1441} {"train_loss": -12.001206398010254, "global_step": 242092, "epoch": 1441} {"train_loss": -12.021345138549805, "global_step": 242093, "epoch": 1441} {"train_loss": -12.004695892333984, "global_step": 242094, "epoch": 1441} {"train_loss": -12.113870620727539, "global_step": 242095, "epoch": 1441} {"train_loss": -12.029427528381348, "global_step": 242096, "epoch": 1441} {"train_loss": -12.088277816772461, "global_step": 242097, "epoch": 1441} {"train_loss": -11.674972534179688, "global_step": 242098, "epoch": 1441} {"train_loss": -11.594826698303223, "global_step": 242099, "epoch": 1441} {"train_loss": -11.787015914916992, "global_step": 242100, "epoch": 1441} {"train_loss": -11.007932662963867, "global_step": 242101, "epoch": 1441} {"train_loss": -11.327839851379395, "global_step": 242102, "epoch": 1441} {"train_loss": -11.805103302001953, "global_step": 242103, "epoch": 1441} {"train_loss": -11.634735107421875, "global_step": 242104, "epoch": 1441} {"train_loss": -11.444958686828613, "global_step": 242105, "epoch": 1441} {"train_loss": -12.13567066192627, "global_step": 242106, "epoch": 1441} {"train_loss": -12.001453399658203, "global_step": 242107, "epoch": 1441} {"train_loss": -11.718613624572754, "global_step": 242108, "epoch": 1441} {"train_loss": -11.522417068481445, "global_step": 242109, "epoch": 1441} {"train_loss": -11.989019393920898, "global_step": 242110, "epoch": 1441} {"train_loss": -11.928943634033203, "global_step": 242111, "epoch": 1441} {"train_loss": -11.895515441894531, "global_step": 242112, "epoch": 1441} {"train_loss": -11.938255310058594, "global_step": 242113, "epoch": 1441} {"train_loss": -11.669567108154297, "global_step": 242114, "epoch": 1441} {"train_loss": -12.150586128234863, "global_step": 242115, "epoch": 1441} {"train_loss": -11.378650665283203, "global_step": 242116, "epoch": 1441} {"train_loss": -11.676961898803711, "global_step": 242117, "epoch": 1441} {"train_loss": -11.33711051940918, "global_step": 242118, "epoch": 1441} {"train_loss": -11.305538177490234, "global_step": 242119, "epoch": 1441} {"train_loss": -11.316865921020508, "global_step": 242120, "epoch": 1441} {"train_loss": -11.634851455688477, "global_step": 242121, "epoch": 1441} {"train_loss": -11.141129493713379, "global_step": 242122, "epoch": 1441} {"train_loss": -11.48946762084961, "global_step": 242123, "epoch": 1441} {"train_loss": -11.267675399780273, "global_step": 242124, "epoch": 1441} {"train_loss": -11.373617172241211, "global_step": 242125, "epoch": 1441} {"train_loss": -11.89093017578125, "global_step": 242126, "epoch": 1441} {"train_loss": -11.735017776489258, "global_step": 242127, "epoch": 1441} {"train_loss": -11.488200187683105, "global_step": 242128, "epoch": 1441} {"train_loss": -11.894468307495117, "global_step": 242129, "epoch": 1441} {"train_loss": -11.73320198059082, "global_step": 242130, "epoch": 1441} {"train_loss": -11.842827796936035, "global_step": 242131, "epoch": 1441} {"train_loss": -11.69465446472168, "global_step": 242132, "epoch": 1441} {"train_loss": -11.460418701171875, "global_step": 242133, "epoch": 1441} {"train_loss": -11.312135696411133, "global_step": 242134, "epoch": 1441} {"train_loss": -11.136103630065918, "global_step": 242135, "epoch": 1441} {"train_loss": -11.200718879699707, "global_step": 242136, "epoch": 1441} {"train_loss": -11.749551773071289, "global_step": 242137, "epoch": 1441} {"train_loss": -11.186281204223633, "global_step": 242138, "epoch": 1441} {"train_loss": -11.512065887451172, "global_step": 242139, "epoch": 1441} {"train_loss": -10.897594451904297, "global_step": 242140, "epoch": 1441} {"train_loss": -11.822254180908203, "global_step": 242141, "epoch": 1441} {"train_loss": -11.081561088562012, "global_step": 242142, "epoch": 1441} {"train_loss": -11.525705337524414, "global_step": 242143, "epoch": 1441} {"train_loss": -10.463069915771484, "global_step": 242144, "epoch": 1441} {"train_loss": -11.819931983947754, "global_step": 242145, "epoch": 1441} {"train_loss": -11.140098571777344, "global_step": 242146, "epoch": 1441} {"train_loss": -10.548944473266602, "global_step": 242147, "epoch": 1441} {"train_loss": -11.220462799072266, "global_step": 242148, "epoch": 1441} {"train_loss": -11.470251083374023, "global_step": 242149, "epoch": 1441} {"train_loss": -10.998292922973633, "global_step": 242150, "epoch": 1441} {"train_loss": -10.887443542480469, "global_step": 242151, "epoch": 1441} {"train_loss": -11.145992279052734, "global_step": 242152, "epoch": 1441} {"train_loss": -10.114706039428711, "global_step": 242153, "epoch": 1441} {"train_loss": -11.68459415435791, "global_step": 242154, "epoch": 1441} {"train_loss": -10.998838424682617, "global_step": 242155, "epoch": 1441} {"train_loss": -11.084075927734375, "global_step": 242156, "epoch": 1441} {"train_loss": -11.60775375366211, "global_step": 242157, "epoch": 1441} {"train_loss": -11.062582015991211, "global_step": 242158, "epoch": 1441} {"train_loss": -11.731285095214844, "global_step": 242159, "epoch": 1441} {"train_loss": -11.685630798339844, "global_step": 242160, "epoch": 1441} {"train_loss": -11.052286148071289, "global_step": 242161, "epoch": 1441} {"train_loss": -11.612985610961914, "global_step": 242162, "epoch": 1441} {"train_loss": -11.024412155151367, "global_step": 242163, "epoch": 1441} {"train_loss": -11.491270065307617, "global_step": 242164, "epoch": 1441} {"train_loss": -11.325891494750977, "global_step": 242165, "epoch": 1441} {"train_loss": -11.292028427124023, "global_step": 242166, "epoch": 1441} {"train_loss": -11.769329071044922, "global_step": 242167, "epoch": 1441} {"train_loss": -11.503039360046387, "global_step": 242168, "epoch": 1441} {"train_loss": -11.71273136138916, "global_step": 242169, "epoch": 1441} {"train_loss": -11.502208709716797, "global_step": 242170, "epoch": 1441} {"train_loss": -11.238495826721191, "global_step": 242171, "epoch": 1441} {"train_loss": -11.60344123840332, "global_step": 242172, "epoch": 1441} {"train_loss": -11.583888053894043, "global_step": 242173, "epoch": 1441} {"train_loss": -11.599084854125977, "global_step": 242174, "epoch": 1441} {"train_loss": -11.942601203918457, "global_step": 242175, "epoch": 1441} {"train_loss": -11.658416748046875, "global_step": 242176, "epoch": 1441} {"train_loss": -11.936601638793945, "global_step": 242177, "epoch": 1441} {"train_loss": -11.471456527709961, "global_step": 242178, "epoch": 1441} {"train_loss": -11.725112915039062, "global_step": 242179, "epoch": 1441} {"train_loss": -11.744800567626953, "global_step": 242180, "epoch": 1441} {"train_loss": -11.86862564086914, "global_step": 242181, "epoch": 1441} {"train_loss": -11.777487754821777, "global_step": 242182, "epoch": 1441} {"train_loss": -11.605812072753906, "global_step": 242183, "epoch": 1441} {"train_loss": -12.060860633850098, "global_step": 242184, "epoch": 1441} {"train_loss": -11.730926513671875, "global_step": 242185, "epoch": 1441} {"train_loss": -11.888129234313965, "global_step": 242186, "epoch": 1441} {"train_loss": -11.54861068725586, "global_step": 242187, "epoch": 1441} {"train_loss": -12.012899398803711, "global_step": 242188, "epoch": 1441} {"train_loss": -11.64017105102539, "global_step": 242189, "epoch": 1441} {"train_loss": -11.826362609863281, "global_step": 242190, "epoch": 1441} {"train_loss": -11.420160293579102, "global_step": 242191, "epoch": 1441} {"train_loss": -11.738117218017578, "global_step": 242192, "epoch": 1441} {"train_loss": -11.595659255981445, "global_step": 242193, "epoch": 1441} {"train_loss": -11.172540664672852, "global_step": 242194, "epoch": 1441} {"train_loss": -11.341060638427734, "global_step": 242195, "epoch": 1441} {"train_loss": -11.678115844726562, "global_step": 242196, "epoch": 1441} {"train_loss": -11.010568618774414, "global_step": 242197, "epoch": 1441} {"train_loss": -11.461621284484863, "global_step": 242198, "epoch": 1441} {"train_loss": -11.758697509765625, "global_step": 242199, "epoch": 1441} {"train_loss": -11.165517807006836, "global_step": 242200, "epoch": 1441} {"train_loss": -11.028205871582031, "global_step": 242201, "epoch": 1441} {"train_loss": -11.58694076538086, "global_step": 242202, "epoch": 1441} {"train_loss": -10.855302810668945, "global_step": 242203, "epoch": 1441} {"train_loss": -11.90880012512207, "global_step": 242204, "epoch": 1441} {"train_loss": -10.987499237060547, "global_step": 242205, "epoch": 1441} {"train_loss": -11.69903564453125, "global_step": 242206, "epoch": 1441} {"train_loss": -11.353778839111328, "global_step": 242207, "epoch": 1441} {"train_loss": -10.883890151977539, "global_step": 242208, "epoch": 1441} {"train_loss": -11.253332138061523, "global_step": 242209, "epoch": 1441} {"train_loss": -11.82010269165039, "global_step": 242210, "epoch": 1441} {"train_loss": -11.073606491088867, "global_step": 242211, "epoch": 1441} {"train_loss": -11.657575607299805, "global_step": 242212, "epoch": 1441} {"train_loss": -11.686931610107422, "global_step": 242213, "epoch": 1441} {"train_loss": -11.587041854858398, "global_step": 242214, "epoch": 1441} {"train_loss": -11.768125534057617, "global_step": 242215, "epoch": 1441} {"train_loss": -11.63996696472168, "global_step": 242216, "epoch": 1441} {"train_loss": -11.881702423095703, "global_step": 242217, "epoch": 1441} {"train_loss": -11.939340591430664, "global_step": 242218, "epoch": 1441} {"train_loss": -11.906686782836914, "global_step": 242219, "epoch": 1441} {"train_loss": -11.910612106323242, "global_step": 242220, "epoch": 1441} {"train_loss": -11.648791313171387, "global_step": 242221, "epoch": 1441} {"train_loss": -11.929220199584961, "global_step": 242222, "epoch": 1441} {"train_loss": -11.735252380371094, "global_step": 242223, "epoch": 1441} {"train_loss": -11.942245483398438, "global_step": 242224, "epoch": 1441} {"train_loss": -11.580850601196289, "global_step": 242225, "epoch": 1441} {"train_loss": -12.176697731018066, "global_step": 242226, "epoch": 1441} {"train_loss": -11.783668518066406, "global_step": 242227, "epoch": 1441} {"train_loss": -11.766165733337402, "global_step": 242228, "epoch": 1441} {"train_loss": -11.478926658630371, "global_step": 242229, "epoch": 1441} {"train_loss": -11.666942596435547, "global_step": 242230, "epoch": 1441} {"train_loss": -11.782651901245117, "global_step": 242231, "epoch": 1441} {"train_loss": -11.545195579528809, "global_step": 242232, "epoch": 1441} {"train_loss": -11.56192398071289, "global_step": 242233, "epoch": 1441} {"train_loss": -11.361211776733398, "global_step": 242234, "epoch": 1441} {"train_loss": -11.59407901763916, "global_step": 242235, "epoch": 1441} {"train_loss": -11.74999713897705, "global_step": 242236, "epoch": 1441} {"train_loss": -11.639098167419434, "global_step": 242237, "epoch": 1441} {"train_loss": -11.565082550048828, "global_step": 242238, "epoch": 1441} {"train_loss": -11.920860290527344, "global_step": 242239, "epoch": 1441} {"train_loss": -11.710832595825195, "global_step": 242240, "epoch": 1441} {"train_loss": -11.356736183166504, "global_step": 242241, "epoch": 1441} {"train_loss": -11.961414337158203, "global_step": 242242, "epoch": 1441} {"train_loss": -11.649402618408203, "global_step": 242243, "epoch": 1441} {"train_loss": -11.648174285888672, "global_step": 242244, "epoch": 1441} {"train_loss": -11.256199836730957, "global_step": 242245, "epoch": 1441} {"train_loss": -11.281274795532227, "global_step": 242246, "epoch": 1441} {"train_loss": -11.323540687561035, "global_step": 242247, "epoch": 1441} {"train_loss": -11.411495208740234, "global_step": 242248, "epoch": 1441} {"train_loss": -11.050028800964355, "global_step": 242249, "epoch": 1441} {"train_loss": -11.354232788085938, "global_step": 242250, "epoch": 1441} {"train_loss": -11.085437774658203, "global_step": 242251, "epoch": 1441} {"train_loss": -11.612468719482422, "global_step": 242252, "epoch": 1441} {"train_loss": -11.255027770996094, "global_step": 242253, "epoch": 1441} {"train_loss": -11.25426959991455, "global_step": 242254, "epoch": 1441} {"train_loss": -11.553685926255726, "global_step": 242255, "epoch": 1441, "val_loss": 264293.84375} {"train_loss": -10.891241073608398, "global_step": 242256, "epoch": 1442} {"train_loss": -11.023832321166992, "global_step": 242257, "epoch": 1442} {"train_loss": -10.155445098876953, "global_step": 242258, "epoch": 1442} {"train_loss": -11.477154731750488, "global_step": 242259, "epoch": 1442} {"train_loss": -10.453075408935547, "global_step": 242260, "epoch": 1442} {"train_loss": -11.22757339477539, "global_step": 242261, "epoch": 1442} {"train_loss": -10.468374252319336, "global_step": 242262, "epoch": 1442} {"train_loss": -8.962969779968262, "global_step": 242263, "epoch": 1442} {"train_loss": -8.99071216583252, "global_step": 242264, "epoch": 1442} {"train_loss": -10.438274383544922, "global_step": 242265, "epoch": 1442} {"train_loss": -10.124320983886719, "global_step": 242266, "epoch": 1442} {"train_loss": -9.773347854614258, "global_step": 242267, "epoch": 1442} {"train_loss": -10.589054107666016, "global_step": 242268, "epoch": 1442} {"train_loss": -10.697636604309082, "global_step": 242269, "epoch": 1442} {"train_loss": -10.84730339050293, "global_step": 242270, "epoch": 1442} {"train_loss": -11.325018882751465, "global_step": 242271, "epoch": 1442} {"train_loss": -10.514556884765625, "global_step": 242272, "epoch": 1442} {"train_loss": -10.560341835021973, "global_step": 242273, "epoch": 1442} {"train_loss": -11.15263843536377, "global_step": 242274, "epoch": 1442} {"train_loss": -9.968076705932617, "global_step": 242275, "epoch": 1442} {"train_loss": -11.382065773010254, "global_step": 242276, "epoch": 1442} {"train_loss": -10.71748161315918, "global_step": 242277, "epoch": 1442} {"train_loss": -11.014578819274902, "global_step": 242278, "epoch": 1442} {"train_loss": -11.212204933166504, "global_step": 242279, "epoch": 1442} {"train_loss": -11.212686538696289, "global_step": 242280, "epoch": 1442} {"train_loss": -11.332890510559082, "global_step": 242281, "epoch": 1442} {"train_loss": -11.576986312866211, "global_step": 242282, "epoch": 1442} {"train_loss": -11.029623031616211, "global_step": 242283, "epoch": 1442} {"train_loss": -11.398982048034668, "global_step": 242284, "epoch": 1442} {"train_loss": -11.414445877075195, "global_step": 242285, "epoch": 1442} {"train_loss": -11.387716293334961, "global_step": 242286, "epoch": 1442} {"train_loss": -11.346368789672852, "global_step": 242287, "epoch": 1442} {"train_loss": -11.081069946289062, "global_step": 242288, "epoch": 1442} {"train_loss": -11.512927055358887, "global_step": 242289, "epoch": 1442} {"train_loss": -11.147195816040039, "global_step": 242290, "epoch": 1442} {"train_loss": -11.541560173034668, "global_step": 242291, "epoch": 1442} {"train_loss": -11.159818649291992, "global_step": 242292, "epoch": 1442} {"train_loss": -11.542654037475586, "global_step": 242293, "epoch": 1442} {"train_loss": -11.257820129394531, "global_step": 242294, "epoch": 1442} {"train_loss": -11.708833694458008, "global_step": 242295, "epoch": 1442} {"train_loss": -11.403980255126953, "global_step": 242296, "epoch": 1442} {"train_loss": -11.219503402709961, "global_step": 242297, "epoch": 1442} {"train_loss": -11.533632278442383, "global_step": 242298, "epoch": 1442} {"train_loss": -11.33100700378418, "global_step": 242299, "epoch": 1442} {"train_loss": -11.730096817016602, "global_step": 242300, "epoch": 1442} {"train_loss": -11.27187442779541, "global_step": 242301, "epoch": 1442} {"train_loss": -11.665010452270508, "global_step": 242302, "epoch": 1442} {"train_loss": -11.506204605102539, "global_step": 242303, "epoch": 1442} {"train_loss": -11.724241256713867, "global_step": 242304, "epoch": 1442} {"train_loss": -11.51715087890625, "global_step": 242305, "epoch": 1442} {"train_loss": -11.419900894165039, "global_step": 242306, "epoch": 1442} {"train_loss": -11.592813491821289, "global_step": 242307, "epoch": 1442} {"train_loss": -11.448898315429688, "global_step": 242308, "epoch": 1442} {"train_loss": -11.735629081726074, "global_step": 242309, "epoch": 1442} {"train_loss": -11.49459457397461, "global_step": 242310, "epoch": 1442} {"train_loss": -11.840810775756836, "global_step": 242311, "epoch": 1442} {"train_loss": -11.206335067749023, "global_step": 242312, "epoch": 1442} {"train_loss": -11.845831871032715, "global_step": 242313, "epoch": 1442} {"train_loss": -11.721397399902344, "global_step": 242314, "epoch": 1442} {"train_loss": -11.652867317199707, "global_step": 242315, "epoch": 1442} {"train_loss": -11.753323554992676, "global_step": 242316, "epoch": 1442} {"train_loss": -11.670949935913086, "global_step": 242317, "epoch": 1442} {"train_loss": -11.713955879211426, "global_step": 242318, "epoch": 1442} {"train_loss": -11.764379501342773, "global_step": 242319, "epoch": 1442} {"train_loss": -11.593192100524902, "global_step": 242320, "epoch": 1442} {"train_loss": -11.80029582977295, "global_step": 242321, "epoch": 1442} {"train_loss": -11.729751586914062, "global_step": 242322, "epoch": 1442} {"train_loss": -11.544153213500977, "global_step": 242323, "epoch": 1442} {"train_loss": -11.886298179626465, "global_step": 242324, "epoch": 1442} {"train_loss": -11.432722091674805, "global_step": 242325, "epoch": 1442} {"train_loss": -11.858144760131836, "global_step": 242326, "epoch": 1442} {"train_loss": -11.692895889282227, "global_step": 242327, "epoch": 1442} {"train_loss": -11.884663581848145, "global_step": 242328, "epoch": 1442} {"train_loss": -11.90295696258545, "global_step": 242329, "epoch": 1442} {"train_loss": -11.961214065551758, "global_step": 242330, "epoch": 1442} {"train_loss": -11.814677238464355, "global_step": 242331, "epoch": 1442} {"train_loss": -11.773632049560547, "global_step": 242332, "epoch": 1442} {"train_loss": -11.793798446655273, "global_step": 242333, "epoch": 1442} {"train_loss": -11.687549591064453, "global_step": 242334, "epoch": 1442} {"train_loss": -11.955602645874023, "global_step": 242335, "epoch": 1442} {"train_loss": -11.657922744750977, "global_step": 242336, "epoch": 1442} {"train_loss": -11.82435417175293, "global_step": 242337, "epoch": 1442} {"train_loss": -11.630966186523438, "global_step": 242338, "epoch": 1442} {"train_loss": -11.89400863647461, "global_step": 242339, "epoch": 1442} {"train_loss": -11.82822322845459, "global_step": 242340, "epoch": 1442} {"train_loss": -11.815220832824707, "global_step": 242341, "epoch": 1442} {"train_loss": -11.83144760131836, "global_step": 242342, "epoch": 1442} {"train_loss": -11.78769302368164, "global_step": 242343, "epoch": 1442} {"train_loss": -11.931222915649414, "global_step": 242344, "epoch": 1442} {"train_loss": -11.929312705993652, "global_step": 242345, "epoch": 1442} {"train_loss": -11.913727760314941, "global_step": 242346, "epoch": 1442} {"train_loss": -11.932306289672852, "global_step": 242347, "epoch": 1442} {"train_loss": -11.89361572265625, "global_step": 242348, "epoch": 1442} {"train_loss": -12.22415542602539, "global_step": 242349, "epoch": 1442} {"train_loss": -11.807114601135254, "global_step": 242350, "epoch": 1442} {"train_loss": -12.01036262512207, "global_step": 242351, "epoch": 1442} {"train_loss": -11.965965270996094, "global_step": 242352, "epoch": 1442} {"train_loss": -12.061473846435547, "global_step": 242353, "epoch": 1442} {"train_loss": -11.926535606384277, "global_step": 242354, "epoch": 1442} {"train_loss": -11.975714683532715, "global_step": 242355, "epoch": 1442} {"train_loss": -12.086952209472656, "global_step": 242356, "epoch": 1442} {"train_loss": -12.031899452209473, "global_step": 242357, "epoch": 1442} {"train_loss": -12.198371887207031, "global_step": 242358, "epoch": 1442} {"train_loss": -11.850954055786133, "global_step": 242359, "epoch": 1442} {"train_loss": -12.003843307495117, "global_step": 242360, "epoch": 1442} {"train_loss": -12.298211097717285, "global_step": 242361, "epoch": 1442} {"train_loss": -11.828460693359375, "global_step": 242362, "epoch": 1442} {"train_loss": -12.00520133972168, "global_step": 242363, "epoch": 1442} {"train_loss": -11.68610954284668, "global_step": 242364, "epoch": 1442} {"train_loss": -11.843748092651367, "global_step": 242365, "epoch": 1442} {"train_loss": -11.62598991394043, "global_step": 242366, "epoch": 1442} {"train_loss": -11.931185722351074, "global_step": 242367, "epoch": 1442} {"train_loss": -12.067268371582031, "global_step": 242368, "epoch": 1442} {"train_loss": -11.835229873657227, "global_step": 242369, "epoch": 1442} {"train_loss": -11.054449081420898, "global_step": 242370, "epoch": 1442} {"train_loss": -8.20460033416748, "global_step": 242371, "epoch": 1442} {"train_loss": -11.36162281036377, "global_step": 242372, "epoch": 1442} {"train_loss": -9.704092025756836, "global_step": 242373, "epoch": 1442} {"train_loss": -9.864500999450684, "global_step": 242374, "epoch": 1442} {"train_loss": -10.503009796142578, "global_step": 242375, "epoch": 1442} {"train_loss": -11.569443702697754, "global_step": 242376, "epoch": 1442} {"train_loss": -11.211181640625, "global_step": 242377, "epoch": 1442} {"train_loss": -11.134023666381836, "global_step": 242378, "epoch": 1442} {"train_loss": -11.55705451965332, "global_step": 242379, "epoch": 1442} {"train_loss": -11.187714576721191, "global_step": 242380, "epoch": 1442} {"train_loss": -10.006948471069336, "global_step": 242381, "epoch": 1442} {"train_loss": -11.1693115234375, "global_step": 242382, "epoch": 1442} {"train_loss": -10.714302062988281, "global_step": 242383, "epoch": 1442} {"train_loss": -10.217083930969238, "global_step": 242384, "epoch": 1442} {"train_loss": -10.349973678588867, "global_step": 242385, "epoch": 1442} {"train_loss": -10.722047805786133, "global_step": 242386, "epoch": 1442} {"train_loss": -9.062484741210938, "global_step": 242387, "epoch": 1442} {"train_loss": -10.638216018676758, "global_step": 242388, "epoch": 1442} {"train_loss": -8.560325622558594, "global_step": 242389, "epoch": 1442} {"train_loss": -11.263272285461426, "global_step": 242390, "epoch": 1442} {"train_loss": -10.46867847442627, "global_step": 242391, "epoch": 1442} {"train_loss": -10.643058776855469, "global_step": 242392, "epoch": 1442} {"train_loss": -11.028708457946777, "global_step": 242393, "epoch": 1442} {"train_loss": -10.754493713378906, "global_step": 242394, "epoch": 1442} {"train_loss": -10.569060325622559, "global_step": 242395, "epoch": 1442} {"train_loss": -10.948160171508789, "global_step": 242396, "epoch": 1442} {"train_loss": -9.726049423217773, "global_step": 242397, "epoch": 1442} {"train_loss": -10.83558464050293, "global_step": 242398, "epoch": 1442} {"train_loss": -11.306464195251465, "global_step": 242399, "epoch": 1442} {"train_loss": -11.269781112670898, "global_step": 242400, "epoch": 1442} {"train_loss": -11.495731353759766, "global_step": 242401, "epoch": 1442} {"train_loss": -11.323616027832031, "global_step": 242402, "epoch": 1442} {"train_loss": -10.964372634887695, "global_step": 242403, "epoch": 1442} {"train_loss": -11.617620468139648, "global_step": 242404, "epoch": 1442} {"train_loss": -10.830850601196289, "global_step": 242405, "epoch": 1442} {"train_loss": -11.57819938659668, "global_step": 242406, "epoch": 1442} {"train_loss": -11.102493286132812, "global_step": 242407, "epoch": 1442} {"train_loss": -10.985036849975586, "global_step": 242408, "epoch": 1442} {"train_loss": -11.232707977294922, "global_step": 242409, "epoch": 1442} {"train_loss": -10.634025573730469, "global_step": 242410, "epoch": 1442} {"train_loss": -11.079133987426758, "global_step": 242411, "epoch": 1442} {"train_loss": -11.195415496826172, "global_step": 242412, "epoch": 1442} {"train_loss": -10.490554809570312, "global_step": 242413, "epoch": 1442} {"train_loss": -11.299668312072754, "global_step": 242414, "epoch": 1442} {"train_loss": -10.633682250976562, "global_step": 242415, "epoch": 1442} {"train_loss": -10.592544555664062, "global_step": 242416, "epoch": 1442} {"train_loss": -11.324325561523438, "global_step": 242417, "epoch": 1442} {"train_loss": -10.595603942871094, "global_step": 242418, "epoch": 1442} {"train_loss": -10.868035316467285, "global_step": 242419, "epoch": 1442} {"train_loss": -11.558530807495117, "global_step": 242420, "epoch": 1442} {"train_loss": -10.796818733215332, "global_step": 242421, "epoch": 1442} {"train_loss": -11.210674285888672, "global_step": 242422, "epoch": 1442} {"train_loss": -11.244037196749733, "global_step": 242423, "epoch": 1442, "val_loss": 265381.625} {"train_loss": -11.159915924072266, "global_step": 242424, "epoch": 1443} {"train_loss": -11.362629890441895, "global_step": 242425, "epoch": 1443} {"train_loss": -11.606823921203613, "global_step": 242426, "epoch": 1443} {"train_loss": -11.299894332885742, "global_step": 242427, "epoch": 1443} {"train_loss": -11.590303421020508, "global_step": 242428, "epoch": 1443} {"train_loss": -11.433124542236328, "global_step": 242429, "epoch": 1443} {"train_loss": -11.435229301452637, "global_step": 242430, "epoch": 1443} {"train_loss": -11.303487777709961, "global_step": 242431, "epoch": 1443} {"train_loss": -11.696539878845215, "global_step": 242432, "epoch": 1443} {"train_loss": -11.43333625793457, "global_step": 242433, "epoch": 1443} {"train_loss": -11.737848281860352, "global_step": 242434, "epoch": 1443} {"train_loss": -11.533388137817383, "global_step": 242435, "epoch": 1443} {"train_loss": -11.512284278869629, "global_step": 242436, "epoch": 1443} {"train_loss": -11.712345123291016, "global_step": 242437, "epoch": 1443} {"train_loss": -11.713939666748047, "global_step": 242438, "epoch": 1443} {"train_loss": -11.636524200439453, "global_step": 242439, "epoch": 1443} {"train_loss": -11.537740707397461, "global_step": 242440, "epoch": 1443} {"train_loss": -11.55826187133789, "global_step": 242441, "epoch": 1443} {"train_loss": -11.604602813720703, "global_step": 242442, "epoch": 1443} {"train_loss": -11.773782730102539, "global_step": 242443, "epoch": 1443} {"train_loss": -11.753572463989258, "global_step": 242444, "epoch": 1443} {"train_loss": -11.753437042236328, "global_step": 242445, "epoch": 1443} {"train_loss": -11.559415817260742, "global_step": 242446, "epoch": 1443} {"train_loss": -11.845418930053711, "global_step": 242447, "epoch": 1443} {"train_loss": -11.826837539672852, "global_step": 242448, "epoch": 1443} {"train_loss": -11.912826538085938, "global_step": 242449, "epoch": 1443} {"train_loss": -11.961889266967773, "global_step": 242450, "epoch": 1443} {"train_loss": -11.856592178344727, "global_step": 242451, "epoch": 1443} {"train_loss": -11.996346473693848, "global_step": 242452, "epoch": 1443} {"train_loss": -12.021392822265625, "global_step": 242453, "epoch": 1443} {"train_loss": -12.036314964294434, "global_step": 242454, "epoch": 1443} {"train_loss": -12.0029878616333, "global_step": 242455, "epoch": 1443} {"train_loss": -11.967613220214844, "global_step": 242456, "epoch": 1443} {"train_loss": -11.840972900390625, "global_step": 242457, "epoch": 1443} {"train_loss": -11.80154037475586, "global_step": 242458, "epoch": 1443} {"train_loss": -11.87826919555664, "global_step": 242459, "epoch": 1443} {"train_loss": -11.763337135314941, "global_step": 242460, "epoch": 1443} {"train_loss": -11.831976890563965, "global_step": 242461, "epoch": 1443} {"train_loss": -11.917024612426758, "global_step": 242462, "epoch": 1443} {"train_loss": -11.993590354919434, "global_step": 242463, "epoch": 1443} {"train_loss": -11.76724910736084, "global_step": 242464, "epoch": 1443} {"train_loss": -12.021157264709473, "global_step": 242465, "epoch": 1443} {"train_loss": -11.83327865600586, "global_step": 242466, "epoch": 1443} {"train_loss": -12.02656078338623, "global_step": 242467, "epoch": 1443} {"train_loss": -12.059810638427734, "global_step": 242468, "epoch": 1443} {"train_loss": -11.946627616882324, "global_step": 242469, "epoch": 1443} {"train_loss": -12.080191612243652, "global_step": 242470, "epoch": 1443} {"train_loss": -12.077177047729492, "global_step": 242471, "epoch": 1443} {"train_loss": -11.733489990234375, "global_step": 242472, "epoch": 1443} {"train_loss": -12.170222282409668, "global_step": 242473, "epoch": 1443} {"train_loss": -12.028802871704102, "global_step": 242474, "epoch": 1443} {"train_loss": -12.109332084655762, "global_step": 242475, "epoch": 1443} {"train_loss": -12.037015914916992, "global_step": 242476, "epoch": 1443} {"train_loss": -12.003364562988281, "global_step": 242477, "epoch": 1443} {"train_loss": -12.13854694366455, "global_step": 242478, "epoch": 1443} {"train_loss": -12.007801055908203, "global_step": 242479, "epoch": 1443} {"train_loss": -12.201257705688477, "global_step": 242480, "epoch": 1443} {"train_loss": -11.989936828613281, "global_step": 242481, "epoch": 1443} {"train_loss": -12.280131340026855, "global_step": 242482, "epoch": 1443} {"train_loss": -11.924972534179688, "global_step": 242483, "epoch": 1443} {"train_loss": -12.21702766418457, "global_step": 242484, "epoch": 1443} {"train_loss": -12.017009735107422, "global_step": 242485, "epoch": 1443} {"train_loss": -12.175092697143555, "global_step": 242486, "epoch": 1443} {"train_loss": -12.173768043518066, "global_step": 242487, "epoch": 1443} {"train_loss": -12.112375259399414, "global_step": 242488, "epoch": 1443} {"train_loss": -11.824847221374512, "global_step": 242489, "epoch": 1443} {"train_loss": -11.994367599487305, "global_step": 242490, "epoch": 1443} {"train_loss": -12.033899307250977, "global_step": 242491, "epoch": 1443} {"train_loss": -12.249085426330566, "global_step": 242492, "epoch": 1443} {"train_loss": -11.942995071411133, "global_step": 242493, "epoch": 1443} {"train_loss": -12.16274356842041, "global_step": 242494, "epoch": 1443} {"train_loss": -11.969124794006348, "global_step": 242495, "epoch": 1443} {"train_loss": -11.906412124633789, "global_step": 242496, "epoch": 1443} {"train_loss": -11.71580696105957, "global_step": 242497, "epoch": 1443} {"train_loss": -12.169975280761719, "global_step": 242498, "epoch": 1443} {"train_loss": -11.8811616897583, "global_step": 242499, "epoch": 1443} {"train_loss": -11.223255157470703, "global_step": 242500, "epoch": 1443} {"train_loss": -11.971960067749023, "global_step": 242501, "epoch": 1443} {"train_loss": -11.987918853759766, "global_step": 242502, "epoch": 1443} {"train_loss": -12.116645812988281, "global_step": 242503, "epoch": 1443} {"train_loss": -11.558191299438477, "global_step": 242504, "epoch": 1443} {"train_loss": -11.746237754821777, "global_step": 242505, "epoch": 1443} {"train_loss": -11.981061935424805, "global_step": 242506, "epoch": 1443} {"train_loss": -11.898176193237305, "global_step": 242507, "epoch": 1443} {"train_loss": -11.862051963806152, "global_step": 242508, "epoch": 1443} {"train_loss": -11.681974411010742, "global_step": 242509, "epoch": 1443} {"train_loss": -11.470999717712402, "global_step": 242510, "epoch": 1443} {"train_loss": -11.908470153808594, "global_step": 242511, "epoch": 1443} {"train_loss": -12.229904174804688, "global_step": 242512, "epoch": 1443} {"train_loss": -11.723856925964355, "global_step": 242513, "epoch": 1443} {"train_loss": -11.630817413330078, "global_step": 242514, "epoch": 1443} {"train_loss": -11.613964080810547, "global_step": 242515, "epoch": 1443} {"train_loss": -12.075682640075684, "global_step": 242516, "epoch": 1443} {"train_loss": -11.673527717590332, "global_step": 242517, "epoch": 1443} {"train_loss": -11.755414962768555, "global_step": 242518, "epoch": 1443} {"train_loss": -12.027588844299316, "global_step": 242519, "epoch": 1443} {"train_loss": -12.021963119506836, "global_step": 242520, "epoch": 1443} {"train_loss": -11.96878433227539, "global_step": 242521, "epoch": 1443} {"train_loss": -11.75123405456543, "global_step": 242522, "epoch": 1443} {"train_loss": -11.815571784973145, "global_step": 242523, "epoch": 1443} {"train_loss": -10.949079513549805, "global_step": 242524, "epoch": 1443} {"train_loss": -10.528584480285645, "global_step": 242525, "epoch": 1443} {"train_loss": -10.4716215133667, "global_step": 242526, "epoch": 1443} {"train_loss": -10.924860000610352, "global_step": 242527, "epoch": 1443} {"train_loss": -10.04991340637207, "global_step": 242528, "epoch": 1443} {"train_loss": -10.427054405212402, "global_step": 242529, "epoch": 1443} {"train_loss": -11.19780445098877, "global_step": 242530, "epoch": 1443} {"train_loss": -8.938772201538086, "global_step": 242531, "epoch": 1443} {"train_loss": -11.537712097167969, "global_step": 242532, "epoch": 1443} {"train_loss": -7.40389347076416, "global_step": 242533, "epoch": 1443} {"train_loss": -9.595603942871094, "global_step": 242534, "epoch": 1443} {"train_loss": -9.7837495803833, "global_step": 242535, "epoch": 1443} {"train_loss": -7.709767818450928, "global_step": 242536, "epoch": 1443} {"train_loss": -7.501656532287598, "global_step": 242537, "epoch": 1443} {"train_loss": -7.738650321960449, "global_step": 242538, "epoch": 1443} {"train_loss": -8.358659744262695, "global_step": 242539, "epoch": 1443} {"train_loss": -8.426801681518555, "global_step": 242540, "epoch": 1443} {"train_loss": -8.981128692626953, "global_step": 242541, "epoch": 1443} {"train_loss": -8.063987731933594, "global_step": 242542, "epoch": 1443} {"train_loss": -9.663216590881348, "global_step": 242543, "epoch": 1443} {"train_loss": -8.32278823852539, "global_step": 242544, "epoch": 1443} {"train_loss": -9.9470796585083, "global_step": 242545, "epoch": 1443} {"train_loss": -8.760931015014648, "global_step": 242546, "epoch": 1443} {"train_loss": -10.975738525390625, "global_step": 242547, "epoch": 1443} {"train_loss": -10.657879829406738, "global_step": 242548, "epoch": 1443} {"train_loss": -10.259243965148926, "global_step": 242549, "epoch": 1443} {"train_loss": -10.52924919128418, "global_step": 242550, "epoch": 1443} {"train_loss": -10.246498107910156, "global_step": 242551, "epoch": 1443} {"train_loss": -10.605266571044922, "global_step": 242552, "epoch": 1443} {"train_loss": -10.761987686157227, "global_step": 242553, "epoch": 1443} {"train_loss": -10.949662208557129, "global_step": 242554, "epoch": 1443} {"train_loss": -10.30798625946045, "global_step": 242555, "epoch": 1443} {"train_loss": -11.041424751281738, "global_step": 242556, "epoch": 1443} {"train_loss": -10.446931838989258, "global_step": 242557, "epoch": 1443} {"train_loss": -10.614395141601562, "global_step": 242558, "epoch": 1443} {"train_loss": -10.717073440551758, "global_step": 242559, "epoch": 1443} {"train_loss": -10.328648567199707, "global_step": 242560, "epoch": 1443} {"train_loss": -10.994547843933105, "global_step": 242561, "epoch": 1443} {"train_loss": -10.93092155456543, "global_step": 242562, "epoch": 1443} {"train_loss": -11.115942001342773, "global_step": 242563, "epoch": 1443} {"train_loss": -11.069816589355469, "global_step": 242564, "epoch": 1443} {"train_loss": -11.240962028503418, "global_step": 242565, "epoch": 1443} {"train_loss": -10.98693561553955, "global_step": 242566, "epoch": 1443} {"train_loss": -10.875368118286133, "global_step": 242567, "epoch": 1443} {"train_loss": -11.296611785888672, "global_step": 242568, "epoch": 1443} {"train_loss": -11.413296699523926, "global_step": 242569, "epoch": 1443} {"train_loss": -10.797697067260742, "global_step": 242570, "epoch": 1443} {"train_loss": -11.335014343261719, "global_step": 242571, "epoch": 1443} {"train_loss": -10.998190879821777, "global_step": 242572, "epoch": 1443} {"train_loss": -11.012857437133789, "global_step": 242573, "epoch": 1443} {"train_loss": -11.465720176696777, "global_step": 242574, "epoch": 1443} {"train_loss": -11.285722732543945, "global_step": 242575, "epoch": 1443} {"train_loss": -11.349382400512695, "global_step": 242576, "epoch": 1443} {"train_loss": -11.34171199798584, "global_step": 242577, "epoch": 1443} {"train_loss": -11.366817474365234, "global_step": 242578, "epoch": 1443} {"train_loss": -11.409698486328125, "global_step": 242579, "epoch": 1443} {"train_loss": -11.292642593383789, "global_step": 242580, "epoch": 1443} {"train_loss": -11.479952812194824, "global_step": 242581, "epoch": 1443} {"train_loss": -11.409667015075684, "global_step": 242582, "epoch": 1443} {"train_loss": -11.317789077758789, "global_step": 242583, "epoch": 1443} {"train_loss": -11.731961250305176, "global_step": 242584, "epoch": 1443} {"train_loss": -11.286852836608887, "global_step": 242585, "epoch": 1443} {"train_loss": -11.510456085205078, "global_step": 242586, "epoch": 1443} {"train_loss": -11.66171932220459, "global_step": 242587, "epoch": 1443} {"train_loss": -11.478134155273438, "global_step": 242588, "epoch": 1443} {"train_loss": -11.56755256652832, "global_step": 242589, "epoch": 1443} {"train_loss": -11.434194564819336, "global_step": 242590, "epoch": 1443} {"train_loss": -11.30240508772078, "global_step": 242591, "epoch": 1443, "val_loss": 264663.84375} {"train_loss": -11.635732650756836, "global_step": 242592, "epoch": 1444} {"train_loss": -11.590154647827148, "global_step": 242593, "epoch": 1444} {"train_loss": -11.740904808044434, "global_step": 242594, "epoch": 1444} {"train_loss": -11.513921737670898, "global_step": 242595, "epoch": 1444} {"train_loss": -11.676494598388672, "global_step": 242596, "epoch": 1444} {"train_loss": -11.672908782958984, "global_step": 242597, "epoch": 1444} {"train_loss": -11.816547393798828, "global_step": 242598, "epoch": 1444} {"train_loss": -11.84237289428711, "global_step": 242599, "epoch": 1444} {"train_loss": -11.85032844543457, "global_step": 242600, "epoch": 1444} {"train_loss": -11.76777458190918, "global_step": 242601, "epoch": 1444} {"train_loss": -11.878158569335938, "global_step": 242602, "epoch": 1444} {"train_loss": -11.882661819458008, "global_step": 242603, "epoch": 1444} {"train_loss": -11.796402931213379, "global_step": 242604, "epoch": 1444} {"train_loss": -11.799501419067383, "global_step": 242605, "epoch": 1444} {"train_loss": -11.9364013671875, "global_step": 242606, "epoch": 1444} {"train_loss": -11.710777282714844, "global_step": 242607, "epoch": 1444} {"train_loss": -11.846601486206055, "global_step": 242608, "epoch": 1444} {"train_loss": -11.940847396850586, "global_step": 242609, "epoch": 1444} {"train_loss": -11.594422340393066, "global_step": 242610, "epoch": 1444} {"train_loss": -11.935164451599121, "global_step": 242611, "epoch": 1444} {"train_loss": -11.942713737487793, "global_step": 242612, "epoch": 1444} {"train_loss": -11.8707857131958, "global_step": 242613, "epoch": 1444} {"train_loss": -11.853856086730957, "global_step": 242614, "epoch": 1444} {"train_loss": -12.070808410644531, "global_step": 242615, "epoch": 1444} {"train_loss": -12.053895950317383, "global_step": 242616, "epoch": 1444} {"train_loss": -12.079141616821289, "global_step": 242617, "epoch": 1444} {"train_loss": -11.919929504394531, "global_step": 242618, "epoch": 1444} {"train_loss": -12.088730812072754, "global_step": 242619, "epoch": 1444} {"train_loss": -12.018077850341797, "global_step": 242620, "epoch": 1444} {"train_loss": -11.906705856323242, "global_step": 242621, "epoch": 1444} {"train_loss": -11.846373558044434, "global_step": 242622, "epoch": 1444} {"train_loss": -12.029427528381348, "global_step": 242623, "epoch": 1444} {"train_loss": -12.014104843139648, "global_step": 242624, "epoch": 1444} {"train_loss": -12.196174621582031, "global_step": 242625, "epoch": 1444} {"train_loss": -11.813006401062012, "global_step": 242626, "epoch": 1444} {"train_loss": -11.766544342041016, "global_step": 242627, "epoch": 1444} {"train_loss": -11.946462631225586, "global_step": 242628, "epoch": 1444} {"train_loss": -11.942360877990723, "global_step": 242629, "epoch": 1444} {"train_loss": -11.953628540039062, "global_step": 242630, "epoch": 1444} {"train_loss": -12.007710456848145, "global_step": 242631, "epoch": 1444} {"train_loss": -11.896998405456543, "global_step": 242632, "epoch": 1444} {"train_loss": -11.935011863708496, "global_step": 242633, "epoch": 1444} {"train_loss": -11.988594055175781, "global_step": 242634, "epoch": 1444} {"train_loss": -12.169610977172852, "global_step": 242635, "epoch": 1444} {"train_loss": -12.00497817993164, "global_step": 242636, "epoch": 1444} {"train_loss": -12.232402801513672, "global_step": 242637, "epoch": 1444} {"train_loss": -12.05324649810791, "global_step": 242638, "epoch": 1444} {"train_loss": -12.063369750976562, "global_step": 242639, "epoch": 1444} {"train_loss": -12.06085205078125, "global_step": 242640, "epoch": 1444} {"train_loss": -11.893535614013672, "global_step": 242641, "epoch": 1444} {"train_loss": -12.378284454345703, "global_step": 242642, "epoch": 1444} {"train_loss": -11.754975318908691, "global_step": 242643, "epoch": 1444} {"train_loss": -12.134052276611328, "global_step": 242644, "epoch": 1444} {"train_loss": -12.083370208740234, "global_step": 242645, "epoch": 1444} {"train_loss": -11.684846878051758, "global_step": 242646, "epoch": 1444} {"train_loss": -11.781929016113281, "global_step": 242647, "epoch": 1444} {"train_loss": -12.051704406738281, "global_step": 242648, "epoch": 1444} {"train_loss": -11.902925491333008, "global_step": 242649, "epoch": 1444} {"train_loss": -11.787290573120117, "global_step": 242650, "epoch": 1444} {"train_loss": -11.311478614807129, "global_step": 242651, "epoch": 1444} {"train_loss": -12.071303367614746, "global_step": 242652, "epoch": 1444} {"train_loss": -10.974554061889648, "global_step": 242653, "epoch": 1444} {"train_loss": -10.917769432067871, "global_step": 242654, "epoch": 1444} {"train_loss": -11.484344482421875, "global_step": 242655, "epoch": 1444} {"train_loss": -11.14828872680664, "global_step": 242656, "epoch": 1444} {"train_loss": -9.461359024047852, "global_step": 242657, "epoch": 1444} {"train_loss": -10.958587646484375, "global_step": 242658, "epoch": 1444} {"train_loss": -11.500958442687988, "global_step": 242659, "epoch": 1444} {"train_loss": -10.165428161621094, "global_step": 242660, "epoch": 1444} {"train_loss": -11.69483470916748, "global_step": 242661, "epoch": 1444} {"train_loss": -9.642021179199219, "global_step": 242662, "epoch": 1444} {"train_loss": -11.209871292114258, "global_step": 242663, "epoch": 1444} {"train_loss": -10.079793930053711, "global_step": 242664, "epoch": 1444} {"train_loss": -10.141172409057617, "global_step": 242665, "epoch": 1444} {"train_loss": -11.15011215209961, "global_step": 242666, "epoch": 1444} {"train_loss": -10.727171897888184, "global_step": 242667, "epoch": 1444} {"train_loss": -11.506513595581055, "global_step": 242668, "epoch": 1444} {"train_loss": -10.627009391784668, "global_step": 242669, "epoch": 1444} {"train_loss": -11.444099426269531, "global_step": 242670, "epoch": 1444} {"train_loss": -11.31277084350586, "global_step": 242671, "epoch": 1444} {"train_loss": -11.889190673828125, "global_step": 242672, "epoch": 1444} {"train_loss": -11.362010955810547, "global_step": 242673, "epoch": 1444} {"train_loss": -11.307243347167969, "global_step": 242674, "epoch": 1444} {"train_loss": -11.254655838012695, "global_step": 242675, "epoch": 1444} {"train_loss": -11.626166343688965, "global_step": 242676, "epoch": 1444} {"train_loss": -11.443236351013184, "global_step": 242677, "epoch": 1444} {"train_loss": -11.699803352355957, "global_step": 242678, "epoch": 1444} {"train_loss": -11.62094497680664, "global_step": 242679, "epoch": 1444} {"train_loss": -11.51266098022461, "global_step": 242680, "epoch": 1444} {"train_loss": -11.891593933105469, "global_step": 242681, "epoch": 1444} {"train_loss": -11.455425262451172, "global_step": 242682, "epoch": 1444} {"train_loss": -11.825353622436523, "global_step": 242683, "epoch": 1444} {"train_loss": -11.522436141967773, "global_step": 242684, "epoch": 1444} {"train_loss": -11.705047607421875, "global_step": 242685, "epoch": 1444} {"train_loss": -11.60602855682373, "global_step": 242686, "epoch": 1444} {"train_loss": -11.517499923706055, "global_step": 242687, "epoch": 1444} {"train_loss": -11.796869277954102, "global_step": 242688, "epoch": 1444} {"train_loss": -11.572771072387695, "global_step": 242689, "epoch": 1444} {"train_loss": -11.635042190551758, "global_step": 242690, "epoch": 1444} {"train_loss": -11.302302360534668, "global_step": 242691, "epoch": 1444} {"train_loss": -11.93344497680664, "global_step": 242692, "epoch": 1444} {"train_loss": -11.292360305786133, "global_step": 242693, "epoch": 1444} {"train_loss": -12.024545669555664, "global_step": 242694, "epoch": 1444} {"train_loss": -11.494479179382324, "global_step": 242695, "epoch": 1444} {"train_loss": -11.764698028564453, "global_step": 242696, "epoch": 1444} {"train_loss": -11.892860412597656, "global_step": 242697, "epoch": 1444} {"train_loss": -11.871758460998535, "global_step": 242698, "epoch": 1444} {"train_loss": -12.017977714538574, "global_step": 242699, "epoch": 1444} {"train_loss": -11.805301666259766, "global_step": 242700, "epoch": 1444} {"train_loss": -11.85184097290039, "global_step": 242701, "epoch": 1444} {"train_loss": -11.706893920898438, "global_step": 242702, "epoch": 1444} {"train_loss": -11.908562660217285, "global_step": 242703, "epoch": 1444} {"train_loss": -12.07382583618164, "global_step": 242704, "epoch": 1444} {"train_loss": -12.003939628601074, "global_step": 242705, "epoch": 1444} {"train_loss": -11.827655792236328, "global_step": 242706, "epoch": 1444} {"train_loss": -12.102083206176758, "global_step": 242707, "epoch": 1444} {"train_loss": -12.002530097961426, "global_step": 242708, "epoch": 1444} {"train_loss": -12.100167274475098, "global_step": 242709, "epoch": 1444} {"train_loss": -11.928889274597168, "global_step": 242710, "epoch": 1444} {"train_loss": -12.130393981933594, "global_step": 242711, "epoch": 1444} {"train_loss": -11.94929313659668, "global_step": 242712, "epoch": 1444} {"train_loss": -12.097736358642578, "global_step": 242713, "epoch": 1444} {"train_loss": -12.112300872802734, "global_step": 242714, "epoch": 1444} {"train_loss": -11.791034698486328, "global_step": 242715, "epoch": 1444} {"train_loss": -12.152061462402344, "global_step": 242716, "epoch": 1444} {"train_loss": -12.014394760131836, "global_step": 242717, "epoch": 1444} {"train_loss": -11.902633666992188, "global_step": 242718, "epoch": 1444} {"train_loss": -12.151874542236328, "global_step": 242719, "epoch": 1444} {"train_loss": -12.183727264404297, "global_step": 242720, "epoch": 1444} {"train_loss": -11.942485809326172, "global_step": 242721, "epoch": 1444} {"train_loss": -12.016294479370117, "global_step": 242722, "epoch": 1444} {"train_loss": -11.94333267211914, "global_step": 242723, "epoch": 1444} {"train_loss": -12.009794235229492, "global_step": 242724, "epoch": 1444} {"train_loss": -11.738783836364746, "global_step": 242725, "epoch": 1444} {"train_loss": -11.967978477478027, "global_step": 242726, "epoch": 1444} {"train_loss": -11.97732162475586, "global_step": 242727, "epoch": 1444} {"train_loss": -11.81698226928711, "global_step": 242728, "epoch": 1444} {"train_loss": -11.94015884399414, "global_step": 242729, "epoch": 1444} {"train_loss": -11.923681259155273, "global_step": 242730, "epoch": 1444} {"train_loss": -11.812350273132324, "global_step": 242731, "epoch": 1444} {"train_loss": -11.72558307647705, "global_step": 242732, "epoch": 1444} {"train_loss": -10.865023612976074, "global_step": 242733, "epoch": 1444} {"train_loss": -10.662012100219727, "global_step": 242734, "epoch": 1444} {"train_loss": -11.657880783081055, "global_step": 242735, "epoch": 1444} {"train_loss": -11.698399543762207, "global_step": 242736, "epoch": 1444} {"train_loss": -11.197298049926758, "global_step": 242737, "epoch": 1444} {"train_loss": -11.363532066345215, "global_step": 242738, "epoch": 1444} {"train_loss": -10.910850524902344, "global_step": 242739, "epoch": 1444} {"train_loss": -11.45968246459961, "global_step": 242740, "epoch": 1444} {"train_loss": -11.852624893188477, "global_step": 242741, "epoch": 1444} {"train_loss": -11.561234474182129, "global_step": 242742, "epoch": 1444} {"train_loss": -11.406500816345215, "global_step": 242743, "epoch": 1444} {"train_loss": -11.720711708068848, "global_step": 242744, "epoch": 1444} {"train_loss": -11.469377517700195, "global_step": 242745, "epoch": 1444} {"train_loss": -11.519506454467773, "global_step": 242746, "epoch": 1444} {"train_loss": -11.208921432495117, "global_step": 242747, "epoch": 1444} {"train_loss": -11.527730941772461, "global_step": 242748, "epoch": 1444} {"train_loss": -11.457529067993164, "global_step": 242749, "epoch": 1444} {"train_loss": -11.512622833251953, "global_step": 242750, "epoch": 1444} {"train_loss": -11.449748992919922, "global_step": 242751, "epoch": 1444} {"train_loss": -12.066238403320312, "global_step": 242752, "epoch": 1444} {"train_loss": -11.473282814025879, "global_step": 242753, "epoch": 1444} {"train_loss": -11.616473197937012, "global_step": 242754, "epoch": 1444} {"train_loss": -11.089794158935547, "global_step": 242755, "epoch": 1444} {"train_loss": -11.254380226135254, "global_step": 242756, "epoch": 1444} {"train_loss": -11.143632888793945, "global_step": 242757, "epoch": 1444} {"train_loss": -11.868803024291992, "global_step": 242758, "epoch": 1444} {"train_loss": -11.669364503451757, "global_step": 242759, "epoch": 1444, "val_loss": 267588.71875} {"train_loss": -11.208316802978516, "global_step": 242760, "epoch": 1445} {"train_loss": -11.454154968261719, "global_step": 242761, "epoch": 1445} {"train_loss": -11.838809967041016, "global_step": 242762, "epoch": 1445} {"train_loss": -11.401496887207031, "global_step": 242763, "epoch": 1445} {"train_loss": -11.514581680297852, "global_step": 242764, "epoch": 1445} {"train_loss": -11.548672676086426, "global_step": 242765, "epoch": 1445} {"train_loss": -11.692590713500977, "global_step": 242766, "epoch": 1445} {"train_loss": -11.481180191040039, "global_step": 242767, "epoch": 1445} {"train_loss": -11.727755546569824, "global_step": 242768, "epoch": 1445} {"train_loss": -11.188568115234375, "global_step": 242769, "epoch": 1445} {"train_loss": -11.603483200073242, "global_step": 242770, "epoch": 1445} {"train_loss": -11.51880931854248, "global_step": 242771, "epoch": 1445} {"train_loss": -11.529642105102539, "global_step": 242772, "epoch": 1445} {"train_loss": -11.671297073364258, "global_step": 242773, "epoch": 1445} {"train_loss": -11.465938568115234, "global_step": 242774, "epoch": 1445} {"train_loss": -11.918753623962402, "global_step": 242775, "epoch": 1445} {"train_loss": -11.710994720458984, "global_step": 242776, "epoch": 1445} {"train_loss": -11.768211364746094, "global_step": 242777, "epoch": 1445} {"train_loss": -11.425158500671387, "global_step": 242778, "epoch": 1445} {"train_loss": -11.637332916259766, "global_step": 242779, "epoch": 1445} {"train_loss": -11.260066986083984, "global_step": 242780, "epoch": 1445} {"train_loss": -11.549921989440918, "global_step": 242781, "epoch": 1445} {"train_loss": -11.537757873535156, "global_step": 242782, "epoch": 1445} {"train_loss": -11.613641738891602, "global_step": 242783, "epoch": 1445} {"train_loss": -11.686842918395996, "global_step": 242784, "epoch": 1445} {"train_loss": -11.17318344116211, "global_step": 242785, "epoch": 1445} {"train_loss": -11.594802856445312, "global_step": 242786, "epoch": 1445} {"train_loss": -11.255258560180664, "global_step": 242787, "epoch": 1445} {"train_loss": -11.597445487976074, "global_step": 242788, "epoch": 1445} {"train_loss": -11.34153938293457, "global_step": 242789, "epoch": 1445} {"train_loss": -11.012533187866211, "global_step": 242790, "epoch": 1445} {"train_loss": -11.473652839660645, "global_step": 242791, "epoch": 1445} {"train_loss": -11.119061470031738, "global_step": 242792, "epoch": 1445} {"train_loss": -11.726699829101562, "global_step": 242793, "epoch": 1445} {"train_loss": -11.056982040405273, "global_step": 242794, "epoch": 1445} {"train_loss": -11.614664077758789, "global_step": 242795, "epoch": 1445} {"train_loss": -11.055076599121094, "global_step": 242796, "epoch": 1445} {"train_loss": -10.63205337524414, "global_step": 242797, "epoch": 1445} {"train_loss": -11.731249809265137, "global_step": 242798, "epoch": 1445} {"train_loss": -10.696921348571777, "global_step": 242799, "epoch": 1445} {"train_loss": -11.740335464477539, "global_step": 242800, "epoch": 1445} {"train_loss": -11.193293571472168, "global_step": 242801, "epoch": 1445} {"train_loss": -11.094499588012695, "global_step": 242802, "epoch": 1445} {"train_loss": -10.852394104003906, "global_step": 242803, "epoch": 1445} {"train_loss": -10.83221435546875, "global_step": 242804, "epoch": 1445} {"train_loss": -10.667285919189453, "global_step": 242805, "epoch": 1445} {"train_loss": -11.610301971435547, "global_step": 242806, "epoch": 1445} {"train_loss": -10.687058448791504, "global_step": 242807, "epoch": 1445} {"train_loss": -11.61856746673584, "global_step": 242808, "epoch": 1445} {"train_loss": -11.159553527832031, "global_step": 242809, "epoch": 1445} {"train_loss": -11.522859573364258, "global_step": 242810, "epoch": 1445} {"train_loss": -11.609390258789062, "global_step": 242811, "epoch": 1445} {"train_loss": -11.294824600219727, "global_step": 242812, "epoch": 1445} {"train_loss": -11.382204055786133, "global_step": 242813, "epoch": 1445} {"train_loss": -10.882952690124512, "global_step": 242814, "epoch": 1445} {"train_loss": -11.451570510864258, "global_step": 242815, "epoch": 1445} {"train_loss": -10.662038803100586, "global_step": 242816, "epoch": 1445} {"train_loss": -11.711166381835938, "global_step": 242817, "epoch": 1445} {"train_loss": -10.744888305664062, "global_step": 242818, "epoch": 1445} {"train_loss": -11.577407836914062, "global_step": 242819, "epoch": 1445} {"train_loss": -11.111528396606445, "global_step": 242820, "epoch": 1445} {"train_loss": -11.435515403747559, "global_step": 242821, "epoch": 1445} {"train_loss": -11.685125350952148, "global_step": 242822, "epoch": 1445} {"train_loss": -11.080854415893555, "global_step": 242823, "epoch": 1445} {"train_loss": -11.742124557495117, "global_step": 242824, "epoch": 1445} {"train_loss": -11.385119438171387, "global_step": 242825, "epoch": 1445} {"train_loss": -11.428975105285645, "global_step": 242826, "epoch": 1445} {"train_loss": -11.870491981506348, "global_step": 242827, "epoch": 1445} {"train_loss": -11.378369331359863, "global_step": 242828, "epoch": 1445} {"train_loss": -11.964546203613281, "global_step": 242829, "epoch": 1445} {"train_loss": -11.516107559204102, "global_step": 242830, "epoch": 1445} {"train_loss": -11.665942192077637, "global_step": 242831, "epoch": 1445} {"train_loss": -11.86075210571289, "global_step": 242832, "epoch": 1445} {"train_loss": -11.61193561553955, "global_step": 242833, "epoch": 1445} {"train_loss": -11.83752155303955, "global_step": 242834, "epoch": 1445} {"train_loss": -11.747913360595703, "global_step": 242835, "epoch": 1445} {"train_loss": -11.87136173248291, "global_step": 242836, "epoch": 1445} {"train_loss": -11.720566749572754, "global_step": 242837, "epoch": 1445} {"train_loss": -11.764338493347168, "global_step": 242838, "epoch": 1445} {"train_loss": -11.894038200378418, "global_step": 242839, "epoch": 1445} {"train_loss": -11.632631301879883, "global_step": 242840, "epoch": 1445} {"train_loss": -11.860920906066895, "global_step": 242841, "epoch": 1445} {"train_loss": -11.799442291259766, "global_step": 242842, "epoch": 1445} {"train_loss": -11.878223419189453, "global_step": 242843, "epoch": 1445} {"train_loss": -11.72266674041748, "global_step": 242844, "epoch": 1445} {"train_loss": -11.71155071258545, "global_step": 242845, "epoch": 1445} {"train_loss": -11.89531135559082, "global_step": 242846, "epoch": 1445} {"train_loss": -11.940333366394043, "global_step": 242847, "epoch": 1445} {"train_loss": -12.134967803955078, "global_step": 242848, "epoch": 1445} {"train_loss": -11.659852981567383, "global_step": 242849, "epoch": 1445} {"train_loss": -11.810253143310547, "global_step": 242850, "epoch": 1445} {"train_loss": -12.081499099731445, "global_step": 242851, "epoch": 1445} {"train_loss": -12.144655227661133, "global_step": 242852, "epoch": 1445} {"train_loss": -11.903778076171875, "global_step": 242853, "epoch": 1445} {"train_loss": -12.041711807250977, "global_step": 242854, "epoch": 1445} {"train_loss": -11.818683624267578, "global_step": 242855, "epoch": 1445} {"train_loss": -12.1392183303833, "global_step": 242856, "epoch": 1445} {"train_loss": -11.912092208862305, "global_step": 242857, "epoch": 1445} {"train_loss": -11.910240173339844, "global_step": 242858, "epoch": 1445} {"train_loss": -11.719327926635742, "global_step": 242859, "epoch": 1445} {"train_loss": -12.010374069213867, "global_step": 242860, "epoch": 1445} {"train_loss": -11.858592987060547, "global_step": 242861, "epoch": 1445} {"train_loss": -11.695040702819824, "global_step": 242862, "epoch": 1445} {"train_loss": -12.173513412475586, "global_step": 242863, "epoch": 1445} {"train_loss": -11.819249153137207, "global_step": 242864, "epoch": 1445} {"train_loss": -11.481059074401855, "global_step": 242865, "epoch": 1445} {"train_loss": -11.916153907775879, "global_step": 242866, "epoch": 1445} {"train_loss": -12.143750190734863, "global_step": 242867, "epoch": 1445} {"train_loss": -11.617181777954102, "global_step": 242868, "epoch": 1445} {"train_loss": -12.144707679748535, "global_step": 242869, "epoch": 1445} {"train_loss": -12.192079544067383, "global_step": 242870, "epoch": 1445} {"train_loss": -11.547255516052246, "global_step": 242871, "epoch": 1445} {"train_loss": -11.496269226074219, "global_step": 242872, "epoch": 1445} {"train_loss": -12.168537139892578, "global_step": 242873, "epoch": 1445} {"train_loss": -11.82645034790039, "global_step": 242874, "epoch": 1445} {"train_loss": -12.049335479736328, "global_step": 242875, "epoch": 1445} {"train_loss": -11.890281677246094, "global_step": 242876, "epoch": 1445} {"train_loss": -11.777972221374512, "global_step": 242877, "epoch": 1445} {"train_loss": -11.702945709228516, "global_step": 242878, "epoch": 1445} {"train_loss": -12.11840534210205, "global_step": 242879, "epoch": 1445} {"train_loss": -11.626104354858398, "global_step": 242880, "epoch": 1445} {"train_loss": -11.74032211303711, "global_step": 242881, "epoch": 1445} {"train_loss": -11.681297302246094, "global_step": 242882, "epoch": 1445} {"train_loss": -12.239456176757812, "global_step": 242883, "epoch": 1445} {"train_loss": -11.555971145629883, "global_step": 242884, "epoch": 1445} {"train_loss": -11.686439514160156, "global_step": 242885, "epoch": 1445} {"train_loss": -11.821457862854004, "global_step": 242886, "epoch": 1445} {"train_loss": -12.069660186767578, "global_step": 242887, "epoch": 1445} {"train_loss": -11.804780960083008, "global_step": 242888, "epoch": 1445} {"train_loss": -11.906597137451172, "global_step": 242889, "epoch": 1445} {"train_loss": -12.135138511657715, "global_step": 242890, "epoch": 1445} {"train_loss": -11.92988395690918, "global_step": 242891, "epoch": 1445} {"train_loss": -11.916902542114258, "global_step": 242892, "epoch": 1445} {"train_loss": -12.30681037902832, "global_step": 242893, "epoch": 1445} {"train_loss": -11.563276290893555, "global_step": 242894, "epoch": 1445} {"train_loss": -10.8455810546875, "global_step": 242895, "epoch": 1445} {"train_loss": -11.198587417602539, "global_step": 242896, "epoch": 1445} {"train_loss": -11.522653579711914, "global_step": 242897, "epoch": 1445} {"train_loss": -9.804348945617676, "global_step": 242898, "epoch": 1445} {"train_loss": -11.284320831298828, "global_step": 242899, "epoch": 1445} {"train_loss": -10.473960876464844, "global_step": 242900, "epoch": 1445} {"train_loss": -10.700571060180664, "global_step": 242901, "epoch": 1445} {"train_loss": -11.619074821472168, "global_step": 242902, "epoch": 1445} {"train_loss": -10.03386402130127, "global_step": 242903, "epoch": 1445} {"train_loss": -11.299907684326172, "global_step": 242904, "epoch": 1445} {"train_loss": -10.517261505126953, "global_step": 242905, "epoch": 1445} {"train_loss": -10.725359916687012, "global_step": 242906, "epoch": 1445} {"train_loss": -10.589677810668945, "global_step": 242907, "epoch": 1445} {"train_loss": -9.299240112304688, "global_step": 242908, "epoch": 1445} {"train_loss": -9.271119117736816, "global_step": 242909, "epoch": 1445} {"train_loss": -8.924708366394043, "global_step": 242910, "epoch": 1445} {"train_loss": -9.545980453491211, "global_step": 242911, "epoch": 1445} {"train_loss": -9.660990715026855, "global_step": 242912, "epoch": 1445} {"train_loss": -9.005457878112793, "global_step": 242913, "epoch": 1445} {"train_loss": -10.12307357788086, "global_step": 242914, "epoch": 1445} {"train_loss": -9.582633972167969, "global_step": 242915, "epoch": 1445} {"train_loss": -9.687637329101562, "global_step": 242916, "epoch": 1445} {"train_loss": -9.645437240600586, "global_step": 242917, "epoch": 1445} {"train_loss": -9.954082489013672, "global_step": 242918, "epoch": 1445} {"train_loss": -10.522921562194824, "global_step": 242919, "epoch": 1445} {"train_loss": -10.27010726928711, "global_step": 242920, "epoch": 1445} {"train_loss": -10.953570365905762, "global_step": 242921, "epoch": 1445} {"train_loss": -10.208248138427734, "global_step": 242922, "epoch": 1445} {"train_loss": -11.33883285522461, "global_step": 242923, "epoch": 1445} {"train_loss": -10.836193084716797, "global_step": 242924, "epoch": 1445} {"train_loss": -10.483312606811523, "global_step": 242925, "epoch": 1445} {"train_loss": -10.969303131103516, "global_step": 242926, "epoch": 1445} {"train_loss": -11.370323788552056, "global_step": 242927, "epoch": 1445, "val_loss": 259197.71875, "train_action_mse_error": 0.5837104320526123} {"train_loss": -10.607717514038086, "global_step": 242928, "epoch": 1446} {"train_loss": -11.57101058959961, "global_step": 242929, "epoch": 1446} {"train_loss": -10.873037338256836, "global_step": 242930, "epoch": 1446} {"train_loss": -10.977020263671875, "global_step": 242931, "epoch": 1446} {"train_loss": -11.311803817749023, "global_step": 242932, "epoch": 1446} {"train_loss": -11.295317649841309, "global_step": 242933, "epoch": 1446} {"train_loss": -11.101958274841309, "global_step": 242934, "epoch": 1446} {"train_loss": -11.316259384155273, "global_step": 242935, "epoch": 1446} {"train_loss": -10.932819366455078, "global_step": 242936, "epoch": 1446} {"train_loss": -11.11517333984375, "global_step": 242937, "epoch": 1446} {"train_loss": -11.063142776489258, "global_step": 242938, "epoch": 1446} {"train_loss": -11.245256423950195, "global_step": 242939, "epoch": 1446} {"train_loss": -11.403154373168945, "global_step": 242940, "epoch": 1446} {"train_loss": -11.686246871948242, "global_step": 242941, "epoch": 1446} {"train_loss": -11.613635063171387, "global_step": 242942, "epoch": 1446} {"train_loss": -11.641603469848633, "global_step": 242943, "epoch": 1446} {"train_loss": -11.794573783874512, "global_step": 242944, "epoch": 1446} {"train_loss": -11.553511619567871, "global_step": 242945, "epoch": 1446} {"train_loss": -11.56142807006836, "global_step": 242946, "epoch": 1446} {"train_loss": -11.595617294311523, "global_step": 242947, "epoch": 1446} {"train_loss": -11.534875869750977, "global_step": 242948, "epoch": 1446} {"train_loss": -11.786483764648438, "global_step": 242949, "epoch": 1446} {"train_loss": -11.677604675292969, "global_step": 242950, "epoch": 1446} {"train_loss": -11.593527793884277, "global_step": 242951, "epoch": 1446} {"train_loss": -11.881927490234375, "global_step": 242952, "epoch": 1446} {"train_loss": -11.713335037231445, "global_step": 242953, "epoch": 1446} {"train_loss": -11.669057846069336, "global_step": 242954, "epoch": 1446} {"train_loss": -11.670440673828125, "global_step": 242955, "epoch": 1446} {"train_loss": -11.59970760345459, "global_step": 242956, "epoch": 1446} {"train_loss": -11.875545501708984, "global_step": 242957, "epoch": 1446} {"train_loss": -11.687281608581543, "global_step": 242958, "epoch": 1446} {"train_loss": -11.88541316986084, "global_step": 242959, "epoch": 1446} {"train_loss": -11.662460327148438, "global_step": 242960, "epoch": 1446} {"train_loss": -11.822272300720215, "global_step": 242961, "epoch": 1446} {"train_loss": -11.723551750183105, "global_step": 242962, "epoch": 1446} {"train_loss": -12.07071590423584, "global_step": 242963, "epoch": 1446} {"train_loss": -11.756258010864258, "global_step": 242964, "epoch": 1446} {"train_loss": -11.934355735778809, "global_step": 242965, "epoch": 1446} {"train_loss": -11.673820495605469, "global_step": 242966, "epoch": 1446} {"train_loss": -11.952973365783691, "global_step": 242967, "epoch": 1446} {"train_loss": -11.924932479858398, "global_step": 242968, "epoch": 1446} {"train_loss": -12.01147174835205, "global_step": 242969, "epoch": 1446} {"train_loss": -12.059196472167969, "global_step": 242970, "epoch": 1446} {"train_loss": -12.100423812866211, "global_step": 242971, "epoch": 1446} {"train_loss": -11.863822937011719, "global_step": 242972, "epoch": 1446} {"train_loss": -11.972719192504883, "global_step": 242973, "epoch": 1446} {"train_loss": -11.951055526733398, "global_step": 242974, "epoch": 1446} {"train_loss": -11.764074325561523, "global_step": 242975, "epoch": 1446} {"train_loss": -11.94820785522461, "global_step": 242976, "epoch": 1446} {"train_loss": -12.003609657287598, "global_step": 242977, "epoch": 1446} {"train_loss": -12.146385192871094, "global_step": 242978, "epoch": 1446} {"train_loss": -12.085606575012207, "global_step": 242979, "epoch": 1446} {"train_loss": -12.19832706451416, "global_step": 242980, "epoch": 1446} {"train_loss": -11.870461463928223, "global_step": 242981, "epoch": 1446} {"train_loss": -12.09133243560791, "global_step": 242982, "epoch": 1446} {"train_loss": -11.967447280883789, "global_step": 242983, "epoch": 1446} {"train_loss": -12.111499786376953, "global_step": 242984, "epoch": 1446} {"train_loss": -11.98045539855957, "global_step": 242985, "epoch": 1446} {"train_loss": -12.13265609741211, "global_step": 242986, "epoch": 1446} {"train_loss": -11.914220809936523, "global_step": 242987, "epoch": 1446} {"train_loss": -11.752700805664062, "global_step": 242988, "epoch": 1446} {"train_loss": -11.948318481445312, "global_step": 242989, "epoch": 1446} {"train_loss": -11.881080627441406, "global_step": 242990, "epoch": 1446} {"train_loss": -12.058343887329102, "global_step": 242991, "epoch": 1446} {"train_loss": -12.04144287109375, "global_step": 242992, "epoch": 1446} {"train_loss": -12.034123420715332, "global_step": 242993, "epoch": 1446} {"train_loss": -12.168702125549316, "global_step": 242994, "epoch": 1446} {"train_loss": -11.927718162536621, "global_step": 242995, "epoch": 1446} {"train_loss": -12.192276000976562, "global_step": 242996, "epoch": 1446} {"train_loss": -12.099000930786133, "global_step": 242997, "epoch": 1446} {"train_loss": -11.79043197631836, "global_step": 242998, "epoch": 1446} {"train_loss": -12.232879638671875, "global_step": 242999, "epoch": 1446} {"train_loss": -11.921056747436523, "global_step": 243000, "epoch": 1446} {"train_loss": -12.04481315612793, "global_step": 243001, "epoch": 1446} {"train_loss": -12.177068710327148, "global_step": 243002, "epoch": 1446} {"train_loss": -12.177736282348633, "global_step": 243003, "epoch": 1446} {"train_loss": -12.13035774230957, "global_step": 243004, "epoch": 1446} {"train_loss": -12.055586814880371, "global_step": 243005, "epoch": 1446} {"train_loss": -12.026289939880371, "global_step": 243006, "epoch": 1446} {"train_loss": -11.930559158325195, "global_step": 243007, "epoch": 1446} {"train_loss": -12.109405517578125, "global_step": 243008, "epoch": 1446} {"train_loss": -11.870161056518555, "global_step": 243009, "epoch": 1446} {"train_loss": -12.012413024902344, "global_step": 243010, "epoch": 1446} {"train_loss": -11.7841215133667, "global_step": 243011, "epoch": 1446} {"train_loss": -11.814066886901855, "global_step": 243012, "epoch": 1446} {"train_loss": -12.005462646484375, "global_step": 243013, "epoch": 1446} {"train_loss": -11.952374458312988, "global_step": 243014, "epoch": 1446} {"train_loss": -11.943470001220703, "global_step": 243015, "epoch": 1446} {"train_loss": -11.870849609375, "global_step": 243016, "epoch": 1446} {"train_loss": -11.882655143737793, "global_step": 243017, "epoch": 1446} {"train_loss": -12.002639770507812, "global_step": 243018, "epoch": 1446} {"train_loss": -11.566780090332031, "global_step": 243019, "epoch": 1446} {"train_loss": -11.808220863342285, "global_step": 243020, "epoch": 1446} {"train_loss": -11.146158218383789, "global_step": 243021, "epoch": 1446} {"train_loss": -11.596162796020508, "global_step": 243022, "epoch": 1446} {"train_loss": -12.136553764343262, "global_step": 243023, "epoch": 1446} {"train_loss": -11.377388000488281, "global_step": 243024, "epoch": 1446} {"train_loss": -11.231581687927246, "global_step": 243025, "epoch": 1446} {"train_loss": -11.284711837768555, "global_step": 243026, "epoch": 1446} {"train_loss": -11.474611282348633, "global_step": 243027, "epoch": 1446} {"train_loss": -11.388786315917969, "global_step": 243028, "epoch": 1446} {"train_loss": -10.589921951293945, "global_step": 243029, "epoch": 1446} {"train_loss": -8.87563419342041, "global_step": 243030, "epoch": 1446} {"train_loss": -10.757596969604492, "global_step": 243031, "epoch": 1446} {"train_loss": -8.016246795654297, "global_step": 243032, "epoch": 1446} {"train_loss": -8.901843070983887, "global_step": 243033, "epoch": 1446} {"train_loss": -7.1167683601379395, "global_step": 243034, "epoch": 1446} {"train_loss": -7.2704315185546875, "global_step": 243035, "epoch": 1446} {"train_loss": -7.760008811950684, "global_step": 243036, "epoch": 1446} {"train_loss": -9.022562026977539, "global_step": 243037, "epoch": 1446} {"train_loss": -9.364381790161133, "global_step": 243038, "epoch": 1446} {"train_loss": -9.431929588317871, "global_step": 243039, "epoch": 1446} {"train_loss": -9.5753173828125, "global_step": 243040, "epoch": 1446} {"train_loss": -10.470693588256836, "global_step": 243041, "epoch": 1446} {"train_loss": -11.121835708618164, "global_step": 243042, "epoch": 1446} {"train_loss": -11.058941841125488, "global_step": 243043, "epoch": 1446} {"train_loss": -10.51211929321289, "global_step": 243044, "epoch": 1446} {"train_loss": -9.965361595153809, "global_step": 243045, "epoch": 1446} {"train_loss": -10.933298110961914, "global_step": 243046, "epoch": 1446} {"train_loss": -11.081518173217773, "global_step": 243047, "epoch": 1446} {"train_loss": -11.116788864135742, "global_step": 243048, "epoch": 1446} {"train_loss": -11.138848304748535, "global_step": 243049, "epoch": 1446} {"train_loss": -11.211692810058594, "global_step": 243050, "epoch": 1446} {"train_loss": -10.787357330322266, "global_step": 243051, "epoch": 1446} {"train_loss": -10.852149963378906, "global_step": 243052, "epoch": 1446} {"train_loss": -11.010984420776367, "global_step": 243053, "epoch": 1446} {"train_loss": -10.87967586517334, "global_step": 243054, "epoch": 1446} {"train_loss": -11.228196144104004, "global_step": 243055, "epoch": 1446} {"train_loss": -11.050766944885254, "global_step": 243056, "epoch": 1446} {"train_loss": -11.51698112487793, "global_step": 243057, "epoch": 1446} {"train_loss": -11.123204231262207, "global_step": 243058, "epoch": 1446} {"train_loss": -11.670807838439941, "global_step": 243059, "epoch": 1446} {"train_loss": -11.378875732421875, "global_step": 243060, "epoch": 1446} {"train_loss": -11.57620620727539, "global_step": 243061, "epoch": 1446} {"train_loss": -11.356277465820312, "global_step": 243062, "epoch": 1446} {"train_loss": -11.497117042541504, "global_step": 243063, "epoch": 1446} {"train_loss": -11.470726013183594, "global_step": 243064, "epoch": 1446} {"train_loss": -11.637321472167969, "global_step": 243065, "epoch": 1446} {"train_loss": -11.589385032653809, "global_step": 243066, "epoch": 1446} {"train_loss": -11.763594627380371, "global_step": 243067, "epoch": 1446} {"train_loss": -11.562414169311523, "global_step": 243068, "epoch": 1446} {"train_loss": -11.548707962036133, "global_step": 243069, "epoch": 1446} {"train_loss": -11.508527755737305, "global_step": 243070, "epoch": 1446} {"train_loss": -11.6533203125, "global_step": 243071, "epoch": 1446} {"train_loss": -11.439994812011719, "global_step": 243072, "epoch": 1446} {"train_loss": -11.86743450164795, "global_step": 243073, "epoch": 1446} {"train_loss": -11.752641677856445, "global_step": 243074, "epoch": 1446} {"train_loss": -11.887128829956055, "global_step": 243075, "epoch": 1446} {"train_loss": -11.621745109558105, "global_step": 243076, "epoch": 1446} {"train_loss": -11.763564109802246, "global_step": 243077, "epoch": 1446} {"train_loss": -11.490171432495117, "global_step": 243078, "epoch": 1446} {"train_loss": -11.676958084106445, "global_step": 243079, "epoch": 1446} {"train_loss": -11.767533302307129, "global_step": 243080, "epoch": 1446} {"train_loss": -11.891447067260742, "global_step": 243081, "epoch": 1446} {"train_loss": -11.777608871459961, "global_step": 243082, "epoch": 1446} {"train_loss": -11.938177108764648, "global_step": 243083, "epoch": 1446} {"train_loss": -12.040740966796875, "global_step": 243084, "epoch": 1446} {"train_loss": -11.787517547607422, "global_step": 243085, "epoch": 1446} {"train_loss": -11.965662956237793, "global_step": 243086, "epoch": 1446} {"train_loss": -12.031795501708984, "global_step": 243087, "epoch": 1446} {"train_loss": -11.821205139160156, "global_step": 243088, "epoch": 1446} {"train_loss": -11.808693885803223, "global_step": 243089, "epoch": 1446} {"train_loss": -11.97839069366455, "global_step": 243090, "epoch": 1446} {"train_loss": -11.935800552368164, "global_step": 243091, "epoch": 1446} {"train_loss": -11.739416122436523, "global_step": 243092, "epoch": 1446} {"train_loss": -11.8485746383667, "global_step": 243093, "epoch": 1446} {"train_loss": -11.754964828491211, "global_step": 243094, "epoch": 1446} {"train_loss": -11.465401379835038, "global_step": 243095, "epoch": 1446, "val_loss": 261891.9375} {"train_loss": -11.80833625793457, "global_step": 243096, "epoch": 1447} {"train_loss": -12.038959503173828, "global_step": 243097, "epoch": 1447} {"train_loss": -11.987765312194824, "global_step": 243098, "epoch": 1447} {"train_loss": -12.107011795043945, "global_step": 243099, "epoch": 1447} {"train_loss": -11.773432731628418, "global_step": 243100, "epoch": 1447} {"train_loss": -11.931553840637207, "global_step": 243101, "epoch": 1447} {"train_loss": -12.16221809387207, "global_step": 243102, "epoch": 1447} {"train_loss": -11.674028396606445, "global_step": 243103, "epoch": 1447} {"train_loss": -11.981788635253906, "global_step": 243104, "epoch": 1447} {"train_loss": -12.054244041442871, "global_step": 243105, "epoch": 1447} {"train_loss": -11.732793807983398, "global_step": 243106, "epoch": 1447} {"train_loss": -11.477646827697754, "global_step": 243107, "epoch": 1447} {"train_loss": -12.072948455810547, "global_step": 243108, "epoch": 1447} {"train_loss": -11.387922286987305, "global_step": 243109, "epoch": 1447} {"train_loss": -11.290131568908691, "global_step": 243110, "epoch": 1447} {"train_loss": -11.855279922485352, "global_step": 243111, "epoch": 1447} {"train_loss": -11.688008308410645, "global_step": 243112, "epoch": 1447} {"train_loss": -11.474910736083984, "global_step": 243113, "epoch": 1447} {"train_loss": -11.309907913208008, "global_step": 243114, "epoch": 1447} {"train_loss": -11.78840446472168, "global_step": 243115, "epoch": 1447} {"train_loss": -11.451045989990234, "global_step": 243116, "epoch": 1447} {"train_loss": -11.368894577026367, "global_step": 243117, "epoch": 1447} {"train_loss": -11.642463684082031, "global_step": 243118, "epoch": 1447} {"train_loss": -11.574746131896973, "global_step": 243119, "epoch": 1447} {"train_loss": -11.737922668457031, "global_step": 243120, "epoch": 1447} {"train_loss": -11.638800621032715, "global_step": 243121, "epoch": 1447} {"train_loss": -11.68266487121582, "global_step": 243122, "epoch": 1447} {"train_loss": -11.399955749511719, "global_step": 243123, "epoch": 1447} {"train_loss": -12.133374214172363, "global_step": 243124, "epoch": 1447} {"train_loss": -11.591026306152344, "global_step": 243125, "epoch": 1447} {"train_loss": -11.501538276672363, "global_step": 243126, "epoch": 1447} {"train_loss": -11.903387069702148, "global_step": 243127, "epoch": 1447} {"train_loss": -11.874839782714844, "global_step": 243128, "epoch": 1447} {"train_loss": -11.842365264892578, "global_step": 243129, "epoch": 1447} {"train_loss": -11.598487854003906, "global_step": 243130, "epoch": 1447} {"train_loss": -11.954880714416504, "global_step": 243131, "epoch": 1447} {"train_loss": -11.61446762084961, "global_step": 243132, "epoch": 1447} {"train_loss": -11.547840118408203, "global_step": 243133, "epoch": 1447} {"train_loss": -11.759664535522461, "global_step": 243134, "epoch": 1447} {"train_loss": -11.806161880493164, "global_step": 243135, "epoch": 1447} {"train_loss": -11.92668342590332, "global_step": 243136, "epoch": 1447} {"train_loss": -12.114706039428711, "global_step": 243137, "epoch": 1447} {"train_loss": -11.649521827697754, "global_step": 243138, "epoch": 1447} {"train_loss": -11.557649612426758, "global_step": 243139, "epoch": 1447} {"train_loss": -11.642778396606445, "global_step": 243140, "epoch": 1447} {"train_loss": -11.817216873168945, "global_step": 243141, "epoch": 1447} {"train_loss": -11.528631210327148, "global_step": 243142, "epoch": 1447} {"train_loss": -11.642382621765137, "global_step": 243143, "epoch": 1447} {"train_loss": -11.52005386352539, "global_step": 243144, "epoch": 1447} {"train_loss": -10.46029281616211, "global_step": 243145, "epoch": 1447} {"train_loss": -11.599272727966309, "global_step": 243146, "epoch": 1447} {"train_loss": -10.790926933288574, "global_step": 243147, "epoch": 1447} {"train_loss": -11.502327919006348, "global_step": 243148, "epoch": 1447} {"train_loss": -10.839909553527832, "global_step": 243149, "epoch": 1447} {"train_loss": -12.034440994262695, "global_step": 243150, "epoch": 1447} {"train_loss": -11.32595443725586, "global_step": 243151, "epoch": 1447} {"train_loss": -11.184608459472656, "global_step": 243152, "epoch": 1447} {"train_loss": -11.448514938354492, "global_step": 243153, "epoch": 1447} {"train_loss": -10.9324951171875, "global_step": 243154, "epoch": 1447} {"train_loss": -11.54736328125, "global_step": 243155, "epoch": 1447} {"train_loss": -11.279825210571289, "global_step": 243156, "epoch": 1447} {"train_loss": -11.799595832824707, "global_step": 243157, "epoch": 1447} {"train_loss": -11.448452949523926, "global_step": 243158, "epoch": 1447} {"train_loss": -11.60648250579834, "global_step": 243159, "epoch": 1447} {"train_loss": -11.730135917663574, "global_step": 243160, "epoch": 1447} {"train_loss": -11.876091003417969, "global_step": 243161, "epoch": 1447} {"train_loss": -11.979719161987305, "global_step": 243162, "epoch": 1447} {"train_loss": -11.747148513793945, "global_step": 243163, "epoch": 1447} {"train_loss": -11.629717826843262, "global_step": 243164, "epoch": 1447} {"train_loss": -12.015277862548828, "global_step": 243165, "epoch": 1447} {"train_loss": -11.6228609085083, "global_step": 243166, "epoch": 1447} {"train_loss": -12.036111831665039, "global_step": 243167, "epoch": 1447} {"train_loss": -11.964337348937988, "global_step": 243168, "epoch": 1447} {"train_loss": -11.84496021270752, "global_step": 243169, "epoch": 1447} {"train_loss": -11.526567459106445, "global_step": 243170, "epoch": 1447} {"train_loss": -11.88064193725586, "global_step": 243171, "epoch": 1447} {"train_loss": -12.04544448852539, "global_step": 243172, "epoch": 1447} {"train_loss": -11.718954086303711, "global_step": 243173, "epoch": 1447} {"train_loss": -11.939048767089844, "global_step": 243174, "epoch": 1447} {"train_loss": -11.938186645507812, "global_step": 243175, "epoch": 1447} {"train_loss": -12.00306510925293, "global_step": 243176, "epoch": 1447} {"train_loss": -11.87258529663086, "global_step": 243177, "epoch": 1447} {"train_loss": -11.965751647949219, "global_step": 243178, "epoch": 1447} {"train_loss": -11.863313674926758, "global_step": 243179, "epoch": 1447} {"train_loss": -11.86408519744873, "global_step": 243180, "epoch": 1447} {"train_loss": -12.191999435424805, "global_step": 243181, "epoch": 1447} {"train_loss": -12.045698165893555, "global_step": 243182, "epoch": 1447} {"train_loss": -12.101850509643555, "global_step": 243183, "epoch": 1447} {"train_loss": -11.735612869262695, "global_step": 243184, "epoch": 1447} {"train_loss": -12.19430160522461, "global_step": 243185, "epoch": 1447} {"train_loss": -11.97262191772461, "global_step": 243186, "epoch": 1447} {"train_loss": -12.082725524902344, "global_step": 243187, "epoch": 1447} {"train_loss": -12.03453540802002, "global_step": 243188, "epoch": 1447} {"train_loss": -12.227598190307617, "global_step": 243189, "epoch": 1447} {"train_loss": -12.13125228881836, "global_step": 243190, "epoch": 1447} {"train_loss": -12.304702758789062, "global_step": 243191, "epoch": 1447} {"train_loss": -11.544450759887695, "global_step": 243192, "epoch": 1447} {"train_loss": -11.829410552978516, "global_step": 243193, "epoch": 1447} {"train_loss": -12.275834083557129, "global_step": 243194, "epoch": 1447} {"train_loss": -11.727339744567871, "global_step": 243195, "epoch": 1447} {"train_loss": -11.403120040893555, "global_step": 243196, "epoch": 1447} {"train_loss": -10.61102294921875, "global_step": 243197, "epoch": 1447} {"train_loss": -10.345918655395508, "global_step": 243198, "epoch": 1447} {"train_loss": -11.840202331542969, "global_step": 243199, "epoch": 1447} {"train_loss": -10.534515380859375, "global_step": 243200, "epoch": 1447} {"train_loss": -9.773384094238281, "global_step": 243201, "epoch": 1447} {"train_loss": -11.240989685058594, "global_step": 243202, "epoch": 1447} {"train_loss": -10.767778396606445, "global_step": 243203, "epoch": 1447} {"train_loss": -10.502191543579102, "global_step": 243204, "epoch": 1447} {"train_loss": -11.012445449829102, "global_step": 243205, "epoch": 1447} {"train_loss": -11.518293380737305, "global_step": 243206, "epoch": 1447} {"train_loss": -11.159623146057129, "global_step": 243207, "epoch": 1447} {"train_loss": -11.072908401489258, "global_step": 243208, "epoch": 1447} {"train_loss": -11.40903091430664, "global_step": 243209, "epoch": 1447} {"train_loss": -10.822606086730957, "global_step": 243210, "epoch": 1447} {"train_loss": -10.91665267944336, "global_step": 243211, "epoch": 1447} {"train_loss": -11.144962310791016, "global_step": 243212, "epoch": 1447} {"train_loss": -9.878522872924805, "global_step": 243213, "epoch": 1447} {"train_loss": -10.85567855834961, "global_step": 243214, "epoch": 1447} {"train_loss": -9.96203899383545, "global_step": 243215, "epoch": 1447} {"train_loss": -11.374406814575195, "global_step": 243216, "epoch": 1447} {"train_loss": -9.539556503295898, "global_step": 243217, "epoch": 1447} {"train_loss": -11.428789138793945, "global_step": 243218, "epoch": 1447} {"train_loss": -10.961772918701172, "global_step": 243219, "epoch": 1447} {"train_loss": -10.867042541503906, "global_step": 243220, "epoch": 1447} {"train_loss": -11.105268478393555, "global_step": 243221, "epoch": 1447} {"train_loss": -11.018268585205078, "global_step": 243222, "epoch": 1447} {"train_loss": -11.293514251708984, "global_step": 243223, "epoch": 1447} {"train_loss": -11.346532821655273, "global_step": 243224, "epoch": 1447} {"train_loss": -10.755107879638672, "global_step": 243225, "epoch": 1447} {"train_loss": -11.251124382019043, "global_step": 243226, "epoch": 1447} {"train_loss": -10.903398513793945, "global_step": 243227, "epoch": 1447} {"train_loss": -11.310003280639648, "global_step": 243228, "epoch": 1447} {"train_loss": -10.861387252807617, "global_step": 243229, "epoch": 1447} {"train_loss": -11.202398300170898, "global_step": 243230, "epoch": 1447} {"train_loss": -11.230606079101562, "global_step": 243231, "epoch": 1447} {"train_loss": -11.012601852416992, "global_step": 243232, "epoch": 1447} {"train_loss": -11.667933464050293, "global_step": 243233, "epoch": 1447} {"train_loss": -11.070205688476562, "global_step": 243234, "epoch": 1447} {"train_loss": -11.262229919433594, "global_step": 243235, "epoch": 1447} {"train_loss": -11.071575164794922, "global_step": 243236, "epoch": 1447} {"train_loss": -11.762567520141602, "global_step": 243237, "epoch": 1447} {"train_loss": -11.485481262207031, "global_step": 243238, "epoch": 1447} {"train_loss": -11.481203079223633, "global_step": 243239, "epoch": 1447} {"train_loss": -11.689838409423828, "global_step": 243240, "epoch": 1447} {"train_loss": -11.446466445922852, "global_step": 243241, "epoch": 1447} {"train_loss": -11.668943405151367, "global_step": 243242, "epoch": 1447} {"train_loss": -11.384513854980469, "global_step": 243243, "epoch": 1447} {"train_loss": -11.64438247680664, "global_step": 243244, "epoch": 1447} {"train_loss": -11.579672813415527, "global_step": 243245, "epoch": 1447} {"train_loss": -11.660207748413086, "global_step": 243246, "epoch": 1447} {"train_loss": -11.490982055664062, "global_step": 243247, "epoch": 1447} {"train_loss": -11.817562103271484, "global_step": 243248, "epoch": 1447} {"train_loss": -11.57503604888916, "global_step": 243249, "epoch": 1447} {"train_loss": -11.668190002441406, "global_step": 243250, "epoch": 1447} {"train_loss": -11.421119689941406, "global_step": 243251, "epoch": 1447} {"train_loss": -11.690507888793945, "global_step": 243252, "epoch": 1447} {"train_loss": -11.810447692871094, "global_step": 243253, "epoch": 1447} {"train_loss": -12.069711685180664, "global_step": 243254, "epoch": 1447} {"train_loss": -11.52890396118164, "global_step": 243255, "epoch": 1447} {"train_loss": -11.844261169433594, "global_step": 243256, "epoch": 1447} {"train_loss": -11.760514259338379, "global_step": 243257, "epoch": 1447} {"train_loss": -11.642744064331055, "global_step": 243258, "epoch": 1447} {"train_loss": -11.588071823120117, "global_step": 243259, "epoch": 1447} {"train_loss": -11.606529235839844, "global_step": 243260, "epoch": 1447} {"train_loss": -11.954750061035156, "global_step": 243261, "epoch": 1447} {"train_loss": -12.024812698364258, "global_step": 243262, "epoch": 1447} {"train_loss": -11.5375364224116, "global_step": 243263, "epoch": 1447, "val_loss": 266293.9375} {"train_loss": -11.904609680175781, "global_step": 243264, "epoch": 1448} {"train_loss": -11.78134822845459, "global_step": 243265, "epoch": 1448} {"train_loss": -11.851520538330078, "global_step": 243266, "epoch": 1448} {"train_loss": -12.100687026977539, "global_step": 243267, "epoch": 1448} {"train_loss": -11.86609172821045, "global_step": 243268, "epoch": 1448} {"train_loss": -11.764402389526367, "global_step": 243269, "epoch": 1448} {"train_loss": -11.94648551940918, "global_step": 243270, "epoch": 1448} {"train_loss": -11.858892440795898, "global_step": 243271, "epoch": 1448} {"train_loss": -12.011920928955078, "global_step": 243272, "epoch": 1448} {"train_loss": -12.135964393615723, "global_step": 243273, "epoch": 1448} {"train_loss": -11.859624862670898, "global_step": 243274, "epoch": 1448} {"train_loss": -11.946046829223633, "global_step": 243275, "epoch": 1448} {"train_loss": -12.105416297912598, "global_step": 243276, "epoch": 1448} {"train_loss": -11.925262451171875, "global_step": 243277, "epoch": 1448} {"train_loss": -11.990935325622559, "global_step": 243278, "epoch": 1448} {"train_loss": -12.130915641784668, "global_step": 243279, "epoch": 1448} {"train_loss": -12.006392478942871, "global_step": 243280, "epoch": 1448} {"train_loss": -12.005826950073242, "global_step": 243281, "epoch": 1448} {"train_loss": -12.154081344604492, "global_step": 243282, "epoch": 1448} {"train_loss": -12.154309272766113, "global_step": 243283, "epoch": 1448} {"train_loss": -11.940230369567871, "global_step": 243284, "epoch": 1448} {"train_loss": -12.101860046386719, "global_step": 243285, "epoch": 1448} {"train_loss": -12.047052383422852, "global_step": 243286, "epoch": 1448} {"train_loss": -12.015506744384766, "global_step": 243287, "epoch": 1448} {"train_loss": -12.209854125976562, "global_step": 243288, "epoch": 1448} {"train_loss": -12.067489624023438, "global_step": 243289, "epoch": 1448} {"train_loss": -12.218528747558594, "global_step": 243290, "epoch": 1448} {"train_loss": -12.264490127563477, "global_step": 243291, "epoch": 1448} {"train_loss": -12.089212417602539, "global_step": 243292, "epoch": 1448} {"train_loss": -12.207454681396484, "global_step": 243293, "epoch": 1448} {"train_loss": -12.099686622619629, "global_step": 243294, "epoch": 1448} {"train_loss": -12.08169937133789, "global_step": 243295, "epoch": 1448} {"train_loss": -12.14990234375, "global_step": 243296, "epoch": 1448} {"train_loss": -11.809843063354492, "global_step": 243297, "epoch": 1448} {"train_loss": -12.043718338012695, "global_step": 243298, "epoch": 1448} {"train_loss": -12.275732040405273, "global_step": 243299, "epoch": 1448} {"train_loss": -11.866741180419922, "global_step": 243300, "epoch": 1448} {"train_loss": -11.432077407836914, "global_step": 243301, "epoch": 1448} {"train_loss": -11.74538803100586, "global_step": 243302, "epoch": 1448} {"train_loss": -11.0404691696167, "global_step": 243303, "epoch": 1448} {"train_loss": -10.867112159729004, "global_step": 243304, "epoch": 1448} {"train_loss": -11.371671676635742, "global_step": 243305, "epoch": 1448} {"train_loss": -10.595026969909668, "global_step": 243306, "epoch": 1448} {"train_loss": -10.144770622253418, "global_step": 243307, "epoch": 1448} {"train_loss": -11.686602592468262, "global_step": 243308, "epoch": 1448} {"train_loss": -11.361919403076172, "global_step": 243309, "epoch": 1448} {"train_loss": -10.739023208618164, "global_step": 243310, "epoch": 1448} {"train_loss": -11.583305358886719, "global_step": 243311, "epoch": 1448} {"train_loss": -11.817117691040039, "global_step": 243312, "epoch": 1448} {"train_loss": -11.475923538208008, "global_step": 243313, "epoch": 1448} {"train_loss": -11.42938232421875, "global_step": 243314, "epoch": 1448} {"train_loss": -11.14462947845459, "global_step": 243315, "epoch": 1448} {"train_loss": -11.748767852783203, "global_step": 243316, "epoch": 1448} {"train_loss": -10.8641996383667, "global_step": 243317, "epoch": 1448} {"train_loss": -10.29515552520752, "global_step": 243318, "epoch": 1448} {"train_loss": -11.26502799987793, "global_step": 243319, "epoch": 1448} {"train_loss": -10.991832733154297, "global_step": 243320, "epoch": 1448} {"train_loss": -9.970005989074707, "global_step": 243321, "epoch": 1448} {"train_loss": -11.373908042907715, "global_step": 243322, "epoch": 1448} {"train_loss": -9.055778503417969, "global_step": 243323, "epoch": 1448} {"train_loss": -11.645441055297852, "global_step": 243324, "epoch": 1448} {"train_loss": -9.1190185546875, "global_step": 243325, "epoch": 1448} {"train_loss": -11.59714126586914, "global_step": 243326, "epoch": 1448} {"train_loss": -10.069314956665039, "global_step": 243327, "epoch": 1448} {"train_loss": -10.250072479248047, "global_step": 243328, "epoch": 1448} {"train_loss": -10.518823623657227, "global_step": 243329, "epoch": 1448} {"train_loss": -9.608168601989746, "global_step": 243330, "epoch": 1448} {"train_loss": -10.916269302368164, "global_step": 243331, "epoch": 1448} {"train_loss": -9.36250114440918, "global_step": 243332, "epoch": 1448} {"train_loss": -11.304351806640625, "global_step": 243333, "epoch": 1448} {"train_loss": -10.131595611572266, "global_step": 243334, "epoch": 1448} {"train_loss": -10.576452255249023, "global_step": 243335, "epoch": 1448} {"train_loss": -10.239066123962402, "global_step": 243336, "epoch": 1448} {"train_loss": -11.342251777648926, "global_step": 243337, "epoch": 1448} {"train_loss": -10.087191581726074, "global_step": 243338, "epoch": 1448} {"train_loss": -10.81928825378418, "global_step": 243339, "epoch": 1448} {"train_loss": -10.637089729309082, "global_step": 243340, "epoch": 1448} {"train_loss": -11.136004447937012, "global_step": 243341, "epoch": 1448} {"train_loss": -10.549748420715332, "global_step": 243342, "epoch": 1448} {"train_loss": -10.96066665649414, "global_step": 243343, "epoch": 1448} {"train_loss": -11.182276725769043, "global_step": 243344, "epoch": 1448} {"train_loss": -11.263543128967285, "global_step": 243345, "epoch": 1448} {"train_loss": -11.430707931518555, "global_step": 243346, "epoch": 1448} {"train_loss": -11.514148712158203, "global_step": 243347, "epoch": 1448} {"train_loss": -11.063944816589355, "global_step": 243348, "epoch": 1448} {"train_loss": -11.390926361083984, "global_step": 243349, "epoch": 1448} {"train_loss": -11.243900299072266, "global_step": 243350, "epoch": 1448} {"train_loss": -11.099620819091797, "global_step": 243351, "epoch": 1448} {"train_loss": -11.715845108032227, "global_step": 243352, "epoch": 1448} {"train_loss": -11.372970581054688, "global_step": 243353, "epoch": 1448} {"train_loss": -11.509045600891113, "global_step": 243354, "epoch": 1448} {"train_loss": -11.11524772644043, "global_step": 243355, "epoch": 1448} {"train_loss": -11.723325729370117, "global_step": 243356, "epoch": 1448} {"train_loss": -11.406810760498047, "global_step": 243357, "epoch": 1448} {"train_loss": -11.281717300415039, "global_step": 243358, "epoch": 1448} {"train_loss": -11.521648406982422, "global_step": 243359, "epoch": 1448} {"train_loss": -11.464792251586914, "global_step": 243360, "epoch": 1448} {"train_loss": -11.809621810913086, "global_step": 243361, "epoch": 1448} {"train_loss": -11.38679313659668, "global_step": 243362, "epoch": 1448} {"train_loss": -11.662019729614258, "global_step": 243363, "epoch": 1448} {"train_loss": -11.724797248840332, "global_step": 243364, "epoch": 1448} {"train_loss": -11.50700569152832, "global_step": 243365, "epoch": 1448} {"train_loss": -11.533157348632812, "global_step": 243366, "epoch": 1448} {"train_loss": -11.746849060058594, "global_step": 243367, "epoch": 1448} {"train_loss": -11.70849323272705, "global_step": 243368, "epoch": 1448} {"train_loss": -11.442190170288086, "global_step": 243369, "epoch": 1448} {"train_loss": -11.557432174682617, "global_step": 243370, "epoch": 1448} {"train_loss": -11.758012771606445, "global_step": 243371, "epoch": 1448} {"train_loss": -11.712778091430664, "global_step": 243372, "epoch": 1448} {"train_loss": -11.656052589416504, "global_step": 243373, "epoch": 1448} {"train_loss": -11.524778366088867, "global_step": 243374, "epoch": 1448} {"train_loss": -11.7913179397583, "global_step": 243375, "epoch": 1448} {"train_loss": -11.935503005981445, "global_step": 243376, "epoch": 1448} {"train_loss": -11.935107231140137, "global_step": 243377, "epoch": 1448} {"train_loss": -11.811532974243164, "global_step": 243378, "epoch": 1448} {"train_loss": -11.898175239562988, "global_step": 243379, "epoch": 1448} {"train_loss": -11.792705535888672, "global_step": 243380, "epoch": 1448} {"train_loss": -11.806640625, "global_step": 243381, "epoch": 1448} {"train_loss": -11.90713119506836, "global_step": 243382, "epoch": 1448} {"train_loss": -11.710517883300781, "global_step": 243383, "epoch": 1448} {"train_loss": -11.97679328918457, "global_step": 243384, "epoch": 1448} {"train_loss": -12.012065887451172, "global_step": 243385, "epoch": 1448} {"train_loss": -11.689350128173828, "global_step": 243386, "epoch": 1448} {"train_loss": -11.941967010498047, "global_step": 243387, "epoch": 1448} {"train_loss": -11.759468078613281, "global_step": 243388, "epoch": 1448} {"train_loss": -11.835941314697266, "global_step": 243389, "epoch": 1448} {"train_loss": -11.994197845458984, "global_step": 243390, "epoch": 1448} {"train_loss": -11.830955505371094, "global_step": 243391, "epoch": 1448} {"train_loss": -11.912370681762695, "global_step": 243392, "epoch": 1448} {"train_loss": -12.02795696258545, "global_step": 243393, "epoch": 1448} {"train_loss": -11.660829544067383, "global_step": 243394, "epoch": 1448} {"train_loss": -12.156268119812012, "global_step": 243395, "epoch": 1448} {"train_loss": -11.794660568237305, "global_step": 243396, "epoch": 1448} {"train_loss": -12.030166625976562, "global_step": 243397, "epoch": 1448} {"train_loss": -12.039152145385742, "global_step": 243398, "epoch": 1448} {"train_loss": -11.321385383605957, "global_step": 243399, "epoch": 1448} {"train_loss": -11.946869850158691, "global_step": 243400, "epoch": 1448} {"train_loss": -11.552497863769531, "global_step": 243401, "epoch": 1448} {"train_loss": -11.747049331665039, "global_step": 243402, "epoch": 1448} {"train_loss": -11.585590362548828, "global_step": 243403, "epoch": 1448} {"train_loss": -11.276589393615723, "global_step": 243404, "epoch": 1448} {"train_loss": -11.864728927612305, "global_step": 243405, "epoch": 1448} {"train_loss": -10.675092697143555, "global_step": 243406, "epoch": 1448} {"train_loss": -12.091072082519531, "global_step": 243407, "epoch": 1448} {"train_loss": -11.561287879943848, "global_step": 243408, "epoch": 1448} {"train_loss": -11.781765937805176, "global_step": 243409, "epoch": 1448} {"train_loss": -11.747976303100586, "global_step": 243410, "epoch": 1448} {"train_loss": -11.358733177185059, "global_step": 243411, "epoch": 1448} {"train_loss": -11.916868209838867, "global_step": 243412, "epoch": 1448} {"train_loss": -11.364324569702148, "global_step": 243413, "epoch": 1448} {"train_loss": -12.02800178527832, "global_step": 243414, "epoch": 1448} {"train_loss": -11.592412948608398, "global_step": 243415, "epoch": 1448} {"train_loss": -11.699850082397461, "global_step": 243416, "epoch": 1448} {"train_loss": -11.401957511901855, "global_step": 243417, "epoch": 1448} {"train_loss": -11.105293273925781, "global_step": 243418, "epoch": 1448} {"train_loss": -11.750972747802734, "global_step": 243419, "epoch": 1448} {"train_loss": -11.363183975219727, "global_step": 243420, "epoch": 1448} {"train_loss": -12.01248550415039, "global_step": 243421, "epoch": 1448} {"train_loss": -11.991180419921875, "global_step": 243422, "epoch": 1448} {"train_loss": -11.712562561035156, "global_step": 243423, "epoch": 1448} {"train_loss": -11.98653793334961, "global_step": 243424, "epoch": 1448} {"train_loss": -11.62325668334961, "global_step": 243425, "epoch": 1448} {"train_loss": -12.026922225952148, "global_step": 243426, "epoch": 1448} {"train_loss": -11.787318229675293, "global_step": 243427, "epoch": 1448} {"train_loss": -11.831775665283203, "global_step": 243428, "epoch": 1448} {"train_loss": -12.016464233398438, "global_step": 243429, "epoch": 1448} {"train_loss": -11.566595077514648, "global_step": 243430, "epoch": 1448} {"train_loss": -11.52429271311987, "global_step": 243431, "epoch": 1448, "val_loss": 266424.125} {"train_loss": -11.48725700378418, "global_step": 243432, "epoch": 1449} {"train_loss": -11.936518669128418, "global_step": 243433, "epoch": 1449} {"train_loss": -11.510860443115234, "global_step": 243434, "epoch": 1449} {"train_loss": -11.902694702148438, "global_step": 243435, "epoch": 1449} {"train_loss": -11.784902572631836, "global_step": 243436, "epoch": 1449} {"train_loss": -12.012367248535156, "global_step": 243437, "epoch": 1449} {"train_loss": -11.363201141357422, "global_step": 243438, "epoch": 1449} {"train_loss": -11.89272689819336, "global_step": 243439, "epoch": 1449} {"train_loss": -11.815784454345703, "global_step": 243440, "epoch": 1449} {"train_loss": -11.631546020507812, "global_step": 243441, "epoch": 1449} {"train_loss": -11.361366271972656, "global_step": 243442, "epoch": 1449} {"train_loss": -12.053871154785156, "global_step": 243443, "epoch": 1449} {"train_loss": -11.92314338684082, "global_step": 243444, "epoch": 1449} {"train_loss": -11.992888450622559, "global_step": 243445, "epoch": 1449} {"train_loss": -11.807262420654297, "global_step": 243446, "epoch": 1449} {"train_loss": -11.804084777832031, "global_step": 243447, "epoch": 1449} {"train_loss": -11.25906753540039, "global_step": 243448, "epoch": 1449} {"train_loss": -11.820145606994629, "global_step": 243449, "epoch": 1449} {"train_loss": -11.397252082824707, "global_step": 243450, "epoch": 1449} {"train_loss": -11.303146362304688, "global_step": 243451, "epoch": 1449} {"train_loss": -10.566757202148438, "global_step": 243452, "epoch": 1449} {"train_loss": -11.21610164642334, "global_step": 243453, "epoch": 1449} {"train_loss": -11.354923248291016, "global_step": 243454, "epoch": 1449} {"train_loss": -11.317621231079102, "global_step": 243455, "epoch": 1449} {"train_loss": -11.573172569274902, "global_step": 243456, "epoch": 1449} {"train_loss": -11.773784637451172, "global_step": 243457, "epoch": 1449} {"train_loss": -11.662506103515625, "global_step": 243458, "epoch": 1449} {"train_loss": -11.420355796813965, "global_step": 243459, "epoch": 1449} {"train_loss": -11.470022201538086, "global_step": 243460, "epoch": 1449} {"train_loss": -11.56620979309082, "global_step": 243461, "epoch": 1449} {"train_loss": -11.888145446777344, "global_step": 243462, "epoch": 1449} {"train_loss": -11.674295425415039, "global_step": 243463, "epoch": 1449} {"train_loss": -11.919191360473633, "global_step": 243464, "epoch": 1449} {"train_loss": -11.267204284667969, "global_step": 243465, "epoch": 1449} {"train_loss": -11.787797927856445, "global_step": 243466, "epoch": 1449} {"train_loss": -11.081071853637695, "global_step": 243467, "epoch": 1449} {"train_loss": -11.3548583984375, "global_step": 243468, "epoch": 1449} {"train_loss": -11.54791259765625, "global_step": 243469, "epoch": 1449} {"train_loss": -11.767586708068848, "global_step": 243470, "epoch": 1449} {"train_loss": -11.581536293029785, "global_step": 243471, "epoch": 1449} {"train_loss": -11.472770690917969, "global_step": 243472, "epoch": 1449} {"train_loss": -11.413618087768555, "global_step": 243473, "epoch": 1449} {"train_loss": -11.928689956665039, "global_step": 243474, "epoch": 1449} {"train_loss": -11.713459014892578, "global_step": 243475, "epoch": 1449} {"train_loss": -12.006736755371094, "global_step": 243476, "epoch": 1449} {"train_loss": -11.737749099731445, "global_step": 243477, "epoch": 1449} {"train_loss": -11.912935256958008, "global_step": 243478, "epoch": 1449} {"train_loss": -11.733245849609375, "global_step": 243479, "epoch": 1449} {"train_loss": -12.028274536132812, "global_step": 243480, "epoch": 1449} {"train_loss": -11.615814208984375, "global_step": 243481, "epoch": 1449} {"train_loss": -11.875301361083984, "global_step": 243482, "epoch": 1449} {"train_loss": -11.620828628540039, "global_step": 243483, "epoch": 1449} {"train_loss": -12.028303146362305, "global_step": 243484, "epoch": 1449} {"train_loss": -10.836341857910156, "global_step": 243485, "epoch": 1449} {"train_loss": -11.362543106079102, "global_step": 243486, "epoch": 1449} {"train_loss": -11.305896759033203, "global_step": 243487, "epoch": 1449} {"train_loss": -11.026378631591797, "global_step": 243488, "epoch": 1449} {"train_loss": -11.0963134765625, "global_step": 243489, "epoch": 1449} {"train_loss": -12.054435729980469, "global_step": 243490, "epoch": 1449} {"train_loss": -11.068602561950684, "global_step": 243491, "epoch": 1449} {"train_loss": -11.644366264343262, "global_step": 243492, "epoch": 1449} {"train_loss": -11.467679023742676, "global_step": 243493, "epoch": 1449} {"train_loss": -11.386362075805664, "global_step": 243494, "epoch": 1449} {"train_loss": -11.804346084594727, "global_step": 243495, "epoch": 1449} {"train_loss": -11.585821151733398, "global_step": 243496, "epoch": 1449} {"train_loss": -11.979308128356934, "global_step": 243497, "epoch": 1449} {"train_loss": -11.696311950683594, "global_step": 243498, "epoch": 1449} {"train_loss": -11.365909576416016, "global_step": 243499, "epoch": 1449} {"train_loss": -11.932499885559082, "global_step": 243500, "epoch": 1449} {"train_loss": -11.677469253540039, "global_step": 243501, "epoch": 1449} {"train_loss": -11.526741981506348, "global_step": 243502, "epoch": 1449} {"train_loss": -12.05021858215332, "global_step": 243503, "epoch": 1449} {"train_loss": -11.63456916809082, "global_step": 243504, "epoch": 1449} {"train_loss": -12.064667701721191, "global_step": 243505, "epoch": 1449} {"train_loss": -11.646203994750977, "global_step": 243506, "epoch": 1449} {"train_loss": -11.87999439239502, "global_step": 243507, "epoch": 1449} {"train_loss": -11.789517402648926, "global_step": 243508, "epoch": 1449} {"train_loss": -11.949559211730957, "global_step": 243509, "epoch": 1449} {"train_loss": -11.935986518859863, "global_step": 243510, "epoch": 1449} {"train_loss": -11.880584716796875, "global_step": 243511, "epoch": 1449} {"train_loss": -11.907683372497559, "global_step": 243512, "epoch": 1449} {"train_loss": -12.050497055053711, "global_step": 243513, "epoch": 1449} {"train_loss": -11.777082443237305, "global_step": 243514, "epoch": 1449} {"train_loss": -12.04902458190918, "global_step": 243515, "epoch": 1449} {"train_loss": -11.60435676574707, "global_step": 243516, "epoch": 1449} {"train_loss": -11.063196182250977, "global_step": 243517, "epoch": 1449} {"train_loss": -11.142477989196777, "global_step": 243518, "epoch": 1449} {"train_loss": -11.419679641723633, "global_step": 243519, "epoch": 1449} {"train_loss": -11.448164939880371, "global_step": 243520, "epoch": 1449} {"train_loss": -10.791455268859863, "global_step": 243521, "epoch": 1449} {"train_loss": -11.215914726257324, "global_step": 243522, "epoch": 1449} {"train_loss": -11.33080768585205, "global_step": 243523, "epoch": 1449} {"train_loss": -11.07783317565918, "global_step": 243524, "epoch": 1449} {"train_loss": -11.322543144226074, "global_step": 243525, "epoch": 1449} {"train_loss": -11.526765823364258, "global_step": 243526, "epoch": 1449} {"train_loss": -10.857059478759766, "global_step": 243527, "epoch": 1449} {"train_loss": -11.532608032226562, "global_step": 243528, "epoch": 1449} {"train_loss": -11.59106159210205, "global_step": 243529, "epoch": 1449} {"train_loss": -11.606461524963379, "global_step": 243530, "epoch": 1449} {"train_loss": -11.806954383850098, "global_step": 243531, "epoch": 1449} {"train_loss": -11.668535232543945, "global_step": 243532, "epoch": 1449} {"train_loss": -11.702262878417969, "global_step": 243533, "epoch": 1449} {"train_loss": -11.430912017822266, "global_step": 243534, "epoch": 1449} {"train_loss": -11.235170364379883, "global_step": 243535, "epoch": 1449} {"train_loss": -11.185760498046875, "global_step": 243536, "epoch": 1449} {"train_loss": -11.100528717041016, "global_step": 243537, "epoch": 1449} {"train_loss": -11.06325626373291, "global_step": 243538, "epoch": 1449} {"train_loss": -10.051340103149414, "global_step": 243539, "epoch": 1449} {"train_loss": -11.633247375488281, "global_step": 243540, "epoch": 1449} {"train_loss": -9.32408332824707, "global_step": 243541, "epoch": 1449} {"train_loss": -10.655570983886719, "global_step": 243542, "epoch": 1449} {"train_loss": -10.80741024017334, "global_step": 243543, "epoch": 1449} {"train_loss": -10.76124382019043, "global_step": 243544, "epoch": 1449} {"train_loss": -10.040997505187988, "global_step": 243545, "epoch": 1449} {"train_loss": -11.611727714538574, "global_step": 243546, "epoch": 1449} {"train_loss": -10.124921798706055, "global_step": 243547, "epoch": 1449} {"train_loss": -11.647644996643066, "global_step": 243548, "epoch": 1449} {"train_loss": -10.770174026489258, "global_step": 243549, "epoch": 1449} {"train_loss": -11.074759483337402, "global_step": 243550, "epoch": 1449} {"train_loss": -11.320856094360352, "global_step": 243551, "epoch": 1449} {"train_loss": -10.952648162841797, "global_step": 243552, "epoch": 1449} {"train_loss": -10.420028686523438, "global_step": 243553, "epoch": 1449} {"train_loss": -10.78355598449707, "global_step": 243554, "epoch": 1449} {"train_loss": -9.886398315429688, "global_step": 243555, "epoch": 1449} {"train_loss": -10.596598625183105, "global_step": 243556, "epoch": 1449} {"train_loss": -10.56866455078125, "global_step": 243557, "epoch": 1449} {"train_loss": -10.883203506469727, "global_step": 243558, "epoch": 1449} {"train_loss": -10.921279907226562, "global_step": 243559, "epoch": 1449} {"train_loss": -10.883631706237793, "global_step": 243560, "epoch": 1449} {"train_loss": -11.04147720336914, "global_step": 243561, "epoch": 1449} {"train_loss": -10.912651062011719, "global_step": 243562, "epoch": 1449} {"train_loss": -10.911029815673828, "global_step": 243563, "epoch": 1449} {"train_loss": -11.310340881347656, "global_step": 243564, "epoch": 1449} {"train_loss": -10.860672950744629, "global_step": 243565, "epoch": 1449} {"train_loss": -11.450407028198242, "global_step": 243566, "epoch": 1449} {"train_loss": -11.253754615783691, "global_step": 243567, "epoch": 1449} {"train_loss": -11.220829010009766, "global_step": 243568, "epoch": 1449} {"train_loss": -11.01470947265625, "global_step": 243569, "epoch": 1449} {"train_loss": -11.408838272094727, "global_step": 243570, "epoch": 1449} {"train_loss": -10.491281509399414, "global_step": 243571, "epoch": 1449} {"train_loss": -11.409648895263672, "global_step": 243572, "epoch": 1449} {"train_loss": -10.947367668151855, "global_step": 243573, "epoch": 1449} {"train_loss": -10.91415786743164, "global_step": 243574, "epoch": 1449} {"train_loss": -11.285520553588867, "global_step": 243575, "epoch": 1449} {"train_loss": -10.689998626708984, "global_step": 243576, "epoch": 1449} {"train_loss": -10.69304370880127, "global_step": 243577, "epoch": 1449} {"train_loss": -10.999734878540039, "global_step": 243578, "epoch": 1449} {"train_loss": -11.297626495361328, "global_step": 243579, "epoch": 1449} {"train_loss": -10.728937149047852, "global_step": 243580, "epoch": 1449} {"train_loss": -11.346845626831055, "global_step": 243581, "epoch": 1449} {"train_loss": -10.983495712280273, "global_step": 243582, "epoch": 1449} {"train_loss": -11.428095817565918, "global_step": 243583, "epoch": 1449} {"train_loss": -11.380578994750977, "global_step": 243584, "epoch": 1449} {"train_loss": -11.165619850158691, "global_step": 243585, "epoch": 1449} {"train_loss": -11.254587173461914, "global_step": 243586, "epoch": 1449} {"train_loss": -11.527962684631348, "global_step": 243587, "epoch": 1449} {"train_loss": -11.267216682434082, "global_step": 243588, "epoch": 1449} {"train_loss": -11.118900299072266, "global_step": 243589, "epoch": 1449} {"train_loss": -11.595076560974121, "global_step": 243590, "epoch": 1449} {"train_loss": -11.162601470947266, "global_step": 243591, "epoch": 1449} {"train_loss": -11.371936798095703, "global_step": 243592, "epoch": 1449} {"train_loss": -11.58909797668457, "global_step": 243593, "epoch": 1449} {"train_loss": -11.696738243103027, "global_step": 243594, "epoch": 1449} {"train_loss": -11.222827911376953, "global_step": 243595, "epoch": 1449} {"train_loss": -11.769302368164062, "global_step": 243596, "epoch": 1449} {"train_loss": -11.50361442565918, "global_step": 243597, "epoch": 1449} {"train_loss": -11.414319038391113, "global_step": 243598, "epoch": 1449} {"train_loss": -11.379664988744826, "global_step": 243599, "epoch": 1449, "val_loss": 268815.5} {"train_loss": -11.631538391113281, "global_step": 243600, "epoch": 1450} {"train_loss": -11.619731903076172, "global_step": 243601, "epoch": 1450} {"train_loss": -11.355384826660156, "global_step": 243602, "epoch": 1450} {"train_loss": -11.805282592773438, "global_step": 243603, "epoch": 1450} {"train_loss": -11.579676628112793, "global_step": 243604, "epoch": 1450} {"train_loss": -11.795900344848633, "global_step": 243605, "epoch": 1450} {"train_loss": -11.389907836914062, "global_step": 243606, "epoch": 1450} {"train_loss": -11.770025253295898, "global_step": 243607, "epoch": 1450} {"train_loss": -11.58271598815918, "global_step": 243608, "epoch": 1450} {"train_loss": -11.486435890197754, "global_step": 243609, "epoch": 1450} {"train_loss": -11.600629806518555, "global_step": 243610, "epoch": 1450} {"train_loss": -11.430803298950195, "global_step": 243611, "epoch": 1450} {"train_loss": -11.739452362060547, "global_step": 243612, "epoch": 1450} {"train_loss": -11.4605712890625, "global_step": 243613, "epoch": 1450} {"train_loss": -11.877277374267578, "global_step": 243614, "epoch": 1450} {"train_loss": -11.472387313842773, "global_step": 243615, "epoch": 1450} {"train_loss": -11.932779312133789, "global_step": 243616, "epoch": 1450} {"train_loss": -11.653022766113281, "global_step": 243617, "epoch": 1450} {"train_loss": -11.791738510131836, "global_step": 243618, "epoch": 1450} {"train_loss": -11.807609558105469, "global_step": 243619, "epoch": 1450} {"train_loss": -11.94469928741455, "global_step": 243620, "epoch": 1450} {"train_loss": -11.668513298034668, "global_step": 243621, "epoch": 1450} {"train_loss": -11.579692840576172, "global_step": 243622, "epoch": 1450} {"train_loss": -11.778776168823242, "global_step": 243623, "epoch": 1450} {"train_loss": -11.531269073486328, "global_step": 243624, "epoch": 1450} {"train_loss": -11.592239379882812, "global_step": 243625, "epoch": 1450} {"train_loss": -11.645665168762207, "global_step": 243626, "epoch": 1450} {"train_loss": -11.846955299377441, "global_step": 243627, "epoch": 1450} {"train_loss": -11.676492691040039, "global_step": 243628, "epoch": 1450} {"train_loss": -11.590347290039062, "global_step": 243629, "epoch": 1450} {"train_loss": -11.933601379394531, "global_step": 243630, "epoch": 1450} {"train_loss": -11.68212604522705, "global_step": 243631, "epoch": 1450} {"train_loss": -11.88707160949707, "global_step": 243632, "epoch": 1450} {"train_loss": -11.403339385986328, "global_step": 243633, "epoch": 1450} {"train_loss": -11.830013275146484, "global_step": 243634, "epoch": 1450} {"train_loss": -11.76658821105957, "global_step": 243635, "epoch": 1450} {"train_loss": -11.890003204345703, "global_step": 243636, "epoch": 1450} {"train_loss": -11.869789123535156, "global_step": 243637, "epoch": 1450} {"train_loss": -11.860660552978516, "global_step": 243638, "epoch": 1450} {"train_loss": -11.752492904663086, "global_step": 243639, "epoch": 1450} {"train_loss": -11.993417739868164, "global_step": 243640, "epoch": 1450} {"train_loss": -11.946982383728027, "global_step": 243641, "epoch": 1450} {"train_loss": -12.165809631347656, "global_step": 243642, "epoch": 1450} {"train_loss": -12.027031898498535, "global_step": 243643, "epoch": 1450} {"train_loss": -11.981800079345703, "global_step": 243644, "epoch": 1450} {"train_loss": -12.087041854858398, "global_step": 243645, "epoch": 1450} {"train_loss": -12.068169593811035, "global_step": 243646, "epoch": 1450} {"train_loss": -11.545331954956055, "global_step": 243647, "epoch": 1450} {"train_loss": -11.992328643798828, "global_step": 243648, "epoch": 1450} {"train_loss": -11.91435432434082, "global_step": 243649, "epoch": 1450} {"train_loss": -11.756793975830078, "global_step": 243650, "epoch": 1450} {"train_loss": -12.10820198059082, "global_step": 243651, "epoch": 1450} {"train_loss": -11.82886791229248, "global_step": 243652, "epoch": 1450} {"train_loss": -11.899528503417969, "global_step": 243653, "epoch": 1450} {"train_loss": -11.97148609161377, "global_step": 243654, "epoch": 1450} {"train_loss": -11.88667106628418, "global_step": 243655, "epoch": 1450} {"train_loss": -12.178350448608398, "global_step": 243656, "epoch": 1450} {"train_loss": -11.922072410583496, "global_step": 243657, "epoch": 1450} {"train_loss": -11.333810806274414, "global_step": 243658, "epoch": 1450} {"train_loss": -11.768024444580078, "global_step": 243659, "epoch": 1450} {"train_loss": -11.972858428955078, "global_step": 243660, "epoch": 1450} {"train_loss": -11.673248291015625, "global_step": 243661, "epoch": 1450} {"train_loss": -11.932519912719727, "global_step": 243662, "epoch": 1450} {"train_loss": -11.869302749633789, "global_step": 243663, "epoch": 1450} {"train_loss": -12.148290634155273, "global_step": 243664, "epoch": 1450} {"train_loss": -11.548851013183594, "global_step": 243665, "epoch": 1450} {"train_loss": -12.086896896362305, "global_step": 243666, "epoch": 1450} {"train_loss": -11.787755012512207, "global_step": 243667, "epoch": 1450} {"train_loss": -11.675704956054688, "global_step": 243668, "epoch": 1450} {"train_loss": -11.270992279052734, "global_step": 243669, "epoch": 1450} {"train_loss": -12.102889060974121, "global_step": 243670, "epoch": 1450} {"train_loss": -11.76357650756836, "global_step": 243671, "epoch": 1450} {"train_loss": -11.544916152954102, "global_step": 243672, "epoch": 1450} {"train_loss": -11.339054107666016, "global_step": 243673, "epoch": 1450} {"train_loss": -11.637350082397461, "global_step": 243674, "epoch": 1450} {"train_loss": -11.569595336914062, "global_step": 243675, "epoch": 1450} {"train_loss": -11.795629501342773, "global_step": 243676, "epoch": 1450} {"train_loss": -10.604915618896484, "global_step": 243677, "epoch": 1450} {"train_loss": -11.772491455078125, "global_step": 243678, "epoch": 1450} {"train_loss": -11.534369468688965, "global_step": 243679, "epoch": 1450} {"train_loss": -11.46776294708252, "global_step": 243680, "epoch": 1450} {"train_loss": -11.39215087890625, "global_step": 243681, "epoch": 1450} {"train_loss": -11.931068420410156, "global_step": 243682, "epoch": 1450} {"train_loss": -11.54312515258789, "global_step": 243683, "epoch": 1450} {"train_loss": -11.863996505737305, "global_step": 243684, "epoch": 1450} {"train_loss": -11.422056198120117, "global_step": 243685, "epoch": 1450} {"train_loss": -11.26314926147461, "global_step": 243686, "epoch": 1450} {"train_loss": -12.042524337768555, "global_step": 243687, "epoch": 1450} {"train_loss": -11.604982376098633, "global_step": 243688, "epoch": 1450} {"train_loss": -11.214005470275879, "global_step": 243689, "epoch": 1450} {"train_loss": -11.639660835266113, "global_step": 243690, "epoch": 1450} {"train_loss": -11.796127319335938, "global_step": 243691, "epoch": 1450} {"train_loss": -12.08639907836914, "global_step": 243692, "epoch": 1450} {"train_loss": -11.504522323608398, "global_step": 243693, "epoch": 1450} {"train_loss": -11.74104118347168, "global_step": 243694, "epoch": 1450} {"train_loss": -11.453121185302734, "global_step": 243695, "epoch": 1450} {"train_loss": -10.956581115722656, "global_step": 243696, "epoch": 1450} {"train_loss": -11.213361740112305, "global_step": 243697, "epoch": 1450} {"train_loss": -11.891999244689941, "global_step": 243698, "epoch": 1450} {"train_loss": -11.085441589355469, "global_step": 243699, "epoch": 1450} {"train_loss": -10.602401733398438, "global_step": 243700, "epoch": 1450} {"train_loss": -11.740438461303711, "global_step": 243701, "epoch": 1450} {"train_loss": -11.673592567443848, "global_step": 243702, "epoch": 1450} {"train_loss": -11.527013778686523, "global_step": 243703, "epoch": 1450} {"train_loss": -11.445718765258789, "global_step": 243704, "epoch": 1450} {"train_loss": -11.88471794128418, "global_step": 243705, "epoch": 1450} {"train_loss": -11.990592956542969, "global_step": 243706, "epoch": 1450} {"train_loss": -11.815263748168945, "global_step": 243707, "epoch": 1450} {"train_loss": -11.775802612304688, "global_step": 243708, "epoch": 1450} {"train_loss": -12.015684127807617, "global_step": 243709, "epoch": 1450} {"train_loss": -12.147842407226562, "global_step": 243710, "epoch": 1450} {"train_loss": -11.82267951965332, "global_step": 243711, "epoch": 1450} {"train_loss": -12.053309440612793, "global_step": 243712, "epoch": 1450} {"train_loss": -11.735345840454102, "global_step": 243713, "epoch": 1450} {"train_loss": -11.642114639282227, "global_step": 243714, "epoch": 1450} {"train_loss": -12.030611038208008, "global_step": 243715, "epoch": 1450} {"train_loss": -12.062565803527832, "global_step": 243716, "epoch": 1450} {"train_loss": -11.698474884033203, "global_step": 243717, "epoch": 1450} {"train_loss": -11.96046257019043, "global_step": 243718, "epoch": 1450} {"train_loss": -11.636690139770508, "global_step": 243719, "epoch": 1450} {"train_loss": -11.353248596191406, "global_step": 243720, "epoch": 1450} {"train_loss": -11.767987251281738, "global_step": 243721, "epoch": 1450} {"train_loss": -11.836214065551758, "global_step": 243722, "epoch": 1450} {"train_loss": -11.099299430847168, "global_step": 243723, "epoch": 1450} {"train_loss": -11.84199047088623, "global_step": 243724, "epoch": 1450} {"train_loss": -11.46877670288086, "global_step": 243725, "epoch": 1450} {"train_loss": -11.114109992980957, "global_step": 243726, "epoch": 1450} {"train_loss": -11.892427444458008, "global_step": 243727, "epoch": 1450} {"train_loss": -11.008216857910156, "global_step": 243728, "epoch": 1450} {"train_loss": -11.773961067199707, "global_step": 243729, "epoch": 1450} {"train_loss": -11.327260971069336, "global_step": 243730, "epoch": 1450} {"train_loss": -11.142356872558594, "global_step": 243731, "epoch": 1450} {"train_loss": -11.649213790893555, "global_step": 243732, "epoch": 1450} {"train_loss": -11.479787826538086, "global_step": 243733, "epoch": 1450} {"train_loss": -11.643531799316406, "global_step": 243734, "epoch": 1450} {"train_loss": -11.35281753540039, "global_step": 243735, "epoch": 1450} {"train_loss": -11.607766151428223, "global_step": 243736, "epoch": 1450} {"train_loss": -11.36237907409668, "global_step": 243737, "epoch": 1450} {"train_loss": -11.395824432373047, "global_step": 243738, "epoch": 1450} {"train_loss": -11.058574676513672, "global_step": 243739, "epoch": 1450} {"train_loss": -11.441837310791016, "global_step": 243740, "epoch": 1450} {"train_loss": -10.998735427856445, "global_step": 243741, "epoch": 1450} {"train_loss": -11.467004776000977, "global_step": 243742, "epoch": 1450} {"train_loss": -11.688371658325195, "global_step": 243743, "epoch": 1450} {"train_loss": -11.06984806060791, "global_step": 243744, "epoch": 1450} {"train_loss": -11.93961238861084, "global_step": 243745, "epoch": 1450} {"train_loss": -11.08000659942627, "global_step": 243746, "epoch": 1450} {"train_loss": -11.914678573608398, "global_step": 243747, "epoch": 1450} {"train_loss": -11.206108093261719, "global_step": 243748, "epoch": 1450} {"train_loss": -11.571163177490234, "global_step": 243749, "epoch": 1450} {"train_loss": -11.396798133850098, "global_step": 243750, "epoch": 1450} {"train_loss": -11.577611923217773, "global_step": 243751, "epoch": 1450} {"train_loss": -11.893159866333008, "global_step": 243752, "epoch": 1450} {"train_loss": -11.349958419799805, "global_step": 243753, "epoch": 1450} {"train_loss": -11.860926628112793, "global_step": 243754, "epoch": 1450} {"train_loss": -11.514022827148438, "global_step": 243755, "epoch": 1450} {"train_loss": -11.709306716918945, "global_step": 243756, "epoch": 1450} {"train_loss": -11.896356582641602, "global_step": 243757, "epoch": 1450} {"train_loss": -11.642905235290527, "global_step": 243758, "epoch": 1450} {"train_loss": -11.921557426452637, "global_step": 243759, "epoch": 1450} {"train_loss": -11.613578796386719, "global_step": 243760, "epoch": 1450} {"train_loss": -11.82453441619873, "global_step": 243761, "epoch": 1450} {"train_loss": -11.722369194030762, "global_step": 243762, "epoch": 1450} {"train_loss": -11.62996768951416, "global_step": 243763, "epoch": 1450} {"train_loss": -11.454299926757812, "global_step": 243764, "epoch": 1450} {"train_loss": -11.509215354919434, "global_step": 243765, "epoch": 1450} {"train_loss": -11.761999130249023, "global_step": 243766, "epoch": 1450} {"train_loss": -11.662459685688926, "global_step": 243767, "epoch": 1450, "train/sim_max_reward_0": 0.5320998558036961, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.11938000884042158, "train/sim_max_reward_4": 0.9651493138777412, "train/sim_max_reward_5": 0.5176274308183391, "test/sim_max_reward_4400000": 0.9839297912459425, "test/sim_max_reward_4400001": 0.36971101173178783, "test/sim_max_reward_4400002": 0.9316432724447428, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 0.7456064800130517, "test/sim_max_reward_4400005": 0.5555162631561007, "test/sim_max_reward_4400006": 0.9701105374166304, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 0.5507963375724764, "test/sim_max_reward_4400009": 0.027397513816128913, "test/sim_max_reward_4400010": 0.9643609230463317, "test/sim_max_reward_4400011": 0.9761404694248128, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.38656803656999805, "test/sim_max_reward_4400014": 0.9884153035880388, "test/sim_max_reward_4400015": 0.23376369376902714, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.8532474366432046, "test/sim_max_reward_4400019": 0.41562789164461655, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.563230298221606, "test/sim_max_reward_4400022": 0.9915138170941001, "test/sim_max_reward_4400023": 0.1752204896414274, "test/sim_max_reward_4400024": 0.42548245404408985, "test/sim_max_reward_4400025": 0.4910297070158143, "test/sim_max_reward_4400026": 0.06552612529842625, "test/sim_max_reward_4400027": 0.9522760493518617, "test/sim_max_reward_4400028": 0.17170416540490485, "test/sim_max_reward_4400029": 0.9805854057351209, "test/sim_max_reward_4400030": 0.9537264227529264, "test/sim_max_reward_4400031": 0.9858889023433103, "test/sim_max_reward_4400032": 0.03802410146360122, "test/sim_max_reward_4400033": 0.44698121137603786, "test/sim_max_reward_4400034": 0.9528877533684219, "test/sim_max_reward_4400035": 0.7655240536876987, "test/sim_max_reward_4400036": 0.41194728907836065, "test/sim_max_reward_4400037": 0.9642075825660845, "test/sim_max_reward_4400038": 0.31429369886113023, "test/sim_max_reward_4400039": 0.997364698899003, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.32055419721014455, "test/sim_max_reward_4400042": 0.03307459272394028, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.9984408509699451, "test/sim_max_reward_4400045": 0.5083232798286925, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 0.9518648486592088, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.2907587604361167, "train/mean_score": 0.5223761015566996, "test/mean_score": 0.5940695228744238, "val_loss": 264515.15625, "train_action_mse_error": 0.3730112612247467} {"train_loss": -11.864822387695312, "global_step": 243768, "epoch": 1451} {"train_loss": -11.43256664276123, "global_step": 243769, "epoch": 1451} {"train_loss": -11.81680679321289, "global_step": 243770, "epoch": 1451} {"train_loss": -11.486241340637207, "global_step": 243771, "epoch": 1451} {"train_loss": -11.659061431884766, "global_step": 243772, "epoch": 1451} {"train_loss": -11.736108779907227, "global_step": 243773, "epoch": 1451} {"train_loss": -12.007068634033203, "global_step": 243774, "epoch": 1451} {"train_loss": -11.824073791503906, "global_step": 243775, "epoch": 1451} {"train_loss": -11.461822509765625, "global_step": 243776, "epoch": 1451} {"train_loss": -12.100685119628906, "global_step": 243777, "epoch": 1451} {"train_loss": -11.545332908630371, "global_step": 243778, "epoch": 1451} {"train_loss": -11.759237289428711, "global_step": 243779, "epoch": 1451} {"train_loss": -11.894800186157227, "global_step": 243780, "epoch": 1451} {"train_loss": -11.760258674621582, "global_step": 243781, "epoch": 1451} {"train_loss": -11.73044204711914, "global_step": 243782, "epoch": 1451} {"train_loss": -11.73495101928711, "global_step": 243783, "epoch": 1451} {"train_loss": -11.41728401184082, "global_step": 243784, "epoch": 1451} {"train_loss": -11.785242080688477, "global_step": 243785, "epoch": 1451} {"train_loss": -11.651700019836426, "global_step": 243786, "epoch": 1451} {"train_loss": -11.653514862060547, "global_step": 243787, "epoch": 1451} {"train_loss": -11.544485092163086, "global_step": 243788, "epoch": 1451} {"train_loss": -11.696046829223633, "global_step": 243789, "epoch": 1451} {"train_loss": -11.749456405639648, "global_step": 243790, "epoch": 1451} {"train_loss": -11.88557243347168, "global_step": 243791, "epoch": 1451} {"train_loss": -11.552043914794922, "global_step": 243792, "epoch": 1451} {"train_loss": -11.88337230682373, "global_step": 243793, "epoch": 1451} {"train_loss": -11.753358840942383, "global_step": 243794, "epoch": 1451} {"train_loss": -11.81910228729248, "global_step": 243795, "epoch": 1451} {"train_loss": -11.354339599609375, "global_step": 243796, "epoch": 1451} {"train_loss": -11.48002815246582, "global_step": 243797, "epoch": 1451} {"train_loss": -11.947501182556152, "global_step": 243798, "epoch": 1451} {"train_loss": -10.881343841552734, "global_step": 243799, "epoch": 1451} {"train_loss": -11.522443771362305, "global_step": 243800, "epoch": 1451} {"train_loss": -11.450204849243164, "global_step": 243801, "epoch": 1451} {"train_loss": -11.891459465026855, "global_step": 243802, "epoch": 1451} {"train_loss": -11.128680229187012, "global_step": 243803, "epoch": 1451} {"train_loss": -11.03237247467041, "global_step": 243804, "epoch": 1451} {"train_loss": -11.610544204711914, "global_step": 243805, "epoch": 1451} {"train_loss": -11.831633567810059, "global_step": 243806, "epoch": 1451} {"train_loss": -11.416892051696777, "global_step": 243807, "epoch": 1451} {"train_loss": -11.435338020324707, "global_step": 243808, "epoch": 1451} {"train_loss": -12.082212448120117, "global_step": 243809, "epoch": 1451} {"train_loss": -11.581110954284668, "global_step": 243810, "epoch": 1451} {"train_loss": -11.571398735046387, "global_step": 243811, "epoch": 1451} {"train_loss": -11.667266845703125, "global_step": 243812, "epoch": 1451} {"train_loss": -10.865765571594238, "global_step": 243813, "epoch": 1451} {"train_loss": -11.056257247924805, "global_step": 243814, "epoch": 1451} {"train_loss": -11.734369277954102, "global_step": 243815, "epoch": 1451} {"train_loss": -11.31635856628418, "global_step": 243816, "epoch": 1451} {"train_loss": -10.274810791015625, "global_step": 243817, "epoch": 1451} {"train_loss": -11.067556381225586, "global_step": 243818, "epoch": 1451} {"train_loss": -10.144736289978027, "global_step": 243819, "epoch": 1451} {"train_loss": -10.363917350769043, "global_step": 243820, "epoch": 1451} {"train_loss": -10.229045867919922, "global_step": 243821, "epoch": 1451} {"train_loss": -9.837224006652832, "global_step": 243822, "epoch": 1451} {"train_loss": -10.755531311035156, "global_step": 243823, "epoch": 1451} {"train_loss": -10.138986587524414, "global_step": 243824, "epoch": 1451} {"train_loss": -10.310636520385742, "global_step": 243825, "epoch": 1451} {"train_loss": -10.302872657775879, "global_step": 243826, "epoch": 1451} {"train_loss": -10.617155075073242, "global_step": 243827, "epoch": 1451} {"train_loss": -10.562093734741211, "global_step": 243828, "epoch": 1451} {"train_loss": -9.851377487182617, "global_step": 243829, "epoch": 1451} {"train_loss": -10.958858489990234, "global_step": 243830, "epoch": 1451} {"train_loss": -9.871820449829102, "global_step": 243831, "epoch": 1451} {"train_loss": -11.376453399658203, "global_step": 243832, "epoch": 1451} {"train_loss": -10.27364730834961, "global_step": 243833, "epoch": 1451} {"train_loss": -10.849675178527832, "global_step": 243834, "epoch": 1451} {"train_loss": -10.893162727355957, "global_step": 243835, "epoch": 1451} {"train_loss": -11.268617630004883, "global_step": 243836, "epoch": 1451} {"train_loss": -11.194134712219238, "global_step": 243837, "epoch": 1451} {"train_loss": -11.602248191833496, "global_step": 243838, "epoch": 1451} {"train_loss": -11.093870162963867, "global_step": 243839, "epoch": 1451} {"train_loss": -11.601353645324707, "global_step": 243840, "epoch": 1451} {"train_loss": -11.133594512939453, "global_step": 243841, "epoch": 1451} {"train_loss": -11.217999458312988, "global_step": 243842, "epoch": 1451} {"train_loss": -11.417351722717285, "global_step": 243843, "epoch": 1451} {"train_loss": -11.246282577514648, "global_step": 243844, "epoch": 1451} {"train_loss": -11.516641616821289, "global_step": 243845, "epoch": 1451} {"train_loss": -11.720592498779297, "global_step": 243846, "epoch": 1451} {"train_loss": -11.474922180175781, "global_step": 243847, "epoch": 1451} {"train_loss": -11.72767448425293, "global_step": 243848, "epoch": 1451} {"train_loss": -11.401865005493164, "global_step": 243849, "epoch": 1451} {"train_loss": -11.355436325073242, "global_step": 243850, "epoch": 1451} {"train_loss": -11.417997360229492, "global_step": 243851, "epoch": 1451} {"train_loss": -11.72935676574707, "global_step": 243852, "epoch": 1451} {"train_loss": -11.391271591186523, "global_step": 243853, "epoch": 1451} {"train_loss": -11.66568374633789, "global_step": 243854, "epoch": 1451} {"train_loss": -11.231270790100098, "global_step": 243855, "epoch": 1451} {"train_loss": -11.654454231262207, "global_step": 243856, "epoch": 1451} {"train_loss": -11.667070388793945, "global_step": 243857, "epoch": 1451} {"train_loss": -11.767854690551758, "global_step": 243858, "epoch": 1451} {"train_loss": -11.68254280090332, "global_step": 243859, "epoch": 1451} {"train_loss": -11.727150917053223, "global_step": 243860, "epoch": 1451} {"train_loss": -11.53159236907959, "global_step": 243861, "epoch": 1451} {"train_loss": -11.943682670593262, "global_step": 243862, "epoch": 1451} {"train_loss": -11.671356201171875, "global_step": 243863, "epoch": 1451} {"train_loss": -11.79805850982666, "global_step": 243864, "epoch": 1451} {"train_loss": -11.272303581237793, "global_step": 243865, "epoch": 1451} {"train_loss": -11.858985900878906, "global_step": 243866, "epoch": 1451} {"train_loss": -11.675054550170898, "global_step": 243867, "epoch": 1451} {"train_loss": -11.746323585510254, "global_step": 243868, "epoch": 1451} {"train_loss": -11.88914680480957, "global_step": 243869, "epoch": 1451} {"train_loss": -11.799725532531738, "global_step": 243870, "epoch": 1451} {"train_loss": -11.643831253051758, "global_step": 243871, "epoch": 1451} {"train_loss": -11.8032865524292, "global_step": 243872, "epoch": 1451} {"train_loss": -11.63717269897461, "global_step": 243873, "epoch": 1451} {"train_loss": -11.924494743347168, "global_step": 243874, "epoch": 1451} {"train_loss": -11.873014450073242, "global_step": 243875, "epoch": 1451} {"train_loss": -11.800653457641602, "global_step": 243876, "epoch": 1451} {"train_loss": -11.926912307739258, "global_step": 243877, "epoch": 1451} {"train_loss": -11.893577575683594, "global_step": 243878, "epoch": 1451} {"train_loss": -11.798429489135742, "global_step": 243879, "epoch": 1451} {"train_loss": -12.005302429199219, "global_step": 243880, "epoch": 1451} {"train_loss": -11.976219177246094, "global_step": 243881, "epoch": 1451} {"train_loss": -11.871601104736328, "global_step": 243882, "epoch": 1451} {"train_loss": -11.580644607543945, "global_step": 243883, "epoch": 1451} {"train_loss": -11.827445030212402, "global_step": 243884, "epoch": 1451} {"train_loss": -11.439266204833984, "global_step": 243885, "epoch": 1451} {"train_loss": -11.949666976928711, "global_step": 243886, "epoch": 1451} {"train_loss": -11.758920669555664, "global_step": 243887, "epoch": 1451} {"train_loss": -11.813202857971191, "global_step": 243888, "epoch": 1451} {"train_loss": -11.43830394744873, "global_step": 243889, "epoch": 1451} {"train_loss": -11.525594711303711, "global_step": 243890, "epoch": 1451} {"train_loss": -11.253149032592773, "global_step": 243891, "epoch": 1451} {"train_loss": -11.37814712524414, "global_step": 243892, "epoch": 1451} {"train_loss": -11.021360397338867, "global_step": 243893, "epoch": 1451} {"train_loss": -11.503961563110352, "global_step": 243894, "epoch": 1451} {"train_loss": -11.35466194152832, "global_step": 243895, "epoch": 1451} {"train_loss": -11.812137603759766, "global_step": 243896, "epoch": 1451} {"train_loss": -11.656290054321289, "global_step": 243897, "epoch": 1451} {"train_loss": -11.82252025604248, "global_step": 243898, "epoch": 1451} {"train_loss": -11.424464225769043, "global_step": 243899, "epoch": 1451} {"train_loss": -11.77578353881836, "global_step": 243900, "epoch": 1451} {"train_loss": -11.776494026184082, "global_step": 243901, "epoch": 1451} {"train_loss": -11.66840648651123, "global_step": 243902, "epoch": 1451} {"train_loss": -11.797889709472656, "global_step": 243903, "epoch": 1451} {"train_loss": -11.506860733032227, "global_step": 243904, "epoch": 1451} {"train_loss": -12.002964973449707, "global_step": 243905, "epoch": 1451} {"train_loss": -11.344819068908691, "global_step": 243906, "epoch": 1451} {"train_loss": -10.89016342163086, "global_step": 243907, "epoch": 1451} {"train_loss": -10.990660667419434, "global_step": 243908, "epoch": 1451} {"train_loss": -11.346046447753906, "global_step": 243909, "epoch": 1451} {"train_loss": -10.79050350189209, "global_step": 243910, "epoch": 1451} {"train_loss": -11.427599906921387, "global_step": 243911, "epoch": 1451} {"train_loss": -10.739310264587402, "global_step": 243912, "epoch": 1451} {"train_loss": -11.718814849853516, "global_step": 243913, "epoch": 1451} {"train_loss": -10.66929817199707, "global_step": 243914, "epoch": 1451} {"train_loss": -11.804193496704102, "global_step": 243915, "epoch": 1451} {"train_loss": -10.870741844177246, "global_step": 243916, "epoch": 1451} {"train_loss": -11.540922164916992, "global_step": 243917, "epoch": 1451} {"train_loss": -11.3702392578125, "global_step": 243918, "epoch": 1451} {"train_loss": -11.30394172668457, "global_step": 243919, "epoch": 1451} {"train_loss": -11.518879890441895, "global_step": 243920, "epoch": 1451} {"train_loss": -11.11539077758789, "global_step": 243921, "epoch": 1451} {"train_loss": -10.319171905517578, "global_step": 243922, "epoch": 1451} {"train_loss": -11.591885566711426, "global_step": 243923, "epoch": 1451} {"train_loss": -10.260912895202637, "global_step": 243924, "epoch": 1451} {"train_loss": -11.735318183898926, "global_step": 243925, "epoch": 1451} {"train_loss": -11.257331848144531, "global_step": 243926, "epoch": 1451} {"train_loss": -10.853394508361816, "global_step": 243927, "epoch": 1451} {"train_loss": -12.05969524383545, "global_step": 243928, "epoch": 1451} {"train_loss": -11.170326232910156, "global_step": 243929, "epoch": 1451} {"train_loss": -11.645655632019043, "global_step": 243930, "epoch": 1451} {"train_loss": -11.392110824584961, "global_step": 243931, "epoch": 1451} {"train_loss": -11.612202644348145, "global_step": 243932, "epoch": 1451} {"train_loss": -11.804723739624023, "global_step": 243933, "epoch": 1451} {"train_loss": -11.65733814239502, "global_step": 243934, "epoch": 1451} {"train_loss": -11.423387902123588, "global_step": 243935, "epoch": 1451, "val_loss": 268629.34375} {"train_loss": -11.688863754272461, "global_step": 243936, "epoch": 1452} {"train_loss": -11.475625991821289, "global_step": 243937, "epoch": 1452} {"train_loss": -11.548043251037598, "global_step": 243938, "epoch": 1452} {"train_loss": -11.968498229980469, "global_step": 243939, "epoch": 1452} {"train_loss": -11.63735580444336, "global_step": 243940, "epoch": 1452} {"train_loss": -11.622260093688965, "global_step": 243941, "epoch": 1452} {"train_loss": -11.646788597106934, "global_step": 243942, "epoch": 1452} {"train_loss": -11.709431648254395, "global_step": 243943, "epoch": 1452} {"train_loss": -11.737470626831055, "global_step": 243944, "epoch": 1452} {"train_loss": -11.45706558227539, "global_step": 243945, "epoch": 1452} {"train_loss": -11.787076950073242, "global_step": 243946, "epoch": 1452} {"train_loss": -11.724441528320312, "global_step": 243947, "epoch": 1452} {"train_loss": -12.015664100646973, "global_step": 243948, "epoch": 1452} {"train_loss": -11.461935043334961, "global_step": 243949, "epoch": 1452} {"train_loss": -11.99992561340332, "global_step": 243950, "epoch": 1452} {"train_loss": -11.616637229919434, "global_step": 243951, "epoch": 1452} {"train_loss": -11.870809555053711, "global_step": 243952, "epoch": 1452} {"train_loss": -11.861551284790039, "global_step": 243953, "epoch": 1452} {"train_loss": -11.755725860595703, "global_step": 243954, "epoch": 1452} {"train_loss": -11.686418533325195, "global_step": 243955, "epoch": 1452} {"train_loss": -11.632549285888672, "global_step": 243956, "epoch": 1452} {"train_loss": -11.755233764648438, "global_step": 243957, "epoch": 1452} {"train_loss": -11.777952194213867, "global_step": 243958, "epoch": 1452} {"train_loss": -10.793537139892578, "global_step": 243959, "epoch": 1452} {"train_loss": -11.842409133911133, "global_step": 243960, "epoch": 1452} {"train_loss": -11.738321304321289, "global_step": 243961, "epoch": 1452} {"train_loss": -11.730228424072266, "global_step": 243962, "epoch": 1452} {"train_loss": -11.642427444458008, "global_step": 243963, "epoch": 1452} {"train_loss": -11.696920394897461, "global_step": 243964, "epoch": 1452} {"train_loss": -12.007917404174805, "global_step": 243965, "epoch": 1452} {"train_loss": -11.905478477478027, "global_step": 243966, "epoch": 1452} {"train_loss": -12.051149368286133, "global_step": 243967, "epoch": 1452} {"train_loss": -11.686698913574219, "global_step": 243968, "epoch": 1452} {"train_loss": -11.739609718322754, "global_step": 243969, "epoch": 1452} {"train_loss": -11.816940307617188, "global_step": 243970, "epoch": 1452} {"train_loss": -11.876344680786133, "global_step": 243971, "epoch": 1452} {"train_loss": -12.20775032043457, "global_step": 243972, "epoch": 1452} {"train_loss": -11.890908241271973, "global_step": 243973, "epoch": 1452} {"train_loss": -12.041543960571289, "global_step": 243974, "epoch": 1452} {"train_loss": -12.017820358276367, "global_step": 243975, "epoch": 1452} {"train_loss": -11.79031753540039, "global_step": 243976, "epoch": 1452} {"train_loss": -11.837529182434082, "global_step": 243977, "epoch": 1452} {"train_loss": -11.871599197387695, "global_step": 243978, "epoch": 1452} {"train_loss": -12.075996398925781, "global_step": 243979, "epoch": 1452} {"train_loss": -11.618217468261719, "global_step": 243980, "epoch": 1452} {"train_loss": -12.021028518676758, "global_step": 243981, "epoch": 1452} {"train_loss": -11.830259323120117, "global_step": 243982, "epoch": 1452} {"train_loss": -11.930397033691406, "global_step": 243983, "epoch": 1452} {"train_loss": -12.080074310302734, "global_step": 243984, "epoch": 1452} {"train_loss": -11.990324974060059, "global_step": 243985, "epoch": 1452} {"train_loss": -12.357181549072266, "global_step": 243986, "epoch": 1452} {"train_loss": -11.835898399353027, "global_step": 243987, "epoch": 1452} {"train_loss": -12.149442672729492, "global_step": 243988, "epoch": 1452} {"train_loss": -12.233179092407227, "global_step": 243989, "epoch": 1452} {"train_loss": -11.810742378234863, "global_step": 243990, "epoch": 1452} {"train_loss": -12.011459350585938, "global_step": 243991, "epoch": 1452} {"train_loss": -11.932865142822266, "global_step": 243992, "epoch": 1452} {"train_loss": -12.097078323364258, "global_step": 243993, "epoch": 1452} {"train_loss": -12.135749816894531, "global_step": 243994, "epoch": 1452} {"train_loss": -11.785154342651367, "global_step": 243995, "epoch": 1452} {"train_loss": -12.134319305419922, "global_step": 243996, "epoch": 1452} {"train_loss": -11.989049911499023, "global_step": 243997, "epoch": 1452} {"train_loss": -11.960378646850586, "global_step": 243998, "epoch": 1452} {"train_loss": -11.554620742797852, "global_step": 243999, "epoch": 1452} {"train_loss": -11.896387100219727, "global_step": 244000, "epoch": 1452} {"train_loss": -11.590559959411621, "global_step": 244001, "epoch": 1452} {"train_loss": -11.982799530029297, "global_step": 244002, "epoch": 1452} {"train_loss": -11.472696304321289, "global_step": 244003, "epoch": 1452} {"train_loss": -12.070464134216309, "global_step": 244004, "epoch": 1452} {"train_loss": -11.650964736938477, "global_step": 244005, "epoch": 1452} {"train_loss": -11.43717098236084, "global_step": 244006, "epoch": 1452} {"train_loss": -10.944269180297852, "global_step": 244007, "epoch": 1452} {"train_loss": -10.985838890075684, "global_step": 244008, "epoch": 1452} {"train_loss": -11.206871032714844, "global_step": 244009, "epoch": 1452} {"train_loss": -10.872498512268066, "global_step": 244010, "epoch": 1452} {"train_loss": -10.989602088928223, "global_step": 244011, "epoch": 1452} {"train_loss": -11.542980194091797, "global_step": 244012, "epoch": 1452} {"train_loss": -11.67912483215332, "global_step": 244013, "epoch": 1452} {"train_loss": -10.857933044433594, "global_step": 244014, "epoch": 1452} {"train_loss": -11.900978088378906, "global_step": 244015, "epoch": 1452} {"train_loss": -11.38621711730957, "global_step": 244016, "epoch": 1452} {"train_loss": -11.346115112304688, "global_step": 244017, "epoch": 1452} {"train_loss": -11.319826126098633, "global_step": 244018, "epoch": 1452} {"train_loss": -11.915983200073242, "global_step": 244019, "epoch": 1452} {"train_loss": -10.974933624267578, "global_step": 244020, "epoch": 1452} {"train_loss": -11.560726165771484, "global_step": 244021, "epoch": 1452} {"train_loss": -11.277151107788086, "global_step": 244022, "epoch": 1452} {"train_loss": -11.7584867477417, "global_step": 244023, "epoch": 1452} {"train_loss": -11.134136199951172, "global_step": 244024, "epoch": 1452} {"train_loss": -12.034370422363281, "global_step": 244025, "epoch": 1452} {"train_loss": -11.372457504272461, "global_step": 244026, "epoch": 1452} {"train_loss": -11.948982238769531, "global_step": 244027, "epoch": 1452} {"train_loss": -11.374157905578613, "global_step": 244028, "epoch": 1452} {"train_loss": -11.043882369995117, "global_step": 244029, "epoch": 1452} {"train_loss": -11.792482376098633, "global_step": 244030, "epoch": 1452} {"train_loss": -11.386886596679688, "global_step": 244031, "epoch": 1452} {"train_loss": -11.620705604553223, "global_step": 244032, "epoch": 1452} {"train_loss": -11.557218551635742, "global_step": 244033, "epoch": 1452} {"train_loss": -10.9655122756958, "global_step": 244034, "epoch": 1452} {"train_loss": -11.158233642578125, "global_step": 244035, "epoch": 1452} {"train_loss": -11.277105331420898, "global_step": 244036, "epoch": 1452} {"train_loss": -11.410961151123047, "global_step": 244037, "epoch": 1452} {"train_loss": -11.179125785827637, "global_step": 244038, "epoch": 1452} {"train_loss": -11.219255447387695, "global_step": 244039, "epoch": 1452} {"train_loss": -11.653491020202637, "global_step": 244040, "epoch": 1452} {"train_loss": -11.726337432861328, "global_step": 244041, "epoch": 1452} {"train_loss": -11.671246528625488, "global_step": 244042, "epoch": 1452} {"train_loss": -12.008545875549316, "global_step": 244043, "epoch": 1452} {"train_loss": -11.461433410644531, "global_step": 244044, "epoch": 1452} {"train_loss": -12.008578300476074, "global_step": 244045, "epoch": 1452} {"train_loss": -11.136116981506348, "global_step": 244046, "epoch": 1452} {"train_loss": -11.953939437866211, "global_step": 244047, "epoch": 1452} {"train_loss": -11.44559097290039, "global_step": 244048, "epoch": 1452} {"train_loss": -11.95685863494873, "global_step": 244049, "epoch": 1452} {"train_loss": -11.776557922363281, "global_step": 244050, "epoch": 1452} {"train_loss": -11.73193073272705, "global_step": 244051, "epoch": 1452} {"train_loss": -11.846940994262695, "global_step": 244052, "epoch": 1452} {"train_loss": -11.574466705322266, "global_step": 244053, "epoch": 1452} {"train_loss": -11.924219131469727, "global_step": 244054, "epoch": 1452} {"train_loss": -11.773872375488281, "global_step": 244055, "epoch": 1452} {"train_loss": -11.990193367004395, "global_step": 244056, "epoch": 1452} {"train_loss": -12.029412269592285, "global_step": 244057, "epoch": 1452} {"train_loss": -11.600400924682617, "global_step": 244058, "epoch": 1452} {"train_loss": -11.901834487915039, "global_step": 244059, "epoch": 1452} {"train_loss": -11.677886962890625, "global_step": 244060, "epoch": 1452} {"train_loss": -11.70967960357666, "global_step": 244061, "epoch": 1452} {"train_loss": -11.75417709350586, "global_step": 244062, "epoch": 1452} {"train_loss": -11.716438293457031, "global_step": 244063, "epoch": 1452} {"train_loss": -11.716904640197754, "global_step": 244064, "epoch": 1452} {"train_loss": -11.625675201416016, "global_step": 244065, "epoch": 1452} {"train_loss": -11.647926330566406, "global_step": 244066, "epoch": 1452} {"train_loss": -11.951859474182129, "global_step": 244067, "epoch": 1452} {"train_loss": -12.019472122192383, "global_step": 244068, "epoch": 1452} {"train_loss": -11.946610450744629, "global_step": 244069, "epoch": 1452} {"train_loss": -12.025924682617188, "global_step": 244070, "epoch": 1452} {"train_loss": -11.922584533691406, "global_step": 244071, "epoch": 1452} {"train_loss": -11.818887710571289, "global_step": 244072, "epoch": 1452} {"train_loss": -11.606159210205078, "global_step": 244073, "epoch": 1452} {"train_loss": -11.7601318359375, "global_step": 244074, "epoch": 1452} {"train_loss": -11.797369003295898, "global_step": 244075, "epoch": 1452} {"train_loss": -11.984376907348633, "global_step": 244076, "epoch": 1452} {"train_loss": -11.77920913696289, "global_step": 244077, "epoch": 1452} {"train_loss": -12.143779754638672, "global_step": 244078, "epoch": 1452} {"train_loss": -11.995858192443848, "global_step": 244079, "epoch": 1452} {"train_loss": -12.02963638305664, "global_step": 244080, "epoch": 1452} {"train_loss": -11.7030668258667, "global_step": 244081, "epoch": 1452} {"train_loss": -12.053625106811523, "global_step": 244082, "epoch": 1452} {"train_loss": -11.608238220214844, "global_step": 244083, "epoch": 1452} {"train_loss": -11.93307113647461, "global_step": 244084, "epoch": 1452} {"train_loss": -11.983148574829102, "global_step": 244085, "epoch": 1452} {"train_loss": -11.97572135925293, "global_step": 244086, "epoch": 1452} {"train_loss": -12.103116989135742, "global_step": 244087, "epoch": 1452} {"train_loss": -11.880489349365234, "global_step": 244088, "epoch": 1452} {"train_loss": -12.095438957214355, "global_step": 244089, "epoch": 1452} {"train_loss": -11.968038558959961, "global_step": 244090, "epoch": 1452} {"train_loss": -11.78058910369873, "global_step": 244091, "epoch": 1452} {"train_loss": -12.093497276306152, "global_step": 244092, "epoch": 1452} {"train_loss": -12.028189659118652, "global_step": 244093, "epoch": 1452} {"train_loss": -11.461263656616211, "global_step": 244094, "epoch": 1452} {"train_loss": -11.56422233581543, "global_step": 244095, "epoch": 1452} {"train_loss": -11.428609848022461, "global_step": 244096, "epoch": 1452} {"train_loss": -11.597862243652344, "global_step": 244097, "epoch": 1452} {"train_loss": -11.494141578674316, "global_step": 244098, "epoch": 1452} {"train_loss": -12.137920379638672, "global_step": 244099, "epoch": 1452} {"train_loss": -11.89130973815918, "global_step": 244100, "epoch": 1452} {"train_loss": -12.279340744018555, "global_step": 244101, "epoch": 1452} {"train_loss": -12.055606842041016, "global_step": 244102, "epoch": 1452} {"train_loss": -11.730922755740938, "global_step": 244103, "epoch": 1452, "val_loss": 264316.0625} {"train_loss": -11.499008178710938, "global_step": 244104, "epoch": 1453} {"train_loss": -11.551665306091309, "global_step": 244105, "epoch": 1453} {"train_loss": -11.813852310180664, "global_step": 244106, "epoch": 1453} {"train_loss": -11.591571807861328, "global_step": 244107, "epoch": 1453} {"train_loss": -11.85255241394043, "global_step": 244108, "epoch": 1453} {"train_loss": -11.388313293457031, "global_step": 244109, "epoch": 1453} {"train_loss": -11.41667366027832, "global_step": 244110, "epoch": 1453} {"train_loss": -11.344139099121094, "global_step": 244111, "epoch": 1453} {"train_loss": -11.505353927612305, "global_step": 244112, "epoch": 1453} {"train_loss": -11.034822463989258, "global_step": 244113, "epoch": 1453} {"train_loss": -11.559444427490234, "global_step": 244114, "epoch": 1453} {"train_loss": -10.843389511108398, "global_step": 244115, "epoch": 1453} {"train_loss": -12.050289154052734, "global_step": 244116, "epoch": 1453} {"train_loss": -11.204914093017578, "global_step": 244117, "epoch": 1453} {"train_loss": -11.31894302368164, "global_step": 244118, "epoch": 1453} {"train_loss": -10.712506294250488, "global_step": 244119, "epoch": 1453} {"train_loss": -11.696664810180664, "global_step": 244120, "epoch": 1453} {"train_loss": -10.729937553405762, "global_step": 244121, "epoch": 1453} {"train_loss": -10.984575271606445, "global_step": 244122, "epoch": 1453} {"train_loss": -10.452598571777344, "global_step": 244123, "epoch": 1453} {"train_loss": -11.221744537353516, "global_step": 244124, "epoch": 1453} {"train_loss": -8.814043998718262, "global_step": 244125, "epoch": 1453} {"train_loss": -8.905123710632324, "global_step": 244126, "epoch": 1453} {"train_loss": -11.030752182006836, "global_step": 244127, "epoch": 1453} {"train_loss": -9.200240135192871, "global_step": 244128, "epoch": 1453} {"train_loss": -9.149467468261719, "global_step": 244129, "epoch": 1453} {"train_loss": -8.126211166381836, "global_step": 244130, "epoch": 1453} {"train_loss": -10.875445365905762, "global_step": 244131, "epoch": 1453} {"train_loss": -8.928894996643066, "global_step": 244132, "epoch": 1453} {"train_loss": -10.558412551879883, "global_step": 244133, "epoch": 1453} {"train_loss": -9.265604972839355, "global_step": 244134, "epoch": 1453} {"train_loss": -10.596701622009277, "global_step": 244135, "epoch": 1453} {"train_loss": -9.62591552734375, "global_step": 244136, "epoch": 1453} {"train_loss": -11.011131286621094, "global_step": 244137, "epoch": 1453} {"train_loss": -10.027661323547363, "global_step": 244138, "epoch": 1453} {"train_loss": -10.258138656616211, "global_step": 244139, "epoch": 1453} {"train_loss": -10.549129486083984, "global_step": 244140, "epoch": 1453} {"train_loss": -11.019341468811035, "global_step": 244141, "epoch": 1453} {"train_loss": -10.975980758666992, "global_step": 244142, "epoch": 1453} {"train_loss": -11.067883491516113, "global_step": 244143, "epoch": 1453} {"train_loss": -11.118236541748047, "global_step": 244144, "epoch": 1453} {"train_loss": -10.963321685791016, "global_step": 244145, "epoch": 1453} {"train_loss": -11.191967010498047, "global_step": 244146, "epoch": 1453} {"train_loss": -11.324766159057617, "global_step": 244147, "epoch": 1453} {"train_loss": -11.203279495239258, "global_step": 244148, "epoch": 1453} {"train_loss": -11.324718475341797, "global_step": 244149, "epoch": 1453} {"train_loss": -11.176872253417969, "global_step": 244150, "epoch": 1453} {"train_loss": -11.605766296386719, "global_step": 244151, "epoch": 1453} {"train_loss": -11.331087112426758, "global_step": 244152, "epoch": 1453} {"train_loss": -11.220359802246094, "global_step": 244153, "epoch": 1453} {"train_loss": -11.466728210449219, "global_step": 244154, "epoch": 1453} {"train_loss": -11.683341979980469, "global_step": 244155, "epoch": 1453} {"train_loss": -11.36435604095459, "global_step": 244156, "epoch": 1453} {"train_loss": -11.637645721435547, "global_step": 244157, "epoch": 1453} {"train_loss": -11.504770278930664, "global_step": 244158, "epoch": 1453} {"train_loss": -11.278030395507812, "global_step": 244159, "epoch": 1453} {"train_loss": -11.640893936157227, "global_step": 244160, "epoch": 1453} {"train_loss": -11.554508209228516, "global_step": 244161, "epoch": 1453} {"train_loss": -11.664312362670898, "global_step": 244162, "epoch": 1453} {"train_loss": -11.519819259643555, "global_step": 244163, "epoch": 1453} {"train_loss": -11.670328140258789, "global_step": 244164, "epoch": 1453} {"train_loss": -11.666336059570312, "global_step": 244165, "epoch": 1453} {"train_loss": -11.668298721313477, "global_step": 244166, "epoch": 1453} {"train_loss": -11.867856979370117, "global_step": 244167, "epoch": 1453} {"train_loss": -11.204500198364258, "global_step": 244168, "epoch": 1453} {"train_loss": -11.956402778625488, "global_step": 244169, "epoch": 1453} {"train_loss": -11.538167953491211, "global_step": 244170, "epoch": 1453} {"train_loss": -11.896429061889648, "global_step": 244171, "epoch": 1453} {"train_loss": -11.787692070007324, "global_step": 244172, "epoch": 1453} {"train_loss": -11.970453262329102, "global_step": 244173, "epoch": 1453} {"train_loss": -11.648609161376953, "global_step": 244174, "epoch": 1453} {"train_loss": -11.765960693359375, "global_step": 244175, "epoch": 1453} {"train_loss": -11.825675964355469, "global_step": 244176, "epoch": 1453} {"train_loss": -11.740299224853516, "global_step": 244177, "epoch": 1453} {"train_loss": -11.69796371459961, "global_step": 244178, "epoch": 1453} {"train_loss": -11.904596328735352, "global_step": 244179, "epoch": 1453} {"train_loss": -12.029909133911133, "global_step": 244180, "epoch": 1453} {"train_loss": -11.814119338989258, "global_step": 244181, "epoch": 1453} {"train_loss": -12.06026840209961, "global_step": 244182, "epoch": 1453} {"train_loss": -12.028922080993652, "global_step": 244183, "epoch": 1453} {"train_loss": -11.9704008102417, "global_step": 244184, "epoch": 1453} {"train_loss": -12.082605361938477, "global_step": 244185, "epoch": 1453} {"train_loss": -11.926535606384277, "global_step": 244186, "epoch": 1453} {"train_loss": -12.131235122680664, "global_step": 244187, "epoch": 1453} {"train_loss": -12.117112159729004, "global_step": 244188, "epoch": 1453} {"train_loss": -11.92730712890625, "global_step": 244189, "epoch": 1453} {"train_loss": -11.953502655029297, "global_step": 244190, "epoch": 1453} {"train_loss": -11.905280113220215, "global_step": 244191, "epoch": 1453} {"train_loss": -12.232185363769531, "global_step": 244192, "epoch": 1453} {"train_loss": -12.120182037353516, "global_step": 244193, "epoch": 1453} {"train_loss": -12.131006240844727, "global_step": 244194, "epoch": 1453} {"train_loss": -11.953073501586914, "global_step": 244195, "epoch": 1453} {"train_loss": -12.090901374816895, "global_step": 244196, "epoch": 1453} {"train_loss": -11.977649688720703, "global_step": 244197, "epoch": 1453} {"train_loss": -11.934147834777832, "global_step": 244198, "epoch": 1453} {"train_loss": -12.215897560119629, "global_step": 244199, "epoch": 1453} {"train_loss": -12.064764022827148, "global_step": 244200, "epoch": 1453} {"train_loss": -12.202351570129395, "global_step": 244201, "epoch": 1453} {"train_loss": -12.144338607788086, "global_step": 244202, "epoch": 1453} {"train_loss": -12.167177200317383, "global_step": 244203, "epoch": 1453} {"train_loss": -12.145894050598145, "global_step": 244204, "epoch": 1453} {"train_loss": -11.87114143371582, "global_step": 244205, "epoch": 1453} {"train_loss": -12.274826049804688, "global_step": 244206, "epoch": 1453} {"train_loss": -12.066710472106934, "global_step": 244207, "epoch": 1453} {"train_loss": -12.100316047668457, "global_step": 244208, "epoch": 1453} {"train_loss": -12.021358489990234, "global_step": 244209, "epoch": 1453} {"train_loss": -12.225284576416016, "global_step": 244210, "epoch": 1453} {"train_loss": -11.927925109863281, "global_step": 244211, "epoch": 1453} {"train_loss": -11.909870147705078, "global_step": 244212, "epoch": 1453} {"train_loss": -12.228822708129883, "global_step": 244213, "epoch": 1453} {"train_loss": -12.059125900268555, "global_step": 244214, "epoch": 1453} {"train_loss": -11.734745025634766, "global_step": 244215, "epoch": 1453} {"train_loss": -11.97691822052002, "global_step": 244216, "epoch": 1453} {"train_loss": -12.03650951385498, "global_step": 244217, "epoch": 1453} {"train_loss": -11.639583587646484, "global_step": 244218, "epoch": 1453} {"train_loss": -11.155521392822266, "global_step": 244219, "epoch": 1453} {"train_loss": -11.045449256896973, "global_step": 244220, "epoch": 1453} {"train_loss": -11.885425567626953, "global_step": 244221, "epoch": 1453} {"train_loss": -12.118753433227539, "global_step": 244222, "epoch": 1453} {"train_loss": -11.191594123840332, "global_step": 244223, "epoch": 1453} {"train_loss": -11.303838729858398, "global_step": 244224, "epoch": 1453} {"train_loss": -11.647420883178711, "global_step": 244225, "epoch": 1453} {"train_loss": -11.763134002685547, "global_step": 244226, "epoch": 1453} {"train_loss": -11.839120864868164, "global_step": 244227, "epoch": 1453} {"train_loss": -11.210676193237305, "global_step": 244228, "epoch": 1453} {"train_loss": -10.35744857788086, "global_step": 244229, "epoch": 1453} {"train_loss": -10.168802261352539, "global_step": 244230, "epoch": 1453} {"train_loss": -10.687074661254883, "global_step": 244231, "epoch": 1453} {"train_loss": -9.948378562927246, "global_step": 244232, "epoch": 1453} {"train_loss": -8.91064739227295, "global_step": 244233, "epoch": 1453} {"train_loss": -11.280109405517578, "global_step": 244234, "epoch": 1453} {"train_loss": -8.433600425720215, "global_step": 244235, "epoch": 1453} {"train_loss": -11.095726013183594, "global_step": 244236, "epoch": 1453} {"train_loss": -7.076927185058594, "global_step": 244237, "epoch": 1453} {"train_loss": -6.728311538696289, "global_step": 244238, "epoch": 1453} {"train_loss": -7.821657180786133, "global_step": 244239, "epoch": 1453} {"train_loss": -9.043535232543945, "global_step": 244240, "epoch": 1453} {"train_loss": -8.649003982543945, "global_step": 244241, "epoch": 1453} {"train_loss": -8.095479965209961, "global_step": 244242, "epoch": 1453} {"train_loss": -7.591992378234863, "global_step": 244243, "epoch": 1453} {"train_loss": -9.089216232299805, "global_step": 244244, "epoch": 1453} {"train_loss": -9.283095359802246, "global_step": 244245, "epoch": 1453} {"train_loss": -9.141125679016113, "global_step": 244246, "epoch": 1453} {"train_loss": -9.48621940612793, "global_step": 244247, "epoch": 1453} {"train_loss": -9.946396827697754, "global_step": 244248, "epoch": 1453} {"train_loss": -10.486388206481934, "global_step": 244249, "epoch": 1453} {"train_loss": -9.758113861083984, "global_step": 244250, "epoch": 1453} {"train_loss": -11.06379508972168, "global_step": 244251, "epoch": 1453} {"train_loss": -10.486368179321289, "global_step": 244252, "epoch": 1453} {"train_loss": -11.046828269958496, "global_step": 244253, "epoch": 1453} {"train_loss": -11.00507926940918, "global_step": 244254, "epoch": 1453} {"train_loss": -10.851637840270996, "global_step": 244255, "epoch": 1453} {"train_loss": -10.991342544555664, "global_step": 244256, "epoch": 1453} {"train_loss": -11.124029159545898, "global_step": 244257, "epoch": 1453} {"train_loss": -11.093649864196777, "global_step": 244258, "epoch": 1453} {"train_loss": -11.137998580932617, "global_step": 244259, "epoch": 1453} {"train_loss": -11.220858573913574, "global_step": 244260, "epoch": 1453} {"train_loss": -10.747036933898926, "global_step": 244261, "epoch": 1453} {"train_loss": -11.456146240234375, "global_step": 244262, "epoch": 1453} {"train_loss": -10.730644226074219, "global_step": 244263, "epoch": 1453} {"train_loss": -11.091955184936523, "global_step": 244264, "epoch": 1453} {"train_loss": -11.031122207641602, "global_step": 244265, "epoch": 1453} {"train_loss": -11.197548866271973, "global_step": 244266, "epoch": 1453} {"train_loss": -10.960192680358887, "global_step": 244267, "epoch": 1453} {"train_loss": -11.362606048583984, "global_step": 244268, "epoch": 1453} {"train_loss": -11.203207969665527, "global_step": 244269, "epoch": 1453} {"train_loss": -11.713615417480469, "global_step": 244270, "epoch": 1453} {"train_loss": -11.09426236152649, "global_step": 244271, "epoch": 1453, "val_loss": 258355.53125} {"train_loss": -11.275604248046875, "global_step": 244272, "epoch": 1454} {"train_loss": -10.94975471496582, "global_step": 244273, "epoch": 1454} {"train_loss": -11.437848091125488, "global_step": 244274, "epoch": 1454} {"train_loss": -11.29484748840332, "global_step": 244275, "epoch": 1454} {"train_loss": -11.60951042175293, "global_step": 244276, "epoch": 1454} {"train_loss": -11.59998893737793, "global_step": 244277, "epoch": 1454} {"train_loss": -11.572341918945312, "global_step": 244278, "epoch": 1454} {"train_loss": -11.581472396850586, "global_step": 244279, "epoch": 1454} {"train_loss": -11.69266128540039, "global_step": 244280, "epoch": 1454} {"train_loss": -11.19867992401123, "global_step": 244281, "epoch": 1454} {"train_loss": -11.571131706237793, "global_step": 244282, "epoch": 1454} {"train_loss": -11.252788543701172, "global_step": 244283, "epoch": 1454} {"train_loss": -11.619231224060059, "global_step": 244284, "epoch": 1454} {"train_loss": -11.593917846679688, "global_step": 244285, "epoch": 1454} {"train_loss": -11.353878021240234, "global_step": 244286, "epoch": 1454} {"train_loss": -11.699477195739746, "global_step": 244287, "epoch": 1454} {"train_loss": -11.659140586853027, "global_step": 244288, "epoch": 1454} {"train_loss": -11.569595336914062, "global_step": 244289, "epoch": 1454} {"train_loss": -11.523820877075195, "global_step": 244290, "epoch": 1454} {"train_loss": -11.675622940063477, "global_step": 244291, "epoch": 1454} {"train_loss": -11.494268417358398, "global_step": 244292, "epoch": 1454} {"train_loss": -11.817686080932617, "global_step": 244293, "epoch": 1454} {"train_loss": -11.580151557922363, "global_step": 244294, "epoch": 1454} {"train_loss": -11.643089294433594, "global_step": 244295, "epoch": 1454} {"train_loss": -11.64035415649414, "global_step": 244296, "epoch": 1454} {"train_loss": -11.633752822875977, "global_step": 244297, "epoch": 1454} {"train_loss": -11.922744750976562, "global_step": 244298, "epoch": 1454} {"train_loss": -11.561897277832031, "global_step": 244299, "epoch": 1454} {"train_loss": -11.818737030029297, "global_step": 244300, "epoch": 1454} {"train_loss": -11.948927879333496, "global_step": 244301, "epoch": 1454} {"train_loss": -11.74156665802002, "global_step": 244302, "epoch": 1454} {"train_loss": -12.123611450195312, "global_step": 244303, "epoch": 1454} {"train_loss": -11.983314514160156, "global_step": 244304, "epoch": 1454} {"train_loss": -11.932356834411621, "global_step": 244305, "epoch": 1454} {"train_loss": -11.797979354858398, "global_step": 244306, "epoch": 1454} {"train_loss": -11.848933219909668, "global_step": 244307, "epoch": 1454} {"train_loss": -11.846046447753906, "global_step": 244308, "epoch": 1454} {"train_loss": -11.950786590576172, "global_step": 244309, "epoch": 1454} {"train_loss": -12.020828247070312, "global_step": 244310, "epoch": 1454} {"train_loss": -11.873241424560547, "global_step": 244311, "epoch": 1454} {"train_loss": -12.075250625610352, "global_step": 244312, "epoch": 1454} {"train_loss": -11.900029182434082, "global_step": 244313, "epoch": 1454} {"train_loss": -12.008074760437012, "global_step": 244314, "epoch": 1454} {"train_loss": -12.070304870605469, "global_step": 244315, "epoch": 1454} {"train_loss": -11.985677719116211, "global_step": 244316, "epoch": 1454} {"train_loss": -11.992746353149414, "global_step": 244317, "epoch": 1454} {"train_loss": -11.92054557800293, "global_step": 244318, "epoch": 1454} {"train_loss": -11.96081829071045, "global_step": 244319, "epoch": 1454} {"train_loss": -11.974615097045898, "global_step": 244320, "epoch": 1454} {"train_loss": -11.972585678100586, "global_step": 244321, "epoch": 1454} {"train_loss": -11.945821762084961, "global_step": 244322, "epoch": 1454} {"train_loss": -12.042613983154297, "global_step": 244323, "epoch": 1454} {"train_loss": -12.116979598999023, "global_step": 244324, "epoch": 1454} {"train_loss": -11.971851348876953, "global_step": 244325, "epoch": 1454} {"train_loss": -12.1416654586792, "global_step": 244326, "epoch": 1454} {"train_loss": -11.762950897216797, "global_step": 244327, "epoch": 1454} {"train_loss": -11.948558807373047, "global_step": 244328, "epoch": 1454} {"train_loss": -11.81231689453125, "global_step": 244329, "epoch": 1454} {"train_loss": -11.596622467041016, "global_step": 244330, "epoch": 1454} {"train_loss": -11.93763542175293, "global_step": 244331, "epoch": 1454} {"train_loss": -11.989697456359863, "global_step": 244332, "epoch": 1454} {"train_loss": -11.297117233276367, "global_step": 244333, "epoch": 1454} {"train_loss": -11.66883659362793, "global_step": 244334, "epoch": 1454} {"train_loss": -11.942625045776367, "global_step": 244335, "epoch": 1454} {"train_loss": -11.450416564941406, "global_step": 244336, "epoch": 1454} {"train_loss": -11.62904167175293, "global_step": 244337, "epoch": 1454} {"train_loss": -11.57188606262207, "global_step": 244338, "epoch": 1454} {"train_loss": -12.140514373779297, "global_step": 244339, "epoch": 1454} {"train_loss": -11.617378234863281, "global_step": 244340, "epoch": 1454} {"train_loss": -11.984233856201172, "global_step": 244341, "epoch": 1454} {"train_loss": -11.735095024108887, "global_step": 244342, "epoch": 1454} {"train_loss": -11.809112548828125, "global_step": 244343, "epoch": 1454} {"train_loss": -11.797266006469727, "global_step": 244344, "epoch": 1454} {"train_loss": -11.969375610351562, "global_step": 244345, "epoch": 1454} {"train_loss": -11.650203704833984, "global_step": 244346, "epoch": 1454} {"train_loss": -12.006157875061035, "global_step": 244347, "epoch": 1454} {"train_loss": -11.867650985717773, "global_step": 244348, "epoch": 1454} {"train_loss": -11.879762649536133, "global_step": 244349, "epoch": 1454} {"train_loss": -12.16375732421875, "global_step": 244350, "epoch": 1454} {"train_loss": -11.772285461425781, "global_step": 244351, "epoch": 1454} {"train_loss": -11.935791015625, "global_step": 244352, "epoch": 1454} {"train_loss": -11.487236976623535, "global_step": 244353, "epoch": 1454} {"train_loss": -11.71615982055664, "global_step": 244354, "epoch": 1454} {"train_loss": -11.17893123626709, "global_step": 244355, "epoch": 1454} {"train_loss": -11.810076713562012, "global_step": 244356, "epoch": 1454} {"train_loss": -11.26934814453125, "global_step": 244357, "epoch": 1454} {"train_loss": -11.15695858001709, "global_step": 244358, "epoch": 1454} {"train_loss": -11.9180269241333, "global_step": 244359, "epoch": 1454} {"train_loss": -11.359354019165039, "global_step": 244360, "epoch": 1454} {"train_loss": -11.455204010009766, "global_step": 244361, "epoch": 1454} {"train_loss": -11.987906455993652, "global_step": 244362, "epoch": 1454} {"train_loss": -11.804978370666504, "global_step": 244363, "epoch": 1454} {"train_loss": -11.497021675109863, "global_step": 244364, "epoch": 1454} {"train_loss": -11.649819374084473, "global_step": 244365, "epoch": 1454} {"train_loss": -11.484699249267578, "global_step": 244366, "epoch": 1454} {"train_loss": -10.877456665039062, "global_step": 244367, "epoch": 1454} {"train_loss": -11.622598648071289, "global_step": 244368, "epoch": 1454} {"train_loss": -11.738635063171387, "global_step": 244369, "epoch": 1454} {"train_loss": -11.646053314208984, "global_step": 244370, "epoch": 1454} {"train_loss": -11.692056655883789, "global_step": 244371, "epoch": 1454} {"train_loss": -11.481889724731445, "global_step": 244372, "epoch": 1454} {"train_loss": -10.835996627807617, "global_step": 244373, "epoch": 1454} {"train_loss": -10.90329647064209, "global_step": 244374, "epoch": 1454} {"train_loss": -11.923158645629883, "global_step": 244375, "epoch": 1454} {"train_loss": -10.962812423706055, "global_step": 244376, "epoch": 1454} {"train_loss": -10.922622680664062, "global_step": 244377, "epoch": 1454} {"train_loss": -11.606016159057617, "global_step": 244378, "epoch": 1454} {"train_loss": -11.277347564697266, "global_step": 244379, "epoch": 1454} {"train_loss": -10.990413665771484, "global_step": 244380, "epoch": 1454} {"train_loss": -11.601686477661133, "global_step": 244381, "epoch": 1454} {"train_loss": -10.320937156677246, "global_step": 244382, "epoch": 1454} {"train_loss": -10.512282371520996, "global_step": 244383, "epoch": 1454} {"train_loss": -11.246249198913574, "global_step": 244384, "epoch": 1454} {"train_loss": -10.137242317199707, "global_step": 244385, "epoch": 1454} {"train_loss": -11.685523986816406, "global_step": 244386, "epoch": 1454} {"train_loss": -10.9674711227417, "global_step": 244387, "epoch": 1454} {"train_loss": -11.121623992919922, "global_step": 244388, "epoch": 1454} {"train_loss": -11.414210319519043, "global_step": 244389, "epoch": 1454} {"train_loss": -11.012777328491211, "global_step": 244390, "epoch": 1454} {"train_loss": -11.763853073120117, "global_step": 244391, "epoch": 1454} {"train_loss": -10.605964660644531, "global_step": 244392, "epoch": 1454} {"train_loss": -10.99923038482666, "global_step": 244393, "epoch": 1454} {"train_loss": -11.364721298217773, "global_step": 244394, "epoch": 1454} {"train_loss": -11.416043281555176, "global_step": 244395, "epoch": 1454} {"train_loss": -11.812333106994629, "global_step": 244396, "epoch": 1454} {"train_loss": -11.055856704711914, "global_step": 244397, "epoch": 1454} {"train_loss": -11.741670608520508, "global_step": 244398, "epoch": 1454} {"train_loss": -11.691624641418457, "global_step": 244399, "epoch": 1454} {"train_loss": -11.613028526306152, "global_step": 244400, "epoch": 1454} {"train_loss": -11.753206253051758, "global_step": 244401, "epoch": 1454} {"train_loss": -11.790229797363281, "global_step": 244402, "epoch": 1454} {"train_loss": -11.858089447021484, "global_step": 244403, "epoch": 1454} {"train_loss": -12.136974334716797, "global_step": 244404, "epoch": 1454} {"train_loss": -11.406412124633789, "global_step": 244405, "epoch": 1454} {"train_loss": -11.942599296569824, "global_step": 244406, "epoch": 1454} {"train_loss": -11.700844764709473, "global_step": 244407, "epoch": 1454} {"train_loss": -11.635025024414062, "global_step": 244408, "epoch": 1454} {"train_loss": -11.764735221862793, "global_step": 244409, "epoch": 1454} {"train_loss": -11.692008972167969, "global_step": 244410, "epoch": 1454} {"train_loss": -11.871696472167969, "global_step": 244411, "epoch": 1454} {"train_loss": -11.752293586730957, "global_step": 244412, "epoch": 1454} {"train_loss": -11.815199851989746, "global_step": 244413, "epoch": 1454} {"train_loss": -11.888518333435059, "global_step": 244414, "epoch": 1454} {"train_loss": -11.644603729248047, "global_step": 244415, "epoch": 1454} {"train_loss": -11.801275253295898, "global_step": 244416, "epoch": 1454} {"train_loss": -11.916844367980957, "global_step": 244417, "epoch": 1454} {"train_loss": -12.009700775146484, "global_step": 244418, "epoch": 1454} {"train_loss": -12.015599250793457, "global_step": 244419, "epoch": 1454} {"train_loss": -11.60936164855957, "global_step": 244420, "epoch": 1454} {"train_loss": -11.974848747253418, "global_step": 244421, "epoch": 1454} {"train_loss": -12.019149780273438, "global_step": 244422, "epoch": 1454} {"train_loss": -12.01120376586914, "global_step": 244423, "epoch": 1454} {"train_loss": -11.91873550415039, "global_step": 244424, "epoch": 1454} {"train_loss": -12.19724178314209, "global_step": 244425, "epoch": 1454} {"train_loss": -11.814804077148438, "global_step": 244426, "epoch": 1454} {"train_loss": -11.916638374328613, "global_step": 244427, "epoch": 1454} {"train_loss": -11.579096794128418, "global_step": 244428, "epoch": 1454} {"train_loss": -11.96523666381836, "global_step": 244429, "epoch": 1454} {"train_loss": -11.955429077148438, "global_step": 244430, "epoch": 1454} {"train_loss": -11.869026184082031, "global_step": 244431, "epoch": 1454} {"train_loss": -11.926007270812988, "global_step": 244432, "epoch": 1454} {"train_loss": -12.06602668762207, "global_step": 244433, "epoch": 1454} {"train_loss": -11.656970024108887, "global_step": 244434, "epoch": 1454} {"train_loss": -11.904396057128906, "global_step": 244435, "epoch": 1454} {"train_loss": -11.949405670166016, "global_step": 244436, "epoch": 1454} {"train_loss": -11.865203857421875, "global_step": 244437, "epoch": 1454} {"train_loss": -11.951241493225098, "global_step": 244438, "epoch": 1454} {"train_loss": -11.662587035269965, "global_step": 244439, "epoch": 1454, "val_loss": 267658.625} {"train_loss": -12.014383316040039, "global_step": 244440, "epoch": 1455} {"train_loss": -11.437397003173828, "global_step": 244441, "epoch": 1455} {"train_loss": -11.550541877746582, "global_step": 244442, "epoch": 1455} {"train_loss": -11.884481430053711, "global_step": 244443, "epoch": 1455} {"train_loss": -12.194963455200195, "global_step": 244444, "epoch": 1455} {"train_loss": -11.49644660949707, "global_step": 244445, "epoch": 1455} {"train_loss": -12.059338569641113, "global_step": 244446, "epoch": 1455} {"train_loss": -11.952269554138184, "global_step": 244447, "epoch": 1455} {"train_loss": -11.644648551940918, "global_step": 244448, "epoch": 1455} {"train_loss": -11.817255020141602, "global_step": 244449, "epoch": 1455} {"train_loss": -11.938863754272461, "global_step": 244450, "epoch": 1455} {"train_loss": -11.990379333496094, "global_step": 244451, "epoch": 1455} {"train_loss": -11.874858856201172, "global_step": 244452, "epoch": 1455} {"train_loss": -12.03592300415039, "global_step": 244453, "epoch": 1455} {"train_loss": -11.783169746398926, "global_step": 244454, "epoch": 1455} {"train_loss": -11.984596252441406, "global_step": 244455, "epoch": 1455} {"train_loss": -11.800949096679688, "global_step": 244456, "epoch": 1455} {"train_loss": -11.917573928833008, "global_step": 244457, "epoch": 1455} {"train_loss": -11.824224472045898, "global_step": 244458, "epoch": 1455} {"train_loss": -11.716556549072266, "global_step": 244459, "epoch": 1455} {"train_loss": -11.864672660827637, "global_step": 244460, "epoch": 1455} {"train_loss": -12.15728759765625, "global_step": 244461, "epoch": 1455} {"train_loss": -11.619951248168945, "global_step": 244462, "epoch": 1455} {"train_loss": -10.892607688903809, "global_step": 244463, "epoch": 1455} {"train_loss": -11.344165802001953, "global_step": 244464, "epoch": 1455} {"train_loss": -11.679924964904785, "global_step": 244465, "epoch": 1455} {"train_loss": -11.409210205078125, "global_step": 244466, "epoch": 1455} {"train_loss": -11.250395774841309, "global_step": 244467, "epoch": 1455} {"train_loss": -11.858966827392578, "global_step": 244468, "epoch": 1455} {"train_loss": -10.459833145141602, "global_step": 244469, "epoch": 1455} {"train_loss": -11.342550277709961, "global_step": 244470, "epoch": 1455} {"train_loss": -10.607776641845703, "global_step": 244471, "epoch": 1455} {"train_loss": -10.585956573486328, "global_step": 244472, "epoch": 1455} {"train_loss": -11.686799049377441, "global_step": 244473, "epoch": 1455} {"train_loss": -9.729816436767578, "global_step": 244474, "epoch": 1455} {"train_loss": -11.637736320495605, "global_step": 244475, "epoch": 1455} {"train_loss": -11.141386985778809, "global_step": 244476, "epoch": 1455} {"train_loss": -11.040740013122559, "global_step": 244477, "epoch": 1455} {"train_loss": -11.90719223022461, "global_step": 244478, "epoch": 1455} {"train_loss": -10.996585845947266, "global_step": 244479, "epoch": 1455} {"train_loss": -11.61009693145752, "global_step": 244480, "epoch": 1455} {"train_loss": -11.687369346618652, "global_step": 244481, "epoch": 1455} {"train_loss": -11.196562767028809, "global_step": 244482, "epoch": 1455} {"train_loss": -11.58121109008789, "global_step": 244483, "epoch": 1455} {"train_loss": -11.377191543579102, "global_step": 244484, "epoch": 1455} {"train_loss": -11.541454315185547, "global_step": 244485, "epoch": 1455} {"train_loss": -11.39949893951416, "global_step": 244486, "epoch": 1455} {"train_loss": -11.548552513122559, "global_step": 244487, "epoch": 1455} {"train_loss": -11.722844123840332, "global_step": 244488, "epoch": 1455} {"train_loss": -11.927141189575195, "global_step": 244489, "epoch": 1455} {"train_loss": -11.93726921081543, "global_step": 244490, "epoch": 1455} {"train_loss": -11.886614799499512, "global_step": 244491, "epoch": 1455} {"train_loss": -11.939973831176758, "global_step": 244492, "epoch": 1455} {"train_loss": -11.96646499633789, "global_step": 244493, "epoch": 1455} {"train_loss": -11.907690048217773, "global_step": 244494, "epoch": 1455} {"train_loss": -11.727583885192871, "global_step": 244495, "epoch": 1455} {"train_loss": -12.01762580871582, "global_step": 244496, "epoch": 1455} {"train_loss": -11.670093536376953, "global_step": 244497, "epoch": 1455} {"train_loss": -11.898307800292969, "global_step": 244498, "epoch": 1455} {"train_loss": -11.885263442993164, "global_step": 244499, "epoch": 1455} {"train_loss": -11.943214416503906, "global_step": 244500, "epoch": 1455} {"train_loss": -11.904776573181152, "global_step": 244501, "epoch": 1455} {"train_loss": -11.803302764892578, "global_step": 244502, "epoch": 1455} {"train_loss": -11.766559600830078, "global_step": 244503, "epoch": 1455} {"train_loss": -11.95013427734375, "global_step": 244504, "epoch": 1455} {"train_loss": -11.816452026367188, "global_step": 244505, "epoch": 1455} {"train_loss": -12.043256759643555, "global_step": 244506, "epoch": 1455} {"train_loss": -11.811019897460938, "global_step": 244507, "epoch": 1455} {"train_loss": -11.343866348266602, "global_step": 244508, "epoch": 1455} {"train_loss": -12.082149505615234, "global_step": 244509, "epoch": 1455} {"train_loss": -11.57101821899414, "global_step": 244510, "epoch": 1455} {"train_loss": -11.487409591674805, "global_step": 244511, "epoch": 1455} {"train_loss": -11.92175006866455, "global_step": 244512, "epoch": 1455} {"train_loss": -11.023637771606445, "global_step": 244513, "epoch": 1455} {"train_loss": -11.541488647460938, "global_step": 244514, "epoch": 1455} {"train_loss": -11.537714004516602, "global_step": 244515, "epoch": 1455} {"train_loss": -11.995006561279297, "global_step": 244516, "epoch": 1455} {"train_loss": -11.812143325805664, "global_step": 244517, "epoch": 1455} {"train_loss": -11.676656723022461, "global_step": 244518, "epoch": 1455} {"train_loss": -12.071765899658203, "global_step": 244519, "epoch": 1455} {"train_loss": -11.84300422668457, "global_step": 244520, "epoch": 1455} {"train_loss": -12.009057998657227, "global_step": 244521, "epoch": 1455} {"train_loss": -11.856188774108887, "global_step": 244522, "epoch": 1455} {"train_loss": -12.126716613769531, "global_step": 244523, "epoch": 1455} {"train_loss": -11.876797676086426, "global_step": 244524, "epoch": 1455} {"train_loss": -11.703962326049805, "global_step": 244525, "epoch": 1455} {"train_loss": -11.706001281738281, "global_step": 244526, "epoch": 1455} {"train_loss": -11.623445510864258, "global_step": 244527, "epoch": 1455} {"train_loss": -11.702458381652832, "global_step": 244528, "epoch": 1455} {"train_loss": -11.372522354125977, "global_step": 244529, "epoch": 1455} {"train_loss": -11.16010570526123, "global_step": 244530, "epoch": 1455} {"train_loss": -10.938095092773438, "global_step": 244531, "epoch": 1455} {"train_loss": -10.957716941833496, "global_step": 244532, "epoch": 1455} {"train_loss": -11.26555061340332, "global_step": 244533, "epoch": 1455} {"train_loss": -10.28539752960205, "global_step": 244534, "epoch": 1455} {"train_loss": -10.757640838623047, "global_step": 244535, "epoch": 1455} {"train_loss": -11.944952011108398, "global_step": 244536, "epoch": 1455} {"train_loss": -10.431577682495117, "global_step": 244537, "epoch": 1455} {"train_loss": -11.098896026611328, "global_step": 244538, "epoch": 1455} {"train_loss": -11.551010131835938, "global_step": 244539, "epoch": 1455} {"train_loss": -10.89615535736084, "global_step": 244540, "epoch": 1455} {"train_loss": -10.821924209594727, "global_step": 244541, "epoch": 1455} {"train_loss": -11.181292533874512, "global_step": 244542, "epoch": 1455} {"train_loss": -11.314180374145508, "global_step": 244543, "epoch": 1455} {"train_loss": -11.406495094299316, "global_step": 244544, "epoch": 1455} {"train_loss": -11.602204322814941, "global_step": 244545, "epoch": 1455} {"train_loss": -11.312241554260254, "global_step": 244546, "epoch": 1455} {"train_loss": -11.734630584716797, "global_step": 244547, "epoch": 1455} {"train_loss": -11.435959815979004, "global_step": 244548, "epoch": 1455} {"train_loss": -11.630311965942383, "global_step": 244549, "epoch": 1455} {"train_loss": -11.538335800170898, "global_step": 244550, "epoch": 1455} {"train_loss": -11.316141128540039, "global_step": 244551, "epoch": 1455} {"train_loss": -11.429773330688477, "global_step": 244552, "epoch": 1455} {"train_loss": -11.297154426574707, "global_step": 244553, "epoch": 1455} {"train_loss": -11.398359298706055, "global_step": 244554, "epoch": 1455} {"train_loss": -11.77491569519043, "global_step": 244555, "epoch": 1455} {"train_loss": -11.095306396484375, "global_step": 244556, "epoch": 1455} {"train_loss": -11.647075653076172, "global_step": 244557, "epoch": 1455} {"train_loss": -11.746015548706055, "global_step": 244558, "epoch": 1455} {"train_loss": -11.785151481628418, "global_step": 244559, "epoch": 1455} {"train_loss": -11.690875053405762, "global_step": 244560, "epoch": 1455} {"train_loss": -11.778844833374023, "global_step": 244561, "epoch": 1455} {"train_loss": -11.89148998260498, "global_step": 244562, "epoch": 1455} {"train_loss": -11.693038940429688, "global_step": 244563, "epoch": 1455} {"train_loss": -11.2586669921875, "global_step": 244564, "epoch": 1455} {"train_loss": -11.756610870361328, "global_step": 244565, "epoch": 1455} {"train_loss": -11.434905052185059, "global_step": 244566, "epoch": 1455} {"train_loss": -11.726678848266602, "global_step": 244567, "epoch": 1455} {"train_loss": -11.221702575683594, "global_step": 244568, "epoch": 1455} {"train_loss": -11.895940780639648, "global_step": 244569, "epoch": 1455} {"train_loss": -11.504156112670898, "global_step": 244570, "epoch": 1455} {"train_loss": -11.882771492004395, "global_step": 244571, "epoch": 1455} {"train_loss": -11.381586074829102, "global_step": 244572, "epoch": 1455} {"train_loss": -12.037883758544922, "global_step": 244573, "epoch": 1455} {"train_loss": -11.472240447998047, "global_step": 244574, "epoch": 1455} {"train_loss": -11.65359115600586, "global_step": 244575, "epoch": 1455} {"train_loss": -11.16220474243164, "global_step": 244576, "epoch": 1455} {"train_loss": -11.919919967651367, "global_step": 244577, "epoch": 1455} {"train_loss": -10.979827880859375, "global_step": 244578, "epoch": 1455} {"train_loss": -11.732959747314453, "global_step": 244579, "epoch": 1455} {"train_loss": -11.403233528137207, "global_step": 244580, "epoch": 1455} {"train_loss": -11.490555763244629, "global_step": 244581, "epoch": 1455} {"train_loss": -11.472415924072266, "global_step": 244582, "epoch": 1455} {"train_loss": -11.19643783569336, "global_step": 244583, "epoch": 1455} {"train_loss": -11.703989028930664, "global_step": 244584, "epoch": 1455} {"train_loss": -11.607196807861328, "global_step": 244585, "epoch": 1455} {"train_loss": -11.959362030029297, "global_step": 244586, "epoch": 1455} {"train_loss": -11.58535099029541, "global_step": 244587, "epoch": 1455} {"train_loss": -11.606325149536133, "global_step": 244588, "epoch": 1455} {"train_loss": -11.450762748718262, "global_step": 244589, "epoch": 1455} {"train_loss": -11.482207298278809, "global_step": 244590, "epoch": 1455} {"train_loss": -11.727470397949219, "global_step": 244591, "epoch": 1455} {"train_loss": -11.396440505981445, "global_step": 244592, "epoch": 1455} {"train_loss": -11.575815200805664, "global_step": 244593, "epoch": 1455} {"train_loss": -11.544885635375977, "global_step": 244594, "epoch": 1455} {"train_loss": -11.93252182006836, "global_step": 244595, "epoch": 1455} {"train_loss": -11.531439781188965, "global_step": 244596, "epoch": 1455} {"train_loss": -11.802749633789062, "global_step": 244597, "epoch": 1455} {"train_loss": -11.500396728515625, "global_step": 244598, "epoch": 1455} {"train_loss": -11.816360473632812, "global_step": 244599, "epoch": 1455} {"train_loss": -11.813209533691406, "global_step": 244600, "epoch": 1455} {"train_loss": -11.970443725585938, "global_step": 244601, "epoch": 1455} {"train_loss": -11.558615684509277, "global_step": 244602, "epoch": 1455} {"train_loss": -12.005136489868164, "global_step": 244603, "epoch": 1455} {"train_loss": -11.593116760253906, "global_step": 244604, "epoch": 1455} {"train_loss": -11.81308364868164, "global_step": 244605, "epoch": 1455} {"train_loss": -11.704803466796875, "global_step": 244606, "epoch": 1455} {"train_loss": -11.584499325071063, "global_step": 244607, "epoch": 1455, "val_loss": 266469.84375, "train_action_mse_error": 2.213104724884033} {"train_loss": -11.32750129699707, "global_step": 244608, "epoch": 1456} {"train_loss": -11.945737838745117, "global_step": 244609, "epoch": 1456} {"train_loss": -11.362183570861816, "global_step": 244610, "epoch": 1456} {"train_loss": -11.856840133666992, "global_step": 244611, "epoch": 1456} {"train_loss": -11.248672485351562, "global_step": 244612, "epoch": 1456} {"train_loss": -11.76435375213623, "global_step": 244613, "epoch": 1456} {"train_loss": -11.918950080871582, "global_step": 244614, "epoch": 1456} {"train_loss": -11.603597640991211, "global_step": 244615, "epoch": 1456} {"train_loss": -11.703047752380371, "global_step": 244616, "epoch": 1456} {"train_loss": -11.491449356079102, "global_step": 244617, "epoch": 1456} {"train_loss": -11.544661521911621, "global_step": 244618, "epoch": 1456} {"train_loss": -11.126535415649414, "global_step": 244619, "epoch": 1456} {"train_loss": -11.82132339477539, "global_step": 244620, "epoch": 1456} {"train_loss": -11.407501220703125, "global_step": 244621, "epoch": 1456} {"train_loss": -11.855682373046875, "global_step": 244622, "epoch": 1456} {"train_loss": -11.293180465698242, "global_step": 244623, "epoch": 1456} {"train_loss": -11.238668441772461, "global_step": 244624, "epoch": 1456} {"train_loss": -11.893693923950195, "global_step": 244625, "epoch": 1456} {"train_loss": -11.406526565551758, "global_step": 244626, "epoch": 1456} {"train_loss": -11.119437217712402, "global_step": 244627, "epoch": 1456} {"train_loss": -11.820841789245605, "global_step": 244628, "epoch": 1456} {"train_loss": -11.297966003417969, "global_step": 244629, "epoch": 1456} {"train_loss": -11.325786590576172, "global_step": 244630, "epoch": 1456} {"train_loss": -11.640960693359375, "global_step": 244631, "epoch": 1456} {"train_loss": -11.357233047485352, "global_step": 244632, "epoch": 1456} {"train_loss": -11.674250602722168, "global_step": 244633, "epoch": 1456} {"train_loss": -11.379722595214844, "global_step": 244634, "epoch": 1456} {"train_loss": -11.642353057861328, "global_step": 244635, "epoch": 1456} {"train_loss": -10.833348274230957, "global_step": 244636, "epoch": 1456} {"train_loss": -11.582452774047852, "global_step": 244637, "epoch": 1456} {"train_loss": -10.382368087768555, "global_step": 244638, "epoch": 1456} {"train_loss": -11.868882179260254, "global_step": 244639, "epoch": 1456} {"train_loss": -10.357465744018555, "global_step": 244640, "epoch": 1456} {"train_loss": -11.21275520324707, "global_step": 244641, "epoch": 1456} {"train_loss": -11.079896926879883, "global_step": 244642, "epoch": 1456} {"train_loss": -10.571318626403809, "global_step": 244643, "epoch": 1456} {"train_loss": -10.43441104888916, "global_step": 244644, "epoch": 1456} {"train_loss": -10.185890197753906, "global_step": 244645, "epoch": 1456} {"train_loss": -11.099853515625, "global_step": 244646, "epoch": 1456} {"train_loss": -10.765193939208984, "global_step": 244647, "epoch": 1456} {"train_loss": -10.443235397338867, "global_step": 244648, "epoch": 1456} {"train_loss": -10.818920135498047, "global_step": 244649, "epoch": 1456} {"train_loss": -11.014678955078125, "global_step": 244650, "epoch": 1456} {"train_loss": -10.253087997436523, "global_step": 244651, "epoch": 1456} {"train_loss": -10.388776779174805, "global_step": 244652, "epoch": 1456} {"train_loss": -10.999716758728027, "global_step": 244653, "epoch": 1456} {"train_loss": -10.292356491088867, "global_step": 244654, "epoch": 1456} {"train_loss": -11.056928634643555, "global_step": 244655, "epoch": 1456} {"train_loss": -9.413650512695312, "global_step": 244656, "epoch": 1456} {"train_loss": -10.393393516540527, "global_step": 244657, "epoch": 1456} {"train_loss": -10.457474708557129, "global_step": 244658, "epoch": 1456} {"train_loss": -10.688520431518555, "global_step": 244659, "epoch": 1456} {"train_loss": -10.686517715454102, "global_step": 244660, "epoch": 1456} {"train_loss": -10.933174133300781, "global_step": 244661, "epoch": 1456} {"train_loss": -11.322317123413086, "global_step": 244662, "epoch": 1456} {"train_loss": -10.650703430175781, "global_step": 244663, "epoch": 1456} {"train_loss": -11.095198631286621, "global_step": 244664, "epoch": 1456} {"train_loss": -10.399008750915527, "global_step": 244665, "epoch": 1456} {"train_loss": -10.833502769470215, "global_step": 244666, "epoch": 1456} {"train_loss": -10.747883796691895, "global_step": 244667, "epoch": 1456} {"train_loss": -10.636384010314941, "global_step": 244668, "epoch": 1456} {"train_loss": -11.413537979125977, "global_step": 244669, "epoch": 1456} {"train_loss": -10.824951171875, "global_step": 244670, "epoch": 1456} {"train_loss": -11.400638580322266, "global_step": 244671, "epoch": 1456} {"train_loss": -11.440102577209473, "global_step": 244672, "epoch": 1456} {"train_loss": -11.025578498840332, "global_step": 244673, "epoch": 1456} {"train_loss": -10.974454879760742, "global_step": 244674, "epoch": 1456} {"train_loss": -11.464807510375977, "global_step": 244675, "epoch": 1456} {"train_loss": -11.093253135681152, "global_step": 244676, "epoch": 1456} {"train_loss": -11.148499488830566, "global_step": 244677, "epoch": 1456} {"train_loss": -11.542571067810059, "global_step": 244678, "epoch": 1456} {"train_loss": -11.468812942504883, "global_step": 244679, "epoch": 1456} {"train_loss": -11.154154777526855, "global_step": 244680, "epoch": 1456} {"train_loss": -11.706700325012207, "global_step": 244681, "epoch": 1456} {"train_loss": -11.461965560913086, "global_step": 244682, "epoch": 1456} {"train_loss": -11.440048217773438, "global_step": 244683, "epoch": 1456} {"train_loss": -11.461788177490234, "global_step": 244684, "epoch": 1456} {"train_loss": -11.69874382019043, "global_step": 244685, "epoch": 1456} {"train_loss": -11.320928573608398, "global_step": 244686, "epoch": 1456} {"train_loss": -11.667959213256836, "global_step": 244687, "epoch": 1456} {"train_loss": -11.634773254394531, "global_step": 244688, "epoch": 1456} {"train_loss": -11.463119506835938, "global_step": 244689, "epoch": 1456} {"train_loss": -11.470968246459961, "global_step": 244690, "epoch": 1456} {"train_loss": -11.623556137084961, "global_step": 244691, "epoch": 1456} {"train_loss": -11.50135612487793, "global_step": 244692, "epoch": 1456} {"train_loss": -11.516618728637695, "global_step": 244693, "epoch": 1456} {"train_loss": -11.613691329956055, "global_step": 244694, "epoch": 1456} {"train_loss": -11.531465530395508, "global_step": 244695, "epoch": 1456} {"train_loss": -11.73276424407959, "global_step": 244696, "epoch": 1456} {"train_loss": -11.772197723388672, "global_step": 244697, "epoch": 1456} {"train_loss": -11.41401481628418, "global_step": 244698, "epoch": 1456} {"train_loss": -11.780622482299805, "global_step": 244699, "epoch": 1456} {"train_loss": -11.84911823272705, "global_step": 244700, "epoch": 1456} {"train_loss": -11.55119514465332, "global_step": 244701, "epoch": 1456} {"train_loss": -11.803386688232422, "global_step": 244702, "epoch": 1456} {"train_loss": -11.880160331726074, "global_step": 244703, "epoch": 1456} {"train_loss": -11.74670124053955, "global_step": 244704, "epoch": 1456} {"train_loss": -11.97099494934082, "global_step": 244705, "epoch": 1456} {"train_loss": -11.85808277130127, "global_step": 244706, "epoch": 1456} {"train_loss": -11.84638786315918, "global_step": 244707, "epoch": 1456} {"train_loss": -11.919148445129395, "global_step": 244708, "epoch": 1456} {"train_loss": -11.768383026123047, "global_step": 244709, "epoch": 1456} {"train_loss": -11.912755966186523, "global_step": 244710, "epoch": 1456} {"train_loss": -11.706938743591309, "global_step": 244711, "epoch": 1456} {"train_loss": -11.762469291687012, "global_step": 244712, "epoch": 1456} {"train_loss": -12.017101287841797, "global_step": 244713, "epoch": 1456} {"train_loss": -11.77818489074707, "global_step": 244714, "epoch": 1456} {"train_loss": -12.008977890014648, "global_step": 244715, "epoch": 1456} {"train_loss": -11.94736099243164, "global_step": 244716, "epoch": 1456} {"train_loss": -11.965659141540527, "global_step": 244717, "epoch": 1456} {"train_loss": -12.092086791992188, "global_step": 244718, "epoch": 1456} {"train_loss": -12.00052261352539, "global_step": 244719, "epoch": 1456} {"train_loss": -12.189397811889648, "global_step": 244720, "epoch": 1456} {"train_loss": -12.07261848449707, "global_step": 244721, "epoch": 1456} {"train_loss": -12.150055885314941, "global_step": 244722, "epoch": 1456} {"train_loss": -12.04200267791748, "global_step": 244723, "epoch": 1456} {"train_loss": -12.125380516052246, "global_step": 244724, "epoch": 1456} {"train_loss": -12.021697998046875, "global_step": 244725, "epoch": 1456} {"train_loss": -12.078908920288086, "global_step": 244726, "epoch": 1456} {"train_loss": -12.155842781066895, "global_step": 244727, "epoch": 1456} {"train_loss": -12.091070175170898, "global_step": 244728, "epoch": 1456} {"train_loss": -12.026854515075684, "global_step": 244729, "epoch": 1456} {"train_loss": -12.146879196166992, "global_step": 244730, "epoch": 1456} {"train_loss": -12.22203254699707, "global_step": 244731, "epoch": 1456} {"train_loss": -12.124822616577148, "global_step": 244732, "epoch": 1456} {"train_loss": -12.221291542053223, "global_step": 244733, "epoch": 1456} {"train_loss": -12.159818649291992, "global_step": 244734, "epoch": 1456} {"train_loss": -11.712894439697266, "global_step": 244735, "epoch": 1456} {"train_loss": -11.88601303100586, "global_step": 244736, "epoch": 1456} {"train_loss": -11.604308128356934, "global_step": 244737, "epoch": 1456} {"train_loss": -12.085653305053711, "global_step": 244738, "epoch": 1456} {"train_loss": -11.528616905212402, "global_step": 244739, "epoch": 1456} {"train_loss": -12.113390922546387, "global_step": 244740, "epoch": 1456} {"train_loss": -11.110857963562012, "global_step": 244741, "epoch": 1456} {"train_loss": -11.385295867919922, "global_step": 244742, "epoch": 1456} {"train_loss": -10.789955139160156, "global_step": 244743, "epoch": 1456} {"train_loss": -12.132530212402344, "global_step": 244744, "epoch": 1456} {"train_loss": -10.980463027954102, "global_step": 244745, "epoch": 1456} {"train_loss": -11.611724853515625, "global_step": 244746, "epoch": 1456} {"train_loss": -10.576255798339844, "global_step": 244747, "epoch": 1456} {"train_loss": -11.865538597106934, "global_step": 244748, "epoch": 1456} {"train_loss": -10.198058128356934, "global_step": 244749, "epoch": 1456} {"train_loss": -11.018721580505371, "global_step": 244750, "epoch": 1456} {"train_loss": -10.952396392822266, "global_step": 244751, "epoch": 1456} {"train_loss": -10.206254959106445, "global_step": 244752, "epoch": 1456} {"train_loss": -10.787420272827148, "global_step": 244753, "epoch": 1456} {"train_loss": -7.650640964508057, "global_step": 244754, "epoch": 1456} {"train_loss": -8.658100128173828, "global_step": 244755, "epoch": 1456} {"train_loss": -10.997879981994629, "global_step": 244756, "epoch": 1456} {"train_loss": -8.494096755981445, "global_step": 244757, "epoch": 1456} {"train_loss": -8.20151138305664, "global_step": 244758, "epoch": 1456} {"train_loss": -6.070225715637207, "global_step": 244759, "epoch": 1456} {"train_loss": -8.820623397827148, "global_step": 244760, "epoch": 1456} {"train_loss": -7.817911148071289, "global_step": 244761, "epoch": 1456} {"train_loss": -5.2212066650390625, "global_step": 244762, "epoch": 1456} {"train_loss": -5.691318511962891, "global_step": 244763, "epoch": 1456} {"train_loss": -5.989137649536133, "global_step": 244764, "epoch": 1456} {"train_loss": -5.5379462242126465, "global_step": 244765, "epoch": 1456} {"train_loss": -5.4950151443481445, "global_step": 244766, "epoch": 1456} {"train_loss": -6.371115684509277, "global_step": 244767, "epoch": 1456} {"train_loss": -6.712920188903809, "global_step": 244768, "epoch": 1456} {"train_loss": -8.079811096191406, "global_step": 244769, "epoch": 1456} {"train_loss": -7.545241355895996, "global_step": 244770, "epoch": 1456} {"train_loss": -7.860729217529297, "global_step": 244771, "epoch": 1456} {"train_loss": -8.506875991821289, "global_step": 244772, "epoch": 1456} {"train_loss": -8.233637809753418, "global_step": 244773, "epoch": 1456} {"train_loss": -8.748573303222656, "global_step": 244774, "epoch": 1456} {"train_loss": -10.900249929655166, "global_step": 244775, "epoch": 1456, "val_loss": 260018.96875} {"train_loss": -9.529264450073242, "global_step": 244776, "epoch": 1457} {"train_loss": -9.365492820739746, "global_step": 244777, "epoch": 1457} {"train_loss": -8.744514465332031, "global_step": 244778, "epoch": 1457} {"train_loss": -10.771556854248047, "global_step": 244779, "epoch": 1457} {"train_loss": -9.817169189453125, "global_step": 244780, "epoch": 1457} {"train_loss": -10.103551864624023, "global_step": 244781, "epoch": 1457} {"train_loss": -9.881768226623535, "global_step": 244782, "epoch": 1457} {"train_loss": -10.808302879333496, "global_step": 244783, "epoch": 1457} {"train_loss": -10.067605972290039, "global_step": 244784, "epoch": 1457} {"train_loss": -9.970640182495117, "global_step": 244785, "epoch": 1457} {"train_loss": -10.948729515075684, "global_step": 244786, "epoch": 1457} {"train_loss": -10.737496376037598, "global_step": 244787, "epoch": 1457} {"train_loss": -10.29710578918457, "global_step": 244788, "epoch": 1457} {"train_loss": -10.636842727661133, "global_step": 244789, "epoch": 1457} {"train_loss": -10.592220306396484, "global_step": 244790, "epoch": 1457} {"train_loss": -10.762062072753906, "global_step": 244791, "epoch": 1457} {"train_loss": -10.68091869354248, "global_step": 244792, "epoch": 1457} {"train_loss": -10.947905540466309, "global_step": 244793, "epoch": 1457} {"train_loss": -11.180115699768066, "global_step": 244794, "epoch": 1457} {"train_loss": -10.692337036132812, "global_step": 244795, "epoch": 1457} {"train_loss": -11.054239273071289, "global_step": 244796, "epoch": 1457} {"train_loss": -11.232260704040527, "global_step": 244797, "epoch": 1457} {"train_loss": -10.944409370422363, "global_step": 244798, "epoch": 1457} {"train_loss": -10.83014965057373, "global_step": 244799, "epoch": 1457} {"train_loss": -11.010075569152832, "global_step": 244800, "epoch": 1457} {"train_loss": -11.432435989379883, "global_step": 244801, "epoch": 1457} {"train_loss": -10.880666732788086, "global_step": 244802, "epoch": 1457} {"train_loss": -11.430924415588379, "global_step": 244803, "epoch": 1457} {"train_loss": -11.282757759094238, "global_step": 244804, "epoch": 1457} {"train_loss": -11.474142074584961, "global_step": 244805, "epoch": 1457} {"train_loss": -11.33393669128418, "global_step": 244806, "epoch": 1457} {"train_loss": -11.254765510559082, "global_step": 244807, "epoch": 1457} {"train_loss": -11.431873321533203, "global_step": 244808, "epoch": 1457} {"train_loss": -11.28010368347168, "global_step": 244809, "epoch": 1457} {"train_loss": -11.410364151000977, "global_step": 244810, "epoch": 1457} {"train_loss": -11.313091278076172, "global_step": 244811, "epoch": 1457} {"train_loss": -11.423564910888672, "global_step": 244812, "epoch": 1457} {"train_loss": -11.565557479858398, "global_step": 244813, "epoch": 1457} {"train_loss": -11.524660110473633, "global_step": 244814, "epoch": 1457} {"train_loss": -11.477749824523926, "global_step": 244815, "epoch": 1457} {"train_loss": -11.520380020141602, "global_step": 244816, "epoch": 1457} {"train_loss": -11.463504791259766, "global_step": 244817, "epoch": 1457} {"train_loss": -11.711816787719727, "global_step": 244818, "epoch": 1457} {"train_loss": -11.553608894348145, "global_step": 244819, "epoch": 1457} {"train_loss": -11.693443298339844, "global_step": 244820, "epoch": 1457} {"train_loss": -11.565340042114258, "global_step": 244821, "epoch": 1457} {"train_loss": -11.592595100402832, "global_step": 244822, "epoch": 1457} {"train_loss": -11.553651809692383, "global_step": 244823, "epoch": 1457} {"train_loss": -11.728730201721191, "global_step": 244824, "epoch": 1457} {"train_loss": -11.834318161010742, "global_step": 244825, "epoch": 1457} {"train_loss": -11.575214385986328, "global_step": 244826, "epoch": 1457} {"train_loss": -11.68235969543457, "global_step": 244827, "epoch": 1457} {"train_loss": -11.89076042175293, "global_step": 244828, "epoch": 1457} {"train_loss": -11.646158218383789, "global_step": 244829, "epoch": 1457} {"train_loss": -11.772533416748047, "global_step": 244830, "epoch": 1457} {"train_loss": -11.925958633422852, "global_step": 244831, "epoch": 1457} {"train_loss": -11.781217575073242, "global_step": 244832, "epoch": 1457} {"train_loss": -11.774698257446289, "global_step": 244833, "epoch": 1457} {"train_loss": -11.822477340698242, "global_step": 244834, "epoch": 1457} {"train_loss": -11.868121147155762, "global_step": 244835, "epoch": 1457} {"train_loss": -11.723663330078125, "global_step": 244836, "epoch": 1457} {"train_loss": -11.733125686645508, "global_step": 244837, "epoch": 1457} {"train_loss": -11.921236991882324, "global_step": 244838, "epoch": 1457} {"train_loss": -11.779744148254395, "global_step": 244839, "epoch": 1457} {"train_loss": -11.760092735290527, "global_step": 244840, "epoch": 1457} {"train_loss": -11.786640167236328, "global_step": 244841, "epoch": 1457} {"train_loss": -12.07744026184082, "global_step": 244842, "epoch": 1457} {"train_loss": -11.773370742797852, "global_step": 244843, "epoch": 1457} {"train_loss": -11.933941841125488, "global_step": 244844, "epoch": 1457} {"train_loss": -11.908149719238281, "global_step": 244845, "epoch": 1457} {"train_loss": -11.872957229614258, "global_step": 244846, "epoch": 1457} {"train_loss": -11.861410140991211, "global_step": 244847, "epoch": 1457} {"train_loss": -11.773780822753906, "global_step": 244848, "epoch": 1457} {"train_loss": -12.13162612915039, "global_step": 244849, "epoch": 1457} {"train_loss": -12.017528533935547, "global_step": 244850, "epoch": 1457} {"train_loss": -12.068933486938477, "global_step": 244851, "epoch": 1457} {"train_loss": -11.954251289367676, "global_step": 244852, "epoch": 1457} {"train_loss": -11.91347599029541, "global_step": 244853, "epoch": 1457} {"train_loss": -11.971979141235352, "global_step": 244854, "epoch": 1457} {"train_loss": -12.094097137451172, "global_step": 244855, "epoch": 1457} {"train_loss": -12.049308776855469, "global_step": 244856, "epoch": 1457} {"train_loss": -11.795341491699219, "global_step": 244857, "epoch": 1457} {"train_loss": -12.252641677856445, "global_step": 244858, "epoch": 1457} {"train_loss": -11.785164833068848, "global_step": 244859, "epoch": 1457} {"train_loss": -11.824356079101562, "global_step": 244860, "epoch": 1457} {"train_loss": -12.113616943359375, "global_step": 244861, "epoch": 1457} {"train_loss": -11.981551170349121, "global_step": 244862, "epoch": 1457} {"train_loss": -12.13116455078125, "global_step": 244863, "epoch": 1457} {"train_loss": -12.025227546691895, "global_step": 244864, "epoch": 1457} {"train_loss": -12.20852279663086, "global_step": 244865, "epoch": 1457} {"train_loss": -12.18890380859375, "global_step": 244866, "epoch": 1457} {"train_loss": -12.206632614135742, "global_step": 244867, "epoch": 1457} {"train_loss": -12.193016052246094, "global_step": 244868, "epoch": 1457} {"train_loss": -11.957986831665039, "global_step": 244869, "epoch": 1457} {"train_loss": -12.346014022827148, "global_step": 244870, "epoch": 1457} {"train_loss": -12.020162582397461, "global_step": 244871, "epoch": 1457} {"train_loss": -11.863747596740723, "global_step": 244872, "epoch": 1457} {"train_loss": -11.941607475280762, "global_step": 244873, "epoch": 1457} {"train_loss": -12.254470825195312, "global_step": 244874, "epoch": 1457} {"train_loss": -11.942255020141602, "global_step": 244875, "epoch": 1457} {"train_loss": -10.514622688293457, "global_step": 244876, "epoch": 1457} {"train_loss": -11.031333923339844, "global_step": 244877, "epoch": 1457} {"train_loss": -11.812155723571777, "global_step": 244878, "epoch": 1457} {"train_loss": -11.706958770751953, "global_step": 244879, "epoch": 1457} {"train_loss": -10.326148986816406, "global_step": 244880, "epoch": 1457} {"train_loss": -8.482589721679688, "global_step": 244881, "epoch": 1457} {"train_loss": -10.931053161621094, "global_step": 244882, "epoch": 1457} {"train_loss": -7.287659645080566, "global_step": 244883, "epoch": 1457} {"train_loss": -9.057779312133789, "global_step": 244884, "epoch": 1457} {"train_loss": -7.734134674072266, "global_step": 244885, "epoch": 1457} {"train_loss": -7.876375198364258, "global_step": 244886, "epoch": 1457} {"train_loss": -7.226942539215088, "global_step": 244887, "epoch": 1457} {"train_loss": -8.639091491699219, "global_step": 244888, "epoch": 1457} {"train_loss": -9.509016036987305, "global_step": 244889, "epoch": 1457} {"train_loss": -9.01302433013916, "global_step": 244890, "epoch": 1457} {"train_loss": -8.531991958618164, "global_step": 244891, "epoch": 1457} {"train_loss": -8.860729217529297, "global_step": 244892, "epoch": 1457} {"train_loss": -8.417688369750977, "global_step": 244893, "epoch": 1457} {"train_loss": -9.16690731048584, "global_step": 244894, "epoch": 1457} {"train_loss": -10.352169036865234, "global_step": 244895, "epoch": 1457} {"train_loss": -10.389749526977539, "global_step": 244896, "epoch": 1457} {"train_loss": -10.172281265258789, "global_step": 244897, "epoch": 1457} {"train_loss": -10.880033493041992, "global_step": 244898, "epoch": 1457} {"train_loss": -10.155564308166504, "global_step": 244899, "epoch": 1457} {"train_loss": -10.800626754760742, "global_step": 244900, "epoch": 1457} {"train_loss": -10.291300773620605, "global_step": 244901, "epoch": 1457} {"train_loss": -10.430025100708008, "global_step": 244902, "epoch": 1457} {"train_loss": -10.82363510131836, "global_step": 244903, "epoch": 1457} {"train_loss": -10.141587257385254, "global_step": 244904, "epoch": 1457} {"train_loss": -11.172896385192871, "global_step": 244905, "epoch": 1457} {"train_loss": -10.321775436401367, "global_step": 244906, "epoch": 1457} {"train_loss": -10.784402847290039, "global_step": 244907, "epoch": 1457} {"train_loss": -10.418569564819336, "global_step": 244908, "epoch": 1457} {"train_loss": -10.434569358825684, "global_step": 244909, "epoch": 1457} {"train_loss": -11.044452667236328, "global_step": 244910, "epoch": 1457} {"train_loss": -11.058185577392578, "global_step": 244911, "epoch": 1457} {"train_loss": -10.729463577270508, "global_step": 244912, "epoch": 1457} {"train_loss": -11.134716987609863, "global_step": 244913, "epoch": 1457} {"train_loss": -11.071590423583984, "global_step": 244914, "epoch": 1457} {"train_loss": -11.391166687011719, "global_step": 244915, "epoch": 1457} {"train_loss": -11.583247184753418, "global_step": 244916, "epoch": 1457} {"train_loss": -11.160974502563477, "global_step": 244917, "epoch": 1457} {"train_loss": -11.069171905517578, "global_step": 244918, "epoch": 1457} {"train_loss": -11.116939544677734, "global_step": 244919, "epoch": 1457} {"train_loss": -11.395648956298828, "global_step": 244920, "epoch": 1457} {"train_loss": -11.235915184020996, "global_step": 244921, "epoch": 1457} {"train_loss": -11.281248092651367, "global_step": 244922, "epoch": 1457} {"train_loss": -11.549812316894531, "global_step": 244923, "epoch": 1457} {"train_loss": -10.986401557922363, "global_step": 244924, "epoch": 1457} {"train_loss": -11.471090316772461, "global_step": 244925, "epoch": 1457} {"train_loss": -11.400102615356445, "global_step": 244926, "epoch": 1457} {"train_loss": -11.366348266601562, "global_step": 244927, "epoch": 1457} {"train_loss": -11.467166900634766, "global_step": 244928, "epoch": 1457} {"train_loss": -11.219661712646484, "global_step": 244929, "epoch": 1457} {"train_loss": -11.640031814575195, "global_step": 244930, "epoch": 1457} {"train_loss": -11.399345397949219, "global_step": 244931, "epoch": 1457} {"train_loss": -11.446708679199219, "global_step": 244932, "epoch": 1457} {"train_loss": -11.314712524414062, "global_step": 244933, "epoch": 1457} {"train_loss": -11.63082504272461, "global_step": 244934, "epoch": 1457} {"train_loss": -11.266050338745117, "global_step": 244935, "epoch": 1457} {"train_loss": -11.620460510253906, "global_step": 244936, "epoch": 1457} {"train_loss": -11.593088150024414, "global_step": 244937, "epoch": 1457} {"train_loss": -11.526224136352539, "global_step": 244938, "epoch": 1457} {"train_loss": -11.378726959228516, "global_step": 244939, "epoch": 1457} {"train_loss": -11.624103546142578, "global_step": 244940, "epoch": 1457} {"train_loss": -11.525810241699219, "global_step": 244941, "epoch": 1457} {"train_loss": -11.536273002624512, "global_step": 244942, "epoch": 1457} {"train_loss": -11.099403162797293, "global_step": 244943, "epoch": 1457, "val_loss": 244590.9375} {"train_loss": -11.639595985412598, "global_step": 244944, "epoch": 1458} {"train_loss": -11.510309219360352, "global_step": 244945, "epoch": 1458} {"train_loss": -11.53182601928711, "global_step": 244946, "epoch": 1458} {"train_loss": -11.584336280822754, "global_step": 244947, "epoch": 1458} {"train_loss": -11.841133117675781, "global_step": 244948, "epoch": 1458} {"train_loss": -11.614923477172852, "global_step": 244949, "epoch": 1458} {"train_loss": -11.84439468383789, "global_step": 244950, "epoch": 1458} {"train_loss": -11.315435409545898, "global_step": 244951, "epoch": 1458} {"train_loss": -11.919322967529297, "global_step": 244952, "epoch": 1458} {"train_loss": -11.459105491638184, "global_step": 244953, "epoch": 1458} {"train_loss": -11.863346099853516, "global_step": 244954, "epoch": 1458} {"train_loss": -11.775652885437012, "global_step": 244955, "epoch": 1458} {"train_loss": -11.929368019104004, "global_step": 244956, "epoch": 1458} {"train_loss": -11.92287826538086, "global_step": 244957, "epoch": 1458} {"train_loss": -11.752754211425781, "global_step": 244958, "epoch": 1458} {"train_loss": -11.963123321533203, "global_step": 244959, "epoch": 1458} {"train_loss": -11.856088638305664, "global_step": 244960, "epoch": 1458} {"train_loss": -12.008543968200684, "global_step": 244961, "epoch": 1458} {"train_loss": -11.690052032470703, "global_step": 244962, "epoch": 1458} {"train_loss": -11.94515323638916, "global_step": 244963, "epoch": 1458} {"train_loss": -11.935676574707031, "global_step": 244964, "epoch": 1458} {"train_loss": -11.882301330566406, "global_step": 244965, "epoch": 1458} {"train_loss": -11.978422164916992, "global_step": 244966, "epoch": 1458} {"train_loss": -11.846307754516602, "global_step": 244967, "epoch": 1458} {"train_loss": -11.710199356079102, "global_step": 244968, "epoch": 1458} {"train_loss": -12.110885620117188, "global_step": 244969, "epoch": 1458} {"train_loss": -11.884103775024414, "global_step": 244970, "epoch": 1458} {"train_loss": -11.960027694702148, "global_step": 244971, "epoch": 1458} {"train_loss": -11.953910827636719, "global_step": 244972, "epoch": 1458} {"train_loss": -12.017581939697266, "global_step": 244973, "epoch": 1458} {"train_loss": -12.160322189331055, "global_step": 244974, "epoch": 1458} {"train_loss": -11.941746711730957, "global_step": 244975, "epoch": 1458} {"train_loss": -11.824283599853516, "global_step": 244976, "epoch": 1458} {"train_loss": -11.944110870361328, "global_step": 244977, "epoch": 1458} {"train_loss": -12.043560028076172, "global_step": 244978, "epoch": 1458} {"train_loss": -11.906412124633789, "global_step": 244979, "epoch": 1458} {"train_loss": -12.288118362426758, "global_step": 244980, "epoch": 1458} {"train_loss": -11.953657150268555, "global_step": 244981, "epoch": 1458} {"train_loss": -12.092970848083496, "global_step": 244982, "epoch": 1458} {"train_loss": -12.045711517333984, "global_step": 244983, "epoch": 1458} {"train_loss": -12.087268829345703, "global_step": 244984, "epoch": 1458} {"train_loss": -12.086483001708984, "global_step": 244985, "epoch": 1458} {"train_loss": -12.057918548583984, "global_step": 244986, "epoch": 1458} {"train_loss": -12.032271385192871, "global_step": 244987, "epoch": 1458} {"train_loss": -12.255083084106445, "global_step": 244988, "epoch": 1458} {"train_loss": -12.105766296386719, "global_step": 244989, "epoch": 1458} {"train_loss": -11.970266342163086, "global_step": 244990, "epoch": 1458} {"train_loss": -12.123503684997559, "global_step": 244991, "epoch": 1458} {"train_loss": -12.148868560791016, "global_step": 244992, "epoch": 1458} {"train_loss": -12.0980863571167, "global_step": 244993, "epoch": 1458} {"train_loss": -11.870107650756836, "global_step": 244994, "epoch": 1458} {"train_loss": -12.169840812683105, "global_step": 244995, "epoch": 1458} {"train_loss": -12.189460754394531, "global_step": 244996, "epoch": 1458} {"train_loss": -12.174816131591797, "global_step": 244997, "epoch": 1458} {"train_loss": -11.70285701751709, "global_step": 244998, "epoch": 1458} {"train_loss": -11.793872833251953, "global_step": 244999, "epoch": 1458} {"train_loss": -11.971046447753906, "global_step": 245000, "epoch": 1458} {"train_loss": -12.209650039672852, "global_step": 245001, "epoch": 1458} {"train_loss": -11.669029235839844, "global_step": 245002, "epoch": 1458} {"train_loss": -11.744636535644531, "global_step": 245003, "epoch": 1458} {"train_loss": -11.981992721557617, "global_step": 245004, "epoch": 1458} {"train_loss": -11.764547348022461, "global_step": 245005, "epoch": 1458} {"train_loss": -11.571599960327148, "global_step": 245006, "epoch": 1458} {"train_loss": -11.510830879211426, "global_step": 245007, "epoch": 1458} {"train_loss": -11.752544403076172, "global_step": 245008, "epoch": 1458} {"train_loss": -11.688713073730469, "global_step": 245009, "epoch": 1458} {"train_loss": -11.700796127319336, "global_step": 245010, "epoch": 1458} {"train_loss": -11.469481468200684, "global_step": 245011, "epoch": 1458} {"train_loss": -11.968976974487305, "global_step": 245012, "epoch": 1458} {"train_loss": -11.57169246673584, "global_step": 245013, "epoch": 1458} {"train_loss": -11.871160507202148, "global_step": 245014, "epoch": 1458} {"train_loss": -10.788198471069336, "global_step": 245015, "epoch": 1458} {"train_loss": -10.655134201049805, "global_step": 245016, "epoch": 1458} {"train_loss": -11.812492370605469, "global_step": 245017, "epoch": 1458} {"train_loss": -10.837337493896484, "global_step": 245018, "epoch": 1458} {"train_loss": -11.865560531616211, "global_step": 245019, "epoch": 1458} {"train_loss": -11.222955703735352, "global_step": 245020, "epoch": 1458} {"train_loss": -11.50791072845459, "global_step": 245021, "epoch": 1458} {"train_loss": -10.832603454589844, "global_step": 245022, "epoch": 1458} {"train_loss": -11.696125030517578, "global_step": 245023, "epoch": 1458} {"train_loss": -10.833654403686523, "global_step": 245024, "epoch": 1458} {"train_loss": -10.727036476135254, "global_step": 245025, "epoch": 1458} {"train_loss": -10.744906425476074, "global_step": 245026, "epoch": 1458} {"train_loss": -10.10798454284668, "global_step": 245027, "epoch": 1458} {"train_loss": -11.045005798339844, "global_step": 245028, "epoch": 1458} {"train_loss": -10.004517555236816, "global_step": 245029, "epoch": 1458} {"train_loss": -11.032832145690918, "global_step": 245030, "epoch": 1458} {"train_loss": -10.506478309631348, "global_step": 245031, "epoch": 1458} {"train_loss": -10.796187400817871, "global_step": 245032, "epoch": 1458} {"train_loss": -11.20807933807373, "global_step": 245033, "epoch": 1458} {"train_loss": -11.140954971313477, "global_step": 245034, "epoch": 1458} {"train_loss": -11.421708106994629, "global_step": 245035, "epoch": 1458} {"train_loss": -11.083908081054688, "global_step": 245036, "epoch": 1458} {"train_loss": -10.420151710510254, "global_step": 245037, "epoch": 1458} {"train_loss": -11.105932235717773, "global_step": 245038, "epoch": 1458} {"train_loss": -11.216879844665527, "global_step": 245039, "epoch": 1458} {"train_loss": -10.59600830078125, "global_step": 245040, "epoch": 1458} {"train_loss": -11.80282974243164, "global_step": 245041, "epoch": 1458} {"train_loss": -10.838809967041016, "global_step": 245042, "epoch": 1458} {"train_loss": -11.445502281188965, "global_step": 245043, "epoch": 1458} {"train_loss": -10.784568786621094, "global_step": 245044, "epoch": 1458} {"train_loss": -11.259584426879883, "global_step": 245045, "epoch": 1458} {"train_loss": -11.283113479614258, "global_step": 245046, "epoch": 1458} {"train_loss": -11.23315715789795, "global_step": 245047, "epoch": 1458} {"train_loss": -10.973995208740234, "global_step": 245048, "epoch": 1458} {"train_loss": -11.675766944885254, "global_step": 245049, "epoch": 1458} {"train_loss": -10.92414665222168, "global_step": 245050, "epoch": 1458} {"train_loss": -11.380697250366211, "global_step": 245051, "epoch": 1458} {"train_loss": -10.624432563781738, "global_step": 245052, "epoch": 1458} {"train_loss": -11.484415054321289, "global_step": 245053, "epoch": 1458} {"train_loss": -11.188647270202637, "global_step": 245054, "epoch": 1458} {"train_loss": -11.439273834228516, "global_step": 245055, "epoch": 1458} {"train_loss": -11.40040397644043, "global_step": 245056, "epoch": 1458} {"train_loss": -11.396461486816406, "global_step": 245057, "epoch": 1458} {"train_loss": -11.616645812988281, "global_step": 245058, "epoch": 1458} {"train_loss": -11.132919311523438, "global_step": 245059, "epoch": 1458} {"train_loss": -11.676921844482422, "global_step": 245060, "epoch": 1458} {"train_loss": -11.796815872192383, "global_step": 245061, "epoch": 1458} {"train_loss": -11.435707092285156, "global_step": 245062, "epoch": 1458} {"train_loss": -11.892725944519043, "global_step": 245063, "epoch": 1458} {"train_loss": -11.432151794433594, "global_step": 245064, "epoch": 1458} {"train_loss": -11.79195785522461, "global_step": 245065, "epoch": 1458} {"train_loss": -11.775667190551758, "global_step": 245066, "epoch": 1458} {"train_loss": -11.629284858703613, "global_step": 245067, "epoch": 1458} {"train_loss": -11.773697853088379, "global_step": 245068, "epoch": 1458} {"train_loss": -11.803262710571289, "global_step": 245069, "epoch": 1458} {"train_loss": -11.613203048706055, "global_step": 245070, "epoch": 1458} {"train_loss": -11.630345344543457, "global_step": 245071, "epoch": 1458} {"train_loss": -11.560396194458008, "global_step": 245072, "epoch": 1458} {"train_loss": -11.968267440795898, "global_step": 245073, "epoch": 1458} {"train_loss": -11.552462577819824, "global_step": 245074, "epoch": 1458} {"train_loss": -11.714345932006836, "global_step": 245075, "epoch": 1458} {"train_loss": -12.006783485412598, "global_step": 245076, "epoch": 1458} {"train_loss": -11.763675689697266, "global_step": 245077, "epoch": 1458} {"train_loss": -11.886306762695312, "global_step": 245078, "epoch": 1458} {"train_loss": -11.721918106079102, "global_step": 245079, "epoch": 1458} {"train_loss": -11.819281578063965, "global_step": 245080, "epoch": 1458} {"train_loss": -11.865406036376953, "global_step": 245081, "epoch": 1458} {"train_loss": -11.882909774780273, "global_step": 245082, "epoch": 1458} {"train_loss": -12.058236122131348, "global_step": 245083, "epoch": 1458} {"train_loss": -11.942639350891113, "global_step": 245084, "epoch": 1458} {"train_loss": -11.936270713806152, "global_step": 245085, "epoch": 1458} {"train_loss": -11.952239036560059, "global_step": 245086, "epoch": 1458} {"train_loss": -11.591468811035156, "global_step": 245087, "epoch": 1458} {"train_loss": -11.906745910644531, "global_step": 245088, "epoch": 1458} {"train_loss": -11.99429988861084, "global_step": 245089, "epoch": 1458} {"train_loss": -12.066097259521484, "global_step": 245090, "epoch": 1458} {"train_loss": -11.709393501281738, "global_step": 245091, "epoch": 1458} {"train_loss": -11.997852325439453, "global_step": 245092, "epoch": 1458} {"train_loss": -11.976963996887207, "global_step": 245093, "epoch": 1458} {"train_loss": -12.149012565612793, "global_step": 245094, "epoch": 1458} {"train_loss": -11.870018005371094, "global_step": 245095, "epoch": 1458} {"train_loss": -12.035078048706055, "global_step": 245096, "epoch": 1458} {"train_loss": -11.783380508422852, "global_step": 245097, "epoch": 1458} {"train_loss": -11.623276710510254, "global_step": 245098, "epoch": 1458} {"train_loss": -12.022205352783203, "global_step": 245099, "epoch": 1458} {"train_loss": -11.996345520019531, "global_step": 245100, "epoch": 1458} {"train_loss": -11.614095687866211, "global_step": 245101, "epoch": 1458} {"train_loss": -11.986593246459961, "global_step": 245102, "epoch": 1458} {"train_loss": -11.996841430664062, "global_step": 245103, "epoch": 1458} {"train_loss": -12.073460578918457, "global_step": 245104, "epoch": 1458} {"train_loss": -11.934076309204102, "global_step": 245105, "epoch": 1458} {"train_loss": -11.908712387084961, "global_step": 245106, "epoch": 1458} {"train_loss": -12.016386032104492, "global_step": 245107, "epoch": 1458} {"train_loss": -11.95564079284668, "global_step": 245108, "epoch": 1458} {"train_loss": -11.637929916381836, "global_step": 245109, "epoch": 1458} {"train_loss": -11.788124084472656, "global_step": 245110, "epoch": 1458} {"train_loss": -11.657178146498543, "global_step": 245111, "epoch": 1458, "val_loss": 262535.40625} {"train_loss": -11.632179260253906, "global_step": 245112, "epoch": 1459} {"train_loss": -11.046716690063477, "global_step": 245113, "epoch": 1459} {"train_loss": -11.49228572845459, "global_step": 245114, "epoch": 1459} {"train_loss": -11.223188400268555, "global_step": 245115, "epoch": 1459} {"train_loss": -11.21615219116211, "global_step": 245116, "epoch": 1459} {"train_loss": -11.207979202270508, "global_step": 245117, "epoch": 1459} {"train_loss": -10.7528076171875, "global_step": 245118, "epoch": 1459} {"train_loss": -11.788564682006836, "global_step": 245119, "epoch": 1459} {"train_loss": -10.514250755310059, "global_step": 245120, "epoch": 1459} {"train_loss": -11.32935905456543, "global_step": 245121, "epoch": 1459} {"train_loss": -11.262528419494629, "global_step": 245122, "epoch": 1459} {"train_loss": -11.716681480407715, "global_step": 245123, "epoch": 1459} {"train_loss": -11.285484313964844, "global_step": 245124, "epoch": 1459} {"train_loss": -11.365524291992188, "global_step": 245125, "epoch": 1459} {"train_loss": -11.499818801879883, "global_step": 245126, "epoch": 1459} {"train_loss": -11.105772972106934, "global_step": 245127, "epoch": 1459} {"train_loss": -11.923881530761719, "global_step": 245128, "epoch": 1459} {"train_loss": -11.31312370300293, "global_step": 245129, "epoch": 1459} {"train_loss": -11.478631973266602, "global_step": 245130, "epoch": 1459} {"train_loss": -11.51552963256836, "global_step": 245131, "epoch": 1459} {"train_loss": -11.552687644958496, "global_step": 245132, "epoch": 1459} {"train_loss": -11.058185577392578, "global_step": 245133, "epoch": 1459} {"train_loss": -11.265914916992188, "global_step": 245134, "epoch": 1459} {"train_loss": -10.913725852966309, "global_step": 245135, "epoch": 1459} {"train_loss": -11.653021812438965, "global_step": 245136, "epoch": 1459} {"train_loss": -10.558122634887695, "global_step": 245137, "epoch": 1459} {"train_loss": -11.565147399902344, "global_step": 245138, "epoch": 1459} {"train_loss": -11.103471755981445, "global_step": 245139, "epoch": 1459} {"train_loss": -11.473419189453125, "global_step": 245140, "epoch": 1459} {"train_loss": -11.715667724609375, "global_step": 245141, "epoch": 1459} {"train_loss": -10.989578247070312, "global_step": 245142, "epoch": 1459} {"train_loss": -11.52963638305664, "global_step": 245143, "epoch": 1459} {"train_loss": -11.074798583984375, "global_step": 245144, "epoch": 1459} {"train_loss": -11.560481071472168, "global_step": 245145, "epoch": 1459} {"train_loss": -11.39441204071045, "global_step": 245146, "epoch": 1459} {"train_loss": -11.133581161499023, "global_step": 245147, "epoch": 1459} {"train_loss": -11.677310943603516, "global_step": 245148, "epoch": 1459} {"train_loss": -11.537191390991211, "global_step": 245149, "epoch": 1459} {"train_loss": -11.575550079345703, "global_step": 245150, "epoch": 1459} {"train_loss": -11.249340057373047, "global_step": 245151, "epoch": 1459} {"train_loss": -11.632328987121582, "global_step": 245152, "epoch": 1459} {"train_loss": -11.535896301269531, "global_step": 245153, "epoch": 1459} {"train_loss": -11.6814546585083, "global_step": 245154, "epoch": 1459} {"train_loss": -11.525314331054688, "global_step": 245155, "epoch": 1459} {"train_loss": -11.501373291015625, "global_step": 245156, "epoch": 1459} {"train_loss": -11.60529899597168, "global_step": 245157, "epoch": 1459} {"train_loss": -11.428292274475098, "global_step": 245158, "epoch": 1459} {"train_loss": -11.776966094970703, "global_step": 245159, "epoch": 1459} {"train_loss": -11.484113693237305, "global_step": 245160, "epoch": 1459} {"train_loss": -11.691758155822754, "global_step": 245161, "epoch": 1459} {"train_loss": -11.62983512878418, "global_step": 245162, "epoch": 1459} {"train_loss": -11.46648120880127, "global_step": 245163, "epoch": 1459} {"train_loss": -11.803723335266113, "global_step": 245164, "epoch": 1459} {"train_loss": -11.404298782348633, "global_step": 245165, "epoch": 1459} {"train_loss": -11.877224922180176, "global_step": 245166, "epoch": 1459} {"train_loss": -11.588807106018066, "global_step": 245167, "epoch": 1459} {"train_loss": -11.840890884399414, "global_step": 245168, "epoch": 1459} {"train_loss": -11.739376068115234, "global_step": 245169, "epoch": 1459} {"train_loss": -11.841161727905273, "global_step": 245170, "epoch": 1459} {"train_loss": -11.862422943115234, "global_step": 245171, "epoch": 1459} {"train_loss": -11.962455749511719, "global_step": 245172, "epoch": 1459} {"train_loss": -11.789180755615234, "global_step": 245173, "epoch": 1459} {"train_loss": -11.717487335205078, "global_step": 245174, "epoch": 1459} {"train_loss": -11.594320297241211, "global_step": 245175, "epoch": 1459} {"train_loss": -11.792322158813477, "global_step": 245176, "epoch": 1459} {"train_loss": -11.86029052734375, "global_step": 245177, "epoch": 1459} {"train_loss": -11.73837661743164, "global_step": 245178, "epoch": 1459} {"train_loss": -11.851190567016602, "global_step": 245179, "epoch": 1459} {"train_loss": -11.864973068237305, "global_step": 245180, "epoch": 1459} {"train_loss": -11.820964813232422, "global_step": 245181, "epoch": 1459} {"train_loss": -11.809365272521973, "global_step": 245182, "epoch": 1459} {"train_loss": -11.577629089355469, "global_step": 245183, "epoch": 1459} {"train_loss": -11.479581832885742, "global_step": 245184, "epoch": 1459} {"train_loss": -11.847122192382812, "global_step": 245185, "epoch": 1459} {"train_loss": -11.969902038574219, "global_step": 245186, "epoch": 1459} {"train_loss": -11.96708869934082, "global_step": 245187, "epoch": 1459} {"train_loss": -11.894403457641602, "global_step": 245188, "epoch": 1459} {"train_loss": -12.00589370727539, "global_step": 245189, "epoch": 1459} {"train_loss": -11.981192588806152, "global_step": 245190, "epoch": 1459} {"train_loss": -12.142768859863281, "global_step": 245191, "epoch": 1459} {"train_loss": -12.176344871520996, "global_step": 245192, "epoch": 1459} {"train_loss": -11.72751522064209, "global_step": 245193, "epoch": 1459} {"train_loss": -12.129932403564453, "global_step": 245194, "epoch": 1459} {"train_loss": -11.956615447998047, "global_step": 245195, "epoch": 1459} {"train_loss": -11.972110748291016, "global_step": 245196, "epoch": 1459} {"train_loss": -12.020856857299805, "global_step": 245197, "epoch": 1459} {"train_loss": -11.853804588317871, "global_step": 245198, "epoch": 1459} {"train_loss": -11.730667114257812, "global_step": 245199, "epoch": 1459} {"train_loss": -12.02467155456543, "global_step": 245200, "epoch": 1459} {"train_loss": -11.760759353637695, "global_step": 245201, "epoch": 1459} {"train_loss": -12.168444633483887, "global_step": 245202, "epoch": 1459} {"train_loss": -11.924272537231445, "global_step": 245203, "epoch": 1459} {"train_loss": -12.065348625183105, "global_step": 245204, "epoch": 1459} {"train_loss": -12.081539154052734, "global_step": 245205, "epoch": 1459} {"train_loss": -11.887190818786621, "global_step": 245206, "epoch": 1459} {"train_loss": -11.96314525604248, "global_step": 245207, "epoch": 1459} {"train_loss": -11.980690002441406, "global_step": 245208, "epoch": 1459} {"train_loss": -12.09106731414795, "global_step": 245209, "epoch": 1459} {"train_loss": -11.985633850097656, "global_step": 245210, "epoch": 1459} {"train_loss": -11.750280380249023, "global_step": 245211, "epoch": 1459} {"train_loss": -12.425107955932617, "global_step": 245212, "epoch": 1459} {"train_loss": -12.082436561584473, "global_step": 245213, "epoch": 1459} {"train_loss": -11.844097137451172, "global_step": 245214, "epoch": 1459} {"train_loss": -12.142427444458008, "global_step": 245215, "epoch": 1459} {"train_loss": -12.021133422851562, "global_step": 245216, "epoch": 1459} {"train_loss": -11.516717910766602, "global_step": 245217, "epoch": 1459} {"train_loss": -11.632339477539062, "global_step": 245218, "epoch": 1459} {"train_loss": -11.37236213684082, "global_step": 245219, "epoch": 1459} {"train_loss": -11.382756233215332, "global_step": 245220, "epoch": 1459} {"train_loss": -11.410818099975586, "global_step": 245221, "epoch": 1459} {"train_loss": -12.008223533630371, "global_step": 245222, "epoch": 1459} {"train_loss": -11.426416397094727, "global_step": 245223, "epoch": 1459} {"train_loss": -11.629301071166992, "global_step": 245224, "epoch": 1459} {"train_loss": -11.64482307434082, "global_step": 245225, "epoch": 1459} {"train_loss": -11.156694412231445, "global_step": 245226, "epoch": 1459} {"train_loss": -11.351568222045898, "global_step": 245227, "epoch": 1459} {"train_loss": -11.358562469482422, "global_step": 245228, "epoch": 1459} {"train_loss": -11.881256103515625, "global_step": 245229, "epoch": 1459} {"train_loss": -11.63715934753418, "global_step": 245230, "epoch": 1459} {"train_loss": -11.71172046661377, "global_step": 245231, "epoch": 1459} {"train_loss": -11.20422077178955, "global_step": 245232, "epoch": 1459} {"train_loss": -11.386595726013184, "global_step": 245233, "epoch": 1459} {"train_loss": -11.64815902709961, "global_step": 245234, "epoch": 1459} {"train_loss": -11.053960800170898, "global_step": 245235, "epoch": 1459} {"train_loss": -10.64143180847168, "global_step": 245236, "epoch": 1459} {"train_loss": -11.762849807739258, "global_step": 245237, "epoch": 1459} {"train_loss": -11.302437782287598, "global_step": 245238, "epoch": 1459} {"train_loss": -10.653337478637695, "global_step": 245239, "epoch": 1459} {"train_loss": -11.1368408203125, "global_step": 245240, "epoch": 1459} {"train_loss": -11.509063720703125, "global_step": 245241, "epoch": 1459} {"train_loss": -11.44645881652832, "global_step": 245242, "epoch": 1459} {"train_loss": -11.54101276397705, "global_step": 245243, "epoch": 1459} {"train_loss": -11.499332427978516, "global_step": 245244, "epoch": 1459} {"train_loss": -11.237608909606934, "global_step": 245245, "epoch": 1459} {"train_loss": -11.730947494506836, "global_step": 245246, "epoch": 1459} {"train_loss": -11.770553588867188, "global_step": 245247, "epoch": 1459} {"train_loss": -11.516190528869629, "global_step": 245248, "epoch": 1459} {"train_loss": -11.556118965148926, "global_step": 245249, "epoch": 1459} {"train_loss": -10.956581115722656, "global_step": 245250, "epoch": 1459} {"train_loss": -9.130023956298828, "global_step": 245251, "epoch": 1459} {"train_loss": -12.052433013916016, "global_step": 245252, "epoch": 1459} {"train_loss": -10.392046928405762, "global_step": 245253, "epoch": 1459} {"train_loss": -10.851655006408691, "global_step": 245254, "epoch": 1459} {"train_loss": -10.907729148864746, "global_step": 245255, "epoch": 1459} {"train_loss": -10.690652847290039, "global_step": 245256, "epoch": 1459} {"train_loss": -10.33985710144043, "global_step": 245257, "epoch": 1459} {"train_loss": -10.922552108764648, "global_step": 245258, "epoch": 1459} {"train_loss": -11.0765380859375, "global_step": 245259, "epoch": 1459} {"train_loss": -11.133599281311035, "global_step": 245260, "epoch": 1459} {"train_loss": -10.909887313842773, "global_step": 245261, "epoch": 1459} {"train_loss": -11.074127197265625, "global_step": 245262, "epoch": 1459} {"train_loss": -11.197260856628418, "global_step": 245263, "epoch": 1459} {"train_loss": -11.294870376586914, "global_step": 245264, "epoch": 1459} {"train_loss": -10.481095314025879, "global_step": 245265, "epoch": 1459} {"train_loss": -11.217658996582031, "global_step": 245266, "epoch": 1459} {"train_loss": -10.363327026367188, "global_step": 245267, "epoch": 1459} {"train_loss": -10.732288360595703, "global_step": 245268, "epoch": 1459} {"train_loss": -10.757271766662598, "global_step": 245269, "epoch": 1459} {"train_loss": -10.99307632446289, "global_step": 245270, "epoch": 1459} {"train_loss": -10.930097579956055, "global_step": 245271, "epoch": 1459} {"train_loss": -11.072182655334473, "global_step": 245272, "epoch": 1459} {"train_loss": -11.349577903747559, "global_step": 245273, "epoch": 1459} {"train_loss": -10.850967407226562, "global_step": 245274, "epoch": 1459} {"train_loss": -11.526561737060547, "global_step": 245275, "epoch": 1459} {"train_loss": -10.94474983215332, "global_step": 245276, "epoch": 1459} {"train_loss": -11.594554901123047, "global_step": 245277, "epoch": 1459} {"train_loss": -11.41110610961914, "global_step": 245278, "epoch": 1459} {"train_loss": -11.481977059727623, "global_step": 245279, "epoch": 1459, "val_loss": 266542.15625} {"train_loss": -10.406169891357422, "global_step": 245280, "epoch": 1460} {"train_loss": -11.44094181060791, "global_step": 245281, "epoch": 1460} {"train_loss": -10.961836814880371, "global_step": 245282, "epoch": 1460} {"train_loss": -11.549755096435547, "global_step": 245283, "epoch": 1460} {"train_loss": -11.013254165649414, "global_step": 245284, "epoch": 1460} {"train_loss": -11.397078514099121, "global_step": 245285, "epoch": 1460} {"train_loss": -11.346830368041992, "global_step": 245286, "epoch": 1460} {"train_loss": -11.578057289123535, "global_step": 245287, "epoch": 1460} {"train_loss": -11.192203521728516, "global_step": 245288, "epoch": 1460} {"train_loss": -11.725640296936035, "global_step": 245289, "epoch": 1460} {"train_loss": -10.831887245178223, "global_step": 245290, "epoch": 1460} {"train_loss": -11.767688751220703, "global_step": 245291, "epoch": 1460} {"train_loss": -11.236344337463379, "global_step": 245292, "epoch": 1460} {"train_loss": -11.426243782043457, "global_step": 245293, "epoch": 1460} {"train_loss": -11.361735343933105, "global_step": 245294, "epoch": 1460} {"train_loss": -11.539726257324219, "global_step": 245295, "epoch": 1460} {"train_loss": -11.2008056640625, "global_step": 245296, "epoch": 1460} {"train_loss": -11.64307975769043, "global_step": 245297, "epoch": 1460} {"train_loss": -11.417509078979492, "global_step": 245298, "epoch": 1460} {"train_loss": -11.479776382446289, "global_step": 245299, "epoch": 1460} {"train_loss": -11.429569244384766, "global_step": 245300, "epoch": 1460} {"train_loss": -11.56596851348877, "global_step": 245301, "epoch": 1460} {"train_loss": -11.605088233947754, "global_step": 245302, "epoch": 1460} {"train_loss": -11.583958625793457, "global_step": 245303, "epoch": 1460} {"train_loss": -11.830955505371094, "global_step": 245304, "epoch": 1460} {"train_loss": -11.516801834106445, "global_step": 245305, "epoch": 1460} {"train_loss": -11.711719512939453, "global_step": 245306, "epoch": 1460} {"train_loss": -11.653176307678223, "global_step": 245307, "epoch": 1460} {"train_loss": -12.048559188842773, "global_step": 245308, "epoch": 1460} {"train_loss": -11.492515563964844, "global_step": 245309, "epoch": 1460} {"train_loss": -11.671468734741211, "global_step": 245310, "epoch": 1460} {"train_loss": -11.9920654296875, "global_step": 245311, "epoch": 1460} {"train_loss": -11.450175285339355, "global_step": 245312, "epoch": 1460} {"train_loss": -11.864421844482422, "global_step": 245313, "epoch": 1460} {"train_loss": -11.69017219543457, "global_step": 245314, "epoch": 1460} {"train_loss": -11.897794723510742, "global_step": 245315, "epoch": 1460} {"train_loss": -11.844244003295898, "global_step": 245316, "epoch": 1460} {"train_loss": -11.768061637878418, "global_step": 245317, "epoch": 1460} {"train_loss": -11.849685668945312, "global_step": 245318, "epoch": 1460} {"train_loss": -11.69599723815918, "global_step": 245319, "epoch": 1460} {"train_loss": -12.032343864440918, "global_step": 245320, "epoch": 1460} {"train_loss": -11.613286972045898, "global_step": 245321, "epoch": 1460} {"train_loss": -12.000675201416016, "global_step": 245322, "epoch": 1460} {"train_loss": -11.78976058959961, "global_step": 245323, "epoch": 1460} {"train_loss": -11.792739868164062, "global_step": 245324, "epoch": 1460} {"train_loss": -12.029132843017578, "global_step": 245325, "epoch": 1460} {"train_loss": -11.81096076965332, "global_step": 245326, "epoch": 1460} {"train_loss": -12.16555404663086, "global_step": 245327, "epoch": 1460} {"train_loss": -11.938145637512207, "global_step": 245328, "epoch": 1460} {"train_loss": -12.064428329467773, "global_step": 245329, "epoch": 1460} {"train_loss": -11.85464859008789, "global_step": 245330, "epoch": 1460} {"train_loss": -12.016355514526367, "global_step": 245331, "epoch": 1460} {"train_loss": -11.847230911254883, "global_step": 245332, "epoch": 1460} {"train_loss": -11.975791931152344, "global_step": 245333, "epoch": 1460} {"train_loss": -12.018415451049805, "global_step": 245334, "epoch": 1460} {"train_loss": -11.958181381225586, "global_step": 245335, "epoch": 1460} {"train_loss": -11.90732192993164, "global_step": 245336, "epoch": 1460} {"train_loss": -12.04550552368164, "global_step": 245337, "epoch": 1460} {"train_loss": -12.127606391906738, "global_step": 245338, "epoch": 1460} {"train_loss": -11.955022811889648, "global_step": 245339, "epoch": 1460} {"train_loss": -11.908219337463379, "global_step": 245340, "epoch": 1460} {"train_loss": -12.0092191696167, "global_step": 245341, "epoch": 1460} {"train_loss": -11.733784675598145, "global_step": 245342, "epoch": 1460} {"train_loss": -11.953333854675293, "global_step": 245343, "epoch": 1460} {"train_loss": -11.493049621582031, "global_step": 245344, "epoch": 1460} {"train_loss": -12.010438919067383, "global_step": 245345, "epoch": 1460} {"train_loss": -11.800566673278809, "global_step": 245346, "epoch": 1460} {"train_loss": -11.802787780761719, "global_step": 245347, "epoch": 1460} {"train_loss": -11.875970840454102, "global_step": 245348, "epoch": 1460} {"train_loss": -11.988006591796875, "global_step": 245349, "epoch": 1460} {"train_loss": -11.91682243347168, "global_step": 245350, "epoch": 1460} {"train_loss": -12.161137580871582, "global_step": 245351, "epoch": 1460} {"train_loss": -11.968137741088867, "global_step": 245352, "epoch": 1460} {"train_loss": -11.619458198547363, "global_step": 245353, "epoch": 1460} {"train_loss": -12.153168678283691, "global_step": 245354, "epoch": 1460} {"train_loss": -11.865938186645508, "global_step": 245355, "epoch": 1460} {"train_loss": -11.742610931396484, "global_step": 245356, "epoch": 1460} {"train_loss": -11.25482177734375, "global_step": 245357, "epoch": 1460} {"train_loss": -12.327256202697754, "global_step": 245358, "epoch": 1460} {"train_loss": -11.022335052490234, "global_step": 245359, "epoch": 1460} {"train_loss": -11.694513320922852, "global_step": 245360, "epoch": 1460} {"train_loss": -11.952244758605957, "global_step": 245361, "epoch": 1460} {"train_loss": -10.91187858581543, "global_step": 245362, "epoch": 1460} {"train_loss": -11.462413787841797, "global_step": 245363, "epoch": 1460} {"train_loss": -11.84829330444336, "global_step": 245364, "epoch": 1460} {"train_loss": -10.704170227050781, "global_step": 245365, "epoch": 1460} {"train_loss": -10.733110427856445, "global_step": 245366, "epoch": 1460} {"train_loss": -11.09368896484375, "global_step": 245367, "epoch": 1460} {"train_loss": -10.120573997497559, "global_step": 245368, "epoch": 1460} {"train_loss": -11.391249656677246, "global_step": 245369, "epoch": 1460} {"train_loss": -10.00332260131836, "global_step": 245370, "epoch": 1460} {"train_loss": -10.938529968261719, "global_step": 245371, "epoch": 1460} {"train_loss": -11.173640251159668, "global_step": 245372, "epoch": 1460} {"train_loss": -10.749484062194824, "global_step": 245373, "epoch": 1460} {"train_loss": -11.620454788208008, "global_step": 245374, "epoch": 1460} {"train_loss": -11.130561828613281, "global_step": 245375, "epoch": 1460} {"train_loss": -11.70910930633545, "global_step": 245376, "epoch": 1460} {"train_loss": -11.496673583984375, "global_step": 245377, "epoch": 1460} {"train_loss": -11.831082344055176, "global_step": 245378, "epoch": 1460} {"train_loss": -11.519439697265625, "global_step": 245379, "epoch": 1460} {"train_loss": -11.467024803161621, "global_step": 245380, "epoch": 1460} {"train_loss": -11.464102745056152, "global_step": 245381, "epoch": 1460} {"train_loss": -11.54854965209961, "global_step": 245382, "epoch": 1460} {"train_loss": -11.629415512084961, "global_step": 245383, "epoch": 1460} {"train_loss": -11.454673767089844, "global_step": 245384, "epoch": 1460} {"train_loss": -11.4788818359375, "global_step": 245385, "epoch": 1460} {"train_loss": -11.342912673950195, "global_step": 245386, "epoch": 1460} {"train_loss": -11.135897636413574, "global_step": 245387, "epoch": 1460} {"train_loss": -11.297481536865234, "global_step": 245388, "epoch": 1460} {"train_loss": -11.612900733947754, "global_step": 245389, "epoch": 1460} {"train_loss": -11.698837280273438, "global_step": 245390, "epoch": 1460} {"train_loss": -11.18075942993164, "global_step": 245391, "epoch": 1460} {"train_loss": -11.727897644042969, "global_step": 245392, "epoch": 1460} {"train_loss": -11.414176940917969, "global_step": 245393, "epoch": 1460} {"train_loss": -11.837576866149902, "global_step": 245394, "epoch": 1460} {"train_loss": -11.806241035461426, "global_step": 245395, "epoch": 1460} {"train_loss": -11.740909576416016, "global_step": 245396, "epoch": 1460} {"train_loss": -11.783929824829102, "global_step": 245397, "epoch": 1460} {"train_loss": -12.117706298828125, "global_step": 245398, "epoch": 1460} {"train_loss": -11.860001564025879, "global_step": 245399, "epoch": 1460} {"train_loss": -11.670537948608398, "global_step": 245400, "epoch": 1460} {"train_loss": -11.980524063110352, "global_step": 245401, "epoch": 1460} {"train_loss": -11.38599967956543, "global_step": 245402, "epoch": 1460} {"train_loss": -11.975357055664062, "global_step": 245403, "epoch": 1460} {"train_loss": -11.309331893920898, "global_step": 245404, "epoch": 1460} {"train_loss": -11.682830810546875, "global_step": 245405, "epoch": 1460} {"train_loss": -11.870697021484375, "global_step": 245406, "epoch": 1460} {"train_loss": -11.558817863464355, "global_step": 245407, "epoch": 1460} {"train_loss": -11.846888542175293, "global_step": 245408, "epoch": 1460} {"train_loss": -11.551469802856445, "global_step": 245409, "epoch": 1460} {"train_loss": -11.313217163085938, "global_step": 245410, "epoch": 1460} {"train_loss": -11.775787353515625, "global_step": 245411, "epoch": 1460} {"train_loss": -11.749191284179688, "global_step": 245412, "epoch": 1460} {"train_loss": -11.761762619018555, "global_step": 245413, "epoch": 1460} {"train_loss": -11.432241439819336, "global_step": 245414, "epoch": 1460} {"train_loss": -11.364705085754395, "global_step": 245415, "epoch": 1460} {"train_loss": -11.826215744018555, "global_step": 245416, "epoch": 1460} {"train_loss": -11.638025283813477, "global_step": 245417, "epoch": 1460} {"train_loss": -11.557048797607422, "global_step": 245418, "epoch": 1460} {"train_loss": -11.360509872436523, "global_step": 245419, "epoch": 1460} {"train_loss": -11.627941131591797, "global_step": 245420, "epoch": 1460} {"train_loss": -11.661985397338867, "global_step": 245421, "epoch": 1460} {"train_loss": -11.883563041687012, "global_step": 245422, "epoch": 1460} {"train_loss": -11.3270902633667, "global_step": 245423, "epoch": 1460} {"train_loss": -11.643220901489258, "global_step": 245424, "epoch": 1460} {"train_loss": -11.210533142089844, "global_step": 245425, "epoch": 1460} {"train_loss": -11.781990051269531, "global_step": 245426, "epoch": 1460} {"train_loss": -11.210086822509766, "global_step": 245427, "epoch": 1460} {"train_loss": -11.328813552856445, "global_step": 245428, "epoch": 1460} {"train_loss": -11.695363998413086, "global_step": 245429, "epoch": 1460} {"train_loss": -11.853083610534668, "global_step": 245430, "epoch": 1460} {"train_loss": -11.562360763549805, "global_step": 245431, "epoch": 1460} {"train_loss": -11.825159072875977, "global_step": 245432, "epoch": 1460} {"train_loss": -11.201118469238281, "global_step": 245433, "epoch": 1460} {"train_loss": -11.631662368774414, "global_step": 245434, "epoch": 1460} {"train_loss": -11.61259651184082, "global_step": 245435, "epoch": 1460} {"train_loss": -11.382316589355469, "global_step": 245436, "epoch": 1460} {"train_loss": -11.811243057250977, "global_step": 245437, "epoch": 1460} {"train_loss": -11.66246509552002, "global_step": 245438, "epoch": 1460} {"train_loss": -11.68106460571289, "global_step": 245439, "epoch": 1460} {"train_loss": -11.70766830444336, "global_step": 245440, "epoch": 1460} {"train_loss": -11.670003890991211, "global_step": 245441, "epoch": 1460} {"train_loss": -12.004817008972168, "global_step": 245442, "epoch": 1460} {"train_loss": -11.949934005737305, "global_step": 245443, "epoch": 1460} {"train_loss": -11.642948150634766, "global_step": 245444, "epoch": 1460} {"train_loss": -11.83402156829834, "global_step": 245445, "epoch": 1460} {"train_loss": -12.131094932556152, "global_step": 245446, "epoch": 1460} {"train_loss": -11.611314438638233, "global_step": 245447, "epoch": 1460, "val_loss": 269086.59375, "train_action_mse_error": 2.2735610008239746} {"train_loss": -11.802639961242676, "global_step": 245448, "epoch": 1461} {"train_loss": -11.913667678833008, "global_step": 245449, "epoch": 1461} {"train_loss": -11.93833065032959, "global_step": 245450, "epoch": 1461} {"train_loss": -11.643056869506836, "global_step": 245451, "epoch": 1461} {"train_loss": -12.027915954589844, "global_step": 245452, "epoch": 1461} {"train_loss": -12.12893295288086, "global_step": 245453, "epoch": 1461} {"train_loss": -11.92223072052002, "global_step": 245454, "epoch": 1461} {"train_loss": -12.03857135772705, "global_step": 245455, "epoch": 1461} {"train_loss": -11.849428176879883, "global_step": 245456, "epoch": 1461} {"train_loss": -11.936971664428711, "global_step": 245457, "epoch": 1461} {"train_loss": -11.945072174072266, "global_step": 245458, "epoch": 1461} {"train_loss": -12.090808868408203, "global_step": 245459, "epoch": 1461} {"train_loss": -11.816152572631836, "global_step": 245460, "epoch": 1461} {"train_loss": -11.614105224609375, "global_step": 245461, "epoch": 1461} {"train_loss": -11.697254180908203, "global_step": 245462, "epoch": 1461} {"train_loss": -11.79270076751709, "global_step": 245463, "epoch": 1461} {"train_loss": -11.699777603149414, "global_step": 245464, "epoch": 1461} {"train_loss": -11.83230209350586, "global_step": 245465, "epoch": 1461} {"train_loss": -11.491655349731445, "global_step": 245466, "epoch": 1461} {"train_loss": -11.969432830810547, "global_step": 245467, "epoch": 1461} {"train_loss": -11.350770950317383, "global_step": 245468, "epoch": 1461} {"train_loss": -11.648260116577148, "global_step": 245469, "epoch": 1461} {"train_loss": -11.679954528808594, "global_step": 245470, "epoch": 1461} {"train_loss": -11.710511207580566, "global_step": 245471, "epoch": 1461} {"train_loss": -11.224637031555176, "global_step": 245472, "epoch": 1461} {"train_loss": -11.56572151184082, "global_step": 245473, "epoch": 1461} {"train_loss": -11.18417739868164, "global_step": 245474, "epoch": 1461} {"train_loss": -11.509881019592285, "global_step": 245475, "epoch": 1461} {"train_loss": -11.796566009521484, "global_step": 245476, "epoch": 1461} {"train_loss": -11.298871040344238, "global_step": 245477, "epoch": 1461} {"train_loss": -11.921707153320312, "global_step": 245478, "epoch": 1461} {"train_loss": -11.474936485290527, "global_step": 245479, "epoch": 1461} {"train_loss": -11.604654312133789, "global_step": 245480, "epoch": 1461} {"train_loss": -11.554327011108398, "global_step": 245481, "epoch": 1461} {"train_loss": -12.08711051940918, "global_step": 245482, "epoch": 1461} {"train_loss": -11.067779541015625, "global_step": 245483, "epoch": 1461} {"train_loss": -11.648054122924805, "global_step": 245484, "epoch": 1461} {"train_loss": -11.568023681640625, "global_step": 245485, "epoch": 1461} {"train_loss": -11.598372459411621, "global_step": 245486, "epoch": 1461} {"train_loss": -10.976777076721191, "global_step": 245487, "epoch": 1461} {"train_loss": -11.738168716430664, "global_step": 245488, "epoch": 1461} {"train_loss": -11.246681213378906, "global_step": 245489, "epoch": 1461} {"train_loss": -11.449352264404297, "global_step": 245490, "epoch": 1461} {"train_loss": -11.337844848632812, "global_step": 245491, "epoch": 1461} {"train_loss": -11.168973922729492, "global_step": 245492, "epoch": 1461} {"train_loss": -10.9232177734375, "global_step": 245493, "epoch": 1461} {"train_loss": -11.476568222045898, "global_step": 245494, "epoch": 1461} {"train_loss": -11.43276596069336, "global_step": 245495, "epoch": 1461} {"train_loss": -10.839040756225586, "global_step": 245496, "epoch": 1461} {"train_loss": -11.69542121887207, "global_step": 245497, "epoch": 1461} {"train_loss": -11.561370849609375, "global_step": 245498, "epoch": 1461} {"train_loss": -11.889236450195312, "global_step": 245499, "epoch": 1461} {"train_loss": -12.045760154724121, "global_step": 245500, "epoch": 1461} {"train_loss": -11.697868347167969, "global_step": 245501, "epoch": 1461} {"train_loss": -11.664762496948242, "global_step": 245502, "epoch": 1461} {"train_loss": -11.774197578430176, "global_step": 245503, "epoch": 1461} {"train_loss": -11.973159790039062, "global_step": 245504, "epoch": 1461} {"train_loss": -11.145294189453125, "global_step": 245505, "epoch": 1461} {"train_loss": -11.82824420928955, "global_step": 245506, "epoch": 1461} {"train_loss": -11.833866119384766, "global_step": 245507, "epoch": 1461} {"train_loss": -11.635246276855469, "global_step": 245508, "epoch": 1461} {"train_loss": -11.831724166870117, "global_step": 245509, "epoch": 1461} {"train_loss": -11.811385154724121, "global_step": 245510, "epoch": 1461} {"train_loss": -11.786785125732422, "global_step": 245511, "epoch": 1461} {"train_loss": -12.036548614501953, "global_step": 245512, "epoch": 1461} {"train_loss": -12.050304412841797, "global_step": 245513, "epoch": 1461} {"train_loss": -11.931507110595703, "global_step": 245514, "epoch": 1461} {"train_loss": -11.620153427124023, "global_step": 245515, "epoch": 1461} {"train_loss": -11.732420921325684, "global_step": 245516, "epoch": 1461} {"train_loss": -11.960553169250488, "global_step": 245517, "epoch": 1461} {"train_loss": -11.74197769165039, "global_step": 245518, "epoch": 1461} {"train_loss": -11.993041038513184, "global_step": 245519, "epoch": 1461} {"train_loss": -12.119548797607422, "global_step": 245520, "epoch": 1461} {"train_loss": -11.857277870178223, "global_step": 245521, "epoch": 1461} {"train_loss": -11.971477508544922, "global_step": 245522, "epoch": 1461} {"train_loss": -12.180229187011719, "global_step": 245523, "epoch": 1461} {"train_loss": -11.888411521911621, "global_step": 245524, "epoch": 1461} {"train_loss": -12.165401458740234, "global_step": 245525, "epoch": 1461} {"train_loss": -11.922338485717773, "global_step": 245526, "epoch": 1461} {"train_loss": -11.850274085998535, "global_step": 245527, "epoch": 1461} {"train_loss": -11.96682357788086, "global_step": 245528, "epoch": 1461} {"train_loss": -12.194110870361328, "global_step": 245529, "epoch": 1461} {"train_loss": -11.977106094360352, "global_step": 245530, "epoch": 1461} {"train_loss": -11.952535629272461, "global_step": 245531, "epoch": 1461} {"train_loss": -11.923584938049316, "global_step": 245532, "epoch": 1461} {"train_loss": -11.98447322845459, "global_step": 245533, "epoch": 1461} {"train_loss": -11.605751991271973, "global_step": 245534, "epoch": 1461} {"train_loss": -11.692349433898926, "global_step": 245535, "epoch": 1461} {"train_loss": -11.829626083374023, "global_step": 245536, "epoch": 1461} {"train_loss": -11.422148704528809, "global_step": 245537, "epoch": 1461} {"train_loss": -11.599776268005371, "global_step": 245538, "epoch": 1461} {"train_loss": -11.19826889038086, "global_step": 245539, "epoch": 1461} {"train_loss": -11.980667114257812, "global_step": 245540, "epoch": 1461} {"train_loss": -11.678014755249023, "global_step": 245541, "epoch": 1461} {"train_loss": -11.650199890136719, "global_step": 245542, "epoch": 1461} {"train_loss": -11.500062942504883, "global_step": 245543, "epoch": 1461} {"train_loss": -11.866554260253906, "global_step": 245544, "epoch": 1461} {"train_loss": -11.190367698669434, "global_step": 245545, "epoch": 1461} {"train_loss": -11.023378372192383, "global_step": 245546, "epoch": 1461} {"train_loss": -11.588216781616211, "global_step": 245547, "epoch": 1461} {"train_loss": -10.839757919311523, "global_step": 245548, "epoch": 1461} {"train_loss": -11.004314422607422, "global_step": 245549, "epoch": 1461} {"train_loss": -11.267871856689453, "global_step": 245550, "epoch": 1461} {"train_loss": -10.905431747436523, "global_step": 245551, "epoch": 1461} {"train_loss": -11.487443923950195, "global_step": 245552, "epoch": 1461} {"train_loss": -11.336935043334961, "global_step": 245553, "epoch": 1461} {"train_loss": -10.673957824707031, "global_step": 245554, "epoch": 1461} {"train_loss": -11.273300170898438, "global_step": 245555, "epoch": 1461} {"train_loss": -11.275015830993652, "global_step": 245556, "epoch": 1461} {"train_loss": -11.360311508178711, "global_step": 245557, "epoch": 1461} {"train_loss": -11.442896842956543, "global_step": 245558, "epoch": 1461} {"train_loss": -11.625411987304688, "global_step": 245559, "epoch": 1461} {"train_loss": -11.45676326751709, "global_step": 245560, "epoch": 1461} {"train_loss": -11.339885711669922, "global_step": 245561, "epoch": 1461} {"train_loss": -11.706979751586914, "global_step": 245562, "epoch": 1461} {"train_loss": -11.512191772460938, "global_step": 245563, "epoch": 1461} {"train_loss": -10.76907730102539, "global_step": 245564, "epoch": 1461} {"train_loss": -11.171602249145508, "global_step": 245565, "epoch": 1461} {"train_loss": -10.971609115600586, "global_step": 245566, "epoch": 1461} {"train_loss": -11.207300186157227, "global_step": 245567, "epoch": 1461} {"train_loss": -10.650175094604492, "global_step": 245568, "epoch": 1461} {"train_loss": -11.260452270507812, "global_step": 245569, "epoch": 1461} {"train_loss": -10.67852783203125, "global_step": 245570, "epoch": 1461} {"train_loss": -10.623172760009766, "global_step": 245571, "epoch": 1461} {"train_loss": -11.515351295471191, "global_step": 245572, "epoch": 1461} {"train_loss": -10.40035629272461, "global_step": 245573, "epoch": 1461} {"train_loss": -10.849894523620605, "global_step": 245574, "epoch": 1461} {"train_loss": -10.319653511047363, "global_step": 245575, "epoch": 1461} {"train_loss": -10.95570182800293, "global_step": 245576, "epoch": 1461} {"train_loss": -10.960663795471191, "global_step": 245577, "epoch": 1461} {"train_loss": -10.370636940002441, "global_step": 245578, "epoch": 1461} {"train_loss": -11.058876991271973, "global_step": 245579, "epoch": 1461} {"train_loss": -11.306456565856934, "global_step": 245580, "epoch": 1461} {"train_loss": -10.751811981201172, "global_step": 245581, "epoch": 1461} {"train_loss": -11.715628623962402, "global_step": 245582, "epoch": 1461} {"train_loss": -10.527297019958496, "global_step": 245583, "epoch": 1461} {"train_loss": -11.73779582977295, "global_step": 245584, "epoch": 1461} {"train_loss": -11.353116035461426, "global_step": 245585, "epoch": 1461} {"train_loss": -11.11129379272461, "global_step": 245586, "epoch": 1461} {"train_loss": -11.20353889465332, "global_step": 245587, "epoch": 1461} {"train_loss": -11.33141803741455, "global_step": 245588, "epoch": 1461} {"train_loss": -11.696989059448242, "global_step": 245589, "epoch": 1461} {"train_loss": -11.045969009399414, "global_step": 245590, "epoch": 1461} {"train_loss": -11.80290412902832, "global_step": 245591, "epoch": 1461} {"train_loss": -11.482098579406738, "global_step": 245592, "epoch": 1461} {"train_loss": -11.387275695800781, "global_step": 245593, "epoch": 1461} {"train_loss": -11.599567413330078, "global_step": 245594, "epoch": 1461} {"train_loss": -11.387157440185547, "global_step": 245595, "epoch": 1461} {"train_loss": -11.750204086303711, "global_step": 245596, "epoch": 1461} {"train_loss": -11.534652709960938, "global_step": 245597, "epoch": 1461} {"train_loss": -11.778244972229004, "global_step": 245598, "epoch": 1461} {"train_loss": -11.715431213378906, "global_step": 245599, "epoch": 1461} {"train_loss": -11.761310577392578, "global_step": 245600, "epoch": 1461} {"train_loss": -11.791413307189941, "global_step": 245601, "epoch": 1461} {"train_loss": -11.865056991577148, "global_step": 245602, "epoch": 1461} {"train_loss": -12.079838752746582, "global_step": 245603, "epoch": 1461} {"train_loss": -11.75866985321045, "global_step": 245604, "epoch": 1461} {"train_loss": -11.813095092773438, "global_step": 245605, "epoch": 1461} {"train_loss": -11.957557678222656, "global_step": 245606, "epoch": 1461} {"train_loss": -11.83603286743164, "global_step": 245607, "epoch": 1461} {"train_loss": -11.88952350616455, "global_step": 245608, "epoch": 1461} {"train_loss": -11.903596878051758, "global_step": 245609, "epoch": 1461} {"train_loss": -11.893409729003906, "global_step": 245610, "epoch": 1461} {"train_loss": -12.029338836669922, "global_step": 245611, "epoch": 1461} {"train_loss": -11.881128311157227, "global_step": 245612, "epoch": 1461} {"train_loss": -12.077081680297852, "global_step": 245613, "epoch": 1461} {"train_loss": -12.081266403198242, "global_step": 245614, "epoch": 1461} {"train_loss": -11.567799193518502, "global_step": 245615, "epoch": 1461, "val_loss": 269772.25} {"train_loss": -11.735431671142578, "global_step": 245616, "epoch": 1462} {"train_loss": -11.910770416259766, "global_step": 245617, "epoch": 1462} {"train_loss": -11.628717422485352, "global_step": 245618, "epoch": 1462} {"train_loss": -11.866403579711914, "global_step": 245619, "epoch": 1462} {"train_loss": -11.615242004394531, "global_step": 245620, "epoch": 1462} {"train_loss": -11.85075569152832, "global_step": 245621, "epoch": 1462} {"train_loss": -11.397350311279297, "global_step": 245622, "epoch": 1462} {"train_loss": -11.985557556152344, "global_step": 245623, "epoch": 1462} {"train_loss": -11.667842864990234, "global_step": 245624, "epoch": 1462} {"train_loss": -11.745468139648438, "global_step": 245625, "epoch": 1462} {"train_loss": -11.9695463180542, "global_step": 245626, "epoch": 1462} {"train_loss": -10.790046691894531, "global_step": 245627, "epoch": 1462} {"train_loss": -11.578850746154785, "global_step": 245628, "epoch": 1462} {"train_loss": -11.531326293945312, "global_step": 245629, "epoch": 1462} {"train_loss": -12.159269332885742, "global_step": 245630, "epoch": 1462} {"train_loss": -11.526117324829102, "global_step": 245631, "epoch": 1462} {"train_loss": -11.960086822509766, "global_step": 245632, "epoch": 1462} {"train_loss": -11.411102294921875, "global_step": 245633, "epoch": 1462} {"train_loss": -11.523494720458984, "global_step": 245634, "epoch": 1462} {"train_loss": -11.601475715637207, "global_step": 245635, "epoch": 1462} {"train_loss": -11.619668006896973, "global_step": 245636, "epoch": 1462} {"train_loss": -12.019552230834961, "global_step": 245637, "epoch": 1462} {"train_loss": -11.367288589477539, "global_step": 245638, "epoch": 1462} {"train_loss": -11.54143238067627, "global_step": 245639, "epoch": 1462} {"train_loss": -11.471715927124023, "global_step": 245640, "epoch": 1462} {"train_loss": -11.201057434082031, "global_step": 245641, "epoch": 1462} {"train_loss": -10.915105819702148, "global_step": 245642, "epoch": 1462} {"train_loss": -11.266695022583008, "global_step": 245643, "epoch": 1462} {"train_loss": -11.32857894897461, "global_step": 245644, "epoch": 1462} {"train_loss": -11.461719512939453, "global_step": 245645, "epoch": 1462} {"train_loss": -11.501874923706055, "global_step": 245646, "epoch": 1462} {"train_loss": -10.751055717468262, "global_step": 245647, "epoch": 1462} {"train_loss": -11.020724296569824, "global_step": 245648, "epoch": 1462} {"train_loss": -11.241735458374023, "global_step": 245649, "epoch": 1462} {"train_loss": -9.815998077392578, "global_step": 245650, "epoch": 1462} {"train_loss": -10.844669342041016, "global_step": 245651, "epoch": 1462} {"train_loss": -9.376320838928223, "global_step": 245652, "epoch": 1462} {"train_loss": -10.47779655456543, "global_step": 245653, "epoch": 1462} {"train_loss": -9.037885665893555, "global_step": 245654, "epoch": 1462} {"train_loss": -9.788583755493164, "global_step": 245655, "epoch": 1462} {"train_loss": -10.242964744567871, "global_step": 245656, "epoch": 1462} {"train_loss": -10.68563175201416, "global_step": 245657, "epoch": 1462} {"train_loss": -9.770562171936035, "global_step": 245658, "epoch": 1462} {"train_loss": -10.177961349487305, "global_step": 245659, "epoch": 1462} {"train_loss": -11.134404182434082, "global_step": 245660, "epoch": 1462} {"train_loss": -9.82748031616211, "global_step": 245661, "epoch": 1462} {"train_loss": -10.524751663208008, "global_step": 245662, "epoch": 1462} {"train_loss": -11.137203216552734, "global_step": 245663, "epoch": 1462} {"train_loss": -10.252192497253418, "global_step": 245664, "epoch": 1462} {"train_loss": -9.403619766235352, "global_step": 245665, "epoch": 1462} {"train_loss": -11.508611679077148, "global_step": 245666, "epoch": 1462} {"train_loss": -10.338446617126465, "global_step": 245667, "epoch": 1462} {"train_loss": -10.809370994567871, "global_step": 245668, "epoch": 1462} {"train_loss": -10.862920761108398, "global_step": 245669, "epoch": 1462} {"train_loss": -10.964503288269043, "global_step": 245670, "epoch": 1462} {"train_loss": -11.021821975708008, "global_step": 245671, "epoch": 1462} {"train_loss": -11.297687530517578, "global_step": 245672, "epoch": 1462} {"train_loss": -11.428741455078125, "global_step": 245673, "epoch": 1462} {"train_loss": -11.01827621459961, "global_step": 245674, "epoch": 1462} {"train_loss": -11.656537055969238, "global_step": 245675, "epoch": 1462} {"train_loss": -11.471168518066406, "global_step": 245676, "epoch": 1462} {"train_loss": -11.391812324523926, "global_step": 245677, "epoch": 1462} {"train_loss": -11.359488487243652, "global_step": 245678, "epoch": 1462} {"train_loss": -11.526351928710938, "global_step": 245679, "epoch": 1462} {"train_loss": -11.500319480895996, "global_step": 245680, "epoch": 1462} {"train_loss": -11.687484741210938, "global_step": 245681, "epoch": 1462} {"train_loss": -11.502440452575684, "global_step": 245682, "epoch": 1462} {"train_loss": -11.685480117797852, "global_step": 245683, "epoch": 1462} {"train_loss": -11.617115020751953, "global_step": 245684, "epoch": 1462} {"train_loss": -11.498437881469727, "global_step": 245685, "epoch": 1462} {"train_loss": -11.608936309814453, "global_step": 245686, "epoch": 1462} {"train_loss": -11.595941543579102, "global_step": 245687, "epoch": 1462} {"train_loss": -11.774084091186523, "global_step": 245688, "epoch": 1462} {"train_loss": -11.853299140930176, "global_step": 245689, "epoch": 1462} {"train_loss": -11.90859603881836, "global_step": 245690, "epoch": 1462} {"train_loss": -11.653499603271484, "global_step": 245691, "epoch": 1462} {"train_loss": -11.639945030212402, "global_step": 245692, "epoch": 1462} {"train_loss": -11.741276741027832, "global_step": 245693, "epoch": 1462} {"train_loss": -11.820619583129883, "global_step": 245694, "epoch": 1462} {"train_loss": -12.009976387023926, "global_step": 245695, "epoch": 1462} {"train_loss": -11.794811248779297, "global_step": 245696, "epoch": 1462} {"train_loss": -11.812734603881836, "global_step": 245697, "epoch": 1462} {"train_loss": -11.968668937683105, "global_step": 245698, "epoch": 1462} {"train_loss": -12.19768238067627, "global_step": 245699, "epoch": 1462} {"train_loss": -11.944673538208008, "global_step": 245700, "epoch": 1462} {"train_loss": -11.906608581542969, "global_step": 245701, "epoch": 1462} {"train_loss": -11.996835708618164, "global_step": 245702, "epoch": 1462} {"train_loss": -11.997987747192383, "global_step": 245703, "epoch": 1462} {"train_loss": -11.899589538574219, "global_step": 245704, "epoch": 1462} {"train_loss": -11.828753471374512, "global_step": 245705, "epoch": 1462} {"train_loss": -12.052326202392578, "global_step": 245706, "epoch": 1462} {"train_loss": -11.68764877319336, "global_step": 245707, "epoch": 1462} {"train_loss": -11.990636825561523, "global_step": 245708, "epoch": 1462} {"train_loss": -11.959112167358398, "global_step": 245709, "epoch": 1462} {"train_loss": -11.7490873336792, "global_step": 245710, "epoch": 1462} {"train_loss": -12.024011611938477, "global_step": 245711, "epoch": 1462} {"train_loss": -11.602706909179688, "global_step": 245712, "epoch": 1462} {"train_loss": -12.015605926513672, "global_step": 245713, "epoch": 1462} {"train_loss": -11.992696762084961, "global_step": 245714, "epoch": 1462} {"train_loss": -12.024238586425781, "global_step": 245715, "epoch": 1462} {"train_loss": -11.899232864379883, "global_step": 245716, "epoch": 1462} {"train_loss": -11.846977233886719, "global_step": 245717, "epoch": 1462} {"train_loss": -11.849418640136719, "global_step": 245718, "epoch": 1462} {"train_loss": -12.084878921508789, "global_step": 245719, "epoch": 1462} {"train_loss": -12.082621574401855, "global_step": 245720, "epoch": 1462} {"train_loss": -11.75771427154541, "global_step": 245721, "epoch": 1462} {"train_loss": -11.363554954528809, "global_step": 245722, "epoch": 1462} {"train_loss": -11.891317367553711, "global_step": 245723, "epoch": 1462} {"train_loss": -11.786718368530273, "global_step": 245724, "epoch": 1462} {"train_loss": -11.53209400177002, "global_step": 245725, "epoch": 1462} {"train_loss": -11.489202499389648, "global_step": 245726, "epoch": 1462} {"train_loss": -11.517243385314941, "global_step": 245727, "epoch": 1462} {"train_loss": -11.939253807067871, "global_step": 245728, "epoch": 1462} {"train_loss": -11.157142639160156, "global_step": 245729, "epoch": 1462} {"train_loss": -11.748083114624023, "global_step": 245730, "epoch": 1462} {"train_loss": -11.499728202819824, "global_step": 245731, "epoch": 1462} {"train_loss": -11.039778709411621, "global_step": 245732, "epoch": 1462} {"train_loss": -10.815756797790527, "global_step": 245733, "epoch": 1462} {"train_loss": -11.686079025268555, "global_step": 245734, "epoch": 1462} {"train_loss": -10.186444282531738, "global_step": 245735, "epoch": 1462} {"train_loss": -10.704364776611328, "global_step": 245736, "epoch": 1462} {"train_loss": -10.785991668701172, "global_step": 245737, "epoch": 1462} {"train_loss": -8.8999662399292, "global_step": 245738, "epoch": 1462} {"train_loss": -9.65194320678711, "global_step": 245739, "epoch": 1462} {"train_loss": -10.364784240722656, "global_step": 245740, "epoch": 1462} {"train_loss": -8.497779846191406, "global_step": 245741, "epoch": 1462} {"train_loss": -9.861330032348633, "global_step": 245742, "epoch": 1462} {"train_loss": -7.9928693771362305, "global_step": 245743, "epoch": 1462} {"train_loss": -10.531065940856934, "global_step": 245744, "epoch": 1462} {"train_loss": -7.999394416809082, "global_step": 245745, "epoch": 1462} {"train_loss": -7.8751726150512695, "global_step": 245746, "epoch": 1462} {"train_loss": -9.026867866516113, "global_step": 245747, "epoch": 1462} {"train_loss": -9.235118865966797, "global_step": 245748, "epoch": 1462} {"train_loss": -10.395508766174316, "global_step": 245749, "epoch": 1462} {"train_loss": -9.298023223876953, "global_step": 245750, "epoch": 1462} {"train_loss": -10.647441864013672, "global_step": 245751, "epoch": 1462} {"train_loss": -9.185673713684082, "global_step": 245752, "epoch": 1462} {"train_loss": -10.915374755859375, "global_step": 245753, "epoch": 1462} {"train_loss": -10.255953788757324, "global_step": 245754, "epoch": 1462} {"train_loss": -10.43083667755127, "global_step": 245755, "epoch": 1462} {"train_loss": -10.409051895141602, "global_step": 245756, "epoch": 1462} {"train_loss": -9.208545684814453, "global_step": 245757, "epoch": 1462} {"train_loss": -10.725689888000488, "global_step": 245758, "epoch": 1462} {"train_loss": -10.52542495727539, "global_step": 245759, "epoch": 1462} {"train_loss": -10.848148345947266, "global_step": 245760, "epoch": 1462} {"train_loss": -9.908674240112305, "global_step": 245761, "epoch": 1462} {"train_loss": -10.482540130615234, "global_step": 245762, "epoch": 1462} {"train_loss": -10.427704811096191, "global_step": 245763, "epoch": 1462} {"train_loss": -10.244136810302734, "global_step": 245764, "epoch": 1462} {"train_loss": -10.951715469360352, "global_step": 245765, "epoch": 1462} {"train_loss": -10.500450134277344, "global_step": 245766, "epoch": 1462} {"train_loss": -10.988277435302734, "global_step": 245767, "epoch": 1462} {"train_loss": -10.673550605773926, "global_step": 245768, "epoch": 1462} {"train_loss": -10.907686233520508, "global_step": 245769, "epoch": 1462} {"train_loss": -11.38476848602295, "global_step": 245770, "epoch": 1462} {"train_loss": -10.765981674194336, "global_step": 245771, "epoch": 1462} {"train_loss": -11.387362480163574, "global_step": 245772, "epoch": 1462} {"train_loss": -11.348855018615723, "global_step": 245773, "epoch": 1462} {"train_loss": -11.180623054504395, "global_step": 245774, "epoch": 1462} {"train_loss": -11.395502090454102, "global_step": 245775, "epoch": 1462} {"train_loss": -11.303903579711914, "global_step": 245776, "epoch": 1462} {"train_loss": -11.258031845092773, "global_step": 245777, "epoch": 1462} {"train_loss": -11.448358535766602, "global_step": 245778, "epoch": 1462} {"train_loss": -11.150025367736816, "global_step": 245779, "epoch": 1462} {"train_loss": -11.234349250793457, "global_step": 245780, "epoch": 1462} {"train_loss": -11.580775260925293, "global_step": 245781, "epoch": 1462} {"train_loss": -11.344513893127441, "global_step": 245782, "epoch": 1462} {"train_loss": -11.103871572585334, "global_step": 245783, "epoch": 1462, "val_loss": 253879.578125} {"train_loss": -11.424066543579102, "global_step": 245784, "epoch": 1463} {"train_loss": -11.364870071411133, "global_step": 245785, "epoch": 1463} {"train_loss": -11.348040580749512, "global_step": 245786, "epoch": 1463} {"train_loss": -11.322954177856445, "global_step": 245787, "epoch": 1463} {"train_loss": -11.380047798156738, "global_step": 245788, "epoch": 1463} {"train_loss": -11.60961627960205, "global_step": 245789, "epoch": 1463} {"train_loss": -11.202451705932617, "global_step": 245790, "epoch": 1463} {"train_loss": -11.768608093261719, "global_step": 245791, "epoch": 1463} {"train_loss": -11.50804328918457, "global_step": 245792, "epoch": 1463} {"train_loss": -11.281993865966797, "global_step": 245793, "epoch": 1463} {"train_loss": -11.663470268249512, "global_step": 245794, "epoch": 1463} {"train_loss": -11.20865249633789, "global_step": 245795, "epoch": 1463} {"train_loss": -11.335203170776367, "global_step": 245796, "epoch": 1463} {"train_loss": -11.51603889465332, "global_step": 245797, "epoch": 1463} {"train_loss": -11.414466857910156, "global_step": 245798, "epoch": 1463} {"train_loss": -11.587661743164062, "global_step": 245799, "epoch": 1463} {"train_loss": -11.627107620239258, "global_step": 245800, "epoch": 1463} {"train_loss": -11.592885971069336, "global_step": 245801, "epoch": 1463} {"train_loss": -11.717348098754883, "global_step": 245802, "epoch": 1463} {"train_loss": -11.54957389831543, "global_step": 245803, "epoch": 1463} {"train_loss": -11.605173110961914, "global_step": 245804, "epoch": 1463} {"train_loss": -11.541376113891602, "global_step": 245805, "epoch": 1463} {"train_loss": -11.716114044189453, "global_step": 245806, "epoch": 1463} {"train_loss": -11.596626281738281, "global_step": 245807, "epoch": 1463} {"train_loss": -11.819306373596191, "global_step": 245808, "epoch": 1463} {"train_loss": -11.866411209106445, "global_step": 245809, "epoch": 1463} {"train_loss": -11.717166900634766, "global_step": 245810, "epoch": 1463} {"train_loss": -11.572744369506836, "global_step": 245811, "epoch": 1463} {"train_loss": -11.847890853881836, "global_step": 245812, "epoch": 1463} {"train_loss": -11.852601051330566, "global_step": 245813, "epoch": 1463} {"train_loss": -11.796642303466797, "global_step": 245814, "epoch": 1463} {"train_loss": -11.755356788635254, "global_step": 245815, "epoch": 1463} {"train_loss": -11.82979965209961, "global_step": 245816, "epoch": 1463} {"train_loss": -11.83060073852539, "global_step": 245817, "epoch": 1463} {"train_loss": -11.549480438232422, "global_step": 245818, "epoch": 1463} {"train_loss": -11.970165252685547, "global_step": 245819, "epoch": 1463} {"train_loss": -11.509683609008789, "global_step": 245820, "epoch": 1463} {"train_loss": -12.05792236328125, "global_step": 245821, "epoch": 1463} {"train_loss": -11.637611389160156, "global_step": 245822, "epoch": 1463} {"train_loss": -11.737133026123047, "global_step": 245823, "epoch": 1463} {"train_loss": -11.744120597839355, "global_step": 245824, "epoch": 1463} {"train_loss": -11.807281494140625, "global_step": 245825, "epoch": 1463} {"train_loss": -11.90841293334961, "global_step": 245826, "epoch": 1463} {"train_loss": -11.51401138305664, "global_step": 245827, "epoch": 1463} {"train_loss": -11.964014053344727, "global_step": 245828, "epoch": 1463} {"train_loss": -11.638052940368652, "global_step": 245829, "epoch": 1463} {"train_loss": -12.0037260055542, "global_step": 245830, "epoch": 1463} {"train_loss": -11.840514183044434, "global_step": 245831, "epoch": 1463} {"train_loss": -12.106943130493164, "global_step": 245832, "epoch": 1463} {"train_loss": -12.034843444824219, "global_step": 245833, "epoch": 1463} {"train_loss": -11.81702995300293, "global_step": 245834, "epoch": 1463} {"train_loss": -12.16581916809082, "global_step": 245835, "epoch": 1463} {"train_loss": -11.553701400756836, "global_step": 245836, "epoch": 1463} {"train_loss": -11.671865463256836, "global_step": 245837, "epoch": 1463} {"train_loss": -12.061351776123047, "global_step": 245838, "epoch": 1463} {"train_loss": -11.99747085571289, "global_step": 245839, "epoch": 1463} {"train_loss": -11.901519775390625, "global_step": 245840, "epoch": 1463} {"train_loss": -11.878215789794922, "global_step": 245841, "epoch": 1463} {"train_loss": -12.070497512817383, "global_step": 245842, "epoch": 1463} {"train_loss": -11.774805068969727, "global_step": 245843, "epoch": 1463} {"train_loss": -12.010913848876953, "global_step": 245844, "epoch": 1463} {"train_loss": -12.004682540893555, "global_step": 245845, "epoch": 1463} {"train_loss": -11.764176368713379, "global_step": 245846, "epoch": 1463} {"train_loss": -11.877995491027832, "global_step": 245847, "epoch": 1463} {"train_loss": -12.258682250976562, "global_step": 245848, "epoch": 1463} {"train_loss": -11.928579330444336, "global_step": 245849, "epoch": 1463} {"train_loss": -11.808292388916016, "global_step": 245850, "epoch": 1463} {"train_loss": -12.063132286071777, "global_step": 245851, "epoch": 1463} {"train_loss": -11.84908676147461, "global_step": 245852, "epoch": 1463} {"train_loss": -12.144571304321289, "global_step": 245853, "epoch": 1463} {"train_loss": -12.252182006835938, "global_step": 245854, "epoch": 1463} {"train_loss": -12.116601943969727, "global_step": 245855, "epoch": 1463} {"train_loss": -12.009328842163086, "global_step": 245856, "epoch": 1463} {"train_loss": -12.240911483764648, "global_step": 245857, "epoch": 1463} {"train_loss": -12.102226257324219, "global_step": 245858, "epoch": 1463} {"train_loss": -12.06229019165039, "global_step": 245859, "epoch": 1463} {"train_loss": -11.997184753417969, "global_step": 245860, "epoch": 1463} {"train_loss": -11.860111236572266, "global_step": 245861, "epoch": 1463} {"train_loss": -11.697097778320312, "global_step": 245862, "epoch": 1463} {"train_loss": -11.657901763916016, "global_step": 245863, "epoch": 1463} {"train_loss": -11.925811767578125, "global_step": 245864, "epoch": 1463} {"train_loss": -11.04191780090332, "global_step": 245865, "epoch": 1463} {"train_loss": -11.977678298950195, "global_step": 245866, "epoch": 1463} {"train_loss": -11.898749351501465, "global_step": 245867, "epoch": 1463} {"train_loss": -11.300031661987305, "global_step": 245868, "epoch": 1463} {"train_loss": -9.98412036895752, "global_step": 245869, "epoch": 1463} {"train_loss": -10.896207809448242, "global_step": 245870, "epoch": 1463} {"train_loss": -11.467625617980957, "global_step": 245871, "epoch": 1463} {"train_loss": -10.53754997253418, "global_step": 245872, "epoch": 1463} {"train_loss": -9.202067375183105, "global_step": 245873, "epoch": 1463} {"train_loss": -10.776123046875, "global_step": 245874, "epoch": 1463} {"train_loss": -7.222259998321533, "global_step": 245875, "epoch": 1463} {"train_loss": -7.946392059326172, "global_step": 245876, "epoch": 1463} {"train_loss": -8.036521911621094, "global_step": 245877, "epoch": 1463} {"train_loss": -10.834659576416016, "global_step": 245878, "epoch": 1463} {"train_loss": -8.421186447143555, "global_step": 245879, "epoch": 1463} {"train_loss": -9.055209159851074, "global_step": 245880, "epoch": 1463} {"train_loss": -10.74515151977539, "global_step": 245881, "epoch": 1463} {"train_loss": -8.129375457763672, "global_step": 245882, "epoch": 1463} {"train_loss": -10.266485214233398, "global_step": 245883, "epoch": 1463} {"train_loss": -10.266946792602539, "global_step": 245884, "epoch": 1463} {"train_loss": -9.140995025634766, "global_step": 245885, "epoch": 1463} {"train_loss": -11.237709045410156, "global_step": 245886, "epoch": 1463} {"train_loss": -9.852230072021484, "global_step": 245887, "epoch": 1463} {"train_loss": -9.73867416381836, "global_step": 245888, "epoch": 1463} {"train_loss": -11.149627685546875, "global_step": 245889, "epoch": 1463} {"train_loss": -10.298495292663574, "global_step": 245890, "epoch": 1463} {"train_loss": -10.509690284729004, "global_step": 245891, "epoch": 1463} {"train_loss": -10.605354309082031, "global_step": 245892, "epoch": 1463} {"train_loss": -10.584300994873047, "global_step": 245893, "epoch": 1463} {"train_loss": -10.37437629699707, "global_step": 245894, "epoch": 1463} {"train_loss": -11.1482515335083, "global_step": 245895, "epoch": 1463} {"train_loss": -10.88771915435791, "global_step": 245896, "epoch": 1463} {"train_loss": -10.888238906860352, "global_step": 245897, "epoch": 1463} {"train_loss": -11.18223762512207, "global_step": 245898, "epoch": 1463} {"train_loss": -11.05307674407959, "global_step": 245899, "epoch": 1463} {"train_loss": -10.286344528198242, "global_step": 245900, "epoch": 1463} {"train_loss": -11.29566478729248, "global_step": 245901, "epoch": 1463} {"train_loss": -11.230219841003418, "global_step": 245902, "epoch": 1463} {"train_loss": -10.96429443359375, "global_step": 245903, "epoch": 1463} {"train_loss": -11.053994178771973, "global_step": 245904, "epoch": 1463} {"train_loss": -11.363615989685059, "global_step": 245905, "epoch": 1463} {"train_loss": -11.118817329406738, "global_step": 245906, "epoch": 1463} {"train_loss": -11.096771240234375, "global_step": 245907, "epoch": 1463} {"train_loss": -11.36549186706543, "global_step": 245908, "epoch": 1463} {"train_loss": -11.354974746704102, "global_step": 245909, "epoch": 1463} {"train_loss": -11.093233108520508, "global_step": 245910, "epoch": 1463} {"train_loss": -11.643937110900879, "global_step": 245911, "epoch": 1463} {"train_loss": -11.573640823364258, "global_step": 245912, "epoch": 1463} {"train_loss": -11.472070693969727, "global_step": 245913, "epoch": 1463} {"train_loss": -11.29403018951416, "global_step": 245914, "epoch": 1463} {"train_loss": -11.676055908203125, "global_step": 245915, "epoch": 1463} {"train_loss": -11.20712661743164, "global_step": 245916, "epoch": 1463} {"train_loss": -11.613144874572754, "global_step": 245917, "epoch": 1463} {"train_loss": -11.530277252197266, "global_step": 245918, "epoch": 1463} {"train_loss": -11.515585899353027, "global_step": 245919, "epoch": 1463} {"train_loss": -11.26724624633789, "global_step": 245920, "epoch": 1463} {"train_loss": -11.611957550048828, "global_step": 245921, "epoch": 1463} {"train_loss": -11.53422737121582, "global_step": 245922, "epoch": 1463} {"train_loss": -11.361711502075195, "global_step": 245923, "epoch": 1463} {"train_loss": -11.619705200195312, "global_step": 245924, "epoch": 1463} {"train_loss": -11.370575904846191, "global_step": 245925, "epoch": 1463} {"train_loss": -11.2122802734375, "global_step": 245926, "epoch": 1463} {"train_loss": -11.488937377929688, "global_step": 245927, "epoch": 1463} {"train_loss": -11.593002319335938, "global_step": 245928, "epoch": 1463} {"train_loss": -11.541160583496094, "global_step": 245929, "epoch": 1463} {"train_loss": -11.046897888183594, "global_step": 245930, "epoch": 1463} {"train_loss": -11.736130714416504, "global_step": 245931, "epoch": 1463} {"train_loss": -11.44937515258789, "global_step": 245932, "epoch": 1463} {"train_loss": -11.52007007598877, "global_step": 245933, "epoch": 1463} {"train_loss": -11.563508987426758, "global_step": 245934, "epoch": 1463} {"train_loss": -11.723627090454102, "global_step": 245935, "epoch": 1463} {"train_loss": -11.640726089477539, "global_step": 245936, "epoch": 1463} {"train_loss": -11.29796028137207, "global_step": 245937, "epoch": 1463} {"train_loss": -11.972126007080078, "global_step": 245938, "epoch": 1463} {"train_loss": -11.7291259765625, "global_step": 245939, "epoch": 1463} {"train_loss": -11.886563301086426, "global_step": 245940, "epoch": 1463} {"train_loss": -11.751344680786133, "global_step": 245941, "epoch": 1463} {"train_loss": -11.699808120727539, "global_step": 245942, "epoch": 1463} {"train_loss": -11.891878128051758, "global_step": 245943, "epoch": 1463} {"train_loss": -11.918006896972656, "global_step": 245944, "epoch": 1463} {"train_loss": -11.579618453979492, "global_step": 245945, "epoch": 1463} {"train_loss": -11.814090728759766, "global_step": 245946, "epoch": 1463} {"train_loss": -11.815120697021484, "global_step": 245947, "epoch": 1463} {"train_loss": -11.604618072509766, "global_step": 245948, "epoch": 1463} {"train_loss": -11.728965759277344, "global_step": 245949, "epoch": 1463} {"train_loss": -11.663934707641602, "global_step": 245950, "epoch": 1463} {"train_loss": -11.362021551245736, "global_step": 245951, "epoch": 1463, "val_loss": 259343.546875} {"train_loss": -12.01092529296875, "global_step": 245952, "epoch": 1464} {"train_loss": -11.891104698181152, "global_step": 245953, "epoch": 1464} {"train_loss": -11.892936706542969, "global_step": 245954, "epoch": 1464} {"train_loss": -12.002582550048828, "global_step": 245955, "epoch": 1464} {"train_loss": -11.808795928955078, "global_step": 245956, "epoch": 1464} {"train_loss": -11.64792537689209, "global_step": 245957, "epoch": 1464} {"train_loss": -11.950557708740234, "global_step": 245958, "epoch": 1464} {"train_loss": -11.91053581237793, "global_step": 245959, "epoch": 1464} {"train_loss": -12.079235076904297, "global_step": 245960, "epoch": 1464} {"train_loss": -11.949790954589844, "global_step": 245961, "epoch": 1464} {"train_loss": -12.057680130004883, "global_step": 245962, "epoch": 1464} {"train_loss": -12.137319564819336, "global_step": 245963, "epoch": 1464} {"train_loss": -12.09644889831543, "global_step": 245964, "epoch": 1464} {"train_loss": -11.858190536499023, "global_step": 245965, "epoch": 1464} {"train_loss": -11.871955871582031, "global_step": 245966, "epoch": 1464} {"train_loss": -12.219717979431152, "global_step": 245967, "epoch": 1464} {"train_loss": -11.874080657958984, "global_step": 245968, "epoch": 1464} {"train_loss": -11.713098526000977, "global_step": 245969, "epoch": 1464} {"train_loss": -11.836662292480469, "global_step": 245970, "epoch": 1464} {"train_loss": -12.151365280151367, "global_step": 245971, "epoch": 1464} {"train_loss": -11.988088607788086, "global_step": 245972, "epoch": 1464} {"train_loss": -12.089761734008789, "global_step": 245973, "epoch": 1464} {"train_loss": -12.092607498168945, "global_step": 245974, "epoch": 1464} {"train_loss": -12.072107315063477, "global_step": 245975, "epoch": 1464} {"train_loss": -11.835020065307617, "global_step": 245976, "epoch": 1464} {"train_loss": -11.998824119567871, "global_step": 245977, "epoch": 1464} {"train_loss": -12.143930435180664, "global_step": 245978, "epoch": 1464} {"train_loss": -12.032608032226562, "global_step": 245979, "epoch": 1464} {"train_loss": -11.727397918701172, "global_step": 245980, "epoch": 1464} {"train_loss": -12.213788986206055, "global_step": 245981, "epoch": 1464} {"train_loss": -12.025840759277344, "global_step": 245982, "epoch": 1464} {"train_loss": -11.163660049438477, "global_step": 245983, "epoch": 1464} {"train_loss": -11.059514999389648, "global_step": 245984, "epoch": 1464} {"train_loss": -12.041755676269531, "global_step": 245985, "epoch": 1464} {"train_loss": -11.423806190490723, "global_step": 245986, "epoch": 1464} {"train_loss": -9.033211708068848, "global_step": 245987, "epoch": 1464} {"train_loss": -9.318262100219727, "global_step": 245988, "epoch": 1464} {"train_loss": -11.51774787902832, "global_step": 245989, "epoch": 1464} {"train_loss": -8.784212112426758, "global_step": 245990, "epoch": 1464} {"train_loss": -10.12643051147461, "global_step": 245991, "epoch": 1464} {"train_loss": -10.896241188049316, "global_step": 245992, "epoch": 1464} {"train_loss": -9.98469352722168, "global_step": 245993, "epoch": 1464} {"train_loss": -11.802509307861328, "global_step": 245994, "epoch": 1464} {"train_loss": -10.621179580688477, "global_step": 245995, "epoch": 1464} {"train_loss": -11.4800443649292, "global_step": 245996, "epoch": 1464} {"train_loss": -11.441228866577148, "global_step": 245997, "epoch": 1464} {"train_loss": -11.493818283081055, "global_step": 245998, "epoch": 1464} {"train_loss": -11.843765258789062, "global_step": 245999, "epoch": 1464} {"train_loss": -11.374991416931152, "global_step": 246000, "epoch": 1464} {"train_loss": -11.47856330871582, "global_step": 246001, "epoch": 1464} {"train_loss": -11.878335952758789, "global_step": 246002, "epoch": 1464} {"train_loss": -10.925765991210938, "global_step": 246003, "epoch": 1464} {"train_loss": -11.709235191345215, "global_step": 246004, "epoch": 1464} {"train_loss": -10.85965347290039, "global_step": 246005, "epoch": 1464} {"train_loss": -10.769537925720215, "global_step": 246006, "epoch": 1464} {"train_loss": -11.631309509277344, "global_step": 246007, "epoch": 1464} {"train_loss": -10.97474479675293, "global_step": 246008, "epoch": 1464} {"train_loss": -11.404277801513672, "global_step": 246009, "epoch": 1464} {"train_loss": -11.249191284179688, "global_step": 246010, "epoch": 1464} {"train_loss": -10.348424911499023, "global_step": 246011, "epoch": 1464} {"train_loss": -11.484729766845703, "global_step": 246012, "epoch": 1464} {"train_loss": -10.963281631469727, "global_step": 246013, "epoch": 1464} {"train_loss": -11.541215896606445, "global_step": 246014, "epoch": 1464} {"train_loss": -11.091580390930176, "global_step": 246015, "epoch": 1464} {"train_loss": -11.272459030151367, "global_step": 246016, "epoch": 1464} {"train_loss": -11.229509353637695, "global_step": 246017, "epoch": 1464} {"train_loss": -11.63163948059082, "global_step": 246018, "epoch": 1464} {"train_loss": -11.688650131225586, "global_step": 246019, "epoch": 1464} {"train_loss": -11.413692474365234, "global_step": 246020, "epoch": 1464} {"train_loss": -11.275501251220703, "global_step": 246021, "epoch": 1464} {"train_loss": -11.556844711303711, "global_step": 246022, "epoch": 1464} {"train_loss": -11.20962142944336, "global_step": 246023, "epoch": 1464} {"train_loss": -11.443546295166016, "global_step": 246024, "epoch": 1464} {"train_loss": -11.515642166137695, "global_step": 246025, "epoch": 1464} {"train_loss": -11.588991165161133, "global_step": 246026, "epoch": 1464} {"train_loss": -11.638650894165039, "global_step": 246027, "epoch": 1464} {"train_loss": -11.699450492858887, "global_step": 246028, "epoch": 1464} {"train_loss": -11.384452819824219, "global_step": 246029, "epoch": 1464} {"train_loss": -11.536367416381836, "global_step": 246030, "epoch": 1464} {"train_loss": -11.628203392028809, "global_step": 246031, "epoch": 1464} {"train_loss": -11.955641746520996, "global_step": 246032, "epoch": 1464} {"train_loss": -11.442863464355469, "global_step": 246033, "epoch": 1464} {"train_loss": -11.863481521606445, "global_step": 246034, "epoch": 1464} {"train_loss": -11.584012031555176, "global_step": 246035, "epoch": 1464} {"train_loss": -11.807060241699219, "global_step": 246036, "epoch": 1464} {"train_loss": -11.81788444519043, "global_step": 246037, "epoch": 1464} {"train_loss": -11.735116004943848, "global_step": 246038, "epoch": 1464} {"train_loss": -11.800369262695312, "global_step": 246039, "epoch": 1464} {"train_loss": -11.86048698425293, "global_step": 246040, "epoch": 1464} {"train_loss": -11.533004760742188, "global_step": 246041, "epoch": 1464} {"train_loss": -11.616340637207031, "global_step": 246042, "epoch": 1464} {"train_loss": -11.834061622619629, "global_step": 246043, "epoch": 1464} {"train_loss": -11.820024490356445, "global_step": 246044, "epoch": 1464} {"train_loss": -11.497150421142578, "global_step": 246045, "epoch": 1464} {"train_loss": -11.667745590209961, "global_step": 246046, "epoch": 1464} {"train_loss": -11.44972038269043, "global_step": 246047, "epoch": 1464} {"train_loss": -11.833016395568848, "global_step": 246048, "epoch": 1464} {"train_loss": -11.511415481567383, "global_step": 246049, "epoch": 1464} {"train_loss": -11.801210403442383, "global_step": 246050, "epoch": 1464} {"train_loss": -11.829463958740234, "global_step": 246051, "epoch": 1464} {"train_loss": -11.696836471557617, "global_step": 246052, "epoch": 1464} {"train_loss": -11.887001037597656, "global_step": 246053, "epoch": 1464} {"train_loss": -11.530255317687988, "global_step": 246054, "epoch": 1464} {"train_loss": -11.988561630249023, "global_step": 246055, "epoch": 1464} {"train_loss": -11.008874893188477, "global_step": 246056, "epoch": 1464} {"train_loss": -11.640993118286133, "global_step": 246057, "epoch": 1464} {"train_loss": -11.67203140258789, "global_step": 246058, "epoch": 1464} {"train_loss": -11.45626163482666, "global_step": 246059, "epoch": 1464} {"train_loss": -11.883950233459473, "global_step": 246060, "epoch": 1464} {"train_loss": -11.372579574584961, "global_step": 246061, "epoch": 1464} {"train_loss": -12.046319961547852, "global_step": 246062, "epoch": 1464} {"train_loss": -11.539289474487305, "global_step": 246063, "epoch": 1464} {"train_loss": -11.621526718139648, "global_step": 246064, "epoch": 1464} {"train_loss": -11.806716918945312, "global_step": 246065, "epoch": 1464} {"train_loss": -11.402469635009766, "global_step": 246066, "epoch": 1464} {"train_loss": -11.92572021484375, "global_step": 246067, "epoch": 1464} {"train_loss": -11.592355728149414, "global_step": 246068, "epoch": 1464} {"train_loss": -12.027690887451172, "global_step": 246069, "epoch": 1464} {"train_loss": -11.848527908325195, "global_step": 246070, "epoch": 1464} {"train_loss": -11.952144622802734, "global_step": 246071, "epoch": 1464} {"train_loss": -12.164379119873047, "global_step": 246072, "epoch": 1464} {"train_loss": -12.170072555541992, "global_step": 246073, "epoch": 1464} {"train_loss": -12.256847381591797, "global_step": 246074, "epoch": 1464} {"train_loss": -12.107769966125488, "global_step": 246075, "epoch": 1464} {"train_loss": -12.073187828063965, "global_step": 246076, "epoch": 1464} {"train_loss": -12.151042938232422, "global_step": 246077, "epoch": 1464} {"train_loss": -12.073013305664062, "global_step": 246078, "epoch": 1464} {"train_loss": -12.052471160888672, "global_step": 246079, "epoch": 1464} {"train_loss": -11.955238342285156, "global_step": 246080, "epoch": 1464} {"train_loss": -12.03337287902832, "global_step": 246081, "epoch": 1464} {"train_loss": -12.201433181762695, "global_step": 246082, "epoch": 1464} {"train_loss": -12.01494026184082, "global_step": 246083, "epoch": 1464} {"train_loss": -12.192651748657227, "global_step": 246084, "epoch": 1464} {"train_loss": -11.729869842529297, "global_step": 246085, "epoch": 1464} {"train_loss": -12.18691635131836, "global_step": 246086, "epoch": 1464} {"train_loss": -11.918853759765625, "global_step": 246087, "epoch": 1464} {"train_loss": -12.224306106567383, "global_step": 246088, "epoch": 1464} {"train_loss": -11.853304862976074, "global_step": 246089, "epoch": 1464} {"train_loss": -12.048919677734375, "global_step": 246090, "epoch": 1464} {"train_loss": -11.976452827453613, "global_step": 246091, "epoch": 1464} {"train_loss": -12.039605140686035, "global_step": 246092, "epoch": 1464} {"train_loss": -12.012662887573242, "global_step": 246093, "epoch": 1464} {"train_loss": -12.115489959716797, "global_step": 246094, "epoch": 1464} {"train_loss": -11.995513916015625, "global_step": 246095, "epoch": 1464} {"train_loss": -11.94651985168457, "global_step": 246096, "epoch": 1464} {"train_loss": -12.1314058303833, "global_step": 246097, "epoch": 1464} {"train_loss": -12.032001495361328, "global_step": 246098, "epoch": 1464} {"train_loss": -12.030532836914062, "global_step": 246099, "epoch": 1464} {"train_loss": -12.175575256347656, "global_step": 246100, "epoch": 1464} {"train_loss": -11.808218002319336, "global_step": 246101, "epoch": 1464} {"train_loss": -12.20954418182373, "global_step": 246102, "epoch": 1464} {"train_loss": -11.811389923095703, "global_step": 246103, "epoch": 1464} {"train_loss": -11.680085182189941, "global_step": 246104, "epoch": 1464} {"train_loss": -11.256998062133789, "global_step": 246105, "epoch": 1464} {"train_loss": -11.883156776428223, "global_step": 246106, "epoch": 1464} {"train_loss": -11.869261741638184, "global_step": 246107, "epoch": 1464} {"train_loss": -12.09843635559082, "global_step": 246108, "epoch": 1464} {"train_loss": -10.11996841430664, "global_step": 246109, "epoch": 1464} {"train_loss": -11.001836776733398, "global_step": 246110, "epoch": 1464} {"train_loss": -11.178447723388672, "global_step": 246111, "epoch": 1464} {"train_loss": -11.600069046020508, "global_step": 246112, "epoch": 1464} {"train_loss": -10.94017219543457, "global_step": 246113, "epoch": 1464} {"train_loss": -11.442838668823242, "global_step": 246114, "epoch": 1464} {"train_loss": -11.022192001342773, "global_step": 246115, "epoch": 1464} {"train_loss": -11.938579559326172, "global_step": 246116, "epoch": 1464} {"train_loss": -11.193201065063477, "global_step": 246117, "epoch": 1464} {"train_loss": -11.851638793945312, "global_step": 246118, "epoch": 1464} {"train_loss": -11.635400806154523, "global_step": 246119, "epoch": 1464, "val_loss": 260136.078125} {"train_loss": -11.365007400512695, "global_step": 246120, "epoch": 1465} {"train_loss": -11.7706937789917, "global_step": 246121, "epoch": 1465} {"train_loss": -11.209135055541992, "global_step": 246122, "epoch": 1465} {"train_loss": -11.061433792114258, "global_step": 246123, "epoch": 1465} {"train_loss": -11.344550132751465, "global_step": 246124, "epoch": 1465} {"train_loss": -11.72024917602539, "global_step": 246125, "epoch": 1465} {"train_loss": -10.803533554077148, "global_step": 246126, "epoch": 1465} {"train_loss": -10.436037063598633, "global_step": 246127, "epoch": 1465} {"train_loss": -10.941703796386719, "global_step": 246128, "epoch": 1465} {"train_loss": -10.752679824829102, "global_step": 246129, "epoch": 1465} {"train_loss": -11.322065353393555, "global_step": 246130, "epoch": 1465} {"train_loss": -10.195977210998535, "global_step": 246131, "epoch": 1465} {"train_loss": -11.440303802490234, "global_step": 246132, "epoch": 1465} {"train_loss": -10.359639167785645, "global_step": 246133, "epoch": 1465} {"train_loss": -11.287612915039062, "global_step": 246134, "epoch": 1465} {"train_loss": -11.486581802368164, "global_step": 246135, "epoch": 1465} {"train_loss": -11.280414581298828, "global_step": 246136, "epoch": 1465} {"train_loss": -11.665037155151367, "global_step": 246137, "epoch": 1465} {"train_loss": -11.261126518249512, "global_step": 246138, "epoch": 1465} {"train_loss": -11.51491641998291, "global_step": 246139, "epoch": 1465} {"train_loss": -11.624083518981934, "global_step": 246140, "epoch": 1465} {"train_loss": -11.398948669433594, "global_step": 246141, "epoch": 1465} {"train_loss": -11.113200187683105, "global_step": 246142, "epoch": 1465} {"train_loss": -11.498632431030273, "global_step": 246143, "epoch": 1465} {"train_loss": -11.342652320861816, "global_step": 246144, "epoch": 1465} {"train_loss": -11.315438270568848, "global_step": 246145, "epoch": 1465} {"train_loss": -11.582113265991211, "global_step": 246146, "epoch": 1465} {"train_loss": -10.99142074584961, "global_step": 246147, "epoch": 1465} {"train_loss": -11.683446884155273, "global_step": 246148, "epoch": 1465} {"train_loss": -10.639323234558105, "global_step": 246149, "epoch": 1465} {"train_loss": -11.620450973510742, "global_step": 246150, "epoch": 1465} {"train_loss": -10.664709091186523, "global_step": 246151, "epoch": 1465} {"train_loss": -11.734338760375977, "global_step": 246152, "epoch": 1465} {"train_loss": -10.975593566894531, "global_step": 246153, "epoch": 1465} {"train_loss": -11.386754989624023, "global_step": 246154, "epoch": 1465} {"train_loss": -11.529743194580078, "global_step": 246155, "epoch": 1465} {"train_loss": -11.188159942626953, "global_step": 246156, "epoch": 1465} {"train_loss": -11.792236328125, "global_step": 246157, "epoch": 1465} {"train_loss": -11.093451499938965, "global_step": 246158, "epoch": 1465} {"train_loss": -11.49647331237793, "global_step": 246159, "epoch": 1465} {"train_loss": -11.635096549987793, "global_step": 246160, "epoch": 1465} {"train_loss": -11.586524963378906, "global_step": 246161, "epoch": 1465} {"train_loss": -11.593854904174805, "global_step": 246162, "epoch": 1465} {"train_loss": -11.217639923095703, "global_step": 246163, "epoch": 1465} {"train_loss": -11.356122970581055, "global_step": 246164, "epoch": 1465} {"train_loss": -11.151826858520508, "global_step": 246165, "epoch": 1465} {"train_loss": -11.752399444580078, "global_step": 246166, "epoch": 1465} {"train_loss": -11.540912628173828, "global_step": 246167, "epoch": 1465} {"train_loss": -11.75368881225586, "global_step": 246168, "epoch": 1465} {"train_loss": -11.123100280761719, "global_step": 246169, "epoch": 1465} {"train_loss": -11.592049598693848, "global_step": 246170, "epoch": 1465} {"train_loss": -11.448063850402832, "global_step": 246171, "epoch": 1465} {"train_loss": -11.466102600097656, "global_step": 246172, "epoch": 1465} {"train_loss": -11.560745239257812, "global_step": 246173, "epoch": 1465} {"train_loss": -11.533129692077637, "global_step": 246174, "epoch": 1465} {"train_loss": -11.518556594848633, "global_step": 246175, "epoch": 1465} {"train_loss": -11.514583587646484, "global_step": 246176, "epoch": 1465} {"train_loss": -11.560961723327637, "global_step": 246177, "epoch": 1465} {"train_loss": -11.82876205444336, "global_step": 246178, "epoch": 1465} {"train_loss": -11.599308013916016, "global_step": 246179, "epoch": 1465} {"train_loss": -11.718151092529297, "global_step": 246180, "epoch": 1465} {"train_loss": -11.90148639678955, "global_step": 246181, "epoch": 1465} {"train_loss": -11.304018020629883, "global_step": 246182, "epoch": 1465} {"train_loss": -12.030466079711914, "global_step": 246183, "epoch": 1465} {"train_loss": -11.593820571899414, "global_step": 246184, "epoch": 1465} {"train_loss": -11.836843490600586, "global_step": 246185, "epoch": 1465} {"train_loss": -11.804220199584961, "global_step": 246186, "epoch": 1465} {"train_loss": -11.752828598022461, "global_step": 246187, "epoch": 1465} {"train_loss": -11.749618530273438, "global_step": 246188, "epoch": 1465} {"train_loss": -11.670210838317871, "global_step": 246189, "epoch": 1465} {"train_loss": -12.064367294311523, "global_step": 246190, "epoch": 1465} {"train_loss": -11.814473152160645, "global_step": 246191, "epoch": 1465} {"train_loss": -12.1027250289917, "global_step": 246192, "epoch": 1465} {"train_loss": -11.838653564453125, "global_step": 246193, "epoch": 1465} {"train_loss": -11.717325210571289, "global_step": 246194, "epoch": 1465} {"train_loss": -11.828969955444336, "global_step": 246195, "epoch": 1465} {"train_loss": -11.682477951049805, "global_step": 246196, "epoch": 1465} {"train_loss": -11.826473236083984, "global_step": 246197, "epoch": 1465} {"train_loss": -11.708039283752441, "global_step": 246198, "epoch": 1465} {"train_loss": -11.790450096130371, "global_step": 246199, "epoch": 1465} {"train_loss": -11.881311416625977, "global_step": 246200, "epoch": 1465} {"train_loss": -11.542973518371582, "global_step": 246201, "epoch": 1465} {"train_loss": -11.981246948242188, "global_step": 246202, "epoch": 1465} {"train_loss": -11.831330299377441, "global_step": 246203, "epoch": 1465} {"train_loss": -11.942133903503418, "global_step": 246204, "epoch": 1465} {"train_loss": -11.65754508972168, "global_step": 246205, "epoch": 1465} {"train_loss": -11.28592300415039, "global_step": 246206, "epoch": 1465} {"train_loss": -11.704029083251953, "global_step": 246207, "epoch": 1465} {"train_loss": -11.581535339355469, "global_step": 246208, "epoch": 1465} {"train_loss": -11.729445457458496, "global_step": 246209, "epoch": 1465} {"train_loss": -11.664673805236816, "global_step": 246210, "epoch": 1465} {"train_loss": -11.594488143920898, "global_step": 246211, "epoch": 1465} {"train_loss": -11.256750106811523, "global_step": 246212, "epoch": 1465} {"train_loss": -11.916769981384277, "global_step": 246213, "epoch": 1465} {"train_loss": -11.601062774658203, "global_step": 246214, "epoch": 1465} {"train_loss": -11.708648681640625, "global_step": 246215, "epoch": 1465} {"train_loss": -11.447958946228027, "global_step": 246216, "epoch": 1465} {"train_loss": -11.63131332397461, "global_step": 246217, "epoch": 1465} {"train_loss": -11.090517044067383, "global_step": 246218, "epoch": 1465} {"train_loss": -11.734288215637207, "global_step": 246219, "epoch": 1465} {"train_loss": -11.40443229675293, "global_step": 246220, "epoch": 1465} {"train_loss": -11.84830379486084, "global_step": 246221, "epoch": 1465} {"train_loss": -11.113183975219727, "global_step": 246222, "epoch": 1465} {"train_loss": -10.855113983154297, "global_step": 246223, "epoch": 1465} {"train_loss": -10.90700912475586, "global_step": 246224, "epoch": 1465} {"train_loss": -11.185966491699219, "global_step": 246225, "epoch": 1465} {"train_loss": -11.19929027557373, "global_step": 246226, "epoch": 1465} {"train_loss": -11.961357116699219, "global_step": 246227, "epoch": 1465} {"train_loss": -11.06554126739502, "global_step": 246228, "epoch": 1465} {"train_loss": -11.881075859069824, "global_step": 246229, "epoch": 1465} {"train_loss": -10.944758415222168, "global_step": 246230, "epoch": 1465} {"train_loss": -11.326140403747559, "global_step": 246231, "epoch": 1465} {"train_loss": -11.790525436401367, "global_step": 246232, "epoch": 1465} {"train_loss": -10.404529571533203, "global_step": 246233, "epoch": 1465} {"train_loss": -11.730717658996582, "global_step": 246234, "epoch": 1465} {"train_loss": -11.425882339477539, "global_step": 246235, "epoch": 1465} {"train_loss": -11.81142807006836, "global_step": 246236, "epoch": 1465} {"train_loss": -11.612619400024414, "global_step": 246237, "epoch": 1465} {"train_loss": -11.34349250793457, "global_step": 246238, "epoch": 1465} {"train_loss": -11.680209159851074, "global_step": 246239, "epoch": 1465} {"train_loss": -11.69025993347168, "global_step": 246240, "epoch": 1465} {"train_loss": -11.477478981018066, "global_step": 246241, "epoch": 1465} {"train_loss": -11.912100791931152, "global_step": 246242, "epoch": 1465} {"train_loss": -11.802740097045898, "global_step": 246243, "epoch": 1465} {"train_loss": -11.767094612121582, "global_step": 246244, "epoch": 1465} {"train_loss": -11.544780731201172, "global_step": 246245, "epoch": 1465} {"train_loss": -11.791220664978027, "global_step": 246246, "epoch": 1465} {"train_loss": -11.637584686279297, "global_step": 246247, "epoch": 1465} {"train_loss": -11.74206829071045, "global_step": 246248, "epoch": 1465} {"train_loss": -11.850651741027832, "global_step": 246249, "epoch": 1465} {"train_loss": -11.961530685424805, "global_step": 246250, "epoch": 1465} {"train_loss": -11.716752052307129, "global_step": 246251, "epoch": 1465} {"train_loss": -11.81283187866211, "global_step": 246252, "epoch": 1465} {"train_loss": -12.080780029296875, "global_step": 246253, "epoch": 1465} {"train_loss": -12.022333145141602, "global_step": 246254, "epoch": 1465} {"train_loss": -11.93138313293457, "global_step": 246255, "epoch": 1465} {"train_loss": -11.957611083984375, "global_step": 246256, "epoch": 1465} {"train_loss": -12.040116310119629, "global_step": 246257, "epoch": 1465} {"train_loss": -11.875760078430176, "global_step": 246258, "epoch": 1465} {"train_loss": -11.848999977111816, "global_step": 246259, "epoch": 1465} {"train_loss": -11.702423095703125, "global_step": 246260, "epoch": 1465} {"train_loss": -11.913246154785156, "global_step": 246261, "epoch": 1465} {"train_loss": -11.63262939453125, "global_step": 246262, "epoch": 1465} {"train_loss": -11.896866798400879, "global_step": 246263, "epoch": 1465} {"train_loss": -11.784635543823242, "global_step": 246264, "epoch": 1465} {"train_loss": -11.678483009338379, "global_step": 246265, "epoch": 1465} {"train_loss": -11.972801208496094, "global_step": 246266, "epoch": 1465} {"train_loss": -11.587820053100586, "global_step": 246267, "epoch": 1465} {"train_loss": -11.775592803955078, "global_step": 246268, "epoch": 1465} {"train_loss": -11.527691841125488, "global_step": 246269, "epoch": 1465} {"train_loss": -11.025163650512695, "global_step": 246270, "epoch": 1465} {"train_loss": -11.993024826049805, "global_step": 246271, "epoch": 1465} {"train_loss": -11.348503112792969, "global_step": 246272, "epoch": 1465} {"train_loss": -11.013470649719238, "global_step": 246273, "epoch": 1465} {"train_loss": -12.091711044311523, "global_step": 246274, "epoch": 1465} {"train_loss": -10.822243690490723, "global_step": 246275, "epoch": 1465} {"train_loss": -11.666748046875, "global_step": 246276, "epoch": 1465} {"train_loss": -11.367640495300293, "global_step": 246277, "epoch": 1465} {"train_loss": -11.328826904296875, "global_step": 246278, "epoch": 1465} {"train_loss": -11.617704391479492, "global_step": 246279, "epoch": 1465} {"train_loss": -11.953622817993164, "global_step": 246280, "epoch": 1465} {"train_loss": -11.302225112915039, "global_step": 246281, "epoch": 1465} {"train_loss": -11.788442611694336, "global_step": 246282, "epoch": 1465} {"train_loss": -11.584102630615234, "global_step": 246283, "epoch": 1465} {"train_loss": -11.842098236083984, "global_step": 246284, "epoch": 1465} {"train_loss": -11.685641288757324, "global_step": 246285, "epoch": 1465} {"train_loss": -12.015121459960938, "global_step": 246286, "epoch": 1465} {"train_loss": -11.538393610999698, "global_step": 246287, "epoch": 1465, "val_loss": 265480.0625, "train_action_mse_error": 1.5503485202789307} {"train_loss": -11.921953201293945, "global_step": 246288, "epoch": 1466} {"train_loss": -11.516684532165527, "global_step": 246289, "epoch": 1466} {"train_loss": -11.371790885925293, "global_step": 246290, "epoch": 1466} {"train_loss": -11.598379135131836, "global_step": 246291, "epoch": 1466} {"train_loss": -11.896310806274414, "global_step": 246292, "epoch": 1466} {"train_loss": -11.8321533203125, "global_step": 246293, "epoch": 1466} {"train_loss": -11.775707244873047, "global_step": 246294, "epoch": 1466} {"train_loss": -11.781864166259766, "global_step": 246295, "epoch": 1466} {"train_loss": -11.803447723388672, "global_step": 246296, "epoch": 1466} {"train_loss": -11.865608215332031, "global_step": 246297, "epoch": 1466} {"train_loss": -11.767520904541016, "global_step": 246298, "epoch": 1466} {"train_loss": -11.562296867370605, "global_step": 246299, "epoch": 1466} {"train_loss": -11.937007904052734, "global_step": 246300, "epoch": 1466} {"train_loss": -11.52330207824707, "global_step": 246301, "epoch": 1466} {"train_loss": -11.713269233703613, "global_step": 246302, "epoch": 1466} {"train_loss": -11.389881134033203, "global_step": 246303, "epoch": 1466} {"train_loss": -12.04316234588623, "global_step": 246304, "epoch": 1466} {"train_loss": -11.421334266662598, "global_step": 246305, "epoch": 1466} {"train_loss": -11.784794807434082, "global_step": 246306, "epoch": 1466} {"train_loss": -11.577868461608887, "global_step": 246307, "epoch": 1466} {"train_loss": -11.729595184326172, "global_step": 246308, "epoch": 1466} {"train_loss": -11.763105392456055, "global_step": 246309, "epoch": 1466} {"train_loss": -11.984107971191406, "global_step": 246310, "epoch": 1466} {"train_loss": -11.359269142150879, "global_step": 246311, "epoch": 1466} {"train_loss": -11.810806274414062, "global_step": 246312, "epoch": 1466} {"train_loss": -11.512943267822266, "global_step": 246313, "epoch": 1466} {"train_loss": -11.973974227905273, "global_step": 246314, "epoch": 1466} {"train_loss": -11.432619094848633, "global_step": 246315, "epoch": 1466} {"train_loss": -11.914803504943848, "global_step": 246316, "epoch": 1466} {"train_loss": -11.570993423461914, "global_step": 246317, "epoch": 1466} {"train_loss": -11.720439910888672, "global_step": 246318, "epoch": 1466} {"train_loss": -11.484034538269043, "global_step": 246319, "epoch": 1466} {"train_loss": -10.909661293029785, "global_step": 246320, "epoch": 1466} {"train_loss": -11.685508728027344, "global_step": 246321, "epoch": 1466} {"train_loss": -11.269124984741211, "global_step": 246322, "epoch": 1466} {"train_loss": -10.883336067199707, "global_step": 246323, "epoch": 1466} {"train_loss": -11.36512279510498, "global_step": 246324, "epoch": 1466} {"train_loss": -11.610237121582031, "global_step": 246325, "epoch": 1466} {"train_loss": -11.318193435668945, "global_step": 246326, "epoch": 1466} {"train_loss": -11.421503067016602, "global_step": 246327, "epoch": 1466} {"train_loss": -11.645666122436523, "global_step": 246328, "epoch": 1466} {"train_loss": -11.067886352539062, "global_step": 246329, "epoch": 1466} {"train_loss": -11.308527946472168, "global_step": 246330, "epoch": 1466} {"train_loss": -11.201976776123047, "global_step": 246331, "epoch": 1466} {"train_loss": -11.469706535339355, "global_step": 246332, "epoch": 1466} {"train_loss": -11.33394718170166, "global_step": 246333, "epoch": 1466} {"train_loss": -11.531744003295898, "global_step": 246334, "epoch": 1466} {"train_loss": -10.89979362487793, "global_step": 246335, "epoch": 1466} {"train_loss": -10.626266479492188, "global_step": 246336, "epoch": 1466} {"train_loss": -11.611261367797852, "global_step": 246337, "epoch": 1466} {"train_loss": -11.947121620178223, "global_step": 246338, "epoch": 1466} {"train_loss": -11.476243019104004, "global_step": 246339, "epoch": 1466} {"train_loss": -11.638781547546387, "global_step": 246340, "epoch": 1466} {"train_loss": -11.542153358459473, "global_step": 246341, "epoch": 1466} {"train_loss": -11.626594543457031, "global_step": 246342, "epoch": 1466} {"train_loss": -11.566205024719238, "global_step": 246343, "epoch": 1466} {"train_loss": -11.486482620239258, "global_step": 246344, "epoch": 1466} {"train_loss": -11.816385269165039, "global_step": 246345, "epoch": 1466} {"train_loss": -11.883110046386719, "global_step": 246346, "epoch": 1466} {"train_loss": -11.635839462280273, "global_step": 246347, "epoch": 1466} {"train_loss": -11.721487045288086, "global_step": 246348, "epoch": 1466} {"train_loss": -11.70751953125, "global_step": 246349, "epoch": 1466} {"train_loss": -11.72166919708252, "global_step": 246350, "epoch": 1466} {"train_loss": -11.81173038482666, "global_step": 246351, "epoch": 1466} {"train_loss": -11.311790466308594, "global_step": 246352, "epoch": 1466} {"train_loss": -11.622919082641602, "global_step": 246353, "epoch": 1466} {"train_loss": -11.922926902770996, "global_step": 246354, "epoch": 1466} {"train_loss": -11.31554889678955, "global_step": 246355, "epoch": 1466} {"train_loss": -11.990078926086426, "global_step": 246356, "epoch": 1466} {"train_loss": -11.49795913696289, "global_step": 246357, "epoch": 1466} {"train_loss": -11.988677978515625, "global_step": 246358, "epoch": 1466} {"train_loss": -11.616369247436523, "global_step": 246359, "epoch": 1466} {"train_loss": -11.786283493041992, "global_step": 246360, "epoch": 1466} {"train_loss": -11.925148963928223, "global_step": 246361, "epoch": 1466} {"train_loss": -11.52009391784668, "global_step": 246362, "epoch": 1466} {"train_loss": -11.52562427520752, "global_step": 246363, "epoch": 1466} {"train_loss": -11.610028266906738, "global_step": 246364, "epoch": 1466} {"train_loss": -11.802160263061523, "global_step": 246365, "epoch": 1466} {"train_loss": -11.479734420776367, "global_step": 246366, "epoch": 1466} {"train_loss": -12.004194259643555, "global_step": 246367, "epoch": 1466} {"train_loss": -11.378708839416504, "global_step": 246368, "epoch": 1466} {"train_loss": -11.977620124816895, "global_step": 246369, "epoch": 1466} {"train_loss": -11.78632926940918, "global_step": 246370, "epoch": 1466} {"train_loss": -11.683167457580566, "global_step": 246371, "epoch": 1466} {"train_loss": -11.831692695617676, "global_step": 246372, "epoch": 1466} {"train_loss": -11.909967422485352, "global_step": 246373, "epoch": 1466} {"train_loss": -11.906828880310059, "global_step": 246374, "epoch": 1466} {"train_loss": -11.511889457702637, "global_step": 246375, "epoch": 1466} {"train_loss": -11.970564842224121, "global_step": 246376, "epoch": 1466} {"train_loss": -11.753213882446289, "global_step": 246377, "epoch": 1466} {"train_loss": -11.799124717712402, "global_step": 246378, "epoch": 1466} {"train_loss": -11.725711822509766, "global_step": 246379, "epoch": 1466} {"train_loss": -11.394124984741211, "global_step": 246380, "epoch": 1466} {"train_loss": -11.843417167663574, "global_step": 246381, "epoch": 1466} {"train_loss": -11.770488739013672, "global_step": 246382, "epoch": 1466} {"train_loss": -11.342548370361328, "global_step": 246383, "epoch": 1466} {"train_loss": -11.64742374420166, "global_step": 246384, "epoch": 1466} {"train_loss": -11.908062934875488, "global_step": 246385, "epoch": 1466} {"train_loss": -11.69650650024414, "global_step": 246386, "epoch": 1466} {"train_loss": -12.047523498535156, "global_step": 246387, "epoch": 1466} {"train_loss": -11.992694854736328, "global_step": 246388, "epoch": 1466} {"train_loss": -11.934796333312988, "global_step": 246389, "epoch": 1466} {"train_loss": -11.994150161743164, "global_step": 246390, "epoch": 1466} {"train_loss": -12.026378631591797, "global_step": 246391, "epoch": 1466} {"train_loss": -12.009941101074219, "global_step": 246392, "epoch": 1466} {"train_loss": -11.992521286010742, "global_step": 246393, "epoch": 1466} {"train_loss": -12.037644386291504, "global_step": 246394, "epoch": 1466} {"train_loss": -12.078842163085938, "global_step": 246395, "epoch": 1466} {"train_loss": -11.78730583190918, "global_step": 246396, "epoch": 1466} {"train_loss": -12.032612800598145, "global_step": 246397, "epoch": 1466} {"train_loss": -12.053098678588867, "global_step": 246398, "epoch": 1466} {"train_loss": -11.875446319580078, "global_step": 246399, "epoch": 1466} {"train_loss": -11.968708992004395, "global_step": 246400, "epoch": 1466} {"train_loss": -12.007381439208984, "global_step": 246401, "epoch": 1466} {"train_loss": -12.039670944213867, "global_step": 246402, "epoch": 1466} {"train_loss": -11.926599502563477, "global_step": 246403, "epoch": 1466} {"train_loss": -12.294683456420898, "global_step": 246404, "epoch": 1466} {"train_loss": -11.647889137268066, "global_step": 246405, "epoch": 1466} {"train_loss": -12.27425765991211, "global_step": 246406, "epoch": 1466} {"train_loss": -11.995553970336914, "global_step": 246407, "epoch": 1466} {"train_loss": -11.875515937805176, "global_step": 246408, "epoch": 1466} {"train_loss": -11.738995552062988, "global_step": 246409, "epoch": 1466} {"train_loss": -12.00363540649414, "global_step": 246410, "epoch": 1466} {"train_loss": -11.86205768585205, "global_step": 246411, "epoch": 1466} {"train_loss": -11.548604965209961, "global_step": 246412, "epoch": 1466} {"train_loss": -12.074414253234863, "global_step": 246413, "epoch": 1466} {"train_loss": -11.709128379821777, "global_step": 246414, "epoch": 1466} {"train_loss": -11.5975341796875, "global_step": 246415, "epoch": 1466} {"train_loss": -11.884891510009766, "global_step": 246416, "epoch": 1466} {"train_loss": -11.83915901184082, "global_step": 246417, "epoch": 1466} {"train_loss": -12.307968139648438, "global_step": 246418, "epoch": 1466} {"train_loss": -12.251703262329102, "global_step": 246419, "epoch": 1466} {"train_loss": -11.518352508544922, "global_step": 246420, "epoch": 1466} {"train_loss": -11.424098014831543, "global_step": 246421, "epoch": 1466} {"train_loss": -11.671771049499512, "global_step": 246422, "epoch": 1466} {"train_loss": -11.149460792541504, "global_step": 246423, "epoch": 1466} {"train_loss": -12.026561737060547, "global_step": 246424, "epoch": 1466} {"train_loss": -11.232132911682129, "global_step": 246425, "epoch": 1466} {"train_loss": -11.606681823730469, "global_step": 246426, "epoch": 1466} {"train_loss": -11.386016845703125, "global_step": 246427, "epoch": 1466} {"train_loss": -11.669096946716309, "global_step": 246428, "epoch": 1466} {"train_loss": -11.220108985900879, "global_step": 246429, "epoch": 1466} {"train_loss": -11.576375961303711, "global_step": 246430, "epoch": 1466} {"train_loss": -11.483168601989746, "global_step": 246431, "epoch": 1466} {"train_loss": -11.439387321472168, "global_step": 246432, "epoch": 1466} {"train_loss": -11.954082489013672, "global_step": 246433, "epoch": 1466} {"train_loss": -11.721208572387695, "global_step": 246434, "epoch": 1466} {"train_loss": -11.843846321105957, "global_step": 246435, "epoch": 1466} {"train_loss": -11.918649673461914, "global_step": 246436, "epoch": 1466} {"train_loss": -11.278782844543457, "global_step": 246437, "epoch": 1466} {"train_loss": -11.628861427307129, "global_step": 246438, "epoch": 1466} {"train_loss": -11.547473907470703, "global_step": 246439, "epoch": 1466} {"train_loss": -11.814750671386719, "global_step": 246440, "epoch": 1466} {"train_loss": -11.1566162109375, "global_step": 246441, "epoch": 1466} {"train_loss": -11.818511962890625, "global_step": 246442, "epoch": 1466} {"train_loss": -11.740388870239258, "global_step": 246443, "epoch": 1466} {"train_loss": -11.666807174682617, "global_step": 246444, "epoch": 1466} {"train_loss": -10.305806159973145, "global_step": 246445, "epoch": 1466} {"train_loss": -8.912163734436035, "global_step": 246446, "epoch": 1466} {"train_loss": -11.253721237182617, "global_step": 246447, "epoch": 1466} {"train_loss": -11.278703689575195, "global_step": 246448, "epoch": 1466} {"train_loss": -10.581108093261719, "global_step": 246449, "epoch": 1466} {"train_loss": -10.989313125610352, "global_step": 246450, "epoch": 1466} {"train_loss": -10.442859649658203, "global_step": 246451, "epoch": 1466} {"train_loss": -11.290162086486816, "global_step": 246452, "epoch": 1466} {"train_loss": -11.219850540161133, "global_step": 246453, "epoch": 1466} {"train_loss": -11.143308639526367, "global_step": 246454, "epoch": 1466} {"train_loss": -11.623575068655468, "global_step": 246455, "epoch": 1466, "val_loss": 267699.84375} {"train_loss": -10.312519073486328, "global_step": 246456, "epoch": 1467} {"train_loss": -10.920675277709961, "global_step": 246457, "epoch": 1467} {"train_loss": -10.372259140014648, "global_step": 246458, "epoch": 1467} {"train_loss": -10.430126190185547, "global_step": 246459, "epoch": 1467} {"train_loss": -11.411654472351074, "global_step": 246460, "epoch": 1467} {"train_loss": -9.574625015258789, "global_step": 246461, "epoch": 1467} {"train_loss": -11.614248275756836, "global_step": 246462, "epoch": 1467} {"train_loss": -10.622000694274902, "global_step": 246463, "epoch": 1467} {"train_loss": -11.426586151123047, "global_step": 246464, "epoch": 1467} {"train_loss": -10.666784286499023, "global_step": 246465, "epoch": 1467} {"train_loss": -10.490636825561523, "global_step": 246466, "epoch": 1467} {"train_loss": -9.968950271606445, "global_step": 246467, "epoch": 1467} {"train_loss": -10.838998794555664, "global_step": 246468, "epoch": 1467} {"train_loss": -9.916725158691406, "global_step": 246469, "epoch": 1467} {"train_loss": -11.349801063537598, "global_step": 246470, "epoch": 1467} {"train_loss": -10.470173835754395, "global_step": 246471, "epoch": 1467} {"train_loss": -11.271435737609863, "global_step": 246472, "epoch": 1467} {"train_loss": -10.838561058044434, "global_step": 246473, "epoch": 1467} {"train_loss": -11.411396980285645, "global_step": 246474, "epoch": 1467} {"train_loss": -11.018105506896973, "global_step": 246475, "epoch": 1467} {"train_loss": -11.467416763305664, "global_step": 246476, "epoch": 1467} {"train_loss": -11.264041900634766, "global_step": 246477, "epoch": 1467} {"train_loss": -11.675132751464844, "global_step": 246478, "epoch": 1467} {"train_loss": -11.359481811523438, "global_step": 246479, "epoch": 1467} {"train_loss": -11.560949325561523, "global_step": 246480, "epoch": 1467} {"train_loss": -11.478109359741211, "global_step": 246481, "epoch": 1467} {"train_loss": -11.563024520874023, "global_step": 246482, "epoch": 1467} {"train_loss": -11.115429878234863, "global_step": 246483, "epoch": 1467} {"train_loss": -11.2257661819458, "global_step": 246484, "epoch": 1467} {"train_loss": -11.081903457641602, "global_step": 246485, "epoch": 1467} {"train_loss": -11.334165573120117, "global_step": 246486, "epoch": 1467} {"train_loss": -11.288536071777344, "global_step": 246487, "epoch": 1467} {"train_loss": -11.270994186401367, "global_step": 246488, "epoch": 1467} {"train_loss": -11.506631851196289, "global_step": 246489, "epoch": 1467} {"train_loss": -11.447890281677246, "global_step": 246490, "epoch": 1467} {"train_loss": -11.0408353805542, "global_step": 246491, "epoch": 1467} {"train_loss": -11.398733139038086, "global_step": 246492, "epoch": 1467} {"train_loss": -11.150239944458008, "global_step": 246493, "epoch": 1467} {"train_loss": -11.401932716369629, "global_step": 246494, "epoch": 1467} {"train_loss": -11.018162727355957, "global_step": 246495, "epoch": 1467} {"train_loss": -11.46535873413086, "global_step": 246496, "epoch": 1467} {"train_loss": -11.462703704833984, "global_step": 246497, "epoch": 1467} {"train_loss": -11.623867988586426, "global_step": 246498, "epoch": 1467} {"train_loss": -11.492555618286133, "global_step": 246499, "epoch": 1467} {"train_loss": -11.641912460327148, "global_step": 246500, "epoch": 1467} {"train_loss": -11.46027946472168, "global_step": 246501, "epoch": 1467} {"train_loss": -11.546640396118164, "global_step": 246502, "epoch": 1467} {"train_loss": -11.585811614990234, "global_step": 246503, "epoch": 1467} {"train_loss": -11.702220916748047, "global_step": 246504, "epoch": 1467} {"train_loss": -11.55694580078125, "global_step": 246505, "epoch": 1467} {"train_loss": -11.743581771850586, "global_step": 246506, "epoch": 1467} {"train_loss": -11.453168869018555, "global_step": 246507, "epoch": 1467} {"train_loss": -11.827722549438477, "global_step": 246508, "epoch": 1467} {"train_loss": -11.79908561706543, "global_step": 246509, "epoch": 1467} {"train_loss": -11.827947616577148, "global_step": 246510, "epoch": 1467} {"train_loss": -11.95917797088623, "global_step": 246511, "epoch": 1467} {"train_loss": -11.855804443359375, "global_step": 246512, "epoch": 1467} {"train_loss": -11.996028900146484, "global_step": 246513, "epoch": 1467} {"train_loss": -12.015750885009766, "global_step": 246514, "epoch": 1467} {"train_loss": -12.011754035949707, "global_step": 246515, "epoch": 1467} {"train_loss": -12.038867950439453, "global_step": 246516, "epoch": 1467} {"train_loss": -11.80714225769043, "global_step": 246517, "epoch": 1467} {"train_loss": -11.865660667419434, "global_step": 246518, "epoch": 1467} {"train_loss": -11.875520706176758, "global_step": 246519, "epoch": 1467} {"train_loss": -12.095354080200195, "global_step": 246520, "epoch": 1467} {"train_loss": -11.83046817779541, "global_step": 246521, "epoch": 1467} {"train_loss": -11.981481552124023, "global_step": 246522, "epoch": 1467} {"train_loss": -12.05117416381836, "global_step": 246523, "epoch": 1467} {"train_loss": -11.89471435546875, "global_step": 246524, "epoch": 1467} {"train_loss": -12.057779312133789, "global_step": 246525, "epoch": 1467} {"train_loss": -12.137816429138184, "global_step": 246526, "epoch": 1467} {"train_loss": -11.790386199951172, "global_step": 246527, "epoch": 1467} {"train_loss": -12.008138656616211, "global_step": 246528, "epoch": 1467} {"train_loss": -11.97751235961914, "global_step": 246529, "epoch": 1467} {"train_loss": -12.03615951538086, "global_step": 246530, "epoch": 1467} {"train_loss": -11.785385131835938, "global_step": 246531, "epoch": 1467} {"train_loss": -12.178802490234375, "global_step": 246532, "epoch": 1467} {"train_loss": -12.240018844604492, "global_step": 246533, "epoch": 1467} {"train_loss": -12.164285659790039, "global_step": 246534, "epoch": 1467} {"train_loss": -12.068482398986816, "global_step": 246535, "epoch": 1467} {"train_loss": -12.149792671203613, "global_step": 246536, "epoch": 1467} {"train_loss": -11.907278060913086, "global_step": 246537, "epoch": 1467} {"train_loss": -11.828886032104492, "global_step": 246538, "epoch": 1467} {"train_loss": -12.24007797241211, "global_step": 246539, "epoch": 1467} {"train_loss": -12.000753402709961, "global_step": 246540, "epoch": 1467} {"train_loss": -12.248915672302246, "global_step": 246541, "epoch": 1467} {"train_loss": -11.855146408081055, "global_step": 246542, "epoch": 1467} {"train_loss": -12.130613327026367, "global_step": 246543, "epoch": 1467} {"train_loss": -11.926198959350586, "global_step": 246544, "epoch": 1467} {"train_loss": -12.38794994354248, "global_step": 246545, "epoch": 1467} {"train_loss": -12.05903434753418, "global_step": 246546, "epoch": 1467} {"train_loss": -12.202789306640625, "global_step": 246547, "epoch": 1467} {"train_loss": -12.075791358947754, "global_step": 246548, "epoch": 1467} {"train_loss": -11.936196327209473, "global_step": 246549, "epoch": 1467} {"train_loss": -12.252264022827148, "global_step": 246550, "epoch": 1467} {"train_loss": -11.865411758422852, "global_step": 246551, "epoch": 1467} {"train_loss": -12.020380973815918, "global_step": 246552, "epoch": 1467} {"train_loss": -12.304189682006836, "global_step": 246553, "epoch": 1467} {"train_loss": -11.36683464050293, "global_step": 246554, "epoch": 1467} {"train_loss": -11.744012832641602, "global_step": 246555, "epoch": 1467} {"train_loss": -11.943418502807617, "global_step": 246556, "epoch": 1467} {"train_loss": -12.194534301757812, "global_step": 246557, "epoch": 1467} {"train_loss": -11.773504257202148, "global_step": 246558, "epoch": 1467} {"train_loss": -11.902973175048828, "global_step": 246559, "epoch": 1467} {"train_loss": -11.794533729553223, "global_step": 246560, "epoch": 1467} {"train_loss": -11.850152969360352, "global_step": 246561, "epoch": 1467} {"train_loss": -11.771674156188965, "global_step": 246562, "epoch": 1467} {"train_loss": -11.47805404663086, "global_step": 246563, "epoch": 1467} {"train_loss": -12.193788528442383, "global_step": 246564, "epoch": 1467} {"train_loss": -12.118302345275879, "global_step": 246565, "epoch": 1467} {"train_loss": -11.914141654968262, "global_step": 246566, "epoch": 1467} {"train_loss": -11.871076583862305, "global_step": 246567, "epoch": 1467} {"train_loss": -11.844179153442383, "global_step": 246568, "epoch": 1467} {"train_loss": -11.862325668334961, "global_step": 246569, "epoch": 1467} {"train_loss": -11.567301750183105, "global_step": 246570, "epoch": 1467} {"train_loss": -11.829609870910645, "global_step": 246571, "epoch": 1467} {"train_loss": -11.747407913208008, "global_step": 246572, "epoch": 1467} {"train_loss": -11.722036361694336, "global_step": 246573, "epoch": 1467} {"train_loss": -11.647623062133789, "global_step": 246574, "epoch": 1467} {"train_loss": -11.802774429321289, "global_step": 246575, "epoch": 1467} {"train_loss": -11.727495193481445, "global_step": 246576, "epoch": 1467} {"train_loss": -12.129854202270508, "global_step": 246577, "epoch": 1467} {"train_loss": -12.235357284545898, "global_step": 246578, "epoch": 1467} {"train_loss": -12.057880401611328, "global_step": 246579, "epoch": 1467} {"train_loss": -11.9608154296875, "global_step": 246580, "epoch": 1467} {"train_loss": -12.005353927612305, "global_step": 246581, "epoch": 1467} {"train_loss": -12.095067977905273, "global_step": 246582, "epoch": 1467} {"train_loss": -12.071958541870117, "global_step": 246583, "epoch": 1467} {"train_loss": -12.157062530517578, "global_step": 246584, "epoch": 1467} {"train_loss": -12.02857780456543, "global_step": 246585, "epoch": 1467} {"train_loss": -11.357190132141113, "global_step": 246586, "epoch": 1467} {"train_loss": -11.867698669433594, "global_step": 246587, "epoch": 1467} {"train_loss": -10.90734577178955, "global_step": 246588, "epoch": 1467} {"train_loss": -11.332141876220703, "global_step": 246589, "epoch": 1467} {"train_loss": -11.814061164855957, "global_step": 246590, "epoch": 1467} {"train_loss": -11.871837615966797, "global_step": 246591, "epoch": 1467} {"train_loss": -11.299732208251953, "global_step": 246592, "epoch": 1467} {"train_loss": -11.163111686706543, "global_step": 246593, "epoch": 1467} {"train_loss": -11.63577938079834, "global_step": 246594, "epoch": 1467} {"train_loss": -12.051167488098145, "global_step": 246595, "epoch": 1467} {"train_loss": -11.75110912322998, "global_step": 246596, "epoch": 1467} {"train_loss": -11.359439849853516, "global_step": 246597, "epoch": 1467} {"train_loss": -11.829191207885742, "global_step": 246598, "epoch": 1467} {"train_loss": -11.948531150817871, "global_step": 246599, "epoch": 1467} {"train_loss": -11.778304100036621, "global_step": 246600, "epoch": 1467} {"train_loss": -11.54415512084961, "global_step": 246601, "epoch": 1467} {"train_loss": -11.851309776306152, "global_step": 246602, "epoch": 1467} {"train_loss": -12.108199119567871, "global_step": 246603, "epoch": 1467} {"train_loss": -11.976892471313477, "global_step": 246604, "epoch": 1467} {"train_loss": -11.82435417175293, "global_step": 246605, "epoch": 1467} {"train_loss": -11.757063865661621, "global_step": 246606, "epoch": 1467} {"train_loss": -11.890756607055664, "global_step": 246607, "epoch": 1467} {"train_loss": -11.728726387023926, "global_step": 246608, "epoch": 1467} {"train_loss": -11.558061599731445, "global_step": 246609, "epoch": 1467} {"train_loss": -11.765815734863281, "global_step": 246610, "epoch": 1467} {"train_loss": -11.587252616882324, "global_step": 246611, "epoch": 1467} {"train_loss": -10.202780723571777, "global_step": 246612, "epoch": 1467} {"train_loss": -11.252640724182129, "global_step": 246613, "epoch": 1467} {"train_loss": -11.20474624633789, "global_step": 246614, "epoch": 1467} {"train_loss": -10.547868728637695, "global_step": 246615, "epoch": 1467} {"train_loss": -9.899843215942383, "global_step": 246616, "epoch": 1467} {"train_loss": -11.172369003295898, "global_step": 246617, "epoch": 1467} {"train_loss": -9.844407081604004, "global_step": 246618, "epoch": 1467} {"train_loss": -10.09438705444336, "global_step": 246619, "epoch": 1467} {"train_loss": -10.848038673400879, "global_step": 246620, "epoch": 1467} {"train_loss": -8.606080055236816, "global_step": 246621, "epoch": 1467} {"train_loss": -11.471427917480469, "global_step": 246622, "epoch": 1467} {"train_loss": -11.55487631048475, "global_step": 246623, "epoch": 1467, "val_loss": 269609.0} {"train_loss": -10.841157913208008, "global_step": 246624, "epoch": 1468} {"train_loss": -10.720987319946289, "global_step": 246625, "epoch": 1468} {"train_loss": -11.145525932312012, "global_step": 246626, "epoch": 1468} {"train_loss": -11.010712623596191, "global_step": 246627, "epoch": 1468} {"train_loss": -10.761274337768555, "global_step": 246628, "epoch": 1468} {"train_loss": -11.266218185424805, "global_step": 246629, "epoch": 1468} {"train_loss": -10.957685470581055, "global_step": 246630, "epoch": 1468} {"train_loss": -11.314099311828613, "global_step": 246631, "epoch": 1468} {"train_loss": -11.13280200958252, "global_step": 246632, "epoch": 1468} {"train_loss": -11.25400161743164, "global_step": 246633, "epoch": 1468} {"train_loss": -10.375245094299316, "global_step": 246634, "epoch": 1468} {"train_loss": -11.172977447509766, "global_step": 246635, "epoch": 1468} {"train_loss": -11.376953125, "global_step": 246636, "epoch": 1468} {"train_loss": -11.266523361206055, "global_step": 246637, "epoch": 1468} {"train_loss": -11.03541374206543, "global_step": 246638, "epoch": 1468} {"train_loss": -11.352080345153809, "global_step": 246639, "epoch": 1468} {"train_loss": -11.434555053710938, "global_step": 246640, "epoch": 1468} {"train_loss": -11.142391204833984, "global_step": 246641, "epoch": 1468} {"train_loss": -11.285673141479492, "global_step": 246642, "epoch": 1468} {"train_loss": -11.327630996704102, "global_step": 246643, "epoch": 1468} {"train_loss": -11.659172058105469, "global_step": 246644, "epoch": 1468} {"train_loss": -11.589277267456055, "global_step": 246645, "epoch": 1468} {"train_loss": -11.566545486450195, "global_step": 246646, "epoch": 1468} {"train_loss": -11.644315719604492, "global_step": 246647, "epoch": 1468} {"train_loss": -11.335286140441895, "global_step": 246648, "epoch": 1468} {"train_loss": -11.527292251586914, "global_step": 246649, "epoch": 1468} {"train_loss": -11.543130874633789, "global_step": 246650, "epoch": 1468} {"train_loss": -11.616966247558594, "global_step": 246651, "epoch": 1468} {"train_loss": -11.618474960327148, "global_step": 246652, "epoch": 1468} {"train_loss": -11.248369216918945, "global_step": 246653, "epoch": 1468} {"train_loss": -11.78261661529541, "global_step": 246654, "epoch": 1468} {"train_loss": -11.423964500427246, "global_step": 246655, "epoch": 1468} {"train_loss": -11.304574966430664, "global_step": 246656, "epoch": 1468} {"train_loss": -11.690364837646484, "global_step": 246657, "epoch": 1468} {"train_loss": -11.711606979370117, "global_step": 246658, "epoch": 1468} {"train_loss": -11.770248413085938, "global_step": 246659, "epoch": 1468} {"train_loss": -11.748320579528809, "global_step": 246660, "epoch": 1468} {"train_loss": -11.882287979125977, "global_step": 246661, "epoch": 1468} {"train_loss": -11.6746826171875, "global_step": 246662, "epoch": 1468} {"train_loss": -11.718368530273438, "global_step": 246663, "epoch": 1468} {"train_loss": -11.6463623046875, "global_step": 246664, "epoch": 1468} {"train_loss": -11.932332038879395, "global_step": 246665, "epoch": 1468} {"train_loss": -11.631570816040039, "global_step": 246666, "epoch": 1468} {"train_loss": -11.799583435058594, "global_step": 246667, "epoch": 1468} {"train_loss": -11.71023178100586, "global_step": 246668, "epoch": 1468} {"train_loss": -11.846031188964844, "global_step": 246669, "epoch": 1468} {"train_loss": -11.856527328491211, "global_step": 246670, "epoch": 1468} {"train_loss": -11.88766098022461, "global_step": 246671, "epoch": 1468} {"train_loss": -11.769745826721191, "global_step": 246672, "epoch": 1468} {"train_loss": -11.747682571411133, "global_step": 246673, "epoch": 1468} {"train_loss": -11.784444808959961, "global_step": 246674, "epoch": 1468} {"train_loss": -11.907417297363281, "global_step": 246675, "epoch": 1468} {"train_loss": -11.873289108276367, "global_step": 246676, "epoch": 1468} {"train_loss": -11.7371826171875, "global_step": 246677, "epoch": 1468} {"train_loss": -11.707769393920898, "global_step": 246678, "epoch": 1468} {"train_loss": -12.134117126464844, "global_step": 246679, "epoch": 1468} {"train_loss": -12.03537654876709, "global_step": 246680, "epoch": 1468} {"train_loss": -12.105613708496094, "global_step": 246681, "epoch": 1468} {"train_loss": -11.942609786987305, "global_step": 246682, "epoch": 1468} {"train_loss": -12.070606231689453, "global_step": 246683, "epoch": 1468} {"train_loss": -11.938919067382812, "global_step": 246684, "epoch": 1468} {"train_loss": -12.103139877319336, "global_step": 246685, "epoch": 1468} {"train_loss": -11.91826343536377, "global_step": 246686, "epoch": 1468} {"train_loss": -11.678777694702148, "global_step": 246687, "epoch": 1468} {"train_loss": -12.08845043182373, "global_step": 246688, "epoch": 1468} {"train_loss": -11.921295166015625, "global_step": 246689, "epoch": 1468} {"train_loss": -12.020121574401855, "global_step": 246690, "epoch": 1468} {"train_loss": -11.778929710388184, "global_step": 246691, "epoch": 1468} {"train_loss": -11.91080093383789, "global_step": 246692, "epoch": 1468} {"train_loss": -11.85084342956543, "global_step": 246693, "epoch": 1468} {"train_loss": -11.92048454284668, "global_step": 246694, "epoch": 1468} {"train_loss": -11.379429817199707, "global_step": 246695, "epoch": 1468} {"train_loss": -12.049982070922852, "global_step": 246696, "epoch": 1468} {"train_loss": -11.717391967773438, "global_step": 246697, "epoch": 1468} {"train_loss": -12.039722442626953, "global_step": 246698, "epoch": 1468} {"train_loss": -11.714704513549805, "global_step": 246699, "epoch": 1468} {"train_loss": -12.058538436889648, "global_step": 246700, "epoch": 1468} {"train_loss": -11.821290969848633, "global_step": 246701, "epoch": 1468} {"train_loss": -12.14385986328125, "global_step": 246702, "epoch": 1468} {"train_loss": -11.95833969116211, "global_step": 246703, "epoch": 1468} {"train_loss": -12.019745826721191, "global_step": 246704, "epoch": 1468} {"train_loss": -11.657389640808105, "global_step": 246705, "epoch": 1468} {"train_loss": -11.504528045654297, "global_step": 246706, "epoch": 1468} {"train_loss": -11.46251106262207, "global_step": 246707, "epoch": 1468} {"train_loss": -11.88254165649414, "global_step": 246708, "epoch": 1468} {"train_loss": -11.643293380737305, "global_step": 246709, "epoch": 1468} {"train_loss": -11.781970024108887, "global_step": 246710, "epoch": 1468} {"train_loss": -11.529203414916992, "global_step": 246711, "epoch": 1468} {"train_loss": -12.009542465209961, "global_step": 246712, "epoch": 1468} {"train_loss": -11.597121238708496, "global_step": 246713, "epoch": 1468} {"train_loss": -11.776473999023438, "global_step": 246714, "epoch": 1468} {"train_loss": -11.652725219726562, "global_step": 246715, "epoch": 1468} {"train_loss": -11.652095794677734, "global_step": 246716, "epoch": 1468} {"train_loss": -11.6839599609375, "global_step": 246717, "epoch": 1468} {"train_loss": -11.546257019042969, "global_step": 246718, "epoch": 1468} {"train_loss": -11.662713050842285, "global_step": 246719, "epoch": 1468} {"train_loss": -11.378946304321289, "global_step": 246720, "epoch": 1468} {"train_loss": -11.850692749023438, "global_step": 246721, "epoch": 1468} {"train_loss": -10.470005989074707, "global_step": 246722, "epoch": 1468} {"train_loss": -11.528852462768555, "global_step": 246723, "epoch": 1468} {"train_loss": -11.512380599975586, "global_step": 246724, "epoch": 1468} {"train_loss": -11.809206008911133, "global_step": 246725, "epoch": 1468} {"train_loss": -10.686882019042969, "global_step": 246726, "epoch": 1468} {"train_loss": -11.789787292480469, "global_step": 246727, "epoch": 1468} {"train_loss": -10.992243766784668, "global_step": 246728, "epoch": 1468} {"train_loss": -11.574294090270996, "global_step": 246729, "epoch": 1468} {"train_loss": -10.934289932250977, "global_step": 246730, "epoch": 1468} {"train_loss": -11.630409240722656, "global_step": 246731, "epoch": 1468} {"train_loss": -10.757898330688477, "global_step": 246732, "epoch": 1468} {"train_loss": -10.202568054199219, "global_step": 246733, "epoch": 1468} {"train_loss": -11.789265632629395, "global_step": 246734, "epoch": 1468} {"train_loss": -11.301572799682617, "global_step": 246735, "epoch": 1468} {"train_loss": -11.34836483001709, "global_step": 246736, "epoch": 1468} {"train_loss": -11.83709716796875, "global_step": 246737, "epoch": 1468} {"train_loss": -11.769338607788086, "global_step": 246738, "epoch": 1468} {"train_loss": -11.49372673034668, "global_step": 246739, "epoch": 1468} {"train_loss": -11.580432891845703, "global_step": 246740, "epoch": 1468} {"train_loss": -11.89714241027832, "global_step": 246741, "epoch": 1468} {"train_loss": -11.663654327392578, "global_step": 246742, "epoch": 1468} {"train_loss": -11.78689956665039, "global_step": 246743, "epoch": 1468} {"train_loss": -11.666799545288086, "global_step": 246744, "epoch": 1468} {"train_loss": -11.800344467163086, "global_step": 246745, "epoch": 1468} {"train_loss": -11.326579093933105, "global_step": 246746, "epoch": 1468} {"train_loss": -11.828924179077148, "global_step": 246747, "epoch": 1468} {"train_loss": -11.291830062866211, "global_step": 246748, "epoch": 1468} {"train_loss": -11.65219497680664, "global_step": 246749, "epoch": 1468} {"train_loss": -11.244010925292969, "global_step": 246750, "epoch": 1468} {"train_loss": -11.307605743408203, "global_step": 246751, "epoch": 1468} {"train_loss": -11.307012557983398, "global_step": 246752, "epoch": 1468} {"train_loss": -11.282987594604492, "global_step": 246753, "epoch": 1468} {"train_loss": -11.295310974121094, "global_step": 246754, "epoch": 1468} {"train_loss": -11.496726989746094, "global_step": 246755, "epoch": 1468} {"train_loss": -11.728334426879883, "global_step": 246756, "epoch": 1468} {"train_loss": -11.196200370788574, "global_step": 246757, "epoch": 1468} {"train_loss": -11.662744522094727, "global_step": 246758, "epoch": 1468} {"train_loss": -11.596635818481445, "global_step": 246759, "epoch": 1468} {"train_loss": -11.789022445678711, "global_step": 246760, "epoch": 1468} {"train_loss": -11.745655059814453, "global_step": 246761, "epoch": 1468} {"train_loss": -11.615448951721191, "global_step": 246762, "epoch": 1468} {"train_loss": -11.588955879211426, "global_step": 246763, "epoch": 1468} {"train_loss": -11.917572975158691, "global_step": 246764, "epoch": 1468} {"train_loss": -11.632511138916016, "global_step": 246765, "epoch": 1468} {"train_loss": -11.479795455932617, "global_step": 246766, "epoch": 1468} {"train_loss": -11.518232345581055, "global_step": 246767, "epoch": 1468} {"train_loss": -11.502355575561523, "global_step": 246768, "epoch": 1468} {"train_loss": -11.775066375732422, "global_step": 246769, "epoch": 1468} {"train_loss": -11.669759750366211, "global_step": 246770, "epoch": 1468} {"train_loss": -11.792709350585938, "global_step": 246771, "epoch": 1468} {"train_loss": -11.414840698242188, "global_step": 246772, "epoch": 1468} {"train_loss": -11.887350082397461, "global_step": 246773, "epoch": 1468} {"train_loss": -11.665647506713867, "global_step": 246774, "epoch": 1468} {"train_loss": -11.282878875732422, "global_step": 246775, "epoch": 1468} {"train_loss": -11.71080493927002, "global_step": 246776, "epoch": 1468} {"train_loss": -11.802641868591309, "global_step": 246777, "epoch": 1468} {"train_loss": -11.766468048095703, "global_step": 246778, "epoch": 1468} {"train_loss": -11.825661659240723, "global_step": 246779, "epoch": 1468} {"train_loss": -11.731338500976562, "global_step": 246780, "epoch": 1468} {"train_loss": -12.022141456604004, "global_step": 246781, "epoch": 1468} {"train_loss": -11.960494995117188, "global_step": 246782, "epoch": 1468} {"train_loss": -11.747657775878906, "global_step": 246783, "epoch": 1468} {"train_loss": -12.169204711914062, "global_step": 246784, "epoch": 1468} {"train_loss": -11.534801483154297, "global_step": 246785, "epoch": 1468} {"train_loss": -11.982063293457031, "global_step": 246786, "epoch": 1468} {"train_loss": -11.884029388427734, "global_step": 246787, "epoch": 1468} {"train_loss": -11.395345687866211, "global_step": 246788, "epoch": 1468} {"train_loss": -11.875751495361328, "global_step": 246789, "epoch": 1468} {"train_loss": -11.501876831054688, "global_step": 246790, "epoch": 1468} {"train_loss": -11.599207878112793, "global_step": 246791, "epoch": 1468, "val_loss": 271489.90625} {"train_loss": -11.451263427734375, "global_step": 246792, "epoch": 1469} {"train_loss": -11.884989738464355, "global_step": 246793, "epoch": 1469} {"train_loss": -11.63154125213623, "global_step": 246794, "epoch": 1469} {"train_loss": -11.843766212463379, "global_step": 246795, "epoch": 1469} {"train_loss": -11.880767822265625, "global_step": 246796, "epoch": 1469} {"train_loss": -11.766554832458496, "global_step": 246797, "epoch": 1469} {"train_loss": -12.156391143798828, "global_step": 246798, "epoch": 1469} {"train_loss": -11.718255996704102, "global_step": 246799, "epoch": 1469} {"train_loss": -11.903322219848633, "global_step": 246800, "epoch": 1469} {"train_loss": -12.094772338867188, "global_step": 246801, "epoch": 1469} {"train_loss": -11.498282432556152, "global_step": 246802, "epoch": 1469} {"train_loss": -11.951150894165039, "global_step": 246803, "epoch": 1469} {"train_loss": -11.64728832244873, "global_step": 246804, "epoch": 1469} {"train_loss": -12.018948554992676, "global_step": 246805, "epoch": 1469} {"train_loss": -11.944413185119629, "global_step": 246806, "epoch": 1469} {"train_loss": -11.923677444458008, "global_step": 246807, "epoch": 1469} {"train_loss": -11.748008728027344, "global_step": 246808, "epoch": 1469} {"train_loss": -11.612117767333984, "global_step": 246809, "epoch": 1469} {"train_loss": -12.296859741210938, "global_step": 246810, "epoch": 1469} {"train_loss": -11.780855178833008, "global_step": 246811, "epoch": 1469} {"train_loss": -12.079658508300781, "global_step": 246812, "epoch": 1469} {"train_loss": -12.143367767333984, "global_step": 246813, "epoch": 1469} {"train_loss": -12.207740783691406, "global_step": 246814, "epoch": 1469} {"train_loss": -12.200705528259277, "global_step": 246815, "epoch": 1469} {"train_loss": -12.17340087890625, "global_step": 246816, "epoch": 1469} {"train_loss": -12.09223747253418, "global_step": 246817, "epoch": 1469} {"train_loss": -12.130566596984863, "global_step": 246818, "epoch": 1469} {"train_loss": -11.999774932861328, "global_step": 246819, "epoch": 1469} {"train_loss": -11.984701156616211, "global_step": 246820, "epoch": 1469} {"train_loss": -12.274504661560059, "global_step": 246821, "epoch": 1469} {"train_loss": -11.952252388000488, "global_step": 246822, "epoch": 1469} {"train_loss": -12.266660690307617, "global_step": 246823, "epoch": 1469} {"train_loss": -12.145355224609375, "global_step": 246824, "epoch": 1469} {"train_loss": -11.961334228515625, "global_step": 246825, "epoch": 1469} {"train_loss": -12.117044448852539, "global_step": 246826, "epoch": 1469} {"train_loss": -12.039880752563477, "global_step": 246827, "epoch": 1469} {"train_loss": -11.893436431884766, "global_step": 246828, "epoch": 1469} {"train_loss": -11.003240585327148, "global_step": 246829, "epoch": 1469} {"train_loss": -12.026222229003906, "global_step": 246830, "epoch": 1469} {"train_loss": -11.949764251708984, "global_step": 246831, "epoch": 1469} {"train_loss": -11.16585922241211, "global_step": 246832, "epoch": 1469} {"train_loss": -10.825532913208008, "global_step": 246833, "epoch": 1469} {"train_loss": -11.784590721130371, "global_step": 246834, "epoch": 1469} {"train_loss": -11.14409065246582, "global_step": 246835, "epoch": 1469} {"train_loss": -9.827560424804688, "global_step": 246836, "epoch": 1469} {"train_loss": -10.728394508361816, "global_step": 246837, "epoch": 1469} {"train_loss": -11.651163101196289, "global_step": 246838, "epoch": 1469} {"train_loss": -11.231008529663086, "global_step": 246839, "epoch": 1469} {"train_loss": -10.864142417907715, "global_step": 246840, "epoch": 1469} {"train_loss": -10.234546661376953, "global_step": 246841, "epoch": 1469} {"train_loss": -9.324432373046875, "global_step": 246842, "epoch": 1469} {"train_loss": -8.513555526733398, "global_step": 246843, "epoch": 1469} {"train_loss": -10.748897552490234, "global_step": 246844, "epoch": 1469} {"train_loss": -8.974832534790039, "global_step": 246845, "epoch": 1469} {"train_loss": -10.720026016235352, "global_step": 246846, "epoch": 1469} {"train_loss": -10.047375679016113, "global_step": 246847, "epoch": 1469} {"train_loss": -9.619661331176758, "global_step": 246848, "epoch": 1469} {"train_loss": -10.38104248046875, "global_step": 246849, "epoch": 1469} {"train_loss": -10.327471733093262, "global_step": 246850, "epoch": 1469} {"train_loss": -11.058263778686523, "global_step": 246851, "epoch": 1469} {"train_loss": -10.16119384765625, "global_step": 246852, "epoch": 1469} {"train_loss": -10.589836120605469, "global_step": 246853, "epoch": 1469} {"train_loss": -10.006787300109863, "global_step": 246854, "epoch": 1469} {"train_loss": -9.329541206359863, "global_step": 246855, "epoch": 1469} {"train_loss": -11.340103149414062, "global_step": 246856, "epoch": 1469} {"train_loss": -10.124154090881348, "global_step": 246857, "epoch": 1469} {"train_loss": -10.1303129196167, "global_step": 246858, "epoch": 1469} {"train_loss": -10.445552825927734, "global_step": 246859, "epoch": 1469} {"train_loss": -9.8594331741333, "global_step": 246860, "epoch": 1469} {"train_loss": -11.020536422729492, "global_step": 246861, "epoch": 1469} {"train_loss": -10.744844436645508, "global_step": 246862, "epoch": 1469} {"train_loss": -10.636978149414062, "global_step": 246863, "epoch": 1469} {"train_loss": -11.171284675598145, "global_step": 246864, "epoch": 1469} {"train_loss": -11.115735054016113, "global_step": 246865, "epoch": 1469} {"train_loss": -10.917621612548828, "global_step": 246866, "epoch": 1469} {"train_loss": -11.251285552978516, "global_step": 246867, "epoch": 1469} {"train_loss": -10.924501419067383, "global_step": 246868, "epoch": 1469} {"train_loss": -11.357060432434082, "global_step": 246869, "epoch": 1469} {"train_loss": -11.372541427612305, "global_step": 246870, "epoch": 1469} {"train_loss": -10.743021011352539, "global_step": 246871, "epoch": 1469} {"train_loss": -11.592863082885742, "global_step": 246872, "epoch": 1469} {"train_loss": -11.280698776245117, "global_step": 246873, "epoch": 1469} {"train_loss": -11.036720275878906, "global_step": 246874, "epoch": 1469} {"train_loss": -11.118986129760742, "global_step": 246875, "epoch": 1469} {"train_loss": -11.027328491210938, "global_step": 246876, "epoch": 1469} {"train_loss": -11.25732421875, "global_step": 246877, "epoch": 1469} {"train_loss": -11.219647407531738, "global_step": 246878, "epoch": 1469} {"train_loss": -11.36861515045166, "global_step": 246879, "epoch": 1469} {"train_loss": -11.400423049926758, "global_step": 246880, "epoch": 1469} {"train_loss": -11.61772346496582, "global_step": 246881, "epoch": 1469} {"train_loss": -11.471823692321777, "global_step": 246882, "epoch": 1469} {"train_loss": -11.488752365112305, "global_step": 246883, "epoch": 1469} {"train_loss": -11.29315185546875, "global_step": 246884, "epoch": 1469} {"train_loss": -11.637656211853027, "global_step": 246885, "epoch": 1469} {"train_loss": -11.636356353759766, "global_step": 246886, "epoch": 1469} {"train_loss": -11.502029418945312, "global_step": 246887, "epoch": 1469} {"train_loss": -11.604620933532715, "global_step": 246888, "epoch": 1469} {"train_loss": -11.36709213256836, "global_step": 246889, "epoch": 1469} {"train_loss": -11.682134628295898, "global_step": 246890, "epoch": 1469} {"train_loss": -11.454715728759766, "global_step": 246891, "epoch": 1469} {"train_loss": -11.643816947937012, "global_step": 246892, "epoch": 1469} {"train_loss": -11.571439743041992, "global_step": 246893, "epoch": 1469} {"train_loss": -11.559547424316406, "global_step": 246894, "epoch": 1469} {"train_loss": -11.817078590393066, "global_step": 246895, "epoch": 1469} {"train_loss": -11.610414505004883, "global_step": 246896, "epoch": 1469} {"train_loss": -11.87066650390625, "global_step": 246897, "epoch": 1469} {"train_loss": -11.751106262207031, "global_step": 246898, "epoch": 1469} {"train_loss": -12.060685157775879, "global_step": 246899, "epoch": 1469} {"train_loss": -11.508545875549316, "global_step": 246900, "epoch": 1469} {"train_loss": -11.877815246582031, "global_step": 246901, "epoch": 1469} {"train_loss": -11.783912658691406, "global_step": 246902, "epoch": 1469} {"train_loss": -11.908467292785645, "global_step": 246903, "epoch": 1469} {"train_loss": -11.724687576293945, "global_step": 246904, "epoch": 1469} {"train_loss": -11.954914093017578, "global_step": 246905, "epoch": 1469} {"train_loss": -11.503511428833008, "global_step": 246906, "epoch": 1469} {"train_loss": -11.635622024536133, "global_step": 246907, "epoch": 1469} {"train_loss": -11.887202262878418, "global_step": 246908, "epoch": 1469} {"train_loss": -11.720354080200195, "global_step": 246909, "epoch": 1469} {"train_loss": -11.958274841308594, "global_step": 246910, "epoch": 1469} {"train_loss": -11.982099533081055, "global_step": 246911, "epoch": 1469} {"train_loss": -11.888522148132324, "global_step": 246912, "epoch": 1469} {"train_loss": -11.944243431091309, "global_step": 246913, "epoch": 1469} {"train_loss": -11.875761032104492, "global_step": 246914, "epoch": 1469} {"train_loss": -12.032891273498535, "global_step": 246915, "epoch": 1469} {"train_loss": -11.997858047485352, "global_step": 246916, "epoch": 1469} {"train_loss": -12.024992942810059, "global_step": 246917, "epoch": 1469} {"train_loss": -11.748066902160645, "global_step": 246918, "epoch": 1469} {"train_loss": -11.905136108398438, "global_step": 246919, "epoch": 1469} {"train_loss": -12.014327049255371, "global_step": 246920, "epoch": 1469} {"train_loss": -11.940853118896484, "global_step": 246921, "epoch": 1469} {"train_loss": -11.882072448730469, "global_step": 246922, "epoch": 1469} {"train_loss": -11.994182586669922, "global_step": 246923, "epoch": 1469} {"train_loss": -11.937914848327637, "global_step": 246924, "epoch": 1469} {"train_loss": -12.07486629486084, "global_step": 246925, "epoch": 1469} {"train_loss": -12.039353370666504, "global_step": 246926, "epoch": 1469} {"train_loss": -12.149260520935059, "global_step": 246927, "epoch": 1469} {"train_loss": -12.067084312438965, "global_step": 246928, "epoch": 1469} {"train_loss": -12.166524887084961, "global_step": 246929, "epoch": 1469} {"train_loss": -12.214563369750977, "global_step": 246930, "epoch": 1469} {"train_loss": -11.967016220092773, "global_step": 246931, "epoch": 1469} {"train_loss": -12.136821746826172, "global_step": 246932, "epoch": 1469} {"train_loss": -11.934030532836914, "global_step": 246933, "epoch": 1469} {"train_loss": -12.137433052062988, "global_step": 246934, "epoch": 1469} {"train_loss": -12.041646957397461, "global_step": 246935, "epoch": 1469} {"train_loss": -12.290975570678711, "global_step": 246936, "epoch": 1469} {"train_loss": -11.876810073852539, "global_step": 246937, "epoch": 1469} {"train_loss": -12.151070594787598, "global_step": 246938, "epoch": 1469} {"train_loss": -11.819046020507812, "global_step": 246939, "epoch": 1469} {"train_loss": -12.115182876586914, "global_step": 246940, "epoch": 1469} {"train_loss": -11.765615463256836, "global_step": 246941, "epoch": 1469} {"train_loss": -11.818696975708008, "global_step": 246942, "epoch": 1469} {"train_loss": -11.729764938354492, "global_step": 246943, "epoch": 1469} {"train_loss": -10.918375015258789, "global_step": 246944, "epoch": 1469} {"train_loss": -12.00212287902832, "global_step": 246945, "epoch": 1469} {"train_loss": -11.064640998840332, "global_step": 246946, "epoch": 1469} {"train_loss": -11.864356994628906, "global_step": 246947, "epoch": 1469} {"train_loss": -11.126239776611328, "global_step": 246948, "epoch": 1469} {"train_loss": -11.53758430480957, "global_step": 246949, "epoch": 1469} {"train_loss": -11.180124282836914, "global_step": 246950, "epoch": 1469} {"train_loss": -11.764301300048828, "global_step": 246951, "epoch": 1469} {"train_loss": -10.836779594421387, "global_step": 246952, "epoch": 1469} {"train_loss": -11.57513427734375, "global_step": 246953, "epoch": 1469} {"train_loss": -11.177785873413086, "global_step": 246954, "epoch": 1469} {"train_loss": -11.046428680419922, "global_step": 246955, "epoch": 1469} {"train_loss": -11.488113403320312, "global_step": 246956, "epoch": 1469} {"train_loss": -11.339578628540039, "global_step": 246957, "epoch": 1469} {"train_loss": -11.027334213256836, "global_step": 246958, "epoch": 1469} {"train_loss": -11.479203973497663, "global_step": 246959, "epoch": 1469, "val_loss": 267756.46875} {"train_loss": -10.857851028442383, "global_step": 246960, "epoch": 1470} {"train_loss": -11.803302764892578, "global_step": 246961, "epoch": 1470} {"train_loss": -11.300066947937012, "global_step": 246962, "epoch": 1470} {"train_loss": -10.36583137512207, "global_step": 246963, "epoch": 1470} {"train_loss": -10.770336151123047, "global_step": 246964, "epoch": 1470} {"train_loss": -11.172813415527344, "global_step": 246965, "epoch": 1470} {"train_loss": -11.389447212219238, "global_step": 246966, "epoch": 1470} {"train_loss": -10.270658493041992, "global_step": 246967, "epoch": 1470} {"train_loss": -11.387002944946289, "global_step": 246968, "epoch": 1470} {"train_loss": -10.664812088012695, "global_step": 246969, "epoch": 1470} {"train_loss": -11.079763412475586, "global_step": 246970, "epoch": 1470} {"train_loss": -11.297622680664062, "global_step": 246971, "epoch": 1470} {"train_loss": -10.457895278930664, "global_step": 246972, "epoch": 1470} {"train_loss": -11.85912036895752, "global_step": 246973, "epoch": 1470} {"train_loss": -10.506908416748047, "global_step": 246974, "epoch": 1470} {"train_loss": -11.582269668579102, "global_step": 246975, "epoch": 1470} {"train_loss": -10.766191482543945, "global_step": 246976, "epoch": 1470} {"train_loss": -11.416531562805176, "global_step": 246977, "epoch": 1470} {"train_loss": -11.31940746307373, "global_step": 246978, "epoch": 1470} {"train_loss": -11.386150360107422, "global_step": 246979, "epoch": 1470} {"train_loss": -11.116399765014648, "global_step": 246980, "epoch": 1470} {"train_loss": -11.735475540161133, "global_step": 246981, "epoch": 1470} {"train_loss": -10.785597801208496, "global_step": 246982, "epoch": 1470} {"train_loss": -11.428924560546875, "global_step": 246983, "epoch": 1470} {"train_loss": -11.709762573242188, "global_step": 246984, "epoch": 1470} {"train_loss": -10.947927474975586, "global_step": 246985, "epoch": 1470} {"train_loss": -11.909236907958984, "global_step": 246986, "epoch": 1470} {"train_loss": -11.14804744720459, "global_step": 246987, "epoch": 1470} {"train_loss": -11.262344360351562, "global_step": 246988, "epoch": 1470} {"train_loss": -11.57394027709961, "global_step": 246989, "epoch": 1470} {"train_loss": -10.985574722290039, "global_step": 246990, "epoch": 1470} {"train_loss": -11.874192237854004, "global_step": 246991, "epoch": 1470} {"train_loss": -11.324918746948242, "global_step": 246992, "epoch": 1470} {"train_loss": -11.810470581054688, "global_step": 246993, "epoch": 1470} {"train_loss": -11.4945707321167, "global_step": 246994, "epoch": 1470} {"train_loss": -11.496505737304688, "global_step": 246995, "epoch": 1470} {"train_loss": -11.849228858947754, "global_step": 246996, "epoch": 1470} {"train_loss": -10.73733901977539, "global_step": 246997, "epoch": 1470} {"train_loss": -11.170167922973633, "global_step": 246998, "epoch": 1470} {"train_loss": -11.351238250732422, "global_step": 246999, "epoch": 1470} {"train_loss": -11.225936889648438, "global_step": 247000, "epoch": 1470} {"train_loss": -11.774093627929688, "global_step": 247001, "epoch": 1470} {"train_loss": -11.178486824035645, "global_step": 247002, "epoch": 1470} {"train_loss": -11.476755142211914, "global_step": 247003, "epoch": 1470} {"train_loss": -11.597112655639648, "global_step": 247004, "epoch": 1470} {"train_loss": -10.968259811401367, "global_step": 247005, "epoch": 1470} {"train_loss": -11.777257919311523, "global_step": 247006, "epoch": 1470} {"train_loss": -10.945697784423828, "global_step": 247007, "epoch": 1470} {"train_loss": -11.949943542480469, "global_step": 247008, "epoch": 1470} {"train_loss": -11.320318222045898, "global_step": 247009, "epoch": 1470} {"train_loss": -11.776975631713867, "global_step": 247010, "epoch": 1470} {"train_loss": -11.660820960998535, "global_step": 247011, "epoch": 1470} {"train_loss": -11.824966430664062, "global_step": 247012, "epoch": 1470} {"train_loss": -12.003173828125, "global_step": 247013, "epoch": 1470} {"train_loss": -11.825593948364258, "global_step": 247014, "epoch": 1470} {"train_loss": -11.951533317565918, "global_step": 247015, "epoch": 1470} {"train_loss": -11.63939094543457, "global_step": 247016, "epoch": 1470} {"train_loss": -12.004289627075195, "global_step": 247017, "epoch": 1470} {"train_loss": -11.82203483581543, "global_step": 247018, "epoch": 1470} {"train_loss": -11.910198211669922, "global_step": 247019, "epoch": 1470} {"train_loss": -11.49008560180664, "global_step": 247020, "epoch": 1470} {"train_loss": -11.791030883789062, "global_step": 247021, "epoch": 1470} {"train_loss": -11.612459182739258, "global_step": 247022, "epoch": 1470} {"train_loss": -11.78937816619873, "global_step": 247023, "epoch": 1470} {"train_loss": -11.657608985900879, "global_step": 247024, "epoch": 1470} {"train_loss": -11.472814559936523, "global_step": 247025, "epoch": 1470} {"train_loss": -11.668917655944824, "global_step": 247026, "epoch": 1470} {"train_loss": -11.434919357299805, "global_step": 247027, "epoch": 1470} {"train_loss": -11.82351303100586, "global_step": 247028, "epoch": 1470} {"train_loss": -11.812555313110352, "global_step": 247029, "epoch": 1470} {"train_loss": -11.55903148651123, "global_step": 247030, "epoch": 1470} {"train_loss": -11.798233985900879, "global_step": 247031, "epoch": 1470} {"train_loss": -11.84976577758789, "global_step": 247032, "epoch": 1470} {"train_loss": -12.095298767089844, "global_step": 247033, "epoch": 1470} {"train_loss": -11.97128677368164, "global_step": 247034, "epoch": 1470} {"train_loss": -12.165884017944336, "global_step": 247035, "epoch": 1470} {"train_loss": -12.097784042358398, "global_step": 247036, "epoch": 1470} {"train_loss": -11.983219146728516, "global_step": 247037, "epoch": 1470} {"train_loss": -12.037887573242188, "global_step": 247038, "epoch": 1470} {"train_loss": -12.123556137084961, "global_step": 247039, "epoch": 1470} {"train_loss": -11.872110366821289, "global_step": 247040, "epoch": 1470} {"train_loss": -11.95811653137207, "global_step": 247041, "epoch": 1470} {"train_loss": -11.964275360107422, "global_step": 247042, "epoch": 1470} {"train_loss": -12.1498384475708, "global_step": 247043, "epoch": 1470} {"train_loss": -12.111005783081055, "global_step": 247044, "epoch": 1470} {"train_loss": -12.0391263961792, "global_step": 247045, "epoch": 1470} {"train_loss": -12.194435119628906, "global_step": 247046, "epoch": 1470} {"train_loss": -11.858142852783203, "global_step": 247047, "epoch": 1470} {"train_loss": -12.027704238891602, "global_step": 247048, "epoch": 1470} {"train_loss": -11.97434139251709, "global_step": 247049, "epoch": 1470} {"train_loss": -12.019791603088379, "global_step": 247050, "epoch": 1470} {"train_loss": -11.76179313659668, "global_step": 247051, "epoch": 1470} {"train_loss": -11.905420303344727, "global_step": 247052, "epoch": 1470} {"train_loss": -11.982511520385742, "global_step": 247053, "epoch": 1470} {"train_loss": -11.706015586853027, "global_step": 247054, "epoch": 1470} {"train_loss": -12.025382995605469, "global_step": 247055, "epoch": 1470} {"train_loss": -11.574413299560547, "global_step": 247056, "epoch": 1470} {"train_loss": -11.756027221679688, "global_step": 247057, "epoch": 1470} {"train_loss": -11.654759407043457, "global_step": 247058, "epoch": 1470} {"train_loss": -12.130284309387207, "global_step": 247059, "epoch": 1470} {"train_loss": -10.999564170837402, "global_step": 247060, "epoch": 1470} {"train_loss": -11.031855583190918, "global_step": 247061, "epoch": 1470} {"train_loss": -10.789491653442383, "global_step": 247062, "epoch": 1470} {"train_loss": -10.970399856567383, "global_step": 247063, "epoch": 1470} {"train_loss": -11.078787803649902, "global_step": 247064, "epoch": 1470} {"train_loss": -11.534236907958984, "global_step": 247065, "epoch": 1470} {"train_loss": -11.343118667602539, "global_step": 247066, "epoch": 1470} {"train_loss": -11.69244384765625, "global_step": 247067, "epoch": 1470} {"train_loss": -11.66103458404541, "global_step": 247068, "epoch": 1470} {"train_loss": -11.636573791503906, "global_step": 247069, "epoch": 1470} {"train_loss": -11.880975723266602, "global_step": 247070, "epoch": 1470} {"train_loss": -11.38493537902832, "global_step": 247071, "epoch": 1470} {"train_loss": -11.708105087280273, "global_step": 247072, "epoch": 1470} {"train_loss": -11.851325988769531, "global_step": 247073, "epoch": 1470} {"train_loss": -10.872913360595703, "global_step": 247074, "epoch": 1470} {"train_loss": -11.19186782836914, "global_step": 247075, "epoch": 1470} {"train_loss": -11.909549713134766, "global_step": 247076, "epoch": 1470} {"train_loss": -11.748039245605469, "global_step": 247077, "epoch": 1470} {"train_loss": -11.255072593688965, "global_step": 247078, "epoch": 1470} {"train_loss": -11.81621265411377, "global_step": 247079, "epoch": 1470} {"train_loss": -11.88779067993164, "global_step": 247080, "epoch": 1470} {"train_loss": -11.653543472290039, "global_step": 247081, "epoch": 1470} {"train_loss": -11.667961120605469, "global_step": 247082, "epoch": 1470} {"train_loss": -11.941473960876465, "global_step": 247083, "epoch": 1470} {"train_loss": -11.889747619628906, "global_step": 247084, "epoch": 1470} {"train_loss": -11.924474716186523, "global_step": 247085, "epoch": 1470} {"train_loss": -11.945258140563965, "global_step": 247086, "epoch": 1470} {"train_loss": -11.762462615966797, "global_step": 247087, "epoch": 1470} {"train_loss": -11.899105072021484, "global_step": 247088, "epoch": 1470} {"train_loss": -11.688541412353516, "global_step": 247089, "epoch": 1470} {"train_loss": -11.476293563842773, "global_step": 247090, "epoch": 1470} {"train_loss": -11.535051345825195, "global_step": 247091, "epoch": 1470} {"train_loss": -12.059089660644531, "global_step": 247092, "epoch": 1470} {"train_loss": -11.565418243408203, "global_step": 247093, "epoch": 1470} {"train_loss": -11.64426040649414, "global_step": 247094, "epoch": 1470} {"train_loss": -11.676698684692383, "global_step": 247095, "epoch": 1470} {"train_loss": -11.62756061553955, "global_step": 247096, "epoch": 1470} {"train_loss": -11.952749252319336, "global_step": 247097, "epoch": 1470} {"train_loss": -12.012434005737305, "global_step": 247098, "epoch": 1470} {"train_loss": -12.027154922485352, "global_step": 247099, "epoch": 1470} {"train_loss": -11.763641357421875, "global_step": 247100, "epoch": 1470} {"train_loss": -11.6446533203125, "global_step": 247101, "epoch": 1470} {"train_loss": -11.748398780822754, "global_step": 247102, "epoch": 1470} {"train_loss": -11.744804382324219, "global_step": 247103, "epoch": 1470} {"train_loss": -11.762261390686035, "global_step": 247104, "epoch": 1470} {"train_loss": -11.99348258972168, "global_step": 247105, "epoch": 1470} {"train_loss": -12.195903778076172, "global_step": 247106, "epoch": 1470} {"train_loss": -12.033355712890625, "global_step": 247107, "epoch": 1470} {"train_loss": -12.113529205322266, "global_step": 247108, "epoch": 1470} {"train_loss": -12.154802322387695, "global_step": 247109, "epoch": 1470} {"train_loss": -11.806034088134766, "global_step": 247110, "epoch": 1470} {"train_loss": -11.764823913574219, "global_step": 247111, "epoch": 1470} {"train_loss": -11.870816230773926, "global_step": 247112, "epoch": 1470} {"train_loss": -11.846799850463867, "global_step": 247113, "epoch": 1470} {"train_loss": -11.810646057128906, "global_step": 247114, "epoch": 1470} {"train_loss": -11.815570831298828, "global_step": 247115, "epoch": 1470} {"train_loss": -11.915066719055176, "global_step": 247116, "epoch": 1470} {"train_loss": -11.553503036499023, "global_step": 247117, "epoch": 1470} {"train_loss": -11.757020950317383, "global_step": 247118, "epoch": 1470} {"train_loss": -12.10915756225586, "global_step": 247119, "epoch": 1470} {"train_loss": -11.688321113586426, "global_step": 247120, "epoch": 1470} {"train_loss": -11.74089241027832, "global_step": 247121, "epoch": 1470} {"train_loss": -11.812675476074219, "global_step": 247122, "epoch": 1470} {"train_loss": -12.226736068725586, "global_step": 247123, "epoch": 1470} {"train_loss": -12.079108238220215, "global_step": 247124, "epoch": 1470} {"train_loss": -12.109519004821777, "global_step": 247125, "epoch": 1470} {"train_loss": -11.71245002746582, "global_step": 247126, "epoch": 1470} {"train_loss": -11.628872133436657, "global_step": 247127, "epoch": 1470, "val_loss": 268337.5625, "train_action_mse_error": 1.6065977811813354} {"train_loss": -11.975652694702148, "global_step": 247128, "epoch": 1471} {"train_loss": -12.027021408081055, "global_step": 247129, "epoch": 1471} {"train_loss": -11.994117736816406, "global_step": 247130, "epoch": 1471} {"train_loss": -12.03168773651123, "global_step": 247131, "epoch": 1471} {"train_loss": -11.983182907104492, "global_step": 247132, "epoch": 1471} {"train_loss": -11.745851516723633, "global_step": 247133, "epoch": 1471} {"train_loss": -11.572015762329102, "global_step": 247134, "epoch": 1471} {"train_loss": -10.953088760375977, "global_step": 247135, "epoch": 1471} {"train_loss": -10.812220573425293, "global_step": 247136, "epoch": 1471} {"train_loss": -9.994424819946289, "global_step": 247137, "epoch": 1471} {"train_loss": -10.323397636413574, "global_step": 247138, "epoch": 1471} {"train_loss": -9.300382614135742, "global_step": 247139, "epoch": 1471} {"train_loss": -9.060508728027344, "global_step": 247140, "epoch": 1471} {"train_loss": -11.352263450622559, "global_step": 247141, "epoch": 1471} {"train_loss": -9.890687942504883, "global_step": 247142, "epoch": 1471} {"train_loss": -10.811470031738281, "global_step": 247143, "epoch": 1471} {"train_loss": -10.5411376953125, "global_step": 247144, "epoch": 1471} {"train_loss": -10.592411041259766, "global_step": 247145, "epoch": 1471} {"train_loss": -10.307939529418945, "global_step": 247146, "epoch": 1471} {"train_loss": -10.256043434143066, "global_step": 247147, "epoch": 1471} {"train_loss": -9.68690299987793, "global_step": 247148, "epoch": 1471} {"train_loss": -9.992839813232422, "global_step": 247149, "epoch": 1471} {"train_loss": -10.043397903442383, "global_step": 247150, "epoch": 1471} {"train_loss": -8.108458518981934, "global_step": 247151, "epoch": 1471} {"train_loss": -10.744864463806152, "global_step": 247152, "epoch": 1471} {"train_loss": -9.846630096435547, "global_step": 247153, "epoch": 1471} {"train_loss": -9.950759887695312, "global_step": 247154, "epoch": 1471} {"train_loss": -10.99839973449707, "global_step": 247155, "epoch": 1471} {"train_loss": -10.199872970581055, "global_step": 247156, "epoch": 1471} {"train_loss": -10.622913360595703, "global_step": 247157, "epoch": 1471} {"train_loss": -11.07040023803711, "global_step": 247158, "epoch": 1471} {"train_loss": -10.779059410095215, "global_step": 247159, "epoch": 1471} {"train_loss": -11.134353637695312, "global_step": 247160, "epoch": 1471} {"train_loss": -11.294061660766602, "global_step": 247161, "epoch": 1471} {"train_loss": -11.21530818939209, "global_step": 247162, "epoch": 1471} {"train_loss": -10.996719360351562, "global_step": 247163, "epoch": 1471} {"train_loss": -11.053627014160156, "global_step": 247164, "epoch": 1471} {"train_loss": -10.76262092590332, "global_step": 247165, "epoch": 1471} {"train_loss": -11.31692123413086, "global_step": 247166, "epoch": 1471} {"train_loss": -11.140251159667969, "global_step": 247167, "epoch": 1471} {"train_loss": -10.759679794311523, "global_step": 247168, "epoch": 1471} {"train_loss": -11.530257225036621, "global_step": 247169, "epoch": 1471} {"train_loss": -11.09467887878418, "global_step": 247170, "epoch": 1471} {"train_loss": -11.24074935913086, "global_step": 247171, "epoch": 1471} {"train_loss": -11.55254077911377, "global_step": 247172, "epoch": 1471} {"train_loss": -10.914371490478516, "global_step": 247173, "epoch": 1471} {"train_loss": -11.547223091125488, "global_step": 247174, "epoch": 1471} {"train_loss": -11.299710273742676, "global_step": 247175, "epoch": 1471} {"train_loss": -10.787740707397461, "global_step": 247176, "epoch": 1471} {"train_loss": -11.582764625549316, "global_step": 247177, "epoch": 1471} {"train_loss": -11.215001106262207, "global_step": 247178, "epoch": 1471} {"train_loss": -11.442225456237793, "global_step": 247179, "epoch": 1471} {"train_loss": -11.367886543273926, "global_step": 247180, "epoch": 1471} {"train_loss": -10.872098922729492, "global_step": 247181, "epoch": 1471} {"train_loss": -11.415608406066895, "global_step": 247182, "epoch": 1471} {"train_loss": -11.051298141479492, "global_step": 247183, "epoch": 1471} {"train_loss": -11.341885566711426, "global_step": 247184, "epoch": 1471} {"train_loss": -11.467852592468262, "global_step": 247185, "epoch": 1471} {"train_loss": -11.185497283935547, "global_step": 247186, "epoch": 1471} {"train_loss": -11.82098388671875, "global_step": 247187, "epoch": 1471} {"train_loss": -11.145957946777344, "global_step": 247188, "epoch": 1471} {"train_loss": -11.453067779541016, "global_step": 247189, "epoch": 1471} {"train_loss": -11.443685531616211, "global_step": 247190, "epoch": 1471} {"train_loss": -11.40316390991211, "global_step": 247191, "epoch": 1471} {"train_loss": -11.567584991455078, "global_step": 247192, "epoch": 1471} {"train_loss": -11.433286666870117, "global_step": 247193, "epoch": 1471} {"train_loss": -11.393799781799316, "global_step": 247194, "epoch": 1471} {"train_loss": -11.60183334350586, "global_step": 247195, "epoch": 1471} {"train_loss": -11.427678108215332, "global_step": 247196, "epoch": 1471} {"train_loss": -11.700645446777344, "global_step": 247197, "epoch": 1471} {"train_loss": -11.825736999511719, "global_step": 247198, "epoch": 1471} {"train_loss": -11.598089218139648, "global_step": 247199, "epoch": 1471} {"train_loss": -11.497758865356445, "global_step": 247200, "epoch": 1471} {"train_loss": -11.700276374816895, "global_step": 247201, "epoch": 1471} {"train_loss": -11.572680473327637, "global_step": 247202, "epoch": 1471} {"train_loss": -11.72639274597168, "global_step": 247203, "epoch": 1471} {"train_loss": -11.647141456604004, "global_step": 247204, "epoch": 1471} {"train_loss": -11.822074890136719, "global_step": 247205, "epoch": 1471} {"train_loss": -11.784557342529297, "global_step": 247206, "epoch": 1471} {"train_loss": -11.814958572387695, "global_step": 247207, "epoch": 1471} {"train_loss": -11.988640785217285, "global_step": 247208, "epoch": 1471} {"train_loss": -11.825887680053711, "global_step": 247209, "epoch": 1471} {"train_loss": -11.889127731323242, "global_step": 247210, "epoch": 1471} {"train_loss": -11.917745590209961, "global_step": 247211, "epoch": 1471} {"train_loss": -11.871641159057617, "global_step": 247212, "epoch": 1471} {"train_loss": -12.072505950927734, "global_step": 247213, "epoch": 1471} {"train_loss": -11.852375030517578, "global_step": 247214, "epoch": 1471} {"train_loss": -11.988441467285156, "global_step": 247215, "epoch": 1471} {"train_loss": -11.843531608581543, "global_step": 247216, "epoch": 1471} {"train_loss": -12.046858787536621, "global_step": 247217, "epoch": 1471} {"train_loss": -12.117305755615234, "global_step": 247218, "epoch": 1471} {"train_loss": -11.973482131958008, "global_step": 247219, "epoch": 1471} {"train_loss": -11.934394836425781, "global_step": 247220, "epoch": 1471} {"train_loss": -12.141691207885742, "global_step": 247221, "epoch": 1471} {"train_loss": -12.055376052856445, "global_step": 247222, "epoch": 1471} {"train_loss": -12.033886909484863, "global_step": 247223, "epoch": 1471} {"train_loss": -12.029970169067383, "global_step": 247224, "epoch": 1471} {"train_loss": -12.216902732849121, "global_step": 247225, "epoch": 1471} {"train_loss": -12.203224182128906, "global_step": 247226, "epoch": 1471} {"train_loss": -12.103050231933594, "global_step": 247227, "epoch": 1471} {"train_loss": -12.203845977783203, "global_step": 247228, "epoch": 1471} {"train_loss": -12.251362800598145, "global_step": 247229, "epoch": 1471} {"train_loss": -12.10084342956543, "global_step": 247230, "epoch": 1471} {"train_loss": -12.104338645935059, "global_step": 247231, "epoch": 1471} {"train_loss": -12.006959915161133, "global_step": 247232, "epoch": 1471} {"train_loss": -12.03262710571289, "global_step": 247233, "epoch": 1471} {"train_loss": -12.343896865844727, "global_step": 247234, "epoch": 1471} {"train_loss": -12.268898010253906, "global_step": 247235, "epoch": 1471} {"train_loss": -12.234941482543945, "global_step": 247236, "epoch": 1471} {"train_loss": -12.206462860107422, "global_step": 247237, "epoch": 1471} {"train_loss": -12.229190826416016, "global_step": 247238, "epoch": 1471} {"train_loss": -12.154373168945312, "global_step": 247239, "epoch": 1471} {"train_loss": -12.355428695678711, "global_step": 247240, "epoch": 1471} {"train_loss": -12.109980583190918, "global_step": 247241, "epoch": 1471} {"train_loss": -12.095306396484375, "global_step": 247242, "epoch": 1471} {"train_loss": -12.064361572265625, "global_step": 247243, "epoch": 1471} {"train_loss": -12.026159286499023, "global_step": 247244, "epoch": 1471} {"train_loss": -12.189088821411133, "global_step": 247245, "epoch": 1471} {"train_loss": -12.061857223510742, "global_step": 247246, "epoch": 1471} {"train_loss": -12.069761276245117, "global_step": 247247, "epoch": 1471} {"train_loss": -12.356966972351074, "global_step": 247248, "epoch": 1471} {"train_loss": -11.745647430419922, "global_step": 247249, "epoch": 1471} {"train_loss": -11.470403671264648, "global_step": 247250, "epoch": 1471} {"train_loss": -11.633722305297852, "global_step": 247251, "epoch": 1471} {"train_loss": -11.613222122192383, "global_step": 247252, "epoch": 1471} {"train_loss": -11.901512145996094, "global_step": 247253, "epoch": 1471} {"train_loss": -12.0557222366333, "global_step": 247254, "epoch": 1471} {"train_loss": -11.271490097045898, "global_step": 247255, "epoch": 1471} {"train_loss": -12.090755462646484, "global_step": 247256, "epoch": 1471} {"train_loss": -11.620893478393555, "global_step": 247257, "epoch": 1471} {"train_loss": -11.910394668579102, "global_step": 247258, "epoch": 1471} {"train_loss": -11.373502731323242, "global_step": 247259, "epoch": 1471} {"train_loss": -11.728853225708008, "global_step": 247260, "epoch": 1471} {"train_loss": -11.14627456665039, "global_step": 247261, "epoch": 1471} {"train_loss": -11.032613754272461, "global_step": 247262, "epoch": 1471} {"train_loss": -11.329177856445312, "global_step": 247263, "epoch": 1471} {"train_loss": -11.190674781799316, "global_step": 247264, "epoch": 1471} {"train_loss": -10.554491996765137, "global_step": 247265, "epoch": 1471} {"train_loss": -10.58792781829834, "global_step": 247266, "epoch": 1471} {"train_loss": -11.645733833312988, "global_step": 247267, "epoch": 1471} {"train_loss": -10.607318878173828, "global_step": 247268, "epoch": 1471} {"train_loss": -10.477002143859863, "global_step": 247269, "epoch": 1471} {"train_loss": -9.969710350036621, "global_step": 247270, "epoch": 1471} {"train_loss": -11.268099784851074, "global_step": 247271, "epoch": 1471} {"train_loss": -11.257574081420898, "global_step": 247272, "epoch": 1471} {"train_loss": -10.499366760253906, "global_step": 247273, "epoch": 1471} {"train_loss": -9.729384422302246, "global_step": 247274, "epoch": 1471} {"train_loss": -11.636581420898438, "global_step": 247275, "epoch": 1471} {"train_loss": -10.665970802307129, "global_step": 247276, "epoch": 1471} {"train_loss": -9.95518684387207, "global_step": 247277, "epoch": 1471} {"train_loss": -11.170015335083008, "global_step": 247278, "epoch": 1471} {"train_loss": -10.979150772094727, "global_step": 247279, "epoch": 1471} {"train_loss": -11.753921508789062, "global_step": 247280, "epoch": 1471} {"train_loss": -10.534440040588379, "global_step": 247281, "epoch": 1471} {"train_loss": -11.858722686767578, "global_step": 247282, "epoch": 1471} {"train_loss": -10.81953239440918, "global_step": 247283, "epoch": 1471} {"train_loss": -11.49797248840332, "global_step": 247284, "epoch": 1471} {"train_loss": -11.498303413391113, "global_step": 247285, "epoch": 1471} {"train_loss": -11.444724082946777, "global_step": 247286, "epoch": 1471} {"train_loss": -10.93986701965332, "global_step": 247287, "epoch": 1471} {"train_loss": -10.82724666595459, "global_step": 247288, "epoch": 1471} {"train_loss": -11.456547737121582, "global_step": 247289, "epoch": 1471} {"train_loss": -10.928277015686035, "global_step": 247290, "epoch": 1471} {"train_loss": -11.038394927978516, "global_step": 247291, "epoch": 1471} {"train_loss": -11.444436073303223, "global_step": 247292, "epoch": 1471} {"train_loss": -11.044963836669922, "global_step": 247293, "epoch": 1471} {"train_loss": -11.433115005493164, "global_step": 247294, "epoch": 1471} {"train_loss": -11.352200570560637, "global_step": 247295, "epoch": 1471, "val_loss": 267629.53125} {"train_loss": -11.726278305053711, "global_step": 247296, "epoch": 1472} {"train_loss": -11.700613021850586, "global_step": 247297, "epoch": 1472} {"train_loss": -11.429991722106934, "global_step": 247298, "epoch": 1472} {"train_loss": -11.756692886352539, "global_step": 247299, "epoch": 1472} {"train_loss": -11.646198272705078, "global_step": 247300, "epoch": 1472} {"train_loss": -11.120349884033203, "global_step": 247301, "epoch": 1472} {"train_loss": -11.686873435974121, "global_step": 247302, "epoch": 1472} {"train_loss": -11.092913627624512, "global_step": 247303, "epoch": 1472} {"train_loss": -11.794525146484375, "global_step": 247304, "epoch": 1472} {"train_loss": -11.222979545593262, "global_step": 247305, "epoch": 1472} {"train_loss": -11.599845886230469, "global_step": 247306, "epoch": 1472} {"train_loss": -11.585041999816895, "global_step": 247307, "epoch": 1472} {"train_loss": -11.661266326904297, "global_step": 247308, "epoch": 1472} {"train_loss": -11.705266952514648, "global_step": 247309, "epoch": 1472} {"train_loss": -11.801928520202637, "global_step": 247310, "epoch": 1472} {"train_loss": -11.561029434204102, "global_step": 247311, "epoch": 1472} {"train_loss": -11.579565048217773, "global_step": 247312, "epoch": 1472} {"train_loss": -11.553628921508789, "global_step": 247313, "epoch": 1472} {"train_loss": -11.735491752624512, "global_step": 247314, "epoch": 1472} {"train_loss": -11.685113906860352, "global_step": 247315, "epoch": 1472} {"train_loss": -11.790853500366211, "global_step": 247316, "epoch": 1472} {"train_loss": -11.587371826171875, "global_step": 247317, "epoch": 1472} {"train_loss": -11.705423355102539, "global_step": 247318, "epoch": 1472} {"train_loss": -11.708176612854004, "global_step": 247319, "epoch": 1472} {"train_loss": -11.961552619934082, "global_step": 247320, "epoch": 1472} {"train_loss": -11.756193161010742, "global_step": 247321, "epoch": 1472} {"train_loss": -11.900747299194336, "global_step": 247322, "epoch": 1472} {"train_loss": -11.54342269897461, "global_step": 247323, "epoch": 1472} {"train_loss": -11.788656234741211, "global_step": 247324, "epoch": 1472} {"train_loss": -11.53429126739502, "global_step": 247325, "epoch": 1472} {"train_loss": -11.912734985351562, "global_step": 247326, "epoch": 1472} {"train_loss": -11.634682655334473, "global_step": 247327, "epoch": 1472} {"train_loss": -11.768587112426758, "global_step": 247328, "epoch": 1472} {"train_loss": -11.414301872253418, "global_step": 247329, "epoch": 1472} {"train_loss": -11.89017105102539, "global_step": 247330, "epoch": 1472} {"train_loss": -11.707391738891602, "global_step": 247331, "epoch": 1472} {"train_loss": -11.822515487670898, "global_step": 247332, "epoch": 1472} {"train_loss": -11.772732734680176, "global_step": 247333, "epoch": 1472} {"train_loss": -12.023338317871094, "global_step": 247334, "epoch": 1472} {"train_loss": -12.038822174072266, "global_step": 247335, "epoch": 1472} {"train_loss": -12.05527400970459, "global_step": 247336, "epoch": 1472} {"train_loss": -11.940878868103027, "global_step": 247337, "epoch": 1472} {"train_loss": -11.9447660446167, "global_step": 247338, "epoch": 1472} {"train_loss": -11.911197662353516, "global_step": 247339, "epoch": 1472} {"train_loss": -11.887673377990723, "global_step": 247340, "epoch": 1472} {"train_loss": -12.019855499267578, "global_step": 247341, "epoch": 1472} {"train_loss": -12.007908821105957, "global_step": 247342, "epoch": 1472} {"train_loss": -12.224544525146484, "global_step": 247343, "epoch": 1472} {"train_loss": -12.127212524414062, "global_step": 247344, "epoch": 1472} {"train_loss": -11.97608757019043, "global_step": 247345, "epoch": 1472} {"train_loss": -11.990435600280762, "global_step": 247346, "epoch": 1472} {"train_loss": -12.128095626831055, "global_step": 247347, "epoch": 1472} {"train_loss": -12.16946029663086, "global_step": 247348, "epoch": 1472} {"train_loss": -12.132895469665527, "global_step": 247349, "epoch": 1472} {"train_loss": -12.20846176147461, "global_step": 247350, "epoch": 1472} {"train_loss": -11.901575088500977, "global_step": 247351, "epoch": 1472} {"train_loss": -12.250961303710938, "global_step": 247352, "epoch": 1472} {"train_loss": -12.181564331054688, "global_step": 247353, "epoch": 1472} {"train_loss": -12.081586837768555, "global_step": 247354, "epoch": 1472} {"train_loss": -12.18481731414795, "global_step": 247355, "epoch": 1472} {"train_loss": -12.210960388183594, "global_step": 247356, "epoch": 1472} {"train_loss": -12.045669555664062, "global_step": 247357, "epoch": 1472} {"train_loss": -12.215776443481445, "global_step": 247358, "epoch": 1472} {"train_loss": -11.988231658935547, "global_step": 247359, "epoch": 1472} {"train_loss": -12.22961711883545, "global_step": 247360, "epoch": 1472} {"train_loss": -12.122579574584961, "global_step": 247361, "epoch": 1472} {"train_loss": -12.10883903503418, "global_step": 247362, "epoch": 1472} {"train_loss": -12.0070219039917, "global_step": 247363, "epoch": 1472} {"train_loss": -12.069493293762207, "global_step": 247364, "epoch": 1472} {"train_loss": -12.040628433227539, "global_step": 247365, "epoch": 1472} {"train_loss": -12.002094268798828, "global_step": 247366, "epoch": 1472} {"train_loss": -12.027362823486328, "global_step": 247367, "epoch": 1472} {"train_loss": -12.150643348693848, "global_step": 247368, "epoch": 1472} {"train_loss": -12.165794372558594, "global_step": 247369, "epoch": 1472} {"train_loss": -12.020435333251953, "global_step": 247370, "epoch": 1472} {"train_loss": -12.104418754577637, "global_step": 247371, "epoch": 1472} {"train_loss": -12.22903060913086, "global_step": 247372, "epoch": 1472} {"train_loss": -12.044434547424316, "global_step": 247373, "epoch": 1472} {"train_loss": -12.005781173706055, "global_step": 247374, "epoch": 1472} {"train_loss": -11.669544219970703, "global_step": 247375, "epoch": 1472} {"train_loss": -11.199501037597656, "global_step": 247376, "epoch": 1472} {"train_loss": -11.08781623840332, "global_step": 247377, "epoch": 1472} {"train_loss": -12.074139595031738, "global_step": 247378, "epoch": 1472} {"train_loss": -12.077032089233398, "global_step": 247379, "epoch": 1472} {"train_loss": -11.582967758178711, "global_step": 247380, "epoch": 1472} {"train_loss": -11.739057540893555, "global_step": 247381, "epoch": 1472} {"train_loss": -12.096351623535156, "global_step": 247382, "epoch": 1472} {"train_loss": -11.498672485351562, "global_step": 247383, "epoch": 1472} {"train_loss": -11.278931617736816, "global_step": 247384, "epoch": 1472} {"train_loss": -10.668744087219238, "global_step": 247385, "epoch": 1472} {"train_loss": -11.628746032714844, "global_step": 247386, "epoch": 1472} {"train_loss": -11.488800048828125, "global_step": 247387, "epoch": 1472} {"train_loss": -11.355430603027344, "global_step": 247388, "epoch": 1472} {"train_loss": -11.175904273986816, "global_step": 247389, "epoch": 1472} {"train_loss": -11.194870948791504, "global_step": 247390, "epoch": 1472} {"train_loss": -10.33829116821289, "global_step": 247391, "epoch": 1472} {"train_loss": -11.201385498046875, "global_step": 247392, "epoch": 1472} {"train_loss": -10.131361961364746, "global_step": 247393, "epoch": 1472} {"train_loss": -11.249909400939941, "global_step": 247394, "epoch": 1472} {"train_loss": -10.383279800415039, "global_step": 247395, "epoch": 1472} {"train_loss": -10.851301193237305, "global_step": 247396, "epoch": 1472} {"train_loss": -9.319489479064941, "global_step": 247397, "epoch": 1472} {"train_loss": -11.214499473571777, "global_step": 247398, "epoch": 1472} {"train_loss": -10.149853706359863, "global_step": 247399, "epoch": 1472} {"train_loss": -8.438672065734863, "global_step": 247400, "epoch": 1472} {"train_loss": -8.872945785522461, "global_step": 247401, "epoch": 1472} {"train_loss": -9.795537948608398, "global_step": 247402, "epoch": 1472} {"train_loss": -7.197272300720215, "global_step": 247403, "epoch": 1472} {"train_loss": -9.217638969421387, "global_step": 247404, "epoch": 1472} {"train_loss": -7.092165946960449, "global_step": 247405, "epoch": 1472} {"train_loss": -8.713854789733887, "global_step": 247406, "epoch": 1472} {"train_loss": -7.84713077545166, "global_step": 247407, "epoch": 1472} {"train_loss": -9.774285316467285, "global_step": 247408, "epoch": 1472} {"train_loss": -9.307861328125, "global_step": 247409, "epoch": 1472} {"train_loss": -8.013692855834961, "global_step": 247410, "epoch": 1472} {"train_loss": -10.269793510437012, "global_step": 247411, "epoch": 1472} {"train_loss": -10.183740615844727, "global_step": 247412, "epoch": 1472} {"train_loss": -9.019865989685059, "global_step": 247413, "epoch": 1472} {"train_loss": -10.875629425048828, "global_step": 247414, "epoch": 1472} {"train_loss": -10.42363452911377, "global_step": 247415, "epoch": 1472} {"train_loss": -9.946878433227539, "global_step": 247416, "epoch": 1472} {"train_loss": -10.578715324401855, "global_step": 247417, "epoch": 1472} {"train_loss": -10.538894653320312, "global_step": 247418, "epoch": 1472} {"train_loss": -10.484066009521484, "global_step": 247419, "epoch": 1472} {"train_loss": -10.973268508911133, "global_step": 247420, "epoch": 1472} {"train_loss": -10.88023567199707, "global_step": 247421, "epoch": 1472} {"train_loss": -10.446196556091309, "global_step": 247422, "epoch": 1472} {"train_loss": -10.914231300354004, "global_step": 247423, "epoch": 1472} {"train_loss": -11.231025695800781, "global_step": 247424, "epoch": 1472} {"train_loss": -10.669300079345703, "global_step": 247425, "epoch": 1472} {"train_loss": -10.931353569030762, "global_step": 247426, "epoch": 1472} {"train_loss": -11.333642959594727, "global_step": 247427, "epoch": 1472} {"train_loss": -10.475334167480469, "global_step": 247428, "epoch": 1472} {"train_loss": -10.749073028564453, "global_step": 247429, "epoch": 1472} {"train_loss": -11.190967559814453, "global_step": 247430, "epoch": 1472} {"train_loss": -10.902627944946289, "global_step": 247431, "epoch": 1472} {"train_loss": -10.83586311340332, "global_step": 247432, "epoch": 1472} {"train_loss": -10.50323486328125, "global_step": 247433, "epoch": 1472} {"train_loss": -11.310441970825195, "global_step": 247434, "epoch": 1472} {"train_loss": -10.574993133544922, "global_step": 247435, "epoch": 1472} {"train_loss": -10.791522979736328, "global_step": 247436, "epoch": 1472} {"train_loss": -10.881385803222656, "global_step": 247437, "epoch": 1472} {"train_loss": -10.810530662536621, "global_step": 247438, "epoch": 1472} {"train_loss": -10.96861743927002, "global_step": 247439, "epoch": 1472} {"train_loss": -10.80908489227295, "global_step": 247440, "epoch": 1472} {"train_loss": -11.204933166503906, "global_step": 247441, "epoch": 1472} {"train_loss": -10.829477310180664, "global_step": 247442, "epoch": 1472} {"train_loss": -11.047143936157227, "global_step": 247443, "epoch": 1472} {"train_loss": -11.17995834350586, "global_step": 247444, "epoch": 1472} {"train_loss": -11.200873374938965, "global_step": 247445, "epoch": 1472} {"train_loss": -11.034966468811035, "global_step": 247446, "epoch": 1472} {"train_loss": -11.34290599822998, "global_step": 247447, "epoch": 1472} {"train_loss": -11.229053497314453, "global_step": 247448, "epoch": 1472} {"train_loss": -10.922922134399414, "global_step": 247449, "epoch": 1472} {"train_loss": -11.223748207092285, "global_step": 247450, "epoch": 1472} {"train_loss": -11.298309326171875, "global_step": 247451, "epoch": 1472} {"train_loss": -11.246525764465332, "global_step": 247452, "epoch": 1472} {"train_loss": -11.364530563354492, "global_step": 247453, "epoch": 1472} {"train_loss": -11.242196083068848, "global_step": 247454, "epoch": 1472} {"train_loss": -11.445518493652344, "global_step": 247455, "epoch": 1472} {"train_loss": -11.212774276733398, "global_step": 247456, "epoch": 1472} {"train_loss": -11.226272583007812, "global_step": 247457, "epoch": 1472} {"train_loss": -11.603464126586914, "global_step": 247458, "epoch": 1472} {"train_loss": -11.299991607666016, "global_step": 247459, "epoch": 1472} {"train_loss": -11.568038940429688, "global_step": 247460, "epoch": 1472} {"train_loss": -11.430879592895508, "global_step": 247461, "epoch": 1472} {"train_loss": -11.541793823242188, "global_step": 247462, "epoch": 1472} {"train_loss": -11.253571260543097, "global_step": 247463, "epoch": 1472, "val_loss": 263829.375} {"train_loss": -11.529304504394531, "global_step": 247464, "epoch": 1473} {"train_loss": -11.70055103302002, "global_step": 247465, "epoch": 1473} {"train_loss": -11.683757781982422, "global_step": 247466, "epoch": 1473} {"train_loss": -11.649142265319824, "global_step": 247467, "epoch": 1473} {"train_loss": -11.685568809509277, "global_step": 247468, "epoch": 1473} {"train_loss": -11.60878849029541, "global_step": 247469, "epoch": 1473} {"train_loss": -11.767990112304688, "global_step": 247470, "epoch": 1473} {"train_loss": -11.751524925231934, "global_step": 247471, "epoch": 1473} {"train_loss": -11.541549682617188, "global_step": 247472, "epoch": 1473} {"train_loss": -11.742084503173828, "global_step": 247473, "epoch": 1473} {"train_loss": -11.853742599487305, "global_step": 247474, "epoch": 1473} {"train_loss": -11.591811180114746, "global_step": 247475, "epoch": 1473} {"train_loss": -11.886985778808594, "global_step": 247476, "epoch": 1473} {"train_loss": -11.917607307434082, "global_step": 247477, "epoch": 1473} {"train_loss": -11.76101016998291, "global_step": 247478, "epoch": 1473} {"train_loss": -11.84249496459961, "global_step": 247479, "epoch": 1473} {"train_loss": -11.595720291137695, "global_step": 247480, "epoch": 1473} {"train_loss": -11.665939331054688, "global_step": 247481, "epoch": 1473} {"train_loss": -11.988518714904785, "global_step": 247482, "epoch": 1473} {"train_loss": -11.753530502319336, "global_step": 247483, "epoch": 1473} {"train_loss": -12.060294151306152, "global_step": 247484, "epoch": 1473} {"train_loss": -12.049999237060547, "global_step": 247485, "epoch": 1473} {"train_loss": -11.81563663482666, "global_step": 247486, "epoch": 1473} {"train_loss": -12.006717681884766, "global_step": 247487, "epoch": 1473} {"train_loss": -11.857479095458984, "global_step": 247488, "epoch": 1473} {"train_loss": -11.889325141906738, "global_step": 247489, "epoch": 1473} {"train_loss": -11.988571166992188, "global_step": 247490, "epoch": 1473} {"train_loss": -11.846088409423828, "global_step": 247491, "epoch": 1473} {"train_loss": -12.086376190185547, "global_step": 247492, "epoch": 1473} {"train_loss": -11.872896194458008, "global_step": 247493, "epoch": 1473} {"train_loss": -12.032593727111816, "global_step": 247494, "epoch": 1473} {"train_loss": -12.025453567504883, "global_step": 247495, "epoch": 1473} {"train_loss": -11.995607376098633, "global_step": 247496, "epoch": 1473} {"train_loss": -12.10526180267334, "global_step": 247497, "epoch": 1473} {"train_loss": -11.87713623046875, "global_step": 247498, "epoch": 1473} {"train_loss": -11.99001693725586, "global_step": 247499, "epoch": 1473} {"train_loss": -12.154760360717773, "global_step": 247500, "epoch": 1473} {"train_loss": -12.00622272491455, "global_step": 247501, "epoch": 1473} {"train_loss": -12.062067031860352, "global_step": 247502, "epoch": 1473} {"train_loss": -12.16986083984375, "global_step": 247503, "epoch": 1473} {"train_loss": -12.17178726196289, "global_step": 247504, "epoch": 1473} {"train_loss": -11.801438331604004, "global_step": 247505, "epoch": 1473} {"train_loss": -12.100414276123047, "global_step": 247506, "epoch": 1473} {"train_loss": -11.924948692321777, "global_step": 247507, "epoch": 1473} {"train_loss": -12.070133209228516, "global_step": 247508, "epoch": 1473} {"train_loss": -12.366656303405762, "global_step": 247509, "epoch": 1473} {"train_loss": -11.968729019165039, "global_step": 247510, "epoch": 1473} {"train_loss": -12.142014503479004, "global_step": 247511, "epoch": 1473} {"train_loss": -12.265865325927734, "global_step": 247512, "epoch": 1473} {"train_loss": -11.692934036254883, "global_step": 247513, "epoch": 1473} {"train_loss": -12.082857131958008, "global_step": 247514, "epoch": 1473} {"train_loss": -11.745817184448242, "global_step": 247515, "epoch": 1473} {"train_loss": -11.927376747131348, "global_step": 247516, "epoch": 1473} {"train_loss": -12.304561614990234, "global_step": 247517, "epoch": 1473} {"train_loss": -12.11906623840332, "global_step": 247518, "epoch": 1473} {"train_loss": -11.924760818481445, "global_step": 247519, "epoch": 1473} {"train_loss": -12.206058502197266, "global_step": 247520, "epoch": 1473} {"train_loss": -12.105512619018555, "global_step": 247521, "epoch": 1473} {"train_loss": -11.524163246154785, "global_step": 247522, "epoch": 1473} {"train_loss": -12.027206420898438, "global_step": 247523, "epoch": 1473} {"train_loss": -12.236769676208496, "global_step": 247524, "epoch": 1473} {"train_loss": -12.039499282836914, "global_step": 247525, "epoch": 1473} {"train_loss": -12.101934432983398, "global_step": 247526, "epoch": 1473} {"train_loss": -11.97971248626709, "global_step": 247527, "epoch": 1473} {"train_loss": -12.031684875488281, "global_step": 247528, "epoch": 1473} {"train_loss": -12.078184127807617, "global_step": 247529, "epoch": 1473} {"train_loss": -11.37779426574707, "global_step": 247530, "epoch": 1473} {"train_loss": -10.65318775177002, "global_step": 247531, "epoch": 1473} {"train_loss": -11.577142715454102, "global_step": 247532, "epoch": 1473} {"train_loss": -12.064338684082031, "global_step": 247533, "epoch": 1473} {"train_loss": -11.585195541381836, "global_step": 247534, "epoch": 1473} {"train_loss": -11.573219299316406, "global_step": 247535, "epoch": 1473} {"train_loss": -11.990463256835938, "global_step": 247536, "epoch": 1473} {"train_loss": -11.683822631835938, "global_step": 247537, "epoch": 1473} {"train_loss": -12.366313934326172, "global_step": 247538, "epoch": 1473} {"train_loss": -12.274968147277832, "global_step": 247539, "epoch": 1473} {"train_loss": -12.079540252685547, "global_step": 247540, "epoch": 1473} {"train_loss": -11.986776351928711, "global_step": 247541, "epoch": 1473} {"train_loss": -12.040159225463867, "global_step": 247542, "epoch": 1473} {"train_loss": -11.968056678771973, "global_step": 247543, "epoch": 1473} {"train_loss": -11.842345237731934, "global_step": 247544, "epoch": 1473} {"train_loss": -12.054831504821777, "global_step": 247545, "epoch": 1473} {"train_loss": -12.035744667053223, "global_step": 247546, "epoch": 1473} {"train_loss": -12.077993392944336, "global_step": 247547, "epoch": 1473} {"train_loss": -12.094996452331543, "global_step": 247548, "epoch": 1473} {"train_loss": -11.854461669921875, "global_step": 247549, "epoch": 1473} {"train_loss": -12.094202041625977, "global_step": 247550, "epoch": 1473} {"train_loss": -11.794822692871094, "global_step": 247551, "epoch": 1473} {"train_loss": -11.805646896362305, "global_step": 247552, "epoch": 1473} {"train_loss": -11.758203506469727, "global_step": 247553, "epoch": 1473} {"train_loss": -12.148258209228516, "global_step": 247554, "epoch": 1473} {"train_loss": -11.352853775024414, "global_step": 247555, "epoch": 1473} {"train_loss": -12.036300659179688, "global_step": 247556, "epoch": 1473} {"train_loss": -11.70975112915039, "global_step": 247557, "epoch": 1473} {"train_loss": -11.668943405151367, "global_step": 247558, "epoch": 1473} {"train_loss": -12.014081954956055, "global_step": 247559, "epoch": 1473} {"train_loss": -11.965417861938477, "global_step": 247560, "epoch": 1473} {"train_loss": -11.627543449401855, "global_step": 247561, "epoch": 1473} {"train_loss": -11.185685157775879, "global_step": 247562, "epoch": 1473} {"train_loss": -12.226258277893066, "global_step": 247563, "epoch": 1473} {"train_loss": -11.273749351501465, "global_step": 247564, "epoch": 1473} {"train_loss": -11.33520221710205, "global_step": 247565, "epoch": 1473} {"train_loss": -11.324356079101562, "global_step": 247566, "epoch": 1473} {"train_loss": -10.898280143737793, "global_step": 247567, "epoch": 1473} {"train_loss": -10.822866439819336, "global_step": 247568, "epoch": 1473} {"train_loss": -11.677316665649414, "global_step": 247569, "epoch": 1473} {"train_loss": -11.58830738067627, "global_step": 247570, "epoch": 1473} {"train_loss": -10.826530456542969, "global_step": 247571, "epoch": 1473} {"train_loss": -11.143117904663086, "global_step": 247572, "epoch": 1473} {"train_loss": -11.990619659423828, "global_step": 247573, "epoch": 1473} {"train_loss": -10.986936569213867, "global_step": 247574, "epoch": 1473} {"train_loss": -11.090194702148438, "global_step": 247575, "epoch": 1473} {"train_loss": -11.514871597290039, "global_step": 247576, "epoch": 1473} {"train_loss": -11.133377075195312, "global_step": 247577, "epoch": 1473} {"train_loss": -11.13224983215332, "global_step": 247578, "epoch": 1473} {"train_loss": -11.014986038208008, "global_step": 247579, "epoch": 1473} {"train_loss": -12.024446487426758, "global_step": 247580, "epoch": 1473} {"train_loss": -11.35699462890625, "global_step": 247581, "epoch": 1473} {"train_loss": -11.499214172363281, "global_step": 247582, "epoch": 1473} {"train_loss": -11.35477066040039, "global_step": 247583, "epoch": 1473} {"train_loss": -9.105579376220703, "global_step": 247584, "epoch": 1473} {"train_loss": -11.417470932006836, "global_step": 247585, "epoch": 1473} {"train_loss": -10.283676147460938, "global_step": 247586, "epoch": 1473} {"train_loss": -10.389026641845703, "global_step": 247587, "epoch": 1473} {"train_loss": -10.580535888671875, "global_step": 247588, "epoch": 1473} {"train_loss": -8.646408081054688, "global_step": 247589, "epoch": 1473} {"train_loss": -8.720293045043945, "global_step": 247590, "epoch": 1473} {"train_loss": -9.362860679626465, "global_step": 247591, "epoch": 1473} {"train_loss": -9.052488327026367, "global_step": 247592, "epoch": 1473} {"train_loss": -8.397156715393066, "global_step": 247593, "epoch": 1473} {"train_loss": -8.034428596496582, "global_step": 247594, "epoch": 1473} {"train_loss": -8.031102180480957, "global_step": 247595, "epoch": 1473} {"train_loss": -7.676888942718506, "global_step": 247596, "epoch": 1473} {"train_loss": -8.631928443908691, "global_step": 247597, "epoch": 1473} {"train_loss": -8.633597373962402, "global_step": 247598, "epoch": 1473} {"train_loss": -8.893102645874023, "global_step": 247599, "epoch": 1473} {"train_loss": -8.759489059448242, "global_step": 247600, "epoch": 1473} {"train_loss": -8.842592239379883, "global_step": 247601, "epoch": 1473} {"train_loss": -10.401359558105469, "global_step": 247602, "epoch": 1473} {"train_loss": -9.743223190307617, "global_step": 247603, "epoch": 1473} {"train_loss": -10.608598709106445, "global_step": 247604, "epoch": 1473} {"train_loss": -10.037481307983398, "global_step": 247605, "epoch": 1473} {"train_loss": -9.379411697387695, "global_step": 247606, "epoch": 1473} {"train_loss": -9.870558738708496, "global_step": 247607, "epoch": 1473} {"train_loss": -10.301219940185547, "global_step": 247608, "epoch": 1473} {"train_loss": -10.263750076293945, "global_step": 247609, "epoch": 1473} {"train_loss": -10.236337661743164, "global_step": 247610, "epoch": 1473} {"train_loss": -11.254100799560547, "global_step": 247611, "epoch": 1473} {"train_loss": -10.469776153564453, "global_step": 247612, "epoch": 1473} {"train_loss": -10.52991771697998, "global_step": 247613, "epoch": 1473} {"train_loss": -10.998102188110352, "global_step": 247614, "epoch": 1473} {"train_loss": -10.4584379196167, "global_step": 247615, "epoch": 1473} {"train_loss": -11.104331016540527, "global_step": 247616, "epoch": 1473} {"train_loss": -10.833903312683105, "global_step": 247617, "epoch": 1473} {"train_loss": -10.854898452758789, "global_step": 247618, "epoch": 1473} {"train_loss": -11.204833984375, "global_step": 247619, "epoch": 1473} {"train_loss": -11.008291244506836, "global_step": 247620, "epoch": 1473} {"train_loss": -11.267082214355469, "global_step": 247621, "epoch": 1473} {"train_loss": -10.979812622070312, "global_step": 247622, "epoch": 1473} {"train_loss": -11.291613578796387, "global_step": 247623, "epoch": 1473} {"train_loss": -11.361916542053223, "global_step": 247624, "epoch": 1473} {"train_loss": -11.485849380493164, "global_step": 247625, "epoch": 1473} {"train_loss": -11.297581672668457, "global_step": 247626, "epoch": 1473} {"train_loss": -11.545848846435547, "global_step": 247627, "epoch": 1473} {"train_loss": -11.62639331817627, "global_step": 247628, "epoch": 1473} {"train_loss": -11.577676773071289, "global_step": 247629, "epoch": 1473} {"train_loss": -11.317113876342773, "global_step": 247630, "epoch": 1473} {"train_loss": -11.334017018477121, "global_step": 247631, "epoch": 1473, "val_loss": 261191.96875} {"train_loss": -11.50352954864502, "global_step": 247632, "epoch": 1474} {"train_loss": -11.357095718383789, "global_step": 247633, "epoch": 1474} {"train_loss": -11.550973892211914, "global_step": 247634, "epoch": 1474} {"train_loss": -11.584084510803223, "global_step": 247635, "epoch": 1474} {"train_loss": -11.412437438964844, "global_step": 247636, "epoch": 1474} {"train_loss": -11.504252433776855, "global_step": 247637, "epoch": 1474} {"train_loss": -11.618093490600586, "global_step": 247638, "epoch": 1474} {"train_loss": -11.804506301879883, "global_step": 247639, "epoch": 1474} {"train_loss": -11.62558650970459, "global_step": 247640, "epoch": 1474} {"train_loss": -11.47752571105957, "global_step": 247641, "epoch": 1474} {"train_loss": -11.59141731262207, "global_step": 247642, "epoch": 1474} {"train_loss": -11.724138259887695, "global_step": 247643, "epoch": 1474} {"train_loss": -11.668468475341797, "global_step": 247644, "epoch": 1474} {"train_loss": -11.915578842163086, "global_step": 247645, "epoch": 1474} {"train_loss": -11.835113525390625, "global_step": 247646, "epoch": 1474} {"train_loss": -11.637389183044434, "global_step": 247647, "epoch": 1474} {"train_loss": -11.704452514648438, "global_step": 247648, "epoch": 1474} {"train_loss": -11.677690505981445, "global_step": 247649, "epoch": 1474} {"train_loss": -11.823492050170898, "global_step": 247650, "epoch": 1474} {"train_loss": -11.683473587036133, "global_step": 247651, "epoch": 1474} {"train_loss": -11.958815574645996, "global_step": 247652, "epoch": 1474} {"train_loss": -11.813825607299805, "global_step": 247653, "epoch": 1474} {"train_loss": -11.834470748901367, "global_step": 247654, "epoch": 1474} {"train_loss": -11.95074462890625, "global_step": 247655, "epoch": 1474} {"train_loss": -11.748730659484863, "global_step": 247656, "epoch": 1474} {"train_loss": -11.80790901184082, "global_step": 247657, "epoch": 1474} {"train_loss": -11.606962203979492, "global_step": 247658, "epoch": 1474} {"train_loss": -11.779365539550781, "global_step": 247659, "epoch": 1474} {"train_loss": -11.713221549987793, "global_step": 247660, "epoch": 1474} {"train_loss": -11.868711471557617, "global_step": 247661, "epoch": 1474} {"train_loss": -11.932910919189453, "global_step": 247662, "epoch": 1474} {"train_loss": -11.972115516662598, "global_step": 247663, "epoch": 1474} {"train_loss": -12.047473907470703, "global_step": 247664, "epoch": 1474} {"train_loss": -12.042718887329102, "global_step": 247665, "epoch": 1474} {"train_loss": -12.08990478515625, "global_step": 247666, "epoch": 1474} {"train_loss": -11.98468017578125, "global_step": 247667, "epoch": 1474} {"train_loss": -11.976478576660156, "global_step": 247668, "epoch": 1474} {"train_loss": -11.925092697143555, "global_step": 247669, "epoch": 1474} {"train_loss": -11.972978591918945, "global_step": 247670, "epoch": 1474} {"train_loss": -12.150696754455566, "global_step": 247671, "epoch": 1474} {"train_loss": -12.224573135375977, "global_step": 247672, "epoch": 1474} {"train_loss": -11.89779281616211, "global_step": 247673, "epoch": 1474} {"train_loss": -12.06710433959961, "global_step": 247674, "epoch": 1474} {"train_loss": -12.046693801879883, "global_step": 247675, "epoch": 1474} {"train_loss": -12.089435577392578, "global_step": 247676, "epoch": 1474} {"train_loss": -12.19354248046875, "global_step": 247677, "epoch": 1474} {"train_loss": -12.167203903198242, "global_step": 247678, "epoch": 1474} {"train_loss": -12.110811233520508, "global_step": 247679, "epoch": 1474} {"train_loss": -12.132237434387207, "global_step": 247680, "epoch": 1474} {"train_loss": -12.178447723388672, "global_step": 247681, "epoch": 1474} {"train_loss": -12.142807006835938, "global_step": 247682, "epoch": 1474} {"train_loss": -12.207484245300293, "global_step": 247683, "epoch": 1474} {"train_loss": -12.074663162231445, "global_step": 247684, "epoch": 1474} {"train_loss": -11.925531387329102, "global_step": 247685, "epoch": 1474} {"train_loss": -12.222984313964844, "global_step": 247686, "epoch": 1474} {"train_loss": -12.05695915222168, "global_step": 247687, "epoch": 1474} {"train_loss": -11.96002197265625, "global_step": 247688, "epoch": 1474} {"train_loss": -12.145054817199707, "global_step": 247689, "epoch": 1474} {"train_loss": -11.931293487548828, "global_step": 247690, "epoch": 1474} {"train_loss": -12.263124465942383, "global_step": 247691, "epoch": 1474} {"train_loss": -11.829747200012207, "global_step": 247692, "epoch": 1474} {"train_loss": -12.14627742767334, "global_step": 247693, "epoch": 1474} {"train_loss": -12.117696762084961, "global_step": 247694, "epoch": 1474} {"train_loss": -12.174768447875977, "global_step": 247695, "epoch": 1474} {"train_loss": -12.063130378723145, "global_step": 247696, "epoch": 1474} {"train_loss": -11.410395622253418, "global_step": 247697, "epoch": 1474} {"train_loss": -12.04580020904541, "global_step": 247698, "epoch": 1474} {"train_loss": -11.844942092895508, "global_step": 247699, "epoch": 1474} {"train_loss": -11.436702728271484, "global_step": 247700, "epoch": 1474} {"train_loss": -10.887259483337402, "global_step": 247701, "epoch": 1474} {"train_loss": -11.819671630859375, "global_step": 247702, "epoch": 1474} {"train_loss": -11.465354919433594, "global_step": 247703, "epoch": 1474} {"train_loss": -12.004400253295898, "global_step": 247704, "epoch": 1474} {"train_loss": -11.219215393066406, "global_step": 247705, "epoch": 1474} {"train_loss": -11.533294677734375, "global_step": 247706, "epoch": 1474} {"train_loss": -11.75284194946289, "global_step": 247707, "epoch": 1474} {"train_loss": -12.034405708312988, "global_step": 247708, "epoch": 1474} {"train_loss": -11.800823211669922, "global_step": 247709, "epoch": 1474} {"train_loss": -11.855030059814453, "global_step": 247710, "epoch": 1474} {"train_loss": -12.001235961914062, "global_step": 247711, "epoch": 1474} {"train_loss": -12.076031684875488, "global_step": 247712, "epoch": 1474} {"train_loss": -11.827780723571777, "global_step": 247713, "epoch": 1474} {"train_loss": -12.18929672241211, "global_step": 247714, "epoch": 1474} {"train_loss": -12.035050392150879, "global_step": 247715, "epoch": 1474} {"train_loss": -11.99561595916748, "global_step": 247716, "epoch": 1474} {"train_loss": -11.809500694274902, "global_step": 247717, "epoch": 1474} {"train_loss": -12.359367370605469, "global_step": 247718, "epoch": 1474} {"train_loss": -11.755860328674316, "global_step": 247719, "epoch": 1474} {"train_loss": -11.985719680786133, "global_step": 247720, "epoch": 1474} {"train_loss": -12.139763832092285, "global_step": 247721, "epoch": 1474} {"train_loss": -11.837011337280273, "global_step": 247722, "epoch": 1474} {"train_loss": -11.535097122192383, "global_step": 247723, "epoch": 1474} {"train_loss": -11.810586929321289, "global_step": 247724, "epoch": 1474} {"train_loss": -11.45705795288086, "global_step": 247725, "epoch": 1474} {"train_loss": -11.216267585754395, "global_step": 247726, "epoch": 1474} {"train_loss": -11.691865921020508, "global_step": 247727, "epoch": 1474} {"train_loss": -11.852180480957031, "global_step": 247728, "epoch": 1474} {"train_loss": -11.419427871704102, "global_step": 247729, "epoch": 1474} {"train_loss": -11.73127555847168, "global_step": 247730, "epoch": 1474} {"train_loss": -11.841243743896484, "global_step": 247731, "epoch": 1474} {"train_loss": -10.043344497680664, "global_step": 247732, "epoch": 1474} {"train_loss": -10.350358963012695, "global_step": 247733, "epoch": 1474} {"train_loss": -11.620582580566406, "global_step": 247734, "epoch": 1474} {"train_loss": -9.882268905639648, "global_step": 247735, "epoch": 1474} {"train_loss": -10.655372619628906, "global_step": 247736, "epoch": 1474} {"train_loss": -10.868824005126953, "global_step": 247737, "epoch": 1474} {"train_loss": -10.58713150024414, "global_step": 247738, "epoch": 1474} {"train_loss": -10.820892333984375, "global_step": 247739, "epoch": 1474} {"train_loss": -11.552339553833008, "global_step": 247740, "epoch": 1474} {"train_loss": -10.8994140625, "global_step": 247741, "epoch": 1474} {"train_loss": -11.319992065429688, "global_step": 247742, "epoch": 1474} {"train_loss": -11.512916564941406, "global_step": 247743, "epoch": 1474} {"train_loss": -10.803874015808105, "global_step": 247744, "epoch": 1474} {"train_loss": -11.867841720581055, "global_step": 247745, "epoch": 1474} {"train_loss": -11.540216445922852, "global_step": 247746, "epoch": 1474} {"train_loss": -11.649059295654297, "global_step": 247747, "epoch": 1474} {"train_loss": -11.448567390441895, "global_step": 247748, "epoch": 1474} {"train_loss": -11.791627883911133, "global_step": 247749, "epoch": 1474} {"train_loss": -10.84494400024414, "global_step": 247750, "epoch": 1474} {"train_loss": -11.716376304626465, "global_step": 247751, "epoch": 1474} {"train_loss": -11.286739349365234, "global_step": 247752, "epoch": 1474} {"train_loss": -11.469327926635742, "global_step": 247753, "epoch": 1474} {"train_loss": -11.666748046875, "global_step": 247754, "epoch": 1474} {"train_loss": -10.985119819641113, "global_step": 247755, "epoch": 1474} {"train_loss": -10.38160228729248, "global_step": 247756, "epoch": 1474} {"train_loss": -11.692649841308594, "global_step": 247757, "epoch": 1474} {"train_loss": -11.060802459716797, "global_step": 247758, "epoch": 1474} {"train_loss": -11.775104522705078, "global_step": 247759, "epoch": 1474} {"train_loss": -11.676458358764648, "global_step": 247760, "epoch": 1474} {"train_loss": -11.654336929321289, "global_step": 247761, "epoch": 1474} {"train_loss": -11.487963676452637, "global_step": 247762, "epoch": 1474} {"train_loss": -11.4393892288208, "global_step": 247763, "epoch": 1474} {"train_loss": -11.617475509643555, "global_step": 247764, "epoch": 1474} {"train_loss": -11.676712036132812, "global_step": 247765, "epoch": 1474} {"train_loss": -11.772553443908691, "global_step": 247766, "epoch": 1474} {"train_loss": -11.487188339233398, "global_step": 247767, "epoch": 1474} {"train_loss": -11.768777847290039, "global_step": 247768, "epoch": 1474} {"train_loss": -11.791610717773438, "global_step": 247769, "epoch": 1474} {"train_loss": -11.848922729492188, "global_step": 247770, "epoch": 1474} {"train_loss": -11.785684585571289, "global_step": 247771, "epoch": 1474} {"train_loss": -12.013252258300781, "global_step": 247772, "epoch": 1474} {"train_loss": -11.814634323120117, "global_step": 247773, "epoch": 1474} {"train_loss": -11.846596717834473, "global_step": 247774, "epoch": 1474} {"train_loss": -11.921743392944336, "global_step": 247775, "epoch": 1474} {"train_loss": -11.80253791809082, "global_step": 247776, "epoch": 1474} {"train_loss": -11.846380233764648, "global_step": 247777, "epoch": 1474} {"train_loss": -11.928092002868652, "global_step": 247778, "epoch": 1474} {"train_loss": -11.7868013381958, "global_step": 247779, "epoch": 1474} {"train_loss": -12.070796012878418, "global_step": 247780, "epoch": 1474} {"train_loss": -11.873832702636719, "global_step": 247781, "epoch": 1474} {"train_loss": -12.067598342895508, "global_step": 247782, "epoch": 1474} {"train_loss": -12.015541076660156, "global_step": 247783, "epoch": 1474} {"train_loss": -12.057220458984375, "global_step": 247784, "epoch": 1474} {"train_loss": -12.057372093200684, "global_step": 247785, "epoch": 1474} {"train_loss": -12.170654296875, "global_step": 247786, "epoch": 1474} {"train_loss": -12.208688735961914, "global_step": 247787, "epoch": 1474} {"train_loss": -11.775092124938965, "global_step": 247788, "epoch": 1474} {"train_loss": -12.245058059692383, "global_step": 247789, "epoch": 1474} {"train_loss": -12.278331756591797, "global_step": 247790, "epoch": 1474} {"train_loss": -11.885679244995117, "global_step": 247791, "epoch": 1474} {"train_loss": -12.145838737487793, "global_step": 247792, "epoch": 1474} {"train_loss": -12.123064041137695, "global_step": 247793, "epoch": 1474} {"train_loss": -12.148783683776855, "global_step": 247794, "epoch": 1474} {"train_loss": -12.176897048950195, "global_step": 247795, "epoch": 1474} {"train_loss": -12.242352485656738, "global_step": 247796, "epoch": 1474} {"train_loss": -12.085638046264648, "global_step": 247797, "epoch": 1474} {"train_loss": -11.979345321655273, "global_step": 247798, "epoch": 1474} {"train_loss": -11.747999798683892, "global_step": 247799, "epoch": 1474, "val_loss": 267898.6875} {"train_loss": -11.863851547241211, "global_step": 247800, "epoch": 1475} {"train_loss": -11.849876403808594, "global_step": 247801, "epoch": 1475} {"train_loss": -12.020971298217773, "global_step": 247802, "epoch": 1475} {"train_loss": -11.621939659118652, "global_step": 247803, "epoch": 1475} {"train_loss": -12.010032653808594, "global_step": 247804, "epoch": 1475} {"train_loss": -11.832927703857422, "global_step": 247805, "epoch": 1475} {"train_loss": -11.741302490234375, "global_step": 247806, "epoch": 1475} {"train_loss": -12.044037818908691, "global_step": 247807, "epoch": 1475} {"train_loss": -11.651555061340332, "global_step": 247808, "epoch": 1475} {"train_loss": -11.892705917358398, "global_step": 247809, "epoch": 1475} {"train_loss": -11.856023788452148, "global_step": 247810, "epoch": 1475} {"train_loss": -12.093605041503906, "global_step": 247811, "epoch": 1475} {"train_loss": -12.062118530273438, "global_step": 247812, "epoch": 1475} {"train_loss": -11.943829536437988, "global_step": 247813, "epoch": 1475} {"train_loss": -11.793347358703613, "global_step": 247814, "epoch": 1475} {"train_loss": -12.000764846801758, "global_step": 247815, "epoch": 1475} {"train_loss": -12.089877128601074, "global_step": 247816, "epoch": 1475} {"train_loss": -12.016481399536133, "global_step": 247817, "epoch": 1475} {"train_loss": -12.113480567932129, "global_step": 247818, "epoch": 1475} {"train_loss": -11.971954345703125, "global_step": 247819, "epoch": 1475} {"train_loss": -12.064356803894043, "global_step": 247820, "epoch": 1475} {"train_loss": -11.667068481445312, "global_step": 247821, "epoch": 1475} {"train_loss": -11.889978408813477, "global_step": 247822, "epoch": 1475} {"train_loss": -12.347604751586914, "global_step": 247823, "epoch": 1475} {"train_loss": -12.124259948730469, "global_step": 247824, "epoch": 1475} {"train_loss": -11.485692977905273, "global_step": 247825, "epoch": 1475} {"train_loss": -11.648080825805664, "global_step": 247826, "epoch": 1475} {"train_loss": -11.933746337890625, "global_step": 247827, "epoch": 1475} {"train_loss": -11.811403274536133, "global_step": 247828, "epoch": 1475} {"train_loss": -12.101869583129883, "global_step": 247829, "epoch": 1475} {"train_loss": -11.690492630004883, "global_step": 247830, "epoch": 1475} {"train_loss": -12.029793739318848, "global_step": 247831, "epoch": 1475} {"train_loss": -11.836926460266113, "global_step": 247832, "epoch": 1475} {"train_loss": -11.867512702941895, "global_step": 247833, "epoch": 1475} {"train_loss": -11.44814682006836, "global_step": 247834, "epoch": 1475} {"train_loss": -10.537843704223633, "global_step": 247835, "epoch": 1475} {"train_loss": -10.857181549072266, "global_step": 247836, "epoch": 1475} {"train_loss": -11.609743118286133, "global_step": 247837, "epoch": 1475} {"train_loss": -10.418375968933105, "global_step": 247838, "epoch": 1475} {"train_loss": -10.672098159790039, "global_step": 247839, "epoch": 1475} {"train_loss": -11.586312294006348, "global_step": 247840, "epoch": 1475} {"train_loss": -11.008232116699219, "global_step": 247841, "epoch": 1475} {"train_loss": -11.990262985229492, "global_step": 247842, "epoch": 1475} {"train_loss": -11.204707145690918, "global_step": 247843, "epoch": 1475} {"train_loss": -11.757158279418945, "global_step": 247844, "epoch": 1475} {"train_loss": -11.406881332397461, "global_step": 247845, "epoch": 1475} {"train_loss": -11.067794799804688, "global_step": 247846, "epoch": 1475} {"train_loss": -11.279934883117676, "global_step": 247847, "epoch": 1475} {"train_loss": -10.216171264648438, "global_step": 247848, "epoch": 1475} {"train_loss": -11.444812774658203, "global_step": 247849, "epoch": 1475} {"train_loss": -10.401012420654297, "global_step": 247850, "epoch": 1475} {"train_loss": -10.4637451171875, "global_step": 247851, "epoch": 1475} {"train_loss": -10.083601951599121, "global_step": 247852, "epoch": 1475} {"train_loss": -11.309602737426758, "global_step": 247853, "epoch": 1475} {"train_loss": -8.940411567687988, "global_step": 247854, "epoch": 1475} {"train_loss": -10.412590980529785, "global_step": 247855, "epoch": 1475} {"train_loss": -9.263871192932129, "global_step": 247856, "epoch": 1475} {"train_loss": -9.456783294677734, "global_step": 247857, "epoch": 1475} {"train_loss": -9.406702041625977, "global_step": 247858, "epoch": 1475} {"train_loss": -10.318178176879883, "global_step": 247859, "epoch": 1475} {"train_loss": -11.161554336547852, "global_step": 247860, "epoch": 1475} {"train_loss": -10.291728973388672, "global_step": 247861, "epoch": 1475} {"train_loss": -11.515053749084473, "global_step": 247862, "epoch": 1475} {"train_loss": -9.933517456054688, "global_step": 247863, "epoch": 1475} {"train_loss": -11.164987564086914, "global_step": 247864, "epoch": 1475} {"train_loss": -11.412477493286133, "global_step": 247865, "epoch": 1475} {"train_loss": -10.216747283935547, "global_step": 247866, "epoch": 1475} {"train_loss": -11.492920875549316, "global_step": 247867, "epoch": 1475} {"train_loss": -10.933849334716797, "global_step": 247868, "epoch": 1475} {"train_loss": -11.378519058227539, "global_step": 247869, "epoch": 1475} {"train_loss": -11.233840942382812, "global_step": 247870, "epoch": 1475} {"train_loss": -10.935541152954102, "global_step": 247871, "epoch": 1475} {"train_loss": -11.52471923828125, "global_step": 247872, "epoch": 1475} {"train_loss": -11.132299423217773, "global_step": 247873, "epoch": 1475} {"train_loss": -11.551767349243164, "global_step": 247874, "epoch": 1475} {"train_loss": -11.544180870056152, "global_step": 247875, "epoch": 1475} {"train_loss": -11.303773880004883, "global_step": 247876, "epoch": 1475} {"train_loss": -11.69270133972168, "global_step": 247877, "epoch": 1475} {"train_loss": -11.584617614746094, "global_step": 247878, "epoch": 1475} {"train_loss": -11.46944808959961, "global_step": 247879, "epoch": 1475} {"train_loss": -11.818153381347656, "global_step": 247880, "epoch": 1475} {"train_loss": -11.84112548828125, "global_step": 247881, "epoch": 1475} {"train_loss": -11.559976577758789, "global_step": 247882, "epoch": 1475} {"train_loss": -11.63271427154541, "global_step": 247883, "epoch": 1475} {"train_loss": -11.769824981689453, "global_step": 247884, "epoch": 1475} {"train_loss": -11.562759399414062, "global_step": 247885, "epoch": 1475} {"train_loss": -11.945748329162598, "global_step": 247886, "epoch": 1475} {"train_loss": -11.852869033813477, "global_step": 247887, "epoch": 1475} {"train_loss": -11.622034072875977, "global_step": 247888, "epoch": 1475} {"train_loss": -11.773029327392578, "global_step": 247889, "epoch": 1475} {"train_loss": -11.755687713623047, "global_step": 247890, "epoch": 1475} {"train_loss": -11.777374267578125, "global_step": 247891, "epoch": 1475} {"train_loss": -11.933977127075195, "global_step": 247892, "epoch": 1475} {"train_loss": -11.57550048828125, "global_step": 247893, "epoch": 1475} {"train_loss": -11.58829402923584, "global_step": 247894, "epoch": 1475} {"train_loss": -11.58215618133545, "global_step": 247895, "epoch": 1475} {"train_loss": -11.703869819641113, "global_step": 247896, "epoch": 1475} {"train_loss": -11.754402160644531, "global_step": 247897, "epoch": 1475} {"train_loss": -12.086030960083008, "global_step": 247898, "epoch": 1475} {"train_loss": -11.668333053588867, "global_step": 247899, "epoch": 1475} {"train_loss": -11.955501556396484, "global_step": 247900, "epoch": 1475} {"train_loss": -11.653318405151367, "global_step": 247901, "epoch": 1475} {"train_loss": -11.881735801696777, "global_step": 247902, "epoch": 1475} {"train_loss": -11.831762313842773, "global_step": 247903, "epoch": 1475} {"train_loss": -11.618515014648438, "global_step": 247904, "epoch": 1475} {"train_loss": -11.809183120727539, "global_step": 247905, "epoch": 1475} {"train_loss": -11.444278717041016, "global_step": 247906, "epoch": 1475} {"train_loss": -11.85249137878418, "global_step": 247907, "epoch": 1475} {"train_loss": -11.50960922241211, "global_step": 247908, "epoch": 1475} {"train_loss": -11.455460548400879, "global_step": 247909, "epoch": 1475} {"train_loss": -11.621213912963867, "global_step": 247910, "epoch": 1475} {"train_loss": -11.634777069091797, "global_step": 247911, "epoch": 1475} {"train_loss": -12.146236419677734, "global_step": 247912, "epoch": 1475} {"train_loss": -11.614128112792969, "global_step": 247913, "epoch": 1475} {"train_loss": -12.091737747192383, "global_step": 247914, "epoch": 1475} {"train_loss": -11.864198684692383, "global_step": 247915, "epoch": 1475} {"train_loss": -11.547938346862793, "global_step": 247916, "epoch": 1475} {"train_loss": -12.021585464477539, "global_step": 247917, "epoch": 1475} {"train_loss": -11.716514587402344, "global_step": 247918, "epoch": 1475} {"train_loss": -11.945263862609863, "global_step": 247919, "epoch": 1475} {"train_loss": -12.013650894165039, "global_step": 247920, "epoch": 1475} {"train_loss": -11.50688362121582, "global_step": 247921, "epoch": 1475} {"train_loss": -11.885286331176758, "global_step": 247922, "epoch": 1475} {"train_loss": -11.66046142578125, "global_step": 247923, "epoch": 1475} {"train_loss": -11.808183670043945, "global_step": 247924, "epoch": 1475} {"train_loss": -11.975473403930664, "global_step": 247925, "epoch": 1475} {"train_loss": -11.99641227722168, "global_step": 247926, "epoch": 1475} {"train_loss": -11.645307540893555, "global_step": 247927, "epoch": 1475} {"train_loss": -11.966859817504883, "global_step": 247928, "epoch": 1475} {"train_loss": -11.626320838928223, "global_step": 247929, "epoch": 1475} {"train_loss": -11.906158447265625, "global_step": 247930, "epoch": 1475} {"train_loss": -11.698081970214844, "global_step": 247931, "epoch": 1475} {"train_loss": -11.259531021118164, "global_step": 247932, "epoch": 1475} {"train_loss": -11.966712951660156, "global_step": 247933, "epoch": 1475} {"train_loss": -11.669032096862793, "global_step": 247934, "epoch": 1475} {"train_loss": -11.74461555480957, "global_step": 247935, "epoch": 1475} {"train_loss": -11.762240409851074, "global_step": 247936, "epoch": 1475} {"train_loss": -11.273838996887207, "global_step": 247937, "epoch": 1475} {"train_loss": -11.908456802368164, "global_step": 247938, "epoch": 1475} {"train_loss": -12.109854698181152, "global_step": 247939, "epoch": 1475} {"train_loss": -11.63644790649414, "global_step": 247940, "epoch": 1475} {"train_loss": -11.68435287475586, "global_step": 247941, "epoch": 1475} {"train_loss": -11.719992637634277, "global_step": 247942, "epoch": 1475} {"train_loss": -11.195243835449219, "global_step": 247943, "epoch": 1475} {"train_loss": -11.409822463989258, "global_step": 247944, "epoch": 1475} {"train_loss": -11.962387084960938, "global_step": 247945, "epoch": 1475} {"train_loss": -11.17564582824707, "global_step": 247946, "epoch": 1475} {"train_loss": -11.399270057678223, "global_step": 247947, "epoch": 1475} {"train_loss": -11.623029708862305, "global_step": 247948, "epoch": 1475} {"train_loss": -11.85269832611084, "global_step": 247949, "epoch": 1475} {"train_loss": -11.999282836914062, "global_step": 247950, "epoch": 1475} {"train_loss": -11.913684844970703, "global_step": 247951, "epoch": 1475} {"train_loss": -11.574593544006348, "global_step": 247952, "epoch": 1475} {"train_loss": -11.874406814575195, "global_step": 247953, "epoch": 1475} {"train_loss": -11.602384567260742, "global_step": 247954, "epoch": 1475} {"train_loss": -11.120718002319336, "global_step": 247955, "epoch": 1475} {"train_loss": -11.611108779907227, "global_step": 247956, "epoch": 1475} {"train_loss": -11.622011184692383, "global_step": 247957, "epoch": 1475} {"train_loss": -10.798816680908203, "global_step": 247958, "epoch": 1475} {"train_loss": -11.938146591186523, "global_step": 247959, "epoch": 1475} {"train_loss": -11.881044387817383, "global_step": 247960, "epoch": 1475} {"train_loss": -11.904212951660156, "global_step": 247961, "epoch": 1475} {"train_loss": -11.72307014465332, "global_step": 247962, "epoch": 1475} {"train_loss": -11.480915069580078, "global_step": 247963, "epoch": 1475} {"train_loss": -10.830268859863281, "global_step": 247964, "epoch": 1475} {"train_loss": -11.748833656311035, "global_step": 247965, "epoch": 1475} {"train_loss": -11.054218292236328, "global_step": 247966, "epoch": 1475} {"train_loss": -11.522747232800437, "global_step": 247967, "epoch": 1475, "val_loss": 269512.34375, "train_action_mse_error": 2.282411575317383} {"train_loss": -11.961528778076172, "global_step": 247968, "epoch": 1476} {"train_loss": -11.34079647064209, "global_step": 247969, "epoch": 1476} {"train_loss": -11.285404205322266, "global_step": 247970, "epoch": 1476} {"train_loss": -11.529390335083008, "global_step": 247971, "epoch": 1476} {"train_loss": -11.346092224121094, "global_step": 247972, "epoch": 1476} {"train_loss": -11.373492240905762, "global_step": 247973, "epoch": 1476} {"train_loss": -11.569253921508789, "global_step": 247974, "epoch": 1476} {"train_loss": -11.397660255432129, "global_step": 247975, "epoch": 1476} {"train_loss": -11.07963752746582, "global_step": 247976, "epoch": 1476} {"train_loss": -11.732297897338867, "global_step": 247977, "epoch": 1476} {"train_loss": -11.013578414916992, "global_step": 247978, "epoch": 1476} {"train_loss": -11.350358963012695, "global_step": 247979, "epoch": 1476} {"train_loss": -11.075273513793945, "global_step": 247980, "epoch": 1476} {"train_loss": -10.638147354125977, "global_step": 247981, "epoch": 1476} {"train_loss": -11.76301097869873, "global_step": 247982, "epoch": 1476} {"train_loss": -11.353209495544434, "global_step": 247983, "epoch": 1476} {"train_loss": -11.781830787658691, "global_step": 247984, "epoch": 1476} {"train_loss": -11.506125450134277, "global_step": 247985, "epoch": 1476} {"train_loss": -11.304609298706055, "global_step": 247986, "epoch": 1476} {"train_loss": -11.824968338012695, "global_step": 247987, "epoch": 1476} {"train_loss": -10.889325141906738, "global_step": 247988, "epoch": 1476} {"train_loss": -11.758310317993164, "global_step": 247989, "epoch": 1476} {"train_loss": -11.158028602600098, "global_step": 247990, "epoch": 1476} {"train_loss": -11.651906967163086, "global_step": 247991, "epoch": 1476} {"train_loss": -11.255228996276855, "global_step": 247992, "epoch": 1476} {"train_loss": -11.805883407592773, "global_step": 247993, "epoch": 1476} {"train_loss": -11.272589683532715, "global_step": 247994, "epoch": 1476} {"train_loss": -11.706424713134766, "global_step": 247995, "epoch": 1476} {"train_loss": -11.880950927734375, "global_step": 247996, "epoch": 1476} {"train_loss": -11.813169479370117, "global_step": 247997, "epoch": 1476} {"train_loss": -11.860023498535156, "global_step": 247998, "epoch": 1476} {"train_loss": -11.60999584197998, "global_step": 247999, "epoch": 1476} {"train_loss": -11.696853637695312, "global_step": 248000, "epoch": 1476} {"train_loss": -11.815104484558105, "global_step": 248001, "epoch": 1476} {"train_loss": -11.801231384277344, "global_step": 248002, "epoch": 1476} {"train_loss": -11.768532752990723, "global_step": 248003, "epoch": 1476} {"train_loss": -11.46088695526123, "global_step": 248004, "epoch": 1476} {"train_loss": -11.903491020202637, "global_step": 248005, "epoch": 1476} {"train_loss": -11.493282318115234, "global_step": 248006, "epoch": 1476} {"train_loss": -11.72451114654541, "global_step": 248007, "epoch": 1476} {"train_loss": -11.122303009033203, "global_step": 248008, "epoch": 1476} {"train_loss": -11.79150390625, "global_step": 248009, "epoch": 1476} {"train_loss": -10.958268165588379, "global_step": 248010, "epoch": 1476} {"train_loss": -11.62045669555664, "global_step": 248011, "epoch": 1476} {"train_loss": -11.284109115600586, "global_step": 248012, "epoch": 1476} {"train_loss": -11.35971736907959, "global_step": 248013, "epoch": 1476} {"train_loss": -11.600604057312012, "global_step": 248014, "epoch": 1476} {"train_loss": -11.386852264404297, "global_step": 248015, "epoch": 1476} {"train_loss": -10.835634231567383, "global_step": 248016, "epoch": 1476} {"train_loss": -11.150245666503906, "global_step": 248017, "epoch": 1476} {"train_loss": -9.553705215454102, "global_step": 248018, "epoch": 1476} {"train_loss": -7.847546577453613, "global_step": 248019, "epoch": 1476} {"train_loss": -8.664468765258789, "global_step": 248020, "epoch": 1476} {"train_loss": -9.882018089294434, "global_step": 248021, "epoch": 1476} {"train_loss": -9.744478225708008, "global_step": 248022, "epoch": 1476} {"train_loss": -8.635952949523926, "global_step": 248023, "epoch": 1476} {"train_loss": -8.155487060546875, "global_step": 248024, "epoch": 1476} {"train_loss": -7.758446216583252, "global_step": 248025, "epoch": 1476} {"train_loss": -8.473844528198242, "global_step": 248026, "epoch": 1476} {"train_loss": -9.173338890075684, "global_step": 248027, "epoch": 1476} {"train_loss": -8.447242736816406, "global_step": 248028, "epoch": 1476} {"train_loss": -8.42614459991455, "global_step": 248029, "epoch": 1476} {"train_loss": -8.462940216064453, "global_step": 248030, "epoch": 1476} {"train_loss": -8.424189567565918, "global_step": 248031, "epoch": 1476} {"train_loss": -9.381521224975586, "global_step": 248032, "epoch": 1476} {"train_loss": -9.303424835205078, "global_step": 248033, "epoch": 1476} {"train_loss": -10.358884811401367, "global_step": 248034, "epoch": 1476} {"train_loss": -9.61546802520752, "global_step": 248035, "epoch": 1476} {"train_loss": -10.872783660888672, "global_step": 248036, "epoch": 1476} {"train_loss": -10.75136947631836, "global_step": 248037, "epoch": 1476} {"train_loss": -9.730923652648926, "global_step": 248038, "epoch": 1476} {"train_loss": -10.782894134521484, "global_step": 248039, "epoch": 1476} {"train_loss": -10.967351913452148, "global_step": 248040, "epoch": 1476} {"train_loss": -10.450889587402344, "global_step": 248041, "epoch": 1476} {"train_loss": -10.72110366821289, "global_step": 248042, "epoch": 1476} {"train_loss": -10.97574234008789, "global_step": 248043, "epoch": 1476} {"train_loss": -10.716794967651367, "global_step": 248044, "epoch": 1476} {"train_loss": -10.887964248657227, "global_step": 248045, "epoch": 1476} {"train_loss": -11.248710632324219, "global_step": 248046, "epoch": 1476} {"train_loss": -10.675045013427734, "global_step": 248047, "epoch": 1476} {"train_loss": -11.281606674194336, "global_step": 248048, "epoch": 1476} {"train_loss": -10.95715618133545, "global_step": 248049, "epoch": 1476} {"train_loss": -11.214372634887695, "global_step": 248050, "epoch": 1476} {"train_loss": -11.007490158081055, "global_step": 248051, "epoch": 1476} {"train_loss": -10.925497055053711, "global_step": 248052, "epoch": 1476} {"train_loss": -11.214853286743164, "global_step": 248053, "epoch": 1476} {"train_loss": -10.860223770141602, "global_step": 248054, "epoch": 1476} {"train_loss": -11.082544326782227, "global_step": 248055, "epoch": 1476} {"train_loss": -11.45993423461914, "global_step": 248056, "epoch": 1476} {"train_loss": -11.12101936340332, "global_step": 248057, "epoch": 1476} {"train_loss": -11.240447044372559, "global_step": 248058, "epoch": 1476} {"train_loss": -11.239886283874512, "global_step": 248059, "epoch": 1476} {"train_loss": -11.326786994934082, "global_step": 248060, "epoch": 1476} {"train_loss": -11.348681449890137, "global_step": 248061, "epoch": 1476} {"train_loss": -11.125213623046875, "global_step": 248062, "epoch": 1476} {"train_loss": -11.370874404907227, "global_step": 248063, "epoch": 1476} {"train_loss": -11.177894592285156, "global_step": 248064, "epoch": 1476} {"train_loss": -11.43470573425293, "global_step": 248065, "epoch": 1476} {"train_loss": -11.435726165771484, "global_step": 248066, "epoch": 1476} {"train_loss": -11.624265670776367, "global_step": 248067, "epoch": 1476} {"train_loss": -11.472993850708008, "global_step": 248068, "epoch": 1476} {"train_loss": -11.434124946594238, "global_step": 248069, "epoch": 1476} {"train_loss": -11.847536087036133, "global_step": 248070, "epoch": 1476} {"train_loss": -11.340867042541504, "global_step": 248071, "epoch": 1476} {"train_loss": -11.678650856018066, "global_step": 248072, "epoch": 1476} {"train_loss": -11.571632385253906, "global_step": 248073, "epoch": 1476} {"train_loss": -11.640541076660156, "global_step": 248074, "epoch": 1476} {"train_loss": -11.857839584350586, "global_step": 248075, "epoch": 1476} {"train_loss": -11.646736145019531, "global_step": 248076, "epoch": 1476} {"train_loss": -11.952385902404785, "global_step": 248077, "epoch": 1476} {"train_loss": -11.52011489868164, "global_step": 248078, "epoch": 1476} {"train_loss": -11.737773895263672, "global_step": 248079, "epoch": 1476} {"train_loss": -11.797978401184082, "global_step": 248080, "epoch": 1476} {"train_loss": -11.796521186828613, "global_step": 248081, "epoch": 1476} {"train_loss": -11.900655746459961, "global_step": 248082, "epoch": 1476} {"train_loss": -11.906309127807617, "global_step": 248083, "epoch": 1476} {"train_loss": -11.854724884033203, "global_step": 248084, "epoch": 1476} {"train_loss": -11.813493728637695, "global_step": 248085, "epoch": 1476} {"train_loss": -11.746633529663086, "global_step": 248086, "epoch": 1476} {"train_loss": -11.93165397644043, "global_step": 248087, "epoch": 1476} {"train_loss": -11.722672462463379, "global_step": 248088, "epoch": 1476} {"train_loss": -11.873405456542969, "global_step": 248089, "epoch": 1476} {"train_loss": -11.804132461547852, "global_step": 248090, "epoch": 1476} {"train_loss": -11.974777221679688, "global_step": 248091, "epoch": 1476} {"train_loss": -12.019336700439453, "global_step": 248092, "epoch": 1476} {"train_loss": -11.976723670959473, "global_step": 248093, "epoch": 1476} {"train_loss": -12.064680099487305, "global_step": 248094, "epoch": 1476} {"train_loss": -12.171296119689941, "global_step": 248095, "epoch": 1476} {"train_loss": -12.115817070007324, "global_step": 248096, "epoch": 1476} {"train_loss": -12.20079231262207, "global_step": 248097, "epoch": 1476} {"train_loss": -12.023706436157227, "global_step": 248098, "epoch": 1476} {"train_loss": -12.038042068481445, "global_step": 248099, "epoch": 1476} {"train_loss": -11.964289665222168, "global_step": 248100, "epoch": 1476} {"train_loss": -11.984893798828125, "global_step": 248101, "epoch": 1476} {"train_loss": -11.987300872802734, "global_step": 248102, "epoch": 1476} {"train_loss": -12.099702835083008, "global_step": 248103, "epoch": 1476} {"train_loss": -12.161087989807129, "global_step": 248104, "epoch": 1476} {"train_loss": -12.288908004760742, "global_step": 248105, "epoch": 1476} {"train_loss": -12.118110656738281, "global_step": 248106, "epoch": 1476} {"train_loss": -11.997228622436523, "global_step": 248107, "epoch": 1476} {"train_loss": -12.0006742477417, "global_step": 248108, "epoch": 1476} {"train_loss": -11.90779972076416, "global_step": 248109, "epoch": 1476} {"train_loss": -12.254813194274902, "global_step": 248110, "epoch": 1476} {"train_loss": -11.976531028747559, "global_step": 248111, "epoch": 1476} {"train_loss": -12.063578605651855, "global_step": 248112, "epoch": 1476} {"train_loss": -11.967942237854004, "global_step": 248113, "epoch": 1476} {"train_loss": -11.88409423828125, "global_step": 248114, "epoch": 1476} {"train_loss": -12.212451934814453, "global_step": 248115, "epoch": 1476} {"train_loss": -11.947566986083984, "global_step": 248116, "epoch": 1476} {"train_loss": -11.883997917175293, "global_step": 248117, "epoch": 1476} {"train_loss": -12.040595054626465, "global_step": 248118, "epoch": 1476} {"train_loss": -11.855972290039062, "global_step": 248119, "epoch": 1476} {"train_loss": -11.855915069580078, "global_step": 248120, "epoch": 1476} {"train_loss": -11.351139068603516, "global_step": 248121, "epoch": 1476} {"train_loss": -11.543323516845703, "global_step": 248122, "epoch": 1476} {"train_loss": -12.039931297302246, "global_step": 248123, "epoch": 1476} {"train_loss": -11.633435249328613, "global_step": 248124, "epoch": 1476} {"train_loss": -11.214607238769531, "global_step": 248125, "epoch": 1476} {"train_loss": -11.547894477844238, "global_step": 248126, "epoch": 1476} {"train_loss": -12.215763092041016, "global_step": 248127, "epoch": 1476} {"train_loss": -11.761425971984863, "global_step": 248128, "epoch": 1476} {"train_loss": -11.894427299499512, "global_step": 248129, "epoch": 1476} {"train_loss": -12.129667282104492, "global_step": 248130, "epoch": 1476} {"train_loss": -11.979881286621094, "global_step": 248131, "epoch": 1476} {"train_loss": -11.954164505004883, "global_step": 248132, "epoch": 1476} {"train_loss": -11.661203384399414, "global_step": 248133, "epoch": 1476} {"train_loss": -11.97298812866211, "global_step": 248134, "epoch": 1476} {"train_loss": -11.278748793261391, "global_step": 248135, "epoch": 1476, "val_loss": 260403.671875} {"train_loss": -11.988061904907227, "global_step": 248136, "epoch": 1477} {"train_loss": -11.80702018737793, "global_step": 248137, "epoch": 1477} {"train_loss": -11.85112190246582, "global_step": 248138, "epoch": 1477} {"train_loss": -12.189289093017578, "global_step": 248139, "epoch": 1477} {"train_loss": -11.736246109008789, "global_step": 248140, "epoch": 1477} {"train_loss": -12.042939186096191, "global_step": 248141, "epoch": 1477} {"train_loss": -11.992342948913574, "global_step": 248142, "epoch": 1477} {"train_loss": -11.725295066833496, "global_step": 248143, "epoch": 1477} {"train_loss": -11.133343696594238, "global_step": 248144, "epoch": 1477} {"train_loss": -11.255905151367188, "global_step": 248145, "epoch": 1477} {"train_loss": -11.585126876831055, "global_step": 248146, "epoch": 1477} {"train_loss": -11.773384094238281, "global_step": 248147, "epoch": 1477} {"train_loss": -10.914738655090332, "global_step": 248148, "epoch": 1477} {"train_loss": -10.961880683898926, "global_step": 248149, "epoch": 1477} {"train_loss": -11.060308456420898, "global_step": 248150, "epoch": 1477} {"train_loss": -8.568191528320312, "global_step": 248151, "epoch": 1477} {"train_loss": -8.445577621459961, "global_step": 248152, "epoch": 1477} {"train_loss": -8.976015090942383, "global_step": 248153, "epoch": 1477} {"train_loss": -11.399004936218262, "global_step": 248154, "epoch": 1477} {"train_loss": -9.137588500976562, "global_step": 248155, "epoch": 1477} {"train_loss": -11.071937561035156, "global_step": 248156, "epoch": 1477} {"train_loss": -10.542197227478027, "global_step": 248157, "epoch": 1477} {"train_loss": -10.528360366821289, "global_step": 248158, "epoch": 1477} {"train_loss": -10.860963821411133, "global_step": 248159, "epoch": 1477} {"train_loss": -9.906010627746582, "global_step": 248160, "epoch": 1477} {"train_loss": -11.023698806762695, "global_step": 248161, "epoch": 1477} {"train_loss": -11.069805145263672, "global_step": 248162, "epoch": 1477} {"train_loss": -11.37335205078125, "global_step": 248163, "epoch": 1477} {"train_loss": -10.966432571411133, "global_step": 248164, "epoch": 1477} {"train_loss": -10.706949234008789, "global_step": 248165, "epoch": 1477} {"train_loss": -11.376571655273438, "global_step": 248166, "epoch": 1477} {"train_loss": -10.909263610839844, "global_step": 248167, "epoch": 1477} {"train_loss": -11.66006088256836, "global_step": 248168, "epoch": 1477} {"train_loss": -10.752248764038086, "global_step": 248169, "epoch": 1477} {"train_loss": -11.498855590820312, "global_step": 248170, "epoch": 1477} {"train_loss": -11.90662956237793, "global_step": 248171, "epoch": 1477} {"train_loss": -11.06223201751709, "global_step": 248172, "epoch": 1477} {"train_loss": -11.335018157958984, "global_step": 248173, "epoch": 1477} {"train_loss": -11.818747520446777, "global_step": 248174, "epoch": 1477} {"train_loss": -11.176974296569824, "global_step": 248175, "epoch": 1477} {"train_loss": -11.209932327270508, "global_step": 248176, "epoch": 1477} {"train_loss": -11.451566696166992, "global_step": 248177, "epoch": 1477} {"train_loss": -11.495838165283203, "global_step": 248178, "epoch": 1477} {"train_loss": -11.682832717895508, "global_step": 248179, "epoch": 1477} {"train_loss": -11.600017547607422, "global_step": 248180, "epoch": 1477} {"train_loss": -11.473094940185547, "global_step": 248181, "epoch": 1477} {"train_loss": -11.866660118103027, "global_step": 248182, "epoch": 1477} {"train_loss": -11.69688892364502, "global_step": 248183, "epoch": 1477} {"train_loss": -11.577736854553223, "global_step": 248184, "epoch": 1477} {"train_loss": -11.452454566955566, "global_step": 248185, "epoch": 1477} {"train_loss": -11.807106018066406, "global_step": 248186, "epoch": 1477} {"train_loss": -11.479459762573242, "global_step": 248187, "epoch": 1477} {"train_loss": -11.499719619750977, "global_step": 248188, "epoch": 1477} {"train_loss": -11.122369766235352, "global_step": 248189, "epoch": 1477} {"train_loss": -11.677380561828613, "global_step": 248190, "epoch": 1477} {"train_loss": -11.352457046508789, "global_step": 248191, "epoch": 1477} {"train_loss": -11.615528106689453, "global_step": 248192, "epoch": 1477} {"train_loss": -11.563705444335938, "global_step": 248193, "epoch": 1477} {"train_loss": -11.295991897583008, "global_step": 248194, "epoch": 1477} {"train_loss": -11.681562423706055, "global_step": 248195, "epoch": 1477} {"train_loss": -11.555013656616211, "global_step": 248196, "epoch": 1477} {"train_loss": -11.920193672180176, "global_step": 248197, "epoch": 1477} {"train_loss": -11.671384811401367, "global_step": 248198, "epoch": 1477} {"train_loss": -11.819635391235352, "global_step": 248199, "epoch": 1477} {"train_loss": -11.695281982421875, "global_step": 248200, "epoch": 1477} {"train_loss": -11.699979782104492, "global_step": 248201, "epoch": 1477} {"train_loss": -11.70449447631836, "global_step": 248202, "epoch": 1477} {"train_loss": -11.822729110717773, "global_step": 248203, "epoch": 1477} {"train_loss": -11.767410278320312, "global_step": 248204, "epoch": 1477} {"train_loss": -11.510318756103516, "global_step": 248205, "epoch": 1477} {"train_loss": -11.52256965637207, "global_step": 248206, "epoch": 1477} {"train_loss": -11.577580451965332, "global_step": 248207, "epoch": 1477} {"train_loss": -12.019247055053711, "global_step": 248208, "epoch": 1477} {"train_loss": -11.786373138427734, "global_step": 248209, "epoch": 1477} {"train_loss": -11.793219566345215, "global_step": 248210, "epoch": 1477} {"train_loss": -11.963640213012695, "global_step": 248211, "epoch": 1477} {"train_loss": -11.906432151794434, "global_step": 248212, "epoch": 1477} {"train_loss": -11.904541015625, "global_step": 248213, "epoch": 1477} {"train_loss": -11.610766410827637, "global_step": 248214, "epoch": 1477} {"train_loss": -11.597766876220703, "global_step": 248215, "epoch": 1477} {"train_loss": -11.960678100585938, "global_step": 248216, "epoch": 1477} {"train_loss": -11.638423919677734, "global_step": 248217, "epoch": 1477} {"train_loss": -11.87527084350586, "global_step": 248218, "epoch": 1477} {"train_loss": -11.980899810791016, "global_step": 248219, "epoch": 1477} {"train_loss": -11.912468910217285, "global_step": 248220, "epoch": 1477} {"train_loss": -11.93629264831543, "global_step": 248221, "epoch": 1477} {"train_loss": -11.799558639526367, "global_step": 248222, "epoch": 1477} {"train_loss": -11.919075012207031, "global_step": 248223, "epoch": 1477} {"train_loss": -12.006388664245605, "global_step": 248224, "epoch": 1477} {"train_loss": -11.810649871826172, "global_step": 248225, "epoch": 1477} {"train_loss": -11.984551429748535, "global_step": 248226, "epoch": 1477} {"train_loss": -11.96257209777832, "global_step": 248227, "epoch": 1477} {"train_loss": -11.722661018371582, "global_step": 248228, "epoch": 1477} {"train_loss": -12.054298400878906, "global_step": 248229, "epoch": 1477} {"train_loss": -11.733792304992676, "global_step": 248230, "epoch": 1477} {"train_loss": -11.29902172088623, "global_step": 248231, "epoch": 1477} {"train_loss": -11.981189727783203, "global_step": 248232, "epoch": 1477} {"train_loss": -11.751479148864746, "global_step": 248233, "epoch": 1477} {"train_loss": -11.86400032043457, "global_step": 248234, "epoch": 1477} {"train_loss": -11.873830795288086, "global_step": 248235, "epoch": 1477} {"train_loss": -11.401987075805664, "global_step": 248236, "epoch": 1477} {"train_loss": -11.592294692993164, "global_step": 248237, "epoch": 1477} {"train_loss": -11.326517105102539, "global_step": 248238, "epoch": 1477} {"train_loss": -11.85812759399414, "global_step": 248239, "epoch": 1477} {"train_loss": -11.907215118408203, "global_step": 248240, "epoch": 1477} {"train_loss": -10.777246475219727, "global_step": 248241, "epoch": 1477} {"train_loss": -11.489385604858398, "global_step": 248242, "epoch": 1477} {"train_loss": -10.584709167480469, "global_step": 248243, "epoch": 1477} {"train_loss": -11.162166595458984, "global_step": 248244, "epoch": 1477} {"train_loss": -9.842364311218262, "global_step": 248245, "epoch": 1477} {"train_loss": -10.965970993041992, "global_step": 248246, "epoch": 1477} {"train_loss": -10.837570190429688, "global_step": 248247, "epoch": 1477} {"train_loss": -10.066675186157227, "global_step": 248248, "epoch": 1477} {"train_loss": -10.303045272827148, "global_step": 248249, "epoch": 1477} {"train_loss": -11.03915786743164, "global_step": 248250, "epoch": 1477} {"train_loss": -9.86883544921875, "global_step": 248251, "epoch": 1477} {"train_loss": -11.375107765197754, "global_step": 248252, "epoch": 1477} {"train_loss": -10.805246353149414, "global_step": 248253, "epoch": 1477} {"train_loss": -11.003817558288574, "global_step": 248254, "epoch": 1477} {"train_loss": -11.226859092712402, "global_step": 248255, "epoch": 1477} {"train_loss": -10.817957878112793, "global_step": 248256, "epoch": 1477} {"train_loss": -10.851844787597656, "global_step": 248257, "epoch": 1477} {"train_loss": -10.508843421936035, "global_step": 248258, "epoch": 1477} {"train_loss": -11.279462814331055, "global_step": 248259, "epoch": 1477} {"train_loss": -11.08078384399414, "global_step": 248260, "epoch": 1477} {"train_loss": -11.102092742919922, "global_step": 248261, "epoch": 1477} {"train_loss": -10.740899085998535, "global_step": 248262, "epoch": 1477} {"train_loss": -11.08896541595459, "global_step": 248263, "epoch": 1477} {"train_loss": -10.795877456665039, "global_step": 248264, "epoch": 1477} {"train_loss": -11.474672317504883, "global_step": 248265, "epoch": 1477} {"train_loss": -11.069059371948242, "global_step": 248266, "epoch": 1477} {"train_loss": -11.482311248779297, "global_step": 248267, "epoch": 1477} {"train_loss": -11.253816604614258, "global_step": 248268, "epoch": 1477} {"train_loss": -11.55123233795166, "global_step": 248269, "epoch": 1477} {"train_loss": -10.928021430969238, "global_step": 248270, "epoch": 1477} {"train_loss": -11.476634979248047, "global_step": 248271, "epoch": 1477} {"train_loss": -11.20952033996582, "global_step": 248272, "epoch": 1477} {"train_loss": -11.564111709594727, "global_step": 248273, "epoch": 1477} {"train_loss": -11.631383895874023, "global_step": 248274, "epoch": 1477} {"train_loss": -11.393299102783203, "global_step": 248275, "epoch": 1477} {"train_loss": -11.61119270324707, "global_step": 248276, "epoch": 1477} {"train_loss": -11.419161796569824, "global_step": 248277, "epoch": 1477} {"train_loss": -11.132404327392578, "global_step": 248278, "epoch": 1477} {"train_loss": -11.58775520324707, "global_step": 248279, "epoch": 1477} {"train_loss": -11.022468566894531, "global_step": 248280, "epoch": 1477} {"train_loss": -11.461216926574707, "global_step": 248281, "epoch": 1477} {"train_loss": -11.154379844665527, "global_step": 248282, "epoch": 1477} {"train_loss": -10.983760833740234, "global_step": 248283, "epoch": 1477} {"train_loss": -11.641756057739258, "global_step": 248284, "epoch": 1477} {"train_loss": -11.370028495788574, "global_step": 248285, "epoch": 1477} {"train_loss": -11.380898475646973, "global_step": 248286, "epoch": 1477} {"train_loss": -11.496593475341797, "global_step": 248287, "epoch": 1477} {"train_loss": -11.304839134216309, "global_step": 248288, "epoch": 1477} {"train_loss": -11.674673080444336, "global_step": 248289, "epoch": 1477} {"train_loss": -11.156475067138672, "global_step": 248290, "epoch": 1477} {"train_loss": -11.522176742553711, "global_step": 248291, "epoch": 1477} {"train_loss": -10.869239807128906, "global_step": 248292, "epoch": 1477} {"train_loss": -11.58376693725586, "global_step": 248293, "epoch": 1477} {"train_loss": -11.47006607055664, "global_step": 248294, "epoch": 1477} {"train_loss": -11.515334129333496, "global_step": 248295, "epoch": 1477} {"train_loss": -11.589385986328125, "global_step": 248296, "epoch": 1477} {"train_loss": -11.57310962677002, "global_step": 248297, "epoch": 1477} {"train_loss": -11.656013488769531, "global_step": 248298, "epoch": 1477} {"train_loss": -11.56562614440918, "global_step": 248299, "epoch": 1477} {"train_loss": -11.815725326538086, "global_step": 248300, "epoch": 1477} {"train_loss": -11.435161590576172, "global_step": 248301, "epoch": 1477} {"train_loss": -11.879834175109863, "global_step": 248302, "epoch": 1477} {"train_loss": -11.35537999016898, "global_step": 248303, "epoch": 1477, "val_loss": 263824.3125} {"train_loss": -11.694432258605957, "global_step": 248304, "epoch": 1478} {"train_loss": -11.53451156616211, "global_step": 248305, "epoch": 1478} {"train_loss": -11.918198585510254, "global_step": 248306, "epoch": 1478} {"train_loss": -11.441686630249023, "global_step": 248307, "epoch": 1478} {"train_loss": -11.651247024536133, "global_step": 248308, "epoch": 1478} {"train_loss": -11.580698013305664, "global_step": 248309, "epoch": 1478} {"train_loss": -11.787520408630371, "global_step": 248310, "epoch": 1478} {"train_loss": -11.687921524047852, "global_step": 248311, "epoch": 1478} {"train_loss": -12.008180618286133, "global_step": 248312, "epoch": 1478} {"train_loss": -11.509870529174805, "global_step": 248313, "epoch": 1478} {"train_loss": -11.878297805786133, "global_step": 248314, "epoch": 1478} {"train_loss": -11.879749298095703, "global_step": 248315, "epoch": 1478} {"train_loss": -11.906512260437012, "global_step": 248316, "epoch": 1478} {"train_loss": -12.075196266174316, "global_step": 248317, "epoch": 1478} {"train_loss": -11.869630813598633, "global_step": 248318, "epoch": 1478} {"train_loss": -11.997249603271484, "global_step": 248319, "epoch": 1478} {"train_loss": -11.826544761657715, "global_step": 248320, "epoch": 1478} {"train_loss": -11.98554801940918, "global_step": 248321, "epoch": 1478} {"train_loss": -11.74193286895752, "global_step": 248322, "epoch": 1478} {"train_loss": -11.901941299438477, "global_step": 248323, "epoch": 1478} {"train_loss": -12.045461654663086, "global_step": 248324, "epoch": 1478} {"train_loss": -11.864831924438477, "global_step": 248325, "epoch": 1478} {"train_loss": -11.901391983032227, "global_step": 248326, "epoch": 1478} {"train_loss": -11.824356079101562, "global_step": 248327, "epoch": 1478} {"train_loss": -12.106616973876953, "global_step": 248328, "epoch": 1478} {"train_loss": -11.948151588439941, "global_step": 248329, "epoch": 1478} {"train_loss": -12.090958595275879, "global_step": 248330, "epoch": 1478} {"train_loss": -12.020917892456055, "global_step": 248331, "epoch": 1478} {"train_loss": -11.902225494384766, "global_step": 248332, "epoch": 1478} {"train_loss": -11.987466812133789, "global_step": 248333, "epoch": 1478} {"train_loss": -12.06845474243164, "global_step": 248334, "epoch": 1478} {"train_loss": -11.808222770690918, "global_step": 248335, "epoch": 1478} {"train_loss": -12.242982864379883, "global_step": 248336, "epoch": 1478} {"train_loss": -11.904424667358398, "global_step": 248337, "epoch": 1478} {"train_loss": -12.13436508178711, "global_step": 248338, "epoch": 1478} {"train_loss": -11.963602066040039, "global_step": 248339, "epoch": 1478} {"train_loss": -11.9609375, "global_step": 248340, "epoch": 1478} {"train_loss": -11.776786804199219, "global_step": 248341, "epoch": 1478} {"train_loss": -12.170761108398438, "global_step": 248342, "epoch": 1478} {"train_loss": -11.95876693725586, "global_step": 248343, "epoch": 1478} {"train_loss": -11.946222305297852, "global_step": 248344, "epoch": 1478} {"train_loss": -11.898921966552734, "global_step": 248345, "epoch": 1478} {"train_loss": -11.930232048034668, "global_step": 248346, "epoch": 1478} {"train_loss": -11.977811813354492, "global_step": 248347, "epoch": 1478} {"train_loss": -11.562110900878906, "global_step": 248348, "epoch": 1478} {"train_loss": -12.057626724243164, "global_step": 248349, "epoch": 1478} {"train_loss": -11.714978218078613, "global_step": 248350, "epoch": 1478} {"train_loss": -12.023113250732422, "global_step": 248351, "epoch": 1478} {"train_loss": -11.812296867370605, "global_step": 248352, "epoch": 1478} {"train_loss": -11.44263744354248, "global_step": 248353, "epoch": 1478} {"train_loss": -11.925353050231934, "global_step": 248354, "epoch": 1478} {"train_loss": -11.926148414611816, "global_step": 248355, "epoch": 1478} {"train_loss": -11.254905700683594, "global_step": 248356, "epoch": 1478} {"train_loss": -12.100255966186523, "global_step": 248357, "epoch": 1478} {"train_loss": -11.900598526000977, "global_step": 248358, "epoch": 1478} {"train_loss": -11.468650817871094, "global_step": 248359, "epoch": 1478} {"train_loss": -11.599907875061035, "global_step": 248360, "epoch": 1478} {"train_loss": -11.581497192382812, "global_step": 248361, "epoch": 1478} {"train_loss": -9.884613990783691, "global_step": 248362, "epoch": 1478} {"train_loss": -10.551165580749512, "global_step": 248363, "epoch": 1478} {"train_loss": -11.28390884399414, "global_step": 248364, "epoch": 1478} {"train_loss": -8.523755073547363, "global_step": 248365, "epoch": 1478} {"train_loss": -9.220220565795898, "global_step": 248366, "epoch": 1478} {"train_loss": -10.011518478393555, "global_step": 248367, "epoch": 1478} {"train_loss": -10.201590538024902, "global_step": 248368, "epoch": 1478} {"train_loss": -11.181805610656738, "global_step": 248369, "epoch": 1478} {"train_loss": -10.635356903076172, "global_step": 248370, "epoch": 1478} {"train_loss": -11.329248428344727, "global_step": 248371, "epoch": 1478} {"train_loss": -10.797065734863281, "global_step": 248372, "epoch": 1478} {"train_loss": -10.436595916748047, "global_step": 248373, "epoch": 1478} {"train_loss": -11.503621101379395, "global_step": 248374, "epoch": 1478} {"train_loss": -10.63980484008789, "global_step": 248375, "epoch": 1478} {"train_loss": -11.605167388916016, "global_step": 248376, "epoch": 1478} {"train_loss": -9.797561645507812, "global_step": 248377, "epoch": 1478} {"train_loss": -10.712788581848145, "global_step": 248378, "epoch": 1478} {"train_loss": -10.299283981323242, "global_step": 248379, "epoch": 1478} {"train_loss": -10.505531311035156, "global_step": 248380, "epoch": 1478} {"train_loss": -10.768611907958984, "global_step": 248381, "epoch": 1478} {"train_loss": -10.618240356445312, "global_step": 248382, "epoch": 1478} {"train_loss": -11.379963874816895, "global_step": 248383, "epoch": 1478} {"train_loss": -11.06131649017334, "global_step": 248384, "epoch": 1478} {"train_loss": -10.888627052307129, "global_step": 248385, "epoch": 1478} {"train_loss": -11.310009002685547, "global_step": 248386, "epoch": 1478} {"train_loss": -11.619112014770508, "global_step": 248387, "epoch": 1478} {"train_loss": -11.486723899841309, "global_step": 248388, "epoch": 1478} {"train_loss": -11.736605644226074, "global_step": 248389, "epoch": 1478} {"train_loss": -11.618525505065918, "global_step": 248390, "epoch": 1478} {"train_loss": -11.774847030639648, "global_step": 248391, "epoch": 1478} {"train_loss": -11.724347114562988, "global_step": 248392, "epoch": 1478} {"train_loss": -11.574087142944336, "global_step": 248393, "epoch": 1478} {"train_loss": -11.72003173828125, "global_step": 248394, "epoch": 1478} {"train_loss": -11.665250778198242, "global_step": 248395, "epoch": 1478} {"train_loss": -11.700984954833984, "global_step": 248396, "epoch": 1478} {"train_loss": -11.841410636901855, "global_step": 248397, "epoch": 1478} {"train_loss": -11.569361686706543, "global_step": 248398, "epoch": 1478} {"train_loss": -11.898365020751953, "global_step": 248399, "epoch": 1478} {"train_loss": -11.729043960571289, "global_step": 248400, "epoch": 1478} {"train_loss": -11.873607635498047, "global_step": 248401, "epoch": 1478} {"train_loss": -11.776515007019043, "global_step": 248402, "epoch": 1478} {"train_loss": -11.883440017700195, "global_step": 248403, "epoch": 1478} {"train_loss": -11.746877670288086, "global_step": 248404, "epoch": 1478} {"train_loss": -11.977704048156738, "global_step": 248405, "epoch": 1478} {"train_loss": -11.767001152038574, "global_step": 248406, "epoch": 1478} {"train_loss": -11.789571762084961, "global_step": 248407, "epoch": 1478} {"train_loss": -11.974141120910645, "global_step": 248408, "epoch": 1478} {"train_loss": -11.746378898620605, "global_step": 248409, "epoch": 1478} {"train_loss": -12.038044929504395, "global_step": 248410, "epoch": 1478} {"train_loss": -11.870322227478027, "global_step": 248411, "epoch": 1478} {"train_loss": -11.859762191772461, "global_step": 248412, "epoch": 1478} {"train_loss": -11.713623046875, "global_step": 248413, "epoch": 1478} {"train_loss": -11.804621696472168, "global_step": 248414, "epoch": 1478} {"train_loss": -11.928760528564453, "global_step": 248415, "epoch": 1478} {"train_loss": -11.964344024658203, "global_step": 248416, "epoch": 1478} {"train_loss": -12.137001991271973, "global_step": 248417, "epoch": 1478} {"train_loss": -11.883739471435547, "global_step": 248418, "epoch": 1478} {"train_loss": -12.066045761108398, "global_step": 248419, "epoch": 1478} {"train_loss": -12.188751220703125, "global_step": 248420, "epoch": 1478} {"train_loss": -11.820862770080566, "global_step": 248421, "epoch": 1478} {"train_loss": -11.918493270874023, "global_step": 248422, "epoch": 1478} {"train_loss": -11.943126678466797, "global_step": 248423, "epoch": 1478} {"train_loss": -12.057369232177734, "global_step": 248424, "epoch": 1478} {"train_loss": -11.94413948059082, "global_step": 248425, "epoch": 1478} {"train_loss": -12.16999626159668, "global_step": 248426, "epoch": 1478} {"train_loss": -12.004270553588867, "global_step": 248427, "epoch": 1478} {"train_loss": -12.132161140441895, "global_step": 248428, "epoch": 1478} {"train_loss": -12.231552124023438, "global_step": 248429, "epoch": 1478} {"train_loss": -12.09115219116211, "global_step": 248430, "epoch": 1478} {"train_loss": -11.973054885864258, "global_step": 248431, "epoch": 1478} {"train_loss": -12.090208053588867, "global_step": 248432, "epoch": 1478} {"train_loss": -12.161545753479004, "global_step": 248433, "epoch": 1478} {"train_loss": -12.170299530029297, "global_step": 248434, "epoch": 1478} {"train_loss": -12.030356407165527, "global_step": 248435, "epoch": 1478} {"train_loss": -12.039419174194336, "global_step": 248436, "epoch": 1478} {"train_loss": -12.072030067443848, "global_step": 248437, "epoch": 1478} {"train_loss": -12.096981048583984, "global_step": 248438, "epoch": 1478} {"train_loss": -12.098363876342773, "global_step": 248439, "epoch": 1478} {"train_loss": -12.342872619628906, "global_step": 248440, "epoch": 1478} {"train_loss": -12.00666618347168, "global_step": 248441, "epoch": 1478} {"train_loss": -12.242401123046875, "global_step": 248442, "epoch": 1478} {"train_loss": -12.131402969360352, "global_step": 248443, "epoch": 1478} {"train_loss": -11.329633712768555, "global_step": 248444, "epoch": 1478} {"train_loss": -10.163080215454102, "global_step": 248445, "epoch": 1478} {"train_loss": -11.083751678466797, "global_step": 248446, "epoch": 1478} {"train_loss": -11.890241622924805, "global_step": 248447, "epoch": 1478} {"train_loss": -11.312762260437012, "global_step": 248448, "epoch": 1478} {"train_loss": -11.688201904296875, "global_step": 248449, "epoch": 1478} {"train_loss": -11.506583213806152, "global_step": 248450, "epoch": 1478} {"train_loss": -11.531318664550781, "global_step": 248451, "epoch": 1478} {"train_loss": -11.556184768676758, "global_step": 248452, "epoch": 1478} {"train_loss": -11.683698654174805, "global_step": 248453, "epoch": 1478} {"train_loss": -11.045815467834473, "global_step": 248454, "epoch": 1478} {"train_loss": -11.713842391967773, "global_step": 248455, "epoch": 1478} {"train_loss": -11.898677825927734, "global_step": 248456, "epoch": 1478} {"train_loss": -11.776209831237793, "global_step": 248457, "epoch": 1478} {"train_loss": -11.474231719970703, "global_step": 248458, "epoch": 1478} {"train_loss": -11.984990119934082, "global_step": 248459, "epoch": 1478} {"train_loss": -11.655264854431152, "global_step": 248460, "epoch": 1478} {"train_loss": -11.691146850585938, "global_step": 248461, "epoch": 1478} {"train_loss": -11.556489944458008, "global_step": 248462, "epoch": 1478} {"train_loss": -11.90680980682373, "global_step": 248463, "epoch": 1478} {"train_loss": -12.055764198303223, "global_step": 248464, "epoch": 1478} {"train_loss": -11.56679916381836, "global_step": 248465, "epoch": 1478} {"train_loss": -12.013571739196777, "global_step": 248466, "epoch": 1478} {"train_loss": -12.109092712402344, "global_step": 248467, "epoch": 1478} {"train_loss": -11.897102355957031, "global_step": 248468, "epoch": 1478} {"train_loss": -11.843435287475586, "global_step": 248469, "epoch": 1478} {"train_loss": -11.923416137695312, "global_step": 248470, "epoch": 1478} {"train_loss": -11.65484527179173, "global_step": 248471, "epoch": 1478, "val_loss": 266147.8125} {"train_loss": -11.592255592346191, "global_step": 248472, "epoch": 1479} {"train_loss": -11.74545669555664, "global_step": 248473, "epoch": 1479} {"train_loss": -11.742025375366211, "global_step": 248474, "epoch": 1479} {"train_loss": -11.736457824707031, "global_step": 248475, "epoch": 1479} {"train_loss": -11.169410705566406, "global_step": 248476, "epoch": 1479} {"train_loss": -11.51251220703125, "global_step": 248477, "epoch": 1479} {"train_loss": -11.712491989135742, "global_step": 248478, "epoch": 1479} {"train_loss": -11.185896873474121, "global_step": 248479, "epoch": 1479} {"train_loss": -11.114002227783203, "global_step": 248480, "epoch": 1479} {"train_loss": -11.583162307739258, "global_step": 248481, "epoch": 1479} {"train_loss": -10.76412296295166, "global_step": 248482, "epoch": 1479} {"train_loss": -11.143803596496582, "global_step": 248483, "epoch": 1479} {"train_loss": -11.495229721069336, "global_step": 248484, "epoch": 1479} {"train_loss": -9.821727752685547, "global_step": 248485, "epoch": 1479} {"train_loss": -11.115324020385742, "global_step": 248486, "epoch": 1479} {"train_loss": -10.304632186889648, "global_step": 248487, "epoch": 1479} {"train_loss": -10.085289001464844, "global_step": 248488, "epoch": 1479} {"train_loss": -10.836233139038086, "global_step": 248489, "epoch": 1479} {"train_loss": -10.69205379486084, "global_step": 248490, "epoch": 1479} {"train_loss": -10.384271621704102, "global_step": 248491, "epoch": 1479} {"train_loss": -11.422623634338379, "global_step": 248492, "epoch": 1479} {"train_loss": -10.656599044799805, "global_step": 248493, "epoch": 1479} {"train_loss": -11.41997241973877, "global_step": 248494, "epoch": 1479} {"train_loss": -10.330892562866211, "global_step": 248495, "epoch": 1479} {"train_loss": -11.364994049072266, "global_step": 248496, "epoch": 1479} {"train_loss": -10.236948013305664, "global_step": 248497, "epoch": 1479} {"train_loss": -10.885090827941895, "global_step": 248498, "epoch": 1479} {"train_loss": -11.20595645904541, "global_step": 248499, "epoch": 1479} {"train_loss": -10.739012718200684, "global_step": 248500, "epoch": 1479} {"train_loss": -11.301847457885742, "global_step": 248501, "epoch": 1479} {"train_loss": -10.02730941772461, "global_step": 248502, "epoch": 1479} {"train_loss": -11.164007186889648, "global_step": 248503, "epoch": 1479} {"train_loss": -10.949556350708008, "global_step": 248504, "epoch": 1479} {"train_loss": -9.801673889160156, "global_step": 248505, "epoch": 1479} {"train_loss": -11.483514785766602, "global_step": 248506, "epoch": 1479} {"train_loss": -10.366222381591797, "global_step": 248507, "epoch": 1479} {"train_loss": -10.93483829498291, "global_step": 248508, "epoch": 1479} {"train_loss": -10.758833885192871, "global_step": 248509, "epoch": 1479} {"train_loss": -10.880472183227539, "global_step": 248510, "epoch": 1479} {"train_loss": -11.260526657104492, "global_step": 248511, "epoch": 1479} {"train_loss": -11.025369644165039, "global_step": 248512, "epoch": 1479} {"train_loss": -11.166997909545898, "global_step": 248513, "epoch": 1479} {"train_loss": -11.272052764892578, "global_step": 248514, "epoch": 1479} {"train_loss": -11.079706192016602, "global_step": 248515, "epoch": 1479} {"train_loss": -11.230695724487305, "global_step": 248516, "epoch": 1479} {"train_loss": -11.562036514282227, "global_step": 248517, "epoch": 1479} {"train_loss": -11.220863342285156, "global_step": 248518, "epoch": 1479} {"train_loss": -11.345892906188965, "global_step": 248519, "epoch": 1479} {"train_loss": -11.200891494750977, "global_step": 248520, "epoch": 1479} {"train_loss": -10.809799194335938, "global_step": 248521, "epoch": 1479} {"train_loss": -11.041025161743164, "global_step": 248522, "epoch": 1479} {"train_loss": -10.925504684448242, "global_step": 248523, "epoch": 1479} {"train_loss": -11.173324584960938, "global_step": 248524, "epoch": 1479} {"train_loss": -11.277379989624023, "global_step": 248525, "epoch": 1479} {"train_loss": -11.230043411254883, "global_step": 248526, "epoch": 1479} {"train_loss": -11.294683456420898, "global_step": 248527, "epoch": 1479} {"train_loss": -11.088869094848633, "global_step": 248528, "epoch": 1479} {"train_loss": -11.555052757263184, "global_step": 248529, "epoch": 1479} {"train_loss": -11.444070816040039, "global_step": 248530, "epoch": 1479} {"train_loss": -11.500239372253418, "global_step": 248531, "epoch": 1479} {"train_loss": -11.642412185668945, "global_step": 248532, "epoch": 1479} {"train_loss": -11.55368423461914, "global_step": 248533, "epoch": 1479} {"train_loss": -11.180079460144043, "global_step": 248534, "epoch": 1479} {"train_loss": -11.816510200500488, "global_step": 248535, "epoch": 1479} {"train_loss": -11.236837387084961, "global_step": 248536, "epoch": 1479} {"train_loss": -11.796276092529297, "global_step": 248537, "epoch": 1479} {"train_loss": -11.68801212310791, "global_step": 248538, "epoch": 1479} {"train_loss": -11.735507011413574, "global_step": 248539, "epoch": 1479} {"train_loss": -11.460010528564453, "global_step": 248540, "epoch": 1479} {"train_loss": -11.692212104797363, "global_step": 248541, "epoch": 1479} {"train_loss": -11.377281188964844, "global_step": 248542, "epoch": 1479} {"train_loss": -11.932491302490234, "global_step": 248543, "epoch": 1479} {"train_loss": -11.686967849731445, "global_step": 248544, "epoch": 1479} {"train_loss": -11.780491828918457, "global_step": 248545, "epoch": 1479} {"train_loss": -11.876235961914062, "global_step": 248546, "epoch": 1479} {"train_loss": -11.726588249206543, "global_step": 248547, "epoch": 1479} {"train_loss": -11.774358749389648, "global_step": 248548, "epoch": 1479} {"train_loss": -11.769767761230469, "global_step": 248549, "epoch": 1479} {"train_loss": -11.349201202392578, "global_step": 248550, "epoch": 1479} {"train_loss": -12.076437950134277, "global_step": 248551, "epoch": 1479} {"train_loss": -11.6549711227417, "global_step": 248552, "epoch": 1479} {"train_loss": -11.811604499816895, "global_step": 248553, "epoch": 1479} {"train_loss": -11.831009864807129, "global_step": 248554, "epoch": 1479} {"train_loss": -11.545042991638184, "global_step": 248555, "epoch": 1479} {"train_loss": -12.009450912475586, "global_step": 248556, "epoch": 1479} {"train_loss": -11.556774139404297, "global_step": 248557, "epoch": 1479} {"train_loss": -11.90822982788086, "global_step": 248558, "epoch": 1479} {"train_loss": -11.729732513427734, "global_step": 248559, "epoch": 1479} {"train_loss": -11.947105407714844, "global_step": 248560, "epoch": 1479} {"train_loss": -11.655595779418945, "global_step": 248561, "epoch": 1479} {"train_loss": -11.911197662353516, "global_step": 248562, "epoch": 1479} {"train_loss": -11.81840991973877, "global_step": 248563, "epoch": 1479} {"train_loss": -11.660274505615234, "global_step": 248564, "epoch": 1479} {"train_loss": -11.67611312866211, "global_step": 248565, "epoch": 1479} {"train_loss": -11.572357177734375, "global_step": 248566, "epoch": 1479} {"train_loss": -11.954425811767578, "global_step": 248567, "epoch": 1479} {"train_loss": -11.77268123626709, "global_step": 248568, "epoch": 1479} {"train_loss": -11.904984474182129, "global_step": 248569, "epoch": 1479} {"train_loss": -12.016451835632324, "global_step": 248570, "epoch": 1479} {"train_loss": -11.974249839782715, "global_step": 248571, "epoch": 1479} {"train_loss": -11.579300880432129, "global_step": 248572, "epoch": 1479} {"train_loss": -11.961219787597656, "global_step": 248573, "epoch": 1479} {"train_loss": -11.717855453491211, "global_step": 248574, "epoch": 1479} {"train_loss": -11.864633560180664, "global_step": 248575, "epoch": 1479} {"train_loss": -11.90083122253418, "global_step": 248576, "epoch": 1479} {"train_loss": -11.638526916503906, "global_step": 248577, "epoch": 1479} {"train_loss": -12.197578430175781, "global_step": 248578, "epoch": 1479} {"train_loss": -11.639551162719727, "global_step": 248579, "epoch": 1479} {"train_loss": -12.007403373718262, "global_step": 248580, "epoch": 1479} {"train_loss": -11.573531150817871, "global_step": 248581, "epoch": 1479} {"train_loss": -11.792671203613281, "global_step": 248582, "epoch": 1479} {"train_loss": -11.696516036987305, "global_step": 248583, "epoch": 1479} {"train_loss": -11.811500549316406, "global_step": 248584, "epoch": 1479} {"train_loss": -11.964628219604492, "global_step": 248585, "epoch": 1479} {"train_loss": -12.077850341796875, "global_step": 248586, "epoch": 1479} {"train_loss": -12.181085586547852, "global_step": 248587, "epoch": 1479} {"train_loss": -11.91232681274414, "global_step": 248588, "epoch": 1479} {"train_loss": -11.934672355651855, "global_step": 248589, "epoch": 1479} {"train_loss": -11.955078125, "global_step": 248590, "epoch": 1479} {"train_loss": -12.055404663085938, "global_step": 248591, "epoch": 1479} {"train_loss": -11.856979370117188, "global_step": 248592, "epoch": 1479} {"train_loss": -12.06125259399414, "global_step": 248593, "epoch": 1479} {"train_loss": -12.047527313232422, "global_step": 248594, "epoch": 1479} {"train_loss": -12.13010025024414, "global_step": 248595, "epoch": 1479} {"train_loss": -11.705451965332031, "global_step": 248596, "epoch": 1479} {"train_loss": -11.77772045135498, "global_step": 248597, "epoch": 1479} {"train_loss": -11.779584884643555, "global_step": 248598, "epoch": 1479} {"train_loss": -11.299460411071777, "global_step": 248599, "epoch": 1479} {"train_loss": -12.002554893493652, "global_step": 248600, "epoch": 1479} {"train_loss": -11.733924865722656, "global_step": 248601, "epoch": 1479} {"train_loss": -11.971735000610352, "global_step": 248602, "epoch": 1479} {"train_loss": -11.669450759887695, "global_step": 248603, "epoch": 1479} {"train_loss": -11.003572463989258, "global_step": 248604, "epoch": 1479} {"train_loss": -11.99782943725586, "global_step": 248605, "epoch": 1479} {"train_loss": -11.547285079956055, "global_step": 248606, "epoch": 1479} {"train_loss": -11.766801834106445, "global_step": 248607, "epoch": 1479} {"train_loss": -12.100272178649902, "global_step": 248608, "epoch": 1479} {"train_loss": -11.788702964782715, "global_step": 248609, "epoch": 1479} {"train_loss": -11.663187026977539, "global_step": 248610, "epoch": 1479} {"train_loss": -11.67763900756836, "global_step": 248611, "epoch": 1479} {"train_loss": -11.331399917602539, "global_step": 248612, "epoch": 1479} {"train_loss": -12.073612213134766, "global_step": 248613, "epoch": 1479} {"train_loss": -11.707551956176758, "global_step": 248614, "epoch": 1479} {"train_loss": -11.569862365722656, "global_step": 248615, "epoch": 1479} {"train_loss": -11.870172500610352, "global_step": 248616, "epoch": 1479} {"train_loss": -11.66748046875, "global_step": 248617, "epoch": 1479} {"train_loss": -11.656559944152832, "global_step": 248618, "epoch": 1479} {"train_loss": -11.976369857788086, "global_step": 248619, "epoch": 1479} {"train_loss": -11.578035354614258, "global_step": 248620, "epoch": 1479} {"train_loss": -11.998824119567871, "global_step": 248621, "epoch": 1479} {"train_loss": -11.709467887878418, "global_step": 248622, "epoch": 1479} {"train_loss": -12.0154390335083, "global_step": 248623, "epoch": 1479} {"train_loss": -11.69633960723877, "global_step": 248624, "epoch": 1479} {"train_loss": -11.697280883789062, "global_step": 248625, "epoch": 1479} {"train_loss": -11.65365219116211, "global_step": 248626, "epoch": 1479} {"train_loss": -10.725946426391602, "global_step": 248627, "epoch": 1479} {"train_loss": -10.6431303024292, "global_step": 248628, "epoch": 1479} {"train_loss": -10.838724136352539, "global_step": 248629, "epoch": 1479} {"train_loss": -10.584991455078125, "global_step": 248630, "epoch": 1479} {"train_loss": -8.818514823913574, "global_step": 248631, "epoch": 1479} {"train_loss": -11.221576690673828, "global_step": 248632, "epoch": 1479} {"train_loss": -7.115989685058594, "global_step": 248633, "epoch": 1479} {"train_loss": -8.63793659210205, "global_step": 248634, "epoch": 1479} {"train_loss": -8.305185317993164, "global_step": 248635, "epoch": 1479} {"train_loss": -10.622979164123535, "global_step": 248636, "epoch": 1479} {"train_loss": -7.3147783279418945, "global_step": 248637, "epoch": 1479} {"train_loss": -8.186300277709961, "global_step": 248638, "epoch": 1479} {"train_loss": -11.325337764762697, "global_step": 248639, "epoch": 1479, "val_loss": 264566.34375} {"train_loss": -8.161705017089844, "global_step": 248640, "epoch": 1480} {"train_loss": -9.321662902832031, "global_step": 248641, "epoch": 1480} {"train_loss": -9.142882347106934, "global_step": 248642, "epoch": 1480} {"train_loss": -7.4112749099731445, "global_step": 248643, "epoch": 1480} {"train_loss": -9.355069160461426, "global_step": 248644, "epoch": 1480} {"train_loss": -10.061574935913086, "global_step": 248645, "epoch": 1480} {"train_loss": -8.289956092834473, "global_step": 248646, "epoch": 1480} {"train_loss": -9.055289268493652, "global_step": 248647, "epoch": 1480} {"train_loss": -9.274419784545898, "global_step": 248648, "epoch": 1480} {"train_loss": -9.518476486206055, "global_step": 248649, "epoch": 1480} {"train_loss": -9.316763877868652, "global_step": 248650, "epoch": 1480} {"train_loss": -9.658405303955078, "global_step": 248651, "epoch": 1480} {"train_loss": -10.331551551818848, "global_step": 248652, "epoch": 1480} {"train_loss": -9.674198150634766, "global_step": 248653, "epoch": 1480} {"train_loss": -10.300975799560547, "global_step": 248654, "epoch": 1480} {"train_loss": -10.558633804321289, "global_step": 248655, "epoch": 1480} {"train_loss": -10.355234146118164, "global_step": 248656, "epoch": 1480} {"train_loss": -9.807184219360352, "global_step": 248657, "epoch": 1480} {"train_loss": -10.678739547729492, "global_step": 248658, "epoch": 1480} {"train_loss": -10.56090259552002, "global_step": 248659, "epoch": 1480} {"train_loss": -10.634929656982422, "global_step": 248660, "epoch": 1480} {"train_loss": -11.171010971069336, "global_step": 248661, "epoch": 1480} {"train_loss": -10.81169605255127, "global_step": 248662, "epoch": 1480} {"train_loss": -11.144891738891602, "global_step": 248663, "epoch": 1480} {"train_loss": -10.593232154846191, "global_step": 248664, "epoch": 1480} {"train_loss": -11.09221363067627, "global_step": 248665, "epoch": 1480} {"train_loss": -11.012036323547363, "global_step": 248666, "epoch": 1480} {"train_loss": -10.8477783203125, "global_step": 248667, "epoch": 1480} {"train_loss": -11.231767654418945, "global_step": 248668, "epoch": 1480} {"train_loss": -10.972455024719238, "global_step": 248669, "epoch": 1480} {"train_loss": -11.242258071899414, "global_step": 248670, "epoch": 1480} {"train_loss": -11.019174575805664, "global_step": 248671, "epoch": 1480} {"train_loss": -11.244394302368164, "global_step": 248672, "epoch": 1480} {"train_loss": -11.195999145507812, "global_step": 248673, "epoch": 1480} {"train_loss": -11.188028335571289, "global_step": 248674, "epoch": 1480} {"train_loss": -11.482001304626465, "global_step": 248675, "epoch": 1480} {"train_loss": -11.42648696899414, "global_step": 248676, "epoch": 1480} {"train_loss": -11.198554992675781, "global_step": 248677, "epoch": 1480} {"train_loss": -11.34667682647705, "global_step": 248678, "epoch": 1480} {"train_loss": -11.2386474609375, "global_step": 248679, "epoch": 1480} {"train_loss": -11.134024620056152, "global_step": 248680, "epoch": 1480} {"train_loss": -11.396482467651367, "global_step": 248681, "epoch": 1480} {"train_loss": -11.19743824005127, "global_step": 248682, "epoch": 1480} {"train_loss": -11.156378746032715, "global_step": 248683, "epoch": 1480} {"train_loss": -11.4154052734375, "global_step": 248684, "epoch": 1480} {"train_loss": -11.333403587341309, "global_step": 248685, "epoch": 1480} {"train_loss": -11.181676864624023, "global_step": 248686, "epoch": 1480} {"train_loss": -11.471332550048828, "global_step": 248687, "epoch": 1480} {"train_loss": -11.382776260375977, "global_step": 248688, "epoch": 1480} {"train_loss": -11.290724754333496, "global_step": 248689, "epoch": 1480} {"train_loss": -11.650870323181152, "global_step": 248690, "epoch": 1480} {"train_loss": -11.372138977050781, "global_step": 248691, "epoch": 1480} {"train_loss": -11.523765563964844, "global_step": 248692, "epoch": 1480} {"train_loss": -11.492470741271973, "global_step": 248693, "epoch": 1480} {"train_loss": -11.573226928710938, "global_step": 248694, "epoch": 1480} {"train_loss": -11.570938110351562, "global_step": 248695, "epoch": 1480} {"train_loss": -11.545832633972168, "global_step": 248696, "epoch": 1480} {"train_loss": -11.59571647644043, "global_step": 248697, "epoch": 1480} {"train_loss": -11.681197166442871, "global_step": 248698, "epoch": 1480} {"train_loss": -11.602945327758789, "global_step": 248699, "epoch": 1480} {"train_loss": -11.617288589477539, "global_step": 248700, "epoch": 1480} {"train_loss": -11.759132385253906, "global_step": 248701, "epoch": 1480} {"train_loss": -11.537620544433594, "global_step": 248702, "epoch": 1480} {"train_loss": -11.831491470336914, "global_step": 248703, "epoch": 1480} {"train_loss": -11.627304077148438, "global_step": 248704, "epoch": 1480} {"train_loss": -11.894021987915039, "global_step": 248705, "epoch": 1480} {"train_loss": -11.630555152893066, "global_step": 248706, "epoch": 1480} {"train_loss": -11.757719039916992, "global_step": 248707, "epoch": 1480} {"train_loss": -11.701169967651367, "global_step": 248708, "epoch": 1480} {"train_loss": -11.718997955322266, "global_step": 248709, "epoch": 1480} {"train_loss": -11.980203628540039, "global_step": 248710, "epoch": 1480} {"train_loss": -11.923389434814453, "global_step": 248711, "epoch": 1480} {"train_loss": -11.832679748535156, "global_step": 248712, "epoch": 1480} {"train_loss": -11.527523040771484, "global_step": 248713, "epoch": 1480} {"train_loss": -12.027091026306152, "global_step": 248714, "epoch": 1480} {"train_loss": -11.59592342376709, "global_step": 248715, "epoch": 1480} {"train_loss": -11.928196907043457, "global_step": 248716, "epoch": 1480} {"train_loss": -11.573408126831055, "global_step": 248717, "epoch": 1480} {"train_loss": -11.686949729919434, "global_step": 248718, "epoch": 1480} {"train_loss": -11.469185829162598, "global_step": 248719, "epoch": 1480} {"train_loss": -12.098363876342773, "global_step": 248720, "epoch": 1480} {"train_loss": -11.560563087463379, "global_step": 248721, "epoch": 1480} {"train_loss": -12.034079551696777, "global_step": 248722, "epoch": 1480} {"train_loss": -11.704578399658203, "global_step": 248723, "epoch": 1480} {"train_loss": -11.795827865600586, "global_step": 248724, "epoch": 1480} {"train_loss": -11.921704292297363, "global_step": 248725, "epoch": 1480} {"train_loss": -11.764850616455078, "global_step": 248726, "epoch": 1480} {"train_loss": -11.920162200927734, "global_step": 248727, "epoch": 1480} {"train_loss": -11.87320327758789, "global_step": 248728, "epoch": 1480} {"train_loss": -11.903181076049805, "global_step": 248729, "epoch": 1480} {"train_loss": -11.928491592407227, "global_step": 248730, "epoch": 1480} {"train_loss": -12.035873413085938, "global_step": 248731, "epoch": 1480} {"train_loss": -11.997868537902832, "global_step": 248732, "epoch": 1480} {"train_loss": -11.981544494628906, "global_step": 248733, "epoch": 1480} {"train_loss": -11.994943618774414, "global_step": 248734, "epoch": 1480} {"train_loss": -11.80412483215332, "global_step": 248735, "epoch": 1480} {"train_loss": -12.030985832214355, "global_step": 248736, "epoch": 1480} {"train_loss": -11.822473526000977, "global_step": 248737, "epoch": 1480} {"train_loss": -11.974720001220703, "global_step": 248738, "epoch": 1480} {"train_loss": -11.799735069274902, "global_step": 248739, "epoch": 1480} {"train_loss": -12.124637603759766, "global_step": 248740, "epoch": 1480} {"train_loss": -11.86731243133545, "global_step": 248741, "epoch": 1480} {"train_loss": -12.091590881347656, "global_step": 248742, "epoch": 1480} {"train_loss": -12.146807670593262, "global_step": 248743, "epoch": 1480} {"train_loss": -11.817082405090332, "global_step": 248744, "epoch": 1480} {"train_loss": -12.189598083496094, "global_step": 248745, "epoch": 1480} {"train_loss": -11.967570304870605, "global_step": 248746, "epoch": 1480} {"train_loss": -12.138347625732422, "global_step": 248747, "epoch": 1480} {"train_loss": -12.135655403137207, "global_step": 248748, "epoch": 1480} {"train_loss": -12.075136184692383, "global_step": 248749, "epoch": 1480} {"train_loss": -11.99053955078125, "global_step": 248750, "epoch": 1480} {"train_loss": -12.012028694152832, "global_step": 248751, "epoch": 1480} {"train_loss": -12.025413513183594, "global_step": 248752, "epoch": 1480} {"train_loss": -12.21966552734375, "global_step": 248753, "epoch": 1480} {"train_loss": -12.108299255371094, "global_step": 248754, "epoch": 1480} {"train_loss": -12.185035705566406, "global_step": 248755, "epoch": 1480} {"train_loss": -11.993122100830078, "global_step": 248756, "epoch": 1480} {"train_loss": -12.160902976989746, "global_step": 248757, "epoch": 1480} {"train_loss": -12.039079666137695, "global_step": 248758, "epoch": 1480} {"train_loss": -11.797428131103516, "global_step": 248759, "epoch": 1480} {"train_loss": -12.172916412353516, "global_step": 248760, "epoch": 1480} {"train_loss": -12.10295295715332, "global_step": 248761, "epoch": 1480} {"train_loss": -11.832069396972656, "global_step": 248762, "epoch": 1480} {"train_loss": -12.30368423461914, "global_step": 248763, "epoch": 1480} {"train_loss": -11.938812255859375, "global_step": 248764, "epoch": 1480} {"train_loss": -11.589669227600098, "global_step": 248765, "epoch": 1480} {"train_loss": -11.32292366027832, "global_step": 248766, "epoch": 1480} {"train_loss": -12.365968704223633, "global_step": 248767, "epoch": 1480} {"train_loss": -11.247672080993652, "global_step": 248768, "epoch": 1480} {"train_loss": -11.495725631713867, "global_step": 248769, "epoch": 1480} {"train_loss": -10.933582305908203, "global_step": 248770, "epoch": 1480} {"train_loss": -11.763341903686523, "global_step": 248771, "epoch": 1480} {"train_loss": -11.048543930053711, "global_step": 248772, "epoch": 1480} {"train_loss": -12.034626007080078, "global_step": 248773, "epoch": 1480} {"train_loss": -11.883852005004883, "global_step": 248774, "epoch": 1480} {"train_loss": -11.35200309753418, "global_step": 248775, "epoch": 1480} {"train_loss": -11.580907821655273, "global_step": 248776, "epoch": 1480} {"train_loss": -11.742589950561523, "global_step": 248777, "epoch": 1480} {"train_loss": -11.833181381225586, "global_step": 248778, "epoch": 1480} {"train_loss": -11.700521469116211, "global_step": 248779, "epoch": 1480} {"train_loss": -11.983436584472656, "global_step": 248780, "epoch": 1480} {"train_loss": -11.704076766967773, "global_step": 248781, "epoch": 1480} {"train_loss": -11.796953201293945, "global_step": 248782, "epoch": 1480} {"train_loss": -11.400629043579102, "global_step": 248783, "epoch": 1480} {"train_loss": -11.824094772338867, "global_step": 248784, "epoch": 1480} {"train_loss": -11.691884994506836, "global_step": 248785, "epoch": 1480} {"train_loss": -11.307212829589844, "global_step": 248786, "epoch": 1480} {"train_loss": -11.83006477355957, "global_step": 248787, "epoch": 1480} {"train_loss": -11.551246643066406, "global_step": 248788, "epoch": 1480} {"train_loss": -11.856315612792969, "global_step": 248789, "epoch": 1480} {"train_loss": -11.162211418151855, "global_step": 248790, "epoch": 1480} {"train_loss": -12.124177932739258, "global_step": 248791, "epoch": 1480} {"train_loss": -11.290129661560059, "global_step": 248792, "epoch": 1480} {"train_loss": -11.573198318481445, "global_step": 248793, "epoch": 1480} {"train_loss": -11.655098915100098, "global_step": 248794, "epoch": 1480} {"train_loss": -11.91382122039795, "global_step": 248795, "epoch": 1480} {"train_loss": -10.975987434387207, "global_step": 248796, "epoch": 1480} {"train_loss": -12.126508712768555, "global_step": 248797, "epoch": 1480} {"train_loss": -11.193315505981445, "global_step": 248798, "epoch": 1480} {"train_loss": -11.381660461425781, "global_step": 248799, "epoch": 1480} {"train_loss": -10.612371444702148, "global_step": 248800, "epoch": 1480} {"train_loss": -11.595077514648438, "global_step": 248801, "epoch": 1480} {"train_loss": -10.375422477722168, "global_step": 248802, "epoch": 1480} {"train_loss": -11.116233825683594, "global_step": 248803, "epoch": 1480} {"train_loss": -10.48679256439209, "global_step": 248804, "epoch": 1480} {"train_loss": -10.48489761352539, "global_step": 248805, "epoch": 1480} {"train_loss": -11.333829879760742, "global_step": 248806, "epoch": 1480} {"train_loss": -11.355856486729213, "global_step": 248807, "epoch": 1480, "val_loss": 265951.28125, "train_action_mse_error": 2.2883925437927246} {"train_loss": -11.042097091674805, "global_step": 248808, "epoch": 1481} {"train_loss": -10.738079071044922, "global_step": 248809, "epoch": 1481} {"train_loss": -11.435635566711426, "global_step": 248810, "epoch": 1481} {"train_loss": -10.441261291503906, "global_step": 248811, "epoch": 1481} {"train_loss": -11.70036506652832, "global_step": 248812, "epoch": 1481} {"train_loss": -10.945932388305664, "global_step": 248813, "epoch": 1481} {"train_loss": -11.286399841308594, "global_step": 248814, "epoch": 1481} {"train_loss": -10.903839111328125, "global_step": 248815, "epoch": 1481} {"train_loss": -10.616195678710938, "global_step": 248816, "epoch": 1481} {"train_loss": -11.149547576904297, "global_step": 248817, "epoch": 1481} {"train_loss": -10.931493759155273, "global_step": 248818, "epoch": 1481} {"train_loss": -11.192033767700195, "global_step": 248819, "epoch": 1481} {"train_loss": -10.301240921020508, "global_step": 248820, "epoch": 1481} {"train_loss": -10.504398345947266, "global_step": 248821, "epoch": 1481} {"train_loss": -11.147308349609375, "global_step": 248822, "epoch": 1481} {"train_loss": -11.125864028930664, "global_step": 248823, "epoch": 1481} {"train_loss": -10.455116271972656, "global_step": 248824, "epoch": 1481} {"train_loss": -11.591142654418945, "global_step": 248825, "epoch": 1481} {"train_loss": -10.989700317382812, "global_step": 248826, "epoch": 1481} {"train_loss": -10.628316879272461, "global_step": 248827, "epoch": 1481} {"train_loss": -11.283000946044922, "global_step": 248828, "epoch": 1481} {"train_loss": -10.695101737976074, "global_step": 248829, "epoch": 1481} {"train_loss": -11.273296356201172, "global_step": 248830, "epoch": 1481} {"train_loss": -10.82081127166748, "global_step": 248831, "epoch": 1481} {"train_loss": -10.996269226074219, "global_step": 248832, "epoch": 1481} {"train_loss": -10.914714813232422, "global_step": 248833, "epoch": 1481} {"train_loss": -10.820195198059082, "global_step": 248834, "epoch": 1481} {"train_loss": -10.890167236328125, "global_step": 248835, "epoch": 1481} {"train_loss": -11.606884002685547, "global_step": 248836, "epoch": 1481} {"train_loss": -10.563971519470215, "global_step": 248837, "epoch": 1481} {"train_loss": -11.443721771240234, "global_step": 248838, "epoch": 1481} {"train_loss": -10.870594024658203, "global_step": 248839, "epoch": 1481} {"train_loss": -11.626487731933594, "global_step": 248840, "epoch": 1481} {"train_loss": -11.279175758361816, "global_step": 248841, "epoch": 1481} {"train_loss": -11.423505783081055, "global_step": 248842, "epoch": 1481} {"train_loss": -11.582273483276367, "global_step": 248843, "epoch": 1481} {"train_loss": -11.46212100982666, "global_step": 248844, "epoch": 1481} {"train_loss": -11.620952606201172, "global_step": 248845, "epoch": 1481} {"train_loss": -11.811188697814941, "global_step": 248846, "epoch": 1481} {"train_loss": -11.604680061340332, "global_step": 248847, "epoch": 1481} {"train_loss": -11.680451393127441, "global_step": 248848, "epoch": 1481} {"train_loss": -11.67106819152832, "global_step": 248849, "epoch": 1481} {"train_loss": -11.847742080688477, "global_step": 248850, "epoch": 1481} {"train_loss": -11.782142639160156, "global_step": 248851, "epoch": 1481} {"train_loss": -11.866096496582031, "global_step": 248852, "epoch": 1481} {"train_loss": -11.452754974365234, "global_step": 248853, "epoch": 1481} {"train_loss": -11.937545776367188, "global_step": 248854, "epoch": 1481} {"train_loss": -11.568960189819336, "global_step": 248855, "epoch": 1481} {"train_loss": -11.797073364257812, "global_step": 248856, "epoch": 1481} {"train_loss": -11.783737182617188, "global_step": 248857, "epoch": 1481} {"train_loss": -11.979242324829102, "global_step": 248858, "epoch": 1481} {"train_loss": -11.745100021362305, "global_step": 248859, "epoch": 1481} {"train_loss": -11.915843963623047, "global_step": 248860, "epoch": 1481} {"train_loss": -11.863703727722168, "global_step": 248861, "epoch": 1481} {"train_loss": -11.993025779724121, "global_step": 248862, "epoch": 1481} {"train_loss": -11.794994354248047, "global_step": 248863, "epoch": 1481} {"train_loss": -11.7658052444458, "global_step": 248864, "epoch": 1481} {"train_loss": -11.99173641204834, "global_step": 248865, "epoch": 1481} {"train_loss": -11.976274490356445, "global_step": 248866, "epoch": 1481} {"train_loss": -12.0222749710083, "global_step": 248867, "epoch": 1481} {"train_loss": -11.89634895324707, "global_step": 248868, "epoch": 1481} {"train_loss": -11.89773941040039, "global_step": 248869, "epoch": 1481} {"train_loss": -11.71203899383545, "global_step": 248870, "epoch": 1481} {"train_loss": -11.979290962219238, "global_step": 248871, "epoch": 1481} {"train_loss": -11.939072608947754, "global_step": 248872, "epoch": 1481} {"train_loss": -11.976492881774902, "global_step": 248873, "epoch": 1481} {"train_loss": -11.894533157348633, "global_step": 248874, "epoch": 1481} {"train_loss": -12.086374282836914, "global_step": 248875, "epoch": 1481} {"train_loss": -11.753382682800293, "global_step": 248876, "epoch": 1481} {"train_loss": -11.830890655517578, "global_step": 248877, "epoch": 1481} {"train_loss": -11.914974212646484, "global_step": 248878, "epoch": 1481} {"train_loss": -11.773282051086426, "global_step": 248879, "epoch": 1481} {"train_loss": -11.900739669799805, "global_step": 248880, "epoch": 1481} {"train_loss": -11.716437339782715, "global_step": 248881, "epoch": 1481} {"train_loss": -11.547174453735352, "global_step": 248882, "epoch": 1481} {"train_loss": -12.170495986938477, "global_step": 248883, "epoch": 1481} {"train_loss": -11.971553802490234, "global_step": 248884, "epoch": 1481} {"train_loss": -12.138847351074219, "global_step": 248885, "epoch": 1481} {"train_loss": -11.963716506958008, "global_step": 248886, "epoch": 1481} {"train_loss": -12.047958374023438, "global_step": 248887, "epoch": 1481} {"train_loss": -11.826171875, "global_step": 248888, "epoch": 1481} {"train_loss": -11.943574905395508, "global_step": 248889, "epoch": 1481} {"train_loss": -12.1903657913208, "global_step": 248890, "epoch": 1481} {"train_loss": -12.119056701660156, "global_step": 248891, "epoch": 1481} {"train_loss": -11.921070098876953, "global_step": 248892, "epoch": 1481} {"train_loss": -11.972314834594727, "global_step": 248893, "epoch": 1481} {"train_loss": -11.752732276916504, "global_step": 248894, "epoch": 1481} {"train_loss": -12.33731460571289, "global_step": 248895, "epoch": 1481} {"train_loss": -12.091358184814453, "global_step": 248896, "epoch": 1481} {"train_loss": -11.991033554077148, "global_step": 248897, "epoch": 1481} {"train_loss": -12.293827056884766, "global_step": 248898, "epoch": 1481} {"train_loss": -12.065621376037598, "global_step": 248899, "epoch": 1481} {"train_loss": -11.97928524017334, "global_step": 248900, "epoch": 1481} {"train_loss": -11.556745529174805, "global_step": 248901, "epoch": 1481} {"train_loss": -12.035863876342773, "global_step": 248902, "epoch": 1481} {"train_loss": -11.874180793762207, "global_step": 248903, "epoch": 1481} {"train_loss": -12.309499740600586, "global_step": 248904, "epoch": 1481} {"train_loss": -11.647150039672852, "global_step": 248905, "epoch": 1481} {"train_loss": -12.099796295166016, "global_step": 248906, "epoch": 1481} {"train_loss": -12.109025955200195, "global_step": 248907, "epoch": 1481} {"train_loss": -12.365238189697266, "global_step": 248908, "epoch": 1481} {"train_loss": -11.854571342468262, "global_step": 248909, "epoch": 1481} {"train_loss": -11.944391250610352, "global_step": 248910, "epoch": 1481} {"train_loss": -11.958412170410156, "global_step": 248911, "epoch": 1481} {"train_loss": -12.035707473754883, "global_step": 248912, "epoch": 1481} {"train_loss": -11.887277603149414, "global_step": 248913, "epoch": 1481} {"train_loss": -12.166061401367188, "global_step": 248914, "epoch": 1481} {"train_loss": -12.137319564819336, "global_step": 248915, "epoch": 1481} {"train_loss": -12.133149147033691, "global_step": 248916, "epoch": 1481} {"train_loss": -11.811748504638672, "global_step": 248917, "epoch": 1481} {"train_loss": -12.2170991897583, "global_step": 248918, "epoch": 1481} {"train_loss": -12.136981964111328, "global_step": 248919, "epoch": 1481} {"train_loss": -11.924799919128418, "global_step": 248920, "epoch": 1481} {"train_loss": -11.630195617675781, "global_step": 248921, "epoch": 1481} {"train_loss": -11.809778213500977, "global_step": 248922, "epoch": 1481} {"train_loss": -11.91493034362793, "global_step": 248923, "epoch": 1481} {"train_loss": -11.551405906677246, "global_step": 248924, "epoch": 1481} {"train_loss": -11.691609382629395, "global_step": 248925, "epoch": 1481} {"train_loss": -11.504392623901367, "global_step": 248926, "epoch": 1481} {"train_loss": -10.431406021118164, "global_step": 248927, "epoch": 1481} {"train_loss": -10.839859008789062, "global_step": 248928, "epoch": 1481} {"train_loss": -10.681190490722656, "global_step": 248929, "epoch": 1481} {"train_loss": -9.705827713012695, "global_step": 248930, "epoch": 1481} {"train_loss": -10.323753356933594, "global_step": 248931, "epoch": 1481} {"train_loss": -8.7432861328125, "global_step": 248932, "epoch": 1481} {"train_loss": -6.493993282318115, "global_step": 248933, "epoch": 1481} {"train_loss": -6.725807189941406, "global_step": 248934, "epoch": 1481} {"train_loss": -6.973882675170898, "global_step": 248935, "epoch": 1481} {"train_loss": -6.879255294799805, "global_step": 248936, "epoch": 1481} {"train_loss": -7.5319671630859375, "global_step": 248937, "epoch": 1481} {"train_loss": -8.924211502075195, "global_step": 248938, "epoch": 1481} {"train_loss": -9.57393741607666, "global_step": 248939, "epoch": 1481} {"train_loss": -8.533027648925781, "global_step": 248940, "epoch": 1481} {"train_loss": -9.014750480651855, "global_step": 248941, "epoch": 1481} {"train_loss": -10.120214462280273, "global_step": 248942, "epoch": 1481} {"train_loss": -9.364864349365234, "global_step": 248943, "epoch": 1481} {"train_loss": -10.56512451171875, "global_step": 248944, "epoch": 1481} {"train_loss": -9.298934936523438, "global_step": 248945, "epoch": 1481} {"train_loss": -10.535438537597656, "global_step": 248946, "epoch": 1481} {"train_loss": -9.382445335388184, "global_step": 248947, "epoch": 1481} {"train_loss": -9.905510902404785, "global_step": 248948, "epoch": 1481} {"train_loss": -10.080195426940918, "global_step": 248949, "epoch": 1481} {"train_loss": -11.047183990478516, "global_step": 248950, "epoch": 1481} {"train_loss": -10.013230323791504, "global_step": 248951, "epoch": 1481} {"train_loss": -10.666873931884766, "global_step": 248952, "epoch": 1481} {"train_loss": -10.52062702178955, "global_step": 248953, "epoch": 1481} {"train_loss": -10.779497146606445, "global_step": 248954, "epoch": 1481} {"train_loss": -10.633426666259766, "global_step": 248955, "epoch": 1481} {"train_loss": -10.62048625946045, "global_step": 248956, "epoch": 1481} {"train_loss": -10.216571807861328, "global_step": 248957, "epoch": 1481} {"train_loss": -10.25229549407959, "global_step": 248958, "epoch": 1481} {"train_loss": -10.769817352294922, "global_step": 248959, "epoch": 1481} {"train_loss": -10.720772743225098, "global_step": 248960, "epoch": 1481} {"train_loss": -10.562962532043457, "global_step": 248961, "epoch": 1481} {"train_loss": -9.662625312805176, "global_step": 248962, "epoch": 1481} {"train_loss": -10.20267391204834, "global_step": 248963, "epoch": 1481} {"train_loss": -10.39105224609375, "global_step": 248964, "epoch": 1481} {"train_loss": -10.197897911071777, "global_step": 248965, "epoch": 1481} {"train_loss": -9.820901870727539, "global_step": 248966, "epoch": 1481} {"train_loss": -10.371272087097168, "global_step": 248967, "epoch": 1481} {"train_loss": -10.784157752990723, "global_step": 248968, "epoch": 1481} {"train_loss": -10.15261173248291, "global_step": 248969, "epoch": 1481} {"train_loss": -10.830873489379883, "global_step": 248970, "epoch": 1481} {"train_loss": -10.909576416015625, "global_step": 248971, "epoch": 1481} {"train_loss": -10.781494140625, "global_step": 248972, "epoch": 1481} {"train_loss": -10.682415008544922, "global_step": 248973, "epoch": 1481} {"train_loss": -10.935991287231445, "global_step": 248974, "epoch": 1481} {"train_loss": -11.127355101562681, "global_step": 248975, "epoch": 1481, "val_loss": 262124.859375} {"train_loss": -10.848504066467285, "global_step": 248976, "epoch": 1482} {"train_loss": -11.006890296936035, "global_step": 248977, "epoch": 1482} {"train_loss": -11.209484100341797, "global_step": 248978, "epoch": 1482} {"train_loss": -10.882607460021973, "global_step": 248979, "epoch": 1482} {"train_loss": -11.303794860839844, "global_step": 248980, "epoch": 1482} {"train_loss": -11.357156753540039, "global_step": 248981, "epoch": 1482} {"train_loss": -11.18309211730957, "global_step": 248982, "epoch": 1482} {"train_loss": -11.213533401489258, "global_step": 248983, "epoch": 1482} {"train_loss": -11.002254486083984, "global_step": 248984, "epoch": 1482} {"train_loss": -11.457404136657715, "global_step": 248985, "epoch": 1482} {"train_loss": -11.466508865356445, "global_step": 248986, "epoch": 1482} {"train_loss": -11.28691291809082, "global_step": 248987, "epoch": 1482} {"train_loss": -11.545190811157227, "global_step": 248988, "epoch": 1482} {"train_loss": -11.250030517578125, "global_step": 248989, "epoch": 1482} {"train_loss": -11.578624725341797, "global_step": 248990, "epoch": 1482} {"train_loss": -11.427775382995605, "global_step": 248991, "epoch": 1482} {"train_loss": -11.468840599060059, "global_step": 248992, "epoch": 1482} {"train_loss": -11.476405143737793, "global_step": 248993, "epoch": 1482} {"train_loss": -11.462014198303223, "global_step": 248994, "epoch": 1482} {"train_loss": -11.648441314697266, "global_step": 248995, "epoch": 1482} {"train_loss": -11.775199890136719, "global_step": 248996, "epoch": 1482} {"train_loss": -11.539603233337402, "global_step": 248997, "epoch": 1482} {"train_loss": -11.892667770385742, "global_step": 248998, "epoch": 1482} {"train_loss": -11.675374984741211, "global_step": 248999, "epoch": 1482} {"train_loss": -11.527251243591309, "global_step": 249000, "epoch": 1482} {"train_loss": -11.792624473571777, "global_step": 249001, "epoch": 1482} {"train_loss": -11.602519989013672, "global_step": 249002, "epoch": 1482} {"train_loss": -11.810104370117188, "global_step": 249003, "epoch": 1482} {"train_loss": -11.84760570526123, "global_step": 249004, "epoch": 1482} {"train_loss": -11.73272705078125, "global_step": 249005, "epoch": 1482} {"train_loss": -11.937553405761719, "global_step": 249006, "epoch": 1482} {"train_loss": -11.835296630859375, "global_step": 249007, "epoch": 1482} {"train_loss": -11.854316711425781, "global_step": 249008, "epoch": 1482} {"train_loss": -11.790155410766602, "global_step": 249009, "epoch": 1482} {"train_loss": -12.093156814575195, "global_step": 249010, "epoch": 1482} {"train_loss": -11.886547088623047, "global_step": 249011, "epoch": 1482} {"train_loss": -11.990827560424805, "global_step": 249012, "epoch": 1482} {"train_loss": -11.826507568359375, "global_step": 249013, "epoch": 1482} {"train_loss": -12.026154518127441, "global_step": 249014, "epoch": 1482} {"train_loss": -11.82243537902832, "global_step": 249015, "epoch": 1482} {"train_loss": -11.830971717834473, "global_step": 249016, "epoch": 1482} {"train_loss": -11.82657527923584, "global_step": 249017, "epoch": 1482} {"train_loss": -11.845136642456055, "global_step": 249018, "epoch": 1482} {"train_loss": -11.800029754638672, "global_step": 249019, "epoch": 1482} {"train_loss": -12.098380088806152, "global_step": 249020, "epoch": 1482} {"train_loss": -12.02714729309082, "global_step": 249021, "epoch": 1482} {"train_loss": -11.838072776794434, "global_step": 249022, "epoch": 1482} {"train_loss": -12.018383026123047, "global_step": 249023, "epoch": 1482} {"train_loss": -11.88404369354248, "global_step": 249024, "epoch": 1482} {"train_loss": -11.976561546325684, "global_step": 249025, "epoch": 1482} {"train_loss": -11.999528884887695, "global_step": 249026, "epoch": 1482} {"train_loss": -11.787282943725586, "global_step": 249027, "epoch": 1482} {"train_loss": -11.978599548339844, "global_step": 249028, "epoch": 1482} {"train_loss": -12.005882263183594, "global_step": 249029, "epoch": 1482} {"train_loss": -12.100223541259766, "global_step": 249030, "epoch": 1482} {"train_loss": -12.048822402954102, "global_step": 249031, "epoch": 1482} {"train_loss": -12.220663070678711, "global_step": 249032, "epoch": 1482} {"train_loss": -12.085363388061523, "global_step": 249033, "epoch": 1482} {"train_loss": -12.060707092285156, "global_step": 249034, "epoch": 1482} {"train_loss": -12.016794204711914, "global_step": 249035, "epoch": 1482} {"train_loss": -12.061014175415039, "global_step": 249036, "epoch": 1482} {"train_loss": -12.010027885437012, "global_step": 249037, "epoch": 1482} {"train_loss": -12.071313858032227, "global_step": 249038, "epoch": 1482} {"train_loss": -11.958048820495605, "global_step": 249039, "epoch": 1482} {"train_loss": -11.657381057739258, "global_step": 249040, "epoch": 1482} {"train_loss": -11.892454147338867, "global_step": 249041, "epoch": 1482} {"train_loss": -12.129171371459961, "global_step": 249042, "epoch": 1482} {"train_loss": -12.059063911437988, "global_step": 249043, "epoch": 1482} {"train_loss": -12.296869277954102, "global_step": 249044, "epoch": 1482} {"train_loss": -11.910636901855469, "global_step": 249045, "epoch": 1482} {"train_loss": -11.980449676513672, "global_step": 249046, "epoch": 1482} {"train_loss": -11.808761596679688, "global_step": 249047, "epoch": 1482} {"train_loss": -11.900663375854492, "global_step": 249048, "epoch": 1482} {"train_loss": -12.185663223266602, "global_step": 249049, "epoch": 1482} {"train_loss": -12.051334381103516, "global_step": 249050, "epoch": 1482} {"train_loss": -11.995034217834473, "global_step": 249051, "epoch": 1482} {"train_loss": -11.696234703063965, "global_step": 249052, "epoch": 1482} {"train_loss": -11.272857666015625, "global_step": 249053, "epoch": 1482} {"train_loss": -12.010969161987305, "global_step": 249054, "epoch": 1482} {"train_loss": -11.714414596557617, "global_step": 249055, "epoch": 1482} {"train_loss": -11.52271842956543, "global_step": 249056, "epoch": 1482} {"train_loss": -11.296626091003418, "global_step": 249057, "epoch": 1482} {"train_loss": -11.575355529785156, "global_step": 249058, "epoch": 1482} {"train_loss": -10.471492767333984, "global_step": 249059, "epoch": 1482} {"train_loss": -8.97262191772461, "global_step": 249060, "epoch": 1482} {"train_loss": -11.10989761352539, "global_step": 249061, "epoch": 1482} {"train_loss": -10.583003997802734, "global_step": 249062, "epoch": 1482} {"train_loss": -9.360379219055176, "global_step": 249063, "epoch": 1482} {"train_loss": -11.694794654846191, "global_step": 249064, "epoch": 1482} {"train_loss": -10.942974090576172, "global_step": 249065, "epoch": 1482} {"train_loss": -9.38932991027832, "global_step": 249066, "epoch": 1482} {"train_loss": -10.781817436218262, "global_step": 249067, "epoch": 1482} {"train_loss": -11.213273048400879, "global_step": 249068, "epoch": 1482} {"train_loss": -9.756145477294922, "global_step": 249069, "epoch": 1482} {"train_loss": -11.54372787475586, "global_step": 249070, "epoch": 1482} {"train_loss": -10.717257499694824, "global_step": 249071, "epoch": 1482} {"train_loss": -9.914817810058594, "global_step": 249072, "epoch": 1482} {"train_loss": -11.009330749511719, "global_step": 249073, "epoch": 1482} {"train_loss": -9.301623344421387, "global_step": 249074, "epoch": 1482} {"train_loss": -11.386369705200195, "global_step": 249075, "epoch": 1482} {"train_loss": -9.677619934082031, "global_step": 249076, "epoch": 1482} {"train_loss": -11.254677772521973, "global_step": 249077, "epoch": 1482} {"train_loss": -8.831396102905273, "global_step": 249078, "epoch": 1482} {"train_loss": -10.553330421447754, "global_step": 249079, "epoch": 1482} {"train_loss": -9.710199356079102, "global_step": 249080, "epoch": 1482} {"train_loss": -10.654792785644531, "global_step": 249081, "epoch": 1482} {"train_loss": -9.31390380859375, "global_step": 249082, "epoch": 1482} {"train_loss": -11.037569999694824, "global_step": 249083, "epoch": 1482} {"train_loss": -9.39997673034668, "global_step": 249084, "epoch": 1482} {"train_loss": -10.460582733154297, "global_step": 249085, "epoch": 1482} {"train_loss": -8.985565185546875, "global_step": 249086, "epoch": 1482} {"train_loss": -9.98137092590332, "global_step": 249087, "epoch": 1482} {"train_loss": -10.606868743896484, "global_step": 249088, "epoch": 1482} {"train_loss": -10.507410049438477, "global_step": 249089, "epoch": 1482} {"train_loss": -10.887317657470703, "global_step": 249090, "epoch": 1482} {"train_loss": -10.534423828125, "global_step": 249091, "epoch": 1482} {"train_loss": -11.357065200805664, "global_step": 249092, "epoch": 1482} {"train_loss": -10.547607421875, "global_step": 249093, "epoch": 1482} {"train_loss": -11.554082870483398, "global_step": 249094, "epoch": 1482} {"train_loss": -11.058683395385742, "global_step": 249095, "epoch": 1482} {"train_loss": -11.590841293334961, "global_step": 249096, "epoch": 1482} {"train_loss": -11.10861587524414, "global_step": 249097, "epoch": 1482} {"train_loss": -11.316761016845703, "global_step": 249098, "epoch": 1482} {"train_loss": -11.424399375915527, "global_step": 249099, "epoch": 1482} {"train_loss": -11.353049278259277, "global_step": 249100, "epoch": 1482} {"train_loss": -11.345568656921387, "global_step": 249101, "epoch": 1482} {"train_loss": -11.59715461730957, "global_step": 249102, "epoch": 1482} {"train_loss": -11.340982437133789, "global_step": 249103, "epoch": 1482} {"train_loss": -11.466203689575195, "global_step": 249104, "epoch": 1482} {"train_loss": -11.715660095214844, "global_step": 249105, "epoch": 1482} {"train_loss": -11.543636322021484, "global_step": 249106, "epoch": 1482} {"train_loss": -11.52452564239502, "global_step": 249107, "epoch": 1482} {"train_loss": -11.854574203491211, "global_step": 249108, "epoch": 1482} {"train_loss": -11.442808151245117, "global_step": 249109, "epoch": 1482} {"train_loss": -11.734465599060059, "global_step": 249110, "epoch": 1482} {"train_loss": -11.54751205444336, "global_step": 249111, "epoch": 1482} {"train_loss": -11.843050003051758, "global_step": 249112, "epoch": 1482} {"train_loss": -11.693693161010742, "global_step": 249113, "epoch": 1482} {"train_loss": -11.731769561767578, "global_step": 249114, "epoch": 1482} {"train_loss": -11.746040344238281, "global_step": 249115, "epoch": 1482} {"train_loss": -11.61642074584961, "global_step": 249116, "epoch": 1482} {"train_loss": -11.793233871459961, "global_step": 249117, "epoch": 1482} {"train_loss": -11.925544738769531, "global_step": 249118, "epoch": 1482} {"train_loss": -11.667893409729004, "global_step": 249119, "epoch": 1482} {"train_loss": -11.599050521850586, "global_step": 249120, "epoch": 1482} {"train_loss": -11.803110122680664, "global_step": 249121, "epoch": 1482} {"train_loss": -11.655437469482422, "global_step": 249122, "epoch": 1482} {"train_loss": -11.706541061401367, "global_step": 249123, "epoch": 1482} {"train_loss": -11.827637672424316, "global_step": 249124, "epoch": 1482} {"train_loss": -11.909341812133789, "global_step": 249125, "epoch": 1482} {"train_loss": -11.871081352233887, "global_step": 249126, "epoch": 1482} {"train_loss": -11.879865646362305, "global_step": 249127, "epoch": 1482} {"train_loss": -11.901714324951172, "global_step": 249128, "epoch": 1482} {"train_loss": -12.019933700561523, "global_step": 249129, "epoch": 1482} {"train_loss": -11.839605331420898, "global_step": 249130, "epoch": 1482} {"train_loss": -11.959205627441406, "global_step": 249131, "epoch": 1482} {"train_loss": -11.979330062866211, "global_step": 249132, "epoch": 1482} {"train_loss": -11.934647560119629, "global_step": 249133, "epoch": 1482} {"train_loss": -12.185343742370605, "global_step": 249134, "epoch": 1482} {"train_loss": -11.862435340881348, "global_step": 249135, "epoch": 1482} {"train_loss": -11.898958206176758, "global_step": 249136, "epoch": 1482} {"train_loss": -12.037498474121094, "global_step": 249137, "epoch": 1482} {"train_loss": -11.905976295471191, "global_step": 249138, "epoch": 1482} {"train_loss": -12.002084732055664, "global_step": 249139, "epoch": 1482} {"train_loss": -12.082313537597656, "global_step": 249140, "epoch": 1482} {"train_loss": -12.1225004196167, "global_step": 249141, "epoch": 1482} {"train_loss": -12.092822074890137, "global_step": 249142, "epoch": 1482} {"train_loss": -11.452985695430211, "global_step": 249143, "epoch": 1482, "val_loss": 266389.71875} {"train_loss": -12.187469482421875, "global_step": 249144, "epoch": 1483} {"train_loss": -12.009722709655762, "global_step": 249145, "epoch": 1483} {"train_loss": -12.063634872436523, "global_step": 249146, "epoch": 1483} {"train_loss": -11.965786933898926, "global_step": 249147, "epoch": 1483} {"train_loss": -11.917413711547852, "global_step": 249148, "epoch": 1483} {"train_loss": -12.064836502075195, "global_step": 249149, "epoch": 1483} {"train_loss": -11.801965713500977, "global_step": 249150, "epoch": 1483} {"train_loss": -11.778572082519531, "global_step": 249151, "epoch": 1483} {"train_loss": -11.782784461975098, "global_step": 249152, "epoch": 1483} {"train_loss": -11.514020919799805, "global_step": 249153, "epoch": 1483} {"train_loss": -11.839919090270996, "global_step": 249154, "epoch": 1483} {"train_loss": -11.92410945892334, "global_step": 249155, "epoch": 1483} {"train_loss": -11.692771911621094, "global_step": 249156, "epoch": 1483} {"train_loss": -11.942279815673828, "global_step": 249157, "epoch": 1483} {"train_loss": -12.015795707702637, "global_step": 249158, "epoch": 1483} {"train_loss": -11.848089218139648, "global_step": 249159, "epoch": 1483} {"train_loss": -11.639968872070312, "global_step": 249160, "epoch": 1483} {"train_loss": -11.628194808959961, "global_step": 249161, "epoch": 1483} {"train_loss": -12.07097053527832, "global_step": 249162, "epoch": 1483} {"train_loss": -11.482063293457031, "global_step": 249163, "epoch": 1483} {"train_loss": -12.129335403442383, "global_step": 249164, "epoch": 1483} {"train_loss": -11.797418594360352, "global_step": 249165, "epoch": 1483} {"train_loss": -11.991874694824219, "global_step": 249166, "epoch": 1483} {"train_loss": -11.900947570800781, "global_step": 249167, "epoch": 1483} {"train_loss": -11.52795696258545, "global_step": 249168, "epoch": 1483} {"train_loss": -11.648551940917969, "global_step": 249169, "epoch": 1483} {"train_loss": -11.527462005615234, "global_step": 249170, "epoch": 1483} {"train_loss": -11.736408233642578, "global_step": 249171, "epoch": 1483} {"train_loss": -12.037814140319824, "global_step": 249172, "epoch": 1483} {"train_loss": -11.999208450317383, "global_step": 249173, "epoch": 1483} {"train_loss": -11.84160041809082, "global_step": 249174, "epoch": 1483} {"train_loss": -12.22677230834961, "global_step": 249175, "epoch": 1483} {"train_loss": -11.94480037689209, "global_step": 249176, "epoch": 1483} {"train_loss": -11.730632781982422, "global_step": 249177, "epoch": 1483} {"train_loss": -11.439224243164062, "global_step": 249178, "epoch": 1483} {"train_loss": -11.275348663330078, "global_step": 249179, "epoch": 1483} {"train_loss": -11.939433097839355, "global_step": 249180, "epoch": 1483} {"train_loss": -11.730218887329102, "global_step": 249181, "epoch": 1483} {"train_loss": -10.348419189453125, "global_step": 249182, "epoch": 1483} {"train_loss": -11.57935619354248, "global_step": 249183, "epoch": 1483} {"train_loss": -11.64676570892334, "global_step": 249184, "epoch": 1483} {"train_loss": -10.443851470947266, "global_step": 249185, "epoch": 1483} {"train_loss": -9.398174285888672, "global_step": 249186, "epoch": 1483} {"train_loss": -10.230844497680664, "global_step": 249187, "epoch": 1483} {"train_loss": -7.45556640625, "global_step": 249188, "epoch": 1483} {"train_loss": -7.256208896636963, "global_step": 249189, "epoch": 1483} {"train_loss": -7.53434944152832, "global_step": 249190, "epoch": 1483} {"train_loss": -7.714019775390625, "global_step": 249191, "epoch": 1483} {"train_loss": -8.47708511352539, "global_step": 249192, "epoch": 1483} {"train_loss": -8.173809051513672, "global_step": 249193, "epoch": 1483} {"train_loss": -9.062581062316895, "global_step": 249194, "epoch": 1483} {"train_loss": -9.04823112487793, "global_step": 249195, "epoch": 1483} {"train_loss": -7.744015693664551, "global_step": 249196, "epoch": 1483} {"train_loss": -8.367729187011719, "global_step": 249197, "epoch": 1483} {"train_loss": -9.118576049804688, "global_step": 249198, "epoch": 1483} {"train_loss": -8.50510025024414, "global_step": 249199, "epoch": 1483} {"train_loss": -8.355857849121094, "global_step": 249200, "epoch": 1483} {"train_loss": -9.212434768676758, "global_step": 249201, "epoch": 1483} {"train_loss": -10.367900848388672, "global_step": 249202, "epoch": 1483} {"train_loss": -10.386301040649414, "global_step": 249203, "epoch": 1483} {"train_loss": -10.226058959960938, "global_step": 249204, "epoch": 1483} {"train_loss": -10.773004531860352, "global_step": 249205, "epoch": 1483} {"train_loss": -10.339547157287598, "global_step": 249206, "epoch": 1483} {"train_loss": -10.25285530090332, "global_step": 249207, "epoch": 1483} {"train_loss": -10.72127914428711, "global_step": 249208, "epoch": 1483} {"train_loss": -10.954572677612305, "global_step": 249209, "epoch": 1483} {"train_loss": -11.014642715454102, "global_step": 249210, "epoch": 1483} {"train_loss": -10.90214729309082, "global_step": 249211, "epoch": 1483} {"train_loss": -10.278273582458496, "global_step": 249212, "epoch": 1483} {"train_loss": -11.232529640197754, "global_step": 249213, "epoch": 1483} {"train_loss": -10.89704418182373, "global_step": 249214, "epoch": 1483} {"train_loss": -11.197305679321289, "global_step": 249215, "epoch": 1483} {"train_loss": -11.233509063720703, "global_step": 249216, "epoch": 1483} {"train_loss": -11.308895111083984, "global_step": 249217, "epoch": 1483} {"train_loss": -11.342555046081543, "global_step": 249218, "epoch": 1483} {"train_loss": -11.09838581085205, "global_step": 249219, "epoch": 1483} {"train_loss": -11.492340087890625, "global_step": 249220, "epoch": 1483} {"train_loss": -11.067024230957031, "global_step": 249221, "epoch": 1483} {"train_loss": -11.488751411437988, "global_step": 249222, "epoch": 1483} {"train_loss": -11.136180877685547, "global_step": 249223, "epoch": 1483} {"train_loss": -11.179689407348633, "global_step": 249224, "epoch": 1483} {"train_loss": -11.342434883117676, "global_step": 249225, "epoch": 1483} {"train_loss": -10.923931121826172, "global_step": 249226, "epoch": 1483} {"train_loss": -11.318960189819336, "global_step": 249227, "epoch": 1483} {"train_loss": -11.529945373535156, "global_step": 249228, "epoch": 1483} {"train_loss": -11.292387962341309, "global_step": 249229, "epoch": 1483} {"train_loss": -11.439616203308105, "global_step": 249230, "epoch": 1483} {"train_loss": -11.58962631225586, "global_step": 249231, "epoch": 1483} {"train_loss": -11.503862380981445, "global_step": 249232, "epoch": 1483} {"train_loss": -11.509347915649414, "global_step": 249233, "epoch": 1483} {"train_loss": -11.41070556640625, "global_step": 249234, "epoch": 1483} {"train_loss": -11.527206420898438, "global_step": 249235, "epoch": 1483} {"train_loss": -11.708553314208984, "global_step": 249236, "epoch": 1483} {"train_loss": -11.599090576171875, "global_step": 249237, "epoch": 1483} {"train_loss": -11.53877067565918, "global_step": 249238, "epoch": 1483} {"train_loss": -11.525779724121094, "global_step": 249239, "epoch": 1483} {"train_loss": -11.859844207763672, "global_step": 249240, "epoch": 1483} {"train_loss": -11.417905807495117, "global_step": 249241, "epoch": 1483} {"train_loss": -11.918804168701172, "global_step": 249242, "epoch": 1483} {"train_loss": -11.675812721252441, "global_step": 249243, "epoch": 1483} {"train_loss": -11.61799144744873, "global_step": 249244, "epoch": 1483} {"train_loss": -11.643365859985352, "global_step": 249245, "epoch": 1483} {"train_loss": -11.551270484924316, "global_step": 249246, "epoch": 1483} {"train_loss": -11.536674499511719, "global_step": 249247, "epoch": 1483} {"train_loss": -11.730192184448242, "global_step": 249248, "epoch": 1483} {"train_loss": -11.63732624053955, "global_step": 249249, "epoch": 1483} {"train_loss": -11.68972396850586, "global_step": 249250, "epoch": 1483} {"train_loss": -11.916942596435547, "global_step": 249251, "epoch": 1483} {"train_loss": -11.691350936889648, "global_step": 249252, "epoch": 1483} {"train_loss": -11.962091445922852, "global_step": 249253, "epoch": 1483} {"train_loss": -11.598409652709961, "global_step": 249254, "epoch": 1483} {"train_loss": -11.864629745483398, "global_step": 249255, "epoch": 1483} {"train_loss": -11.832145690917969, "global_step": 249256, "epoch": 1483} {"train_loss": -12.017642974853516, "global_step": 249257, "epoch": 1483} {"train_loss": -11.937467575073242, "global_step": 249258, "epoch": 1483} {"train_loss": -12.06551456451416, "global_step": 249259, "epoch": 1483} {"train_loss": -11.922811508178711, "global_step": 249260, "epoch": 1483} {"train_loss": -11.822059631347656, "global_step": 249261, "epoch": 1483} {"train_loss": -11.719635963439941, "global_step": 249262, "epoch": 1483} {"train_loss": -12.05509090423584, "global_step": 249263, "epoch": 1483} {"train_loss": -11.899991035461426, "global_step": 249264, "epoch": 1483} {"train_loss": -12.129616737365723, "global_step": 249265, "epoch": 1483} {"train_loss": -12.018155097961426, "global_step": 249266, "epoch": 1483} {"train_loss": -11.942774772644043, "global_step": 249267, "epoch": 1483} {"train_loss": -12.00267219543457, "global_step": 249268, "epoch": 1483} {"train_loss": -11.913777351379395, "global_step": 249269, "epoch": 1483} {"train_loss": -12.035259246826172, "global_step": 249270, "epoch": 1483} {"train_loss": -12.156612396240234, "global_step": 249271, "epoch": 1483} {"train_loss": -11.95412826538086, "global_step": 249272, "epoch": 1483} {"train_loss": -11.953666687011719, "global_step": 249273, "epoch": 1483} {"train_loss": -12.126080513000488, "global_step": 249274, "epoch": 1483} {"train_loss": -11.822793006896973, "global_step": 249275, "epoch": 1483} {"train_loss": -12.08273696899414, "global_step": 249276, "epoch": 1483} {"train_loss": -11.814970016479492, "global_step": 249277, "epoch": 1483} {"train_loss": -11.7573881149292, "global_step": 249278, "epoch": 1483} {"train_loss": -12.163156509399414, "global_step": 249279, "epoch": 1483} {"train_loss": -12.0797119140625, "global_step": 249280, "epoch": 1483} {"train_loss": -12.072711944580078, "global_step": 249281, "epoch": 1483} {"train_loss": -12.044960021972656, "global_step": 249282, "epoch": 1483} {"train_loss": -12.067869186401367, "global_step": 249283, "epoch": 1483} {"train_loss": -12.131795883178711, "global_step": 249284, "epoch": 1483} {"train_loss": -11.97606086730957, "global_step": 249285, "epoch": 1483} {"train_loss": -11.842018127441406, "global_step": 249286, "epoch": 1483} {"train_loss": -12.123086929321289, "global_step": 249287, "epoch": 1483} {"train_loss": -12.232597351074219, "global_step": 249288, "epoch": 1483} {"train_loss": -12.229517936706543, "global_step": 249289, "epoch": 1483} {"train_loss": -12.059877395629883, "global_step": 249290, "epoch": 1483} {"train_loss": -12.237869262695312, "global_step": 249291, "epoch": 1483} {"train_loss": -11.957497596740723, "global_step": 249292, "epoch": 1483} {"train_loss": -11.463190078735352, "global_step": 249293, "epoch": 1483} {"train_loss": -12.308670997619629, "global_step": 249294, "epoch": 1483} {"train_loss": -11.993541717529297, "global_step": 249295, "epoch": 1483} {"train_loss": -11.645515441894531, "global_step": 249296, "epoch": 1483} {"train_loss": -11.77621841430664, "global_step": 249297, "epoch": 1483} {"train_loss": -12.141999244689941, "global_step": 249298, "epoch": 1483} {"train_loss": -11.865009307861328, "global_step": 249299, "epoch": 1483} {"train_loss": -11.329517364501953, "global_step": 249300, "epoch": 1483} {"train_loss": -10.866368293762207, "global_step": 249301, "epoch": 1483} {"train_loss": -11.56640625, "global_step": 249302, "epoch": 1483} {"train_loss": -11.17901611328125, "global_step": 249303, "epoch": 1483} {"train_loss": -11.989534378051758, "global_step": 249304, "epoch": 1483} {"train_loss": -11.06314468383789, "global_step": 249305, "epoch": 1483} {"train_loss": -11.601178169250488, "global_step": 249306, "epoch": 1483} {"train_loss": -11.384212493896484, "global_step": 249307, "epoch": 1483} {"train_loss": -12.043558120727539, "global_step": 249308, "epoch": 1483} {"train_loss": -10.813192367553711, "global_step": 249309, "epoch": 1483} {"train_loss": -12.115400314331055, "global_step": 249310, "epoch": 1483} {"train_loss": -11.333241527988797, "global_step": 249311, "epoch": 1483, "val_loss": 264879.625} {"train_loss": -11.592825889587402, "global_step": 249312, "epoch": 1484} {"train_loss": -11.365011215209961, "global_step": 249313, "epoch": 1484} {"train_loss": -11.616357803344727, "global_step": 249314, "epoch": 1484} {"train_loss": -11.338394165039062, "global_step": 249315, "epoch": 1484} {"train_loss": -11.641329765319824, "global_step": 249316, "epoch": 1484} {"train_loss": -11.701425552368164, "global_step": 249317, "epoch": 1484} {"train_loss": -11.701010704040527, "global_step": 249318, "epoch": 1484} {"train_loss": -11.554154396057129, "global_step": 249319, "epoch": 1484} {"train_loss": -11.434433937072754, "global_step": 249320, "epoch": 1484} {"train_loss": -11.440475463867188, "global_step": 249321, "epoch": 1484} {"train_loss": -11.538719177246094, "global_step": 249322, "epoch": 1484} {"train_loss": -10.373981475830078, "global_step": 249323, "epoch": 1484} {"train_loss": -10.722681999206543, "global_step": 249324, "epoch": 1484} {"train_loss": -8.869038581848145, "global_step": 249325, "epoch": 1484} {"train_loss": -9.849737167358398, "global_step": 249326, "epoch": 1484} {"train_loss": -10.078705787658691, "global_step": 249327, "epoch": 1484} {"train_loss": -9.461133003234863, "global_step": 249328, "epoch": 1484} {"train_loss": -9.316401481628418, "global_step": 249329, "epoch": 1484} {"train_loss": -9.2720947265625, "global_step": 249330, "epoch": 1484} {"train_loss": -10.798507690429688, "global_step": 249331, "epoch": 1484} {"train_loss": -8.819891929626465, "global_step": 249332, "epoch": 1484} {"train_loss": -9.231579780578613, "global_step": 249333, "epoch": 1484} {"train_loss": -9.225664138793945, "global_step": 249334, "epoch": 1484} {"train_loss": -9.883237838745117, "global_step": 249335, "epoch": 1484} {"train_loss": -10.876663208007812, "global_step": 249336, "epoch": 1484} {"train_loss": -10.723871231079102, "global_step": 249337, "epoch": 1484} {"train_loss": -11.167594909667969, "global_step": 249338, "epoch": 1484} {"train_loss": -10.643239974975586, "global_step": 249339, "epoch": 1484} {"train_loss": -10.224239349365234, "global_step": 249340, "epoch": 1484} {"train_loss": -11.089723587036133, "global_step": 249341, "epoch": 1484} {"train_loss": -9.962444305419922, "global_step": 249342, "epoch": 1484} {"train_loss": -10.89797306060791, "global_step": 249343, "epoch": 1484} {"train_loss": -11.27061939239502, "global_step": 249344, "epoch": 1484} {"train_loss": -10.336400985717773, "global_step": 249345, "epoch": 1484} {"train_loss": -11.53981876373291, "global_step": 249346, "epoch": 1484} {"train_loss": -10.851072311401367, "global_step": 249347, "epoch": 1484} {"train_loss": -11.021774291992188, "global_step": 249348, "epoch": 1484} {"train_loss": -11.405412673950195, "global_step": 249349, "epoch": 1484} {"train_loss": -10.923083305358887, "global_step": 249350, "epoch": 1484} {"train_loss": -10.888980865478516, "global_step": 249351, "epoch": 1484} {"train_loss": -11.494643211364746, "global_step": 249352, "epoch": 1484} {"train_loss": -10.948455810546875, "global_step": 249353, "epoch": 1484} {"train_loss": -11.673571586608887, "global_step": 249354, "epoch": 1484} {"train_loss": -11.263955116271973, "global_step": 249355, "epoch": 1484} {"train_loss": -11.340230941772461, "global_step": 249356, "epoch": 1484} {"train_loss": -11.619979858398438, "global_step": 249357, "epoch": 1484} {"train_loss": -11.510244369506836, "global_step": 249358, "epoch": 1484} {"train_loss": -11.407865524291992, "global_step": 249359, "epoch": 1484} {"train_loss": -11.47861385345459, "global_step": 249360, "epoch": 1484} {"train_loss": -11.767556190490723, "global_step": 249361, "epoch": 1484} {"train_loss": -11.409573554992676, "global_step": 249362, "epoch": 1484} {"train_loss": -11.884393692016602, "global_step": 249363, "epoch": 1484} {"train_loss": -11.369729995727539, "global_step": 249364, "epoch": 1484} {"train_loss": -11.646331787109375, "global_step": 249365, "epoch": 1484} {"train_loss": -11.87462043762207, "global_step": 249366, "epoch": 1484} {"train_loss": -11.507230758666992, "global_step": 249367, "epoch": 1484} {"train_loss": -11.705829620361328, "global_step": 249368, "epoch": 1484} {"train_loss": -11.849894523620605, "global_step": 249369, "epoch": 1484} {"train_loss": -11.736640930175781, "global_step": 249370, "epoch": 1484} {"train_loss": -11.681221008300781, "global_step": 249371, "epoch": 1484} {"train_loss": -11.66286849975586, "global_step": 249372, "epoch": 1484} {"train_loss": -11.665596008300781, "global_step": 249373, "epoch": 1484} {"train_loss": -11.931028366088867, "global_step": 249374, "epoch": 1484} {"train_loss": -11.603626251220703, "global_step": 249375, "epoch": 1484} {"train_loss": -11.91356086730957, "global_step": 249376, "epoch": 1484} {"train_loss": -11.168148040771484, "global_step": 249377, "epoch": 1484} {"train_loss": -11.827863693237305, "global_step": 249378, "epoch": 1484} {"train_loss": -11.844346046447754, "global_step": 249379, "epoch": 1484} {"train_loss": -11.639569282531738, "global_step": 249380, "epoch": 1484} {"train_loss": -11.800802230834961, "global_step": 249381, "epoch": 1484} {"train_loss": -11.797761917114258, "global_step": 249382, "epoch": 1484} {"train_loss": -11.728915214538574, "global_step": 249383, "epoch": 1484} {"train_loss": -12.041332244873047, "global_step": 249384, "epoch": 1484} {"train_loss": -11.571544647216797, "global_step": 249385, "epoch": 1484} {"train_loss": -11.82679271697998, "global_step": 249386, "epoch": 1484} {"train_loss": -11.952999114990234, "global_step": 249387, "epoch": 1484} {"train_loss": -11.671281814575195, "global_step": 249388, "epoch": 1484} {"train_loss": -11.965629577636719, "global_step": 249389, "epoch": 1484} {"train_loss": -11.747355461120605, "global_step": 249390, "epoch": 1484} {"train_loss": -11.828619956970215, "global_step": 249391, "epoch": 1484} {"train_loss": -11.829669952392578, "global_step": 249392, "epoch": 1484} {"train_loss": -11.802995681762695, "global_step": 249393, "epoch": 1484} {"train_loss": -12.032693862915039, "global_step": 249394, "epoch": 1484} {"train_loss": -11.692435264587402, "global_step": 249395, "epoch": 1484} {"train_loss": -11.797733306884766, "global_step": 249396, "epoch": 1484} {"train_loss": -12.033385276794434, "global_step": 249397, "epoch": 1484} {"train_loss": -11.85798454284668, "global_step": 249398, "epoch": 1484} {"train_loss": -12.049233436584473, "global_step": 249399, "epoch": 1484} {"train_loss": -11.743949890136719, "global_step": 249400, "epoch": 1484} {"train_loss": -11.79150390625, "global_step": 249401, "epoch": 1484} {"train_loss": -12.097273826599121, "global_step": 249402, "epoch": 1484} {"train_loss": -11.972880363464355, "global_step": 249403, "epoch": 1484} {"train_loss": -11.888740539550781, "global_step": 249404, "epoch": 1484} {"train_loss": -12.051803588867188, "global_step": 249405, "epoch": 1484} {"train_loss": -11.890586853027344, "global_step": 249406, "epoch": 1484} {"train_loss": -11.848662376403809, "global_step": 249407, "epoch": 1484} {"train_loss": -11.643795013427734, "global_step": 249408, "epoch": 1484} {"train_loss": -12.08049488067627, "global_step": 249409, "epoch": 1484} {"train_loss": -11.114517211914062, "global_step": 249410, "epoch": 1484} {"train_loss": -11.309465408325195, "global_step": 249411, "epoch": 1484} {"train_loss": -11.370772361755371, "global_step": 249412, "epoch": 1484} {"train_loss": -11.705184936523438, "global_step": 249413, "epoch": 1484} {"train_loss": -11.239431381225586, "global_step": 249414, "epoch": 1484} {"train_loss": -11.269654273986816, "global_step": 249415, "epoch": 1484} {"train_loss": -11.966760635375977, "global_step": 249416, "epoch": 1484} {"train_loss": -11.423603057861328, "global_step": 249417, "epoch": 1484} {"train_loss": -11.808694839477539, "global_step": 249418, "epoch": 1484} {"train_loss": -11.676117897033691, "global_step": 249419, "epoch": 1484} {"train_loss": -11.154565811157227, "global_step": 249420, "epoch": 1484} {"train_loss": -11.71353816986084, "global_step": 249421, "epoch": 1484} {"train_loss": -10.663297653198242, "global_step": 249422, "epoch": 1484} {"train_loss": -11.721034049987793, "global_step": 249423, "epoch": 1484} {"train_loss": -11.000631332397461, "global_step": 249424, "epoch": 1484} {"train_loss": -11.957462310791016, "global_step": 249425, "epoch": 1484} {"train_loss": -11.80203914642334, "global_step": 249426, "epoch": 1484} {"train_loss": -11.92015552520752, "global_step": 249427, "epoch": 1484} {"train_loss": -12.164440155029297, "global_step": 249428, "epoch": 1484} {"train_loss": -11.788450241088867, "global_step": 249429, "epoch": 1484} {"train_loss": -12.020374298095703, "global_step": 249430, "epoch": 1484} {"train_loss": -11.872764587402344, "global_step": 249431, "epoch": 1484} {"train_loss": -11.55984115600586, "global_step": 249432, "epoch": 1484} {"train_loss": -11.965433120727539, "global_step": 249433, "epoch": 1484} {"train_loss": -11.322805404663086, "global_step": 249434, "epoch": 1484} {"train_loss": -11.984150886535645, "global_step": 249435, "epoch": 1484} {"train_loss": -11.38357162475586, "global_step": 249436, "epoch": 1484} {"train_loss": -11.806549072265625, "global_step": 249437, "epoch": 1484} {"train_loss": -11.542051315307617, "global_step": 249438, "epoch": 1484} {"train_loss": -11.127384185791016, "global_step": 249439, "epoch": 1484} {"train_loss": -11.581249237060547, "global_step": 249440, "epoch": 1484} {"train_loss": -11.459348678588867, "global_step": 249441, "epoch": 1484} {"train_loss": -11.379277229309082, "global_step": 249442, "epoch": 1484} {"train_loss": -10.851940155029297, "global_step": 249443, "epoch": 1484} {"train_loss": -11.810254096984863, "global_step": 249444, "epoch": 1484} {"train_loss": -11.369248390197754, "global_step": 249445, "epoch": 1484} {"train_loss": -11.99854564666748, "global_step": 249446, "epoch": 1484} {"train_loss": -11.712696075439453, "global_step": 249447, "epoch": 1484} {"train_loss": -11.545820236206055, "global_step": 249448, "epoch": 1484} {"train_loss": -11.623610496520996, "global_step": 249449, "epoch": 1484} {"train_loss": -11.507627487182617, "global_step": 249450, "epoch": 1484} {"train_loss": -11.82149600982666, "global_step": 249451, "epoch": 1484} {"train_loss": -11.369892120361328, "global_step": 249452, "epoch": 1484} {"train_loss": -11.370617866516113, "global_step": 249453, "epoch": 1484} {"train_loss": -11.512957572937012, "global_step": 249454, "epoch": 1484} {"train_loss": -10.316091537475586, "global_step": 249455, "epoch": 1484} {"train_loss": -11.35783863067627, "global_step": 249456, "epoch": 1484} {"train_loss": -9.898152351379395, "global_step": 249457, "epoch": 1484} {"train_loss": -10.263389587402344, "global_step": 249458, "epoch": 1484} {"train_loss": -10.795845031738281, "global_step": 249459, "epoch": 1484} {"train_loss": -10.347023010253906, "global_step": 249460, "epoch": 1484} {"train_loss": -10.624900817871094, "global_step": 249461, "epoch": 1484} {"train_loss": -11.130834579467773, "global_step": 249462, "epoch": 1484} {"train_loss": -9.01991081237793, "global_step": 249463, "epoch": 1484} {"train_loss": -9.154413223266602, "global_step": 249464, "epoch": 1484} {"train_loss": -9.887561798095703, "global_step": 249465, "epoch": 1484} {"train_loss": -10.80242919921875, "global_step": 249466, "epoch": 1484} {"train_loss": -8.649398803710938, "global_step": 249467, "epoch": 1484} {"train_loss": -10.777904510498047, "global_step": 249468, "epoch": 1484} {"train_loss": -9.488658905029297, "global_step": 249469, "epoch": 1484} {"train_loss": -10.10740852355957, "global_step": 249470, "epoch": 1484} {"train_loss": -9.458362579345703, "global_step": 249471, "epoch": 1484} {"train_loss": -9.54435920715332, "global_step": 249472, "epoch": 1484} {"train_loss": -10.107074737548828, "global_step": 249473, "epoch": 1484} {"train_loss": -9.515813827514648, "global_step": 249474, "epoch": 1484} {"train_loss": -10.425114631652832, "global_step": 249475, "epoch": 1484} {"train_loss": -9.59337329864502, "global_step": 249476, "epoch": 1484} {"train_loss": -10.037873268127441, "global_step": 249477, "epoch": 1484} {"train_loss": -10.166006088256836, "global_step": 249478, "epoch": 1484} {"train_loss": -11.181613081977481, "global_step": 249479, "epoch": 1484, "val_loss": 268217.46875} {"train_loss": -10.333263397216797, "global_step": 249480, "epoch": 1485} {"train_loss": -8.891241073608398, "global_step": 249481, "epoch": 1485} {"train_loss": -9.9660005569458, "global_step": 249482, "epoch": 1485} {"train_loss": -10.264995574951172, "global_step": 249483, "epoch": 1485} {"train_loss": -8.993289947509766, "global_step": 249484, "epoch": 1485} {"train_loss": -10.479070663452148, "global_step": 249485, "epoch": 1485} {"train_loss": -10.28890609741211, "global_step": 249486, "epoch": 1485} {"train_loss": -9.781692504882812, "global_step": 249487, "epoch": 1485} {"train_loss": -10.901168823242188, "global_step": 249488, "epoch": 1485} {"train_loss": -10.371404647827148, "global_step": 249489, "epoch": 1485} {"train_loss": -10.434503555297852, "global_step": 249490, "epoch": 1485} {"train_loss": -11.02529239654541, "global_step": 249491, "epoch": 1485} {"train_loss": -10.307259559631348, "global_step": 249492, "epoch": 1485} {"train_loss": -10.977904319763184, "global_step": 249493, "epoch": 1485} {"train_loss": -11.209085464477539, "global_step": 249494, "epoch": 1485} {"train_loss": -10.271156311035156, "global_step": 249495, "epoch": 1485} {"train_loss": -11.24824047088623, "global_step": 249496, "epoch": 1485} {"train_loss": -11.076186180114746, "global_step": 249497, "epoch": 1485} {"train_loss": -10.995782852172852, "global_step": 249498, "epoch": 1485} {"train_loss": -11.468971252441406, "global_step": 249499, "epoch": 1485} {"train_loss": -11.211004257202148, "global_step": 249500, "epoch": 1485} {"train_loss": -11.137887954711914, "global_step": 249501, "epoch": 1485} {"train_loss": -11.101346969604492, "global_step": 249502, "epoch": 1485} {"train_loss": -11.142936706542969, "global_step": 249503, "epoch": 1485} {"train_loss": -11.462333679199219, "global_step": 249504, "epoch": 1485} {"train_loss": -11.296682357788086, "global_step": 249505, "epoch": 1485} {"train_loss": -11.18628215789795, "global_step": 249506, "epoch": 1485} {"train_loss": -11.248260498046875, "global_step": 249507, "epoch": 1485} {"train_loss": -11.287620544433594, "global_step": 249508, "epoch": 1485} {"train_loss": -11.504823684692383, "global_step": 249509, "epoch": 1485} {"train_loss": -11.41026782989502, "global_step": 249510, "epoch": 1485} {"train_loss": -11.502188682556152, "global_step": 249511, "epoch": 1485} {"train_loss": -11.228952407836914, "global_step": 249512, "epoch": 1485} {"train_loss": -11.559371948242188, "global_step": 249513, "epoch": 1485} {"train_loss": -11.398015022277832, "global_step": 249514, "epoch": 1485} {"train_loss": -11.439939498901367, "global_step": 249515, "epoch": 1485} {"train_loss": -11.652109146118164, "global_step": 249516, "epoch": 1485} {"train_loss": -11.40177059173584, "global_step": 249517, "epoch": 1485} {"train_loss": -11.56707763671875, "global_step": 249518, "epoch": 1485} {"train_loss": -11.324987411499023, "global_step": 249519, "epoch": 1485} {"train_loss": -11.615483283996582, "global_step": 249520, "epoch": 1485} {"train_loss": -11.574953079223633, "global_step": 249521, "epoch": 1485} {"train_loss": -11.537643432617188, "global_step": 249522, "epoch": 1485} {"train_loss": -11.561563491821289, "global_step": 249523, "epoch": 1485} {"train_loss": -11.399303436279297, "global_step": 249524, "epoch": 1485} {"train_loss": -11.64128303527832, "global_step": 249525, "epoch": 1485} {"train_loss": -11.521047592163086, "global_step": 249526, "epoch": 1485} {"train_loss": -11.543481826782227, "global_step": 249527, "epoch": 1485} {"train_loss": -11.649185180664062, "global_step": 249528, "epoch": 1485} {"train_loss": -11.663187026977539, "global_step": 249529, "epoch": 1485} {"train_loss": -11.723830223083496, "global_step": 249530, "epoch": 1485} {"train_loss": -11.45644760131836, "global_step": 249531, "epoch": 1485} {"train_loss": -11.625731468200684, "global_step": 249532, "epoch": 1485} {"train_loss": -11.811559677124023, "global_step": 249533, "epoch": 1485} {"train_loss": -11.739839553833008, "global_step": 249534, "epoch": 1485} {"train_loss": -11.788536071777344, "global_step": 249535, "epoch": 1485} {"train_loss": -11.850235939025879, "global_step": 249536, "epoch": 1485} {"train_loss": -11.640016555786133, "global_step": 249537, "epoch": 1485} {"train_loss": -11.784553527832031, "global_step": 249538, "epoch": 1485} {"train_loss": -11.68215274810791, "global_step": 249539, "epoch": 1485} {"train_loss": -11.826011657714844, "global_step": 249540, "epoch": 1485} {"train_loss": -11.722700119018555, "global_step": 249541, "epoch": 1485} {"train_loss": -11.799070358276367, "global_step": 249542, "epoch": 1485} {"train_loss": -11.7732515335083, "global_step": 249543, "epoch": 1485} {"train_loss": -11.815516471862793, "global_step": 249544, "epoch": 1485} {"train_loss": -11.676506996154785, "global_step": 249545, "epoch": 1485} {"train_loss": -11.990934371948242, "global_step": 249546, "epoch": 1485} {"train_loss": -11.697000503540039, "global_step": 249547, "epoch": 1485} {"train_loss": -11.872126579284668, "global_step": 249548, "epoch": 1485} {"train_loss": -11.683643341064453, "global_step": 249549, "epoch": 1485} {"train_loss": -11.930607795715332, "global_step": 249550, "epoch": 1485} {"train_loss": -11.599125862121582, "global_step": 249551, "epoch": 1485} {"train_loss": -11.791621208190918, "global_step": 249552, "epoch": 1485} {"train_loss": -11.827794075012207, "global_step": 249553, "epoch": 1485} {"train_loss": -11.790725708007812, "global_step": 249554, "epoch": 1485} {"train_loss": -11.75830078125, "global_step": 249555, "epoch": 1485} {"train_loss": -11.878721237182617, "global_step": 249556, "epoch": 1485} {"train_loss": -11.851215362548828, "global_step": 249557, "epoch": 1485} {"train_loss": -11.997313499450684, "global_step": 249558, "epoch": 1485} {"train_loss": -11.904474258422852, "global_step": 249559, "epoch": 1485} {"train_loss": -11.997303009033203, "global_step": 249560, "epoch": 1485} {"train_loss": -11.866455078125, "global_step": 249561, "epoch": 1485} {"train_loss": -11.947473526000977, "global_step": 249562, "epoch": 1485} {"train_loss": -12.161572456359863, "global_step": 249563, "epoch": 1485} {"train_loss": -11.975994110107422, "global_step": 249564, "epoch": 1485} {"train_loss": -11.98149299621582, "global_step": 249565, "epoch": 1485} {"train_loss": -11.943246841430664, "global_step": 249566, "epoch": 1485} {"train_loss": -11.805591583251953, "global_step": 249567, "epoch": 1485} {"train_loss": -11.860823631286621, "global_step": 249568, "epoch": 1485} {"train_loss": -11.713052749633789, "global_step": 249569, "epoch": 1485} {"train_loss": -11.899162292480469, "global_step": 249570, "epoch": 1485} {"train_loss": -12.073352813720703, "global_step": 249571, "epoch": 1485} {"train_loss": -12.046966552734375, "global_step": 249572, "epoch": 1485} {"train_loss": -12.079655647277832, "global_step": 249573, "epoch": 1485} {"train_loss": -12.02320671081543, "global_step": 249574, "epoch": 1485} {"train_loss": -12.163848876953125, "global_step": 249575, "epoch": 1485} {"train_loss": -12.18817138671875, "global_step": 249576, "epoch": 1485} {"train_loss": -11.919178009033203, "global_step": 249577, "epoch": 1485} {"train_loss": -12.097452163696289, "global_step": 249578, "epoch": 1485} {"train_loss": -11.922599792480469, "global_step": 249579, "epoch": 1485} {"train_loss": -12.04319953918457, "global_step": 249580, "epoch": 1485} {"train_loss": -12.081966400146484, "global_step": 249581, "epoch": 1485} {"train_loss": -11.919488906860352, "global_step": 249582, "epoch": 1485} {"train_loss": -12.224472045898438, "global_step": 249583, "epoch": 1485} {"train_loss": -11.984033584594727, "global_step": 249584, "epoch": 1485} {"train_loss": -12.196649551391602, "global_step": 249585, "epoch": 1485} {"train_loss": -12.215673446655273, "global_step": 249586, "epoch": 1485} {"train_loss": -12.189996719360352, "global_step": 249587, "epoch": 1485} {"train_loss": -12.300382614135742, "global_step": 249588, "epoch": 1485} {"train_loss": -12.318069458007812, "global_step": 249589, "epoch": 1485} {"train_loss": -12.035955429077148, "global_step": 249590, "epoch": 1485} {"train_loss": -12.14046573638916, "global_step": 249591, "epoch": 1485} {"train_loss": -12.001375198364258, "global_step": 249592, "epoch": 1485} {"train_loss": -12.386500358581543, "global_step": 249593, "epoch": 1485} {"train_loss": -11.952653884887695, "global_step": 249594, "epoch": 1485} {"train_loss": -11.646484375, "global_step": 249595, "epoch": 1485} {"train_loss": -12.184009552001953, "global_step": 249596, "epoch": 1485} {"train_loss": -11.965948104858398, "global_step": 249597, "epoch": 1485} {"train_loss": -11.826273918151855, "global_step": 249598, "epoch": 1485} {"train_loss": -11.466663360595703, "global_step": 249599, "epoch": 1485} {"train_loss": -11.755874633789062, "global_step": 249600, "epoch": 1485} {"train_loss": -12.193279266357422, "global_step": 249601, "epoch": 1485} {"train_loss": -12.103876113891602, "global_step": 249602, "epoch": 1485} {"train_loss": -11.736501693725586, "global_step": 249603, "epoch": 1485} {"train_loss": -12.2430419921875, "global_step": 249604, "epoch": 1485} {"train_loss": -11.98392105102539, "global_step": 249605, "epoch": 1485} {"train_loss": -11.33742904663086, "global_step": 249606, "epoch": 1485} {"train_loss": -12.062921524047852, "global_step": 249607, "epoch": 1485} {"train_loss": -11.473236083984375, "global_step": 249608, "epoch": 1485} {"train_loss": -10.464004516601562, "global_step": 249609, "epoch": 1485} {"train_loss": -10.030916213989258, "global_step": 249610, "epoch": 1485} {"train_loss": -11.61158275604248, "global_step": 249611, "epoch": 1485} {"train_loss": -10.732128143310547, "global_step": 249612, "epoch": 1485} {"train_loss": -9.750410079956055, "global_step": 249613, "epoch": 1485} {"train_loss": -11.934222221374512, "global_step": 249614, "epoch": 1485} {"train_loss": -10.129125595092773, "global_step": 249615, "epoch": 1485} {"train_loss": -10.145349502563477, "global_step": 249616, "epoch": 1485} {"train_loss": -11.237127304077148, "global_step": 249617, "epoch": 1485} {"train_loss": -9.93503475189209, "global_step": 249618, "epoch": 1485} {"train_loss": -10.755009651184082, "global_step": 249619, "epoch": 1485} {"train_loss": -10.531231880187988, "global_step": 249620, "epoch": 1485} {"train_loss": -11.231195449829102, "global_step": 249621, "epoch": 1485} {"train_loss": -11.17793083190918, "global_step": 249622, "epoch": 1485} {"train_loss": -10.535552978515625, "global_step": 249623, "epoch": 1485} {"train_loss": -11.894859313964844, "global_step": 249624, "epoch": 1485} {"train_loss": -10.960758209228516, "global_step": 249625, "epoch": 1485} {"train_loss": -11.416900634765625, "global_step": 249626, "epoch": 1485} {"train_loss": -11.316219329833984, "global_step": 249627, "epoch": 1485} {"train_loss": -11.48989486694336, "global_step": 249628, "epoch": 1485} {"train_loss": -10.652362823486328, "global_step": 249629, "epoch": 1485} {"train_loss": -11.567794799804688, "global_step": 249630, "epoch": 1485} {"train_loss": -11.26409912109375, "global_step": 249631, "epoch": 1485} {"train_loss": -11.069230079650879, "global_step": 249632, "epoch": 1485} {"train_loss": -11.383354187011719, "global_step": 249633, "epoch": 1485} {"train_loss": -10.794946670532227, "global_step": 249634, "epoch": 1485} {"train_loss": -10.874948501586914, "global_step": 249635, "epoch": 1485} {"train_loss": -10.940971374511719, "global_step": 249636, "epoch": 1485} {"train_loss": -10.93165397644043, "global_step": 249637, "epoch": 1485} {"train_loss": -10.95931625366211, "global_step": 249638, "epoch": 1485} {"train_loss": -11.108777046203613, "global_step": 249639, "epoch": 1485} {"train_loss": -11.080513000488281, "global_step": 249640, "epoch": 1485} {"train_loss": -11.100717544555664, "global_step": 249641, "epoch": 1485} {"train_loss": -10.6875581741333, "global_step": 249642, "epoch": 1485} {"train_loss": -10.875768661499023, "global_step": 249643, "epoch": 1485} {"train_loss": -11.190646171569824, "global_step": 249644, "epoch": 1485} {"train_loss": -10.04419231414795, "global_step": 249645, "epoch": 1485} {"train_loss": -10.700642585754395, "global_step": 249646, "epoch": 1485} {"train_loss": -11.417420767602467, "global_step": 249647, "epoch": 1485, "val_loss": 271201.625, "train_action_mse_error": 2.7418062686920166} {"train_loss": -9.653331756591797, "global_step": 249648, "epoch": 1486} {"train_loss": -11.069293975830078, "global_step": 249649, "epoch": 1486} {"train_loss": -9.93100357055664, "global_step": 249650, "epoch": 1486} {"train_loss": -10.673284530639648, "global_step": 249651, "epoch": 1486} {"train_loss": -10.379968643188477, "global_step": 249652, "epoch": 1486} {"train_loss": -11.426998138427734, "global_step": 249653, "epoch": 1486} {"train_loss": -10.011359214782715, "global_step": 249654, "epoch": 1486} {"train_loss": -11.642699241638184, "global_step": 249655, "epoch": 1486} {"train_loss": -10.630819320678711, "global_step": 249656, "epoch": 1486} {"train_loss": -11.446873664855957, "global_step": 249657, "epoch": 1486} {"train_loss": -11.026626586914062, "global_step": 249658, "epoch": 1486} {"train_loss": -11.409828186035156, "global_step": 249659, "epoch": 1486} {"train_loss": -11.032068252563477, "global_step": 249660, "epoch": 1486} {"train_loss": -11.172895431518555, "global_step": 249661, "epoch": 1486} {"train_loss": -10.880266189575195, "global_step": 249662, "epoch": 1486} {"train_loss": -11.368127822875977, "global_step": 249663, "epoch": 1486} {"train_loss": -10.816234588623047, "global_step": 249664, "epoch": 1486} {"train_loss": -11.081838607788086, "global_step": 249665, "epoch": 1486} {"train_loss": -11.283132553100586, "global_step": 249666, "epoch": 1486} {"train_loss": -10.96562671661377, "global_step": 249667, "epoch": 1486} {"train_loss": -11.362958908081055, "global_step": 249668, "epoch": 1486} {"train_loss": -10.993122100830078, "global_step": 249669, "epoch": 1486} {"train_loss": -11.246277809143066, "global_step": 249670, "epoch": 1486} {"train_loss": -10.89091682434082, "global_step": 249671, "epoch": 1486} {"train_loss": -11.087823867797852, "global_step": 249672, "epoch": 1486} {"train_loss": -10.984607696533203, "global_step": 249673, "epoch": 1486} {"train_loss": -11.315454483032227, "global_step": 249674, "epoch": 1486} {"train_loss": -11.16756534576416, "global_step": 249675, "epoch": 1486} {"train_loss": -11.552619934082031, "global_step": 249676, "epoch": 1486} {"train_loss": -11.17813491821289, "global_step": 249677, "epoch": 1486} {"train_loss": -11.39610481262207, "global_step": 249678, "epoch": 1486} {"train_loss": -11.539856910705566, "global_step": 249679, "epoch": 1486} {"train_loss": -10.882732391357422, "global_step": 249680, "epoch": 1486} {"train_loss": -11.460222244262695, "global_step": 249681, "epoch": 1486} {"train_loss": -11.402481079101562, "global_step": 249682, "epoch": 1486} {"train_loss": -11.544258117675781, "global_step": 249683, "epoch": 1486} {"train_loss": -11.525459289550781, "global_step": 249684, "epoch": 1486} {"train_loss": -11.250362396240234, "global_step": 249685, "epoch": 1486} {"train_loss": -11.525436401367188, "global_step": 249686, "epoch": 1486} {"train_loss": -11.429792404174805, "global_step": 249687, "epoch": 1486} {"train_loss": -11.725818634033203, "global_step": 249688, "epoch": 1486} {"train_loss": -11.825061798095703, "global_step": 249689, "epoch": 1486} {"train_loss": -11.581136703491211, "global_step": 249690, "epoch": 1486} {"train_loss": -11.602227210998535, "global_step": 249691, "epoch": 1486} {"train_loss": -11.6575927734375, "global_step": 249692, "epoch": 1486} {"train_loss": -11.528716087341309, "global_step": 249693, "epoch": 1486} {"train_loss": -11.793516159057617, "global_step": 249694, "epoch": 1486} {"train_loss": -11.739659309387207, "global_step": 249695, "epoch": 1486} {"train_loss": -11.736227035522461, "global_step": 249696, "epoch": 1486} {"train_loss": -11.876070022583008, "global_step": 249697, "epoch": 1486} {"train_loss": -11.614673614501953, "global_step": 249698, "epoch": 1486} {"train_loss": -11.610937118530273, "global_step": 249699, "epoch": 1486} {"train_loss": -11.510784149169922, "global_step": 249700, "epoch": 1486} {"train_loss": -11.445931434631348, "global_step": 249701, "epoch": 1486} {"train_loss": -11.718860626220703, "global_step": 249702, "epoch": 1486} {"train_loss": -11.663627624511719, "global_step": 249703, "epoch": 1486} {"train_loss": -11.470142364501953, "global_step": 249704, "epoch": 1486} {"train_loss": -11.898862838745117, "global_step": 249705, "epoch": 1486} {"train_loss": -11.346936225891113, "global_step": 249706, "epoch": 1486} {"train_loss": -11.768045425415039, "global_step": 249707, "epoch": 1486} {"train_loss": -11.403993606567383, "global_step": 249708, "epoch": 1486} {"train_loss": -11.621404647827148, "global_step": 249709, "epoch": 1486} {"train_loss": -11.556169509887695, "global_step": 249710, "epoch": 1486} {"train_loss": -11.872005462646484, "global_step": 249711, "epoch": 1486} {"train_loss": -11.815082550048828, "global_step": 249712, "epoch": 1486} {"train_loss": -11.423032760620117, "global_step": 249713, "epoch": 1486} {"train_loss": -11.688814163208008, "global_step": 249714, "epoch": 1486} {"train_loss": -11.599689483642578, "global_step": 249715, "epoch": 1486} {"train_loss": -11.73471450805664, "global_step": 249716, "epoch": 1486} {"train_loss": -11.506383895874023, "global_step": 249717, "epoch": 1486} {"train_loss": -11.396934509277344, "global_step": 249718, "epoch": 1486} {"train_loss": -11.485764503479004, "global_step": 249719, "epoch": 1486} {"train_loss": -11.325839042663574, "global_step": 249720, "epoch": 1486} {"train_loss": -11.892487525939941, "global_step": 249721, "epoch": 1486} {"train_loss": -11.553608894348145, "global_step": 249722, "epoch": 1486} {"train_loss": -11.68222427368164, "global_step": 249723, "epoch": 1486} {"train_loss": -11.813535690307617, "global_step": 249724, "epoch": 1486} {"train_loss": -10.221888542175293, "global_step": 249725, "epoch": 1486} {"train_loss": -11.768949508666992, "global_step": 249726, "epoch": 1486} {"train_loss": -11.376784324645996, "global_step": 249727, "epoch": 1486} {"train_loss": -11.059624671936035, "global_step": 249728, "epoch": 1486} {"train_loss": -11.63563346862793, "global_step": 249729, "epoch": 1486} {"train_loss": -11.155908584594727, "global_step": 249730, "epoch": 1486} {"train_loss": -11.71566390991211, "global_step": 249731, "epoch": 1486} {"train_loss": -11.597674369812012, "global_step": 249732, "epoch": 1486} {"train_loss": -11.47451114654541, "global_step": 249733, "epoch": 1486} {"train_loss": -11.886009216308594, "global_step": 249734, "epoch": 1486} {"train_loss": -11.646228790283203, "global_step": 249735, "epoch": 1486} {"train_loss": -11.477235794067383, "global_step": 249736, "epoch": 1486} {"train_loss": -11.406700134277344, "global_step": 249737, "epoch": 1486} {"train_loss": -11.666301727294922, "global_step": 249738, "epoch": 1486} {"train_loss": -11.467071533203125, "global_step": 249739, "epoch": 1486} {"train_loss": -11.55911922454834, "global_step": 249740, "epoch": 1486} {"train_loss": -11.907939910888672, "global_step": 249741, "epoch": 1486} {"train_loss": -11.389022827148438, "global_step": 249742, "epoch": 1486} {"train_loss": -11.309688568115234, "global_step": 249743, "epoch": 1486} {"train_loss": -11.626453399658203, "global_step": 249744, "epoch": 1486} {"train_loss": -11.89211654663086, "global_step": 249745, "epoch": 1486} {"train_loss": -11.567449569702148, "global_step": 249746, "epoch": 1486} {"train_loss": -11.701896667480469, "global_step": 249747, "epoch": 1486} {"train_loss": -11.902503967285156, "global_step": 249748, "epoch": 1486} {"train_loss": -11.393895149230957, "global_step": 249749, "epoch": 1486} {"train_loss": -11.990326881408691, "global_step": 249750, "epoch": 1486} {"train_loss": -11.839303970336914, "global_step": 249751, "epoch": 1486} {"train_loss": -11.691972732543945, "global_step": 249752, "epoch": 1486} {"train_loss": -11.88707160949707, "global_step": 249753, "epoch": 1486} {"train_loss": -11.86435317993164, "global_step": 249754, "epoch": 1486} {"train_loss": -11.71356201171875, "global_step": 249755, "epoch": 1486} {"train_loss": -12.115556716918945, "global_step": 249756, "epoch": 1486} {"train_loss": -11.724529266357422, "global_step": 249757, "epoch": 1486} {"train_loss": -12.104413986206055, "global_step": 249758, "epoch": 1486} {"train_loss": -11.86581039428711, "global_step": 249759, "epoch": 1486} {"train_loss": -11.865511894226074, "global_step": 249760, "epoch": 1486} {"train_loss": -11.525894165039062, "global_step": 249761, "epoch": 1486} {"train_loss": -11.932744979858398, "global_step": 249762, "epoch": 1486} {"train_loss": -12.084138870239258, "global_step": 249763, "epoch": 1486} {"train_loss": -11.894922256469727, "global_step": 249764, "epoch": 1486} {"train_loss": -12.08297061920166, "global_step": 249765, "epoch": 1486} {"train_loss": -12.061784744262695, "global_step": 249766, "epoch": 1486} {"train_loss": -12.070758819580078, "global_step": 249767, "epoch": 1486} {"train_loss": -12.186944007873535, "global_step": 249768, "epoch": 1486} {"train_loss": -11.65678882598877, "global_step": 249769, "epoch": 1486} {"train_loss": -11.552949905395508, "global_step": 249770, "epoch": 1486} {"train_loss": -11.742624282836914, "global_step": 249771, "epoch": 1486} {"train_loss": -11.982754707336426, "global_step": 249772, "epoch": 1486} {"train_loss": -11.184492111206055, "global_step": 249773, "epoch": 1486} {"train_loss": -11.440216064453125, "global_step": 249774, "epoch": 1486} {"train_loss": -11.453067779541016, "global_step": 249775, "epoch": 1486} {"train_loss": -10.02077579498291, "global_step": 249776, "epoch": 1486} {"train_loss": -11.806333541870117, "global_step": 249777, "epoch": 1486} {"train_loss": -11.967344284057617, "global_step": 249778, "epoch": 1486} {"train_loss": -10.775554656982422, "global_step": 249779, "epoch": 1486} {"train_loss": -11.314029693603516, "global_step": 249780, "epoch": 1486} {"train_loss": -11.288272857666016, "global_step": 249781, "epoch": 1486} {"train_loss": -9.793283462524414, "global_step": 249782, "epoch": 1486} {"train_loss": -11.074816703796387, "global_step": 249783, "epoch": 1486} {"train_loss": -11.50073528289795, "global_step": 249784, "epoch": 1486} {"train_loss": -10.764939308166504, "global_step": 249785, "epoch": 1486} {"train_loss": -11.564777374267578, "global_step": 249786, "epoch": 1486} {"train_loss": -10.457069396972656, "global_step": 249787, "epoch": 1486} {"train_loss": -10.403785705566406, "global_step": 249788, "epoch": 1486} {"train_loss": -10.005186080932617, "global_step": 249789, "epoch": 1486} {"train_loss": -10.163930892944336, "global_step": 249790, "epoch": 1486} {"train_loss": -9.947168350219727, "global_step": 249791, "epoch": 1486} {"train_loss": -10.334585189819336, "global_step": 249792, "epoch": 1486} {"train_loss": -10.394807815551758, "global_step": 249793, "epoch": 1486} {"train_loss": -11.32828426361084, "global_step": 249794, "epoch": 1486} {"train_loss": -10.263686180114746, "global_step": 249795, "epoch": 1486} {"train_loss": -10.504676818847656, "global_step": 249796, "epoch": 1486} {"train_loss": -10.613018035888672, "global_step": 249797, "epoch": 1486} {"train_loss": -10.283490180969238, "global_step": 249798, "epoch": 1486} {"train_loss": -11.405147552490234, "global_step": 249799, "epoch": 1486} {"train_loss": -10.110124588012695, "global_step": 249800, "epoch": 1486} {"train_loss": -11.313831329345703, "global_step": 249801, "epoch": 1486} {"train_loss": -10.637271881103516, "global_step": 249802, "epoch": 1486} {"train_loss": -10.86065673828125, "global_step": 249803, "epoch": 1486} {"train_loss": -11.210095405578613, "global_step": 249804, "epoch": 1486} {"train_loss": -11.203496932983398, "global_step": 249805, "epoch": 1486} {"train_loss": -11.283366203308105, "global_step": 249806, "epoch": 1486} {"train_loss": -11.422866821289062, "global_step": 249807, "epoch": 1486} {"train_loss": -11.208364486694336, "global_step": 249808, "epoch": 1486} {"train_loss": -11.73678970336914, "global_step": 249809, "epoch": 1486} {"train_loss": -11.106033325195312, "global_step": 249810, "epoch": 1486} {"train_loss": -11.594622611999512, "global_step": 249811, "epoch": 1486} {"train_loss": -11.576950073242188, "global_step": 249812, "epoch": 1486} {"train_loss": -11.223955154418945, "global_step": 249813, "epoch": 1486} {"train_loss": -11.567081451416016, "global_step": 249814, "epoch": 1486} {"train_loss": -11.349531627836681, "global_step": 249815, "epoch": 1486, "val_loss": 271395.34375} {"train_loss": -11.382978439331055, "global_step": 249816, "epoch": 1487} {"train_loss": -11.510092735290527, "global_step": 249817, "epoch": 1487} {"train_loss": -11.065084457397461, "global_step": 249818, "epoch": 1487} {"train_loss": -11.621965408325195, "global_step": 249819, "epoch": 1487} {"train_loss": -11.182779312133789, "global_step": 249820, "epoch": 1487} {"train_loss": -11.341361999511719, "global_step": 249821, "epoch": 1487} {"train_loss": -11.653825759887695, "global_step": 249822, "epoch": 1487} {"train_loss": -11.069233894348145, "global_step": 249823, "epoch": 1487} {"train_loss": -11.664630889892578, "global_step": 249824, "epoch": 1487} {"train_loss": -11.421882629394531, "global_step": 249825, "epoch": 1487} {"train_loss": -11.75600814819336, "global_step": 249826, "epoch": 1487} {"train_loss": -11.595520973205566, "global_step": 249827, "epoch": 1487} {"train_loss": -11.5550537109375, "global_step": 249828, "epoch": 1487} {"train_loss": -11.998113632202148, "global_step": 249829, "epoch": 1487} {"train_loss": -11.799436569213867, "global_step": 249830, "epoch": 1487} {"train_loss": -11.594789505004883, "global_step": 249831, "epoch": 1487} {"train_loss": -11.780863761901855, "global_step": 249832, "epoch": 1487} {"train_loss": -11.601770401000977, "global_step": 249833, "epoch": 1487} {"train_loss": -11.727331161499023, "global_step": 249834, "epoch": 1487} {"train_loss": -11.808971405029297, "global_step": 249835, "epoch": 1487} {"train_loss": -11.730199813842773, "global_step": 249836, "epoch": 1487} {"train_loss": -11.846875190734863, "global_step": 249837, "epoch": 1487} {"train_loss": -11.738449096679688, "global_step": 249838, "epoch": 1487} {"train_loss": -11.864261627197266, "global_step": 249839, "epoch": 1487} {"train_loss": -11.58132266998291, "global_step": 249840, "epoch": 1487} {"train_loss": -11.875465393066406, "global_step": 249841, "epoch": 1487} {"train_loss": -11.778521537780762, "global_step": 249842, "epoch": 1487} {"train_loss": -11.711389541625977, "global_step": 249843, "epoch": 1487} {"train_loss": -11.835674285888672, "global_step": 249844, "epoch": 1487} {"train_loss": -12.09555721282959, "global_step": 249845, "epoch": 1487} {"train_loss": -11.84231185913086, "global_step": 249846, "epoch": 1487} {"train_loss": -11.829599380493164, "global_step": 249847, "epoch": 1487} {"train_loss": -12.099388122558594, "global_step": 249848, "epoch": 1487} {"train_loss": -11.726377487182617, "global_step": 249849, "epoch": 1487} {"train_loss": -11.895513534545898, "global_step": 249850, "epoch": 1487} {"train_loss": -11.947320938110352, "global_step": 249851, "epoch": 1487} {"train_loss": -12.00578498840332, "global_step": 249852, "epoch": 1487} {"train_loss": -11.962882041931152, "global_step": 249853, "epoch": 1487} {"train_loss": -11.895392417907715, "global_step": 249854, "epoch": 1487} {"train_loss": -11.911962509155273, "global_step": 249855, "epoch": 1487} {"train_loss": -11.937010765075684, "global_step": 249856, "epoch": 1487} {"train_loss": -11.70884895324707, "global_step": 249857, "epoch": 1487} {"train_loss": -11.6336669921875, "global_step": 249858, "epoch": 1487} {"train_loss": -11.577146530151367, "global_step": 249859, "epoch": 1487} {"train_loss": -11.826504707336426, "global_step": 249860, "epoch": 1487} {"train_loss": -12.130987167358398, "global_step": 249861, "epoch": 1487} {"train_loss": -11.576169967651367, "global_step": 249862, "epoch": 1487} {"train_loss": -11.730213165283203, "global_step": 249863, "epoch": 1487} {"train_loss": -11.635339736938477, "global_step": 249864, "epoch": 1487} {"train_loss": -11.355226516723633, "global_step": 249865, "epoch": 1487} {"train_loss": -10.963113784790039, "global_step": 249866, "epoch": 1487} {"train_loss": -11.375945091247559, "global_step": 249867, "epoch": 1487} {"train_loss": -11.500574111938477, "global_step": 249868, "epoch": 1487} {"train_loss": -11.335586547851562, "global_step": 249869, "epoch": 1487} {"train_loss": -11.589386940002441, "global_step": 249870, "epoch": 1487} {"train_loss": -11.744245529174805, "global_step": 249871, "epoch": 1487} {"train_loss": -12.003995895385742, "global_step": 249872, "epoch": 1487} {"train_loss": -11.766484260559082, "global_step": 249873, "epoch": 1487} {"train_loss": -11.895142555236816, "global_step": 249874, "epoch": 1487} {"train_loss": -11.722879409790039, "global_step": 249875, "epoch": 1487} {"train_loss": -11.848626136779785, "global_step": 249876, "epoch": 1487} {"train_loss": -11.732610702514648, "global_step": 249877, "epoch": 1487} {"train_loss": -11.805998802185059, "global_step": 249878, "epoch": 1487} {"train_loss": -11.54569149017334, "global_step": 249879, "epoch": 1487} {"train_loss": -11.129663467407227, "global_step": 249880, "epoch": 1487} {"train_loss": -11.739242553710938, "global_step": 249881, "epoch": 1487} {"train_loss": -11.921765327453613, "global_step": 249882, "epoch": 1487} {"train_loss": -11.931716918945312, "global_step": 249883, "epoch": 1487} {"train_loss": -12.043246269226074, "global_step": 249884, "epoch": 1487} {"train_loss": -11.51679515838623, "global_step": 249885, "epoch": 1487} {"train_loss": -12.033203125, "global_step": 249886, "epoch": 1487} {"train_loss": -12.045246124267578, "global_step": 249887, "epoch": 1487} {"train_loss": -12.061107635498047, "global_step": 249888, "epoch": 1487} {"train_loss": -12.033646583557129, "global_step": 249889, "epoch": 1487} {"train_loss": -12.153152465820312, "global_step": 249890, "epoch": 1487} {"train_loss": -12.072315216064453, "global_step": 249891, "epoch": 1487} {"train_loss": -11.998434066772461, "global_step": 249892, "epoch": 1487} {"train_loss": -12.162766456604004, "global_step": 249893, "epoch": 1487} {"train_loss": -11.932108879089355, "global_step": 249894, "epoch": 1487} {"train_loss": -12.010749816894531, "global_step": 249895, "epoch": 1487} {"train_loss": -12.04920768737793, "global_step": 249896, "epoch": 1487} {"train_loss": -12.081705093383789, "global_step": 249897, "epoch": 1487} {"train_loss": -11.711185455322266, "global_step": 249898, "epoch": 1487} {"train_loss": -11.917266845703125, "global_step": 249899, "epoch": 1487} {"train_loss": -12.17206859588623, "global_step": 249900, "epoch": 1487} {"train_loss": -11.776385307312012, "global_step": 249901, "epoch": 1487} {"train_loss": -12.0697021484375, "global_step": 249902, "epoch": 1487} {"train_loss": -12.105236053466797, "global_step": 249903, "epoch": 1487} {"train_loss": -11.831775665283203, "global_step": 249904, "epoch": 1487} {"train_loss": -11.642149925231934, "global_step": 249905, "epoch": 1487} {"train_loss": -11.825386047363281, "global_step": 249906, "epoch": 1487} {"train_loss": -11.697839736938477, "global_step": 249907, "epoch": 1487} {"train_loss": -11.715437889099121, "global_step": 249908, "epoch": 1487} {"train_loss": -11.619806289672852, "global_step": 249909, "epoch": 1487} {"train_loss": -11.109766006469727, "global_step": 249910, "epoch": 1487} {"train_loss": -11.357269287109375, "global_step": 249911, "epoch": 1487} {"train_loss": -11.81798267364502, "global_step": 249912, "epoch": 1487} {"train_loss": -10.38035774230957, "global_step": 249913, "epoch": 1487} {"train_loss": -10.150896072387695, "global_step": 249914, "epoch": 1487} {"train_loss": -11.381561279296875, "global_step": 249915, "epoch": 1487} {"train_loss": -9.334901809692383, "global_step": 249916, "epoch": 1487} {"train_loss": -9.9896240234375, "global_step": 249917, "epoch": 1487} {"train_loss": -10.701948165893555, "global_step": 249918, "epoch": 1487} {"train_loss": -8.963363647460938, "global_step": 249919, "epoch": 1487} {"train_loss": -9.753973960876465, "global_step": 249920, "epoch": 1487} {"train_loss": -10.31843376159668, "global_step": 249921, "epoch": 1487} {"train_loss": -9.416417121887207, "global_step": 249922, "epoch": 1487} {"train_loss": -9.65605354309082, "global_step": 249923, "epoch": 1487} {"train_loss": -9.569404602050781, "global_step": 249924, "epoch": 1487} {"train_loss": -10.767838478088379, "global_step": 249925, "epoch": 1487} {"train_loss": -10.50903034210205, "global_step": 249926, "epoch": 1487} {"train_loss": -10.177043914794922, "global_step": 249927, "epoch": 1487} {"train_loss": -10.664960861206055, "global_step": 249928, "epoch": 1487} {"train_loss": -9.517824172973633, "global_step": 249929, "epoch": 1487} {"train_loss": -10.733793258666992, "global_step": 249930, "epoch": 1487} {"train_loss": -9.275270462036133, "global_step": 249931, "epoch": 1487} {"train_loss": -8.889925003051758, "global_step": 249932, "epoch": 1487} {"train_loss": -9.36309814453125, "global_step": 249933, "epoch": 1487} {"train_loss": -10.082609176635742, "global_step": 249934, "epoch": 1487} {"train_loss": -9.17445182800293, "global_step": 249935, "epoch": 1487} {"train_loss": -10.539992332458496, "global_step": 249936, "epoch": 1487} {"train_loss": -10.234792709350586, "global_step": 249937, "epoch": 1487} {"train_loss": -9.441034317016602, "global_step": 249938, "epoch": 1487} {"train_loss": -11.17786693572998, "global_step": 249939, "epoch": 1487} {"train_loss": -10.53009033203125, "global_step": 249940, "epoch": 1487} {"train_loss": -9.798164367675781, "global_step": 249941, "epoch": 1487} {"train_loss": -11.126019477844238, "global_step": 249942, "epoch": 1487} {"train_loss": -10.940496444702148, "global_step": 249943, "epoch": 1487} {"train_loss": -10.105867385864258, "global_step": 249944, "epoch": 1487} {"train_loss": -11.497194290161133, "global_step": 249945, "epoch": 1487} {"train_loss": -11.05587387084961, "global_step": 249946, "epoch": 1487} {"train_loss": -10.689491271972656, "global_step": 249947, "epoch": 1487} {"train_loss": -11.483251571655273, "global_step": 249948, "epoch": 1487} {"train_loss": -11.145017623901367, "global_step": 249949, "epoch": 1487} {"train_loss": -10.627396583557129, "global_step": 249950, "epoch": 1487} {"train_loss": -11.103490829467773, "global_step": 249951, "epoch": 1487} {"train_loss": -11.025331497192383, "global_step": 249952, "epoch": 1487} {"train_loss": -10.994378089904785, "global_step": 249953, "epoch": 1487} {"train_loss": -11.244641304016113, "global_step": 249954, "epoch": 1487} {"train_loss": -11.26447582244873, "global_step": 249955, "epoch": 1487} {"train_loss": -10.836065292358398, "global_step": 249956, "epoch": 1487} {"train_loss": -11.245049476623535, "global_step": 249957, "epoch": 1487} {"train_loss": -11.24085807800293, "global_step": 249958, "epoch": 1487} {"train_loss": -10.935447692871094, "global_step": 249959, "epoch": 1487} {"train_loss": -10.952567100524902, "global_step": 249960, "epoch": 1487} {"train_loss": -11.639697074890137, "global_step": 249961, "epoch": 1487} {"train_loss": -10.980958938598633, "global_step": 249962, "epoch": 1487} {"train_loss": -11.298674583435059, "global_step": 249963, "epoch": 1487} {"train_loss": -11.573817253112793, "global_step": 249964, "epoch": 1487} {"train_loss": -11.227651596069336, "global_step": 249965, "epoch": 1487} {"train_loss": -11.579411506652832, "global_step": 249966, "epoch": 1487} {"train_loss": -11.525947570800781, "global_step": 249967, "epoch": 1487} {"train_loss": -11.222423553466797, "global_step": 249968, "epoch": 1487} {"train_loss": -11.45134162902832, "global_step": 249969, "epoch": 1487} {"train_loss": -11.381160736083984, "global_step": 249970, "epoch": 1487} {"train_loss": -11.067060470581055, "global_step": 249971, "epoch": 1487} {"train_loss": -11.652329444885254, "global_step": 249972, "epoch": 1487} {"train_loss": -11.641985893249512, "global_step": 249973, "epoch": 1487} {"train_loss": -11.528427124023438, "global_step": 249974, "epoch": 1487} {"train_loss": -11.551803588867188, "global_step": 249975, "epoch": 1487} {"train_loss": -11.792430877685547, "global_step": 249976, "epoch": 1487} {"train_loss": -11.64599895477295, "global_step": 249977, "epoch": 1487} {"train_loss": -11.619720458984375, "global_step": 249978, "epoch": 1487} {"train_loss": -11.68998908996582, "global_step": 249979, "epoch": 1487} {"train_loss": -11.639850616455078, "global_step": 249980, "epoch": 1487} {"train_loss": -11.471603393554688, "global_step": 249981, "epoch": 1487} {"train_loss": -11.711176872253418, "global_step": 249982, "epoch": 1487} {"train_loss": -11.334194540977478, "global_step": 249983, "epoch": 1487, "val_loss": 267952.03125} {"train_loss": -11.572492599487305, "global_step": 249984, "epoch": 1488} {"train_loss": -11.820398330688477, "global_step": 249985, "epoch": 1488} {"train_loss": -11.768123626708984, "global_step": 249986, "epoch": 1488} {"train_loss": -11.787680625915527, "global_step": 249987, "epoch": 1488} {"train_loss": -11.761027336120605, "global_step": 249988, "epoch": 1488} {"train_loss": -11.992171287536621, "global_step": 249989, "epoch": 1488} {"train_loss": -11.90784740447998, "global_step": 249990, "epoch": 1488} {"train_loss": -11.838079452514648, "global_step": 249991, "epoch": 1488} {"train_loss": -11.875446319580078, "global_step": 249992, "epoch": 1488} {"train_loss": -12.031173706054688, "global_step": 249993, "epoch": 1488} {"train_loss": -11.887541770935059, "global_step": 249994, "epoch": 1488} {"train_loss": -11.61781120300293, "global_step": 249995, "epoch": 1488} {"train_loss": -11.919656753540039, "global_step": 249996, "epoch": 1488} {"train_loss": -11.873021125793457, "global_step": 249997, "epoch": 1488} {"train_loss": -12.013651847839355, "global_step": 249998, "epoch": 1488} {"train_loss": -12.046876907348633, "global_step": 249999, "epoch": 1488} {"train_loss": -11.97183609008789, "global_step": 250000, "epoch": 1488} {"train_loss": -11.95936107635498, "global_step": 250001, "epoch": 1488} {"train_loss": -12.200105667114258, "global_step": 250002, "epoch": 1488} {"train_loss": -12.061357498168945, "global_step": 250003, "epoch": 1488} {"train_loss": -11.898862838745117, "global_step": 250004, "epoch": 1488} {"train_loss": -12.105722427368164, "global_step": 250005, "epoch": 1488} {"train_loss": -12.021530151367188, "global_step": 250006, "epoch": 1488} {"train_loss": -11.931133270263672, "global_step": 250007, "epoch": 1488} {"train_loss": -11.975811004638672, "global_step": 250008, "epoch": 1488} {"train_loss": -11.95012092590332, "global_step": 250009, "epoch": 1488} {"train_loss": -12.002317428588867, "global_step": 250010, "epoch": 1488} {"train_loss": -12.075332641601562, "global_step": 250011, "epoch": 1488} {"train_loss": -12.072586059570312, "global_step": 250012, "epoch": 1488} {"train_loss": -11.941879272460938, "global_step": 250013, "epoch": 1488} {"train_loss": -11.99923324584961, "global_step": 250014, "epoch": 1488} {"train_loss": -12.27170181274414, "global_step": 250015, "epoch": 1488} {"train_loss": -12.097795486450195, "global_step": 250016, "epoch": 1488} {"train_loss": -12.134137153625488, "global_step": 250017, "epoch": 1488} {"train_loss": -12.034317970275879, "global_step": 250018, "epoch": 1488} {"train_loss": -12.063953399658203, "global_step": 250019, "epoch": 1488} {"train_loss": -11.84709358215332, "global_step": 250020, "epoch": 1488} {"train_loss": -12.056694984436035, "global_step": 250021, "epoch": 1488} {"train_loss": -11.949962615966797, "global_step": 250022, "epoch": 1488} {"train_loss": -12.184799194335938, "global_step": 250023, "epoch": 1488} {"train_loss": -12.103796005249023, "global_step": 250024, "epoch": 1488} {"train_loss": -12.229129791259766, "global_step": 250025, "epoch": 1488} {"train_loss": -11.929161071777344, "global_step": 250026, "epoch": 1488} {"train_loss": -11.978092193603516, "global_step": 250027, "epoch": 1488} {"train_loss": -11.913891792297363, "global_step": 250028, "epoch": 1488} {"train_loss": -11.993562698364258, "global_step": 250029, "epoch": 1488} {"train_loss": -12.455574989318848, "global_step": 250030, "epoch": 1488} {"train_loss": -12.26024055480957, "global_step": 250031, "epoch": 1488} {"train_loss": -12.359920501708984, "global_step": 250032, "epoch": 1488} {"train_loss": -12.386247634887695, "global_step": 250033, "epoch": 1488} {"train_loss": -12.348129272460938, "global_step": 250034, "epoch": 1488} {"train_loss": -12.077749252319336, "global_step": 250035, "epoch": 1488} {"train_loss": -12.252099990844727, "global_step": 250036, "epoch": 1488} {"train_loss": -12.224023818969727, "global_step": 250037, "epoch": 1488} {"train_loss": -12.01988410949707, "global_step": 250038, "epoch": 1488} {"train_loss": -12.124500274658203, "global_step": 250039, "epoch": 1488} {"train_loss": -11.837154388427734, "global_step": 250040, "epoch": 1488} {"train_loss": -12.016437530517578, "global_step": 250041, "epoch": 1488} {"train_loss": -11.58013916015625, "global_step": 250042, "epoch": 1488} {"train_loss": -11.70028305053711, "global_step": 250043, "epoch": 1488} {"train_loss": -11.021203994750977, "global_step": 250044, "epoch": 1488} {"train_loss": -11.627473831176758, "global_step": 250045, "epoch": 1488} {"train_loss": -11.345071792602539, "global_step": 250046, "epoch": 1488} {"train_loss": -11.712525367736816, "global_step": 250047, "epoch": 1488} {"train_loss": -11.217546463012695, "global_step": 250048, "epoch": 1488} {"train_loss": -9.648467063903809, "global_step": 250049, "epoch": 1488} {"train_loss": -8.941366195678711, "global_step": 250050, "epoch": 1488} {"train_loss": -10.022392272949219, "global_step": 250051, "epoch": 1488} {"train_loss": -9.87004280090332, "global_step": 250052, "epoch": 1488} {"train_loss": -10.145463943481445, "global_step": 250053, "epoch": 1488} {"train_loss": -9.421019554138184, "global_step": 250054, "epoch": 1488} {"train_loss": -11.064958572387695, "global_step": 250055, "epoch": 1488} {"train_loss": -10.608782768249512, "global_step": 250056, "epoch": 1488} {"train_loss": -11.501337051391602, "global_step": 250057, "epoch": 1488} {"train_loss": -10.276047706604004, "global_step": 250058, "epoch": 1488} {"train_loss": -11.487533569335938, "global_step": 250059, "epoch": 1488} {"train_loss": -10.72500228881836, "global_step": 250060, "epoch": 1488} {"train_loss": -9.256219863891602, "global_step": 250061, "epoch": 1488} {"train_loss": -11.085254669189453, "global_step": 250062, "epoch": 1488} {"train_loss": -11.036628723144531, "global_step": 250063, "epoch": 1488} {"train_loss": -11.091522216796875, "global_step": 250064, "epoch": 1488} {"train_loss": -10.406429290771484, "global_step": 250065, "epoch": 1488} {"train_loss": -10.342497825622559, "global_step": 250066, "epoch": 1488} {"train_loss": -10.492378234863281, "global_step": 250067, "epoch": 1488} {"train_loss": -10.78231143951416, "global_step": 250068, "epoch": 1488} {"train_loss": -11.20268440246582, "global_step": 250069, "epoch": 1488} {"train_loss": -10.93765640258789, "global_step": 250070, "epoch": 1488} {"train_loss": -11.384008407592773, "global_step": 250071, "epoch": 1488} {"train_loss": -11.102275848388672, "global_step": 250072, "epoch": 1488} {"train_loss": -11.520530700683594, "global_step": 250073, "epoch": 1488} {"train_loss": -11.62158203125, "global_step": 250074, "epoch": 1488} {"train_loss": -10.573440551757812, "global_step": 250075, "epoch": 1488} {"train_loss": -11.618563652038574, "global_step": 250076, "epoch": 1488} {"train_loss": -11.133966445922852, "global_step": 250077, "epoch": 1488} {"train_loss": -11.264015197753906, "global_step": 250078, "epoch": 1488} {"train_loss": -11.384420394897461, "global_step": 250079, "epoch": 1488} {"train_loss": -11.15412712097168, "global_step": 250080, "epoch": 1488} {"train_loss": -10.868729591369629, "global_step": 250081, "epoch": 1488} {"train_loss": -10.969151496887207, "global_step": 250082, "epoch": 1488} {"train_loss": -11.187417984008789, "global_step": 250083, "epoch": 1488} {"train_loss": -11.160063743591309, "global_step": 250084, "epoch": 1488} {"train_loss": -10.893892288208008, "global_step": 250085, "epoch": 1488} {"train_loss": -11.457748413085938, "global_step": 250086, "epoch": 1488} {"train_loss": -11.222050666809082, "global_step": 250087, "epoch": 1488} {"train_loss": -11.36251163482666, "global_step": 250088, "epoch": 1488} {"train_loss": -11.422683715820312, "global_step": 250089, "epoch": 1488} {"train_loss": -11.330068588256836, "global_step": 250090, "epoch": 1488} {"train_loss": -11.564491271972656, "global_step": 250091, "epoch": 1488} {"train_loss": -11.381651878356934, "global_step": 250092, "epoch": 1488} {"train_loss": -11.690685272216797, "global_step": 250093, "epoch": 1488} {"train_loss": -11.470523834228516, "global_step": 250094, "epoch": 1488} {"train_loss": -11.773123741149902, "global_step": 250095, "epoch": 1488} {"train_loss": -11.517633438110352, "global_step": 250096, "epoch": 1488} {"train_loss": -11.806573867797852, "global_step": 250097, "epoch": 1488} {"train_loss": -11.770956039428711, "global_step": 250098, "epoch": 1488} {"train_loss": -11.526334762573242, "global_step": 250099, "epoch": 1488} {"train_loss": -11.717403411865234, "global_step": 250100, "epoch": 1488} {"train_loss": -11.837596893310547, "global_step": 250101, "epoch": 1488} {"train_loss": -11.444902420043945, "global_step": 250102, "epoch": 1488} {"train_loss": -11.943151473999023, "global_step": 250103, "epoch": 1488} {"train_loss": -11.545011520385742, "global_step": 250104, "epoch": 1488} {"train_loss": -12.041252136230469, "global_step": 250105, "epoch": 1488} {"train_loss": -11.589485168457031, "global_step": 250106, "epoch": 1488} {"train_loss": -11.790024757385254, "global_step": 250107, "epoch": 1488} {"train_loss": -11.755592346191406, "global_step": 250108, "epoch": 1488} {"train_loss": -11.578432083129883, "global_step": 250109, "epoch": 1488} {"train_loss": -11.882104873657227, "global_step": 250110, "epoch": 1488} {"train_loss": -11.283199310302734, "global_step": 250111, "epoch": 1488} {"train_loss": -11.625842094421387, "global_step": 250112, "epoch": 1488} {"train_loss": -11.563599586486816, "global_step": 250113, "epoch": 1488} {"train_loss": -11.663566589355469, "global_step": 250114, "epoch": 1488} {"train_loss": -11.515884399414062, "global_step": 250115, "epoch": 1488} {"train_loss": -11.789060592651367, "global_step": 250116, "epoch": 1488} {"train_loss": -11.625417709350586, "global_step": 250117, "epoch": 1488} {"train_loss": -11.442888259887695, "global_step": 250118, "epoch": 1488} {"train_loss": -11.715113639831543, "global_step": 250119, "epoch": 1488} {"train_loss": -11.786746978759766, "global_step": 250120, "epoch": 1488} {"train_loss": -11.717633247375488, "global_step": 250121, "epoch": 1488} {"train_loss": -11.804197311401367, "global_step": 250122, "epoch": 1488} {"train_loss": -11.640127182006836, "global_step": 250123, "epoch": 1488} {"train_loss": -11.727008819580078, "global_step": 250124, "epoch": 1488} {"train_loss": -11.508909225463867, "global_step": 250125, "epoch": 1488} {"train_loss": -11.486324310302734, "global_step": 250126, "epoch": 1488} {"train_loss": -11.37087631225586, "global_step": 250127, "epoch": 1488} {"train_loss": -11.768499374389648, "global_step": 250128, "epoch": 1488} {"train_loss": -11.150604248046875, "global_step": 250129, "epoch": 1488} {"train_loss": -11.53115463256836, "global_step": 250130, "epoch": 1488} {"train_loss": -11.166707038879395, "global_step": 250131, "epoch": 1488} {"train_loss": -11.210882186889648, "global_step": 250132, "epoch": 1488} {"train_loss": -11.440013885498047, "global_step": 250133, "epoch": 1488} {"train_loss": -11.52616024017334, "global_step": 250134, "epoch": 1488} {"train_loss": -11.58726692199707, "global_step": 250135, "epoch": 1488} {"train_loss": -11.294920921325684, "global_step": 250136, "epoch": 1488} {"train_loss": -11.870048522949219, "global_step": 250137, "epoch": 1488} {"train_loss": -11.824362754821777, "global_step": 250138, "epoch": 1488} {"train_loss": -11.687577247619629, "global_step": 250139, "epoch": 1488} {"train_loss": -11.777472496032715, "global_step": 250140, "epoch": 1488} {"train_loss": -11.818153381347656, "global_step": 250141, "epoch": 1488} {"train_loss": -11.881322860717773, "global_step": 250142, "epoch": 1488} {"train_loss": -11.678176879882812, "global_step": 250143, "epoch": 1488} {"train_loss": -11.483083724975586, "global_step": 250144, "epoch": 1488} {"train_loss": -11.672773361206055, "global_step": 250145, "epoch": 1488} {"train_loss": -11.630383491516113, "global_step": 250146, "epoch": 1488} {"train_loss": -12.052935600280762, "global_step": 250147, "epoch": 1488} {"train_loss": -11.56450366973877, "global_step": 250148, "epoch": 1488} {"train_loss": -11.961114883422852, "global_step": 250149, "epoch": 1488} {"train_loss": -11.903030395507812, "global_step": 250150, "epoch": 1488} {"train_loss": -11.561974797930036, "global_step": 250151, "epoch": 1488, "val_loss": 270777.03125} {"train_loss": -11.89024543762207, "global_step": 250152, "epoch": 1489} {"train_loss": -11.9716157913208, "global_step": 250153, "epoch": 1489} {"train_loss": -11.304134368896484, "global_step": 250154, "epoch": 1489} {"train_loss": -11.321752548217773, "global_step": 250155, "epoch": 1489} {"train_loss": -11.876191139221191, "global_step": 250156, "epoch": 1489} {"train_loss": -11.436266899108887, "global_step": 250157, "epoch": 1489} {"train_loss": -11.965704917907715, "global_step": 250158, "epoch": 1489} {"train_loss": -11.324952125549316, "global_step": 250159, "epoch": 1489} {"train_loss": -11.817365646362305, "global_step": 250160, "epoch": 1489} {"train_loss": -11.633662223815918, "global_step": 250161, "epoch": 1489} {"train_loss": -11.711261749267578, "global_step": 250162, "epoch": 1489} {"train_loss": -11.921302795410156, "global_step": 250163, "epoch": 1489} {"train_loss": -11.830118179321289, "global_step": 250164, "epoch": 1489} {"train_loss": -11.942989349365234, "global_step": 250165, "epoch": 1489} {"train_loss": -12.14423942565918, "global_step": 250166, "epoch": 1489} {"train_loss": -11.804590225219727, "global_step": 250167, "epoch": 1489} {"train_loss": -11.687492370605469, "global_step": 250168, "epoch": 1489} {"train_loss": -12.153043746948242, "global_step": 250169, "epoch": 1489} {"train_loss": -12.154585838317871, "global_step": 250170, "epoch": 1489} {"train_loss": -11.939325332641602, "global_step": 250171, "epoch": 1489} {"train_loss": -12.087875366210938, "global_step": 250172, "epoch": 1489} {"train_loss": -11.940591812133789, "global_step": 250173, "epoch": 1489} {"train_loss": -12.063739776611328, "global_step": 250174, "epoch": 1489} {"train_loss": -12.377399444580078, "global_step": 250175, "epoch": 1489} {"train_loss": -12.111747741699219, "global_step": 250176, "epoch": 1489} {"train_loss": -12.104995727539062, "global_step": 250177, "epoch": 1489} {"train_loss": -11.996135711669922, "global_step": 250178, "epoch": 1489} {"train_loss": -11.632169723510742, "global_step": 250179, "epoch": 1489} {"train_loss": -12.109420776367188, "global_step": 250180, "epoch": 1489} {"train_loss": -11.966440200805664, "global_step": 250181, "epoch": 1489} {"train_loss": -11.663797378540039, "global_step": 250182, "epoch": 1489} {"train_loss": -11.95068359375, "global_step": 250183, "epoch": 1489} {"train_loss": -11.938904762268066, "global_step": 250184, "epoch": 1489} {"train_loss": -11.749044418334961, "global_step": 250185, "epoch": 1489} {"train_loss": -11.345787048339844, "global_step": 250186, "epoch": 1489} {"train_loss": -11.375341415405273, "global_step": 250187, "epoch": 1489} {"train_loss": -11.872766494750977, "global_step": 250188, "epoch": 1489} {"train_loss": -11.647636413574219, "global_step": 250189, "epoch": 1489} {"train_loss": -10.493429183959961, "global_step": 250190, "epoch": 1489} {"train_loss": -10.96954345703125, "global_step": 250191, "epoch": 1489} {"train_loss": -11.813185691833496, "global_step": 250192, "epoch": 1489} {"train_loss": -11.414450645446777, "global_step": 250193, "epoch": 1489} {"train_loss": -11.443777084350586, "global_step": 250194, "epoch": 1489} {"train_loss": -11.43985366821289, "global_step": 250195, "epoch": 1489} {"train_loss": -11.183557510375977, "global_step": 250196, "epoch": 1489} {"train_loss": -10.870948791503906, "global_step": 250197, "epoch": 1489} {"train_loss": -10.364039421081543, "global_step": 250198, "epoch": 1489} {"train_loss": -10.837878227233887, "global_step": 250199, "epoch": 1489} {"train_loss": -10.23392105102539, "global_step": 250200, "epoch": 1489} {"train_loss": -10.190946578979492, "global_step": 250201, "epoch": 1489} {"train_loss": -9.851962089538574, "global_step": 250202, "epoch": 1489} {"train_loss": -10.57188606262207, "global_step": 250203, "epoch": 1489} {"train_loss": -10.075948715209961, "global_step": 250204, "epoch": 1489} {"train_loss": -8.61794662475586, "global_step": 250205, "epoch": 1489} {"train_loss": -10.230016708374023, "global_step": 250206, "epoch": 1489} {"train_loss": -10.406560897827148, "global_step": 250207, "epoch": 1489} {"train_loss": -9.566238403320312, "global_step": 250208, "epoch": 1489} {"train_loss": -10.962752342224121, "global_step": 250209, "epoch": 1489} {"train_loss": -10.893891334533691, "global_step": 250210, "epoch": 1489} {"train_loss": -10.457758903503418, "global_step": 250211, "epoch": 1489} {"train_loss": -10.641777038574219, "global_step": 250212, "epoch": 1489} {"train_loss": -10.668739318847656, "global_step": 250213, "epoch": 1489} {"train_loss": -10.985128402709961, "global_step": 250214, "epoch": 1489} {"train_loss": -10.005739212036133, "global_step": 250215, "epoch": 1489} {"train_loss": -11.178658485412598, "global_step": 250216, "epoch": 1489} {"train_loss": -10.302359580993652, "global_step": 250217, "epoch": 1489} {"train_loss": -11.384103775024414, "global_step": 250218, "epoch": 1489} {"train_loss": -11.024568557739258, "global_step": 250219, "epoch": 1489} {"train_loss": -11.264144897460938, "global_step": 250220, "epoch": 1489} {"train_loss": -11.13956069946289, "global_step": 250221, "epoch": 1489} {"train_loss": -11.323943138122559, "global_step": 250222, "epoch": 1489} {"train_loss": -11.209453582763672, "global_step": 250223, "epoch": 1489} {"train_loss": -11.599466323852539, "global_step": 250224, "epoch": 1489} {"train_loss": -11.329853057861328, "global_step": 250225, "epoch": 1489} {"train_loss": -11.261523246765137, "global_step": 250226, "epoch": 1489} {"train_loss": -11.560081481933594, "global_step": 250227, "epoch": 1489} {"train_loss": -11.476137161254883, "global_step": 250228, "epoch": 1489} {"train_loss": -11.677618980407715, "global_step": 250229, "epoch": 1489} {"train_loss": -11.594337463378906, "global_step": 250230, "epoch": 1489} {"train_loss": -11.645071029663086, "global_step": 250231, "epoch": 1489} {"train_loss": -11.575840950012207, "global_step": 250232, "epoch": 1489} {"train_loss": -11.726032257080078, "global_step": 250233, "epoch": 1489} {"train_loss": -11.687355041503906, "global_step": 250234, "epoch": 1489} {"train_loss": -11.700955390930176, "global_step": 250235, "epoch": 1489} {"train_loss": -11.778910636901855, "global_step": 250236, "epoch": 1489} {"train_loss": -11.533598899841309, "global_step": 250237, "epoch": 1489} {"train_loss": -11.800933837890625, "global_step": 250238, "epoch": 1489} {"train_loss": -11.749211311340332, "global_step": 250239, "epoch": 1489} {"train_loss": -11.616759300231934, "global_step": 250240, "epoch": 1489} {"train_loss": -11.824738502502441, "global_step": 250241, "epoch": 1489} {"train_loss": -11.526984214782715, "global_step": 250242, "epoch": 1489} {"train_loss": -11.62667465209961, "global_step": 250243, "epoch": 1489} {"train_loss": -11.873964309692383, "global_step": 250244, "epoch": 1489} {"train_loss": -11.646284103393555, "global_step": 250245, "epoch": 1489} {"train_loss": -11.812153816223145, "global_step": 250246, "epoch": 1489} {"train_loss": -11.852622985839844, "global_step": 250247, "epoch": 1489} {"train_loss": -11.636266708374023, "global_step": 250248, "epoch": 1489} {"train_loss": -11.781778335571289, "global_step": 250249, "epoch": 1489} {"train_loss": -11.771156311035156, "global_step": 250250, "epoch": 1489} {"train_loss": -11.909640312194824, "global_step": 250251, "epoch": 1489} {"train_loss": -11.736285209655762, "global_step": 250252, "epoch": 1489} {"train_loss": -11.919211387634277, "global_step": 250253, "epoch": 1489} {"train_loss": -11.836875915527344, "global_step": 250254, "epoch": 1489} {"train_loss": -12.04336166381836, "global_step": 250255, "epoch": 1489} {"train_loss": -12.001197814941406, "global_step": 250256, "epoch": 1489} {"train_loss": -11.846985816955566, "global_step": 250257, "epoch": 1489} {"train_loss": -11.761865615844727, "global_step": 250258, "epoch": 1489} {"train_loss": -11.700722694396973, "global_step": 250259, "epoch": 1489} {"train_loss": -11.882091522216797, "global_step": 250260, "epoch": 1489} {"train_loss": -11.812582015991211, "global_step": 250261, "epoch": 1489} {"train_loss": -12.03872299194336, "global_step": 250262, "epoch": 1489} {"train_loss": -11.956748962402344, "global_step": 250263, "epoch": 1489} {"train_loss": -11.785058975219727, "global_step": 250264, "epoch": 1489} {"train_loss": -11.768085479736328, "global_step": 250265, "epoch": 1489} {"train_loss": -11.910551071166992, "global_step": 250266, "epoch": 1489} {"train_loss": -11.60021686553955, "global_step": 250267, "epoch": 1489} {"train_loss": -11.619338989257812, "global_step": 250268, "epoch": 1489} {"train_loss": -11.67180347442627, "global_step": 250269, "epoch": 1489} {"train_loss": -11.920863151550293, "global_step": 250270, "epoch": 1489} {"train_loss": -11.789690017700195, "global_step": 250271, "epoch": 1489} {"train_loss": -11.895482063293457, "global_step": 250272, "epoch": 1489} {"train_loss": -11.836191177368164, "global_step": 250273, "epoch": 1489} {"train_loss": -12.00696086883545, "global_step": 250274, "epoch": 1489} {"train_loss": -11.917951583862305, "global_step": 250275, "epoch": 1489} {"train_loss": -11.95152473449707, "global_step": 250276, "epoch": 1489} {"train_loss": -11.887592315673828, "global_step": 250277, "epoch": 1489} {"train_loss": -12.000429153442383, "global_step": 250278, "epoch": 1489} {"train_loss": -11.764848709106445, "global_step": 250279, "epoch": 1489} {"train_loss": -11.7818603515625, "global_step": 250280, "epoch": 1489} {"train_loss": -11.957218170166016, "global_step": 250281, "epoch": 1489} {"train_loss": -11.975760459899902, "global_step": 250282, "epoch": 1489} {"train_loss": -11.815925598144531, "global_step": 250283, "epoch": 1489} {"train_loss": -11.921113014221191, "global_step": 250284, "epoch": 1489} {"train_loss": -11.593328475952148, "global_step": 250285, "epoch": 1489} {"train_loss": -11.818550109863281, "global_step": 250286, "epoch": 1489} {"train_loss": -11.793829917907715, "global_step": 250287, "epoch": 1489} {"train_loss": -11.608354568481445, "global_step": 250288, "epoch": 1489} {"train_loss": -11.950096130371094, "global_step": 250289, "epoch": 1489} {"train_loss": -11.3985595703125, "global_step": 250290, "epoch": 1489} {"train_loss": -11.799932479858398, "global_step": 250291, "epoch": 1489} {"train_loss": -11.576191902160645, "global_step": 250292, "epoch": 1489} {"train_loss": -12.185676574707031, "global_step": 250293, "epoch": 1489} {"train_loss": -11.771464347839355, "global_step": 250294, "epoch": 1489} {"train_loss": -11.690555572509766, "global_step": 250295, "epoch": 1489} {"train_loss": -11.798645973205566, "global_step": 250296, "epoch": 1489} {"train_loss": -11.778976440429688, "global_step": 250297, "epoch": 1489} {"train_loss": -11.638923645019531, "global_step": 250298, "epoch": 1489} {"train_loss": -11.377890586853027, "global_step": 250299, "epoch": 1489} {"train_loss": -11.107149124145508, "global_step": 250300, "epoch": 1489} {"train_loss": -11.224555969238281, "global_step": 250301, "epoch": 1489} {"train_loss": -11.662924766540527, "global_step": 250302, "epoch": 1489} {"train_loss": -11.196327209472656, "global_step": 250303, "epoch": 1489} {"train_loss": -11.805953979492188, "global_step": 250304, "epoch": 1489} {"train_loss": -11.097010612487793, "global_step": 250305, "epoch": 1489} {"train_loss": -11.831283569335938, "global_step": 250306, "epoch": 1489} {"train_loss": -11.251440048217773, "global_step": 250307, "epoch": 1489} {"train_loss": -11.641927719116211, "global_step": 250308, "epoch": 1489} {"train_loss": -11.1804780960083, "global_step": 250309, "epoch": 1489} {"train_loss": -11.905547142028809, "global_step": 250310, "epoch": 1489} {"train_loss": -11.638687133789062, "global_step": 250311, "epoch": 1489} {"train_loss": -11.627092361450195, "global_step": 250312, "epoch": 1489} {"train_loss": -11.890046119689941, "global_step": 250313, "epoch": 1489} {"train_loss": -11.556344032287598, "global_step": 250314, "epoch": 1489} {"train_loss": -11.221904754638672, "global_step": 250315, "epoch": 1489} {"train_loss": -11.743952751159668, "global_step": 250316, "epoch": 1489} {"train_loss": -11.60665512084961, "global_step": 250317, "epoch": 1489} {"train_loss": -11.693585395812988, "global_step": 250318, "epoch": 1489} {"train_loss": -11.534458024161202, "global_step": 250319, "epoch": 1489, "val_loss": 265783.875} {"train_loss": -11.583046913146973, "global_step": 250320, "epoch": 1490} {"train_loss": -12.155816078186035, "global_step": 250321, "epoch": 1490} {"train_loss": -11.617111206054688, "global_step": 250322, "epoch": 1490} {"train_loss": -11.720232963562012, "global_step": 250323, "epoch": 1490} {"train_loss": -11.756706237792969, "global_step": 250324, "epoch": 1490} {"train_loss": -11.823134422302246, "global_step": 250325, "epoch": 1490} {"train_loss": -11.869778633117676, "global_step": 250326, "epoch": 1490} {"train_loss": -11.62034797668457, "global_step": 250327, "epoch": 1490} {"train_loss": -11.249153137207031, "global_step": 250328, "epoch": 1490} {"train_loss": -11.421863555908203, "global_step": 250329, "epoch": 1490} {"train_loss": -12.071721076965332, "global_step": 250330, "epoch": 1490} {"train_loss": -11.626679420471191, "global_step": 250331, "epoch": 1490} {"train_loss": -11.691797256469727, "global_step": 250332, "epoch": 1490} {"train_loss": -11.752351760864258, "global_step": 250333, "epoch": 1490} {"train_loss": -11.656726837158203, "global_step": 250334, "epoch": 1490} {"train_loss": -11.492683410644531, "global_step": 250335, "epoch": 1490} {"train_loss": -11.641546249389648, "global_step": 250336, "epoch": 1490} {"train_loss": -10.9536714553833, "global_step": 250337, "epoch": 1490} {"train_loss": -10.092267036437988, "global_step": 250338, "epoch": 1490} {"train_loss": -11.35269546508789, "global_step": 250339, "epoch": 1490} {"train_loss": -11.729990005493164, "global_step": 250340, "epoch": 1490} {"train_loss": -10.860698699951172, "global_step": 250341, "epoch": 1490} {"train_loss": -11.082073211669922, "global_step": 250342, "epoch": 1490} {"train_loss": -10.40703010559082, "global_step": 250343, "epoch": 1490} {"train_loss": -10.928962707519531, "global_step": 250344, "epoch": 1490} {"train_loss": -11.370485305786133, "global_step": 250345, "epoch": 1490} {"train_loss": -10.600430488586426, "global_step": 250346, "epoch": 1490} {"train_loss": -11.613496780395508, "global_step": 250347, "epoch": 1490} {"train_loss": -10.374807357788086, "global_step": 250348, "epoch": 1490} {"train_loss": -11.300342559814453, "global_step": 250349, "epoch": 1490} {"train_loss": -10.35374927520752, "global_step": 250350, "epoch": 1490} {"train_loss": -11.163593292236328, "global_step": 250351, "epoch": 1490} {"train_loss": -11.109722137451172, "global_step": 250352, "epoch": 1490} {"train_loss": -10.777003288269043, "global_step": 250353, "epoch": 1490} {"train_loss": -11.308942794799805, "global_step": 250354, "epoch": 1490} {"train_loss": -10.596002578735352, "global_step": 250355, "epoch": 1490} {"train_loss": -11.156713485717773, "global_step": 250356, "epoch": 1490} {"train_loss": -10.704179763793945, "global_step": 250357, "epoch": 1490} {"train_loss": -10.737871170043945, "global_step": 250358, "epoch": 1490} {"train_loss": -10.974824905395508, "global_step": 250359, "epoch": 1490} {"train_loss": -10.46285343170166, "global_step": 250360, "epoch": 1490} {"train_loss": -11.196590423583984, "global_step": 250361, "epoch": 1490} {"train_loss": -11.22144889831543, "global_step": 250362, "epoch": 1490} {"train_loss": -10.51474380493164, "global_step": 250363, "epoch": 1490} {"train_loss": -11.090156555175781, "global_step": 250364, "epoch": 1490} {"train_loss": -11.327112197875977, "global_step": 250365, "epoch": 1490} {"train_loss": -11.452215194702148, "global_step": 250366, "epoch": 1490} {"train_loss": -11.278332710266113, "global_step": 250367, "epoch": 1490} {"train_loss": -11.443437576293945, "global_step": 250368, "epoch": 1490} {"train_loss": -11.14710807800293, "global_step": 250369, "epoch": 1490} {"train_loss": -11.058389663696289, "global_step": 250370, "epoch": 1490} {"train_loss": -11.627235412597656, "global_step": 250371, "epoch": 1490} {"train_loss": -11.095744132995605, "global_step": 250372, "epoch": 1490} {"train_loss": -11.227789878845215, "global_step": 250373, "epoch": 1490} {"train_loss": -11.441471099853516, "global_step": 250374, "epoch": 1490} {"train_loss": -11.78498649597168, "global_step": 250375, "epoch": 1490} {"train_loss": -11.59547233581543, "global_step": 250376, "epoch": 1490} {"train_loss": -11.85815715789795, "global_step": 250377, "epoch": 1490} {"train_loss": -11.826355934143066, "global_step": 250378, "epoch": 1490} {"train_loss": -11.879981994628906, "global_step": 250379, "epoch": 1490} {"train_loss": -11.336799621582031, "global_step": 250380, "epoch": 1490} {"train_loss": -11.592375755310059, "global_step": 250381, "epoch": 1490} {"train_loss": -11.693256378173828, "global_step": 250382, "epoch": 1490} {"train_loss": -11.773956298828125, "global_step": 250383, "epoch": 1490} {"train_loss": -11.444961547851562, "global_step": 250384, "epoch": 1490} {"train_loss": -11.821287155151367, "global_step": 250385, "epoch": 1490} {"train_loss": -11.652290344238281, "global_step": 250386, "epoch": 1490} {"train_loss": -11.630921363830566, "global_step": 250387, "epoch": 1490} {"train_loss": -11.69882583618164, "global_step": 250388, "epoch": 1490} {"train_loss": -11.492708206176758, "global_step": 250389, "epoch": 1490} {"train_loss": -12.031146049499512, "global_step": 250390, "epoch": 1490} {"train_loss": -11.734132766723633, "global_step": 250391, "epoch": 1490} {"train_loss": -11.859545707702637, "global_step": 250392, "epoch": 1490} {"train_loss": -11.683343887329102, "global_step": 250393, "epoch": 1490} {"train_loss": -11.60350227355957, "global_step": 250394, "epoch": 1490} {"train_loss": -11.82611083984375, "global_step": 250395, "epoch": 1490} {"train_loss": -11.907983779907227, "global_step": 250396, "epoch": 1490} {"train_loss": -11.831964492797852, "global_step": 250397, "epoch": 1490} {"train_loss": -12.068310737609863, "global_step": 250398, "epoch": 1490} {"train_loss": -11.669099807739258, "global_step": 250399, "epoch": 1490} {"train_loss": -12.068115234375, "global_step": 250400, "epoch": 1490} {"train_loss": -11.637598991394043, "global_step": 250401, "epoch": 1490} {"train_loss": -11.913400650024414, "global_step": 250402, "epoch": 1490} {"train_loss": -11.619460105895996, "global_step": 250403, "epoch": 1490} {"train_loss": -11.50135326385498, "global_step": 250404, "epoch": 1490} {"train_loss": -11.8667573928833, "global_step": 250405, "epoch": 1490} {"train_loss": -11.601664543151855, "global_step": 250406, "epoch": 1490} {"train_loss": -11.551543235778809, "global_step": 250407, "epoch": 1490} {"train_loss": -12.102851867675781, "global_step": 250408, "epoch": 1490} {"train_loss": -11.574664115905762, "global_step": 250409, "epoch": 1490} {"train_loss": -12.01667308807373, "global_step": 250410, "epoch": 1490} {"train_loss": -11.254690170288086, "global_step": 250411, "epoch": 1490} {"train_loss": -11.907608985900879, "global_step": 250412, "epoch": 1490} {"train_loss": -11.4478759765625, "global_step": 250413, "epoch": 1490} {"train_loss": -11.684000968933105, "global_step": 250414, "epoch": 1490} {"train_loss": -11.481172561645508, "global_step": 250415, "epoch": 1490} {"train_loss": -11.70440673828125, "global_step": 250416, "epoch": 1490} {"train_loss": -11.418103218078613, "global_step": 250417, "epoch": 1490} {"train_loss": -11.662888526916504, "global_step": 250418, "epoch": 1490} {"train_loss": -11.651630401611328, "global_step": 250419, "epoch": 1490} {"train_loss": -11.90283203125, "global_step": 250420, "epoch": 1490} {"train_loss": -11.83565616607666, "global_step": 250421, "epoch": 1490} {"train_loss": -11.996540069580078, "global_step": 250422, "epoch": 1490} {"train_loss": -12.06266975402832, "global_step": 250423, "epoch": 1490} {"train_loss": -11.566420555114746, "global_step": 250424, "epoch": 1490} {"train_loss": -11.67718505859375, "global_step": 250425, "epoch": 1490} {"train_loss": -11.8684663772583, "global_step": 250426, "epoch": 1490} {"train_loss": -11.618680000305176, "global_step": 250427, "epoch": 1490} {"train_loss": -11.781563758850098, "global_step": 250428, "epoch": 1490} {"train_loss": -11.93282413482666, "global_step": 250429, "epoch": 1490} {"train_loss": -12.01218032836914, "global_step": 250430, "epoch": 1490} {"train_loss": -11.904754638671875, "global_step": 250431, "epoch": 1490} {"train_loss": -11.866966247558594, "global_step": 250432, "epoch": 1490} {"train_loss": -11.80318832397461, "global_step": 250433, "epoch": 1490} {"train_loss": -11.765192031860352, "global_step": 250434, "epoch": 1490} {"train_loss": -11.819635391235352, "global_step": 250435, "epoch": 1490} {"train_loss": -11.737066268920898, "global_step": 250436, "epoch": 1490} {"train_loss": -11.50412368774414, "global_step": 250437, "epoch": 1490} {"train_loss": -11.56949234008789, "global_step": 250438, "epoch": 1490} {"train_loss": -11.463152885437012, "global_step": 250439, "epoch": 1490} {"train_loss": -11.883724212646484, "global_step": 250440, "epoch": 1490} {"train_loss": -11.402313232421875, "global_step": 250441, "epoch": 1490} {"train_loss": -11.54904842376709, "global_step": 250442, "epoch": 1490} {"train_loss": -11.942181587219238, "global_step": 250443, "epoch": 1490} {"train_loss": -11.558820724487305, "global_step": 250444, "epoch": 1490} {"train_loss": -11.942912101745605, "global_step": 250445, "epoch": 1490} {"train_loss": -11.342633247375488, "global_step": 250446, "epoch": 1490} {"train_loss": -11.926873207092285, "global_step": 250447, "epoch": 1490} {"train_loss": -11.825018882751465, "global_step": 250448, "epoch": 1490} {"train_loss": -11.959012985229492, "global_step": 250449, "epoch": 1490} {"train_loss": -11.11772632598877, "global_step": 250450, "epoch": 1490} {"train_loss": -11.421687126159668, "global_step": 250451, "epoch": 1490} {"train_loss": -11.22774887084961, "global_step": 250452, "epoch": 1490} {"train_loss": -11.98000717163086, "global_step": 250453, "epoch": 1490} {"train_loss": -11.096769332885742, "global_step": 250454, "epoch": 1490} {"train_loss": -11.894302368164062, "global_step": 250455, "epoch": 1490} {"train_loss": -11.684776306152344, "global_step": 250456, "epoch": 1490} {"train_loss": -11.192880630493164, "global_step": 250457, "epoch": 1490} {"train_loss": -11.331854820251465, "global_step": 250458, "epoch": 1490} {"train_loss": -11.396677017211914, "global_step": 250459, "epoch": 1490} {"train_loss": -11.441469192504883, "global_step": 250460, "epoch": 1490} {"train_loss": -11.069185256958008, "global_step": 250461, "epoch": 1490} {"train_loss": -11.473138809204102, "global_step": 250462, "epoch": 1490} {"train_loss": -10.952147483825684, "global_step": 250463, "epoch": 1490} {"train_loss": -11.532219886779785, "global_step": 250464, "epoch": 1490} {"train_loss": -11.251087188720703, "global_step": 250465, "epoch": 1490} {"train_loss": -11.854557037353516, "global_step": 250466, "epoch": 1490} {"train_loss": -11.351608276367188, "global_step": 250467, "epoch": 1490} {"train_loss": -11.723626136779785, "global_step": 250468, "epoch": 1490} {"train_loss": -11.221091270446777, "global_step": 250469, "epoch": 1490} {"train_loss": -11.373760223388672, "global_step": 250470, "epoch": 1490} {"train_loss": -11.201253890991211, "global_step": 250471, "epoch": 1490} {"train_loss": -11.429328918457031, "global_step": 250472, "epoch": 1490} {"train_loss": -11.009971618652344, "global_step": 250473, "epoch": 1490} {"train_loss": -11.211677551269531, "global_step": 250474, "epoch": 1490} {"train_loss": -11.340051651000977, "global_step": 250475, "epoch": 1490} {"train_loss": -10.043006896972656, "global_step": 250476, "epoch": 1490} {"train_loss": -11.195291519165039, "global_step": 250477, "epoch": 1490} {"train_loss": -10.30562973022461, "global_step": 250478, "epoch": 1490} {"train_loss": -10.678415298461914, "global_step": 250479, "epoch": 1490} {"train_loss": -11.210575103759766, "global_step": 250480, "epoch": 1490} {"train_loss": -11.235794067382812, "global_step": 250481, "epoch": 1490} {"train_loss": -10.783356666564941, "global_step": 250482, "epoch": 1490} {"train_loss": -11.289584159851074, "global_step": 250483, "epoch": 1490} {"train_loss": -11.365129470825195, "global_step": 250484, "epoch": 1490} {"train_loss": -11.586868286132812, "global_step": 250485, "epoch": 1490} {"train_loss": -11.609567642211914, "global_step": 250486, "epoch": 1490} {"train_loss": -11.462728103001913, "global_step": 250487, "epoch": 1490, "val_loss": 269800.875, "train_action_mse_error": 0.7739385366439819} {"train_loss": -11.539993286132812, "global_step": 250488, "epoch": 1491} {"train_loss": -10.72596549987793, "global_step": 250489, "epoch": 1491} {"train_loss": -11.610532760620117, "global_step": 250490, "epoch": 1491} {"train_loss": -11.77984619140625, "global_step": 250491, "epoch": 1491} {"train_loss": -10.998037338256836, "global_step": 250492, "epoch": 1491} {"train_loss": -11.761564254760742, "global_step": 250493, "epoch": 1491} {"train_loss": -11.131816864013672, "global_step": 250494, "epoch": 1491} {"train_loss": -11.489388465881348, "global_step": 250495, "epoch": 1491} {"train_loss": -11.672621726989746, "global_step": 250496, "epoch": 1491} {"train_loss": -11.107500076293945, "global_step": 250497, "epoch": 1491} {"train_loss": -11.856249809265137, "global_step": 250498, "epoch": 1491} {"train_loss": -11.36910629272461, "global_step": 250499, "epoch": 1491} {"train_loss": -11.808642387390137, "global_step": 250500, "epoch": 1491} {"train_loss": -11.714122772216797, "global_step": 250501, "epoch": 1491} {"train_loss": -11.432001113891602, "global_step": 250502, "epoch": 1491} {"train_loss": -11.799062728881836, "global_step": 250503, "epoch": 1491} {"train_loss": -11.699895858764648, "global_step": 250504, "epoch": 1491} {"train_loss": -11.909265518188477, "global_step": 250505, "epoch": 1491} {"train_loss": -11.754349708557129, "global_step": 250506, "epoch": 1491} {"train_loss": -11.915359497070312, "global_step": 250507, "epoch": 1491} {"train_loss": -12.119474411010742, "global_step": 250508, "epoch": 1491} {"train_loss": -11.59150505065918, "global_step": 250509, "epoch": 1491} {"train_loss": -11.891499519348145, "global_step": 250510, "epoch": 1491} {"train_loss": -11.715639114379883, "global_step": 250511, "epoch": 1491} {"train_loss": -11.83390998840332, "global_step": 250512, "epoch": 1491} {"train_loss": -12.108339309692383, "global_step": 250513, "epoch": 1491} {"train_loss": -12.05461311340332, "global_step": 250514, "epoch": 1491} {"train_loss": -11.66993522644043, "global_step": 250515, "epoch": 1491} {"train_loss": -12.064990997314453, "global_step": 250516, "epoch": 1491} {"train_loss": -11.626382827758789, "global_step": 250517, "epoch": 1491} {"train_loss": -11.913846969604492, "global_step": 250518, "epoch": 1491} {"train_loss": -11.804359436035156, "global_step": 250519, "epoch": 1491} {"train_loss": -11.667428970336914, "global_step": 250520, "epoch": 1491} {"train_loss": -11.786115646362305, "global_step": 250521, "epoch": 1491} {"train_loss": -11.849832534790039, "global_step": 250522, "epoch": 1491} {"train_loss": -12.009116172790527, "global_step": 250523, "epoch": 1491} {"train_loss": -11.8447904586792, "global_step": 250524, "epoch": 1491} {"train_loss": -12.221141815185547, "global_step": 250525, "epoch": 1491} {"train_loss": -11.928606033325195, "global_step": 250526, "epoch": 1491} {"train_loss": -11.762627601623535, "global_step": 250527, "epoch": 1491} {"train_loss": -11.645380020141602, "global_step": 250528, "epoch": 1491} {"train_loss": -11.976832389831543, "global_step": 250529, "epoch": 1491} {"train_loss": -11.874985694885254, "global_step": 250530, "epoch": 1491} {"train_loss": -11.85800552368164, "global_step": 250531, "epoch": 1491} {"train_loss": -12.009590148925781, "global_step": 250532, "epoch": 1491} {"train_loss": -12.00088882446289, "global_step": 250533, "epoch": 1491} {"train_loss": -12.192551612854004, "global_step": 250534, "epoch": 1491} {"train_loss": -11.832136154174805, "global_step": 250535, "epoch": 1491} {"train_loss": -11.847887992858887, "global_step": 250536, "epoch": 1491} {"train_loss": -11.930625915527344, "global_step": 250537, "epoch": 1491} {"train_loss": -11.674928665161133, "global_step": 250538, "epoch": 1491} {"train_loss": -11.942955017089844, "global_step": 250539, "epoch": 1491} {"train_loss": -11.895960807800293, "global_step": 250540, "epoch": 1491} {"train_loss": -11.72214412689209, "global_step": 250541, "epoch": 1491} {"train_loss": -11.52806282043457, "global_step": 250542, "epoch": 1491} {"train_loss": -12.320049285888672, "global_step": 250543, "epoch": 1491} {"train_loss": -11.874106407165527, "global_step": 250544, "epoch": 1491} {"train_loss": -11.05103874206543, "global_step": 250545, "epoch": 1491} {"train_loss": -11.997495651245117, "global_step": 250546, "epoch": 1491} {"train_loss": -11.590970993041992, "global_step": 250547, "epoch": 1491} {"train_loss": -11.583391189575195, "global_step": 250548, "epoch": 1491} {"train_loss": -11.288802146911621, "global_step": 250549, "epoch": 1491} {"train_loss": -11.966602325439453, "global_step": 250550, "epoch": 1491} {"train_loss": -11.32636833190918, "global_step": 250551, "epoch": 1491} {"train_loss": -11.244462966918945, "global_step": 250552, "epoch": 1491} {"train_loss": -10.785995483398438, "global_step": 250553, "epoch": 1491} {"train_loss": -11.960168838500977, "global_step": 250554, "epoch": 1491} {"train_loss": -11.792530059814453, "global_step": 250555, "epoch": 1491} {"train_loss": -11.52560806274414, "global_step": 250556, "epoch": 1491} {"train_loss": -11.981269836425781, "global_step": 250557, "epoch": 1491} {"train_loss": -11.408402442932129, "global_step": 250558, "epoch": 1491} {"train_loss": -11.39454460144043, "global_step": 250559, "epoch": 1491} {"train_loss": -11.832411766052246, "global_step": 250560, "epoch": 1491} {"train_loss": -11.762849807739258, "global_step": 250561, "epoch": 1491} {"train_loss": -11.457901954650879, "global_step": 250562, "epoch": 1491} {"train_loss": -11.619396209716797, "global_step": 250563, "epoch": 1491} {"train_loss": -11.203910827636719, "global_step": 250564, "epoch": 1491} {"train_loss": -11.891885757446289, "global_step": 250565, "epoch": 1491} {"train_loss": -11.755102157592773, "global_step": 250566, "epoch": 1491} {"train_loss": -11.559819221496582, "global_step": 250567, "epoch": 1491} {"train_loss": -11.294370651245117, "global_step": 250568, "epoch": 1491} {"train_loss": -11.661767959594727, "global_step": 250569, "epoch": 1491} {"train_loss": -11.47533130645752, "global_step": 250570, "epoch": 1491} {"train_loss": -11.945972442626953, "global_step": 250571, "epoch": 1491} {"train_loss": -11.650360107421875, "global_step": 250572, "epoch": 1491} {"train_loss": -11.683528900146484, "global_step": 250573, "epoch": 1491} {"train_loss": -11.914966583251953, "global_step": 250574, "epoch": 1491} {"train_loss": -11.849287033081055, "global_step": 250575, "epoch": 1491} {"train_loss": -11.974100112915039, "global_step": 250576, "epoch": 1491} {"train_loss": -11.676130294799805, "global_step": 250577, "epoch": 1491} {"train_loss": -12.121515274047852, "global_step": 250578, "epoch": 1491} {"train_loss": -11.844306945800781, "global_step": 250579, "epoch": 1491} {"train_loss": -11.733736038208008, "global_step": 250580, "epoch": 1491} {"train_loss": -11.85763931274414, "global_step": 250581, "epoch": 1491} {"train_loss": -11.850165367126465, "global_step": 250582, "epoch": 1491} {"train_loss": -11.978737831115723, "global_step": 250583, "epoch": 1491} {"train_loss": -11.8453369140625, "global_step": 250584, "epoch": 1491} {"train_loss": -11.188597679138184, "global_step": 250585, "epoch": 1491} {"train_loss": -11.256280899047852, "global_step": 250586, "epoch": 1491} {"train_loss": -11.95563793182373, "global_step": 250587, "epoch": 1491} {"train_loss": -11.306903839111328, "global_step": 250588, "epoch": 1491} {"train_loss": -11.865156173706055, "global_step": 250589, "epoch": 1491} {"train_loss": -11.538726806640625, "global_step": 250590, "epoch": 1491} {"train_loss": -11.402584075927734, "global_step": 250591, "epoch": 1491} {"train_loss": -11.662361145019531, "global_step": 250592, "epoch": 1491} {"train_loss": -11.804817199707031, "global_step": 250593, "epoch": 1491} {"train_loss": -10.987518310546875, "global_step": 250594, "epoch": 1491} {"train_loss": -12.020028114318848, "global_step": 250595, "epoch": 1491} {"train_loss": -10.928964614868164, "global_step": 250596, "epoch": 1491} {"train_loss": -10.755029678344727, "global_step": 250597, "epoch": 1491} {"train_loss": -11.786239624023438, "global_step": 250598, "epoch": 1491} {"train_loss": -11.152780532836914, "global_step": 250599, "epoch": 1491} {"train_loss": -11.493169784545898, "global_step": 250600, "epoch": 1491} {"train_loss": -11.294084548950195, "global_step": 250601, "epoch": 1491} {"train_loss": -11.310909271240234, "global_step": 250602, "epoch": 1491} {"train_loss": -11.495086669921875, "global_step": 250603, "epoch": 1491} {"train_loss": -10.8702392578125, "global_step": 250604, "epoch": 1491} {"train_loss": -11.882028579711914, "global_step": 250605, "epoch": 1491} {"train_loss": -11.287694931030273, "global_step": 250606, "epoch": 1491} {"train_loss": -11.735268592834473, "global_step": 250607, "epoch": 1491} {"train_loss": -11.533417701721191, "global_step": 250608, "epoch": 1491} {"train_loss": -11.611091613769531, "global_step": 250609, "epoch": 1491} {"train_loss": -11.10988998413086, "global_step": 250610, "epoch": 1491} {"train_loss": -11.886825561523438, "global_step": 250611, "epoch": 1491} {"train_loss": -11.500619888305664, "global_step": 250612, "epoch": 1491} {"train_loss": -11.506505012512207, "global_step": 250613, "epoch": 1491} {"train_loss": -10.945899963378906, "global_step": 250614, "epoch": 1491} {"train_loss": -11.727981567382812, "global_step": 250615, "epoch": 1491} {"train_loss": -11.379257202148438, "global_step": 250616, "epoch": 1491} {"train_loss": -11.72167682647705, "global_step": 250617, "epoch": 1491} {"train_loss": -11.503701210021973, "global_step": 250618, "epoch": 1491} {"train_loss": -11.640050888061523, "global_step": 250619, "epoch": 1491} {"train_loss": -11.31247329711914, "global_step": 250620, "epoch": 1491} {"train_loss": -10.728466033935547, "global_step": 250621, "epoch": 1491} {"train_loss": -11.5687837600708, "global_step": 250622, "epoch": 1491} {"train_loss": -10.378263473510742, "global_step": 250623, "epoch": 1491} {"train_loss": -11.014923095703125, "global_step": 250624, "epoch": 1491} {"train_loss": -11.516700744628906, "global_step": 250625, "epoch": 1491} {"train_loss": -10.528454780578613, "global_step": 250626, "epoch": 1491} {"train_loss": -12.020671844482422, "global_step": 250627, "epoch": 1491} {"train_loss": -10.198156356811523, "global_step": 250628, "epoch": 1491} {"train_loss": -10.872562408447266, "global_step": 250629, "epoch": 1491} {"train_loss": -11.02093505859375, "global_step": 250630, "epoch": 1491} {"train_loss": -10.33862590789795, "global_step": 250631, "epoch": 1491} {"train_loss": -11.563352584838867, "global_step": 250632, "epoch": 1491} {"train_loss": -9.741111755371094, "global_step": 250633, "epoch": 1491} {"train_loss": -11.24761962890625, "global_step": 250634, "epoch": 1491} {"train_loss": -10.949918746948242, "global_step": 250635, "epoch": 1491} {"train_loss": -10.873237609863281, "global_step": 250636, "epoch": 1491} {"train_loss": -11.218586921691895, "global_step": 250637, "epoch": 1491} {"train_loss": -10.598803520202637, "global_step": 250638, "epoch": 1491} {"train_loss": -11.335623741149902, "global_step": 250639, "epoch": 1491} {"train_loss": -11.20080280303955, "global_step": 250640, "epoch": 1491} {"train_loss": -10.972221374511719, "global_step": 250641, "epoch": 1491} {"train_loss": -11.55486011505127, "global_step": 250642, "epoch": 1491} {"train_loss": -11.285421371459961, "global_step": 250643, "epoch": 1491} {"train_loss": -11.207511901855469, "global_step": 250644, "epoch": 1491} {"train_loss": -11.430168151855469, "global_step": 250645, "epoch": 1491} {"train_loss": -11.618291854858398, "global_step": 250646, "epoch": 1491} {"train_loss": -11.121535301208496, "global_step": 250647, "epoch": 1491} {"train_loss": -11.501110076904297, "global_step": 250648, "epoch": 1491} {"train_loss": -11.32330322265625, "global_step": 250649, "epoch": 1491} {"train_loss": -11.813461303710938, "global_step": 250650, "epoch": 1491} {"train_loss": -11.374217987060547, "global_step": 250651, "epoch": 1491} {"train_loss": -11.770587921142578, "global_step": 250652, "epoch": 1491} {"train_loss": -11.458961486816406, "global_step": 250653, "epoch": 1491} {"train_loss": -11.625476837158203, "global_step": 250654, "epoch": 1491} {"train_loss": -11.547660078321185, "global_step": 250655, "epoch": 1491, "val_loss": 268920.21875} {"train_loss": -11.80615234375, "global_step": 250656, "epoch": 1492} {"train_loss": -11.549428939819336, "global_step": 250657, "epoch": 1492} {"train_loss": -11.747480392456055, "global_step": 250658, "epoch": 1492} {"train_loss": -11.581987380981445, "global_step": 250659, "epoch": 1492} {"train_loss": -11.557758331298828, "global_step": 250660, "epoch": 1492} {"train_loss": -11.593779563903809, "global_step": 250661, "epoch": 1492} {"train_loss": -11.39175796508789, "global_step": 250662, "epoch": 1492} {"train_loss": -11.735013008117676, "global_step": 250663, "epoch": 1492} {"train_loss": -11.100872039794922, "global_step": 250664, "epoch": 1492} {"train_loss": -11.463298797607422, "global_step": 250665, "epoch": 1492} {"train_loss": -10.865131378173828, "global_step": 250666, "epoch": 1492} {"train_loss": -11.991938591003418, "global_step": 250667, "epoch": 1492} {"train_loss": -10.633161544799805, "global_step": 250668, "epoch": 1492} {"train_loss": -11.469610214233398, "global_step": 250669, "epoch": 1492} {"train_loss": -10.990614891052246, "global_step": 250670, "epoch": 1492} {"train_loss": -11.272153854370117, "global_step": 250671, "epoch": 1492} {"train_loss": -11.472992897033691, "global_step": 250672, "epoch": 1492} {"train_loss": -11.25622272491455, "global_step": 250673, "epoch": 1492} {"train_loss": -11.715991020202637, "global_step": 250674, "epoch": 1492} {"train_loss": -11.168654441833496, "global_step": 250675, "epoch": 1492} {"train_loss": -11.761459350585938, "global_step": 250676, "epoch": 1492} {"train_loss": -11.21646499633789, "global_step": 250677, "epoch": 1492} {"train_loss": -11.702305793762207, "global_step": 250678, "epoch": 1492} {"train_loss": -11.42445182800293, "global_step": 250679, "epoch": 1492} {"train_loss": -12.015742301940918, "global_step": 250680, "epoch": 1492} {"train_loss": -11.68260383605957, "global_step": 250681, "epoch": 1492} {"train_loss": -11.82278823852539, "global_step": 250682, "epoch": 1492} {"train_loss": -11.783988952636719, "global_step": 250683, "epoch": 1492} {"train_loss": -11.85091781616211, "global_step": 250684, "epoch": 1492} {"train_loss": -11.918550491333008, "global_step": 250685, "epoch": 1492} {"train_loss": -11.911749839782715, "global_step": 250686, "epoch": 1492} {"train_loss": -11.922262191772461, "global_step": 250687, "epoch": 1492} {"train_loss": -12.015613555908203, "global_step": 250688, "epoch": 1492} {"train_loss": -12.11192512512207, "global_step": 250689, "epoch": 1492} {"train_loss": -11.975336074829102, "global_step": 250690, "epoch": 1492} {"train_loss": -12.046358108520508, "global_step": 250691, "epoch": 1492} {"train_loss": -12.02467155456543, "global_step": 250692, "epoch": 1492} {"train_loss": -11.957304000854492, "global_step": 250693, "epoch": 1492} {"train_loss": -11.909756660461426, "global_step": 250694, "epoch": 1492} {"train_loss": -11.965219497680664, "global_step": 250695, "epoch": 1492} {"train_loss": -11.91122817993164, "global_step": 250696, "epoch": 1492} {"train_loss": -12.018926620483398, "global_step": 250697, "epoch": 1492} {"train_loss": -12.231136322021484, "global_step": 250698, "epoch": 1492} {"train_loss": -12.094094276428223, "global_step": 250699, "epoch": 1492} {"train_loss": -11.937051773071289, "global_step": 250700, "epoch": 1492} {"train_loss": -11.944319725036621, "global_step": 250701, "epoch": 1492} {"train_loss": -12.207859992980957, "global_step": 250702, "epoch": 1492} {"train_loss": -12.121026039123535, "global_step": 250703, "epoch": 1492} {"train_loss": -11.953207015991211, "global_step": 250704, "epoch": 1492} {"train_loss": -12.104157447814941, "global_step": 250705, "epoch": 1492} {"train_loss": -11.991064071655273, "global_step": 250706, "epoch": 1492} {"train_loss": -12.003851890563965, "global_step": 250707, "epoch": 1492} {"train_loss": -12.116575241088867, "global_step": 250708, "epoch": 1492} {"train_loss": -11.973684310913086, "global_step": 250709, "epoch": 1492} {"train_loss": -12.146783828735352, "global_step": 250710, "epoch": 1492} {"train_loss": -12.092815399169922, "global_step": 250711, "epoch": 1492} {"train_loss": -12.067771911621094, "global_step": 250712, "epoch": 1492} {"train_loss": -11.883743286132812, "global_step": 250713, "epoch": 1492} {"train_loss": -12.08513355255127, "global_step": 250714, "epoch": 1492} {"train_loss": -11.910280227661133, "global_step": 250715, "epoch": 1492} {"train_loss": -12.004104614257812, "global_step": 250716, "epoch": 1492} {"train_loss": -12.075980186462402, "global_step": 250717, "epoch": 1492} {"train_loss": -11.833440780639648, "global_step": 250718, "epoch": 1492} {"train_loss": -11.606806755065918, "global_step": 250719, "epoch": 1492} {"train_loss": -11.937372207641602, "global_step": 250720, "epoch": 1492} {"train_loss": -11.913484573364258, "global_step": 250721, "epoch": 1492} {"train_loss": -12.244873046875, "global_step": 250722, "epoch": 1492} {"train_loss": -12.033562660217285, "global_step": 250723, "epoch": 1492} {"train_loss": -11.954585075378418, "global_step": 250724, "epoch": 1492} {"train_loss": -12.069576263427734, "global_step": 250725, "epoch": 1492} {"train_loss": -11.771812438964844, "global_step": 250726, "epoch": 1492} {"train_loss": -11.50088882446289, "global_step": 250727, "epoch": 1492} {"train_loss": -11.660009384155273, "global_step": 250728, "epoch": 1492} {"train_loss": -11.926511764526367, "global_step": 250729, "epoch": 1492} {"train_loss": -11.193805694580078, "global_step": 250730, "epoch": 1492} {"train_loss": -11.632181167602539, "global_step": 250731, "epoch": 1492} {"train_loss": -11.367340087890625, "global_step": 250732, "epoch": 1492} {"train_loss": -11.054153442382812, "global_step": 250733, "epoch": 1492} {"train_loss": -11.584467887878418, "global_step": 250734, "epoch": 1492} {"train_loss": -10.458929061889648, "global_step": 250735, "epoch": 1492} {"train_loss": -9.68790054321289, "global_step": 250736, "epoch": 1492} {"train_loss": -11.0900297164917, "global_step": 250737, "epoch": 1492} {"train_loss": -10.557306289672852, "global_step": 250738, "epoch": 1492} {"train_loss": -8.947227478027344, "global_step": 250739, "epoch": 1492} {"train_loss": -10.812871932983398, "global_step": 250740, "epoch": 1492} {"train_loss": -10.095281600952148, "global_step": 250741, "epoch": 1492} {"train_loss": -10.109514236450195, "global_step": 250742, "epoch": 1492} {"train_loss": -11.33134651184082, "global_step": 250743, "epoch": 1492} {"train_loss": -11.054947853088379, "global_step": 250744, "epoch": 1492} {"train_loss": -11.535658836364746, "global_step": 250745, "epoch": 1492} {"train_loss": -11.225753784179688, "global_step": 250746, "epoch": 1492} {"train_loss": -11.518011093139648, "global_step": 250747, "epoch": 1492} {"train_loss": -11.61630630493164, "global_step": 250748, "epoch": 1492} {"train_loss": -11.418169021606445, "global_step": 250749, "epoch": 1492} {"train_loss": -11.554306030273438, "global_step": 250750, "epoch": 1492} {"train_loss": -11.648391723632812, "global_step": 250751, "epoch": 1492} {"train_loss": -11.484131813049316, "global_step": 250752, "epoch": 1492} {"train_loss": -11.190689086914062, "global_step": 250753, "epoch": 1492} {"train_loss": -11.589925765991211, "global_step": 250754, "epoch": 1492} {"train_loss": -11.131824493408203, "global_step": 250755, "epoch": 1492} {"train_loss": -11.756404876708984, "global_step": 250756, "epoch": 1492} {"train_loss": -11.237188339233398, "global_step": 250757, "epoch": 1492} {"train_loss": -11.562945365905762, "global_step": 250758, "epoch": 1492} {"train_loss": -11.289726257324219, "global_step": 250759, "epoch": 1492} {"train_loss": -11.392990112304688, "global_step": 250760, "epoch": 1492} {"train_loss": -10.857104301452637, "global_step": 250761, "epoch": 1492} {"train_loss": -11.115503311157227, "global_step": 250762, "epoch": 1492} {"train_loss": -11.034709930419922, "global_step": 250763, "epoch": 1492} {"train_loss": -10.954365730285645, "global_step": 250764, "epoch": 1492} {"train_loss": -11.801373481750488, "global_step": 250765, "epoch": 1492} {"train_loss": -10.935284614562988, "global_step": 250766, "epoch": 1492} {"train_loss": -11.557305335998535, "global_step": 250767, "epoch": 1492} {"train_loss": -10.546679496765137, "global_step": 250768, "epoch": 1492} {"train_loss": -11.34077262878418, "global_step": 250769, "epoch": 1492} {"train_loss": -11.556415557861328, "global_step": 250770, "epoch": 1492} {"train_loss": -11.290589332580566, "global_step": 250771, "epoch": 1492} {"train_loss": -11.795010566711426, "global_step": 250772, "epoch": 1492} {"train_loss": -11.300800323486328, "global_step": 250773, "epoch": 1492} {"train_loss": -11.33969497680664, "global_step": 250774, "epoch": 1492} {"train_loss": -11.160236358642578, "global_step": 250775, "epoch": 1492} {"train_loss": -11.066906929016113, "global_step": 250776, "epoch": 1492} {"train_loss": -11.227289199829102, "global_step": 250777, "epoch": 1492} {"train_loss": -10.925514221191406, "global_step": 250778, "epoch": 1492} {"train_loss": -11.549219131469727, "global_step": 250779, "epoch": 1492} {"train_loss": -11.312570571899414, "global_step": 250780, "epoch": 1492} {"train_loss": -11.585384368896484, "global_step": 250781, "epoch": 1492} {"train_loss": -11.108627319335938, "global_step": 250782, "epoch": 1492} {"train_loss": -11.455981254577637, "global_step": 250783, "epoch": 1492} {"train_loss": -10.732894897460938, "global_step": 250784, "epoch": 1492} {"train_loss": -11.88150405883789, "global_step": 250785, "epoch": 1492} {"train_loss": -11.073091506958008, "global_step": 250786, "epoch": 1492} {"train_loss": -11.69387435913086, "global_step": 250787, "epoch": 1492} {"train_loss": -11.136099815368652, "global_step": 250788, "epoch": 1492} {"train_loss": -11.685192108154297, "global_step": 250789, "epoch": 1492} {"train_loss": -11.444997787475586, "global_step": 250790, "epoch": 1492} {"train_loss": -11.585617065429688, "global_step": 250791, "epoch": 1492} {"train_loss": -11.590097427368164, "global_step": 250792, "epoch": 1492} {"train_loss": -11.620674133300781, "global_step": 250793, "epoch": 1492} {"train_loss": -11.696701049804688, "global_step": 250794, "epoch": 1492} {"train_loss": -11.72607135772705, "global_step": 250795, "epoch": 1492} {"train_loss": -11.855648040771484, "global_step": 250796, "epoch": 1492} {"train_loss": -11.624205589294434, "global_step": 250797, "epoch": 1492} {"train_loss": -11.825445175170898, "global_step": 250798, "epoch": 1492} {"train_loss": -11.634586334228516, "global_step": 250799, "epoch": 1492} {"train_loss": -11.74569320678711, "global_step": 250800, "epoch": 1492} {"train_loss": -11.748479843139648, "global_step": 250801, "epoch": 1492} {"train_loss": -11.96922492980957, "global_step": 250802, "epoch": 1492} {"train_loss": -11.732571601867676, "global_step": 250803, "epoch": 1492} {"train_loss": -11.869291305541992, "global_step": 250804, "epoch": 1492} {"train_loss": -11.845903396606445, "global_step": 250805, "epoch": 1492} {"train_loss": -12.142067909240723, "global_step": 250806, "epoch": 1492} {"train_loss": -11.754032135009766, "global_step": 250807, "epoch": 1492} {"train_loss": -11.651007652282715, "global_step": 250808, "epoch": 1492} {"train_loss": -11.818901062011719, "global_step": 250809, "epoch": 1492} {"train_loss": -11.811751365661621, "global_step": 250810, "epoch": 1492} {"train_loss": -12.004077911376953, "global_step": 250811, "epoch": 1492} {"train_loss": -11.87548542022705, "global_step": 250812, "epoch": 1492} {"train_loss": -12.294282913208008, "global_step": 250813, "epoch": 1492} {"train_loss": -11.828729629516602, "global_step": 250814, "epoch": 1492} {"train_loss": -11.973668098449707, "global_step": 250815, "epoch": 1492} {"train_loss": -11.863973617553711, "global_step": 250816, "epoch": 1492} {"train_loss": -11.970714569091797, "global_step": 250817, "epoch": 1492} {"train_loss": -12.112967491149902, "global_step": 250818, "epoch": 1492} {"train_loss": -12.055224418640137, "global_step": 250819, "epoch": 1492} {"train_loss": -11.95217514038086, "global_step": 250820, "epoch": 1492} {"train_loss": -12.113091468811035, "global_step": 250821, "epoch": 1492} {"train_loss": -11.995349884033203, "global_step": 250822, "epoch": 1492} {"train_loss": -11.587757394427346, "global_step": 250823, "epoch": 1492, "val_loss": 269291.65625} {"train_loss": -12.052253723144531, "global_step": 250824, "epoch": 1493} {"train_loss": -11.863758087158203, "global_step": 250825, "epoch": 1493} {"train_loss": -11.985095977783203, "global_step": 250826, "epoch": 1493} {"train_loss": -11.760944366455078, "global_step": 250827, "epoch": 1493} {"train_loss": -11.784109115600586, "global_step": 250828, "epoch": 1493} {"train_loss": -11.876120567321777, "global_step": 250829, "epoch": 1493} {"train_loss": -11.696165084838867, "global_step": 250830, "epoch": 1493} {"train_loss": -11.956398963928223, "global_step": 250831, "epoch": 1493} {"train_loss": -11.875953674316406, "global_step": 250832, "epoch": 1493} {"train_loss": -11.712148666381836, "global_step": 250833, "epoch": 1493} {"train_loss": -12.066581726074219, "global_step": 250834, "epoch": 1493} {"train_loss": -12.112968444824219, "global_step": 250835, "epoch": 1493} {"train_loss": -11.808165550231934, "global_step": 250836, "epoch": 1493} {"train_loss": -11.883435249328613, "global_step": 250837, "epoch": 1493} {"train_loss": -12.153887748718262, "global_step": 250838, "epoch": 1493} {"train_loss": -12.079971313476562, "global_step": 250839, "epoch": 1493} {"train_loss": -11.992708206176758, "global_step": 250840, "epoch": 1493} {"train_loss": -12.132381439208984, "global_step": 250841, "epoch": 1493} {"train_loss": -11.786432266235352, "global_step": 250842, "epoch": 1493} {"train_loss": -12.130023956298828, "global_step": 250843, "epoch": 1493} {"train_loss": -12.097583770751953, "global_step": 250844, "epoch": 1493} {"train_loss": -12.092693328857422, "global_step": 250845, "epoch": 1493} {"train_loss": -12.07954216003418, "global_step": 250846, "epoch": 1493} {"train_loss": -12.277396202087402, "global_step": 250847, "epoch": 1493} {"train_loss": -12.028390884399414, "global_step": 250848, "epoch": 1493} {"train_loss": -12.30615520477295, "global_step": 250849, "epoch": 1493} {"train_loss": -11.835304260253906, "global_step": 250850, "epoch": 1493} {"train_loss": -12.098188400268555, "global_step": 250851, "epoch": 1493} {"train_loss": -11.904982566833496, "global_step": 250852, "epoch": 1493} {"train_loss": -12.133528709411621, "global_step": 250853, "epoch": 1493} {"train_loss": -12.147188186645508, "global_step": 250854, "epoch": 1493} {"train_loss": -12.078136444091797, "global_step": 250855, "epoch": 1493} {"train_loss": -12.15976333618164, "global_step": 250856, "epoch": 1493} {"train_loss": -11.944845199584961, "global_step": 250857, "epoch": 1493} {"train_loss": -11.693190574645996, "global_step": 250858, "epoch": 1493} {"train_loss": -11.883484840393066, "global_step": 250859, "epoch": 1493} {"train_loss": -11.774760246276855, "global_step": 250860, "epoch": 1493} {"train_loss": -10.651002883911133, "global_step": 250861, "epoch": 1493} {"train_loss": -11.053278923034668, "global_step": 250862, "epoch": 1493} {"train_loss": -11.689508438110352, "global_step": 250863, "epoch": 1493} {"train_loss": -11.497822761535645, "global_step": 250864, "epoch": 1493} {"train_loss": -10.473419189453125, "global_step": 250865, "epoch": 1493} {"train_loss": -11.953717231750488, "global_step": 250866, "epoch": 1493} {"train_loss": -11.829514503479004, "global_step": 250867, "epoch": 1493} {"train_loss": -10.599957466125488, "global_step": 250868, "epoch": 1493} {"train_loss": -9.738706588745117, "global_step": 250869, "epoch": 1493} {"train_loss": -12.126041412353516, "global_step": 250870, "epoch": 1493} {"train_loss": -9.710281372070312, "global_step": 250871, "epoch": 1493} {"train_loss": -10.864152908325195, "global_step": 250872, "epoch": 1493} {"train_loss": -10.378179550170898, "global_step": 250873, "epoch": 1493} {"train_loss": -9.995073318481445, "global_step": 250874, "epoch": 1493} {"train_loss": -11.351683616638184, "global_step": 250875, "epoch": 1493} {"train_loss": -10.279722213745117, "global_step": 250876, "epoch": 1493} {"train_loss": -10.900627136230469, "global_step": 250877, "epoch": 1493} {"train_loss": -11.212769508361816, "global_step": 250878, "epoch": 1493} {"train_loss": -10.677957534790039, "global_step": 250879, "epoch": 1493} {"train_loss": -10.748485565185547, "global_step": 250880, "epoch": 1493} {"train_loss": -10.313216209411621, "global_step": 250881, "epoch": 1493} {"train_loss": -11.605789184570312, "global_step": 250882, "epoch": 1493} {"train_loss": -10.310869216918945, "global_step": 250883, "epoch": 1493} {"train_loss": -11.306255340576172, "global_step": 250884, "epoch": 1493} {"train_loss": -10.995355606079102, "global_step": 250885, "epoch": 1493} {"train_loss": -11.216758728027344, "global_step": 250886, "epoch": 1493} {"train_loss": -10.979236602783203, "global_step": 250887, "epoch": 1493} {"train_loss": -10.709972381591797, "global_step": 250888, "epoch": 1493} {"train_loss": -11.378813743591309, "global_step": 250889, "epoch": 1493} {"train_loss": -10.847908020019531, "global_step": 250890, "epoch": 1493} {"train_loss": -11.24085807800293, "global_step": 250891, "epoch": 1493} {"train_loss": -11.060441017150879, "global_step": 250892, "epoch": 1493} {"train_loss": -11.584206581115723, "global_step": 250893, "epoch": 1493} {"train_loss": -10.908099174499512, "global_step": 250894, "epoch": 1493} {"train_loss": -11.751952171325684, "global_step": 250895, "epoch": 1493} {"train_loss": -11.077895164489746, "global_step": 250896, "epoch": 1493} {"train_loss": -11.469496726989746, "global_step": 250897, "epoch": 1493} {"train_loss": -11.65546989440918, "global_step": 250898, "epoch": 1493} {"train_loss": -11.6136474609375, "global_step": 250899, "epoch": 1493} {"train_loss": -11.690547943115234, "global_step": 250900, "epoch": 1493} {"train_loss": -11.24176025390625, "global_step": 250901, "epoch": 1493} {"train_loss": -11.609676361083984, "global_step": 250902, "epoch": 1493} {"train_loss": -11.316431999206543, "global_step": 250903, "epoch": 1493} {"train_loss": -11.52954387664795, "global_step": 250904, "epoch": 1493} {"train_loss": -11.707484245300293, "global_step": 250905, "epoch": 1493} {"train_loss": -11.263837814331055, "global_step": 250906, "epoch": 1493} {"train_loss": -11.614568710327148, "global_step": 250907, "epoch": 1493} {"train_loss": -11.13787841796875, "global_step": 250908, "epoch": 1493} {"train_loss": -11.874353408813477, "global_step": 250909, "epoch": 1493} {"train_loss": -11.088077545166016, "global_step": 250910, "epoch": 1493} {"train_loss": -11.818552017211914, "global_step": 250911, "epoch": 1493} {"train_loss": -11.312370300292969, "global_step": 250912, "epoch": 1493} {"train_loss": -11.459330558776855, "global_step": 250913, "epoch": 1493} {"train_loss": -11.604730606079102, "global_step": 250914, "epoch": 1493} {"train_loss": -11.510114669799805, "global_step": 250915, "epoch": 1493} {"train_loss": -11.580388069152832, "global_step": 250916, "epoch": 1493} {"train_loss": -11.685811042785645, "global_step": 250917, "epoch": 1493} {"train_loss": -11.347949981689453, "global_step": 250918, "epoch": 1493} {"train_loss": -11.776185035705566, "global_step": 250919, "epoch": 1493} {"train_loss": -11.482748031616211, "global_step": 250920, "epoch": 1493} {"train_loss": -11.157010078430176, "global_step": 250921, "epoch": 1493} {"train_loss": -11.393507957458496, "global_step": 250922, "epoch": 1493} {"train_loss": -11.27332878112793, "global_step": 250923, "epoch": 1493} {"train_loss": -10.990291595458984, "global_step": 250924, "epoch": 1493} {"train_loss": -11.001020431518555, "global_step": 250925, "epoch": 1493} {"train_loss": -11.36611557006836, "global_step": 250926, "epoch": 1493} {"train_loss": -10.909040451049805, "global_step": 250927, "epoch": 1493} {"train_loss": -11.38680648803711, "global_step": 250928, "epoch": 1493} {"train_loss": -11.250528335571289, "global_step": 250929, "epoch": 1493} {"train_loss": -11.726815223693848, "global_step": 250930, "epoch": 1493} {"train_loss": -11.717575073242188, "global_step": 250931, "epoch": 1493} {"train_loss": -11.653833389282227, "global_step": 250932, "epoch": 1493} {"train_loss": -11.838642120361328, "global_step": 250933, "epoch": 1493} {"train_loss": -11.73562240600586, "global_step": 250934, "epoch": 1493} {"train_loss": -11.590763092041016, "global_step": 250935, "epoch": 1493} {"train_loss": -11.979010581970215, "global_step": 250936, "epoch": 1493} {"train_loss": -11.915717124938965, "global_step": 250937, "epoch": 1493} {"train_loss": -11.876041412353516, "global_step": 250938, "epoch": 1493} {"train_loss": -11.931453704833984, "global_step": 250939, "epoch": 1493} {"train_loss": -11.786260604858398, "global_step": 250940, "epoch": 1493} {"train_loss": -11.801179885864258, "global_step": 250941, "epoch": 1493} {"train_loss": -11.689799308776855, "global_step": 250942, "epoch": 1493} {"train_loss": -11.932394027709961, "global_step": 250943, "epoch": 1493} {"train_loss": -11.917867660522461, "global_step": 250944, "epoch": 1493} {"train_loss": -11.91891098022461, "global_step": 250945, "epoch": 1493} {"train_loss": -11.819936752319336, "global_step": 250946, "epoch": 1493} {"train_loss": -11.694074630737305, "global_step": 250947, "epoch": 1493} {"train_loss": -11.945135116577148, "global_step": 250948, "epoch": 1493} {"train_loss": -11.695768356323242, "global_step": 250949, "epoch": 1493} {"train_loss": -12.09255599975586, "global_step": 250950, "epoch": 1493} {"train_loss": -11.786897659301758, "global_step": 250951, "epoch": 1493} {"train_loss": -11.830060958862305, "global_step": 250952, "epoch": 1493} {"train_loss": -11.991701126098633, "global_step": 250953, "epoch": 1493} {"train_loss": -11.885810852050781, "global_step": 250954, "epoch": 1493} {"train_loss": -11.76992130279541, "global_step": 250955, "epoch": 1493} {"train_loss": -11.680660247802734, "global_step": 250956, "epoch": 1493} {"train_loss": -11.999893188476562, "global_step": 250957, "epoch": 1493} {"train_loss": -11.860128402709961, "global_step": 250958, "epoch": 1493} {"train_loss": -11.974775314331055, "global_step": 250959, "epoch": 1493} {"train_loss": -11.79568862915039, "global_step": 250960, "epoch": 1493} {"train_loss": -12.081026077270508, "global_step": 250961, "epoch": 1493} {"train_loss": -11.9700927734375, "global_step": 250962, "epoch": 1493} {"train_loss": -12.134483337402344, "global_step": 250963, "epoch": 1493} {"train_loss": -11.708681106567383, "global_step": 250964, "epoch": 1493} {"train_loss": -11.933182716369629, "global_step": 250965, "epoch": 1493} {"train_loss": -11.956047058105469, "global_step": 250966, "epoch": 1493} {"train_loss": -11.699010848999023, "global_step": 250967, "epoch": 1493} {"train_loss": -11.544608116149902, "global_step": 250968, "epoch": 1493} {"train_loss": -11.850189208984375, "global_step": 250969, "epoch": 1493} {"train_loss": -11.512918472290039, "global_step": 250970, "epoch": 1493} {"train_loss": -11.520984649658203, "global_step": 250971, "epoch": 1493} {"train_loss": -11.909515380859375, "global_step": 250972, "epoch": 1493} {"train_loss": -11.455291748046875, "global_step": 250973, "epoch": 1493} {"train_loss": -11.795762062072754, "global_step": 250974, "epoch": 1493} {"train_loss": -11.458381652832031, "global_step": 250975, "epoch": 1493} {"train_loss": -10.884817123413086, "global_step": 250976, "epoch": 1493} {"train_loss": -11.46600341796875, "global_step": 250977, "epoch": 1493} {"train_loss": -11.5103759765625, "global_step": 250978, "epoch": 1493} {"train_loss": -11.071735382080078, "global_step": 250979, "epoch": 1493} {"train_loss": -11.48531436920166, "global_step": 250980, "epoch": 1493} {"train_loss": -11.685897827148438, "global_step": 250981, "epoch": 1493} {"train_loss": -11.63640022277832, "global_step": 250982, "epoch": 1493} {"train_loss": -11.73342514038086, "global_step": 250983, "epoch": 1493} {"train_loss": -11.634839057922363, "global_step": 250984, "epoch": 1493} {"train_loss": -11.090080261230469, "global_step": 250985, "epoch": 1493} {"train_loss": -11.426886558532715, "global_step": 250986, "epoch": 1493} {"train_loss": -11.794057846069336, "global_step": 250987, "epoch": 1493} {"train_loss": -11.462594032287598, "global_step": 250988, "epoch": 1493} {"train_loss": -11.629203796386719, "global_step": 250989, "epoch": 1493} {"train_loss": -11.926076889038086, "global_step": 250990, "epoch": 1493} {"train_loss": -11.565295259157816, "global_step": 250991, "epoch": 1493, "val_loss": 268734.71875} {"train_loss": -11.374174118041992, "global_step": 250992, "epoch": 1494} {"train_loss": -11.43435287475586, "global_step": 250993, "epoch": 1494} {"train_loss": -11.783262252807617, "global_step": 250994, "epoch": 1494} {"train_loss": -11.336847305297852, "global_step": 250995, "epoch": 1494} {"train_loss": -11.734518051147461, "global_step": 250996, "epoch": 1494} {"train_loss": -12.063713073730469, "global_step": 250997, "epoch": 1494} {"train_loss": -11.712875366210938, "global_step": 250998, "epoch": 1494} {"train_loss": -12.05172061920166, "global_step": 250999, "epoch": 1494} {"train_loss": -11.255327224731445, "global_step": 251000, "epoch": 1494} {"train_loss": -11.893776893615723, "global_step": 251001, "epoch": 1494} {"train_loss": -11.750843048095703, "global_step": 251002, "epoch": 1494} {"train_loss": -11.629756927490234, "global_step": 251003, "epoch": 1494} {"train_loss": -12.032458305358887, "global_step": 251004, "epoch": 1494} {"train_loss": -11.808393478393555, "global_step": 251005, "epoch": 1494} {"train_loss": -11.736715316772461, "global_step": 251006, "epoch": 1494} {"train_loss": -11.8090181350708, "global_step": 251007, "epoch": 1494} {"train_loss": -11.715104103088379, "global_step": 251008, "epoch": 1494} {"train_loss": -11.765298843383789, "global_step": 251009, "epoch": 1494} {"train_loss": -11.83358383178711, "global_step": 251010, "epoch": 1494} {"train_loss": -11.702509880065918, "global_step": 251011, "epoch": 1494} {"train_loss": -11.596111297607422, "global_step": 251012, "epoch": 1494} {"train_loss": -11.90224838256836, "global_step": 251013, "epoch": 1494} {"train_loss": -11.868102073669434, "global_step": 251014, "epoch": 1494} {"train_loss": -11.959968566894531, "global_step": 251015, "epoch": 1494} {"train_loss": -12.01569938659668, "global_step": 251016, "epoch": 1494} {"train_loss": -11.811683654785156, "global_step": 251017, "epoch": 1494} {"train_loss": -11.632118225097656, "global_step": 251018, "epoch": 1494} {"train_loss": -12.109491348266602, "global_step": 251019, "epoch": 1494} {"train_loss": -11.57857894897461, "global_step": 251020, "epoch": 1494} {"train_loss": -11.99531364440918, "global_step": 251021, "epoch": 1494} {"train_loss": -11.82944107055664, "global_step": 251022, "epoch": 1494} {"train_loss": -11.91611099243164, "global_step": 251023, "epoch": 1494} {"train_loss": -11.715740203857422, "global_step": 251024, "epoch": 1494} {"train_loss": -11.923867225646973, "global_step": 251025, "epoch": 1494} {"train_loss": -12.061147689819336, "global_step": 251026, "epoch": 1494} {"train_loss": -11.896734237670898, "global_step": 251027, "epoch": 1494} {"train_loss": -11.942460060119629, "global_step": 251028, "epoch": 1494} {"train_loss": -12.223003387451172, "global_step": 251029, "epoch": 1494} {"train_loss": -12.051254272460938, "global_step": 251030, "epoch": 1494} {"train_loss": -12.268512725830078, "global_step": 251031, "epoch": 1494} {"train_loss": -11.957073211669922, "global_step": 251032, "epoch": 1494} {"train_loss": -12.067132949829102, "global_step": 251033, "epoch": 1494} {"train_loss": -11.943971633911133, "global_step": 251034, "epoch": 1494} {"train_loss": -11.973665237426758, "global_step": 251035, "epoch": 1494} {"train_loss": -12.213911056518555, "global_step": 251036, "epoch": 1494} {"train_loss": -12.117448806762695, "global_step": 251037, "epoch": 1494} {"train_loss": -12.222747802734375, "global_step": 251038, "epoch": 1494} {"train_loss": -12.241691589355469, "global_step": 251039, "epoch": 1494} {"train_loss": -11.9490966796875, "global_step": 251040, "epoch": 1494} {"train_loss": -12.142576217651367, "global_step": 251041, "epoch": 1494} {"train_loss": -12.269327163696289, "global_step": 251042, "epoch": 1494} {"train_loss": -11.888025283813477, "global_step": 251043, "epoch": 1494} {"train_loss": -12.083473205566406, "global_step": 251044, "epoch": 1494} {"train_loss": -12.10411548614502, "global_step": 251045, "epoch": 1494} {"train_loss": -11.92361068725586, "global_step": 251046, "epoch": 1494} {"train_loss": -12.210718154907227, "global_step": 251047, "epoch": 1494} {"train_loss": -11.79035758972168, "global_step": 251048, "epoch": 1494} {"train_loss": -11.620500564575195, "global_step": 251049, "epoch": 1494} {"train_loss": -12.0617036819458, "global_step": 251050, "epoch": 1494} {"train_loss": -12.229963302612305, "global_step": 251051, "epoch": 1494} {"train_loss": -11.890212059020996, "global_step": 251052, "epoch": 1494} {"train_loss": -11.276369094848633, "global_step": 251053, "epoch": 1494} {"train_loss": -11.346384048461914, "global_step": 251054, "epoch": 1494} {"train_loss": -11.947683334350586, "global_step": 251055, "epoch": 1494} {"train_loss": -10.92680835723877, "global_step": 251056, "epoch": 1494} {"train_loss": -11.387683868408203, "global_step": 251057, "epoch": 1494} {"train_loss": -12.071995735168457, "global_step": 251058, "epoch": 1494} {"train_loss": -11.562553405761719, "global_step": 251059, "epoch": 1494} {"train_loss": -11.612438201904297, "global_step": 251060, "epoch": 1494} {"train_loss": -11.771547317504883, "global_step": 251061, "epoch": 1494} {"train_loss": -11.809659957885742, "global_step": 251062, "epoch": 1494} {"train_loss": -11.459527969360352, "global_step": 251063, "epoch": 1494} {"train_loss": -11.438368797302246, "global_step": 251064, "epoch": 1494} {"train_loss": -11.181310653686523, "global_step": 251065, "epoch": 1494} {"train_loss": -10.694364547729492, "global_step": 251066, "epoch": 1494} {"train_loss": -8.67462158203125, "global_step": 251067, "epoch": 1494} {"train_loss": -8.27894115447998, "global_step": 251068, "epoch": 1494} {"train_loss": -9.884255409240723, "global_step": 251069, "epoch": 1494} {"train_loss": -10.033086776733398, "global_step": 251070, "epoch": 1494} {"train_loss": -9.25489616394043, "global_step": 251071, "epoch": 1494} {"train_loss": -9.468063354492188, "global_step": 251072, "epoch": 1494} {"train_loss": -9.7846097946167, "global_step": 251073, "epoch": 1494} {"train_loss": -8.674001693725586, "global_step": 251074, "epoch": 1494} {"train_loss": -10.866233825683594, "global_step": 251075, "epoch": 1494} {"train_loss": -9.334489822387695, "global_step": 251076, "epoch": 1494} {"train_loss": -9.72229290008545, "global_step": 251077, "epoch": 1494} {"train_loss": -10.490514755249023, "global_step": 251078, "epoch": 1494} {"train_loss": -9.362967491149902, "global_step": 251079, "epoch": 1494} {"train_loss": -10.002086639404297, "global_step": 251080, "epoch": 1494} {"train_loss": -10.766376495361328, "global_step": 251081, "epoch": 1494} {"train_loss": -10.933940887451172, "global_step": 251082, "epoch": 1494} {"train_loss": -10.95241928100586, "global_step": 251083, "epoch": 1494} {"train_loss": -11.101110458374023, "global_step": 251084, "epoch": 1494} {"train_loss": -10.619636535644531, "global_step": 251085, "epoch": 1494} {"train_loss": -11.106489181518555, "global_step": 251086, "epoch": 1494} {"train_loss": -11.145959854125977, "global_step": 251087, "epoch": 1494} {"train_loss": -10.599489212036133, "global_step": 251088, "epoch": 1494} {"train_loss": -11.32342529296875, "global_step": 251089, "epoch": 1494} {"train_loss": -10.574661254882812, "global_step": 251090, "epoch": 1494} {"train_loss": -11.300755500793457, "global_step": 251091, "epoch": 1494} {"train_loss": -10.83575439453125, "global_step": 251092, "epoch": 1494} {"train_loss": -11.505393981933594, "global_step": 251093, "epoch": 1494} {"train_loss": -10.939242362976074, "global_step": 251094, "epoch": 1494} {"train_loss": -11.593385696411133, "global_step": 251095, "epoch": 1494} {"train_loss": -11.576287269592285, "global_step": 251096, "epoch": 1494} {"train_loss": -11.499334335327148, "global_step": 251097, "epoch": 1494} {"train_loss": -11.570816040039062, "global_step": 251098, "epoch": 1494} {"train_loss": -11.486760139465332, "global_step": 251099, "epoch": 1494} {"train_loss": -11.681283950805664, "global_step": 251100, "epoch": 1494} {"train_loss": -11.36113452911377, "global_step": 251101, "epoch": 1494} {"train_loss": -11.596121788024902, "global_step": 251102, "epoch": 1494} {"train_loss": -11.66718864440918, "global_step": 251103, "epoch": 1494} {"train_loss": -11.515260696411133, "global_step": 251104, "epoch": 1494} {"train_loss": -11.836065292358398, "global_step": 251105, "epoch": 1494} {"train_loss": -11.347145080566406, "global_step": 251106, "epoch": 1494} {"train_loss": -11.570754051208496, "global_step": 251107, "epoch": 1494} {"train_loss": -11.492916107177734, "global_step": 251108, "epoch": 1494} {"train_loss": -11.133874893188477, "global_step": 251109, "epoch": 1494} {"train_loss": -11.729608535766602, "global_step": 251110, "epoch": 1494} {"train_loss": -11.546354293823242, "global_step": 251111, "epoch": 1494} {"train_loss": -11.571623802185059, "global_step": 251112, "epoch": 1494} {"train_loss": -11.727102279663086, "global_step": 251113, "epoch": 1494} {"train_loss": -11.7449951171875, "global_step": 251114, "epoch": 1494} {"train_loss": -11.965658187866211, "global_step": 251115, "epoch": 1494} {"train_loss": -11.796314239501953, "global_step": 251116, "epoch": 1494} {"train_loss": -11.95615005493164, "global_step": 251117, "epoch": 1494} {"train_loss": -11.754194259643555, "global_step": 251118, "epoch": 1494} {"train_loss": -11.883064270019531, "global_step": 251119, "epoch": 1494} {"train_loss": -11.783151626586914, "global_step": 251120, "epoch": 1494} {"train_loss": -11.932085990905762, "global_step": 251121, "epoch": 1494} {"train_loss": -11.672194480895996, "global_step": 251122, "epoch": 1494} {"train_loss": -11.782337188720703, "global_step": 251123, "epoch": 1494} {"train_loss": -11.9263916015625, "global_step": 251124, "epoch": 1494} {"train_loss": -12.113574028015137, "global_step": 251125, "epoch": 1494} {"train_loss": -11.828060150146484, "global_step": 251126, "epoch": 1494} {"train_loss": -11.915380477905273, "global_step": 251127, "epoch": 1494} {"train_loss": -11.908571243286133, "global_step": 251128, "epoch": 1494} {"train_loss": -11.952035903930664, "global_step": 251129, "epoch": 1494} {"train_loss": -11.824920654296875, "global_step": 251130, "epoch": 1494} {"train_loss": -12.085159301757812, "global_step": 251131, "epoch": 1494} {"train_loss": -12.028963088989258, "global_step": 251132, "epoch": 1494} {"train_loss": -11.929678916931152, "global_step": 251133, "epoch": 1494} {"train_loss": -11.855582237243652, "global_step": 251134, "epoch": 1494} {"train_loss": -11.862157821655273, "global_step": 251135, "epoch": 1494} {"train_loss": -11.847841262817383, "global_step": 251136, "epoch": 1494} {"train_loss": -12.0264892578125, "global_step": 251137, "epoch": 1494} {"train_loss": -12.063458442687988, "global_step": 251138, "epoch": 1494} {"train_loss": -11.938304901123047, "global_step": 251139, "epoch": 1494} {"train_loss": -12.157968521118164, "global_step": 251140, "epoch": 1494} {"train_loss": -11.934735298156738, "global_step": 251141, "epoch": 1494} {"train_loss": -11.983288764953613, "global_step": 251142, "epoch": 1494} {"train_loss": -12.142400741577148, "global_step": 251143, "epoch": 1494} {"train_loss": -12.141761779785156, "global_step": 251144, "epoch": 1494} {"train_loss": -12.038653373718262, "global_step": 251145, "epoch": 1494} {"train_loss": -11.904170989990234, "global_step": 251146, "epoch": 1494} {"train_loss": -11.843132972717285, "global_step": 251147, "epoch": 1494} {"train_loss": -12.273451805114746, "global_step": 251148, "epoch": 1494} {"train_loss": -12.035091400146484, "global_step": 251149, "epoch": 1494} {"train_loss": -12.093321800231934, "global_step": 251150, "epoch": 1494} {"train_loss": -12.04692268371582, "global_step": 251151, "epoch": 1494} {"train_loss": -11.92849063873291, "global_step": 251152, "epoch": 1494} {"train_loss": -11.945899963378906, "global_step": 251153, "epoch": 1494} {"train_loss": -11.921207427978516, "global_step": 251154, "epoch": 1494} {"train_loss": -11.86850357055664, "global_step": 251155, "epoch": 1494} {"train_loss": -12.011441230773926, "global_step": 251156, "epoch": 1494} {"train_loss": -11.91423511505127, "global_step": 251157, "epoch": 1494} {"train_loss": -11.887999534606934, "global_step": 251158, "epoch": 1494} {"train_loss": -11.565086103620983, "global_step": 251159, "epoch": 1494, "val_loss": 270189.90625} {"train_loss": -11.587316513061523, "global_step": 251160, "epoch": 1495} {"train_loss": -11.915834426879883, "global_step": 251161, "epoch": 1495} {"train_loss": -11.625503540039062, "global_step": 251162, "epoch": 1495} {"train_loss": -12.02261734008789, "global_step": 251163, "epoch": 1495} {"train_loss": -12.145699501037598, "global_step": 251164, "epoch": 1495} {"train_loss": -11.860496520996094, "global_step": 251165, "epoch": 1495} {"train_loss": -11.807723999023438, "global_step": 251166, "epoch": 1495} {"train_loss": -11.805135726928711, "global_step": 251167, "epoch": 1495} {"train_loss": -11.498832702636719, "global_step": 251168, "epoch": 1495} {"train_loss": -12.019880294799805, "global_step": 251169, "epoch": 1495} {"train_loss": -11.825153350830078, "global_step": 251170, "epoch": 1495} {"train_loss": -12.304057121276855, "global_step": 251171, "epoch": 1495} {"train_loss": -11.901385307312012, "global_step": 251172, "epoch": 1495} {"train_loss": -12.017507553100586, "global_step": 251173, "epoch": 1495} {"train_loss": -11.946807861328125, "global_step": 251174, "epoch": 1495} {"train_loss": -12.058244705200195, "global_step": 251175, "epoch": 1495} {"train_loss": -11.509573936462402, "global_step": 251176, "epoch": 1495} {"train_loss": -11.173552513122559, "global_step": 251177, "epoch": 1495} {"train_loss": -11.333455085754395, "global_step": 251178, "epoch": 1495} {"train_loss": -11.661271095275879, "global_step": 251179, "epoch": 1495} {"train_loss": -11.808100700378418, "global_step": 251180, "epoch": 1495} {"train_loss": -11.67869758605957, "global_step": 251181, "epoch": 1495} {"train_loss": -11.6975736618042, "global_step": 251182, "epoch": 1495} {"train_loss": -11.520570755004883, "global_step": 251183, "epoch": 1495} {"train_loss": -11.799354553222656, "global_step": 251184, "epoch": 1495} {"train_loss": -11.52503776550293, "global_step": 251185, "epoch": 1495} {"train_loss": -10.608153343200684, "global_step": 251186, "epoch": 1495} {"train_loss": -12.044388771057129, "global_step": 251187, "epoch": 1495} {"train_loss": -11.149333953857422, "global_step": 251188, "epoch": 1495} {"train_loss": -11.516847610473633, "global_step": 251189, "epoch": 1495} {"train_loss": -11.574037551879883, "global_step": 251190, "epoch": 1495} {"train_loss": -12.00245475769043, "global_step": 251191, "epoch": 1495} {"train_loss": -11.019731521606445, "global_step": 251192, "epoch": 1495} {"train_loss": -11.032548904418945, "global_step": 251193, "epoch": 1495} {"train_loss": -11.735790252685547, "global_step": 251194, "epoch": 1495} {"train_loss": -10.998580932617188, "global_step": 251195, "epoch": 1495} {"train_loss": -11.724611282348633, "global_step": 251196, "epoch": 1495} {"train_loss": -11.368474960327148, "global_step": 251197, "epoch": 1495} {"train_loss": -10.272586822509766, "global_step": 251198, "epoch": 1495} {"train_loss": -11.322086334228516, "global_step": 251199, "epoch": 1495} {"train_loss": -11.364459991455078, "global_step": 251200, "epoch": 1495} {"train_loss": -11.605551719665527, "global_step": 251201, "epoch": 1495} {"train_loss": -11.092860221862793, "global_step": 251202, "epoch": 1495} {"train_loss": -10.99771499633789, "global_step": 251203, "epoch": 1495} {"train_loss": -11.555463790893555, "global_step": 251204, "epoch": 1495} {"train_loss": -11.146366119384766, "global_step": 251205, "epoch": 1495} {"train_loss": -9.567748069763184, "global_step": 251206, "epoch": 1495} {"train_loss": -11.359553337097168, "global_step": 251207, "epoch": 1495} {"train_loss": -8.576194763183594, "global_step": 251208, "epoch": 1495} {"train_loss": -9.99683952331543, "global_step": 251209, "epoch": 1495} {"train_loss": -10.226635932922363, "global_step": 251210, "epoch": 1495} {"train_loss": -9.09453010559082, "global_step": 251211, "epoch": 1495} {"train_loss": -10.973201751708984, "global_step": 251212, "epoch": 1495} {"train_loss": -9.927787780761719, "global_step": 251213, "epoch": 1495} {"train_loss": -11.428268432617188, "global_step": 251214, "epoch": 1495} {"train_loss": -10.616601943969727, "global_step": 251215, "epoch": 1495} {"train_loss": -11.42795467376709, "global_step": 251216, "epoch": 1495} {"train_loss": -10.14381217956543, "global_step": 251217, "epoch": 1495} {"train_loss": -11.293853759765625, "global_step": 251218, "epoch": 1495} {"train_loss": -10.803868293762207, "global_step": 251219, "epoch": 1495} {"train_loss": -11.476844787597656, "global_step": 251220, "epoch": 1495} {"train_loss": -10.833234786987305, "global_step": 251221, "epoch": 1495} {"train_loss": -11.35926628112793, "global_step": 251222, "epoch": 1495} {"train_loss": -10.744344711303711, "global_step": 251223, "epoch": 1495} {"train_loss": -11.719902038574219, "global_step": 251224, "epoch": 1495} {"train_loss": -11.051298141479492, "global_step": 251225, "epoch": 1495} {"train_loss": -11.482246398925781, "global_step": 251226, "epoch": 1495} {"train_loss": -11.20263671875, "global_step": 251227, "epoch": 1495} {"train_loss": -11.5748929977417, "global_step": 251228, "epoch": 1495} {"train_loss": -11.269725799560547, "global_step": 251229, "epoch": 1495} {"train_loss": -11.32278823852539, "global_step": 251230, "epoch": 1495} {"train_loss": -11.53024673461914, "global_step": 251231, "epoch": 1495} {"train_loss": -11.379400253295898, "global_step": 251232, "epoch": 1495} {"train_loss": -11.869955062866211, "global_step": 251233, "epoch": 1495} {"train_loss": -11.393610954284668, "global_step": 251234, "epoch": 1495} {"train_loss": -11.736736297607422, "global_step": 251235, "epoch": 1495} {"train_loss": -11.484387397766113, "global_step": 251236, "epoch": 1495} {"train_loss": -11.760781288146973, "global_step": 251237, "epoch": 1495} {"train_loss": -11.639959335327148, "global_step": 251238, "epoch": 1495} {"train_loss": -11.729001998901367, "global_step": 251239, "epoch": 1495} {"train_loss": -11.471771240234375, "global_step": 251240, "epoch": 1495} {"train_loss": -11.58272647857666, "global_step": 251241, "epoch": 1495} {"train_loss": -11.44767951965332, "global_step": 251242, "epoch": 1495} {"train_loss": -11.627973556518555, "global_step": 251243, "epoch": 1495} {"train_loss": -11.603143692016602, "global_step": 251244, "epoch": 1495} {"train_loss": -11.727710723876953, "global_step": 251245, "epoch": 1495} {"train_loss": -11.913778305053711, "global_step": 251246, "epoch": 1495} {"train_loss": -11.888542175292969, "global_step": 251247, "epoch": 1495} {"train_loss": -11.866554260253906, "global_step": 251248, "epoch": 1495} {"train_loss": -11.807110786437988, "global_step": 251249, "epoch": 1495} {"train_loss": -11.888233184814453, "global_step": 251250, "epoch": 1495} {"train_loss": -11.982486724853516, "global_step": 251251, "epoch": 1495} {"train_loss": -11.81591510772705, "global_step": 251252, "epoch": 1495} {"train_loss": -11.691762924194336, "global_step": 251253, "epoch": 1495} {"train_loss": -11.838942527770996, "global_step": 251254, "epoch": 1495} {"train_loss": -11.695234298706055, "global_step": 251255, "epoch": 1495} {"train_loss": -12.074167251586914, "global_step": 251256, "epoch": 1495} {"train_loss": -11.865556716918945, "global_step": 251257, "epoch": 1495} {"train_loss": -11.961857795715332, "global_step": 251258, "epoch": 1495} {"train_loss": -11.750822067260742, "global_step": 251259, "epoch": 1495} {"train_loss": -11.765294075012207, "global_step": 251260, "epoch": 1495} {"train_loss": -11.769969940185547, "global_step": 251261, "epoch": 1495} {"train_loss": -11.988293647766113, "global_step": 251262, "epoch": 1495} {"train_loss": -12.035333633422852, "global_step": 251263, "epoch": 1495} {"train_loss": -12.04071044921875, "global_step": 251264, "epoch": 1495} {"train_loss": -11.67933177947998, "global_step": 251265, "epoch": 1495} {"train_loss": -12.030988693237305, "global_step": 251266, "epoch": 1495} {"train_loss": -11.843929290771484, "global_step": 251267, "epoch": 1495} {"train_loss": -12.227840423583984, "global_step": 251268, "epoch": 1495} {"train_loss": -12.053807258605957, "global_step": 251269, "epoch": 1495} {"train_loss": -12.000750541687012, "global_step": 251270, "epoch": 1495} {"train_loss": -12.070778846740723, "global_step": 251271, "epoch": 1495} {"train_loss": -12.07763671875, "global_step": 251272, "epoch": 1495} {"train_loss": -12.118864059448242, "global_step": 251273, "epoch": 1495} {"train_loss": -11.864727973937988, "global_step": 251274, "epoch": 1495} {"train_loss": -11.91658878326416, "global_step": 251275, "epoch": 1495} {"train_loss": -12.057849884033203, "global_step": 251276, "epoch": 1495} {"train_loss": -12.377904891967773, "global_step": 251277, "epoch": 1495} {"train_loss": -12.026721954345703, "global_step": 251278, "epoch": 1495} {"train_loss": -11.720122337341309, "global_step": 251279, "epoch": 1495} {"train_loss": -12.195582389831543, "global_step": 251280, "epoch": 1495} {"train_loss": -12.02780818939209, "global_step": 251281, "epoch": 1495} {"train_loss": -12.201244354248047, "global_step": 251282, "epoch": 1495} {"train_loss": -12.141645431518555, "global_step": 251283, "epoch": 1495} {"train_loss": -12.139083862304688, "global_step": 251284, "epoch": 1495} {"train_loss": -12.259699821472168, "global_step": 251285, "epoch": 1495} {"train_loss": -12.015679359436035, "global_step": 251286, "epoch": 1495} {"train_loss": -12.096118927001953, "global_step": 251287, "epoch": 1495} {"train_loss": -11.875956535339355, "global_step": 251288, "epoch": 1495} {"train_loss": -12.027093887329102, "global_step": 251289, "epoch": 1495} {"train_loss": -12.077065467834473, "global_step": 251290, "epoch": 1495} {"train_loss": -12.075589179992676, "global_step": 251291, "epoch": 1495} {"train_loss": -11.886878967285156, "global_step": 251292, "epoch": 1495} {"train_loss": -12.171140670776367, "global_step": 251293, "epoch": 1495} {"train_loss": -11.371184349060059, "global_step": 251294, "epoch": 1495} {"train_loss": -11.66969108581543, "global_step": 251295, "epoch": 1495} {"train_loss": -11.745586395263672, "global_step": 251296, "epoch": 1495} {"train_loss": -12.176851272583008, "global_step": 251297, "epoch": 1495} {"train_loss": -12.105819702148438, "global_step": 251298, "epoch": 1495} {"train_loss": -12.340035438537598, "global_step": 251299, "epoch": 1495} {"train_loss": -12.089530944824219, "global_step": 251300, "epoch": 1495} {"train_loss": -12.26373291015625, "global_step": 251301, "epoch": 1495} {"train_loss": -11.67794418334961, "global_step": 251302, "epoch": 1495} {"train_loss": -11.755064964294434, "global_step": 251303, "epoch": 1495} {"train_loss": -11.7325439453125, "global_step": 251304, "epoch": 1495} {"train_loss": -12.135969161987305, "global_step": 251305, "epoch": 1495} {"train_loss": -11.614706993103027, "global_step": 251306, "epoch": 1495} {"train_loss": -9.999702453613281, "global_step": 251307, "epoch": 1495} {"train_loss": -10.390655517578125, "global_step": 251308, "epoch": 1495} {"train_loss": -11.307937622070312, "global_step": 251309, "epoch": 1495} {"train_loss": -11.060148239135742, "global_step": 251310, "epoch": 1495} {"train_loss": -10.944398880004883, "global_step": 251311, "epoch": 1495} {"train_loss": -10.179428100585938, "global_step": 251312, "epoch": 1495} {"train_loss": -11.16684341430664, "global_step": 251313, "epoch": 1495} {"train_loss": -10.626224517822266, "global_step": 251314, "epoch": 1495} {"train_loss": -9.654388427734375, "global_step": 251315, "epoch": 1495} {"train_loss": -11.197612762451172, "global_step": 251316, "epoch": 1495} {"train_loss": -8.907666206359863, "global_step": 251317, "epoch": 1495} {"train_loss": -11.060375213623047, "global_step": 251318, "epoch": 1495} {"train_loss": -8.54147720336914, "global_step": 251319, "epoch": 1495} {"train_loss": -9.428918838500977, "global_step": 251320, "epoch": 1495} {"train_loss": -9.475635528564453, "global_step": 251321, "epoch": 1495} {"train_loss": -10.140998840332031, "global_step": 251322, "epoch": 1495} {"train_loss": -7.975478172302246, "global_step": 251323, "epoch": 1495} {"train_loss": -9.395514488220215, "global_step": 251324, "epoch": 1495} {"train_loss": -9.003654479980469, "global_step": 251325, "epoch": 1495} {"train_loss": -9.233013153076172, "global_step": 251326, "epoch": 1495} {"train_loss": -11.396735378674098, "global_step": 251327, "epoch": 1495, "val_loss": 267011.8125, "train_action_mse_error": 0.9019976854324341} {"train_loss": -9.458446502685547, "global_step": 251328, "epoch": 1496} {"train_loss": -9.701910018920898, "global_step": 251329, "epoch": 1496} {"train_loss": -9.687634468078613, "global_step": 251330, "epoch": 1496} {"train_loss": -10.459174156188965, "global_step": 251331, "epoch": 1496} {"train_loss": -9.934807777404785, "global_step": 251332, "epoch": 1496} {"train_loss": -10.014158248901367, "global_step": 251333, "epoch": 1496} {"train_loss": -10.470351219177246, "global_step": 251334, "epoch": 1496} {"train_loss": -10.330698013305664, "global_step": 251335, "epoch": 1496} {"train_loss": -10.095110893249512, "global_step": 251336, "epoch": 1496} {"train_loss": -11.128985404968262, "global_step": 251337, "epoch": 1496} {"train_loss": -9.612688064575195, "global_step": 251338, "epoch": 1496} {"train_loss": -10.628868103027344, "global_step": 251339, "epoch": 1496} {"train_loss": -11.416608810424805, "global_step": 251340, "epoch": 1496} {"train_loss": -9.53579044342041, "global_step": 251341, "epoch": 1496} {"train_loss": -10.578628540039062, "global_step": 251342, "epoch": 1496} {"train_loss": -10.692596435546875, "global_step": 251343, "epoch": 1496} {"train_loss": -10.437762260437012, "global_step": 251344, "epoch": 1496} {"train_loss": -10.782327651977539, "global_step": 251345, "epoch": 1496} {"train_loss": -11.185510635375977, "global_step": 251346, "epoch": 1496} {"train_loss": -10.734957695007324, "global_step": 251347, "epoch": 1496} {"train_loss": -11.122507095336914, "global_step": 251348, "epoch": 1496} {"train_loss": -11.166720390319824, "global_step": 251349, "epoch": 1496} {"train_loss": -11.058347702026367, "global_step": 251350, "epoch": 1496} {"train_loss": -11.338634490966797, "global_step": 251351, "epoch": 1496} {"train_loss": -11.335552215576172, "global_step": 251352, "epoch": 1496} {"train_loss": -10.96277904510498, "global_step": 251353, "epoch": 1496} {"train_loss": -11.65103530883789, "global_step": 251354, "epoch": 1496} {"train_loss": -11.357163429260254, "global_step": 251355, "epoch": 1496} {"train_loss": -11.294197082519531, "global_step": 251356, "epoch": 1496} {"train_loss": -11.33613395690918, "global_step": 251357, "epoch": 1496} {"train_loss": -11.524374961853027, "global_step": 251358, "epoch": 1496} {"train_loss": -11.254924774169922, "global_step": 251359, "epoch": 1496} {"train_loss": -11.409219741821289, "global_step": 251360, "epoch": 1496} {"train_loss": -11.656730651855469, "global_step": 251361, "epoch": 1496} {"train_loss": -11.161394119262695, "global_step": 251362, "epoch": 1496} {"train_loss": -11.445579528808594, "global_step": 251363, "epoch": 1496} {"train_loss": -11.491827964782715, "global_step": 251364, "epoch": 1496} {"train_loss": -11.268941879272461, "global_step": 251365, "epoch": 1496} {"train_loss": -11.455113410949707, "global_step": 251366, "epoch": 1496} {"train_loss": -11.502238273620605, "global_step": 251367, "epoch": 1496} {"train_loss": -11.349794387817383, "global_step": 251368, "epoch": 1496} {"train_loss": -11.481470108032227, "global_step": 251369, "epoch": 1496} {"train_loss": -11.564212799072266, "global_step": 251370, "epoch": 1496} {"train_loss": -11.29469108581543, "global_step": 251371, "epoch": 1496} {"train_loss": -11.606736183166504, "global_step": 251372, "epoch": 1496} {"train_loss": -11.66722297668457, "global_step": 251373, "epoch": 1496} {"train_loss": -11.556949615478516, "global_step": 251374, "epoch": 1496} {"train_loss": -11.57793140411377, "global_step": 251375, "epoch": 1496} {"train_loss": -11.64500617980957, "global_step": 251376, "epoch": 1496} {"train_loss": -11.718356132507324, "global_step": 251377, "epoch": 1496} {"train_loss": -11.773807525634766, "global_step": 251378, "epoch": 1496} {"train_loss": -11.738082885742188, "global_step": 251379, "epoch": 1496} {"train_loss": -11.703219413757324, "global_step": 251380, "epoch": 1496} {"train_loss": -11.684883117675781, "global_step": 251381, "epoch": 1496} {"train_loss": -11.88248062133789, "global_step": 251382, "epoch": 1496} {"train_loss": -11.755658149719238, "global_step": 251383, "epoch": 1496} {"train_loss": -11.574918746948242, "global_step": 251384, "epoch": 1496} {"train_loss": -11.836166381835938, "global_step": 251385, "epoch": 1496} {"train_loss": -11.685932159423828, "global_step": 251386, "epoch": 1496} {"train_loss": -11.7506685256958, "global_step": 251387, "epoch": 1496} {"train_loss": -11.880695343017578, "global_step": 251388, "epoch": 1496} {"train_loss": -11.731611251831055, "global_step": 251389, "epoch": 1496} {"train_loss": -11.865884780883789, "global_step": 251390, "epoch": 1496} {"train_loss": -11.761555671691895, "global_step": 251391, "epoch": 1496} {"train_loss": -11.840290069580078, "global_step": 251392, "epoch": 1496} {"train_loss": -11.583816528320312, "global_step": 251393, "epoch": 1496} {"train_loss": -11.97165298461914, "global_step": 251394, "epoch": 1496} {"train_loss": -11.673904418945312, "global_step": 251395, "epoch": 1496} {"train_loss": -11.625473976135254, "global_step": 251396, "epoch": 1496} {"train_loss": -11.842154502868652, "global_step": 251397, "epoch": 1496} {"train_loss": -11.99734878540039, "global_step": 251398, "epoch": 1496} {"train_loss": -11.994282722473145, "global_step": 251399, "epoch": 1496} {"train_loss": -11.913605690002441, "global_step": 251400, "epoch": 1496} {"train_loss": -11.968130111694336, "global_step": 251401, "epoch": 1496} {"train_loss": -11.954832077026367, "global_step": 251402, "epoch": 1496} {"train_loss": -12.107398986816406, "global_step": 251403, "epoch": 1496} {"train_loss": -12.017290115356445, "global_step": 251404, "epoch": 1496} {"train_loss": -12.124890327453613, "global_step": 251405, "epoch": 1496} {"train_loss": -12.112126350402832, "global_step": 251406, "epoch": 1496} {"train_loss": -12.136809349060059, "global_step": 251407, "epoch": 1496} {"train_loss": -12.151844024658203, "global_step": 251408, "epoch": 1496} {"train_loss": -12.019323348999023, "global_step": 251409, "epoch": 1496} {"train_loss": -12.182144165039062, "global_step": 251410, "epoch": 1496} {"train_loss": -11.987534523010254, "global_step": 251411, "epoch": 1496} {"train_loss": -12.164205551147461, "global_step": 251412, "epoch": 1496} {"train_loss": -11.816308975219727, "global_step": 251413, "epoch": 1496} {"train_loss": -12.079880714416504, "global_step": 251414, "epoch": 1496} {"train_loss": -12.259576797485352, "global_step": 251415, "epoch": 1496} {"train_loss": -12.003637313842773, "global_step": 251416, "epoch": 1496} {"train_loss": -11.931224822998047, "global_step": 251417, "epoch": 1496} {"train_loss": -12.023988723754883, "global_step": 251418, "epoch": 1496} {"train_loss": -11.924896240234375, "global_step": 251419, "epoch": 1496} {"train_loss": -11.455754280090332, "global_step": 251420, "epoch": 1496} {"train_loss": -11.916097640991211, "global_step": 251421, "epoch": 1496} {"train_loss": -12.035552024841309, "global_step": 251422, "epoch": 1496} {"train_loss": -12.000162124633789, "global_step": 251423, "epoch": 1496} {"train_loss": -12.096967697143555, "global_step": 251424, "epoch": 1496} {"train_loss": -12.081472396850586, "global_step": 251425, "epoch": 1496} {"train_loss": -12.226640701293945, "global_step": 251426, "epoch": 1496} {"train_loss": -12.249834060668945, "global_step": 251427, "epoch": 1496} {"train_loss": -11.95114517211914, "global_step": 251428, "epoch": 1496} {"train_loss": -12.034797668457031, "global_step": 251429, "epoch": 1496} {"train_loss": -12.047314643859863, "global_step": 251430, "epoch": 1496} {"train_loss": -12.133024215698242, "global_step": 251431, "epoch": 1496} {"train_loss": -12.223780632019043, "global_step": 251432, "epoch": 1496} {"train_loss": -12.123388290405273, "global_step": 251433, "epoch": 1496} {"train_loss": -12.22242546081543, "global_step": 251434, "epoch": 1496} {"train_loss": -12.112167358398438, "global_step": 251435, "epoch": 1496} {"train_loss": -11.983746528625488, "global_step": 251436, "epoch": 1496} {"train_loss": -12.177288055419922, "global_step": 251437, "epoch": 1496} {"train_loss": -12.294068336486816, "global_step": 251438, "epoch": 1496} {"train_loss": -12.297508239746094, "global_step": 251439, "epoch": 1496} {"train_loss": -11.846044540405273, "global_step": 251440, "epoch": 1496} {"train_loss": -11.40528392791748, "global_step": 251441, "epoch": 1496} {"train_loss": -11.763782501220703, "global_step": 251442, "epoch": 1496} {"train_loss": -12.145706176757812, "global_step": 251443, "epoch": 1496} {"train_loss": -12.086423873901367, "global_step": 251444, "epoch": 1496} {"train_loss": -11.918655395507812, "global_step": 251445, "epoch": 1496} {"train_loss": -11.597675323486328, "global_step": 251446, "epoch": 1496} {"train_loss": -11.566553115844727, "global_step": 251447, "epoch": 1496} {"train_loss": -11.679290771484375, "global_step": 251448, "epoch": 1496} {"train_loss": -11.471415519714355, "global_step": 251449, "epoch": 1496} {"train_loss": -11.725906372070312, "global_step": 251450, "epoch": 1496} {"train_loss": -10.892908096313477, "global_step": 251451, "epoch": 1496} {"train_loss": -11.973281860351562, "global_step": 251452, "epoch": 1496} {"train_loss": -11.206822395324707, "global_step": 251453, "epoch": 1496} {"train_loss": -11.342073440551758, "global_step": 251454, "epoch": 1496} {"train_loss": -10.701400756835938, "global_step": 251455, "epoch": 1496} {"train_loss": -11.46616268157959, "global_step": 251456, "epoch": 1496} {"train_loss": -10.805814743041992, "global_step": 251457, "epoch": 1496} {"train_loss": -11.898205757141113, "global_step": 251458, "epoch": 1496} {"train_loss": -10.920572280883789, "global_step": 251459, "epoch": 1496} {"train_loss": -12.042308807373047, "global_step": 251460, "epoch": 1496} {"train_loss": -11.123838424682617, "global_step": 251461, "epoch": 1496} {"train_loss": -11.929645538330078, "global_step": 251462, "epoch": 1496} {"train_loss": -11.197072982788086, "global_step": 251463, "epoch": 1496} {"train_loss": -11.533416748046875, "global_step": 251464, "epoch": 1496} {"train_loss": -11.28699016571045, "global_step": 251465, "epoch": 1496} {"train_loss": -12.022035598754883, "global_step": 251466, "epoch": 1496} {"train_loss": -11.227348327636719, "global_step": 251467, "epoch": 1496} {"train_loss": -11.233367919921875, "global_step": 251468, "epoch": 1496} {"train_loss": -10.68508529663086, "global_step": 251469, "epoch": 1496} {"train_loss": -10.386435508728027, "global_step": 251470, "epoch": 1496} {"train_loss": -11.545171737670898, "global_step": 251471, "epoch": 1496} {"train_loss": -10.664703369140625, "global_step": 251472, "epoch": 1496} {"train_loss": -11.531424522399902, "global_step": 251473, "epoch": 1496} {"train_loss": -11.220151901245117, "global_step": 251474, "epoch": 1496} {"train_loss": -11.171603202819824, "global_step": 251475, "epoch": 1496} {"train_loss": -11.093021392822266, "global_step": 251476, "epoch": 1496} {"train_loss": -11.291261672973633, "global_step": 251477, "epoch": 1496} {"train_loss": -10.933296203613281, "global_step": 251478, "epoch": 1496} {"train_loss": -11.47617244720459, "global_step": 251479, "epoch": 1496} {"train_loss": -11.240251541137695, "global_step": 251480, "epoch": 1496} {"train_loss": -11.657870292663574, "global_step": 251481, "epoch": 1496} {"train_loss": -11.408979415893555, "global_step": 251482, "epoch": 1496} {"train_loss": -11.76469898223877, "global_step": 251483, "epoch": 1496} {"train_loss": -11.171581268310547, "global_step": 251484, "epoch": 1496} {"train_loss": -11.590683937072754, "global_step": 251485, "epoch": 1496} {"train_loss": -11.561759948730469, "global_step": 251486, "epoch": 1496} {"train_loss": -11.81393051147461, "global_step": 251487, "epoch": 1496} {"train_loss": -11.661205291748047, "global_step": 251488, "epoch": 1496} {"train_loss": -11.571081161499023, "global_step": 251489, "epoch": 1496} {"train_loss": -11.516973495483398, "global_step": 251490, "epoch": 1496} {"train_loss": -12.139659881591797, "global_step": 251491, "epoch": 1496} {"train_loss": -11.679973602294922, "global_step": 251492, "epoch": 1496} {"train_loss": -11.956769943237305, "global_step": 251493, "epoch": 1496} {"train_loss": -11.961801528930664, "global_step": 251494, "epoch": 1496} {"train_loss": -11.508595903714498, "global_step": 251495, "epoch": 1496, "val_loss": 269878.03125} {"train_loss": -11.913688659667969, "global_step": 251496, "epoch": 1497} {"train_loss": -11.884696960449219, "global_step": 251497, "epoch": 1497} {"train_loss": -11.600492477416992, "global_step": 251498, "epoch": 1497} {"train_loss": -11.676278114318848, "global_step": 251499, "epoch": 1497} {"train_loss": -11.616567611694336, "global_step": 251500, "epoch": 1497} {"train_loss": -11.938243865966797, "global_step": 251501, "epoch": 1497} {"train_loss": -11.617656707763672, "global_step": 251502, "epoch": 1497} {"train_loss": -11.31777286529541, "global_step": 251503, "epoch": 1497} {"train_loss": -11.601320266723633, "global_step": 251504, "epoch": 1497} {"train_loss": -11.439815521240234, "global_step": 251505, "epoch": 1497} {"train_loss": -11.554990768432617, "global_step": 251506, "epoch": 1497} {"train_loss": -11.748592376708984, "global_step": 251507, "epoch": 1497} {"train_loss": -11.377117156982422, "global_step": 251508, "epoch": 1497} {"train_loss": -11.564870834350586, "global_step": 251509, "epoch": 1497} {"train_loss": -10.795931816101074, "global_step": 251510, "epoch": 1497} {"train_loss": -11.552244186401367, "global_step": 251511, "epoch": 1497} {"train_loss": -11.378884315490723, "global_step": 251512, "epoch": 1497} {"train_loss": -11.312870979309082, "global_step": 251513, "epoch": 1497} {"train_loss": -11.613882064819336, "global_step": 251514, "epoch": 1497} {"train_loss": -10.723538398742676, "global_step": 251515, "epoch": 1497} {"train_loss": -11.263595581054688, "global_step": 251516, "epoch": 1497} {"train_loss": -11.235801696777344, "global_step": 251517, "epoch": 1497} {"train_loss": -10.961953163146973, "global_step": 251518, "epoch": 1497} {"train_loss": -10.918527603149414, "global_step": 251519, "epoch": 1497} {"train_loss": -11.25356674194336, "global_step": 251520, "epoch": 1497} {"train_loss": -11.147258758544922, "global_step": 251521, "epoch": 1497} {"train_loss": -10.748388290405273, "global_step": 251522, "epoch": 1497} {"train_loss": -10.599864959716797, "global_step": 251523, "epoch": 1497} {"train_loss": -10.647741317749023, "global_step": 251524, "epoch": 1497} {"train_loss": -10.930817604064941, "global_step": 251525, "epoch": 1497} {"train_loss": -9.468900680541992, "global_step": 251526, "epoch": 1497} {"train_loss": -10.845189094543457, "global_step": 251527, "epoch": 1497} {"train_loss": -9.573739051818848, "global_step": 251528, "epoch": 1497} {"train_loss": -10.9490966796875, "global_step": 251529, "epoch": 1497} {"train_loss": -10.213005065917969, "global_step": 251530, "epoch": 1497} {"train_loss": -10.314361572265625, "global_step": 251531, "epoch": 1497} {"train_loss": -10.698275566101074, "global_step": 251532, "epoch": 1497} {"train_loss": -10.998437881469727, "global_step": 251533, "epoch": 1497} {"train_loss": -10.678910255432129, "global_step": 251534, "epoch": 1497} {"train_loss": -11.293121337890625, "global_step": 251535, "epoch": 1497} {"train_loss": -10.77360725402832, "global_step": 251536, "epoch": 1497} {"train_loss": -10.957235336303711, "global_step": 251537, "epoch": 1497} {"train_loss": -11.04256820678711, "global_step": 251538, "epoch": 1497} {"train_loss": -11.004650115966797, "global_step": 251539, "epoch": 1497} {"train_loss": -11.17613410949707, "global_step": 251540, "epoch": 1497} {"train_loss": -11.057609558105469, "global_step": 251541, "epoch": 1497} {"train_loss": -10.640426635742188, "global_step": 251542, "epoch": 1497} {"train_loss": -11.043832778930664, "global_step": 251543, "epoch": 1497} {"train_loss": -10.885612487792969, "global_step": 251544, "epoch": 1497} {"train_loss": -11.126562118530273, "global_step": 251545, "epoch": 1497} {"train_loss": -11.203619956970215, "global_step": 251546, "epoch": 1497} {"train_loss": -11.294745445251465, "global_step": 251547, "epoch": 1497} {"train_loss": -10.991192817687988, "global_step": 251548, "epoch": 1497} {"train_loss": -11.327247619628906, "global_step": 251549, "epoch": 1497} {"train_loss": -11.379352569580078, "global_step": 251550, "epoch": 1497} {"train_loss": -11.101115226745605, "global_step": 251551, "epoch": 1497} {"train_loss": -11.465137481689453, "global_step": 251552, "epoch": 1497} {"train_loss": -11.463706970214844, "global_step": 251553, "epoch": 1497} {"train_loss": -11.181480407714844, "global_step": 251554, "epoch": 1497} {"train_loss": -11.593303680419922, "global_step": 251555, "epoch": 1497} {"train_loss": -11.387961387634277, "global_step": 251556, "epoch": 1497} {"train_loss": -11.512977600097656, "global_step": 251557, "epoch": 1497} {"train_loss": -11.523577690124512, "global_step": 251558, "epoch": 1497} {"train_loss": -11.704452514648438, "global_step": 251559, "epoch": 1497} {"train_loss": -11.583843231201172, "global_step": 251560, "epoch": 1497} {"train_loss": -11.9010009765625, "global_step": 251561, "epoch": 1497} {"train_loss": -11.888566017150879, "global_step": 251562, "epoch": 1497} {"train_loss": -11.695877075195312, "global_step": 251563, "epoch": 1497} {"train_loss": -11.742406845092773, "global_step": 251564, "epoch": 1497} {"train_loss": -11.753793716430664, "global_step": 251565, "epoch": 1497} {"train_loss": -11.729913711547852, "global_step": 251566, "epoch": 1497} {"train_loss": -12.02394962310791, "global_step": 251567, "epoch": 1497} {"train_loss": -11.680063247680664, "global_step": 251568, "epoch": 1497} {"train_loss": -11.799844741821289, "global_step": 251569, "epoch": 1497} {"train_loss": -12.002238273620605, "global_step": 251570, "epoch": 1497} {"train_loss": -11.695919036865234, "global_step": 251571, "epoch": 1497} {"train_loss": -11.829444885253906, "global_step": 251572, "epoch": 1497} {"train_loss": -11.93892765045166, "global_step": 251573, "epoch": 1497} {"train_loss": -11.829230308532715, "global_step": 251574, "epoch": 1497} {"train_loss": -11.875465393066406, "global_step": 251575, "epoch": 1497} {"train_loss": -11.926153182983398, "global_step": 251576, "epoch": 1497} {"train_loss": -12.001935005187988, "global_step": 251577, "epoch": 1497} {"train_loss": -12.033252716064453, "global_step": 251578, "epoch": 1497} {"train_loss": -12.011866569519043, "global_step": 251579, "epoch": 1497} {"train_loss": -11.966655731201172, "global_step": 251580, "epoch": 1497} {"train_loss": -12.067861557006836, "global_step": 251581, "epoch": 1497} {"train_loss": -11.864959716796875, "global_step": 251582, "epoch": 1497} {"train_loss": -12.071792602539062, "global_step": 251583, "epoch": 1497} {"train_loss": -12.195002555847168, "global_step": 251584, "epoch": 1497} {"train_loss": -12.129277229309082, "global_step": 251585, "epoch": 1497} {"train_loss": -12.073440551757812, "global_step": 251586, "epoch": 1497} {"train_loss": -12.128618240356445, "global_step": 251587, "epoch": 1497} {"train_loss": -12.032276153564453, "global_step": 251588, "epoch": 1497} {"train_loss": -12.071495056152344, "global_step": 251589, "epoch": 1497} {"train_loss": -12.032320022583008, "global_step": 251590, "epoch": 1497} {"train_loss": -12.192800521850586, "global_step": 251591, "epoch": 1497} {"train_loss": -12.091361999511719, "global_step": 251592, "epoch": 1497} {"train_loss": -12.300765991210938, "global_step": 251593, "epoch": 1497} {"train_loss": -12.008070945739746, "global_step": 251594, "epoch": 1497} {"train_loss": -12.131771087646484, "global_step": 251595, "epoch": 1497} {"train_loss": -12.057143211364746, "global_step": 251596, "epoch": 1497} {"train_loss": -11.901382446289062, "global_step": 251597, "epoch": 1497} {"train_loss": -12.182266235351562, "global_step": 251598, "epoch": 1497} {"train_loss": -12.241000175476074, "global_step": 251599, "epoch": 1497} {"train_loss": -12.285820007324219, "global_step": 251600, "epoch": 1497} {"train_loss": -12.261919975280762, "global_step": 251601, "epoch": 1497} {"train_loss": -12.299544334411621, "global_step": 251602, "epoch": 1497} {"train_loss": -12.175920486450195, "global_step": 251603, "epoch": 1497} {"train_loss": -12.256038665771484, "global_step": 251604, "epoch": 1497} {"train_loss": -12.24791145324707, "global_step": 251605, "epoch": 1497} {"train_loss": -12.022249221801758, "global_step": 251606, "epoch": 1497} {"train_loss": -12.187376022338867, "global_step": 251607, "epoch": 1497} {"train_loss": -12.02022933959961, "global_step": 251608, "epoch": 1497} {"train_loss": -11.961111068725586, "global_step": 251609, "epoch": 1497} {"train_loss": -11.387516975402832, "global_step": 251610, "epoch": 1497} {"train_loss": -12.247964859008789, "global_step": 251611, "epoch": 1497} {"train_loss": -11.791078567504883, "global_step": 251612, "epoch": 1497} {"train_loss": -11.57174301147461, "global_step": 251613, "epoch": 1497} {"train_loss": -11.508983612060547, "global_step": 251614, "epoch": 1497} {"train_loss": -12.044677734375, "global_step": 251615, "epoch": 1497} {"train_loss": -10.619959831237793, "global_step": 251616, "epoch": 1497} {"train_loss": -9.082627296447754, "global_step": 251617, "epoch": 1497} {"train_loss": -8.902657508850098, "global_step": 251618, "epoch": 1497} {"train_loss": -11.059831619262695, "global_step": 251619, "epoch": 1497} {"train_loss": -10.056196212768555, "global_step": 251620, "epoch": 1497} {"train_loss": -11.257930755615234, "global_step": 251621, "epoch": 1497} {"train_loss": -11.112951278686523, "global_step": 251622, "epoch": 1497} {"train_loss": -10.847758293151855, "global_step": 251623, "epoch": 1497} {"train_loss": -11.703113555908203, "global_step": 251624, "epoch": 1497} {"train_loss": -11.192696571350098, "global_step": 251625, "epoch": 1497} {"train_loss": -11.504072189331055, "global_step": 251626, "epoch": 1497} {"train_loss": -11.585248947143555, "global_step": 251627, "epoch": 1497} {"train_loss": -11.789684295654297, "global_step": 251628, "epoch": 1497} {"train_loss": -11.148053169250488, "global_step": 251629, "epoch": 1497} {"train_loss": -11.841955184936523, "global_step": 251630, "epoch": 1497} {"train_loss": -11.601990699768066, "global_step": 251631, "epoch": 1497} {"train_loss": -11.986289978027344, "global_step": 251632, "epoch": 1497} {"train_loss": -11.519469261169434, "global_step": 251633, "epoch": 1497} {"train_loss": -11.575776100158691, "global_step": 251634, "epoch": 1497} {"train_loss": -11.990374565124512, "global_step": 251635, "epoch": 1497} {"train_loss": -11.683477401733398, "global_step": 251636, "epoch": 1497} {"train_loss": -11.449764251708984, "global_step": 251637, "epoch": 1497} {"train_loss": -10.401750564575195, "global_step": 251638, "epoch": 1497} {"train_loss": -10.43945026397705, "global_step": 251639, "epoch": 1497} {"train_loss": -11.49517822265625, "global_step": 251640, "epoch": 1497} {"train_loss": -11.098197937011719, "global_step": 251641, "epoch": 1497} {"train_loss": -10.59841251373291, "global_step": 251642, "epoch": 1497} {"train_loss": -11.671794891357422, "global_step": 251643, "epoch": 1497} {"train_loss": -10.862472534179688, "global_step": 251644, "epoch": 1497} {"train_loss": -11.666749954223633, "global_step": 251645, "epoch": 1497} {"train_loss": -11.097631454467773, "global_step": 251646, "epoch": 1497} {"train_loss": -11.620445251464844, "global_step": 251647, "epoch": 1497} {"train_loss": -11.513067245483398, "global_step": 251648, "epoch": 1497} {"train_loss": -11.784890174865723, "global_step": 251649, "epoch": 1497} {"train_loss": -11.719093322753906, "global_step": 251650, "epoch": 1497} {"train_loss": -11.697534561157227, "global_step": 251651, "epoch": 1497} {"train_loss": -11.77762222290039, "global_step": 251652, "epoch": 1497} {"train_loss": -11.626626968383789, "global_step": 251653, "epoch": 1497} {"train_loss": -11.680027961730957, "global_step": 251654, "epoch": 1497} {"train_loss": -11.953001022338867, "global_step": 251655, "epoch": 1497} {"train_loss": -11.878557205200195, "global_step": 251656, "epoch": 1497} {"train_loss": -11.985984802246094, "global_step": 251657, "epoch": 1497} {"train_loss": -11.746990203857422, "global_step": 251658, "epoch": 1497} {"train_loss": -11.594858169555664, "global_step": 251659, "epoch": 1497} {"train_loss": -11.817168235778809, "global_step": 251660, "epoch": 1497} {"train_loss": -12.082218170166016, "global_step": 251661, "epoch": 1497} {"train_loss": -11.94807243347168, "global_step": 251662, "epoch": 1497} {"train_loss": -11.48786419346219, "global_step": 251663, "epoch": 1497, "val_loss": 267230.0625} {"train_loss": -11.823701858520508, "global_step": 251664, "epoch": 1498} {"train_loss": -11.804502487182617, "global_step": 251665, "epoch": 1498} {"train_loss": -11.876007080078125, "global_step": 251666, "epoch": 1498} {"train_loss": -11.800086975097656, "global_step": 251667, "epoch": 1498} {"train_loss": -12.026390075683594, "global_step": 251668, "epoch": 1498} {"train_loss": -11.773822784423828, "global_step": 251669, "epoch": 1498} {"train_loss": -12.009613990783691, "global_step": 251670, "epoch": 1498} {"train_loss": -11.6958589553833, "global_step": 251671, "epoch": 1498} {"train_loss": -11.926736831665039, "global_step": 251672, "epoch": 1498} {"train_loss": -12.009821891784668, "global_step": 251673, "epoch": 1498} {"train_loss": -11.596956253051758, "global_step": 251674, "epoch": 1498} {"train_loss": -11.970880508422852, "global_step": 251675, "epoch": 1498} {"train_loss": -11.694864273071289, "global_step": 251676, "epoch": 1498} {"train_loss": -12.07334041595459, "global_step": 251677, "epoch": 1498} {"train_loss": -11.83144760131836, "global_step": 251678, "epoch": 1498} {"train_loss": -12.034505844116211, "global_step": 251679, "epoch": 1498} {"train_loss": -11.83065414428711, "global_step": 251680, "epoch": 1498} {"train_loss": -11.845993995666504, "global_step": 251681, "epoch": 1498} {"train_loss": -11.784592628479004, "global_step": 251682, "epoch": 1498} {"train_loss": -12.078757286071777, "global_step": 251683, "epoch": 1498} {"train_loss": -11.930562019348145, "global_step": 251684, "epoch": 1498} {"train_loss": -11.848431587219238, "global_step": 251685, "epoch": 1498} {"train_loss": -11.654772758483887, "global_step": 251686, "epoch": 1498} {"train_loss": -11.646132469177246, "global_step": 251687, "epoch": 1498} {"train_loss": -11.319656372070312, "global_step": 251688, "epoch": 1498} {"train_loss": -11.471372604370117, "global_step": 251689, "epoch": 1498} {"train_loss": -10.838021278381348, "global_step": 251690, "epoch": 1498} {"train_loss": -11.576044082641602, "global_step": 251691, "epoch": 1498} {"train_loss": -10.64501667022705, "global_step": 251692, "epoch": 1498} {"train_loss": -10.869085311889648, "global_step": 251693, "epoch": 1498} {"train_loss": -11.524524688720703, "global_step": 251694, "epoch": 1498} {"train_loss": -10.575563430786133, "global_step": 251695, "epoch": 1498} {"train_loss": -11.857561111450195, "global_step": 251696, "epoch": 1498} {"train_loss": -10.750151634216309, "global_step": 251697, "epoch": 1498} {"train_loss": -11.871298789978027, "global_step": 251698, "epoch": 1498} {"train_loss": -11.088384628295898, "global_step": 251699, "epoch": 1498} {"train_loss": -11.672706604003906, "global_step": 251700, "epoch": 1498} {"train_loss": -11.521501541137695, "global_step": 251701, "epoch": 1498} {"train_loss": -11.487154006958008, "global_step": 251702, "epoch": 1498} {"train_loss": -11.869232177734375, "global_step": 251703, "epoch": 1498} {"train_loss": -11.78036117553711, "global_step": 251704, "epoch": 1498} {"train_loss": -11.47352409362793, "global_step": 251705, "epoch": 1498} {"train_loss": -11.928622245788574, "global_step": 251706, "epoch": 1498} {"train_loss": -11.485623359680176, "global_step": 251707, "epoch": 1498} {"train_loss": -10.737921714782715, "global_step": 251708, "epoch": 1498} {"train_loss": -11.864568710327148, "global_step": 251709, "epoch": 1498} {"train_loss": -11.510046005249023, "global_step": 251710, "epoch": 1498} {"train_loss": -11.461442947387695, "global_step": 251711, "epoch": 1498} {"train_loss": -11.849104881286621, "global_step": 251712, "epoch": 1498} {"train_loss": -11.725137710571289, "global_step": 251713, "epoch": 1498} {"train_loss": -11.549558639526367, "global_step": 251714, "epoch": 1498} {"train_loss": -12.055660247802734, "global_step": 251715, "epoch": 1498} {"train_loss": -11.927658081054688, "global_step": 251716, "epoch": 1498} {"train_loss": -11.741568565368652, "global_step": 251717, "epoch": 1498} {"train_loss": -11.951309204101562, "global_step": 251718, "epoch": 1498} {"train_loss": -12.00861644744873, "global_step": 251719, "epoch": 1498} {"train_loss": -11.797557830810547, "global_step": 251720, "epoch": 1498} {"train_loss": -11.67393684387207, "global_step": 251721, "epoch": 1498} {"train_loss": -11.389649391174316, "global_step": 251722, "epoch": 1498} {"train_loss": -11.53464126586914, "global_step": 251723, "epoch": 1498} {"train_loss": -11.561800956726074, "global_step": 251724, "epoch": 1498} {"train_loss": -11.856924057006836, "global_step": 251725, "epoch": 1498} {"train_loss": -11.81387710571289, "global_step": 251726, "epoch": 1498} {"train_loss": -11.79759693145752, "global_step": 251727, "epoch": 1498} {"train_loss": -11.545158386230469, "global_step": 251728, "epoch": 1498} {"train_loss": -12.246379852294922, "global_step": 251729, "epoch": 1498} {"train_loss": -11.857946395874023, "global_step": 251730, "epoch": 1498} {"train_loss": -11.634851455688477, "global_step": 251731, "epoch": 1498} {"train_loss": -11.986838340759277, "global_step": 251732, "epoch": 1498} {"train_loss": -11.819562911987305, "global_step": 251733, "epoch": 1498} {"train_loss": -12.005090713500977, "global_step": 251734, "epoch": 1498} {"train_loss": -12.000829696655273, "global_step": 251735, "epoch": 1498} {"train_loss": -11.982841491699219, "global_step": 251736, "epoch": 1498} {"train_loss": -11.744818687438965, "global_step": 251737, "epoch": 1498} {"train_loss": -11.823647499084473, "global_step": 251738, "epoch": 1498} {"train_loss": -12.142143249511719, "global_step": 251739, "epoch": 1498} {"train_loss": -11.95151138305664, "global_step": 251740, "epoch": 1498} {"train_loss": -11.787694931030273, "global_step": 251741, "epoch": 1498} {"train_loss": -11.658214569091797, "global_step": 251742, "epoch": 1498} {"train_loss": -11.422990798950195, "global_step": 251743, "epoch": 1498} {"train_loss": -11.633354187011719, "global_step": 251744, "epoch": 1498} {"train_loss": -11.430635452270508, "global_step": 251745, "epoch": 1498} {"train_loss": -11.693349838256836, "global_step": 251746, "epoch": 1498} {"train_loss": -10.511672019958496, "global_step": 251747, "epoch": 1498} {"train_loss": -11.25393295288086, "global_step": 251748, "epoch": 1498} {"train_loss": -11.849238395690918, "global_step": 251749, "epoch": 1498} {"train_loss": -11.796149253845215, "global_step": 251750, "epoch": 1498} {"train_loss": -11.546627044677734, "global_step": 251751, "epoch": 1498} {"train_loss": -11.640213012695312, "global_step": 251752, "epoch": 1498} {"train_loss": -11.241937637329102, "global_step": 251753, "epoch": 1498} {"train_loss": -11.573701858520508, "global_step": 251754, "epoch": 1498} {"train_loss": -11.252182006835938, "global_step": 251755, "epoch": 1498} {"train_loss": -10.003091812133789, "global_step": 251756, "epoch": 1498} {"train_loss": -11.951580047607422, "global_step": 251757, "epoch": 1498} {"train_loss": -11.208150863647461, "global_step": 251758, "epoch": 1498} {"train_loss": -11.308077812194824, "global_step": 251759, "epoch": 1498} {"train_loss": -12.22884750366211, "global_step": 251760, "epoch": 1498} {"train_loss": -11.346016883850098, "global_step": 251761, "epoch": 1498} {"train_loss": -11.857040405273438, "global_step": 251762, "epoch": 1498} {"train_loss": -11.86479663848877, "global_step": 251763, "epoch": 1498} {"train_loss": -11.727254867553711, "global_step": 251764, "epoch": 1498} {"train_loss": -11.701921463012695, "global_step": 251765, "epoch": 1498} {"train_loss": -11.829276084899902, "global_step": 251766, "epoch": 1498} {"train_loss": -11.985977172851562, "global_step": 251767, "epoch": 1498} {"train_loss": -12.09107780456543, "global_step": 251768, "epoch": 1498} {"train_loss": -11.88461685180664, "global_step": 251769, "epoch": 1498} {"train_loss": -11.82077407836914, "global_step": 251770, "epoch": 1498} {"train_loss": -11.921289443969727, "global_step": 251771, "epoch": 1498} {"train_loss": -12.089780807495117, "global_step": 251772, "epoch": 1498} {"train_loss": -11.902478218078613, "global_step": 251773, "epoch": 1498} {"train_loss": -12.131103515625, "global_step": 251774, "epoch": 1498} {"train_loss": -11.853961944580078, "global_step": 251775, "epoch": 1498} {"train_loss": -12.171845436096191, "global_step": 251776, "epoch": 1498} {"train_loss": -11.668038368225098, "global_step": 251777, "epoch": 1498} {"train_loss": -11.929428100585938, "global_step": 251778, "epoch": 1498} {"train_loss": -11.718765258789062, "global_step": 251779, "epoch": 1498} {"train_loss": -11.946104049682617, "global_step": 251780, "epoch": 1498} {"train_loss": -11.743546485900879, "global_step": 251781, "epoch": 1498} {"train_loss": -11.932989120483398, "global_step": 251782, "epoch": 1498} {"train_loss": -11.938175201416016, "global_step": 251783, "epoch": 1498} {"train_loss": -12.063282012939453, "global_step": 251784, "epoch": 1498} {"train_loss": -12.159934997558594, "global_step": 251785, "epoch": 1498} {"train_loss": -11.865411758422852, "global_step": 251786, "epoch": 1498} {"train_loss": -12.03715705871582, "global_step": 251787, "epoch": 1498} {"train_loss": -11.822186470031738, "global_step": 251788, "epoch": 1498} {"train_loss": -11.906095504760742, "global_step": 251789, "epoch": 1498} {"train_loss": -11.785289764404297, "global_step": 251790, "epoch": 1498} {"train_loss": -12.103864669799805, "global_step": 251791, "epoch": 1498} {"train_loss": -12.106426239013672, "global_step": 251792, "epoch": 1498} {"train_loss": -12.012271881103516, "global_step": 251793, "epoch": 1498} {"train_loss": -11.84879207611084, "global_step": 251794, "epoch": 1498} {"train_loss": -11.571342468261719, "global_step": 251795, "epoch": 1498} {"train_loss": -11.800284385681152, "global_step": 251796, "epoch": 1498} {"train_loss": -11.975931167602539, "global_step": 251797, "epoch": 1498} {"train_loss": -11.381389617919922, "global_step": 251798, "epoch": 1498} {"train_loss": -11.769631385803223, "global_step": 251799, "epoch": 1498} {"train_loss": -11.509296417236328, "global_step": 251800, "epoch": 1498} {"train_loss": -11.670833587646484, "global_step": 251801, "epoch": 1498} {"train_loss": -11.768760681152344, "global_step": 251802, "epoch": 1498} {"train_loss": -11.396312713623047, "global_step": 251803, "epoch": 1498} {"train_loss": -11.199914932250977, "global_step": 251804, "epoch": 1498} {"train_loss": -10.527290344238281, "global_step": 251805, "epoch": 1498} {"train_loss": -11.393592834472656, "global_step": 251806, "epoch": 1498} {"train_loss": -11.184680938720703, "global_step": 251807, "epoch": 1498} {"train_loss": -11.750893592834473, "global_step": 251808, "epoch": 1498} {"train_loss": -11.245426177978516, "global_step": 251809, "epoch": 1498} {"train_loss": -11.516560554504395, "global_step": 251810, "epoch": 1498} {"train_loss": -11.680107116699219, "global_step": 251811, "epoch": 1498} {"train_loss": -11.449686050415039, "global_step": 251812, "epoch": 1498} {"train_loss": -11.653385162353516, "global_step": 251813, "epoch": 1498} {"train_loss": -12.054433822631836, "global_step": 251814, "epoch": 1498} {"train_loss": -11.862449645996094, "global_step": 251815, "epoch": 1498} {"train_loss": -11.966984748840332, "global_step": 251816, "epoch": 1498} {"train_loss": -11.619834899902344, "global_step": 251817, "epoch": 1498} {"train_loss": -11.686088562011719, "global_step": 251818, "epoch": 1498} {"train_loss": -12.088630676269531, "global_step": 251819, "epoch": 1498} {"train_loss": -11.535284042358398, "global_step": 251820, "epoch": 1498} {"train_loss": -11.170317649841309, "global_step": 251821, "epoch": 1498} {"train_loss": -11.306514739990234, "global_step": 251822, "epoch": 1498} {"train_loss": -11.210105895996094, "global_step": 251823, "epoch": 1498} {"train_loss": -11.262411117553711, "global_step": 251824, "epoch": 1498} {"train_loss": -11.9119234085083, "global_step": 251825, "epoch": 1498} {"train_loss": -11.458518981933594, "global_step": 251826, "epoch": 1498} {"train_loss": -11.625173568725586, "global_step": 251827, "epoch": 1498} {"train_loss": -11.514632225036621, "global_step": 251828, "epoch": 1498} {"train_loss": -10.821443557739258, "global_step": 251829, "epoch": 1498} {"train_loss": -11.973867416381836, "global_step": 251830, "epoch": 1498} {"train_loss": -11.672942030997504, "global_step": 251831, "epoch": 1498, "val_loss": 270570.53125} {"train_loss": -11.387065887451172, "global_step": 251832, "epoch": 1499} {"train_loss": -10.815896987915039, "global_step": 251833, "epoch": 1499} {"train_loss": -11.71597671508789, "global_step": 251834, "epoch": 1499} {"train_loss": -11.623292922973633, "global_step": 251835, "epoch": 1499} {"train_loss": -11.152360916137695, "global_step": 251836, "epoch": 1499} {"train_loss": -11.623063087463379, "global_step": 251837, "epoch": 1499} {"train_loss": -11.57192325592041, "global_step": 251838, "epoch": 1499} {"train_loss": -11.42074966430664, "global_step": 251839, "epoch": 1499} {"train_loss": -11.2532958984375, "global_step": 251840, "epoch": 1499} {"train_loss": -11.461616516113281, "global_step": 251841, "epoch": 1499} {"train_loss": -11.700428009033203, "global_step": 251842, "epoch": 1499} {"train_loss": -11.427597045898438, "global_step": 251843, "epoch": 1499} {"train_loss": -11.764196395874023, "global_step": 251844, "epoch": 1499} {"train_loss": -11.661956787109375, "global_step": 251845, "epoch": 1499} {"train_loss": -11.30812931060791, "global_step": 251846, "epoch": 1499} {"train_loss": -11.578956604003906, "global_step": 251847, "epoch": 1499} {"train_loss": -11.180169105529785, "global_step": 251848, "epoch": 1499} {"train_loss": -10.902774810791016, "global_step": 251849, "epoch": 1499} {"train_loss": -11.821861267089844, "global_step": 251850, "epoch": 1499} {"train_loss": -11.111162185668945, "global_step": 251851, "epoch": 1499} {"train_loss": -11.201358795166016, "global_step": 251852, "epoch": 1499} {"train_loss": -10.354076385498047, "global_step": 251853, "epoch": 1499} {"train_loss": -11.258953094482422, "global_step": 251854, "epoch": 1499} {"train_loss": -9.874077796936035, "global_step": 251855, "epoch": 1499} {"train_loss": -9.971420288085938, "global_step": 251856, "epoch": 1499} {"train_loss": -9.987019538879395, "global_step": 251857, "epoch": 1499} {"train_loss": -9.765714645385742, "global_step": 251858, "epoch": 1499} {"train_loss": -9.98127269744873, "global_step": 251859, "epoch": 1499} {"train_loss": -9.850215911865234, "global_step": 251860, "epoch": 1499} {"train_loss": -10.031291961669922, "global_step": 251861, "epoch": 1499} {"train_loss": -9.812681198120117, "global_step": 251862, "epoch": 1499} {"train_loss": -10.512187957763672, "global_step": 251863, "epoch": 1499} {"train_loss": -10.561599731445312, "global_step": 251864, "epoch": 1499} {"train_loss": -10.239871978759766, "global_step": 251865, "epoch": 1499} {"train_loss": -11.499539375305176, "global_step": 251866, "epoch": 1499} {"train_loss": -9.962193489074707, "global_step": 251867, "epoch": 1499} {"train_loss": -10.961721420288086, "global_step": 251868, "epoch": 1499} {"train_loss": -10.209585189819336, "global_step": 251869, "epoch": 1499} {"train_loss": -10.454763412475586, "global_step": 251870, "epoch": 1499} {"train_loss": -10.963025093078613, "global_step": 251871, "epoch": 1499} {"train_loss": -10.585948944091797, "global_step": 251872, "epoch": 1499} {"train_loss": -11.508682250976562, "global_step": 251873, "epoch": 1499} {"train_loss": -11.036011695861816, "global_step": 251874, "epoch": 1499} {"train_loss": -11.411884307861328, "global_step": 251875, "epoch": 1499} {"train_loss": -11.081840515136719, "global_step": 251876, "epoch": 1499} {"train_loss": -11.157907485961914, "global_step": 251877, "epoch": 1499} {"train_loss": -11.049173355102539, "global_step": 251878, "epoch": 1499} {"train_loss": -11.150520324707031, "global_step": 251879, "epoch": 1499} {"train_loss": -11.060466766357422, "global_step": 251880, "epoch": 1499} {"train_loss": -11.169164657592773, "global_step": 251881, "epoch": 1499} {"train_loss": -11.551258087158203, "global_step": 251882, "epoch": 1499} {"train_loss": -11.233528137207031, "global_step": 251883, "epoch": 1499} {"train_loss": -11.549751281738281, "global_step": 251884, "epoch": 1499} {"train_loss": -11.6721773147583, "global_step": 251885, "epoch": 1499} {"train_loss": -11.392351150512695, "global_step": 251886, "epoch": 1499} {"train_loss": -11.827262878417969, "global_step": 251887, "epoch": 1499} {"train_loss": -11.167638778686523, "global_step": 251888, "epoch": 1499} {"train_loss": -11.619905471801758, "global_step": 251889, "epoch": 1499} {"train_loss": -11.534965515136719, "global_step": 251890, "epoch": 1499} {"train_loss": -11.44237995147705, "global_step": 251891, "epoch": 1499} {"train_loss": -11.710260391235352, "global_step": 251892, "epoch": 1499} {"train_loss": -11.603876113891602, "global_step": 251893, "epoch": 1499} {"train_loss": -11.767593383789062, "global_step": 251894, "epoch": 1499} {"train_loss": -11.535407066345215, "global_step": 251895, "epoch": 1499} {"train_loss": -11.679375648498535, "global_step": 251896, "epoch": 1499} {"train_loss": -11.508516311645508, "global_step": 251897, "epoch": 1499} {"train_loss": -11.914214134216309, "global_step": 251898, "epoch": 1499} {"train_loss": -11.693498611450195, "global_step": 251899, "epoch": 1499} {"train_loss": -11.617834091186523, "global_step": 251900, "epoch": 1499} {"train_loss": -11.720069885253906, "global_step": 251901, "epoch": 1499} {"train_loss": -11.599102020263672, "global_step": 251902, "epoch": 1499} {"train_loss": -11.750310897827148, "global_step": 251903, "epoch": 1499} {"train_loss": -11.649763107299805, "global_step": 251904, "epoch": 1499} {"train_loss": -11.94123649597168, "global_step": 251905, "epoch": 1499} {"train_loss": -11.981854438781738, "global_step": 251906, "epoch": 1499} {"train_loss": -11.702232360839844, "global_step": 251907, "epoch": 1499} {"train_loss": -11.729595184326172, "global_step": 251908, "epoch": 1499} {"train_loss": -11.602685928344727, "global_step": 251909, "epoch": 1499} {"train_loss": -11.818841934204102, "global_step": 251910, "epoch": 1499} {"train_loss": -11.707992553710938, "global_step": 251911, "epoch": 1499} {"train_loss": -11.710310935974121, "global_step": 251912, "epoch": 1499} {"train_loss": -11.720739364624023, "global_step": 251913, "epoch": 1499} {"train_loss": -11.972883224487305, "global_step": 251914, "epoch": 1499} {"train_loss": -11.80984115600586, "global_step": 251915, "epoch": 1499} {"train_loss": -11.973797798156738, "global_step": 251916, "epoch": 1499} {"train_loss": -11.658685684204102, "global_step": 251917, "epoch": 1499} {"train_loss": -11.832918167114258, "global_step": 251918, "epoch": 1499} {"train_loss": -11.9646635055542, "global_step": 251919, "epoch": 1499} {"train_loss": -11.960630416870117, "global_step": 251920, "epoch": 1499} {"train_loss": -11.824725151062012, "global_step": 251921, "epoch": 1499} {"train_loss": -11.812578201293945, "global_step": 251922, "epoch": 1499} {"train_loss": -12.000728607177734, "global_step": 251923, "epoch": 1499} {"train_loss": -11.990350723266602, "global_step": 251924, "epoch": 1499} {"train_loss": -11.7621488571167, "global_step": 251925, "epoch": 1499} {"train_loss": -12.076919555664062, "global_step": 251926, "epoch": 1499} {"train_loss": -12.185322761535645, "global_step": 251927, "epoch": 1499} {"train_loss": -11.98493766784668, "global_step": 251928, "epoch": 1499} {"train_loss": -12.174436569213867, "global_step": 251929, "epoch": 1499} {"train_loss": -12.036301612854004, "global_step": 251930, "epoch": 1499} {"train_loss": -12.068499565124512, "global_step": 251931, "epoch": 1499} {"train_loss": -11.92751407623291, "global_step": 251932, "epoch": 1499} {"train_loss": -11.708932876586914, "global_step": 251933, "epoch": 1499} {"train_loss": -11.92539119720459, "global_step": 251934, "epoch": 1499} {"train_loss": -12.099505424499512, "global_step": 251935, "epoch": 1499} {"train_loss": -11.809247970581055, "global_step": 251936, "epoch": 1499} {"train_loss": -12.272104263305664, "global_step": 251937, "epoch": 1499} {"train_loss": -11.841904640197754, "global_step": 251938, "epoch": 1499} {"train_loss": -12.051958084106445, "global_step": 251939, "epoch": 1499} {"train_loss": -12.032726287841797, "global_step": 251940, "epoch": 1499} {"train_loss": -12.039555549621582, "global_step": 251941, "epoch": 1499} {"train_loss": -12.296345710754395, "global_step": 251942, "epoch": 1499} {"train_loss": -12.162920951843262, "global_step": 251943, "epoch": 1499} {"train_loss": -12.140632629394531, "global_step": 251944, "epoch": 1499} {"train_loss": -11.768468856811523, "global_step": 251945, "epoch": 1499} {"train_loss": -12.190755844116211, "global_step": 251946, "epoch": 1499} {"train_loss": -11.951898574829102, "global_step": 251947, "epoch": 1499} {"train_loss": -11.839900970458984, "global_step": 251948, "epoch": 1499} {"train_loss": -11.990455627441406, "global_step": 251949, "epoch": 1499} {"train_loss": -12.046798706054688, "global_step": 251950, "epoch": 1499} {"train_loss": -11.864317893981934, "global_step": 251951, "epoch": 1499} {"train_loss": -12.12582778930664, "global_step": 251952, "epoch": 1499} {"train_loss": -12.091736793518066, "global_step": 251953, "epoch": 1499} {"train_loss": -12.147842407226562, "global_step": 251954, "epoch": 1499} {"train_loss": -12.022933959960938, "global_step": 251955, "epoch": 1499} {"train_loss": -12.065237998962402, "global_step": 251956, "epoch": 1499} {"train_loss": -12.210076332092285, "global_step": 251957, "epoch": 1499} {"train_loss": -11.778802871704102, "global_step": 251958, "epoch": 1499} {"train_loss": -11.877888679504395, "global_step": 251959, "epoch": 1499} {"train_loss": -12.248116493225098, "global_step": 251960, "epoch": 1499} {"train_loss": -11.84138011932373, "global_step": 251961, "epoch": 1499} {"train_loss": -12.004453659057617, "global_step": 251962, "epoch": 1499} {"train_loss": -11.80976676940918, "global_step": 251963, "epoch": 1499} {"train_loss": -11.56406307220459, "global_step": 251964, "epoch": 1499} {"train_loss": -12.202507972717285, "global_step": 251965, "epoch": 1499} {"train_loss": -11.300213813781738, "global_step": 251966, "epoch": 1499} {"train_loss": -11.127471923828125, "global_step": 251967, "epoch": 1499} {"train_loss": -12.104425430297852, "global_step": 251968, "epoch": 1499} {"train_loss": -11.173721313476562, "global_step": 251969, "epoch": 1499} {"train_loss": -12.099693298339844, "global_step": 251970, "epoch": 1499} {"train_loss": -11.49028205871582, "global_step": 251971, "epoch": 1499} {"train_loss": -10.820907592773438, "global_step": 251972, "epoch": 1499} {"train_loss": -11.54481315612793, "global_step": 251973, "epoch": 1499} {"train_loss": -10.550354957580566, "global_step": 251974, "epoch": 1499} {"train_loss": -11.178481101989746, "global_step": 251975, "epoch": 1499} {"train_loss": -11.534341812133789, "global_step": 251976, "epoch": 1499} {"train_loss": -10.417811393737793, "global_step": 251977, "epoch": 1499} {"train_loss": -11.557291030883789, "global_step": 251978, "epoch": 1499} {"train_loss": -10.29881477355957, "global_step": 251979, "epoch": 1499} {"train_loss": -9.00343132019043, "global_step": 251980, "epoch": 1499} {"train_loss": -10.040063858032227, "global_step": 251981, "epoch": 1499} {"train_loss": -8.615608215332031, "global_step": 251982, "epoch": 1499} {"train_loss": -9.808504104614258, "global_step": 251983, "epoch": 1499} {"train_loss": -10.074542999267578, "global_step": 251984, "epoch": 1499} {"train_loss": -9.226436614990234, "global_step": 251985, "epoch": 1499} {"train_loss": -9.251825332641602, "global_step": 251986, "epoch": 1499} {"train_loss": -9.700315475463867, "global_step": 251987, "epoch": 1499} {"train_loss": -10.47578239440918, "global_step": 251988, "epoch": 1499} {"train_loss": -8.565333366394043, "global_step": 251989, "epoch": 1499} {"train_loss": -9.598196983337402, "global_step": 251990, "epoch": 1499} {"train_loss": -10.212810516357422, "global_step": 251991, "epoch": 1499} {"train_loss": -10.038372039794922, "global_step": 251992, "epoch": 1499} {"train_loss": -9.689160346984863, "global_step": 251993, "epoch": 1499} {"train_loss": -10.338818550109863, "global_step": 251994, "epoch": 1499} {"train_loss": -10.625877380371094, "global_step": 251995, "epoch": 1499} {"train_loss": -10.991458892822266, "global_step": 251996, "epoch": 1499} {"train_loss": -10.660726547241211, "global_step": 251997, "epoch": 1499} {"train_loss": -11.309008598327637, "global_step": 251998, "epoch": 1499} {"train_loss": -11.303602610315595, "global_step": 251999, "epoch": 1499, "val_loss": 262236.03125} {"train_loss": -10.645612716674805, "global_step": 252000, "epoch": 1500} {"train_loss": -11.281294822692871, "global_step": 252001, "epoch": 1500} {"train_loss": -10.720073699951172, "global_step": 252002, "epoch": 1500} {"train_loss": -10.950355529785156, "global_step": 252003, "epoch": 1500} {"train_loss": -11.232397079467773, "global_step": 252004, "epoch": 1500} {"train_loss": -10.992555618286133, "global_step": 252005, "epoch": 1500} {"train_loss": -10.993501663208008, "global_step": 252006, "epoch": 1500} {"train_loss": -11.175800323486328, "global_step": 252007, "epoch": 1500} {"train_loss": -10.930755615234375, "global_step": 252008, "epoch": 1500} {"train_loss": -11.177050590515137, "global_step": 252009, "epoch": 1500} {"train_loss": -11.33792495727539, "global_step": 252010, "epoch": 1500} {"train_loss": -11.48625373840332, "global_step": 252011, "epoch": 1500} {"train_loss": -11.527839660644531, "global_step": 252012, "epoch": 1500} {"train_loss": -11.526540756225586, "global_step": 252013, "epoch": 1500} {"train_loss": -11.424829483032227, "global_step": 252014, "epoch": 1500} {"train_loss": -11.507293701171875, "global_step": 252015, "epoch": 1500} {"train_loss": -11.303329467773438, "global_step": 252016, "epoch": 1500} {"train_loss": -11.381567001342773, "global_step": 252017, "epoch": 1500} {"train_loss": -11.667257308959961, "global_step": 252018, "epoch": 1500} {"train_loss": -11.503822326660156, "global_step": 252019, "epoch": 1500} {"train_loss": -11.82502555847168, "global_step": 252020, "epoch": 1500} {"train_loss": -11.464545249938965, "global_step": 252021, "epoch": 1500} {"train_loss": -11.721169471740723, "global_step": 252022, "epoch": 1500} {"train_loss": -11.552894592285156, "global_step": 252023, "epoch": 1500} {"train_loss": -11.7888822555542, "global_step": 252024, "epoch": 1500} {"train_loss": -11.873566627502441, "global_step": 252025, "epoch": 1500} {"train_loss": -11.551817893981934, "global_step": 252026, "epoch": 1500} {"train_loss": -11.677675247192383, "global_step": 252027, "epoch": 1500} {"train_loss": -11.63571548461914, "global_step": 252028, "epoch": 1500} {"train_loss": -11.84752082824707, "global_step": 252029, "epoch": 1500} {"train_loss": -11.565462112426758, "global_step": 252030, "epoch": 1500} {"train_loss": -11.699871063232422, "global_step": 252031, "epoch": 1500} {"train_loss": -11.615935325622559, "global_step": 252032, "epoch": 1500} {"train_loss": -11.864867210388184, "global_step": 252033, "epoch": 1500} {"train_loss": -11.923418045043945, "global_step": 252034, "epoch": 1500} {"train_loss": -11.8614501953125, "global_step": 252035, "epoch": 1500} {"train_loss": -11.869958877563477, "global_step": 252036, "epoch": 1500} {"train_loss": -11.810564041137695, "global_step": 252037, "epoch": 1500} {"train_loss": -11.864727020263672, "global_step": 252038, "epoch": 1500} {"train_loss": -11.679062843322754, "global_step": 252039, "epoch": 1500} {"train_loss": -11.760272979736328, "global_step": 252040, "epoch": 1500} {"train_loss": -11.721555709838867, "global_step": 252041, "epoch": 1500} {"train_loss": -11.822508811950684, "global_step": 252042, "epoch": 1500} {"train_loss": -11.709880828857422, "global_step": 252043, "epoch": 1500} {"train_loss": -11.897783279418945, "global_step": 252044, "epoch": 1500} {"train_loss": -11.941913604736328, "global_step": 252045, "epoch": 1500} {"train_loss": -11.775430679321289, "global_step": 252046, "epoch": 1500} {"train_loss": -12.191301345825195, "global_step": 252047, "epoch": 1500} {"train_loss": -11.808427810668945, "global_step": 252048, "epoch": 1500} {"train_loss": -12.013158798217773, "global_step": 252049, "epoch": 1500} {"train_loss": -12.014698028564453, "global_step": 252050, "epoch": 1500} {"train_loss": -11.938541412353516, "global_step": 252051, "epoch": 1500} {"train_loss": -12.107172012329102, "global_step": 252052, "epoch": 1500} {"train_loss": -11.797332763671875, "global_step": 252053, "epoch": 1500} {"train_loss": -11.881892204284668, "global_step": 252054, "epoch": 1500} {"train_loss": -11.964727401733398, "global_step": 252055, "epoch": 1500} {"train_loss": -11.884199142456055, "global_step": 252056, "epoch": 1500} {"train_loss": -12.061861038208008, "global_step": 252057, "epoch": 1500} {"train_loss": -12.194246292114258, "global_step": 252058, "epoch": 1500} {"train_loss": -12.039377212524414, "global_step": 252059, "epoch": 1500} {"train_loss": -11.966890335083008, "global_step": 252060, "epoch": 1500} {"train_loss": -12.063441276550293, "global_step": 252061, "epoch": 1500} {"train_loss": -11.883964538574219, "global_step": 252062, "epoch": 1500} {"train_loss": -11.967756271362305, "global_step": 252063, "epoch": 1500} {"train_loss": -12.090622901916504, "global_step": 252064, "epoch": 1500} {"train_loss": -11.945215225219727, "global_step": 252065, "epoch": 1500} {"train_loss": -11.87480354309082, "global_step": 252066, "epoch": 1500} {"train_loss": -11.957420349121094, "global_step": 252067, "epoch": 1500} {"train_loss": -12.01573371887207, "global_step": 252068, "epoch": 1500} {"train_loss": -11.905052185058594, "global_step": 252069, "epoch": 1500} {"train_loss": -11.961346626281738, "global_step": 252070, "epoch": 1500} {"train_loss": -12.212265014648438, "global_step": 252071, "epoch": 1500} {"train_loss": -11.945905685424805, "global_step": 252072, "epoch": 1500} {"train_loss": -12.307686805725098, "global_step": 252073, "epoch": 1500} {"train_loss": -11.903556823730469, "global_step": 252074, "epoch": 1500} {"train_loss": -11.768684387207031, "global_step": 252075, "epoch": 1500} {"train_loss": -11.732337951660156, "global_step": 252076, "epoch": 1500} {"train_loss": -12.135335922241211, "global_step": 252077, "epoch": 1500} {"train_loss": -12.149066925048828, "global_step": 252078, "epoch": 1500} {"train_loss": -11.696817398071289, "global_step": 252079, "epoch": 1500} {"train_loss": -11.657020568847656, "global_step": 252080, "epoch": 1500} {"train_loss": -12.057869911193848, "global_step": 252081, "epoch": 1500} {"train_loss": -11.878532409667969, "global_step": 252082, "epoch": 1500} {"train_loss": -11.378911018371582, "global_step": 252083, "epoch": 1500} {"train_loss": -11.237846374511719, "global_step": 252084, "epoch": 1500} {"train_loss": -11.60792350769043, "global_step": 252085, "epoch": 1500} {"train_loss": -11.884498596191406, "global_step": 252086, "epoch": 1500} {"train_loss": -11.117410659790039, "global_step": 252087, "epoch": 1500} {"train_loss": -11.1292724609375, "global_step": 252088, "epoch": 1500} {"train_loss": -11.510971069335938, "global_step": 252089, "epoch": 1500} {"train_loss": -11.807523727416992, "global_step": 252090, "epoch": 1500} {"train_loss": -11.626596450805664, "global_step": 252091, "epoch": 1500} {"train_loss": -11.393264770507812, "global_step": 252092, "epoch": 1500} {"train_loss": -11.569644927978516, "global_step": 252093, "epoch": 1500} {"train_loss": -11.154050827026367, "global_step": 252094, "epoch": 1500} {"train_loss": -9.955400466918945, "global_step": 252095, "epoch": 1500} {"train_loss": -11.44862174987793, "global_step": 252096, "epoch": 1500} {"train_loss": -11.523782730102539, "global_step": 252097, "epoch": 1500} {"train_loss": -10.656103134155273, "global_step": 252098, "epoch": 1500} {"train_loss": -11.252374649047852, "global_step": 252099, "epoch": 1500} {"train_loss": -11.21905517578125, "global_step": 252100, "epoch": 1500} {"train_loss": -10.991779327392578, "global_step": 252101, "epoch": 1500} {"train_loss": -11.647754669189453, "global_step": 252102, "epoch": 1500} {"train_loss": -10.857733726501465, "global_step": 252103, "epoch": 1500} {"train_loss": -10.661664009094238, "global_step": 252104, "epoch": 1500} {"train_loss": -11.939126968383789, "global_step": 252105, "epoch": 1500} {"train_loss": -11.044938087463379, "global_step": 252106, "epoch": 1500} {"train_loss": -11.63978099822998, "global_step": 252107, "epoch": 1500} {"train_loss": -11.156302452087402, "global_step": 252108, "epoch": 1500} {"train_loss": -11.704020500183105, "global_step": 252109, "epoch": 1500} {"train_loss": -11.33496379852295, "global_step": 252110, "epoch": 1500} {"train_loss": -11.031339645385742, "global_step": 252111, "epoch": 1500} {"train_loss": -11.53283405303955, "global_step": 252112, "epoch": 1500} {"train_loss": -11.740823745727539, "global_step": 252113, "epoch": 1500} {"train_loss": -11.475115776062012, "global_step": 252114, "epoch": 1500} {"train_loss": -11.668318748474121, "global_step": 252115, "epoch": 1500} {"train_loss": -11.130681991577148, "global_step": 252116, "epoch": 1500} {"train_loss": -11.794904708862305, "global_step": 252117, "epoch": 1500} {"train_loss": -11.216373443603516, "global_step": 252118, "epoch": 1500} {"train_loss": -11.440896987915039, "global_step": 252119, "epoch": 1500} {"train_loss": -11.4796724319458, "global_step": 252120, "epoch": 1500} {"train_loss": -11.247344970703125, "global_step": 252121, "epoch": 1500} {"train_loss": -11.068170547485352, "global_step": 252122, "epoch": 1500} {"train_loss": -10.477794647216797, "global_step": 252123, "epoch": 1500} {"train_loss": -11.19215202331543, "global_step": 252124, "epoch": 1500} {"train_loss": -11.709193229675293, "global_step": 252125, "epoch": 1500} {"train_loss": -10.706464767456055, "global_step": 252126, "epoch": 1500} {"train_loss": -11.891827583312988, "global_step": 252127, "epoch": 1500} {"train_loss": -11.340362548828125, "global_step": 252128, "epoch": 1500} {"train_loss": -11.418170928955078, "global_step": 252129, "epoch": 1500} {"train_loss": -11.314876556396484, "global_step": 252130, "epoch": 1500} {"train_loss": -11.55179500579834, "global_step": 252131, "epoch": 1500} {"train_loss": -11.330257415771484, "global_step": 252132, "epoch": 1500} {"train_loss": -11.513237953186035, "global_step": 252133, "epoch": 1500} {"train_loss": -11.839933395385742, "global_step": 252134, "epoch": 1500} {"train_loss": -11.61716079711914, "global_step": 252135, "epoch": 1500} {"train_loss": -11.729715347290039, "global_step": 252136, "epoch": 1500} {"train_loss": -11.934240341186523, "global_step": 252137, "epoch": 1500} {"train_loss": -11.559473037719727, "global_step": 252138, "epoch": 1500} {"train_loss": -11.883934020996094, "global_step": 252139, "epoch": 1500} {"train_loss": -11.510005950927734, "global_step": 252140, "epoch": 1500} {"train_loss": -11.790489196777344, "global_step": 252141, "epoch": 1500} {"train_loss": -11.748625755310059, "global_step": 252142, "epoch": 1500} {"train_loss": -11.737627029418945, "global_step": 252143, "epoch": 1500} {"train_loss": -11.522607803344727, "global_step": 252144, "epoch": 1500} {"train_loss": -11.815954208374023, "global_step": 252145, "epoch": 1500} {"train_loss": -11.8212890625, "global_step": 252146, "epoch": 1500} {"train_loss": -11.678284645080566, "global_step": 252147, "epoch": 1500} {"train_loss": -11.91472339630127, "global_step": 252148, "epoch": 1500} {"train_loss": -11.846879005432129, "global_step": 252149, "epoch": 1500} {"train_loss": -11.415886878967285, "global_step": 252150, "epoch": 1500} {"train_loss": -12.179861068725586, "global_step": 252151, "epoch": 1500} {"train_loss": -11.863089561462402, "global_step": 252152, "epoch": 1500} {"train_loss": -12.115687370300293, "global_step": 252153, "epoch": 1500} {"train_loss": -11.800972938537598, "global_step": 252154, "epoch": 1500} {"train_loss": -11.62130355834961, "global_step": 252155, "epoch": 1500} {"train_loss": -12.160806655883789, "global_step": 252156, "epoch": 1500} {"train_loss": -11.596735954284668, "global_step": 252157, "epoch": 1500} {"train_loss": -12.005311965942383, "global_step": 252158, "epoch": 1500} {"train_loss": -11.644065856933594, "global_step": 252159, "epoch": 1500} {"train_loss": -12.054085731506348, "global_step": 252160, "epoch": 1500} {"train_loss": -11.765449523925781, "global_step": 252161, "epoch": 1500} {"train_loss": -12.064957618713379, "global_step": 252162, "epoch": 1500} {"train_loss": -12.018579483032227, "global_step": 252163, "epoch": 1500} {"train_loss": -12.021551132202148, "global_step": 252164, "epoch": 1500} {"train_loss": -12.121070861816406, "global_step": 252165, "epoch": 1500} {"train_loss": -12.074270248413086, "global_step": 252166, "epoch": 1500} {"train_loss": -11.626223200843448, "global_step": 252167, "epoch": 1500, "train/sim_max_reward_0": 0.7177687466662198, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.4976020191277812, "train/sim_max_reward_4": 0.987033123946365, "train/sim_max_reward_5": 0.5183390441188471, "test/sim_max_reward_4400000": 0.9950876462620839, "test/sim_max_reward_4400001": 0.38249255565730816, "test/sim_max_reward_4400002": 0.07056412608905997, "test/sim_max_reward_4400003": 0.4155082310886485, "test/sim_max_reward_4400004": 0.7910897066096888, "test/sim_max_reward_4400005": 0.5837596825898794, "test/sim_max_reward_4400006": 0.30916211410043626, "test/sim_max_reward_4400007": 0.20555664575716803, "test/sim_max_reward_4400008": 0.576559439495268, "test/sim_max_reward_4400009": 0.03013808849954545, "test/sim_max_reward_4400010": 0.995307995639187, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 0.3821287325075888, "test/sim_max_reward_4400013": 0.9587609417936422, "test/sim_max_reward_4400014": 0.6405144243998816, "test/sim_max_reward_4400015": 0.7052250232519135, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.5430194781814487, "test/sim_max_reward_4400019": 0.3920701866110206, "test/sim_max_reward_4400020": 0.5243065007293929, "test/sim_max_reward_4400021": 0.7031959849396547, "test/sim_max_reward_4400022": 0.9732819643497097, "test/sim_max_reward_4400023": 0.15532535220228016, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.5100154688449344, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.6038066077764341, "test/sim_max_reward_4400028": 0.7090556912805808, "test/sim_max_reward_4400029": 1.0, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9906987213440626, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9715103847099341, "test/sim_max_reward_4400034": 0.9475444235402762, "test/sim_max_reward_4400035": 0.9951115580744818, "test/sim_max_reward_4400036": 0.37639999096504373, "test/sim_max_reward_4400037": 0.9877200352708538, "test/sim_max_reward_4400038": 0.31865382581083274, "test/sim_max_reward_4400039": 0.9986085072725386, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.17244611278502464, "test/sim_max_reward_4400042": 0.7865830420411059, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.9867840513015307, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.9790087220185268, "test/sim_max_reward_4400047": 0.991230869742285, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.620123822309869, "test/mean_score": 0.5751307896070978, "val_loss": 271162.625, "train_action_mse_error": 2.0494844913482666} {"train_loss": -11.827119827270508, "global_step": 252168, "epoch": 1501} {"train_loss": -11.802112579345703, "global_step": 252169, "epoch": 1501} {"train_loss": -11.728983879089355, "global_step": 252170, "epoch": 1501} {"train_loss": -11.777520179748535, "global_step": 252171, "epoch": 1501} {"train_loss": -11.45433521270752, "global_step": 252172, "epoch": 1501} {"train_loss": -11.713396072387695, "global_step": 252173, "epoch": 1501} {"train_loss": -12.032753944396973, "global_step": 252174, "epoch": 1501} {"train_loss": -11.614004135131836, "global_step": 252175, "epoch": 1501} {"train_loss": -11.855817794799805, "global_step": 252176, "epoch": 1501} {"train_loss": -11.768665313720703, "global_step": 252177, "epoch": 1501} {"train_loss": -11.47392463684082, "global_step": 252178, "epoch": 1501} {"train_loss": -11.463603973388672, "global_step": 252179, "epoch": 1501} {"train_loss": -11.979397773742676, "global_step": 252180, "epoch": 1501} {"train_loss": -11.856881141662598, "global_step": 252181, "epoch": 1501} {"train_loss": -11.577439308166504, "global_step": 252182, "epoch": 1501} {"train_loss": -11.994749069213867, "global_step": 252183, "epoch": 1501} {"train_loss": -11.786147117614746, "global_step": 252184, "epoch": 1501} {"train_loss": -11.902826309204102, "global_step": 252185, "epoch": 1501} {"train_loss": -11.960710525512695, "global_step": 252186, "epoch": 1501} {"train_loss": -11.722938537597656, "global_step": 252187, "epoch": 1501} {"train_loss": -12.165562629699707, "global_step": 252188, "epoch": 1501} {"train_loss": -11.478334426879883, "global_step": 252189, "epoch": 1501} {"train_loss": -11.610179901123047, "global_step": 252190, "epoch": 1501} {"train_loss": -11.981313705444336, "global_step": 252191, "epoch": 1501} {"train_loss": -10.521717071533203, "global_step": 252192, "epoch": 1501} {"train_loss": -11.28852653503418, "global_step": 252193, "epoch": 1501} {"train_loss": -11.057584762573242, "global_step": 252194, "epoch": 1501} {"train_loss": -11.64572811126709, "global_step": 252195, "epoch": 1501} {"train_loss": -11.81344985961914, "global_step": 252196, "epoch": 1501} {"train_loss": -11.518041610717773, "global_step": 252197, "epoch": 1501} {"train_loss": -11.447992324829102, "global_step": 252198, "epoch": 1501} {"train_loss": -11.352441787719727, "global_step": 252199, "epoch": 1501} {"train_loss": -11.846662521362305, "global_step": 252200, "epoch": 1501} {"train_loss": -11.636885643005371, "global_step": 252201, "epoch": 1501} {"train_loss": -11.739781379699707, "global_step": 252202, "epoch": 1501} {"train_loss": -12.03370475769043, "global_step": 252203, "epoch": 1501} {"train_loss": -11.542825698852539, "global_step": 252204, "epoch": 1501} {"train_loss": -11.538454055786133, "global_step": 252205, "epoch": 1501} {"train_loss": -12.101703643798828, "global_step": 252206, "epoch": 1501} {"train_loss": -11.211006164550781, "global_step": 252207, "epoch": 1501} {"train_loss": -11.728853225708008, "global_step": 252208, "epoch": 1501} {"train_loss": -12.030511856079102, "global_step": 252209, "epoch": 1501} {"train_loss": -11.831296920776367, "global_step": 252210, "epoch": 1501} {"train_loss": -11.777231216430664, "global_step": 252211, "epoch": 1501} {"train_loss": -12.003341674804688, "global_step": 252212, "epoch": 1501} {"train_loss": -11.748594284057617, "global_step": 252213, "epoch": 1501} {"train_loss": -11.755491256713867, "global_step": 252214, "epoch": 1501} {"train_loss": -11.976420402526855, "global_step": 252215, "epoch": 1501} {"train_loss": -11.457662582397461, "global_step": 252216, "epoch": 1501} {"train_loss": -11.806102752685547, "global_step": 252217, "epoch": 1501} {"train_loss": -11.338578224182129, "global_step": 252218, "epoch": 1501} {"train_loss": -11.727170944213867, "global_step": 252219, "epoch": 1501} {"train_loss": -11.33197021484375, "global_step": 252220, "epoch": 1501} {"train_loss": -11.810537338256836, "global_step": 252221, "epoch": 1501} {"train_loss": -11.834335327148438, "global_step": 252222, "epoch": 1501} {"train_loss": -11.730329513549805, "global_step": 252223, "epoch": 1501} {"train_loss": -11.658699989318848, "global_step": 252224, "epoch": 1501} {"train_loss": -11.807121276855469, "global_step": 252225, "epoch": 1501} {"train_loss": -11.6282320022583, "global_step": 252226, "epoch": 1501} {"train_loss": -11.644349098205566, "global_step": 252227, "epoch": 1501} {"train_loss": -11.739361763000488, "global_step": 252228, "epoch": 1501} {"train_loss": -11.784219741821289, "global_step": 252229, "epoch": 1501} {"train_loss": -11.510078430175781, "global_step": 252230, "epoch": 1501} {"train_loss": -11.382486343383789, "global_step": 252231, "epoch": 1501} {"train_loss": -11.31112289428711, "global_step": 252232, "epoch": 1501} {"train_loss": -11.798320770263672, "global_step": 252233, "epoch": 1501} {"train_loss": -11.620985984802246, "global_step": 252234, "epoch": 1501} {"train_loss": -11.534248352050781, "global_step": 252235, "epoch": 1501} {"train_loss": -12.044339179992676, "global_step": 252236, "epoch": 1501} {"train_loss": -10.979015350341797, "global_step": 252237, "epoch": 1501} {"train_loss": -11.170393943786621, "global_step": 252238, "epoch": 1501} {"train_loss": -11.519253730773926, "global_step": 252239, "epoch": 1501} {"train_loss": -11.823314666748047, "global_step": 252240, "epoch": 1501} {"train_loss": -11.398687362670898, "global_step": 252241, "epoch": 1501} {"train_loss": -11.507508277893066, "global_step": 252242, "epoch": 1501} {"train_loss": -10.941719055175781, "global_step": 252243, "epoch": 1501} {"train_loss": -11.09842300415039, "global_step": 252244, "epoch": 1501} {"train_loss": -9.701593399047852, "global_step": 252245, "epoch": 1501} {"train_loss": -11.166543960571289, "global_step": 252246, "epoch": 1501} {"train_loss": -9.177375793457031, "global_step": 252247, "epoch": 1501} {"train_loss": -9.39219856262207, "global_step": 252248, "epoch": 1501} {"train_loss": -8.735184669494629, "global_step": 252249, "epoch": 1501} {"train_loss": -9.245155334472656, "global_step": 252250, "epoch": 1501} {"train_loss": -8.508554458618164, "global_step": 252251, "epoch": 1501} {"train_loss": -10.452300071716309, "global_step": 252252, "epoch": 1501} {"train_loss": -8.996770858764648, "global_step": 252253, "epoch": 1501} {"train_loss": -7.406663417816162, "global_step": 252254, "epoch": 1501} {"train_loss": -8.537086486816406, "global_step": 252255, "epoch": 1501} {"train_loss": -10.220491409301758, "global_step": 252256, "epoch": 1501} {"train_loss": -10.316518783569336, "global_step": 252257, "epoch": 1501} {"train_loss": -8.6300687789917, "global_step": 252258, "epoch": 1501} {"train_loss": -9.394697189331055, "global_step": 252259, "epoch": 1501} {"train_loss": -9.362096786499023, "global_step": 252260, "epoch": 1501} {"train_loss": -11.212299346923828, "global_step": 252261, "epoch": 1501} {"train_loss": -9.633256912231445, "global_step": 252262, "epoch": 1501} {"train_loss": -10.190969467163086, "global_step": 252263, "epoch": 1501} {"train_loss": -10.64574146270752, "global_step": 252264, "epoch": 1501} {"train_loss": -10.432796478271484, "global_step": 252265, "epoch": 1501} {"train_loss": -10.786760330200195, "global_step": 252266, "epoch": 1501} {"train_loss": -10.734355926513672, "global_step": 252267, "epoch": 1501} {"train_loss": -10.653486251831055, "global_step": 252268, "epoch": 1501} {"train_loss": -10.711002349853516, "global_step": 252269, "epoch": 1501} {"train_loss": -11.428821563720703, "global_step": 252270, "epoch": 1501} {"train_loss": -11.118128776550293, "global_step": 252271, "epoch": 1501} {"train_loss": -10.910720825195312, "global_step": 252272, "epoch": 1501} {"train_loss": -11.642024993896484, "global_step": 252273, "epoch": 1501} {"train_loss": -11.088224411010742, "global_step": 252274, "epoch": 1501} {"train_loss": -11.104406356811523, "global_step": 252275, "epoch": 1501} {"train_loss": -11.307479858398438, "global_step": 252276, "epoch": 1501} {"train_loss": -11.150957107543945, "global_step": 252277, "epoch": 1501} {"train_loss": -11.392047882080078, "global_step": 252278, "epoch": 1501} {"train_loss": -11.182488441467285, "global_step": 252279, "epoch": 1501} {"train_loss": -11.246662139892578, "global_step": 252280, "epoch": 1501} {"train_loss": -11.374624252319336, "global_step": 252281, "epoch": 1501} {"train_loss": -11.263418197631836, "global_step": 252282, "epoch": 1501} {"train_loss": -11.184728622436523, "global_step": 252283, "epoch": 1501} {"train_loss": -11.549590110778809, "global_step": 252284, "epoch": 1501} {"train_loss": -11.033211708068848, "global_step": 252285, "epoch": 1501} {"train_loss": -11.837896347045898, "global_step": 252286, "epoch": 1501} {"train_loss": -11.231856346130371, "global_step": 252287, "epoch": 1501} {"train_loss": -11.54237174987793, "global_step": 252288, "epoch": 1501} {"train_loss": -11.586715698242188, "global_step": 252289, "epoch": 1501} {"train_loss": -11.46213150024414, "global_step": 252290, "epoch": 1501} {"train_loss": -11.420525550842285, "global_step": 252291, "epoch": 1501} {"train_loss": -11.518977165222168, "global_step": 252292, "epoch": 1501} {"train_loss": -11.657886505126953, "global_step": 252293, "epoch": 1501} {"train_loss": -11.606542587280273, "global_step": 252294, "epoch": 1501} {"train_loss": -11.465474128723145, "global_step": 252295, "epoch": 1501} {"train_loss": -11.648683547973633, "global_step": 252296, "epoch": 1501} {"train_loss": -11.452608108520508, "global_step": 252297, "epoch": 1501} {"train_loss": -11.670308113098145, "global_step": 252298, "epoch": 1501} {"train_loss": -11.573127746582031, "global_step": 252299, "epoch": 1501} {"train_loss": -11.599802017211914, "global_step": 252300, "epoch": 1501} {"train_loss": -11.43468952178955, "global_step": 252301, "epoch": 1501} {"train_loss": -11.398672103881836, "global_step": 252302, "epoch": 1501} {"train_loss": -11.745002746582031, "global_step": 252303, "epoch": 1501} {"train_loss": -11.659648895263672, "global_step": 252304, "epoch": 1501} {"train_loss": -11.517492294311523, "global_step": 252305, "epoch": 1501} {"train_loss": -11.185660362243652, "global_step": 252306, "epoch": 1501} {"train_loss": -11.539093017578125, "global_step": 252307, "epoch": 1501} {"train_loss": -11.915098190307617, "global_step": 252308, "epoch": 1501} {"train_loss": -11.605696678161621, "global_step": 252309, "epoch": 1501} {"train_loss": -11.733906745910645, "global_step": 252310, "epoch": 1501} {"train_loss": -11.774009704589844, "global_step": 252311, "epoch": 1501} {"train_loss": -11.588403701782227, "global_step": 252312, "epoch": 1501} {"train_loss": -11.89744758605957, "global_step": 252313, "epoch": 1501} {"train_loss": -11.972200393676758, "global_step": 252314, "epoch": 1501} {"train_loss": -11.519740104675293, "global_step": 252315, "epoch": 1501} {"train_loss": -11.787206649780273, "global_step": 252316, "epoch": 1501} {"train_loss": -11.769723892211914, "global_step": 252317, "epoch": 1501} {"train_loss": -11.916318893432617, "global_step": 252318, "epoch": 1501} {"train_loss": -11.971430778503418, "global_step": 252319, "epoch": 1501} {"train_loss": -12.025092124938965, "global_step": 252320, "epoch": 1501} {"train_loss": -11.81628131866455, "global_step": 252321, "epoch": 1501} {"train_loss": -11.988625526428223, "global_step": 252322, "epoch": 1501} {"train_loss": -11.937084197998047, "global_step": 252323, "epoch": 1501} {"train_loss": -12.061895370483398, "global_step": 252324, "epoch": 1501} {"train_loss": -12.18527603149414, "global_step": 252325, "epoch": 1501} {"train_loss": -11.935805320739746, "global_step": 252326, "epoch": 1501} {"train_loss": -12.119688034057617, "global_step": 252327, "epoch": 1501} {"train_loss": -11.97896957397461, "global_step": 252328, "epoch": 1501} {"train_loss": -11.935957908630371, "global_step": 252329, "epoch": 1501} {"train_loss": -12.001466751098633, "global_step": 252330, "epoch": 1501} {"train_loss": -12.03023624420166, "global_step": 252331, "epoch": 1501} {"train_loss": -11.66137409210205, "global_step": 252332, "epoch": 1501} {"train_loss": -11.983467102050781, "global_step": 252333, "epoch": 1501} {"train_loss": -11.928509712219238, "global_step": 252334, "epoch": 1501} {"train_loss": -11.355491448016394, "global_step": 252335, "epoch": 1501, "val_loss": 265140.84375} {"train_loss": -11.985535621643066, "global_step": 252336, "epoch": 1502} {"train_loss": -11.97169303894043, "global_step": 252337, "epoch": 1502} {"train_loss": -12.07811450958252, "global_step": 252338, "epoch": 1502} {"train_loss": -12.21121883392334, "global_step": 252339, "epoch": 1502} {"train_loss": -12.114407539367676, "global_step": 252340, "epoch": 1502} {"train_loss": -12.196199417114258, "global_step": 252341, "epoch": 1502} {"train_loss": -12.0138578414917, "global_step": 252342, "epoch": 1502} {"train_loss": -12.035128593444824, "global_step": 252343, "epoch": 1502} {"train_loss": -12.144147872924805, "global_step": 252344, "epoch": 1502} {"train_loss": -12.09260368347168, "global_step": 252345, "epoch": 1502} {"train_loss": -12.179893493652344, "global_step": 252346, "epoch": 1502} {"train_loss": -12.040590286254883, "global_step": 252347, "epoch": 1502} {"train_loss": -12.269609451293945, "global_step": 252348, "epoch": 1502} {"train_loss": -11.994136810302734, "global_step": 252349, "epoch": 1502} {"train_loss": -12.14592170715332, "global_step": 252350, "epoch": 1502} {"train_loss": -12.173004150390625, "global_step": 252351, "epoch": 1502} {"train_loss": -12.057759284973145, "global_step": 252352, "epoch": 1502} {"train_loss": -12.100462913513184, "global_step": 252353, "epoch": 1502} {"train_loss": -12.034584045410156, "global_step": 252354, "epoch": 1502} {"train_loss": -12.193851470947266, "global_step": 252355, "epoch": 1502} {"train_loss": -12.08251667022705, "global_step": 252356, "epoch": 1502} {"train_loss": -12.2290678024292, "global_step": 252357, "epoch": 1502} {"train_loss": -12.39234733581543, "global_step": 252358, "epoch": 1502} {"train_loss": -12.267178535461426, "global_step": 252359, "epoch": 1502} {"train_loss": -12.222338676452637, "global_step": 252360, "epoch": 1502} {"train_loss": -12.247612953186035, "global_step": 252361, "epoch": 1502} {"train_loss": -12.308964729309082, "global_step": 252362, "epoch": 1502} {"train_loss": -11.928583145141602, "global_step": 252363, "epoch": 1502} {"train_loss": -11.665853500366211, "global_step": 252364, "epoch": 1502} {"train_loss": -11.235867500305176, "global_step": 252365, "epoch": 1502} {"train_loss": -12.025106430053711, "global_step": 252366, "epoch": 1502} {"train_loss": -12.124906539916992, "global_step": 252367, "epoch": 1502} {"train_loss": -12.171897888183594, "global_step": 252368, "epoch": 1502} {"train_loss": -11.879631042480469, "global_step": 252369, "epoch": 1502} {"train_loss": -11.634373664855957, "global_step": 252370, "epoch": 1502} {"train_loss": -11.267549514770508, "global_step": 252371, "epoch": 1502} {"train_loss": -12.075028419494629, "global_step": 252372, "epoch": 1502} {"train_loss": -12.136950492858887, "global_step": 252373, "epoch": 1502} {"train_loss": -10.930980682373047, "global_step": 252374, "epoch": 1502} {"train_loss": -10.47894287109375, "global_step": 252375, "epoch": 1502} {"train_loss": -10.381182670593262, "global_step": 252376, "epoch": 1502} {"train_loss": -12.04970932006836, "global_step": 252377, "epoch": 1502} {"train_loss": -11.676238059997559, "global_step": 252378, "epoch": 1502} {"train_loss": -11.288946151733398, "global_step": 252379, "epoch": 1502} {"train_loss": -11.258148193359375, "global_step": 252380, "epoch": 1502} {"train_loss": -11.79895305633545, "global_step": 252381, "epoch": 1502} {"train_loss": -11.833032608032227, "global_step": 252382, "epoch": 1502} {"train_loss": -11.872137069702148, "global_step": 252383, "epoch": 1502} {"train_loss": -10.88483715057373, "global_step": 252384, "epoch": 1502} {"train_loss": -12.070002555847168, "global_step": 252385, "epoch": 1502} {"train_loss": -10.76287841796875, "global_step": 252386, "epoch": 1502} {"train_loss": -12.096879959106445, "global_step": 252387, "epoch": 1502} {"train_loss": -10.483694076538086, "global_step": 252388, "epoch": 1502} {"train_loss": -11.532228469848633, "global_step": 252389, "epoch": 1502} {"train_loss": -9.540386199951172, "global_step": 252390, "epoch": 1502} {"train_loss": -11.933972358703613, "global_step": 252391, "epoch": 1502} {"train_loss": -9.5107421875, "global_step": 252392, "epoch": 1502} {"train_loss": -11.110421180725098, "global_step": 252393, "epoch": 1502} {"train_loss": -10.590120315551758, "global_step": 252394, "epoch": 1502} {"train_loss": -11.109769821166992, "global_step": 252395, "epoch": 1502} {"train_loss": -11.40413761138916, "global_step": 252396, "epoch": 1502} {"train_loss": -11.365396499633789, "global_step": 252397, "epoch": 1502} {"train_loss": -11.642692565917969, "global_step": 252398, "epoch": 1502} {"train_loss": -12.05985164642334, "global_step": 252399, "epoch": 1502} {"train_loss": -11.460108757019043, "global_step": 252400, "epoch": 1502} {"train_loss": -11.578741073608398, "global_step": 252401, "epoch": 1502} {"train_loss": -11.380471229553223, "global_step": 252402, "epoch": 1502} {"train_loss": -11.221376419067383, "global_step": 252403, "epoch": 1502} {"train_loss": -11.712059020996094, "global_step": 252404, "epoch": 1502} {"train_loss": -11.173681259155273, "global_step": 252405, "epoch": 1502} {"train_loss": -11.500726699829102, "global_step": 252406, "epoch": 1502} {"train_loss": -11.378190994262695, "global_step": 252407, "epoch": 1502} {"train_loss": -11.875176429748535, "global_step": 252408, "epoch": 1502} {"train_loss": -11.63710880279541, "global_step": 252409, "epoch": 1502} {"train_loss": -11.242177963256836, "global_step": 252410, "epoch": 1502} {"train_loss": -11.859624862670898, "global_step": 252411, "epoch": 1502} {"train_loss": -11.867359161376953, "global_step": 252412, "epoch": 1502} {"train_loss": -11.617032051086426, "global_step": 252413, "epoch": 1502} {"train_loss": -11.806497573852539, "global_step": 252414, "epoch": 1502} {"train_loss": -11.490338325500488, "global_step": 252415, "epoch": 1502} {"train_loss": -11.82061767578125, "global_step": 252416, "epoch": 1502} {"train_loss": -11.767561912536621, "global_step": 252417, "epoch": 1502} {"train_loss": -11.6776762008667, "global_step": 252418, "epoch": 1502} {"train_loss": -11.805708885192871, "global_step": 252419, "epoch": 1502} {"train_loss": -11.742635726928711, "global_step": 252420, "epoch": 1502} {"train_loss": -11.738665580749512, "global_step": 252421, "epoch": 1502} {"train_loss": -11.888275146484375, "global_step": 252422, "epoch": 1502} {"train_loss": -11.896484375, "global_step": 252423, "epoch": 1502} {"train_loss": -11.992536544799805, "global_step": 252424, "epoch": 1502} {"train_loss": -11.850629806518555, "global_step": 252425, "epoch": 1502} {"train_loss": -12.029993057250977, "global_step": 252426, "epoch": 1502} {"train_loss": -11.956135749816895, "global_step": 252427, "epoch": 1502} {"train_loss": -11.855473518371582, "global_step": 252428, "epoch": 1502} {"train_loss": -12.059673309326172, "global_step": 252429, "epoch": 1502} {"train_loss": -11.810091018676758, "global_step": 252430, "epoch": 1502} {"train_loss": -12.001384735107422, "global_step": 252431, "epoch": 1502} {"train_loss": -11.941712379455566, "global_step": 252432, "epoch": 1502} {"train_loss": -12.034153938293457, "global_step": 252433, "epoch": 1502} {"train_loss": -11.964914321899414, "global_step": 252434, "epoch": 1502} {"train_loss": -11.9315185546875, "global_step": 252435, "epoch": 1502} {"train_loss": -11.808778762817383, "global_step": 252436, "epoch": 1502} {"train_loss": -12.028890609741211, "global_step": 252437, "epoch": 1502} {"train_loss": -11.608414649963379, "global_step": 252438, "epoch": 1502} {"train_loss": -11.692716598510742, "global_step": 252439, "epoch": 1502} {"train_loss": -12.189364433288574, "global_step": 252440, "epoch": 1502} {"train_loss": -11.633953094482422, "global_step": 252441, "epoch": 1502} {"train_loss": -11.934123039245605, "global_step": 252442, "epoch": 1502} {"train_loss": -11.679302215576172, "global_step": 252443, "epoch": 1502} {"train_loss": -11.994007110595703, "global_step": 252444, "epoch": 1502} {"train_loss": -11.773061752319336, "global_step": 252445, "epoch": 1502} {"train_loss": -11.8909912109375, "global_step": 252446, "epoch": 1502} {"train_loss": -11.62076187133789, "global_step": 252447, "epoch": 1502} {"train_loss": -12.188127517700195, "global_step": 252448, "epoch": 1502} {"train_loss": -11.97961139678955, "global_step": 252449, "epoch": 1502} {"train_loss": -12.043254852294922, "global_step": 252450, "epoch": 1502} {"train_loss": -11.593183517456055, "global_step": 252451, "epoch": 1502} {"train_loss": -11.844408988952637, "global_step": 252452, "epoch": 1502} {"train_loss": -12.139827728271484, "global_step": 252453, "epoch": 1502} {"train_loss": -11.718586921691895, "global_step": 252454, "epoch": 1502} {"train_loss": -11.899662017822266, "global_step": 252455, "epoch": 1502} {"train_loss": -11.838702201843262, "global_step": 252456, "epoch": 1502} {"train_loss": -11.956003189086914, "global_step": 252457, "epoch": 1502} {"train_loss": -11.60067367553711, "global_step": 252458, "epoch": 1502} {"train_loss": -11.210888862609863, "global_step": 252459, "epoch": 1502} {"train_loss": -11.53719711303711, "global_step": 252460, "epoch": 1502} {"train_loss": -11.549530029296875, "global_step": 252461, "epoch": 1502} {"train_loss": -11.81843376159668, "global_step": 252462, "epoch": 1502} {"train_loss": -10.61396598815918, "global_step": 252463, "epoch": 1502} {"train_loss": -11.795061111450195, "global_step": 252464, "epoch": 1502} {"train_loss": -10.711092948913574, "global_step": 252465, "epoch": 1502} {"train_loss": -11.141934394836426, "global_step": 252466, "epoch": 1502} {"train_loss": -11.23337459564209, "global_step": 252467, "epoch": 1502} {"train_loss": -10.988106727600098, "global_step": 252468, "epoch": 1502} {"train_loss": -11.107954025268555, "global_step": 252469, "epoch": 1502} {"train_loss": -10.80394172668457, "global_step": 252470, "epoch": 1502} {"train_loss": -10.648465156555176, "global_step": 252471, "epoch": 1502} {"train_loss": -11.19576644897461, "global_step": 252472, "epoch": 1502} {"train_loss": -10.280059814453125, "global_step": 252473, "epoch": 1502} {"train_loss": -11.537919998168945, "global_step": 252474, "epoch": 1502} {"train_loss": -10.210359573364258, "global_step": 252475, "epoch": 1502} {"train_loss": -11.379090309143066, "global_step": 252476, "epoch": 1502} {"train_loss": -11.004851341247559, "global_step": 252477, "epoch": 1502} {"train_loss": -10.770907402038574, "global_step": 252478, "epoch": 1502} {"train_loss": -11.440677642822266, "global_step": 252479, "epoch": 1502} {"train_loss": -10.937416076660156, "global_step": 252480, "epoch": 1502} {"train_loss": -11.554872512817383, "global_step": 252481, "epoch": 1502} {"train_loss": -11.054619789123535, "global_step": 252482, "epoch": 1502} {"train_loss": -11.630706787109375, "global_step": 252483, "epoch": 1502} {"train_loss": -11.070600509643555, "global_step": 252484, "epoch": 1502} {"train_loss": -11.407814979553223, "global_step": 252485, "epoch": 1502} {"train_loss": -11.360424041748047, "global_step": 252486, "epoch": 1502} {"train_loss": -11.269306182861328, "global_step": 252487, "epoch": 1502} {"train_loss": -11.233362197875977, "global_step": 252488, "epoch": 1502} {"train_loss": -10.966852188110352, "global_step": 252489, "epoch": 1502} {"train_loss": -11.590836524963379, "global_step": 252490, "epoch": 1502} {"train_loss": -11.115740776062012, "global_step": 252491, "epoch": 1502} {"train_loss": -11.651939392089844, "global_step": 252492, "epoch": 1502} {"train_loss": -11.046379089355469, "global_step": 252493, "epoch": 1502} {"train_loss": -11.57837200164795, "global_step": 252494, "epoch": 1502} {"train_loss": -11.240007400512695, "global_step": 252495, "epoch": 1502} {"train_loss": -11.805782318115234, "global_step": 252496, "epoch": 1502} {"train_loss": -11.615316390991211, "global_step": 252497, "epoch": 1502} {"train_loss": -11.88894271850586, "global_step": 252498, "epoch": 1502} {"train_loss": -11.72901439666748, "global_step": 252499, "epoch": 1502} {"train_loss": -11.443358421325684, "global_step": 252500, "epoch": 1502} {"train_loss": -11.925863265991211, "global_step": 252501, "epoch": 1502} {"train_loss": -11.770959854125977, "global_step": 252502, "epoch": 1502} {"train_loss": -11.621123160634722, "global_step": 252503, "epoch": 1502, "val_loss": 271237.9375} {"train_loss": -11.857812881469727, "global_step": 252504, "epoch": 1503} {"train_loss": -11.498970985412598, "global_step": 252505, "epoch": 1503} {"train_loss": -11.51779556274414, "global_step": 252506, "epoch": 1503} {"train_loss": -11.70016098022461, "global_step": 252507, "epoch": 1503} {"train_loss": -11.185891151428223, "global_step": 252508, "epoch": 1503} {"train_loss": -11.809782981872559, "global_step": 252509, "epoch": 1503} {"train_loss": -11.708541870117188, "global_step": 252510, "epoch": 1503} {"train_loss": -11.709664344787598, "global_step": 252511, "epoch": 1503} {"train_loss": -11.887558937072754, "global_step": 252512, "epoch": 1503} {"train_loss": -11.421194076538086, "global_step": 252513, "epoch": 1503} {"train_loss": -11.737275123596191, "global_step": 252514, "epoch": 1503} {"train_loss": -11.807554244995117, "global_step": 252515, "epoch": 1503} {"train_loss": -11.761137008666992, "global_step": 252516, "epoch": 1503} {"train_loss": -11.681621551513672, "global_step": 252517, "epoch": 1503} {"train_loss": -11.893373489379883, "global_step": 252518, "epoch": 1503} {"train_loss": -11.576183319091797, "global_step": 252519, "epoch": 1503} {"train_loss": -11.8487548828125, "global_step": 252520, "epoch": 1503} {"train_loss": -11.710969924926758, "global_step": 252521, "epoch": 1503} {"train_loss": -11.996545791625977, "global_step": 252522, "epoch": 1503} {"train_loss": -11.701282501220703, "global_step": 252523, "epoch": 1503} {"train_loss": -11.977828979492188, "global_step": 252524, "epoch": 1503} {"train_loss": -11.829031944274902, "global_step": 252525, "epoch": 1503} {"train_loss": -11.875765800476074, "global_step": 252526, "epoch": 1503} {"train_loss": -12.058819770812988, "global_step": 252527, "epoch": 1503} {"train_loss": -11.664375305175781, "global_step": 252528, "epoch": 1503} {"train_loss": -11.990009307861328, "global_step": 252529, "epoch": 1503} {"train_loss": -11.880396842956543, "global_step": 252530, "epoch": 1503} {"train_loss": -11.89907455444336, "global_step": 252531, "epoch": 1503} {"train_loss": -11.848888397216797, "global_step": 252532, "epoch": 1503} {"train_loss": -11.917696952819824, "global_step": 252533, "epoch": 1503} {"train_loss": -12.178189277648926, "global_step": 252534, "epoch": 1503} {"train_loss": -12.065670013427734, "global_step": 252535, "epoch": 1503} {"train_loss": -11.903341293334961, "global_step": 252536, "epoch": 1503} {"train_loss": -12.142149925231934, "global_step": 252537, "epoch": 1503} {"train_loss": -11.946908950805664, "global_step": 252538, "epoch": 1503} {"train_loss": -11.919028282165527, "global_step": 252539, "epoch": 1503} {"train_loss": -11.994719505310059, "global_step": 252540, "epoch": 1503} {"train_loss": -11.905470848083496, "global_step": 252541, "epoch": 1503} {"train_loss": -12.017122268676758, "global_step": 252542, "epoch": 1503} {"train_loss": -11.998527526855469, "global_step": 252543, "epoch": 1503} {"train_loss": -12.025611877441406, "global_step": 252544, "epoch": 1503} {"train_loss": -12.112759590148926, "global_step": 252545, "epoch": 1503} {"train_loss": -12.017570495605469, "global_step": 252546, "epoch": 1503} {"train_loss": -12.075127601623535, "global_step": 252547, "epoch": 1503} {"train_loss": -12.031357765197754, "global_step": 252548, "epoch": 1503} {"train_loss": -12.345785140991211, "global_step": 252549, "epoch": 1503} {"train_loss": -12.156442642211914, "global_step": 252550, "epoch": 1503} {"train_loss": -12.048478126525879, "global_step": 252551, "epoch": 1503} {"train_loss": -12.10515308380127, "global_step": 252552, "epoch": 1503} {"train_loss": -12.047370910644531, "global_step": 252553, "epoch": 1503} {"train_loss": -12.080706596374512, "global_step": 252554, "epoch": 1503} {"train_loss": -12.319127082824707, "global_step": 252555, "epoch": 1503} {"train_loss": -12.116304397583008, "global_step": 252556, "epoch": 1503} {"train_loss": -12.316669464111328, "global_step": 252557, "epoch": 1503} {"train_loss": -12.024374008178711, "global_step": 252558, "epoch": 1503} {"train_loss": -12.02648639678955, "global_step": 252559, "epoch": 1503} {"train_loss": -11.75246524810791, "global_step": 252560, "epoch": 1503} {"train_loss": -12.27529525756836, "global_step": 252561, "epoch": 1503} {"train_loss": -12.196462631225586, "global_step": 252562, "epoch": 1503} {"train_loss": -11.739012718200684, "global_step": 252563, "epoch": 1503} {"train_loss": -10.791625022888184, "global_step": 252564, "epoch": 1503} {"train_loss": -10.36715316772461, "global_step": 252565, "epoch": 1503} {"train_loss": -11.147443771362305, "global_step": 252566, "epoch": 1503} {"train_loss": -9.440343856811523, "global_step": 252567, "epoch": 1503} {"train_loss": -7.34672212600708, "global_step": 252568, "epoch": 1503} {"train_loss": -5.700619220733643, "global_step": 252569, "epoch": 1503} {"train_loss": -6.230415344238281, "global_step": 252570, "epoch": 1503} {"train_loss": -6.507833480834961, "global_step": 252571, "epoch": 1503} {"train_loss": -6.830020904541016, "global_step": 252572, "epoch": 1503} {"train_loss": -6.068106651306152, "global_step": 252573, "epoch": 1503} {"train_loss": -7.25234842300415, "global_step": 252574, "epoch": 1503} {"train_loss": -6.583205223083496, "global_step": 252575, "epoch": 1503} {"train_loss": -7.495922088623047, "global_step": 252576, "epoch": 1503} {"train_loss": -7.700061798095703, "global_step": 252577, "epoch": 1503} {"train_loss": -8.320735931396484, "global_step": 252578, "epoch": 1503} {"train_loss": -8.19782829284668, "global_step": 252579, "epoch": 1503} {"train_loss": -8.310710906982422, "global_step": 252580, "epoch": 1503} {"train_loss": -8.693950653076172, "global_step": 252581, "epoch": 1503} {"train_loss": -8.571329116821289, "global_step": 252582, "epoch": 1503} {"train_loss": -7.731990814208984, "global_step": 252583, "epoch": 1503} {"train_loss": -7.824549674987793, "global_step": 252584, "epoch": 1503} {"train_loss": -8.585184097290039, "global_step": 252585, "epoch": 1503} {"train_loss": -9.123950958251953, "global_step": 252586, "epoch": 1503} {"train_loss": -8.318958282470703, "global_step": 252587, "epoch": 1503} {"train_loss": -9.494483947753906, "global_step": 252588, "epoch": 1503} {"train_loss": -9.070221900939941, "global_step": 252589, "epoch": 1503} {"train_loss": -10.050457000732422, "global_step": 252590, "epoch": 1503} {"train_loss": -10.682865142822266, "global_step": 252591, "epoch": 1503} {"train_loss": -9.104838371276855, "global_step": 252592, "epoch": 1503} {"train_loss": -10.894540786743164, "global_step": 252593, "epoch": 1503} {"train_loss": -8.925878524780273, "global_step": 252594, "epoch": 1503} {"train_loss": -9.491127967834473, "global_step": 252595, "epoch": 1503} {"train_loss": -8.905211448669434, "global_step": 252596, "epoch": 1503} {"train_loss": -10.133678436279297, "global_step": 252597, "epoch": 1503} {"train_loss": -9.843503952026367, "global_step": 252598, "epoch": 1503} {"train_loss": -9.780512809753418, "global_step": 252599, "epoch": 1503} {"train_loss": -11.272928237915039, "global_step": 252600, "epoch": 1503} {"train_loss": -10.722007751464844, "global_step": 252601, "epoch": 1503} {"train_loss": -10.884027481079102, "global_step": 252602, "epoch": 1503} {"train_loss": -10.621587753295898, "global_step": 252603, "epoch": 1503} {"train_loss": -10.974550247192383, "global_step": 252604, "epoch": 1503} {"train_loss": -10.948172569274902, "global_step": 252605, "epoch": 1503} {"train_loss": -11.282917022705078, "global_step": 252606, "epoch": 1503} {"train_loss": -11.264139175415039, "global_step": 252607, "epoch": 1503} {"train_loss": -11.075860977172852, "global_step": 252608, "epoch": 1503} {"train_loss": -11.170246124267578, "global_step": 252609, "epoch": 1503} {"train_loss": -11.58047866821289, "global_step": 252610, "epoch": 1503} {"train_loss": -11.07154369354248, "global_step": 252611, "epoch": 1503} {"train_loss": -11.502886772155762, "global_step": 252612, "epoch": 1503} {"train_loss": -11.573741912841797, "global_step": 252613, "epoch": 1503} {"train_loss": -11.193312644958496, "global_step": 252614, "epoch": 1503} {"train_loss": -11.228693008422852, "global_step": 252615, "epoch": 1503} {"train_loss": -11.632326126098633, "global_step": 252616, "epoch": 1503} {"train_loss": -11.437328338623047, "global_step": 252617, "epoch": 1503} {"train_loss": -11.553768157958984, "global_step": 252618, "epoch": 1503} {"train_loss": -11.515016555786133, "global_step": 252619, "epoch": 1503} {"train_loss": -11.454659461975098, "global_step": 252620, "epoch": 1503} {"train_loss": -11.702661514282227, "global_step": 252621, "epoch": 1503} {"train_loss": -11.524202346801758, "global_step": 252622, "epoch": 1503} {"train_loss": -11.788846969604492, "global_step": 252623, "epoch": 1503} {"train_loss": -11.484054565429688, "global_step": 252624, "epoch": 1503} {"train_loss": -11.68562126159668, "global_step": 252625, "epoch": 1503} {"train_loss": -11.556497573852539, "global_step": 252626, "epoch": 1503} {"train_loss": -11.442415237426758, "global_step": 252627, "epoch": 1503} {"train_loss": -12.003585815429688, "global_step": 252628, "epoch": 1503} {"train_loss": -11.531217575073242, "global_step": 252629, "epoch": 1503} {"train_loss": -11.632123947143555, "global_step": 252630, "epoch": 1503} {"train_loss": -11.63227367401123, "global_step": 252631, "epoch": 1503} {"train_loss": -11.48965072631836, "global_step": 252632, "epoch": 1503} {"train_loss": -11.6138277053833, "global_step": 252633, "epoch": 1503} {"train_loss": -11.569417953491211, "global_step": 252634, "epoch": 1503} {"train_loss": -11.7162504196167, "global_step": 252635, "epoch": 1503} {"train_loss": -11.619745254516602, "global_step": 252636, "epoch": 1503} {"train_loss": -11.895115852355957, "global_step": 252637, "epoch": 1503} {"train_loss": -11.612343788146973, "global_step": 252638, "epoch": 1503} {"train_loss": -11.9754638671875, "global_step": 252639, "epoch": 1503} {"train_loss": -11.59921646118164, "global_step": 252640, "epoch": 1503} {"train_loss": -11.844768524169922, "global_step": 252641, "epoch": 1503} {"train_loss": -11.872308731079102, "global_step": 252642, "epoch": 1503} {"train_loss": -11.789205551147461, "global_step": 252643, "epoch": 1503} {"train_loss": -11.837482452392578, "global_step": 252644, "epoch": 1503} {"train_loss": -11.86695671081543, "global_step": 252645, "epoch": 1503} {"train_loss": -11.788171768188477, "global_step": 252646, "epoch": 1503} {"train_loss": -11.797895431518555, "global_step": 252647, "epoch": 1503} {"train_loss": -11.871477127075195, "global_step": 252648, "epoch": 1503} {"train_loss": -11.848930358886719, "global_step": 252649, "epoch": 1503} {"train_loss": -11.955524444580078, "global_step": 252650, "epoch": 1503} {"train_loss": -11.851729393005371, "global_step": 252651, "epoch": 1503} {"train_loss": -11.99724006652832, "global_step": 252652, "epoch": 1503} {"train_loss": -11.647032737731934, "global_step": 252653, "epoch": 1503} {"train_loss": -11.778318405151367, "global_step": 252654, "epoch": 1503} {"train_loss": -11.802671432495117, "global_step": 252655, "epoch": 1503} {"train_loss": -11.746978759765625, "global_step": 252656, "epoch": 1503} {"train_loss": -12.006624221801758, "global_step": 252657, "epoch": 1503} {"train_loss": -12.062867164611816, "global_step": 252658, "epoch": 1503} {"train_loss": -12.074304580688477, "global_step": 252659, "epoch": 1503} {"train_loss": -12.117321014404297, "global_step": 252660, "epoch": 1503} {"train_loss": -12.345437049865723, "global_step": 252661, "epoch": 1503} {"train_loss": -12.141005516052246, "global_step": 252662, "epoch": 1503} {"train_loss": -11.84674072265625, "global_step": 252663, "epoch": 1503} {"train_loss": -11.917259216308594, "global_step": 252664, "epoch": 1503} {"train_loss": -12.003440856933594, "global_step": 252665, "epoch": 1503} {"train_loss": -12.195631980895996, "global_step": 252666, "epoch": 1503} {"train_loss": -12.285711288452148, "global_step": 252667, "epoch": 1503} {"train_loss": -12.144643783569336, "global_step": 252668, "epoch": 1503} {"train_loss": -12.089001655578613, "global_step": 252669, "epoch": 1503} {"train_loss": -11.954028129577637, "global_step": 252670, "epoch": 1503} {"train_loss": -11.09559511854535, "global_step": 252671, "epoch": 1503, "val_loss": 267043.5} {"train_loss": -12.22616958618164, "global_step": 252672, "epoch": 1504} {"train_loss": -11.918859481811523, "global_step": 252673, "epoch": 1504} {"train_loss": -12.042961120605469, "global_step": 252674, "epoch": 1504} {"train_loss": -12.108743667602539, "global_step": 252675, "epoch": 1504} {"train_loss": -12.15078353881836, "global_step": 252676, "epoch": 1504} {"train_loss": -12.136547088623047, "global_step": 252677, "epoch": 1504} {"train_loss": -12.100740432739258, "global_step": 252678, "epoch": 1504} {"train_loss": -12.24031925201416, "global_step": 252679, "epoch": 1504} {"train_loss": -12.10640811920166, "global_step": 252680, "epoch": 1504} {"train_loss": -12.097427368164062, "global_step": 252681, "epoch": 1504} {"train_loss": -12.224191665649414, "global_step": 252682, "epoch": 1504} {"train_loss": -12.168386459350586, "global_step": 252683, "epoch": 1504} {"train_loss": -12.107063293457031, "global_step": 252684, "epoch": 1504} {"train_loss": -12.214556694030762, "global_step": 252685, "epoch": 1504} {"train_loss": -12.165376663208008, "global_step": 252686, "epoch": 1504} {"train_loss": -12.003569602966309, "global_step": 252687, "epoch": 1504} {"train_loss": -12.306766510009766, "global_step": 252688, "epoch": 1504} {"train_loss": -11.409406661987305, "global_step": 252689, "epoch": 1504} {"train_loss": -11.195371627807617, "global_step": 252690, "epoch": 1504} {"train_loss": -10.113420486450195, "global_step": 252691, "epoch": 1504} {"train_loss": -9.752431869506836, "global_step": 252692, "epoch": 1504} {"train_loss": -11.39002513885498, "global_step": 252693, "epoch": 1504} {"train_loss": -11.893377304077148, "global_step": 252694, "epoch": 1504} {"train_loss": -11.199234008789062, "global_step": 252695, "epoch": 1504} {"train_loss": -10.88620662689209, "global_step": 252696, "epoch": 1504} {"train_loss": -10.569807052612305, "global_step": 252697, "epoch": 1504} {"train_loss": -11.614667892456055, "global_step": 252698, "epoch": 1504} {"train_loss": -10.712087631225586, "global_step": 252699, "epoch": 1504} {"train_loss": -10.36340618133545, "global_step": 252700, "epoch": 1504} {"train_loss": -10.688642501831055, "global_step": 252701, "epoch": 1504} {"train_loss": -11.218903541564941, "global_step": 252702, "epoch": 1504} {"train_loss": -11.13078498840332, "global_step": 252703, "epoch": 1504} {"train_loss": -9.486737251281738, "global_step": 252704, "epoch": 1504} {"train_loss": -11.091594696044922, "global_step": 252705, "epoch": 1504} {"train_loss": -10.514328002929688, "global_step": 252706, "epoch": 1504} {"train_loss": -9.638908386230469, "global_step": 252707, "epoch": 1504} {"train_loss": -10.575994491577148, "global_step": 252708, "epoch": 1504} {"train_loss": -8.798197746276855, "global_step": 252709, "epoch": 1504} {"train_loss": -9.300582885742188, "global_step": 252710, "epoch": 1504} {"train_loss": -9.489550590515137, "global_step": 252711, "epoch": 1504} {"train_loss": -10.306368827819824, "global_step": 252712, "epoch": 1504} {"train_loss": -8.660128593444824, "global_step": 252713, "epoch": 1504} {"train_loss": -9.309656143188477, "global_step": 252714, "epoch": 1504} {"train_loss": -10.50605583190918, "global_step": 252715, "epoch": 1504} {"train_loss": -10.170668601989746, "global_step": 252716, "epoch": 1504} {"train_loss": -9.852987289428711, "global_step": 252717, "epoch": 1504} {"train_loss": -9.64816665649414, "global_step": 252718, "epoch": 1504} {"train_loss": -10.638792037963867, "global_step": 252719, "epoch": 1504} {"train_loss": -10.342035293579102, "global_step": 252720, "epoch": 1504} {"train_loss": -10.71140193939209, "global_step": 252721, "epoch": 1504} {"train_loss": -10.430927276611328, "global_step": 252722, "epoch": 1504} {"train_loss": -11.361483573913574, "global_step": 252723, "epoch": 1504} {"train_loss": -10.903154373168945, "global_step": 252724, "epoch": 1504} {"train_loss": -11.426023483276367, "global_step": 252725, "epoch": 1504} {"train_loss": -10.809537887573242, "global_step": 252726, "epoch": 1504} {"train_loss": -10.663847923278809, "global_step": 252727, "epoch": 1504} {"train_loss": -10.9534273147583, "global_step": 252728, "epoch": 1504} {"train_loss": -10.63994026184082, "global_step": 252729, "epoch": 1504} {"train_loss": -11.40170669555664, "global_step": 252730, "epoch": 1504} {"train_loss": -10.826416015625, "global_step": 252731, "epoch": 1504} {"train_loss": -10.96121883392334, "global_step": 252732, "epoch": 1504} {"train_loss": -11.193398475646973, "global_step": 252733, "epoch": 1504} {"train_loss": -11.227941513061523, "global_step": 252734, "epoch": 1504} {"train_loss": -11.379517555236816, "global_step": 252735, "epoch": 1504} {"train_loss": -11.402109146118164, "global_step": 252736, "epoch": 1504} {"train_loss": -11.544623374938965, "global_step": 252737, "epoch": 1504} {"train_loss": -11.588029861450195, "global_step": 252738, "epoch": 1504} {"train_loss": -11.291971206665039, "global_step": 252739, "epoch": 1504} {"train_loss": -11.539422035217285, "global_step": 252740, "epoch": 1504} {"train_loss": -11.480489730834961, "global_step": 252741, "epoch": 1504} {"train_loss": -11.209954261779785, "global_step": 252742, "epoch": 1504} {"train_loss": -11.459003448486328, "global_step": 252743, "epoch": 1504} {"train_loss": -11.364002227783203, "global_step": 252744, "epoch": 1504} {"train_loss": -11.4127197265625, "global_step": 252745, "epoch": 1504} {"train_loss": -11.690255165100098, "global_step": 252746, "epoch": 1504} {"train_loss": -11.461053848266602, "global_step": 252747, "epoch": 1504} {"train_loss": -11.538116455078125, "global_step": 252748, "epoch": 1504} {"train_loss": -11.403179168701172, "global_step": 252749, "epoch": 1504} {"train_loss": -11.66678237915039, "global_step": 252750, "epoch": 1504} {"train_loss": -11.572463035583496, "global_step": 252751, "epoch": 1504} {"train_loss": -11.6251859664917, "global_step": 252752, "epoch": 1504} {"train_loss": -11.673796653747559, "global_step": 252753, "epoch": 1504} {"train_loss": -11.694904327392578, "global_step": 252754, "epoch": 1504} {"train_loss": -11.79448413848877, "global_step": 252755, "epoch": 1504} {"train_loss": -11.540548324584961, "global_step": 252756, "epoch": 1504} {"train_loss": -11.765861511230469, "global_step": 252757, "epoch": 1504} {"train_loss": -11.705045700073242, "global_step": 252758, "epoch": 1504} {"train_loss": -11.658226013183594, "global_step": 252759, "epoch": 1504} {"train_loss": -11.879863739013672, "global_step": 252760, "epoch": 1504} {"train_loss": -11.648744583129883, "global_step": 252761, "epoch": 1504} {"train_loss": -11.887359619140625, "global_step": 252762, "epoch": 1504} {"train_loss": -11.720251083374023, "global_step": 252763, "epoch": 1504} {"train_loss": -11.7672700881958, "global_step": 252764, "epoch": 1504} {"train_loss": -11.838926315307617, "global_step": 252765, "epoch": 1504} {"train_loss": -11.824527740478516, "global_step": 252766, "epoch": 1504} {"train_loss": -11.834944725036621, "global_step": 252767, "epoch": 1504} {"train_loss": -11.989839553833008, "global_step": 252768, "epoch": 1504} {"train_loss": -11.807708740234375, "global_step": 252769, "epoch": 1504} {"train_loss": -11.963180541992188, "global_step": 252770, "epoch": 1504} {"train_loss": -12.111783981323242, "global_step": 252771, "epoch": 1504} {"train_loss": -11.903055191040039, "global_step": 252772, "epoch": 1504} {"train_loss": -11.799161911010742, "global_step": 252773, "epoch": 1504} {"train_loss": -11.918601989746094, "global_step": 252774, "epoch": 1504} {"train_loss": -11.959867477416992, "global_step": 252775, "epoch": 1504} {"train_loss": -12.273042678833008, "global_step": 252776, "epoch": 1504} {"train_loss": -12.12601089477539, "global_step": 252777, "epoch": 1504} {"train_loss": -12.06510066986084, "global_step": 252778, "epoch": 1504} {"train_loss": -12.151237487792969, "global_step": 252779, "epoch": 1504} {"train_loss": -12.081012725830078, "global_step": 252780, "epoch": 1504} {"train_loss": -12.129922866821289, "global_step": 252781, "epoch": 1504} {"train_loss": -12.189210891723633, "global_step": 252782, "epoch": 1504} {"train_loss": -11.951871871948242, "global_step": 252783, "epoch": 1504} {"train_loss": -12.154085159301758, "global_step": 252784, "epoch": 1504} {"train_loss": -12.205904006958008, "global_step": 252785, "epoch": 1504} {"train_loss": -12.213571548461914, "global_step": 252786, "epoch": 1504} {"train_loss": -11.956890106201172, "global_step": 252787, "epoch": 1504} {"train_loss": -12.155576705932617, "global_step": 252788, "epoch": 1504} {"train_loss": -11.804893493652344, "global_step": 252789, "epoch": 1504} {"train_loss": -12.061471939086914, "global_step": 252790, "epoch": 1504} {"train_loss": -12.041372299194336, "global_step": 252791, "epoch": 1504} {"train_loss": -12.04287338256836, "global_step": 252792, "epoch": 1504} {"train_loss": -12.223323822021484, "global_step": 252793, "epoch": 1504} {"train_loss": -12.073600769042969, "global_step": 252794, "epoch": 1504} {"train_loss": -12.121479034423828, "global_step": 252795, "epoch": 1504} {"train_loss": -12.00931167602539, "global_step": 252796, "epoch": 1504} {"train_loss": -12.021158218383789, "global_step": 252797, "epoch": 1504} {"train_loss": -11.55020809173584, "global_step": 252798, "epoch": 1504} {"train_loss": -11.77444076538086, "global_step": 252799, "epoch": 1504} {"train_loss": -11.497507095336914, "global_step": 252800, "epoch": 1504} {"train_loss": -11.680376052856445, "global_step": 252801, "epoch": 1504} {"train_loss": -11.834213256835938, "global_step": 252802, "epoch": 1504} {"train_loss": -11.542346954345703, "global_step": 252803, "epoch": 1504} {"train_loss": -11.780072212219238, "global_step": 252804, "epoch": 1504} {"train_loss": -11.624503135681152, "global_step": 252805, "epoch": 1504} {"train_loss": -11.718263626098633, "global_step": 252806, "epoch": 1504} {"train_loss": -11.737648010253906, "global_step": 252807, "epoch": 1504} {"train_loss": -11.862516403198242, "global_step": 252808, "epoch": 1504} {"train_loss": -11.974512100219727, "global_step": 252809, "epoch": 1504} {"train_loss": -11.05535888671875, "global_step": 252810, "epoch": 1504} {"train_loss": -11.625696182250977, "global_step": 252811, "epoch": 1504} {"train_loss": -11.699200630187988, "global_step": 252812, "epoch": 1504} {"train_loss": -11.426368713378906, "global_step": 252813, "epoch": 1504} {"train_loss": -11.319295883178711, "global_step": 252814, "epoch": 1504} {"train_loss": -11.965347290039062, "global_step": 252815, "epoch": 1504} {"train_loss": -11.63803482055664, "global_step": 252816, "epoch": 1504} {"train_loss": -11.607165336608887, "global_step": 252817, "epoch": 1504} {"train_loss": -12.073970794677734, "global_step": 252818, "epoch": 1504} {"train_loss": -11.842195510864258, "global_step": 252819, "epoch": 1504} {"train_loss": -11.815336227416992, "global_step": 252820, "epoch": 1504} {"train_loss": -11.770574569702148, "global_step": 252821, "epoch": 1504} {"train_loss": -11.9765625, "global_step": 252822, "epoch": 1504} {"train_loss": -12.252725601196289, "global_step": 252823, "epoch": 1504} {"train_loss": -11.538789749145508, "global_step": 252824, "epoch": 1504} {"train_loss": -11.790603637695312, "global_step": 252825, "epoch": 1504} {"train_loss": -11.904195785522461, "global_step": 252826, "epoch": 1504} {"train_loss": -11.581377029418945, "global_step": 252827, "epoch": 1504} {"train_loss": -11.76516342163086, "global_step": 252828, "epoch": 1504} {"train_loss": -11.982231140136719, "global_step": 252829, "epoch": 1504} {"train_loss": -11.220695495605469, "global_step": 252830, "epoch": 1504} {"train_loss": -11.979338645935059, "global_step": 252831, "epoch": 1504} {"train_loss": -11.129803657531738, "global_step": 252832, "epoch": 1504} {"train_loss": -10.948774337768555, "global_step": 252833, "epoch": 1504} {"train_loss": -12.165355682373047, "global_step": 252834, "epoch": 1504} {"train_loss": -11.173789978027344, "global_step": 252835, "epoch": 1504} {"train_loss": -10.774572372436523, "global_step": 252836, "epoch": 1504} {"train_loss": -12.126572608947754, "global_step": 252837, "epoch": 1504} {"train_loss": -10.293279647827148, "global_step": 252838, "epoch": 1504} {"train_loss": -11.461827499525887, "global_step": 252839, "epoch": 1504, "val_loss": 265368.5} {"train_loss": -10.105202674865723, "global_step": 252840, "epoch": 1505} {"train_loss": -10.673544883728027, "global_step": 252841, "epoch": 1505} {"train_loss": -11.64906120300293, "global_step": 252842, "epoch": 1505} {"train_loss": -9.827678680419922, "global_step": 252843, "epoch": 1505} {"train_loss": -11.78857421875, "global_step": 252844, "epoch": 1505} {"train_loss": -10.197710990905762, "global_step": 252845, "epoch": 1505} {"train_loss": -11.14686393737793, "global_step": 252846, "epoch": 1505} {"train_loss": -9.88806438446045, "global_step": 252847, "epoch": 1505} {"train_loss": -10.961700439453125, "global_step": 252848, "epoch": 1505} {"train_loss": -10.820045471191406, "global_step": 252849, "epoch": 1505} {"train_loss": -11.03909683227539, "global_step": 252850, "epoch": 1505} {"train_loss": -11.504704475402832, "global_step": 252851, "epoch": 1505} {"train_loss": -10.777663230895996, "global_step": 252852, "epoch": 1505} {"train_loss": -11.116256713867188, "global_step": 252853, "epoch": 1505} {"train_loss": -10.418505668640137, "global_step": 252854, "epoch": 1505} {"train_loss": -10.910097122192383, "global_step": 252855, "epoch": 1505} {"train_loss": -10.448799133300781, "global_step": 252856, "epoch": 1505} {"train_loss": -11.350675582885742, "global_step": 252857, "epoch": 1505} {"train_loss": -10.668633460998535, "global_step": 252858, "epoch": 1505} {"train_loss": -10.948556900024414, "global_step": 252859, "epoch": 1505} {"train_loss": -10.677422523498535, "global_step": 252860, "epoch": 1505} {"train_loss": -10.829764366149902, "global_step": 252861, "epoch": 1505} {"train_loss": -11.285470962524414, "global_step": 252862, "epoch": 1505} {"train_loss": -10.98025131225586, "global_step": 252863, "epoch": 1505} {"train_loss": -11.541322708129883, "global_step": 252864, "epoch": 1505} {"train_loss": -11.284560203552246, "global_step": 252865, "epoch": 1505} {"train_loss": -11.376815795898438, "global_step": 252866, "epoch": 1505} {"train_loss": -11.55213737487793, "global_step": 252867, "epoch": 1505} {"train_loss": -11.347334861755371, "global_step": 252868, "epoch": 1505} {"train_loss": -11.237505912780762, "global_step": 252869, "epoch": 1505} {"train_loss": -11.555771827697754, "global_step": 252870, "epoch": 1505} {"train_loss": -11.293185234069824, "global_step": 252871, "epoch": 1505} {"train_loss": -11.106084823608398, "global_step": 252872, "epoch": 1505} {"train_loss": -11.602840423583984, "global_step": 252873, "epoch": 1505} {"train_loss": -10.98893928527832, "global_step": 252874, "epoch": 1505} {"train_loss": -11.676065444946289, "global_step": 252875, "epoch": 1505} {"train_loss": -11.256824493408203, "global_step": 252876, "epoch": 1505} {"train_loss": -11.332847595214844, "global_step": 252877, "epoch": 1505} {"train_loss": -11.428004264831543, "global_step": 252878, "epoch": 1505} {"train_loss": -11.50132942199707, "global_step": 252879, "epoch": 1505} {"train_loss": -11.444161415100098, "global_step": 252880, "epoch": 1505} {"train_loss": -11.539167404174805, "global_step": 252881, "epoch": 1505} {"train_loss": -11.58993911743164, "global_step": 252882, "epoch": 1505} {"train_loss": -10.999065399169922, "global_step": 252883, "epoch": 1505} {"train_loss": -11.828109741210938, "global_step": 252884, "epoch": 1505} {"train_loss": -11.385765075683594, "global_step": 252885, "epoch": 1505} {"train_loss": -11.410091400146484, "global_step": 252886, "epoch": 1505} {"train_loss": -11.748491287231445, "global_step": 252887, "epoch": 1505} {"train_loss": -11.646102905273438, "global_step": 252888, "epoch": 1505} {"train_loss": -11.709013938903809, "global_step": 252889, "epoch": 1505} {"train_loss": -11.705350875854492, "global_step": 252890, "epoch": 1505} {"train_loss": -11.625877380371094, "global_step": 252891, "epoch": 1505} {"train_loss": -11.702313423156738, "global_step": 252892, "epoch": 1505} {"train_loss": -11.731186866760254, "global_step": 252893, "epoch": 1505} {"train_loss": -11.157583236694336, "global_step": 252894, "epoch": 1505} {"train_loss": -11.61690902709961, "global_step": 252895, "epoch": 1505} {"train_loss": -11.510038375854492, "global_step": 252896, "epoch": 1505} {"train_loss": -11.662714958190918, "global_step": 252897, "epoch": 1505} {"train_loss": -11.358192443847656, "global_step": 252898, "epoch": 1505} {"train_loss": -11.698785781860352, "global_step": 252899, "epoch": 1505} {"train_loss": -11.287403106689453, "global_step": 252900, "epoch": 1505} {"train_loss": -11.672962188720703, "global_step": 252901, "epoch": 1505} {"train_loss": -11.46873664855957, "global_step": 252902, "epoch": 1505} {"train_loss": -11.342580795288086, "global_step": 252903, "epoch": 1505} {"train_loss": -11.906808853149414, "global_step": 252904, "epoch": 1505} {"train_loss": -11.124397277832031, "global_step": 252905, "epoch": 1505} {"train_loss": -11.819602966308594, "global_step": 252906, "epoch": 1505} {"train_loss": -11.544933319091797, "global_step": 252907, "epoch": 1505} {"train_loss": -11.40578842163086, "global_step": 252908, "epoch": 1505} {"train_loss": -11.81075668334961, "global_step": 252909, "epoch": 1505} {"train_loss": -11.55670166015625, "global_step": 252910, "epoch": 1505} {"train_loss": -11.772520065307617, "global_step": 252911, "epoch": 1505} {"train_loss": -11.702669143676758, "global_step": 252912, "epoch": 1505} {"train_loss": -11.905309677124023, "global_step": 252913, "epoch": 1505} {"train_loss": -11.974946975708008, "global_step": 252914, "epoch": 1505} {"train_loss": -11.835691452026367, "global_step": 252915, "epoch": 1505} {"train_loss": -11.842230796813965, "global_step": 252916, "epoch": 1505} {"train_loss": -11.926273345947266, "global_step": 252917, "epoch": 1505} {"train_loss": -12.136970520019531, "global_step": 252918, "epoch": 1505} {"train_loss": -12.012027740478516, "global_step": 252919, "epoch": 1505} {"train_loss": -12.094268798828125, "global_step": 252920, "epoch": 1505} {"train_loss": -12.058609962463379, "global_step": 252921, "epoch": 1505} {"train_loss": -11.925288200378418, "global_step": 252922, "epoch": 1505} {"train_loss": -11.998481750488281, "global_step": 252923, "epoch": 1505} {"train_loss": -11.789177894592285, "global_step": 252924, "epoch": 1505} {"train_loss": -12.05402660369873, "global_step": 252925, "epoch": 1505} {"train_loss": -11.865585327148438, "global_step": 252926, "epoch": 1505} {"train_loss": -11.827415466308594, "global_step": 252927, "epoch": 1505} {"train_loss": -11.930093765258789, "global_step": 252928, "epoch": 1505} {"train_loss": -11.904590606689453, "global_step": 252929, "epoch": 1505} {"train_loss": -11.950332641601562, "global_step": 252930, "epoch": 1505} {"train_loss": -12.071779251098633, "global_step": 252931, "epoch": 1505} {"train_loss": -12.04022216796875, "global_step": 252932, "epoch": 1505} {"train_loss": -12.034207344055176, "global_step": 252933, "epoch": 1505} {"train_loss": -11.9375, "global_step": 252934, "epoch": 1505} {"train_loss": -12.02923583984375, "global_step": 252935, "epoch": 1505} {"train_loss": -12.15937328338623, "global_step": 252936, "epoch": 1505} {"train_loss": -11.999343872070312, "global_step": 252937, "epoch": 1505} {"train_loss": -11.820733070373535, "global_step": 252938, "epoch": 1505} {"train_loss": -12.14771842956543, "global_step": 252939, "epoch": 1505} {"train_loss": -12.051746368408203, "global_step": 252940, "epoch": 1505} {"train_loss": -11.905800819396973, "global_step": 252941, "epoch": 1505} {"train_loss": -11.831762313842773, "global_step": 252942, "epoch": 1505} {"train_loss": -11.790346145629883, "global_step": 252943, "epoch": 1505} {"train_loss": -11.835643768310547, "global_step": 252944, "epoch": 1505} {"train_loss": -11.875375747680664, "global_step": 252945, "epoch": 1505} {"train_loss": -12.071317672729492, "global_step": 252946, "epoch": 1505} {"train_loss": -11.73621940612793, "global_step": 252947, "epoch": 1505} {"train_loss": -12.037229537963867, "global_step": 252948, "epoch": 1505} {"train_loss": -11.756856918334961, "global_step": 252949, "epoch": 1505} {"train_loss": -11.694317817687988, "global_step": 252950, "epoch": 1505} {"train_loss": -12.203783988952637, "global_step": 252951, "epoch": 1505} {"train_loss": -11.301309585571289, "global_step": 252952, "epoch": 1505} {"train_loss": -11.924105644226074, "global_step": 252953, "epoch": 1505} {"train_loss": -11.96116828918457, "global_step": 252954, "epoch": 1505} {"train_loss": -11.945470809936523, "global_step": 252955, "epoch": 1505} {"train_loss": -11.438715934753418, "global_step": 252956, "epoch": 1505} {"train_loss": -12.138425827026367, "global_step": 252957, "epoch": 1505} {"train_loss": -11.567102432250977, "global_step": 252958, "epoch": 1505} {"train_loss": -11.992321014404297, "global_step": 252959, "epoch": 1505} {"train_loss": -11.445799827575684, "global_step": 252960, "epoch": 1505} {"train_loss": -11.975784301757812, "global_step": 252961, "epoch": 1505} {"train_loss": -11.854454040527344, "global_step": 252962, "epoch": 1505} {"train_loss": -12.01329231262207, "global_step": 252963, "epoch": 1505} {"train_loss": -11.28792667388916, "global_step": 252964, "epoch": 1505} {"train_loss": -11.922260284423828, "global_step": 252965, "epoch": 1505} {"train_loss": -11.595985412597656, "global_step": 252966, "epoch": 1505} {"train_loss": -12.163320541381836, "global_step": 252967, "epoch": 1505} {"train_loss": -11.856094360351562, "global_step": 252968, "epoch": 1505} {"train_loss": -11.439702987670898, "global_step": 252969, "epoch": 1505} {"train_loss": -11.825397491455078, "global_step": 252970, "epoch": 1505} {"train_loss": -11.722451210021973, "global_step": 252971, "epoch": 1505} {"train_loss": -11.77637004852295, "global_step": 252972, "epoch": 1505} {"train_loss": -11.759943008422852, "global_step": 252973, "epoch": 1505} {"train_loss": -11.235001564025879, "global_step": 252974, "epoch": 1505} {"train_loss": -10.820383071899414, "global_step": 252975, "epoch": 1505} {"train_loss": -11.375469207763672, "global_step": 252976, "epoch": 1505} {"train_loss": -10.9307861328125, "global_step": 252977, "epoch": 1505} {"train_loss": -10.006917953491211, "global_step": 252978, "epoch": 1505} {"train_loss": -9.215581893920898, "global_step": 252979, "epoch": 1505} {"train_loss": -8.810951232910156, "global_step": 252980, "epoch": 1505} {"train_loss": -8.110615730285645, "global_step": 252981, "epoch": 1505} {"train_loss": -9.669986724853516, "global_step": 252982, "epoch": 1505} {"train_loss": -9.563556671142578, "global_step": 252983, "epoch": 1505} {"train_loss": -9.491806030273438, "global_step": 252984, "epoch": 1505} {"train_loss": -10.358863830566406, "global_step": 252985, "epoch": 1505} {"train_loss": -10.56814193725586, "global_step": 252986, "epoch": 1505} {"train_loss": -9.178398132324219, "global_step": 252987, "epoch": 1505} {"train_loss": -10.965198516845703, "global_step": 252988, "epoch": 1505} {"train_loss": -9.652669906616211, "global_step": 252989, "epoch": 1505} {"train_loss": -10.154304504394531, "global_step": 252990, "epoch": 1505} {"train_loss": -10.12070083618164, "global_step": 252991, "epoch": 1505} {"train_loss": -10.701350212097168, "global_step": 252992, "epoch": 1505} {"train_loss": -10.544290542602539, "global_step": 252993, "epoch": 1505} {"train_loss": -11.242538452148438, "global_step": 252994, "epoch": 1505} {"train_loss": -10.667299270629883, "global_step": 252995, "epoch": 1505} {"train_loss": -10.918656349182129, "global_step": 252996, "epoch": 1505} {"train_loss": -11.048582077026367, "global_step": 252997, "epoch": 1505} {"train_loss": -10.673168182373047, "global_step": 252998, "epoch": 1505} {"train_loss": -11.207910537719727, "global_step": 252999, "epoch": 1505} {"train_loss": -10.89525032043457, "global_step": 253000, "epoch": 1505} {"train_loss": -10.912842750549316, "global_step": 253001, "epoch": 1505} {"train_loss": -11.403905868530273, "global_step": 253002, "epoch": 1505} {"train_loss": -11.039244651794434, "global_step": 253003, "epoch": 1505} {"train_loss": -10.277774810791016, "global_step": 253004, "epoch": 1505} {"train_loss": -11.567432403564453, "global_step": 253005, "epoch": 1505} {"train_loss": -10.615470886230469, "global_step": 253006, "epoch": 1505} {"train_loss": -11.325983796800886, "global_step": 253007, "epoch": 1505, "val_loss": 262976.03125, "train_action_mse_error": 3.8695244789123535} {"train_loss": -10.868921279907227, "global_step": 253008, "epoch": 1506} {"train_loss": -10.56658935546875, "global_step": 253009, "epoch": 1506} {"train_loss": -10.739974021911621, "global_step": 253010, "epoch": 1506} {"train_loss": -11.481184005737305, "global_step": 253011, "epoch": 1506} {"train_loss": -10.932390213012695, "global_step": 253012, "epoch": 1506} {"train_loss": -11.269784927368164, "global_step": 253013, "epoch": 1506} {"train_loss": -11.101249694824219, "global_step": 253014, "epoch": 1506} {"train_loss": -10.417814254760742, "global_step": 253015, "epoch": 1506} {"train_loss": -11.515993118286133, "global_step": 253016, "epoch": 1506} {"train_loss": -10.636473655700684, "global_step": 253017, "epoch": 1506} {"train_loss": -11.518343925476074, "global_step": 253018, "epoch": 1506} {"train_loss": -11.057872772216797, "global_step": 253019, "epoch": 1506} {"train_loss": -11.65715217590332, "global_step": 253020, "epoch": 1506} {"train_loss": -11.42670726776123, "global_step": 253021, "epoch": 1506} {"train_loss": -11.555715560913086, "global_step": 253022, "epoch": 1506} {"train_loss": -11.70749568939209, "global_step": 253023, "epoch": 1506} {"train_loss": -11.636138916015625, "global_step": 253024, "epoch": 1506} {"train_loss": -11.777704238891602, "global_step": 253025, "epoch": 1506} {"train_loss": -11.39310073852539, "global_step": 253026, "epoch": 1506} {"train_loss": -11.577361106872559, "global_step": 253027, "epoch": 1506} {"train_loss": -11.40146541595459, "global_step": 253028, "epoch": 1506} {"train_loss": -11.619953155517578, "global_step": 253029, "epoch": 1506} {"train_loss": -11.609619140625, "global_step": 253030, "epoch": 1506} {"train_loss": -11.738183975219727, "global_step": 253031, "epoch": 1506} {"train_loss": -11.569629669189453, "global_step": 253032, "epoch": 1506} {"train_loss": -11.824145317077637, "global_step": 253033, "epoch": 1506} {"train_loss": -11.589566230773926, "global_step": 253034, "epoch": 1506} {"train_loss": -11.690853118896484, "global_step": 253035, "epoch": 1506} {"train_loss": -11.719489097595215, "global_step": 253036, "epoch": 1506} {"train_loss": -11.345029830932617, "global_step": 253037, "epoch": 1506} {"train_loss": -11.79844856262207, "global_step": 253038, "epoch": 1506} {"train_loss": -11.565271377563477, "global_step": 253039, "epoch": 1506} {"train_loss": -11.801765441894531, "global_step": 253040, "epoch": 1506} {"train_loss": -11.764200210571289, "global_step": 253041, "epoch": 1506} {"train_loss": -11.831024169921875, "global_step": 253042, "epoch": 1506} {"train_loss": -11.789213180541992, "global_step": 253043, "epoch": 1506} {"train_loss": -12.010305404663086, "global_step": 253044, "epoch": 1506} {"train_loss": -11.856645584106445, "global_step": 253045, "epoch": 1506} {"train_loss": -11.876922607421875, "global_step": 253046, "epoch": 1506} {"train_loss": -11.754304885864258, "global_step": 253047, "epoch": 1506} {"train_loss": -11.957174301147461, "global_step": 253048, "epoch": 1506} {"train_loss": -11.615260124206543, "global_step": 253049, "epoch": 1506} {"train_loss": -11.593609809875488, "global_step": 253050, "epoch": 1506} {"train_loss": -11.850639343261719, "global_step": 253051, "epoch": 1506} {"train_loss": -12.075549125671387, "global_step": 253052, "epoch": 1506} {"train_loss": -11.931596755981445, "global_step": 253053, "epoch": 1506} {"train_loss": -11.945512771606445, "global_step": 253054, "epoch": 1506} {"train_loss": -11.906158447265625, "global_step": 253055, "epoch": 1506} {"train_loss": -11.933855056762695, "global_step": 253056, "epoch": 1506} {"train_loss": -12.011505126953125, "global_step": 253057, "epoch": 1506} {"train_loss": -11.924436569213867, "global_step": 253058, "epoch": 1506} {"train_loss": -12.106769561767578, "global_step": 253059, "epoch": 1506} {"train_loss": -11.893610000610352, "global_step": 253060, "epoch": 1506} {"train_loss": -12.050420761108398, "global_step": 253061, "epoch": 1506} {"train_loss": -12.131660461425781, "global_step": 253062, "epoch": 1506} {"train_loss": -12.039093971252441, "global_step": 253063, "epoch": 1506} {"train_loss": -12.06268310546875, "global_step": 253064, "epoch": 1506} {"train_loss": -12.262062072753906, "global_step": 253065, "epoch": 1506} {"train_loss": -12.170787811279297, "global_step": 253066, "epoch": 1506} {"train_loss": -12.212474822998047, "global_step": 253067, "epoch": 1506} {"train_loss": -12.089841842651367, "global_step": 253068, "epoch": 1506} {"train_loss": -12.080196380615234, "global_step": 253069, "epoch": 1506} {"train_loss": -12.027050018310547, "global_step": 253070, "epoch": 1506} {"train_loss": -12.090152740478516, "global_step": 253071, "epoch": 1506} {"train_loss": -12.097646713256836, "global_step": 253072, "epoch": 1506} {"train_loss": -11.998295783996582, "global_step": 253073, "epoch": 1506} {"train_loss": -12.100407600402832, "global_step": 253074, "epoch": 1506} {"train_loss": -11.73825454711914, "global_step": 253075, "epoch": 1506} {"train_loss": -12.140734672546387, "global_step": 253076, "epoch": 1506} {"train_loss": -12.352726936340332, "global_step": 253077, "epoch": 1506} {"train_loss": -11.757076263427734, "global_step": 253078, "epoch": 1506} {"train_loss": -11.997886657714844, "global_step": 253079, "epoch": 1506} {"train_loss": -11.789978981018066, "global_step": 253080, "epoch": 1506} {"train_loss": -11.431421279907227, "global_step": 253081, "epoch": 1506} {"train_loss": -11.423789978027344, "global_step": 253082, "epoch": 1506} {"train_loss": -12.443389892578125, "global_step": 253083, "epoch": 1506} {"train_loss": -11.93202018737793, "global_step": 253084, "epoch": 1506} {"train_loss": -12.082210540771484, "global_step": 253085, "epoch": 1506} {"train_loss": -11.438898086547852, "global_step": 253086, "epoch": 1506} {"train_loss": -11.696144104003906, "global_step": 253087, "epoch": 1506} {"train_loss": -12.014371871948242, "global_step": 253088, "epoch": 1506} {"train_loss": -11.641172409057617, "global_step": 253089, "epoch": 1506} {"train_loss": -11.90715503692627, "global_step": 253090, "epoch": 1506} {"train_loss": -12.114596366882324, "global_step": 253091, "epoch": 1506} {"train_loss": -11.869857788085938, "global_step": 253092, "epoch": 1506} {"train_loss": -12.107398986816406, "global_step": 253093, "epoch": 1506} {"train_loss": -11.376936912536621, "global_step": 253094, "epoch": 1506} {"train_loss": -11.267756462097168, "global_step": 253095, "epoch": 1506} {"train_loss": -12.004647254943848, "global_step": 253096, "epoch": 1506} {"train_loss": -11.338249206542969, "global_step": 253097, "epoch": 1506} {"train_loss": -10.734796524047852, "global_step": 253098, "epoch": 1506} {"train_loss": -11.643832206726074, "global_step": 253099, "epoch": 1506} {"train_loss": -11.069246292114258, "global_step": 253100, "epoch": 1506} {"train_loss": -11.277608871459961, "global_step": 253101, "epoch": 1506} {"train_loss": -11.2899751663208, "global_step": 253102, "epoch": 1506} {"train_loss": -11.715709686279297, "global_step": 253103, "epoch": 1506} {"train_loss": -10.811835289001465, "global_step": 253104, "epoch": 1506} {"train_loss": -11.503874778747559, "global_step": 253105, "epoch": 1506} {"train_loss": -11.360162734985352, "global_step": 253106, "epoch": 1506} {"train_loss": -11.776784896850586, "global_step": 253107, "epoch": 1506} {"train_loss": -11.333921432495117, "global_step": 253108, "epoch": 1506} {"train_loss": -11.403966903686523, "global_step": 253109, "epoch": 1506} {"train_loss": -11.578701972961426, "global_step": 253110, "epoch": 1506} {"train_loss": -11.303438186645508, "global_step": 253111, "epoch": 1506} {"train_loss": -10.731032371520996, "global_step": 253112, "epoch": 1506} {"train_loss": -11.950410842895508, "global_step": 253113, "epoch": 1506} {"train_loss": -11.158011436462402, "global_step": 253114, "epoch": 1506} {"train_loss": -11.822491645812988, "global_step": 253115, "epoch": 1506} {"train_loss": -10.468280792236328, "global_step": 253116, "epoch": 1506} {"train_loss": -11.167767524719238, "global_step": 253117, "epoch": 1506} {"train_loss": -9.80459213256836, "global_step": 253118, "epoch": 1506} {"train_loss": -11.523625373840332, "global_step": 253119, "epoch": 1506} {"train_loss": -9.33609390258789, "global_step": 253120, "epoch": 1506} {"train_loss": -10.935630798339844, "global_step": 253121, "epoch": 1506} {"train_loss": -10.46103572845459, "global_step": 253122, "epoch": 1506} {"train_loss": -10.651040077209473, "global_step": 253123, "epoch": 1506} {"train_loss": -10.904569625854492, "global_step": 253124, "epoch": 1506} {"train_loss": -11.08160400390625, "global_step": 253125, "epoch": 1506} {"train_loss": -11.305187225341797, "global_step": 253126, "epoch": 1506} {"train_loss": -10.637018203735352, "global_step": 253127, "epoch": 1506} {"train_loss": -11.407880783081055, "global_step": 253128, "epoch": 1506} {"train_loss": -10.566061973571777, "global_step": 253129, "epoch": 1506} {"train_loss": -11.076227188110352, "global_step": 253130, "epoch": 1506} {"train_loss": -11.081571578979492, "global_step": 253131, "epoch": 1506} {"train_loss": -10.320221900939941, "global_step": 253132, "epoch": 1506} {"train_loss": -9.475788116455078, "global_step": 253133, "epoch": 1506} {"train_loss": -10.433889389038086, "global_step": 253134, "epoch": 1506} {"train_loss": -9.577309608459473, "global_step": 253135, "epoch": 1506} {"train_loss": -10.127193450927734, "global_step": 253136, "epoch": 1506} {"train_loss": -10.584359169006348, "global_step": 253137, "epoch": 1506} {"train_loss": -10.24262809753418, "global_step": 253138, "epoch": 1506} {"train_loss": -10.765174865722656, "global_step": 253139, "epoch": 1506} {"train_loss": -10.819537162780762, "global_step": 253140, "epoch": 1506} {"train_loss": -10.639983177185059, "global_step": 253141, "epoch": 1506} {"train_loss": -11.36627197265625, "global_step": 253142, "epoch": 1506} {"train_loss": -11.020223617553711, "global_step": 253143, "epoch": 1506} {"train_loss": -11.245326042175293, "global_step": 253144, "epoch": 1506} {"train_loss": -11.332490921020508, "global_step": 253145, "epoch": 1506} {"train_loss": -11.344303131103516, "global_step": 253146, "epoch": 1506} {"train_loss": -11.265886306762695, "global_step": 253147, "epoch": 1506} {"train_loss": -11.384222030639648, "global_step": 253148, "epoch": 1506} {"train_loss": -11.176766395568848, "global_step": 253149, "epoch": 1506} {"train_loss": -11.078954696655273, "global_step": 253150, "epoch": 1506} {"train_loss": -11.339811325073242, "global_step": 253151, "epoch": 1506} {"train_loss": -11.150108337402344, "global_step": 253152, "epoch": 1506} {"train_loss": -11.608531951904297, "global_step": 253153, "epoch": 1506} {"train_loss": -11.34741497039795, "global_step": 253154, "epoch": 1506} {"train_loss": -11.5640869140625, "global_step": 253155, "epoch": 1506} {"train_loss": -11.666720390319824, "global_step": 253156, "epoch": 1506} {"train_loss": -11.425886154174805, "global_step": 253157, "epoch": 1506} {"train_loss": -11.47484302520752, "global_step": 253158, "epoch": 1506} {"train_loss": -11.484060287475586, "global_step": 253159, "epoch": 1506} {"train_loss": -11.718440055847168, "global_step": 253160, "epoch": 1506} {"train_loss": -11.419032096862793, "global_step": 253161, "epoch": 1506} {"train_loss": -12.00913143157959, "global_step": 253162, "epoch": 1506} {"train_loss": -11.744097709655762, "global_step": 253163, "epoch": 1506} {"train_loss": -11.559776306152344, "global_step": 253164, "epoch": 1506} {"train_loss": -11.773458480834961, "global_step": 253165, "epoch": 1506} {"train_loss": -11.5822172164917, "global_step": 253166, "epoch": 1506} {"train_loss": -11.882484436035156, "global_step": 253167, "epoch": 1506} {"train_loss": -11.878023147583008, "global_step": 253168, "epoch": 1506} {"train_loss": -11.655317306518555, "global_step": 253169, "epoch": 1506} {"train_loss": -11.822768211364746, "global_step": 253170, "epoch": 1506} {"train_loss": -11.744935989379883, "global_step": 253171, "epoch": 1506} {"train_loss": -11.758857727050781, "global_step": 253172, "epoch": 1506} {"train_loss": -11.730621337890625, "global_step": 253173, "epoch": 1506} {"train_loss": -11.849843978881836, "global_step": 253174, "epoch": 1506} {"train_loss": -11.470684903008598, "global_step": 253175, "epoch": 1506, "val_loss": 271094.125} {"train_loss": -11.690183639526367, "global_step": 253176, "epoch": 1507} {"train_loss": -11.958256721496582, "global_step": 253177, "epoch": 1507} {"train_loss": -11.891912460327148, "global_step": 253178, "epoch": 1507} {"train_loss": -11.896190643310547, "global_step": 253179, "epoch": 1507} {"train_loss": -11.928577423095703, "global_step": 253180, "epoch": 1507} {"train_loss": -11.67603588104248, "global_step": 253181, "epoch": 1507} {"train_loss": -11.687494277954102, "global_step": 253182, "epoch": 1507} {"train_loss": -11.850101470947266, "global_step": 253183, "epoch": 1507} {"train_loss": -11.832584381103516, "global_step": 253184, "epoch": 1507} {"train_loss": -11.938653945922852, "global_step": 253185, "epoch": 1507} {"train_loss": -11.904472351074219, "global_step": 253186, "epoch": 1507} {"train_loss": -12.001753807067871, "global_step": 253187, "epoch": 1507} {"train_loss": -11.972726821899414, "global_step": 253188, "epoch": 1507} {"train_loss": -11.898181915283203, "global_step": 253189, "epoch": 1507} {"train_loss": -12.047199249267578, "global_step": 253190, "epoch": 1507} {"train_loss": -11.905532836914062, "global_step": 253191, "epoch": 1507} {"train_loss": -12.002043724060059, "global_step": 253192, "epoch": 1507} {"train_loss": -11.855225563049316, "global_step": 253193, "epoch": 1507} {"train_loss": -12.101837158203125, "global_step": 253194, "epoch": 1507} {"train_loss": -12.152402877807617, "global_step": 253195, "epoch": 1507} {"train_loss": -12.217338562011719, "global_step": 253196, "epoch": 1507} {"train_loss": -12.210311889648438, "global_step": 253197, "epoch": 1507} {"train_loss": -12.11808967590332, "global_step": 253198, "epoch": 1507} {"train_loss": -11.90845012664795, "global_step": 253199, "epoch": 1507} {"train_loss": -12.36898136138916, "global_step": 253200, "epoch": 1507} {"train_loss": -12.023340225219727, "global_step": 253201, "epoch": 1507} {"train_loss": -12.077217102050781, "global_step": 253202, "epoch": 1507} {"train_loss": -12.170967102050781, "global_step": 253203, "epoch": 1507} {"train_loss": -12.006782531738281, "global_step": 253204, "epoch": 1507} {"train_loss": -12.126806259155273, "global_step": 253205, "epoch": 1507} {"train_loss": -11.99909782409668, "global_step": 253206, "epoch": 1507} {"train_loss": -12.367406845092773, "global_step": 253207, "epoch": 1507} {"train_loss": -12.182686805725098, "global_step": 253208, "epoch": 1507} {"train_loss": -12.315567016601562, "global_step": 253209, "epoch": 1507} {"train_loss": -12.084556579589844, "global_step": 253210, "epoch": 1507} {"train_loss": -12.280211448669434, "global_step": 253211, "epoch": 1507} {"train_loss": -12.212844848632812, "global_step": 253212, "epoch": 1507} {"train_loss": -11.921350479125977, "global_step": 253213, "epoch": 1507} {"train_loss": -11.643522262573242, "global_step": 253214, "epoch": 1507} {"train_loss": -10.149947166442871, "global_step": 253215, "epoch": 1507} {"train_loss": -10.181337356567383, "global_step": 253216, "epoch": 1507} {"train_loss": -11.550887107849121, "global_step": 253217, "epoch": 1507} {"train_loss": -11.065269470214844, "global_step": 253218, "epoch": 1507} {"train_loss": -10.043282508850098, "global_step": 253219, "epoch": 1507} {"train_loss": -11.765710830688477, "global_step": 253220, "epoch": 1507} {"train_loss": -10.221015930175781, "global_step": 253221, "epoch": 1507} {"train_loss": -8.994083404541016, "global_step": 253222, "epoch": 1507} {"train_loss": -9.437223434448242, "global_step": 253223, "epoch": 1507} {"train_loss": -9.301773071289062, "global_step": 253224, "epoch": 1507} {"train_loss": -11.28309440612793, "global_step": 253225, "epoch": 1507} {"train_loss": -9.544333457946777, "global_step": 253226, "epoch": 1507} {"train_loss": -10.332036972045898, "global_step": 253227, "epoch": 1507} {"train_loss": -11.282703399658203, "global_step": 253228, "epoch": 1507} {"train_loss": -10.87667465209961, "global_step": 253229, "epoch": 1507} {"train_loss": -11.098648071289062, "global_step": 253230, "epoch": 1507} {"train_loss": -10.151424407958984, "global_step": 253231, "epoch": 1507} {"train_loss": -10.686113357543945, "global_step": 253232, "epoch": 1507} {"train_loss": -8.939859390258789, "global_step": 253233, "epoch": 1507} {"train_loss": -10.720442771911621, "global_step": 253234, "epoch": 1507} {"train_loss": -9.931041717529297, "global_step": 253235, "epoch": 1507} {"train_loss": -8.966632843017578, "global_step": 253236, "epoch": 1507} {"train_loss": -10.153546333312988, "global_step": 253237, "epoch": 1507} {"train_loss": -9.415693283081055, "global_step": 253238, "epoch": 1507} {"train_loss": -9.513973236083984, "global_step": 253239, "epoch": 1507} {"train_loss": -9.907894134521484, "global_step": 253240, "epoch": 1507} {"train_loss": -9.502283096313477, "global_step": 253241, "epoch": 1507} {"train_loss": -9.417596817016602, "global_step": 253242, "epoch": 1507} {"train_loss": -10.702048301696777, "global_step": 253243, "epoch": 1507} {"train_loss": -10.407331466674805, "global_step": 253244, "epoch": 1507} {"train_loss": -9.71827507019043, "global_step": 253245, "epoch": 1507} {"train_loss": -10.456296920776367, "global_step": 253246, "epoch": 1507} {"train_loss": -10.563989639282227, "global_step": 253247, "epoch": 1507} {"train_loss": -9.264269828796387, "global_step": 253248, "epoch": 1507} {"train_loss": -10.699026107788086, "global_step": 253249, "epoch": 1507} {"train_loss": -9.705711364746094, "global_step": 253250, "epoch": 1507} {"train_loss": -9.85965347290039, "global_step": 253251, "epoch": 1507} {"train_loss": -10.239907264709473, "global_step": 253252, "epoch": 1507} {"train_loss": -11.163528442382812, "global_step": 253253, "epoch": 1507} {"train_loss": -9.874530792236328, "global_step": 253254, "epoch": 1507} {"train_loss": -10.216876983642578, "global_step": 253255, "epoch": 1507} {"train_loss": -10.914249420166016, "global_step": 253256, "epoch": 1507} {"train_loss": -10.630766868591309, "global_step": 253257, "epoch": 1507} {"train_loss": -10.750886917114258, "global_step": 253258, "epoch": 1507} {"train_loss": -11.46070384979248, "global_step": 253259, "epoch": 1507} {"train_loss": -10.731002807617188, "global_step": 253260, "epoch": 1507} {"train_loss": -11.027420043945312, "global_step": 253261, "epoch": 1507} {"train_loss": -11.384370803833008, "global_step": 253262, "epoch": 1507} {"train_loss": -10.624195098876953, "global_step": 253263, "epoch": 1507} {"train_loss": -11.057117462158203, "global_step": 253264, "epoch": 1507} {"train_loss": -11.439628601074219, "global_step": 253265, "epoch": 1507} {"train_loss": -11.097906112670898, "global_step": 253266, "epoch": 1507} {"train_loss": -10.842317581176758, "global_step": 253267, "epoch": 1507} {"train_loss": -11.473512649536133, "global_step": 253268, "epoch": 1507} {"train_loss": -11.203914642333984, "global_step": 253269, "epoch": 1507} {"train_loss": -11.302657127380371, "global_step": 253270, "epoch": 1507} {"train_loss": -11.426217079162598, "global_step": 253271, "epoch": 1507} {"train_loss": -11.246695518493652, "global_step": 253272, "epoch": 1507} {"train_loss": -11.533049583435059, "global_step": 253273, "epoch": 1507} {"train_loss": -11.56450080871582, "global_step": 253274, "epoch": 1507} {"train_loss": -11.480452537536621, "global_step": 253275, "epoch": 1507} {"train_loss": -11.530866622924805, "global_step": 253276, "epoch": 1507} {"train_loss": -11.40615463256836, "global_step": 253277, "epoch": 1507} {"train_loss": -11.552724838256836, "global_step": 253278, "epoch": 1507} {"train_loss": -11.695842742919922, "global_step": 253279, "epoch": 1507} {"train_loss": -11.595144271850586, "global_step": 253280, "epoch": 1507} {"train_loss": -11.823285102844238, "global_step": 253281, "epoch": 1507} {"train_loss": -11.770037651062012, "global_step": 253282, "epoch": 1507} {"train_loss": -11.498102188110352, "global_step": 253283, "epoch": 1507} {"train_loss": -11.69771957397461, "global_step": 253284, "epoch": 1507} {"train_loss": -11.736886978149414, "global_step": 253285, "epoch": 1507} {"train_loss": -11.552282333374023, "global_step": 253286, "epoch": 1507} {"train_loss": -11.66733455657959, "global_step": 253287, "epoch": 1507} {"train_loss": -11.900337219238281, "global_step": 253288, "epoch": 1507} {"train_loss": -11.824729919433594, "global_step": 253289, "epoch": 1507} {"train_loss": -11.86355972290039, "global_step": 253290, "epoch": 1507} {"train_loss": -11.696725845336914, "global_step": 253291, "epoch": 1507} {"train_loss": -11.853290557861328, "global_step": 253292, "epoch": 1507} {"train_loss": -11.626522064208984, "global_step": 253293, "epoch": 1507} {"train_loss": -11.614518165588379, "global_step": 253294, "epoch": 1507} {"train_loss": -11.735121726989746, "global_step": 253295, "epoch": 1507} {"train_loss": -11.758099555969238, "global_step": 253296, "epoch": 1507} {"train_loss": -11.759597778320312, "global_step": 253297, "epoch": 1507} {"train_loss": -11.736648559570312, "global_step": 253298, "epoch": 1507} {"train_loss": -11.660154342651367, "global_step": 253299, "epoch": 1507} {"train_loss": -11.650142669677734, "global_step": 253300, "epoch": 1507} {"train_loss": -11.630023956298828, "global_step": 253301, "epoch": 1507} {"train_loss": -11.6534423828125, "global_step": 253302, "epoch": 1507} {"train_loss": -11.925132751464844, "global_step": 253303, "epoch": 1507} {"train_loss": -11.772048950195312, "global_step": 253304, "epoch": 1507} {"train_loss": -11.78554916381836, "global_step": 253305, "epoch": 1507} {"train_loss": -11.959601402282715, "global_step": 253306, "epoch": 1507} {"train_loss": -11.855691909790039, "global_step": 253307, "epoch": 1507} {"train_loss": -11.815447807312012, "global_step": 253308, "epoch": 1507} {"train_loss": -11.926098823547363, "global_step": 253309, "epoch": 1507} {"train_loss": -11.897985458374023, "global_step": 253310, "epoch": 1507} {"train_loss": -12.164134979248047, "global_step": 253311, "epoch": 1507} {"train_loss": -12.007062911987305, "global_step": 253312, "epoch": 1507} {"train_loss": -12.073110580444336, "global_step": 253313, "epoch": 1507} {"train_loss": -11.805553436279297, "global_step": 253314, "epoch": 1507} {"train_loss": -12.019232749938965, "global_step": 253315, "epoch": 1507} {"train_loss": -12.045110702514648, "global_step": 253316, "epoch": 1507} {"train_loss": -11.92608642578125, "global_step": 253317, "epoch": 1507} {"train_loss": -11.941312789916992, "global_step": 253318, "epoch": 1507} {"train_loss": -12.025579452514648, "global_step": 253319, "epoch": 1507} {"train_loss": -12.26664924621582, "global_step": 253320, "epoch": 1507} {"train_loss": -12.24111557006836, "global_step": 253321, "epoch": 1507} {"train_loss": -12.174527168273926, "global_step": 253322, "epoch": 1507} {"train_loss": -11.94832992553711, "global_step": 253323, "epoch": 1507} {"train_loss": -12.008102416992188, "global_step": 253324, "epoch": 1507} {"train_loss": -12.176877975463867, "global_step": 253325, "epoch": 1507} {"train_loss": -12.133668899536133, "global_step": 253326, "epoch": 1507} {"train_loss": -12.166481018066406, "global_step": 253327, "epoch": 1507} {"train_loss": -12.263202667236328, "global_step": 253328, "epoch": 1507} {"train_loss": -12.11272144317627, "global_step": 253329, "epoch": 1507} {"train_loss": -12.171208381652832, "global_step": 253330, "epoch": 1507} {"train_loss": -12.240837097167969, "global_step": 253331, "epoch": 1507} {"train_loss": -12.241171836853027, "global_step": 253332, "epoch": 1507} {"train_loss": -12.07278060913086, "global_step": 253333, "epoch": 1507} {"train_loss": -12.150073051452637, "global_step": 253334, "epoch": 1507} {"train_loss": -12.033936500549316, "global_step": 253335, "epoch": 1507} {"train_loss": -11.713340759277344, "global_step": 253336, "epoch": 1507} {"train_loss": -12.129002571105957, "global_step": 253337, "epoch": 1507} {"train_loss": -11.811190605163574, "global_step": 253338, "epoch": 1507} {"train_loss": -11.198637008666992, "global_step": 253339, "epoch": 1507} {"train_loss": -12.100757598876953, "global_step": 253340, "epoch": 1507} {"train_loss": -11.756195068359375, "global_step": 253341, "epoch": 1507} {"train_loss": -11.705364227294922, "global_step": 253342, "epoch": 1507} {"train_loss": -11.405021843456087, "global_step": 253343, "epoch": 1507, "val_loss": 270726.71875} {"train_loss": -11.182897567749023, "global_step": 253344, "epoch": 1508} {"train_loss": -11.191448211669922, "global_step": 253345, "epoch": 1508} {"train_loss": -11.699115753173828, "global_step": 253346, "epoch": 1508} {"train_loss": -11.921219825744629, "global_step": 253347, "epoch": 1508} {"train_loss": -11.098411560058594, "global_step": 253348, "epoch": 1508} {"train_loss": -11.080863952636719, "global_step": 253349, "epoch": 1508} {"train_loss": -11.531810760498047, "global_step": 253350, "epoch": 1508} {"train_loss": -11.681215286254883, "global_step": 253351, "epoch": 1508} {"train_loss": -9.429082870483398, "global_step": 253352, "epoch": 1508} {"train_loss": -11.026544570922852, "global_step": 253353, "epoch": 1508} {"train_loss": -10.99374771118164, "global_step": 253354, "epoch": 1508} {"train_loss": -9.213846206665039, "global_step": 253355, "epoch": 1508} {"train_loss": -10.58039665222168, "global_step": 253356, "epoch": 1508} {"train_loss": -8.765411376953125, "global_step": 253357, "epoch": 1508} {"train_loss": -8.872987747192383, "global_step": 253358, "epoch": 1508} {"train_loss": -9.059259414672852, "global_step": 253359, "epoch": 1508} {"train_loss": -11.060148239135742, "global_step": 253360, "epoch": 1508} {"train_loss": -8.974952697753906, "global_step": 253361, "epoch": 1508} {"train_loss": -11.015721321105957, "global_step": 253362, "epoch": 1508} {"train_loss": -10.536224365234375, "global_step": 253363, "epoch": 1508} {"train_loss": -9.946516036987305, "global_step": 253364, "epoch": 1508} {"train_loss": -9.359237670898438, "global_step": 253365, "epoch": 1508} {"train_loss": -10.748371124267578, "global_step": 253366, "epoch": 1508} {"train_loss": -9.235246658325195, "global_step": 253367, "epoch": 1508} {"train_loss": -10.47193717956543, "global_step": 253368, "epoch": 1508} {"train_loss": -8.632181167602539, "global_step": 253369, "epoch": 1508} {"train_loss": -10.323291778564453, "global_step": 253370, "epoch": 1508} {"train_loss": -8.89810562133789, "global_step": 253371, "epoch": 1508} {"train_loss": -10.374103546142578, "global_step": 253372, "epoch": 1508} {"train_loss": -9.72145938873291, "global_step": 253373, "epoch": 1508} {"train_loss": -8.586435317993164, "global_step": 253374, "epoch": 1508} {"train_loss": -10.107912063598633, "global_step": 253375, "epoch": 1508} {"train_loss": -9.651562690734863, "global_step": 253376, "epoch": 1508} {"train_loss": -8.887951850891113, "global_step": 253377, "epoch": 1508} {"train_loss": -9.428255081176758, "global_step": 253378, "epoch": 1508} {"train_loss": -10.380828857421875, "global_step": 253379, "epoch": 1508} {"train_loss": -9.228264808654785, "global_step": 253380, "epoch": 1508} {"train_loss": -9.003458023071289, "global_step": 253381, "epoch": 1508} {"train_loss": -10.800302505493164, "global_step": 253382, "epoch": 1508} {"train_loss": -7.7711181640625, "global_step": 253383, "epoch": 1508} {"train_loss": -8.777832984924316, "global_step": 253384, "epoch": 1508} {"train_loss": -10.917546272277832, "global_step": 253385, "epoch": 1508} {"train_loss": -10.313520431518555, "global_step": 253386, "epoch": 1508} {"train_loss": -9.943394660949707, "global_step": 253387, "epoch": 1508} {"train_loss": -10.911620140075684, "global_step": 253388, "epoch": 1508} {"train_loss": -10.087728500366211, "global_step": 253389, "epoch": 1508} {"train_loss": -10.635066986083984, "global_step": 253390, "epoch": 1508} {"train_loss": -11.021864891052246, "global_step": 253391, "epoch": 1508} {"train_loss": -10.045814514160156, "global_step": 253392, "epoch": 1508} {"train_loss": -10.923239707946777, "global_step": 253393, "epoch": 1508} {"train_loss": -11.102453231811523, "global_step": 253394, "epoch": 1508} {"train_loss": -10.615155220031738, "global_step": 253395, "epoch": 1508} {"train_loss": -11.19066333770752, "global_step": 253396, "epoch": 1508} {"train_loss": -10.93756103515625, "global_step": 253397, "epoch": 1508} {"train_loss": -10.805074691772461, "global_step": 253398, "epoch": 1508} {"train_loss": -11.019258499145508, "global_step": 253399, "epoch": 1508} {"train_loss": -11.084549903869629, "global_step": 253400, "epoch": 1508} {"train_loss": -10.995140075683594, "global_step": 253401, "epoch": 1508} {"train_loss": -11.02027702331543, "global_step": 253402, "epoch": 1508} {"train_loss": -10.948776245117188, "global_step": 253403, "epoch": 1508} {"train_loss": -11.055994033813477, "global_step": 253404, "epoch": 1508} {"train_loss": -11.067056655883789, "global_step": 253405, "epoch": 1508} {"train_loss": -10.911848068237305, "global_step": 253406, "epoch": 1508} {"train_loss": -11.144590377807617, "global_step": 253407, "epoch": 1508} {"train_loss": -11.21362590789795, "global_step": 253408, "epoch": 1508} {"train_loss": -11.203094482421875, "global_step": 253409, "epoch": 1508} {"train_loss": -10.995195388793945, "global_step": 253410, "epoch": 1508} {"train_loss": -10.908075332641602, "global_step": 253411, "epoch": 1508} {"train_loss": -10.9903564453125, "global_step": 253412, "epoch": 1508} {"train_loss": -11.567296028137207, "global_step": 253413, "epoch": 1508} {"train_loss": -10.769601821899414, "global_step": 253414, "epoch": 1508} {"train_loss": -11.237001419067383, "global_step": 253415, "epoch": 1508} {"train_loss": -11.295856475830078, "global_step": 253416, "epoch": 1508} {"train_loss": -11.148950576782227, "global_step": 253417, "epoch": 1508} {"train_loss": -11.272001266479492, "global_step": 253418, "epoch": 1508} {"train_loss": -11.41781997680664, "global_step": 253419, "epoch": 1508} {"train_loss": -11.27060604095459, "global_step": 253420, "epoch": 1508} {"train_loss": -11.509943962097168, "global_step": 253421, "epoch": 1508} {"train_loss": -11.428654670715332, "global_step": 253422, "epoch": 1508} {"train_loss": -11.311151504516602, "global_step": 253423, "epoch": 1508} {"train_loss": -11.46401309967041, "global_step": 253424, "epoch": 1508} {"train_loss": -11.366376876831055, "global_step": 253425, "epoch": 1508} {"train_loss": -11.380800247192383, "global_step": 253426, "epoch": 1508} {"train_loss": -11.63132095336914, "global_step": 253427, "epoch": 1508} {"train_loss": -11.776998519897461, "global_step": 253428, "epoch": 1508} {"train_loss": -11.655755996704102, "global_step": 253429, "epoch": 1508} {"train_loss": -11.5438814163208, "global_step": 253430, "epoch": 1508} {"train_loss": -11.741384506225586, "global_step": 253431, "epoch": 1508} {"train_loss": -11.689430236816406, "global_step": 253432, "epoch": 1508} {"train_loss": -11.602520942687988, "global_step": 253433, "epoch": 1508} {"train_loss": -11.58397388458252, "global_step": 253434, "epoch": 1508} {"train_loss": -11.699533462524414, "global_step": 253435, "epoch": 1508} {"train_loss": -11.817500114440918, "global_step": 253436, "epoch": 1508} {"train_loss": -11.877927780151367, "global_step": 253437, "epoch": 1508} {"train_loss": -11.818042755126953, "global_step": 253438, "epoch": 1508} {"train_loss": -11.74914264678955, "global_step": 253439, "epoch": 1508} {"train_loss": -11.86197566986084, "global_step": 253440, "epoch": 1508} {"train_loss": -11.72326946258545, "global_step": 253441, "epoch": 1508} {"train_loss": -11.798992156982422, "global_step": 253442, "epoch": 1508} {"train_loss": -11.857791900634766, "global_step": 253443, "epoch": 1508} {"train_loss": -11.938782691955566, "global_step": 253444, "epoch": 1508} {"train_loss": -11.810441970825195, "global_step": 253445, "epoch": 1508} {"train_loss": -11.797240257263184, "global_step": 253446, "epoch": 1508} {"train_loss": -11.919894218444824, "global_step": 253447, "epoch": 1508} {"train_loss": -11.729676246643066, "global_step": 253448, "epoch": 1508} {"train_loss": -12.003371238708496, "global_step": 253449, "epoch": 1508} {"train_loss": -11.902639389038086, "global_step": 253450, "epoch": 1508} {"train_loss": -11.889484405517578, "global_step": 253451, "epoch": 1508} {"train_loss": -11.97159194946289, "global_step": 253452, "epoch": 1508} {"train_loss": -11.995647430419922, "global_step": 253453, "epoch": 1508} {"train_loss": -11.997758865356445, "global_step": 253454, "epoch": 1508} {"train_loss": -11.938918113708496, "global_step": 253455, "epoch": 1508} {"train_loss": -11.81106185913086, "global_step": 253456, "epoch": 1508} {"train_loss": -12.185042381286621, "global_step": 253457, "epoch": 1508} {"train_loss": -11.916034698486328, "global_step": 253458, "epoch": 1508} {"train_loss": -11.987979888916016, "global_step": 253459, "epoch": 1508} {"train_loss": -12.0949068069458, "global_step": 253460, "epoch": 1508} {"train_loss": -11.988555908203125, "global_step": 253461, "epoch": 1508} {"train_loss": -12.239126205444336, "global_step": 253462, "epoch": 1508} {"train_loss": -12.108966827392578, "global_step": 253463, "epoch": 1508} {"train_loss": -12.179430961608887, "global_step": 253464, "epoch": 1508} {"train_loss": -12.159781455993652, "global_step": 253465, "epoch": 1508} {"train_loss": -12.217046737670898, "global_step": 253466, "epoch": 1508} {"train_loss": -11.83714485168457, "global_step": 253467, "epoch": 1508} {"train_loss": -12.125967979431152, "global_step": 253468, "epoch": 1508} {"train_loss": -11.924798965454102, "global_step": 253469, "epoch": 1508} {"train_loss": -12.130423545837402, "global_step": 253470, "epoch": 1508} {"train_loss": -12.100669860839844, "global_step": 253471, "epoch": 1508} {"train_loss": -12.051826477050781, "global_step": 253472, "epoch": 1508} {"train_loss": -12.057473182678223, "global_step": 253473, "epoch": 1508} {"train_loss": -11.722339630126953, "global_step": 253474, "epoch": 1508} {"train_loss": -11.63046646118164, "global_step": 253475, "epoch": 1508} {"train_loss": -12.255603790283203, "global_step": 253476, "epoch": 1508} {"train_loss": -11.854347229003906, "global_step": 253477, "epoch": 1508} {"train_loss": -11.513164520263672, "global_step": 253478, "epoch": 1508} {"train_loss": -11.996337890625, "global_step": 253479, "epoch": 1508} {"train_loss": -12.253203392028809, "global_step": 253480, "epoch": 1508} {"train_loss": -11.484532356262207, "global_step": 253481, "epoch": 1508} {"train_loss": -11.99224853515625, "global_step": 253482, "epoch": 1508} {"train_loss": -12.176183700561523, "global_step": 253483, "epoch": 1508} {"train_loss": -11.768390655517578, "global_step": 253484, "epoch": 1508} {"train_loss": -11.564765930175781, "global_step": 253485, "epoch": 1508} {"train_loss": -11.820201873779297, "global_step": 253486, "epoch": 1508} {"train_loss": -12.047367095947266, "global_step": 253487, "epoch": 1508} {"train_loss": -12.072487831115723, "global_step": 253488, "epoch": 1508} {"train_loss": -11.920442581176758, "global_step": 253489, "epoch": 1508} {"train_loss": -12.339889526367188, "global_step": 253490, "epoch": 1508} {"train_loss": -12.252851486206055, "global_step": 253491, "epoch": 1508} {"train_loss": -12.04057502746582, "global_step": 253492, "epoch": 1508} {"train_loss": -12.164361953735352, "global_step": 253493, "epoch": 1508} {"train_loss": -12.094461441040039, "global_step": 253494, "epoch": 1508} {"train_loss": -12.185026168823242, "global_step": 253495, "epoch": 1508} {"train_loss": -11.82184886932373, "global_step": 253496, "epoch": 1508} {"train_loss": -12.045713424682617, "global_step": 253497, "epoch": 1508} {"train_loss": -12.253159523010254, "global_step": 253498, "epoch": 1508} {"train_loss": -12.000717163085938, "global_step": 253499, "epoch": 1508} {"train_loss": -11.776931762695312, "global_step": 253500, "epoch": 1508} {"train_loss": -11.492368698120117, "global_step": 253501, "epoch": 1508} {"train_loss": -12.041924476623535, "global_step": 253502, "epoch": 1508} {"train_loss": -11.314396858215332, "global_step": 253503, "epoch": 1508} {"train_loss": -11.368973731994629, "global_step": 253504, "epoch": 1508} {"train_loss": -11.906961441040039, "global_step": 253505, "epoch": 1508} {"train_loss": -11.768162727355957, "global_step": 253506, "epoch": 1508} {"train_loss": -11.403566360473633, "global_step": 253507, "epoch": 1508} {"train_loss": -11.459463119506836, "global_step": 253508, "epoch": 1508} {"train_loss": -11.858261108398438, "global_step": 253509, "epoch": 1508} {"train_loss": -11.735149383544922, "global_step": 253510, "epoch": 1508} {"train_loss": -11.212424914042154, "global_step": 253511, "epoch": 1508, "val_loss": 266324.03125} {"train_loss": -11.165862083435059, "global_step": 253512, "epoch": 1509} {"train_loss": -10.858338356018066, "global_step": 253513, "epoch": 1509} {"train_loss": -10.841207504272461, "global_step": 253514, "epoch": 1509} {"train_loss": -11.533208847045898, "global_step": 253515, "epoch": 1509} {"train_loss": -10.284451484680176, "global_step": 253516, "epoch": 1509} {"train_loss": -10.703353881835938, "global_step": 253517, "epoch": 1509} {"train_loss": -9.58456039428711, "global_step": 253518, "epoch": 1509} {"train_loss": -10.968149185180664, "global_step": 253519, "epoch": 1509} {"train_loss": -10.331180572509766, "global_step": 253520, "epoch": 1509} {"train_loss": -9.816566467285156, "global_step": 253521, "epoch": 1509} {"train_loss": -11.304080963134766, "global_step": 253522, "epoch": 1509} {"train_loss": -9.721012115478516, "global_step": 253523, "epoch": 1509} {"train_loss": -10.30876350402832, "global_step": 253524, "epoch": 1509} {"train_loss": -9.845512390136719, "global_step": 253525, "epoch": 1509} {"train_loss": -9.724237442016602, "global_step": 253526, "epoch": 1509} {"train_loss": -9.690267562866211, "global_step": 253527, "epoch": 1509} {"train_loss": -9.600627899169922, "global_step": 253528, "epoch": 1509} {"train_loss": -9.337451934814453, "global_step": 253529, "epoch": 1509} {"train_loss": -9.855060577392578, "global_step": 253530, "epoch": 1509} {"train_loss": -9.981095314025879, "global_step": 253531, "epoch": 1509} {"train_loss": -10.617379188537598, "global_step": 253532, "epoch": 1509} {"train_loss": -9.57429027557373, "global_step": 253533, "epoch": 1509} {"train_loss": -9.332320213317871, "global_step": 253534, "epoch": 1509} {"train_loss": -10.874706268310547, "global_step": 253535, "epoch": 1509} {"train_loss": -10.1731595993042, "global_step": 253536, "epoch": 1509} {"train_loss": -10.708054542541504, "global_step": 253537, "epoch": 1509} {"train_loss": -10.174514770507812, "global_step": 253538, "epoch": 1509} {"train_loss": -10.83053207397461, "global_step": 253539, "epoch": 1509} {"train_loss": -10.066322326660156, "global_step": 253540, "epoch": 1509} {"train_loss": -11.358047485351562, "global_step": 253541, "epoch": 1509} {"train_loss": -10.831441879272461, "global_step": 253542, "epoch": 1509} {"train_loss": -11.223989486694336, "global_step": 253543, "epoch": 1509} {"train_loss": -11.023366928100586, "global_step": 253544, "epoch": 1509} {"train_loss": -11.249752044677734, "global_step": 253545, "epoch": 1509} {"train_loss": -11.2140531539917, "global_step": 253546, "epoch": 1509} {"train_loss": -11.39052963256836, "global_step": 253547, "epoch": 1509} {"train_loss": -11.144969940185547, "global_step": 253548, "epoch": 1509} {"train_loss": -11.71345329284668, "global_step": 253549, "epoch": 1509} {"train_loss": -11.71458625793457, "global_step": 253550, "epoch": 1509} {"train_loss": -11.434759140014648, "global_step": 253551, "epoch": 1509} {"train_loss": -11.64833927154541, "global_step": 253552, "epoch": 1509} {"train_loss": -11.553426742553711, "global_step": 253553, "epoch": 1509} {"train_loss": -11.516866683959961, "global_step": 253554, "epoch": 1509} {"train_loss": -11.831681251525879, "global_step": 253555, "epoch": 1509} {"train_loss": -11.557443618774414, "global_step": 253556, "epoch": 1509} {"train_loss": -11.478157997131348, "global_step": 253557, "epoch": 1509} {"train_loss": -11.500732421875, "global_step": 253558, "epoch": 1509} {"train_loss": -11.55441665649414, "global_step": 253559, "epoch": 1509} {"train_loss": -11.74891471862793, "global_step": 253560, "epoch": 1509} {"train_loss": -11.724825859069824, "global_step": 253561, "epoch": 1509} {"train_loss": -11.393680572509766, "global_step": 253562, "epoch": 1509} {"train_loss": -11.692161560058594, "global_step": 253563, "epoch": 1509} {"train_loss": -11.734262466430664, "global_step": 253564, "epoch": 1509} {"train_loss": -11.718389511108398, "global_step": 253565, "epoch": 1509} {"train_loss": -11.6823148727417, "global_step": 253566, "epoch": 1509} {"train_loss": -11.931687355041504, "global_step": 253567, "epoch": 1509} {"train_loss": -11.642541885375977, "global_step": 253568, "epoch": 1509} {"train_loss": -11.6289644241333, "global_step": 253569, "epoch": 1509} {"train_loss": -11.712041854858398, "global_step": 253570, "epoch": 1509} {"train_loss": -11.874818801879883, "global_step": 253571, "epoch": 1509} {"train_loss": -11.823172569274902, "global_step": 253572, "epoch": 1509} {"train_loss": -11.947053909301758, "global_step": 253573, "epoch": 1509} {"train_loss": -11.864957809448242, "global_step": 253574, "epoch": 1509} {"train_loss": -11.97783088684082, "global_step": 253575, "epoch": 1509} {"train_loss": -12.008115768432617, "global_step": 253576, "epoch": 1509} {"train_loss": -11.945663452148438, "global_step": 253577, "epoch": 1509} {"train_loss": -11.98161506652832, "global_step": 253578, "epoch": 1509} {"train_loss": -12.0747709274292, "global_step": 253579, "epoch": 1509} {"train_loss": -11.879644393920898, "global_step": 253580, "epoch": 1509} {"train_loss": -11.899486541748047, "global_step": 253581, "epoch": 1509} {"train_loss": -11.724544525146484, "global_step": 253582, "epoch": 1509} {"train_loss": -12.118931770324707, "global_step": 253583, "epoch": 1509} {"train_loss": -11.820643424987793, "global_step": 253584, "epoch": 1509} {"train_loss": -12.012920379638672, "global_step": 253585, "epoch": 1509} {"train_loss": -11.770048141479492, "global_step": 253586, "epoch": 1509} {"train_loss": -11.857612609863281, "global_step": 253587, "epoch": 1509} {"train_loss": -11.80476188659668, "global_step": 253588, "epoch": 1509} {"train_loss": -11.932219505310059, "global_step": 253589, "epoch": 1509} {"train_loss": -12.07844066619873, "global_step": 253590, "epoch": 1509} {"train_loss": -12.103872299194336, "global_step": 253591, "epoch": 1509} {"train_loss": -11.885810852050781, "global_step": 253592, "epoch": 1509} {"train_loss": -12.210780143737793, "global_step": 253593, "epoch": 1509} {"train_loss": -11.890044212341309, "global_step": 253594, "epoch": 1509} {"train_loss": -12.183290481567383, "global_step": 253595, "epoch": 1509} {"train_loss": -12.108773231506348, "global_step": 253596, "epoch": 1509} {"train_loss": -12.153985977172852, "global_step": 253597, "epoch": 1509} {"train_loss": -11.965275764465332, "global_step": 253598, "epoch": 1509} {"train_loss": -11.925050735473633, "global_step": 253599, "epoch": 1509} {"train_loss": -11.927482604980469, "global_step": 253600, "epoch": 1509} {"train_loss": -12.128303527832031, "global_step": 253601, "epoch": 1509} {"train_loss": -12.280208587646484, "global_step": 253602, "epoch": 1509} {"train_loss": -12.022489547729492, "global_step": 253603, "epoch": 1509} {"train_loss": -12.228617668151855, "global_step": 253604, "epoch": 1509} {"train_loss": -12.10120677947998, "global_step": 253605, "epoch": 1509} {"train_loss": -12.111688613891602, "global_step": 253606, "epoch": 1509} {"train_loss": -11.85169792175293, "global_step": 253607, "epoch": 1509} {"train_loss": -12.157029151916504, "global_step": 253608, "epoch": 1509} {"train_loss": -12.342077255249023, "global_step": 253609, "epoch": 1509} {"train_loss": -12.01529312133789, "global_step": 253610, "epoch": 1509} {"train_loss": -12.156122207641602, "global_step": 253611, "epoch": 1509} {"train_loss": -12.237961769104004, "global_step": 253612, "epoch": 1509} {"train_loss": -11.923501014709473, "global_step": 253613, "epoch": 1509} {"train_loss": -11.55384635925293, "global_step": 253614, "epoch": 1509} {"train_loss": -12.2999267578125, "global_step": 253615, "epoch": 1509} {"train_loss": -11.808255195617676, "global_step": 253616, "epoch": 1509} {"train_loss": -11.819629669189453, "global_step": 253617, "epoch": 1509} {"train_loss": -11.938337326049805, "global_step": 253618, "epoch": 1509} {"train_loss": -12.26037883758545, "global_step": 253619, "epoch": 1509} {"train_loss": -11.821235656738281, "global_step": 253620, "epoch": 1509} {"train_loss": -12.033848762512207, "global_step": 253621, "epoch": 1509} {"train_loss": -11.790464401245117, "global_step": 253622, "epoch": 1509} {"train_loss": -12.185291290283203, "global_step": 253623, "epoch": 1509} {"train_loss": -11.658732414245605, "global_step": 253624, "epoch": 1509} {"train_loss": -12.06476879119873, "global_step": 253625, "epoch": 1509} {"train_loss": -11.919713973999023, "global_step": 253626, "epoch": 1509} {"train_loss": -11.782190322875977, "global_step": 253627, "epoch": 1509} {"train_loss": -11.824423789978027, "global_step": 253628, "epoch": 1509} {"train_loss": -11.596896171569824, "global_step": 253629, "epoch": 1509} {"train_loss": -11.917961120605469, "global_step": 253630, "epoch": 1509} {"train_loss": -11.716267585754395, "global_step": 253631, "epoch": 1509} {"train_loss": -12.046098709106445, "global_step": 253632, "epoch": 1509} {"train_loss": -11.81669807434082, "global_step": 253633, "epoch": 1509} {"train_loss": -12.039336204528809, "global_step": 253634, "epoch": 1509} {"train_loss": -11.864368438720703, "global_step": 253635, "epoch": 1509} {"train_loss": -11.708234786987305, "global_step": 253636, "epoch": 1509} {"train_loss": -12.110862731933594, "global_step": 253637, "epoch": 1509} {"train_loss": -11.625534057617188, "global_step": 253638, "epoch": 1509} {"train_loss": -11.9243745803833, "global_step": 253639, "epoch": 1509} {"train_loss": -10.803556442260742, "global_step": 253640, "epoch": 1509} {"train_loss": -12.058231353759766, "global_step": 253641, "epoch": 1509} {"train_loss": -10.654525756835938, "global_step": 253642, "epoch": 1509} {"train_loss": -10.846424102783203, "global_step": 253643, "epoch": 1509} {"train_loss": -11.400121688842773, "global_step": 253644, "epoch": 1509} {"train_loss": -11.629674911499023, "global_step": 253645, "epoch": 1509} {"train_loss": -11.523351669311523, "global_step": 253646, "epoch": 1509} {"train_loss": -11.382808685302734, "global_step": 253647, "epoch": 1509} {"train_loss": -11.975600242614746, "global_step": 253648, "epoch": 1509} {"train_loss": -10.627119064331055, "global_step": 253649, "epoch": 1509} {"train_loss": -11.036648750305176, "global_step": 253650, "epoch": 1509} {"train_loss": -9.948369026184082, "global_step": 253651, "epoch": 1509} {"train_loss": -11.567346572875977, "global_step": 253652, "epoch": 1509} {"train_loss": -10.72995376586914, "global_step": 253653, "epoch": 1509} {"train_loss": -10.707025527954102, "global_step": 253654, "epoch": 1509} {"train_loss": -11.195694923400879, "global_step": 253655, "epoch": 1509} {"train_loss": -10.204254150390625, "global_step": 253656, "epoch": 1509} {"train_loss": -11.469747543334961, "global_step": 253657, "epoch": 1509} {"train_loss": -10.86445426940918, "global_step": 253658, "epoch": 1509} {"train_loss": -11.33059310913086, "global_step": 253659, "epoch": 1509} {"train_loss": -11.14106273651123, "global_step": 253660, "epoch": 1509} {"train_loss": -10.728313446044922, "global_step": 253661, "epoch": 1509} {"train_loss": -11.383720397949219, "global_step": 253662, "epoch": 1509} {"train_loss": -11.152748107910156, "global_step": 253663, "epoch": 1509} {"train_loss": -11.591865539550781, "global_step": 253664, "epoch": 1509} {"train_loss": -11.071772575378418, "global_step": 253665, "epoch": 1509} {"train_loss": -11.688786506652832, "global_step": 253666, "epoch": 1509} {"train_loss": -11.545408248901367, "global_step": 253667, "epoch": 1509} {"train_loss": -11.965553283691406, "global_step": 253668, "epoch": 1509} {"train_loss": -11.501144409179688, "global_step": 253669, "epoch": 1509} {"train_loss": -11.605141639709473, "global_step": 253670, "epoch": 1509} {"train_loss": -11.858062744140625, "global_step": 253671, "epoch": 1509} {"train_loss": -11.492177963256836, "global_step": 253672, "epoch": 1509} {"train_loss": -11.795055389404297, "global_step": 253673, "epoch": 1509} {"train_loss": -11.72512435913086, "global_step": 253674, "epoch": 1509} {"train_loss": -11.883288383483887, "global_step": 253675, "epoch": 1509} {"train_loss": -11.323684692382812, "global_step": 253676, "epoch": 1509} {"train_loss": -11.73554801940918, "global_step": 253677, "epoch": 1509} {"train_loss": -11.65189266204834, "global_step": 253678, "epoch": 1509} {"train_loss": -11.436795694487435, "global_step": 253679, "epoch": 1509, "val_loss": 269392.84375} {"train_loss": -11.875242233276367, "global_step": 253680, "epoch": 1510} {"train_loss": -11.90665054321289, "global_step": 253681, "epoch": 1510} {"train_loss": -12.074767112731934, "global_step": 253682, "epoch": 1510} {"train_loss": -11.550742149353027, "global_step": 253683, "epoch": 1510} {"train_loss": -11.593870162963867, "global_step": 253684, "epoch": 1510} {"train_loss": -11.874162673950195, "global_step": 253685, "epoch": 1510} {"train_loss": -11.51327133178711, "global_step": 253686, "epoch": 1510} {"train_loss": -11.852706909179688, "global_step": 253687, "epoch": 1510} {"train_loss": -11.792083740234375, "global_step": 253688, "epoch": 1510} {"train_loss": -11.67957592010498, "global_step": 253689, "epoch": 1510} {"train_loss": -12.015386581420898, "global_step": 253690, "epoch": 1510} {"train_loss": -11.879173278808594, "global_step": 253691, "epoch": 1510} {"train_loss": -11.990043640136719, "global_step": 253692, "epoch": 1510} {"train_loss": -11.978336334228516, "global_step": 253693, "epoch": 1510} {"train_loss": -11.895742416381836, "global_step": 253694, "epoch": 1510} {"train_loss": -11.913734436035156, "global_step": 253695, "epoch": 1510} {"train_loss": -11.606281280517578, "global_step": 253696, "epoch": 1510} {"train_loss": -12.023998260498047, "global_step": 253697, "epoch": 1510} {"train_loss": -12.020299911499023, "global_step": 253698, "epoch": 1510} {"train_loss": -11.971376419067383, "global_step": 253699, "epoch": 1510} {"train_loss": -12.100798606872559, "global_step": 253700, "epoch": 1510} {"train_loss": -11.872135162353516, "global_step": 253701, "epoch": 1510} {"train_loss": -12.270498275756836, "global_step": 253702, "epoch": 1510} {"train_loss": -12.025116920471191, "global_step": 253703, "epoch": 1510} {"train_loss": -12.14566421508789, "global_step": 253704, "epoch": 1510} {"train_loss": -12.17556381225586, "global_step": 253705, "epoch": 1510} {"train_loss": -11.843792915344238, "global_step": 253706, "epoch": 1510} {"train_loss": -11.956762313842773, "global_step": 253707, "epoch": 1510} {"train_loss": -11.85334587097168, "global_step": 253708, "epoch": 1510} {"train_loss": -12.039807319641113, "global_step": 253709, "epoch": 1510} {"train_loss": -11.697473526000977, "global_step": 253710, "epoch": 1510} {"train_loss": -12.083669662475586, "global_step": 253711, "epoch": 1510} {"train_loss": -10.747296333312988, "global_step": 253712, "epoch": 1510} {"train_loss": -10.805707931518555, "global_step": 253713, "epoch": 1510} {"train_loss": -11.244906425476074, "global_step": 253714, "epoch": 1510} {"train_loss": -11.021944999694824, "global_step": 253715, "epoch": 1510} {"train_loss": -10.151302337646484, "global_step": 253716, "epoch": 1510} {"train_loss": -11.442129135131836, "global_step": 253717, "epoch": 1510} {"train_loss": -11.739294052124023, "global_step": 253718, "epoch": 1510} {"train_loss": -11.472277641296387, "global_step": 253719, "epoch": 1510} {"train_loss": -11.019618034362793, "global_step": 253720, "epoch": 1510} {"train_loss": -11.713802337646484, "global_step": 253721, "epoch": 1510} {"train_loss": -10.794988632202148, "global_step": 253722, "epoch": 1510} {"train_loss": -10.933938980102539, "global_step": 253723, "epoch": 1510} {"train_loss": -11.678847312927246, "global_step": 253724, "epoch": 1510} {"train_loss": -10.208889961242676, "global_step": 253725, "epoch": 1510} {"train_loss": -10.071842193603516, "global_step": 253726, "epoch": 1510} {"train_loss": -11.643975257873535, "global_step": 253727, "epoch": 1510} {"train_loss": -9.691604614257812, "global_step": 253728, "epoch": 1510} {"train_loss": -11.408819198608398, "global_step": 253729, "epoch": 1510} {"train_loss": -8.461660385131836, "global_step": 253730, "epoch": 1510} {"train_loss": -9.821100234985352, "global_step": 253731, "epoch": 1510} {"train_loss": -9.531044006347656, "global_step": 253732, "epoch": 1510} {"train_loss": -10.697418212890625, "global_step": 253733, "epoch": 1510} {"train_loss": -10.432738304138184, "global_step": 253734, "epoch": 1510} {"train_loss": -10.921554565429688, "global_step": 253735, "epoch": 1510} {"train_loss": -10.418464660644531, "global_step": 253736, "epoch": 1510} {"train_loss": -10.934967041015625, "global_step": 253737, "epoch": 1510} {"train_loss": -11.000558853149414, "global_step": 253738, "epoch": 1510} {"train_loss": -9.450908660888672, "global_step": 253739, "epoch": 1510} {"train_loss": -11.20225715637207, "global_step": 253740, "epoch": 1510} {"train_loss": -9.423900604248047, "global_step": 253741, "epoch": 1510} {"train_loss": -10.974576950073242, "global_step": 253742, "epoch": 1510} {"train_loss": -10.216733932495117, "global_step": 253743, "epoch": 1510} {"train_loss": -10.024917602539062, "global_step": 253744, "epoch": 1510} {"train_loss": -11.052812576293945, "global_step": 253745, "epoch": 1510} {"train_loss": -9.636480331420898, "global_step": 253746, "epoch": 1510} {"train_loss": -10.531671524047852, "global_step": 253747, "epoch": 1510} {"train_loss": -11.74468994140625, "global_step": 253748, "epoch": 1510} {"train_loss": -10.183622360229492, "global_step": 253749, "epoch": 1510} {"train_loss": -10.869671821594238, "global_step": 253750, "epoch": 1510} {"train_loss": -11.200769424438477, "global_step": 253751, "epoch": 1510} {"train_loss": -10.683109283447266, "global_step": 253752, "epoch": 1510} {"train_loss": -10.62840747833252, "global_step": 253753, "epoch": 1510} {"train_loss": -11.627298355102539, "global_step": 253754, "epoch": 1510} {"train_loss": -10.734484672546387, "global_step": 253755, "epoch": 1510} {"train_loss": -11.036609649658203, "global_step": 253756, "epoch": 1510} {"train_loss": -11.595126152038574, "global_step": 253757, "epoch": 1510} {"train_loss": -11.34880256652832, "global_step": 253758, "epoch": 1510} {"train_loss": -10.906184196472168, "global_step": 253759, "epoch": 1510} {"train_loss": -11.17683219909668, "global_step": 253760, "epoch": 1510} {"train_loss": -10.989992141723633, "global_step": 253761, "epoch": 1510} {"train_loss": -10.30328369140625, "global_step": 253762, "epoch": 1510} {"train_loss": -11.417741775512695, "global_step": 253763, "epoch": 1510} {"train_loss": -10.568800926208496, "global_step": 253764, "epoch": 1510} {"train_loss": -11.144628524780273, "global_step": 253765, "epoch": 1510} {"train_loss": -11.385232925415039, "global_step": 253766, "epoch": 1510} {"train_loss": -11.07322883605957, "global_step": 253767, "epoch": 1510} {"train_loss": -10.54126262664795, "global_step": 253768, "epoch": 1510} {"train_loss": -11.519255638122559, "global_step": 253769, "epoch": 1510} {"train_loss": -10.846115112304688, "global_step": 253770, "epoch": 1510} {"train_loss": -10.694192886352539, "global_step": 253771, "epoch": 1510} {"train_loss": -11.45179271697998, "global_step": 253772, "epoch": 1510} {"train_loss": -10.748701095581055, "global_step": 253773, "epoch": 1510} {"train_loss": -11.325399398803711, "global_step": 253774, "epoch": 1510} {"train_loss": -11.448602676391602, "global_step": 253775, "epoch": 1510} {"train_loss": -10.995445251464844, "global_step": 253776, "epoch": 1510} {"train_loss": -11.147422790527344, "global_step": 253777, "epoch": 1510} {"train_loss": -11.174257278442383, "global_step": 253778, "epoch": 1510} {"train_loss": -11.323453903198242, "global_step": 253779, "epoch": 1510} {"train_loss": -11.217426300048828, "global_step": 253780, "epoch": 1510} {"train_loss": -11.577417373657227, "global_step": 253781, "epoch": 1510} {"train_loss": -11.740169525146484, "global_step": 253782, "epoch": 1510} {"train_loss": -11.41299057006836, "global_step": 253783, "epoch": 1510} {"train_loss": -11.662278175354004, "global_step": 253784, "epoch": 1510} {"train_loss": -11.610992431640625, "global_step": 253785, "epoch": 1510} {"train_loss": -11.623687744140625, "global_step": 253786, "epoch": 1510} {"train_loss": -11.570185661315918, "global_step": 253787, "epoch": 1510} {"train_loss": -11.74422836303711, "global_step": 253788, "epoch": 1510} {"train_loss": -11.65450382232666, "global_step": 253789, "epoch": 1510} {"train_loss": -11.779088020324707, "global_step": 253790, "epoch": 1510} {"train_loss": -11.738807678222656, "global_step": 253791, "epoch": 1510} {"train_loss": -11.780597686767578, "global_step": 253792, "epoch": 1510} {"train_loss": -11.668960571289062, "global_step": 253793, "epoch": 1510} {"train_loss": -11.6436185836792, "global_step": 253794, "epoch": 1510} {"train_loss": -11.832528114318848, "global_step": 253795, "epoch": 1510} {"train_loss": -11.979896545410156, "global_step": 253796, "epoch": 1510} {"train_loss": -11.694445610046387, "global_step": 253797, "epoch": 1510} {"train_loss": -11.737156867980957, "global_step": 253798, "epoch": 1510} {"train_loss": -11.903759956359863, "global_step": 253799, "epoch": 1510} {"train_loss": -11.878119468688965, "global_step": 253800, "epoch": 1510} {"train_loss": -11.953910827636719, "global_step": 253801, "epoch": 1510} {"train_loss": -11.950139999389648, "global_step": 253802, "epoch": 1510} {"train_loss": -11.968894958496094, "global_step": 253803, "epoch": 1510} {"train_loss": -11.935358047485352, "global_step": 253804, "epoch": 1510} {"train_loss": -12.006607055664062, "global_step": 253805, "epoch": 1510} {"train_loss": -12.040496826171875, "global_step": 253806, "epoch": 1510} {"train_loss": -11.890277862548828, "global_step": 253807, "epoch": 1510} {"train_loss": -12.094073295593262, "global_step": 253808, "epoch": 1510} {"train_loss": -12.05179500579834, "global_step": 253809, "epoch": 1510} {"train_loss": -12.068862915039062, "global_step": 253810, "epoch": 1510} {"train_loss": -12.11549186706543, "global_step": 253811, "epoch": 1510} {"train_loss": -12.00661849975586, "global_step": 253812, "epoch": 1510} {"train_loss": -12.076566696166992, "global_step": 253813, "epoch": 1510} {"train_loss": -12.062843322753906, "global_step": 253814, "epoch": 1510} {"train_loss": -12.20555591583252, "global_step": 253815, "epoch": 1510} {"train_loss": -12.101081848144531, "global_step": 253816, "epoch": 1510} {"train_loss": -12.279980659484863, "global_step": 253817, "epoch": 1510} {"train_loss": -12.125456809997559, "global_step": 253818, "epoch": 1510} {"train_loss": -12.188231468200684, "global_step": 253819, "epoch": 1510} {"train_loss": -12.13247299194336, "global_step": 253820, "epoch": 1510} {"train_loss": -12.037701606750488, "global_step": 253821, "epoch": 1510} {"train_loss": -12.124900817871094, "global_step": 253822, "epoch": 1510} {"train_loss": -12.229607582092285, "global_step": 253823, "epoch": 1510} {"train_loss": -12.091341972351074, "global_step": 253824, "epoch": 1510} {"train_loss": -12.184053421020508, "global_step": 253825, "epoch": 1510} {"train_loss": -12.120046615600586, "global_step": 253826, "epoch": 1510} {"train_loss": -12.277372360229492, "global_step": 253827, "epoch": 1510} {"train_loss": -12.156692504882812, "global_step": 253828, "epoch": 1510} {"train_loss": -12.219831466674805, "global_step": 253829, "epoch": 1510} {"train_loss": -12.203590393066406, "global_step": 253830, "epoch": 1510} {"train_loss": -12.143108367919922, "global_step": 253831, "epoch": 1510} {"train_loss": -11.987434387207031, "global_step": 253832, "epoch": 1510} {"train_loss": -12.035980224609375, "global_step": 253833, "epoch": 1510} {"train_loss": -12.218114852905273, "global_step": 253834, "epoch": 1510} {"train_loss": -12.26431655883789, "global_step": 253835, "epoch": 1510} {"train_loss": -12.008798599243164, "global_step": 253836, "epoch": 1510} {"train_loss": -12.184860229492188, "global_step": 253837, "epoch": 1510} {"train_loss": -12.40816879272461, "global_step": 253838, "epoch": 1510} {"train_loss": -12.183937072753906, "global_step": 253839, "epoch": 1510} {"train_loss": -11.981557846069336, "global_step": 253840, "epoch": 1510} {"train_loss": -11.439733505249023, "global_step": 253841, "epoch": 1510} {"train_loss": -11.065948486328125, "global_step": 253842, "epoch": 1510} {"train_loss": -11.490699768066406, "global_step": 253843, "epoch": 1510} {"train_loss": -11.92531967163086, "global_step": 253844, "epoch": 1510} {"train_loss": -11.940387725830078, "global_step": 253845, "epoch": 1510} {"train_loss": -11.500518798828125, "global_step": 253846, "epoch": 1510} {"train_loss": -11.4701292855399, "global_step": 253847, "epoch": 1510, "val_loss": 269430.3125, "train_action_mse_error": 5.614803314208984} {"train_loss": -9.721664428710938, "global_step": 253848, "epoch": 1511} {"train_loss": -11.443782806396484, "global_step": 253849, "epoch": 1511} {"train_loss": -10.114315032958984, "global_step": 253850, "epoch": 1511} {"train_loss": -10.405168533325195, "global_step": 253851, "epoch": 1511} {"train_loss": -10.330888748168945, "global_step": 253852, "epoch": 1511} {"train_loss": -9.896415710449219, "global_step": 253853, "epoch": 1511} {"train_loss": -9.330673217773438, "global_step": 253854, "epoch": 1511} {"train_loss": -8.527715682983398, "global_step": 253855, "epoch": 1511} {"train_loss": -10.914353370666504, "global_step": 253856, "epoch": 1511} {"train_loss": -9.047000885009766, "global_step": 253857, "epoch": 1511} {"train_loss": -9.302248001098633, "global_step": 253858, "epoch": 1511} {"train_loss": -9.68533706665039, "global_step": 253859, "epoch": 1511} {"train_loss": -9.577693939208984, "global_step": 253860, "epoch": 1511} {"train_loss": -8.566282272338867, "global_step": 253861, "epoch": 1511} {"train_loss": -9.00952434539795, "global_step": 253862, "epoch": 1511} {"train_loss": -8.86396312713623, "global_step": 253863, "epoch": 1511} {"train_loss": -10.975346565246582, "global_step": 253864, "epoch": 1511} {"train_loss": -9.264720916748047, "global_step": 253865, "epoch": 1511} {"train_loss": -9.50901985168457, "global_step": 253866, "epoch": 1511} {"train_loss": -10.373062133789062, "global_step": 253867, "epoch": 1511} {"train_loss": -9.816723823547363, "global_step": 253868, "epoch": 1511} {"train_loss": -9.886797904968262, "global_step": 253869, "epoch": 1511} {"train_loss": -10.225645065307617, "global_step": 253870, "epoch": 1511} {"train_loss": -10.0359525680542, "global_step": 253871, "epoch": 1511} {"train_loss": -9.958881378173828, "global_step": 253872, "epoch": 1511} {"train_loss": -10.771442413330078, "global_step": 253873, "epoch": 1511} {"train_loss": -10.070748329162598, "global_step": 253874, "epoch": 1511} {"train_loss": -10.16025161743164, "global_step": 253875, "epoch": 1511} {"train_loss": -11.013822555541992, "global_step": 253876, "epoch": 1511} {"train_loss": -10.292547225952148, "global_step": 253877, "epoch": 1511} {"train_loss": -11.025035858154297, "global_step": 253878, "epoch": 1511} {"train_loss": -10.583897590637207, "global_step": 253879, "epoch": 1511} {"train_loss": -10.666271209716797, "global_step": 253880, "epoch": 1511} {"train_loss": -11.122352600097656, "global_step": 253881, "epoch": 1511} {"train_loss": -11.242305755615234, "global_step": 253882, "epoch": 1511} {"train_loss": -11.178140640258789, "global_step": 253883, "epoch": 1511} {"train_loss": -10.949050903320312, "global_step": 253884, "epoch": 1511} {"train_loss": -11.147613525390625, "global_step": 253885, "epoch": 1511} {"train_loss": -10.785516738891602, "global_step": 253886, "epoch": 1511} {"train_loss": -10.950783729553223, "global_step": 253887, "epoch": 1511} {"train_loss": -10.757064819335938, "global_step": 253888, "epoch": 1511} {"train_loss": -11.19798755645752, "global_step": 253889, "epoch": 1511} {"train_loss": -11.04727554321289, "global_step": 253890, "epoch": 1511} {"train_loss": -10.869880676269531, "global_step": 253891, "epoch": 1511} {"train_loss": -11.286901473999023, "global_step": 253892, "epoch": 1511} {"train_loss": -11.177026748657227, "global_step": 253893, "epoch": 1511} {"train_loss": -11.042899131774902, "global_step": 253894, "epoch": 1511} {"train_loss": -11.198762893676758, "global_step": 253895, "epoch": 1511} {"train_loss": -11.32175064086914, "global_step": 253896, "epoch": 1511} {"train_loss": -11.305011749267578, "global_step": 253897, "epoch": 1511} {"train_loss": -11.432022094726562, "global_step": 253898, "epoch": 1511} {"train_loss": -11.549211502075195, "global_step": 253899, "epoch": 1511} {"train_loss": -11.552909851074219, "global_step": 253900, "epoch": 1511} {"train_loss": -11.700439453125, "global_step": 253901, "epoch": 1511} {"train_loss": -11.667678833007812, "global_step": 253902, "epoch": 1511} {"train_loss": -11.406326293945312, "global_step": 253903, "epoch": 1511} {"train_loss": -11.835589408874512, "global_step": 253904, "epoch": 1511} {"train_loss": -11.7864990234375, "global_step": 253905, "epoch": 1511} {"train_loss": -11.71203899383545, "global_step": 253906, "epoch": 1511} {"train_loss": -11.579364776611328, "global_step": 253907, "epoch": 1511} {"train_loss": -11.788524627685547, "global_step": 253908, "epoch": 1511} {"train_loss": -11.574336051940918, "global_step": 253909, "epoch": 1511} {"train_loss": -11.814495086669922, "global_step": 253910, "epoch": 1511} {"train_loss": -11.599411010742188, "global_step": 253911, "epoch": 1511} {"train_loss": -11.640146255493164, "global_step": 253912, "epoch": 1511} {"train_loss": -11.858272552490234, "global_step": 253913, "epoch": 1511} {"train_loss": -11.655682563781738, "global_step": 253914, "epoch": 1511} {"train_loss": -11.701763153076172, "global_step": 253915, "epoch": 1511} {"train_loss": -11.839738845825195, "global_step": 253916, "epoch": 1511} {"train_loss": -11.781011581420898, "global_step": 253917, "epoch": 1511} {"train_loss": -11.831541061401367, "global_step": 253918, "epoch": 1511} {"train_loss": -11.977755546569824, "global_step": 253919, "epoch": 1511} {"train_loss": -11.743995666503906, "global_step": 253920, "epoch": 1511} {"train_loss": -11.899385452270508, "global_step": 253921, "epoch": 1511} {"train_loss": -11.875272750854492, "global_step": 253922, "epoch": 1511} {"train_loss": -11.815607070922852, "global_step": 253923, "epoch": 1511} {"train_loss": -11.832897186279297, "global_step": 253924, "epoch": 1511} {"train_loss": -11.832979202270508, "global_step": 253925, "epoch": 1511} {"train_loss": -11.806756973266602, "global_step": 253926, "epoch": 1511} {"train_loss": -11.975691795349121, "global_step": 253927, "epoch": 1511} {"train_loss": -11.79507827758789, "global_step": 253928, "epoch": 1511} {"train_loss": -11.992280960083008, "global_step": 253929, "epoch": 1511} {"train_loss": -11.838062286376953, "global_step": 253930, "epoch": 1511} {"train_loss": -11.915786743164062, "global_step": 253931, "epoch": 1511} {"train_loss": -11.880859375, "global_step": 253932, "epoch": 1511} {"train_loss": -12.18267822265625, "global_step": 253933, "epoch": 1511} {"train_loss": -11.77365493774414, "global_step": 253934, "epoch": 1511} {"train_loss": -12.093158721923828, "global_step": 253935, "epoch": 1511} {"train_loss": -12.215402603149414, "global_step": 253936, "epoch": 1511} {"train_loss": -11.889904975891113, "global_step": 253937, "epoch": 1511} {"train_loss": -11.942483901977539, "global_step": 253938, "epoch": 1511} {"train_loss": -12.0020751953125, "global_step": 253939, "epoch": 1511} {"train_loss": -12.117874145507812, "global_step": 253940, "epoch": 1511} {"train_loss": -12.145119667053223, "global_step": 253941, "epoch": 1511} {"train_loss": -11.931804656982422, "global_step": 253942, "epoch": 1511} {"train_loss": -11.95742416381836, "global_step": 253943, "epoch": 1511} {"train_loss": -12.222675323486328, "global_step": 253944, "epoch": 1511} {"train_loss": -12.143630027770996, "global_step": 253945, "epoch": 1511} {"train_loss": -12.05812931060791, "global_step": 253946, "epoch": 1511} {"train_loss": -12.10621452331543, "global_step": 253947, "epoch": 1511} {"train_loss": -11.864969253540039, "global_step": 253948, "epoch": 1511} {"train_loss": -12.274520874023438, "global_step": 253949, "epoch": 1511} {"train_loss": -12.053811073303223, "global_step": 253950, "epoch": 1511} {"train_loss": -12.138083457946777, "global_step": 253951, "epoch": 1511} {"train_loss": -11.982006072998047, "global_step": 253952, "epoch": 1511} {"train_loss": -12.214723587036133, "global_step": 253953, "epoch": 1511} {"train_loss": -12.238899230957031, "global_step": 253954, "epoch": 1511} {"train_loss": -12.266193389892578, "global_step": 253955, "epoch": 1511} {"train_loss": -12.100972175598145, "global_step": 253956, "epoch": 1511} {"train_loss": -12.280363082885742, "global_step": 253957, "epoch": 1511} {"train_loss": -12.207061767578125, "global_step": 253958, "epoch": 1511} {"train_loss": -12.084871292114258, "global_step": 253959, "epoch": 1511} {"train_loss": -12.167625427246094, "global_step": 253960, "epoch": 1511} {"train_loss": -12.459604263305664, "global_step": 253961, "epoch": 1511} {"train_loss": -12.24458122253418, "global_step": 253962, "epoch": 1511} {"train_loss": -12.10097885131836, "global_step": 253963, "epoch": 1511} {"train_loss": -12.237369537353516, "global_step": 253964, "epoch": 1511} {"train_loss": -12.320077896118164, "global_step": 253965, "epoch": 1511} {"train_loss": -12.11927604675293, "global_step": 253966, "epoch": 1511} {"train_loss": -12.139225006103516, "global_step": 253967, "epoch": 1511} {"train_loss": -11.758262634277344, "global_step": 253968, "epoch": 1511} {"train_loss": -11.840124130249023, "global_step": 253969, "epoch": 1511} {"train_loss": -11.919448852539062, "global_step": 253970, "epoch": 1511} {"train_loss": -11.933658599853516, "global_step": 253971, "epoch": 1511} {"train_loss": -12.164262771606445, "global_step": 253972, "epoch": 1511} {"train_loss": -11.898509979248047, "global_step": 253973, "epoch": 1511} {"train_loss": -12.136690139770508, "global_step": 253974, "epoch": 1511} {"train_loss": -11.831022262573242, "global_step": 253975, "epoch": 1511} {"train_loss": -11.242919921875, "global_step": 253976, "epoch": 1511} {"train_loss": -11.031759262084961, "global_step": 253977, "epoch": 1511} {"train_loss": -11.774354934692383, "global_step": 253978, "epoch": 1511} {"train_loss": -11.965217590332031, "global_step": 253979, "epoch": 1511} {"train_loss": -10.730042457580566, "global_step": 253980, "epoch": 1511} {"train_loss": -11.00474739074707, "global_step": 253981, "epoch": 1511} {"train_loss": -11.854072570800781, "global_step": 253982, "epoch": 1511} {"train_loss": -11.46638011932373, "global_step": 253983, "epoch": 1511} {"train_loss": -11.48466682434082, "global_step": 253984, "epoch": 1511} {"train_loss": -11.24268913269043, "global_step": 253985, "epoch": 1511} {"train_loss": -11.122383117675781, "global_step": 253986, "epoch": 1511} {"train_loss": -10.564870834350586, "global_step": 253987, "epoch": 1511} {"train_loss": -11.710329055786133, "global_step": 253988, "epoch": 1511} {"train_loss": -10.015085220336914, "global_step": 253989, "epoch": 1511} {"train_loss": -11.206570625305176, "global_step": 253990, "epoch": 1511} {"train_loss": -11.212858200073242, "global_step": 253991, "epoch": 1511} {"train_loss": -11.131300926208496, "global_step": 253992, "epoch": 1511} {"train_loss": -11.424559593200684, "global_step": 253993, "epoch": 1511} {"train_loss": -11.074389457702637, "global_step": 253994, "epoch": 1511} {"train_loss": -11.624311447143555, "global_step": 253995, "epoch": 1511} {"train_loss": -11.39673137664795, "global_step": 253996, "epoch": 1511} {"train_loss": -11.987048149108887, "global_step": 253997, "epoch": 1511} {"train_loss": -11.688141822814941, "global_step": 253998, "epoch": 1511} {"train_loss": -11.545781135559082, "global_step": 253999, "epoch": 1511} {"train_loss": -11.241536140441895, "global_step": 254000, "epoch": 1511} {"train_loss": -11.651468276977539, "global_step": 254001, "epoch": 1511} {"train_loss": -11.361207962036133, "global_step": 254002, "epoch": 1511} {"train_loss": -11.658782958984375, "global_step": 254003, "epoch": 1511} {"train_loss": -11.181604385375977, "global_step": 254004, "epoch": 1511} {"train_loss": -11.582496643066406, "global_step": 254005, "epoch": 1511} {"train_loss": -11.080291748046875, "global_step": 254006, "epoch": 1511} {"train_loss": -11.933600425720215, "global_step": 254007, "epoch": 1511} {"train_loss": -11.287498474121094, "global_step": 254008, "epoch": 1511} {"train_loss": -11.307991027832031, "global_step": 254009, "epoch": 1511} {"train_loss": -10.608673095703125, "global_step": 254010, "epoch": 1511} {"train_loss": -11.325810432434082, "global_step": 254011, "epoch": 1511} {"train_loss": -11.540257453918457, "global_step": 254012, "epoch": 1511} {"train_loss": -10.977042198181152, "global_step": 254013, "epoch": 1511} {"train_loss": -11.582991600036621, "global_step": 254014, "epoch": 1511} {"train_loss": -11.325231597537087, "global_step": 254015, "epoch": 1511, "val_loss": 266340.25} {"train_loss": -11.619171142578125, "global_step": 254016, "epoch": 1512} {"train_loss": -11.51883316040039, "global_step": 254017, "epoch": 1512} {"train_loss": -11.88583755493164, "global_step": 254018, "epoch": 1512} {"train_loss": -11.685317039489746, "global_step": 254019, "epoch": 1512} {"train_loss": -11.398025512695312, "global_step": 254020, "epoch": 1512} {"train_loss": -11.61351490020752, "global_step": 254021, "epoch": 1512} {"train_loss": -11.732860565185547, "global_step": 254022, "epoch": 1512} {"train_loss": -11.360799789428711, "global_step": 254023, "epoch": 1512} {"train_loss": -11.65469741821289, "global_step": 254024, "epoch": 1512} {"train_loss": -11.589761734008789, "global_step": 254025, "epoch": 1512} {"train_loss": -11.635777473449707, "global_step": 254026, "epoch": 1512} {"train_loss": -11.392489433288574, "global_step": 254027, "epoch": 1512} {"train_loss": -11.111743927001953, "global_step": 254028, "epoch": 1512} {"train_loss": -11.571319580078125, "global_step": 254029, "epoch": 1512} {"train_loss": -11.30713176727295, "global_step": 254030, "epoch": 1512} {"train_loss": -11.7103853225708, "global_step": 254031, "epoch": 1512} {"train_loss": -11.027307510375977, "global_step": 254032, "epoch": 1512} {"train_loss": -11.743645668029785, "global_step": 254033, "epoch": 1512} {"train_loss": -10.71714973449707, "global_step": 254034, "epoch": 1512} {"train_loss": -10.898479461669922, "global_step": 254035, "epoch": 1512} {"train_loss": -11.678251266479492, "global_step": 254036, "epoch": 1512} {"train_loss": -10.84445858001709, "global_step": 254037, "epoch": 1512} {"train_loss": -11.88294792175293, "global_step": 254038, "epoch": 1512} {"train_loss": -10.671680450439453, "global_step": 254039, "epoch": 1512} {"train_loss": -11.753008842468262, "global_step": 254040, "epoch": 1512} {"train_loss": -10.991355895996094, "global_step": 254041, "epoch": 1512} {"train_loss": -11.435602188110352, "global_step": 254042, "epoch": 1512} {"train_loss": -11.488208770751953, "global_step": 254043, "epoch": 1512} {"train_loss": -11.084914207458496, "global_step": 254044, "epoch": 1512} {"train_loss": -11.615111351013184, "global_step": 254045, "epoch": 1512} {"train_loss": -11.298766136169434, "global_step": 254046, "epoch": 1512} {"train_loss": -11.50169563293457, "global_step": 254047, "epoch": 1512} {"train_loss": -11.407325744628906, "global_step": 254048, "epoch": 1512} {"train_loss": -11.57893180847168, "global_step": 254049, "epoch": 1512} {"train_loss": -11.647248268127441, "global_step": 254050, "epoch": 1512} {"train_loss": -11.636774063110352, "global_step": 254051, "epoch": 1512} {"train_loss": -11.704267501831055, "global_step": 254052, "epoch": 1512} {"train_loss": -11.951650619506836, "global_step": 254053, "epoch": 1512} {"train_loss": -11.661849975585938, "global_step": 254054, "epoch": 1512} {"train_loss": -11.703046798706055, "global_step": 254055, "epoch": 1512} {"train_loss": -11.665185928344727, "global_step": 254056, "epoch": 1512} {"train_loss": -11.983075141906738, "global_step": 254057, "epoch": 1512} {"train_loss": -11.634942054748535, "global_step": 254058, "epoch": 1512} {"train_loss": -11.90143871307373, "global_step": 254059, "epoch": 1512} {"train_loss": -11.867630958557129, "global_step": 254060, "epoch": 1512} {"train_loss": -11.767159461975098, "global_step": 254061, "epoch": 1512} {"train_loss": -11.908905029296875, "global_step": 254062, "epoch": 1512} {"train_loss": -10.92912483215332, "global_step": 254063, "epoch": 1512} {"train_loss": -11.866804122924805, "global_step": 254064, "epoch": 1512} {"train_loss": -11.787363052368164, "global_step": 254065, "epoch": 1512} {"train_loss": -11.6392240524292, "global_step": 254066, "epoch": 1512} {"train_loss": -11.83687686920166, "global_step": 254067, "epoch": 1512} {"train_loss": -11.660951614379883, "global_step": 254068, "epoch": 1512} {"train_loss": -12.012383460998535, "global_step": 254069, "epoch": 1512} {"train_loss": -11.46487808227539, "global_step": 254070, "epoch": 1512} {"train_loss": -11.895200729370117, "global_step": 254071, "epoch": 1512} {"train_loss": -11.617782592773438, "global_step": 254072, "epoch": 1512} {"train_loss": -12.002721786499023, "global_step": 254073, "epoch": 1512} {"train_loss": -11.83103084564209, "global_step": 254074, "epoch": 1512} {"train_loss": -11.360904693603516, "global_step": 254075, "epoch": 1512} {"train_loss": -11.841591835021973, "global_step": 254076, "epoch": 1512} {"train_loss": -11.704582214355469, "global_step": 254077, "epoch": 1512} {"train_loss": -11.921775817871094, "global_step": 254078, "epoch": 1512} {"train_loss": -12.056706428527832, "global_step": 254079, "epoch": 1512} {"train_loss": -12.049765586853027, "global_step": 254080, "epoch": 1512} {"train_loss": -12.005813598632812, "global_step": 254081, "epoch": 1512} {"train_loss": -12.062585830688477, "global_step": 254082, "epoch": 1512} {"train_loss": -11.85014533996582, "global_step": 254083, "epoch": 1512} {"train_loss": -12.076083183288574, "global_step": 254084, "epoch": 1512} {"train_loss": -11.84641170501709, "global_step": 254085, "epoch": 1512} {"train_loss": -11.876388549804688, "global_step": 254086, "epoch": 1512} {"train_loss": -11.74329662322998, "global_step": 254087, "epoch": 1512} {"train_loss": -11.818865776062012, "global_step": 254088, "epoch": 1512} {"train_loss": -12.127477645874023, "global_step": 254089, "epoch": 1512} {"train_loss": -11.712422370910645, "global_step": 254090, "epoch": 1512} {"train_loss": -11.988574981689453, "global_step": 254091, "epoch": 1512} {"train_loss": -11.873231887817383, "global_step": 254092, "epoch": 1512} {"train_loss": -12.110091209411621, "global_step": 254093, "epoch": 1512} {"train_loss": -11.46605110168457, "global_step": 254094, "epoch": 1512} {"train_loss": -11.829497337341309, "global_step": 254095, "epoch": 1512} {"train_loss": -12.00307846069336, "global_step": 254096, "epoch": 1512} {"train_loss": -11.49104118347168, "global_step": 254097, "epoch": 1512} {"train_loss": -11.94964599609375, "global_step": 254098, "epoch": 1512} {"train_loss": -11.893478393554688, "global_step": 254099, "epoch": 1512} {"train_loss": -11.859670639038086, "global_step": 254100, "epoch": 1512} {"train_loss": -11.918956756591797, "global_step": 254101, "epoch": 1512} {"train_loss": -11.582460403442383, "global_step": 254102, "epoch": 1512} {"train_loss": -12.007211685180664, "global_step": 254103, "epoch": 1512} {"train_loss": -11.53136920928955, "global_step": 254104, "epoch": 1512} {"train_loss": -12.096293449401855, "global_step": 254105, "epoch": 1512} {"train_loss": -11.055706977844238, "global_step": 254106, "epoch": 1512} {"train_loss": -11.213701248168945, "global_step": 254107, "epoch": 1512} {"train_loss": -11.507389068603516, "global_step": 254108, "epoch": 1512} {"train_loss": -11.534793853759766, "global_step": 254109, "epoch": 1512} {"train_loss": -11.020135879516602, "global_step": 254110, "epoch": 1512} {"train_loss": -11.636299133300781, "global_step": 254111, "epoch": 1512} {"train_loss": -9.687116622924805, "global_step": 254112, "epoch": 1512} {"train_loss": -10.855403900146484, "global_step": 254113, "epoch": 1512} {"train_loss": -10.03754997253418, "global_step": 254114, "epoch": 1512} {"train_loss": -9.96196460723877, "global_step": 254115, "epoch": 1512} {"train_loss": -10.488550186157227, "global_step": 254116, "epoch": 1512} {"train_loss": -9.910541534423828, "global_step": 254117, "epoch": 1512} {"train_loss": -11.3803129196167, "global_step": 254118, "epoch": 1512} {"train_loss": -10.655198097229004, "global_step": 254119, "epoch": 1512} {"train_loss": -10.802169799804688, "global_step": 254120, "epoch": 1512} {"train_loss": -10.441341400146484, "global_step": 254121, "epoch": 1512} {"train_loss": -11.348119735717773, "global_step": 254122, "epoch": 1512} {"train_loss": -10.901429176330566, "global_step": 254123, "epoch": 1512} {"train_loss": -11.652167320251465, "global_step": 254124, "epoch": 1512} {"train_loss": -10.877897262573242, "global_step": 254125, "epoch": 1512} {"train_loss": -11.392223358154297, "global_step": 254126, "epoch": 1512} {"train_loss": -11.296646118164062, "global_step": 254127, "epoch": 1512} {"train_loss": -10.989986419677734, "global_step": 254128, "epoch": 1512} {"train_loss": -11.092508316040039, "global_step": 254129, "epoch": 1512} {"train_loss": -10.558504104614258, "global_step": 254130, "epoch": 1512} {"train_loss": -11.543581008911133, "global_step": 254131, "epoch": 1512} {"train_loss": -11.055678367614746, "global_step": 254132, "epoch": 1512} {"train_loss": -11.933128356933594, "global_step": 254133, "epoch": 1512} {"train_loss": -11.54928970336914, "global_step": 254134, "epoch": 1512} {"train_loss": -11.655830383300781, "global_step": 254135, "epoch": 1512} {"train_loss": -11.604690551757812, "global_step": 254136, "epoch": 1512} {"train_loss": -11.669897079467773, "global_step": 254137, "epoch": 1512} {"train_loss": -11.535547256469727, "global_step": 254138, "epoch": 1512} {"train_loss": -11.594947814941406, "global_step": 254139, "epoch": 1512} {"train_loss": -11.660380363464355, "global_step": 254140, "epoch": 1512} {"train_loss": -11.922658920288086, "global_step": 254141, "epoch": 1512} {"train_loss": -11.517851829528809, "global_step": 254142, "epoch": 1512} {"train_loss": -12.005949020385742, "global_step": 254143, "epoch": 1512} {"train_loss": -11.222906112670898, "global_step": 254144, "epoch": 1512} {"train_loss": -11.890342712402344, "global_step": 254145, "epoch": 1512} {"train_loss": -11.413430213928223, "global_step": 254146, "epoch": 1512} {"train_loss": -11.626352310180664, "global_step": 254147, "epoch": 1512} {"train_loss": -11.568458557128906, "global_step": 254148, "epoch": 1512} {"train_loss": -11.539061546325684, "global_step": 254149, "epoch": 1512} {"train_loss": -11.71595573425293, "global_step": 254150, "epoch": 1512} {"train_loss": -11.633821487426758, "global_step": 254151, "epoch": 1512} {"train_loss": -11.359004974365234, "global_step": 254152, "epoch": 1512} {"train_loss": -11.94583511352539, "global_step": 254153, "epoch": 1512} {"train_loss": -11.390768051147461, "global_step": 254154, "epoch": 1512} {"train_loss": -11.704080581665039, "global_step": 254155, "epoch": 1512} {"train_loss": -11.673419952392578, "global_step": 254156, "epoch": 1512} {"train_loss": -11.706072807312012, "global_step": 254157, "epoch": 1512} {"train_loss": -11.813956260681152, "global_step": 254158, "epoch": 1512} {"train_loss": -11.493330001831055, "global_step": 254159, "epoch": 1512} {"train_loss": -11.684661865234375, "global_step": 254160, "epoch": 1512} {"train_loss": -11.80482006072998, "global_step": 254161, "epoch": 1512} {"train_loss": -11.565251350402832, "global_step": 254162, "epoch": 1512} {"train_loss": -11.803208351135254, "global_step": 254163, "epoch": 1512} {"train_loss": -11.175498962402344, "global_step": 254164, "epoch": 1512} {"train_loss": -11.946394920349121, "global_step": 254165, "epoch": 1512} {"train_loss": -11.61582088470459, "global_step": 254166, "epoch": 1512} {"train_loss": -11.628913879394531, "global_step": 254167, "epoch": 1512} {"train_loss": -12.025896072387695, "global_step": 254168, "epoch": 1512} {"train_loss": -11.476005554199219, "global_step": 254169, "epoch": 1512} {"train_loss": -12.009344100952148, "global_step": 254170, "epoch": 1512} {"train_loss": -11.9482421875, "global_step": 254171, "epoch": 1512} {"train_loss": -11.613094329833984, "global_step": 254172, "epoch": 1512} {"train_loss": -11.988567352294922, "global_step": 254173, "epoch": 1512} {"train_loss": -11.834566116333008, "global_step": 254174, "epoch": 1512} {"train_loss": -11.855428695678711, "global_step": 254175, "epoch": 1512} {"train_loss": -11.934549331665039, "global_step": 254176, "epoch": 1512} {"train_loss": -11.864124298095703, "global_step": 254177, "epoch": 1512} {"train_loss": -11.903732299804688, "global_step": 254178, "epoch": 1512} {"train_loss": -11.854649543762207, "global_step": 254179, "epoch": 1512} {"train_loss": -12.008455276489258, "global_step": 254180, "epoch": 1512} {"train_loss": -11.780012130737305, "global_step": 254181, "epoch": 1512} {"train_loss": -11.962444305419922, "global_step": 254182, "epoch": 1512} {"train_loss": -11.56059523991176, "global_step": 254183, "epoch": 1512, "val_loss": 272283.75} {"train_loss": -11.81519889831543, "global_step": 254184, "epoch": 1513} {"train_loss": -11.975912094116211, "global_step": 254185, "epoch": 1513} {"train_loss": -11.857087135314941, "global_step": 254186, "epoch": 1513} {"train_loss": -12.081111907958984, "global_step": 254187, "epoch": 1513} {"train_loss": -11.751008987426758, "global_step": 254188, "epoch": 1513} {"train_loss": -11.843145370483398, "global_step": 254189, "epoch": 1513} {"train_loss": -12.003457069396973, "global_step": 254190, "epoch": 1513} {"train_loss": -11.844964027404785, "global_step": 254191, "epoch": 1513} {"train_loss": -12.06043815612793, "global_step": 254192, "epoch": 1513} {"train_loss": -11.968427658081055, "global_step": 254193, "epoch": 1513} {"train_loss": -12.073103904724121, "global_step": 254194, "epoch": 1513} {"train_loss": -12.16928482055664, "global_step": 254195, "epoch": 1513} {"train_loss": -11.741657257080078, "global_step": 254196, "epoch": 1513} {"train_loss": -12.069076538085938, "global_step": 254197, "epoch": 1513} {"train_loss": -11.83360481262207, "global_step": 254198, "epoch": 1513} {"train_loss": -11.962444305419922, "global_step": 254199, "epoch": 1513} {"train_loss": -12.042007446289062, "global_step": 254200, "epoch": 1513} {"train_loss": -12.171167373657227, "global_step": 254201, "epoch": 1513} {"train_loss": -12.068181991577148, "global_step": 254202, "epoch": 1513} {"train_loss": -12.068790435791016, "global_step": 254203, "epoch": 1513} {"train_loss": -12.248088836669922, "global_step": 254204, "epoch": 1513} {"train_loss": -12.099542617797852, "global_step": 254205, "epoch": 1513} {"train_loss": -12.024148941040039, "global_step": 254206, "epoch": 1513} {"train_loss": -12.008787155151367, "global_step": 254207, "epoch": 1513} {"train_loss": -12.25013256072998, "global_step": 254208, "epoch": 1513} {"train_loss": -12.039870262145996, "global_step": 254209, "epoch": 1513} {"train_loss": -12.215608596801758, "global_step": 254210, "epoch": 1513} {"train_loss": -11.877738952636719, "global_step": 254211, "epoch": 1513} {"train_loss": -12.013442993164062, "global_step": 254212, "epoch": 1513} {"train_loss": -11.910089492797852, "global_step": 254213, "epoch": 1513} {"train_loss": -11.481134414672852, "global_step": 254214, "epoch": 1513} {"train_loss": -11.311136245727539, "global_step": 254215, "epoch": 1513} {"train_loss": -11.616059303283691, "global_step": 254216, "epoch": 1513} {"train_loss": -11.763702392578125, "global_step": 254217, "epoch": 1513} {"train_loss": -11.397651672363281, "global_step": 254218, "epoch": 1513} {"train_loss": -11.635193824768066, "global_step": 254219, "epoch": 1513} {"train_loss": -11.177671432495117, "global_step": 254220, "epoch": 1513} {"train_loss": -11.090848922729492, "global_step": 254221, "epoch": 1513} {"train_loss": -11.174352645874023, "global_step": 254222, "epoch": 1513} {"train_loss": -12.034366607666016, "global_step": 254223, "epoch": 1513} {"train_loss": -10.713531494140625, "global_step": 254224, "epoch": 1513} {"train_loss": -12.180015563964844, "global_step": 254225, "epoch": 1513} {"train_loss": -10.560239791870117, "global_step": 254226, "epoch": 1513} {"train_loss": -11.400009155273438, "global_step": 254227, "epoch": 1513} {"train_loss": -11.296749114990234, "global_step": 254228, "epoch": 1513} {"train_loss": -10.416147232055664, "global_step": 254229, "epoch": 1513} {"train_loss": -11.216609001159668, "global_step": 254230, "epoch": 1513} {"train_loss": -10.086738586425781, "global_step": 254231, "epoch": 1513} {"train_loss": -10.540742874145508, "global_step": 254232, "epoch": 1513} {"train_loss": -11.052282333374023, "global_step": 254233, "epoch": 1513} {"train_loss": -10.631961822509766, "global_step": 254234, "epoch": 1513} {"train_loss": -11.445333480834961, "global_step": 254235, "epoch": 1513} {"train_loss": -10.680610656738281, "global_step": 254236, "epoch": 1513} {"train_loss": -11.3311767578125, "global_step": 254237, "epoch": 1513} {"train_loss": -11.408038139343262, "global_step": 254238, "epoch": 1513} {"train_loss": -11.199329376220703, "global_step": 254239, "epoch": 1513} {"train_loss": -11.587258338928223, "global_step": 254240, "epoch": 1513} {"train_loss": -10.64608383178711, "global_step": 254241, "epoch": 1513} {"train_loss": -11.673349380493164, "global_step": 254242, "epoch": 1513} {"train_loss": -10.637763023376465, "global_step": 254243, "epoch": 1513} {"train_loss": -10.44202995300293, "global_step": 254244, "epoch": 1513} {"train_loss": -11.045576095581055, "global_step": 254245, "epoch": 1513} {"train_loss": -10.685113906860352, "global_step": 254246, "epoch": 1513} {"train_loss": -10.876307487487793, "global_step": 254247, "epoch": 1513} {"train_loss": -11.046670913696289, "global_step": 254248, "epoch": 1513} {"train_loss": -11.462987899780273, "global_step": 254249, "epoch": 1513} {"train_loss": -10.935400009155273, "global_step": 254250, "epoch": 1513} {"train_loss": -11.76719856262207, "global_step": 254251, "epoch": 1513} {"train_loss": -11.475852966308594, "global_step": 254252, "epoch": 1513} {"train_loss": -11.50235652923584, "global_step": 254253, "epoch": 1513} {"train_loss": -11.604928970336914, "global_step": 254254, "epoch": 1513} {"train_loss": -11.515131950378418, "global_step": 254255, "epoch": 1513} {"train_loss": -11.272734642028809, "global_step": 254256, "epoch": 1513} {"train_loss": -11.766118049621582, "global_step": 254257, "epoch": 1513} {"train_loss": -11.983826637268066, "global_step": 254258, "epoch": 1513} {"train_loss": -11.718389511108398, "global_step": 254259, "epoch": 1513} {"train_loss": -11.759256362915039, "global_step": 254260, "epoch": 1513} {"train_loss": -11.886308670043945, "global_step": 254261, "epoch": 1513} {"train_loss": -11.97161865234375, "global_step": 254262, "epoch": 1513} {"train_loss": -11.815988540649414, "global_step": 254263, "epoch": 1513} {"train_loss": -11.798368453979492, "global_step": 254264, "epoch": 1513} {"train_loss": -11.87224006652832, "global_step": 254265, "epoch": 1513} {"train_loss": -11.936049461364746, "global_step": 254266, "epoch": 1513} {"train_loss": -12.014001846313477, "global_step": 254267, "epoch": 1513} {"train_loss": -12.173377990722656, "global_step": 254268, "epoch": 1513} {"train_loss": -11.820001602172852, "global_step": 254269, "epoch": 1513} {"train_loss": -11.968940734863281, "global_step": 254270, "epoch": 1513} {"train_loss": -11.949270248413086, "global_step": 254271, "epoch": 1513} {"train_loss": -11.730047225952148, "global_step": 254272, "epoch": 1513} {"train_loss": -12.02362060546875, "global_step": 254273, "epoch": 1513} {"train_loss": -11.905803680419922, "global_step": 254274, "epoch": 1513} {"train_loss": -11.79281997680664, "global_step": 254275, "epoch": 1513} {"train_loss": -12.012516021728516, "global_step": 254276, "epoch": 1513} {"train_loss": -11.909673690795898, "global_step": 254277, "epoch": 1513} {"train_loss": -11.944156646728516, "global_step": 254278, "epoch": 1513} {"train_loss": -12.110833168029785, "global_step": 254279, "epoch": 1513} {"train_loss": -11.92049789428711, "global_step": 254280, "epoch": 1513} {"train_loss": -12.113798141479492, "global_step": 254281, "epoch": 1513} {"train_loss": -11.896068572998047, "global_step": 254282, "epoch": 1513} {"train_loss": -11.883970260620117, "global_step": 254283, "epoch": 1513} {"train_loss": -11.878753662109375, "global_step": 254284, "epoch": 1513} {"train_loss": -12.058435440063477, "global_step": 254285, "epoch": 1513} {"train_loss": -11.814421653747559, "global_step": 254286, "epoch": 1513} {"train_loss": -11.94175910949707, "global_step": 254287, "epoch": 1513} {"train_loss": -12.003650665283203, "global_step": 254288, "epoch": 1513} {"train_loss": -11.995125770568848, "global_step": 254289, "epoch": 1513} {"train_loss": -12.129617691040039, "global_step": 254290, "epoch": 1513} {"train_loss": -12.19607162475586, "global_step": 254291, "epoch": 1513} {"train_loss": -11.764692306518555, "global_step": 254292, "epoch": 1513} {"train_loss": -11.837776184082031, "global_step": 254293, "epoch": 1513} {"train_loss": -12.112290382385254, "global_step": 254294, "epoch": 1513} {"train_loss": -11.976630210876465, "global_step": 254295, "epoch": 1513} {"train_loss": -12.034248352050781, "global_step": 254296, "epoch": 1513} {"train_loss": -12.104691505432129, "global_step": 254297, "epoch": 1513} {"train_loss": -12.117944717407227, "global_step": 254298, "epoch": 1513} {"train_loss": -12.11789321899414, "global_step": 254299, "epoch": 1513} {"train_loss": -12.131959915161133, "global_step": 254300, "epoch": 1513} {"train_loss": -11.8704833984375, "global_step": 254301, "epoch": 1513} {"train_loss": -12.1618070602417, "global_step": 254302, "epoch": 1513} {"train_loss": -11.949041366577148, "global_step": 254303, "epoch": 1513} {"train_loss": -11.97165298461914, "global_step": 254304, "epoch": 1513} {"train_loss": -11.695039749145508, "global_step": 254305, "epoch": 1513} {"train_loss": -12.116621017456055, "global_step": 254306, "epoch": 1513} {"train_loss": -12.271346092224121, "global_step": 254307, "epoch": 1513} {"train_loss": -12.023921966552734, "global_step": 254308, "epoch": 1513} {"train_loss": -11.179141998291016, "global_step": 254309, "epoch": 1513} {"train_loss": -11.318519592285156, "global_step": 254310, "epoch": 1513} {"train_loss": -11.57046127319336, "global_step": 254311, "epoch": 1513} {"train_loss": -12.001689910888672, "global_step": 254312, "epoch": 1513} {"train_loss": -11.248350143432617, "global_step": 254313, "epoch": 1513} {"train_loss": -10.885883331298828, "global_step": 254314, "epoch": 1513} {"train_loss": -11.690156936645508, "global_step": 254315, "epoch": 1513} {"train_loss": -11.957242012023926, "global_step": 254316, "epoch": 1513} {"train_loss": -11.951692581176758, "global_step": 254317, "epoch": 1513} {"train_loss": -11.008889198303223, "global_step": 254318, "epoch": 1513} {"train_loss": -10.716157913208008, "global_step": 254319, "epoch": 1513} {"train_loss": -11.365078926086426, "global_step": 254320, "epoch": 1513} {"train_loss": -11.83045768737793, "global_step": 254321, "epoch": 1513} {"train_loss": -11.517143249511719, "global_step": 254322, "epoch": 1513} {"train_loss": -11.695232391357422, "global_step": 254323, "epoch": 1513} {"train_loss": -11.722049713134766, "global_step": 254324, "epoch": 1513} {"train_loss": -10.452285766601562, "global_step": 254325, "epoch": 1513} {"train_loss": -11.091594696044922, "global_step": 254326, "epoch": 1513} {"train_loss": -11.623113632202148, "global_step": 254327, "epoch": 1513} {"train_loss": -10.517387390136719, "global_step": 254328, "epoch": 1513} {"train_loss": -11.149864196777344, "global_step": 254329, "epoch": 1513} {"train_loss": -11.378337860107422, "global_step": 254330, "epoch": 1513} {"train_loss": -11.952167510986328, "global_step": 254331, "epoch": 1513} {"train_loss": -11.269792556762695, "global_step": 254332, "epoch": 1513} {"train_loss": -11.585270881652832, "global_step": 254333, "epoch": 1513} {"train_loss": -11.040175437927246, "global_step": 254334, "epoch": 1513} {"train_loss": -11.656952857971191, "global_step": 254335, "epoch": 1513} {"train_loss": -11.275861740112305, "global_step": 254336, "epoch": 1513} {"train_loss": -11.412407875061035, "global_step": 254337, "epoch": 1513} {"train_loss": -11.423904418945312, "global_step": 254338, "epoch": 1513} {"train_loss": -11.916543006896973, "global_step": 254339, "epoch": 1513} {"train_loss": -11.221986770629883, "global_step": 254340, "epoch": 1513} {"train_loss": -11.481183052062988, "global_step": 254341, "epoch": 1513} {"train_loss": -11.576902389526367, "global_step": 254342, "epoch": 1513} {"train_loss": -11.362579345703125, "global_step": 254343, "epoch": 1513} {"train_loss": -12.01211166381836, "global_step": 254344, "epoch": 1513} {"train_loss": -11.156512260437012, "global_step": 254345, "epoch": 1513} {"train_loss": -11.73032283782959, "global_step": 254346, "epoch": 1513} {"train_loss": -11.636991500854492, "global_step": 254347, "epoch": 1513} {"train_loss": -11.715888977050781, "global_step": 254348, "epoch": 1513} {"train_loss": -11.915410041809082, "global_step": 254349, "epoch": 1513} {"train_loss": -11.767440795898438, "global_step": 254350, "epoch": 1513} {"train_loss": -11.640151750473748, "global_step": 254351, "epoch": 1513, "val_loss": 270567.25} {"train_loss": -11.325130462646484, "global_step": 254352, "epoch": 1514} {"train_loss": -12.057294845581055, "global_step": 254353, "epoch": 1514} {"train_loss": -11.652872085571289, "global_step": 254354, "epoch": 1514} {"train_loss": -12.192968368530273, "global_step": 254355, "epoch": 1514} {"train_loss": -11.956279754638672, "global_step": 254356, "epoch": 1514} {"train_loss": -11.914206504821777, "global_step": 254357, "epoch": 1514} {"train_loss": -11.816627502441406, "global_step": 254358, "epoch": 1514} {"train_loss": -11.722064971923828, "global_step": 254359, "epoch": 1514} {"train_loss": -12.05206298828125, "global_step": 254360, "epoch": 1514} {"train_loss": -11.908403396606445, "global_step": 254361, "epoch": 1514} {"train_loss": -11.922447204589844, "global_step": 254362, "epoch": 1514} {"train_loss": -11.989973068237305, "global_step": 254363, "epoch": 1514} {"train_loss": -12.045541763305664, "global_step": 254364, "epoch": 1514} {"train_loss": -11.932901382446289, "global_step": 254365, "epoch": 1514} {"train_loss": -11.844520568847656, "global_step": 254366, "epoch": 1514} {"train_loss": -11.92558479309082, "global_step": 254367, "epoch": 1514} {"train_loss": -12.084951400756836, "global_step": 254368, "epoch": 1514} {"train_loss": -11.848040580749512, "global_step": 254369, "epoch": 1514} {"train_loss": -11.919938087463379, "global_step": 254370, "epoch": 1514} {"train_loss": -11.909144401550293, "global_step": 254371, "epoch": 1514} {"train_loss": -11.621511459350586, "global_step": 254372, "epoch": 1514} {"train_loss": -11.91361141204834, "global_step": 254373, "epoch": 1514} {"train_loss": -11.768282890319824, "global_step": 254374, "epoch": 1514} {"train_loss": -11.798881530761719, "global_step": 254375, "epoch": 1514} {"train_loss": -11.735574722290039, "global_step": 254376, "epoch": 1514} {"train_loss": -11.963384628295898, "global_step": 254377, "epoch": 1514} {"train_loss": -11.677879333496094, "global_step": 254378, "epoch": 1514} {"train_loss": -11.700139999389648, "global_step": 254379, "epoch": 1514} {"train_loss": -11.311676025390625, "global_step": 254380, "epoch": 1514} {"train_loss": -12.221177101135254, "global_step": 254381, "epoch": 1514} {"train_loss": -11.594398498535156, "global_step": 254382, "epoch": 1514} {"train_loss": -11.767702102661133, "global_step": 254383, "epoch": 1514} {"train_loss": -11.529350280761719, "global_step": 254384, "epoch": 1514} {"train_loss": -11.656972885131836, "global_step": 254385, "epoch": 1514} {"train_loss": -10.172760009765625, "global_step": 254386, "epoch": 1514} {"train_loss": -11.820137977600098, "global_step": 254387, "epoch": 1514} {"train_loss": -11.117645263671875, "global_step": 254388, "epoch": 1514} {"train_loss": -10.212599754333496, "global_step": 254389, "epoch": 1514} {"train_loss": -11.807718276977539, "global_step": 254390, "epoch": 1514} {"train_loss": -11.429577827453613, "global_step": 254391, "epoch": 1514} {"train_loss": -10.422117233276367, "global_step": 254392, "epoch": 1514} {"train_loss": -11.85163402557373, "global_step": 254393, "epoch": 1514} {"train_loss": -11.101579666137695, "global_step": 254394, "epoch": 1514} {"train_loss": -11.048494338989258, "global_step": 254395, "epoch": 1514} {"train_loss": -11.344266891479492, "global_step": 254396, "epoch": 1514} {"train_loss": -10.584575653076172, "global_step": 254397, "epoch": 1514} {"train_loss": -11.52824878692627, "global_step": 254398, "epoch": 1514} {"train_loss": -10.410396575927734, "global_step": 254399, "epoch": 1514} {"train_loss": -11.222030639648438, "global_step": 254400, "epoch": 1514} {"train_loss": -11.447891235351562, "global_step": 254401, "epoch": 1514} {"train_loss": -11.292829513549805, "global_step": 254402, "epoch": 1514} {"train_loss": -11.114107131958008, "global_step": 254403, "epoch": 1514} {"train_loss": -11.461204528808594, "global_step": 254404, "epoch": 1514} {"train_loss": -10.911154747009277, "global_step": 254405, "epoch": 1514} {"train_loss": -11.082810401916504, "global_step": 254406, "epoch": 1514} {"train_loss": -10.557929992675781, "global_step": 254407, "epoch": 1514} {"train_loss": -11.644366264343262, "global_step": 254408, "epoch": 1514} {"train_loss": -11.246805191040039, "global_step": 254409, "epoch": 1514} {"train_loss": -11.575630187988281, "global_step": 254410, "epoch": 1514} {"train_loss": -11.501096725463867, "global_step": 254411, "epoch": 1514} {"train_loss": -10.987516403198242, "global_step": 254412, "epoch": 1514} {"train_loss": -11.439281463623047, "global_step": 254413, "epoch": 1514} {"train_loss": -10.98178482055664, "global_step": 254414, "epoch": 1514} {"train_loss": -11.737892150878906, "global_step": 254415, "epoch": 1514} {"train_loss": -11.037603378295898, "global_step": 254416, "epoch": 1514} {"train_loss": -11.54263687133789, "global_step": 254417, "epoch": 1514} {"train_loss": -11.170066833496094, "global_step": 254418, "epoch": 1514} {"train_loss": -11.430201530456543, "global_step": 254419, "epoch": 1514} {"train_loss": -11.388586044311523, "global_step": 254420, "epoch": 1514} {"train_loss": -11.40869140625, "global_step": 254421, "epoch": 1514} {"train_loss": -11.634206771850586, "global_step": 254422, "epoch": 1514} {"train_loss": -11.542354583740234, "global_step": 254423, "epoch": 1514} {"train_loss": -11.688098907470703, "global_step": 254424, "epoch": 1514} {"train_loss": -11.144572257995605, "global_step": 254425, "epoch": 1514} {"train_loss": -11.608871459960938, "global_step": 254426, "epoch": 1514} {"train_loss": -11.344832420349121, "global_step": 254427, "epoch": 1514} {"train_loss": -11.659008026123047, "global_step": 254428, "epoch": 1514} {"train_loss": -11.420351028442383, "global_step": 254429, "epoch": 1514} {"train_loss": -11.66627025604248, "global_step": 254430, "epoch": 1514} {"train_loss": -11.451395034790039, "global_step": 254431, "epoch": 1514} {"train_loss": -11.625348091125488, "global_step": 254432, "epoch": 1514} {"train_loss": -11.477056503295898, "global_step": 254433, "epoch": 1514} {"train_loss": -11.85125732421875, "global_step": 254434, "epoch": 1514} {"train_loss": -11.32492446899414, "global_step": 254435, "epoch": 1514} {"train_loss": -11.37144660949707, "global_step": 254436, "epoch": 1514} {"train_loss": -11.375686645507812, "global_step": 254437, "epoch": 1514} {"train_loss": -11.487607955932617, "global_step": 254438, "epoch": 1514} {"train_loss": -11.656740188598633, "global_step": 254439, "epoch": 1514} {"train_loss": -11.435820579528809, "global_step": 254440, "epoch": 1514} {"train_loss": -11.480602264404297, "global_step": 254441, "epoch": 1514} {"train_loss": -11.968038558959961, "global_step": 254442, "epoch": 1514} {"train_loss": -11.55947208404541, "global_step": 254443, "epoch": 1514} {"train_loss": -11.345409393310547, "global_step": 254444, "epoch": 1514} {"train_loss": -11.807811737060547, "global_step": 254445, "epoch": 1514} {"train_loss": -11.651443481445312, "global_step": 254446, "epoch": 1514} {"train_loss": -11.783031463623047, "global_step": 254447, "epoch": 1514} {"train_loss": -11.44063663482666, "global_step": 254448, "epoch": 1514} {"train_loss": -11.959352493286133, "global_step": 254449, "epoch": 1514} {"train_loss": -11.43756103515625, "global_step": 254450, "epoch": 1514} {"train_loss": -11.830337524414062, "global_step": 254451, "epoch": 1514} {"train_loss": -11.763923645019531, "global_step": 254452, "epoch": 1514} {"train_loss": -11.661401748657227, "global_step": 254453, "epoch": 1514} {"train_loss": -11.850409507751465, "global_step": 254454, "epoch": 1514} {"train_loss": -11.597009658813477, "global_step": 254455, "epoch": 1514} {"train_loss": -11.789161682128906, "global_step": 254456, "epoch": 1514} {"train_loss": -11.9888916015625, "global_step": 254457, "epoch": 1514} {"train_loss": -11.616809844970703, "global_step": 254458, "epoch": 1514} {"train_loss": -11.979541778564453, "global_step": 254459, "epoch": 1514} {"train_loss": -12.108242988586426, "global_step": 254460, "epoch": 1514} {"train_loss": -11.742074966430664, "global_step": 254461, "epoch": 1514} {"train_loss": -11.838926315307617, "global_step": 254462, "epoch": 1514} {"train_loss": -11.89824104309082, "global_step": 254463, "epoch": 1514} {"train_loss": -11.698009490966797, "global_step": 254464, "epoch": 1514} {"train_loss": -11.977065086364746, "global_step": 254465, "epoch": 1514} {"train_loss": -12.083087921142578, "global_step": 254466, "epoch": 1514} {"train_loss": -11.916152954101562, "global_step": 254467, "epoch": 1514} {"train_loss": -12.22017765045166, "global_step": 254468, "epoch": 1514} {"train_loss": -11.992071151733398, "global_step": 254469, "epoch": 1514} {"train_loss": -12.064902305603027, "global_step": 254470, "epoch": 1514} {"train_loss": -11.97055435180664, "global_step": 254471, "epoch": 1514} {"train_loss": -11.797710418701172, "global_step": 254472, "epoch": 1514} {"train_loss": -12.114910125732422, "global_step": 254473, "epoch": 1514} {"train_loss": -11.87240982055664, "global_step": 254474, "epoch": 1514} {"train_loss": -12.061416625976562, "global_step": 254475, "epoch": 1514} {"train_loss": -11.940801620483398, "global_step": 254476, "epoch": 1514} {"train_loss": -12.152826309204102, "global_step": 254477, "epoch": 1514} {"train_loss": -12.038848876953125, "global_step": 254478, "epoch": 1514} {"train_loss": -12.086358070373535, "global_step": 254479, "epoch": 1514} {"train_loss": -12.019031524658203, "global_step": 254480, "epoch": 1514} {"train_loss": -11.904891014099121, "global_step": 254481, "epoch": 1514} {"train_loss": -12.014673233032227, "global_step": 254482, "epoch": 1514} {"train_loss": -11.99277400970459, "global_step": 254483, "epoch": 1514} {"train_loss": -12.193480491638184, "global_step": 254484, "epoch": 1514} {"train_loss": -12.205245018005371, "global_step": 254485, "epoch": 1514} {"train_loss": -11.959144592285156, "global_step": 254486, "epoch": 1514} {"train_loss": -11.879737854003906, "global_step": 254487, "epoch": 1514} {"train_loss": -11.826541900634766, "global_step": 254488, "epoch": 1514} {"train_loss": -11.920698165893555, "global_step": 254489, "epoch": 1514} {"train_loss": -11.936164855957031, "global_step": 254490, "epoch": 1514} {"train_loss": -12.021909713745117, "global_step": 254491, "epoch": 1514} {"train_loss": -11.190332412719727, "global_step": 254492, "epoch": 1514} {"train_loss": -11.859973907470703, "global_step": 254493, "epoch": 1514} {"train_loss": -11.796165466308594, "global_step": 254494, "epoch": 1514} {"train_loss": -11.606740951538086, "global_step": 254495, "epoch": 1514} {"train_loss": -11.474331855773926, "global_step": 254496, "epoch": 1514} {"train_loss": -11.604751586914062, "global_step": 254497, "epoch": 1514} {"train_loss": -10.902435302734375, "global_step": 254498, "epoch": 1514} {"train_loss": -11.807249069213867, "global_step": 254499, "epoch": 1514} {"train_loss": -11.165119171142578, "global_step": 254500, "epoch": 1514} {"train_loss": -11.408285140991211, "global_step": 254501, "epoch": 1514} {"train_loss": -11.41366958618164, "global_step": 254502, "epoch": 1514} {"train_loss": -11.24288558959961, "global_step": 254503, "epoch": 1514} {"train_loss": -11.52787971496582, "global_step": 254504, "epoch": 1514} {"train_loss": -11.376294136047363, "global_step": 254505, "epoch": 1514} {"train_loss": -11.270721435546875, "global_step": 254506, "epoch": 1514} {"train_loss": -11.738718032836914, "global_step": 254507, "epoch": 1514} {"train_loss": -10.729287147521973, "global_step": 254508, "epoch": 1514} {"train_loss": -10.630794525146484, "global_step": 254509, "epoch": 1514} {"train_loss": -11.64378547668457, "global_step": 254510, "epoch": 1514} {"train_loss": -9.97552490234375, "global_step": 254511, "epoch": 1514} {"train_loss": -10.605613708496094, "global_step": 254512, "epoch": 1514} {"train_loss": -10.853523254394531, "global_step": 254513, "epoch": 1514} {"train_loss": -10.000551223754883, "global_step": 254514, "epoch": 1514} {"train_loss": -11.16103744506836, "global_step": 254515, "epoch": 1514} {"train_loss": -10.505698204040527, "global_step": 254516, "epoch": 1514} {"train_loss": -10.527885437011719, "global_step": 254517, "epoch": 1514} {"train_loss": -10.580732345581055, "global_step": 254518, "epoch": 1514} {"train_loss": -11.5574418874014, "global_step": 254519, "epoch": 1514, "val_loss": 268744.75} {"train_loss": -9.196172714233398, "global_step": 254520, "epoch": 1515} {"train_loss": -10.950641632080078, "global_step": 254521, "epoch": 1515} {"train_loss": -9.692103385925293, "global_step": 254522, "epoch": 1515} {"train_loss": -10.752646446228027, "global_step": 254523, "epoch": 1515} {"train_loss": -10.340555191040039, "global_step": 254524, "epoch": 1515} {"train_loss": -10.18016242980957, "global_step": 254525, "epoch": 1515} {"train_loss": -9.563956260681152, "global_step": 254526, "epoch": 1515} {"train_loss": -10.600921630859375, "global_step": 254527, "epoch": 1515} {"train_loss": -10.044544219970703, "global_step": 254528, "epoch": 1515} {"train_loss": -10.435470581054688, "global_step": 254529, "epoch": 1515} {"train_loss": -10.552894592285156, "global_step": 254530, "epoch": 1515} {"train_loss": -10.908327102661133, "global_step": 254531, "epoch": 1515} {"train_loss": -10.480732917785645, "global_step": 254532, "epoch": 1515} {"train_loss": -11.003636360168457, "global_step": 254533, "epoch": 1515} {"train_loss": -10.593887329101562, "global_step": 254534, "epoch": 1515} {"train_loss": -10.720394134521484, "global_step": 254535, "epoch": 1515} {"train_loss": -10.833666801452637, "global_step": 254536, "epoch": 1515} {"train_loss": -10.868371963500977, "global_step": 254537, "epoch": 1515} {"train_loss": -10.926761627197266, "global_step": 254538, "epoch": 1515} {"train_loss": -11.21237564086914, "global_step": 254539, "epoch": 1515} {"train_loss": -10.647588729858398, "global_step": 254540, "epoch": 1515} {"train_loss": -10.808661460876465, "global_step": 254541, "epoch": 1515} {"train_loss": -10.928522109985352, "global_step": 254542, "epoch": 1515} {"train_loss": -11.117692947387695, "global_step": 254543, "epoch": 1515} {"train_loss": -11.048389434814453, "global_step": 254544, "epoch": 1515} {"train_loss": -11.062215805053711, "global_step": 254545, "epoch": 1515} {"train_loss": -11.528538703918457, "global_step": 254546, "epoch": 1515} {"train_loss": -11.146625518798828, "global_step": 254547, "epoch": 1515} {"train_loss": -11.428577423095703, "global_step": 254548, "epoch": 1515} {"train_loss": -11.458362579345703, "global_step": 254549, "epoch": 1515} {"train_loss": -11.733511924743652, "global_step": 254550, "epoch": 1515} {"train_loss": -11.638166427612305, "global_step": 254551, "epoch": 1515} {"train_loss": -11.627779960632324, "global_step": 254552, "epoch": 1515} {"train_loss": -11.28174877166748, "global_step": 254553, "epoch": 1515} {"train_loss": -11.540395736694336, "global_step": 254554, "epoch": 1515} {"train_loss": -11.607970237731934, "global_step": 254555, "epoch": 1515} {"train_loss": -11.279134750366211, "global_step": 254556, "epoch": 1515} {"train_loss": -11.748371124267578, "global_step": 254557, "epoch": 1515} {"train_loss": -11.340198516845703, "global_step": 254558, "epoch": 1515} {"train_loss": -11.718530654907227, "global_step": 254559, "epoch": 1515} {"train_loss": -11.459132194519043, "global_step": 254560, "epoch": 1515} {"train_loss": -11.702863693237305, "global_step": 254561, "epoch": 1515} {"train_loss": -11.694450378417969, "global_step": 254562, "epoch": 1515} {"train_loss": -11.67338752746582, "global_step": 254563, "epoch": 1515} {"train_loss": -11.745685577392578, "global_step": 254564, "epoch": 1515} {"train_loss": -11.66632080078125, "global_step": 254565, "epoch": 1515} {"train_loss": -11.866113662719727, "global_step": 254566, "epoch": 1515} {"train_loss": -11.940061569213867, "global_step": 254567, "epoch": 1515} {"train_loss": -11.866548538208008, "global_step": 254568, "epoch": 1515} {"train_loss": -11.85948371887207, "global_step": 254569, "epoch": 1515} {"train_loss": -11.942264556884766, "global_step": 254570, "epoch": 1515} {"train_loss": -11.79074478149414, "global_step": 254571, "epoch": 1515} {"train_loss": -11.921283721923828, "global_step": 254572, "epoch": 1515} {"train_loss": -11.934022903442383, "global_step": 254573, "epoch": 1515} {"train_loss": -11.937294006347656, "global_step": 254574, "epoch": 1515} {"train_loss": -11.802685737609863, "global_step": 254575, "epoch": 1515} {"train_loss": -12.093173027038574, "global_step": 254576, "epoch": 1515} {"train_loss": -11.793603897094727, "global_step": 254577, "epoch": 1515} {"train_loss": -11.70103645324707, "global_step": 254578, "epoch": 1515} {"train_loss": -12.0093355178833, "global_step": 254579, "epoch": 1515} {"train_loss": -11.919512748718262, "global_step": 254580, "epoch": 1515} {"train_loss": -11.851826667785645, "global_step": 254581, "epoch": 1515} {"train_loss": -12.082807540893555, "global_step": 254582, "epoch": 1515} {"train_loss": -12.043211936950684, "global_step": 254583, "epoch": 1515} {"train_loss": -12.119589805603027, "global_step": 254584, "epoch": 1515} {"train_loss": -11.998186111450195, "global_step": 254585, "epoch": 1515} {"train_loss": -12.02144718170166, "global_step": 254586, "epoch": 1515} {"train_loss": -12.016701698303223, "global_step": 254587, "epoch": 1515} {"train_loss": -11.974334716796875, "global_step": 254588, "epoch": 1515} {"train_loss": -11.949706077575684, "global_step": 254589, "epoch": 1515} {"train_loss": -11.919744491577148, "global_step": 254590, "epoch": 1515} {"train_loss": -12.002599716186523, "global_step": 254591, "epoch": 1515} {"train_loss": -12.15924072265625, "global_step": 254592, "epoch": 1515} {"train_loss": -12.183716773986816, "global_step": 254593, "epoch": 1515} {"train_loss": -12.244044303894043, "global_step": 254594, "epoch": 1515} {"train_loss": -12.017837524414062, "global_step": 254595, "epoch": 1515} {"train_loss": -12.023641586303711, "global_step": 254596, "epoch": 1515} {"train_loss": -12.035370826721191, "global_step": 254597, "epoch": 1515} {"train_loss": -11.995275497436523, "global_step": 254598, "epoch": 1515} {"train_loss": -11.88823413848877, "global_step": 254599, "epoch": 1515} {"train_loss": -12.040528297424316, "global_step": 254600, "epoch": 1515} {"train_loss": -11.768760681152344, "global_step": 254601, "epoch": 1515} {"train_loss": -12.144365310668945, "global_step": 254602, "epoch": 1515} {"train_loss": -11.835613250732422, "global_step": 254603, "epoch": 1515} {"train_loss": -11.774633407592773, "global_step": 254604, "epoch": 1515} {"train_loss": -12.258268356323242, "global_step": 254605, "epoch": 1515} {"train_loss": -11.98365592956543, "global_step": 254606, "epoch": 1515} {"train_loss": -11.797463417053223, "global_step": 254607, "epoch": 1515} {"train_loss": -12.054515838623047, "global_step": 254608, "epoch": 1515} {"train_loss": -11.864702224731445, "global_step": 254609, "epoch": 1515} {"train_loss": -11.950947761535645, "global_step": 254610, "epoch": 1515} {"train_loss": -12.177041053771973, "global_step": 254611, "epoch": 1515} {"train_loss": -11.691651344299316, "global_step": 254612, "epoch": 1515} {"train_loss": -11.991851806640625, "global_step": 254613, "epoch": 1515} {"train_loss": -12.377123832702637, "global_step": 254614, "epoch": 1515} {"train_loss": -12.028924942016602, "global_step": 254615, "epoch": 1515} {"train_loss": -12.325965881347656, "global_step": 254616, "epoch": 1515} {"train_loss": -12.034783363342285, "global_step": 254617, "epoch": 1515} {"train_loss": -11.681632995605469, "global_step": 254618, "epoch": 1515} {"train_loss": -11.92355728149414, "global_step": 254619, "epoch": 1515} {"train_loss": -11.830549240112305, "global_step": 254620, "epoch": 1515} {"train_loss": -11.510041236877441, "global_step": 254621, "epoch": 1515} {"train_loss": -11.856025695800781, "global_step": 254622, "epoch": 1515} {"train_loss": -12.242898941040039, "global_step": 254623, "epoch": 1515} {"train_loss": -12.112088203430176, "global_step": 254624, "epoch": 1515} {"train_loss": -11.949338912963867, "global_step": 254625, "epoch": 1515} {"train_loss": -12.037206649780273, "global_step": 254626, "epoch": 1515} {"train_loss": -12.120046615600586, "global_step": 254627, "epoch": 1515} {"train_loss": -11.994485855102539, "global_step": 254628, "epoch": 1515} {"train_loss": -12.073171615600586, "global_step": 254629, "epoch": 1515} {"train_loss": -11.915135383605957, "global_step": 254630, "epoch": 1515} {"train_loss": -11.956713676452637, "global_step": 254631, "epoch": 1515} {"train_loss": -12.03653335571289, "global_step": 254632, "epoch": 1515} {"train_loss": -11.618635177612305, "global_step": 254633, "epoch": 1515} {"train_loss": -11.176931381225586, "global_step": 254634, "epoch": 1515} {"train_loss": -11.336274147033691, "global_step": 254635, "epoch": 1515} {"train_loss": -11.617759704589844, "global_step": 254636, "epoch": 1515} {"train_loss": -11.331815719604492, "global_step": 254637, "epoch": 1515} {"train_loss": -10.869344711303711, "global_step": 254638, "epoch": 1515} {"train_loss": -11.858080863952637, "global_step": 254639, "epoch": 1515} {"train_loss": -11.444175720214844, "global_step": 254640, "epoch": 1515} {"train_loss": -11.619382858276367, "global_step": 254641, "epoch": 1515} {"train_loss": -11.803428649902344, "global_step": 254642, "epoch": 1515} {"train_loss": -11.459680557250977, "global_step": 254643, "epoch": 1515} {"train_loss": -11.502601623535156, "global_step": 254644, "epoch": 1515} {"train_loss": -11.55267333984375, "global_step": 254645, "epoch": 1515} {"train_loss": -11.736848831176758, "global_step": 254646, "epoch": 1515} {"train_loss": -11.679905891418457, "global_step": 254647, "epoch": 1515} {"train_loss": -11.220657348632812, "global_step": 254648, "epoch": 1515} {"train_loss": -12.086621284484863, "global_step": 254649, "epoch": 1515} {"train_loss": -11.434734344482422, "global_step": 254650, "epoch": 1515} {"train_loss": -11.35608959197998, "global_step": 254651, "epoch": 1515} {"train_loss": -11.516000747680664, "global_step": 254652, "epoch": 1515} {"train_loss": -11.884153366088867, "global_step": 254653, "epoch": 1515} {"train_loss": -11.461746215820312, "global_step": 254654, "epoch": 1515} {"train_loss": -12.018056869506836, "global_step": 254655, "epoch": 1515} {"train_loss": -11.417409896850586, "global_step": 254656, "epoch": 1515} {"train_loss": -11.608697891235352, "global_step": 254657, "epoch": 1515} {"train_loss": -11.71125602722168, "global_step": 254658, "epoch": 1515} {"train_loss": -11.487390518188477, "global_step": 254659, "epoch": 1515} {"train_loss": -11.368782997131348, "global_step": 254660, "epoch": 1515} {"train_loss": -11.628049850463867, "global_step": 254661, "epoch": 1515} {"train_loss": -11.039344787597656, "global_step": 254662, "epoch": 1515} {"train_loss": -11.389628410339355, "global_step": 254663, "epoch": 1515} {"train_loss": -11.266117095947266, "global_step": 254664, "epoch": 1515} {"train_loss": -11.087394714355469, "global_step": 254665, "epoch": 1515} {"train_loss": -11.7899808883667, "global_step": 254666, "epoch": 1515} {"train_loss": -10.714818954467773, "global_step": 254667, "epoch": 1515} {"train_loss": -11.708429336547852, "global_step": 254668, "epoch": 1515} {"train_loss": -10.424079895019531, "global_step": 254669, "epoch": 1515} {"train_loss": -10.14993953704834, "global_step": 254670, "epoch": 1515} {"train_loss": -11.607317924499512, "global_step": 254671, "epoch": 1515} {"train_loss": -9.687215805053711, "global_step": 254672, "epoch": 1515} {"train_loss": -11.697681427001953, "global_step": 254673, "epoch": 1515} {"train_loss": -10.236156463623047, "global_step": 254674, "epoch": 1515} {"train_loss": -9.967269897460938, "global_step": 254675, "epoch": 1515} {"train_loss": -10.978660583496094, "global_step": 254676, "epoch": 1515} {"train_loss": -10.390047073364258, "global_step": 254677, "epoch": 1515} {"train_loss": -10.364843368530273, "global_step": 254678, "epoch": 1515} {"train_loss": -9.9172945022583, "global_step": 254679, "epoch": 1515} {"train_loss": -10.268238067626953, "global_step": 254680, "epoch": 1515} {"train_loss": -10.294352531433105, "global_step": 254681, "epoch": 1515} {"train_loss": -11.044523239135742, "global_step": 254682, "epoch": 1515} {"train_loss": -11.037860870361328, "global_step": 254683, "epoch": 1515} {"train_loss": -11.705947875976562, "global_step": 254684, "epoch": 1515} {"train_loss": -10.347371101379395, "global_step": 254685, "epoch": 1515} {"train_loss": -11.766191482543945, "global_step": 254686, "epoch": 1515} {"train_loss": -11.461063498542423, "global_step": 254687, "epoch": 1515, "val_loss": 266942.15625, "train_action_mse_error": 1.9364972114562988} {"train_loss": -11.655546188354492, "global_step": 254688, "epoch": 1516} {"train_loss": -11.216703414916992, "global_step": 254689, "epoch": 1516} {"train_loss": -11.301994323730469, "global_step": 254690, "epoch": 1516} {"train_loss": -11.514494895935059, "global_step": 254691, "epoch": 1516} {"train_loss": -11.415343284606934, "global_step": 254692, "epoch": 1516} {"train_loss": -11.208463668823242, "global_step": 254693, "epoch": 1516} {"train_loss": -11.459378242492676, "global_step": 254694, "epoch": 1516} {"train_loss": -10.719406127929688, "global_step": 254695, "epoch": 1516} {"train_loss": -11.687483787536621, "global_step": 254696, "epoch": 1516} {"train_loss": -11.165460586547852, "global_step": 254697, "epoch": 1516} {"train_loss": -11.638011932373047, "global_step": 254698, "epoch": 1516} {"train_loss": -11.442567825317383, "global_step": 254699, "epoch": 1516} {"train_loss": -11.484763145446777, "global_step": 254700, "epoch": 1516} {"train_loss": -11.725484848022461, "global_step": 254701, "epoch": 1516} {"train_loss": -11.563410758972168, "global_step": 254702, "epoch": 1516} {"train_loss": -11.946964263916016, "global_step": 254703, "epoch": 1516} {"train_loss": -11.341617584228516, "global_step": 254704, "epoch": 1516} {"train_loss": -11.816388130187988, "global_step": 254705, "epoch": 1516} {"train_loss": -11.521613121032715, "global_step": 254706, "epoch": 1516} {"train_loss": -11.729129791259766, "global_step": 254707, "epoch": 1516} {"train_loss": -11.461454391479492, "global_step": 254708, "epoch": 1516} {"train_loss": -11.751346588134766, "global_step": 254709, "epoch": 1516} {"train_loss": -11.704669952392578, "global_step": 254710, "epoch": 1516} {"train_loss": -11.841143608093262, "global_step": 254711, "epoch": 1516} {"train_loss": -11.770110130310059, "global_step": 254712, "epoch": 1516} {"train_loss": -11.826752662658691, "global_step": 254713, "epoch": 1516} {"train_loss": -11.841451644897461, "global_step": 254714, "epoch": 1516} {"train_loss": -11.740488052368164, "global_step": 254715, "epoch": 1516} {"train_loss": -11.87956428527832, "global_step": 254716, "epoch": 1516} {"train_loss": -12.005388259887695, "global_step": 254717, "epoch": 1516} {"train_loss": -11.64876937866211, "global_step": 254718, "epoch": 1516} {"train_loss": -11.847514152526855, "global_step": 254719, "epoch": 1516} {"train_loss": -11.935651779174805, "global_step": 254720, "epoch": 1516} {"train_loss": -11.940735816955566, "global_step": 254721, "epoch": 1516} {"train_loss": -11.907739639282227, "global_step": 254722, "epoch": 1516} {"train_loss": -12.070317268371582, "global_step": 254723, "epoch": 1516} {"train_loss": -11.792253494262695, "global_step": 254724, "epoch": 1516} {"train_loss": -11.815763473510742, "global_step": 254725, "epoch": 1516} {"train_loss": -11.670818328857422, "global_step": 254726, "epoch": 1516} {"train_loss": -12.014608383178711, "global_step": 254727, "epoch": 1516} {"train_loss": -11.465618133544922, "global_step": 254728, "epoch": 1516} {"train_loss": -11.7645845413208, "global_step": 254729, "epoch": 1516} {"train_loss": -11.674626350402832, "global_step": 254730, "epoch": 1516} {"train_loss": -12.003091812133789, "global_step": 254731, "epoch": 1516} {"train_loss": -11.625725746154785, "global_step": 254732, "epoch": 1516} {"train_loss": -11.647736549377441, "global_step": 254733, "epoch": 1516} {"train_loss": -11.737444877624512, "global_step": 254734, "epoch": 1516} {"train_loss": -11.792892456054688, "global_step": 254735, "epoch": 1516} {"train_loss": -11.89677906036377, "global_step": 254736, "epoch": 1516} {"train_loss": -11.570207595825195, "global_step": 254737, "epoch": 1516} {"train_loss": -11.789291381835938, "global_step": 254738, "epoch": 1516} {"train_loss": -11.984533309936523, "global_step": 254739, "epoch": 1516} {"train_loss": -11.327705383300781, "global_step": 254740, "epoch": 1516} {"train_loss": -12.078739166259766, "global_step": 254741, "epoch": 1516} {"train_loss": -11.34533977508545, "global_step": 254742, "epoch": 1516} {"train_loss": -11.536375045776367, "global_step": 254743, "epoch": 1516} {"train_loss": -11.689971923828125, "global_step": 254744, "epoch": 1516} {"train_loss": -11.709657669067383, "global_step": 254745, "epoch": 1516} {"train_loss": -11.650276184082031, "global_step": 254746, "epoch": 1516} {"train_loss": -11.740852355957031, "global_step": 254747, "epoch": 1516} {"train_loss": -11.4644193649292, "global_step": 254748, "epoch": 1516} {"train_loss": -11.49915599822998, "global_step": 254749, "epoch": 1516} {"train_loss": -12.033486366271973, "global_step": 254750, "epoch": 1516} {"train_loss": -11.221881866455078, "global_step": 254751, "epoch": 1516} {"train_loss": -11.74337387084961, "global_step": 254752, "epoch": 1516} {"train_loss": -11.507843971252441, "global_step": 254753, "epoch": 1516} {"train_loss": -10.5816650390625, "global_step": 254754, "epoch": 1516} {"train_loss": -11.748233795166016, "global_step": 254755, "epoch": 1516} {"train_loss": -10.979043006896973, "global_step": 254756, "epoch": 1516} {"train_loss": -10.562522888183594, "global_step": 254757, "epoch": 1516} {"train_loss": -11.570138931274414, "global_step": 254758, "epoch": 1516} {"train_loss": -11.03848648071289, "global_step": 254759, "epoch": 1516} {"train_loss": -10.408851623535156, "global_step": 254760, "epoch": 1516} {"train_loss": -11.389047622680664, "global_step": 254761, "epoch": 1516} {"train_loss": -10.869429588317871, "global_step": 254762, "epoch": 1516} {"train_loss": -11.534990310668945, "global_step": 254763, "epoch": 1516} {"train_loss": -11.468204498291016, "global_step": 254764, "epoch": 1516} {"train_loss": -11.024612426757812, "global_step": 254765, "epoch": 1516} {"train_loss": -11.419656753540039, "global_step": 254766, "epoch": 1516} {"train_loss": -11.00113296508789, "global_step": 254767, "epoch": 1516} {"train_loss": -11.689051628112793, "global_step": 254768, "epoch": 1516} {"train_loss": -11.141338348388672, "global_step": 254769, "epoch": 1516} {"train_loss": -11.762947082519531, "global_step": 254770, "epoch": 1516} {"train_loss": -11.401165962219238, "global_step": 254771, "epoch": 1516} {"train_loss": -11.384529113769531, "global_step": 254772, "epoch": 1516} {"train_loss": -11.859807968139648, "global_step": 254773, "epoch": 1516} {"train_loss": -11.602930068969727, "global_step": 254774, "epoch": 1516} {"train_loss": -11.984952926635742, "global_step": 254775, "epoch": 1516} {"train_loss": -11.57501220703125, "global_step": 254776, "epoch": 1516} {"train_loss": -11.983370780944824, "global_step": 254777, "epoch": 1516} {"train_loss": -11.313081741333008, "global_step": 254778, "epoch": 1516} {"train_loss": -11.991643905639648, "global_step": 254779, "epoch": 1516} {"train_loss": -11.91922378540039, "global_step": 254780, "epoch": 1516} {"train_loss": -11.617093086242676, "global_step": 254781, "epoch": 1516} {"train_loss": -11.965208053588867, "global_step": 254782, "epoch": 1516} {"train_loss": -11.864151000976562, "global_step": 254783, "epoch": 1516} {"train_loss": -12.105998992919922, "global_step": 254784, "epoch": 1516} {"train_loss": -11.889065742492676, "global_step": 254785, "epoch": 1516} {"train_loss": -11.817256927490234, "global_step": 254786, "epoch": 1516} {"train_loss": -11.889226913452148, "global_step": 254787, "epoch": 1516} {"train_loss": -11.575592041015625, "global_step": 254788, "epoch": 1516} {"train_loss": -11.83344841003418, "global_step": 254789, "epoch": 1516} {"train_loss": -11.840951919555664, "global_step": 254790, "epoch": 1516} {"train_loss": -11.98410415649414, "global_step": 254791, "epoch": 1516} {"train_loss": -11.933138847351074, "global_step": 254792, "epoch": 1516} {"train_loss": -11.45863151550293, "global_step": 254793, "epoch": 1516} {"train_loss": -12.068646430969238, "global_step": 254794, "epoch": 1516} {"train_loss": -11.752668380737305, "global_step": 254795, "epoch": 1516} {"train_loss": -12.160335540771484, "global_step": 254796, "epoch": 1516} {"train_loss": -11.729498863220215, "global_step": 254797, "epoch": 1516} {"train_loss": -11.897289276123047, "global_step": 254798, "epoch": 1516} {"train_loss": -11.979124069213867, "global_step": 254799, "epoch": 1516} {"train_loss": -11.656021118164062, "global_step": 254800, "epoch": 1516} {"train_loss": -12.158859252929688, "global_step": 254801, "epoch": 1516} {"train_loss": -11.703789710998535, "global_step": 254802, "epoch": 1516} {"train_loss": -12.161933898925781, "global_step": 254803, "epoch": 1516} {"train_loss": -11.799421310424805, "global_step": 254804, "epoch": 1516} {"train_loss": -11.81355094909668, "global_step": 254805, "epoch": 1516} {"train_loss": -11.943357467651367, "global_step": 254806, "epoch": 1516} {"train_loss": -11.836830139160156, "global_step": 254807, "epoch": 1516} {"train_loss": -12.01705551147461, "global_step": 254808, "epoch": 1516} {"train_loss": -11.845590591430664, "global_step": 254809, "epoch": 1516} {"train_loss": -11.583145141601562, "global_step": 254810, "epoch": 1516} {"train_loss": -11.887735366821289, "global_step": 254811, "epoch": 1516} {"train_loss": -11.741912841796875, "global_step": 254812, "epoch": 1516} {"train_loss": -12.070021629333496, "global_step": 254813, "epoch": 1516} {"train_loss": -11.896303176879883, "global_step": 254814, "epoch": 1516} {"train_loss": -11.839027404785156, "global_step": 254815, "epoch": 1516} {"train_loss": -11.833196640014648, "global_step": 254816, "epoch": 1516} {"train_loss": -11.510100364685059, "global_step": 254817, "epoch": 1516} {"train_loss": -11.924139022827148, "global_step": 254818, "epoch": 1516} {"train_loss": -10.817304611206055, "global_step": 254819, "epoch": 1516} {"train_loss": -11.913501739501953, "global_step": 254820, "epoch": 1516} {"train_loss": -11.297416687011719, "global_step": 254821, "epoch": 1516} {"train_loss": -11.60793685913086, "global_step": 254822, "epoch": 1516} {"train_loss": -11.904244422912598, "global_step": 254823, "epoch": 1516} {"train_loss": -11.371828079223633, "global_step": 254824, "epoch": 1516} {"train_loss": -11.540994644165039, "global_step": 254825, "epoch": 1516} {"train_loss": -10.573232650756836, "global_step": 254826, "epoch": 1516} {"train_loss": -11.058334350585938, "global_step": 254827, "epoch": 1516} {"train_loss": -10.443437576293945, "global_step": 254828, "epoch": 1516} {"train_loss": -10.024690628051758, "global_step": 254829, "epoch": 1516} {"train_loss": -11.472992897033691, "global_step": 254830, "epoch": 1516} {"train_loss": -9.44560432434082, "global_step": 254831, "epoch": 1516} {"train_loss": -11.502670288085938, "global_step": 254832, "epoch": 1516} {"train_loss": -9.442712783813477, "global_step": 254833, "epoch": 1516} {"train_loss": -11.166189193725586, "global_step": 254834, "epoch": 1516} {"train_loss": -10.727245330810547, "global_step": 254835, "epoch": 1516} {"train_loss": -10.510465621948242, "global_step": 254836, "epoch": 1516} {"train_loss": -11.132125854492188, "global_step": 254837, "epoch": 1516} {"train_loss": -9.962352752685547, "global_step": 254838, "epoch": 1516} {"train_loss": -10.83153247833252, "global_step": 254839, "epoch": 1516} {"train_loss": -10.693034172058105, "global_step": 254840, "epoch": 1516} {"train_loss": -10.48265266418457, "global_step": 254841, "epoch": 1516} {"train_loss": -10.876158714294434, "global_step": 254842, "epoch": 1516} {"train_loss": -11.330789566040039, "global_step": 254843, "epoch": 1516} {"train_loss": -10.797772407531738, "global_step": 254844, "epoch": 1516} {"train_loss": -11.227521896362305, "global_step": 254845, "epoch": 1516} {"train_loss": -10.895709991455078, "global_step": 254846, "epoch": 1516} {"train_loss": -11.27505111694336, "global_step": 254847, "epoch": 1516} {"train_loss": -11.44253158569336, "global_step": 254848, "epoch": 1516} {"train_loss": -11.277782440185547, "global_step": 254849, "epoch": 1516} {"train_loss": -11.426556587219238, "global_step": 254850, "epoch": 1516} {"train_loss": -11.598176002502441, "global_step": 254851, "epoch": 1516} {"train_loss": -10.937932014465332, "global_step": 254852, "epoch": 1516} {"train_loss": -11.844263076782227, "global_step": 254853, "epoch": 1516} {"train_loss": -11.186022758483887, "global_step": 254854, "epoch": 1516} {"train_loss": -11.518522285279774, "global_step": 254855, "epoch": 1516, "val_loss": 271137.0625} {"train_loss": -11.742130279541016, "global_step": 254856, "epoch": 1517} {"train_loss": -11.46301555633545, "global_step": 254857, "epoch": 1517} {"train_loss": -11.677611351013184, "global_step": 254858, "epoch": 1517} {"train_loss": -11.638123512268066, "global_step": 254859, "epoch": 1517} {"train_loss": -11.629560470581055, "global_step": 254860, "epoch": 1517} {"train_loss": -11.565004348754883, "global_step": 254861, "epoch": 1517} {"train_loss": -11.59868049621582, "global_step": 254862, "epoch": 1517} {"train_loss": -11.671716690063477, "global_step": 254863, "epoch": 1517} {"train_loss": -11.458925247192383, "global_step": 254864, "epoch": 1517} {"train_loss": -11.536251068115234, "global_step": 254865, "epoch": 1517} {"train_loss": -11.370705604553223, "global_step": 254866, "epoch": 1517} {"train_loss": -11.868120193481445, "global_step": 254867, "epoch": 1517} {"train_loss": -11.583418846130371, "global_step": 254868, "epoch": 1517} {"train_loss": -11.685449600219727, "global_step": 254869, "epoch": 1517} {"train_loss": -11.334977149963379, "global_step": 254870, "epoch": 1517} {"train_loss": -11.241317749023438, "global_step": 254871, "epoch": 1517} {"train_loss": -11.580018997192383, "global_step": 254872, "epoch": 1517} {"train_loss": -11.60708236694336, "global_step": 254873, "epoch": 1517} {"train_loss": -11.22268295288086, "global_step": 254874, "epoch": 1517} {"train_loss": -11.296418190002441, "global_step": 254875, "epoch": 1517} {"train_loss": -11.53823471069336, "global_step": 254876, "epoch": 1517} {"train_loss": -11.225146293640137, "global_step": 254877, "epoch": 1517} {"train_loss": -11.812626838684082, "global_step": 254878, "epoch": 1517} {"train_loss": -11.38611888885498, "global_step": 254879, "epoch": 1517} {"train_loss": -11.92269515991211, "global_step": 254880, "epoch": 1517} {"train_loss": -11.364418029785156, "global_step": 254881, "epoch": 1517} {"train_loss": -11.941473960876465, "global_step": 254882, "epoch": 1517} {"train_loss": -11.343533515930176, "global_step": 254883, "epoch": 1517} {"train_loss": -11.901344299316406, "global_step": 254884, "epoch": 1517} {"train_loss": -11.449316024780273, "global_step": 254885, "epoch": 1517} {"train_loss": -11.948881149291992, "global_step": 254886, "epoch": 1517} {"train_loss": -11.578245162963867, "global_step": 254887, "epoch": 1517} {"train_loss": -11.833536148071289, "global_step": 254888, "epoch": 1517} {"train_loss": -11.840208053588867, "global_step": 254889, "epoch": 1517} {"train_loss": -11.831120491027832, "global_step": 254890, "epoch": 1517} {"train_loss": -11.827615737915039, "global_step": 254891, "epoch": 1517} {"train_loss": -12.04890251159668, "global_step": 254892, "epoch": 1517} {"train_loss": -11.733609199523926, "global_step": 254893, "epoch": 1517} {"train_loss": -11.75275993347168, "global_step": 254894, "epoch": 1517} {"train_loss": -11.952791213989258, "global_step": 254895, "epoch": 1517} {"train_loss": -11.79339599609375, "global_step": 254896, "epoch": 1517} {"train_loss": -11.779901504516602, "global_step": 254897, "epoch": 1517} {"train_loss": -12.108102798461914, "global_step": 254898, "epoch": 1517} {"train_loss": -12.092557907104492, "global_step": 254899, "epoch": 1517} {"train_loss": -12.068650245666504, "global_step": 254900, "epoch": 1517} {"train_loss": -12.038293838500977, "global_step": 254901, "epoch": 1517} {"train_loss": -12.050373077392578, "global_step": 254902, "epoch": 1517} {"train_loss": -12.045614242553711, "global_step": 254903, "epoch": 1517} {"train_loss": -12.034708023071289, "global_step": 254904, "epoch": 1517} {"train_loss": -12.034521102905273, "global_step": 254905, "epoch": 1517} {"train_loss": -11.953229904174805, "global_step": 254906, "epoch": 1517} {"train_loss": -12.070608139038086, "global_step": 254907, "epoch": 1517} {"train_loss": -12.021736145019531, "global_step": 254908, "epoch": 1517} {"train_loss": -12.083860397338867, "global_step": 254909, "epoch": 1517} {"train_loss": -12.170303344726562, "global_step": 254910, "epoch": 1517} {"train_loss": -12.211979866027832, "global_step": 254911, "epoch": 1517} {"train_loss": -11.970235824584961, "global_step": 254912, "epoch": 1517} {"train_loss": -12.019316673278809, "global_step": 254913, "epoch": 1517} {"train_loss": -11.780752182006836, "global_step": 254914, "epoch": 1517} {"train_loss": -12.168718338012695, "global_step": 254915, "epoch": 1517} {"train_loss": -12.047843933105469, "global_step": 254916, "epoch": 1517} {"train_loss": -11.836441040039062, "global_step": 254917, "epoch": 1517} {"train_loss": -11.8139066696167, "global_step": 254918, "epoch": 1517} {"train_loss": -11.881153106689453, "global_step": 254919, "epoch": 1517} {"train_loss": -11.839553833007812, "global_step": 254920, "epoch": 1517} {"train_loss": -12.082817077636719, "global_step": 254921, "epoch": 1517} {"train_loss": -11.769815444946289, "global_step": 254922, "epoch": 1517} {"train_loss": -11.957188606262207, "global_step": 254923, "epoch": 1517} {"train_loss": -11.816598892211914, "global_step": 254924, "epoch": 1517} {"train_loss": -11.499900817871094, "global_step": 254925, "epoch": 1517} {"train_loss": -12.134366989135742, "global_step": 254926, "epoch": 1517} {"train_loss": -11.384525299072266, "global_step": 254927, "epoch": 1517} {"train_loss": -12.028938293457031, "global_step": 254928, "epoch": 1517} {"train_loss": -11.682748794555664, "global_step": 254929, "epoch": 1517} {"train_loss": -11.972012519836426, "global_step": 254930, "epoch": 1517} {"train_loss": -11.852165222167969, "global_step": 254931, "epoch": 1517} {"train_loss": -11.908699989318848, "global_step": 254932, "epoch": 1517} {"train_loss": -12.069665908813477, "global_step": 254933, "epoch": 1517} {"train_loss": -11.907450675964355, "global_step": 254934, "epoch": 1517} {"train_loss": -12.042569160461426, "global_step": 254935, "epoch": 1517} {"train_loss": -11.71196174621582, "global_step": 254936, "epoch": 1517} {"train_loss": -11.975059509277344, "global_step": 254937, "epoch": 1517} {"train_loss": -11.960565567016602, "global_step": 254938, "epoch": 1517} {"train_loss": -11.869908332824707, "global_step": 254939, "epoch": 1517} {"train_loss": -12.058671951293945, "global_step": 254940, "epoch": 1517} {"train_loss": -11.99163818359375, "global_step": 254941, "epoch": 1517} {"train_loss": -11.648218154907227, "global_step": 254942, "epoch": 1517} {"train_loss": -12.03580093383789, "global_step": 254943, "epoch": 1517} {"train_loss": -11.928410530090332, "global_step": 254944, "epoch": 1517} {"train_loss": -12.289228439331055, "global_step": 254945, "epoch": 1517} {"train_loss": -11.93375015258789, "global_step": 254946, "epoch": 1517} {"train_loss": -11.651745796203613, "global_step": 254947, "epoch": 1517} {"train_loss": -11.643694877624512, "global_step": 254948, "epoch": 1517} {"train_loss": -11.108001708984375, "global_step": 254949, "epoch": 1517} {"train_loss": -10.82376766204834, "global_step": 254950, "epoch": 1517} {"train_loss": -11.247143745422363, "global_step": 254951, "epoch": 1517} {"train_loss": -11.891024589538574, "global_step": 254952, "epoch": 1517} {"train_loss": -11.14818286895752, "global_step": 254953, "epoch": 1517} {"train_loss": -12.018512725830078, "global_step": 254954, "epoch": 1517} {"train_loss": -11.617009162902832, "global_step": 254955, "epoch": 1517} {"train_loss": -12.040153503417969, "global_step": 254956, "epoch": 1517} {"train_loss": -12.086544036865234, "global_step": 254957, "epoch": 1517} {"train_loss": -11.797021865844727, "global_step": 254958, "epoch": 1517} {"train_loss": -11.947896003723145, "global_step": 254959, "epoch": 1517} {"train_loss": -12.061756134033203, "global_step": 254960, "epoch": 1517} {"train_loss": -11.942602157592773, "global_step": 254961, "epoch": 1517} {"train_loss": -11.032594680786133, "global_step": 254962, "epoch": 1517} {"train_loss": -11.715675354003906, "global_step": 254963, "epoch": 1517} {"train_loss": -11.589985847473145, "global_step": 254964, "epoch": 1517} {"train_loss": -11.823836326599121, "global_step": 254965, "epoch": 1517} {"train_loss": -11.58172607421875, "global_step": 254966, "epoch": 1517} {"train_loss": -11.377349853515625, "global_step": 254967, "epoch": 1517} {"train_loss": -11.529356956481934, "global_step": 254968, "epoch": 1517} {"train_loss": -11.963929176330566, "global_step": 254969, "epoch": 1517} {"train_loss": -11.384451866149902, "global_step": 254970, "epoch": 1517} {"train_loss": -11.796479225158691, "global_step": 254971, "epoch": 1517} {"train_loss": -11.605520248413086, "global_step": 254972, "epoch": 1517} {"train_loss": -11.081371307373047, "global_step": 254973, "epoch": 1517} {"train_loss": -11.246103286743164, "global_step": 254974, "epoch": 1517} {"train_loss": -11.564077377319336, "global_step": 254975, "epoch": 1517} {"train_loss": -10.578470230102539, "global_step": 254976, "epoch": 1517} {"train_loss": -11.822166442871094, "global_step": 254977, "epoch": 1517} {"train_loss": -11.308497428894043, "global_step": 254978, "epoch": 1517} {"train_loss": -10.724536895751953, "global_step": 254979, "epoch": 1517} {"train_loss": -10.598459243774414, "global_step": 254980, "epoch": 1517} {"train_loss": -11.74207878112793, "global_step": 254981, "epoch": 1517} {"train_loss": -10.604043960571289, "global_step": 254982, "epoch": 1517} {"train_loss": -11.873821258544922, "global_step": 254983, "epoch": 1517} {"train_loss": -11.002068519592285, "global_step": 254984, "epoch": 1517} {"train_loss": -11.689107894897461, "global_step": 254985, "epoch": 1517} {"train_loss": -11.201886177062988, "global_step": 254986, "epoch": 1517} {"train_loss": -11.463048934936523, "global_step": 254987, "epoch": 1517} {"train_loss": -11.437992095947266, "global_step": 254988, "epoch": 1517} {"train_loss": -11.275275230407715, "global_step": 254989, "epoch": 1517} {"train_loss": -11.75473403930664, "global_step": 254990, "epoch": 1517} {"train_loss": -10.97320556640625, "global_step": 254991, "epoch": 1517} {"train_loss": -11.44149112701416, "global_step": 254992, "epoch": 1517} {"train_loss": -11.74364185333252, "global_step": 254993, "epoch": 1517} {"train_loss": -10.847135543823242, "global_step": 254994, "epoch": 1517} {"train_loss": -11.557823181152344, "global_step": 254995, "epoch": 1517} {"train_loss": -11.056257247924805, "global_step": 254996, "epoch": 1517} {"train_loss": -11.154275894165039, "global_step": 254997, "epoch": 1517} {"train_loss": -11.239566802978516, "global_step": 254998, "epoch": 1517} {"train_loss": -11.424665451049805, "global_step": 254999, "epoch": 1517} {"train_loss": -11.588356971740723, "global_step": 255000, "epoch": 1517} {"train_loss": -10.811741828918457, "global_step": 255001, "epoch": 1517} {"train_loss": -11.854205131530762, "global_step": 255002, "epoch": 1517} {"train_loss": -10.759957313537598, "global_step": 255003, "epoch": 1517} {"train_loss": -11.500446319580078, "global_step": 255004, "epoch": 1517} {"train_loss": -11.363992691040039, "global_step": 255005, "epoch": 1517} {"train_loss": -11.21582317352295, "global_step": 255006, "epoch": 1517} {"train_loss": -11.450674057006836, "global_step": 255007, "epoch": 1517} {"train_loss": -11.453624725341797, "global_step": 255008, "epoch": 1517} {"train_loss": -11.604118347167969, "global_step": 255009, "epoch": 1517} {"train_loss": -11.26276683807373, "global_step": 255010, "epoch": 1517} {"train_loss": -11.405607223510742, "global_step": 255011, "epoch": 1517} {"train_loss": -11.317888259887695, "global_step": 255012, "epoch": 1517} {"train_loss": -11.540548324584961, "global_step": 255013, "epoch": 1517} {"train_loss": -11.370464324951172, "global_step": 255014, "epoch": 1517} {"train_loss": -11.758320808410645, "global_step": 255015, "epoch": 1517} {"train_loss": -11.504802703857422, "global_step": 255016, "epoch": 1517} {"train_loss": -11.88547420501709, "global_step": 255017, "epoch": 1517} {"train_loss": -11.17990493774414, "global_step": 255018, "epoch": 1517} {"train_loss": -11.310941696166992, "global_step": 255019, "epoch": 1517} {"train_loss": -11.668582916259766, "global_step": 255020, "epoch": 1517} {"train_loss": -11.261165618896484, "global_step": 255021, "epoch": 1517} {"train_loss": -11.601301193237305, "global_step": 255022, "epoch": 1517} {"train_loss": -11.63909109433492, "global_step": 255023, "epoch": 1517, "val_loss": 270028.65625} {"train_loss": -11.640499114990234, "global_step": 255024, "epoch": 1518} {"train_loss": -11.385191917419434, "global_step": 255025, "epoch": 1518} {"train_loss": -11.013877868652344, "global_step": 255026, "epoch": 1518} {"train_loss": -11.772624969482422, "global_step": 255027, "epoch": 1518} {"train_loss": -11.18414306640625, "global_step": 255028, "epoch": 1518} {"train_loss": -12.030726432800293, "global_step": 255029, "epoch": 1518} {"train_loss": -11.299181938171387, "global_step": 255030, "epoch": 1518} {"train_loss": -11.704662322998047, "global_step": 255031, "epoch": 1518} {"train_loss": -11.058664321899414, "global_step": 255032, "epoch": 1518} {"train_loss": -11.801709175109863, "global_step": 255033, "epoch": 1518} {"train_loss": -11.327747344970703, "global_step": 255034, "epoch": 1518} {"train_loss": -11.88879108428955, "global_step": 255035, "epoch": 1518} {"train_loss": -11.712834358215332, "global_step": 255036, "epoch": 1518} {"train_loss": -12.07243824005127, "global_step": 255037, "epoch": 1518} {"train_loss": -11.907489776611328, "global_step": 255038, "epoch": 1518} {"train_loss": -11.745538711547852, "global_step": 255039, "epoch": 1518} {"train_loss": -11.840375900268555, "global_step": 255040, "epoch": 1518} {"train_loss": -11.972707748413086, "global_step": 255041, "epoch": 1518} {"train_loss": -11.955228805541992, "global_step": 255042, "epoch": 1518} {"train_loss": -11.856678009033203, "global_step": 255043, "epoch": 1518} {"train_loss": -11.88038444519043, "global_step": 255044, "epoch": 1518} {"train_loss": -11.973400115966797, "global_step": 255045, "epoch": 1518} {"train_loss": -12.144296646118164, "global_step": 255046, "epoch": 1518} {"train_loss": -11.839790344238281, "global_step": 255047, "epoch": 1518} {"train_loss": -12.10356330871582, "global_step": 255048, "epoch": 1518} {"train_loss": -11.824061393737793, "global_step": 255049, "epoch": 1518} {"train_loss": -11.69359302520752, "global_step": 255050, "epoch": 1518} {"train_loss": -12.15346908569336, "global_step": 255051, "epoch": 1518} {"train_loss": -11.627971649169922, "global_step": 255052, "epoch": 1518} {"train_loss": -11.919574737548828, "global_step": 255053, "epoch": 1518} {"train_loss": -11.923730850219727, "global_step": 255054, "epoch": 1518} {"train_loss": -11.35955810546875, "global_step": 255055, "epoch": 1518} {"train_loss": -12.280010223388672, "global_step": 255056, "epoch": 1518} {"train_loss": -11.597421646118164, "global_step": 255057, "epoch": 1518} {"train_loss": -11.950774192810059, "global_step": 255058, "epoch": 1518} {"train_loss": -11.876826286315918, "global_step": 255059, "epoch": 1518} {"train_loss": -11.80327320098877, "global_step": 255060, "epoch": 1518} {"train_loss": -11.747821807861328, "global_step": 255061, "epoch": 1518} {"train_loss": -11.743400573730469, "global_step": 255062, "epoch": 1518} {"train_loss": -11.885285377502441, "global_step": 255063, "epoch": 1518} {"train_loss": -11.992650032043457, "global_step": 255064, "epoch": 1518} {"train_loss": -11.85120677947998, "global_step": 255065, "epoch": 1518} {"train_loss": -11.974946022033691, "global_step": 255066, "epoch": 1518} {"train_loss": -11.950492858886719, "global_step": 255067, "epoch": 1518} {"train_loss": -12.026679992675781, "global_step": 255068, "epoch": 1518} {"train_loss": -11.918258666992188, "global_step": 255069, "epoch": 1518} {"train_loss": -12.154071807861328, "global_step": 255070, "epoch": 1518} {"train_loss": -11.754989624023438, "global_step": 255071, "epoch": 1518} {"train_loss": -12.021980285644531, "global_step": 255072, "epoch": 1518} {"train_loss": -12.117382049560547, "global_step": 255073, "epoch": 1518} {"train_loss": -11.755836486816406, "global_step": 255074, "epoch": 1518} {"train_loss": -12.045881271362305, "global_step": 255075, "epoch": 1518} {"train_loss": -11.888720512390137, "global_step": 255076, "epoch": 1518} {"train_loss": -11.941965103149414, "global_step": 255077, "epoch": 1518} {"train_loss": -12.149816513061523, "global_step": 255078, "epoch": 1518} {"train_loss": -11.830374717712402, "global_step": 255079, "epoch": 1518} {"train_loss": -11.349973678588867, "global_step": 255080, "epoch": 1518} {"train_loss": -11.656498908996582, "global_step": 255081, "epoch": 1518} {"train_loss": -11.989419937133789, "global_step": 255082, "epoch": 1518} {"train_loss": -11.329713821411133, "global_step": 255083, "epoch": 1518} {"train_loss": -12.135910034179688, "global_step": 255084, "epoch": 1518} {"train_loss": -11.330025672912598, "global_step": 255085, "epoch": 1518} {"train_loss": -11.31939697265625, "global_step": 255086, "epoch": 1518} {"train_loss": -11.492362022399902, "global_step": 255087, "epoch": 1518} {"train_loss": -11.331385612487793, "global_step": 255088, "epoch": 1518} {"train_loss": -10.320699691772461, "global_step": 255089, "epoch": 1518} {"train_loss": -9.58655834197998, "global_step": 255090, "epoch": 1518} {"train_loss": -11.52669906616211, "global_step": 255091, "epoch": 1518} {"train_loss": -10.094078063964844, "global_step": 255092, "epoch": 1518} {"train_loss": -10.315780639648438, "global_step": 255093, "epoch": 1518} {"train_loss": -10.543590545654297, "global_step": 255094, "epoch": 1518} {"train_loss": -10.899169921875, "global_step": 255095, "epoch": 1518} {"train_loss": -10.72171401977539, "global_step": 255096, "epoch": 1518} {"train_loss": -10.681290626525879, "global_step": 255097, "epoch": 1518} {"train_loss": -10.992105484008789, "global_step": 255098, "epoch": 1518} {"train_loss": -10.47851276397705, "global_step": 255099, "epoch": 1518} {"train_loss": -11.07158374786377, "global_step": 255100, "epoch": 1518} {"train_loss": -10.834630012512207, "global_step": 255101, "epoch": 1518} {"train_loss": -11.100227355957031, "global_step": 255102, "epoch": 1518} {"train_loss": -11.311163902282715, "global_step": 255103, "epoch": 1518} {"train_loss": -10.776954650878906, "global_step": 255104, "epoch": 1518} {"train_loss": -11.536975860595703, "global_step": 255105, "epoch": 1518} {"train_loss": -11.073722839355469, "global_step": 255106, "epoch": 1518} {"train_loss": -11.350566864013672, "global_step": 255107, "epoch": 1518} {"train_loss": -11.078865051269531, "global_step": 255108, "epoch": 1518} {"train_loss": -11.16379451751709, "global_step": 255109, "epoch": 1518} {"train_loss": -11.546173095703125, "global_step": 255110, "epoch": 1518} {"train_loss": -11.363879203796387, "global_step": 255111, "epoch": 1518} {"train_loss": -11.496082305908203, "global_step": 255112, "epoch": 1518} {"train_loss": -11.420249938964844, "global_step": 255113, "epoch": 1518} {"train_loss": -11.491676330566406, "global_step": 255114, "epoch": 1518} {"train_loss": -11.672921180725098, "global_step": 255115, "epoch": 1518} {"train_loss": -11.654273986816406, "global_step": 255116, "epoch": 1518} {"train_loss": -11.266326904296875, "global_step": 255117, "epoch": 1518} {"train_loss": -11.579657554626465, "global_step": 255118, "epoch": 1518} {"train_loss": -11.064390182495117, "global_step": 255119, "epoch": 1518} {"train_loss": -11.349488258361816, "global_step": 255120, "epoch": 1518} {"train_loss": -11.457038879394531, "global_step": 255121, "epoch": 1518} {"train_loss": -11.079995155334473, "global_step": 255122, "epoch": 1518} {"train_loss": -11.844595909118652, "global_step": 255123, "epoch": 1518} {"train_loss": -11.52511978149414, "global_step": 255124, "epoch": 1518} {"train_loss": -11.754707336425781, "global_step": 255125, "epoch": 1518} {"train_loss": -11.546009063720703, "global_step": 255126, "epoch": 1518} {"train_loss": -11.972660064697266, "global_step": 255127, "epoch": 1518} {"train_loss": -11.744708061218262, "global_step": 255128, "epoch": 1518} {"train_loss": -11.781124114990234, "global_step": 255129, "epoch": 1518} {"train_loss": -11.753519058227539, "global_step": 255130, "epoch": 1518} {"train_loss": -11.89462661743164, "global_step": 255131, "epoch": 1518} {"train_loss": -11.681146621704102, "global_step": 255132, "epoch": 1518} {"train_loss": -11.78004264831543, "global_step": 255133, "epoch": 1518} {"train_loss": -11.765830993652344, "global_step": 255134, "epoch": 1518} {"train_loss": -11.669069290161133, "global_step": 255135, "epoch": 1518} {"train_loss": -11.747533798217773, "global_step": 255136, "epoch": 1518} {"train_loss": -11.892478942871094, "global_step": 255137, "epoch": 1518} {"train_loss": -11.47186279296875, "global_step": 255138, "epoch": 1518} {"train_loss": -11.31179141998291, "global_step": 255139, "epoch": 1518} {"train_loss": -11.580877304077148, "global_step": 255140, "epoch": 1518} {"train_loss": -11.277109146118164, "global_step": 255141, "epoch": 1518} {"train_loss": -11.709785461425781, "global_step": 255142, "epoch": 1518} {"train_loss": -11.214771270751953, "global_step": 255143, "epoch": 1518} {"train_loss": -11.495214462280273, "global_step": 255144, "epoch": 1518} {"train_loss": -11.133624076843262, "global_step": 255145, "epoch": 1518} {"train_loss": -11.638973236083984, "global_step": 255146, "epoch": 1518} {"train_loss": -11.394427299499512, "global_step": 255147, "epoch": 1518} {"train_loss": -11.500404357910156, "global_step": 255148, "epoch": 1518} {"train_loss": -11.54537582397461, "global_step": 255149, "epoch": 1518} {"train_loss": -11.758668899536133, "global_step": 255150, "epoch": 1518} {"train_loss": -11.512833595275879, "global_step": 255151, "epoch": 1518} {"train_loss": -11.28193473815918, "global_step": 255152, "epoch": 1518} {"train_loss": -11.771528244018555, "global_step": 255153, "epoch": 1518} {"train_loss": -11.625149726867676, "global_step": 255154, "epoch": 1518} {"train_loss": -11.645895004272461, "global_step": 255155, "epoch": 1518} {"train_loss": -11.801362991333008, "global_step": 255156, "epoch": 1518} {"train_loss": -11.950206756591797, "global_step": 255157, "epoch": 1518} {"train_loss": -11.905855178833008, "global_step": 255158, "epoch": 1518} {"train_loss": -11.887478828430176, "global_step": 255159, "epoch": 1518} {"train_loss": -11.873676300048828, "global_step": 255160, "epoch": 1518} {"train_loss": -11.992016792297363, "global_step": 255161, "epoch": 1518} {"train_loss": -11.969402313232422, "global_step": 255162, "epoch": 1518} {"train_loss": -11.787900924682617, "global_step": 255163, "epoch": 1518} {"train_loss": -11.91208267211914, "global_step": 255164, "epoch": 1518} {"train_loss": -12.048227310180664, "global_step": 255165, "epoch": 1518} {"train_loss": -11.536638259887695, "global_step": 255166, "epoch": 1518} {"train_loss": -12.059255599975586, "global_step": 255167, "epoch": 1518} {"train_loss": -12.082280158996582, "global_step": 255168, "epoch": 1518} {"train_loss": -11.915865898132324, "global_step": 255169, "epoch": 1518} {"train_loss": -12.023040771484375, "global_step": 255170, "epoch": 1518} {"train_loss": -11.928711891174316, "global_step": 255171, "epoch": 1518} {"train_loss": -11.80151081085205, "global_step": 255172, "epoch": 1518} {"train_loss": -11.943975448608398, "global_step": 255173, "epoch": 1518} {"train_loss": -12.142989158630371, "global_step": 255174, "epoch": 1518} {"train_loss": -12.05368423461914, "global_step": 255175, "epoch": 1518} {"train_loss": -12.025711059570312, "global_step": 255176, "epoch": 1518} {"train_loss": -12.099224090576172, "global_step": 255177, "epoch": 1518} {"train_loss": -11.979846000671387, "global_step": 255178, "epoch": 1518} {"train_loss": -12.032740592956543, "global_step": 255179, "epoch": 1518} {"train_loss": -11.932798385620117, "global_step": 255180, "epoch": 1518} {"train_loss": -12.241386413574219, "global_step": 255181, "epoch": 1518} {"train_loss": -12.036863327026367, "global_step": 255182, "epoch": 1518} {"train_loss": -12.049070358276367, "global_step": 255183, "epoch": 1518} {"train_loss": -12.124858856201172, "global_step": 255184, "epoch": 1518} {"train_loss": -11.776883125305176, "global_step": 255185, "epoch": 1518} {"train_loss": -11.72055721282959, "global_step": 255186, "epoch": 1518} {"train_loss": -11.722911834716797, "global_step": 255187, "epoch": 1518} {"train_loss": -12.110513687133789, "global_step": 255188, "epoch": 1518} {"train_loss": -11.931680679321289, "global_step": 255189, "epoch": 1518} {"train_loss": -11.981096267700195, "global_step": 255190, "epoch": 1518} {"train_loss": -11.638329068819681, "global_step": 255191, "epoch": 1518, "val_loss": 265982.375} {"train_loss": -11.250426292419434, "global_step": 255192, "epoch": 1519} {"train_loss": -11.302839279174805, "global_step": 255193, "epoch": 1519} {"train_loss": -11.68067741394043, "global_step": 255194, "epoch": 1519} {"train_loss": -10.503070831298828, "global_step": 255195, "epoch": 1519} {"train_loss": -9.991321563720703, "global_step": 255196, "epoch": 1519} {"train_loss": -11.333429336547852, "global_step": 255197, "epoch": 1519} {"train_loss": -8.979187965393066, "global_step": 255198, "epoch": 1519} {"train_loss": -8.241661071777344, "global_step": 255199, "epoch": 1519} {"train_loss": -9.43323040008545, "global_step": 255200, "epoch": 1519} {"train_loss": -9.709796905517578, "global_step": 255201, "epoch": 1519} {"train_loss": -9.402966499328613, "global_step": 255202, "epoch": 1519} {"train_loss": -8.7406005859375, "global_step": 255203, "epoch": 1519} {"train_loss": -9.866048812866211, "global_step": 255204, "epoch": 1519} {"train_loss": -9.578282356262207, "global_step": 255205, "epoch": 1519} {"train_loss": -10.714873313903809, "global_step": 255206, "epoch": 1519} {"train_loss": -9.899881362915039, "global_step": 255207, "epoch": 1519} {"train_loss": -11.168647766113281, "global_step": 255208, "epoch": 1519} {"train_loss": -10.499757766723633, "global_step": 255209, "epoch": 1519} {"train_loss": -11.00278377532959, "global_step": 255210, "epoch": 1519} {"train_loss": -9.942588806152344, "global_step": 255211, "epoch": 1519} {"train_loss": -10.557302474975586, "global_step": 255212, "epoch": 1519} {"train_loss": -10.728187561035156, "global_step": 255213, "epoch": 1519} {"train_loss": -11.36113166809082, "global_step": 255214, "epoch": 1519} {"train_loss": -11.092466354370117, "global_step": 255215, "epoch": 1519} {"train_loss": -11.247404098510742, "global_step": 255216, "epoch": 1519} {"train_loss": -10.768817901611328, "global_step": 255217, "epoch": 1519} {"train_loss": -11.440901756286621, "global_step": 255218, "epoch": 1519} {"train_loss": -11.07823371887207, "global_step": 255219, "epoch": 1519} {"train_loss": -11.352231979370117, "global_step": 255220, "epoch": 1519} {"train_loss": -10.906396865844727, "global_step": 255221, "epoch": 1519} {"train_loss": -11.128649711608887, "global_step": 255222, "epoch": 1519} {"train_loss": -11.02138614654541, "global_step": 255223, "epoch": 1519} {"train_loss": -11.408821105957031, "global_step": 255224, "epoch": 1519} {"train_loss": -11.05889892578125, "global_step": 255225, "epoch": 1519} {"train_loss": -11.523772239685059, "global_step": 255226, "epoch": 1519} {"train_loss": -10.611828804016113, "global_step": 255227, "epoch": 1519} {"train_loss": -11.737495422363281, "global_step": 255228, "epoch": 1519} {"train_loss": -11.036823272705078, "global_step": 255229, "epoch": 1519} {"train_loss": -11.469858169555664, "global_step": 255230, "epoch": 1519} {"train_loss": -11.470779418945312, "global_step": 255231, "epoch": 1519} {"train_loss": -10.889856338500977, "global_step": 255232, "epoch": 1519} {"train_loss": -11.34913444519043, "global_step": 255233, "epoch": 1519} {"train_loss": -11.357736587524414, "global_step": 255234, "epoch": 1519} {"train_loss": -11.364555358886719, "global_step": 255235, "epoch": 1519} {"train_loss": -11.101550102233887, "global_step": 255236, "epoch": 1519} {"train_loss": -11.660224914550781, "global_step": 255237, "epoch": 1519} {"train_loss": -11.45833969116211, "global_step": 255238, "epoch": 1519} {"train_loss": -11.448083877563477, "global_step": 255239, "epoch": 1519} {"train_loss": -11.752082824707031, "global_step": 255240, "epoch": 1519} {"train_loss": -11.229436874389648, "global_step": 255241, "epoch": 1519} {"train_loss": -11.616607666015625, "global_step": 255242, "epoch": 1519} {"train_loss": -11.738126754760742, "global_step": 255243, "epoch": 1519} {"train_loss": -11.88031005859375, "global_step": 255244, "epoch": 1519} {"train_loss": -11.50207233428955, "global_step": 255245, "epoch": 1519} {"train_loss": -11.343719482421875, "global_step": 255246, "epoch": 1519} {"train_loss": -11.538371086120605, "global_step": 255247, "epoch": 1519} {"train_loss": -11.578493118286133, "global_step": 255248, "epoch": 1519} {"train_loss": -11.698575019836426, "global_step": 255249, "epoch": 1519} {"train_loss": -11.398059844970703, "global_step": 255250, "epoch": 1519} {"train_loss": -11.55357837677002, "global_step": 255251, "epoch": 1519} {"train_loss": -11.598901748657227, "global_step": 255252, "epoch": 1519} {"train_loss": -11.537355422973633, "global_step": 255253, "epoch": 1519} {"train_loss": -11.545689582824707, "global_step": 255254, "epoch": 1519} {"train_loss": -12.08900260925293, "global_step": 255255, "epoch": 1519} {"train_loss": -11.760941505432129, "global_step": 255256, "epoch": 1519} {"train_loss": -11.87309455871582, "global_step": 255257, "epoch": 1519} {"train_loss": -12.009679794311523, "global_step": 255258, "epoch": 1519} {"train_loss": -11.752976417541504, "global_step": 255259, "epoch": 1519} {"train_loss": -11.94063949584961, "global_step": 255260, "epoch": 1519} {"train_loss": -11.93624210357666, "global_step": 255261, "epoch": 1519} {"train_loss": -11.92195987701416, "global_step": 255262, "epoch": 1519} {"train_loss": -11.822602272033691, "global_step": 255263, "epoch": 1519} {"train_loss": -11.911048889160156, "global_step": 255264, "epoch": 1519} {"train_loss": -11.993491172790527, "global_step": 255265, "epoch": 1519} {"train_loss": -11.926542282104492, "global_step": 255266, "epoch": 1519} {"train_loss": -12.005050659179688, "global_step": 255267, "epoch": 1519} {"train_loss": -11.655280113220215, "global_step": 255268, "epoch": 1519} {"train_loss": -11.76911735534668, "global_step": 255269, "epoch": 1519} {"train_loss": -11.51720142364502, "global_step": 255270, "epoch": 1519} {"train_loss": -11.775073051452637, "global_step": 255271, "epoch": 1519} {"train_loss": -11.740363121032715, "global_step": 255272, "epoch": 1519} {"train_loss": -11.678913116455078, "global_step": 255273, "epoch": 1519} {"train_loss": -11.926382064819336, "global_step": 255274, "epoch": 1519} {"train_loss": -11.688993453979492, "global_step": 255275, "epoch": 1519} {"train_loss": -11.738407135009766, "global_step": 255276, "epoch": 1519} {"train_loss": -11.744989395141602, "global_step": 255277, "epoch": 1519} {"train_loss": -12.086893081665039, "global_step": 255278, "epoch": 1519} {"train_loss": -11.705063819885254, "global_step": 255279, "epoch": 1519} {"train_loss": -11.828335762023926, "global_step": 255280, "epoch": 1519} {"train_loss": -11.377593994140625, "global_step": 255281, "epoch": 1519} {"train_loss": -11.929666519165039, "global_step": 255282, "epoch": 1519} {"train_loss": -11.531326293945312, "global_step": 255283, "epoch": 1519} {"train_loss": -11.898191452026367, "global_step": 255284, "epoch": 1519} {"train_loss": -11.719038009643555, "global_step": 255285, "epoch": 1519} {"train_loss": -12.22224235534668, "global_step": 255286, "epoch": 1519} {"train_loss": -11.895368576049805, "global_step": 255287, "epoch": 1519} {"train_loss": -11.888455390930176, "global_step": 255288, "epoch": 1519} {"train_loss": -11.629131317138672, "global_step": 255289, "epoch": 1519} {"train_loss": -11.029712677001953, "global_step": 255290, "epoch": 1519} {"train_loss": -11.816718101501465, "global_step": 255291, "epoch": 1519} {"train_loss": -11.903541564941406, "global_step": 255292, "epoch": 1519} {"train_loss": -11.515178680419922, "global_step": 255293, "epoch": 1519} {"train_loss": -11.625896453857422, "global_step": 255294, "epoch": 1519} {"train_loss": -11.410850524902344, "global_step": 255295, "epoch": 1519} {"train_loss": -11.580137252807617, "global_step": 255296, "epoch": 1519} {"train_loss": -10.300539016723633, "global_step": 255297, "epoch": 1519} {"train_loss": -10.231854438781738, "global_step": 255298, "epoch": 1519} {"train_loss": -9.234617233276367, "global_step": 255299, "epoch": 1519} {"train_loss": -10.121909141540527, "global_step": 255300, "epoch": 1519} {"train_loss": -9.107305526733398, "global_step": 255301, "epoch": 1519} {"train_loss": -9.978388786315918, "global_step": 255302, "epoch": 1519} {"train_loss": -10.047128677368164, "global_step": 255303, "epoch": 1519} {"train_loss": -11.006553649902344, "global_step": 255304, "epoch": 1519} {"train_loss": -10.299175262451172, "global_step": 255305, "epoch": 1519} {"train_loss": -10.694039344787598, "global_step": 255306, "epoch": 1519} {"train_loss": -9.415055274963379, "global_step": 255307, "epoch": 1519} {"train_loss": -10.829485893249512, "global_step": 255308, "epoch": 1519} {"train_loss": -10.259842872619629, "global_step": 255309, "epoch": 1519} {"train_loss": -10.853556632995605, "global_step": 255310, "epoch": 1519} {"train_loss": -10.8438720703125, "global_step": 255311, "epoch": 1519} {"train_loss": -11.003133773803711, "global_step": 255312, "epoch": 1519} {"train_loss": -10.882430076599121, "global_step": 255313, "epoch": 1519} {"train_loss": -11.027425765991211, "global_step": 255314, "epoch": 1519} {"train_loss": -11.213732719421387, "global_step": 255315, "epoch": 1519} {"train_loss": -11.47708511352539, "global_step": 255316, "epoch": 1519} {"train_loss": -11.124540328979492, "global_step": 255317, "epoch": 1519} {"train_loss": -11.028707504272461, "global_step": 255318, "epoch": 1519} {"train_loss": -11.400445938110352, "global_step": 255319, "epoch": 1519} {"train_loss": -11.050167083740234, "global_step": 255320, "epoch": 1519} {"train_loss": -11.578285217285156, "global_step": 255321, "epoch": 1519} {"train_loss": -11.075439453125, "global_step": 255322, "epoch": 1519} {"train_loss": -11.2189302444458, "global_step": 255323, "epoch": 1519} {"train_loss": -11.755270004272461, "global_step": 255324, "epoch": 1519} {"train_loss": -10.995384216308594, "global_step": 255325, "epoch": 1519} {"train_loss": -11.605619430541992, "global_step": 255326, "epoch": 1519} {"train_loss": -11.177018165588379, "global_step": 255327, "epoch": 1519} {"train_loss": -11.504213333129883, "global_step": 255328, "epoch": 1519} {"train_loss": -11.240111351013184, "global_step": 255329, "epoch": 1519} {"train_loss": -11.70142650604248, "global_step": 255330, "epoch": 1519} {"train_loss": -11.61705493927002, "global_step": 255331, "epoch": 1519} {"train_loss": -11.743447303771973, "global_step": 255332, "epoch": 1519} {"train_loss": -11.509082794189453, "global_step": 255333, "epoch": 1519} {"train_loss": -11.74966812133789, "global_step": 255334, "epoch": 1519} {"train_loss": -11.579303741455078, "global_step": 255335, "epoch": 1519} {"train_loss": -11.694183349609375, "global_step": 255336, "epoch": 1519} {"train_loss": -11.929393768310547, "global_step": 255337, "epoch": 1519} {"train_loss": -11.607526779174805, "global_step": 255338, "epoch": 1519} {"train_loss": -11.776991844177246, "global_step": 255339, "epoch": 1519} {"train_loss": -11.882181167602539, "global_step": 255340, "epoch": 1519} {"train_loss": -11.85693645477295, "global_step": 255341, "epoch": 1519} {"train_loss": -11.875433921813965, "global_step": 255342, "epoch": 1519} {"train_loss": -11.88851547241211, "global_step": 255343, "epoch": 1519} {"train_loss": -11.855358123779297, "global_step": 255344, "epoch": 1519} {"train_loss": -11.82335376739502, "global_step": 255345, "epoch": 1519} {"train_loss": -12.002388000488281, "global_step": 255346, "epoch": 1519} {"train_loss": -11.948301315307617, "global_step": 255347, "epoch": 1519} {"train_loss": -12.028532028198242, "global_step": 255348, "epoch": 1519} {"train_loss": -12.10185432434082, "global_step": 255349, "epoch": 1519} {"train_loss": -12.118768692016602, "global_step": 255350, "epoch": 1519} {"train_loss": -11.98315715789795, "global_step": 255351, "epoch": 1519} {"train_loss": -12.100984573364258, "global_step": 255352, "epoch": 1519} {"train_loss": -11.997672080993652, "global_step": 255353, "epoch": 1519} {"train_loss": -11.756036758422852, "global_step": 255354, "epoch": 1519} {"train_loss": -11.980485916137695, "global_step": 255355, "epoch": 1519} {"train_loss": -12.144497871398926, "global_step": 255356, "epoch": 1519} {"train_loss": -12.072898864746094, "global_step": 255357, "epoch": 1519} {"train_loss": -12.23581314086914, "global_step": 255358, "epoch": 1519} {"train_loss": -11.293092477889289, "global_step": 255359, "epoch": 1519, "val_loss": 269122.8125} {"train_loss": -12.183491706848145, "global_step": 255360, "epoch": 1520} {"train_loss": -12.10621452331543, "global_step": 255361, "epoch": 1520} {"train_loss": -12.010849952697754, "global_step": 255362, "epoch": 1520} {"train_loss": -12.095821380615234, "global_step": 255363, "epoch": 1520} {"train_loss": -12.124069213867188, "global_step": 255364, "epoch": 1520} {"train_loss": -12.028968811035156, "global_step": 255365, "epoch": 1520} {"train_loss": -12.18933391571045, "global_step": 255366, "epoch": 1520} {"train_loss": -12.092484474182129, "global_step": 255367, "epoch": 1520} {"train_loss": -11.857285499572754, "global_step": 255368, "epoch": 1520} {"train_loss": -12.156694412231445, "global_step": 255369, "epoch": 1520} {"train_loss": -11.855003356933594, "global_step": 255370, "epoch": 1520} {"train_loss": -12.054731369018555, "global_step": 255371, "epoch": 1520} {"train_loss": -12.127206802368164, "global_step": 255372, "epoch": 1520} {"train_loss": -12.114309310913086, "global_step": 255373, "epoch": 1520} {"train_loss": -12.284736633300781, "global_step": 255374, "epoch": 1520} {"train_loss": -12.318008422851562, "global_step": 255375, "epoch": 1520} {"train_loss": -12.282269477844238, "global_step": 255376, "epoch": 1520} {"train_loss": -12.29739761352539, "global_step": 255377, "epoch": 1520} {"train_loss": -12.298812866210938, "global_step": 255378, "epoch": 1520} {"train_loss": -12.399968147277832, "global_step": 255379, "epoch": 1520} {"train_loss": -12.253668785095215, "global_step": 255380, "epoch": 1520} {"train_loss": -12.054244995117188, "global_step": 255381, "epoch": 1520} {"train_loss": -12.171028137207031, "global_step": 255382, "epoch": 1520} {"train_loss": -12.260932922363281, "global_step": 255383, "epoch": 1520} {"train_loss": -12.026297569274902, "global_step": 255384, "epoch": 1520} {"train_loss": -12.204330444335938, "global_step": 255385, "epoch": 1520} {"train_loss": -12.280145645141602, "global_step": 255386, "epoch": 1520} {"train_loss": -12.11014461517334, "global_step": 255387, "epoch": 1520} {"train_loss": -12.291629791259766, "global_step": 255388, "epoch": 1520} {"train_loss": -12.116268157958984, "global_step": 255389, "epoch": 1520} {"train_loss": -12.182674407958984, "global_step": 255390, "epoch": 1520} {"train_loss": -12.102235794067383, "global_step": 255391, "epoch": 1520} {"train_loss": -11.564460754394531, "global_step": 255392, "epoch": 1520} {"train_loss": -12.14027214050293, "global_step": 255393, "epoch": 1520} {"train_loss": -12.119636535644531, "global_step": 255394, "epoch": 1520} {"train_loss": -11.775754928588867, "global_step": 255395, "epoch": 1520} {"train_loss": -12.122968673706055, "global_step": 255396, "epoch": 1520} {"train_loss": -11.948589324951172, "global_step": 255397, "epoch": 1520} {"train_loss": -11.921534538269043, "global_step": 255398, "epoch": 1520} {"train_loss": -11.97337818145752, "global_step": 255399, "epoch": 1520} {"train_loss": -12.245441436767578, "global_step": 255400, "epoch": 1520} {"train_loss": -11.480835914611816, "global_step": 255401, "epoch": 1520} {"train_loss": -11.884654998779297, "global_step": 255402, "epoch": 1520} {"train_loss": -11.87674331665039, "global_step": 255403, "epoch": 1520} {"train_loss": -11.2503662109375, "global_step": 255404, "epoch": 1520} {"train_loss": -10.334108352661133, "global_step": 255405, "epoch": 1520} {"train_loss": -9.829865455627441, "global_step": 255406, "epoch": 1520} {"train_loss": -11.096100807189941, "global_step": 255407, "epoch": 1520} {"train_loss": -8.169610977172852, "global_step": 255408, "epoch": 1520} {"train_loss": -10.188932418823242, "global_step": 255409, "epoch": 1520} {"train_loss": -9.38550853729248, "global_step": 255410, "epoch": 1520} {"train_loss": -9.856680870056152, "global_step": 255411, "epoch": 1520} {"train_loss": -9.827640533447266, "global_step": 255412, "epoch": 1520} {"train_loss": -10.00068473815918, "global_step": 255413, "epoch": 1520} {"train_loss": -10.856884002685547, "global_step": 255414, "epoch": 1520} {"train_loss": -8.949302673339844, "global_step": 255415, "epoch": 1520} {"train_loss": -10.376588821411133, "global_step": 255416, "epoch": 1520} {"train_loss": -8.95844841003418, "global_step": 255417, "epoch": 1520} {"train_loss": -11.037910461425781, "global_step": 255418, "epoch": 1520} {"train_loss": -10.630988121032715, "global_step": 255419, "epoch": 1520} {"train_loss": -10.761469841003418, "global_step": 255420, "epoch": 1520} {"train_loss": -10.893598556518555, "global_step": 255421, "epoch": 1520} {"train_loss": -10.590303421020508, "global_step": 255422, "epoch": 1520} {"train_loss": -10.94540023803711, "global_step": 255423, "epoch": 1520} {"train_loss": -11.055392265319824, "global_step": 255424, "epoch": 1520} {"train_loss": -10.38792610168457, "global_step": 255425, "epoch": 1520} {"train_loss": -10.833377838134766, "global_step": 255426, "epoch": 1520} {"train_loss": -11.017790794372559, "global_step": 255427, "epoch": 1520} {"train_loss": -11.376588821411133, "global_step": 255428, "epoch": 1520} {"train_loss": -10.71246337890625, "global_step": 255429, "epoch": 1520} {"train_loss": -11.405116081237793, "global_step": 255430, "epoch": 1520} {"train_loss": -11.24815559387207, "global_step": 255431, "epoch": 1520} {"train_loss": -11.177214622497559, "global_step": 255432, "epoch": 1520} {"train_loss": -11.516701698303223, "global_step": 255433, "epoch": 1520} {"train_loss": -11.341558456420898, "global_step": 255434, "epoch": 1520} {"train_loss": -11.51627254486084, "global_step": 255435, "epoch": 1520} {"train_loss": -11.20174503326416, "global_step": 255436, "epoch": 1520} {"train_loss": -11.582046508789062, "global_step": 255437, "epoch": 1520} {"train_loss": -11.114042282104492, "global_step": 255438, "epoch": 1520} {"train_loss": -11.505769729614258, "global_step": 255439, "epoch": 1520} {"train_loss": -11.234153747558594, "global_step": 255440, "epoch": 1520} {"train_loss": -11.476476669311523, "global_step": 255441, "epoch": 1520} {"train_loss": -11.175399780273438, "global_step": 255442, "epoch": 1520} {"train_loss": -11.700872421264648, "global_step": 255443, "epoch": 1520} {"train_loss": -11.497421264648438, "global_step": 255444, "epoch": 1520} {"train_loss": -11.510360717773438, "global_step": 255445, "epoch": 1520} {"train_loss": -11.636184692382812, "global_step": 255446, "epoch": 1520} {"train_loss": -11.680655479431152, "global_step": 255447, "epoch": 1520} {"train_loss": -11.831426620483398, "global_step": 255448, "epoch": 1520} {"train_loss": -11.585676193237305, "global_step": 255449, "epoch": 1520} {"train_loss": -11.534297943115234, "global_step": 255450, "epoch": 1520} {"train_loss": -11.890718460083008, "global_step": 255451, "epoch": 1520} {"train_loss": -11.590972900390625, "global_step": 255452, "epoch": 1520} {"train_loss": -12.068581581115723, "global_step": 255453, "epoch": 1520} {"train_loss": -11.631654739379883, "global_step": 255454, "epoch": 1520} {"train_loss": -11.875219345092773, "global_step": 255455, "epoch": 1520} {"train_loss": -11.913987159729004, "global_step": 255456, "epoch": 1520} {"train_loss": -11.884679794311523, "global_step": 255457, "epoch": 1520} {"train_loss": -11.707540512084961, "global_step": 255458, "epoch": 1520} {"train_loss": -11.780843734741211, "global_step": 255459, "epoch": 1520} {"train_loss": -11.732983589172363, "global_step": 255460, "epoch": 1520} {"train_loss": -11.366703033447266, "global_step": 255461, "epoch": 1520} {"train_loss": -11.738119125366211, "global_step": 255462, "epoch": 1520} {"train_loss": -11.610837936401367, "global_step": 255463, "epoch": 1520} {"train_loss": -11.578126907348633, "global_step": 255464, "epoch": 1520} {"train_loss": -11.973348617553711, "global_step": 255465, "epoch": 1520} {"train_loss": -11.814291000366211, "global_step": 255466, "epoch": 1520} {"train_loss": -11.877737045288086, "global_step": 255467, "epoch": 1520} {"train_loss": -11.525779724121094, "global_step": 255468, "epoch": 1520} {"train_loss": -11.657791137695312, "global_step": 255469, "epoch": 1520} {"train_loss": -11.716303825378418, "global_step": 255470, "epoch": 1520} {"train_loss": -11.832298278808594, "global_step": 255471, "epoch": 1520} {"train_loss": -11.854175567626953, "global_step": 255472, "epoch": 1520} {"train_loss": -11.87220573425293, "global_step": 255473, "epoch": 1520} {"train_loss": -11.691680908203125, "global_step": 255474, "epoch": 1520} {"train_loss": -11.78617000579834, "global_step": 255475, "epoch": 1520} {"train_loss": -11.79112434387207, "global_step": 255476, "epoch": 1520} {"train_loss": -11.864032745361328, "global_step": 255477, "epoch": 1520} {"train_loss": -11.414371490478516, "global_step": 255478, "epoch": 1520} {"train_loss": -12.089300155639648, "global_step": 255479, "epoch": 1520} {"train_loss": -11.588386535644531, "global_step": 255480, "epoch": 1520} {"train_loss": -12.02811050415039, "global_step": 255481, "epoch": 1520} {"train_loss": -11.811553955078125, "global_step": 255482, "epoch": 1520} {"train_loss": -11.944416046142578, "global_step": 255483, "epoch": 1520} {"train_loss": -11.806767463684082, "global_step": 255484, "epoch": 1520} {"train_loss": -11.766965866088867, "global_step": 255485, "epoch": 1520} {"train_loss": -11.917920112609863, "global_step": 255486, "epoch": 1520} {"train_loss": -11.886999130249023, "global_step": 255487, "epoch": 1520} {"train_loss": -11.905543327331543, "global_step": 255488, "epoch": 1520} {"train_loss": -11.952132225036621, "global_step": 255489, "epoch": 1520} {"train_loss": -12.228925704956055, "global_step": 255490, "epoch": 1520} {"train_loss": -11.949472427368164, "global_step": 255491, "epoch": 1520} {"train_loss": -12.061147689819336, "global_step": 255492, "epoch": 1520} {"train_loss": -11.854782104492188, "global_step": 255493, "epoch": 1520} {"train_loss": -11.972933769226074, "global_step": 255494, "epoch": 1520} {"train_loss": -12.270493507385254, "global_step": 255495, "epoch": 1520} {"train_loss": -12.075139999389648, "global_step": 255496, "epoch": 1520} {"train_loss": -12.072153091430664, "global_step": 255497, "epoch": 1520} {"train_loss": -12.144563674926758, "global_step": 255498, "epoch": 1520} {"train_loss": -12.12480640411377, "global_step": 255499, "epoch": 1520} {"train_loss": -11.986444473266602, "global_step": 255500, "epoch": 1520} {"train_loss": -11.978682518005371, "global_step": 255501, "epoch": 1520} {"train_loss": -12.093488693237305, "global_step": 255502, "epoch": 1520} {"train_loss": -12.171483039855957, "global_step": 255503, "epoch": 1520} {"train_loss": -12.07218074798584, "global_step": 255504, "epoch": 1520} {"train_loss": -12.18856430053711, "global_step": 255505, "epoch": 1520} {"train_loss": -12.071399688720703, "global_step": 255506, "epoch": 1520} {"train_loss": -11.987203598022461, "global_step": 255507, "epoch": 1520} {"train_loss": -12.237165451049805, "global_step": 255508, "epoch": 1520} {"train_loss": -12.064077377319336, "global_step": 255509, "epoch": 1520} {"train_loss": -12.32204818725586, "global_step": 255510, "epoch": 1520} {"train_loss": -12.147560119628906, "global_step": 255511, "epoch": 1520} {"train_loss": -12.124078750610352, "global_step": 255512, "epoch": 1520} {"train_loss": -12.300939559936523, "global_step": 255513, "epoch": 1520} {"train_loss": -12.058281898498535, "global_step": 255514, "epoch": 1520} {"train_loss": -12.227679252624512, "global_step": 255515, "epoch": 1520} {"train_loss": -12.330467224121094, "global_step": 255516, "epoch": 1520} {"train_loss": -12.258956909179688, "global_step": 255517, "epoch": 1520} {"train_loss": -12.173571586608887, "global_step": 255518, "epoch": 1520} {"train_loss": -12.262595176696777, "global_step": 255519, "epoch": 1520} {"train_loss": -12.222830772399902, "global_step": 255520, "epoch": 1520} {"train_loss": -12.307710647583008, "global_step": 255521, "epoch": 1520} {"train_loss": -12.228885650634766, "global_step": 255522, "epoch": 1520} {"train_loss": -12.118375778198242, "global_step": 255523, "epoch": 1520} {"train_loss": -11.945185661315918, "global_step": 255524, "epoch": 1520} {"train_loss": -11.470560073852539, "global_step": 255525, "epoch": 1520} {"train_loss": -11.43883228302002, "global_step": 255526, "epoch": 1520} {"train_loss": -11.669924469221206, "global_step": 255527, "epoch": 1520, "val_loss": 268872.90625, "train_action_mse_error": 2.0481228828430176} {"train_loss": -11.882229804992676, "global_step": 255528, "epoch": 1521} {"train_loss": -12.016443252563477, "global_step": 255529, "epoch": 1521} {"train_loss": -11.829435348510742, "global_step": 255530, "epoch": 1521} {"train_loss": -11.649740219116211, "global_step": 255531, "epoch": 1521} {"train_loss": -11.996016502380371, "global_step": 255532, "epoch": 1521} {"train_loss": -11.608880996704102, "global_step": 255533, "epoch": 1521} {"train_loss": -11.24203109741211, "global_step": 255534, "epoch": 1521} {"train_loss": -10.540823936462402, "global_step": 255535, "epoch": 1521} {"train_loss": -10.515970230102539, "global_step": 255536, "epoch": 1521} {"train_loss": -11.5261812210083, "global_step": 255537, "epoch": 1521} {"train_loss": -8.275811195373535, "global_step": 255538, "epoch": 1521} {"train_loss": -10.442760467529297, "global_step": 255539, "epoch": 1521} {"train_loss": -7.71376895904541, "global_step": 255540, "epoch": 1521} {"train_loss": -7.929714202880859, "global_step": 255541, "epoch": 1521} {"train_loss": -7.229991912841797, "global_step": 255542, "epoch": 1521} {"train_loss": -6.805992126464844, "global_step": 255543, "epoch": 1521} {"train_loss": -7.285927772521973, "global_step": 255544, "epoch": 1521} {"train_loss": -8.377935409545898, "global_step": 255545, "epoch": 1521} {"train_loss": -9.269021987915039, "global_step": 255546, "epoch": 1521} {"train_loss": -8.359975814819336, "global_step": 255547, "epoch": 1521} {"train_loss": -8.586645126342773, "global_step": 255548, "epoch": 1521} {"train_loss": -9.642690658569336, "global_step": 255549, "epoch": 1521} {"train_loss": -9.46605396270752, "global_step": 255550, "epoch": 1521} {"train_loss": -9.734127044677734, "global_step": 255551, "epoch": 1521} {"train_loss": -9.790182113647461, "global_step": 255552, "epoch": 1521} {"train_loss": -9.795516014099121, "global_step": 255553, "epoch": 1521} {"train_loss": -10.799392700195312, "global_step": 255554, "epoch": 1521} {"train_loss": -9.932938575744629, "global_step": 255555, "epoch": 1521} {"train_loss": -10.060202598571777, "global_step": 255556, "epoch": 1521} {"train_loss": -11.09113883972168, "global_step": 255557, "epoch": 1521} {"train_loss": -10.299053192138672, "global_step": 255558, "epoch": 1521} {"train_loss": -11.202526092529297, "global_step": 255559, "epoch": 1521} {"train_loss": -10.148770332336426, "global_step": 255560, "epoch": 1521} {"train_loss": -10.779916763305664, "global_step": 255561, "epoch": 1521} {"train_loss": -10.880695343017578, "global_step": 255562, "epoch": 1521} {"train_loss": -11.346186637878418, "global_step": 255563, "epoch": 1521} {"train_loss": -10.866616249084473, "global_step": 255564, "epoch": 1521} {"train_loss": -11.061517715454102, "global_step": 255565, "epoch": 1521} {"train_loss": -10.244179725646973, "global_step": 255566, "epoch": 1521} {"train_loss": -11.057683944702148, "global_step": 255567, "epoch": 1521} {"train_loss": -10.535172462463379, "global_step": 255568, "epoch": 1521} {"train_loss": -10.978219985961914, "global_step": 255569, "epoch": 1521} {"train_loss": -10.729154586791992, "global_step": 255570, "epoch": 1521} {"train_loss": -11.064654350280762, "global_step": 255571, "epoch": 1521} {"train_loss": -10.756326675415039, "global_step": 255572, "epoch": 1521} {"train_loss": -11.518983840942383, "global_step": 255573, "epoch": 1521} {"train_loss": -11.012779235839844, "global_step": 255574, "epoch": 1521} {"train_loss": -11.475282669067383, "global_step": 255575, "epoch": 1521} {"train_loss": -11.172609329223633, "global_step": 255576, "epoch": 1521} {"train_loss": -11.44516372680664, "global_step": 255577, "epoch": 1521} {"train_loss": -11.550202369689941, "global_step": 255578, "epoch": 1521} {"train_loss": -11.548791885375977, "global_step": 255579, "epoch": 1521} {"train_loss": -11.348950386047363, "global_step": 255580, "epoch": 1521} {"train_loss": -11.494036674499512, "global_step": 255581, "epoch": 1521} {"train_loss": -11.39903450012207, "global_step": 255582, "epoch": 1521} {"train_loss": -11.667264938354492, "global_step": 255583, "epoch": 1521} {"train_loss": -11.446402549743652, "global_step": 255584, "epoch": 1521} {"train_loss": -11.474746704101562, "global_step": 255585, "epoch": 1521} {"train_loss": -11.710079193115234, "global_step": 255586, "epoch": 1521} {"train_loss": -11.781213760375977, "global_step": 255587, "epoch": 1521} {"train_loss": -11.68817138671875, "global_step": 255588, "epoch": 1521} {"train_loss": -11.600062370300293, "global_step": 255589, "epoch": 1521} {"train_loss": -11.72201156616211, "global_step": 255590, "epoch": 1521} {"train_loss": -11.62590503692627, "global_step": 255591, "epoch": 1521} {"train_loss": -11.84233283996582, "global_step": 255592, "epoch": 1521} {"train_loss": -11.595415115356445, "global_step": 255593, "epoch": 1521} {"train_loss": -11.79715347290039, "global_step": 255594, "epoch": 1521} {"train_loss": -11.435014724731445, "global_step": 255595, "epoch": 1521} {"train_loss": -11.771434783935547, "global_step": 255596, "epoch": 1521} {"train_loss": -11.636459350585938, "global_step": 255597, "epoch": 1521} {"train_loss": -11.73176097869873, "global_step": 255598, "epoch": 1521} {"train_loss": -11.683018684387207, "global_step": 255599, "epoch": 1521} {"train_loss": -11.784960746765137, "global_step": 255600, "epoch": 1521} {"train_loss": -11.891704559326172, "global_step": 255601, "epoch": 1521} {"train_loss": -11.711935997009277, "global_step": 255602, "epoch": 1521} {"train_loss": -11.82791805267334, "global_step": 255603, "epoch": 1521} {"train_loss": -11.81066608428955, "global_step": 255604, "epoch": 1521} {"train_loss": -12.068275451660156, "global_step": 255605, "epoch": 1521} {"train_loss": -11.88767147064209, "global_step": 255606, "epoch": 1521} {"train_loss": -11.916851043701172, "global_step": 255607, "epoch": 1521} {"train_loss": -12.014448165893555, "global_step": 255608, "epoch": 1521} {"train_loss": -12.007774353027344, "global_step": 255609, "epoch": 1521} {"train_loss": -12.1314697265625, "global_step": 255610, "epoch": 1521} {"train_loss": -12.077783584594727, "global_step": 255611, "epoch": 1521} {"train_loss": -12.09095573425293, "global_step": 255612, "epoch": 1521} {"train_loss": -12.079328536987305, "global_step": 255613, "epoch": 1521} {"train_loss": -12.083517074584961, "global_step": 255614, "epoch": 1521} {"train_loss": -12.080936431884766, "global_step": 255615, "epoch": 1521} {"train_loss": -12.20292854309082, "global_step": 255616, "epoch": 1521} {"train_loss": -11.915037155151367, "global_step": 255617, "epoch": 1521} {"train_loss": -12.064411163330078, "global_step": 255618, "epoch": 1521} {"train_loss": -12.328568458557129, "global_step": 255619, "epoch": 1521} {"train_loss": -11.954194068908691, "global_step": 255620, "epoch": 1521} {"train_loss": -12.103010177612305, "global_step": 255621, "epoch": 1521} {"train_loss": -11.92889404296875, "global_step": 255622, "epoch": 1521} {"train_loss": -12.13740062713623, "global_step": 255623, "epoch": 1521} {"train_loss": -12.056617736816406, "global_step": 255624, "epoch": 1521} {"train_loss": -12.105802536010742, "global_step": 255625, "epoch": 1521} {"train_loss": -12.064407348632812, "global_step": 255626, "epoch": 1521} {"train_loss": -12.029529571533203, "global_step": 255627, "epoch": 1521} {"train_loss": -12.034387588500977, "global_step": 255628, "epoch": 1521} {"train_loss": -11.990371704101562, "global_step": 255629, "epoch": 1521} {"train_loss": -11.850927352905273, "global_step": 255630, "epoch": 1521} {"train_loss": -12.080995559692383, "global_step": 255631, "epoch": 1521} {"train_loss": -12.1703519821167, "global_step": 255632, "epoch": 1521} {"train_loss": -12.15727424621582, "global_step": 255633, "epoch": 1521} {"train_loss": -12.084573745727539, "global_step": 255634, "epoch": 1521} {"train_loss": -12.31829833984375, "global_step": 255635, "epoch": 1521} {"train_loss": -12.144220352172852, "global_step": 255636, "epoch": 1521} {"train_loss": -12.135656356811523, "global_step": 255637, "epoch": 1521} {"train_loss": -12.15850830078125, "global_step": 255638, "epoch": 1521} {"train_loss": -12.210402488708496, "global_step": 255639, "epoch": 1521} {"train_loss": -11.909345626831055, "global_step": 255640, "epoch": 1521} {"train_loss": -12.362001419067383, "global_step": 255641, "epoch": 1521} {"train_loss": -12.113895416259766, "global_step": 255642, "epoch": 1521} {"train_loss": -12.076674461364746, "global_step": 255643, "epoch": 1521} {"train_loss": -11.569453239440918, "global_step": 255644, "epoch": 1521} {"train_loss": -12.336002349853516, "global_step": 255645, "epoch": 1521} {"train_loss": -11.868680000305176, "global_step": 255646, "epoch": 1521} {"train_loss": -11.795251846313477, "global_step": 255647, "epoch": 1521} {"train_loss": -11.777486801147461, "global_step": 255648, "epoch": 1521} {"train_loss": -11.468116760253906, "global_step": 255649, "epoch": 1521} {"train_loss": -9.599576950073242, "global_step": 255650, "epoch": 1521} {"train_loss": -10.59422779083252, "global_step": 255651, "epoch": 1521} {"train_loss": -11.047492980957031, "global_step": 255652, "epoch": 1521} {"train_loss": -11.020362854003906, "global_step": 255653, "epoch": 1521} {"train_loss": -10.393960952758789, "global_step": 255654, "epoch": 1521} {"train_loss": -10.319351196289062, "global_step": 255655, "epoch": 1521} {"train_loss": -11.773852348327637, "global_step": 255656, "epoch": 1521} {"train_loss": -11.124616622924805, "global_step": 255657, "epoch": 1521} {"train_loss": -10.77096939086914, "global_step": 255658, "epoch": 1521} {"train_loss": -10.528812408447266, "global_step": 255659, "epoch": 1521} {"train_loss": -11.396666526794434, "global_step": 255660, "epoch": 1521} {"train_loss": -9.624555587768555, "global_step": 255661, "epoch": 1521} {"train_loss": -11.266963005065918, "global_step": 255662, "epoch": 1521} {"train_loss": -8.241689682006836, "global_step": 255663, "epoch": 1521} {"train_loss": -10.354726791381836, "global_step": 255664, "epoch": 1521} {"train_loss": -10.483823776245117, "global_step": 255665, "epoch": 1521} {"train_loss": -10.230512619018555, "global_step": 255666, "epoch": 1521} {"train_loss": -10.035719871520996, "global_step": 255667, "epoch": 1521} {"train_loss": -10.806163787841797, "global_step": 255668, "epoch": 1521} {"train_loss": -9.025177001953125, "global_step": 255669, "epoch": 1521} {"train_loss": -9.421600341796875, "global_step": 255670, "epoch": 1521} {"train_loss": -10.312171936035156, "global_step": 255671, "epoch": 1521} {"train_loss": -9.771429061889648, "global_step": 255672, "epoch": 1521} {"train_loss": -8.85936164855957, "global_step": 255673, "epoch": 1521} {"train_loss": -9.601795196533203, "global_step": 255674, "epoch": 1521} {"train_loss": -9.169974327087402, "global_step": 255675, "epoch": 1521} {"train_loss": -8.197648048400879, "global_step": 255676, "epoch": 1521} {"train_loss": -9.540648460388184, "global_step": 255677, "epoch": 1521} {"train_loss": -10.298491477966309, "global_step": 255678, "epoch": 1521} {"train_loss": -9.885762214660645, "global_step": 255679, "epoch": 1521} {"train_loss": -8.610651016235352, "global_step": 255680, "epoch": 1521} {"train_loss": -10.152080535888672, "global_step": 255681, "epoch": 1521} {"train_loss": -10.538148880004883, "global_step": 255682, "epoch": 1521} {"train_loss": -10.137619018554688, "global_step": 255683, "epoch": 1521} {"train_loss": -10.913261413574219, "global_step": 255684, "epoch": 1521} {"train_loss": -10.750683784484863, "global_step": 255685, "epoch": 1521} {"train_loss": -11.049966812133789, "global_step": 255686, "epoch": 1521} {"train_loss": -10.44883918762207, "global_step": 255687, "epoch": 1521} {"train_loss": -11.233522415161133, "global_step": 255688, "epoch": 1521} {"train_loss": -10.849804878234863, "global_step": 255689, "epoch": 1521} {"train_loss": -10.98206901550293, "global_step": 255690, "epoch": 1521} {"train_loss": -11.244056701660156, "global_step": 255691, "epoch": 1521} {"train_loss": -11.112212181091309, "global_step": 255692, "epoch": 1521} {"train_loss": -11.358572006225586, "global_step": 255693, "epoch": 1521} {"train_loss": -11.06124496459961, "global_step": 255694, "epoch": 1521} {"train_loss": -10.98897768202282, "global_step": 255695, "epoch": 1521, "val_loss": 266363.0625} {"train_loss": -11.279923439025879, "global_step": 255696, "epoch": 1522} {"train_loss": -11.26904296875, "global_step": 255697, "epoch": 1522} {"train_loss": -11.147924423217773, "global_step": 255698, "epoch": 1522} {"train_loss": -11.235814094543457, "global_step": 255699, "epoch": 1522} {"train_loss": -11.260417938232422, "global_step": 255700, "epoch": 1522} {"train_loss": -10.850324630737305, "global_step": 255701, "epoch": 1522} {"train_loss": -11.445158004760742, "global_step": 255702, "epoch": 1522} {"train_loss": -11.17038345336914, "global_step": 255703, "epoch": 1522} {"train_loss": -11.4938383102417, "global_step": 255704, "epoch": 1522} {"train_loss": -10.862552642822266, "global_step": 255705, "epoch": 1522} {"train_loss": -11.013872146606445, "global_step": 255706, "epoch": 1522} {"train_loss": -10.961313247680664, "global_step": 255707, "epoch": 1522} {"train_loss": -11.048844337463379, "global_step": 255708, "epoch": 1522} {"train_loss": -10.84758186340332, "global_step": 255709, "epoch": 1522} {"train_loss": -11.23912525177002, "global_step": 255710, "epoch": 1522} {"train_loss": -11.149271965026855, "global_step": 255711, "epoch": 1522} {"train_loss": -11.216028213500977, "global_step": 255712, "epoch": 1522} {"train_loss": -8.935674667358398, "global_step": 255713, "epoch": 1522} {"train_loss": -11.416441917419434, "global_step": 255714, "epoch": 1522} {"train_loss": -11.191150665283203, "global_step": 255715, "epoch": 1522} {"train_loss": -11.259451866149902, "global_step": 255716, "epoch": 1522} {"train_loss": -11.32547378540039, "global_step": 255717, "epoch": 1522} {"train_loss": -11.381200790405273, "global_step": 255718, "epoch": 1522} {"train_loss": -11.22437858581543, "global_step": 255719, "epoch": 1522} {"train_loss": -11.280464172363281, "global_step": 255720, "epoch": 1522} {"train_loss": -11.182920455932617, "global_step": 255721, "epoch": 1522} {"train_loss": -11.332667350769043, "global_step": 255722, "epoch": 1522} {"train_loss": -11.381059646606445, "global_step": 255723, "epoch": 1522} {"train_loss": -11.276971817016602, "global_step": 255724, "epoch": 1522} {"train_loss": -11.625112533569336, "global_step": 255725, "epoch": 1522} {"train_loss": -11.580260276794434, "global_step": 255726, "epoch": 1522} {"train_loss": -11.642289161682129, "global_step": 255727, "epoch": 1522} {"train_loss": -11.545549392700195, "global_step": 255728, "epoch": 1522} {"train_loss": -11.404134750366211, "global_step": 255729, "epoch": 1522} {"train_loss": -11.801212310791016, "global_step": 255730, "epoch": 1522} {"train_loss": -11.597460746765137, "global_step": 255731, "epoch": 1522} {"train_loss": -11.444991111755371, "global_step": 255732, "epoch": 1522} {"train_loss": -11.46065902709961, "global_step": 255733, "epoch": 1522} {"train_loss": -11.406126022338867, "global_step": 255734, "epoch": 1522} {"train_loss": -11.277657508850098, "global_step": 255735, "epoch": 1522} {"train_loss": -11.658660888671875, "global_step": 255736, "epoch": 1522} {"train_loss": -11.625289916992188, "global_step": 255737, "epoch": 1522} {"train_loss": -11.659215927124023, "global_step": 255738, "epoch": 1522} {"train_loss": -10.767126083374023, "global_step": 255739, "epoch": 1522} {"train_loss": -11.154953002929688, "global_step": 255740, "epoch": 1522} {"train_loss": -11.678060531616211, "global_step": 255741, "epoch": 1522} {"train_loss": -11.711796760559082, "global_step": 255742, "epoch": 1522} {"train_loss": -11.820377349853516, "global_step": 255743, "epoch": 1522} {"train_loss": -11.673686981201172, "global_step": 255744, "epoch": 1522} {"train_loss": -11.88117790222168, "global_step": 255745, "epoch": 1522} {"train_loss": -12.003500938415527, "global_step": 255746, "epoch": 1522} {"train_loss": -11.802764892578125, "global_step": 255747, "epoch": 1522} {"train_loss": -11.620509147644043, "global_step": 255748, "epoch": 1522} {"train_loss": -11.84605598449707, "global_step": 255749, "epoch": 1522} {"train_loss": -11.689142227172852, "global_step": 255750, "epoch": 1522} {"train_loss": -11.454303741455078, "global_step": 255751, "epoch": 1522} {"train_loss": -11.863240242004395, "global_step": 255752, "epoch": 1522} {"train_loss": -11.914045333862305, "global_step": 255753, "epoch": 1522} {"train_loss": -11.761459350585938, "global_step": 255754, "epoch": 1522} {"train_loss": -11.832869529724121, "global_step": 255755, "epoch": 1522} {"train_loss": -11.967500686645508, "global_step": 255756, "epoch": 1522} {"train_loss": -11.851615905761719, "global_step": 255757, "epoch": 1522} {"train_loss": -11.737189292907715, "global_step": 255758, "epoch": 1522} {"train_loss": -11.337006568908691, "global_step": 255759, "epoch": 1522} {"train_loss": -11.987892150878906, "global_step": 255760, "epoch": 1522} {"train_loss": -11.66016674041748, "global_step": 255761, "epoch": 1522} {"train_loss": -11.912088394165039, "global_step": 255762, "epoch": 1522} {"train_loss": -11.943527221679688, "global_step": 255763, "epoch": 1522} {"train_loss": -11.847515106201172, "global_step": 255764, "epoch": 1522} {"train_loss": -11.816307067871094, "global_step": 255765, "epoch": 1522} {"train_loss": -11.837530136108398, "global_step": 255766, "epoch": 1522} {"train_loss": -11.913406372070312, "global_step": 255767, "epoch": 1522} {"train_loss": -11.943384170532227, "global_step": 255768, "epoch": 1522} {"train_loss": -11.778154373168945, "global_step": 255769, "epoch": 1522} {"train_loss": -12.067259788513184, "global_step": 255770, "epoch": 1522} {"train_loss": -11.731070518493652, "global_step": 255771, "epoch": 1522} {"train_loss": -11.602014541625977, "global_step": 255772, "epoch": 1522} {"train_loss": -12.06170654296875, "global_step": 255773, "epoch": 1522} {"train_loss": -12.017189025878906, "global_step": 255774, "epoch": 1522} {"train_loss": -12.055071830749512, "global_step": 255775, "epoch": 1522} {"train_loss": -11.712311744689941, "global_step": 255776, "epoch": 1522} {"train_loss": -11.866291046142578, "global_step": 255777, "epoch": 1522} {"train_loss": -11.965564727783203, "global_step": 255778, "epoch": 1522} {"train_loss": -11.672874450683594, "global_step": 255779, "epoch": 1522} {"train_loss": -11.789793014526367, "global_step": 255780, "epoch": 1522} {"train_loss": -12.081862449645996, "global_step": 255781, "epoch": 1522} {"train_loss": -11.632993698120117, "global_step": 255782, "epoch": 1522} {"train_loss": -11.598369598388672, "global_step": 255783, "epoch": 1522} {"train_loss": -11.79650592803955, "global_step": 255784, "epoch": 1522} {"train_loss": -11.389055252075195, "global_step": 255785, "epoch": 1522} {"train_loss": -12.211392402648926, "global_step": 255786, "epoch": 1522} {"train_loss": -11.933815956115723, "global_step": 255787, "epoch": 1522} {"train_loss": -11.726388931274414, "global_step": 255788, "epoch": 1522} {"train_loss": -11.801767349243164, "global_step": 255789, "epoch": 1522} {"train_loss": -11.578286170959473, "global_step": 255790, "epoch": 1522} {"train_loss": -11.56122875213623, "global_step": 255791, "epoch": 1522} {"train_loss": -11.20359992980957, "global_step": 255792, "epoch": 1522} {"train_loss": -12.047357559204102, "global_step": 255793, "epoch": 1522} {"train_loss": -11.26346206665039, "global_step": 255794, "epoch": 1522} {"train_loss": -11.731569290161133, "global_step": 255795, "epoch": 1522} {"train_loss": -11.563776016235352, "global_step": 255796, "epoch": 1522} {"train_loss": -11.616690635681152, "global_step": 255797, "epoch": 1522} {"train_loss": -11.862533569335938, "global_step": 255798, "epoch": 1522} {"train_loss": -11.871129035949707, "global_step": 255799, "epoch": 1522} {"train_loss": -11.744977951049805, "global_step": 255800, "epoch": 1522} {"train_loss": -11.924084663391113, "global_step": 255801, "epoch": 1522} {"train_loss": -11.337654113769531, "global_step": 255802, "epoch": 1522} {"train_loss": -11.099964141845703, "global_step": 255803, "epoch": 1522} {"train_loss": -12.126413345336914, "global_step": 255804, "epoch": 1522} {"train_loss": -10.807746887207031, "global_step": 255805, "epoch": 1522} {"train_loss": -10.425836563110352, "global_step": 255806, "epoch": 1522} {"train_loss": -11.509111404418945, "global_step": 255807, "epoch": 1522} {"train_loss": -11.748970985412598, "global_step": 255808, "epoch": 1522} {"train_loss": -11.07446002960205, "global_step": 255809, "epoch": 1522} {"train_loss": -11.937660217285156, "global_step": 255810, "epoch": 1522} {"train_loss": -11.459360122680664, "global_step": 255811, "epoch": 1522} {"train_loss": -11.972735404968262, "global_step": 255812, "epoch": 1522} {"train_loss": -11.56576919555664, "global_step": 255813, "epoch": 1522} {"train_loss": -11.698813438415527, "global_step": 255814, "epoch": 1522} {"train_loss": -11.793279647827148, "global_step": 255815, "epoch": 1522} {"train_loss": -11.380784034729004, "global_step": 255816, "epoch": 1522} {"train_loss": -11.712912559509277, "global_step": 255817, "epoch": 1522} {"train_loss": -11.469120025634766, "global_step": 255818, "epoch": 1522} {"train_loss": -11.89852523803711, "global_step": 255819, "epoch": 1522} {"train_loss": -10.7184419631958, "global_step": 255820, "epoch": 1522} {"train_loss": -11.390888214111328, "global_step": 255821, "epoch": 1522} {"train_loss": -10.772696495056152, "global_step": 255822, "epoch": 1522} {"train_loss": -11.81968879699707, "global_step": 255823, "epoch": 1522} {"train_loss": -11.428099632263184, "global_step": 255824, "epoch": 1522} {"train_loss": -11.360859870910645, "global_step": 255825, "epoch": 1522} {"train_loss": -11.618734359741211, "global_step": 255826, "epoch": 1522} {"train_loss": -10.610282897949219, "global_step": 255827, "epoch": 1522} {"train_loss": -11.707764625549316, "global_step": 255828, "epoch": 1522} {"train_loss": -11.220832824707031, "global_step": 255829, "epoch": 1522} {"train_loss": -11.671670913696289, "global_step": 255830, "epoch": 1522} {"train_loss": -10.861958503723145, "global_step": 255831, "epoch": 1522} {"train_loss": -11.59431266784668, "global_step": 255832, "epoch": 1522} {"train_loss": -11.299285888671875, "global_step": 255833, "epoch": 1522} {"train_loss": -11.478193283081055, "global_step": 255834, "epoch": 1522} {"train_loss": -11.373978614807129, "global_step": 255835, "epoch": 1522} {"train_loss": -10.490432739257812, "global_step": 255836, "epoch": 1522} {"train_loss": -11.719636917114258, "global_step": 255837, "epoch": 1522} {"train_loss": -9.883968353271484, "global_step": 255838, "epoch": 1522} {"train_loss": -10.955708503723145, "global_step": 255839, "epoch": 1522} {"train_loss": -8.99118709564209, "global_step": 255840, "epoch": 1522} {"train_loss": -10.191542625427246, "global_step": 255841, "epoch": 1522} {"train_loss": -6.959988594055176, "global_step": 255842, "epoch": 1522} {"train_loss": -10.291634559631348, "global_step": 255843, "epoch": 1522} {"train_loss": -8.214218139648438, "global_step": 255844, "epoch": 1522} {"train_loss": -8.507288932800293, "global_step": 255845, "epoch": 1522} {"train_loss": -9.868879318237305, "global_step": 255846, "epoch": 1522} {"train_loss": -7.785378932952881, "global_step": 255847, "epoch": 1522} {"train_loss": -10.164999008178711, "global_step": 255848, "epoch": 1522} {"train_loss": -8.333127975463867, "global_step": 255849, "epoch": 1522} {"train_loss": -7.678005218505859, "global_step": 255850, "epoch": 1522} {"train_loss": -9.264947891235352, "global_step": 255851, "epoch": 1522} {"train_loss": -8.194738388061523, "global_step": 255852, "epoch": 1522} {"train_loss": -7.92429780960083, "global_step": 255853, "epoch": 1522} {"train_loss": -10.535499572753906, "global_step": 255854, "epoch": 1522} {"train_loss": -8.516786575317383, "global_step": 255855, "epoch": 1522} {"train_loss": -8.763176918029785, "global_step": 255856, "epoch": 1522} {"train_loss": -10.123397827148438, "global_step": 255857, "epoch": 1522} {"train_loss": -9.357600212097168, "global_step": 255858, "epoch": 1522} {"train_loss": -10.272722244262695, "global_step": 255859, "epoch": 1522} {"train_loss": -10.470611572265625, "global_step": 255860, "epoch": 1522} {"train_loss": -10.520294189453125, "global_step": 255861, "epoch": 1522} {"train_loss": -10.919532775878906, "global_step": 255862, "epoch": 1522} {"train_loss": -11.177054496038528, "global_step": 255863, "epoch": 1522, "val_loss": 267655.9375} {"train_loss": -11.175416946411133, "global_step": 255864, "epoch": 1523} {"train_loss": -10.515650749206543, "global_step": 255865, "epoch": 1523} {"train_loss": -11.165178298950195, "global_step": 255866, "epoch": 1523} {"train_loss": -11.244768142700195, "global_step": 255867, "epoch": 1523} {"train_loss": -10.834171295166016, "global_step": 255868, "epoch": 1523} {"train_loss": -11.289619445800781, "global_step": 255869, "epoch": 1523} {"train_loss": -11.07847785949707, "global_step": 255870, "epoch": 1523} {"train_loss": -11.15230941772461, "global_step": 255871, "epoch": 1523} {"train_loss": -11.1336669921875, "global_step": 255872, "epoch": 1523} {"train_loss": -11.049491882324219, "global_step": 255873, "epoch": 1523} {"train_loss": -11.231823921203613, "global_step": 255874, "epoch": 1523} {"train_loss": -11.390052795410156, "global_step": 255875, "epoch": 1523} {"train_loss": -11.158843994140625, "global_step": 255876, "epoch": 1523} {"train_loss": -11.193857192993164, "global_step": 255877, "epoch": 1523} {"train_loss": -11.426709175109863, "global_step": 255878, "epoch": 1523} {"train_loss": -11.123974800109863, "global_step": 255879, "epoch": 1523} {"train_loss": -11.498716354370117, "global_step": 255880, "epoch": 1523} {"train_loss": -11.488910675048828, "global_step": 255881, "epoch": 1523} {"train_loss": -11.474603652954102, "global_step": 255882, "epoch": 1523} {"train_loss": -11.483816146850586, "global_step": 255883, "epoch": 1523} {"train_loss": -11.572766304016113, "global_step": 255884, "epoch": 1523} {"train_loss": -11.428657531738281, "global_step": 255885, "epoch": 1523} {"train_loss": -11.626132011413574, "global_step": 255886, "epoch": 1523} {"train_loss": -11.523001670837402, "global_step": 255887, "epoch": 1523} {"train_loss": -11.534661293029785, "global_step": 255888, "epoch": 1523} {"train_loss": -11.628385543823242, "global_step": 255889, "epoch": 1523} {"train_loss": -11.633807182312012, "global_step": 255890, "epoch": 1523} {"train_loss": -11.580094337463379, "global_step": 255891, "epoch": 1523} {"train_loss": -11.53259563446045, "global_step": 255892, "epoch": 1523} {"train_loss": -11.340036392211914, "global_step": 255893, "epoch": 1523} {"train_loss": -11.575178146362305, "global_step": 255894, "epoch": 1523} {"train_loss": -11.706526756286621, "global_step": 255895, "epoch": 1523} {"train_loss": -11.643746376037598, "global_step": 255896, "epoch": 1523} {"train_loss": -11.693887710571289, "global_step": 255897, "epoch": 1523} {"train_loss": -11.668441772460938, "global_step": 255898, "epoch": 1523} {"train_loss": -11.758830070495605, "global_step": 255899, "epoch": 1523} {"train_loss": -11.76735782623291, "global_step": 255900, "epoch": 1523} {"train_loss": -11.744349479675293, "global_step": 255901, "epoch": 1523} {"train_loss": -11.9259614944458, "global_step": 255902, "epoch": 1523} {"train_loss": -11.699808120727539, "global_step": 255903, "epoch": 1523} {"train_loss": -11.64529037475586, "global_step": 255904, "epoch": 1523} {"train_loss": -11.959310531616211, "global_step": 255905, "epoch": 1523} {"train_loss": -11.891084671020508, "global_step": 255906, "epoch": 1523} {"train_loss": -11.864479064941406, "global_step": 255907, "epoch": 1523} {"train_loss": -11.853363037109375, "global_step": 255908, "epoch": 1523} {"train_loss": -11.67947769165039, "global_step": 255909, "epoch": 1523} {"train_loss": -11.798404693603516, "global_step": 255910, "epoch": 1523} {"train_loss": -11.80349063873291, "global_step": 255911, "epoch": 1523} {"train_loss": -11.750078201293945, "global_step": 255912, "epoch": 1523} {"train_loss": -12.025225639343262, "global_step": 255913, "epoch": 1523} {"train_loss": -11.899662017822266, "global_step": 255914, "epoch": 1523} {"train_loss": -11.913969993591309, "global_step": 255915, "epoch": 1523} {"train_loss": -11.865279197692871, "global_step": 255916, "epoch": 1523} {"train_loss": -11.897283554077148, "global_step": 255917, "epoch": 1523} {"train_loss": -11.918693542480469, "global_step": 255918, "epoch": 1523} {"train_loss": -11.901233673095703, "global_step": 255919, "epoch": 1523} {"train_loss": -12.019515991210938, "global_step": 255920, "epoch": 1523} {"train_loss": -12.163771629333496, "global_step": 255921, "epoch": 1523} {"train_loss": -12.18163776397705, "global_step": 255922, "epoch": 1523} {"train_loss": -11.890520095825195, "global_step": 255923, "epoch": 1523} {"train_loss": -12.025723457336426, "global_step": 255924, "epoch": 1523} {"train_loss": -12.074312210083008, "global_step": 255925, "epoch": 1523} {"train_loss": -12.035550117492676, "global_step": 255926, "epoch": 1523} {"train_loss": -11.951008796691895, "global_step": 255927, "epoch": 1523} {"train_loss": -12.145330429077148, "global_step": 255928, "epoch": 1523} {"train_loss": -11.796801567077637, "global_step": 255929, "epoch": 1523} {"train_loss": -12.035138130187988, "global_step": 255930, "epoch": 1523} {"train_loss": -11.689163208007812, "global_step": 255931, "epoch": 1523} {"train_loss": -12.018241882324219, "global_step": 255932, "epoch": 1523} {"train_loss": -11.978686332702637, "global_step": 255933, "epoch": 1523} {"train_loss": -11.941545486450195, "global_step": 255934, "epoch": 1523} {"train_loss": -12.215216636657715, "global_step": 255935, "epoch": 1523} {"train_loss": -11.924546241760254, "global_step": 255936, "epoch": 1523} {"train_loss": -11.951261520385742, "global_step": 255937, "epoch": 1523} {"train_loss": -12.048742294311523, "global_step": 255938, "epoch": 1523} {"train_loss": -12.15684986114502, "global_step": 255939, "epoch": 1523} {"train_loss": -12.11207389831543, "global_step": 255940, "epoch": 1523} {"train_loss": -12.147790908813477, "global_step": 255941, "epoch": 1523} {"train_loss": -12.19815444946289, "global_step": 255942, "epoch": 1523} {"train_loss": -12.025527000427246, "global_step": 255943, "epoch": 1523} {"train_loss": -12.057390213012695, "global_step": 255944, "epoch": 1523} {"train_loss": -12.035174369812012, "global_step": 255945, "epoch": 1523} {"train_loss": -12.276378631591797, "global_step": 255946, "epoch": 1523} {"train_loss": -12.026384353637695, "global_step": 255947, "epoch": 1523} {"train_loss": -11.94001579284668, "global_step": 255948, "epoch": 1523} {"train_loss": -12.165312767028809, "global_step": 255949, "epoch": 1523} {"train_loss": -12.208150863647461, "global_step": 255950, "epoch": 1523} {"train_loss": -12.108622550964355, "global_step": 255951, "epoch": 1523} {"train_loss": -12.056476593017578, "global_step": 255952, "epoch": 1523} {"train_loss": -12.087646484375, "global_step": 255953, "epoch": 1523} {"train_loss": -12.117226600646973, "global_step": 255954, "epoch": 1523} {"train_loss": -12.084798812866211, "global_step": 255955, "epoch": 1523} {"train_loss": -12.197894096374512, "global_step": 255956, "epoch": 1523} {"train_loss": -12.12114429473877, "global_step": 255957, "epoch": 1523} {"train_loss": -11.943338394165039, "global_step": 255958, "epoch": 1523} {"train_loss": -11.765541076660156, "global_step": 255959, "epoch": 1523} {"train_loss": -11.242713928222656, "global_step": 255960, "epoch": 1523} {"train_loss": -12.019847869873047, "global_step": 255961, "epoch": 1523} {"train_loss": -11.91966438293457, "global_step": 255962, "epoch": 1523} {"train_loss": -11.84063720703125, "global_step": 255963, "epoch": 1523} {"train_loss": -12.319131851196289, "global_step": 255964, "epoch": 1523} {"train_loss": -11.893308639526367, "global_step": 255965, "epoch": 1523} {"train_loss": -11.928702354431152, "global_step": 255966, "epoch": 1523} {"train_loss": -11.357133865356445, "global_step": 255967, "epoch": 1523} {"train_loss": -10.864500045776367, "global_step": 255968, "epoch": 1523} {"train_loss": -11.1127290725708, "global_step": 255969, "epoch": 1523} {"train_loss": -11.693397521972656, "global_step": 255970, "epoch": 1523} {"train_loss": -11.774975776672363, "global_step": 255971, "epoch": 1523} {"train_loss": -10.675585746765137, "global_step": 255972, "epoch": 1523} {"train_loss": -11.258681297302246, "global_step": 255973, "epoch": 1523} {"train_loss": -10.735337257385254, "global_step": 255974, "epoch": 1523} {"train_loss": -11.477044105529785, "global_step": 255975, "epoch": 1523} {"train_loss": -10.149801254272461, "global_step": 255976, "epoch": 1523} {"train_loss": -10.987563133239746, "global_step": 255977, "epoch": 1523} {"train_loss": -10.92345905303955, "global_step": 255978, "epoch": 1523} {"train_loss": -9.689743041992188, "global_step": 255979, "epoch": 1523} {"train_loss": -10.148528099060059, "global_step": 255980, "epoch": 1523} {"train_loss": -10.377185821533203, "global_step": 255981, "epoch": 1523} {"train_loss": -10.49791431427002, "global_step": 255982, "epoch": 1523} {"train_loss": -11.088726043701172, "global_step": 255983, "epoch": 1523} {"train_loss": -10.32801628112793, "global_step": 255984, "epoch": 1523} {"train_loss": -10.36558723449707, "global_step": 255985, "epoch": 1523} {"train_loss": -10.007109642028809, "global_step": 255986, "epoch": 1523} {"train_loss": -11.106134414672852, "global_step": 255987, "epoch": 1523} {"train_loss": -10.444145202636719, "global_step": 255988, "epoch": 1523} {"train_loss": -10.546903610229492, "global_step": 255989, "epoch": 1523} {"train_loss": -10.520845413208008, "global_step": 255990, "epoch": 1523} {"train_loss": -10.973905563354492, "global_step": 255991, "epoch": 1523} {"train_loss": -10.719715118408203, "global_step": 255992, "epoch": 1523} {"train_loss": -11.274587631225586, "global_step": 255993, "epoch": 1523} {"train_loss": -10.91630744934082, "global_step": 255994, "epoch": 1523} {"train_loss": -10.936582565307617, "global_step": 255995, "epoch": 1523} {"train_loss": -10.099899291992188, "global_step": 255996, "epoch": 1523} {"train_loss": -10.50741195678711, "global_step": 255997, "epoch": 1523} {"train_loss": -11.304222106933594, "global_step": 255998, "epoch": 1523} {"train_loss": -10.670814514160156, "global_step": 255999, "epoch": 1523} {"train_loss": -11.302970886230469, "global_step": 256000, "epoch": 1523} {"train_loss": -11.291494369506836, "global_step": 256001, "epoch": 1523} {"train_loss": -10.701156616210938, "global_step": 256002, "epoch": 1523} {"train_loss": -11.174859046936035, "global_step": 256003, "epoch": 1523} {"train_loss": -11.311352729797363, "global_step": 256004, "epoch": 1523} {"train_loss": -11.2891206741333, "global_step": 256005, "epoch": 1523} {"train_loss": -11.234139442443848, "global_step": 256006, "epoch": 1523} {"train_loss": -11.39940357208252, "global_step": 256007, "epoch": 1523} {"train_loss": -11.326154708862305, "global_step": 256008, "epoch": 1523} {"train_loss": -11.52062702178955, "global_step": 256009, "epoch": 1523} {"train_loss": -11.359246253967285, "global_step": 256010, "epoch": 1523} {"train_loss": -11.279067993164062, "global_step": 256011, "epoch": 1523} {"train_loss": -11.869668960571289, "global_step": 256012, "epoch": 1523} {"train_loss": -11.710424423217773, "global_step": 256013, "epoch": 1523} {"train_loss": -11.67189884185791, "global_step": 256014, "epoch": 1523} {"train_loss": -11.59564208984375, "global_step": 256015, "epoch": 1523} {"train_loss": -11.428459167480469, "global_step": 256016, "epoch": 1523} {"train_loss": -11.7298002243042, "global_step": 256017, "epoch": 1523} {"train_loss": -11.520118713378906, "global_step": 256018, "epoch": 1523} {"train_loss": -11.519800186157227, "global_step": 256019, "epoch": 1523} {"train_loss": -11.747806549072266, "global_step": 256020, "epoch": 1523} {"train_loss": -11.556954383850098, "global_step": 256021, "epoch": 1523} {"train_loss": -11.697185516357422, "global_step": 256022, "epoch": 1523} {"train_loss": -11.806134223937988, "global_step": 256023, "epoch": 1523} {"train_loss": -11.586517333984375, "global_step": 256024, "epoch": 1523} {"train_loss": -11.50583267211914, "global_step": 256025, "epoch": 1523} {"train_loss": -11.847511291503906, "global_step": 256026, "epoch": 1523} {"train_loss": -11.806102752685547, "global_step": 256027, "epoch": 1523} {"train_loss": -11.617644309997559, "global_step": 256028, "epoch": 1523} {"train_loss": -11.85838508605957, "global_step": 256029, "epoch": 1523} {"train_loss": -11.882954597473145, "global_step": 256030, "epoch": 1523} {"train_loss": -11.522044959522429, "global_step": 256031, "epoch": 1523, "val_loss": 271882.0625} {"train_loss": -11.854301452636719, "global_step": 256032, "epoch": 1524} {"train_loss": -11.638349533081055, "global_step": 256033, "epoch": 1524} {"train_loss": -11.858280181884766, "global_step": 256034, "epoch": 1524} {"train_loss": -11.673113822937012, "global_step": 256035, "epoch": 1524} {"train_loss": -12.055316925048828, "global_step": 256036, "epoch": 1524} {"train_loss": -11.92133617401123, "global_step": 256037, "epoch": 1524} {"train_loss": -11.967498779296875, "global_step": 256038, "epoch": 1524} {"train_loss": -12.072665214538574, "global_step": 256039, "epoch": 1524} {"train_loss": -12.057271003723145, "global_step": 256040, "epoch": 1524} {"train_loss": -11.883625984191895, "global_step": 256041, "epoch": 1524} {"train_loss": -11.904640197753906, "global_step": 256042, "epoch": 1524} {"train_loss": -11.914436340332031, "global_step": 256043, "epoch": 1524} {"train_loss": -11.90389633178711, "global_step": 256044, "epoch": 1524} {"train_loss": -12.230121612548828, "global_step": 256045, "epoch": 1524} {"train_loss": -11.744892120361328, "global_step": 256046, "epoch": 1524} {"train_loss": -11.835296630859375, "global_step": 256047, "epoch": 1524} {"train_loss": -11.804821014404297, "global_step": 256048, "epoch": 1524} {"train_loss": -11.84280014038086, "global_step": 256049, "epoch": 1524} {"train_loss": -11.957721710205078, "global_step": 256050, "epoch": 1524} {"train_loss": -11.89937973022461, "global_step": 256051, "epoch": 1524} {"train_loss": -12.010055541992188, "global_step": 256052, "epoch": 1524} {"train_loss": -12.013906478881836, "global_step": 256053, "epoch": 1524} {"train_loss": -11.994799613952637, "global_step": 256054, "epoch": 1524} {"train_loss": -11.973209381103516, "global_step": 256055, "epoch": 1524} {"train_loss": -11.818808555603027, "global_step": 256056, "epoch": 1524} {"train_loss": -12.003965377807617, "global_step": 256057, "epoch": 1524} {"train_loss": -11.997690200805664, "global_step": 256058, "epoch": 1524} {"train_loss": -12.029272079467773, "global_step": 256059, "epoch": 1524} {"train_loss": -12.115285873413086, "global_step": 256060, "epoch": 1524} {"train_loss": -11.95633316040039, "global_step": 256061, "epoch": 1524} {"train_loss": -12.0389986038208, "global_step": 256062, "epoch": 1524} {"train_loss": -12.031010627746582, "global_step": 256063, "epoch": 1524} {"train_loss": -11.746382713317871, "global_step": 256064, "epoch": 1524} {"train_loss": -11.994330406188965, "global_step": 256065, "epoch": 1524} {"train_loss": -11.724478721618652, "global_step": 256066, "epoch": 1524} {"train_loss": -11.73767375946045, "global_step": 256067, "epoch": 1524} {"train_loss": -12.103691101074219, "global_step": 256068, "epoch": 1524} {"train_loss": -11.640243530273438, "global_step": 256069, "epoch": 1524} {"train_loss": -11.987994194030762, "global_step": 256070, "epoch": 1524} {"train_loss": -11.897292137145996, "global_step": 256071, "epoch": 1524} {"train_loss": -11.844213485717773, "global_step": 256072, "epoch": 1524} {"train_loss": -11.722602844238281, "global_step": 256073, "epoch": 1524} {"train_loss": -11.496541023254395, "global_step": 256074, "epoch": 1524} {"train_loss": -11.858325958251953, "global_step": 256075, "epoch": 1524} {"train_loss": -11.850593566894531, "global_step": 256076, "epoch": 1524} {"train_loss": -11.39360523223877, "global_step": 256077, "epoch": 1524} {"train_loss": -12.021047592163086, "global_step": 256078, "epoch": 1524} {"train_loss": -11.82159423828125, "global_step": 256079, "epoch": 1524} {"train_loss": -12.045680046081543, "global_step": 256080, "epoch": 1524} {"train_loss": -11.395164489746094, "global_step": 256081, "epoch": 1524} {"train_loss": -11.8211669921875, "global_step": 256082, "epoch": 1524} {"train_loss": -11.373997688293457, "global_step": 256083, "epoch": 1524} {"train_loss": -11.69378662109375, "global_step": 256084, "epoch": 1524} {"train_loss": -11.876501083374023, "global_step": 256085, "epoch": 1524} {"train_loss": -11.876044273376465, "global_step": 256086, "epoch": 1524} {"train_loss": -12.053803443908691, "global_step": 256087, "epoch": 1524} {"train_loss": -10.958847045898438, "global_step": 256088, "epoch": 1524} {"train_loss": -11.312239646911621, "global_step": 256089, "epoch": 1524} {"train_loss": -11.59483528137207, "global_step": 256090, "epoch": 1524} {"train_loss": -10.874391555786133, "global_step": 256091, "epoch": 1524} {"train_loss": -11.419336318969727, "global_step": 256092, "epoch": 1524} {"train_loss": -11.207951545715332, "global_step": 256093, "epoch": 1524} {"train_loss": -10.216938018798828, "global_step": 256094, "epoch": 1524} {"train_loss": -9.934598922729492, "global_step": 256095, "epoch": 1524} {"train_loss": -10.531723022460938, "global_step": 256096, "epoch": 1524} {"train_loss": -11.131406784057617, "global_step": 256097, "epoch": 1524} {"train_loss": -10.50355052947998, "global_step": 256098, "epoch": 1524} {"train_loss": -11.205806732177734, "global_step": 256099, "epoch": 1524} {"train_loss": -11.346943855285645, "global_step": 256100, "epoch": 1524} {"train_loss": -11.017980575561523, "global_step": 256101, "epoch": 1524} {"train_loss": -11.606907844543457, "global_step": 256102, "epoch": 1524} {"train_loss": -11.33470344543457, "global_step": 256103, "epoch": 1524} {"train_loss": -10.974570274353027, "global_step": 256104, "epoch": 1524} {"train_loss": -11.09483814239502, "global_step": 256105, "epoch": 1524} {"train_loss": -11.429777145385742, "global_step": 256106, "epoch": 1524} {"train_loss": -11.592340469360352, "global_step": 256107, "epoch": 1524} {"train_loss": -11.035722732543945, "global_step": 256108, "epoch": 1524} {"train_loss": -11.31137466430664, "global_step": 256109, "epoch": 1524} {"train_loss": -11.33962631225586, "global_step": 256110, "epoch": 1524} {"train_loss": -11.521636009216309, "global_step": 256111, "epoch": 1524} {"train_loss": -11.197914123535156, "global_step": 256112, "epoch": 1524} {"train_loss": -11.410818099975586, "global_step": 256113, "epoch": 1524} {"train_loss": -11.719963073730469, "global_step": 256114, "epoch": 1524} {"train_loss": -11.196413040161133, "global_step": 256115, "epoch": 1524} {"train_loss": -11.844128608703613, "global_step": 256116, "epoch": 1524} {"train_loss": -11.124841690063477, "global_step": 256117, "epoch": 1524} {"train_loss": -11.733996391296387, "global_step": 256118, "epoch": 1524} {"train_loss": -11.231476783752441, "global_step": 256119, "epoch": 1524} {"train_loss": -11.821538925170898, "global_step": 256120, "epoch": 1524} {"train_loss": -11.51870346069336, "global_step": 256121, "epoch": 1524} {"train_loss": -11.095495223999023, "global_step": 256122, "epoch": 1524} {"train_loss": -11.534468650817871, "global_step": 256123, "epoch": 1524} {"train_loss": -11.296527862548828, "global_step": 256124, "epoch": 1524} {"train_loss": -11.673039436340332, "global_step": 256125, "epoch": 1524} {"train_loss": -11.518951416015625, "global_step": 256126, "epoch": 1524} {"train_loss": -11.554424285888672, "global_step": 256127, "epoch": 1524} {"train_loss": -11.241580963134766, "global_step": 256128, "epoch": 1524} {"train_loss": -11.754928588867188, "global_step": 256129, "epoch": 1524} {"train_loss": -11.682586669921875, "global_step": 256130, "epoch": 1524} {"train_loss": -11.546722412109375, "global_step": 256131, "epoch": 1524} {"train_loss": -11.878164291381836, "global_step": 256132, "epoch": 1524} {"train_loss": -11.267647743225098, "global_step": 256133, "epoch": 1524} {"train_loss": -11.229360580444336, "global_step": 256134, "epoch": 1524} {"train_loss": -11.497782707214355, "global_step": 256135, "epoch": 1524} {"train_loss": -11.801464080810547, "global_step": 256136, "epoch": 1524} {"train_loss": -10.933652877807617, "global_step": 256137, "epoch": 1524} {"train_loss": -11.432540893554688, "global_step": 256138, "epoch": 1524} {"train_loss": -11.425621032714844, "global_step": 256139, "epoch": 1524} {"train_loss": -11.549638748168945, "global_step": 256140, "epoch": 1524} {"train_loss": -11.20827865600586, "global_step": 256141, "epoch": 1524} {"train_loss": -11.508966445922852, "global_step": 256142, "epoch": 1524} {"train_loss": -10.629873275756836, "global_step": 256143, "epoch": 1524} {"train_loss": -11.928625106811523, "global_step": 256144, "epoch": 1524} {"train_loss": -11.544837951660156, "global_step": 256145, "epoch": 1524} {"train_loss": -11.503009796142578, "global_step": 256146, "epoch": 1524} {"train_loss": -11.953363418579102, "global_step": 256147, "epoch": 1524} {"train_loss": -11.529609680175781, "global_step": 256148, "epoch": 1524} {"train_loss": -11.903894424438477, "global_step": 256149, "epoch": 1524} {"train_loss": -11.384366989135742, "global_step": 256150, "epoch": 1524} {"train_loss": -11.4530029296875, "global_step": 256151, "epoch": 1524} {"train_loss": -11.922684669494629, "global_step": 256152, "epoch": 1524} {"train_loss": -11.54257583618164, "global_step": 256153, "epoch": 1524} {"train_loss": -11.792521476745605, "global_step": 256154, "epoch": 1524} {"train_loss": -11.900370597839355, "global_step": 256155, "epoch": 1524} {"train_loss": -11.643495559692383, "global_step": 256156, "epoch": 1524} {"train_loss": -11.834047317504883, "global_step": 256157, "epoch": 1524} {"train_loss": -11.806774139404297, "global_step": 256158, "epoch": 1524} {"train_loss": -11.715166091918945, "global_step": 256159, "epoch": 1524} {"train_loss": -11.881738662719727, "global_step": 256160, "epoch": 1524} {"train_loss": -11.616281509399414, "global_step": 256161, "epoch": 1524} {"train_loss": -11.80321216583252, "global_step": 256162, "epoch": 1524} {"train_loss": -11.720569610595703, "global_step": 256163, "epoch": 1524} {"train_loss": -11.9359130859375, "global_step": 256164, "epoch": 1524} {"train_loss": -11.818982124328613, "global_step": 256165, "epoch": 1524} {"train_loss": -11.707849502563477, "global_step": 256166, "epoch": 1524} {"train_loss": -11.72311782836914, "global_step": 256167, "epoch": 1524} {"train_loss": -12.223220825195312, "global_step": 256168, "epoch": 1524} {"train_loss": -11.627164840698242, "global_step": 256169, "epoch": 1524} {"train_loss": -12.107675552368164, "global_step": 256170, "epoch": 1524} {"train_loss": -11.703577995300293, "global_step": 256171, "epoch": 1524} {"train_loss": -11.743087768554688, "global_step": 256172, "epoch": 1524} {"train_loss": -11.98504638671875, "global_step": 256173, "epoch": 1524} {"train_loss": -11.92027473449707, "global_step": 256174, "epoch": 1524} {"train_loss": -11.917165756225586, "global_step": 256175, "epoch": 1524} {"train_loss": -11.854124069213867, "global_step": 256176, "epoch": 1524} {"train_loss": -11.955204010009766, "global_step": 256177, "epoch": 1524} {"train_loss": -11.946894645690918, "global_step": 256178, "epoch": 1524} {"train_loss": -12.097444534301758, "global_step": 256179, "epoch": 1524} {"train_loss": -11.984565734863281, "global_step": 256180, "epoch": 1524} {"train_loss": -12.063979148864746, "global_step": 256181, "epoch": 1524} {"train_loss": -12.053447723388672, "global_step": 256182, "epoch": 1524} {"train_loss": -12.048608779907227, "global_step": 256183, "epoch": 1524} {"train_loss": -11.792474746704102, "global_step": 256184, "epoch": 1524} {"train_loss": -11.997631072998047, "global_step": 256185, "epoch": 1524} {"train_loss": -12.041040420532227, "global_step": 256186, "epoch": 1524} {"train_loss": -12.217225074768066, "global_step": 256187, "epoch": 1524} {"train_loss": -12.098257064819336, "global_step": 256188, "epoch": 1524} {"train_loss": -12.166644096374512, "global_step": 256189, "epoch": 1524} {"train_loss": -12.09542179107666, "global_step": 256190, "epoch": 1524} {"train_loss": -12.098611831665039, "global_step": 256191, "epoch": 1524} {"train_loss": -12.036700248718262, "global_step": 256192, "epoch": 1524} {"train_loss": -12.263598442077637, "global_step": 256193, "epoch": 1524} {"train_loss": -11.951992988586426, "global_step": 256194, "epoch": 1524} {"train_loss": -12.01961898803711, "global_step": 256195, "epoch": 1524} {"train_loss": -12.151649475097656, "global_step": 256196, "epoch": 1524} {"train_loss": -12.238569259643555, "global_step": 256197, "epoch": 1524} {"train_loss": -11.667974472045898, "global_step": 256198, "epoch": 1524} {"train_loss": -11.685514790671212, "global_step": 256199, "epoch": 1524, "val_loss": 269737.71875} {"train_loss": -12.001611709594727, "global_step": 256200, "epoch": 1525} {"train_loss": -11.647279739379883, "global_step": 256201, "epoch": 1525} {"train_loss": -11.209861755371094, "global_step": 256202, "epoch": 1525} {"train_loss": -11.950180053710938, "global_step": 256203, "epoch": 1525} {"train_loss": -11.706100463867188, "global_step": 256204, "epoch": 1525} {"train_loss": -11.651360511779785, "global_step": 256205, "epoch": 1525} {"train_loss": -11.467960357666016, "global_step": 256206, "epoch": 1525} {"train_loss": -11.697298049926758, "global_step": 256207, "epoch": 1525} {"train_loss": -11.40087890625, "global_step": 256208, "epoch": 1525} {"train_loss": -12.073957443237305, "global_step": 256209, "epoch": 1525} {"train_loss": -10.547857284545898, "global_step": 256210, "epoch": 1525} {"train_loss": -9.213452339172363, "global_step": 256211, "epoch": 1525} {"train_loss": -10.832757949829102, "global_step": 256212, "epoch": 1525} {"train_loss": -10.770018577575684, "global_step": 256213, "epoch": 1525} {"train_loss": -8.779386520385742, "global_step": 256214, "epoch": 1525} {"train_loss": -11.150014877319336, "global_step": 256215, "epoch": 1525} {"train_loss": -8.24797248840332, "global_step": 256216, "epoch": 1525} {"train_loss": -10.85526180267334, "global_step": 256217, "epoch": 1525} {"train_loss": -9.7100248336792, "global_step": 256218, "epoch": 1525} {"train_loss": -10.642333984375, "global_step": 256219, "epoch": 1525} {"train_loss": -11.116729736328125, "global_step": 256220, "epoch": 1525} {"train_loss": -10.433012008666992, "global_step": 256221, "epoch": 1525} {"train_loss": -11.002754211425781, "global_step": 256222, "epoch": 1525} {"train_loss": -9.814715385437012, "global_step": 256223, "epoch": 1525} {"train_loss": -10.180801391601562, "global_step": 256224, "epoch": 1525} {"train_loss": -9.688647270202637, "global_step": 256225, "epoch": 1525} {"train_loss": -11.205873489379883, "global_step": 256226, "epoch": 1525} {"train_loss": -9.445917129516602, "global_step": 256227, "epoch": 1525} {"train_loss": -10.837417602539062, "global_step": 256228, "epoch": 1525} {"train_loss": -10.271356582641602, "global_step": 256229, "epoch": 1525} {"train_loss": -11.063329696655273, "global_step": 256230, "epoch": 1525} {"train_loss": -10.703245162963867, "global_step": 256231, "epoch": 1525} {"train_loss": -11.378950119018555, "global_step": 256232, "epoch": 1525} {"train_loss": -10.820575714111328, "global_step": 256233, "epoch": 1525} {"train_loss": -11.347753524780273, "global_step": 256234, "epoch": 1525} {"train_loss": -11.115717887878418, "global_step": 256235, "epoch": 1525} {"train_loss": -11.560964584350586, "global_step": 256236, "epoch": 1525} {"train_loss": -11.324516296386719, "global_step": 256237, "epoch": 1525} {"train_loss": -11.320327758789062, "global_step": 256238, "epoch": 1525} {"train_loss": -11.298126220703125, "global_step": 256239, "epoch": 1525} {"train_loss": -11.446343421936035, "global_step": 256240, "epoch": 1525} {"train_loss": -11.273788452148438, "global_step": 256241, "epoch": 1525} {"train_loss": -11.320706367492676, "global_step": 256242, "epoch": 1525} {"train_loss": -11.433649063110352, "global_step": 256243, "epoch": 1525} {"train_loss": -10.705108642578125, "global_step": 256244, "epoch": 1525} {"train_loss": -11.593502044677734, "global_step": 256245, "epoch": 1525} {"train_loss": -10.73560905456543, "global_step": 256246, "epoch": 1525} {"train_loss": -11.637996673583984, "global_step": 256247, "epoch": 1525} {"train_loss": -11.25131607055664, "global_step": 256248, "epoch": 1525} {"train_loss": -11.290523529052734, "global_step": 256249, "epoch": 1525} {"train_loss": -11.357643127441406, "global_step": 256250, "epoch": 1525} {"train_loss": -11.587726593017578, "global_step": 256251, "epoch": 1525} {"train_loss": -11.40121841430664, "global_step": 256252, "epoch": 1525} {"train_loss": -11.150789260864258, "global_step": 256253, "epoch": 1525} {"train_loss": -11.473041534423828, "global_step": 256254, "epoch": 1525} {"train_loss": -11.359743118286133, "global_step": 256255, "epoch": 1525} {"train_loss": -11.80498218536377, "global_step": 256256, "epoch": 1525} {"train_loss": -11.55607795715332, "global_step": 256257, "epoch": 1525} {"train_loss": -11.581195831298828, "global_step": 256258, "epoch": 1525} {"train_loss": -11.840713500976562, "global_step": 256259, "epoch": 1525} {"train_loss": -11.490496635437012, "global_step": 256260, "epoch": 1525} {"train_loss": -11.690080642700195, "global_step": 256261, "epoch": 1525} {"train_loss": -11.499805450439453, "global_step": 256262, "epoch": 1525} {"train_loss": -11.650400161743164, "global_step": 256263, "epoch": 1525} {"train_loss": -11.458662033081055, "global_step": 256264, "epoch": 1525} {"train_loss": -11.672642707824707, "global_step": 256265, "epoch": 1525} {"train_loss": -11.620736122131348, "global_step": 256266, "epoch": 1525} {"train_loss": -11.832756042480469, "global_step": 256267, "epoch": 1525} {"train_loss": -11.424169540405273, "global_step": 256268, "epoch": 1525} {"train_loss": -11.976842880249023, "global_step": 256269, "epoch": 1525} {"train_loss": -11.72061538696289, "global_step": 256270, "epoch": 1525} {"train_loss": -11.721853256225586, "global_step": 256271, "epoch": 1525} {"train_loss": -11.547916412353516, "global_step": 256272, "epoch": 1525} {"train_loss": -11.392189025878906, "global_step": 256273, "epoch": 1525} {"train_loss": -11.863304138183594, "global_step": 256274, "epoch": 1525} {"train_loss": -11.599407196044922, "global_step": 256275, "epoch": 1525} {"train_loss": -12.003683090209961, "global_step": 256276, "epoch": 1525} {"train_loss": -11.871688842773438, "global_step": 256277, "epoch": 1525} {"train_loss": -11.755151748657227, "global_step": 256278, "epoch": 1525} {"train_loss": -11.845458984375, "global_step": 256279, "epoch": 1525} {"train_loss": -12.035566329956055, "global_step": 256280, "epoch": 1525} {"train_loss": -11.832120895385742, "global_step": 256281, "epoch": 1525} {"train_loss": -11.936849594116211, "global_step": 256282, "epoch": 1525} {"train_loss": -11.749785423278809, "global_step": 256283, "epoch": 1525} {"train_loss": -11.917562484741211, "global_step": 256284, "epoch": 1525} {"train_loss": -11.77059555053711, "global_step": 256285, "epoch": 1525} {"train_loss": -11.998852729797363, "global_step": 256286, "epoch": 1525} {"train_loss": -11.791427612304688, "global_step": 256287, "epoch": 1525} {"train_loss": -11.923713684082031, "global_step": 256288, "epoch": 1525} {"train_loss": -11.880937576293945, "global_step": 256289, "epoch": 1525} {"train_loss": -12.15475845336914, "global_step": 256290, "epoch": 1525} {"train_loss": -11.921802520751953, "global_step": 256291, "epoch": 1525} {"train_loss": -12.131213188171387, "global_step": 256292, "epoch": 1525} {"train_loss": -12.163899421691895, "global_step": 256293, "epoch": 1525} {"train_loss": -12.105302810668945, "global_step": 256294, "epoch": 1525} {"train_loss": -12.079425811767578, "global_step": 256295, "epoch": 1525} {"train_loss": -12.169092178344727, "global_step": 256296, "epoch": 1525} {"train_loss": -12.17288589477539, "global_step": 256297, "epoch": 1525} {"train_loss": -12.025830268859863, "global_step": 256298, "epoch": 1525} {"train_loss": -12.158214569091797, "global_step": 256299, "epoch": 1525} {"train_loss": -12.249530792236328, "global_step": 256300, "epoch": 1525} {"train_loss": -11.954082489013672, "global_step": 256301, "epoch": 1525} {"train_loss": -12.190520286560059, "global_step": 256302, "epoch": 1525} {"train_loss": -11.992501258850098, "global_step": 256303, "epoch": 1525} {"train_loss": -12.391985893249512, "global_step": 256304, "epoch": 1525} {"train_loss": -12.295180320739746, "global_step": 256305, "epoch": 1525} {"train_loss": -12.158483505249023, "global_step": 256306, "epoch": 1525} {"train_loss": -12.196525573730469, "global_step": 256307, "epoch": 1525} {"train_loss": -12.050186157226562, "global_step": 256308, "epoch": 1525} {"train_loss": -12.086456298828125, "global_step": 256309, "epoch": 1525} {"train_loss": -12.068300247192383, "global_step": 256310, "epoch": 1525} {"train_loss": -11.613391876220703, "global_step": 256311, "epoch": 1525} {"train_loss": -12.012228965759277, "global_step": 256312, "epoch": 1525} {"train_loss": -12.141820907592773, "global_step": 256313, "epoch": 1525} {"train_loss": -11.549866676330566, "global_step": 256314, "epoch": 1525} {"train_loss": -11.674924850463867, "global_step": 256315, "epoch": 1525} {"train_loss": -12.037445068359375, "global_step": 256316, "epoch": 1525} {"train_loss": -12.037322998046875, "global_step": 256317, "epoch": 1525} {"train_loss": -11.726055145263672, "global_step": 256318, "epoch": 1525} {"train_loss": -11.889666557312012, "global_step": 256319, "epoch": 1525} {"train_loss": -11.885242462158203, "global_step": 256320, "epoch": 1525} {"train_loss": -11.463647842407227, "global_step": 256321, "epoch": 1525} {"train_loss": -12.020541191101074, "global_step": 256322, "epoch": 1525} {"train_loss": -11.698862075805664, "global_step": 256323, "epoch": 1525} {"train_loss": -11.578649520874023, "global_step": 256324, "epoch": 1525} {"train_loss": -12.147427558898926, "global_step": 256325, "epoch": 1525} {"train_loss": -10.946533203125, "global_step": 256326, "epoch": 1525} {"train_loss": -11.181964874267578, "global_step": 256327, "epoch": 1525} {"train_loss": -11.694147109985352, "global_step": 256328, "epoch": 1525} {"train_loss": -11.443367004394531, "global_step": 256329, "epoch": 1525} {"train_loss": -11.76223373413086, "global_step": 256330, "epoch": 1525} {"train_loss": -11.5969820022583, "global_step": 256331, "epoch": 1525} {"train_loss": -11.472658157348633, "global_step": 256332, "epoch": 1525} {"train_loss": -12.06273078918457, "global_step": 256333, "epoch": 1525} {"train_loss": -11.311050415039062, "global_step": 256334, "epoch": 1525} {"train_loss": -11.930727005004883, "global_step": 256335, "epoch": 1525} {"train_loss": -11.792691230773926, "global_step": 256336, "epoch": 1525} {"train_loss": -11.875326156616211, "global_step": 256337, "epoch": 1525} {"train_loss": -11.847189903259277, "global_step": 256338, "epoch": 1525} {"train_loss": -12.270600318908691, "global_step": 256339, "epoch": 1525} {"train_loss": -11.648212432861328, "global_step": 256340, "epoch": 1525} {"train_loss": -12.026190757751465, "global_step": 256341, "epoch": 1525} {"train_loss": -11.91358470916748, "global_step": 256342, "epoch": 1525} {"train_loss": -11.879737854003906, "global_step": 256343, "epoch": 1525} {"train_loss": -11.765748977661133, "global_step": 256344, "epoch": 1525} {"train_loss": -11.777397155761719, "global_step": 256345, "epoch": 1525} {"train_loss": -11.526796340942383, "global_step": 256346, "epoch": 1525} {"train_loss": -11.775632858276367, "global_step": 256347, "epoch": 1525} {"train_loss": -11.77785873413086, "global_step": 256348, "epoch": 1525} {"train_loss": -11.54818344116211, "global_step": 256349, "epoch": 1525} {"train_loss": -12.095349311828613, "global_step": 256350, "epoch": 1525} {"train_loss": -11.50515365600586, "global_step": 256351, "epoch": 1525} {"train_loss": -10.761383056640625, "global_step": 256352, "epoch": 1525} {"train_loss": -11.47192096710205, "global_step": 256353, "epoch": 1525} {"train_loss": -11.92766284942627, "global_step": 256354, "epoch": 1525} {"train_loss": -11.599124908447266, "global_step": 256355, "epoch": 1525} {"train_loss": -11.791959762573242, "global_step": 256356, "epoch": 1525} {"train_loss": -11.977622985839844, "global_step": 256357, "epoch": 1525} {"train_loss": -11.379185676574707, "global_step": 256358, "epoch": 1525} {"train_loss": -11.86679744720459, "global_step": 256359, "epoch": 1525} {"train_loss": -11.255847930908203, "global_step": 256360, "epoch": 1525} {"train_loss": -11.220996856689453, "global_step": 256361, "epoch": 1525} {"train_loss": -11.540000915527344, "global_step": 256362, "epoch": 1525} {"train_loss": -11.29419994354248, "global_step": 256363, "epoch": 1525} {"train_loss": -11.132891654968262, "global_step": 256364, "epoch": 1525} {"train_loss": -11.177024841308594, "global_step": 256365, "epoch": 1525} {"train_loss": -11.404084205627441, "global_step": 256366, "epoch": 1525} {"train_loss": -11.508581859724861, "global_step": 256367, "epoch": 1525, "val_loss": 269246.625, "train_action_mse_error": 0.9992234706878662} {"train_loss": -10.776193618774414, "global_step": 256368, "epoch": 1526} {"train_loss": -10.959394454956055, "global_step": 256369, "epoch": 1526} {"train_loss": -11.453371047973633, "global_step": 256370, "epoch": 1526} {"train_loss": -11.387619972229004, "global_step": 256371, "epoch": 1526} {"train_loss": -11.074602127075195, "global_step": 256372, "epoch": 1526} {"train_loss": -10.724267959594727, "global_step": 256373, "epoch": 1526} {"train_loss": -11.056580543518066, "global_step": 256374, "epoch": 1526} {"train_loss": -11.823944091796875, "global_step": 256375, "epoch": 1526} {"train_loss": -10.740030288696289, "global_step": 256376, "epoch": 1526} {"train_loss": -10.451496124267578, "global_step": 256377, "epoch": 1526} {"train_loss": -11.364778518676758, "global_step": 256378, "epoch": 1526} {"train_loss": -10.015180587768555, "global_step": 256379, "epoch": 1526} {"train_loss": -11.5242338180542, "global_step": 256380, "epoch": 1526} {"train_loss": -10.214838027954102, "global_step": 256381, "epoch": 1526} {"train_loss": -11.171812057495117, "global_step": 256382, "epoch": 1526} {"train_loss": -10.880117416381836, "global_step": 256383, "epoch": 1526} {"train_loss": -10.82425594329834, "global_step": 256384, "epoch": 1526} {"train_loss": -10.851343154907227, "global_step": 256385, "epoch": 1526} {"train_loss": -10.35348129272461, "global_step": 256386, "epoch": 1526} {"train_loss": -10.70238971710205, "global_step": 256387, "epoch": 1526} {"train_loss": -11.18700885772705, "global_step": 256388, "epoch": 1526} {"train_loss": -10.106365203857422, "global_step": 256389, "epoch": 1526} {"train_loss": -11.313091278076172, "global_step": 256390, "epoch": 1526} {"train_loss": -10.666425704956055, "global_step": 256391, "epoch": 1526} {"train_loss": -11.127239227294922, "global_step": 256392, "epoch": 1526} {"train_loss": -10.927202224731445, "global_step": 256393, "epoch": 1526} {"train_loss": -11.148857116699219, "global_step": 256394, "epoch": 1526} {"train_loss": -11.030683517456055, "global_step": 256395, "epoch": 1526} {"train_loss": -11.32520866394043, "global_step": 256396, "epoch": 1526} {"train_loss": -10.437088012695312, "global_step": 256397, "epoch": 1526} {"train_loss": -11.413664817810059, "global_step": 256398, "epoch": 1526} {"train_loss": -11.056699752807617, "global_step": 256399, "epoch": 1526} {"train_loss": -11.170564651489258, "global_step": 256400, "epoch": 1526} {"train_loss": -11.55228042602539, "global_step": 256401, "epoch": 1526} {"train_loss": -11.301884651184082, "global_step": 256402, "epoch": 1526} {"train_loss": -11.048822402954102, "global_step": 256403, "epoch": 1526} {"train_loss": -11.28262996673584, "global_step": 256404, "epoch": 1526} {"train_loss": -11.499547004699707, "global_step": 256405, "epoch": 1526} {"train_loss": -11.350826263427734, "global_step": 256406, "epoch": 1526} {"train_loss": -11.62701416015625, "global_step": 256407, "epoch": 1526} {"train_loss": -11.162454605102539, "global_step": 256408, "epoch": 1526} {"train_loss": -11.265332221984863, "global_step": 256409, "epoch": 1526} {"train_loss": -11.704015731811523, "global_step": 256410, "epoch": 1526} {"train_loss": -11.614974021911621, "global_step": 256411, "epoch": 1526} {"train_loss": -11.553150177001953, "global_step": 256412, "epoch": 1526} {"train_loss": -11.72102165222168, "global_step": 256413, "epoch": 1526} {"train_loss": -11.477136611938477, "global_step": 256414, "epoch": 1526} {"train_loss": -11.724634170532227, "global_step": 256415, "epoch": 1526} {"train_loss": -11.814593315124512, "global_step": 256416, "epoch": 1526} {"train_loss": -11.766336441040039, "global_step": 256417, "epoch": 1526} {"train_loss": -11.946643829345703, "global_step": 256418, "epoch": 1526} {"train_loss": -11.891746520996094, "global_step": 256419, "epoch": 1526} {"train_loss": -11.547196388244629, "global_step": 256420, "epoch": 1526} {"train_loss": -11.74308967590332, "global_step": 256421, "epoch": 1526} {"train_loss": -11.739910125732422, "global_step": 256422, "epoch": 1526} {"train_loss": -11.945801734924316, "global_step": 256423, "epoch": 1526} {"train_loss": -11.718070030212402, "global_step": 256424, "epoch": 1526} {"train_loss": -11.926084518432617, "global_step": 256425, "epoch": 1526} {"train_loss": -11.942834854125977, "global_step": 256426, "epoch": 1526} {"train_loss": -11.969818115234375, "global_step": 256427, "epoch": 1526} {"train_loss": -12.005104064941406, "global_step": 256428, "epoch": 1526} {"train_loss": -12.002243041992188, "global_step": 256429, "epoch": 1526} {"train_loss": -12.050783157348633, "global_step": 256430, "epoch": 1526} {"train_loss": -11.892404556274414, "global_step": 256431, "epoch": 1526} {"train_loss": -11.853170394897461, "global_step": 256432, "epoch": 1526} {"train_loss": -12.063905715942383, "global_step": 256433, "epoch": 1526} {"train_loss": -11.943559646606445, "global_step": 256434, "epoch": 1526} {"train_loss": -12.070789337158203, "global_step": 256435, "epoch": 1526} {"train_loss": -11.712721824645996, "global_step": 256436, "epoch": 1526} {"train_loss": -11.793146133422852, "global_step": 256437, "epoch": 1526} {"train_loss": -12.130666732788086, "global_step": 256438, "epoch": 1526} {"train_loss": -12.105064392089844, "global_step": 256439, "epoch": 1526} {"train_loss": -12.10577392578125, "global_step": 256440, "epoch": 1526} {"train_loss": -12.066116333007812, "global_step": 256441, "epoch": 1526} {"train_loss": -11.846725463867188, "global_step": 256442, "epoch": 1526} {"train_loss": -12.123851776123047, "global_step": 256443, "epoch": 1526} {"train_loss": -12.132112503051758, "global_step": 256444, "epoch": 1526} {"train_loss": -11.967677116394043, "global_step": 256445, "epoch": 1526} {"train_loss": -11.952326774597168, "global_step": 256446, "epoch": 1526} {"train_loss": -12.207557678222656, "global_step": 256447, "epoch": 1526} {"train_loss": -11.997856140136719, "global_step": 256448, "epoch": 1526} {"train_loss": -12.175071716308594, "global_step": 256449, "epoch": 1526} {"train_loss": -12.065960884094238, "global_step": 256450, "epoch": 1526} {"train_loss": -12.114381790161133, "global_step": 256451, "epoch": 1526} {"train_loss": -12.08223819732666, "global_step": 256452, "epoch": 1526} {"train_loss": -11.922492027282715, "global_step": 256453, "epoch": 1526} {"train_loss": -12.006092071533203, "global_step": 256454, "epoch": 1526} {"train_loss": -12.043989181518555, "global_step": 256455, "epoch": 1526} {"train_loss": -12.324713706970215, "global_step": 256456, "epoch": 1526} {"train_loss": -11.652299880981445, "global_step": 256457, "epoch": 1526} {"train_loss": -12.210628509521484, "global_step": 256458, "epoch": 1526} {"train_loss": -12.050275802612305, "global_step": 256459, "epoch": 1526} {"train_loss": -10.98298168182373, "global_step": 256460, "epoch": 1526} {"train_loss": -10.279598236083984, "global_step": 256461, "epoch": 1526} {"train_loss": -12.226126670837402, "global_step": 256462, "epoch": 1526} {"train_loss": -10.896728515625, "global_step": 256463, "epoch": 1526} {"train_loss": -11.512659072875977, "global_step": 256464, "epoch": 1526} {"train_loss": -11.937438011169434, "global_step": 256465, "epoch": 1526} {"train_loss": -11.874938011169434, "global_step": 256466, "epoch": 1526} {"train_loss": -11.503178596496582, "global_step": 256467, "epoch": 1526} {"train_loss": -11.858972549438477, "global_step": 256468, "epoch": 1526} {"train_loss": -12.083194732666016, "global_step": 256469, "epoch": 1526} {"train_loss": -11.716323852539062, "global_step": 256470, "epoch": 1526} {"train_loss": -11.977958679199219, "global_step": 256471, "epoch": 1526} {"train_loss": -11.391816139221191, "global_step": 256472, "epoch": 1526} {"train_loss": -12.108287811279297, "global_step": 256473, "epoch": 1526} {"train_loss": -11.668214797973633, "global_step": 256474, "epoch": 1526} {"train_loss": -11.240095138549805, "global_step": 256475, "epoch": 1526} {"train_loss": -11.713178634643555, "global_step": 256476, "epoch": 1526} {"train_loss": -11.144378662109375, "global_step": 256477, "epoch": 1526} {"train_loss": -10.000858306884766, "global_step": 256478, "epoch": 1526} {"train_loss": -10.296374320983887, "global_step": 256479, "epoch": 1526} {"train_loss": -11.514665603637695, "global_step": 256480, "epoch": 1526} {"train_loss": -10.573966979980469, "global_step": 256481, "epoch": 1526} {"train_loss": -11.509138107299805, "global_step": 256482, "epoch": 1526} {"train_loss": -10.098093032836914, "global_step": 256483, "epoch": 1526} {"train_loss": -10.143022537231445, "global_step": 256484, "epoch": 1526} {"train_loss": -10.777240753173828, "global_step": 256485, "epoch": 1526} {"train_loss": -10.148921966552734, "global_step": 256486, "epoch": 1526} {"train_loss": -10.09434700012207, "global_step": 256487, "epoch": 1526} {"train_loss": -9.730667114257812, "global_step": 256488, "epoch": 1526} {"train_loss": -11.112564086914062, "global_step": 256489, "epoch": 1526} {"train_loss": -10.981751441955566, "global_step": 256490, "epoch": 1526} {"train_loss": -10.992258071899414, "global_step": 256491, "epoch": 1526} {"train_loss": -9.658773422241211, "global_step": 256492, "epoch": 1526} {"train_loss": -10.182661056518555, "global_step": 256493, "epoch": 1526} {"train_loss": -10.884243965148926, "global_step": 256494, "epoch": 1526} {"train_loss": -10.61545467376709, "global_step": 256495, "epoch": 1526} {"train_loss": -11.224763870239258, "global_step": 256496, "epoch": 1526} {"train_loss": -10.748046875, "global_step": 256497, "epoch": 1526} {"train_loss": -10.823980331420898, "global_step": 256498, "epoch": 1526} {"train_loss": -11.708377838134766, "global_step": 256499, "epoch": 1526} {"train_loss": -10.528671264648438, "global_step": 256500, "epoch": 1526} {"train_loss": -11.53567123413086, "global_step": 256501, "epoch": 1526} {"train_loss": -10.676473617553711, "global_step": 256502, "epoch": 1526} {"train_loss": -10.968780517578125, "global_step": 256503, "epoch": 1526} {"train_loss": -11.432708740234375, "global_step": 256504, "epoch": 1526} {"train_loss": -10.981550216674805, "global_step": 256505, "epoch": 1526} {"train_loss": -11.519895553588867, "global_step": 256506, "epoch": 1526} {"train_loss": -11.756010055541992, "global_step": 256507, "epoch": 1526} {"train_loss": -11.191719055175781, "global_step": 256508, "epoch": 1526} {"train_loss": -11.579523086547852, "global_step": 256509, "epoch": 1526} {"train_loss": -11.203840255737305, "global_step": 256510, "epoch": 1526} {"train_loss": -11.597612380981445, "global_step": 256511, "epoch": 1526} {"train_loss": -11.67436408996582, "global_step": 256512, "epoch": 1526} {"train_loss": -11.689132690429688, "global_step": 256513, "epoch": 1526} {"train_loss": -11.693857192993164, "global_step": 256514, "epoch": 1526} {"train_loss": -11.856157302856445, "global_step": 256515, "epoch": 1526} {"train_loss": -11.526079177856445, "global_step": 256516, "epoch": 1526} {"train_loss": -11.760807037353516, "global_step": 256517, "epoch": 1526} {"train_loss": -11.754480361938477, "global_step": 256518, "epoch": 1526} {"train_loss": -11.622485160827637, "global_step": 256519, "epoch": 1526} {"train_loss": -11.864633560180664, "global_step": 256520, "epoch": 1526} {"train_loss": -11.638965606689453, "global_step": 256521, "epoch": 1526} {"train_loss": -11.742431640625, "global_step": 256522, "epoch": 1526} {"train_loss": -11.647439002990723, "global_step": 256523, "epoch": 1526} {"train_loss": -11.921831130981445, "global_step": 256524, "epoch": 1526} {"train_loss": -11.720290184020996, "global_step": 256525, "epoch": 1526} {"train_loss": -11.970596313476562, "global_step": 256526, "epoch": 1526} {"train_loss": -11.73197078704834, "global_step": 256527, "epoch": 1526} {"train_loss": -11.85726261138916, "global_step": 256528, "epoch": 1526} {"train_loss": -11.934694290161133, "global_step": 256529, "epoch": 1526} {"train_loss": -11.791166305541992, "global_step": 256530, "epoch": 1526} {"train_loss": -12.0361328125, "global_step": 256531, "epoch": 1526} {"train_loss": -11.925155639648438, "global_step": 256532, "epoch": 1526} {"train_loss": -11.765052795410156, "global_step": 256533, "epoch": 1526} {"train_loss": -11.691884994506836, "global_step": 256534, "epoch": 1526} {"train_loss": -11.42435904343923, "global_step": 256535, "epoch": 1526, "val_loss": 270050.4375} {"train_loss": -11.856874465942383, "global_step": 256536, "epoch": 1527} {"train_loss": -11.865286827087402, "global_step": 256537, "epoch": 1527} {"train_loss": -11.961774826049805, "global_step": 256538, "epoch": 1527} {"train_loss": -11.883393287658691, "global_step": 256539, "epoch": 1527} {"train_loss": -11.977025032043457, "global_step": 256540, "epoch": 1527} {"train_loss": -11.96561050415039, "global_step": 256541, "epoch": 1527} {"train_loss": -12.024262428283691, "global_step": 256542, "epoch": 1527} {"train_loss": -11.963424682617188, "global_step": 256543, "epoch": 1527} {"train_loss": -12.11281967163086, "global_step": 256544, "epoch": 1527} {"train_loss": -12.243698120117188, "global_step": 256545, "epoch": 1527} {"train_loss": -12.10788345336914, "global_step": 256546, "epoch": 1527} {"train_loss": -11.745874404907227, "global_step": 256547, "epoch": 1527} {"train_loss": -11.864294052124023, "global_step": 256548, "epoch": 1527} {"train_loss": -11.602533340454102, "global_step": 256549, "epoch": 1527} {"train_loss": -11.627788543701172, "global_step": 256550, "epoch": 1527} {"train_loss": -12.031126022338867, "global_step": 256551, "epoch": 1527} {"train_loss": -11.961885452270508, "global_step": 256552, "epoch": 1527} {"train_loss": -11.848163604736328, "global_step": 256553, "epoch": 1527} {"train_loss": -11.674018859863281, "global_step": 256554, "epoch": 1527} {"train_loss": -11.17513656616211, "global_step": 256555, "epoch": 1527} {"train_loss": -11.43993854522705, "global_step": 256556, "epoch": 1527} {"train_loss": -11.687503814697266, "global_step": 256557, "epoch": 1527} {"train_loss": -11.718582153320312, "global_step": 256558, "epoch": 1527} {"train_loss": -10.961617469787598, "global_step": 256559, "epoch": 1527} {"train_loss": -10.342438697814941, "global_step": 256560, "epoch": 1527} {"train_loss": -11.228612899780273, "global_step": 256561, "epoch": 1527} {"train_loss": -11.62576675415039, "global_step": 256562, "epoch": 1527} {"train_loss": -9.96630859375, "global_step": 256563, "epoch": 1527} {"train_loss": -11.60479736328125, "global_step": 256564, "epoch": 1527} {"train_loss": -11.233652114868164, "global_step": 256565, "epoch": 1527} {"train_loss": -10.923166275024414, "global_step": 256566, "epoch": 1527} {"train_loss": -11.897836685180664, "global_step": 256567, "epoch": 1527} {"train_loss": -11.480108261108398, "global_step": 256568, "epoch": 1527} {"train_loss": -11.779800415039062, "global_step": 256569, "epoch": 1527} {"train_loss": -11.289252281188965, "global_step": 256570, "epoch": 1527} {"train_loss": -11.995258331298828, "global_step": 256571, "epoch": 1527} {"train_loss": -11.980392456054688, "global_step": 256572, "epoch": 1527} {"train_loss": -11.689126014709473, "global_step": 256573, "epoch": 1527} {"train_loss": -11.727862358093262, "global_step": 256574, "epoch": 1527} {"train_loss": -11.722859382629395, "global_step": 256575, "epoch": 1527} {"train_loss": -11.972881317138672, "global_step": 256576, "epoch": 1527} {"train_loss": -11.77751636505127, "global_step": 256577, "epoch": 1527} {"train_loss": -12.006409645080566, "global_step": 256578, "epoch": 1527} {"train_loss": -11.798463821411133, "global_step": 256579, "epoch": 1527} {"train_loss": -11.661798477172852, "global_step": 256580, "epoch": 1527} {"train_loss": -11.785844802856445, "global_step": 256581, "epoch": 1527} {"train_loss": -11.80992603302002, "global_step": 256582, "epoch": 1527} {"train_loss": -11.729881286621094, "global_step": 256583, "epoch": 1527} {"train_loss": -11.94894027709961, "global_step": 256584, "epoch": 1527} {"train_loss": -11.659904479980469, "global_step": 256585, "epoch": 1527} {"train_loss": -12.323101043701172, "global_step": 256586, "epoch": 1527} {"train_loss": -12.068903923034668, "global_step": 256587, "epoch": 1527} {"train_loss": -12.156133651733398, "global_step": 256588, "epoch": 1527} {"train_loss": -12.053747177124023, "global_step": 256589, "epoch": 1527} {"train_loss": -11.997447967529297, "global_step": 256590, "epoch": 1527} {"train_loss": -12.202279090881348, "global_step": 256591, "epoch": 1527} {"train_loss": -12.145822525024414, "global_step": 256592, "epoch": 1527} {"train_loss": -11.948781967163086, "global_step": 256593, "epoch": 1527} {"train_loss": -11.906957626342773, "global_step": 256594, "epoch": 1527} {"train_loss": -12.060420989990234, "global_step": 256595, "epoch": 1527} {"train_loss": -12.005216598510742, "global_step": 256596, "epoch": 1527} {"train_loss": -12.057178497314453, "global_step": 256597, "epoch": 1527} {"train_loss": -11.973821640014648, "global_step": 256598, "epoch": 1527} {"train_loss": -12.196165084838867, "global_step": 256599, "epoch": 1527} {"train_loss": -12.011646270751953, "global_step": 256600, "epoch": 1527} {"train_loss": -12.239303588867188, "global_step": 256601, "epoch": 1527} {"train_loss": -12.220230102539062, "global_step": 256602, "epoch": 1527} {"train_loss": -12.059155464172363, "global_step": 256603, "epoch": 1527} {"train_loss": -12.129884719848633, "global_step": 256604, "epoch": 1527} {"train_loss": -12.129964828491211, "global_step": 256605, "epoch": 1527} {"train_loss": -11.852691650390625, "global_step": 256606, "epoch": 1527} {"train_loss": -12.016404151916504, "global_step": 256607, "epoch": 1527} {"train_loss": -12.011606216430664, "global_step": 256608, "epoch": 1527} {"train_loss": -11.981887817382812, "global_step": 256609, "epoch": 1527} {"train_loss": -12.278478622436523, "global_step": 256610, "epoch": 1527} {"train_loss": -12.01498031616211, "global_step": 256611, "epoch": 1527} {"train_loss": -12.05616569519043, "global_step": 256612, "epoch": 1527} {"train_loss": -12.078878402709961, "global_step": 256613, "epoch": 1527} {"train_loss": -12.025991439819336, "global_step": 256614, "epoch": 1527} {"train_loss": -11.997031211853027, "global_step": 256615, "epoch": 1527} {"train_loss": -11.773605346679688, "global_step": 256616, "epoch": 1527} {"train_loss": -12.121402740478516, "global_step": 256617, "epoch": 1527} {"train_loss": -11.802133560180664, "global_step": 256618, "epoch": 1527} {"train_loss": -11.779289245605469, "global_step": 256619, "epoch": 1527} {"train_loss": -11.806571960449219, "global_step": 256620, "epoch": 1527} {"train_loss": -11.746664047241211, "global_step": 256621, "epoch": 1527} {"train_loss": -11.943231582641602, "global_step": 256622, "epoch": 1527} {"train_loss": -11.675840377807617, "global_step": 256623, "epoch": 1527} {"train_loss": -12.067232131958008, "global_step": 256624, "epoch": 1527} {"train_loss": -12.098102569580078, "global_step": 256625, "epoch": 1527} {"train_loss": -11.840421676635742, "global_step": 256626, "epoch": 1527} {"train_loss": -11.62210464477539, "global_step": 256627, "epoch": 1527} {"train_loss": -12.036134719848633, "global_step": 256628, "epoch": 1527} {"train_loss": -12.024518013000488, "global_step": 256629, "epoch": 1527} {"train_loss": -11.86343002319336, "global_step": 256630, "epoch": 1527} {"train_loss": -11.877187728881836, "global_step": 256631, "epoch": 1527} {"train_loss": -12.034581184387207, "global_step": 256632, "epoch": 1527} {"train_loss": -11.32883358001709, "global_step": 256633, "epoch": 1527} {"train_loss": -11.976213455200195, "global_step": 256634, "epoch": 1527} {"train_loss": -11.652753829956055, "global_step": 256635, "epoch": 1527} {"train_loss": -11.529521942138672, "global_step": 256636, "epoch": 1527} {"train_loss": -11.606969833374023, "global_step": 256637, "epoch": 1527} {"train_loss": -10.46970272064209, "global_step": 256638, "epoch": 1527} {"train_loss": -11.704227447509766, "global_step": 256639, "epoch": 1527} {"train_loss": -11.27320671081543, "global_step": 256640, "epoch": 1527} {"train_loss": -10.651586532592773, "global_step": 256641, "epoch": 1527} {"train_loss": -11.346056938171387, "global_step": 256642, "epoch": 1527} {"train_loss": -9.642314910888672, "global_step": 256643, "epoch": 1527} {"train_loss": -11.560674667358398, "global_step": 256644, "epoch": 1527} {"train_loss": -9.9718017578125, "global_step": 256645, "epoch": 1527} {"train_loss": -10.531872749328613, "global_step": 256646, "epoch": 1527} {"train_loss": -10.222126007080078, "global_step": 256647, "epoch": 1527} {"train_loss": -10.516714096069336, "global_step": 256648, "epoch": 1527} {"train_loss": -9.834197998046875, "global_step": 256649, "epoch": 1527} {"train_loss": -10.36882209777832, "global_step": 256650, "epoch": 1527} {"train_loss": -9.265915870666504, "global_step": 256651, "epoch": 1527} {"train_loss": -7.065561294555664, "global_step": 256652, "epoch": 1527} {"train_loss": -7.013396263122559, "global_step": 256653, "epoch": 1527} {"train_loss": -7.5860443115234375, "global_step": 256654, "epoch": 1527} {"train_loss": -7.16201114654541, "global_step": 256655, "epoch": 1527} {"train_loss": -6.812732696533203, "global_step": 256656, "epoch": 1527} {"train_loss": -7.743838310241699, "global_step": 256657, "epoch": 1527} {"train_loss": -7.417372226715088, "global_step": 256658, "epoch": 1527} {"train_loss": -8.202228546142578, "global_step": 256659, "epoch": 1527} {"train_loss": -9.889772415161133, "global_step": 256660, "epoch": 1527} {"train_loss": -9.935945510864258, "global_step": 256661, "epoch": 1527} {"train_loss": -8.738380432128906, "global_step": 256662, "epoch": 1527} {"train_loss": -9.197406768798828, "global_step": 256663, "epoch": 1527} {"train_loss": -10.266923904418945, "global_step": 256664, "epoch": 1527} {"train_loss": -9.670309066772461, "global_step": 256665, "epoch": 1527} {"train_loss": -8.235326766967773, "global_step": 256666, "epoch": 1527} {"train_loss": -10.152098655700684, "global_step": 256667, "epoch": 1527} {"train_loss": -10.691036224365234, "global_step": 256668, "epoch": 1527} {"train_loss": -9.794241905212402, "global_step": 256669, "epoch": 1527} {"train_loss": -10.920515060424805, "global_step": 256670, "epoch": 1527} {"train_loss": -10.488443374633789, "global_step": 256671, "epoch": 1527} {"train_loss": -9.797076225280762, "global_step": 256672, "epoch": 1527} {"train_loss": -11.319475173950195, "global_step": 256673, "epoch": 1527} {"train_loss": -10.548393249511719, "global_step": 256674, "epoch": 1527} {"train_loss": -10.728906631469727, "global_step": 256675, "epoch": 1527} {"train_loss": -11.151714324951172, "global_step": 256676, "epoch": 1527} {"train_loss": -10.865842819213867, "global_step": 256677, "epoch": 1527} {"train_loss": -10.906380653381348, "global_step": 256678, "epoch": 1527} {"train_loss": -10.83497142791748, "global_step": 256679, "epoch": 1527} {"train_loss": -11.00732421875, "global_step": 256680, "epoch": 1527} {"train_loss": -11.176036834716797, "global_step": 256681, "epoch": 1527} {"train_loss": -11.093094825744629, "global_step": 256682, "epoch": 1527} {"train_loss": -11.177947044372559, "global_step": 256683, "epoch": 1527} {"train_loss": -11.086149215698242, "global_step": 256684, "epoch": 1527} {"train_loss": -11.306089401245117, "global_step": 256685, "epoch": 1527} {"train_loss": -11.219900131225586, "global_step": 256686, "epoch": 1527} {"train_loss": -11.501188278198242, "global_step": 256687, "epoch": 1527} {"train_loss": -11.660778045654297, "global_step": 256688, "epoch": 1527} {"train_loss": -11.537454605102539, "global_step": 256689, "epoch": 1527} {"train_loss": -11.723261833190918, "global_step": 256690, "epoch": 1527} {"train_loss": -11.390646934509277, "global_step": 256691, "epoch": 1527} {"train_loss": -11.611629486083984, "global_step": 256692, "epoch": 1527} {"train_loss": -11.573240280151367, "global_step": 256693, "epoch": 1527} {"train_loss": -11.360441207885742, "global_step": 256694, "epoch": 1527} {"train_loss": -11.754887580871582, "global_step": 256695, "epoch": 1527} {"train_loss": -11.640046119689941, "global_step": 256696, "epoch": 1527} {"train_loss": -11.450967788696289, "global_step": 256697, "epoch": 1527} {"train_loss": -11.764078140258789, "global_step": 256698, "epoch": 1527} {"train_loss": -11.842212677001953, "global_step": 256699, "epoch": 1527} {"train_loss": -11.712132453918457, "global_step": 256700, "epoch": 1527} {"train_loss": -11.59695053100586, "global_step": 256701, "epoch": 1527} {"train_loss": -11.670949935913086, "global_step": 256702, "epoch": 1527} {"train_loss": -11.263775544507164, "global_step": 256703, "epoch": 1527, "val_loss": 253161.59375} {"train_loss": -11.684405326843262, "global_step": 256704, "epoch": 1528} {"train_loss": -11.970438003540039, "global_step": 256705, "epoch": 1528} {"train_loss": -11.814037322998047, "global_step": 256706, "epoch": 1528} {"train_loss": -11.734070777893066, "global_step": 256707, "epoch": 1528} {"train_loss": -11.887020111083984, "global_step": 256708, "epoch": 1528} {"train_loss": -11.940102577209473, "global_step": 256709, "epoch": 1528} {"train_loss": -11.98105239868164, "global_step": 256710, "epoch": 1528} {"train_loss": -11.510175704956055, "global_step": 256711, "epoch": 1528} {"train_loss": -11.949625968933105, "global_step": 256712, "epoch": 1528} {"train_loss": -11.924903869628906, "global_step": 256713, "epoch": 1528} {"train_loss": -12.014253616333008, "global_step": 256714, "epoch": 1528} {"train_loss": -11.874784469604492, "global_step": 256715, "epoch": 1528} {"train_loss": -11.792481422424316, "global_step": 256716, "epoch": 1528} {"train_loss": -12.02818489074707, "global_step": 256717, "epoch": 1528} {"train_loss": -12.013387680053711, "global_step": 256718, "epoch": 1528} {"train_loss": -11.916254043579102, "global_step": 256719, "epoch": 1528} {"train_loss": -12.050882339477539, "global_step": 256720, "epoch": 1528} {"train_loss": -12.007783889770508, "global_step": 256721, "epoch": 1528} {"train_loss": -11.977039337158203, "global_step": 256722, "epoch": 1528} {"train_loss": -11.989225387573242, "global_step": 256723, "epoch": 1528} {"train_loss": -12.034351348876953, "global_step": 256724, "epoch": 1528} {"train_loss": -11.852654457092285, "global_step": 256725, "epoch": 1528} {"train_loss": -11.823835372924805, "global_step": 256726, "epoch": 1528} {"train_loss": -11.935929298400879, "global_step": 256727, "epoch": 1528} {"train_loss": -11.96406078338623, "global_step": 256728, "epoch": 1528} {"train_loss": -11.900089263916016, "global_step": 256729, "epoch": 1528} {"train_loss": -12.147314071655273, "global_step": 256730, "epoch": 1528} {"train_loss": -11.79212760925293, "global_step": 256731, "epoch": 1528} {"train_loss": -12.14374828338623, "global_step": 256732, "epoch": 1528} {"train_loss": -12.04150390625, "global_step": 256733, "epoch": 1528} {"train_loss": -11.939178466796875, "global_step": 256734, "epoch": 1528} {"train_loss": -12.152311325073242, "global_step": 256735, "epoch": 1528} {"train_loss": -12.040552139282227, "global_step": 256736, "epoch": 1528} {"train_loss": -12.055739402770996, "global_step": 256737, "epoch": 1528} {"train_loss": -12.123385429382324, "global_step": 256738, "epoch": 1528} {"train_loss": -12.02527904510498, "global_step": 256739, "epoch": 1528} {"train_loss": -11.926898956298828, "global_step": 256740, "epoch": 1528} {"train_loss": -12.182710647583008, "global_step": 256741, "epoch": 1528} {"train_loss": -11.951529502868652, "global_step": 256742, "epoch": 1528} {"train_loss": -12.152400016784668, "global_step": 256743, "epoch": 1528} {"train_loss": -11.783123016357422, "global_step": 256744, "epoch": 1528} {"train_loss": -12.02395248413086, "global_step": 256745, "epoch": 1528} {"train_loss": -11.890460014343262, "global_step": 256746, "epoch": 1528} {"train_loss": -12.213678359985352, "global_step": 256747, "epoch": 1528} {"train_loss": -11.871129035949707, "global_step": 256748, "epoch": 1528} {"train_loss": -11.607256889343262, "global_step": 256749, "epoch": 1528} {"train_loss": -11.706099510192871, "global_step": 256750, "epoch": 1528} {"train_loss": -12.1627197265625, "global_step": 256751, "epoch": 1528} {"train_loss": -12.281232833862305, "global_step": 256752, "epoch": 1528} {"train_loss": -12.092876434326172, "global_step": 256753, "epoch": 1528} {"train_loss": -12.114785194396973, "global_step": 256754, "epoch": 1528} {"train_loss": -12.295175552368164, "global_step": 256755, "epoch": 1528} {"train_loss": -12.144967079162598, "global_step": 256756, "epoch": 1528} {"train_loss": -11.948083877563477, "global_step": 256757, "epoch": 1528} {"train_loss": -12.23302936553955, "global_step": 256758, "epoch": 1528} {"train_loss": -12.259891510009766, "global_step": 256759, "epoch": 1528} {"train_loss": -12.046792984008789, "global_step": 256760, "epoch": 1528} {"train_loss": -12.068798065185547, "global_step": 256761, "epoch": 1528} {"train_loss": -12.138296127319336, "global_step": 256762, "epoch": 1528} {"train_loss": -12.14317512512207, "global_step": 256763, "epoch": 1528} {"train_loss": -12.158998489379883, "global_step": 256764, "epoch": 1528} {"train_loss": -12.313545227050781, "global_step": 256765, "epoch": 1528} {"train_loss": -12.343337059020996, "global_step": 256766, "epoch": 1528} {"train_loss": -12.273516654968262, "global_step": 256767, "epoch": 1528} {"train_loss": -12.268168449401855, "global_step": 256768, "epoch": 1528} {"train_loss": -12.118839263916016, "global_step": 256769, "epoch": 1528} {"train_loss": -12.39372444152832, "global_step": 256770, "epoch": 1528} {"train_loss": -12.298568725585938, "global_step": 256771, "epoch": 1528} {"train_loss": -12.32960033416748, "global_step": 256772, "epoch": 1528} {"train_loss": -12.404472351074219, "global_step": 256773, "epoch": 1528} {"train_loss": -12.235795974731445, "global_step": 256774, "epoch": 1528} {"train_loss": -12.428936004638672, "global_step": 256775, "epoch": 1528} {"train_loss": -12.054732322692871, "global_step": 256776, "epoch": 1528} {"train_loss": -12.346254348754883, "global_step": 256777, "epoch": 1528} {"train_loss": -12.329379081726074, "global_step": 256778, "epoch": 1528} {"train_loss": -12.260886192321777, "global_step": 256779, "epoch": 1528} {"train_loss": -12.124513626098633, "global_step": 256780, "epoch": 1528} {"train_loss": -12.168681144714355, "global_step": 256781, "epoch": 1528} {"train_loss": -12.426610946655273, "global_step": 256782, "epoch": 1528} {"train_loss": -12.14583969116211, "global_step": 256783, "epoch": 1528} {"train_loss": -11.513912200927734, "global_step": 256784, "epoch": 1528} {"train_loss": -11.999983787536621, "global_step": 256785, "epoch": 1528} {"train_loss": -10.908060073852539, "global_step": 256786, "epoch": 1528} {"train_loss": -11.180657386779785, "global_step": 256787, "epoch": 1528} {"train_loss": -8.487305641174316, "global_step": 256788, "epoch": 1528} {"train_loss": -8.306118965148926, "global_step": 256789, "epoch": 1528} {"train_loss": -8.553657531738281, "global_step": 256790, "epoch": 1528} {"train_loss": -9.143991470336914, "global_step": 256791, "epoch": 1528} {"train_loss": -11.049257278442383, "global_step": 256792, "epoch": 1528} {"train_loss": -10.375923156738281, "global_step": 256793, "epoch": 1528} {"train_loss": -10.710936546325684, "global_step": 256794, "epoch": 1528} {"train_loss": -10.874931335449219, "global_step": 256795, "epoch": 1528} {"train_loss": -9.446942329406738, "global_step": 256796, "epoch": 1528} {"train_loss": -11.35200309753418, "global_step": 256797, "epoch": 1528} {"train_loss": -10.059123992919922, "global_step": 256798, "epoch": 1528} {"train_loss": -9.929420471191406, "global_step": 256799, "epoch": 1528} {"train_loss": -9.306123733520508, "global_step": 256800, "epoch": 1528} {"train_loss": -11.601532936096191, "global_step": 256801, "epoch": 1528} {"train_loss": -8.983946800231934, "global_step": 256802, "epoch": 1528} {"train_loss": -9.822858810424805, "global_step": 256803, "epoch": 1528} {"train_loss": -10.357675552368164, "global_step": 256804, "epoch": 1528} {"train_loss": -9.218548774719238, "global_step": 256805, "epoch": 1528} {"train_loss": -9.06629467010498, "global_step": 256806, "epoch": 1528} {"train_loss": -10.75084400177002, "global_step": 256807, "epoch": 1528} {"train_loss": -8.48363971710205, "global_step": 256808, "epoch": 1528} {"train_loss": -9.88394546508789, "global_step": 256809, "epoch": 1528} {"train_loss": -9.203575134277344, "global_step": 256810, "epoch": 1528} {"train_loss": -11.240208625793457, "global_step": 256811, "epoch": 1528} {"train_loss": -9.596809387207031, "global_step": 256812, "epoch": 1528} {"train_loss": -9.665617942810059, "global_step": 256813, "epoch": 1528} {"train_loss": -9.734565734863281, "global_step": 256814, "epoch": 1528} {"train_loss": -10.602521896362305, "global_step": 256815, "epoch": 1528} {"train_loss": -9.554987907409668, "global_step": 256816, "epoch": 1528} {"train_loss": -11.221813201904297, "global_step": 256817, "epoch": 1528} {"train_loss": -10.507688522338867, "global_step": 256818, "epoch": 1528} {"train_loss": -10.528051376342773, "global_step": 256819, "epoch": 1528} {"train_loss": -11.148290634155273, "global_step": 256820, "epoch": 1528} {"train_loss": -11.23533821105957, "global_step": 256821, "epoch": 1528} {"train_loss": -10.937521934509277, "global_step": 256822, "epoch": 1528} {"train_loss": -11.372121810913086, "global_step": 256823, "epoch": 1528} {"train_loss": -10.799056053161621, "global_step": 256824, "epoch": 1528} {"train_loss": -10.662160873413086, "global_step": 256825, "epoch": 1528} {"train_loss": -11.097840309143066, "global_step": 256826, "epoch": 1528} {"train_loss": -11.135014533996582, "global_step": 256827, "epoch": 1528} {"train_loss": -10.81109619140625, "global_step": 256828, "epoch": 1528} {"train_loss": -11.196338653564453, "global_step": 256829, "epoch": 1528} {"train_loss": -11.548937797546387, "global_step": 256830, "epoch": 1528} {"train_loss": -11.308480262756348, "global_step": 256831, "epoch": 1528} {"train_loss": -11.322175979614258, "global_step": 256832, "epoch": 1528} {"train_loss": -11.541971206665039, "global_step": 256833, "epoch": 1528} {"train_loss": -11.466943740844727, "global_step": 256834, "epoch": 1528} {"train_loss": -11.214534759521484, "global_step": 256835, "epoch": 1528} {"train_loss": -11.514952659606934, "global_step": 256836, "epoch": 1528} {"train_loss": -11.566649436950684, "global_step": 256837, "epoch": 1528} {"train_loss": -11.018013954162598, "global_step": 256838, "epoch": 1528} {"train_loss": -11.130277633666992, "global_step": 256839, "epoch": 1528} {"train_loss": -11.660429000854492, "global_step": 256840, "epoch": 1528} {"train_loss": -11.422479629516602, "global_step": 256841, "epoch": 1528} {"train_loss": -11.30502700805664, "global_step": 256842, "epoch": 1528} {"train_loss": -11.804258346557617, "global_step": 256843, "epoch": 1528} {"train_loss": -11.340274810791016, "global_step": 256844, "epoch": 1528} {"train_loss": -11.710278511047363, "global_step": 256845, "epoch": 1528} {"train_loss": -11.47406005859375, "global_step": 256846, "epoch": 1528} {"train_loss": -11.468226432800293, "global_step": 256847, "epoch": 1528} {"train_loss": -11.543312072753906, "global_step": 256848, "epoch": 1528} {"train_loss": -11.554213523864746, "global_step": 256849, "epoch": 1528} {"train_loss": -11.691789627075195, "global_step": 256850, "epoch": 1528} {"train_loss": -11.482831954956055, "global_step": 256851, "epoch": 1528} {"train_loss": -11.69834041595459, "global_step": 256852, "epoch": 1528} {"train_loss": -11.894887924194336, "global_step": 256853, "epoch": 1528} {"train_loss": -11.62972640991211, "global_step": 256854, "epoch": 1528} {"train_loss": -11.713912963867188, "global_step": 256855, "epoch": 1528} {"train_loss": -11.494970321655273, "global_step": 256856, "epoch": 1528} {"train_loss": -11.633123397827148, "global_step": 256857, "epoch": 1528} {"train_loss": -11.739348411560059, "global_step": 256858, "epoch": 1528} {"train_loss": -11.57678508758545, "global_step": 256859, "epoch": 1528} {"train_loss": -11.693429946899414, "global_step": 256860, "epoch": 1528} {"train_loss": -11.644302368164062, "global_step": 256861, "epoch": 1528} {"train_loss": -11.839091300964355, "global_step": 256862, "epoch": 1528} {"train_loss": -11.797920227050781, "global_step": 256863, "epoch": 1528} {"train_loss": -11.517187118530273, "global_step": 256864, "epoch": 1528} {"train_loss": -11.855498313903809, "global_step": 256865, "epoch": 1528} {"train_loss": -11.920503616333008, "global_step": 256866, "epoch": 1528} {"train_loss": -11.866435050964355, "global_step": 256867, "epoch": 1528} {"train_loss": -11.830695152282715, "global_step": 256868, "epoch": 1528} {"train_loss": -11.914022445678711, "global_step": 256869, "epoch": 1528} {"train_loss": -11.802558898925781, "global_step": 256870, "epoch": 1528} {"train_loss": -11.458776434262594, "global_step": 256871, "epoch": 1528, "val_loss": 268544.6875} {"train_loss": -11.912287712097168, "global_step": 256872, "epoch": 1529} {"train_loss": -12.039682388305664, "global_step": 256873, "epoch": 1529} {"train_loss": -11.722555160522461, "global_step": 256874, "epoch": 1529} {"train_loss": -11.484084129333496, "global_step": 256875, "epoch": 1529} {"train_loss": -12.006429672241211, "global_step": 256876, "epoch": 1529} {"train_loss": -11.455873489379883, "global_step": 256877, "epoch": 1529} {"train_loss": -11.637452125549316, "global_step": 256878, "epoch": 1529} {"train_loss": -11.930912971496582, "global_step": 256879, "epoch": 1529} {"train_loss": -11.511395454406738, "global_step": 256880, "epoch": 1529} {"train_loss": -12.019333839416504, "global_step": 256881, "epoch": 1529} {"train_loss": -12.073892593383789, "global_step": 256882, "epoch": 1529} {"train_loss": -12.03106689453125, "global_step": 256883, "epoch": 1529} {"train_loss": -12.043084144592285, "global_step": 256884, "epoch": 1529} {"train_loss": -11.905052185058594, "global_step": 256885, "epoch": 1529} {"train_loss": -11.709243774414062, "global_step": 256886, "epoch": 1529} {"train_loss": -12.084758758544922, "global_step": 256887, "epoch": 1529} {"train_loss": -12.01921272277832, "global_step": 256888, "epoch": 1529} {"train_loss": -11.950979232788086, "global_step": 256889, "epoch": 1529} {"train_loss": -12.052906036376953, "global_step": 256890, "epoch": 1529} {"train_loss": -11.810629844665527, "global_step": 256891, "epoch": 1529} {"train_loss": -11.392839431762695, "global_step": 256892, "epoch": 1529} {"train_loss": -12.048420906066895, "global_step": 256893, "epoch": 1529} {"train_loss": -11.319201469421387, "global_step": 256894, "epoch": 1529} {"train_loss": -11.293212890625, "global_step": 256895, "epoch": 1529} {"train_loss": -12.122032165527344, "global_step": 256896, "epoch": 1529} {"train_loss": -11.963815689086914, "global_step": 256897, "epoch": 1529} {"train_loss": -11.729793548583984, "global_step": 256898, "epoch": 1529} {"train_loss": -12.202951431274414, "global_step": 256899, "epoch": 1529} {"train_loss": -11.733875274658203, "global_step": 256900, "epoch": 1529} {"train_loss": -11.728114128112793, "global_step": 256901, "epoch": 1529} {"train_loss": -11.448817253112793, "global_step": 256902, "epoch": 1529} {"train_loss": -12.100353240966797, "global_step": 256903, "epoch": 1529} {"train_loss": -11.68258285522461, "global_step": 256904, "epoch": 1529} {"train_loss": -11.708718299865723, "global_step": 256905, "epoch": 1529} {"train_loss": -12.058300018310547, "global_step": 256906, "epoch": 1529} {"train_loss": -11.390246391296387, "global_step": 256907, "epoch": 1529} {"train_loss": -12.0189208984375, "global_step": 256908, "epoch": 1529} {"train_loss": -11.13015079498291, "global_step": 256909, "epoch": 1529} {"train_loss": -11.98141098022461, "global_step": 256910, "epoch": 1529} {"train_loss": -11.785937309265137, "global_step": 256911, "epoch": 1529} {"train_loss": -11.548164367675781, "global_step": 256912, "epoch": 1529} {"train_loss": -11.619152069091797, "global_step": 256913, "epoch": 1529} {"train_loss": -12.167848587036133, "global_step": 256914, "epoch": 1529} {"train_loss": -12.179028511047363, "global_step": 256915, "epoch": 1529} {"train_loss": -11.911001205444336, "global_step": 256916, "epoch": 1529} {"train_loss": -12.203214645385742, "global_step": 256917, "epoch": 1529} {"train_loss": -11.923379898071289, "global_step": 256918, "epoch": 1529} {"train_loss": -11.416791915893555, "global_step": 256919, "epoch": 1529} {"train_loss": -11.492231369018555, "global_step": 256920, "epoch": 1529} {"train_loss": -12.180572509765625, "global_step": 256921, "epoch": 1529} {"train_loss": -11.2501802444458, "global_step": 256922, "epoch": 1529} {"train_loss": -11.632425308227539, "global_step": 256923, "epoch": 1529} {"train_loss": -11.459939956665039, "global_step": 256924, "epoch": 1529} {"train_loss": -12.034002304077148, "global_step": 256925, "epoch": 1529} {"train_loss": -11.625753402709961, "global_step": 256926, "epoch": 1529} {"train_loss": -11.17390251159668, "global_step": 256927, "epoch": 1529} {"train_loss": -11.57719898223877, "global_step": 256928, "epoch": 1529} {"train_loss": -11.687701225280762, "global_step": 256929, "epoch": 1529} {"train_loss": -10.460123062133789, "global_step": 256930, "epoch": 1529} {"train_loss": -11.503637313842773, "global_step": 256931, "epoch": 1529} {"train_loss": -10.897427558898926, "global_step": 256932, "epoch": 1529} {"train_loss": -11.302664756774902, "global_step": 256933, "epoch": 1529} {"train_loss": -11.31840705871582, "global_step": 256934, "epoch": 1529} {"train_loss": -10.403141975402832, "global_step": 256935, "epoch": 1529} {"train_loss": -11.612458229064941, "global_step": 256936, "epoch": 1529} {"train_loss": -10.819276809692383, "global_step": 256937, "epoch": 1529} {"train_loss": -11.880595207214355, "global_step": 256938, "epoch": 1529} {"train_loss": -11.103772163391113, "global_step": 256939, "epoch": 1529} {"train_loss": -11.337447166442871, "global_step": 256940, "epoch": 1529} {"train_loss": -11.78911018371582, "global_step": 256941, "epoch": 1529} {"train_loss": -11.784721374511719, "global_step": 256942, "epoch": 1529} {"train_loss": -11.477605819702148, "global_step": 256943, "epoch": 1529} {"train_loss": -11.914789199829102, "global_step": 256944, "epoch": 1529} {"train_loss": -11.697781562805176, "global_step": 256945, "epoch": 1529} {"train_loss": -11.687935829162598, "global_step": 256946, "epoch": 1529} {"train_loss": -11.742688179016113, "global_step": 256947, "epoch": 1529} {"train_loss": -11.481122016906738, "global_step": 256948, "epoch": 1529} {"train_loss": -12.062885284423828, "global_step": 256949, "epoch": 1529} {"train_loss": -11.228906631469727, "global_step": 256950, "epoch": 1529} {"train_loss": -11.081571578979492, "global_step": 256951, "epoch": 1529} {"train_loss": -12.125321388244629, "global_step": 256952, "epoch": 1529} {"train_loss": -11.265016555786133, "global_step": 256953, "epoch": 1529} {"train_loss": -11.37698745727539, "global_step": 256954, "epoch": 1529} {"train_loss": -11.467671394348145, "global_step": 256955, "epoch": 1529} {"train_loss": -11.707401275634766, "global_step": 256956, "epoch": 1529} {"train_loss": -11.130403518676758, "global_step": 256957, "epoch": 1529} {"train_loss": -11.11146068572998, "global_step": 256958, "epoch": 1529} {"train_loss": -11.27383804321289, "global_step": 256959, "epoch": 1529} {"train_loss": -10.420745849609375, "global_step": 256960, "epoch": 1529} {"train_loss": -11.060558319091797, "global_step": 256961, "epoch": 1529} {"train_loss": -10.484075546264648, "global_step": 256962, "epoch": 1529} {"train_loss": -10.984357833862305, "global_step": 256963, "epoch": 1529} {"train_loss": -10.55903148651123, "global_step": 256964, "epoch": 1529} {"train_loss": -10.980690002441406, "global_step": 256965, "epoch": 1529} {"train_loss": -11.359888076782227, "global_step": 256966, "epoch": 1529} {"train_loss": -10.713330268859863, "global_step": 256967, "epoch": 1529} {"train_loss": -11.207633018493652, "global_step": 256968, "epoch": 1529} {"train_loss": -11.602521896362305, "global_step": 256969, "epoch": 1529} {"train_loss": -11.091301918029785, "global_step": 256970, "epoch": 1529} {"train_loss": -11.755611419677734, "global_step": 256971, "epoch": 1529} {"train_loss": -11.59164047241211, "global_step": 256972, "epoch": 1529} {"train_loss": -11.661704063415527, "global_step": 256973, "epoch": 1529} {"train_loss": -11.520349502563477, "global_step": 256974, "epoch": 1529} {"train_loss": -11.72927188873291, "global_step": 256975, "epoch": 1529} {"train_loss": -11.759024620056152, "global_step": 256976, "epoch": 1529} {"train_loss": -11.68882942199707, "global_step": 256977, "epoch": 1529} {"train_loss": -11.916329383850098, "global_step": 256978, "epoch": 1529} {"train_loss": -11.745055198669434, "global_step": 256979, "epoch": 1529} {"train_loss": -11.69578742980957, "global_step": 256980, "epoch": 1529} {"train_loss": -11.930410385131836, "global_step": 256981, "epoch": 1529} {"train_loss": -11.677441596984863, "global_step": 256982, "epoch": 1529} {"train_loss": -11.853171348571777, "global_step": 256983, "epoch": 1529} {"train_loss": -11.69339656829834, "global_step": 256984, "epoch": 1529} {"train_loss": -11.849228858947754, "global_step": 256985, "epoch": 1529} {"train_loss": -11.968713760375977, "global_step": 256986, "epoch": 1529} {"train_loss": -11.58421802520752, "global_step": 256987, "epoch": 1529} {"train_loss": -11.949899673461914, "global_step": 256988, "epoch": 1529} {"train_loss": -11.809173583984375, "global_step": 256989, "epoch": 1529} {"train_loss": -11.991043090820312, "global_step": 256990, "epoch": 1529} {"train_loss": -12.018707275390625, "global_step": 256991, "epoch": 1529} {"train_loss": -11.837441444396973, "global_step": 256992, "epoch": 1529} {"train_loss": -11.992794036865234, "global_step": 256993, "epoch": 1529} {"train_loss": -11.739789962768555, "global_step": 256994, "epoch": 1529} {"train_loss": -11.876267433166504, "global_step": 256995, "epoch": 1529} {"train_loss": -11.980884552001953, "global_step": 256996, "epoch": 1529} {"train_loss": -11.832679748535156, "global_step": 256997, "epoch": 1529} {"train_loss": -11.803953170776367, "global_step": 256998, "epoch": 1529} {"train_loss": -12.031624794006348, "global_step": 256999, "epoch": 1529} {"train_loss": -11.731742858886719, "global_step": 257000, "epoch": 1529} {"train_loss": -11.829050064086914, "global_step": 257001, "epoch": 1529} {"train_loss": -11.743266105651855, "global_step": 257002, "epoch": 1529} {"train_loss": -11.787347793579102, "global_step": 257003, "epoch": 1529} {"train_loss": -11.993620872497559, "global_step": 257004, "epoch": 1529} {"train_loss": -11.63634204864502, "global_step": 257005, "epoch": 1529} {"train_loss": -11.796429634094238, "global_step": 257006, "epoch": 1529} {"train_loss": -11.65540599822998, "global_step": 257007, "epoch": 1529} {"train_loss": -11.674667358398438, "global_step": 257008, "epoch": 1529} {"train_loss": -11.36136245727539, "global_step": 257009, "epoch": 1529} {"train_loss": -11.609659194946289, "global_step": 257010, "epoch": 1529} {"train_loss": -11.883589744567871, "global_step": 257011, "epoch": 1529} {"train_loss": -11.400405883789062, "global_step": 257012, "epoch": 1529} {"train_loss": -11.727984428405762, "global_step": 257013, "epoch": 1529} {"train_loss": -11.600210189819336, "global_step": 257014, "epoch": 1529} {"train_loss": -11.44908618927002, "global_step": 257015, "epoch": 1529} {"train_loss": -11.634812355041504, "global_step": 257016, "epoch": 1529} {"train_loss": -11.775984764099121, "global_step": 257017, "epoch": 1529} {"train_loss": -11.175483703613281, "global_step": 257018, "epoch": 1529} {"train_loss": -11.56489086151123, "global_step": 257019, "epoch": 1529} {"train_loss": -11.986658096313477, "global_step": 257020, "epoch": 1529} {"train_loss": -11.405702590942383, "global_step": 257021, "epoch": 1529} {"train_loss": -11.49271297454834, "global_step": 257022, "epoch": 1529} {"train_loss": -11.916919708251953, "global_step": 257023, "epoch": 1529} {"train_loss": -11.704269409179688, "global_step": 257024, "epoch": 1529} {"train_loss": -11.790630340576172, "global_step": 257025, "epoch": 1529} {"train_loss": -11.712591171264648, "global_step": 257026, "epoch": 1529} {"train_loss": -11.93568229675293, "global_step": 257027, "epoch": 1529} {"train_loss": -12.101743698120117, "global_step": 257028, "epoch": 1529} {"train_loss": -11.76044750213623, "global_step": 257029, "epoch": 1529} {"train_loss": -12.044004440307617, "global_step": 257030, "epoch": 1529} {"train_loss": -11.540714263916016, "global_step": 257031, "epoch": 1529} {"train_loss": -12.062932968139648, "global_step": 257032, "epoch": 1529} {"train_loss": -11.599699020385742, "global_step": 257033, "epoch": 1529} {"train_loss": -12.050830841064453, "global_step": 257034, "epoch": 1529} {"train_loss": -12.074090957641602, "global_step": 257035, "epoch": 1529} {"train_loss": -12.046491622924805, "global_step": 257036, "epoch": 1529} {"train_loss": -11.969951629638672, "global_step": 257037, "epoch": 1529} {"train_loss": -12.01016902923584, "global_step": 257038, "epoch": 1529} {"train_loss": -11.658890656062535, "global_step": 257039, "epoch": 1529, "val_loss": 269557.8125} {"train_loss": -11.768425941467285, "global_step": 257040, "epoch": 1530} {"train_loss": -11.89637565612793, "global_step": 257041, "epoch": 1530} {"train_loss": -11.834667205810547, "global_step": 257042, "epoch": 1530} {"train_loss": -11.94041633605957, "global_step": 257043, "epoch": 1530} {"train_loss": -11.977977752685547, "global_step": 257044, "epoch": 1530} {"train_loss": -11.599515914916992, "global_step": 257045, "epoch": 1530} {"train_loss": -11.734724998474121, "global_step": 257046, "epoch": 1530} {"train_loss": -11.745306015014648, "global_step": 257047, "epoch": 1530} {"train_loss": -11.504849433898926, "global_step": 257048, "epoch": 1530} {"train_loss": -11.69740104675293, "global_step": 257049, "epoch": 1530} {"train_loss": -11.546894073486328, "global_step": 257050, "epoch": 1530} {"train_loss": -11.908130645751953, "global_step": 257051, "epoch": 1530} {"train_loss": -11.697555541992188, "global_step": 257052, "epoch": 1530} {"train_loss": -11.793206214904785, "global_step": 257053, "epoch": 1530} {"train_loss": -10.518173217773438, "global_step": 257054, "epoch": 1530} {"train_loss": -11.540863990783691, "global_step": 257055, "epoch": 1530} {"train_loss": -10.847309112548828, "global_step": 257056, "epoch": 1530} {"train_loss": -11.510117530822754, "global_step": 257057, "epoch": 1530} {"train_loss": -11.38823413848877, "global_step": 257058, "epoch": 1530} {"train_loss": -11.048096656799316, "global_step": 257059, "epoch": 1530} {"train_loss": -11.568503379821777, "global_step": 257060, "epoch": 1530} {"train_loss": -10.543256759643555, "global_step": 257061, "epoch": 1530} {"train_loss": -11.286005973815918, "global_step": 257062, "epoch": 1530} {"train_loss": -11.182900428771973, "global_step": 257063, "epoch": 1530} {"train_loss": -9.848308563232422, "global_step": 257064, "epoch": 1530} {"train_loss": -11.424266815185547, "global_step": 257065, "epoch": 1530} {"train_loss": -10.549938201904297, "global_step": 257066, "epoch": 1530} {"train_loss": -10.227445602416992, "global_step": 257067, "epoch": 1530} {"train_loss": -10.852706909179688, "global_step": 257068, "epoch": 1530} {"train_loss": -10.976249694824219, "global_step": 257069, "epoch": 1530} {"train_loss": -10.890363693237305, "global_step": 257070, "epoch": 1530} {"train_loss": -10.658677101135254, "global_step": 257071, "epoch": 1530} {"train_loss": -10.760601997375488, "global_step": 257072, "epoch": 1530} {"train_loss": -10.755224227905273, "global_step": 257073, "epoch": 1530} {"train_loss": -10.919224739074707, "global_step": 257074, "epoch": 1530} {"train_loss": -10.290735244750977, "global_step": 257075, "epoch": 1530} {"train_loss": -11.215258598327637, "global_step": 257076, "epoch": 1530} {"train_loss": -10.952413558959961, "global_step": 257077, "epoch": 1530} {"train_loss": -11.668481826782227, "global_step": 257078, "epoch": 1530} {"train_loss": -11.046792984008789, "global_step": 257079, "epoch": 1530} {"train_loss": -11.57675552368164, "global_step": 257080, "epoch": 1530} {"train_loss": -10.934366226196289, "global_step": 257081, "epoch": 1530} {"train_loss": -11.631535530090332, "global_step": 257082, "epoch": 1530} {"train_loss": -11.152215957641602, "global_step": 257083, "epoch": 1530} {"train_loss": -11.208059310913086, "global_step": 257084, "epoch": 1530} {"train_loss": -11.318514823913574, "global_step": 257085, "epoch": 1530} {"train_loss": -11.218742370605469, "global_step": 257086, "epoch": 1530} {"train_loss": -11.392823219299316, "global_step": 257087, "epoch": 1530} {"train_loss": -11.586544036865234, "global_step": 257088, "epoch": 1530} {"train_loss": -11.274933815002441, "global_step": 257089, "epoch": 1530} {"train_loss": -11.834380149841309, "global_step": 257090, "epoch": 1530} {"train_loss": -11.529834747314453, "global_step": 257091, "epoch": 1530} {"train_loss": -11.68498420715332, "global_step": 257092, "epoch": 1530} {"train_loss": -11.618873596191406, "global_step": 257093, "epoch": 1530} {"train_loss": -11.48669147491455, "global_step": 257094, "epoch": 1530} {"train_loss": -11.486088752746582, "global_step": 257095, "epoch": 1530} {"train_loss": -11.645413398742676, "global_step": 257096, "epoch": 1530} {"train_loss": -11.6917724609375, "global_step": 257097, "epoch": 1530} {"train_loss": -11.312178611755371, "global_step": 257098, "epoch": 1530} {"train_loss": -11.712730407714844, "global_step": 257099, "epoch": 1530} {"train_loss": -11.378040313720703, "global_step": 257100, "epoch": 1530} {"train_loss": -11.484088897705078, "global_step": 257101, "epoch": 1530} {"train_loss": -11.28558349609375, "global_step": 257102, "epoch": 1530} {"train_loss": -11.415172576904297, "global_step": 257103, "epoch": 1530} {"train_loss": -11.099848747253418, "global_step": 257104, "epoch": 1530} {"train_loss": -11.579322814941406, "global_step": 257105, "epoch": 1530} {"train_loss": -10.938678741455078, "global_step": 257106, "epoch": 1530} {"train_loss": -11.9044189453125, "global_step": 257107, "epoch": 1530} {"train_loss": -11.264638900756836, "global_step": 257108, "epoch": 1530} {"train_loss": -11.881855010986328, "global_step": 257109, "epoch": 1530} {"train_loss": -11.527359962463379, "global_step": 257110, "epoch": 1530} {"train_loss": -11.834000587463379, "global_step": 257111, "epoch": 1530} {"train_loss": -11.724513053894043, "global_step": 257112, "epoch": 1530} {"train_loss": -11.931447982788086, "global_step": 257113, "epoch": 1530} {"train_loss": -11.774368286132812, "global_step": 257114, "epoch": 1530} {"train_loss": -12.018478393554688, "global_step": 257115, "epoch": 1530} {"train_loss": -11.940057754516602, "global_step": 257116, "epoch": 1530} {"train_loss": -12.141538619995117, "global_step": 257117, "epoch": 1530} {"train_loss": -12.001644134521484, "global_step": 257118, "epoch": 1530} {"train_loss": -12.17068099975586, "global_step": 257119, "epoch": 1530} {"train_loss": -11.682891845703125, "global_step": 257120, "epoch": 1530} {"train_loss": -12.095571517944336, "global_step": 257121, "epoch": 1530} {"train_loss": -11.870149612426758, "global_step": 257122, "epoch": 1530} {"train_loss": -12.127887725830078, "global_step": 257123, "epoch": 1530} {"train_loss": -11.837900161743164, "global_step": 257124, "epoch": 1530} {"train_loss": -12.067390441894531, "global_step": 257125, "epoch": 1530} {"train_loss": -11.956318855285645, "global_step": 257126, "epoch": 1530} {"train_loss": -11.995819091796875, "global_step": 257127, "epoch": 1530} {"train_loss": -12.047714233398438, "global_step": 257128, "epoch": 1530} {"train_loss": -11.713672637939453, "global_step": 257129, "epoch": 1530} {"train_loss": -11.948522567749023, "global_step": 257130, "epoch": 1530} {"train_loss": -12.036050796508789, "global_step": 257131, "epoch": 1530} {"train_loss": -11.991637229919434, "global_step": 257132, "epoch": 1530} {"train_loss": -11.931373596191406, "global_step": 257133, "epoch": 1530} {"train_loss": -11.973881721496582, "global_step": 257134, "epoch": 1530} {"train_loss": -12.177482604980469, "global_step": 257135, "epoch": 1530} {"train_loss": -12.048591613769531, "global_step": 257136, "epoch": 1530} {"train_loss": -12.280500411987305, "global_step": 257137, "epoch": 1530} {"train_loss": -12.029115676879883, "global_step": 257138, "epoch": 1530} {"train_loss": -12.20372200012207, "global_step": 257139, "epoch": 1530} {"train_loss": -12.259136199951172, "global_step": 257140, "epoch": 1530} {"train_loss": -12.282352447509766, "global_step": 257141, "epoch": 1530} {"train_loss": -11.923736572265625, "global_step": 257142, "epoch": 1530} {"train_loss": -11.99661636352539, "global_step": 257143, "epoch": 1530} {"train_loss": -12.153505325317383, "global_step": 257144, "epoch": 1530} {"train_loss": -12.093395233154297, "global_step": 257145, "epoch": 1530} {"train_loss": -12.086050033569336, "global_step": 257146, "epoch": 1530} {"train_loss": -11.964192390441895, "global_step": 257147, "epoch": 1530} {"train_loss": -12.132271766662598, "global_step": 257148, "epoch": 1530} {"train_loss": -12.149528503417969, "global_step": 257149, "epoch": 1530} {"train_loss": -12.052895545959473, "global_step": 257150, "epoch": 1530} {"train_loss": -11.943926811218262, "global_step": 257151, "epoch": 1530} {"train_loss": -12.079498291015625, "global_step": 257152, "epoch": 1530} {"train_loss": -12.158836364746094, "global_step": 257153, "epoch": 1530} {"train_loss": -12.043405532836914, "global_step": 257154, "epoch": 1530} {"train_loss": -12.182714462280273, "global_step": 257155, "epoch": 1530} {"train_loss": -11.94882583618164, "global_step": 257156, "epoch": 1530} {"train_loss": -12.301817893981934, "global_step": 257157, "epoch": 1530} {"train_loss": -12.208930969238281, "global_step": 257158, "epoch": 1530} {"train_loss": -12.432738304138184, "global_step": 257159, "epoch": 1530} {"train_loss": -12.160557746887207, "global_step": 257160, "epoch": 1530} {"train_loss": -12.00497817993164, "global_step": 257161, "epoch": 1530} {"train_loss": -12.37183952331543, "global_step": 257162, "epoch": 1530} {"train_loss": -12.118176460266113, "global_step": 257163, "epoch": 1530} {"train_loss": -12.326208114624023, "global_step": 257164, "epoch": 1530} {"train_loss": -12.075008392333984, "global_step": 257165, "epoch": 1530} {"train_loss": -11.787306785583496, "global_step": 257166, "epoch": 1530} {"train_loss": -11.680999755859375, "global_step": 257167, "epoch": 1530} {"train_loss": -11.43604850769043, "global_step": 257168, "epoch": 1530} {"train_loss": -10.77454948425293, "global_step": 257169, "epoch": 1530} {"train_loss": -10.498702049255371, "global_step": 257170, "epoch": 1530} {"train_loss": -11.892091751098633, "global_step": 257171, "epoch": 1530} {"train_loss": -11.23297119140625, "global_step": 257172, "epoch": 1530} {"train_loss": -11.335384368896484, "global_step": 257173, "epoch": 1530} {"train_loss": -10.579099655151367, "global_step": 257174, "epoch": 1530} {"train_loss": -11.291706085205078, "global_step": 257175, "epoch": 1530} {"train_loss": -11.593088150024414, "global_step": 257176, "epoch": 1530} {"train_loss": -11.569137573242188, "global_step": 257177, "epoch": 1530} {"train_loss": -11.389552116394043, "global_step": 257178, "epoch": 1530} {"train_loss": -11.52927017211914, "global_step": 257179, "epoch": 1530} {"train_loss": -11.689692497253418, "global_step": 257180, "epoch": 1530} {"train_loss": -11.260404586791992, "global_step": 257181, "epoch": 1530} {"train_loss": -11.489568710327148, "global_step": 257182, "epoch": 1530} {"train_loss": -11.723628997802734, "global_step": 257183, "epoch": 1530} {"train_loss": -11.4490966796875, "global_step": 257184, "epoch": 1530} {"train_loss": -11.620702743530273, "global_step": 257185, "epoch": 1530} {"train_loss": -11.385665893554688, "global_step": 257186, "epoch": 1530} {"train_loss": -11.768406867980957, "global_step": 257187, "epoch": 1530} {"train_loss": -11.727144241333008, "global_step": 257188, "epoch": 1530} {"train_loss": -11.359170913696289, "global_step": 257189, "epoch": 1530} {"train_loss": -11.355766296386719, "global_step": 257190, "epoch": 1530} {"train_loss": -10.09425163269043, "global_step": 257191, "epoch": 1530} {"train_loss": -11.911547660827637, "global_step": 257192, "epoch": 1530} {"train_loss": -10.068058013916016, "global_step": 257193, "epoch": 1530} {"train_loss": -10.776965141296387, "global_step": 257194, "epoch": 1530} {"train_loss": -10.260891914367676, "global_step": 257195, "epoch": 1530} {"train_loss": -11.011758804321289, "global_step": 257196, "epoch": 1530} {"train_loss": -10.819881439208984, "global_step": 257197, "epoch": 1530} {"train_loss": -11.494401931762695, "global_step": 257198, "epoch": 1530} {"train_loss": -10.231210708618164, "global_step": 257199, "epoch": 1530} {"train_loss": -10.553669929504395, "global_step": 257200, "epoch": 1530} {"train_loss": -10.69567584991455, "global_step": 257201, "epoch": 1530} {"train_loss": -10.188655853271484, "global_step": 257202, "epoch": 1530} {"train_loss": -11.359779357910156, "global_step": 257203, "epoch": 1530} {"train_loss": -11.01318073272705, "global_step": 257204, "epoch": 1530} {"train_loss": -11.678255081176758, "global_step": 257205, "epoch": 1530} {"train_loss": -11.344005584716797, "global_step": 257206, "epoch": 1530} {"train_loss": -11.531902727626619, "global_step": 257207, "epoch": 1530, "val_loss": 270908.3125, "train_action_mse_error": 3.957381248474121} {"train_loss": -11.551979064941406, "global_step": 257208, "epoch": 1531} {"train_loss": -10.399004936218262, "global_step": 257209, "epoch": 1531} {"train_loss": -11.825105667114258, "global_step": 257210, "epoch": 1531} {"train_loss": -10.673795700073242, "global_step": 257211, "epoch": 1531} {"train_loss": -11.297582626342773, "global_step": 257212, "epoch": 1531} {"train_loss": -10.108054161071777, "global_step": 257213, "epoch": 1531} {"train_loss": -10.838964462280273, "global_step": 257214, "epoch": 1531} {"train_loss": -10.599023818969727, "global_step": 257215, "epoch": 1531} {"train_loss": -10.838970184326172, "global_step": 257216, "epoch": 1531} {"train_loss": -10.963574409484863, "global_step": 257217, "epoch": 1531} {"train_loss": -11.451054573059082, "global_step": 257218, "epoch": 1531} {"train_loss": -10.940326690673828, "global_step": 257219, "epoch": 1531} {"train_loss": -11.348222732543945, "global_step": 257220, "epoch": 1531} {"train_loss": -11.589271545410156, "global_step": 257221, "epoch": 1531} {"train_loss": -11.522787094116211, "global_step": 257222, "epoch": 1531} {"train_loss": -11.795565605163574, "global_step": 257223, "epoch": 1531} {"train_loss": -11.524890899658203, "global_step": 257224, "epoch": 1531} {"train_loss": -11.223672866821289, "global_step": 257225, "epoch": 1531} {"train_loss": -11.694089889526367, "global_step": 257226, "epoch": 1531} {"train_loss": -11.818052291870117, "global_step": 257227, "epoch": 1531} {"train_loss": -11.89558219909668, "global_step": 257228, "epoch": 1531} {"train_loss": -11.869795799255371, "global_step": 257229, "epoch": 1531} {"train_loss": -11.855528831481934, "global_step": 257230, "epoch": 1531} {"train_loss": -11.696464538574219, "global_step": 257231, "epoch": 1531} {"train_loss": -11.836885452270508, "global_step": 257232, "epoch": 1531} {"train_loss": -11.785943031311035, "global_step": 257233, "epoch": 1531} {"train_loss": -11.957571983337402, "global_step": 257234, "epoch": 1531} {"train_loss": -11.630054473876953, "global_step": 257235, "epoch": 1531} {"train_loss": -11.959722518920898, "global_step": 257236, "epoch": 1531} {"train_loss": -11.810847282409668, "global_step": 257237, "epoch": 1531} {"train_loss": -11.801513671875, "global_step": 257238, "epoch": 1531} {"train_loss": -11.957059860229492, "global_step": 257239, "epoch": 1531} {"train_loss": -12.039663314819336, "global_step": 257240, "epoch": 1531} {"train_loss": -11.970590591430664, "global_step": 257241, "epoch": 1531} {"train_loss": -12.005191802978516, "global_step": 257242, "epoch": 1531} {"train_loss": -11.954034805297852, "global_step": 257243, "epoch": 1531} {"train_loss": -12.037517547607422, "global_step": 257244, "epoch": 1531} {"train_loss": -12.124858856201172, "global_step": 257245, "epoch": 1531} {"train_loss": -11.91710376739502, "global_step": 257246, "epoch": 1531} {"train_loss": -12.21202278137207, "global_step": 257247, "epoch": 1531} {"train_loss": -11.704280853271484, "global_step": 257248, "epoch": 1531} {"train_loss": -11.72420597076416, "global_step": 257249, "epoch": 1531} {"train_loss": -12.154006958007812, "global_step": 257250, "epoch": 1531} {"train_loss": -11.91629409790039, "global_step": 257251, "epoch": 1531} {"train_loss": -11.984785079956055, "global_step": 257252, "epoch": 1531} {"train_loss": -11.997153282165527, "global_step": 257253, "epoch": 1531} {"train_loss": -12.098726272583008, "global_step": 257254, "epoch": 1531} {"train_loss": -12.020101547241211, "global_step": 257255, "epoch": 1531} {"train_loss": -12.158239364624023, "global_step": 257256, "epoch": 1531} {"train_loss": -12.145404815673828, "global_step": 257257, "epoch": 1531} {"train_loss": -12.216608047485352, "global_step": 257258, "epoch": 1531} {"train_loss": -12.204177856445312, "global_step": 257259, "epoch": 1531} {"train_loss": -12.186004638671875, "global_step": 257260, "epoch": 1531} {"train_loss": -12.20493221282959, "global_step": 257261, "epoch": 1531} {"train_loss": -12.442700386047363, "global_step": 257262, "epoch": 1531} {"train_loss": -12.106035232543945, "global_step": 257263, "epoch": 1531} {"train_loss": -12.175986289978027, "global_step": 257264, "epoch": 1531} {"train_loss": -12.327634811401367, "global_step": 257265, "epoch": 1531} {"train_loss": -12.259215354919434, "global_step": 257266, "epoch": 1531} {"train_loss": -12.124560356140137, "global_step": 257267, "epoch": 1531} {"train_loss": -12.160209655761719, "global_step": 257268, "epoch": 1531} {"train_loss": -12.20325756072998, "global_step": 257269, "epoch": 1531} {"train_loss": -12.107059478759766, "global_step": 257270, "epoch": 1531} {"train_loss": -12.028130531311035, "global_step": 257271, "epoch": 1531} {"train_loss": -12.12171745300293, "global_step": 257272, "epoch": 1531} {"train_loss": -12.069828987121582, "global_step": 257273, "epoch": 1531} {"train_loss": -12.306554794311523, "global_step": 257274, "epoch": 1531} {"train_loss": -12.236942291259766, "global_step": 257275, "epoch": 1531} {"train_loss": -12.34776496887207, "global_step": 257276, "epoch": 1531} {"train_loss": -12.315214157104492, "global_step": 257277, "epoch": 1531} {"train_loss": -12.33602237701416, "global_step": 257278, "epoch": 1531} {"train_loss": -12.169941902160645, "global_step": 257279, "epoch": 1531} {"train_loss": -11.782533645629883, "global_step": 257280, "epoch": 1531} {"train_loss": -12.283275604248047, "global_step": 257281, "epoch": 1531} {"train_loss": -12.24633502960205, "global_step": 257282, "epoch": 1531} {"train_loss": -12.108530044555664, "global_step": 257283, "epoch": 1531} {"train_loss": -12.021739959716797, "global_step": 257284, "epoch": 1531} {"train_loss": -12.381650924682617, "global_step": 257285, "epoch": 1531} {"train_loss": -12.115188598632812, "global_step": 257286, "epoch": 1531} {"train_loss": -11.80992603302002, "global_step": 257287, "epoch": 1531} {"train_loss": -11.98497486114502, "global_step": 257288, "epoch": 1531} {"train_loss": -12.12289047241211, "global_step": 257289, "epoch": 1531} {"train_loss": -11.981855392456055, "global_step": 257290, "epoch": 1531} {"train_loss": -11.48965835571289, "global_step": 257291, "epoch": 1531} {"train_loss": -11.882740020751953, "global_step": 257292, "epoch": 1531} {"train_loss": -12.215848922729492, "global_step": 257293, "epoch": 1531} {"train_loss": -12.066160202026367, "global_step": 257294, "epoch": 1531} {"train_loss": -11.650774955749512, "global_step": 257295, "epoch": 1531} {"train_loss": -11.382974624633789, "global_step": 257296, "epoch": 1531} {"train_loss": -11.177244186401367, "global_step": 257297, "epoch": 1531} {"train_loss": -11.56916618347168, "global_step": 257298, "epoch": 1531} {"train_loss": -11.908073425292969, "global_step": 257299, "epoch": 1531} {"train_loss": -11.76901626586914, "global_step": 257300, "epoch": 1531} {"train_loss": -10.818282127380371, "global_step": 257301, "epoch": 1531} {"train_loss": -9.352518081665039, "global_step": 257302, "epoch": 1531} {"train_loss": -11.060005187988281, "global_step": 257303, "epoch": 1531} {"train_loss": -9.75784969329834, "global_step": 257304, "epoch": 1531} {"train_loss": -9.993556022644043, "global_step": 257305, "epoch": 1531} {"train_loss": -10.660379409790039, "global_step": 257306, "epoch": 1531} {"train_loss": -9.730266571044922, "global_step": 257307, "epoch": 1531} {"train_loss": -10.803365707397461, "global_step": 257308, "epoch": 1531} {"train_loss": -11.654745101928711, "global_step": 257309, "epoch": 1531} {"train_loss": -11.107013702392578, "global_step": 257310, "epoch": 1531} {"train_loss": -11.594928741455078, "global_step": 257311, "epoch": 1531} {"train_loss": -11.01573371887207, "global_step": 257312, "epoch": 1531} {"train_loss": -11.935529708862305, "global_step": 257313, "epoch": 1531} {"train_loss": -11.056951522827148, "global_step": 257314, "epoch": 1531} {"train_loss": -11.455408096313477, "global_step": 257315, "epoch": 1531} {"train_loss": -11.239187240600586, "global_step": 257316, "epoch": 1531} {"train_loss": -11.391613006591797, "global_step": 257317, "epoch": 1531} {"train_loss": -11.030355453491211, "global_step": 257318, "epoch": 1531} {"train_loss": -11.13619613647461, "global_step": 257319, "epoch": 1531} {"train_loss": -10.52074909210205, "global_step": 257320, "epoch": 1531} {"train_loss": -11.532710075378418, "global_step": 257321, "epoch": 1531} {"train_loss": -11.255636215209961, "global_step": 257322, "epoch": 1531} {"train_loss": -11.521600723266602, "global_step": 257323, "epoch": 1531} {"train_loss": -11.488152503967285, "global_step": 257324, "epoch": 1531} {"train_loss": -11.492183685302734, "global_step": 257325, "epoch": 1531} {"train_loss": -11.412032127380371, "global_step": 257326, "epoch": 1531} {"train_loss": -11.695359230041504, "global_step": 257327, "epoch": 1531} {"train_loss": -11.25941276550293, "global_step": 257328, "epoch": 1531} {"train_loss": -11.96376895904541, "global_step": 257329, "epoch": 1531} {"train_loss": -10.787139892578125, "global_step": 257330, "epoch": 1531} {"train_loss": -11.400646209716797, "global_step": 257331, "epoch": 1531} {"train_loss": -10.874837875366211, "global_step": 257332, "epoch": 1531} {"train_loss": -11.04741096496582, "global_step": 257333, "epoch": 1531} {"train_loss": -11.66308307647705, "global_step": 257334, "epoch": 1531} {"train_loss": -11.220483779907227, "global_step": 257335, "epoch": 1531} {"train_loss": -11.048592567443848, "global_step": 257336, "epoch": 1531} {"train_loss": -11.228368759155273, "global_step": 257337, "epoch": 1531} {"train_loss": -11.376291275024414, "global_step": 257338, "epoch": 1531} {"train_loss": -11.568218231201172, "global_step": 257339, "epoch": 1531} {"train_loss": -10.930214881896973, "global_step": 257340, "epoch": 1531} {"train_loss": -11.402880668640137, "global_step": 257341, "epoch": 1531} {"train_loss": -10.254749298095703, "global_step": 257342, "epoch": 1531} {"train_loss": -11.752979278564453, "global_step": 257343, "epoch": 1531} {"train_loss": -10.820047378540039, "global_step": 257344, "epoch": 1531} {"train_loss": -11.319128036499023, "global_step": 257345, "epoch": 1531} {"train_loss": -11.233977317810059, "global_step": 257346, "epoch": 1531} {"train_loss": -10.750699043273926, "global_step": 257347, "epoch": 1531} {"train_loss": -11.449713706970215, "global_step": 257348, "epoch": 1531} {"train_loss": -10.923775672912598, "global_step": 257349, "epoch": 1531} {"train_loss": -11.368461608886719, "global_step": 257350, "epoch": 1531} {"train_loss": -10.748409271240234, "global_step": 257351, "epoch": 1531} {"train_loss": -11.37785530090332, "global_step": 257352, "epoch": 1531} {"train_loss": -10.789726257324219, "global_step": 257353, "epoch": 1531} {"train_loss": -11.11319351196289, "global_step": 257354, "epoch": 1531} {"train_loss": -11.25251579284668, "global_step": 257355, "epoch": 1531} {"train_loss": -11.440723419189453, "global_step": 257356, "epoch": 1531} {"train_loss": -10.665312767028809, "global_step": 257357, "epoch": 1531} {"train_loss": -11.641280174255371, "global_step": 257358, "epoch": 1531} {"train_loss": -10.979053497314453, "global_step": 257359, "epoch": 1531} {"train_loss": -11.852238655090332, "global_step": 257360, "epoch": 1531} {"train_loss": -10.976524353027344, "global_step": 257361, "epoch": 1531} {"train_loss": -11.592982292175293, "global_step": 257362, "epoch": 1531} {"train_loss": -11.657238960266113, "global_step": 257363, "epoch": 1531} {"train_loss": -11.495622634887695, "global_step": 257364, "epoch": 1531} {"train_loss": -11.621758460998535, "global_step": 257365, "epoch": 1531} {"train_loss": -11.386226654052734, "global_step": 257366, "epoch": 1531} {"train_loss": -11.476499557495117, "global_step": 257367, "epoch": 1531} {"train_loss": -11.460905075073242, "global_step": 257368, "epoch": 1531} {"train_loss": -11.28097152709961, "global_step": 257369, "epoch": 1531} {"train_loss": -11.66360855102539, "global_step": 257370, "epoch": 1531} {"train_loss": -11.219758987426758, "global_step": 257371, "epoch": 1531} {"train_loss": -11.599339485168457, "global_step": 257372, "epoch": 1531} {"train_loss": -11.165473937988281, "global_step": 257373, "epoch": 1531} {"train_loss": -11.428681373596191, "global_step": 257374, "epoch": 1531} {"train_loss": -11.546033933049156, "global_step": 257375, "epoch": 1531, "val_loss": 275065.5625} {"train_loss": -10.982162475585938, "global_step": 257376, "epoch": 1532} {"train_loss": -11.364194869995117, "global_step": 257377, "epoch": 1532} {"train_loss": -11.20016098022461, "global_step": 257378, "epoch": 1532} {"train_loss": -11.19854736328125, "global_step": 257379, "epoch": 1532} {"train_loss": -11.342287063598633, "global_step": 257380, "epoch": 1532} {"train_loss": -11.466840744018555, "global_step": 257381, "epoch": 1532} {"train_loss": -11.449075698852539, "global_step": 257382, "epoch": 1532} {"train_loss": -11.819766998291016, "global_step": 257383, "epoch": 1532} {"train_loss": -11.20510482788086, "global_step": 257384, "epoch": 1532} {"train_loss": -11.751596450805664, "global_step": 257385, "epoch": 1532} {"train_loss": -11.484373092651367, "global_step": 257386, "epoch": 1532} {"train_loss": -11.536511421203613, "global_step": 257387, "epoch": 1532} {"train_loss": -11.635488510131836, "global_step": 257388, "epoch": 1532} {"train_loss": -11.634177207946777, "global_step": 257389, "epoch": 1532} {"train_loss": -11.80334758758545, "global_step": 257390, "epoch": 1532} {"train_loss": -11.717933654785156, "global_step": 257391, "epoch": 1532} {"train_loss": -11.879528045654297, "global_step": 257392, "epoch": 1532} {"train_loss": -11.65610408782959, "global_step": 257393, "epoch": 1532} {"train_loss": -11.79640007019043, "global_step": 257394, "epoch": 1532} {"train_loss": -11.775568008422852, "global_step": 257395, "epoch": 1532} {"train_loss": -11.753641128540039, "global_step": 257396, "epoch": 1532} {"train_loss": -11.789310455322266, "global_step": 257397, "epoch": 1532} {"train_loss": -11.768803596496582, "global_step": 257398, "epoch": 1532} {"train_loss": -11.528642654418945, "global_step": 257399, "epoch": 1532} {"train_loss": -11.836372375488281, "global_step": 257400, "epoch": 1532} {"train_loss": -11.277076721191406, "global_step": 257401, "epoch": 1532} {"train_loss": -11.714641571044922, "global_step": 257402, "epoch": 1532} {"train_loss": -11.744110107421875, "global_step": 257403, "epoch": 1532} {"train_loss": -11.463494300842285, "global_step": 257404, "epoch": 1532} {"train_loss": -11.847753524780273, "global_step": 257405, "epoch": 1532} {"train_loss": -11.2990140914917, "global_step": 257406, "epoch": 1532} {"train_loss": -11.73884105682373, "global_step": 257407, "epoch": 1532} {"train_loss": -11.59619426727295, "global_step": 257408, "epoch": 1532} {"train_loss": -11.650243759155273, "global_step": 257409, "epoch": 1532} {"train_loss": -11.755280494689941, "global_step": 257410, "epoch": 1532} {"train_loss": -11.627586364746094, "global_step": 257411, "epoch": 1532} {"train_loss": -11.711498260498047, "global_step": 257412, "epoch": 1532} {"train_loss": -11.256563186645508, "global_step": 257413, "epoch": 1532} {"train_loss": -11.872809410095215, "global_step": 257414, "epoch": 1532} {"train_loss": -11.508807182312012, "global_step": 257415, "epoch": 1532} {"train_loss": -11.488924026489258, "global_step": 257416, "epoch": 1532} {"train_loss": -11.842836380004883, "global_step": 257417, "epoch": 1532} {"train_loss": -11.27987003326416, "global_step": 257418, "epoch": 1532} {"train_loss": -11.763402938842773, "global_step": 257419, "epoch": 1532} {"train_loss": -11.01378059387207, "global_step": 257420, "epoch": 1532} {"train_loss": -11.755672454833984, "global_step": 257421, "epoch": 1532} {"train_loss": -11.403675079345703, "global_step": 257422, "epoch": 1532} {"train_loss": -11.32122802734375, "global_step": 257423, "epoch": 1532} {"train_loss": -11.840487480163574, "global_step": 257424, "epoch": 1532} {"train_loss": -11.0943603515625, "global_step": 257425, "epoch": 1532} {"train_loss": -11.489359855651855, "global_step": 257426, "epoch": 1532} {"train_loss": -11.865290641784668, "global_step": 257427, "epoch": 1532} {"train_loss": -11.849300384521484, "global_step": 257428, "epoch": 1532} {"train_loss": -11.798540115356445, "global_step": 257429, "epoch": 1532} {"train_loss": -12.11640739440918, "global_step": 257430, "epoch": 1532} {"train_loss": -11.520465850830078, "global_step": 257431, "epoch": 1532} {"train_loss": -11.773863792419434, "global_step": 257432, "epoch": 1532} {"train_loss": -11.833014488220215, "global_step": 257433, "epoch": 1532} {"train_loss": -12.081705093383789, "global_step": 257434, "epoch": 1532} {"train_loss": -12.016295433044434, "global_step": 257435, "epoch": 1532} {"train_loss": -11.922513961791992, "global_step": 257436, "epoch": 1532} {"train_loss": -11.806873321533203, "global_step": 257437, "epoch": 1532} {"train_loss": -11.966285705566406, "global_step": 257438, "epoch": 1532} {"train_loss": -12.127786636352539, "global_step": 257439, "epoch": 1532} {"train_loss": -11.91640567779541, "global_step": 257440, "epoch": 1532} {"train_loss": -11.941703796386719, "global_step": 257441, "epoch": 1532} {"train_loss": -11.890030860900879, "global_step": 257442, "epoch": 1532} {"train_loss": -11.921684265136719, "global_step": 257443, "epoch": 1532} {"train_loss": -12.098823547363281, "global_step": 257444, "epoch": 1532} {"train_loss": -12.048604965209961, "global_step": 257445, "epoch": 1532} {"train_loss": -11.670550346374512, "global_step": 257446, "epoch": 1532} {"train_loss": -12.151912689208984, "global_step": 257447, "epoch": 1532} {"train_loss": -11.861421585083008, "global_step": 257448, "epoch": 1532} {"train_loss": -12.081981658935547, "global_step": 257449, "epoch": 1532} {"train_loss": -11.854585647583008, "global_step": 257450, "epoch": 1532} {"train_loss": -11.839773178100586, "global_step": 257451, "epoch": 1532} {"train_loss": -11.607134819030762, "global_step": 257452, "epoch": 1532} {"train_loss": -11.165227890014648, "global_step": 257453, "epoch": 1532} {"train_loss": -11.43200397491455, "global_step": 257454, "epoch": 1532} {"train_loss": -12.047889709472656, "global_step": 257455, "epoch": 1532} {"train_loss": -10.868707656860352, "global_step": 257456, "epoch": 1532} {"train_loss": -11.308177947998047, "global_step": 257457, "epoch": 1532} {"train_loss": -11.763898849487305, "global_step": 257458, "epoch": 1532} {"train_loss": -10.633830070495605, "global_step": 257459, "epoch": 1532} {"train_loss": -11.386710166931152, "global_step": 257460, "epoch": 1532} {"train_loss": -11.788278579711914, "global_step": 257461, "epoch": 1532} {"train_loss": -10.961967468261719, "global_step": 257462, "epoch": 1532} {"train_loss": -11.972367286682129, "global_step": 257463, "epoch": 1532} {"train_loss": -10.973508834838867, "global_step": 257464, "epoch": 1532} {"train_loss": -11.71786117553711, "global_step": 257465, "epoch": 1532} {"train_loss": -11.595148086547852, "global_step": 257466, "epoch": 1532} {"train_loss": -11.67201042175293, "global_step": 257467, "epoch": 1532} {"train_loss": -11.612920761108398, "global_step": 257468, "epoch": 1532} {"train_loss": -11.596851348876953, "global_step": 257469, "epoch": 1532} {"train_loss": -11.69575023651123, "global_step": 257470, "epoch": 1532} {"train_loss": -11.754907608032227, "global_step": 257471, "epoch": 1532} {"train_loss": -11.838048934936523, "global_step": 257472, "epoch": 1532} {"train_loss": -11.399736404418945, "global_step": 257473, "epoch": 1532} {"train_loss": -11.976390838623047, "global_step": 257474, "epoch": 1532} {"train_loss": -11.409507751464844, "global_step": 257475, "epoch": 1532} {"train_loss": -11.722047805786133, "global_step": 257476, "epoch": 1532} {"train_loss": -11.650900840759277, "global_step": 257477, "epoch": 1532} {"train_loss": -11.1285982131958, "global_step": 257478, "epoch": 1532} {"train_loss": -11.948917388916016, "global_step": 257479, "epoch": 1532} {"train_loss": -11.3004789352417, "global_step": 257480, "epoch": 1532} {"train_loss": -11.638518333435059, "global_step": 257481, "epoch": 1532} {"train_loss": -11.59752082824707, "global_step": 257482, "epoch": 1532} {"train_loss": -12.05919075012207, "global_step": 257483, "epoch": 1532} {"train_loss": -11.208006858825684, "global_step": 257484, "epoch": 1532} {"train_loss": -11.953527450561523, "global_step": 257485, "epoch": 1532} {"train_loss": -11.498109817504883, "global_step": 257486, "epoch": 1532} {"train_loss": -12.005038261413574, "global_step": 257487, "epoch": 1532} {"train_loss": -11.717707633972168, "global_step": 257488, "epoch": 1532} {"train_loss": -11.905009269714355, "global_step": 257489, "epoch": 1532} {"train_loss": -11.802083015441895, "global_step": 257490, "epoch": 1532} {"train_loss": -11.632118225097656, "global_step": 257491, "epoch": 1532} {"train_loss": -11.62195873260498, "global_step": 257492, "epoch": 1532} {"train_loss": -11.47575855255127, "global_step": 257493, "epoch": 1532} {"train_loss": -11.846653938293457, "global_step": 257494, "epoch": 1532} {"train_loss": -11.564775466918945, "global_step": 257495, "epoch": 1532} {"train_loss": -11.31577205657959, "global_step": 257496, "epoch": 1532} {"train_loss": -11.78386402130127, "global_step": 257497, "epoch": 1532} {"train_loss": -10.702181816101074, "global_step": 257498, "epoch": 1532} {"train_loss": -11.577342987060547, "global_step": 257499, "epoch": 1532} {"train_loss": -11.445197105407715, "global_step": 257500, "epoch": 1532} {"train_loss": -10.563689231872559, "global_step": 257501, "epoch": 1532} {"train_loss": -11.778253555297852, "global_step": 257502, "epoch": 1532} {"train_loss": -11.12237548828125, "global_step": 257503, "epoch": 1532} {"train_loss": -11.323347091674805, "global_step": 257504, "epoch": 1532} {"train_loss": -11.534138679504395, "global_step": 257505, "epoch": 1532} {"train_loss": -11.40153694152832, "global_step": 257506, "epoch": 1532} {"train_loss": -11.907079696655273, "global_step": 257507, "epoch": 1532} {"train_loss": -11.02834415435791, "global_step": 257508, "epoch": 1532} {"train_loss": -11.90092658996582, "global_step": 257509, "epoch": 1532} {"train_loss": -11.05532169342041, "global_step": 257510, "epoch": 1532} {"train_loss": -11.725214004516602, "global_step": 257511, "epoch": 1532} {"train_loss": -11.366130828857422, "global_step": 257512, "epoch": 1532} {"train_loss": -11.635986328125, "global_step": 257513, "epoch": 1532} {"train_loss": -11.790023803710938, "global_step": 257514, "epoch": 1532} {"train_loss": -11.233800888061523, "global_step": 257515, "epoch": 1532} {"train_loss": -11.863405227661133, "global_step": 257516, "epoch": 1532} {"train_loss": -11.586576461791992, "global_step": 257517, "epoch": 1532} {"train_loss": -11.983421325683594, "global_step": 257518, "epoch": 1532} {"train_loss": -11.781442642211914, "global_step": 257519, "epoch": 1532} {"train_loss": -11.4608154296875, "global_step": 257520, "epoch": 1532} {"train_loss": -11.136541366577148, "global_step": 257521, "epoch": 1532} {"train_loss": -11.854138374328613, "global_step": 257522, "epoch": 1532} {"train_loss": -11.101784706115723, "global_step": 257523, "epoch": 1532} {"train_loss": -11.838655471801758, "global_step": 257524, "epoch": 1532} {"train_loss": -11.062954902648926, "global_step": 257525, "epoch": 1532} {"train_loss": -11.584271430969238, "global_step": 257526, "epoch": 1532} {"train_loss": -11.319165229797363, "global_step": 257527, "epoch": 1532} {"train_loss": -11.757999420166016, "global_step": 257528, "epoch": 1532} {"train_loss": -11.892020225524902, "global_step": 257529, "epoch": 1532} {"train_loss": -11.775627136230469, "global_step": 257530, "epoch": 1532} {"train_loss": -11.69268798828125, "global_step": 257531, "epoch": 1532} {"train_loss": -11.853216171264648, "global_step": 257532, "epoch": 1532} {"train_loss": -11.326290130615234, "global_step": 257533, "epoch": 1532} {"train_loss": -11.324396133422852, "global_step": 257534, "epoch": 1532} {"train_loss": -11.82780647277832, "global_step": 257535, "epoch": 1532} {"train_loss": -11.492528915405273, "global_step": 257536, "epoch": 1532} {"train_loss": -11.284191131591797, "global_step": 257537, "epoch": 1532} {"train_loss": -11.347282409667969, "global_step": 257538, "epoch": 1532} {"train_loss": -11.842294692993164, "global_step": 257539, "epoch": 1532} {"train_loss": -10.708518981933594, "global_step": 257540, "epoch": 1532} {"train_loss": -11.858887672424316, "global_step": 257541, "epoch": 1532} {"train_loss": -10.5113525390625, "global_step": 257542, "epoch": 1532} {"train_loss": -11.594108053616115, "global_step": 257543, "epoch": 1532, "val_loss": 271225.84375} {"train_loss": -11.070409774780273, "global_step": 257544, "epoch": 1533} {"train_loss": -10.755138397216797, "global_step": 257545, "epoch": 1533} {"train_loss": -11.203361511230469, "global_step": 257546, "epoch": 1533} {"train_loss": -10.919139862060547, "global_step": 257547, "epoch": 1533} {"train_loss": -10.686241149902344, "global_step": 257548, "epoch": 1533} {"train_loss": -11.61066722869873, "global_step": 257549, "epoch": 1533} {"train_loss": -10.652687072753906, "global_step": 257550, "epoch": 1533} {"train_loss": -11.091500282287598, "global_step": 257551, "epoch": 1533} {"train_loss": -11.432943344116211, "global_step": 257552, "epoch": 1533} {"train_loss": -10.543176651000977, "global_step": 257553, "epoch": 1533} {"train_loss": -11.465667724609375, "global_step": 257554, "epoch": 1533} {"train_loss": -10.761579513549805, "global_step": 257555, "epoch": 1533} {"train_loss": -11.359247207641602, "global_step": 257556, "epoch": 1533} {"train_loss": -11.186726570129395, "global_step": 257557, "epoch": 1533} {"train_loss": -11.231718063354492, "global_step": 257558, "epoch": 1533} {"train_loss": -11.368282318115234, "global_step": 257559, "epoch": 1533} {"train_loss": -11.592428207397461, "global_step": 257560, "epoch": 1533} {"train_loss": -11.134063720703125, "global_step": 257561, "epoch": 1533} {"train_loss": -11.801555633544922, "global_step": 257562, "epoch": 1533} {"train_loss": -11.484621047973633, "global_step": 257563, "epoch": 1533} {"train_loss": -11.389580726623535, "global_step": 257564, "epoch": 1533} {"train_loss": -11.54587173461914, "global_step": 257565, "epoch": 1533} {"train_loss": -11.716754913330078, "global_step": 257566, "epoch": 1533} {"train_loss": -11.388175964355469, "global_step": 257567, "epoch": 1533} {"train_loss": -11.829484939575195, "global_step": 257568, "epoch": 1533} {"train_loss": -11.730365753173828, "global_step": 257569, "epoch": 1533} {"train_loss": -11.532699584960938, "global_step": 257570, "epoch": 1533} {"train_loss": -11.70975112915039, "global_step": 257571, "epoch": 1533} {"train_loss": -11.619024276733398, "global_step": 257572, "epoch": 1533} {"train_loss": -11.677591323852539, "global_step": 257573, "epoch": 1533} {"train_loss": -11.891040802001953, "global_step": 257574, "epoch": 1533} {"train_loss": -11.940983772277832, "global_step": 257575, "epoch": 1533} {"train_loss": -11.824027061462402, "global_step": 257576, "epoch": 1533} {"train_loss": -12.01948356628418, "global_step": 257577, "epoch": 1533} {"train_loss": -11.5084810256958, "global_step": 257578, "epoch": 1533} {"train_loss": -11.937124252319336, "global_step": 257579, "epoch": 1533} {"train_loss": -11.773330688476562, "global_step": 257580, "epoch": 1533} {"train_loss": -11.748271942138672, "global_step": 257581, "epoch": 1533} {"train_loss": -11.740228652954102, "global_step": 257582, "epoch": 1533} {"train_loss": -11.657499313354492, "global_step": 257583, "epoch": 1533} {"train_loss": -11.73654556274414, "global_step": 257584, "epoch": 1533} {"train_loss": -11.396600723266602, "global_step": 257585, "epoch": 1533} {"train_loss": -11.998885154724121, "global_step": 257586, "epoch": 1533} {"train_loss": -11.16244125366211, "global_step": 257587, "epoch": 1533} {"train_loss": -11.128209114074707, "global_step": 257588, "epoch": 1533} {"train_loss": -11.657699584960938, "global_step": 257589, "epoch": 1533} {"train_loss": -11.58487319946289, "global_step": 257590, "epoch": 1533} {"train_loss": -11.914073944091797, "global_step": 257591, "epoch": 1533} {"train_loss": -11.95495891571045, "global_step": 257592, "epoch": 1533} {"train_loss": -11.760992050170898, "global_step": 257593, "epoch": 1533} {"train_loss": -12.1375732421875, "global_step": 257594, "epoch": 1533} {"train_loss": -11.68642520904541, "global_step": 257595, "epoch": 1533} {"train_loss": -12.047304153442383, "global_step": 257596, "epoch": 1533} {"train_loss": -11.9782133102417, "global_step": 257597, "epoch": 1533} {"train_loss": -11.972155570983887, "global_step": 257598, "epoch": 1533} {"train_loss": -12.011995315551758, "global_step": 257599, "epoch": 1533} {"train_loss": -11.889938354492188, "global_step": 257600, "epoch": 1533} {"train_loss": -11.950843811035156, "global_step": 257601, "epoch": 1533} {"train_loss": -12.097286224365234, "global_step": 257602, "epoch": 1533} {"train_loss": -11.821615219116211, "global_step": 257603, "epoch": 1533} {"train_loss": -11.915654182434082, "global_step": 257604, "epoch": 1533} {"train_loss": -11.805276870727539, "global_step": 257605, "epoch": 1533} {"train_loss": -11.889373779296875, "global_step": 257606, "epoch": 1533} {"train_loss": -11.759380340576172, "global_step": 257607, "epoch": 1533} {"train_loss": -11.952886581420898, "global_step": 257608, "epoch": 1533} {"train_loss": -11.80311107635498, "global_step": 257609, "epoch": 1533} {"train_loss": -11.95290756225586, "global_step": 257610, "epoch": 1533} {"train_loss": -11.859468460083008, "global_step": 257611, "epoch": 1533} {"train_loss": -11.929109573364258, "global_step": 257612, "epoch": 1533} {"train_loss": -12.036372184753418, "global_step": 257613, "epoch": 1533} {"train_loss": -11.893386840820312, "global_step": 257614, "epoch": 1533} {"train_loss": -12.009510040283203, "global_step": 257615, "epoch": 1533} {"train_loss": -12.110492706298828, "global_step": 257616, "epoch": 1533} {"train_loss": -12.14393424987793, "global_step": 257617, "epoch": 1533} {"train_loss": -12.05355453491211, "global_step": 257618, "epoch": 1533} {"train_loss": -12.072540283203125, "global_step": 257619, "epoch": 1533} {"train_loss": -12.136090278625488, "global_step": 257620, "epoch": 1533} {"train_loss": -12.080265998840332, "global_step": 257621, "epoch": 1533} {"train_loss": -12.150772094726562, "global_step": 257622, "epoch": 1533} {"train_loss": -11.991575241088867, "global_step": 257623, "epoch": 1533} {"train_loss": -12.051895141601562, "global_step": 257624, "epoch": 1533} {"train_loss": -12.091899871826172, "global_step": 257625, "epoch": 1533} {"train_loss": -12.164079666137695, "global_step": 257626, "epoch": 1533} {"train_loss": -12.269160270690918, "global_step": 257627, "epoch": 1533} {"train_loss": -12.17733383178711, "global_step": 257628, "epoch": 1533} {"train_loss": -12.2808256149292, "global_step": 257629, "epoch": 1533} {"train_loss": -12.054323196411133, "global_step": 257630, "epoch": 1533} {"train_loss": -12.209177017211914, "global_step": 257631, "epoch": 1533} {"train_loss": -12.215285301208496, "global_step": 257632, "epoch": 1533} {"train_loss": -12.069902420043945, "global_step": 257633, "epoch": 1533} {"train_loss": -12.423458099365234, "global_step": 257634, "epoch": 1533} {"train_loss": -12.25374698638916, "global_step": 257635, "epoch": 1533} {"train_loss": -12.054239273071289, "global_step": 257636, "epoch": 1533} {"train_loss": -12.090873718261719, "global_step": 257637, "epoch": 1533} {"train_loss": -12.236419677734375, "global_step": 257638, "epoch": 1533} {"train_loss": -11.690616607666016, "global_step": 257639, "epoch": 1533} {"train_loss": -10.862526893615723, "global_step": 257640, "epoch": 1533} {"train_loss": -10.904901504516602, "global_step": 257641, "epoch": 1533} {"train_loss": -12.029919624328613, "global_step": 257642, "epoch": 1533} {"train_loss": -11.797417640686035, "global_step": 257643, "epoch": 1533} {"train_loss": -11.256217002868652, "global_step": 257644, "epoch": 1533} {"train_loss": -11.713163375854492, "global_step": 257645, "epoch": 1533} {"train_loss": -11.849227905273438, "global_step": 257646, "epoch": 1533} {"train_loss": -11.915771484375, "global_step": 257647, "epoch": 1533} {"train_loss": -11.799630165100098, "global_step": 257648, "epoch": 1533} {"train_loss": -12.134976387023926, "global_step": 257649, "epoch": 1533} {"train_loss": -11.804004669189453, "global_step": 257650, "epoch": 1533} {"train_loss": -11.94360637664795, "global_step": 257651, "epoch": 1533} {"train_loss": -11.809541702270508, "global_step": 257652, "epoch": 1533} {"train_loss": -12.1973876953125, "global_step": 257653, "epoch": 1533} {"train_loss": -12.016058921813965, "global_step": 257654, "epoch": 1533} {"train_loss": -12.111817359924316, "global_step": 257655, "epoch": 1533} {"train_loss": -12.197668075561523, "global_step": 257656, "epoch": 1533} {"train_loss": -12.04411506652832, "global_step": 257657, "epoch": 1533} {"train_loss": -12.315103530883789, "global_step": 257658, "epoch": 1533} {"train_loss": -11.898799896240234, "global_step": 257659, "epoch": 1533} {"train_loss": -11.823094367980957, "global_step": 257660, "epoch": 1533} {"train_loss": -12.156953811645508, "global_step": 257661, "epoch": 1533} {"train_loss": -12.098492622375488, "global_step": 257662, "epoch": 1533} {"train_loss": -12.223153114318848, "global_step": 257663, "epoch": 1533} {"train_loss": -12.115928649902344, "global_step": 257664, "epoch": 1533} {"train_loss": -12.108640670776367, "global_step": 257665, "epoch": 1533} {"train_loss": -12.216033935546875, "global_step": 257666, "epoch": 1533} {"train_loss": -12.208243370056152, "global_step": 257667, "epoch": 1533} {"train_loss": -12.229047775268555, "global_step": 257668, "epoch": 1533} {"train_loss": -11.996359825134277, "global_step": 257669, "epoch": 1533} {"train_loss": -12.178609848022461, "global_step": 257670, "epoch": 1533} {"train_loss": -12.268722534179688, "global_step": 257671, "epoch": 1533} {"train_loss": -11.996309280395508, "global_step": 257672, "epoch": 1533} {"train_loss": -12.018545150756836, "global_step": 257673, "epoch": 1533} {"train_loss": -12.029836654663086, "global_step": 257674, "epoch": 1533} {"train_loss": -12.03097152709961, "global_step": 257675, "epoch": 1533} {"train_loss": -11.603605270385742, "global_step": 257676, "epoch": 1533} {"train_loss": -11.79018783569336, "global_step": 257677, "epoch": 1533} {"train_loss": -11.641772270202637, "global_step": 257678, "epoch": 1533} {"train_loss": -11.149988174438477, "global_step": 257679, "epoch": 1533} {"train_loss": -10.532516479492188, "global_step": 257680, "epoch": 1533} {"train_loss": -10.72181510925293, "global_step": 257681, "epoch": 1533} {"train_loss": -12.023235321044922, "global_step": 257682, "epoch": 1533} {"train_loss": -11.74577808380127, "global_step": 257683, "epoch": 1533} {"train_loss": -11.691442489624023, "global_step": 257684, "epoch": 1533} {"train_loss": -12.023224830627441, "global_step": 257685, "epoch": 1533} {"train_loss": -11.99511432647705, "global_step": 257686, "epoch": 1533} {"train_loss": -12.053309440612793, "global_step": 257687, "epoch": 1533} {"train_loss": -11.842698097229004, "global_step": 257688, "epoch": 1533} {"train_loss": -11.860107421875, "global_step": 257689, "epoch": 1533} {"train_loss": -11.819853782653809, "global_step": 257690, "epoch": 1533} {"train_loss": -11.1400785446167, "global_step": 257691, "epoch": 1533} {"train_loss": -11.76594352722168, "global_step": 257692, "epoch": 1533} {"train_loss": -11.946640014648438, "global_step": 257693, "epoch": 1533} {"train_loss": -11.421566009521484, "global_step": 257694, "epoch": 1533} {"train_loss": -11.265556335449219, "global_step": 257695, "epoch": 1533} {"train_loss": -11.841238021850586, "global_step": 257696, "epoch": 1533} {"train_loss": -12.020088195800781, "global_step": 257697, "epoch": 1533} {"train_loss": -11.53732681274414, "global_step": 257698, "epoch": 1533} {"train_loss": -10.133148193359375, "global_step": 257699, "epoch": 1533} {"train_loss": -11.350120544433594, "global_step": 257700, "epoch": 1533} {"train_loss": -11.566644668579102, "global_step": 257701, "epoch": 1533} {"train_loss": -10.307052612304688, "global_step": 257702, "epoch": 1533} {"train_loss": -11.341547966003418, "global_step": 257703, "epoch": 1533} {"train_loss": -10.851823806762695, "global_step": 257704, "epoch": 1533} {"train_loss": -10.22608757019043, "global_step": 257705, "epoch": 1533} {"train_loss": -11.34390640258789, "global_step": 257706, "epoch": 1533} {"train_loss": -9.922819137573242, "global_step": 257707, "epoch": 1533} {"train_loss": -11.902776718139648, "global_step": 257708, "epoch": 1533} {"train_loss": -10.943216323852539, "global_step": 257709, "epoch": 1533} {"train_loss": -11.421463012695312, "global_step": 257710, "epoch": 1533} {"train_loss": -11.712105841863723, "global_step": 257711, "epoch": 1533, "val_loss": 270346.09375} {"train_loss": -10.908061981201172, "global_step": 257712, "epoch": 1534} {"train_loss": -11.663572311401367, "global_step": 257713, "epoch": 1534} {"train_loss": -10.275035858154297, "global_step": 257714, "epoch": 1534} {"train_loss": -10.938560485839844, "global_step": 257715, "epoch": 1534} {"train_loss": -11.249008178710938, "global_step": 257716, "epoch": 1534} {"train_loss": -10.111852645874023, "global_step": 257717, "epoch": 1534} {"train_loss": -11.415345191955566, "global_step": 257718, "epoch": 1534} {"train_loss": -9.725584030151367, "global_step": 257719, "epoch": 1534} {"train_loss": -10.782261848449707, "global_step": 257720, "epoch": 1534} {"train_loss": -10.195520401000977, "global_step": 257721, "epoch": 1534} {"train_loss": -10.058030128479004, "global_step": 257722, "epoch": 1534} {"train_loss": -11.230364799499512, "global_step": 257723, "epoch": 1534} {"train_loss": -9.865421295166016, "global_step": 257724, "epoch": 1534} {"train_loss": -11.635496139526367, "global_step": 257725, "epoch": 1534} {"train_loss": -10.389886856079102, "global_step": 257726, "epoch": 1534} {"train_loss": -11.302400588989258, "global_step": 257727, "epoch": 1534} {"train_loss": -10.432225227355957, "global_step": 257728, "epoch": 1534} {"train_loss": -11.194783210754395, "global_step": 257729, "epoch": 1534} {"train_loss": -10.865726470947266, "global_step": 257730, "epoch": 1534} {"train_loss": -10.833763122558594, "global_step": 257731, "epoch": 1534} {"train_loss": -10.579655647277832, "global_step": 257732, "epoch": 1534} {"train_loss": -10.938700675964355, "global_step": 257733, "epoch": 1534} {"train_loss": -10.275718688964844, "global_step": 257734, "epoch": 1534} {"train_loss": -10.638310432434082, "global_step": 257735, "epoch": 1534} {"train_loss": -10.767274856567383, "global_step": 257736, "epoch": 1534} {"train_loss": -11.223624229431152, "global_step": 257737, "epoch": 1534} {"train_loss": -10.322395324707031, "global_step": 257738, "epoch": 1534} {"train_loss": -11.348827362060547, "global_step": 257739, "epoch": 1534} {"train_loss": -10.802268981933594, "global_step": 257740, "epoch": 1534} {"train_loss": -11.153435707092285, "global_step": 257741, "epoch": 1534} {"train_loss": -10.426573753356934, "global_step": 257742, "epoch": 1534} {"train_loss": -11.496709823608398, "global_step": 257743, "epoch": 1534} {"train_loss": -10.614082336425781, "global_step": 257744, "epoch": 1534} {"train_loss": -11.638317108154297, "global_step": 257745, "epoch": 1534} {"train_loss": -10.867103576660156, "global_step": 257746, "epoch": 1534} {"train_loss": -11.159919738769531, "global_step": 257747, "epoch": 1534} {"train_loss": -11.26452350616455, "global_step": 257748, "epoch": 1534} {"train_loss": -11.364873886108398, "global_step": 257749, "epoch": 1534} {"train_loss": -11.555656433105469, "global_step": 257750, "epoch": 1534} {"train_loss": -11.083616256713867, "global_step": 257751, "epoch": 1534} {"train_loss": -11.602355003356934, "global_step": 257752, "epoch": 1534} {"train_loss": -10.745858192443848, "global_step": 257753, "epoch": 1534} {"train_loss": -11.573601722717285, "global_step": 257754, "epoch": 1534} {"train_loss": -10.758325576782227, "global_step": 257755, "epoch": 1534} {"train_loss": -11.699588775634766, "global_step": 257756, "epoch": 1534} {"train_loss": -11.292220115661621, "global_step": 257757, "epoch": 1534} {"train_loss": -11.57158088684082, "global_step": 257758, "epoch": 1534} {"train_loss": -11.611475944519043, "global_step": 257759, "epoch": 1534} {"train_loss": -11.331033706665039, "global_step": 257760, "epoch": 1534} {"train_loss": -11.712455749511719, "global_step": 257761, "epoch": 1534} {"train_loss": -11.305765151977539, "global_step": 257762, "epoch": 1534} {"train_loss": -11.340106964111328, "global_step": 257763, "epoch": 1534} {"train_loss": -11.6117582321167, "global_step": 257764, "epoch": 1534} {"train_loss": -11.444694519042969, "global_step": 257765, "epoch": 1534} {"train_loss": -11.474620819091797, "global_step": 257766, "epoch": 1534} {"train_loss": -11.923551559448242, "global_step": 257767, "epoch": 1534} {"train_loss": -11.465642929077148, "global_step": 257768, "epoch": 1534} {"train_loss": -11.840522766113281, "global_step": 257769, "epoch": 1534} {"train_loss": -11.701916694641113, "global_step": 257770, "epoch": 1534} {"train_loss": -11.651113510131836, "global_step": 257771, "epoch": 1534} {"train_loss": -11.844671249389648, "global_step": 257772, "epoch": 1534} {"train_loss": -11.554553985595703, "global_step": 257773, "epoch": 1534} {"train_loss": -11.742319107055664, "global_step": 257774, "epoch": 1534} {"train_loss": -11.930618286132812, "global_step": 257775, "epoch": 1534} {"train_loss": -12.075872421264648, "global_step": 257776, "epoch": 1534} {"train_loss": -11.68136215209961, "global_step": 257777, "epoch": 1534} {"train_loss": -12.118358612060547, "global_step": 257778, "epoch": 1534} {"train_loss": -11.4871826171875, "global_step": 257779, "epoch": 1534} {"train_loss": -11.721807479858398, "global_step": 257780, "epoch": 1534} {"train_loss": -11.824213027954102, "global_step": 257781, "epoch": 1534} {"train_loss": -11.612061500549316, "global_step": 257782, "epoch": 1534} {"train_loss": -11.901430130004883, "global_step": 257783, "epoch": 1534} {"train_loss": -11.834695816040039, "global_step": 257784, "epoch": 1534} {"train_loss": -11.929788589477539, "global_step": 257785, "epoch": 1534} {"train_loss": -11.702347755432129, "global_step": 257786, "epoch": 1534} {"train_loss": -11.818564414978027, "global_step": 257787, "epoch": 1534} {"train_loss": -12.110629081726074, "global_step": 257788, "epoch": 1534} {"train_loss": -11.916254043579102, "global_step": 257789, "epoch": 1534} {"train_loss": -11.905680656433105, "global_step": 257790, "epoch": 1534} {"train_loss": -11.982007026672363, "global_step": 257791, "epoch": 1534} {"train_loss": -11.874946594238281, "global_step": 257792, "epoch": 1534} {"train_loss": -11.784552574157715, "global_step": 257793, "epoch": 1534} {"train_loss": -12.132270812988281, "global_step": 257794, "epoch": 1534} {"train_loss": -11.727909088134766, "global_step": 257795, "epoch": 1534} {"train_loss": -12.058422088623047, "global_step": 257796, "epoch": 1534} {"train_loss": -11.8821382522583, "global_step": 257797, "epoch": 1534} {"train_loss": -12.018404960632324, "global_step": 257798, "epoch": 1534} {"train_loss": -11.850266456604004, "global_step": 257799, "epoch": 1534} {"train_loss": -12.163716316223145, "global_step": 257800, "epoch": 1534} {"train_loss": -11.83388900756836, "global_step": 257801, "epoch": 1534} {"train_loss": -12.124753952026367, "global_step": 257802, "epoch": 1534} {"train_loss": -11.7431640625, "global_step": 257803, "epoch": 1534} {"train_loss": -12.06430435180664, "global_step": 257804, "epoch": 1534} {"train_loss": -12.32767391204834, "global_step": 257805, "epoch": 1534} {"train_loss": -12.234014511108398, "global_step": 257806, "epoch": 1534} {"train_loss": -11.999670028686523, "global_step": 257807, "epoch": 1534} {"train_loss": -11.94802474975586, "global_step": 257808, "epoch": 1534} {"train_loss": -12.233726501464844, "global_step": 257809, "epoch": 1534} {"train_loss": -11.599884033203125, "global_step": 257810, "epoch": 1534} {"train_loss": -12.26420783996582, "global_step": 257811, "epoch": 1534} {"train_loss": -11.88835620880127, "global_step": 257812, "epoch": 1534} {"train_loss": -11.63888168334961, "global_step": 257813, "epoch": 1534} {"train_loss": -12.203939437866211, "global_step": 257814, "epoch": 1534} {"train_loss": -12.102108001708984, "global_step": 257815, "epoch": 1534} {"train_loss": -11.945846557617188, "global_step": 257816, "epoch": 1534} {"train_loss": -12.066046714782715, "global_step": 257817, "epoch": 1534} {"train_loss": -12.145471572875977, "global_step": 257818, "epoch": 1534} {"train_loss": -12.16336441040039, "global_step": 257819, "epoch": 1534} {"train_loss": -12.058581352233887, "global_step": 257820, "epoch": 1534} {"train_loss": -12.121374130249023, "global_step": 257821, "epoch": 1534} {"train_loss": -11.852829933166504, "global_step": 257822, "epoch": 1534} {"train_loss": -12.078798294067383, "global_step": 257823, "epoch": 1534} {"train_loss": -11.415484428405762, "global_step": 257824, "epoch": 1534} {"train_loss": -12.015388488769531, "global_step": 257825, "epoch": 1534} {"train_loss": -12.015419006347656, "global_step": 257826, "epoch": 1534} {"train_loss": -12.252670288085938, "global_step": 257827, "epoch": 1534} {"train_loss": -11.922640800476074, "global_step": 257828, "epoch": 1534} {"train_loss": -12.14976692199707, "global_step": 257829, "epoch": 1534} {"train_loss": -11.902891159057617, "global_step": 257830, "epoch": 1534} {"train_loss": -11.741222381591797, "global_step": 257831, "epoch": 1534} {"train_loss": -12.011031150817871, "global_step": 257832, "epoch": 1534} {"train_loss": -12.111252784729004, "global_step": 257833, "epoch": 1534} {"train_loss": -11.91769027709961, "global_step": 257834, "epoch": 1534} {"train_loss": -11.944849014282227, "global_step": 257835, "epoch": 1534} {"train_loss": -10.329717636108398, "global_step": 257836, "epoch": 1534} {"train_loss": -11.187751770019531, "global_step": 257837, "epoch": 1534} {"train_loss": -11.23016357421875, "global_step": 257838, "epoch": 1534} {"train_loss": -10.43237018585205, "global_step": 257839, "epoch": 1534} {"train_loss": -9.876327514648438, "global_step": 257840, "epoch": 1534} {"train_loss": -11.916130065917969, "global_step": 257841, "epoch": 1534} {"train_loss": -11.185236930847168, "global_step": 257842, "epoch": 1534} {"train_loss": -10.45920181274414, "global_step": 257843, "epoch": 1534} {"train_loss": -12.177498817443848, "global_step": 257844, "epoch": 1534} {"train_loss": -11.047935485839844, "global_step": 257845, "epoch": 1534} {"train_loss": -11.641470909118652, "global_step": 257846, "epoch": 1534} {"train_loss": -11.127760887145996, "global_step": 257847, "epoch": 1534} {"train_loss": -11.57218074798584, "global_step": 257848, "epoch": 1534} {"train_loss": -11.289371490478516, "global_step": 257849, "epoch": 1534} {"train_loss": -11.518087387084961, "global_step": 257850, "epoch": 1534} {"train_loss": -11.301055908203125, "global_step": 257851, "epoch": 1534} {"train_loss": -11.326236724853516, "global_step": 257852, "epoch": 1534} {"train_loss": -11.373063087463379, "global_step": 257853, "epoch": 1534} {"train_loss": -11.181546211242676, "global_step": 257854, "epoch": 1534} {"train_loss": -11.22403335571289, "global_step": 257855, "epoch": 1534} {"train_loss": -9.821699142456055, "global_step": 257856, "epoch": 1534} {"train_loss": -11.195873260498047, "global_step": 257857, "epoch": 1534} {"train_loss": -10.609979629516602, "global_step": 257858, "epoch": 1534} {"train_loss": -10.758138656616211, "global_step": 257859, "epoch": 1534} {"train_loss": -11.521013259887695, "global_step": 257860, "epoch": 1534} {"train_loss": -11.058636665344238, "global_step": 257861, "epoch": 1534} {"train_loss": -11.537590980529785, "global_step": 257862, "epoch": 1534} {"train_loss": -11.413324356079102, "global_step": 257863, "epoch": 1534} {"train_loss": -11.46539306640625, "global_step": 257864, "epoch": 1534} {"train_loss": -11.763411521911621, "global_step": 257865, "epoch": 1534} {"train_loss": -11.647605895996094, "global_step": 257866, "epoch": 1534} {"train_loss": -12.06371021270752, "global_step": 257867, "epoch": 1534} {"train_loss": -11.332561492919922, "global_step": 257868, "epoch": 1534} {"train_loss": -11.922746658325195, "global_step": 257869, "epoch": 1534} {"train_loss": -11.635456085205078, "global_step": 257870, "epoch": 1534} {"train_loss": -11.830179214477539, "global_step": 257871, "epoch": 1534} {"train_loss": -11.80621337890625, "global_step": 257872, "epoch": 1534} {"train_loss": -11.720773696899414, "global_step": 257873, "epoch": 1534} {"train_loss": -11.802303314208984, "global_step": 257874, "epoch": 1534} {"train_loss": -11.804605484008789, "global_step": 257875, "epoch": 1534} {"train_loss": -11.964844703674316, "global_step": 257876, "epoch": 1534} {"train_loss": -11.909220695495605, "global_step": 257877, "epoch": 1534} {"train_loss": -12.045040130615234, "global_step": 257878, "epoch": 1534} {"train_loss": -11.480275120053973, "global_step": 257879, "epoch": 1534, "val_loss": 270224.5625} {"train_loss": -12.025428771972656, "global_step": 257880, "epoch": 1535} {"train_loss": -11.971334457397461, "global_step": 257881, "epoch": 1535} {"train_loss": -12.10184097290039, "global_step": 257882, "epoch": 1535} {"train_loss": -12.197452545166016, "global_step": 257883, "epoch": 1535} {"train_loss": -11.935626983642578, "global_step": 257884, "epoch": 1535} {"train_loss": -11.731756210327148, "global_step": 257885, "epoch": 1535} {"train_loss": -12.106335639953613, "global_step": 257886, "epoch": 1535} {"train_loss": -12.000396728515625, "global_step": 257887, "epoch": 1535} {"train_loss": -12.137784004211426, "global_step": 257888, "epoch": 1535} {"train_loss": -12.077013969421387, "global_step": 257889, "epoch": 1535} {"train_loss": -12.022628784179688, "global_step": 257890, "epoch": 1535} {"train_loss": -12.18388843536377, "global_step": 257891, "epoch": 1535} {"train_loss": -12.243033409118652, "global_step": 257892, "epoch": 1535} {"train_loss": -12.030425071716309, "global_step": 257893, "epoch": 1535} {"train_loss": -12.186189651489258, "global_step": 257894, "epoch": 1535} {"train_loss": -12.305648803710938, "global_step": 257895, "epoch": 1535} {"train_loss": -12.115262985229492, "global_step": 257896, "epoch": 1535} {"train_loss": -12.196294784545898, "global_step": 257897, "epoch": 1535} {"train_loss": -12.08415412902832, "global_step": 257898, "epoch": 1535} {"train_loss": -12.232385635375977, "global_step": 257899, "epoch": 1535} {"train_loss": -11.920365333557129, "global_step": 257900, "epoch": 1535} {"train_loss": -11.997842788696289, "global_step": 257901, "epoch": 1535} {"train_loss": -12.15766716003418, "global_step": 257902, "epoch": 1535} {"train_loss": -11.916971206665039, "global_step": 257903, "epoch": 1535} {"train_loss": -12.141817092895508, "global_step": 257904, "epoch": 1535} {"train_loss": -12.282215118408203, "global_step": 257905, "epoch": 1535} {"train_loss": -12.206941604614258, "global_step": 257906, "epoch": 1535} {"train_loss": -12.186548233032227, "global_step": 257907, "epoch": 1535} {"train_loss": -12.187725067138672, "global_step": 257908, "epoch": 1535} {"train_loss": -11.99921989440918, "global_step": 257909, "epoch": 1535} {"train_loss": -11.965953826904297, "global_step": 257910, "epoch": 1535} {"train_loss": -12.0789155960083, "global_step": 257911, "epoch": 1535} {"train_loss": -11.54582691192627, "global_step": 257912, "epoch": 1535} {"train_loss": -11.738296508789062, "global_step": 257913, "epoch": 1535} {"train_loss": -12.357649803161621, "global_step": 257914, "epoch": 1535} {"train_loss": -11.552448272705078, "global_step": 257915, "epoch": 1535} {"train_loss": -11.950878143310547, "global_step": 257916, "epoch": 1535} {"train_loss": -12.267419815063477, "global_step": 257917, "epoch": 1535} {"train_loss": -11.946267127990723, "global_step": 257918, "epoch": 1535} {"train_loss": -11.222952842712402, "global_step": 257919, "epoch": 1535} {"train_loss": -11.763729095458984, "global_step": 257920, "epoch": 1535} {"train_loss": -12.299935340881348, "global_step": 257921, "epoch": 1535} {"train_loss": -11.739067077636719, "global_step": 257922, "epoch": 1535} {"train_loss": -11.774006843566895, "global_step": 257923, "epoch": 1535} {"train_loss": -12.123514175415039, "global_step": 257924, "epoch": 1535} {"train_loss": -11.419060707092285, "global_step": 257925, "epoch": 1535} {"train_loss": -12.192544937133789, "global_step": 257926, "epoch": 1535} {"train_loss": -11.722817420959473, "global_step": 257927, "epoch": 1535} {"train_loss": -11.950833320617676, "global_step": 257928, "epoch": 1535} {"train_loss": -11.601707458496094, "global_step": 257929, "epoch": 1535} {"train_loss": -10.924939155578613, "global_step": 257930, "epoch": 1535} {"train_loss": -9.870515823364258, "global_step": 257931, "epoch": 1535} {"train_loss": -11.763664245605469, "global_step": 257932, "epoch": 1535} {"train_loss": -10.548636436462402, "global_step": 257933, "epoch": 1535} {"train_loss": -10.334867477416992, "global_step": 257934, "epoch": 1535} {"train_loss": -11.444093704223633, "global_step": 257935, "epoch": 1535} {"train_loss": -11.627249717712402, "global_step": 257936, "epoch": 1535} {"train_loss": -10.458219528198242, "global_step": 257937, "epoch": 1535} {"train_loss": -11.19567584991455, "global_step": 257938, "epoch": 1535} {"train_loss": -9.294652938842773, "global_step": 257939, "epoch": 1535} {"train_loss": -9.984640121459961, "global_step": 257940, "epoch": 1535} {"train_loss": -7.292339324951172, "global_step": 257941, "epoch": 1535} {"train_loss": -10.937921524047852, "global_step": 257942, "epoch": 1535} {"train_loss": -8.266932487487793, "global_step": 257943, "epoch": 1535} {"train_loss": -10.430569648742676, "global_step": 257944, "epoch": 1535} {"train_loss": -8.84296989440918, "global_step": 257945, "epoch": 1535} {"train_loss": -10.121044158935547, "global_step": 257946, "epoch": 1535} {"train_loss": -9.011743545532227, "global_step": 257947, "epoch": 1535} {"train_loss": -10.62437629699707, "global_step": 257948, "epoch": 1535} {"train_loss": -9.97411060333252, "global_step": 257949, "epoch": 1535} {"train_loss": -10.94239330291748, "global_step": 257950, "epoch": 1535} {"train_loss": -8.949361801147461, "global_step": 257951, "epoch": 1535} {"train_loss": -10.882389068603516, "global_step": 257952, "epoch": 1535} {"train_loss": -9.821457862854004, "global_step": 257953, "epoch": 1535} {"train_loss": -10.866958618164062, "global_step": 257954, "epoch": 1535} {"train_loss": -9.984735488891602, "global_step": 257955, "epoch": 1535} {"train_loss": -11.460823059082031, "global_step": 257956, "epoch": 1535} {"train_loss": -10.637067794799805, "global_step": 257957, "epoch": 1535} {"train_loss": -11.370140075683594, "global_step": 257958, "epoch": 1535} {"train_loss": -10.908403396606445, "global_step": 257959, "epoch": 1535} {"train_loss": -11.403167724609375, "global_step": 257960, "epoch": 1535} {"train_loss": -11.356149673461914, "global_step": 257961, "epoch": 1535} {"train_loss": -11.5324125289917, "global_step": 257962, "epoch": 1535} {"train_loss": -11.106584548950195, "global_step": 257963, "epoch": 1535} {"train_loss": -11.317938804626465, "global_step": 257964, "epoch": 1535} {"train_loss": -11.355685234069824, "global_step": 257965, "epoch": 1535} {"train_loss": -11.439567565917969, "global_step": 257966, "epoch": 1535} {"train_loss": -11.633432388305664, "global_step": 257967, "epoch": 1535} {"train_loss": -11.496517181396484, "global_step": 257968, "epoch": 1535} {"train_loss": -11.758679389953613, "global_step": 257969, "epoch": 1535} {"train_loss": -11.430157661437988, "global_step": 257970, "epoch": 1535} {"train_loss": -11.510785102844238, "global_step": 257971, "epoch": 1535} {"train_loss": -11.650084495544434, "global_step": 257972, "epoch": 1535} {"train_loss": -11.606657981872559, "global_step": 257973, "epoch": 1535} {"train_loss": -11.600723266601562, "global_step": 257974, "epoch": 1535} {"train_loss": -11.671327590942383, "global_step": 257975, "epoch": 1535} {"train_loss": -11.758644104003906, "global_step": 257976, "epoch": 1535} {"train_loss": -11.679771423339844, "global_step": 257977, "epoch": 1535} {"train_loss": -11.698859214782715, "global_step": 257978, "epoch": 1535} {"train_loss": -11.65596866607666, "global_step": 257979, "epoch": 1535} {"train_loss": -11.63530158996582, "global_step": 257980, "epoch": 1535} {"train_loss": -11.84170913696289, "global_step": 257981, "epoch": 1535} {"train_loss": -11.911296844482422, "global_step": 257982, "epoch": 1535} {"train_loss": -11.939177513122559, "global_step": 257983, "epoch": 1535} {"train_loss": -11.729082107543945, "global_step": 257984, "epoch": 1535} {"train_loss": -11.894906997680664, "global_step": 257985, "epoch": 1535} {"train_loss": -11.85761833190918, "global_step": 257986, "epoch": 1535} {"train_loss": -11.881816864013672, "global_step": 257987, "epoch": 1535} {"train_loss": -11.772989273071289, "global_step": 257988, "epoch": 1535} {"train_loss": -12.010476112365723, "global_step": 257989, "epoch": 1535} {"train_loss": -11.880420684814453, "global_step": 257990, "epoch": 1535} {"train_loss": -12.1350736618042, "global_step": 257991, "epoch": 1535} {"train_loss": -11.879308700561523, "global_step": 257992, "epoch": 1535} {"train_loss": -11.93893051147461, "global_step": 257993, "epoch": 1535} {"train_loss": -11.992183685302734, "global_step": 257994, "epoch": 1535} {"train_loss": -12.026594161987305, "global_step": 257995, "epoch": 1535} {"train_loss": -12.033297538757324, "global_step": 257996, "epoch": 1535} {"train_loss": -11.946453094482422, "global_step": 257997, "epoch": 1535} {"train_loss": -11.974014282226562, "global_step": 257998, "epoch": 1535} {"train_loss": -11.706003189086914, "global_step": 257999, "epoch": 1535} {"train_loss": -12.13532829284668, "global_step": 258000, "epoch": 1535} {"train_loss": -11.847358703613281, "global_step": 258001, "epoch": 1535} {"train_loss": -12.133696556091309, "global_step": 258002, "epoch": 1535} {"train_loss": -12.034927368164062, "global_step": 258003, "epoch": 1535} {"train_loss": -11.970871925354004, "global_step": 258004, "epoch": 1535} {"train_loss": -11.822112083435059, "global_step": 258005, "epoch": 1535} {"train_loss": -11.810168266296387, "global_step": 258006, "epoch": 1535} {"train_loss": -11.753702163696289, "global_step": 258007, "epoch": 1535} {"train_loss": -11.619386672973633, "global_step": 258008, "epoch": 1535} {"train_loss": -10.261537551879883, "global_step": 258009, "epoch": 1535} {"train_loss": -11.821837425231934, "global_step": 258010, "epoch": 1535} {"train_loss": -11.14387321472168, "global_step": 258011, "epoch": 1535} {"train_loss": -10.799661636352539, "global_step": 258012, "epoch": 1535} {"train_loss": -11.686088562011719, "global_step": 258013, "epoch": 1535} {"train_loss": -11.432271957397461, "global_step": 258014, "epoch": 1535} {"train_loss": -11.202261924743652, "global_step": 258015, "epoch": 1535} {"train_loss": -11.711551666259766, "global_step": 258016, "epoch": 1535} {"train_loss": -10.966865539550781, "global_step": 258017, "epoch": 1535} {"train_loss": -11.445499420166016, "global_step": 258018, "epoch": 1535} {"train_loss": -11.033834457397461, "global_step": 258019, "epoch": 1535} {"train_loss": -11.606302261352539, "global_step": 258020, "epoch": 1535} {"train_loss": -11.60346794128418, "global_step": 258021, "epoch": 1535} {"train_loss": -11.66596508026123, "global_step": 258022, "epoch": 1535} {"train_loss": -11.738275527954102, "global_step": 258023, "epoch": 1535} {"train_loss": -11.768117904663086, "global_step": 258024, "epoch": 1535} {"train_loss": -11.679128646850586, "global_step": 258025, "epoch": 1535} {"train_loss": -11.464303970336914, "global_step": 258026, "epoch": 1535} {"train_loss": -11.290750503540039, "global_step": 258027, "epoch": 1535} {"train_loss": -11.865100860595703, "global_step": 258028, "epoch": 1535} {"train_loss": -11.31403923034668, "global_step": 258029, "epoch": 1535} {"train_loss": -11.94705867767334, "global_step": 258030, "epoch": 1535} {"train_loss": -11.69757080078125, "global_step": 258031, "epoch": 1535} {"train_loss": -11.505552291870117, "global_step": 258032, "epoch": 1535} {"train_loss": -11.979416847229004, "global_step": 258033, "epoch": 1535} {"train_loss": -11.661548614501953, "global_step": 258034, "epoch": 1535} {"train_loss": -11.980478286743164, "global_step": 258035, "epoch": 1535} {"train_loss": -11.557538986206055, "global_step": 258036, "epoch": 1535} {"train_loss": -11.814266204833984, "global_step": 258037, "epoch": 1535} {"train_loss": -11.736954689025879, "global_step": 258038, "epoch": 1535} {"train_loss": -11.65693473815918, "global_step": 258039, "epoch": 1535} {"train_loss": -11.669551849365234, "global_step": 258040, "epoch": 1535} {"train_loss": -12.05732536315918, "global_step": 258041, "epoch": 1535} {"train_loss": -12.168159484863281, "global_step": 258042, "epoch": 1535} {"train_loss": -12.117522239685059, "global_step": 258043, "epoch": 1535} {"train_loss": -11.896832466125488, "global_step": 258044, "epoch": 1535} {"train_loss": -12.06639289855957, "global_step": 258045, "epoch": 1535} {"train_loss": -12.151668548583984, "global_step": 258046, "epoch": 1535} {"train_loss": -11.534765623864674, "global_step": 258047, "epoch": 1535, "val_loss": 261616.796875, "train_action_mse_error": 3.6302366256713867} {"train_loss": -12.022080421447754, "global_step": 258048, "epoch": 1536} {"train_loss": -11.898796081542969, "global_step": 258049, "epoch": 1536} {"train_loss": -12.158714294433594, "global_step": 258050, "epoch": 1536} {"train_loss": -11.69469928741455, "global_step": 258051, "epoch": 1536} {"train_loss": -12.130245208740234, "global_step": 258052, "epoch": 1536} {"train_loss": -11.460963249206543, "global_step": 258053, "epoch": 1536} {"train_loss": -11.886199951171875, "global_step": 258054, "epoch": 1536} {"train_loss": -11.828351020812988, "global_step": 258055, "epoch": 1536} {"train_loss": -11.989426612854004, "global_step": 258056, "epoch": 1536} {"train_loss": -11.84919548034668, "global_step": 258057, "epoch": 1536} {"train_loss": -12.019137382507324, "global_step": 258058, "epoch": 1536} {"train_loss": -11.957337379455566, "global_step": 258059, "epoch": 1536} {"train_loss": -11.927682876586914, "global_step": 258060, "epoch": 1536} {"train_loss": -11.955568313598633, "global_step": 258061, "epoch": 1536} {"train_loss": -12.042207717895508, "global_step": 258062, "epoch": 1536} {"train_loss": -12.097467422485352, "global_step": 258063, "epoch": 1536} {"train_loss": -12.013605117797852, "global_step": 258064, "epoch": 1536} {"train_loss": -12.010233879089355, "global_step": 258065, "epoch": 1536} {"train_loss": -12.22563648223877, "global_step": 258066, "epoch": 1536} {"train_loss": -11.868444442749023, "global_step": 258067, "epoch": 1536} {"train_loss": -12.197229385375977, "global_step": 258068, "epoch": 1536} {"train_loss": -11.593835830688477, "global_step": 258069, "epoch": 1536} {"train_loss": -12.044448852539062, "global_step": 258070, "epoch": 1536} {"train_loss": -12.131844520568848, "global_step": 258071, "epoch": 1536} {"train_loss": -12.018771171569824, "global_step": 258072, "epoch": 1536} {"train_loss": -12.060602188110352, "global_step": 258073, "epoch": 1536} {"train_loss": -12.114825248718262, "global_step": 258074, "epoch": 1536} {"train_loss": -11.990119934082031, "global_step": 258075, "epoch": 1536} {"train_loss": -11.820629119873047, "global_step": 258076, "epoch": 1536} {"train_loss": -11.672038078308105, "global_step": 258077, "epoch": 1536} {"train_loss": -11.355545043945312, "global_step": 258078, "epoch": 1536} {"train_loss": -11.961175918579102, "global_step": 258079, "epoch": 1536} {"train_loss": -11.677231788635254, "global_step": 258080, "epoch": 1536} {"train_loss": -10.998916625976562, "global_step": 258081, "epoch": 1536} {"train_loss": -11.43091106414795, "global_step": 258082, "epoch": 1536} {"train_loss": -10.46416187286377, "global_step": 258083, "epoch": 1536} {"train_loss": -9.601642608642578, "global_step": 258084, "epoch": 1536} {"train_loss": -9.88349723815918, "global_step": 258085, "epoch": 1536} {"train_loss": -10.09196949005127, "global_step": 258086, "epoch": 1536} {"train_loss": -10.755373001098633, "global_step": 258087, "epoch": 1536} {"train_loss": -11.535411834716797, "global_step": 258088, "epoch": 1536} {"train_loss": -9.46809196472168, "global_step": 258089, "epoch": 1536} {"train_loss": -10.862428665161133, "global_step": 258090, "epoch": 1536} {"train_loss": -9.162005424499512, "global_step": 258091, "epoch": 1536} {"train_loss": -9.595647811889648, "global_step": 258092, "epoch": 1536} {"train_loss": -8.215351104736328, "global_step": 258093, "epoch": 1536} {"train_loss": -6.837390899658203, "global_step": 258094, "epoch": 1536} {"train_loss": -7.747848033905029, "global_step": 258095, "epoch": 1536} {"train_loss": -9.624670028686523, "global_step": 258096, "epoch": 1536} {"train_loss": -9.77403736114502, "global_step": 258097, "epoch": 1536} {"train_loss": -10.29044246673584, "global_step": 258098, "epoch": 1536} {"train_loss": -9.679150581359863, "global_step": 258099, "epoch": 1536} {"train_loss": -10.858217239379883, "global_step": 258100, "epoch": 1536} {"train_loss": -9.16839599609375, "global_step": 258101, "epoch": 1536} {"train_loss": -10.440374374389648, "global_step": 258102, "epoch": 1536} {"train_loss": -10.1258544921875, "global_step": 258103, "epoch": 1536} {"train_loss": -9.95766830444336, "global_step": 258104, "epoch": 1536} {"train_loss": -11.003623962402344, "global_step": 258105, "epoch": 1536} {"train_loss": -10.99658489227295, "global_step": 258106, "epoch": 1536} {"train_loss": -10.59134292602539, "global_step": 258107, "epoch": 1536} {"train_loss": -10.36008071899414, "global_step": 258108, "epoch": 1536} {"train_loss": -10.58492374420166, "global_step": 258109, "epoch": 1536} {"train_loss": -10.445598602294922, "global_step": 258110, "epoch": 1536} {"train_loss": -11.309215545654297, "global_step": 258111, "epoch": 1536} {"train_loss": -10.84980297088623, "global_step": 258112, "epoch": 1536} {"train_loss": -10.92531681060791, "global_step": 258113, "epoch": 1536} {"train_loss": -11.199657440185547, "global_step": 258114, "epoch": 1536} {"train_loss": -10.975249290466309, "global_step": 258115, "epoch": 1536} {"train_loss": -11.188576698303223, "global_step": 258116, "epoch": 1536} {"train_loss": -11.517760276794434, "global_step": 258117, "epoch": 1536} {"train_loss": -11.192858695983887, "global_step": 258118, "epoch": 1536} {"train_loss": -11.257102012634277, "global_step": 258119, "epoch": 1536} {"train_loss": -11.47957992553711, "global_step": 258120, "epoch": 1536} {"train_loss": -11.460559844970703, "global_step": 258121, "epoch": 1536} {"train_loss": -11.505656242370605, "global_step": 258122, "epoch": 1536} {"train_loss": -11.584586143493652, "global_step": 258123, "epoch": 1536} {"train_loss": -11.60006332397461, "global_step": 258124, "epoch": 1536} {"train_loss": -11.249163627624512, "global_step": 258125, "epoch": 1536} {"train_loss": -11.809679985046387, "global_step": 258126, "epoch": 1536} {"train_loss": -11.668512344360352, "global_step": 258127, "epoch": 1536} {"train_loss": -11.629281044006348, "global_step": 258128, "epoch": 1536} {"train_loss": -11.423460006713867, "global_step": 258129, "epoch": 1536} {"train_loss": -11.403572082519531, "global_step": 258130, "epoch": 1536} {"train_loss": -11.638969421386719, "global_step": 258131, "epoch": 1536} {"train_loss": -11.708841323852539, "global_step": 258132, "epoch": 1536} {"train_loss": -11.813485145568848, "global_step": 258133, "epoch": 1536} {"train_loss": -11.715780258178711, "global_step": 258134, "epoch": 1536} {"train_loss": -11.81595230102539, "global_step": 258135, "epoch": 1536} {"train_loss": -11.688139915466309, "global_step": 258136, "epoch": 1536} {"train_loss": -11.776383399963379, "global_step": 258137, "epoch": 1536} {"train_loss": -11.476430892944336, "global_step": 258138, "epoch": 1536} {"train_loss": -11.761870384216309, "global_step": 258139, "epoch": 1536} {"train_loss": -11.691560745239258, "global_step": 258140, "epoch": 1536} {"train_loss": -11.906778335571289, "global_step": 258141, "epoch": 1536} {"train_loss": -11.711633682250977, "global_step": 258142, "epoch": 1536} {"train_loss": -11.740055084228516, "global_step": 258143, "epoch": 1536} {"train_loss": -11.792228698730469, "global_step": 258144, "epoch": 1536} {"train_loss": -11.891862869262695, "global_step": 258145, "epoch": 1536} {"train_loss": -11.667201042175293, "global_step": 258146, "epoch": 1536} {"train_loss": -11.86241626739502, "global_step": 258147, "epoch": 1536} {"train_loss": -11.944683074951172, "global_step": 258148, "epoch": 1536} {"train_loss": -11.891764640808105, "global_step": 258149, "epoch": 1536} {"train_loss": -11.798324584960938, "global_step": 258150, "epoch": 1536} {"train_loss": -11.915231704711914, "global_step": 258151, "epoch": 1536} {"train_loss": -11.843341827392578, "global_step": 258152, "epoch": 1536} {"train_loss": -12.044831275939941, "global_step": 258153, "epoch": 1536} {"train_loss": -11.869806289672852, "global_step": 258154, "epoch": 1536} {"train_loss": -11.706449508666992, "global_step": 258155, "epoch": 1536} {"train_loss": -11.859796524047852, "global_step": 258156, "epoch": 1536} {"train_loss": -11.85517692565918, "global_step": 258157, "epoch": 1536} {"train_loss": -11.951870918273926, "global_step": 258158, "epoch": 1536} {"train_loss": -11.952659606933594, "global_step": 258159, "epoch": 1536} {"train_loss": -11.64919662475586, "global_step": 258160, "epoch": 1536} {"train_loss": -11.942811965942383, "global_step": 258161, "epoch": 1536} {"train_loss": -11.947687149047852, "global_step": 258162, "epoch": 1536} {"train_loss": -11.9431734085083, "global_step": 258163, "epoch": 1536} {"train_loss": -11.953421592712402, "global_step": 258164, "epoch": 1536} {"train_loss": -11.867181777954102, "global_step": 258165, "epoch": 1536} {"train_loss": -12.036587715148926, "global_step": 258166, "epoch": 1536} {"train_loss": -11.989500045776367, "global_step": 258167, "epoch": 1536} {"train_loss": -11.789616584777832, "global_step": 258168, "epoch": 1536} {"train_loss": -11.986459732055664, "global_step": 258169, "epoch": 1536} {"train_loss": -11.856490135192871, "global_step": 258170, "epoch": 1536} {"train_loss": -11.922574996948242, "global_step": 258171, "epoch": 1536} {"train_loss": -11.925434112548828, "global_step": 258172, "epoch": 1536} {"train_loss": -11.780245780944824, "global_step": 258173, "epoch": 1536} {"train_loss": -11.509443283081055, "global_step": 258174, "epoch": 1536} {"train_loss": -11.600317001342773, "global_step": 258175, "epoch": 1536} {"train_loss": -11.85224723815918, "global_step": 258176, "epoch": 1536} {"train_loss": -11.787346839904785, "global_step": 258177, "epoch": 1536} {"train_loss": -11.53143310546875, "global_step": 258178, "epoch": 1536} {"train_loss": -11.576898574829102, "global_step": 258179, "epoch": 1536} {"train_loss": -11.81285285949707, "global_step": 258180, "epoch": 1536} {"train_loss": -12.002224922180176, "global_step": 258181, "epoch": 1536} {"train_loss": -11.745562553405762, "global_step": 258182, "epoch": 1536} {"train_loss": -11.807479858398438, "global_step": 258183, "epoch": 1536} {"train_loss": -12.05879020690918, "global_step": 258184, "epoch": 1536} {"train_loss": -12.000336647033691, "global_step": 258185, "epoch": 1536} {"train_loss": -11.838232040405273, "global_step": 258186, "epoch": 1536} {"train_loss": -12.104558944702148, "global_step": 258187, "epoch": 1536} {"train_loss": -11.968281745910645, "global_step": 258188, "epoch": 1536} {"train_loss": -11.765583038330078, "global_step": 258189, "epoch": 1536} {"train_loss": -12.026152610778809, "global_step": 258190, "epoch": 1536} {"train_loss": -11.892478942871094, "global_step": 258191, "epoch": 1536} {"train_loss": -11.874886512756348, "global_step": 258192, "epoch": 1536} {"train_loss": -12.035860061645508, "global_step": 258193, "epoch": 1536} {"train_loss": -11.875387191772461, "global_step": 258194, "epoch": 1536} {"train_loss": -11.570804595947266, "global_step": 258195, "epoch": 1536} {"train_loss": -11.420703887939453, "global_step": 258196, "epoch": 1536} {"train_loss": -11.609395027160645, "global_step": 258197, "epoch": 1536} {"train_loss": -11.624038696289062, "global_step": 258198, "epoch": 1536} {"train_loss": -11.782188415527344, "global_step": 258199, "epoch": 1536} {"train_loss": -10.668580055236816, "global_step": 258200, "epoch": 1536} {"train_loss": -11.42676830291748, "global_step": 258201, "epoch": 1536} {"train_loss": -11.900726318359375, "global_step": 258202, "epoch": 1536} {"train_loss": -11.327743530273438, "global_step": 258203, "epoch": 1536} {"train_loss": -11.787345886230469, "global_step": 258204, "epoch": 1536} {"train_loss": -11.752888679504395, "global_step": 258205, "epoch": 1536} {"train_loss": -11.670772552490234, "global_step": 258206, "epoch": 1536} {"train_loss": -11.309776306152344, "global_step": 258207, "epoch": 1536} {"train_loss": -11.925850868225098, "global_step": 258208, "epoch": 1536} {"train_loss": -11.56895637512207, "global_step": 258209, "epoch": 1536} {"train_loss": -11.663423538208008, "global_step": 258210, "epoch": 1536} {"train_loss": -11.681367874145508, "global_step": 258211, "epoch": 1536} {"train_loss": -11.614774703979492, "global_step": 258212, "epoch": 1536} {"train_loss": -11.38149642944336, "global_step": 258213, "epoch": 1536} {"train_loss": -11.66512680053711, "global_step": 258214, "epoch": 1536} {"train_loss": -11.43693245876403, "global_step": 258215, "epoch": 1536, "val_loss": 267609.09375} {"train_loss": -11.648977279663086, "global_step": 258216, "epoch": 1537} {"train_loss": -11.486308097839355, "global_step": 258217, "epoch": 1537} {"train_loss": -10.969850540161133, "global_step": 258218, "epoch": 1537} {"train_loss": -11.767667770385742, "global_step": 258219, "epoch": 1537} {"train_loss": -11.826187133789062, "global_step": 258220, "epoch": 1537} {"train_loss": -11.554893493652344, "global_step": 258221, "epoch": 1537} {"train_loss": -11.755973815917969, "global_step": 258222, "epoch": 1537} {"train_loss": -11.804271697998047, "global_step": 258223, "epoch": 1537} {"train_loss": -11.790223121643066, "global_step": 258224, "epoch": 1537} {"train_loss": -11.806915283203125, "global_step": 258225, "epoch": 1537} {"train_loss": -11.904050827026367, "global_step": 258226, "epoch": 1537} {"train_loss": -11.676595687866211, "global_step": 258227, "epoch": 1537} {"train_loss": -11.680797576904297, "global_step": 258228, "epoch": 1537} {"train_loss": -11.839947700500488, "global_step": 258229, "epoch": 1537} {"train_loss": -11.741907119750977, "global_step": 258230, "epoch": 1537} {"train_loss": -11.738216400146484, "global_step": 258231, "epoch": 1537} {"train_loss": -11.879304885864258, "global_step": 258232, "epoch": 1537} {"train_loss": -11.998429298400879, "global_step": 258233, "epoch": 1537} {"train_loss": -12.075119018554688, "global_step": 258234, "epoch": 1537} {"train_loss": -12.072309494018555, "global_step": 258235, "epoch": 1537} {"train_loss": -12.202632904052734, "global_step": 258236, "epoch": 1537} {"train_loss": -12.015947341918945, "global_step": 258237, "epoch": 1537} {"train_loss": -12.053411483764648, "global_step": 258238, "epoch": 1537} {"train_loss": -11.909774780273438, "global_step": 258239, "epoch": 1537} {"train_loss": -11.909252166748047, "global_step": 258240, "epoch": 1537} {"train_loss": -12.237972259521484, "global_step": 258241, "epoch": 1537} {"train_loss": -12.172582626342773, "global_step": 258242, "epoch": 1537} {"train_loss": -12.064776420593262, "global_step": 258243, "epoch": 1537} {"train_loss": -11.906264305114746, "global_step": 258244, "epoch": 1537} {"train_loss": -12.273255348205566, "global_step": 258245, "epoch": 1537} {"train_loss": -11.804914474487305, "global_step": 258246, "epoch": 1537} {"train_loss": -11.87603759765625, "global_step": 258247, "epoch": 1537} {"train_loss": -12.164782524108887, "global_step": 258248, "epoch": 1537} {"train_loss": -11.877767562866211, "global_step": 258249, "epoch": 1537} {"train_loss": -12.111982345581055, "global_step": 258250, "epoch": 1537} {"train_loss": -12.229745864868164, "global_step": 258251, "epoch": 1537} {"train_loss": -11.981348037719727, "global_step": 258252, "epoch": 1537} {"train_loss": -11.979616165161133, "global_step": 258253, "epoch": 1537} {"train_loss": -12.14318561553955, "global_step": 258254, "epoch": 1537} {"train_loss": -11.868005752563477, "global_step": 258255, "epoch": 1537} {"train_loss": -11.728174209594727, "global_step": 258256, "epoch": 1537} {"train_loss": -12.152544021606445, "global_step": 258257, "epoch": 1537} {"train_loss": -11.883320808410645, "global_step": 258258, "epoch": 1537} {"train_loss": -11.463220596313477, "global_step": 258259, "epoch": 1537} {"train_loss": -12.065256118774414, "global_step": 258260, "epoch": 1537} {"train_loss": -12.039430618286133, "global_step": 258261, "epoch": 1537} {"train_loss": -11.855293273925781, "global_step": 258262, "epoch": 1537} {"train_loss": -11.759775161743164, "global_step": 258263, "epoch": 1537} {"train_loss": -11.917776107788086, "global_step": 258264, "epoch": 1537} {"train_loss": -11.992025375366211, "global_step": 258265, "epoch": 1537} {"train_loss": -11.988906860351562, "global_step": 258266, "epoch": 1537} {"train_loss": -12.14547348022461, "global_step": 258267, "epoch": 1537} {"train_loss": -11.784299850463867, "global_step": 258268, "epoch": 1537} {"train_loss": -11.366540908813477, "global_step": 258269, "epoch": 1537} {"train_loss": -11.729452133178711, "global_step": 258270, "epoch": 1537} {"train_loss": -11.725971221923828, "global_step": 258271, "epoch": 1537} {"train_loss": -11.450572967529297, "global_step": 258272, "epoch": 1537} {"train_loss": -12.084016799926758, "global_step": 258273, "epoch": 1537} {"train_loss": -12.075897216796875, "global_step": 258274, "epoch": 1537} {"train_loss": -12.181126594543457, "global_step": 258275, "epoch": 1537} {"train_loss": -12.030000686645508, "global_step": 258276, "epoch": 1537} {"train_loss": -12.034561157226562, "global_step": 258277, "epoch": 1537} {"train_loss": -12.193218231201172, "global_step": 258278, "epoch": 1537} {"train_loss": -11.877157211303711, "global_step": 258279, "epoch": 1537} {"train_loss": -11.46652603149414, "global_step": 258280, "epoch": 1537} {"train_loss": -11.97359561920166, "global_step": 258281, "epoch": 1537} {"train_loss": -12.10157585144043, "global_step": 258282, "epoch": 1537} {"train_loss": -11.7633056640625, "global_step": 258283, "epoch": 1537} {"train_loss": -12.012107849121094, "global_step": 258284, "epoch": 1537} {"train_loss": -12.120401382446289, "global_step": 258285, "epoch": 1537} {"train_loss": -12.043039321899414, "global_step": 258286, "epoch": 1537} {"train_loss": -11.477521896362305, "global_step": 258287, "epoch": 1537} {"train_loss": -10.845032691955566, "global_step": 258288, "epoch": 1537} {"train_loss": -10.629386901855469, "global_step": 258289, "epoch": 1537} {"train_loss": -11.993370056152344, "global_step": 258290, "epoch": 1537} {"train_loss": -11.960268020629883, "global_step": 258291, "epoch": 1537} {"train_loss": -11.605566024780273, "global_step": 258292, "epoch": 1537} {"train_loss": -11.680047988891602, "global_step": 258293, "epoch": 1537} {"train_loss": -11.820558547973633, "global_step": 258294, "epoch": 1537} {"train_loss": -11.822961807250977, "global_step": 258295, "epoch": 1537} {"train_loss": -11.590798377990723, "global_step": 258296, "epoch": 1537} {"train_loss": -11.507670402526855, "global_step": 258297, "epoch": 1537} {"train_loss": -11.809188842773438, "global_step": 258298, "epoch": 1537} {"train_loss": -12.004185676574707, "global_step": 258299, "epoch": 1537} {"train_loss": -11.615104675292969, "global_step": 258300, "epoch": 1537} {"train_loss": -11.791826248168945, "global_step": 258301, "epoch": 1537} {"train_loss": -12.10627269744873, "global_step": 258302, "epoch": 1537} {"train_loss": -11.889541625976562, "global_step": 258303, "epoch": 1537} {"train_loss": -12.053436279296875, "global_step": 258304, "epoch": 1537} {"train_loss": -12.019830703735352, "global_step": 258305, "epoch": 1537} {"train_loss": -12.182930946350098, "global_step": 258306, "epoch": 1537} {"train_loss": -12.069036483764648, "global_step": 258307, "epoch": 1537} {"train_loss": -12.050457000732422, "global_step": 258308, "epoch": 1537} {"train_loss": -12.035299301147461, "global_step": 258309, "epoch": 1537} {"train_loss": -11.989734649658203, "global_step": 258310, "epoch": 1537} {"train_loss": -11.90677261352539, "global_step": 258311, "epoch": 1537} {"train_loss": -11.590108871459961, "global_step": 258312, "epoch": 1537} {"train_loss": -11.947265625, "global_step": 258313, "epoch": 1537} {"train_loss": -11.661375045776367, "global_step": 258314, "epoch": 1537} {"train_loss": -11.712383270263672, "global_step": 258315, "epoch": 1537} {"train_loss": -12.230605125427246, "global_step": 258316, "epoch": 1537} {"train_loss": -11.47027587890625, "global_step": 258317, "epoch": 1537} {"train_loss": -11.189611434936523, "global_step": 258318, "epoch": 1537} {"train_loss": -11.650802612304688, "global_step": 258319, "epoch": 1537} {"train_loss": -11.615812301635742, "global_step": 258320, "epoch": 1537} {"train_loss": -10.525175094604492, "global_step": 258321, "epoch": 1537} {"train_loss": -12.03459358215332, "global_step": 258322, "epoch": 1537} {"train_loss": -9.515412330627441, "global_step": 258323, "epoch": 1537} {"train_loss": -9.706687927246094, "global_step": 258324, "epoch": 1537} {"train_loss": -9.898265838623047, "global_step": 258325, "epoch": 1537} {"train_loss": -10.775726318359375, "global_step": 258326, "epoch": 1537} {"train_loss": -9.958362579345703, "global_step": 258327, "epoch": 1537} {"train_loss": -8.548463821411133, "global_step": 258328, "epoch": 1537} {"train_loss": -10.481792449951172, "global_step": 258329, "epoch": 1537} {"train_loss": -9.031583786010742, "global_step": 258330, "epoch": 1537} {"train_loss": -9.283842086791992, "global_step": 258331, "epoch": 1537} {"train_loss": -9.735724449157715, "global_step": 258332, "epoch": 1537} {"train_loss": -8.545675277709961, "global_step": 258333, "epoch": 1537} {"train_loss": -9.255925178527832, "global_step": 258334, "epoch": 1537} {"train_loss": -9.503801345825195, "global_step": 258335, "epoch": 1537} {"train_loss": -9.119649887084961, "global_step": 258336, "epoch": 1537} {"train_loss": -9.994111061096191, "global_step": 258337, "epoch": 1537} {"train_loss": -10.469894409179688, "global_step": 258338, "epoch": 1537} {"train_loss": -9.847509384155273, "global_step": 258339, "epoch": 1537} {"train_loss": -10.84170150756836, "global_step": 258340, "epoch": 1537} {"train_loss": -10.50912094116211, "global_step": 258341, "epoch": 1537} {"train_loss": -11.265850067138672, "global_step": 258342, "epoch": 1537} {"train_loss": -10.95926284790039, "global_step": 258343, "epoch": 1537} {"train_loss": -11.168975830078125, "global_step": 258344, "epoch": 1537} {"train_loss": -11.272218704223633, "global_step": 258345, "epoch": 1537} {"train_loss": -11.352577209472656, "global_step": 258346, "epoch": 1537} {"train_loss": -11.511171340942383, "global_step": 258347, "epoch": 1537} {"train_loss": -11.057438850402832, "global_step": 258348, "epoch": 1537} {"train_loss": -11.535181045532227, "global_step": 258349, "epoch": 1537} {"train_loss": -11.517202377319336, "global_step": 258350, "epoch": 1537} {"train_loss": -11.545461654663086, "global_step": 258351, "epoch": 1537} {"train_loss": -11.904422760009766, "global_step": 258352, "epoch": 1537} {"train_loss": -10.946735382080078, "global_step": 258353, "epoch": 1537} {"train_loss": -11.661182403564453, "global_step": 258354, "epoch": 1537} {"train_loss": -11.383108139038086, "global_step": 258355, "epoch": 1537} {"train_loss": -11.77978229522705, "global_step": 258356, "epoch": 1537} {"train_loss": -11.474456787109375, "global_step": 258357, "epoch": 1537} {"train_loss": -11.631160736083984, "global_step": 258358, "epoch": 1537} {"train_loss": -11.486091613769531, "global_step": 258359, "epoch": 1537} {"train_loss": -11.883811950683594, "global_step": 258360, "epoch": 1537} {"train_loss": -11.664745330810547, "global_step": 258361, "epoch": 1537} {"train_loss": -11.75523853302002, "global_step": 258362, "epoch": 1537} {"train_loss": -11.659948348999023, "global_step": 258363, "epoch": 1537} {"train_loss": -11.868673324584961, "global_step": 258364, "epoch": 1537} {"train_loss": -11.606452941894531, "global_step": 258365, "epoch": 1537} {"train_loss": -11.62434196472168, "global_step": 258366, "epoch": 1537} {"train_loss": -11.331827163696289, "global_step": 258367, "epoch": 1537} {"train_loss": -11.376993179321289, "global_step": 258368, "epoch": 1537} {"train_loss": -11.711153030395508, "global_step": 258369, "epoch": 1537} {"train_loss": -11.485085487365723, "global_step": 258370, "epoch": 1537} {"train_loss": -11.621052742004395, "global_step": 258371, "epoch": 1537} {"train_loss": -11.586620330810547, "global_step": 258372, "epoch": 1537} {"train_loss": -11.881818771362305, "global_step": 258373, "epoch": 1537} {"train_loss": -11.73298454284668, "global_step": 258374, "epoch": 1537} {"train_loss": -11.80472183227539, "global_step": 258375, "epoch": 1537} {"train_loss": -11.622692108154297, "global_step": 258376, "epoch": 1537} {"train_loss": -11.96832275390625, "global_step": 258377, "epoch": 1537} {"train_loss": -11.810691833496094, "global_step": 258378, "epoch": 1537} {"train_loss": -11.765212059020996, "global_step": 258379, "epoch": 1537} {"train_loss": -11.831700325012207, "global_step": 258380, "epoch": 1537} {"train_loss": -11.922121047973633, "global_step": 258381, "epoch": 1537} {"train_loss": -11.93593978881836, "global_step": 258382, "epoch": 1537} {"train_loss": -11.538697662807646, "global_step": 258383, "epoch": 1537, "val_loss": 263477.0} {"train_loss": -11.851127624511719, "global_step": 258384, "epoch": 1538} {"train_loss": -11.978597640991211, "global_step": 258385, "epoch": 1538} {"train_loss": -11.833101272583008, "global_step": 258386, "epoch": 1538} {"train_loss": -11.96985912322998, "global_step": 258387, "epoch": 1538} {"train_loss": -12.10849380493164, "global_step": 258388, "epoch": 1538} {"train_loss": -11.99850082397461, "global_step": 258389, "epoch": 1538} {"train_loss": -12.066439628601074, "global_step": 258390, "epoch": 1538} {"train_loss": -11.999198913574219, "global_step": 258391, "epoch": 1538} {"train_loss": -11.95953369140625, "global_step": 258392, "epoch": 1538} {"train_loss": -12.10267448425293, "global_step": 258393, "epoch": 1538} {"train_loss": -11.903196334838867, "global_step": 258394, "epoch": 1538} {"train_loss": -12.002100944519043, "global_step": 258395, "epoch": 1538} {"train_loss": -11.854958534240723, "global_step": 258396, "epoch": 1538} {"train_loss": -11.977259635925293, "global_step": 258397, "epoch": 1538} {"train_loss": -12.225128173828125, "global_step": 258398, "epoch": 1538} {"train_loss": -12.00853157043457, "global_step": 258399, "epoch": 1538} {"train_loss": -12.09863567352295, "global_step": 258400, "epoch": 1538} {"train_loss": -12.197010040283203, "global_step": 258401, "epoch": 1538} {"train_loss": -11.845903396606445, "global_step": 258402, "epoch": 1538} {"train_loss": -12.02682113647461, "global_step": 258403, "epoch": 1538} {"train_loss": -11.804594039916992, "global_step": 258404, "epoch": 1538} {"train_loss": -12.015905380249023, "global_step": 258405, "epoch": 1538} {"train_loss": -12.100652694702148, "global_step": 258406, "epoch": 1538} {"train_loss": -12.099032402038574, "global_step": 258407, "epoch": 1538} {"train_loss": -11.912019729614258, "global_step": 258408, "epoch": 1538} {"train_loss": -12.040950775146484, "global_step": 258409, "epoch": 1538} {"train_loss": -12.065186500549316, "global_step": 258410, "epoch": 1538} {"train_loss": -12.262678146362305, "global_step": 258411, "epoch": 1538} {"train_loss": -12.163592338562012, "global_step": 258412, "epoch": 1538} {"train_loss": -12.106918334960938, "global_step": 258413, "epoch": 1538} {"train_loss": -12.06702995300293, "global_step": 258414, "epoch": 1538} {"train_loss": -11.887619972229004, "global_step": 258415, "epoch": 1538} {"train_loss": -12.260514259338379, "global_step": 258416, "epoch": 1538} {"train_loss": -11.76217269897461, "global_step": 258417, "epoch": 1538} {"train_loss": -12.14714241027832, "global_step": 258418, "epoch": 1538} {"train_loss": -12.140634536743164, "global_step": 258419, "epoch": 1538} {"train_loss": -11.991142272949219, "global_step": 258420, "epoch": 1538} {"train_loss": -12.222039222717285, "global_step": 258421, "epoch": 1538} {"train_loss": -12.133694648742676, "global_step": 258422, "epoch": 1538} {"train_loss": -11.974053382873535, "global_step": 258423, "epoch": 1538} {"train_loss": -12.228508949279785, "global_step": 258424, "epoch": 1538} {"train_loss": -11.868419647216797, "global_step": 258425, "epoch": 1538} {"train_loss": -12.022858619689941, "global_step": 258426, "epoch": 1538} {"train_loss": -12.266460418701172, "global_step": 258427, "epoch": 1538} {"train_loss": -12.098922729492188, "global_step": 258428, "epoch": 1538} {"train_loss": -12.122051239013672, "global_step": 258429, "epoch": 1538} {"train_loss": -12.141105651855469, "global_step": 258430, "epoch": 1538} {"train_loss": -12.108396530151367, "global_step": 258431, "epoch": 1538} {"train_loss": -12.212869644165039, "global_step": 258432, "epoch": 1538} {"train_loss": -12.14145278930664, "global_step": 258433, "epoch": 1538} {"train_loss": -12.207832336425781, "global_step": 258434, "epoch": 1538} {"train_loss": -12.117053985595703, "global_step": 258435, "epoch": 1538} {"train_loss": -12.251852035522461, "global_step": 258436, "epoch": 1538} {"train_loss": -12.163595199584961, "global_step": 258437, "epoch": 1538} {"train_loss": -12.035459518432617, "global_step": 258438, "epoch": 1538} {"train_loss": -12.169722557067871, "global_step": 258439, "epoch": 1538} {"train_loss": -12.083890914916992, "global_step": 258440, "epoch": 1538} {"train_loss": -11.761502265930176, "global_step": 258441, "epoch": 1538} {"train_loss": -12.132901191711426, "global_step": 258442, "epoch": 1538} {"train_loss": -12.15894603729248, "global_step": 258443, "epoch": 1538} {"train_loss": -12.283121109008789, "global_step": 258444, "epoch": 1538} {"train_loss": -12.020179748535156, "global_step": 258445, "epoch": 1538} {"train_loss": -12.407890319824219, "global_step": 258446, "epoch": 1538} {"train_loss": -12.12189769744873, "global_step": 258447, "epoch": 1538} {"train_loss": -12.256431579589844, "global_step": 258448, "epoch": 1538} {"train_loss": -12.083330154418945, "global_step": 258449, "epoch": 1538} {"train_loss": -11.473316192626953, "global_step": 258450, "epoch": 1538} {"train_loss": -11.096315383911133, "global_step": 258451, "epoch": 1538} {"train_loss": -10.72514820098877, "global_step": 258452, "epoch": 1538} {"train_loss": -11.209881782531738, "global_step": 258453, "epoch": 1538} {"train_loss": -11.323299407958984, "global_step": 258454, "epoch": 1538} {"train_loss": -11.409852981567383, "global_step": 258455, "epoch": 1538} {"train_loss": -11.749824523925781, "global_step": 258456, "epoch": 1538} {"train_loss": -10.568912506103516, "global_step": 258457, "epoch": 1538} {"train_loss": -11.685480117797852, "global_step": 258458, "epoch": 1538} {"train_loss": -11.045652389526367, "global_step": 258459, "epoch": 1538} {"train_loss": -11.79640007019043, "global_step": 258460, "epoch": 1538} {"train_loss": -11.128562927246094, "global_step": 258461, "epoch": 1538} {"train_loss": -11.667343139648438, "global_step": 258462, "epoch": 1538} {"train_loss": -11.584362030029297, "global_step": 258463, "epoch": 1538} {"train_loss": -11.696759223937988, "global_step": 258464, "epoch": 1538} {"train_loss": -10.555534362792969, "global_step": 258465, "epoch": 1538} {"train_loss": -11.136323928833008, "global_step": 258466, "epoch": 1538} {"train_loss": -11.437837600708008, "global_step": 258467, "epoch": 1538} {"train_loss": -11.580628395080566, "global_step": 258468, "epoch": 1538} {"train_loss": -10.841012954711914, "global_step": 258469, "epoch": 1538} {"train_loss": -11.416253089904785, "global_step": 258470, "epoch": 1538} {"train_loss": -11.952645301818848, "global_step": 258471, "epoch": 1538} {"train_loss": -11.416780471801758, "global_step": 258472, "epoch": 1538} {"train_loss": -11.738838195800781, "global_step": 258473, "epoch": 1538} {"train_loss": -11.917045593261719, "global_step": 258474, "epoch": 1538} {"train_loss": -11.471757888793945, "global_step": 258475, "epoch": 1538} {"train_loss": -11.269094467163086, "global_step": 258476, "epoch": 1538} {"train_loss": -11.38353443145752, "global_step": 258477, "epoch": 1538} {"train_loss": -10.822732925415039, "global_step": 258478, "epoch": 1538} {"train_loss": -11.262754440307617, "global_step": 258479, "epoch": 1538} {"train_loss": -11.681451797485352, "global_step": 258480, "epoch": 1538} {"train_loss": -10.706584930419922, "global_step": 258481, "epoch": 1538} {"train_loss": -10.061054229736328, "global_step": 258482, "epoch": 1538} {"train_loss": -10.384224891662598, "global_step": 258483, "epoch": 1538} {"train_loss": -7.940056324005127, "global_step": 258484, "epoch": 1538} {"train_loss": -8.453605651855469, "global_step": 258485, "epoch": 1538} {"train_loss": -8.341171264648438, "global_step": 258486, "epoch": 1538} {"train_loss": -9.636697769165039, "global_step": 258487, "epoch": 1538} {"train_loss": -8.398801803588867, "global_step": 258488, "epoch": 1538} {"train_loss": -7.774936676025391, "global_step": 258489, "epoch": 1538} {"train_loss": -8.8226318359375, "global_step": 258490, "epoch": 1538} {"train_loss": -9.345507621765137, "global_step": 258491, "epoch": 1538} {"train_loss": -10.251811981201172, "global_step": 258492, "epoch": 1538} {"train_loss": -9.687931060791016, "global_step": 258493, "epoch": 1538} {"train_loss": -10.087287902832031, "global_step": 258494, "epoch": 1538} {"train_loss": -9.472333908081055, "global_step": 258495, "epoch": 1538} {"train_loss": -9.466148376464844, "global_step": 258496, "epoch": 1538} {"train_loss": -11.031821250915527, "global_step": 258497, "epoch": 1538} {"train_loss": -9.736989974975586, "global_step": 258498, "epoch": 1538} {"train_loss": -10.183135986328125, "global_step": 258499, "epoch": 1538} {"train_loss": -11.091119766235352, "global_step": 258500, "epoch": 1538} {"train_loss": -10.940241813659668, "global_step": 258501, "epoch": 1538} {"train_loss": -10.314239501953125, "global_step": 258502, "epoch": 1538} {"train_loss": -10.831933975219727, "global_step": 258503, "epoch": 1538} {"train_loss": -10.573012351989746, "global_step": 258504, "epoch": 1538} {"train_loss": -10.851919174194336, "global_step": 258505, "epoch": 1538} {"train_loss": -11.532386779785156, "global_step": 258506, "epoch": 1538} {"train_loss": -10.701850891113281, "global_step": 258507, "epoch": 1538} {"train_loss": -11.273202896118164, "global_step": 258508, "epoch": 1538} {"train_loss": -11.478948593139648, "global_step": 258509, "epoch": 1538} {"train_loss": -10.654428482055664, "global_step": 258510, "epoch": 1538} {"train_loss": -11.372699737548828, "global_step": 258511, "epoch": 1538} {"train_loss": -11.313628196716309, "global_step": 258512, "epoch": 1538} {"train_loss": -11.33569622039795, "global_step": 258513, "epoch": 1538} {"train_loss": -11.164896011352539, "global_step": 258514, "epoch": 1538} {"train_loss": -11.533373832702637, "global_step": 258515, "epoch": 1538} {"train_loss": -11.118462562561035, "global_step": 258516, "epoch": 1538} {"train_loss": -11.495747566223145, "global_step": 258517, "epoch": 1538} {"train_loss": -11.64976692199707, "global_step": 258518, "epoch": 1538} {"train_loss": -11.378789901733398, "global_step": 258519, "epoch": 1538} {"train_loss": -11.369016647338867, "global_step": 258520, "epoch": 1538} {"train_loss": -11.590703964233398, "global_step": 258521, "epoch": 1538} {"train_loss": -11.699060440063477, "global_step": 258522, "epoch": 1538} {"train_loss": -11.574193954467773, "global_step": 258523, "epoch": 1538} {"train_loss": -11.655715942382812, "global_step": 258524, "epoch": 1538} {"train_loss": -11.568166732788086, "global_step": 258525, "epoch": 1538} {"train_loss": -11.790365219116211, "global_step": 258526, "epoch": 1538} {"train_loss": -11.840350151062012, "global_step": 258527, "epoch": 1538} {"train_loss": -11.768780708312988, "global_step": 258528, "epoch": 1538} {"train_loss": -11.653054237365723, "global_step": 258529, "epoch": 1538} {"train_loss": -11.880810737609863, "global_step": 258530, "epoch": 1538} {"train_loss": -11.63164234161377, "global_step": 258531, "epoch": 1538} {"train_loss": -11.796754837036133, "global_step": 258532, "epoch": 1538} {"train_loss": -11.889205932617188, "global_step": 258533, "epoch": 1538} {"train_loss": -11.876799583435059, "global_step": 258534, "epoch": 1538} {"train_loss": -11.721628189086914, "global_step": 258535, "epoch": 1538} {"train_loss": -11.756265640258789, "global_step": 258536, "epoch": 1538} {"train_loss": -11.703008651733398, "global_step": 258537, "epoch": 1538} {"train_loss": -11.664730072021484, "global_step": 258538, "epoch": 1538} {"train_loss": -11.59984016418457, "global_step": 258539, "epoch": 1538} {"train_loss": -11.848905563354492, "global_step": 258540, "epoch": 1538} {"train_loss": -11.687119483947754, "global_step": 258541, "epoch": 1538} {"train_loss": -11.89206314086914, "global_step": 258542, "epoch": 1538} {"train_loss": -11.627706527709961, "global_step": 258543, "epoch": 1538} {"train_loss": -11.9234619140625, "global_step": 258544, "epoch": 1538} {"train_loss": -11.681836128234863, "global_step": 258545, "epoch": 1538} {"train_loss": -11.714866638183594, "global_step": 258546, "epoch": 1538} {"train_loss": -11.720781326293945, "global_step": 258547, "epoch": 1538} {"train_loss": -11.678121566772461, "global_step": 258548, "epoch": 1538} {"train_loss": -11.922916412353516, "global_step": 258549, "epoch": 1538} {"train_loss": -11.986804962158203, "global_step": 258550, "epoch": 1538} {"train_loss": -11.46788616691317, "global_step": 258551, "epoch": 1538, "val_loss": 266450.625} {"train_loss": -11.87727165222168, "global_step": 258552, "epoch": 1539} {"train_loss": -11.876543045043945, "global_step": 258553, "epoch": 1539} {"train_loss": -12.060691833496094, "global_step": 258554, "epoch": 1539} {"train_loss": -11.747448921203613, "global_step": 258555, "epoch": 1539} {"train_loss": -11.800394058227539, "global_step": 258556, "epoch": 1539} {"train_loss": -11.887032508850098, "global_step": 258557, "epoch": 1539} {"train_loss": -12.075469970703125, "global_step": 258558, "epoch": 1539} {"train_loss": -11.867668151855469, "global_step": 258559, "epoch": 1539} {"train_loss": -11.877103805541992, "global_step": 258560, "epoch": 1539} {"train_loss": -11.438699722290039, "global_step": 258561, "epoch": 1539} {"train_loss": -11.100332260131836, "global_step": 258562, "epoch": 1539} {"train_loss": -11.520428657531738, "global_step": 258563, "epoch": 1539} {"train_loss": -11.428794860839844, "global_step": 258564, "epoch": 1539} {"train_loss": -11.753715515136719, "global_step": 258565, "epoch": 1539} {"train_loss": -11.551200866699219, "global_step": 258566, "epoch": 1539} {"train_loss": -11.588960647583008, "global_step": 258567, "epoch": 1539} {"train_loss": -11.10477066040039, "global_step": 258568, "epoch": 1539} {"train_loss": -11.627164840698242, "global_step": 258569, "epoch": 1539} {"train_loss": -10.082138061523438, "global_step": 258570, "epoch": 1539} {"train_loss": -11.524499893188477, "global_step": 258571, "epoch": 1539} {"train_loss": -10.69262409210205, "global_step": 258572, "epoch": 1539} {"train_loss": -11.134618759155273, "global_step": 258573, "epoch": 1539} {"train_loss": -10.702457427978516, "global_step": 258574, "epoch": 1539} {"train_loss": -11.228967666625977, "global_step": 258575, "epoch": 1539} {"train_loss": -11.545374870300293, "global_step": 258576, "epoch": 1539} {"train_loss": -11.465446472167969, "global_step": 258577, "epoch": 1539} {"train_loss": -11.451807022094727, "global_step": 258578, "epoch": 1539} {"train_loss": -11.791037559509277, "global_step": 258579, "epoch": 1539} {"train_loss": -11.760164260864258, "global_step": 258580, "epoch": 1539} {"train_loss": -11.561155319213867, "global_step": 258581, "epoch": 1539} {"train_loss": -11.722495079040527, "global_step": 258582, "epoch": 1539} {"train_loss": -11.632965087890625, "global_step": 258583, "epoch": 1539} {"train_loss": -11.937484741210938, "global_step": 258584, "epoch": 1539} {"train_loss": -11.40069580078125, "global_step": 258585, "epoch": 1539} {"train_loss": -11.869441986083984, "global_step": 258586, "epoch": 1539} {"train_loss": -11.655675888061523, "global_step": 258587, "epoch": 1539} {"train_loss": -11.91710090637207, "global_step": 258588, "epoch": 1539} {"train_loss": -11.771242141723633, "global_step": 258589, "epoch": 1539} {"train_loss": -11.876646995544434, "global_step": 258590, "epoch": 1539} {"train_loss": -11.92652416229248, "global_step": 258591, "epoch": 1539} {"train_loss": -11.756628036499023, "global_step": 258592, "epoch": 1539} {"train_loss": -11.783926010131836, "global_step": 258593, "epoch": 1539} {"train_loss": -11.70666790008545, "global_step": 258594, "epoch": 1539} {"train_loss": -11.948395729064941, "global_step": 258595, "epoch": 1539} {"train_loss": -11.996949195861816, "global_step": 258596, "epoch": 1539} {"train_loss": -11.977408409118652, "global_step": 258597, "epoch": 1539} {"train_loss": -12.113161087036133, "global_step": 258598, "epoch": 1539} {"train_loss": -11.968805313110352, "global_step": 258599, "epoch": 1539} {"train_loss": -11.811668395996094, "global_step": 258600, "epoch": 1539} {"train_loss": -12.05814266204834, "global_step": 258601, "epoch": 1539} {"train_loss": -12.081329345703125, "global_step": 258602, "epoch": 1539} {"train_loss": -12.10654067993164, "global_step": 258603, "epoch": 1539} {"train_loss": -12.047513961791992, "global_step": 258604, "epoch": 1539} {"train_loss": -12.195037841796875, "global_step": 258605, "epoch": 1539} {"train_loss": -11.927352905273438, "global_step": 258606, "epoch": 1539} {"train_loss": -12.083043098449707, "global_step": 258607, "epoch": 1539} {"train_loss": -11.904972076416016, "global_step": 258608, "epoch": 1539} {"train_loss": -12.214898109436035, "global_step": 258609, "epoch": 1539} {"train_loss": -11.983491897583008, "global_step": 258610, "epoch": 1539} {"train_loss": -12.141368865966797, "global_step": 258611, "epoch": 1539} {"train_loss": -12.09122371673584, "global_step": 258612, "epoch": 1539} {"train_loss": -12.018163681030273, "global_step": 258613, "epoch": 1539} {"train_loss": -11.76785659790039, "global_step": 258614, "epoch": 1539} {"train_loss": -11.70701789855957, "global_step": 258615, "epoch": 1539} {"train_loss": -12.19803237915039, "global_step": 258616, "epoch": 1539} {"train_loss": -11.916014671325684, "global_step": 258617, "epoch": 1539} {"train_loss": -12.051922798156738, "global_step": 258618, "epoch": 1539} {"train_loss": -12.071728706359863, "global_step": 258619, "epoch": 1539} {"train_loss": -11.814796447753906, "global_step": 258620, "epoch": 1539} {"train_loss": -12.149614334106445, "global_step": 258621, "epoch": 1539} {"train_loss": -12.069091796875, "global_step": 258622, "epoch": 1539} {"train_loss": -12.267378807067871, "global_step": 258623, "epoch": 1539} {"train_loss": -12.110366821289062, "global_step": 258624, "epoch": 1539} {"train_loss": -12.277047157287598, "global_step": 258625, "epoch": 1539} {"train_loss": -11.912277221679688, "global_step": 258626, "epoch": 1539} {"train_loss": -12.0584135055542, "global_step": 258627, "epoch": 1539} {"train_loss": -12.042411804199219, "global_step": 258628, "epoch": 1539} {"train_loss": -12.153497695922852, "global_step": 258629, "epoch": 1539} {"train_loss": -12.143406867980957, "global_step": 258630, "epoch": 1539} {"train_loss": -12.123064041137695, "global_step": 258631, "epoch": 1539} {"train_loss": -12.083538055419922, "global_step": 258632, "epoch": 1539} {"train_loss": -12.15609073638916, "global_step": 258633, "epoch": 1539} {"train_loss": -12.141475677490234, "global_step": 258634, "epoch": 1539} {"train_loss": -12.023783683776855, "global_step": 258635, "epoch": 1539} {"train_loss": -12.248651504516602, "global_step": 258636, "epoch": 1539} {"train_loss": -11.877403259277344, "global_step": 258637, "epoch": 1539} {"train_loss": -11.411055564880371, "global_step": 258638, "epoch": 1539} {"train_loss": -12.184046745300293, "global_step": 258639, "epoch": 1539} {"train_loss": -11.404098510742188, "global_step": 258640, "epoch": 1539} {"train_loss": -11.440537452697754, "global_step": 258641, "epoch": 1539} {"train_loss": -11.930326461791992, "global_step": 258642, "epoch": 1539} {"train_loss": -12.046778678894043, "global_step": 258643, "epoch": 1539} {"train_loss": -10.978886604309082, "global_step": 258644, "epoch": 1539} {"train_loss": -11.471790313720703, "global_step": 258645, "epoch": 1539} {"train_loss": -11.720521926879883, "global_step": 258646, "epoch": 1539} {"train_loss": -11.937355041503906, "global_step": 258647, "epoch": 1539} {"train_loss": -12.021463394165039, "global_step": 258648, "epoch": 1539} {"train_loss": -11.686967849731445, "global_step": 258649, "epoch": 1539} {"train_loss": -11.887474060058594, "global_step": 258650, "epoch": 1539} {"train_loss": -11.761817932128906, "global_step": 258651, "epoch": 1539} {"train_loss": -11.383891105651855, "global_step": 258652, "epoch": 1539} {"train_loss": -12.009573936462402, "global_step": 258653, "epoch": 1539} {"train_loss": -11.527627944946289, "global_step": 258654, "epoch": 1539} {"train_loss": -11.896339416503906, "global_step": 258655, "epoch": 1539} {"train_loss": -11.368864059448242, "global_step": 258656, "epoch": 1539} {"train_loss": -11.973733901977539, "global_step": 258657, "epoch": 1539} {"train_loss": -11.669864654541016, "global_step": 258658, "epoch": 1539} {"train_loss": -12.08161735534668, "global_step": 258659, "epoch": 1539} {"train_loss": -11.741735458374023, "global_step": 258660, "epoch": 1539} {"train_loss": -11.840429306030273, "global_step": 258661, "epoch": 1539} {"train_loss": -12.088147163391113, "global_step": 258662, "epoch": 1539} {"train_loss": -11.643078804016113, "global_step": 258663, "epoch": 1539} {"train_loss": -12.120594024658203, "global_step": 258664, "epoch": 1539} {"train_loss": -11.7496976852417, "global_step": 258665, "epoch": 1539} {"train_loss": -12.10710334777832, "global_step": 258666, "epoch": 1539} {"train_loss": -11.818458557128906, "global_step": 258667, "epoch": 1539} {"train_loss": -11.603631973266602, "global_step": 258668, "epoch": 1539} {"train_loss": -11.478157043457031, "global_step": 258669, "epoch": 1539} {"train_loss": -11.369390487670898, "global_step": 258670, "epoch": 1539} {"train_loss": -10.009329795837402, "global_step": 258671, "epoch": 1539} {"train_loss": -10.967973709106445, "global_step": 258672, "epoch": 1539} {"train_loss": -10.461181640625, "global_step": 258673, "epoch": 1539} {"train_loss": -10.627617835998535, "global_step": 258674, "epoch": 1539} {"train_loss": -10.23486328125, "global_step": 258675, "epoch": 1539} {"train_loss": -10.690380096435547, "global_step": 258676, "epoch": 1539} {"train_loss": -10.991695404052734, "global_step": 258677, "epoch": 1539} {"train_loss": -8.077877044677734, "global_step": 258678, "epoch": 1539} {"train_loss": -9.043770790100098, "global_step": 258679, "epoch": 1539} {"train_loss": -9.989863395690918, "global_step": 258680, "epoch": 1539} {"train_loss": -7.639107704162598, "global_step": 258681, "epoch": 1539} {"train_loss": -7.209123611450195, "global_step": 258682, "epoch": 1539} {"train_loss": -8.54648494720459, "global_step": 258683, "epoch": 1539} {"train_loss": -8.498130798339844, "global_step": 258684, "epoch": 1539} {"train_loss": -8.437591552734375, "global_step": 258685, "epoch": 1539} {"train_loss": -8.872490882873535, "global_step": 258686, "epoch": 1539} {"train_loss": -8.226322174072266, "global_step": 258687, "epoch": 1539} {"train_loss": -8.044631958007812, "global_step": 258688, "epoch": 1539} {"train_loss": -9.119190216064453, "global_step": 258689, "epoch": 1539} {"train_loss": -8.994955062866211, "global_step": 258690, "epoch": 1539} {"train_loss": -9.545358657836914, "global_step": 258691, "epoch": 1539} {"train_loss": -9.889941215515137, "global_step": 258692, "epoch": 1539} {"train_loss": -9.47749137878418, "global_step": 258693, "epoch": 1539} {"train_loss": -10.663450241088867, "global_step": 258694, "epoch": 1539} {"train_loss": -10.137210845947266, "global_step": 258695, "epoch": 1539} {"train_loss": -10.31155014038086, "global_step": 258696, "epoch": 1539} {"train_loss": -10.458494186401367, "global_step": 258697, "epoch": 1539} {"train_loss": -10.719454765319824, "global_step": 258698, "epoch": 1539} {"train_loss": -10.524127006530762, "global_step": 258699, "epoch": 1539} {"train_loss": -9.620737075805664, "global_step": 258700, "epoch": 1539} {"train_loss": -11.230024337768555, "global_step": 258701, "epoch": 1539} {"train_loss": -10.741544723510742, "global_step": 258702, "epoch": 1539} {"train_loss": -11.136462211608887, "global_step": 258703, "epoch": 1539} {"train_loss": -11.382471084594727, "global_step": 258704, "epoch": 1539} {"train_loss": -10.91321086883545, "global_step": 258705, "epoch": 1539} {"train_loss": -10.114864349365234, "global_step": 258706, "epoch": 1539} {"train_loss": -11.047821998596191, "global_step": 258707, "epoch": 1539} {"train_loss": -10.436904907226562, "global_step": 258708, "epoch": 1539} {"train_loss": -10.428238868713379, "global_step": 258709, "epoch": 1539} {"train_loss": -11.56914234161377, "global_step": 258710, "epoch": 1539} {"train_loss": -10.934776306152344, "global_step": 258711, "epoch": 1539} {"train_loss": -10.367912292480469, "global_step": 258712, "epoch": 1539} {"train_loss": -10.967777252197266, "global_step": 258713, "epoch": 1539} {"train_loss": -11.118523597717285, "global_step": 258714, "epoch": 1539} {"train_loss": -10.366607666015625, "global_step": 258715, "epoch": 1539} {"train_loss": -11.256963729858398, "global_step": 258716, "epoch": 1539} {"train_loss": -11.40170669555664, "global_step": 258717, "epoch": 1539} {"train_loss": -10.468816757202148, "global_step": 258718, "epoch": 1539} {"train_loss": -11.291172725813729, "global_step": 258719, "epoch": 1539, "val_loss": 261804.0} {"train_loss": -11.290433883666992, "global_step": 258720, "epoch": 1540} {"train_loss": -10.558143615722656, "global_step": 258721, "epoch": 1540} {"train_loss": -11.334806442260742, "global_step": 258722, "epoch": 1540} {"train_loss": -11.523805618286133, "global_step": 258723, "epoch": 1540} {"train_loss": -11.379317283630371, "global_step": 258724, "epoch": 1540} {"train_loss": -11.298529624938965, "global_step": 258725, "epoch": 1540} {"train_loss": -11.457717895507812, "global_step": 258726, "epoch": 1540} {"train_loss": -11.549962997436523, "global_step": 258727, "epoch": 1540} {"train_loss": -11.153676986694336, "global_step": 258728, "epoch": 1540} {"train_loss": -11.40144157409668, "global_step": 258729, "epoch": 1540} {"train_loss": -11.669519424438477, "global_step": 258730, "epoch": 1540} {"train_loss": -11.503824234008789, "global_step": 258731, "epoch": 1540} {"train_loss": -11.529060363769531, "global_step": 258732, "epoch": 1540} {"train_loss": -11.557496070861816, "global_step": 258733, "epoch": 1540} {"train_loss": -11.826299667358398, "global_step": 258734, "epoch": 1540} {"train_loss": -11.552617073059082, "global_step": 258735, "epoch": 1540} {"train_loss": -11.639179229736328, "global_step": 258736, "epoch": 1540} {"train_loss": -11.65463924407959, "global_step": 258737, "epoch": 1540} {"train_loss": -11.638908386230469, "global_step": 258738, "epoch": 1540} {"train_loss": -11.602914810180664, "global_step": 258739, "epoch": 1540} {"train_loss": -11.643594741821289, "global_step": 258740, "epoch": 1540} {"train_loss": -11.644981384277344, "global_step": 258741, "epoch": 1540} {"train_loss": -11.768692016601562, "global_step": 258742, "epoch": 1540} {"train_loss": -11.822087287902832, "global_step": 258743, "epoch": 1540} {"train_loss": -11.898963928222656, "global_step": 258744, "epoch": 1540} {"train_loss": -11.66072940826416, "global_step": 258745, "epoch": 1540} {"train_loss": -11.75411605834961, "global_step": 258746, "epoch": 1540} {"train_loss": -11.735115051269531, "global_step": 258747, "epoch": 1540} {"train_loss": -11.728944778442383, "global_step": 258748, "epoch": 1540} {"train_loss": -11.760498046875, "global_step": 258749, "epoch": 1540} {"train_loss": -11.925426483154297, "global_step": 258750, "epoch": 1540} {"train_loss": -11.746593475341797, "global_step": 258751, "epoch": 1540} {"train_loss": -11.82342529296875, "global_step": 258752, "epoch": 1540} {"train_loss": -11.81142807006836, "global_step": 258753, "epoch": 1540} {"train_loss": -11.59647274017334, "global_step": 258754, "epoch": 1540} {"train_loss": -11.85891056060791, "global_step": 258755, "epoch": 1540} {"train_loss": -11.963842391967773, "global_step": 258756, "epoch": 1540} {"train_loss": -11.882067680358887, "global_step": 258757, "epoch": 1540} {"train_loss": -11.871121406555176, "global_step": 258758, "epoch": 1540} {"train_loss": -11.976753234863281, "global_step": 258759, "epoch": 1540} {"train_loss": -12.049226760864258, "global_step": 258760, "epoch": 1540} {"train_loss": -11.928110122680664, "global_step": 258761, "epoch": 1540} {"train_loss": -12.03312873840332, "global_step": 258762, "epoch": 1540} {"train_loss": -11.872057914733887, "global_step": 258763, "epoch": 1540} {"train_loss": -12.025910377502441, "global_step": 258764, "epoch": 1540} {"train_loss": -12.057964324951172, "global_step": 258765, "epoch": 1540} {"train_loss": -11.998750686645508, "global_step": 258766, "epoch": 1540} {"train_loss": -12.0924072265625, "global_step": 258767, "epoch": 1540} {"train_loss": -11.915075302124023, "global_step": 258768, "epoch": 1540} {"train_loss": -12.059585571289062, "global_step": 258769, "epoch": 1540} {"train_loss": -11.982627868652344, "global_step": 258770, "epoch": 1540} {"train_loss": -11.591404914855957, "global_step": 258771, "epoch": 1540} {"train_loss": -12.071812629699707, "global_step": 258772, "epoch": 1540} {"train_loss": -11.848930358886719, "global_step": 258773, "epoch": 1540} {"train_loss": -11.341392517089844, "global_step": 258774, "epoch": 1540} {"train_loss": -11.686857223510742, "global_step": 258775, "epoch": 1540} {"train_loss": -11.907381057739258, "global_step": 258776, "epoch": 1540} {"train_loss": -11.764283180236816, "global_step": 258777, "epoch": 1540} {"train_loss": -12.009729385375977, "global_step": 258778, "epoch": 1540} {"train_loss": -12.026555061340332, "global_step": 258779, "epoch": 1540} {"train_loss": -11.824857711791992, "global_step": 258780, "epoch": 1540} {"train_loss": -11.477867126464844, "global_step": 258781, "epoch": 1540} {"train_loss": -11.924001693725586, "global_step": 258782, "epoch": 1540} {"train_loss": -12.359991073608398, "global_step": 258783, "epoch": 1540} {"train_loss": -11.667780876159668, "global_step": 258784, "epoch": 1540} {"train_loss": -11.93560791015625, "global_step": 258785, "epoch": 1540} {"train_loss": -12.08466625213623, "global_step": 258786, "epoch": 1540} {"train_loss": -11.778865814208984, "global_step": 258787, "epoch": 1540} {"train_loss": -12.139812469482422, "global_step": 258788, "epoch": 1540} {"train_loss": -11.970291137695312, "global_step": 258789, "epoch": 1540} {"train_loss": -11.50063419342041, "global_step": 258790, "epoch": 1540} {"train_loss": -11.276987075805664, "global_step": 258791, "epoch": 1540} {"train_loss": -11.777180671691895, "global_step": 258792, "epoch": 1540} {"train_loss": -11.910030364990234, "global_step": 258793, "epoch": 1540} {"train_loss": -11.775174140930176, "global_step": 258794, "epoch": 1540} {"train_loss": -11.844358444213867, "global_step": 258795, "epoch": 1540} {"train_loss": -11.858884811401367, "global_step": 258796, "epoch": 1540} {"train_loss": -11.627254486083984, "global_step": 258797, "epoch": 1540} {"train_loss": -11.583456039428711, "global_step": 258798, "epoch": 1540} {"train_loss": -11.994606018066406, "global_step": 258799, "epoch": 1540} {"train_loss": -11.905376434326172, "global_step": 258800, "epoch": 1540} {"train_loss": -11.235410690307617, "global_step": 258801, "epoch": 1540} {"train_loss": -11.248265266418457, "global_step": 258802, "epoch": 1540} {"train_loss": -12.036863327026367, "global_step": 258803, "epoch": 1540} {"train_loss": -11.686290740966797, "global_step": 258804, "epoch": 1540} {"train_loss": -11.33504867553711, "global_step": 258805, "epoch": 1540} {"train_loss": -11.671586990356445, "global_step": 258806, "epoch": 1540} {"train_loss": -11.986383438110352, "global_step": 258807, "epoch": 1540} {"train_loss": -11.647272109985352, "global_step": 258808, "epoch": 1540} {"train_loss": -11.353023529052734, "global_step": 258809, "epoch": 1540} {"train_loss": -11.084709167480469, "global_step": 258810, "epoch": 1540} {"train_loss": -11.68343734741211, "global_step": 258811, "epoch": 1540} {"train_loss": -11.984350204467773, "global_step": 258812, "epoch": 1540} {"train_loss": -11.906655311584473, "global_step": 258813, "epoch": 1540} {"train_loss": -11.737281799316406, "global_step": 258814, "epoch": 1540} {"train_loss": -12.113164901733398, "global_step": 258815, "epoch": 1540} {"train_loss": -11.905969619750977, "global_step": 258816, "epoch": 1540} {"train_loss": -11.962543487548828, "global_step": 258817, "epoch": 1540} {"train_loss": -12.01589584350586, "global_step": 258818, "epoch": 1540} {"train_loss": -11.733625411987305, "global_step": 258819, "epoch": 1540} {"train_loss": -11.956584930419922, "global_step": 258820, "epoch": 1540} {"train_loss": -12.002289772033691, "global_step": 258821, "epoch": 1540} {"train_loss": -11.739522933959961, "global_step": 258822, "epoch": 1540} {"train_loss": -11.710487365722656, "global_step": 258823, "epoch": 1540} {"train_loss": -11.746684074401855, "global_step": 258824, "epoch": 1540} {"train_loss": -11.330957412719727, "global_step": 258825, "epoch": 1540} {"train_loss": -11.55380630493164, "global_step": 258826, "epoch": 1540} {"train_loss": -11.779624938964844, "global_step": 258827, "epoch": 1540} {"train_loss": -11.266197204589844, "global_step": 258828, "epoch": 1540} {"train_loss": -11.882431030273438, "global_step": 258829, "epoch": 1540} {"train_loss": -11.702553749084473, "global_step": 258830, "epoch": 1540} {"train_loss": -11.900590896606445, "global_step": 258831, "epoch": 1540} {"train_loss": -12.012378692626953, "global_step": 258832, "epoch": 1540} {"train_loss": -11.653538703918457, "global_step": 258833, "epoch": 1540} {"train_loss": -11.366403579711914, "global_step": 258834, "epoch": 1540} {"train_loss": -12.007866859436035, "global_step": 258835, "epoch": 1540} {"train_loss": -11.660074234008789, "global_step": 258836, "epoch": 1540} {"train_loss": -11.975055694580078, "global_step": 258837, "epoch": 1540} {"train_loss": -11.917213439941406, "global_step": 258838, "epoch": 1540} {"train_loss": -11.565085411071777, "global_step": 258839, "epoch": 1540} {"train_loss": -11.957551956176758, "global_step": 258840, "epoch": 1540} {"train_loss": -11.413749694824219, "global_step": 258841, "epoch": 1540} {"train_loss": -11.897241592407227, "global_step": 258842, "epoch": 1540} {"train_loss": -11.969573974609375, "global_step": 258843, "epoch": 1540} {"train_loss": -11.23151683807373, "global_step": 258844, "epoch": 1540} {"train_loss": -11.534126281738281, "global_step": 258845, "epoch": 1540} {"train_loss": -11.992728233337402, "global_step": 258846, "epoch": 1540} {"train_loss": -11.66469955444336, "global_step": 258847, "epoch": 1540} {"train_loss": -11.95086669921875, "global_step": 258848, "epoch": 1540} {"train_loss": -11.665907859802246, "global_step": 258849, "epoch": 1540} {"train_loss": -11.843481063842773, "global_step": 258850, "epoch": 1540} {"train_loss": -11.654620170593262, "global_step": 258851, "epoch": 1540} {"train_loss": -11.969036102294922, "global_step": 258852, "epoch": 1540} {"train_loss": -11.681203842163086, "global_step": 258853, "epoch": 1540} {"train_loss": -11.802549362182617, "global_step": 258854, "epoch": 1540} {"train_loss": -11.648731231689453, "global_step": 258855, "epoch": 1540} {"train_loss": -11.215133666992188, "global_step": 258856, "epoch": 1540} {"train_loss": -10.810218811035156, "global_step": 258857, "epoch": 1540} {"train_loss": -11.645675659179688, "global_step": 258858, "epoch": 1540} {"train_loss": -11.599093437194824, "global_step": 258859, "epoch": 1540} {"train_loss": -11.467710494995117, "global_step": 258860, "epoch": 1540} {"train_loss": -11.684165954589844, "global_step": 258861, "epoch": 1540} {"train_loss": -11.813451766967773, "global_step": 258862, "epoch": 1540} {"train_loss": -10.707948684692383, "global_step": 258863, "epoch": 1540} {"train_loss": -11.325952529907227, "global_step": 258864, "epoch": 1540} {"train_loss": -11.759696960449219, "global_step": 258865, "epoch": 1540} {"train_loss": -10.646652221679688, "global_step": 258866, "epoch": 1540} {"train_loss": -10.216469764709473, "global_step": 258867, "epoch": 1540} {"train_loss": -11.4957914352417, "global_step": 258868, "epoch": 1540} {"train_loss": -9.884029388427734, "global_step": 258869, "epoch": 1540} {"train_loss": -11.739248275756836, "global_step": 258870, "epoch": 1540} {"train_loss": -11.38197135925293, "global_step": 258871, "epoch": 1540} {"train_loss": -11.33366870880127, "global_step": 258872, "epoch": 1540} {"train_loss": -11.676653861999512, "global_step": 258873, "epoch": 1540} {"train_loss": -11.236291885375977, "global_step": 258874, "epoch": 1540} {"train_loss": -11.873390197753906, "global_step": 258875, "epoch": 1540} {"train_loss": -11.3652925491333, "global_step": 258876, "epoch": 1540} {"train_loss": -11.79715633392334, "global_step": 258877, "epoch": 1540} {"train_loss": -11.671761512756348, "global_step": 258878, "epoch": 1540} {"train_loss": -11.432418823242188, "global_step": 258879, "epoch": 1540} {"train_loss": -11.545543670654297, "global_step": 258880, "epoch": 1540} {"train_loss": -11.589799880981445, "global_step": 258881, "epoch": 1540} {"train_loss": -11.799848556518555, "global_step": 258882, "epoch": 1540} {"train_loss": -11.12863826751709, "global_step": 258883, "epoch": 1540} {"train_loss": -11.82019329071045, "global_step": 258884, "epoch": 1540} {"train_loss": -11.337407112121582, "global_step": 258885, "epoch": 1540} {"train_loss": -11.517955780029297, "global_step": 258886, "epoch": 1540} {"train_loss": -11.671366362344651, "global_step": 258887, "epoch": 1540, "val_loss": 266450.78125, "train_action_mse_error": 3.7250418663024902} {"train_loss": -11.410985946655273, "global_step": 258888, "epoch": 1541} {"train_loss": -11.473939895629883, "global_step": 258889, "epoch": 1541} {"train_loss": -11.787166595458984, "global_step": 258890, "epoch": 1541} {"train_loss": -11.761302947998047, "global_step": 258891, "epoch": 1541} {"train_loss": -11.575660705566406, "global_step": 258892, "epoch": 1541} {"train_loss": -11.426074028015137, "global_step": 258893, "epoch": 1541} {"train_loss": -11.027477264404297, "global_step": 258894, "epoch": 1541} {"train_loss": -11.845455169677734, "global_step": 258895, "epoch": 1541} {"train_loss": -11.415838241577148, "global_step": 258896, "epoch": 1541} {"train_loss": -11.467978477478027, "global_step": 258897, "epoch": 1541} {"train_loss": -11.784737586975098, "global_step": 258898, "epoch": 1541} {"train_loss": -11.200858116149902, "global_step": 258899, "epoch": 1541} {"train_loss": -11.592846870422363, "global_step": 258900, "epoch": 1541} {"train_loss": -10.746773719787598, "global_step": 258901, "epoch": 1541} {"train_loss": -10.944862365722656, "global_step": 258902, "epoch": 1541} {"train_loss": -11.338020324707031, "global_step": 258903, "epoch": 1541} {"train_loss": -11.220909118652344, "global_step": 258904, "epoch": 1541} {"train_loss": -11.558107376098633, "global_step": 258905, "epoch": 1541} {"train_loss": -11.391729354858398, "global_step": 258906, "epoch": 1541} {"train_loss": -11.46778678894043, "global_step": 258907, "epoch": 1541} {"train_loss": -11.90190315246582, "global_step": 258908, "epoch": 1541} {"train_loss": -11.174966812133789, "global_step": 258909, "epoch": 1541} {"train_loss": -11.432210922241211, "global_step": 258910, "epoch": 1541} {"train_loss": -11.640056610107422, "global_step": 258911, "epoch": 1541} {"train_loss": -11.370260238647461, "global_step": 258912, "epoch": 1541} {"train_loss": -11.771740913391113, "global_step": 258913, "epoch": 1541} {"train_loss": -11.417023658752441, "global_step": 258914, "epoch": 1541} {"train_loss": -11.878941535949707, "global_step": 258915, "epoch": 1541} {"train_loss": -11.890294075012207, "global_step": 258916, "epoch": 1541} {"train_loss": -11.71040153503418, "global_step": 258917, "epoch": 1541} {"train_loss": -12.00789737701416, "global_step": 258918, "epoch": 1541} {"train_loss": -11.571844100952148, "global_step": 258919, "epoch": 1541} {"train_loss": -11.81025505065918, "global_step": 258920, "epoch": 1541} {"train_loss": -11.812921524047852, "global_step": 258921, "epoch": 1541} {"train_loss": -11.48309326171875, "global_step": 258922, "epoch": 1541} {"train_loss": -11.673456192016602, "global_step": 258923, "epoch": 1541} {"train_loss": -11.841035842895508, "global_step": 258924, "epoch": 1541} {"train_loss": -11.829795837402344, "global_step": 258925, "epoch": 1541} {"train_loss": -11.775995254516602, "global_step": 258926, "epoch": 1541} {"train_loss": -11.751359939575195, "global_step": 258927, "epoch": 1541} {"train_loss": -12.02322006225586, "global_step": 258928, "epoch": 1541} {"train_loss": -11.875663757324219, "global_step": 258929, "epoch": 1541} {"train_loss": -11.78408432006836, "global_step": 258930, "epoch": 1541} {"train_loss": -12.022851943969727, "global_step": 258931, "epoch": 1541} {"train_loss": -11.521747589111328, "global_step": 258932, "epoch": 1541} {"train_loss": -11.687772750854492, "global_step": 258933, "epoch": 1541} {"train_loss": -11.946473121643066, "global_step": 258934, "epoch": 1541} {"train_loss": -11.82178783416748, "global_step": 258935, "epoch": 1541} {"train_loss": -11.937493324279785, "global_step": 258936, "epoch": 1541} {"train_loss": -11.92251205444336, "global_step": 258937, "epoch": 1541} {"train_loss": -11.924001693725586, "global_step": 258938, "epoch": 1541} {"train_loss": -12.029481887817383, "global_step": 258939, "epoch": 1541} {"train_loss": -11.922529220581055, "global_step": 258940, "epoch": 1541} {"train_loss": -12.092998504638672, "global_step": 258941, "epoch": 1541} {"train_loss": -12.04993724822998, "global_step": 258942, "epoch": 1541} {"train_loss": -11.986452102661133, "global_step": 258943, "epoch": 1541} {"train_loss": -12.112188339233398, "global_step": 258944, "epoch": 1541} {"train_loss": -12.015725135803223, "global_step": 258945, "epoch": 1541} {"train_loss": -12.103242874145508, "global_step": 258946, "epoch": 1541} {"train_loss": -11.774829864501953, "global_step": 258947, "epoch": 1541} {"train_loss": -11.489442825317383, "global_step": 258948, "epoch": 1541} {"train_loss": -11.800580024719238, "global_step": 258949, "epoch": 1541} {"train_loss": -11.77169132232666, "global_step": 258950, "epoch": 1541} {"train_loss": -11.680503845214844, "global_step": 258951, "epoch": 1541} {"train_loss": -11.839609146118164, "global_step": 258952, "epoch": 1541} {"train_loss": -11.91871452331543, "global_step": 258953, "epoch": 1541} {"train_loss": -11.751213073730469, "global_step": 258954, "epoch": 1541} {"train_loss": -12.051603317260742, "global_step": 258955, "epoch": 1541} {"train_loss": -11.634453773498535, "global_step": 258956, "epoch": 1541} {"train_loss": -11.988985061645508, "global_step": 258957, "epoch": 1541} {"train_loss": -11.922937393188477, "global_step": 258958, "epoch": 1541} {"train_loss": -11.98063850402832, "global_step": 258959, "epoch": 1541} {"train_loss": -12.133512496948242, "global_step": 258960, "epoch": 1541} {"train_loss": -12.021207809448242, "global_step": 258961, "epoch": 1541} {"train_loss": -11.810201644897461, "global_step": 258962, "epoch": 1541} {"train_loss": -12.185464859008789, "global_step": 258963, "epoch": 1541} {"train_loss": -11.773079872131348, "global_step": 258964, "epoch": 1541} {"train_loss": -12.067370414733887, "global_step": 258965, "epoch": 1541} {"train_loss": -12.006562232971191, "global_step": 258966, "epoch": 1541} {"train_loss": -12.210274696350098, "global_step": 258967, "epoch": 1541} {"train_loss": -12.089624404907227, "global_step": 258968, "epoch": 1541} {"train_loss": -12.210943222045898, "global_step": 258969, "epoch": 1541} {"train_loss": -12.128250122070312, "global_step": 258970, "epoch": 1541} {"train_loss": -12.024932861328125, "global_step": 258971, "epoch": 1541} {"train_loss": -12.121413230895996, "global_step": 258972, "epoch": 1541} {"train_loss": -12.338375091552734, "global_step": 258973, "epoch": 1541} {"train_loss": -12.258745193481445, "global_step": 258974, "epoch": 1541} {"train_loss": -12.168469429016113, "global_step": 258975, "epoch": 1541} {"train_loss": -12.036934852600098, "global_step": 258976, "epoch": 1541} {"train_loss": -12.245697021484375, "global_step": 258977, "epoch": 1541} {"train_loss": -11.776055335998535, "global_step": 258978, "epoch": 1541} {"train_loss": -11.708436012268066, "global_step": 258979, "epoch": 1541} {"train_loss": -11.227856636047363, "global_step": 258980, "epoch": 1541} {"train_loss": -11.586551666259766, "global_step": 258981, "epoch": 1541} {"train_loss": -11.97633171081543, "global_step": 258982, "epoch": 1541} {"train_loss": -12.032918930053711, "global_step": 258983, "epoch": 1541} {"train_loss": -11.737617492675781, "global_step": 258984, "epoch": 1541} {"train_loss": -11.499813079833984, "global_step": 258985, "epoch": 1541} {"train_loss": -11.806163787841797, "global_step": 258986, "epoch": 1541} {"train_loss": -12.204423904418945, "global_step": 258987, "epoch": 1541} {"train_loss": -12.270240783691406, "global_step": 258988, "epoch": 1541} {"train_loss": -12.126717567443848, "global_step": 258989, "epoch": 1541} {"train_loss": -12.242061614990234, "global_step": 258990, "epoch": 1541} {"train_loss": -11.41148567199707, "global_step": 258991, "epoch": 1541} {"train_loss": -12.049951553344727, "global_step": 258992, "epoch": 1541} {"train_loss": -11.960060119628906, "global_step": 258993, "epoch": 1541} {"train_loss": -11.691242218017578, "global_step": 258994, "epoch": 1541} {"train_loss": -11.701873779296875, "global_step": 258995, "epoch": 1541} {"train_loss": -11.971414566040039, "global_step": 258996, "epoch": 1541} {"train_loss": -11.381807327270508, "global_step": 258997, "epoch": 1541} {"train_loss": -11.518467903137207, "global_step": 258998, "epoch": 1541} {"train_loss": -11.518620491027832, "global_step": 258999, "epoch": 1541} {"train_loss": -10.331588745117188, "global_step": 259000, "epoch": 1541} {"train_loss": -10.214212417602539, "global_step": 259001, "epoch": 1541} {"train_loss": -10.940885543823242, "global_step": 259002, "epoch": 1541} {"train_loss": -9.144218444824219, "global_step": 259003, "epoch": 1541} {"train_loss": -10.68597412109375, "global_step": 259004, "epoch": 1541} {"train_loss": -9.746771812438965, "global_step": 259005, "epoch": 1541} {"train_loss": -9.059744834899902, "global_step": 259006, "epoch": 1541} {"train_loss": -8.813542366027832, "global_step": 259007, "epoch": 1541} {"train_loss": -9.63627815246582, "global_step": 259008, "epoch": 1541} {"train_loss": -8.465639114379883, "global_step": 259009, "epoch": 1541} {"train_loss": -10.723678588867188, "global_step": 259010, "epoch": 1541} {"train_loss": -9.454273223876953, "global_step": 259011, "epoch": 1541} {"train_loss": -10.301979064941406, "global_step": 259012, "epoch": 1541} {"train_loss": -10.264041900634766, "global_step": 259013, "epoch": 1541} {"train_loss": -8.926167488098145, "global_step": 259014, "epoch": 1541} {"train_loss": -9.996806144714355, "global_step": 259015, "epoch": 1541} {"train_loss": -9.923133850097656, "global_step": 259016, "epoch": 1541} {"train_loss": -8.850696563720703, "global_step": 259017, "epoch": 1541} {"train_loss": -11.068370819091797, "global_step": 259018, "epoch": 1541} {"train_loss": -10.249555587768555, "global_step": 259019, "epoch": 1541} {"train_loss": -9.85379695892334, "global_step": 259020, "epoch": 1541} {"train_loss": -11.162948608398438, "global_step": 259021, "epoch": 1541} {"train_loss": -9.992302894592285, "global_step": 259022, "epoch": 1541} {"train_loss": -10.372886657714844, "global_step": 259023, "epoch": 1541} {"train_loss": -11.091594696044922, "global_step": 259024, "epoch": 1541} {"train_loss": -10.432097434997559, "global_step": 259025, "epoch": 1541} {"train_loss": -11.111804962158203, "global_step": 259026, "epoch": 1541} {"train_loss": -10.516302108764648, "global_step": 259027, "epoch": 1541} {"train_loss": -10.926015853881836, "global_step": 259028, "epoch": 1541} {"train_loss": -11.203267097473145, "global_step": 259029, "epoch": 1541} {"train_loss": -10.8546142578125, "global_step": 259030, "epoch": 1541} {"train_loss": -11.074068069458008, "global_step": 259031, "epoch": 1541} {"train_loss": -10.755607604980469, "global_step": 259032, "epoch": 1541} {"train_loss": -10.697317123413086, "global_step": 259033, "epoch": 1541} {"train_loss": -10.850069046020508, "global_step": 259034, "epoch": 1541} {"train_loss": -10.964988708496094, "global_step": 259035, "epoch": 1541} {"train_loss": -11.24338150024414, "global_step": 259036, "epoch": 1541} {"train_loss": -11.389617919921875, "global_step": 259037, "epoch": 1541} {"train_loss": -11.091243743896484, "global_step": 259038, "epoch": 1541} {"train_loss": -11.510481834411621, "global_step": 259039, "epoch": 1541} {"train_loss": -10.690922737121582, "global_step": 259040, "epoch": 1541} {"train_loss": -11.709447860717773, "global_step": 259041, "epoch": 1541} {"train_loss": -10.63619327545166, "global_step": 259042, "epoch": 1541} {"train_loss": -11.544833183288574, "global_step": 259043, "epoch": 1541} {"train_loss": -11.388381958007812, "global_step": 259044, "epoch": 1541} {"train_loss": -11.313409805297852, "global_step": 259045, "epoch": 1541} {"train_loss": -11.5654935836792, "global_step": 259046, "epoch": 1541} {"train_loss": -11.693790435791016, "global_step": 259047, "epoch": 1541} {"train_loss": -11.125201225280762, "global_step": 259048, "epoch": 1541} {"train_loss": -11.388666152954102, "global_step": 259049, "epoch": 1541} {"train_loss": -11.631830215454102, "global_step": 259050, "epoch": 1541} {"train_loss": -11.521598815917969, "global_step": 259051, "epoch": 1541} {"train_loss": -11.517192840576172, "global_step": 259052, "epoch": 1541} {"train_loss": -11.82946491241455, "global_step": 259053, "epoch": 1541} {"train_loss": -11.460844993591309, "global_step": 259054, "epoch": 1541} {"train_loss": -11.407360309646243, "global_step": 259055, "epoch": 1541, "val_loss": 272816.90625} {"train_loss": -11.610440254211426, "global_step": 259056, "epoch": 1542} {"train_loss": -11.518365859985352, "global_step": 259057, "epoch": 1542} {"train_loss": -11.770002365112305, "global_step": 259058, "epoch": 1542} {"train_loss": -11.58180046081543, "global_step": 259059, "epoch": 1542} {"train_loss": -11.622989654541016, "global_step": 259060, "epoch": 1542} {"train_loss": -11.67520523071289, "global_step": 259061, "epoch": 1542} {"train_loss": -11.849531173706055, "global_step": 259062, "epoch": 1542} {"train_loss": -11.443821907043457, "global_step": 259063, "epoch": 1542} {"train_loss": -11.972511291503906, "global_step": 259064, "epoch": 1542} {"train_loss": -11.682016372680664, "global_step": 259065, "epoch": 1542} {"train_loss": -11.907438278198242, "global_step": 259066, "epoch": 1542} {"train_loss": -11.773181915283203, "global_step": 259067, "epoch": 1542} {"train_loss": -11.967365264892578, "global_step": 259068, "epoch": 1542} {"train_loss": -11.842180252075195, "global_step": 259069, "epoch": 1542} {"train_loss": -11.913246154785156, "global_step": 259070, "epoch": 1542} {"train_loss": -11.831300735473633, "global_step": 259071, "epoch": 1542} {"train_loss": -11.923788070678711, "global_step": 259072, "epoch": 1542} {"train_loss": -11.940185546875, "global_step": 259073, "epoch": 1542} {"train_loss": -12.052282333374023, "global_step": 259074, "epoch": 1542} {"train_loss": -11.942069053649902, "global_step": 259075, "epoch": 1542} {"train_loss": -11.956235885620117, "global_step": 259076, "epoch": 1542} {"train_loss": -11.957303047180176, "global_step": 259077, "epoch": 1542} {"train_loss": -11.869836807250977, "global_step": 259078, "epoch": 1542} {"train_loss": -11.764116287231445, "global_step": 259079, "epoch": 1542} {"train_loss": -11.993764877319336, "global_step": 259080, "epoch": 1542} {"train_loss": -11.756772994995117, "global_step": 259081, "epoch": 1542} {"train_loss": -12.0386323928833, "global_step": 259082, "epoch": 1542} {"train_loss": -11.771318435668945, "global_step": 259083, "epoch": 1542} {"train_loss": -12.025009155273438, "global_step": 259084, "epoch": 1542} {"train_loss": -11.872440338134766, "global_step": 259085, "epoch": 1542} {"train_loss": -11.938501358032227, "global_step": 259086, "epoch": 1542} {"train_loss": -11.704646110534668, "global_step": 259087, "epoch": 1542} {"train_loss": -11.902353286743164, "global_step": 259088, "epoch": 1542} {"train_loss": -11.706478118896484, "global_step": 259089, "epoch": 1542} {"train_loss": -11.922656059265137, "global_step": 259090, "epoch": 1542} {"train_loss": -11.46512222290039, "global_step": 259091, "epoch": 1542} {"train_loss": -11.867734909057617, "global_step": 259092, "epoch": 1542} {"train_loss": -11.47346019744873, "global_step": 259093, "epoch": 1542} {"train_loss": -12.172595024108887, "global_step": 259094, "epoch": 1542} {"train_loss": -11.572771072387695, "global_step": 259095, "epoch": 1542} {"train_loss": -11.960039138793945, "global_step": 259096, "epoch": 1542} {"train_loss": -11.869840621948242, "global_step": 259097, "epoch": 1542} {"train_loss": -11.89537239074707, "global_step": 259098, "epoch": 1542} {"train_loss": -12.162203788757324, "global_step": 259099, "epoch": 1542} {"train_loss": -12.039575576782227, "global_step": 259100, "epoch": 1542} {"train_loss": -12.196672439575195, "global_step": 259101, "epoch": 1542} {"train_loss": -12.008499145507812, "global_step": 259102, "epoch": 1542} {"train_loss": -11.907292366027832, "global_step": 259103, "epoch": 1542} {"train_loss": -12.089824676513672, "global_step": 259104, "epoch": 1542} {"train_loss": -12.117964744567871, "global_step": 259105, "epoch": 1542} {"train_loss": -11.867612838745117, "global_step": 259106, "epoch": 1542} {"train_loss": -11.810056686401367, "global_step": 259107, "epoch": 1542} {"train_loss": -12.173726081848145, "global_step": 259108, "epoch": 1542} {"train_loss": -12.080259323120117, "global_step": 259109, "epoch": 1542} {"train_loss": -12.285682678222656, "global_step": 259110, "epoch": 1542} {"train_loss": -11.97592544555664, "global_step": 259111, "epoch": 1542} {"train_loss": -12.202211380004883, "global_step": 259112, "epoch": 1542} {"train_loss": -12.257323265075684, "global_step": 259113, "epoch": 1542} {"train_loss": -12.078275680541992, "global_step": 259114, "epoch": 1542} {"train_loss": -12.331750869750977, "global_step": 259115, "epoch": 1542} {"train_loss": -12.2274169921875, "global_step": 259116, "epoch": 1542} {"train_loss": -12.192765235900879, "global_step": 259117, "epoch": 1542} {"train_loss": -12.38217544555664, "global_step": 259118, "epoch": 1542} {"train_loss": -12.136205673217773, "global_step": 259119, "epoch": 1542} {"train_loss": -12.427197456359863, "global_step": 259120, "epoch": 1542} {"train_loss": -12.300287246704102, "global_step": 259121, "epoch": 1542} {"train_loss": -12.066125869750977, "global_step": 259122, "epoch": 1542} {"train_loss": -12.437087059020996, "global_step": 259123, "epoch": 1542} {"train_loss": -12.304750442504883, "global_step": 259124, "epoch": 1542} {"train_loss": -12.410226821899414, "global_step": 259125, "epoch": 1542} {"train_loss": -12.110788345336914, "global_step": 259126, "epoch": 1542} {"train_loss": -12.326725006103516, "global_step": 259127, "epoch": 1542} {"train_loss": -11.625129699707031, "global_step": 259128, "epoch": 1542} {"train_loss": -11.664877891540527, "global_step": 259129, "epoch": 1542} {"train_loss": -11.962713241577148, "global_step": 259130, "epoch": 1542} {"train_loss": -12.290040016174316, "global_step": 259131, "epoch": 1542} {"train_loss": -11.498860359191895, "global_step": 259132, "epoch": 1542} {"train_loss": -11.18549633026123, "global_step": 259133, "epoch": 1542} {"train_loss": -11.37568473815918, "global_step": 259134, "epoch": 1542} {"train_loss": -11.442867279052734, "global_step": 259135, "epoch": 1542} {"train_loss": -11.462360382080078, "global_step": 259136, "epoch": 1542} {"train_loss": -11.3126220703125, "global_step": 259137, "epoch": 1542} {"train_loss": -10.948282241821289, "global_step": 259138, "epoch": 1542} {"train_loss": -11.18746566772461, "global_step": 259139, "epoch": 1542} {"train_loss": -9.885703086853027, "global_step": 259140, "epoch": 1542} {"train_loss": -11.481121063232422, "global_step": 259141, "epoch": 1542} {"train_loss": -10.121796607971191, "global_step": 259142, "epoch": 1542} {"train_loss": -11.45411491394043, "global_step": 259143, "epoch": 1542} {"train_loss": -10.049772262573242, "global_step": 259144, "epoch": 1542} {"train_loss": -10.87987995147705, "global_step": 259145, "epoch": 1542} {"train_loss": -9.777774810791016, "global_step": 259146, "epoch": 1542} {"train_loss": -9.835908889770508, "global_step": 259147, "epoch": 1542} {"train_loss": -11.040451049804688, "global_step": 259148, "epoch": 1542} {"train_loss": -9.120922088623047, "global_step": 259149, "epoch": 1542} {"train_loss": -9.547155380249023, "global_step": 259150, "epoch": 1542} {"train_loss": -11.639206886291504, "global_step": 259151, "epoch": 1542} {"train_loss": -10.11460018157959, "global_step": 259152, "epoch": 1542} {"train_loss": -11.041106224060059, "global_step": 259153, "epoch": 1542} {"train_loss": -11.181070327758789, "global_step": 259154, "epoch": 1542} {"train_loss": -10.212509155273438, "global_step": 259155, "epoch": 1542} {"train_loss": -11.514939308166504, "global_step": 259156, "epoch": 1542} {"train_loss": -11.161746978759766, "global_step": 259157, "epoch": 1542} {"train_loss": -10.882743835449219, "global_step": 259158, "epoch": 1542} {"train_loss": -10.289773941040039, "global_step": 259159, "epoch": 1542} {"train_loss": -10.870951652526855, "global_step": 259160, "epoch": 1542} {"train_loss": -11.075460433959961, "global_step": 259161, "epoch": 1542} {"train_loss": -10.643255233764648, "global_step": 259162, "epoch": 1542} {"train_loss": -10.857247352600098, "global_step": 259163, "epoch": 1542} {"train_loss": -10.557921409606934, "global_step": 259164, "epoch": 1542} {"train_loss": -10.776142120361328, "global_step": 259165, "epoch": 1542} {"train_loss": -10.27673053741455, "global_step": 259166, "epoch": 1542} {"train_loss": -11.232034683227539, "global_step": 259167, "epoch": 1542} {"train_loss": -11.598291397094727, "global_step": 259168, "epoch": 1542} {"train_loss": -10.587140083312988, "global_step": 259169, "epoch": 1542} {"train_loss": -10.861200332641602, "global_step": 259170, "epoch": 1542} {"train_loss": -10.501195907592773, "global_step": 259171, "epoch": 1542} {"train_loss": -10.884124755859375, "global_step": 259172, "epoch": 1542} {"train_loss": -11.602066993713379, "global_step": 259173, "epoch": 1542} {"train_loss": -11.637669563293457, "global_step": 259174, "epoch": 1542} {"train_loss": -11.275787353515625, "global_step": 259175, "epoch": 1542} {"train_loss": -11.732186317443848, "global_step": 259176, "epoch": 1542} {"train_loss": -11.340958595275879, "global_step": 259177, "epoch": 1542} {"train_loss": -11.348152160644531, "global_step": 259178, "epoch": 1542} {"train_loss": -11.572742462158203, "global_step": 259179, "epoch": 1542} {"train_loss": -11.523423194885254, "global_step": 259180, "epoch": 1542} {"train_loss": -11.713829040527344, "global_step": 259181, "epoch": 1542} {"train_loss": -11.524547576904297, "global_step": 259182, "epoch": 1542} {"train_loss": -11.53319263458252, "global_step": 259183, "epoch": 1542} {"train_loss": -11.738183975219727, "global_step": 259184, "epoch": 1542} {"train_loss": -11.640853881835938, "global_step": 259185, "epoch": 1542} {"train_loss": -11.524547576904297, "global_step": 259186, "epoch": 1542} {"train_loss": -11.617504119873047, "global_step": 259187, "epoch": 1542} {"train_loss": -11.585222244262695, "global_step": 259188, "epoch": 1542} {"train_loss": -11.763874053955078, "global_step": 259189, "epoch": 1542} {"train_loss": -11.502344131469727, "global_step": 259190, "epoch": 1542} {"train_loss": -11.744231224060059, "global_step": 259191, "epoch": 1542} {"train_loss": -11.665831565856934, "global_step": 259192, "epoch": 1542} {"train_loss": -11.64779281616211, "global_step": 259193, "epoch": 1542} {"train_loss": -11.632177352905273, "global_step": 259194, "epoch": 1542} {"train_loss": -11.83808708190918, "global_step": 259195, "epoch": 1542} {"train_loss": -11.819722175598145, "global_step": 259196, "epoch": 1542} {"train_loss": -11.699777603149414, "global_step": 259197, "epoch": 1542} {"train_loss": -11.854082107543945, "global_step": 259198, "epoch": 1542} {"train_loss": -11.97624397277832, "global_step": 259199, "epoch": 1542} {"train_loss": -11.812225341796875, "global_step": 259200, "epoch": 1542} {"train_loss": -11.874368667602539, "global_step": 259201, "epoch": 1542} {"train_loss": -11.827799797058105, "global_step": 259202, "epoch": 1542} {"train_loss": -11.789179801940918, "global_step": 259203, "epoch": 1542} {"train_loss": -11.81041145324707, "global_step": 259204, "epoch": 1542} {"train_loss": -12.027631759643555, "global_step": 259205, "epoch": 1542} {"train_loss": -11.855566024780273, "global_step": 259206, "epoch": 1542} {"train_loss": -12.008529663085938, "global_step": 259207, "epoch": 1542} {"train_loss": -11.796295166015625, "global_step": 259208, "epoch": 1542} {"train_loss": -11.967180252075195, "global_step": 259209, "epoch": 1542} {"train_loss": -11.91002082824707, "global_step": 259210, "epoch": 1542} {"train_loss": -12.129164695739746, "global_step": 259211, "epoch": 1542} {"train_loss": -12.11007022857666, "global_step": 259212, "epoch": 1542} {"train_loss": -12.035633087158203, "global_step": 259213, "epoch": 1542} {"train_loss": -11.872781753540039, "global_step": 259214, "epoch": 1542} {"train_loss": -12.003787994384766, "global_step": 259215, "epoch": 1542} {"train_loss": -11.97634506225586, "global_step": 259216, "epoch": 1542} {"train_loss": -11.908161163330078, "global_step": 259217, "epoch": 1542} {"train_loss": -12.147812843322754, "global_step": 259218, "epoch": 1542} {"train_loss": -11.898591995239258, "global_step": 259219, "epoch": 1542} {"train_loss": -12.048583030700684, "global_step": 259220, "epoch": 1542} {"train_loss": -11.84402847290039, "global_step": 259221, "epoch": 1542} {"train_loss": -11.969406127929688, "global_step": 259222, "epoch": 1542} {"train_loss": -11.61602320557549, "global_step": 259223, "epoch": 1542, "val_loss": 272750.53125} {"train_loss": -12.01673698425293, "global_step": 259224, "epoch": 1543} {"train_loss": -12.165582656860352, "global_step": 259225, "epoch": 1543} {"train_loss": -12.19268798828125, "global_step": 259226, "epoch": 1543} {"train_loss": -12.24984359741211, "global_step": 259227, "epoch": 1543} {"train_loss": -12.155651092529297, "global_step": 259228, "epoch": 1543} {"train_loss": -12.013833999633789, "global_step": 259229, "epoch": 1543} {"train_loss": -12.024177551269531, "global_step": 259230, "epoch": 1543} {"train_loss": -12.171544075012207, "global_step": 259231, "epoch": 1543} {"train_loss": -12.02529525756836, "global_step": 259232, "epoch": 1543} {"train_loss": -12.095657348632812, "global_step": 259233, "epoch": 1543} {"train_loss": -12.137510299682617, "global_step": 259234, "epoch": 1543} {"train_loss": -11.974773406982422, "global_step": 259235, "epoch": 1543} {"train_loss": -11.926578521728516, "global_step": 259236, "epoch": 1543} {"train_loss": -11.873538970947266, "global_step": 259237, "epoch": 1543} {"train_loss": -11.938294410705566, "global_step": 259238, "epoch": 1543} {"train_loss": -12.304306030273438, "global_step": 259239, "epoch": 1543} {"train_loss": -11.99759578704834, "global_step": 259240, "epoch": 1543} {"train_loss": -11.927925109863281, "global_step": 259241, "epoch": 1543} {"train_loss": -11.777371406555176, "global_step": 259242, "epoch": 1543} {"train_loss": -11.986407279968262, "global_step": 259243, "epoch": 1543} {"train_loss": -12.159760475158691, "global_step": 259244, "epoch": 1543} {"train_loss": -11.954633712768555, "global_step": 259245, "epoch": 1543} {"train_loss": -12.2742919921875, "global_step": 259246, "epoch": 1543} {"train_loss": -11.792837142944336, "global_step": 259247, "epoch": 1543} {"train_loss": -11.949785232543945, "global_step": 259248, "epoch": 1543} {"train_loss": -12.263188362121582, "global_step": 259249, "epoch": 1543} {"train_loss": -12.16333293914795, "global_step": 259250, "epoch": 1543} {"train_loss": -12.239200592041016, "global_step": 259251, "epoch": 1543} {"train_loss": -12.188663482666016, "global_step": 259252, "epoch": 1543} {"train_loss": -12.076215744018555, "global_step": 259253, "epoch": 1543} {"train_loss": -12.157855987548828, "global_step": 259254, "epoch": 1543} {"train_loss": -12.052507400512695, "global_step": 259255, "epoch": 1543} {"train_loss": -11.970815658569336, "global_step": 259256, "epoch": 1543} {"train_loss": -11.87478256225586, "global_step": 259257, "epoch": 1543} {"train_loss": -12.143826484680176, "global_step": 259258, "epoch": 1543} {"train_loss": -11.919187545776367, "global_step": 259259, "epoch": 1543} {"train_loss": -11.93246841430664, "global_step": 259260, "epoch": 1543} {"train_loss": -11.92208480834961, "global_step": 259261, "epoch": 1543} {"train_loss": -11.92216682434082, "global_step": 259262, "epoch": 1543} {"train_loss": -11.585375785827637, "global_step": 259263, "epoch": 1543} {"train_loss": -11.410898208618164, "global_step": 259264, "epoch": 1543} {"train_loss": -11.307868957519531, "global_step": 259265, "epoch": 1543} {"train_loss": -11.42204475402832, "global_step": 259266, "epoch": 1543} {"train_loss": -11.735173225402832, "global_step": 259267, "epoch": 1543} {"train_loss": -11.38004207611084, "global_step": 259268, "epoch": 1543} {"train_loss": -9.964614868164062, "global_step": 259269, "epoch": 1543} {"train_loss": -10.298913955688477, "global_step": 259270, "epoch": 1543} {"train_loss": -8.201606750488281, "global_step": 259271, "epoch": 1543} {"train_loss": -8.8521089553833, "global_step": 259272, "epoch": 1543} {"train_loss": -8.744304656982422, "global_step": 259273, "epoch": 1543} {"train_loss": -9.712298393249512, "global_step": 259274, "epoch": 1543} {"train_loss": -9.143213272094727, "global_step": 259275, "epoch": 1543} {"train_loss": -9.776533126831055, "global_step": 259276, "epoch": 1543} {"train_loss": -9.838955879211426, "global_step": 259277, "epoch": 1543} {"train_loss": -9.548303604125977, "global_step": 259278, "epoch": 1543} {"train_loss": -8.677978515625, "global_step": 259279, "epoch": 1543} {"train_loss": -11.0706787109375, "global_step": 259280, "epoch": 1543} {"train_loss": -7.967373847961426, "global_step": 259281, "epoch": 1543} {"train_loss": -10.482154846191406, "global_step": 259282, "epoch": 1543} {"train_loss": -10.163288116455078, "global_step": 259283, "epoch": 1543} {"train_loss": -10.134296417236328, "global_step": 259284, "epoch": 1543} {"train_loss": -10.173332214355469, "global_step": 259285, "epoch": 1543} {"train_loss": -10.803010940551758, "global_step": 259286, "epoch": 1543} {"train_loss": -10.472343444824219, "global_step": 259287, "epoch": 1543} {"train_loss": -11.346023559570312, "global_step": 259288, "epoch": 1543} {"train_loss": -10.904134750366211, "global_step": 259289, "epoch": 1543} {"train_loss": -10.97412109375, "global_step": 259290, "epoch": 1543} {"train_loss": -11.462069511413574, "global_step": 259291, "epoch": 1543} {"train_loss": -11.040172576904297, "global_step": 259292, "epoch": 1543} {"train_loss": -11.362491607666016, "global_step": 259293, "epoch": 1543} {"train_loss": -11.56915283203125, "global_step": 259294, "epoch": 1543} {"train_loss": -11.051051139831543, "global_step": 259295, "epoch": 1543} {"train_loss": -11.67558765411377, "global_step": 259296, "epoch": 1543} {"train_loss": -11.672223091125488, "global_step": 259297, "epoch": 1543} {"train_loss": -11.353978157043457, "global_step": 259298, "epoch": 1543} {"train_loss": -11.72962760925293, "global_step": 259299, "epoch": 1543} {"train_loss": -11.554676055908203, "global_step": 259300, "epoch": 1543} {"train_loss": -11.373915672302246, "global_step": 259301, "epoch": 1543} {"train_loss": -11.53219985961914, "global_step": 259302, "epoch": 1543} {"train_loss": -11.647107124328613, "global_step": 259303, "epoch": 1543} {"train_loss": -11.275718688964844, "global_step": 259304, "epoch": 1543} {"train_loss": -11.542929649353027, "global_step": 259305, "epoch": 1543} {"train_loss": -11.603107452392578, "global_step": 259306, "epoch": 1543} {"train_loss": -11.625293731689453, "global_step": 259307, "epoch": 1543} {"train_loss": -11.775060653686523, "global_step": 259308, "epoch": 1543} {"train_loss": -11.3917818069458, "global_step": 259309, "epoch": 1543} {"train_loss": -11.56750202178955, "global_step": 259310, "epoch": 1543} {"train_loss": -11.764068603515625, "global_step": 259311, "epoch": 1543} {"train_loss": -12.112862586975098, "global_step": 259312, "epoch": 1543} {"train_loss": -11.846511840820312, "global_step": 259313, "epoch": 1543} {"train_loss": -11.793049812316895, "global_step": 259314, "epoch": 1543} {"train_loss": -11.801040649414062, "global_step": 259315, "epoch": 1543} {"train_loss": -11.816533088684082, "global_step": 259316, "epoch": 1543} {"train_loss": -11.739633560180664, "global_step": 259317, "epoch": 1543} {"train_loss": -11.767871856689453, "global_step": 259318, "epoch": 1543} {"train_loss": -11.956668853759766, "global_step": 259319, "epoch": 1543} {"train_loss": -11.962625503540039, "global_step": 259320, "epoch": 1543} {"train_loss": -11.834700584411621, "global_step": 259321, "epoch": 1543} {"train_loss": -11.619000434875488, "global_step": 259322, "epoch": 1543} {"train_loss": -11.925378799438477, "global_step": 259323, "epoch": 1543} {"train_loss": -11.57918643951416, "global_step": 259324, "epoch": 1543} {"train_loss": -12.073006629943848, "global_step": 259325, "epoch": 1543} {"train_loss": -11.5834379196167, "global_step": 259326, "epoch": 1543} {"train_loss": -11.801918029785156, "global_step": 259327, "epoch": 1543} {"train_loss": -12.111282348632812, "global_step": 259328, "epoch": 1543} {"train_loss": -11.815366744995117, "global_step": 259329, "epoch": 1543} {"train_loss": -12.03339958190918, "global_step": 259330, "epoch": 1543} {"train_loss": -12.031229019165039, "global_step": 259331, "epoch": 1543} {"train_loss": -11.863443374633789, "global_step": 259332, "epoch": 1543} {"train_loss": -11.862663269042969, "global_step": 259333, "epoch": 1543} {"train_loss": -12.006610870361328, "global_step": 259334, "epoch": 1543} {"train_loss": -12.0123929977417, "global_step": 259335, "epoch": 1543} {"train_loss": -11.910780906677246, "global_step": 259336, "epoch": 1543} {"train_loss": -11.7555513381958, "global_step": 259337, "epoch": 1543} {"train_loss": -12.131307601928711, "global_step": 259338, "epoch": 1543} {"train_loss": -12.179173469543457, "global_step": 259339, "epoch": 1543} {"train_loss": -11.90179443359375, "global_step": 259340, "epoch": 1543} {"train_loss": -11.91910457611084, "global_step": 259341, "epoch": 1543} {"train_loss": -11.96322250366211, "global_step": 259342, "epoch": 1543} {"train_loss": -11.607868194580078, "global_step": 259343, "epoch": 1543} {"train_loss": -12.027618408203125, "global_step": 259344, "epoch": 1543} {"train_loss": -12.119401931762695, "global_step": 259345, "epoch": 1543} {"train_loss": -12.088708877563477, "global_step": 259346, "epoch": 1543} {"train_loss": -12.052206039428711, "global_step": 259347, "epoch": 1543} {"train_loss": -11.988530158996582, "global_step": 259348, "epoch": 1543} {"train_loss": -12.157910346984863, "global_step": 259349, "epoch": 1543} {"train_loss": -12.079835891723633, "global_step": 259350, "epoch": 1543} {"train_loss": -11.97223949432373, "global_step": 259351, "epoch": 1543} {"train_loss": -11.718219757080078, "global_step": 259352, "epoch": 1543} {"train_loss": -11.724143981933594, "global_step": 259353, "epoch": 1543} {"train_loss": -12.216339111328125, "global_step": 259354, "epoch": 1543} {"train_loss": -11.622711181640625, "global_step": 259355, "epoch": 1543} {"train_loss": -11.945927619934082, "global_step": 259356, "epoch": 1543} {"train_loss": -11.192340850830078, "global_step": 259357, "epoch": 1543} {"train_loss": -11.670696258544922, "global_step": 259358, "epoch": 1543} {"train_loss": -11.222285270690918, "global_step": 259359, "epoch": 1543} {"train_loss": -11.78866195678711, "global_step": 259360, "epoch": 1543} {"train_loss": -11.599973678588867, "global_step": 259361, "epoch": 1543} {"train_loss": -11.59599494934082, "global_step": 259362, "epoch": 1543} {"train_loss": -11.571234703063965, "global_step": 259363, "epoch": 1543} {"train_loss": -11.755684852600098, "global_step": 259364, "epoch": 1543} {"train_loss": -11.191513061523438, "global_step": 259365, "epoch": 1543} {"train_loss": -12.110616683959961, "global_step": 259366, "epoch": 1543} {"train_loss": -11.327252388000488, "global_step": 259367, "epoch": 1543} {"train_loss": -11.683942794799805, "global_step": 259368, "epoch": 1543} {"train_loss": -11.075468063354492, "global_step": 259369, "epoch": 1543} {"train_loss": -11.880805969238281, "global_step": 259370, "epoch": 1543} {"train_loss": -11.32954216003418, "global_step": 259371, "epoch": 1543} {"train_loss": -11.574169158935547, "global_step": 259372, "epoch": 1543} {"train_loss": -11.719536781311035, "global_step": 259373, "epoch": 1543} {"train_loss": -11.222465515136719, "global_step": 259374, "epoch": 1543} {"train_loss": -11.676027297973633, "global_step": 259375, "epoch": 1543} {"train_loss": -11.689842224121094, "global_step": 259376, "epoch": 1543} {"train_loss": -12.08364486694336, "global_step": 259377, "epoch": 1543} {"train_loss": -11.835004806518555, "global_step": 259378, "epoch": 1543} {"train_loss": -11.897584915161133, "global_step": 259379, "epoch": 1543} {"train_loss": -11.750020027160645, "global_step": 259380, "epoch": 1543} {"train_loss": -11.33108139038086, "global_step": 259381, "epoch": 1543} {"train_loss": -11.399120330810547, "global_step": 259382, "epoch": 1543} {"train_loss": -12.058076858520508, "global_step": 259383, "epoch": 1543} {"train_loss": -11.4782075881958, "global_step": 259384, "epoch": 1543} {"train_loss": -11.728019714355469, "global_step": 259385, "epoch": 1543} {"train_loss": -11.34636116027832, "global_step": 259386, "epoch": 1543} {"train_loss": -12.021748542785645, "global_step": 259387, "epoch": 1543} {"train_loss": -11.755782127380371, "global_step": 259388, "epoch": 1543} {"train_loss": -11.826040267944336, "global_step": 259389, "epoch": 1543} {"train_loss": -11.75926399230957, "global_step": 259390, "epoch": 1543} {"train_loss": -11.550002591950554, "global_step": 259391, "epoch": 1543, "val_loss": 267902.96875} {"train_loss": -11.867815017700195, "global_step": 259392, "epoch": 1544} {"train_loss": -12.012469291687012, "global_step": 259393, "epoch": 1544} {"train_loss": -11.856071472167969, "global_step": 259394, "epoch": 1544} {"train_loss": -11.852144241333008, "global_step": 259395, "epoch": 1544} {"train_loss": -12.109701156616211, "global_step": 259396, "epoch": 1544} {"train_loss": -11.846612930297852, "global_step": 259397, "epoch": 1544} {"train_loss": -11.860136032104492, "global_step": 259398, "epoch": 1544} {"train_loss": -12.14760971069336, "global_step": 259399, "epoch": 1544} {"train_loss": -11.76266860961914, "global_step": 259400, "epoch": 1544} {"train_loss": -11.719449043273926, "global_step": 259401, "epoch": 1544} {"train_loss": -12.148463249206543, "global_step": 259402, "epoch": 1544} {"train_loss": -11.774044036865234, "global_step": 259403, "epoch": 1544} {"train_loss": -11.775644302368164, "global_step": 259404, "epoch": 1544} {"train_loss": -11.978836059570312, "global_step": 259405, "epoch": 1544} {"train_loss": -11.382673263549805, "global_step": 259406, "epoch": 1544} {"train_loss": -10.592514038085938, "global_step": 259407, "epoch": 1544} {"train_loss": -11.899140357971191, "global_step": 259408, "epoch": 1544} {"train_loss": -11.710538864135742, "global_step": 259409, "epoch": 1544} {"train_loss": -11.216859817504883, "global_step": 259410, "epoch": 1544} {"train_loss": -11.838836669921875, "global_step": 259411, "epoch": 1544} {"train_loss": -11.857288360595703, "global_step": 259412, "epoch": 1544} {"train_loss": -12.173503875732422, "global_step": 259413, "epoch": 1544} {"train_loss": -11.794767379760742, "global_step": 259414, "epoch": 1544} {"train_loss": -12.118370056152344, "global_step": 259415, "epoch": 1544} {"train_loss": -11.871709823608398, "global_step": 259416, "epoch": 1544} {"train_loss": -11.52861499786377, "global_step": 259417, "epoch": 1544} {"train_loss": -11.466894149780273, "global_step": 259418, "epoch": 1544} {"train_loss": -11.967288970947266, "global_step": 259419, "epoch": 1544} {"train_loss": -11.280451774597168, "global_step": 259420, "epoch": 1544} {"train_loss": -11.23118782043457, "global_step": 259421, "epoch": 1544} {"train_loss": -11.7335844039917, "global_step": 259422, "epoch": 1544} {"train_loss": -12.013755798339844, "global_step": 259423, "epoch": 1544} {"train_loss": -11.592620849609375, "global_step": 259424, "epoch": 1544} {"train_loss": -11.95742416381836, "global_step": 259425, "epoch": 1544} {"train_loss": -11.780176162719727, "global_step": 259426, "epoch": 1544} {"train_loss": -12.030545234680176, "global_step": 259427, "epoch": 1544} {"train_loss": -11.67987060546875, "global_step": 259428, "epoch": 1544} {"train_loss": -11.950297355651855, "global_step": 259429, "epoch": 1544} {"train_loss": -11.974143028259277, "global_step": 259430, "epoch": 1544} {"train_loss": -12.019848823547363, "global_step": 259431, "epoch": 1544} {"train_loss": -11.759794235229492, "global_step": 259432, "epoch": 1544} {"train_loss": -12.30920124053955, "global_step": 259433, "epoch": 1544} {"train_loss": -11.621405601501465, "global_step": 259434, "epoch": 1544} {"train_loss": -11.56994342803955, "global_step": 259435, "epoch": 1544} {"train_loss": -12.184850692749023, "global_step": 259436, "epoch": 1544} {"train_loss": -11.805779457092285, "global_step": 259437, "epoch": 1544} {"train_loss": -10.842058181762695, "global_step": 259438, "epoch": 1544} {"train_loss": -11.791057586669922, "global_step": 259439, "epoch": 1544} {"train_loss": -11.694723129272461, "global_step": 259440, "epoch": 1544} {"train_loss": -11.494755744934082, "global_step": 259441, "epoch": 1544} {"train_loss": -11.813955307006836, "global_step": 259442, "epoch": 1544} {"train_loss": -11.893106460571289, "global_step": 259443, "epoch": 1544} {"train_loss": -11.824737548828125, "global_step": 259444, "epoch": 1544} {"train_loss": -11.67537784576416, "global_step": 259445, "epoch": 1544} {"train_loss": -11.552423477172852, "global_step": 259446, "epoch": 1544} {"train_loss": -11.91396427154541, "global_step": 259447, "epoch": 1544} {"train_loss": -11.734155654907227, "global_step": 259448, "epoch": 1544} {"train_loss": -12.025375366210938, "global_step": 259449, "epoch": 1544} {"train_loss": -11.065422058105469, "global_step": 259450, "epoch": 1544} {"train_loss": -12.038684844970703, "global_step": 259451, "epoch": 1544} {"train_loss": -11.965160369873047, "global_step": 259452, "epoch": 1544} {"train_loss": -11.865169525146484, "global_step": 259453, "epoch": 1544} {"train_loss": -12.242105484008789, "global_step": 259454, "epoch": 1544} {"train_loss": -11.908992767333984, "global_step": 259455, "epoch": 1544} {"train_loss": -11.904953002929688, "global_step": 259456, "epoch": 1544} {"train_loss": -12.107603073120117, "global_step": 259457, "epoch": 1544} {"train_loss": -11.833877563476562, "global_step": 259458, "epoch": 1544} {"train_loss": -12.124948501586914, "global_step": 259459, "epoch": 1544} {"train_loss": -11.897512435913086, "global_step": 259460, "epoch": 1544} {"train_loss": -11.928281784057617, "global_step": 259461, "epoch": 1544} {"train_loss": -12.054849624633789, "global_step": 259462, "epoch": 1544} {"train_loss": -11.973971366882324, "global_step": 259463, "epoch": 1544} {"train_loss": -11.938589096069336, "global_step": 259464, "epoch": 1544} {"train_loss": -11.948266983032227, "global_step": 259465, "epoch": 1544} {"train_loss": -11.912158966064453, "global_step": 259466, "epoch": 1544} {"train_loss": -12.210784912109375, "global_step": 259467, "epoch": 1544} {"train_loss": -11.988875389099121, "global_step": 259468, "epoch": 1544} {"train_loss": -12.103021621704102, "global_step": 259469, "epoch": 1544} {"train_loss": -12.082244873046875, "global_step": 259470, "epoch": 1544} {"train_loss": -12.133729934692383, "global_step": 259471, "epoch": 1544} {"train_loss": -12.120988845825195, "global_step": 259472, "epoch": 1544} {"train_loss": -12.034130096435547, "global_step": 259473, "epoch": 1544} {"train_loss": -11.754034996032715, "global_step": 259474, "epoch": 1544} {"train_loss": -12.057853698730469, "global_step": 259475, "epoch": 1544} {"train_loss": -11.861429214477539, "global_step": 259476, "epoch": 1544} {"train_loss": -11.869659423828125, "global_step": 259477, "epoch": 1544} {"train_loss": -11.707714080810547, "global_step": 259478, "epoch": 1544} {"train_loss": -12.060405731201172, "global_step": 259479, "epoch": 1544} {"train_loss": -11.925108909606934, "global_step": 259480, "epoch": 1544} {"train_loss": -11.094207763671875, "global_step": 259481, "epoch": 1544} {"train_loss": -9.922760009765625, "global_step": 259482, "epoch": 1544} {"train_loss": -12.117108345031738, "global_step": 259483, "epoch": 1544} {"train_loss": -10.14426040649414, "global_step": 259484, "epoch": 1544} {"train_loss": -10.570210456848145, "global_step": 259485, "epoch": 1544} {"train_loss": -10.967296600341797, "global_step": 259486, "epoch": 1544} {"train_loss": -11.372549057006836, "global_step": 259487, "epoch": 1544} {"train_loss": -10.098247528076172, "global_step": 259488, "epoch": 1544} {"train_loss": -10.77881145477295, "global_step": 259489, "epoch": 1544} {"train_loss": -8.606346130371094, "global_step": 259490, "epoch": 1544} {"train_loss": -7.722124099731445, "global_step": 259491, "epoch": 1544} {"train_loss": -7.557287216186523, "global_step": 259492, "epoch": 1544} {"train_loss": -8.54764175415039, "global_step": 259493, "epoch": 1544} {"train_loss": -9.607542037963867, "global_step": 259494, "epoch": 1544} {"train_loss": -9.625618934631348, "global_step": 259495, "epoch": 1544} {"train_loss": -8.773626327514648, "global_step": 259496, "epoch": 1544} {"train_loss": -9.796042442321777, "global_step": 259497, "epoch": 1544} {"train_loss": -9.5418062210083, "global_step": 259498, "epoch": 1544} {"train_loss": -9.774495124816895, "global_step": 259499, "epoch": 1544} {"train_loss": -10.300745010375977, "global_step": 259500, "epoch": 1544} {"train_loss": -10.102457046508789, "global_step": 259501, "epoch": 1544} {"train_loss": -10.992963790893555, "global_step": 259502, "epoch": 1544} {"train_loss": -10.152503967285156, "global_step": 259503, "epoch": 1544} {"train_loss": -10.341064453125, "global_step": 259504, "epoch": 1544} {"train_loss": -9.754372596740723, "global_step": 259505, "epoch": 1544} {"train_loss": -10.482460975646973, "global_step": 259506, "epoch": 1544} {"train_loss": -10.935301780700684, "global_step": 259507, "epoch": 1544} {"train_loss": -11.176790237426758, "global_step": 259508, "epoch": 1544} {"train_loss": -10.573116302490234, "global_step": 259509, "epoch": 1544} {"train_loss": -11.172830581665039, "global_step": 259510, "epoch": 1544} {"train_loss": -10.791372299194336, "global_step": 259511, "epoch": 1544} {"train_loss": -11.117439270019531, "global_step": 259512, "epoch": 1544} {"train_loss": -11.356429100036621, "global_step": 259513, "epoch": 1544} {"train_loss": -11.252957344055176, "global_step": 259514, "epoch": 1544} {"train_loss": -11.563016891479492, "global_step": 259515, "epoch": 1544} {"train_loss": -11.442331314086914, "global_step": 259516, "epoch": 1544} {"train_loss": -11.631443977355957, "global_step": 259517, "epoch": 1544} {"train_loss": -11.051910400390625, "global_step": 259518, "epoch": 1544} {"train_loss": -11.792348861694336, "global_step": 259519, "epoch": 1544} {"train_loss": -11.692041397094727, "global_step": 259520, "epoch": 1544} {"train_loss": -11.712553024291992, "global_step": 259521, "epoch": 1544} {"train_loss": -11.48109245300293, "global_step": 259522, "epoch": 1544} {"train_loss": -11.945695877075195, "global_step": 259523, "epoch": 1544} {"train_loss": -11.635112762451172, "global_step": 259524, "epoch": 1544} {"train_loss": -11.792169570922852, "global_step": 259525, "epoch": 1544} {"train_loss": -11.711949348449707, "global_step": 259526, "epoch": 1544} {"train_loss": -11.82374095916748, "global_step": 259527, "epoch": 1544} {"train_loss": -11.7238130569458, "global_step": 259528, "epoch": 1544} {"train_loss": -11.939393997192383, "global_step": 259529, "epoch": 1544} {"train_loss": -11.768836975097656, "global_step": 259530, "epoch": 1544} {"train_loss": -11.972006797790527, "global_step": 259531, "epoch": 1544} {"train_loss": -11.777475357055664, "global_step": 259532, "epoch": 1544} {"train_loss": -11.950393676757812, "global_step": 259533, "epoch": 1544} {"train_loss": -11.63900089263916, "global_step": 259534, "epoch": 1544} {"train_loss": -11.972916603088379, "global_step": 259535, "epoch": 1544} {"train_loss": -11.737653732299805, "global_step": 259536, "epoch": 1544} {"train_loss": -11.919832229614258, "global_step": 259537, "epoch": 1544} {"train_loss": -11.999805450439453, "global_step": 259538, "epoch": 1544} {"train_loss": -12.051078796386719, "global_step": 259539, "epoch": 1544} {"train_loss": -11.956777572631836, "global_step": 259540, "epoch": 1544} {"train_loss": -12.091666221618652, "global_step": 259541, "epoch": 1544} {"train_loss": -12.213096618652344, "global_step": 259542, "epoch": 1544} {"train_loss": -12.089595794677734, "global_step": 259543, "epoch": 1544} {"train_loss": -11.913581848144531, "global_step": 259544, "epoch": 1544} {"train_loss": -12.102499961853027, "global_step": 259545, "epoch": 1544} {"train_loss": -12.120454788208008, "global_step": 259546, "epoch": 1544} {"train_loss": -12.111434936523438, "global_step": 259547, "epoch": 1544} {"train_loss": -11.910404205322266, "global_step": 259548, "epoch": 1544} {"train_loss": -12.12601375579834, "global_step": 259549, "epoch": 1544} {"train_loss": -12.067886352539062, "global_step": 259550, "epoch": 1544} {"train_loss": -12.210598945617676, "global_step": 259551, "epoch": 1544} {"train_loss": -12.252934455871582, "global_step": 259552, "epoch": 1544} {"train_loss": -12.07276725769043, "global_step": 259553, "epoch": 1544} {"train_loss": -11.97879409790039, "global_step": 259554, "epoch": 1544} {"train_loss": -12.06338882446289, "global_step": 259555, "epoch": 1544} {"train_loss": -12.027606964111328, "global_step": 259556, "epoch": 1544} {"train_loss": -12.223251342773438, "global_step": 259557, "epoch": 1544} {"train_loss": -12.108260154724121, "global_step": 259558, "epoch": 1544} {"train_loss": -11.524899908474513, "global_step": 259559, "epoch": 1544, "val_loss": 267895.75} {"train_loss": -12.085065841674805, "global_step": 259560, "epoch": 1545} {"train_loss": -12.064640045166016, "global_step": 259561, "epoch": 1545} {"train_loss": -12.002796173095703, "global_step": 259562, "epoch": 1545} {"train_loss": -12.135910034179688, "global_step": 259563, "epoch": 1545} {"train_loss": -12.142962455749512, "global_step": 259564, "epoch": 1545} {"train_loss": -12.294029235839844, "global_step": 259565, "epoch": 1545} {"train_loss": -12.101418495178223, "global_step": 259566, "epoch": 1545} {"train_loss": -12.107460021972656, "global_step": 259567, "epoch": 1545} {"train_loss": -12.087156295776367, "global_step": 259568, "epoch": 1545} {"train_loss": -12.272839546203613, "global_step": 259569, "epoch": 1545} {"train_loss": -12.15774154663086, "global_step": 259570, "epoch": 1545} {"train_loss": -12.312675476074219, "global_step": 259571, "epoch": 1545} {"train_loss": -12.263486862182617, "global_step": 259572, "epoch": 1545} {"train_loss": -12.153814315795898, "global_step": 259573, "epoch": 1545} {"train_loss": -12.226110458374023, "global_step": 259574, "epoch": 1545} {"train_loss": -12.328815460205078, "global_step": 259575, "epoch": 1545} {"train_loss": -12.054250717163086, "global_step": 259576, "epoch": 1545} {"train_loss": -12.42020320892334, "global_step": 259577, "epoch": 1545} {"train_loss": -12.288298606872559, "global_step": 259578, "epoch": 1545} {"train_loss": -11.795135498046875, "global_step": 259579, "epoch": 1545} {"train_loss": -12.199224472045898, "global_step": 259580, "epoch": 1545} {"train_loss": -12.040546417236328, "global_step": 259581, "epoch": 1545} {"train_loss": -12.154657363891602, "global_step": 259582, "epoch": 1545} {"train_loss": -11.570530891418457, "global_step": 259583, "epoch": 1545} {"train_loss": -11.395326614379883, "global_step": 259584, "epoch": 1545} {"train_loss": -11.871843338012695, "global_step": 259585, "epoch": 1545} {"train_loss": -11.367298126220703, "global_step": 259586, "epoch": 1545} {"train_loss": -11.61783218383789, "global_step": 259587, "epoch": 1545} {"train_loss": -10.788811683654785, "global_step": 259588, "epoch": 1545} {"train_loss": -11.646303176879883, "global_step": 259589, "epoch": 1545} {"train_loss": -11.389689445495605, "global_step": 259590, "epoch": 1545} {"train_loss": -11.620828628540039, "global_step": 259591, "epoch": 1545} {"train_loss": -11.016353607177734, "global_step": 259592, "epoch": 1545} {"train_loss": -10.40629768371582, "global_step": 259593, "epoch": 1545} {"train_loss": -10.156671524047852, "global_step": 259594, "epoch": 1545} {"train_loss": -11.56918716430664, "global_step": 259595, "epoch": 1545} {"train_loss": -11.616020202636719, "global_step": 259596, "epoch": 1545} {"train_loss": -11.631599426269531, "global_step": 259597, "epoch": 1545} {"train_loss": -10.87208366394043, "global_step": 259598, "epoch": 1545} {"train_loss": -11.423736572265625, "global_step": 259599, "epoch": 1545} {"train_loss": -11.546319961547852, "global_step": 259600, "epoch": 1545} {"train_loss": -11.329702377319336, "global_step": 259601, "epoch": 1545} {"train_loss": -11.281286239624023, "global_step": 259602, "epoch": 1545} {"train_loss": -11.844925880432129, "global_step": 259603, "epoch": 1545} {"train_loss": -11.037714004516602, "global_step": 259604, "epoch": 1545} {"train_loss": -11.384716987609863, "global_step": 259605, "epoch": 1545} {"train_loss": -11.752265930175781, "global_step": 259606, "epoch": 1545} {"train_loss": -11.431906700134277, "global_step": 259607, "epoch": 1545} {"train_loss": -11.70946216583252, "global_step": 259608, "epoch": 1545} {"train_loss": -11.372930526733398, "global_step": 259609, "epoch": 1545} {"train_loss": -10.915494918823242, "global_step": 259610, "epoch": 1545} {"train_loss": -10.521740913391113, "global_step": 259611, "epoch": 1545} {"train_loss": -12.004097938537598, "global_step": 259612, "epoch": 1545} {"train_loss": -11.195910453796387, "global_step": 259613, "epoch": 1545} {"train_loss": -11.38602066040039, "global_step": 259614, "epoch": 1545} {"train_loss": -11.059402465820312, "global_step": 259615, "epoch": 1545} {"train_loss": -10.986111640930176, "global_step": 259616, "epoch": 1545} {"train_loss": -11.186166763305664, "global_step": 259617, "epoch": 1545} {"train_loss": -10.785930633544922, "global_step": 259618, "epoch": 1545} {"train_loss": -11.419778823852539, "global_step": 259619, "epoch": 1545} {"train_loss": -10.457114219665527, "global_step": 259620, "epoch": 1545} {"train_loss": -11.424660682678223, "global_step": 259621, "epoch": 1545} {"train_loss": -10.68248176574707, "global_step": 259622, "epoch": 1545} {"train_loss": -11.27316951751709, "global_step": 259623, "epoch": 1545} {"train_loss": -10.390359878540039, "global_step": 259624, "epoch": 1545} {"train_loss": -10.87707233428955, "global_step": 259625, "epoch": 1545} {"train_loss": -11.142877578735352, "global_step": 259626, "epoch": 1545} {"train_loss": -10.157649993896484, "global_step": 259627, "epoch": 1545} {"train_loss": -11.623030662536621, "global_step": 259628, "epoch": 1545} {"train_loss": -11.283027648925781, "global_step": 259629, "epoch": 1545} {"train_loss": -11.411304473876953, "global_step": 259630, "epoch": 1545} {"train_loss": -11.373230934143066, "global_step": 259631, "epoch": 1545} {"train_loss": -11.307609558105469, "global_step": 259632, "epoch": 1545} {"train_loss": -11.293438911437988, "global_step": 259633, "epoch": 1545} {"train_loss": -10.145242691040039, "global_step": 259634, "epoch": 1545} {"train_loss": -11.484726905822754, "global_step": 259635, "epoch": 1545} {"train_loss": -10.168132781982422, "global_step": 259636, "epoch": 1545} {"train_loss": -11.313151359558105, "global_step": 259637, "epoch": 1545} {"train_loss": -10.509271621704102, "global_step": 259638, "epoch": 1545} {"train_loss": -11.168035507202148, "global_step": 259639, "epoch": 1545} {"train_loss": -10.415594100952148, "global_step": 259640, "epoch": 1545} {"train_loss": -11.126073837280273, "global_step": 259641, "epoch": 1545} {"train_loss": -11.248023986816406, "global_step": 259642, "epoch": 1545} {"train_loss": -10.73442268371582, "global_step": 259643, "epoch": 1545} {"train_loss": -11.547369956970215, "global_step": 259644, "epoch": 1545} {"train_loss": -10.791114807128906, "global_step": 259645, "epoch": 1545} {"train_loss": -11.806808471679688, "global_step": 259646, "epoch": 1545} {"train_loss": -11.362617492675781, "global_step": 259647, "epoch": 1545} {"train_loss": -11.592347145080566, "global_step": 259648, "epoch": 1545} {"train_loss": -11.280899047851562, "global_step": 259649, "epoch": 1545} {"train_loss": -11.602202415466309, "global_step": 259650, "epoch": 1545} {"train_loss": -11.421346664428711, "global_step": 259651, "epoch": 1545} {"train_loss": -11.6161470413208, "global_step": 259652, "epoch": 1545} {"train_loss": -11.416792869567871, "global_step": 259653, "epoch": 1545} {"train_loss": -11.671607971191406, "global_step": 259654, "epoch": 1545} {"train_loss": -11.519158363342285, "global_step": 259655, "epoch": 1545} {"train_loss": -11.645524978637695, "global_step": 259656, "epoch": 1545} {"train_loss": -11.588948249816895, "global_step": 259657, "epoch": 1545} {"train_loss": -11.488361358642578, "global_step": 259658, "epoch": 1545} {"train_loss": -11.739612579345703, "global_step": 259659, "epoch": 1545} {"train_loss": -11.654630661010742, "global_step": 259660, "epoch": 1545} {"train_loss": -11.894774436950684, "global_step": 259661, "epoch": 1545} {"train_loss": -11.4805326461792, "global_step": 259662, "epoch": 1545} {"train_loss": -11.933093070983887, "global_step": 259663, "epoch": 1545} {"train_loss": -11.492226600646973, "global_step": 259664, "epoch": 1545} {"train_loss": -12.033344268798828, "global_step": 259665, "epoch": 1545} {"train_loss": -11.749671936035156, "global_step": 259666, "epoch": 1545} {"train_loss": -11.883710861206055, "global_step": 259667, "epoch": 1545} {"train_loss": -11.52851676940918, "global_step": 259668, "epoch": 1545} {"train_loss": -11.858114242553711, "global_step": 259669, "epoch": 1545} {"train_loss": -11.566031455993652, "global_step": 259670, "epoch": 1545} {"train_loss": -11.573067665100098, "global_step": 259671, "epoch": 1545} {"train_loss": -11.642492294311523, "global_step": 259672, "epoch": 1545} {"train_loss": -11.490039825439453, "global_step": 259673, "epoch": 1545} {"train_loss": -11.944246292114258, "global_step": 259674, "epoch": 1545} {"train_loss": -11.713944435119629, "global_step": 259675, "epoch": 1545} {"train_loss": -11.818500518798828, "global_step": 259676, "epoch": 1545} {"train_loss": -11.836641311645508, "global_step": 259677, "epoch": 1545} {"train_loss": -12.008729934692383, "global_step": 259678, "epoch": 1545} {"train_loss": -11.899555206298828, "global_step": 259679, "epoch": 1545} {"train_loss": -11.893645286560059, "global_step": 259680, "epoch": 1545} {"train_loss": -11.924581527709961, "global_step": 259681, "epoch": 1545} {"train_loss": -11.973976135253906, "global_step": 259682, "epoch": 1545} {"train_loss": -11.879423141479492, "global_step": 259683, "epoch": 1545} {"train_loss": -11.700248718261719, "global_step": 259684, "epoch": 1545} {"train_loss": -12.0253324508667, "global_step": 259685, "epoch": 1545} {"train_loss": -11.913920402526855, "global_step": 259686, "epoch": 1545} {"train_loss": -12.23707389831543, "global_step": 259687, "epoch": 1545} {"train_loss": -12.049318313598633, "global_step": 259688, "epoch": 1545} {"train_loss": -12.029767990112305, "global_step": 259689, "epoch": 1545} {"train_loss": -12.063355445861816, "global_step": 259690, "epoch": 1545} {"train_loss": -12.00719165802002, "global_step": 259691, "epoch": 1545} {"train_loss": -12.022544860839844, "global_step": 259692, "epoch": 1545} {"train_loss": -12.209895133972168, "global_step": 259693, "epoch": 1545} {"train_loss": -12.192756652832031, "global_step": 259694, "epoch": 1545} {"train_loss": -11.995219230651855, "global_step": 259695, "epoch": 1545} {"train_loss": -12.07868480682373, "global_step": 259696, "epoch": 1545} {"train_loss": -12.207145690917969, "global_step": 259697, "epoch": 1545} {"train_loss": -12.259904861450195, "global_step": 259698, "epoch": 1545} {"train_loss": -12.289676666259766, "global_step": 259699, "epoch": 1545} {"train_loss": -12.282453536987305, "global_step": 259700, "epoch": 1545} {"train_loss": -12.112661361694336, "global_step": 259701, "epoch": 1545} {"train_loss": -12.226902961730957, "global_step": 259702, "epoch": 1545} {"train_loss": -11.99046802520752, "global_step": 259703, "epoch": 1545} {"train_loss": -11.99886703491211, "global_step": 259704, "epoch": 1545} {"train_loss": -12.258033752441406, "global_step": 259705, "epoch": 1545} {"train_loss": -12.138392448425293, "global_step": 259706, "epoch": 1545} {"train_loss": -11.698440551757812, "global_step": 259707, "epoch": 1545} {"train_loss": -12.101858139038086, "global_step": 259708, "epoch": 1545} {"train_loss": -12.04438591003418, "global_step": 259709, "epoch": 1545} {"train_loss": -12.194342613220215, "global_step": 259710, "epoch": 1545} {"train_loss": -12.051509857177734, "global_step": 259711, "epoch": 1545} {"train_loss": -11.83985710144043, "global_step": 259712, "epoch": 1545} {"train_loss": -12.13818359375, "global_step": 259713, "epoch": 1545} {"train_loss": -11.95985221862793, "global_step": 259714, "epoch": 1545} {"train_loss": -12.067020416259766, "global_step": 259715, "epoch": 1545} {"train_loss": -12.083593368530273, "global_step": 259716, "epoch": 1545} {"train_loss": -12.217292785644531, "global_step": 259717, "epoch": 1545} {"train_loss": -11.779792785644531, "global_step": 259718, "epoch": 1545} {"train_loss": -12.20195198059082, "global_step": 259719, "epoch": 1545} {"train_loss": -12.103469848632812, "global_step": 259720, "epoch": 1545} {"train_loss": -11.923105239868164, "global_step": 259721, "epoch": 1545} {"train_loss": -12.228763580322266, "global_step": 259722, "epoch": 1545} {"train_loss": -12.068792343139648, "global_step": 259723, "epoch": 1545} {"train_loss": -12.06283187866211, "global_step": 259724, "epoch": 1545} {"train_loss": -12.2805757522583, "global_step": 259725, "epoch": 1545} {"train_loss": -11.856170654296875, "global_step": 259726, "epoch": 1545} {"train_loss": -11.661559383074442, "global_step": 259727, "epoch": 1545, "val_loss": 272489.53125, "train_action_mse_error": 1.6980878114700317} {"train_loss": -12.158567428588867, "global_step": 259728, "epoch": 1546} {"train_loss": -12.070281028747559, "global_step": 259729, "epoch": 1546} {"train_loss": -11.617574691772461, "global_step": 259730, "epoch": 1546} {"train_loss": -11.558978080749512, "global_step": 259731, "epoch": 1546} {"train_loss": -11.820379257202148, "global_step": 259732, "epoch": 1546} {"train_loss": -11.636451721191406, "global_step": 259733, "epoch": 1546} {"train_loss": -11.28275203704834, "global_step": 259734, "epoch": 1546} {"train_loss": -11.348849296569824, "global_step": 259735, "epoch": 1546} {"train_loss": -11.672876358032227, "global_step": 259736, "epoch": 1546} {"train_loss": -10.72911262512207, "global_step": 259737, "epoch": 1546} {"train_loss": -10.483064651489258, "global_step": 259738, "epoch": 1546} {"train_loss": -11.331537246704102, "global_step": 259739, "epoch": 1546} {"train_loss": -10.115487098693848, "global_step": 259740, "epoch": 1546} {"train_loss": -10.37641429901123, "global_step": 259741, "epoch": 1546} {"train_loss": -10.777770042419434, "global_step": 259742, "epoch": 1546} {"train_loss": -10.39949893951416, "global_step": 259743, "epoch": 1546} {"train_loss": -10.39902114868164, "global_step": 259744, "epoch": 1546} {"train_loss": -10.343817710876465, "global_step": 259745, "epoch": 1546} {"train_loss": -11.427252769470215, "global_step": 259746, "epoch": 1546} {"train_loss": -11.149053573608398, "global_step": 259747, "epoch": 1546} {"train_loss": -11.368844032287598, "global_step": 259748, "epoch": 1546} {"train_loss": -11.402200698852539, "global_step": 259749, "epoch": 1546} {"train_loss": -11.672571182250977, "global_step": 259750, "epoch": 1546} {"train_loss": -11.529056549072266, "global_step": 259751, "epoch": 1546} {"train_loss": -11.639978408813477, "global_step": 259752, "epoch": 1546} {"train_loss": -11.260100364685059, "global_step": 259753, "epoch": 1546} {"train_loss": -11.193414688110352, "global_step": 259754, "epoch": 1546} {"train_loss": -11.543901443481445, "global_step": 259755, "epoch": 1546} {"train_loss": -11.567068099975586, "global_step": 259756, "epoch": 1546} {"train_loss": -11.046520233154297, "global_step": 259757, "epoch": 1546} {"train_loss": -11.417130470275879, "global_step": 259758, "epoch": 1546} {"train_loss": -10.883240699768066, "global_step": 259759, "epoch": 1546} {"train_loss": -11.282173156738281, "global_step": 259760, "epoch": 1546} {"train_loss": -11.455650329589844, "global_step": 259761, "epoch": 1546} {"train_loss": -11.210552215576172, "global_step": 259762, "epoch": 1546} {"train_loss": -11.690813064575195, "global_step": 259763, "epoch": 1546} {"train_loss": -11.391254425048828, "global_step": 259764, "epoch": 1546} {"train_loss": -11.516178131103516, "global_step": 259765, "epoch": 1546} {"train_loss": -11.620495796203613, "global_step": 259766, "epoch": 1546} {"train_loss": -11.399530410766602, "global_step": 259767, "epoch": 1546} {"train_loss": -11.63180923461914, "global_step": 259768, "epoch": 1546} {"train_loss": -11.876913070678711, "global_step": 259769, "epoch": 1546} {"train_loss": -11.67434310913086, "global_step": 259770, "epoch": 1546} {"train_loss": -11.828507423400879, "global_step": 259771, "epoch": 1546} {"train_loss": -11.852668762207031, "global_step": 259772, "epoch": 1546} {"train_loss": -11.520421981811523, "global_step": 259773, "epoch": 1546} {"train_loss": -11.942558288574219, "global_step": 259774, "epoch": 1546} {"train_loss": -11.823708534240723, "global_step": 259775, "epoch": 1546} {"train_loss": -11.92429256439209, "global_step": 259776, "epoch": 1546} {"train_loss": -11.850006103515625, "global_step": 259777, "epoch": 1546} {"train_loss": -12.138927459716797, "global_step": 259778, "epoch": 1546} {"train_loss": -11.962373733520508, "global_step": 259779, "epoch": 1546} {"train_loss": -12.013435363769531, "global_step": 259780, "epoch": 1546} {"train_loss": -12.151567459106445, "global_step": 259781, "epoch": 1546} {"train_loss": -12.202939987182617, "global_step": 259782, "epoch": 1546} {"train_loss": -12.093742370605469, "global_step": 259783, "epoch": 1546} {"train_loss": -12.036595344543457, "global_step": 259784, "epoch": 1546} {"train_loss": -12.018025398254395, "global_step": 259785, "epoch": 1546} {"train_loss": -11.956628799438477, "global_step": 259786, "epoch": 1546} {"train_loss": -12.154370307922363, "global_step": 259787, "epoch": 1546} {"train_loss": -11.772359848022461, "global_step": 259788, "epoch": 1546} {"train_loss": -12.023067474365234, "global_step": 259789, "epoch": 1546} {"train_loss": -12.135629653930664, "global_step": 259790, "epoch": 1546} {"train_loss": -11.987007141113281, "global_step": 259791, "epoch": 1546} {"train_loss": -12.041618347167969, "global_step": 259792, "epoch": 1546} {"train_loss": -12.013372421264648, "global_step": 259793, "epoch": 1546} {"train_loss": -11.666464805603027, "global_step": 259794, "epoch": 1546} {"train_loss": -11.657106399536133, "global_step": 259795, "epoch": 1546} {"train_loss": -12.29483699798584, "global_step": 259796, "epoch": 1546} {"train_loss": -11.601133346557617, "global_step": 259797, "epoch": 1546} {"train_loss": -12.124786376953125, "global_step": 259798, "epoch": 1546} {"train_loss": -11.687170028686523, "global_step": 259799, "epoch": 1546} {"train_loss": -11.73265266418457, "global_step": 259800, "epoch": 1546} {"train_loss": -12.104377746582031, "global_step": 259801, "epoch": 1546} {"train_loss": -11.699966430664062, "global_step": 259802, "epoch": 1546} {"train_loss": -11.648496627807617, "global_step": 259803, "epoch": 1546} {"train_loss": -11.795618057250977, "global_step": 259804, "epoch": 1546} {"train_loss": -11.805124282836914, "global_step": 259805, "epoch": 1546} {"train_loss": -11.027567863464355, "global_step": 259806, "epoch": 1546} {"train_loss": -10.780867576599121, "global_step": 259807, "epoch": 1546} {"train_loss": -11.659377098083496, "global_step": 259808, "epoch": 1546} {"train_loss": -11.051689147949219, "global_step": 259809, "epoch": 1546} {"train_loss": -11.560023307800293, "global_step": 259810, "epoch": 1546} {"train_loss": -11.010435104370117, "global_step": 259811, "epoch": 1546} {"train_loss": -11.890661239624023, "global_step": 259812, "epoch": 1546} {"train_loss": -11.753253936767578, "global_step": 259813, "epoch": 1546} {"train_loss": -11.842170715332031, "global_step": 259814, "epoch": 1546} {"train_loss": -11.66492748260498, "global_step": 259815, "epoch": 1546} {"train_loss": -11.8837890625, "global_step": 259816, "epoch": 1546} {"train_loss": -11.992704391479492, "global_step": 259817, "epoch": 1546} {"train_loss": -11.894015312194824, "global_step": 259818, "epoch": 1546} {"train_loss": -11.629156112670898, "global_step": 259819, "epoch": 1546} {"train_loss": -11.898625373840332, "global_step": 259820, "epoch": 1546} {"train_loss": -11.816320419311523, "global_step": 259821, "epoch": 1546} {"train_loss": -11.404370307922363, "global_step": 259822, "epoch": 1546} {"train_loss": -12.094499588012695, "global_step": 259823, "epoch": 1546} {"train_loss": -11.272472381591797, "global_step": 259824, "epoch": 1546} {"train_loss": -11.908773422241211, "global_step": 259825, "epoch": 1546} {"train_loss": -11.12340259552002, "global_step": 259826, "epoch": 1546} {"train_loss": -11.716039657592773, "global_step": 259827, "epoch": 1546} {"train_loss": -11.409881591796875, "global_step": 259828, "epoch": 1546} {"train_loss": -10.929048538208008, "global_step": 259829, "epoch": 1546} {"train_loss": -12.139214515686035, "global_step": 259830, "epoch": 1546} {"train_loss": -10.596610069274902, "global_step": 259831, "epoch": 1546} {"train_loss": -11.522867202758789, "global_step": 259832, "epoch": 1546} {"train_loss": -11.492271423339844, "global_step": 259833, "epoch": 1546} {"train_loss": -11.658127784729004, "global_step": 259834, "epoch": 1546} {"train_loss": -11.78770637512207, "global_step": 259835, "epoch": 1546} {"train_loss": -11.631091117858887, "global_step": 259836, "epoch": 1546} {"train_loss": -11.846039772033691, "global_step": 259837, "epoch": 1546} {"train_loss": -11.503828048706055, "global_step": 259838, "epoch": 1546} {"train_loss": -11.689006805419922, "global_step": 259839, "epoch": 1546} {"train_loss": -11.850423812866211, "global_step": 259840, "epoch": 1546} {"train_loss": -11.362419128417969, "global_step": 259841, "epoch": 1546} {"train_loss": -11.902023315429688, "global_step": 259842, "epoch": 1546} {"train_loss": -10.974011421203613, "global_step": 259843, "epoch": 1546} {"train_loss": -10.649520874023438, "global_step": 259844, "epoch": 1546} {"train_loss": -11.439704895019531, "global_step": 259845, "epoch": 1546} {"train_loss": -10.760552406311035, "global_step": 259846, "epoch": 1546} {"train_loss": -10.058427810668945, "global_step": 259847, "epoch": 1546} {"train_loss": -11.312929153442383, "global_step": 259848, "epoch": 1546} {"train_loss": -10.12643814086914, "global_step": 259849, "epoch": 1546} {"train_loss": -10.910846710205078, "global_step": 259850, "epoch": 1546} {"train_loss": -10.295644760131836, "global_step": 259851, "epoch": 1546} {"train_loss": -10.551127433776855, "global_step": 259852, "epoch": 1546} {"train_loss": -10.811175346374512, "global_step": 259853, "epoch": 1546} {"train_loss": -9.49337387084961, "global_step": 259854, "epoch": 1546} {"train_loss": -11.701876640319824, "global_step": 259855, "epoch": 1546} {"train_loss": -9.57477855682373, "global_step": 259856, "epoch": 1546} {"train_loss": -11.733198165893555, "global_step": 259857, "epoch": 1546} {"train_loss": -9.954853057861328, "global_step": 259858, "epoch": 1546} {"train_loss": -11.639398574829102, "global_step": 259859, "epoch": 1546} {"train_loss": -10.10072135925293, "global_step": 259860, "epoch": 1546} {"train_loss": -11.386348724365234, "global_step": 259861, "epoch": 1546} {"train_loss": -10.357063293457031, "global_step": 259862, "epoch": 1546} {"train_loss": -11.481165885925293, "global_step": 259863, "epoch": 1546} {"train_loss": -10.43560791015625, "global_step": 259864, "epoch": 1546} {"train_loss": -11.599565505981445, "global_step": 259865, "epoch": 1546} {"train_loss": -10.306718826293945, "global_step": 259866, "epoch": 1546} {"train_loss": -11.478456497192383, "global_step": 259867, "epoch": 1546} {"train_loss": -10.684755325317383, "global_step": 259868, "epoch": 1546} {"train_loss": -11.403314590454102, "global_step": 259869, "epoch": 1546} {"train_loss": -10.698684692382812, "global_step": 259870, "epoch": 1546} {"train_loss": -11.248645782470703, "global_step": 259871, "epoch": 1546} {"train_loss": -11.03418254852295, "global_step": 259872, "epoch": 1546} {"train_loss": -11.618263244628906, "global_step": 259873, "epoch": 1546} {"train_loss": -10.55824089050293, "global_step": 259874, "epoch": 1546} {"train_loss": -11.345361709594727, "global_step": 259875, "epoch": 1546} {"train_loss": -10.694124221801758, "global_step": 259876, "epoch": 1546} {"train_loss": -11.312045097351074, "global_step": 259877, "epoch": 1546} {"train_loss": -11.260583877563477, "global_step": 259878, "epoch": 1546} {"train_loss": -11.35889720916748, "global_step": 259879, "epoch": 1546} {"train_loss": -11.11160659790039, "global_step": 259880, "epoch": 1546} {"train_loss": -11.532541275024414, "global_step": 259881, "epoch": 1546} {"train_loss": -11.362882614135742, "global_step": 259882, "epoch": 1546} {"train_loss": -11.256635665893555, "global_step": 259883, "epoch": 1546} {"train_loss": -11.857375144958496, "global_step": 259884, "epoch": 1546} {"train_loss": -11.44206714630127, "global_step": 259885, "epoch": 1546} {"train_loss": -11.585918426513672, "global_step": 259886, "epoch": 1546} {"train_loss": -11.583539962768555, "global_step": 259887, "epoch": 1546} {"train_loss": -11.656417846679688, "global_step": 259888, "epoch": 1546} {"train_loss": -11.619314193725586, "global_step": 259889, "epoch": 1546} {"train_loss": -11.778740882873535, "global_step": 259890, "epoch": 1546} {"train_loss": -11.689474105834961, "global_step": 259891, "epoch": 1546} {"train_loss": -11.668783187866211, "global_step": 259892, "epoch": 1546} {"train_loss": -11.62356185913086, "global_step": 259893, "epoch": 1546} {"train_loss": -11.558198928833008, "global_step": 259894, "epoch": 1546} {"train_loss": -11.422656167121161, "global_step": 259895, "epoch": 1546, "val_loss": 271166.75} {"train_loss": -11.591092109680176, "global_step": 259896, "epoch": 1547} {"train_loss": -11.989286422729492, "global_step": 259897, "epoch": 1547} {"train_loss": -11.718381881713867, "global_step": 259898, "epoch": 1547} {"train_loss": -11.916658401489258, "global_step": 259899, "epoch": 1547} {"train_loss": -11.79166316986084, "global_step": 259900, "epoch": 1547} {"train_loss": -11.842320442199707, "global_step": 259901, "epoch": 1547} {"train_loss": -11.626031875610352, "global_step": 259902, "epoch": 1547} {"train_loss": -11.80081558227539, "global_step": 259903, "epoch": 1547} {"train_loss": -11.651969909667969, "global_step": 259904, "epoch": 1547} {"train_loss": -11.792893409729004, "global_step": 259905, "epoch": 1547} {"train_loss": -11.97384262084961, "global_step": 259906, "epoch": 1547} {"train_loss": -11.72273063659668, "global_step": 259907, "epoch": 1547} {"train_loss": -11.546234130859375, "global_step": 259908, "epoch": 1547} {"train_loss": -11.691024780273438, "global_step": 259909, "epoch": 1547} {"train_loss": -11.557573318481445, "global_step": 259910, "epoch": 1547} {"train_loss": -11.561741828918457, "global_step": 259911, "epoch": 1547} {"train_loss": -11.363500595092773, "global_step": 259912, "epoch": 1547} {"train_loss": -11.52180290222168, "global_step": 259913, "epoch": 1547} {"train_loss": -11.075100898742676, "global_step": 259914, "epoch": 1547} {"train_loss": -11.913865089416504, "global_step": 259915, "epoch": 1547} {"train_loss": -11.577131271362305, "global_step": 259916, "epoch": 1547} {"train_loss": -11.78776741027832, "global_step": 259917, "epoch": 1547} {"train_loss": -11.875456809997559, "global_step": 259918, "epoch": 1547} {"train_loss": -11.821481704711914, "global_step": 259919, "epoch": 1547} {"train_loss": -12.188606262207031, "global_step": 259920, "epoch": 1547} {"train_loss": -11.843868255615234, "global_step": 259921, "epoch": 1547} {"train_loss": -11.920825958251953, "global_step": 259922, "epoch": 1547} {"train_loss": -12.048535346984863, "global_step": 259923, "epoch": 1547} {"train_loss": -12.004060745239258, "global_step": 259924, "epoch": 1547} {"train_loss": -11.94982624053955, "global_step": 259925, "epoch": 1547} {"train_loss": -11.98931884765625, "global_step": 259926, "epoch": 1547} {"train_loss": -11.782516479492188, "global_step": 259927, "epoch": 1547} {"train_loss": -12.049417495727539, "global_step": 259928, "epoch": 1547} {"train_loss": -11.871561050415039, "global_step": 259929, "epoch": 1547} {"train_loss": -12.11134147644043, "global_step": 259930, "epoch": 1547} {"train_loss": -12.091873168945312, "global_step": 259931, "epoch": 1547} {"train_loss": -11.85206413269043, "global_step": 259932, "epoch": 1547} {"train_loss": -12.118257522583008, "global_step": 259933, "epoch": 1547} {"train_loss": -12.242274284362793, "global_step": 259934, "epoch": 1547} {"train_loss": -12.307230949401855, "global_step": 259935, "epoch": 1547} {"train_loss": -12.00649642944336, "global_step": 259936, "epoch": 1547} {"train_loss": -12.190673828125, "global_step": 259937, "epoch": 1547} {"train_loss": -12.208478927612305, "global_step": 259938, "epoch": 1547} {"train_loss": -12.074664115905762, "global_step": 259939, "epoch": 1547} {"train_loss": -12.171747207641602, "global_step": 259940, "epoch": 1547} {"train_loss": -12.175870895385742, "global_step": 259941, "epoch": 1547} {"train_loss": -12.110411643981934, "global_step": 259942, "epoch": 1547} {"train_loss": -12.167634963989258, "global_step": 259943, "epoch": 1547} {"train_loss": -12.246780395507812, "global_step": 259944, "epoch": 1547} {"train_loss": -12.040128707885742, "global_step": 259945, "epoch": 1547} {"train_loss": -11.990753173828125, "global_step": 259946, "epoch": 1547} {"train_loss": -12.102569580078125, "global_step": 259947, "epoch": 1547} {"train_loss": -12.029004096984863, "global_step": 259948, "epoch": 1547} {"train_loss": -12.096460342407227, "global_step": 259949, "epoch": 1547} {"train_loss": -12.062281608581543, "global_step": 259950, "epoch": 1547} {"train_loss": -12.011390686035156, "global_step": 259951, "epoch": 1547} {"train_loss": -12.22586441040039, "global_step": 259952, "epoch": 1547} {"train_loss": -11.961044311523438, "global_step": 259953, "epoch": 1547} {"train_loss": -12.064718246459961, "global_step": 259954, "epoch": 1547} {"train_loss": -12.17053508758545, "global_step": 259955, "epoch": 1547} {"train_loss": -12.243088722229004, "global_step": 259956, "epoch": 1547} {"train_loss": -12.164190292358398, "global_step": 259957, "epoch": 1547} {"train_loss": -11.731841087341309, "global_step": 259958, "epoch": 1547} {"train_loss": -12.332502365112305, "global_step": 259959, "epoch": 1547} {"train_loss": -12.234310150146484, "global_step": 259960, "epoch": 1547} {"train_loss": -12.292518615722656, "global_step": 259961, "epoch": 1547} {"train_loss": -12.052909851074219, "global_step": 259962, "epoch": 1547} {"train_loss": -12.304853439331055, "global_step": 259963, "epoch": 1547} {"train_loss": -12.049769401550293, "global_step": 259964, "epoch": 1547} {"train_loss": -12.309000015258789, "global_step": 259965, "epoch": 1547} {"train_loss": -11.872459411621094, "global_step": 259966, "epoch": 1547} {"train_loss": -12.272538185119629, "global_step": 259967, "epoch": 1547} {"train_loss": -12.008347511291504, "global_step": 259968, "epoch": 1547} {"train_loss": -12.325288772583008, "global_step": 259969, "epoch": 1547} {"train_loss": -11.895557403564453, "global_step": 259970, "epoch": 1547} {"train_loss": -12.060985565185547, "global_step": 259971, "epoch": 1547} {"train_loss": -11.996526718139648, "global_step": 259972, "epoch": 1547} {"train_loss": -12.063138961791992, "global_step": 259973, "epoch": 1547} {"train_loss": -11.559334754943848, "global_step": 259974, "epoch": 1547} {"train_loss": -11.970970153808594, "global_step": 259975, "epoch": 1547} {"train_loss": -10.645729064941406, "global_step": 259976, "epoch": 1547} {"train_loss": -10.531277656555176, "global_step": 259977, "epoch": 1547} {"train_loss": -11.851725578308105, "global_step": 259978, "epoch": 1547} {"train_loss": -9.48228645324707, "global_step": 259979, "epoch": 1547} {"train_loss": -11.126811027526855, "global_step": 259980, "epoch": 1547} {"train_loss": -6.813309192657471, "global_step": 259981, "epoch": 1547} {"train_loss": -7.996668815612793, "global_step": 259982, "epoch": 1547} {"train_loss": -6.866105556488037, "global_step": 259983, "epoch": 1547} {"train_loss": -6.881202220916748, "global_step": 259984, "epoch": 1547} {"train_loss": -7.598457336425781, "global_step": 259985, "epoch": 1547} {"train_loss": -9.828654289245605, "global_step": 259986, "epoch": 1547} {"train_loss": -9.355876922607422, "global_step": 259987, "epoch": 1547} {"train_loss": -7.406092643737793, "global_step": 259988, "epoch": 1547} {"train_loss": -7.521702289581299, "global_step": 259989, "epoch": 1547} {"train_loss": -8.352737426757812, "global_step": 259990, "epoch": 1547} {"train_loss": -9.4923095703125, "global_step": 259991, "epoch": 1547} {"train_loss": -9.060297966003418, "global_step": 259992, "epoch": 1547} {"train_loss": -8.765344619750977, "global_step": 259993, "epoch": 1547} {"train_loss": -9.462240219116211, "global_step": 259994, "epoch": 1547} {"train_loss": -10.46776294708252, "global_step": 259995, "epoch": 1547} {"train_loss": -9.852662086486816, "global_step": 259996, "epoch": 1547} {"train_loss": -10.872715950012207, "global_step": 259997, "epoch": 1547} {"train_loss": -10.455509185791016, "global_step": 259998, "epoch": 1547} {"train_loss": -8.693130493164062, "global_step": 259999, "epoch": 1547} {"train_loss": -10.489938735961914, "global_step": 260000, "epoch": 1547} {"train_loss": -9.556949615478516, "global_step": 260001, "epoch": 1547} {"train_loss": -11.007285118103027, "global_step": 260002, "epoch": 1547} {"train_loss": -10.679471969604492, "global_step": 260003, "epoch": 1547} {"train_loss": -10.783665657043457, "global_step": 260004, "epoch": 1547} {"train_loss": -10.848800659179688, "global_step": 260005, "epoch": 1547} {"train_loss": -10.857647895812988, "global_step": 260006, "epoch": 1547} {"train_loss": -10.628000259399414, "global_step": 260007, "epoch": 1547} {"train_loss": -10.440174102783203, "global_step": 260008, "epoch": 1547} {"train_loss": -10.7691011428833, "global_step": 260009, "epoch": 1547} {"train_loss": -11.038688659667969, "global_step": 260010, "epoch": 1547} {"train_loss": -11.243734359741211, "global_step": 260011, "epoch": 1547} {"train_loss": -11.274154663085938, "global_step": 260012, "epoch": 1547} {"train_loss": -10.935080528259277, "global_step": 260013, "epoch": 1547} {"train_loss": -11.471477508544922, "global_step": 260014, "epoch": 1547} {"train_loss": -11.461067199707031, "global_step": 260015, "epoch": 1547} {"train_loss": -11.410255432128906, "global_step": 260016, "epoch": 1547} {"train_loss": -11.589678764343262, "global_step": 260017, "epoch": 1547} {"train_loss": -11.301677703857422, "global_step": 260018, "epoch": 1547} {"train_loss": -11.620797157287598, "global_step": 260019, "epoch": 1547} {"train_loss": -11.601932525634766, "global_step": 260020, "epoch": 1547} {"train_loss": -11.510810852050781, "global_step": 260021, "epoch": 1547} {"train_loss": -11.439681053161621, "global_step": 260022, "epoch": 1547} {"train_loss": -11.776445388793945, "global_step": 260023, "epoch": 1547} {"train_loss": -11.446443557739258, "global_step": 260024, "epoch": 1547} {"train_loss": -11.485231399536133, "global_step": 260025, "epoch": 1547} {"train_loss": -11.651922225952148, "global_step": 260026, "epoch": 1547} {"train_loss": -11.67664909362793, "global_step": 260027, "epoch": 1547} {"train_loss": -11.5675048828125, "global_step": 260028, "epoch": 1547} {"train_loss": -11.721616744995117, "global_step": 260029, "epoch": 1547} {"train_loss": -11.667964935302734, "global_step": 260030, "epoch": 1547} {"train_loss": -11.48422622680664, "global_step": 260031, "epoch": 1547} {"train_loss": -11.632740020751953, "global_step": 260032, "epoch": 1547} {"train_loss": -11.604738235473633, "global_step": 260033, "epoch": 1547} {"train_loss": -11.656973838806152, "global_step": 260034, "epoch": 1547} {"train_loss": -11.734474182128906, "global_step": 260035, "epoch": 1547} {"train_loss": -11.850814819335938, "global_step": 260036, "epoch": 1547} {"train_loss": -11.74947738647461, "global_step": 260037, "epoch": 1547} {"train_loss": -11.734779357910156, "global_step": 260038, "epoch": 1547} {"train_loss": -11.854456901550293, "global_step": 260039, "epoch": 1547} {"train_loss": -11.898207664489746, "global_step": 260040, "epoch": 1547} {"train_loss": -11.801255226135254, "global_step": 260041, "epoch": 1547} {"train_loss": -11.954675674438477, "global_step": 260042, "epoch": 1547} {"train_loss": -11.86589241027832, "global_step": 260043, "epoch": 1547} {"train_loss": -11.71922492980957, "global_step": 260044, "epoch": 1547} {"train_loss": -12.014641761779785, "global_step": 260045, "epoch": 1547} {"train_loss": -11.978492736816406, "global_step": 260046, "epoch": 1547} {"train_loss": -11.927688598632812, "global_step": 260047, "epoch": 1547} {"train_loss": -11.771305084228516, "global_step": 260048, "epoch": 1547} {"train_loss": -12.004850387573242, "global_step": 260049, "epoch": 1547} {"train_loss": -11.932398796081543, "global_step": 260050, "epoch": 1547} {"train_loss": -11.82028579711914, "global_step": 260051, "epoch": 1547} {"train_loss": -11.896871566772461, "global_step": 260052, "epoch": 1547} {"train_loss": -11.855854034423828, "global_step": 260053, "epoch": 1547} {"train_loss": -11.998455047607422, "global_step": 260054, "epoch": 1547} {"train_loss": -11.844305038452148, "global_step": 260055, "epoch": 1547} {"train_loss": -11.992315292358398, "global_step": 260056, "epoch": 1547} {"train_loss": -12.027166366577148, "global_step": 260057, "epoch": 1547} {"train_loss": -11.997840881347656, "global_step": 260058, "epoch": 1547} {"train_loss": -12.029470443725586, "global_step": 260059, "epoch": 1547} {"train_loss": -12.141319274902344, "global_step": 260060, "epoch": 1547} {"train_loss": -12.216383934020996, "global_step": 260061, "epoch": 1547} {"train_loss": -11.993736267089844, "global_step": 260062, "epoch": 1547} {"train_loss": -11.400755859556652, "global_step": 260063, "epoch": 1547, "val_loss": 266033.84375} {"train_loss": -12.07449722290039, "global_step": 260064, "epoch": 1548} {"train_loss": -12.16934585571289, "global_step": 260065, "epoch": 1548} {"train_loss": -12.089435577392578, "global_step": 260066, "epoch": 1548} {"train_loss": -12.22445011138916, "global_step": 260067, "epoch": 1548} {"train_loss": -12.000213623046875, "global_step": 260068, "epoch": 1548} {"train_loss": -12.24038314819336, "global_step": 260069, "epoch": 1548} {"train_loss": -11.97841739654541, "global_step": 260070, "epoch": 1548} {"train_loss": -11.991750717163086, "global_step": 260071, "epoch": 1548} {"train_loss": -12.075443267822266, "global_step": 260072, "epoch": 1548} {"train_loss": -12.249231338500977, "global_step": 260073, "epoch": 1548} {"train_loss": -12.033376693725586, "global_step": 260074, "epoch": 1548} {"train_loss": -12.044692993164062, "global_step": 260075, "epoch": 1548} {"train_loss": -12.141206741333008, "global_step": 260076, "epoch": 1548} {"train_loss": -11.970428466796875, "global_step": 260077, "epoch": 1548} {"train_loss": -12.230012893676758, "global_step": 260078, "epoch": 1548} {"train_loss": -12.23421859741211, "global_step": 260079, "epoch": 1548} {"train_loss": -12.394237518310547, "global_step": 260080, "epoch": 1548} {"train_loss": -11.934383392333984, "global_step": 260081, "epoch": 1548} {"train_loss": -12.106217384338379, "global_step": 260082, "epoch": 1548} {"train_loss": -12.252824783325195, "global_step": 260083, "epoch": 1548} {"train_loss": -11.876967430114746, "global_step": 260084, "epoch": 1548} {"train_loss": -11.853349685668945, "global_step": 260085, "epoch": 1548} {"train_loss": -12.091228485107422, "global_step": 260086, "epoch": 1548} {"train_loss": -11.91826343536377, "global_step": 260087, "epoch": 1548} {"train_loss": -12.236661911010742, "global_step": 260088, "epoch": 1548} {"train_loss": -11.966628074645996, "global_step": 260089, "epoch": 1548} {"train_loss": -12.232891082763672, "global_step": 260090, "epoch": 1548} {"train_loss": -12.159561157226562, "global_step": 260091, "epoch": 1548} {"train_loss": -11.989953994750977, "global_step": 260092, "epoch": 1548} {"train_loss": -11.804866790771484, "global_step": 260093, "epoch": 1548} {"train_loss": -11.700959205627441, "global_step": 260094, "epoch": 1548} {"train_loss": -11.252500534057617, "global_step": 260095, "epoch": 1548} {"train_loss": -10.94863510131836, "global_step": 260096, "epoch": 1548} {"train_loss": -10.981802940368652, "global_step": 260097, "epoch": 1548} {"train_loss": -11.993640899658203, "global_step": 260098, "epoch": 1548} {"train_loss": -11.152032852172852, "global_step": 260099, "epoch": 1548} {"train_loss": -11.723581314086914, "global_step": 260100, "epoch": 1548} {"train_loss": -10.963984489440918, "global_step": 260101, "epoch": 1548} {"train_loss": -10.26441764831543, "global_step": 260102, "epoch": 1548} {"train_loss": -11.641692161560059, "global_step": 260103, "epoch": 1548} {"train_loss": -11.811885833740234, "global_step": 260104, "epoch": 1548} {"train_loss": -11.787282943725586, "global_step": 260105, "epoch": 1548} {"train_loss": -10.770753860473633, "global_step": 260106, "epoch": 1548} {"train_loss": -11.854869842529297, "global_step": 260107, "epoch": 1548} {"train_loss": -11.517905235290527, "global_step": 260108, "epoch": 1548} {"train_loss": -10.918533325195312, "global_step": 260109, "epoch": 1548} {"train_loss": -10.887630462646484, "global_step": 260110, "epoch": 1548} {"train_loss": -11.285965919494629, "global_step": 260111, "epoch": 1548} {"train_loss": -9.163774490356445, "global_step": 260112, "epoch": 1548} {"train_loss": -10.949346542358398, "global_step": 260113, "epoch": 1548} {"train_loss": -9.668441772460938, "global_step": 260114, "epoch": 1548} {"train_loss": -9.804922103881836, "global_step": 260115, "epoch": 1548} {"train_loss": -9.665504455566406, "global_step": 260116, "epoch": 1548} {"train_loss": -9.553850173950195, "global_step": 260117, "epoch": 1548} {"train_loss": -10.835636138916016, "global_step": 260118, "epoch": 1548} {"train_loss": -10.467580795288086, "global_step": 260119, "epoch": 1548} {"train_loss": -9.571858406066895, "global_step": 260120, "epoch": 1548} {"train_loss": -11.158796310424805, "global_step": 260121, "epoch": 1548} {"train_loss": -10.595682144165039, "global_step": 260122, "epoch": 1548} {"train_loss": -11.463839530944824, "global_step": 260123, "epoch": 1548} {"train_loss": -11.037978172302246, "global_step": 260124, "epoch": 1548} {"train_loss": -11.2747220993042, "global_step": 260125, "epoch": 1548} {"train_loss": -11.198001861572266, "global_step": 260126, "epoch": 1548} {"train_loss": -11.510437965393066, "global_step": 260127, "epoch": 1548} {"train_loss": -11.111244201660156, "global_step": 260128, "epoch": 1548} {"train_loss": -11.477435111999512, "global_step": 260129, "epoch": 1548} {"train_loss": -11.53531551361084, "global_step": 260130, "epoch": 1548} {"train_loss": -11.386261940002441, "global_step": 260131, "epoch": 1548} {"train_loss": -11.56161880493164, "global_step": 260132, "epoch": 1548} {"train_loss": -11.868345260620117, "global_step": 260133, "epoch": 1548} {"train_loss": -11.251901626586914, "global_step": 260134, "epoch": 1548} {"train_loss": -11.349756240844727, "global_step": 260135, "epoch": 1548} {"train_loss": -11.56921100616455, "global_step": 260136, "epoch": 1548} {"train_loss": -11.48345947265625, "global_step": 260137, "epoch": 1548} {"train_loss": -11.710101127624512, "global_step": 260138, "epoch": 1548} {"train_loss": -11.382227897644043, "global_step": 260139, "epoch": 1548} {"train_loss": -11.586625099182129, "global_step": 260140, "epoch": 1548} {"train_loss": -11.322172164916992, "global_step": 260141, "epoch": 1548} {"train_loss": -11.779577255249023, "global_step": 260142, "epoch": 1548} {"train_loss": -11.557214736938477, "global_step": 260143, "epoch": 1548} {"train_loss": -11.71731948852539, "global_step": 260144, "epoch": 1548} {"train_loss": -11.549705505371094, "global_step": 260145, "epoch": 1548} {"train_loss": -11.799955368041992, "global_step": 260146, "epoch": 1548} {"train_loss": -11.730043411254883, "global_step": 260147, "epoch": 1548} {"train_loss": -11.956530570983887, "global_step": 260148, "epoch": 1548} {"train_loss": -11.772732734680176, "global_step": 260149, "epoch": 1548} {"train_loss": -11.6742525100708, "global_step": 260150, "epoch": 1548} {"train_loss": -11.857213973999023, "global_step": 260151, "epoch": 1548} {"train_loss": -11.783187866210938, "global_step": 260152, "epoch": 1548} {"train_loss": -11.864562034606934, "global_step": 260153, "epoch": 1548} {"train_loss": -11.678842544555664, "global_step": 260154, "epoch": 1548} {"train_loss": -11.818195343017578, "global_step": 260155, "epoch": 1548} {"train_loss": -11.985750198364258, "global_step": 260156, "epoch": 1548} {"train_loss": -11.82999324798584, "global_step": 260157, "epoch": 1548} {"train_loss": -11.884401321411133, "global_step": 260158, "epoch": 1548} {"train_loss": -12.14106273651123, "global_step": 260159, "epoch": 1548} {"train_loss": -12.209030151367188, "global_step": 260160, "epoch": 1548} {"train_loss": -12.179452896118164, "global_step": 260161, "epoch": 1548} {"train_loss": -12.010477066040039, "global_step": 260162, "epoch": 1548} {"train_loss": -11.991559982299805, "global_step": 260163, "epoch": 1548} {"train_loss": -12.103094100952148, "global_step": 260164, "epoch": 1548} {"train_loss": -12.074234008789062, "global_step": 260165, "epoch": 1548} {"train_loss": -12.025240898132324, "global_step": 260166, "epoch": 1548} {"train_loss": -12.046747207641602, "global_step": 260167, "epoch": 1548} {"train_loss": -12.076106071472168, "global_step": 260168, "epoch": 1548} {"train_loss": -12.090667724609375, "global_step": 260169, "epoch": 1548} {"train_loss": -12.18374252319336, "global_step": 260170, "epoch": 1548} {"train_loss": -12.249246597290039, "global_step": 260171, "epoch": 1548} {"train_loss": -12.181511878967285, "global_step": 260172, "epoch": 1548} {"train_loss": -12.052388191223145, "global_step": 260173, "epoch": 1548} {"train_loss": -12.115377426147461, "global_step": 260174, "epoch": 1548} {"train_loss": -12.24204158782959, "global_step": 260175, "epoch": 1548} {"train_loss": -12.275639533996582, "global_step": 260176, "epoch": 1548} {"train_loss": -12.046652793884277, "global_step": 260177, "epoch": 1548} {"train_loss": -11.993141174316406, "global_step": 260178, "epoch": 1548} {"train_loss": -12.20030689239502, "global_step": 260179, "epoch": 1548} {"train_loss": -11.858860969543457, "global_step": 260180, "epoch": 1548} {"train_loss": -11.871566772460938, "global_step": 260181, "epoch": 1548} {"train_loss": -11.728078842163086, "global_step": 260182, "epoch": 1548} {"train_loss": -11.049033164978027, "global_step": 260183, "epoch": 1548} {"train_loss": -12.283926963806152, "global_step": 260184, "epoch": 1548} {"train_loss": -10.734945297241211, "global_step": 260185, "epoch": 1548} {"train_loss": -11.988054275512695, "global_step": 260186, "epoch": 1548} {"train_loss": -11.673938751220703, "global_step": 260187, "epoch": 1548} {"train_loss": -11.45196533203125, "global_step": 260188, "epoch": 1548} {"train_loss": -11.638928413391113, "global_step": 260189, "epoch": 1548} {"train_loss": -11.8562650680542, "global_step": 260190, "epoch": 1548} {"train_loss": -11.552227020263672, "global_step": 260191, "epoch": 1548} {"train_loss": -11.29434585571289, "global_step": 260192, "epoch": 1548} {"train_loss": -11.91386604309082, "global_step": 260193, "epoch": 1548} {"train_loss": -11.801015853881836, "global_step": 260194, "epoch": 1548} {"train_loss": -11.654712677001953, "global_step": 260195, "epoch": 1548} {"train_loss": -11.359049797058105, "global_step": 260196, "epoch": 1548} {"train_loss": -11.714746475219727, "global_step": 260197, "epoch": 1548} {"train_loss": -12.00958251953125, "global_step": 260198, "epoch": 1548} {"train_loss": -11.500856399536133, "global_step": 260199, "epoch": 1548} {"train_loss": -12.010368347167969, "global_step": 260200, "epoch": 1548} {"train_loss": -11.723922729492188, "global_step": 260201, "epoch": 1548} {"train_loss": -12.07491397857666, "global_step": 260202, "epoch": 1548} {"train_loss": -12.02503490447998, "global_step": 260203, "epoch": 1548} {"train_loss": -11.999286651611328, "global_step": 260204, "epoch": 1548} {"train_loss": -12.122215270996094, "global_step": 260205, "epoch": 1548} {"train_loss": -12.185809135437012, "global_step": 260206, "epoch": 1548} {"train_loss": -12.10509204864502, "global_step": 260207, "epoch": 1548} {"train_loss": -12.28933334350586, "global_step": 260208, "epoch": 1548} {"train_loss": -12.115287780761719, "global_step": 260209, "epoch": 1548} {"train_loss": -12.236268997192383, "global_step": 260210, "epoch": 1548} {"train_loss": -12.049703598022461, "global_step": 260211, "epoch": 1548} {"train_loss": -12.031000137329102, "global_step": 260212, "epoch": 1548} {"train_loss": -12.119966506958008, "global_step": 260213, "epoch": 1548} {"train_loss": -12.195581436157227, "global_step": 260214, "epoch": 1548} {"train_loss": -11.61848258972168, "global_step": 260215, "epoch": 1548} {"train_loss": -11.947413444519043, "global_step": 260216, "epoch": 1548} {"train_loss": -11.369888305664062, "global_step": 260217, "epoch": 1548} {"train_loss": -11.557758331298828, "global_step": 260218, "epoch": 1548} {"train_loss": -11.816947937011719, "global_step": 260219, "epoch": 1548} {"train_loss": -12.02354621887207, "global_step": 260220, "epoch": 1548} {"train_loss": -11.411772727966309, "global_step": 260221, "epoch": 1548} {"train_loss": -11.774548530578613, "global_step": 260222, "epoch": 1548} {"train_loss": -11.712076187133789, "global_step": 260223, "epoch": 1548} {"train_loss": -12.037080764770508, "global_step": 260224, "epoch": 1548} {"train_loss": -11.958261489868164, "global_step": 260225, "epoch": 1548} {"train_loss": -11.455832481384277, "global_step": 260226, "epoch": 1548} {"train_loss": -11.3870267868042, "global_step": 260227, "epoch": 1548} {"train_loss": -11.78943920135498, "global_step": 260228, "epoch": 1548} {"train_loss": -12.144365310668945, "global_step": 260229, "epoch": 1548} {"train_loss": -11.373872756958008, "global_step": 260230, "epoch": 1548} {"train_loss": -11.681128933316185, "global_step": 260231, "epoch": 1548, "val_loss": 269787.71875} {"train_loss": -11.369917869567871, "global_step": 260232, "epoch": 1549} {"train_loss": -11.954916000366211, "global_step": 260233, "epoch": 1549} {"train_loss": -11.375900268554688, "global_step": 260234, "epoch": 1549} {"train_loss": -11.149723052978516, "global_step": 260235, "epoch": 1549} {"train_loss": -11.25840950012207, "global_step": 260236, "epoch": 1549} {"train_loss": -11.820066452026367, "global_step": 260237, "epoch": 1549} {"train_loss": -11.942144393920898, "global_step": 260238, "epoch": 1549} {"train_loss": -11.53446102142334, "global_step": 260239, "epoch": 1549} {"train_loss": -11.966995239257812, "global_step": 260240, "epoch": 1549} {"train_loss": -11.758650779724121, "global_step": 260241, "epoch": 1549} {"train_loss": -11.895553588867188, "global_step": 260242, "epoch": 1549} {"train_loss": -11.957386016845703, "global_step": 260243, "epoch": 1549} {"train_loss": -11.612767219543457, "global_step": 260244, "epoch": 1549} {"train_loss": -11.721982955932617, "global_step": 260245, "epoch": 1549} {"train_loss": -11.606167793273926, "global_step": 260246, "epoch": 1549} {"train_loss": -11.53877067565918, "global_step": 260247, "epoch": 1549} {"train_loss": -10.87282943725586, "global_step": 260248, "epoch": 1549} {"train_loss": -11.586549758911133, "global_step": 260249, "epoch": 1549} {"train_loss": -11.34946346282959, "global_step": 260250, "epoch": 1549} {"train_loss": -10.166952133178711, "global_step": 260251, "epoch": 1549} {"train_loss": -11.662020683288574, "global_step": 260252, "epoch": 1549} {"train_loss": -10.988704681396484, "global_step": 260253, "epoch": 1549} {"train_loss": -10.706159591674805, "global_step": 260254, "epoch": 1549} {"train_loss": -11.466724395751953, "global_step": 260255, "epoch": 1549} {"train_loss": -9.43031120300293, "global_step": 260256, "epoch": 1549} {"train_loss": -11.17160701751709, "global_step": 260257, "epoch": 1549} {"train_loss": -10.14901351928711, "global_step": 260258, "epoch": 1549} {"train_loss": -10.567424774169922, "global_step": 260259, "epoch": 1549} {"train_loss": -11.643304824829102, "global_step": 260260, "epoch": 1549} {"train_loss": -10.065528869628906, "global_step": 260261, "epoch": 1549} {"train_loss": -11.562003135681152, "global_step": 260262, "epoch": 1549} {"train_loss": -9.54193115234375, "global_step": 260263, "epoch": 1549} {"train_loss": -10.067702293395996, "global_step": 260264, "epoch": 1549} {"train_loss": -11.113020896911621, "global_step": 260265, "epoch": 1549} {"train_loss": -10.841543197631836, "global_step": 260266, "epoch": 1549} {"train_loss": -11.73507308959961, "global_step": 260267, "epoch": 1549} {"train_loss": -11.079736709594727, "global_step": 260268, "epoch": 1549} {"train_loss": -10.557267189025879, "global_step": 260269, "epoch": 1549} {"train_loss": -11.671652793884277, "global_step": 260270, "epoch": 1549} {"train_loss": -10.336130142211914, "global_step": 260271, "epoch": 1549} {"train_loss": -11.063824653625488, "global_step": 260272, "epoch": 1549} {"train_loss": -11.081136703491211, "global_step": 260273, "epoch": 1549} {"train_loss": -10.225465774536133, "global_step": 260274, "epoch": 1549} {"train_loss": -11.47361946105957, "global_step": 260275, "epoch": 1549} {"train_loss": -11.150779724121094, "global_step": 260276, "epoch": 1549} {"train_loss": -11.331459045410156, "global_step": 260277, "epoch": 1549} {"train_loss": -11.715570449829102, "global_step": 260278, "epoch": 1549} {"train_loss": -10.912906646728516, "global_step": 260279, "epoch": 1549} {"train_loss": -11.352739334106445, "global_step": 260280, "epoch": 1549} {"train_loss": -11.247285842895508, "global_step": 260281, "epoch": 1549} {"train_loss": -11.318891525268555, "global_step": 260282, "epoch": 1549} {"train_loss": -11.362781524658203, "global_step": 260283, "epoch": 1549} {"train_loss": -11.00126838684082, "global_step": 260284, "epoch": 1549} {"train_loss": -11.26152515411377, "global_step": 260285, "epoch": 1549} {"train_loss": -11.31052017211914, "global_step": 260286, "epoch": 1549} {"train_loss": -10.830007553100586, "global_step": 260287, "epoch": 1549} {"train_loss": -11.43195915222168, "global_step": 260288, "epoch": 1549} {"train_loss": -11.044960021972656, "global_step": 260289, "epoch": 1549} {"train_loss": -11.22170352935791, "global_step": 260290, "epoch": 1549} {"train_loss": -11.40314769744873, "global_step": 260291, "epoch": 1549} {"train_loss": -11.567119598388672, "global_step": 260292, "epoch": 1549} {"train_loss": -11.466782569885254, "global_step": 260293, "epoch": 1549} {"train_loss": -11.32131290435791, "global_step": 260294, "epoch": 1549} {"train_loss": -11.594202041625977, "global_step": 260295, "epoch": 1549} {"train_loss": -11.347554206848145, "global_step": 260296, "epoch": 1549} {"train_loss": -11.648788452148438, "global_step": 260297, "epoch": 1549} {"train_loss": -11.623767852783203, "global_step": 260298, "epoch": 1549} {"train_loss": -11.689461708068848, "global_step": 260299, "epoch": 1549} {"train_loss": -11.45370101928711, "global_step": 260300, "epoch": 1549} {"train_loss": -11.945745468139648, "global_step": 260301, "epoch": 1549} {"train_loss": -11.480964660644531, "global_step": 260302, "epoch": 1549} {"train_loss": -11.701860427856445, "global_step": 260303, "epoch": 1549} {"train_loss": -11.75284194946289, "global_step": 260304, "epoch": 1549} {"train_loss": -11.666336059570312, "global_step": 260305, "epoch": 1549} {"train_loss": -11.814498901367188, "global_step": 260306, "epoch": 1549} {"train_loss": -11.220508575439453, "global_step": 260307, "epoch": 1549} {"train_loss": -11.332042694091797, "global_step": 260308, "epoch": 1549} {"train_loss": -11.64748764038086, "global_step": 260309, "epoch": 1549} {"train_loss": -11.529542922973633, "global_step": 260310, "epoch": 1549} {"train_loss": -11.783342361450195, "global_step": 260311, "epoch": 1549} {"train_loss": -11.210896492004395, "global_step": 260312, "epoch": 1549} {"train_loss": -11.655322074890137, "global_step": 260313, "epoch": 1549} {"train_loss": -11.523676872253418, "global_step": 260314, "epoch": 1549} {"train_loss": -11.532493591308594, "global_step": 260315, "epoch": 1549} {"train_loss": -12.027359008789062, "global_step": 260316, "epoch": 1549} {"train_loss": -11.816671371459961, "global_step": 260317, "epoch": 1549} {"train_loss": -11.876922607421875, "global_step": 260318, "epoch": 1549} {"train_loss": -11.78849983215332, "global_step": 260319, "epoch": 1549} {"train_loss": -11.722711563110352, "global_step": 260320, "epoch": 1549} {"train_loss": -12.082321166992188, "global_step": 260321, "epoch": 1549} {"train_loss": -11.663961410522461, "global_step": 260322, "epoch": 1549} {"train_loss": -11.436102867126465, "global_step": 260323, "epoch": 1549} {"train_loss": -11.476872444152832, "global_step": 260324, "epoch": 1549} {"train_loss": -11.431451797485352, "global_step": 260325, "epoch": 1549} {"train_loss": -11.926345825195312, "global_step": 260326, "epoch": 1549} {"train_loss": -11.561908721923828, "global_step": 260327, "epoch": 1549} {"train_loss": -11.768529891967773, "global_step": 260328, "epoch": 1549} {"train_loss": -11.802099227905273, "global_step": 260329, "epoch": 1549} {"train_loss": -11.314793586730957, "global_step": 260330, "epoch": 1549} {"train_loss": -11.900245666503906, "global_step": 260331, "epoch": 1549} {"train_loss": -11.676494598388672, "global_step": 260332, "epoch": 1549} {"train_loss": -11.62382698059082, "global_step": 260333, "epoch": 1549} {"train_loss": -11.834110260009766, "global_step": 260334, "epoch": 1549} {"train_loss": -11.621986389160156, "global_step": 260335, "epoch": 1549} {"train_loss": -11.887039184570312, "global_step": 260336, "epoch": 1549} {"train_loss": -11.739770889282227, "global_step": 260337, "epoch": 1549} {"train_loss": -11.96025562286377, "global_step": 260338, "epoch": 1549} {"train_loss": -11.764644622802734, "global_step": 260339, "epoch": 1549} {"train_loss": -12.057921409606934, "global_step": 260340, "epoch": 1549} {"train_loss": -11.751548767089844, "global_step": 260341, "epoch": 1549} {"train_loss": -11.679652214050293, "global_step": 260342, "epoch": 1549} {"train_loss": -12.185456275939941, "global_step": 260343, "epoch": 1549} {"train_loss": -11.743302345275879, "global_step": 260344, "epoch": 1549} {"train_loss": -12.14320182800293, "global_step": 260345, "epoch": 1549} {"train_loss": -11.952362060546875, "global_step": 260346, "epoch": 1549} {"train_loss": -11.905923843383789, "global_step": 260347, "epoch": 1549} {"train_loss": -12.092460632324219, "global_step": 260348, "epoch": 1549} {"train_loss": -11.845361709594727, "global_step": 260349, "epoch": 1549} {"train_loss": -12.234457015991211, "global_step": 260350, "epoch": 1549} {"train_loss": -11.755072593688965, "global_step": 260351, "epoch": 1549} {"train_loss": -12.028753280639648, "global_step": 260352, "epoch": 1549} {"train_loss": -11.879737854003906, "global_step": 260353, "epoch": 1549} {"train_loss": -12.201522827148438, "global_step": 260354, "epoch": 1549} {"train_loss": -11.939103126525879, "global_step": 260355, "epoch": 1549} {"train_loss": -12.028512954711914, "global_step": 260356, "epoch": 1549} {"train_loss": -12.151138305664062, "global_step": 260357, "epoch": 1549} {"train_loss": -12.010705947875977, "global_step": 260358, "epoch": 1549} {"train_loss": -12.086528778076172, "global_step": 260359, "epoch": 1549} {"train_loss": -12.224882125854492, "global_step": 260360, "epoch": 1549} {"train_loss": -12.029356002807617, "global_step": 260361, "epoch": 1549} {"train_loss": -12.161819458007812, "global_step": 260362, "epoch": 1549} {"train_loss": -11.768339157104492, "global_step": 260363, "epoch": 1549} {"train_loss": -12.353248596191406, "global_step": 260364, "epoch": 1549} {"train_loss": -12.030561447143555, "global_step": 260365, "epoch": 1549} {"train_loss": -12.197199821472168, "global_step": 260366, "epoch": 1549} {"train_loss": -12.037773132324219, "global_step": 260367, "epoch": 1549} {"train_loss": -11.894039154052734, "global_step": 260368, "epoch": 1549} {"train_loss": -12.008854866027832, "global_step": 260369, "epoch": 1549} {"train_loss": -12.119596481323242, "global_step": 260370, "epoch": 1549} {"train_loss": -12.139165878295898, "global_step": 260371, "epoch": 1549} {"train_loss": -12.086207389831543, "global_step": 260372, "epoch": 1549} {"train_loss": -11.963521003723145, "global_step": 260373, "epoch": 1549} {"train_loss": -12.263690948486328, "global_step": 260374, "epoch": 1549} {"train_loss": -12.281606674194336, "global_step": 260375, "epoch": 1549} {"train_loss": -12.04909896850586, "global_step": 260376, "epoch": 1549} {"train_loss": -12.035683631896973, "global_step": 260377, "epoch": 1549} {"train_loss": -11.88036823272705, "global_step": 260378, "epoch": 1549} {"train_loss": -11.727277755737305, "global_step": 260379, "epoch": 1549} {"train_loss": -12.330810546875, "global_step": 260380, "epoch": 1549} {"train_loss": -11.890178680419922, "global_step": 260381, "epoch": 1549} {"train_loss": -11.63726806640625, "global_step": 260382, "epoch": 1549} {"train_loss": -11.733829498291016, "global_step": 260383, "epoch": 1549} {"train_loss": -11.855342864990234, "global_step": 260384, "epoch": 1549} {"train_loss": -11.463929176330566, "global_step": 260385, "epoch": 1549} {"train_loss": -11.999690055847168, "global_step": 260386, "epoch": 1549} {"train_loss": -11.656641006469727, "global_step": 260387, "epoch": 1549} {"train_loss": -11.072609901428223, "global_step": 260388, "epoch": 1549} {"train_loss": -11.292798042297363, "global_step": 260389, "epoch": 1549} {"train_loss": -11.892860412597656, "global_step": 260390, "epoch": 1549} {"train_loss": -11.622920036315918, "global_step": 260391, "epoch": 1549} {"train_loss": -11.040220260620117, "global_step": 260392, "epoch": 1549} {"train_loss": -11.80877685546875, "global_step": 260393, "epoch": 1549} {"train_loss": -11.786376953125, "global_step": 260394, "epoch": 1549} {"train_loss": -12.14809799194336, "global_step": 260395, "epoch": 1549} {"train_loss": -11.623554229736328, "global_step": 260396, "epoch": 1549} {"train_loss": -11.792956352233887, "global_step": 260397, "epoch": 1549} {"train_loss": -11.5586519241333, "global_step": 260398, "epoch": 1549} {"train_loss": -11.57373533362434, "global_step": 260399, "epoch": 1549, "val_loss": 270299.03125} {"train_loss": -10.947744369506836, "global_step": 260400, "epoch": 1550} {"train_loss": -11.932504653930664, "global_step": 260401, "epoch": 1550} {"train_loss": -11.227931022644043, "global_step": 260402, "epoch": 1550} {"train_loss": -11.631939888000488, "global_step": 260403, "epoch": 1550} {"train_loss": -11.366720199584961, "global_step": 260404, "epoch": 1550} {"train_loss": -11.783304214477539, "global_step": 260405, "epoch": 1550} {"train_loss": -11.83735466003418, "global_step": 260406, "epoch": 1550} {"train_loss": -11.60963249206543, "global_step": 260407, "epoch": 1550} {"train_loss": -11.915338516235352, "global_step": 260408, "epoch": 1550} {"train_loss": -11.792014122009277, "global_step": 260409, "epoch": 1550} {"train_loss": -11.559711456298828, "global_step": 260410, "epoch": 1550} {"train_loss": -11.85655403137207, "global_step": 260411, "epoch": 1550} {"train_loss": -11.741775512695312, "global_step": 260412, "epoch": 1550} {"train_loss": -11.39537525177002, "global_step": 260413, "epoch": 1550} {"train_loss": -11.512948989868164, "global_step": 260414, "epoch": 1550} {"train_loss": -11.791885375976562, "global_step": 260415, "epoch": 1550} {"train_loss": -10.825943946838379, "global_step": 260416, "epoch": 1550} {"train_loss": -11.443881034851074, "global_step": 260417, "epoch": 1550} {"train_loss": -11.34522819519043, "global_step": 260418, "epoch": 1550} {"train_loss": -11.068857192993164, "global_step": 260419, "epoch": 1550} {"train_loss": -11.920348167419434, "global_step": 260420, "epoch": 1550} {"train_loss": -10.940130233764648, "global_step": 260421, "epoch": 1550} {"train_loss": -11.44451904296875, "global_step": 260422, "epoch": 1550} {"train_loss": -11.701883316040039, "global_step": 260423, "epoch": 1550} {"train_loss": -11.467975616455078, "global_step": 260424, "epoch": 1550} {"train_loss": -11.867952346801758, "global_step": 260425, "epoch": 1550} {"train_loss": -11.595436096191406, "global_step": 260426, "epoch": 1550} {"train_loss": -11.285943984985352, "global_step": 260427, "epoch": 1550} {"train_loss": -11.959382057189941, "global_step": 260428, "epoch": 1550} {"train_loss": -11.365903854370117, "global_step": 260429, "epoch": 1550} {"train_loss": -11.755017280578613, "global_step": 260430, "epoch": 1550} {"train_loss": -11.82705307006836, "global_step": 260431, "epoch": 1550} {"train_loss": -11.695758819580078, "global_step": 260432, "epoch": 1550} {"train_loss": -11.662471771240234, "global_step": 260433, "epoch": 1550} {"train_loss": -11.617507934570312, "global_step": 260434, "epoch": 1550} {"train_loss": -11.707651138305664, "global_step": 260435, "epoch": 1550} {"train_loss": -11.92095947265625, "global_step": 260436, "epoch": 1550} {"train_loss": -11.852682113647461, "global_step": 260437, "epoch": 1550} {"train_loss": -11.750171661376953, "global_step": 260438, "epoch": 1550} {"train_loss": -11.785045623779297, "global_step": 260439, "epoch": 1550} {"train_loss": -12.079334259033203, "global_step": 260440, "epoch": 1550} {"train_loss": -11.802305221557617, "global_step": 260441, "epoch": 1550} {"train_loss": -11.905118942260742, "global_step": 260442, "epoch": 1550} {"train_loss": -11.651062965393066, "global_step": 260443, "epoch": 1550} {"train_loss": -12.124051094055176, "global_step": 260444, "epoch": 1550} {"train_loss": -11.822486877441406, "global_step": 260445, "epoch": 1550} {"train_loss": -12.286630630493164, "global_step": 260446, "epoch": 1550} {"train_loss": -11.893577575683594, "global_step": 260447, "epoch": 1550} {"train_loss": -12.112253189086914, "global_step": 260448, "epoch": 1550} {"train_loss": -11.966801643371582, "global_step": 260449, "epoch": 1550} {"train_loss": -12.115575790405273, "global_step": 260450, "epoch": 1550} {"train_loss": -11.749159812927246, "global_step": 260451, "epoch": 1550} {"train_loss": -12.21373462677002, "global_step": 260452, "epoch": 1550} {"train_loss": -12.109025955200195, "global_step": 260453, "epoch": 1550} {"train_loss": -11.997572898864746, "global_step": 260454, "epoch": 1550} {"train_loss": -12.17842960357666, "global_step": 260455, "epoch": 1550} {"train_loss": -11.858427047729492, "global_step": 260456, "epoch": 1550} {"train_loss": -11.919742584228516, "global_step": 260457, "epoch": 1550} {"train_loss": -12.085837364196777, "global_step": 260458, "epoch": 1550} {"train_loss": -11.997169494628906, "global_step": 260459, "epoch": 1550} {"train_loss": -11.960508346557617, "global_step": 260460, "epoch": 1550} {"train_loss": -12.182379722595215, "global_step": 260461, "epoch": 1550} {"train_loss": -12.27645206451416, "global_step": 260462, "epoch": 1550} {"train_loss": -12.026712417602539, "global_step": 260463, "epoch": 1550} {"train_loss": -12.249553680419922, "global_step": 260464, "epoch": 1550} {"train_loss": -12.383026123046875, "global_step": 260465, "epoch": 1550} {"train_loss": -12.302221298217773, "global_step": 260466, "epoch": 1550} {"train_loss": -11.958162307739258, "global_step": 260467, "epoch": 1550} {"train_loss": -12.244524955749512, "global_step": 260468, "epoch": 1550} {"train_loss": -12.193315505981445, "global_step": 260469, "epoch": 1550} {"train_loss": -12.198078155517578, "global_step": 260470, "epoch": 1550} {"train_loss": -11.912391662597656, "global_step": 260471, "epoch": 1550} {"train_loss": -12.252188682556152, "global_step": 260472, "epoch": 1550} {"train_loss": -11.69047737121582, "global_step": 260473, "epoch": 1550} {"train_loss": -11.262609481811523, "global_step": 260474, "epoch": 1550} {"train_loss": -11.446943283081055, "global_step": 260475, "epoch": 1550} {"train_loss": -12.270419120788574, "global_step": 260476, "epoch": 1550} {"train_loss": -11.911235809326172, "global_step": 260477, "epoch": 1550} {"train_loss": -12.203015327453613, "global_step": 260478, "epoch": 1550} {"train_loss": -11.89688777923584, "global_step": 260479, "epoch": 1550} {"train_loss": -12.025810241699219, "global_step": 260480, "epoch": 1550} {"train_loss": -11.909656524658203, "global_step": 260481, "epoch": 1550} {"train_loss": -11.551636695861816, "global_step": 260482, "epoch": 1550} {"train_loss": -11.496047973632812, "global_step": 260483, "epoch": 1550} {"train_loss": -12.30073356628418, "global_step": 260484, "epoch": 1550} {"train_loss": -11.961280822753906, "global_step": 260485, "epoch": 1550} {"train_loss": -11.926636695861816, "global_step": 260486, "epoch": 1550} {"train_loss": -11.876696586608887, "global_step": 260487, "epoch": 1550} {"train_loss": -11.2300443649292, "global_step": 260488, "epoch": 1550} {"train_loss": -11.84200668334961, "global_step": 260489, "epoch": 1550} {"train_loss": -12.01154899597168, "global_step": 260490, "epoch": 1550} {"train_loss": -11.376052856445312, "global_step": 260491, "epoch": 1550} {"train_loss": -11.313760757446289, "global_step": 260492, "epoch": 1550} {"train_loss": -12.077483177185059, "global_step": 260493, "epoch": 1550} {"train_loss": -11.101641654968262, "global_step": 260494, "epoch": 1550} {"train_loss": -11.862773895263672, "global_step": 260495, "epoch": 1550} {"train_loss": -11.494097709655762, "global_step": 260496, "epoch": 1550} {"train_loss": -11.987930297851562, "global_step": 260497, "epoch": 1550} {"train_loss": -11.644342422485352, "global_step": 260498, "epoch": 1550} {"train_loss": -11.877470016479492, "global_step": 260499, "epoch": 1550} {"train_loss": -11.433115005493164, "global_step": 260500, "epoch": 1550} {"train_loss": -11.333869934082031, "global_step": 260501, "epoch": 1550} {"train_loss": -11.31328296661377, "global_step": 260502, "epoch": 1550} {"train_loss": -11.564834594726562, "global_step": 260503, "epoch": 1550} {"train_loss": -11.432893753051758, "global_step": 260504, "epoch": 1550} {"train_loss": -11.852584838867188, "global_step": 260505, "epoch": 1550} {"train_loss": -11.80956745147705, "global_step": 260506, "epoch": 1550} {"train_loss": -11.867137908935547, "global_step": 260507, "epoch": 1550} {"train_loss": -11.777454376220703, "global_step": 260508, "epoch": 1550} {"train_loss": -11.055397033691406, "global_step": 260509, "epoch": 1550} {"train_loss": -11.816271781921387, "global_step": 260510, "epoch": 1550} {"train_loss": -11.875396728515625, "global_step": 260511, "epoch": 1550} {"train_loss": -10.98617935180664, "global_step": 260512, "epoch": 1550} {"train_loss": -11.166109085083008, "global_step": 260513, "epoch": 1550} {"train_loss": -11.909957885742188, "global_step": 260514, "epoch": 1550} {"train_loss": -11.100650787353516, "global_step": 260515, "epoch": 1550} {"train_loss": -11.026714324951172, "global_step": 260516, "epoch": 1550} {"train_loss": -10.863852500915527, "global_step": 260517, "epoch": 1550} {"train_loss": -10.363985061645508, "global_step": 260518, "epoch": 1550} {"train_loss": -10.612837791442871, "global_step": 260519, "epoch": 1550} {"train_loss": -10.209565162658691, "global_step": 260520, "epoch": 1550} {"train_loss": -9.514457702636719, "global_step": 260521, "epoch": 1550} {"train_loss": -11.262165069580078, "global_step": 260522, "epoch": 1550} {"train_loss": -8.655011177062988, "global_step": 260523, "epoch": 1550} {"train_loss": -10.544978141784668, "global_step": 260524, "epoch": 1550} {"train_loss": -9.167451858520508, "global_step": 260525, "epoch": 1550} {"train_loss": -10.171947479248047, "global_step": 260526, "epoch": 1550} {"train_loss": -9.121424674987793, "global_step": 260527, "epoch": 1550} {"train_loss": -10.695698738098145, "global_step": 260528, "epoch": 1550} {"train_loss": -10.181638717651367, "global_step": 260529, "epoch": 1550} {"train_loss": -11.24510669708252, "global_step": 260530, "epoch": 1550} {"train_loss": -9.669269561767578, "global_step": 260531, "epoch": 1550} {"train_loss": -11.045419692993164, "global_step": 260532, "epoch": 1550} {"train_loss": -9.796693801879883, "global_step": 260533, "epoch": 1550} {"train_loss": -9.750143051147461, "global_step": 260534, "epoch": 1550} {"train_loss": -10.569786071777344, "global_step": 260535, "epoch": 1550} {"train_loss": -11.031143188476562, "global_step": 260536, "epoch": 1550} {"train_loss": -10.769475936889648, "global_step": 260537, "epoch": 1550} {"train_loss": -10.754719734191895, "global_step": 260538, "epoch": 1550} {"train_loss": -10.887564659118652, "global_step": 260539, "epoch": 1550} {"train_loss": -10.545646667480469, "global_step": 260540, "epoch": 1550} {"train_loss": -11.20050048828125, "global_step": 260541, "epoch": 1550} {"train_loss": -11.069097518920898, "global_step": 260542, "epoch": 1550} {"train_loss": -10.597773551940918, "global_step": 260543, "epoch": 1550} {"train_loss": -11.736246109008789, "global_step": 260544, "epoch": 1550} {"train_loss": -10.451745986938477, "global_step": 260545, "epoch": 1550} {"train_loss": -11.366348266601562, "global_step": 260546, "epoch": 1550} {"train_loss": -11.304014205932617, "global_step": 260547, "epoch": 1550} {"train_loss": -11.27680778503418, "global_step": 260548, "epoch": 1550} {"train_loss": -11.316155433654785, "global_step": 260549, "epoch": 1550} {"train_loss": -11.174025535583496, "global_step": 260550, "epoch": 1550} {"train_loss": -11.42362117767334, "global_step": 260551, "epoch": 1550} {"train_loss": -11.053136825561523, "global_step": 260552, "epoch": 1550} {"train_loss": -11.53715705871582, "global_step": 260553, "epoch": 1550} {"train_loss": -11.481169700622559, "global_step": 260554, "epoch": 1550} {"train_loss": -11.234098434448242, "global_step": 260555, "epoch": 1550} {"train_loss": -11.254196166992188, "global_step": 260556, "epoch": 1550} {"train_loss": -11.648807525634766, "global_step": 260557, "epoch": 1550} {"train_loss": -11.548845291137695, "global_step": 260558, "epoch": 1550} {"train_loss": -11.712299346923828, "global_step": 260559, "epoch": 1550} {"train_loss": -11.613814353942871, "global_step": 260560, "epoch": 1550} {"train_loss": -11.356689453125, "global_step": 260561, "epoch": 1550} {"train_loss": -11.798979759216309, "global_step": 260562, "epoch": 1550} {"train_loss": -11.569437026977539, "global_step": 260563, "epoch": 1550} {"train_loss": -11.697150230407715, "global_step": 260564, "epoch": 1550} {"train_loss": -11.651597023010254, "global_step": 260565, "epoch": 1550} {"train_loss": -11.801876068115234, "global_step": 260566, "epoch": 1550} {"train_loss": -11.484817510559445, "global_step": 260567, "epoch": 1550, "train/sim_max_reward_0": 0.6814351642068501, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.000602799941621592, "train/sim_max_reward_3": 0.18163846693312138, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.592728207433612, "test/sim_max_reward_4400000": 0.9692536146587069, "test/sim_max_reward_4400001": 0.37366590998276206, "test/sim_max_reward_4400002": 0.5008732333927881, "test/sim_max_reward_4400003": 0.945387793705728, "test/sim_max_reward_4400004": 0.8341499450584281, "test/sim_max_reward_4400005": 0.07193205657960355, "test/sim_max_reward_4400006": 0.9177186663158894, "test/sim_max_reward_4400007": 0.521042779825717, "test/sim_max_reward_4400008": 0.6487330126849903, "test/sim_max_reward_4400009": 0.389755681529828, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 0.28141669882051623, "test/sim_max_reward_4400012": 0.9897614438560293, "test/sim_max_reward_4400013": 0.9872427989472451, "test/sim_max_reward_4400014": 0.9825378586035313, "test/sim_max_reward_4400015": 0.5588245667533879, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.12507708322968722, "test/sim_max_reward_4400018": 0.42977127078920785, "test/sim_max_reward_4400019": 0.40729047180209255, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.6075593966996733, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6536741334925302, "test/sim_max_reward_4400026": 0.06922732456302526, "test/sim_max_reward_4400027": 0.9945974863521517, "test/sim_max_reward_4400028": 0.9046765792862062, "test/sim_max_reward_4400029": 0.49282315589044184, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9925644403607852, "test/sim_max_reward_4400032": 0.00020214225778002336, "test/sim_max_reward_4400033": 0.36916911229362953, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.3359210825981823, "test/sim_max_reward_4400036": 0.9642051499285095, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.4118473413750337, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.1542298030169238, "test/sim_max_reward_4400042": 0.042153207192473535, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.9881233526916914, "test/sim_max_reward_4400046": 0.830406142869821, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.5760674397525342, "test/mean_score": 0.5768824276845328, "val_loss": 269580.59375, "train_action_mse_error": 4.099532127380371} {"train_loss": -11.365575790405273, "global_step": 260568, "epoch": 1551} {"train_loss": -11.47592544555664, "global_step": 260569, "epoch": 1551} {"train_loss": -11.687877655029297, "global_step": 260570, "epoch": 1551} {"train_loss": -11.673444747924805, "global_step": 260571, "epoch": 1551} {"train_loss": -11.883745193481445, "global_step": 260572, "epoch": 1551} {"train_loss": -11.58658218383789, "global_step": 260573, "epoch": 1551} {"train_loss": -11.900461196899414, "global_step": 260574, "epoch": 1551} {"train_loss": -11.684993743896484, "global_step": 260575, "epoch": 1551} {"train_loss": -11.883414268493652, "global_step": 260576, "epoch": 1551} {"train_loss": -11.659351348876953, "global_step": 260577, "epoch": 1551} {"train_loss": -11.974464416503906, "global_step": 260578, "epoch": 1551} {"train_loss": -11.917861938476562, "global_step": 260579, "epoch": 1551} {"train_loss": -11.946708679199219, "global_step": 260580, "epoch": 1551} {"train_loss": -11.824342727661133, "global_step": 260581, "epoch": 1551} {"train_loss": -11.893080711364746, "global_step": 260582, "epoch": 1551} {"train_loss": -11.936399459838867, "global_step": 260583, "epoch": 1551} {"train_loss": -11.69147777557373, "global_step": 260584, "epoch": 1551} {"train_loss": -11.659269332885742, "global_step": 260585, "epoch": 1551} {"train_loss": -11.692743301391602, "global_step": 260586, "epoch": 1551} {"train_loss": -11.914200782775879, "global_step": 260587, "epoch": 1551} {"train_loss": -11.767160415649414, "global_step": 260588, "epoch": 1551} {"train_loss": -11.803653717041016, "global_step": 260589, "epoch": 1551} {"train_loss": -11.842430114746094, "global_step": 260590, "epoch": 1551} {"train_loss": -11.885390281677246, "global_step": 260591, "epoch": 1551} {"train_loss": -11.762144088745117, "global_step": 260592, "epoch": 1551} {"train_loss": -11.671634674072266, "global_step": 260593, "epoch": 1551} {"train_loss": -11.955570220947266, "global_step": 260594, "epoch": 1551} {"train_loss": -11.915148735046387, "global_step": 260595, "epoch": 1551} {"train_loss": -11.667458534240723, "global_step": 260596, "epoch": 1551} {"train_loss": -11.84439468383789, "global_step": 260597, "epoch": 1551} {"train_loss": -11.807424545288086, "global_step": 260598, "epoch": 1551} {"train_loss": -11.264223098754883, "global_step": 260599, "epoch": 1551} {"train_loss": -11.817481994628906, "global_step": 260600, "epoch": 1551} {"train_loss": -11.486913681030273, "global_step": 260601, "epoch": 1551} {"train_loss": -11.868383407592773, "global_step": 260602, "epoch": 1551} {"train_loss": -11.995651245117188, "global_step": 260603, "epoch": 1551} {"train_loss": -11.758184432983398, "global_step": 260604, "epoch": 1551} {"train_loss": -12.028545379638672, "global_step": 260605, "epoch": 1551} {"train_loss": -11.833839416503906, "global_step": 260606, "epoch": 1551} {"train_loss": -11.706801414489746, "global_step": 260607, "epoch": 1551} {"train_loss": -11.730914115905762, "global_step": 260608, "epoch": 1551} {"train_loss": -11.955867767333984, "global_step": 260609, "epoch": 1551} {"train_loss": -11.373235702514648, "global_step": 260610, "epoch": 1551} {"train_loss": -11.616682052612305, "global_step": 260611, "epoch": 1551} {"train_loss": -11.730488777160645, "global_step": 260612, "epoch": 1551} {"train_loss": -11.357431411743164, "global_step": 260613, "epoch": 1551} {"train_loss": -11.707047462463379, "global_step": 260614, "epoch": 1551} {"train_loss": -11.93122673034668, "global_step": 260615, "epoch": 1551} {"train_loss": -11.897867202758789, "global_step": 260616, "epoch": 1551} {"train_loss": -11.8768949508667, "global_step": 260617, "epoch": 1551} {"train_loss": -11.900657653808594, "global_step": 260618, "epoch": 1551} {"train_loss": -11.872735023498535, "global_step": 260619, "epoch": 1551} {"train_loss": -12.33840274810791, "global_step": 260620, "epoch": 1551} {"train_loss": -11.973932266235352, "global_step": 260621, "epoch": 1551} {"train_loss": -12.251334190368652, "global_step": 260622, "epoch": 1551} {"train_loss": -12.080404281616211, "global_step": 260623, "epoch": 1551} {"train_loss": -12.197803497314453, "global_step": 260624, "epoch": 1551} {"train_loss": -11.91354751586914, "global_step": 260625, "epoch": 1551} {"train_loss": -12.218338966369629, "global_step": 260626, "epoch": 1551} {"train_loss": -12.119552612304688, "global_step": 260627, "epoch": 1551} {"train_loss": -11.95632553100586, "global_step": 260628, "epoch": 1551} {"train_loss": -12.151195526123047, "global_step": 260629, "epoch": 1551} {"train_loss": -11.91653823852539, "global_step": 260630, "epoch": 1551} {"train_loss": -12.081007957458496, "global_step": 260631, "epoch": 1551} {"train_loss": -12.114710807800293, "global_step": 260632, "epoch": 1551} {"train_loss": -12.11455249786377, "global_step": 260633, "epoch": 1551} {"train_loss": -12.138253211975098, "global_step": 260634, "epoch": 1551} {"train_loss": -11.94668960571289, "global_step": 260635, "epoch": 1551} {"train_loss": -12.273674011230469, "global_step": 260636, "epoch": 1551} {"train_loss": -11.793280601501465, "global_step": 260637, "epoch": 1551} {"train_loss": -12.07899284362793, "global_step": 260638, "epoch": 1551} {"train_loss": -12.270631790161133, "global_step": 260639, "epoch": 1551} {"train_loss": -11.912542343139648, "global_step": 260640, "epoch": 1551} {"train_loss": -12.189104080200195, "global_step": 260641, "epoch": 1551} {"train_loss": -12.23631763458252, "global_step": 260642, "epoch": 1551} {"train_loss": -12.179975509643555, "global_step": 260643, "epoch": 1551} {"train_loss": -11.999015808105469, "global_step": 260644, "epoch": 1551} {"train_loss": -12.346237182617188, "global_step": 260645, "epoch": 1551} {"train_loss": -11.9779691696167, "global_step": 260646, "epoch": 1551} {"train_loss": -12.011859893798828, "global_step": 260647, "epoch": 1551} {"train_loss": -12.204636573791504, "global_step": 260648, "epoch": 1551} {"train_loss": -12.14164924621582, "global_step": 260649, "epoch": 1551} {"train_loss": -12.00432014465332, "global_step": 260650, "epoch": 1551} {"train_loss": -12.050079345703125, "global_step": 260651, "epoch": 1551} {"train_loss": -12.21145248413086, "global_step": 260652, "epoch": 1551} {"train_loss": -11.889876365661621, "global_step": 260653, "epoch": 1551} {"train_loss": -12.026773452758789, "global_step": 260654, "epoch": 1551} {"train_loss": -12.354339599609375, "global_step": 260655, "epoch": 1551} {"train_loss": -11.915611267089844, "global_step": 260656, "epoch": 1551} {"train_loss": -12.13541030883789, "global_step": 260657, "epoch": 1551} {"train_loss": -12.240326881408691, "global_step": 260658, "epoch": 1551} {"train_loss": -12.171005249023438, "global_step": 260659, "epoch": 1551} {"train_loss": -12.185148239135742, "global_step": 260660, "epoch": 1551} {"train_loss": -11.92147159576416, "global_step": 260661, "epoch": 1551} {"train_loss": -11.815888404846191, "global_step": 260662, "epoch": 1551} {"train_loss": -12.046086311340332, "global_step": 260663, "epoch": 1551} {"train_loss": -11.914461135864258, "global_step": 260664, "epoch": 1551} {"train_loss": -11.984857559204102, "global_step": 260665, "epoch": 1551} {"train_loss": -12.050405502319336, "global_step": 260666, "epoch": 1551} {"train_loss": -12.261798858642578, "global_step": 260667, "epoch": 1551} {"train_loss": -12.208243370056152, "global_step": 260668, "epoch": 1551} {"train_loss": -12.046550750732422, "global_step": 260669, "epoch": 1551} {"train_loss": -12.13139533996582, "global_step": 260670, "epoch": 1551} {"train_loss": -12.032559394836426, "global_step": 260671, "epoch": 1551} {"train_loss": -12.075733184814453, "global_step": 260672, "epoch": 1551} {"train_loss": -11.417379379272461, "global_step": 260673, "epoch": 1551} {"train_loss": -12.213140487670898, "global_step": 260674, "epoch": 1551} {"train_loss": -12.156182289123535, "global_step": 260675, "epoch": 1551} {"train_loss": -11.846704483032227, "global_step": 260676, "epoch": 1551} {"train_loss": -11.547134399414062, "global_step": 260677, "epoch": 1551} {"train_loss": -11.984716415405273, "global_step": 260678, "epoch": 1551} {"train_loss": -11.778560638427734, "global_step": 260679, "epoch": 1551} {"train_loss": -11.446473121643066, "global_step": 260680, "epoch": 1551} {"train_loss": -11.902155876159668, "global_step": 260681, "epoch": 1551} {"train_loss": -12.002901077270508, "global_step": 260682, "epoch": 1551} {"train_loss": -10.537300109863281, "global_step": 260683, "epoch": 1551} {"train_loss": -10.624170303344727, "global_step": 260684, "epoch": 1551} {"train_loss": -10.827949523925781, "global_step": 260685, "epoch": 1551} {"train_loss": -10.99842357635498, "global_step": 260686, "epoch": 1551} {"train_loss": -11.067035675048828, "global_step": 260687, "epoch": 1551} {"train_loss": -10.849040985107422, "global_step": 260688, "epoch": 1551} {"train_loss": -10.201530456542969, "global_step": 260689, "epoch": 1551} {"train_loss": -9.465592384338379, "global_step": 260690, "epoch": 1551} {"train_loss": -8.147028923034668, "global_step": 260691, "epoch": 1551} {"train_loss": -8.640169143676758, "global_step": 260692, "epoch": 1551} {"train_loss": -6.764592170715332, "global_step": 260693, "epoch": 1551} {"train_loss": -7.4615092277526855, "global_step": 260694, "epoch": 1551} {"train_loss": -6.13664436340332, "global_step": 260695, "epoch": 1551} {"train_loss": -5.4262189865112305, "global_step": 260696, "epoch": 1551} {"train_loss": -7.080297470092773, "global_step": 260697, "epoch": 1551} {"train_loss": -7.719526290893555, "global_step": 260698, "epoch": 1551} {"train_loss": -7.030952453613281, "global_step": 260699, "epoch": 1551} {"train_loss": -7.33116340637207, "global_step": 260700, "epoch": 1551} {"train_loss": -7.345943450927734, "global_step": 260701, "epoch": 1551} {"train_loss": -7.919565200805664, "global_step": 260702, "epoch": 1551} {"train_loss": -8.502300262451172, "global_step": 260703, "epoch": 1551} {"train_loss": -7.941931247711182, "global_step": 260704, "epoch": 1551} {"train_loss": -8.579697608947754, "global_step": 260705, "epoch": 1551} {"train_loss": -8.42418098449707, "global_step": 260706, "epoch": 1551} {"train_loss": -8.779815673828125, "global_step": 260707, "epoch": 1551} {"train_loss": -9.469468116760254, "global_step": 260708, "epoch": 1551} {"train_loss": -9.229835510253906, "global_step": 260709, "epoch": 1551} {"train_loss": -10.276100158691406, "global_step": 260710, "epoch": 1551} {"train_loss": -10.515104293823242, "global_step": 260711, "epoch": 1551} {"train_loss": -10.437909126281738, "global_step": 260712, "epoch": 1551} {"train_loss": -10.769688606262207, "global_step": 260713, "epoch": 1551} {"train_loss": -10.405597686767578, "global_step": 260714, "epoch": 1551} {"train_loss": -10.651137351989746, "global_step": 260715, "epoch": 1551} {"train_loss": -10.7516450881958, "global_step": 260716, "epoch": 1551} {"train_loss": -10.492895126342773, "global_step": 260717, "epoch": 1551} {"train_loss": -10.701094627380371, "global_step": 260718, "epoch": 1551} {"train_loss": -10.89900016784668, "global_step": 260719, "epoch": 1551} {"train_loss": -10.338664054870605, "global_step": 260720, "epoch": 1551} {"train_loss": -11.149543762207031, "global_step": 260721, "epoch": 1551} {"train_loss": -10.673718452453613, "global_step": 260722, "epoch": 1551} {"train_loss": -10.544801712036133, "global_step": 260723, "epoch": 1551} {"train_loss": -11.056466102600098, "global_step": 260724, "epoch": 1551} {"train_loss": -11.407206535339355, "global_step": 260725, "epoch": 1551} {"train_loss": -10.89039421081543, "global_step": 260726, "epoch": 1551} {"train_loss": -10.865283012390137, "global_step": 260727, "epoch": 1551} {"train_loss": -11.243040084838867, "global_step": 260728, "epoch": 1551} {"train_loss": -10.952956199645996, "global_step": 260729, "epoch": 1551} {"train_loss": -11.251880645751953, "global_step": 260730, "epoch": 1551} {"train_loss": -11.344600677490234, "global_step": 260731, "epoch": 1551} {"train_loss": -11.126635551452637, "global_step": 260732, "epoch": 1551} {"train_loss": -11.309045791625977, "global_step": 260733, "epoch": 1551} {"train_loss": -11.518356323242188, "global_step": 260734, "epoch": 1551} {"train_loss": -11.228793206669035, "global_step": 260735, "epoch": 1551, "val_loss": 269339.34375} {"train_loss": -11.552270889282227, "global_step": 260736, "epoch": 1552} {"train_loss": -11.534924507141113, "global_step": 260737, "epoch": 1552} {"train_loss": -11.48213005065918, "global_step": 260738, "epoch": 1552} {"train_loss": -11.474823951721191, "global_step": 260739, "epoch": 1552} {"train_loss": -11.630876541137695, "global_step": 260740, "epoch": 1552} {"train_loss": -11.400045394897461, "global_step": 260741, "epoch": 1552} {"train_loss": -11.641546249389648, "global_step": 260742, "epoch": 1552} {"train_loss": -11.347076416015625, "global_step": 260743, "epoch": 1552} {"train_loss": -11.763885498046875, "global_step": 260744, "epoch": 1552} {"train_loss": -11.562313079833984, "global_step": 260745, "epoch": 1552} {"train_loss": -11.674921035766602, "global_step": 260746, "epoch": 1552} {"train_loss": -11.851961135864258, "global_step": 260747, "epoch": 1552} {"train_loss": -11.661359786987305, "global_step": 260748, "epoch": 1552} {"train_loss": -11.733264923095703, "global_step": 260749, "epoch": 1552} {"train_loss": -11.760050773620605, "global_step": 260750, "epoch": 1552} {"train_loss": -11.42800521850586, "global_step": 260751, "epoch": 1552} {"train_loss": -11.744243621826172, "global_step": 260752, "epoch": 1552} {"train_loss": -11.724939346313477, "global_step": 260753, "epoch": 1552} {"train_loss": -11.58087158203125, "global_step": 260754, "epoch": 1552} {"train_loss": -11.55728816986084, "global_step": 260755, "epoch": 1552} {"train_loss": -11.780548095703125, "global_step": 260756, "epoch": 1552} {"train_loss": -11.742914199829102, "global_step": 260757, "epoch": 1552} {"train_loss": -11.432392120361328, "global_step": 260758, "epoch": 1552} {"train_loss": -11.84949016571045, "global_step": 260759, "epoch": 1552} {"train_loss": -11.559993743896484, "global_step": 260760, "epoch": 1552} {"train_loss": -11.741305351257324, "global_step": 260761, "epoch": 1552} {"train_loss": -11.62076187133789, "global_step": 260762, "epoch": 1552} {"train_loss": -11.777848243713379, "global_step": 260763, "epoch": 1552} {"train_loss": -11.469648361206055, "global_step": 260764, "epoch": 1552} {"train_loss": -11.59273910522461, "global_step": 260765, "epoch": 1552} {"train_loss": -11.855398178100586, "global_step": 260766, "epoch": 1552} {"train_loss": -11.504982948303223, "global_step": 260767, "epoch": 1552} {"train_loss": -11.984136581420898, "global_step": 260768, "epoch": 1552} {"train_loss": -11.750341415405273, "global_step": 260769, "epoch": 1552} {"train_loss": -12.00871467590332, "global_step": 260770, "epoch": 1552} {"train_loss": -11.692386627197266, "global_step": 260771, "epoch": 1552} {"train_loss": -12.096883773803711, "global_step": 260772, "epoch": 1552} {"train_loss": -11.613088607788086, "global_step": 260773, "epoch": 1552} {"train_loss": -12.21984577178955, "global_step": 260774, "epoch": 1552} {"train_loss": -11.76817512512207, "global_step": 260775, "epoch": 1552} {"train_loss": -12.120386123657227, "global_step": 260776, "epoch": 1552} {"train_loss": -12.090656280517578, "global_step": 260777, "epoch": 1552} {"train_loss": -11.881351470947266, "global_step": 260778, "epoch": 1552} {"train_loss": -11.953699111938477, "global_step": 260779, "epoch": 1552} {"train_loss": -11.996538162231445, "global_step": 260780, "epoch": 1552} {"train_loss": -12.025079727172852, "global_step": 260781, "epoch": 1552} {"train_loss": -12.123748779296875, "global_step": 260782, "epoch": 1552} {"train_loss": -12.176615715026855, "global_step": 260783, "epoch": 1552} {"train_loss": -12.16079044342041, "global_step": 260784, "epoch": 1552} {"train_loss": -12.105716705322266, "global_step": 260785, "epoch": 1552} {"train_loss": -12.184980392456055, "global_step": 260786, "epoch": 1552} {"train_loss": -12.120797157287598, "global_step": 260787, "epoch": 1552} {"train_loss": -12.167972564697266, "global_step": 260788, "epoch": 1552} {"train_loss": -12.2992525100708, "global_step": 260789, "epoch": 1552} {"train_loss": -11.982755661010742, "global_step": 260790, "epoch": 1552} {"train_loss": -12.070525169372559, "global_step": 260791, "epoch": 1552} {"train_loss": -12.271148681640625, "global_step": 260792, "epoch": 1552} {"train_loss": -11.935823440551758, "global_step": 260793, "epoch": 1552} {"train_loss": -11.919116973876953, "global_step": 260794, "epoch": 1552} {"train_loss": -12.14700698852539, "global_step": 260795, "epoch": 1552} {"train_loss": -12.204050064086914, "global_step": 260796, "epoch": 1552} {"train_loss": -11.902687072753906, "global_step": 260797, "epoch": 1552} {"train_loss": -12.203664779663086, "global_step": 260798, "epoch": 1552} {"train_loss": -11.997734069824219, "global_step": 260799, "epoch": 1552} {"train_loss": -12.13984203338623, "global_step": 260800, "epoch": 1552} {"train_loss": -12.138519287109375, "global_step": 260801, "epoch": 1552} {"train_loss": -11.798250198364258, "global_step": 260802, "epoch": 1552} {"train_loss": -11.723669052124023, "global_step": 260803, "epoch": 1552} {"train_loss": -12.056844711303711, "global_step": 260804, "epoch": 1552} {"train_loss": -12.068611145019531, "global_step": 260805, "epoch": 1552} {"train_loss": -12.27737045288086, "global_step": 260806, "epoch": 1552} {"train_loss": -12.171493530273438, "global_step": 260807, "epoch": 1552} {"train_loss": -12.286943435668945, "global_step": 260808, "epoch": 1552} {"train_loss": -12.224273681640625, "global_step": 260809, "epoch": 1552} {"train_loss": -12.07078742980957, "global_step": 260810, "epoch": 1552} {"train_loss": -11.594705581665039, "global_step": 260811, "epoch": 1552} {"train_loss": -12.0328369140625, "global_step": 260812, "epoch": 1552} {"train_loss": -11.953076362609863, "global_step": 260813, "epoch": 1552} {"train_loss": -11.713166236877441, "global_step": 260814, "epoch": 1552} {"train_loss": -11.766971588134766, "global_step": 260815, "epoch": 1552} {"train_loss": -12.228412628173828, "global_step": 260816, "epoch": 1552} {"train_loss": -11.271669387817383, "global_step": 260817, "epoch": 1552} {"train_loss": -10.147979736328125, "global_step": 260818, "epoch": 1552} {"train_loss": -11.048830032348633, "global_step": 260819, "epoch": 1552} {"train_loss": -10.1888427734375, "global_step": 260820, "epoch": 1552} {"train_loss": -8.587528228759766, "global_step": 260821, "epoch": 1552} {"train_loss": -9.313061714172363, "global_step": 260822, "epoch": 1552} {"train_loss": -10.059013366699219, "global_step": 260823, "epoch": 1552} {"train_loss": -10.568181037902832, "global_step": 260824, "epoch": 1552} {"train_loss": -9.916253089904785, "global_step": 260825, "epoch": 1552} {"train_loss": -8.661360740661621, "global_step": 260826, "epoch": 1552} {"train_loss": -9.12293815612793, "global_step": 260827, "epoch": 1552} {"train_loss": -9.880727767944336, "global_step": 260828, "epoch": 1552} {"train_loss": -10.16601276397705, "global_step": 260829, "epoch": 1552} {"train_loss": -8.438828468322754, "global_step": 260830, "epoch": 1552} {"train_loss": -9.27724838256836, "global_step": 260831, "epoch": 1552} {"train_loss": -8.300683975219727, "global_step": 260832, "epoch": 1552} {"train_loss": -7.036196708679199, "global_step": 260833, "epoch": 1552} {"train_loss": -8.329618453979492, "global_step": 260834, "epoch": 1552} {"train_loss": -8.489377975463867, "global_step": 260835, "epoch": 1552} {"train_loss": -10.821599960327148, "global_step": 260836, "epoch": 1552} {"train_loss": -9.601677894592285, "global_step": 260837, "epoch": 1552} {"train_loss": -9.091609954833984, "global_step": 260838, "epoch": 1552} {"train_loss": -9.877738952636719, "global_step": 260839, "epoch": 1552} {"train_loss": -10.591632843017578, "global_step": 260840, "epoch": 1552} {"train_loss": -9.389032363891602, "global_step": 260841, "epoch": 1552} {"train_loss": -10.941808700561523, "global_step": 260842, "epoch": 1552} {"train_loss": -9.517648696899414, "global_step": 260843, "epoch": 1552} {"train_loss": -10.090426445007324, "global_step": 260844, "epoch": 1552} {"train_loss": -10.62755012512207, "global_step": 260845, "epoch": 1552} {"train_loss": -10.173988342285156, "global_step": 260846, "epoch": 1552} {"train_loss": -9.797653198242188, "global_step": 260847, "epoch": 1552} {"train_loss": -11.412942886352539, "global_step": 260848, "epoch": 1552} {"train_loss": -9.596383094787598, "global_step": 260849, "epoch": 1552} {"train_loss": -10.8038330078125, "global_step": 260850, "epoch": 1552} {"train_loss": -11.135872840881348, "global_step": 260851, "epoch": 1552} {"train_loss": -10.583325386047363, "global_step": 260852, "epoch": 1552} {"train_loss": -11.035011291503906, "global_step": 260853, "epoch": 1552} {"train_loss": -10.895271301269531, "global_step": 260854, "epoch": 1552} {"train_loss": -10.632088661193848, "global_step": 260855, "epoch": 1552} {"train_loss": -10.980770111083984, "global_step": 260856, "epoch": 1552} {"train_loss": -10.976816177368164, "global_step": 260857, "epoch": 1552} {"train_loss": -11.213138580322266, "global_step": 260858, "epoch": 1552} {"train_loss": -10.722796440124512, "global_step": 260859, "epoch": 1552} {"train_loss": -11.341503143310547, "global_step": 260860, "epoch": 1552} {"train_loss": -11.170846939086914, "global_step": 260861, "epoch": 1552} {"train_loss": -11.214834213256836, "global_step": 260862, "epoch": 1552} {"train_loss": -11.196898460388184, "global_step": 260863, "epoch": 1552} {"train_loss": -11.129293441772461, "global_step": 260864, "epoch": 1552} {"train_loss": -11.737192153930664, "global_step": 260865, "epoch": 1552} {"train_loss": -11.128692626953125, "global_step": 260866, "epoch": 1552} {"train_loss": -10.958280563354492, "global_step": 260867, "epoch": 1552} {"train_loss": -11.60853385925293, "global_step": 260868, "epoch": 1552} {"train_loss": -11.368701934814453, "global_step": 260869, "epoch": 1552} {"train_loss": -11.258275032043457, "global_step": 260870, "epoch": 1552} {"train_loss": -11.662845611572266, "global_step": 260871, "epoch": 1552} {"train_loss": -11.336182594299316, "global_step": 260872, "epoch": 1552} {"train_loss": -11.61903190612793, "global_step": 260873, "epoch": 1552} {"train_loss": -11.729814529418945, "global_step": 260874, "epoch": 1552} {"train_loss": -11.600992202758789, "global_step": 260875, "epoch": 1552} {"train_loss": -11.669642448425293, "global_step": 260876, "epoch": 1552} {"train_loss": -11.442105293273926, "global_step": 260877, "epoch": 1552} {"train_loss": -11.689655303955078, "global_step": 260878, "epoch": 1552} {"train_loss": -11.445414543151855, "global_step": 260879, "epoch": 1552} {"train_loss": -11.5867280960083, "global_step": 260880, "epoch": 1552} {"train_loss": -11.4793119430542, "global_step": 260881, "epoch": 1552} {"train_loss": -11.741963386535645, "global_step": 260882, "epoch": 1552} {"train_loss": -11.695718765258789, "global_step": 260883, "epoch": 1552} {"train_loss": -11.683510780334473, "global_step": 260884, "epoch": 1552} {"train_loss": -11.813040733337402, "global_step": 260885, "epoch": 1552} {"train_loss": -11.68169116973877, "global_step": 260886, "epoch": 1552} {"train_loss": -11.715715408325195, "global_step": 260887, "epoch": 1552} {"train_loss": -11.44200611114502, "global_step": 260888, "epoch": 1552} {"train_loss": -11.747122764587402, "global_step": 260889, "epoch": 1552} {"train_loss": -11.834471702575684, "global_step": 260890, "epoch": 1552} {"train_loss": -11.868183135986328, "global_step": 260891, "epoch": 1552} {"train_loss": -11.734990119934082, "global_step": 260892, "epoch": 1552} {"train_loss": -11.999605178833008, "global_step": 260893, "epoch": 1552} {"train_loss": -11.807252883911133, "global_step": 260894, "epoch": 1552} {"train_loss": -11.977097511291504, "global_step": 260895, "epoch": 1552} {"train_loss": -12.020975112915039, "global_step": 260896, "epoch": 1552} {"train_loss": -12.019529342651367, "global_step": 260897, "epoch": 1552} {"train_loss": -12.049176216125488, "global_step": 260898, "epoch": 1552} {"train_loss": -11.93677806854248, "global_step": 260899, "epoch": 1552} {"train_loss": -11.754542350769043, "global_step": 260900, "epoch": 1552} {"train_loss": -12.001815795898438, "global_step": 260901, "epoch": 1552} {"train_loss": -11.958881378173828, "global_step": 260902, "epoch": 1552} {"train_loss": -11.324167217527117, "global_step": 260903, "epoch": 1552, "val_loss": 263991.96875} {"train_loss": -11.987174987792969, "global_step": 260904, "epoch": 1553} {"train_loss": -12.058650970458984, "global_step": 260905, "epoch": 1553} {"train_loss": -12.112885475158691, "global_step": 260906, "epoch": 1553} {"train_loss": -12.09851360321045, "global_step": 260907, "epoch": 1553} {"train_loss": -12.066293716430664, "global_step": 260908, "epoch": 1553} {"train_loss": -12.099486351013184, "global_step": 260909, "epoch": 1553} {"train_loss": -12.054080963134766, "global_step": 260910, "epoch": 1553} {"train_loss": -12.089338302612305, "global_step": 260911, "epoch": 1553} {"train_loss": -11.966405868530273, "global_step": 260912, "epoch": 1553} {"train_loss": -12.054973602294922, "global_step": 260913, "epoch": 1553} {"train_loss": -12.142486572265625, "global_step": 260914, "epoch": 1553} {"train_loss": -12.17714786529541, "global_step": 260915, "epoch": 1553} {"train_loss": -12.156448364257812, "global_step": 260916, "epoch": 1553} {"train_loss": -12.077047348022461, "global_step": 260917, "epoch": 1553} {"train_loss": -12.253860473632812, "global_step": 260918, "epoch": 1553} {"train_loss": -12.211832046508789, "global_step": 260919, "epoch": 1553} {"train_loss": -12.243968963623047, "global_step": 260920, "epoch": 1553} {"train_loss": -12.193306922912598, "global_step": 260921, "epoch": 1553} {"train_loss": -12.110456466674805, "global_step": 260922, "epoch": 1553} {"train_loss": -12.175397872924805, "global_step": 260923, "epoch": 1553} {"train_loss": -12.185206413269043, "global_step": 260924, "epoch": 1553} {"train_loss": -12.195300102233887, "global_step": 260925, "epoch": 1553} {"train_loss": -12.231130599975586, "global_step": 260926, "epoch": 1553} {"train_loss": -12.098600387573242, "global_step": 260927, "epoch": 1553} {"train_loss": -12.224164962768555, "global_step": 260928, "epoch": 1553} {"train_loss": -11.998825073242188, "global_step": 260929, "epoch": 1553} {"train_loss": -12.10399055480957, "global_step": 260930, "epoch": 1553} {"train_loss": -12.14849853515625, "global_step": 260931, "epoch": 1553} {"train_loss": -12.11381721496582, "global_step": 260932, "epoch": 1553} {"train_loss": -12.196545600891113, "global_step": 260933, "epoch": 1553} {"train_loss": -12.282164573669434, "global_step": 260934, "epoch": 1553} {"train_loss": -12.419109344482422, "global_step": 260935, "epoch": 1553} {"train_loss": -12.064726829528809, "global_step": 260936, "epoch": 1553} {"train_loss": -12.380778312683105, "global_step": 260937, "epoch": 1553} {"train_loss": -12.356907844543457, "global_step": 260938, "epoch": 1553} {"train_loss": -12.329458236694336, "global_step": 260939, "epoch": 1553} {"train_loss": -12.291728973388672, "global_step": 260940, "epoch": 1553} {"train_loss": -12.04991340637207, "global_step": 260941, "epoch": 1553} {"train_loss": -12.204828262329102, "global_step": 260942, "epoch": 1553} {"train_loss": -12.403460502624512, "global_step": 260943, "epoch": 1553} {"train_loss": -12.416196823120117, "global_step": 260944, "epoch": 1553} {"train_loss": -12.20656681060791, "global_step": 260945, "epoch": 1553} {"train_loss": -11.125758171081543, "global_step": 260946, "epoch": 1553} {"train_loss": -9.272125244140625, "global_step": 260947, "epoch": 1553} {"train_loss": -10.951817512512207, "global_step": 260948, "epoch": 1553} {"train_loss": -12.100289344787598, "global_step": 260949, "epoch": 1553} {"train_loss": -11.710134506225586, "global_step": 260950, "epoch": 1553} {"train_loss": -10.021183013916016, "global_step": 260951, "epoch": 1553} {"train_loss": -10.417104721069336, "global_step": 260952, "epoch": 1553} {"train_loss": -11.920576095581055, "global_step": 260953, "epoch": 1553} {"train_loss": -10.565170288085938, "global_step": 260954, "epoch": 1553} {"train_loss": -7.033194065093994, "global_step": 260955, "epoch": 1553} {"train_loss": -9.133613586425781, "global_step": 260956, "epoch": 1553} {"train_loss": -9.81955337524414, "global_step": 260957, "epoch": 1553} {"train_loss": -9.34273910522461, "global_step": 260958, "epoch": 1553} {"train_loss": -9.90098762512207, "global_step": 260959, "epoch": 1553} {"train_loss": -9.191049575805664, "global_step": 260960, "epoch": 1553} {"train_loss": -10.037574768066406, "global_step": 260961, "epoch": 1553} {"train_loss": -10.131367683410645, "global_step": 260962, "epoch": 1553} {"train_loss": -10.219310760498047, "global_step": 260963, "epoch": 1553} {"train_loss": -10.394645690917969, "global_step": 260964, "epoch": 1553} {"train_loss": -9.872004508972168, "global_step": 260965, "epoch": 1553} {"train_loss": -10.805122375488281, "global_step": 260966, "epoch": 1553} {"train_loss": -10.201435089111328, "global_step": 260967, "epoch": 1553} {"train_loss": -10.617965698242188, "global_step": 260968, "epoch": 1553} {"train_loss": -11.040288925170898, "global_step": 260969, "epoch": 1553} {"train_loss": -10.977828979492188, "global_step": 260970, "epoch": 1553} {"train_loss": -11.172456741333008, "global_step": 260971, "epoch": 1553} {"train_loss": -11.16653823852539, "global_step": 260972, "epoch": 1553} {"train_loss": -10.909749984741211, "global_step": 260973, "epoch": 1553} {"train_loss": -10.861412048339844, "global_step": 260974, "epoch": 1553} {"train_loss": -10.500116348266602, "global_step": 260975, "epoch": 1553} {"train_loss": -10.975342750549316, "global_step": 260976, "epoch": 1553} {"train_loss": -10.890460968017578, "global_step": 260977, "epoch": 1553} {"train_loss": -10.233577728271484, "global_step": 260978, "epoch": 1553} {"train_loss": -11.07792854309082, "global_step": 260979, "epoch": 1553} {"train_loss": -10.660955429077148, "global_step": 260980, "epoch": 1553} {"train_loss": -10.904624938964844, "global_step": 260981, "epoch": 1553} {"train_loss": -11.447266578674316, "global_step": 260982, "epoch": 1553} {"train_loss": -10.859302520751953, "global_step": 260983, "epoch": 1553} {"train_loss": -10.799308776855469, "global_step": 260984, "epoch": 1553} {"train_loss": -11.201011657714844, "global_step": 260985, "epoch": 1553} {"train_loss": -10.832605361938477, "global_step": 260986, "epoch": 1553} {"train_loss": -10.577375411987305, "global_step": 260987, "epoch": 1553} {"train_loss": -11.54177474975586, "global_step": 260988, "epoch": 1553} {"train_loss": -10.07004165649414, "global_step": 260989, "epoch": 1553} {"train_loss": -10.845076560974121, "global_step": 260990, "epoch": 1553} {"train_loss": -11.288595199584961, "global_step": 260991, "epoch": 1553} {"train_loss": -10.280937194824219, "global_step": 260992, "epoch": 1553} {"train_loss": -10.995561599731445, "global_step": 260993, "epoch": 1553} {"train_loss": -11.397560119628906, "global_step": 260994, "epoch": 1553} {"train_loss": -10.393169403076172, "global_step": 260995, "epoch": 1553} {"train_loss": -11.732934951782227, "global_step": 260996, "epoch": 1553} {"train_loss": -10.916428565979004, "global_step": 260997, "epoch": 1553} {"train_loss": -11.274789810180664, "global_step": 260998, "epoch": 1553} {"train_loss": -11.60743522644043, "global_step": 260999, "epoch": 1553} {"train_loss": -11.36069107055664, "global_step": 261000, "epoch": 1553} {"train_loss": -11.103081703186035, "global_step": 261001, "epoch": 1553} {"train_loss": -11.455696105957031, "global_step": 261002, "epoch": 1553} {"train_loss": -11.40843391418457, "global_step": 261003, "epoch": 1553} {"train_loss": -11.40279483795166, "global_step": 261004, "epoch": 1553} {"train_loss": -11.470712661743164, "global_step": 261005, "epoch": 1553} {"train_loss": -11.158172607421875, "global_step": 261006, "epoch": 1553} {"train_loss": -11.266855239868164, "global_step": 261007, "epoch": 1553} {"train_loss": -11.705219268798828, "global_step": 261008, "epoch": 1553} {"train_loss": -11.301618576049805, "global_step": 261009, "epoch": 1553} {"train_loss": -11.735652923583984, "global_step": 261010, "epoch": 1553} {"train_loss": -11.840062141418457, "global_step": 261011, "epoch": 1553} {"train_loss": -11.6913480758667, "global_step": 261012, "epoch": 1553} {"train_loss": -11.802587509155273, "global_step": 261013, "epoch": 1553} {"train_loss": -11.73544979095459, "global_step": 261014, "epoch": 1553} {"train_loss": -11.649046897888184, "global_step": 261015, "epoch": 1553} {"train_loss": -11.801913261413574, "global_step": 261016, "epoch": 1553} {"train_loss": -11.546317100524902, "global_step": 261017, "epoch": 1553} {"train_loss": -11.807392120361328, "global_step": 261018, "epoch": 1553} {"train_loss": -11.779163360595703, "global_step": 261019, "epoch": 1553} {"train_loss": -11.857439041137695, "global_step": 261020, "epoch": 1553} {"train_loss": -11.938074111938477, "global_step": 261021, "epoch": 1553} {"train_loss": -11.74902057647705, "global_step": 261022, "epoch": 1553} {"train_loss": -11.747673988342285, "global_step": 261023, "epoch": 1553} {"train_loss": -11.797948837280273, "global_step": 261024, "epoch": 1553} {"train_loss": -11.714585304260254, "global_step": 261025, "epoch": 1553} {"train_loss": -11.84610366821289, "global_step": 261026, "epoch": 1553} {"train_loss": -11.963531494140625, "global_step": 261027, "epoch": 1553} {"train_loss": -11.811262130737305, "global_step": 261028, "epoch": 1553} {"train_loss": -11.975101470947266, "global_step": 261029, "epoch": 1553} {"train_loss": -11.70370864868164, "global_step": 261030, "epoch": 1553} {"train_loss": -11.78705883026123, "global_step": 261031, "epoch": 1553} {"train_loss": -11.943507194519043, "global_step": 261032, "epoch": 1553} {"train_loss": -11.869205474853516, "global_step": 261033, "epoch": 1553} {"train_loss": -11.980384826660156, "global_step": 261034, "epoch": 1553} {"train_loss": -11.821837425231934, "global_step": 261035, "epoch": 1553} {"train_loss": -11.989300727844238, "global_step": 261036, "epoch": 1553} {"train_loss": -11.97982406616211, "global_step": 261037, "epoch": 1553} {"train_loss": -11.969385147094727, "global_step": 261038, "epoch": 1553} {"train_loss": -12.05814266204834, "global_step": 261039, "epoch": 1553} {"train_loss": -12.047125816345215, "global_step": 261040, "epoch": 1553} {"train_loss": -11.979843139648438, "global_step": 261041, "epoch": 1553} {"train_loss": -12.04886245727539, "global_step": 261042, "epoch": 1553} {"train_loss": -12.197280883789062, "global_step": 261043, "epoch": 1553} {"train_loss": -12.251380920410156, "global_step": 261044, "epoch": 1553} {"train_loss": -12.179594039916992, "global_step": 261045, "epoch": 1553} {"train_loss": -12.020517349243164, "global_step": 261046, "epoch": 1553} {"train_loss": -12.147762298583984, "global_step": 261047, "epoch": 1553} {"train_loss": -12.179167747497559, "global_step": 261048, "epoch": 1553} {"train_loss": -12.192475318908691, "global_step": 261049, "epoch": 1553} {"train_loss": -12.195672988891602, "global_step": 261050, "epoch": 1553} {"train_loss": -12.132383346557617, "global_step": 261051, "epoch": 1553} {"train_loss": -12.140713691711426, "global_step": 261052, "epoch": 1553} {"train_loss": -12.190815925598145, "global_step": 261053, "epoch": 1553} {"train_loss": -12.152725219726562, "global_step": 261054, "epoch": 1553} {"train_loss": -12.231327056884766, "global_step": 261055, "epoch": 1553} {"train_loss": -12.348410606384277, "global_step": 261056, "epoch": 1553} {"train_loss": -12.206884384155273, "global_step": 261057, "epoch": 1553} {"train_loss": -12.119691848754883, "global_step": 261058, "epoch": 1553} {"train_loss": -12.148443222045898, "global_step": 261059, "epoch": 1553} {"train_loss": -11.993497848510742, "global_step": 261060, "epoch": 1553} {"train_loss": -12.047492980957031, "global_step": 261061, "epoch": 1553} {"train_loss": -12.21681022644043, "global_step": 261062, "epoch": 1553} {"train_loss": -12.297466278076172, "global_step": 261063, "epoch": 1553} {"train_loss": -12.28144645690918, "global_step": 261064, "epoch": 1553} {"train_loss": -12.41950511932373, "global_step": 261065, "epoch": 1553} {"train_loss": -12.332154273986816, "global_step": 261066, "epoch": 1553} {"train_loss": -12.218062400817871, "global_step": 261067, "epoch": 1553} {"train_loss": -12.147941589355469, "global_step": 261068, "epoch": 1553} {"train_loss": -12.423870086669922, "global_step": 261069, "epoch": 1553} {"train_loss": -12.107160568237305, "global_step": 261070, "epoch": 1553} {"train_loss": -11.568253951413292, "global_step": 261071, "epoch": 1553, "val_loss": 271780.96875} {"train_loss": -11.940927505493164, "global_step": 261072, "epoch": 1554} {"train_loss": -12.043191909790039, "global_step": 261073, "epoch": 1554} {"train_loss": -11.973469734191895, "global_step": 261074, "epoch": 1554} {"train_loss": -12.069133758544922, "global_step": 261075, "epoch": 1554} {"train_loss": -12.326186180114746, "global_step": 261076, "epoch": 1554} {"train_loss": -11.949424743652344, "global_step": 261077, "epoch": 1554} {"train_loss": -11.957189559936523, "global_step": 261078, "epoch": 1554} {"train_loss": -12.003946304321289, "global_step": 261079, "epoch": 1554} {"train_loss": -11.84561538696289, "global_step": 261080, "epoch": 1554} {"train_loss": -11.936586380004883, "global_step": 261081, "epoch": 1554} {"train_loss": -11.758437156677246, "global_step": 261082, "epoch": 1554} {"train_loss": -11.770654678344727, "global_step": 261083, "epoch": 1554} {"train_loss": -11.845691680908203, "global_step": 261084, "epoch": 1554} {"train_loss": -11.40337085723877, "global_step": 261085, "epoch": 1554} {"train_loss": -11.539589881896973, "global_step": 261086, "epoch": 1554} {"train_loss": -11.05150032043457, "global_step": 261087, "epoch": 1554} {"train_loss": -11.183479309082031, "global_step": 261088, "epoch": 1554} {"train_loss": -11.525114059448242, "global_step": 261089, "epoch": 1554} {"train_loss": -11.933385848999023, "global_step": 261090, "epoch": 1554} {"train_loss": -11.956453323364258, "global_step": 261091, "epoch": 1554} {"train_loss": -11.701364517211914, "global_step": 261092, "epoch": 1554} {"train_loss": -11.416536331176758, "global_step": 261093, "epoch": 1554} {"train_loss": -11.958786964416504, "global_step": 261094, "epoch": 1554} {"train_loss": -12.167242050170898, "global_step": 261095, "epoch": 1554} {"train_loss": -11.899188995361328, "global_step": 261096, "epoch": 1554} {"train_loss": -11.874680519104004, "global_step": 261097, "epoch": 1554} {"train_loss": -12.087089538574219, "global_step": 261098, "epoch": 1554} {"train_loss": -11.71649169921875, "global_step": 261099, "epoch": 1554} {"train_loss": -11.913713455200195, "global_step": 261100, "epoch": 1554} {"train_loss": -12.157061576843262, "global_step": 261101, "epoch": 1554} {"train_loss": -11.668718338012695, "global_step": 261102, "epoch": 1554} {"train_loss": -11.40390396118164, "global_step": 261103, "epoch": 1554} {"train_loss": -11.695131301879883, "global_step": 261104, "epoch": 1554} {"train_loss": -10.910259246826172, "global_step": 261105, "epoch": 1554} {"train_loss": -11.357778549194336, "global_step": 261106, "epoch": 1554} {"train_loss": -11.861852645874023, "global_step": 261107, "epoch": 1554} {"train_loss": -10.85394287109375, "global_step": 261108, "epoch": 1554} {"train_loss": -11.053104400634766, "global_step": 261109, "epoch": 1554} {"train_loss": -11.487441062927246, "global_step": 261110, "epoch": 1554} {"train_loss": -11.845422744750977, "global_step": 261111, "epoch": 1554} {"train_loss": -11.603580474853516, "global_step": 261112, "epoch": 1554} {"train_loss": -11.96543025970459, "global_step": 261113, "epoch": 1554} {"train_loss": -11.95372486114502, "global_step": 261114, "epoch": 1554} {"train_loss": -11.772462844848633, "global_step": 261115, "epoch": 1554} {"train_loss": -11.813559532165527, "global_step": 261116, "epoch": 1554} {"train_loss": -11.798846244812012, "global_step": 261117, "epoch": 1554} {"train_loss": -12.326611518859863, "global_step": 261118, "epoch": 1554} {"train_loss": -11.399592399597168, "global_step": 261119, "epoch": 1554} {"train_loss": -12.170682907104492, "global_step": 261120, "epoch": 1554} {"train_loss": -11.44251823425293, "global_step": 261121, "epoch": 1554} {"train_loss": -11.33249282836914, "global_step": 261122, "epoch": 1554} {"train_loss": -11.73038101196289, "global_step": 261123, "epoch": 1554} {"train_loss": -12.004264831542969, "global_step": 261124, "epoch": 1554} {"train_loss": -10.429058074951172, "global_step": 261125, "epoch": 1554} {"train_loss": -10.734615325927734, "global_step": 261126, "epoch": 1554} {"train_loss": -11.823543548583984, "global_step": 261127, "epoch": 1554} {"train_loss": -10.728825569152832, "global_step": 261128, "epoch": 1554} {"train_loss": -10.438201904296875, "global_step": 261129, "epoch": 1554} {"train_loss": -10.108367919921875, "global_step": 261130, "epoch": 1554} {"train_loss": -9.906606674194336, "global_step": 261131, "epoch": 1554} {"train_loss": -10.054161071777344, "global_step": 261132, "epoch": 1554} {"train_loss": -10.035457611083984, "global_step": 261133, "epoch": 1554} {"train_loss": -10.322807312011719, "global_step": 261134, "epoch": 1554} {"train_loss": -8.844362258911133, "global_step": 261135, "epoch": 1554} {"train_loss": -9.913979530334473, "global_step": 261136, "epoch": 1554} {"train_loss": -11.118993759155273, "global_step": 261137, "epoch": 1554} {"train_loss": -8.942845344543457, "global_step": 261138, "epoch": 1554} {"train_loss": -9.394275665283203, "global_step": 261139, "epoch": 1554} {"train_loss": -10.342582702636719, "global_step": 261140, "epoch": 1554} {"train_loss": -10.423405647277832, "global_step": 261141, "epoch": 1554} {"train_loss": -10.358434677124023, "global_step": 261142, "epoch": 1554} {"train_loss": -10.529058456420898, "global_step": 261143, "epoch": 1554} {"train_loss": -10.877513885498047, "global_step": 261144, "epoch": 1554} {"train_loss": -10.253881454467773, "global_step": 261145, "epoch": 1554} {"train_loss": -11.383539199829102, "global_step": 261146, "epoch": 1554} {"train_loss": -10.317741394042969, "global_step": 261147, "epoch": 1554} {"train_loss": -10.903486251831055, "global_step": 261148, "epoch": 1554} {"train_loss": -11.114534378051758, "global_step": 261149, "epoch": 1554} {"train_loss": -10.78271484375, "global_step": 261150, "epoch": 1554} {"train_loss": -11.228143692016602, "global_step": 261151, "epoch": 1554} {"train_loss": -10.82933235168457, "global_step": 261152, "epoch": 1554} {"train_loss": -11.407219886779785, "global_step": 261153, "epoch": 1554} {"train_loss": -11.500137329101562, "global_step": 261154, "epoch": 1554} {"train_loss": -10.49260139465332, "global_step": 261155, "epoch": 1554} {"train_loss": -11.235919952392578, "global_step": 261156, "epoch": 1554} {"train_loss": -11.207565307617188, "global_step": 261157, "epoch": 1554} {"train_loss": -10.625991821289062, "global_step": 261158, "epoch": 1554} {"train_loss": -11.605781555175781, "global_step": 261159, "epoch": 1554} {"train_loss": -10.909217834472656, "global_step": 261160, "epoch": 1554} {"train_loss": -11.220104217529297, "global_step": 261161, "epoch": 1554} {"train_loss": -11.198041915893555, "global_step": 261162, "epoch": 1554} {"train_loss": -10.839544296264648, "global_step": 261163, "epoch": 1554} {"train_loss": -10.889917373657227, "global_step": 261164, "epoch": 1554} {"train_loss": -11.671528816223145, "global_step": 261165, "epoch": 1554} {"train_loss": -11.261007308959961, "global_step": 261166, "epoch": 1554} {"train_loss": -10.722341537475586, "global_step": 261167, "epoch": 1554} {"train_loss": -11.596359252929688, "global_step": 261168, "epoch": 1554} {"train_loss": -10.672821044921875, "global_step": 261169, "epoch": 1554} {"train_loss": -11.065059661865234, "global_step": 261170, "epoch": 1554} {"train_loss": -11.683700561523438, "global_step": 261171, "epoch": 1554} {"train_loss": -11.261750221252441, "global_step": 261172, "epoch": 1554} {"train_loss": -11.504032135009766, "global_step": 261173, "epoch": 1554} {"train_loss": -11.591324806213379, "global_step": 261174, "epoch": 1554} {"train_loss": -11.369617462158203, "global_step": 261175, "epoch": 1554} {"train_loss": -11.658050537109375, "global_step": 261176, "epoch": 1554} {"train_loss": -11.757205963134766, "global_step": 261177, "epoch": 1554} {"train_loss": -11.428529739379883, "global_step": 261178, "epoch": 1554} {"train_loss": -11.64770793914795, "global_step": 261179, "epoch": 1554} {"train_loss": -11.883980751037598, "global_step": 261180, "epoch": 1554} {"train_loss": -11.490548133850098, "global_step": 261181, "epoch": 1554} {"train_loss": -11.65462589263916, "global_step": 261182, "epoch": 1554} {"train_loss": -11.939192771911621, "global_step": 261183, "epoch": 1554} {"train_loss": -11.809904098510742, "global_step": 261184, "epoch": 1554} {"train_loss": -11.900433540344238, "global_step": 261185, "epoch": 1554} {"train_loss": -11.938515663146973, "global_step": 261186, "epoch": 1554} {"train_loss": -11.64569091796875, "global_step": 261187, "epoch": 1554} {"train_loss": -11.96436882019043, "global_step": 261188, "epoch": 1554} {"train_loss": -11.843215942382812, "global_step": 261189, "epoch": 1554} {"train_loss": -11.646988868713379, "global_step": 261190, "epoch": 1554} {"train_loss": -11.901630401611328, "global_step": 261191, "epoch": 1554} {"train_loss": -11.657535552978516, "global_step": 261192, "epoch": 1554} {"train_loss": -11.997735977172852, "global_step": 261193, "epoch": 1554} {"train_loss": -11.95832633972168, "global_step": 261194, "epoch": 1554} {"train_loss": -11.94823169708252, "global_step": 261195, "epoch": 1554} {"train_loss": -12.017547607421875, "global_step": 261196, "epoch": 1554} {"train_loss": -12.043994903564453, "global_step": 261197, "epoch": 1554} {"train_loss": -12.002996444702148, "global_step": 261198, "epoch": 1554} {"train_loss": -11.847856521606445, "global_step": 261199, "epoch": 1554} {"train_loss": -12.022909164428711, "global_step": 261200, "epoch": 1554} {"train_loss": -11.914179801940918, "global_step": 261201, "epoch": 1554} {"train_loss": -12.137088775634766, "global_step": 261202, "epoch": 1554} {"train_loss": -12.014105796813965, "global_step": 261203, "epoch": 1554} {"train_loss": -12.001550674438477, "global_step": 261204, "epoch": 1554} {"train_loss": -11.792562484741211, "global_step": 261205, "epoch": 1554} {"train_loss": -12.012346267700195, "global_step": 261206, "epoch": 1554} {"train_loss": -12.001548767089844, "global_step": 261207, "epoch": 1554} {"train_loss": -11.927966117858887, "global_step": 261208, "epoch": 1554} {"train_loss": -12.100765228271484, "global_step": 261209, "epoch": 1554} {"train_loss": -12.030266761779785, "global_step": 261210, "epoch": 1554} {"train_loss": -11.37861442565918, "global_step": 261211, "epoch": 1554} {"train_loss": -11.778026580810547, "global_step": 261212, "epoch": 1554} {"train_loss": -11.745122909545898, "global_step": 261213, "epoch": 1554} {"train_loss": -11.440202713012695, "global_step": 261214, "epoch": 1554} {"train_loss": -11.688806533813477, "global_step": 261215, "epoch": 1554} {"train_loss": -11.603292465209961, "global_step": 261216, "epoch": 1554} {"train_loss": -12.014432907104492, "global_step": 261217, "epoch": 1554} {"train_loss": -11.357370376586914, "global_step": 261218, "epoch": 1554} {"train_loss": -10.82479190826416, "global_step": 261219, "epoch": 1554} {"train_loss": -11.535350799560547, "global_step": 261220, "epoch": 1554} {"train_loss": -10.916096687316895, "global_step": 261221, "epoch": 1554} {"train_loss": -11.51296615600586, "global_step": 261222, "epoch": 1554} {"train_loss": -10.780644416809082, "global_step": 261223, "epoch": 1554} {"train_loss": -10.849756240844727, "global_step": 261224, "epoch": 1554} {"train_loss": -11.509773254394531, "global_step": 261225, "epoch": 1554} {"train_loss": -10.819426536560059, "global_step": 261226, "epoch": 1554} {"train_loss": -10.879059791564941, "global_step": 261227, "epoch": 1554} {"train_loss": -11.760393142700195, "global_step": 261228, "epoch": 1554} {"train_loss": -11.092884063720703, "global_step": 261229, "epoch": 1554} {"train_loss": -11.44208812713623, "global_step": 261230, "epoch": 1554} {"train_loss": -11.74618148803711, "global_step": 261231, "epoch": 1554} {"train_loss": -11.08154010772705, "global_step": 261232, "epoch": 1554} {"train_loss": -11.769357681274414, "global_step": 261233, "epoch": 1554} {"train_loss": -11.498416900634766, "global_step": 261234, "epoch": 1554} {"train_loss": -11.453508377075195, "global_step": 261235, "epoch": 1554} {"train_loss": -10.777027130126953, "global_step": 261236, "epoch": 1554} {"train_loss": -11.400835037231445, "global_step": 261237, "epoch": 1554} {"train_loss": -11.62540054321289, "global_step": 261238, "epoch": 1554} {"train_loss": -11.413065331322807, "global_step": 261239, "epoch": 1554, "val_loss": 267380.09375} {"train_loss": -11.789952278137207, "global_step": 261240, "epoch": 1555} {"train_loss": -11.794933319091797, "global_step": 261241, "epoch": 1555} {"train_loss": -11.48105239868164, "global_step": 261242, "epoch": 1555} {"train_loss": -11.826227188110352, "global_step": 261243, "epoch": 1555} {"train_loss": -11.406429290771484, "global_step": 261244, "epoch": 1555} {"train_loss": -11.52425479888916, "global_step": 261245, "epoch": 1555} {"train_loss": -11.79952621459961, "global_step": 261246, "epoch": 1555} {"train_loss": -11.385488510131836, "global_step": 261247, "epoch": 1555} {"train_loss": -11.699045181274414, "global_step": 261248, "epoch": 1555} {"train_loss": -11.49266242980957, "global_step": 261249, "epoch": 1555} {"train_loss": -11.640947341918945, "global_step": 261250, "epoch": 1555} {"train_loss": -11.802718162536621, "global_step": 261251, "epoch": 1555} {"train_loss": -11.88359260559082, "global_step": 261252, "epoch": 1555} {"train_loss": -11.606761932373047, "global_step": 261253, "epoch": 1555} {"train_loss": -11.693618774414062, "global_step": 261254, "epoch": 1555} {"train_loss": -11.588507652282715, "global_step": 261255, "epoch": 1555} {"train_loss": -11.873250961303711, "global_step": 261256, "epoch": 1555} {"train_loss": -11.685544967651367, "global_step": 261257, "epoch": 1555} {"train_loss": -11.409753799438477, "global_step": 261258, "epoch": 1555} {"train_loss": -11.702045440673828, "global_step": 261259, "epoch": 1555} {"train_loss": -11.40921688079834, "global_step": 261260, "epoch": 1555} {"train_loss": -11.721090316772461, "global_step": 261261, "epoch": 1555} {"train_loss": -11.800802230834961, "global_step": 261262, "epoch": 1555} {"train_loss": -11.246088027954102, "global_step": 261263, "epoch": 1555} {"train_loss": -11.76995849609375, "global_step": 261264, "epoch": 1555} {"train_loss": -11.226417541503906, "global_step": 261265, "epoch": 1555} {"train_loss": -11.995244979858398, "global_step": 261266, "epoch": 1555} {"train_loss": -11.65768814086914, "global_step": 261267, "epoch": 1555} {"train_loss": -11.896894454956055, "global_step": 261268, "epoch": 1555} {"train_loss": -11.670616149902344, "global_step": 261269, "epoch": 1555} {"train_loss": -11.477795600891113, "global_step": 261270, "epoch": 1555} {"train_loss": -11.927570343017578, "global_step": 261271, "epoch": 1555} {"train_loss": -11.567789077758789, "global_step": 261272, "epoch": 1555} {"train_loss": -11.806706428527832, "global_step": 261273, "epoch": 1555} {"train_loss": -11.922027587890625, "global_step": 261274, "epoch": 1555} {"train_loss": -11.866089820861816, "global_step": 261275, "epoch": 1555} {"train_loss": -12.047361373901367, "global_step": 261276, "epoch": 1555} {"train_loss": -11.45943832397461, "global_step": 261277, "epoch": 1555} {"train_loss": -11.98836898803711, "global_step": 261278, "epoch": 1555} {"train_loss": -11.724931716918945, "global_step": 261279, "epoch": 1555} {"train_loss": -12.108160972595215, "global_step": 261280, "epoch": 1555} {"train_loss": -11.591348648071289, "global_step": 261281, "epoch": 1555} {"train_loss": -11.763383865356445, "global_step": 261282, "epoch": 1555} {"train_loss": -12.003583908081055, "global_step": 261283, "epoch": 1555} {"train_loss": -11.641595840454102, "global_step": 261284, "epoch": 1555} {"train_loss": -11.887701034545898, "global_step": 261285, "epoch": 1555} {"train_loss": -11.88371753692627, "global_step": 261286, "epoch": 1555} {"train_loss": -11.769647598266602, "global_step": 261287, "epoch": 1555} {"train_loss": -11.610573768615723, "global_step": 261288, "epoch": 1555} {"train_loss": -12.198432922363281, "global_step": 261289, "epoch": 1555} {"train_loss": -11.678546905517578, "global_step": 261290, "epoch": 1555} {"train_loss": -11.727380752563477, "global_step": 261291, "epoch": 1555} {"train_loss": -11.90009880065918, "global_step": 261292, "epoch": 1555} {"train_loss": -12.114870071411133, "global_step": 261293, "epoch": 1555} {"train_loss": -12.010122299194336, "global_step": 261294, "epoch": 1555} {"train_loss": -12.193778991699219, "global_step": 261295, "epoch": 1555} {"train_loss": -12.010993003845215, "global_step": 261296, "epoch": 1555} {"train_loss": -12.0260591506958, "global_step": 261297, "epoch": 1555} {"train_loss": -12.080354690551758, "global_step": 261298, "epoch": 1555} {"train_loss": -11.8322172164917, "global_step": 261299, "epoch": 1555} {"train_loss": -11.732441902160645, "global_step": 261300, "epoch": 1555} {"train_loss": -11.470390319824219, "global_step": 261301, "epoch": 1555} {"train_loss": -12.130075454711914, "global_step": 261302, "epoch": 1555} {"train_loss": -11.527620315551758, "global_step": 261303, "epoch": 1555} {"train_loss": -12.012619018554688, "global_step": 261304, "epoch": 1555} {"train_loss": -11.893325805664062, "global_step": 261305, "epoch": 1555} {"train_loss": -11.167105674743652, "global_step": 261306, "epoch": 1555} {"train_loss": -11.616788864135742, "global_step": 261307, "epoch": 1555} {"train_loss": -11.570413589477539, "global_step": 261308, "epoch": 1555} {"train_loss": -11.88128662109375, "global_step": 261309, "epoch": 1555} {"train_loss": -11.621378898620605, "global_step": 261310, "epoch": 1555} {"train_loss": -11.547233581542969, "global_step": 261311, "epoch": 1555} {"train_loss": -11.87672233581543, "global_step": 261312, "epoch": 1555} {"train_loss": -11.785940170288086, "global_step": 261313, "epoch": 1555} {"train_loss": -11.782642364501953, "global_step": 261314, "epoch": 1555} {"train_loss": -12.162633895874023, "global_step": 261315, "epoch": 1555} {"train_loss": -11.981855392456055, "global_step": 261316, "epoch": 1555} {"train_loss": -11.991564750671387, "global_step": 261317, "epoch": 1555} {"train_loss": -12.011756896972656, "global_step": 261318, "epoch": 1555} {"train_loss": -11.805435180664062, "global_step": 261319, "epoch": 1555} {"train_loss": -12.026835441589355, "global_step": 261320, "epoch": 1555} {"train_loss": -11.966085433959961, "global_step": 261321, "epoch": 1555} {"train_loss": -11.815771102905273, "global_step": 261322, "epoch": 1555} {"train_loss": -11.599920272827148, "global_step": 261323, "epoch": 1555} {"train_loss": -12.161530494689941, "global_step": 261324, "epoch": 1555} {"train_loss": -11.83288860321045, "global_step": 261325, "epoch": 1555} {"train_loss": -11.832390785217285, "global_step": 261326, "epoch": 1555} {"train_loss": -12.030012130737305, "global_step": 261327, "epoch": 1555} {"train_loss": -11.459235191345215, "global_step": 261328, "epoch": 1555} {"train_loss": -11.753576278686523, "global_step": 261329, "epoch": 1555} {"train_loss": -11.926192283630371, "global_step": 261330, "epoch": 1555} {"train_loss": -11.88205623626709, "global_step": 261331, "epoch": 1555} {"train_loss": -12.137676239013672, "global_step": 261332, "epoch": 1555} {"train_loss": -12.212713241577148, "global_step": 261333, "epoch": 1555} {"train_loss": -11.95195484161377, "global_step": 261334, "epoch": 1555} {"train_loss": -12.155630111694336, "global_step": 261335, "epoch": 1555} {"train_loss": -11.826703071594238, "global_step": 261336, "epoch": 1555} {"train_loss": -12.047633171081543, "global_step": 261337, "epoch": 1555} {"train_loss": -12.106374740600586, "global_step": 261338, "epoch": 1555} {"train_loss": -12.239744186401367, "global_step": 261339, "epoch": 1555} {"train_loss": -11.823820114135742, "global_step": 261340, "epoch": 1555} {"train_loss": -11.71681022644043, "global_step": 261341, "epoch": 1555} {"train_loss": -11.773395538330078, "global_step": 261342, "epoch": 1555} {"train_loss": -12.104391098022461, "global_step": 261343, "epoch": 1555} {"train_loss": -11.648345947265625, "global_step": 261344, "epoch": 1555} {"train_loss": -10.124321937561035, "global_step": 261345, "epoch": 1555} {"train_loss": -11.13534164428711, "global_step": 261346, "epoch": 1555} {"train_loss": -11.635710716247559, "global_step": 261347, "epoch": 1555} {"train_loss": -9.343727111816406, "global_step": 261348, "epoch": 1555} {"train_loss": -11.390559196472168, "global_step": 261349, "epoch": 1555} {"train_loss": -11.089066505432129, "global_step": 261350, "epoch": 1555} {"train_loss": -10.499756813049316, "global_step": 261351, "epoch": 1555} {"train_loss": -11.643187522888184, "global_step": 261352, "epoch": 1555} {"train_loss": -10.486093521118164, "global_step": 261353, "epoch": 1555} {"train_loss": -11.176454544067383, "global_step": 261354, "epoch": 1555} {"train_loss": -10.044231414794922, "global_step": 261355, "epoch": 1555} {"train_loss": -10.954105377197266, "global_step": 261356, "epoch": 1555} {"train_loss": -10.052894592285156, "global_step": 261357, "epoch": 1555} {"train_loss": -9.366249084472656, "global_step": 261358, "epoch": 1555} {"train_loss": -10.152130126953125, "global_step": 261359, "epoch": 1555} {"train_loss": -10.705765724182129, "global_step": 261360, "epoch": 1555} {"train_loss": -10.31684684753418, "global_step": 261361, "epoch": 1555} {"train_loss": -9.824777603149414, "global_step": 261362, "epoch": 1555} {"train_loss": -10.845852851867676, "global_step": 261363, "epoch": 1555} {"train_loss": -10.325765609741211, "global_step": 261364, "epoch": 1555} {"train_loss": -11.523704528808594, "global_step": 261365, "epoch": 1555} {"train_loss": -11.223462104797363, "global_step": 261366, "epoch": 1555} {"train_loss": -11.346822738647461, "global_step": 261367, "epoch": 1555} {"train_loss": -11.559062957763672, "global_step": 261368, "epoch": 1555} {"train_loss": -10.544137954711914, "global_step": 261369, "epoch": 1555} {"train_loss": -11.463937759399414, "global_step": 261370, "epoch": 1555} {"train_loss": -11.593256950378418, "global_step": 261371, "epoch": 1555} {"train_loss": -11.20478343963623, "global_step": 261372, "epoch": 1555} {"train_loss": -11.646480560302734, "global_step": 261373, "epoch": 1555} {"train_loss": -11.046088218688965, "global_step": 261374, "epoch": 1555} {"train_loss": -11.87210464477539, "global_step": 261375, "epoch": 1555} {"train_loss": -11.61050033569336, "global_step": 261376, "epoch": 1555} {"train_loss": -11.840015411376953, "global_step": 261377, "epoch": 1555} {"train_loss": -11.827555656433105, "global_step": 261378, "epoch": 1555} {"train_loss": -11.63637924194336, "global_step": 261379, "epoch": 1555} {"train_loss": -11.692398071289062, "global_step": 261380, "epoch": 1555} {"train_loss": -11.558915138244629, "global_step": 261381, "epoch": 1555} {"train_loss": -11.856083869934082, "global_step": 261382, "epoch": 1555} {"train_loss": -11.632574081420898, "global_step": 261383, "epoch": 1555} {"train_loss": -11.538814544677734, "global_step": 261384, "epoch": 1555} {"train_loss": -11.666184425354004, "global_step": 261385, "epoch": 1555} {"train_loss": -11.59695053100586, "global_step": 261386, "epoch": 1555} {"train_loss": -11.808660507202148, "global_step": 261387, "epoch": 1555} {"train_loss": -11.724547386169434, "global_step": 261388, "epoch": 1555} {"train_loss": -11.942628860473633, "global_step": 261389, "epoch": 1555} {"train_loss": -11.830886840820312, "global_step": 261390, "epoch": 1555} {"train_loss": -11.711336135864258, "global_step": 261391, "epoch": 1555} {"train_loss": -12.110143661499023, "global_step": 261392, "epoch": 1555} {"train_loss": -11.470146179199219, "global_step": 261393, "epoch": 1555} {"train_loss": -11.929254531860352, "global_step": 261394, "epoch": 1555} {"train_loss": -11.76035213470459, "global_step": 261395, "epoch": 1555} {"train_loss": -11.699216842651367, "global_step": 261396, "epoch": 1555} {"train_loss": -11.486862182617188, "global_step": 261397, "epoch": 1555} {"train_loss": -11.536683082580566, "global_step": 261398, "epoch": 1555} {"train_loss": -11.757572174072266, "global_step": 261399, "epoch": 1555} {"train_loss": -11.555463790893555, "global_step": 261400, "epoch": 1555} {"train_loss": -11.59182357788086, "global_step": 261401, "epoch": 1555} {"train_loss": -11.658348083496094, "global_step": 261402, "epoch": 1555} {"train_loss": -11.010807037353516, "global_step": 261403, "epoch": 1555} {"train_loss": -10.560707092285156, "global_step": 261404, "epoch": 1555} {"train_loss": -11.27717399597168, "global_step": 261405, "epoch": 1555} {"train_loss": -10.894034385681152, "global_step": 261406, "epoch": 1555} {"train_loss": -11.581476484026227, "global_step": 261407, "epoch": 1555, "val_loss": 271051.875, "train_action_mse_error": 4.188928127288818} {"train_loss": -11.67180347442627, "global_step": 261408, "epoch": 1556} {"train_loss": -11.143000602722168, "global_step": 261409, "epoch": 1556} {"train_loss": -11.852654457092285, "global_step": 261410, "epoch": 1556} {"train_loss": -10.981910705566406, "global_step": 261411, "epoch": 1556} {"train_loss": -11.227155685424805, "global_step": 261412, "epoch": 1556} {"train_loss": -11.484064102172852, "global_step": 261413, "epoch": 1556} {"train_loss": -10.96182918548584, "global_step": 261414, "epoch": 1556} {"train_loss": -11.009008407592773, "global_step": 261415, "epoch": 1556} {"train_loss": -10.777128219604492, "global_step": 261416, "epoch": 1556} {"train_loss": -11.13989543914795, "global_step": 261417, "epoch": 1556} {"train_loss": -11.614156723022461, "global_step": 261418, "epoch": 1556} {"train_loss": -11.44891357421875, "global_step": 261419, "epoch": 1556} {"train_loss": -11.219152450561523, "global_step": 261420, "epoch": 1556} {"train_loss": -11.645841598510742, "global_step": 261421, "epoch": 1556} {"train_loss": -11.501558303833008, "global_step": 261422, "epoch": 1556} {"train_loss": -11.46623420715332, "global_step": 261423, "epoch": 1556} {"train_loss": -11.568075180053711, "global_step": 261424, "epoch": 1556} {"train_loss": -11.551032066345215, "global_step": 261425, "epoch": 1556} {"train_loss": -10.822280883789062, "global_step": 261426, "epoch": 1556} {"train_loss": -11.4432373046875, "global_step": 261427, "epoch": 1556} {"train_loss": -10.880047798156738, "global_step": 261428, "epoch": 1556} {"train_loss": -11.78026008605957, "global_step": 261429, "epoch": 1556} {"train_loss": -11.091178894042969, "global_step": 261430, "epoch": 1556} {"train_loss": -11.78730583190918, "global_step": 261431, "epoch": 1556} {"train_loss": -11.681949615478516, "global_step": 261432, "epoch": 1556} {"train_loss": -11.569278717041016, "global_step": 261433, "epoch": 1556} {"train_loss": -11.540094375610352, "global_step": 261434, "epoch": 1556} {"train_loss": -11.672423362731934, "global_step": 261435, "epoch": 1556} {"train_loss": -11.782270431518555, "global_step": 261436, "epoch": 1556} {"train_loss": -11.671548843383789, "global_step": 261437, "epoch": 1556} {"train_loss": -11.580780029296875, "global_step": 261438, "epoch": 1556} {"train_loss": -11.799535751342773, "global_step": 261439, "epoch": 1556} {"train_loss": -11.598345756530762, "global_step": 261440, "epoch": 1556} {"train_loss": -11.962318420410156, "global_step": 261441, "epoch": 1556} {"train_loss": -11.555509567260742, "global_step": 261442, "epoch": 1556} {"train_loss": -11.970847129821777, "global_step": 261443, "epoch": 1556} {"train_loss": -12.070889472961426, "global_step": 261444, "epoch": 1556} {"train_loss": -11.782960891723633, "global_step": 261445, "epoch": 1556} {"train_loss": -12.058713912963867, "global_step": 261446, "epoch": 1556} {"train_loss": -11.95168399810791, "global_step": 261447, "epoch": 1556} {"train_loss": -11.885177612304688, "global_step": 261448, "epoch": 1556} {"train_loss": -12.063348770141602, "global_step": 261449, "epoch": 1556} {"train_loss": -12.19584846496582, "global_step": 261450, "epoch": 1556} {"train_loss": -12.005600929260254, "global_step": 261451, "epoch": 1556} {"train_loss": -12.076471328735352, "global_step": 261452, "epoch": 1556} {"train_loss": -11.995052337646484, "global_step": 261453, "epoch": 1556} {"train_loss": -11.84117317199707, "global_step": 261454, "epoch": 1556} {"train_loss": -11.855493545532227, "global_step": 261455, "epoch": 1556} {"train_loss": -12.069429397583008, "global_step": 261456, "epoch": 1556} {"train_loss": -11.850849151611328, "global_step": 261457, "epoch": 1556} {"train_loss": -12.032987594604492, "global_step": 261458, "epoch": 1556} {"train_loss": -12.03609848022461, "global_step": 261459, "epoch": 1556} {"train_loss": -12.02918529510498, "global_step": 261460, "epoch": 1556} {"train_loss": -12.27018928527832, "global_step": 261461, "epoch": 1556} {"train_loss": -12.0639009475708, "global_step": 261462, "epoch": 1556} {"train_loss": -12.170906066894531, "global_step": 261463, "epoch": 1556} {"train_loss": -12.158781051635742, "global_step": 261464, "epoch": 1556} {"train_loss": -12.299760818481445, "global_step": 261465, "epoch": 1556} {"train_loss": -12.274925231933594, "global_step": 261466, "epoch": 1556} {"train_loss": -12.23036003112793, "global_step": 261467, "epoch": 1556} {"train_loss": -12.273674011230469, "global_step": 261468, "epoch": 1556} {"train_loss": -12.042999267578125, "global_step": 261469, "epoch": 1556} {"train_loss": -12.214982986450195, "global_step": 261470, "epoch": 1556} {"train_loss": -12.099056243896484, "global_step": 261471, "epoch": 1556} {"train_loss": -11.787181854248047, "global_step": 261472, "epoch": 1556} {"train_loss": -11.476999282836914, "global_step": 261473, "epoch": 1556} {"train_loss": -12.274430274963379, "global_step": 261474, "epoch": 1556} {"train_loss": -11.738919258117676, "global_step": 261475, "epoch": 1556} {"train_loss": -11.656846046447754, "global_step": 261476, "epoch": 1556} {"train_loss": -12.260404586791992, "global_step": 261477, "epoch": 1556} {"train_loss": -11.698887825012207, "global_step": 261478, "epoch": 1556} {"train_loss": -11.464564323425293, "global_step": 261479, "epoch": 1556} {"train_loss": -12.085451126098633, "global_step": 261480, "epoch": 1556} {"train_loss": -12.138601303100586, "global_step": 261481, "epoch": 1556} {"train_loss": -11.635976791381836, "global_step": 261482, "epoch": 1556} {"train_loss": -12.280797004699707, "global_step": 261483, "epoch": 1556} {"train_loss": -11.909578323364258, "global_step": 261484, "epoch": 1556} {"train_loss": -11.907333374023438, "global_step": 261485, "epoch": 1556} {"train_loss": -11.994241714477539, "global_step": 261486, "epoch": 1556} {"train_loss": -11.806220054626465, "global_step": 261487, "epoch": 1556} {"train_loss": -11.538827896118164, "global_step": 261488, "epoch": 1556} {"train_loss": -11.8499116897583, "global_step": 261489, "epoch": 1556} {"train_loss": -12.180789947509766, "global_step": 261490, "epoch": 1556} {"train_loss": -12.28249740600586, "global_step": 261491, "epoch": 1556} {"train_loss": -11.669468879699707, "global_step": 261492, "epoch": 1556} {"train_loss": -10.943717956542969, "global_step": 261493, "epoch": 1556} {"train_loss": -11.517459869384766, "global_step": 261494, "epoch": 1556} {"train_loss": -11.780609130859375, "global_step": 261495, "epoch": 1556} {"train_loss": -12.067720413208008, "global_step": 261496, "epoch": 1556} {"train_loss": -11.88027572631836, "global_step": 261497, "epoch": 1556} {"train_loss": -12.313624382019043, "global_step": 261498, "epoch": 1556} {"train_loss": -11.516056060791016, "global_step": 261499, "epoch": 1556} {"train_loss": -11.413588523864746, "global_step": 261500, "epoch": 1556} {"train_loss": -11.882287979125977, "global_step": 261501, "epoch": 1556} {"train_loss": -11.81024169921875, "global_step": 261502, "epoch": 1556} {"train_loss": -10.797042846679688, "global_step": 261503, "epoch": 1556} {"train_loss": -11.432209014892578, "global_step": 261504, "epoch": 1556} {"train_loss": -11.890127182006836, "global_step": 261505, "epoch": 1556} {"train_loss": -10.794392585754395, "global_step": 261506, "epoch": 1556} {"train_loss": -11.655851364135742, "global_step": 261507, "epoch": 1556} {"train_loss": -10.692113876342773, "global_step": 261508, "epoch": 1556} {"train_loss": -11.546541213989258, "global_step": 261509, "epoch": 1556} {"train_loss": -11.041013717651367, "global_step": 261510, "epoch": 1556} {"train_loss": -10.639068603515625, "global_step": 261511, "epoch": 1556} {"train_loss": -11.353984832763672, "global_step": 261512, "epoch": 1556} {"train_loss": -11.0132474899292, "global_step": 261513, "epoch": 1556} {"train_loss": -11.104837417602539, "global_step": 261514, "epoch": 1556} {"train_loss": -11.65331745147705, "global_step": 261515, "epoch": 1556} {"train_loss": -10.625267028808594, "global_step": 261516, "epoch": 1556} {"train_loss": -11.671697616577148, "global_step": 261517, "epoch": 1556} {"train_loss": -10.477058410644531, "global_step": 261518, "epoch": 1556} {"train_loss": -11.463119506835938, "global_step": 261519, "epoch": 1556} {"train_loss": -11.002824783325195, "global_step": 261520, "epoch": 1556} {"train_loss": -10.606056213378906, "global_step": 261521, "epoch": 1556} {"train_loss": -11.725788116455078, "global_step": 261522, "epoch": 1556} {"train_loss": -10.819511413574219, "global_step": 261523, "epoch": 1556} {"train_loss": -11.768543243408203, "global_step": 261524, "epoch": 1556} {"train_loss": -10.350019454956055, "global_step": 261525, "epoch": 1556} {"train_loss": -11.718847274780273, "global_step": 261526, "epoch": 1556} {"train_loss": -11.059194564819336, "global_step": 261527, "epoch": 1556} {"train_loss": -11.063003540039062, "global_step": 261528, "epoch": 1556} {"train_loss": -11.467243194580078, "global_step": 261529, "epoch": 1556} {"train_loss": -11.25641918182373, "global_step": 261530, "epoch": 1556} {"train_loss": -11.657005310058594, "global_step": 261531, "epoch": 1556} {"train_loss": -11.617576599121094, "global_step": 261532, "epoch": 1556} {"train_loss": -11.61166000366211, "global_step": 261533, "epoch": 1556} {"train_loss": -11.7496976852417, "global_step": 261534, "epoch": 1556} {"train_loss": -11.857919692993164, "global_step": 261535, "epoch": 1556} {"train_loss": -11.650449752807617, "global_step": 261536, "epoch": 1556} {"train_loss": -11.893620491027832, "global_step": 261537, "epoch": 1556} {"train_loss": -11.989055633544922, "global_step": 261538, "epoch": 1556} {"train_loss": -11.84638500213623, "global_step": 261539, "epoch": 1556} {"train_loss": -11.990659713745117, "global_step": 261540, "epoch": 1556} {"train_loss": -11.984842300415039, "global_step": 261541, "epoch": 1556} {"train_loss": -11.807854652404785, "global_step": 261542, "epoch": 1556} {"train_loss": -12.033628463745117, "global_step": 261543, "epoch": 1556} {"train_loss": -12.016201972961426, "global_step": 261544, "epoch": 1556} {"train_loss": -11.91960620880127, "global_step": 261545, "epoch": 1556} {"train_loss": -11.89619255065918, "global_step": 261546, "epoch": 1556} {"train_loss": -11.9918794631958, "global_step": 261547, "epoch": 1556} {"train_loss": -11.789974212646484, "global_step": 261548, "epoch": 1556} {"train_loss": -12.018946647644043, "global_step": 261549, "epoch": 1556} {"train_loss": -11.876157760620117, "global_step": 261550, "epoch": 1556} {"train_loss": -12.062276840209961, "global_step": 261551, "epoch": 1556} {"train_loss": -12.115402221679688, "global_step": 261552, "epoch": 1556} {"train_loss": -11.932952880859375, "global_step": 261553, "epoch": 1556} {"train_loss": -12.164793968200684, "global_step": 261554, "epoch": 1556} {"train_loss": -11.97366714477539, "global_step": 261555, "epoch": 1556} {"train_loss": -12.240764617919922, "global_step": 261556, "epoch": 1556} {"train_loss": -12.047693252563477, "global_step": 261557, "epoch": 1556} {"train_loss": -11.749159812927246, "global_step": 261558, "epoch": 1556} {"train_loss": -12.178339958190918, "global_step": 261559, "epoch": 1556} {"train_loss": -11.423890113830566, "global_step": 261560, "epoch": 1556} {"train_loss": -12.13798713684082, "global_step": 261561, "epoch": 1556} {"train_loss": -11.519115447998047, "global_step": 261562, "epoch": 1556} {"train_loss": -12.253326416015625, "global_step": 261563, "epoch": 1556} {"train_loss": -11.761781692504883, "global_step": 261564, "epoch": 1556} {"train_loss": -12.055292129516602, "global_step": 261565, "epoch": 1556} {"train_loss": -11.98072338104248, "global_step": 261566, "epoch": 1556} {"train_loss": -11.987913131713867, "global_step": 261567, "epoch": 1556} {"train_loss": -12.271870613098145, "global_step": 261568, "epoch": 1556} {"train_loss": -11.984416961669922, "global_step": 261569, "epoch": 1556} {"train_loss": -12.060537338256836, "global_step": 261570, "epoch": 1556} {"train_loss": -12.060796737670898, "global_step": 261571, "epoch": 1556} {"train_loss": -12.18202018737793, "global_step": 261572, "epoch": 1556} {"train_loss": -12.212915420532227, "global_step": 261573, "epoch": 1556} {"train_loss": -12.029661178588867, "global_step": 261574, "epoch": 1556} {"train_loss": -11.71100572177342, "global_step": 261575, "epoch": 1556, "val_loss": 271372.59375} {"train_loss": -12.332947731018066, "global_step": 261576, "epoch": 1557} {"train_loss": -12.134047508239746, "global_step": 261577, "epoch": 1557} {"train_loss": -12.221078872680664, "global_step": 261578, "epoch": 1557} {"train_loss": -12.157310485839844, "global_step": 261579, "epoch": 1557} {"train_loss": -12.377817153930664, "global_step": 261580, "epoch": 1557} {"train_loss": -11.978858947753906, "global_step": 261581, "epoch": 1557} {"train_loss": -11.792221069335938, "global_step": 261582, "epoch": 1557} {"train_loss": -11.823038101196289, "global_step": 261583, "epoch": 1557} {"train_loss": -11.790451049804688, "global_step": 261584, "epoch": 1557} {"train_loss": -10.883115768432617, "global_step": 261585, "epoch": 1557} {"train_loss": -11.061689376831055, "global_step": 261586, "epoch": 1557} {"train_loss": -11.275018692016602, "global_step": 261587, "epoch": 1557} {"train_loss": -11.81994915008545, "global_step": 261588, "epoch": 1557} {"train_loss": -11.060885429382324, "global_step": 261589, "epoch": 1557} {"train_loss": -11.417458534240723, "global_step": 261590, "epoch": 1557} {"train_loss": -11.32781982421875, "global_step": 261591, "epoch": 1557} {"train_loss": -11.680452346801758, "global_step": 261592, "epoch": 1557} {"train_loss": -10.69675064086914, "global_step": 261593, "epoch": 1557} {"train_loss": -12.005712509155273, "global_step": 261594, "epoch": 1557} {"train_loss": -10.340213775634766, "global_step": 261595, "epoch": 1557} {"train_loss": -11.119264602661133, "global_step": 261596, "epoch": 1557} {"train_loss": -11.322751998901367, "global_step": 261597, "epoch": 1557} {"train_loss": -11.891361236572266, "global_step": 261598, "epoch": 1557} {"train_loss": -11.675680160522461, "global_step": 261599, "epoch": 1557} {"train_loss": -11.496922492980957, "global_step": 261600, "epoch": 1557} {"train_loss": -11.950971603393555, "global_step": 261601, "epoch": 1557} {"train_loss": -10.357549667358398, "global_step": 261602, "epoch": 1557} {"train_loss": -11.329582214355469, "global_step": 261603, "epoch": 1557} {"train_loss": -11.738550186157227, "global_step": 261604, "epoch": 1557} {"train_loss": -11.31884479522705, "global_step": 261605, "epoch": 1557} {"train_loss": -11.6077880859375, "global_step": 261606, "epoch": 1557} {"train_loss": -11.934316635131836, "global_step": 261607, "epoch": 1557} {"train_loss": -11.871798515319824, "global_step": 261608, "epoch": 1557} {"train_loss": -11.604775428771973, "global_step": 261609, "epoch": 1557} {"train_loss": -11.727705001831055, "global_step": 261610, "epoch": 1557} {"train_loss": -11.836431503295898, "global_step": 261611, "epoch": 1557} {"train_loss": -11.616851806640625, "global_step": 261612, "epoch": 1557} {"train_loss": -11.605903625488281, "global_step": 261613, "epoch": 1557} {"train_loss": -11.820266723632812, "global_step": 261614, "epoch": 1557} {"train_loss": -11.646892547607422, "global_step": 261615, "epoch": 1557} {"train_loss": -11.56416130065918, "global_step": 261616, "epoch": 1557} {"train_loss": -11.807522773742676, "global_step": 261617, "epoch": 1557} {"train_loss": -11.717405319213867, "global_step": 261618, "epoch": 1557} {"train_loss": -11.70463752746582, "global_step": 261619, "epoch": 1557} {"train_loss": -11.89466381072998, "global_step": 261620, "epoch": 1557} {"train_loss": -11.307894706726074, "global_step": 261621, "epoch": 1557} {"train_loss": -11.731950759887695, "global_step": 261622, "epoch": 1557} {"train_loss": -12.024029731750488, "global_step": 261623, "epoch": 1557} {"train_loss": -11.675997734069824, "global_step": 261624, "epoch": 1557} {"train_loss": -11.873800277709961, "global_step": 261625, "epoch": 1557} {"train_loss": -12.098865509033203, "global_step": 261626, "epoch": 1557} {"train_loss": -11.662925720214844, "global_step": 261627, "epoch": 1557} {"train_loss": -11.727825164794922, "global_step": 261628, "epoch": 1557} {"train_loss": -11.811691284179688, "global_step": 261629, "epoch": 1557} {"train_loss": -11.471567153930664, "global_step": 261630, "epoch": 1557} {"train_loss": -12.076921463012695, "global_step": 261631, "epoch": 1557} {"train_loss": -11.70649528503418, "global_step": 261632, "epoch": 1557} {"train_loss": -11.189852714538574, "global_step": 261633, "epoch": 1557} {"train_loss": -11.532529830932617, "global_step": 261634, "epoch": 1557} {"train_loss": -11.473950386047363, "global_step": 261635, "epoch": 1557} {"train_loss": -11.193249702453613, "global_step": 261636, "epoch": 1557} {"train_loss": -12.005146026611328, "global_step": 261637, "epoch": 1557} {"train_loss": -11.279119491577148, "global_step": 261638, "epoch": 1557} {"train_loss": -11.596524238586426, "global_step": 261639, "epoch": 1557} {"train_loss": -11.504924774169922, "global_step": 261640, "epoch": 1557} {"train_loss": -11.269627571105957, "global_step": 261641, "epoch": 1557} {"train_loss": -11.62816047668457, "global_step": 261642, "epoch": 1557} {"train_loss": -11.609334945678711, "global_step": 261643, "epoch": 1557} {"train_loss": -11.277685165405273, "global_step": 261644, "epoch": 1557} {"train_loss": -11.437901496887207, "global_step": 261645, "epoch": 1557} {"train_loss": -11.644558906555176, "global_step": 261646, "epoch": 1557} {"train_loss": -11.637482643127441, "global_step": 261647, "epoch": 1557} {"train_loss": -11.713687896728516, "global_step": 261648, "epoch": 1557} {"train_loss": -11.326772689819336, "global_step": 261649, "epoch": 1557} {"train_loss": -11.723875045776367, "global_step": 261650, "epoch": 1557} {"train_loss": -11.755799293518066, "global_step": 261651, "epoch": 1557} {"train_loss": -11.2928466796875, "global_step": 261652, "epoch": 1557} {"train_loss": -11.59945297241211, "global_step": 261653, "epoch": 1557} {"train_loss": -11.878442764282227, "global_step": 261654, "epoch": 1557} {"train_loss": -11.668952941894531, "global_step": 261655, "epoch": 1557} {"train_loss": -11.190994262695312, "global_step": 261656, "epoch": 1557} {"train_loss": -11.504999160766602, "global_step": 261657, "epoch": 1557} {"train_loss": -11.725367546081543, "global_step": 261658, "epoch": 1557} {"train_loss": -11.634220123291016, "global_step": 261659, "epoch": 1557} {"train_loss": -11.854089736938477, "global_step": 261660, "epoch": 1557} {"train_loss": -11.58705997467041, "global_step": 261661, "epoch": 1557} {"train_loss": -11.653478622436523, "global_step": 261662, "epoch": 1557} {"train_loss": -11.568130493164062, "global_step": 261663, "epoch": 1557} {"train_loss": -10.886396408081055, "global_step": 261664, "epoch": 1557} {"train_loss": -11.925437927246094, "global_step": 261665, "epoch": 1557} {"train_loss": -11.065614700317383, "global_step": 261666, "epoch": 1557} {"train_loss": -10.78037166595459, "global_step": 261667, "epoch": 1557} {"train_loss": -12.092567443847656, "global_step": 261668, "epoch": 1557} {"train_loss": -10.869366645812988, "global_step": 261669, "epoch": 1557} {"train_loss": -11.109954833984375, "global_step": 261670, "epoch": 1557} {"train_loss": -10.533306121826172, "global_step": 261671, "epoch": 1557} {"train_loss": -11.098344802856445, "global_step": 261672, "epoch": 1557} {"train_loss": -9.97378158569336, "global_step": 261673, "epoch": 1557} {"train_loss": -11.073179244995117, "global_step": 261674, "epoch": 1557} {"train_loss": -10.896421432495117, "global_step": 261675, "epoch": 1557} {"train_loss": -10.156173706054688, "global_step": 261676, "epoch": 1557} {"train_loss": -11.122665405273438, "global_step": 261677, "epoch": 1557} {"train_loss": -11.045219421386719, "global_step": 261678, "epoch": 1557} {"train_loss": -9.532432556152344, "global_step": 261679, "epoch": 1557} {"train_loss": -11.829795837402344, "global_step": 261680, "epoch": 1557} {"train_loss": -10.7689208984375, "global_step": 261681, "epoch": 1557} {"train_loss": -11.00418472290039, "global_step": 261682, "epoch": 1557} {"train_loss": -11.453784942626953, "global_step": 261683, "epoch": 1557} {"train_loss": -10.80238151550293, "global_step": 261684, "epoch": 1557} {"train_loss": -11.004364013671875, "global_step": 261685, "epoch": 1557} {"train_loss": -11.447235107421875, "global_step": 261686, "epoch": 1557} {"train_loss": -11.06529426574707, "global_step": 261687, "epoch": 1557} {"train_loss": -11.649065017700195, "global_step": 261688, "epoch": 1557} {"train_loss": -11.303974151611328, "global_step": 261689, "epoch": 1557} {"train_loss": -11.179370880126953, "global_step": 261690, "epoch": 1557} {"train_loss": -11.699125289916992, "global_step": 261691, "epoch": 1557} {"train_loss": -11.155377388000488, "global_step": 261692, "epoch": 1557} {"train_loss": -11.443113327026367, "global_step": 261693, "epoch": 1557} {"train_loss": -11.416980743408203, "global_step": 261694, "epoch": 1557} {"train_loss": -11.288063049316406, "global_step": 261695, "epoch": 1557} {"train_loss": -11.530906677246094, "global_step": 261696, "epoch": 1557} {"train_loss": -11.39940071105957, "global_step": 261697, "epoch": 1557} {"train_loss": -11.295909881591797, "global_step": 261698, "epoch": 1557} {"train_loss": -11.421136856079102, "global_step": 261699, "epoch": 1557} {"train_loss": -11.532817840576172, "global_step": 261700, "epoch": 1557} {"train_loss": -11.33491325378418, "global_step": 261701, "epoch": 1557} {"train_loss": -11.503881454467773, "global_step": 261702, "epoch": 1557} {"train_loss": -11.646936416625977, "global_step": 261703, "epoch": 1557} {"train_loss": -11.186114311218262, "global_step": 261704, "epoch": 1557} {"train_loss": -11.922504425048828, "global_step": 261705, "epoch": 1557} {"train_loss": -11.398935317993164, "global_step": 261706, "epoch": 1557} {"train_loss": -11.698335647583008, "global_step": 261707, "epoch": 1557} {"train_loss": -11.713223457336426, "global_step": 261708, "epoch": 1557} {"train_loss": -11.674579620361328, "global_step": 261709, "epoch": 1557} {"train_loss": -11.572141647338867, "global_step": 261710, "epoch": 1557} {"train_loss": -11.801197052001953, "global_step": 261711, "epoch": 1557} {"train_loss": -11.872706413269043, "global_step": 261712, "epoch": 1557} {"train_loss": -11.826667785644531, "global_step": 261713, "epoch": 1557} {"train_loss": -11.946656227111816, "global_step": 261714, "epoch": 1557} {"train_loss": -11.449031829833984, "global_step": 261715, "epoch": 1557} {"train_loss": -11.717793464660645, "global_step": 261716, "epoch": 1557} {"train_loss": -11.856597900390625, "global_step": 261717, "epoch": 1557} {"train_loss": -11.61181926727295, "global_step": 261718, "epoch": 1557} {"train_loss": -11.968050003051758, "global_step": 261719, "epoch": 1557} {"train_loss": -11.73048210144043, "global_step": 261720, "epoch": 1557} {"train_loss": -11.919252395629883, "global_step": 261721, "epoch": 1557} {"train_loss": -11.824390411376953, "global_step": 261722, "epoch": 1557} {"train_loss": -11.944160461425781, "global_step": 261723, "epoch": 1557} {"train_loss": -11.730395317077637, "global_step": 261724, "epoch": 1557} {"train_loss": -11.760026931762695, "global_step": 261725, "epoch": 1557} {"train_loss": -11.097607612609863, "global_step": 261726, "epoch": 1557} {"train_loss": -11.846060752868652, "global_step": 261727, "epoch": 1557} {"train_loss": -11.270071029663086, "global_step": 261728, "epoch": 1557} {"train_loss": -11.766510009765625, "global_step": 261729, "epoch": 1557} {"train_loss": -11.436695098876953, "global_step": 261730, "epoch": 1557} {"train_loss": -12.086463928222656, "global_step": 261731, "epoch": 1557} {"train_loss": -11.612971305847168, "global_step": 261732, "epoch": 1557} {"train_loss": -11.558334350585938, "global_step": 261733, "epoch": 1557} {"train_loss": -11.863384246826172, "global_step": 261734, "epoch": 1557} {"train_loss": -11.752544403076172, "global_step": 261735, "epoch": 1557} {"train_loss": -11.669513702392578, "global_step": 261736, "epoch": 1557} {"train_loss": -12.067699432373047, "global_step": 261737, "epoch": 1557} {"train_loss": -11.95174789428711, "global_step": 261738, "epoch": 1557} {"train_loss": -11.811485290527344, "global_step": 261739, "epoch": 1557} {"train_loss": -11.87421989440918, "global_step": 261740, "epoch": 1557} {"train_loss": -11.987523078918457, "global_step": 261741, "epoch": 1557} {"train_loss": -12.003141403198242, "global_step": 261742, "epoch": 1557} {"train_loss": -11.532807060650416, "global_step": 261743, "epoch": 1557, "val_loss": 272825.9375} {"train_loss": -12.072997093200684, "global_step": 261744, "epoch": 1558} {"train_loss": -11.844478607177734, "global_step": 261745, "epoch": 1558} {"train_loss": -12.111042022705078, "global_step": 261746, "epoch": 1558} {"train_loss": -11.758722305297852, "global_step": 261747, "epoch": 1558} {"train_loss": -12.054165840148926, "global_step": 261748, "epoch": 1558} {"train_loss": -11.69964599609375, "global_step": 261749, "epoch": 1558} {"train_loss": -11.913366317749023, "global_step": 261750, "epoch": 1558} {"train_loss": -11.604389190673828, "global_step": 261751, "epoch": 1558} {"train_loss": -11.758403778076172, "global_step": 261752, "epoch": 1558} {"train_loss": -12.026847839355469, "global_step": 261753, "epoch": 1558} {"train_loss": -11.467574119567871, "global_step": 261754, "epoch": 1558} {"train_loss": -11.942205429077148, "global_step": 261755, "epoch": 1558} {"train_loss": -11.649545669555664, "global_step": 261756, "epoch": 1558} {"train_loss": -11.626821517944336, "global_step": 261757, "epoch": 1558} {"train_loss": -11.666142463684082, "global_step": 261758, "epoch": 1558} {"train_loss": -12.013214111328125, "global_step": 261759, "epoch": 1558} {"train_loss": -11.50316047668457, "global_step": 261760, "epoch": 1558} {"train_loss": -11.93084716796875, "global_step": 261761, "epoch": 1558} {"train_loss": -12.154312133789062, "global_step": 261762, "epoch": 1558} {"train_loss": -11.975248336791992, "global_step": 261763, "epoch": 1558} {"train_loss": -11.93853759765625, "global_step": 261764, "epoch": 1558} {"train_loss": -12.035382270812988, "global_step": 261765, "epoch": 1558} {"train_loss": -11.617987632751465, "global_step": 261766, "epoch": 1558} {"train_loss": -12.356649398803711, "global_step": 261767, "epoch": 1558} {"train_loss": -11.2874116897583, "global_step": 261768, "epoch": 1558} {"train_loss": -11.694880485534668, "global_step": 261769, "epoch": 1558} {"train_loss": -11.501805305480957, "global_step": 261770, "epoch": 1558} {"train_loss": -12.039773941040039, "global_step": 261771, "epoch": 1558} {"train_loss": -11.97435188293457, "global_step": 261772, "epoch": 1558} {"train_loss": -12.153818130493164, "global_step": 261773, "epoch": 1558} {"train_loss": -11.747066497802734, "global_step": 261774, "epoch": 1558} {"train_loss": -11.933601379394531, "global_step": 261775, "epoch": 1558} {"train_loss": -12.174373626708984, "global_step": 261776, "epoch": 1558} {"train_loss": -11.530838012695312, "global_step": 261777, "epoch": 1558} {"train_loss": -11.930936813354492, "global_step": 261778, "epoch": 1558} {"train_loss": -11.774236679077148, "global_step": 261779, "epoch": 1558} {"train_loss": -11.432682037353516, "global_step": 261780, "epoch": 1558} {"train_loss": -11.886702537536621, "global_step": 261781, "epoch": 1558} {"train_loss": -11.548250198364258, "global_step": 261782, "epoch": 1558} {"train_loss": -11.963080406188965, "global_step": 261783, "epoch": 1558} {"train_loss": -11.619222640991211, "global_step": 261784, "epoch": 1558} {"train_loss": -11.728108406066895, "global_step": 261785, "epoch": 1558} {"train_loss": -12.025782585144043, "global_step": 261786, "epoch": 1558} {"train_loss": -11.699620246887207, "global_step": 261787, "epoch": 1558} {"train_loss": -11.913484573364258, "global_step": 261788, "epoch": 1558} {"train_loss": -11.136467933654785, "global_step": 261789, "epoch": 1558} {"train_loss": -10.365280151367188, "global_step": 261790, "epoch": 1558} {"train_loss": -11.571861267089844, "global_step": 261791, "epoch": 1558} {"train_loss": -9.931015014648438, "global_step": 261792, "epoch": 1558} {"train_loss": -10.392206192016602, "global_step": 261793, "epoch": 1558} {"train_loss": -10.606077194213867, "global_step": 261794, "epoch": 1558} {"train_loss": -9.07472038269043, "global_step": 261795, "epoch": 1558} {"train_loss": -10.772869110107422, "global_step": 261796, "epoch": 1558} {"train_loss": -8.889137268066406, "global_step": 261797, "epoch": 1558} {"train_loss": -10.632097244262695, "global_step": 261798, "epoch": 1558} {"train_loss": -10.887989044189453, "global_step": 261799, "epoch": 1558} {"train_loss": -10.830495834350586, "global_step": 261800, "epoch": 1558} {"train_loss": -11.06527328491211, "global_step": 261801, "epoch": 1558} {"train_loss": -10.862223625183105, "global_step": 261802, "epoch": 1558} {"train_loss": -10.673456192016602, "global_step": 261803, "epoch": 1558} {"train_loss": -11.360523223876953, "global_step": 261804, "epoch": 1558} {"train_loss": -11.06652545928955, "global_step": 261805, "epoch": 1558} {"train_loss": -11.430400848388672, "global_step": 261806, "epoch": 1558} {"train_loss": -10.80976676940918, "global_step": 261807, "epoch": 1558} {"train_loss": -11.531980514526367, "global_step": 261808, "epoch": 1558} {"train_loss": -10.912712097167969, "global_step": 261809, "epoch": 1558} {"train_loss": -11.484663963317871, "global_step": 261810, "epoch": 1558} {"train_loss": -10.420928001403809, "global_step": 261811, "epoch": 1558} {"train_loss": -11.554101943969727, "global_step": 261812, "epoch": 1558} {"train_loss": -10.327999114990234, "global_step": 261813, "epoch": 1558} {"train_loss": -11.744850158691406, "global_step": 261814, "epoch": 1558} {"train_loss": -10.432622909545898, "global_step": 261815, "epoch": 1558} {"train_loss": -11.514713287353516, "global_step": 261816, "epoch": 1558} {"train_loss": -11.201099395751953, "global_step": 261817, "epoch": 1558} {"train_loss": -11.306843757629395, "global_step": 261818, "epoch": 1558} {"train_loss": -11.522724151611328, "global_step": 261819, "epoch": 1558} {"train_loss": -11.757502555847168, "global_step": 261820, "epoch": 1558} {"train_loss": -11.718717575073242, "global_step": 261821, "epoch": 1558} {"train_loss": -11.567511558532715, "global_step": 261822, "epoch": 1558} {"train_loss": -11.732181549072266, "global_step": 261823, "epoch": 1558} {"train_loss": -11.925435066223145, "global_step": 261824, "epoch": 1558} {"train_loss": -11.78259563446045, "global_step": 261825, "epoch": 1558} {"train_loss": -11.799398422241211, "global_step": 261826, "epoch": 1558} {"train_loss": -11.762006759643555, "global_step": 261827, "epoch": 1558} {"train_loss": -11.887533187866211, "global_step": 261828, "epoch": 1558} {"train_loss": -11.831355094909668, "global_step": 261829, "epoch": 1558} {"train_loss": -11.823566436767578, "global_step": 261830, "epoch": 1558} {"train_loss": -12.03049087524414, "global_step": 261831, "epoch": 1558} {"train_loss": -11.900823593139648, "global_step": 261832, "epoch": 1558} {"train_loss": -11.948875427246094, "global_step": 261833, "epoch": 1558} {"train_loss": -11.958454132080078, "global_step": 261834, "epoch": 1558} {"train_loss": -12.049836158752441, "global_step": 261835, "epoch": 1558} {"train_loss": -11.967923164367676, "global_step": 261836, "epoch": 1558} {"train_loss": -12.015092849731445, "global_step": 261837, "epoch": 1558} {"train_loss": -11.951325416564941, "global_step": 261838, "epoch": 1558} {"train_loss": -12.1627197265625, "global_step": 261839, "epoch": 1558} {"train_loss": -12.029837608337402, "global_step": 261840, "epoch": 1558} {"train_loss": -12.008737564086914, "global_step": 261841, "epoch": 1558} {"train_loss": -11.898147583007812, "global_step": 261842, "epoch": 1558} {"train_loss": -12.069640159606934, "global_step": 261843, "epoch": 1558} {"train_loss": -11.89236068725586, "global_step": 261844, "epoch": 1558} {"train_loss": -12.135905265808105, "global_step": 261845, "epoch": 1558} {"train_loss": -12.141874313354492, "global_step": 261846, "epoch": 1558} {"train_loss": -11.98019790649414, "global_step": 261847, "epoch": 1558} {"train_loss": -12.038338661193848, "global_step": 261848, "epoch": 1558} {"train_loss": -11.919814109802246, "global_step": 261849, "epoch": 1558} {"train_loss": -12.082803726196289, "global_step": 261850, "epoch": 1558} {"train_loss": -11.830092430114746, "global_step": 261851, "epoch": 1558} {"train_loss": -12.063270568847656, "global_step": 261852, "epoch": 1558} {"train_loss": -12.097912788391113, "global_step": 261853, "epoch": 1558} {"train_loss": -12.185140609741211, "global_step": 261854, "epoch": 1558} {"train_loss": -11.96848201751709, "global_step": 261855, "epoch": 1558} {"train_loss": -11.914373397827148, "global_step": 261856, "epoch": 1558} {"train_loss": -11.889335632324219, "global_step": 261857, "epoch": 1558} {"train_loss": -12.042632102966309, "global_step": 261858, "epoch": 1558} {"train_loss": -12.125506401062012, "global_step": 261859, "epoch": 1558} {"train_loss": -11.883602142333984, "global_step": 261860, "epoch": 1558} {"train_loss": -11.945426940917969, "global_step": 261861, "epoch": 1558} {"train_loss": -11.820694923400879, "global_step": 261862, "epoch": 1558} {"train_loss": -11.938535690307617, "global_step": 261863, "epoch": 1558} {"train_loss": -11.86650276184082, "global_step": 261864, "epoch": 1558} {"train_loss": -11.937053680419922, "global_step": 261865, "epoch": 1558} {"train_loss": -12.24482536315918, "global_step": 261866, "epoch": 1558} {"train_loss": -12.359603881835938, "global_step": 261867, "epoch": 1558} {"train_loss": -12.033918380737305, "global_step": 261868, "epoch": 1558} {"train_loss": -12.145491600036621, "global_step": 261869, "epoch": 1558} {"train_loss": -12.237600326538086, "global_step": 261870, "epoch": 1558} {"train_loss": -12.126920700073242, "global_step": 261871, "epoch": 1558} {"train_loss": -12.1848783493042, "global_step": 261872, "epoch": 1558} {"train_loss": -12.232657432556152, "global_step": 261873, "epoch": 1558} {"train_loss": -11.651405334472656, "global_step": 261874, "epoch": 1558} {"train_loss": -12.262445449829102, "global_step": 261875, "epoch": 1558} {"train_loss": -11.667997360229492, "global_step": 261876, "epoch": 1558} {"train_loss": -11.916844367980957, "global_step": 261877, "epoch": 1558} {"train_loss": -12.283344268798828, "global_step": 261878, "epoch": 1558} {"train_loss": -11.723257064819336, "global_step": 261879, "epoch": 1558} {"train_loss": -11.96180534362793, "global_step": 261880, "epoch": 1558} {"train_loss": -12.077314376831055, "global_step": 261881, "epoch": 1558} {"train_loss": -11.568446159362793, "global_step": 261882, "epoch": 1558} {"train_loss": -11.79334545135498, "global_step": 261883, "epoch": 1558} {"train_loss": -12.239297866821289, "global_step": 261884, "epoch": 1558} {"train_loss": -11.50700569152832, "global_step": 261885, "epoch": 1558} {"train_loss": -11.595050811767578, "global_step": 261886, "epoch": 1558} {"train_loss": -12.086262702941895, "global_step": 261887, "epoch": 1558} {"train_loss": -12.244433403015137, "global_step": 261888, "epoch": 1558} {"train_loss": -12.10531234741211, "global_step": 261889, "epoch": 1558} {"train_loss": -12.240211486816406, "global_step": 261890, "epoch": 1558} {"train_loss": -12.034969329833984, "global_step": 261891, "epoch": 1558} {"train_loss": -11.96706771850586, "global_step": 261892, "epoch": 1558} {"train_loss": -12.086587905883789, "global_step": 261893, "epoch": 1558} {"train_loss": -11.862894058227539, "global_step": 261894, "epoch": 1558} {"train_loss": -11.647161483764648, "global_step": 261895, "epoch": 1558} {"train_loss": -12.231061935424805, "global_step": 261896, "epoch": 1558} {"train_loss": -11.871705055236816, "global_step": 261897, "epoch": 1558} {"train_loss": -11.598356246948242, "global_step": 261898, "epoch": 1558} {"train_loss": -11.402996063232422, "global_step": 261899, "epoch": 1558} {"train_loss": -11.470874786376953, "global_step": 261900, "epoch": 1558} {"train_loss": -11.948200225830078, "global_step": 261901, "epoch": 1558} {"train_loss": -11.350053787231445, "global_step": 261902, "epoch": 1558} {"train_loss": -10.840583801269531, "global_step": 261903, "epoch": 1558} {"train_loss": -12.182394027709961, "global_step": 261904, "epoch": 1558} {"train_loss": -11.802691459655762, "global_step": 261905, "epoch": 1558} {"train_loss": -11.69510269165039, "global_step": 261906, "epoch": 1558} {"train_loss": -11.854242324829102, "global_step": 261907, "epoch": 1558} {"train_loss": -12.126896858215332, "global_step": 261908, "epoch": 1558} {"train_loss": -11.984701156616211, "global_step": 261909, "epoch": 1558} {"train_loss": -12.004520416259766, "global_step": 261910, "epoch": 1558} {"train_loss": -11.703008748236156, "global_step": 261911, "epoch": 1558, "val_loss": 270964.78125} {"train_loss": -12.013591766357422, "global_step": 261912, "epoch": 1559} {"train_loss": -12.152460098266602, "global_step": 261913, "epoch": 1559} {"train_loss": -12.037803649902344, "global_step": 261914, "epoch": 1559} {"train_loss": -11.94422721862793, "global_step": 261915, "epoch": 1559} {"train_loss": -12.241009712219238, "global_step": 261916, "epoch": 1559} {"train_loss": -12.190335273742676, "global_step": 261917, "epoch": 1559} {"train_loss": -11.898523330688477, "global_step": 261918, "epoch": 1559} {"train_loss": -12.202281951904297, "global_step": 261919, "epoch": 1559} {"train_loss": -11.789684295654297, "global_step": 261920, "epoch": 1559} {"train_loss": -11.540159225463867, "global_step": 261921, "epoch": 1559} {"train_loss": -12.001365661621094, "global_step": 261922, "epoch": 1559} {"train_loss": -11.186134338378906, "global_step": 261923, "epoch": 1559} {"train_loss": -10.802733421325684, "global_step": 261924, "epoch": 1559} {"train_loss": -10.748407363891602, "global_step": 261925, "epoch": 1559} {"train_loss": -12.07463550567627, "global_step": 261926, "epoch": 1559} {"train_loss": -11.20321273803711, "global_step": 261927, "epoch": 1559} {"train_loss": -11.629467010498047, "global_step": 261928, "epoch": 1559} {"train_loss": -11.770157814025879, "global_step": 261929, "epoch": 1559} {"train_loss": -11.649406433105469, "global_step": 261930, "epoch": 1559} {"train_loss": -10.433828353881836, "global_step": 261931, "epoch": 1559} {"train_loss": -11.35027027130127, "global_step": 261932, "epoch": 1559} {"train_loss": -11.099071502685547, "global_step": 261933, "epoch": 1559} {"train_loss": -10.050924301147461, "global_step": 261934, "epoch": 1559} {"train_loss": -10.121947288513184, "global_step": 261935, "epoch": 1559} {"train_loss": -11.314810752868652, "global_step": 261936, "epoch": 1559} {"train_loss": -10.126644134521484, "global_step": 261937, "epoch": 1559} {"train_loss": -11.121490478515625, "global_step": 261938, "epoch": 1559} {"train_loss": -11.371997833251953, "global_step": 261939, "epoch": 1559} {"train_loss": -10.83915901184082, "global_step": 261940, "epoch": 1559} {"train_loss": -11.165362358093262, "global_step": 261941, "epoch": 1559} {"train_loss": -10.557634353637695, "global_step": 261942, "epoch": 1559} {"train_loss": -10.79969596862793, "global_step": 261943, "epoch": 1559} {"train_loss": -11.38100814819336, "global_step": 261944, "epoch": 1559} {"train_loss": -10.793712615966797, "global_step": 261945, "epoch": 1559} {"train_loss": -11.380634307861328, "global_step": 261946, "epoch": 1559} {"train_loss": -10.895857810974121, "global_step": 261947, "epoch": 1559} {"train_loss": -11.519420623779297, "global_step": 261948, "epoch": 1559} {"train_loss": -10.952566146850586, "global_step": 261949, "epoch": 1559} {"train_loss": -11.188577651977539, "global_step": 261950, "epoch": 1559} {"train_loss": -11.005481719970703, "global_step": 261951, "epoch": 1559} {"train_loss": -11.44172477722168, "global_step": 261952, "epoch": 1559} {"train_loss": -11.254931449890137, "global_step": 261953, "epoch": 1559} {"train_loss": -11.400640487670898, "global_step": 261954, "epoch": 1559} {"train_loss": -11.526251792907715, "global_step": 261955, "epoch": 1559} {"train_loss": -10.990438461303711, "global_step": 261956, "epoch": 1559} {"train_loss": -11.721558570861816, "global_step": 261957, "epoch": 1559} {"train_loss": -11.696630477905273, "global_step": 261958, "epoch": 1559} {"train_loss": -11.4347562789917, "global_step": 261959, "epoch": 1559} {"train_loss": -11.625328063964844, "global_step": 261960, "epoch": 1559} {"train_loss": -11.273652076721191, "global_step": 261961, "epoch": 1559} {"train_loss": -11.570324897766113, "global_step": 261962, "epoch": 1559} {"train_loss": -11.55128002166748, "global_step": 261963, "epoch": 1559} {"train_loss": -11.71007251739502, "global_step": 261964, "epoch": 1559} {"train_loss": -11.350784301757812, "global_step": 261965, "epoch": 1559} {"train_loss": -11.219160079956055, "global_step": 261966, "epoch": 1559} {"train_loss": -11.440526962280273, "global_step": 261967, "epoch": 1559} {"train_loss": -10.920409202575684, "global_step": 261968, "epoch": 1559} {"train_loss": -11.738737106323242, "global_step": 261969, "epoch": 1559} {"train_loss": -11.49881362915039, "global_step": 261970, "epoch": 1559} {"train_loss": -11.495535850524902, "global_step": 261971, "epoch": 1559} {"train_loss": -11.673047065734863, "global_step": 261972, "epoch": 1559} {"train_loss": -11.370193481445312, "global_step": 261973, "epoch": 1559} {"train_loss": -11.648100852966309, "global_step": 261974, "epoch": 1559} {"train_loss": -11.600563049316406, "global_step": 261975, "epoch": 1559} {"train_loss": -11.767867088317871, "global_step": 261976, "epoch": 1559} {"train_loss": -11.62939453125, "global_step": 261977, "epoch": 1559} {"train_loss": -11.816337585449219, "global_step": 261978, "epoch": 1559} {"train_loss": -11.808633804321289, "global_step": 261979, "epoch": 1559} {"train_loss": -11.867873191833496, "global_step": 261980, "epoch": 1559} {"train_loss": -11.81374740600586, "global_step": 261981, "epoch": 1559} {"train_loss": -11.947307586669922, "global_step": 261982, "epoch": 1559} {"train_loss": -11.719354629516602, "global_step": 261983, "epoch": 1559} {"train_loss": -11.679783821105957, "global_step": 261984, "epoch": 1559} {"train_loss": -11.629887580871582, "global_step": 261985, "epoch": 1559} {"train_loss": -11.563748359680176, "global_step": 261986, "epoch": 1559} {"train_loss": -11.796833038330078, "global_step": 261987, "epoch": 1559} {"train_loss": -11.854461669921875, "global_step": 261988, "epoch": 1559} {"train_loss": -11.797591209411621, "global_step": 261989, "epoch": 1559} {"train_loss": -12.050524711608887, "global_step": 261990, "epoch": 1559} {"train_loss": -11.892480850219727, "global_step": 261991, "epoch": 1559} {"train_loss": -12.063613891601562, "global_step": 261992, "epoch": 1559} {"train_loss": -12.01031494140625, "global_step": 261993, "epoch": 1559} {"train_loss": -12.133821487426758, "global_step": 261994, "epoch": 1559} {"train_loss": -11.95938777923584, "global_step": 261995, "epoch": 1559} {"train_loss": -12.03349494934082, "global_step": 261996, "epoch": 1559} {"train_loss": -12.006396293640137, "global_step": 261997, "epoch": 1559} {"train_loss": -11.754229545593262, "global_step": 261998, "epoch": 1559} {"train_loss": -11.932954788208008, "global_step": 261999, "epoch": 1559} {"train_loss": -11.807555198669434, "global_step": 262000, "epoch": 1559} {"train_loss": -11.741072654724121, "global_step": 262001, "epoch": 1559} {"train_loss": -11.995952606201172, "global_step": 262002, "epoch": 1559} {"train_loss": -11.650102615356445, "global_step": 262003, "epoch": 1559} {"train_loss": -11.966653823852539, "global_step": 262004, "epoch": 1559} {"train_loss": -12.088798522949219, "global_step": 262005, "epoch": 1559} {"train_loss": -12.00899887084961, "global_step": 262006, "epoch": 1559} {"train_loss": -12.209257125854492, "global_step": 262007, "epoch": 1559} {"train_loss": -12.088912010192871, "global_step": 262008, "epoch": 1559} {"train_loss": -12.067346572875977, "global_step": 262009, "epoch": 1559} {"train_loss": -11.908445358276367, "global_step": 262010, "epoch": 1559} {"train_loss": -12.026323318481445, "global_step": 262011, "epoch": 1559} {"train_loss": -11.670015335083008, "global_step": 262012, "epoch": 1559} {"train_loss": -11.762628555297852, "global_step": 262013, "epoch": 1559} {"train_loss": -11.743342399597168, "global_step": 262014, "epoch": 1559} {"train_loss": -11.32201862335205, "global_step": 262015, "epoch": 1559} {"train_loss": -11.789484024047852, "global_step": 262016, "epoch": 1559} {"train_loss": -11.706063270568848, "global_step": 262017, "epoch": 1559} {"train_loss": -11.671700477600098, "global_step": 262018, "epoch": 1559} {"train_loss": -12.157337188720703, "global_step": 262019, "epoch": 1559} {"train_loss": -11.127748489379883, "global_step": 262020, "epoch": 1559} {"train_loss": -11.990036010742188, "global_step": 262021, "epoch": 1559} {"train_loss": -11.832344055175781, "global_step": 262022, "epoch": 1559} {"train_loss": -11.696651458740234, "global_step": 262023, "epoch": 1559} {"train_loss": -11.9619140625, "global_step": 262024, "epoch": 1559} {"train_loss": -11.783806800842285, "global_step": 262025, "epoch": 1559} {"train_loss": -11.99654769897461, "global_step": 262026, "epoch": 1559} {"train_loss": -11.778876304626465, "global_step": 262027, "epoch": 1559} {"train_loss": -10.922587394714355, "global_step": 262028, "epoch": 1559} {"train_loss": -11.946224212646484, "global_step": 262029, "epoch": 1559} {"train_loss": -11.064421653747559, "global_step": 262030, "epoch": 1559} {"train_loss": -11.37467098236084, "global_step": 262031, "epoch": 1559} {"train_loss": -12.005829811096191, "global_step": 262032, "epoch": 1559} {"train_loss": -10.933259963989258, "global_step": 262033, "epoch": 1559} {"train_loss": -11.499795913696289, "global_step": 262034, "epoch": 1559} {"train_loss": -11.770062446594238, "global_step": 262035, "epoch": 1559} {"train_loss": -11.050222396850586, "global_step": 262036, "epoch": 1559} {"train_loss": -11.684078216552734, "global_step": 262037, "epoch": 1559} {"train_loss": -11.609646797180176, "global_step": 262038, "epoch": 1559} {"train_loss": -11.316919326782227, "global_step": 262039, "epoch": 1559} {"train_loss": -11.487398147583008, "global_step": 262040, "epoch": 1559} {"train_loss": -10.945241928100586, "global_step": 262041, "epoch": 1559} {"train_loss": -10.830297470092773, "global_step": 262042, "epoch": 1559} {"train_loss": -11.668800354003906, "global_step": 262043, "epoch": 1559} {"train_loss": -11.22006607055664, "global_step": 262044, "epoch": 1559} {"train_loss": -11.469903945922852, "global_step": 262045, "epoch": 1559} {"train_loss": -11.731104850769043, "global_step": 262046, "epoch": 1559} {"train_loss": -11.47562313079834, "global_step": 262047, "epoch": 1559} {"train_loss": -12.107097625732422, "global_step": 262048, "epoch": 1559} {"train_loss": -11.65618896484375, "global_step": 262049, "epoch": 1559} {"train_loss": -11.801626205444336, "global_step": 262050, "epoch": 1559} {"train_loss": -11.92158317565918, "global_step": 262051, "epoch": 1559} {"train_loss": -11.468746185302734, "global_step": 262052, "epoch": 1559} {"train_loss": -11.985326766967773, "global_step": 262053, "epoch": 1559} {"train_loss": -11.833353042602539, "global_step": 262054, "epoch": 1559} {"train_loss": -11.954044342041016, "global_step": 262055, "epoch": 1559} {"train_loss": -11.651111602783203, "global_step": 262056, "epoch": 1559} {"train_loss": -12.005075454711914, "global_step": 262057, "epoch": 1559} {"train_loss": -12.204146385192871, "global_step": 262058, "epoch": 1559} {"train_loss": -12.004220008850098, "global_step": 262059, "epoch": 1559} {"train_loss": -12.204559326171875, "global_step": 262060, "epoch": 1559} {"train_loss": -11.595834732055664, "global_step": 262061, "epoch": 1559} {"train_loss": -11.890787124633789, "global_step": 262062, "epoch": 1559} {"train_loss": -11.780917167663574, "global_step": 262063, "epoch": 1559} {"train_loss": -11.490713119506836, "global_step": 262064, "epoch": 1559} {"train_loss": -11.731310844421387, "global_step": 262065, "epoch": 1559} {"train_loss": -11.454042434692383, "global_step": 262066, "epoch": 1559} {"train_loss": -11.93794059753418, "global_step": 262067, "epoch": 1559} {"train_loss": -11.645591735839844, "global_step": 262068, "epoch": 1559} {"train_loss": -12.036184310913086, "global_step": 262069, "epoch": 1559} {"train_loss": -11.775627136230469, "global_step": 262070, "epoch": 1559} {"train_loss": -11.92902946472168, "global_step": 262071, "epoch": 1559} {"train_loss": -12.01247501373291, "global_step": 262072, "epoch": 1559} {"train_loss": -11.793766021728516, "global_step": 262073, "epoch": 1559} {"train_loss": -12.018838882446289, "global_step": 262074, "epoch": 1559} {"train_loss": -12.128486633300781, "global_step": 262075, "epoch": 1559} {"train_loss": -12.17513656616211, "global_step": 262076, "epoch": 1559} {"train_loss": -11.97021484375, "global_step": 262077, "epoch": 1559} {"train_loss": -11.962620735168457, "global_step": 262078, "epoch": 1559} {"train_loss": -11.619677725292387, "global_step": 262079, "epoch": 1559, "val_loss": 273126.1875} {"train_loss": -12.108497619628906, "global_step": 262080, "epoch": 1560} {"train_loss": -12.10290813446045, "global_step": 262081, "epoch": 1560} {"train_loss": -11.727144241333008, "global_step": 262082, "epoch": 1560} {"train_loss": -12.058517456054688, "global_step": 262083, "epoch": 1560} {"train_loss": -11.8175048828125, "global_step": 262084, "epoch": 1560} {"train_loss": -11.9334135055542, "global_step": 262085, "epoch": 1560} {"train_loss": -12.004350662231445, "global_step": 262086, "epoch": 1560} {"train_loss": -12.162324905395508, "global_step": 262087, "epoch": 1560} {"train_loss": -11.912256240844727, "global_step": 262088, "epoch": 1560} {"train_loss": -12.030451774597168, "global_step": 262089, "epoch": 1560} {"train_loss": -12.097564697265625, "global_step": 262090, "epoch": 1560} {"train_loss": -12.07996940612793, "global_step": 262091, "epoch": 1560} {"train_loss": -12.069597244262695, "global_step": 262092, "epoch": 1560} {"train_loss": -12.067499160766602, "global_step": 262093, "epoch": 1560} {"train_loss": -12.185382843017578, "global_step": 262094, "epoch": 1560} {"train_loss": -12.265032768249512, "global_step": 262095, "epoch": 1560} {"train_loss": -12.058577537536621, "global_step": 262096, "epoch": 1560} {"train_loss": -12.16526985168457, "global_step": 262097, "epoch": 1560} {"train_loss": -11.92913818359375, "global_step": 262098, "epoch": 1560} {"train_loss": -11.871726989746094, "global_step": 262099, "epoch": 1560} {"train_loss": -11.950907707214355, "global_step": 262100, "epoch": 1560} {"train_loss": -12.092460632324219, "global_step": 262101, "epoch": 1560} {"train_loss": -11.772085189819336, "global_step": 262102, "epoch": 1560} {"train_loss": -11.250823020935059, "global_step": 262103, "epoch": 1560} {"train_loss": -11.07301139831543, "global_step": 262104, "epoch": 1560} {"train_loss": -11.552446365356445, "global_step": 262105, "epoch": 1560} {"train_loss": -12.02197265625, "global_step": 262106, "epoch": 1560} {"train_loss": -11.119279861450195, "global_step": 262107, "epoch": 1560} {"train_loss": -11.320389747619629, "global_step": 262108, "epoch": 1560} {"train_loss": -12.029855728149414, "global_step": 262109, "epoch": 1560} {"train_loss": -11.895065307617188, "global_step": 262110, "epoch": 1560} {"train_loss": -11.880500793457031, "global_step": 262111, "epoch": 1560} {"train_loss": -11.920204162597656, "global_step": 262112, "epoch": 1560} {"train_loss": -11.975988388061523, "global_step": 262113, "epoch": 1560} {"train_loss": -12.058653831481934, "global_step": 262114, "epoch": 1560} {"train_loss": -11.419021606445312, "global_step": 262115, "epoch": 1560} {"train_loss": -11.472855567932129, "global_step": 262116, "epoch": 1560} {"train_loss": -11.701323509216309, "global_step": 262117, "epoch": 1560} {"train_loss": -10.963586807250977, "global_step": 262118, "epoch": 1560} {"train_loss": -10.923707962036133, "global_step": 262119, "epoch": 1560} {"train_loss": -11.438362121582031, "global_step": 262120, "epoch": 1560} {"train_loss": -11.142837524414062, "global_step": 262121, "epoch": 1560} {"train_loss": -11.252191543579102, "global_step": 262122, "epoch": 1560} {"train_loss": -10.983074188232422, "global_step": 262123, "epoch": 1560} {"train_loss": -12.050912857055664, "global_step": 262124, "epoch": 1560} {"train_loss": -11.199405670166016, "global_step": 262125, "epoch": 1560} {"train_loss": -11.268856048583984, "global_step": 262126, "epoch": 1560} {"train_loss": -11.916772842407227, "global_step": 262127, "epoch": 1560} {"train_loss": -11.35977554321289, "global_step": 262128, "epoch": 1560} {"train_loss": -10.211552619934082, "global_step": 262129, "epoch": 1560} {"train_loss": -11.262310028076172, "global_step": 262130, "epoch": 1560} {"train_loss": -11.385741233825684, "global_step": 262131, "epoch": 1560} {"train_loss": -10.767730712890625, "global_step": 262132, "epoch": 1560} {"train_loss": -10.212921142578125, "global_step": 262133, "epoch": 1560} {"train_loss": -11.428418159484863, "global_step": 262134, "epoch": 1560} {"train_loss": -11.203681945800781, "global_step": 262135, "epoch": 1560} {"train_loss": -11.588079452514648, "global_step": 262136, "epoch": 1560} {"train_loss": -11.142911911010742, "global_step": 262137, "epoch": 1560} {"train_loss": -11.254840850830078, "global_step": 262138, "epoch": 1560} {"train_loss": -11.304519653320312, "global_step": 262139, "epoch": 1560} {"train_loss": -11.033042907714844, "global_step": 262140, "epoch": 1560} {"train_loss": -11.08193588256836, "global_step": 262141, "epoch": 1560} {"train_loss": -11.294706344604492, "global_step": 262142, "epoch": 1560} {"train_loss": -11.339508056640625, "global_step": 262143, "epoch": 1560} {"train_loss": -11.609785079956055, "global_step": 262144, "epoch": 1560} {"train_loss": -11.594548225402832, "global_step": 262145, "epoch": 1560} {"train_loss": -11.57813835144043, "global_step": 262146, "epoch": 1560} {"train_loss": -11.761764526367188, "global_step": 262147, "epoch": 1560} {"train_loss": -11.14942741394043, "global_step": 262148, "epoch": 1560} {"train_loss": -11.798558235168457, "global_step": 262149, "epoch": 1560} {"train_loss": -11.136041641235352, "global_step": 262150, "epoch": 1560} {"train_loss": -11.817867279052734, "global_step": 262151, "epoch": 1560} {"train_loss": -11.665693283081055, "global_step": 262152, "epoch": 1560} {"train_loss": -11.732559204101562, "global_step": 262153, "epoch": 1560} {"train_loss": -11.609492301940918, "global_step": 262154, "epoch": 1560} {"train_loss": -12.084243774414062, "global_step": 262155, "epoch": 1560} {"train_loss": -11.81678295135498, "global_step": 262156, "epoch": 1560} {"train_loss": -11.759565353393555, "global_step": 262157, "epoch": 1560} {"train_loss": -11.968408584594727, "global_step": 262158, "epoch": 1560} {"train_loss": -11.949831008911133, "global_step": 262159, "epoch": 1560} {"train_loss": -11.74611759185791, "global_step": 262160, "epoch": 1560} {"train_loss": -11.44471549987793, "global_step": 262161, "epoch": 1560} {"train_loss": -11.639968872070312, "global_step": 262162, "epoch": 1560} {"train_loss": -11.377033233642578, "global_step": 262163, "epoch": 1560} {"train_loss": -12.060649871826172, "global_step": 262164, "epoch": 1560} {"train_loss": -11.827077865600586, "global_step": 262165, "epoch": 1560} {"train_loss": -11.777578353881836, "global_step": 262166, "epoch": 1560} {"train_loss": -11.571836471557617, "global_step": 262167, "epoch": 1560} {"train_loss": -11.70655345916748, "global_step": 262168, "epoch": 1560} {"train_loss": -11.814132690429688, "global_step": 262169, "epoch": 1560} {"train_loss": -12.067734718322754, "global_step": 262170, "epoch": 1560} {"train_loss": -11.931044578552246, "global_step": 262171, "epoch": 1560} {"train_loss": -11.979761123657227, "global_step": 262172, "epoch": 1560} {"train_loss": -11.983168601989746, "global_step": 262173, "epoch": 1560} {"train_loss": -11.973541259765625, "global_step": 262174, "epoch": 1560} {"train_loss": -11.609519958496094, "global_step": 262175, "epoch": 1560} {"train_loss": -12.2418212890625, "global_step": 262176, "epoch": 1560} {"train_loss": -11.91234016418457, "global_step": 262177, "epoch": 1560} {"train_loss": -12.146810531616211, "global_step": 262178, "epoch": 1560} {"train_loss": -11.952775955200195, "global_step": 262179, "epoch": 1560} {"train_loss": -11.910991668701172, "global_step": 262180, "epoch": 1560} {"train_loss": -12.188011169433594, "global_step": 262181, "epoch": 1560} {"train_loss": -11.90207290649414, "global_step": 262182, "epoch": 1560} {"train_loss": -12.13037395477295, "global_step": 262183, "epoch": 1560} {"train_loss": -12.03245735168457, "global_step": 262184, "epoch": 1560} {"train_loss": -12.01708984375, "global_step": 262185, "epoch": 1560} {"train_loss": -12.131856918334961, "global_step": 262186, "epoch": 1560} {"train_loss": -12.080163955688477, "global_step": 262187, "epoch": 1560} {"train_loss": -12.294227600097656, "global_step": 262188, "epoch": 1560} {"train_loss": -11.918142318725586, "global_step": 262189, "epoch": 1560} {"train_loss": -12.29548454284668, "global_step": 262190, "epoch": 1560} {"train_loss": -12.258216857910156, "global_step": 262191, "epoch": 1560} {"train_loss": -12.039030075073242, "global_step": 262192, "epoch": 1560} {"train_loss": -12.401710510253906, "global_step": 262193, "epoch": 1560} {"train_loss": -12.136804580688477, "global_step": 262194, "epoch": 1560} {"train_loss": -12.044137954711914, "global_step": 262195, "epoch": 1560} {"train_loss": -11.940957069396973, "global_step": 262196, "epoch": 1560} {"train_loss": -12.119268417358398, "global_step": 262197, "epoch": 1560} {"train_loss": -11.929821968078613, "global_step": 262198, "epoch": 1560} {"train_loss": -12.245760917663574, "global_step": 262199, "epoch": 1560} {"train_loss": -12.072643280029297, "global_step": 262200, "epoch": 1560} {"train_loss": -11.999850273132324, "global_step": 262201, "epoch": 1560} {"train_loss": -11.903053283691406, "global_step": 262202, "epoch": 1560} {"train_loss": -12.110442161560059, "global_step": 262203, "epoch": 1560} {"train_loss": -12.180245399475098, "global_step": 262204, "epoch": 1560} {"train_loss": -11.010236740112305, "global_step": 262205, "epoch": 1560} {"train_loss": -11.121471405029297, "global_step": 262206, "epoch": 1560} {"train_loss": -11.936065673828125, "global_step": 262207, "epoch": 1560} {"train_loss": -11.786909103393555, "global_step": 262208, "epoch": 1560} {"train_loss": -12.160097122192383, "global_step": 262209, "epoch": 1560} {"train_loss": -11.791715621948242, "global_step": 262210, "epoch": 1560} {"train_loss": -11.73351764678955, "global_step": 262211, "epoch": 1560} {"train_loss": -11.883316040039062, "global_step": 262212, "epoch": 1560} {"train_loss": -11.897744178771973, "global_step": 262213, "epoch": 1560} {"train_loss": -11.428445816040039, "global_step": 262214, "epoch": 1560} {"train_loss": -11.684048652648926, "global_step": 262215, "epoch": 1560} {"train_loss": -11.558152198791504, "global_step": 262216, "epoch": 1560} {"train_loss": -10.865081787109375, "global_step": 262217, "epoch": 1560} {"train_loss": -10.097414016723633, "global_step": 262218, "epoch": 1560} {"train_loss": -10.69253921508789, "global_step": 262219, "epoch": 1560} {"train_loss": -11.541144371032715, "global_step": 262220, "epoch": 1560} {"train_loss": -10.58939266204834, "global_step": 262221, "epoch": 1560} {"train_loss": -11.813085556030273, "global_step": 262222, "epoch": 1560} {"train_loss": -10.676471710205078, "global_step": 262223, "epoch": 1560} {"train_loss": -11.568853378295898, "global_step": 262224, "epoch": 1560} {"train_loss": -11.10970687866211, "global_step": 262225, "epoch": 1560} {"train_loss": -10.913534164428711, "global_step": 262226, "epoch": 1560} {"train_loss": -11.554365158081055, "global_step": 262227, "epoch": 1560} {"train_loss": -10.870199203491211, "global_step": 262228, "epoch": 1560} {"train_loss": -11.753408432006836, "global_step": 262229, "epoch": 1560} {"train_loss": -11.064733505249023, "global_step": 262230, "epoch": 1560} {"train_loss": -11.146317481994629, "global_step": 262231, "epoch": 1560} {"train_loss": -11.114068984985352, "global_step": 262232, "epoch": 1560} {"train_loss": -10.501255989074707, "global_step": 262233, "epoch": 1560} {"train_loss": -11.331514358520508, "global_step": 262234, "epoch": 1560} {"train_loss": -10.897378921508789, "global_step": 262235, "epoch": 1560} {"train_loss": -11.033778190612793, "global_step": 262236, "epoch": 1560} {"train_loss": -11.416297912597656, "global_step": 262237, "epoch": 1560} {"train_loss": -10.13559341430664, "global_step": 262238, "epoch": 1560} {"train_loss": -11.095179557800293, "global_step": 262239, "epoch": 1560} {"train_loss": -10.904500007629395, "global_step": 262240, "epoch": 1560} {"train_loss": -11.21906852722168, "global_step": 262241, "epoch": 1560} {"train_loss": -10.590066909790039, "global_step": 262242, "epoch": 1560} {"train_loss": -11.235897064208984, "global_step": 262243, "epoch": 1560} {"train_loss": -10.966763496398926, "global_step": 262244, "epoch": 1560} {"train_loss": -11.299808502197266, "global_step": 262245, "epoch": 1560} {"train_loss": -10.459596633911133, "global_step": 262246, "epoch": 1560} {"train_loss": -11.606333454449972, "global_step": 262247, "epoch": 1560, "val_loss": 268110.625, "train_action_mse_error": 3.1684892177581787} {"train_loss": -11.173274993896484, "global_step": 262248, "epoch": 1561} {"train_loss": -11.296903610229492, "global_step": 262249, "epoch": 1561} {"train_loss": -11.444559097290039, "global_step": 262250, "epoch": 1561} {"train_loss": -10.84500503540039, "global_step": 262251, "epoch": 1561} {"train_loss": -11.507486343383789, "global_step": 262252, "epoch": 1561} {"train_loss": -11.474185943603516, "global_step": 262253, "epoch": 1561} {"train_loss": -11.447796821594238, "global_step": 262254, "epoch": 1561} {"train_loss": -11.787469863891602, "global_step": 262255, "epoch": 1561} {"train_loss": -11.455839157104492, "global_step": 262256, "epoch": 1561} {"train_loss": -11.430004119873047, "global_step": 262257, "epoch": 1561} {"train_loss": -12.056110382080078, "global_step": 262258, "epoch": 1561} {"train_loss": -11.383572578430176, "global_step": 262259, "epoch": 1561} {"train_loss": -11.649859428405762, "global_step": 262260, "epoch": 1561} {"train_loss": -11.665365219116211, "global_step": 262261, "epoch": 1561} {"train_loss": -11.773109436035156, "global_step": 262262, "epoch": 1561} {"train_loss": -11.795417785644531, "global_step": 262263, "epoch": 1561} {"train_loss": -11.876211166381836, "global_step": 262264, "epoch": 1561} {"train_loss": -11.695615768432617, "global_step": 262265, "epoch": 1561} {"train_loss": -11.87525749206543, "global_step": 262266, "epoch": 1561} {"train_loss": -11.554661750793457, "global_step": 262267, "epoch": 1561} {"train_loss": -11.933902740478516, "global_step": 262268, "epoch": 1561} {"train_loss": -11.510162353515625, "global_step": 262269, "epoch": 1561} {"train_loss": -11.828829765319824, "global_step": 262270, "epoch": 1561} {"train_loss": -11.758386611938477, "global_step": 262271, "epoch": 1561} {"train_loss": -11.856882095336914, "global_step": 262272, "epoch": 1561} {"train_loss": -11.934530258178711, "global_step": 262273, "epoch": 1561} {"train_loss": -11.93937873840332, "global_step": 262274, "epoch": 1561} {"train_loss": -11.913836479187012, "global_step": 262275, "epoch": 1561} {"train_loss": -11.974123001098633, "global_step": 262276, "epoch": 1561} {"train_loss": -11.899042129516602, "global_step": 262277, "epoch": 1561} {"train_loss": -11.600164413452148, "global_step": 262278, "epoch": 1561} {"train_loss": -11.599178314208984, "global_step": 262279, "epoch": 1561} {"train_loss": -11.743682861328125, "global_step": 262280, "epoch": 1561} {"train_loss": -11.548002243041992, "global_step": 262281, "epoch": 1561} {"train_loss": -11.254926681518555, "global_step": 262282, "epoch": 1561} {"train_loss": -11.180547714233398, "global_step": 262283, "epoch": 1561} {"train_loss": -10.570947647094727, "global_step": 262284, "epoch": 1561} {"train_loss": -11.307464599609375, "global_step": 262285, "epoch": 1561} {"train_loss": -10.945760726928711, "global_step": 262286, "epoch": 1561} {"train_loss": -11.188482284545898, "global_step": 262287, "epoch": 1561} {"train_loss": -11.449472427368164, "global_step": 262288, "epoch": 1561} {"train_loss": -11.089942932128906, "global_step": 262289, "epoch": 1561} {"train_loss": -10.973931312561035, "global_step": 262290, "epoch": 1561} {"train_loss": -11.493375778198242, "global_step": 262291, "epoch": 1561} {"train_loss": -11.024478912353516, "global_step": 262292, "epoch": 1561} {"train_loss": -11.673469543457031, "global_step": 262293, "epoch": 1561} {"train_loss": -10.540933609008789, "global_step": 262294, "epoch": 1561} {"train_loss": -11.208309173583984, "global_step": 262295, "epoch": 1561} {"train_loss": -10.911199569702148, "global_step": 262296, "epoch": 1561} {"train_loss": -11.44351863861084, "global_step": 262297, "epoch": 1561} {"train_loss": -10.966012001037598, "global_step": 262298, "epoch": 1561} {"train_loss": -11.6478271484375, "global_step": 262299, "epoch": 1561} {"train_loss": -11.348651885986328, "global_step": 262300, "epoch": 1561} {"train_loss": -11.585062026977539, "global_step": 262301, "epoch": 1561} {"train_loss": -10.98923397064209, "global_step": 262302, "epoch": 1561} {"train_loss": -11.876114845275879, "global_step": 262303, "epoch": 1561} {"train_loss": -11.307426452636719, "global_step": 262304, "epoch": 1561} {"train_loss": -11.934662818908691, "global_step": 262305, "epoch": 1561} {"train_loss": -11.788655281066895, "global_step": 262306, "epoch": 1561} {"train_loss": -11.6970796585083, "global_step": 262307, "epoch": 1561} {"train_loss": -11.514713287353516, "global_step": 262308, "epoch": 1561} {"train_loss": -11.94041633605957, "global_step": 262309, "epoch": 1561} {"train_loss": -11.3276948928833, "global_step": 262310, "epoch": 1561} {"train_loss": -11.832763671875, "global_step": 262311, "epoch": 1561} {"train_loss": -11.581954956054688, "global_step": 262312, "epoch": 1561} {"train_loss": -11.85207748413086, "global_step": 262313, "epoch": 1561} {"train_loss": -11.781728744506836, "global_step": 262314, "epoch": 1561} {"train_loss": -11.986482620239258, "global_step": 262315, "epoch": 1561} {"train_loss": -11.15021800994873, "global_step": 262316, "epoch": 1561} {"train_loss": -11.974319458007812, "global_step": 262317, "epoch": 1561} {"train_loss": -11.707588195800781, "global_step": 262318, "epoch": 1561} {"train_loss": -12.062416076660156, "global_step": 262319, "epoch": 1561} {"train_loss": -11.77049446105957, "global_step": 262320, "epoch": 1561} {"train_loss": -11.921579360961914, "global_step": 262321, "epoch": 1561} {"train_loss": -11.720118522644043, "global_step": 262322, "epoch": 1561} {"train_loss": -11.837371826171875, "global_step": 262323, "epoch": 1561} {"train_loss": -11.438722610473633, "global_step": 262324, "epoch": 1561} {"train_loss": -11.962250709533691, "global_step": 262325, "epoch": 1561} {"train_loss": -11.745393753051758, "global_step": 262326, "epoch": 1561} {"train_loss": -11.898782730102539, "global_step": 262327, "epoch": 1561} {"train_loss": -11.995182037353516, "global_step": 262328, "epoch": 1561} {"train_loss": -12.042181968688965, "global_step": 262329, "epoch": 1561} {"train_loss": -11.941865921020508, "global_step": 262330, "epoch": 1561} {"train_loss": -12.0309476852417, "global_step": 262331, "epoch": 1561} {"train_loss": -11.999019622802734, "global_step": 262332, "epoch": 1561} {"train_loss": -12.033905029296875, "global_step": 262333, "epoch": 1561} {"train_loss": -12.155567169189453, "global_step": 262334, "epoch": 1561} {"train_loss": -11.963013648986816, "global_step": 262335, "epoch": 1561} {"train_loss": -11.781984329223633, "global_step": 262336, "epoch": 1561} {"train_loss": -11.415945053100586, "global_step": 262337, "epoch": 1561} {"train_loss": -11.703017234802246, "global_step": 262338, "epoch": 1561} {"train_loss": -11.685456275939941, "global_step": 262339, "epoch": 1561} {"train_loss": -11.657922744750977, "global_step": 262340, "epoch": 1561} {"train_loss": -11.82730484008789, "global_step": 262341, "epoch": 1561} {"train_loss": -11.560456275939941, "global_step": 262342, "epoch": 1561} {"train_loss": -11.425374984741211, "global_step": 262343, "epoch": 1561} {"train_loss": -11.519725799560547, "global_step": 262344, "epoch": 1561} {"train_loss": -11.509204864501953, "global_step": 262345, "epoch": 1561} {"train_loss": -11.136269569396973, "global_step": 262346, "epoch": 1561} {"train_loss": -11.687578201293945, "global_step": 262347, "epoch": 1561} {"train_loss": -11.860044479370117, "global_step": 262348, "epoch": 1561} {"train_loss": -10.941954612731934, "global_step": 262349, "epoch": 1561} {"train_loss": -11.506465911865234, "global_step": 262350, "epoch": 1561} {"train_loss": -12.132584571838379, "global_step": 262351, "epoch": 1561} {"train_loss": -11.683282852172852, "global_step": 262352, "epoch": 1561} {"train_loss": -11.733789443969727, "global_step": 262353, "epoch": 1561} {"train_loss": -12.017454147338867, "global_step": 262354, "epoch": 1561} {"train_loss": -11.534652709960938, "global_step": 262355, "epoch": 1561} {"train_loss": -11.877397537231445, "global_step": 262356, "epoch": 1561} {"train_loss": -11.842206001281738, "global_step": 262357, "epoch": 1561} {"train_loss": -11.881760597229004, "global_step": 262358, "epoch": 1561} {"train_loss": -11.978408813476562, "global_step": 262359, "epoch": 1561} {"train_loss": -11.969215393066406, "global_step": 262360, "epoch": 1561} {"train_loss": -11.74629020690918, "global_step": 262361, "epoch": 1561} {"train_loss": -12.128785133361816, "global_step": 262362, "epoch": 1561} {"train_loss": -11.815489768981934, "global_step": 262363, "epoch": 1561} {"train_loss": -12.107988357543945, "global_step": 262364, "epoch": 1561} {"train_loss": -11.90424919128418, "global_step": 262365, "epoch": 1561} {"train_loss": -12.253231048583984, "global_step": 262366, "epoch": 1561} {"train_loss": -11.981765747070312, "global_step": 262367, "epoch": 1561} {"train_loss": -11.913525581359863, "global_step": 262368, "epoch": 1561} {"train_loss": -12.11727523803711, "global_step": 262369, "epoch": 1561} {"train_loss": -12.012367248535156, "global_step": 262370, "epoch": 1561} {"train_loss": -12.038185119628906, "global_step": 262371, "epoch": 1561} {"train_loss": -12.075549125671387, "global_step": 262372, "epoch": 1561} {"train_loss": -12.242079734802246, "global_step": 262373, "epoch": 1561} {"train_loss": -12.12691879272461, "global_step": 262374, "epoch": 1561} {"train_loss": -12.040811538696289, "global_step": 262375, "epoch": 1561} {"train_loss": -11.860309600830078, "global_step": 262376, "epoch": 1561} {"train_loss": -12.398903846740723, "global_step": 262377, "epoch": 1561} {"train_loss": -11.90981674194336, "global_step": 262378, "epoch": 1561} {"train_loss": -11.872486114501953, "global_step": 262379, "epoch": 1561} {"train_loss": -11.511685371398926, "global_step": 262380, "epoch": 1561} {"train_loss": -11.699779510498047, "global_step": 262381, "epoch": 1561} {"train_loss": -11.769474029541016, "global_step": 262382, "epoch": 1561} {"train_loss": -11.938020706176758, "global_step": 262383, "epoch": 1561} {"train_loss": -11.8726224899292, "global_step": 262384, "epoch": 1561} {"train_loss": -11.976398468017578, "global_step": 262385, "epoch": 1561} {"train_loss": -11.872259140014648, "global_step": 262386, "epoch": 1561} {"train_loss": -11.941856384277344, "global_step": 262387, "epoch": 1561} {"train_loss": -12.194229125976562, "global_step": 262388, "epoch": 1561} {"train_loss": -12.204894065856934, "global_step": 262389, "epoch": 1561} {"train_loss": -11.860389709472656, "global_step": 262390, "epoch": 1561} {"train_loss": -11.8037109375, "global_step": 262391, "epoch": 1561} {"train_loss": -12.058259963989258, "global_step": 262392, "epoch": 1561} {"train_loss": -12.027318000793457, "global_step": 262393, "epoch": 1561} {"train_loss": -12.139457702636719, "global_step": 262394, "epoch": 1561} {"train_loss": -11.954732894897461, "global_step": 262395, "epoch": 1561} {"train_loss": -11.940607070922852, "global_step": 262396, "epoch": 1561} {"train_loss": -11.958734512329102, "global_step": 262397, "epoch": 1561} {"train_loss": -11.686516761779785, "global_step": 262398, "epoch": 1561} {"train_loss": -11.665416717529297, "global_step": 262399, "epoch": 1561} {"train_loss": -11.453326225280762, "global_step": 262400, "epoch": 1561} {"train_loss": -11.472697257995605, "global_step": 262401, "epoch": 1561} {"train_loss": -11.518508911132812, "global_step": 262402, "epoch": 1561} {"train_loss": -11.153326034545898, "global_step": 262403, "epoch": 1561} {"train_loss": -11.063711166381836, "global_step": 262404, "epoch": 1561} {"train_loss": -11.642176628112793, "global_step": 262405, "epoch": 1561} {"train_loss": -11.63193130493164, "global_step": 262406, "epoch": 1561} {"train_loss": -11.207300186157227, "global_step": 262407, "epoch": 1561} {"train_loss": -11.358055114746094, "global_step": 262408, "epoch": 1561} {"train_loss": -10.724440574645996, "global_step": 262409, "epoch": 1561} {"train_loss": -11.63189697265625, "global_step": 262410, "epoch": 1561} {"train_loss": -11.735891342163086, "global_step": 262411, "epoch": 1561} {"train_loss": -11.193426132202148, "global_step": 262412, "epoch": 1561} {"train_loss": -11.9029541015625, "global_step": 262413, "epoch": 1561} {"train_loss": -11.046218872070312, "global_step": 262414, "epoch": 1561} {"train_loss": -11.677869314239139, "global_step": 262415, "epoch": 1561, "val_loss": 273251.9375} {"train_loss": -11.140253067016602, "global_step": 262416, "epoch": 1562} {"train_loss": -11.08938217163086, "global_step": 262417, "epoch": 1562} {"train_loss": -10.509920120239258, "global_step": 262418, "epoch": 1562} {"train_loss": -11.496484756469727, "global_step": 262419, "epoch": 1562} {"train_loss": -11.710779190063477, "global_step": 262420, "epoch": 1562} {"train_loss": -10.787199020385742, "global_step": 262421, "epoch": 1562} {"train_loss": -11.907499313354492, "global_step": 262422, "epoch": 1562} {"train_loss": -11.331901550292969, "global_step": 262423, "epoch": 1562} {"train_loss": -11.900996208190918, "global_step": 262424, "epoch": 1562} {"train_loss": -11.709946632385254, "global_step": 262425, "epoch": 1562} {"train_loss": -11.790011405944824, "global_step": 262426, "epoch": 1562} {"train_loss": -11.757561683654785, "global_step": 262427, "epoch": 1562} {"train_loss": -11.90316390991211, "global_step": 262428, "epoch": 1562} {"train_loss": -11.70393180847168, "global_step": 262429, "epoch": 1562} {"train_loss": -12.013513565063477, "global_step": 262430, "epoch": 1562} {"train_loss": -11.551395416259766, "global_step": 262431, "epoch": 1562} {"train_loss": -12.098516464233398, "global_step": 262432, "epoch": 1562} {"train_loss": -11.803792953491211, "global_step": 262433, "epoch": 1562} {"train_loss": -11.362649917602539, "global_step": 262434, "epoch": 1562} {"train_loss": -11.954906463623047, "global_step": 262435, "epoch": 1562} {"train_loss": -11.392292022705078, "global_step": 262436, "epoch": 1562} {"train_loss": -11.868672370910645, "global_step": 262437, "epoch": 1562} {"train_loss": -11.69395923614502, "global_step": 262438, "epoch": 1562} {"train_loss": -11.13003158569336, "global_step": 262439, "epoch": 1562} {"train_loss": -11.46114730834961, "global_step": 262440, "epoch": 1562} {"train_loss": -11.836395263671875, "global_step": 262441, "epoch": 1562} {"train_loss": -11.376408576965332, "global_step": 262442, "epoch": 1562} {"train_loss": -11.461578369140625, "global_step": 262443, "epoch": 1562} {"train_loss": -11.547574996948242, "global_step": 262444, "epoch": 1562} {"train_loss": -11.92005729675293, "global_step": 262445, "epoch": 1562} {"train_loss": -11.576717376708984, "global_step": 262446, "epoch": 1562} {"train_loss": -11.719892501831055, "global_step": 262447, "epoch": 1562} {"train_loss": -11.983847618103027, "global_step": 262448, "epoch": 1562} {"train_loss": -11.891544342041016, "global_step": 262449, "epoch": 1562} {"train_loss": -11.621665000915527, "global_step": 262450, "epoch": 1562} {"train_loss": -11.911083221435547, "global_step": 262451, "epoch": 1562} {"train_loss": -12.046866416931152, "global_step": 262452, "epoch": 1562} {"train_loss": -12.035327911376953, "global_step": 262453, "epoch": 1562} {"train_loss": -11.926448822021484, "global_step": 262454, "epoch": 1562} {"train_loss": -12.038934707641602, "global_step": 262455, "epoch": 1562} {"train_loss": -11.684213638305664, "global_step": 262456, "epoch": 1562} {"train_loss": -12.260464668273926, "global_step": 262457, "epoch": 1562} {"train_loss": -11.844099044799805, "global_step": 262458, "epoch": 1562} {"train_loss": -12.174917221069336, "global_step": 262459, "epoch": 1562} {"train_loss": -12.047000885009766, "global_step": 262460, "epoch": 1562} {"train_loss": -12.0238676071167, "global_step": 262461, "epoch": 1562} {"train_loss": -11.923709869384766, "global_step": 262462, "epoch": 1562} {"train_loss": -11.887439727783203, "global_step": 262463, "epoch": 1562} {"train_loss": -11.953474044799805, "global_step": 262464, "epoch": 1562} {"train_loss": -12.181938171386719, "global_step": 262465, "epoch": 1562} {"train_loss": -11.950248718261719, "global_step": 262466, "epoch": 1562} {"train_loss": -11.93906021118164, "global_step": 262467, "epoch": 1562} {"train_loss": -12.190577507019043, "global_step": 262468, "epoch": 1562} {"train_loss": -11.914381980895996, "global_step": 262469, "epoch": 1562} {"train_loss": -12.008872985839844, "global_step": 262470, "epoch": 1562} {"train_loss": -12.151687622070312, "global_step": 262471, "epoch": 1562} {"train_loss": -12.117146492004395, "global_step": 262472, "epoch": 1562} {"train_loss": -12.13299560546875, "global_step": 262473, "epoch": 1562} {"train_loss": -11.764261245727539, "global_step": 262474, "epoch": 1562} {"train_loss": -11.32723617553711, "global_step": 262475, "epoch": 1562} {"train_loss": -11.118963241577148, "global_step": 262476, "epoch": 1562} {"train_loss": -11.964701652526855, "global_step": 262477, "epoch": 1562} {"train_loss": -11.802947998046875, "global_step": 262478, "epoch": 1562} {"train_loss": -11.926324844360352, "global_step": 262479, "epoch": 1562} {"train_loss": -12.10144329071045, "global_step": 262480, "epoch": 1562} {"train_loss": -11.952837944030762, "global_step": 262481, "epoch": 1562} {"train_loss": -11.289554595947266, "global_step": 262482, "epoch": 1562} {"train_loss": -11.600809097290039, "global_step": 262483, "epoch": 1562} {"train_loss": -11.347906112670898, "global_step": 262484, "epoch": 1562} {"train_loss": -11.236474990844727, "global_step": 262485, "epoch": 1562} {"train_loss": -11.10042667388916, "global_step": 262486, "epoch": 1562} {"train_loss": -10.937606811523438, "global_step": 262487, "epoch": 1562} {"train_loss": -11.52783489227295, "global_step": 262488, "epoch": 1562} {"train_loss": -11.438774108886719, "global_step": 262489, "epoch": 1562} {"train_loss": -10.871476173400879, "global_step": 262490, "epoch": 1562} {"train_loss": -11.509445190429688, "global_step": 262491, "epoch": 1562} {"train_loss": -11.191049575805664, "global_step": 262492, "epoch": 1562} {"train_loss": -10.977591514587402, "global_step": 262493, "epoch": 1562} {"train_loss": -11.887630462646484, "global_step": 262494, "epoch": 1562} {"train_loss": -10.600715637207031, "global_step": 262495, "epoch": 1562} {"train_loss": -11.901033401489258, "global_step": 262496, "epoch": 1562} {"train_loss": -10.92688274383545, "global_step": 262497, "epoch": 1562} {"train_loss": -11.523902893066406, "global_step": 262498, "epoch": 1562} {"train_loss": -11.501992225646973, "global_step": 262499, "epoch": 1562} {"train_loss": -11.594642639160156, "global_step": 262500, "epoch": 1562} {"train_loss": -11.578216552734375, "global_step": 262501, "epoch": 1562} {"train_loss": -11.402587890625, "global_step": 262502, "epoch": 1562} {"train_loss": -11.652061462402344, "global_step": 262503, "epoch": 1562} {"train_loss": -11.961308479309082, "global_step": 262504, "epoch": 1562} {"train_loss": -10.903640747070312, "global_step": 262505, "epoch": 1562} {"train_loss": -11.893743515014648, "global_step": 262506, "epoch": 1562} {"train_loss": -11.803711891174316, "global_step": 262507, "epoch": 1562} {"train_loss": -12.186080932617188, "global_step": 262508, "epoch": 1562} {"train_loss": -11.776300430297852, "global_step": 262509, "epoch": 1562} {"train_loss": -11.792875289916992, "global_step": 262510, "epoch": 1562} {"train_loss": -11.579469680786133, "global_step": 262511, "epoch": 1562} {"train_loss": -11.689702987670898, "global_step": 262512, "epoch": 1562} {"train_loss": -11.847822189331055, "global_step": 262513, "epoch": 1562} {"train_loss": -11.890962600708008, "global_step": 262514, "epoch": 1562} {"train_loss": -11.599445343017578, "global_step": 262515, "epoch": 1562} {"train_loss": -11.878324508666992, "global_step": 262516, "epoch": 1562} {"train_loss": -11.459477424621582, "global_step": 262517, "epoch": 1562} {"train_loss": -11.043110847473145, "global_step": 262518, "epoch": 1562} {"train_loss": -11.760074615478516, "global_step": 262519, "epoch": 1562} {"train_loss": -10.819658279418945, "global_step": 262520, "epoch": 1562} {"train_loss": -11.62991714477539, "global_step": 262521, "epoch": 1562} {"train_loss": -11.15951919555664, "global_step": 262522, "epoch": 1562} {"train_loss": -11.759737968444824, "global_step": 262523, "epoch": 1562} {"train_loss": -11.3505220413208, "global_step": 262524, "epoch": 1562} {"train_loss": -11.134081840515137, "global_step": 262525, "epoch": 1562} {"train_loss": -11.87009334564209, "global_step": 262526, "epoch": 1562} {"train_loss": -10.702353477478027, "global_step": 262527, "epoch": 1562} {"train_loss": -11.852170944213867, "global_step": 262528, "epoch": 1562} {"train_loss": -10.561925888061523, "global_step": 262529, "epoch": 1562} {"train_loss": -11.4264497756958, "global_step": 262530, "epoch": 1562} {"train_loss": -11.003150939941406, "global_step": 262531, "epoch": 1562} {"train_loss": -11.554213523864746, "global_step": 262532, "epoch": 1562} {"train_loss": -11.603140830993652, "global_step": 262533, "epoch": 1562} {"train_loss": -11.533437728881836, "global_step": 262534, "epoch": 1562} {"train_loss": -11.672369003295898, "global_step": 262535, "epoch": 1562} {"train_loss": -11.173604965209961, "global_step": 262536, "epoch": 1562} {"train_loss": -11.836845397949219, "global_step": 262537, "epoch": 1562} {"train_loss": -11.780095100402832, "global_step": 262538, "epoch": 1562} {"train_loss": -11.981618881225586, "global_step": 262539, "epoch": 1562} {"train_loss": -11.77260971069336, "global_step": 262540, "epoch": 1562} {"train_loss": -11.882368087768555, "global_step": 262541, "epoch": 1562} {"train_loss": -11.938971519470215, "global_step": 262542, "epoch": 1562} {"train_loss": -11.413531303405762, "global_step": 262543, "epoch": 1562} {"train_loss": -11.690793991088867, "global_step": 262544, "epoch": 1562} {"train_loss": -11.897361755371094, "global_step": 262545, "epoch": 1562} {"train_loss": -12.025247573852539, "global_step": 262546, "epoch": 1562} {"train_loss": -11.892742156982422, "global_step": 262547, "epoch": 1562} {"train_loss": -11.55554485321045, "global_step": 262548, "epoch": 1562} {"train_loss": -11.865740776062012, "global_step": 262549, "epoch": 1562} {"train_loss": -11.70883560180664, "global_step": 262550, "epoch": 1562} {"train_loss": -11.757619857788086, "global_step": 262551, "epoch": 1562} {"train_loss": -11.754621505737305, "global_step": 262552, "epoch": 1562} {"train_loss": -11.704665184020996, "global_step": 262553, "epoch": 1562} {"train_loss": -11.410761833190918, "global_step": 262554, "epoch": 1562} {"train_loss": -11.950164794921875, "global_step": 262555, "epoch": 1562} {"train_loss": -11.923526763916016, "global_step": 262556, "epoch": 1562} {"train_loss": -11.774221420288086, "global_step": 262557, "epoch": 1562} {"train_loss": -11.966914176940918, "global_step": 262558, "epoch": 1562} {"train_loss": -11.274311065673828, "global_step": 262559, "epoch": 1562} {"train_loss": -11.899312019348145, "global_step": 262560, "epoch": 1562} {"train_loss": -11.402270317077637, "global_step": 262561, "epoch": 1562} {"train_loss": -12.017681121826172, "global_step": 262562, "epoch": 1562} {"train_loss": -11.045748710632324, "global_step": 262563, "epoch": 1562} {"train_loss": -11.895562171936035, "global_step": 262564, "epoch": 1562} {"train_loss": -11.634025573730469, "global_step": 262565, "epoch": 1562} {"train_loss": -11.985194206237793, "global_step": 262566, "epoch": 1562} {"train_loss": -11.937227249145508, "global_step": 262567, "epoch": 1562} {"train_loss": -11.820533752441406, "global_step": 262568, "epoch": 1562} {"train_loss": -12.116527557373047, "global_step": 262569, "epoch": 1562} {"train_loss": -11.727415084838867, "global_step": 262570, "epoch": 1562} {"train_loss": -12.146817207336426, "global_step": 262571, "epoch": 1562} {"train_loss": -11.81535530090332, "global_step": 262572, "epoch": 1562} {"train_loss": -12.121881484985352, "global_step": 262573, "epoch": 1562} {"train_loss": -12.194997787475586, "global_step": 262574, "epoch": 1562} {"train_loss": -11.975440979003906, "global_step": 262575, "epoch": 1562} {"train_loss": -12.061339378356934, "global_step": 262576, "epoch": 1562} {"train_loss": -12.181385040283203, "global_step": 262577, "epoch": 1562} {"train_loss": -12.00452995300293, "global_step": 262578, "epoch": 1562} {"train_loss": -12.016739845275879, "global_step": 262579, "epoch": 1562} {"train_loss": -11.516122817993164, "global_step": 262580, "epoch": 1562} {"train_loss": -11.376115798950195, "global_step": 262581, "epoch": 1562} {"train_loss": -12.006763458251953, "global_step": 262582, "epoch": 1562} {"train_loss": -11.671643132255191, "global_step": 262583, "epoch": 1562, "val_loss": 273932.8125} {"train_loss": -11.113340377807617, "global_step": 262584, "epoch": 1563} {"train_loss": -11.140172958374023, "global_step": 262585, "epoch": 1563} {"train_loss": -11.044731140136719, "global_step": 262586, "epoch": 1563} {"train_loss": -11.382635116577148, "global_step": 262587, "epoch": 1563} {"train_loss": -11.725204467773438, "global_step": 262588, "epoch": 1563} {"train_loss": -11.459203720092773, "global_step": 262589, "epoch": 1563} {"train_loss": -12.068702697753906, "global_step": 262590, "epoch": 1563} {"train_loss": -11.588040351867676, "global_step": 262591, "epoch": 1563} {"train_loss": -11.95191764831543, "global_step": 262592, "epoch": 1563} {"train_loss": -11.534273147583008, "global_step": 262593, "epoch": 1563} {"train_loss": -11.721334457397461, "global_step": 262594, "epoch": 1563} {"train_loss": -11.455259323120117, "global_step": 262595, "epoch": 1563} {"train_loss": -11.557657241821289, "global_step": 262596, "epoch": 1563} {"train_loss": -11.634139060974121, "global_step": 262597, "epoch": 1563} {"train_loss": -11.461345672607422, "global_step": 262598, "epoch": 1563} {"train_loss": -11.964369773864746, "global_step": 262599, "epoch": 1563} {"train_loss": -11.205764770507812, "global_step": 262600, "epoch": 1563} {"train_loss": -11.356783866882324, "global_step": 262601, "epoch": 1563} {"train_loss": -11.649925231933594, "global_step": 262602, "epoch": 1563} {"train_loss": -11.476114273071289, "global_step": 262603, "epoch": 1563} {"train_loss": -11.93049430847168, "global_step": 262604, "epoch": 1563} {"train_loss": -11.4136962890625, "global_step": 262605, "epoch": 1563} {"train_loss": -12.04302978515625, "global_step": 262606, "epoch": 1563} {"train_loss": -11.961358070373535, "global_step": 262607, "epoch": 1563} {"train_loss": -12.045981407165527, "global_step": 262608, "epoch": 1563} {"train_loss": -11.715106964111328, "global_step": 262609, "epoch": 1563} {"train_loss": -12.26957893371582, "global_step": 262610, "epoch": 1563} {"train_loss": -12.023122787475586, "global_step": 262611, "epoch": 1563} {"train_loss": -11.972944259643555, "global_step": 262612, "epoch": 1563} {"train_loss": -11.898176193237305, "global_step": 262613, "epoch": 1563} {"train_loss": -12.053754806518555, "global_step": 262614, "epoch": 1563} {"train_loss": -12.001009941101074, "global_step": 262615, "epoch": 1563} {"train_loss": -11.853082656860352, "global_step": 262616, "epoch": 1563} {"train_loss": -12.109956741333008, "global_step": 262617, "epoch": 1563} {"train_loss": -11.751668930053711, "global_step": 262618, "epoch": 1563} {"train_loss": -11.559682846069336, "global_step": 262619, "epoch": 1563} {"train_loss": -12.013050079345703, "global_step": 262620, "epoch": 1563} {"train_loss": -11.97182846069336, "global_step": 262621, "epoch": 1563} {"train_loss": -11.921730041503906, "global_step": 262622, "epoch": 1563} {"train_loss": -12.196731567382812, "global_step": 262623, "epoch": 1563} {"train_loss": -12.056406021118164, "global_step": 262624, "epoch": 1563} {"train_loss": -12.073101997375488, "global_step": 262625, "epoch": 1563} {"train_loss": -11.962448120117188, "global_step": 262626, "epoch": 1563} {"train_loss": -11.688230514526367, "global_step": 262627, "epoch": 1563} {"train_loss": -11.312973976135254, "global_step": 262628, "epoch": 1563} {"train_loss": -12.151126861572266, "global_step": 262629, "epoch": 1563} {"train_loss": -11.848649978637695, "global_step": 262630, "epoch": 1563} {"train_loss": -12.003801345825195, "global_step": 262631, "epoch": 1563} {"train_loss": -11.859458923339844, "global_step": 262632, "epoch": 1563} {"train_loss": -11.876311302185059, "global_step": 262633, "epoch": 1563} {"train_loss": -11.912565231323242, "global_step": 262634, "epoch": 1563} {"train_loss": -12.17555046081543, "global_step": 262635, "epoch": 1563} {"train_loss": -11.973806381225586, "global_step": 262636, "epoch": 1563} {"train_loss": -11.991414070129395, "global_step": 262637, "epoch": 1563} {"train_loss": -12.096080780029297, "global_step": 262638, "epoch": 1563} {"train_loss": -12.045979499816895, "global_step": 262639, "epoch": 1563} {"train_loss": -11.772767066955566, "global_step": 262640, "epoch": 1563} {"train_loss": -11.473834991455078, "global_step": 262641, "epoch": 1563} {"train_loss": -11.942136764526367, "global_step": 262642, "epoch": 1563} {"train_loss": -12.340896606445312, "global_step": 262643, "epoch": 1563} {"train_loss": -12.011445999145508, "global_step": 262644, "epoch": 1563} {"train_loss": -11.826064109802246, "global_step": 262645, "epoch": 1563} {"train_loss": -11.95422649383545, "global_step": 262646, "epoch": 1563} {"train_loss": -12.036478042602539, "global_step": 262647, "epoch": 1563} {"train_loss": -12.092975616455078, "global_step": 262648, "epoch": 1563} {"train_loss": -12.12590217590332, "global_step": 262649, "epoch": 1563} {"train_loss": -12.19861888885498, "global_step": 262650, "epoch": 1563} {"train_loss": -12.005216598510742, "global_step": 262651, "epoch": 1563} {"train_loss": -12.197187423706055, "global_step": 262652, "epoch": 1563} {"train_loss": -11.915619850158691, "global_step": 262653, "epoch": 1563} {"train_loss": -12.241249084472656, "global_step": 262654, "epoch": 1563} {"train_loss": -12.148981094360352, "global_step": 262655, "epoch": 1563} {"train_loss": -12.107450485229492, "global_step": 262656, "epoch": 1563} {"train_loss": -12.255012512207031, "global_step": 262657, "epoch": 1563} {"train_loss": -11.896353721618652, "global_step": 262658, "epoch": 1563} {"train_loss": -12.214090347290039, "global_step": 262659, "epoch": 1563} {"train_loss": -12.266998291015625, "global_step": 262660, "epoch": 1563} {"train_loss": -12.097862243652344, "global_step": 262661, "epoch": 1563} {"train_loss": -12.234848022460938, "global_step": 262662, "epoch": 1563} {"train_loss": -12.072010040283203, "global_step": 262663, "epoch": 1563} {"train_loss": -11.958781242370605, "global_step": 262664, "epoch": 1563} {"train_loss": -11.898330688476562, "global_step": 262665, "epoch": 1563} {"train_loss": -11.27714729309082, "global_step": 262666, "epoch": 1563} {"train_loss": -11.505578994750977, "global_step": 262667, "epoch": 1563} {"train_loss": -11.712007522583008, "global_step": 262668, "epoch": 1563} {"train_loss": -11.901851654052734, "global_step": 262669, "epoch": 1563} {"train_loss": -11.049286842346191, "global_step": 262670, "epoch": 1563} {"train_loss": -10.518558502197266, "global_step": 262671, "epoch": 1563} {"train_loss": -11.00790786743164, "global_step": 262672, "epoch": 1563} {"train_loss": -9.942404747009277, "global_step": 262673, "epoch": 1563} {"train_loss": -9.375968933105469, "global_step": 262674, "epoch": 1563} {"train_loss": -11.295909881591797, "global_step": 262675, "epoch": 1563} {"train_loss": -9.257121086120605, "global_step": 262676, "epoch": 1563} {"train_loss": -10.060750961303711, "global_step": 262677, "epoch": 1563} {"train_loss": -10.723916053771973, "global_step": 262678, "epoch": 1563} {"train_loss": -7.155201435089111, "global_step": 262679, "epoch": 1563} {"train_loss": -10.478923797607422, "global_step": 262680, "epoch": 1563} {"train_loss": -8.164955139160156, "global_step": 262681, "epoch": 1563} {"train_loss": -8.31049633026123, "global_step": 262682, "epoch": 1563} {"train_loss": -10.826595306396484, "global_step": 262683, "epoch": 1563} {"train_loss": -10.774679183959961, "global_step": 262684, "epoch": 1563} {"train_loss": -9.470359802246094, "global_step": 262685, "epoch": 1563} {"train_loss": -11.46403694152832, "global_step": 262686, "epoch": 1563} {"train_loss": -10.144990921020508, "global_step": 262687, "epoch": 1563} {"train_loss": -9.859554290771484, "global_step": 262688, "epoch": 1563} {"train_loss": -11.543445587158203, "global_step": 262689, "epoch": 1563} {"train_loss": -9.946603775024414, "global_step": 262690, "epoch": 1563} {"train_loss": -10.339166641235352, "global_step": 262691, "epoch": 1563} {"train_loss": -10.898685455322266, "global_step": 262692, "epoch": 1563} {"train_loss": -10.418974876403809, "global_step": 262693, "epoch": 1563} {"train_loss": -11.516386032104492, "global_step": 262694, "epoch": 1563} {"train_loss": -11.168603897094727, "global_step": 262695, "epoch": 1563} {"train_loss": -11.301794052124023, "global_step": 262696, "epoch": 1563} {"train_loss": -11.36946964263916, "global_step": 262697, "epoch": 1563} {"train_loss": -11.19683837890625, "global_step": 262698, "epoch": 1563} {"train_loss": -11.212169647216797, "global_step": 262699, "epoch": 1563} {"train_loss": -11.651369094848633, "global_step": 262700, "epoch": 1563} {"train_loss": -11.293670654296875, "global_step": 262701, "epoch": 1563} {"train_loss": -11.462112426757812, "global_step": 262702, "epoch": 1563} {"train_loss": -11.525687217712402, "global_step": 262703, "epoch": 1563} {"train_loss": -11.178622245788574, "global_step": 262704, "epoch": 1563} {"train_loss": -11.746578216552734, "global_step": 262705, "epoch": 1563} {"train_loss": -11.098777770996094, "global_step": 262706, "epoch": 1563} {"train_loss": -11.558942794799805, "global_step": 262707, "epoch": 1563} {"train_loss": -11.260475158691406, "global_step": 262708, "epoch": 1563} {"train_loss": -11.826092720031738, "global_step": 262709, "epoch": 1563} {"train_loss": -11.458051681518555, "global_step": 262710, "epoch": 1563} {"train_loss": -11.382533073425293, "global_step": 262711, "epoch": 1563} {"train_loss": -11.734983444213867, "global_step": 262712, "epoch": 1563} {"train_loss": -11.569626808166504, "global_step": 262713, "epoch": 1563} {"train_loss": -11.753186225891113, "global_step": 262714, "epoch": 1563} {"train_loss": -11.80830192565918, "global_step": 262715, "epoch": 1563} {"train_loss": -11.729961395263672, "global_step": 262716, "epoch": 1563} {"train_loss": -11.732121467590332, "global_step": 262717, "epoch": 1563} {"train_loss": -11.846067428588867, "global_step": 262718, "epoch": 1563} {"train_loss": -11.690130233764648, "global_step": 262719, "epoch": 1563} {"train_loss": -11.925368309020996, "global_step": 262720, "epoch": 1563} {"train_loss": -11.677032470703125, "global_step": 262721, "epoch": 1563} {"train_loss": -11.996614456176758, "global_step": 262722, "epoch": 1563} {"train_loss": -12.05793571472168, "global_step": 262723, "epoch": 1563} {"train_loss": -11.981019973754883, "global_step": 262724, "epoch": 1563} {"train_loss": -11.756341934204102, "global_step": 262725, "epoch": 1563} {"train_loss": -12.035100936889648, "global_step": 262726, "epoch": 1563} {"train_loss": -12.088714599609375, "global_step": 262727, "epoch": 1563} {"train_loss": -11.779396057128906, "global_step": 262728, "epoch": 1563} {"train_loss": -12.191360473632812, "global_step": 262729, "epoch": 1563} {"train_loss": -12.061735153198242, "global_step": 262730, "epoch": 1563} {"train_loss": -12.031255722045898, "global_step": 262731, "epoch": 1563} {"train_loss": -12.101343154907227, "global_step": 262732, "epoch": 1563} {"train_loss": -12.132095336914062, "global_step": 262733, "epoch": 1563} {"train_loss": -11.896303176879883, "global_step": 262734, "epoch": 1563} {"train_loss": -11.844244003295898, "global_step": 262735, "epoch": 1563} {"train_loss": -11.97233772277832, "global_step": 262736, "epoch": 1563} {"train_loss": -11.90756607055664, "global_step": 262737, "epoch": 1563} {"train_loss": -11.975109100341797, "global_step": 262738, "epoch": 1563} {"train_loss": -11.974780082702637, "global_step": 262739, "epoch": 1563} {"train_loss": -11.917341232299805, "global_step": 262740, "epoch": 1563} {"train_loss": -11.64717960357666, "global_step": 262741, "epoch": 1563} {"train_loss": -11.555727005004883, "global_step": 262742, "epoch": 1563} {"train_loss": -11.618816375732422, "global_step": 262743, "epoch": 1563} {"train_loss": -12.003396987915039, "global_step": 262744, "epoch": 1563} {"train_loss": -11.821317672729492, "global_step": 262745, "epoch": 1563} {"train_loss": -12.086440086364746, "global_step": 262746, "epoch": 1563} {"train_loss": -12.10630989074707, "global_step": 262747, "epoch": 1563} {"train_loss": -11.845379829406738, "global_step": 262748, "epoch": 1563} {"train_loss": -11.964643478393555, "global_step": 262749, "epoch": 1563} {"train_loss": -12.120006561279297, "global_step": 262750, "epoch": 1563} {"train_loss": -11.57108408780325, "global_step": 262751, "epoch": 1563, "val_loss": 269508.65625} {"train_loss": -12.094039916992188, "global_step": 262752, "epoch": 1564} {"train_loss": -11.920644760131836, "global_step": 262753, "epoch": 1564} {"train_loss": -12.216880798339844, "global_step": 262754, "epoch": 1564} {"train_loss": -11.90277099609375, "global_step": 262755, "epoch": 1564} {"train_loss": -11.981861114501953, "global_step": 262756, "epoch": 1564} {"train_loss": -11.875926971435547, "global_step": 262757, "epoch": 1564} {"train_loss": -11.983881950378418, "global_step": 262758, "epoch": 1564} {"train_loss": -11.74866008758545, "global_step": 262759, "epoch": 1564} {"train_loss": -12.271800994873047, "global_step": 262760, "epoch": 1564} {"train_loss": -11.840301513671875, "global_step": 262761, "epoch": 1564} {"train_loss": -12.172142028808594, "global_step": 262762, "epoch": 1564} {"train_loss": -12.043336868286133, "global_step": 262763, "epoch": 1564} {"train_loss": -11.734135627746582, "global_step": 262764, "epoch": 1564} {"train_loss": -11.893221855163574, "global_step": 262765, "epoch": 1564} {"train_loss": -11.80093002319336, "global_step": 262766, "epoch": 1564} {"train_loss": -11.932847023010254, "global_step": 262767, "epoch": 1564} {"train_loss": -11.968422889709473, "global_step": 262768, "epoch": 1564} {"train_loss": -11.773258209228516, "global_step": 262769, "epoch": 1564} {"train_loss": -11.676525115966797, "global_step": 262770, "epoch": 1564} {"train_loss": -11.831825256347656, "global_step": 262771, "epoch": 1564} {"train_loss": -11.716064453125, "global_step": 262772, "epoch": 1564} {"train_loss": -11.647542953491211, "global_step": 262773, "epoch": 1564} {"train_loss": -11.871089935302734, "global_step": 262774, "epoch": 1564} {"train_loss": -11.969953536987305, "global_step": 262775, "epoch": 1564} {"train_loss": -11.661700248718262, "global_step": 262776, "epoch": 1564} {"train_loss": -11.878304481506348, "global_step": 262777, "epoch": 1564} {"train_loss": -12.193147659301758, "global_step": 262778, "epoch": 1564} {"train_loss": -11.54615306854248, "global_step": 262779, "epoch": 1564} {"train_loss": -11.65806770324707, "global_step": 262780, "epoch": 1564} {"train_loss": -11.35700798034668, "global_step": 262781, "epoch": 1564} {"train_loss": -11.611992835998535, "global_step": 262782, "epoch": 1564} {"train_loss": -12.073942184448242, "global_step": 262783, "epoch": 1564} {"train_loss": -11.90876293182373, "global_step": 262784, "epoch": 1564} {"train_loss": -11.684535026550293, "global_step": 262785, "epoch": 1564} {"train_loss": -11.884574890136719, "global_step": 262786, "epoch": 1564} {"train_loss": -11.95893669128418, "global_step": 262787, "epoch": 1564} {"train_loss": -12.11383056640625, "global_step": 262788, "epoch": 1564} {"train_loss": -11.299535751342773, "global_step": 262789, "epoch": 1564} {"train_loss": -10.777796745300293, "global_step": 262790, "epoch": 1564} {"train_loss": -10.986287117004395, "global_step": 262791, "epoch": 1564} {"train_loss": -11.658614158630371, "global_step": 262792, "epoch": 1564} {"train_loss": -11.163040161132812, "global_step": 262793, "epoch": 1564} {"train_loss": -11.194458961486816, "global_step": 262794, "epoch": 1564} {"train_loss": -11.451268196105957, "global_step": 262795, "epoch": 1564} {"train_loss": -11.46876335144043, "global_step": 262796, "epoch": 1564} {"train_loss": -10.459548950195312, "global_step": 262797, "epoch": 1564} {"train_loss": -11.232450485229492, "global_step": 262798, "epoch": 1564} {"train_loss": -11.15913200378418, "global_step": 262799, "epoch": 1564} {"train_loss": -10.936738014221191, "global_step": 262800, "epoch": 1564} {"train_loss": -11.487943649291992, "global_step": 262801, "epoch": 1564} {"train_loss": -11.677391052246094, "global_step": 262802, "epoch": 1564} {"train_loss": -11.787064552307129, "global_step": 262803, "epoch": 1564} {"train_loss": -11.451172828674316, "global_step": 262804, "epoch": 1564} {"train_loss": -11.864502906799316, "global_step": 262805, "epoch": 1564} {"train_loss": -11.593244552612305, "global_step": 262806, "epoch": 1564} {"train_loss": -11.985878944396973, "global_step": 262807, "epoch": 1564} {"train_loss": -11.644643783569336, "global_step": 262808, "epoch": 1564} {"train_loss": -11.82362174987793, "global_step": 262809, "epoch": 1564} {"train_loss": -11.611961364746094, "global_step": 262810, "epoch": 1564} {"train_loss": -11.83475112915039, "global_step": 262811, "epoch": 1564} {"train_loss": -11.65640640258789, "global_step": 262812, "epoch": 1564} {"train_loss": -11.966169357299805, "global_step": 262813, "epoch": 1564} {"train_loss": -11.889973640441895, "global_step": 262814, "epoch": 1564} {"train_loss": -11.764175415039062, "global_step": 262815, "epoch": 1564} {"train_loss": -11.783712387084961, "global_step": 262816, "epoch": 1564} {"train_loss": -11.525564193725586, "global_step": 262817, "epoch": 1564} {"train_loss": -11.878623962402344, "global_step": 262818, "epoch": 1564} {"train_loss": -11.206668853759766, "global_step": 262819, "epoch": 1564} {"train_loss": -11.498047828674316, "global_step": 262820, "epoch": 1564} {"train_loss": -11.236092567443848, "global_step": 262821, "epoch": 1564} {"train_loss": -12.126705169677734, "global_step": 262822, "epoch": 1564} {"train_loss": -11.744895935058594, "global_step": 262823, "epoch": 1564} {"train_loss": -11.880146980285645, "global_step": 262824, "epoch": 1564} {"train_loss": -11.856082916259766, "global_step": 262825, "epoch": 1564} {"train_loss": -11.61815071105957, "global_step": 262826, "epoch": 1564} {"train_loss": -11.707515716552734, "global_step": 262827, "epoch": 1564} {"train_loss": -11.650907516479492, "global_step": 262828, "epoch": 1564} {"train_loss": -12.133495330810547, "global_step": 262829, "epoch": 1564} {"train_loss": -11.27499008178711, "global_step": 262830, "epoch": 1564} {"train_loss": -12.036230087280273, "global_step": 262831, "epoch": 1564} {"train_loss": -11.983572959899902, "global_step": 262832, "epoch": 1564} {"train_loss": -11.847755432128906, "global_step": 262833, "epoch": 1564} {"train_loss": -11.877068519592285, "global_step": 262834, "epoch": 1564} {"train_loss": -12.25444221496582, "global_step": 262835, "epoch": 1564} {"train_loss": -11.782694816589355, "global_step": 262836, "epoch": 1564} {"train_loss": -11.90041732788086, "global_step": 262837, "epoch": 1564} {"train_loss": -11.820281982421875, "global_step": 262838, "epoch": 1564} {"train_loss": -11.341535568237305, "global_step": 262839, "epoch": 1564} {"train_loss": -11.709842681884766, "global_step": 262840, "epoch": 1564} {"train_loss": -11.696794509887695, "global_step": 262841, "epoch": 1564} {"train_loss": -11.937215805053711, "global_step": 262842, "epoch": 1564} {"train_loss": -12.035889625549316, "global_step": 262843, "epoch": 1564} {"train_loss": -11.953207015991211, "global_step": 262844, "epoch": 1564} {"train_loss": -11.737184524536133, "global_step": 262845, "epoch": 1564} {"train_loss": -11.95187759399414, "global_step": 262846, "epoch": 1564} {"train_loss": -11.768144607543945, "global_step": 262847, "epoch": 1564} {"train_loss": -11.170808792114258, "global_step": 262848, "epoch": 1564} {"train_loss": -11.797685623168945, "global_step": 262849, "epoch": 1564} {"train_loss": -11.267068862915039, "global_step": 262850, "epoch": 1564} {"train_loss": -10.935467720031738, "global_step": 262851, "epoch": 1564} {"train_loss": -11.371575355529785, "global_step": 262852, "epoch": 1564} {"train_loss": -11.849925994873047, "global_step": 262853, "epoch": 1564} {"train_loss": -11.219046592712402, "global_step": 262854, "epoch": 1564} {"train_loss": -11.976486206054688, "global_step": 262855, "epoch": 1564} {"train_loss": -11.344890594482422, "global_step": 262856, "epoch": 1564} {"train_loss": -11.151288986206055, "global_step": 262857, "epoch": 1564} {"train_loss": -11.5851411819458, "global_step": 262858, "epoch": 1564} {"train_loss": -10.0490140914917, "global_step": 262859, "epoch": 1564} {"train_loss": -11.242036819458008, "global_step": 262860, "epoch": 1564} {"train_loss": -11.604631423950195, "global_step": 262861, "epoch": 1564} {"train_loss": -10.158489227294922, "global_step": 262862, "epoch": 1564} {"train_loss": -12.005964279174805, "global_step": 262863, "epoch": 1564} {"train_loss": -11.088857650756836, "global_step": 262864, "epoch": 1564} {"train_loss": -11.352256774902344, "global_step": 262865, "epoch": 1564} {"train_loss": -11.778017044067383, "global_step": 262866, "epoch": 1564} {"train_loss": -11.050280570983887, "global_step": 262867, "epoch": 1564} {"train_loss": -11.707049369812012, "global_step": 262868, "epoch": 1564} {"train_loss": -11.18830680847168, "global_step": 262869, "epoch": 1564} {"train_loss": -11.059103012084961, "global_step": 262870, "epoch": 1564} {"train_loss": -11.732351303100586, "global_step": 262871, "epoch": 1564} {"train_loss": -11.362201690673828, "global_step": 262872, "epoch": 1564} {"train_loss": -11.784126281738281, "global_step": 262873, "epoch": 1564} {"train_loss": -11.328365325927734, "global_step": 262874, "epoch": 1564} {"train_loss": -11.856595993041992, "global_step": 262875, "epoch": 1564} {"train_loss": -11.845514297485352, "global_step": 262876, "epoch": 1564} {"train_loss": -11.961325645446777, "global_step": 262877, "epoch": 1564} {"train_loss": -11.874460220336914, "global_step": 262878, "epoch": 1564} {"train_loss": -11.988275527954102, "global_step": 262879, "epoch": 1564} {"train_loss": -11.994162559509277, "global_step": 262880, "epoch": 1564} {"train_loss": -11.910388946533203, "global_step": 262881, "epoch": 1564} {"train_loss": -11.945708274841309, "global_step": 262882, "epoch": 1564} {"train_loss": -11.928089141845703, "global_step": 262883, "epoch": 1564} {"train_loss": -11.898321151733398, "global_step": 262884, "epoch": 1564} {"train_loss": -11.728302955627441, "global_step": 262885, "epoch": 1564} {"train_loss": -11.920700073242188, "global_step": 262886, "epoch": 1564} {"train_loss": -12.025810241699219, "global_step": 262887, "epoch": 1564} {"train_loss": -12.125802993774414, "global_step": 262888, "epoch": 1564} {"train_loss": -11.974660873413086, "global_step": 262889, "epoch": 1564} {"train_loss": -12.126516342163086, "global_step": 262890, "epoch": 1564} {"train_loss": -11.996435165405273, "global_step": 262891, "epoch": 1564} {"train_loss": -12.190690994262695, "global_step": 262892, "epoch": 1564} {"train_loss": -12.073066711425781, "global_step": 262893, "epoch": 1564} {"train_loss": -12.125465393066406, "global_step": 262894, "epoch": 1564} {"train_loss": -12.15938949584961, "global_step": 262895, "epoch": 1564} {"train_loss": -12.003641128540039, "global_step": 262896, "epoch": 1564} {"train_loss": -12.157646179199219, "global_step": 262897, "epoch": 1564} {"train_loss": -12.134672164916992, "global_step": 262898, "epoch": 1564} {"train_loss": -12.18587875366211, "global_step": 262899, "epoch": 1564} {"train_loss": -12.30868911743164, "global_step": 262900, "epoch": 1564} {"train_loss": -12.318502426147461, "global_step": 262901, "epoch": 1564} {"train_loss": -12.212059020996094, "global_step": 262902, "epoch": 1564} {"train_loss": -12.071158409118652, "global_step": 262903, "epoch": 1564} {"train_loss": -12.344751358032227, "global_step": 262904, "epoch": 1564} {"train_loss": -12.241081237792969, "global_step": 262905, "epoch": 1564} {"train_loss": -12.426780700683594, "global_step": 262906, "epoch": 1564} {"train_loss": -12.16727352142334, "global_step": 262907, "epoch": 1564} {"train_loss": -12.329151153564453, "global_step": 262908, "epoch": 1564} {"train_loss": -12.410402297973633, "global_step": 262909, "epoch": 1564} {"train_loss": -12.241567611694336, "global_step": 262910, "epoch": 1564} {"train_loss": -12.355734825134277, "global_step": 262911, "epoch": 1564} {"train_loss": -12.41610336303711, "global_step": 262912, "epoch": 1564} {"train_loss": -12.350687026977539, "global_step": 262913, "epoch": 1564} {"train_loss": -12.036449432373047, "global_step": 262914, "epoch": 1564} {"train_loss": -12.257970809936523, "global_step": 262915, "epoch": 1564} {"train_loss": -12.51140022277832, "global_step": 262916, "epoch": 1564} {"train_loss": -12.482704162597656, "global_step": 262917, "epoch": 1564} {"train_loss": -12.450235366821289, "global_step": 262918, "epoch": 1564} {"train_loss": -11.77420863651094, "global_step": 262919, "epoch": 1564, "val_loss": 268852.78125} {"train_loss": -12.299874305725098, "global_step": 262920, "epoch": 1565} {"train_loss": -12.269599914550781, "global_step": 262921, "epoch": 1565} {"train_loss": -12.312663078308105, "global_step": 262922, "epoch": 1565} {"train_loss": -11.802515983581543, "global_step": 262923, "epoch": 1565} {"train_loss": -12.088533401489258, "global_step": 262924, "epoch": 1565} {"train_loss": -11.827877044677734, "global_step": 262925, "epoch": 1565} {"train_loss": -11.806297302246094, "global_step": 262926, "epoch": 1565} {"train_loss": -10.735699653625488, "global_step": 262927, "epoch": 1565} {"train_loss": -11.28095817565918, "global_step": 262928, "epoch": 1565} {"train_loss": -10.939882278442383, "global_step": 262929, "epoch": 1565} {"train_loss": -11.604608535766602, "global_step": 262930, "epoch": 1565} {"train_loss": -10.666357040405273, "global_step": 262931, "epoch": 1565} {"train_loss": -10.239141464233398, "global_step": 262932, "epoch": 1565} {"train_loss": -10.344770431518555, "global_step": 262933, "epoch": 1565} {"train_loss": -10.181349754333496, "global_step": 262934, "epoch": 1565} {"train_loss": -9.262128829956055, "global_step": 262935, "epoch": 1565} {"train_loss": -9.403083801269531, "global_step": 262936, "epoch": 1565} {"train_loss": -10.388232231140137, "global_step": 262937, "epoch": 1565} {"train_loss": -10.40300178527832, "global_step": 262938, "epoch": 1565} {"train_loss": -8.888769149780273, "global_step": 262939, "epoch": 1565} {"train_loss": -11.092973709106445, "global_step": 262940, "epoch": 1565} {"train_loss": -9.612690925598145, "global_step": 262941, "epoch": 1565} {"train_loss": -10.541313171386719, "global_step": 262942, "epoch": 1565} {"train_loss": -9.747360229492188, "global_step": 262943, "epoch": 1565} {"train_loss": -11.669175148010254, "global_step": 262944, "epoch": 1565} {"train_loss": -9.833931922912598, "global_step": 262945, "epoch": 1565} {"train_loss": -10.912875175476074, "global_step": 262946, "epoch": 1565} {"train_loss": -10.717679977416992, "global_step": 262947, "epoch": 1565} {"train_loss": -10.892888069152832, "global_step": 262948, "epoch": 1565} {"train_loss": -11.088462829589844, "global_step": 262949, "epoch": 1565} {"train_loss": -10.984979629516602, "global_step": 262950, "epoch": 1565} {"train_loss": -11.656500816345215, "global_step": 262951, "epoch": 1565} {"train_loss": -10.926568031311035, "global_step": 262952, "epoch": 1565} {"train_loss": -11.73128890991211, "global_step": 262953, "epoch": 1565} {"train_loss": -10.92920207977295, "global_step": 262954, "epoch": 1565} {"train_loss": -11.555636405944824, "global_step": 262955, "epoch": 1565} {"train_loss": -11.214395523071289, "global_step": 262956, "epoch": 1565} {"train_loss": -11.67839241027832, "global_step": 262957, "epoch": 1565} {"train_loss": -11.648153305053711, "global_step": 262958, "epoch": 1565} {"train_loss": -11.733221054077148, "global_step": 262959, "epoch": 1565} {"train_loss": -11.663126945495605, "global_step": 262960, "epoch": 1565} {"train_loss": -11.489810943603516, "global_step": 262961, "epoch": 1565} {"train_loss": -11.737220764160156, "global_step": 262962, "epoch": 1565} {"train_loss": -11.61956787109375, "global_step": 262963, "epoch": 1565} {"train_loss": -11.52818489074707, "global_step": 262964, "epoch": 1565} {"train_loss": -11.677877426147461, "global_step": 262965, "epoch": 1565} {"train_loss": -11.933050155639648, "global_step": 262966, "epoch": 1565} {"train_loss": -11.7188720703125, "global_step": 262967, "epoch": 1565} {"train_loss": -11.65330696105957, "global_step": 262968, "epoch": 1565} {"train_loss": -11.836028099060059, "global_step": 262969, "epoch": 1565} {"train_loss": -11.727069854736328, "global_step": 262970, "epoch": 1565} {"train_loss": -11.838786125183105, "global_step": 262971, "epoch": 1565} {"train_loss": -11.779370307922363, "global_step": 262972, "epoch": 1565} {"train_loss": -11.789811134338379, "global_step": 262973, "epoch": 1565} {"train_loss": -11.85708236694336, "global_step": 262974, "epoch": 1565} {"train_loss": -11.636959075927734, "global_step": 262975, "epoch": 1565} {"train_loss": -11.637916564941406, "global_step": 262976, "epoch": 1565} {"train_loss": -11.707670211791992, "global_step": 262977, "epoch": 1565} {"train_loss": -11.443279266357422, "global_step": 262978, "epoch": 1565} {"train_loss": -11.78622817993164, "global_step": 262979, "epoch": 1565} {"train_loss": -11.770285606384277, "global_step": 262980, "epoch": 1565} {"train_loss": -11.834484100341797, "global_step": 262981, "epoch": 1565} {"train_loss": -11.749296188354492, "global_step": 262982, "epoch": 1565} {"train_loss": -11.945516586303711, "global_step": 262983, "epoch": 1565} {"train_loss": -11.708531379699707, "global_step": 262984, "epoch": 1565} {"train_loss": -11.829387664794922, "global_step": 262985, "epoch": 1565} {"train_loss": -11.687934875488281, "global_step": 262986, "epoch": 1565} {"train_loss": -11.619695663452148, "global_step": 262987, "epoch": 1565} {"train_loss": -11.83576774597168, "global_step": 262988, "epoch": 1565} {"train_loss": -11.94285774230957, "global_step": 262989, "epoch": 1565} {"train_loss": -12.144050598144531, "global_step": 262990, "epoch": 1565} {"train_loss": -11.684890747070312, "global_step": 262991, "epoch": 1565} {"train_loss": -11.95221996307373, "global_step": 262992, "epoch": 1565} {"train_loss": -12.0259428024292, "global_step": 262993, "epoch": 1565} {"train_loss": -11.728754043579102, "global_step": 262994, "epoch": 1565} {"train_loss": -11.77412223815918, "global_step": 262995, "epoch": 1565} {"train_loss": -12.002878189086914, "global_step": 262996, "epoch": 1565} {"train_loss": -11.472116470336914, "global_step": 262997, "epoch": 1565} {"train_loss": -12.101040840148926, "global_step": 262998, "epoch": 1565} {"train_loss": -11.930234909057617, "global_step": 262999, "epoch": 1565} {"train_loss": -11.975632667541504, "global_step": 263000, "epoch": 1565} {"train_loss": -11.580730438232422, "global_step": 263001, "epoch": 1565} {"train_loss": -11.866070747375488, "global_step": 263002, "epoch": 1565} {"train_loss": -11.716464042663574, "global_step": 263003, "epoch": 1565} {"train_loss": -12.069287300109863, "global_step": 263004, "epoch": 1565} {"train_loss": -11.922676086425781, "global_step": 263005, "epoch": 1565} {"train_loss": -11.863142013549805, "global_step": 263006, "epoch": 1565} {"train_loss": -12.162485122680664, "global_step": 263007, "epoch": 1565} {"train_loss": -11.956247329711914, "global_step": 263008, "epoch": 1565} {"train_loss": -11.918079376220703, "global_step": 263009, "epoch": 1565} {"train_loss": -11.871566772460938, "global_step": 263010, "epoch": 1565} {"train_loss": -11.677721977233887, "global_step": 263011, "epoch": 1565} {"train_loss": -10.597428321838379, "global_step": 263012, "epoch": 1565} {"train_loss": -10.392067909240723, "global_step": 263013, "epoch": 1565} {"train_loss": -10.65842056274414, "global_step": 263014, "epoch": 1565} {"train_loss": -10.774620056152344, "global_step": 263015, "epoch": 1565} {"train_loss": -11.762723922729492, "global_step": 263016, "epoch": 1565} {"train_loss": -10.899663925170898, "global_step": 263017, "epoch": 1565} {"train_loss": -11.928651809692383, "global_step": 263018, "epoch": 1565} {"train_loss": -11.098052024841309, "global_step": 263019, "epoch": 1565} {"train_loss": -11.468671798706055, "global_step": 263020, "epoch": 1565} {"train_loss": -11.850676536560059, "global_step": 263021, "epoch": 1565} {"train_loss": -11.515434265136719, "global_step": 263022, "epoch": 1565} {"train_loss": -11.948042869567871, "global_step": 263023, "epoch": 1565} {"train_loss": -11.007457733154297, "global_step": 263024, "epoch": 1565} {"train_loss": -11.982597351074219, "global_step": 263025, "epoch": 1565} {"train_loss": -11.457958221435547, "global_step": 263026, "epoch": 1565} {"train_loss": -11.681222915649414, "global_step": 263027, "epoch": 1565} {"train_loss": -11.436943054199219, "global_step": 263028, "epoch": 1565} {"train_loss": -11.42306900024414, "global_step": 263029, "epoch": 1565} {"train_loss": -11.663166046142578, "global_step": 263030, "epoch": 1565} {"train_loss": -11.706182479858398, "global_step": 263031, "epoch": 1565} {"train_loss": -11.899711608886719, "global_step": 263032, "epoch": 1565} {"train_loss": -11.737957000732422, "global_step": 263033, "epoch": 1565} {"train_loss": -11.81408977508545, "global_step": 263034, "epoch": 1565} {"train_loss": -11.924339294433594, "global_step": 263035, "epoch": 1565} {"train_loss": -11.918338775634766, "global_step": 263036, "epoch": 1565} {"train_loss": -11.871195793151855, "global_step": 263037, "epoch": 1565} {"train_loss": -11.684314727783203, "global_step": 263038, "epoch": 1565} {"train_loss": -11.885769844055176, "global_step": 263039, "epoch": 1565} {"train_loss": -11.733774185180664, "global_step": 263040, "epoch": 1565} {"train_loss": -12.145917892456055, "global_step": 263041, "epoch": 1565} {"train_loss": -11.777922630310059, "global_step": 263042, "epoch": 1565} {"train_loss": -11.881889343261719, "global_step": 263043, "epoch": 1565} {"train_loss": -11.941665649414062, "global_step": 263044, "epoch": 1565} {"train_loss": -11.917184829711914, "global_step": 263045, "epoch": 1565} {"train_loss": -11.93840217590332, "global_step": 263046, "epoch": 1565} {"train_loss": -11.677404403686523, "global_step": 263047, "epoch": 1565} {"train_loss": -12.167484283447266, "global_step": 263048, "epoch": 1565} {"train_loss": -11.57476806640625, "global_step": 263049, "epoch": 1565} {"train_loss": -12.130084991455078, "global_step": 263050, "epoch": 1565} {"train_loss": -11.921062469482422, "global_step": 263051, "epoch": 1565} {"train_loss": -11.925086975097656, "global_step": 263052, "epoch": 1565} {"train_loss": -11.88743782043457, "global_step": 263053, "epoch": 1565} {"train_loss": -11.933149337768555, "global_step": 263054, "epoch": 1565} {"train_loss": -11.919036865234375, "global_step": 263055, "epoch": 1565} {"train_loss": -12.01560115814209, "global_step": 263056, "epoch": 1565} {"train_loss": -12.187840461730957, "global_step": 263057, "epoch": 1565} {"train_loss": -12.024774551391602, "global_step": 263058, "epoch": 1565} {"train_loss": -12.208227157592773, "global_step": 263059, "epoch": 1565} {"train_loss": -12.07054328918457, "global_step": 263060, "epoch": 1565} {"train_loss": -12.25296688079834, "global_step": 263061, "epoch": 1565} {"train_loss": -12.248990058898926, "global_step": 263062, "epoch": 1565} {"train_loss": -12.080808639526367, "global_step": 263063, "epoch": 1565} {"train_loss": -12.162172317504883, "global_step": 263064, "epoch": 1565} {"train_loss": -12.289498329162598, "global_step": 263065, "epoch": 1565} {"train_loss": -12.085874557495117, "global_step": 263066, "epoch": 1565} {"train_loss": -12.234498977661133, "global_step": 263067, "epoch": 1565} {"train_loss": -11.796813011169434, "global_step": 263068, "epoch": 1565} {"train_loss": -11.721389770507812, "global_step": 263069, "epoch": 1565} {"train_loss": -12.071812629699707, "global_step": 263070, "epoch": 1565} {"train_loss": -11.764013290405273, "global_step": 263071, "epoch": 1565} {"train_loss": -12.037233352661133, "global_step": 263072, "epoch": 1565} {"train_loss": -11.894375801086426, "global_step": 263073, "epoch": 1565} {"train_loss": -11.957405090332031, "global_step": 263074, "epoch": 1565} {"train_loss": -12.280123710632324, "global_step": 263075, "epoch": 1565} {"train_loss": -11.948456764221191, "global_step": 263076, "epoch": 1565} {"train_loss": -11.935951232910156, "global_step": 263077, "epoch": 1565} {"train_loss": -11.941254615783691, "global_step": 263078, "epoch": 1565} {"train_loss": -12.235196113586426, "global_step": 263079, "epoch": 1565} {"train_loss": -12.283773422241211, "global_step": 263080, "epoch": 1565} {"train_loss": -12.346413612365723, "global_step": 263081, "epoch": 1565} {"train_loss": -12.04818344116211, "global_step": 263082, "epoch": 1565} {"train_loss": -11.960878372192383, "global_step": 263083, "epoch": 1565} {"train_loss": -11.794421195983887, "global_step": 263084, "epoch": 1565} {"train_loss": -12.124103546142578, "global_step": 263085, "epoch": 1565} {"train_loss": -11.797664642333984, "global_step": 263086, "epoch": 1565} {"train_loss": -11.606513443447295, "global_step": 263087, "epoch": 1565, "val_loss": 271515.59375, "train_action_mse_error": 4.657482624053955} {"train_loss": -12.06805419921875, "global_step": 263088, "epoch": 1566} {"train_loss": -11.757097244262695, "global_step": 263089, "epoch": 1566} {"train_loss": -11.739463806152344, "global_step": 263090, "epoch": 1566} {"train_loss": -12.011273384094238, "global_step": 263091, "epoch": 1566} {"train_loss": -11.827400207519531, "global_step": 263092, "epoch": 1566} {"train_loss": -11.943607330322266, "global_step": 263093, "epoch": 1566} {"train_loss": -11.015477180480957, "global_step": 263094, "epoch": 1566} {"train_loss": -10.657122611999512, "global_step": 263095, "epoch": 1566} {"train_loss": -11.572208404541016, "global_step": 263096, "epoch": 1566} {"train_loss": -10.050042152404785, "global_step": 263097, "epoch": 1566} {"train_loss": -10.756589889526367, "global_step": 263098, "epoch": 1566} {"train_loss": -11.102920532226562, "global_step": 263099, "epoch": 1566} {"train_loss": -10.481842041015625, "global_step": 263100, "epoch": 1566} {"train_loss": -9.54446029663086, "global_step": 263101, "epoch": 1566} {"train_loss": -10.742486953735352, "global_step": 263102, "epoch": 1566} {"train_loss": -10.835286140441895, "global_step": 263103, "epoch": 1566} {"train_loss": -9.730024337768555, "global_step": 263104, "epoch": 1566} {"train_loss": -10.469528198242188, "global_step": 263105, "epoch": 1566} {"train_loss": -10.874250411987305, "global_step": 263106, "epoch": 1566} {"train_loss": -9.351823806762695, "global_step": 263107, "epoch": 1566} {"train_loss": -10.247781753540039, "global_step": 263108, "epoch": 1566} {"train_loss": -10.84463119506836, "global_step": 263109, "epoch": 1566} {"train_loss": -10.324737548828125, "global_step": 263110, "epoch": 1566} {"train_loss": -10.299430847167969, "global_step": 263111, "epoch": 1566} {"train_loss": -9.064253807067871, "global_step": 263112, "epoch": 1566} {"train_loss": -10.3761568069458, "global_step": 263113, "epoch": 1566} {"train_loss": -10.389886856079102, "global_step": 263114, "epoch": 1566} {"train_loss": -9.649781227111816, "global_step": 263115, "epoch": 1566} {"train_loss": -10.818755149841309, "global_step": 263116, "epoch": 1566} {"train_loss": -10.36240291595459, "global_step": 263117, "epoch": 1566} {"train_loss": -9.287201881408691, "global_step": 263118, "epoch": 1566} {"train_loss": -10.78104019165039, "global_step": 263119, "epoch": 1566} {"train_loss": -9.956790924072266, "global_step": 263120, "epoch": 1566} {"train_loss": -9.140388488769531, "global_step": 263121, "epoch": 1566} {"train_loss": -10.75885009765625, "global_step": 263122, "epoch": 1566} {"train_loss": -10.233955383300781, "global_step": 263123, "epoch": 1566} {"train_loss": -10.357902526855469, "global_step": 263124, "epoch": 1566} {"train_loss": -11.166056632995605, "global_step": 263125, "epoch": 1566} {"train_loss": -10.295363426208496, "global_step": 263126, "epoch": 1566} {"train_loss": -10.988210678100586, "global_step": 263127, "epoch": 1566} {"train_loss": -10.582125663757324, "global_step": 263128, "epoch": 1566} {"train_loss": -11.06403923034668, "global_step": 263129, "epoch": 1566} {"train_loss": -10.94784927368164, "global_step": 263130, "epoch": 1566} {"train_loss": -11.1763277053833, "global_step": 263131, "epoch": 1566} {"train_loss": -11.350168228149414, "global_step": 263132, "epoch": 1566} {"train_loss": -11.359848976135254, "global_step": 263133, "epoch": 1566} {"train_loss": -11.148611068725586, "global_step": 263134, "epoch": 1566} {"train_loss": -11.621399879455566, "global_step": 263135, "epoch": 1566} {"train_loss": -11.482210159301758, "global_step": 263136, "epoch": 1566} {"train_loss": -11.440725326538086, "global_step": 263137, "epoch": 1566} {"train_loss": -11.561665534973145, "global_step": 263138, "epoch": 1566} {"train_loss": -11.520879745483398, "global_step": 263139, "epoch": 1566} {"train_loss": -11.58896255493164, "global_step": 263140, "epoch": 1566} {"train_loss": -11.725420951843262, "global_step": 263141, "epoch": 1566} {"train_loss": -11.452951431274414, "global_step": 263142, "epoch": 1566} {"train_loss": -11.689718246459961, "global_step": 263143, "epoch": 1566} {"train_loss": -11.767001152038574, "global_step": 263144, "epoch": 1566} {"train_loss": -11.76225471496582, "global_step": 263145, "epoch": 1566} {"train_loss": -11.68136215209961, "global_step": 263146, "epoch": 1566} {"train_loss": -11.76253890991211, "global_step": 263147, "epoch": 1566} {"train_loss": -11.719345092773438, "global_step": 263148, "epoch": 1566} {"train_loss": -11.728008270263672, "global_step": 263149, "epoch": 1566} {"train_loss": -11.819742202758789, "global_step": 263150, "epoch": 1566} {"train_loss": -11.813613891601562, "global_step": 263151, "epoch": 1566} {"train_loss": -11.865882873535156, "global_step": 263152, "epoch": 1566} {"train_loss": -11.83285903930664, "global_step": 263153, "epoch": 1566} {"train_loss": -11.745682716369629, "global_step": 263154, "epoch": 1566} {"train_loss": -11.637187004089355, "global_step": 263155, "epoch": 1566} {"train_loss": -11.597257614135742, "global_step": 263156, "epoch": 1566} {"train_loss": -11.978777885437012, "global_step": 263157, "epoch": 1566} {"train_loss": -11.48139476776123, "global_step": 263158, "epoch": 1566} {"train_loss": -11.711727142333984, "global_step": 263159, "epoch": 1566} {"train_loss": -11.752351760864258, "global_step": 263160, "epoch": 1566} {"train_loss": -11.702710151672363, "global_step": 263161, "epoch": 1566} {"train_loss": -11.896244049072266, "global_step": 263162, "epoch": 1566} {"train_loss": -11.78760814666748, "global_step": 263163, "epoch": 1566} {"train_loss": -11.747243881225586, "global_step": 263164, "epoch": 1566} {"train_loss": -11.937893867492676, "global_step": 263165, "epoch": 1566} {"train_loss": -11.938279151916504, "global_step": 263166, "epoch": 1566} {"train_loss": -12.0203218460083, "global_step": 263167, "epoch": 1566} {"train_loss": -11.637273788452148, "global_step": 263168, "epoch": 1566} {"train_loss": -12.049629211425781, "global_step": 263169, "epoch": 1566} {"train_loss": -11.518350601196289, "global_step": 263170, "epoch": 1566} {"train_loss": -12.105180740356445, "global_step": 263171, "epoch": 1566} {"train_loss": -11.623306274414062, "global_step": 263172, "epoch": 1566} {"train_loss": -12.171014785766602, "global_step": 263173, "epoch": 1566} {"train_loss": -11.779540061950684, "global_step": 263174, "epoch": 1566} {"train_loss": -12.152542114257812, "global_step": 263175, "epoch": 1566} {"train_loss": -12.06380844116211, "global_step": 263176, "epoch": 1566} {"train_loss": -12.160149574279785, "global_step": 263177, "epoch": 1566} {"train_loss": -11.993707656860352, "global_step": 263178, "epoch": 1566} {"train_loss": -12.054357528686523, "global_step": 263179, "epoch": 1566} {"train_loss": -11.742500305175781, "global_step": 263180, "epoch": 1566} {"train_loss": -12.245668411254883, "global_step": 263181, "epoch": 1566} {"train_loss": -12.177066802978516, "global_step": 263182, "epoch": 1566} {"train_loss": -12.002876281738281, "global_step": 263183, "epoch": 1566} {"train_loss": -12.17643928527832, "global_step": 263184, "epoch": 1566} {"train_loss": -11.996625900268555, "global_step": 263185, "epoch": 1566} {"train_loss": -12.183067321777344, "global_step": 263186, "epoch": 1566} {"train_loss": -12.241392135620117, "global_step": 263187, "epoch": 1566} {"train_loss": -12.049032211303711, "global_step": 263188, "epoch": 1566} {"train_loss": -12.219512939453125, "global_step": 263189, "epoch": 1566} {"train_loss": -12.094178199768066, "global_step": 263190, "epoch": 1566} {"train_loss": -12.116945266723633, "global_step": 263191, "epoch": 1566} {"train_loss": -12.144792556762695, "global_step": 263192, "epoch": 1566} {"train_loss": -12.059738159179688, "global_step": 263193, "epoch": 1566} {"train_loss": -12.311899185180664, "global_step": 263194, "epoch": 1566} {"train_loss": -12.0753812789917, "global_step": 263195, "epoch": 1566} {"train_loss": -12.25798225402832, "global_step": 263196, "epoch": 1566} {"train_loss": -12.236553192138672, "global_step": 263197, "epoch": 1566} {"train_loss": -12.319039344787598, "global_step": 263198, "epoch": 1566} {"train_loss": -12.171643257141113, "global_step": 263199, "epoch": 1566} {"train_loss": -12.099599838256836, "global_step": 263200, "epoch": 1566} {"train_loss": -12.344667434692383, "global_step": 263201, "epoch": 1566} {"train_loss": -12.269979476928711, "global_step": 263202, "epoch": 1566} {"train_loss": -12.293027877807617, "global_step": 263203, "epoch": 1566} {"train_loss": -12.256248474121094, "global_step": 263204, "epoch": 1566} {"train_loss": -12.393877029418945, "global_step": 263205, "epoch": 1566} {"train_loss": -12.263715744018555, "global_step": 263206, "epoch": 1566} {"train_loss": -12.341109275817871, "global_step": 263207, "epoch": 1566} {"train_loss": -12.036760330200195, "global_step": 263208, "epoch": 1566} {"train_loss": -12.382177352905273, "global_step": 263209, "epoch": 1566} {"train_loss": -12.247284889221191, "global_step": 263210, "epoch": 1566} {"train_loss": -12.35362720489502, "global_step": 263211, "epoch": 1566} {"train_loss": -12.355119705200195, "global_step": 263212, "epoch": 1566} {"train_loss": -12.227884292602539, "global_step": 263213, "epoch": 1566} {"train_loss": -12.474546432495117, "global_step": 263214, "epoch": 1566} {"train_loss": -12.35406494140625, "global_step": 263215, "epoch": 1566} {"train_loss": -12.459344863891602, "global_step": 263216, "epoch": 1566} {"train_loss": -12.210044860839844, "global_step": 263217, "epoch": 1566} {"train_loss": -12.481473922729492, "global_step": 263218, "epoch": 1566} {"train_loss": -12.393767356872559, "global_step": 263219, "epoch": 1566} {"train_loss": -12.25320053100586, "global_step": 263220, "epoch": 1566} {"train_loss": -12.219684600830078, "global_step": 263221, "epoch": 1566} {"train_loss": -12.118781089782715, "global_step": 263222, "epoch": 1566} {"train_loss": -11.815726280212402, "global_step": 263223, "epoch": 1566} {"train_loss": -10.621583938598633, "global_step": 263224, "epoch": 1566} {"train_loss": -10.496752738952637, "global_step": 263225, "epoch": 1566} {"train_loss": -11.83971118927002, "global_step": 263226, "epoch": 1566} {"train_loss": -9.299747467041016, "global_step": 263227, "epoch": 1566} {"train_loss": -9.766565322875977, "global_step": 263228, "epoch": 1566} {"train_loss": -11.191359519958496, "global_step": 263229, "epoch": 1566} {"train_loss": -7.916259765625, "global_step": 263230, "epoch": 1566} {"train_loss": -9.551630973815918, "global_step": 263231, "epoch": 1566} {"train_loss": -11.59013843536377, "global_step": 263232, "epoch": 1566} {"train_loss": -9.887325286865234, "global_step": 263233, "epoch": 1566} {"train_loss": -11.180597305297852, "global_step": 263234, "epoch": 1566} {"train_loss": -10.044783592224121, "global_step": 263235, "epoch": 1566} {"train_loss": -10.167390823364258, "global_step": 263236, "epoch": 1566} {"train_loss": -11.121089935302734, "global_step": 263237, "epoch": 1566} {"train_loss": -9.984733581542969, "global_step": 263238, "epoch": 1566} {"train_loss": -11.426142692565918, "global_step": 263239, "epoch": 1566} {"train_loss": -11.35189151763916, "global_step": 263240, "epoch": 1566} {"train_loss": -11.164210319519043, "global_step": 263241, "epoch": 1566} {"train_loss": -11.079094886779785, "global_step": 263242, "epoch": 1566} {"train_loss": -10.797687530517578, "global_step": 263243, "epoch": 1566} {"train_loss": -11.613375663757324, "global_step": 263244, "epoch": 1566} {"train_loss": -10.963432312011719, "global_step": 263245, "epoch": 1566} {"train_loss": -10.921722412109375, "global_step": 263246, "epoch": 1566} {"train_loss": -11.759344100952148, "global_step": 263247, "epoch": 1566} {"train_loss": -11.096277236938477, "global_step": 263248, "epoch": 1566} {"train_loss": -11.17223834991455, "global_step": 263249, "epoch": 1566} {"train_loss": -11.580942153930664, "global_step": 263250, "epoch": 1566} {"train_loss": -10.477169036865234, "global_step": 263251, "epoch": 1566} {"train_loss": -11.682403564453125, "global_step": 263252, "epoch": 1566} {"train_loss": -9.857593536376953, "global_step": 263253, "epoch": 1566} {"train_loss": -11.032003402709961, "global_step": 263254, "epoch": 1566} {"train_loss": -11.385882644426255, "global_step": 263255, "epoch": 1566, "val_loss": 256939.1875} {"train_loss": -11.230220794677734, "global_step": 263256, "epoch": 1567} {"train_loss": -11.667945861816406, "global_step": 263257, "epoch": 1567} {"train_loss": -11.272662162780762, "global_step": 263258, "epoch": 1567} {"train_loss": -11.717620849609375, "global_step": 263259, "epoch": 1567} {"train_loss": -11.163431167602539, "global_step": 263260, "epoch": 1567} {"train_loss": -11.667795181274414, "global_step": 263261, "epoch": 1567} {"train_loss": -11.426321029663086, "global_step": 263262, "epoch": 1567} {"train_loss": -11.438873291015625, "global_step": 263263, "epoch": 1567} {"train_loss": -11.17249870300293, "global_step": 263264, "epoch": 1567} {"train_loss": -11.206622123718262, "global_step": 263265, "epoch": 1567} {"train_loss": -11.244916915893555, "global_step": 263266, "epoch": 1567} {"train_loss": -11.475139617919922, "global_step": 263267, "epoch": 1567} {"train_loss": -11.386622428894043, "global_step": 263268, "epoch": 1567} {"train_loss": -11.447391510009766, "global_step": 263269, "epoch": 1567} {"train_loss": -11.63064193725586, "global_step": 263270, "epoch": 1567} {"train_loss": -11.474864959716797, "global_step": 263271, "epoch": 1567} {"train_loss": -11.420740127563477, "global_step": 263272, "epoch": 1567} {"train_loss": -11.58888053894043, "global_step": 263273, "epoch": 1567} {"train_loss": -11.420589447021484, "global_step": 263274, "epoch": 1567} {"train_loss": -11.871705055236816, "global_step": 263275, "epoch": 1567} {"train_loss": -11.729623794555664, "global_step": 263276, "epoch": 1567} {"train_loss": -11.52026653289795, "global_step": 263277, "epoch": 1567} {"train_loss": -11.831140518188477, "global_step": 263278, "epoch": 1567} {"train_loss": -11.747241020202637, "global_step": 263279, "epoch": 1567} {"train_loss": -11.39373779296875, "global_step": 263280, "epoch": 1567} {"train_loss": -11.896968841552734, "global_step": 263281, "epoch": 1567} {"train_loss": -11.658199310302734, "global_step": 263282, "epoch": 1567} {"train_loss": -11.824755668640137, "global_step": 263283, "epoch": 1567} {"train_loss": -11.900711059570312, "global_step": 263284, "epoch": 1567} {"train_loss": -11.751205444335938, "global_step": 263285, "epoch": 1567} {"train_loss": -11.944086074829102, "global_step": 263286, "epoch": 1567} {"train_loss": -11.881571769714355, "global_step": 263287, "epoch": 1567} {"train_loss": -11.92379379272461, "global_step": 263288, "epoch": 1567} {"train_loss": -11.948016166687012, "global_step": 263289, "epoch": 1567} {"train_loss": -11.973685264587402, "global_step": 263290, "epoch": 1567} {"train_loss": -12.030254364013672, "global_step": 263291, "epoch": 1567} {"train_loss": -11.831558227539062, "global_step": 263292, "epoch": 1567} {"train_loss": -12.045526504516602, "global_step": 263293, "epoch": 1567} {"train_loss": -12.19591236114502, "global_step": 263294, "epoch": 1567} {"train_loss": -11.981106758117676, "global_step": 263295, "epoch": 1567} {"train_loss": -12.102361679077148, "global_step": 263296, "epoch": 1567} {"train_loss": -12.068342208862305, "global_step": 263297, "epoch": 1567} {"train_loss": -11.754511833190918, "global_step": 263298, "epoch": 1567} {"train_loss": -11.898759841918945, "global_step": 263299, "epoch": 1567} {"train_loss": -11.902654647827148, "global_step": 263300, "epoch": 1567} {"train_loss": -11.464739799499512, "global_step": 263301, "epoch": 1567} {"train_loss": -11.820499420166016, "global_step": 263302, "epoch": 1567} {"train_loss": -11.688827514648438, "global_step": 263303, "epoch": 1567} {"train_loss": -11.416411399841309, "global_step": 263304, "epoch": 1567} {"train_loss": -11.815059661865234, "global_step": 263305, "epoch": 1567} {"train_loss": -12.1541748046875, "global_step": 263306, "epoch": 1567} {"train_loss": -11.644173622131348, "global_step": 263307, "epoch": 1567} {"train_loss": -12.019638061523438, "global_step": 263308, "epoch": 1567} {"train_loss": -11.874141693115234, "global_step": 263309, "epoch": 1567} {"train_loss": -11.477861404418945, "global_step": 263310, "epoch": 1567} {"train_loss": -11.854072570800781, "global_step": 263311, "epoch": 1567} {"train_loss": -11.992757797241211, "global_step": 263312, "epoch": 1567} {"train_loss": -11.93255615234375, "global_step": 263313, "epoch": 1567} {"train_loss": -11.963676452636719, "global_step": 263314, "epoch": 1567} {"train_loss": -11.873944282531738, "global_step": 263315, "epoch": 1567} {"train_loss": -11.936037063598633, "global_step": 263316, "epoch": 1567} {"train_loss": -12.027463912963867, "global_step": 263317, "epoch": 1567} {"train_loss": -12.037665367126465, "global_step": 263318, "epoch": 1567} {"train_loss": -11.935027122497559, "global_step": 263319, "epoch": 1567} {"train_loss": -11.980224609375, "global_step": 263320, "epoch": 1567} {"train_loss": -12.068049430847168, "global_step": 263321, "epoch": 1567} {"train_loss": -12.247688293457031, "global_step": 263322, "epoch": 1567} {"train_loss": -12.079423904418945, "global_step": 263323, "epoch": 1567} {"train_loss": -12.255125045776367, "global_step": 263324, "epoch": 1567} {"train_loss": -11.962278366088867, "global_step": 263325, "epoch": 1567} {"train_loss": -11.779422760009766, "global_step": 263326, "epoch": 1567} {"train_loss": -11.956034660339355, "global_step": 263327, "epoch": 1567} {"train_loss": -11.726836204528809, "global_step": 263328, "epoch": 1567} {"train_loss": -12.059585571289062, "global_step": 263329, "epoch": 1567} {"train_loss": -11.950637817382812, "global_step": 263330, "epoch": 1567} {"train_loss": -11.795482635498047, "global_step": 263331, "epoch": 1567} {"train_loss": -11.893857955932617, "global_step": 263332, "epoch": 1567} {"train_loss": -11.495757102966309, "global_step": 263333, "epoch": 1567} {"train_loss": -12.080656051635742, "global_step": 263334, "epoch": 1567} {"train_loss": -11.386632919311523, "global_step": 263335, "epoch": 1567} {"train_loss": -12.01887035369873, "global_step": 263336, "epoch": 1567} {"train_loss": -11.785325050354004, "global_step": 263337, "epoch": 1567} {"train_loss": -10.861677169799805, "global_step": 263338, "epoch": 1567} {"train_loss": -11.863105773925781, "global_step": 263339, "epoch": 1567} {"train_loss": -11.646987915039062, "global_step": 263340, "epoch": 1567} {"train_loss": -11.49073600769043, "global_step": 263341, "epoch": 1567} {"train_loss": -12.026067733764648, "global_step": 263342, "epoch": 1567} {"train_loss": -11.135509490966797, "global_step": 263343, "epoch": 1567} {"train_loss": -11.600339889526367, "global_step": 263344, "epoch": 1567} {"train_loss": -11.110818862915039, "global_step": 263345, "epoch": 1567} {"train_loss": -11.434386253356934, "global_step": 263346, "epoch": 1567} {"train_loss": -11.925459861755371, "global_step": 263347, "epoch": 1567} {"train_loss": -11.547801971435547, "global_step": 263348, "epoch": 1567} {"train_loss": -12.029098510742188, "global_step": 263349, "epoch": 1567} {"train_loss": -11.318607330322266, "global_step": 263350, "epoch": 1567} {"train_loss": -11.538555145263672, "global_step": 263351, "epoch": 1567} {"train_loss": -11.778789520263672, "global_step": 263352, "epoch": 1567} {"train_loss": -11.803237915039062, "global_step": 263353, "epoch": 1567} {"train_loss": -10.469438552856445, "global_step": 263354, "epoch": 1567} {"train_loss": -11.117605209350586, "global_step": 263355, "epoch": 1567} {"train_loss": -10.93821907043457, "global_step": 263356, "epoch": 1567} {"train_loss": -11.691699981689453, "global_step": 263357, "epoch": 1567} {"train_loss": -10.621988296508789, "global_step": 263358, "epoch": 1567} {"train_loss": -11.60739517211914, "global_step": 263359, "epoch": 1567} {"train_loss": -11.171422004699707, "global_step": 263360, "epoch": 1567} {"train_loss": -11.122570037841797, "global_step": 263361, "epoch": 1567} {"train_loss": -11.404661178588867, "global_step": 263362, "epoch": 1567} {"train_loss": -11.252405166625977, "global_step": 263363, "epoch": 1567} {"train_loss": -11.401874542236328, "global_step": 263364, "epoch": 1567} {"train_loss": -10.869855880737305, "global_step": 263365, "epoch": 1567} {"train_loss": -11.248598098754883, "global_step": 263366, "epoch": 1567} {"train_loss": -11.1242036819458, "global_step": 263367, "epoch": 1567} {"train_loss": -11.10777473449707, "global_step": 263368, "epoch": 1567} {"train_loss": -11.800302505493164, "global_step": 263369, "epoch": 1567} {"train_loss": -11.268457412719727, "global_step": 263370, "epoch": 1567} {"train_loss": -11.195209503173828, "global_step": 263371, "epoch": 1567} {"train_loss": -10.128787994384766, "global_step": 263372, "epoch": 1567} {"train_loss": -11.065807342529297, "global_step": 263373, "epoch": 1567} {"train_loss": -9.8388671875, "global_step": 263374, "epoch": 1567} {"train_loss": -9.778142929077148, "global_step": 263375, "epoch": 1567} {"train_loss": -10.785043716430664, "global_step": 263376, "epoch": 1567} {"train_loss": -10.429994583129883, "global_step": 263377, "epoch": 1567} {"train_loss": -10.316349029541016, "global_step": 263378, "epoch": 1567} {"train_loss": -10.243650436401367, "global_step": 263379, "epoch": 1567} {"train_loss": -10.635553359985352, "global_step": 263380, "epoch": 1567} {"train_loss": -10.504022598266602, "global_step": 263381, "epoch": 1567} {"train_loss": -10.810894012451172, "global_step": 263382, "epoch": 1567} {"train_loss": -10.794525146484375, "global_step": 263383, "epoch": 1567} {"train_loss": -10.814384460449219, "global_step": 263384, "epoch": 1567} {"train_loss": -11.242561340332031, "global_step": 263385, "epoch": 1567} {"train_loss": -10.33565902709961, "global_step": 263386, "epoch": 1567} {"train_loss": -11.480079650878906, "global_step": 263387, "epoch": 1567} {"train_loss": -11.174373626708984, "global_step": 263388, "epoch": 1567} {"train_loss": -10.730171203613281, "global_step": 263389, "epoch": 1567} {"train_loss": -11.226151466369629, "global_step": 263390, "epoch": 1567} {"train_loss": -11.353533744812012, "global_step": 263391, "epoch": 1567} {"train_loss": -11.028332710266113, "global_step": 263392, "epoch": 1567} {"train_loss": -11.313226699829102, "global_step": 263393, "epoch": 1567} {"train_loss": -11.572622299194336, "global_step": 263394, "epoch": 1567} {"train_loss": -11.137852668762207, "global_step": 263395, "epoch": 1567} {"train_loss": -11.497469902038574, "global_step": 263396, "epoch": 1567} {"train_loss": -11.563066482543945, "global_step": 263397, "epoch": 1567} {"train_loss": -11.420858383178711, "global_step": 263398, "epoch": 1567} {"train_loss": -11.667938232421875, "global_step": 263399, "epoch": 1567} {"train_loss": -11.94625473022461, "global_step": 263400, "epoch": 1567} {"train_loss": -11.640575408935547, "global_step": 263401, "epoch": 1567} {"train_loss": -11.657658576965332, "global_step": 263402, "epoch": 1567} {"train_loss": -11.827505111694336, "global_step": 263403, "epoch": 1567} {"train_loss": -11.548608779907227, "global_step": 263404, "epoch": 1567} {"train_loss": -11.33056926727295, "global_step": 263405, "epoch": 1567} {"train_loss": -11.748323440551758, "global_step": 263406, "epoch": 1567} {"train_loss": -11.684280395507812, "global_step": 263407, "epoch": 1567} {"train_loss": -11.608478546142578, "global_step": 263408, "epoch": 1567} {"train_loss": -12.036896705627441, "global_step": 263409, "epoch": 1567} {"train_loss": -11.680073738098145, "global_step": 263410, "epoch": 1567} {"train_loss": -11.389827728271484, "global_step": 263411, "epoch": 1567} {"train_loss": -11.923323631286621, "global_step": 263412, "epoch": 1567} {"train_loss": -11.967923164367676, "global_step": 263413, "epoch": 1567} {"train_loss": -11.661966323852539, "global_step": 263414, "epoch": 1567} {"train_loss": -11.710619926452637, "global_step": 263415, "epoch": 1567} {"train_loss": -11.90317153930664, "global_step": 263416, "epoch": 1567} {"train_loss": -11.97778606414795, "global_step": 263417, "epoch": 1567} {"train_loss": -11.942066192626953, "global_step": 263418, "epoch": 1567} {"train_loss": -12.173259735107422, "global_step": 263419, "epoch": 1567} {"train_loss": -11.925861358642578, "global_step": 263420, "epoch": 1567} {"train_loss": -12.004133224487305, "global_step": 263421, "epoch": 1567} {"train_loss": -12.054582595825195, "global_step": 263422, "epoch": 1567} {"train_loss": -11.54591407094683, "global_step": 263423, "epoch": 1567, "val_loss": 265606.875} {"train_loss": -12.066890716552734, "global_step": 263424, "epoch": 1568} {"train_loss": -11.973787307739258, "global_step": 263425, "epoch": 1568} {"train_loss": -12.068443298339844, "global_step": 263426, "epoch": 1568} {"train_loss": -12.125235557556152, "global_step": 263427, "epoch": 1568} {"train_loss": -11.928674697875977, "global_step": 263428, "epoch": 1568} {"train_loss": -12.01832389831543, "global_step": 263429, "epoch": 1568} {"train_loss": -12.072187423706055, "global_step": 263430, "epoch": 1568} {"train_loss": -11.981599807739258, "global_step": 263431, "epoch": 1568} {"train_loss": -12.215357780456543, "global_step": 263432, "epoch": 1568} {"train_loss": -12.107161521911621, "global_step": 263433, "epoch": 1568} {"train_loss": -11.90726375579834, "global_step": 263434, "epoch": 1568} {"train_loss": -12.04366683959961, "global_step": 263435, "epoch": 1568} {"train_loss": -11.76732349395752, "global_step": 263436, "epoch": 1568} {"train_loss": -11.579378128051758, "global_step": 263437, "epoch": 1568} {"train_loss": -12.044109344482422, "global_step": 263438, "epoch": 1568} {"train_loss": -11.907541275024414, "global_step": 263439, "epoch": 1568} {"train_loss": -11.501932144165039, "global_step": 263440, "epoch": 1568} {"train_loss": -12.158798217773438, "global_step": 263441, "epoch": 1568} {"train_loss": -11.803176879882812, "global_step": 263442, "epoch": 1568} {"train_loss": -11.633417129516602, "global_step": 263443, "epoch": 1568} {"train_loss": -12.207829475402832, "global_step": 263444, "epoch": 1568} {"train_loss": -11.692188262939453, "global_step": 263445, "epoch": 1568} {"train_loss": -12.072275161743164, "global_step": 263446, "epoch": 1568} {"train_loss": -12.09310531616211, "global_step": 263447, "epoch": 1568} {"train_loss": -11.875375747680664, "global_step": 263448, "epoch": 1568} {"train_loss": -11.955609321594238, "global_step": 263449, "epoch": 1568} {"train_loss": -11.786646842956543, "global_step": 263450, "epoch": 1568} {"train_loss": -11.77586841583252, "global_step": 263451, "epoch": 1568} {"train_loss": -11.8502197265625, "global_step": 263452, "epoch": 1568} {"train_loss": -11.831727027893066, "global_step": 263453, "epoch": 1568} {"train_loss": -11.324074745178223, "global_step": 263454, "epoch": 1568} {"train_loss": -12.195919036865234, "global_step": 263455, "epoch": 1568} {"train_loss": -11.532002449035645, "global_step": 263456, "epoch": 1568} {"train_loss": -11.561702728271484, "global_step": 263457, "epoch": 1568} {"train_loss": -11.734477996826172, "global_step": 263458, "epoch": 1568} {"train_loss": -11.795833587646484, "global_step": 263459, "epoch": 1568} {"train_loss": -11.507781982421875, "global_step": 263460, "epoch": 1568} {"train_loss": -12.14529800415039, "global_step": 263461, "epoch": 1568} {"train_loss": -11.941156387329102, "global_step": 263462, "epoch": 1568} {"train_loss": -11.96008014678955, "global_step": 263463, "epoch": 1568} {"train_loss": -11.672042846679688, "global_step": 263464, "epoch": 1568} {"train_loss": -11.832437515258789, "global_step": 263465, "epoch": 1568} {"train_loss": -11.905717849731445, "global_step": 263466, "epoch": 1568} {"train_loss": -12.033621788024902, "global_step": 263467, "epoch": 1568} {"train_loss": -11.393506050109863, "global_step": 263468, "epoch": 1568} {"train_loss": -11.861059188842773, "global_step": 263469, "epoch": 1568} {"train_loss": -11.561729431152344, "global_step": 263470, "epoch": 1568} {"train_loss": -11.979662895202637, "global_step": 263471, "epoch": 1568} {"train_loss": -12.022810935974121, "global_step": 263472, "epoch": 1568} {"train_loss": -12.066166877746582, "global_step": 263473, "epoch": 1568} {"train_loss": -11.501925468444824, "global_step": 263474, "epoch": 1568} {"train_loss": -12.20816421508789, "global_step": 263475, "epoch": 1568} {"train_loss": -11.779953002929688, "global_step": 263476, "epoch": 1568} {"train_loss": -12.066744804382324, "global_step": 263477, "epoch": 1568} {"train_loss": -11.769298553466797, "global_step": 263478, "epoch": 1568} {"train_loss": -11.70283031463623, "global_step": 263479, "epoch": 1568} {"train_loss": -11.263071060180664, "global_step": 263480, "epoch": 1568} {"train_loss": -11.991969108581543, "global_step": 263481, "epoch": 1568} {"train_loss": -11.580297470092773, "global_step": 263482, "epoch": 1568} {"train_loss": -11.36384391784668, "global_step": 263483, "epoch": 1568} {"train_loss": -11.760420799255371, "global_step": 263484, "epoch": 1568} {"train_loss": -11.065786361694336, "global_step": 263485, "epoch": 1568} {"train_loss": -11.429089546203613, "global_step": 263486, "epoch": 1568} {"train_loss": -11.194647789001465, "global_step": 263487, "epoch": 1568} {"train_loss": -11.159421920776367, "global_step": 263488, "epoch": 1568} {"train_loss": -11.03805160522461, "global_step": 263489, "epoch": 1568} {"train_loss": -11.21358585357666, "global_step": 263490, "epoch": 1568} {"train_loss": -9.549871444702148, "global_step": 263491, "epoch": 1568} {"train_loss": -11.638827323913574, "global_step": 263492, "epoch": 1568} {"train_loss": -9.95313549041748, "global_step": 263493, "epoch": 1568} {"train_loss": -10.042760848999023, "global_step": 263494, "epoch": 1568} {"train_loss": -10.701370239257812, "global_step": 263495, "epoch": 1568} {"train_loss": -10.116849899291992, "global_step": 263496, "epoch": 1568} {"train_loss": -10.595848083496094, "global_step": 263497, "epoch": 1568} {"train_loss": -10.92588996887207, "global_step": 263498, "epoch": 1568} {"train_loss": -10.981012344360352, "global_step": 263499, "epoch": 1568} {"train_loss": -10.569770812988281, "global_step": 263500, "epoch": 1568} {"train_loss": -11.119073867797852, "global_step": 263501, "epoch": 1568} {"train_loss": -10.753890991210938, "global_step": 263502, "epoch": 1568} {"train_loss": -10.541593551635742, "global_step": 263503, "epoch": 1568} {"train_loss": -10.768706321716309, "global_step": 263504, "epoch": 1568} {"train_loss": -11.145647048950195, "global_step": 263505, "epoch": 1568} {"train_loss": -10.054912567138672, "global_step": 263506, "epoch": 1568} {"train_loss": -11.449603080749512, "global_step": 263507, "epoch": 1568} {"train_loss": -10.411922454833984, "global_step": 263508, "epoch": 1568} {"train_loss": -11.414894104003906, "global_step": 263509, "epoch": 1568} {"train_loss": -10.821573257446289, "global_step": 263510, "epoch": 1568} {"train_loss": -10.96423625946045, "global_step": 263511, "epoch": 1568} {"train_loss": -10.9634428024292, "global_step": 263512, "epoch": 1568} {"train_loss": -10.790119171142578, "global_step": 263513, "epoch": 1568} {"train_loss": -11.16654109954834, "global_step": 263514, "epoch": 1568} {"train_loss": -11.377582550048828, "global_step": 263515, "epoch": 1568} {"train_loss": -11.158939361572266, "global_step": 263516, "epoch": 1568} {"train_loss": -11.37855339050293, "global_step": 263517, "epoch": 1568} {"train_loss": -11.623477935791016, "global_step": 263518, "epoch": 1568} {"train_loss": -10.883848190307617, "global_step": 263519, "epoch": 1568} {"train_loss": -11.893418312072754, "global_step": 263520, "epoch": 1568} {"train_loss": -10.93582820892334, "global_step": 263521, "epoch": 1568} {"train_loss": -11.658451080322266, "global_step": 263522, "epoch": 1568} {"train_loss": -11.557644844055176, "global_step": 263523, "epoch": 1568} {"train_loss": -11.714648246765137, "global_step": 263524, "epoch": 1568} {"train_loss": -11.683554649353027, "global_step": 263525, "epoch": 1568} {"train_loss": -11.779690742492676, "global_step": 263526, "epoch": 1568} {"train_loss": -11.942774772644043, "global_step": 263527, "epoch": 1568} {"train_loss": -11.819055557250977, "global_step": 263528, "epoch": 1568} {"train_loss": -11.754961013793945, "global_step": 263529, "epoch": 1568} {"train_loss": -11.700957298278809, "global_step": 263530, "epoch": 1568} {"train_loss": -11.908613204956055, "global_step": 263531, "epoch": 1568} {"train_loss": -11.97154426574707, "global_step": 263532, "epoch": 1568} {"train_loss": -11.659354209899902, "global_step": 263533, "epoch": 1568} {"train_loss": -11.973163604736328, "global_step": 263534, "epoch": 1568} {"train_loss": -11.872529983520508, "global_step": 263535, "epoch": 1568} {"train_loss": -11.55729866027832, "global_step": 263536, "epoch": 1568} {"train_loss": -11.869935989379883, "global_step": 263537, "epoch": 1568} {"train_loss": -11.672037124633789, "global_step": 263538, "epoch": 1568} {"train_loss": -11.862245559692383, "global_step": 263539, "epoch": 1568} {"train_loss": -12.006540298461914, "global_step": 263540, "epoch": 1568} {"train_loss": -12.082144737243652, "global_step": 263541, "epoch": 1568} {"train_loss": -11.653615951538086, "global_step": 263542, "epoch": 1568} {"train_loss": -11.676643371582031, "global_step": 263543, "epoch": 1568} {"train_loss": -11.715417861938477, "global_step": 263544, "epoch": 1568} {"train_loss": -11.714069366455078, "global_step": 263545, "epoch": 1568} {"train_loss": -11.821574211120605, "global_step": 263546, "epoch": 1568} {"train_loss": -11.822206497192383, "global_step": 263547, "epoch": 1568} {"train_loss": -11.93526840209961, "global_step": 263548, "epoch": 1568} {"train_loss": -11.781837463378906, "global_step": 263549, "epoch": 1568} {"train_loss": -12.092081069946289, "global_step": 263550, "epoch": 1568} {"train_loss": -12.009888648986816, "global_step": 263551, "epoch": 1568} {"train_loss": -11.987184524536133, "global_step": 263552, "epoch": 1568} {"train_loss": -11.961650848388672, "global_step": 263553, "epoch": 1568} {"train_loss": -12.043500900268555, "global_step": 263554, "epoch": 1568} {"train_loss": -12.252601623535156, "global_step": 263555, "epoch": 1568} {"train_loss": -12.217245101928711, "global_step": 263556, "epoch": 1568} {"train_loss": -12.019123077392578, "global_step": 263557, "epoch": 1568} {"train_loss": -12.173660278320312, "global_step": 263558, "epoch": 1568} {"train_loss": -11.941179275512695, "global_step": 263559, "epoch": 1568} {"train_loss": -12.189066886901855, "global_step": 263560, "epoch": 1568} {"train_loss": -12.04493522644043, "global_step": 263561, "epoch": 1568} {"train_loss": -12.162214279174805, "global_step": 263562, "epoch": 1568} {"train_loss": -12.320565223693848, "global_step": 263563, "epoch": 1568} {"train_loss": -12.278451919555664, "global_step": 263564, "epoch": 1568} {"train_loss": -12.249427795410156, "global_step": 263565, "epoch": 1568} {"train_loss": -12.367389678955078, "global_step": 263566, "epoch": 1568} {"train_loss": -12.154207229614258, "global_step": 263567, "epoch": 1568} {"train_loss": -12.047975540161133, "global_step": 263568, "epoch": 1568} {"train_loss": -12.264005661010742, "global_step": 263569, "epoch": 1568} {"train_loss": -11.979413032531738, "global_step": 263570, "epoch": 1568} {"train_loss": -12.290023803710938, "global_step": 263571, "epoch": 1568} {"train_loss": -12.154837608337402, "global_step": 263572, "epoch": 1568} {"train_loss": -12.390681266784668, "global_step": 263573, "epoch": 1568} {"train_loss": -12.237062454223633, "global_step": 263574, "epoch": 1568} {"train_loss": -12.418085098266602, "global_step": 263575, "epoch": 1568} {"train_loss": -12.15324592590332, "global_step": 263576, "epoch": 1568} {"train_loss": -12.271230697631836, "global_step": 263577, "epoch": 1568} {"train_loss": -12.18854808807373, "global_step": 263578, "epoch": 1568} {"train_loss": -12.329174041748047, "global_step": 263579, "epoch": 1568} {"train_loss": -12.23689079284668, "global_step": 263580, "epoch": 1568} {"train_loss": -11.83387565612793, "global_step": 263581, "epoch": 1568} {"train_loss": -11.551377296447754, "global_step": 263582, "epoch": 1568} {"train_loss": -11.549585342407227, "global_step": 263583, "epoch": 1568} {"train_loss": -11.081079483032227, "global_step": 263584, "epoch": 1568} {"train_loss": -12.106511116027832, "global_step": 263585, "epoch": 1568} {"train_loss": -11.232385635375977, "global_step": 263586, "epoch": 1568} {"train_loss": -10.608651161193848, "global_step": 263587, "epoch": 1568} {"train_loss": -9.28593635559082, "global_step": 263588, "epoch": 1568} {"train_loss": -10.782252311706543, "global_step": 263589, "epoch": 1568} {"train_loss": -11.310407638549805, "global_step": 263590, "epoch": 1568} {"train_loss": -11.649800215448652, "global_step": 263591, "epoch": 1568, "val_loss": 283151.625} {"train_loss": -10.993064880371094, "global_step": 263592, "epoch": 1569} {"train_loss": -11.093379020690918, "global_step": 263593, "epoch": 1569} {"train_loss": -11.344531059265137, "global_step": 263594, "epoch": 1569} {"train_loss": -10.697734832763672, "global_step": 263595, "epoch": 1569} {"train_loss": -10.985392570495605, "global_step": 263596, "epoch": 1569} {"train_loss": -11.433238983154297, "global_step": 263597, "epoch": 1569} {"train_loss": -10.742748260498047, "global_step": 263598, "epoch": 1569} {"train_loss": -11.63813591003418, "global_step": 263599, "epoch": 1569} {"train_loss": -11.245573997497559, "global_step": 263600, "epoch": 1569} {"train_loss": -11.024215698242188, "global_step": 263601, "epoch": 1569} {"train_loss": -11.362104415893555, "global_step": 263602, "epoch": 1569} {"train_loss": -11.229223251342773, "global_step": 263603, "epoch": 1569} {"train_loss": -11.461027145385742, "global_step": 263604, "epoch": 1569} {"train_loss": -11.331341743469238, "global_step": 263605, "epoch": 1569} {"train_loss": -10.950567245483398, "global_step": 263606, "epoch": 1569} {"train_loss": -11.375630378723145, "global_step": 263607, "epoch": 1569} {"train_loss": -10.548688888549805, "global_step": 263608, "epoch": 1569} {"train_loss": -10.872257232666016, "global_step": 263609, "epoch": 1569} {"train_loss": -11.320714950561523, "global_step": 263610, "epoch": 1569} {"train_loss": -11.675886154174805, "global_step": 263611, "epoch": 1569} {"train_loss": -11.6248779296875, "global_step": 263612, "epoch": 1569} {"train_loss": -11.76601505279541, "global_step": 263613, "epoch": 1569} {"train_loss": -11.545242309570312, "global_step": 263614, "epoch": 1569} {"train_loss": -11.515108108520508, "global_step": 263615, "epoch": 1569} {"train_loss": -11.403507232666016, "global_step": 263616, "epoch": 1569} {"train_loss": -11.291688919067383, "global_step": 263617, "epoch": 1569} {"train_loss": -11.28447151184082, "global_step": 263618, "epoch": 1569} {"train_loss": -11.308321952819824, "global_step": 263619, "epoch": 1569} {"train_loss": -10.969547271728516, "global_step": 263620, "epoch": 1569} {"train_loss": -11.24522876739502, "global_step": 263621, "epoch": 1569} {"train_loss": -11.203310012817383, "global_step": 263622, "epoch": 1569} {"train_loss": -10.094183921813965, "global_step": 263623, "epoch": 1569} {"train_loss": -11.438132286071777, "global_step": 263624, "epoch": 1569} {"train_loss": -10.552835464477539, "global_step": 263625, "epoch": 1569} {"train_loss": -11.476242065429688, "global_step": 263626, "epoch": 1569} {"train_loss": -10.71917724609375, "global_step": 263627, "epoch": 1569} {"train_loss": -10.960245132446289, "global_step": 263628, "epoch": 1569} {"train_loss": -10.332983016967773, "global_step": 263629, "epoch": 1569} {"train_loss": -11.111040115356445, "global_step": 263630, "epoch": 1569} {"train_loss": -10.355878829956055, "global_step": 263631, "epoch": 1569} {"train_loss": -11.38344669342041, "global_step": 263632, "epoch": 1569} {"train_loss": -10.38382625579834, "global_step": 263633, "epoch": 1569} {"train_loss": -11.338744163513184, "global_step": 263634, "epoch": 1569} {"train_loss": -11.278573989868164, "global_step": 263635, "epoch": 1569} {"train_loss": -11.256526947021484, "global_step": 263636, "epoch": 1569} {"train_loss": -11.29588508605957, "global_step": 263637, "epoch": 1569} {"train_loss": -11.047931671142578, "global_step": 263638, "epoch": 1569} {"train_loss": -11.404704093933105, "global_step": 263639, "epoch": 1569} {"train_loss": -11.669055938720703, "global_step": 263640, "epoch": 1569} {"train_loss": -11.432437896728516, "global_step": 263641, "epoch": 1569} {"train_loss": -11.795345306396484, "global_step": 263642, "epoch": 1569} {"train_loss": -11.280645370483398, "global_step": 263643, "epoch": 1569} {"train_loss": -11.301847457885742, "global_step": 263644, "epoch": 1569} {"train_loss": -11.554527282714844, "global_step": 263645, "epoch": 1569} {"train_loss": -11.512896537780762, "global_step": 263646, "epoch": 1569} {"train_loss": -11.569343566894531, "global_step": 263647, "epoch": 1569} {"train_loss": -11.588435173034668, "global_step": 263648, "epoch": 1569} {"train_loss": -11.301212310791016, "global_step": 263649, "epoch": 1569} {"train_loss": -11.670923233032227, "global_step": 263650, "epoch": 1569} {"train_loss": -11.628518104553223, "global_step": 263651, "epoch": 1569} {"train_loss": -11.705734252929688, "global_step": 263652, "epoch": 1569} {"train_loss": -11.697641372680664, "global_step": 263653, "epoch": 1569} {"train_loss": -11.636770248413086, "global_step": 263654, "epoch": 1569} {"train_loss": -11.171147346496582, "global_step": 263655, "epoch": 1569} {"train_loss": -11.578433990478516, "global_step": 263656, "epoch": 1569} {"train_loss": -11.411287307739258, "global_step": 263657, "epoch": 1569} {"train_loss": -11.899561882019043, "global_step": 263658, "epoch": 1569} {"train_loss": -11.769638061523438, "global_step": 263659, "epoch": 1569} {"train_loss": -11.893982887268066, "global_step": 263660, "epoch": 1569} {"train_loss": -11.770435333251953, "global_step": 263661, "epoch": 1569} {"train_loss": -11.536930084228516, "global_step": 263662, "epoch": 1569} {"train_loss": -11.78382682800293, "global_step": 263663, "epoch": 1569} {"train_loss": -11.84846305847168, "global_step": 263664, "epoch": 1569} {"train_loss": -11.525691986083984, "global_step": 263665, "epoch": 1569} {"train_loss": -11.844943046569824, "global_step": 263666, "epoch": 1569} {"train_loss": -11.744671821594238, "global_step": 263667, "epoch": 1569} {"train_loss": -11.743806838989258, "global_step": 263668, "epoch": 1569} {"train_loss": -11.833415985107422, "global_step": 263669, "epoch": 1569} {"train_loss": -11.786550521850586, "global_step": 263670, "epoch": 1569} {"train_loss": -11.764932632446289, "global_step": 263671, "epoch": 1569} {"train_loss": -11.833419799804688, "global_step": 263672, "epoch": 1569} {"train_loss": -11.725686073303223, "global_step": 263673, "epoch": 1569} {"train_loss": -11.754568099975586, "global_step": 263674, "epoch": 1569} {"train_loss": -11.749431610107422, "global_step": 263675, "epoch": 1569} {"train_loss": -11.86680793762207, "global_step": 263676, "epoch": 1569} {"train_loss": -11.994522094726562, "global_step": 263677, "epoch": 1569} {"train_loss": -11.835502624511719, "global_step": 263678, "epoch": 1569} {"train_loss": -11.693294525146484, "global_step": 263679, "epoch": 1569} {"train_loss": -11.569402694702148, "global_step": 263680, "epoch": 1569} {"train_loss": -11.016420364379883, "global_step": 263681, "epoch": 1569} {"train_loss": -11.393701553344727, "global_step": 263682, "epoch": 1569} {"train_loss": -11.039496421813965, "global_step": 263683, "epoch": 1569} {"train_loss": -11.585234642028809, "global_step": 263684, "epoch": 1569} {"train_loss": -10.923385620117188, "global_step": 263685, "epoch": 1569} {"train_loss": -11.531732559204102, "global_step": 263686, "epoch": 1569} {"train_loss": -11.556591033935547, "global_step": 263687, "epoch": 1569} {"train_loss": -11.71666145324707, "global_step": 263688, "epoch": 1569} {"train_loss": -11.543891906738281, "global_step": 263689, "epoch": 1569} {"train_loss": -11.944830894470215, "global_step": 263690, "epoch": 1569} {"train_loss": -11.96251106262207, "global_step": 263691, "epoch": 1569} {"train_loss": -12.068167686462402, "global_step": 263692, "epoch": 1569} {"train_loss": -11.87092113494873, "global_step": 263693, "epoch": 1569} {"train_loss": -11.804973602294922, "global_step": 263694, "epoch": 1569} {"train_loss": -11.97414779663086, "global_step": 263695, "epoch": 1569} {"train_loss": -11.71397876739502, "global_step": 263696, "epoch": 1569} {"train_loss": -12.026321411132812, "global_step": 263697, "epoch": 1569} {"train_loss": -11.956400871276855, "global_step": 263698, "epoch": 1569} {"train_loss": -12.145466804504395, "global_step": 263699, "epoch": 1569} {"train_loss": -12.056930541992188, "global_step": 263700, "epoch": 1569} {"train_loss": -12.188102722167969, "global_step": 263701, "epoch": 1569} {"train_loss": -12.131139755249023, "global_step": 263702, "epoch": 1569} {"train_loss": -12.081293106079102, "global_step": 263703, "epoch": 1569} {"train_loss": -12.268556594848633, "global_step": 263704, "epoch": 1569} {"train_loss": -12.211143493652344, "global_step": 263705, "epoch": 1569} {"train_loss": -12.155889511108398, "global_step": 263706, "epoch": 1569} {"train_loss": -12.21104907989502, "global_step": 263707, "epoch": 1569} {"train_loss": -12.247394561767578, "global_step": 263708, "epoch": 1569} {"train_loss": -11.968549728393555, "global_step": 263709, "epoch": 1569} {"train_loss": -12.122846603393555, "global_step": 263710, "epoch": 1569} {"train_loss": -12.325481414794922, "global_step": 263711, "epoch": 1569} {"train_loss": -12.145872116088867, "global_step": 263712, "epoch": 1569} {"train_loss": -11.98179817199707, "global_step": 263713, "epoch": 1569} {"train_loss": -12.151872634887695, "global_step": 263714, "epoch": 1569} {"train_loss": -12.064647674560547, "global_step": 263715, "epoch": 1569} {"train_loss": -12.27440071105957, "global_step": 263716, "epoch": 1569} {"train_loss": -12.110153198242188, "global_step": 263717, "epoch": 1569} {"train_loss": -11.97012996673584, "global_step": 263718, "epoch": 1569} {"train_loss": -12.128520011901855, "global_step": 263719, "epoch": 1569} {"train_loss": -12.308656692504883, "global_step": 263720, "epoch": 1569} {"train_loss": -11.850753784179688, "global_step": 263721, "epoch": 1569} {"train_loss": -11.893043518066406, "global_step": 263722, "epoch": 1569} {"train_loss": -12.330480575561523, "global_step": 263723, "epoch": 1569} {"train_loss": -11.380006790161133, "global_step": 263724, "epoch": 1569} {"train_loss": -10.603128433227539, "global_step": 263725, "epoch": 1569} {"train_loss": -11.84174919128418, "global_step": 263726, "epoch": 1569} {"train_loss": -11.642080307006836, "global_step": 263727, "epoch": 1569} {"train_loss": -10.257851600646973, "global_step": 263728, "epoch": 1569} {"train_loss": -10.073785781860352, "global_step": 263729, "epoch": 1569} {"train_loss": -11.10567569732666, "global_step": 263730, "epoch": 1569} {"train_loss": -10.444150924682617, "global_step": 263731, "epoch": 1569} {"train_loss": -10.95727825164795, "global_step": 263732, "epoch": 1569} {"train_loss": -10.95166301727295, "global_step": 263733, "epoch": 1569} {"train_loss": -11.645742416381836, "global_step": 263734, "epoch": 1569} {"train_loss": -11.084754943847656, "global_step": 263735, "epoch": 1569} {"train_loss": -11.143131256103516, "global_step": 263736, "epoch": 1569} {"train_loss": -11.496143341064453, "global_step": 263737, "epoch": 1569} {"train_loss": -11.262008666992188, "global_step": 263738, "epoch": 1569} {"train_loss": -10.795339584350586, "global_step": 263739, "epoch": 1569} {"train_loss": -10.220226287841797, "global_step": 263740, "epoch": 1569} {"train_loss": -9.607650756835938, "global_step": 263741, "epoch": 1569} {"train_loss": -10.093095779418945, "global_step": 263742, "epoch": 1569} {"train_loss": -10.271415710449219, "global_step": 263743, "epoch": 1569} {"train_loss": -9.714059829711914, "global_step": 263744, "epoch": 1569} {"train_loss": -10.79666805267334, "global_step": 263745, "epoch": 1569} {"train_loss": -9.096527099609375, "global_step": 263746, "epoch": 1569} {"train_loss": -11.40388011932373, "global_step": 263747, "epoch": 1569} {"train_loss": -10.025153160095215, "global_step": 263748, "epoch": 1569} {"train_loss": -10.290557861328125, "global_step": 263749, "epoch": 1569} {"train_loss": -10.06912612915039, "global_step": 263750, "epoch": 1569} {"train_loss": -10.514640808105469, "global_step": 263751, "epoch": 1569} {"train_loss": -9.913835525512695, "global_step": 263752, "epoch": 1569} {"train_loss": -11.207122802734375, "global_step": 263753, "epoch": 1569} {"train_loss": -10.043785095214844, "global_step": 263754, "epoch": 1569} {"train_loss": -10.789582252502441, "global_step": 263755, "epoch": 1569} {"train_loss": -9.907548904418945, "global_step": 263756, "epoch": 1569} {"train_loss": -10.497359275817871, "global_step": 263757, "epoch": 1569} {"train_loss": -11.056236267089844, "global_step": 263758, "epoch": 1569} {"train_loss": -11.364218831062317, "global_step": 263759, "epoch": 1569, "val_loss": 267776.0625} {"train_loss": -11.299376487731934, "global_step": 263760, "epoch": 1570} {"train_loss": -10.391277313232422, "global_step": 263761, "epoch": 1570} {"train_loss": -11.548887252807617, "global_step": 263762, "epoch": 1570} {"train_loss": -10.045816421508789, "global_step": 263763, "epoch": 1570} {"train_loss": -11.844786643981934, "global_step": 263764, "epoch": 1570} {"train_loss": -10.774404525756836, "global_step": 263765, "epoch": 1570} {"train_loss": -11.259044647216797, "global_step": 263766, "epoch": 1570} {"train_loss": -11.373074531555176, "global_step": 263767, "epoch": 1570} {"train_loss": -11.430484771728516, "global_step": 263768, "epoch": 1570} {"train_loss": -11.666845321655273, "global_step": 263769, "epoch": 1570} {"train_loss": -11.350781440734863, "global_step": 263770, "epoch": 1570} {"train_loss": -11.64692497253418, "global_step": 263771, "epoch": 1570} {"train_loss": -11.54733657836914, "global_step": 263772, "epoch": 1570} {"train_loss": -11.447419166564941, "global_step": 263773, "epoch": 1570} {"train_loss": -11.684995651245117, "global_step": 263774, "epoch": 1570} {"train_loss": -11.436975479125977, "global_step": 263775, "epoch": 1570} {"train_loss": -11.632793426513672, "global_step": 263776, "epoch": 1570} {"train_loss": -11.487700462341309, "global_step": 263777, "epoch": 1570} {"train_loss": -11.832904815673828, "global_step": 263778, "epoch": 1570} {"train_loss": -11.502222061157227, "global_step": 263779, "epoch": 1570} {"train_loss": -11.685199737548828, "global_step": 263780, "epoch": 1570} {"train_loss": -11.972759246826172, "global_step": 263781, "epoch": 1570} {"train_loss": -11.44428825378418, "global_step": 263782, "epoch": 1570} {"train_loss": -11.866938591003418, "global_step": 263783, "epoch": 1570} {"train_loss": -11.761298179626465, "global_step": 263784, "epoch": 1570} {"train_loss": -11.888882637023926, "global_step": 263785, "epoch": 1570} {"train_loss": -11.933516502380371, "global_step": 263786, "epoch": 1570} {"train_loss": -11.916315078735352, "global_step": 263787, "epoch": 1570} {"train_loss": -12.132946968078613, "global_step": 263788, "epoch": 1570} {"train_loss": -11.963362693786621, "global_step": 263789, "epoch": 1570} {"train_loss": -11.874255180358887, "global_step": 263790, "epoch": 1570} {"train_loss": -11.984588623046875, "global_step": 263791, "epoch": 1570} {"train_loss": -11.847389221191406, "global_step": 263792, "epoch": 1570} {"train_loss": -11.995844841003418, "global_step": 263793, "epoch": 1570} {"train_loss": -11.717462539672852, "global_step": 263794, "epoch": 1570} {"train_loss": -11.9118013381958, "global_step": 263795, "epoch": 1570} {"train_loss": -11.821101188659668, "global_step": 263796, "epoch": 1570} {"train_loss": -11.992094039916992, "global_step": 263797, "epoch": 1570} {"train_loss": -11.9404935836792, "global_step": 263798, "epoch": 1570} {"train_loss": -11.839350700378418, "global_step": 263799, "epoch": 1570} {"train_loss": -11.90863037109375, "global_step": 263800, "epoch": 1570} {"train_loss": -11.88563346862793, "global_step": 263801, "epoch": 1570} {"train_loss": -11.917713165283203, "global_step": 263802, "epoch": 1570} {"train_loss": -11.861164093017578, "global_step": 263803, "epoch": 1570} {"train_loss": -12.06601333618164, "global_step": 263804, "epoch": 1570} {"train_loss": -11.820718765258789, "global_step": 263805, "epoch": 1570} {"train_loss": -11.900653839111328, "global_step": 263806, "epoch": 1570} {"train_loss": -11.843706130981445, "global_step": 263807, "epoch": 1570} {"train_loss": -11.833440780639648, "global_step": 263808, "epoch": 1570} {"train_loss": -12.040451049804688, "global_step": 263809, "epoch": 1570} {"train_loss": -11.986310958862305, "global_step": 263810, "epoch": 1570} {"train_loss": -12.13608169555664, "global_step": 263811, "epoch": 1570} {"train_loss": -11.869457244873047, "global_step": 263812, "epoch": 1570} {"train_loss": -12.098698616027832, "global_step": 263813, "epoch": 1570} {"train_loss": -11.891613006591797, "global_step": 263814, "epoch": 1570} {"train_loss": -12.13039779663086, "global_step": 263815, "epoch": 1570} {"train_loss": -11.532303810119629, "global_step": 263816, "epoch": 1570} {"train_loss": -12.127653121948242, "global_step": 263817, "epoch": 1570} {"train_loss": -11.817132949829102, "global_step": 263818, "epoch": 1570} {"train_loss": -12.041276931762695, "global_step": 263819, "epoch": 1570} {"train_loss": -11.719456672668457, "global_step": 263820, "epoch": 1570} {"train_loss": -11.838227272033691, "global_step": 263821, "epoch": 1570} {"train_loss": -11.763219833374023, "global_step": 263822, "epoch": 1570} {"train_loss": -12.095592498779297, "global_step": 263823, "epoch": 1570} {"train_loss": -11.87979507446289, "global_step": 263824, "epoch": 1570} {"train_loss": -12.177267074584961, "global_step": 263825, "epoch": 1570} {"train_loss": -12.011983871459961, "global_step": 263826, "epoch": 1570} {"train_loss": -12.147953033447266, "global_step": 263827, "epoch": 1570} {"train_loss": -11.768784523010254, "global_step": 263828, "epoch": 1570} {"train_loss": -12.165176391601562, "global_step": 263829, "epoch": 1570} {"train_loss": -11.871578216552734, "global_step": 263830, "epoch": 1570} {"train_loss": -12.021020889282227, "global_step": 263831, "epoch": 1570} {"train_loss": -11.955644607543945, "global_step": 263832, "epoch": 1570} {"train_loss": -11.90347957611084, "global_step": 263833, "epoch": 1570} {"train_loss": -11.643884658813477, "global_step": 263834, "epoch": 1570} {"train_loss": -11.774903297424316, "global_step": 263835, "epoch": 1570} {"train_loss": -11.923779487609863, "global_step": 263836, "epoch": 1570} {"train_loss": -11.774169921875, "global_step": 263837, "epoch": 1570} {"train_loss": -12.034326553344727, "global_step": 263838, "epoch": 1570} {"train_loss": -11.952634811401367, "global_step": 263839, "epoch": 1570} {"train_loss": -11.811746597290039, "global_step": 263840, "epoch": 1570} {"train_loss": -12.179201126098633, "global_step": 263841, "epoch": 1570} {"train_loss": -11.348264694213867, "global_step": 263842, "epoch": 1570} {"train_loss": -11.999856948852539, "global_step": 263843, "epoch": 1570} {"train_loss": -11.564783096313477, "global_step": 263844, "epoch": 1570} {"train_loss": -12.036511421203613, "global_step": 263845, "epoch": 1570} {"train_loss": -11.930410385131836, "global_step": 263846, "epoch": 1570} {"train_loss": -11.78207015991211, "global_step": 263847, "epoch": 1570} {"train_loss": -11.930078506469727, "global_step": 263848, "epoch": 1570} {"train_loss": -11.783742904663086, "global_step": 263849, "epoch": 1570} {"train_loss": -11.86711311340332, "global_step": 263850, "epoch": 1570} {"train_loss": -11.458106994628906, "global_step": 263851, "epoch": 1570} {"train_loss": -11.981664657592773, "global_step": 263852, "epoch": 1570} {"train_loss": -12.042603492736816, "global_step": 263853, "epoch": 1570} {"train_loss": -11.783206939697266, "global_step": 263854, "epoch": 1570} {"train_loss": -11.101980209350586, "global_step": 263855, "epoch": 1570} {"train_loss": -11.684019088745117, "global_step": 263856, "epoch": 1570} {"train_loss": -11.83607292175293, "global_step": 263857, "epoch": 1570} {"train_loss": -11.443235397338867, "global_step": 263858, "epoch": 1570} {"train_loss": -9.872949600219727, "global_step": 263859, "epoch": 1570} {"train_loss": -10.621099472045898, "global_step": 263860, "epoch": 1570} {"train_loss": -11.882854461669922, "global_step": 263861, "epoch": 1570} {"train_loss": -11.57908821105957, "global_step": 263862, "epoch": 1570} {"train_loss": -11.388873100280762, "global_step": 263863, "epoch": 1570} {"train_loss": -11.239877700805664, "global_step": 263864, "epoch": 1570} {"train_loss": -11.934280395507812, "global_step": 263865, "epoch": 1570} {"train_loss": -11.194622039794922, "global_step": 263866, "epoch": 1570} {"train_loss": -11.247965812683105, "global_step": 263867, "epoch": 1570} {"train_loss": -11.831384658813477, "global_step": 263868, "epoch": 1570} {"train_loss": -11.915993690490723, "global_step": 263869, "epoch": 1570} {"train_loss": -11.754481315612793, "global_step": 263870, "epoch": 1570} {"train_loss": -11.39692497253418, "global_step": 263871, "epoch": 1570} {"train_loss": -11.880093574523926, "global_step": 263872, "epoch": 1570} {"train_loss": -11.760590553283691, "global_step": 263873, "epoch": 1570} {"train_loss": -11.144537925720215, "global_step": 263874, "epoch": 1570} {"train_loss": -11.013561248779297, "global_step": 263875, "epoch": 1570} {"train_loss": -11.756600379943848, "global_step": 263876, "epoch": 1570} {"train_loss": -11.782135009765625, "global_step": 263877, "epoch": 1570} {"train_loss": -11.30721664428711, "global_step": 263878, "epoch": 1570} {"train_loss": -10.839576721191406, "global_step": 263879, "epoch": 1570} {"train_loss": -12.089338302612305, "global_step": 263880, "epoch": 1570} {"train_loss": -11.587858200073242, "global_step": 263881, "epoch": 1570} {"train_loss": -11.921913146972656, "global_step": 263882, "epoch": 1570} {"train_loss": -11.770672798156738, "global_step": 263883, "epoch": 1570} {"train_loss": -11.204651832580566, "global_step": 263884, "epoch": 1570} {"train_loss": -11.146897315979004, "global_step": 263885, "epoch": 1570} {"train_loss": -11.953259468078613, "global_step": 263886, "epoch": 1570} {"train_loss": -10.413334846496582, "global_step": 263887, "epoch": 1570} {"train_loss": -11.068007469177246, "global_step": 263888, "epoch": 1570} {"train_loss": -11.791929244995117, "global_step": 263889, "epoch": 1570} {"train_loss": -11.735698699951172, "global_step": 263890, "epoch": 1570} {"train_loss": -11.698068618774414, "global_step": 263891, "epoch": 1570} {"train_loss": -11.925862312316895, "global_step": 263892, "epoch": 1570} {"train_loss": -11.74227237701416, "global_step": 263893, "epoch": 1570} {"train_loss": -11.808355331420898, "global_step": 263894, "epoch": 1570} {"train_loss": -11.863059997558594, "global_step": 263895, "epoch": 1570} {"train_loss": -11.732280731201172, "global_step": 263896, "epoch": 1570} {"train_loss": -12.070947647094727, "global_step": 263897, "epoch": 1570} {"train_loss": -11.840744018554688, "global_step": 263898, "epoch": 1570} {"train_loss": -11.874366760253906, "global_step": 263899, "epoch": 1570} {"train_loss": -11.844100952148438, "global_step": 263900, "epoch": 1570} {"train_loss": -11.807775497436523, "global_step": 263901, "epoch": 1570} {"train_loss": -12.115337371826172, "global_step": 263902, "epoch": 1570} {"train_loss": -12.051262855529785, "global_step": 263903, "epoch": 1570} {"train_loss": -11.976116180419922, "global_step": 263904, "epoch": 1570} {"train_loss": -11.946243286132812, "global_step": 263905, "epoch": 1570} {"train_loss": -11.831515312194824, "global_step": 263906, "epoch": 1570} {"train_loss": -11.795921325683594, "global_step": 263907, "epoch": 1570} {"train_loss": -11.883124351501465, "global_step": 263908, "epoch": 1570} {"train_loss": -11.728567123413086, "global_step": 263909, "epoch": 1570} {"train_loss": -11.29765510559082, "global_step": 263910, "epoch": 1570} {"train_loss": -11.802289962768555, "global_step": 263911, "epoch": 1570} {"train_loss": -11.301336288452148, "global_step": 263912, "epoch": 1570} {"train_loss": -11.563302993774414, "global_step": 263913, "epoch": 1570} {"train_loss": -11.647684097290039, "global_step": 263914, "epoch": 1570} {"train_loss": -11.601277351379395, "global_step": 263915, "epoch": 1570} {"train_loss": -11.41034984588623, "global_step": 263916, "epoch": 1570} {"train_loss": -11.702034950256348, "global_step": 263917, "epoch": 1570} {"train_loss": -10.901055335998535, "global_step": 263918, "epoch": 1570} {"train_loss": -11.923490524291992, "global_step": 263919, "epoch": 1570} {"train_loss": -11.5974760055542, "global_step": 263920, "epoch": 1570} {"train_loss": -12.03902816772461, "global_step": 263921, "epoch": 1570} {"train_loss": -11.862348556518555, "global_step": 263922, "epoch": 1570} {"train_loss": -11.562722206115723, "global_step": 263923, "epoch": 1570} {"train_loss": -11.951010704040527, "global_step": 263924, "epoch": 1570} {"train_loss": -11.925220489501953, "global_step": 263925, "epoch": 1570} {"train_loss": -11.760251998901367, "global_step": 263926, "epoch": 1570} {"train_loss": -11.703684329986572, "global_step": 263927, "epoch": 1570, "val_loss": 271179.8125, "train_action_mse_error": 2.968472480773926} {"train_loss": -12.022234916687012, "global_step": 263928, "epoch": 1571} {"train_loss": -12.1167573928833, "global_step": 263929, "epoch": 1571} {"train_loss": -11.611954689025879, "global_step": 263930, "epoch": 1571} {"train_loss": -12.009187698364258, "global_step": 263931, "epoch": 1571} {"train_loss": -11.22106647491455, "global_step": 263932, "epoch": 1571} {"train_loss": -11.701284408569336, "global_step": 263933, "epoch": 1571} {"train_loss": -11.632672309875488, "global_step": 263934, "epoch": 1571} {"train_loss": -11.80541706085205, "global_step": 263935, "epoch": 1571} {"train_loss": -11.525184631347656, "global_step": 263936, "epoch": 1571} {"train_loss": -11.250368118286133, "global_step": 263937, "epoch": 1571} {"train_loss": -11.363311767578125, "global_step": 263938, "epoch": 1571} {"train_loss": -11.94865608215332, "global_step": 263939, "epoch": 1571} {"train_loss": -11.536116600036621, "global_step": 263940, "epoch": 1571} {"train_loss": -11.59658432006836, "global_step": 263941, "epoch": 1571} {"train_loss": -11.896010398864746, "global_step": 263942, "epoch": 1571} {"train_loss": -11.353471755981445, "global_step": 263943, "epoch": 1571} {"train_loss": -11.733960151672363, "global_step": 263944, "epoch": 1571} {"train_loss": -11.422212600708008, "global_step": 263945, "epoch": 1571} {"train_loss": -11.785161972045898, "global_step": 263946, "epoch": 1571} {"train_loss": -11.870477676391602, "global_step": 263947, "epoch": 1571} {"train_loss": -11.759368896484375, "global_step": 263948, "epoch": 1571} {"train_loss": -11.645047187805176, "global_step": 263949, "epoch": 1571} {"train_loss": -11.432991027832031, "global_step": 263950, "epoch": 1571} {"train_loss": -11.602424621582031, "global_step": 263951, "epoch": 1571} {"train_loss": -11.466532707214355, "global_step": 263952, "epoch": 1571} {"train_loss": -11.289666175842285, "global_step": 263953, "epoch": 1571} {"train_loss": -11.589463233947754, "global_step": 263954, "epoch": 1571} {"train_loss": -11.212556838989258, "global_step": 263955, "epoch": 1571} {"train_loss": -11.424095153808594, "global_step": 263956, "epoch": 1571} {"train_loss": -11.801097869873047, "global_step": 263957, "epoch": 1571} {"train_loss": -10.950937271118164, "global_step": 263958, "epoch": 1571} {"train_loss": -11.845627784729004, "global_step": 263959, "epoch": 1571} {"train_loss": -11.328837394714355, "global_step": 263960, "epoch": 1571} {"train_loss": -11.810455322265625, "global_step": 263961, "epoch": 1571} {"train_loss": -11.318232536315918, "global_step": 263962, "epoch": 1571} {"train_loss": -11.210321426391602, "global_step": 263963, "epoch": 1571} {"train_loss": -10.846931457519531, "global_step": 263964, "epoch": 1571} {"train_loss": -11.987555503845215, "global_step": 263965, "epoch": 1571} {"train_loss": -11.134765625, "global_step": 263966, "epoch": 1571} {"train_loss": -11.530122756958008, "global_step": 263967, "epoch": 1571} {"train_loss": -11.303589820861816, "global_step": 263968, "epoch": 1571} {"train_loss": -11.295856475830078, "global_step": 263969, "epoch": 1571} {"train_loss": -11.5706787109375, "global_step": 263970, "epoch": 1571} {"train_loss": -11.398696899414062, "global_step": 263971, "epoch": 1571} {"train_loss": -11.488689422607422, "global_step": 263972, "epoch": 1571} {"train_loss": -11.71566390991211, "global_step": 263973, "epoch": 1571} {"train_loss": -11.772865295410156, "global_step": 263974, "epoch": 1571} {"train_loss": -11.633350372314453, "global_step": 263975, "epoch": 1571} {"train_loss": -11.855009078979492, "global_step": 263976, "epoch": 1571} {"train_loss": -11.510856628417969, "global_step": 263977, "epoch": 1571} {"train_loss": -11.956170082092285, "global_step": 263978, "epoch": 1571} {"train_loss": -11.803143501281738, "global_step": 263979, "epoch": 1571} {"train_loss": -11.657038688659668, "global_step": 263980, "epoch": 1571} {"train_loss": -11.741853713989258, "global_step": 263981, "epoch": 1571} {"train_loss": -11.745372772216797, "global_step": 263982, "epoch": 1571} {"train_loss": -11.25124740600586, "global_step": 263983, "epoch": 1571} {"train_loss": -12.073781967163086, "global_step": 263984, "epoch": 1571} {"train_loss": -11.80380630493164, "global_step": 263985, "epoch": 1571} {"train_loss": -11.938835144042969, "global_step": 263986, "epoch": 1571} {"train_loss": -11.8033447265625, "global_step": 263987, "epoch": 1571} {"train_loss": -11.645904541015625, "global_step": 263988, "epoch": 1571} {"train_loss": -12.082799911499023, "global_step": 263989, "epoch": 1571} {"train_loss": -11.89449405670166, "global_step": 263990, "epoch": 1571} {"train_loss": -11.847243309020996, "global_step": 263991, "epoch": 1571} {"train_loss": -11.654350280761719, "global_step": 263992, "epoch": 1571} {"train_loss": -11.729642868041992, "global_step": 263993, "epoch": 1571} {"train_loss": -11.938076972961426, "global_step": 263994, "epoch": 1571} {"train_loss": -11.54288101196289, "global_step": 263995, "epoch": 1571} {"train_loss": -12.133064270019531, "global_step": 263996, "epoch": 1571} {"train_loss": -11.92132568359375, "global_step": 263997, "epoch": 1571} {"train_loss": -12.145965576171875, "global_step": 263998, "epoch": 1571} {"train_loss": -11.87864875793457, "global_step": 263999, "epoch": 1571} {"train_loss": -11.96561336517334, "global_step": 264000, "epoch": 1571} {"train_loss": -12.091080665588379, "global_step": 264001, "epoch": 1571} {"train_loss": -11.653993606567383, "global_step": 264002, "epoch": 1571} {"train_loss": -12.176782608032227, "global_step": 264003, "epoch": 1571} {"train_loss": -11.744522094726562, "global_step": 264004, "epoch": 1571} {"train_loss": -11.871817588806152, "global_step": 264005, "epoch": 1571} {"train_loss": -11.929845809936523, "global_step": 264006, "epoch": 1571} {"train_loss": -11.761353492736816, "global_step": 264007, "epoch": 1571} {"train_loss": -11.772163391113281, "global_step": 264008, "epoch": 1571} {"train_loss": -12.053617477416992, "global_step": 264009, "epoch": 1571} {"train_loss": -11.458906173706055, "global_step": 264010, "epoch": 1571} {"train_loss": -11.892132759094238, "global_step": 264011, "epoch": 1571} {"train_loss": -10.866253852844238, "global_step": 264012, "epoch": 1571} {"train_loss": -11.10708999633789, "global_step": 264013, "epoch": 1571} {"train_loss": -11.543466567993164, "global_step": 264014, "epoch": 1571} {"train_loss": -11.237016677856445, "global_step": 264015, "epoch": 1571} {"train_loss": -11.435876846313477, "global_step": 264016, "epoch": 1571} {"train_loss": -11.354369163513184, "global_step": 264017, "epoch": 1571} {"train_loss": -11.457390785217285, "global_step": 264018, "epoch": 1571} {"train_loss": -11.52558708190918, "global_step": 264019, "epoch": 1571} {"train_loss": -11.479400634765625, "global_step": 264020, "epoch": 1571} {"train_loss": -11.833808898925781, "global_step": 264021, "epoch": 1571} {"train_loss": -11.533855438232422, "global_step": 264022, "epoch": 1571} {"train_loss": -12.096351623535156, "global_step": 264023, "epoch": 1571} {"train_loss": -11.659873962402344, "global_step": 264024, "epoch": 1571} {"train_loss": -12.133440017700195, "global_step": 264025, "epoch": 1571} {"train_loss": -11.781882286071777, "global_step": 264026, "epoch": 1571} {"train_loss": -11.820488929748535, "global_step": 264027, "epoch": 1571} {"train_loss": -11.282752990722656, "global_step": 264028, "epoch": 1571} {"train_loss": -11.990007400512695, "global_step": 264029, "epoch": 1571} {"train_loss": -11.706223487854004, "global_step": 264030, "epoch": 1571} {"train_loss": -11.99424934387207, "global_step": 264031, "epoch": 1571} {"train_loss": -12.171993255615234, "global_step": 264032, "epoch": 1571} {"train_loss": -11.748368263244629, "global_step": 264033, "epoch": 1571} {"train_loss": -12.15365219116211, "global_step": 264034, "epoch": 1571} {"train_loss": -11.960163116455078, "global_step": 264035, "epoch": 1571} {"train_loss": -12.054848670959473, "global_step": 264036, "epoch": 1571} {"train_loss": -12.025430679321289, "global_step": 264037, "epoch": 1571} {"train_loss": -11.789230346679688, "global_step": 264038, "epoch": 1571} {"train_loss": -12.096797943115234, "global_step": 264039, "epoch": 1571} {"train_loss": -11.981880187988281, "global_step": 264040, "epoch": 1571} {"train_loss": -11.63279914855957, "global_step": 264041, "epoch": 1571} {"train_loss": -12.191390991210938, "global_step": 264042, "epoch": 1571} {"train_loss": -11.582698822021484, "global_step": 264043, "epoch": 1571} {"train_loss": -12.100882530212402, "global_step": 264044, "epoch": 1571} {"train_loss": -11.962303161621094, "global_step": 264045, "epoch": 1571} {"train_loss": -11.828121185302734, "global_step": 264046, "epoch": 1571} {"train_loss": -12.188043594360352, "global_step": 264047, "epoch": 1571} {"train_loss": -11.95730209350586, "global_step": 264048, "epoch": 1571} {"train_loss": -11.783933639526367, "global_step": 264049, "epoch": 1571} {"train_loss": -11.954084396362305, "global_step": 264050, "epoch": 1571} {"train_loss": -11.541367530822754, "global_step": 264051, "epoch": 1571} {"train_loss": -11.698007583618164, "global_step": 264052, "epoch": 1571} {"train_loss": -12.041507720947266, "global_step": 264053, "epoch": 1571} {"train_loss": -11.62777328491211, "global_step": 264054, "epoch": 1571} {"train_loss": -11.88581657409668, "global_step": 264055, "epoch": 1571} {"train_loss": -11.913229942321777, "global_step": 264056, "epoch": 1571} {"train_loss": -11.572717666625977, "global_step": 264057, "epoch": 1571} {"train_loss": -11.468035697937012, "global_step": 264058, "epoch": 1571} {"train_loss": -11.860130310058594, "global_step": 264059, "epoch": 1571} {"train_loss": -10.063196182250977, "global_step": 264060, "epoch": 1571} {"train_loss": -11.447484970092773, "global_step": 264061, "epoch": 1571} {"train_loss": -10.618172645568848, "global_step": 264062, "epoch": 1571} {"train_loss": -10.693960189819336, "global_step": 264063, "epoch": 1571} {"train_loss": -11.545366287231445, "global_step": 264064, "epoch": 1571} {"train_loss": -10.125467300415039, "global_step": 264065, "epoch": 1571} {"train_loss": -11.716608047485352, "global_step": 264066, "epoch": 1571} {"train_loss": -10.590837478637695, "global_step": 264067, "epoch": 1571} {"train_loss": -11.059130668640137, "global_step": 264068, "epoch": 1571} {"train_loss": -10.521608352661133, "global_step": 264069, "epoch": 1571} {"train_loss": -11.216714859008789, "global_step": 264070, "epoch": 1571} {"train_loss": -11.087764739990234, "global_step": 264071, "epoch": 1571} {"train_loss": -10.6714448928833, "global_step": 264072, "epoch": 1571} {"train_loss": -11.728299140930176, "global_step": 264073, "epoch": 1571} {"train_loss": -11.245647430419922, "global_step": 264074, "epoch": 1571} {"train_loss": -11.863632202148438, "global_step": 264075, "epoch": 1571} {"train_loss": -11.457260131835938, "global_step": 264076, "epoch": 1571} {"train_loss": -11.712193489074707, "global_step": 264077, "epoch": 1571} {"train_loss": -11.63576602935791, "global_step": 264078, "epoch": 1571} {"train_loss": -11.34164047241211, "global_step": 264079, "epoch": 1571} {"train_loss": -11.86025333404541, "global_step": 264080, "epoch": 1571} {"train_loss": -11.803412437438965, "global_step": 264081, "epoch": 1571} {"train_loss": -11.687971115112305, "global_step": 264082, "epoch": 1571} {"train_loss": -11.970901489257812, "global_step": 264083, "epoch": 1571} {"train_loss": -11.716331481933594, "global_step": 264084, "epoch": 1571} {"train_loss": -12.00920581817627, "global_step": 264085, "epoch": 1571} {"train_loss": -11.772428512573242, "global_step": 264086, "epoch": 1571} {"train_loss": -11.300210952758789, "global_step": 264087, "epoch": 1571} {"train_loss": -11.62508487701416, "global_step": 264088, "epoch": 1571} {"train_loss": -11.757852554321289, "global_step": 264089, "epoch": 1571} {"train_loss": -11.528375625610352, "global_step": 264090, "epoch": 1571} {"train_loss": -12.014305114746094, "global_step": 264091, "epoch": 1571} {"train_loss": -11.669388771057129, "global_step": 264092, "epoch": 1571} {"train_loss": -11.973176956176758, "global_step": 264093, "epoch": 1571} {"train_loss": -11.641587257385254, "global_step": 264094, "epoch": 1571} {"train_loss": -11.642400332859584, "global_step": 264095, "epoch": 1571, "val_loss": 272652.21875} {"train_loss": -11.812196731567383, "global_step": 264096, "epoch": 1572} {"train_loss": -11.858463287353516, "global_step": 264097, "epoch": 1572} {"train_loss": -11.619329452514648, "global_step": 264098, "epoch": 1572} {"train_loss": -11.701247215270996, "global_step": 264099, "epoch": 1572} {"train_loss": -11.864914894104004, "global_step": 264100, "epoch": 1572} {"train_loss": -11.480730056762695, "global_step": 264101, "epoch": 1572} {"train_loss": -11.85963249206543, "global_step": 264102, "epoch": 1572} {"train_loss": -11.391936302185059, "global_step": 264103, "epoch": 1572} {"train_loss": -11.881048202514648, "global_step": 264104, "epoch": 1572} {"train_loss": -11.502006530761719, "global_step": 264105, "epoch": 1572} {"train_loss": -11.98046875, "global_step": 264106, "epoch": 1572} {"train_loss": -11.73959732055664, "global_step": 264107, "epoch": 1572} {"train_loss": -12.096639633178711, "global_step": 264108, "epoch": 1572} {"train_loss": -11.923821449279785, "global_step": 264109, "epoch": 1572} {"train_loss": -11.864773750305176, "global_step": 264110, "epoch": 1572} {"train_loss": -11.70711898803711, "global_step": 264111, "epoch": 1572} {"train_loss": -11.988567352294922, "global_step": 264112, "epoch": 1572} {"train_loss": -11.568877220153809, "global_step": 264113, "epoch": 1572} {"train_loss": -11.66023063659668, "global_step": 264114, "epoch": 1572} {"train_loss": -11.21946907043457, "global_step": 264115, "epoch": 1572} {"train_loss": -11.400189399719238, "global_step": 264116, "epoch": 1572} {"train_loss": -10.360174179077148, "global_step": 264117, "epoch": 1572} {"train_loss": -11.904109954833984, "global_step": 264118, "epoch": 1572} {"train_loss": -10.725443840026855, "global_step": 264119, "epoch": 1572} {"train_loss": -11.738006591796875, "global_step": 264120, "epoch": 1572} {"train_loss": -11.396728515625, "global_step": 264121, "epoch": 1572} {"train_loss": -9.875651359558105, "global_step": 264122, "epoch": 1572} {"train_loss": -11.727099418640137, "global_step": 264123, "epoch": 1572} {"train_loss": -10.575380325317383, "global_step": 264124, "epoch": 1572} {"train_loss": -11.299875259399414, "global_step": 264125, "epoch": 1572} {"train_loss": -11.237537384033203, "global_step": 264126, "epoch": 1572} {"train_loss": -10.765552520751953, "global_step": 264127, "epoch": 1572} {"train_loss": -11.670442581176758, "global_step": 264128, "epoch": 1572} {"train_loss": -11.045674324035645, "global_step": 264129, "epoch": 1572} {"train_loss": -11.481014251708984, "global_step": 264130, "epoch": 1572} {"train_loss": -11.409613609313965, "global_step": 264131, "epoch": 1572} {"train_loss": -11.618648529052734, "global_step": 264132, "epoch": 1572} {"train_loss": -11.643123626708984, "global_step": 264133, "epoch": 1572} {"train_loss": -11.602632522583008, "global_step": 264134, "epoch": 1572} {"train_loss": -11.681845664978027, "global_step": 264135, "epoch": 1572} {"train_loss": -11.527719497680664, "global_step": 264136, "epoch": 1572} {"train_loss": -11.358123779296875, "global_step": 264137, "epoch": 1572} {"train_loss": -11.546339988708496, "global_step": 264138, "epoch": 1572} {"train_loss": -11.40469741821289, "global_step": 264139, "epoch": 1572} {"train_loss": -11.646678924560547, "global_step": 264140, "epoch": 1572} {"train_loss": -11.601253509521484, "global_step": 264141, "epoch": 1572} {"train_loss": -11.865278244018555, "global_step": 264142, "epoch": 1572} {"train_loss": -11.635862350463867, "global_step": 264143, "epoch": 1572} {"train_loss": -11.889425277709961, "global_step": 264144, "epoch": 1572} {"train_loss": -11.587603569030762, "global_step": 264145, "epoch": 1572} {"train_loss": -11.570104598999023, "global_step": 264146, "epoch": 1572} {"train_loss": -11.819721221923828, "global_step": 264147, "epoch": 1572} {"train_loss": -11.22066879272461, "global_step": 264148, "epoch": 1572} {"train_loss": -11.981473922729492, "global_step": 264149, "epoch": 1572} {"train_loss": -11.529810905456543, "global_step": 264150, "epoch": 1572} {"train_loss": -11.772431373596191, "global_step": 264151, "epoch": 1572} {"train_loss": -11.863049507141113, "global_step": 264152, "epoch": 1572} {"train_loss": -11.771854400634766, "global_step": 264153, "epoch": 1572} {"train_loss": -11.733524322509766, "global_step": 264154, "epoch": 1572} {"train_loss": -11.712822914123535, "global_step": 264155, "epoch": 1572} {"train_loss": -11.915639877319336, "global_step": 264156, "epoch": 1572} {"train_loss": -12.009239196777344, "global_step": 264157, "epoch": 1572} {"train_loss": -12.01961898803711, "global_step": 264158, "epoch": 1572} {"train_loss": -11.945602416992188, "global_step": 264159, "epoch": 1572} {"train_loss": -11.861366271972656, "global_step": 264160, "epoch": 1572} {"train_loss": -11.986433029174805, "global_step": 264161, "epoch": 1572} {"train_loss": -12.088794708251953, "global_step": 264162, "epoch": 1572} {"train_loss": -11.968963623046875, "global_step": 264163, "epoch": 1572} {"train_loss": -12.287612915039062, "global_step": 264164, "epoch": 1572} {"train_loss": -11.772832870483398, "global_step": 264165, "epoch": 1572} {"train_loss": -12.15787124633789, "global_step": 264166, "epoch": 1572} {"train_loss": -12.116447448730469, "global_step": 264167, "epoch": 1572} {"train_loss": -11.880494117736816, "global_step": 264168, "epoch": 1572} {"train_loss": -11.932650566101074, "global_step": 264169, "epoch": 1572} {"train_loss": -12.008722305297852, "global_step": 264170, "epoch": 1572} {"train_loss": -12.20500659942627, "global_step": 264171, "epoch": 1572} {"train_loss": -12.381855010986328, "global_step": 264172, "epoch": 1572} {"train_loss": -11.996763229370117, "global_step": 264173, "epoch": 1572} {"train_loss": -12.078169822692871, "global_step": 264174, "epoch": 1572} {"train_loss": -12.340511322021484, "global_step": 264175, "epoch": 1572} {"train_loss": -12.10183334350586, "global_step": 264176, "epoch": 1572} {"train_loss": -12.069128036499023, "global_step": 264177, "epoch": 1572} {"train_loss": -12.080179214477539, "global_step": 264178, "epoch": 1572} {"train_loss": -11.871158599853516, "global_step": 264179, "epoch": 1572} {"train_loss": -12.22970199584961, "global_step": 264180, "epoch": 1572} {"train_loss": -12.174473762512207, "global_step": 264181, "epoch": 1572} {"train_loss": -12.353403091430664, "global_step": 264182, "epoch": 1572} {"train_loss": -12.063799858093262, "global_step": 264183, "epoch": 1572} {"train_loss": -12.356971740722656, "global_step": 264184, "epoch": 1572} {"train_loss": -12.111246109008789, "global_step": 264185, "epoch": 1572} {"train_loss": -12.132774353027344, "global_step": 264186, "epoch": 1572} {"train_loss": -12.285411834716797, "global_step": 264187, "epoch": 1572} {"train_loss": -11.54554557800293, "global_step": 264188, "epoch": 1572} {"train_loss": -11.943758010864258, "global_step": 264189, "epoch": 1572} {"train_loss": -12.15947437286377, "global_step": 264190, "epoch": 1572} {"train_loss": -12.091777801513672, "global_step": 264191, "epoch": 1572} {"train_loss": -11.668915748596191, "global_step": 264192, "epoch": 1572} {"train_loss": -12.463199615478516, "global_step": 264193, "epoch": 1572} {"train_loss": -12.223125457763672, "global_step": 264194, "epoch": 1572} {"train_loss": -12.076738357543945, "global_step": 264195, "epoch": 1572} {"train_loss": -12.058457374572754, "global_step": 264196, "epoch": 1572} {"train_loss": -12.066370964050293, "global_step": 264197, "epoch": 1572} {"train_loss": -11.97358226776123, "global_step": 264198, "epoch": 1572} {"train_loss": -12.315132141113281, "global_step": 264199, "epoch": 1572} {"train_loss": -12.31786823272705, "global_step": 264200, "epoch": 1572} {"train_loss": -12.396429061889648, "global_step": 264201, "epoch": 1572} {"train_loss": -12.08697509765625, "global_step": 264202, "epoch": 1572} {"train_loss": -12.444223403930664, "global_step": 264203, "epoch": 1572} {"train_loss": -12.068580627441406, "global_step": 264204, "epoch": 1572} {"train_loss": -12.193069458007812, "global_step": 264205, "epoch": 1572} {"train_loss": -11.544120788574219, "global_step": 264206, "epoch": 1572} {"train_loss": -11.281766891479492, "global_step": 264207, "epoch": 1572} {"train_loss": -11.591196060180664, "global_step": 264208, "epoch": 1572} {"train_loss": -12.316699028015137, "global_step": 264209, "epoch": 1572} {"train_loss": -11.35020637512207, "global_step": 264210, "epoch": 1572} {"train_loss": -11.049932479858398, "global_step": 264211, "epoch": 1572} {"train_loss": -10.864822387695312, "global_step": 264212, "epoch": 1572} {"train_loss": -11.387472152709961, "global_step": 264213, "epoch": 1572} {"train_loss": -10.258684158325195, "global_step": 264214, "epoch": 1572} {"train_loss": -11.350292205810547, "global_step": 264215, "epoch": 1572} {"train_loss": -11.4908447265625, "global_step": 264216, "epoch": 1572} {"train_loss": -9.761795043945312, "global_step": 264217, "epoch": 1572} {"train_loss": -11.139491081237793, "global_step": 264218, "epoch": 1572} {"train_loss": -11.063079833984375, "global_step": 264219, "epoch": 1572} {"train_loss": -8.604202270507812, "global_step": 264220, "epoch": 1572} {"train_loss": -10.586255073547363, "global_step": 264221, "epoch": 1572} {"train_loss": -8.719522476196289, "global_step": 264222, "epoch": 1572} {"train_loss": -9.38973617553711, "global_step": 264223, "epoch": 1572} {"train_loss": -10.205787658691406, "global_step": 264224, "epoch": 1572} {"train_loss": -9.602523803710938, "global_step": 264225, "epoch": 1572} {"train_loss": -9.544036865234375, "global_step": 264226, "epoch": 1572} {"train_loss": -10.19509220123291, "global_step": 264227, "epoch": 1572} {"train_loss": -8.748906135559082, "global_step": 264228, "epoch": 1572} {"train_loss": -8.532424926757812, "global_step": 264229, "epoch": 1572} {"train_loss": -10.365375518798828, "global_step": 264230, "epoch": 1572} {"train_loss": -10.155101776123047, "global_step": 264231, "epoch": 1572} {"train_loss": -9.93301010131836, "global_step": 264232, "epoch": 1572} {"train_loss": -10.790493965148926, "global_step": 264233, "epoch": 1572} {"train_loss": -11.043746948242188, "global_step": 264234, "epoch": 1572} {"train_loss": -10.618664741516113, "global_step": 264235, "epoch": 1572} {"train_loss": -11.005878448486328, "global_step": 264236, "epoch": 1572} {"train_loss": -10.414039611816406, "global_step": 264237, "epoch": 1572} {"train_loss": -11.24832820892334, "global_step": 264238, "epoch": 1572} {"train_loss": -10.604485511779785, "global_step": 264239, "epoch": 1572} {"train_loss": -11.305323600769043, "global_step": 264240, "epoch": 1572} {"train_loss": -11.351144790649414, "global_step": 264241, "epoch": 1572} {"train_loss": -11.239166259765625, "global_step": 264242, "epoch": 1572} {"train_loss": -11.1715726852417, "global_step": 264243, "epoch": 1572} {"train_loss": -11.755067825317383, "global_step": 264244, "epoch": 1572} {"train_loss": -11.052873611450195, "global_step": 264245, "epoch": 1572} {"train_loss": -11.590749740600586, "global_step": 264246, "epoch": 1572} {"train_loss": -11.414831161499023, "global_step": 264247, "epoch": 1572} {"train_loss": -11.697539329528809, "global_step": 264248, "epoch": 1572} {"train_loss": -11.423894882202148, "global_step": 264249, "epoch": 1572} {"train_loss": -11.321917533874512, "global_step": 264250, "epoch": 1572} {"train_loss": -11.469915390014648, "global_step": 264251, "epoch": 1572} {"train_loss": -11.597662925720215, "global_step": 264252, "epoch": 1572} {"train_loss": -11.584247589111328, "global_step": 264253, "epoch": 1572} {"train_loss": -11.838418006896973, "global_step": 264254, "epoch": 1572} {"train_loss": -11.620203018188477, "global_step": 264255, "epoch": 1572} {"train_loss": -11.792488098144531, "global_step": 264256, "epoch": 1572} {"train_loss": -11.77975082397461, "global_step": 264257, "epoch": 1572} {"train_loss": -11.832927703857422, "global_step": 264258, "epoch": 1572} {"train_loss": -11.68016242980957, "global_step": 264259, "epoch": 1572} {"train_loss": -11.512398719787598, "global_step": 264260, "epoch": 1572} {"train_loss": -11.968297958374023, "global_step": 264261, "epoch": 1572} {"train_loss": -11.915277481079102, "global_step": 264262, "epoch": 1572} {"train_loss": -11.501821387381781, "global_step": 264263, "epoch": 1572, "val_loss": 262508.6875} {"train_loss": -11.699152946472168, "global_step": 264264, "epoch": 1573} {"train_loss": -11.509796142578125, "global_step": 264265, "epoch": 1573} {"train_loss": -11.892274856567383, "global_step": 264266, "epoch": 1573} {"train_loss": -11.955711364746094, "global_step": 264267, "epoch": 1573} {"train_loss": -12.069271087646484, "global_step": 264268, "epoch": 1573} {"train_loss": -12.051142692565918, "global_step": 264269, "epoch": 1573} {"train_loss": -11.940598487854004, "global_step": 264270, "epoch": 1573} {"train_loss": -12.089592933654785, "global_step": 264271, "epoch": 1573} {"train_loss": -11.84557819366455, "global_step": 264272, "epoch": 1573} {"train_loss": -11.76045036315918, "global_step": 264273, "epoch": 1573} {"train_loss": -11.970481872558594, "global_step": 264274, "epoch": 1573} {"train_loss": -11.98349380493164, "global_step": 264275, "epoch": 1573} {"train_loss": -11.759693145751953, "global_step": 264276, "epoch": 1573} {"train_loss": -11.968488693237305, "global_step": 264277, "epoch": 1573} {"train_loss": -11.816704750061035, "global_step": 264278, "epoch": 1573} {"train_loss": -12.105884552001953, "global_step": 264279, "epoch": 1573} {"train_loss": -12.126777648925781, "global_step": 264280, "epoch": 1573} {"train_loss": -12.066840171813965, "global_step": 264281, "epoch": 1573} {"train_loss": -12.054854393005371, "global_step": 264282, "epoch": 1573} {"train_loss": -12.085758209228516, "global_step": 264283, "epoch": 1573} {"train_loss": -12.104628562927246, "global_step": 264284, "epoch": 1573} {"train_loss": -12.167055130004883, "global_step": 264285, "epoch": 1573} {"train_loss": -12.284599304199219, "global_step": 264286, "epoch": 1573} {"train_loss": -12.274163246154785, "global_step": 264287, "epoch": 1573} {"train_loss": -12.164215087890625, "global_step": 264288, "epoch": 1573} {"train_loss": -12.190320014953613, "global_step": 264289, "epoch": 1573} {"train_loss": -12.246498107910156, "global_step": 264290, "epoch": 1573} {"train_loss": -12.266340255737305, "global_step": 264291, "epoch": 1573} {"train_loss": -12.336080551147461, "global_step": 264292, "epoch": 1573} {"train_loss": -11.991212844848633, "global_step": 264293, "epoch": 1573} {"train_loss": -12.376924514770508, "global_step": 264294, "epoch": 1573} {"train_loss": -12.199382781982422, "global_step": 264295, "epoch": 1573} {"train_loss": -12.172269821166992, "global_step": 264296, "epoch": 1573} {"train_loss": -12.247303009033203, "global_step": 264297, "epoch": 1573} {"train_loss": -12.098527908325195, "global_step": 264298, "epoch": 1573} {"train_loss": -12.157110214233398, "global_step": 264299, "epoch": 1573} {"train_loss": -12.087976455688477, "global_step": 264300, "epoch": 1573} {"train_loss": -11.939874649047852, "global_step": 264301, "epoch": 1573} {"train_loss": -12.411490440368652, "global_step": 264302, "epoch": 1573} {"train_loss": -12.209653854370117, "global_step": 264303, "epoch": 1573} {"train_loss": -12.189102172851562, "global_step": 264304, "epoch": 1573} {"train_loss": -12.17113971710205, "global_step": 264305, "epoch": 1573} {"train_loss": -11.83296012878418, "global_step": 264306, "epoch": 1573} {"train_loss": -11.998329162597656, "global_step": 264307, "epoch": 1573} {"train_loss": -11.493156433105469, "global_step": 264308, "epoch": 1573} {"train_loss": -11.399275779724121, "global_step": 264309, "epoch": 1573} {"train_loss": -12.475768089294434, "global_step": 264310, "epoch": 1573} {"train_loss": -11.440352439880371, "global_step": 264311, "epoch": 1573} {"train_loss": -12.186628341674805, "global_step": 264312, "epoch": 1573} {"train_loss": -11.578304290771484, "global_step": 264313, "epoch": 1573} {"train_loss": -11.362855911254883, "global_step": 264314, "epoch": 1573} {"train_loss": -11.030946731567383, "global_step": 264315, "epoch": 1573} {"train_loss": -11.690314292907715, "global_step": 264316, "epoch": 1573} {"train_loss": -11.269303321838379, "global_step": 264317, "epoch": 1573} {"train_loss": -10.119667053222656, "global_step": 264318, "epoch": 1573} {"train_loss": -11.291746139526367, "global_step": 264319, "epoch": 1573} {"train_loss": -11.26104736328125, "global_step": 264320, "epoch": 1573} {"train_loss": -10.70744514465332, "global_step": 264321, "epoch": 1573} {"train_loss": -11.46226692199707, "global_step": 264322, "epoch": 1573} {"train_loss": -11.594033241271973, "global_step": 264323, "epoch": 1573} {"train_loss": -11.049604415893555, "global_step": 264324, "epoch": 1573} {"train_loss": -11.707164764404297, "global_step": 264325, "epoch": 1573} {"train_loss": -11.65841293334961, "global_step": 264326, "epoch": 1573} {"train_loss": -11.038505554199219, "global_step": 264327, "epoch": 1573} {"train_loss": -12.009481430053711, "global_step": 264328, "epoch": 1573} {"train_loss": -10.252578735351562, "global_step": 264329, "epoch": 1573} {"train_loss": -10.69533920288086, "global_step": 264330, "epoch": 1573} {"train_loss": -11.581149101257324, "global_step": 264331, "epoch": 1573} {"train_loss": -10.554930686950684, "global_step": 264332, "epoch": 1573} {"train_loss": -11.816377639770508, "global_step": 264333, "epoch": 1573} {"train_loss": -10.2749662399292, "global_step": 264334, "epoch": 1573} {"train_loss": -11.633322715759277, "global_step": 264335, "epoch": 1573} {"train_loss": -11.612972259521484, "global_step": 264336, "epoch": 1573} {"train_loss": -11.062187194824219, "global_step": 264337, "epoch": 1573} {"train_loss": -11.623727798461914, "global_step": 264338, "epoch": 1573} {"train_loss": -10.71126651763916, "global_step": 264339, "epoch": 1573} {"train_loss": -11.847933769226074, "global_step": 264340, "epoch": 1573} {"train_loss": -10.953210830688477, "global_step": 264341, "epoch": 1573} {"train_loss": -11.837850570678711, "global_step": 264342, "epoch": 1573} {"train_loss": -11.343997955322266, "global_step": 264343, "epoch": 1573} {"train_loss": -10.85738754272461, "global_step": 264344, "epoch": 1573} {"train_loss": -11.532532691955566, "global_step": 264345, "epoch": 1573} {"train_loss": -11.144577026367188, "global_step": 264346, "epoch": 1573} {"train_loss": -11.916082382202148, "global_step": 264347, "epoch": 1573} {"train_loss": -11.286945343017578, "global_step": 264348, "epoch": 1573} {"train_loss": -11.931035041809082, "global_step": 264349, "epoch": 1573} {"train_loss": -11.787107467651367, "global_step": 264350, "epoch": 1573} {"train_loss": -11.374490737915039, "global_step": 264351, "epoch": 1573} {"train_loss": -11.7423677444458, "global_step": 264352, "epoch": 1573} {"train_loss": -11.719852447509766, "global_step": 264353, "epoch": 1573} {"train_loss": -11.528594970703125, "global_step": 264354, "epoch": 1573} {"train_loss": -11.934940338134766, "global_step": 264355, "epoch": 1573} {"train_loss": -11.67119026184082, "global_step": 264356, "epoch": 1573} {"train_loss": -11.986396789550781, "global_step": 264357, "epoch": 1573} {"train_loss": -11.727075576782227, "global_step": 264358, "epoch": 1573} {"train_loss": -12.013287544250488, "global_step": 264359, "epoch": 1573} {"train_loss": -11.726932525634766, "global_step": 264360, "epoch": 1573} {"train_loss": -11.806873321533203, "global_step": 264361, "epoch": 1573} {"train_loss": -11.984184265136719, "global_step": 264362, "epoch": 1573} {"train_loss": -12.04505443572998, "global_step": 264363, "epoch": 1573} {"train_loss": -12.125646591186523, "global_step": 264364, "epoch": 1573} {"train_loss": -12.065225601196289, "global_step": 264365, "epoch": 1573} {"train_loss": -11.92385196685791, "global_step": 264366, "epoch": 1573} {"train_loss": -11.958518981933594, "global_step": 264367, "epoch": 1573} {"train_loss": -11.99873161315918, "global_step": 264368, "epoch": 1573} {"train_loss": -12.057914733886719, "global_step": 264369, "epoch": 1573} {"train_loss": -12.043900489807129, "global_step": 264370, "epoch": 1573} {"train_loss": -12.03801155090332, "global_step": 264371, "epoch": 1573} {"train_loss": -12.108312606811523, "global_step": 264372, "epoch": 1573} {"train_loss": -12.16209602355957, "global_step": 264373, "epoch": 1573} {"train_loss": -11.866589546203613, "global_step": 264374, "epoch": 1573} {"train_loss": -11.948068618774414, "global_step": 264375, "epoch": 1573} {"train_loss": -11.984950065612793, "global_step": 264376, "epoch": 1573} {"train_loss": -11.967479705810547, "global_step": 264377, "epoch": 1573} {"train_loss": -12.100868225097656, "global_step": 264378, "epoch": 1573} {"train_loss": -12.195740699768066, "global_step": 264379, "epoch": 1573} {"train_loss": -12.13853645324707, "global_step": 264380, "epoch": 1573} {"train_loss": -11.9654541015625, "global_step": 264381, "epoch": 1573} {"train_loss": -12.114469528198242, "global_step": 264382, "epoch": 1573} {"train_loss": -12.098749160766602, "global_step": 264383, "epoch": 1573} {"train_loss": -12.32086181640625, "global_step": 264384, "epoch": 1573} {"train_loss": -11.875670433044434, "global_step": 264385, "epoch": 1573} {"train_loss": -11.887022018432617, "global_step": 264386, "epoch": 1573} {"train_loss": -12.014469146728516, "global_step": 264387, "epoch": 1573} {"train_loss": -12.014930725097656, "global_step": 264388, "epoch": 1573} {"train_loss": -11.994805335998535, "global_step": 264389, "epoch": 1573} {"train_loss": -11.933899879455566, "global_step": 264390, "epoch": 1573} {"train_loss": -11.89578628540039, "global_step": 264391, "epoch": 1573} {"train_loss": -11.823358535766602, "global_step": 264392, "epoch": 1573} {"train_loss": -11.894682884216309, "global_step": 264393, "epoch": 1573} {"train_loss": -11.857585906982422, "global_step": 264394, "epoch": 1573} {"train_loss": -11.63609790802002, "global_step": 264395, "epoch": 1573} {"train_loss": -11.589969635009766, "global_step": 264396, "epoch": 1573} {"train_loss": -11.175469398498535, "global_step": 264397, "epoch": 1573} {"train_loss": -12.09345817565918, "global_step": 264398, "epoch": 1573} {"train_loss": -11.633581161499023, "global_step": 264399, "epoch": 1573} {"train_loss": -12.019105911254883, "global_step": 264400, "epoch": 1573} {"train_loss": -11.000141143798828, "global_step": 264401, "epoch": 1573} {"train_loss": -12.152063369750977, "global_step": 264402, "epoch": 1573} {"train_loss": -11.148265838623047, "global_step": 264403, "epoch": 1573} {"train_loss": -11.91756820678711, "global_step": 264404, "epoch": 1573} {"train_loss": -11.340119361877441, "global_step": 264405, "epoch": 1573} {"train_loss": -11.331321716308594, "global_step": 264406, "epoch": 1573} {"train_loss": -10.751134872436523, "global_step": 264407, "epoch": 1573} {"train_loss": -10.382318496704102, "global_step": 264408, "epoch": 1573} {"train_loss": -11.07260513305664, "global_step": 264409, "epoch": 1573} {"train_loss": -9.538908958435059, "global_step": 264410, "epoch": 1573} {"train_loss": -12.137149810791016, "global_step": 264411, "epoch": 1573} {"train_loss": -10.851794242858887, "global_step": 264412, "epoch": 1573} {"train_loss": -10.846107482910156, "global_step": 264413, "epoch": 1573} {"train_loss": -11.285120010375977, "global_step": 264414, "epoch": 1573} {"train_loss": -10.857344627380371, "global_step": 264415, "epoch": 1573} {"train_loss": -11.771003723144531, "global_step": 264416, "epoch": 1573} {"train_loss": -10.657398223876953, "global_step": 264417, "epoch": 1573} {"train_loss": -11.677322387695312, "global_step": 264418, "epoch": 1573} {"train_loss": -9.990638732910156, "global_step": 264419, "epoch": 1573} {"train_loss": -11.495650291442871, "global_step": 264420, "epoch": 1573} {"train_loss": -11.193994522094727, "global_step": 264421, "epoch": 1573} {"train_loss": -11.872676849365234, "global_step": 264422, "epoch": 1573} {"train_loss": -11.134833335876465, "global_step": 264423, "epoch": 1573} {"train_loss": -11.402830123901367, "global_step": 264424, "epoch": 1573} {"train_loss": -11.479151725769043, "global_step": 264425, "epoch": 1573} {"train_loss": -11.22854995727539, "global_step": 264426, "epoch": 1573} {"train_loss": -11.789695739746094, "global_step": 264427, "epoch": 1573} {"train_loss": -11.311453819274902, "global_step": 264428, "epoch": 1573} {"train_loss": -11.393556594848633, "global_step": 264429, "epoch": 1573} {"train_loss": -11.654973030090332, "global_step": 264430, "epoch": 1573} {"train_loss": -11.683377810886928, "global_step": 264431, "epoch": 1573, "val_loss": 268553.71875} {"train_loss": -11.76106071472168, "global_step": 264432, "epoch": 1574} {"train_loss": -11.169598579406738, "global_step": 264433, "epoch": 1574} {"train_loss": -11.78294563293457, "global_step": 264434, "epoch": 1574} {"train_loss": -11.127342224121094, "global_step": 264435, "epoch": 1574} {"train_loss": -11.659626007080078, "global_step": 264436, "epoch": 1574} {"train_loss": -11.117755889892578, "global_step": 264437, "epoch": 1574} {"train_loss": -10.885494232177734, "global_step": 264438, "epoch": 1574} {"train_loss": -11.546304702758789, "global_step": 264439, "epoch": 1574} {"train_loss": -10.98383903503418, "global_step": 264440, "epoch": 1574} {"train_loss": -11.591164588928223, "global_step": 264441, "epoch": 1574} {"train_loss": -11.137458801269531, "global_step": 264442, "epoch": 1574} {"train_loss": -11.481488227844238, "global_step": 264443, "epoch": 1574} {"train_loss": -11.432493209838867, "global_step": 264444, "epoch": 1574} {"train_loss": -11.3531494140625, "global_step": 264445, "epoch": 1574} {"train_loss": -11.81417179107666, "global_step": 264446, "epoch": 1574} {"train_loss": -11.502166748046875, "global_step": 264447, "epoch": 1574} {"train_loss": -11.569694519042969, "global_step": 264448, "epoch": 1574} {"train_loss": -11.756366729736328, "global_step": 264449, "epoch": 1574} {"train_loss": -11.554155349731445, "global_step": 264450, "epoch": 1574} {"train_loss": -11.317633628845215, "global_step": 264451, "epoch": 1574} {"train_loss": -11.329557418823242, "global_step": 264452, "epoch": 1574} {"train_loss": -11.272331237792969, "global_step": 264453, "epoch": 1574} {"train_loss": -10.91245174407959, "global_step": 264454, "epoch": 1574} {"train_loss": -11.614753723144531, "global_step": 264455, "epoch": 1574} {"train_loss": -11.239155769348145, "global_step": 264456, "epoch": 1574} {"train_loss": -12.030786514282227, "global_step": 264457, "epoch": 1574} {"train_loss": -11.03702163696289, "global_step": 264458, "epoch": 1574} {"train_loss": -11.673266410827637, "global_step": 264459, "epoch": 1574} {"train_loss": -11.997098922729492, "global_step": 264460, "epoch": 1574} {"train_loss": -11.656818389892578, "global_step": 264461, "epoch": 1574} {"train_loss": -11.872170448303223, "global_step": 264462, "epoch": 1574} {"train_loss": -11.649371147155762, "global_step": 264463, "epoch": 1574} {"train_loss": -11.959907531738281, "global_step": 264464, "epoch": 1574} {"train_loss": -11.82624626159668, "global_step": 264465, "epoch": 1574} {"train_loss": -11.869268417358398, "global_step": 264466, "epoch": 1574} {"train_loss": -11.67984390258789, "global_step": 264467, "epoch": 1574} {"train_loss": -11.929654121398926, "global_step": 264468, "epoch": 1574} {"train_loss": -11.995614051818848, "global_step": 264469, "epoch": 1574} {"train_loss": -11.760552406311035, "global_step": 264470, "epoch": 1574} {"train_loss": -11.942584991455078, "global_step": 264471, "epoch": 1574} {"train_loss": -11.662922859191895, "global_step": 264472, "epoch": 1574} {"train_loss": -11.99581527709961, "global_step": 264473, "epoch": 1574} {"train_loss": -11.601284980773926, "global_step": 264474, "epoch": 1574} {"train_loss": -12.108421325683594, "global_step": 264475, "epoch": 1574} {"train_loss": -12.135305404663086, "global_step": 264476, "epoch": 1574} {"train_loss": -11.646873474121094, "global_step": 264477, "epoch": 1574} {"train_loss": -12.001277923583984, "global_step": 264478, "epoch": 1574} {"train_loss": -11.936283111572266, "global_step": 264479, "epoch": 1574} {"train_loss": -11.752225875854492, "global_step": 264480, "epoch": 1574} {"train_loss": -11.900562286376953, "global_step": 264481, "epoch": 1574} {"train_loss": -11.707523345947266, "global_step": 264482, "epoch": 1574} {"train_loss": -11.886490821838379, "global_step": 264483, "epoch": 1574} {"train_loss": -11.836420059204102, "global_step": 264484, "epoch": 1574} {"train_loss": -11.867238998413086, "global_step": 264485, "epoch": 1574} {"train_loss": -11.82815170288086, "global_step": 264486, "epoch": 1574} {"train_loss": -11.913156509399414, "global_step": 264487, "epoch": 1574} {"train_loss": -11.932631492614746, "global_step": 264488, "epoch": 1574} {"train_loss": -12.221537590026855, "global_step": 264489, "epoch": 1574} {"train_loss": -12.180368423461914, "global_step": 264490, "epoch": 1574} {"train_loss": -12.213455200195312, "global_step": 264491, "epoch": 1574} {"train_loss": -12.309812545776367, "global_step": 264492, "epoch": 1574} {"train_loss": -12.12104606628418, "global_step": 264493, "epoch": 1574} {"train_loss": -12.236137390136719, "global_step": 264494, "epoch": 1574} {"train_loss": -12.113882064819336, "global_step": 264495, "epoch": 1574} {"train_loss": -12.343908309936523, "global_step": 264496, "epoch": 1574} {"train_loss": -12.34378433227539, "global_step": 264497, "epoch": 1574} {"train_loss": -12.354790687561035, "global_step": 264498, "epoch": 1574} {"train_loss": -12.23725700378418, "global_step": 264499, "epoch": 1574} {"train_loss": -12.228948593139648, "global_step": 264500, "epoch": 1574} {"train_loss": -12.20359992980957, "global_step": 264501, "epoch": 1574} {"train_loss": -12.270218849182129, "global_step": 264502, "epoch": 1574} {"train_loss": -12.360015869140625, "global_step": 264503, "epoch": 1574} {"train_loss": -12.165443420410156, "global_step": 264504, "epoch": 1574} {"train_loss": -12.213164329528809, "global_step": 264505, "epoch": 1574} {"train_loss": -12.188336372375488, "global_step": 264506, "epoch": 1574} {"train_loss": -12.11634635925293, "global_step": 264507, "epoch": 1574} {"train_loss": -12.306350708007812, "global_step": 264508, "epoch": 1574} {"train_loss": -12.264396667480469, "global_step": 264509, "epoch": 1574} {"train_loss": -12.319822311401367, "global_step": 264510, "epoch": 1574} {"train_loss": -12.223392486572266, "global_step": 264511, "epoch": 1574} {"train_loss": -12.044401168823242, "global_step": 264512, "epoch": 1574} {"train_loss": -12.17723560333252, "global_step": 264513, "epoch": 1574} {"train_loss": -12.182819366455078, "global_step": 264514, "epoch": 1574} {"train_loss": -12.094308853149414, "global_step": 264515, "epoch": 1574} {"train_loss": -12.067428588867188, "global_step": 264516, "epoch": 1574} {"train_loss": -11.652923583984375, "global_step": 264517, "epoch": 1574} {"train_loss": -11.15970230102539, "global_step": 264518, "epoch": 1574} {"train_loss": -11.673418045043945, "global_step": 264519, "epoch": 1574} {"train_loss": -11.546089172363281, "global_step": 264520, "epoch": 1574} {"train_loss": -9.865215301513672, "global_step": 264521, "epoch": 1574} {"train_loss": -9.012558937072754, "global_step": 264522, "epoch": 1574} {"train_loss": -10.82283878326416, "global_step": 264523, "epoch": 1574} {"train_loss": -6.814001083374023, "global_step": 264524, "epoch": 1574} {"train_loss": -7.6349029541015625, "global_step": 264525, "epoch": 1574} {"train_loss": -8.484682083129883, "global_step": 264526, "epoch": 1574} {"train_loss": -7.073031902313232, "global_step": 264527, "epoch": 1574} {"train_loss": -9.096583366394043, "global_step": 264528, "epoch": 1574} {"train_loss": -7.039595603942871, "global_step": 264529, "epoch": 1574} {"train_loss": -7.153144836425781, "global_step": 264530, "epoch": 1574} {"train_loss": -8.081933975219727, "global_step": 264531, "epoch": 1574} {"train_loss": -9.96946907043457, "global_step": 264532, "epoch": 1574} {"train_loss": -9.05034351348877, "global_step": 264533, "epoch": 1574} {"train_loss": -8.471004486083984, "global_step": 264534, "epoch": 1574} {"train_loss": -9.422710418701172, "global_step": 264535, "epoch": 1574} {"train_loss": -10.94644546508789, "global_step": 264536, "epoch": 1574} {"train_loss": -9.035832405090332, "global_step": 264537, "epoch": 1574} {"train_loss": -10.670570373535156, "global_step": 264538, "epoch": 1574} {"train_loss": -10.495912551879883, "global_step": 264539, "epoch": 1574} {"train_loss": -10.114286422729492, "global_step": 264540, "epoch": 1574} {"train_loss": -10.862313270568848, "global_step": 264541, "epoch": 1574} {"train_loss": -11.085367202758789, "global_step": 264542, "epoch": 1574} {"train_loss": -9.616077423095703, "global_step": 264543, "epoch": 1574} {"train_loss": -10.659266471862793, "global_step": 264544, "epoch": 1574} {"train_loss": -10.769021034240723, "global_step": 264545, "epoch": 1574} {"train_loss": -9.833951950073242, "global_step": 264546, "epoch": 1574} {"train_loss": -11.144152641296387, "global_step": 264547, "epoch": 1574} {"train_loss": -10.61097526550293, "global_step": 264548, "epoch": 1574} {"train_loss": -10.95566463470459, "global_step": 264549, "epoch": 1574} {"train_loss": -11.00134563446045, "global_step": 264550, "epoch": 1574} {"train_loss": -11.242724418640137, "global_step": 264551, "epoch": 1574} {"train_loss": -10.92109489440918, "global_step": 264552, "epoch": 1574} {"train_loss": -11.446046829223633, "global_step": 264553, "epoch": 1574} {"train_loss": -11.674941062927246, "global_step": 264554, "epoch": 1574} {"train_loss": -11.2722806930542, "global_step": 264555, "epoch": 1574} {"train_loss": -11.473058700561523, "global_step": 264556, "epoch": 1574} {"train_loss": -11.422834396362305, "global_step": 264557, "epoch": 1574} {"train_loss": -11.211729049682617, "global_step": 264558, "epoch": 1574} {"train_loss": -11.434890747070312, "global_step": 264559, "epoch": 1574} {"train_loss": -11.51374626159668, "global_step": 264560, "epoch": 1574} {"train_loss": -11.405769348144531, "global_step": 264561, "epoch": 1574} {"train_loss": -11.653630256652832, "global_step": 264562, "epoch": 1574} {"train_loss": -11.733846664428711, "global_step": 264563, "epoch": 1574} {"train_loss": -11.580992698669434, "global_step": 264564, "epoch": 1574} {"train_loss": -11.684022903442383, "global_step": 264565, "epoch": 1574} {"train_loss": -11.645378112792969, "global_step": 264566, "epoch": 1574} {"train_loss": -11.464503288269043, "global_step": 264567, "epoch": 1574} {"train_loss": -11.77952766418457, "global_step": 264568, "epoch": 1574} {"train_loss": -11.53757095336914, "global_step": 264569, "epoch": 1574} {"train_loss": -11.637728691101074, "global_step": 264570, "epoch": 1574} {"train_loss": -11.77856159210205, "global_step": 264571, "epoch": 1574} {"train_loss": -11.621411323547363, "global_step": 264572, "epoch": 1574} {"train_loss": -11.798222541809082, "global_step": 264573, "epoch": 1574} {"train_loss": -11.572785377502441, "global_step": 264574, "epoch": 1574} {"train_loss": -11.559764862060547, "global_step": 264575, "epoch": 1574} {"train_loss": -11.725923538208008, "global_step": 264576, "epoch": 1574} {"train_loss": -11.463285446166992, "global_step": 264577, "epoch": 1574} {"train_loss": -11.573724746704102, "global_step": 264578, "epoch": 1574} {"train_loss": -11.790151596069336, "global_step": 264579, "epoch": 1574} {"train_loss": -11.669656753540039, "global_step": 264580, "epoch": 1574} {"train_loss": -11.590702056884766, "global_step": 264581, "epoch": 1574} {"train_loss": -11.716418266296387, "global_step": 264582, "epoch": 1574} {"train_loss": -11.745875358581543, "global_step": 264583, "epoch": 1574} {"train_loss": -12.063643455505371, "global_step": 264584, "epoch": 1574} {"train_loss": -11.536062240600586, "global_step": 264585, "epoch": 1574} {"train_loss": -11.723735809326172, "global_step": 264586, "epoch": 1574} {"train_loss": -11.92397689819336, "global_step": 264587, "epoch": 1574} {"train_loss": -11.779109954833984, "global_step": 264588, "epoch": 1574} {"train_loss": -11.694232940673828, "global_step": 264589, "epoch": 1574} {"train_loss": -11.952901840209961, "global_step": 264590, "epoch": 1574} {"train_loss": -11.702425003051758, "global_step": 264591, "epoch": 1574} {"train_loss": -11.721273422241211, "global_step": 264592, "epoch": 1574} {"train_loss": -12.022680282592773, "global_step": 264593, "epoch": 1574} {"train_loss": -11.945984840393066, "global_step": 264594, "epoch": 1574} {"train_loss": -11.730408668518066, "global_step": 264595, "epoch": 1574} {"train_loss": -11.934623718261719, "global_step": 264596, "epoch": 1574} {"train_loss": -11.77617359161377, "global_step": 264597, "epoch": 1574} {"train_loss": -11.89423942565918, "global_step": 264598, "epoch": 1574} {"train_loss": -11.357228236539024, "global_step": 264599, "epoch": 1574, "val_loss": 264821.84375} {"train_loss": -11.888532638549805, "global_step": 264600, "epoch": 1575} {"train_loss": -12.059951782226562, "global_step": 264601, "epoch": 1575} {"train_loss": -11.79597282409668, "global_step": 264602, "epoch": 1575} {"train_loss": -12.00220012664795, "global_step": 264603, "epoch": 1575} {"train_loss": -11.892898559570312, "global_step": 264604, "epoch": 1575} {"train_loss": -11.926803588867188, "global_step": 264605, "epoch": 1575} {"train_loss": -11.663320541381836, "global_step": 264606, "epoch": 1575} {"train_loss": -11.843694686889648, "global_step": 264607, "epoch": 1575} {"train_loss": -11.845991134643555, "global_step": 264608, "epoch": 1575} {"train_loss": -12.065418243408203, "global_step": 264609, "epoch": 1575} {"train_loss": -11.93239974975586, "global_step": 264610, "epoch": 1575} {"train_loss": -12.201826095581055, "global_step": 264611, "epoch": 1575} {"train_loss": -12.157524108886719, "global_step": 264612, "epoch": 1575} {"train_loss": -12.052194595336914, "global_step": 264613, "epoch": 1575} {"train_loss": -11.873276710510254, "global_step": 264614, "epoch": 1575} {"train_loss": -12.16617488861084, "global_step": 264615, "epoch": 1575} {"train_loss": -12.141923904418945, "global_step": 264616, "epoch": 1575} {"train_loss": -12.14466667175293, "global_step": 264617, "epoch": 1575} {"train_loss": -11.893247604370117, "global_step": 264618, "epoch": 1575} {"train_loss": -12.186782836914062, "global_step": 264619, "epoch": 1575} {"train_loss": -12.082348823547363, "global_step": 264620, "epoch": 1575} {"train_loss": -12.158889770507812, "global_step": 264621, "epoch": 1575} {"train_loss": -12.028341293334961, "global_step": 264622, "epoch": 1575} {"train_loss": -12.299444198608398, "global_step": 264623, "epoch": 1575} {"train_loss": -11.958100318908691, "global_step": 264624, "epoch": 1575} {"train_loss": -11.732157707214355, "global_step": 264625, "epoch": 1575} {"train_loss": -11.897138595581055, "global_step": 264626, "epoch": 1575} {"train_loss": -12.136507034301758, "global_step": 264627, "epoch": 1575} {"train_loss": -11.362547874450684, "global_step": 264628, "epoch": 1575} {"train_loss": -11.000638961791992, "global_step": 264629, "epoch": 1575} {"train_loss": -12.012786865234375, "global_step": 264630, "epoch": 1575} {"train_loss": -11.035773277282715, "global_step": 264631, "epoch": 1575} {"train_loss": -11.267223358154297, "global_step": 264632, "epoch": 1575} {"train_loss": -11.95175838470459, "global_step": 264633, "epoch": 1575} {"train_loss": -11.2636137008667, "global_step": 264634, "epoch": 1575} {"train_loss": -11.678948402404785, "global_step": 264635, "epoch": 1575} {"train_loss": -11.155572891235352, "global_step": 264636, "epoch": 1575} {"train_loss": -10.533446311950684, "global_step": 264637, "epoch": 1575} {"train_loss": -11.493780136108398, "global_step": 264638, "epoch": 1575} {"train_loss": -11.111673355102539, "global_step": 264639, "epoch": 1575} {"train_loss": -11.302877426147461, "global_step": 264640, "epoch": 1575} {"train_loss": -11.709884643554688, "global_step": 264641, "epoch": 1575} {"train_loss": -11.13355827331543, "global_step": 264642, "epoch": 1575} {"train_loss": -10.668143272399902, "global_step": 264643, "epoch": 1575} {"train_loss": -11.408781051635742, "global_step": 264644, "epoch": 1575} {"train_loss": -10.463623046875, "global_step": 264645, "epoch": 1575} {"train_loss": -11.097110748291016, "global_step": 264646, "epoch": 1575} {"train_loss": -11.427319526672363, "global_step": 264647, "epoch": 1575} {"train_loss": -11.085705757141113, "global_step": 264648, "epoch": 1575} {"train_loss": -11.051263809204102, "global_step": 264649, "epoch": 1575} {"train_loss": -10.837590217590332, "global_step": 264650, "epoch": 1575} {"train_loss": -11.411914825439453, "global_step": 264651, "epoch": 1575} {"train_loss": -11.136628150939941, "global_step": 264652, "epoch": 1575} {"train_loss": -11.788178443908691, "global_step": 264653, "epoch": 1575} {"train_loss": -11.118412017822266, "global_step": 264654, "epoch": 1575} {"train_loss": -11.532093048095703, "global_step": 264655, "epoch": 1575} {"train_loss": -10.635702133178711, "global_step": 264656, "epoch": 1575} {"train_loss": -11.633964538574219, "global_step": 264657, "epoch": 1575} {"train_loss": -10.78952407836914, "global_step": 264658, "epoch": 1575} {"train_loss": -10.933074951171875, "global_step": 264659, "epoch": 1575} {"train_loss": -10.672761917114258, "global_step": 264660, "epoch": 1575} {"train_loss": -10.7549409866333, "global_step": 264661, "epoch": 1575} {"train_loss": -11.059117317199707, "global_step": 264662, "epoch": 1575} {"train_loss": -11.046928405761719, "global_step": 264663, "epoch": 1575} {"train_loss": -11.494531631469727, "global_step": 264664, "epoch": 1575} {"train_loss": -11.092267036437988, "global_step": 264665, "epoch": 1575} {"train_loss": -11.414047241210938, "global_step": 264666, "epoch": 1575} {"train_loss": -11.568479537963867, "global_step": 264667, "epoch": 1575} {"train_loss": -11.621621131896973, "global_step": 264668, "epoch": 1575} {"train_loss": -11.702455520629883, "global_step": 264669, "epoch": 1575} {"train_loss": -11.741600036621094, "global_step": 264670, "epoch": 1575} {"train_loss": -11.259828567504883, "global_step": 264671, "epoch": 1575} {"train_loss": -11.622949600219727, "global_step": 264672, "epoch": 1575} {"train_loss": -11.076251029968262, "global_step": 264673, "epoch": 1575} {"train_loss": -12.060007095336914, "global_step": 264674, "epoch": 1575} {"train_loss": -11.439013481140137, "global_step": 264675, "epoch": 1575} {"train_loss": -11.874536514282227, "global_step": 264676, "epoch": 1575} {"train_loss": -11.852909088134766, "global_step": 264677, "epoch": 1575} {"train_loss": -11.742176055908203, "global_step": 264678, "epoch": 1575} {"train_loss": -12.054044723510742, "global_step": 264679, "epoch": 1575} {"train_loss": -11.632123947143555, "global_step": 264680, "epoch": 1575} {"train_loss": -12.078575134277344, "global_step": 264681, "epoch": 1575} {"train_loss": -11.928326606750488, "global_step": 264682, "epoch": 1575} {"train_loss": -11.734796524047852, "global_step": 264683, "epoch": 1575} {"train_loss": -11.973548889160156, "global_step": 264684, "epoch": 1575} {"train_loss": -11.906757354736328, "global_step": 264685, "epoch": 1575} {"train_loss": -12.027750968933105, "global_step": 264686, "epoch": 1575} {"train_loss": -11.83145523071289, "global_step": 264687, "epoch": 1575} {"train_loss": -12.047800064086914, "global_step": 264688, "epoch": 1575} {"train_loss": -11.980961799621582, "global_step": 264689, "epoch": 1575} {"train_loss": -11.919936180114746, "global_step": 264690, "epoch": 1575} {"train_loss": -12.067804336547852, "global_step": 264691, "epoch": 1575} {"train_loss": -11.911954879760742, "global_step": 264692, "epoch": 1575} {"train_loss": -11.949714660644531, "global_step": 264693, "epoch": 1575} {"train_loss": -12.232677459716797, "global_step": 264694, "epoch": 1575} {"train_loss": -12.069324493408203, "global_step": 264695, "epoch": 1575} {"train_loss": -12.115970611572266, "global_step": 264696, "epoch": 1575} {"train_loss": -12.079753875732422, "global_step": 264697, "epoch": 1575} {"train_loss": -12.181859970092773, "global_step": 264698, "epoch": 1575} {"train_loss": -11.9188814163208, "global_step": 264699, "epoch": 1575} {"train_loss": -11.98182487487793, "global_step": 264700, "epoch": 1575} {"train_loss": -11.972322463989258, "global_step": 264701, "epoch": 1575} {"train_loss": -12.078685760498047, "global_step": 264702, "epoch": 1575} {"train_loss": -12.135553359985352, "global_step": 264703, "epoch": 1575} {"train_loss": -12.007296562194824, "global_step": 264704, "epoch": 1575} {"train_loss": -12.110334396362305, "global_step": 264705, "epoch": 1575} {"train_loss": -12.14360237121582, "global_step": 264706, "epoch": 1575} {"train_loss": -11.937797546386719, "global_step": 264707, "epoch": 1575} {"train_loss": -12.082283973693848, "global_step": 264708, "epoch": 1575} {"train_loss": -11.952388763427734, "global_step": 264709, "epoch": 1575} {"train_loss": -12.220863342285156, "global_step": 264710, "epoch": 1575} {"train_loss": -12.301399230957031, "global_step": 264711, "epoch": 1575} {"train_loss": -12.129413604736328, "global_step": 264712, "epoch": 1575} {"train_loss": -12.043170928955078, "global_step": 264713, "epoch": 1575} {"train_loss": -12.2027587890625, "global_step": 264714, "epoch": 1575} {"train_loss": -12.427687644958496, "global_step": 264715, "epoch": 1575} {"train_loss": -12.453307151794434, "global_step": 264716, "epoch": 1575} {"train_loss": -12.256166458129883, "global_step": 264717, "epoch": 1575} {"train_loss": -12.20505428314209, "global_step": 264718, "epoch": 1575} {"train_loss": -12.171526908874512, "global_step": 264719, "epoch": 1575} {"train_loss": -12.127557754516602, "global_step": 264720, "epoch": 1575} {"train_loss": -12.08997631072998, "global_step": 264721, "epoch": 1575} {"train_loss": -12.198918342590332, "global_step": 264722, "epoch": 1575} {"train_loss": -12.025301933288574, "global_step": 264723, "epoch": 1575} {"train_loss": -12.162149429321289, "global_step": 264724, "epoch": 1575} {"train_loss": -11.435806274414062, "global_step": 264725, "epoch": 1575} {"train_loss": -11.6314697265625, "global_step": 264726, "epoch": 1575} {"train_loss": -12.478986740112305, "global_step": 264727, "epoch": 1575} {"train_loss": -12.181714057922363, "global_step": 264728, "epoch": 1575} {"train_loss": -11.454504013061523, "global_step": 264729, "epoch": 1575} {"train_loss": -11.424111366271973, "global_step": 264730, "epoch": 1575} {"train_loss": -12.174118041992188, "global_step": 264731, "epoch": 1575} {"train_loss": -12.162181854248047, "global_step": 264732, "epoch": 1575} {"train_loss": -12.398295402526855, "global_step": 264733, "epoch": 1575} {"train_loss": -12.2764892578125, "global_step": 264734, "epoch": 1575} {"train_loss": -12.080946922302246, "global_step": 264735, "epoch": 1575} {"train_loss": -12.194823265075684, "global_step": 264736, "epoch": 1575} {"train_loss": -12.300640106201172, "global_step": 264737, "epoch": 1575} {"train_loss": -12.362014770507812, "global_step": 264738, "epoch": 1575} {"train_loss": -11.905664443969727, "global_step": 264739, "epoch": 1575} {"train_loss": -11.948925971984863, "global_step": 264740, "epoch": 1575} {"train_loss": -12.149681091308594, "global_step": 264741, "epoch": 1575} {"train_loss": -12.025274276733398, "global_step": 264742, "epoch": 1575} {"train_loss": -12.112581253051758, "global_step": 264743, "epoch": 1575} {"train_loss": -11.658766746520996, "global_step": 264744, "epoch": 1575} {"train_loss": -11.687609672546387, "global_step": 264745, "epoch": 1575} {"train_loss": -12.152870178222656, "global_step": 264746, "epoch": 1575} {"train_loss": -11.490867614746094, "global_step": 264747, "epoch": 1575} {"train_loss": -11.512513160705566, "global_step": 264748, "epoch": 1575} {"train_loss": -11.854484558105469, "global_step": 264749, "epoch": 1575} {"train_loss": -12.097527503967285, "global_step": 264750, "epoch": 1575} {"train_loss": -10.249112129211426, "global_step": 264751, "epoch": 1575} {"train_loss": -10.808307647705078, "global_step": 264752, "epoch": 1575} {"train_loss": -11.853524208068848, "global_step": 264753, "epoch": 1575} {"train_loss": -10.011249542236328, "global_step": 264754, "epoch": 1575} {"train_loss": -10.199923515319824, "global_step": 264755, "epoch": 1575} {"train_loss": -11.001565933227539, "global_step": 264756, "epoch": 1575} {"train_loss": -10.36559772491455, "global_step": 264757, "epoch": 1575} {"train_loss": -9.743813514709473, "global_step": 264758, "epoch": 1575} {"train_loss": -9.789802551269531, "global_step": 264759, "epoch": 1575} {"train_loss": -10.014399528503418, "global_step": 264760, "epoch": 1575} {"train_loss": -9.723943710327148, "global_step": 264761, "epoch": 1575} {"train_loss": -10.128596305847168, "global_step": 264762, "epoch": 1575} {"train_loss": -11.099069595336914, "global_step": 264763, "epoch": 1575} {"train_loss": -9.414731979370117, "global_step": 264764, "epoch": 1575} {"train_loss": -11.025832176208496, "global_step": 264765, "epoch": 1575} {"train_loss": -9.44202995300293, "global_step": 264766, "epoch": 1575} {"train_loss": -11.630165134157453, "global_step": 264767, "epoch": 1575, "val_loss": 272075.875, "train_action_mse_error": 2.471900463104248} {"train_loss": -10.142803192138672, "global_step": 264768, "epoch": 1576} {"train_loss": -10.795219421386719, "global_step": 264769, "epoch": 1576} {"train_loss": -10.988449096679688, "global_step": 264770, "epoch": 1576} {"train_loss": -10.725570678710938, "global_step": 264771, "epoch": 1576} {"train_loss": -10.570547103881836, "global_step": 264772, "epoch": 1576} {"train_loss": -10.915952682495117, "global_step": 264773, "epoch": 1576} {"train_loss": -10.385417938232422, "global_step": 264774, "epoch": 1576} {"train_loss": -10.593498229980469, "global_step": 264775, "epoch": 1576} {"train_loss": -10.629735946655273, "global_step": 264776, "epoch": 1576} {"train_loss": -11.046089172363281, "global_step": 264777, "epoch": 1576} {"train_loss": -10.856363296508789, "global_step": 264778, "epoch": 1576} {"train_loss": -11.157289505004883, "global_step": 264779, "epoch": 1576} {"train_loss": -10.391735076904297, "global_step": 264780, "epoch": 1576} {"train_loss": -11.386290550231934, "global_step": 264781, "epoch": 1576} {"train_loss": -10.119551658630371, "global_step": 264782, "epoch": 1576} {"train_loss": -11.365205764770508, "global_step": 264783, "epoch": 1576} {"train_loss": -10.644933700561523, "global_step": 264784, "epoch": 1576} {"train_loss": -11.42234992980957, "global_step": 264785, "epoch": 1576} {"train_loss": -11.097947120666504, "global_step": 264786, "epoch": 1576} {"train_loss": -11.549942016601562, "global_step": 264787, "epoch": 1576} {"train_loss": -10.97056770324707, "global_step": 264788, "epoch": 1576} {"train_loss": -11.26356315612793, "global_step": 264789, "epoch": 1576} {"train_loss": -11.006357192993164, "global_step": 264790, "epoch": 1576} {"train_loss": -11.37921142578125, "global_step": 264791, "epoch": 1576} {"train_loss": -10.605304718017578, "global_step": 264792, "epoch": 1576} {"train_loss": -11.600085258483887, "global_step": 264793, "epoch": 1576} {"train_loss": -10.662212371826172, "global_step": 264794, "epoch": 1576} {"train_loss": -11.527382850646973, "global_step": 264795, "epoch": 1576} {"train_loss": -10.730020523071289, "global_step": 264796, "epoch": 1576} {"train_loss": -10.81309700012207, "global_step": 264797, "epoch": 1576} {"train_loss": -11.481483459472656, "global_step": 264798, "epoch": 1576} {"train_loss": -11.320340156555176, "global_step": 264799, "epoch": 1576} {"train_loss": -11.473968505859375, "global_step": 264800, "epoch": 1576} {"train_loss": -11.447454452514648, "global_step": 264801, "epoch": 1576} {"train_loss": -11.657395362854004, "global_step": 264802, "epoch": 1576} {"train_loss": -11.530902862548828, "global_step": 264803, "epoch": 1576} {"train_loss": -11.698345184326172, "global_step": 264804, "epoch": 1576} {"train_loss": -11.43429183959961, "global_step": 264805, "epoch": 1576} {"train_loss": -11.7303466796875, "global_step": 264806, "epoch": 1576} {"train_loss": -11.77830696105957, "global_step": 264807, "epoch": 1576} {"train_loss": -11.825706481933594, "global_step": 264808, "epoch": 1576} {"train_loss": -11.809175491333008, "global_step": 264809, "epoch": 1576} {"train_loss": -11.910905838012695, "global_step": 264810, "epoch": 1576} {"train_loss": -11.795282363891602, "global_step": 264811, "epoch": 1576} {"train_loss": -11.733108520507812, "global_step": 264812, "epoch": 1576} {"train_loss": -11.658467292785645, "global_step": 264813, "epoch": 1576} {"train_loss": -11.893562316894531, "global_step": 264814, "epoch": 1576} {"train_loss": -11.840376853942871, "global_step": 264815, "epoch": 1576} {"train_loss": -11.903420448303223, "global_step": 264816, "epoch": 1576} {"train_loss": -12.01024055480957, "global_step": 264817, "epoch": 1576} {"train_loss": -12.024478912353516, "global_step": 264818, "epoch": 1576} {"train_loss": -12.16855239868164, "global_step": 264819, "epoch": 1576} {"train_loss": -12.054975509643555, "global_step": 264820, "epoch": 1576} {"train_loss": -11.809612274169922, "global_step": 264821, "epoch": 1576} {"train_loss": -12.062047958374023, "global_step": 264822, "epoch": 1576} {"train_loss": -12.101722717285156, "global_step": 264823, "epoch": 1576} {"train_loss": -12.133800506591797, "global_step": 264824, "epoch": 1576} {"train_loss": -12.037184715270996, "global_step": 264825, "epoch": 1576} {"train_loss": -12.008565902709961, "global_step": 264826, "epoch": 1576} {"train_loss": -12.214247703552246, "global_step": 264827, "epoch": 1576} {"train_loss": -12.20358943939209, "global_step": 264828, "epoch": 1576} {"train_loss": -11.96271800994873, "global_step": 264829, "epoch": 1576} {"train_loss": -12.06794261932373, "global_step": 264830, "epoch": 1576} {"train_loss": -12.02984619140625, "global_step": 264831, "epoch": 1576} {"train_loss": -12.142714500427246, "global_step": 264832, "epoch": 1576} {"train_loss": -12.129947662353516, "global_step": 264833, "epoch": 1576} {"train_loss": -11.946444511413574, "global_step": 264834, "epoch": 1576} {"train_loss": -12.153480529785156, "global_step": 264835, "epoch": 1576} {"train_loss": -12.20942497253418, "global_step": 264836, "epoch": 1576} {"train_loss": -12.231714248657227, "global_step": 264837, "epoch": 1576} {"train_loss": -12.097417831420898, "global_step": 264838, "epoch": 1576} {"train_loss": -12.195453643798828, "global_step": 264839, "epoch": 1576} {"train_loss": -12.211431503295898, "global_step": 264840, "epoch": 1576} {"train_loss": -12.254724502563477, "global_step": 264841, "epoch": 1576} {"train_loss": -12.064732551574707, "global_step": 264842, "epoch": 1576} {"train_loss": -12.325783729553223, "global_step": 264843, "epoch": 1576} {"train_loss": -12.197275161743164, "global_step": 264844, "epoch": 1576} {"train_loss": -12.165863037109375, "global_step": 264845, "epoch": 1576} {"train_loss": -12.276811599731445, "global_step": 264846, "epoch": 1576} {"train_loss": -12.357657432556152, "global_step": 264847, "epoch": 1576} {"train_loss": -12.269198417663574, "global_step": 264848, "epoch": 1576} {"train_loss": -12.409591674804688, "global_step": 264849, "epoch": 1576} {"train_loss": -12.307258605957031, "global_step": 264850, "epoch": 1576} {"train_loss": -12.260702133178711, "global_step": 264851, "epoch": 1576} {"train_loss": -12.203689575195312, "global_step": 264852, "epoch": 1576} {"train_loss": -12.372391700744629, "global_step": 264853, "epoch": 1576} {"train_loss": -12.283102035522461, "global_step": 264854, "epoch": 1576} {"train_loss": -12.405195236206055, "global_step": 264855, "epoch": 1576} {"train_loss": -12.464479446411133, "global_step": 264856, "epoch": 1576} {"train_loss": -12.319668769836426, "global_step": 264857, "epoch": 1576} {"train_loss": -12.065656661987305, "global_step": 264858, "epoch": 1576} {"train_loss": -12.307464599609375, "global_step": 264859, "epoch": 1576} {"train_loss": -12.30023193359375, "global_step": 264860, "epoch": 1576} {"train_loss": -12.372434616088867, "global_step": 264861, "epoch": 1576} {"train_loss": -12.446313858032227, "global_step": 264862, "epoch": 1576} {"train_loss": -11.827463150024414, "global_step": 264863, "epoch": 1576} {"train_loss": -12.394004821777344, "global_step": 264864, "epoch": 1576} {"train_loss": -12.478511810302734, "global_step": 264865, "epoch": 1576} {"train_loss": -11.936248779296875, "global_step": 264866, "epoch": 1576} {"train_loss": -12.309228897094727, "global_step": 264867, "epoch": 1576} {"train_loss": -11.93061351776123, "global_step": 264868, "epoch": 1576} {"train_loss": -12.392221450805664, "global_step": 264869, "epoch": 1576} {"train_loss": -12.205589294433594, "global_step": 264870, "epoch": 1576} {"train_loss": -12.081971168518066, "global_step": 264871, "epoch": 1576} {"train_loss": -12.48116683959961, "global_step": 264872, "epoch": 1576} {"train_loss": -12.23049545288086, "global_step": 264873, "epoch": 1576} {"train_loss": -12.182733535766602, "global_step": 264874, "epoch": 1576} {"train_loss": -12.463685035705566, "global_step": 264875, "epoch": 1576} {"train_loss": -11.990455627441406, "global_step": 264876, "epoch": 1576} {"train_loss": -12.341861724853516, "global_step": 264877, "epoch": 1576} {"train_loss": -12.303201675415039, "global_step": 264878, "epoch": 1576} {"train_loss": -12.149163246154785, "global_step": 264879, "epoch": 1576} {"train_loss": -12.170713424682617, "global_step": 264880, "epoch": 1576} {"train_loss": -12.311013221740723, "global_step": 264881, "epoch": 1576} {"train_loss": -12.061915397644043, "global_step": 264882, "epoch": 1576} {"train_loss": -12.007373809814453, "global_step": 264883, "epoch": 1576} {"train_loss": -11.860742568969727, "global_step": 264884, "epoch": 1576} {"train_loss": -12.055408477783203, "global_step": 264885, "epoch": 1576} {"train_loss": -12.033716201782227, "global_step": 264886, "epoch": 1576} {"train_loss": -12.181215286254883, "global_step": 264887, "epoch": 1576} {"train_loss": -11.520641326904297, "global_step": 264888, "epoch": 1576} {"train_loss": -10.671552658081055, "global_step": 264889, "epoch": 1576} {"train_loss": -10.7129487991333, "global_step": 264890, "epoch": 1576} {"train_loss": -11.313411712646484, "global_step": 264891, "epoch": 1576} {"train_loss": -11.754246711730957, "global_step": 264892, "epoch": 1576} {"train_loss": -10.823652267456055, "global_step": 264893, "epoch": 1576} {"train_loss": -9.642090797424316, "global_step": 264894, "epoch": 1576} {"train_loss": -11.351325035095215, "global_step": 264895, "epoch": 1576} {"train_loss": -11.572449684143066, "global_step": 264896, "epoch": 1576} {"train_loss": -11.690031051635742, "global_step": 264897, "epoch": 1576} {"train_loss": -10.919157981872559, "global_step": 264898, "epoch": 1576} {"train_loss": -10.72214412689209, "global_step": 264899, "epoch": 1576} {"train_loss": -11.12734603881836, "global_step": 264900, "epoch": 1576} {"train_loss": -11.368391990661621, "global_step": 264901, "epoch": 1576} {"train_loss": -11.926607131958008, "global_step": 264902, "epoch": 1576} {"train_loss": -10.607063293457031, "global_step": 264903, "epoch": 1576} {"train_loss": -11.253817558288574, "global_step": 264904, "epoch": 1576} {"train_loss": -10.568517684936523, "global_step": 264905, "epoch": 1576} {"train_loss": -11.313234329223633, "global_step": 264906, "epoch": 1576} {"train_loss": -10.89564037322998, "global_step": 264907, "epoch": 1576} {"train_loss": -11.542387008666992, "global_step": 264908, "epoch": 1576} {"train_loss": -10.348339080810547, "global_step": 264909, "epoch": 1576} {"train_loss": -11.178452491760254, "global_step": 264910, "epoch": 1576} {"train_loss": -11.025471687316895, "global_step": 264911, "epoch": 1576} {"train_loss": -9.547607421875, "global_step": 264912, "epoch": 1576} {"train_loss": -10.862997055053711, "global_step": 264913, "epoch": 1576} {"train_loss": -10.31411361694336, "global_step": 264914, "epoch": 1576} {"train_loss": -10.6140718460083, "global_step": 264915, "epoch": 1576} {"train_loss": -10.158793449401855, "global_step": 264916, "epoch": 1576} {"train_loss": -10.153564453125, "global_step": 264917, "epoch": 1576} {"train_loss": -10.942349433898926, "global_step": 264918, "epoch": 1576} {"train_loss": -10.733436584472656, "global_step": 264919, "epoch": 1576} {"train_loss": -11.226983070373535, "global_step": 264920, "epoch": 1576} {"train_loss": -11.461402893066406, "global_step": 264921, "epoch": 1576} {"train_loss": -10.835588455200195, "global_step": 264922, "epoch": 1576} {"train_loss": -11.431644439697266, "global_step": 264923, "epoch": 1576} {"train_loss": -11.174410820007324, "global_step": 264924, "epoch": 1576} {"train_loss": -11.049464225769043, "global_step": 264925, "epoch": 1576} {"train_loss": -11.511077880859375, "global_step": 264926, "epoch": 1576} {"train_loss": -11.224843978881836, "global_step": 264927, "epoch": 1576} {"train_loss": -11.792217254638672, "global_step": 264928, "epoch": 1576} {"train_loss": -11.397653579711914, "global_step": 264929, "epoch": 1576} {"train_loss": -11.710412979125977, "global_step": 264930, "epoch": 1576} {"train_loss": -11.741639137268066, "global_step": 264931, "epoch": 1576} {"train_loss": -11.188207626342773, "global_step": 264932, "epoch": 1576} {"train_loss": -11.726613998413086, "global_step": 264933, "epoch": 1576} {"train_loss": -11.123086929321289, "global_step": 264934, "epoch": 1576} {"train_loss": -11.579410076141357, "global_step": 264935, "epoch": 1576, "val_loss": 272944.59375} {"train_loss": -11.275036811828613, "global_step": 264936, "epoch": 1577} {"train_loss": -10.790382385253906, "global_step": 264937, "epoch": 1577} {"train_loss": -11.330143928527832, "global_step": 264938, "epoch": 1577} {"train_loss": -10.572240829467773, "global_step": 264939, "epoch": 1577} {"train_loss": -10.838088989257812, "global_step": 264940, "epoch": 1577} {"train_loss": -10.97862434387207, "global_step": 264941, "epoch": 1577} {"train_loss": -11.429101943969727, "global_step": 264942, "epoch": 1577} {"train_loss": -10.790082931518555, "global_step": 264943, "epoch": 1577} {"train_loss": -11.050697326660156, "global_step": 264944, "epoch": 1577} {"train_loss": -11.03073501586914, "global_step": 264945, "epoch": 1577} {"train_loss": -10.440433502197266, "global_step": 264946, "epoch": 1577} {"train_loss": -11.497957229614258, "global_step": 264947, "epoch": 1577} {"train_loss": -10.60057258605957, "global_step": 264948, "epoch": 1577} {"train_loss": -11.136860847473145, "global_step": 264949, "epoch": 1577} {"train_loss": -11.27786922454834, "global_step": 264950, "epoch": 1577} {"train_loss": -11.157268524169922, "global_step": 264951, "epoch": 1577} {"train_loss": -11.604536056518555, "global_step": 264952, "epoch": 1577} {"train_loss": -10.431766510009766, "global_step": 264953, "epoch": 1577} {"train_loss": -11.80223274230957, "global_step": 264954, "epoch": 1577} {"train_loss": -11.092554092407227, "global_step": 264955, "epoch": 1577} {"train_loss": -11.527321815490723, "global_step": 264956, "epoch": 1577} {"train_loss": -11.245490074157715, "global_step": 264957, "epoch": 1577} {"train_loss": -11.32517147064209, "global_step": 264958, "epoch": 1577} {"train_loss": -10.910892486572266, "global_step": 264959, "epoch": 1577} {"train_loss": -11.650653839111328, "global_step": 264960, "epoch": 1577} {"train_loss": -10.600202560424805, "global_step": 264961, "epoch": 1577} {"train_loss": -11.782934188842773, "global_step": 264962, "epoch": 1577} {"train_loss": -11.146142959594727, "global_step": 264963, "epoch": 1577} {"train_loss": -11.73398208618164, "global_step": 264964, "epoch": 1577} {"train_loss": -11.436746597290039, "global_step": 264965, "epoch": 1577} {"train_loss": -11.563769340515137, "global_step": 264966, "epoch": 1577} {"train_loss": -11.691797256469727, "global_step": 264967, "epoch": 1577} {"train_loss": -11.85821533203125, "global_step": 264968, "epoch": 1577} {"train_loss": -11.263679504394531, "global_step": 264969, "epoch": 1577} {"train_loss": -11.604204177856445, "global_step": 264970, "epoch": 1577} {"train_loss": -11.539488792419434, "global_step": 264971, "epoch": 1577} {"train_loss": -11.571395874023438, "global_step": 264972, "epoch": 1577} {"train_loss": -11.378972053527832, "global_step": 264973, "epoch": 1577} {"train_loss": -11.671703338623047, "global_step": 264974, "epoch": 1577} {"train_loss": -11.467352867126465, "global_step": 264975, "epoch": 1577} {"train_loss": -11.420798301696777, "global_step": 264976, "epoch": 1577} {"train_loss": -11.924748420715332, "global_step": 264977, "epoch": 1577} {"train_loss": -11.481778144836426, "global_step": 264978, "epoch": 1577} {"train_loss": -11.740934371948242, "global_step": 264979, "epoch": 1577} {"train_loss": -11.770576477050781, "global_step": 264980, "epoch": 1577} {"train_loss": -11.898665428161621, "global_step": 264981, "epoch": 1577} {"train_loss": -11.835733413696289, "global_step": 264982, "epoch": 1577} {"train_loss": -11.769304275512695, "global_step": 264983, "epoch": 1577} {"train_loss": -11.898904800415039, "global_step": 264984, "epoch": 1577} {"train_loss": -11.947911262512207, "global_step": 264985, "epoch": 1577} {"train_loss": -11.885290145874023, "global_step": 264986, "epoch": 1577} {"train_loss": -12.04149055480957, "global_step": 264987, "epoch": 1577} {"train_loss": -12.035058975219727, "global_step": 264988, "epoch": 1577} {"train_loss": -12.01601791381836, "global_step": 264989, "epoch": 1577} {"train_loss": -11.681722640991211, "global_step": 264990, "epoch": 1577} {"train_loss": -11.902326583862305, "global_step": 264991, "epoch": 1577} {"train_loss": -11.945175170898438, "global_step": 264992, "epoch": 1577} {"train_loss": -11.777435302734375, "global_step": 264993, "epoch": 1577} {"train_loss": -12.109933853149414, "global_step": 264994, "epoch": 1577} {"train_loss": -11.859701156616211, "global_step": 264995, "epoch": 1577} {"train_loss": -12.160968780517578, "global_step": 264996, "epoch": 1577} {"train_loss": -11.892428398132324, "global_step": 264997, "epoch": 1577} {"train_loss": -12.056182861328125, "global_step": 264998, "epoch": 1577} {"train_loss": -12.285995483398438, "global_step": 264999, "epoch": 1577} {"train_loss": -12.176387786865234, "global_step": 265000, "epoch": 1577} {"train_loss": -11.992244720458984, "global_step": 265001, "epoch": 1577} {"train_loss": -11.972969055175781, "global_step": 265002, "epoch": 1577} {"train_loss": -11.989526748657227, "global_step": 265003, "epoch": 1577} {"train_loss": -11.7731351852417, "global_step": 265004, "epoch": 1577} {"train_loss": -11.868453979492188, "global_step": 265005, "epoch": 1577} {"train_loss": -11.918933868408203, "global_step": 265006, "epoch": 1577} {"train_loss": -12.27686882019043, "global_step": 265007, "epoch": 1577} {"train_loss": -12.00689697265625, "global_step": 265008, "epoch": 1577} {"train_loss": -12.075052261352539, "global_step": 265009, "epoch": 1577} {"train_loss": -12.072154998779297, "global_step": 265010, "epoch": 1577} {"train_loss": -12.202262878417969, "global_step": 265011, "epoch": 1577} {"train_loss": -11.911909103393555, "global_step": 265012, "epoch": 1577} {"train_loss": -11.991832733154297, "global_step": 265013, "epoch": 1577} {"train_loss": -12.079898834228516, "global_step": 265014, "epoch": 1577} {"train_loss": -12.094810485839844, "global_step": 265015, "epoch": 1577} {"train_loss": -11.980077743530273, "global_step": 265016, "epoch": 1577} {"train_loss": -12.320348739624023, "global_step": 265017, "epoch": 1577} {"train_loss": -12.146133422851562, "global_step": 265018, "epoch": 1577} {"train_loss": -12.251321792602539, "global_step": 265019, "epoch": 1577} {"train_loss": -12.245561599731445, "global_step": 265020, "epoch": 1577} {"train_loss": -12.308536529541016, "global_step": 265021, "epoch": 1577} {"train_loss": -12.160579681396484, "global_step": 265022, "epoch": 1577} {"train_loss": -12.206718444824219, "global_step": 265023, "epoch": 1577} {"train_loss": -12.26596450805664, "global_step": 265024, "epoch": 1577} {"train_loss": -11.950485229492188, "global_step": 265025, "epoch": 1577} {"train_loss": -12.136162757873535, "global_step": 265026, "epoch": 1577} {"train_loss": -12.195246696472168, "global_step": 265027, "epoch": 1577} {"train_loss": -12.358748435974121, "global_step": 265028, "epoch": 1577} {"train_loss": -12.248193740844727, "global_step": 265029, "epoch": 1577} {"train_loss": -12.139904022216797, "global_step": 265030, "epoch": 1577} {"train_loss": -12.234458923339844, "global_step": 265031, "epoch": 1577} {"train_loss": -12.262935638427734, "global_step": 265032, "epoch": 1577} {"train_loss": -12.103456497192383, "global_step": 265033, "epoch": 1577} {"train_loss": -12.351461410522461, "global_step": 265034, "epoch": 1577} {"train_loss": -11.943853378295898, "global_step": 265035, "epoch": 1577} {"train_loss": -12.17111587524414, "global_step": 265036, "epoch": 1577} {"train_loss": -12.370661735534668, "global_step": 265037, "epoch": 1577} {"train_loss": -12.16522216796875, "global_step": 265038, "epoch": 1577} {"train_loss": -12.146011352539062, "global_step": 265039, "epoch": 1577} {"train_loss": -12.166948318481445, "global_step": 265040, "epoch": 1577} {"train_loss": -11.190919876098633, "global_step": 265041, "epoch": 1577} {"train_loss": -11.860858917236328, "global_step": 265042, "epoch": 1577} {"train_loss": -12.259743690490723, "global_step": 265043, "epoch": 1577} {"train_loss": -12.071915626525879, "global_step": 265044, "epoch": 1577} {"train_loss": -11.886404037475586, "global_step": 265045, "epoch": 1577} {"train_loss": -11.805553436279297, "global_step": 265046, "epoch": 1577} {"train_loss": -11.81507396697998, "global_step": 265047, "epoch": 1577} {"train_loss": -12.088480949401855, "global_step": 265048, "epoch": 1577} {"train_loss": -11.796989440917969, "global_step": 265049, "epoch": 1577} {"train_loss": -11.893771171569824, "global_step": 265050, "epoch": 1577} {"train_loss": -11.754268646240234, "global_step": 265051, "epoch": 1577} {"train_loss": -12.056070327758789, "global_step": 265052, "epoch": 1577} {"train_loss": -11.56226921081543, "global_step": 265053, "epoch": 1577} {"train_loss": -11.891292572021484, "global_step": 265054, "epoch": 1577} {"train_loss": -11.617525100708008, "global_step": 265055, "epoch": 1577} {"train_loss": -11.740660667419434, "global_step": 265056, "epoch": 1577} {"train_loss": -12.001358032226562, "global_step": 265057, "epoch": 1577} {"train_loss": -11.636962890625, "global_step": 265058, "epoch": 1577} {"train_loss": -11.125505447387695, "global_step": 265059, "epoch": 1577} {"train_loss": -11.171576499938965, "global_step": 265060, "epoch": 1577} {"train_loss": -11.997695922851562, "global_step": 265061, "epoch": 1577} {"train_loss": -10.91849422454834, "global_step": 265062, "epoch": 1577} {"train_loss": -9.483652114868164, "global_step": 265063, "epoch": 1577} {"train_loss": -10.15202808380127, "global_step": 265064, "epoch": 1577} {"train_loss": -8.946882247924805, "global_step": 265065, "epoch": 1577} {"train_loss": -10.080972671508789, "global_step": 265066, "epoch": 1577} {"train_loss": -8.072369575500488, "global_step": 265067, "epoch": 1577} {"train_loss": -8.817939758300781, "global_step": 265068, "epoch": 1577} {"train_loss": -9.824880599975586, "global_step": 265069, "epoch": 1577} {"train_loss": -9.950212478637695, "global_step": 265070, "epoch": 1577} {"train_loss": -10.615645408630371, "global_step": 265071, "epoch": 1577} {"train_loss": -8.34599781036377, "global_step": 265072, "epoch": 1577} {"train_loss": -9.799540519714355, "global_step": 265073, "epoch": 1577} {"train_loss": -9.675983428955078, "global_step": 265074, "epoch": 1577} {"train_loss": -10.410158157348633, "global_step": 265075, "epoch": 1577} {"train_loss": -8.916897773742676, "global_step": 265076, "epoch": 1577} {"train_loss": -10.604894638061523, "global_step": 265077, "epoch": 1577} {"train_loss": -9.78886604309082, "global_step": 265078, "epoch": 1577} {"train_loss": -9.132421493530273, "global_step": 265079, "epoch": 1577} {"train_loss": -10.181419372558594, "global_step": 265080, "epoch": 1577} {"train_loss": -10.59891414642334, "global_step": 265081, "epoch": 1577} {"train_loss": -9.541107177734375, "global_step": 265082, "epoch": 1577} {"train_loss": -10.579933166503906, "global_step": 265083, "epoch": 1577} {"train_loss": -10.200813293457031, "global_step": 265084, "epoch": 1577} {"train_loss": -9.48907470703125, "global_step": 265085, "epoch": 1577} {"train_loss": -10.617975234985352, "global_step": 265086, "epoch": 1577} {"train_loss": -9.04631519317627, "global_step": 265087, "epoch": 1577} {"train_loss": -9.43757438659668, "global_step": 265088, "epoch": 1577} {"train_loss": -11.285299301147461, "global_step": 265089, "epoch": 1577} {"train_loss": -10.285839080810547, "global_step": 265090, "epoch": 1577} {"train_loss": -10.615560531616211, "global_step": 265091, "epoch": 1577} {"train_loss": -11.222042083740234, "global_step": 265092, "epoch": 1577} {"train_loss": -10.282200813293457, "global_step": 265093, "epoch": 1577} {"train_loss": -10.577945709228516, "global_step": 265094, "epoch": 1577} {"train_loss": -11.085302352905273, "global_step": 265095, "epoch": 1577} {"train_loss": -10.76626968383789, "global_step": 265096, "epoch": 1577} {"train_loss": -11.439675331115723, "global_step": 265097, "epoch": 1577} {"train_loss": -11.450050354003906, "global_step": 265098, "epoch": 1577} {"train_loss": -11.16176700592041, "global_step": 265099, "epoch": 1577} {"train_loss": -11.352779388427734, "global_step": 265100, "epoch": 1577} {"train_loss": -11.279586791992188, "global_step": 265101, "epoch": 1577} {"train_loss": -11.05489730834961, "global_step": 265102, "epoch": 1577} {"train_loss": -11.359601037842888, "global_step": 265103, "epoch": 1577, "val_loss": 260096.5625} {"train_loss": -11.211408615112305, "global_step": 265104, "epoch": 1578} {"train_loss": -11.33200454711914, "global_step": 265105, "epoch": 1578} {"train_loss": -11.414636611938477, "global_step": 265106, "epoch": 1578} {"train_loss": -11.312708854675293, "global_step": 265107, "epoch": 1578} {"train_loss": -11.278789520263672, "global_step": 265108, "epoch": 1578} {"train_loss": -11.604013442993164, "global_step": 265109, "epoch": 1578} {"train_loss": -11.649633407592773, "global_step": 265110, "epoch": 1578} {"train_loss": -11.565796852111816, "global_step": 265111, "epoch": 1578} {"train_loss": -11.545167922973633, "global_step": 265112, "epoch": 1578} {"train_loss": -11.486051559448242, "global_step": 265113, "epoch": 1578} {"train_loss": -11.575007438659668, "global_step": 265114, "epoch": 1578} {"train_loss": -11.518458366394043, "global_step": 265115, "epoch": 1578} {"train_loss": -11.67689323425293, "global_step": 265116, "epoch": 1578} {"train_loss": -11.722060203552246, "global_step": 265117, "epoch": 1578} {"train_loss": -11.54349136352539, "global_step": 265118, "epoch": 1578} {"train_loss": -11.731971740722656, "global_step": 265119, "epoch": 1578} {"train_loss": -11.790281295776367, "global_step": 265120, "epoch": 1578} {"train_loss": -11.661852836608887, "global_step": 265121, "epoch": 1578} {"train_loss": -11.590963363647461, "global_step": 265122, "epoch": 1578} {"train_loss": -11.735486030578613, "global_step": 265123, "epoch": 1578} {"train_loss": -11.901387214660645, "global_step": 265124, "epoch": 1578} {"train_loss": -11.803553581237793, "global_step": 265125, "epoch": 1578} {"train_loss": -11.760836601257324, "global_step": 265126, "epoch": 1578} {"train_loss": -11.900382995605469, "global_step": 265127, "epoch": 1578} {"train_loss": -11.669380187988281, "global_step": 265128, "epoch": 1578} {"train_loss": -11.973712921142578, "global_step": 265129, "epoch": 1578} {"train_loss": -11.707112312316895, "global_step": 265130, "epoch": 1578} {"train_loss": -11.82042121887207, "global_step": 265131, "epoch": 1578} {"train_loss": -11.843189239501953, "global_step": 265132, "epoch": 1578} {"train_loss": -11.976998329162598, "global_step": 265133, "epoch": 1578} {"train_loss": -11.848196029663086, "global_step": 265134, "epoch": 1578} {"train_loss": -11.889558792114258, "global_step": 265135, "epoch": 1578} {"train_loss": -11.957436561584473, "global_step": 265136, "epoch": 1578} {"train_loss": -11.964308738708496, "global_step": 265137, "epoch": 1578} {"train_loss": -11.907052993774414, "global_step": 265138, "epoch": 1578} {"train_loss": -11.884064674377441, "global_step": 265139, "epoch": 1578} {"train_loss": -12.134740829467773, "global_step": 265140, "epoch": 1578} {"train_loss": -11.94672966003418, "global_step": 265141, "epoch": 1578} {"train_loss": -12.143424987792969, "global_step": 265142, "epoch": 1578} {"train_loss": -12.138071060180664, "global_step": 265143, "epoch": 1578} {"train_loss": -12.08208179473877, "global_step": 265144, "epoch": 1578} {"train_loss": -12.158233642578125, "global_step": 265145, "epoch": 1578} {"train_loss": -12.032672882080078, "global_step": 265146, "epoch": 1578} {"train_loss": -12.210472106933594, "global_step": 265147, "epoch": 1578} {"train_loss": -11.953340530395508, "global_step": 265148, "epoch": 1578} {"train_loss": -11.927499771118164, "global_step": 265149, "epoch": 1578} {"train_loss": -12.128213882446289, "global_step": 265150, "epoch": 1578} {"train_loss": -12.18813419342041, "global_step": 265151, "epoch": 1578} {"train_loss": -12.00227165222168, "global_step": 265152, "epoch": 1578} {"train_loss": -11.865367889404297, "global_step": 265153, "epoch": 1578} {"train_loss": -12.169965744018555, "global_step": 265154, "epoch": 1578} {"train_loss": -11.90184211730957, "global_step": 265155, "epoch": 1578} {"train_loss": -12.160857200622559, "global_step": 265156, "epoch": 1578} {"train_loss": -12.194211959838867, "global_step": 265157, "epoch": 1578} {"train_loss": -12.182276725769043, "global_step": 265158, "epoch": 1578} {"train_loss": -12.33098316192627, "global_step": 265159, "epoch": 1578} {"train_loss": -12.207510948181152, "global_step": 265160, "epoch": 1578} {"train_loss": -12.27633285522461, "global_step": 265161, "epoch": 1578} {"train_loss": -12.212732315063477, "global_step": 265162, "epoch": 1578} {"train_loss": -12.277753829956055, "global_step": 265163, "epoch": 1578} {"train_loss": -12.42342758178711, "global_step": 265164, "epoch": 1578} {"train_loss": -12.301429748535156, "global_step": 265165, "epoch": 1578} {"train_loss": -12.225469589233398, "global_step": 265166, "epoch": 1578} {"train_loss": -12.330108642578125, "global_step": 265167, "epoch": 1578} {"train_loss": -12.19906234741211, "global_step": 265168, "epoch": 1578} {"train_loss": -12.199234008789062, "global_step": 265169, "epoch": 1578} {"train_loss": -12.135761260986328, "global_step": 265170, "epoch": 1578} {"train_loss": -11.942115783691406, "global_step": 265171, "epoch": 1578} {"train_loss": -11.857695579528809, "global_step": 265172, "epoch": 1578} {"train_loss": -11.930198669433594, "global_step": 265173, "epoch": 1578} {"train_loss": -12.255534172058105, "global_step": 265174, "epoch": 1578} {"train_loss": -12.010599136352539, "global_step": 265175, "epoch": 1578} {"train_loss": -11.87308406829834, "global_step": 265176, "epoch": 1578} {"train_loss": -12.136174201965332, "global_step": 265177, "epoch": 1578} {"train_loss": -12.467991828918457, "global_step": 265178, "epoch": 1578} {"train_loss": -12.227132797241211, "global_step": 265179, "epoch": 1578} {"train_loss": -11.922818183898926, "global_step": 265180, "epoch": 1578} {"train_loss": -12.014183044433594, "global_step": 265181, "epoch": 1578} {"train_loss": -12.1906156539917, "global_step": 265182, "epoch": 1578} {"train_loss": -12.08961296081543, "global_step": 265183, "epoch": 1578} {"train_loss": -12.20086669921875, "global_step": 265184, "epoch": 1578} {"train_loss": -12.337291717529297, "global_step": 265185, "epoch": 1578} {"train_loss": -12.387088775634766, "global_step": 265186, "epoch": 1578} {"train_loss": -12.399085998535156, "global_step": 265187, "epoch": 1578} {"train_loss": -12.2200927734375, "global_step": 265188, "epoch": 1578} {"train_loss": -12.468315124511719, "global_step": 265189, "epoch": 1578} {"train_loss": -11.926526069641113, "global_step": 265190, "epoch": 1578} {"train_loss": -12.05477237701416, "global_step": 265191, "epoch": 1578} {"train_loss": -12.098533630371094, "global_step": 265192, "epoch": 1578} {"train_loss": -11.835530281066895, "global_step": 265193, "epoch": 1578} {"train_loss": -11.663211822509766, "global_step": 265194, "epoch": 1578} {"train_loss": -11.794477462768555, "global_step": 265195, "epoch": 1578} {"train_loss": -11.333844184875488, "global_step": 265196, "epoch": 1578} {"train_loss": -9.94846248626709, "global_step": 265197, "epoch": 1578} {"train_loss": -9.382813453674316, "global_step": 265198, "epoch": 1578} {"train_loss": -10.2275390625, "global_step": 265199, "epoch": 1578} {"train_loss": -8.653246879577637, "global_step": 265200, "epoch": 1578} {"train_loss": -9.244355201721191, "global_step": 265201, "epoch": 1578} {"train_loss": -9.954822540283203, "global_step": 265202, "epoch": 1578} {"train_loss": -9.500494003295898, "global_step": 265203, "epoch": 1578} {"train_loss": -7.510658264160156, "global_step": 265204, "epoch": 1578} {"train_loss": -8.826709747314453, "global_step": 265205, "epoch": 1578} {"train_loss": -9.115631103515625, "global_step": 265206, "epoch": 1578} {"train_loss": -10.358170509338379, "global_step": 265207, "epoch": 1578} {"train_loss": -8.604850769042969, "global_step": 265208, "epoch": 1578} {"train_loss": -7.723891258239746, "global_step": 265209, "epoch": 1578} {"train_loss": -8.117887496948242, "global_step": 265210, "epoch": 1578} {"train_loss": -10.08906364440918, "global_step": 265211, "epoch": 1578} {"train_loss": -10.711959838867188, "global_step": 265212, "epoch": 1578} {"train_loss": -10.024410247802734, "global_step": 265213, "epoch": 1578} {"train_loss": -10.377144813537598, "global_step": 265214, "epoch": 1578} {"train_loss": -11.318138122558594, "global_step": 265215, "epoch": 1578} {"train_loss": -10.633544921875, "global_step": 265216, "epoch": 1578} {"train_loss": -10.301149368286133, "global_step": 265217, "epoch": 1578} {"train_loss": -11.159810066223145, "global_step": 265218, "epoch": 1578} {"train_loss": -11.267480850219727, "global_step": 265219, "epoch": 1578} {"train_loss": -11.026790618896484, "global_step": 265220, "epoch": 1578} {"train_loss": -11.113715171813965, "global_step": 265221, "epoch": 1578} {"train_loss": -11.10486888885498, "global_step": 265222, "epoch": 1578} {"train_loss": -11.242439270019531, "global_step": 265223, "epoch": 1578} {"train_loss": -10.703739166259766, "global_step": 265224, "epoch": 1578} {"train_loss": -11.052984237670898, "global_step": 265225, "epoch": 1578} {"train_loss": -11.238645553588867, "global_step": 265226, "epoch": 1578} {"train_loss": -11.728170394897461, "global_step": 265227, "epoch": 1578} {"train_loss": -11.189607620239258, "global_step": 265228, "epoch": 1578} {"train_loss": -11.191629409790039, "global_step": 265229, "epoch": 1578} {"train_loss": -11.219268798828125, "global_step": 265230, "epoch": 1578} {"train_loss": -11.60538101196289, "global_step": 265231, "epoch": 1578} {"train_loss": -11.140419006347656, "global_step": 265232, "epoch": 1578} {"train_loss": -11.415522575378418, "global_step": 265233, "epoch": 1578} {"train_loss": -11.16297721862793, "global_step": 265234, "epoch": 1578} {"train_loss": -11.400360107421875, "global_step": 265235, "epoch": 1578} {"train_loss": -10.935234069824219, "global_step": 265236, "epoch": 1578} {"train_loss": -11.349318504333496, "global_step": 265237, "epoch": 1578} {"train_loss": -11.277624130249023, "global_step": 265238, "epoch": 1578} {"train_loss": -11.1077241897583, "global_step": 265239, "epoch": 1578} {"train_loss": -11.282354354858398, "global_step": 265240, "epoch": 1578} {"train_loss": -11.278451919555664, "global_step": 265241, "epoch": 1578} {"train_loss": -11.379975318908691, "global_step": 265242, "epoch": 1578} {"train_loss": -11.667957305908203, "global_step": 265243, "epoch": 1578} {"train_loss": -11.141140937805176, "global_step": 265244, "epoch": 1578} {"train_loss": -11.939071655273438, "global_step": 265245, "epoch": 1578} {"train_loss": -11.465076446533203, "global_step": 265246, "epoch": 1578} {"train_loss": -11.661720275878906, "global_step": 265247, "epoch": 1578} {"train_loss": -11.535017013549805, "global_step": 265248, "epoch": 1578} {"train_loss": -11.561325073242188, "global_step": 265249, "epoch": 1578} {"train_loss": -11.469000816345215, "global_step": 265250, "epoch": 1578} {"train_loss": -11.386089324951172, "global_step": 265251, "epoch": 1578} {"train_loss": -11.83105182647705, "global_step": 265252, "epoch": 1578} {"train_loss": -11.446011543273926, "global_step": 265253, "epoch": 1578} {"train_loss": -11.75111198425293, "global_step": 265254, "epoch": 1578} {"train_loss": -11.928577423095703, "global_step": 265255, "epoch": 1578} {"train_loss": -11.795631408691406, "global_step": 265256, "epoch": 1578} {"train_loss": -11.613935470581055, "global_step": 265257, "epoch": 1578} {"train_loss": -11.759780883789062, "global_step": 265258, "epoch": 1578} {"train_loss": -11.728221893310547, "global_step": 265259, "epoch": 1578} {"train_loss": -11.844914436340332, "global_step": 265260, "epoch": 1578} {"train_loss": -11.854227066040039, "global_step": 265261, "epoch": 1578} {"train_loss": -11.984513282775879, "global_step": 265262, "epoch": 1578} {"train_loss": -11.777584075927734, "global_step": 265263, "epoch": 1578} {"train_loss": -11.820587158203125, "global_step": 265264, "epoch": 1578} {"train_loss": -11.887331008911133, "global_step": 265265, "epoch": 1578} {"train_loss": -11.961228370666504, "global_step": 265266, "epoch": 1578} {"train_loss": -12.083584785461426, "global_step": 265267, "epoch": 1578} {"train_loss": -11.917299270629883, "global_step": 265268, "epoch": 1578} {"train_loss": -11.865612983703613, "global_step": 265269, "epoch": 1578} {"train_loss": -11.788411140441895, "global_step": 265270, "epoch": 1578} {"train_loss": -11.505024569375175, "global_step": 265271, "epoch": 1578, "val_loss": 267739.0625} {"train_loss": -11.953594207763672, "global_step": 265272, "epoch": 1579} {"train_loss": -12.121565818786621, "global_step": 265273, "epoch": 1579} {"train_loss": -12.010376930236816, "global_step": 265274, "epoch": 1579} {"train_loss": -12.258588790893555, "global_step": 265275, "epoch": 1579} {"train_loss": -12.157658576965332, "global_step": 265276, "epoch": 1579} {"train_loss": -11.979772567749023, "global_step": 265277, "epoch": 1579} {"train_loss": -12.2991361618042, "global_step": 265278, "epoch": 1579} {"train_loss": -11.900593757629395, "global_step": 265279, "epoch": 1579} {"train_loss": -12.001986503601074, "global_step": 265280, "epoch": 1579} {"train_loss": -12.09241771697998, "global_step": 265281, "epoch": 1579} {"train_loss": -11.960630416870117, "global_step": 265282, "epoch": 1579} {"train_loss": -12.167966842651367, "global_step": 265283, "epoch": 1579} {"train_loss": -12.092533111572266, "global_step": 265284, "epoch": 1579} {"train_loss": -11.939600944519043, "global_step": 265285, "epoch": 1579} {"train_loss": -12.041975975036621, "global_step": 265286, "epoch": 1579} {"train_loss": -12.046598434448242, "global_step": 265287, "epoch": 1579} {"train_loss": -12.17347526550293, "global_step": 265288, "epoch": 1579} {"train_loss": -11.998578071594238, "global_step": 265289, "epoch": 1579} {"train_loss": -12.251716613769531, "global_step": 265290, "epoch": 1579} {"train_loss": -11.99250316619873, "global_step": 265291, "epoch": 1579} {"train_loss": -11.941884994506836, "global_step": 265292, "epoch": 1579} {"train_loss": -12.025989532470703, "global_step": 265293, "epoch": 1579} {"train_loss": -12.096490859985352, "global_step": 265294, "epoch": 1579} {"train_loss": -11.723058700561523, "global_step": 265295, "epoch": 1579} {"train_loss": -12.12646484375, "global_step": 265296, "epoch": 1579} {"train_loss": -12.066732406616211, "global_step": 265297, "epoch": 1579} {"train_loss": -11.78380298614502, "global_step": 265298, "epoch": 1579} {"train_loss": -12.23703384399414, "global_step": 265299, "epoch": 1579} {"train_loss": -11.994853973388672, "global_step": 265300, "epoch": 1579} {"train_loss": -12.166720390319824, "global_step": 265301, "epoch": 1579} {"train_loss": -12.20799732208252, "global_step": 265302, "epoch": 1579} {"train_loss": -12.11979866027832, "global_step": 265303, "epoch": 1579} {"train_loss": -12.258106231689453, "global_step": 265304, "epoch": 1579} {"train_loss": -12.327818870544434, "global_step": 265305, "epoch": 1579} {"train_loss": -12.042387008666992, "global_step": 265306, "epoch": 1579} {"train_loss": -11.915498733520508, "global_step": 265307, "epoch": 1579} {"train_loss": -12.169574737548828, "global_step": 265308, "epoch": 1579} {"train_loss": -11.788177490234375, "global_step": 265309, "epoch": 1579} {"train_loss": -12.024744033813477, "global_step": 265310, "epoch": 1579} {"train_loss": -12.255687713623047, "global_step": 265311, "epoch": 1579} {"train_loss": -11.97242259979248, "global_step": 265312, "epoch": 1579} {"train_loss": -11.521263122558594, "global_step": 265313, "epoch": 1579} {"train_loss": -11.532873153686523, "global_step": 265314, "epoch": 1579} {"train_loss": -12.408252716064453, "global_step": 265315, "epoch": 1579} {"train_loss": -11.528768539428711, "global_step": 265316, "epoch": 1579} {"train_loss": -11.486370086669922, "global_step": 265317, "epoch": 1579} {"train_loss": -11.901732444763184, "global_step": 265318, "epoch": 1579} {"train_loss": -11.290139198303223, "global_step": 265319, "epoch": 1579} {"train_loss": -11.886545181274414, "global_step": 265320, "epoch": 1579} {"train_loss": -11.761463165283203, "global_step": 265321, "epoch": 1579} {"train_loss": -12.114331245422363, "global_step": 265322, "epoch": 1579} {"train_loss": -11.88845157623291, "global_step": 265323, "epoch": 1579} {"train_loss": -11.735355377197266, "global_step": 265324, "epoch": 1579} {"train_loss": -11.514347076416016, "global_step": 265325, "epoch": 1579} {"train_loss": -12.204668045043945, "global_step": 265326, "epoch": 1579} {"train_loss": -11.956661224365234, "global_step": 265327, "epoch": 1579} {"train_loss": -11.792551040649414, "global_step": 265328, "epoch": 1579} {"train_loss": -11.92689323425293, "global_step": 265329, "epoch": 1579} {"train_loss": -12.157992362976074, "global_step": 265330, "epoch": 1579} {"train_loss": -11.84364128112793, "global_step": 265331, "epoch": 1579} {"train_loss": -12.136030197143555, "global_step": 265332, "epoch": 1579} {"train_loss": -12.106287002563477, "global_step": 265333, "epoch": 1579} {"train_loss": -11.469761848449707, "global_step": 265334, "epoch": 1579} {"train_loss": -11.364219665527344, "global_step": 265335, "epoch": 1579} {"train_loss": -12.265718460083008, "global_step": 265336, "epoch": 1579} {"train_loss": -11.668828964233398, "global_step": 265337, "epoch": 1579} {"train_loss": -11.550178527832031, "global_step": 265338, "epoch": 1579} {"train_loss": -12.096151351928711, "global_step": 265339, "epoch": 1579} {"train_loss": -11.89739990234375, "global_step": 265340, "epoch": 1579} {"train_loss": -11.398710250854492, "global_step": 265341, "epoch": 1579} {"train_loss": -11.632994651794434, "global_step": 265342, "epoch": 1579} {"train_loss": -11.45898723602295, "global_step": 265343, "epoch": 1579} {"train_loss": -10.959264755249023, "global_step": 265344, "epoch": 1579} {"train_loss": -11.373674392700195, "global_step": 265345, "epoch": 1579} {"train_loss": -11.38858413696289, "global_step": 265346, "epoch": 1579} {"train_loss": -11.599651336669922, "global_step": 265347, "epoch": 1579} {"train_loss": -11.162362098693848, "global_step": 265348, "epoch": 1579} {"train_loss": -11.197751998901367, "global_step": 265349, "epoch": 1579} {"train_loss": -10.715251922607422, "global_step": 265350, "epoch": 1579} {"train_loss": -9.975176811218262, "global_step": 265351, "epoch": 1579} {"train_loss": -10.079793930053711, "global_step": 265352, "epoch": 1579} {"train_loss": -11.514579772949219, "global_step": 265353, "epoch": 1579} {"train_loss": -9.969189643859863, "global_step": 265354, "epoch": 1579} {"train_loss": -11.085981369018555, "global_step": 265355, "epoch": 1579} {"train_loss": -9.782602310180664, "global_step": 265356, "epoch": 1579} {"train_loss": -10.55950927734375, "global_step": 265357, "epoch": 1579} {"train_loss": -9.331981658935547, "global_step": 265358, "epoch": 1579} {"train_loss": -10.72189712524414, "global_step": 265359, "epoch": 1579} {"train_loss": -8.215646743774414, "global_step": 265360, "epoch": 1579} {"train_loss": -10.358976364135742, "global_step": 265361, "epoch": 1579} {"train_loss": -9.32983684539795, "global_step": 265362, "epoch": 1579} {"train_loss": -9.447433471679688, "global_step": 265363, "epoch": 1579} {"train_loss": -6.982320785522461, "global_step": 265364, "epoch": 1579} {"train_loss": -9.016332626342773, "global_step": 265365, "epoch": 1579} {"train_loss": -9.30315113067627, "global_step": 265366, "epoch": 1579} {"train_loss": -8.376392364501953, "global_step": 265367, "epoch": 1579} {"train_loss": -10.204534530639648, "global_step": 265368, "epoch": 1579} {"train_loss": -8.547685623168945, "global_step": 265369, "epoch": 1579} {"train_loss": -10.69401741027832, "global_step": 265370, "epoch": 1579} {"train_loss": -10.184955596923828, "global_step": 265371, "epoch": 1579} {"train_loss": -10.548140525817871, "global_step": 265372, "epoch": 1579} {"train_loss": -10.67366886138916, "global_step": 265373, "epoch": 1579} {"train_loss": -10.094823837280273, "global_step": 265374, "epoch": 1579} {"train_loss": -10.636276245117188, "global_step": 265375, "epoch": 1579} {"train_loss": -10.337187767028809, "global_step": 265376, "epoch": 1579} {"train_loss": -11.210190773010254, "global_step": 265377, "epoch": 1579} {"train_loss": -10.857767105102539, "global_step": 265378, "epoch": 1579} {"train_loss": -11.42854118347168, "global_step": 265379, "epoch": 1579} {"train_loss": -11.372086524963379, "global_step": 265380, "epoch": 1579} {"train_loss": -11.353321075439453, "global_step": 265381, "epoch": 1579} {"train_loss": -11.624124526977539, "global_step": 265382, "epoch": 1579} {"train_loss": -11.249951362609863, "global_step": 265383, "epoch": 1579} {"train_loss": -11.40103530883789, "global_step": 265384, "epoch": 1579} {"train_loss": -10.829713821411133, "global_step": 265385, "epoch": 1579} {"train_loss": -11.355447769165039, "global_step": 265386, "epoch": 1579} {"train_loss": -11.328254699707031, "global_step": 265387, "epoch": 1579} {"train_loss": -11.493133544921875, "global_step": 265388, "epoch": 1579} {"train_loss": -11.448482513427734, "global_step": 265389, "epoch": 1579} {"train_loss": -11.321762084960938, "global_step": 265390, "epoch": 1579} {"train_loss": -11.299936294555664, "global_step": 265391, "epoch": 1579} {"train_loss": -11.451828002929688, "global_step": 265392, "epoch": 1579} {"train_loss": -11.388102531433105, "global_step": 265393, "epoch": 1579} {"train_loss": -11.460012435913086, "global_step": 265394, "epoch": 1579} {"train_loss": -11.532865524291992, "global_step": 265395, "epoch": 1579} {"train_loss": -11.297222137451172, "global_step": 265396, "epoch": 1579} {"train_loss": -11.750240325927734, "global_step": 265397, "epoch": 1579} {"train_loss": -11.14005184173584, "global_step": 265398, "epoch": 1579} {"train_loss": -11.50629997253418, "global_step": 265399, "epoch": 1579} {"train_loss": -11.704675674438477, "global_step": 265400, "epoch": 1579} {"train_loss": -11.709875106811523, "global_step": 265401, "epoch": 1579} {"train_loss": -11.8560791015625, "global_step": 265402, "epoch": 1579} {"train_loss": -11.666274070739746, "global_step": 265403, "epoch": 1579} {"train_loss": -11.954463005065918, "global_step": 265404, "epoch": 1579} {"train_loss": -11.912619590759277, "global_step": 265405, "epoch": 1579} {"train_loss": -11.680213928222656, "global_step": 265406, "epoch": 1579} {"train_loss": -11.727482795715332, "global_step": 265407, "epoch": 1579} {"train_loss": -11.86894702911377, "global_step": 265408, "epoch": 1579} {"train_loss": -11.783939361572266, "global_step": 265409, "epoch": 1579} {"train_loss": -11.82533073425293, "global_step": 265410, "epoch": 1579} {"train_loss": -11.911730766296387, "global_step": 265411, "epoch": 1579} {"train_loss": -11.483116149902344, "global_step": 265412, "epoch": 1579} {"train_loss": -11.788614273071289, "global_step": 265413, "epoch": 1579} {"train_loss": -11.80620288848877, "global_step": 265414, "epoch": 1579} {"train_loss": -11.883363723754883, "global_step": 265415, "epoch": 1579} {"train_loss": -12.0104398727417, "global_step": 265416, "epoch": 1579} {"train_loss": -11.724288940429688, "global_step": 265417, "epoch": 1579} {"train_loss": -11.9108247756958, "global_step": 265418, "epoch": 1579} {"train_loss": -11.797066688537598, "global_step": 265419, "epoch": 1579} {"train_loss": -11.946810722351074, "global_step": 265420, "epoch": 1579} {"train_loss": -11.741286277770996, "global_step": 265421, "epoch": 1579} {"train_loss": -11.89168930053711, "global_step": 265422, "epoch": 1579} {"train_loss": -11.879783630371094, "global_step": 265423, "epoch": 1579} {"train_loss": -12.05263900756836, "global_step": 265424, "epoch": 1579} {"train_loss": -11.891031265258789, "global_step": 265425, "epoch": 1579} {"train_loss": -12.105457305908203, "global_step": 265426, "epoch": 1579} {"train_loss": -12.061384201049805, "global_step": 265427, "epoch": 1579} {"train_loss": -12.154522895812988, "global_step": 265428, "epoch": 1579} {"train_loss": -12.094305038452148, "global_step": 265429, "epoch": 1579} {"train_loss": -12.218429565429688, "global_step": 265430, "epoch": 1579} {"train_loss": -12.15060806274414, "global_step": 265431, "epoch": 1579} {"train_loss": -12.106710433959961, "global_step": 265432, "epoch": 1579} {"train_loss": -12.03935718536377, "global_step": 265433, "epoch": 1579} {"train_loss": -12.143669128417969, "global_step": 265434, "epoch": 1579} {"train_loss": -12.095309257507324, "global_step": 265435, "epoch": 1579} {"train_loss": -12.32002067565918, "global_step": 265436, "epoch": 1579} {"train_loss": -12.112329483032227, "global_step": 265437, "epoch": 1579} {"train_loss": -12.244632720947266, "global_step": 265438, "epoch": 1579} {"train_loss": -11.50654913697924, "global_step": 265439, "epoch": 1579, "val_loss": 271695.53125} {"train_loss": -12.194999694824219, "global_step": 265440, "epoch": 1580} {"train_loss": -12.208420753479004, "global_step": 265441, "epoch": 1580} {"train_loss": -12.204898834228516, "global_step": 265442, "epoch": 1580} {"train_loss": -12.03481674194336, "global_step": 265443, "epoch": 1580} {"train_loss": -12.262762069702148, "global_step": 265444, "epoch": 1580} {"train_loss": -12.203483581542969, "global_step": 265445, "epoch": 1580} {"train_loss": -12.26883316040039, "global_step": 265446, "epoch": 1580} {"train_loss": -12.275296211242676, "global_step": 265447, "epoch": 1580} {"train_loss": -12.090494155883789, "global_step": 265448, "epoch": 1580} {"train_loss": -12.359248161315918, "global_step": 265449, "epoch": 1580} {"train_loss": -12.238306045532227, "global_step": 265450, "epoch": 1580} {"train_loss": -12.252555847167969, "global_step": 265451, "epoch": 1580} {"train_loss": -12.347583770751953, "global_step": 265452, "epoch": 1580} {"train_loss": -12.328777313232422, "global_step": 265453, "epoch": 1580} {"train_loss": -12.376770973205566, "global_step": 265454, "epoch": 1580} {"train_loss": -12.354642868041992, "global_step": 265455, "epoch": 1580} {"train_loss": -12.275605201721191, "global_step": 265456, "epoch": 1580} {"train_loss": -12.012862205505371, "global_step": 265457, "epoch": 1580} {"train_loss": -12.211871147155762, "global_step": 265458, "epoch": 1580} {"train_loss": -12.286457061767578, "global_step": 265459, "epoch": 1580} {"train_loss": -12.176753997802734, "global_step": 265460, "epoch": 1580} {"train_loss": -11.963143348693848, "global_step": 265461, "epoch": 1580} {"train_loss": -11.631649017333984, "global_step": 265462, "epoch": 1580} {"train_loss": -11.773313522338867, "global_step": 265463, "epoch": 1580} {"train_loss": -12.147966384887695, "global_step": 265464, "epoch": 1580} {"train_loss": -11.98649787902832, "global_step": 265465, "epoch": 1580} {"train_loss": -11.86638355255127, "global_step": 265466, "epoch": 1580} {"train_loss": -11.42570686340332, "global_step": 265467, "epoch": 1580} {"train_loss": -11.95473861694336, "global_step": 265468, "epoch": 1580} {"train_loss": -11.978446006774902, "global_step": 265469, "epoch": 1580} {"train_loss": -11.341772079467773, "global_step": 265470, "epoch": 1580} {"train_loss": -12.223036766052246, "global_step": 265471, "epoch": 1580} {"train_loss": -10.49039077758789, "global_step": 265472, "epoch": 1580} {"train_loss": -10.784400939941406, "global_step": 265473, "epoch": 1580} {"train_loss": -11.497634887695312, "global_step": 265474, "epoch": 1580} {"train_loss": -11.22607421875, "global_step": 265475, "epoch": 1580} {"train_loss": -11.472677230834961, "global_step": 265476, "epoch": 1580} {"train_loss": -11.091157913208008, "global_step": 265477, "epoch": 1580} {"train_loss": -11.23945426940918, "global_step": 265478, "epoch": 1580} {"train_loss": -11.949026107788086, "global_step": 265479, "epoch": 1580} {"train_loss": -11.116209030151367, "global_step": 265480, "epoch": 1580} {"train_loss": -11.432705879211426, "global_step": 265481, "epoch": 1580} {"train_loss": -11.863302230834961, "global_step": 265482, "epoch": 1580} {"train_loss": -11.06330680847168, "global_step": 265483, "epoch": 1580} {"train_loss": -12.104364395141602, "global_step": 265484, "epoch": 1580} {"train_loss": -11.435943603515625, "global_step": 265485, "epoch": 1580} {"train_loss": -11.558464050292969, "global_step": 265486, "epoch": 1580} {"train_loss": -11.716304779052734, "global_step": 265487, "epoch": 1580} {"train_loss": -11.359504699707031, "global_step": 265488, "epoch": 1580} {"train_loss": -11.48120403289795, "global_step": 265489, "epoch": 1580} {"train_loss": -11.852642059326172, "global_step": 265490, "epoch": 1580} {"train_loss": -10.876777648925781, "global_step": 265491, "epoch": 1580} {"train_loss": -11.68064022064209, "global_step": 265492, "epoch": 1580} {"train_loss": -11.408294677734375, "global_step": 265493, "epoch": 1580} {"train_loss": -12.227540969848633, "global_step": 265494, "epoch": 1580} {"train_loss": -11.126928329467773, "global_step": 265495, "epoch": 1580} {"train_loss": -11.491819381713867, "global_step": 265496, "epoch": 1580} {"train_loss": -11.452583312988281, "global_step": 265497, "epoch": 1580} {"train_loss": -10.61543083190918, "global_step": 265498, "epoch": 1580} {"train_loss": -11.30197811126709, "global_step": 265499, "epoch": 1580} {"train_loss": -10.248035430908203, "global_step": 265500, "epoch": 1580} {"train_loss": -10.626504898071289, "global_step": 265501, "epoch": 1580} {"train_loss": -11.347954750061035, "global_step": 265502, "epoch": 1580} {"train_loss": -11.060871124267578, "global_step": 265503, "epoch": 1580} {"train_loss": -11.098569869995117, "global_step": 265504, "epoch": 1580} {"train_loss": -10.95364761352539, "global_step": 265505, "epoch": 1580} {"train_loss": -10.836263656616211, "global_step": 265506, "epoch": 1580} {"train_loss": -11.021571159362793, "global_step": 265507, "epoch": 1580} {"train_loss": -11.144433975219727, "global_step": 265508, "epoch": 1580} {"train_loss": -11.18613052368164, "global_step": 265509, "epoch": 1580} {"train_loss": -11.002988815307617, "global_step": 265510, "epoch": 1580} {"train_loss": -11.648492813110352, "global_step": 265511, "epoch": 1580} {"train_loss": -11.293436050415039, "global_step": 265512, "epoch": 1580} {"train_loss": -10.821043014526367, "global_step": 265513, "epoch": 1580} {"train_loss": -11.50711727142334, "global_step": 265514, "epoch": 1580} {"train_loss": -10.883134841918945, "global_step": 265515, "epoch": 1580} {"train_loss": -11.389575958251953, "global_step": 265516, "epoch": 1580} {"train_loss": -11.489593505859375, "global_step": 265517, "epoch": 1580} {"train_loss": -11.11994743347168, "global_step": 265518, "epoch": 1580} {"train_loss": -11.449972152709961, "global_step": 265519, "epoch": 1580} {"train_loss": -11.161813735961914, "global_step": 265520, "epoch": 1580} {"train_loss": -11.566116333007812, "global_step": 265521, "epoch": 1580} {"train_loss": -11.750490188598633, "global_step": 265522, "epoch": 1580} {"train_loss": -11.594030380249023, "global_step": 265523, "epoch": 1580} {"train_loss": -11.41462230682373, "global_step": 265524, "epoch": 1580} {"train_loss": -11.62704849243164, "global_step": 265525, "epoch": 1580} {"train_loss": -11.519109725952148, "global_step": 265526, "epoch": 1580} {"train_loss": -11.76311206817627, "global_step": 265527, "epoch": 1580} {"train_loss": -11.525650024414062, "global_step": 265528, "epoch": 1580} {"train_loss": -11.356311798095703, "global_step": 265529, "epoch": 1580} {"train_loss": -11.540450096130371, "global_step": 265530, "epoch": 1580} {"train_loss": -11.546026229858398, "global_step": 265531, "epoch": 1580} {"train_loss": -11.581287384033203, "global_step": 265532, "epoch": 1580} {"train_loss": -11.200730323791504, "global_step": 265533, "epoch": 1580} {"train_loss": -11.699944496154785, "global_step": 265534, "epoch": 1580} {"train_loss": -11.516298294067383, "global_step": 265535, "epoch": 1580} {"train_loss": -11.860513687133789, "global_step": 265536, "epoch": 1580} {"train_loss": -11.309072494506836, "global_step": 265537, "epoch": 1580} {"train_loss": -11.916431427001953, "global_step": 265538, "epoch": 1580} {"train_loss": -11.546963691711426, "global_step": 265539, "epoch": 1580} {"train_loss": -11.771987915039062, "global_step": 265540, "epoch": 1580} {"train_loss": -11.841976165771484, "global_step": 265541, "epoch": 1580} {"train_loss": -11.847167015075684, "global_step": 265542, "epoch": 1580} {"train_loss": -11.99909782409668, "global_step": 265543, "epoch": 1580} {"train_loss": -11.691577911376953, "global_step": 265544, "epoch": 1580} {"train_loss": -11.86253547668457, "global_step": 265545, "epoch": 1580} {"train_loss": -11.626532554626465, "global_step": 265546, "epoch": 1580} {"train_loss": -11.668598175048828, "global_step": 265547, "epoch": 1580} {"train_loss": -11.762344360351562, "global_step": 265548, "epoch": 1580} {"train_loss": -11.972576141357422, "global_step": 265549, "epoch": 1580} {"train_loss": -11.389867782592773, "global_step": 265550, "epoch": 1580} {"train_loss": -11.753619194030762, "global_step": 265551, "epoch": 1580} {"train_loss": -11.5762357711792, "global_step": 265552, "epoch": 1580} {"train_loss": -11.824596405029297, "global_step": 265553, "epoch": 1580} {"train_loss": -11.831741333007812, "global_step": 265554, "epoch": 1580} {"train_loss": -11.88225269317627, "global_step": 265555, "epoch": 1580} {"train_loss": -11.977810859680176, "global_step": 265556, "epoch": 1580} {"train_loss": -11.819345474243164, "global_step": 265557, "epoch": 1580} {"train_loss": -12.080575942993164, "global_step": 265558, "epoch": 1580} {"train_loss": -11.98076343536377, "global_step": 265559, "epoch": 1580} {"train_loss": -12.12387466430664, "global_step": 265560, "epoch": 1580} {"train_loss": -11.898648262023926, "global_step": 265561, "epoch": 1580} {"train_loss": -12.21573257446289, "global_step": 265562, "epoch": 1580} {"train_loss": -12.15005874633789, "global_step": 265563, "epoch": 1580} {"train_loss": -12.192899703979492, "global_step": 265564, "epoch": 1580} {"train_loss": -12.06167221069336, "global_step": 265565, "epoch": 1580} {"train_loss": -11.87169361114502, "global_step": 265566, "epoch": 1580} {"train_loss": -12.256661415100098, "global_step": 265567, "epoch": 1580} {"train_loss": -12.368074417114258, "global_step": 265568, "epoch": 1580} {"train_loss": -12.112710952758789, "global_step": 265569, "epoch": 1580} {"train_loss": -12.048310279846191, "global_step": 265570, "epoch": 1580} {"train_loss": -12.09177017211914, "global_step": 265571, "epoch": 1580} {"train_loss": -12.222469329833984, "global_step": 265572, "epoch": 1580} {"train_loss": -12.064044952392578, "global_step": 265573, "epoch": 1580} {"train_loss": -12.132532119750977, "global_step": 265574, "epoch": 1580} {"train_loss": -12.13212776184082, "global_step": 265575, "epoch": 1580} {"train_loss": -12.18492317199707, "global_step": 265576, "epoch": 1580} {"train_loss": -12.152023315429688, "global_step": 265577, "epoch": 1580} {"train_loss": -12.178755760192871, "global_step": 265578, "epoch": 1580} {"train_loss": -11.832027435302734, "global_step": 265579, "epoch": 1580} {"train_loss": -12.167899131774902, "global_step": 265580, "epoch": 1580} {"train_loss": -11.966880798339844, "global_step": 265581, "epoch": 1580} {"train_loss": -12.097823143005371, "global_step": 265582, "epoch": 1580} {"train_loss": -12.224628448486328, "global_step": 265583, "epoch": 1580} {"train_loss": -11.788543701171875, "global_step": 265584, "epoch": 1580} {"train_loss": -12.018898010253906, "global_step": 265585, "epoch": 1580} {"train_loss": -11.90623664855957, "global_step": 265586, "epoch": 1580} {"train_loss": -12.006052017211914, "global_step": 265587, "epoch": 1580} {"train_loss": -11.926876068115234, "global_step": 265588, "epoch": 1580} {"train_loss": -11.876384735107422, "global_step": 265589, "epoch": 1580} {"train_loss": -12.185437202453613, "global_step": 265590, "epoch": 1580} {"train_loss": -12.021421432495117, "global_step": 265591, "epoch": 1580} {"train_loss": -11.913494110107422, "global_step": 265592, "epoch": 1580} {"train_loss": -11.429880142211914, "global_step": 265593, "epoch": 1580} {"train_loss": -12.158637046813965, "global_step": 265594, "epoch": 1580} {"train_loss": -11.856857299804688, "global_step": 265595, "epoch": 1580} {"train_loss": -12.325387954711914, "global_step": 265596, "epoch": 1580} {"train_loss": -11.644721031188965, "global_step": 265597, "epoch": 1580} {"train_loss": -11.85964298248291, "global_step": 265598, "epoch": 1580} {"train_loss": -11.36669921875, "global_step": 265599, "epoch": 1580} {"train_loss": -10.796064376831055, "global_step": 265600, "epoch": 1580} {"train_loss": -11.43960189819336, "global_step": 265601, "epoch": 1580} {"train_loss": -11.271150588989258, "global_step": 265602, "epoch": 1580} {"train_loss": -10.915848731994629, "global_step": 265603, "epoch": 1580} {"train_loss": -11.327493667602539, "global_step": 265604, "epoch": 1580} {"train_loss": -10.349764823913574, "global_step": 265605, "epoch": 1580} {"train_loss": -11.147299766540527, "global_step": 265606, "epoch": 1580} {"train_loss": -11.695663253466288, "global_step": 265607, "epoch": 1580, "val_loss": 269099.0625, "train_action_mse_error": 1.0860003232955933} {"train_loss": -11.517592430114746, "global_step": 265608, "epoch": 1581} {"train_loss": -10.634207725524902, "global_step": 265609, "epoch": 1581} {"train_loss": -10.532212257385254, "global_step": 265610, "epoch": 1581} {"train_loss": -11.829973220825195, "global_step": 265611, "epoch": 1581} {"train_loss": -10.839933395385742, "global_step": 265612, "epoch": 1581} {"train_loss": -10.332134246826172, "global_step": 265613, "epoch": 1581} {"train_loss": -10.91323471069336, "global_step": 265614, "epoch": 1581} {"train_loss": -8.577093124389648, "global_step": 265615, "epoch": 1581} {"train_loss": -9.605697631835938, "global_step": 265616, "epoch": 1581} {"train_loss": -9.928251266479492, "global_step": 265617, "epoch": 1581} {"train_loss": -10.159953117370605, "global_step": 265618, "epoch": 1581} {"train_loss": -10.037494659423828, "global_step": 265619, "epoch": 1581} {"train_loss": -11.682453155517578, "global_step": 265620, "epoch": 1581} {"train_loss": -10.71425724029541, "global_step": 265621, "epoch": 1581} {"train_loss": -11.03604507446289, "global_step": 265622, "epoch": 1581} {"train_loss": -10.90606689453125, "global_step": 265623, "epoch": 1581} {"train_loss": -10.527581214904785, "global_step": 265624, "epoch": 1581} {"train_loss": -11.542967796325684, "global_step": 265625, "epoch": 1581} {"train_loss": -10.675086975097656, "global_step": 265626, "epoch": 1581} {"train_loss": -11.567522048950195, "global_step": 265627, "epoch": 1581} {"train_loss": -11.089942932128906, "global_step": 265628, "epoch": 1581} {"train_loss": -11.565771102905273, "global_step": 265629, "epoch": 1581} {"train_loss": -11.423564910888672, "global_step": 265630, "epoch": 1581} {"train_loss": -11.76221752166748, "global_step": 265631, "epoch": 1581} {"train_loss": -11.674676895141602, "global_step": 265632, "epoch": 1581} {"train_loss": -11.745254516601562, "global_step": 265633, "epoch": 1581} {"train_loss": -11.741453170776367, "global_step": 265634, "epoch": 1581} {"train_loss": -11.831137657165527, "global_step": 265635, "epoch": 1581} {"train_loss": -11.870187759399414, "global_step": 265636, "epoch": 1581} {"train_loss": -11.856325149536133, "global_step": 265637, "epoch": 1581} {"train_loss": -11.848381042480469, "global_step": 265638, "epoch": 1581} {"train_loss": -11.84604263305664, "global_step": 265639, "epoch": 1581} {"train_loss": -11.826736450195312, "global_step": 265640, "epoch": 1581} {"train_loss": -11.869327545166016, "global_step": 265641, "epoch": 1581} {"train_loss": -11.926717758178711, "global_step": 265642, "epoch": 1581} {"train_loss": -11.984256744384766, "global_step": 265643, "epoch": 1581} {"train_loss": -11.735780715942383, "global_step": 265644, "epoch": 1581} {"train_loss": -12.06472110748291, "global_step": 265645, "epoch": 1581} {"train_loss": -11.751286506652832, "global_step": 265646, "epoch": 1581} {"train_loss": -11.774465560913086, "global_step": 265647, "epoch": 1581} {"train_loss": -11.907106399536133, "global_step": 265648, "epoch": 1581} {"train_loss": -11.977148056030273, "global_step": 265649, "epoch": 1581} {"train_loss": -11.914356231689453, "global_step": 265650, "epoch": 1581} {"train_loss": -11.807760238647461, "global_step": 265651, "epoch": 1581} {"train_loss": -12.085713386535645, "global_step": 265652, "epoch": 1581} {"train_loss": -11.809163093566895, "global_step": 265653, "epoch": 1581} {"train_loss": -12.086042404174805, "global_step": 265654, "epoch": 1581} {"train_loss": -12.03033447265625, "global_step": 265655, "epoch": 1581} {"train_loss": -12.044965744018555, "global_step": 265656, "epoch": 1581} {"train_loss": -12.045247077941895, "global_step": 265657, "epoch": 1581} {"train_loss": -12.052371978759766, "global_step": 265658, "epoch": 1581} {"train_loss": -12.021961212158203, "global_step": 265659, "epoch": 1581} {"train_loss": -11.858336448669434, "global_step": 265660, "epoch": 1581} {"train_loss": -12.032598495483398, "global_step": 265661, "epoch": 1581} {"train_loss": -12.037923812866211, "global_step": 265662, "epoch": 1581} {"train_loss": -11.826162338256836, "global_step": 265663, "epoch": 1581} {"train_loss": -11.98348617553711, "global_step": 265664, "epoch": 1581} {"train_loss": -11.939080238342285, "global_step": 265665, "epoch": 1581} {"train_loss": -11.892383575439453, "global_step": 265666, "epoch": 1581} {"train_loss": -12.081552505493164, "global_step": 265667, "epoch": 1581} {"train_loss": -11.820075035095215, "global_step": 265668, "epoch": 1581} {"train_loss": -11.645090103149414, "global_step": 265669, "epoch": 1581} {"train_loss": -12.156033515930176, "global_step": 265670, "epoch": 1581} {"train_loss": -11.870824813842773, "global_step": 265671, "epoch": 1581} {"train_loss": -11.959622383117676, "global_step": 265672, "epoch": 1581} {"train_loss": -12.033525466918945, "global_step": 265673, "epoch": 1581} {"train_loss": -12.142409324645996, "global_step": 265674, "epoch": 1581} {"train_loss": -12.209221839904785, "global_step": 265675, "epoch": 1581} {"train_loss": -11.940008163452148, "global_step": 265676, "epoch": 1581} {"train_loss": -12.065465927124023, "global_step": 265677, "epoch": 1581} {"train_loss": -11.93325424194336, "global_step": 265678, "epoch": 1581} {"train_loss": -12.114151954650879, "global_step": 265679, "epoch": 1581} {"train_loss": -12.182727813720703, "global_step": 265680, "epoch": 1581} {"train_loss": -11.92605209350586, "global_step": 265681, "epoch": 1581} {"train_loss": -11.815863609313965, "global_step": 265682, "epoch": 1581} {"train_loss": -12.096611022949219, "global_step": 265683, "epoch": 1581} {"train_loss": -12.22514533996582, "global_step": 265684, "epoch": 1581} {"train_loss": -11.938543319702148, "global_step": 265685, "epoch": 1581} {"train_loss": -12.207260131835938, "global_step": 265686, "epoch": 1581} {"train_loss": -12.096763610839844, "global_step": 265687, "epoch": 1581} {"train_loss": -12.224184036254883, "global_step": 265688, "epoch": 1581} {"train_loss": -12.1481294631958, "global_step": 265689, "epoch": 1581} {"train_loss": -11.959311485290527, "global_step": 265690, "epoch": 1581} {"train_loss": -11.880904197692871, "global_step": 265691, "epoch": 1581} {"train_loss": -12.090449333190918, "global_step": 265692, "epoch": 1581} {"train_loss": -12.139055252075195, "global_step": 265693, "epoch": 1581} {"train_loss": -12.324108123779297, "global_step": 265694, "epoch": 1581} {"train_loss": -12.125288009643555, "global_step": 265695, "epoch": 1581} {"train_loss": -11.922913551330566, "global_step": 265696, "epoch": 1581} {"train_loss": -11.99593448638916, "global_step": 265697, "epoch": 1581} {"train_loss": -12.074382781982422, "global_step": 265698, "epoch": 1581} {"train_loss": -11.89689826965332, "global_step": 265699, "epoch": 1581} {"train_loss": -11.912994384765625, "global_step": 265700, "epoch": 1581} {"train_loss": -11.221874237060547, "global_step": 265701, "epoch": 1581} {"train_loss": -11.324912071228027, "global_step": 265702, "epoch": 1581} {"train_loss": -11.70412826538086, "global_step": 265703, "epoch": 1581} {"train_loss": -12.0181884765625, "global_step": 265704, "epoch": 1581} {"train_loss": -10.777134895324707, "global_step": 265705, "epoch": 1581} {"train_loss": -11.190553665161133, "global_step": 265706, "epoch": 1581} {"train_loss": -11.823871612548828, "global_step": 265707, "epoch": 1581} {"train_loss": -11.209676742553711, "global_step": 265708, "epoch": 1581} {"train_loss": -9.810991287231445, "global_step": 265709, "epoch": 1581} {"train_loss": -10.644977569580078, "global_step": 265710, "epoch": 1581} {"train_loss": -11.469259262084961, "global_step": 265711, "epoch": 1581} {"train_loss": -11.212230682373047, "global_step": 265712, "epoch": 1581} {"train_loss": -10.555691719055176, "global_step": 265713, "epoch": 1581} {"train_loss": -10.973026275634766, "global_step": 265714, "epoch": 1581} {"train_loss": -11.392727851867676, "global_step": 265715, "epoch": 1581} {"train_loss": -11.007505416870117, "global_step": 265716, "epoch": 1581} {"train_loss": -10.507274627685547, "global_step": 265717, "epoch": 1581} {"train_loss": -11.681642532348633, "global_step": 265718, "epoch": 1581} {"train_loss": -10.604859352111816, "global_step": 265719, "epoch": 1581} {"train_loss": -11.40692138671875, "global_step": 265720, "epoch": 1581} {"train_loss": -11.35558795928955, "global_step": 265721, "epoch": 1581} {"train_loss": -10.939595222473145, "global_step": 265722, "epoch": 1581} {"train_loss": -11.32741928100586, "global_step": 265723, "epoch": 1581} {"train_loss": -11.686081886291504, "global_step": 265724, "epoch": 1581} {"train_loss": -11.144725799560547, "global_step": 265725, "epoch": 1581} {"train_loss": -11.589508056640625, "global_step": 265726, "epoch": 1581} {"train_loss": -11.730489730834961, "global_step": 265727, "epoch": 1581} {"train_loss": -11.546725273132324, "global_step": 265728, "epoch": 1581} {"train_loss": -11.565536499023438, "global_step": 265729, "epoch": 1581} {"train_loss": -11.301153182983398, "global_step": 265730, "epoch": 1581} {"train_loss": -11.967414855957031, "global_step": 265731, "epoch": 1581} {"train_loss": -11.511712074279785, "global_step": 265732, "epoch": 1581} {"train_loss": -11.729933738708496, "global_step": 265733, "epoch": 1581} {"train_loss": -11.579557418823242, "global_step": 265734, "epoch": 1581} {"train_loss": -11.510623931884766, "global_step": 265735, "epoch": 1581} {"train_loss": -11.609233856201172, "global_step": 265736, "epoch": 1581} {"train_loss": -11.760315895080566, "global_step": 265737, "epoch": 1581} {"train_loss": -11.352890014648438, "global_step": 265738, "epoch": 1581} {"train_loss": -11.672334671020508, "global_step": 265739, "epoch": 1581} {"train_loss": -11.749062538146973, "global_step": 265740, "epoch": 1581} {"train_loss": -11.270530700683594, "global_step": 265741, "epoch": 1581} {"train_loss": -11.575494766235352, "global_step": 265742, "epoch": 1581} {"train_loss": -11.634597778320312, "global_step": 265743, "epoch": 1581} {"train_loss": -11.749459266662598, "global_step": 265744, "epoch": 1581} {"train_loss": -11.284646987915039, "global_step": 265745, "epoch": 1581} {"train_loss": -11.567144393920898, "global_step": 265746, "epoch": 1581} {"train_loss": -11.57498550415039, "global_step": 265747, "epoch": 1581} {"train_loss": -12.022140502929688, "global_step": 265748, "epoch": 1581} {"train_loss": -11.634364128112793, "global_step": 265749, "epoch": 1581} {"train_loss": -11.712236404418945, "global_step": 265750, "epoch": 1581} {"train_loss": -12.023639678955078, "global_step": 265751, "epoch": 1581} {"train_loss": -11.62654972076416, "global_step": 265752, "epoch": 1581} {"train_loss": -12.179045677185059, "global_step": 265753, "epoch": 1581} {"train_loss": -11.615389823913574, "global_step": 265754, "epoch": 1581} {"train_loss": -11.920202255249023, "global_step": 265755, "epoch": 1581} {"train_loss": -11.897233963012695, "global_step": 265756, "epoch": 1581} {"train_loss": -11.893592834472656, "global_step": 265757, "epoch": 1581} {"train_loss": -12.018701553344727, "global_step": 265758, "epoch": 1581} {"train_loss": -12.13414192199707, "global_step": 265759, "epoch": 1581} {"train_loss": -12.005062103271484, "global_step": 265760, "epoch": 1581} {"train_loss": -12.17757797241211, "global_step": 265761, "epoch": 1581} {"train_loss": -11.995864868164062, "global_step": 265762, "epoch": 1581} {"train_loss": -12.181583404541016, "global_step": 265763, "epoch": 1581} {"train_loss": -12.135453224182129, "global_step": 265764, "epoch": 1581} {"train_loss": -11.87939739227295, "global_step": 265765, "epoch": 1581} {"train_loss": -11.974773406982422, "global_step": 265766, "epoch": 1581} {"train_loss": -12.139066696166992, "global_step": 265767, "epoch": 1581} {"train_loss": -11.836307525634766, "global_step": 265768, "epoch": 1581} {"train_loss": -11.950722694396973, "global_step": 265769, "epoch": 1581} {"train_loss": -11.854475021362305, "global_step": 265770, "epoch": 1581} {"train_loss": -11.579988479614258, "global_step": 265771, "epoch": 1581} {"train_loss": -12.25710678100586, "global_step": 265772, "epoch": 1581} {"train_loss": -11.996313095092773, "global_step": 265773, "epoch": 1581} {"train_loss": -12.112728118896484, "global_step": 265774, "epoch": 1581} {"train_loss": -11.630603580247788, "global_step": 265775, "epoch": 1581, "val_loss": 271127.59375} {"train_loss": -11.888254165649414, "global_step": 265776, "epoch": 1582} {"train_loss": -12.048467636108398, "global_step": 265777, "epoch": 1582} {"train_loss": -12.032529830932617, "global_step": 265778, "epoch": 1582} {"train_loss": -12.163846969604492, "global_step": 265779, "epoch": 1582} {"train_loss": -12.144580841064453, "global_step": 265780, "epoch": 1582} {"train_loss": -12.355522155761719, "global_step": 265781, "epoch": 1582} {"train_loss": -12.21090316772461, "global_step": 265782, "epoch": 1582} {"train_loss": -12.275640487670898, "global_step": 265783, "epoch": 1582} {"train_loss": -12.139493942260742, "global_step": 265784, "epoch": 1582} {"train_loss": -11.879518508911133, "global_step": 265785, "epoch": 1582} {"train_loss": -12.281664848327637, "global_step": 265786, "epoch": 1582} {"train_loss": -12.31208324432373, "global_step": 265787, "epoch": 1582} {"train_loss": -11.879222869873047, "global_step": 265788, "epoch": 1582} {"train_loss": -12.065620422363281, "global_step": 265789, "epoch": 1582} {"train_loss": -12.428123474121094, "global_step": 265790, "epoch": 1582} {"train_loss": -12.207099914550781, "global_step": 265791, "epoch": 1582} {"train_loss": -12.171843528747559, "global_step": 265792, "epoch": 1582} {"train_loss": -12.162169456481934, "global_step": 265793, "epoch": 1582} {"train_loss": -12.251269340515137, "global_step": 265794, "epoch": 1582} {"train_loss": -12.200433731079102, "global_step": 265795, "epoch": 1582} {"train_loss": -12.186293601989746, "global_step": 265796, "epoch": 1582} {"train_loss": -11.941964149475098, "global_step": 265797, "epoch": 1582} {"train_loss": -12.235424041748047, "global_step": 265798, "epoch": 1582} {"train_loss": -12.167939186096191, "global_step": 265799, "epoch": 1582} {"train_loss": -11.867131233215332, "global_step": 265800, "epoch": 1582} {"train_loss": -11.800223350524902, "global_step": 265801, "epoch": 1582} {"train_loss": -12.279726028442383, "global_step": 265802, "epoch": 1582} {"train_loss": -11.544824600219727, "global_step": 265803, "epoch": 1582} {"train_loss": -12.247824668884277, "global_step": 265804, "epoch": 1582} {"train_loss": -12.014528274536133, "global_step": 265805, "epoch": 1582} {"train_loss": -11.717859268188477, "global_step": 265806, "epoch": 1582} {"train_loss": -11.205194473266602, "global_step": 265807, "epoch": 1582} {"train_loss": -12.109973907470703, "global_step": 265808, "epoch": 1582} {"train_loss": -11.730600357055664, "global_step": 265809, "epoch": 1582} {"train_loss": -11.307083129882812, "global_step": 265810, "epoch": 1582} {"train_loss": -12.0001220703125, "global_step": 265811, "epoch": 1582} {"train_loss": -11.932523727416992, "global_step": 265812, "epoch": 1582} {"train_loss": -11.893693923950195, "global_step": 265813, "epoch": 1582} {"train_loss": -12.022761344909668, "global_step": 265814, "epoch": 1582} {"train_loss": -11.850342750549316, "global_step": 265815, "epoch": 1582} {"train_loss": -11.720100402832031, "global_step": 265816, "epoch": 1582} {"train_loss": -11.578535079956055, "global_step": 265817, "epoch": 1582} {"train_loss": -11.921361923217773, "global_step": 265818, "epoch": 1582} {"train_loss": -11.391345977783203, "global_step": 265819, "epoch": 1582} {"train_loss": -11.66007137298584, "global_step": 265820, "epoch": 1582} {"train_loss": -11.8642578125, "global_step": 265821, "epoch": 1582} {"train_loss": -11.469841957092285, "global_step": 265822, "epoch": 1582} {"train_loss": -11.871214866638184, "global_step": 265823, "epoch": 1582} {"train_loss": -10.394140243530273, "global_step": 265824, "epoch": 1582} {"train_loss": -11.167215347290039, "global_step": 265825, "epoch": 1582} {"train_loss": -11.740861892700195, "global_step": 265826, "epoch": 1582} {"train_loss": -11.359716415405273, "global_step": 265827, "epoch": 1582} {"train_loss": -10.512371063232422, "global_step": 265828, "epoch": 1582} {"train_loss": -10.090727806091309, "global_step": 265829, "epoch": 1582} {"train_loss": -10.214719772338867, "global_step": 265830, "epoch": 1582} {"train_loss": -10.805981636047363, "global_step": 265831, "epoch": 1582} {"train_loss": -10.913297653198242, "global_step": 265832, "epoch": 1582} {"train_loss": -10.820625305175781, "global_step": 265833, "epoch": 1582} {"train_loss": -11.196937561035156, "global_step": 265834, "epoch": 1582} {"train_loss": -11.605642318725586, "global_step": 265835, "epoch": 1582} {"train_loss": -11.453781127929688, "global_step": 265836, "epoch": 1582} {"train_loss": -11.610322952270508, "global_step": 265837, "epoch": 1582} {"train_loss": -11.789417266845703, "global_step": 265838, "epoch": 1582} {"train_loss": -11.971807479858398, "global_step": 265839, "epoch": 1582} {"train_loss": -11.598684310913086, "global_step": 265840, "epoch": 1582} {"train_loss": -11.939064025878906, "global_step": 265841, "epoch": 1582} {"train_loss": -11.466266632080078, "global_step": 265842, "epoch": 1582} {"train_loss": -11.936408042907715, "global_step": 265843, "epoch": 1582} {"train_loss": -11.718606948852539, "global_step": 265844, "epoch": 1582} {"train_loss": -11.657657623291016, "global_step": 265845, "epoch": 1582} {"train_loss": -11.654661178588867, "global_step": 265846, "epoch": 1582} {"train_loss": -11.536263465881348, "global_step": 265847, "epoch": 1582} {"train_loss": -11.66827392578125, "global_step": 265848, "epoch": 1582} {"train_loss": -11.715319633483887, "global_step": 265849, "epoch": 1582} {"train_loss": -11.844578742980957, "global_step": 265850, "epoch": 1582} {"train_loss": -12.053491592407227, "global_step": 265851, "epoch": 1582} {"train_loss": -11.651252746582031, "global_step": 265852, "epoch": 1582} {"train_loss": -11.916160583496094, "global_step": 265853, "epoch": 1582} {"train_loss": -11.992690086364746, "global_step": 265854, "epoch": 1582} {"train_loss": -11.41661262512207, "global_step": 265855, "epoch": 1582} {"train_loss": -12.06467056274414, "global_step": 265856, "epoch": 1582} {"train_loss": -11.636974334716797, "global_step": 265857, "epoch": 1582} {"train_loss": -11.644643783569336, "global_step": 265858, "epoch": 1582} {"train_loss": -11.591357231140137, "global_step": 265859, "epoch": 1582} {"train_loss": -11.576469421386719, "global_step": 265860, "epoch": 1582} {"train_loss": -11.977452278137207, "global_step": 265861, "epoch": 1582} {"train_loss": -12.024468421936035, "global_step": 265862, "epoch": 1582} {"train_loss": -11.776786804199219, "global_step": 265863, "epoch": 1582} {"train_loss": -12.139142036437988, "global_step": 265864, "epoch": 1582} {"train_loss": -11.543572425842285, "global_step": 265865, "epoch": 1582} {"train_loss": -12.077911376953125, "global_step": 265866, "epoch": 1582} {"train_loss": -11.91209602355957, "global_step": 265867, "epoch": 1582} {"train_loss": -11.935751914978027, "global_step": 265868, "epoch": 1582} {"train_loss": -11.991410255432129, "global_step": 265869, "epoch": 1582} {"train_loss": -11.81219482421875, "global_step": 265870, "epoch": 1582} {"train_loss": -11.879066467285156, "global_step": 265871, "epoch": 1582} {"train_loss": -12.052392959594727, "global_step": 265872, "epoch": 1582} {"train_loss": -11.47027587890625, "global_step": 265873, "epoch": 1582} {"train_loss": -12.009098052978516, "global_step": 265874, "epoch": 1582} {"train_loss": -11.142868041992188, "global_step": 265875, "epoch": 1582} {"train_loss": -10.318840026855469, "global_step": 265876, "epoch": 1582} {"train_loss": -11.569732666015625, "global_step": 265877, "epoch": 1582} {"train_loss": -10.997466087341309, "global_step": 265878, "epoch": 1582} {"train_loss": -11.282936096191406, "global_step": 265879, "epoch": 1582} {"train_loss": -11.03519058227539, "global_step": 265880, "epoch": 1582} {"train_loss": -11.023513793945312, "global_step": 265881, "epoch": 1582} {"train_loss": -10.918769836425781, "global_step": 265882, "epoch": 1582} {"train_loss": -10.014047622680664, "global_step": 265883, "epoch": 1582} {"train_loss": -11.36742115020752, "global_step": 265884, "epoch": 1582} {"train_loss": -10.860090255737305, "global_step": 265885, "epoch": 1582} {"train_loss": -11.36256217956543, "global_step": 265886, "epoch": 1582} {"train_loss": -11.611244201660156, "global_step": 265887, "epoch": 1582} {"train_loss": -11.312272071838379, "global_step": 265888, "epoch": 1582} {"train_loss": -11.554929733276367, "global_step": 265889, "epoch": 1582} {"train_loss": -11.792966842651367, "global_step": 265890, "epoch": 1582} {"train_loss": -11.696921348571777, "global_step": 265891, "epoch": 1582} {"train_loss": -11.225105285644531, "global_step": 265892, "epoch": 1582} {"train_loss": -11.62391185760498, "global_step": 265893, "epoch": 1582} {"train_loss": -11.67162799835205, "global_step": 265894, "epoch": 1582} {"train_loss": -11.81979751586914, "global_step": 265895, "epoch": 1582} {"train_loss": -11.746829986572266, "global_step": 265896, "epoch": 1582} {"train_loss": -11.63305950164795, "global_step": 265897, "epoch": 1582} {"train_loss": -11.80888557434082, "global_step": 265898, "epoch": 1582} {"train_loss": -11.351144790649414, "global_step": 265899, "epoch": 1582} {"train_loss": -11.943879127502441, "global_step": 265900, "epoch": 1582} {"train_loss": -11.602912902832031, "global_step": 265901, "epoch": 1582} {"train_loss": -11.354133605957031, "global_step": 265902, "epoch": 1582} {"train_loss": -11.564347267150879, "global_step": 265903, "epoch": 1582} {"train_loss": -11.657367706298828, "global_step": 265904, "epoch": 1582} {"train_loss": -11.387300491333008, "global_step": 265905, "epoch": 1582} {"train_loss": -11.269268035888672, "global_step": 265906, "epoch": 1582} {"train_loss": -11.959558486938477, "global_step": 265907, "epoch": 1582} {"train_loss": -11.725223541259766, "global_step": 265908, "epoch": 1582} {"train_loss": -11.654413223266602, "global_step": 265909, "epoch": 1582} {"train_loss": -11.29173469543457, "global_step": 265910, "epoch": 1582} {"train_loss": -11.72746467590332, "global_step": 265911, "epoch": 1582} {"train_loss": -11.712751388549805, "global_step": 265912, "epoch": 1582} {"train_loss": -11.724178314208984, "global_step": 265913, "epoch": 1582} {"train_loss": -11.753040313720703, "global_step": 265914, "epoch": 1582} {"train_loss": -11.637832641601562, "global_step": 265915, "epoch": 1582} {"train_loss": -11.932025909423828, "global_step": 265916, "epoch": 1582} {"train_loss": -11.901073455810547, "global_step": 265917, "epoch": 1582} {"train_loss": -11.801989555358887, "global_step": 265918, "epoch": 1582} {"train_loss": -11.73843765258789, "global_step": 265919, "epoch": 1582} {"train_loss": -11.683858871459961, "global_step": 265920, "epoch": 1582} {"train_loss": -11.90781021118164, "global_step": 265921, "epoch": 1582} {"train_loss": -11.932323455810547, "global_step": 265922, "epoch": 1582} {"train_loss": -11.782808303833008, "global_step": 265923, "epoch": 1582} {"train_loss": -11.963350296020508, "global_step": 265924, "epoch": 1582} {"train_loss": -11.831108093261719, "global_step": 265925, "epoch": 1582} {"train_loss": -12.205098152160645, "global_step": 265926, "epoch": 1582} {"train_loss": -11.888484954833984, "global_step": 265927, "epoch": 1582} {"train_loss": -12.08458137512207, "global_step": 265928, "epoch": 1582} {"train_loss": -12.025090217590332, "global_step": 265929, "epoch": 1582} {"train_loss": -11.882946968078613, "global_step": 265930, "epoch": 1582} {"train_loss": -12.123832702636719, "global_step": 265931, "epoch": 1582} {"train_loss": -11.986580848693848, "global_step": 265932, "epoch": 1582} {"train_loss": -12.30415153503418, "global_step": 265933, "epoch": 1582} {"train_loss": -11.965282440185547, "global_step": 265934, "epoch": 1582} {"train_loss": -11.842385292053223, "global_step": 265935, "epoch": 1582} {"train_loss": -12.173892974853516, "global_step": 265936, "epoch": 1582} {"train_loss": -12.0479097366333, "global_step": 265937, "epoch": 1582} {"train_loss": -11.95792007446289, "global_step": 265938, "epoch": 1582} {"train_loss": -11.937247276306152, "global_step": 265939, "epoch": 1582} {"train_loss": -12.088883399963379, "global_step": 265940, "epoch": 1582} {"train_loss": -11.401089668273926, "global_step": 265941, "epoch": 1582} {"train_loss": -12.072664260864258, "global_step": 265942, "epoch": 1582} {"train_loss": -11.71475564865839, "global_step": 265943, "epoch": 1582, "val_loss": 274013.9375} {"train_loss": -11.87025260925293, "global_step": 265944, "epoch": 1583} {"train_loss": -11.822599411010742, "global_step": 265945, "epoch": 1583} {"train_loss": -11.665133476257324, "global_step": 265946, "epoch": 1583} {"train_loss": -12.114457130432129, "global_step": 265947, "epoch": 1583} {"train_loss": -11.808615684509277, "global_step": 265948, "epoch": 1583} {"train_loss": -12.30543327331543, "global_step": 265949, "epoch": 1583} {"train_loss": -12.175138473510742, "global_step": 265950, "epoch": 1583} {"train_loss": -12.077037811279297, "global_step": 265951, "epoch": 1583} {"train_loss": -12.145149230957031, "global_step": 265952, "epoch": 1583} {"train_loss": -12.183412551879883, "global_step": 265953, "epoch": 1583} {"train_loss": -12.203670501708984, "global_step": 265954, "epoch": 1583} {"train_loss": -12.277700424194336, "global_step": 265955, "epoch": 1583} {"train_loss": -12.28012466430664, "global_step": 265956, "epoch": 1583} {"train_loss": -12.301003456115723, "global_step": 265957, "epoch": 1583} {"train_loss": -12.05648136138916, "global_step": 265958, "epoch": 1583} {"train_loss": -12.265846252441406, "global_step": 265959, "epoch": 1583} {"train_loss": -11.800167083740234, "global_step": 265960, "epoch": 1583} {"train_loss": -12.014582633972168, "global_step": 265961, "epoch": 1583} {"train_loss": -11.58238410949707, "global_step": 265962, "epoch": 1583} {"train_loss": -11.715768814086914, "global_step": 265963, "epoch": 1583} {"train_loss": -11.076562881469727, "global_step": 265964, "epoch": 1583} {"train_loss": -10.953215599060059, "global_step": 265965, "epoch": 1583} {"train_loss": -11.769862174987793, "global_step": 265966, "epoch": 1583} {"train_loss": -10.84570026397705, "global_step": 265967, "epoch": 1583} {"train_loss": -10.100103378295898, "global_step": 265968, "epoch": 1583} {"train_loss": -11.864971160888672, "global_step": 265969, "epoch": 1583} {"train_loss": -11.460508346557617, "global_step": 265970, "epoch": 1583} {"train_loss": -11.294206619262695, "global_step": 265971, "epoch": 1583} {"train_loss": -11.24527645111084, "global_step": 265972, "epoch": 1583} {"train_loss": -11.609286308288574, "global_step": 265973, "epoch": 1583} {"train_loss": -11.353128433227539, "global_step": 265974, "epoch": 1583} {"train_loss": -11.298852920532227, "global_step": 265975, "epoch": 1583} {"train_loss": -11.920502662658691, "global_step": 265976, "epoch": 1583} {"train_loss": -11.216578483581543, "global_step": 265977, "epoch": 1583} {"train_loss": -11.20152473449707, "global_step": 265978, "epoch": 1583} {"train_loss": -11.82608413696289, "global_step": 265979, "epoch": 1583} {"train_loss": -11.178040504455566, "global_step": 265980, "epoch": 1583} {"train_loss": -11.242721557617188, "global_step": 265981, "epoch": 1583} {"train_loss": -11.279775619506836, "global_step": 265982, "epoch": 1583} {"train_loss": -11.292604446411133, "global_step": 265983, "epoch": 1583} {"train_loss": -11.208907127380371, "global_step": 265984, "epoch": 1583} {"train_loss": -11.695746421813965, "global_step": 265985, "epoch": 1583} {"train_loss": -10.215078353881836, "global_step": 265986, "epoch": 1583} {"train_loss": -11.52910327911377, "global_step": 265987, "epoch": 1583} {"train_loss": -8.560189247131348, "global_step": 265988, "epoch": 1583} {"train_loss": -11.736738204956055, "global_step": 265989, "epoch": 1583} {"train_loss": -10.051619529724121, "global_step": 265990, "epoch": 1583} {"train_loss": -11.462135314941406, "global_step": 265991, "epoch": 1583} {"train_loss": -11.046283721923828, "global_step": 265992, "epoch": 1583} {"train_loss": -10.683220863342285, "global_step": 265993, "epoch": 1583} {"train_loss": -11.075139999389648, "global_step": 265994, "epoch": 1583} {"train_loss": -10.848398208618164, "global_step": 265995, "epoch": 1583} {"train_loss": -11.243998527526855, "global_step": 265996, "epoch": 1583} {"train_loss": -11.488430976867676, "global_step": 265997, "epoch": 1583} {"train_loss": -11.052606582641602, "global_step": 265998, "epoch": 1583} {"train_loss": -11.209756851196289, "global_step": 265999, "epoch": 1583} {"train_loss": -11.274763107299805, "global_step": 266000, "epoch": 1583} {"train_loss": -11.516498565673828, "global_step": 266001, "epoch": 1583} {"train_loss": -11.290800094604492, "global_step": 266002, "epoch": 1583} {"train_loss": -11.538396835327148, "global_step": 266003, "epoch": 1583} {"train_loss": -11.38577651977539, "global_step": 266004, "epoch": 1583} {"train_loss": -11.516563415527344, "global_step": 266005, "epoch": 1583} {"train_loss": -11.599275588989258, "global_step": 266006, "epoch": 1583} {"train_loss": -11.128305435180664, "global_step": 266007, "epoch": 1583} {"train_loss": -11.785453796386719, "global_step": 266008, "epoch": 1583} {"train_loss": -11.193592071533203, "global_step": 266009, "epoch": 1583} {"train_loss": -11.662559509277344, "global_step": 266010, "epoch": 1583} {"train_loss": -11.486701965332031, "global_step": 266011, "epoch": 1583} {"train_loss": -11.153602600097656, "global_step": 266012, "epoch": 1583} {"train_loss": -11.745166778564453, "global_step": 266013, "epoch": 1583} {"train_loss": -10.968098640441895, "global_step": 266014, "epoch": 1583} {"train_loss": -11.733530044555664, "global_step": 266015, "epoch": 1583} {"train_loss": -11.257352828979492, "global_step": 266016, "epoch": 1583} {"train_loss": -11.702391624450684, "global_step": 266017, "epoch": 1583} {"train_loss": -11.602028846740723, "global_step": 266018, "epoch": 1583} {"train_loss": -11.581345558166504, "global_step": 266019, "epoch": 1583} {"train_loss": -11.755603790283203, "global_step": 266020, "epoch": 1583} {"train_loss": -11.331575393676758, "global_step": 266021, "epoch": 1583} {"train_loss": -11.6881685256958, "global_step": 266022, "epoch": 1583} {"train_loss": -11.402273178100586, "global_step": 266023, "epoch": 1583} {"train_loss": -11.174409866333008, "global_step": 266024, "epoch": 1583} {"train_loss": -11.694219589233398, "global_step": 266025, "epoch": 1583} {"train_loss": -11.134439468383789, "global_step": 266026, "epoch": 1583} {"train_loss": -12.039237022399902, "global_step": 266027, "epoch": 1583} {"train_loss": -11.195783615112305, "global_step": 266028, "epoch": 1583} {"train_loss": -11.49519157409668, "global_step": 266029, "epoch": 1583} {"train_loss": -11.436373710632324, "global_step": 266030, "epoch": 1583} {"train_loss": -11.071767807006836, "global_step": 266031, "epoch": 1583} {"train_loss": -12.16282844543457, "global_step": 266032, "epoch": 1583} {"train_loss": -10.588920593261719, "global_step": 266033, "epoch": 1583} {"train_loss": -11.669757843017578, "global_step": 266034, "epoch": 1583} {"train_loss": -11.36882495880127, "global_step": 266035, "epoch": 1583} {"train_loss": -11.65165901184082, "global_step": 266036, "epoch": 1583} {"train_loss": -11.43763542175293, "global_step": 266037, "epoch": 1583} {"train_loss": -11.821843147277832, "global_step": 266038, "epoch": 1583} {"train_loss": -11.229179382324219, "global_step": 266039, "epoch": 1583} {"train_loss": -11.73764419555664, "global_step": 266040, "epoch": 1583} {"train_loss": -11.60919189453125, "global_step": 266041, "epoch": 1583} {"train_loss": -11.56519603729248, "global_step": 266042, "epoch": 1583} {"train_loss": -11.862980842590332, "global_step": 266043, "epoch": 1583} {"train_loss": -11.606180191040039, "global_step": 266044, "epoch": 1583} {"train_loss": -12.029033660888672, "global_step": 266045, "epoch": 1583} {"train_loss": -11.18740463256836, "global_step": 266046, "epoch": 1583} {"train_loss": -11.537243843078613, "global_step": 266047, "epoch": 1583} {"train_loss": -11.85527515411377, "global_step": 266048, "epoch": 1583} {"train_loss": -11.206511497497559, "global_step": 266049, "epoch": 1583} {"train_loss": -11.74872875213623, "global_step": 266050, "epoch": 1583} {"train_loss": -11.726696014404297, "global_step": 266051, "epoch": 1583} {"train_loss": -11.587095260620117, "global_step": 266052, "epoch": 1583} {"train_loss": -11.576668739318848, "global_step": 266053, "epoch": 1583} {"train_loss": -11.630773544311523, "global_step": 266054, "epoch": 1583} {"train_loss": -11.762269020080566, "global_step": 266055, "epoch": 1583} {"train_loss": -11.901334762573242, "global_step": 266056, "epoch": 1583} {"train_loss": -11.74266242980957, "global_step": 266057, "epoch": 1583} {"train_loss": -11.983431816101074, "global_step": 266058, "epoch": 1583} {"train_loss": -11.671802520751953, "global_step": 266059, "epoch": 1583} {"train_loss": -11.951351165771484, "global_step": 266060, "epoch": 1583} {"train_loss": -11.965404510498047, "global_step": 266061, "epoch": 1583} {"train_loss": -12.024604797363281, "global_step": 266062, "epoch": 1583} {"train_loss": -12.056365013122559, "global_step": 266063, "epoch": 1583} {"train_loss": -11.851273536682129, "global_step": 266064, "epoch": 1583} {"train_loss": -11.954496383666992, "global_step": 266065, "epoch": 1583} {"train_loss": -11.811673164367676, "global_step": 266066, "epoch": 1583} {"train_loss": -11.756770133972168, "global_step": 266067, "epoch": 1583} {"train_loss": -12.062954902648926, "global_step": 266068, "epoch": 1583} {"train_loss": -11.637458801269531, "global_step": 266069, "epoch": 1583} {"train_loss": -12.070536613464355, "global_step": 266070, "epoch": 1583} {"train_loss": -11.817606925964355, "global_step": 266071, "epoch": 1583} {"train_loss": -11.8969087600708, "global_step": 266072, "epoch": 1583} {"train_loss": -12.018804550170898, "global_step": 266073, "epoch": 1583} {"train_loss": -12.046037673950195, "global_step": 266074, "epoch": 1583} {"train_loss": -11.955953598022461, "global_step": 266075, "epoch": 1583} {"train_loss": -12.01472282409668, "global_step": 266076, "epoch": 1583} {"train_loss": -11.937711715698242, "global_step": 266077, "epoch": 1583} {"train_loss": -12.261197090148926, "global_step": 266078, "epoch": 1583} {"train_loss": -11.950746536254883, "global_step": 266079, "epoch": 1583} {"train_loss": -12.251022338867188, "global_step": 266080, "epoch": 1583} {"train_loss": -12.147947311401367, "global_step": 266081, "epoch": 1583} {"train_loss": -11.908707618713379, "global_step": 266082, "epoch": 1583} {"train_loss": -12.127573013305664, "global_step": 266083, "epoch": 1583} {"train_loss": -11.961648941040039, "global_step": 266084, "epoch": 1583} {"train_loss": -12.079024314880371, "global_step": 266085, "epoch": 1583} {"train_loss": -12.141743659973145, "global_step": 266086, "epoch": 1583} {"train_loss": -12.109964370727539, "global_step": 266087, "epoch": 1583} {"train_loss": -12.232593536376953, "global_step": 266088, "epoch": 1583} {"train_loss": -12.157674789428711, "global_step": 266089, "epoch": 1583} {"train_loss": -12.211577415466309, "global_step": 266090, "epoch": 1583} {"train_loss": -12.151832580566406, "global_step": 266091, "epoch": 1583} {"train_loss": -12.29574966430664, "global_step": 266092, "epoch": 1583} {"train_loss": -11.97266960144043, "global_step": 266093, "epoch": 1583} {"train_loss": -12.249269485473633, "global_step": 266094, "epoch": 1583} {"train_loss": -12.142704010009766, "global_step": 266095, "epoch": 1583} {"train_loss": -11.956165313720703, "global_step": 266096, "epoch": 1583} {"train_loss": -11.962993621826172, "global_step": 266097, "epoch": 1583} {"train_loss": -12.011001586914062, "global_step": 266098, "epoch": 1583} {"train_loss": -11.447906494140625, "global_step": 266099, "epoch": 1583} {"train_loss": -11.795463562011719, "global_step": 266100, "epoch": 1583} {"train_loss": -12.188680648803711, "global_step": 266101, "epoch": 1583} {"train_loss": -11.82634449005127, "global_step": 266102, "epoch": 1583} {"train_loss": -12.2589111328125, "global_step": 266103, "epoch": 1583} {"train_loss": -12.14441967010498, "global_step": 266104, "epoch": 1583} {"train_loss": -11.962150573730469, "global_step": 266105, "epoch": 1583} {"train_loss": -12.029460906982422, "global_step": 266106, "epoch": 1583} {"train_loss": -12.258243560791016, "global_step": 266107, "epoch": 1583} {"train_loss": -12.19954776763916, "global_step": 266108, "epoch": 1583} {"train_loss": -12.198817253112793, "global_step": 266109, "epoch": 1583} {"train_loss": -12.228594779968262, "global_step": 266110, "epoch": 1583} {"train_loss": -11.664532054038276, "global_step": 266111, "epoch": 1583, "val_loss": 271671.15625} {"train_loss": -12.144699096679688, "global_step": 266112, "epoch": 1584} {"train_loss": -11.409069061279297, "global_step": 266113, "epoch": 1584} {"train_loss": -11.441900253295898, "global_step": 266114, "epoch": 1584} {"train_loss": -12.095317840576172, "global_step": 266115, "epoch": 1584} {"train_loss": -11.932207107543945, "global_step": 266116, "epoch": 1584} {"train_loss": -11.829222679138184, "global_step": 266117, "epoch": 1584} {"train_loss": -11.934159278869629, "global_step": 266118, "epoch": 1584} {"train_loss": -11.98748779296875, "global_step": 266119, "epoch": 1584} {"train_loss": -11.928462982177734, "global_step": 266120, "epoch": 1584} {"train_loss": -12.097949981689453, "global_step": 266121, "epoch": 1584} {"train_loss": -12.051298141479492, "global_step": 266122, "epoch": 1584} {"train_loss": -12.335649490356445, "global_step": 266123, "epoch": 1584} {"train_loss": -11.750443458557129, "global_step": 266124, "epoch": 1584} {"train_loss": -11.696671485900879, "global_step": 266125, "epoch": 1584} {"train_loss": -11.91179084777832, "global_step": 266126, "epoch": 1584} {"train_loss": -11.130086898803711, "global_step": 266127, "epoch": 1584} {"train_loss": -10.962322235107422, "global_step": 266128, "epoch": 1584} {"train_loss": -11.848682403564453, "global_step": 266129, "epoch": 1584} {"train_loss": -11.575540542602539, "global_step": 266130, "epoch": 1584} {"train_loss": -10.887341499328613, "global_step": 266131, "epoch": 1584} {"train_loss": -11.51283073425293, "global_step": 266132, "epoch": 1584} {"train_loss": -11.783303260803223, "global_step": 266133, "epoch": 1584} {"train_loss": -11.386922836303711, "global_step": 266134, "epoch": 1584} {"train_loss": -11.755783081054688, "global_step": 266135, "epoch": 1584} {"train_loss": -11.423517227172852, "global_step": 266136, "epoch": 1584} {"train_loss": -10.962570190429688, "global_step": 266137, "epoch": 1584} {"train_loss": -11.795049667358398, "global_step": 266138, "epoch": 1584} {"train_loss": -11.014785766601562, "global_step": 266139, "epoch": 1584} {"train_loss": -10.600476264953613, "global_step": 266140, "epoch": 1584} {"train_loss": -11.767579078674316, "global_step": 266141, "epoch": 1584} {"train_loss": -11.758427619934082, "global_step": 266142, "epoch": 1584} {"train_loss": -10.57359504699707, "global_step": 266143, "epoch": 1584} {"train_loss": -9.835739135742188, "global_step": 266144, "epoch": 1584} {"train_loss": -11.83594036102295, "global_step": 266145, "epoch": 1584} {"train_loss": -9.868895530700684, "global_step": 266146, "epoch": 1584} {"train_loss": -11.366231918334961, "global_step": 266147, "epoch": 1584} {"train_loss": -11.038655281066895, "global_step": 266148, "epoch": 1584} {"train_loss": -11.532258987426758, "global_step": 266149, "epoch": 1584} {"train_loss": -11.063640594482422, "global_step": 266150, "epoch": 1584} {"train_loss": -11.594931602478027, "global_step": 266151, "epoch": 1584} {"train_loss": -11.45185375213623, "global_step": 266152, "epoch": 1584} {"train_loss": -11.328481674194336, "global_step": 266153, "epoch": 1584} {"train_loss": -11.549161911010742, "global_step": 266154, "epoch": 1584} {"train_loss": -11.16111946105957, "global_step": 266155, "epoch": 1584} {"train_loss": -11.361557006835938, "global_step": 266156, "epoch": 1584} {"train_loss": -11.55003547668457, "global_step": 266157, "epoch": 1584} {"train_loss": -11.436180114746094, "global_step": 266158, "epoch": 1584} {"train_loss": -11.379206657409668, "global_step": 266159, "epoch": 1584} {"train_loss": -11.52269172668457, "global_step": 266160, "epoch": 1584} {"train_loss": -11.316859245300293, "global_step": 266161, "epoch": 1584} {"train_loss": -11.366652488708496, "global_step": 266162, "epoch": 1584} {"train_loss": -11.822412490844727, "global_step": 266163, "epoch": 1584} {"train_loss": -11.826639175415039, "global_step": 266164, "epoch": 1584} {"train_loss": -11.799497604370117, "global_step": 266165, "epoch": 1584} {"train_loss": -11.5980224609375, "global_step": 266166, "epoch": 1584} {"train_loss": -11.550301551818848, "global_step": 266167, "epoch": 1584} {"train_loss": -11.551119804382324, "global_step": 266168, "epoch": 1584} {"train_loss": -11.447624206542969, "global_step": 266169, "epoch": 1584} {"train_loss": -12.012247085571289, "global_step": 266170, "epoch": 1584} {"train_loss": -10.71000862121582, "global_step": 266171, "epoch": 1584} {"train_loss": -11.831262588500977, "global_step": 266172, "epoch": 1584} {"train_loss": -11.76626205444336, "global_step": 266173, "epoch": 1584} {"train_loss": -11.741170883178711, "global_step": 266174, "epoch": 1584} {"train_loss": -10.716592788696289, "global_step": 266175, "epoch": 1584} {"train_loss": -11.097063064575195, "global_step": 266176, "epoch": 1584} {"train_loss": -10.956302642822266, "global_step": 266177, "epoch": 1584} {"train_loss": -11.35621452331543, "global_step": 266178, "epoch": 1584} {"train_loss": -11.620075225830078, "global_step": 266179, "epoch": 1584} {"train_loss": -11.478401184082031, "global_step": 266180, "epoch": 1584} {"train_loss": -11.465956687927246, "global_step": 266181, "epoch": 1584} {"train_loss": -11.026561737060547, "global_step": 266182, "epoch": 1584} {"train_loss": -11.028434753417969, "global_step": 266183, "epoch": 1584} {"train_loss": -11.55205249786377, "global_step": 266184, "epoch": 1584} {"train_loss": -11.136972427368164, "global_step": 266185, "epoch": 1584} {"train_loss": -11.093883514404297, "global_step": 266186, "epoch": 1584} {"train_loss": -11.577376365661621, "global_step": 266187, "epoch": 1584} {"train_loss": -11.689067840576172, "global_step": 266188, "epoch": 1584} {"train_loss": -11.871232986450195, "global_step": 266189, "epoch": 1584} {"train_loss": -11.432347297668457, "global_step": 266190, "epoch": 1584} {"train_loss": -11.64594841003418, "global_step": 266191, "epoch": 1584} {"train_loss": -11.897866249084473, "global_step": 266192, "epoch": 1584} {"train_loss": -11.903360366821289, "global_step": 266193, "epoch": 1584} {"train_loss": -11.609207153320312, "global_step": 266194, "epoch": 1584} {"train_loss": -11.682901382446289, "global_step": 266195, "epoch": 1584} {"train_loss": -11.979889869689941, "global_step": 266196, "epoch": 1584} {"train_loss": -11.54207706451416, "global_step": 266197, "epoch": 1584} {"train_loss": -11.889364242553711, "global_step": 266198, "epoch": 1584} {"train_loss": -11.61670207977295, "global_step": 266199, "epoch": 1584} {"train_loss": -11.786214828491211, "global_step": 266200, "epoch": 1584} {"train_loss": -11.832050323486328, "global_step": 266201, "epoch": 1584} {"train_loss": -11.535323143005371, "global_step": 266202, "epoch": 1584} {"train_loss": -11.99242115020752, "global_step": 266203, "epoch": 1584} {"train_loss": -11.790328025817871, "global_step": 266204, "epoch": 1584} {"train_loss": -11.989285469055176, "global_step": 266205, "epoch": 1584} {"train_loss": -11.887286186218262, "global_step": 266206, "epoch": 1584} {"train_loss": -12.07824420928955, "global_step": 266207, "epoch": 1584} {"train_loss": -11.836429595947266, "global_step": 266208, "epoch": 1584} {"train_loss": -11.815380096435547, "global_step": 266209, "epoch": 1584} {"train_loss": -11.972740173339844, "global_step": 266210, "epoch": 1584} {"train_loss": -12.053224563598633, "global_step": 266211, "epoch": 1584} {"train_loss": -11.886592864990234, "global_step": 266212, "epoch": 1584} {"train_loss": -11.778044700622559, "global_step": 266213, "epoch": 1584} {"train_loss": -12.048927307128906, "global_step": 266214, "epoch": 1584} {"train_loss": -11.980844497680664, "global_step": 266215, "epoch": 1584} {"train_loss": -11.854253768920898, "global_step": 266216, "epoch": 1584} {"train_loss": -11.372429847717285, "global_step": 266217, "epoch": 1584} {"train_loss": -11.91394329071045, "global_step": 266218, "epoch": 1584} {"train_loss": -11.959033012390137, "global_step": 266219, "epoch": 1584} {"train_loss": -11.862722396850586, "global_step": 266220, "epoch": 1584} {"train_loss": -11.739761352539062, "global_step": 266221, "epoch": 1584} {"train_loss": -11.610294342041016, "global_step": 266222, "epoch": 1584} {"train_loss": -12.099264144897461, "global_step": 266223, "epoch": 1584} {"train_loss": -11.679530143737793, "global_step": 266224, "epoch": 1584} {"train_loss": -12.076070785522461, "global_step": 266225, "epoch": 1584} {"train_loss": -11.795867919921875, "global_step": 266226, "epoch": 1584} {"train_loss": -11.874517440795898, "global_step": 266227, "epoch": 1584} {"train_loss": -11.725312232971191, "global_step": 266228, "epoch": 1584} {"train_loss": -12.009896278381348, "global_step": 266229, "epoch": 1584} {"train_loss": -12.009525299072266, "global_step": 266230, "epoch": 1584} {"train_loss": -11.792157173156738, "global_step": 266231, "epoch": 1584} {"train_loss": -11.720870971679688, "global_step": 266232, "epoch": 1584} {"train_loss": -12.082550048828125, "global_step": 266233, "epoch": 1584} {"train_loss": -12.128686904907227, "global_step": 266234, "epoch": 1584} {"train_loss": -12.01152515411377, "global_step": 266235, "epoch": 1584} {"train_loss": -11.97900390625, "global_step": 266236, "epoch": 1584} {"train_loss": -12.196371078491211, "global_step": 266237, "epoch": 1584} {"train_loss": -11.827574729919434, "global_step": 266238, "epoch": 1584} {"train_loss": -11.850668907165527, "global_step": 266239, "epoch": 1584} {"train_loss": -11.895628929138184, "global_step": 266240, "epoch": 1584} {"train_loss": -12.033706665039062, "global_step": 266241, "epoch": 1584} {"train_loss": -11.94878101348877, "global_step": 266242, "epoch": 1584} {"train_loss": -12.180593490600586, "global_step": 266243, "epoch": 1584} {"train_loss": -11.666366577148438, "global_step": 266244, "epoch": 1584} {"train_loss": -11.97535514831543, "global_step": 266245, "epoch": 1584} {"train_loss": -11.827446937561035, "global_step": 266246, "epoch": 1584} {"train_loss": -11.670112609863281, "global_step": 266247, "epoch": 1584} {"train_loss": -11.643349647521973, "global_step": 266248, "epoch": 1584} {"train_loss": -12.107760429382324, "global_step": 266249, "epoch": 1584} {"train_loss": -11.669734954833984, "global_step": 266250, "epoch": 1584} {"train_loss": -12.111175537109375, "global_step": 266251, "epoch": 1584} {"train_loss": -11.607220649719238, "global_step": 266252, "epoch": 1584} {"train_loss": -11.891952514648438, "global_step": 266253, "epoch": 1584} {"train_loss": -11.761682510375977, "global_step": 266254, "epoch": 1584} {"train_loss": -11.951690673828125, "global_step": 266255, "epoch": 1584} {"train_loss": -12.06175422668457, "global_step": 266256, "epoch": 1584} {"train_loss": -11.358501434326172, "global_step": 266257, "epoch": 1584} {"train_loss": -11.227818489074707, "global_step": 266258, "epoch": 1584} {"train_loss": -11.342536926269531, "global_step": 266259, "epoch": 1584} {"train_loss": -11.709087371826172, "global_step": 266260, "epoch": 1584} {"train_loss": -11.862554550170898, "global_step": 266261, "epoch": 1584} {"train_loss": -10.709467887878418, "global_step": 266262, "epoch": 1584} {"train_loss": -10.99588394165039, "global_step": 266263, "epoch": 1584} {"train_loss": -10.392019271850586, "global_step": 266264, "epoch": 1584} {"train_loss": -11.777917861938477, "global_step": 266265, "epoch": 1584} {"train_loss": -11.187137603759766, "global_step": 266266, "epoch": 1584} {"train_loss": -11.626031875610352, "global_step": 266267, "epoch": 1584} {"train_loss": -11.679939270019531, "global_step": 266268, "epoch": 1584} {"train_loss": -11.762088775634766, "global_step": 266269, "epoch": 1584} {"train_loss": -11.654853820800781, "global_step": 266270, "epoch": 1584} {"train_loss": -11.934087753295898, "global_step": 266271, "epoch": 1584} {"train_loss": -11.29723072052002, "global_step": 266272, "epoch": 1584} {"train_loss": -11.956238746643066, "global_step": 266273, "epoch": 1584} {"train_loss": -11.508650779724121, "global_step": 266274, "epoch": 1584} {"train_loss": -11.560834884643555, "global_step": 266275, "epoch": 1584} {"train_loss": -11.8973388671875, "global_step": 266276, "epoch": 1584} {"train_loss": -11.1136474609375, "global_step": 266277, "epoch": 1584} {"train_loss": -11.888294219970703, "global_step": 266278, "epoch": 1584} {"train_loss": -11.624364149002801, "global_step": 266279, "epoch": 1584, "val_loss": 273145.8125} {"train_loss": -11.63815975189209, "global_step": 266280, "epoch": 1585} {"train_loss": -11.849631309509277, "global_step": 266281, "epoch": 1585} {"train_loss": -11.889846801757812, "global_step": 266282, "epoch": 1585} {"train_loss": -11.786014556884766, "global_step": 266283, "epoch": 1585} {"train_loss": -11.864824295043945, "global_step": 266284, "epoch": 1585} {"train_loss": -11.345224380493164, "global_step": 266285, "epoch": 1585} {"train_loss": -11.830925941467285, "global_step": 266286, "epoch": 1585} {"train_loss": -11.765607833862305, "global_step": 266287, "epoch": 1585} {"train_loss": -12.1396484375, "global_step": 266288, "epoch": 1585} {"train_loss": -11.807092666625977, "global_step": 266289, "epoch": 1585} {"train_loss": -11.626145362854004, "global_step": 266290, "epoch": 1585} {"train_loss": -11.89961051940918, "global_step": 266291, "epoch": 1585} {"train_loss": -12.161852836608887, "global_step": 266292, "epoch": 1585} {"train_loss": -11.605579376220703, "global_step": 266293, "epoch": 1585} {"train_loss": -11.20130729675293, "global_step": 266294, "epoch": 1585} {"train_loss": -12.093381881713867, "global_step": 266295, "epoch": 1585} {"train_loss": -11.536571502685547, "global_step": 266296, "epoch": 1585} {"train_loss": -11.488357543945312, "global_step": 266297, "epoch": 1585} {"train_loss": -11.150337219238281, "global_step": 266298, "epoch": 1585} {"train_loss": -11.608701705932617, "global_step": 266299, "epoch": 1585} {"train_loss": -11.307655334472656, "global_step": 266300, "epoch": 1585} {"train_loss": -11.062725067138672, "global_step": 266301, "epoch": 1585} {"train_loss": -11.710572242736816, "global_step": 266302, "epoch": 1585} {"train_loss": -10.460434913635254, "global_step": 266303, "epoch": 1585} {"train_loss": -11.565082550048828, "global_step": 266304, "epoch": 1585} {"train_loss": -10.739510536193848, "global_step": 266305, "epoch": 1585} {"train_loss": -11.062255859375, "global_step": 266306, "epoch": 1585} {"train_loss": -11.905594825744629, "global_step": 266307, "epoch": 1585} {"train_loss": -10.639366149902344, "global_step": 266308, "epoch": 1585} {"train_loss": -10.884162902832031, "global_step": 266309, "epoch": 1585} {"train_loss": -11.149681091308594, "global_step": 266310, "epoch": 1585} {"train_loss": -10.204521179199219, "global_step": 266311, "epoch": 1585} {"train_loss": -11.431251525878906, "global_step": 266312, "epoch": 1585} {"train_loss": -10.291155815124512, "global_step": 266313, "epoch": 1585} {"train_loss": -11.2884521484375, "global_step": 266314, "epoch": 1585} {"train_loss": -9.914054870605469, "global_step": 266315, "epoch": 1585} {"train_loss": -10.704330444335938, "global_step": 266316, "epoch": 1585} {"train_loss": -10.745173454284668, "global_step": 266317, "epoch": 1585} {"train_loss": -10.346126556396484, "global_step": 266318, "epoch": 1585} {"train_loss": -10.216485977172852, "global_step": 266319, "epoch": 1585} {"train_loss": -11.159982681274414, "global_step": 266320, "epoch": 1585} {"train_loss": -9.861678123474121, "global_step": 266321, "epoch": 1585} {"train_loss": -10.44647216796875, "global_step": 266322, "epoch": 1585} {"train_loss": -10.579023361206055, "global_step": 266323, "epoch": 1585} {"train_loss": -10.662896156311035, "global_step": 266324, "epoch": 1585} {"train_loss": -10.933201789855957, "global_step": 266325, "epoch": 1585} {"train_loss": -10.88654613494873, "global_step": 266326, "epoch": 1585} {"train_loss": -11.535663604736328, "global_step": 266327, "epoch": 1585} {"train_loss": -11.638945579528809, "global_step": 266328, "epoch": 1585} {"train_loss": -11.580805778503418, "global_step": 266329, "epoch": 1585} {"train_loss": -11.602128028869629, "global_step": 266330, "epoch": 1585} {"train_loss": -11.346467971801758, "global_step": 266331, "epoch": 1585} {"train_loss": -11.518606185913086, "global_step": 266332, "epoch": 1585} {"train_loss": -11.666879653930664, "global_step": 266333, "epoch": 1585} {"train_loss": -11.769402503967285, "global_step": 266334, "epoch": 1585} {"train_loss": -11.409317016601562, "global_step": 266335, "epoch": 1585} {"train_loss": -11.59988784790039, "global_step": 266336, "epoch": 1585} {"train_loss": -11.811929702758789, "global_step": 266337, "epoch": 1585} {"train_loss": -11.674858093261719, "global_step": 266338, "epoch": 1585} {"train_loss": -11.858537673950195, "global_step": 266339, "epoch": 1585} {"train_loss": -11.93048095703125, "global_step": 266340, "epoch": 1585} {"train_loss": -11.943142890930176, "global_step": 266341, "epoch": 1585} {"train_loss": -11.822895050048828, "global_step": 266342, "epoch": 1585} {"train_loss": -11.629901885986328, "global_step": 266343, "epoch": 1585} {"train_loss": -11.759767532348633, "global_step": 266344, "epoch": 1585} {"train_loss": -11.633920669555664, "global_step": 266345, "epoch": 1585} {"train_loss": -11.821168899536133, "global_step": 266346, "epoch": 1585} {"train_loss": -12.066625595092773, "global_step": 266347, "epoch": 1585} {"train_loss": -11.841176986694336, "global_step": 266348, "epoch": 1585} {"train_loss": -11.854987144470215, "global_step": 266349, "epoch": 1585} {"train_loss": -12.10351276397705, "global_step": 266350, "epoch": 1585} {"train_loss": -12.01814079284668, "global_step": 266351, "epoch": 1585} {"train_loss": -12.272035598754883, "global_step": 266352, "epoch": 1585} {"train_loss": -11.832489013671875, "global_step": 266353, "epoch": 1585} {"train_loss": -12.053958892822266, "global_step": 266354, "epoch": 1585} {"train_loss": -11.92373275756836, "global_step": 266355, "epoch": 1585} {"train_loss": -12.037962913513184, "global_step": 266356, "epoch": 1585} {"train_loss": -12.177480697631836, "global_step": 266357, "epoch": 1585} {"train_loss": -12.085269927978516, "global_step": 266358, "epoch": 1585} {"train_loss": -12.21140193939209, "global_step": 266359, "epoch": 1585} {"train_loss": -11.98973274230957, "global_step": 266360, "epoch": 1585} {"train_loss": -12.105908393859863, "global_step": 266361, "epoch": 1585} {"train_loss": -12.183765411376953, "global_step": 266362, "epoch": 1585} {"train_loss": -12.151056289672852, "global_step": 266363, "epoch": 1585} {"train_loss": -12.143444061279297, "global_step": 266364, "epoch": 1585} {"train_loss": -12.155704498291016, "global_step": 266365, "epoch": 1585} {"train_loss": -12.04586124420166, "global_step": 266366, "epoch": 1585} {"train_loss": -12.105525970458984, "global_step": 266367, "epoch": 1585} {"train_loss": -11.921470642089844, "global_step": 266368, "epoch": 1585} {"train_loss": -12.13576889038086, "global_step": 266369, "epoch": 1585} {"train_loss": -11.783842086791992, "global_step": 266370, "epoch": 1585} {"train_loss": -12.201774597167969, "global_step": 266371, "epoch": 1585} {"train_loss": -12.064188003540039, "global_step": 266372, "epoch": 1585} {"train_loss": -11.908056259155273, "global_step": 266373, "epoch": 1585} {"train_loss": -11.813819885253906, "global_step": 266374, "epoch": 1585} {"train_loss": -12.057168006896973, "global_step": 266375, "epoch": 1585} {"train_loss": -12.25333309173584, "global_step": 266376, "epoch": 1585} {"train_loss": -12.201881408691406, "global_step": 266377, "epoch": 1585} {"train_loss": -12.130789756774902, "global_step": 266378, "epoch": 1585} {"train_loss": -12.029428482055664, "global_step": 266379, "epoch": 1585} {"train_loss": -12.208290100097656, "global_step": 266380, "epoch": 1585} {"train_loss": -12.046670913696289, "global_step": 266381, "epoch": 1585} {"train_loss": -12.133469581604004, "global_step": 266382, "epoch": 1585} {"train_loss": -11.81644058227539, "global_step": 266383, "epoch": 1585} {"train_loss": -12.030346870422363, "global_step": 266384, "epoch": 1585} {"train_loss": -11.757527351379395, "global_step": 266385, "epoch": 1585} {"train_loss": -12.121551513671875, "global_step": 266386, "epoch": 1585} {"train_loss": -11.906991958618164, "global_step": 266387, "epoch": 1585} {"train_loss": -11.644457817077637, "global_step": 266388, "epoch": 1585} {"train_loss": -11.715895652770996, "global_step": 266389, "epoch": 1585} {"train_loss": -12.102266311645508, "global_step": 266390, "epoch": 1585} {"train_loss": -11.086864471435547, "global_step": 266391, "epoch": 1585} {"train_loss": -11.579663276672363, "global_step": 266392, "epoch": 1585} {"train_loss": -10.636419296264648, "global_step": 266393, "epoch": 1585} {"train_loss": -11.293066024780273, "global_step": 266394, "epoch": 1585} {"train_loss": -11.763742446899414, "global_step": 266395, "epoch": 1585} {"train_loss": -11.997774124145508, "global_step": 266396, "epoch": 1585} {"train_loss": -11.879866600036621, "global_step": 266397, "epoch": 1585} {"train_loss": -12.118003845214844, "global_step": 266398, "epoch": 1585} {"train_loss": -11.631633758544922, "global_step": 266399, "epoch": 1585} {"train_loss": -11.606002807617188, "global_step": 266400, "epoch": 1585} {"train_loss": -11.305130004882812, "global_step": 266401, "epoch": 1585} {"train_loss": -11.640913009643555, "global_step": 266402, "epoch": 1585} {"train_loss": -11.570063591003418, "global_step": 266403, "epoch": 1585} {"train_loss": -11.711742401123047, "global_step": 266404, "epoch": 1585} {"train_loss": -11.811500549316406, "global_step": 266405, "epoch": 1585} {"train_loss": -11.889119148254395, "global_step": 266406, "epoch": 1585} {"train_loss": -11.84366512298584, "global_step": 266407, "epoch": 1585} {"train_loss": -11.129465103149414, "global_step": 266408, "epoch": 1585} {"train_loss": -11.97382640838623, "global_step": 266409, "epoch": 1585} {"train_loss": -11.769220352172852, "global_step": 266410, "epoch": 1585} {"train_loss": -11.334716796875, "global_step": 266411, "epoch": 1585} {"train_loss": -11.577205657958984, "global_step": 266412, "epoch": 1585} {"train_loss": -11.722736358642578, "global_step": 266413, "epoch": 1585} {"train_loss": -11.626750946044922, "global_step": 266414, "epoch": 1585} {"train_loss": -11.798271179199219, "global_step": 266415, "epoch": 1585} {"train_loss": -11.363765716552734, "global_step": 266416, "epoch": 1585} {"train_loss": -11.617055892944336, "global_step": 266417, "epoch": 1585} {"train_loss": -11.746442794799805, "global_step": 266418, "epoch": 1585} {"train_loss": -11.343339920043945, "global_step": 266419, "epoch": 1585} {"train_loss": -11.4689302444458, "global_step": 266420, "epoch": 1585} {"train_loss": -12.01887321472168, "global_step": 266421, "epoch": 1585} {"train_loss": -11.249773025512695, "global_step": 266422, "epoch": 1585} {"train_loss": -11.665647506713867, "global_step": 266423, "epoch": 1585} {"train_loss": -11.255226135253906, "global_step": 266424, "epoch": 1585} {"train_loss": -10.974433898925781, "global_step": 266425, "epoch": 1585} {"train_loss": -11.667791366577148, "global_step": 266426, "epoch": 1585} {"train_loss": -10.75004768371582, "global_step": 266427, "epoch": 1585} {"train_loss": -11.517374992370605, "global_step": 266428, "epoch": 1585} {"train_loss": -11.494460105895996, "global_step": 266429, "epoch": 1585} {"train_loss": -11.322797775268555, "global_step": 266430, "epoch": 1585} {"train_loss": -11.711196899414062, "global_step": 266431, "epoch": 1585} {"train_loss": -11.402860641479492, "global_step": 266432, "epoch": 1585} {"train_loss": -11.360679626464844, "global_step": 266433, "epoch": 1585} {"train_loss": -11.374853134155273, "global_step": 266434, "epoch": 1585} {"train_loss": -10.972267150878906, "global_step": 266435, "epoch": 1585} {"train_loss": -11.692953109741211, "global_step": 266436, "epoch": 1585} {"train_loss": -11.137924194335938, "global_step": 266437, "epoch": 1585} {"train_loss": -11.733758926391602, "global_step": 266438, "epoch": 1585} {"train_loss": -11.567121505737305, "global_step": 266439, "epoch": 1585} {"train_loss": -11.392555236816406, "global_step": 266440, "epoch": 1585} {"train_loss": -11.447245597839355, "global_step": 266441, "epoch": 1585} {"train_loss": -11.363734245300293, "global_step": 266442, "epoch": 1585} {"train_loss": -11.764002799987793, "global_step": 266443, "epoch": 1585} {"train_loss": -11.562543869018555, "global_step": 266444, "epoch": 1585} {"train_loss": -11.801883697509766, "global_step": 266445, "epoch": 1585} {"train_loss": -11.790300369262695, "global_step": 266446, "epoch": 1585} {"train_loss": -11.58576968738011, "global_step": 266447, "epoch": 1585, "val_loss": 272232.40625, "train_action_mse_error": 5.340298652648926} {"train_loss": -11.936460494995117, "global_step": 266448, "epoch": 1586} {"train_loss": -11.656248092651367, "global_step": 266449, "epoch": 1586} {"train_loss": -11.814348220825195, "global_step": 266450, "epoch": 1586} {"train_loss": -11.501703262329102, "global_step": 266451, "epoch": 1586} {"train_loss": -11.949824333190918, "global_step": 266452, "epoch": 1586} {"train_loss": -11.890257835388184, "global_step": 266453, "epoch": 1586} {"train_loss": -11.805444717407227, "global_step": 266454, "epoch": 1586} {"train_loss": -12.127035140991211, "global_step": 266455, "epoch": 1586} {"train_loss": -11.824542999267578, "global_step": 266456, "epoch": 1586} {"train_loss": -11.738388061523438, "global_step": 266457, "epoch": 1586} {"train_loss": -11.868019104003906, "global_step": 266458, "epoch": 1586} {"train_loss": -11.731156349182129, "global_step": 266459, "epoch": 1586} {"train_loss": -11.880987167358398, "global_step": 266460, "epoch": 1586} {"train_loss": -11.863737106323242, "global_step": 266461, "epoch": 1586} {"train_loss": -11.731103897094727, "global_step": 266462, "epoch": 1586} {"train_loss": -11.96679973602295, "global_step": 266463, "epoch": 1586} {"train_loss": -11.855700492858887, "global_step": 266464, "epoch": 1586} {"train_loss": -11.86931037902832, "global_step": 266465, "epoch": 1586} {"train_loss": -11.979451179504395, "global_step": 266466, "epoch": 1586} {"train_loss": -12.067545890808105, "global_step": 266467, "epoch": 1586} {"train_loss": -11.457098007202148, "global_step": 266468, "epoch": 1586} {"train_loss": -11.396930694580078, "global_step": 266469, "epoch": 1586} {"train_loss": -11.734477043151855, "global_step": 266470, "epoch": 1586} {"train_loss": -11.627278327941895, "global_step": 266471, "epoch": 1586} {"train_loss": -11.87104320526123, "global_step": 266472, "epoch": 1586} {"train_loss": -11.126550674438477, "global_step": 266473, "epoch": 1586} {"train_loss": -11.728214263916016, "global_step": 266474, "epoch": 1586} {"train_loss": -10.74455738067627, "global_step": 266475, "epoch": 1586} {"train_loss": -11.572341918945312, "global_step": 266476, "epoch": 1586} {"train_loss": -11.64706802368164, "global_step": 266477, "epoch": 1586} {"train_loss": -11.209229469299316, "global_step": 266478, "epoch": 1586} {"train_loss": -11.571563720703125, "global_step": 266479, "epoch": 1586} {"train_loss": -11.078027725219727, "global_step": 266480, "epoch": 1586} {"train_loss": -11.732622146606445, "global_step": 266481, "epoch": 1586} {"train_loss": -11.167217254638672, "global_step": 266482, "epoch": 1586} {"train_loss": -11.750692367553711, "global_step": 266483, "epoch": 1586} {"train_loss": -11.186158180236816, "global_step": 266484, "epoch": 1586} {"train_loss": -11.950340270996094, "global_step": 266485, "epoch": 1586} {"train_loss": -11.637697219848633, "global_step": 266486, "epoch": 1586} {"train_loss": -11.544300079345703, "global_step": 266487, "epoch": 1586} {"train_loss": -11.710405349731445, "global_step": 266488, "epoch": 1586} {"train_loss": -11.834869384765625, "global_step": 266489, "epoch": 1586} {"train_loss": -11.914022445678711, "global_step": 266490, "epoch": 1586} {"train_loss": -12.018404006958008, "global_step": 266491, "epoch": 1586} {"train_loss": -11.798540115356445, "global_step": 266492, "epoch": 1586} {"train_loss": -11.878164291381836, "global_step": 266493, "epoch": 1586} {"train_loss": -12.080533981323242, "global_step": 266494, "epoch": 1586} {"train_loss": -11.997833251953125, "global_step": 266495, "epoch": 1586} {"train_loss": -11.864559173583984, "global_step": 266496, "epoch": 1586} {"train_loss": -11.920156478881836, "global_step": 266497, "epoch": 1586} {"train_loss": -11.948458671569824, "global_step": 266498, "epoch": 1586} {"train_loss": -11.853860855102539, "global_step": 266499, "epoch": 1586} {"train_loss": -11.999467849731445, "global_step": 266500, "epoch": 1586} {"train_loss": -11.791889190673828, "global_step": 266501, "epoch": 1586} {"train_loss": -11.746530532836914, "global_step": 266502, "epoch": 1586} {"train_loss": -12.058917045593262, "global_step": 266503, "epoch": 1586} {"train_loss": -11.707111358642578, "global_step": 266504, "epoch": 1586} {"train_loss": -12.019613265991211, "global_step": 266505, "epoch": 1586} {"train_loss": -11.499490737915039, "global_step": 266506, "epoch": 1586} {"train_loss": -12.096879959106445, "global_step": 266507, "epoch": 1586} {"train_loss": -12.058795928955078, "global_step": 266508, "epoch": 1586} {"train_loss": -12.147326469421387, "global_step": 266509, "epoch": 1586} {"train_loss": -12.068367004394531, "global_step": 266510, "epoch": 1586} {"train_loss": -11.978071212768555, "global_step": 266511, "epoch": 1586} {"train_loss": -12.033153533935547, "global_step": 266512, "epoch": 1586} {"train_loss": -12.0285062789917, "global_step": 266513, "epoch": 1586} {"train_loss": -11.892895698547363, "global_step": 266514, "epoch": 1586} {"train_loss": -12.020822525024414, "global_step": 266515, "epoch": 1586} {"train_loss": -12.056535720825195, "global_step": 266516, "epoch": 1586} {"train_loss": -11.921398162841797, "global_step": 266517, "epoch": 1586} {"train_loss": -12.222429275512695, "global_step": 266518, "epoch": 1586} {"train_loss": -12.046371459960938, "global_step": 266519, "epoch": 1586} {"train_loss": -12.07806396484375, "global_step": 266520, "epoch": 1586} {"train_loss": -12.144550323486328, "global_step": 266521, "epoch": 1586} {"train_loss": -12.213074684143066, "global_step": 266522, "epoch": 1586} {"train_loss": -12.068187713623047, "global_step": 266523, "epoch": 1586} {"train_loss": -11.963702201843262, "global_step": 266524, "epoch": 1586} {"train_loss": -11.950349807739258, "global_step": 266525, "epoch": 1586} {"train_loss": -12.327685356140137, "global_step": 266526, "epoch": 1586} {"train_loss": -12.281732559204102, "global_step": 266527, "epoch": 1586} {"train_loss": -12.073034286499023, "global_step": 266528, "epoch": 1586} {"train_loss": -12.246874809265137, "global_step": 266529, "epoch": 1586} {"train_loss": -12.337783813476562, "global_step": 266530, "epoch": 1586} {"train_loss": -12.353181838989258, "global_step": 266531, "epoch": 1586} {"train_loss": -12.098030090332031, "global_step": 266532, "epoch": 1586} {"train_loss": -12.209832191467285, "global_step": 266533, "epoch": 1586} {"train_loss": -12.130350112915039, "global_step": 266534, "epoch": 1586} {"train_loss": -12.251303672790527, "global_step": 266535, "epoch": 1586} {"train_loss": -12.36330795288086, "global_step": 266536, "epoch": 1586} {"train_loss": -12.372419357299805, "global_step": 266537, "epoch": 1586} {"train_loss": -12.078144073486328, "global_step": 266538, "epoch": 1586} {"train_loss": -12.29376220703125, "global_step": 266539, "epoch": 1586} {"train_loss": -11.904817581176758, "global_step": 266540, "epoch": 1586} {"train_loss": -12.261279106140137, "global_step": 266541, "epoch": 1586} {"train_loss": -11.769693374633789, "global_step": 266542, "epoch": 1586} {"train_loss": -12.142541885375977, "global_step": 266543, "epoch": 1586} {"train_loss": -11.987166404724121, "global_step": 266544, "epoch": 1586} {"train_loss": -11.941162109375, "global_step": 266545, "epoch": 1586} {"train_loss": -11.794815063476562, "global_step": 266546, "epoch": 1586} {"train_loss": -11.977251052856445, "global_step": 266547, "epoch": 1586} {"train_loss": -11.644968032836914, "global_step": 266548, "epoch": 1586} {"train_loss": -11.244895935058594, "global_step": 266549, "epoch": 1586} {"train_loss": -11.461841583251953, "global_step": 266550, "epoch": 1586} {"train_loss": -11.576438903808594, "global_step": 266551, "epoch": 1586} {"train_loss": -12.045976638793945, "global_step": 266552, "epoch": 1586} {"train_loss": -11.102563858032227, "global_step": 266553, "epoch": 1586} {"train_loss": -12.15921401977539, "global_step": 266554, "epoch": 1586} {"train_loss": -11.224956512451172, "global_step": 266555, "epoch": 1586} {"train_loss": -11.89329719543457, "global_step": 266556, "epoch": 1586} {"train_loss": -10.996159553527832, "global_step": 266557, "epoch": 1586} {"train_loss": -11.629554748535156, "global_step": 266558, "epoch": 1586} {"train_loss": -11.625755310058594, "global_step": 266559, "epoch": 1586} {"train_loss": -11.144744873046875, "global_step": 266560, "epoch": 1586} {"train_loss": -10.74898624420166, "global_step": 266561, "epoch": 1586} {"train_loss": -12.01780891418457, "global_step": 266562, "epoch": 1586} {"train_loss": -11.574806213378906, "global_step": 266563, "epoch": 1586} {"train_loss": -12.279399871826172, "global_step": 266564, "epoch": 1586} {"train_loss": -11.478517532348633, "global_step": 266565, "epoch": 1586} {"train_loss": -12.439748764038086, "global_step": 266566, "epoch": 1586} {"train_loss": -12.042377471923828, "global_step": 266567, "epoch": 1586} {"train_loss": -12.133621215820312, "global_step": 266568, "epoch": 1586} {"train_loss": -12.05420970916748, "global_step": 266569, "epoch": 1586} {"train_loss": -12.138553619384766, "global_step": 266570, "epoch": 1586} {"train_loss": -11.474738121032715, "global_step": 266571, "epoch": 1586} {"train_loss": -11.551387786865234, "global_step": 266572, "epoch": 1586} {"train_loss": -12.21605396270752, "global_step": 266573, "epoch": 1586} {"train_loss": -11.093109130859375, "global_step": 266574, "epoch": 1586} {"train_loss": -10.953453063964844, "global_step": 266575, "epoch": 1586} {"train_loss": -11.193918228149414, "global_step": 266576, "epoch": 1586} {"train_loss": -12.001011848449707, "global_step": 266577, "epoch": 1586} {"train_loss": -11.162626266479492, "global_step": 266578, "epoch": 1586} {"train_loss": -11.765420913696289, "global_step": 266579, "epoch": 1586} {"train_loss": -11.601490020751953, "global_step": 266580, "epoch": 1586} {"train_loss": -12.090145111083984, "global_step": 266581, "epoch": 1586} {"train_loss": -11.94867992401123, "global_step": 266582, "epoch": 1586} {"train_loss": -11.62380599975586, "global_step": 266583, "epoch": 1586} {"train_loss": -12.090007781982422, "global_step": 266584, "epoch": 1586} {"train_loss": -11.225793838500977, "global_step": 266585, "epoch": 1586} {"train_loss": -11.749191284179688, "global_step": 266586, "epoch": 1586} {"train_loss": -11.038095474243164, "global_step": 266587, "epoch": 1586} {"train_loss": -11.916443824768066, "global_step": 266588, "epoch": 1586} {"train_loss": -10.999679565429688, "global_step": 266589, "epoch": 1586} {"train_loss": -11.016083717346191, "global_step": 266590, "epoch": 1586} {"train_loss": -10.183832168579102, "global_step": 266591, "epoch": 1586} {"train_loss": -11.072739601135254, "global_step": 266592, "epoch": 1586} {"train_loss": -10.658546447753906, "global_step": 266593, "epoch": 1586} {"train_loss": -11.743789672851562, "global_step": 266594, "epoch": 1586} {"train_loss": -11.44161319732666, "global_step": 266595, "epoch": 1586} {"train_loss": -11.770835876464844, "global_step": 266596, "epoch": 1586} {"train_loss": -11.556440353393555, "global_step": 266597, "epoch": 1586} {"train_loss": -11.681984901428223, "global_step": 266598, "epoch": 1586} {"train_loss": -11.730545043945312, "global_step": 266599, "epoch": 1586} {"train_loss": -11.545875549316406, "global_step": 266600, "epoch": 1586} {"train_loss": -11.914494514465332, "global_step": 266601, "epoch": 1586} {"train_loss": -12.000728607177734, "global_step": 266602, "epoch": 1586} {"train_loss": -12.208423614501953, "global_step": 266603, "epoch": 1586} {"train_loss": -11.970707893371582, "global_step": 266604, "epoch": 1586} {"train_loss": -11.764575958251953, "global_step": 266605, "epoch": 1586} {"train_loss": -11.765886306762695, "global_step": 266606, "epoch": 1586} {"train_loss": -12.045825958251953, "global_step": 266607, "epoch": 1586} {"train_loss": -11.940458297729492, "global_step": 266608, "epoch": 1586} {"train_loss": -11.94718074798584, "global_step": 266609, "epoch": 1586} {"train_loss": -12.032169342041016, "global_step": 266610, "epoch": 1586} {"train_loss": -11.871174812316895, "global_step": 266611, "epoch": 1586} {"train_loss": -12.123332977294922, "global_step": 266612, "epoch": 1586} {"train_loss": -11.768682479858398, "global_step": 266613, "epoch": 1586} {"train_loss": -11.669357299804688, "global_step": 266614, "epoch": 1586} {"train_loss": -11.785191371327354, "global_step": 266615, "epoch": 1586, "val_loss": 274583.4375} {"train_loss": -12.166902542114258, "global_step": 266616, "epoch": 1587} {"train_loss": -11.454917907714844, "global_step": 266617, "epoch": 1587} {"train_loss": -11.738164901733398, "global_step": 266618, "epoch": 1587} {"train_loss": -11.729991912841797, "global_step": 266619, "epoch": 1587} {"train_loss": -11.568523406982422, "global_step": 266620, "epoch": 1587} {"train_loss": -11.368739128112793, "global_step": 266621, "epoch": 1587} {"train_loss": -12.049129486083984, "global_step": 266622, "epoch": 1587} {"train_loss": -11.614964485168457, "global_step": 266623, "epoch": 1587} {"train_loss": -11.664926528930664, "global_step": 266624, "epoch": 1587} {"train_loss": -11.689362525939941, "global_step": 266625, "epoch": 1587} {"train_loss": -11.515563011169434, "global_step": 266626, "epoch": 1587} {"train_loss": -11.903650283813477, "global_step": 266627, "epoch": 1587} {"train_loss": -11.99117660522461, "global_step": 266628, "epoch": 1587} {"train_loss": -11.89706802368164, "global_step": 266629, "epoch": 1587} {"train_loss": -11.67806625366211, "global_step": 266630, "epoch": 1587} {"train_loss": -11.785035133361816, "global_step": 266631, "epoch": 1587} {"train_loss": -12.025286674499512, "global_step": 266632, "epoch": 1587} {"train_loss": -11.840977668762207, "global_step": 266633, "epoch": 1587} {"train_loss": -11.561670303344727, "global_step": 266634, "epoch": 1587} {"train_loss": -11.819165229797363, "global_step": 266635, "epoch": 1587} {"train_loss": -11.800898551940918, "global_step": 266636, "epoch": 1587} {"train_loss": -11.764728546142578, "global_step": 266637, "epoch": 1587} {"train_loss": -12.093907356262207, "global_step": 266638, "epoch": 1587} {"train_loss": -12.03944206237793, "global_step": 266639, "epoch": 1587} {"train_loss": -11.964390754699707, "global_step": 266640, "epoch": 1587} {"train_loss": -12.07865047454834, "global_step": 266641, "epoch": 1587} {"train_loss": -12.049667358398438, "global_step": 266642, "epoch": 1587} {"train_loss": -12.235697746276855, "global_step": 266643, "epoch": 1587} {"train_loss": -12.250903129577637, "global_step": 266644, "epoch": 1587} {"train_loss": -12.120133399963379, "global_step": 266645, "epoch": 1587} {"train_loss": -12.048484802246094, "global_step": 266646, "epoch": 1587} {"train_loss": -12.136289596557617, "global_step": 266647, "epoch": 1587} {"train_loss": -12.117151260375977, "global_step": 266648, "epoch": 1587} {"train_loss": -11.539438247680664, "global_step": 266649, "epoch": 1587} {"train_loss": -11.677773475646973, "global_step": 266650, "epoch": 1587} {"train_loss": -12.17123794555664, "global_step": 266651, "epoch": 1587} {"train_loss": -11.79690933227539, "global_step": 266652, "epoch": 1587} {"train_loss": -12.151346206665039, "global_step": 266653, "epoch": 1587} {"train_loss": -11.978182792663574, "global_step": 266654, "epoch": 1587} {"train_loss": -11.594938278198242, "global_step": 266655, "epoch": 1587} {"train_loss": -11.973569869995117, "global_step": 266656, "epoch": 1587} {"train_loss": -10.988571166992188, "global_step": 266657, "epoch": 1587} {"train_loss": -11.310683250427246, "global_step": 266658, "epoch": 1587} {"train_loss": -12.162261962890625, "global_step": 266659, "epoch": 1587} {"train_loss": -11.428799629211426, "global_step": 266660, "epoch": 1587} {"train_loss": -11.715448379516602, "global_step": 266661, "epoch": 1587} {"train_loss": -12.051864624023438, "global_step": 266662, "epoch": 1587} {"train_loss": -11.549087524414062, "global_step": 266663, "epoch": 1587} {"train_loss": -11.992598533630371, "global_step": 266664, "epoch": 1587} {"train_loss": -11.417814254760742, "global_step": 266665, "epoch": 1587} {"train_loss": -11.14291763305664, "global_step": 266666, "epoch": 1587} {"train_loss": -12.099289894104004, "global_step": 266667, "epoch": 1587} {"train_loss": -11.219606399536133, "global_step": 266668, "epoch": 1587} {"train_loss": -11.880692481994629, "global_step": 266669, "epoch": 1587} {"train_loss": -11.580198287963867, "global_step": 266670, "epoch": 1587} {"train_loss": -11.799835205078125, "global_step": 266671, "epoch": 1587} {"train_loss": -11.617935180664062, "global_step": 266672, "epoch": 1587} {"train_loss": -11.47209644317627, "global_step": 266673, "epoch": 1587} {"train_loss": -11.013710021972656, "global_step": 266674, "epoch": 1587} {"train_loss": -11.64816665649414, "global_step": 266675, "epoch": 1587} {"train_loss": -11.500188827514648, "global_step": 266676, "epoch": 1587} {"train_loss": -11.178661346435547, "global_step": 266677, "epoch": 1587} {"train_loss": -11.159845352172852, "global_step": 266678, "epoch": 1587} {"train_loss": -11.268593788146973, "global_step": 266679, "epoch": 1587} {"train_loss": -10.6285400390625, "global_step": 266680, "epoch": 1587} {"train_loss": -11.610519409179688, "global_step": 266681, "epoch": 1587} {"train_loss": -10.040830612182617, "global_step": 266682, "epoch": 1587} {"train_loss": -11.707388877868652, "global_step": 266683, "epoch": 1587} {"train_loss": -11.026276588439941, "global_step": 266684, "epoch": 1587} {"train_loss": -10.978713989257812, "global_step": 266685, "epoch": 1587} {"train_loss": -11.615554809570312, "global_step": 266686, "epoch": 1587} {"train_loss": -11.324039459228516, "global_step": 266687, "epoch": 1587} {"train_loss": -11.406325340270996, "global_step": 266688, "epoch": 1587} {"train_loss": -11.579963684082031, "global_step": 266689, "epoch": 1587} {"train_loss": -11.849833488464355, "global_step": 266690, "epoch": 1587} {"train_loss": -11.609868049621582, "global_step": 266691, "epoch": 1587} {"train_loss": -11.793754577636719, "global_step": 266692, "epoch": 1587} {"train_loss": -11.85622787475586, "global_step": 266693, "epoch": 1587} {"train_loss": -11.614913940429688, "global_step": 266694, "epoch": 1587} {"train_loss": -12.148994445800781, "global_step": 266695, "epoch": 1587} {"train_loss": -11.995922088623047, "global_step": 266696, "epoch": 1587} {"train_loss": -11.929998397827148, "global_step": 266697, "epoch": 1587} {"train_loss": -12.092915534973145, "global_step": 266698, "epoch": 1587} {"train_loss": -11.94089412689209, "global_step": 266699, "epoch": 1587} {"train_loss": -11.63369083404541, "global_step": 266700, "epoch": 1587} {"train_loss": -12.04719352722168, "global_step": 266701, "epoch": 1587} {"train_loss": -12.1207275390625, "global_step": 266702, "epoch": 1587} {"train_loss": -11.863375663757324, "global_step": 266703, "epoch": 1587} {"train_loss": -11.787107467651367, "global_step": 266704, "epoch": 1587} {"train_loss": -11.794687271118164, "global_step": 266705, "epoch": 1587} {"train_loss": -12.223381996154785, "global_step": 266706, "epoch": 1587} {"train_loss": -12.15141773223877, "global_step": 266707, "epoch": 1587} {"train_loss": -11.852663040161133, "global_step": 266708, "epoch": 1587} {"train_loss": -12.168966293334961, "global_step": 266709, "epoch": 1587} {"train_loss": -11.873025894165039, "global_step": 266710, "epoch": 1587} {"train_loss": -12.30474853515625, "global_step": 266711, "epoch": 1587} {"train_loss": -12.220720291137695, "global_step": 266712, "epoch": 1587} {"train_loss": -12.209487915039062, "global_step": 266713, "epoch": 1587} {"train_loss": -12.059064865112305, "global_step": 266714, "epoch": 1587} {"train_loss": -12.25482177734375, "global_step": 266715, "epoch": 1587} {"train_loss": -11.929651260375977, "global_step": 266716, "epoch": 1587} {"train_loss": -12.218873977661133, "global_step": 266717, "epoch": 1587} {"train_loss": -12.140764236450195, "global_step": 266718, "epoch": 1587} {"train_loss": -12.019933700561523, "global_step": 266719, "epoch": 1587} {"train_loss": -12.082263946533203, "global_step": 266720, "epoch": 1587} {"train_loss": -12.021257400512695, "global_step": 266721, "epoch": 1587} {"train_loss": -12.02448844909668, "global_step": 266722, "epoch": 1587} {"train_loss": -12.25261402130127, "global_step": 266723, "epoch": 1587} {"train_loss": -12.304152488708496, "global_step": 266724, "epoch": 1587} {"train_loss": -11.761628150939941, "global_step": 266725, "epoch": 1587} {"train_loss": -12.385516166687012, "global_step": 266726, "epoch": 1587} {"train_loss": -12.046274185180664, "global_step": 266727, "epoch": 1587} {"train_loss": -12.215731620788574, "global_step": 266728, "epoch": 1587} {"train_loss": -12.149344444274902, "global_step": 266729, "epoch": 1587} {"train_loss": -11.997295379638672, "global_step": 266730, "epoch": 1587} {"train_loss": -12.008882522583008, "global_step": 266731, "epoch": 1587} {"train_loss": -11.794644355773926, "global_step": 266732, "epoch": 1587} {"train_loss": -11.94123363494873, "global_step": 266733, "epoch": 1587} {"train_loss": -12.094733238220215, "global_step": 266734, "epoch": 1587} {"train_loss": -12.202482223510742, "global_step": 266735, "epoch": 1587} {"train_loss": -11.99618911743164, "global_step": 266736, "epoch": 1587} {"train_loss": -12.248065948486328, "global_step": 266737, "epoch": 1587} {"train_loss": -12.278177261352539, "global_step": 266738, "epoch": 1587} {"train_loss": -12.401063919067383, "global_step": 266739, "epoch": 1587} {"train_loss": -12.023783683776855, "global_step": 266740, "epoch": 1587} {"train_loss": -12.176569938659668, "global_step": 266741, "epoch": 1587} {"train_loss": -12.345603942871094, "global_step": 266742, "epoch": 1587} {"train_loss": -12.060528755187988, "global_step": 266743, "epoch": 1587} {"train_loss": -12.357563018798828, "global_step": 266744, "epoch": 1587} {"train_loss": -12.002734184265137, "global_step": 266745, "epoch": 1587} {"train_loss": -12.299734115600586, "global_step": 266746, "epoch": 1587} {"train_loss": -12.15626335144043, "global_step": 266747, "epoch": 1587} {"train_loss": -11.547340393066406, "global_step": 266748, "epoch": 1587} {"train_loss": -11.644189834594727, "global_step": 266749, "epoch": 1587} {"train_loss": -11.828800201416016, "global_step": 266750, "epoch": 1587} {"train_loss": -12.009356498718262, "global_step": 266751, "epoch": 1587} {"train_loss": -11.439708709716797, "global_step": 266752, "epoch": 1587} {"train_loss": -10.614951133728027, "global_step": 266753, "epoch": 1587} {"train_loss": -12.070428848266602, "global_step": 266754, "epoch": 1587} {"train_loss": -11.319894790649414, "global_step": 266755, "epoch": 1587} {"train_loss": -10.257265090942383, "global_step": 266756, "epoch": 1587} {"train_loss": -10.87111759185791, "global_step": 266757, "epoch": 1587} {"train_loss": -11.47774600982666, "global_step": 266758, "epoch": 1587} {"train_loss": -11.365538597106934, "global_step": 266759, "epoch": 1587} {"train_loss": -11.676369667053223, "global_step": 266760, "epoch": 1587} {"train_loss": -10.817432403564453, "global_step": 266761, "epoch": 1587} {"train_loss": -10.833181381225586, "global_step": 266762, "epoch": 1587} {"train_loss": -10.854276657104492, "global_step": 266763, "epoch": 1587} {"train_loss": -11.29216194152832, "global_step": 266764, "epoch": 1587} {"train_loss": -10.55019760131836, "global_step": 266765, "epoch": 1587} {"train_loss": -10.316563606262207, "global_step": 266766, "epoch": 1587} {"train_loss": -11.024974822998047, "global_step": 266767, "epoch": 1587} {"train_loss": -10.719024658203125, "global_step": 266768, "epoch": 1587} {"train_loss": -10.610366821289062, "global_step": 266769, "epoch": 1587} {"train_loss": -11.022048950195312, "global_step": 266770, "epoch": 1587} {"train_loss": -11.383382797241211, "global_step": 266771, "epoch": 1587} {"train_loss": -10.974611282348633, "global_step": 266772, "epoch": 1587} {"train_loss": -10.669655799865723, "global_step": 266773, "epoch": 1587} {"train_loss": -9.72400188446045, "global_step": 266774, "epoch": 1587} {"train_loss": -10.731058120727539, "global_step": 266775, "epoch": 1587} {"train_loss": -9.919944763183594, "global_step": 266776, "epoch": 1587} {"train_loss": -11.235143661499023, "global_step": 266777, "epoch": 1587} {"train_loss": -10.612916946411133, "global_step": 266778, "epoch": 1587} {"train_loss": -10.200607299804688, "global_step": 266779, "epoch": 1587} {"train_loss": -9.516229629516602, "global_step": 266780, "epoch": 1587} {"train_loss": -10.382577896118164, "global_step": 266781, "epoch": 1587} {"train_loss": -9.155585289001465, "global_step": 266782, "epoch": 1587} {"train_loss": -11.630211744989667, "global_step": 266783, "epoch": 1587, "val_loss": 272976.59375} {"train_loss": -10.85242748260498, "global_step": 266784, "epoch": 1588} {"train_loss": -9.408415794372559, "global_step": 266785, "epoch": 1588} {"train_loss": -10.226615905761719, "global_step": 266786, "epoch": 1588} {"train_loss": -11.383159637451172, "global_step": 266787, "epoch": 1588} {"train_loss": -10.890172004699707, "global_step": 266788, "epoch": 1588} {"train_loss": -11.64742374420166, "global_step": 266789, "epoch": 1588} {"train_loss": -10.828203201293945, "global_step": 266790, "epoch": 1588} {"train_loss": -11.52200698852539, "global_step": 266791, "epoch": 1588} {"train_loss": -11.373300552368164, "global_step": 266792, "epoch": 1588} {"train_loss": -11.699758529663086, "global_step": 266793, "epoch": 1588} {"train_loss": -11.163305282592773, "global_step": 266794, "epoch": 1588} {"train_loss": -11.506120681762695, "global_step": 266795, "epoch": 1588} {"train_loss": -11.463375091552734, "global_step": 266796, "epoch": 1588} {"train_loss": -11.663789749145508, "global_step": 266797, "epoch": 1588} {"train_loss": -11.472343444824219, "global_step": 266798, "epoch": 1588} {"train_loss": -11.52580738067627, "global_step": 266799, "epoch": 1588} {"train_loss": -11.29457950592041, "global_step": 266800, "epoch": 1588} {"train_loss": -11.676194190979004, "global_step": 266801, "epoch": 1588} {"train_loss": -11.743545532226562, "global_step": 266802, "epoch": 1588} {"train_loss": -11.908517837524414, "global_step": 266803, "epoch": 1588} {"train_loss": -11.747121810913086, "global_step": 266804, "epoch": 1588} {"train_loss": -11.884040832519531, "global_step": 266805, "epoch": 1588} {"train_loss": -11.862665176391602, "global_step": 266806, "epoch": 1588} {"train_loss": -11.77062702178955, "global_step": 266807, "epoch": 1588} {"train_loss": -11.677946090698242, "global_step": 266808, "epoch": 1588} {"train_loss": -11.710731506347656, "global_step": 266809, "epoch": 1588} {"train_loss": -11.843326568603516, "global_step": 266810, "epoch": 1588} {"train_loss": -11.661664962768555, "global_step": 266811, "epoch": 1588} {"train_loss": -11.78521728515625, "global_step": 266812, "epoch": 1588} {"train_loss": -11.848222732543945, "global_step": 266813, "epoch": 1588} {"train_loss": -11.876199722290039, "global_step": 266814, "epoch": 1588} {"train_loss": -11.839570999145508, "global_step": 266815, "epoch": 1588} {"train_loss": -11.882701873779297, "global_step": 266816, "epoch": 1588} {"train_loss": -12.058738708496094, "global_step": 266817, "epoch": 1588} {"train_loss": -11.865609169006348, "global_step": 266818, "epoch": 1588} {"train_loss": -11.993640899658203, "global_step": 266819, "epoch": 1588} {"train_loss": -12.062908172607422, "global_step": 266820, "epoch": 1588} {"train_loss": -12.063365936279297, "global_step": 266821, "epoch": 1588} {"train_loss": -12.137679100036621, "global_step": 266822, "epoch": 1588} {"train_loss": -12.16817569732666, "global_step": 266823, "epoch": 1588} {"train_loss": -12.000221252441406, "global_step": 266824, "epoch": 1588} {"train_loss": -12.24085807800293, "global_step": 266825, "epoch": 1588} {"train_loss": -12.245675086975098, "global_step": 266826, "epoch": 1588} {"train_loss": -12.108621597290039, "global_step": 266827, "epoch": 1588} {"train_loss": -12.21469497680664, "global_step": 266828, "epoch": 1588} {"train_loss": -11.902254104614258, "global_step": 266829, "epoch": 1588} {"train_loss": -12.169790267944336, "global_step": 266830, "epoch": 1588} {"train_loss": -12.00832462310791, "global_step": 266831, "epoch": 1588} {"train_loss": -12.001383781433105, "global_step": 266832, "epoch": 1588} {"train_loss": -12.056673049926758, "global_step": 266833, "epoch": 1588} {"train_loss": -12.253702163696289, "global_step": 266834, "epoch": 1588} {"train_loss": -12.209879875183105, "global_step": 266835, "epoch": 1588} {"train_loss": -12.327425003051758, "global_step": 266836, "epoch": 1588} {"train_loss": -12.230554580688477, "global_step": 266837, "epoch": 1588} {"train_loss": -12.04293155670166, "global_step": 266838, "epoch": 1588} {"train_loss": -12.282712936401367, "global_step": 266839, "epoch": 1588} {"train_loss": -12.170368194580078, "global_step": 266840, "epoch": 1588} {"train_loss": -12.142812728881836, "global_step": 266841, "epoch": 1588} {"train_loss": -12.008056640625, "global_step": 266842, "epoch": 1588} {"train_loss": -12.226713180541992, "global_step": 266843, "epoch": 1588} {"train_loss": -12.201167106628418, "global_step": 266844, "epoch": 1588} {"train_loss": -12.393411636352539, "global_step": 266845, "epoch": 1588} {"train_loss": -12.388797760009766, "global_step": 266846, "epoch": 1588} {"train_loss": -12.318624496459961, "global_step": 266847, "epoch": 1588} {"train_loss": -12.112724304199219, "global_step": 266848, "epoch": 1588} {"train_loss": -12.377618789672852, "global_step": 266849, "epoch": 1588} {"train_loss": -12.305973052978516, "global_step": 266850, "epoch": 1588} {"train_loss": -12.33353328704834, "global_step": 266851, "epoch": 1588} {"train_loss": -12.096413612365723, "global_step": 266852, "epoch": 1588} {"train_loss": -11.999272346496582, "global_step": 266853, "epoch": 1588} {"train_loss": -12.030281066894531, "global_step": 266854, "epoch": 1588} {"train_loss": -12.262899398803711, "global_step": 266855, "epoch": 1588} {"train_loss": -11.960136413574219, "global_step": 266856, "epoch": 1588} {"train_loss": -12.322656631469727, "global_step": 266857, "epoch": 1588} {"train_loss": -12.194005966186523, "global_step": 266858, "epoch": 1588} {"train_loss": -12.279695510864258, "global_step": 266859, "epoch": 1588} {"train_loss": -12.100931167602539, "global_step": 266860, "epoch": 1588} {"train_loss": -11.943049430847168, "global_step": 266861, "epoch": 1588} {"train_loss": -12.052313804626465, "global_step": 266862, "epoch": 1588} {"train_loss": -12.018570899963379, "global_step": 266863, "epoch": 1588} {"train_loss": -11.990726470947266, "global_step": 266864, "epoch": 1588} {"train_loss": -12.31789779663086, "global_step": 266865, "epoch": 1588} {"train_loss": -11.988080024719238, "global_step": 266866, "epoch": 1588} {"train_loss": -11.809070587158203, "global_step": 266867, "epoch": 1588} {"train_loss": -12.294750213623047, "global_step": 266868, "epoch": 1588} {"train_loss": -12.211790084838867, "global_step": 266869, "epoch": 1588} {"train_loss": -11.73967170715332, "global_step": 266870, "epoch": 1588} {"train_loss": -12.014131546020508, "global_step": 266871, "epoch": 1588} {"train_loss": -12.33331298828125, "global_step": 266872, "epoch": 1588} {"train_loss": -12.168817520141602, "global_step": 266873, "epoch": 1588} {"train_loss": -12.222827911376953, "global_step": 266874, "epoch": 1588} {"train_loss": -12.490728378295898, "global_step": 266875, "epoch": 1588} {"train_loss": -12.341286659240723, "global_step": 266876, "epoch": 1588} {"train_loss": -12.38096809387207, "global_step": 266877, "epoch": 1588} {"train_loss": -12.2335844039917, "global_step": 266878, "epoch": 1588} {"train_loss": -12.314933776855469, "global_step": 266879, "epoch": 1588} {"train_loss": -12.217369079589844, "global_step": 266880, "epoch": 1588} {"train_loss": -12.396933555603027, "global_step": 266881, "epoch": 1588} {"train_loss": -12.052877426147461, "global_step": 266882, "epoch": 1588} {"train_loss": -11.912651062011719, "global_step": 266883, "epoch": 1588} {"train_loss": -11.825685501098633, "global_step": 266884, "epoch": 1588} {"train_loss": -12.087041854858398, "global_step": 266885, "epoch": 1588} {"train_loss": -11.813095092773438, "global_step": 266886, "epoch": 1588} {"train_loss": -11.351579666137695, "global_step": 266887, "epoch": 1588} {"train_loss": -12.051702499389648, "global_step": 266888, "epoch": 1588} {"train_loss": -12.206958770751953, "global_step": 266889, "epoch": 1588} {"train_loss": -11.83084487915039, "global_step": 266890, "epoch": 1588} {"train_loss": -10.721712112426758, "global_step": 266891, "epoch": 1588} {"train_loss": -12.1347017288208, "global_step": 266892, "epoch": 1588} {"train_loss": -11.844444274902344, "global_step": 266893, "epoch": 1588} {"train_loss": -11.821854591369629, "global_step": 266894, "epoch": 1588} {"train_loss": -11.399759292602539, "global_step": 266895, "epoch": 1588} {"train_loss": -10.244226455688477, "global_step": 266896, "epoch": 1588} {"train_loss": -10.464710235595703, "global_step": 266897, "epoch": 1588} {"train_loss": -10.47256851196289, "global_step": 266898, "epoch": 1588} {"train_loss": -9.354767799377441, "global_step": 266899, "epoch": 1588} {"train_loss": -7.7920708656311035, "global_step": 266900, "epoch": 1588} {"train_loss": -7.492684841156006, "global_step": 266901, "epoch": 1588} {"train_loss": -7.229748249053955, "global_step": 266902, "epoch": 1588} {"train_loss": -8.554760932922363, "global_step": 266903, "epoch": 1588} {"train_loss": -8.630051612854004, "global_step": 266904, "epoch": 1588} {"train_loss": -8.479291915893555, "global_step": 266905, "epoch": 1588} {"train_loss": -9.169259071350098, "global_step": 266906, "epoch": 1588} {"train_loss": -9.466691970825195, "global_step": 266907, "epoch": 1588} {"train_loss": -8.383909225463867, "global_step": 266908, "epoch": 1588} {"train_loss": -9.464303970336914, "global_step": 266909, "epoch": 1588} {"train_loss": -10.826719284057617, "global_step": 266910, "epoch": 1588} {"train_loss": -9.674352645874023, "global_step": 266911, "epoch": 1588} {"train_loss": -11.234009742736816, "global_step": 266912, "epoch": 1588} {"train_loss": -9.850859642028809, "global_step": 266913, "epoch": 1588} {"train_loss": -10.45664119720459, "global_step": 266914, "epoch": 1588} {"train_loss": -10.25877571105957, "global_step": 266915, "epoch": 1588} {"train_loss": -10.244088172912598, "global_step": 266916, "epoch": 1588} {"train_loss": -10.975432395935059, "global_step": 266917, "epoch": 1588} {"train_loss": -10.49154281616211, "global_step": 266918, "epoch": 1588} {"train_loss": -10.303654670715332, "global_step": 266919, "epoch": 1588} {"train_loss": -10.945741653442383, "global_step": 266920, "epoch": 1588} {"train_loss": -10.86635971069336, "global_step": 266921, "epoch": 1588} {"train_loss": -10.899011611938477, "global_step": 266922, "epoch": 1588} {"train_loss": -11.29234790802002, "global_step": 266923, "epoch": 1588} {"train_loss": -10.672882080078125, "global_step": 266924, "epoch": 1588} {"train_loss": -11.495453834533691, "global_step": 266925, "epoch": 1588} {"train_loss": -11.369714736938477, "global_step": 266926, "epoch": 1588} {"train_loss": -10.751608848571777, "global_step": 266927, "epoch": 1588} {"train_loss": -11.06742000579834, "global_step": 266928, "epoch": 1588} {"train_loss": -11.195541381835938, "global_step": 266929, "epoch": 1588} {"train_loss": -11.030195236206055, "global_step": 266930, "epoch": 1588} {"train_loss": -11.577220916748047, "global_step": 266931, "epoch": 1588} {"train_loss": -11.472009658813477, "global_step": 266932, "epoch": 1588} {"train_loss": -10.95479965209961, "global_step": 266933, "epoch": 1588} {"train_loss": -11.31709098815918, "global_step": 266934, "epoch": 1588} {"train_loss": -11.321640014648438, "global_step": 266935, "epoch": 1588} {"train_loss": -11.166038513183594, "global_step": 266936, "epoch": 1588} {"train_loss": -11.644740104675293, "global_step": 266937, "epoch": 1588} {"train_loss": -11.71349811553955, "global_step": 266938, "epoch": 1588} {"train_loss": -11.131549835205078, "global_step": 266939, "epoch": 1588} {"train_loss": -11.457758903503418, "global_step": 266940, "epoch": 1588} {"train_loss": -11.621308326721191, "global_step": 266941, "epoch": 1588} {"train_loss": -11.572253227233887, "global_step": 266942, "epoch": 1588} {"train_loss": -11.875263214111328, "global_step": 266943, "epoch": 1588} {"train_loss": -11.769124984741211, "global_step": 266944, "epoch": 1588} {"train_loss": -11.699882507324219, "global_step": 266945, "epoch": 1588} {"train_loss": -11.82474136352539, "global_step": 266946, "epoch": 1588} {"train_loss": -11.70879077911377, "global_step": 266947, "epoch": 1588} {"train_loss": -11.833951950073242, "global_step": 266948, "epoch": 1588} {"train_loss": -11.75841999053955, "global_step": 266949, "epoch": 1588} {"train_loss": -11.876496315002441, "global_step": 266950, "epoch": 1588} {"train_loss": -11.478063637302036, "global_step": 266951, "epoch": 1588, "val_loss": 267980.15625} {"train_loss": -11.7921781539917, "global_step": 266952, "epoch": 1589} {"train_loss": -12.01610279083252, "global_step": 266953, "epoch": 1589} {"train_loss": -11.800827026367188, "global_step": 266954, "epoch": 1589} {"train_loss": -11.87257194519043, "global_step": 266955, "epoch": 1589} {"train_loss": -11.881644248962402, "global_step": 266956, "epoch": 1589} {"train_loss": -12.052312850952148, "global_step": 266957, "epoch": 1589} {"train_loss": -11.989080429077148, "global_step": 266958, "epoch": 1589} {"train_loss": -12.010339736938477, "global_step": 266959, "epoch": 1589} {"train_loss": -11.632372856140137, "global_step": 266960, "epoch": 1589} {"train_loss": -11.628976821899414, "global_step": 266961, "epoch": 1589} {"train_loss": -12.09925651550293, "global_step": 266962, "epoch": 1589} {"train_loss": -11.621105194091797, "global_step": 266963, "epoch": 1589} {"train_loss": -11.736251831054688, "global_step": 266964, "epoch": 1589} {"train_loss": -11.607809066772461, "global_step": 266965, "epoch": 1589} {"train_loss": -11.508070945739746, "global_step": 266966, "epoch": 1589} {"train_loss": -11.700833320617676, "global_step": 266967, "epoch": 1589} {"train_loss": -11.521318435668945, "global_step": 266968, "epoch": 1589} {"train_loss": -11.49392032623291, "global_step": 266969, "epoch": 1589} {"train_loss": -10.801201820373535, "global_step": 266970, "epoch": 1589} {"train_loss": -11.380611419677734, "global_step": 266971, "epoch": 1589} {"train_loss": -11.515312194824219, "global_step": 266972, "epoch": 1589} {"train_loss": -11.025381088256836, "global_step": 266973, "epoch": 1589} {"train_loss": -11.784133911132812, "global_step": 266974, "epoch": 1589} {"train_loss": -10.933187484741211, "global_step": 266975, "epoch": 1589} {"train_loss": -11.690610885620117, "global_step": 266976, "epoch": 1589} {"train_loss": -11.148505210876465, "global_step": 266977, "epoch": 1589} {"train_loss": -11.68805980682373, "global_step": 266978, "epoch": 1589} {"train_loss": -11.828706741333008, "global_step": 266979, "epoch": 1589} {"train_loss": -11.509943008422852, "global_step": 266980, "epoch": 1589} {"train_loss": -11.788908004760742, "global_step": 266981, "epoch": 1589} {"train_loss": -11.358131408691406, "global_step": 266982, "epoch": 1589} {"train_loss": -12.113784790039062, "global_step": 266983, "epoch": 1589} {"train_loss": -11.297621726989746, "global_step": 266984, "epoch": 1589} {"train_loss": -11.724538803100586, "global_step": 266985, "epoch": 1589} {"train_loss": -11.861839294433594, "global_step": 266986, "epoch": 1589} {"train_loss": -11.57233715057373, "global_step": 266987, "epoch": 1589} {"train_loss": -11.589254379272461, "global_step": 266988, "epoch": 1589} {"train_loss": -11.219953536987305, "global_step": 266989, "epoch": 1589} {"train_loss": -11.74481201171875, "global_step": 266990, "epoch": 1589} {"train_loss": -11.557418823242188, "global_step": 266991, "epoch": 1589} {"train_loss": -11.729719161987305, "global_step": 266992, "epoch": 1589} {"train_loss": -11.600400924682617, "global_step": 266993, "epoch": 1589} {"train_loss": -11.47889232635498, "global_step": 266994, "epoch": 1589} {"train_loss": -11.946464538574219, "global_step": 266995, "epoch": 1589} {"train_loss": -11.705739974975586, "global_step": 266996, "epoch": 1589} {"train_loss": -11.586238861083984, "global_step": 266997, "epoch": 1589} {"train_loss": -11.586263656616211, "global_step": 266998, "epoch": 1589} {"train_loss": -12.007708549499512, "global_step": 266999, "epoch": 1589} {"train_loss": -11.269935607910156, "global_step": 267000, "epoch": 1589} {"train_loss": -11.948722839355469, "global_step": 267001, "epoch": 1589} {"train_loss": -11.477648735046387, "global_step": 267002, "epoch": 1589} {"train_loss": -11.858007431030273, "global_step": 267003, "epoch": 1589} {"train_loss": -12.023784637451172, "global_step": 267004, "epoch": 1589} {"train_loss": -11.424154281616211, "global_step": 267005, "epoch": 1589} {"train_loss": -12.012537002563477, "global_step": 267006, "epoch": 1589} {"train_loss": -11.844907760620117, "global_step": 267007, "epoch": 1589} {"train_loss": -12.078279495239258, "global_step": 267008, "epoch": 1589} {"train_loss": -11.756248474121094, "global_step": 267009, "epoch": 1589} {"train_loss": -11.718851089477539, "global_step": 267010, "epoch": 1589} {"train_loss": -11.853952407836914, "global_step": 267011, "epoch": 1589} {"train_loss": -11.97804069519043, "global_step": 267012, "epoch": 1589} {"train_loss": -11.744776725769043, "global_step": 267013, "epoch": 1589} {"train_loss": -11.865385055541992, "global_step": 267014, "epoch": 1589} {"train_loss": -11.984416961669922, "global_step": 267015, "epoch": 1589} {"train_loss": -12.078516006469727, "global_step": 267016, "epoch": 1589} {"train_loss": -12.197647094726562, "global_step": 267017, "epoch": 1589} {"train_loss": -11.95713996887207, "global_step": 267018, "epoch": 1589} {"train_loss": -11.909059524536133, "global_step": 267019, "epoch": 1589} {"train_loss": -12.013179779052734, "global_step": 267020, "epoch": 1589} {"train_loss": -12.140772819519043, "global_step": 267021, "epoch": 1589} {"train_loss": -12.079633712768555, "global_step": 267022, "epoch": 1589} {"train_loss": -12.204853057861328, "global_step": 267023, "epoch": 1589} {"train_loss": -12.07210922241211, "global_step": 267024, "epoch": 1589} {"train_loss": -11.916122436523438, "global_step": 267025, "epoch": 1589} {"train_loss": -12.195837020874023, "global_step": 267026, "epoch": 1589} {"train_loss": -12.099322319030762, "global_step": 267027, "epoch": 1589} {"train_loss": -12.192723274230957, "global_step": 267028, "epoch": 1589} {"train_loss": -12.18911361694336, "global_step": 267029, "epoch": 1589} {"train_loss": -12.116849899291992, "global_step": 267030, "epoch": 1589} {"train_loss": -12.137824058532715, "global_step": 267031, "epoch": 1589} {"train_loss": -12.18497085571289, "global_step": 267032, "epoch": 1589} {"train_loss": -12.134734153747559, "global_step": 267033, "epoch": 1589} {"train_loss": -12.404092788696289, "global_step": 267034, "epoch": 1589} {"train_loss": -12.182439804077148, "global_step": 267035, "epoch": 1589} {"train_loss": -12.262662887573242, "global_step": 267036, "epoch": 1589} {"train_loss": -12.165223121643066, "global_step": 267037, "epoch": 1589} {"train_loss": -12.26169204711914, "global_step": 267038, "epoch": 1589} {"train_loss": -11.885271072387695, "global_step": 267039, "epoch": 1589} {"train_loss": -12.25611686706543, "global_step": 267040, "epoch": 1589} {"train_loss": -11.927164077758789, "global_step": 267041, "epoch": 1589} {"train_loss": -12.021867752075195, "global_step": 267042, "epoch": 1589} {"train_loss": -12.27717113494873, "global_step": 267043, "epoch": 1589} {"train_loss": -12.014039039611816, "global_step": 267044, "epoch": 1589} {"train_loss": -11.612754821777344, "global_step": 267045, "epoch": 1589} {"train_loss": -11.656248092651367, "global_step": 267046, "epoch": 1589} {"train_loss": -10.735565185546875, "global_step": 267047, "epoch": 1589} {"train_loss": -11.671524047851562, "global_step": 267048, "epoch": 1589} {"train_loss": -10.738311767578125, "global_step": 267049, "epoch": 1589} {"train_loss": -10.940475463867188, "global_step": 267050, "epoch": 1589} {"train_loss": -11.302009582519531, "global_step": 267051, "epoch": 1589} {"train_loss": -11.26419448852539, "global_step": 267052, "epoch": 1589} {"train_loss": -10.629236221313477, "global_step": 267053, "epoch": 1589} {"train_loss": -11.17856216430664, "global_step": 267054, "epoch": 1589} {"train_loss": -10.742707252502441, "global_step": 267055, "epoch": 1589} {"train_loss": -11.152923583984375, "global_step": 267056, "epoch": 1589} {"train_loss": -11.093910217285156, "global_step": 267057, "epoch": 1589} {"train_loss": -11.254079818725586, "global_step": 267058, "epoch": 1589} {"train_loss": -11.05964469909668, "global_step": 267059, "epoch": 1589} {"train_loss": -10.441804885864258, "global_step": 267060, "epoch": 1589} {"train_loss": -12.012565612792969, "global_step": 267061, "epoch": 1589} {"train_loss": -10.27658748626709, "global_step": 267062, "epoch": 1589} {"train_loss": -11.310805320739746, "global_step": 267063, "epoch": 1589} {"train_loss": -11.48598861694336, "global_step": 267064, "epoch": 1589} {"train_loss": -10.531326293945312, "global_step": 267065, "epoch": 1589} {"train_loss": -11.663773536682129, "global_step": 267066, "epoch": 1589} {"train_loss": -11.310831069946289, "global_step": 267067, "epoch": 1589} {"train_loss": -10.97331428527832, "global_step": 267068, "epoch": 1589} {"train_loss": -11.781187057495117, "global_step": 267069, "epoch": 1589} {"train_loss": -10.984249114990234, "global_step": 267070, "epoch": 1589} {"train_loss": -11.663688659667969, "global_step": 267071, "epoch": 1589} {"train_loss": -10.700414657592773, "global_step": 267072, "epoch": 1589} {"train_loss": -11.679596900939941, "global_step": 267073, "epoch": 1589} {"train_loss": -10.82213306427002, "global_step": 267074, "epoch": 1589} {"train_loss": -11.562414169311523, "global_step": 267075, "epoch": 1589} {"train_loss": -11.791305541992188, "global_step": 267076, "epoch": 1589} {"train_loss": -11.016826629638672, "global_step": 267077, "epoch": 1589} {"train_loss": -11.924911499023438, "global_step": 267078, "epoch": 1589} {"train_loss": -11.506000518798828, "global_step": 267079, "epoch": 1589} {"train_loss": -11.927724838256836, "global_step": 267080, "epoch": 1589} {"train_loss": -11.630189895629883, "global_step": 267081, "epoch": 1589} {"train_loss": -11.882698059082031, "global_step": 267082, "epoch": 1589} {"train_loss": -11.587732315063477, "global_step": 267083, "epoch": 1589} {"train_loss": -12.01842212677002, "global_step": 267084, "epoch": 1589} {"train_loss": -11.759988784790039, "global_step": 267085, "epoch": 1589} {"train_loss": -11.749231338500977, "global_step": 267086, "epoch": 1589} {"train_loss": -11.541735649108887, "global_step": 267087, "epoch": 1589} {"train_loss": -11.81364631652832, "global_step": 267088, "epoch": 1589} {"train_loss": -11.898984909057617, "global_step": 267089, "epoch": 1589} {"train_loss": -11.95022201538086, "global_step": 267090, "epoch": 1589} {"train_loss": -12.099039077758789, "global_step": 267091, "epoch": 1589} {"train_loss": -11.933012008666992, "global_step": 267092, "epoch": 1589} {"train_loss": -12.029909133911133, "global_step": 267093, "epoch": 1589} {"train_loss": -11.938106536865234, "global_step": 267094, "epoch": 1589} {"train_loss": -11.94019603729248, "global_step": 267095, "epoch": 1589} {"train_loss": -11.997108459472656, "global_step": 267096, "epoch": 1589} {"train_loss": -11.796523094177246, "global_step": 267097, "epoch": 1589} {"train_loss": -12.102762222290039, "global_step": 267098, "epoch": 1589} {"train_loss": -11.867743492126465, "global_step": 267099, "epoch": 1589} {"train_loss": -12.045843124389648, "global_step": 267100, "epoch": 1589} {"train_loss": -12.139632225036621, "global_step": 267101, "epoch": 1589} {"train_loss": -12.163009643554688, "global_step": 267102, "epoch": 1589} {"train_loss": -12.125100135803223, "global_step": 267103, "epoch": 1589} {"train_loss": -12.121591567993164, "global_step": 267104, "epoch": 1589} {"train_loss": -12.07887077331543, "global_step": 267105, "epoch": 1589} {"train_loss": -12.136201858520508, "global_step": 267106, "epoch": 1589} {"train_loss": -12.137331008911133, "global_step": 267107, "epoch": 1589} {"train_loss": -11.798213958740234, "global_step": 267108, "epoch": 1589} {"train_loss": -11.994861602783203, "global_step": 267109, "epoch": 1589} {"train_loss": -11.939831733703613, "global_step": 267110, "epoch": 1589} {"train_loss": -11.568790435791016, "global_step": 267111, "epoch": 1589} {"train_loss": -11.790916442871094, "global_step": 267112, "epoch": 1589} {"train_loss": -11.888710975646973, "global_step": 267113, "epoch": 1589} {"train_loss": -11.919455528259277, "global_step": 267114, "epoch": 1589} {"train_loss": -11.451335906982422, "global_step": 267115, "epoch": 1589} {"train_loss": -11.911169052124023, "global_step": 267116, "epoch": 1589} {"train_loss": -11.53831958770752, "global_step": 267117, "epoch": 1589} {"train_loss": -12.194939613342285, "global_step": 267118, "epoch": 1589} {"train_loss": -11.713368268240066, "global_step": 267119, "epoch": 1589, "val_loss": 273291.75} {"train_loss": -11.448128700256348, "global_step": 267120, "epoch": 1590} {"train_loss": -11.665398597717285, "global_step": 267121, "epoch": 1590} {"train_loss": -11.366689682006836, "global_step": 267122, "epoch": 1590} {"train_loss": -12.07448959350586, "global_step": 267123, "epoch": 1590} {"train_loss": -11.49678897857666, "global_step": 267124, "epoch": 1590} {"train_loss": -12.078819274902344, "global_step": 267125, "epoch": 1590} {"train_loss": -11.765528678894043, "global_step": 267126, "epoch": 1590} {"train_loss": -11.927935600280762, "global_step": 267127, "epoch": 1590} {"train_loss": -11.80035400390625, "global_step": 267128, "epoch": 1590} {"train_loss": -11.340996742248535, "global_step": 267129, "epoch": 1590} {"train_loss": -11.822836875915527, "global_step": 267130, "epoch": 1590} {"train_loss": -11.504756927490234, "global_step": 267131, "epoch": 1590} {"train_loss": -11.741302490234375, "global_step": 267132, "epoch": 1590} {"train_loss": -11.21658706665039, "global_step": 267133, "epoch": 1590} {"train_loss": -11.909218788146973, "global_step": 267134, "epoch": 1590} {"train_loss": -12.138147354125977, "global_step": 267135, "epoch": 1590} {"train_loss": -11.286847114562988, "global_step": 267136, "epoch": 1590} {"train_loss": -11.738958358764648, "global_step": 267137, "epoch": 1590} {"train_loss": -11.289877891540527, "global_step": 267138, "epoch": 1590} {"train_loss": -11.829193115234375, "global_step": 267139, "epoch": 1590} {"train_loss": -11.316728591918945, "global_step": 267140, "epoch": 1590} {"train_loss": -11.606805801391602, "global_step": 267141, "epoch": 1590} {"train_loss": -11.24503231048584, "global_step": 267142, "epoch": 1590} {"train_loss": -11.190834999084473, "global_step": 267143, "epoch": 1590} {"train_loss": -11.88035774230957, "global_step": 267144, "epoch": 1590} {"train_loss": -11.78720474243164, "global_step": 267145, "epoch": 1590} {"train_loss": -11.878625869750977, "global_step": 267146, "epoch": 1590} {"train_loss": -11.89138126373291, "global_step": 267147, "epoch": 1590} {"train_loss": -11.923502922058105, "global_step": 267148, "epoch": 1590} {"train_loss": -12.198189735412598, "global_step": 267149, "epoch": 1590} {"train_loss": -12.101485252380371, "global_step": 267150, "epoch": 1590} {"train_loss": -11.862180709838867, "global_step": 267151, "epoch": 1590} {"train_loss": -11.680322647094727, "global_step": 267152, "epoch": 1590} {"train_loss": -11.887495994567871, "global_step": 267153, "epoch": 1590} {"train_loss": -11.445793151855469, "global_step": 267154, "epoch": 1590} {"train_loss": -11.844219207763672, "global_step": 267155, "epoch": 1590} {"train_loss": -11.486770629882812, "global_step": 267156, "epoch": 1590} {"train_loss": -11.950218200683594, "global_step": 267157, "epoch": 1590} {"train_loss": -11.52277946472168, "global_step": 267158, "epoch": 1590} {"train_loss": -11.944622993469238, "global_step": 267159, "epoch": 1590} {"train_loss": -11.719491004943848, "global_step": 267160, "epoch": 1590} {"train_loss": -12.086748123168945, "global_step": 267161, "epoch": 1590} {"train_loss": -11.989295959472656, "global_step": 267162, "epoch": 1590} {"train_loss": -11.760154724121094, "global_step": 267163, "epoch": 1590} {"train_loss": -12.10965347290039, "global_step": 267164, "epoch": 1590} {"train_loss": -11.616939544677734, "global_step": 267165, "epoch": 1590} {"train_loss": -11.959758758544922, "global_step": 267166, "epoch": 1590} {"train_loss": -11.632274627685547, "global_step": 267167, "epoch": 1590} {"train_loss": -11.96031379699707, "global_step": 267168, "epoch": 1590} {"train_loss": -12.113204956054688, "global_step": 267169, "epoch": 1590} {"train_loss": -11.828514099121094, "global_step": 267170, "epoch": 1590} {"train_loss": -11.836624145507812, "global_step": 267171, "epoch": 1590} {"train_loss": -12.180027961730957, "global_step": 267172, "epoch": 1590} {"train_loss": -11.81967544555664, "global_step": 267173, "epoch": 1590} {"train_loss": -12.209671020507812, "global_step": 267174, "epoch": 1590} {"train_loss": -11.893547058105469, "global_step": 267175, "epoch": 1590} {"train_loss": -12.132108688354492, "global_step": 267176, "epoch": 1590} {"train_loss": -11.843400955200195, "global_step": 267177, "epoch": 1590} {"train_loss": -12.366308212280273, "global_step": 267178, "epoch": 1590} {"train_loss": -11.883468627929688, "global_step": 267179, "epoch": 1590} {"train_loss": -12.28345775604248, "global_step": 267180, "epoch": 1590} {"train_loss": -12.155953407287598, "global_step": 267181, "epoch": 1590} {"train_loss": -12.027115821838379, "global_step": 267182, "epoch": 1590} {"train_loss": -11.878852844238281, "global_step": 267183, "epoch": 1590} {"train_loss": -12.223366737365723, "global_step": 267184, "epoch": 1590} {"train_loss": -12.241710662841797, "global_step": 267185, "epoch": 1590} {"train_loss": -12.114265441894531, "global_step": 267186, "epoch": 1590} {"train_loss": -11.951597213745117, "global_step": 267187, "epoch": 1590} {"train_loss": -12.212743759155273, "global_step": 267188, "epoch": 1590} {"train_loss": -12.098968505859375, "global_step": 267189, "epoch": 1590} {"train_loss": -12.039660453796387, "global_step": 267190, "epoch": 1590} {"train_loss": -12.46756649017334, "global_step": 267191, "epoch": 1590} {"train_loss": -11.955371856689453, "global_step": 267192, "epoch": 1590} {"train_loss": -11.657108306884766, "global_step": 267193, "epoch": 1590} {"train_loss": -12.287938117980957, "global_step": 267194, "epoch": 1590} {"train_loss": -11.949316024780273, "global_step": 267195, "epoch": 1590} {"train_loss": -11.786240577697754, "global_step": 267196, "epoch": 1590} {"train_loss": -12.185007095336914, "global_step": 267197, "epoch": 1590} {"train_loss": -11.631245613098145, "global_step": 267198, "epoch": 1590} {"train_loss": -11.090276718139648, "global_step": 267199, "epoch": 1590} {"train_loss": -11.460916519165039, "global_step": 267200, "epoch": 1590} {"train_loss": -11.665075302124023, "global_step": 267201, "epoch": 1590} {"train_loss": -9.800609588623047, "global_step": 267202, "epoch": 1590} {"train_loss": -10.941875457763672, "global_step": 267203, "epoch": 1590} {"train_loss": -11.491281509399414, "global_step": 267204, "epoch": 1590} {"train_loss": -9.926345825195312, "global_step": 267205, "epoch": 1590} {"train_loss": -11.574697494506836, "global_step": 267206, "epoch": 1590} {"train_loss": -10.900004386901855, "global_step": 267207, "epoch": 1590} {"train_loss": -10.779865264892578, "global_step": 267208, "epoch": 1590} {"train_loss": -11.228804588317871, "global_step": 267209, "epoch": 1590} {"train_loss": -11.258838653564453, "global_step": 267210, "epoch": 1590} {"train_loss": -10.298385620117188, "global_step": 267211, "epoch": 1590} {"train_loss": -11.512057304382324, "global_step": 267212, "epoch": 1590} {"train_loss": -10.09074878692627, "global_step": 267213, "epoch": 1590} {"train_loss": -10.662642478942871, "global_step": 267214, "epoch": 1590} {"train_loss": -11.411832809448242, "global_step": 267215, "epoch": 1590} {"train_loss": -10.618375778198242, "global_step": 267216, "epoch": 1590} {"train_loss": -11.549836158752441, "global_step": 267217, "epoch": 1590} {"train_loss": -11.396488189697266, "global_step": 267218, "epoch": 1590} {"train_loss": -11.136406898498535, "global_step": 267219, "epoch": 1590} {"train_loss": -11.116912841796875, "global_step": 267220, "epoch": 1590} {"train_loss": -11.417241096496582, "global_step": 267221, "epoch": 1590} {"train_loss": -11.259042739868164, "global_step": 267222, "epoch": 1590} {"train_loss": -11.554367065429688, "global_step": 267223, "epoch": 1590} {"train_loss": -11.289678573608398, "global_step": 267224, "epoch": 1590} {"train_loss": -11.547754287719727, "global_step": 267225, "epoch": 1590} {"train_loss": -11.558083534240723, "global_step": 267226, "epoch": 1590} {"train_loss": -11.11455249786377, "global_step": 267227, "epoch": 1590} {"train_loss": -11.545281410217285, "global_step": 267228, "epoch": 1590} {"train_loss": -11.228742599487305, "global_step": 267229, "epoch": 1590} {"train_loss": -11.77738094329834, "global_step": 267230, "epoch": 1590} {"train_loss": -11.478389739990234, "global_step": 267231, "epoch": 1590} {"train_loss": -11.99293327331543, "global_step": 267232, "epoch": 1590} {"train_loss": -11.920543670654297, "global_step": 267233, "epoch": 1590} {"train_loss": -11.750125885009766, "global_step": 267234, "epoch": 1590} {"train_loss": -11.846511840820312, "global_step": 267235, "epoch": 1590} {"train_loss": -11.987326622009277, "global_step": 267236, "epoch": 1590} {"train_loss": -11.67548942565918, "global_step": 267237, "epoch": 1590} {"train_loss": -11.722352981567383, "global_step": 267238, "epoch": 1590} {"train_loss": -11.884306907653809, "global_step": 267239, "epoch": 1590} {"train_loss": -11.760127067565918, "global_step": 267240, "epoch": 1590} {"train_loss": -12.027099609375, "global_step": 267241, "epoch": 1590} {"train_loss": -11.832191467285156, "global_step": 267242, "epoch": 1590} {"train_loss": -11.946054458618164, "global_step": 267243, "epoch": 1590} {"train_loss": -11.986370086669922, "global_step": 267244, "epoch": 1590} {"train_loss": -11.84778118133545, "global_step": 267245, "epoch": 1590} {"train_loss": -11.949514389038086, "global_step": 267246, "epoch": 1590} {"train_loss": -11.925455093383789, "global_step": 267247, "epoch": 1590} {"train_loss": -11.902454376220703, "global_step": 267248, "epoch": 1590} {"train_loss": -11.71588134765625, "global_step": 267249, "epoch": 1590} {"train_loss": -12.199097633361816, "global_step": 267250, "epoch": 1590} {"train_loss": -11.874454498291016, "global_step": 267251, "epoch": 1590} {"train_loss": -12.140227317810059, "global_step": 267252, "epoch": 1590} {"train_loss": -12.010091781616211, "global_step": 267253, "epoch": 1590} {"train_loss": -11.858759880065918, "global_step": 267254, "epoch": 1590} {"train_loss": -12.101780891418457, "global_step": 267255, "epoch": 1590} {"train_loss": -12.070764541625977, "global_step": 267256, "epoch": 1590} {"train_loss": -12.152737617492676, "global_step": 267257, "epoch": 1590} {"train_loss": -12.068219184875488, "global_step": 267258, "epoch": 1590} {"train_loss": -12.178438186645508, "global_step": 267259, "epoch": 1590} {"train_loss": -12.266014099121094, "global_step": 267260, "epoch": 1590} {"train_loss": -12.214111328125, "global_step": 267261, "epoch": 1590} {"train_loss": -12.0227632522583, "global_step": 267262, "epoch": 1590} {"train_loss": -12.330413818359375, "global_step": 267263, "epoch": 1590} {"train_loss": -12.257844924926758, "global_step": 267264, "epoch": 1590} {"train_loss": -12.248684883117676, "global_step": 267265, "epoch": 1590} {"train_loss": -12.25940227508545, "global_step": 267266, "epoch": 1590} {"train_loss": -12.12198257446289, "global_step": 267267, "epoch": 1590} {"train_loss": -12.246400833129883, "global_step": 267268, "epoch": 1590} {"train_loss": -12.128095626831055, "global_step": 267269, "epoch": 1590} {"train_loss": -12.113039016723633, "global_step": 267270, "epoch": 1590} {"train_loss": -12.113163948059082, "global_step": 267271, "epoch": 1590} {"train_loss": -12.060005187988281, "global_step": 267272, "epoch": 1590} {"train_loss": -12.111601829528809, "global_step": 267273, "epoch": 1590} {"train_loss": -12.00562858581543, "global_step": 267274, "epoch": 1590} {"train_loss": -12.327156066894531, "global_step": 267275, "epoch": 1590} {"train_loss": -11.79515266418457, "global_step": 267276, "epoch": 1590} {"train_loss": -12.272056579589844, "global_step": 267277, "epoch": 1590} {"train_loss": -12.181256294250488, "global_step": 267278, "epoch": 1590} {"train_loss": -12.13906192779541, "global_step": 267279, "epoch": 1590} {"train_loss": -11.991952896118164, "global_step": 267280, "epoch": 1590} {"train_loss": -12.343233108520508, "global_step": 267281, "epoch": 1590} {"train_loss": -12.106193542480469, "global_step": 267282, "epoch": 1590} {"train_loss": -12.369117736816406, "global_step": 267283, "epoch": 1590} {"train_loss": -12.027420043945312, "global_step": 267284, "epoch": 1590} {"train_loss": -11.82181167602539, "global_step": 267285, "epoch": 1590} {"train_loss": -12.201445579528809, "global_step": 267286, "epoch": 1590} {"train_loss": -11.77176022529602, "global_step": 267287, "epoch": 1590, "val_loss": 274203.125, "train_action_mse_error": 5.335143566131592} {"train_loss": -11.327173233032227, "global_step": 267288, "epoch": 1591} {"train_loss": -11.50999641418457, "global_step": 267289, "epoch": 1591} {"train_loss": -11.650979995727539, "global_step": 267290, "epoch": 1591} {"train_loss": -12.030437469482422, "global_step": 267291, "epoch": 1591} {"train_loss": -11.533635139465332, "global_step": 267292, "epoch": 1591} {"train_loss": -12.215856552124023, "global_step": 267293, "epoch": 1591} {"train_loss": -11.093328475952148, "global_step": 267294, "epoch": 1591} {"train_loss": -11.759771347045898, "global_step": 267295, "epoch": 1591} {"train_loss": -11.431527137756348, "global_step": 267296, "epoch": 1591} {"train_loss": -11.473209381103516, "global_step": 267297, "epoch": 1591} {"train_loss": -11.836807250976562, "global_step": 267298, "epoch": 1591} {"train_loss": -11.45705795288086, "global_step": 267299, "epoch": 1591} {"train_loss": -11.753549575805664, "global_step": 267300, "epoch": 1591} {"train_loss": -10.248950004577637, "global_step": 267301, "epoch": 1591} {"train_loss": -10.916748046875, "global_step": 267302, "epoch": 1591} {"train_loss": -11.317656517028809, "global_step": 267303, "epoch": 1591} {"train_loss": -9.214790344238281, "global_step": 267304, "epoch": 1591} {"train_loss": -11.50876235961914, "global_step": 267305, "epoch": 1591} {"train_loss": -11.749565124511719, "global_step": 267306, "epoch": 1591} {"train_loss": -10.126839637756348, "global_step": 267307, "epoch": 1591} {"train_loss": -10.521760940551758, "global_step": 267308, "epoch": 1591} {"train_loss": -11.772666931152344, "global_step": 267309, "epoch": 1591} {"train_loss": -11.55009651184082, "global_step": 267310, "epoch": 1591} {"train_loss": -10.98305892944336, "global_step": 267311, "epoch": 1591} {"train_loss": -11.6205415725708, "global_step": 267312, "epoch": 1591} {"train_loss": -11.906233787536621, "global_step": 267313, "epoch": 1591} {"train_loss": -11.432388305664062, "global_step": 267314, "epoch": 1591} {"train_loss": -11.83230972290039, "global_step": 267315, "epoch": 1591} {"train_loss": -11.846757888793945, "global_step": 267316, "epoch": 1591} {"train_loss": -11.618825912475586, "global_step": 267317, "epoch": 1591} {"train_loss": -11.015589714050293, "global_step": 267318, "epoch": 1591} {"train_loss": -11.62570571899414, "global_step": 267319, "epoch": 1591} {"train_loss": -11.230674743652344, "global_step": 267320, "epoch": 1591} {"train_loss": -11.483814239501953, "global_step": 267321, "epoch": 1591} {"train_loss": -11.294901847839355, "global_step": 267322, "epoch": 1591} {"train_loss": -11.294143676757812, "global_step": 267323, "epoch": 1591} {"train_loss": -11.420452117919922, "global_step": 267324, "epoch": 1591} {"train_loss": -11.295204162597656, "global_step": 267325, "epoch": 1591} {"train_loss": -11.380629539489746, "global_step": 267326, "epoch": 1591} {"train_loss": -11.02519702911377, "global_step": 267327, "epoch": 1591} {"train_loss": -11.743492126464844, "global_step": 267328, "epoch": 1591} {"train_loss": -9.212697982788086, "global_step": 267329, "epoch": 1591} {"train_loss": -11.120962142944336, "global_step": 267330, "epoch": 1591} {"train_loss": -10.98614501953125, "global_step": 267331, "epoch": 1591} {"train_loss": -10.67219352722168, "global_step": 267332, "epoch": 1591} {"train_loss": -10.986929893493652, "global_step": 267333, "epoch": 1591} {"train_loss": -9.536367416381836, "global_step": 267334, "epoch": 1591} {"train_loss": -10.94301986694336, "global_step": 267335, "epoch": 1591} {"train_loss": -10.428754806518555, "global_step": 267336, "epoch": 1591} {"train_loss": -11.05513858795166, "global_step": 267337, "epoch": 1591} {"train_loss": -10.814615249633789, "global_step": 267338, "epoch": 1591} {"train_loss": -11.274808883666992, "global_step": 267339, "epoch": 1591} {"train_loss": -11.062034606933594, "global_step": 267340, "epoch": 1591} {"train_loss": -11.477095603942871, "global_step": 267341, "epoch": 1591} {"train_loss": -10.788236618041992, "global_step": 267342, "epoch": 1591} {"train_loss": -11.75752067565918, "global_step": 267343, "epoch": 1591} {"train_loss": -10.783958435058594, "global_step": 267344, "epoch": 1591} {"train_loss": -11.431198120117188, "global_step": 267345, "epoch": 1591} {"train_loss": -11.05902099609375, "global_step": 267346, "epoch": 1591} {"train_loss": -11.603219985961914, "global_step": 267347, "epoch": 1591} {"train_loss": -11.770051002502441, "global_step": 267348, "epoch": 1591} {"train_loss": -11.205591201782227, "global_step": 267349, "epoch": 1591} {"train_loss": -11.65809440612793, "global_step": 267350, "epoch": 1591} {"train_loss": -11.1490478515625, "global_step": 267351, "epoch": 1591} {"train_loss": -11.65308952331543, "global_step": 267352, "epoch": 1591} {"train_loss": -11.613936424255371, "global_step": 267353, "epoch": 1591} {"train_loss": -11.337564468383789, "global_step": 267354, "epoch": 1591} {"train_loss": -11.241561889648438, "global_step": 267355, "epoch": 1591} {"train_loss": -11.312088012695312, "global_step": 267356, "epoch": 1591} {"train_loss": -11.479628562927246, "global_step": 267357, "epoch": 1591} {"train_loss": -11.481119155883789, "global_step": 267358, "epoch": 1591} {"train_loss": -11.534488677978516, "global_step": 267359, "epoch": 1591} {"train_loss": -11.409951210021973, "global_step": 267360, "epoch": 1591} {"train_loss": -11.745800018310547, "global_step": 267361, "epoch": 1591} {"train_loss": -11.503652572631836, "global_step": 267362, "epoch": 1591} {"train_loss": -11.83760929107666, "global_step": 267363, "epoch": 1591} {"train_loss": -11.58970832824707, "global_step": 267364, "epoch": 1591} {"train_loss": -11.824010848999023, "global_step": 267365, "epoch": 1591} {"train_loss": -11.724178314208984, "global_step": 267366, "epoch": 1591} {"train_loss": -11.658769607543945, "global_step": 267367, "epoch": 1591} {"train_loss": -11.7753324508667, "global_step": 267368, "epoch": 1591} {"train_loss": -11.51719856262207, "global_step": 267369, "epoch": 1591} {"train_loss": -11.808572769165039, "global_step": 267370, "epoch": 1591} {"train_loss": -11.520889282226562, "global_step": 267371, "epoch": 1591} {"train_loss": -11.662398338317871, "global_step": 267372, "epoch": 1591} {"train_loss": -11.839841842651367, "global_step": 267373, "epoch": 1591} {"train_loss": -11.599300384521484, "global_step": 267374, "epoch": 1591} {"train_loss": -11.768121719360352, "global_step": 267375, "epoch": 1591} {"train_loss": -11.769933700561523, "global_step": 267376, "epoch": 1591} {"train_loss": -11.716716766357422, "global_step": 267377, "epoch": 1591} {"train_loss": -11.766389846801758, "global_step": 267378, "epoch": 1591} {"train_loss": -11.509657859802246, "global_step": 267379, "epoch": 1591} {"train_loss": -11.82105541229248, "global_step": 267380, "epoch": 1591} {"train_loss": -11.678790092468262, "global_step": 267381, "epoch": 1591} {"train_loss": -11.326295852661133, "global_step": 267382, "epoch": 1591} {"train_loss": -11.974821090698242, "global_step": 267383, "epoch": 1591} {"train_loss": -11.530478477478027, "global_step": 267384, "epoch": 1591} {"train_loss": -11.689384460449219, "global_step": 267385, "epoch": 1591} {"train_loss": -11.505327224731445, "global_step": 267386, "epoch": 1591} {"train_loss": -11.277355194091797, "global_step": 267387, "epoch": 1591} {"train_loss": -11.905776023864746, "global_step": 267388, "epoch": 1591} {"train_loss": -11.280771255493164, "global_step": 267389, "epoch": 1591} {"train_loss": -11.84087085723877, "global_step": 267390, "epoch": 1591} {"train_loss": -11.848509788513184, "global_step": 267391, "epoch": 1591} {"train_loss": -11.83845329284668, "global_step": 267392, "epoch": 1591} {"train_loss": -11.944786071777344, "global_step": 267393, "epoch": 1591} {"train_loss": -11.958078384399414, "global_step": 267394, "epoch": 1591} {"train_loss": -12.022233009338379, "global_step": 267395, "epoch": 1591} {"train_loss": -11.934107780456543, "global_step": 267396, "epoch": 1591} {"train_loss": -11.970758438110352, "global_step": 267397, "epoch": 1591} {"train_loss": -11.922486305236816, "global_step": 267398, "epoch": 1591} {"train_loss": -12.07400131225586, "global_step": 267399, "epoch": 1591} {"train_loss": -12.075925827026367, "global_step": 267400, "epoch": 1591} {"train_loss": -11.849437713623047, "global_step": 267401, "epoch": 1591} {"train_loss": -12.05168342590332, "global_step": 267402, "epoch": 1591} {"train_loss": -11.921571731567383, "global_step": 267403, "epoch": 1591} {"train_loss": -11.869548797607422, "global_step": 267404, "epoch": 1591} {"train_loss": -11.902042388916016, "global_step": 267405, "epoch": 1591} {"train_loss": -12.312487602233887, "global_step": 267406, "epoch": 1591} {"train_loss": -11.94913101196289, "global_step": 267407, "epoch": 1591} {"train_loss": -12.098030090332031, "global_step": 267408, "epoch": 1591} {"train_loss": -11.997422218322754, "global_step": 267409, "epoch": 1591} {"train_loss": -12.048074722290039, "global_step": 267410, "epoch": 1591} {"train_loss": -12.265626907348633, "global_step": 267411, "epoch": 1591} {"train_loss": -11.976861000061035, "global_step": 267412, "epoch": 1591} {"train_loss": -12.204103469848633, "global_step": 267413, "epoch": 1591} {"train_loss": -12.175308227539062, "global_step": 267414, "epoch": 1591} {"train_loss": -12.043415069580078, "global_step": 267415, "epoch": 1591} {"train_loss": -12.368274688720703, "global_step": 267416, "epoch": 1591} {"train_loss": -12.249719619750977, "global_step": 267417, "epoch": 1591} {"train_loss": -12.350397109985352, "global_step": 267418, "epoch": 1591} {"train_loss": -12.213033676147461, "global_step": 267419, "epoch": 1591} {"train_loss": -12.31582260131836, "global_step": 267420, "epoch": 1591} {"train_loss": -12.236884117126465, "global_step": 267421, "epoch": 1591} {"train_loss": -12.188576698303223, "global_step": 267422, "epoch": 1591} {"train_loss": -12.260152816772461, "global_step": 267423, "epoch": 1591} {"train_loss": -12.237129211425781, "global_step": 267424, "epoch": 1591} {"train_loss": -12.298848152160645, "global_step": 267425, "epoch": 1591} {"train_loss": -12.303231239318848, "global_step": 267426, "epoch": 1591} {"train_loss": -12.040154457092285, "global_step": 267427, "epoch": 1591} {"train_loss": -11.987527847290039, "global_step": 267428, "epoch": 1591} {"train_loss": -11.809091567993164, "global_step": 267429, "epoch": 1591} {"train_loss": -11.800697326660156, "global_step": 267430, "epoch": 1591} {"train_loss": -12.218058586120605, "global_step": 267431, "epoch": 1591} {"train_loss": -11.360126495361328, "global_step": 267432, "epoch": 1591} {"train_loss": -11.448358535766602, "global_step": 267433, "epoch": 1591} {"train_loss": -12.421314239501953, "global_step": 267434, "epoch": 1591} {"train_loss": -11.712942123413086, "global_step": 267435, "epoch": 1591} {"train_loss": -11.214432716369629, "global_step": 267436, "epoch": 1591} {"train_loss": -12.100156784057617, "global_step": 267437, "epoch": 1591} {"train_loss": -12.11661148071289, "global_step": 267438, "epoch": 1591} {"train_loss": -11.256454467773438, "global_step": 267439, "epoch": 1591} {"train_loss": -11.415323257446289, "global_step": 267440, "epoch": 1591} {"train_loss": -12.358607292175293, "global_step": 267441, "epoch": 1591} {"train_loss": -11.687299728393555, "global_step": 267442, "epoch": 1591} {"train_loss": -11.938858032226562, "global_step": 267443, "epoch": 1591} {"train_loss": -11.902329444885254, "global_step": 267444, "epoch": 1591} {"train_loss": -12.007404327392578, "global_step": 267445, "epoch": 1591} {"train_loss": -11.251839637756348, "global_step": 267446, "epoch": 1591} {"train_loss": -11.97368335723877, "global_step": 267447, "epoch": 1591} {"train_loss": -11.781700134277344, "global_step": 267448, "epoch": 1591} {"train_loss": -11.684592247009277, "global_step": 267449, "epoch": 1591} {"train_loss": -11.934778213500977, "global_step": 267450, "epoch": 1591} {"train_loss": -11.185836791992188, "global_step": 267451, "epoch": 1591} {"train_loss": -11.609989166259766, "global_step": 267452, "epoch": 1591} {"train_loss": -12.004862785339355, "global_step": 267453, "epoch": 1591} {"train_loss": -11.071386337280273, "global_step": 267454, "epoch": 1591} {"train_loss": -11.594428987730117, "global_step": 267455, "epoch": 1591, "val_loss": 268212.3125} {"train_loss": -11.18348503112793, "global_step": 267456, "epoch": 1592} {"train_loss": -11.250879287719727, "global_step": 267457, "epoch": 1592} {"train_loss": -11.52226448059082, "global_step": 267458, "epoch": 1592} {"train_loss": -11.134317398071289, "global_step": 267459, "epoch": 1592} {"train_loss": -11.65910530090332, "global_step": 267460, "epoch": 1592} {"train_loss": -11.212830543518066, "global_step": 267461, "epoch": 1592} {"train_loss": -10.358053207397461, "global_step": 267462, "epoch": 1592} {"train_loss": -11.923856735229492, "global_step": 267463, "epoch": 1592} {"train_loss": -10.100906372070312, "global_step": 267464, "epoch": 1592} {"train_loss": -10.786581039428711, "global_step": 267465, "epoch": 1592} {"train_loss": -11.283490180969238, "global_step": 267466, "epoch": 1592} {"train_loss": -11.394634246826172, "global_step": 267467, "epoch": 1592} {"train_loss": -10.43613338470459, "global_step": 267468, "epoch": 1592} {"train_loss": -11.212581634521484, "global_step": 267469, "epoch": 1592} {"train_loss": -10.599252700805664, "global_step": 267470, "epoch": 1592} {"train_loss": -11.490724563598633, "global_step": 267471, "epoch": 1592} {"train_loss": -10.957523345947266, "global_step": 267472, "epoch": 1592} {"train_loss": -10.698516845703125, "global_step": 267473, "epoch": 1592} {"train_loss": -11.413361549377441, "global_step": 267474, "epoch": 1592} {"train_loss": -11.088022232055664, "global_step": 267475, "epoch": 1592} {"train_loss": -12.008041381835938, "global_step": 267476, "epoch": 1592} {"train_loss": -10.807132720947266, "global_step": 267477, "epoch": 1592} {"train_loss": -11.773204803466797, "global_step": 267478, "epoch": 1592} {"train_loss": -11.310434341430664, "global_step": 267479, "epoch": 1592} {"train_loss": -11.458377838134766, "global_step": 267480, "epoch": 1592} {"train_loss": -11.012737274169922, "global_step": 267481, "epoch": 1592} {"train_loss": -11.372285842895508, "global_step": 267482, "epoch": 1592} {"train_loss": -11.117754936218262, "global_step": 267483, "epoch": 1592} {"train_loss": -11.011197090148926, "global_step": 267484, "epoch": 1592} {"train_loss": -11.423867225646973, "global_step": 267485, "epoch": 1592} {"train_loss": -11.552711486816406, "global_step": 267486, "epoch": 1592} {"train_loss": -11.625246047973633, "global_step": 267487, "epoch": 1592} {"train_loss": -11.754955291748047, "global_step": 267488, "epoch": 1592} {"train_loss": -11.667587280273438, "global_step": 267489, "epoch": 1592} {"train_loss": -11.181941986083984, "global_step": 267490, "epoch": 1592} {"train_loss": -11.833051681518555, "global_step": 267491, "epoch": 1592} {"train_loss": -11.655277252197266, "global_step": 267492, "epoch": 1592} {"train_loss": -11.715932846069336, "global_step": 267493, "epoch": 1592} {"train_loss": -11.7479829788208, "global_step": 267494, "epoch": 1592} {"train_loss": -11.628301620483398, "global_step": 267495, "epoch": 1592} {"train_loss": -12.151346206665039, "global_step": 267496, "epoch": 1592} {"train_loss": -11.707856178283691, "global_step": 267497, "epoch": 1592} {"train_loss": -11.63827133178711, "global_step": 267498, "epoch": 1592} {"train_loss": -12.137187957763672, "global_step": 267499, "epoch": 1592} {"train_loss": -11.658814430236816, "global_step": 267500, "epoch": 1592} {"train_loss": -11.807235717773438, "global_step": 267501, "epoch": 1592} {"train_loss": -11.762685775756836, "global_step": 267502, "epoch": 1592} {"train_loss": -11.731707572937012, "global_step": 267503, "epoch": 1592} {"train_loss": -11.948064804077148, "global_step": 267504, "epoch": 1592} {"train_loss": -11.801568031311035, "global_step": 267505, "epoch": 1592} {"train_loss": -12.029022216796875, "global_step": 267506, "epoch": 1592} {"train_loss": -11.82626724243164, "global_step": 267507, "epoch": 1592} {"train_loss": -11.677759170532227, "global_step": 267508, "epoch": 1592} {"train_loss": -12.016481399536133, "global_step": 267509, "epoch": 1592} {"train_loss": -12.053133010864258, "global_step": 267510, "epoch": 1592} {"train_loss": -11.747685432434082, "global_step": 267511, "epoch": 1592} {"train_loss": -12.023763656616211, "global_step": 267512, "epoch": 1592} {"train_loss": -11.797591209411621, "global_step": 267513, "epoch": 1592} {"train_loss": -11.332125663757324, "global_step": 267514, "epoch": 1592} {"train_loss": -11.465385437011719, "global_step": 267515, "epoch": 1592} {"train_loss": -11.493231773376465, "global_step": 267516, "epoch": 1592} {"train_loss": -11.902037620544434, "global_step": 267517, "epoch": 1592} {"train_loss": -11.513522148132324, "global_step": 267518, "epoch": 1592} {"train_loss": -12.168061256408691, "global_step": 267519, "epoch": 1592} {"train_loss": -11.53375244140625, "global_step": 267520, "epoch": 1592} {"train_loss": -12.218734741210938, "global_step": 267521, "epoch": 1592} {"train_loss": -11.673938751220703, "global_step": 267522, "epoch": 1592} {"train_loss": -11.995681762695312, "global_step": 267523, "epoch": 1592} {"train_loss": -11.882040977478027, "global_step": 267524, "epoch": 1592} {"train_loss": -11.656744003295898, "global_step": 267525, "epoch": 1592} {"train_loss": -11.320089340209961, "global_step": 267526, "epoch": 1592} {"train_loss": -11.119138717651367, "global_step": 267527, "epoch": 1592} {"train_loss": -12.013574600219727, "global_step": 267528, "epoch": 1592} {"train_loss": -11.784656524658203, "global_step": 267529, "epoch": 1592} {"train_loss": -12.15723991394043, "global_step": 267530, "epoch": 1592} {"train_loss": -11.383407592773438, "global_step": 267531, "epoch": 1592} {"train_loss": -11.727294921875, "global_step": 267532, "epoch": 1592} {"train_loss": -12.067987442016602, "global_step": 267533, "epoch": 1592} {"train_loss": -11.691398620605469, "global_step": 267534, "epoch": 1592} {"train_loss": -12.091785430908203, "global_step": 267535, "epoch": 1592} {"train_loss": -11.93039608001709, "global_step": 267536, "epoch": 1592} {"train_loss": -11.870904922485352, "global_step": 267537, "epoch": 1592} {"train_loss": -11.735511779785156, "global_step": 267538, "epoch": 1592} {"train_loss": -10.848275184631348, "global_step": 267539, "epoch": 1592} {"train_loss": -11.709075927734375, "global_step": 267540, "epoch": 1592} {"train_loss": -11.20756721496582, "global_step": 267541, "epoch": 1592} {"train_loss": -10.773752212524414, "global_step": 267542, "epoch": 1592} {"train_loss": -12.183157920837402, "global_step": 267543, "epoch": 1592} {"train_loss": -11.051576614379883, "global_step": 267544, "epoch": 1592} {"train_loss": -11.717886924743652, "global_step": 267545, "epoch": 1592} {"train_loss": -11.89274787902832, "global_step": 267546, "epoch": 1592} {"train_loss": -10.909424781799316, "global_step": 267547, "epoch": 1592} {"train_loss": -11.883932113647461, "global_step": 267548, "epoch": 1592} {"train_loss": -12.010734558105469, "global_step": 267549, "epoch": 1592} {"train_loss": -11.52293586730957, "global_step": 267550, "epoch": 1592} {"train_loss": -12.024425506591797, "global_step": 267551, "epoch": 1592} {"train_loss": -11.601250648498535, "global_step": 267552, "epoch": 1592} {"train_loss": -11.60235595703125, "global_step": 267553, "epoch": 1592} {"train_loss": -11.777275085449219, "global_step": 267554, "epoch": 1592} {"train_loss": -10.963905334472656, "global_step": 267555, "epoch": 1592} {"train_loss": -11.799351692199707, "global_step": 267556, "epoch": 1592} {"train_loss": -11.231880187988281, "global_step": 267557, "epoch": 1592} {"train_loss": -11.947059631347656, "global_step": 267558, "epoch": 1592} {"train_loss": -11.390459060668945, "global_step": 267559, "epoch": 1592} {"train_loss": -11.462387084960938, "global_step": 267560, "epoch": 1592} {"train_loss": -11.624923706054688, "global_step": 267561, "epoch": 1592} {"train_loss": -11.629383087158203, "global_step": 267562, "epoch": 1592} {"train_loss": -11.674715042114258, "global_step": 267563, "epoch": 1592} {"train_loss": -11.898015975952148, "global_step": 267564, "epoch": 1592} {"train_loss": -11.434480667114258, "global_step": 267565, "epoch": 1592} {"train_loss": -11.651168823242188, "global_step": 267566, "epoch": 1592} {"train_loss": -12.003026962280273, "global_step": 267567, "epoch": 1592} {"train_loss": -11.586885452270508, "global_step": 267568, "epoch": 1592} {"train_loss": -11.956937789916992, "global_step": 267569, "epoch": 1592} {"train_loss": -11.56636905670166, "global_step": 267570, "epoch": 1592} {"train_loss": -12.12885856628418, "global_step": 267571, "epoch": 1592} {"train_loss": -11.744918823242188, "global_step": 267572, "epoch": 1592} {"train_loss": -11.711268424987793, "global_step": 267573, "epoch": 1592} {"train_loss": -11.480734825134277, "global_step": 267574, "epoch": 1592} {"train_loss": -11.668167114257812, "global_step": 267575, "epoch": 1592} {"train_loss": -11.603979110717773, "global_step": 267576, "epoch": 1592} {"train_loss": -11.775544166564941, "global_step": 267577, "epoch": 1592} {"train_loss": -10.915803909301758, "global_step": 267578, "epoch": 1592} {"train_loss": -11.923395156860352, "global_step": 267579, "epoch": 1592} {"train_loss": -11.627815246582031, "global_step": 267580, "epoch": 1592} {"train_loss": -12.039278030395508, "global_step": 267581, "epoch": 1592} {"train_loss": -11.405881881713867, "global_step": 267582, "epoch": 1592} {"train_loss": -11.29941177368164, "global_step": 267583, "epoch": 1592} {"train_loss": -11.687814712524414, "global_step": 267584, "epoch": 1592} {"train_loss": -11.844575881958008, "global_step": 267585, "epoch": 1592} {"train_loss": -11.882108688354492, "global_step": 267586, "epoch": 1592} {"train_loss": -11.599132537841797, "global_step": 267587, "epoch": 1592} {"train_loss": -11.869421005249023, "global_step": 267588, "epoch": 1592} {"train_loss": -11.479114532470703, "global_step": 267589, "epoch": 1592} {"train_loss": -11.902255058288574, "global_step": 267590, "epoch": 1592} {"train_loss": -11.559059143066406, "global_step": 267591, "epoch": 1592} {"train_loss": -11.364873886108398, "global_step": 267592, "epoch": 1592} {"train_loss": -11.551215171813965, "global_step": 267593, "epoch": 1592} {"train_loss": -11.038949966430664, "global_step": 267594, "epoch": 1592} {"train_loss": -11.598892211914062, "global_step": 267595, "epoch": 1592} {"train_loss": -11.47182846069336, "global_step": 267596, "epoch": 1592} {"train_loss": -11.344291687011719, "global_step": 267597, "epoch": 1592} {"train_loss": -11.960418701171875, "global_step": 267598, "epoch": 1592} {"train_loss": -11.346026420593262, "global_step": 267599, "epoch": 1592} {"train_loss": -11.839973449707031, "global_step": 267600, "epoch": 1592} {"train_loss": -11.454523086547852, "global_step": 267601, "epoch": 1592} {"train_loss": -12.060379028320312, "global_step": 267602, "epoch": 1592} {"train_loss": -11.929759979248047, "global_step": 267603, "epoch": 1592} {"train_loss": -11.993496894836426, "global_step": 267604, "epoch": 1592} {"train_loss": -12.071167945861816, "global_step": 267605, "epoch": 1592} {"train_loss": -11.847814559936523, "global_step": 267606, "epoch": 1592} {"train_loss": -11.998783111572266, "global_step": 267607, "epoch": 1592} {"train_loss": -12.137824058532715, "global_step": 267608, "epoch": 1592} {"train_loss": -11.995144844055176, "global_step": 267609, "epoch": 1592} {"train_loss": -12.032843589782715, "global_step": 267610, "epoch": 1592} {"train_loss": -12.094200134277344, "global_step": 267611, "epoch": 1592} {"train_loss": -11.709698677062988, "global_step": 267612, "epoch": 1592} {"train_loss": -11.946964263916016, "global_step": 267613, "epoch": 1592} {"train_loss": -11.680426597595215, "global_step": 267614, "epoch": 1592} {"train_loss": -12.05170726776123, "global_step": 267615, "epoch": 1592} {"train_loss": -11.771564483642578, "global_step": 267616, "epoch": 1592} {"train_loss": -12.156322479248047, "global_step": 267617, "epoch": 1592} {"train_loss": -11.838159561157227, "global_step": 267618, "epoch": 1592} {"train_loss": -11.814847946166992, "global_step": 267619, "epoch": 1592} {"train_loss": -11.932127952575684, "global_step": 267620, "epoch": 1592} {"train_loss": -11.557845115661621, "global_step": 267621, "epoch": 1592} {"train_loss": -11.925020217895508, "global_step": 267622, "epoch": 1592} {"train_loss": -11.618981684957232, "global_step": 267623, "epoch": 1592, "val_loss": 275614.25} {"train_loss": -11.643854141235352, "global_step": 267624, "epoch": 1593} {"train_loss": -11.665840148925781, "global_step": 267625, "epoch": 1593} {"train_loss": -11.719260215759277, "global_step": 267626, "epoch": 1593} {"train_loss": -11.984321594238281, "global_step": 267627, "epoch": 1593} {"train_loss": -11.772549629211426, "global_step": 267628, "epoch": 1593} {"train_loss": -11.847583770751953, "global_step": 267629, "epoch": 1593} {"train_loss": -11.705144882202148, "global_step": 267630, "epoch": 1593} {"train_loss": -12.196008682250977, "global_step": 267631, "epoch": 1593} {"train_loss": -11.35144329071045, "global_step": 267632, "epoch": 1593} {"train_loss": -12.258909225463867, "global_step": 267633, "epoch": 1593} {"train_loss": -12.102470397949219, "global_step": 267634, "epoch": 1593} {"train_loss": -11.59101676940918, "global_step": 267635, "epoch": 1593} {"train_loss": -11.892953872680664, "global_step": 267636, "epoch": 1593} {"train_loss": -11.926685333251953, "global_step": 267637, "epoch": 1593} {"train_loss": -11.967899322509766, "global_step": 267638, "epoch": 1593} {"train_loss": -11.76662826538086, "global_step": 267639, "epoch": 1593} {"train_loss": -11.606691360473633, "global_step": 267640, "epoch": 1593} {"train_loss": -11.616493225097656, "global_step": 267641, "epoch": 1593} {"train_loss": -12.30923080444336, "global_step": 267642, "epoch": 1593} {"train_loss": -11.532012939453125, "global_step": 267643, "epoch": 1593} {"train_loss": -11.827255249023438, "global_step": 267644, "epoch": 1593} {"train_loss": -12.095195770263672, "global_step": 267645, "epoch": 1593} {"train_loss": -11.918794631958008, "global_step": 267646, "epoch": 1593} {"train_loss": -12.212461471557617, "global_step": 267647, "epoch": 1593} {"train_loss": -11.51986026763916, "global_step": 267648, "epoch": 1593} {"train_loss": -11.678422927856445, "global_step": 267649, "epoch": 1593} {"train_loss": -11.868011474609375, "global_step": 267650, "epoch": 1593} {"train_loss": -11.580890655517578, "global_step": 267651, "epoch": 1593} {"train_loss": -11.151283264160156, "global_step": 267652, "epoch": 1593} {"train_loss": -11.564708709716797, "global_step": 267653, "epoch": 1593} {"train_loss": -11.286602020263672, "global_step": 267654, "epoch": 1593} {"train_loss": -10.967151641845703, "global_step": 267655, "epoch": 1593} {"train_loss": -11.166078567504883, "global_step": 267656, "epoch": 1593} {"train_loss": -10.471731185913086, "global_step": 267657, "epoch": 1593} {"train_loss": -11.482553482055664, "global_step": 267658, "epoch": 1593} {"train_loss": -11.200634956359863, "global_step": 267659, "epoch": 1593} {"train_loss": -10.211374282836914, "global_step": 267660, "epoch": 1593} {"train_loss": -10.351932525634766, "global_step": 267661, "epoch": 1593} {"train_loss": -11.813676834106445, "global_step": 267662, "epoch": 1593} {"train_loss": -10.506570816040039, "global_step": 267663, "epoch": 1593} {"train_loss": -11.486898422241211, "global_step": 267664, "epoch": 1593} {"train_loss": -11.08543872833252, "global_step": 267665, "epoch": 1593} {"train_loss": -11.607486724853516, "global_step": 267666, "epoch": 1593} {"train_loss": -11.415725708007812, "global_step": 267667, "epoch": 1593} {"train_loss": -11.629467964172363, "global_step": 267668, "epoch": 1593} {"train_loss": -11.385209083557129, "global_step": 267669, "epoch": 1593} {"train_loss": -11.617996215820312, "global_step": 267670, "epoch": 1593} {"train_loss": -11.424627304077148, "global_step": 267671, "epoch": 1593} {"train_loss": -11.718473434448242, "global_step": 267672, "epoch": 1593} {"train_loss": -11.799539566040039, "global_step": 267673, "epoch": 1593} {"train_loss": -11.718778610229492, "global_step": 267674, "epoch": 1593} {"train_loss": -11.87960147857666, "global_step": 267675, "epoch": 1593} {"train_loss": -11.543479919433594, "global_step": 267676, "epoch": 1593} {"train_loss": -10.966245651245117, "global_step": 267677, "epoch": 1593} {"train_loss": -11.582014083862305, "global_step": 267678, "epoch": 1593} {"train_loss": -11.455066680908203, "global_step": 267679, "epoch": 1593} {"train_loss": -11.430442810058594, "global_step": 267680, "epoch": 1593} {"train_loss": -11.663827896118164, "global_step": 267681, "epoch": 1593} {"train_loss": -11.621108055114746, "global_step": 267682, "epoch": 1593} {"train_loss": -11.552345275878906, "global_step": 267683, "epoch": 1593} {"train_loss": -11.738842010498047, "global_step": 267684, "epoch": 1593} {"train_loss": -11.187649726867676, "global_step": 267685, "epoch": 1593} {"train_loss": -11.741090774536133, "global_step": 267686, "epoch": 1593} {"train_loss": -11.385259628295898, "global_step": 267687, "epoch": 1593} {"train_loss": -11.684606552124023, "global_step": 267688, "epoch": 1593} {"train_loss": -11.789037704467773, "global_step": 267689, "epoch": 1593} {"train_loss": -11.749933242797852, "global_step": 267690, "epoch": 1593} {"train_loss": -11.737515449523926, "global_step": 267691, "epoch": 1593} {"train_loss": -11.569862365722656, "global_step": 267692, "epoch": 1593} {"train_loss": -11.69957160949707, "global_step": 267693, "epoch": 1593} {"train_loss": -11.439496994018555, "global_step": 267694, "epoch": 1593} {"train_loss": -12.021718978881836, "global_step": 267695, "epoch": 1593} {"train_loss": -11.452967643737793, "global_step": 267696, "epoch": 1593} {"train_loss": -11.971266746520996, "global_step": 267697, "epoch": 1593} {"train_loss": -11.625750541687012, "global_step": 267698, "epoch": 1593} {"train_loss": -11.876764297485352, "global_step": 267699, "epoch": 1593} {"train_loss": -11.597360610961914, "global_step": 267700, "epoch": 1593} {"train_loss": -11.938371658325195, "global_step": 267701, "epoch": 1593} {"train_loss": -11.990317344665527, "global_step": 267702, "epoch": 1593} {"train_loss": -11.886703491210938, "global_step": 267703, "epoch": 1593} {"train_loss": -11.783058166503906, "global_step": 267704, "epoch": 1593} {"train_loss": -11.886148452758789, "global_step": 267705, "epoch": 1593} {"train_loss": -11.843960762023926, "global_step": 267706, "epoch": 1593} {"train_loss": -11.93922233581543, "global_step": 267707, "epoch": 1593} {"train_loss": -11.910453796386719, "global_step": 267708, "epoch": 1593} {"train_loss": -11.849797248840332, "global_step": 267709, "epoch": 1593} {"train_loss": -11.96389389038086, "global_step": 267710, "epoch": 1593} {"train_loss": -11.797534942626953, "global_step": 267711, "epoch": 1593} {"train_loss": -12.167919158935547, "global_step": 267712, "epoch": 1593} {"train_loss": -11.651260375976562, "global_step": 267713, "epoch": 1593} {"train_loss": -12.20022201538086, "global_step": 267714, "epoch": 1593} {"train_loss": -11.870773315429688, "global_step": 267715, "epoch": 1593} {"train_loss": -12.15721321105957, "global_step": 267716, "epoch": 1593} {"train_loss": -11.955459594726562, "global_step": 267717, "epoch": 1593} {"train_loss": -12.161825180053711, "global_step": 267718, "epoch": 1593} {"train_loss": -11.888628005981445, "global_step": 267719, "epoch": 1593} {"train_loss": -12.106082916259766, "global_step": 267720, "epoch": 1593} {"train_loss": -11.826712608337402, "global_step": 267721, "epoch": 1593} {"train_loss": -11.898263931274414, "global_step": 267722, "epoch": 1593} {"train_loss": -11.682721138000488, "global_step": 267723, "epoch": 1593} {"train_loss": -12.090847969055176, "global_step": 267724, "epoch": 1593} {"train_loss": -11.86148738861084, "global_step": 267725, "epoch": 1593} {"train_loss": -12.11228084564209, "global_step": 267726, "epoch": 1593} {"train_loss": -12.075180053710938, "global_step": 267727, "epoch": 1593} {"train_loss": -11.967647552490234, "global_step": 267728, "epoch": 1593} {"train_loss": -12.283746719360352, "global_step": 267729, "epoch": 1593} {"train_loss": -12.126546859741211, "global_step": 267730, "epoch": 1593} {"train_loss": -12.15650749206543, "global_step": 267731, "epoch": 1593} {"train_loss": -11.96210765838623, "global_step": 267732, "epoch": 1593} {"train_loss": -12.122954368591309, "global_step": 267733, "epoch": 1593} {"train_loss": -12.029196739196777, "global_step": 267734, "epoch": 1593} {"train_loss": -12.199962615966797, "global_step": 267735, "epoch": 1593} {"train_loss": -11.796743392944336, "global_step": 267736, "epoch": 1593} {"train_loss": -12.247085571289062, "global_step": 267737, "epoch": 1593} {"train_loss": -11.597480773925781, "global_step": 267738, "epoch": 1593} {"train_loss": -12.101675033569336, "global_step": 267739, "epoch": 1593} {"train_loss": -11.953620910644531, "global_step": 267740, "epoch": 1593} {"train_loss": -12.136964797973633, "global_step": 267741, "epoch": 1593} {"train_loss": -11.887434005737305, "global_step": 267742, "epoch": 1593} {"train_loss": -12.231939315795898, "global_step": 267743, "epoch": 1593} {"train_loss": -11.855449676513672, "global_step": 267744, "epoch": 1593} {"train_loss": -11.690009117126465, "global_step": 267745, "epoch": 1593} {"train_loss": -11.62342643737793, "global_step": 267746, "epoch": 1593} {"train_loss": -11.763455390930176, "global_step": 267747, "epoch": 1593} {"train_loss": -12.065383911132812, "global_step": 267748, "epoch": 1593} {"train_loss": -11.800134658813477, "global_step": 267749, "epoch": 1593} {"train_loss": -12.15534496307373, "global_step": 267750, "epoch": 1593} {"train_loss": -11.732121467590332, "global_step": 267751, "epoch": 1593} {"train_loss": -11.470170974731445, "global_step": 267752, "epoch": 1593} {"train_loss": -12.199533462524414, "global_step": 267753, "epoch": 1593} {"train_loss": -11.949776649475098, "global_step": 267754, "epoch": 1593} {"train_loss": -11.971564292907715, "global_step": 267755, "epoch": 1593} {"train_loss": -12.29119873046875, "global_step": 267756, "epoch": 1593} {"train_loss": -11.884700775146484, "global_step": 267757, "epoch": 1593} {"train_loss": -11.427834510803223, "global_step": 267758, "epoch": 1593} {"train_loss": -12.037843704223633, "global_step": 267759, "epoch": 1593} {"train_loss": -11.908954620361328, "global_step": 267760, "epoch": 1593} {"train_loss": -11.676786422729492, "global_step": 267761, "epoch": 1593} {"train_loss": -11.937549591064453, "global_step": 267762, "epoch": 1593} {"train_loss": -12.125682830810547, "global_step": 267763, "epoch": 1593} {"train_loss": -12.234000205993652, "global_step": 267764, "epoch": 1593} {"train_loss": -12.030330657958984, "global_step": 267765, "epoch": 1593} {"train_loss": -12.141489028930664, "global_step": 267766, "epoch": 1593} {"train_loss": -12.209342956542969, "global_step": 267767, "epoch": 1593} {"train_loss": -12.26047134399414, "global_step": 267768, "epoch": 1593} {"train_loss": -12.140701293945312, "global_step": 267769, "epoch": 1593} {"train_loss": -12.23765754699707, "global_step": 267770, "epoch": 1593} {"train_loss": -12.055858612060547, "global_step": 267771, "epoch": 1593} {"train_loss": -12.208919525146484, "global_step": 267772, "epoch": 1593} {"train_loss": -12.16562271118164, "global_step": 267773, "epoch": 1593} {"train_loss": -12.067145347595215, "global_step": 267774, "epoch": 1593} {"train_loss": -12.2098388671875, "global_step": 267775, "epoch": 1593} {"train_loss": -11.727508544921875, "global_step": 267776, "epoch": 1593} {"train_loss": -11.54637622833252, "global_step": 267777, "epoch": 1593} {"train_loss": -11.766544342041016, "global_step": 267778, "epoch": 1593} {"train_loss": -12.281139373779297, "global_step": 267779, "epoch": 1593} {"train_loss": -11.634883880615234, "global_step": 267780, "epoch": 1593} {"train_loss": -12.168094635009766, "global_step": 267781, "epoch": 1593} {"train_loss": -12.270508766174316, "global_step": 267782, "epoch": 1593} {"train_loss": -11.728832244873047, "global_step": 267783, "epoch": 1593} {"train_loss": -11.777135848999023, "global_step": 267784, "epoch": 1593} {"train_loss": -12.207174301147461, "global_step": 267785, "epoch": 1593} {"train_loss": -12.114263534545898, "global_step": 267786, "epoch": 1593} {"train_loss": -12.002155303955078, "global_step": 267787, "epoch": 1593} {"train_loss": -11.732904434204102, "global_step": 267788, "epoch": 1593} {"train_loss": -12.001346588134766, "global_step": 267789, "epoch": 1593} {"train_loss": -11.870664596557617, "global_step": 267790, "epoch": 1593} {"train_loss": -11.797592838605246, "global_step": 267791, "epoch": 1593, "val_loss": 271670.4375} {"train_loss": -11.949569702148438, "global_step": 267792, "epoch": 1594} {"train_loss": -11.90241527557373, "global_step": 267793, "epoch": 1594} {"train_loss": -12.36931037902832, "global_step": 267794, "epoch": 1594} {"train_loss": -11.797882080078125, "global_step": 267795, "epoch": 1594} {"train_loss": -11.631814956665039, "global_step": 267796, "epoch": 1594} {"train_loss": -11.91385555267334, "global_step": 267797, "epoch": 1594} {"train_loss": -10.399458885192871, "global_step": 267798, "epoch": 1594} {"train_loss": -10.964925765991211, "global_step": 267799, "epoch": 1594} {"train_loss": -9.738374710083008, "global_step": 267800, "epoch": 1594} {"train_loss": -10.930453300476074, "global_step": 267801, "epoch": 1594} {"train_loss": -9.958044052124023, "global_step": 267802, "epoch": 1594} {"train_loss": -10.6753568649292, "global_step": 267803, "epoch": 1594} {"train_loss": -8.257818222045898, "global_step": 267804, "epoch": 1594} {"train_loss": -8.013925552368164, "global_step": 267805, "epoch": 1594} {"train_loss": -7.300581455230713, "global_step": 267806, "epoch": 1594} {"train_loss": -7.636113166809082, "global_step": 267807, "epoch": 1594} {"train_loss": -7.2200927734375, "global_step": 267808, "epoch": 1594} {"train_loss": -7.991510391235352, "global_step": 267809, "epoch": 1594} {"train_loss": -9.353050231933594, "global_step": 267810, "epoch": 1594} {"train_loss": -7.876481056213379, "global_step": 267811, "epoch": 1594} {"train_loss": -8.554647445678711, "global_step": 267812, "epoch": 1594} {"train_loss": -8.484672546386719, "global_step": 267813, "epoch": 1594} {"train_loss": -9.907855987548828, "global_step": 267814, "epoch": 1594} {"train_loss": -10.040121078491211, "global_step": 267815, "epoch": 1594} {"train_loss": -10.223834991455078, "global_step": 267816, "epoch": 1594} {"train_loss": -10.913375854492188, "global_step": 267817, "epoch": 1594} {"train_loss": -11.07542610168457, "global_step": 267818, "epoch": 1594} {"train_loss": -9.582124710083008, "global_step": 267819, "epoch": 1594} {"train_loss": -10.297451972961426, "global_step": 267820, "epoch": 1594} {"train_loss": -10.607357025146484, "global_step": 267821, "epoch": 1594} {"train_loss": -10.827180862426758, "global_step": 267822, "epoch": 1594} {"train_loss": -9.636335372924805, "global_step": 267823, "epoch": 1594} {"train_loss": -10.935596466064453, "global_step": 267824, "epoch": 1594} {"train_loss": -8.096756935119629, "global_step": 267825, "epoch": 1594} {"train_loss": -11.316560745239258, "global_step": 267826, "epoch": 1594} {"train_loss": -8.856325149536133, "global_step": 267827, "epoch": 1594} {"train_loss": -10.570796966552734, "global_step": 267828, "epoch": 1594} {"train_loss": -9.240928649902344, "global_step": 267829, "epoch": 1594} {"train_loss": -9.685951232910156, "global_step": 267830, "epoch": 1594} {"train_loss": -9.031684875488281, "global_step": 267831, "epoch": 1594} {"train_loss": -10.52556037902832, "global_step": 267832, "epoch": 1594} {"train_loss": -10.6554536819458, "global_step": 267833, "epoch": 1594} {"train_loss": -10.64809513092041, "global_step": 267834, "epoch": 1594} {"train_loss": -11.371222496032715, "global_step": 267835, "epoch": 1594} {"train_loss": -10.280369758605957, "global_step": 267836, "epoch": 1594} {"train_loss": -10.996776580810547, "global_step": 267837, "epoch": 1594} {"train_loss": -11.127863883972168, "global_step": 267838, "epoch": 1594} {"train_loss": -11.061734199523926, "global_step": 267839, "epoch": 1594} {"train_loss": -10.888910293579102, "global_step": 267840, "epoch": 1594} {"train_loss": -11.163810729980469, "global_step": 267841, "epoch": 1594} {"train_loss": -11.092901229858398, "global_step": 267842, "epoch": 1594} {"train_loss": -10.673120498657227, "global_step": 267843, "epoch": 1594} {"train_loss": -11.368291854858398, "global_step": 267844, "epoch": 1594} {"train_loss": -10.877172470092773, "global_step": 267845, "epoch": 1594} {"train_loss": -11.128246307373047, "global_step": 267846, "epoch": 1594} {"train_loss": -11.55192756652832, "global_step": 267847, "epoch": 1594} {"train_loss": -10.870509147644043, "global_step": 267848, "epoch": 1594} {"train_loss": -11.708978652954102, "global_step": 267849, "epoch": 1594} {"train_loss": -11.589811325073242, "global_step": 267850, "epoch": 1594} {"train_loss": -11.53121566772461, "global_step": 267851, "epoch": 1594} {"train_loss": -11.612913131713867, "global_step": 267852, "epoch": 1594} {"train_loss": -11.780162811279297, "global_step": 267853, "epoch": 1594} {"train_loss": -11.530878067016602, "global_step": 267854, "epoch": 1594} {"train_loss": -11.619559288024902, "global_step": 267855, "epoch": 1594} {"train_loss": -11.828095436096191, "global_step": 267856, "epoch": 1594} {"train_loss": -11.655319213867188, "global_step": 267857, "epoch": 1594} {"train_loss": -11.55727481842041, "global_step": 267858, "epoch": 1594} {"train_loss": -11.53495979309082, "global_step": 267859, "epoch": 1594} {"train_loss": -11.718488693237305, "global_step": 267860, "epoch": 1594} {"train_loss": -11.736934661865234, "global_step": 267861, "epoch": 1594} {"train_loss": -11.863207817077637, "global_step": 267862, "epoch": 1594} {"train_loss": -11.907490730285645, "global_step": 267863, "epoch": 1594} {"train_loss": -11.71255111694336, "global_step": 267864, "epoch": 1594} {"train_loss": -11.698500633239746, "global_step": 267865, "epoch": 1594} {"train_loss": -11.771031379699707, "global_step": 267866, "epoch": 1594} {"train_loss": -11.947336196899414, "global_step": 267867, "epoch": 1594} {"train_loss": -11.648311614990234, "global_step": 267868, "epoch": 1594} {"train_loss": -11.846844673156738, "global_step": 267869, "epoch": 1594} {"train_loss": -11.934503555297852, "global_step": 267870, "epoch": 1594} {"train_loss": -11.927095413208008, "global_step": 267871, "epoch": 1594} {"train_loss": -12.082391738891602, "global_step": 267872, "epoch": 1594} {"train_loss": -11.939910888671875, "global_step": 267873, "epoch": 1594} {"train_loss": -12.104413986206055, "global_step": 267874, "epoch": 1594} {"train_loss": -12.003105163574219, "global_step": 267875, "epoch": 1594} {"train_loss": -11.966852188110352, "global_step": 267876, "epoch": 1594} {"train_loss": -12.043227195739746, "global_step": 267877, "epoch": 1594} {"train_loss": -12.168909072875977, "global_step": 267878, "epoch": 1594} {"train_loss": -12.026172637939453, "global_step": 267879, "epoch": 1594} {"train_loss": -12.028736114501953, "global_step": 267880, "epoch": 1594} {"train_loss": -11.846424102783203, "global_step": 267881, "epoch": 1594} {"train_loss": -12.080418586730957, "global_step": 267882, "epoch": 1594} {"train_loss": -12.038945198059082, "global_step": 267883, "epoch": 1594} {"train_loss": -11.957270622253418, "global_step": 267884, "epoch": 1594} {"train_loss": -12.143461227416992, "global_step": 267885, "epoch": 1594} {"train_loss": -12.13980484008789, "global_step": 267886, "epoch": 1594} {"train_loss": -12.022839546203613, "global_step": 267887, "epoch": 1594} {"train_loss": -12.135478973388672, "global_step": 267888, "epoch": 1594} {"train_loss": -12.28384017944336, "global_step": 267889, "epoch": 1594} {"train_loss": -12.004518508911133, "global_step": 267890, "epoch": 1594} {"train_loss": -12.025106430053711, "global_step": 267891, "epoch": 1594} {"train_loss": -12.099166870117188, "global_step": 267892, "epoch": 1594} {"train_loss": -12.36149787902832, "global_step": 267893, "epoch": 1594} {"train_loss": -12.151529312133789, "global_step": 267894, "epoch": 1594} {"train_loss": -12.091958999633789, "global_step": 267895, "epoch": 1594} {"train_loss": -12.245244979858398, "global_step": 267896, "epoch": 1594} {"train_loss": -12.270536422729492, "global_step": 267897, "epoch": 1594} {"train_loss": -12.25680923461914, "global_step": 267898, "epoch": 1594} {"train_loss": -12.36530590057373, "global_step": 267899, "epoch": 1594} {"train_loss": -12.2821044921875, "global_step": 267900, "epoch": 1594} {"train_loss": -12.255997657775879, "global_step": 267901, "epoch": 1594} {"train_loss": -12.257792472839355, "global_step": 267902, "epoch": 1594} {"train_loss": -11.678297996520996, "global_step": 267903, "epoch": 1594} {"train_loss": -12.300320625305176, "global_step": 267904, "epoch": 1594} {"train_loss": -12.218049049377441, "global_step": 267905, "epoch": 1594} {"train_loss": -12.229336738586426, "global_step": 267906, "epoch": 1594} {"train_loss": -12.240240097045898, "global_step": 267907, "epoch": 1594} {"train_loss": -12.134536743164062, "global_step": 267908, "epoch": 1594} {"train_loss": -12.084256172180176, "global_step": 267909, "epoch": 1594} {"train_loss": -11.958046913146973, "global_step": 267910, "epoch": 1594} {"train_loss": -12.122779846191406, "global_step": 267911, "epoch": 1594} {"train_loss": -12.28165054321289, "global_step": 267912, "epoch": 1594} {"train_loss": -12.094913482666016, "global_step": 267913, "epoch": 1594} {"train_loss": -12.044888496398926, "global_step": 267914, "epoch": 1594} {"train_loss": -11.884346008300781, "global_step": 267915, "epoch": 1594} {"train_loss": -11.553396224975586, "global_step": 267916, "epoch": 1594} {"train_loss": -12.16378402709961, "global_step": 267917, "epoch": 1594} {"train_loss": -11.839143753051758, "global_step": 267918, "epoch": 1594} {"train_loss": -11.846960067749023, "global_step": 267919, "epoch": 1594} {"train_loss": -10.132049560546875, "global_step": 267920, "epoch": 1594} {"train_loss": -11.074777603149414, "global_step": 267921, "epoch": 1594} {"train_loss": -9.811448097229004, "global_step": 267922, "epoch": 1594} {"train_loss": -11.15704345703125, "global_step": 267923, "epoch": 1594} {"train_loss": -11.705353736877441, "global_step": 267924, "epoch": 1594} {"train_loss": -11.131187438964844, "global_step": 267925, "epoch": 1594} {"train_loss": -9.270207405090332, "global_step": 267926, "epoch": 1594} {"train_loss": -10.662055969238281, "global_step": 267927, "epoch": 1594} {"train_loss": -11.766164779663086, "global_step": 267928, "epoch": 1594} {"train_loss": -10.968209266662598, "global_step": 267929, "epoch": 1594} {"train_loss": -9.870920181274414, "global_step": 267930, "epoch": 1594} {"train_loss": -11.613529205322266, "global_step": 267931, "epoch": 1594} {"train_loss": -11.540929794311523, "global_step": 267932, "epoch": 1594} {"train_loss": -11.426689147949219, "global_step": 267933, "epoch": 1594} {"train_loss": -11.747472763061523, "global_step": 267934, "epoch": 1594} {"train_loss": -11.703401565551758, "global_step": 267935, "epoch": 1594} {"train_loss": -11.534048080444336, "global_step": 267936, "epoch": 1594} {"train_loss": -11.654189109802246, "global_step": 267937, "epoch": 1594} {"train_loss": -11.260618209838867, "global_step": 267938, "epoch": 1594} {"train_loss": -11.309793472290039, "global_step": 267939, "epoch": 1594} {"train_loss": -11.841499328613281, "global_step": 267940, "epoch": 1594} {"train_loss": -11.274974822998047, "global_step": 267941, "epoch": 1594} {"train_loss": -11.140783309936523, "global_step": 267942, "epoch": 1594} {"train_loss": -11.821126937866211, "global_step": 267943, "epoch": 1594} {"train_loss": -11.288792610168457, "global_step": 267944, "epoch": 1594} {"train_loss": -11.952936172485352, "global_step": 267945, "epoch": 1594} {"train_loss": -11.700599670410156, "global_step": 267946, "epoch": 1594} {"train_loss": -11.212800979614258, "global_step": 267947, "epoch": 1594} {"train_loss": -11.784449577331543, "global_step": 267948, "epoch": 1594} {"train_loss": -11.115852355957031, "global_step": 267949, "epoch": 1594} {"train_loss": -11.712212562561035, "global_step": 267950, "epoch": 1594} {"train_loss": -11.651585578918457, "global_step": 267951, "epoch": 1594} {"train_loss": -11.540494918823242, "global_step": 267952, "epoch": 1594} {"train_loss": -12.137214660644531, "global_step": 267953, "epoch": 1594} {"train_loss": -11.541772842407227, "global_step": 267954, "epoch": 1594} {"train_loss": -11.944477081298828, "global_step": 267955, "epoch": 1594} {"train_loss": -11.880837440490723, "global_step": 267956, "epoch": 1594} {"train_loss": -12.05670166015625, "global_step": 267957, "epoch": 1594} {"train_loss": -12.086219787597656, "global_step": 267958, "epoch": 1594} {"train_loss": -11.231040378411612, "global_step": 267959, "epoch": 1594, "val_loss": 263403.46875} {"train_loss": -11.649218559265137, "global_step": 267960, "epoch": 1595} {"train_loss": -11.742080688476562, "global_step": 267961, "epoch": 1595} {"train_loss": -11.755426406860352, "global_step": 267962, "epoch": 1595} {"train_loss": -11.541885375976562, "global_step": 267963, "epoch": 1595} {"train_loss": -11.923763275146484, "global_step": 267964, "epoch": 1595} {"train_loss": -11.601724624633789, "global_step": 267965, "epoch": 1595} {"train_loss": -11.990921020507812, "global_step": 267966, "epoch": 1595} {"train_loss": -11.148587226867676, "global_step": 267967, "epoch": 1595} {"train_loss": -11.524520874023438, "global_step": 267968, "epoch": 1595} {"train_loss": -11.636276245117188, "global_step": 267969, "epoch": 1595} {"train_loss": -11.453445434570312, "global_step": 267970, "epoch": 1595} {"train_loss": -11.72685432434082, "global_step": 267971, "epoch": 1595} {"train_loss": -11.649816513061523, "global_step": 267972, "epoch": 1595} {"train_loss": -11.79655647277832, "global_step": 267973, "epoch": 1595} {"train_loss": -11.207145690917969, "global_step": 267974, "epoch": 1595} {"train_loss": -12.030435562133789, "global_step": 267975, "epoch": 1595} {"train_loss": -11.44188117980957, "global_step": 267976, "epoch": 1595} {"train_loss": -11.883180618286133, "global_step": 267977, "epoch": 1595} {"train_loss": -11.991100311279297, "global_step": 267978, "epoch": 1595} {"train_loss": -11.72585678100586, "global_step": 267979, "epoch": 1595} {"train_loss": -12.102164268493652, "global_step": 267980, "epoch": 1595} {"train_loss": -11.964460372924805, "global_step": 267981, "epoch": 1595} {"train_loss": -11.798118591308594, "global_step": 267982, "epoch": 1595} {"train_loss": -12.067676544189453, "global_step": 267983, "epoch": 1595} {"train_loss": -11.696735382080078, "global_step": 267984, "epoch": 1595} {"train_loss": -12.14901065826416, "global_step": 267985, "epoch": 1595} {"train_loss": -11.784688949584961, "global_step": 267986, "epoch": 1595} {"train_loss": -12.097458839416504, "global_step": 267987, "epoch": 1595} {"train_loss": -11.657539367675781, "global_step": 267988, "epoch": 1595} {"train_loss": -12.082881927490234, "global_step": 267989, "epoch": 1595} {"train_loss": -11.735679626464844, "global_step": 267990, "epoch": 1595} {"train_loss": -11.597376823425293, "global_step": 267991, "epoch": 1595} {"train_loss": -12.08253288269043, "global_step": 267992, "epoch": 1595} {"train_loss": -11.208330154418945, "global_step": 267993, "epoch": 1595} {"train_loss": -12.137225151062012, "global_step": 267994, "epoch": 1595} {"train_loss": -11.515443801879883, "global_step": 267995, "epoch": 1595} {"train_loss": -11.973791122436523, "global_step": 267996, "epoch": 1595} {"train_loss": -11.504644393920898, "global_step": 267997, "epoch": 1595} {"train_loss": -11.427499771118164, "global_step": 267998, "epoch": 1595} {"train_loss": -11.540470123291016, "global_step": 267999, "epoch": 1595} {"train_loss": -11.868169784545898, "global_step": 268000, "epoch": 1595} {"train_loss": -11.640823364257812, "global_step": 268001, "epoch": 1595} {"train_loss": -11.584431648254395, "global_step": 268002, "epoch": 1595} {"train_loss": -11.984292030334473, "global_step": 268003, "epoch": 1595} {"train_loss": -12.043450355529785, "global_step": 268004, "epoch": 1595} {"train_loss": -11.950443267822266, "global_step": 268005, "epoch": 1595} {"train_loss": -11.698802947998047, "global_step": 268006, "epoch": 1595} {"train_loss": -12.063244819641113, "global_step": 268007, "epoch": 1595} {"train_loss": -11.838247299194336, "global_step": 268008, "epoch": 1595} {"train_loss": -11.921628952026367, "global_step": 268009, "epoch": 1595} {"train_loss": -12.309194564819336, "global_step": 268010, "epoch": 1595} {"train_loss": -12.01690673828125, "global_step": 268011, "epoch": 1595} {"train_loss": -12.166242599487305, "global_step": 268012, "epoch": 1595} {"train_loss": -12.00600814819336, "global_step": 268013, "epoch": 1595} {"train_loss": -12.08383846282959, "global_step": 268014, "epoch": 1595} {"train_loss": -12.126290321350098, "global_step": 268015, "epoch": 1595} {"train_loss": -12.185997009277344, "global_step": 268016, "epoch": 1595} {"train_loss": -12.069150924682617, "global_step": 268017, "epoch": 1595} {"train_loss": -12.124269485473633, "global_step": 268018, "epoch": 1595} {"train_loss": -11.734935760498047, "global_step": 268019, "epoch": 1595} {"train_loss": -12.179936408996582, "global_step": 268020, "epoch": 1595} {"train_loss": -12.188858032226562, "global_step": 268021, "epoch": 1595} {"train_loss": -12.362310409545898, "global_step": 268022, "epoch": 1595} {"train_loss": -12.322026252746582, "global_step": 268023, "epoch": 1595} {"train_loss": -12.299528121948242, "global_step": 268024, "epoch": 1595} {"train_loss": -12.232598304748535, "global_step": 268025, "epoch": 1595} {"train_loss": -12.187322616577148, "global_step": 268026, "epoch": 1595} {"train_loss": -12.223905563354492, "global_step": 268027, "epoch": 1595} {"train_loss": -12.195213317871094, "global_step": 268028, "epoch": 1595} {"train_loss": -12.316600799560547, "global_step": 268029, "epoch": 1595} {"train_loss": -12.073759078979492, "global_step": 268030, "epoch": 1595} {"train_loss": -12.246313095092773, "global_step": 268031, "epoch": 1595} {"train_loss": -12.09141731262207, "global_step": 268032, "epoch": 1595} {"train_loss": -12.503255844116211, "global_step": 268033, "epoch": 1595} {"train_loss": -12.04241943359375, "global_step": 268034, "epoch": 1595} {"train_loss": -12.066953659057617, "global_step": 268035, "epoch": 1595} {"train_loss": -12.171717643737793, "global_step": 268036, "epoch": 1595} {"train_loss": -12.30213737487793, "global_step": 268037, "epoch": 1595} {"train_loss": -12.150951385498047, "global_step": 268038, "epoch": 1595} {"train_loss": -12.263823509216309, "global_step": 268039, "epoch": 1595} {"train_loss": -12.332149505615234, "global_step": 268040, "epoch": 1595} {"train_loss": -12.397560119628906, "global_step": 268041, "epoch": 1595} {"train_loss": -12.211341857910156, "global_step": 268042, "epoch": 1595} {"train_loss": -12.04254150390625, "global_step": 268043, "epoch": 1595} {"train_loss": -12.214516639709473, "global_step": 268044, "epoch": 1595} {"train_loss": -12.126182556152344, "global_step": 268045, "epoch": 1595} {"train_loss": -11.997568130493164, "global_step": 268046, "epoch": 1595} {"train_loss": -12.013971328735352, "global_step": 268047, "epoch": 1595} {"train_loss": -12.381829261779785, "global_step": 268048, "epoch": 1595} {"train_loss": -12.38687515258789, "global_step": 268049, "epoch": 1595} {"train_loss": -12.106218338012695, "global_step": 268050, "epoch": 1595} {"train_loss": -11.934986114501953, "global_step": 268051, "epoch": 1595} {"train_loss": -12.356439590454102, "global_step": 268052, "epoch": 1595} {"train_loss": -12.032320976257324, "global_step": 268053, "epoch": 1595} {"train_loss": -10.400960922241211, "global_step": 268054, "epoch": 1595} {"train_loss": -10.290849685668945, "global_step": 268055, "epoch": 1595} {"train_loss": -11.75429916381836, "global_step": 268056, "epoch": 1595} {"train_loss": -10.676939010620117, "global_step": 268057, "epoch": 1595} {"train_loss": -11.07221508026123, "global_step": 268058, "epoch": 1595} {"train_loss": -10.702188491821289, "global_step": 268059, "epoch": 1595} {"train_loss": -11.796236038208008, "global_step": 268060, "epoch": 1595} {"train_loss": -9.975964546203613, "global_step": 268061, "epoch": 1595} {"train_loss": -9.4845552444458, "global_step": 268062, "epoch": 1595} {"train_loss": -10.00109577178955, "global_step": 268063, "epoch": 1595} {"train_loss": -8.81378173828125, "global_step": 268064, "epoch": 1595} {"train_loss": -8.524931907653809, "global_step": 268065, "epoch": 1595} {"train_loss": -5.7501678466796875, "global_step": 268066, "epoch": 1595} {"train_loss": -7.08607292175293, "global_step": 268067, "epoch": 1595} {"train_loss": -7.423964023590088, "global_step": 268068, "epoch": 1595} {"train_loss": -8.813410758972168, "global_step": 268069, "epoch": 1595} {"train_loss": -9.440754890441895, "global_step": 268070, "epoch": 1595} {"train_loss": -7.387879371643066, "global_step": 268071, "epoch": 1595} {"train_loss": -8.654958724975586, "global_step": 268072, "epoch": 1595} {"train_loss": -7.641552448272705, "global_step": 268073, "epoch": 1595} {"train_loss": -9.587602615356445, "global_step": 268074, "epoch": 1595} {"train_loss": -10.078781127929688, "global_step": 268075, "epoch": 1595} {"train_loss": -9.968390464782715, "global_step": 268076, "epoch": 1595} {"train_loss": -9.921686172485352, "global_step": 268077, "epoch": 1595} {"train_loss": -10.075167655944824, "global_step": 268078, "epoch": 1595} {"train_loss": -9.872713088989258, "global_step": 268079, "epoch": 1595} {"train_loss": -8.862548828125, "global_step": 268080, "epoch": 1595} {"train_loss": -10.429960250854492, "global_step": 268081, "epoch": 1595} {"train_loss": -8.808094024658203, "global_step": 268082, "epoch": 1595} {"train_loss": -10.938202857971191, "global_step": 268083, "epoch": 1595} {"train_loss": -10.005800247192383, "global_step": 268084, "epoch": 1595} {"train_loss": -9.60621452331543, "global_step": 268085, "epoch": 1595} {"train_loss": -10.64997386932373, "global_step": 268086, "epoch": 1595} {"train_loss": -9.989557266235352, "global_step": 268087, "epoch": 1595} {"train_loss": -11.144278526306152, "global_step": 268088, "epoch": 1595} {"train_loss": -10.006229400634766, "global_step": 268089, "epoch": 1595} {"train_loss": -10.82815933227539, "global_step": 268090, "epoch": 1595} {"train_loss": -10.508705139160156, "global_step": 268091, "epoch": 1595} {"train_loss": -10.66375732421875, "global_step": 268092, "epoch": 1595} {"train_loss": -11.053926467895508, "global_step": 268093, "epoch": 1595} {"train_loss": -10.845306396484375, "global_step": 268094, "epoch": 1595} {"train_loss": -10.817729949951172, "global_step": 268095, "epoch": 1595} {"train_loss": -11.034866333007812, "global_step": 268096, "epoch": 1595} {"train_loss": -10.666145324707031, "global_step": 268097, "epoch": 1595} {"train_loss": -10.946022987365723, "global_step": 268098, "epoch": 1595} {"train_loss": -11.3426513671875, "global_step": 268099, "epoch": 1595} {"train_loss": -11.247276306152344, "global_step": 268100, "epoch": 1595} {"train_loss": -11.379684448242188, "global_step": 268101, "epoch": 1595} {"train_loss": -11.55581283569336, "global_step": 268102, "epoch": 1595} {"train_loss": -11.473172187805176, "global_step": 268103, "epoch": 1595} {"train_loss": -11.387114524841309, "global_step": 268104, "epoch": 1595} {"train_loss": -11.365304946899414, "global_step": 268105, "epoch": 1595} {"train_loss": -11.52938461303711, "global_step": 268106, "epoch": 1595} {"train_loss": -11.353374481201172, "global_step": 268107, "epoch": 1595} {"train_loss": -11.564050674438477, "global_step": 268108, "epoch": 1595} {"train_loss": -11.569825172424316, "global_step": 268109, "epoch": 1595} {"train_loss": -11.467828750610352, "global_step": 268110, "epoch": 1595} {"train_loss": -11.591901779174805, "global_step": 268111, "epoch": 1595} {"train_loss": -11.585470199584961, "global_step": 268112, "epoch": 1595} {"train_loss": -11.520079612731934, "global_step": 268113, "epoch": 1595} {"train_loss": -11.676389694213867, "global_step": 268114, "epoch": 1595} {"train_loss": -11.602926254272461, "global_step": 268115, "epoch": 1595} {"train_loss": -11.650291442871094, "global_step": 268116, "epoch": 1595} {"train_loss": -11.804094314575195, "global_step": 268117, "epoch": 1595} {"train_loss": -11.480457305908203, "global_step": 268118, "epoch": 1595} {"train_loss": -11.642190933227539, "global_step": 268119, "epoch": 1595} {"train_loss": -11.570076942443848, "global_step": 268120, "epoch": 1595} {"train_loss": -11.64467716217041, "global_step": 268121, "epoch": 1595} {"train_loss": -11.458661079406738, "global_step": 268122, "epoch": 1595} {"train_loss": -11.761821746826172, "global_step": 268123, "epoch": 1595} {"train_loss": -11.733085632324219, "global_step": 268124, "epoch": 1595} {"train_loss": -11.68517017364502, "global_step": 268125, "epoch": 1595} {"train_loss": -11.779821395874023, "global_step": 268126, "epoch": 1595} {"train_loss": -11.322900073868889, "global_step": 268127, "epoch": 1595, "val_loss": 268777.375, "train_action_mse_error": 1.3056424856185913} {"train_loss": -11.603309631347656, "global_step": 268128, "epoch": 1596} {"train_loss": -11.707136154174805, "global_step": 268129, "epoch": 1596} {"train_loss": -11.658581733703613, "global_step": 268130, "epoch": 1596} {"train_loss": -11.705168724060059, "global_step": 268131, "epoch": 1596} {"train_loss": -12.023759841918945, "global_step": 268132, "epoch": 1596} {"train_loss": -11.827047348022461, "global_step": 268133, "epoch": 1596} {"train_loss": -11.789152145385742, "global_step": 268134, "epoch": 1596} {"train_loss": -11.91529655456543, "global_step": 268135, "epoch": 1596} {"train_loss": -11.905485153198242, "global_step": 268136, "epoch": 1596} {"train_loss": -11.789456367492676, "global_step": 268137, "epoch": 1596} {"train_loss": -11.703516006469727, "global_step": 268138, "epoch": 1596} {"train_loss": -11.917282104492188, "global_step": 268139, "epoch": 1596} {"train_loss": -11.773293495178223, "global_step": 268140, "epoch": 1596} {"train_loss": -12.010746955871582, "global_step": 268141, "epoch": 1596} {"train_loss": -11.734868049621582, "global_step": 268142, "epoch": 1596} {"train_loss": -11.967781066894531, "global_step": 268143, "epoch": 1596} {"train_loss": -12.06613540649414, "global_step": 268144, "epoch": 1596} {"train_loss": -12.074987411499023, "global_step": 268145, "epoch": 1596} {"train_loss": -12.027430534362793, "global_step": 268146, "epoch": 1596} {"train_loss": -12.069942474365234, "global_step": 268147, "epoch": 1596} {"train_loss": -12.126697540283203, "global_step": 268148, "epoch": 1596} {"train_loss": -11.884994506835938, "global_step": 268149, "epoch": 1596} {"train_loss": -12.036182403564453, "global_step": 268150, "epoch": 1596} {"train_loss": -12.110363006591797, "global_step": 268151, "epoch": 1596} {"train_loss": -12.02821159362793, "global_step": 268152, "epoch": 1596} {"train_loss": -12.099905014038086, "global_step": 268153, "epoch": 1596} {"train_loss": -12.10820198059082, "global_step": 268154, "epoch": 1596} {"train_loss": -12.104743957519531, "global_step": 268155, "epoch": 1596} {"train_loss": -12.092662811279297, "global_step": 268156, "epoch": 1596} {"train_loss": -11.858682632446289, "global_step": 268157, "epoch": 1596} {"train_loss": -12.147862434387207, "global_step": 268158, "epoch": 1596} {"train_loss": -12.161025047302246, "global_step": 268159, "epoch": 1596} {"train_loss": -12.183801651000977, "global_step": 268160, "epoch": 1596} {"train_loss": -12.136896133422852, "global_step": 268161, "epoch": 1596} {"train_loss": -12.188308715820312, "global_step": 268162, "epoch": 1596} {"train_loss": -12.263886451721191, "global_step": 268163, "epoch": 1596} {"train_loss": -12.293720245361328, "global_step": 268164, "epoch": 1596} {"train_loss": -12.374555587768555, "global_step": 268165, "epoch": 1596} {"train_loss": -12.308738708496094, "global_step": 268166, "epoch": 1596} {"train_loss": -12.109182357788086, "global_step": 268167, "epoch": 1596} {"train_loss": -12.24241828918457, "global_step": 268168, "epoch": 1596} {"train_loss": -12.101101875305176, "global_step": 268169, "epoch": 1596} {"train_loss": -12.203948974609375, "global_step": 268170, "epoch": 1596} {"train_loss": -12.366584777832031, "global_step": 268171, "epoch": 1596} {"train_loss": -12.237890243530273, "global_step": 268172, "epoch": 1596} {"train_loss": -12.308917999267578, "global_step": 268173, "epoch": 1596} {"train_loss": -12.027315139770508, "global_step": 268174, "epoch": 1596} {"train_loss": -12.060588836669922, "global_step": 268175, "epoch": 1596} {"train_loss": -12.25643253326416, "global_step": 268176, "epoch": 1596} {"train_loss": -12.241808891296387, "global_step": 268177, "epoch": 1596} {"train_loss": -12.270837783813477, "global_step": 268178, "epoch": 1596} {"train_loss": -12.118667602539062, "global_step": 268179, "epoch": 1596} {"train_loss": -12.314323425292969, "global_step": 268180, "epoch": 1596} {"train_loss": -12.034399032592773, "global_step": 268181, "epoch": 1596} {"train_loss": -12.236970901489258, "global_step": 268182, "epoch": 1596} {"train_loss": -12.288885116577148, "global_step": 268183, "epoch": 1596} {"train_loss": -12.487077713012695, "global_step": 268184, "epoch": 1596} {"train_loss": -12.05384635925293, "global_step": 268185, "epoch": 1596} {"train_loss": -12.196687698364258, "global_step": 268186, "epoch": 1596} {"train_loss": -12.438406944274902, "global_step": 268187, "epoch": 1596} {"train_loss": -12.105451583862305, "global_step": 268188, "epoch": 1596} {"train_loss": -12.148940086364746, "global_step": 268189, "epoch": 1596} {"train_loss": -12.384066581726074, "global_step": 268190, "epoch": 1596} {"train_loss": -12.052254676818848, "global_step": 268191, "epoch": 1596} {"train_loss": -11.95937442779541, "global_step": 268192, "epoch": 1596} {"train_loss": -11.88311767578125, "global_step": 268193, "epoch": 1596} {"train_loss": -12.177605628967285, "global_step": 268194, "epoch": 1596} {"train_loss": -11.984928131103516, "global_step": 268195, "epoch": 1596} {"train_loss": -12.30866527557373, "global_step": 268196, "epoch": 1596} {"train_loss": -12.237115859985352, "global_step": 268197, "epoch": 1596} {"train_loss": -12.36943244934082, "global_step": 268198, "epoch": 1596} {"train_loss": -12.057840347290039, "global_step": 268199, "epoch": 1596} {"train_loss": -11.45662784576416, "global_step": 268200, "epoch": 1596} {"train_loss": -11.808921813964844, "global_step": 268201, "epoch": 1596} {"train_loss": -11.978715896606445, "global_step": 268202, "epoch": 1596} {"train_loss": -10.47427749633789, "global_step": 268203, "epoch": 1596} {"train_loss": -11.472236633300781, "global_step": 268204, "epoch": 1596} {"train_loss": -11.504249572753906, "global_step": 268205, "epoch": 1596} {"train_loss": -11.045517921447754, "global_step": 268206, "epoch": 1596} {"train_loss": -10.167006492614746, "global_step": 268207, "epoch": 1596} {"train_loss": -11.868328094482422, "global_step": 268208, "epoch": 1596} {"train_loss": -11.403834342956543, "global_step": 268209, "epoch": 1596} {"train_loss": -11.104313850402832, "global_step": 268210, "epoch": 1596} {"train_loss": -11.230510711669922, "global_step": 268211, "epoch": 1596} {"train_loss": -11.511469841003418, "global_step": 268212, "epoch": 1596} {"train_loss": -11.853076934814453, "global_step": 268213, "epoch": 1596} {"train_loss": -11.482818603515625, "global_step": 268214, "epoch": 1596} {"train_loss": -11.79752254486084, "global_step": 268215, "epoch": 1596} {"train_loss": -11.72628402709961, "global_step": 268216, "epoch": 1596} {"train_loss": -11.043501853942871, "global_step": 268217, "epoch": 1596} {"train_loss": -11.23508071899414, "global_step": 268218, "epoch": 1596} {"train_loss": -11.610122680664062, "global_step": 268219, "epoch": 1596} {"train_loss": -11.304092407226562, "global_step": 268220, "epoch": 1596} {"train_loss": -11.766817092895508, "global_step": 268221, "epoch": 1596} {"train_loss": -11.585865020751953, "global_step": 268222, "epoch": 1596} {"train_loss": -11.661117553710938, "global_step": 268223, "epoch": 1596} {"train_loss": -11.53521728515625, "global_step": 268224, "epoch": 1596} {"train_loss": -11.223313331604004, "global_step": 268225, "epoch": 1596} {"train_loss": -11.586885452270508, "global_step": 268226, "epoch": 1596} {"train_loss": -11.625798225402832, "global_step": 268227, "epoch": 1596} {"train_loss": -11.335837364196777, "global_step": 268228, "epoch": 1596} {"train_loss": -11.532915115356445, "global_step": 268229, "epoch": 1596} {"train_loss": -11.154777526855469, "global_step": 268230, "epoch": 1596} {"train_loss": -11.624574661254883, "global_step": 268231, "epoch": 1596} {"train_loss": -11.332490921020508, "global_step": 268232, "epoch": 1596} {"train_loss": -11.568029403686523, "global_step": 268233, "epoch": 1596} {"train_loss": -11.488566398620605, "global_step": 268234, "epoch": 1596} {"train_loss": -11.477684020996094, "global_step": 268235, "epoch": 1596} {"train_loss": -11.231989860534668, "global_step": 268236, "epoch": 1596} {"train_loss": -11.290325164794922, "global_step": 268237, "epoch": 1596} {"train_loss": -10.294740676879883, "global_step": 268238, "epoch": 1596} {"train_loss": -11.558025360107422, "global_step": 268239, "epoch": 1596} {"train_loss": -11.35087776184082, "global_step": 268240, "epoch": 1596} {"train_loss": -11.623603820800781, "global_step": 268241, "epoch": 1596} {"train_loss": -11.073293685913086, "global_step": 268242, "epoch": 1596} {"train_loss": -10.56610107421875, "global_step": 268243, "epoch": 1596} {"train_loss": -11.083245277404785, "global_step": 268244, "epoch": 1596} {"train_loss": -9.710685729980469, "global_step": 268245, "epoch": 1596} {"train_loss": -11.819320678710938, "global_step": 268246, "epoch": 1596} {"train_loss": -9.437662124633789, "global_step": 268247, "epoch": 1596} {"train_loss": -11.748296737670898, "global_step": 268248, "epoch": 1596} {"train_loss": -9.703617095947266, "global_step": 268249, "epoch": 1596} {"train_loss": -11.504895210266113, "global_step": 268250, "epoch": 1596} {"train_loss": -10.101839065551758, "global_step": 268251, "epoch": 1596} {"train_loss": -11.418718338012695, "global_step": 268252, "epoch": 1596} {"train_loss": -11.283243179321289, "global_step": 268253, "epoch": 1596} {"train_loss": -11.3834228515625, "global_step": 268254, "epoch": 1596} {"train_loss": -11.512105941772461, "global_step": 268255, "epoch": 1596} {"train_loss": -11.235586166381836, "global_step": 268256, "epoch": 1596} {"train_loss": -11.62491226196289, "global_step": 268257, "epoch": 1596} {"train_loss": -11.196269989013672, "global_step": 268258, "epoch": 1596} {"train_loss": -11.75507640838623, "global_step": 268259, "epoch": 1596} {"train_loss": -11.488114356994629, "global_step": 268260, "epoch": 1596} {"train_loss": -11.280025482177734, "global_step": 268261, "epoch": 1596} {"train_loss": -11.860053062438965, "global_step": 268262, "epoch": 1596} {"train_loss": -11.233530044555664, "global_step": 268263, "epoch": 1596} {"train_loss": -11.745759963989258, "global_step": 268264, "epoch": 1596} {"train_loss": -11.708442687988281, "global_step": 268265, "epoch": 1596} {"train_loss": -11.755197525024414, "global_step": 268266, "epoch": 1596} {"train_loss": -11.908590316772461, "global_step": 268267, "epoch": 1596} {"train_loss": -11.77006721496582, "global_step": 268268, "epoch": 1596} {"train_loss": -12.014387130737305, "global_step": 268269, "epoch": 1596} {"train_loss": -11.867597579956055, "global_step": 268270, "epoch": 1596} {"train_loss": -12.185648918151855, "global_step": 268271, "epoch": 1596} {"train_loss": -11.826045989990234, "global_step": 268272, "epoch": 1596} {"train_loss": -11.964275360107422, "global_step": 268273, "epoch": 1596} {"train_loss": -11.902819633483887, "global_step": 268274, "epoch": 1596} {"train_loss": -11.98996353149414, "global_step": 268275, "epoch": 1596} {"train_loss": -11.83317756652832, "global_step": 268276, "epoch": 1596} {"train_loss": -11.974291801452637, "global_step": 268277, "epoch": 1596} {"train_loss": -11.740326881408691, "global_step": 268278, "epoch": 1596} {"train_loss": -11.76613712310791, "global_step": 268279, "epoch": 1596} {"train_loss": -11.865165710449219, "global_step": 268280, "epoch": 1596} {"train_loss": -11.54191780090332, "global_step": 268281, "epoch": 1596} {"train_loss": -12.047972679138184, "global_step": 268282, "epoch": 1596} {"train_loss": -11.693807601928711, "global_step": 268283, "epoch": 1596} {"train_loss": -11.877427101135254, "global_step": 268284, "epoch": 1596} {"train_loss": -11.849991798400879, "global_step": 268285, "epoch": 1596} {"train_loss": -11.629712104797363, "global_step": 268286, "epoch": 1596} {"train_loss": -11.97653579711914, "global_step": 268287, "epoch": 1596} {"train_loss": -11.696971893310547, "global_step": 268288, "epoch": 1596} {"train_loss": -11.798054695129395, "global_step": 268289, "epoch": 1596} {"train_loss": -11.680509567260742, "global_step": 268290, "epoch": 1596} {"train_loss": -11.86485481262207, "global_step": 268291, "epoch": 1596} {"train_loss": -11.465429306030273, "global_step": 268292, "epoch": 1596} {"train_loss": -12.143396377563477, "global_step": 268293, "epoch": 1596} {"train_loss": -11.461135864257812, "global_step": 268294, "epoch": 1596} {"train_loss": -11.733552694320679, "global_step": 268295, "epoch": 1596, "val_loss": 272837.5} {"train_loss": -11.793769836425781, "global_step": 268296, "epoch": 1597} {"train_loss": -11.736223220825195, "global_step": 268297, "epoch": 1597} {"train_loss": -11.811483383178711, "global_step": 268298, "epoch": 1597} {"train_loss": -11.646738052368164, "global_step": 268299, "epoch": 1597} {"train_loss": -11.613851547241211, "global_step": 268300, "epoch": 1597} {"train_loss": -11.684587478637695, "global_step": 268301, "epoch": 1597} {"train_loss": -10.993049621582031, "global_step": 268302, "epoch": 1597} {"train_loss": -11.97619915008545, "global_step": 268303, "epoch": 1597} {"train_loss": -10.896354675292969, "global_step": 268304, "epoch": 1597} {"train_loss": -11.646254539489746, "global_step": 268305, "epoch": 1597} {"train_loss": -11.097114562988281, "global_step": 268306, "epoch": 1597} {"train_loss": -11.15772819519043, "global_step": 268307, "epoch": 1597} {"train_loss": -11.118895530700684, "global_step": 268308, "epoch": 1597} {"train_loss": -11.33273696899414, "global_step": 268309, "epoch": 1597} {"train_loss": -11.543107986450195, "global_step": 268310, "epoch": 1597} {"train_loss": -11.449978828430176, "global_step": 268311, "epoch": 1597} {"train_loss": -11.686870574951172, "global_step": 268312, "epoch": 1597} {"train_loss": -10.927337646484375, "global_step": 268313, "epoch": 1597} {"train_loss": -11.616800308227539, "global_step": 268314, "epoch": 1597} {"train_loss": -11.443832397460938, "global_step": 268315, "epoch": 1597} {"train_loss": -11.718854904174805, "global_step": 268316, "epoch": 1597} {"train_loss": -11.583246231079102, "global_step": 268317, "epoch": 1597} {"train_loss": -11.623759269714355, "global_step": 268318, "epoch": 1597} {"train_loss": -11.62474250793457, "global_step": 268319, "epoch": 1597} {"train_loss": -11.67905044555664, "global_step": 268320, "epoch": 1597} {"train_loss": -11.412402153015137, "global_step": 268321, "epoch": 1597} {"train_loss": -11.816911697387695, "global_step": 268322, "epoch": 1597} {"train_loss": -11.386075019836426, "global_step": 268323, "epoch": 1597} {"train_loss": -11.633770942687988, "global_step": 268324, "epoch": 1597} {"train_loss": -11.646374702453613, "global_step": 268325, "epoch": 1597} {"train_loss": -11.786611557006836, "global_step": 268326, "epoch": 1597} {"train_loss": -11.595331192016602, "global_step": 268327, "epoch": 1597} {"train_loss": -11.94318675994873, "global_step": 268328, "epoch": 1597} {"train_loss": -11.919638633728027, "global_step": 268329, "epoch": 1597} {"train_loss": -11.510747909545898, "global_step": 268330, "epoch": 1597} {"train_loss": -11.947778701782227, "global_step": 268331, "epoch": 1597} {"train_loss": -11.51026439666748, "global_step": 268332, "epoch": 1597} {"train_loss": -12.182459831237793, "global_step": 268333, "epoch": 1597} {"train_loss": -11.747934341430664, "global_step": 268334, "epoch": 1597} {"train_loss": -12.120264053344727, "global_step": 268335, "epoch": 1597} {"train_loss": -11.988229751586914, "global_step": 268336, "epoch": 1597} {"train_loss": -11.932228088378906, "global_step": 268337, "epoch": 1597} {"train_loss": -11.988149642944336, "global_step": 268338, "epoch": 1597} {"train_loss": -11.756685256958008, "global_step": 268339, "epoch": 1597} {"train_loss": -11.986335754394531, "global_step": 268340, "epoch": 1597} {"train_loss": -12.029481887817383, "global_step": 268341, "epoch": 1597} {"train_loss": -11.954427719116211, "global_step": 268342, "epoch": 1597} {"train_loss": -11.872138977050781, "global_step": 268343, "epoch": 1597} {"train_loss": -12.064796447753906, "global_step": 268344, "epoch": 1597} {"train_loss": -11.956622123718262, "global_step": 268345, "epoch": 1597} {"train_loss": -11.928144454956055, "global_step": 268346, "epoch": 1597} {"train_loss": -11.958259582519531, "global_step": 268347, "epoch": 1597} {"train_loss": -11.83592414855957, "global_step": 268348, "epoch": 1597} {"train_loss": -11.934019088745117, "global_step": 268349, "epoch": 1597} {"train_loss": -11.973424911499023, "global_step": 268350, "epoch": 1597} {"train_loss": -12.09183120727539, "global_step": 268351, "epoch": 1597} {"train_loss": -12.03549861907959, "global_step": 268352, "epoch": 1597} {"train_loss": -12.230833053588867, "global_step": 268353, "epoch": 1597} {"train_loss": -12.186986923217773, "global_step": 268354, "epoch": 1597} {"train_loss": -12.077306747436523, "global_step": 268355, "epoch": 1597} {"train_loss": -12.161432266235352, "global_step": 268356, "epoch": 1597} {"train_loss": -12.098844528198242, "global_step": 268357, "epoch": 1597} {"train_loss": -12.14783000946045, "global_step": 268358, "epoch": 1597} {"train_loss": -12.08849048614502, "global_step": 268359, "epoch": 1597} {"train_loss": -11.95554256439209, "global_step": 268360, "epoch": 1597} {"train_loss": -11.875555992126465, "global_step": 268361, "epoch": 1597} {"train_loss": -11.931529998779297, "global_step": 268362, "epoch": 1597} {"train_loss": -12.156057357788086, "global_step": 268363, "epoch": 1597} {"train_loss": -11.828115463256836, "global_step": 268364, "epoch": 1597} {"train_loss": -12.320212364196777, "global_step": 268365, "epoch": 1597} {"train_loss": -11.891887664794922, "global_step": 268366, "epoch": 1597} {"train_loss": -12.194692611694336, "global_step": 268367, "epoch": 1597} {"train_loss": -11.85169506072998, "global_step": 268368, "epoch": 1597} {"train_loss": -12.251877784729004, "global_step": 268369, "epoch": 1597} {"train_loss": -12.083329200744629, "global_step": 268370, "epoch": 1597} {"train_loss": -11.786285400390625, "global_step": 268371, "epoch": 1597} {"train_loss": -12.058815956115723, "global_step": 268372, "epoch": 1597} {"train_loss": -11.533700942993164, "global_step": 268373, "epoch": 1597} {"train_loss": -11.210763931274414, "global_step": 268374, "epoch": 1597} {"train_loss": -11.488931655883789, "global_step": 268375, "epoch": 1597} {"train_loss": -12.035568237304688, "global_step": 268376, "epoch": 1597} {"train_loss": -11.518241882324219, "global_step": 268377, "epoch": 1597} {"train_loss": -11.325794219970703, "global_step": 268378, "epoch": 1597} {"train_loss": -12.071456909179688, "global_step": 268379, "epoch": 1597} {"train_loss": -11.860185623168945, "global_step": 268380, "epoch": 1597} {"train_loss": -11.556760787963867, "global_step": 268381, "epoch": 1597} {"train_loss": -11.803901672363281, "global_step": 268382, "epoch": 1597} {"train_loss": -12.234966278076172, "global_step": 268383, "epoch": 1597} {"train_loss": -11.199745178222656, "global_step": 268384, "epoch": 1597} {"train_loss": -10.36384105682373, "global_step": 268385, "epoch": 1597} {"train_loss": -10.107513427734375, "global_step": 268386, "epoch": 1597} {"train_loss": -11.616410255432129, "global_step": 268387, "epoch": 1597} {"train_loss": -10.914714813232422, "global_step": 268388, "epoch": 1597} {"train_loss": -11.357330322265625, "global_step": 268389, "epoch": 1597} {"train_loss": -10.430774688720703, "global_step": 268390, "epoch": 1597} {"train_loss": -10.468488693237305, "global_step": 268391, "epoch": 1597} {"train_loss": -10.607738494873047, "global_step": 268392, "epoch": 1597} {"train_loss": -9.079763412475586, "global_step": 268393, "epoch": 1597} {"train_loss": -9.857526779174805, "global_step": 268394, "epoch": 1597} {"train_loss": -10.137521743774414, "global_step": 268395, "epoch": 1597} {"train_loss": -11.109649658203125, "global_step": 268396, "epoch": 1597} {"train_loss": -10.859977722167969, "global_step": 268397, "epoch": 1597} {"train_loss": -10.982406616210938, "global_step": 268398, "epoch": 1597} {"train_loss": -11.445448875427246, "global_step": 268399, "epoch": 1597} {"train_loss": -11.744720458984375, "global_step": 268400, "epoch": 1597} {"train_loss": -11.240335464477539, "global_step": 268401, "epoch": 1597} {"train_loss": -11.762256622314453, "global_step": 268402, "epoch": 1597} {"train_loss": -10.939409255981445, "global_step": 268403, "epoch": 1597} {"train_loss": -10.93191909790039, "global_step": 268404, "epoch": 1597} {"train_loss": -11.094741821289062, "global_step": 268405, "epoch": 1597} {"train_loss": -10.553098678588867, "global_step": 268406, "epoch": 1597} {"train_loss": -11.007454872131348, "global_step": 268407, "epoch": 1597} {"train_loss": -10.421478271484375, "global_step": 268408, "epoch": 1597} {"train_loss": -11.188558578491211, "global_step": 268409, "epoch": 1597} {"train_loss": -11.042893409729004, "global_step": 268410, "epoch": 1597} {"train_loss": -10.786648750305176, "global_step": 268411, "epoch": 1597} {"train_loss": -11.57937240600586, "global_step": 268412, "epoch": 1597} {"train_loss": -11.08538818359375, "global_step": 268413, "epoch": 1597} {"train_loss": -10.838301658630371, "global_step": 268414, "epoch": 1597} {"train_loss": -11.669584274291992, "global_step": 268415, "epoch": 1597} {"train_loss": -11.146444320678711, "global_step": 268416, "epoch": 1597} {"train_loss": -11.09496784210205, "global_step": 268417, "epoch": 1597} {"train_loss": -11.632294654846191, "global_step": 268418, "epoch": 1597} {"train_loss": -11.289437294006348, "global_step": 268419, "epoch": 1597} {"train_loss": -11.782622337341309, "global_step": 268420, "epoch": 1597} {"train_loss": -11.701661109924316, "global_step": 268421, "epoch": 1597} {"train_loss": -11.563159942626953, "global_step": 268422, "epoch": 1597} {"train_loss": -11.802923202514648, "global_step": 268423, "epoch": 1597} {"train_loss": -11.71672248840332, "global_step": 268424, "epoch": 1597} {"train_loss": -11.977774620056152, "global_step": 268425, "epoch": 1597} {"train_loss": -11.725471496582031, "global_step": 268426, "epoch": 1597} {"train_loss": -11.620317459106445, "global_step": 268427, "epoch": 1597} {"train_loss": -11.871309280395508, "global_step": 268428, "epoch": 1597} {"train_loss": -11.860636711120605, "global_step": 268429, "epoch": 1597} {"train_loss": -11.971370697021484, "global_step": 268430, "epoch": 1597} {"train_loss": -11.868298530578613, "global_step": 268431, "epoch": 1597} {"train_loss": -11.849006652832031, "global_step": 268432, "epoch": 1597} {"train_loss": -11.794538497924805, "global_step": 268433, "epoch": 1597} {"train_loss": -11.994280815124512, "global_step": 268434, "epoch": 1597} {"train_loss": -12.000442504882812, "global_step": 268435, "epoch": 1597} {"train_loss": -11.865962982177734, "global_step": 268436, "epoch": 1597} {"train_loss": -12.132466316223145, "global_step": 268437, "epoch": 1597} {"train_loss": -11.868335723876953, "global_step": 268438, "epoch": 1597} {"train_loss": -11.945589065551758, "global_step": 268439, "epoch": 1597} {"train_loss": -12.108678817749023, "global_step": 268440, "epoch": 1597} {"train_loss": -12.097458839416504, "global_step": 268441, "epoch": 1597} {"train_loss": -12.016791343688965, "global_step": 268442, "epoch": 1597} {"train_loss": -12.017602920532227, "global_step": 268443, "epoch": 1597} {"train_loss": -12.058520317077637, "global_step": 268444, "epoch": 1597} {"train_loss": -12.02786636352539, "global_step": 268445, "epoch": 1597} {"train_loss": -12.106049537658691, "global_step": 268446, "epoch": 1597} {"train_loss": -11.921098709106445, "global_step": 268447, "epoch": 1597} {"train_loss": -12.124709129333496, "global_step": 268448, "epoch": 1597} {"train_loss": -12.027767181396484, "global_step": 268449, "epoch": 1597} {"train_loss": -11.941394805908203, "global_step": 268450, "epoch": 1597} {"train_loss": -11.913156509399414, "global_step": 268451, "epoch": 1597} {"train_loss": -12.154780387878418, "global_step": 268452, "epoch": 1597} {"train_loss": -12.113004684448242, "global_step": 268453, "epoch": 1597} {"train_loss": -11.938740730285645, "global_step": 268454, "epoch": 1597} {"train_loss": -11.739019393920898, "global_step": 268455, "epoch": 1597} {"train_loss": -11.85273265838623, "global_step": 268456, "epoch": 1597} {"train_loss": -12.107758522033691, "global_step": 268457, "epoch": 1597} {"train_loss": -11.911540985107422, "global_step": 268458, "epoch": 1597} {"train_loss": -12.206329345703125, "global_step": 268459, "epoch": 1597} {"train_loss": -11.982513427734375, "global_step": 268460, "epoch": 1597} {"train_loss": -12.081565856933594, "global_step": 268461, "epoch": 1597} {"train_loss": -11.97012710571289, "global_step": 268462, "epoch": 1597} {"train_loss": -11.639479688235692, "global_step": 268463, "epoch": 1597, "val_loss": 273824.5} {"train_loss": -12.016242027282715, "global_step": 268464, "epoch": 1598} {"train_loss": -12.068904876708984, "global_step": 268465, "epoch": 1598} {"train_loss": -12.418159484863281, "global_step": 268466, "epoch": 1598} {"train_loss": -12.00103759765625, "global_step": 268467, "epoch": 1598} {"train_loss": -12.276141166687012, "global_step": 268468, "epoch": 1598} {"train_loss": -12.194143295288086, "global_step": 268469, "epoch": 1598} {"train_loss": -11.818735122680664, "global_step": 268470, "epoch": 1598} {"train_loss": -12.161142349243164, "global_step": 268471, "epoch": 1598} {"train_loss": -12.199126243591309, "global_step": 268472, "epoch": 1598} {"train_loss": -11.82497787475586, "global_step": 268473, "epoch": 1598} {"train_loss": -11.900191307067871, "global_step": 268474, "epoch": 1598} {"train_loss": -11.591791152954102, "global_step": 268475, "epoch": 1598} {"train_loss": -12.19166374206543, "global_step": 268476, "epoch": 1598} {"train_loss": -12.17365550994873, "global_step": 268477, "epoch": 1598} {"train_loss": -12.132731437683105, "global_step": 268478, "epoch": 1598} {"train_loss": -11.989030838012695, "global_step": 268479, "epoch": 1598} {"train_loss": -11.990250587463379, "global_step": 268480, "epoch": 1598} {"train_loss": -11.99502944946289, "global_step": 268481, "epoch": 1598} {"train_loss": -11.776712417602539, "global_step": 268482, "epoch": 1598} {"train_loss": -12.383834838867188, "global_step": 268483, "epoch": 1598} {"train_loss": -12.086009979248047, "global_step": 268484, "epoch": 1598} {"train_loss": -12.145841598510742, "global_step": 268485, "epoch": 1598} {"train_loss": -12.249262809753418, "global_step": 268486, "epoch": 1598} {"train_loss": -12.341791152954102, "global_step": 268487, "epoch": 1598} {"train_loss": -12.43402099609375, "global_step": 268488, "epoch": 1598} {"train_loss": -12.245967864990234, "global_step": 268489, "epoch": 1598} {"train_loss": -12.121089935302734, "global_step": 268490, "epoch": 1598} {"train_loss": -11.878347396850586, "global_step": 268491, "epoch": 1598} {"train_loss": -11.966187477111816, "global_step": 268492, "epoch": 1598} {"train_loss": -12.140474319458008, "global_step": 268493, "epoch": 1598} {"train_loss": -12.048334121704102, "global_step": 268494, "epoch": 1598} {"train_loss": -11.931007385253906, "global_step": 268495, "epoch": 1598} {"train_loss": -11.82397747039795, "global_step": 268496, "epoch": 1598} {"train_loss": -12.276853561401367, "global_step": 268497, "epoch": 1598} {"train_loss": -12.09544563293457, "global_step": 268498, "epoch": 1598} {"train_loss": -11.387367248535156, "global_step": 268499, "epoch": 1598} {"train_loss": -11.195878982543945, "global_step": 268500, "epoch": 1598} {"train_loss": -11.827187538146973, "global_step": 268501, "epoch": 1598} {"train_loss": -11.394826889038086, "global_step": 268502, "epoch": 1598} {"train_loss": -10.628854751586914, "global_step": 268503, "epoch": 1598} {"train_loss": -10.991659164428711, "global_step": 268504, "epoch": 1598} {"train_loss": -10.134138107299805, "global_step": 268505, "epoch": 1598} {"train_loss": -9.498183250427246, "global_step": 268506, "epoch": 1598} {"train_loss": -10.9042329788208, "global_step": 268507, "epoch": 1598} {"train_loss": -8.748434066772461, "global_step": 268508, "epoch": 1598} {"train_loss": -9.085914611816406, "global_step": 268509, "epoch": 1598} {"train_loss": -9.926839828491211, "global_step": 268510, "epoch": 1598} {"train_loss": -8.800127983093262, "global_step": 268511, "epoch": 1598} {"train_loss": -8.153827667236328, "global_step": 268512, "epoch": 1598} {"train_loss": -6.395878791809082, "global_step": 268513, "epoch": 1598} {"train_loss": -7.614267826080322, "global_step": 268514, "epoch": 1598} {"train_loss": -7.280633449554443, "global_step": 268515, "epoch": 1598} {"train_loss": -6.840250492095947, "global_step": 268516, "epoch": 1598} {"train_loss": -8.546299934387207, "global_step": 268517, "epoch": 1598} {"train_loss": -9.105061531066895, "global_step": 268518, "epoch": 1598} {"train_loss": -8.745445251464844, "global_step": 268519, "epoch": 1598} {"train_loss": -9.238901138305664, "global_step": 268520, "epoch": 1598} {"train_loss": -9.148004531860352, "global_step": 268521, "epoch": 1598} {"train_loss": -10.962648391723633, "global_step": 268522, "epoch": 1598} {"train_loss": -9.346944808959961, "global_step": 268523, "epoch": 1598} {"train_loss": -10.372136116027832, "global_step": 268524, "epoch": 1598} {"train_loss": -9.387365341186523, "global_step": 268525, "epoch": 1598} {"train_loss": -10.381285667419434, "global_step": 268526, "epoch": 1598} {"train_loss": -9.663883209228516, "global_step": 268527, "epoch": 1598} {"train_loss": -10.879410743713379, "global_step": 268528, "epoch": 1598} {"train_loss": -9.5376558303833, "global_step": 268529, "epoch": 1598} {"train_loss": -10.466581344604492, "global_step": 268530, "epoch": 1598} {"train_loss": -10.384586334228516, "global_step": 268531, "epoch": 1598} {"train_loss": -9.69670295715332, "global_step": 268532, "epoch": 1598} {"train_loss": -11.203516006469727, "global_step": 268533, "epoch": 1598} {"train_loss": -10.801046371459961, "global_step": 268534, "epoch": 1598} {"train_loss": -9.621423721313477, "global_step": 268535, "epoch": 1598} {"train_loss": -11.209311485290527, "global_step": 268536, "epoch": 1598} {"train_loss": -10.367700576782227, "global_step": 268537, "epoch": 1598} {"train_loss": -11.03834342956543, "global_step": 268538, "epoch": 1598} {"train_loss": -10.938165664672852, "global_step": 268539, "epoch": 1598} {"train_loss": -10.965045928955078, "global_step": 268540, "epoch": 1598} {"train_loss": -11.096818923950195, "global_step": 268541, "epoch": 1598} {"train_loss": -11.005544662475586, "global_step": 268542, "epoch": 1598} {"train_loss": -11.35932731628418, "global_step": 268543, "epoch": 1598} {"train_loss": -11.098749160766602, "global_step": 268544, "epoch": 1598} {"train_loss": -10.972221374511719, "global_step": 268545, "epoch": 1598} {"train_loss": -11.222294807434082, "global_step": 268546, "epoch": 1598} {"train_loss": -11.042186737060547, "global_step": 268547, "epoch": 1598} {"train_loss": -11.73654842376709, "global_step": 268548, "epoch": 1598} {"train_loss": -11.222612380981445, "global_step": 268549, "epoch": 1598} {"train_loss": -11.145135879516602, "global_step": 268550, "epoch": 1598} {"train_loss": -11.271944046020508, "global_step": 268551, "epoch": 1598} {"train_loss": -11.559572219848633, "global_step": 268552, "epoch": 1598} {"train_loss": -11.123939514160156, "global_step": 268553, "epoch": 1598} {"train_loss": -11.302122116088867, "global_step": 268554, "epoch": 1598} {"train_loss": -11.690679550170898, "global_step": 268555, "epoch": 1598} {"train_loss": -11.518230438232422, "global_step": 268556, "epoch": 1598} {"train_loss": -11.381799697875977, "global_step": 268557, "epoch": 1598} {"train_loss": -11.544740676879883, "global_step": 268558, "epoch": 1598} {"train_loss": -11.653063774108887, "global_step": 268559, "epoch": 1598} {"train_loss": -11.490324020385742, "global_step": 268560, "epoch": 1598} {"train_loss": -11.532295227050781, "global_step": 268561, "epoch": 1598} {"train_loss": -11.823304176330566, "global_step": 268562, "epoch": 1598} {"train_loss": -11.645572662353516, "global_step": 268563, "epoch": 1598} {"train_loss": -11.578964233398438, "global_step": 268564, "epoch": 1598} {"train_loss": -11.881994247436523, "global_step": 268565, "epoch": 1598} {"train_loss": -11.813074111938477, "global_step": 268566, "epoch": 1598} {"train_loss": -11.623739242553711, "global_step": 268567, "epoch": 1598} {"train_loss": -11.861132621765137, "global_step": 268568, "epoch": 1598} {"train_loss": -11.854673385620117, "global_step": 268569, "epoch": 1598} {"train_loss": -11.528669357299805, "global_step": 268570, "epoch": 1598} {"train_loss": -11.741130828857422, "global_step": 268571, "epoch": 1598} {"train_loss": -11.934865951538086, "global_step": 268572, "epoch": 1598} {"train_loss": -11.826065063476562, "global_step": 268573, "epoch": 1598} {"train_loss": -11.773893356323242, "global_step": 268574, "epoch": 1598} {"train_loss": -11.870384216308594, "global_step": 268575, "epoch": 1598} {"train_loss": -11.974664688110352, "global_step": 268576, "epoch": 1598} {"train_loss": -11.822929382324219, "global_step": 268577, "epoch": 1598} {"train_loss": -11.79636001586914, "global_step": 268578, "epoch": 1598} {"train_loss": -11.805015563964844, "global_step": 268579, "epoch": 1598} {"train_loss": -11.872791290283203, "global_step": 268580, "epoch": 1598} {"train_loss": -11.924217224121094, "global_step": 268581, "epoch": 1598} {"train_loss": -11.937888145446777, "global_step": 268582, "epoch": 1598} {"train_loss": -11.952232360839844, "global_step": 268583, "epoch": 1598} {"train_loss": -11.981878280639648, "global_step": 268584, "epoch": 1598} {"train_loss": -11.796296119689941, "global_step": 268585, "epoch": 1598} {"train_loss": -11.98836898803711, "global_step": 268586, "epoch": 1598} {"train_loss": -12.030020713806152, "global_step": 268587, "epoch": 1598} {"train_loss": -12.046850204467773, "global_step": 268588, "epoch": 1598} {"train_loss": -12.101299285888672, "global_step": 268589, "epoch": 1598} {"train_loss": -12.051573753356934, "global_step": 268590, "epoch": 1598} {"train_loss": -12.054115295410156, "global_step": 268591, "epoch": 1598} {"train_loss": -12.01568603515625, "global_step": 268592, "epoch": 1598} {"train_loss": -12.175504684448242, "global_step": 268593, "epoch": 1598} {"train_loss": -12.285544395446777, "global_step": 268594, "epoch": 1598} {"train_loss": -12.017425537109375, "global_step": 268595, "epoch": 1598} {"train_loss": -12.148893356323242, "global_step": 268596, "epoch": 1598} {"train_loss": -12.133923530578613, "global_step": 268597, "epoch": 1598} {"train_loss": -11.94157600402832, "global_step": 268598, "epoch": 1598} {"train_loss": -12.122404098510742, "global_step": 268599, "epoch": 1598} {"train_loss": -11.950332641601562, "global_step": 268600, "epoch": 1598} {"train_loss": -12.143733978271484, "global_step": 268601, "epoch": 1598} {"train_loss": -12.18641471862793, "global_step": 268602, "epoch": 1598} {"train_loss": -12.109806060791016, "global_step": 268603, "epoch": 1598} {"train_loss": -12.266888618469238, "global_step": 268604, "epoch": 1598} {"train_loss": -12.29832649230957, "global_step": 268605, "epoch": 1598} {"train_loss": -12.266029357910156, "global_step": 268606, "epoch": 1598} {"train_loss": -12.28622055053711, "global_step": 268607, "epoch": 1598} {"train_loss": -12.3483247756958, "global_step": 268608, "epoch": 1598} {"train_loss": -12.28131103515625, "global_step": 268609, "epoch": 1598} {"train_loss": -12.246444702148438, "global_step": 268610, "epoch": 1598} {"train_loss": -12.366920471191406, "global_step": 268611, "epoch": 1598} {"train_loss": -12.132793426513672, "global_step": 268612, "epoch": 1598} {"train_loss": -12.372713088989258, "global_step": 268613, "epoch": 1598} {"train_loss": -12.411293983459473, "global_step": 268614, "epoch": 1598} {"train_loss": -12.524863243103027, "global_step": 268615, "epoch": 1598} {"train_loss": -12.228595733642578, "global_step": 268616, "epoch": 1598} {"train_loss": -12.231435775756836, "global_step": 268617, "epoch": 1598} {"train_loss": -12.348875045776367, "global_step": 268618, "epoch": 1598} {"train_loss": -12.295965194702148, "global_step": 268619, "epoch": 1598} {"train_loss": -12.510777473449707, "global_step": 268620, "epoch": 1598} {"train_loss": -12.404495239257812, "global_step": 268621, "epoch": 1598} {"train_loss": -12.185861587524414, "global_step": 268622, "epoch": 1598} {"train_loss": -12.310234069824219, "global_step": 268623, "epoch": 1598} {"train_loss": -12.337268829345703, "global_step": 268624, "epoch": 1598} {"train_loss": -12.190410614013672, "global_step": 268625, "epoch": 1598} {"train_loss": -12.190345764160156, "global_step": 268626, "epoch": 1598} {"train_loss": -11.707270622253418, "global_step": 268627, "epoch": 1598} {"train_loss": -11.278572082519531, "global_step": 268628, "epoch": 1598} {"train_loss": -11.237532615661621, "global_step": 268629, "epoch": 1598} {"train_loss": -10.609243392944336, "global_step": 268630, "epoch": 1598} {"train_loss": -11.388700085026878, "global_step": 268631, "epoch": 1598, "val_loss": 262952.375} {"train_loss": -11.472612380981445, "global_step": 268632, "epoch": 1599} {"train_loss": -11.789796829223633, "global_step": 268633, "epoch": 1599} {"train_loss": -12.057391166687012, "global_step": 268634, "epoch": 1599} {"train_loss": -12.021207809448242, "global_step": 268635, "epoch": 1599} {"train_loss": -11.843666076660156, "global_step": 268636, "epoch": 1599} {"train_loss": -12.156522750854492, "global_step": 268637, "epoch": 1599} {"train_loss": -11.303781509399414, "global_step": 268638, "epoch": 1599} {"train_loss": -12.291084289550781, "global_step": 268639, "epoch": 1599} {"train_loss": -11.733306884765625, "global_step": 268640, "epoch": 1599} {"train_loss": -12.175941467285156, "global_step": 268641, "epoch": 1599} {"train_loss": -11.742630004882812, "global_step": 268642, "epoch": 1599} {"train_loss": -11.706692695617676, "global_step": 268643, "epoch": 1599} {"train_loss": -12.174362182617188, "global_step": 268644, "epoch": 1599} {"train_loss": -12.11180591583252, "global_step": 268645, "epoch": 1599} {"train_loss": -11.712726593017578, "global_step": 268646, "epoch": 1599} {"train_loss": -11.927757263183594, "global_step": 268647, "epoch": 1599} {"train_loss": -12.099702835083008, "global_step": 268648, "epoch": 1599} {"train_loss": -10.678831100463867, "global_step": 268649, "epoch": 1599} {"train_loss": -10.085489273071289, "global_step": 268650, "epoch": 1599} {"train_loss": -11.747228622436523, "global_step": 268651, "epoch": 1599} {"train_loss": -10.595352172851562, "global_step": 268652, "epoch": 1599} {"train_loss": -11.119132995605469, "global_step": 268653, "epoch": 1599} {"train_loss": -11.011202812194824, "global_step": 268654, "epoch": 1599} {"train_loss": -9.404345512390137, "global_step": 268655, "epoch": 1599} {"train_loss": -10.44209098815918, "global_step": 268656, "epoch": 1599} {"train_loss": -11.415512084960938, "global_step": 268657, "epoch": 1599} {"train_loss": -10.793703079223633, "global_step": 268658, "epoch": 1599} {"train_loss": -11.293571472167969, "global_step": 268659, "epoch": 1599} {"train_loss": -10.951417922973633, "global_step": 268660, "epoch": 1599} {"train_loss": -11.035104751586914, "global_step": 268661, "epoch": 1599} {"train_loss": -11.271669387817383, "global_step": 268662, "epoch": 1599} {"train_loss": -10.769909858703613, "global_step": 268663, "epoch": 1599} {"train_loss": -11.806999206542969, "global_step": 268664, "epoch": 1599} {"train_loss": -10.736494064331055, "global_step": 268665, "epoch": 1599} {"train_loss": -11.09121036529541, "global_step": 268666, "epoch": 1599} {"train_loss": -11.241853713989258, "global_step": 268667, "epoch": 1599} {"train_loss": -11.613203048706055, "global_step": 268668, "epoch": 1599} {"train_loss": -11.163867950439453, "global_step": 268669, "epoch": 1599} {"train_loss": -11.746267318725586, "global_step": 268670, "epoch": 1599} {"train_loss": -10.906637191772461, "global_step": 268671, "epoch": 1599} {"train_loss": -11.832201957702637, "global_step": 268672, "epoch": 1599} {"train_loss": -10.18663215637207, "global_step": 268673, "epoch": 1599} {"train_loss": -11.444748878479004, "global_step": 268674, "epoch": 1599} {"train_loss": -10.965511322021484, "global_step": 268675, "epoch": 1599} {"train_loss": -11.327573776245117, "global_step": 268676, "epoch": 1599} {"train_loss": -11.629293441772461, "global_step": 268677, "epoch": 1599} {"train_loss": -10.62883186340332, "global_step": 268678, "epoch": 1599} {"train_loss": -11.706131935119629, "global_step": 268679, "epoch": 1599} {"train_loss": -10.612041473388672, "global_step": 268680, "epoch": 1599} {"train_loss": -11.674489974975586, "global_step": 268681, "epoch": 1599} {"train_loss": -11.518056869506836, "global_step": 268682, "epoch": 1599} {"train_loss": -11.252739906311035, "global_step": 268683, "epoch": 1599} {"train_loss": -11.509567260742188, "global_step": 268684, "epoch": 1599} {"train_loss": -11.26720905303955, "global_step": 268685, "epoch": 1599} {"train_loss": -11.797449111938477, "global_step": 268686, "epoch": 1599} {"train_loss": -11.515890121459961, "global_step": 268687, "epoch": 1599} {"train_loss": -11.772579193115234, "global_step": 268688, "epoch": 1599} {"train_loss": -11.87833023071289, "global_step": 268689, "epoch": 1599} {"train_loss": -11.719924926757812, "global_step": 268690, "epoch": 1599} {"train_loss": -11.791072845458984, "global_step": 268691, "epoch": 1599} {"train_loss": -11.521581649780273, "global_step": 268692, "epoch": 1599} {"train_loss": -11.360467910766602, "global_step": 268693, "epoch": 1599} {"train_loss": -11.536369323730469, "global_step": 268694, "epoch": 1599} {"train_loss": -11.816645622253418, "global_step": 268695, "epoch": 1599} {"train_loss": -11.654322624206543, "global_step": 268696, "epoch": 1599} {"train_loss": -11.797033309936523, "global_step": 268697, "epoch": 1599} {"train_loss": -11.691471099853516, "global_step": 268698, "epoch": 1599} {"train_loss": -12.063130378723145, "global_step": 268699, "epoch": 1599} {"train_loss": -11.821267127990723, "global_step": 268700, "epoch": 1599} {"train_loss": -11.591796875, "global_step": 268701, "epoch": 1599} {"train_loss": -11.931170463562012, "global_step": 268702, "epoch": 1599} {"train_loss": -11.683466911315918, "global_step": 268703, "epoch": 1599} {"train_loss": -11.84981918334961, "global_step": 268704, "epoch": 1599} {"train_loss": -11.6068115234375, "global_step": 268705, "epoch": 1599} {"train_loss": -11.96231746673584, "global_step": 268706, "epoch": 1599} {"train_loss": -11.914775848388672, "global_step": 268707, "epoch": 1599} {"train_loss": -11.684511184692383, "global_step": 268708, "epoch": 1599} {"train_loss": -11.881620407104492, "global_step": 268709, "epoch": 1599} {"train_loss": -11.992080688476562, "global_step": 268710, "epoch": 1599} {"train_loss": -11.918076515197754, "global_step": 268711, "epoch": 1599} {"train_loss": -11.854272842407227, "global_step": 268712, "epoch": 1599} {"train_loss": -11.866615295410156, "global_step": 268713, "epoch": 1599} {"train_loss": -11.962892532348633, "global_step": 268714, "epoch": 1599} {"train_loss": -11.872526168823242, "global_step": 268715, "epoch": 1599} {"train_loss": -12.107812881469727, "global_step": 268716, "epoch": 1599} {"train_loss": -11.88593864440918, "global_step": 268717, "epoch": 1599} {"train_loss": -12.218238830566406, "global_step": 268718, "epoch": 1599} {"train_loss": -12.08306884765625, "global_step": 268719, "epoch": 1599} {"train_loss": -11.842467308044434, "global_step": 268720, "epoch": 1599} {"train_loss": -11.929840087890625, "global_step": 268721, "epoch": 1599} {"train_loss": -12.152732849121094, "global_step": 268722, "epoch": 1599} {"train_loss": -11.927207946777344, "global_step": 268723, "epoch": 1599} {"train_loss": -12.094446182250977, "global_step": 268724, "epoch": 1599} {"train_loss": -12.144553184509277, "global_step": 268725, "epoch": 1599} {"train_loss": -11.629608154296875, "global_step": 268726, "epoch": 1599} {"train_loss": -12.118005752563477, "global_step": 268727, "epoch": 1599} {"train_loss": -12.068294525146484, "global_step": 268728, "epoch": 1599} {"train_loss": -11.662030220031738, "global_step": 268729, "epoch": 1599} {"train_loss": -12.168355941772461, "global_step": 268730, "epoch": 1599} {"train_loss": -11.471893310546875, "global_step": 268731, "epoch": 1599} {"train_loss": -11.970354080200195, "global_step": 268732, "epoch": 1599} {"train_loss": -11.894438743591309, "global_step": 268733, "epoch": 1599} {"train_loss": -11.81002426147461, "global_step": 268734, "epoch": 1599} {"train_loss": -11.747962951660156, "global_step": 268735, "epoch": 1599} {"train_loss": -11.760103225708008, "global_step": 268736, "epoch": 1599} {"train_loss": -12.003877639770508, "global_step": 268737, "epoch": 1599} {"train_loss": -12.210362434387207, "global_step": 268738, "epoch": 1599} {"train_loss": -12.099559783935547, "global_step": 268739, "epoch": 1599} {"train_loss": -11.877679824829102, "global_step": 268740, "epoch": 1599} {"train_loss": -12.1964111328125, "global_step": 268741, "epoch": 1599} {"train_loss": -12.002304077148438, "global_step": 268742, "epoch": 1599} {"train_loss": -11.826969146728516, "global_step": 268743, "epoch": 1599} {"train_loss": -12.412774085998535, "global_step": 268744, "epoch": 1599} {"train_loss": -11.941911697387695, "global_step": 268745, "epoch": 1599} {"train_loss": -12.266887664794922, "global_step": 268746, "epoch": 1599} {"train_loss": -12.090734481811523, "global_step": 268747, "epoch": 1599} {"train_loss": -11.946712493896484, "global_step": 268748, "epoch": 1599} {"train_loss": -12.18765640258789, "global_step": 268749, "epoch": 1599} {"train_loss": -11.969625473022461, "global_step": 268750, "epoch": 1599} {"train_loss": -11.924336433410645, "global_step": 268751, "epoch": 1599} {"train_loss": -12.369579315185547, "global_step": 268752, "epoch": 1599} {"train_loss": -12.186417579650879, "global_step": 268753, "epoch": 1599} {"train_loss": -12.018209457397461, "global_step": 268754, "epoch": 1599} {"train_loss": -12.193655014038086, "global_step": 268755, "epoch": 1599} {"train_loss": -11.655960083007812, "global_step": 268756, "epoch": 1599} {"train_loss": -11.599437713623047, "global_step": 268757, "epoch": 1599} {"train_loss": -12.072250366210938, "global_step": 268758, "epoch": 1599} {"train_loss": -11.969499588012695, "global_step": 268759, "epoch": 1599} {"train_loss": -11.838260650634766, "global_step": 268760, "epoch": 1599} {"train_loss": -12.162445068359375, "global_step": 268761, "epoch": 1599} {"train_loss": -11.844575881958008, "global_step": 268762, "epoch": 1599} {"train_loss": -12.203594207763672, "global_step": 268763, "epoch": 1599} {"train_loss": -12.070276260375977, "global_step": 268764, "epoch": 1599} {"train_loss": -10.584416389465332, "global_step": 268765, "epoch": 1599} {"train_loss": -11.228991508483887, "global_step": 268766, "epoch": 1599} {"train_loss": -11.982110977172852, "global_step": 268767, "epoch": 1599} {"train_loss": -10.187260627746582, "global_step": 268768, "epoch": 1599} {"train_loss": -11.713661193847656, "global_step": 268769, "epoch": 1599} {"train_loss": -10.471085548400879, "global_step": 268770, "epoch": 1599} {"train_loss": -10.732433319091797, "global_step": 268771, "epoch": 1599} {"train_loss": -11.643922805786133, "global_step": 268772, "epoch": 1599} {"train_loss": -10.219074249267578, "global_step": 268773, "epoch": 1599} {"train_loss": -11.14598274230957, "global_step": 268774, "epoch": 1599} {"train_loss": -10.426822662353516, "global_step": 268775, "epoch": 1599} {"train_loss": -10.02352237701416, "global_step": 268776, "epoch": 1599} {"train_loss": -10.500101089477539, "global_step": 268777, "epoch": 1599} {"train_loss": -8.841440200805664, "global_step": 268778, "epoch": 1599} {"train_loss": -8.873119354248047, "global_step": 268779, "epoch": 1599} {"train_loss": -10.861773490905762, "global_step": 268780, "epoch": 1599} {"train_loss": -9.695575714111328, "global_step": 268781, "epoch": 1599} {"train_loss": -9.376585006713867, "global_step": 268782, "epoch": 1599} {"train_loss": -10.21420669555664, "global_step": 268783, "epoch": 1599} {"train_loss": -10.532526016235352, "global_step": 268784, "epoch": 1599} {"train_loss": -10.76817512512207, "global_step": 268785, "epoch": 1599} {"train_loss": -10.40528678894043, "global_step": 268786, "epoch": 1599} {"train_loss": -10.228068351745605, "global_step": 268787, "epoch": 1599} {"train_loss": -10.237886428833008, "global_step": 268788, "epoch": 1599} {"train_loss": -10.587000846862793, "global_step": 268789, "epoch": 1599} {"train_loss": -10.902063369750977, "global_step": 268790, "epoch": 1599} {"train_loss": -10.300756454467773, "global_step": 268791, "epoch": 1599} {"train_loss": -10.423181533813477, "global_step": 268792, "epoch": 1599} {"train_loss": -10.923019409179688, "global_step": 268793, "epoch": 1599} {"train_loss": -9.696195602416992, "global_step": 268794, "epoch": 1599} {"train_loss": -11.326712608337402, "global_step": 268795, "epoch": 1599} {"train_loss": -10.697778701782227, "global_step": 268796, "epoch": 1599} {"train_loss": -11.268997192382812, "global_step": 268797, "epoch": 1599} {"train_loss": -11.557758331298828, "global_step": 268798, "epoch": 1599} {"train_loss": -11.451012577329363, "global_step": 268799, "epoch": 1599, "val_loss": 267868.875} {"train_loss": -11.384217262268066, "global_step": 268800, "epoch": 1600} {"train_loss": -11.508829116821289, "global_step": 268801, "epoch": 1600} {"train_loss": -11.348491668701172, "global_step": 268802, "epoch": 1600} {"train_loss": -11.611385345458984, "global_step": 268803, "epoch": 1600} {"train_loss": -11.619379043579102, "global_step": 268804, "epoch": 1600} {"train_loss": -11.562359809875488, "global_step": 268805, "epoch": 1600} {"train_loss": -11.670909881591797, "global_step": 268806, "epoch": 1600} {"train_loss": -11.490445137023926, "global_step": 268807, "epoch": 1600} {"train_loss": -11.412267684936523, "global_step": 268808, "epoch": 1600} {"train_loss": -11.792365074157715, "global_step": 268809, "epoch": 1600} {"train_loss": -11.626296997070312, "global_step": 268810, "epoch": 1600} {"train_loss": -11.461116790771484, "global_step": 268811, "epoch": 1600} {"train_loss": -11.878673553466797, "global_step": 268812, "epoch": 1600} {"train_loss": -11.508726119995117, "global_step": 268813, "epoch": 1600} {"train_loss": -11.95738697052002, "global_step": 268814, "epoch": 1600} {"train_loss": -11.626766204833984, "global_step": 268815, "epoch": 1600} {"train_loss": -11.86492919921875, "global_step": 268816, "epoch": 1600} {"train_loss": -11.670902252197266, "global_step": 268817, "epoch": 1600} {"train_loss": -11.81507682800293, "global_step": 268818, "epoch": 1600} {"train_loss": -11.59881591796875, "global_step": 268819, "epoch": 1600} {"train_loss": -11.742704391479492, "global_step": 268820, "epoch": 1600} {"train_loss": -11.743097305297852, "global_step": 268821, "epoch": 1600} {"train_loss": -11.867599487304688, "global_step": 268822, "epoch": 1600} {"train_loss": -11.737339973449707, "global_step": 268823, "epoch": 1600} {"train_loss": -11.778450012207031, "global_step": 268824, "epoch": 1600} {"train_loss": -12.07944107055664, "global_step": 268825, "epoch": 1600} {"train_loss": -11.912948608398438, "global_step": 268826, "epoch": 1600} {"train_loss": -11.901927947998047, "global_step": 268827, "epoch": 1600} {"train_loss": -12.010126113891602, "global_step": 268828, "epoch": 1600} {"train_loss": -12.197954177856445, "global_step": 268829, "epoch": 1600} {"train_loss": -12.150390625, "global_step": 268830, "epoch": 1600} {"train_loss": -11.993865966796875, "global_step": 268831, "epoch": 1600} {"train_loss": -12.115825653076172, "global_step": 268832, "epoch": 1600} {"train_loss": -11.939530372619629, "global_step": 268833, "epoch": 1600} {"train_loss": -12.193341255187988, "global_step": 268834, "epoch": 1600} {"train_loss": -12.075357437133789, "global_step": 268835, "epoch": 1600} {"train_loss": -12.088363647460938, "global_step": 268836, "epoch": 1600} {"train_loss": -12.151277542114258, "global_step": 268837, "epoch": 1600} {"train_loss": -12.279141426086426, "global_step": 268838, "epoch": 1600} {"train_loss": -11.970279693603516, "global_step": 268839, "epoch": 1600} {"train_loss": -11.927924156188965, "global_step": 268840, "epoch": 1600} {"train_loss": -12.013729095458984, "global_step": 268841, "epoch": 1600} {"train_loss": -12.172526359558105, "global_step": 268842, "epoch": 1600} {"train_loss": -12.004785537719727, "global_step": 268843, "epoch": 1600} {"train_loss": -12.144684791564941, "global_step": 268844, "epoch": 1600} {"train_loss": -12.168474197387695, "global_step": 268845, "epoch": 1600} {"train_loss": -12.053960800170898, "global_step": 268846, "epoch": 1600} {"train_loss": -11.921745300292969, "global_step": 268847, "epoch": 1600} {"train_loss": -11.948638916015625, "global_step": 268848, "epoch": 1600} {"train_loss": -12.065938949584961, "global_step": 268849, "epoch": 1600} {"train_loss": -12.16930866241455, "global_step": 268850, "epoch": 1600} {"train_loss": -11.9622163772583, "global_step": 268851, "epoch": 1600} {"train_loss": -11.852692604064941, "global_step": 268852, "epoch": 1600} {"train_loss": -12.258291244506836, "global_step": 268853, "epoch": 1600} {"train_loss": -12.030086517333984, "global_step": 268854, "epoch": 1600} {"train_loss": -12.19216251373291, "global_step": 268855, "epoch": 1600} {"train_loss": -12.116947174072266, "global_step": 268856, "epoch": 1600} {"train_loss": -11.77271842956543, "global_step": 268857, "epoch": 1600} {"train_loss": -11.413238525390625, "global_step": 268858, "epoch": 1600} {"train_loss": -11.410232543945312, "global_step": 268859, "epoch": 1600} {"train_loss": -12.100456237792969, "global_step": 268860, "epoch": 1600} {"train_loss": -11.132291793823242, "global_step": 268861, "epoch": 1600} {"train_loss": -11.708209991455078, "global_step": 268862, "epoch": 1600} {"train_loss": -11.950912475585938, "global_step": 268863, "epoch": 1600} {"train_loss": -11.590299606323242, "global_step": 268864, "epoch": 1600} {"train_loss": -12.087000846862793, "global_step": 268865, "epoch": 1600} {"train_loss": -12.037504196166992, "global_step": 268866, "epoch": 1600} {"train_loss": -11.912054061889648, "global_step": 268867, "epoch": 1600} {"train_loss": -11.774816513061523, "global_step": 268868, "epoch": 1600} {"train_loss": -11.945815086364746, "global_step": 268869, "epoch": 1600} {"train_loss": -11.470869064331055, "global_step": 268870, "epoch": 1600} {"train_loss": -11.621713638305664, "global_step": 268871, "epoch": 1600} {"train_loss": -11.897388458251953, "global_step": 268872, "epoch": 1600} {"train_loss": -11.832062721252441, "global_step": 268873, "epoch": 1600} {"train_loss": -12.03618049621582, "global_step": 268874, "epoch": 1600} {"train_loss": -12.065471649169922, "global_step": 268875, "epoch": 1600} {"train_loss": -11.985433578491211, "global_step": 268876, "epoch": 1600} {"train_loss": -11.795760154724121, "global_step": 268877, "epoch": 1600} {"train_loss": -12.068368911743164, "global_step": 268878, "epoch": 1600} {"train_loss": -12.094453811645508, "global_step": 268879, "epoch": 1600} {"train_loss": -11.864377975463867, "global_step": 268880, "epoch": 1600} {"train_loss": -11.96998119354248, "global_step": 268881, "epoch": 1600} {"train_loss": -11.779787063598633, "global_step": 268882, "epoch": 1600} {"train_loss": -12.143001556396484, "global_step": 268883, "epoch": 1600} {"train_loss": -11.520541191101074, "global_step": 268884, "epoch": 1600} {"train_loss": -11.926823616027832, "global_step": 268885, "epoch": 1600} {"train_loss": -11.73918628692627, "global_step": 268886, "epoch": 1600} {"train_loss": -11.361909866333008, "global_step": 268887, "epoch": 1600} {"train_loss": -11.586597442626953, "global_step": 268888, "epoch": 1600} {"train_loss": -12.054264068603516, "global_step": 268889, "epoch": 1600} {"train_loss": -11.692485809326172, "global_step": 268890, "epoch": 1600} {"train_loss": -11.6226224899292, "global_step": 268891, "epoch": 1600} {"train_loss": -11.89588737487793, "global_step": 268892, "epoch": 1600} {"train_loss": -11.580608367919922, "global_step": 268893, "epoch": 1600} {"train_loss": -10.616596221923828, "global_step": 268894, "epoch": 1600} {"train_loss": -12.09416389465332, "global_step": 268895, "epoch": 1600} {"train_loss": -11.811027526855469, "global_step": 268896, "epoch": 1600} {"train_loss": -11.378141403198242, "global_step": 268897, "epoch": 1600} {"train_loss": -11.857419967651367, "global_step": 268898, "epoch": 1600} {"train_loss": -11.959714889526367, "global_step": 268899, "epoch": 1600} {"train_loss": -11.007221221923828, "global_step": 268900, "epoch": 1600} {"train_loss": -11.392019271850586, "global_step": 268901, "epoch": 1600} {"train_loss": -11.482158660888672, "global_step": 268902, "epoch": 1600} {"train_loss": -11.98952865600586, "global_step": 268903, "epoch": 1600} {"train_loss": -11.57386302947998, "global_step": 268904, "epoch": 1600} {"train_loss": -12.152137756347656, "global_step": 268905, "epoch": 1600} {"train_loss": -11.356995582580566, "global_step": 268906, "epoch": 1600} {"train_loss": -11.55201244354248, "global_step": 268907, "epoch": 1600} {"train_loss": -11.839415550231934, "global_step": 268908, "epoch": 1600} {"train_loss": -11.410627365112305, "global_step": 268909, "epoch": 1600} {"train_loss": -11.645318984985352, "global_step": 268910, "epoch": 1600} {"train_loss": -11.250874519348145, "global_step": 268911, "epoch": 1600} {"train_loss": -11.497230529785156, "global_step": 268912, "epoch": 1600} {"train_loss": -11.123757362365723, "global_step": 268913, "epoch": 1600} {"train_loss": -11.20830249786377, "global_step": 268914, "epoch": 1600} {"train_loss": -11.654495239257812, "global_step": 268915, "epoch": 1600} {"train_loss": -11.41246223449707, "global_step": 268916, "epoch": 1600} {"train_loss": -11.60749626159668, "global_step": 268917, "epoch": 1600} {"train_loss": -11.902074813842773, "global_step": 268918, "epoch": 1600} {"train_loss": -11.626869201660156, "global_step": 268919, "epoch": 1600} {"train_loss": -11.362783432006836, "global_step": 268920, "epoch": 1600} {"train_loss": -11.748032569885254, "global_step": 268921, "epoch": 1600} {"train_loss": -11.066576957702637, "global_step": 268922, "epoch": 1600} {"train_loss": -11.64338207244873, "global_step": 268923, "epoch": 1600} {"train_loss": -11.6420316696167, "global_step": 268924, "epoch": 1600} {"train_loss": -11.658824920654297, "global_step": 268925, "epoch": 1600} {"train_loss": -11.706024169921875, "global_step": 268926, "epoch": 1600} {"train_loss": -11.675087928771973, "global_step": 268927, "epoch": 1600} {"train_loss": -11.54715633392334, "global_step": 268928, "epoch": 1600} {"train_loss": -11.484832763671875, "global_step": 268929, "epoch": 1600} {"train_loss": -11.5618896484375, "global_step": 268930, "epoch": 1600} {"train_loss": -11.76414680480957, "global_step": 268931, "epoch": 1600} {"train_loss": -11.63352108001709, "global_step": 268932, "epoch": 1600} {"train_loss": -11.306882858276367, "global_step": 268933, "epoch": 1600} {"train_loss": -11.64645767211914, "global_step": 268934, "epoch": 1600} {"train_loss": -11.361003875732422, "global_step": 268935, "epoch": 1600} {"train_loss": -12.298040390014648, "global_step": 268936, "epoch": 1600} {"train_loss": -11.435556411743164, "global_step": 268937, "epoch": 1600} {"train_loss": -11.855823516845703, "global_step": 268938, "epoch": 1600} {"train_loss": -11.825467109680176, "global_step": 268939, "epoch": 1600} {"train_loss": -11.897391319274902, "global_step": 268940, "epoch": 1600} {"train_loss": -12.049270629882812, "global_step": 268941, "epoch": 1600} {"train_loss": -12.033474922180176, "global_step": 268942, "epoch": 1600} {"train_loss": -12.015028953552246, "global_step": 268943, "epoch": 1600} {"train_loss": -11.767108917236328, "global_step": 268944, "epoch": 1600} {"train_loss": -12.078636169433594, "global_step": 268945, "epoch": 1600} {"train_loss": -11.86593246459961, "global_step": 268946, "epoch": 1600} {"train_loss": -11.770194053649902, "global_step": 268947, "epoch": 1600} {"train_loss": -11.80965805053711, "global_step": 268948, "epoch": 1600} {"train_loss": -12.171512603759766, "global_step": 268949, "epoch": 1600} {"train_loss": -11.881138801574707, "global_step": 268950, "epoch": 1600} {"train_loss": -12.126656532287598, "global_step": 268951, "epoch": 1600} {"train_loss": -12.043498992919922, "global_step": 268952, "epoch": 1600} {"train_loss": -12.201055526733398, "global_step": 268953, "epoch": 1600} {"train_loss": -12.332225799560547, "global_step": 268954, "epoch": 1600} {"train_loss": -12.183900833129883, "global_step": 268955, "epoch": 1600} {"train_loss": -12.119836807250977, "global_step": 268956, "epoch": 1600} {"train_loss": -12.064937591552734, "global_step": 268957, "epoch": 1600} {"train_loss": -12.208148956298828, "global_step": 268958, "epoch": 1600} {"train_loss": -11.982072830200195, "global_step": 268959, "epoch": 1600} {"train_loss": -12.04902458190918, "global_step": 268960, "epoch": 1600} {"train_loss": -12.137635231018066, "global_step": 268961, "epoch": 1600} {"train_loss": -12.053363800048828, "global_step": 268962, "epoch": 1600} {"train_loss": -12.045904159545898, "global_step": 268963, "epoch": 1600} {"train_loss": -12.091756820678711, "global_step": 268964, "epoch": 1600} {"train_loss": -12.009294509887695, "global_step": 268965, "epoch": 1600} {"train_loss": -12.397150039672852, "global_step": 268966, "epoch": 1600} {"train_loss": -11.80945618947347, "global_step": 268967, "epoch": 1600, "train/sim_max_reward_0": 0.6534873424640336, "train/sim_max_reward_1": 0.9775269489666367, "train/sim_max_reward_2": 0.038498226895886216, "train/sim_max_reward_3": 0.4330319751528148, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.6149785587123247, "test/sim_max_reward_4400000": 0.9205765192146065, "test/sim_max_reward_4400001": 0.9797274172543725, "test/sim_max_reward_4400002": 0.9613457760933806, "test/sim_max_reward_4400003": 0.3047482881728313, "test/sim_max_reward_4400004": 0.9352338251378525, "test/sim_max_reward_4400005": 0.08546281152486279, "test/sim_max_reward_4400006": 0.28082357322773177, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 0.6418514097908801, "test/sim_max_reward_4400009": 0.033271939399465086, "test/sim_max_reward_4400010": 0.41730426804988074, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 0.553432287193606, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.9598271310076231, "test/sim_max_reward_4400015": 0.9883967218887332, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9430716219994623, "test/sim_max_reward_4400019": 0.17330248990047295, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 1.0, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.8516200780531015, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.5688677365611667, "test/sim_max_reward_4400026": 0.20139825713858747, "test/sim_max_reward_4400027": 0.5560346822727408, "test/sim_max_reward_4400028": 0.7021411442066546, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.15382221362104576, "test/sim_max_reward_4400033": 0.5047164168373076, "test/sim_max_reward_4400034": 0.9879180021206349, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.36521482262477384, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.9010856237056343, "test/sim_max_reward_4400039": 0.41181861961087174, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.16971452552386798, "test/sim_max_reward_4400042": 0.018265008433339593, "test/sim_max_reward_4400043": 0.025813085108960746, "test/sim_max_reward_4400044": 0.34288915322427993, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 0.9811381880474986, "test/sim_max_reward_4400047": 0.9549961606145863, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.004960780004079279, "train/mean_score": 0.6195871753652826, "test/mean_score": 0.5252726646872977, "val_loss": 271905.625, "train_action_mse_error": 1.1383183002471924} {"train_loss": -12.415878295898438, "global_step": 268968, "epoch": 1601} {"train_loss": -12.275890350341797, "global_step": 268969, "epoch": 1601} {"train_loss": -12.02780532836914, "global_step": 268970, "epoch": 1601} {"train_loss": -11.893653869628906, "global_step": 268971, "epoch": 1601} {"train_loss": -12.111194610595703, "global_step": 268972, "epoch": 1601} {"train_loss": -12.052854537963867, "global_step": 268973, "epoch": 1601} {"train_loss": -12.128206253051758, "global_step": 268974, "epoch": 1601} {"train_loss": -12.126810073852539, "global_step": 268975, "epoch": 1601} {"train_loss": -12.185121536254883, "global_step": 268976, "epoch": 1601} {"train_loss": -12.213651657104492, "global_step": 268977, "epoch": 1601} {"train_loss": -12.221962928771973, "global_step": 268978, "epoch": 1601} {"train_loss": -11.913093566894531, "global_step": 268979, "epoch": 1601} {"train_loss": -12.290342330932617, "global_step": 268980, "epoch": 1601} {"train_loss": -12.117469787597656, "global_step": 268981, "epoch": 1601} {"train_loss": -12.06321907043457, "global_step": 268982, "epoch": 1601} {"train_loss": -11.93182373046875, "global_step": 268983, "epoch": 1601} {"train_loss": -12.341279029846191, "global_step": 268984, "epoch": 1601} {"train_loss": -12.316776275634766, "global_step": 268985, "epoch": 1601} {"train_loss": -11.774600982666016, "global_step": 268986, "epoch": 1601} {"train_loss": -12.289694786071777, "global_step": 268987, "epoch": 1601} {"train_loss": -11.784039497375488, "global_step": 268988, "epoch": 1601} {"train_loss": -11.883260726928711, "global_step": 268989, "epoch": 1601} {"train_loss": -11.361778259277344, "global_step": 268990, "epoch": 1601} {"train_loss": -10.281509399414062, "global_step": 268991, "epoch": 1601} {"train_loss": -11.060223579406738, "global_step": 268992, "epoch": 1601} {"train_loss": -10.745792388916016, "global_step": 268993, "epoch": 1601} {"train_loss": -11.104715347290039, "global_step": 268994, "epoch": 1601} {"train_loss": -11.318967819213867, "global_step": 268995, "epoch": 1601} {"train_loss": -9.571181297302246, "global_step": 268996, "epoch": 1601} {"train_loss": -10.966835975646973, "global_step": 268997, "epoch": 1601} {"train_loss": -7.75177001953125, "global_step": 268998, "epoch": 1601} {"train_loss": -7.60651969909668, "global_step": 268999, "epoch": 1601} {"train_loss": -8.22905445098877, "global_step": 269000, "epoch": 1601} {"train_loss": -10.220108032226562, "global_step": 269001, "epoch": 1601} {"train_loss": -8.8675537109375, "global_step": 269002, "epoch": 1601} {"train_loss": -7.842039108276367, "global_step": 269003, "epoch": 1601} {"train_loss": -7.1916608810424805, "global_step": 269004, "epoch": 1601} {"train_loss": -6.998957633972168, "global_step": 269005, "epoch": 1601} {"train_loss": -8.522241592407227, "global_step": 269006, "epoch": 1601} {"train_loss": -7.655841827392578, "global_step": 269007, "epoch": 1601} {"train_loss": -7.369958877563477, "global_step": 269008, "epoch": 1601} {"train_loss": -7.299446105957031, "global_step": 269009, "epoch": 1601} {"train_loss": -7.334498405456543, "global_step": 269010, "epoch": 1601} {"train_loss": -8.224286079406738, "global_step": 269011, "epoch": 1601} {"train_loss": -8.408348083496094, "global_step": 269012, "epoch": 1601} {"train_loss": -7.69342041015625, "global_step": 269013, "epoch": 1601} {"train_loss": -8.131851196289062, "global_step": 269014, "epoch": 1601} {"train_loss": -10.018594741821289, "global_step": 269015, "epoch": 1601} {"train_loss": -9.376455307006836, "global_step": 269016, "epoch": 1601} {"train_loss": -10.818805694580078, "global_step": 269017, "epoch": 1601} {"train_loss": -9.938749313354492, "global_step": 269018, "epoch": 1601} {"train_loss": -9.87353801727295, "global_step": 269019, "epoch": 1601} {"train_loss": -10.225200653076172, "global_step": 269020, "epoch": 1601} {"train_loss": -10.66292953491211, "global_step": 269021, "epoch": 1601} {"train_loss": -9.582839965820312, "global_step": 269022, "epoch": 1601} {"train_loss": -10.255391120910645, "global_step": 269023, "epoch": 1601} {"train_loss": -10.745125770568848, "global_step": 269024, "epoch": 1601} {"train_loss": -10.692935943603516, "global_step": 269025, "epoch": 1601} {"train_loss": -11.229537010192871, "global_step": 269026, "epoch": 1601} {"train_loss": -10.539731979370117, "global_step": 269027, "epoch": 1601} {"train_loss": -10.613112449645996, "global_step": 269028, "epoch": 1601} {"train_loss": -10.524582862854004, "global_step": 269029, "epoch": 1601} {"train_loss": -10.770503044128418, "global_step": 269030, "epoch": 1601} {"train_loss": -10.592350006103516, "global_step": 269031, "epoch": 1601} {"train_loss": -10.798261642456055, "global_step": 269032, "epoch": 1601} {"train_loss": -11.213802337646484, "global_step": 269033, "epoch": 1601} {"train_loss": -11.077017784118652, "global_step": 269034, "epoch": 1601} {"train_loss": -11.301557540893555, "global_step": 269035, "epoch": 1601} {"train_loss": -11.475380897521973, "global_step": 269036, "epoch": 1601} {"train_loss": -11.023321151733398, "global_step": 269037, "epoch": 1601} {"train_loss": -11.079751968383789, "global_step": 269038, "epoch": 1601} {"train_loss": -11.36134147644043, "global_step": 269039, "epoch": 1601} {"train_loss": -11.275653839111328, "global_step": 269040, "epoch": 1601} {"train_loss": -11.2591552734375, "global_step": 269041, "epoch": 1601} {"train_loss": -11.496620178222656, "global_step": 269042, "epoch": 1601} {"train_loss": -11.471904754638672, "global_step": 269043, "epoch": 1601} {"train_loss": -11.362894058227539, "global_step": 269044, "epoch": 1601} {"train_loss": -11.584171295166016, "global_step": 269045, "epoch": 1601} {"train_loss": -11.41131591796875, "global_step": 269046, "epoch": 1601} {"train_loss": -11.270208358764648, "global_step": 269047, "epoch": 1601} {"train_loss": -11.726943016052246, "global_step": 269048, "epoch": 1601} {"train_loss": -11.59562873840332, "global_step": 269049, "epoch": 1601} {"train_loss": -11.517511367797852, "global_step": 269050, "epoch": 1601} {"train_loss": -11.488334655761719, "global_step": 269051, "epoch": 1601} {"train_loss": -11.563399314880371, "global_step": 269052, "epoch": 1601} {"train_loss": -11.620627403259277, "global_step": 269053, "epoch": 1601} {"train_loss": -11.486063003540039, "global_step": 269054, "epoch": 1601} {"train_loss": -11.780014038085938, "global_step": 269055, "epoch": 1601} {"train_loss": -11.75703239440918, "global_step": 269056, "epoch": 1601} {"train_loss": -11.499738693237305, "global_step": 269057, "epoch": 1601} {"train_loss": -11.574016571044922, "global_step": 269058, "epoch": 1601} {"train_loss": -11.310344696044922, "global_step": 269059, "epoch": 1601} {"train_loss": -11.816560745239258, "global_step": 269060, "epoch": 1601} {"train_loss": -11.5987548828125, "global_step": 269061, "epoch": 1601} {"train_loss": -11.592388153076172, "global_step": 269062, "epoch": 1601} {"train_loss": -11.323728561401367, "global_step": 269063, "epoch": 1601} {"train_loss": -11.651058197021484, "global_step": 269064, "epoch": 1601} {"train_loss": -11.748136520385742, "global_step": 269065, "epoch": 1601} {"train_loss": -11.651369094848633, "global_step": 269066, "epoch": 1601} {"train_loss": -11.883068084716797, "global_step": 269067, "epoch": 1601} {"train_loss": -11.608274459838867, "global_step": 269068, "epoch": 1601} {"train_loss": -11.796493530273438, "global_step": 269069, "epoch": 1601} {"train_loss": -11.827640533447266, "global_step": 269070, "epoch": 1601} {"train_loss": -11.614217758178711, "global_step": 269071, "epoch": 1601} {"train_loss": -11.45915699005127, "global_step": 269072, "epoch": 1601} {"train_loss": -11.735513687133789, "global_step": 269073, "epoch": 1601} {"train_loss": -11.70941162109375, "global_step": 269074, "epoch": 1601} {"train_loss": -11.553045272827148, "global_step": 269075, "epoch": 1601} {"train_loss": -11.764513969421387, "global_step": 269076, "epoch": 1601} {"train_loss": -11.879907608032227, "global_step": 269077, "epoch": 1601} {"train_loss": -11.574042320251465, "global_step": 269078, "epoch": 1601} {"train_loss": -11.968603134155273, "global_step": 269079, "epoch": 1601} {"train_loss": -11.716618537902832, "global_step": 269080, "epoch": 1601} {"train_loss": -11.850720405578613, "global_step": 269081, "epoch": 1601} {"train_loss": -11.788540840148926, "global_step": 269082, "epoch": 1601} {"train_loss": -12.032391548156738, "global_step": 269083, "epoch": 1601} {"train_loss": -11.810121536254883, "global_step": 269084, "epoch": 1601} {"train_loss": -11.968873977661133, "global_step": 269085, "epoch": 1601} {"train_loss": -11.874202728271484, "global_step": 269086, "epoch": 1601} {"train_loss": -11.919458389282227, "global_step": 269087, "epoch": 1601} {"train_loss": -11.932217597961426, "global_step": 269088, "epoch": 1601} {"train_loss": -12.080575942993164, "global_step": 269089, "epoch": 1601} {"train_loss": -12.033357620239258, "global_step": 269090, "epoch": 1601} {"train_loss": -12.267395973205566, "global_step": 269091, "epoch": 1601} {"train_loss": -11.860857963562012, "global_step": 269092, "epoch": 1601} {"train_loss": -11.915121078491211, "global_step": 269093, "epoch": 1601} {"train_loss": -11.840354919433594, "global_step": 269094, "epoch": 1601} {"train_loss": -11.98759651184082, "global_step": 269095, "epoch": 1601} {"train_loss": -11.903005599975586, "global_step": 269096, "epoch": 1601} {"train_loss": -12.013714790344238, "global_step": 269097, "epoch": 1601} {"train_loss": -11.838826179504395, "global_step": 269098, "epoch": 1601} {"train_loss": -12.2282133102417, "global_step": 269099, "epoch": 1601} {"train_loss": -12.098424911499023, "global_step": 269100, "epoch": 1601} {"train_loss": -12.074813842773438, "global_step": 269101, "epoch": 1601} {"train_loss": -12.13612174987793, "global_step": 269102, "epoch": 1601} {"train_loss": -11.924548149108887, "global_step": 269103, "epoch": 1601} {"train_loss": -12.202922821044922, "global_step": 269104, "epoch": 1601} {"train_loss": -12.031450271606445, "global_step": 269105, "epoch": 1601} {"train_loss": -12.020623207092285, "global_step": 269106, "epoch": 1601} {"train_loss": -12.320099830627441, "global_step": 269107, "epoch": 1601} {"train_loss": -11.957208633422852, "global_step": 269108, "epoch": 1601} {"train_loss": -11.934982299804688, "global_step": 269109, "epoch": 1601} {"train_loss": -12.116876602172852, "global_step": 269110, "epoch": 1601} {"train_loss": -12.040529251098633, "global_step": 269111, "epoch": 1601} {"train_loss": -12.371522903442383, "global_step": 269112, "epoch": 1601} {"train_loss": -12.246570587158203, "global_step": 269113, "epoch": 1601} {"train_loss": -12.147180557250977, "global_step": 269114, "epoch": 1601} {"train_loss": -12.168336868286133, "global_step": 269115, "epoch": 1601} {"train_loss": -12.216602325439453, "global_step": 269116, "epoch": 1601} {"train_loss": -12.16104793548584, "global_step": 269117, "epoch": 1601} {"train_loss": -12.019458770751953, "global_step": 269118, "epoch": 1601} {"train_loss": -12.295121192932129, "global_step": 269119, "epoch": 1601} {"train_loss": -12.072437286376953, "global_step": 269120, "epoch": 1601} {"train_loss": -11.911508560180664, "global_step": 269121, "epoch": 1601} {"train_loss": -12.160951614379883, "global_step": 269122, "epoch": 1601} {"train_loss": -11.906896591186523, "global_step": 269123, "epoch": 1601} {"train_loss": -12.209051132202148, "global_step": 269124, "epoch": 1601} {"train_loss": -12.044755935668945, "global_step": 269125, "epoch": 1601} {"train_loss": -12.385217666625977, "global_step": 269126, "epoch": 1601} {"train_loss": -11.840043067932129, "global_step": 269127, "epoch": 1601} {"train_loss": -11.468305587768555, "global_step": 269128, "epoch": 1601} {"train_loss": -12.04781723022461, "global_step": 269129, "epoch": 1601} {"train_loss": -12.28628158569336, "global_step": 269130, "epoch": 1601} {"train_loss": -11.909996032714844, "global_step": 269131, "epoch": 1601} {"train_loss": -11.920271873474121, "global_step": 269132, "epoch": 1601} {"train_loss": -12.242105484008789, "global_step": 269133, "epoch": 1601} {"train_loss": -12.039667129516602, "global_step": 269134, "epoch": 1601} {"train_loss": -11.259574969609579, "global_step": 269135, "epoch": 1601, "val_loss": 270746.84375} {"train_loss": -11.336505889892578, "global_step": 269136, "epoch": 1602} {"train_loss": -11.273408889770508, "global_step": 269137, "epoch": 1602} {"train_loss": -11.624746322631836, "global_step": 269138, "epoch": 1602} {"train_loss": -11.173675537109375, "global_step": 269139, "epoch": 1602} {"train_loss": -11.889171600341797, "global_step": 269140, "epoch": 1602} {"train_loss": -11.224603652954102, "global_step": 269141, "epoch": 1602} {"train_loss": -11.751871109008789, "global_step": 269142, "epoch": 1602} {"train_loss": -11.781668663024902, "global_step": 269143, "epoch": 1602} {"train_loss": -10.988286972045898, "global_step": 269144, "epoch": 1602} {"train_loss": -12.069354057312012, "global_step": 269145, "epoch": 1602} {"train_loss": -10.55694580078125, "global_step": 269146, "epoch": 1602} {"train_loss": -11.074800491333008, "global_step": 269147, "epoch": 1602} {"train_loss": -10.61705207824707, "global_step": 269148, "epoch": 1602} {"train_loss": -11.553926467895508, "global_step": 269149, "epoch": 1602} {"train_loss": -10.825994491577148, "global_step": 269150, "epoch": 1602} {"train_loss": -10.921221733093262, "global_step": 269151, "epoch": 1602} {"train_loss": -11.245319366455078, "global_step": 269152, "epoch": 1602} {"train_loss": -11.288509368896484, "global_step": 269153, "epoch": 1602} {"train_loss": -11.573531150817871, "global_step": 269154, "epoch": 1602} {"train_loss": -11.490631103515625, "global_step": 269155, "epoch": 1602} {"train_loss": -11.544139862060547, "global_step": 269156, "epoch": 1602} {"train_loss": -11.251182556152344, "global_step": 269157, "epoch": 1602} {"train_loss": -11.479543685913086, "global_step": 269158, "epoch": 1602} {"train_loss": -11.775856018066406, "global_step": 269159, "epoch": 1602} {"train_loss": -11.5901460647583, "global_step": 269160, "epoch": 1602} {"train_loss": -11.36041259765625, "global_step": 269161, "epoch": 1602} {"train_loss": -11.190950393676758, "global_step": 269162, "epoch": 1602} {"train_loss": -11.023748397827148, "global_step": 269163, "epoch": 1602} {"train_loss": -11.57183837890625, "global_step": 269164, "epoch": 1602} {"train_loss": -11.790061950683594, "global_step": 269165, "epoch": 1602} {"train_loss": -11.001468658447266, "global_step": 269166, "epoch": 1602} {"train_loss": -10.988885879516602, "global_step": 269167, "epoch": 1602} {"train_loss": -11.515006065368652, "global_step": 269168, "epoch": 1602} {"train_loss": -11.129207611083984, "global_step": 269169, "epoch": 1602} {"train_loss": -11.783416748046875, "global_step": 269170, "epoch": 1602} {"train_loss": -11.538904190063477, "global_step": 269171, "epoch": 1602} {"train_loss": -11.555875778198242, "global_step": 269172, "epoch": 1602} {"train_loss": -11.420906066894531, "global_step": 269173, "epoch": 1602} {"train_loss": -11.817325592041016, "global_step": 269174, "epoch": 1602} {"train_loss": -11.618356704711914, "global_step": 269175, "epoch": 1602} {"train_loss": -11.714365005493164, "global_step": 269176, "epoch": 1602} {"train_loss": -11.292062759399414, "global_step": 269177, "epoch": 1602} {"train_loss": -11.607658386230469, "global_step": 269178, "epoch": 1602} {"train_loss": -11.691842079162598, "global_step": 269179, "epoch": 1602} {"train_loss": -11.346712112426758, "global_step": 269180, "epoch": 1602} {"train_loss": -11.941545486450195, "global_step": 269181, "epoch": 1602} {"train_loss": -11.926916122436523, "global_step": 269182, "epoch": 1602} {"train_loss": -11.991450309753418, "global_step": 269183, "epoch": 1602} {"train_loss": -12.010580062866211, "global_step": 269184, "epoch": 1602} {"train_loss": -12.035684585571289, "global_step": 269185, "epoch": 1602} {"train_loss": -11.63210678100586, "global_step": 269186, "epoch": 1602} {"train_loss": -11.98727035522461, "global_step": 269187, "epoch": 1602} {"train_loss": -11.940187454223633, "global_step": 269188, "epoch": 1602} {"train_loss": -11.80191707611084, "global_step": 269189, "epoch": 1602} {"train_loss": -12.188687324523926, "global_step": 269190, "epoch": 1602} {"train_loss": -11.69194221496582, "global_step": 269191, "epoch": 1602} {"train_loss": -11.949416160583496, "global_step": 269192, "epoch": 1602} {"train_loss": -11.887062072753906, "global_step": 269193, "epoch": 1602} {"train_loss": -12.159650802612305, "global_step": 269194, "epoch": 1602} {"train_loss": -11.856096267700195, "global_step": 269195, "epoch": 1602} {"train_loss": -11.810344696044922, "global_step": 269196, "epoch": 1602} {"train_loss": -12.023404121398926, "global_step": 269197, "epoch": 1602} {"train_loss": -11.973846435546875, "global_step": 269198, "epoch": 1602} {"train_loss": -11.777575492858887, "global_step": 269199, "epoch": 1602} {"train_loss": -12.02472972869873, "global_step": 269200, "epoch": 1602} {"train_loss": -11.892620086669922, "global_step": 269201, "epoch": 1602} {"train_loss": -12.045387268066406, "global_step": 269202, "epoch": 1602} {"train_loss": -11.992735862731934, "global_step": 269203, "epoch": 1602} {"train_loss": -11.986273765563965, "global_step": 269204, "epoch": 1602} {"train_loss": -12.032379150390625, "global_step": 269205, "epoch": 1602} {"train_loss": -12.115608215332031, "global_step": 269206, "epoch": 1602} {"train_loss": -12.148316383361816, "global_step": 269207, "epoch": 1602} {"train_loss": -11.730502128601074, "global_step": 269208, "epoch": 1602} {"train_loss": -11.940007209777832, "global_step": 269209, "epoch": 1602} {"train_loss": -12.200019836425781, "global_step": 269210, "epoch": 1602} {"train_loss": -12.075517654418945, "global_step": 269211, "epoch": 1602} {"train_loss": -12.243391990661621, "global_step": 269212, "epoch": 1602} {"train_loss": -12.026200294494629, "global_step": 269213, "epoch": 1602} {"train_loss": -11.844303131103516, "global_step": 269214, "epoch": 1602} {"train_loss": -12.210665702819824, "global_step": 269215, "epoch": 1602} {"train_loss": -11.520038604736328, "global_step": 269216, "epoch": 1602} {"train_loss": -11.392203330993652, "global_step": 269217, "epoch": 1602} {"train_loss": -11.632911682128906, "global_step": 269218, "epoch": 1602} {"train_loss": -11.643807411193848, "global_step": 269219, "epoch": 1602} {"train_loss": -10.965543746948242, "global_step": 269220, "epoch": 1602} {"train_loss": -11.910614967346191, "global_step": 269221, "epoch": 1602} {"train_loss": -11.040576934814453, "global_step": 269222, "epoch": 1602} {"train_loss": -11.102540969848633, "global_step": 269223, "epoch": 1602} {"train_loss": -12.025012016296387, "global_step": 269224, "epoch": 1602} {"train_loss": -10.848644256591797, "global_step": 269225, "epoch": 1602} {"train_loss": -10.693198204040527, "global_step": 269226, "epoch": 1602} {"train_loss": -11.329984664916992, "global_step": 269227, "epoch": 1602} {"train_loss": -11.155214309692383, "global_step": 269228, "epoch": 1602} {"train_loss": -10.130422592163086, "global_step": 269229, "epoch": 1602} {"train_loss": -11.591986656188965, "global_step": 269230, "epoch": 1602} {"train_loss": -10.113434791564941, "global_step": 269231, "epoch": 1602} {"train_loss": -9.508468627929688, "global_step": 269232, "epoch": 1602} {"train_loss": -10.669940948486328, "global_step": 269233, "epoch": 1602} {"train_loss": -9.863293647766113, "global_step": 269234, "epoch": 1602} {"train_loss": -10.104106903076172, "global_step": 269235, "epoch": 1602} {"train_loss": -11.215862274169922, "global_step": 269236, "epoch": 1602} {"train_loss": -10.027677536010742, "global_step": 269237, "epoch": 1602} {"train_loss": -11.306821823120117, "global_step": 269238, "epoch": 1602} {"train_loss": -10.507858276367188, "global_step": 269239, "epoch": 1602} {"train_loss": -11.549692153930664, "global_step": 269240, "epoch": 1602} {"train_loss": -11.091375350952148, "global_step": 269241, "epoch": 1602} {"train_loss": -11.10142707824707, "global_step": 269242, "epoch": 1602} {"train_loss": -10.861872673034668, "global_step": 269243, "epoch": 1602} {"train_loss": -10.915918350219727, "global_step": 269244, "epoch": 1602} {"train_loss": -11.66726016998291, "global_step": 269245, "epoch": 1602} {"train_loss": -11.195759773254395, "global_step": 269246, "epoch": 1602} {"train_loss": -11.01658821105957, "global_step": 269247, "epoch": 1602} {"train_loss": -11.108161926269531, "global_step": 269248, "epoch": 1602} {"train_loss": -11.455604553222656, "global_step": 269249, "epoch": 1602} {"train_loss": -11.6319580078125, "global_step": 269250, "epoch": 1602} {"train_loss": -11.287120819091797, "global_step": 269251, "epoch": 1602} {"train_loss": -11.42055892944336, "global_step": 269252, "epoch": 1602} {"train_loss": -11.402399063110352, "global_step": 269253, "epoch": 1602} {"train_loss": -11.710868835449219, "global_step": 269254, "epoch": 1602} {"train_loss": -11.727167129516602, "global_step": 269255, "epoch": 1602} {"train_loss": -12.091085433959961, "global_step": 269256, "epoch": 1602} {"train_loss": -11.47102165222168, "global_step": 269257, "epoch": 1602} {"train_loss": -11.900678634643555, "global_step": 269258, "epoch": 1602} {"train_loss": -11.68851089477539, "global_step": 269259, "epoch": 1602} {"train_loss": -12.07423210144043, "global_step": 269260, "epoch": 1602} {"train_loss": -11.937997817993164, "global_step": 269261, "epoch": 1602} {"train_loss": -11.905689239501953, "global_step": 269262, "epoch": 1602} {"train_loss": -11.990964889526367, "global_step": 269263, "epoch": 1602} {"train_loss": -11.929496765136719, "global_step": 269264, "epoch": 1602} {"train_loss": -11.96847915649414, "global_step": 269265, "epoch": 1602} {"train_loss": -12.069829940795898, "global_step": 269266, "epoch": 1602} {"train_loss": -11.759645462036133, "global_step": 269267, "epoch": 1602} {"train_loss": -12.181471824645996, "global_step": 269268, "epoch": 1602} {"train_loss": -11.963211059570312, "global_step": 269269, "epoch": 1602} {"train_loss": -11.986976623535156, "global_step": 269270, "epoch": 1602} {"train_loss": -11.936065673828125, "global_step": 269271, "epoch": 1602} {"train_loss": -12.172536849975586, "global_step": 269272, "epoch": 1602} {"train_loss": -12.047225952148438, "global_step": 269273, "epoch": 1602} {"train_loss": -12.006168365478516, "global_step": 269274, "epoch": 1602} {"train_loss": -12.207550048828125, "global_step": 269275, "epoch": 1602} {"train_loss": -12.018125534057617, "global_step": 269276, "epoch": 1602} {"train_loss": -11.878641128540039, "global_step": 269277, "epoch": 1602} {"train_loss": -12.23790168762207, "global_step": 269278, "epoch": 1602} {"train_loss": -12.15123176574707, "global_step": 269279, "epoch": 1602} {"train_loss": -12.106460571289062, "global_step": 269280, "epoch": 1602} {"train_loss": -11.921346664428711, "global_step": 269281, "epoch": 1602} {"train_loss": -11.775716781616211, "global_step": 269282, "epoch": 1602} {"train_loss": -11.937217712402344, "global_step": 269283, "epoch": 1602} {"train_loss": -12.045694351196289, "global_step": 269284, "epoch": 1602} {"train_loss": -11.871076583862305, "global_step": 269285, "epoch": 1602} {"train_loss": -11.977703094482422, "global_step": 269286, "epoch": 1602} {"train_loss": -11.798229217529297, "global_step": 269287, "epoch": 1602} {"train_loss": -11.749855995178223, "global_step": 269288, "epoch": 1602} {"train_loss": -12.013578414916992, "global_step": 269289, "epoch": 1602} {"train_loss": -11.686151504516602, "global_step": 269290, "epoch": 1602} {"train_loss": -11.705341339111328, "global_step": 269291, "epoch": 1602} {"train_loss": -11.542646408081055, "global_step": 269292, "epoch": 1602} {"train_loss": -11.021114349365234, "global_step": 269293, "epoch": 1602} {"train_loss": -11.981014251708984, "global_step": 269294, "epoch": 1602} {"train_loss": -11.44909381866455, "global_step": 269295, "epoch": 1602} {"train_loss": -11.857332229614258, "global_step": 269296, "epoch": 1602} {"train_loss": -11.32585620880127, "global_step": 269297, "epoch": 1602} {"train_loss": -11.46716594696045, "global_step": 269298, "epoch": 1602} {"train_loss": -10.915019989013672, "global_step": 269299, "epoch": 1602} {"train_loss": -10.536735534667969, "global_step": 269300, "epoch": 1602} {"train_loss": -11.040016174316406, "global_step": 269301, "epoch": 1602} {"train_loss": -11.26499080657959, "global_step": 269302, "epoch": 1602} {"train_loss": -11.552056079819089, "global_step": 269303, "epoch": 1602, "val_loss": 276945.71875} {"train_loss": -9.053084373474121, "global_step": 269304, "epoch": 1603} {"train_loss": -10.38357162475586, "global_step": 269305, "epoch": 1603} {"train_loss": -10.670574188232422, "global_step": 269306, "epoch": 1603} {"train_loss": -10.07992935180664, "global_step": 269307, "epoch": 1603} {"train_loss": -9.955997467041016, "global_step": 269308, "epoch": 1603} {"train_loss": -10.84141731262207, "global_step": 269309, "epoch": 1603} {"train_loss": -10.637369155883789, "global_step": 269310, "epoch": 1603} {"train_loss": -11.172693252563477, "global_step": 269311, "epoch": 1603} {"train_loss": -10.982688903808594, "global_step": 269312, "epoch": 1603} {"train_loss": -10.701634407043457, "global_step": 269313, "epoch": 1603} {"train_loss": -10.760183334350586, "global_step": 269314, "epoch": 1603} {"train_loss": -10.839115142822266, "global_step": 269315, "epoch": 1603} {"train_loss": -11.332956314086914, "global_step": 269316, "epoch": 1603} {"train_loss": -10.915142059326172, "global_step": 269317, "epoch": 1603} {"train_loss": -11.516358375549316, "global_step": 269318, "epoch": 1603} {"train_loss": -11.505783081054688, "global_step": 269319, "epoch": 1603} {"train_loss": -11.068709373474121, "global_step": 269320, "epoch": 1603} {"train_loss": -11.250591278076172, "global_step": 269321, "epoch": 1603} {"train_loss": -11.12039566040039, "global_step": 269322, "epoch": 1603} {"train_loss": -11.739133834838867, "global_step": 269323, "epoch": 1603} {"train_loss": -11.391369819641113, "global_step": 269324, "epoch": 1603} {"train_loss": -11.64406967163086, "global_step": 269325, "epoch": 1603} {"train_loss": -11.568286895751953, "global_step": 269326, "epoch": 1603} {"train_loss": -11.707503318786621, "global_step": 269327, "epoch": 1603} {"train_loss": -11.694755554199219, "global_step": 269328, "epoch": 1603} {"train_loss": -11.821544647216797, "global_step": 269329, "epoch": 1603} {"train_loss": -11.77022933959961, "global_step": 269330, "epoch": 1603} {"train_loss": -11.753929138183594, "global_step": 269331, "epoch": 1603} {"train_loss": -11.707698822021484, "global_step": 269332, "epoch": 1603} {"train_loss": -12.06089973449707, "global_step": 269333, "epoch": 1603} {"train_loss": -11.844053268432617, "global_step": 269334, "epoch": 1603} {"train_loss": -11.87061882019043, "global_step": 269335, "epoch": 1603} {"train_loss": -11.740713119506836, "global_step": 269336, "epoch": 1603} {"train_loss": -11.799386024475098, "global_step": 269337, "epoch": 1603} {"train_loss": -11.90621566772461, "global_step": 269338, "epoch": 1603} {"train_loss": -12.045095443725586, "global_step": 269339, "epoch": 1603} {"train_loss": -12.122328758239746, "global_step": 269340, "epoch": 1603} {"train_loss": -11.955854415893555, "global_step": 269341, "epoch": 1603} {"train_loss": -11.93940544128418, "global_step": 269342, "epoch": 1603} {"train_loss": -11.639717102050781, "global_step": 269343, "epoch": 1603} {"train_loss": -11.897899627685547, "global_step": 269344, "epoch": 1603} {"train_loss": -12.049165725708008, "global_step": 269345, "epoch": 1603} {"train_loss": -12.028966903686523, "global_step": 269346, "epoch": 1603} {"train_loss": -12.150113105773926, "global_step": 269347, "epoch": 1603} {"train_loss": -11.960817337036133, "global_step": 269348, "epoch": 1603} {"train_loss": -12.207876205444336, "global_step": 269349, "epoch": 1603} {"train_loss": -12.133914947509766, "global_step": 269350, "epoch": 1603} {"train_loss": -12.108518600463867, "global_step": 269351, "epoch": 1603} {"train_loss": -12.19468879699707, "global_step": 269352, "epoch": 1603} {"train_loss": -12.079530715942383, "global_step": 269353, "epoch": 1603} {"train_loss": -11.97749137878418, "global_step": 269354, "epoch": 1603} {"train_loss": -11.869747161865234, "global_step": 269355, "epoch": 1603} {"train_loss": -11.81712532043457, "global_step": 269356, "epoch": 1603} {"train_loss": -11.997184753417969, "global_step": 269357, "epoch": 1603} {"train_loss": -12.078436851501465, "global_step": 269358, "epoch": 1603} {"train_loss": -11.759654998779297, "global_step": 269359, "epoch": 1603} {"train_loss": -11.996694564819336, "global_step": 269360, "epoch": 1603} {"train_loss": -12.035152435302734, "global_step": 269361, "epoch": 1603} {"train_loss": -11.699703216552734, "global_step": 269362, "epoch": 1603} {"train_loss": -12.019208908081055, "global_step": 269363, "epoch": 1603} {"train_loss": -11.646121978759766, "global_step": 269364, "epoch": 1603} {"train_loss": -11.13585376739502, "global_step": 269365, "epoch": 1603} {"train_loss": -11.210394859313965, "global_step": 269366, "epoch": 1603} {"train_loss": -11.2069091796875, "global_step": 269367, "epoch": 1603} {"train_loss": -10.831982612609863, "global_step": 269368, "epoch": 1603} {"train_loss": -11.604728698730469, "global_step": 269369, "epoch": 1603} {"train_loss": -10.360137939453125, "global_step": 269370, "epoch": 1603} {"train_loss": -10.141721725463867, "global_step": 269371, "epoch": 1603} {"train_loss": -9.99028491973877, "global_step": 269372, "epoch": 1603} {"train_loss": -9.81448745727539, "global_step": 269373, "epoch": 1603} {"train_loss": -9.536493301391602, "global_step": 269374, "epoch": 1603} {"train_loss": -9.995115280151367, "global_step": 269375, "epoch": 1603} {"train_loss": -10.108598709106445, "global_step": 269376, "epoch": 1603} {"train_loss": -10.380533218383789, "global_step": 269377, "epoch": 1603} {"train_loss": -10.678784370422363, "global_step": 269378, "epoch": 1603} {"train_loss": -10.403179168701172, "global_step": 269379, "epoch": 1603} {"train_loss": -10.805974960327148, "global_step": 269380, "epoch": 1603} {"train_loss": -10.408576011657715, "global_step": 269381, "epoch": 1603} {"train_loss": -10.991744995117188, "global_step": 269382, "epoch": 1603} {"train_loss": -10.822035789489746, "global_step": 269383, "epoch": 1603} {"train_loss": -11.237632751464844, "global_step": 269384, "epoch": 1603} {"train_loss": -10.785626411437988, "global_step": 269385, "epoch": 1603} {"train_loss": -11.073039054870605, "global_step": 269386, "epoch": 1603} {"train_loss": -11.37863540649414, "global_step": 269387, "epoch": 1603} {"train_loss": -11.341285705566406, "global_step": 269388, "epoch": 1603} {"train_loss": -11.48961067199707, "global_step": 269389, "epoch": 1603} {"train_loss": -11.527910232543945, "global_step": 269390, "epoch": 1603} {"train_loss": -11.424147605895996, "global_step": 269391, "epoch": 1603} {"train_loss": -11.7633638381958, "global_step": 269392, "epoch": 1603} {"train_loss": -11.170171737670898, "global_step": 269393, "epoch": 1603} {"train_loss": -11.555316925048828, "global_step": 269394, "epoch": 1603} {"train_loss": -11.584821701049805, "global_step": 269395, "epoch": 1603} {"train_loss": -11.350801467895508, "global_step": 269396, "epoch": 1603} {"train_loss": -11.720327377319336, "global_step": 269397, "epoch": 1603} {"train_loss": -11.38181209564209, "global_step": 269398, "epoch": 1603} {"train_loss": -11.753658294677734, "global_step": 269399, "epoch": 1603} {"train_loss": -11.774253845214844, "global_step": 269400, "epoch": 1603} {"train_loss": -11.732398986816406, "global_step": 269401, "epoch": 1603} {"train_loss": -11.972458839416504, "global_step": 269402, "epoch": 1603} {"train_loss": -11.89045524597168, "global_step": 269403, "epoch": 1603} {"train_loss": -11.797409057617188, "global_step": 269404, "epoch": 1603} {"train_loss": -12.079083442687988, "global_step": 269405, "epoch": 1603} {"train_loss": -11.693597793579102, "global_step": 269406, "epoch": 1603} {"train_loss": -11.9102783203125, "global_step": 269407, "epoch": 1603} {"train_loss": -11.639845848083496, "global_step": 269408, "epoch": 1603} {"train_loss": -11.813753128051758, "global_step": 269409, "epoch": 1603} {"train_loss": -11.728147506713867, "global_step": 269410, "epoch": 1603} {"train_loss": -12.063337326049805, "global_step": 269411, "epoch": 1603} {"train_loss": -11.779619216918945, "global_step": 269412, "epoch": 1603} {"train_loss": -12.074604034423828, "global_step": 269413, "epoch": 1603} {"train_loss": -11.933023452758789, "global_step": 269414, "epoch": 1603} {"train_loss": -12.178812026977539, "global_step": 269415, "epoch": 1603} {"train_loss": -12.303722381591797, "global_step": 269416, "epoch": 1603} {"train_loss": -11.81644058227539, "global_step": 269417, "epoch": 1603} {"train_loss": -12.069917678833008, "global_step": 269418, "epoch": 1603} {"train_loss": -11.906868934631348, "global_step": 269419, "epoch": 1603} {"train_loss": -12.128440856933594, "global_step": 269420, "epoch": 1603} {"train_loss": -12.088217735290527, "global_step": 269421, "epoch": 1603} {"train_loss": -11.85517692565918, "global_step": 269422, "epoch": 1603} {"train_loss": -12.046987533569336, "global_step": 269423, "epoch": 1603} {"train_loss": -11.830585479736328, "global_step": 269424, "epoch": 1603} {"train_loss": -11.944123268127441, "global_step": 269425, "epoch": 1603} {"train_loss": -11.998900413513184, "global_step": 269426, "epoch": 1603} {"train_loss": -11.940427780151367, "global_step": 269427, "epoch": 1603} {"train_loss": -12.130376815795898, "global_step": 269428, "epoch": 1603} {"train_loss": -11.798917770385742, "global_step": 269429, "epoch": 1603} {"train_loss": -12.02503776550293, "global_step": 269430, "epoch": 1603} {"train_loss": -11.765748023986816, "global_step": 269431, "epoch": 1603} {"train_loss": -12.052478790283203, "global_step": 269432, "epoch": 1603} {"train_loss": -12.158430099487305, "global_step": 269433, "epoch": 1603} {"train_loss": -11.892488479614258, "global_step": 269434, "epoch": 1603} {"train_loss": -12.269392013549805, "global_step": 269435, "epoch": 1603} {"train_loss": -11.820087432861328, "global_step": 269436, "epoch": 1603} {"train_loss": -12.241247177124023, "global_step": 269437, "epoch": 1603} {"train_loss": -11.763020515441895, "global_step": 269438, "epoch": 1603} {"train_loss": -11.613733291625977, "global_step": 269439, "epoch": 1603} {"train_loss": -11.819896697998047, "global_step": 269440, "epoch": 1603} {"train_loss": -11.720113754272461, "global_step": 269441, "epoch": 1603} {"train_loss": -11.953288078308105, "global_step": 269442, "epoch": 1603} {"train_loss": -11.746870994567871, "global_step": 269443, "epoch": 1603} {"train_loss": -11.614618301391602, "global_step": 269444, "epoch": 1603} {"train_loss": -12.110462188720703, "global_step": 269445, "epoch": 1603} {"train_loss": -11.627616882324219, "global_step": 269446, "epoch": 1603} {"train_loss": -11.263752937316895, "global_step": 269447, "epoch": 1603} {"train_loss": -12.170193672180176, "global_step": 269448, "epoch": 1603} {"train_loss": -11.48633861541748, "global_step": 269449, "epoch": 1603} {"train_loss": -10.892553329467773, "global_step": 269450, "epoch": 1603} {"train_loss": -11.971988677978516, "global_step": 269451, "epoch": 1603} {"train_loss": -11.449121475219727, "global_step": 269452, "epoch": 1603} {"train_loss": -11.53792667388916, "global_step": 269453, "epoch": 1603} {"train_loss": -11.615901947021484, "global_step": 269454, "epoch": 1603} {"train_loss": -11.571887969970703, "global_step": 269455, "epoch": 1603} {"train_loss": -11.309459686279297, "global_step": 269456, "epoch": 1603} {"train_loss": -12.15757942199707, "global_step": 269457, "epoch": 1603} {"train_loss": -11.331964492797852, "global_step": 269458, "epoch": 1603} {"train_loss": -12.156469345092773, "global_step": 269459, "epoch": 1603} {"train_loss": -11.466943740844727, "global_step": 269460, "epoch": 1603} {"train_loss": -11.642950057983398, "global_step": 269461, "epoch": 1603} {"train_loss": -12.053699493408203, "global_step": 269462, "epoch": 1603} {"train_loss": -11.7763090133667, "global_step": 269463, "epoch": 1603} {"train_loss": -12.243431091308594, "global_step": 269464, "epoch": 1603} {"train_loss": -11.550294876098633, "global_step": 269465, "epoch": 1603} {"train_loss": -11.688304901123047, "global_step": 269466, "epoch": 1603} {"train_loss": -11.798402786254883, "global_step": 269467, "epoch": 1603} {"train_loss": -11.717447280883789, "global_step": 269468, "epoch": 1603} {"train_loss": -10.283358573913574, "global_step": 269469, "epoch": 1603} {"train_loss": -11.758710861206055, "global_step": 269470, "epoch": 1603} {"train_loss": -11.529151553199405, "global_step": 269471, "epoch": 1603, "val_loss": 275447.71875} {"train_loss": -10.552298545837402, "global_step": 269472, "epoch": 1604} {"train_loss": -11.76057243347168, "global_step": 269473, "epoch": 1604} {"train_loss": -9.871627807617188, "global_step": 269474, "epoch": 1604} {"train_loss": -10.576667785644531, "global_step": 269475, "epoch": 1604} {"train_loss": -10.434717178344727, "global_step": 269476, "epoch": 1604} {"train_loss": -10.459035873413086, "global_step": 269477, "epoch": 1604} {"train_loss": -9.148977279663086, "global_step": 269478, "epoch": 1604} {"train_loss": -11.473804473876953, "global_step": 269479, "epoch": 1604} {"train_loss": -9.97589111328125, "global_step": 269480, "epoch": 1604} {"train_loss": -10.895949363708496, "global_step": 269481, "epoch": 1604} {"train_loss": -11.092975616455078, "global_step": 269482, "epoch": 1604} {"train_loss": -10.198705673217773, "global_step": 269483, "epoch": 1604} {"train_loss": -10.527860641479492, "global_step": 269484, "epoch": 1604} {"train_loss": -11.416258811950684, "global_step": 269485, "epoch": 1604} {"train_loss": -10.576129913330078, "global_step": 269486, "epoch": 1604} {"train_loss": -11.25124740600586, "global_step": 269487, "epoch": 1604} {"train_loss": -11.608539581298828, "global_step": 269488, "epoch": 1604} {"train_loss": -10.917591094970703, "global_step": 269489, "epoch": 1604} {"train_loss": -11.650303840637207, "global_step": 269490, "epoch": 1604} {"train_loss": -10.778435707092285, "global_step": 269491, "epoch": 1604} {"train_loss": -11.428083419799805, "global_step": 269492, "epoch": 1604} {"train_loss": -11.470587730407715, "global_step": 269493, "epoch": 1604} {"train_loss": -11.214946746826172, "global_step": 269494, "epoch": 1604} {"train_loss": -11.66580581665039, "global_step": 269495, "epoch": 1604} {"train_loss": -11.00589370727539, "global_step": 269496, "epoch": 1604} {"train_loss": -10.74706745147705, "global_step": 269497, "epoch": 1604} {"train_loss": -11.210363388061523, "global_step": 269498, "epoch": 1604} {"train_loss": -10.552874565124512, "global_step": 269499, "epoch": 1604} {"train_loss": -11.394984245300293, "global_step": 269500, "epoch": 1604} {"train_loss": -11.170392036437988, "global_step": 269501, "epoch": 1604} {"train_loss": -11.236793518066406, "global_step": 269502, "epoch": 1604} {"train_loss": -11.347635269165039, "global_step": 269503, "epoch": 1604} {"train_loss": -10.473541259765625, "global_step": 269504, "epoch": 1604} {"train_loss": -11.663665771484375, "global_step": 269505, "epoch": 1604} {"train_loss": -10.481752395629883, "global_step": 269506, "epoch": 1604} {"train_loss": -11.406647682189941, "global_step": 269507, "epoch": 1604} {"train_loss": -11.71706771850586, "global_step": 269508, "epoch": 1604} {"train_loss": -11.35359001159668, "global_step": 269509, "epoch": 1604} {"train_loss": -11.74844741821289, "global_step": 269510, "epoch": 1604} {"train_loss": -11.312795639038086, "global_step": 269511, "epoch": 1604} {"train_loss": -11.531587600708008, "global_step": 269512, "epoch": 1604} {"train_loss": -11.62954044342041, "global_step": 269513, "epoch": 1604} {"train_loss": -11.584400177001953, "global_step": 269514, "epoch": 1604} {"train_loss": -11.220638275146484, "global_step": 269515, "epoch": 1604} {"train_loss": -11.72884464263916, "global_step": 269516, "epoch": 1604} {"train_loss": -11.466073989868164, "global_step": 269517, "epoch": 1604} {"train_loss": -12.081016540527344, "global_step": 269518, "epoch": 1604} {"train_loss": -11.738896369934082, "global_step": 269519, "epoch": 1604} {"train_loss": -11.902884483337402, "global_step": 269520, "epoch": 1604} {"train_loss": -11.93515682220459, "global_step": 269521, "epoch": 1604} {"train_loss": -11.694929122924805, "global_step": 269522, "epoch": 1604} {"train_loss": -11.70921802520752, "global_step": 269523, "epoch": 1604} {"train_loss": -11.506131172180176, "global_step": 269524, "epoch": 1604} {"train_loss": -12.02235221862793, "global_step": 269525, "epoch": 1604} {"train_loss": -11.877921104431152, "global_step": 269526, "epoch": 1604} {"train_loss": -11.704619407653809, "global_step": 269527, "epoch": 1604} {"train_loss": -11.890753746032715, "global_step": 269528, "epoch": 1604} {"train_loss": -11.743060111999512, "global_step": 269529, "epoch": 1604} {"train_loss": -11.847481727600098, "global_step": 269530, "epoch": 1604} {"train_loss": -11.740549087524414, "global_step": 269531, "epoch": 1604} {"train_loss": -11.887832641601562, "global_step": 269532, "epoch": 1604} {"train_loss": -11.971534729003906, "global_step": 269533, "epoch": 1604} {"train_loss": -11.811514854431152, "global_step": 269534, "epoch": 1604} {"train_loss": -12.207587242126465, "global_step": 269535, "epoch": 1604} {"train_loss": -11.950532913208008, "global_step": 269536, "epoch": 1604} {"train_loss": -11.773225784301758, "global_step": 269537, "epoch": 1604} {"train_loss": -12.145357131958008, "global_step": 269538, "epoch": 1604} {"train_loss": -12.014582633972168, "global_step": 269539, "epoch": 1604} {"train_loss": -12.027763366699219, "global_step": 269540, "epoch": 1604} {"train_loss": -12.153105735778809, "global_step": 269541, "epoch": 1604} {"train_loss": -11.940486907958984, "global_step": 269542, "epoch": 1604} {"train_loss": -12.034435272216797, "global_step": 269543, "epoch": 1604} {"train_loss": -12.090814590454102, "global_step": 269544, "epoch": 1604} {"train_loss": -12.070291519165039, "global_step": 269545, "epoch": 1604} {"train_loss": -12.03892993927002, "global_step": 269546, "epoch": 1604} {"train_loss": -11.792181015014648, "global_step": 269547, "epoch": 1604} {"train_loss": -12.095808029174805, "global_step": 269548, "epoch": 1604} {"train_loss": -12.300582885742188, "global_step": 269549, "epoch": 1604} {"train_loss": -12.31550407409668, "global_step": 269550, "epoch": 1604} {"train_loss": -12.137578964233398, "global_step": 269551, "epoch": 1604} {"train_loss": -12.196308135986328, "global_step": 269552, "epoch": 1604} {"train_loss": -12.343626022338867, "global_step": 269553, "epoch": 1604} {"train_loss": -11.965437889099121, "global_step": 269554, "epoch": 1604} {"train_loss": -12.328056335449219, "global_step": 269555, "epoch": 1604} {"train_loss": -12.283767700195312, "global_step": 269556, "epoch": 1604} {"train_loss": -12.225985527038574, "global_step": 269557, "epoch": 1604} {"train_loss": -12.296685218811035, "global_step": 269558, "epoch": 1604} {"train_loss": -12.280168533325195, "global_step": 269559, "epoch": 1604} {"train_loss": -12.353348731994629, "global_step": 269560, "epoch": 1604} {"train_loss": -12.291284561157227, "global_step": 269561, "epoch": 1604} {"train_loss": -12.373312950134277, "global_step": 269562, "epoch": 1604} {"train_loss": -12.328938484191895, "global_step": 269563, "epoch": 1604} {"train_loss": -12.35116195678711, "global_step": 269564, "epoch": 1604} {"train_loss": -12.391461372375488, "global_step": 269565, "epoch": 1604} {"train_loss": -12.416316986083984, "global_step": 269566, "epoch": 1604} {"train_loss": -12.336490631103516, "global_step": 269567, "epoch": 1604} {"train_loss": -12.434791564941406, "global_step": 269568, "epoch": 1604} {"train_loss": -12.47005558013916, "global_step": 269569, "epoch": 1604} {"train_loss": -12.257476806640625, "global_step": 269570, "epoch": 1604} {"train_loss": -12.461323738098145, "global_step": 269571, "epoch": 1604} {"train_loss": -12.323593139648438, "global_step": 269572, "epoch": 1604} {"train_loss": -12.56568717956543, "global_step": 269573, "epoch": 1604} {"train_loss": -12.237634658813477, "global_step": 269574, "epoch": 1604} {"train_loss": -12.448501586914062, "global_step": 269575, "epoch": 1604} {"train_loss": -12.299602508544922, "global_step": 269576, "epoch": 1604} {"train_loss": -12.375816345214844, "global_step": 269577, "epoch": 1604} {"train_loss": -12.164544105529785, "global_step": 269578, "epoch": 1604} {"train_loss": -12.296285629272461, "global_step": 269579, "epoch": 1604} {"train_loss": -12.551128387451172, "global_step": 269580, "epoch": 1604} {"train_loss": -12.598485946655273, "global_step": 269581, "epoch": 1604} {"train_loss": -12.455147743225098, "global_step": 269582, "epoch": 1604} {"train_loss": -12.180868148803711, "global_step": 269583, "epoch": 1604} {"train_loss": -12.3513765335083, "global_step": 269584, "epoch": 1604} {"train_loss": -12.24643611907959, "global_step": 269585, "epoch": 1604} {"train_loss": -11.798116683959961, "global_step": 269586, "epoch": 1604} {"train_loss": -11.40428638458252, "global_step": 269587, "epoch": 1604} {"train_loss": -10.562228202819824, "global_step": 269588, "epoch": 1604} {"train_loss": -10.904598236083984, "global_step": 269589, "epoch": 1604} {"train_loss": -11.82618522644043, "global_step": 269590, "epoch": 1604} {"train_loss": -11.959755897521973, "global_step": 269591, "epoch": 1604} {"train_loss": -11.756722450256348, "global_step": 269592, "epoch": 1604} {"train_loss": -11.243179321289062, "global_step": 269593, "epoch": 1604} {"train_loss": -11.877243041992188, "global_step": 269594, "epoch": 1604} {"train_loss": -11.612600326538086, "global_step": 269595, "epoch": 1604} {"train_loss": -11.951813697814941, "global_step": 269596, "epoch": 1604} {"train_loss": -11.43238353729248, "global_step": 269597, "epoch": 1604} {"train_loss": -11.141733169555664, "global_step": 269598, "epoch": 1604} {"train_loss": -8.987360000610352, "global_step": 269599, "epoch": 1604} {"train_loss": -11.16783332824707, "global_step": 269600, "epoch": 1604} {"train_loss": -11.409453392028809, "global_step": 269601, "epoch": 1604} {"train_loss": -10.614053726196289, "global_step": 269602, "epoch": 1604} {"train_loss": -9.891494750976562, "global_step": 269603, "epoch": 1604} {"train_loss": -11.058538436889648, "global_step": 269604, "epoch": 1604} {"train_loss": -9.040656089782715, "global_step": 269605, "epoch": 1604} {"train_loss": -10.973453521728516, "global_step": 269606, "epoch": 1604} {"train_loss": -9.62801742553711, "global_step": 269607, "epoch": 1604} {"train_loss": -10.536176681518555, "global_step": 269608, "epoch": 1604} {"train_loss": -10.321146011352539, "global_step": 269609, "epoch": 1604} {"train_loss": -10.327808380126953, "global_step": 269610, "epoch": 1604} {"train_loss": -9.583805084228516, "global_step": 269611, "epoch": 1604} {"train_loss": -8.52241039276123, "global_step": 269612, "epoch": 1604} {"train_loss": -10.090991973876953, "global_step": 269613, "epoch": 1604} {"train_loss": -10.099811553955078, "global_step": 269614, "epoch": 1604} {"train_loss": -9.717545509338379, "global_step": 269615, "epoch": 1604} {"train_loss": -9.866034507751465, "global_step": 269616, "epoch": 1604} {"train_loss": -9.651388168334961, "global_step": 269617, "epoch": 1604} {"train_loss": -10.338692665100098, "global_step": 269618, "epoch": 1604} {"train_loss": -10.13884162902832, "global_step": 269619, "epoch": 1604} {"train_loss": -11.319307327270508, "global_step": 269620, "epoch": 1604} {"train_loss": -10.502336502075195, "global_step": 269621, "epoch": 1604} {"train_loss": -11.105775833129883, "global_step": 269622, "epoch": 1604} {"train_loss": -10.809283256530762, "global_step": 269623, "epoch": 1604} {"train_loss": -10.882722854614258, "global_step": 269624, "epoch": 1604} {"train_loss": -10.82241439819336, "global_step": 269625, "epoch": 1604} {"train_loss": -10.73209285736084, "global_step": 269626, "epoch": 1604} {"train_loss": -10.960359573364258, "global_step": 269627, "epoch": 1604} {"train_loss": -11.373147964477539, "global_step": 269628, "epoch": 1604} {"train_loss": -11.008986473083496, "global_step": 269629, "epoch": 1604} {"train_loss": -11.469058990478516, "global_step": 269630, "epoch": 1604} {"train_loss": -11.001480102539062, "global_step": 269631, "epoch": 1604} {"train_loss": -10.920405387878418, "global_step": 269632, "epoch": 1604} {"train_loss": -11.13461971282959, "global_step": 269633, "epoch": 1604} {"train_loss": -11.385154724121094, "global_step": 269634, "epoch": 1604} {"train_loss": -11.541060447692871, "global_step": 269635, "epoch": 1604} {"train_loss": -11.846187591552734, "global_step": 269636, "epoch": 1604} {"train_loss": -11.295266151428223, "global_step": 269637, "epoch": 1604} {"train_loss": -11.521790504455566, "global_step": 269638, "epoch": 1604} {"train_loss": -11.423869632539295, "global_step": 269639, "epoch": 1604, "val_loss": 275151.40625} {"train_loss": -11.610050201416016, "global_step": 269640, "epoch": 1605} {"train_loss": -11.771166801452637, "global_step": 269641, "epoch": 1605} {"train_loss": -11.333370208740234, "global_step": 269642, "epoch": 1605} {"train_loss": -11.65218448638916, "global_step": 269643, "epoch": 1605} {"train_loss": -11.516618728637695, "global_step": 269644, "epoch": 1605} {"train_loss": -11.965767860412598, "global_step": 269645, "epoch": 1605} {"train_loss": -11.479002952575684, "global_step": 269646, "epoch": 1605} {"train_loss": -11.813166618347168, "global_step": 269647, "epoch": 1605} {"train_loss": -11.79342269897461, "global_step": 269648, "epoch": 1605} {"train_loss": -11.874547004699707, "global_step": 269649, "epoch": 1605} {"train_loss": -11.813125610351562, "global_step": 269650, "epoch": 1605} {"train_loss": -11.733750343322754, "global_step": 269651, "epoch": 1605} {"train_loss": -11.666206359863281, "global_step": 269652, "epoch": 1605} {"train_loss": -11.897546768188477, "global_step": 269653, "epoch": 1605} {"train_loss": -11.925713539123535, "global_step": 269654, "epoch": 1605} {"train_loss": -11.917877197265625, "global_step": 269655, "epoch": 1605} {"train_loss": -11.951773643493652, "global_step": 269656, "epoch": 1605} {"train_loss": -11.942424774169922, "global_step": 269657, "epoch": 1605} {"train_loss": -11.86527156829834, "global_step": 269658, "epoch": 1605} {"train_loss": -11.911334037780762, "global_step": 269659, "epoch": 1605} {"train_loss": -11.886085510253906, "global_step": 269660, "epoch": 1605} {"train_loss": -11.734695434570312, "global_step": 269661, "epoch": 1605} {"train_loss": -11.795825958251953, "global_step": 269662, "epoch": 1605} {"train_loss": -12.115911483764648, "global_step": 269663, "epoch": 1605} {"train_loss": -11.92049789428711, "global_step": 269664, "epoch": 1605} {"train_loss": -11.939682960510254, "global_step": 269665, "epoch": 1605} {"train_loss": -12.164422988891602, "global_step": 269666, "epoch": 1605} {"train_loss": -12.07302474975586, "global_step": 269667, "epoch": 1605} {"train_loss": -12.227351188659668, "global_step": 269668, "epoch": 1605} {"train_loss": -12.072002410888672, "global_step": 269669, "epoch": 1605} {"train_loss": -12.0576171875, "global_step": 269670, "epoch": 1605} {"train_loss": -12.19006061553955, "global_step": 269671, "epoch": 1605} {"train_loss": -12.055624008178711, "global_step": 269672, "epoch": 1605} {"train_loss": -12.259607315063477, "global_step": 269673, "epoch": 1605} {"train_loss": -12.07132339477539, "global_step": 269674, "epoch": 1605} {"train_loss": -12.156839370727539, "global_step": 269675, "epoch": 1605} {"train_loss": -12.15275764465332, "global_step": 269676, "epoch": 1605} {"train_loss": -11.860630989074707, "global_step": 269677, "epoch": 1605} {"train_loss": -12.2406587600708, "global_step": 269678, "epoch": 1605} {"train_loss": -12.074353218078613, "global_step": 269679, "epoch": 1605} {"train_loss": -12.123624801635742, "global_step": 269680, "epoch": 1605} {"train_loss": -11.877408981323242, "global_step": 269681, "epoch": 1605} {"train_loss": -11.87637710571289, "global_step": 269682, "epoch": 1605} {"train_loss": -12.29751968383789, "global_step": 269683, "epoch": 1605} {"train_loss": -12.022092819213867, "global_step": 269684, "epoch": 1605} {"train_loss": -12.248138427734375, "global_step": 269685, "epoch": 1605} {"train_loss": -12.023683547973633, "global_step": 269686, "epoch": 1605} {"train_loss": -12.180304527282715, "global_step": 269687, "epoch": 1605} {"train_loss": -12.013081550598145, "global_step": 269688, "epoch": 1605} {"train_loss": -12.168476104736328, "global_step": 269689, "epoch": 1605} {"train_loss": -12.019795417785645, "global_step": 269690, "epoch": 1605} {"train_loss": -12.148022651672363, "global_step": 269691, "epoch": 1605} {"train_loss": -11.840544700622559, "global_step": 269692, "epoch": 1605} {"train_loss": -11.929086685180664, "global_step": 269693, "epoch": 1605} {"train_loss": -11.96101188659668, "global_step": 269694, "epoch": 1605} {"train_loss": -11.838332176208496, "global_step": 269695, "epoch": 1605} {"train_loss": -11.685768127441406, "global_step": 269696, "epoch": 1605} {"train_loss": -11.000621795654297, "global_step": 269697, "epoch": 1605} {"train_loss": -12.188169479370117, "global_step": 269698, "epoch": 1605} {"train_loss": -11.428050994873047, "global_step": 269699, "epoch": 1605} {"train_loss": -11.567190170288086, "global_step": 269700, "epoch": 1605} {"train_loss": -10.980182647705078, "global_step": 269701, "epoch": 1605} {"train_loss": -12.089221000671387, "global_step": 269702, "epoch": 1605} {"train_loss": -11.527814865112305, "global_step": 269703, "epoch": 1605} {"train_loss": -11.216630935668945, "global_step": 269704, "epoch": 1605} {"train_loss": -10.666082382202148, "global_step": 269705, "epoch": 1605} {"train_loss": -11.331130981445312, "global_step": 269706, "epoch": 1605} {"train_loss": -10.19235897064209, "global_step": 269707, "epoch": 1605} {"train_loss": -11.507013320922852, "global_step": 269708, "epoch": 1605} {"train_loss": -11.064289093017578, "global_step": 269709, "epoch": 1605} {"train_loss": -10.9514741897583, "global_step": 269710, "epoch": 1605} {"train_loss": -11.400287628173828, "global_step": 269711, "epoch": 1605} {"train_loss": -9.276285171508789, "global_step": 269712, "epoch": 1605} {"train_loss": -11.41797924041748, "global_step": 269713, "epoch": 1605} {"train_loss": -9.92654037475586, "global_step": 269714, "epoch": 1605} {"train_loss": -10.115352630615234, "global_step": 269715, "epoch": 1605} {"train_loss": -10.057685852050781, "global_step": 269716, "epoch": 1605} {"train_loss": -10.903846740722656, "global_step": 269717, "epoch": 1605} {"train_loss": -10.757129669189453, "global_step": 269718, "epoch": 1605} {"train_loss": -11.089387893676758, "global_step": 269719, "epoch": 1605} {"train_loss": -9.929271697998047, "global_step": 269720, "epoch": 1605} {"train_loss": -11.074838638305664, "global_step": 269721, "epoch": 1605} {"train_loss": -10.247002601623535, "global_step": 269722, "epoch": 1605} {"train_loss": -11.081414222717285, "global_step": 269723, "epoch": 1605} {"train_loss": -11.814119338989258, "global_step": 269724, "epoch": 1605} {"train_loss": -10.670230865478516, "global_step": 269725, "epoch": 1605} {"train_loss": -11.71371841430664, "global_step": 269726, "epoch": 1605} {"train_loss": -11.280157089233398, "global_step": 269727, "epoch": 1605} {"train_loss": -11.737037658691406, "global_step": 269728, "epoch": 1605} {"train_loss": -11.796034812927246, "global_step": 269729, "epoch": 1605} {"train_loss": -11.536059379577637, "global_step": 269730, "epoch": 1605} {"train_loss": -11.664165496826172, "global_step": 269731, "epoch": 1605} {"train_loss": -11.472166061401367, "global_step": 269732, "epoch": 1605} {"train_loss": -11.865448951721191, "global_step": 269733, "epoch": 1605} {"train_loss": -12.001531600952148, "global_step": 269734, "epoch": 1605} {"train_loss": -11.799708366394043, "global_step": 269735, "epoch": 1605} {"train_loss": -11.85831069946289, "global_step": 269736, "epoch": 1605} {"train_loss": -11.603486061096191, "global_step": 269737, "epoch": 1605} {"train_loss": -11.847250938415527, "global_step": 269738, "epoch": 1605} {"train_loss": -11.99244499206543, "global_step": 269739, "epoch": 1605} {"train_loss": -11.952534675598145, "global_step": 269740, "epoch": 1605} {"train_loss": -12.090788841247559, "global_step": 269741, "epoch": 1605} {"train_loss": -11.768933296203613, "global_step": 269742, "epoch": 1605} {"train_loss": -12.08377456665039, "global_step": 269743, "epoch": 1605} {"train_loss": -12.092264175415039, "global_step": 269744, "epoch": 1605} {"train_loss": -12.00324821472168, "global_step": 269745, "epoch": 1605} {"train_loss": -11.874568939208984, "global_step": 269746, "epoch": 1605} {"train_loss": -11.789103507995605, "global_step": 269747, "epoch": 1605} {"train_loss": -12.013656616210938, "global_step": 269748, "epoch": 1605} {"train_loss": -11.76202392578125, "global_step": 269749, "epoch": 1605} {"train_loss": -11.925878524780273, "global_step": 269750, "epoch": 1605} {"train_loss": -11.74022102355957, "global_step": 269751, "epoch": 1605} {"train_loss": -11.972808837890625, "global_step": 269752, "epoch": 1605} {"train_loss": -12.06753921508789, "global_step": 269753, "epoch": 1605} {"train_loss": -11.899490356445312, "global_step": 269754, "epoch": 1605} {"train_loss": -11.943673133850098, "global_step": 269755, "epoch": 1605} {"train_loss": -11.95555591583252, "global_step": 269756, "epoch": 1605} {"train_loss": -11.875923156738281, "global_step": 269757, "epoch": 1605} {"train_loss": -12.045315742492676, "global_step": 269758, "epoch": 1605} {"train_loss": -11.921239852905273, "global_step": 269759, "epoch": 1605} {"train_loss": -11.905000686645508, "global_step": 269760, "epoch": 1605} {"train_loss": -12.02310562133789, "global_step": 269761, "epoch": 1605} {"train_loss": -12.05634880065918, "global_step": 269762, "epoch": 1605} {"train_loss": -12.163799285888672, "global_step": 269763, "epoch": 1605} {"train_loss": -12.15458869934082, "global_step": 269764, "epoch": 1605} {"train_loss": -12.21425724029541, "global_step": 269765, "epoch": 1605} {"train_loss": -12.105734825134277, "global_step": 269766, "epoch": 1605} {"train_loss": -12.096261978149414, "global_step": 269767, "epoch": 1605} {"train_loss": -12.009431838989258, "global_step": 269768, "epoch": 1605} {"train_loss": -12.111680030822754, "global_step": 269769, "epoch": 1605} {"train_loss": -11.916783332824707, "global_step": 269770, "epoch": 1605} {"train_loss": -12.11447811126709, "global_step": 269771, "epoch": 1605} {"train_loss": -11.997096061706543, "global_step": 269772, "epoch": 1605} {"train_loss": -12.005380630493164, "global_step": 269773, "epoch": 1605} {"train_loss": -12.205207824707031, "global_step": 269774, "epoch": 1605} {"train_loss": -11.997562408447266, "global_step": 269775, "epoch": 1605} {"train_loss": -12.134674072265625, "global_step": 269776, "epoch": 1605} {"train_loss": -12.232102394104004, "global_step": 269777, "epoch": 1605} {"train_loss": -11.999616622924805, "global_step": 269778, "epoch": 1605} {"train_loss": -12.169086456298828, "global_step": 269779, "epoch": 1605} {"train_loss": -12.048300743103027, "global_step": 269780, "epoch": 1605} {"train_loss": -12.119102478027344, "global_step": 269781, "epoch": 1605} {"train_loss": -12.134723663330078, "global_step": 269782, "epoch": 1605} {"train_loss": -11.982523918151855, "global_step": 269783, "epoch": 1605} {"train_loss": -11.871186256408691, "global_step": 269784, "epoch": 1605} {"train_loss": -12.354758262634277, "global_step": 269785, "epoch": 1605} {"train_loss": -11.85138988494873, "global_step": 269786, "epoch": 1605} {"train_loss": -12.244400978088379, "global_step": 269787, "epoch": 1605} {"train_loss": -12.037113189697266, "global_step": 269788, "epoch": 1605} {"train_loss": -12.355865478515625, "global_step": 269789, "epoch": 1605} {"train_loss": -12.106413841247559, "global_step": 269790, "epoch": 1605} {"train_loss": -12.292121887207031, "global_step": 269791, "epoch": 1605} {"train_loss": -12.352546691894531, "global_step": 269792, "epoch": 1605} {"train_loss": -12.097175598144531, "global_step": 269793, "epoch": 1605} {"train_loss": -12.230470657348633, "global_step": 269794, "epoch": 1605} {"train_loss": -11.962738037109375, "global_step": 269795, "epoch": 1605} {"train_loss": -12.179189682006836, "global_step": 269796, "epoch": 1605} {"train_loss": -12.247516632080078, "global_step": 269797, "epoch": 1605} {"train_loss": -12.158202171325684, "global_step": 269798, "epoch": 1605} {"train_loss": -12.150859832763672, "global_step": 269799, "epoch": 1605} {"train_loss": -11.70197868347168, "global_step": 269800, "epoch": 1605} {"train_loss": -11.756484985351562, "global_step": 269801, "epoch": 1605} {"train_loss": -11.107487678527832, "global_step": 269802, "epoch": 1605} {"train_loss": -10.141494750976562, "global_step": 269803, "epoch": 1605} {"train_loss": -10.920232772827148, "global_step": 269804, "epoch": 1605} {"train_loss": -11.506568908691406, "global_step": 269805, "epoch": 1605} {"train_loss": -10.361108779907227, "global_step": 269806, "epoch": 1605} {"train_loss": -11.738158907209124, "global_step": 269807, "epoch": 1605, "val_loss": 274505.40625, "train_action_mse_error": 1.9938249588012695} {"train_loss": -11.270271301269531, "global_step": 269808, "epoch": 1606} {"train_loss": -8.13828182220459, "global_step": 269809, "epoch": 1606} {"train_loss": -7.249284744262695, "global_step": 269810, "epoch": 1606} {"train_loss": -7.111326217651367, "global_step": 269811, "epoch": 1606} {"train_loss": -7.006451606750488, "global_step": 269812, "epoch": 1606} {"train_loss": -7.492832183837891, "global_step": 269813, "epoch": 1606} {"train_loss": -9.797520637512207, "global_step": 269814, "epoch": 1606} {"train_loss": -5.757117748260498, "global_step": 269815, "epoch": 1606} {"train_loss": -6.702578544616699, "global_step": 269816, "epoch": 1606} {"train_loss": -5.841741561889648, "global_step": 269817, "epoch": 1606} {"train_loss": -5.639781951904297, "global_step": 269818, "epoch": 1606} {"train_loss": -6.051972389221191, "global_step": 269819, "epoch": 1606} {"train_loss": -5.536623477935791, "global_step": 269820, "epoch": 1606} {"train_loss": -5.9523725509643555, "global_step": 269821, "epoch": 1606} {"train_loss": -6.759130001068115, "global_step": 269822, "epoch": 1606} {"train_loss": -7.818206310272217, "global_step": 269823, "epoch": 1606} {"train_loss": -7.001866340637207, "global_step": 269824, "epoch": 1606} {"train_loss": -7.546040058135986, "global_step": 269825, "epoch": 1606} {"train_loss": -7.473114013671875, "global_step": 269826, "epoch": 1606} {"train_loss": -7.885939121246338, "global_step": 269827, "epoch": 1606} {"train_loss": -8.259969711303711, "global_step": 269828, "epoch": 1606} {"train_loss": -6.769493103027344, "global_step": 269829, "epoch": 1606} {"train_loss": -8.063419342041016, "global_step": 269830, "epoch": 1606} {"train_loss": -7.720787525177002, "global_step": 269831, "epoch": 1606} {"train_loss": -8.281412124633789, "global_step": 269832, "epoch": 1606} {"train_loss": -9.204593658447266, "global_step": 269833, "epoch": 1606} {"train_loss": -9.110198974609375, "global_step": 269834, "epoch": 1606} {"train_loss": -8.69742202758789, "global_step": 269835, "epoch": 1606} {"train_loss": -9.650976181030273, "global_step": 269836, "epoch": 1606} {"train_loss": -9.392358779907227, "global_step": 269837, "epoch": 1606} {"train_loss": -9.869216918945312, "global_step": 269838, "epoch": 1606} {"train_loss": -10.39798355102539, "global_step": 269839, "epoch": 1606} {"train_loss": -10.41444206237793, "global_step": 269840, "epoch": 1606} {"train_loss": -10.763534545898438, "global_step": 269841, "epoch": 1606} {"train_loss": -10.582094192504883, "global_step": 269842, "epoch": 1606} {"train_loss": -10.633913040161133, "global_step": 269843, "epoch": 1606} {"train_loss": -10.791435241699219, "global_step": 269844, "epoch": 1606} {"train_loss": -10.767868995666504, "global_step": 269845, "epoch": 1606} {"train_loss": -10.728033065795898, "global_step": 269846, "epoch": 1606} {"train_loss": -10.944491386413574, "global_step": 269847, "epoch": 1606} {"train_loss": -10.974668502807617, "global_step": 269848, "epoch": 1606} {"train_loss": -11.06405258178711, "global_step": 269849, "epoch": 1606} {"train_loss": -11.068787574768066, "global_step": 269850, "epoch": 1606} {"train_loss": -10.86562442779541, "global_step": 269851, "epoch": 1606} {"train_loss": -11.265825271606445, "global_step": 269852, "epoch": 1606} {"train_loss": -11.086647987365723, "global_step": 269853, "epoch": 1606} {"train_loss": -11.377388000488281, "global_step": 269854, "epoch": 1606} {"train_loss": -11.316079139709473, "global_step": 269855, "epoch": 1606} {"train_loss": -11.519920349121094, "global_step": 269856, "epoch": 1606} {"train_loss": -11.105329513549805, "global_step": 269857, "epoch": 1606} {"train_loss": -11.25415325164795, "global_step": 269858, "epoch": 1606} {"train_loss": -11.152652740478516, "global_step": 269859, "epoch": 1606} {"train_loss": -11.600502014160156, "global_step": 269860, "epoch": 1606} {"train_loss": -11.386637687683105, "global_step": 269861, "epoch": 1606} {"train_loss": -11.631717681884766, "global_step": 269862, "epoch": 1606} {"train_loss": -11.43309211730957, "global_step": 269863, "epoch": 1606} {"train_loss": -11.33741569519043, "global_step": 269864, "epoch": 1606} {"train_loss": -11.063681602478027, "global_step": 269865, "epoch": 1606} {"train_loss": -11.355796813964844, "global_step": 269866, "epoch": 1606} {"train_loss": -11.62115478515625, "global_step": 269867, "epoch": 1606} {"train_loss": -11.600533485412598, "global_step": 269868, "epoch": 1606} {"train_loss": -11.471700668334961, "global_step": 269869, "epoch": 1606} {"train_loss": -11.005548477172852, "global_step": 269870, "epoch": 1606} {"train_loss": -11.433555603027344, "global_step": 269871, "epoch": 1606} {"train_loss": -11.472167015075684, "global_step": 269872, "epoch": 1606} {"train_loss": -11.705390930175781, "global_step": 269873, "epoch": 1606} {"train_loss": -11.820796966552734, "global_step": 269874, "epoch": 1606} {"train_loss": -11.760049819946289, "global_step": 269875, "epoch": 1606} {"train_loss": -11.871126174926758, "global_step": 269876, "epoch": 1606} {"train_loss": -11.688287734985352, "global_step": 269877, "epoch": 1606} {"train_loss": -11.754291534423828, "global_step": 269878, "epoch": 1606} {"train_loss": -11.697430610656738, "global_step": 269879, "epoch": 1606} {"train_loss": -11.73707103729248, "global_step": 269880, "epoch": 1606} {"train_loss": -12.024333953857422, "global_step": 269881, "epoch": 1606} {"train_loss": -11.751385688781738, "global_step": 269882, "epoch": 1606} {"train_loss": -11.982234954833984, "global_step": 269883, "epoch": 1606} {"train_loss": -11.642951011657715, "global_step": 269884, "epoch": 1606} {"train_loss": -11.824773788452148, "global_step": 269885, "epoch": 1606} {"train_loss": -12.034928321838379, "global_step": 269886, "epoch": 1606} {"train_loss": -12.007874488830566, "global_step": 269887, "epoch": 1606} {"train_loss": -11.863304138183594, "global_step": 269888, "epoch": 1606} {"train_loss": -11.98137092590332, "global_step": 269889, "epoch": 1606} {"train_loss": -11.873265266418457, "global_step": 269890, "epoch": 1606} {"train_loss": -11.879267692565918, "global_step": 269891, "epoch": 1606} {"train_loss": -12.003667831420898, "global_step": 269892, "epoch": 1606} {"train_loss": -11.726835250854492, "global_step": 269893, "epoch": 1606} {"train_loss": -12.071081161499023, "global_step": 269894, "epoch": 1606} {"train_loss": -12.008346557617188, "global_step": 269895, "epoch": 1606} {"train_loss": -11.919881820678711, "global_step": 269896, "epoch": 1606} {"train_loss": -12.019886016845703, "global_step": 269897, "epoch": 1606} {"train_loss": -12.12510871887207, "global_step": 269898, "epoch": 1606} {"train_loss": -11.945505142211914, "global_step": 269899, "epoch": 1606} {"train_loss": -12.237886428833008, "global_step": 269900, "epoch": 1606} {"train_loss": -11.93307113647461, "global_step": 269901, "epoch": 1606} {"train_loss": -12.09339427947998, "global_step": 269902, "epoch": 1606} {"train_loss": -11.815603256225586, "global_step": 269903, "epoch": 1606} {"train_loss": -12.139982223510742, "global_step": 269904, "epoch": 1606} {"train_loss": -11.977240562438965, "global_step": 269905, "epoch": 1606} {"train_loss": -11.759371757507324, "global_step": 269906, "epoch": 1606} {"train_loss": -12.061075210571289, "global_step": 269907, "epoch": 1606} {"train_loss": -11.847461700439453, "global_step": 269908, "epoch": 1606} {"train_loss": -11.989753723144531, "global_step": 269909, "epoch": 1606} {"train_loss": -12.07066822052002, "global_step": 269910, "epoch": 1606} {"train_loss": -11.820695877075195, "global_step": 269911, "epoch": 1606} {"train_loss": -11.965871810913086, "global_step": 269912, "epoch": 1606} {"train_loss": -12.049308776855469, "global_step": 269913, "epoch": 1606} {"train_loss": -11.289130210876465, "global_step": 269914, "epoch": 1606} {"train_loss": -12.139463424682617, "global_step": 269915, "epoch": 1606} {"train_loss": -11.452580451965332, "global_step": 269916, "epoch": 1606} {"train_loss": -10.656700134277344, "global_step": 269917, "epoch": 1606} {"train_loss": -11.76750373840332, "global_step": 269918, "epoch": 1606} {"train_loss": -11.16573715209961, "global_step": 269919, "epoch": 1606} {"train_loss": -10.845526695251465, "global_step": 269920, "epoch": 1606} {"train_loss": -10.552118301391602, "global_step": 269921, "epoch": 1606} {"train_loss": -10.525010108947754, "global_step": 269922, "epoch": 1606} {"train_loss": -10.134389877319336, "global_step": 269923, "epoch": 1606} {"train_loss": -10.947922706604004, "global_step": 269924, "epoch": 1606} {"train_loss": -10.380308151245117, "global_step": 269925, "epoch": 1606} {"train_loss": -10.81248664855957, "global_step": 269926, "epoch": 1606} {"train_loss": -10.82234001159668, "global_step": 269927, "epoch": 1606} {"train_loss": -10.545138359069824, "global_step": 269928, "epoch": 1606} {"train_loss": -11.466387748718262, "global_step": 269929, "epoch": 1606} {"train_loss": -10.583362579345703, "global_step": 269930, "epoch": 1606} {"train_loss": -11.356653213500977, "global_step": 269931, "epoch": 1606} {"train_loss": -9.086528778076172, "global_step": 269932, "epoch": 1606} {"train_loss": -11.176065444946289, "global_step": 269933, "epoch": 1606} {"train_loss": -10.531221389770508, "global_step": 269934, "epoch": 1606} {"train_loss": -10.426237106323242, "global_step": 269935, "epoch": 1606} {"train_loss": -8.736125946044922, "global_step": 269936, "epoch": 1606} {"train_loss": -10.106888771057129, "global_step": 269937, "epoch": 1606} {"train_loss": -8.419292449951172, "global_step": 269938, "epoch": 1606} {"train_loss": -10.646876335144043, "global_step": 269939, "epoch": 1606} {"train_loss": -8.9454345703125, "global_step": 269940, "epoch": 1606} {"train_loss": -9.433286666870117, "global_step": 269941, "epoch": 1606} {"train_loss": -10.264444351196289, "global_step": 269942, "epoch": 1606} {"train_loss": -9.044692039489746, "global_step": 269943, "epoch": 1606} {"train_loss": -11.291460037231445, "global_step": 269944, "epoch": 1606} {"train_loss": -8.600177764892578, "global_step": 269945, "epoch": 1606} {"train_loss": -10.164178848266602, "global_step": 269946, "epoch": 1606} {"train_loss": -9.542787551879883, "global_step": 269947, "epoch": 1606} {"train_loss": -10.48045539855957, "global_step": 269948, "epoch": 1606} {"train_loss": -9.621415138244629, "global_step": 269949, "epoch": 1606} {"train_loss": -9.338232040405273, "global_step": 269950, "epoch": 1606} {"train_loss": -11.178672790527344, "global_step": 269951, "epoch": 1606} {"train_loss": -10.003108978271484, "global_step": 269952, "epoch": 1606} {"train_loss": -10.119386672973633, "global_step": 269953, "epoch": 1606} {"train_loss": -11.025094985961914, "global_step": 269954, "epoch": 1606} {"train_loss": -10.739334106445312, "global_step": 269955, "epoch": 1606} {"train_loss": -10.396160125732422, "global_step": 269956, "epoch": 1606} {"train_loss": -11.102550506591797, "global_step": 269957, "epoch": 1606} {"train_loss": -10.316402435302734, "global_step": 269958, "epoch": 1606} {"train_loss": -11.52901554107666, "global_step": 269959, "epoch": 1606} {"train_loss": -10.49027156829834, "global_step": 269960, "epoch": 1606} {"train_loss": -11.273494720458984, "global_step": 269961, "epoch": 1606} {"train_loss": -10.788074493408203, "global_step": 269962, "epoch": 1606} {"train_loss": -10.658631324768066, "global_step": 269963, "epoch": 1606} {"train_loss": -11.479799270629883, "global_step": 269964, "epoch": 1606} {"train_loss": -10.594049453735352, "global_step": 269965, "epoch": 1606} {"train_loss": -11.447086334228516, "global_step": 269966, "epoch": 1606} {"train_loss": -11.043222427368164, "global_step": 269967, "epoch": 1606} {"train_loss": -11.062016487121582, "global_step": 269968, "epoch": 1606} {"train_loss": -11.454072952270508, "global_step": 269969, "epoch": 1606} {"train_loss": -11.032808303833008, "global_step": 269970, "epoch": 1606} {"train_loss": -11.296698570251465, "global_step": 269971, "epoch": 1606} {"train_loss": -11.464395523071289, "global_step": 269972, "epoch": 1606} {"train_loss": -11.333560943603516, "global_step": 269973, "epoch": 1606} {"train_loss": -11.685580253601074, "global_step": 269974, "epoch": 1606} {"train_loss": -10.500478134268807, "global_step": 269975, "epoch": 1606, "val_loss": 273187.3125} {"train_loss": -11.316896438598633, "global_step": 269976, "epoch": 1607} {"train_loss": -11.72240924835205, "global_step": 269977, "epoch": 1607} {"train_loss": -10.85761547088623, "global_step": 269978, "epoch": 1607} {"train_loss": -11.548483848571777, "global_step": 269979, "epoch": 1607} {"train_loss": -11.561302185058594, "global_step": 269980, "epoch": 1607} {"train_loss": -11.32028579711914, "global_step": 269981, "epoch": 1607} {"train_loss": -11.591665267944336, "global_step": 269982, "epoch": 1607} {"train_loss": -11.447731018066406, "global_step": 269983, "epoch": 1607} {"train_loss": -11.353536605834961, "global_step": 269984, "epoch": 1607} {"train_loss": -11.642284393310547, "global_step": 269985, "epoch": 1607} {"train_loss": -11.357463836669922, "global_step": 269986, "epoch": 1607} {"train_loss": -11.553657531738281, "global_step": 269987, "epoch": 1607} {"train_loss": -11.738022804260254, "global_step": 269988, "epoch": 1607} {"train_loss": -11.253368377685547, "global_step": 269989, "epoch": 1607} {"train_loss": -11.733514785766602, "global_step": 269990, "epoch": 1607} {"train_loss": -11.559188842773438, "global_step": 269991, "epoch": 1607} {"train_loss": -11.612295150756836, "global_step": 269992, "epoch": 1607} {"train_loss": -11.779659271240234, "global_step": 269993, "epoch": 1607} {"train_loss": -11.445842742919922, "global_step": 269994, "epoch": 1607} {"train_loss": -11.817682266235352, "global_step": 269995, "epoch": 1607} {"train_loss": -11.71400260925293, "global_step": 269996, "epoch": 1607} {"train_loss": -11.726905822753906, "global_step": 269997, "epoch": 1607} {"train_loss": -11.781476974487305, "global_step": 269998, "epoch": 1607} {"train_loss": -11.566280364990234, "global_step": 269999, "epoch": 1607} {"train_loss": -11.55051326751709, "global_step": 270000, "epoch": 1607} {"train_loss": -11.853063583374023, "global_step": 270001, "epoch": 1607} {"train_loss": -11.701459884643555, "global_step": 270002, "epoch": 1607} {"train_loss": -11.895872116088867, "global_step": 270003, "epoch": 1607} {"train_loss": -11.824216842651367, "global_step": 270004, "epoch": 1607} {"train_loss": -11.843473434448242, "global_step": 270005, "epoch": 1607} {"train_loss": -11.868722915649414, "global_step": 270006, "epoch": 1607} {"train_loss": -11.646726608276367, "global_step": 270007, "epoch": 1607} {"train_loss": -12.014596939086914, "global_step": 270008, "epoch": 1607} {"train_loss": -11.702766418457031, "global_step": 270009, "epoch": 1607} {"train_loss": -11.970212936401367, "global_step": 270010, "epoch": 1607} {"train_loss": -11.850773811340332, "global_step": 270011, "epoch": 1607} {"train_loss": -12.016504287719727, "global_step": 270012, "epoch": 1607} {"train_loss": -11.907540321350098, "global_step": 270013, "epoch": 1607} {"train_loss": -11.977943420410156, "global_step": 270014, "epoch": 1607} {"train_loss": -11.92282485961914, "global_step": 270015, "epoch": 1607} {"train_loss": -12.030416488647461, "global_step": 270016, "epoch": 1607} {"train_loss": -12.055320739746094, "global_step": 270017, "epoch": 1607} {"train_loss": -12.017633438110352, "global_step": 270018, "epoch": 1607} {"train_loss": -12.225301742553711, "global_step": 270019, "epoch": 1607} {"train_loss": -12.005878448486328, "global_step": 270020, "epoch": 1607} {"train_loss": -11.764303207397461, "global_step": 270021, "epoch": 1607} {"train_loss": -11.956413269042969, "global_step": 270022, "epoch": 1607} {"train_loss": -11.924958229064941, "global_step": 270023, "epoch": 1607} {"train_loss": -12.124977111816406, "global_step": 270024, "epoch": 1607} {"train_loss": -11.861429214477539, "global_step": 270025, "epoch": 1607} {"train_loss": -12.012150764465332, "global_step": 270026, "epoch": 1607} {"train_loss": -11.909004211425781, "global_step": 270027, "epoch": 1607} {"train_loss": -11.896793365478516, "global_step": 270028, "epoch": 1607} {"train_loss": -11.860958099365234, "global_step": 270029, "epoch": 1607} {"train_loss": -11.715901374816895, "global_step": 270030, "epoch": 1607} {"train_loss": -11.974535942077637, "global_step": 270031, "epoch": 1607} {"train_loss": -11.77969741821289, "global_step": 270032, "epoch": 1607} {"train_loss": -12.17454719543457, "global_step": 270033, "epoch": 1607} {"train_loss": -11.838293075561523, "global_step": 270034, "epoch": 1607} {"train_loss": -12.061585426330566, "global_step": 270035, "epoch": 1607} {"train_loss": -11.865615844726562, "global_step": 270036, "epoch": 1607} {"train_loss": -12.181748390197754, "global_step": 270037, "epoch": 1607} {"train_loss": -12.01014232635498, "global_step": 270038, "epoch": 1607} {"train_loss": -11.982797622680664, "global_step": 270039, "epoch": 1607} {"train_loss": -11.986553192138672, "global_step": 270040, "epoch": 1607} {"train_loss": -11.44537353515625, "global_step": 270041, "epoch": 1607} {"train_loss": -12.139047622680664, "global_step": 270042, "epoch": 1607} {"train_loss": -12.075087547302246, "global_step": 270043, "epoch": 1607} {"train_loss": -12.212740898132324, "global_step": 270044, "epoch": 1607} {"train_loss": -12.021015167236328, "global_step": 270045, "epoch": 1607} {"train_loss": -12.067815780639648, "global_step": 270046, "epoch": 1607} {"train_loss": -11.66943359375, "global_step": 270047, "epoch": 1607} {"train_loss": -11.05980110168457, "global_step": 270048, "epoch": 1607} {"train_loss": -11.2322416305542, "global_step": 270049, "epoch": 1607} {"train_loss": -11.24279499053955, "global_step": 270050, "epoch": 1607} {"train_loss": -9.380178451538086, "global_step": 270051, "epoch": 1607} {"train_loss": -9.053831100463867, "global_step": 270052, "epoch": 1607} {"train_loss": -8.848767280578613, "global_step": 270053, "epoch": 1607} {"train_loss": -11.513477325439453, "global_step": 270054, "epoch": 1607} {"train_loss": -8.509105682373047, "global_step": 270055, "epoch": 1607} {"train_loss": -8.5989990234375, "global_step": 270056, "epoch": 1607} {"train_loss": -10.076504707336426, "global_step": 270057, "epoch": 1607} {"train_loss": -10.4691801071167, "global_step": 270058, "epoch": 1607} {"train_loss": -9.103418350219727, "global_step": 270059, "epoch": 1607} {"train_loss": -10.284725189208984, "global_step": 270060, "epoch": 1607} {"train_loss": -10.295297622680664, "global_step": 270061, "epoch": 1607} {"train_loss": -9.20051383972168, "global_step": 270062, "epoch": 1607} {"train_loss": -10.03957748413086, "global_step": 270063, "epoch": 1607} {"train_loss": -9.031071662902832, "global_step": 270064, "epoch": 1607} {"train_loss": -10.20928955078125, "global_step": 270065, "epoch": 1607} {"train_loss": -10.553364753723145, "global_step": 270066, "epoch": 1607} {"train_loss": -10.474472045898438, "global_step": 270067, "epoch": 1607} {"train_loss": -10.970044136047363, "global_step": 270068, "epoch": 1607} {"train_loss": -11.151987075805664, "global_step": 270069, "epoch": 1607} {"train_loss": -10.868659019470215, "global_step": 270070, "epoch": 1607} {"train_loss": -11.294614791870117, "global_step": 270071, "epoch": 1607} {"train_loss": -10.88521957397461, "global_step": 270072, "epoch": 1607} {"train_loss": -11.351795196533203, "global_step": 270073, "epoch": 1607} {"train_loss": -11.587167739868164, "global_step": 270074, "epoch": 1607} {"train_loss": -10.92469310760498, "global_step": 270075, "epoch": 1607} {"train_loss": -11.236846923828125, "global_step": 270076, "epoch": 1607} {"train_loss": -11.266283988952637, "global_step": 270077, "epoch": 1607} {"train_loss": -11.513093948364258, "global_step": 270078, "epoch": 1607} {"train_loss": -11.288783073425293, "global_step": 270079, "epoch": 1607} {"train_loss": -11.771855354309082, "global_step": 270080, "epoch": 1607} {"train_loss": -11.185770034790039, "global_step": 270081, "epoch": 1607} {"train_loss": -11.64402961730957, "global_step": 270082, "epoch": 1607} {"train_loss": -11.465446472167969, "global_step": 270083, "epoch": 1607} {"train_loss": -11.596843719482422, "global_step": 270084, "epoch": 1607} {"train_loss": -11.489126205444336, "global_step": 270085, "epoch": 1607} {"train_loss": -11.477537155151367, "global_step": 270086, "epoch": 1607} {"train_loss": -11.544644355773926, "global_step": 270087, "epoch": 1607} {"train_loss": -11.639265060424805, "global_step": 270088, "epoch": 1607} {"train_loss": -11.764276504516602, "global_step": 270089, "epoch": 1607} {"train_loss": -11.571452140808105, "global_step": 270090, "epoch": 1607} {"train_loss": -11.642385482788086, "global_step": 270091, "epoch": 1607} {"train_loss": -11.774232864379883, "global_step": 270092, "epoch": 1607} {"train_loss": -11.677213668823242, "global_step": 270093, "epoch": 1607} {"train_loss": -11.863693237304688, "global_step": 270094, "epoch": 1607} {"train_loss": -11.584615707397461, "global_step": 270095, "epoch": 1607} {"train_loss": -11.567686080932617, "global_step": 270096, "epoch": 1607} {"train_loss": -11.698925971984863, "global_step": 270097, "epoch": 1607} {"train_loss": -11.623441696166992, "global_step": 270098, "epoch": 1607} {"train_loss": -11.822181701660156, "global_step": 270099, "epoch": 1607} {"train_loss": -11.653348922729492, "global_step": 270100, "epoch": 1607} {"train_loss": -11.841398239135742, "global_step": 270101, "epoch": 1607} {"train_loss": -11.887060165405273, "global_step": 270102, "epoch": 1607} {"train_loss": -11.804165840148926, "global_step": 270103, "epoch": 1607} {"train_loss": -11.995240211486816, "global_step": 270104, "epoch": 1607} {"train_loss": -11.84862995147705, "global_step": 270105, "epoch": 1607} {"train_loss": -12.028261184692383, "global_step": 270106, "epoch": 1607} {"train_loss": -11.607223510742188, "global_step": 270107, "epoch": 1607} {"train_loss": -11.986865997314453, "global_step": 270108, "epoch": 1607} {"train_loss": -11.786324501037598, "global_step": 270109, "epoch": 1607} {"train_loss": -11.86653995513916, "global_step": 270110, "epoch": 1607} {"train_loss": -12.043619155883789, "global_step": 270111, "epoch": 1607} {"train_loss": -11.812841415405273, "global_step": 270112, "epoch": 1607} {"train_loss": -11.968109130859375, "global_step": 270113, "epoch": 1607} {"train_loss": -11.744256973266602, "global_step": 270114, "epoch": 1607} {"train_loss": -11.778061866760254, "global_step": 270115, "epoch": 1607} {"train_loss": -12.013113021850586, "global_step": 270116, "epoch": 1607} {"train_loss": -11.750277519226074, "global_step": 270117, "epoch": 1607} {"train_loss": -11.986194610595703, "global_step": 270118, "epoch": 1607} {"train_loss": -11.989633560180664, "global_step": 270119, "epoch": 1607} {"train_loss": -11.829487800598145, "global_step": 270120, "epoch": 1607} {"train_loss": -12.084920883178711, "global_step": 270121, "epoch": 1607} {"train_loss": -11.807701110839844, "global_step": 270122, "epoch": 1607} {"train_loss": -12.177618026733398, "global_step": 270123, "epoch": 1607} {"train_loss": -11.937042236328125, "global_step": 270124, "epoch": 1607} {"train_loss": -12.017196655273438, "global_step": 270125, "epoch": 1607} {"train_loss": -12.232339859008789, "global_step": 270126, "epoch": 1607} {"train_loss": -12.132984161376953, "global_step": 270127, "epoch": 1607} {"train_loss": -12.187848091125488, "global_step": 270128, "epoch": 1607} {"train_loss": -12.013604164123535, "global_step": 270129, "epoch": 1607} {"train_loss": -12.131092071533203, "global_step": 270130, "epoch": 1607} {"train_loss": -12.136886596679688, "global_step": 270131, "epoch": 1607} {"train_loss": -12.060171127319336, "global_step": 270132, "epoch": 1607} {"train_loss": -12.314473152160645, "global_step": 270133, "epoch": 1607} {"train_loss": -12.17405891418457, "global_step": 270134, "epoch": 1607} {"train_loss": -12.226480484008789, "global_step": 270135, "epoch": 1607} {"train_loss": -12.19238567352295, "global_step": 270136, "epoch": 1607} {"train_loss": -12.173788070678711, "global_step": 270137, "epoch": 1607} {"train_loss": -12.292920112609863, "global_step": 270138, "epoch": 1607} {"train_loss": -12.128203392028809, "global_step": 270139, "epoch": 1607} {"train_loss": -12.194058418273926, "global_step": 270140, "epoch": 1607} {"train_loss": -12.149160385131836, "global_step": 270141, "epoch": 1607} {"train_loss": -12.166746139526367, "global_step": 270142, "epoch": 1607} {"train_loss": -11.56896680309659, "global_step": 270143, "epoch": 1607, "val_loss": 269397.1875} {"train_loss": -12.034313201904297, "global_step": 270144, "epoch": 1608} {"train_loss": -12.22273063659668, "global_step": 270145, "epoch": 1608} {"train_loss": -12.19106674194336, "global_step": 270146, "epoch": 1608} {"train_loss": -11.962303161621094, "global_step": 270147, "epoch": 1608} {"train_loss": -12.08049201965332, "global_step": 270148, "epoch": 1608} {"train_loss": -12.228569030761719, "global_step": 270149, "epoch": 1608} {"train_loss": -12.02621841430664, "global_step": 270150, "epoch": 1608} {"train_loss": -12.248311996459961, "global_step": 270151, "epoch": 1608} {"train_loss": -12.099282264709473, "global_step": 270152, "epoch": 1608} {"train_loss": -11.980759620666504, "global_step": 270153, "epoch": 1608} {"train_loss": -11.748455047607422, "global_step": 270154, "epoch": 1608} {"train_loss": -12.142303466796875, "global_step": 270155, "epoch": 1608} {"train_loss": -11.761482238769531, "global_step": 270156, "epoch": 1608} {"train_loss": -11.540573120117188, "global_step": 270157, "epoch": 1608} {"train_loss": -11.520310401916504, "global_step": 270158, "epoch": 1608} {"train_loss": -12.160276412963867, "global_step": 270159, "epoch": 1608} {"train_loss": -12.044061660766602, "global_step": 270160, "epoch": 1608} {"train_loss": -11.716524124145508, "global_step": 270161, "epoch": 1608} {"train_loss": -11.827285766601562, "global_step": 270162, "epoch": 1608} {"train_loss": -11.93021011352539, "global_step": 270163, "epoch": 1608} {"train_loss": -12.153578758239746, "global_step": 270164, "epoch": 1608} {"train_loss": -11.716238021850586, "global_step": 270165, "epoch": 1608} {"train_loss": -11.225520133972168, "global_step": 270166, "epoch": 1608} {"train_loss": -12.040322303771973, "global_step": 270167, "epoch": 1608} {"train_loss": -11.979446411132812, "global_step": 270168, "epoch": 1608} {"train_loss": -12.029341697692871, "global_step": 270169, "epoch": 1608} {"train_loss": -12.063380241394043, "global_step": 270170, "epoch": 1608} {"train_loss": -11.953356742858887, "global_step": 270171, "epoch": 1608} {"train_loss": -11.8546142578125, "global_step": 270172, "epoch": 1608} {"train_loss": -11.976072311401367, "global_step": 270173, "epoch": 1608} {"train_loss": -12.017671585083008, "global_step": 270174, "epoch": 1608} {"train_loss": -10.673053741455078, "global_step": 270175, "epoch": 1608} {"train_loss": -11.495351791381836, "global_step": 270176, "epoch": 1608} {"train_loss": -12.075848579406738, "global_step": 270177, "epoch": 1608} {"train_loss": -11.048870086669922, "global_step": 270178, "epoch": 1608} {"train_loss": -11.529945373535156, "global_step": 270179, "epoch": 1608} {"train_loss": -11.776397705078125, "global_step": 270180, "epoch": 1608} {"train_loss": -11.245502471923828, "global_step": 270181, "epoch": 1608} {"train_loss": -11.687522888183594, "global_step": 270182, "epoch": 1608} {"train_loss": -11.320502281188965, "global_step": 270183, "epoch": 1608} {"train_loss": -11.275894165039062, "global_step": 270184, "epoch": 1608} {"train_loss": -11.828603744506836, "global_step": 270185, "epoch": 1608} {"train_loss": -11.218400955200195, "global_step": 270186, "epoch": 1608} {"train_loss": -11.920619010925293, "global_step": 270187, "epoch": 1608} {"train_loss": -11.071653366088867, "global_step": 270188, "epoch": 1608} {"train_loss": -11.4315767288208, "global_step": 270189, "epoch": 1608} {"train_loss": -10.88249397277832, "global_step": 270190, "epoch": 1608} {"train_loss": -11.80687141418457, "global_step": 270191, "epoch": 1608} {"train_loss": -11.155536651611328, "global_step": 270192, "epoch": 1608} {"train_loss": -11.855232238769531, "global_step": 270193, "epoch": 1608} {"train_loss": -11.064766883850098, "global_step": 270194, "epoch": 1608} {"train_loss": -11.478857040405273, "global_step": 270195, "epoch": 1608} {"train_loss": -10.994901657104492, "global_step": 270196, "epoch": 1608} {"train_loss": -11.205634117126465, "global_step": 270197, "epoch": 1608} {"train_loss": -10.610614776611328, "global_step": 270198, "epoch": 1608} {"train_loss": -10.84719467163086, "global_step": 270199, "epoch": 1608} {"train_loss": -11.198518753051758, "global_step": 270200, "epoch": 1608} {"train_loss": -11.271617889404297, "global_step": 270201, "epoch": 1608} {"train_loss": -11.371017456054688, "global_step": 270202, "epoch": 1608} {"train_loss": -11.421768188476562, "global_step": 270203, "epoch": 1608} {"train_loss": -11.298418045043945, "global_step": 270204, "epoch": 1608} {"train_loss": -11.900217056274414, "global_step": 270205, "epoch": 1608} {"train_loss": -11.156883239746094, "global_step": 270206, "epoch": 1608} {"train_loss": -11.179871559143066, "global_step": 270207, "epoch": 1608} {"train_loss": -11.239846229553223, "global_step": 270208, "epoch": 1608} {"train_loss": -11.839937210083008, "global_step": 270209, "epoch": 1608} {"train_loss": -11.27230453491211, "global_step": 270210, "epoch": 1608} {"train_loss": -11.728191375732422, "global_step": 270211, "epoch": 1608} {"train_loss": -11.44621467590332, "global_step": 270212, "epoch": 1608} {"train_loss": -11.507902145385742, "global_step": 270213, "epoch": 1608} {"train_loss": -11.68267822265625, "global_step": 270214, "epoch": 1608} {"train_loss": -10.840110778808594, "global_step": 270215, "epoch": 1608} {"train_loss": -11.615496635437012, "global_step": 270216, "epoch": 1608} {"train_loss": -10.620244026184082, "global_step": 270217, "epoch": 1608} {"train_loss": -11.689590454101562, "global_step": 270218, "epoch": 1608} {"train_loss": -10.947938919067383, "global_step": 270219, "epoch": 1608} {"train_loss": -10.743477821350098, "global_step": 270220, "epoch": 1608} {"train_loss": -11.535694122314453, "global_step": 270221, "epoch": 1608} {"train_loss": -11.051374435424805, "global_step": 270222, "epoch": 1608} {"train_loss": -11.568408012390137, "global_step": 270223, "epoch": 1608} {"train_loss": -11.086991310119629, "global_step": 270224, "epoch": 1608} {"train_loss": -11.445853233337402, "global_step": 270225, "epoch": 1608} {"train_loss": -11.593162536621094, "global_step": 270226, "epoch": 1608} {"train_loss": -11.49820327758789, "global_step": 270227, "epoch": 1608} {"train_loss": -11.496734619140625, "global_step": 270228, "epoch": 1608} {"train_loss": -11.515202522277832, "global_step": 270229, "epoch": 1608} {"train_loss": -11.512031555175781, "global_step": 270230, "epoch": 1608} {"train_loss": -11.437559127807617, "global_step": 270231, "epoch": 1608} {"train_loss": -11.685391426086426, "global_step": 270232, "epoch": 1608} {"train_loss": -11.24782657623291, "global_step": 270233, "epoch": 1608} {"train_loss": -11.726522445678711, "global_step": 270234, "epoch": 1608} {"train_loss": -11.110248565673828, "global_step": 270235, "epoch": 1608} {"train_loss": -11.616785049438477, "global_step": 270236, "epoch": 1608} {"train_loss": -11.552749633789062, "global_step": 270237, "epoch": 1608} {"train_loss": -11.611490249633789, "global_step": 270238, "epoch": 1608} {"train_loss": -11.879585266113281, "global_step": 270239, "epoch": 1608} {"train_loss": -11.7112455368042, "global_step": 270240, "epoch": 1608} {"train_loss": -11.718972206115723, "global_step": 270241, "epoch": 1608} {"train_loss": -11.930429458618164, "global_step": 270242, "epoch": 1608} {"train_loss": -11.85396957397461, "global_step": 270243, "epoch": 1608} {"train_loss": -11.888072967529297, "global_step": 270244, "epoch": 1608} {"train_loss": -11.969049453735352, "global_step": 270245, "epoch": 1608} {"train_loss": -11.852582931518555, "global_step": 270246, "epoch": 1608} {"train_loss": -11.900001525878906, "global_step": 270247, "epoch": 1608} {"train_loss": -11.90463638305664, "global_step": 270248, "epoch": 1608} {"train_loss": -11.805034637451172, "global_step": 270249, "epoch": 1608} {"train_loss": -11.976749420166016, "global_step": 270250, "epoch": 1608} {"train_loss": -11.781335830688477, "global_step": 270251, "epoch": 1608} {"train_loss": -11.943879127502441, "global_step": 270252, "epoch": 1608} {"train_loss": -12.118152618408203, "global_step": 270253, "epoch": 1608} {"train_loss": -11.734182357788086, "global_step": 270254, "epoch": 1608} {"train_loss": -12.067464828491211, "global_step": 270255, "epoch": 1608} {"train_loss": -11.827363967895508, "global_step": 270256, "epoch": 1608} {"train_loss": -11.797184944152832, "global_step": 270257, "epoch": 1608} {"train_loss": -11.876855850219727, "global_step": 270258, "epoch": 1608} {"train_loss": -12.136804580688477, "global_step": 270259, "epoch": 1608} {"train_loss": -11.829097747802734, "global_step": 270260, "epoch": 1608} {"train_loss": -11.75760555267334, "global_step": 270261, "epoch": 1608} {"train_loss": -12.14785385131836, "global_step": 270262, "epoch": 1608} {"train_loss": -12.012370109558105, "global_step": 270263, "epoch": 1608} {"train_loss": -11.8578462600708, "global_step": 270264, "epoch": 1608} {"train_loss": -11.84896469116211, "global_step": 270265, "epoch": 1608} {"train_loss": -11.63763427734375, "global_step": 270266, "epoch": 1608} {"train_loss": -11.89721965789795, "global_step": 270267, "epoch": 1608} {"train_loss": -11.843409538269043, "global_step": 270268, "epoch": 1608} {"train_loss": -12.127470016479492, "global_step": 270269, "epoch": 1608} {"train_loss": -11.822784423828125, "global_step": 270270, "epoch": 1608} {"train_loss": -11.779558181762695, "global_step": 270271, "epoch": 1608} {"train_loss": -11.923307418823242, "global_step": 270272, "epoch": 1608} {"train_loss": -11.626249313354492, "global_step": 270273, "epoch": 1608} {"train_loss": -11.503864288330078, "global_step": 270274, "epoch": 1608} {"train_loss": -11.312173843383789, "global_step": 270275, "epoch": 1608} {"train_loss": -11.463146209716797, "global_step": 270276, "epoch": 1608} {"train_loss": -11.291356086730957, "global_step": 270277, "epoch": 1608} {"train_loss": -10.77772331237793, "global_step": 270278, "epoch": 1608} {"train_loss": -11.259214401245117, "global_step": 270279, "epoch": 1608} {"train_loss": -11.683735847473145, "global_step": 270280, "epoch": 1608} {"train_loss": -10.776627540588379, "global_step": 270281, "epoch": 1608} {"train_loss": -11.429689407348633, "global_step": 270282, "epoch": 1608} {"train_loss": -10.889388084411621, "global_step": 270283, "epoch": 1608} {"train_loss": -11.62606143951416, "global_step": 270284, "epoch": 1608} {"train_loss": -11.226049423217773, "global_step": 270285, "epoch": 1608} {"train_loss": -11.411785125732422, "global_step": 270286, "epoch": 1608} {"train_loss": -11.84031867980957, "global_step": 270287, "epoch": 1608} {"train_loss": -11.184825897216797, "global_step": 270288, "epoch": 1608} {"train_loss": -11.143470764160156, "global_step": 270289, "epoch": 1608} {"train_loss": -11.117849349975586, "global_step": 270290, "epoch": 1608} {"train_loss": -11.051433563232422, "global_step": 270291, "epoch": 1608} {"train_loss": -10.622513771057129, "global_step": 270292, "epoch": 1608} {"train_loss": -12.012605667114258, "global_step": 270293, "epoch": 1608} {"train_loss": -10.577737808227539, "global_step": 270294, "epoch": 1608} {"train_loss": -11.958230972290039, "global_step": 270295, "epoch": 1608} {"train_loss": -11.40556526184082, "global_step": 270296, "epoch": 1608} {"train_loss": -11.838821411132812, "global_step": 270297, "epoch": 1608} {"train_loss": -11.681882858276367, "global_step": 270298, "epoch": 1608} {"train_loss": -11.355217933654785, "global_step": 270299, "epoch": 1608} {"train_loss": -11.792279243469238, "global_step": 270300, "epoch": 1608} {"train_loss": -11.6278657913208, "global_step": 270301, "epoch": 1608} {"train_loss": -12.118985176086426, "global_step": 270302, "epoch": 1608} {"train_loss": -11.424439430236816, "global_step": 270303, "epoch": 1608} {"train_loss": -11.672077178955078, "global_step": 270304, "epoch": 1608} {"train_loss": -11.776863098144531, "global_step": 270305, "epoch": 1608} {"train_loss": -11.631766319274902, "global_step": 270306, "epoch": 1608} {"train_loss": -12.103487014770508, "global_step": 270307, "epoch": 1608} {"train_loss": -11.838237762451172, "global_step": 270308, "epoch": 1608} {"train_loss": -11.813972473144531, "global_step": 270309, "epoch": 1608} {"train_loss": -12.05607795715332, "global_step": 270310, "epoch": 1608} {"train_loss": -11.60864812419528, "global_step": 270311, "epoch": 1608, "val_loss": 274350.46875} {"train_loss": -11.53628158569336, "global_step": 270312, "epoch": 1609} {"train_loss": -11.772790908813477, "global_step": 270313, "epoch": 1609} {"train_loss": -11.334802627563477, "global_step": 270314, "epoch": 1609} {"train_loss": -11.91087532043457, "global_step": 270315, "epoch": 1609} {"train_loss": -11.505605697631836, "global_step": 270316, "epoch": 1609} {"train_loss": -11.439556121826172, "global_step": 270317, "epoch": 1609} {"train_loss": -11.82485294342041, "global_step": 270318, "epoch": 1609} {"train_loss": -11.171432495117188, "global_step": 270319, "epoch": 1609} {"train_loss": -11.572441101074219, "global_step": 270320, "epoch": 1609} {"train_loss": -10.72254467010498, "global_step": 270321, "epoch": 1609} {"train_loss": -9.752859115600586, "global_step": 270322, "epoch": 1609} {"train_loss": -12.048402786254883, "global_step": 270323, "epoch": 1609} {"train_loss": -9.877685546875, "global_step": 270324, "epoch": 1609} {"train_loss": -11.495035171508789, "global_step": 270325, "epoch": 1609} {"train_loss": -10.097600936889648, "global_step": 270326, "epoch": 1609} {"train_loss": -10.539229393005371, "global_step": 270327, "epoch": 1609} {"train_loss": -10.097578048706055, "global_step": 270328, "epoch": 1609} {"train_loss": -11.810784339904785, "global_step": 270329, "epoch": 1609} {"train_loss": -10.241369247436523, "global_step": 270330, "epoch": 1609} {"train_loss": -11.108102798461914, "global_step": 270331, "epoch": 1609} {"train_loss": -11.582786560058594, "global_step": 270332, "epoch": 1609} {"train_loss": -11.16978931427002, "global_step": 270333, "epoch": 1609} {"train_loss": -11.206354141235352, "global_step": 270334, "epoch": 1609} {"train_loss": -11.879585266113281, "global_step": 270335, "epoch": 1609} {"train_loss": -11.138285636901855, "global_step": 270336, "epoch": 1609} {"train_loss": -12.01966667175293, "global_step": 270337, "epoch": 1609} {"train_loss": -11.4365234375, "global_step": 270338, "epoch": 1609} {"train_loss": -11.813268661499023, "global_step": 270339, "epoch": 1609} {"train_loss": -11.579093933105469, "global_step": 270340, "epoch": 1609} {"train_loss": -11.640888214111328, "global_step": 270341, "epoch": 1609} {"train_loss": -11.870697975158691, "global_step": 270342, "epoch": 1609} {"train_loss": -11.619813919067383, "global_step": 270343, "epoch": 1609} {"train_loss": -11.918684959411621, "global_step": 270344, "epoch": 1609} {"train_loss": -11.805407524108887, "global_step": 270345, "epoch": 1609} {"train_loss": -11.745826721191406, "global_step": 270346, "epoch": 1609} {"train_loss": -12.108309745788574, "global_step": 270347, "epoch": 1609} {"train_loss": -11.65410041809082, "global_step": 270348, "epoch": 1609} {"train_loss": -11.744983673095703, "global_step": 270349, "epoch": 1609} {"train_loss": -11.852317810058594, "global_step": 270350, "epoch": 1609} {"train_loss": -11.577849388122559, "global_step": 270351, "epoch": 1609} {"train_loss": -12.047828674316406, "global_step": 270352, "epoch": 1609} {"train_loss": -11.717703819274902, "global_step": 270353, "epoch": 1609} {"train_loss": -12.115890502929688, "global_step": 270354, "epoch": 1609} {"train_loss": -11.956658363342285, "global_step": 270355, "epoch": 1609} {"train_loss": -11.91211986541748, "global_step": 270356, "epoch": 1609} {"train_loss": -11.795450210571289, "global_step": 270357, "epoch": 1609} {"train_loss": -11.873895645141602, "global_step": 270358, "epoch": 1609} {"train_loss": -11.634584426879883, "global_step": 270359, "epoch": 1609} {"train_loss": -11.769556999206543, "global_step": 270360, "epoch": 1609} {"train_loss": -11.636129379272461, "global_step": 270361, "epoch": 1609} {"train_loss": -11.965206146240234, "global_step": 270362, "epoch": 1609} {"train_loss": -12.023681640625, "global_step": 270363, "epoch": 1609} {"train_loss": -11.975667953491211, "global_step": 270364, "epoch": 1609} {"train_loss": -12.015301704406738, "global_step": 270365, "epoch": 1609} {"train_loss": -11.870330810546875, "global_step": 270366, "epoch": 1609} {"train_loss": -12.016773223876953, "global_step": 270367, "epoch": 1609} {"train_loss": -11.933755874633789, "global_step": 270368, "epoch": 1609} {"train_loss": -11.694981575012207, "global_step": 270369, "epoch": 1609} {"train_loss": -11.863039016723633, "global_step": 270370, "epoch": 1609} {"train_loss": -11.869282722473145, "global_step": 270371, "epoch": 1609} {"train_loss": -11.587782859802246, "global_step": 270372, "epoch": 1609} {"train_loss": -11.980031967163086, "global_step": 270373, "epoch": 1609} {"train_loss": -11.57528305053711, "global_step": 270374, "epoch": 1609} {"train_loss": -12.097954750061035, "global_step": 270375, "epoch": 1609} {"train_loss": -11.596830368041992, "global_step": 270376, "epoch": 1609} {"train_loss": -11.93224811553955, "global_step": 270377, "epoch": 1609} {"train_loss": -11.781951904296875, "global_step": 270378, "epoch": 1609} {"train_loss": -11.866731643676758, "global_step": 270379, "epoch": 1609} {"train_loss": -12.314447402954102, "global_step": 270380, "epoch": 1609} {"train_loss": -11.77351188659668, "global_step": 270381, "epoch": 1609} {"train_loss": -12.050097465515137, "global_step": 270382, "epoch": 1609} {"train_loss": -11.794588088989258, "global_step": 270383, "epoch": 1609} {"train_loss": -11.464534759521484, "global_step": 270384, "epoch": 1609} {"train_loss": -11.806844711303711, "global_step": 270385, "epoch": 1609} {"train_loss": -11.543257713317871, "global_step": 270386, "epoch": 1609} {"train_loss": -12.121482849121094, "global_step": 270387, "epoch": 1609} {"train_loss": -11.225847244262695, "global_step": 270388, "epoch": 1609} {"train_loss": -11.921615600585938, "global_step": 270389, "epoch": 1609} {"train_loss": -12.062630653381348, "global_step": 270390, "epoch": 1609} {"train_loss": -11.37109661102295, "global_step": 270391, "epoch": 1609} {"train_loss": -11.977598190307617, "global_step": 270392, "epoch": 1609} {"train_loss": -11.718156814575195, "global_step": 270393, "epoch": 1609} {"train_loss": -11.980378150939941, "global_step": 270394, "epoch": 1609} {"train_loss": -11.544363021850586, "global_step": 270395, "epoch": 1609} {"train_loss": -11.944084167480469, "global_step": 270396, "epoch": 1609} {"train_loss": -12.079187393188477, "global_step": 270397, "epoch": 1609} {"train_loss": -12.012933731079102, "global_step": 270398, "epoch": 1609} {"train_loss": -12.022485733032227, "global_step": 270399, "epoch": 1609} {"train_loss": -12.195663452148438, "global_step": 270400, "epoch": 1609} {"train_loss": -11.964393615722656, "global_step": 270401, "epoch": 1609} {"train_loss": -12.196046829223633, "global_step": 270402, "epoch": 1609} {"train_loss": -12.021395683288574, "global_step": 270403, "epoch": 1609} {"train_loss": -11.957622528076172, "global_step": 270404, "epoch": 1609} {"train_loss": -11.634004592895508, "global_step": 270405, "epoch": 1609} {"train_loss": -11.706254005432129, "global_step": 270406, "epoch": 1609} {"train_loss": -11.374792098999023, "global_step": 270407, "epoch": 1609} {"train_loss": -11.856643676757812, "global_step": 270408, "epoch": 1609} {"train_loss": -12.076850891113281, "global_step": 270409, "epoch": 1609} {"train_loss": -11.92271900177002, "global_step": 270410, "epoch": 1609} {"train_loss": -11.951417922973633, "global_step": 270411, "epoch": 1609} {"train_loss": -11.804582595825195, "global_step": 270412, "epoch": 1609} {"train_loss": -10.931997299194336, "global_step": 270413, "epoch": 1609} {"train_loss": -11.289421081542969, "global_step": 270414, "epoch": 1609} {"train_loss": -11.903608322143555, "global_step": 270415, "epoch": 1609} {"train_loss": -11.29281997680664, "global_step": 270416, "epoch": 1609} {"train_loss": -10.853415489196777, "global_step": 270417, "epoch": 1609} {"train_loss": -11.491106986999512, "global_step": 270418, "epoch": 1609} {"train_loss": -12.012811660766602, "global_step": 270419, "epoch": 1609} {"train_loss": -11.21380615234375, "global_step": 270420, "epoch": 1609} {"train_loss": -11.93886947631836, "global_step": 270421, "epoch": 1609} {"train_loss": -11.371591567993164, "global_step": 270422, "epoch": 1609} {"train_loss": -11.89341926574707, "global_step": 270423, "epoch": 1609} {"train_loss": -11.87321662902832, "global_step": 270424, "epoch": 1609} {"train_loss": -11.454609870910645, "global_step": 270425, "epoch": 1609} {"train_loss": -10.670387268066406, "global_step": 270426, "epoch": 1609} {"train_loss": -11.971689224243164, "global_step": 270427, "epoch": 1609} {"train_loss": -11.43301773071289, "global_step": 270428, "epoch": 1609} {"train_loss": -10.859476089477539, "global_step": 270429, "epoch": 1609} {"train_loss": -11.434286117553711, "global_step": 270430, "epoch": 1609} {"train_loss": -9.413283348083496, "global_step": 270431, "epoch": 1609} {"train_loss": -10.435873031616211, "global_step": 270432, "epoch": 1609} {"train_loss": -11.739789962768555, "global_step": 270433, "epoch": 1609} {"train_loss": -10.76567554473877, "global_step": 270434, "epoch": 1609} {"train_loss": -10.029454231262207, "global_step": 270435, "epoch": 1609} {"train_loss": -11.359733581542969, "global_step": 270436, "epoch": 1609} {"train_loss": -9.804462432861328, "global_step": 270437, "epoch": 1609} {"train_loss": -10.306011199951172, "global_step": 270438, "epoch": 1609} {"train_loss": -11.13294792175293, "global_step": 270439, "epoch": 1609} {"train_loss": -10.841259956359863, "global_step": 270440, "epoch": 1609} {"train_loss": -10.423742294311523, "global_step": 270441, "epoch": 1609} {"train_loss": -11.477478981018066, "global_step": 270442, "epoch": 1609} {"train_loss": -10.912005424499512, "global_step": 270443, "epoch": 1609} {"train_loss": -10.460432052612305, "global_step": 270444, "epoch": 1609} {"train_loss": -11.741386413574219, "global_step": 270445, "epoch": 1609} {"train_loss": -10.647504806518555, "global_step": 270446, "epoch": 1609} {"train_loss": -11.725791931152344, "global_step": 270447, "epoch": 1609} {"train_loss": -10.128564834594727, "global_step": 270448, "epoch": 1609} {"train_loss": -11.691289901733398, "global_step": 270449, "epoch": 1609} {"train_loss": -10.856947898864746, "global_step": 270450, "epoch": 1609} {"train_loss": -11.29433536529541, "global_step": 270451, "epoch": 1609} {"train_loss": -11.57846450805664, "global_step": 270452, "epoch": 1609} {"train_loss": -11.469537734985352, "global_step": 270453, "epoch": 1609} {"train_loss": -11.747715950012207, "global_step": 270454, "epoch": 1609} {"train_loss": -11.730985641479492, "global_step": 270455, "epoch": 1609} {"train_loss": -11.331925392150879, "global_step": 270456, "epoch": 1609} {"train_loss": -11.485420227050781, "global_step": 270457, "epoch": 1609} {"train_loss": -11.529211044311523, "global_step": 270458, "epoch": 1609} {"train_loss": -11.6173734664917, "global_step": 270459, "epoch": 1609} {"train_loss": -11.6475830078125, "global_step": 270460, "epoch": 1609} {"train_loss": -11.697654724121094, "global_step": 270461, "epoch": 1609} {"train_loss": -11.57417106628418, "global_step": 270462, "epoch": 1609} {"train_loss": -11.698497772216797, "global_step": 270463, "epoch": 1609} {"train_loss": -11.406025886535645, "global_step": 270464, "epoch": 1609} {"train_loss": -11.699073791503906, "global_step": 270465, "epoch": 1609} {"train_loss": -11.490942001342773, "global_step": 270466, "epoch": 1609} {"train_loss": -11.077576637268066, "global_step": 270467, "epoch": 1609} {"train_loss": -11.807107925415039, "global_step": 270468, "epoch": 1609} {"train_loss": -11.158720970153809, "global_step": 270469, "epoch": 1609} {"train_loss": -11.93843936920166, "global_step": 270470, "epoch": 1609} {"train_loss": -11.337895393371582, "global_step": 270471, "epoch": 1609} {"train_loss": -11.788101196289062, "global_step": 270472, "epoch": 1609} {"train_loss": -11.541111946105957, "global_step": 270473, "epoch": 1609} {"train_loss": -11.732234001159668, "global_step": 270474, "epoch": 1609} {"train_loss": -11.71388053894043, "global_step": 270475, "epoch": 1609} {"train_loss": -11.771446228027344, "global_step": 270476, "epoch": 1609} {"train_loss": -11.736899375915527, "global_step": 270477, "epoch": 1609} {"train_loss": -11.776406288146973, "global_step": 270478, "epoch": 1609} {"train_loss": -11.527255608921958, "global_step": 270479, "epoch": 1609, "val_loss": 270588.90625} {"train_loss": -11.773494720458984, "global_step": 270480, "epoch": 1610} {"train_loss": -11.729524612426758, "global_step": 270481, "epoch": 1610} {"train_loss": -11.997159004211426, "global_step": 270482, "epoch": 1610} {"train_loss": -11.770804405212402, "global_step": 270483, "epoch": 1610} {"train_loss": -11.61939525604248, "global_step": 270484, "epoch": 1610} {"train_loss": -12.051856994628906, "global_step": 270485, "epoch": 1610} {"train_loss": -11.81871223449707, "global_step": 270486, "epoch": 1610} {"train_loss": -12.014894485473633, "global_step": 270487, "epoch": 1610} {"train_loss": -11.976310729980469, "global_step": 270488, "epoch": 1610} {"train_loss": -12.170358657836914, "global_step": 270489, "epoch": 1610} {"train_loss": -11.83942985534668, "global_step": 270490, "epoch": 1610} {"train_loss": -11.852800369262695, "global_step": 270491, "epoch": 1610} {"train_loss": -11.492279052734375, "global_step": 270492, "epoch": 1610} {"train_loss": -11.88520336151123, "global_step": 270493, "epoch": 1610} {"train_loss": -11.833674430847168, "global_step": 270494, "epoch": 1610} {"train_loss": -11.760822296142578, "global_step": 270495, "epoch": 1610} {"train_loss": -11.92530632019043, "global_step": 270496, "epoch": 1610} {"train_loss": -12.032752990722656, "global_step": 270497, "epoch": 1610} {"train_loss": -12.073750495910645, "global_step": 270498, "epoch": 1610} {"train_loss": -12.101619720458984, "global_step": 270499, "epoch": 1610} {"train_loss": -11.924030303955078, "global_step": 270500, "epoch": 1610} {"train_loss": -11.772863388061523, "global_step": 270501, "epoch": 1610} {"train_loss": -11.763029098510742, "global_step": 270502, "epoch": 1610} {"train_loss": -11.982107162475586, "global_step": 270503, "epoch": 1610} {"train_loss": -12.0322904586792, "global_step": 270504, "epoch": 1610} {"train_loss": -12.006665229797363, "global_step": 270505, "epoch": 1610} {"train_loss": -12.150671005249023, "global_step": 270506, "epoch": 1610} {"train_loss": -12.090127944946289, "global_step": 270507, "epoch": 1610} {"train_loss": -12.15805435180664, "global_step": 270508, "epoch": 1610} {"train_loss": -12.166467666625977, "global_step": 270509, "epoch": 1610} {"train_loss": -11.862722396850586, "global_step": 270510, "epoch": 1610} {"train_loss": -12.106353759765625, "global_step": 270511, "epoch": 1610} {"train_loss": -12.100992202758789, "global_step": 270512, "epoch": 1610} {"train_loss": -12.18166732788086, "global_step": 270513, "epoch": 1610} {"train_loss": -12.371882438659668, "global_step": 270514, "epoch": 1610} {"train_loss": -12.229743957519531, "global_step": 270515, "epoch": 1610} {"train_loss": -12.256219863891602, "global_step": 270516, "epoch": 1610} {"train_loss": -12.24737548828125, "global_step": 270517, "epoch": 1610} {"train_loss": -11.831335067749023, "global_step": 270518, "epoch": 1610} {"train_loss": -12.274380683898926, "global_step": 270519, "epoch": 1610} {"train_loss": -12.235734939575195, "global_step": 270520, "epoch": 1610} {"train_loss": -11.879863739013672, "global_step": 270521, "epoch": 1610} {"train_loss": -12.066193580627441, "global_step": 270522, "epoch": 1610} {"train_loss": -12.289325714111328, "global_step": 270523, "epoch": 1610} {"train_loss": -11.884454727172852, "global_step": 270524, "epoch": 1610} {"train_loss": -12.222644805908203, "global_step": 270525, "epoch": 1610} {"train_loss": -12.102995872497559, "global_step": 270526, "epoch": 1610} {"train_loss": -11.873745918273926, "global_step": 270527, "epoch": 1610} {"train_loss": -12.194172859191895, "global_step": 270528, "epoch": 1610} {"train_loss": -11.9136381149292, "global_step": 270529, "epoch": 1610} {"train_loss": -12.10872745513916, "global_step": 270530, "epoch": 1610} {"train_loss": -12.437028884887695, "global_step": 270531, "epoch": 1610} {"train_loss": -12.239590644836426, "global_step": 270532, "epoch": 1610} {"train_loss": -12.39029312133789, "global_step": 270533, "epoch": 1610} {"train_loss": -12.299707412719727, "global_step": 270534, "epoch": 1610} {"train_loss": -12.47059440612793, "global_step": 270535, "epoch": 1610} {"train_loss": -12.187918663024902, "global_step": 270536, "epoch": 1610} {"train_loss": -12.456175804138184, "global_step": 270537, "epoch": 1610} {"train_loss": -11.945588111877441, "global_step": 270538, "epoch": 1610} {"train_loss": -12.27612018585205, "global_step": 270539, "epoch": 1610} {"train_loss": -12.153934478759766, "global_step": 270540, "epoch": 1610} {"train_loss": -12.240492820739746, "global_step": 270541, "epoch": 1610} {"train_loss": -12.294363021850586, "global_step": 270542, "epoch": 1610} {"train_loss": -12.341924667358398, "global_step": 270543, "epoch": 1610} {"train_loss": -12.306406021118164, "global_step": 270544, "epoch": 1610} {"train_loss": -12.164104461669922, "global_step": 270545, "epoch": 1610} {"train_loss": -11.832159042358398, "global_step": 270546, "epoch": 1610} {"train_loss": -11.928918838500977, "global_step": 270547, "epoch": 1610} {"train_loss": -12.299921035766602, "global_step": 270548, "epoch": 1610} {"train_loss": -12.494705200195312, "global_step": 270549, "epoch": 1610} {"train_loss": -12.280977249145508, "global_step": 270550, "epoch": 1610} {"train_loss": -12.245649337768555, "global_step": 270551, "epoch": 1610} {"train_loss": -12.139999389648438, "global_step": 270552, "epoch": 1610} {"train_loss": -11.721843719482422, "global_step": 270553, "epoch": 1610} {"train_loss": -12.117481231689453, "global_step": 270554, "epoch": 1610} {"train_loss": -12.106085777282715, "global_step": 270555, "epoch": 1610} {"train_loss": -12.160894393920898, "global_step": 270556, "epoch": 1610} {"train_loss": -11.702005386352539, "global_step": 270557, "epoch": 1610} {"train_loss": -11.71388053894043, "global_step": 270558, "epoch": 1610} {"train_loss": -11.239862442016602, "global_step": 270559, "epoch": 1610} {"train_loss": -10.714035987854004, "global_step": 270560, "epoch": 1610} {"train_loss": -12.10376262664795, "global_step": 270561, "epoch": 1610} {"train_loss": -11.384613037109375, "global_step": 270562, "epoch": 1610} {"train_loss": -9.750492095947266, "global_step": 270563, "epoch": 1610} {"train_loss": -10.502023696899414, "global_step": 270564, "epoch": 1610} {"train_loss": -11.700517654418945, "global_step": 270565, "epoch": 1610} {"train_loss": -9.801148414611816, "global_step": 270566, "epoch": 1610} {"train_loss": -10.465259552001953, "global_step": 270567, "epoch": 1610} {"train_loss": -11.016414642333984, "global_step": 270568, "epoch": 1610} {"train_loss": -11.684459686279297, "global_step": 270569, "epoch": 1610} {"train_loss": -10.268627166748047, "global_step": 270570, "epoch": 1610} {"train_loss": -11.524740219116211, "global_step": 270571, "epoch": 1610} {"train_loss": -10.509848594665527, "global_step": 270572, "epoch": 1610} {"train_loss": -11.629417419433594, "global_step": 270573, "epoch": 1610} {"train_loss": -10.451126098632812, "global_step": 270574, "epoch": 1610} {"train_loss": -11.138618469238281, "global_step": 270575, "epoch": 1610} {"train_loss": -10.907270431518555, "global_step": 270576, "epoch": 1610} {"train_loss": -11.885534286499023, "global_step": 270577, "epoch": 1610} {"train_loss": -11.195225715637207, "global_step": 270578, "epoch": 1610} {"train_loss": -11.405684471130371, "global_step": 270579, "epoch": 1610} {"train_loss": -11.546784400939941, "global_step": 270580, "epoch": 1610} {"train_loss": -11.13725757598877, "global_step": 270581, "epoch": 1610} {"train_loss": -10.532028198242188, "global_step": 270582, "epoch": 1610} {"train_loss": -10.57130241394043, "global_step": 270583, "epoch": 1610} {"train_loss": -10.996255874633789, "global_step": 270584, "epoch": 1610} {"train_loss": -10.48841667175293, "global_step": 270585, "epoch": 1610} {"train_loss": -11.053804397583008, "global_step": 270586, "epoch": 1610} {"train_loss": -10.442310333251953, "global_step": 270587, "epoch": 1610} {"train_loss": -10.632596015930176, "global_step": 270588, "epoch": 1610} {"train_loss": -10.913354873657227, "global_step": 270589, "epoch": 1610} {"train_loss": -10.335432052612305, "global_step": 270590, "epoch": 1610} {"train_loss": -11.024693489074707, "global_step": 270591, "epoch": 1610} {"train_loss": -10.334449768066406, "global_step": 270592, "epoch": 1610} {"train_loss": -10.70785140991211, "global_step": 270593, "epoch": 1610} {"train_loss": -10.97586441040039, "global_step": 270594, "epoch": 1610} {"train_loss": -10.331279754638672, "global_step": 270595, "epoch": 1610} {"train_loss": -11.340726852416992, "global_step": 270596, "epoch": 1610} {"train_loss": -10.352110862731934, "global_step": 270597, "epoch": 1610} {"train_loss": -11.111783981323242, "global_step": 270598, "epoch": 1610} {"train_loss": -10.819929122924805, "global_step": 270599, "epoch": 1610} {"train_loss": -10.845806121826172, "global_step": 270600, "epoch": 1610} {"train_loss": -11.340250015258789, "global_step": 270601, "epoch": 1610} {"train_loss": -10.805578231811523, "global_step": 270602, "epoch": 1610} {"train_loss": -10.543006896972656, "global_step": 270603, "epoch": 1610} {"train_loss": -11.161530494689941, "global_step": 270604, "epoch": 1610} {"train_loss": -10.902055740356445, "global_step": 270605, "epoch": 1610} {"train_loss": -11.185218811035156, "global_step": 270606, "epoch": 1610} {"train_loss": -11.221126556396484, "global_step": 270607, "epoch": 1610} {"train_loss": -10.765562057495117, "global_step": 270608, "epoch": 1610} {"train_loss": -11.750123023986816, "global_step": 270609, "epoch": 1610} {"train_loss": -11.296001434326172, "global_step": 270610, "epoch": 1610} {"train_loss": -11.589132308959961, "global_step": 270611, "epoch": 1610} {"train_loss": -11.74871826171875, "global_step": 270612, "epoch": 1610} {"train_loss": -11.25234317779541, "global_step": 270613, "epoch": 1610} {"train_loss": -11.485265731811523, "global_step": 270614, "epoch": 1610} {"train_loss": -11.478185653686523, "global_step": 270615, "epoch": 1610} {"train_loss": -11.763572692871094, "global_step": 270616, "epoch": 1610} {"train_loss": -11.424009323120117, "global_step": 270617, "epoch": 1610} {"train_loss": -11.670491218566895, "global_step": 270618, "epoch": 1610} {"train_loss": -11.745477676391602, "global_step": 270619, "epoch": 1610} {"train_loss": -11.666240692138672, "global_step": 270620, "epoch": 1610} {"train_loss": -11.717874526977539, "global_step": 270621, "epoch": 1610} {"train_loss": -11.561212539672852, "global_step": 270622, "epoch": 1610} {"train_loss": -11.680398941040039, "global_step": 270623, "epoch": 1610} {"train_loss": -11.831661224365234, "global_step": 270624, "epoch": 1610} {"train_loss": -11.690073013305664, "global_step": 270625, "epoch": 1610} {"train_loss": -11.896282196044922, "global_step": 270626, "epoch": 1610} {"train_loss": -11.737115859985352, "global_step": 270627, "epoch": 1610} {"train_loss": -11.932452201843262, "global_step": 270628, "epoch": 1610} {"train_loss": -11.719890594482422, "global_step": 270629, "epoch": 1610} {"train_loss": -11.750543594360352, "global_step": 270630, "epoch": 1610} {"train_loss": -11.996749877929688, "global_step": 270631, "epoch": 1610} {"train_loss": -11.458803176879883, "global_step": 270632, "epoch": 1610} {"train_loss": -11.791714668273926, "global_step": 270633, "epoch": 1610} {"train_loss": -11.504958152770996, "global_step": 270634, "epoch": 1610} {"train_loss": -11.948125839233398, "global_step": 270635, "epoch": 1610} {"train_loss": -11.586259841918945, "global_step": 270636, "epoch": 1610} {"train_loss": -11.660075187683105, "global_step": 270637, "epoch": 1610} {"train_loss": -11.58152961730957, "global_step": 270638, "epoch": 1610} {"train_loss": -11.685078620910645, "global_step": 270639, "epoch": 1610} {"train_loss": -11.775089263916016, "global_step": 270640, "epoch": 1610} {"train_loss": -11.308686256408691, "global_step": 270641, "epoch": 1610} {"train_loss": -11.6259126663208, "global_step": 270642, "epoch": 1610} {"train_loss": -11.593839645385742, "global_step": 270643, "epoch": 1610} {"train_loss": -11.53023910522461, "global_step": 270644, "epoch": 1610} {"train_loss": -12.022595405578613, "global_step": 270645, "epoch": 1610} {"train_loss": -11.683725357055664, "global_step": 270646, "epoch": 1610} {"train_loss": -11.629710725375585, "global_step": 270647, "epoch": 1610, "val_loss": 273423.15625, "train_action_mse_error": 1.6806890964508057} {"train_loss": -11.652612686157227, "global_step": 270648, "epoch": 1611} {"train_loss": -11.954731941223145, "global_step": 270649, "epoch": 1611} {"train_loss": -11.906970977783203, "global_step": 270650, "epoch": 1611} {"train_loss": -11.579633712768555, "global_step": 270651, "epoch": 1611} {"train_loss": -11.940441131591797, "global_step": 270652, "epoch": 1611} {"train_loss": -11.921832084655762, "global_step": 270653, "epoch": 1611} {"train_loss": -11.789651870727539, "global_step": 270654, "epoch": 1611} {"train_loss": -11.734390258789062, "global_step": 270655, "epoch": 1611} {"train_loss": -11.63742446899414, "global_step": 270656, "epoch": 1611} {"train_loss": -11.757686614990234, "global_step": 270657, "epoch": 1611} {"train_loss": -11.792123794555664, "global_step": 270658, "epoch": 1611} {"train_loss": -11.732583999633789, "global_step": 270659, "epoch": 1611} {"train_loss": -11.777976989746094, "global_step": 270660, "epoch": 1611} {"train_loss": -11.753305435180664, "global_step": 270661, "epoch": 1611} {"train_loss": -11.884310722351074, "global_step": 270662, "epoch": 1611} {"train_loss": -11.643961906433105, "global_step": 270663, "epoch": 1611} {"train_loss": -12.274590492248535, "global_step": 270664, "epoch": 1611} {"train_loss": -11.497491836547852, "global_step": 270665, "epoch": 1611} {"train_loss": -12.11706256866455, "global_step": 270666, "epoch": 1611} {"train_loss": -11.849907875061035, "global_step": 270667, "epoch": 1611} {"train_loss": -11.964483261108398, "global_step": 270668, "epoch": 1611} {"train_loss": -12.029586791992188, "global_step": 270669, "epoch": 1611} {"train_loss": -11.824586868286133, "global_step": 270670, "epoch": 1611} {"train_loss": -11.845955848693848, "global_step": 270671, "epoch": 1611} {"train_loss": -11.737135887145996, "global_step": 270672, "epoch": 1611} {"train_loss": -11.789429664611816, "global_step": 270673, "epoch": 1611} {"train_loss": -11.18543529510498, "global_step": 270674, "epoch": 1611} {"train_loss": -10.531852722167969, "global_step": 270675, "epoch": 1611} {"train_loss": -11.977602005004883, "global_step": 270676, "epoch": 1611} {"train_loss": -10.50094985961914, "global_step": 270677, "epoch": 1611} {"train_loss": -11.210436820983887, "global_step": 270678, "epoch": 1611} {"train_loss": -11.583288192749023, "global_step": 270679, "epoch": 1611} {"train_loss": -10.487743377685547, "global_step": 270680, "epoch": 1611} {"train_loss": -11.996832847595215, "global_step": 270681, "epoch": 1611} {"train_loss": -10.554119110107422, "global_step": 270682, "epoch": 1611} {"train_loss": -12.075307846069336, "global_step": 270683, "epoch": 1611} {"train_loss": -10.901467323303223, "global_step": 270684, "epoch": 1611} {"train_loss": -11.468610763549805, "global_step": 270685, "epoch": 1611} {"train_loss": -11.695333480834961, "global_step": 270686, "epoch": 1611} {"train_loss": -10.675350189208984, "global_step": 270687, "epoch": 1611} {"train_loss": -11.988981246948242, "global_step": 270688, "epoch": 1611} {"train_loss": -10.78940200805664, "global_step": 270689, "epoch": 1611} {"train_loss": -11.765844345092773, "global_step": 270690, "epoch": 1611} {"train_loss": -11.414621353149414, "global_step": 270691, "epoch": 1611} {"train_loss": -11.188631057739258, "global_step": 270692, "epoch": 1611} {"train_loss": -11.80225944519043, "global_step": 270693, "epoch": 1611} {"train_loss": -10.935270309448242, "global_step": 270694, "epoch": 1611} {"train_loss": -12.033151626586914, "global_step": 270695, "epoch": 1611} {"train_loss": -11.349958419799805, "global_step": 270696, "epoch": 1611} {"train_loss": -12.014341354370117, "global_step": 270697, "epoch": 1611} {"train_loss": -11.241521835327148, "global_step": 270698, "epoch": 1611} {"train_loss": -11.887697219848633, "global_step": 270699, "epoch": 1611} {"train_loss": -11.524105072021484, "global_step": 270700, "epoch": 1611} {"train_loss": -11.352039337158203, "global_step": 270701, "epoch": 1611} {"train_loss": -11.118996620178223, "global_step": 270702, "epoch": 1611} {"train_loss": -10.892976760864258, "global_step": 270703, "epoch": 1611} {"train_loss": -12.076855659484863, "global_step": 270704, "epoch": 1611} {"train_loss": -11.295711517333984, "global_step": 270705, "epoch": 1611} {"train_loss": -11.326650619506836, "global_step": 270706, "epoch": 1611} {"train_loss": -11.061820030212402, "global_step": 270707, "epoch": 1611} {"train_loss": -11.361695289611816, "global_step": 270708, "epoch": 1611} {"train_loss": -11.426796913146973, "global_step": 270709, "epoch": 1611} {"train_loss": -11.006540298461914, "global_step": 270710, "epoch": 1611} {"train_loss": -10.987288475036621, "global_step": 270711, "epoch": 1611} {"train_loss": -11.4202880859375, "global_step": 270712, "epoch": 1611} {"train_loss": -11.609525680541992, "global_step": 270713, "epoch": 1611} {"train_loss": -11.283212661743164, "global_step": 270714, "epoch": 1611} {"train_loss": -11.169266700744629, "global_step": 270715, "epoch": 1611} {"train_loss": -11.718093872070312, "global_step": 270716, "epoch": 1611} {"train_loss": -11.222765922546387, "global_step": 270717, "epoch": 1611} {"train_loss": -11.865096092224121, "global_step": 270718, "epoch": 1611} {"train_loss": -11.560376167297363, "global_step": 270719, "epoch": 1611} {"train_loss": -11.540433883666992, "global_step": 270720, "epoch": 1611} {"train_loss": -11.745168685913086, "global_step": 270721, "epoch": 1611} {"train_loss": -11.471205711364746, "global_step": 270722, "epoch": 1611} {"train_loss": -11.733772277832031, "global_step": 270723, "epoch": 1611} {"train_loss": -11.733640670776367, "global_step": 270724, "epoch": 1611} {"train_loss": -11.779025077819824, "global_step": 270725, "epoch": 1611} {"train_loss": -11.978080749511719, "global_step": 270726, "epoch": 1611} {"train_loss": -11.66683292388916, "global_step": 270727, "epoch": 1611} {"train_loss": -11.862654685974121, "global_step": 270728, "epoch": 1611} {"train_loss": -11.518108367919922, "global_step": 270729, "epoch": 1611} {"train_loss": -11.857451438903809, "global_step": 270730, "epoch": 1611} {"train_loss": -11.748878479003906, "global_step": 270731, "epoch": 1611} {"train_loss": -11.671777725219727, "global_step": 270732, "epoch": 1611} {"train_loss": -12.173362731933594, "global_step": 270733, "epoch": 1611} {"train_loss": -11.841560363769531, "global_step": 270734, "epoch": 1611} {"train_loss": -12.0883207321167, "global_step": 270735, "epoch": 1611} {"train_loss": -11.873685836791992, "global_step": 270736, "epoch": 1611} {"train_loss": -11.905991554260254, "global_step": 270737, "epoch": 1611} {"train_loss": -12.013986587524414, "global_step": 270738, "epoch": 1611} {"train_loss": -12.110616683959961, "global_step": 270739, "epoch": 1611} {"train_loss": -12.114700317382812, "global_step": 270740, "epoch": 1611} {"train_loss": -12.111734390258789, "global_step": 270741, "epoch": 1611} {"train_loss": -11.927835464477539, "global_step": 270742, "epoch": 1611} {"train_loss": -12.2025146484375, "global_step": 270743, "epoch": 1611} {"train_loss": -11.954781532287598, "global_step": 270744, "epoch": 1611} {"train_loss": -12.019562721252441, "global_step": 270745, "epoch": 1611} {"train_loss": -11.865547180175781, "global_step": 270746, "epoch": 1611} {"train_loss": -11.936017036437988, "global_step": 270747, "epoch": 1611} {"train_loss": -11.926191329956055, "global_step": 270748, "epoch": 1611} {"train_loss": -11.916177749633789, "global_step": 270749, "epoch": 1611} {"train_loss": -12.19658374786377, "global_step": 270750, "epoch": 1611} {"train_loss": -11.890987396240234, "global_step": 270751, "epoch": 1611} {"train_loss": -12.278380393981934, "global_step": 270752, "epoch": 1611} {"train_loss": -11.796823501586914, "global_step": 270753, "epoch": 1611} {"train_loss": -11.909674644470215, "global_step": 270754, "epoch": 1611} {"train_loss": -12.274506568908691, "global_step": 270755, "epoch": 1611} {"train_loss": -11.975783348083496, "global_step": 270756, "epoch": 1611} {"train_loss": -12.139497756958008, "global_step": 270757, "epoch": 1611} {"train_loss": -12.095663070678711, "global_step": 270758, "epoch": 1611} {"train_loss": -12.020626068115234, "global_step": 270759, "epoch": 1611} {"train_loss": -11.926390647888184, "global_step": 270760, "epoch": 1611} {"train_loss": -12.369455337524414, "global_step": 270761, "epoch": 1611} {"train_loss": -11.84947395324707, "global_step": 270762, "epoch": 1611} {"train_loss": -12.137067794799805, "global_step": 270763, "epoch": 1611} {"train_loss": -12.010566711425781, "global_step": 270764, "epoch": 1611} {"train_loss": -12.24378776550293, "global_step": 270765, "epoch": 1611} {"train_loss": -11.933303833007812, "global_step": 270766, "epoch": 1611} {"train_loss": -11.784738540649414, "global_step": 270767, "epoch": 1611} {"train_loss": -12.19186782836914, "global_step": 270768, "epoch": 1611} {"train_loss": -12.022729873657227, "global_step": 270769, "epoch": 1611} {"train_loss": -11.838031768798828, "global_step": 270770, "epoch": 1611} {"train_loss": -12.260977745056152, "global_step": 270771, "epoch": 1611} {"train_loss": -12.13268756866455, "global_step": 270772, "epoch": 1611} {"train_loss": -11.745495796203613, "global_step": 270773, "epoch": 1611} {"train_loss": -12.026298522949219, "global_step": 270774, "epoch": 1611} {"train_loss": -12.295589447021484, "global_step": 270775, "epoch": 1611} {"train_loss": -11.588109970092773, "global_step": 270776, "epoch": 1611} {"train_loss": -11.833229064941406, "global_step": 270777, "epoch": 1611} {"train_loss": -11.919163703918457, "global_step": 270778, "epoch": 1611} {"train_loss": -12.299050331115723, "global_step": 270779, "epoch": 1611} {"train_loss": -11.636754989624023, "global_step": 270780, "epoch": 1611} {"train_loss": -11.822494506835938, "global_step": 270781, "epoch": 1611} {"train_loss": -12.116111755371094, "global_step": 270782, "epoch": 1611} {"train_loss": -12.096590995788574, "global_step": 270783, "epoch": 1611} {"train_loss": -11.793680191040039, "global_step": 270784, "epoch": 1611} {"train_loss": -11.762554168701172, "global_step": 270785, "epoch": 1611} {"train_loss": -11.830816268920898, "global_step": 270786, "epoch": 1611} {"train_loss": -11.49059772491455, "global_step": 270787, "epoch": 1611} {"train_loss": -11.558090209960938, "global_step": 270788, "epoch": 1611} {"train_loss": -11.969503402709961, "global_step": 270789, "epoch": 1611} {"train_loss": -11.67542839050293, "global_step": 270790, "epoch": 1611} {"train_loss": -11.959906578063965, "global_step": 270791, "epoch": 1611} {"train_loss": -11.674372673034668, "global_step": 270792, "epoch": 1611} {"train_loss": -11.988471984863281, "global_step": 270793, "epoch": 1611} {"train_loss": -11.665048599243164, "global_step": 270794, "epoch": 1611} {"train_loss": -11.516294479370117, "global_step": 270795, "epoch": 1611} {"train_loss": -11.368412017822266, "global_step": 270796, "epoch": 1611} {"train_loss": -11.905145645141602, "global_step": 270797, "epoch": 1611} {"train_loss": -11.656034469604492, "global_step": 270798, "epoch": 1611} {"train_loss": -12.057798385620117, "global_step": 270799, "epoch": 1611} {"train_loss": -12.008270263671875, "global_step": 270800, "epoch": 1611} {"train_loss": -12.27846908569336, "global_step": 270801, "epoch": 1611} {"train_loss": -11.930428504943848, "global_step": 270802, "epoch": 1611} {"train_loss": -11.874473571777344, "global_step": 270803, "epoch": 1611} {"train_loss": -11.43406867980957, "global_step": 270804, "epoch": 1611} {"train_loss": -11.565507888793945, "global_step": 270805, "epoch": 1611} {"train_loss": -11.693593978881836, "global_step": 270806, "epoch": 1611} {"train_loss": -10.817501068115234, "global_step": 270807, "epoch": 1611} {"train_loss": -10.481159210205078, "global_step": 270808, "epoch": 1611} {"train_loss": -11.159049987792969, "global_step": 270809, "epoch": 1611} {"train_loss": -9.793487548828125, "global_step": 270810, "epoch": 1611} {"train_loss": -11.356099128723145, "global_step": 270811, "epoch": 1611} {"train_loss": -11.109430313110352, "global_step": 270812, "epoch": 1611} {"train_loss": -11.156942367553711, "global_step": 270813, "epoch": 1611} {"train_loss": -11.607687950134277, "global_step": 270814, "epoch": 1611} {"train_loss": -11.687465525808788, "global_step": 270815, "epoch": 1611, "val_loss": 276475.34375} {"train_loss": -11.095559120178223, "global_step": 270816, "epoch": 1612} {"train_loss": -11.232908248901367, "global_step": 270817, "epoch": 1612} {"train_loss": -10.12260627746582, "global_step": 270818, "epoch": 1612} {"train_loss": -11.805667877197266, "global_step": 270819, "epoch": 1612} {"train_loss": -10.30567455291748, "global_step": 270820, "epoch": 1612} {"train_loss": -11.481626510620117, "global_step": 270821, "epoch": 1612} {"train_loss": -10.57667350769043, "global_step": 270822, "epoch": 1612} {"train_loss": -10.170382499694824, "global_step": 270823, "epoch": 1612} {"train_loss": -11.06739616394043, "global_step": 270824, "epoch": 1612} {"train_loss": -9.312332153320312, "global_step": 270825, "epoch": 1612} {"train_loss": -10.782243728637695, "global_step": 270826, "epoch": 1612} {"train_loss": -10.899446487426758, "global_step": 270827, "epoch": 1612} {"train_loss": -10.610313415527344, "global_step": 270828, "epoch": 1612} {"train_loss": -11.261985778808594, "global_step": 270829, "epoch": 1612} {"train_loss": -10.023504257202148, "global_step": 270830, "epoch": 1612} {"train_loss": -11.36212158203125, "global_step": 270831, "epoch": 1612} {"train_loss": -11.311483383178711, "global_step": 270832, "epoch": 1612} {"train_loss": -10.785175323486328, "global_step": 270833, "epoch": 1612} {"train_loss": -11.628057479858398, "global_step": 270834, "epoch": 1612} {"train_loss": -10.37369155883789, "global_step": 270835, "epoch": 1612} {"train_loss": -11.066510200500488, "global_step": 270836, "epoch": 1612} {"train_loss": -11.367568016052246, "global_step": 270837, "epoch": 1612} {"train_loss": -11.185187339782715, "global_step": 270838, "epoch": 1612} {"train_loss": -11.157500267028809, "global_step": 270839, "epoch": 1612} {"train_loss": -11.302045822143555, "global_step": 270840, "epoch": 1612} {"train_loss": -10.81086540222168, "global_step": 270841, "epoch": 1612} {"train_loss": -10.696104049682617, "global_step": 270842, "epoch": 1612} {"train_loss": -11.551414489746094, "global_step": 270843, "epoch": 1612} {"train_loss": -10.989435195922852, "global_step": 270844, "epoch": 1612} {"train_loss": -10.940773010253906, "global_step": 270845, "epoch": 1612} {"train_loss": -11.67464542388916, "global_step": 270846, "epoch": 1612} {"train_loss": -10.955816268920898, "global_step": 270847, "epoch": 1612} {"train_loss": -11.723570823669434, "global_step": 270848, "epoch": 1612} {"train_loss": -11.660778045654297, "global_step": 270849, "epoch": 1612} {"train_loss": -10.911541938781738, "global_step": 270850, "epoch": 1612} {"train_loss": -11.640669822692871, "global_step": 270851, "epoch": 1612} {"train_loss": -11.325146675109863, "global_step": 270852, "epoch": 1612} {"train_loss": -11.124396324157715, "global_step": 270853, "epoch": 1612} {"train_loss": -11.607942581176758, "global_step": 270854, "epoch": 1612} {"train_loss": -11.56639575958252, "global_step": 270855, "epoch": 1612} {"train_loss": -11.492432594299316, "global_step": 270856, "epoch": 1612} {"train_loss": -11.766935348510742, "global_step": 270857, "epoch": 1612} {"train_loss": -11.52430248260498, "global_step": 270858, "epoch": 1612} {"train_loss": -11.5214262008667, "global_step": 270859, "epoch": 1612} {"train_loss": -11.608686447143555, "global_step": 270860, "epoch": 1612} {"train_loss": -11.944293022155762, "global_step": 270861, "epoch": 1612} {"train_loss": -11.288249969482422, "global_step": 270862, "epoch": 1612} {"train_loss": -11.944971084594727, "global_step": 270863, "epoch": 1612} {"train_loss": -11.607378959655762, "global_step": 270864, "epoch": 1612} {"train_loss": -11.801250457763672, "global_step": 270865, "epoch": 1612} {"train_loss": -11.793914794921875, "global_step": 270866, "epoch": 1612} {"train_loss": -11.375199317932129, "global_step": 270867, "epoch": 1612} {"train_loss": -11.730896949768066, "global_step": 270868, "epoch": 1612} {"train_loss": -11.753339767456055, "global_step": 270869, "epoch": 1612} {"train_loss": -11.544373512268066, "global_step": 270870, "epoch": 1612} {"train_loss": -11.510665893554688, "global_step": 270871, "epoch": 1612} {"train_loss": -11.701234817504883, "global_step": 270872, "epoch": 1612} {"train_loss": -11.594427108764648, "global_step": 270873, "epoch": 1612} {"train_loss": -12.049287796020508, "global_step": 270874, "epoch": 1612} {"train_loss": -11.559328079223633, "global_step": 270875, "epoch": 1612} {"train_loss": -11.638202667236328, "global_step": 270876, "epoch": 1612} {"train_loss": -11.749866485595703, "global_step": 270877, "epoch": 1612} {"train_loss": -11.559147834777832, "global_step": 270878, "epoch": 1612} {"train_loss": -11.754579544067383, "global_step": 270879, "epoch": 1612} {"train_loss": -11.922935485839844, "global_step": 270880, "epoch": 1612} {"train_loss": -11.997864723205566, "global_step": 270881, "epoch": 1612} {"train_loss": -11.894086837768555, "global_step": 270882, "epoch": 1612} {"train_loss": -11.867559432983398, "global_step": 270883, "epoch": 1612} {"train_loss": -12.091520309448242, "global_step": 270884, "epoch": 1612} {"train_loss": -11.709691047668457, "global_step": 270885, "epoch": 1612} {"train_loss": -12.0926513671875, "global_step": 270886, "epoch": 1612} {"train_loss": -11.877899169921875, "global_step": 270887, "epoch": 1612} {"train_loss": -11.817514419555664, "global_step": 270888, "epoch": 1612} {"train_loss": -11.692764282226562, "global_step": 270889, "epoch": 1612} {"train_loss": -11.391624450683594, "global_step": 270890, "epoch": 1612} {"train_loss": -11.992691993713379, "global_step": 270891, "epoch": 1612} {"train_loss": -11.849004745483398, "global_step": 270892, "epoch": 1612} {"train_loss": -12.071906089782715, "global_step": 270893, "epoch": 1612} {"train_loss": -11.873181343078613, "global_step": 270894, "epoch": 1612} {"train_loss": -12.084711074829102, "global_step": 270895, "epoch": 1612} {"train_loss": -11.82052993774414, "global_step": 270896, "epoch": 1612} {"train_loss": -12.028535842895508, "global_step": 270897, "epoch": 1612} {"train_loss": -12.018559455871582, "global_step": 270898, "epoch": 1612} {"train_loss": -11.981841087341309, "global_step": 270899, "epoch": 1612} {"train_loss": -12.093750953674316, "global_step": 270900, "epoch": 1612} {"train_loss": -12.05480670928955, "global_step": 270901, "epoch": 1612} {"train_loss": -11.940496444702148, "global_step": 270902, "epoch": 1612} {"train_loss": -12.023275375366211, "global_step": 270903, "epoch": 1612} {"train_loss": -11.83514404296875, "global_step": 270904, "epoch": 1612} {"train_loss": -12.178974151611328, "global_step": 270905, "epoch": 1612} {"train_loss": -12.107198715209961, "global_step": 270906, "epoch": 1612} {"train_loss": -11.721013069152832, "global_step": 270907, "epoch": 1612} {"train_loss": -10.986440658569336, "global_step": 270908, "epoch": 1612} {"train_loss": -11.968759536743164, "global_step": 270909, "epoch": 1612} {"train_loss": -11.428043365478516, "global_step": 270910, "epoch": 1612} {"train_loss": -10.153627395629883, "global_step": 270911, "epoch": 1612} {"train_loss": -11.342308044433594, "global_step": 270912, "epoch": 1612} {"train_loss": -11.075231552124023, "global_step": 270913, "epoch": 1612} {"train_loss": -8.838448524475098, "global_step": 270914, "epoch": 1612} {"train_loss": -9.502090454101562, "global_step": 270915, "epoch": 1612} {"train_loss": -10.48144817352295, "global_step": 270916, "epoch": 1612} {"train_loss": -7.064422607421875, "global_step": 270917, "epoch": 1612} {"train_loss": -7.271973609924316, "global_step": 270918, "epoch": 1612} {"train_loss": -9.930649757385254, "global_step": 270919, "epoch": 1612} {"train_loss": -8.57229232788086, "global_step": 270920, "epoch": 1612} {"train_loss": -8.465311050415039, "global_step": 270921, "epoch": 1612} {"train_loss": -7.709542274475098, "global_step": 270922, "epoch": 1612} {"train_loss": -10.280128479003906, "global_step": 270923, "epoch": 1612} {"train_loss": -8.644327163696289, "global_step": 270924, "epoch": 1612} {"train_loss": -9.754846572875977, "global_step": 270925, "epoch": 1612} {"train_loss": -9.14029312133789, "global_step": 270926, "epoch": 1612} {"train_loss": -10.725754737854004, "global_step": 270927, "epoch": 1612} {"train_loss": -9.84486198425293, "global_step": 270928, "epoch": 1612} {"train_loss": -9.54351806640625, "global_step": 270929, "epoch": 1612} {"train_loss": -10.303543090820312, "global_step": 270930, "epoch": 1612} {"train_loss": -9.889005661010742, "global_step": 270931, "epoch": 1612} {"train_loss": -9.68417739868164, "global_step": 270932, "epoch": 1612} {"train_loss": -11.094398498535156, "global_step": 270933, "epoch": 1612} {"train_loss": -11.113016128540039, "global_step": 270934, "epoch": 1612} {"train_loss": -10.054055213928223, "global_step": 270935, "epoch": 1612} {"train_loss": -11.267679214477539, "global_step": 270936, "epoch": 1612} {"train_loss": -10.827533721923828, "global_step": 270937, "epoch": 1612} {"train_loss": -10.09367847442627, "global_step": 270938, "epoch": 1612} {"train_loss": -11.286453247070312, "global_step": 270939, "epoch": 1612} {"train_loss": -11.169124603271484, "global_step": 270940, "epoch": 1612} {"train_loss": -10.938023567199707, "global_step": 270941, "epoch": 1612} {"train_loss": -11.633172035217285, "global_step": 270942, "epoch": 1612} {"train_loss": -11.174877166748047, "global_step": 270943, "epoch": 1612} {"train_loss": -11.242609024047852, "global_step": 270944, "epoch": 1612} {"train_loss": -11.455184936523438, "global_step": 270945, "epoch": 1612} {"train_loss": -11.476301193237305, "global_step": 270946, "epoch": 1612} {"train_loss": -10.724893569946289, "global_step": 270947, "epoch": 1612} {"train_loss": -11.470617294311523, "global_step": 270948, "epoch": 1612} {"train_loss": -11.65243911743164, "global_step": 270949, "epoch": 1612} {"train_loss": -11.06442642211914, "global_step": 270950, "epoch": 1612} {"train_loss": -11.609245300292969, "global_step": 270951, "epoch": 1612} {"train_loss": -11.153714179992676, "global_step": 270952, "epoch": 1612} {"train_loss": -11.538480758666992, "global_step": 270953, "epoch": 1612} {"train_loss": -11.567052841186523, "global_step": 270954, "epoch": 1612} {"train_loss": -11.713530540466309, "global_step": 270955, "epoch": 1612} {"train_loss": -11.291948318481445, "global_step": 270956, "epoch": 1612} {"train_loss": -11.83489990234375, "global_step": 270957, "epoch": 1612} {"train_loss": -11.54261589050293, "global_step": 270958, "epoch": 1612} {"train_loss": -11.470494270324707, "global_step": 270959, "epoch": 1612} {"train_loss": -11.73286247253418, "global_step": 270960, "epoch": 1612} {"train_loss": -11.92824935913086, "global_step": 270961, "epoch": 1612} {"train_loss": -11.580092430114746, "global_step": 270962, "epoch": 1612} {"train_loss": -11.780011177062988, "global_step": 270963, "epoch": 1612} {"train_loss": -11.634997367858887, "global_step": 270964, "epoch": 1612} {"train_loss": -11.77560806274414, "global_step": 270965, "epoch": 1612} {"train_loss": -11.82664966583252, "global_step": 270966, "epoch": 1612} {"train_loss": -11.638917922973633, "global_step": 270967, "epoch": 1612} {"train_loss": -11.804583549499512, "global_step": 270968, "epoch": 1612} {"train_loss": -11.826340675354004, "global_step": 270969, "epoch": 1612} {"train_loss": -11.81280517578125, "global_step": 270970, "epoch": 1612} {"train_loss": -11.829870223999023, "global_step": 270971, "epoch": 1612} {"train_loss": -11.913424491882324, "global_step": 270972, "epoch": 1612} {"train_loss": -11.856365203857422, "global_step": 270973, "epoch": 1612} {"train_loss": -11.906028747558594, "global_step": 270974, "epoch": 1612} {"train_loss": -12.004350662231445, "global_step": 270975, "epoch": 1612} {"train_loss": -11.938872337341309, "global_step": 270976, "epoch": 1612} {"train_loss": -12.076536178588867, "global_step": 270977, "epoch": 1612} {"train_loss": -11.919029235839844, "global_step": 270978, "epoch": 1612} {"train_loss": -11.960878372192383, "global_step": 270979, "epoch": 1612} {"train_loss": -11.995840072631836, "global_step": 270980, "epoch": 1612} {"train_loss": -12.030963897705078, "global_step": 270981, "epoch": 1612} {"train_loss": -12.293279647827148, "global_step": 270982, "epoch": 1612} {"train_loss": -11.225641994249253, "global_step": 270983, "epoch": 1612, "val_loss": 274547.78125} {"train_loss": -12.0658540725708, "global_step": 270984, "epoch": 1613} {"train_loss": -12.026508331298828, "global_step": 270985, "epoch": 1613} {"train_loss": -12.147042274475098, "global_step": 270986, "epoch": 1613} {"train_loss": -11.911955833435059, "global_step": 270987, "epoch": 1613} {"train_loss": -12.040456771850586, "global_step": 270988, "epoch": 1613} {"train_loss": -12.175052642822266, "global_step": 270989, "epoch": 1613} {"train_loss": -12.090705871582031, "global_step": 270990, "epoch": 1613} {"train_loss": -12.188913345336914, "global_step": 270991, "epoch": 1613} {"train_loss": -12.136857986450195, "global_step": 270992, "epoch": 1613} {"train_loss": -11.98066520690918, "global_step": 270993, "epoch": 1613} {"train_loss": -12.092653274536133, "global_step": 270994, "epoch": 1613} {"train_loss": -12.165035247802734, "global_step": 270995, "epoch": 1613} {"train_loss": -12.308292388916016, "global_step": 270996, "epoch": 1613} {"train_loss": -12.322881698608398, "global_step": 270997, "epoch": 1613} {"train_loss": -12.323102951049805, "global_step": 270998, "epoch": 1613} {"train_loss": -12.089176177978516, "global_step": 270999, "epoch": 1613} {"train_loss": -12.261619567871094, "global_step": 271000, "epoch": 1613} {"train_loss": -12.173837661743164, "global_step": 271001, "epoch": 1613} {"train_loss": -12.249267578125, "global_step": 271002, "epoch": 1613} {"train_loss": -12.056370735168457, "global_step": 271003, "epoch": 1613} {"train_loss": -12.308204650878906, "global_step": 271004, "epoch": 1613} {"train_loss": -12.392860412597656, "global_step": 271005, "epoch": 1613} {"train_loss": -12.389177322387695, "global_step": 271006, "epoch": 1613} {"train_loss": -12.08785629272461, "global_step": 271007, "epoch": 1613} {"train_loss": -12.322017669677734, "global_step": 271008, "epoch": 1613} {"train_loss": -12.260011672973633, "global_step": 271009, "epoch": 1613} {"train_loss": -11.97001838684082, "global_step": 271010, "epoch": 1613} {"train_loss": -12.277710914611816, "global_step": 271011, "epoch": 1613} {"train_loss": -12.310850143432617, "global_step": 271012, "epoch": 1613} {"train_loss": -12.252425193786621, "global_step": 271013, "epoch": 1613} {"train_loss": -11.952102661132812, "global_step": 271014, "epoch": 1613} {"train_loss": -12.2905912399292, "global_step": 271015, "epoch": 1613} {"train_loss": -11.953920364379883, "global_step": 271016, "epoch": 1613} {"train_loss": -12.458264350891113, "global_step": 271017, "epoch": 1613} {"train_loss": -11.93008041381836, "global_step": 271018, "epoch": 1613} {"train_loss": -12.155967712402344, "global_step": 271019, "epoch": 1613} {"train_loss": -12.380400657653809, "global_step": 271020, "epoch": 1613} {"train_loss": -12.141542434692383, "global_step": 271021, "epoch": 1613} {"train_loss": -12.184028625488281, "global_step": 271022, "epoch": 1613} {"train_loss": -11.646499633789062, "global_step": 271023, "epoch": 1613} {"train_loss": -11.0458402633667, "global_step": 271024, "epoch": 1613} {"train_loss": -11.135092735290527, "global_step": 271025, "epoch": 1613} {"train_loss": -10.945232391357422, "global_step": 271026, "epoch": 1613} {"train_loss": -11.75752067565918, "global_step": 271027, "epoch": 1613} {"train_loss": -12.008291244506836, "global_step": 271028, "epoch": 1613} {"train_loss": -11.11398696899414, "global_step": 271029, "epoch": 1613} {"train_loss": -10.036396026611328, "global_step": 271030, "epoch": 1613} {"train_loss": -11.558280944824219, "global_step": 271031, "epoch": 1613} {"train_loss": -10.484540939331055, "global_step": 271032, "epoch": 1613} {"train_loss": -11.095968246459961, "global_step": 271033, "epoch": 1613} {"train_loss": -11.776256561279297, "global_step": 271034, "epoch": 1613} {"train_loss": -10.15715217590332, "global_step": 271035, "epoch": 1613} {"train_loss": -11.366436004638672, "global_step": 271036, "epoch": 1613} {"train_loss": -11.119207382202148, "global_step": 271037, "epoch": 1613} {"train_loss": -11.847230911254883, "global_step": 271038, "epoch": 1613} {"train_loss": -11.161785125732422, "global_step": 271039, "epoch": 1613} {"train_loss": -11.385560035705566, "global_step": 271040, "epoch": 1613} {"train_loss": -11.346412658691406, "global_step": 271041, "epoch": 1613} {"train_loss": -10.937286376953125, "global_step": 271042, "epoch": 1613} {"train_loss": -11.633105278015137, "global_step": 271043, "epoch": 1613} {"train_loss": -11.514890670776367, "global_step": 271044, "epoch": 1613} {"train_loss": -11.261510848999023, "global_step": 271045, "epoch": 1613} {"train_loss": -11.495099067687988, "global_step": 271046, "epoch": 1613} {"train_loss": -10.871594429016113, "global_step": 271047, "epoch": 1613} {"train_loss": -11.328325271606445, "global_step": 271048, "epoch": 1613} {"train_loss": -11.331860542297363, "global_step": 271049, "epoch": 1613} {"train_loss": -11.066732406616211, "global_step": 271050, "epoch": 1613} {"train_loss": -11.41386604309082, "global_step": 271051, "epoch": 1613} {"train_loss": -11.148698806762695, "global_step": 271052, "epoch": 1613} {"train_loss": -11.515426635742188, "global_step": 271053, "epoch": 1613} {"train_loss": -11.706459045410156, "global_step": 271054, "epoch": 1613} {"train_loss": -11.599193572998047, "global_step": 271055, "epoch": 1613} {"train_loss": -11.82730484008789, "global_step": 271056, "epoch": 1613} {"train_loss": -11.622020721435547, "global_step": 271057, "epoch": 1613} {"train_loss": -11.84733772277832, "global_step": 271058, "epoch": 1613} {"train_loss": -11.696200370788574, "global_step": 271059, "epoch": 1613} {"train_loss": -11.999832153320312, "global_step": 271060, "epoch": 1613} {"train_loss": -12.005963325500488, "global_step": 271061, "epoch": 1613} {"train_loss": -11.485187530517578, "global_step": 271062, "epoch": 1613} {"train_loss": -12.10912799835205, "global_step": 271063, "epoch": 1613} {"train_loss": -11.933879852294922, "global_step": 271064, "epoch": 1613} {"train_loss": -11.993946075439453, "global_step": 271065, "epoch": 1613} {"train_loss": -11.980517387390137, "global_step": 271066, "epoch": 1613} {"train_loss": -11.875486373901367, "global_step": 271067, "epoch": 1613} {"train_loss": -11.786998748779297, "global_step": 271068, "epoch": 1613} {"train_loss": -11.906633377075195, "global_step": 271069, "epoch": 1613} {"train_loss": -11.90494155883789, "global_step": 271070, "epoch": 1613} {"train_loss": -11.905714988708496, "global_step": 271071, "epoch": 1613} {"train_loss": -11.725714683532715, "global_step": 271072, "epoch": 1613} {"train_loss": -12.040876388549805, "global_step": 271073, "epoch": 1613} {"train_loss": -11.89992904663086, "global_step": 271074, "epoch": 1613} {"train_loss": -11.913398742675781, "global_step": 271075, "epoch": 1613} {"train_loss": -11.544499397277832, "global_step": 271076, "epoch": 1613} {"train_loss": -11.981461524963379, "global_step": 271077, "epoch": 1613} {"train_loss": -11.740056991577148, "global_step": 271078, "epoch": 1613} {"train_loss": -11.873865127563477, "global_step": 271079, "epoch": 1613} {"train_loss": -11.561552047729492, "global_step": 271080, "epoch": 1613} {"train_loss": -11.495248794555664, "global_step": 271081, "epoch": 1613} {"train_loss": -11.724843978881836, "global_step": 271082, "epoch": 1613} {"train_loss": -11.45269775390625, "global_step": 271083, "epoch": 1613} {"train_loss": -11.75723648071289, "global_step": 271084, "epoch": 1613} {"train_loss": -11.684378623962402, "global_step": 271085, "epoch": 1613} {"train_loss": -11.837308883666992, "global_step": 271086, "epoch": 1613} {"train_loss": -11.832733154296875, "global_step": 271087, "epoch": 1613} {"train_loss": -11.295458793640137, "global_step": 271088, "epoch": 1613} {"train_loss": -11.48784065246582, "global_step": 271089, "epoch": 1613} {"train_loss": -11.289395332336426, "global_step": 271090, "epoch": 1613} {"train_loss": -10.579850196838379, "global_step": 271091, "epoch": 1613} {"train_loss": -10.80029010772705, "global_step": 271092, "epoch": 1613} {"train_loss": -10.762163162231445, "global_step": 271093, "epoch": 1613} {"train_loss": -10.389816284179688, "global_step": 271094, "epoch": 1613} {"train_loss": -11.093718528747559, "global_step": 271095, "epoch": 1613} {"train_loss": -10.799768447875977, "global_step": 271096, "epoch": 1613} {"train_loss": -11.812822341918945, "global_step": 271097, "epoch": 1613} {"train_loss": -10.978964805603027, "global_step": 271098, "epoch": 1613} {"train_loss": -10.742700576782227, "global_step": 271099, "epoch": 1613} {"train_loss": -11.856002807617188, "global_step": 271100, "epoch": 1613} {"train_loss": -10.54687213897705, "global_step": 271101, "epoch": 1613} {"train_loss": -10.561208724975586, "global_step": 271102, "epoch": 1613} {"train_loss": -11.775866508483887, "global_step": 271103, "epoch": 1613} {"train_loss": -10.378300666809082, "global_step": 271104, "epoch": 1613} {"train_loss": -12.037888526916504, "global_step": 271105, "epoch": 1613} {"train_loss": -10.349248886108398, "global_step": 271106, "epoch": 1613} {"train_loss": -11.563794136047363, "global_step": 271107, "epoch": 1613} {"train_loss": -11.431291580200195, "global_step": 271108, "epoch": 1613} {"train_loss": -10.824739456176758, "global_step": 271109, "epoch": 1613} {"train_loss": -11.064338684082031, "global_step": 271110, "epoch": 1613} {"train_loss": -11.611541748046875, "global_step": 271111, "epoch": 1613} {"train_loss": -11.142974853515625, "global_step": 271112, "epoch": 1613} {"train_loss": -11.681962966918945, "global_step": 271113, "epoch": 1613} {"train_loss": -10.789422988891602, "global_step": 271114, "epoch": 1613} {"train_loss": -11.13522720336914, "global_step": 271115, "epoch": 1613} {"train_loss": -11.376565933227539, "global_step": 271116, "epoch": 1613} {"train_loss": -11.333136558532715, "global_step": 271117, "epoch": 1613} {"train_loss": -11.850896835327148, "global_step": 271118, "epoch": 1613} {"train_loss": -11.364919662475586, "global_step": 271119, "epoch": 1613} {"train_loss": -11.480283737182617, "global_step": 271120, "epoch": 1613} {"train_loss": -11.642925262451172, "global_step": 271121, "epoch": 1613} {"train_loss": -11.51978588104248, "global_step": 271122, "epoch": 1613} {"train_loss": -11.2448148727417, "global_step": 271123, "epoch": 1613} {"train_loss": -11.118888854980469, "global_step": 271124, "epoch": 1613} {"train_loss": -11.420406341552734, "global_step": 271125, "epoch": 1613} {"train_loss": -11.410744667053223, "global_step": 271126, "epoch": 1613} {"train_loss": -11.481241226196289, "global_step": 271127, "epoch": 1613} {"train_loss": -11.48057746887207, "global_step": 271128, "epoch": 1613} {"train_loss": -11.929224967956543, "global_step": 271129, "epoch": 1613} {"train_loss": -11.863565444946289, "global_step": 271130, "epoch": 1613} {"train_loss": -11.768458366394043, "global_step": 271131, "epoch": 1613} {"train_loss": -12.019512176513672, "global_step": 271132, "epoch": 1613} {"train_loss": -12.109707832336426, "global_step": 271133, "epoch": 1613} {"train_loss": -11.914124488830566, "global_step": 271134, "epoch": 1613} {"train_loss": -11.917160034179688, "global_step": 271135, "epoch": 1613} {"train_loss": -11.909059524536133, "global_step": 271136, "epoch": 1613} {"train_loss": -11.947538375854492, "global_step": 271137, "epoch": 1613} {"train_loss": -11.878326416015625, "global_step": 271138, "epoch": 1613} {"train_loss": -11.999192237854004, "global_step": 271139, "epoch": 1613} {"train_loss": -11.978067398071289, "global_step": 271140, "epoch": 1613} {"train_loss": -11.822225570678711, "global_step": 271141, "epoch": 1613} {"train_loss": -11.920947074890137, "global_step": 271142, "epoch": 1613} {"train_loss": -12.028280258178711, "global_step": 271143, "epoch": 1613} {"train_loss": -12.104082107543945, "global_step": 271144, "epoch": 1613} {"train_loss": -11.839085578918457, "global_step": 271145, "epoch": 1613} {"train_loss": -12.222552299499512, "global_step": 271146, "epoch": 1613} {"train_loss": -12.063709259033203, "global_step": 271147, "epoch": 1613} {"train_loss": -11.857481956481934, "global_step": 271148, "epoch": 1613} {"train_loss": -12.213353157043457, "global_step": 271149, "epoch": 1613} {"train_loss": -11.902874946594238, "global_step": 271150, "epoch": 1613} {"train_loss": -11.66366060007186, "global_step": 271151, "epoch": 1613, "val_loss": 275861.6875} {"train_loss": -11.873590469360352, "global_step": 271152, "epoch": 1614} {"train_loss": -12.057775497436523, "global_step": 271153, "epoch": 1614} {"train_loss": -12.12918758392334, "global_step": 271154, "epoch": 1614} {"train_loss": -11.914621353149414, "global_step": 271155, "epoch": 1614} {"train_loss": -12.197029113769531, "global_step": 271156, "epoch": 1614} {"train_loss": -12.323062896728516, "global_step": 271157, "epoch": 1614} {"train_loss": -11.762454986572266, "global_step": 271158, "epoch": 1614} {"train_loss": -12.044721603393555, "global_step": 271159, "epoch": 1614} {"train_loss": -12.047957420349121, "global_step": 271160, "epoch": 1614} {"train_loss": -11.699209213256836, "global_step": 271161, "epoch": 1614} {"train_loss": -12.045811653137207, "global_step": 271162, "epoch": 1614} {"train_loss": -11.981221199035645, "global_step": 271163, "epoch": 1614} {"train_loss": -11.58777904510498, "global_step": 271164, "epoch": 1614} {"train_loss": -11.736246109008789, "global_step": 271165, "epoch": 1614} {"train_loss": -12.171956062316895, "global_step": 271166, "epoch": 1614} {"train_loss": -11.475395202636719, "global_step": 271167, "epoch": 1614} {"train_loss": -11.480018615722656, "global_step": 271168, "epoch": 1614} {"train_loss": -11.828314781188965, "global_step": 271169, "epoch": 1614} {"train_loss": -11.377863883972168, "global_step": 271170, "epoch": 1614} {"train_loss": -10.864426612854004, "global_step": 271171, "epoch": 1614} {"train_loss": -12.045141220092773, "global_step": 271172, "epoch": 1614} {"train_loss": -11.070573806762695, "global_step": 271173, "epoch": 1614} {"train_loss": -11.016878128051758, "global_step": 271174, "epoch": 1614} {"train_loss": -11.986379623413086, "global_step": 271175, "epoch": 1614} {"train_loss": -11.866704940795898, "global_step": 271176, "epoch": 1614} {"train_loss": -11.495519638061523, "global_step": 271177, "epoch": 1614} {"train_loss": -11.695426940917969, "global_step": 271178, "epoch": 1614} {"train_loss": -12.052495002746582, "global_step": 271179, "epoch": 1614} {"train_loss": -12.026813507080078, "global_step": 271180, "epoch": 1614} {"train_loss": -12.083588600158691, "global_step": 271181, "epoch": 1614} {"train_loss": -11.984722137451172, "global_step": 271182, "epoch": 1614} {"train_loss": -11.783589363098145, "global_step": 271183, "epoch": 1614} {"train_loss": -12.13209056854248, "global_step": 271184, "epoch": 1614} {"train_loss": -11.664679527282715, "global_step": 271185, "epoch": 1614} {"train_loss": -11.833086013793945, "global_step": 271186, "epoch": 1614} {"train_loss": -12.12788200378418, "global_step": 271187, "epoch": 1614} {"train_loss": -11.740880966186523, "global_step": 271188, "epoch": 1614} {"train_loss": -12.201765060424805, "global_step": 271189, "epoch": 1614} {"train_loss": -11.74004077911377, "global_step": 271190, "epoch": 1614} {"train_loss": -12.011707305908203, "global_step": 271191, "epoch": 1614} {"train_loss": -12.17441177368164, "global_step": 271192, "epoch": 1614} {"train_loss": -11.906730651855469, "global_step": 271193, "epoch": 1614} {"train_loss": -11.925501823425293, "global_step": 271194, "epoch": 1614} {"train_loss": -11.579011917114258, "global_step": 271195, "epoch": 1614} {"train_loss": -11.970856666564941, "global_step": 271196, "epoch": 1614} {"train_loss": -11.76190185546875, "global_step": 271197, "epoch": 1614} {"train_loss": -11.94068717956543, "global_step": 271198, "epoch": 1614} {"train_loss": -11.413800239562988, "global_step": 271199, "epoch": 1614} {"train_loss": -11.654979705810547, "global_step": 271200, "epoch": 1614} {"train_loss": -11.536420822143555, "global_step": 271201, "epoch": 1614} {"train_loss": -11.854666709899902, "global_step": 271202, "epoch": 1614} {"train_loss": -11.447123527526855, "global_step": 271203, "epoch": 1614} {"train_loss": -12.117975234985352, "global_step": 271204, "epoch": 1614} {"train_loss": -11.608755111694336, "global_step": 271205, "epoch": 1614} {"train_loss": -12.157567977905273, "global_step": 271206, "epoch": 1614} {"train_loss": -11.557580947875977, "global_step": 271207, "epoch": 1614} {"train_loss": -12.153205871582031, "global_step": 271208, "epoch": 1614} {"train_loss": -11.885135650634766, "global_step": 271209, "epoch": 1614} {"train_loss": -11.907681465148926, "global_step": 271210, "epoch": 1614} {"train_loss": -11.773386001586914, "global_step": 271211, "epoch": 1614} {"train_loss": -11.792671203613281, "global_step": 271212, "epoch": 1614} {"train_loss": -11.500936508178711, "global_step": 271213, "epoch": 1614} {"train_loss": -11.601190567016602, "global_step": 271214, "epoch": 1614} {"train_loss": -11.553935050964355, "global_step": 271215, "epoch": 1614} {"train_loss": -10.894540786743164, "global_step": 271216, "epoch": 1614} {"train_loss": -11.789124488830566, "global_step": 271217, "epoch": 1614} {"train_loss": -10.459853172302246, "global_step": 271218, "epoch": 1614} {"train_loss": -11.326683044433594, "global_step": 271219, "epoch": 1614} {"train_loss": -11.082443237304688, "global_step": 271220, "epoch": 1614} {"train_loss": -10.178287506103516, "global_step": 271221, "epoch": 1614} {"train_loss": -11.728877067565918, "global_step": 271222, "epoch": 1614} {"train_loss": -10.9855318069458, "global_step": 271223, "epoch": 1614} {"train_loss": -11.054496765136719, "global_step": 271224, "epoch": 1614} {"train_loss": -11.955339431762695, "global_step": 271225, "epoch": 1614} {"train_loss": -10.521526336669922, "global_step": 271226, "epoch": 1614} {"train_loss": -11.791074752807617, "global_step": 271227, "epoch": 1614} {"train_loss": -11.053848266601562, "global_step": 271228, "epoch": 1614} {"train_loss": -11.16956901550293, "global_step": 271229, "epoch": 1614} {"train_loss": -11.714540481567383, "global_step": 271230, "epoch": 1614} {"train_loss": -10.547274589538574, "global_step": 271231, "epoch": 1614} {"train_loss": -11.125462532043457, "global_step": 271232, "epoch": 1614} {"train_loss": -11.364025115966797, "global_step": 271233, "epoch": 1614} {"train_loss": -11.872504234313965, "global_step": 271234, "epoch": 1614} {"train_loss": -11.318960189819336, "global_step": 271235, "epoch": 1614} {"train_loss": -10.956634521484375, "global_step": 271236, "epoch": 1614} {"train_loss": -11.512411117553711, "global_step": 271237, "epoch": 1614} {"train_loss": -11.135537147521973, "global_step": 271238, "epoch": 1614} {"train_loss": -11.054363250732422, "global_step": 271239, "epoch": 1614} {"train_loss": -11.743897438049316, "global_step": 271240, "epoch": 1614} {"train_loss": -11.782716751098633, "global_step": 271241, "epoch": 1614} {"train_loss": -11.742547035217285, "global_step": 271242, "epoch": 1614} {"train_loss": -11.788957595825195, "global_step": 271243, "epoch": 1614} {"train_loss": -11.677288055419922, "global_step": 271244, "epoch": 1614} {"train_loss": -11.509718894958496, "global_step": 271245, "epoch": 1614} {"train_loss": -11.696489334106445, "global_step": 271246, "epoch": 1614} {"train_loss": -11.875591278076172, "global_step": 271247, "epoch": 1614} {"train_loss": -11.39293098449707, "global_step": 271248, "epoch": 1614} {"train_loss": -11.865049362182617, "global_step": 271249, "epoch": 1614} {"train_loss": -11.576728820800781, "global_step": 271250, "epoch": 1614} {"train_loss": -12.023262977600098, "global_step": 271251, "epoch": 1614} {"train_loss": -12.002344131469727, "global_step": 271252, "epoch": 1614} {"train_loss": -12.02267837524414, "global_step": 271253, "epoch": 1614} {"train_loss": -11.836404800415039, "global_step": 271254, "epoch": 1614} {"train_loss": -11.774300575256348, "global_step": 271255, "epoch": 1614} {"train_loss": -11.964208602905273, "global_step": 271256, "epoch": 1614} {"train_loss": -11.71847152709961, "global_step": 271257, "epoch": 1614} {"train_loss": -12.065411567687988, "global_step": 271258, "epoch": 1614} {"train_loss": -11.861654281616211, "global_step": 271259, "epoch": 1614} {"train_loss": -12.104388236999512, "global_step": 271260, "epoch": 1614} {"train_loss": -11.919261932373047, "global_step": 271261, "epoch": 1614} {"train_loss": -12.073259353637695, "global_step": 271262, "epoch": 1614} {"train_loss": -11.949233055114746, "global_step": 271263, "epoch": 1614} {"train_loss": -11.837991714477539, "global_step": 271264, "epoch": 1614} {"train_loss": -12.104215621948242, "global_step": 271265, "epoch": 1614} {"train_loss": -11.944711685180664, "global_step": 271266, "epoch": 1614} {"train_loss": -12.09965991973877, "global_step": 271267, "epoch": 1614} {"train_loss": -12.017548561096191, "global_step": 271268, "epoch": 1614} {"train_loss": -12.177159309387207, "global_step": 271269, "epoch": 1614} {"train_loss": -12.086870193481445, "global_step": 271270, "epoch": 1614} {"train_loss": -11.954401016235352, "global_step": 271271, "epoch": 1614} {"train_loss": -12.148399353027344, "global_step": 271272, "epoch": 1614} {"train_loss": -12.028289794921875, "global_step": 271273, "epoch": 1614} {"train_loss": -11.85460376739502, "global_step": 271274, "epoch": 1614} {"train_loss": -12.27098560333252, "global_step": 271275, "epoch": 1614} {"train_loss": -11.960824012756348, "global_step": 271276, "epoch": 1614} {"train_loss": -12.160679817199707, "global_step": 271277, "epoch": 1614} {"train_loss": -11.917726516723633, "global_step": 271278, "epoch": 1614} {"train_loss": -12.094520568847656, "global_step": 271279, "epoch": 1614} {"train_loss": -12.038330078125, "global_step": 271280, "epoch": 1614} {"train_loss": -12.192142486572266, "global_step": 271281, "epoch": 1614} {"train_loss": -12.168781280517578, "global_step": 271282, "epoch": 1614} {"train_loss": -12.105268478393555, "global_step": 271283, "epoch": 1614} {"train_loss": -12.120319366455078, "global_step": 271284, "epoch": 1614} {"train_loss": -12.188425064086914, "global_step": 271285, "epoch": 1614} {"train_loss": -11.755813598632812, "global_step": 271286, "epoch": 1614} {"train_loss": -11.870613098144531, "global_step": 271287, "epoch": 1614} {"train_loss": -12.414412498474121, "global_step": 271288, "epoch": 1614} {"train_loss": -12.10935115814209, "global_step": 271289, "epoch": 1614} {"train_loss": -11.930293083190918, "global_step": 271290, "epoch": 1614} {"train_loss": -12.044326782226562, "global_step": 271291, "epoch": 1614} {"train_loss": -12.00684928894043, "global_step": 271292, "epoch": 1614} {"train_loss": -12.075589179992676, "global_step": 271293, "epoch": 1614} {"train_loss": -11.723003387451172, "global_step": 271294, "epoch": 1614} {"train_loss": -11.92944622039795, "global_step": 271295, "epoch": 1614} {"train_loss": -12.044631958007812, "global_step": 271296, "epoch": 1614} {"train_loss": -12.185310363769531, "global_step": 271297, "epoch": 1614} {"train_loss": -12.169032096862793, "global_step": 271298, "epoch": 1614} {"train_loss": -12.312724113464355, "global_step": 271299, "epoch": 1614} {"train_loss": -12.086228370666504, "global_step": 271300, "epoch": 1614} {"train_loss": -11.574247360229492, "global_step": 271301, "epoch": 1614} {"train_loss": -11.98421859741211, "global_step": 271302, "epoch": 1614} {"train_loss": -11.828554153442383, "global_step": 271303, "epoch": 1614} {"train_loss": -11.314334869384766, "global_step": 271304, "epoch": 1614} {"train_loss": -11.219755172729492, "global_step": 271305, "epoch": 1614} {"train_loss": -11.497421264648438, "global_step": 271306, "epoch": 1614} {"train_loss": -11.625795364379883, "global_step": 271307, "epoch": 1614} {"train_loss": -11.370147705078125, "global_step": 271308, "epoch": 1614} {"train_loss": -10.860490798950195, "global_step": 271309, "epoch": 1614} {"train_loss": -11.1581449508667, "global_step": 271310, "epoch": 1614} {"train_loss": -11.362031936645508, "global_step": 271311, "epoch": 1614} {"train_loss": -10.78117561340332, "global_step": 271312, "epoch": 1614} {"train_loss": -11.278468132019043, "global_step": 271313, "epoch": 1614} {"train_loss": -11.577878952026367, "global_step": 271314, "epoch": 1614} {"train_loss": -11.142127990722656, "global_step": 271315, "epoch": 1614} {"train_loss": -11.357202529907227, "global_step": 271316, "epoch": 1614} {"train_loss": -12.13693618774414, "global_step": 271317, "epoch": 1614} {"train_loss": -11.071829795837402, "global_step": 271318, "epoch": 1614} {"train_loss": -11.736327177002316, "global_step": 271319, "epoch": 1614, "val_loss": 275999.03125} {"train_loss": -11.274388313293457, "global_step": 271320, "epoch": 1615} {"train_loss": -11.813907623291016, "global_step": 271321, "epoch": 1615} {"train_loss": -11.501564025878906, "global_step": 271322, "epoch": 1615} {"train_loss": -11.56354808807373, "global_step": 271323, "epoch": 1615} {"train_loss": -11.853649139404297, "global_step": 271324, "epoch": 1615} {"train_loss": -11.86268424987793, "global_step": 271325, "epoch": 1615} {"train_loss": -11.51739501953125, "global_step": 271326, "epoch": 1615} {"train_loss": -11.476461410522461, "global_step": 271327, "epoch": 1615} {"train_loss": -11.89029312133789, "global_step": 271328, "epoch": 1615} {"train_loss": -11.87901496887207, "global_step": 271329, "epoch": 1615} {"train_loss": -11.83845329284668, "global_step": 271330, "epoch": 1615} {"train_loss": -11.987489700317383, "global_step": 271331, "epoch": 1615} {"train_loss": -11.776019096374512, "global_step": 271332, "epoch": 1615} {"train_loss": -12.05679702758789, "global_step": 271333, "epoch": 1615} {"train_loss": -11.969521522521973, "global_step": 271334, "epoch": 1615} {"train_loss": -11.69870376586914, "global_step": 271335, "epoch": 1615} {"train_loss": -11.871591567993164, "global_step": 271336, "epoch": 1615} {"train_loss": -12.011493682861328, "global_step": 271337, "epoch": 1615} {"train_loss": -11.968828201293945, "global_step": 271338, "epoch": 1615} {"train_loss": -11.829734802246094, "global_step": 271339, "epoch": 1615} {"train_loss": -11.818361282348633, "global_step": 271340, "epoch": 1615} {"train_loss": -12.056669235229492, "global_step": 271341, "epoch": 1615} {"train_loss": -11.679466247558594, "global_step": 271342, "epoch": 1615} {"train_loss": -12.157472610473633, "global_step": 271343, "epoch": 1615} {"train_loss": -11.997431755065918, "global_step": 271344, "epoch": 1615} {"train_loss": -11.58067512512207, "global_step": 271345, "epoch": 1615} {"train_loss": -11.697091102600098, "global_step": 271346, "epoch": 1615} {"train_loss": -12.032029151916504, "global_step": 271347, "epoch": 1615} {"train_loss": -11.46738338470459, "global_step": 271348, "epoch": 1615} {"train_loss": -11.973233222961426, "global_step": 271349, "epoch": 1615} {"train_loss": -11.384971618652344, "global_step": 271350, "epoch": 1615} {"train_loss": -11.392659187316895, "global_step": 271351, "epoch": 1615} {"train_loss": -12.12509536743164, "global_step": 271352, "epoch": 1615} {"train_loss": -11.124528884887695, "global_step": 271353, "epoch": 1615} {"train_loss": -11.084672927856445, "global_step": 271354, "epoch": 1615} {"train_loss": -11.052525520324707, "global_step": 271355, "epoch": 1615} {"train_loss": -11.163862228393555, "global_step": 271356, "epoch": 1615} {"train_loss": -11.272506713867188, "global_step": 271357, "epoch": 1615} {"train_loss": -12.028463363647461, "global_step": 271358, "epoch": 1615} {"train_loss": -11.631156921386719, "global_step": 271359, "epoch": 1615} {"train_loss": -11.627870559692383, "global_step": 271360, "epoch": 1615} {"train_loss": -11.567946434020996, "global_step": 271361, "epoch": 1615} {"train_loss": -11.38654899597168, "global_step": 271362, "epoch": 1615} {"train_loss": -11.78258228302002, "global_step": 271363, "epoch": 1615} {"train_loss": -11.194435119628906, "global_step": 271364, "epoch": 1615} {"train_loss": -12.270339965820312, "global_step": 271365, "epoch": 1615} {"train_loss": -11.049068450927734, "global_step": 271366, "epoch": 1615} {"train_loss": -11.945635795593262, "global_step": 271367, "epoch": 1615} {"train_loss": -11.511610984802246, "global_step": 271368, "epoch": 1615} {"train_loss": -10.882346153259277, "global_step": 271369, "epoch": 1615} {"train_loss": -11.718950271606445, "global_step": 271370, "epoch": 1615} {"train_loss": -11.287495613098145, "global_step": 271371, "epoch": 1615} {"train_loss": -11.523331642150879, "global_step": 271372, "epoch": 1615} {"train_loss": -11.529891014099121, "global_step": 271373, "epoch": 1615} {"train_loss": -11.446282386779785, "global_step": 271374, "epoch": 1615} {"train_loss": -11.048233032226562, "global_step": 271375, "epoch": 1615} {"train_loss": -11.895890235900879, "global_step": 271376, "epoch": 1615} {"train_loss": -10.86861801147461, "global_step": 271377, "epoch": 1615} {"train_loss": -11.912839889526367, "global_step": 271378, "epoch": 1615} {"train_loss": -11.686897277832031, "global_step": 271379, "epoch": 1615} {"train_loss": -11.231958389282227, "global_step": 271380, "epoch": 1615} {"train_loss": -11.234227180480957, "global_step": 271381, "epoch": 1615} {"train_loss": -11.52476692199707, "global_step": 271382, "epoch": 1615} {"train_loss": -11.15186595916748, "global_step": 271383, "epoch": 1615} {"train_loss": -11.094636917114258, "global_step": 271384, "epoch": 1615} {"train_loss": -11.504162788391113, "global_step": 271385, "epoch": 1615} {"train_loss": -11.26252555847168, "global_step": 271386, "epoch": 1615} {"train_loss": -11.850046157836914, "global_step": 271387, "epoch": 1615} {"train_loss": -11.09719181060791, "global_step": 271388, "epoch": 1615} {"train_loss": -10.545804023742676, "global_step": 271389, "epoch": 1615} {"train_loss": -11.177458763122559, "global_step": 271390, "epoch": 1615} {"train_loss": -11.35793685913086, "global_step": 271391, "epoch": 1615} {"train_loss": -11.382732391357422, "global_step": 271392, "epoch": 1615} {"train_loss": -12.006481170654297, "global_step": 271393, "epoch": 1615} {"train_loss": -11.97247314453125, "global_step": 271394, "epoch": 1615} {"train_loss": -11.702238082885742, "global_step": 271395, "epoch": 1615} {"train_loss": -12.000396728515625, "global_step": 271396, "epoch": 1615} {"train_loss": -11.47954273223877, "global_step": 271397, "epoch": 1615} {"train_loss": -11.926515579223633, "global_step": 271398, "epoch": 1615} {"train_loss": -11.654088020324707, "global_step": 271399, "epoch": 1615} {"train_loss": -11.881221771240234, "global_step": 271400, "epoch": 1615} {"train_loss": -12.007253646850586, "global_step": 271401, "epoch": 1615} {"train_loss": -11.604850769042969, "global_step": 271402, "epoch": 1615} {"train_loss": -11.626858711242676, "global_step": 271403, "epoch": 1615} {"train_loss": -11.632797241210938, "global_step": 271404, "epoch": 1615} {"train_loss": -11.7006254196167, "global_step": 271405, "epoch": 1615} {"train_loss": -11.919953346252441, "global_step": 271406, "epoch": 1615} {"train_loss": -11.415775299072266, "global_step": 271407, "epoch": 1615} {"train_loss": -11.748819351196289, "global_step": 271408, "epoch": 1615} {"train_loss": -12.077005386352539, "global_step": 271409, "epoch": 1615} {"train_loss": -12.103050231933594, "global_step": 271410, "epoch": 1615} {"train_loss": -11.750974655151367, "global_step": 271411, "epoch": 1615} {"train_loss": -11.55117416381836, "global_step": 271412, "epoch": 1615} {"train_loss": -12.074291229248047, "global_step": 271413, "epoch": 1615} {"train_loss": -11.54703140258789, "global_step": 271414, "epoch": 1615} {"train_loss": -11.938274383544922, "global_step": 271415, "epoch": 1615} {"train_loss": -11.853349685668945, "global_step": 271416, "epoch": 1615} {"train_loss": -12.284707069396973, "global_step": 271417, "epoch": 1615} {"train_loss": -12.01628303527832, "global_step": 271418, "epoch": 1615} {"train_loss": -11.966475486755371, "global_step": 271419, "epoch": 1615} {"train_loss": -12.054880142211914, "global_step": 271420, "epoch": 1615} {"train_loss": -12.101043701171875, "global_step": 271421, "epoch": 1615} {"train_loss": -11.855400085449219, "global_step": 271422, "epoch": 1615} {"train_loss": -12.061300277709961, "global_step": 271423, "epoch": 1615} {"train_loss": -12.160905838012695, "global_step": 271424, "epoch": 1615} {"train_loss": -11.612622261047363, "global_step": 271425, "epoch": 1615} {"train_loss": -12.111658096313477, "global_step": 271426, "epoch": 1615} {"train_loss": -11.954488754272461, "global_step": 271427, "epoch": 1615} {"train_loss": -11.869874954223633, "global_step": 271428, "epoch": 1615} {"train_loss": -12.100652694702148, "global_step": 271429, "epoch": 1615} {"train_loss": -11.949649810791016, "global_step": 271430, "epoch": 1615} {"train_loss": -11.668413162231445, "global_step": 271431, "epoch": 1615} {"train_loss": -12.120965003967285, "global_step": 271432, "epoch": 1615} {"train_loss": -11.790398597717285, "global_step": 271433, "epoch": 1615} {"train_loss": -11.921695709228516, "global_step": 271434, "epoch": 1615} {"train_loss": -12.005474090576172, "global_step": 271435, "epoch": 1615} {"train_loss": -11.654861450195312, "global_step": 271436, "epoch": 1615} {"train_loss": -11.05466079711914, "global_step": 271437, "epoch": 1615} {"train_loss": -11.301395416259766, "global_step": 271438, "epoch": 1615} {"train_loss": -12.112966537475586, "global_step": 271439, "epoch": 1615} {"train_loss": -11.517274856567383, "global_step": 271440, "epoch": 1615} {"train_loss": -12.013267517089844, "global_step": 271441, "epoch": 1615} {"train_loss": -11.984609603881836, "global_step": 271442, "epoch": 1615} {"train_loss": -11.912532806396484, "global_step": 271443, "epoch": 1615} {"train_loss": -12.180887222290039, "global_step": 271444, "epoch": 1615} {"train_loss": -12.127388954162598, "global_step": 271445, "epoch": 1615} {"train_loss": -11.9554443359375, "global_step": 271446, "epoch": 1615} {"train_loss": -12.237669944763184, "global_step": 271447, "epoch": 1615} {"train_loss": -11.863399505615234, "global_step": 271448, "epoch": 1615} {"train_loss": -11.995323181152344, "global_step": 271449, "epoch": 1615} {"train_loss": -12.110708236694336, "global_step": 271450, "epoch": 1615} {"train_loss": -12.06368637084961, "global_step": 271451, "epoch": 1615} {"train_loss": -11.924972534179688, "global_step": 271452, "epoch": 1615} {"train_loss": -12.047043800354004, "global_step": 271453, "epoch": 1615} {"train_loss": -12.142830848693848, "global_step": 271454, "epoch": 1615} {"train_loss": -12.171930313110352, "global_step": 271455, "epoch": 1615} {"train_loss": -11.571157455444336, "global_step": 271456, "epoch": 1615} {"train_loss": -11.691675186157227, "global_step": 271457, "epoch": 1615} {"train_loss": -11.565606117248535, "global_step": 271458, "epoch": 1615} {"train_loss": -12.026351928710938, "global_step": 271459, "epoch": 1615} {"train_loss": -11.084192276000977, "global_step": 271460, "epoch": 1615} {"train_loss": -11.964046478271484, "global_step": 271461, "epoch": 1615} {"train_loss": -11.760455131530762, "global_step": 271462, "epoch": 1615} {"train_loss": -11.401784896850586, "global_step": 271463, "epoch": 1615} {"train_loss": -11.636163711547852, "global_step": 271464, "epoch": 1615} {"train_loss": -11.433748245239258, "global_step": 271465, "epoch": 1615} {"train_loss": -11.501850128173828, "global_step": 271466, "epoch": 1615} {"train_loss": -11.193604469299316, "global_step": 271467, "epoch": 1615} {"train_loss": -11.432607650756836, "global_step": 271468, "epoch": 1615} {"train_loss": -11.12462043762207, "global_step": 271469, "epoch": 1615} {"train_loss": -11.866301536560059, "global_step": 271470, "epoch": 1615} {"train_loss": -11.367289543151855, "global_step": 271471, "epoch": 1615} {"train_loss": -11.242330551147461, "global_step": 271472, "epoch": 1615} {"train_loss": -11.7684907913208, "global_step": 271473, "epoch": 1615} {"train_loss": -11.760772705078125, "global_step": 271474, "epoch": 1615} {"train_loss": -11.559964179992676, "global_step": 271475, "epoch": 1615} {"train_loss": -11.495796203613281, "global_step": 271476, "epoch": 1615} {"train_loss": -11.181371688842773, "global_step": 271477, "epoch": 1615} {"train_loss": -11.741155624389648, "global_step": 271478, "epoch": 1615} {"train_loss": -11.607603073120117, "global_step": 271479, "epoch": 1615} {"train_loss": -11.576057434082031, "global_step": 271480, "epoch": 1615} {"train_loss": -11.275287628173828, "global_step": 271481, "epoch": 1615} {"train_loss": -11.41469955444336, "global_step": 271482, "epoch": 1615} {"train_loss": -11.856555938720703, "global_step": 271483, "epoch": 1615} {"train_loss": -11.942550659179688, "global_step": 271484, "epoch": 1615} {"train_loss": -11.839163780212402, "global_step": 271485, "epoch": 1615} {"train_loss": -11.321874618530273, "global_step": 271486, "epoch": 1615} {"train_loss": -11.692754558154515, "global_step": 271487, "epoch": 1615, "val_loss": 274396.25, "train_action_mse_error": 1.2981359958648682} {"train_loss": -11.654407501220703, "global_step": 271488, "epoch": 1616} {"train_loss": -11.748902320861816, "global_step": 271489, "epoch": 1616} {"train_loss": -11.861696243286133, "global_step": 271490, "epoch": 1616} {"train_loss": -11.921113967895508, "global_step": 271491, "epoch": 1616} {"train_loss": -11.759258270263672, "global_step": 271492, "epoch": 1616} {"train_loss": -11.747349739074707, "global_step": 271493, "epoch": 1616} {"train_loss": -12.079026222229004, "global_step": 271494, "epoch": 1616} {"train_loss": -11.996076583862305, "global_step": 271495, "epoch": 1616} {"train_loss": -11.948907852172852, "global_step": 271496, "epoch": 1616} {"train_loss": -12.040384292602539, "global_step": 271497, "epoch": 1616} {"train_loss": -11.805356979370117, "global_step": 271498, "epoch": 1616} {"train_loss": -11.805986404418945, "global_step": 271499, "epoch": 1616} {"train_loss": -11.889636993408203, "global_step": 271500, "epoch": 1616} {"train_loss": -11.882349014282227, "global_step": 271501, "epoch": 1616} {"train_loss": -11.504827499389648, "global_step": 271502, "epoch": 1616} {"train_loss": -12.291526794433594, "global_step": 271503, "epoch": 1616} {"train_loss": -11.97110366821289, "global_step": 271504, "epoch": 1616} {"train_loss": -11.926395416259766, "global_step": 271505, "epoch": 1616} {"train_loss": -11.770597457885742, "global_step": 271506, "epoch": 1616} {"train_loss": -12.028596878051758, "global_step": 271507, "epoch": 1616} {"train_loss": -11.980338096618652, "global_step": 271508, "epoch": 1616} {"train_loss": -11.816068649291992, "global_step": 271509, "epoch": 1616} {"train_loss": -11.7471342086792, "global_step": 271510, "epoch": 1616} {"train_loss": -12.15566349029541, "global_step": 271511, "epoch": 1616} {"train_loss": -11.917856216430664, "global_step": 271512, "epoch": 1616} {"train_loss": -12.111024856567383, "global_step": 271513, "epoch": 1616} {"train_loss": -11.564859390258789, "global_step": 271514, "epoch": 1616} {"train_loss": -12.254228591918945, "global_step": 271515, "epoch": 1616} {"train_loss": -11.598909378051758, "global_step": 271516, "epoch": 1616} {"train_loss": -11.785812377929688, "global_step": 271517, "epoch": 1616} {"train_loss": -11.766295433044434, "global_step": 271518, "epoch": 1616} {"train_loss": -11.136011123657227, "global_step": 271519, "epoch": 1616} {"train_loss": -10.922977447509766, "global_step": 271520, "epoch": 1616} {"train_loss": -11.03620719909668, "global_step": 271521, "epoch": 1616} {"train_loss": -10.214176177978516, "global_step": 271522, "epoch": 1616} {"train_loss": -10.913737297058105, "global_step": 271523, "epoch": 1616} {"train_loss": -11.198127746582031, "global_step": 271524, "epoch": 1616} {"train_loss": -10.38441276550293, "global_step": 271525, "epoch": 1616} {"train_loss": -11.28338623046875, "global_step": 271526, "epoch": 1616} {"train_loss": -10.276076316833496, "global_step": 271527, "epoch": 1616} {"train_loss": -11.607872009277344, "global_step": 271528, "epoch": 1616} {"train_loss": -11.667214393615723, "global_step": 271529, "epoch": 1616} {"train_loss": -10.840860366821289, "global_step": 271530, "epoch": 1616} {"train_loss": -10.808647155761719, "global_step": 271531, "epoch": 1616} {"train_loss": -10.742223739624023, "global_step": 271532, "epoch": 1616} {"train_loss": -11.143595695495605, "global_step": 271533, "epoch": 1616} {"train_loss": -10.728095054626465, "global_step": 271534, "epoch": 1616} {"train_loss": -11.469940185546875, "global_step": 271535, "epoch": 1616} {"train_loss": -10.54109001159668, "global_step": 271536, "epoch": 1616} {"train_loss": -11.570141792297363, "global_step": 271537, "epoch": 1616} {"train_loss": -10.562775611877441, "global_step": 271538, "epoch": 1616} {"train_loss": -10.997090339660645, "global_step": 271539, "epoch": 1616} {"train_loss": -10.386932373046875, "global_step": 271540, "epoch": 1616} {"train_loss": -10.636878967285156, "global_step": 271541, "epoch": 1616} {"train_loss": -10.704678535461426, "global_step": 271542, "epoch": 1616} {"train_loss": -8.850855827331543, "global_step": 271543, "epoch": 1616} {"train_loss": -9.973949432373047, "global_step": 271544, "epoch": 1616} {"train_loss": -11.050358772277832, "global_step": 271545, "epoch": 1616} {"train_loss": -9.153463363647461, "global_step": 271546, "epoch": 1616} {"train_loss": -10.17341136932373, "global_step": 271547, "epoch": 1616} {"train_loss": -10.832058906555176, "global_step": 271548, "epoch": 1616} {"train_loss": -8.841462135314941, "global_step": 271549, "epoch": 1616} {"train_loss": -9.379851341247559, "global_step": 271550, "epoch": 1616} {"train_loss": -10.351645469665527, "global_step": 271551, "epoch": 1616} {"train_loss": -9.992805480957031, "global_step": 271552, "epoch": 1616} {"train_loss": -9.227426528930664, "global_step": 271553, "epoch": 1616} {"train_loss": -10.707818984985352, "global_step": 271554, "epoch": 1616} {"train_loss": -10.411103248596191, "global_step": 271555, "epoch": 1616} {"train_loss": -10.312601089477539, "global_step": 271556, "epoch": 1616} {"train_loss": -10.086606979370117, "global_step": 271557, "epoch": 1616} {"train_loss": -11.17171859741211, "global_step": 271558, "epoch": 1616} {"train_loss": -10.217508316040039, "global_step": 271559, "epoch": 1616} {"train_loss": -9.675392150878906, "global_step": 271560, "epoch": 1616} {"train_loss": -9.728768348693848, "global_step": 271561, "epoch": 1616} {"train_loss": -10.60387134552002, "global_step": 271562, "epoch": 1616} {"train_loss": -10.510557174682617, "global_step": 271563, "epoch": 1616} {"train_loss": -9.71377944946289, "global_step": 271564, "epoch": 1616} {"train_loss": -10.389723777770996, "global_step": 271565, "epoch": 1616} {"train_loss": -11.047958374023438, "global_step": 271566, "epoch": 1616} {"train_loss": -10.1917724609375, "global_step": 271567, "epoch": 1616} {"train_loss": -9.693136215209961, "global_step": 271568, "epoch": 1616} {"train_loss": -11.051494598388672, "global_step": 271569, "epoch": 1616} {"train_loss": -10.641969680786133, "global_step": 271570, "epoch": 1616} {"train_loss": -10.205835342407227, "global_step": 271571, "epoch": 1616} {"train_loss": -10.914449691772461, "global_step": 271572, "epoch": 1616} {"train_loss": -11.225252151489258, "global_step": 271573, "epoch": 1616} {"train_loss": -10.268390655517578, "global_step": 271574, "epoch": 1616} {"train_loss": -10.820568084716797, "global_step": 271575, "epoch": 1616} {"train_loss": -11.387569427490234, "global_step": 271576, "epoch": 1616} {"train_loss": -11.058887481689453, "global_step": 271577, "epoch": 1616} {"train_loss": -10.851909637451172, "global_step": 271578, "epoch": 1616} {"train_loss": -11.549854278564453, "global_step": 271579, "epoch": 1616} {"train_loss": -11.747257232666016, "global_step": 271580, "epoch": 1616} {"train_loss": -11.040258407592773, "global_step": 271581, "epoch": 1616} {"train_loss": -11.137943267822266, "global_step": 271582, "epoch": 1616} {"train_loss": -11.655101776123047, "global_step": 271583, "epoch": 1616} {"train_loss": -11.474393844604492, "global_step": 271584, "epoch": 1616} {"train_loss": -11.222307205200195, "global_step": 271585, "epoch": 1616} {"train_loss": -11.302512168884277, "global_step": 271586, "epoch": 1616} {"train_loss": -11.60888671875, "global_step": 271587, "epoch": 1616} {"train_loss": -11.544699668884277, "global_step": 271588, "epoch": 1616} {"train_loss": -11.434115409851074, "global_step": 271589, "epoch": 1616} {"train_loss": -11.781394004821777, "global_step": 271590, "epoch": 1616} {"train_loss": -11.730143547058105, "global_step": 271591, "epoch": 1616} {"train_loss": -11.455316543579102, "global_step": 271592, "epoch": 1616} {"train_loss": -11.559415817260742, "global_step": 271593, "epoch": 1616} {"train_loss": -11.677896499633789, "global_step": 271594, "epoch": 1616} {"train_loss": -11.540285110473633, "global_step": 271595, "epoch": 1616} {"train_loss": -11.749334335327148, "global_step": 271596, "epoch": 1616} {"train_loss": -11.602642059326172, "global_step": 271597, "epoch": 1616} {"train_loss": -11.656265258789062, "global_step": 271598, "epoch": 1616} {"train_loss": -11.773550033569336, "global_step": 271599, "epoch": 1616} {"train_loss": -11.705793380737305, "global_step": 271600, "epoch": 1616} {"train_loss": -11.488338470458984, "global_step": 271601, "epoch": 1616} {"train_loss": -11.84371280670166, "global_step": 271602, "epoch": 1616} {"train_loss": -11.472152709960938, "global_step": 271603, "epoch": 1616} {"train_loss": -11.964600563049316, "global_step": 271604, "epoch": 1616} {"train_loss": -11.885744094848633, "global_step": 271605, "epoch": 1616} {"train_loss": -12.103521347045898, "global_step": 271606, "epoch": 1616} {"train_loss": -11.802535057067871, "global_step": 271607, "epoch": 1616} {"train_loss": -11.99733829498291, "global_step": 271608, "epoch": 1616} {"train_loss": -11.739291191101074, "global_step": 271609, "epoch": 1616} {"train_loss": -12.061408042907715, "global_step": 271610, "epoch": 1616} {"train_loss": -11.767536163330078, "global_step": 271611, "epoch": 1616} {"train_loss": -11.875391006469727, "global_step": 271612, "epoch": 1616} {"train_loss": -11.813850402832031, "global_step": 271613, "epoch": 1616} {"train_loss": -11.936857223510742, "global_step": 271614, "epoch": 1616} {"train_loss": -12.131436347961426, "global_step": 271615, "epoch": 1616} {"train_loss": -11.945707321166992, "global_step": 271616, "epoch": 1616} {"train_loss": -11.873897552490234, "global_step": 271617, "epoch": 1616} {"train_loss": -11.678672790527344, "global_step": 271618, "epoch": 1616} {"train_loss": -11.989645004272461, "global_step": 271619, "epoch": 1616} {"train_loss": -12.103659629821777, "global_step": 271620, "epoch": 1616} {"train_loss": -11.99793529510498, "global_step": 271621, "epoch": 1616} {"train_loss": -11.899484634399414, "global_step": 271622, "epoch": 1616} {"train_loss": -11.896846771240234, "global_step": 271623, "epoch": 1616} {"train_loss": -12.11058521270752, "global_step": 271624, "epoch": 1616} {"train_loss": -12.025583267211914, "global_step": 271625, "epoch": 1616} {"train_loss": -12.061306953430176, "global_step": 271626, "epoch": 1616} {"train_loss": -11.947649002075195, "global_step": 271627, "epoch": 1616} {"train_loss": -12.141719818115234, "global_step": 271628, "epoch": 1616} {"train_loss": -11.94737720489502, "global_step": 271629, "epoch": 1616} {"train_loss": -12.150050163269043, "global_step": 271630, "epoch": 1616} {"train_loss": -12.03885269165039, "global_step": 271631, "epoch": 1616} {"train_loss": -12.130901336669922, "global_step": 271632, "epoch": 1616} {"train_loss": -12.137399673461914, "global_step": 271633, "epoch": 1616} {"train_loss": -12.213027000427246, "global_step": 271634, "epoch": 1616} {"train_loss": -12.195652961730957, "global_step": 271635, "epoch": 1616} {"train_loss": -12.242539405822754, "global_step": 271636, "epoch": 1616} {"train_loss": -12.150165557861328, "global_step": 271637, "epoch": 1616} {"train_loss": -12.004430770874023, "global_step": 271638, "epoch": 1616} {"train_loss": -11.916635513305664, "global_step": 271639, "epoch": 1616} {"train_loss": -11.78396987915039, "global_step": 271640, "epoch": 1616} {"train_loss": -12.171930313110352, "global_step": 271641, "epoch": 1616} {"train_loss": -12.010990142822266, "global_step": 271642, "epoch": 1616} {"train_loss": -12.07907485961914, "global_step": 271643, "epoch": 1616} {"train_loss": -12.290071487426758, "global_step": 271644, "epoch": 1616} {"train_loss": -11.808563232421875, "global_step": 271645, "epoch": 1616} {"train_loss": -12.097860336303711, "global_step": 271646, "epoch": 1616} {"train_loss": -12.129192352294922, "global_step": 271647, "epoch": 1616} {"train_loss": -12.174369812011719, "global_step": 271648, "epoch": 1616} {"train_loss": -11.987296104431152, "global_step": 271649, "epoch": 1616} {"train_loss": -12.028959274291992, "global_step": 271650, "epoch": 1616} {"train_loss": -11.207478523254395, "global_step": 271651, "epoch": 1616} {"train_loss": -11.052938461303711, "global_step": 271652, "epoch": 1616} {"train_loss": -11.441537857055664, "global_step": 271653, "epoch": 1616} {"train_loss": -11.790990829467773, "global_step": 271654, "epoch": 1616} {"train_loss": -11.374174418903532, "global_step": 271655, "epoch": 1616, "val_loss": 267653.75} {"train_loss": -10.994449615478516, "global_step": 271656, "epoch": 1617} {"train_loss": -11.71422290802002, "global_step": 271657, "epoch": 1617} {"train_loss": -10.657828330993652, "global_step": 271658, "epoch": 1617} {"train_loss": -11.899035453796387, "global_step": 271659, "epoch": 1617} {"train_loss": -10.617119789123535, "global_step": 271660, "epoch": 1617} {"train_loss": -7.987979888916016, "global_step": 271661, "epoch": 1617} {"train_loss": -11.282227516174316, "global_step": 271662, "epoch": 1617} {"train_loss": -7.002188205718994, "global_step": 271663, "epoch": 1617} {"train_loss": -11.446807861328125, "global_step": 271664, "epoch": 1617} {"train_loss": -8.226608276367188, "global_step": 271665, "epoch": 1617} {"train_loss": -8.984273910522461, "global_step": 271666, "epoch": 1617} {"train_loss": -5.849590301513672, "global_step": 271667, "epoch": 1617} {"train_loss": -5.893280982971191, "global_step": 271668, "epoch": 1617} {"train_loss": -6.87344217300415, "global_step": 271669, "epoch": 1617} {"train_loss": -6.939511299133301, "global_step": 271670, "epoch": 1617} {"train_loss": -5.8469109535217285, "global_step": 271671, "epoch": 1617} {"train_loss": -5.504162788391113, "global_step": 271672, "epoch": 1617} {"train_loss": -6.045051574707031, "global_step": 271673, "epoch": 1617} {"train_loss": -6.627938270568848, "global_step": 271674, "epoch": 1617} {"train_loss": -7.88451623916626, "global_step": 271675, "epoch": 1617} {"train_loss": -8.998977661132812, "global_step": 271676, "epoch": 1617} {"train_loss": -8.716696739196777, "global_step": 271677, "epoch": 1617} {"train_loss": -8.874099731445312, "global_step": 271678, "epoch": 1617} {"train_loss": -10.4362154006958, "global_step": 271679, "epoch": 1617} {"train_loss": -10.116965293884277, "global_step": 271680, "epoch": 1617} {"train_loss": -9.792562484741211, "global_step": 271681, "epoch": 1617} {"train_loss": -10.795520782470703, "global_step": 271682, "epoch": 1617} {"train_loss": -10.555805206298828, "global_step": 271683, "epoch": 1617} {"train_loss": -9.341472625732422, "global_step": 271684, "epoch": 1617} {"train_loss": -11.105835914611816, "global_step": 271685, "epoch": 1617} {"train_loss": -10.320655822753906, "global_step": 271686, "epoch": 1617} {"train_loss": -10.50631332397461, "global_step": 271687, "epoch": 1617} {"train_loss": -10.658573150634766, "global_step": 271688, "epoch": 1617} {"train_loss": -10.430204391479492, "global_step": 271689, "epoch": 1617} {"train_loss": -10.4764404296875, "global_step": 271690, "epoch": 1617} {"train_loss": -11.019979476928711, "global_step": 271691, "epoch": 1617} {"train_loss": -10.781658172607422, "global_step": 271692, "epoch": 1617} {"train_loss": -10.661806106567383, "global_step": 271693, "epoch": 1617} {"train_loss": -11.214923858642578, "global_step": 271694, "epoch": 1617} {"train_loss": -11.02720832824707, "global_step": 271695, "epoch": 1617} {"train_loss": -11.23106575012207, "global_step": 271696, "epoch": 1617} {"train_loss": -11.124507904052734, "global_step": 271697, "epoch": 1617} {"train_loss": -10.946983337402344, "global_step": 271698, "epoch": 1617} {"train_loss": -11.378582000732422, "global_step": 271699, "epoch": 1617} {"train_loss": -11.1070556640625, "global_step": 271700, "epoch": 1617} {"train_loss": -11.32666301727295, "global_step": 271701, "epoch": 1617} {"train_loss": -11.58892822265625, "global_step": 271702, "epoch": 1617} {"train_loss": -11.648070335388184, "global_step": 271703, "epoch": 1617} {"train_loss": -11.276618003845215, "global_step": 271704, "epoch": 1617} {"train_loss": -11.589561462402344, "global_step": 271705, "epoch": 1617} {"train_loss": -11.295357704162598, "global_step": 271706, "epoch": 1617} {"train_loss": -11.462928771972656, "global_step": 271707, "epoch": 1617} {"train_loss": -11.608993530273438, "global_step": 271708, "epoch": 1617} {"train_loss": -11.625357627868652, "global_step": 271709, "epoch": 1617} {"train_loss": -11.506053924560547, "global_step": 271710, "epoch": 1617} {"train_loss": -11.516637802124023, "global_step": 271711, "epoch": 1617} {"train_loss": -11.803215980529785, "global_step": 271712, "epoch": 1617} {"train_loss": -11.552484512329102, "global_step": 271713, "epoch": 1617} {"train_loss": -11.671220779418945, "global_step": 271714, "epoch": 1617} {"train_loss": -11.628885269165039, "global_step": 271715, "epoch": 1617} {"train_loss": -11.537256240844727, "global_step": 271716, "epoch": 1617} {"train_loss": -11.927789688110352, "global_step": 271717, "epoch": 1617} {"train_loss": -11.79874038696289, "global_step": 271718, "epoch": 1617} {"train_loss": -11.615200996398926, "global_step": 271719, "epoch": 1617} {"train_loss": -11.797211647033691, "global_step": 271720, "epoch": 1617} {"train_loss": -11.630455017089844, "global_step": 271721, "epoch": 1617} {"train_loss": -11.654406547546387, "global_step": 271722, "epoch": 1617} {"train_loss": -11.851042747497559, "global_step": 271723, "epoch": 1617} {"train_loss": -11.818191528320312, "global_step": 271724, "epoch": 1617} {"train_loss": -11.855264663696289, "global_step": 271725, "epoch": 1617} {"train_loss": -11.677032470703125, "global_step": 271726, "epoch": 1617} {"train_loss": -11.721429824829102, "global_step": 271727, "epoch": 1617} {"train_loss": -11.940787315368652, "global_step": 271728, "epoch": 1617} {"train_loss": -11.868562698364258, "global_step": 271729, "epoch": 1617} {"train_loss": -12.037957191467285, "global_step": 271730, "epoch": 1617} {"train_loss": -11.978373527526855, "global_step": 271731, "epoch": 1617} {"train_loss": -12.002418518066406, "global_step": 271732, "epoch": 1617} {"train_loss": -11.878876686096191, "global_step": 271733, "epoch": 1617} {"train_loss": -11.936580657958984, "global_step": 271734, "epoch": 1617} {"train_loss": -11.885098457336426, "global_step": 271735, "epoch": 1617} {"train_loss": -11.90493392944336, "global_step": 271736, "epoch": 1617} {"train_loss": -11.969831466674805, "global_step": 271737, "epoch": 1617} {"train_loss": -11.943931579589844, "global_step": 271738, "epoch": 1617} {"train_loss": -12.101692199707031, "global_step": 271739, "epoch": 1617} {"train_loss": -11.987300872802734, "global_step": 271740, "epoch": 1617} {"train_loss": -11.879619598388672, "global_step": 271741, "epoch": 1617} {"train_loss": -12.141702651977539, "global_step": 271742, "epoch": 1617} {"train_loss": -11.878900527954102, "global_step": 271743, "epoch": 1617} {"train_loss": -11.98613166809082, "global_step": 271744, "epoch": 1617} {"train_loss": -12.042652130126953, "global_step": 271745, "epoch": 1617} {"train_loss": -11.948165893554688, "global_step": 271746, "epoch": 1617} {"train_loss": -11.988824844360352, "global_step": 271747, "epoch": 1617} {"train_loss": -12.096301078796387, "global_step": 271748, "epoch": 1617} {"train_loss": -12.210250854492188, "global_step": 271749, "epoch": 1617} {"train_loss": -12.202932357788086, "global_step": 271750, "epoch": 1617} {"train_loss": -12.195205688476562, "global_step": 271751, "epoch": 1617} {"train_loss": -12.139677047729492, "global_step": 271752, "epoch": 1617} {"train_loss": -12.216438293457031, "global_step": 271753, "epoch": 1617} {"train_loss": -12.272531509399414, "global_step": 271754, "epoch": 1617} {"train_loss": -12.295658111572266, "global_step": 271755, "epoch": 1617} {"train_loss": -11.99631404876709, "global_step": 271756, "epoch": 1617} {"train_loss": -12.161406517028809, "global_step": 271757, "epoch": 1617} {"train_loss": -12.302789688110352, "global_step": 271758, "epoch": 1617} {"train_loss": -12.180438995361328, "global_step": 271759, "epoch": 1617} {"train_loss": -12.193023681640625, "global_step": 271760, "epoch": 1617} {"train_loss": -12.288052558898926, "global_step": 271761, "epoch": 1617} {"train_loss": -12.212491035461426, "global_step": 271762, "epoch": 1617} {"train_loss": -12.184892654418945, "global_step": 271763, "epoch": 1617} {"train_loss": -12.194788932800293, "global_step": 271764, "epoch": 1617} {"train_loss": -12.378377914428711, "global_step": 271765, "epoch": 1617} {"train_loss": -12.246804237365723, "global_step": 271766, "epoch": 1617} {"train_loss": -12.20085620880127, "global_step": 271767, "epoch": 1617} {"train_loss": -12.00714111328125, "global_step": 271768, "epoch": 1617} {"train_loss": -12.161420822143555, "global_step": 271769, "epoch": 1617} {"train_loss": -12.141172409057617, "global_step": 271770, "epoch": 1617} {"train_loss": -12.40264892578125, "global_step": 271771, "epoch": 1617} {"train_loss": -12.188333511352539, "global_step": 271772, "epoch": 1617} {"train_loss": -12.126256942749023, "global_step": 271773, "epoch": 1617} {"train_loss": -12.088980674743652, "global_step": 271774, "epoch": 1617} {"train_loss": -12.21220588684082, "global_step": 271775, "epoch": 1617} {"train_loss": -12.33891487121582, "global_step": 271776, "epoch": 1617} {"train_loss": -12.247520446777344, "global_step": 271777, "epoch": 1617} {"train_loss": -12.184394836425781, "global_step": 271778, "epoch": 1617} {"train_loss": -12.172540664672852, "global_step": 271779, "epoch": 1617} {"train_loss": -12.098668098449707, "global_step": 271780, "epoch": 1617} {"train_loss": -11.723489761352539, "global_step": 271781, "epoch": 1617} {"train_loss": -12.044775009155273, "global_step": 271782, "epoch": 1617} {"train_loss": -11.758872032165527, "global_step": 271783, "epoch": 1617} {"train_loss": -11.64550495147705, "global_step": 271784, "epoch": 1617} {"train_loss": -11.746175765991211, "global_step": 271785, "epoch": 1617} {"train_loss": -11.164665222167969, "global_step": 271786, "epoch": 1617} {"train_loss": -11.825834274291992, "global_step": 271787, "epoch": 1617} {"train_loss": -11.735109329223633, "global_step": 271788, "epoch": 1617} {"train_loss": -12.16395378112793, "global_step": 271789, "epoch": 1617} {"train_loss": -11.608935356140137, "global_step": 271790, "epoch": 1617} {"train_loss": -11.840566635131836, "global_step": 271791, "epoch": 1617} {"train_loss": -11.825170516967773, "global_step": 271792, "epoch": 1617} {"train_loss": -11.770764350891113, "global_step": 271793, "epoch": 1617} {"train_loss": -11.803285598754883, "global_step": 271794, "epoch": 1617} {"train_loss": -11.722549438476562, "global_step": 271795, "epoch": 1617} {"train_loss": -11.917362213134766, "global_step": 271796, "epoch": 1617} {"train_loss": -11.772584915161133, "global_step": 271797, "epoch": 1617} {"train_loss": -11.621805191040039, "global_step": 271798, "epoch": 1617} {"train_loss": -11.822564125061035, "global_step": 271799, "epoch": 1617} {"train_loss": -12.016700744628906, "global_step": 271800, "epoch": 1617} {"train_loss": -11.680329322814941, "global_step": 271801, "epoch": 1617} {"train_loss": -10.968141555786133, "global_step": 271802, "epoch": 1617} {"train_loss": -11.411663055419922, "global_step": 271803, "epoch": 1617} {"train_loss": -10.998180389404297, "global_step": 271804, "epoch": 1617} {"train_loss": -9.122586250305176, "global_step": 271805, "epoch": 1617} {"train_loss": -10.908631324768066, "global_step": 271806, "epoch": 1617} {"train_loss": -11.437726974487305, "global_step": 271807, "epoch": 1617} {"train_loss": -11.19710922241211, "global_step": 271808, "epoch": 1617} {"train_loss": -11.367331504821777, "global_step": 271809, "epoch": 1617} {"train_loss": -11.581124305725098, "global_step": 271810, "epoch": 1617} {"train_loss": -11.708984375, "global_step": 271811, "epoch": 1617} {"train_loss": -11.709207534790039, "global_step": 271812, "epoch": 1617} {"train_loss": -11.623420715332031, "global_step": 271813, "epoch": 1617} {"train_loss": -11.506208419799805, "global_step": 271814, "epoch": 1617} {"train_loss": -11.571707725524902, "global_step": 271815, "epoch": 1617} {"train_loss": -12.042356491088867, "global_step": 271816, "epoch": 1617} {"train_loss": -11.621278762817383, "global_step": 271817, "epoch": 1617} {"train_loss": -11.83666706085205, "global_step": 271818, "epoch": 1617} {"train_loss": -12.18651008605957, "global_step": 271819, "epoch": 1617} {"train_loss": -11.920921325683594, "global_step": 271820, "epoch": 1617} {"train_loss": -11.833062171936035, "global_step": 271821, "epoch": 1617} {"train_loss": -11.89944839477539, "global_step": 271822, "epoch": 1617} {"train_loss": -11.22150939419156, "global_step": 271823, "epoch": 1617, "val_loss": 271628.375} {"train_loss": -11.77836799621582, "global_step": 271824, "epoch": 1618} {"train_loss": -11.820201873779297, "global_step": 271825, "epoch": 1618} {"train_loss": -11.568643569946289, "global_step": 271826, "epoch": 1618} {"train_loss": -11.725648880004883, "global_step": 271827, "epoch": 1618} {"train_loss": -11.902681350708008, "global_step": 271828, "epoch": 1618} {"train_loss": -11.496451377868652, "global_step": 271829, "epoch": 1618} {"train_loss": -11.623897552490234, "global_step": 271830, "epoch": 1618} {"train_loss": -11.499744415283203, "global_step": 271831, "epoch": 1618} {"train_loss": -11.740400314331055, "global_step": 271832, "epoch": 1618} {"train_loss": -11.498392105102539, "global_step": 271833, "epoch": 1618} {"train_loss": -11.903493881225586, "global_step": 271834, "epoch": 1618} {"train_loss": -10.909807205200195, "global_step": 271835, "epoch": 1618} {"train_loss": -11.663137435913086, "global_step": 271836, "epoch": 1618} {"train_loss": -11.285032272338867, "global_step": 271837, "epoch": 1618} {"train_loss": -11.529142379760742, "global_step": 271838, "epoch": 1618} {"train_loss": -10.065154075622559, "global_step": 271839, "epoch": 1618} {"train_loss": -11.484840393066406, "global_step": 271840, "epoch": 1618} {"train_loss": -10.474123001098633, "global_step": 271841, "epoch": 1618} {"train_loss": -11.339588165283203, "global_step": 271842, "epoch": 1618} {"train_loss": -9.90882396697998, "global_step": 271843, "epoch": 1618} {"train_loss": -11.562047004699707, "global_step": 271844, "epoch": 1618} {"train_loss": -10.293922424316406, "global_step": 271845, "epoch": 1618} {"train_loss": -10.787351608276367, "global_step": 271846, "epoch": 1618} {"train_loss": -10.280452728271484, "global_step": 271847, "epoch": 1618} {"train_loss": -10.316062927246094, "global_step": 271848, "epoch": 1618} {"train_loss": -10.456986427307129, "global_step": 271849, "epoch": 1618} {"train_loss": -11.02290153503418, "global_step": 271850, "epoch": 1618} {"train_loss": -10.250231742858887, "global_step": 271851, "epoch": 1618} {"train_loss": -10.962528228759766, "global_step": 271852, "epoch": 1618} {"train_loss": -11.342107772827148, "global_step": 271853, "epoch": 1618} {"train_loss": -11.043341636657715, "global_step": 271854, "epoch": 1618} {"train_loss": -11.531514167785645, "global_step": 271855, "epoch": 1618} {"train_loss": -11.077047348022461, "global_step": 271856, "epoch": 1618} {"train_loss": -11.728591918945312, "global_step": 271857, "epoch": 1618} {"train_loss": -11.219152450561523, "global_step": 271858, "epoch": 1618} {"train_loss": -11.600433349609375, "global_step": 271859, "epoch": 1618} {"train_loss": -11.190937995910645, "global_step": 271860, "epoch": 1618} {"train_loss": -11.660737037658691, "global_step": 271861, "epoch": 1618} {"train_loss": -11.006604194641113, "global_step": 271862, "epoch": 1618} {"train_loss": -11.804144859313965, "global_step": 271863, "epoch": 1618} {"train_loss": -11.785337448120117, "global_step": 271864, "epoch": 1618} {"train_loss": -11.908195495605469, "global_step": 271865, "epoch": 1618} {"train_loss": -11.689735412597656, "global_step": 271866, "epoch": 1618} {"train_loss": -11.818471908569336, "global_step": 271867, "epoch": 1618} {"train_loss": -11.789770126342773, "global_step": 271868, "epoch": 1618} {"train_loss": -11.809255599975586, "global_step": 271869, "epoch": 1618} {"train_loss": -11.915250778198242, "global_step": 271870, "epoch": 1618} {"train_loss": -11.709627151489258, "global_step": 271871, "epoch": 1618} {"train_loss": -11.642431259155273, "global_step": 271872, "epoch": 1618} {"train_loss": -11.696123123168945, "global_step": 271873, "epoch": 1618} {"train_loss": -11.811936378479004, "global_step": 271874, "epoch": 1618} {"train_loss": -11.69332218170166, "global_step": 271875, "epoch": 1618} {"train_loss": -11.865774154663086, "global_step": 271876, "epoch": 1618} {"train_loss": -11.784059524536133, "global_step": 271877, "epoch": 1618} {"train_loss": -12.068073272705078, "global_step": 271878, "epoch": 1618} {"train_loss": -11.946216583251953, "global_step": 271879, "epoch": 1618} {"train_loss": -11.892080307006836, "global_step": 271880, "epoch": 1618} {"train_loss": -12.151322364807129, "global_step": 271881, "epoch": 1618} {"train_loss": -11.798639297485352, "global_step": 271882, "epoch": 1618} {"train_loss": -12.128718376159668, "global_step": 271883, "epoch": 1618} {"train_loss": -11.8382568359375, "global_step": 271884, "epoch": 1618} {"train_loss": -11.983577728271484, "global_step": 271885, "epoch": 1618} {"train_loss": -12.144613265991211, "global_step": 271886, "epoch": 1618} {"train_loss": -12.011032104492188, "global_step": 271887, "epoch": 1618} {"train_loss": -12.095046997070312, "global_step": 271888, "epoch": 1618} {"train_loss": -12.094615936279297, "global_step": 271889, "epoch": 1618} {"train_loss": -12.275575637817383, "global_step": 271890, "epoch": 1618} {"train_loss": -12.161134719848633, "global_step": 271891, "epoch": 1618} {"train_loss": -12.20870590209961, "global_step": 271892, "epoch": 1618} {"train_loss": -12.209957122802734, "global_step": 271893, "epoch": 1618} {"train_loss": -12.082242012023926, "global_step": 271894, "epoch": 1618} {"train_loss": -11.993181228637695, "global_step": 271895, "epoch": 1618} {"train_loss": -12.262425422668457, "global_step": 271896, "epoch": 1618} {"train_loss": -12.191999435424805, "global_step": 271897, "epoch": 1618} {"train_loss": -12.086395263671875, "global_step": 271898, "epoch": 1618} {"train_loss": -12.22195816040039, "global_step": 271899, "epoch": 1618} {"train_loss": -11.825550079345703, "global_step": 271900, "epoch": 1618} {"train_loss": -12.285877227783203, "global_step": 271901, "epoch": 1618} {"train_loss": -12.239526748657227, "global_step": 271902, "epoch": 1618} {"train_loss": -12.120098114013672, "global_step": 271903, "epoch": 1618} {"train_loss": -12.27779769897461, "global_step": 271904, "epoch": 1618} {"train_loss": -12.249593734741211, "global_step": 271905, "epoch": 1618} {"train_loss": -12.33513069152832, "global_step": 271906, "epoch": 1618} {"train_loss": -12.317163467407227, "global_step": 271907, "epoch": 1618} {"train_loss": -12.16171646118164, "global_step": 271908, "epoch": 1618} {"train_loss": -12.135032653808594, "global_step": 271909, "epoch": 1618} {"train_loss": -12.251142501831055, "global_step": 271910, "epoch": 1618} {"train_loss": -12.445524215698242, "global_step": 271911, "epoch": 1618} {"train_loss": -12.383955955505371, "global_step": 271912, "epoch": 1618} {"train_loss": -11.962303161621094, "global_step": 271913, "epoch": 1618} {"train_loss": -12.383526802062988, "global_step": 271914, "epoch": 1618} {"train_loss": -12.199636459350586, "global_step": 271915, "epoch": 1618} {"train_loss": -12.227372169494629, "global_step": 271916, "epoch": 1618} {"train_loss": -12.46318244934082, "global_step": 271917, "epoch": 1618} {"train_loss": -12.411127090454102, "global_step": 271918, "epoch": 1618} {"train_loss": -12.416383743286133, "global_step": 271919, "epoch": 1618} {"train_loss": -12.268655776977539, "global_step": 271920, "epoch": 1618} {"train_loss": -12.426124572753906, "global_step": 271921, "epoch": 1618} {"train_loss": -11.984402656555176, "global_step": 271922, "epoch": 1618} {"train_loss": -10.860011100769043, "global_step": 271923, "epoch": 1618} {"train_loss": -11.472599983215332, "global_step": 271924, "epoch": 1618} {"train_loss": -11.74506950378418, "global_step": 271925, "epoch": 1618} {"train_loss": -10.538476943969727, "global_step": 271926, "epoch": 1618} {"train_loss": -11.050176620483398, "global_step": 271927, "epoch": 1618} {"train_loss": -11.610038757324219, "global_step": 271928, "epoch": 1618} {"train_loss": -12.103862762451172, "global_step": 271929, "epoch": 1618} {"train_loss": -11.262207984924316, "global_step": 271930, "epoch": 1618} {"train_loss": -11.487313270568848, "global_step": 271931, "epoch": 1618} {"train_loss": -11.315958976745605, "global_step": 271932, "epoch": 1618} {"train_loss": -11.805339813232422, "global_step": 271933, "epoch": 1618} {"train_loss": -10.78059196472168, "global_step": 271934, "epoch": 1618} {"train_loss": -11.162955284118652, "global_step": 271935, "epoch": 1618} {"train_loss": -11.127021789550781, "global_step": 271936, "epoch": 1618} {"train_loss": -11.849533081054688, "global_step": 271937, "epoch": 1618} {"train_loss": -10.926752090454102, "global_step": 271938, "epoch": 1618} {"train_loss": -11.213640213012695, "global_step": 271939, "epoch": 1618} {"train_loss": -12.081535339355469, "global_step": 271940, "epoch": 1618} {"train_loss": -11.984882354736328, "global_step": 271941, "epoch": 1618} {"train_loss": -12.003776550292969, "global_step": 271942, "epoch": 1618} {"train_loss": -11.85993766784668, "global_step": 271943, "epoch": 1618} {"train_loss": -12.047752380371094, "global_step": 271944, "epoch": 1618} {"train_loss": -11.837718963623047, "global_step": 271945, "epoch": 1618} {"train_loss": -11.800069808959961, "global_step": 271946, "epoch": 1618} {"train_loss": -11.888025283813477, "global_step": 271947, "epoch": 1618} {"train_loss": -12.051053047180176, "global_step": 271948, "epoch": 1618} {"train_loss": -11.519241333007812, "global_step": 271949, "epoch": 1618} {"train_loss": -11.078041076660156, "global_step": 271950, "epoch": 1618} {"train_loss": -11.812793731689453, "global_step": 271951, "epoch": 1618} {"train_loss": -10.583203315734863, "global_step": 271952, "epoch": 1618} {"train_loss": -11.609600067138672, "global_step": 271953, "epoch": 1618} {"train_loss": -11.42772102355957, "global_step": 271954, "epoch": 1618} {"train_loss": -11.384309768676758, "global_step": 271955, "epoch": 1618} {"train_loss": -11.555366516113281, "global_step": 271956, "epoch": 1618} {"train_loss": -11.566699981689453, "global_step": 271957, "epoch": 1618} {"train_loss": -11.552140235900879, "global_step": 271958, "epoch": 1618} {"train_loss": -12.006331443786621, "global_step": 271959, "epoch": 1618} {"train_loss": -11.731773376464844, "global_step": 271960, "epoch": 1618} {"train_loss": -11.92034912109375, "global_step": 271961, "epoch": 1618} {"train_loss": -11.903359413146973, "global_step": 271962, "epoch": 1618} {"train_loss": -12.090123176574707, "global_step": 271963, "epoch": 1618} {"train_loss": -11.95078182220459, "global_step": 271964, "epoch": 1618} {"train_loss": -12.100963592529297, "global_step": 271965, "epoch": 1618} {"train_loss": -11.689449310302734, "global_step": 271966, "epoch": 1618} {"train_loss": -12.047775268554688, "global_step": 271967, "epoch": 1618} {"train_loss": -11.739880561828613, "global_step": 271968, "epoch": 1618} {"train_loss": -11.350715637207031, "global_step": 271969, "epoch": 1618} {"train_loss": -11.427139282226562, "global_step": 271970, "epoch": 1618} {"train_loss": -11.857234954833984, "global_step": 271971, "epoch": 1618} {"train_loss": -11.24830436706543, "global_step": 271972, "epoch": 1618} {"train_loss": -11.738969802856445, "global_step": 271973, "epoch": 1618} {"train_loss": -11.466337203979492, "global_step": 271974, "epoch": 1618} {"train_loss": -10.475116729736328, "global_step": 271975, "epoch": 1618} {"train_loss": -11.881739616394043, "global_step": 271976, "epoch": 1618} {"train_loss": -11.803184509277344, "global_step": 271977, "epoch": 1618} {"train_loss": -11.428504943847656, "global_step": 271978, "epoch": 1618} {"train_loss": -11.59636116027832, "global_step": 271979, "epoch": 1618} {"train_loss": -12.090391159057617, "global_step": 271980, "epoch": 1618} {"train_loss": -11.912979125976562, "global_step": 271981, "epoch": 1618} {"train_loss": -12.052986145019531, "global_step": 271982, "epoch": 1618} {"train_loss": -12.105875015258789, "global_step": 271983, "epoch": 1618} {"train_loss": -11.781699180603027, "global_step": 271984, "epoch": 1618} {"train_loss": -12.054637908935547, "global_step": 271985, "epoch": 1618} {"train_loss": -12.193496704101562, "global_step": 271986, "epoch": 1618} {"train_loss": -11.817327499389648, "global_step": 271987, "epoch": 1618} {"train_loss": -11.96872329711914, "global_step": 271988, "epoch": 1618} {"train_loss": -12.116018295288086, "global_step": 271989, "epoch": 1618} {"train_loss": -11.954133033752441, "global_step": 271990, "epoch": 1618} {"train_loss": -11.691605715524583, "global_step": 271991, "epoch": 1618, "val_loss": 272077.3125} {"train_loss": -11.714954376220703, "global_step": 271992, "epoch": 1619} {"train_loss": -11.880111694335938, "global_step": 271993, "epoch": 1619} {"train_loss": -11.692312240600586, "global_step": 271994, "epoch": 1619} {"train_loss": -11.782381057739258, "global_step": 271995, "epoch": 1619} {"train_loss": -11.591110229492188, "global_step": 271996, "epoch": 1619} {"train_loss": -11.648685455322266, "global_step": 271997, "epoch": 1619} {"train_loss": -11.779870986938477, "global_step": 271998, "epoch": 1619} {"train_loss": -11.216842651367188, "global_step": 271999, "epoch": 1619} {"train_loss": -11.58266544342041, "global_step": 272000, "epoch": 1619} {"train_loss": -11.58128547668457, "global_step": 272001, "epoch": 1619} {"train_loss": -11.8799467086792, "global_step": 272002, "epoch": 1619} {"train_loss": -11.741996765136719, "global_step": 272003, "epoch": 1619} {"train_loss": -11.564340591430664, "global_step": 272004, "epoch": 1619} {"train_loss": -12.14356803894043, "global_step": 272005, "epoch": 1619} {"train_loss": -11.593585968017578, "global_step": 272006, "epoch": 1619} {"train_loss": -11.618766784667969, "global_step": 272007, "epoch": 1619} {"train_loss": -12.171934127807617, "global_step": 272008, "epoch": 1619} {"train_loss": -11.544291496276855, "global_step": 272009, "epoch": 1619} {"train_loss": -11.880755424499512, "global_step": 272010, "epoch": 1619} {"train_loss": -11.837032318115234, "global_step": 272011, "epoch": 1619} {"train_loss": -11.317974090576172, "global_step": 272012, "epoch": 1619} {"train_loss": -11.837539672851562, "global_step": 272013, "epoch": 1619} {"train_loss": -11.499162673950195, "global_step": 272014, "epoch": 1619} {"train_loss": -11.842267036437988, "global_step": 272015, "epoch": 1619} {"train_loss": -11.96509075164795, "global_step": 272016, "epoch": 1619} {"train_loss": -11.649534225463867, "global_step": 272017, "epoch": 1619} {"train_loss": -11.915290832519531, "global_step": 272018, "epoch": 1619} {"train_loss": -11.825799942016602, "global_step": 272019, "epoch": 1619} {"train_loss": -11.864049911499023, "global_step": 272020, "epoch": 1619} {"train_loss": -12.045927047729492, "global_step": 272021, "epoch": 1619} {"train_loss": -11.518831253051758, "global_step": 272022, "epoch": 1619} {"train_loss": -11.873886108398438, "global_step": 272023, "epoch": 1619} {"train_loss": -11.346271514892578, "global_step": 272024, "epoch": 1619} {"train_loss": -11.406316757202148, "global_step": 272025, "epoch": 1619} {"train_loss": -12.06550407409668, "global_step": 272026, "epoch": 1619} {"train_loss": -11.065439224243164, "global_step": 272027, "epoch": 1619} {"train_loss": -11.492005348205566, "global_step": 272028, "epoch": 1619} {"train_loss": -11.973235130310059, "global_step": 272029, "epoch": 1619} {"train_loss": -10.89602279663086, "global_step": 272030, "epoch": 1619} {"train_loss": -11.38965892791748, "global_step": 272031, "epoch": 1619} {"train_loss": -11.769217491149902, "global_step": 272032, "epoch": 1619} {"train_loss": -10.522798538208008, "global_step": 272033, "epoch": 1619} {"train_loss": -12.067399978637695, "global_step": 272034, "epoch": 1619} {"train_loss": -10.508453369140625, "global_step": 272035, "epoch": 1619} {"train_loss": -11.005062103271484, "global_step": 272036, "epoch": 1619} {"train_loss": -11.643401145935059, "global_step": 272037, "epoch": 1619} {"train_loss": -11.220829010009766, "global_step": 272038, "epoch": 1619} {"train_loss": -11.437702178955078, "global_step": 272039, "epoch": 1619} {"train_loss": -10.978588104248047, "global_step": 272040, "epoch": 1619} {"train_loss": -11.566483497619629, "global_step": 272041, "epoch": 1619} {"train_loss": -11.083577156066895, "global_step": 272042, "epoch": 1619} {"train_loss": -11.161767959594727, "global_step": 272043, "epoch": 1619} {"train_loss": -11.407323837280273, "global_step": 272044, "epoch": 1619} {"train_loss": -11.35068130493164, "global_step": 272045, "epoch": 1619} {"train_loss": -10.975564002990723, "global_step": 272046, "epoch": 1619} {"train_loss": -11.710561752319336, "global_step": 272047, "epoch": 1619} {"train_loss": -9.906213760375977, "global_step": 272048, "epoch": 1619} {"train_loss": -11.211893081665039, "global_step": 272049, "epoch": 1619} {"train_loss": -11.192122459411621, "global_step": 272050, "epoch": 1619} {"train_loss": -10.648494720458984, "global_step": 272051, "epoch": 1619} {"train_loss": -11.823629379272461, "global_step": 272052, "epoch": 1619} {"train_loss": -11.175493240356445, "global_step": 272053, "epoch": 1619} {"train_loss": -11.574447631835938, "global_step": 272054, "epoch": 1619} {"train_loss": -11.706788063049316, "global_step": 272055, "epoch": 1619} {"train_loss": -11.25210189819336, "global_step": 272056, "epoch": 1619} {"train_loss": -11.511222839355469, "global_step": 272057, "epoch": 1619} {"train_loss": -11.693802833557129, "global_step": 272058, "epoch": 1619} {"train_loss": -11.768467903137207, "global_step": 272059, "epoch": 1619} {"train_loss": -11.367984771728516, "global_step": 272060, "epoch": 1619} {"train_loss": -10.879359245300293, "global_step": 272061, "epoch": 1619} {"train_loss": -11.912468910217285, "global_step": 272062, "epoch": 1619} {"train_loss": -11.544381141662598, "global_step": 272063, "epoch": 1619} {"train_loss": -11.764894485473633, "global_step": 272064, "epoch": 1619} {"train_loss": -11.933368682861328, "global_step": 272065, "epoch": 1619} {"train_loss": -11.806201934814453, "global_step": 272066, "epoch": 1619} {"train_loss": -11.773573875427246, "global_step": 272067, "epoch": 1619} {"train_loss": -11.75621509552002, "global_step": 272068, "epoch": 1619} {"train_loss": -11.825664520263672, "global_step": 272069, "epoch": 1619} {"train_loss": -11.853845596313477, "global_step": 272070, "epoch": 1619} {"train_loss": -12.015308380126953, "global_step": 272071, "epoch": 1619} {"train_loss": -12.150270462036133, "global_step": 272072, "epoch": 1619} {"train_loss": -11.952491760253906, "global_step": 272073, "epoch": 1619} {"train_loss": -12.077363014221191, "global_step": 272074, "epoch": 1619} {"train_loss": -12.099705696105957, "global_step": 272075, "epoch": 1619} {"train_loss": -11.981050491333008, "global_step": 272076, "epoch": 1619} {"train_loss": -12.210535049438477, "global_step": 272077, "epoch": 1619} {"train_loss": -11.934005737304688, "global_step": 272078, "epoch": 1619} {"train_loss": -12.03115463256836, "global_step": 272079, "epoch": 1619} {"train_loss": -12.10159683227539, "global_step": 272080, "epoch": 1619} {"train_loss": -12.105711936950684, "global_step": 272081, "epoch": 1619} {"train_loss": -11.887398719787598, "global_step": 272082, "epoch": 1619} {"train_loss": -11.857633590698242, "global_step": 272083, "epoch": 1619} {"train_loss": -12.041196823120117, "global_step": 272084, "epoch": 1619} {"train_loss": -12.18006706237793, "global_step": 272085, "epoch": 1619} {"train_loss": -11.984586715698242, "global_step": 272086, "epoch": 1619} {"train_loss": -11.954712867736816, "global_step": 272087, "epoch": 1619} {"train_loss": -11.889939308166504, "global_step": 272088, "epoch": 1619} {"train_loss": -12.093172073364258, "global_step": 272089, "epoch": 1619} {"train_loss": -11.866414070129395, "global_step": 272090, "epoch": 1619} {"train_loss": -12.353822708129883, "global_step": 272091, "epoch": 1619} {"train_loss": -11.79829216003418, "global_step": 272092, "epoch": 1619} {"train_loss": -11.61288833618164, "global_step": 272093, "epoch": 1619} {"train_loss": -11.961368560791016, "global_step": 272094, "epoch": 1619} {"train_loss": -11.226104736328125, "global_step": 272095, "epoch": 1619} {"train_loss": -11.82555866241455, "global_step": 272096, "epoch": 1619} {"train_loss": -11.513006210327148, "global_step": 272097, "epoch": 1619} {"train_loss": -11.421113967895508, "global_step": 272098, "epoch": 1619} {"train_loss": -11.651294708251953, "global_step": 272099, "epoch": 1619} {"train_loss": -11.710407257080078, "global_step": 272100, "epoch": 1619} {"train_loss": -11.776002883911133, "global_step": 272101, "epoch": 1619} {"train_loss": -11.454825401306152, "global_step": 272102, "epoch": 1619} {"train_loss": -10.828730583190918, "global_step": 272103, "epoch": 1619} {"train_loss": -10.362085342407227, "global_step": 272104, "epoch": 1619} {"train_loss": -11.544960021972656, "global_step": 272105, "epoch": 1619} {"train_loss": -11.00680923461914, "global_step": 272106, "epoch": 1619} {"train_loss": -11.820755004882812, "global_step": 272107, "epoch": 1619} {"train_loss": -11.188358306884766, "global_step": 272108, "epoch": 1619} {"train_loss": -11.624954223632812, "global_step": 272109, "epoch": 1619} {"train_loss": -10.911139488220215, "global_step": 272110, "epoch": 1619} {"train_loss": -11.377429962158203, "global_step": 272111, "epoch": 1619} {"train_loss": -11.845649719238281, "global_step": 272112, "epoch": 1619} {"train_loss": -10.967082977294922, "global_step": 272113, "epoch": 1619} {"train_loss": -11.617486953735352, "global_step": 272114, "epoch": 1619} {"train_loss": -10.365642547607422, "global_step": 272115, "epoch": 1619} {"train_loss": -11.273113250732422, "global_step": 272116, "epoch": 1619} {"train_loss": -10.926342010498047, "global_step": 272117, "epoch": 1619} {"train_loss": -10.984389305114746, "global_step": 272118, "epoch": 1619} {"train_loss": -11.452072143554688, "global_step": 272119, "epoch": 1619} {"train_loss": -11.288451194763184, "global_step": 272120, "epoch": 1619} {"train_loss": -11.60944938659668, "global_step": 272121, "epoch": 1619} {"train_loss": -11.154481887817383, "global_step": 272122, "epoch": 1619} {"train_loss": -11.533632278442383, "global_step": 272123, "epoch": 1619} {"train_loss": -10.965099334716797, "global_step": 272124, "epoch": 1619} {"train_loss": -11.819706916809082, "global_step": 272125, "epoch": 1619} {"train_loss": -11.61043930053711, "global_step": 272126, "epoch": 1619} {"train_loss": -11.70604133605957, "global_step": 272127, "epoch": 1619} {"train_loss": -11.686026573181152, "global_step": 272128, "epoch": 1619} {"train_loss": -12.00729751586914, "global_step": 272129, "epoch": 1619} {"train_loss": -11.648969650268555, "global_step": 272130, "epoch": 1619} {"train_loss": -11.938596725463867, "global_step": 272131, "epoch": 1619} {"train_loss": -11.69025993347168, "global_step": 272132, "epoch": 1619} {"train_loss": -11.70513916015625, "global_step": 272133, "epoch": 1619} {"train_loss": -11.877467155456543, "global_step": 272134, "epoch": 1619} {"train_loss": -11.767789840698242, "global_step": 272135, "epoch": 1619} {"train_loss": -11.644309997558594, "global_step": 272136, "epoch": 1619} {"train_loss": -11.92715835571289, "global_step": 272137, "epoch": 1619} {"train_loss": -11.866811752319336, "global_step": 272138, "epoch": 1619} {"train_loss": -11.959396362304688, "global_step": 272139, "epoch": 1619} {"train_loss": -11.92372989654541, "global_step": 272140, "epoch": 1619} {"train_loss": -11.906854629516602, "global_step": 272141, "epoch": 1619} {"train_loss": -12.024539947509766, "global_step": 272142, "epoch": 1619} {"train_loss": -12.109460830688477, "global_step": 272143, "epoch": 1619} {"train_loss": -12.017526626586914, "global_step": 272144, "epoch": 1619} {"train_loss": -11.868207931518555, "global_step": 272145, "epoch": 1619} {"train_loss": -12.05741024017334, "global_step": 272146, "epoch": 1619} {"train_loss": -12.076066970825195, "global_step": 272147, "epoch": 1619} {"train_loss": -12.11707878112793, "global_step": 272148, "epoch": 1619} {"train_loss": -11.876779556274414, "global_step": 272149, "epoch": 1619} {"train_loss": -12.009212493896484, "global_step": 272150, "epoch": 1619} {"train_loss": -12.300348281860352, "global_step": 272151, "epoch": 1619} {"train_loss": -12.16024398803711, "global_step": 272152, "epoch": 1619} {"train_loss": -12.192079544067383, "global_step": 272153, "epoch": 1619} {"train_loss": -12.0042724609375, "global_step": 272154, "epoch": 1619} {"train_loss": -12.146146774291992, "global_step": 272155, "epoch": 1619} {"train_loss": -12.220735549926758, "global_step": 272156, "epoch": 1619} {"train_loss": -12.158172607421875, "global_step": 272157, "epoch": 1619} {"train_loss": -12.134340286254883, "global_step": 272158, "epoch": 1619} {"train_loss": -11.649849238849821, "global_step": 272159, "epoch": 1619, "val_loss": 276811.34375} {"train_loss": -12.090312957763672, "global_step": 272160, "epoch": 1620} {"train_loss": -11.873190879821777, "global_step": 272161, "epoch": 1620} {"train_loss": -12.129766464233398, "global_step": 272162, "epoch": 1620} {"train_loss": -11.514593124389648, "global_step": 272163, "epoch": 1620} {"train_loss": -11.777055740356445, "global_step": 272164, "epoch": 1620} {"train_loss": -12.0509672164917, "global_step": 272165, "epoch": 1620} {"train_loss": -11.897205352783203, "global_step": 272166, "epoch": 1620} {"train_loss": -12.068570137023926, "global_step": 272167, "epoch": 1620} {"train_loss": -11.90072250366211, "global_step": 272168, "epoch": 1620} {"train_loss": -12.040374755859375, "global_step": 272169, "epoch": 1620} {"train_loss": -11.986898422241211, "global_step": 272170, "epoch": 1620} {"train_loss": -12.04759693145752, "global_step": 272171, "epoch": 1620} {"train_loss": -12.098400115966797, "global_step": 272172, "epoch": 1620} {"train_loss": -12.148361206054688, "global_step": 272173, "epoch": 1620} {"train_loss": -11.743172645568848, "global_step": 272174, "epoch": 1620} {"train_loss": -11.917827606201172, "global_step": 272175, "epoch": 1620} {"train_loss": -11.979771614074707, "global_step": 272176, "epoch": 1620} {"train_loss": -11.912660598754883, "global_step": 272177, "epoch": 1620} {"train_loss": -11.823991775512695, "global_step": 272178, "epoch": 1620} {"train_loss": -11.446981430053711, "global_step": 272179, "epoch": 1620} {"train_loss": -11.99925422668457, "global_step": 272180, "epoch": 1620} {"train_loss": -11.710697174072266, "global_step": 272181, "epoch": 1620} {"train_loss": -11.271018981933594, "global_step": 272182, "epoch": 1620} {"train_loss": -11.701131820678711, "global_step": 272183, "epoch": 1620} {"train_loss": -10.525444030761719, "global_step": 272184, "epoch": 1620} {"train_loss": -11.236143112182617, "global_step": 272185, "epoch": 1620} {"train_loss": -11.26976203918457, "global_step": 272186, "epoch": 1620} {"train_loss": -10.850358963012695, "global_step": 272187, "epoch": 1620} {"train_loss": -10.8446044921875, "global_step": 272188, "epoch": 1620} {"train_loss": -10.307857513427734, "global_step": 272189, "epoch": 1620} {"train_loss": -10.877218246459961, "global_step": 272190, "epoch": 1620} {"train_loss": -10.039291381835938, "global_step": 272191, "epoch": 1620} {"train_loss": -11.926288604736328, "global_step": 272192, "epoch": 1620} {"train_loss": -10.57412338256836, "global_step": 272193, "epoch": 1620} {"train_loss": -10.865825653076172, "global_step": 272194, "epoch": 1620} {"train_loss": -10.916708946228027, "global_step": 272195, "epoch": 1620} {"train_loss": -11.129667282104492, "global_step": 272196, "epoch": 1620} {"train_loss": -11.643832206726074, "global_step": 272197, "epoch": 1620} {"train_loss": -11.285650253295898, "global_step": 272198, "epoch": 1620} {"train_loss": -11.753156661987305, "global_step": 272199, "epoch": 1620} {"train_loss": -11.212944030761719, "global_step": 272200, "epoch": 1620} {"train_loss": -11.767133712768555, "global_step": 272201, "epoch": 1620} {"train_loss": -11.505928993225098, "global_step": 272202, "epoch": 1620} {"train_loss": -11.322837829589844, "global_step": 272203, "epoch": 1620} {"train_loss": -11.395055770874023, "global_step": 272204, "epoch": 1620} {"train_loss": -11.200638771057129, "global_step": 272205, "epoch": 1620} {"train_loss": -11.686635971069336, "global_step": 272206, "epoch": 1620} {"train_loss": -11.07368278503418, "global_step": 272207, "epoch": 1620} {"train_loss": -11.472813606262207, "global_step": 272208, "epoch": 1620} {"train_loss": -11.354158401489258, "global_step": 272209, "epoch": 1620} {"train_loss": -11.365863800048828, "global_step": 272210, "epoch": 1620} {"train_loss": -11.49652099609375, "global_step": 272211, "epoch": 1620} {"train_loss": -11.319132804870605, "global_step": 272212, "epoch": 1620} {"train_loss": -11.404040336608887, "global_step": 272213, "epoch": 1620} {"train_loss": -11.558801651000977, "global_step": 272214, "epoch": 1620} {"train_loss": -11.251117706298828, "global_step": 272215, "epoch": 1620} {"train_loss": -11.846410751342773, "global_step": 272216, "epoch": 1620} {"train_loss": -11.683477401733398, "global_step": 272217, "epoch": 1620} {"train_loss": -11.284828186035156, "global_step": 272218, "epoch": 1620} {"train_loss": -11.860260009765625, "global_step": 272219, "epoch": 1620} {"train_loss": -11.533226013183594, "global_step": 272220, "epoch": 1620} {"train_loss": -11.857986450195312, "global_step": 272221, "epoch": 1620} {"train_loss": -10.966611862182617, "global_step": 272222, "epoch": 1620} {"train_loss": -11.890822410583496, "global_step": 272223, "epoch": 1620} {"train_loss": -11.856388092041016, "global_step": 272224, "epoch": 1620} {"train_loss": -11.420005798339844, "global_step": 272225, "epoch": 1620} {"train_loss": -11.445239067077637, "global_step": 272226, "epoch": 1620} {"train_loss": -11.566205024719238, "global_step": 272227, "epoch": 1620} {"train_loss": -11.893407821655273, "global_step": 272228, "epoch": 1620} {"train_loss": -11.54809284210205, "global_step": 272229, "epoch": 1620} {"train_loss": -11.617189407348633, "global_step": 272230, "epoch": 1620} {"train_loss": -11.356887817382812, "global_step": 272231, "epoch": 1620} {"train_loss": -11.82170295715332, "global_step": 272232, "epoch": 1620} {"train_loss": -12.003188133239746, "global_step": 272233, "epoch": 1620} {"train_loss": -11.658012390136719, "global_step": 272234, "epoch": 1620} {"train_loss": -11.895589828491211, "global_step": 272235, "epoch": 1620} {"train_loss": -11.696735382080078, "global_step": 272236, "epoch": 1620} {"train_loss": -11.900273323059082, "global_step": 272237, "epoch": 1620} {"train_loss": -11.609354972839355, "global_step": 272238, "epoch": 1620} {"train_loss": -11.766641616821289, "global_step": 272239, "epoch": 1620} {"train_loss": -12.05299186706543, "global_step": 272240, "epoch": 1620} {"train_loss": -11.644874572753906, "global_step": 272241, "epoch": 1620} {"train_loss": -12.094715118408203, "global_step": 272242, "epoch": 1620} {"train_loss": -11.874410629272461, "global_step": 272243, "epoch": 1620} {"train_loss": -11.735119819641113, "global_step": 272244, "epoch": 1620} {"train_loss": -11.807323455810547, "global_step": 272245, "epoch": 1620} {"train_loss": -11.667534828186035, "global_step": 272246, "epoch": 1620} {"train_loss": -11.926401138305664, "global_step": 272247, "epoch": 1620} {"train_loss": -12.007161140441895, "global_step": 272248, "epoch": 1620} {"train_loss": -11.630388259887695, "global_step": 272249, "epoch": 1620} {"train_loss": -12.064348220825195, "global_step": 272250, "epoch": 1620} {"train_loss": -11.819253921508789, "global_step": 272251, "epoch": 1620} {"train_loss": -12.063027381896973, "global_step": 272252, "epoch": 1620} {"train_loss": -11.763410568237305, "global_step": 272253, "epoch": 1620} {"train_loss": -11.876201629638672, "global_step": 272254, "epoch": 1620} {"train_loss": -11.909845352172852, "global_step": 272255, "epoch": 1620} {"train_loss": -12.23738956451416, "global_step": 272256, "epoch": 1620} {"train_loss": -11.741899490356445, "global_step": 272257, "epoch": 1620} {"train_loss": -11.88714599609375, "global_step": 272258, "epoch": 1620} {"train_loss": -11.963385581970215, "global_step": 272259, "epoch": 1620} {"train_loss": -12.084619522094727, "global_step": 272260, "epoch": 1620} {"train_loss": -12.175216674804688, "global_step": 272261, "epoch": 1620} {"train_loss": -11.663930892944336, "global_step": 272262, "epoch": 1620} {"train_loss": -12.039728164672852, "global_step": 272263, "epoch": 1620} {"train_loss": -12.116003036499023, "global_step": 272264, "epoch": 1620} {"train_loss": -11.880796432495117, "global_step": 272265, "epoch": 1620} {"train_loss": -11.990180969238281, "global_step": 272266, "epoch": 1620} {"train_loss": -11.78546142578125, "global_step": 272267, "epoch": 1620} {"train_loss": -11.26357650756836, "global_step": 272268, "epoch": 1620} {"train_loss": -12.195476531982422, "global_step": 272269, "epoch": 1620} {"train_loss": -11.942578315734863, "global_step": 272270, "epoch": 1620} {"train_loss": -11.452803611755371, "global_step": 272271, "epoch": 1620} {"train_loss": -11.690950393676758, "global_step": 272272, "epoch": 1620} {"train_loss": -12.241231918334961, "global_step": 272273, "epoch": 1620} {"train_loss": -11.722127914428711, "global_step": 272274, "epoch": 1620} {"train_loss": -11.489551544189453, "global_step": 272275, "epoch": 1620} {"train_loss": -12.103878021240234, "global_step": 272276, "epoch": 1620} {"train_loss": -12.026724815368652, "global_step": 272277, "epoch": 1620} {"train_loss": -11.672199249267578, "global_step": 272278, "epoch": 1620} {"train_loss": -11.270949363708496, "global_step": 272279, "epoch": 1620} {"train_loss": -12.144721984863281, "global_step": 272280, "epoch": 1620} {"train_loss": -11.600839614868164, "global_step": 272281, "epoch": 1620} {"train_loss": -12.239252090454102, "global_step": 272282, "epoch": 1620} {"train_loss": -12.038759231567383, "global_step": 272283, "epoch": 1620} {"train_loss": -11.801118850708008, "global_step": 272284, "epoch": 1620} {"train_loss": -11.950218200683594, "global_step": 272285, "epoch": 1620} {"train_loss": -12.266782760620117, "global_step": 272286, "epoch": 1620} {"train_loss": -11.795446395874023, "global_step": 272287, "epoch": 1620} {"train_loss": -11.879405975341797, "global_step": 272288, "epoch": 1620} {"train_loss": -11.935367584228516, "global_step": 272289, "epoch": 1620} {"train_loss": -11.88682746887207, "global_step": 272290, "epoch": 1620} {"train_loss": -11.974708557128906, "global_step": 272291, "epoch": 1620} {"train_loss": -12.081292152404785, "global_step": 272292, "epoch": 1620} {"train_loss": -11.952109336853027, "global_step": 272293, "epoch": 1620} {"train_loss": -11.978109359741211, "global_step": 272294, "epoch": 1620} {"train_loss": -12.301898956298828, "global_step": 272295, "epoch": 1620} {"train_loss": -12.055309295654297, "global_step": 272296, "epoch": 1620} {"train_loss": -12.141654968261719, "global_step": 272297, "epoch": 1620} {"train_loss": -12.033967018127441, "global_step": 272298, "epoch": 1620} {"train_loss": -12.226598739624023, "global_step": 272299, "epoch": 1620} {"train_loss": -11.969118118286133, "global_step": 272300, "epoch": 1620} {"train_loss": -11.938922882080078, "global_step": 272301, "epoch": 1620} {"train_loss": -11.920635223388672, "global_step": 272302, "epoch": 1620} {"train_loss": -12.254518508911133, "global_step": 272303, "epoch": 1620} {"train_loss": -11.906721115112305, "global_step": 272304, "epoch": 1620} {"train_loss": -12.003925323486328, "global_step": 272305, "epoch": 1620} {"train_loss": -12.156251907348633, "global_step": 272306, "epoch": 1620} {"train_loss": -12.259395599365234, "global_step": 272307, "epoch": 1620} {"train_loss": -11.974982261657715, "global_step": 272308, "epoch": 1620} {"train_loss": -11.53860092163086, "global_step": 272309, "epoch": 1620} {"train_loss": -11.315739631652832, "global_step": 272310, "epoch": 1620} {"train_loss": -11.960648536682129, "global_step": 272311, "epoch": 1620} {"train_loss": -12.227333068847656, "global_step": 272312, "epoch": 1620} {"train_loss": -11.857831001281738, "global_step": 272313, "epoch": 1620} {"train_loss": -11.947263717651367, "global_step": 272314, "epoch": 1620} {"train_loss": -11.61592960357666, "global_step": 272315, "epoch": 1620} {"train_loss": -11.973777770996094, "global_step": 272316, "epoch": 1620} {"train_loss": -11.509437561035156, "global_step": 272317, "epoch": 1620} {"train_loss": -12.168689727783203, "global_step": 272318, "epoch": 1620} {"train_loss": -11.693585395812988, "global_step": 272319, "epoch": 1620} {"train_loss": -11.712769508361816, "global_step": 272320, "epoch": 1620} {"train_loss": -11.841886520385742, "global_step": 272321, "epoch": 1620} {"train_loss": -11.847135543823242, "global_step": 272322, "epoch": 1620} {"train_loss": -11.727407455444336, "global_step": 272323, "epoch": 1620} {"train_loss": -12.043394088745117, "global_step": 272324, "epoch": 1620} {"train_loss": -11.664594650268555, "global_step": 272325, "epoch": 1620} {"train_loss": -12.261300086975098, "global_step": 272326, "epoch": 1620} {"train_loss": -11.737762808799744, "global_step": 272327, "epoch": 1620, "val_loss": 273106.53125, "train_action_mse_error": 3.931032419204712} {"train_loss": -11.75503921508789, "global_step": 272328, "epoch": 1621} {"train_loss": -11.75101089477539, "global_step": 272329, "epoch": 1621} {"train_loss": -12.300436019897461, "global_step": 272330, "epoch": 1621} {"train_loss": -11.917409896850586, "global_step": 272331, "epoch": 1621} {"train_loss": -11.769536972045898, "global_step": 272332, "epoch": 1621} {"train_loss": -12.023475646972656, "global_step": 272333, "epoch": 1621} {"train_loss": -11.929101943969727, "global_step": 272334, "epoch": 1621} {"train_loss": -11.61294174194336, "global_step": 272335, "epoch": 1621} {"train_loss": -12.143449783325195, "global_step": 272336, "epoch": 1621} {"train_loss": -11.56768798828125, "global_step": 272337, "epoch": 1621} {"train_loss": -11.905948638916016, "global_step": 272338, "epoch": 1621} {"train_loss": -11.747662544250488, "global_step": 272339, "epoch": 1621} {"train_loss": -11.818532943725586, "global_step": 272340, "epoch": 1621} {"train_loss": -11.468515396118164, "global_step": 272341, "epoch": 1621} {"train_loss": -11.978763580322266, "global_step": 272342, "epoch": 1621} {"train_loss": -11.42541790008545, "global_step": 272343, "epoch": 1621} {"train_loss": -11.810684204101562, "global_step": 272344, "epoch": 1621} {"train_loss": -11.911982536315918, "global_step": 272345, "epoch": 1621} {"train_loss": -11.843282699584961, "global_step": 272346, "epoch": 1621} {"train_loss": -11.667545318603516, "global_step": 272347, "epoch": 1621} {"train_loss": -11.54035472869873, "global_step": 272348, "epoch": 1621} {"train_loss": -11.079774856567383, "global_step": 272349, "epoch": 1621} {"train_loss": -11.28854751586914, "global_step": 272350, "epoch": 1621} {"train_loss": -11.65311050415039, "global_step": 272351, "epoch": 1621} {"train_loss": -11.625391006469727, "global_step": 272352, "epoch": 1621} {"train_loss": -11.7287015914917, "global_step": 272353, "epoch": 1621} {"train_loss": -11.34725570678711, "global_step": 272354, "epoch": 1621} {"train_loss": -11.163501739501953, "global_step": 272355, "epoch": 1621} {"train_loss": -11.770895004272461, "global_step": 272356, "epoch": 1621} {"train_loss": -11.852154731750488, "global_step": 272357, "epoch": 1621} {"train_loss": -10.945547103881836, "global_step": 272358, "epoch": 1621} {"train_loss": -11.484283447265625, "global_step": 272359, "epoch": 1621} {"train_loss": -11.221624374389648, "global_step": 272360, "epoch": 1621} {"train_loss": -12.075359344482422, "global_step": 272361, "epoch": 1621} {"train_loss": -11.608978271484375, "global_step": 272362, "epoch": 1621} {"train_loss": -11.691420555114746, "global_step": 272363, "epoch": 1621} {"train_loss": -11.888004302978516, "global_step": 272364, "epoch": 1621} {"train_loss": -11.933036804199219, "global_step": 272365, "epoch": 1621} {"train_loss": -11.791540145874023, "global_step": 272366, "epoch": 1621} {"train_loss": -11.820005416870117, "global_step": 272367, "epoch": 1621} {"train_loss": -11.581315994262695, "global_step": 272368, "epoch": 1621} {"train_loss": -11.569917678833008, "global_step": 272369, "epoch": 1621} {"train_loss": -11.85183334350586, "global_step": 272370, "epoch": 1621} {"train_loss": -11.79388427734375, "global_step": 272371, "epoch": 1621} {"train_loss": -11.505170822143555, "global_step": 272372, "epoch": 1621} {"train_loss": -12.000110626220703, "global_step": 272373, "epoch": 1621} {"train_loss": -11.643882751464844, "global_step": 272374, "epoch": 1621} {"train_loss": -11.528841972351074, "global_step": 272375, "epoch": 1621} {"train_loss": -11.603414535522461, "global_step": 272376, "epoch": 1621} {"train_loss": -11.928095817565918, "global_step": 272377, "epoch": 1621} {"train_loss": -12.035604476928711, "global_step": 272378, "epoch": 1621} {"train_loss": -11.503515243530273, "global_step": 272379, "epoch": 1621} {"train_loss": -12.000261306762695, "global_step": 272380, "epoch": 1621} {"train_loss": -11.57809066772461, "global_step": 272381, "epoch": 1621} {"train_loss": -11.390226364135742, "global_step": 272382, "epoch": 1621} {"train_loss": -12.049382209777832, "global_step": 272383, "epoch": 1621} {"train_loss": -11.917787551879883, "global_step": 272384, "epoch": 1621} {"train_loss": -11.604394912719727, "global_step": 272385, "epoch": 1621} {"train_loss": -11.85302734375, "global_step": 272386, "epoch": 1621} {"train_loss": -11.98910140991211, "global_step": 272387, "epoch": 1621} {"train_loss": -11.306632041931152, "global_step": 272388, "epoch": 1621} {"train_loss": -11.476043701171875, "global_step": 272389, "epoch": 1621} {"train_loss": -11.775249481201172, "global_step": 272390, "epoch": 1621} {"train_loss": -11.268902778625488, "global_step": 272391, "epoch": 1621} {"train_loss": -11.521455764770508, "global_step": 272392, "epoch": 1621} {"train_loss": -12.222085952758789, "global_step": 272393, "epoch": 1621} {"train_loss": -11.971532821655273, "global_step": 272394, "epoch": 1621} {"train_loss": -12.047531127929688, "global_step": 272395, "epoch": 1621} {"train_loss": -12.342153549194336, "global_step": 272396, "epoch": 1621} {"train_loss": -12.018835067749023, "global_step": 272397, "epoch": 1621} {"train_loss": -12.301424980163574, "global_step": 272398, "epoch": 1621} {"train_loss": -12.191717147827148, "global_step": 272399, "epoch": 1621} {"train_loss": -12.029458999633789, "global_step": 272400, "epoch": 1621} {"train_loss": -12.0958833694458, "global_step": 272401, "epoch": 1621} {"train_loss": -12.065441131591797, "global_step": 272402, "epoch": 1621} {"train_loss": -11.673779487609863, "global_step": 272403, "epoch": 1621} {"train_loss": -12.063940048217773, "global_step": 272404, "epoch": 1621} {"train_loss": -12.267226219177246, "global_step": 272405, "epoch": 1621} {"train_loss": -12.027087211608887, "global_step": 272406, "epoch": 1621} {"train_loss": -12.15849494934082, "global_step": 272407, "epoch": 1621} {"train_loss": -12.263201713562012, "global_step": 272408, "epoch": 1621} {"train_loss": -11.373626708984375, "global_step": 272409, "epoch": 1621} {"train_loss": -11.809637069702148, "global_step": 272410, "epoch": 1621} {"train_loss": -12.145990371704102, "global_step": 272411, "epoch": 1621} {"train_loss": -11.314772605895996, "global_step": 272412, "epoch": 1621} {"train_loss": -11.499922752380371, "global_step": 272413, "epoch": 1621} {"train_loss": -11.818079948425293, "global_step": 272414, "epoch": 1621} {"train_loss": -11.25602912902832, "global_step": 272415, "epoch": 1621} {"train_loss": -11.17340087890625, "global_step": 272416, "epoch": 1621} {"train_loss": -11.860884666442871, "global_step": 272417, "epoch": 1621} {"train_loss": -11.980447769165039, "global_step": 272418, "epoch": 1621} {"train_loss": -11.083162307739258, "global_step": 272419, "epoch": 1621} {"train_loss": -11.598998069763184, "global_step": 272420, "epoch": 1621} {"train_loss": -11.656025886535645, "global_step": 272421, "epoch": 1621} {"train_loss": -11.968915939331055, "global_step": 272422, "epoch": 1621} {"train_loss": -11.686521530151367, "global_step": 272423, "epoch": 1621} {"train_loss": -12.303321838378906, "global_step": 272424, "epoch": 1621} {"train_loss": -11.766159057617188, "global_step": 272425, "epoch": 1621} {"train_loss": -11.659709930419922, "global_step": 272426, "epoch": 1621} {"train_loss": -11.831893920898438, "global_step": 272427, "epoch": 1621} {"train_loss": -11.888697624206543, "global_step": 272428, "epoch": 1621} {"train_loss": -12.144807815551758, "global_step": 272429, "epoch": 1621} {"train_loss": -11.673423767089844, "global_step": 272430, "epoch": 1621} {"train_loss": -11.990999221801758, "global_step": 272431, "epoch": 1621} {"train_loss": -11.625635147094727, "global_step": 272432, "epoch": 1621} {"train_loss": -12.00473403930664, "global_step": 272433, "epoch": 1621} {"train_loss": -11.293560981750488, "global_step": 272434, "epoch": 1621} {"train_loss": -11.392462730407715, "global_step": 272435, "epoch": 1621} {"train_loss": -11.777643203735352, "global_step": 272436, "epoch": 1621} {"train_loss": -11.75153923034668, "global_step": 272437, "epoch": 1621} {"train_loss": -11.429224014282227, "global_step": 272438, "epoch": 1621} {"train_loss": -11.369951248168945, "global_step": 272439, "epoch": 1621} {"train_loss": -11.267515182495117, "global_step": 272440, "epoch": 1621} {"train_loss": -10.861196517944336, "global_step": 272441, "epoch": 1621} {"train_loss": -11.259591102600098, "global_step": 272442, "epoch": 1621} {"train_loss": -11.228100776672363, "global_step": 272443, "epoch": 1621} {"train_loss": -11.472537994384766, "global_step": 272444, "epoch": 1621} {"train_loss": -10.928140640258789, "global_step": 272445, "epoch": 1621} {"train_loss": -11.504968643188477, "global_step": 272446, "epoch": 1621} {"train_loss": -10.01374340057373, "global_step": 272447, "epoch": 1621} {"train_loss": -10.9505615234375, "global_step": 272448, "epoch": 1621} {"train_loss": -10.021869659423828, "global_step": 272449, "epoch": 1621} {"train_loss": -11.139463424682617, "global_step": 272450, "epoch": 1621} {"train_loss": -10.602371215820312, "global_step": 272451, "epoch": 1621} {"train_loss": -11.399894714355469, "global_step": 272452, "epoch": 1621} {"train_loss": -10.136463165283203, "global_step": 272453, "epoch": 1621} {"train_loss": -10.575243949890137, "global_step": 272454, "epoch": 1621} {"train_loss": -10.852561950683594, "global_step": 272455, "epoch": 1621} {"train_loss": -10.377994537353516, "global_step": 272456, "epoch": 1621} {"train_loss": -10.851323127746582, "global_step": 272457, "epoch": 1621} {"train_loss": -10.842000961303711, "global_step": 272458, "epoch": 1621} {"train_loss": -10.78333568572998, "global_step": 272459, "epoch": 1621} {"train_loss": -11.500466346740723, "global_step": 272460, "epoch": 1621} {"train_loss": -11.454630851745605, "global_step": 272461, "epoch": 1621} {"train_loss": -11.259953498840332, "global_step": 272462, "epoch": 1621} {"train_loss": -11.781270980834961, "global_step": 272463, "epoch": 1621} {"train_loss": -11.175032615661621, "global_step": 272464, "epoch": 1621} {"train_loss": -11.732627868652344, "global_step": 272465, "epoch": 1621} {"train_loss": -11.51999568939209, "global_step": 272466, "epoch": 1621} {"train_loss": -11.770198822021484, "global_step": 272467, "epoch": 1621} {"train_loss": -11.800880432128906, "global_step": 272468, "epoch": 1621} {"train_loss": -11.514791488647461, "global_step": 272469, "epoch": 1621} {"train_loss": -11.802511215209961, "global_step": 272470, "epoch": 1621} {"train_loss": -11.660377502441406, "global_step": 272471, "epoch": 1621} {"train_loss": -11.757102966308594, "global_step": 272472, "epoch": 1621} {"train_loss": -11.757923126220703, "global_step": 272473, "epoch": 1621} {"train_loss": -11.920063972473145, "global_step": 272474, "epoch": 1621} {"train_loss": -11.652179718017578, "global_step": 272475, "epoch": 1621} {"train_loss": -11.572694778442383, "global_step": 272476, "epoch": 1621} {"train_loss": -11.730953216552734, "global_step": 272477, "epoch": 1621} {"train_loss": -11.769819259643555, "global_step": 272478, "epoch": 1621} {"train_loss": -11.894227981567383, "global_step": 272479, "epoch": 1621} {"train_loss": -11.42253303527832, "global_step": 272480, "epoch": 1621} {"train_loss": -11.809076309204102, "global_step": 272481, "epoch": 1621} {"train_loss": -11.633234024047852, "global_step": 272482, "epoch": 1621} {"train_loss": -11.889325141906738, "global_step": 272483, "epoch": 1621} {"train_loss": -11.544925689697266, "global_step": 272484, "epoch": 1621} {"train_loss": -11.758016586303711, "global_step": 272485, "epoch": 1621} {"train_loss": -11.695574760437012, "global_step": 272486, "epoch": 1621} {"train_loss": -11.814453125, "global_step": 272487, "epoch": 1621} {"train_loss": -11.36453628540039, "global_step": 272488, "epoch": 1621} {"train_loss": -11.56391716003418, "global_step": 272489, "epoch": 1621} {"train_loss": -11.769271850585938, "global_step": 272490, "epoch": 1621} {"train_loss": -11.875261306762695, "global_step": 272491, "epoch": 1621} {"train_loss": -11.507721900939941, "global_step": 272492, "epoch": 1621} {"train_loss": -11.957198143005371, "global_step": 272493, "epoch": 1621} {"train_loss": -11.88284969329834, "global_step": 272494, "epoch": 1621} {"train_loss": -11.624815969240098, "global_step": 272495, "epoch": 1621, "val_loss": 272742.125} {"train_loss": -11.495428085327148, "global_step": 272496, "epoch": 1622} {"train_loss": -11.803117752075195, "global_step": 272497, "epoch": 1622} {"train_loss": -11.432659149169922, "global_step": 272498, "epoch": 1622} {"train_loss": -12.104177474975586, "global_step": 272499, "epoch": 1622} {"train_loss": -11.639104843139648, "global_step": 272500, "epoch": 1622} {"train_loss": -11.81098747253418, "global_step": 272501, "epoch": 1622} {"train_loss": -11.640493392944336, "global_step": 272502, "epoch": 1622} {"train_loss": -11.895642280578613, "global_step": 272503, "epoch": 1622} {"train_loss": -12.00197696685791, "global_step": 272504, "epoch": 1622} {"train_loss": -11.979813575744629, "global_step": 272505, "epoch": 1622} {"train_loss": -11.994908332824707, "global_step": 272506, "epoch": 1622} {"train_loss": -11.934289932250977, "global_step": 272507, "epoch": 1622} {"train_loss": -12.195205688476562, "global_step": 272508, "epoch": 1622} {"train_loss": -12.149940490722656, "global_step": 272509, "epoch": 1622} {"train_loss": -12.162164688110352, "global_step": 272510, "epoch": 1622} {"train_loss": -12.001683235168457, "global_step": 272511, "epoch": 1622} {"train_loss": -11.599932670593262, "global_step": 272512, "epoch": 1622} {"train_loss": -12.093405723571777, "global_step": 272513, "epoch": 1622} {"train_loss": -11.903924942016602, "global_step": 272514, "epoch": 1622} {"train_loss": -12.153078079223633, "global_step": 272515, "epoch": 1622} {"train_loss": -12.026617050170898, "global_step": 272516, "epoch": 1622} {"train_loss": -12.21304988861084, "global_step": 272517, "epoch": 1622} {"train_loss": -12.145692825317383, "global_step": 272518, "epoch": 1622} {"train_loss": -11.854801177978516, "global_step": 272519, "epoch": 1622} {"train_loss": -12.160778999328613, "global_step": 272520, "epoch": 1622} {"train_loss": -12.211170196533203, "global_step": 272521, "epoch": 1622} {"train_loss": -11.986769676208496, "global_step": 272522, "epoch": 1622} {"train_loss": -11.991571426391602, "global_step": 272523, "epoch": 1622} {"train_loss": -12.09809684753418, "global_step": 272524, "epoch": 1622} {"train_loss": -12.139352798461914, "global_step": 272525, "epoch": 1622} {"train_loss": -12.175952911376953, "global_step": 272526, "epoch": 1622} {"train_loss": -11.991207122802734, "global_step": 272527, "epoch": 1622} {"train_loss": -12.278680801391602, "global_step": 272528, "epoch": 1622} {"train_loss": -11.858970642089844, "global_step": 272529, "epoch": 1622} {"train_loss": -11.695024490356445, "global_step": 272530, "epoch": 1622} {"train_loss": -12.234831809997559, "global_step": 272531, "epoch": 1622} {"train_loss": -11.608800888061523, "global_step": 272532, "epoch": 1622} {"train_loss": -12.157951354980469, "global_step": 272533, "epoch": 1622} {"train_loss": -12.167842864990234, "global_step": 272534, "epoch": 1622} {"train_loss": -12.17782211303711, "global_step": 272535, "epoch": 1622} {"train_loss": -12.371602058410645, "global_step": 272536, "epoch": 1622} {"train_loss": -12.055196762084961, "global_step": 272537, "epoch": 1622} {"train_loss": -12.392497062683105, "global_step": 272538, "epoch": 1622} {"train_loss": -12.282388687133789, "global_step": 272539, "epoch": 1622} {"train_loss": -12.143386840820312, "global_step": 272540, "epoch": 1622} {"train_loss": -12.030147552490234, "global_step": 272541, "epoch": 1622} {"train_loss": -12.109792709350586, "global_step": 272542, "epoch": 1622} {"train_loss": -12.392768859863281, "global_step": 272543, "epoch": 1622} {"train_loss": -11.999460220336914, "global_step": 272544, "epoch": 1622} {"train_loss": -12.184917449951172, "global_step": 272545, "epoch": 1622} {"train_loss": -12.147520065307617, "global_step": 272546, "epoch": 1622} {"train_loss": -12.158750534057617, "global_step": 272547, "epoch": 1622} {"train_loss": -12.202035903930664, "global_step": 272548, "epoch": 1622} {"train_loss": -11.888155937194824, "global_step": 272549, "epoch": 1622} {"train_loss": -12.110233306884766, "global_step": 272550, "epoch": 1622} {"train_loss": -12.175996780395508, "global_step": 272551, "epoch": 1622} {"train_loss": -11.64586353302002, "global_step": 272552, "epoch": 1622} {"train_loss": -12.034721374511719, "global_step": 272553, "epoch": 1622} {"train_loss": -12.114887237548828, "global_step": 272554, "epoch": 1622} {"train_loss": -11.826662063598633, "global_step": 272555, "epoch": 1622} {"train_loss": -12.212846755981445, "global_step": 272556, "epoch": 1622} {"train_loss": -12.399677276611328, "global_step": 272557, "epoch": 1622} {"train_loss": -12.049781799316406, "global_step": 272558, "epoch": 1622} {"train_loss": -11.884361267089844, "global_step": 272559, "epoch": 1622} {"train_loss": -11.829819679260254, "global_step": 272560, "epoch": 1622} {"train_loss": -12.245083808898926, "global_step": 272561, "epoch": 1622} {"train_loss": -11.957818031311035, "global_step": 272562, "epoch": 1622} {"train_loss": -11.302946090698242, "global_step": 272563, "epoch": 1622} {"train_loss": -11.448288917541504, "global_step": 272564, "epoch": 1622} {"train_loss": -12.198511123657227, "global_step": 272565, "epoch": 1622} {"train_loss": -11.46676254272461, "global_step": 272566, "epoch": 1622} {"train_loss": -11.696290969848633, "global_step": 272567, "epoch": 1622} {"train_loss": -11.708160400390625, "global_step": 272568, "epoch": 1622} {"train_loss": -11.851353645324707, "global_step": 272569, "epoch": 1622} {"train_loss": -11.366933822631836, "global_step": 272570, "epoch": 1622} {"train_loss": -11.459078788757324, "global_step": 272571, "epoch": 1622} {"train_loss": -11.889049530029297, "global_step": 272572, "epoch": 1622} {"train_loss": -11.734253883361816, "global_step": 272573, "epoch": 1622} {"train_loss": -11.120841979980469, "global_step": 272574, "epoch": 1622} {"train_loss": -11.126504898071289, "global_step": 272575, "epoch": 1622} {"train_loss": -12.131240844726562, "global_step": 272576, "epoch": 1622} {"train_loss": -11.515706062316895, "global_step": 272577, "epoch": 1622} {"train_loss": -10.955465316772461, "global_step": 272578, "epoch": 1622} {"train_loss": -11.53360366821289, "global_step": 272579, "epoch": 1622} {"train_loss": -11.905535697937012, "global_step": 272580, "epoch": 1622} {"train_loss": -9.954526901245117, "global_step": 272581, "epoch": 1622} {"train_loss": -11.215411186218262, "global_step": 272582, "epoch": 1622} {"train_loss": -11.32578182220459, "global_step": 272583, "epoch": 1622} {"train_loss": -11.56667709350586, "global_step": 272584, "epoch": 1622} {"train_loss": -11.370838165283203, "global_step": 272585, "epoch": 1622} {"train_loss": -11.361259460449219, "global_step": 272586, "epoch": 1622} {"train_loss": -11.19174575805664, "global_step": 272587, "epoch": 1622} {"train_loss": -11.322610855102539, "global_step": 272588, "epoch": 1622} {"train_loss": -10.729009628295898, "global_step": 272589, "epoch": 1622} {"train_loss": -10.584512710571289, "global_step": 272590, "epoch": 1622} {"train_loss": -10.63545036315918, "global_step": 272591, "epoch": 1622} {"train_loss": -11.181304931640625, "global_step": 272592, "epoch": 1622} {"train_loss": -10.10621452331543, "global_step": 272593, "epoch": 1622} {"train_loss": -11.090120315551758, "global_step": 272594, "epoch": 1622} {"train_loss": -11.045406341552734, "global_step": 272595, "epoch": 1622} {"train_loss": -9.838264465332031, "global_step": 272596, "epoch": 1622} {"train_loss": -10.785457611083984, "global_step": 272597, "epoch": 1622} {"train_loss": -10.003620147705078, "global_step": 272598, "epoch": 1622} {"train_loss": -10.225855827331543, "global_step": 272599, "epoch": 1622} {"train_loss": -10.36657428741455, "global_step": 272600, "epoch": 1622} {"train_loss": -10.95501708984375, "global_step": 272601, "epoch": 1622} {"train_loss": -10.551708221435547, "global_step": 272602, "epoch": 1622} {"train_loss": -11.310403823852539, "global_step": 272603, "epoch": 1622} {"train_loss": -10.147760391235352, "global_step": 272604, "epoch": 1622} {"train_loss": -11.595474243164062, "global_step": 272605, "epoch": 1622} {"train_loss": -10.743110656738281, "global_step": 272606, "epoch": 1622} {"train_loss": -11.310356140136719, "global_step": 272607, "epoch": 1622} {"train_loss": -11.4042329788208, "global_step": 272608, "epoch": 1622} {"train_loss": -11.473261833190918, "global_step": 272609, "epoch": 1622} {"train_loss": -11.47109603881836, "global_step": 272610, "epoch": 1622} {"train_loss": -11.139700889587402, "global_step": 272611, "epoch": 1622} {"train_loss": -11.287409782409668, "global_step": 272612, "epoch": 1622} {"train_loss": -11.47950553894043, "global_step": 272613, "epoch": 1622} {"train_loss": -11.404011726379395, "global_step": 272614, "epoch": 1622} {"train_loss": -12.01803207397461, "global_step": 272615, "epoch": 1622} {"train_loss": -11.564342498779297, "global_step": 272616, "epoch": 1622} {"train_loss": -11.73106861114502, "global_step": 272617, "epoch": 1622} {"train_loss": -11.61181640625, "global_step": 272618, "epoch": 1622} {"train_loss": -11.593233108520508, "global_step": 272619, "epoch": 1622} {"train_loss": -11.794261932373047, "global_step": 272620, "epoch": 1622} {"train_loss": -11.82113265991211, "global_step": 272621, "epoch": 1622} {"train_loss": -11.861712455749512, "global_step": 272622, "epoch": 1622} {"train_loss": -11.75411605834961, "global_step": 272623, "epoch": 1622} {"train_loss": -11.70406723022461, "global_step": 272624, "epoch": 1622} {"train_loss": -11.86992073059082, "global_step": 272625, "epoch": 1622} {"train_loss": -11.899389266967773, "global_step": 272626, "epoch": 1622} {"train_loss": -11.886402130126953, "global_step": 272627, "epoch": 1622} {"train_loss": -11.88378620147705, "global_step": 272628, "epoch": 1622} {"train_loss": -11.933258056640625, "global_step": 272629, "epoch": 1622} {"train_loss": -11.866388320922852, "global_step": 272630, "epoch": 1622} {"train_loss": -11.87968635559082, "global_step": 272631, "epoch": 1622} {"train_loss": -11.873104095458984, "global_step": 272632, "epoch": 1622} {"train_loss": -11.66207218170166, "global_step": 272633, "epoch": 1622} {"train_loss": -11.87095832824707, "global_step": 272634, "epoch": 1622} {"train_loss": -11.919864654541016, "global_step": 272635, "epoch": 1622} {"train_loss": -11.971097946166992, "global_step": 272636, "epoch": 1622} {"train_loss": -11.819316864013672, "global_step": 272637, "epoch": 1622} {"train_loss": -11.878013610839844, "global_step": 272638, "epoch": 1622} {"train_loss": -12.022765159606934, "global_step": 272639, "epoch": 1622} {"train_loss": -12.022073745727539, "global_step": 272640, "epoch": 1622} {"train_loss": -12.13523006439209, "global_step": 272641, "epoch": 1622} {"train_loss": -11.956134796142578, "global_step": 272642, "epoch": 1622} {"train_loss": -11.900016784667969, "global_step": 272643, "epoch": 1622} {"train_loss": -11.842726707458496, "global_step": 272644, "epoch": 1622} {"train_loss": -12.284749984741211, "global_step": 272645, "epoch": 1622} {"train_loss": -12.012659072875977, "global_step": 272646, "epoch": 1622} {"train_loss": -12.173521041870117, "global_step": 272647, "epoch": 1622} {"train_loss": -11.914793014526367, "global_step": 272648, "epoch": 1622} {"train_loss": -12.373409271240234, "global_step": 272649, "epoch": 1622} {"train_loss": -11.794419288635254, "global_step": 272650, "epoch": 1622} {"train_loss": -11.923665046691895, "global_step": 272651, "epoch": 1622} {"train_loss": -11.920858383178711, "global_step": 272652, "epoch": 1622} {"train_loss": -12.00629997253418, "global_step": 272653, "epoch": 1622} {"train_loss": -11.690977096557617, "global_step": 272654, "epoch": 1622} {"train_loss": -11.8719482421875, "global_step": 272655, "epoch": 1622} {"train_loss": -12.076916694641113, "global_step": 272656, "epoch": 1622} {"train_loss": -11.568986892700195, "global_step": 272657, "epoch": 1622} {"train_loss": -11.827882766723633, "global_step": 272658, "epoch": 1622} {"train_loss": -11.60910701751709, "global_step": 272659, "epoch": 1622} {"train_loss": -11.90837574005127, "global_step": 272660, "epoch": 1622} {"train_loss": -11.105426788330078, "global_step": 272661, "epoch": 1622} {"train_loss": -11.284652709960938, "global_step": 272662, "epoch": 1622} {"train_loss": -11.709097794124059, "global_step": 272663, "epoch": 1622, "val_loss": 274732.03125} {"train_loss": -10.17947006225586, "global_step": 272664, "epoch": 1623} {"train_loss": -11.62761116027832, "global_step": 272665, "epoch": 1623} {"train_loss": -10.690526962280273, "global_step": 272666, "epoch": 1623} {"train_loss": -11.592413902282715, "global_step": 272667, "epoch": 1623} {"train_loss": -11.46096134185791, "global_step": 272668, "epoch": 1623} {"train_loss": -11.792106628417969, "global_step": 272669, "epoch": 1623} {"train_loss": -11.05966854095459, "global_step": 272670, "epoch": 1623} {"train_loss": -11.926114082336426, "global_step": 272671, "epoch": 1623} {"train_loss": -11.416306495666504, "global_step": 272672, "epoch": 1623} {"train_loss": -11.570510864257812, "global_step": 272673, "epoch": 1623} {"train_loss": -11.795879364013672, "global_step": 272674, "epoch": 1623} {"train_loss": -10.931815147399902, "global_step": 272675, "epoch": 1623} {"train_loss": -11.967747688293457, "global_step": 272676, "epoch": 1623} {"train_loss": -11.037327766418457, "global_step": 272677, "epoch": 1623} {"train_loss": -11.478324890136719, "global_step": 272678, "epoch": 1623} {"train_loss": -11.398597717285156, "global_step": 272679, "epoch": 1623} {"train_loss": -11.760579109191895, "global_step": 272680, "epoch": 1623} {"train_loss": -11.538701057434082, "global_step": 272681, "epoch": 1623} {"train_loss": -12.039888381958008, "global_step": 272682, "epoch": 1623} {"train_loss": -11.088415145874023, "global_step": 272683, "epoch": 1623} {"train_loss": -11.943552017211914, "global_step": 272684, "epoch": 1623} {"train_loss": -11.489222526550293, "global_step": 272685, "epoch": 1623} {"train_loss": -11.765439987182617, "global_step": 272686, "epoch": 1623} {"train_loss": -11.485723495483398, "global_step": 272687, "epoch": 1623} {"train_loss": -11.836939811706543, "global_step": 272688, "epoch": 1623} {"train_loss": -11.926032066345215, "global_step": 272689, "epoch": 1623} {"train_loss": -11.665763854980469, "global_step": 272690, "epoch": 1623} {"train_loss": -11.885679244995117, "global_step": 272691, "epoch": 1623} {"train_loss": -11.789260864257812, "global_step": 272692, "epoch": 1623} {"train_loss": -11.79855728149414, "global_step": 272693, "epoch": 1623} {"train_loss": -11.847552299499512, "global_step": 272694, "epoch": 1623} {"train_loss": -11.767809867858887, "global_step": 272695, "epoch": 1623} {"train_loss": -12.032279014587402, "global_step": 272696, "epoch": 1623} {"train_loss": -11.43914794921875, "global_step": 272697, "epoch": 1623} {"train_loss": -12.153980255126953, "global_step": 272698, "epoch": 1623} {"train_loss": -11.583318710327148, "global_step": 272699, "epoch": 1623} {"train_loss": -12.05420207977295, "global_step": 272700, "epoch": 1623} {"train_loss": -11.91791820526123, "global_step": 272701, "epoch": 1623} {"train_loss": -11.499022483825684, "global_step": 272702, "epoch": 1623} {"train_loss": -11.05862045288086, "global_step": 272703, "epoch": 1623} {"train_loss": -11.96853256225586, "global_step": 272704, "epoch": 1623} {"train_loss": -11.262828826904297, "global_step": 272705, "epoch": 1623} {"train_loss": -11.759325981140137, "global_step": 272706, "epoch": 1623} {"train_loss": -11.085870742797852, "global_step": 272707, "epoch": 1623} {"train_loss": -10.986777305603027, "global_step": 272708, "epoch": 1623} {"train_loss": -11.454477310180664, "global_step": 272709, "epoch": 1623} {"train_loss": -11.454357147216797, "global_step": 272710, "epoch": 1623} {"train_loss": -11.820741653442383, "global_step": 272711, "epoch": 1623} {"train_loss": -11.572607040405273, "global_step": 272712, "epoch": 1623} {"train_loss": -12.268442153930664, "global_step": 272713, "epoch": 1623} {"train_loss": -11.420854568481445, "global_step": 272714, "epoch": 1623} {"train_loss": -12.214380264282227, "global_step": 272715, "epoch": 1623} {"train_loss": -11.419321060180664, "global_step": 272716, "epoch": 1623} {"train_loss": -12.134389877319336, "global_step": 272717, "epoch": 1623} {"train_loss": -11.904899597167969, "global_step": 272718, "epoch": 1623} {"train_loss": -12.140223503112793, "global_step": 272719, "epoch": 1623} {"train_loss": -11.791301727294922, "global_step": 272720, "epoch": 1623} {"train_loss": -12.043963432312012, "global_step": 272721, "epoch": 1623} {"train_loss": -11.781570434570312, "global_step": 272722, "epoch": 1623} {"train_loss": -11.9623384475708, "global_step": 272723, "epoch": 1623} {"train_loss": -11.863146781921387, "global_step": 272724, "epoch": 1623} {"train_loss": -11.809389114379883, "global_step": 272725, "epoch": 1623} {"train_loss": -11.52831745147705, "global_step": 272726, "epoch": 1623} {"train_loss": -12.11795425415039, "global_step": 272727, "epoch": 1623} {"train_loss": -11.647541046142578, "global_step": 272728, "epoch": 1623} {"train_loss": -12.291122436523438, "global_step": 272729, "epoch": 1623} {"train_loss": -11.83470630645752, "global_step": 272730, "epoch": 1623} {"train_loss": -11.865800857543945, "global_step": 272731, "epoch": 1623} {"train_loss": -11.901407241821289, "global_step": 272732, "epoch": 1623} {"train_loss": -11.814598083496094, "global_step": 272733, "epoch": 1623} {"train_loss": -11.888494491577148, "global_step": 272734, "epoch": 1623} {"train_loss": -10.317489624023438, "global_step": 272735, "epoch": 1623} {"train_loss": -11.728154182434082, "global_step": 272736, "epoch": 1623} {"train_loss": -11.697454452514648, "global_step": 272737, "epoch": 1623} {"train_loss": -11.168004035949707, "global_step": 272738, "epoch": 1623} {"train_loss": -11.291566848754883, "global_step": 272739, "epoch": 1623} {"train_loss": -11.760910987854004, "global_step": 272740, "epoch": 1623} {"train_loss": -11.358516693115234, "global_step": 272741, "epoch": 1623} {"train_loss": -11.72966480255127, "global_step": 272742, "epoch": 1623} {"train_loss": -11.220935821533203, "global_step": 272743, "epoch": 1623} {"train_loss": -11.282146453857422, "global_step": 272744, "epoch": 1623} {"train_loss": -11.10184097290039, "global_step": 272745, "epoch": 1623} {"train_loss": -10.009027481079102, "global_step": 272746, "epoch": 1623} {"train_loss": -11.849891662597656, "global_step": 272747, "epoch": 1623} {"train_loss": -9.905217170715332, "global_step": 272748, "epoch": 1623} {"train_loss": -10.766498565673828, "global_step": 272749, "epoch": 1623} {"train_loss": -10.423919677734375, "global_step": 272750, "epoch": 1623} {"train_loss": -10.250486373901367, "global_step": 272751, "epoch": 1623} {"train_loss": -11.144088745117188, "global_step": 272752, "epoch": 1623} {"train_loss": -10.795883178710938, "global_step": 272753, "epoch": 1623} {"train_loss": -10.94731330871582, "global_step": 272754, "epoch": 1623} {"train_loss": -10.154312133789062, "global_step": 272755, "epoch": 1623} {"train_loss": -11.278162002563477, "global_step": 272756, "epoch": 1623} {"train_loss": -10.637378692626953, "global_step": 272757, "epoch": 1623} {"train_loss": -11.42944049835205, "global_step": 272758, "epoch": 1623} {"train_loss": -10.26846694946289, "global_step": 272759, "epoch": 1623} {"train_loss": -10.936936378479004, "global_step": 272760, "epoch": 1623} {"train_loss": -11.01467514038086, "global_step": 272761, "epoch": 1623} {"train_loss": -11.424123764038086, "global_step": 272762, "epoch": 1623} {"train_loss": -10.893983840942383, "global_step": 272763, "epoch": 1623} {"train_loss": -10.49867057800293, "global_step": 272764, "epoch": 1623} {"train_loss": -10.837279319763184, "global_step": 272765, "epoch": 1623} {"train_loss": -11.0477294921875, "global_step": 272766, "epoch": 1623} {"train_loss": -10.41873550415039, "global_step": 272767, "epoch": 1623} {"train_loss": -11.523139953613281, "global_step": 272768, "epoch": 1623} {"train_loss": -11.096004486083984, "global_step": 272769, "epoch": 1623} {"train_loss": -11.280824661254883, "global_step": 272770, "epoch": 1623} {"train_loss": -11.444801330566406, "global_step": 272771, "epoch": 1623} {"train_loss": -11.228273391723633, "global_step": 272772, "epoch": 1623} {"train_loss": -11.726037979125977, "global_step": 272773, "epoch": 1623} {"train_loss": -11.596600532531738, "global_step": 272774, "epoch": 1623} {"train_loss": -11.465456008911133, "global_step": 272775, "epoch": 1623} {"train_loss": -11.703205108642578, "global_step": 272776, "epoch": 1623} {"train_loss": -11.414945602416992, "global_step": 272777, "epoch": 1623} {"train_loss": -11.523265838623047, "global_step": 272778, "epoch": 1623} {"train_loss": -11.594802856445312, "global_step": 272779, "epoch": 1623} {"train_loss": -11.675302505493164, "global_step": 272780, "epoch": 1623} {"train_loss": -11.886066436767578, "global_step": 272781, "epoch": 1623} {"train_loss": -11.775978088378906, "global_step": 272782, "epoch": 1623} {"train_loss": -11.920597076416016, "global_step": 272783, "epoch": 1623} {"train_loss": -11.802395820617676, "global_step": 272784, "epoch": 1623} {"train_loss": -11.925104141235352, "global_step": 272785, "epoch": 1623} {"train_loss": -12.062736511230469, "global_step": 272786, "epoch": 1623} {"train_loss": -12.020563125610352, "global_step": 272787, "epoch": 1623} {"train_loss": -12.019124984741211, "global_step": 272788, "epoch": 1623} {"train_loss": -12.148548126220703, "global_step": 272789, "epoch": 1623} {"train_loss": -11.901091575622559, "global_step": 272790, "epoch": 1623} {"train_loss": -12.098945617675781, "global_step": 272791, "epoch": 1623} {"train_loss": -12.144380569458008, "global_step": 272792, "epoch": 1623} {"train_loss": -11.963460922241211, "global_step": 272793, "epoch": 1623} {"train_loss": -12.05144214630127, "global_step": 272794, "epoch": 1623} {"train_loss": -12.046351432800293, "global_step": 272795, "epoch": 1623} {"train_loss": -11.895343780517578, "global_step": 272796, "epoch": 1623} {"train_loss": -12.13140869140625, "global_step": 272797, "epoch": 1623} {"train_loss": -11.966435432434082, "global_step": 272798, "epoch": 1623} {"train_loss": -12.154029846191406, "global_step": 272799, "epoch": 1623} {"train_loss": -12.139021873474121, "global_step": 272800, "epoch": 1623} {"train_loss": -12.23595142364502, "global_step": 272801, "epoch": 1623} {"train_loss": -12.146926879882812, "global_step": 272802, "epoch": 1623} {"train_loss": -11.945682525634766, "global_step": 272803, "epoch": 1623} {"train_loss": -12.230440139770508, "global_step": 272804, "epoch": 1623} {"train_loss": -12.095080375671387, "global_step": 272805, "epoch": 1623} {"train_loss": -12.238840103149414, "global_step": 272806, "epoch": 1623} {"train_loss": -12.276628494262695, "global_step": 272807, "epoch": 1623} {"train_loss": -12.445157051086426, "global_step": 272808, "epoch": 1623} {"train_loss": -12.098089218139648, "global_step": 272809, "epoch": 1623} {"train_loss": -12.222166061401367, "global_step": 272810, "epoch": 1623} {"train_loss": -12.223228454589844, "global_step": 272811, "epoch": 1623} {"train_loss": -12.230451583862305, "global_step": 272812, "epoch": 1623} {"train_loss": -12.106233596801758, "global_step": 272813, "epoch": 1623} {"train_loss": -12.166664123535156, "global_step": 272814, "epoch": 1623} {"train_loss": -12.26123046875, "global_step": 272815, "epoch": 1623} {"train_loss": -12.033119201660156, "global_step": 272816, "epoch": 1623} {"train_loss": -12.370094299316406, "global_step": 272817, "epoch": 1623} {"train_loss": -12.36482048034668, "global_step": 272818, "epoch": 1623} {"train_loss": -12.499067306518555, "global_step": 272819, "epoch": 1623} {"train_loss": -12.309423446655273, "global_step": 272820, "epoch": 1623} {"train_loss": -12.29672622680664, "global_step": 272821, "epoch": 1623} {"train_loss": -12.328960418701172, "global_step": 272822, "epoch": 1623} {"train_loss": -12.316606521606445, "global_step": 272823, "epoch": 1623} {"train_loss": -12.149789810180664, "global_step": 272824, "epoch": 1623} {"train_loss": -12.080337524414062, "global_step": 272825, "epoch": 1623} {"train_loss": -12.02255630493164, "global_step": 272826, "epoch": 1623} {"train_loss": -12.150128364562988, "global_step": 272827, "epoch": 1623} {"train_loss": -12.220197677612305, "global_step": 272828, "epoch": 1623} {"train_loss": -12.07665729522705, "global_step": 272829, "epoch": 1623} {"train_loss": -11.77132511138916, "global_step": 272830, "epoch": 1623} {"train_loss": -11.647593123572213, "global_step": 272831, "epoch": 1623, "val_loss": 274414.125} {"train_loss": -12.259873390197754, "global_step": 272832, "epoch": 1624} {"train_loss": -12.126126289367676, "global_step": 272833, "epoch": 1624} {"train_loss": -11.94165325164795, "global_step": 272834, "epoch": 1624} {"train_loss": -12.096538543701172, "global_step": 272835, "epoch": 1624} {"train_loss": -11.821773529052734, "global_step": 272836, "epoch": 1624} {"train_loss": -11.316765785217285, "global_step": 272837, "epoch": 1624} {"train_loss": -12.201004028320312, "global_step": 272838, "epoch": 1624} {"train_loss": -10.83619213104248, "global_step": 272839, "epoch": 1624} {"train_loss": -10.295360565185547, "global_step": 272840, "epoch": 1624} {"train_loss": -11.874069213867188, "global_step": 272841, "epoch": 1624} {"train_loss": -11.899236679077148, "global_step": 272842, "epoch": 1624} {"train_loss": -11.213430404663086, "global_step": 272843, "epoch": 1624} {"train_loss": -11.973480224609375, "global_step": 272844, "epoch": 1624} {"train_loss": -11.132197380065918, "global_step": 272845, "epoch": 1624} {"train_loss": -11.211935997009277, "global_step": 272846, "epoch": 1624} {"train_loss": -11.72653579711914, "global_step": 272847, "epoch": 1624} {"train_loss": -11.666399002075195, "global_step": 272848, "epoch": 1624} {"train_loss": -11.615228652954102, "global_step": 272849, "epoch": 1624} {"train_loss": -12.081585884094238, "global_step": 272850, "epoch": 1624} {"train_loss": -11.274680137634277, "global_step": 272851, "epoch": 1624} {"train_loss": -11.397744178771973, "global_step": 272852, "epoch": 1624} {"train_loss": -11.714323997497559, "global_step": 272853, "epoch": 1624} {"train_loss": -11.319347381591797, "global_step": 272854, "epoch": 1624} {"train_loss": -11.873292922973633, "global_step": 272855, "epoch": 1624} {"train_loss": -11.588981628417969, "global_step": 272856, "epoch": 1624} {"train_loss": -11.829883575439453, "global_step": 272857, "epoch": 1624} {"train_loss": -11.734691619873047, "global_step": 272858, "epoch": 1624} {"train_loss": -11.567901611328125, "global_step": 272859, "epoch": 1624} {"train_loss": -11.685506820678711, "global_step": 272860, "epoch": 1624} {"train_loss": -12.129533767700195, "global_step": 272861, "epoch": 1624} {"train_loss": -11.300230026245117, "global_step": 272862, "epoch": 1624} {"train_loss": -11.557500839233398, "global_step": 272863, "epoch": 1624} {"train_loss": -11.377214431762695, "global_step": 272864, "epoch": 1624} {"train_loss": -11.670862197875977, "global_step": 272865, "epoch": 1624} {"train_loss": -11.425369262695312, "global_step": 272866, "epoch": 1624} {"train_loss": -11.376205444335938, "global_step": 272867, "epoch": 1624} {"train_loss": -11.740428924560547, "global_step": 272868, "epoch": 1624} {"train_loss": -11.472060203552246, "global_step": 272869, "epoch": 1624} {"train_loss": -11.976834297180176, "global_step": 272870, "epoch": 1624} {"train_loss": -11.504657745361328, "global_step": 272871, "epoch": 1624} {"train_loss": -12.156517028808594, "global_step": 272872, "epoch": 1624} {"train_loss": -11.664346694946289, "global_step": 272873, "epoch": 1624} {"train_loss": -11.735891342163086, "global_step": 272874, "epoch": 1624} {"train_loss": -11.968507766723633, "global_step": 272875, "epoch": 1624} {"train_loss": -12.206042289733887, "global_step": 272876, "epoch": 1624} {"train_loss": -11.789840698242188, "global_step": 272877, "epoch": 1624} {"train_loss": -12.038475036621094, "global_step": 272878, "epoch": 1624} {"train_loss": -12.01551628112793, "global_step": 272879, "epoch": 1624} {"train_loss": -12.145652770996094, "global_step": 272880, "epoch": 1624} {"train_loss": -11.882930755615234, "global_step": 272881, "epoch": 1624} {"train_loss": -12.016189575195312, "global_step": 272882, "epoch": 1624} {"train_loss": -12.102463722229004, "global_step": 272883, "epoch": 1624} {"train_loss": -11.949560165405273, "global_step": 272884, "epoch": 1624} {"train_loss": -12.00103759765625, "global_step": 272885, "epoch": 1624} {"train_loss": -12.084314346313477, "global_step": 272886, "epoch": 1624} {"train_loss": -11.783953666687012, "global_step": 272887, "epoch": 1624} {"train_loss": -12.029605865478516, "global_step": 272888, "epoch": 1624} {"train_loss": -12.042471885681152, "global_step": 272889, "epoch": 1624} {"train_loss": -12.127527236938477, "global_step": 272890, "epoch": 1624} {"train_loss": -12.391542434692383, "global_step": 272891, "epoch": 1624} {"train_loss": -11.975381851196289, "global_step": 272892, "epoch": 1624} {"train_loss": -11.94729995727539, "global_step": 272893, "epoch": 1624} {"train_loss": -12.05581283569336, "global_step": 272894, "epoch": 1624} {"train_loss": -11.985164642333984, "global_step": 272895, "epoch": 1624} {"train_loss": -11.970002174377441, "global_step": 272896, "epoch": 1624} {"train_loss": -11.96900749206543, "global_step": 272897, "epoch": 1624} {"train_loss": -12.254777908325195, "global_step": 272898, "epoch": 1624} {"train_loss": -11.696186065673828, "global_step": 272899, "epoch": 1624} {"train_loss": -12.362046241760254, "global_step": 272900, "epoch": 1624} {"train_loss": -11.366143226623535, "global_step": 272901, "epoch": 1624} {"train_loss": -11.580873489379883, "global_step": 272902, "epoch": 1624} {"train_loss": -11.76037883758545, "global_step": 272903, "epoch": 1624} {"train_loss": -11.567432403564453, "global_step": 272904, "epoch": 1624} {"train_loss": -11.763622283935547, "global_step": 272905, "epoch": 1624} {"train_loss": -11.901909828186035, "global_step": 272906, "epoch": 1624} {"train_loss": -11.144906997680664, "global_step": 272907, "epoch": 1624} {"train_loss": -11.957725524902344, "global_step": 272908, "epoch": 1624} {"train_loss": -11.336016654968262, "global_step": 272909, "epoch": 1624} {"train_loss": -11.60360336303711, "global_step": 272910, "epoch": 1624} {"train_loss": -11.509827613830566, "global_step": 272911, "epoch": 1624} {"train_loss": -11.109933853149414, "global_step": 272912, "epoch": 1624} {"train_loss": -11.266866683959961, "global_step": 272913, "epoch": 1624} {"train_loss": -11.731566429138184, "global_step": 272914, "epoch": 1624} {"train_loss": -11.44937515258789, "global_step": 272915, "epoch": 1624} {"train_loss": -11.858427047729492, "global_step": 272916, "epoch": 1624} {"train_loss": -11.509398460388184, "global_step": 272917, "epoch": 1624} {"train_loss": -11.835016250610352, "global_step": 272918, "epoch": 1624} {"train_loss": -12.063384056091309, "global_step": 272919, "epoch": 1624} {"train_loss": -11.630891799926758, "global_step": 272920, "epoch": 1624} {"train_loss": -11.734310150146484, "global_step": 272921, "epoch": 1624} {"train_loss": -11.745187759399414, "global_step": 272922, "epoch": 1624} {"train_loss": -12.1525239944458, "global_step": 272923, "epoch": 1624} {"train_loss": -11.725500106811523, "global_step": 272924, "epoch": 1624} {"train_loss": -12.113788604736328, "global_step": 272925, "epoch": 1624} {"train_loss": -11.838191986083984, "global_step": 272926, "epoch": 1624} {"train_loss": -12.187732696533203, "global_step": 272927, "epoch": 1624} {"train_loss": -12.073823928833008, "global_step": 272928, "epoch": 1624} {"train_loss": -11.927669525146484, "global_step": 272929, "epoch": 1624} {"train_loss": -11.948759078979492, "global_step": 272930, "epoch": 1624} {"train_loss": -12.152528762817383, "global_step": 272931, "epoch": 1624} {"train_loss": -11.948331832885742, "global_step": 272932, "epoch": 1624} {"train_loss": -11.419855117797852, "global_step": 272933, "epoch": 1624} {"train_loss": -12.084068298339844, "global_step": 272934, "epoch": 1624} {"train_loss": -11.878592491149902, "global_step": 272935, "epoch": 1624} {"train_loss": -11.48432445526123, "global_step": 272936, "epoch": 1624} {"train_loss": -12.214967727661133, "global_step": 272937, "epoch": 1624} {"train_loss": -11.84931468963623, "global_step": 272938, "epoch": 1624} {"train_loss": -11.774415969848633, "global_step": 272939, "epoch": 1624} {"train_loss": -11.7518949508667, "global_step": 272940, "epoch": 1624} {"train_loss": -11.892599105834961, "global_step": 272941, "epoch": 1624} {"train_loss": -11.893594741821289, "global_step": 272942, "epoch": 1624} {"train_loss": -11.998153686523438, "global_step": 272943, "epoch": 1624} {"train_loss": -11.715255737304688, "global_step": 272944, "epoch": 1624} {"train_loss": -11.986164093017578, "global_step": 272945, "epoch": 1624} {"train_loss": -12.216991424560547, "global_step": 272946, "epoch": 1624} {"train_loss": -11.226078987121582, "global_step": 272947, "epoch": 1624} {"train_loss": -11.953340530395508, "global_step": 272948, "epoch": 1624} {"train_loss": -11.91168212890625, "global_step": 272949, "epoch": 1624} {"train_loss": -11.797277450561523, "global_step": 272950, "epoch": 1624} {"train_loss": -11.953901290893555, "global_step": 272951, "epoch": 1624} {"train_loss": -11.629825592041016, "global_step": 272952, "epoch": 1624} {"train_loss": -10.923025131225586, "global_step": 272953, "epoch": 1624} {"train_loss": -10.964117050170898, "global_step": 272954, "epoch": 1624} {"train_loss": -12.103599548339844, "global_step": 272955, "epoch": 1624} {"train_loss": -11.335729598999023, "global_step": 272956, "epoch": 1624} {"train_loss": -11.802467346191406, "global_step": 272957, "epoch": 1624} {"train_loss": -11.79803466796875, "global_step": 272958, "epoch": 1624} {"train_loss": -11.801410675048828, "global_step": 272959, "epoch": 1624} {"train_loss": -11.816384315490723, "global_step": 272960, "epoch": 1624} {"train_loss": -11.974157333374023, "global_step": 272961, "epoch": 1624} {"train_loss": -11.857797622680664, "global_step": 272962, "epoch": 1624} {"train_loss": -11.739888191223145, "global_step": 272963, "epoch": 1624} {"train_loss": -11.922637939453125, "global_step": 272964, "epoch": 1624} {"train_loss": -11.805554389953613, "global_step": 272965, "epoch": 1624} {"train_loss": -11.496893882751465, "global_step": 272966, "epoch": 1624} {"train_loss": -11.281554222106934, "global_step": 272967, "epoch": 1624} {"train_loss": -11.91054916381836, "global_step": 272968, "epoch": 1624} {"train_loss": -12.080667495727539, "global_step": 272969, "epoch": 1624} {"train_loss": -11.538440704345703, "global_step": 272970, "epoch": 1624} {"train_loss": -12.18116569519043, "global_step": 272971, "epoch": 1624} {"train_loss": -11.678564071655273, "global_step": 272972, "epoch": 1624} {"train_loss": -12.251628875732422, "global_step": 272973, "epoch": 1624} {"train_loss": -11.969894409179688, "global_step": 272974, "epoch": 1624} {"train_loss": -12.027667045593262, "global_step": 272975, "epoch": 1624} {"train_loss": -11.969206809997559, "global_step": 272976, "epoch": 1624} {"train_loss": -12.048856735229492, "global_step": 272977, "epoch": 1624} {"train_loss": -11.99606704711914, "global_step": 272978, "epoch": 1624} {"train_loss": -12.038061141967773, "global_step": 272979, "epoch": 1624} {"train_loss": -12.035980224609375, "global_step": 272980, "epoch": 1624} {"train_loss": -11.596799850463867, "global_step": 272981, "epoch": 1624} {"train_loss": -12.060903549194336, "global_step": 272982, "epoch": 1624} {"train_loss": -11.991576194763184, "global_step": 272983, "epoch": 1624} {"train_loss": -11.901391983032227, "global_step": 272984, "epoch": 1624} {"train_loss": -11.914199829101562, "global_step": 272985, "epoch": 1624} {"train_loss": -12.128978729248047, "global_step": 272986, "epoch": 1624} {"train_loss": -11.509536743164062, "global_step": 272987, "epoch": 1624} {"train_loss": -11.933746337890625, "global_step": 272988, "epoch": 1624} {"train_loss": -12.085460662841797, "global_step": 272989, "epoch": 1624} {"train_loss": -11.890161514282227, "global_step": 272990, "epoch": 1624} {"train_loss": -11.484115600585938, "global_step": 272991, "epoch": 1624} {"train_loss": -12.269359588623047, "global_step": 272992, "epoch": 1624} {"train_loss": -11.259761810302734, "global_step": 272993, "epoch": 1624} {"train_loss": -12.13756275177002, "global_step": 272994, "epoch": 1624} {"train_loss": -11.9795560836792, "global_step": 272995, "epoch": 1624} {"train_loss": -12.067955017089844, "global_step": 272996, "epoch": 1624} {"train_loss": -11.753419876098633, "global_step": 272997, "epoch": 1624} {"train_loss": -11.637483596801758, "global_step": 272998, "epoch": 1624} {"train_loss": -11.788601761772519, "global_step": 272999, "epoch": 1624, "val_loss": 273089.84375} {"train_loss": -12.171561241149902, "global_step": 273000, "epoch": 1625} {"train_loss": -11.23031234741211, "global_step": 273001, "epoch": 1625} {"train_loss": -11.493894577026367, "global_step": 273002, "epoch": 1625} {"train_loss": -11.952484130859375, "global_step": 273003, "epoch": 1625} {"train_loss": -11.678279876708984, "global_step": 273004, "epoch": 1625} {"train_loss": -11.97134017944336, "global_step": 273005, "epoch": 1625} {"train_loss": -11.959760665893555, "global_step": 273006, "epoch": 1625} {"train_loss": -11.900390625, "global_step": 273007, "epoch": 1625} {"train_loss": -11.776984214782715, "global_step": 273008, "epoch": 1625} {"train_loss": -12.027324676513672, "global_step": 273009, "epoch": 1625} {"train_loss": -11.65723991394043, "global_step": 273010, "epoch": 1625} {"train_loss": -11.749519348144531, "global_step": 273011, "epoch": 1625} {"train_loss": -12.022798538208008, "global_step": 273012, "epoch": 1625} {"train_loss": -11.648360252380371, "global_step": 273013, "epoch": 1625} {"train_loss": -12.201637268066406, "global_step": 273014, "epoch": 1625} {"train_loss": -12.223182678222656, "global_step": 273015, "epoch": 1625} {"train_loss": -12.08928108215332, "global_step": 273016, "epoch": 1625} {"train_loss": -12.11128044128418, "global_step": 273017, "epoch": 1625} {"train_loss": -11.85276985168457, "global_step": 273018, "epoch": 1625} {"train_loss": -12.30087661743164, "global_step": 273019, "epoch": 1625} {"train_loss": -11.938871383666992, "global_step": 273020, "epoch": 1625} {"train_loss": -12.284719467163086, "global_step": 273021, "epoch": 1625} {"train_loss": -12.060965538024902, "global_step": 273022, "epoch": 1625} {"train_loss": -11.930448532104492, "global_step": 273023, "epoch": 1625} {"train_loss": -12.140195846557617, "global_step": 273024, "epoch": 1625} {"train_loss": -12.14507007598877, "global_step": 273025, "epoch": 1625} {"train_loss": -12.061097145080566, "global_step": 273026, "epoch": 1625} {"train_loss": -12.082355499267578, "global_step": 273027, "epoch": 1625} {"train_loss": -12.074483871459961, "global_step": 273028, "epoch": 1625} {"train_loss": -11.944931983947754, "global_step": 273029, "epoch": 1625} {"train_loss": -12.073023796081543, "global_step": 273030, "epoch": 1625} {"train_loss": -12.120658874511719, "global_step": 273031, "epoch": 1625} {"train_loss": -12.058717727661133, "global_step": 273032, "epoch": 1625} {"train_loss": -12.1812162399292, "global_step": 273033, "epoch": 1625} {"train_loss": -11.592653274536133, "global_step": 273034, "epoch": 1625} {"train_loss": -11.331315994262695, "global_step": 273035, "epoch": 1625} {"train_loss": -11.674877166748047, "global_step": 273036, "epoch": 1625} {"train_loss": -11.663036346435547, "global_step": 273037, "epoch": 1625} {"train_loss": -10.682130813598633, "global_step": 273038, "epoch": 1625} {"train_loss": -12.021631240844727, "global_step": 273039, "epoch": 1625} {"train_loss": -11.012548446655273, "global_step": 273040, "epoch": 1625} {"train_loss": -10.986591339111328, "global_step": 273041, "epoch": 1625} {"train_loss": -11.155010223388672, "global_step": 273042, "epoch": 1625} {"train_loss": -11.718524932861328, "global_step": 273043, "epoch": 1625} {"train_loss": -10.998758316040039, "global_step": 273044, "epoch": 1625} {"train_loss": -11.75993537902832, "global_step": 273045, "epoch": 1625} {"train_loss": -10.550630569458008, "global_step": 273046, "epoch": 1625} {"train_loss": -10.850198745727539, "global_step": 273047, "epoch": 1625} {"train_loss": -12.143470764160156, "global_step": 273048, "epoch": 1625} {"train_loss": -11.745742797851562, "global_step": 273049, "epoch": 1625} {"train_loss": -12.055662155151367, "global_step": 273050, "epoch": 1625} {"train_loss": -11.507213592529297, "global_step": 273051, "epoch": 1625} {"train_loss": -12.03268814086914, "global_step": 273052, "epoch": 1625} {"train_loss": -11.698410034179688, "global_step": 273053, "epoch": 1625} {"train_loss": -11.927845001220703, "global_step": 273054, "epoch": 1625} {"train_loss": -11.828075408935547, "global_step": 273055, "epoch": 1625} {"train_loss": -11.95621109008789, "global_step": 273056, "epoch": 1625} {"train_loss": -12.001212120056152, "global_step": 273057, "epoch": 1625} {"train_loss": -12.071441650390625, "global_step": 273058, "epoch": 1625} {"train_loss": -12.186954498291016, "global_step": 273059, "epoch": 1625} {"train_loss": -11.930030822753906, "global_step": 273060, "epoch": 1625} {"train_loss": -12.036323547363281, "global_step": 273061, "epoch": 1625} {"train_loss": -11.63230037689209, "global_step": 273062, "epoch": 1625} {"train_loss": -12.102956771850586, "global_step": 273063, "epoch": 1625} {"train_loss": -11.727736473083496, "global_step": 273064, "epoch": 1625} {"train_loss": -11.814085960388184, "global_step": 273065, "epoch": 1625} {"train_loss": -11.978246688842773, "global_step": 273066, "epoch": 1625} {"train_loss": -11.834100723266602, "global_step": 273067, "epoch": 1625} {"train_loss": -11.887699127197266, "global_step": 273068, "epoch": 1625} {"train_loss": -11.88957691192627, "global_step": 273069, "epoch": 1625} {"train_loss": -11.91238021850586, "global_step": 273070, "epoch": 1625} {"train_loss": -11.680744171142578, "global_step": 273071, "epoch": 1625} {"train_loss": -11.498690605163574, "global_step": 273072, "epoch": 1625} {"train_loss": -11.766752243041992, "global_step": 273073, "epoch": 1625} {"train_loss": -12.089733123779297, "global_step": 273074, "epoch": 1625} {"train_loss": -11.04596996307373, "global_step": 273075, "epoch": 1625} {"train_loss": -11.748181343078613, "global_step": 273076, "epoch": 1625} {"train_loss": -12.025283813476562, "global_step": 273077, "epoch": 1625} {"train_loss": -12.08735466003418, "global_step": 273078, "epoch": 1625} {"train_loss": -11.504928588867188, "global_step": 273079, "epoch": 1625} {"train_loss": -11.398392677307129, "global_step": 273080, "epoch": 1625} {"train_loss": -12.032166481018066, "global_step": 273081, "epoch": 1625} {"train_loss": -11.830028533935547, "global_step": 273082, "epoch": 1625} {"train_loss": -11.309415817260742, "global_step": 273083, "epoch": 1625} {"train_loss": -11.793291091918945, "global_step": 273084, "epoch": 1625} {"train_loss": -11.705753326416016, "global_step": 273085, "epoch": 1625} {"train_loss": -10.665750503540039, "global_step": 273086, "epoch": 1625} {"train_loss": -11.536580085754395, "global_step": 273087, "epoch": 1625} {"train_loss": -11.389934539794922, "global_step": 273088, "epoch": 1625} {"train_loss": -11.178903579711914, "global_step": 273089, "epoch": 1625} {"train_loss": -11.092406272888184, "global_step": 273090, "epoch": 1625} {"train_loss": -11.679313659667969, "global_step": 273091, "epoch": 1625} {"train_loss": -10.799476623535156, "global_step": 273092, "epoch": 1625} {"train_loss": -10.919455528259277, "global_step": 273093, "epoch": 1625} {"train_loss": -11.86115550994873, "global_step": 273094, "epoch": 1625} {"train_loss": -11.199380874633789, "global_step": 273095, "epoch": 1625} {"train_loss": -11.538187026977539, "global_step": 273096, "epoch": 1625} {"train_loss": -11.934026718139648, "global_step": 273097, "epoch": 1625} {"train_loss": -12.01174259185791, "global_step": 273098, "epoch": 1625} {"train_loss": -11.59897232055664, "global_step": 273099, "epoch": 1625} {"train_loss": -11.59068489074707, "global_step": 273100, "epoch": 1625} {"train_loss": -11.550167083740234, "global_step": 273101, "epoch": 1625} {"train_loss": -11.521750450134277, "global_step": 273102, "epoch": 1625} {"train_loss": -10.787450790405273, "global_step": 273103, "epoch": 1625} {"train_loss": -11.443704605102539, "global_step": 273104, "epoch": 1625} {"train_loss": -11.552870750427246, "global_step": 273105, "epoch": 1625} {"train_loss": -11.140616416931152, "global_step": 273106, "epoch": 1625} {"train_loss": -12.092643737792969, "global_step": 273107, "epoch": 1625} {"train_loss": -11.153559684753418, "global_step": 273108, "epoch": 1625} {"train_loss": -11.916254043579102, "global_step": 273109, "epoch": 1625} {"train_loss": -11.399675369262695, "global_step": 273110, "epoch": 1625} {"train_loss": -11.51571273803711, "global_step": 273111, "epoch": 1625} {"train_loss": -11.359081268310547, "global_step": 273112, "epoch": 1625} {"train_loss": -11.63380241394043, "global_step": 273113, "epoch": 1625} {"train_loss": -11.323972702026367, "global_step": 273114, "epoch": 1625} {"train_loss": -11.956836700439453, "global_step": 273115, "epoch": 1625} {"train_loss": -11.600406646728516, "global_step": 273116, "epoch": 1625} {"train_loss": -11.423908233642578, "global_step": 273117, "epoch": 1625} {"train_loss": -11.275843620300293, "global_step": 273118, "epoch": 1625} {"train_loss": -11.510412216186523, "global_step": 273119, "epoch": 1625} {"train_loss": -9.150877952575684, "global_step": 273120, "epoch": 1625} {"train_loss": -11.10903263092041, "global_step": 273121, "epoch": 1625} {"train_loss": -11.148988723754883, "global_step": 273122, "epoch": 1625} {"train_loss": -9.412830352783203, "global_step": 273123, "epoch": 1625} {"train_loss": -9.798250198364258, "global_step": 273124, "epoch": 1625} {"train_loss": -11.360055923461914, "global_step": 273125, "epoch": 1625} {"train_loss": -9.810922622680664, "global_step": 273126, "epoch": 1625} {"train_loss": -10.451801300048828, "global_step": 273127, "epoch": 1625} {"train_loss": -11.437664031982422, "global_step": 273128, "epoch": 1625} {"train_loss": -10.329771041870117, "global_step": 273129, "epoch": 1625} {"train_loss": -11.69044017791748, "global_step": 273130, "epoch": 1625} {"train_loss": -11.579816818237305, "global_step": 273131, "epoch": 1625} {"train_loss": -10.97462272644043, "global_step": 273132, "epoch": 1625} {"train_loss": -11.547073364257812, "global_step": 273133, "epoch": 1625} {"train_loss": -10.966217994689941, "global_step": 273134, "epoch": 1625} {"train_loss": -11.72647476196289, "global_step": 273135, "epoch": 1625} {"train_loss": -11.392599105834961, "global_step": 273136, "epoch": 1625} {"train_loss": -11.252744674682617, "global_step": 273137, "epoch": 1625} {"train_loss": -11.788890838623047, "global_step": 273138, "epoch": 1625} {"train_loss": -11.66508674621582, "global_step": 273139, "epoch": 1625} {"train_loss": -11.886178970336914, "global_step": 273140, "epoch": 1625} {"train_loss": -12.003729820251465, "global_step": 273141, "epoch": 1625} {"train_loss": -11.648658752441406, "global_step": 273142, "epoch": 1625} {"train_loss": -11.817899703979492, "global_step": 273143, "epoch": 1625} {"train_loss": -11.743852615356445, "global_step": 273144, "epoch": 1625} {"train_loss": -11.708124160766602, "global_step": 273145, "epoch": 1625} {"train_loss": -12.184381484985352, "global_step": 273146, "epoch": 1625} {"train_loss": -11.828512191772461, "global_step": 273147, "epoch": 1625} {"train_loss": -11.771818161010742, "global_step": 273148, "epoch": 1625} {"train_loss": -11.907261848449707, "global_step": 273149, "epoch": 1625} {"train_loss": -11.961488723754883, "global_step": 273150, "epoch": 1625} {"train_loss": -11.673493385314941, "global_step": 273151, "epoch": 1625} {"train_loss": -12.06529426574707, "global_step": 273152, "epoch": 1625} {"train_loss": -11.939475059509277, "global_step": 273153, "epoch": 1625} {"train_loss": -11.975244522094727, "global_step": 273154, "epoch": 1625} {"train_loss": -11.988199234008789, "global_step": 273155, "epoch": 1625} {"train_loss": -12.16066837310791, "global_step": 273156, "epoch": 1625} {"train_loss": -11.86760139465332, "global_step": 273157, "epoch": 1625} {"train_loss": -11.867183685302734, "global_step": 273158, "epoch": 1625} {"train_loss": -11.922430038452148, "global_step": 273159, "epoch": 1625} {"train_loss": -12.071011543273926, "global_step": 273160, "epoch": 1625} {"train_loss": -12.092262268066406, "global_step": 273161, "epoch": 1625} {"train_loss": -12.106780052185059, "global_step": 273162, "epoch": 1625} {"train_loss": -12.086055755615234, "global_step": 273163, "epoch": 1625} {"train_loss": -12.063562393188477, "global_step": 273164, "epoch": 1625} {"train_loss": -11.880697250366211, "global_step": 273165, "epoch": 1625} {"train_loss": -12.022367477416992, "global_step": 273166, "epoch": 1625} {"train_loss": -11.645619046120416, "global_step": 273167, "epoch": 1625, "val_loss": 263381.28125, "train_action_mse_error": 1.2149344682693481} {"train_loss": -11.914072036743164, "global_step": 273168, "epoch": 1626} {"train_loss": -11.73037338256836, "global_step": 273169, "epoch": 1626} {"train_loss": -11.772192001342773, "global_step": 273170, "epoch": 1626} {"train_loss": -12.232207298278809, "global_step": 273171, "epoch": 1626} {"train_loss": -12.162796020507812, "global_step": 273172, "epoch": 1626} {"train_loss": -12.115482330322266, "global_step": 273173, "epoch": 1626} {"train_loss": -12.226736068725586, "global_step": 273174, "epoch": 1626} {"train_loss": -12.02787971496582, "global_step": 273175, "epoch": 1626} {"train_loss": -12.02828598022461, "global_step": 273176, "epoch": 1626} {"train_loss": -12.449116706848145, "global_step": 273177, "epoch": 1626} {"train_loss": -11.978802680969238, "global_step": 273178, "epoch": 1626} {"train_loss": -12.064885139465332, "global_step": 273179, "epoch": 1626} {"train_loss": -11.940240859985352, "global_step": 273180, "epoch": 1626} {"train_loss": -12.322084426879883, "global_step": 273181, "epoch": 1626} {"train_loss": -12.192577362060547, "global_step": 273182, "epoch": 1626} {"train_loss": -12.213489532470703, "global_step": 273183, "epoch": 1626} {"train_loss": -12.09775447845459, "global_step": 273184, "epoch": 1626} {"train_loss": -11.987438201904297, "global_step": 273185, "epoch": 1626} {"train_loss": -11.75790786743164, "global_step": 273186, "epoch": 1626} {"train_loss": -12.213936805725098, "global_step": 273187, "epoch": 1626} {"train_loss": -12.266465187072754, "global_step": 273188, "epoch": 1626} {"train_loss": -11.942861557006836, "global_step": 273189, "epoch": 1626} {"train_loss": -11.976296424865723, "global_step": 273190, "epoch": 1626} {"train_loss": -11.722318649291992, "global_step": 273191, "epoch": 1626} {"train_loss": -12.293745994567871, "global_step": 273192, "epoch": 1626} {"train_loss": -12.104513168334961, "global_step": 273193, "epoch": 1626} {"train_loss": -12.140469551086426, "global_step": 273194, "epoch": 1626} {"train_loss": -12.227909088134766, "global_step": 273195, "epoch": 1626} {"train_loss": -11.971441268920898, "global_step": 273196, "epoch": 1626} {"train_loss": -12.172615051269531, "global_step": 273197, "epoch": 1626} {"train_loss": -12.038647651672363, "global_step": 273198, "epoch": 1626} {"train_loss": -11.648904800415039, "global_step": 273199, "epoch": 1626} {"train_loss": -12.158464431762695, "global_step": 273200, "epoch": 1626} {"train_loss": -11.767681121826172, "global_step": 273201, "epoch": 1626} {"train_loss": -11.264795303344727, "global_step": 273202, "epoch": 1626} {"train_loss": -11.698183059692383, "global_step": 273203, "epoch": 1626} {"train_loss": -11.764875411987305, "global_step": 273204, "epoch": 1626} {"train_loss": -12.197803497314453, "global_step": 273205, "epoch": 1626} {"train_loss": -11.690778732299805, "global_step": 273206, "epoch": 1626} {"train_loss": -12.282021522521973, "global_step": 273207, "epoch": 1626} {"train_loss": -11.998379707336426, "global_step": 273208, "epoch": 1626} {"train_loss": -12.048224449157715, "global_step": 273209, "epoch": 1626} {"train_loss": -12.1068115234375, "global_step": 273210, "epoch": 1626} {"train_loss": -12.266725540161133, "global_step": 273211, "epoch": 1626} {"train_loss": -12.151365280151367, "global_step": 273212, "epoch": 1626} {"train_loss": -11.98682975769043, "global_step": 273213, "epoch": 1626} {"train_loss": -11.958250999450684, "global_step": 273214, "epoch": 1626} {"train_loss": -12.229342460632324, "global_step": 273215, "epoch": 1626} {"train_loss": -12.036134719848633, "global_step": 273216, "epoch": 1626} {"train_loss": -11.853283882141113, "global_step": 273217, "epoch": 1626} {"train_loss": -12.056009292602539, "global_step": 273218, "epoch": 1626} {"train_loss": -12.059103012084961, "global_step": 273219, "epoch": 1626} {"train_loss": -12.071659088134766, "global_step": 273220, "epoch": 1626} {"train_loss": -12.418489456176758, "global_step": 273221, "epoch": 1626} {"train_loss": -11.901576042175293, "global_step": 273222, "epoch": 1626} {"train_loss": -11.582338333129883, "global_step": 273223, "epoch": 1626} {"train_loss": -12.092199325561523, "global_step": 273224, "epoch": 1626} {"train_loss": -11.757826805114746, "global_step": 273225, "epoch": 1626} {"train_loss": -11.809896469116211, "global_step": 273226, "epoch": 1626} {"train_loss": -12.076299667358398, "global_step": 273227, "epoch": 1626} {"train_loss": -11.602227210998535, "global_step": 273228, "epoch": 1626} {"train_loss": -11.863399505615234, "global_step": 273229, "epoch": 1626} {"train_loss": -11.85970687866211, "global_step": 273230, "epoch": 1626} {"train_loss": -11.89494514465332, "global_step": 273231, "epoch": 1626} {"train_loss": -11.738141059875488, "global_step": 273232, "epoch": 1626} {"train_loss": -11.630688667297363, "global_step": 273233, "epoch": 1626} {"train_loss": -11.886114120483398, "global_step": 273234, "epoch": 1626} {"train_loss": -11.277447700500488, "global_step": 273235, "epoch": 1626} {"train_loss": -11.536983489990234, "global_step": 273236, "epoch": 1626} {"train_loss": -11.79544448852539, "global_step": 273237, "epoch": 1626} {"train_loss": -11.960238456726074, "global_step": 273238, "epoch": 1626} {"train_loss": -12.04451847076416, "global_step": 273239, "epoch": 1626} {"train_loss": -11.911828994750977, "global_step": 273240, "epoch": 1626} {"train_loss": -12.022367477416992, "global_step": 273241, "epoch": 1626} {"train_loss": -12.158292770385742, "global_step": 273242, "epoch": 1626} {"train_loss": -12.031190872192383, "global_step": 273243, "epoch": 1626} {"train_loss": -11.538386344909668, "global_step": 273244, "epoch": 1626} {"train_loss": -11.127029418945312, "global_step": 273245, "epoch": 1626} {"train_loss": -11.439453125, "global_step": 273246, "epoch": 1626} {"train_loss": -11.721019744873047, "global_step": 273247, "epoch": 1626} {"train_loss": -11.505728721618652, "global_step": 273248, "epoch": 1626} {"train_loss": -11.967779159545898, "global_step": 273249, "epoch": 1626} {"train_loss": -11.384925842285156, "global_step": 273250, "epoch": 1626} {"train_loss": -11.70065689086914, "global_step": 273251, "epoch": 1626} {"train_loss": -11.203818321228027, "global_step": 273252, "epoch": 1626} {"train_loss": -10.091072082519531, "global_step": 273253, "epoch": 1626} {"train_loss": -11.033647537231445, "global_step": 273254, "epoch": 1626} {"train_loss": -9.744861602783203, "global_step": 273255, "epoch": 1626} {"train_loss": -9.068464279174805, "global_step": 273256, "epoch": 1626} {"train_loss": -9.457338333129883, "global_step": 273257, "epoch": 1626} {"train_loss": -10.836055755615234, "global_step": 273258, "epoch": 1626} {"train_loss": -8.795064926147461, "global_step": 273259, "epoch": 1626} {"train_loss": -10.428890228271484, "global_step": 273260, "epoch": 1626} {"train_loss": -10.054912567138672, "global_step": 273261, "epoch": 1626} {"train_loss": -9.60055923461914, "global_step": 273262, "epoch": 1626} {"train_loss": -10.229757308959961, "global_step": 273263, "epoch": 1626} {"train_loss": -10.195841789245605, "global_step": 273264, "epoch": 1626} {"train_loss": -11.072851181030273, "global_step": 273265, "epoch": 1626} {"train_loss": -10.675066947937012, "global_step": 273266, "epoch": 1626} {"train_loss": -11.288366317749023, "global_step": 273267, "epoch": 1626} {"train_loss": -10.691624641418457, "global_step": 273268, "epoch": 1626} {"train_loss": -11.922406196594238, "global_step": 273269, "epoch": 1626} {"train_loss": -11.442835807800293, "global_step": 273270, "epoch": 1626} {"train_loss": -11.630772590637207, "global_step": 273271, "epoch": 1626} {"train_loss": -11.556686401367188, "global_step": 273272, "epoch": 1626} {"train_loss": -11.325056076049805, "global_step": 273273, "epoch": 1626} {"train_loss": -11.845746040344238, "global_step": 273274, "epoch": 1626} {"train_loss": -11.209587097167969, "global_step": 273275, "epoch": 1626} {"train_loss": -12.055641174316406, "global_step": 273276, "epoch": 1626} {"train_loss": -11.542879104614258, "global_step": 273277, "epoch": 1626} {"train_loss": -11.672670364379883, "global_step": 273278, "epoch": 1626} {"train_loss": -11.693864822387695, "global_step": 273279, "epoch": 1626} {"train_loss": -11.561605453491211, "global_step": 273280, "epoch": 1626} {"train_loss": -11.912191390991211, "global_step": 273281, "epoch": 1626} {"train_loss": -11.779325485229492, "global_step": 273282, "epoch": 1626} {"train_loss": -11.548482894897461, "global_step": 273283, "epoch": 1626} {"train_loss": -11.819433212280273, "global_step": 273284, "epoch": 1626} {"train_loss": -11.32723617553711, "global_step": 273285, "epoch": 1626} {"train_loss": -11.83615493774414, "global_step": 273286, "epoch": 1626} {"train_loss": -11.606781005859375, "global_step": 273287, "epoch": 1626} {"train_loss": -11.785520553588867, "global_step": 273288, "epoch": 1626} {"train_loss": -11.632890701293945, "global_step": 273289, "epoch": 1626} {"train_loss": -11.59864616394043, "global_step": 273290, "epoch": 1626} {"train_loss": -11.782042503356934, "global_step": 273291, "epoch": 1626} {"train_loss": -11.85926628112793, "global_step": 273292, "epoch": 1626} {"train_loss": -11.512458801269531, "global_step": 273293, "epoch": 1626} {"train_loss": -11.912239074707031, "global_step": 273294, "epoch": 1626} {"train_loss": -11.897064208984375, "global_step": 273295, "epoch": 1626} {"train_loss": -11.93374252319336, "global_step": 273296, "epoch": 1626} {"train_loss": -11.683028221130371, "global_step": 273297, "epoch": 1626} {"train_loss": -11.601642608642578, "global_step": 273298, "epoch": 1626} {"train_loss": -12.04560661315918, "global_step": 273299, "epoch": 1626} {"train_loss": -11.943821907043457, "global_step": 273300, "epoch": 1626} {"train_loss": -12.152936935424805, "global_step": 273301, "epoch": 1626} {"train_loss": -11.853986740112305, "global_step": 273302, "epoch": 1626} {"train_loss": -11.96990966796875, "global_step": 273303, "epoch": 1626} {"train_loss": -11.864388465881348, "global_step": 273304, "epoch": 1626} {"train_loss": -12.112532615661621, "global_step": 273305, "epoch": 1626} {"train_loss": -11.928803443908691, "global_step": 273306, "epoch": 1626} {"train_loss": -12.204290390014648, "global_step": 273307, "epoch": 1626} {"train_loss": -12.09483528137207, "global_step": 273308, "epoch": 1626} {"train_loss": -11.731962203979492, "global_step": 273309, "epoch": 1626} {"train_loss": -11.796468734741211, "global_step": 273310, "epoch": 1626} {"train_loss": -11.935844421386719, "global_step": 273311, "epoch": 1626} {"train_loss": -11.667031288146973, "global_step": 273312, "epoch": 1626} {"train_loss": -11.839305877685547, "global_step": 273313, "epoch": 1626} {"train_loss": -12.17728042602539, "global_step": 273314, "epoch": 1626} {"train_loss": -11.57075023651123, "global_step": 273315, "epoch": 1626} {"train_loss": -12.130578994750977, "global_step": 273316, "epoch": 1626} {"train_loss": -12.172906875610352, "global_step": 273317, "epoch": 1626} {"train_loss": -12.05057144165039, "global_step": 273318, "epoch": 1626} {"train_loss": -11.7720365524292, "global_step": 273319, "epoch": 1626} {"train_loss": -11.99410629272461, "global_step": 273320, "epoch": 1626} {"train_loss": -11.872944831848145, "global_step": 273321, "epoch": 1626} {"train_loss": -12.042407989501953, "global_step": 273322, "epoch": 1626} {"train_loss": -12.049224853515625, "global_step": 273323, "epoch": 1626} {"train_loss": -11.895462036132812, "global_step": 273324, "epoch": 1626} {"train_loss": -11.920696258544922, "global_step": 273325, "epoch": 1626} {"train_loss": -11.978246688842773, "global_step": 273326, "epoch": 1626} {"train_loss": -11.456533432006836, "global_step": 273327, "epoch": 1626} {"train_loss": -12.173980712890625, "global_step": 273328, "epoch": 1626} {"train_loss": -11.621145248413086, "global_step": 273329, "epoch": 1626} {"train_loss": -11.767443656921387, "global_step": 273330, "epoch": 1626} {"train_loss": -11.879913330078125, "global_step": 273331, "epoch": 1626} {"train_loss": -11.956212997436523, "global_step": 273332, "epoch": 1626} {"train_loss": -11.87995719909668, "global_step": 273333, "epoch": 1626} {"train_loss": -12.092188835144043, "global_step": 273334, "epoch": 1626} {"train_loss": -11.72108032589867, "global_step": 273335, "epoch": 1626, "val_loss": 265478.46875} {"train_loss": -12.059869766235352, "global_step": 273336, "epoch": 1627} {"train_loss": -11.817159652709961, "global_step": 273337, "epoch": 1627} {"train_loss": -12.014385223388672, "global_step": 273338, "epoch": 1627} {"train_loss": -12.034839630126953, "global_step": 273339, "epoch": 1627} {"train_loss": -11.705789566040039, "global_step": 273340, "epoch": 1627} {"train_loss": -11.705070495605469, "global_step": 273341, "epoch": 1627} {"train_loss": -11.788787841796875, "global_step": 273342, "epoch": 1627} {"train_loss": -11.494025230407715, "global_step": 273343, "epoch": 1627} {"train_loss": -11.831912994384766, "global_step": 273344, "epoch": 1627} {"train_loss": -12.027084350585938, "global_step": 273345, "epoch": 1627} {"train_loss": -11.613982200622559, "global_step": 273346, "epoch": 1627} {"train_loss": -12.261313438415527, "global_step": 273347, "epoch": 1627} {"train_loss": -11.404325485229492, "global_step": 273348, "epoch": 1627} {"train_loss": -11.693305969238281, "global_step": 273349, "epoch": 1627} {"train_loss": -11.742691993713379, "global_step": 273350, "epoch": 1627} {"train_loss": -11.992240905761719, "global_step": 273351, "epoch": 1627} {"train_loss": -11.517057418823242, "global_step": 273352, "epoch": 1627} {"train_loss": -12.194253921508789, "global_step": 273353, "epoch": 1627} {"train_loss": -11.195928573608398, "global_step": 273354, "epoch": 1627} {"train_loss": -12.030832290649414, "global_step": 273355, "epoch": 1627} {"train_loss": -11.225228309631348, "global_step": 273356, "epoch": 1627} {"train_loss": -11.877334594726562, "global_step": 273357, "epoch": 1627} {"train_loss": -11.579643249511719, "global_step": 273358, "epoch": 1627} {"train_loss": -12.03618049621582, "global_step": 273359, "epoch": 1627} {"train_loss": -11.384380340576172, "global_step": 273360, "epoch": 1627} {"train_loss": -11.659967422485352, "global_step": 273361, "epoch": 1627} {"train_loss": -11.44073486328125, "global_step": 273362, "epoch": 1627} {"train_loss": -11.8297119140625, "global_step": 273363, "epoch": 1627} {"train_loss": -11.77739429473877, "global_step": 273364, "epoch": 1627} {"train_loss": -11.649614334106445, "global_step": 273365, "epoch": 1627} {"train_loss": -11.766592025756836, "global_step": 273366, "epoch": 1627} {"train_loss": -11.697158813476562, "global_step": 273367, "epoch": 1627} {"train_loss": -12.024808883666992, "global_step": 273368, "epoch": 1627} {"train_loss": -11.839109420776367, "global_step": 273369, "epoch": 1627} {"train_loss": -11.812246322631836, "global_step": 273370, "epoch": 1627} {"train_loss": -11.721385955810547, "global_step": 273371, "epoch": 1627} {"train_loss": -11.890107154846191, "global_step": 273372, "epoch": 1627} {"train_loss": -11.05278205871582, "global_step": 273373, "epoch": 1627} {"train_loss": -11.904304504394531, "global_step": 273374, "epoch": 1627} {"train_loss": -11.464778900146484, "global_step": 273375, "epoch": 1627} {"train_loss": -11.590841293334961, "global_step": 273376, "epoch": 1627} {"train_loss": -11.549982070922852, "global_step": 273377, "epoch": 1627} {"train_loss": -12.104217529296875, "global_step": 273378, "epoch": 1627} {"train_loss": -11.477731704711914, "global_step": 273379, "epoch": 1627} {"train_loss": -12.104269027709961, "global_step": 273380, "epoch": 1627} {"train_loss": -11.037269592285156, "global_step": 273381, "epoch": 1627} {"train_loss": -11.835578918457031, "global_step": 273382, "epoch": 1627} {"train_loss": -11.5451078414917, "global_step": 273383, "epoch": 1627} {"train_loss": -11.520807266235352, "global_step": 273384, "epoch": 1627} {"train_loss": -11.413956642150879, "global_step": 273385, "epoch": 1627} {"train_loss": -11.762897491455078, "global_step": 273386, "epoch": 1627} {"train_loss": -11.361129760742188, "global_step": 273387, "epoch": 1627} {"train_loss": -11.550909042358398, "global_step": 273388, "epoch": 1627} {"train_loss": -11.784887313842773, "global_step": 273389, "epoch": 1627} {"train_loss": -11.676546096801758, "global_step": 273390, "epoch": 1627} {"train_loss": -11.701109886169434, "global_step": 273391, "epoch": 1627} {"train_loss": -11.312833786010742, "global_step": 273392, "epoch": 1627} {"train_loss": -11.640788078308105, "global_step": 273393, "epoch": 1627} {"train_loss": -11.393486022949219, "global_step": 273394, "epoch": 1627} {"train_loss": -11.514215469360352, "global_step": 273395, "epoch": 1627} {"train_loss": -11.243053436279297, "global_step": 273396, "epoch": 1627} {"train_loss": -11.342039108276367, "global_step": 273397, "epoch": 1627} {"train_loss": -11.569511413574219, "global_step": 273398, "epoch": 1627} {"train_loss": -11.47160530090332, "global_step": 273399, "epoch": 1627} {"train_loss": -11.714346885681152, "global_step": 273400, "epoch": 1627} {"train_loss": -11.602253913879395, "global_step": 273401, "epoch": 1627} {"train_loss": -11.74327278137207, "global_step": 273402, "epoch": 1627} {"train_loss": -10.507444381713867, "global_step": 273403, "epoch": 1627} {"train_loss": -11.823023796081543, "global_step": 273404, "epoch": 1627} {"train_loss": -10.928030014038086, "global_step": 273405, "epoch": 1627} {"train_loss": -11.785993576049805, "global_step": 273406, "epoch": 1627} {"train_loss": -11.823902130126953, "global_step": 273407, "epoch": 1627} {"train_loss": -11.691718101501465, "global_step": 273408, "epoch": 1627} {"train_loss": -11.794654846191406, "global_step": 273409, "epoch": 1627} {"train_loss": -11.613222122192383, "global_step": 273410, "epoch": 1627} {"train_loss": -12.162691116333008, "global_step": 273411, "epoch": 1627} {"train_loss": -11.935626983642578, "global_step": 273412, "epoch": 1627} {"train_loss": -11.833786010742188, "global_step": 273413, "epoch": 1627} {"train_loss": -11.79037094116211, "global_step": 273414, "epoch": 1627} {"train_loss": -11.796747207641602, "global_step": 273415, "epoch": 1627} {"train_loss": -11.841196060180664, "global_step": 273416, "epoch": 1627} {"train_loss": -11.778203010559082, "global_step": 273417, "epoch": 1627} {"train_loss": -11.557251930236816, "global_step": 273418, "epoch": 1627} {"train_loss": -11.95291519165039, "global_step": 273419, "epoch": 1627} {"train_loss": -11.967327117919922, "global_step": 273420, "epoch": 1627} {"train_loss": -11.934526443481445, "global_step": 273421, "epoch": 1627} {"train_loss": -11.946242332458496, "global_step": 273422, "epoch": 1627} {"train_loss": -11.94326400756836, "global_step": 273423, "epoch": 1627} {"train_loss": -12.109037399291992, "global_step": 273424, "epoch": 1627} {"train_loss": -11.932744979858398, "global_step": 273425, "epoch": 1627} {"train_loss": -11.966886520385742, "global_step": 273426, "epoch": 1627} {"train_loss": -11.941658020019531, "global_step": 273427, "epoch": 1627} {"train_loss": -12.11549186706543, "global_step": 273428, "epoch": 1627} {"train_loss": -11.94898796081543, "global_step": 273429, "epoch": 1627} {"train_loss": -11.837732315063477, "global_step": 273430, "epoch": 1627} {"train_loss": -12.034235000610352, "global_step": 273431, "epoch": 1627} {"train_loss": -12.00057315826416, "global_step": 273432, "epoch": 1627} {"train_loss": -11.933547973632812, "global_step": 273433, "epoch": 1627} {"train_loss": -12.145153045654297, "global_step": 273434, "epoch": 1627} {"train_loss": -11.922836303710938, "global_step": 273435, "epoch": 1627} {"train_loss": -11.819727897644043, "global_step": 273436, "epoch": 1627} {"train_loss": -12.237728118896484, "global_step": 273437, "epoch": 1627} {"train_loss": -11.7769136428833, "global_step": 273438, "epoch": 1627} {"train_loss": -11.607890129089355, "global_step": 273439, "epoch": 1627} {"train_loss": -12.060959815979004, "global_step": 273440, "epoch": 1627} {"train_loss": -11.616868019104004, "global_step": 273441, "epoch": 1627} {"train_loss": -11.950603485107422, "global_step": 273442, "epoch": 1627} {"train_loss": -12.005252838134766, "global_step": 273443, "epoch": 1627} {"train_loss": -11.670522689819336, "global_step": 273444, "epoch": 1627} {"train_loss": -11.7806396484375, "global_step": 273445, "epoch": 1627} {"train_loss": -12.008539199829102, "global_step": 273446, "epoch": 1627} {"train_loss": -11.310460090637207, "global_step": 273447, "epoch": 1627} {"train_loss": -11.796334266662598, "global_step": 273448, "epoch": 1627} {"train_loss": -12.060155868530273, "global_step": 273449, "epoch": 1627} {"train_loss": -11.764835357666016, "global_step": 273450, "epoch": 1627} {"train_loss": -12.250877380371094, "global_step": 273451, "epoch": 1627} {"train_loss": -11.234875679016113, "global_step": 273452, "epoch": 1627} {"train_loss": -11.60484790802002, "global_step": 273453, "epoch": 1627} {"train_loss": -11.180435180664062, "global_step": 273454, "epoch": 1627} {"train_loss": -11.739352226257324, "global_step": 273455, "epoch": 1627} {"train_loss": -11.92645263671875, "global_step": 273456, "epoch": 1627} {"train_loss": -11.801570892333984, "global_step": 273457, "epoch": 1627} {"train_loss": -11.879119873046875, "global_step": 273458, "epoch": 1627} {"train_loss": -11.899141311645508, "global_step": 273459, "epoch": 1627} {"train_loss": -11.78490924835205, "global_step": 273460, "epoch": 1627} {"train_loss": -12.235398292541504, "global_step": 273461, "epoch": 1627} {"train_loss": -11.471517562866211, "global_step": 273462, "epoch": 1627} {"train_loss": -12.052373886108398, "global_step": 273463, "epoch": 1627} {"train_loss": -12.190224647521973, "global_step": 273464, "epoch": 1627} {"train_loss": -11.731895446777344, "global_step": 273465, "epoch": 1627} {"train_loss": -12.043466567993164, "global_step": 273466, "epoch": 1627} {"train_loss": -12.148632049560547, "global_step": 273467, "epoch": 1627} {"train_loss": -11.826116561889648, "global_step": 273468, "epoch": 1627} {"train_loss": -12.285628318786621, "global_step": 273469, "epoch": 1627} {"train_loss": -12.061380386352539, "global_step": 273470, "epoch": 1627} {"train_loss": -11.128636360168457, "global_step": 273471, "epoch": 1627} {"train_loss": -12.1571626663208, "global_step": 273472, "epoch": 1627} {"train_loss": -11.896100044250488, "global_step": 273473, "epoch": 1627} {"train_loss": -11.783329963684082, "global_step": 273474, "epoch": 1627} {"train_loss": -11.805023193359375, "global_step": 273475, "epoch": 1627} {"train_loss": -11.170065879821777, "global_step": 273476, "epoch": 1627} {"train_loss": -11.621505737304688, "global_step": 273477, "epoch": 1627} {"train_loss": -12.172904014587402, "global_step": 273478, "epoch": 1627} {"train_loss": -11.08399772644043, "global_step": 273479, "epoch": 1627} {"train_loss": -12.265893936157227, "global_step": 273480, "epoch": 1627} {"train_loss": -11.784421920776367, "global_step": 273481, "epoch": 1627} {"train_loss": -11.923373222351074, "global_step": 273482, "epoch": 1627} {"train_loss": -11.968649864196777, "global_step": 273483, "epoch": 1627} {"train_loss": -11.349514961242676, "global_step": 273484, "epoch": 1627} {"train_loss": -12.139650344848633, "global_step": 273485, "epoch": 1627} {"train_loss": -11.698474884033203, "global_step": 273486, "epoch": 1627} {"train_loss": -11.894944190979004, "global_step": 273487, "epoch": 1627} {"train_loss": -12.021743774414062, "global_step": 273488, "epoch": 1627} {"train_loss": -11.821221351623535, "global_step": 273489, "epoch": 1627} {"train_loss": -11.82754135131836, "global_step": 273490, "epoch": 1627} {"train_loss": -12.271729469299316, "global_step": 273491, "epoch": 1627} {"train_loss": -11.882887840270996, "global_step": 273492, "epoch": 1627} {"train_loss": -12.349905014038086, "global_step": 273493, "epoch": 1627} {"train_loss": -11.879737854003906, "global_step": 273494, "epoch": 1627} {"train_loss": -11.60598373413086, "global_step": 273495, "epoch": 1627} {"train_loss": -12.192232131958008, "global_step": 273496, "epoch": 1627} {"train_loss": -11.617515563964844, "global_step": 273497, "epoch": 1627} {"train_loss": -12.152502059936523, "global_step": 273498, "epoch": 1627} {"train_loss": -11.965560913085938, "global_step": 273499, "epoch": 1627} {"train_loss": -11.503734588623047, "global_step": 273500, "epoch": 1627} {"train_loss": -12.389114379882812, "global_step": 273501, "epoch": 1627} {"train_loss": -11.865304946899414, "global_step": 273502, "epoch": 1627} {"train_loss": -11.779018175034295, "global_step": 273503, "epoch": 1627, "val_loss": 270381.40625} {"train_loss": -11.956427574157715, "global_step": 273504, "epoch": 1628} {"train_loss": -12.12218189239502, "global_step": 273505, "epoch": 1628} {"train_loss": -12.42885971069336, "global_step": 273506, "epoch": 1628} {"train_loss": -12.008715629577637, "global_step": 273507, "epoch": 1628} {"train_loss": -12.088520050048828, "global_step": 273508, "epoch": 1628} {"train_loss": -11.989818572998047, "global_step": 273509, "epoch": 1628} {"train_loss": -12.029511451721191, "global_step": 273510, "epoch": 1628} {"train_loss": -12.17497444152832, "global_step": 273511, "epoch": 1628} {"train_loss": -11.962485313415527, "global_step": 273512, "epoch": 1628} {"train_loss": -12.399785995483398, "global_step": 273513, "epoch": 1628} {"train_loss": -12.047987937927246, "global_step": 273514, "epoch": 1628} {"train_loss": -12.085081100463867, "global_step": 273515, "epoch": 1628} {"train_loss": -12.208175659179688, "global_step": 273516, "epoch": 1628} {"train_loss": -11.905450820922852, "global_step": 273517, "epoch": 1628} {"train_loss": -11.701509475708008, "global_step": 273518, "epoch": 1628} {"train_loss": -11.784395217895508, "global_step": 273519, "epoch": 1628} {"train_loss": -11.964694023132324, "global_step": 273520, "epoch": 1628} {"train_loss": -11.758668899536133, "global_step": 273521, "epoch": 1628} {"train_loss": -11.600746154785156, "global_step": 273522, "epoch": 1628} {"train_loss": -11.364705085754395, "global_step": 273523, "epoch": 1628} {"train_loss": -12.017131805419922, "global_step": 273524, "epoch": 1628} {"train_loss": -11.219233512878418, "global_step": 273525, "epoch": 1628} {"train_loss": -11.426551818847656, "global_step": 273526, "epoch": 1628} {"train_loss": -11.175726890563965, "global_step": 273527, "epoch": 1628} {"train_loss": -11.336807250976562, "global_step": 273528, "epoch": 1628} {"train_loss": -11.586271286010742, "global_step": 273529, "epoch": 1628} {"train_loss": -11.283132553100586, "global_step": 273530, "epoch": 1628} {"train_loss": -11.046892166137695, "global_step": 273531, "epoch": 1628} {"train_loss": -11.82261848449707, "global_step": 273532, "epoch": 1628} {"train_loss": -10.915943145751953, "global_step": 273533, "epoch": 1628} {"train_loss": -10.870189666748047, "global_step": 273534, "epoch": 1628} {"train_loss": -11.580065727233887, "global_step": 273535, "epoch": 1628} {"train_loss": -10.875499725341797, "global_step": 273536, "epoch": 1628} {"train_loss": -11.744152069091797, "global_step": 273537, "epoch": 1628} {"train_loss": -10.837108612060547, "global_step": 273538, "epoch": 1628} {"train_loss": -11.612004280090332, "global_step": 273539, "epoch": 1628} {"train_loss": -11.213159561157227, "global_step": 273540, "epoch": 1628} {"train_loss": -10.810081481933594, "global_step": 273541, "epoch": 1628} {"train_loss": -11.694831848144531, "global_step": 273542, "epoch": 1628} {"train_loss": -10.573713302612305, "global_step": 273543, "epoch": 1628} {"train_loss": -11.542431831359863, "global_step": 273544, "epoch": 1628} {"train_loss": -10.800335884094238, "global_step": 273545, "epoch": 1628} {"train_loss": -10.583925247192383, "global_step": 273546, "epoch": 1628} {"train_loss": -10.066530227661133, "global_step": 273547, "epoch": 1628} {"train_loss": -11.381010055541992, "global_step": 273548, "epoch": 1628} {"train_loss": -10.200692176818848, "global_step": 273549, "epoch": 1628} {"train_loss": -10.399062156677246, "global_step": 273550, "epoch": 1628} {"train_loss": -11.054766654968262, "global_step": 273551, "epoch": 1628} {"train_loss": -10.389263153076172, "global_step": 273552, "epoch": 1628} {"train_loss": -11.883251190185547, "global_step": 273553, "epoch": 1628} {"train_loss": -10.393882751464844, "global_step": 273554, "epoch": 1628} {"train_loss": -9.490461349487305, "global_step": 273555, "epoch": 1628} {"train_loss": -11.133155822753906, "global_step": 273556, "epoch": 1628} {"train_loss": -10.046907424926758, "global_step": 273557, "epoch": 1628} {"train_loss": -10.913125991821289, "global_step": 273558, "epoch": 1628} {"train_loss": -11.67580795288086, "global_step": 273559, "epoch": 1628} {"train_loss": -10.359521865844727, "global_step": 273560, "epoch": 1628} {"train_loss": -11.409236907958984, "global_step": 273561, "epoch": 1628} {"train_loss": -10.942174911499023, "global_step": 273562, "epoch": 1628} {"train_loss": -11.024944305419922, "global_step": 273563, "epoch": 1628} {"train_loss": -11.71681022644043, "global_step": 273564, "epoch": 1628} {"train_loss": -10.978716850280762, "global_step": 273565, "epoch": 1628} {"train_loss": -11.588876724243164, "global_step": 273566, "epoch": 1628} {"train_loss": -11.241660118103027, "global_step": 273567, "epoch": 1628} {"train_loss": -11.481413841247559, "global_step": 273568, "epoch": 1628} {"train_loss": -11.413853645324707, "global_step": 273569, "epoch": 1628} {"train_loss": -11.343807220458984, "global_step": 273570, "epoch": 1628} {"train_loss": -11.331538200378418, "global_step": 273571, "epoch": 1628} {"train_loss": -10.89443588256836, "global_step": 273572, "epoch": 1628} {"train_loss": -11.527839660644531, "global_step": 273573, "epoch": 1628} {"train_loss": -10.736297607421875, "global_step": 273574, "epoch": 1628} {"train_loss": -11.626996994018555, "global_step": 273575, "epoch": 1628} {"train_loss": -10.970756530761719, "global_step": 273576, "epoch": 1628} {"train_loss": -11.714351654052734, "global_step": 273577, "epoch": 1628} {"train_loss": -11.279168128967285, "global_step": 273578, "epoch": 1628} {"train_loss": -11.34154987335205, "global_step": 273579, "epoch": 1628} {"train_loss": -11.510225296020508, "global_step": 273580, "epoch": 1628} {"train_loss": -11.64846420288086, "global_step": 273581, "epoch": 1628} {"train_loss": -11.677927017211914, "global_step": 273582, "epoch": 1628} {"train_loss": -12.044869422912598, "global_step": 273583, "epoch": 1628} {"train_loss": -11.636309623718262, "global_step": 273584, "epoch": 1628} {"train_loss": -11.705867767333984, "global_step": 273585, "epoch": 1628} {"train_loss": -11.906503677368164, "global_step": 273586, "epoch": 1628} {"train_loss": -11.66588020324707, "global_step": 273587, "epoch": 1628} {"train_loss": -11.812883377075195, "global_step": 273588, "epoch": 1628} {"train_loss": -11.846756935119629, "global_step": 273589, "epoch": 1628} {"train_loss": -11.701465606689453, "global_step": 273590, "epoch": 1628} {"train_loss": -11.866783142089844, "global_step": 273591, "epoch": 1628} {"train_loss": -11.467123031616211, "global_step": 273592, "epoch": 1628} {"train_loss": -11.583282470703125, "global_step": 273593, "epoch": 1628} {"train_loss": -11.4981107711792, "global_step": 273594, "epoch": 1628} {"train_loss": -11.56277847290039, "global_step": 273595, "epoch": 1628} {"train_loss": -11.347332000732422, "global_step": 273596, "epoch": 1628} {"train_loss": -11.382932662963867, "global_step": 273597, "epoch": 1628} {"train_loss": -10.958331108093262, "global_step": 273598, "epoch": 1628} {"train_loss": -11.374418258666992, "global_step": 273599, "epoch": 1628} {"train_loss": -11.005367279052734, "global_step": 273600, "epoch": 1628} {"train_loss": -11.512332916259766, "global_step": 273601, "epoch": 1628} {"train_loss": -10.958229064941406, "global_step": 273602, "epoch": 1628} {"train_loss": -11.412328720092773, "global_step": 273603, "epoch": 1628} {"train_loss": -10.875377655029297, "global_step": 273604, "epoch": 1628} {"train_loss": -12.131820678710938, "global_step": 273605, "epoch": 1628} {"train_loss": -11.009590148925781, "global_step": 273606, "epoch": 1628} {"train_loss": -11.914386749267578, "global_step": 273607, "epoch": 1628} {"train_loss": -11.436851501464844, "global_step": 273608, "epoch": 1628} {"train_loss": -11.639673233032227, "global_step": 273609, "epoch": 1628} {"train_loss": -11.455934524536133, "global_step": 273610, "epoch": 1628} {"train_loss": -11.760878562927246, "global_step": 273611, "epoch": 1628} {"train_loss": -11.272984504699707, "global_step": 273612, "epoch": 1628} {"train_loss": -11.867025375366211, "global_step": 273613, "epoch": 1628} {"train_loss": -11.663777351379395, "global_step": 273614, "epoch": 1628} {"train_loss": -11.677796363830566, "global_step": 273615, "epoch": 1628} {"train_loss": -11.510519981384277, "global_step": 273616, "epoch": 1628} {"train_loss": -11.93801498413086, "global_step": 273617, "epoch": 1628} {"train_loss": -11.75883674621582, "global_step": 273618, "epoch": 1628} {"train_loss": -11.72026252746582, "global_step": 273619, "epoch": 1628} {"train_loss": -11.871271133422852, "global_step": 273620, "epoch": 1628} {"train_loss": -11.597359657287598, "global_step": 273621, "epoch": 1628} {"train_loss": -12.039254188537598, "global_step": 273622, "epoch": 1628} {"train_loss": -11.597524642944336, "global_step": 273623, "epoch": 1628} {"train_loss": -11.797388076782227, "global_step": 273624, "epoch": 1628} {"train_loss": -11.813796043395996, "global_step": 273625, "epoch": 1628} {"train_loss": -12.000646591186523, "global_step": 273626, "epoch": 1628} {"train_loss": -11.860527038574219, "global_step": 273627, "epoch": 1628} {"train_loss": -11.953409194946289, "global_step": 273628, "epoch": 1628} {"train_loss": -11.961578369140625, "global_step": 273629, "epoch": 1628} {"train_loss": -11.973489761352539, "global_step": 273630, "epoch": 1628} {"train_loss": -11.81027603149414, "global_step": 273631, "epoch": 1628} {"train_loss": -11.984085083007812, "global_step": 273632, "epoch": 1628} {"train_loss": -11.631792068481445, "global_step": 273633, "epoch": 1628} {"train_loss": -12.197000503540039, "global_step": 273634, "epoch": 1628} {"train_loss": -11.921411514282227, "global_step": 273635, "epoch": 1628} {"train_loss": -12.016054153442383, "global_step": 273636, "epoch": 1628} {"train_loss": -12.005300521850586, "global_step": 273637, "epoch": 1628} {"train_loss": -11.968061447143555, "global_step": 273638, "epoch": 1628} {"train_loss": -12.036758422851562, "global_step": 273639, "epoch": 1628} {"train_loss": -12.054412841796875, "global_step": 273640, "epoch": 1628} {"train_loss": -12.193626403808594, "global_step": 273641, "epoch": 1628} {"train_loss": -11.715627670288086, "global_step": 273642, "epoch": 1628} {"train_loss": -12.004682540893555, "global_step": 273643, "epoch": 1628} {"train_loss": -11.79952621459961, "global_step": 273644, "epoch": 1628} {"train_loss": -12.084970474243164, "global_step": 273645, "epoch": 1628} {"train_loss": -12.247840881347656, "global_step": 273646, "epoch": 1628} {"train_loss": -12.123725891113281, "global_step": 273647, "epoch": 1628} {"train_loss": -12.26742935180664, "global_step": 273648, "epoch": 1628} {"train_loss": -12.394746780395508, "global_step": 273649, "epoch": 1628} {"train_loss": -12.188570976257324, "global_step": 273650, "epoch": 1628} {"train_loss": -12.353992462158203, "global_step": 273651, "epoch": 1628} {"train_loss": -12.28347396850586, "global_step": 273652, "epoch": 1628} {"train_loss": -12.298882484436035, "global_step": 273653, "epoch": 1628} {"train_loss": -12.099077224731445, "global_step": 273654, "epoch": 1628} {"train_loss": -12.253386497497559, "global_step": 273655, "epoch": 1628} {"train_loss": -12.249011039733887, "global_step": 273656, "epoch": 1628} {"train_loss": -12.15471076965332, "global_step": 273657, "epoch": 1628} {"train_loss": -12.296056747436523, "global_step": 273658, "epoch": 1628} {"train_loss": -12.27859115600586, "global_step": 273659, "epoch": 1628} {"train_loss": -12.263774871826172, "global_step": 273660, "epoch": 1628} {"train_loss": -12.288694381713867, "global_step": 273661, "epoch": 1628} {"train_loss": -12.116159439086914, "global_step": 273662, "epoch": 1628} {"train_loss": -12.080255508422852, "global_step": 273663, "epoch": 1628} {"train_loss": -12.088600158691406, "global_step": 273664, "epoch": 1628} {"train_loss": -12.234542846679688, "global_step": 273665, "epoch": 1628} {"train_loss": -11.996634483337402, "global_step": 273666, "epoch": 1628} {"train_loss": -12.227457046508789, "global_step": 273667, "epoch": 1628} {"train_loss": -12.296195983886719, "global_step": 273668, "epoch": 1628} {"train_loss": -12.263951301574707, "global_step": 273669, "epoch": 1628} {"train_loss": -12.407096862792969, "global_step": 273670, "epoch": 1628} {"train_loss": -11.624656319618225, "global_step": 273671, "epoch": 1628, "val_loss": 272391.125} {"train_loss": -12.083413124084473, "global_step": 273672, "epoch": 1629} {"train_loss": -12.354223251342773, "global_step": 273673, "epoch": 1629} {"train_loss": -11.928085327148438, "global_step": 273674, "epoch": 1629} {"train_loss": -12.114999771118164, "global_step": 273675, "epoch": 1629} {"train_loss": -11.978521347045898, "global_step": 273676, "epoch": 1629} {"train_loss": -11.845830917358398, "global_step": 273677, "epoch": 1629} {"train_loss": -11.515983581542969, "global_step": 273678, "epoch": 1629} {"train_loss": -12.251707077026367, "global_step": 273679, "epoch": 1629} {"train_loss": -11.885555267333984, "global_step": 273680, "epoch": 1629} {"train_loss": -11.3729248046875, "global_step": 273681, "epoch": 1629} {"train_loss": -11.503814697265625, "global_step": 273682, "epoch": 1629} {"train_loss": -10.675448417663574, "global_step": 273683, "epoch": 1629} {"train_loss": -11.205479621887207, "global_step": 273684, "epoch": 1629} {"train_loss": -10.689672470092773, "global_step": 273685, "epoch": 1629} {"train_loss": -12.0970458984375, "global_step": 273686, "epoch": 1629} {"train_loss": -11.359030723571777, "global_step": 273687, "epoch": 1629} {"train_loss": -11.436073303222656, "global_step": 273688, "epoch": 1629} {"train_loss": -11.032584190368652, "global_step": 273689, "epoch": 1629} {"train_loss": -10.985115051269531, "global_step": 273690, "epoch": 1629} {"train_loss": -10.62779426574707, "global_step": 273691, "epoch": 1629} {"train_loss": -12.03473949432373, "global_step": 273692, "epoch": 1629} {"train_loss": -10.9646577835083, "global_step": 273693, "epoch": 1629} {"train_loss": -12.115079879760742, "global_step": 273694, "epoch": 1629} {"train_loss": -10.773778915405273, "global_step": 273695, "epoch": 1629} {"train_loss": -12.048531532287598, "global_step": 273696, "epoch": 1629} {"train_loss": -11.321876525878906, "global_step": 273697, "epoch": 1629} {"train_loss": -11.833930969238281, "global_step": 273698, "epoch": 1629} {"train_loss": -11.309343338012695, "global_step": 273699, "epoch": 1629} {"train_loss": -11.464376449584961, "global_step": 273700, "epoch": 1629} {"train_loss": -11.811701774597168, "global_step": 273701, "epoch": 1629} {"train_loss": -10.937187194824219, "global_step": 273702, "epoch": 1629} {"train_loss": -11.964391708374023, "global_step": 273703, "epoch": 1629} {"train_loss": -11.202213287353516, "global_step": 273704, "epoch": 1629} {"train_loss": -11.889617919921875, "global_step": 273705, "epoch": 1629} {"train_loss": -11.449982643127441, "global_step": 273706, "epoch": 1629} {"train_loss": -10.847171783447266, "global_step": 273707, "epoch": 1629} {"train_loss": -11.348737716674805, "global_step": 273708, "epoch": 1629} {"train_loss": -10.507160186767578, "global_step": 273709, "epoch": 1629} {"train_loss": -11.10781478881836, "global_step": 273710, "epoch": 1629} {"train_loss": -11.083019256591797, "global_step": 273711, "epoch": 1629} {"train_loss": -11.142965316772461, "global_step": 273712, "epoch": 1629} {"train_loss": -11.35155200958252, "global_step": 273713, "epoch": 1629} {"train_loss": -11.220272064208984, "global_step": 273714, "epoch": 1629} {"train_loss": -11.72873306274414, "global_step": 273715, "epoch": 1629} {"train_loss": -10.889890670776367, "global_step": 273716, "epoch": 1629} {"train_loss": -11.003946304321289, "global_step": 273717, "epoch": 1629} {"train_loss": -11.838479995727539, "global_step": 273718, "epoch": 1629} {"train_loss": -10.85633659362793, "global_step": 273719, "epoch": 1629} {"train_loss": -11.681108474731445, "global_step": 273720, "epoch": 1629} {"train_loss": -11.119048118591309, "global_step": 273721, "epoch": 1629} {"train_loss": -9.916401863098145, "global_step": 273722, "epoch": 1629} {"train_loss": -11.925414085388184, "global_step": 273723, "epoch": 1629} {"train_loss": -10.760201454162598, "global_step": 273724, "epoch": 1629} {"train_loss": -11.710620880126953, "global_step": 273725, "epoch": 1629} {"train_loss": -11.46071720123291, "global_step": 273726, "epoch": 1629} {"train_loss": -11.302332878112793, "global_step": 273727, "epoch": 1629} {"train_loss": -11.758079528808594, "global_step": 273728, "epoch": 1629} {"train_loss": -11.416141510009766, "global_step": 273729, "epoch": 1629} {"train_loss": -11.347322463989258, "global_step": 273730, "epoch": 1629} {"train_loss": -11.931018829345703, "global_step": 273731, "epoch": 1629} {"train_loss": -11.269336700439453, "global_step": 273732, "epoch": 1629} {"train_loss": -11.66126537322998, "global_step": 273733, "epoch": 1629} {"train_loss": -11.933780670166016, "global_step": 273734, "epoch": 1629} {"train_loss": -11.000667572021484, "global_step": 273735, "epoch": 1629} {"train_loss": -11.600414276123047, "global_step": 273736, "epoch": 1629} {"train_loss": -11.93526840209961, "global_step": 273737, "epoch": 1629} {"train_loss": -10.852322578430176, "global_step": 273738, "epoch": 1629} {"train_loss": -11.28781509399414, "global_step": 273739, "epoch": 1629} {"train_loss": -11.309682846069336, "global_step": 273740, "epoch": 1629} {"train_loss": -10.870613098144531, "global_step": 273741, "epoch": 1629} {"train_loss": -11.699068069458008, "global_step": 273742, "epoch": 1629} {"train_loss": -11.372163772583008, "global_step": 273743, "epoch": 1629} {"train_loss": -10.799566268920898, "global_step": 273744, "epoch": 1629} {"train_loss": -11.495500564575195, "global_step": 273745, "epoch": 1629} {"train_loss": -11.238542556762695, "global_step": 273746, "epoch": 1629} {"train_loss": -11.69827651977539, "global_step": 273747, "epoch": 1629} {"train_loss": -11.311731338500977, "global_step": 273748, "epoch": 1629} {"train_loss": -11.935810089111328, "global_step": 273749, "epoch": 1629} {"train_loss": -11.57696533203125, "global_step": 273750, "epoch": 1629} {"train_loss": -11.674407958984375, "global_step": 273751, "epoch": 1629} {"train_loss": -11.760553359985352, "global_step": 273752, "epoch": 1629} {"train_loss": -11.614968299865723, "global_step": 273753, "epoch": 1629} {"train_loss": -11.648500442504883, "global_step": 273754, "epoch": 1629} {"train_loss": -11.975944519042969, "global_step": 273755, "epoch": 1629} {"train_loss": -11.583006858825684, "global_step": 273756, "epoch": 1629} {"train_loss": -12.028121948242188, "global_step": 273757, "epoch": 1629} {"train_loss": -11.52200698852539, "global_step": 273758, "epoch": 1629} {"train_loss": -11.60470962524414, "global_step": 273759, "epoch": 1629} {"train_loss": -12.0487060546875, "global_step": 273760, "epoch": 1629} {"train_loss": -11.951787948608398, "global_step": 273761, "epoch": 1629} {"train_loss": -11.785123825073242, "global_step": 273762, "epoch": 1629} {"train_loss": -12.037102699279785, "global_step": 273763, "epoch": 1629} {"train_loss": -11.885642051696777, "global_step": 273764, "epoch": 1629} {"train_loss": -11.610279083251953, "global_step": 273765, "epoch": 1629} {"train_loss": -12.010287284851074, "global_step": 273766, "epoch": 1629} {"train_loss": -12.09117603302002, "global_step": 273767, "epoch": 1629} {"train_loss": -12.045248031616211, "global_step": 273768, "epoch": 1629} {"train_loss": -12.369447708129883, "global_step": 273769, "epoch": 1629} {"train_loss": -12.154226303100586, "global_step": 273770, "epoch": 1629} {"train_loss": -12.070454597473145, "global_step": 273771, "epoch": 1629} {"train_loss": -12.234789848327637, "global_step": 273772, "epoch": 1629} {"train_loss": -12.204070091247559, "global_step": 273773, "epoch": 1629} {"train_loss": -12.21250057220459, "global_step": 273774, "epoch": 1629} {"train_loss": -12.067591667175293, "global_step": 273775, "epoch": 1629} {"train_loss": -12.185050964355469, "global_step": 273776, "epoch": 1629} {"train_loss": -12.143128395080566, "global_step": 273777, "epoch": 1629} {"train_loss": -12.321493148803711, "global_step": 273778, "epoch": 1629} {"train_loss": -11.911565780639648, "global_step": 273779, "epoch": 1629} {"train_loss": -12.0546875, "global_step": 273780, "epoch": 1629} {"train_loss": -12.409656524658203, "global_step": 273781, "epoch": 1629} {"train_loss": -11.880905151367188, "global_step": 273782, "epoch": 1629} {"train_loss": -11.886981964111328, "global_step": 273783, "epoch": 1629} {"train_loss": -12.281148910522461, "global_step": 273784, "epoch": 1629} {"train_loss": -12.078628540039062, "global_step": 273785, "epoch": 1629} {"train_loss": -11.714659690856934, "global_step": 273786, "epoch": 1629} {"train_loss": -12.060539245605469, "global_step": 273787, "epoch": 1629} {"train_loss": -12.180097579956055, "global_step": 273788, "epoch": 1629} {"train_loss": -12.156288146972656, "global_step": 273789, "epoch": 1629} {"train_loss": -12.231321334838867, "global_step": 273790, "epoch": 1629} {"train_loss": -12.14553451538086, "global_step": 273791, "epoch": 1629} {"train_loss": -12.274065017700195, "global_step": 273792, "epoch": 1629} {"train_loss": -11.989989280700684, "global_step": 273793, "epoch": 1629} {"train_loss": -12.166155815124512, "global_step": 273794, "epoch": 1629} {"train_loss": -11.718399047851562, "global_step": 273795, "epoch": 1629} {"train_loss": -12.136212348937988, "global_step": 273796, "epoch": 1629} {"train_loss": -12.118586540222168, "global_step": 273797, "epoch": 1629} {"train_loss": -11.634688377380371, "global_step": 273798, "epoch": 1629} {"train_loss": -11.483104705810547, "global_step": 273799, "epoch": 1629} {"train_loss": -12.056366920471191, "global_step": 273800, "epoch": 1629} {"train_loss": -12.343730926513672, "global_step": 273801, "epoch": 1629} {"train_loss": -11.647040367126465, "global_step": 273802, "epoch": 1629} {"train_loss": -10.504786491394043, "global_step": 273803, "epoch": 1629} {"train_loss": -11.862360954284668, "global_step": 273804, "epoch": 1629} {"train_loss": -11.980056762695312, "global_step": 273805, "epoch": 1629} {"train_loss": -11.32475757598877, "global_step": 273806, "epoch": 1629} {"train_loss": -11.513446807861328, "global_step": 273807, "epoch": 1629} {"train_loss": -11.722264289855957, "global_step": 273808, "epoch": 1629} {"train_loss": -12.297379493713379, "global_step": 273809, "epoch": 1629} {"train_loss": -11.58851146697998, "global_step": 273810, "epoch": 1629} {"train_loss": -11.3551025390625, "global_step": 273811, "epoch": 1629} {"train_loss": -11.749648094177246, "global_step": 273812, "epoch": 1629} {"train_loss": -11.927125930786133, "global_step": 273813, "epoch": 1629} {"train_loss": -10.920443534851074, "global_step": 273814, "epoch": 1629} {"train_loss": -12.320878028869629, "global_step": 273815, "epoch": 1629} {"train_loss": -11.406266212463379, "global_step": 273816, "epoch": 1629} {"train_loss": -11.728097915649414, "global_step": 273817, "epoch": 1629} {"train_loss": -11.820911407470703, "global_step": 273818, "epoch": 1629} {"train_loss": -11.820446968078613, "global_step": 273819, "epoch": 1629} {"train_loss": -11.978388786315918, "global_step": 273820, "epoch": 1629} {"train_loss": -11.878588676452637, "global_step": 273821, "epoch": 1629} {"train_loss": -12.088756561279297, "global_step": 273822, "epoch": 1629} {"train_loss": -11.844747543334961, "global_step": 273823, "epoch": 1629} {"train_loss": -12.138994216918945, "global_step": 273824, "epoch": 1629} {"train_loss": -11.775331497192383, "global_step": 273825, "epoch": 1629} {"train_loss": -12.052148818969727, "global_step": 273826, "epoch": 1629} {"train_loss": -11.786495208740234, "global_step": 273827, "epoch": 1629} {"train_loss": -12.023025512695312, "global_step": 273828, "epoch": 1629} {"train_loss": -11.694997787475586, "global_step": 273829, "epoch": 1629} {"train_loss": -12.229375839233398, "global_step": 273830, "epoch": 1629} {"train_loss": -11.478889465332031, "global_step": 273831, "epoch": 1629} {"train_loss": -11.935647964477539, "global_step": 273832, "epoch": 1629} {"train_loss": -12.037388801574707, "global_step": 273833, "epoch": 1629} {"train_loss": -11.94687557220459, "global_step": 273834, "epoch": 1629} {"train_loss": -11.153793334960938, "global_step": 273835, "epoch": 1629} {"train_loss": -11.98045539855957, "global_step": 273836, "epoch": 1629} {"train_loss": -12.246445655822754, "global_step": 273837, "epoch": 1629} {"train_loss": -11.594444274902344, "global_step": 273838, "epoch": 1629} {"train_loss": -11.672868694577899, "global_step": 273839, "epoch": 1629, "val_loss": 275340.03125} {"train_loss": -12.056570053100586, "global_step": 273840, "epoch": 1630} {"train_loss": -11.86534309387207, "global_step": 273841, "epoch": 1630} {"train_loss": -11.758369445800781, "global_step": 273842, "epoch": 1630} {"train_loss": -11.645926475524902, "global_step": 273843, "epoch": 1630} {"train_loss": -11.383256912231445, "global_step": 273844, "epoch": 1630} {"train_loss": -11.793647766113281, "global_step": 273845, "epoch": 1630} {"train_loss": -12.24551773071289, "global_step": 273846, "epoch": 1630} {"train_loss": -11.815742492675781, "global_step": 273847, "epoch": 1630} {"train_loss": -12.305397987365723, "global_step": 273848, "epoch": 1630} {"train_loss": -11.58697509765625, "global_step": 273849, "epoch": 1630} {"train_loss": -11.812959671020508, "global_step": 273850, "epoch": 1630} {"train_loss": -11.872846603393555, "global_step": 273851, "epoch": 1630} {"train_loss": -11.746234893798828, "global_step": 273852, "epoch": 1630} {"train_loss": -11.534516334533691, "global_step": 273853, "epoch": 1630} {"train_loss": -11.286901473999023, "global_step": 273854, "epoch": 1630} {"train_loss": -12.265429496765137, "global_step": 273855, "epoch": 1630} {"train_loss": -11.81460952758789, "global_step": 273856, "epoch": 1630} {"train_loss": -11.885540008544922, "global_step": 273857, "epoch": 1630} {"train_loss": -11.986291885375977, "global_step": 273858, "epoch": 1630} {"train_loss": -12.060809135437012, "global_step": 273859, "epoch": 1630} {"train_loss": -11.20642375946045, "global_step": 273860, "epoch": 1630} {"train_loss": -12.307403564453125, "global_step": 273861, "epoch": 1630} {"train_loss": -11.796276092529297, "global_step": 273862, "epoch": 1630} {"train_loss": -12.053630828857422, "global_step": 273863, "epoch": 1630} {"train_loss": -12.110635757446289, "global_step": 273864, "epoch": 1630} {"train_loss": -11.688382148742676, "global_step": 273865, "epoch": 1630} {"train_loss": -11.363809585571289, "global_step": 273866, "epoch": 1630} {"train_loss": -12.17598819732666, "global_step": 273867, "epoch": 1630} {"train_loss": -11.685348510742188, "global_step": 273868, "epoch": 1630} {"train_loss": -11.605249404907227, "global_step": 273869, "epoch": 1630} {"train_loss": -12.043643951416016, "global_step": 273870, "epoch": 1630} {"train_loss": -11.649889945983887, "global_step": 273871, "epoch": 1630} {"train_loss": -11.745361328125, "global_step": 273872, "epoch": 1630} {"train_loss": -12.267077445983887, "global_step": 273873, "epoch": 1630} {"train_loss": -11.242525100708008, "global_step": 273874, "epoch": 1630} {"train_loss": -11.940671920776367, "global_step": 273875, "epoch": 1630} {"train_loss": -11.860967636108398, "global_step": 273876, "epoch": 1630} {"train_loss": -11.256208419799805, "global_step": 273877, "epoch": 1630} {"train_loss": -11.620599746704102, "global_step": 273878, "epoch": 1630} {"train_loss": -11.893457412719727, "global_step": 273879, "epoch": 1630} {"train_loss": -11.209341049194336, "global_step": 273880, "epoch": 1630} {"train_loss": -12.026937484741211, "global_step": 273881, "epoch": 1630} {"train_loss": -11.727039337158203, "global_step": 273882, "epoch": 1630} {"train_loss": -11.708940505981445, "global_step": 273883, "epoch": 1630} {"train_loss": -12.01226806640625, "global_step": 273884, "epoch": 1630} {"train_loss": -11.482678413391113, "global_step": 273885, "epoch": 1630} {"train_loss": -11.450114250183105, "global_step": 273886, "epoch": 1630} {"train_loss": -12.172502517700195, "global_step": 273887, "epoch": 1630} {"train_loss": -11.459704399108887, "global_step": 273888, "epoch": 1630} {"train_loss": -11.797515869140625, "global_step": 273889, "epoch": 1630} {"train_loss": -12.254737854003906, "global_step": 273890, "epoch": 1630} {"train_loss": -11.441472053527832, "global_step": 273891, "epoch": 1630} {"train_loss": -11.817800521850586, "global_step": 273892, "epoch": 1630} {"train_loss": -11.975893020629883, "global_step": 273893, "epoch": 1630} {"train_loss": -11.759668350219727, "global_step": 273894, "epoch": 1630} {"train_loss": -12.18233871459961, "global_step": 273895, "epoch": 1630} {"train_loss": -11.950390815734863, "global_step": 273896, "epoch": 1630} {"train_loss": -11.772527694702148, "global_step": 273897, "epoch": 1630} {"train_loss": -12.31619644165039, "global_step": 273898, "epoch": 1630} {"train_loss": -11.865251541137695, "global_step": 273899, "epoch": 1630} {"train_loss": -11.824432373046875, "global_step": 273900, "epoch": 1630} {"train_loss": -11.988726615905762, "global_step": 273901, "epoch": 1630} {"train_loss": -12.0658540725708, "global_step": 273902, "epoch": 1630} {"train_loss": -12.137086868286133, "global_step": 273903, "epoch": 1630} {"train_loss": -12.016461372375488, "global_step": 273904, "epoch": 1630} {"train_loss": -12.014020919799805, "global_step": 273905, "epoch": 1630} {"train_loss": -11.865070343017578, "global_step": 273906, "epoch": 1630} {"train_loss": -12.115555763244629, "global_step": 273907, "epoch": 1630} {"train_loss": -12.003425598144531, "global_step": 273908, "epoch": 1630} {"train_loss": -11.727485656738281, "global_step": 273909, "epoch": 1630} {"train_loss": -12.033244132995605, "global_step": 273910, "epoch": 1630} {"train_loss": -11.735899925231934, "global_step": 273911, "epoch": 1630} {"train_loss": -11.051620483398438, "global_step": 273912, "epoch": 1630} {"train_loss": -11.970403671264648, "global_step": 273913, "epoch": 1630} {"train_loss": -10.652303695678711, "global_step": 273914, "epoch": 1630} {"train_loss": -10.972586631774902, "global_step": 273915, "epoch": 1630} {"train_loss": -11.189867973327637, "global_step": 273916, "epoch": 1630} {"train_loss": -8.952183723449707, "global_step": 273917, "epoch": 1630} {"train_loss": -9.852130889892578, "global_step": 273918, "epoch": 1630} {"train_loss": -9.513029098510742, "global_step": 273919, "epoch": 1630} {"train_loss": -11.115825653076172, "global_step": 273920, "epoch": 1630} {"train_loss": -9.181619644165039, "global_step": 273921, "epoch": 1630} {"train_loss": -10.308917045593262, "global_step": 273922, "epoch": 1630} {"train_loss": -7.949403762817383, "global_step": 273923, "epoch": 1630} {"train_loss": -10.246705055236816, "global_step": 273924, "epoch": 1630} {"train_loss": -8.7402925491333, "global_step": 273925, "epoch": 1630} {"train_loss": -10.648646354675293, "global_step": 273926, "epoch": 1630} {"train_loss": -9.318718910217285, "global_step": 273927, "epoch": 1630} {"train_loss": -11.338579177856445, "global_step": 273928, "epoch": 1630} {"train_loss": -10.41041088104248, "global_step": 273929, "epoch": 1630} {"train_loss": -11.249015808105469, "global_step": 273930, "epoch": 1630} {"train_loss": -10.783171653747559, "global_step": 273931, "epoch": 1630} {"train_loss": -10.142193794250488, "global_step": 273932, "epoch": 1630} {"train_loss": -11.334739685058594, "global_step": 273933, "epoch": 1630} {"train_loss": -11.24454402923584, "global_step": 273934, "epoch": 1630} {"train_loss": -11.06356143951416, "global_step": 273935, "epoch": 1630} {"train_loss": -11.71997356414795, "global_step": 273936, "epoch": 1630} {"train_loss": -11.414972305297852, "global_step": 273937, "epoch": 1630} {"train_loss": -10.98873519897461, "global_step": 273938, "epoch": 1630} {"train_loss": -11.667835235595703, "global_step": 273939, "epoch": 1630} {"train_loss": -10.884214401245117, "global_step": 273940, "epoch": 1630} {"train_loss": -11.739192962646484, "global_step": 273941, "epoch": 1630} {"train_loss": -11.393172264099121, "global_step": 273942, "epoch": 1630} {"train_loss": -11.672279357910156, "global_step": 273943, "epoch": 1630} {"train_loss": -11.51435375213623, "global_step": 273944, "epoch": 1630} {"train_loss": -11.797872543334961, "global_step": 273945, "epoch": 1630} {"train_loss": -11.804603576660156, "global_step": 273946, "epoch": 1630} {"train_loss": -11.720298767089844, "global_step": 273947, "epoch": 1630} {"train_loss": -11.78262996673584, "global_step": 273948, "epoch": 1630} {"train_loss": -11.828178405761719, "global_step": 273949, "epoch": 1630} {"train_loss": -11.901103973388672, "global_step": 273950, "epoch": 1630} {"train_loss": -11.717039108276367, "global_step": 273951, "epoch": 1630} {"train_loss": -11.782155990600586, "global_step": 273952, "epoch": 1630} {"train_loss": -11.797158241271973, "global_step": 273953, "epoch": 1630} {"train_loss": -11.949771881103516, "global_step": 273954, "epoch": 1630} {"train_loss": -11.8975191116333, "global_step": 273955, "epoch": 1630} {"train_loss": -12.003263473510742, "global_step": 273956, "epoch": 1630} {"train_loss": -12.142380714416504, "global_step": 273957, "epoch": 1630} {"train_loss": -11.918925285339355, "global_step": 273958, "epoch": 1630} {"train_loss": -11.927397727966309, "global_step": 273959, "epoch": 1630} {"train_loss": -12.120407104492188, "global_step": 273960, "epoch": 1630} {"train_loss": -12.121986389160156, "global_step": 273961, "epoch": 1630} {"train_loss": -12.000170707702637, "global_step": 273962, "epoch": 1630} {"train_loss": -11.812156677246094, "global_step": 273963, "epoch": 1630} {"train_loss": -11.859936714172363, "global_step": 273964, "epoch": 1630} {"train_loss": -12.025420188903809, "global_step": 273965, "epoch": 1630} {"train_loss": -12.100038528442383, "global_step": 273966, "epoch": 1630} {"train_loss": -11.846399307250977, "global_step": 273967, "epoch": 1630} {"train_loss": -12.015665054321289, "global_step": 273968, "epoch": 1630} {"train_loss": -11.882392883300781, "global_step": 273969, "epoch": 1630} {"train_loss": -11.85930061340332, "global_step": 273970, "epoch": 1630} {"train_loss": -11.994122505187988, "global_step": 273971, "epoch": 1630} {"train_loss": -11.796628952026367, "global_step": 273972, "epoch": 1630} {"train_loss": -11.976662635803223, "global_step": 273973, "epoch": 1630} {"train_loss": -11.899687767028809, "global_step": 273974, "epoch": 1630} {"train_loss": -11.911925315856934, "global_step": 273975, "epoch": 1630} {"train_loss": -12.094112396240234, "global_step": 273976, "epoch": 1630} {"train_loss": -12.103923797607422, "global_step": 273977, "epoch": 1630} {"train_loss": -12.22988510131836, "global_step": 273978, "epoch": 1630} {"train_loss": -12.132304191589355, "global_step": 273979, "epoch": 1630} {"train_loss": -11.971672058105469, "global_step": 273980, "epoch": 1630} {"train_loss": -12.160392761230469, "global_step": 273981, "epoch": 1630} {"train_loss": -12.073875427246094, "global_step": 273982, "epoch": 1630} {"train_loss": -12.09554672241211, "global_step": 273983, "epoch": 1630} {"train_loss": -12.347661018371582, "global_step": 273984, "epoch": 1630} {"train_loss": -12.139410018920898, "global_step": 273985, "epoch": 1630} {"train_loss": -12.167915344238281, "global_step": 273986, "epoch": 1630} {"train_loss": -11.973458290100098, "global_step": 273987, "epoch": 1630} {"train_loss": -12.195377349853516, "global_step": 273988, "epoch": 1630} {"train_loss": -12.304539680480957, "global_step": 273989, "epoch": 1630} {"train_loss": -12.038010597229004, "global_step": 273990, "epoch": 1630} {"train_loss": -12.268444061279297, "global_step": 273991, "epoch": 1630} {"train_loss": -11.932287216186523, "global_step": 273992, "epoch": 1630} {"train_loss": -12.294681549072266, "global_step": 273993, "epoch": 1630} {"train_loss": -12.018945693969727, "global_step": 273994, "epoch": 1630} {"train_loss": -12.339628219604492, "global_step": 273995, "epoch": 1630} {"train_loss": -12.13235855102539, "global_step": 273996, "epoch": 1630} {"train_loss": -12.167911529541016, "global_step": 273997, "epoch": 1630} {"train_loss": -12.10399055480957, "global_step": 273998, "epoch": 1630} {"train_loss": -12.281965255737305, "global_step": 273999, "epoch": 1630} {"train_loss": -12.1663818359375, "global_step": 274000, "epoch": 1630} {"train_loss": -11.955122947692871, "global_step": 274001, "epoch": 1630} {"train_loss": -11.920963287353516, "global_step": 274002, "epoch": 1630} {"train_loss": -11.746580123901367, "global_step": 274003, "epoch": 1630} {"train_loss": -12.130305290222168, "global_step": 274004, "epoch": 1630} {"train_loss": -11.879392623901367, "global_step": 274005, "epoch": 1630} {"train_loss": -11.412223815917969, "global_step": 274006, "epoch": 1630} {"train_loss": -11.669134066218422, "global_step": 274007, "epoch": 1630, "val_loss": 272902.5625, "train_action_mse_error": 6.360795974731445} {"train_loss": -11.514618873596191, "global_step": 274008, "epoch": 1631} {"train_loss": -12.182162284851074, "global_step": 274009, "epoch": 1631} {"train_loss": -12.096710205078125, "global_step": 274010, "epoch": 1631} {"train_loss": -11.779386520385742, "global_step": 274011, "epoch": 1631} {"train_loss": -11.994035720825195, "global_step": 274012, "epoch": 1631} {"train_loss": -11.08508586883545, "global_step": 274013, "epoch": 1631} {"train_loss": -11.22220230102539, "global_step": 274014, "epoch": 1631} {"train_loss": -12.197154998779297, "global_step": 274015, "epoch": 1631} {"train_loss": -11.117544174194336, "global_step": 274016, "epoch": 1631} {"train_loss": -11.672359466552734, "global_step": 274017, "epoch": 1631} {"train_loss": -11.799839973449707, "global_step": 274018, "epoch": 1631} {"train_loss": -10.588665008544922, "global_step": 274019, "epoch": 1631} {"train_loss": -12.089534759521484, "global_step": 274020, "epoch": 1631} {"train_loss": -10.96670913696289, "global_step": 274021, "epoch": 1631} {"train_loss": -11.178295135498047, "global_step": 274022, "epoch": 1631} {"train_loss": -11.299863815307617, "global_step": 274023, "epoch": 1631} {"train_loss": -11.11671257019043, "global_step": 274024, "epoch": 1631} {"train_loss": -11.27817440032959, "global_step": 274025, "epoch": 1631} {"train_loss": -11.02392578125, "global_step": 274026, "epoch": 1631} {"train_loss": -11.415775299072266, "global_step": 274027, "epoch": 1631} {"train_loss": -11.513544082641602, "global_step": 274028, "epoch": 1631} {"train_loss": -11.53213119506836, "global_step": 274029, "epoch": 1631} {"train_loss": -11.798888206481934, "global_step": 274030, "epoch": 1631} {"train_loss": -11.59975528717041, "global_step": 274031, "epoch": 1631} {"train_loss": -11.871383666992188, "global_step": 274032, "epoch": 1631} {"train_loss": -11.589285850524902, "global_step": 274033, "epoch": 1631} {"train_loss": -11.816356658935547, "global_step": 274034, "epoch": 1631} {"train_loss": -11.721391677856445, "global_step": 274035, "epoch": 1631} {"train_loss": -12.040355682373047, "global_step": 274036, "epoch": 1631} {"train_loss": -12.092994689941406, "global_step": 274037, "epoch": 1631} {"train_loss": -12.131795883178711, "global_step": 274038, "epoch": 1631} {"train_loss": -12.083061218261719, "global_step": 274039, "epoch": 1631} {"train_loss": -11.920007705688477, "global_step": 274040, "epoch": 1631} {"train_loss": -12.063963890075684, "global_step": 274041, "epoch": 1631} {"train_loss": -12.173099517822266, "global_step": 274042, "epoch": 1631} {"train_loss": -12.134871482849121, "global_step": 274043, "epoch": 1631} {"train_loss": -12.056387901306152, "global_step": 274044, "epoch": 1631} {"train_loss": -11.74416732788086, "global_step": 274045, "epoch": 1631} {"train_loss": -12.014033317565918, "global_step": 274046, "epoch": 1631} {"train_loss": -12.255624771118164, "global_step": 274047, "epoch": 1631} {"train_loss": -11.821537017822266, "global_step": 274048, "epoch": 1631} {"train_loss": -12.061372756958008, "global_step": 274049, "epoch": 1631} {"train_loss": -11.866519927978516, "global_step": 274050, "epoch": 1631} {"train_loss": -12.264394760131836, "global_step": 274051, "epoch": 1631} {"train_loss": -12.134563446044922, "global_step": 274052, "epoch": 1631} {"train_loss": -11.941866874694824, "global_step": 274053, "epoch": 1631} {"train_loss": -12.417469024658203, "global_step": 274054, "epoch": 1631} {"train_loss": -11.899456024169922, "global_step": 274055, "epoch": 1631} {"train_loss": -11.953763008117676, "global_step": 274056, "epoch": 1631} {"train_loss": -11.955240249633789, "global_step": 274057, "epoch": 1631} {"train_loss": -12.265594482421875, "global_step": 274058, "epoch": 1631} {"train_loss": -11.754003524780273, "global_step": 274059, "epoch": 1631} {"train_loss": -11.941417694091797, "global_step": 274060, "epoch": 1631} {"train_loss": -11.955864906311035, "global_step": 274061, "epoch": 1631} {"train_loss": -12.031106948852539, "global_step": 274062, "epoch": 1631} {"train_loss": -11.316287994384766, "global_step": 274063, "epoch": 1631} {"train_loss": -12.244521141052246, "global_step": 274064, "epoch": 1631} {"train_loss": -11.929319381713867, "global_step": 274065, "epoch": 1631} {"train_loss": -11.79478645324707, "global_step": 274066, "epoch": 1631} {"train_loss": -12.112524032592773, "global_step": 274067, "epoch": 1631} {"train_loss": -11.874579429626465, "global_step": 274068, "epoch": 1631} {"train_loss": -11.321840286254883, "global_step": 274069, "epoch": 1631} {"train_loss": -11.690256118774414, "global_step": 274070, "epoch": 1631} {"train_loss": -10.963210105895996, "global_step": 274071, "epoch": 1631} {"train_loss": -10.977903366088867, "global_step": 274072, "epoch": 1631} {"train_loss": -11.728458404541016, "global_step": 274073, "epoch": 1631} {"train_loss": -10.991658210754395, "global_step": 274074, "epoch": 1631} {"train_loss": -10.871889114379883, "global_step": 274075, "epoch": 1631} {"train_loss": -12.191023826599121, "global_step": 274076, "epoch": 1631} {"train_loss": -10.804092407226562, "global_step": 274077, "epoch": 1631} {"train_loss": -11.049091339111328, "global_step": 274078, "epoch": 1631} {"train_loss": -10.794243812561035, "global_step": 274079, "epoch": 1631} {"train_loss": -10.45362377166748, "global_step": 274080, "epoch": 1631} {"train_loss": -11.606555938720703, "global_step": 274081, "epoch": 1631} {"train_loss": -10.254806518554688, "global_step": 274082, "epoch": 1631} {"train_loss": -10.995474815368652, "global_step": 274083, "epoch": 1631} {"train_loss": -11.271079063415527, "global_step": 274084, "epoch": 1631} {"train_loss": -9.860034942626953, "global_step": 274085, "epoch": 1631} {"train_loss": -11.69349193572998, "global_step": 274086, "epoch": 1631} {"train_loss": -10.27641487121582, "global_step": 274087, "epoch": 1631} {"train_loss": -11.156134605407715, "global_step": 274088, "epoch": 1631} {"train_loss": -11.07076644897461, "global_step": 274089, "epoch": 1631} {"train_loss": -11.19666576385498, "global_step": 274090, "epoch": 1631} {"train_loss": -11.542313575744629, "global_step": 274091, "epoch": 1631} {"train_loss": -11.06243896484375, "global_step": 274092, "epoch": 1631} {"train_loss": -11.684700012207031, "global_step": 274093, "epoch": 1631} {"train_loss": -11.531148910522461, "global_step": 274094, "epoch": 1631} {"train_loss": -11.731986999511719, "global_step": 274095, "epoch": 1631} {"train_loss": -11.669502258300781, "global_step": 274096, "epoch": 1631} {"train_loss": -11.583017349243164, "global_step": 274097, "epoch": 1631} {"train_loss": -11.736510276794434, "global_step": 274098, "epoch": 1631} {"train_loss": -11.716897010803223, "global_step": 274099, "epoch": 1631} {"train_loss": -11.984387397766113, "global_step": 274100, "epoch": 1631} {"train_loss": -11.803120613098145, "global_step": 274101, "epoch": 1631} {"train_loss": -11.736173629760742, "global_step": 274102, "epoch": 1631} {"train_loss": -11.801373481750488, "global_step": 274103, "epoch": 1631} {"train_loss": -12.037605285644531, "global_step": 274104, "epoch": 1631} {"train_loss": -12.106270790100098, "global_step": 274105, "epoch": 1631} {"train_loss": -11.663130760192871, "global_step": 274106, "epoch": 1631} {"train_loss": -12.057679176330566, "global_step": 274107, "epoch": 1631} {"train_loss": -11.870903015136719, "global_step": 274108, "epoch": 1631} {"train_loss": -12.09721851348877, "global_step": 274109, "epoch": 1631} {"train_loss": -11.959601402282715, "global_step": 274110, "epoch": 1631} {"train_loss": -11.723860740661621, "global_step": 274111, "epoch": 1631} {"train_loss": -12.267159461975098, "global_step": 274112, "epoch": 1631} {"train_loss": -11.727222442626953, "global_step": 274113, "epoch": 1631} {"train_loss": -11.986754417419434, "global_step": 274114, "epoch": 1631} {"train_loss": -11.876701354980469, "global_step": 274115, "epoch": 1631} {"train_loss": -11.951638221740723, "global_step": 274116, "epoch": 1631} {"train_loss": -11.946101188659668, "global_step": 274117, "epoch": 1631} {"train_loss": -11.953256607055664, "global_step": 274118, "epoch": 1631} {"train_loss": -12.005647659301758, "global_step": 274119, "epoch": 1631} {"train_loss": -12.014339447021484, "global_step": 274120, "epoch": 1631} {"train_loss": -11.978141784667969, "global_step": 274121, "epoch": 1631} {"train_loss": -12.098207473754883, "global_step": 274122, "epoch": 1631} {"train_loss": -11.74325180053711, "global_step": 274123, "epoch": 1631} {"train_loss": -12.049652099609375, "global_step": 274124, "epoch": 1631} {"train_loss": -12.221267700195312, "global_step": 274125, "epoch": 1631} {"train_loss": -11.900896072387695, "global_step": 274126, "epoch": 1631} {"train_loss": -12.228226661682129, "global_step": 274127, "epoch": 1631} {"train_loss": -11.862383842468262, "global_step": 274128, "epoch": 1631} {"train_loss": -12.151639938354492, "global_step": 274129, "epoch": 1631} {"train_loss": -12.043752670288086, "global_step": 274130, "epoch": 1631} {"train_loss": -12.001441955566406, "global_step": 274131, "epoch": 1631} {"train_loss": -12.079519271850586, "global_step": 274132, "epoch": 1631} {"train_loss": -12.22938346862793, "global_step": 274133, "epoch": 1631} {"train_loss": -12.177879333496094, "global_step": 274134, "epoch": 1631} {"train_loss": -12.09057331085205, "global_step": 274135, "epoch": 1631} {"train_loss": -12.117594718933105, "global_step": 274136, "epoch": 1631} {"train_loss": -11.986753463745117, "global_step": 274137, "epoch": 1631} {"train_loss": -12.199396133422852, "global_step": 274138, "epoch": 1631} {"train_loss": -12.104884147644043, "global_step": 274139, "epoch": 1631} {"train_loss": -12.02907943725586, "global_step": 274140, "epoch": 1631} {"train_loss": -12.1935453414917, "global_step": 274141, "epoch": 1631} {"train_loss": -11.780169486999512, "global_step": 274142, "epoch": 1631} {"train_loss": -11.961448669433594, "global_step": 274143, "epoch": 1631} {"train_loss": -12.132019996643066, "global_step": 274144, "epoch": 1631} {"train_loss": -11.934990882873535, "global_step": 274145, "epoch": 1631} {"train_loss": -12.056621551513672, "global_step": 274146, "epoch": 1631} {"train_loss": -12.291064262390137, "global_step": 274147, "epoch": 1631} {"train_loss": -11.490105628967285, "global_step": 274148, "epoch": 1631} {"train_loss": -12.025177001953125, "global_step": 274149, "epoch": 1631} {"train_loss": -11.878746032714844, "global_step": 274150, "epoch": 1631} {"train_loss": -11.85856819152832, "global_step": 274151, "epoch": 1631} {"train_loss": -11.80405044555664, "global_step": 274152, "epoch": 1631} {"train_loss": -12.154702186584473, "global_step": 274153, "epoch": 1631} {"train_loss": -11.61367416381836, "global_step": 274154, "epoch": 1631} {"train_loss": -12.204591751098633, "global_step": 274155, "epoch": 1631} {"train_loss": -11.280726432800293, "global_step": 274156, "epoch": 1631} {"train_loss": -11.347614288330078, "global_step": 274157, "epoch": 1631} {"train_loss": -11.85360050201416, "global_step": 274158, "epoch": 1631} {"train_loss": -11.739151954650879, "global_step": 274159, "epoch": 1631} {"train_loss": -11.9433012008667, "global_step": 274160, "epoch": 1631} {"train_loss": -11.824780464172363, "global_step": 274161, "epoch": 1631} {"train_loss": -12.025125503540039, "global_step": 274162, "epoch": 1631} {"train_loss": -12.082038879394531, "global_step": 274163, "epoch": 1631} {"train_loss": -12.057611465454102, "global_step": 274164, "epoch": 1631} {"train_loss": -12.241376876831055, "global_step": 274165, "epoch": 1631} {"train_loss": -12.116134643554688, "global_step": 274166, "epoch": 1631} {"train_loss": -12.160860061645508, "global_step": 274167, "epoch": 1631} {"train_loss": -11.979822158813477, "global_step": 274168, "epoch": 1631} {"train_loss": -12.004627227783203, "global_step": 274169, "epoch": 1631} {"train_loss": -11.673574447631836, "global_step": 274170, "epoch": 1631} {"train_loss": -12.164220809936523, "global_step": 274171, "epoch": 1631} {"train_loss": -11.815210342407227, "global_step": 274172, "epoch": 1631} {"train_loss": -11.880061149597168, "global_step": 274173, "epoch": 1631} {"train_loss": -12.304431915283203, "global_step": 274174, "epoch": 1631} {"train_loss": -11.765337223098392, "global_step": 274175, "epoch": 1631, "val_loss": 276641.28125} {"train_loss": -12.209991455078125, "global_step": 274176, "epoch": 1632} {"train_loss": -12.464126586914062, "global_step": 274177, "epoch": 1632} {"train_loss": -12.157648086547852, "global_step": 274178, "epoch": 1632} {"train_loss": -12.258581161499023, "global_step": 274179, "epoch": 1632} {"train_loss": -12.14420223236084, "global_step": 274180, "epoch": 1632} {"train_loss": -12.058361053466797, "global_step": 274181, "epoch": 1632} {"train_loss": -12.22099494934082, "global_step": 274182, "epoch": 1632} {"train_loss": -12.101213455200195, "global_step": 274183, "epoch": 1632} {"train_loss": -12.096461296081543, "global_step": 274184, "epoch": 1632} {"train_loss": -11.799296379089355, "global_step": 274185, "epoch": 1632} {"train_loss": -11.658661842346191, "global_step": 274186, "epoch": 1632} {"train_loss": -11.804032325744629, "global_step": 274187, "epoch": 1632} {"train_loss": -11.086804389953613, "global_step": 274188, "epoch": 1632} {"train_loss": -11.621892929077148, "global_step": 274189, "epoch": 1632} {"train_loss": -11.685365676879883, "global_step": 274190, "epoch": 1632} {"train_loss": -10.24516487121582, "global_step": 274191, "epoch": 1632} {"train_loss": -11.445116996765137, "global_step": 274192, "epoch": 1632} {"train_loss": -10.552064895629883, "global_step": 274193, "epoch": 1632} {"train_loss": -10.110062599182129, "global_step": 274194, "epoch": 1632} {"train_loss": -11.757253646850586, "global_step": 274195, "epoch": 1632} {"train_loss": -10.807388305664062, "global_step": 274196, "epoch": 1632} {"train_loss": -11.709549903869629, "global_step": 274197, "epoch": 1632} {"train_loss": -11.234710693359375, "global_step": 274198, "epoch": 1632} {"train_loss": -10.565722465515137, "global_step": 274199, "epoch": 1632} {"train_loss": -11.795849800109863, "global_step": 274200, "epoch": 1632} {"train_loss": -11.05770206451416, "global_step": 274201, "epoch": 1632} {"train_loss": -11.725492477416992, "global_step": 274202, "epoch": 1632} {"train_loss": -11.766773223876953, "global_step": 274203, "epoch": 1632} {"train_loss": -11.69626235961914, "global_step": 274204, "epoch": 1632} {"train_loss": -11.778435707092285, "global_step": 274205, "epoch": 1632} {"train_loss": -11.599977493286133, "global_step": 274206, "epoch": 1632} {"train_loss": -11.879932403564453, "global_step": 274207, "epoch": 1632} {"train_loss": -11.348505020141602, "global_step": 274208, "epoch": 1632} {"train_loss": -12.18868637084961, "global_step": 274209, "epoch": 1632} {"train_loss": -11.267446517944336, "global_step": 274210, "epoch": 1632} {"train_loss": -11.316718101501465, "global_step": 274211, "epoch": 1632} {"train_loss": -11.35531997680664, "global_step": 274212, "epoch": 1632} {"train_loss": -12.06049633026123, "global_step": 274213, "epoch": 1632} {"train_loss": -11.466287612915039, "global_step": 274214, "epoch": 1632} {"train_loss": -11.871997833251953, "global_step": 274215, "epoch": 1632} {"train_loss": -11.822956085205078, "global_step": 274216, "epoch": 1632} {"train_loss": -11.694509506225586, "global_step": 274217, "epoch": 1632} {"train_loss": -11.518570899963379, "global_step": 274218, "epoch": 1632} {"train_loss": -11.494271278381348, "global_step": 274219, "epoch": 1632} {"train_loss": -11.404690742492676, "global_step": 274220, "epoch": 1632} {"train_loss": -11.913883209228516, "global_step": 274221, "epoch": 1632} {"train_loss": -11.417659759521484, "global_step": 274222, "epoch": 1632} {"train_loss": -11.792235374450684, "global_step": 274223, "epoch": 1632} {"train_loss": -11.911792755126953, "global_step": 274224, "epoch": 1632} {"train_loss": -11.714190483093262, "global_step": 274225, "epoch": 1632} {"train_loss": -12.123412132263184, "global_step": 274226, "epoch": 1632} {"train_loss": -11.618671417236328, "global_step": 274227, "epoch": 1632} {"train_loss": -11.843201637268066, "global_step": 274228, "epoch": 1632} {"train_loss": -11.91330337524414, "global_step": 274229, "epoch": 1632} {"train_loss": -11.854766845703125, "global_step": 274230, "epoch": 1632} {"train_loss": -12.097064971923828, "global_step": 274231, "epoch": 1632} {"train_loss": -12.00141716003418, "global_step": 274232, "epoch": 1632} {"train_loss": -11.792920112609863, "global_step": 274233, "epoch": 1632} {"train_loss": -11.939960479736328, "global_step": 274234, "epoch": 1632} {"train_loss": -11.78123664855957, "global_step": 274235, "epoch": 1632} {"train_loss": -11.836254119873047, "global_step": 274236, "epoch": 1632} {"train_loss": -11.744771957397461, "global_step": 274237, "epoch": 1632} {"train_loss": -11.755776405334473, "global_step": 274238, "epoch": 1632} {"train_loss": -11.782833099365234, "global_step": 274239, "epoch": 1632} {"train_loss": -11.943465232849121, "global_step": 274240, "epoch": 1632} {"train_loss": -11.599441528320312, "global_step": 274241, "epoch": 1632} {"train_loss": -11.889837265014648, "global_step": 274242, "epoch": 1632} {"train_loss": -12.00937271118164, "global_step": 274243, "epoch": 1632} {"train_loss": -11.80546760559082, "global_step": 274244, "epoch": 1632} {"train_loss": -11.816814422607422, "global_step": 274245, "epoch": 1632} {"train_loss": -12.248062133789062, "global_step": 274246, "epoch": 1632} {"train_loss": -12.003412246704102, "global_step": 274247, "epoch": 1632} {"train_loss": -11.860734939575195, "global_step": 274248, "epoch": 1632} {"train_loss": -12.230541229248047, "global_step": 274249, "epoch": 1632} {"train_loss": -12.182666778564453, "global_step": 274250, "epoch": 1632} {"train_loss": -12.200252532958984, "global_step": 274251, "epoch": 1632} {"train_loss": -12.041531562805176, "global_step": 274252, "epoch": 1632} {"train_loss": -12.170694351196289, "global_step": 274253, "epoch": 1632} {"train_loss": -11.975522994995117, "global_step": 274254, "epoch": 1632} {"train_loss": -11.437481880187988, "global_step": 274255, "epoch": 1632} {"train_loss": -11.830613136291504, "global_step": 274256, "epoch": 1632} {"train_loss": -11.886542320251465, "global_step": 274257, "epoch": 1632} {"train_loss": -12.363088607788086, "global_step": 274258, "epoch": 1632} {"train_loss": -11.768349647521973, "global_step": 274259, "epoch": 1632} {"train_loss": -12.12661361694336, "global_step": 274260, "epoch": 1632} {"train_loss": -11.922040939331055, "global_step": 274261, "epoch": 1632} {"train_loss": -12.019842147827148, "global_step": 274262, "epoch": 1632} {"train_loss": -12.109528541564941, "global_step": 274263, "epoch": 1632} {"train_loss": -11.499238967895508, "global_step": 274264, "epoch": 1632} {"train_loss": -11.818459510803223, "global_step": 274265, "epoch": 1632} {"train_loss": -11.918095588684082, "global_step": 274266, "epoch": 1632} {"train_loss": -11.849733352661133, "global_step": 274267, "epoch": 1632} {"train_loss": -11.741037368774414, "global_step": 274268, "epoch": 1632} {"train_loss": -11.833988189697266, "global_step": 274269, "epoch": 1632} {"train_loss": -11.73404598236084, "global_step": 274270, "epoch": 1632} {"train_loss": -10.797388076782227, "global_step": 274271, "epoch": 1632} {"train_loss": -11.799783706665039, "global_step": 274272, "epoch": 1632} {"train_loss": -11.866941452026367, "global_step": 274273, "epoch": 1632} {"train_loss": -10.960065841674805, "global_step": 274274, "epoch": 1632} {"train_loss": -11.429417610168457, "global_step": 274275, "epoch": 1632} {"train_loss": -12.110333442687988, "global_step": 274276, "epoch": 1632} {"train_loss": -10.722760200500488, "global_step": 274277, "epoch": 1632} {"train_loss": -11.153181076049805, "global_step": 274278, "epoch": 1632} {"train_loss": -11.734561920166016, "global_step": 274279, "epoch": 1632} {"train_loss": -11.983049392700195, "global_step": 274280, "epoch": 1632} {"train_loss": -11.262052536010742, "global_step": 274281, "epoch": 1632} {"train_loss": -12.084267616271973, "global_step": 274282, "epoch": 1632} {"train_loss": -11.591619491577148, "global_step": 274283, "epoch": 1632} {"train_loss": -11.813968658447266, "global_step": 274284, "epoch": 1632} {"train_loss": -12.02489185333252, "global_step": 274285, "epoch": 1632} {"train_loss": -11.33130931854248, "global_step": 274286, "epoch": 1632} {"train_loss": -11.701138496398926, "global_step": 274287, "epoch": 1632} {"train_loss": -11.890934944152832, "global_step": 274288, "epoch": 1632} {"train_loss": -11.620818138122559, "global_step": 274289, "epoch": 1632} {"train_loss": -11.958576202392578, "global_step": 274290, "epoch": 1632} {"train_loss": -11.61450481414795, "global_step": 274291, "epoch": 1632} {"train_loss": -11.014992713928223, "global_step": 274292, "epoch": 1632} {"train_loss": -11.942691802978516, "global_step": 274293, "epoch": 1632} {"train_loss": -11.25214958190918, "global_step": 274294, "epoch": 1632} {"train_loss": -12.025777816772461, "global_step": 274295, "epoch": 1632} {"train_loss": -11.722848892211914, "global_step": 274296, "epoch": 1632} {"train_loss": -11.781967163085938, "global_step": 274297, "epoch": 1632} {"train_loss": -11.540239334106445, "global_step": 274298, "epoch": 1632} {"train_loss": -11.271799087524414, "global_step": 274299, "epoch": 1632} {"train_loss": -12.024544715881348, "global_step": 274300, "epoch": 1632} {"train_loss": -11.524345397949219, "global_step": 274301, "epoch": 1632} {"train_loss": -12.111703872680664, "global_step": 274302, "epoch": 1632} {"train_loss": -11.602226257324219, "global_step": 274303, "epoch": 1632} {"train_loss": -11.69720458984375, "global_step": 274304, "epoch": 1632} {"train_loss": -11.933635711669922, "global_step": 274305, "epoch": 1632} {"train_loss": -11.82513427734375, "global_step": 274306, "epoch": 1632} {"train_loss": -11.759092330932617, "global_step": 274307, "epoch": 1632} {"train_loss": -11.783039093017578, "global_step": 274308, "epoch": 1632} {"train_loss": -11.100564956665039, "global_step": 274309, "epoch": 1632} {"train_loss": -11.703836441040039, "global_step": 274310, "epoch": 1632} {"train_loss": -11.528472900390625, "global_step": 274311, "epoch": 1632} {"train_loss": -10.98300552368164, "global_step": 274312, "epoch": 1632} {"train_loss": -11.708057403564453, "global_step": 274313, "epoch": 1632} {"train_loss": -10.28175163269043, "global_step": 274314, "epoch": 1632} {"train_loss": -11.920909881591797, "global_step": 274315, "epoch": 1632} {"train_loss": -11.47264289855957, "global_step": 274316, "epoch": 1632} {"train_loss": -11.526640892028809, "global_step": 274317, "epoch": 1632} {"train_loss": -11.859601020812988, "global_step": 274318, "epoch": 1632} {"train_loss": -11.618342399597168, "global_step": 274319, "epoch": 1632} {"train_loss": -12.137874603271484, "global_step": 274320, "epoch": 1632} {"train_loss": -11.761148452758789, "global_step": 274321, "epoch": 1632} {"train_loss": -12.113959312438965, "global_step": 274322, "epoch": 1632} {"train_loss": -11.2583646774292, "global_step": 274323, "epoch": 1632} {"train_loss": -12.297399520874023, "global_step": 274324, "epoch": 1632} {"train_loss": -11.578689575195312, "global_step": 274325, "epoch": 1632} {"train_loss": -11.936182975769043, "global_step": 274326, "epoch": 1632} {"train_loss": -12.035636901855469, "global_step": 274327, "epoch": 1632} {"train_loss": -12.114713668823242, "global_step": 274328, "epoch": 1632} {"train_loss": -11.818754196166992, "global_step": 274329, "epoch": 1632} {"train_loss": -11.781025886535645, "global_step": 274330, "epoch": 1632} {"train_loss": -12.065756797790527, "global_step": 274331, "epoch": 1632} {"train_loss": -11.988563537597656, "global_step": 274332, "epoch": 1632} {"train_loss": -12.0091552734375, "global_step": 274333, "epoch": 1632} {"train_loss": -12.065346717834473, "global_step": 274334, "epoch": 1632} {"train_loss": -12.282539367675781, "global_step": 274335, "epoch": 1632} {"train_loss": -12.198108673095703, "global_step": 274336, "epoch": 1632} {"train_loss": -12.240196228027344, "global_step": 274337, "epoch": 1632} {"train_loss": -12.094813346862793, "global_step": 274338, "epoch": 1632} {"train_loss": -12.08316421508789, "global_step": 274339, "epoch": 1632} {"train_loss": -12.052047729492188, "global_step": 274340, "epoch": 1632} {"train_loss": -12.15200424194336, "global_step": 274341, "epoch": 1632} {"train_loss": -12.173188209533691, "global_step": 274342, "epoch": 1632} {"train_loss": -11.743469363167172, "global_step": 274343, "epoch": 1632, "val_loss": 277591.96875} {"train_loss": -11.752466201782227, "global_step": 274344, "epoch": 1633} {"train_loss": -12.045597076416016, "global_step": 274345, "epoch": 1633} {"train_loss": -11.982561111450195, "global_step": 274346, "epoch": 1633} {"train_loss": -12.115682601928711, "global_step": 274347, "epoch": 1633} {"train_loss": -11.986263275146484, "global_step": 274348, "epoch": 1633} {"train_loss": -12.140037536621094, "global_step": 274349, "epoch": 1633} {"train_loss": -12.105035781860352, "global_step": 274350, "epoch": 1633} {"train_loss": -12.201454162597656, "global_step": 274351, "epoch": 1633} {"train_loss": -12.136874198913574, "global_step": 274352, "epoch": 1633} {"train_loss": -12.168756484985352, "global_step": 274353, "epoch": 1633} {"train_loss": -11.983022689819336, "global_step": 274354, "epoch": 1633} {"train_loss": -12.267511367797852, "global_step": 274355, "epoch": 1633} {"train_loss": -12.132792472839355, "global_step": 274356, "epoch": 1633} {"train_loss": -11.90497875213623, "global_step": 274357, "epoch": 1633} {"train_loss": -12.212517738342285, "global_step": 274358, "epoch": 1633} {"train_loss": -12.161968231201172, "global_step": 274359, "epoch": 1633} {"train_loss": -12.070844650268555, "global_step": 274360, "epoch": 1633} {"train_loss": -12.132044792175293, "global_step": 274361, "epoch": 1633} {"train_loss": -12.152414321899414, "global_step": 274362, "epoch": 1633} {"train_loss": -12.356069564819336, "global_step": 274363, "epoch": 1633} {"train_loss": -12.287150382995605, "global_step": 274364, "epoch": 1633} {"train_loss": -12.295171737670898, "global_step": 274365, "epoch": 1633} {"train_loss": -12.230683326721191, "global_step": 274366, "epoch": 1633} {"train_loss": -12.197165489196777, "global_step": 274367, "epoch": 1633} {"train_loss": -12.182792663574219, "global_step": 274368, "epoch": 1633} {"train_loss": -11.734811782836914, "global_step": 274369, "epoch": 1633} {"train_loss": -11.672046661376953, "global_step": 274370, "epoch": 1633} {"train_loss": -11.845856666564941, "global_step": 274371, "epoch": 1633} {"train_loss": -12.291942596435547, "global_step": 274372, "epoch": 1633} {"train_loss": -12.13918399810791, "global_step": 274373, "epoch": 1633} {"train_loss": -12.043783187866211, "global_step": 274374, "epoch": 1633} {"train_loss": -11.350971221923828, "global_step": 274375, "epoch": 1633} {"train_loss": -12.151225090026855, "global_step": 274376, "epoch": 1633} {"train_loss": -10.308696746826172, "global_step": 274377, "epoch": 1633} {"train_loss": -11.923879623413086, "global_step": 274378, "epoch": 1633} {"train_loss": -11.917078018188477, "global_step": 274379, "epoch": 1633} {"train_loss": -10.922090530395508, "global_step": 274380, "epoch": 1633} {"train_loss": -11.520517349243164, "global_step": 274381, "epoch": 1633} {"train_loss": -12.121650695800781, "global_step": 274382, "epoch": 1633} {"train_loss": -10.95280647277832, "global_step": 274383, "epoch": 1633} {"train_loss": -11.787873268127441, "global_step": 274384, "epoch": 1633} {"train_loss": -11.350560188293457, "global_step": 274385, "epoch": 1633} {"train_loss": -9.449068069458008, "global_step": 274386, "epoch": 1633} {"train_loss": -9.37562370300293, "global_step": 274387, "epoch": 1633} {"train_loss": -9.133871078491211, "global_step": 274388, "epoch": 1633} {"train_loss": -11.187919616699219, "global_step": 274389, "epoch": 1633} {"train_loss": -8.245161056518555, "global_step": 274390, "epoch": 1633} {"train_loss": -9.68463134765625, "global_step": 274391, "epoch": 1633} {"train_loss": -8.761762619018555, "global_step": 274392, "epoch": 1633} {"train_loss": -9.965601921081543, "global_step": 274393, "epoch": 1633} {"train_loss": -10.156379699707031, "global_step": 274394, "epoch": 1633} {"train_loss": -10.291072845458984, "global_step": 274395, "epoch": 1633} {"train_loss": -10.741259574890137, "global_step": 274396, "epoch": 1633} {"train_loss": -11.249296188354492, "global_step": 274397, "epoch": 1633} {"train_loss": -10.433526039123535, "global_step": 274398, "epoch": 1633} {"train_loss": -10.986190795898438, "global_step": 274399, "epoch": 1633} {"train_loss": -11.108434677124023, "global_step": 274400, "epoch": 1633} {"train_loss": -11.009635925292969, "global_step": 274401, "epoch": 1633} {"train_loss": -11.125310897827148, "global_step": 274402, "epoch": 1633} {"train_loss": -10.84226131439209, "global_step": 274403, "epoch": 1633} {"train_loss": -10.756148338317871, "global_step": 274404, "epoch": 1633} {"train_loss": -11.228974342346191, "global_step": 274405, "epoch": 1633} {"train_loss": -11.072864532470703, "global_step": 274406, "epoch": 1633} {"train_loss": -11.126506805419922, "global_step": 274407, "epoch": 1633} {"train_loss": -11.593416213989258, "global_step": 274408, "epoch": 1633} {"train_loss": -10.644481658935547, "global_step": 274409, "epoch": 1633} {"train_loss": -11.745658874511719, "global_step": 274410, "epoch": 1633} {"train_loss": -11.224479675292969, "global_step": 274411, "epoch": 1633} {"train_loss": -11.228242874145508, "global_step": 274412, "epoch": 1633} {"train_loss": -11.823709487915039, "global_step": 274413, "epoch": 1633} {"train_loss": -10.943205833435059, "global_step": 274414, "epoch": 1633} {"train_loss": -11.738740921020508, "global_step": 274415, "epoch": 1633} {"train_loss": -11.356663703918457, "global_step": 274416, "epoch": 1633} {"train_loss": -10.949270248413086, "global_step": 274417, "epoch": 1633} {"train_loss": -11.608115196228027, "global_step": 274418, "epoch": 1633} {"train_loss": -11.208871841430664, "global_step": 274419, "epoch": 1633} {"train_loss": -11.250619888305664, "global_step": 274420, "epoch": 1633} {"train_loss": -11.830961227416992, "global_step": 274421, "epoch": 1633} {"train_loss": -11.299396514892578, "global_step": 274422, "epoch": 1633} {"train_loss": -11.862884521484375, "global_step": 274423, "epoch": 1633} {"train_loss": -11.404695510864258, "global_step": 274424, "epoch": 1633} {"train_loss": -11.60399341583252, "global_step": 274425, "epoch": 1633} {"train_loss": -12.002397537231445, "global_step": 274426, "epoch": 1633} {"train_loss": -11.761992454528809, "global_step": 274427, "epoch": 1633} {"train_loss": -11.840156555175781, "global_step": 274428, "epoch": 1633} {"train_loss": -11.768527030944824, "global_step": 274429, "epoch": 1633} {"train_loss": -11.877751350402832, "global_step": 274430, "epoch": 1633} {"train_loss": -11.939043998718262, "global_step": 274431, "epoch": 1633} {"train_loss": -11.836233139038086, "global_step": 274432, "epoch": 1633} {"train_loss": -11.64520263671875, "global_step": 274433, "epoch": 1633} {"train_loss": -12.095613479614258, "global_step": 274434, "epoch": 1633} {"train_loss": -11.75490951538086, "global_step": 274435, "epoch": 1633} {"train_loss": -11.820858001708984, "global_step": 274436, "epoch": 1633} {"train_loss": -11.832907676696777, "global_step": 274437, "epoch": 1633} {"train_loss": -12.028106689453125, "global_step": 274438, "epoch": 1633} {"train_loss": -11.767780303955078, "global_step": 274439, "epoch": 1633} {"train_loss": -12.091712951660156, "global_step": 274440, "epoch": 1633} {"train_loss": -11.99241828918457, "global_step": 274441, "epoch": 1633} {"train_loss": -11.85434341430664, "global_step": 274442, "epoch": 1633} {"train_loss": -11.939523696899414, "global_step": 274443, "epoch": 1633} {"train_loss": -11.885066986083984, "global_step": 274444, "epoch": 1633} {"train_loss": -12.144201278686523, "global_step": 274445, "epoch": 1633} {"train_loss": -12.04190731048584, "global_step": 274446, "epoch": 1633} {"train_loss": -11.797906875610352, "global_step": 274447, "epoch": 1633} {"train_loss": -12.16408920288086, "global_step": 274448, "epoch": 1633} {"train_loss": -12.040215492248535, "global_step": 274449, "epoch": 1633} {"train_loss": -11.98940658569336, "global_step": 274450, "epoch": 1633} {"train_loss": -12.10936164855957, "global_step": 274451, "epoch": 1633} {"train_loss": -12.11113166809082, "global_step": 274452, "epoch": 1633} {"train_loss": -12.196710586547852, "global_step": 274453, "epoch": 1633} {"train_loss": -12.061077117919922, "global_step": 274454, "epoch": 1633} {"train_loss": -11.932376861572266, "global_step": 274455, "epoch": 1633} {"train_loss": -12.192842483520508, "global_step": 274456, "epoch": 1633} {"train_loss": -12.07005500793457, "global_step": 274457, "epoch": 1633} {"train_loss": -12.111705780029297, "global_step": 274458, "epoch": 1633} {"train_loss": -11.943002700805664, "global_step": 274459, "epoch": 1633} {"train_loss": -11.995574951171875, "global_step": 274460, "epoch": 1633} {"train_loss": -12.011419296264648, "global_step": 274461, "epoch": 1633} {"train_loss": -11.896976470947266, "global_step": 274462, "epoch": 1633} {"train_loss": -12.328091621398926, "global_step": 274463, "epoch": 1633} {"train_loss": -11.872514724731445, "global_step": 274464, "epoch": 1633} {"train_loss": -12.137150764465332, "global_step": 274465, "epoch": 1633} {"train_loss": -11.99978256225586, "global_step": 274466, "epoch": 1633} {"train_loss": -12.02402114868164, "global_step": 274467, "epoch": 1633} {"train_loss": -12.17003059387207, "global_step": 274468, "epoch": 1633} {"train_loss": -12.232053756713867, "global_step": 274469, "epoch": 1633} {"train_loss": -11.933728218078613, "global_step": 274470, "epoch": 1633} {"train_loss": -11.823660850524902, "global_step": 274471, "epoch": 1633} {"train_loss": -12.164440155029297, "global_step": 274472, "epoch": 1633} {"train_loss": -12.109762191772461, "global_step": 274473, "epoch": 1633} {"train_loss": -12.15972900390625, "global_step": 274474, "epoch": 1633} {"train_loss": -12.127998352050781, "global_step": 274475, "epoch": 1633} {"train_loss": -12.28813648223877, "global_step": 274476, "epoch": 1633} {"train_loss": -11.886829376220703, "global_step": 274477, "epoch": 1633} {"train_loss": -12.177999496459961, "global_step": 274478, "epoch": 1633} {"train_loss": -12.366416931152344, "global_step": 274479, "epoch": 1633} {"train_loss": -12.188030242919922, "global_step": 274480, "epoch": 1633} {"train_loss": -12.358861923217773, "global_step": 274481, "epoch": 1633} {"train_loss": -12.295709609985352, "global_step": 274482, "epoch": 1633} {"train_loss": -12.054510116577148, "global_step": 274483, "epoch": 1633} {"train_loss": -12.060285568237305, "global_step": 274484, "epoch": 1633} {"train_loss": -12.281413078308105, "global_step": 274485, "epoch": 1633} {"train_loss": -12.307966232299805, "global_step": 274486, "epoch": 1633} {"train_loss": -11.43810749053955, "global_step": 274487, "epoch": 1633} {"train_loss": -11.192209243774414, "global_step": 274488, "epoch": 1633} {"train_loss": -11.681737899780273, "global_step": 274489, "epoch": 1633} {"train_loss": -12.260669708251953, "global_step": 274490, "epoch": 1633} {"train_loss": -12.298690795898438, "global_step": 274491, "epoch": 1633} {"train_loss": -12.268871307373047, "global_step": 274492, "epoch": 1633} {"train_loss": -11.689661026000977, "global_step": 274493, "epoch": 1633} {"train_loss": -11.852508544921875, "global_step": 274494, "epoch": 1633} {"train_loss": -11.991458892822266, "global_step": 274495, "epoch": 1633} {"train_loss": -12.318684577941895, "global_step": 274496, "epoch": 1633} {"train_loss": -12.113887786865234, "global_step": 274497, "epoch": 1633} {"train_loss": -11.958813667297363, "global_step": 274498, "epoch": 1633} {"train_loss": -12.204278945922852, "global_step": 274499, "epoch": 1633} {"train_loss": -12.081979751586914, "global_step": 274500, "epoch": 1633} {"train_loss": -12.080717086791992, "global_step": 274501, "epoch": 1633} {"train_loss": -12.343842506408691, "global_step": 274502, "epoch": 1633} {"train_loss": -12.356161117553711, "global_step": 274503, "epoch": 1633} {"train_loss": -12.125510215759277, "global_step": 274504, "epoch": 1633} {"train_loss": -11.870637893676758, "global_step": 274505, "epoch": 1633} {"train_loss": -12.04077434539795, "global_step": 274506, "epoch": 1633} {"train_loss": -12.414629936218262, "global_step": 274507, "epoch": 1633} {"train_loss": -12.022278785705566, "global_step": 274508, "epoch": 1633} {"train_loss": -12.260387420654297, "global_step": 274509, "epoch": 1633} {"train_loss": -12.062721252441406, "global_step": 274510, "epoch": 1633} {"train_loss": -11.71983704112825, "global_step": 274511, "epoch": 1633, "val_loss": 266350.59375} {"train_loss": -11.37697982788086, "global_step": 274512, "epoch": 1634} {"train_loss": -11.984376907348633, "global_step": 274513, "epoch": 1634} {"train_loss": -11.66964340209961, "global_step": 274514, "epoch": 1634} {"train_loss": -11.537598609924316, "global_step": 274515, "epoch": 1634} {"train_loss": -11.76245403289795, "global_step": 274516, "epoch": 1634} {"train_loss": -11.00558853149414, "global_step": 274517, "epoch": 1634} {"train_loss": -11.996175765991211, "global_step": 274518, "epoch": 1634} {"train_loss": -11.527456283569336, "global_step": 274519, "epoch": 1634} {"train_loss": -11.004343032836914, "global_step": 274520, "epoch": 1634} {"train_loss": -12.004920959472656, "global_step": 274521, "epoch": 1634} {"train_loss": -11.186172485351562, "global_step": 274522, "epoch": 1634} {"train_loss": -11.626102447509766, "global_step": 274523, "epoch": 1634} {"train_loss": -11.973794937133789, "global_step": 274524, "epoch": 1634} {"train_loss": -11.852815628051758, "global_step": 274525, "epoch": 1634} {"train_loss": -11.93812370300293, "global_step": 274526, "epoch": 1634} {"train_loss": -12.20805835723877, "global_step": 274527, "epoch": 1634} {"train_loss": -11.918251037597656, "global_step": 274528, "epoch": 1634} {"train_loss": -12.055938720703125, "global_step": 274529, "epoch": 1634} {"train_loss": -12.17575454711914, "global_step": 274530, "epoch": 1634} {"train_loss": -11.923245429992676, "global_step": 274531, "epoch": 1634} {"train_loss": -11.67516803741455, "global_step": 274532, "epoch": 1634} {"train_loss": -11.790032386779785, "global_step": 274533, "epoch": 1634} {"train_loss": -11.478818893432617, "global_step": 274534, "epoch": 1634} {"train_loss": -10.857634544372559, "global_step": 274535, "epoch": 1634} {"train_loss": -11.295855522155762, "global_step": 274536, "epoch": 1634} {"train_loss": -11.898984909057617, "global_step": 274537, "epoch": 1634} {"train_loss": -11.704998016357422, "global_step": 274538, "epoch": 1634} {"train_loss": -11.576480865478516, "global_step": 274539, "epoch": 1634} {"train_loss": -11.643220901489258, "global_step": 274540, "epoch": 1634} {"train_loss": -11.438077926635742, "global_step": 274541, "epoch": 1634} {"train_loss": -11.675153732299805, "global_step": 274542, "epoch": 1634} {"train_loss": -11.240304946899414, "global_step": 274543, "epoch": 1634} {"train_loss": -11.170635223388672, "global_step": 274544, "epoch": 1634} {"train_loss": -12.199884414672852, "global_step": 274545, "epoch": 1634} {"train_loss": -10.816543579101562, "global_step": 274546, "epoch": 1634} {"train_loss": -11.777424812316895, "global_step": 274547, "epoch": 1634} {"train_loss": -11.361385345458984, "global_step": 274548, "epoch": 1634} {"train_loss": -10.985821723937988, "global_step": 274549, "epoch": 1634} {"train_loss": -11.261932373046875, "global_step": 274550, "epoch": 1634} {"train_loss": -11.561487197875977, "global_step": 274551, "epoch": 1634} {"train_loss": -10.8563871383667, "global_step": 274552, "epoch": 1634} {"train_loss": -11.340700149536133, "global_step": 274553, "epoch": 1634} {"train_loss": -11.423681259155273, "global_step": 274554, "epoch": 1634} {"train_loss": -11.286319732666016, "global_step": 274555, "epoch": 1634} {"train_loss": -10.065889358520508, "global_step": 274556, "epoch": 1634} {"train_loss": -11.629999160766602, "global_step": 274557, "epoch": 1634} {"train_loss": -10.474035263061523, "global_step": 274558, "epoch": 1634} {"train_loss": -10.619657516479492, "global_step": 274559, "epoch": 1634} {"train_loss": -10.458776473999023, "global_step": 274560, "epoch": 1634} {"train_loss": -10.673417091369629, "global_step": 274561, "epoch": 1634} {"train_loss": -10.257375717163086, "global_step": 274562, "epoch": 1634} {"train_loss": -11.287749290466309, "global_step": 274563, "epoch": 1634} {"train_loss": -10.36465835571289, "global_step": 274564, "epoch": 1634} {"train_loss": -11.022592544555664, "global_step": 274565, "epoch": 1634} {"train_loss": -11.083677291870117, "global_step": 274566, "epoch": 1634} {"train_loss": -11.024297714233398, "global_step": 274567, "epoch": 1634} {"train_loss": -11.289449691772461, "global_step": 274568, "epoch": 1634} {"train_loss": -10.519824981689453, "global_step": 274569, "epoch": 1634} {"train_loss": -11.47142219543457, "global_step": 274570, "epoch": 1634} {"train_loss": -11.011823654174805, "global_step": 274571, "epoch": 1634} {"train_loss": -11.567177772521973, "global_step": 274572, "epoch": 1634} {"train_loss": -11.254825592041016, "global_step": 274573, "epoch": 1634} {"train_loss": -11.702788352966309, "global_step": 274574, "epoch": 1634} {"train_loss": -11.470523834228516, "global_step": 274575, "epoch": 1634} {"train_loss": -11.681482315063477, "global_step": 274576, "epoch": 1634} {"train_loss": -11.534490585327148, "global_step": 274577, "epoch": 1634} {"train_loss": -11.80129623413086, "global_step": 274578, "epoch": 1634} {"train_loss": -11.585609436035156, "global_step": 274579, "epoch": 1634} {"train_loss": -11.94382095336914, "global_step": 274580, "epoch": 1634} {"train_loss": -11.789236068725586, "global_step": 274581, "epoch": 1634} {"train_loss": -11.507397651672363, "global_step": 274582, "epoch": 1634} {"train_loss": -11.733747482299805, "global_step": 274583, "epoch": 1634} {"train_loss": -11.824421882629395, "global_step": 274584, "epoch": 1634} {"train_loss": -11.748046875, "global_step": 274585, "epoch": 1634} {"train_loss": -11.740501403808594, "global_step": 274586, "epoch": 1634} {"train_loss": -11.36159896850586, "global_step": 274587, "epoch": 1634} {"train_loss": -11.509791374206543, "global_step": 274588, "epoch": 1634} {"train_loss": -11.91218090057373, "global_step": 274589, "epoch": 1634} {"train_loss": -11.861133575439453, "global_step": 274590, "epoch": 1634} {"train_loss": -11.652074813842773, "global_step": 274591, "epoch": 1634} {"train_loss": -11.744470596313477, "global_step": 274592, "epoch": 1634} {"train_loss": -11.743827819824219, "global_step": 274593, "epoch": 1634} {"train_loss": -11.332733154296875, "global_step": 274594, "epoch": 1634} {"train_loss": -11.709024429321289, "global_step": 274595, "epoch": 1634} {"train_loss": -11.930252075195312, "global_step": 274596, "epoch": 1634} {"train_loss": -11.643280029296875, "global_step": 274597, "epoch": 1634} {"train_loss": -11.964988708496094, "global_step": 274598, "epoch": 1634} {"train_loss": -11.511277198791504, "global_step": 274599, "epoch": 1634} {"train_loss": -11.81102180480957, "global_step": 274600, "epoch": 1634} {"train_loss": -11.470460891723633, "global_step": 274601, "epoch": 1634} {"train_loss": -11.776727676391602, "global_step": 274602, "epoch": 1634} {"train_loss": -11.678888320922852, "global_step": 274603, "epoch": 1634} {"train_loss": -11.52127456665039, "global_step": 274604, "epoch": 1634} {"train_loss": -12.097002983093262, "global_step": 274605, "epoch": 1634} {"train_loss": -11.604920387268066, "global_step": 274606, "epoch": 1634} {"train_loss": -12.239737510681152, "global_step": 274607, "epoch": 1634} {"train_loss": -11.511299133300781, "global_step": 274608, "epoch": 1634} {"train_loss": -11.969282150268555, "global_step": 274609, "epoch": 1634} {"train_loss": -11.859325408935547, "global_step": 274610, "epoch": 1634} {"train_loss": -11.720425605773926, "global_step": 274611, "epoch": 1634} {"train_loss": -11.972585678100586, "global_step": 274612, "epoch": 1634} {"train_loss": -11.906869888305664, "global_step": 274613, "epoch": 1634} {"train_loss": -12.329828262329102, "global_step": 274614, "epoch": 1634} {"train_loss": -11.85843276977539, "global_step": 274615, "epoch": 1634} {"train_loss": -11.92608642578125, "global_step": 274616, "epoch": 1634} {"train_loss": -11.836203575134277, "global_step": 274617, "epoch": 1634} {"train_loss": -12.077630996704102, "global_step": 274618, "epoch": 1634} {"train_loss": -12.176790237426758, "global_step": 274619, "epoch": 1634} {"train_loss": -12.213152885437012, "global_step": 274620, "epoch": 1634} {"train_loss": -12.283132553100586, "global_step": 274621, "epoch": 1634} {"train_loss": -12.133575439453125, "global_step": 274622, "epoch": 1634} {"train_loss": -11.923945426940918, "global_step": 274623, "epoch": 1634} {"train_loss": -12.068488121032715, "global_step": 274624, "epoch": 1634} {"train_loss": -12.221220016479492, "global_step": 274625, "epoch": 1634} {"train_loss": -12.090167045593262, "global_step": 274626, "epoch": 1634} {"train_loss": -12.259580612182617, "global_step": 274627, "epoch": 1634} {"train_loss": -12.347684860229492, "global_step": 274628, "epoch": 1634} {"train_loss": -12.252996444702148, "global_step": 274629, "epoch": 1634} {"train_loss": -12.01336669921875, "global_step": 274630, "epoch": 1634} {"train_loss": -12.16796875, "global_step": 274631, "epoch": 1634} {"train_loss": -12.207071304321289, "global_step": 274632, "epoch": 1634} {"train_loss": -12.374334335327148, "global_step": 274633, "epoch": 1634} {"train_loss": -12.339831352233887, "global_step": 274634, "epoch": 1634} {"train_loss": -12.436775207519531, "global_step": 274635, "epoch": 1634} {"train_loss": -12.176767349243164, "global_step": 274636, "epoch": 1634} {"train_loss": -12.416837692260742, "global_step": 274637, "epoch": 1634} {"train_loss": -12.108283996582031, "global_step": 274638, "epoch": 1634} {"train_loss": -12.309326171875, "global_step": 274639, "epoch": 1634} {"train_loss": -12.337091445922852, "global_step": 274640, "epoch": 1634} {"train_loss": -12.337303161621094, "global_step": 274641, "epoch": 1634} {"train_loss": -11.920101165771484, "global_step": 274642, "epoch": 1634} {"train_loss": -12.11362075805664, "global_step": 274643, "epoch": 1634} {"train_loss": -12.254682540893555, "global_step": 274644, "epoch": 1634} {"train_loss": -12.11996078491211, "global_step": 274645, "epoch": 1634} {"train_loss": -12.199649810791016, "global_step": 274646, "epoch": 1634} {"train_loss": -12.014689445495605, "global_step": 274647, "epoch": 1634} {"train_loss": -12.131519317626953, "global_step": 274648, "epoch": 1634} {"train_loss": -11.427379608154297, "global_step": 274649, "epoch": 1634} {"train_loss": -10.933307647705078, "global_step": 274650, "epoch": 1634} {"train_loss": -10.900936126708984, "global_step": 274651, "epoch": 1634} {"train_loss": -11.85003662109375, "global_step": 274652, "epoch": 1634} {"train_loss": -11.253328323364258, "global_step": 274653, "epoch": 1634} {"train_loss": -11.621049880981445, "global_step": 274654, "epoch": 1634} {"train_loss": -11.019742965698242, "global_step": 274655, "epoch": 1634} {"train_loss": -12.087657928466797, "global_step": 274656, "epoch": 1634} {"train_loss": -10.79544448852539, "global_step": 274657, "epoch": 1634} {"train_loss": -11.047412872314453, "global_step": 274658, "epoch": 1634} {"train_loss": -11.43073844909668, "global_step": 274659, "epoch": 1634} {"train_loss": -11.117029190063477, "global_step": 274660, "epoch": 1634} {"train_loss": -10.403404235839844, "global_step": 274661, "epoch": 1634} {"train_loss": -11.658689498901367, "global_step": 274662, "epoch": 1634} {"train_loss": -11.754417419433594, "global_step": 274663, "epoch": 1634} {"train_loss": -11.174781799316406, "global_step": 274664, "epoch": 1634} {"train_loss": -11.85849380493164, "global_step": 274665, "epoch": 1634} {"train_loss": -11.567244529724121, "global_step": 274666, "epoch": 1634} {"train_loss": -11.531763076782227, "global_step": 274667, "epoch": 1634} {"train_loss": -11.940471649169922, "global_step": 274668, "epoch": 1634} {"train_loss": -10.866601943969727, "global_step": 274669, "epoch": 1634} {"train_loss": -11.908180236816406, "global_step": 274670, "epoch": 1634} {"train_loss": -11.130478858947754, "global_step": 274671, "epoch": 1634} {"train_loss": -12.18731689453125, "global_step": 274672, "epoch": 1634} {"train_loss": -11.757027626037598, "global_step": 274673, "epoch": 1634} {"train_loss": -11.78958511352539, "global_step": 274674, "epoch": 1634} {"train_loss": -11.959383010864258, "global_step": 274675, "epoch": 1634} {"train_loss": -11.695405960083008, "global_step": 274676, "epoch": 1634} {"train_loss": -11.772976875305176, "global_step": 274677, "epoch": 1634} {"train_loss": -11.72022819519043, "global_step": 274678, "epoch": 1634} {"train_loss": -11.640514549754915, "global_step": 274679, "epoch": 1634, "val_loss": 268328.1875} {"train_loss": -11.810977935791016, "global_step": 274680, "epoch": 1635} {"train_loss": -11.3591947555542, "global_step": 274681, "epoch": 1635} {"train_loss": -11.31086540222168, "global_step": 274682, "epoch": 1635} {"train_loss": -11.681329727172852, "global_step": 274683, "epoch": 1635} {"train_loss": -11.894943237304688, "global_step": 274684, "epoch": 1635} {"train_loss": -11.142328262329102, "global_step": 274685, "epoch": 1635} {"train_loss": -10.510377883911133, "global_step": 274686, "epoch": 1635} {"train_loss": -10.890286445617676, "global_step": 274687, "epoch": 1635} {"train_loss": -11.2202787399292, "global_step": 274688, "epoch": 1635} {"train_loss": -10.581719398498535, "global_step": 274689, "epoch": 1635} {"train_loss": -10.269437789916992, "global_step": 274690, "epoch": 1635} {"train_loss": -10.556110382080078, "global_step": 274691, "epoch": 1635} {"train_loss": -10.779945373535156, "global_step": 274692, "epoch": 1635} {"train_loss": -9.876700401306152, "global_step": 274693, "epoch": 1635} {"train_loss": -10.925332069396973, "global_step": 274694, "epoch": 1635} {"train_loss": -10.593364715576172, "global_step": 274695, "epoch": 1635} {"train_loss": -10.185565948486328, "global_step": 274696, "epoch": 1635} {"train_loss": -10.080316543579102, "global_step": 274697, "epoch": 1635} {"train_loss": -11.332836151123047, "global_step": 274698, "epoch": 1635} {"train_loss": -10.296574592590332, "global_step": 274699, "epoch": 1635} {"train_loss": -11.005012512207031, "global_step": 274700, "epoch": 1635} {"train_loss": -10.61483097076416, "global_step": 274701, "epoch": 1635} {"train_loss": -9.922624588012695, "global_step": 274702, "epoch": 1635} {"train_loss": -11.420663833618164, "global_step": 274703, "epoch": 1635} {"train_loss": -9.640909194946289, "global_step": 274704, "epoch": 1635} {"train_loss": -11.067071914672852, "global_step": 274705, "epoch": 1635} {"train_loss": -10.286355018615723, "global_step": 274706, "epoch": 1635} {"train_loss": -9.9591703414917, "global_step": 274707, "epoch": 1635} {"train_loss": -11.315281867980957, "global_step": 274708, "epoch": 1635} {"train_loss": -10.993098258972168, "global_step": 274709, "epoch": 1635} {"train_loss": -10.99023723602295, "global_step": 274710, "epoch": 1635} {"train_loss": -10.927165985107422, "global_step": 274711, "epoch": 1635} {"train_loss": -11.127735137939453, "global_step": 274712, "epoch": 1635} {"train_loss": -11.036783218383789, "global_step": 274713, "epoch": 1635} {"train_loss": -11.662158012390137, "global_step": 274714, "epoch": 1635} {"train_loss": -10.837394714355469, "global_step": 274715, "epoch": 1635} {"train_loss": -11.64194107055664, "global_step": 274716, "epoch": 1635} {"train_loss": -11.553047180175781, "global_step": 274717, "epoch": 1635} {"train_loss": -11.05642318725586, "global_step": 274718, "epoch": 1635} {"train_loss": -11.752742767333984, "global_step": 274719, "epoch": 1635} {"train_loss": -11.609443664550781, "global_step": 274720, "epoch": 1635} {"train_loss": -11.333797454833984, "global_step": 274721, "epoch": 1635} {"train_loss": -11.700071334838867, "global_step": 274722, "epoch": 1635} {"train_loss": -11.452620506286621, "global_step": 274723, "epoch": 1635} {"train_loss": -11.64781379699707, "global_step": 274724, "epoch": 1635} {"train_loss": -11.370174407958984, "global_step": 274725, "epoch": 1635} {"train_loss": -11.677925109863281, "global_step": 274726, "epoch": 1635} {"train_loss": -11.541952133178711, "global_step": 274727, "epoch": 1635} {"train_loss": -11.686233520507812, "global_step": 274728, "epoch": 1635} {"train_loss": -11.815652847290039, "global_step": 274729, "epoch": 1635} {"train_loss": -11.513538360595703, "global_step": 274730, "epoch": 1635} {"train_loss": -11.81312370300293, "global_step": 274731, "epoch": 1635} {"train_loss": -11.672359466552734, "global_step": 274732, "epoch": 1635} {"train_loss": -11.824743270874023, "global_step": 274733, "epoch": 1635} {"train_loss": -11.68256950378418, "global_step": 274734, "epoch": 1635} {"train_loss": -11.836441993713379, "global_step": 274735, "epoch": 1635} {"train_loss": -11.593915939331055, "global_step": 274736, "epoch": 1635} {"train_loss": -11.90523910522461, "global_step": 274737, "epoch": 1635} {"train_loss": -12.049187660217285, "global_step": 274738, "epoch": 1635} {"train_loss": -11.925206184387207, "global_step": 274739, "epoch": 1635} {"train_loss": -11.893301963806152, "global_step": 274740, "epoch": 1635} {"train_loss": -11.851539611816406, "global_step": 274741, "epoch": 1635} {"train_loss": -12.130020141601562, "global_step": 274742, "epoch": 1635} {"train_loss": -12.120903015136719, "global_step": 274743, "epoch": 1635} {"train_loss": -11.89958381652832, "global_step": 274744, "epoch": 1635} {"train_loss": -11.985953330993652, "global_step": 274745, "epoch": 1635} {"train_loss": -12.019145011901855, "global_step": 274746, "epoch": 1635} {"train_loss": -11.865126609802246, "global_step": 274747, "epoch": 1635} {"train_loss": -12.335843086242676, "global_step": 274748, "epoch": 1635} {"train_loss": -11.942745208740234, "global_step": 274749, "epoch": 1635} {"train_loss": -11.80257797241211, "global_step": 274750, "epoch": 1635} {"train_loss": -12.16197395324707, "global_step": 274751, "epoch": 1635} {"train_loss": -12.2545747756958, "global_step": 274752, "epoch": 1635} {"train_loss": -12.15158748626709, "global_step": 274753, "epoch": 1635} {"train_loss": -12.113901138305664, "global_step": 274754, "epoch": 1635} {"train_loss": -11.995363235473633, "global_step": 274755, "epoch": 1635} {"train_loss": -12.088501930236816, "global_step": 274756, "epoch": 1635} {"train_loss": -12.2590970993042, "global_step": 274757, "epoch": 1635} {"train_loss": -12.100431442260742, "global_step": 274758, "epoch": 1635} {"train_loss": -12.17083740234375, "global_step": 274759, "epoch": 1635} {"train_loss": -12.038750648498535, "global_step": 274760, "epoch": 1635} {"train_loss": -12.115102767944336, "global_step": 274761, "epoch": 1635} {"train_loss": -12.247016906738281, "global_step": 274762, "epoch": 1635} {"train_loss": -12.086257934570312, "global_step": 274763, "epoch": 1635} {"train_loss": -12.291560173034668, "global_step": 274764, "epoch": 1635} {"train_loss": -12.220558166503906, "global_step": 274765, "epoch": 1635} {"train_loss": -12.385123252868652, "global_step": 274766, "epoch": 1635} {"train_loss": -12.21932315826416, "global_step": 274767, "epoch": 1635} {"train_loss": -12.396153450012207, "global_step": 274768, "epoch": 1635} {"train_loss": -12.114140510559082, "global_step": 274769, "epoch": 1635} {"train_loss": -12.177190780639648, "global_step": 274770, "epoch": 1635} {"train_loss": -12.25351619720459, "global_step": 274771, "epoch": 1635} {"train_loss": -12.084056854248047, "global_step": 274772, "epoch": 1635} {"train_loss": -12.252290725708008, "global_step": 274773, "epoch": 1635} {"train_loss": -12.23714828491211, "global_step": 274774, "epoch": 1635} {"train_loss": -12.013955116271973, "global_step": 274775, "epoch": 1635} {"train_loss": -11.833739280700684, "global_step": 274776, "epoch": 1635} {"train_loss": -12.40563678741455, "global_step": 274777, "epoch": 1635} {"train_loss": -11.936649322509766, "global_step": 274778, "epoch": 1635} {"train_loss": -12.046228408813477, "global_step": 274779, "epoch": 1635} {"train_loss": -11.620824813842773, "global_step": 274780, "epoch": 1635} {"train_loss": -12.139642715454102, "global_step": 274781, "epoch": 1635} {"train_loss": -11.30301284790039, "global_step": 274782, "epoch": 1635} {"train_loss": -10.851593017578125, "global_step": 274783, "epoch": 1635} {"train_loss": -11.382284164428711, "global_step": 274784, "epoch": 1635} {"train_loss": -11.996511459350586, "global_step": 274785, "epoch": 1635} {"train_loss": -11.880546569824219, "global_step": 274786, "epoch": 1635} {"train_loss": -11.962311744689941, "global_step": 274787, "epoch": 1635} {"train_loss": -11.58173942565918, "global_step": 274788, "epoch": 1635} {"train_loss": -12.017182350158691, "global_step": 274789, "epoch": 1635} {"train_loss": -11.831158638000488, "global_step": 274790, "epoch": 1635} {"train_loss": -11.7796630859375, "global_step": 274791, "epoch": 1635} {"train_loss": -11.857566833496094, "global_step": 274792, "epoch": 1635} {"train_loss": -12.037712097167969, "global_step": 274793, "epoch": 1635} {"train_loss": -11.749954223632812, "global_step": 274794, "epoch": 1635} {"train_loss": -11.694013595581055, "global_step": 274795, "epoch": 1635} {"train_loss": -11.584909439086914, "global_step": 274796, "epoch": 1635} {"train_loss": -12.16008186340332, "global_step": 274797, "epoch": 1635} {"train_loss": -11.902493476867676, "global_step": 274798, "epoch": 1635} {"train_loss": -12.17638111114502, "global_step": 274799, "epoch": 1635} {"train_loss": -12.075246810913086, "global_step": 274800, "epoch": 1635} {"train_loss": -11.847908973693848, "global_step": 274801, "epoch": 1635} {"train_loss": -12.246081352233887, "global_step": 274802, "epoch": 1635} {"train_loss": -11.841309547424316, "global_step": 274803, "epoch": 1635} {"train_loss": -11.843146324157715, "global_step": 274804, "epoch": 1635} {"train_loss": -11.915367126464844, "global_step": 274805, "epoch": 1635} {"train_loss": -10.727313995361328, "global_step": 274806, "epoch": 1635} {"train_loss": -12.089481353759766, "global_step": 274807, "epoch": 1635} {"train_loss": -11.80337905883789, "global_step": 274808, "epoch": 1635} {"train_loss": -11.947023391723633, "global_step": 274809, "epoch": 1635} {"train_loss": -11.739680290222168, "global_step": 274810, "epoch": 1635} {"train_loss": -11.554688453674316, "global_step": 274811, "epoch": 1635} {"train_loss": -11.323077201843262, "global_step": 274812, "epoch": 1635} {"train_loss": -12.022907257080078, "global_step": 274813, "epoch": 1635} {"train_loss": -12.217056274414062, "global_step": 274814, "epoch": 1635} {"train_loss": -11.593521118164062, "global_step": 274815, "epoch": 1635} {"train_loss": -10.871088027954102, "global_step": 274816, "epoch": 1635} {"train_loss": -11.230043411254883, "global_step": 274817, "epoch": 1635} {"train_loss": -12.06875228881836, "global_step": 274818, "epoch": 1635} {"train_loss": -9.341310501098633, "global_step": 274819, "epoch": 1635} {"train_loss": -9.185766220092773, "global_step": 274820, "epoch": 1635} {"train_loss": -12.12464714050293, "global_step": 274821, "epoch": 1635} {"train_loss": -9.482813835144043, "global_step": 274822, "epoch": 1635} {"train_loss": -9.717046737670898, "global_step": 274823, "epoch": 1635} {"train_loss": -10.244773864746094, "global_step": 274824, "epoch": 1635} {"train_loss": -8.464106559753418, "global_step": 274825, "epoch": 1635} {"train_loss": -9.372525215148926, "global_step": 274826, "epoch": 1635} {"train_loss": -11.39037799835205, "global_step": 274827, "epoch": 1635} {"train_loss": -7.586948871612549, "global_step": 274828, "epoch": 1635} {"train_loss": -8.3015718460083, "global_step": 274829, "epoch": 1635} {"train_loss": -9.045095443725586, "global_step": 274830, "epoch": 1635} {"train_loss": -9.873068809509277, "global_step": 274831, "epoch": 1635} {"train_loss": -8.57769775390625, "global_step": 274832, "epoch": 1635} {"train_loss": -9.131768226623535, "global_step": 274833, "epoch": 1635} {"train_loss": -9.637170791625977, "global_step": 274834, "epoch": 1635} {"train_loss": -9.408991813659668, "global_step": 274835, "epoch": 1635} {"train_loss": -8.94083023071289, "global_step": 274836, "epoch": 1635} {"train_loss": -9.863690376281738, "global_step": 274837, "epoch": 1635} {"train_loss": -9.506355285644531, "global_step": 274838, "epoch": 1635} {"train_loss": -7.945361137390137, "global_step": 274839, "epoch": 1635} {"train_loss": -7.597118377685547, "global_step": 274840, "epoch": 1635} {"train_loss": -7.1418914794921875, "global_step": 274841, "epoch": 1635} {"train_loss": -9.103788375854492, "global_step": 274842, "epoch": 1635} {"train_loss": -9.952713012695312, "global_step": 274843, "epoch": 1635} {"train_loss": -8.795228004455566, "global_step": 274844, "epoch": 1635} {"train_loss": -8.989144325256348, "global_step": 274845, "epoch": 1635} {"train_loss": -8.72031021118164, "global_step": 274846, "epoch": 1635} {"train_loss": -11.190017356759025, "global_step": 274847, "epoch": 1635, "val_loss": 270298.53125, "train_action_mse_error": 2.147954225540161} {"train_loss": -8.980695724487305, "global_step": 274848, "epoch": 1636} {"train_loss": -8.582919120788574, "global_step": 274849, "epoch": 1636} {"train_loss": -8.38457202911377, "global_step": 274850, "epoch": 1636} {"train_loss": -9.396669387817383, "global_step": 274851, "epoch": 1636} {"train_loss": -10.096461296081543, "global_step": 274852, "epoch": 1636} {"train_loss": -10.229133605957031, "global_step": 274853, "epoch": 1636} {"train_loss": -9.617073059082031, "global_step": 274854, "epoch": 1636} {"train_loss": -9.502758026123047, "global_step": 274855, "epoch": 1636} {"train_loss": -10.419289588928223, "global_step": 274856, "epoch": 1636} {"train_loss": -10.743555068969727, "global_step": 274857, "epoch": 1636} {"train_loss": -10.685646057128906, "global_step": 274858, "epoch": 1636} {"train_loss": -10.538557052612305, "global_step": 274859, "epoch": 1636} {"train_loss": -10.809037208557129, "global_step": 274860, "epoch": 1636} {"train_loss": -10.744585037231445, "global_step": 274861, "epoch": 1636} {"train_loss": -11.313055038452148, "global_step": 274862, "epoch": 1636} {"train_loss": -11.152215957641602, "global_step": 274863, "epoch": 1636} {"train_loss": -11.135370254516602, "global_step": 274864, "epoch": 1636} {"train_loss": -10.86301326751709, "global_step": 274865, "epoch": 1636} {"train_loss": -11.090643882751465, "global_step": 274866, "epoch": 1636} {"train_loss": -11.377934455871582, "global_step": 274867, "epoch": 1636} {"train_loss": -10.709716796875, "global_step": 274868, "epoch": 1636} {"train_loss": -11.26672077178955, "global_step": 274869, "epoch": 1636} {"train_loss": -11.170869827270508, "global_step": 274870, "epoch": 1636} {"train_loss": -11.269927978515625, "global_step": 274871, "epoch": 1636} {"train_loss": -11.30331039428711, "global_step": 274872, "epoch": 1636} {"train_loss": -11.25435733795166, "global_step": 274873, "epoch": 1636} {"train_loss": -11.216729164123535, "global_step": 274874, "epoch": 1636} {"train_loss": -11.417677879333496, "global_step": 274875, "epoch": 1636} {"train_loss": -11.225034713745117, "global_step": 274876, "epoch": 1636} {"train_loss": -11.279518127441406, "global_step": 274877, "epoch": 1636} {"train_loss": -11.621545791625977, "global_step": 274878, "epoch": 1636} {"train_loss": -11.48360538482666, "global_step": 274879, "epoch": 1636} {"train_loss": -11.474006652832031, "global_step": 274880, "epoch": 1636} {"train_loss": -11.615466117858887, "global_step": 274881, "epoch": 1636} {"train_loss": -11.64028549194336, "global_step": 274882, "epoch": 1636} {"train_loss": -11.554344177246094, "global_step": 274883, "epoch": 1636} {"train_loss": -11.627811431884766, "global_step": 274884, "epoch": 1636} {"train_loss": -11.609840393066406, "global_step": 274885, "epoch": 1636} {"train_loss": -11.776836395263672, "global_step": 274886, "epoch": 1636} {"train_loss": -11.765474319458008, "global_step": 274887, "epoch": 1636} {"train_loss": -11.64857292175293, "global_step": 274888, "epoch": 1636} {"train_loss": -11.730401992797852, "global_step": 274889, "epoch": 1636} {"train_loss": -11.833479881286621, "global_step": 274890, "epoch": 1636} {"train_loss": -11.711915016174316, "global_step": 274891, "epoch": 1636} {"train_loss": -11.636951446533203, "global_step": 274892, "epoch": 1636} {"train_loss": -11.578320503234863, "global_step": 274893, "epoch": 1636} {"train_loss": -11.811878204345703, "global_step": 274894, "epoch": 1636} {"train_loss": -11.920675277709961, "global_step": 274895, "epoch": 1636} {"train_loss": -11.871420860290527, "global_step": 274896, "epoch": 1636} {"train_loss": -11.75521469116211, "global_step": 274897, "epoch": 1636} {"train_loss": -11.699377059936523, "global_step": 274898, "epoch": 1636} {"train_loss": -11.970426559448242, "global_step": 274899, "epoch": 1636} {"train_loss": -11.7885103225708, "global_step": 274900, "epoch": 1636} {"train_loss": -11.840890884399414, "global_step": 274901, "epoch": 1636} {"train_loss": -11.87728500366211, "global_step": 274902, "epoch": 1636} {"train_loss": -11.94688892364502, "global_step": 274903, "epoch": 1636} {"train_loss": -12.05087661743164, "global_step": 274904, "epoch": 1636} {"train_loss": -11.955883026123047, "global_step": 274905, "epoch": 1636} {"train_loss": -11.769868850708008, "global_step": 274906, "epoch": 1636} {"train_loss": -12.01618480682373, "global_step": 274907, "epoch": 1636} {"train_loss": -12.031023979187012, "global_step": 274908, "epoch": 1636} {"train_loss": -12.021551132202148, "global_step": 274909, "epoch": 1636} {"train_loss": -11.917378425598145, "global_step": 274910, "epoch": 1636} {"train_loss": -12.01385498046875, "global_step": 274911, "epoch": 1636} {"train_loss": -11.891217231750488, "global_step": 274912, "epoch": 1636} {"train_loss": -11.995805740356445, "global_step": 274913, "epoch": 1636} {"train_loss": -11.991893768310547, "global_step": 274914, "epoch": 1636} {"train_loss": -12.059591293334961, "global_step": 274915, "epoch": 1636} {"train_loss": -12.135891914367676, "global_step": 274916, "epoch": 1636} {"train_loss": -11.763176918029785, "global_step": 274917, "epoch": 1636} {"train_loss": -12.121354103088379, "global_step": 274918, "epoch": 1636} {"train_loss": -12.121857643127441, "global_step": 274919, "epoch": 1636} {"train_loss": -11.782329559326172, "global_step": 274920, "epoch": 1636} {"train_loss": -12.14365005493164, "global_step": 274921, "epoch": 1636} {"train_loss": -12.06070327758789, "global_step": 274922, "epoch": 1636} {"train_loss": -12.109334945678711, "global_step": 274923, "epoch": 1636} {"train_loss": -12.042034149169922, "global_step": 274924, "epoch": 1636} {"train_loss": -12.109664916992188, "global_step": 274925, "epoch": 1636} {"train_loss": -12.250814437866211, "global_step": 274926, "epoch": 1636} {"train_loss": -12.186409950256348, "global_step": 274927, "epoch": 1636} {"train_loss": -12.264113426208496, "global_step": 274928, "epoch": 1636} {"train_loss": -12.192583084106445, "global_step": 274929, "epoch": 1636} {"train_loss": -12.086847305297852, "global_step": 274930, "epoch": 1636} {"train_loss": -12.108333587646484, "global_step": 274931, "epoch": 1636} {"train_loss": -12.163466453552246, "global_step": 274932, "epoch": 1636} {"train_loss": -12.289451599121094, "global_step": 274933, "epoch": 1636} {"train_loss": -12.030384063720703, "global_step": 274934, "epoch": 1636} {"train_loss": -12.240827560424805, "global_step": 274935, "epoch": 1636} {"train_loss": -12.00479507446289, "global_step": 274936, "epoch": 1636} {"train_loss": -12.407514572143555, "global_step": 274937, "epoch": 1636} {"train_loss": -12.324075698852539, "global_step": 274938, "epoch": 1636} {"train_loss": -12.27081298828125, "global_step": 274939, "epoch": 1636} {"train_loss": -12.205411911010742, "global_step": 274940, "epoch": 1636} {"train_loss": -12.421165466308594, "global_step": 274941, "epoch": 1636} {"train_loss": -12.403818130493164, "global_step": 274942, "epoch": 1636} {"train_loss": -12.454602241516113, "global_step": 274943, "epoch": 1636} {"train_loss": -12.373329162597656, "global_step": 274944, "epoch": 1636} {"train_loss": -12.280792236328125, "global_step": 274945, "epoch": 1636} {"train_loss": -12.364845275878906, "global_step": 274946, "epoch": 1636} {"train_loss": -12.463064193725586, "global_step": 274947, "epoch": 1636} {"train_loss": -12.518227577209473, "global_step": 274948, "epoch": 1636} {"train_loss": -12.415473937988281, "global_step": 274949, "epoch": 1636} {"train_loss": -12.346541404724121, "global_step": 274950, "epoch": 1636} {"train_loss": -12.384493827819824, "global_step": 274951, "epoch": 1636} {"train_loss": -12.359029769897461, "global_step": 274952, "epoch": 1636} {"train_loss": -12.150979042053223, "global_step": 274953, "epoch": 1636} {"train_loss": -11.944835662841797, "global_step": 274954, "epoch": 1636} {"train_loss": -11.854973793029785, "global_step": 274955, "epoch": 1636} {"train_loss": -12.30571460723877, "global_step": 274956, "epoch": 1636} {"train_loss": -12.18095874786377, "global_step": 274957, "epoch": 1636} {"train_loss": -11.831672668457031, "global_step": 274958, "epoch": 1636} {"train_loss": -10.57784652709961, "global_step": 274959, "epoch": 1636} {"train_loss": -10.543355941772461, "global_step": 274960, "epoch": 1636} {"train_loss": -9.443730354309082, "global_step": 274961, "epoch": 1636} {"train_loss": -11.248689651489258, "global_step": 274962, "epoch": 1636} {"train_loss": -9.947515487670898, "global_step": 274963, "epoch": 1636} {"train_loss": -7.84841775894165, "global_step": 274964, "epoch": 1636} {"train_loss": -11.554960250854492, "global_step": 274965, "epoch": 1636} {"train_loss": -9.567296028137207, "global_step": 274966, "epoch": 1636} {"train_loss": -9.888486862182617, "global_step": 274967, "epoch": 1636} {"train_loss": -11.086464881896973, "global_step": 274968, "epoch": 1636} {"train_loss": -8.561174392700195, "global_step": 274969, "epoch": 1636} {"train_loss": -11.33082389831543, "global_step": 274970, "epoch": 1636} {"train_loss": -10.222249984741211, "global_step": 274971, "epoch": 1636} {"train_loss": -10.288850784301758, "global_step": 274972, "epoch": 1636} {"train_loss": -11.017221450805664, "global_step": 274973, "epoch": 1636} {"train_loss": -9.009544372558594, "global_step": 274974, "epoch": 1636} {"train_loss": -10.646187782287598, "global_step": 274975, "epoch": 1636} {"train_loss": -11.279212951660156, "global_step": 274976, "epoch": 1636} {"train_loss": -8.799003601074219, "global_step": 274977, "epoch": 1636} {"train_loss": -10.490379333496094, "global_step": 274978, "epoch": 1636} {"train_loss": -9.645486831665039, "global_step": 274979, "epoch": 1636} {"train_loss": -9.081456184387207, "global_step": 274980, "epoch": 1636} {"train_loss": -8.737548828125, "global_step": 274981, "epoch": 1636} {"train_loss": -10.888568878173828, "global_step": 274982, "epoch": 1636} {"train_loss": -9.222959518432617, "global_step": 274983, "epoch": 1636} {"train_loss": -9.082992553710938, "global_step": 274984, "epoch": 1636} {"train_loss": -11.187374114990234, "global_step": 274985, "epoch": 1636} {"train_loss": -9.268352508544922, "global_step": 274986, "epoch": 1636} {"train_loss": -10.407820701599121, "global_step": 274987, "epoch": 1636} {"train_loss": -11.192642211914062, "global_step": 274988, "epoch": 1636} {"train_loss": -9.912334442138672, "global_step": 274989, "epoch": 1636} {"train_loss": -10.36707878112793, "global_step": 274990, "epoch": 1636} {"train_loss": -11.07595443725586, "global_step": 274991, "epoch": 1636} {"train_loss": -10.418767929077148, "global_step": 274992, "epoch": 1636} {"train_loss": -10.217287063598633, "global_step": 274993, "epoch": 1636} {"train_loss": -11.287168502807617, "global_step": 274994, "epoch": 1636} {"train_loss": -10.761100769042969, "global_step": 274995, "epoch": 1636} {"train_loss": -10.606451034545898, "global_step": 274996, "epoch": 1636} {"train_loss": -11.435402870178223, "global_step": 274997, "epoch": 1636} {"train_loss": -11.197894096374512, "global_step": 274998, "epoch": 1636} {"train_loss": -11.10466194152832, "global_step": 274999, "epoch": 1636} {"train_loss": -11.143181800842285, "global_step": 275000, "epoch": 1636} {"train_loss": -11.046073913574219, "global_step": 275001, "epoch": 1636} {"train_loss": -11.534612655639648, "global_step": 275002, "epoch": 1636} {"train_loss": -11.36915397644043, "global_step": 275003, "epoch": 1636} {"train_loss": -11.59402084350586, "global_step": 275004, "epoch": 1636} {"train_loss": -11.084159851074219, "global_step": 275005, "epoch": 1636} {"train_loss": -11.744829177856445, "global_step": 275006, "epoch": 1636} {"train_loss": -11.495742797851562, "global_step": 275007, "epoch": 1636} {"train_loss": -11.557777404785156, "global_step": 275008, "epoch": 1636} {"train_loss": -11.543335914611816, "global_step": 275009, "epoch": 1636} {"train_loss": -11.577919006347656, "global_step": 275010, "epoch": 1636} {"train_loss": -11.871587753295898, "global_step": 275011, "epoch": 1636} {"train_loss": -11.503213882446289, "global_step": 275012, "epoch": 1636} {"train_loss": -11.724977493286133, "global_step": 275013, "epoch": 1636} {"train_loss": -11.82707405090332, "global_step": 275014, "epoch": 1636} {"train_loss": -11.283808898358117, "global_step": 275015, "epoch": 1636, "val_loss": 269849.125} {"train_loss": -11.816400527954102, "global_step": 275016, "epoch": 1637} {"train_loss": -11.954812049865723, "global_step": 275017, "epoch": 1637} {"train_loss": -11.811090469360352, "global_step": 275018, "epoch": 1637} {"train_loss": -11.902950286865234, "global_step": 275019, "epoch": 1637} {"train_loss": -11.695051193237305, "global_step": 275020, "epoch": 1637} {"train_loss": -11.746038436889648, "global_step": 275021, "epoch": 1637} {"train_loss": -11.897846221923828, "global_step": 275022, "epoch": 1637} {"train_loss": -11.82925033569336, "global_step": 275023, "epoch": 1637} {"train_loss": -11.948984146118164, "global_step": 275024, "epoch": 1637} {"train_loss": -11.761077880859375, "global_step": 275025, "epoch": 1637} {"train_loss": -12.033269882202148, "global_step": 275026, "epoch": 1637} {"train_loss": -11.841079711914062, "global_step": 275027, "epoch": 1637} {"train_loss": -11.971839904785156, "global_step": 275028, "epoch": 1637} {"train_loss": -12.015098571777344, "global_step": 275029, "epoch": 1637} {"train_loss": -12.000152587890625, "global_step": 275030, "epoch": 1637} {"train_loss": -11.931450843811035, "global_step": 275031, "epoch": 1637} {"train_loss": -11.925277709960938, "global_step": 275032, "epoch": 1637} {"train_loss": -12.015342712402344, "global_step": 275033, "epoch": 1637} {"train_loss": -11.889713287353516, "global_step": 275034, "epoch": 1637} {"train_loss": -12.012587547302246, "global_step": 275035, "epoch": 1637} {"train_loss": -12.145933151245117, "global_step": 275036, "epoch": 1637} {"train_loss": -12.137130737304688, "global_step": 275037, "epoch": 1637} {"train_loss": -11.914834022521973, "global_step": 275038, "epoch": 1637} {"train_loss": -12.237133979797363, "global_step": 275039, "epoch": 1637} {"train_loss": -12.102157592773438, "global_step": 275040, "epoch": 1637} {"train_loss": -12.137101173400879, "global_step": 275041, "epoch": 1637} {"train_loss": -11.89228630065918, "global_step": 275042, "epoch": 1637} {"train_loss": -12.170167922973633, "global_step": 275043, "epoch": 1637} {"train_loss": -11.894728660583496, "global_step": 275044, "epoch": 1637} {"train_loss": -12.14432144165039, "global_step": 275045, "epoch": 1637} {"train_loss": -12.025555610656738, "global_step": 275046, "epoch": 1637} {"train_loss": -12.018877029418945, "global_step": 275047, "epoch": 1637} {"train_loss": -12.063333511352539, "global_step": 275048, "epoch": 1637} {"train_loss": -12.226140975952148, "global_step": 275049, "epoch": 1637} {"train_loss": -12.01828384399414, "global_step": 275050, "epoch": 1637} {"train_loss": -12.028409957885742, "global_step": 275051, "epoch": 1637} {"train_loss": -11.712963104248047, "global_step": 275052, "epoch": 1637} {"train_loss": -11.897299766540527, "global_step": 275053, "epoch": 1637} {"train_loss": -12.105987548828125, "global_step": 275054, "epoch": 1637} {"train_loss": -12.156709671020508, "global_step": 275055, "epoch": 1637} {"train_loss": -12.315303802490234, "global_step": 275056, "epoch": 1637} {"train_loss": -12.19533920288086, "global_step": 275057, "epoch": 1637} {"train_loss": -12.275940895080566, "global_step": 275058, "epoch": 1637} {"train_loss": -12.284551620483398, "global_step": 275059, "epoch": 1637} {"train_loss": -12.377448081970215, "global_step": 275060, "epoch": 1637} {"train_loss": -12.174629211425781, "global_step": 275061, "epoch": 1637} {"train_loss": -12.339069366455078, "global_step": 275062, "epoch": 1637} {"train_loss": -12.195917129516602, "global_step": 275063, "epoch": 1637} {"train_loss": -12.272293090820312, "global_step": 275064, "epoch": 1637} {"train_loss": -12.227609634399414, "global_step": 275065, "epoch": 1637} {"train_loss": -12.464838027954102, "global_step": 275066, "epoch": 1637} {"train_loss": -12.436273574829102, "global_step": 275067, "epoch": 1637} {"train_loss": -12.408270835876465, "global_step": 275068, "epoch": 1637} {"train_loss": -12.193876266479492, "global_step": 275069, "epoch": 1637} {"train_loss": -12.445545196533203, "global_step": 275070, "epoch": 1637} {"train_loss": -12.287225723266602, "global_step": 275071, "epoch": 1637} {"train_loss": -12.381402969360352, "global_step": 275072, "epoch": 1637} {"train_loss": -12.352787017822266, "global_step": 275073, "epoch": 1637} {"train_loss": -12.334321975708008, "global_step": 275074, "epoch": 1637} {"train_loss": -12.09107780456543, "global_step": 275075, "epoch": 1637} {"train_loss": -12.089883804321289, "global_step": 275076, "epoch": 1637} {"train_loss": -12.195247650146484, "global_step": 275077, "epoch": 1637} {"train_loss": -11.99160385131836, "global_step": 275078, "epoch": 1637} {"train_loss": -11.894758224487305, "global_step": 275079, "epoch": 1637} {"train_loss": -11.887929916381836, "global_step": 275080, "epoch": 1637} {"train_loss": -12.461160659790039, "global_step": 275081, "epoch": 1637} {"train_loss": -12.199614524841309, "global_step": 275082, "epoch": 1637} {"train_loss": -12.173286437988281, "global_step": 275083, "epoch": 1637} {"train_loss": -12.432794570922852, "global_step": 275084, "epoch": 1637} {"train_loss": -12.233986854553223, "global_step": 275085, "epoch": 1637} {"train_loss": -12.305461883544922, "global_step": 275086, "epoch": 1637} {"train_loss": -12.409032821655273, "global_step": 275087, "epoch": 1637} {"train_loss": -12.005905151367188, "global_step": 275088, "epoch": 1637} {"train_loss": -12.155117988586426, "global_step": 275089, "epoch": 1637} {"train_loss": -12.208779335021973, "global_step": 275090, "epoch": 1637} {"train_loss": -11.850814819335938, "global_step": 275091, "epoch": 1637} {"train_loss": -12.192710876464844, "global_step": 275092, "epoch": 1637} {"train_loss": -12.358634948730469, "global_step": 275093, "epoch": 1637} {"train_loss": -11.597551345825195, "global_step": 275094, "epoch": 1637} {"train_loss": -12.000244140625, "global_step": 275095, "epoch": 1637} {"train_loss": -12.080568313598633, "global_step": 275096, "epoch": 1637} {"train_loss": -10.660171508789062, "global_step": 275097, "epoch": 1637} {"train_loss": -10.868820190429688, "global_step": 275098, "epoch": 1637} {"train_loss": -11.737224578857422, "global_step": 275099, "epoch": 1637} {"train_loss": -10.286094665527344, "global_step": 275100, "epoch": 1637} {"train_loss": -11.186820983886719, "global_step": 275101, "epoch": 1637} {"train_loss": -11.85583782196045, "global_step": 275102, "epoch": 1637} {"train_loss": -11.12700366973877, "global_step": 275103, "epoch": 1637} {"train_loss": -11.206869125366211, "global_step": 275104, "epoch": 1637} {"train_loss": -11.745281219482422, "global_step": 275105, "epoch": 1637} {"train_loss": -9.983369827270508, "global_step": 275106, "epoch": 1637} {"train_loss": -11.54090404510498, "global_step": 275107, "epoch": 1637} {"train_loss": -11.218873977661133, "global_step": 275108, "epoch": 1637} {"train_loss": -11.005897521972656, "global_step": 275109, "epoch": 1637} {"train_loss": -11.363359451293945, "global_step": 275110, "epoch": 1637} {"train_loss": -10.550750732421875, "global_step": 275111, "epoch": 1637} {"train_loss": -11.55971908569336, "global_step": 275112, "epoch": 1637} {"train_loss": -9.84644889831543, "global_step": 275113, "epoch": 1637} {"train_loss": -11.01793098449707, "global_step": 275114, "epoch": 1637} {"train_loss": -11.53705883026123, "global_step": 275115, "epoch": 1637} {"train_loss": -10.7891845703125, "global_step": 275116, "epoch": 1637} {"train_loss": -11.654701232910156, "global_step": 275117, "epoch": 1637} {"train_loss": -11.488492965698242, "global_step": 275118, "epoch": 1637} {"train_loss": -10.663375854492188, "global_step": 275119, "epoch": 1637} {"train_loss": -11.32979679107666, "global_step": 275120, "epoch": 1637} {"train_loss": -11.709891319274902, "global_step": 275121, "epoch": 1637} {"train_loss": -10.636065483093262, "global_step": 275122, "epoch": 1637} {"train_loss": -11.49327564239502, "global_step": 275123, "epoch": 1637} {"train_loss": -11.911879539489746, "global_step": 275124, "epoch": 1637} {"train_loss": -10.386310577392578, "global_step": 275125, "epoch": 1637} {"train_loss": -11.674368858337402, "global_step": 275126, "epoch": 1637} {"train_loss": -11.310428619384766, "global_step": 275127, "epoch": 1637} {"train_loss": -11.421642303466797, "global_step": 275128, "epoch": 1637} {"train_loss": -11.46460247039795, "global_step": 275129, "epoch": 1637} {"train_loss": -11.017141342163086, "global_step": 275130, "epoch": 1637} {"train_loss": -12.029420852661133, "global_step": 275131, "epoch": 1637} {"train_loss": -11.418403625488281, "global_step": 275132, "epoch": 1637} {"train_loss": -11.55894947052002, "global_step": 275133, "epoch": 1637} {"train_loss": -10.976604461669922, "global_step": 275134, "epoch": 1637} {"train_loss": -11.851364135742188, "global_step": 275135, "epoch": 1637} {"train_loss": -10.786271095275879, "global_step": 275136, "epoch": 1637} {"train_loss": -11.153116226196289, "global_step": 275137, "epoch": 1637} {"train_loss": -11.703607559204102, "global_step": 275138, "epoch": 1637} {"train_loss": -10.784425735473633, "global_step": 275139, "epoch": 1637} {"train_loss": -11.820795059204102, "global_step": 275140, "epoch": 1637} {"train_loss": -10.271814346313477, "global_step": 275141, "epoch": 1637} {"train_loss": -11.825763702392578, "global_step": 275142, "epoch": 1637} {"train_loss": -10.72389030456543, "global_step": 275143, "epoch": 1637} {"train_loss": -11.59670352935791, "global_step": 275144, "epoch": 1637} {"train_loss": -11.121140480041504, "global_step": 275145, "epoch": 1637} {"train_loss": -11.09443187713623, "global_step": 275146, "epoch": 1637} {"train_loss": -11.81762409210205, "global_step": 275147, "epoch": 1637} {"train_loss": -10.787630081176758, "global_step": 275148, "epoch": 1637} {"train_loss": -11.767053604125977, "global_step": 275149, "epoch": 1637} {"train_loss": -10.869449615478516, "global_step": 275150, "epoch": 1637} {"train_loss": -11.651823997497559, "global_step": 275151, "epoch": 1637} {"train_loss": -11.455663681030273, "global_step": 275152, "epoch": 1637} {"train_loss": -11.673412322998047, "global_step": 275153, "epoch": 1637} {"train_loss": -11.580824851989746, "global_step": 275154, "epoch": 1637} {"train_loss": -11.491279602050781, "global_step": 275155, "epoch": 1637} {"train_loss": -11.249417304992676, "global_step": 275156, "epoch": 1637} {"train_loss": -11.703383445739746, "global_step": 275157, "epoch": 1637} {"train_loss": -10.969871520996094, "global_step": 275158, "epoch": 1637} {"train_loss": -11.604496002197266, "global_step": 275159, "epoch": 1637} {"train_loss": -11.275298118591309, "global_step": 275160, "epoch": 1637} {"train_loss": -11.606575012207031, "global_step": 275161, "epoch": 1637} {"train_loss": -11.112874984741211, "global_step": 275162, "epoch": 1637} {"train_loss": -11.734832763671875, "global_step": 275163, "epoch": 1637} {"train_loss": -11.144349098205566, "global_step": 275164, "epoch": 1637} {"train_loss": -11.585676193237305, "global_step": 275165, "epoch": 1637} {"train_loss": -10.947722434997559, "global_step": 275166, "epoch": 1637} {"train_loss": -11.910451889038086, "global_step": 275167, "epoch": 1637} {"train_loss": -11.767890930175781, "global_step": 275168, "epoch": 1637} {"train_loss": -11.461524963378906, "global_step": 275169, "epoch": 1637} {"train_loss": -11.764622688293457, "global_step": 275170, "epoch": 1637} {"train_loss": -11.253686904907227, "global_step": 275171, "epoch": 1637} {"train_loss": -11.376317977905273, "global_step": 275172, "epoch": 1637} {"train_loss": -11.675779342651367, "global_step": 275173, "epoch": 1637} {"train_loss": -11.511338233947754, "global_step": 275174, "epoch": 1637} {"train_loss": -11.185747146606445, "global_step": 275175, "epoch": 1637} {"train_loss": -11.392757415771484, "global_step": 275176, "epoch": 1637} {"train_loss": -11.376846313476562, "global_step": 275177, "epoch": 1637} {"train_loss": -11.623398780822754, "global_step": 275178, "epoch": 1637} {"train_loss": -11.392242431640625, "global_step": 275179, "epoch": 1637} {"train_loss": -11.66578483581543, "global_step": 275180, "epoch": 1637} {"train_loss": -11.617792129516602, "global_step": 275181, "epoch": 1637} {"train_loss": -11.630559921264648, "global_step": 275182, "epoch": 1637} {"train_loss": -11.690952891395206, "global_step": 275183, "epoch": 1637, "val_loss": 271306.96875} {"train_loss": -11.338227272033691, "global_step": 275184, "epoch": 1638} {"train_loss": -11.87108039855957, "global_step": 275185, "epoch": 1638} {"train_loss": -11.620071411132812, "global_step": 275186, "epoch": 1638} {"train_loss": -11.954421997070312, "global_step": 275187, "epoch": 1638} {"train_loss": -11.600025177001953, "global_step": 275188, "epoch": 1638} {"train_loss": -11.87508773803711, "global_step": 275189, "epoch": 1638} {"train_loss": -11.735840797424316, "global_step": 275190, "epoch": 1638} {"train_loss": -11.828332901000977, "global_step": 275191, "epoch": 1638} {"train_loss": -12.035980224609375, "global_step": 275192, "epoch": 1638} {"train_loss": -11.928598403930664, "global_step": 275193, "epoch": 1638} {"train_loss": -12.13336181640625, "global_step": 275194, "epoch": 1638} {"train_loss": -11.949075698852539, "global_step": 275195, "epoch": 1638} {"train_loss": -12.06999683380127, "global_step": 275196, "epoch": 1638} {"train_loss": -11.7736234664917, "global_step": 275197, "epoch": 1638} {"train_loss": -11.936418533325195, "global_step": 275198, "epoch": 1638} {"train_loss": -11.7264404296875, "global_step": 275199, "epoch": 1638} {"train_loss": -11.967254638671875, "global_step": 275200, "epoch": 1638} {"train_loss": -11.989363670349121, "global_step": 275201, "epoch": 1638} {"train_loss": -12.025769233703613, "global_step": 275202, "epoch": 1638} {"train_loss": -11.868372917175293, "global_step": 275203, "epoch": 1638} {"train_loss": -12.058361053466797, "global_step": 275204, "epoch": 1638} {"train_loss": -11.979776382446289, "global_step": 275205, "epoch": 1638} {"train_loss": -11.868316650390625, "global_step": 275206, "epoch": 1638} {"train_loss": -11.991937637329102, "global_step": 275207, "epoch": 1638} {"train_loss": -12.038459777832031, "global_step": 275208, "epoch": 1638} {"train_loss": -12.182561874389648, "global_step": 275209, "epoch": 1638} {"train_loss": -12.101480484008789, "global_step": 275210, "epoch": 1638} {"train_loss": -12.178279876708984, "global_step": 275211, "epoch": 1638} {"train_loss": -12.128490447998047, "global_step": 275212, "epoch": 1638} {"train_loss": -12.14842414855957, "global_step": 275213, "epoch": 1638} {"train_loss": -12.21268081665039, "global_step": 275214, "epoch": 1638} {"train_loss": -12.248527526855469, "global_step": 275215, "epoch": 1638} {"train_loss": -12.204978942871094, "global_step": 275216, "epoch": 1638} {"train_loss": -12.287657737731934, "global_step": 275217, "epoch": 1638} {"train_loss": -12.123636245727539, "global_step": 275218, "epoch": 1638} {"train_loss": -12.110372543334961, "global_step": 275219, "epoch": 1638} {"train_loss": -12.267914772033691, "global_step": 275220, "epoch": 1638} {"train_loss": -12.159422874450684, "global_step": 275221, "epoch": 1638} {"train_loss": -11.938016891479492, "global_step": 275222, "epoch": 1638} {"train_loss": -12.256296157836914, "global_step": 275223, "epoch": 1638} {"train_loss": -12.313032150268555, "global_step": 275224, "epoch": 1638} {"train_loss": -12.125527381896973, "global_step": 275225, "epoch": 1638} {"train_loss": -12.269575119018555, "global_step": 275226, "epoch": 1638} {"train_loss": -12.458606719970703, "global_step": 275227, "epoch": 1638} {"train_loss": -12.327125549316406, "global_step": 275228, "epoch": 1638} {"train_loss": -12.375982284545898, "global_step": 275229, "epoch": 1638} {"train_loss": -12.36703109741211, "global_step": 275230, "epoch": 1638} {"train_loss": -12.27130126953125, "global_step": 275231, "epoch": 1638} {"train_loss": -12.208247184753418, "global_step": 275232, "epoch": 1638} {"train_loss": -12.31873893737793, "global_step": 275233, "epoch": 1638} {"train_loss": -12.404769897460938, "global_step": 275234, "epoch": 1638} {"train_loss": -12.25194263458252, "global_step": 275235, "epoch": 1638} {"train_loss": -12.19340705871582, "global_step": 275236, "epoch": 1638} {"train_loss": -12.309322357177734, "global_step": 275237, "epoch": 1638} {"train_loss": -12.294622421264648, "global_step": 275238, "epoch": 1638} {"train_loss": -12.24462890625, "global_step": 275239, "epoch": 1638} {"train_loss": -12.35034465789795, "global_step": 275240, "epoch": 1638} {"train_loss": -12.327367782592773, "global_step": 275241, "epoch": 1638} {"train_loss": -12.134021759033203, "global_step": 275242, "epoch": 1638} {"train_loss": -12.373311996459961, "global_step": 275243, "epoch": 1638} {"train_loss": -12.183280944824219, "global_step": 275244, "epoch": 1638} {"train_loss": -12.33843994140625, "global_step": 275245, "epoch": 1638} {"train_loss": -12.309492111206055, "global_step": 275246, "epoch": 1638} {"train_loss": -12.444574356079102, "global_step": 275247, "epoch": 1638} {"train_loss": -12.358955383300781, "global_step": 275248, "epoch": 1638} {"train_loss": -12.177069664001465, "global_step": 275249, "epoch": 1638} {"train_loss": -12.374717712402344, "global_step": 275250, "epoch": 1638} {"train_loss": -12.458040237426758, "global_step": 275251, "epoch": 1638} {"train_loss": -12.027292251586914, "global_step": 275252, "epoch": 1638} {"train_loss": -12.449756622314453, "global_step": 275253, "epoch": 1638} {"train_loss": -12.109407424926758, "global_step": 275254, "epoch": 1638} {"train_loss": -12.45504379272461, "global_step": 275255, "epoch": 1638} {"train_loss": -12.364701271057129, "global_step": 275256, "epoch": 1638} {"train_loss": -12.09694766998291, "global_step": 275257, "epoch": 1638} {"train_loss": -12.106340408325195, "global_step": 275258, "epoch": 1638} {"train_loss": -12.48038387298584, "global_step": 275259, "epoch": 1638} {"train_loss": -12.371864318847656, "global_step": 275260, "epoch": 1638} {"train_loss": -12.433595657348633, "global_step": 275261, "epoch": 1638} {"train_loss": -12.10244369506836, "global_step": 275262, "epoch": 1638} {"train_loss": -12.354347229003906, "global_step": 275263, "epoch": 1638} {"train_loss": -12.083273887634277, "global_step": 275264, "epoch": 1638} {"train_loss": -11.926346778869629, "global_step": 275265, "epoch": 1638} {"train_loss": -12.236984252929688, "global_step": 275266, "epoch": 1638} {"train_loss": -12.353229522705078, "global_step": 275267, "epoch": 1638} {"train_loss": -11.794979095458984, "global_step": 275268, "epoch": 1638} {"train_loss": -11.234442710876465, "global_step": 275269, "epoch": 1638} {"train_loss": -11.678905487060547, "global_step": 275270, "epoch": 1638} {"train_loss": -11.134489059448242, "global_step": 275271, "epoch": 1638} {"train_loss": -11.41562271118164, "global_step": 275272, "epoch": 1638} {"train_loss": -10.277436256408691, "global_step": 275273, "epoch": 1638} {"train_loss": -11.903045654296875, "global_step": 275274, "epoch": 1638} {"train_loss": -9.442604064941406, "global_step": 275275, "epoch": 1638} {"train_loss": -9.962385177612305, "global_step": 275276, "epoch": 1638} {"train_loss": -10.231216430664062, "global_step": 275277, "epoch": 1638} {"train_loss": -9.177515983581543, "global_step": 275278, "epoch": 1638} {"train_loss": -10.930176734924316, "global_step": 275279, "epoch": 1638} {"train_loss": -10.446310043334961, "global_step": 275280, "epoch": 1638} {"train_loss": -10.662099838256836, "global_step": 275281, "epoch": 1638} {"train_loss": -11.128210067749023, "global_step": 275282, "epoch": 1638} {"train_loss": -11.665630340576172, "global_step": 275283, "epoch": 1638} {"train_loss": -11.616934776306152, "global_step": 275284, "epoch": 1638} {"train_loss": -11.203422546386719, "global_step": 275285, "epoch": 1638} {"train_loss": -11.399687767028809, "global_step": 275286, "epoch": 1638} {"train_loss": -11.676628112792969, "global_step": 275287, "epoch": 1638} {"train_loss": -11.655652046203613, "global_step": 275288, "epoch": 1638} {"train_loss": -11.428763389587402, "global_step": 275289, "epoch": 1638} {"train_loss": -11.821722030639648, "global_step": 275290, "epoch": 1638} {"train_loss": -11.481124877929688, "global_step": 275291, "epoch": 1638} {"train_loss": -11.306053161621094, "global_step": 275292, "epoch": 1638} {"train_loss": -11.40931510925293, "global_step": 275293, "epoch": 1638} {"train_loss": -11.044161796569824, "global_step": 275294, "epoch": 1638} {"train_loss": -11.321111679077148, "global_step": 275295, "epoch": 1638} {"train_loss": -10.161576271057129, "global_step": 275296, "epoch": 1638} {"train_loss": -11.247867584228516, "global_step": 275297, "epoch": 1638} {"train_loss": -11.174654006958008, "global_step": 275298, "epoch": 1638} {"train_loss": -10.562553405761719, "global_step": 275299, "epoch": 1638} {"train_loss": -11.756254196166992, "global_step": 275300, "epoch": 1638} {"train_loss": -10.133039474487305, "global_step": 275301, "epoch": 1638} {"train_loss": -11.519170761108398, "global_step": 275302, "epoch": 1638} {"train_loss": -10.949661254882812, "global_step": 275303, "epoch": 1638} {"train_loss": -11.368881225585938, "global_step": 275304, "epoch": 1638} {"train_loss": -11.45881462097168, "global_step": 275305, "epoch": 1638} {"train_loss": -10.467716217041016, "global_step": 275306, "epoch": 1638} {"train_loss": -10.985662460327148, "global_step": 275307, "epoch": 1638} {"train_loss": -10.878469467163086, "global_step": 275308, "epoch": 1638} {"train_loss": -10.723976135253906, "global_step": 275309, "epoch": 1638} {"train_loss": -11.222192764282227, "global_step": 275310, "epoch": 1638} {"train_loss": -10.84277057647705, "global_step": 275311, "epoch": 1638} {"train_loss": -11.418817520141602, "global_step": 275312, "epoch": 1638} {"train_loss": -11.209175109863281, "global_step": 275313, "epoch": 1638} {"train_loss": -11.540846824645996, "global_step": 275314, "epoch": 1638} {"train_loss": -11.401603698730469, "global_step": 275315, "epoch": 1638} {"train_loss": -11.445566177368164, "global_step": 275316, "epoch": 1638} {"train_loss": -11.481008529663086, "global_step": 275317, "epoch": 1638} {"train_loss": -11.3544282913208, "global_step": 275318, "epoch": 1638} {"train_loss": -11.93244457244873, "global_step": 275319, "epoch": 1638} {"train_loss": -11.351360321044922, "global_step": 275320, "epoch": 1638} {"train_loss": -11.703119277954102, "global_step": 275321, "epoch": 1638} {"train_loss": -11.676130294799805, "global_step": 275322, "epoch": 1638} {"train_loss": -11.607433319091797, "global_step": 275323, "epoch": 1638} {"train_loss": -11.736976623535156, "global_step": 275324, "epoch": 1638} {"train_loss": -11.421649932861328, "global_step": 275325, "epoch": 1638} {"train_loss": -11.608152389526367, "global_step": 275326, "epoch": 1638} {"train_loss": -11.91057014465332, "global_step": 275327, "epoch": 1638} {"train_loss": -11.504236221313477, "global_step": 275328, "epoch": 1638} {"train_loss": -11.677644729614258, "global_step": 275329, "epoch": 1638} {"train_loss": -11.468420028686523, "global_step": 275330, "epoch": 1638} {"train_loss": -11.818770408630371, "global_step": 275331, "epoch": 1638} {"train_loss": -11.807506561279297, "global_step": 275332, "epoch": 1638} {"train_loss": -11.852788925170898, "global_step": 275333, "epoch": 1638} {"train_loss": -11.755675315856934, "global_step": 275334, "epoch": 1638} {"train_loss": -12.048739433288574, "global_step": 275335, "epoch": 1638} {"train_loss": -11.891895294189453, "global_step": 275336, "epoch": 1638} {"train_loss": -11.8848876953125, "global_step": 275337, "epoch": 1638} {"train_loss": -12.025712966918945, "global_step": 275338, "epoch": 1638} {"train_loss": -11.783451080322266, "global_step": 275339, "epoch": 1638} {"train_loss": -12.00812816619873, "global_step": 275340, "epoch": 1638} {"train_loss": -11.90075397491455, "global_step": 275341, "epoch": 1638} {"train_loss": -11.941314697265625, "global_step": 275342, "epoch": 1638} {"train_loss": -11.887426376342773, "global_step": 275343, "epoch": 1638} {"train_loss": -12.04273796081543, "global_step": 275344, "epoch": 1638} {"train_loss": -12.220504760742188, "global_step": 275345, "epoch": 1638} {"train_loss": -12.105043411254883, "global_step": 275346, "epoch": 1638} {"train_loss": -12.017699241638184, "global_step": 275347, "epoch": 1638} {"train_loss": -12.11524772644043, "global_step": 275348, "epoch": 1638} {"train_loss": -12.09391975402832, "global_step": 275349, "epoch": 1638} {"train_loss": -12.05024242401123, "global_step": 275350, "epoch": 1638} {"train_loss": -11.766696833428883, "global_step": 275351, "epoch": 1638, "val_loss": 272381.9375} {"train_loss": -11.972982406616211, "global_step": 275352, "epoch": 1639} {"train_loss": -12.133295059204102, "global_step": 275353, "epoch": 1639} {"train_loss": -12.150110244750977, "global_step": 275354, "epoch": 1639} {"train_loss": -12.100131034851074, "global_step": 275355, "epoch": 1639} {"train_loss": -12.102315902709961, "global_step": 275356, "epoch": 1639} {"train_loss": -12.047746658325195, "global_step": 275357, "epoch": 1639} {"train_loss": -11.756901741027832, "global_step": 275358, "epoch": 1639} {"train_loss": -12.08150577545166, "global_step": 275359, "epoch": 1639} {"train_loss": -11.960618019104004, "global_step": 275360, "epoch": 1639} {"train_loss": -12.099421501159668, "global_step": 275361, "epoch": 1639} {"train_loss": -11.960031509399414, "global_step": 275362, "epoch": 1639} {"train_loss": -12.139039993286133, "global_step": 275363, "epoch": 1639} {"train_loss": -11.714052200317383, "global_step": 275364, "epoch": 1639} {"train_loss": -12.238922119140625, "global_step": 275365, "epoch": 1639} {"train_loss": -12.106786727905273, "global_step": 275366, "epoch": 1639} {"train_loss": -11.99099349975586, "global_step": 275367, "epoch": 1639} {"train_loss": -12.419745445251465, "global_step": 275368, "epoch": 1639} {"train_loss": -12.253621101379395, "global_step": 275369, "epoch": 1639} {"train_loss": -12.270121574401855, "global_step": 275370, "epoch": 1639} {"train_loss": -12.214422225952148, "global_step": 275371, "epoch": 1639} {"train_loss": -12.063493728637695, "global_step": 275372, "epoch": 1639} {"train_loss": -12.23377799987793, "global_step": 275373, "epoch": 1639} {"train_loss": -12.010285377502441, "global_step": 275374, "epoch": 1639} {"train_loss": -12.301580429077148, "global_step": 275375, "epoch": 1639} {"train_loss": -12.102303504943848, "global_step": 275376, "epoch": 1639} {"train_loss": -11.867761611938477, "global_step": 275377, "epoch": 1639} {"train_loss": -12.31220531463623, "global_step": 275378, "epoch": 1639} {"train_loss": -12.219511032104492, "global_step": 275379, "epoch": 1639} {"train_loss": -12.08454704284668, "global_step": 275380, "epoch": 1639} {"train_loss": -12.059038162231445, "global_step": 275381, "epoch": 1639} {"train_loss": -12.049402236938477, "global_step": 275382, "epoch": 1639} {"train_loss": -12.572126388549805, "global_step": 275383, "epoch": 1639} {"train_loss": -12.16372299194336, "global_step": 275384, "epoch": 1639} {"train_loss": -12.039482116699219, "global_step": 275385, "epoch": 1639} {"train_loss": -12.34720230102539, "global_step": 275386, "epoch": 1639} {"train_loss": -12.395299911499023, "global_step": 275387, "epoch": 1639} {"train_loss": -12.013626098632812, "global_step": 275388, "epoch": 1639} {"train_loss": -12.036662101745605, "global_step": 275389, "epoch": 1639} {"train_loss": -12.262870788574219, "global_step": 275390, "epoch": 1639} {"train_loss": -12.08160400390625, "global_step": 275391, "epoch": 1639} {"train_loss": -11.607996940612793, "global_step": 275392, "epoch": 1639} {"train_loss": -12.136953353881836, "global_step": 275393, "epoch": 1639} {"train_loss": -12.214591979980469, "global_step": 275394, "epoch": 1639} {"train_loss": -11.462335586547852, "global_step": 275395, "epoch": 1639} {"train_loss": -11.495019912719727, "global_step": 275396, "epoch": 1639} {"train_loss": -12.24589729309082, "global_step": 275397, "epoch": 1639} {"train_loss": -11.028717041015625, "global_step": 275398, "epoch": 1639} {"train_loss": -11.467281341552734, "global_step": 275399, "epoch": 1639} {"train_loss": -12.444746017456055, "global_step": 275400, "epoch": 1639} {"train_loss": -12.151731491088867, "global_step": 275401, "epoch": 1639} {"train_loss": -11.933263778686523, "global_step": 275402, "epoch": 1639} {"train_loss": -11.356670379638672, "global_step": 275403, "epoch": 1639} {"train_loss": -11.198587417602539, "global_step": 275404, "epoch": 1639} {"train_loss": -12.003056526184082, "global_step": 275405, "epoch": 1639} {"train_loss": -11.620044708251953, "global_step": 275406, "epoch": 1639} {"train_loss": -10.220893859863281, "global_step": 275407, "epoch": 1639} {"train_loss": -11.727890014648438, "global_step": 275408, "epoch": 1639} {"train_loss": -11.880481719970703, "global_step": 275409, "epoch": 1639} {"train_loss": -11.08095932006836, "global_step": 275410, "epoch": 1639} {"train_loss": -11.05489444732666, "global_step": 275411, "epoch": 1639} {"train_loss": -12.236458778381348, "global_step": 275412, "epoch": 1639} {"train_loss": -11.3231201171875, "global_step": 275413, "epoch": 1639} {"train_loss": -11.483388900756836, "global_step": 275414, "epoch": 1639} {"train_loss": -11.719948768615723, "global_step": 275415, "epoch": 1639} {"train_loss": -11.67798900604248, "global_step": 275416, "epoch": 1639} {"train_loss": -11.516937255859375, "global_step": 275417, "epoch": 1639} {"train_loss": -12.012572288513184, "global_step": 275418, "epoch": 1639} {"train_loss": -11.744125366210938, "global_step": 275419, "epoch": 1639} {"train_loss": -11.364455223083496, "global_step": 275420, "epoch": 1639} {"train_loss": -11.947848320007324, "global_step": 275421, "epoch": 1639} {"train_loss": -11.789016723632812, "global_step": 275422, "epoch": 1639} {"train_loss": -12.016263961791992, "global_step": 275423, "epoch": 1639} {"train_loss": -11.910223960876465, "global_step": 275424, "epoch": 1639} {"train_loss": -12.052416801452637, "global_step": 275425, "epoch": 1639} {"train_loss": -11.771081924438477, "global_step": 275426, "epoch": 1639} {"train_loss": -11.561623573303223, "global_step": 275427, "epoch": 1639} {"train_loss": -11.798439979553223, "global_step": 275428, "epoch": 1639} {"train_loss": -11.718244552612305, "global_step": 275429, "epoch": 1639} {"train_loss": -11.368598937988281, "global_step": 275430, "epoch": 1639} {"train_loss": -11.852499008178711, "global_step": 275431, "epoch": 1639} {"train_loss": -10.979321479797363, "global_step": 275432, "epoch": 1639} {"train_loss": -11.768917083740234, "global_step": 275433, "epoch": 1639} {"train_loss": -12.19946002960205, "global_step": 275434, "epoch": 1639} {"train_loss": -10.93269157409668, "global_step": 275435, "epoch": 1639} {"train_loss": -11.531169891357422, "global_step": 275436, "epoch": 1639} {"train_loss": -11.930440902709961, "global_step": 275437, "epoch": 1639} {"train_loss": -11.629315376281738, "global_step": 275438, "epoch": 1639} {"train_loss": -11.66213321685791, "global_step": 275439, "epoch": 1639} {"train_loss": -11.46395492553711, "global_step": 275440, "epoch": 1639} {"train_loss": -11.755578994750977, "global_step": 275441, "epoch": 1639} {"train_loss": -11.853816032409668, "global_step": 275442, "epoch": 1639} {"train_loss": -11.810812950134277, "global_step": 275443, "epoch": 1639} {"train_loss": -11.570484161376953, "global_step": 275444, "epoch": 1639} {"train_loss": -11.77787971496582, "global_step": 275445, "epoch": 1639} {"train_loss": -11.718216896057129, "global_step": 275446, "epoch": 1639} {"train_loss": -11.73902702331543, "global_step": 275447, "epoch": 1639} {"train_loss": -11.96981143951416, "global_step": 275448, "epoch": 1639} {"train_loss": -11.83456802368164, "global_step": 275449, "epoch": 1639} {"train_loss": -11.944414138793945, "global_step": 275450, "epoch": 1639} {"train_loss": -12.051237106323242, "global_step": 275451, "epoch": 1639} {"train_loss": -11.886903762817383, "global_step": 275452, "epoch": 1639} {"train_loss": -11.934861183166504, "global_step": 275453, "epoch": 1639} {"train_loss": -11.843174934387207, "global_step": 275454, "epoch": 1639} {"train_loss": -12.123696327209473, "global_step": 275455, "epoch": 1639} {"train_loss": -12.20402717590332, "global_step": 275456, "epoch": 1639} {"train_loss": -11.934911727905273, "global_step": 275457, "epoch": 1639} {"train_loss": -11.939762115478516, "global_step": 275458, "epoch": 1639} {"train_loss": -12.06086254119873, "global_step": 275459, "epoch": 1639} {"train_loss": -12.159952163696289, "global_step": 275460, "epoch": 1639} {"train_loss": -12.313074111938477, "global_step": 275461, "epoch": 1639} {"train_loss": -12.188948631286621, "global_step": 275462, "epoch": 1639} {"train_loss": -12.265645980834961, "global_step": 275463, "epoch": 1639} {"train_loss": -12.073391914367676, "global_step": 275464, "epoch": 1639} {"train_loss": -12.077384948730469, "global_step": 275465, "epoch": 1639} {"train_loss": -11.602105140686035, "global_step": 275466, "epoch": 1639} {"train_loss": -12.334001541137695, "global_step": 275467, "epoch": 1639} {"train_loss": -12.052421569824219, "global_step": 275468, "epoch": 1639} {"train_loss": -11.953481674194336, "global_step": 275469, "epoch": 1639} {"train_loss": -12.12718391418457, "global_step": 275470, "epoch": 1639} {"train_loss": -12.145675659179688, "global_step": 275471, "epoch": 1639} {"train_loss": -12.111194610595703, "global_step": 275472, "epoch": 1639} {"train_loss": -11.960938453674316, "global_step": 275473, "epoch": 1639} {"train_loss": -11.906885147094727, "global_step": 275474, "epoch": 1639} {"train_loss": -12.258684158325195, "global_step": 275475, "epoch": 1639} {"train_loss": -12.034035682678223, "global_step": 275476, "epoch": 1639} {"train_loss": -12.04919719696045, "global_step": 275477, "epoch": 1639} {"train_loss": -11.796393394470215, "global_step": 275478, "epoch": 1639} {"train_loss": -11.883100509643555, "global_step": 275479, "epoch": 1639} {"train_loss": -11.971466064453125, "global_step": 275480, "epoch": 1639} {"train_loss": -12.074377059936523, "global_step": 275481, "epoch": 1639} {"train_loss": -11.44848346710205, "global_step": 275482, "epoch": 1639} {"train_loss": -12.005289077758789, "global_step": 275483, "epoch": 1639} {"train_loss": -11.802364349365234, "global_step": 275484, "epoch": 1639} {"train_loss": -10.877445220947266, "global_step": 275485, "epoch": 1639} {"train_loss": -11.959961891174316, "global_step": 275486, "epoch": 1639} {"train_loss": -11.426299095153809, "global_step": 275487, "epoch": 1639} {"train_loss": -11.122499465942383, "global_step": 275488, "epoch": 1639} {"train_loss": -11.637773513793945, "global_step": 275489, "epoch": 1639} {"train_loss": -11.647709846496582, "global_step": 275490, "epoch": 1639} {"train_loss": -10.859781265258789, "global_step": 275491, "epoch": 1639} {"train_loss": -11.869972229003906, "global_step": 275492, "epoch": 1639} {"train_loss": -11.269768714904785, "global_step": 275493, "epoch": 1639} {"train_loss": -10.598464012145996, "global_step": 275494, "epoch": 1639} {"train_loss": -11.68950080871582, "global_step": 275495, "epoch": 1639} {"train_loss": -11.62613582611084, "global_step": 275496, "epoch": 1639} {"train_loss": -10.524681091308594, "global_step": 275497, "epoch": 1639} {"train_loss": -10.684137344360352, "global_step": 275498, "epoch": 1639} {"train_loss": -9.779865264892578, "global_step": 275499, "epoch": 1639} {"train_loss": -11.531253814697266, "global_step": 275500, "epoch": 1639} {"train_loss": -11.078876495361328, "global_step": 275501, "epoch": 1639} {"train_loss": -10.929332733154297, "global_step": 275502, "epoch": 1639} {"train_loss": -11.591405868530273, "global_step": 275503, "epoch": 1639} {"train_loss": -10.697798728942871, "global_step": 275504, "epoch": 1639} {"train_loss": -11.633319854736328, "global_step": 275505, "epoch": 1639} {"train_loss": -11.335071563720703, "global_step": 275506, "epoch": 1639} {"train_loss": -11.814714431762695, "global_step": 275507, "epoch": 1639} {"train_loss": -11.343058586120605, "global_step": 275508, "epoch": 1639} {"train_loss": -11.937814712524414, "global_step": 275509, "epoch": 1639} {"train_loss": -11.750726699829102, "global_step": 275510, "epoch": 1639} {"train_loss": -11.824007987976074, "global_step": 275511, "epoch": 1639} {"train_loss": -11.83365249633789, "global_step": 275512, "epoch": 1639} {"train_loss": -11.86983585357666, "global_step": 275513, "epoch": 1639} {"train_loss": -11.844018936157227, "global_step": 275514, "epoch": 1639} {"train_loss": -11.76378345489502, "global_step": 275515, "epoch": 1639} {"train_loss": -12.139448165893555, "global_step": 275516, "epoch": 1639} {"train_loss": -11.852374076843262, "global_step": 275517, "epoch": 1639} {"train_loss": -11.864021301269531, "global_step": 275518, "epoch": 1639} {"train_loss": -11.80227468127296, "global_step": 275519, "epoch": 1639, "val_loss": 274732.25} {"train_loss": -12.016124725341797, "global_step": 275520, "epoch": 1640} {"train_loss": -12.132671356201172, "global_step": 275521, "epoch": 1640} {"train_loss": -11.834564208984375, "global_step": 275522, "epoch": 1640} {"train_loss": -11.912212371826172, "global_step": 275523, "epoch": 1640} {"train_loss": -12.084831237792969, "global_step": 275524, "epoch": 1640} {"train_loss": -11.897465705871582, "global_step": 275525, "epoch": 1640} {"train_loss": -12.354779243469238, "global_step": 275526, "epoch": 1640} {"train_loss": -11.9835205078125, "global_step": 275527, "epoch": 1640} {"train_loss": -12.107258796691895, "global_step": 275528, "epoch": 1640} {"train_loss": -12.048727035522461, "global_step": 275529, "epoch": 1640} {"train_loss": -12.001846313476562, "global_step": 275530, "epoch": 1640} {"train_loss": -11.875844955444336, "global_step": 275531, "epoch": 1640} {"train_loss": -12.104267120361328, "global_step": 275532, "epoch": 1640} {"train_loss": -11.692249298095703, "global_step": 275533, "epoch": 1640} {"train_loss": -12.009702682495117, "global_step": 275534, "epoch": 1640} {"train_loss": -11.968994140625, "global_step": 275535, "epoch": 1640} {"train_loss": -11.924530029296875, "global_step": 275536, "epoch": 1640} {"train_loss": -12.068853378295898, "global_step": 275537, "epoch": 1640} {"train_loss": -11.921493530273438, "global_step": 275538, "epoch": 1640} {"train_loss": -12.211514472961426, "global_step": 275539, "epoch": 1640} {"train_loss": -11.66891098022461, "global_step": 275540, "epoch": 1640} {"train_loss": -11.974098205566406, "global_step": 275541, "epoch": 1640} {"train_loss": -11.88798713684082, "global_step": 275542, "epoch": 1640} {"train_loss": -12.094611167907715, "global_step": 275543, "epoch": 1640} {"train_loss": -12.226102828979492, "global_step": 275544, "epoch": 1640} {"train_loss": -11.927864074707031, "global_step": 275545, "epoch": 1640} {"train_loss": -12.003344535827637, "global_step": 275546, "epoch": 1640} {"train_loss": -11.881693840026855, "global_step": 275547, "epoch": 1640} {"train_loss": -11.965980529785156, "global_step": 275548, "epoch": 1640} {"train_loss": -12.267285346984863, "global_step": 275549, "epoch": 1640} {"train_loss": -12.364816665649414, "global_step": 275550, "epoch": 1640} {"train_loss": -12.26715087890625, "global_step": 275551, "epoch": 1640} {"train_loss": -12.128411293029785, "global_step": 275552, "epoch": 1640} {"train_loss": -12.262120246887207, "global_step": 275553, "epoch": 1640} {"train_loss": -12.345044136047363, "global_step": 275554, "epoch": 1640} {"train_loss": -12.338601112365723, "global_step": 275555, "epoch": 1640} {"train_loss": -12.307159423828125, "global_step": 275556, "epoch": 1640} {"train_loss": -12.242696762084961, "global_step": 275557, "epoch": 1640} {"train_loss": -12.228950500488281, "global_step": 275558, "epoch": 1640} {"train_loss": -12.361103057861328, "global_step": 275559, "epoch": 1640} {"train_loss": -12.41024398803711, "global_step": 275560, "epoch": 1640} {"train_loss": -11.856637954711914, "global_step": 275561, "epoch": 1640} {"train_loss": -11.864385604858398, "global_step": 275562, "epoch": 1640} {"train_loss": -12.213493347167969, "global_step": 275563, "epoch": 1640} {"train_loss": -12.195743560791016, "global_step": 275564, "epoch": 1640} {"train_loss": -12.389381408691406, "global_step": 275565, "epoch": 1640} {"train_loss": -12.174407958984375, "global_step": 275566, "epoch": 1640} {"train_loss": -12.460126876831055, "global_step": 275567, "epoch": 1640} {"train_loss": -12.201764106750488, "global_step": 275568, "epoch": 1640} {"train_loss": -12.312625885009766, "global_step": 275569, "epoch": 1640} {"train_loss": -11.790698051452637, "global_step": 275570, "epoch": 1640} {"train_loss": -12.311897277832031, "global_step": 275571, "epoch": 1640} {"train_loss": -11.645639419555664, "global_step": 275572, "epoch": 1640} {"train_loss": -10.685785293579102, "global_step": 275573, "epoch": 1640} {"train_loss": -12.175063133239746, "global_step": 275574, "epoch": 1640} {"train_loss": -11.749025344848633, "global_step": 275575, "epoch": 1640} {"train_loss": -11.995665550231934, "global_step": 275576, "epoch": 1640} {"train_loss": -11.447052001953125, "global_step": 275577, "epoch": 1640} {"train_loss": -11.55015754699707, "global_step": 275578, "epoch": 1640} {"train_loss": -11.893024444580078, "global_step": 275579, "epoch": 1640} {"train_loss": -11.568609237670898, "global_step": 275580, "epoch": 1640} {"train_loss": -11.483733177185059, "global_step": 275581, "epoch": 1640} {"train_loss": -9.255006790161133, "global_step": 275582, "epoch": 1640} {"train_loss": -11.970417022705078, "global_step": 275583, "epoch": 1640} {"train_loss": -9.05828857421875, "global_step": 275584, "epoch": 1640} {"train_loss": -10.093881607055664, "global_step": 275585, "epoch": 1640} {"train_loss": -7.888369560241699, "global_step": 275586, "epoch": 1640} {"train_loss": -6.523740768432617, "global_step": 275587, "epoch": 1640} {"train_loss": -6.743927001953125, "global_step": 275588, "epoch": 1640} {"train_loss": -7.121110916137695, "global_step": 275589, "epoch": 1640} {"train_loss": -7.913427352905273, "global_step": 275590, "epoch": 1640} {"train_loss": -8.692344665527344, "global_step": 275591, "epoch": 1640} {"train_loss": -9.094971656799316, "global_step": 275592, "epoch": 1640} {"train_loss": -9.182889938354492, "global_step": 275593, "epoch": 1640} {"train_loss": -9.026057243347168, "global_step": 275594, "epoch": 1640} {"train_loss": -9.54429817199707, "global_step": 275595, "epoch": 1640} {"train_loss": -9.630144119262695, "global_step": 275596, "epoch": 1640} {"train_loss": -9.82314682006836, "global_step": 275597, "epoch": 1640} {"train_loss": -11.018840789794922, "global_step": 275598, "epoch": 1640} {"train_loss": -9.598175048828125, "global_step": 275599, "epoch": 1640} {"train_loss": -9.38626480102539, "global_step": 275600, "epoch": 1640} {"train_loss": -11.0533447265625, "global_step": 275601, "epoch": 1640} {"train_loss": -9.871838569641113, "global_step": 275602, "epoch": 1640} {"train_loss": -9.968045234680176, "global_step": 275603, "epoch": 1640} {"train_loss": -10.880411148071289, "global_step": 275604, "epoch": 1640} {"train_loss": -10.158971786499023, "global_step": 275605, "epoch": 1640} {"train_loss": -10.202933311462402, "global_step": 275606, "epoch": 1640} {"train_loss": -11.634381294250488, "global_step": 275607, "epoch": 1640} {"train_loss": -10.379581451416016, "global_step": 275608, "epoch": 1640} {"train_loss": -10.844256401062012, "global_step": 275609, "epoch": 1640} {"train_loss": -11.274425506591797, "global_step": 275610, "epoch": 1640} {"train_loss": -10.498905181884766, "global_step": 275611, "epoch": 1640} {"train_loss": -10.74023151397705, "global_step": 275612, "epoch": 1640} {"train_loss": -11.293193817138672, "global_step": 275613, "epoch": 1640} {"train_loss": -11.40349006652832, "global_step": 275614, "epoch": 1640} {"train_loss": -11.46537971496582, "global_step": 275615, "epoch": 1640} {"train_loss": -11.75724983215332, "global_step": 275616, "epoch": 1640} {"train_loss": -11.584735870361328, "global_step": 275617, "epoch": 1640} {"train_loss": -11.503419876098633, "global_step": 275618, "epoch": 1640} {"train_loss": -11.469468116760254, "global_step": 275619, "epoch": 1640} {"train_loss": -11.310162544250488, "global_step": 275620, "epoch": 1640} {"train_loss": -11.04167652130127, "global_step": 275621, "epoch": 1640} {"train_loss": -11.644261360168457, "global_step": 275622, "epoch": 1640} {"train_loss": -11.2898530960083, "global_step": 275623, "epoch": 1640} {"train_loss": -11.873525619506836, "global_step": 275624, "epoch": 1640} {"train_loss": -11.446452140808105, "global_step": 275625, "epoch": 1640} {"train_loss": -11.782905578613281, "global_step": 275626, "epoch": 1640} {"train_loss": -11.863348007202148, "global_step": 275627, "epoch": 1640} {"train_loss": -11.586355209350586, "global_step": 275628, "epoch": 1640} {"train_loss": -11.735750198364258, "global_step": 275629, "epoch": 1640} {"train_loss": -11.486564636230469, "global_step": 275630, "epoch": 1640} {"train_loss": -11.696847915649414, "global_step": 275631, "epoch": 1640} {"train_loss": -11.700695037841797, "global_step": 275632, "epoch": 1640} {"train_loss": -11.638145446777344, "global_step": 275633, "epoch": 1640} {"train_loss": -11.493946075439453, "global_step": 275634, "epoch": 1640} {"train_loss": -11.335039138793945, "global_step": 275635, "epoch": 1640} {"train_loss": -11.539819717407227, "global_step": 275636, "epoch": 1640} {"train_loss": -11.409279823303223, "global_step": 275637, "epoch": 1640} {"train_loss": -11.565678596496582, "global_step": 275638, "epoch": 1640} {"train_loss": -11.536516189575195, "global_step": 275639, "epoch": 1640} {"train_loss": -11.55550765991211, "global_step": 275640, "epoch": 1640} {"train_loss": -11.751426696777344, "global_step": 275641, "epoch": 1640} {"train_loss": -11.528358459472656, "global_step": 275642, "epoch": 1640} {"train_loss": -11.361639976501465, "global_step": 275643, "epoch": 1640} {"train_loss": -11.766613006591797, "global_step": 275644, "epoch": 1640} {"train_loss": -11.599296569824219, "global_step": 275645, "epoch": 1640} {"train_loss": -11.917685508728027, "global_step": 275646, "epoch": 1640} {"train_loss": -11.667049407958984, "global_step": 275647, "epoch": 1640} {"train_loss": -11.777303695678711, "global_step": 275648, "epoch": 1640} {"train_loss": -11.912885665893555, "global_step": 275649, "epoch": 1640} {"train_loss": -12.058500289916992, "global_step": 275650, "epoch": 1640} {"train_loss": -11.750466346740723, "global_step": 275651, "epoch": 1640} {"train_loss": -11.912211418151855, "global_step": 275652, "epoch": 1640} {"train_loss": -11.785588264465332, "global_step": 275653, "epoch": 1640} {"train_loss": -11.924511909484863, "global_step": 275654, "epoch": 1640} {"train_loss": -11.974184036254883, "global_step": 275655, "epoch": 1640} {"train_loss": -12.12086296081543, "global_step": 275656, "epoch": 1640} {"train_loss": -11.863576889038086, "global_step": 275657, "epoch": 1640} {"train_loss": -12.041141510009766, "global_step": 275658, "epoch": 1640} {"train_loss": -12.00107192993164, "global_step": 275659, "epoch": 1640} {"train_loss": -12.037018775939941, "global_step": 275660, "epoch": 1640} {"train_loss": -11.793968200683594, "global_step": 275661, "epoch": 1640} {"train_loss": -12.12617301940918, "global_step": 275662, "epoch": 1640} {"train_loss": -12.000651359558105, "global_step": 275663, "epoch": 1640} {"train_loss": -11.877265930175781, "global_step": 275664, "epoch": 1640} {"train_loss": -12.046612739562988, "global_step": 275665, "epoch": 1640} {"train_loss": -11.533011436462402, "global_step": 275666, "epoch": 1640} {"train_loss": -11.927396774291992, "global_step": 275667, "epoch": 1640} {"train_loss": -11.580503463745117, "global_step": 275668, "epoch": 1640} {"train_loss": -11.523964881896973, "global_step": 275669, "epoch": 1640} {"train_loss": -11.847233772277832, "global_step": 275670, "epoch": 1640} {"train_loss": -11.494096755981445, "global_step": 275671, "epoch": 1640} {"train_loss": -11.587745666503906, "global_step": 275672, "epoch": 1640} {"train_loss": -11.846345901489258, "global_step": 275673, "epoch": 1640} {"train_loss": -11.556716918945312, "global_step": 275674, "epoch": 1640} {"train_loss": -11.722326278686523, "global_step": 275675, "epoch": 1640} {"train_loss": -11.774272918701172, "global_step": 275676, "epoch": 1640} {"train_loss": -11.916665077209473, "global_step": 275677, "epoch": 1640} {"train_loss": -11.725189208984375, "global_step": 275678, "epoch": 1640} {"train_loss": -12.087574005126953, "global_step": 275679, "epoch": 1640} {"train_loss": -11.505943298339844, "global_step": 275680, "epoch": 1640} {"train_loss": -11.679752349853516, "global_step": 275681, "epoch": 1640} {"train_loss": -11.864954948425293, "global_step": 275682, "epoch": 1640} {"train_loss": -11.697296142578125, "global_step": 275683, "epoch": 1640} {"train_loss": -11.916483879089355, "global_step": 275684, "epoch": 1640} {"train_loss": -11.053939819335938, "global_step": 275685, "epoch": 1640} {"train_loss": -11.564918518066406, "global_step": 275686, "epoch": 1640} {"train_loss": -11.437561023802985, "global_step": 275687, "epoch": 1640, "val_loss": 270071.59375, "train_action_mse_error": 1.84043288230896} {"train_loss": -11.044384002685547, "global_step": 275688, "epoch": 1641} {"train_loss": -11.714115142822266, "global_step": 275689, "epoch": 1641} {"train_loss": -11.861185073852539, "global_step": 275690, "epoch": 1641} {"train_loss": -11.670082092285156, "global_step": 275691, "epoch": 1641} {"train_loss": -12.060041427612305, "global_step": 275692, "epoch": 1641} {"train_loss": -11.824606895446777, "global_step": 275693, "epoch": 1641} {"train_loss": -12.079344749450684, "global_step": 275694, "epoch": 1641} {"train_loss": -11.842849731445312, "global_step": 275695, "epoch": 1641} {"train_loss": -12.189693450927734, "global_step": 275696, "epoch": 1641} {"train_loss": -12.014131546020508, "global_step": 275697, "epoch": 1641} {"train_loss": -12.014984130859375, "global_step": 275698, "epoch": 1641} {"train_loss": -12.217439651489258, "global_step": 275699, "epoch": 1641} {"train_loss": -12.214035034179688, "global_step": 275700, "epoch": 1641} {"train_loss": -12.141706466674805, "global_step": 275701, "epoch": 1641} {"train_loss": -12.001019477844238, "global_step": 275702, "epoch": 1641} {"train_loss": -12.01318359375, "global_step": 275703, "epoch": 1641} {"train_loss": -12.128984451293945, "global_step": 275704, "epoch": 1641} {"train_loss": -12.309242248535156, "global_step": 275705, "epoch": 1641} {"train_loss": -11.962900161743164, "global_step": 275706, "epoch": 1641} {"train_loss": -12.065555572509766, "global_step": 275707, "epoch": 1641} {"train_loss": -12.175895690917969, "global_step": 275708, "epoch": 1641} {"train_loss": -12.137727737426758, "global_step": 275709, "epoch": 1641} {"train_loss": -12.039449691772461, "global_step": 275710, "epoch": 1641} {"train_loss": -12.186185836791992, "global_step": 275711, "epoch": 1641} {"train_loss": -12.238490104675293, "global_step": 275712, "epoch": 1641} {"train_loss": -12.254484176635742, "global_step": 275713, "epoch": 1641} {"train_loss": -12.366443634033203, "global_step": 275714, "epoch": 1641} {"train_loss": -12.114826202392578, "global_step": 275715, "epoch": 1641} {"train_loss": -12.200307846069336, "global_step": 275716, "epoch": 1641} {"train_loss": -12.005992889404297, "global_step": 275717, "epoch": 1641} {"train_loss": -12.29987907409668, "global_step": 275718, "epoch": 1641} {"train_loss": -12.134681701660156, "global_step": 275719, "epoch": 1641} {"train_loss": -12.144943237304688, "global_step": 275720, "epoch": 1641} {"train_loss": -12.16079044342041, "global_step": 275721, "epoch": 1641} {"train_loss": -12.296709060668945, "global_step": 275722, "epoch": 1641} {"train_loss": -12.013656616210938, "global_step": 275723, "epoch": 1641} {"train_loss": -12.40216064453125, "global_step": 275724, "epoch": 1641} {"train_loss": -12.218935012817383, "global_step": 275725, "epoch": 1641} {"train_loss": -12.272567749023438, "global_step": 275726, "epoch": 1641} {"train_loss": -12.120100975036621, "global_step": 275727, "epoch": 1641} {"train_loss": -12.176077842712402, "global_step": 275728, "epoch": 1641} {"train_loss": -12.235662460327148, "global_step": 275729, "epoch": 1641} {"train_loss": -12.223221778869629, "global_step": 275730, "epoch": 1641} {"train_loss": -11.824586868286133, "global_step": 275731, "epoch": 1641} {"train_loss": -10.997096061706543, "global_step": 275732, "epoch": 1641} {"train_loss": -11.590192794799805, "global_step": 275733, "epoch": 1641} {"train_loss": -11.66983413696289, "global_step": 275734, "epoch": 1641} {"train_loss": -9.82119369506836, "global_step": 275735, "epoch": 1641} {"train_loss": -11.355461120605469, "global_step": 275736, "epoch": 1641} {"train_loss": -10.985715866088867, "global_step": 275737, "epoch": 1641} {"train_loss": -11.440465927124023, "global_step": 275738, "epoch": 1641} {"train_loss": -11.357460975646973, "global_step": 275739, "epoch": 1641} {"train_loss": -11.215377807617188, "global_step": 275740, "epoch": 1641} {"train_loss": -11.838107109069824, "global_step": 275741, "epoch": 1641} {"train_loss": -11.5968017578125, "global_step": 275742, "epoch": 1641} {"train_loss": -11.94290542602539, "global_step": 275743, "epoch": 1641} {"train_loss": -11.50519847869873, "global_step": 275744, "epoch": 1641} {"train_loss": -11.846857070922852, "global_step": 275745, "epoch": 1641} {"train_loss": -11.683828353881836, "global_step": 275746, "epoch": 1641} {"train_loss": -12.02238655090332, "global_step": 275747, "epoch": 1641} {"train_loss": -11.804483413696289, "global_step": 275748, "epoch": 1641} {"train_loss": -11.433015823364258, "global_step": 275749, "epoch": 1641} {"train_loss": -11.508331298828125, "global_step": 275750, "epoch": 1641} {"train_loss": -11.290477752685547, "global_step": 275751, "epoch": 1641} {"train_loss": -9.914804458618164, "global_step": 275752, "epoch": 1641} {"train_loss": -9.909388542175293, "global_step": 275753, "epoch": 1641} {"train_loss": -10.841442108154297, "global_step": 275754, "epoch": 1641} {"train_loss": -9.627342224121094, "global_step": 275755, "epoch": 1641} {"train_loss": -9.878111839294434, "global_step": 275756, "epoch": 1641} {"train_loss": -11.672513961791992, "global_step": 275757, "epoch": 1641} {"train_loss": -10.90080738067627, "global_step": 275758, "epoch": 1641} {"train_loss": -11.61148452758789, "global_step": 275759, "epoch": 1641} {"train_loss": -10.679140090942383, "global_step": 275760, "epoch": 1641} {"train_loss": -9.674764633178711, "global_step": 275761, "epoch": 1641} {"train_loss": -10.512324333190918, "global_step": 275762, "epoch": 1641} {"train_loss": -10.691093444824219, "global_step": 275763, "epoch": 1641} {"train_loss": -10.110016822814941, "global_step": 275764, "epoch": 1641} {"train_loss": -9.961386680603027, "global_step": 275765, "epoch": 1641} {"train_loss": -10.391607284545898, "global_step": 275766, "epoch": 1641} {"train_loss": -11.293569564819336, "global_step": 275767, "epoch": 1641} {"train_loss": -11.80607795715332, "global_step": 275768, "epoch": 1641} {"train_loss": -11.541170120239258, "global_step": 275769, "epoch": 1641} {"train_loss": -11.59946060180664, "global_step": 275770, "epoch": 1641} {"train_loss": -11.368370056152344, "global_step": 275771, "epoch": 1641} {"train_loss": -11.658454895019531, "global_step": 275772, "epoch": 1641} {"train_loss": -11.871025085449219, "global_step": 275773, "epoch": 1641} {"train_loss": -11.500526428222656, "global_step": 275774, "epoch": 1641} {"train_loss": -11.812051773071289, "global_step": 275775, "epoch": 1641} {"train_loss": -11.523487091064453, "global_step": 275776, "epoch": 1641} {"train_loss": -11.453042984008789, "global_step": 275777, "epoch": 1641} {"train_loss": -11.555309295654297, "global_step": 275778, "epoch": 1641} {"train_loss": -11.727226257324219, "global_step": 275779, "epoch": 1641} {"train_loss": -11.440206527709961, "global_step": 275780, "epoch": 1641} {"train_loss": -11.632791519165039, "global_step": 275781, "epoch": 1641} {"train_loss": -11.445991516113281, "global_step": 275782, "epoch": 1641} {"train_loss": -11.541279792785645, "global_step": 275783, "epoch": 1641} {"train_loss": -11.80438232421875, "global_step": 275784, "epoch": 1641} {"train_loss": -11.780879974365234, "global_step": 275785, "epoch": 1641} {"train_loss": -12.189582824707031, "global_step": 275786, "epoch": 1641} {"train_loss": -12.005542755126953, "global_step": 275787, "epoch": 1641} {"train_loss": -11.787882804870605, "global_step": 275788, "epoch": 1641} {"train_loss": -12.009414672851562, "global_step": 275789, "epoch": 1641} {"train_loss": -11.96467113494873, "global_step": 275790, "epoch": 1641} {"train_loss": -11.933387756347656, "global_step": 275791, "epoch": 1641} {"train_loss": -11.98227596282959, "global_step": 275792, "epoch": 1641} {"train_loss": -11.938846588134766, "global_step": 275793, "epoch": 1641} {"train_loss": -12.057909965515137, "global_step": 275794, "epoch": 1641} {"train_loss": -12.142148971557617, "global_step": 275795, "epoch": 1641} {"train_loss": -12.270959854125977, "global_step": 275796, "epoch": 1641} {"train_loss": -12.158012390136719, "global_step": 275797, "epoch": 1641} {"train_loss": -12.036746978759766, "global_step": 275798, "epoch": 1641} {"train_loss": -12.256845474243164, "global_step": 275799, "epoch": 1641} {"train_loss": -12.050359725952148, "global_step": 275800, "epoch": 1641} {"train_loss": -12.127384185791016, "global_step": 275801, "epoch": 1641} {"train_loss": -12.098906517028809, "global_step": 275802, "epoch": 1641} {"train_loss": -12.154756546020508, "global_step": 275803, "epoch": 1641} {"train_loss": -12.132253646850586, "global_step": 275804, "epoch": 1641} {"train_loss": -12.0359468460083, "global_step": 275805, "epoch": 1641} {"train_loss": -12.234014511108398, "global_step": 275806, "epoch": 1641} {"train_loss": -11.896138191223145, "global_step": 275807, "epoch": 1641} {"train_loss": -12.167366027832031, "global_step": 275808, "epoch": 1641} {"train_loss": -11.906192779541016, "global_step": 275809, "epoch": 1641} {"train_loss": -12.055892944335938, "global_step": 275810, "epoch": 1641} {"train_loss": -11.921260833740234, "global_step": 275811, "epoch": 1641} {"train_loss": -11.416542053222656, "global_step": 275812, "epoch": 1641} {"train_loss": -12.219059944152832, "global_step": 275813, "epoch": 1641} {"train_loss": -11.547805786132812, "global_step": 275814, "epoch": 1641} {"train_loss": -11.663612365722656, "global_step": 275815, "epoch": 1641} {"train_loss": -12.096047401428223, "global_step": 275816, "epoch": 1641} {"train_loss": -11.496065139770508, "global_step": 275817, "epoch": 1641} {"train_loss": -11.980390548706055, "global_step": 275818, "epoch": 1641} {"train_loss": -11.993605613708496, "global_step": 275819, "epoch": 1641} {"train_loss": -12.168527603149414, "global_step": 275820, "epoch": 1641} {"train_loss": -11.948437690734863, "global_step": 275821, "epoch": 1641} {"train_loss": -12.044748306274414, "global_step": 275822, "epoch": 1641} {"train_loss": -12.064374923706055, "global_step": 275823, "epoch": 1641} {"train_loss": -12.244623184204102, "global_step": 275824, "epoch": 1641} {"train_loss": -12.127363204956055, "global_step": 275825, "epoch": 1641} {"train_loss": -12.217462539672852, "global_step": 275826, "epoch": 1641} {"train_loss": -11.944669723510742, "global_step": 275827, "epoch": 1641} {"train_loss": -12.487184524536133, "global_step": 275828, "epoch": 1641} {"train_loss": -12.05036735534668, "global_step": 275829, "epoch": 1641} {"train_loss": -12.171690940856934, "global_step": 275830, "epoch": 1641} {"train_loss": -12.139626502990723, "global_step": 275831, "epoch": 1641} {"train_loss": -12.065511703491211, "global_step": 275832, "epoch": 1641} {"train_loss": -12.245004653930664, "global_step": 275833, "epoch": 1641} {"train_loss": -12.323244094848633, "global_step": 275834, "epoch": 1641} {"train_loss": -11.820476531982422, "global_step": 275835, "epoch": 1641} {"train_loss": -11.771141052246094, "global_step": 275836, "epoch": 1641} {"train_loss": -12.22433090209961, "global_step": 275837, "epoch": 1641} {"train_loss": -11.928949356079102, "global_step": 275838, "epoch": 1641} {"train_loss": -11.224740982055664, "global_step": 275839, "epoch": 1641} {"train_loss": -11.96750545501709, "global_step": 275840, "epoch": 1641} {"train_loss": -12.035982131958008, "global_step": 275841, "epoch": 1641} {"train_loss": -11.375871658325195, "global_step": 275842, "epoch": 1641} {"train_loss": -11.602193832397461, "global_step": 275843, "epoch": 1641} {"train_loss": -11.998276710510254, "global_step": 275844, "epoch": 1641} {"train_loss": -11.628114700317383, "global_step": 275845, "epoch": 1641} {"train_loss": -12.020343780517578, "global_step": 275846, "epoch": 1641} {"train_loss": -11.95008659362793, "global_step": 275847, "epoch": 1641} {"train_loss": -11.864852905273438, "global_step": 275848, "epoch": 1641} {"train_loss": -11.953203201293945, "global_step": 275849, "epoch": 1641} {"train_loss": -11.447113037109375, "global_step": 275850, "epoch": 1641} {"train_loss": -12.02655029296875, "global_step": 275851, "epoch": 1641} {"train_loss": -11.528047561645508, "global_step": 275852, "epoch": 1641} {"train_loss": -11.892553329467773, "global_step": 275853, "epoch": 1641} {"train_loss": -11.538827896118164, "global_step": 275854, "epoch": 1641} {"train_loss": -11.757120700109573, "global_step": 275855, "epoch": 1641, "val_loss": 274969.46875} {"train_loss": -11.635159492492676, "global_step": 275856, "epoch": 1642} {"train_loss": -11.89450740814209, "global_step": 275857, "epoch": 1642} {"train_loss": -11.76356029510498, "global_step": 275858, "epoch": 1642} {"train_loss": -11.641992568969727, "global_step": 275859, "epoch": 1642} {"train_loss": -12.243775367736816, "global_step": 275860, "epoch": 1642} {"train_loss": -11.567201614379883, "global_step": 275861, "epoch": 1642} {"train_loss": -12.006479263305664, "global_step": 275862, "epoch": 1642} {"train_loss": -11.729937553405762, "global_step": 275863, "epoch": 1642} {"train_loss": -11.859654426574707, "global_step": 275864, "epoch": 1642} {"train_loss": -11.970531463623047, "global_step": 275865, "epoch": 1642} {"train_loss": -10.989974021911621, "global_step": 275866, "epoch": 1642} {"train_loss": -12.185084342956543, "global_step": 275867, "epoch": 1642} {"train_loss": -10.390646934509277, "global_step": 275868, "epoch": 1642} {"train_loss": -11.954736709594727, "global_step": 275869, "epoch": 1642} {"train_loss": -11.482425689697266, "global_step": 275870, "epoch": 1642} {"train_loss": -10.609102249145508, "global_step": 275871, "epoch": 1642} {"train_loss": -11.032093048095703, "global_step": 275872, "epoch": 1642} {"train_loss": -11.938777923583984, "global_step": 275873, "epoch": 1642} {"train_loss": -10.84315013885498, "global_step": 275874, "epoch": 1642} {"train_loss": -11.958745956420898, "global_step": 275875, "epoch": 1642} {"train_loss": -11.302068710327148, "global_step": 275876, "epoch": 1642} {"train_loss": -10.666448593139648, "global_step": 275877, "epoch": 1642} {"train_loss": -10.817695617675781, "global_step": 275878, "epoch": 1642} {"train_loss": -11.295431137084961, "global_step": 275879, "epoch": 1642} {"train_loss": -10.238162994384766, "global_step": 275880, "epoch": 1642} {"train_loss": -11.815544128417969, "global_step": 275881, "epoch": 1642} {"train_loss": -9.66485595703125, "global_step": 275882, "epoch": 1642} {"train_loss": -10.592843055725098, "global_step": 275883, "epoch": 1642} {"train_loss": -10.925701141357422, "global_step": 275884, "epoch": 1642} {"train_loss": -9.89682388305664, "global_step": 275885, "epoch": 1642} {"train_loss": -10.937064170837402, "global_step": 275886, "epoch": 1642} {"train_loss": -9.810657501220703, "global_step": 275887, "epoch": 1642} {"train_loss": -11.054201126098633, "global_step": 275888, "epoch": 1642} {"train_loss": -9.918188095092773, "global_step": 275889, "epoch": 1642} {"train_loss": -10.33090591430664, "global_step": 275890, "epoch": 1642} {"train_loss": -11.06640911102295, "global_step": 275891, "epoch": 1642} {"train_loss": -10.379518508911133, "global_step": 275892, "epoch": 1642} {"train_loss": -10.591753005981445, "global_step": 275893, "epoch": 1642} {"train_loss": -10.6064453125, "global_step": 275894, "epoch": 1642} {"train_loss": -10.328164100646973, "global_step": 275895, "epoch": 1642} {"train_loss": -9.940980911254883, "global_step": 275896, "epoch": 1642} {"train_loss": -10.457036972045898, "global_step": 275897, "epoch": 1642} {"train_loss": -9.961420059204102, "global_step": 275898, "epoch": 1642} {"train_loss": -10.701085090637207, "global_step": 275899, "epoch": 1642} {"train_loss": -10.255464553833008, "global_step": 275900, "epoch": 1642} {"train_loss": -11.05506706237793, "global_step": 275901, "epoch": 1642} {"train_loss": -10.956296920776367, "global_step": 275902, "epoch": 1642} {"train_loss": -10.55923843383789, "global_step": 275903, "epoch": 1642} {"train_loss": -11.156636238098145, "global_step": 275904, "epoch": 1642} {"train_loss": -10.361863136291504, "global_step": 275905, "epoch": 1642} {"train_loss": -11.424052238464355, "global_step": 275906, "epoch": 1642} {"train_loss": -10.677011489868164, "global_step": 275907, "epoch": 1642} {"train_loss": -11.718578338623047, "global_step": 275908, "epoch": 1642} {"train_loss": -11.311546325683594, "global_step": 275909, "epoch": 1642} {"train_loss": -11.560530662536621, "global_step": 275910, "epoch": 1642} {"train_loss": -11.546329498291016, "global_step": 275911, "epoch": 1642} {"train_loss": -11.736669540405273, "global_step": 275912, "epoch": 1642} {"train_loss": -11.618705749511719, "global_step": 275913, "epoch": 1642} {"train_loss": -11.43979263305664, "global_step": 275914, "epoch": 1642} {"train_loss": -11.56633186340332, "global_step": 275915, "epoch": 1642} {"train_loss": -11.755558967590332, "global_step": 275916, "epoch": 1642} {"train_loss": -11.766397476196289, "global_step": 275917, "epoch": 1642} {"train_loss": -11.682095527648926, "global_step": 275918, "epoch": 1642} {"train_loss": -11.571743965148926, "global_step": 275919, "epoch": 1642} {"train_loss": -11.673789978027344, "global_step": 275920, "epoch": 1642} {"train_loss": -11.404767036437988, "global_step": 275921, "epoch": 1642} {"train_loss": -11.835223197937012, "global_step": 275922, "epoch": 1642} {"train_loss": -11.518904685974121, "global_step": 275923, "epoch": 1642} {"train_loss": -12.064109802246094, "global_step": 275924, "epoch": 1642} {"train_loss": -11.376452445983887, "global_step": 275925, "epoch": 1642} {"train_loss": -12.013660430908203, "global_step": 275926, "epoch": 1642} {"train_loss": -11.649007797241211, "global_step": 275927, "epoch": 1642} {"train_loss": -11.56396484375, "global_step": 275928, "epoch": 1642} {"train_loss": -11.924330711364746, "global_step": 275929, "epoch": 1642} {"train_loss": -11.745627403259277, "global_step": 275930, "epoch": 1642} {"train_loss": -11.91728401184082, "global_step": 275931, "epoch": 1642} {"train_loss": -11.84269905090332, "global_step": 275932, "epoch": 1642} {"train_loss": -11.996147155761719, "global_step": 275933, "epoch": 1642} {"train_loss": -11.810689926147461, "global_step": 275934, "epoch": 1642} {"train_loss": -11.803430557250977, "global_step": 275935, "epoch": 1642} {"train_loss": -12.014205932617188, "global_step": 275936, "epoch": 1642} {"train_loss": -11.62515640258789, "global_step": 275937, "epoch": 1642} {"train_loss": -12.01805305480957, "global_step": 275938, "epoch": 1642} {"train_loss": -11.854253768920898, "global_step": 275939, "epoch": 1642} {"train_loss": -12.22563362121582, "global_step": 275940, "epoch": 1642} {"train_loss": -11.902413368225098, "global_step": 275941, "epoch": 1642} {"train_loss": -12.04100227355957, "global_step": 275942, "epoch": 1642} {"train_loss": -11.887386322021484, "global_step": 275943, "epoch": 1642} {"train_loss": -11.857349395751953, "global_step": 275944, "epoch": 1642} {"train_loss": -11.920086860656738, "global_step": 275945, "epoch": 1642} {"train_loss": -11.985103607177734, "global_step": 275946, "epoch": 1642} {"train_loss": -12.078524589538574, "global_step": 275947, "epoch": 1642} {"train_loss": -11.777698516845703, "global_step": 275948, "epoch": 1642} {"train_loss": -12.004523277282715, "global_step": 275949, "epoch": 1642} {"train_loss": -11.980563163757324, "global_step": 275950, "epoch": 1642} {"train_loss": -12.155545234680176, "global_step": 275951, "epoch": 1642} {"train_loss": -12.05776309967041, "global_step": 275952, "epoch": 1642} {"train_loss": -12.077539443969727, "global_step": 275953, "epoch": 1642} {"train_loss": -12.033241271972656, "global_step": 275954, "epoch": 1642} {"train_loss": -12.001351356506348, "global_step": 275955, "epoch": 1642} {"train_loss": -11.931168556213379, "global_step": 275956, "epoch": 1642} {"train_loss": -12.027917861938477, "global_step": 275957, "epoch": 1642} {"train_loss": -11.85186767578125, "global_step": 275958, "epoch": 1642} {"train_loss": -12.068363189697266, "global_step": 275959, "epoch": 1642} {"train_loss": -11.908368110656738, "global_step": 275960, "epoch": 1642} {"train_loss": -11.838247299194336, "global_step": 275961, "epoch": 1642} {"train_loss": -12.174461364746094, "global_step": 275962, "epoch": 1642} {"train_loss": -11.954763412475586, "global_step": 275963, "epoch": 1642} {"train_loss": -12.170402526855469, "global_step": 275964, "epoch": 1642} {"train_loss": -12.02490234375, "global_step": 275965, "epoch": 1642} {"train_loss": -12.194024085998535, "global_step": 275966, "epoch": 1642} {"train_loss": -12.246252059936523, "global_step": 275967, "epoch": 1642} {"train_loss": -12.374042510986328, "global_step": 275968, "epoch": 1642} {"train_loss": -12.289913177490234, "global_step": 275969, "epoch": 1642} {"train_loss": -12.149892807006836, "global_step": 275970, "epoch": 1642} {"train_loss": -12.291061401367188, "global_step": 275971, "epoch": 1642} {"train_loss": -12.253195762634277, "global_step": 275972, "epoch": 1642} {"train_loss": -12.32064437866211, "global_step": 275973, "epoch": 1642} {"train_loss": -12.180411338806152, "global_step": 275974, "epoch": 1642} {"train_loss": -12.153202056884766, "global_step": 275975, "epoch": 1642} {"train_loss": -12.330326080322266, "global_step": 275976, "epoch": 1642} {"train_loss": -12.134242057800293, "global_step": 275977, "epoch": 1642} {"train_loss": -12.246828079223633, "global_step": 275978, "epoch": 1642} {"train_loss": -12.375448226928711, "global_step": 275979, "epoch": 1642} {"train_loss": -12.331503868103027, "global_step": 275980, "epoch": 1642} {"train_loss": -12.278594970703125, "global_step": 275981, "epoch": 1642} {"train_loss": -12.377310752868652, "global_step": 275982, "epoch": 1642} {"train_loss": -12.331953048706055, "global_step": 275983, "epoch": 1642} {"train_loss": -12.335329055786133, "global_step": 275984, "epoch": 1642} {"train_loss": -12.080571174621582, "global_step": 275985, "epoch": 1642} {"train_loss": -12.250157356262207, "global_step": 275986, "epoch": 1642} {"train_loss": -11.864082336425781, "global_step": 275987, "epoch": 1642} {"train_loss": -12.359169006347656, "global_step": 275988, "epoch": 1642} {"train_loss": -12.031917572021484, "global_step": 275989, "epoch": 1642} {"train_loss": -11.78885269165039, "global_step": 275990, "epoch": 1642} {"train_loss": -12.047657012939453, "global_step": 275991, "epoch": 1642} {"train_loss": -12.466246604919434, "global_step": 275992, "epoch": 1642} {"train_loss": -11.921506881713867, "global_step": 275993, "epoch": 1642} {"train_loss": -12.325599670410156, "global_step": 275994, "epoch": 1642} {"train_loss": -11.709572792053223, "global_step": 275995, "epoch": 1642} {"train_loss": -12.124515533447266, "global_step": 275996, "epoch": 1642} {"train_loss": -12.018428802490234, "global_step": 275997, "epoch": 1642} {"train_loss": -11.938592910766602, "global_step": 275998, "epoch": 1642} {"train_loss": -12.267576217651367, "global_step": 275999, "epoch": 1642} {"train_loss": -12.1508207321167, "global_step": 276000, "epoch": 1642} {"train_loss": -12.401476860046387, "global_step": 276001, "epoch": 1642} {"train_loss": -12.375414848327637, "global_step": 276002, "epoch": 1642} {"train_loss": -12.2728271484375, "global_step": 276003, "epoch": 1642} {"train_loss": -12.355854034423828, "global_step": 276004, "epoch": 1642} {"train_loss": -12.290096282958984, "global_step": 276005, "epoch": 1642} {"train_loss": -12.250934600830078, "global_step": 276006, "epoch": 1642} {"train_loss": -11.977458000183105, "global_step": 276007, "epoch": 1642} {"train_loss": -12.180914878845215, "global_step": 276008, "epoch": 1642} {"train_loss": -12.376754760742188, "global_step": 276009, "epoch": 1642} {"train_loss": -12.062052726745605, "global_step": 276010, "epoch": 1642} {"train_loss": -11.85473918914795, "global_step": 276011, "epoch": 1642} {"train_loss": -12.292010307312012, "global_step": 276012, "epoch": 1642} {"train_loss": -11.754637718200684, "global_step": 276013, "epoch": 1642} {"train_loss": -11.948738098144531, "global_step": 276014, "epoch": 1642} {"train_loss": -11.492156982421875, "global_step": 276015, "epoch": 1642} {"train_loss": -11.409134864807129, "global_step": 276016, "epoch": 1642} {"train_loss": -12.240968704223633, "global_step": 276017, "epoch": 1642} {"train_loss": -11.968291282653809, "global_step": 276018, "epoch": 1642} {"train_loss": -12.182137489318848, "global_step": 276019, "epoch": 1642} {"train_loss": -11.632362365722656, "global_step": 276020, "epoch": 1642} {"train_loss": -11.779243469238281, "global_step": 276021, "epoch": 1642} {"train_loss": -11.88497257232666, "global_step": 276022, "epoch": 1642} {"train_loss": -11.677576587313698, "global_step": 276023, "epoch": 1642, "val_loss": 274623.625} {"train_loss": -12.05557632446289, "global_step": 276024, "epoch": 1643} {"train_loss": -11.745281219482422, "global_step": 276025, "epoch": 1643} {"train_loss": -11.944656372070312, "global_step": 276026, "epoch": 1643} {"train_loss": -11.806915283203125, "global_step": 276027, "epoch": 1643} {"train_loss": -12.201823234558105, "global_step": 276028, "epoch": 1643} {"train_loss": -11.924379348754883, "global_step": 276029, "epoch": 1643} {"train_loss": -12.302535057067871, "global_step": 276030, "epoch": 1643} {"train_loss": -12.345110893249512, "global_step": 276031, "epoch": 1643} {"train_loss": -11.956319808959961, "global_step": 276032, "epoch": 1643} {"train_loss": -12.02212905883789, "global_step": 276033, "epoch": 1643} {"train_loss": -11.934341430664062, "global_step": 276034, "epoch": 1643} {"train_loss": -12.256824493408203, "global_step": 276035, "epoch": 1643} {"train_loss": -11.566722869873047, "global_step": 276036, "epoch": 1643} {"train_loss": -10.24313735961914, "global_step": 276037, "epoch": 1643} {"train_loss": -11.022867202758789, "global_step": 276038, "epoch": 1643} {"train_loss": -10.426121711730957, "global_step": 276039, "epoch": 1643} {"train_loss": -11.272927284240723, "global_step": 276040, "epoch": 1643} {"train_loss": -11.006406784057617, "global_step": 276041, "epoch": 1643} {"train_loss": -8.643274307250977, "global_step": 276042, "epoch": 1643} {"train_loss": -10.437196731567383, "global_step": 276043, "epoch": 1643} {"train_loss": -10.130128860473633, "global_step": 276044, "epoch": 1643} {"train_loss": -10.760114669799805, "global_step": 276045, "epoch": 1643} {"train_loss": -11.290709495544434, "global_step": 276046, "epoch": 1643} {"train_loss": -11.220622062683105, "global_step": 276047, "epoch": 1643} {"train_loss": -11.06601333618164, "global_step": 276048, "epoch": 1643} {"train_loss": -11.032686233520508, "global_step": 276049, "epoch": 1643} {"train_loss": -10.08115005493164, "global_step": 276050, "epoch": 1643} {"train_loss": -10.475184440612793, "global_step": 276051, "epoch": 1643} {"train_loss": -10.54345703125, "global_step": 276052, "epoch": 1643} {"train_loss": -8.11788558959961, "global_step": 276053, "epoch": 1643} {"train_loss": -9.67765998840332, "global_step": 276054, "epoch": 1643} {"train_loss": -11.125076293945312, "global_step": 276055, "epoch": 1643} {"train_loss": -9.840213775634766, "global_step": 276056, "epoch": 1643} {"train_loss": -9.764392852783203, "global_step": 276057, "epoch": 1643} {"train_loss": -11.403585433959961, "global_step": 276058, "epoch": 1643} {"train_loss": -10.010252952575684, "global_step": 276059, "epoch": 1643} {"train_loss": -10.384138107299805, "global_step": 276060, "epoch": 1643} {"train_loss": -10.521072387695312, "global_step": 276061, "epoch": 1643} {"train_loss": -11.197845458984375, "global_step": 276062, "epoch": 1643} {"train_loss": -10.526798248291016, "global_step": 276063, "epoch": 1643} {"train_loss": -11.299915313720703, "global_step": 276064, "epoch": 1643} {"train_loss": -11.242786407470703, "global_step": 276065, "epoch": 1643} {"train_loss": -10.53113079071045, "global_step": 276066, "epoch": 1643} {"train_loss": -11.534390449523926, "global_step": 276067, "epoch": 1643} {"train_loss": -11.113000869750977, "global_step": 276068, "epoch": 1643} {"train_loss": -11.156797409057617, "global_step": 276069, "epoch": 1643} {"train_loss": -11.715303421020508, "global_step": 276070, "epoch": 1643} {"train_loss": -11.09680461883545, "global_step": 276071, "epoch": 1643} {"train_loss": -11.494312286376953, "global_step": 276072, "epoch": 1643} {"train_loss": -11.61416244506836, "global_step": 276073, "epoch": 1643} {"train_loss": -11.206085205078125, "global_step": 276074, "epoch": 1643} {"train_loss": -11.71134090423584, "global_step": 276075, "epoch": 1643} {"train_loss": -11.38547134399414, "global_step": 276076, "epoch": 1643} {"train_loss": -11.440400123596191, "global_step": 276077, "epoch": 1643} {"train_loss": -11.71969223022461, "global_step": 276078, "epoch": 1643} {"train_loss": -11.574695587158203, "global_step": 276079, "epoch": 1643} {"train_loss": -11.77462100982666, "global_step": 276080, "epoch": 1643} {"train_loss": -11.817207336425781, "global_step": 276081, "epoch": 1643} {"train_loss": -11.94781494140625, "global_step": 276082, "epoch": 1643} {"train_loss": -11.688762664794922, "global_step": 276083, "epoch": 1643} {"train_loss": -11.777695655822754, "global_step": 276084, "epoch": 1643} {"train_loss": -11.653059005737305, "global_step": 276085, "epoch": 1643} {"train_loss": -11.845321655273438, "global_step": 276086, "epoch": 1643} {"train_loss": -11.75704574584961, "global_step": 276087, "epoch": 1643} {"train_loss": -11.336807250976562, "global_step": 276088, "epoch": 1643} {"train_loss": -11.708667755126953, "global_step": 276089, "epoch": 1643} {"train_loss": -11.67430305480957, "global_step": 276090, "epoch": 1643} {"train_loss": -11.73845100402832, "global_step": 276091, "epoch": 1643} {"train_loss": -12.00467300415039, "global_step": 276092, "epoch": 1643} {"train_loss": -11.41651725769043, "global_step": 276093, "epoch": 1643} {"train_loss": -12.042614936828613, "global_step": 276094, "epoch": 1643} {"train_loss": -11.932804107666016, "global_step": 276095, "epoch": 1643} {"train_loss": -11.851491928100586, "global_step": 276096, "epoch": 1643} {"train_loss": -11.810157775878906, "global_step": 276097, "epoch": 1643} {"train_loss": -12.029918670654297, "global_step": 276098, "epoch": 1643} {"train_loss": -11.842041015625, "global_step": 276099, "epoch": 1643} {"train_loss": -12.095199584960938, "global_step": 276100, "epoch": 1643} {"train_loss": -11.879024505615234, "global_step": 276101, "epoch": 1643} {"train_loss": -12.064010620117188, "global_step": 276102, "epoch": 1643} {"train_loss": -12.183182716369629, "global_step": 276103, "epoch": 1643} {"train_loss": -11.983144760131836, "global_step": 276104, "epoch": 1643} {"train_loss": -12.05820083618164, "global_step": 276105, "epoch": 1643} {"train_loss": -11.846686363220215, "global_step": 276106, "epoch": 1643} {"train_loss": -11.986763000488281, "global_step": 276107, "epoch": 1643} {"train_loss": -12.363306045532227, "global_step": 276108, "epoch": 1643} {"train_loss": -12.051666259765625, "global_step": 276109, "epoch": 1643} {"train_loss": -12.148092269897461, "global_step": 276110, "epoch": 1643} {"train_loss": -12.287484169006348, "global_step": 276111, "epoch": 1643} {"train_loss": -12.120903015136719, "global_step": 276112, "epoch": 1643} {"train_loss": -12.181585311889648, "global_step": 276113, "epoch": 1643} {"train_loss": -12.065727233886719, "global_step": 276114, "epoch": 1643} {"train_loss": -12.15170669555664, "global_step": 276115, "epoch": 1643} {"train_loss": -12.286548614501953, "global_step": 276116, "epoch": 1643} {"train_loss": -12.32262897491455, "global_step": 276117, "epoch": 1643} {"train_loss": -12.010801315307617, "global_step": 276118, "epoch": 1643} {"train_loss": -12.036626815795898, "global_step": 276119, "epoch": 1643} {"train_loss": -11.878396987915039, "global_step": 276120, "epoch": 1643} {"train_loss": -12.004922866821289, "global_step": 276121, "epoch": 1643} {"train_loss": -12.107857704162598, "global_step": 276122, "epoch": 1643} {"train_loss": -12.285669326782227, "global_step": 276123, "epoch": 1643} {"train_loss": -12.041020393371582, "global_step": 276124, "epoch": 1643} {"train_loss": -11.598918914794922, "global_step": 276125, "epoch": 1643} {"train_loss": -11.944747924804688, "global_step": 276126, "epoch": 1643} {"train_loss": -12.219501495361328, "global_step": 276127, "epoch": 1643} {"train_loss": -11.502816200256348, "global_step": 276128, "epoch": 1643} {"train_loss": -11.2283353805542, "global_step": 276129, "epoch": 1643} {"train_loss": -11.307121276855469, "global_step": 276130, "epoch": 1643} {"train_loss": -10.332332611083984, "global_step": 276131, "epoch": 1643} {"train_loss": -11.881589889526367, "global_step": 276132, "epoch": 1643} {"train_loss": -10.710002899169922, "global_step": 276133, "epoch": 1643} {"train_loss": -9.54824447631836, "global_step": 276134, "epoch": 1643} {"train_loss": -12.153559684753418, "global_step": 276135, "epoch": 1643} {"train_loss": -10.32833480834961, "global_step": 276136, "epoch": 1643} {"train_loss": -10.44357681274414, "global_step": 276137, "epoch": 1643} {"train_loss": -11.31533145904541, "global_step": 276138, "epoch": 1643} {"train_loss": -10.230234146118164, "global_step": 276139, "epoch": 1643} {"train_loss": -10.097268104553223, "global_step": 276140, "epoch": 1643} {"train_loss": -9.739593505859375, "global_step": 276141, "epoch": 1643} {"train_loss": -8.48984432220459, "global_step": 276142, "epoch": 1643} {"train_loss": -9.228897094726562, "global_step": 276143, "epoch": 1643} {"train_loss": -10.952374458312988, "global_step": 276144, "epoch": 1643} {"train_loss": -9.451074600219727, "global_step": 276145, "epoch": 1643} {"train_loss": -9.813957214355469, "global_step": 276146, "epoch": 1643} {"train_loss": -10.169763565063477, "global_step": 276147, "epoch": 1643} {"train_loss": -10.066162109375, "global_step": 276148, "epoch": 1643} {"train_loss": -10.25532054901123, "global_step": 276149, "epoch": 1643} {"train_loss": -9.982048988342285, "global_step": 276150, "epoch": 1643} {"train_loss": -10.009028434753418, "global_step": 276151, "epoch": 1643} {"train_loss": -9.42408561706543, "global_step": 276152, "epoch": 1643} {"train_loss": -9.28607177734375, "global_step": 276153, "epoch": 1643} {"train_loss": -10.514105796813965, "global_step": 276154, "epoch": 1643} {"train_loss": -10.585943222045898, "global_step": 276155, "epoch": 1643} {"train_loss": -10.464771270751953, "global_step": 276156, "epoch": 1643} {"train_loss": -10.241837501525879, "global_step": 276157, "epoch": 1643} {"train_loss": -10.613053321838379, "global_step": 276158, "epoch": 1643} {"train_loss": -11.019037246704102, "global_step": 276159, "epoch": 1643} {"train_loss": -10.441266059875488, "global_step": 276160, "epoch": 1643} {"train_loss": -11.256962776184082, "global_step": 276161, "epoch": 1643} {"train_loss": -11.061986923217773, "global_step": 276162, "epoch": 1643} {"train_loss": -11.220553398132324, "global_step": 276163, "epoch": 1643} {"train_loss": -11.025086402893066, "global_step": 276164, "epoch": 1643} {"train_loss": -11.051483154296875, "global_step": 276165, "epoch": 1643} {"train_loss": -11.05957317352295, "global_step": 276166, "epoch": 1643} {"train_loss": -11.527092933654785, "global_step": 276167, "epoch": 1643} {"train_loss": -11.40643310546875, "global_step": 276168, "epoch": 1643} {"train_loss": -11.464336395263672, "global_step": 276169, "epoch": 1643} {"train_loss": -11.583481788635254, "global_step": 276170, "epoch": 1643} {"train_loss": -11.24575424194336, "global_step": 276171, "epoch": 1643} {"train_loss": -11.757955551147461, "global_step": 276172, "epoch": 1643} {"train_loss": -11.566082954406738, "global_step": 276173, "epoch": 1643} {"train_loss": -11.609193801879883, "global_step": 276174, "epoch": 1643} {"train_loss": -11.726356506347656, "global_step": 276175, "epoch": 1643} {"train_loss": -11.497692108154297, "global_step": 276176, "epoch": 1643} {"train_loss": -11.574676513671875, "global_step": 276177, "epoch": 1643} {"train_loss": -11.642538070678711, "global_step": 276178, "epoch": 1643} {"train_loss": -11.8861083984375, "global_step": 276179, "epoch": 1643} {"train_loss": -11.868704795837402, "global_step": 276180, "epoch": 1643} {"train_loss": -11.817506790161133, "global_step": 276181, "epoch": 1643} {"train_loss": -11.612508773803711, "global_step": 276182, "epoch": 1643} {"train_loss": -11.908376693725586, "global_step": 276183, "epoch": 1643} {"train_loss": -11.739028930664062, "global_step": 276184, "epoch": 1643} {"train_loss": -11.652594566345215, "global_step": 276185, "epoch": 1643} {"train_loss": -11.81619644165039, "global_step": 276186, "epoch": 1643} {"train_loss": -11.761119842529297, "global_step": 276187, "epoch": 1643} {"train_loss": -11.934409141540527, "global_step": 276188, "epoch": 1643} {"train_loss": -11.853609085083008, "global_step": 276189, "epoch": 1643} {"train_loss": -12.015769958496094, "global_step": 276190, "epoch": 1643} {"train_loss": -11.279121608961196, "global_step": 276191, "epoch": 1643, "val_loss": 274080.125} {"train_loss": -11.836702346801758, "global_step": 276192, "epoch": 1644} {"train_loss": -11.91024112701416, "global_step": 276193, "epoch": 1644} {"train_loss": -12.040017127990723, "global_step": 276194, "epoch": 1644} {"train_loss": -11.894771575927734, "global_step": 276195, "epoch": 1644} {"train_loss": -11.835797309875488, "global_step": 276196, "epoch": 1644} {"train_loss": -11.706077575683594, "global_step": 276197, "epoch": 1644} {"train_loss": -11.709310531616211, "global_step": 276198, "epoch": 1644} {"train_loss": -11.820150375366211, "global_step": 276199, "epoch": 1644} {"train_loss": -12.136354446411133, "global_step": 276200, "epoch": 1644} {"train_loss": -12.041269302368164, "global_step": 276201, "epoch": 1644} {"train_loss": -12.14551830291748, "global_step": 276202, "epoch": 1644} {"train_loss": -12.002275466918945, "global_step": 276203, "epoch": 1644} {"train_loss": -12.129193305969238, "global_step": 276204, "epoch": 1644} {"train_loss": -12.091836929321289, "global_step": 276205, "epoch": 1644} {"train_loss": -12.031346321105957, "global_step": 276206, "epoch": 1644} {"train_loss": -12.051064491271973, "global_step": 276207, "epoch": 1644} {"train_loss": -11.91946792602539, "global_step": 276208, "epoch": 1644} {"train_loss": -12.0872802734375, "global_step": 276209, "epoch": 1644} {"train_loss": -11.919475555419922, "global_step": 276210, "epoch": 1644} {"train_loss": -11.997520446777344, "global_step": 276211, "epoch": 1644} {"train_loss": -11.758010864257812, "global_step": 276212, "epoch": 1644} {"train_loss": -12.118307113647461, "global_step": 276213, "epoch": 1644} {"train_loss": -12.081072807312012, "global_step": 276214, "epoch": 1644} {"train_loss": -11.965384483337402, "global_step": 276215, "epoch": 1644} {"train_loss": -11.973808288574219, "global_step": 276216, "epoch": 1644} {"train_loss": -12.048627853393555, "global_step": 276217, "epoch": 1644} {"train_loss": -12.16946792602539, "global_step": 276218, "epoch": 1644} {"train_loss": -12.012574195861816, "global_step": 276219, "epoch": 1644} {"train_loss": -12.050882339477539, "global_step": 276220, "epoch": 1644} {"train_loss": -11.81625747680664, "global_step": 276221, "epoch": 1644} {"train_loss": -12.264059066772461, "global_step": 276222, "epoch": 1644} {"train_loss": -11.87460708618164, "global_step": 276223, "epoch": 1644} {"train_loss": -11.97336196899414, "global_step": 276224, "epoch": 1644} {"train_loss": -11.904441833496094, "global_step": 276225, "epoch": 1644} {"train_loss": -12.06232738494873, "global_step": 276226, "epoch": 1644} {"train_loss": -11.726523399353027, "global_step": 276227, "epoch": 1644} {"train_loss": -11.41217041015625, "global_step": 276228, "epoch": 1644} {"train_loss": -11.566308975219727, "global_step": 276229, "epoch": 1644} {"train_loss": -12.016130447387695, "global_step": 276230, "epoch": 1644} {"train_loss": -11.987464904785156, "global_step": 276231, "epoch": 1644} {"train_loss": -12.015040397644043, "global_step": 276232, "epoch": 1644} {"train_loss": -12.212361335754395, "global_step": 276233, "epoch": 1644} {"train_loss": -11.880030632019043, "global_step": 276234, "epoch": 1644} {"train_loss": -12.204324722290039, "global_step": 276235, "epoch": 1644} {"train_loss": -12.161842346191406, "global_step": 276236, "epoch": 1644} {"train_loss": -11.921368598937988, "global_step": 276237, "epoch": 1644} {"train_loss": -12.195980072021484, "global_step": 276238, "epoch": 1644} {"train_loss": -12.307462692260742, "global_step": 276239, "epoch": 1644} {"train_loss": -11.975519180297852, "global_step": 276240, "epoch": 1644} {"train_loss": -12.009329795837402, "global_step": 276241, "epoch": 1644} {"train_loss": -11.697216033935547, "global_step": 276242, "epoch": 1644} {"train_loss": -11.835494995117188, "global_step": 276243, "epoch": 1644} {"train_loss": -11.777037620544434, "global_step": 276244, "epoch": 1644} {"train_loss": -12.059762954711914, "global_step": 276245, "epoch": 1644} {"train_loss": -12.08618450164795, "global_step": 276246, "epoch": 1644} {"train_loss": -12.072625160217285, "global_step": 276247, "epoch": 1644} {"train_loss": -12.04200267791748, "global_step": 276248, "epoch": 1644} {"train_loss": -12.01474380493164, "global_step": 276249, "epoch": 1644} {"train_loss": -12.00532341003418, "global_step": 276250, "epoch": 1644} {"train_loss": -11.852314949035645, "global_step": 276251, "epoch": 1644} {"train_loss": -12.073104858398438, "global_step": 276252, "epoch": 1644} {"train_loss": -12.0659818649292, "global_step": 276253, "epoch": 1644} {"train_loss": -11.839679718017578, "global_step": 276254, "epoch": 1644} {"train_loss": -12.175798416137695, "global_step": 276255, "epoch": 1644} {"train_loss": -11.876082420349121, "global_step": 276256, "epoch": 1644} {"train_loss": -12.04374885559082, "global_step": 276257, "epoch": 1644} {"train_loss": -11.840776443481445, "global_step": 276258, "epoch": 1644} {"train_loss": -11.78970718383789, "global_step": 276259, "epoch": 1644} {"train_loss": -11.67022705078125, "global_step": 276260, "epoch": 1644} {"train_loss": -11.896713256835938, "global_step": 276261, "epoch": 1644} {"train_loss": -11.311206817626953, "global_step": 276262, "epoch": 1644} {"train_loss": -11.965201377868652, "global_step": 276263, "epoch": 1644} {"train_loss": -11.526348114013672, "global_step": 276264, "epoch": 1644} {"train_loss": -11.547816276550293, "global_step": 276265, "epoch": 1644} {"train_loss": -11.660490036010742, "global_step": 276266, "epoch": 1644} {"train_loss": -11.536478042602539, "global_step": 276267, "epoch": 1644} {"train_loss": -10.79570198059082, "global_step": 276268, "epoch": 1644} {"train_loss": -10.425368309020996, "global_step": 276269, "epoch": 1644} {"train_loss": -9.757822036743164, "global_step": 276270, "epoch": 1644} {"train_loss": -9.226438522338867, "global_step": 276271, "epoch": 1644} {"train_loss": -10.859186172485352, "global_step": 276272, "epoch": 1644} {"train_loss": -8.45853328704834, "global_step": 276273, "epoch": 1644} {"train_loss": -9.851042747497559, "global_step": 276274, "epoch": 1644} {"train_loss": -10.51843547821045, "global_step": 276275, "epoch": 1644} {"train_loss": -10.310094833374023, "global_step": 276276, "epoch": 1644} {"train_loss": -9.458597183227539, "global_step": 276277, "epoch": 1644} {"train_loss": -10.298530578613281, "global_step": 276278, "epoch": 1644} {"train_loss": -9.909339904785156, "global_step": 276279, "epoch": 1644} {"train_loss": -10.421642303466797, "global_step": 276280, "epoch": 1644} {"train_loss": -10.025321960449219, "global_step": 276281, "epoch": 1644} {"train_loss": -9.383651733398438, "global_step": 276282, "epoch": 1644} {"train_loss": -10.02681827545166, "global_step": 276283, "epoch": 1644} {"train_loss": -9.918184280395508, "global_step": 276284, "epoch": 1644} {"train_loss": -10.207138061523438, "global_step": 276285, "epoch": 1644} {"train_loss": -9.618265151977539, "global_step": 276286, "epoch": 1644} {"train_loss": -10.73682689666748, "global_step": 276287, "epoch": 1644} {"train_loss": -10.058595657348633, "global_step": 276288, "epoch": 1644} {"train_loss": -10.744207382202148, "global_step": 276289, "epoch": 1644} {"train_loss": -10.627537727355957, "global_step": 276290, "epoch": 1644} {"train_loss": -10.650717735290527, "global_step": 276291, "epoch": 1644} {"train_loss": -10.892908096313477, "global_step": 276292, "epoch": 1644} {"train_loss": -10.725067138671875, "global_step": 276293, "epoch": 1644} {"train_loss": -10.97930908203125, "global_step": 276294, "epoch": 1644} {"train_loss": -11.342461585998535, "global_step": 276295, "epoch": 1644} {"train_loss": -11.023653030395508, "global_step": 276296, "epoch": 1644} {"train_loss": -11.357831001281738, "global_step": 276297, "epoch": 1644} {"train_loss": -11.252243041992188, "global_step": 276298, "epoch": 1644} {"train_loss": -11.478989601135254, "global_step": 276299, "epoch": 1644} {"train_loss": -11.437324523925781, "global_step": 276300, "epoch": 1644} {"train_loss": -11.677919387817383, "global_step": 276301, "epoch": 1644} {"train_loss": -11.413928985595703, "global_step": 276302, "epoch": 1644} {"train_loss": -11.500421524047852, "global_step": 276303, "epoch": 1644} {"train_loss": -11.356587409973145, "global_step": 276304, "epoch": 1644} {"train_loss": -11.152135848999023, "global_step": 276305, "epoch": 1644} {"train_loss": -11.707365036010742, "global_step": 276306, "epoch": 1644} {"train_loss": -11.503178596496582, "global_step": 276307, "epoch": 1644} {"train_loss": -11.353744506835938, "global_step": 276308, "epoch": 1644} {"train_loss": -11.52614688873291, "global_step": 276309, "epoch": 1644} {"train_loss": -11.77787971496582, "global_step": 276310, "epoch": 1644} {"train_loss": -11.340099334716797, "global_step": 276311, "epoch": 1644} {"train_loss": -11.836099624633789, "global_step": 276312, "epoch": 1644} {"train_loss": -11.332738876342773, "global_step": 276313, "epoch": 1644} {"train_loss": -11.876507759094238, "global_step": 276314, "epoch": 1644} {"train_loss": -11.412397384643555, "global_step": 276315, "epoch": 1644} {"train_loss": -11.847318649291992, "global_step": 276316, "epoch": 1644} {"train_loss": -11.71085262298584, "global_step": 276317, "epoch": 1644} {"train_loss": -11.618688583374023, "global_step": 276318, "epoch": 1644} {"train_loss": -11.622392654418945, "global_step": 276319, "epoch": 1644} {"train_loss": -11.288061141967773, "global_step": 276320, "epoch": 1644} {"train_loss": -11.676995277404785, "global_step": 276321, "epoch": 1644} {"train_loss": -11.569375991821289, "global_step": 276322, "epoch": 1644} {"train_loss": -11.586482048034668, "global_step": 276323, "epoch": 1644} {"train_loss": -11.875051498413086, "global_step": 276324, "epoch": 1644} {"train_loss": -11.62317180633545, "global_step": 276325, "epoch": 1644} {"train_loss": -11.650821685791016, "global_step": 276326, "epoch": 1644} {"train_loss": -11.721689224243164, "global_step": 276327, "epoch": 1644} {"train_loss": -11.588668823242188, "global_step": 276328, "epoch": 1644} {"train_loss": -11.812522888183594, "global_step": 276329, "epoch": 1644} {"train_loss": -11.786301612854004, "global_step": 276330, "epoch": 1644} {"train_loss": -11.787595748901367, "global_step": 276331, "epoch": 1644} {"train_loss": -11.884784698486328, "global_step": 276332, "epoch": 1644} {"train_loss": -11.827924728393555, "global_step": 276333, "epoch": 1644} {"train_loss": -12.032279014587402, "global_step": 276334, "epoch": 1644} {"train_loss": -11.959638595581055, "global_step": 276335, "epoch": 1644} {"train_loss": -12.062206268310547, "global_step": 276336, "epoch": 1644} {"train_loss": -11.836000442504883, "global_step": 276337, "epoch": 1644} {"train_loss": -11.931047439575195, "global_step": 276338, "epoch": 1644} {"train_loss": -12.12832260131836, "global_step": 276339, "epoch": 1644} {"train_loss": -11.923571586608887, "global_step": 276340, "epoch": 1644} {"train_loss": -11.962770462036133, "global_step": 276341, "epoch": 1644} {"train_loss": -11.967924118041992, "global_step": 276342, "epoch": 1644} {"train_loss": -12.244089126586914, "global_step": 276343, "epoch": 1644} {"train_loss": -12.123401641845703, "global_step": 276344, "epoch": 1644} {"train_loss": -12.269567489624023, "global_step": 276345, "epoch": 1644} {"train_loss": -12.054677963256836, "global_step": 276346, "epoch": 1644} {"train_loss": -11.95114517211914, "global_step": 276347, "epoch": 1644} {"train_loss": -12.177831649780273, "global_step": 276348, "epoch": 1644} {"train_loss": -12.346019744873047, "global_step": 276349, "epoch": 1644} {"train_loss": -12.225847244262695, "global_step": 276350, "epoch": 1644} {"train_loss": -12.147932052612305, "global_step": 276351, "epoch": 1644} {"train_loss": -11.927531242370605, "global_step": 276352, "epoch": 1644} {"train_loss": -12.17766284942627, "global_step": 276353, "epoch": 1644} {"train_loss": -12.398751258850098, "global_step": 276354, "epoch": 1644} {"train_loss": -12.271517753601074, "global_step": 276355, "epoch": 1644} {"train_loss": -12.390586853027344, "global_step": 276356, "epoch": 1644} {"train_loss": -12.329206466674805, "global_step": 276357, "epoch": 1644} {"train_loss": -12.110797882080078, "global_step": 276358, "epoch": 1644} {"train_loss": -11.59751452150799, "global_step": 276359, "epoch": 1644, "val_loss": 274298.0625} {"train_loss": -12.219438552856445, "global_step": 276360, "epoch": 1645} {"train_loss": -12.338138580322266, "global_step": 276361, "epoch": 1645} {"train_loss": -12.155481338500977, "global_step": 276362, "epoch": 1645} {"train_loss": -12.317442893981934, "global_step": 276363, "epoch": 1645} {"train_loss": -12.245514869689941, "global_step": 276364, "epoch": 1645} {"train_loss": -12.145196914672852, "global_step": 276365, "epoch": 1645} {"train_loss": -12.31158447265625, "global_step": 276366, "epoch": 1645} {"train_loss": -12.306295394897461, "global_step": 276367, "epoch": 1645} {"train_loss": -12.132813453674316, "global_step": 276368, "epoch": 1645} {"train_loss": -12.2598876953125, "global_step": 276369, "epoch": 1645} {"train_loss": -11.883916854858398, "global_step": 276370, "epoch": 1645} {"train_loss": -12.0179443359375, "global_step": 276371, "epoch": 1645} {"train_loss": -12.198528289794922, "global_step": 276372, "epoch": 1645} {"train_loss": -11.835899353027344, "global_step": 276373, "epoch": 1645} {"train_loss": -12.260833740234375, "global_step": 276374, "epoch": 1645} {"train_loss": -12.018829345703125, "global_step": 276375, "epoch": 1645} {"train_loss": -11.684062004089355, "global_step": 276376, "epoch": 1645} {"train_loss": -12.644256591796875, "global_step": 276377, "epoch": 1645} {"train_loss": -11.920690536499023, "global_step": 276378, "epoch": 1645} {"train_loss": -12.048698425292969, "global_step": 276379, "epoch": 1645} {"train_loss": -12.22790813446045, "global_step": 276380, "epoch": 1645} {"train_loss": -11.680203437805176, "global_step": 276381, "epoch": 1645} {"train_loss": -11.842422485351562, "global_step": 276382, "epoch": 1645} {"train_loss": -12.1973876953125, "global_step": 276383, "epoch": 1645} {"train_loss": -12.249841690063477, "global_step": 276384, "epoch": 1645} {"train_loss": -12.084858894348145, "global_step": 276385, "epoch": 1645} {"train_loss": -12.079071998596191, "global_step": 276386, "epoch": 1645} {"train_loss": -11.930841445922852, "global_step": 276387, "epoch": 1645} {"train_loss": -12.156669616699219, "global_step": 276388, "epoch": 1645} {"train_loss": -12.231670379638672, "global_step": 276389, "epoch": 1645} {"train_loss": -11.720123291015625, "global_step": 276390, "epoch": 1645} {"train_loss": -12.06410026550293, "global_step": 276391, "epoch": 1645} {"train_loss": -12.293386459350586, "global_step": 276392, "epoch": 1645} {"train_loss": -12.063931465148926, "global_step": 276393, "epoch": 1645} {"train_loss": -11.83526611328125, "global_step": 276394, "epoch": 1645} {"train_loss": -11.805209159851074, "global_step": 276395, "epoch": 1645} {"train_loss": -12.080641746520996, "global_step": 276396, "epoch": 1645} {"train_loss": -11.467353820800781, "global_step": 276397, "epoch": 1645} {"train_loss": -12.085260391235352, "global_step": 276398, "epoch": 1645} {"train_loss": -12.013622283935547, "global_step": 276399, "epoch": 1645} {"train_loss": -12.034055709838867, "global_step": 276400, "epoch": 1645} {"train_loss": -10.97046947479248, "global_step": 276401, "epoch": 1645} {"train_loss": -11.993513107299805, "global_step": 276402, "epoch": 1645} {"train_loss": -10.926895141601562, "global_step": 276403, "epoch": 1645} {"train_loss": -11.81958293914795, "global_step": 276404, "epoch": 1645} {"train_loss": -11.540226936340332, "global_step": 276405, "epoch": 1645} {"train_loss": -10.75770378112793, "global_step": 276406, "epoch": 1645} {"train_loss": -11.509806632995605, "global_step": 276407, "epoch": 1645} {"train_loss": -11.013315200805664, "global_step": 276408, "epoch": 1645} {"train_loss": -11.468443870544434, "global_step": 276409, "epoch": 1645} {"train_loss": -10.549041748046875, "global_step": 276410, "epoch": 1645} {"train_loss": -11.174559593200684, "global_step": 276411, "epoch": 1645} {"train_loss": -10.411568641662598, "global_step": 276412, "epoch": 1645} {"train_loss": -10.297175407409668, "global_step": 276413, "epoch": 1645} {"train_loss": -11.776372909545898, "global_step": 276414, "epoch": 1645} {"train_loss": -10.277240753173828, "global_step": 276415, "epoch": 1645} {"train_loss": -10.598133087158203, "global_step": 276416, "epoch": 1645} {"train_loss": -10.64273452758789, "global_step": 276417, "epoch": 1645} {"train_loss": -11.208259582519531, "global_step": 276418, "epoch": 1645} {"train_loss": -10.534662246704102, "global_step": 276419, "epoch": 1645} {"train_loss": -11.149723052978516, "global_step": 276420, "epoch": 1645} {"train_loss": -10.11756420135498, "global_step": 276421, "epoch": 1645} {"train_loss": -11.626948356628418, "global_step": 276422, "epoch": 1645} {"train_loss": -11.040355682373047, "global_step": 276423, "epoch": 1645} {"train_loss": -10.970157623291016, "global_step": 276424, "epoch": 1645} {"train_loss": -11.650824546813965, "global_step": 276425, "epoch": 1645} {"train_loss": -10.843127250671387, "global_step": 276426, "epoch": 1645} {"train_loss": -11.620361328125, "global_step": 276427, "epoch": 1645} {"train_loss": -11.068604469299316, "global_step": 276428, "epoch": 1645} {"train_loss": -10.504456520080566, "global_step": 276429, "epoch": 1645} {"train_loss": -11.348115921020508, "global_step": 276430, "epoch": 1645} {"train_loss": -10.82446575164795, "global_step": 276431, "epoch": 1645} {"train_loss": -11.446718215942383, "global_step": 276432, "epoch": 1645} {"train_loss": -10.98033332824707, "global_step": 276433, "epoch": 1645} {"train_loss": -11.374265670776367, "global_step": 276434, "epoch": 1645} {"train_loss": -11.360158920288086, "global_step": 276435, "epoch": 1645} {"train_loss": -11.596123695373535, "global_step": 276436, "epoch": 1645} {"train_loss": -11.201043128967285, "global_step": 276437, "epoch": 1645} {"train_loss": -11.474983215332031, "global_step": 276438, "epoch": 1645} {"train_loss": -11.62881851196289, "global_step": 276439, "epoch": 1645} {"train_loss": -11.493104934692383, "global_step": 276440, "epoch": 1645} {"train_loss": -11.783671379089355, "global_step": 276441, "epoch": 1645} {"train_loss": -11.935870170593262, "global_step": 276442, "epoch": 1645} {"train_loss": -11.897716522216797, "global_step": 276443, "epoch": 1645} {"train_loss": -11.69151496887207, "global_step": 276444, "epoch": 1645} {"train_loss": -11.785422325134277, "global_step": 276445, "epoch": 1645} {"train_loss": -11.887088775634766, "global_step": 276446, "epoch": 1645} {"train_loss": -11.688834190368652, "global_step": 276447, "epoch": 1645} {"train_loss": -11.575637817382812, "global_step": 276448, "epoch": 1645} {"train_loss": -11.74012565612793, "global_step": 276449, "epoch": 1645} {"train_loss": -11.650354385375977, "global_step": 276450, "epoch": 1645} {"train_loss": -11.998150825500488, "global_step": 276451, "epoch": 1645} {"train_loss": -11.848154067993164, "global_step": 276452, "epoch": 1645} {"train_loss": -12.000545501708984, "global_step": 276453, "epoch": 1645} {"train_loss": -11.808996200561523, "global_step": 276454, "epoch": 1645} {"train_loss": -11.619462966918945, "global_step": 276455, "epoch": 1645} {"train_loss": -11.686447143554688, "global_step": 276456, "epoch": 1645} {"train_loss": -12.223965644836426, "global_step": 276457, "epoch": 1645} {"train_loss": -11.543661117553711, "global_step": 276458, "epoch": 1645} {"train_loss": -12.166940689086914, "global_step": 276459, "epoch": 1645} {"train_loss": -11.952751159667969, "global_step": 276460, "epoch": 1645} {"train_loss": -11.965435028076172, "global_step": 276461, "epoch": 1645} {"train_loss": -11.743614196777344, "global_step": 276462, "epoch": 1645} {"train_loss": -12.001103401184082, "global_step": 276463, "epoch": 1645} {"train_loss": -11.897470474243164, "global_step": 276464, "epoch": 1645} {"train_loss": -12.06009292602539, "global_step": 276465, "epoch": 1645} {"train_loss": -11.863314628601074, "global_step": 276466, "epoch": 1645} {"train_loss": -11.623556137084961, "global_step": 276467, "epoch": 1645} {"train_loss": -11.929403305053711, "global_step": 276468, "epoch": 1645} {"train_loss": -11.96926498413086, "global_step": 276469, "epoch": 1645} {"train_loss": -11.89558219909668, "global_step": 276470, "epoch": 1645} {"train_loss": -11.92738151550293, "global_step": 276471, "epoch": 1645} {"train_loss": -12.358509063720703, "global_step": 276472, "epoch": 1645} {"train_loss": -11.937235832214355, "global_step": 276473, "epoch": 1645} {"train_loss": -12.228846549987793, "global_step": 276474, "epoch": 1645} {"train_loss": -11.042797088623047, "global_step": 276475, "epoch": 1645} {"train_loss": -12.218488693237305, "global_step": 276476, "epoch": 1645} {"train_loss": -12.096145629882812, "global_step": 276477, "epoch": 1645} {"train_loss": -12.161392211914062, "global_step": 276478, "epoch": 1645} {"train_loss": -11.925993919372559, "global_step": 276479, "epoch": 1645} {"train_loss": -11.890003204345703, "global_step": 276480, "epoch": 1645} {"train_loss": -12.130258560180664, "global_step": 276481, "epoch": 1645} {"train_loss": -11.991552352905273, "global_step": 276482, "epoch": 1645} {"train_loss": -12.053409576416016, "global_step": 276483, "epoch": 1645} {"train_loss": -11.742406845092773, "global_step": 276484, "epoch": 1645} {"train_loss": -12.279913902282715, "global_step": 276485, "epoch": 1645} {"train_loss": -12.2227144241333, "global_step": 276486, "epoch": 1645} {"train_loss": -11.978612899780273, "global_step": 276487, "epoch": 1645} {"train_loss": -12.070682525634766, "global_step": 276488, "epoch": 1645} {"train_loss": -12.33845329284668, "global_step": 276489, "epoch": 1645} {"train_loss": -12.141484260559082, "global_step": 276490, "epoch": 1645} {"train_loss": -11.972721099853516, "global_step": 276491, "epoch": 1645} {"train_loss": -12.203208923339844, "global_step": 276492, "epoch": 1645} {"train_loss": -12.095227241516113, "global_step": 276493, "epoch": 1645} {"train_loss": -11.4827880859375, "global_step": 276494, "epoch": 1645} {"train_loss": -11.395740509033203, "global_step": 276495, "epoch": 1645} {"train_loss": -11.993376731872559, "global_step": 276496, "epoch": 1645} {"train_loss": -11.715372085571289, "global_step": 276497, "epoch": 1645} {"train_loss": -10.927608489990234, "global_step": 276498, "epoch": 1645} {"train_loss": -12.146474838256836, "global_step": 276499, "epoch": 1645} {"train_loss": -11.01781177520752, "global_step": 276500, "epoch": 1645} {"train_loss": -11.694219589233398, "global_step": 276501, "epoch": 1645} {"train_loss": -11.832327842712402, "global_step": 276502, "epoch": 1645} {"train_loss": -11.729188919067383, "global_step": 276503, "epoch": 1645} {"train_loss": -11.444906234741211, "global_step": 276504, "epoch": 1645} {"train_loss": -10.121959686279297, "global_step": 276505, "epoch": 1645} {"train_loss": -11.901344299316406, "global_step": 276506, "epoch": 1645} {"train_loss": -10.379682540893555, "global_step": 276507, "epoch": 1645} {"train_loss": -11.861846923828125, "global_step": 276508, "epoch": 1645} {"train_loss": -10.464998245239258, "global_step": 276509, "epoch": 1645} {"train_loss": -9.860057830810547, "global_step": 276510, "epoch": 1645} {"train_loss": -10.862174987792969, "global_step": 276511, "epoch": 1645} {"train_loss": -9.904155731201172, "global_step": 276512, "epoch": 1645} {"train_loss": -9.999748229980469, "global_step": 276513, "epoch": 1645} {"train_loss": -10.219098091125488, "global_step": 276514, "epoch": 1645} {"train_loss": -8.838872909545898, "global_step": 276515, "epoch": 1645} {"train_loss": -11.203493118286133, "global_step": 276516, "epoch": 1645} {"train_loss": -9.699597358703613, "global_step": 276517, "epoch": 1645} {"train_loss": -10.641243934631348, "global_step": 276518, "epoch": 1645} {"train_loss": -10.864173889160156, "global_step": 276519, "epoch": 1645} {"train_loss": -10.797765731811523, "global_step": 276520, "epoch": 1645} {"train_loss": -10.648056030273438, "global_step": 276521, "epoch": 1645} {"train_loss": -10.495777130126953, "global_step": 276522, "epoch": 1645} {"train_loss": -11.533662796020508, "global_step": 276523, "epoch": 1645} {"train_loss": -9.782649993896484, "global_step": 276524, "epoch": 1645} {"train_loss": -11.047199249267578, "global_step": 276525, "epoch": 1645} {"train_loss": -10.983858108520508, "global_step": 276526, "epoch": 1645} {"train_loss": -11.562101273309617, "global_step": 276527, "epoch": 1645, "val_loss": 271298.90625, "train_action_mse_error": 0.6541115045547485} {"train_loss": -11.631080627441406, "global_step": 276528, "epoch": 1646} {"train_loss": -9.85322380065918, "global_step": 276529, "epoch": 1646} {"train_loss": -11.263797760009766, "global_step": 276530, "epoch": 1646} {"train_loss": -10.001445770263672, "global_step": 276531, "epoch": 1646} {"train_loss": -11.200515747070312, "global_step": 276532, "epoch": 1646} {"train_loss": -10.476863861083984, "global_step": 276533, "epoch": 1646} {"train_loss": -10.35818099975586, "global_step": 276534, "epoch": 1646} {"train_loss": -11.248205184936523, "global_step": 276535, "epoch": 1646} {"train_loss": -10.592974662780762, "global_step": 276536, "epoch": 1646} {"train_loss": -10.384466171264648, "global_step": 276537, "epoch": 1646} {"train_loss": -10.94173526763916, "global_step": 276538, "epoch": 1646} {"train_loss": -10.851478576660156, "global_step": 276539, "epoch": 1646} {"train_loss": -10.902061462402344, "global_step": 276540, "epoch": 1646} {"train_loss": -11.535588264465332, "global_step": 276541, "epoch": 1646} {"train_loss": -11.11076545715332, "global_step": 276542, "epoch": 1646} {"train_loss": -11.469379425048828, "global_step": 276543, "epoch": 1646} {"train_loss": -11.413291931152344, "global_step": 276544, "epoch": 1646} {"train_loss": -11.340051651000977, "global_step": 276545, "epoch": 1646} {"train_loss": -11.507692337036133, "global_step": 276546, "epoch": 1646} {"train_loss": -11.036709785461426, "global_step": 276547, "epoch": 1646} {"train_loss": -11.294807434082031, "global_step": 276548, "epoch": 1646} {"train_loss": -11.706870079040527, "global_step": 276549, "epoch": 1646} {"train_loss": -11.47785758972168, "global_step": 276550, "epoch": 1646} {"train_loss": -11.82535171508789, "global_step": 276551, "epoch": 1646} {"train_loss": -11.567607879638672, "global_step": 276552, "epoch": 1646} {"train_loss": -11.72035026550293, "global_step": 276553, "epoch": 1646} {"train_loss": -11.581377029418945, "global_step": 276554, "epoch": 1646} {"train_loss": -11.533590316772461, "global_step": 276555, "epoch": 1646} {"train_loss": -11.636610984802246, "global_step": 276556, "epoch": 1646} {"train_loss": -11.468605995178223, "global_step": 276557, "epoch": 1646} {"train_loss": -11.455879211425781, "global_step": 276558, "epoch": 1646} {"train_loss": -11.880634307861328, "global_step": 276559, "epoch": 1646} {"train_loss": -11.372941970825195, "global_step": 276560, "epoch": 1646} {"train_loss": -11.795924186706543, "global_step": 276561, "epoch": 1646} {"train_loss": -11.46976089477539, "global_step": 276562, "epoch": 1646} {"train_loss": -11.691902160644531, "global_step": 276563, "epoch": 1646} {"train_loss": -11.69570541381836, "global_step": 276564, "epoch": 1646} {"train_loss": -11.77913761138916, "global_step": 276565, "epoch": 1646} {"train_loss": -11.797142028808594, "global_step": 276566, "epoch": 1646} {"train_loss": -11.897990226745605, "global_step": 276567, "epoch": 1646} {"train_loss": -11.784038543701172, "global_step": 276568, "epoch": 1646} {"train_loss": -11.869575500488281, "global_step": 276569, "epoch": 1646} {"train_loss": -11.741036415100098, "global_step": 276570, "epoch": 1646} {"train_loss": -11.955904006958008, "global_step": 276571, "epoch": 1646} {"train_loss": -11.933540344238281, "global_step": 276572, "epoch": 1646} {"train_loss": -11.892229080200195, "global_step": 276573, "epoch": 1646} {"train_loss": -12.011611938476562, "global_step": 276574, "epoch": 1646} {"train_loss": -11.633630752563477, "global_step": 276575, "epoch": 1646} {"train_loss": -11.732830047607422, "global_step": 276576, "epoch": 1646} {"train_loss": -11.645261764526367, "global_step": 276577, "epoch": 1646} {"train_loss": -11.783086776733398, "global_step": 276578, "epoch": 1646} {"train_loss": -11.778162956237793, "global_step": 276579, "epoch": 1646} {"train_loss": -11.663947105407715, "global_step": 276580, "epoch": 1646} {"train_loss": -11.93791389465332, "global_step": 276581, "epoch": 1646} {"train_loss": -11.763042449951172, "global_step": 276582, "epoch": 1646} {"train_loss": -11.847768783569336, "global_step": 276583, "epoch": 1646} {"train_loss": -11.732234954833984, "global_step": 276584, "epoch": 1646} {"train_loss": -12.182907104492188, "global_step": 276585, "epoch": 1646} {"train_loss": -11.718282699584961, "global_step": 276586, "epoch": 1646} {"train_loss": -11.878290176391602, "global_step": 276587, "epoch": 1646} {"train_loss": -11.773760795593262, "global_step": 276588, "epoch": 1646} {"train_loss": -11.995611190795898, "global_step": 276589, "epoch": 1646} {"train_loss": -12.086531639099121, "global_step": 276590, "epoch": 1646} {"train_loss": -11.816615104675293, "global_step": 276591, "epoch": 1646} {"train_loss": -12.197772026062012, "global_step": 276592, "epoch": 1646} {"train_loss": -12.068041801452637, "global_step": 276593, "epoch": 1646} {"train_loss": -12.152801513671875, "global_step": 276594, "epoch": 1646} {"train_loss": -12.136898040771484, "global_step": 276595, "epoch": 1646} {"train_loss": -11.967183113098145, "global_step": 276596, "epoch": 1646} {"train_loss": -11.96664810180664, "global_step": 276597, "epoch": 1646} {"train_loss": -12.073569297790527, "global_step": 276598, "epoch": 1646} {"train_loss": -12.284826278686523, "global_step": 276599, "epoch": 1646} {"train_loss": -12.103967666625977, "global_step": 276600, "epoch": 1646} {"train_loss": -12.4176025390625, "global_step": 276601, "epoch": 1646} {"train_loss": -12.113029479980469, "global_step": 276602, "epoch": 1646} {"train_loss": -12.199287414550781, "global_step": 276603, "epoch": 1646} {"train_loss": -11.975120544433594, "global_step": 276604, "epoch": 1646} {"train_loss": -11.7628173828125, "global_step": 276605, "epoch": 1646} {"train_loss": -12.239181518554688, "global_step": 276606, "epoch": 1646} {"train_loss": -12.032515525817871, "global_step": 276607, "epoch": 1646} {"train_loss": -12.425056457519531, "global_step": 276608, "epoch": 1646} {"train_loss": -11.90980339050293, "global_step": 276609, "epoch": 1646} {"train_loss": -12.094646453857422, "global_step": 276610, "epoch": 1646} {"train_loss": -12.172646522521973, "global_step": 276611, "epoch": 1646} {"train_loss": -12.189013481140137, "global_step": 276612, "epoch": 1646} {"train_loss": -11.828363418579102, "global_step": 276613, "epoch": 1646} {"train_loss": -12.221420288085938, "global_step": 276614, "epoch": 1646} {"train_loss": -12.233924865722656, "global_step": 276615, "epoch": 1646} {"train_loss": -12.075204849243164, "global_step": 276616, "epoch": 1646} {"train_loss": -12.208142280578613, "global_step": 276617, "epoch": 1646} {"train_loss": -12.038644790649414, "global_step": 276618, "epoch": 1646} {"train_loss": -11.888300895690918, "global_step": 276619, "epoch": 1646} {"train_loss": -12.286298751831055, "global_step": 276620, "epoch": 1646} {"train_loss": -12.16946792602539, "global_step": 276621, "epoch": 1646} {"train_loss": -11.904112815856934, "global_step": 276622, "epoch": 1646} {"train_loss": -12.231513977050781, "global_step": 276623, "epoch": 1646} {"train_loss": -12.242591857910156, "global_step": 276624, "epoch": 1646} {"train_loss": -12.019067764282227, "global_step": 276625, "epoch": 1646} {"train_loss": -12.23710823059082, "global_step": 276626, "epoch": 1646} {"train_loss": -12.046302795410156, "global_step": 276627, "epoch": 1646} {"train_loss": -11.965681076049805, "global_step": 276628, "epoch": 1646} {"train_loss": -11.918658256530762, "global_step": 276629, "epoch": 1646} {"train_loss": -12.323732376098633, "global_step": 276630, "epoch": 1646} {"train_loss": -11.857412338256836, "global_step": 276631, "epoch": 1646} {"train_loss": -11.9555082321167, "global_step": 276632, "epoch": 1646} {"train_loss": -12.217676162719727, "global_step": 276633, "epoch": 1646} {"train_loss": -12.190282821655273, "global_step": 276634, "epoch": 1646} {"train_loss": -12.379180908203125, "global_step": 276635, "epoch": 1646} {"train_loss": -12.357995986938477, "global_step": 276636, "epoch": 1646} {"train_loss": -11.994022369384766, "global_step": 276637, "epoch": 1646} {"train_loss": -12.107616424560547, "global_step": 276638, "epoch": 1646} {"train_loss": -12.417341232299805, "global_step": 276639, "epoch": 1646} {"train_loss": -12.38409423828125, "global_step": 276640, "epoch": 1646} {"train_loss": -12.132294654846191, "global_step": 276641, "epoch": 1646} {"train_loss": -11.861773490905762, "global_step": 276642, "epoch": 1646} {"train_loss": -11.6991605758667, "global_step": 276643, "epoch": 1646} {"train_loss": -12.131315231323242, "global_step": 276644, "epoch": 1646} {"train_loss": -11.888320922851562, "global_step": 276645, "epoch": 1646} {"train_loss": -11.87105941772461, "global_step": 276646, "epoch": 1646} {"train_loss": -12.357606887817383, "global_step": 276647, "epoch": 1646} {"train_loss": -11.974651336669922, "global_step": 276648, "epoch": 1646} {"train_loss": -11.821876525878906, "global_step": 276649, "epoch": 1646} {"train_loss": -12.180126190185547, "global_step": 276650, "epoch": 1646} {"train_loss": -12.117928504943848, "global_step": 276651, "epoch": 1646} {"train_loss": -11.879356384277344, "global_step": 276652, "epoch": 1646} {"train_loss": -11.854743003845215, "global_step": 276653, "epoch": 1646} {"train_loss": -12.143973350524902, "global_step": 276654, "epoch": 1646} {"train_loss": -11.768453598022461, "global_step": 276655, "epoch": 1646} {"train_loss": -12.040641784667969, "global_step": 276656, "epoch": 1646} {"train_loss": -11.620058059692383, "global_step": 276657, "epoch": 1646} {"train_loss": -11.3461332321167, "global_step": 276658, "epoch": 1646} {"train_loss": -11.594210624694824, "global_step": 276659, "epoch": 1646} {"train_loss": -11.023042678833008, "global_step": 276660, "epoch": 1646} {"train_loss": -9.641521453857422, "global_step": 276661, "epoch": 1646} {"train_loss": -9.985146522521973, "global_step": 276662, "epoch": 1646} {"train_loss": -9.572999954223633, "global_step": 276663, "epoch": 1646} {"train_loss": -10.236074447631836, "global_step": 276664, "epoch": 1646} {"train_loss": -9.55723762512207, "global_step": 276665, "epoch": 1646} {"train_loss": -10.825777053833008, "global_step": 276666, "epoch": 1646} {"train_loss": -11.323567390441895, "global_step": 276667, "epoch": 1646} {"train_loss": -11.464566230773926, "global_step": 276668, "epoch": 1646} {"train_loss": -11.406071662902832, "global_step": 276669, "epoch": 1646} {"train_loss": -11.15368366241455, "global_step": 276670, "epoch": 1646} {"train_loss": -11.377812385559082, "global_step": 276671, "epoch": 1646} {"train_loss": -11.567359924316406, "global_step": 276672, "epoch": 1646} {"train_loss": -11.583541870117188, "global_step": 276673, "epoch": 1646} {"train_loss": -11.90708065032959, "global_step": 276674, "epoch": 1646} {"train_loss": -11.242874145507812, "global_step": 276675, "epoch": 1646} {"train_loss": -11.478876113891602, "global_step": 276676, "epoch": 1646} {"train_loss": -11.561702728271484, "global_step": 276677, "epoch": 1646} {"train_loss": -10.842376708984375, "global_step": 276678, "epoch": 1646} {"train_loss": -11.786506652832031, "global_step": 276679, "epoch": 1646} {"train_loss": -11.361907958984375, "global_step": 276680, "epoch": 1646} {"train_loss": -11.3659029006958, "global_step": 276681, "epoch": 1646} {"train_loss": -11.597203254699707, "global_step": 276682, "epoch": 1646} {"train_loss": -10.693154335021973, "global_step": 276683, "epoch": 1646} {"train_loss": -11.425558090209961, "global_step": 276684, "epoch": 1646} {"train_loss": -11.217764854431152, "global_step": 276685, "epoch": 1646} {"train_loss": -10.646782875061035, "global_step": 276686, "epoch": 1646} {"train_loss": -11.848275184631348, "global_step": 276687, "epoch": 1646} {"train_loss": -10.474291801452637, "global_step": 276688, "epoch": 1646} {"train_loss": -11.470563888549805, "global_step": 276689, "epoch": 1646} {"train_loss": -11.196327209472656, "global_step": 276690, "epoch": 1646} {"train_loss": -11.378631591796875, "global_step": 276691, "epoch": 1646} {"train_loss": -11.814868927001953, "global_step": 276692, "epoch": 1646} {"train_loss": -11.197725296020508, "global_step": 276693, "epoch": 1646} {"train_loss": -11.825485229492188, "global_step": 276694, "epoch": 1646} {"train_loss": -11.647747107914515, "global_step": 276695, "epoch": 1646, "val_loss": 273648.6875} {"train_loss": -11.37330436706543, "global_step": 276696, "epoch": 1647} {"train_loss": -11.40850830078125, "global_step": 276697, "epoch": 1647} {"train_loss": -11.344467163085938, "global_step": 276698, "epoch": 1647} {"train_loss": -11.513544082641602, "global_step": 276699, "epoch": 1647} {"train_loss": -11.70396614074707, "global_step": 276700, "epoch": 1647} {"train_loss": -11.705400466918945, "global_step": 276701, "epoch": 1647} {"train_loss": -11.725933074951172, "global_step": 276702, "epoch": 1647} {"train_loss": -11.752116203308105, "global_step": 276703, "epoch": 1647} {"train_loss": -11.914228439331055, "global_step": 276704, "epoch": 1647} {"train_loss": -11.878716468811035, "global_step": 276705, "epoch": 1647} {"train_loss": -12.198869705200195, "global_step": 276706, "epoch": 1647} {"train_loss": -11.96178913116455, "global_step": 276707, "epoch": 1647} {"train_loss": -12.022245407104492, "global_step": 276708, "epoch": 1647} {"train_loss": -11.644002914428711, "global_step": 276709, "epoch": 1647} {"train_loss": -12.010772705078125, "global_step": 276710, "epoch": 1647} {"train_loss": -11.925508499145508, "global_step": 276711, "epoch": 1647} {"train_loss": -11.879712104797363, "global_step": 276712, "epoch": 1647} {"train_loss": -12.119880676269531, "global_step": 276713, "epoch": 1647} {"train_loss": -11.949236869812012, "global_step": 276714, "epoch": 1647} {"train_loss": -11.93292236328125, "global_step": 276715, "epoch": 1647} {"train_loss": -12.161643028259277, "global_step": 276716, "epoch": 1647} {"train_loss": -11.805540084838867, "global_step": 276717, "epoch": 1647} {"train_loss": -12.185748100280762, "global_step": 276718, "epoch": 1647} {"train_loss": -11.907663345336914, "global_step": 276719, "epoch": 1647} {"train_loss": -12.16289234161377, "global_step": 276720, "epoch": 1647} {"train_loss": -12.283227920532227, "global_step": 276721, "epoch": 1647} {"train_loss": -11.866344451904297, "global_step": 276722, "epoch": 1647} {"train_loss": -12.011564254760742, "global_step": 276723, "epoch": 1647} {"train_loss": -11.966716766357422, "global_step": 276724, "epoch": 1647} {"train_loss": -11.817882537841797, "global_step": 276725, "epoch": 1647} {"train_loss": -11.973838806152344, "global_step": 276726, "epoch": 1647} {"train_loss": -12.12215805053711, "global_step": 276727, "epoch": 1647} {"train_loss": -12.025219917297363, "global_step": 276728, "epoch": 1647} {"train_loss": -11.693700790405273, "global_step": 276729, "epoch": 1647} {"train_loss": -12.154138565063477, "global_step": 276730, "epoch": 1647} {"train_loss": -11.922351837158203, "global_step": 276731, "epoch": 1647} {"train_loss": -12.004913330078125, "global_step": 276732, "epoch": 1647} {"train_loss": -12.32457160949707, "global_step": 276733, "epoch": 1647} {"train_loss": -11.899824142456055, "global_step": 276734, "epoch": 1647} {"train_loss": -12.092472076416016, "global_step": 276735, "epoch": 1647} {"train_loss": -12.2461576461792, "global_step": 276736, "epoch": 1647} {"train_loss": -12.185328483581543, "global_step": 276737, "epoch": 1647} {"train_loss": -12.23239517211914, "global_step": 276738, "epoch": 1647} {"train_loss": -12.039159774780273, "global_step": 276739, "epoch": 1647} {"train_loss": -12.127518653869629, "global_step": 276740, "epoch": 1647} {"train_loss": -12.063375473022461, "global_step": 276741, "epoch": 1647} {"train_loss": -11.944207191467285, "global_step": 276742, "epoch": 1647} {"train_loss": -12.100663185119629, "global_step": 276743, "epoch": 1647} {"train_loss": -12.369546890258789, "global_step": 276744, "epoch": 1647} {"train_loss": -12.011955261230469, "global_step": 276745, "epoch": 1647} {"train_loss": -12.220964431762695, "global_step": 276746, "epoch": 1647} {"train_loss": -12.087766647338867, "global_step": 276747, "epoch": 1647} {"train_loss": -12.12333869934082, "global_step": 276748, "epoch": 1647} {"train_loss": -12.209446907043457, "global_step": 276749, "epoch": 1647} {"train_loss": -12.387619018554688, "global_step": 276750, "epoch": 1647} {"train_loss": -12.081857681274414, "global_step": 276751, "epoch": 1647} {"train_loss": -12.196971893310547, "global_step": 276752, "epoch": 1647} {"train_loss": -12.26655387878418, "global_step": 276753, "epoch": 1647} {"train_loss": -12.295072555541992, "global_step": 276754, "epoch": 1647} {"train_loss": -12.241065979003906, "global_step": 276755, "epoch": 1647} {"train_loss": -12.283136367797852, "global_step": 276756, "epoch": 1647} {"train_loss": -12.231922149658203, "global_step": 276757, "epoch": 1647} {"train_loss": -12.141656875610352, "global_step": 276758, "epoch": 1647} {"train_loss": -12.166268348693848, "global_step": 276759, "epoch": 1647} {"train_loss": -12.221342086791992, "global_step": 276760, "epoch": 1647} {"train_loss": -11.857978820800781, "global_step": 276761, "epoch": 1647} {"train_loss": -11.460387229919434, "global_step": 276762, "epoch": 1647} {"train_loss": -11.770845413208008, "global_step": 276763, "epoch": 1647} {"train_loss": -11.95840072631836, "global_step": 276764, "epoch": 1647} {"train_loss": -11.588106155395508, "global_step": 276765, "epoch": 1647} {"train_loss": -12.094728469848633, "global_step": 276766, "epoch": 1647} {"train_loss": -11.295494079589844, "global_step": 276767, "epoch": 1647} {"train_loss": -10.348245620727539, "global_step": 276768, "epoch": 1647} {"train_loss": -10.680068969726562, "global_step": 276769, "epoch": 1647} {"train_loss": -10.977642059326172, "global_step": 276770, "epoch": 1647} {"train_loss": -9.022655487060547, "global_step": 276771, "epoch": 1647} {"train_loss": -8.863200187683105, "global_step": 276772, "epoch": 1647} {"train_loss": -10.352327346801758, "global_step": 276773, "epoch": 1647} {"train_loss": -9.883056640625, "global_step": 276774, "epoch": 1647} {"train_loss": -10.301910400390625, "global_step": 276775, "epoch": 1647} {"train_loss": -8.944432258605957, "global_step": 276776, "epoch": 1647} {"train_loss": -11.036880493164062, "global_step": 276777, "epoch": 1647} {"train_loss": -9.433758735656738, "global_step": 276778, "epoch": 1647} {"train_loss": -10.593948364257812, "global_step": 276779, "epoch": 1647} {"train_loss": -10.654150009155273, "global_step": 276780, "epoch": 1647} {"train_loss": -10.969793319702148, "global_step": 276781, "epoch": 1647} {"train_loss": -10.150655746459961, "global_step": 276782, "epoch": 1647} {"train_loss": -11.367521286010742, "global_step": 276783, "epoch": 1647} {"train_loss": -11.125593185424805, "global_step": 276784, "epoch": 1647} {"train_loss": -10.939018249511719, "global_step": 276785, "epoch": 1647} {"train_loss": -11.168663024902344, "global_step": 276786, "epoch": 1647} {"train_loss": -11.582060813903809, "global_step": 276787, "epoch": 1647} {"train_loss": -11.286859512329102, "global_step": 276788, "epoch": 1647} {"train_loss": -11.552652359008789, "global_step": 276789, "epoch": 1647} {"train_loss": -11.611970901489258, "global_step": 276790, "epoch": 1647} {"train_loss": -11.065836906433105, "global_step": 276791, "epoch": 1647} {"train_loss": -11.079276084899902, "global_step": 276792, "epoch": 1647} {"train_loss": -11.145252227783203, "global_step": 276793, "epoch": 1647} {"train_loss": -10.520499229431152, "global_step": 276794, "epoch": 1647} {"train_loss": -11.599365234375, "global_step": 276795, "epoch": 1647} {"train_loss": -10.932028770446777, "global_step": 276796, "epoch": 1647} {"train_loss": -11.61421012878418, "global_step": 276797, "epoch": 1647} {"train_loss": -10.985477447509766, "global_step": 276798, "epoch": 1647} {"train_loss": -11.021280288696289, "global_step": 276799, "epoch": 1647} {"train_loss": -11.313955307006836, "global_step": 276800, "epoch": 1647} {"train_loss": -11.59052848815918, "global_step": 276801, "epoch": 1647} {"train_loss": -11.568150520324707, "global_step": 276802, "epoch": 1647} {"train_loss": -11.611373901367188, "global_step": 276803, "epoch": 1647} {"train_loss": -11.162701606750488, "global_step": 276804, "epoch": 1647} {"train_loss": -11.833562850952148, "global_step": 276805, "epoch": 1647} {"train_loss": -11.293882369995117, "global_step": 276806, "epoch": 1647} {"train_loss": -11.24561595916748, "global_step": 276807, "epoch": 1647} {"train_loss": -11.552248001098633, "global_step": 276808, "epoch": 1647} {"train_loss": -10.592296600341797, "global_step": 276809, "epoch": 1647} {"train_loss": -11.909713745117188, "global_step": 276810, "epoch": 1647} {"train_loss": -11.224358558654785, "global_step": 276811, "epoch": 1647} {"train_loss": -11.635114669799805, "global_step": 276812, "epoch": 1647} {"train_loss": -11.728416442871094, "global_step": 276813, "epoch": 1647} {"train_loss": -11.772071838378906, "global_step": 276814, "epoch": 1647} {"train_loss": -11.730629920959473, "global_step": 276815, "epoch": 1647} {"train_loss": -12.123531341552734, "global_step": 276816, "epoch": 1647} {"train_loss": -11.845405578613281, "global_step": 276817, "epoch": 1647} {"train_loss": -12.002979278564453, "global_step": 276818, "epoch": 1647} {"train_loss": -11.764015197753906, "global_step": 276819, "epoch": 1647} {"train_loss": -11.982881546020508, "global_step": 276820, "epoch": 1647} {"train_loss": -12.18945598602295, "global_step": 276821, "epoch": 1647} {"train_loss": -11.914624214172363, "global_step": 276822, "epoch": 1647} {"train_loss": -11.959997177124023, "global_step": 276823, "epoch": 1647} {"train_loss": -12.0877103805542, "global_step": 276824, "epoch": 1647} {"train_loss": -11.761802673339844, "global_step": 276825, "epoch": 1647} {"train_loss": -11.88079833984375, "global_step": 276826, "epoch": 1647} {"train_loss": -11.822111129760742, "global_step": 276827, "epoch": 1647} {"train_loss": -12.045879364013672, "global_step": 276828, "epoch": 1647} {"train_loss": -11.886455535888672, "global_step": 276829, "epoch": 1647} {"train_loss": -11.880857467651367, "global_step": 276830, "epoch": 1647} {"train_loss": -12.03168773651123, "global_step": 276831, "epoch": 1647} {"train_loss": -11.903165817260742, "global_step": 276832, "epoch": 1647} {"train_loss": -12.24636459350586, "global_step": 276833, "epoch": 1647} {"train_loss": -11.757628440856934, "global_step": 276834, "epoch": 1647} {"train_loss": -12.065465927124023, "global_step": 276835, "epoch": 1647} {"train_loss": -12.00954818725586, "global_step": 276836, "epoch": 1647} {"train_loss": -11.816773414611816, "global_step": 276837, "epoch": 1647} {"train_loss": -11.958560943603516, "global_step": 276838, "epoch": 1647} {"train_loss": -11.97854232788086, "global_step": 276839, "epoch": 1647} {"train_loss": -12.073830604553223, "global_step": 276840, "epoch": 1647} {"train_loss": -11.913222312927246, "global_step": 276841, "epoch": 1647} {"train_loss": -12.13192081451416, "global_step": 276842, "epoch": 1647} {"train_loss": -12.076472282409668, "global_step": 276843, "epoch": 1647} {"train_loss": -12.195722579956055, "global_step": 276844, "epoch": 1647} {"train_loss": -12.144405364990234, "global_step": 276845, "epoch": 1647} {"train_loss": -12.176570892333984, "global_step": 276846, "epoch": 1647} {"train_loss": -12.091009140014648, "global_step": 276847, "epoch": 1647} {"train_loss": -12.086451530456543, "global_step": 276848, "epoch": 1647} {"train_loss": -12.031984329223633, "global_step": 276849, "epoch": 1647} {"train_loss": -12.13609504699707, "global_step": 276850, "epoch": 1647} {"train_loss": -12.224912643432617, "global_step": 276851, "epoch": 1647} {"train_loss": -11.858399391174316, "global_step": 276852, "epoch": 1647} {"train_loss": -11.991926193237305, "global_step": 276853, "epoch": 1647} {"train_loss": -12.090139389038086, "global_step": 276854, "epoch": 1647} {"train_loss": -12.345142364501953, "global_step": 276855, "epoch": 1647} {"train_loss": -12.054475784301758, "global_step": 276856, "epoch": 1647} {"train_loss": -11.967924118041992, "global_step": 276857, "epoch": 1647} {"train_loss": -11.959390640258789, "global_step": 276858, "epoch": 1647} {"train_loss": -12.083734512329102, "global_step": 276859, "epoch": 1647} {"train_loss": -11.879918098449707, "global_step": 276860, "epoch": 1647} {"train_loss": -11.829733848571777, "global_step": 276861, "epoch": 1647} {"train_loss": -12.042789459228516, "global_step": 276862, "epoch": 1647} {"train_loss": -11.702002735365005, "global_step": 276863, "epoch": 1647, "val_loss": 276432.90625} {"train_loss": -11.97795295715332, "global_step": 276864, "epoch": 1648} {"train_loss": -12.16849136352539, "global_step": 276865, "epoch": 1648} {"train_loss": -12.198169708251953, "global_step": 276866, "epoch": 1648} {"train_loss": -12.104362487792969, "global_step": 276867, "epoch": 1648} {"train_loss": -11.821701049804688, "global_step": 276868, "epoch": 1648} {"train_loss": -12.23259162902832, "global_step": 276869, "epoch": 1648} {"train_loss": -12.391570091247559, "global_step": 276870, "epoch": 1648} {"train_loss": -11.7937650680542, "global_step": 276871, "epoch": 1648} {"train_loss": -11.718582153320312, "global_step": 276872, "epoch": 1648} {"train_loss": -11.566070556640625, "global_step": 276873, "epoch": 1648} {"train_loss": -12.148702621459961, "global_step": 276874, "epoch": 1648} {"train_loss": -11.662001609802246, "global_step": 276875, "epoch": 1648} {"train_loss": -11.55142593383789, "global_step": 276876, "epoch": 1648} {"train_loss": -12.142021179199219, "global_step": 276877, "epoch": 1648} {"train_loss": -11.467313766479492, "global_step": 276878, "epoch": 1648} {"train_loss": -11.964351654052734, "global_step": 276879, "epoch": 1648} {"train_loss": -10.939995765686035, "global_step": 276880, "epoch": 1648} {"train_loss": -11.024480819702148, "global_step": 276881, "epoch": 1648} {"train_loss": -10.74390983581543, "global_step": 276882, "epoch": 1648} {"train_loss": -11.625049591064453, "global_step": 276883, "epoch": 1648} {"train_loss": -10.138909339904785, "global_step": 276884, "epoch": 1648} {"train_loss": -10.87833309173584, "global_step": 276885, "epoch": 1648} {"train_loss": -10.706521987915039, "global_step": 276886, "epoch": 1648} {"train_loss": -8.857711791992188, "global_step": 276887, "epoch": 1648} {"train_loss": -10.693846702575684, "global_step": 276888, "epoch": 1648} {"train_loss": -11.483831405639648, "global_step": 276889, "epoch": 1648} {"train_loss": -10.837166786193848, "global_step": 276890, "epoch": 1648} {"train_loss": -11.690975189208984, "global_step": 276891, "epoch": 1648} {"train_loss": -11.117115020751953, "global_step": 276892, "epoch": 1648} {"train_loss": -10.623037338256836, "global_step": 276893, "epoch": 1648} {"train_loss": -12.041683197021484, "global_step": 276894, "epoch": 1648} {"train_loss": -10.866870880126953, "global_step": 276895, "epoch": 1648} {"train_loss": -11.536828994750977, "global_step": 276896, "epoch": 1648} {"train_loss": -11.672442436218262, "global_step": 276897, "epoch": 1648} {"train_loss": -10.846582412719727, "global_step": 276898, "epoch": 1648} {"train_loss": -11.579753875732422, "global_step": 276899, "epoch": 1648} {"train_loss": -11.617286682128906, "global_step": 276900, "epoch": 1648} {"train_loss": -11.599960327148438, "global_step": 276901, "epoch": 1648} {"train_loss": -11.20716667175293, "global_step": 276902, "epoch": 1648} {"train_loss": -10.844680786132812, "global_step": 276903, "epoch": 1648} {"train_loss": -10.166275024414062, "global_step": 276904, "epoch": 1648} {"train_loss": -9.539258003234863, "global_step": 276905, "epoch": 1648} {"train_loss": -10.877166748046875, "global_step": 276906, "epoch": 1648} {"train_loss": -9.473207473754883, "global_step": 276907, "epoch": 1648} {"train_loss": -11.385305404663086, "global_step": 276908, "epoch": 1648} {"train_loss": -8.605159759521484, "global_step": 276909, "epoch": 1648} {"train_loss": -9.541523933410645, "global_step": 276910, "epoch": 1648} {"train_loss": -10.029348373413086, "global_step": 276911, "epoch": 1648} {"train_loss": -11.318537712097168, "global_step": 276912, "epoch": 1648} {"train_loss": -9.906425476074219, "global_step": 276913, "epoch": 1648} {"train_loss": -10.319425582885742, "global_step": 276914, "epoch": 1648} {"train_loss": -11.183528900146484, "global_step": 276915, "epoch": 1648} {"train_loss": -10.435898780822754, "global_step": 276916, "epoch": 1648} {"train_loss": -11.167732238769531, "global_step": 276917, "epoch": 1648} {"train_loss": -11.469386100769043, "global_step": 276918, "epoch": 1648} {"train_loss": -11.079490661621094, "global_step": 276919, "epoch": 1648} {"train_loss": -10.8944730758667, "global_step": 276920, "epoch": 1648} {"train_loss": -10.59428882598877, "global_step": 276921, "epoch": 1648} {"train_loss": -10.148799896240234, "global_step": 276922, "epoch": 1648} {"train_loss": -11.65553092956543, "global_step": 276923, "epoch": 1648} {"train_loss": -11.266008377075195, "global_step": 276924, "epoch": 1648} {"train_loss": -10.44211483001709, "global_step": 276925, "epoch": 1648} {"train_loss": -11.835442543029785, "global_step": 276926, "epoch": 1648} {"train_loss": -10.959663391113281, "global_step": 276927, "epoch": 1648} {"train_loss": -10.909001350402832, "global_step": 276928, "epoch": 1648} {"train_loss": -11.465200424194336, "global_step": 276929, "epoch": 1648} {"train_loss": -10.847883224487305, "global_step": 276930, "epoch": 1648} {"train_loss": -11.398478507995605, "global_step": 276931, "epoch": 1648} {"train_loss": -11.504822731018066, "global_step": 276932, "epoch": 1648} {"train_loss": -11.280826568603516, "global_step": 276933, "epoch": 1648} {"train_loss": -11.530343055725098, "global_step": 276934, "epoch": 1648} {"train_loss": -11.709933280944824, "global_step": 276935, "epoch": 1648} {"train_loss": -11.447284698486328, "global_step": 276936, "epoch": 1648} {"train_loss": -11.627668380737305, "global_step": 276937, "epoch": 1648} {"train_loss": -11.901525497436523, "global_step": 276938, "epoch": 1648} {"train_loss": -11.724422454833984, "global_step": 276939, "epoch": 1648} {"train_loss": -11.746742248535156, "global_step": 276940, "epoch": 1648} {"train_loss": -11.925384521484375, "global_step": 276941, "epoch": 1648} {"train_loss": -11.578866004943848, "global_step": 276942, "epoch": 1648} {"train_loss": -11.480313301086426, "global_step": 276943, "epoch": 1648} {"train_loss": -12.008858680725098, "global_step": 276944, "epoch": 1648} {"train_loss": -11.581279754638672, "global_step": 276945, "epoch": 1648} {"train_loss": -11.943788528442383, "global_step": 276946, "epoch": 1648} {"train_loss": -12.060949325561523, "global_step": 276947, "epoch": 1648} {"train_loss": -11.809675216674805, "global_step": 276948, "epoch": 1648} {"train_loss": -11.888958930969238, "global_step": 276949, "epoch": 1648} {"train_loss": -11.929885864257812, "global_step": 276950, "epoch": 1648} {"train_loss": -11.91458797454834, "global_step": 276951, "epoch": 1648} {"train_loss": -11.75436782836914, "global_step": 276952, "epoch": 1648} {"train_loss": -11.844409942626953, "global_step": 276953, "epoch": 1648} {"train_loss": -12.011345863342285, "global_step": 276954, "epoch": 1648} {"train_loss": -11.97688102722168, "global_step": 276955, "epoch": 1648} {"train_loss": -11.803567886352539, "global_step": 276956, "epoch": 1648} {"train_loss": -12.149066925048828, "global_step": 276957, "epoch": 1648} {"train_loss": -12.230794906616211, "global_step": 276958, "epoch": 1648} {"train_loss": -12.096702575683594, "global_step": 276959, "epoch": 1648} {"train_loss": -11.919459342956543, "global_step": 276960, "epoch": 1648} {"train_loss": -12.073352813720703, "global_step": 276961, "epoch": 1648} {"train_loss": -12.213680267333984, "global_step": 276962, "epoch": 1648} {"train_loss": -12.12404727935791, "global_step": 276963, "epoch": 1648} {"train_loss": -12.238471984863281, "global_step": 276964, "epoch": 1648} {"train_loss": -12.237899780273438, "global_step": 276965, "epoch": 1648} {"train_loss": -12.175975799560547, "global_step": 276966, "epoch": 1648} {"train_loss": -12.210336685180664, "global_step": 276967, "epoch": 1648} {"train_loss": -11.836955070495605, "global_step": 276968, "epoch": 1648} {"train_loss": -12.281176567077637, "global_step": 276969, "epoch": 1648} {"train_loss": -12.309991836547852, "global_step": 276970, "epoch": 1648} {"train_loss": -12.034831047058105, "global_step": 276971, "epoch": 1648} {"train_loss": -12.170125961303711, "global_step": 276972, "epoch": 1648} {"train_loss": -12.217443466186523, "global_step": 276973, "epoch": 1648} {"train_loss": -12.150019645690918, "global_step": 276974, "epoch": 1648} {"train_loss": -12.229724884033203, "global_step": 276975, "epoch": 1648} {"train_loss": -12.021825790405273, "global_step": 276976, "epoch": 1648} {"train_loss": -12.149953842163086, "global_step": 276977, "epoch": 1648} {"train_loss": -12.220767974853516, "global_step": 276978, "epoch": 1648} {"train_loss": -12.297733306884766, "global_step": 276979, "epoch": 1648} {"train_loss": -12.061651229858398, "global_step": 276980, "epoch": 1648} {"train_loss": -12.253576278686523, "global_step": 276981, "epoch": 1648} {"train_loss": -12.401325225830078, "global_step": 276982, "epoch": 1648} {"train_loss": -12.035200119018555, "global_step": 276983, "epoch": 1648} {"train_loss": -12.146245956420898, "global_step": 276984, "epoch": 1648} {"train_loss": -12.43561840057373, "global_step": 276985, "epoch": 1648} {"train_loss": -12.485457420349121, "global_step": 276986, "epoch": 1648} {"train_loss": -11.96139144897461, "global_step": 276987, "epoch": 1648} {"train_loss": -11.796099662780762, "global_step": 276988, "epoch": 1648} {"train_loss": -11.890542030334473, "global_step": 276989, "epoch": 1648} {"train_loss": -11.917943954467773, "global_step": 276990, "epoch": 1648} {"train_loss": -11.894383430480957, "global_step": 276991, "epoch": 1648} {"train_loss": -12.070453643798828, "global_step": 276992, "epoch": 1648} {"train_loss": -11.841934204101562, "global_step": 276993, "epoch": 1648} {"train_loss": -9.942693710327148, "global_step": 276994, "epoch": 1648} {"train_loss": -10.259101867675781, "global_step": 276995, "epoch": 1648} {"train_loss": -11.830249786376953, "global_step": 276996, "epoch": 1648} {"train_loss": -11.03239631652832, "global_step": 276997, "epoch": 1648} {"train_loss": -10.69125747680664, "global_step": 276998, "epoch": 1648} {"train_loss": -11.683141708374023, "global_step": 276999, "epoch": 1648} {"train_loss": -11.372334480285645, "global_step": 277000, "epoch": 1648} {"train_loss": -11.158324241638184, "global_step": 277001, "epoch": 1648} {"train_loss": -11.794084548950195, "global_step": 277002, "epoch": 1648} {"train_loss": -11.47775650024414, "global_step": 277003, "epoch": 1648} {"train_loss": -11.050080299377441, "global_step": 277004, "epoch": 1648} {"train_loss": -11.604104995727539, "global_step": 277005, "epoch": 1648} {"train_loss": -11.466520309448242, "global_step": 277006, "epoch": 1648} {"train_loss": -11.233107566833496, "global_step": 277007, "epoch": 1648} {"train_loss": -11.874632835388184, "global_step": 277008, "epoch": 1648} {"train_loss": -11.4854154586792, "global_step": 277009, "epoch": 1648} {"train_loss": -11.710268020629883, "global_step": 277010, "epoch": 1648} {"train_loss": -11.845903396606445, "global_step": 277011, "epoch": 1648} {"train_loss": -12.104610443115234, "global_step": 277012, "epoch": 1648} {"train_loss": -12.18105697631836, "global_step": 277013, "epoch": 1648} {"train_loss": -12.103493690490723, "global_step": 277014, "epoch": 1648} {"train_loss": -11.996007919311523, "global_step": 277015, "epoch": 1648} {"train_loss": -12.137795448303223, "global_step": 277016, "epoch": 1648} {"train_loss": -12.124006271362305, "global_step": 277017, "epoch": 1648} {"train_loss": -12.206623077392578, "global_step": 277018, "epoch": 1648} {"train_loss": -12.172808647155762, "global_step": 277019, "epoch": 1648} {"train_loss": -12.059469223022461, "global_step": 277020, "epoch": 1648} {"train_loss": -12.408470153808594, "global_step": 277021, "epoch": 1648} {"train_loss": -12.050154685974121, "global_step": 277022, "epoch": 1648} {"train_loss": -12.313785552978516, "global_step": 277023, "epoch": 1648} {"train_loss": -11.979297637939453, "global_step": 277024, "epoch": 1648} {"train_loss": -12.156266212463379, "global_step": 277025, "epoch": 1648} {"train_loss": -12.23927116394043, "global_step": 277026, "epoch": 1648} {"train_loss": -12.08807373046875, "global_step": 277027, "epoch": 1648} {"train_loss": -12.138832092285156, "global_step": 277028, "epoch": 1648} {"train_loss": -12.15713119506836, "global_step": 277029, "epoch": 1648} {"train_loss": -11.997968673706055, "global_step": 277030, "epoch": 1648} {"train_loss": -11.569972918147133, "global_step": 277031, "epoch": 1648, "val_loss": 275017.5} {"train_loss": -12.170721054077148, "global_step": 277032, "epoch": 1649} {"train_loss": -12.039909362792969, "global_step": 277033, "epoch": 1649} {"train_loss": -12.084125518798828, "global_step": 277034, "epoch": 1649} {"train_loss": -12.193228721618652, "global_step": 277035, "epoch": 1649} {"train_loss": -12.121501922607422, "global_step": 277036, "epoch": 1649} {"train_loss": -12.268838882446289, "global_step": 277037, "epoch": 1649} {"train_loss": -12.218772888183594, "global_step": 277038, "epoch": 1649} {"train_loss": -12.129796981811523, "global_step": 277039, "epoch": 1649} {"train_loss": -12.283784866333008, "global_step": 277040, "epoch": 1649} {"train_loss": -12.19975471496582, "global_step": 277041, "epoch": 1649} {"train_loss": -12.220890998840332, "global_step": 277042, "epoch": 1649} {"train_loss": -12.037054061889648, "global_step": 277043, "epoch": 1649} {"train_loss": -12.312402725219727, "global_step": 277044, "epoch": 1649} {"train_loss": -12.26036262512207, "global_step": 277045, "epoch": 1649} {"train_loss": -12.149539947509766, "global_step": 277046, "epoch": 1649} {"train_loss": -11.793468475341797, "global_step": 277047, "epoch": 1649} {"train_loss": -11.182781219482422, "global_step": 277048, "epoch": 1649} {"train_loss": -11.82732105255127, "global_step": 277049, "epoch": 1649} {"train_loss": -12.166715621948242, "global_step": 277050, "epoch": 1649} {"train_loss": -10.82785415649414, "global_step": 277051, "epoch": 1649} {"train_loss": -11.40689468383789, "global_step": 277052, "epoch": 1649} {"train_loss": -11.656795501708984, "global_step": 277053, "epoch": 1649} {"train_loss": -9.73353099822998, "global_step": 277054, "epoch": 1649} {"train_loss": -10.231718063354492, "global_step": 277055, "epoch": 1649} {"train_loss": -11.478385925292969, "global_step": 277056, "epoch": 1649} {"train_loss": -10.643962860107422, "global_step": 277057, "epoch": 1649} {"train_loss": -11.49261474609375, "global_step": 277058, "epoch": 1649} {"train_loss": -9.71852970123291, "global_step": 277059, "epoch": 1649} {"train_loss": -10.692387580871582, "global_step": 277060, "epoch": 1649} {"train_loss": -10.254331588745117, "global_step": 277061, "epoch": 1649} {"train_loss": -10.375779151916504, "global_step": 277062, "epoch": 1649} {"train_loss": -11.111553192138672, "global_step": 277063, "epoch": 1649} {"train_loss": -10.251554489135742, "global_step": 277064, "epoch": 1649} {"train_loss": -10.786155700683594, "global_step": 277065, "epoch": 1649} {"train_loss": -10.533733367919922, "global_step": 277066, "epoch": 1649} {"train_loss": -10.656249046325684, "global_step": 277067, "epoch": 1649} {"train_loss": -9.344600677490234, "global_step": 277068, "epoch": 1649} {"train_loss": -9.83287239074707, "global_step": 277069, "epoch": 1649} {"train_loss": -9.107124328613281, "global_step": 277070, "epoch": 1649} {"train_loss": -9.790042877197266, "global_step": 277071, "epoch": 1649} {"train_loss": -9.360152244567871, "global_step": 277072, "epoch": 1649} {"train_loss": -9.40128231048584, "global_step": 277073, "epoch": 1649} {"train_loss": -9.371905326843262, "global_step": 277074, "epoch": 1649} {"train_loss": -10.658271789550781, "global_step": 277075, "epoch": 1649} {"train_loss": -9.427515983581543, "global_step": 277076, "epoch": 1649} {"train_loss": -8.94389820098877, "global_step": 277077, "epoch": 1649} {"train_loss": -11.306495666503906, "global_step": 277078, "epoch": 1649} {"train_loss": -10.252073287963867, "global_step": 277079, "epoch": 1649} {"train_loss": -9.990304946899414, "global_step": 277080, "epoch": 1649} {"train_loss": -9.787311553955078, "global_step": 277081, "epoch": 1649} {"train_loss": -10.796157836914062, "global_step": 277082, "epoch": 1649} {"train_loss": -10.674053192138672, "global_step": 277083, "epoch": 1649} {"train_loss": -10.807321548461914, "global_step": 277084, "epoch": 1649} {"train_loss": -10.776949882507324, "global_step": 277085, "epoch": 1649} {"train_loss": -11.077829360961914, "global_step": 277086, "epoch": 1649} {"train_loss": -11.081949234008789, "global_step": 277087, "epoch": 1649} {"train_loss": -11.132381439208984, "global_step": 277088, "epoch": 1649} {"train_loss": -10.598831176757812, "global_step": 277089, "epoch": 1649} {"train_loss": -10.94155502319336, "global_step": 277090, "epoch": 1649} {"train_loss": -10.326152801513672, "global_step": 277091, "epoch": 1649} {"train_loss": -10.464820861816406, "global_step": 277092, "epoch": 1649} {"train_loss": -11.246064186096191, "global_step": 277093, "epoch": 1649} {"train_loss": -10.804283142089844, "global_step": 277094, "epoch": 1649} {"train_loss": -10.472696304321289, "global_step": 277095, "epoch": 1649} {"train_loss": -11.494767189025879, "global_step": 277096, "epoch": 1649} {"train_loss": -11.076878547668457, "global_step": 277097, "epoch": 1649} {"train_loss": -10.436857223510742, "global_step": 277098, "epoch": 1649} {"train_loss": -11.367626190185547, "global_step": 277099, "epoch": 1649} {"train_loss": -11.005228042602539, "global_step": 277100, "epoch": 1649} {"train_loss": -10.445194244384766, "global_step": 277101, "epoch": 1649} {"train_loss": -11.577659606933594, "global_step": 277102, "epoch": 1649} {"train_loss": -11.612098693847656, "global_step": 277103, "epoch": 1649} {"train_loss": -11.02463150024414, "global_step": 277104, "epoch": 1649} {"train_loss": -11.811562538146973, "global_step": 277105, "epoch": 1649} {"train_loss": -11.485966682434082, "global_step": 277106, "epoch": 1649} {"train_loss": -11.536864280700684, "global_step": 277107, "epoch": 1649} {"train_loss": -11.693603515625, "global_step": 277108, "epoch": 1649} {"train_loss": -11.770282745361328, "global_step": 277109, "epoch": 1649} {"train_loss": -11.764829635620117, "global_step": 277110, "epoch": 1649} {"train_loss": -11.456245422363281, "global_step": 277111, "epoch": 1649} {"train_loss": -11.72166633605957, "global_step": 277112, "epoch": 1649} {"train_loss": -11.72774887084961, "global_step": 277113, "epoch": 1649} {"train_loss": -11.753229141235352, "global_step": 277114, "epoch": 1649} {"train_loss": -11.937515258789062, "global_step": 277115, "epoch": 1649} {"train_loss": -11.871271133422852, "global_step": 277116, "epoch": 1649} {"train_loss": -11.625131607055664, "global_step": 277117, "epoch": 1649} {"train_loss": -11.794736862182617, "global_step": 277118, "epoch": 1649} {"train_loss": -11.900992393493652, "global_step": 277119, "epoch": 1649} {"train_loss": -11.922563552856445, "global_step": 277120, "epoch": 1649} {"train_loss": -11.870945930480957, "global_step": 277121, "epoch": 1649} {"train_loss": -11.983444213867188, "global_step": 277122, "epoch": 1649} {"train_loss": -12.014947891235352, "global_step": 277123, "epoch": 1649} {"train_loss": -11.886198043823242, "global_step": 277124, "epoch": 1649} {"train_loss": -11.747932434082031, "global_step": 277125, "epoch": 1649} {"train_loss": -11.99592399597168, "global_step": 277126, "epoch": 1649} {"train_loss": -11.893811225891113, "global_step": 277127, "epoch": 1649} {"train_loss": -11.894876480102539, "global_step": 277128, "epoch": 1649} {"train_loss": -11.911931037902832, "global_step": 277129, "epoch": 1649} {"train_loss": -11.823452949523926, "global_step": 277130, "epoch": 1649} {"train_loss": -11.918024063110352, "global_step": 277131, "epoch": 1649} {"train_loss": -11.990086555480957, "global_step": 277132, "epoch": 1649} {"train_loss": -11.911247253417969, "global_step": 277133, "epoch": 1649} {"train_loss": -11.985156059265137, "global_step": 277134, "epoch": 1649} {"train_loss": -11.91264820098877, "global_step": 277135, "epoch": 1649} {"train_loss": -12.036314010620117, "global_step": 277136, "epoch": 1649} {"train_loss": -11.86345386505127, "global_step": 277137, "epoch": 1649} {"train_loss": -12.079198837280273, "global_step": 277138, "epoch": 1649} {"train_loss": -11.871910095214844, "global_step": 277139, "epoch": 1649} {"train_loss": -12.220918655395508, "global_step": 277140, "epoch": 1649} {"train_loss": -12.0586576461792, "global_step": 277141, "epoch": 1649} {"train_loss": -12.082742691040039, "global_step": 277142, "epoch": 1649} {"train_loss": -12.095664024353027, "global_step": 277143, "epoch": 1649} {"train_loss": -12.22636890411377, "global_step": 277144, "epoch": 1649} {"train_loss": -12.253868103027344, "global_step": 277145, "epoch": 1649} {"train_loss": -12.013223648071289, "global_step": 277146, "epoch": 1649} {"train_loss": -12.093489646911621, "global_step": 277147, "epoch": 1649} {"train_loss": -12.243751525878906, "global_step": 277148, "epoch": 1649} {"train_loss": -12.163431167602539, "global_step": 277149, "epoch": 1649} {"train_loss": -12.032217979431152, "global_step": 277150, "epoch": 1649} {"train_loss": -11.993207931518555, "global_step": 277151, "epoch": 1649} {"train_loss": -12.1783447265625, "global_step": 277152, "epoch": 1649} {"train_loss": -12.322103500366211, "global_step": 277153, "epoch": 1649} {"train_loss": -12.107948303222656, "global_step": 277154, "epoch": 1649} {"train_loss": -12.09786605834961, "global_step": 277155, "epoch": 1649} {"train_loss": -12.20556640625, "global_step": 277156, "epoch": 1649} {"train_loss": -12.252819061279297, "global_step": 277157, "epoch": 1649} {"train_loss": -12.202310562133789, "global_step": 277158, "epoch": 1649} {"train_loss": -12.294692993164062, "global_step": 277159, "epoch": 1649} {"train_loss": -12.363000869750977, "global_step": 277160, "epoch": 1649} {"train_loss": -12.080362319946289, "global_step": 277161, "epoch": 1649} {"train_loss": -12.355722427368164, "global_step": 277162, "epoch": 1649} {"train_loss": -12.264086723327637, "global_step": 277163, "epoch": 1649} {"train_loss": -12.312898635864258, "global_step": 277164, "epoch": 1649} {"train_loss": -12.423669815063477, "global_step": 277165, "epoch": 1649} {"train_loss": -12.164113998413086, "global_step": 277166, "epoch": 1649} {"train_loss": -11.946784973144531, "global_step": 277167, "epoch": 1649} {"train_loss": -12.100361824035645, "global_step": 277168, "epoch": 1649} {"train_loss": -12.020761489868164, "global_step": 277169, "epoch": 1649} {"train_loss": -11.902792930603027, "global_step": 277170, "epoch": 1649} {"train_loss": -12.242475509643555, "global_step": 277171, "epoch": 1649} {"train_loss": -12.111459732055664, "global_step": 277172, "epoch": 1649} {"train_loss": -12.378837585449219, "global_step": 277173, "epoch": 1649} {"train_loss": -12.075699806213379, "global_step": 277174, "epoch": 1649} {"train_loss": -12.561997413635254, "global_step": 277175, "epoch": 1649} {"train_loss": -12.362497329711914, "global_step": 277176, "epoch": 1649} {"train_loss": -11.9613676071167, "global_step": 277177, "epoch": 1649} {"train_loss": -11.946989059448242, "global_step": 277178, "epoch": 1649} {"train_loss": -10.447707176208496, "global_step": 277179, "epoch": 1649} {"train_loss": -11.017823219299316, "global_step": 277180, "epoch": 1649} {"train_loss": -10.553000450134277, "global_step": 277181, "epoch": 1649} {"train_loss": -12.045025825500488, "global_step": 277182, "epoch": 1649} {"train_loss": -9.49276351928711, "global_step": 277183, "epoch": 1649} {"train_loss": -11.889837265014648, "global_step": 277184, "epoch": 1649} {"train_loss": -10.841371536254883, "global_step": 277185, "epoch": 1649} {"train_loss": -11.819433212280273, "global_step": 277186, "epoch": 1649} {"train_loss": -11.328899383544922, "global_step": 277187, "epoch": 1649} {"train_loss": -10.92148208618164, "global_step": 277188, "epoch": 1649} {"train_loss": -11.094860076904297, "global_step": 277189, "epoch": 1649} {"train_loss": -11.535791397094727, "global_step": 277190, "epoch": 1649} {"train_loss": -11.043667793273926, "global_step": 277191, "epoch": 1649} {"train_loss": -10.72224235534668, "global_step": 277192, "epoch": 1649} {"train_loss": -11.430996894836426, "global_step": 277193, "epoch": 1649} {"train_loss": -11.708108901977539, "global_step": 277194, "epoch": 1649} {"train_loss": -11.602458953857422, "global_step": 277195, "epoch": 1649} {"train_loss": -11.062417984008789, "global_step": 277196, "epoch": 1649} {"train_loss": -12.036138534545898, "global_step": 277197, "epoch": 1649} {"train_loss": -10.861013412475586, "global_step": 277198, "epoch": 1649} {"train_loss": -11.451218298503331, "global_step": 277199, "epoch": 1649, "val_loss": 273521.40625} {"train_loss": -11.07321548461914, "global_step": 277200, "epoch": 1650} {"train_loss": -11.279626846313477, "global_step": 277201, "epoch": 1650} {"train_loss": -11.893722534179688, "global_step": 277202, "epoch": 1650} {"train_loss": -12.052804946899414, "global_step": 277203, "epoch": 1650} {"train_loss": -11.924271583557129, "global_step": 277204, "epoch": 1650} {"train_loss": -11.566117286682129, "global_step": 277205, "epoch": 1650} {"train_loss": -11.86785888671875, "global_step": 277206, "epoch": 1650} {"train_loss": -11.601310729980469, "global_step": 277207, "epoch": 1650} {"train_loss": -11.570220947265625, "global_step": 277208, "epoch": 1650} {"train_loss": -11.924115180969238, "global_step": 277209, "epoch": 1650} {"train_loss": -11.520222663879395, "global_step": 277210, "epoch": 1650} {"train_loss": -11.28348159790039, "global_step": 277211, "epoch": 1650} {"train_loss": -12.080745697021484, "global_step": 277212, "epoch": 1650} {"train_loss": -11.569597244262695, "global_step": 277213, "epoch": 1650} {"train_loss": -10.952116012573242, "global_step": 277214, "epoch": 1650} {"train_loss": -11.90214729309082, "global_step": 277215, "epoch": 1650} {"train_loss": -12.173696517944336, "global_step": 277216, "epoch": 1650} {"train_loss": -11.984708786010742, "global_step": 277217, "epoch": 1650} {"train_loss": -12.087698936462402, "global_step": 277218, "epoch": 1650} {"train_loss": -12.256731033325195, "global_step": 277219, "epoch": 1650} {"train_loss": -11.786773681640625, "global_step": 277220, "epoch": 1650} {"train_loss": -12.026119232177734, "global_step": 277221, "epoch": 1650} {"train_loss": -11.96763801574707, "global_step": 277222, "epoch": 1650} {"train_loss": -12.07014274597168, "global_step": 277223, "epoch": 1650} {"train_loss": -11.965471267700195, "global_step": 277224, "epoch": 1650} {"train_loss": -12.093417167663574, "global_step": 277225, "epoch": 1650} {"train_loss": -11.756394386291504, "global_step": 277226, "epoch": 1650} {"train_loss": -12.347789764404297, "global_step": 277227, "epoch": 1650} {"train_loss": -11.723861694335938, "global_step": 277228, "epoch": 1650} {"train_loss": -12.204748153686523, "global_step": 277229, "epoch": 1650} {"train_loss": -12.204862594604492, "global_step": 277230, "epoch": 1650} {"train_loss": -11.798591613769531, "global_step": 277231, "epoch": 1650} {"train_loss": -12.056331634521484, "global_step": 277232, "epoch": 1650} {"train_loss": -12.098384857177734, "global_step": 277233, "epoch": 1650} {"train_loss": -11.897677421569824, "global_step": 277234, "epoch": 1650} {"train_loss": -12.182943344116211, "global_step": 277235, "epoch": 1650} {"train_loss": -11.969684600830078, "global_step": 277236, "epoch": 1650} {"train_loss": -11.940300941467285, "global_step": 277237, "epoch": 1650} {"train_loss": -12.250798225402832, "global_step": 277238, "epoch": 1650} {"train_loss": -11.870643615722656, "global_step": 277239, "epoch": 1650} {"train_loss": -11.924195289611816, "global_step": 277240, "epoch": 1650} {"train_loss": -12.351776123046875, "global_step": 277241, "epoch": 1650} {"train_loss": -11.946693420410156, "global_step": 277242, "epoch": 1650} {"train_loss": -12.245259284973145, "global_step": 277243, "epoch": 1650} {"train_loss": -11.947233200073242, "global_step": 277244, "epoch": 1650} {"train_loss": -12.318334579467773, "global_step": 277245, "epoch": 1650} {"train_loss": -11.983726501464844, "global_step": 277246, "epoch": 1650} {"train_loss": -12.345632553100586, "global_step": 277247, "epoch": 1650} {"train_loss": -12.060101509094238, "global_step": 277248, "epoch": 1650} {"train_loss": -12.191095352172852, "global_step": 277249, "epoch": 1650} {"train_loss": -11.966678619384766, "global_step": 277250, "epoch": 1650} {"train_loss": -12.303933143615723, "global_step": 277251, "epoch": 1650} {"train_loss": -12.107797622680664, "global_step": 277252, "epoch": 1650} {"train_loss": -11.314645767211914, "global_step": 277253, "epoch": 1650} {"train_loss": -10.853245735168457, "global_step": 277254, "epoch": 1650} {"train_loss": -11.759430885314941, "global_step": 277255, "epoch": 1650} {"train_loss": -12.05081558227539, "global_step": 277256, "epoch": 1650} {"train_loss": -12.055602073669434, "global_step": 277257, "epoch": 1650} {"train_loss": -11.851607322692871, "global_step": 277258, "epoch": 1650} {"train_loss": -12.13280963897705, "global_step": 277259, "epoch": 1650} {"train_loss": -11.883017539978027, "global_step": 277260, "epoch": 1650} {"train_loss": -11.570077896118164, "global_step": 277261, "epoch": 1650} {"train_loss": -11.735416412353516, "global_step": 277262, "epoch": 1650} {"train_loss": -11.728133201599121, "global_step": 277263, "epoch": 1650} {"train_loss": -10.623050689697266, "global_step": 277264, "epoch": 1650} {"train_loss": -12.084805488586426, "global_step": 277265, "epoch": 1650} {"train_loss": -10.87923812866211, "global_step": 277266, "epoch": 1650} {"train_loss": -11.77785873413086, "global_step": 277267, "epoch": 1650} {"train_loss": -11.809040069580078, "global_step": 277268, "epoch": 1650} {"train_loss": -11.754210472106934, "global_step": 277269, "epoch": 1650} {"train_loss": -11.926758766174316, "global_step": 277270, "epoch": 1650} {"train_loss": -11.755960464477539, "global_step": 277271, "epoch": 1650} {"train_loss": -11.365335464477539, "global_step": 277272, "epoch": 1650} {"train_loss": -11.229848861694336, "global_step": 277273, "epoch": 1650} {"train_loss": -11.427891731262207, "global_step": 277274, "epoch": 1650} {"train_loss": -10.112977981567383, "global_step": 277275, "epoch": 1650} {"train_loss": -10.618375778198242, "global_step": 277276, "epoch": 1650} {"train_loss": -9.715694427490234, "global_step": 277277, "epoch": 1650} {"train_loss": -11.638412475585938, "global_step": 277278, "epoch": 1650} {"train_loss": -7.833152770996094, "global_step": 277279, "epoch": 1650} {"train_loss": -8.715374946594238, "global_step": 277280, "epoch": 1650} {"train_loss": -8.473791122436523, "global_step": 277281, "epoch": 1650} {"train_loss": -9.843501091003418, "global_step": 277282, "epoch": 1650} {"train_loss": -9.480123519897461, "global_step": 277283, "epoch": 1650} {"train_loss": -8.233732223510742, "global_step": 277284, "epoch": 1650} {"train_loss": -10.512073516845703, "global_step": 277285, "epoch": 1650} {"train_loss": -10.083370208740234, "global_step": 277286, "epoch": 1650} {"train_loss": -9.84709644317627, "global_step": 277287, "epoch": 1650} {"train_loss": -9.852359771728516, "global_step": 277288, "epoch": 1650} {"train_loss": -10.842103958129883, "global_step": 277289, "epoch": 1650} {"train_loss": -10.406122207641602, "global_step": 277290, "epoch": 1650} {"train_loss": -10.80189323425293, "global_step": 277291, "epoch": 1650} {"train_loss": -9.841331481933594, "global_step": 277292, "epoch": 1650} {"train_loss": -9.53839111328125, "global_step": 277293, "epoch": 1650} {"train_loss": -11.072736740112305, "global_step": 277294, "epoch": 1650} {"train_loss": -10.442229270935059, "global_step": 277295, "epoch": 1650} {"train_loss": -10.826040267944336, "global_step": 277296, "epoch": 1650} {"train_loss": -11.197370529174805, "global_step": 277297, "epoch": 1650} {"train_loss": -11.413511276245117, "global_step": 277298, "epoch": 1650} {"train_loss": -10.68562126159668, "global_step": 277299, "epoch": 1650} {"train_loss": -11.745454788208008, "global_step": 277300, "epoch": 1650} {"train_loss": -10.999215126037598, "global_step": 277301, "epoch": 1650} {"train_loss": -11.529273986816406, "global_step": 277302, "epoch": 1650} {"train_loss": -11.432624816894531, "global_step": 277303, "epoch": 1650} {"train_loss": -11.46015453338623, "global_step": 277304, "epoch": 1650} {"train_loss": -11.348008155822754, "global_step": 277305, "epoch": 1650} {"train_loss": -11.431295394897461, "global_step": 277306, "epoch": 1650} {"train_loss": -11.632903099060059, "global_step": 277307, "epoch": 1650} {"train_loss": -11.730080604553223, "global_step": 277308, "epoch": 1650} {"train_loss": -11.671037673950195, "global_step": 277309, "epoch": 1650} {"train_loss": -11.547121047973633, "global_step": 277310, "epoch": 1650} {"train_loss": -11.804372787475586, "global_step": 277311, "epoch": 1650} {"train_loss": -11.53246784210205, "global_step": 277312, "epoch": 1650} {"train_loss": -11.77816390991211, "global_step": 277313, "epoch": 1650} {"train_loss": -11.820085525512695, "global_step": 277314, "epoch": 1650} {"train_loss": -11.685165405273438, "global_step": 277315, "epoch": 1650} {"train_loss": -11.685930252075195, "global_step": 277316, "epoch": 1650} {"train_loss": -11.827951431274414, "global_step": 277317, "epoch": 1650} {"train_loss": -12.01822280883789, "global_step": 277318, "epoch": 1650} {"train_loss": -12.076720237731934, "global_step": 277319, "epoch": 1650} {"train_loss": -11.845643043518066, "global_step": 277320, "epoch": 1650} {"train_loss": -11.703559875488281, "global_step": 277321, "epoch": 1650} {"train_loss": -12.004972457885742, "global_step": 277322, "epoch": 1650} {"train_loss": -11.849969863891602, "global_step": 277323, "epoch": 1650} {"train_loss": -11.94202995300293, "global_step": 277324, "epoch": 1650} {"train_loss": -11.834781646728516, "global_step": 277325, "epoch": 1650} {"train_loss": -12.01162338256836, "global_step": 277326, "epoch": 1650} {"train_loss": -11.91826057434082, "global_step": 277327, "epoch": 1650} {"train_loss": -12.132206916809082, "global_step": 277328, "epoch": 1650} {"train_loss": -12.022995948791504, "global_step": 277329, "epoch": 1650} {"train_loss": -11.899150848388672, "global_step": 277330, "epoch": 1650} {"train_loss": -12.08833122253418, "global_step": 277331, "epoch": 1650} {"train_loss": -11.910788536071777, "global_step": 277332, "epoch": 1650} {"train_loss": -11.814321517944336, "global_step": 277333, "epoch": 1650} {"train_loss": -12.025673866271973, "global_step": 277334, "epoch": 1650} {"train_loss": -12.085775375366211, "global_step": 277335, "epoch": 1650} {"train_loss": -11.97538948059082, "global_step": 277336, "epoch": 1650} {"train_loss": -12.053167343139648, "global_step": 277337, "epoch": 1650} {"train_loss": -12.158164978027344, "global_step": 277338, "epoch": 1650} {"train_loss": -12.177181243896484, "global_step": 277339, "epoch": 1650} {"train_loss": -12.03955078125, "global_step": 277340, "epoch": 1650} {"train_loss": -12.178045272827148, "global_step": 277341, "epoch": 1650} {"train_loss": -12.175016403198242, "global_step": 277342, "epoch": 1650} {"train_loss": -12.154657363891602, "global_step": 277343, "epoch": 1650} {"train_loss": -11.968238830566406, "global_step": 277344, "epoch": 1650} {"train_loss": -12.061928749084473, "global_step": 277345, "epoch": 1650} {"train_loss": -12.025344848632812, "global_step": 277346, "epoch": 1650} {"train_loss": -11.96356201171875, "global_step": 277347, "epoch": 1650} {"train_loss": -12.060882568359375, "global_step": 277348, "epoch": 1650} {"train_loss": -12.06297492980957, "global_step": 277349, "epoch": 1650} {"train_loss": -11.978589057922363, "global_step": 277350, "epoch": 1650} {"train_loss": -12.206961631774902, "global_step": 277351, "epoch": 1650} {"train_loss": -12.30828857421875, "global_step": 277352, "epoch": 1650} {"train_loss": -11.847949981689453, "global_step": 277353, "epoch": 1650} {"train_loss": -11.99616527557373, "global_step": 277354, "epoch": 1650} {"train_loss": -12.081249237060547, "global_step": 277355, "epoch": 1650} {"train_loss": -12.088095664978027, "global_step": 277356, "epoch": 1650} {"train_loss": -12.218539237976074, "global_step": 277357, "epoch": 1650} {"train_loss": -12.259675979614258, "global_step": 277358, "epoch": 1650} {"train_loss": -12.116361618041992, "global_step": 277359, "epoch": 1650} {"train_loss": -12.264001846313477, "global_step": 277360, "epoch": 1650} {"train_loss": -12.191581726074219, "global_step": 277361, "epoch": 1650} {"train_loss": -12.123748779296875, "global_step": 277362, "epoch": 1650} {"train_loss": -11.9482421875, "global_step": 277363, "epoch": 1650} {"train_loss": -11.76580810546875, "global_step": 277364, "epoch": 1650} {"train_loss": -11.694330215454102, "global_step": 277365, "epoch": 1650} {"train_loss": -11.652708053588867, "global_step": 277366, "epoch": 1650} {"train_loss": -11.60633306843894, "global_step": 277367, "epoch": 1650, "train/sim_max_reward_0": 0.9737629803750709, "train/sim_max_reward_1": 0.8859898828923052, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.4498783588730226, "train/sim_max_reward_4": 0.9532994059952205, "train/sim_max_reward_5": 0.2036364797377513, "test/sim_max_reward_4400000": 0.9887914852331957, "test/sim_max_reward_4400001": 0.3728000097722279, "test/sim_max_reward_4400002": 0.9755991299165245, "test/sim_max_reward_4400003": 0.03999383635987242, "test/sim_max_reward_4400004": 0.4116562970831811, "test/sim_max_reward_4400005": 0.6689633173878208, "test/sim_max_reward_4400006": 0.27538435516288834, "test/sim_max_reward_4400007": 0.4904413845803266, "test/sim_max_reward_4400008": 0.696556456143506, "test/sim_max_reward_4400009": 0.3402782546096005, "test/sim_max_reward_4400010": 0.9940955715041931, "test/sim_max_reward_4400011": 0.28646022263110754, "test/sim_max_reward_4400012": 0.9843375201324639, "test/sim_max_reward_4400013": 0.9739162051690862, "test/sim_max_reward_4400014": 0.9744540730911562, "test/sim_max_reward_4400015": 0.27900830164480744, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.11675944466257261, "test/sim_max_reward_4400018": 0.9967175711632763, "test/sim_max_reward_4400019": 0.5862081870423378, "test/sim_max_reward_4400020": 0.3293273359403163, "test/sim_max_reward_4400021": 0.9743374726641963, "test/sim_max_reward_4400022": 0.9555690515605739, "test/sim_max_reward_4400023": 0.9825735020279258, "test/sim_max_reward_4400024": 0.9961657623168075, "test/sim_max_reward_4400025": 0.5488177987945969, "test/sim_max_reward_4400026": 0.057557137314668855, "test/sim_max_reward_4400027": 0.4421877907341756, "test/sim_max_reward_4400028": 0.7036182233324516, "test/sim_max_reward_4400029": 0.6300823713331541, "test/sim_max_reward_4400030": 0.9660517049232753, "test/sim_max_reward_4400031": 0.9965296084073134, "test/sim_max_reward_4400032": 0.12878158794415898, "test/sim_max_reward_4400033": 0.38308560328020164, "test/sim_max_reward_4400034": 0.5002254695499843, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.3655108407148261, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.3154656278589681, "test/sim_max_reward_4400039": 0.9635068494980711, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.16444135588572775, "test/sim_max_reward_4400042": 0.06229146956926054, "test/sim_max_reward_4400043": 0.9839782959207857, "test/sim_max_reward_4400044": 0.6322290877025757, "test/sim_max_reward_4400045": 0.4979837980180886, "test/sim_max_reward_4400046": 0.9620829785759384, "test/sim_max_reward_4400047": 0.9941853003756244, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.3574051828115779, "train/mean_score": 0.5777611846455617, "test/mean_score": 0.5726147682943483, "val_loss": 273635.3125, "train_action_mse_error": 2.052745819091797} {"train_loss": -10.848381042480469, "global_step": 277368, "epoch": 1651} {"train_loss": -10.998197555541992, "global_step": 277369, "epoch": 1651} {"train_loss": -11.35837173461914, "global_step": 277370, "epoch": 1651} {"train_loss": -10.31797981262207, "global_step": 277371, "epoch": 1651} {"train_loss": -10.952482223510742, "global_step": 277372, "epoch": 1651} {"train_loss": -11.306585311889648, "global_step": 277373, "epoch": 1651} {"train_loss": -9.015091896057129, "global_step": 277374, "epoch": 1651} {"train_loss": -10.257261276245117, "global_step": 277375, "epoch": 1651} {"train_loss": -8.802535057067871, "global_step": 277376, "epoch": 1651} {"train_loss": -8.361307144165039, "global_step": 277377, "epoch": 1651} {"train_loss": -8.29937744140625, "global_step": 277378, "epoch": 1651} {"train_loss": -8.023200988769531, "global_step": 277379, "epoch": 1651} {"train_loss": -9.77664566040039, "global_step": 277380, "epoch": 1651} {"train_loss": -9.745172500610352, "global_step": 277381, "epoch": 1651} {"train_loss": -8.014263153076172, "global_step": 277382, "epoch": 1651} {"train_loss": -8.90212345123291, "global_step": 277383, "epoch": 1651} {"train_loss": -7.4930009841918945, "global_step": 277384, "epoch": 1651} {"train_loss": -9.900854110717773, "global_step": 277385, "epoch": 1651} {"train_loss": -8.303605079650879, "global_step": 277386, "epoch": 1651} {"train_loss": -9.731870651245117, "global_step": 277387, "epoch": 1651} {"train_loss": -9.014202117919922, "global_step": 277388, "epoch": 1651} {"train_loss": -10.128579139709473, "global_step": 277389, "epoch": 1651} {"train_loss": -9.92854118347168, "global_step": 277390, "epoch": 1651} {"train_loss": -9.531198501586914, "global_step": 277391, "epoch": 1651} {"train_loss": -9.836172103881836, "global_step": 277392, "epoch": 1651} {"train_loss": -10.605110168457031, "global_step": 277393, "epoch": 1651} {"train_loss": -9.882071495056152, "global_step": 277394, "epoch": 1651} {"train_loss": -9.331789016723633, "global_step": 277395, "epoch": 1651} {"train_loss": -10.62451171875, "global_step": 277396, "epoch": 1651} {"train_loss": -10.32187271118164, "global_step": 277397, "epoch": 1651} {"train_loss": -9.873953819274902, "global_step": 277398, "epoch": 1651} {"train_loss": -10.590143203735352, "global_step": 277399, "epoch": 1651} {"train_loss": -10.540374755859375, "global_step": 277400, "epoch": 1651} {"train_loss": -10.795144081115723, "global_step": 277401, "epoch": 1651} {"train_loss": -11.013290405273438, "global_step": 277402, "epoch": 1651} {"train_loss": -10.542072296142578, "global_step": 277403, "epoch": 1651} {"train_loss": -10.905259132385254, "global_step": 277404, "epoch": 1651} {"train_loss": -10.65493106842041, "global_step": 277405, "epoch": 1651} {"train_loss": -10.556344032287598, "global_step": 277406, "epoch": 1651} {"train_loss": -11.567405700683594, "global_step": 277407, "epoch": 1651} {"train_loss": -10.730992317199707, "global_step": 277408, "epoch": 1651} {"train_loss": -11.14554214477539, "global_step": 277409, "epoch": 1651} {"train_loss": -11.129615783691406, "global_step": 277410, "epoch": 1651} {"train_loss": -11.049638748168945, "global_step": 277411, "epoch": 1651} {"train_loss": -11.297070503234863, "global_step": 277412, "epoch": 1651} {"train_loss": -11.187023162841797, "global_step": 277413, "epoch": 1651} {"train_loss": -11.197419166564941, "global_step": 277414, "epoch": 1651} {"train_loss": -11.303707122802734, "global_step": 277415, "epoch": 1651} {"train_loss": -11.377429962158203, "global_step": 277416, "epoch": 1651} {"train_loss": -11.564692497253418, "global_step": 277417, "epoch": 1651} {"train_loss": -11.277993202209473, "global_step": 277418, "epoch": 1651} {"train_loss": -11.335580825805664, "global_step": 277419, "epoch": 1651} {"train_loss": -11.372739791870117, "global_step": 277420, "epoch": 1651} {"train_loss": -11.466812133789062, "global_step": 277421, "epoch": 1651} {"train_loss": -11.659010887145996, "global_step": 277422, "epoch": 1651} {"train_loss": -11.46009635925293, "global_step": 277423, "epoch": 1651} {"train_loss": -11.647611618041992, "global_step": 277424, "epoch": 1651} {"train_loss": -11.405405044555664, "global_step": 277425, "epoch": 1651} {"train_loss": -11.624205589294434, "global_step": 277426, "epoch": 1651} {"train_loss": -11.63552188873291, "global_step": 277427, "epoch": 1651} {"train_loss": -11.312112808227539, "global_step": 277428, "epoch": 1651} {"train_loss": -11.646833419799805, "global_step": 277429, "epoch": 1651} {"train_loss": -11.71075439453125, "global_step": 277430, "epoch": 1651} {"train_loss": -11.522822380065918, "global_step": 277431, "epoch": 1651} {"train_loss": -11.5390625, "global_step": 277432, "epoch": 1651} {"train_loss": -11.877567291259766, "global_step": 277433, "epoch": 1651} {"train_loss": -11.563129425048828, "global_step": 277434, "epoch": 1651} {"train_loss": -11.804193496704102, "global_step": 277435, "epoch": 1651} {"train_loss": -11.71141242980957, "global_step": 277436, "epoch": 1651} {"train_loss": -11.878466606140137, "global_step": 277437, "epoch": 1651} {"train_loss": -11.781991958618164, "global_step": 277438, "epoch": 1651} {"train_loss": -11.904953002929688, "global_step": 277439, "epoch": 1651} {"train_loss": -11.805669784545898, "global_step": 277440, "epoch": 1651} {"train_loss": -11.799713134765625, "global_step": 277441, "epoch": 1651} {"train_loss": -11.542925834655762, "global_step": 277442, "epoch": 1651} {"train_loss": -11.817456245422363, "global_step": 277443, "epoch": 1651} {"train_loss": -11.819690704345703, "global_step": 277444, "epoch": 1651} {"train_loss": -11.98441219329834, "global_step": 277445, "epoch": 1651} {"train_loss": -11.845619201660156, "global_step": 277446, "epoch": 1651} {"train_loss": -11.880166053771973, "global_step": 277447, "epoch": 1651} {"train_loss": -11.863887786865234, "global_step": 277448, "epoch": 1651} {"train_loss": -11.910513877868652, "global_step": 277449, "epoch": 1651} {"train_loss": -12.015861511230469, "global_step": 277450, "epoch": 1651} {"train_loss": -11.84091567993164, "global_step": 277451, "epoch": 1651} {"train_loss": -11.981285095214844, "global_step": 277452, "epoch": 1651} {"train_loss": -12.097221374511719, "global_step": 277453, "epoch": 1651} {"train_loss": -11.783975601196289, "global_step": 277454, "epoch": 1651} {"train_loss": -12.117042541503906, "global_step": 277455, "epoch": 1651} {"train_loss": -12.034441947937012, "global_step": 277456, "epoch": 1651} {"train_loss": -11.930086135864258, "global_step": 277457, "epoch": 1651} {"train_loss": -12.024738311767578, "global_step": 277458, "epoch": 1651} {"train_loss": -12.072111129760742, "global_step": 277459, "epoch": 1651} {"train_loss": -12.065088272094727, "global_step": 277460, "epoch": 1651} {"train_loss": -12.205520629882812, "global_step": 277461, "epoch": 1651} {"train_loss": -12.07458782196045, "global_step": 277462, "epoch": 1651} {"train_loss": -11.979873657226562, "global_step": 277463, "epoch": 1651} {"train_loss": -12.162860870361328, "global_step": 277464, "epoch": 1651} {"train_loss": -12.132399559020996, "global_step": 277465, "epoch": 1651} {"train_loss": -12.125703811645508, "global_step": 277466, "epoch": 1651} {"train_loss": -11.789974212646484, "global_step": 277467, "epoch": 1651} {"train_loss": -12.193449974060059, "global_step": 277468, "epoch": 1651} {"train_loss": -12.02134895324707, "global_step": 277469, "epoch": 1651} {"train_loss": -12.295343399047852, "global_step": 277470, "epoch": 1651} {"train_loss": -12.160503387451172, "global_step": 277471, "epoch": 1651} {"train_loss": -12.048648834228516, "global_step": 277472, "epoch": 1651} {"train_loss": -12.131021499633789, "global_step": 277473, "epoch": 1651} {"train_loss": -12.363365173339844, "global_step": 277474, "epoch": 1651} {"train_loss": -12.093475341796875, "global_step": 277475, "epoch": 1651} {"train_loss": -12.264972686767578, "global_step": 277476, "epoch": 1651} {"train_loss": -12.10152816772461, "global_step": 277477, "epoch": 1651} {"train_loss": -12.187732696533203, "global_step": 277478, "epoch": 1651} {"train_loss": -12.375829696655273, "global_step": 277479, "epoch": 1651} {"train_loss": -12.197099685668945, "global_step": 277480, "epoch": 1651} {"train_loss": -12.24101734161377, "global_step": 277481, "epoch": 1651} {"train_loss": -12.200630187988281, "global_step": 277482, "epoch": 1651} {"train_loss": -12.115547180175781, "global_step": 277483, "epoch": 1651} {"train_loss": -12.41700267791748, "global_step": 277484, "epoch": 1651} {"train_loss": -12.21571159362793, "global_step": 277485, "epoch": 1651} {"train_loss": -12.320489883422852, "global_step": 277486, "epoch": 1651} {"train_loss": -12.324600219726562, "global_step": 277487, "epoch": 1651} {"train_loss": -11.865431785583496, "global_step": 277488, "epoch": 1651} {"train_loss": -12.279829025268555, "global_step": 277489, "epoch": 1651} {"train_loss": -12.077640533447266, "global_step": 277490, "epoch": 1651} {"train_loss": -12.355569839477539, "global_step": 277491, "epoch": 1651} {"train_loss": -12.03894329071045, "global_step": 277492, "epoch": 1651} {"train_loss": -11.977806091308594, "global_step": 277493, "epoch": 1651} {"train_loss": -12.196366310119629, "global_step": 277494, "epoch": 1651} {"train_loss": -12.037639617919922, "global_step": 277495, "epoch": 1651} {"train_loss": -12.02878189086914, "global_step": 277496, "epoch": 1651} {"train_loss": -11.997326850891113, "global_step": 277497, "epoch": 1651} {"train_loss": -12.210556030273438, "global_step": 277498, "epoch": 1651} {"train_loss": -12.089957237243652, "global_step": 277499, "epoch": 1651} {"train_loss": -11.999332427978516, "global_step": 277500, "epoch": 1651} {"train_loss": -11.903583526611328, "global_step": 277501, "epoch": 1651} {"train_loss": -12.419015884399414, "global_step": 277502, "epoch": 1651} {"train_loss": -11.7830171585083, "global_step": 277503, "epoch": 1651} {"train_loss": -11.574676513671875, "global_step": 277504, "epoch": 1651} {"train_loss": -11.60183048248291, "global_step": 277505, "epoch": 1651} {"train_loss": -11.715517044067383, "global_step": 277506, "epoch": 1651} {"train_loss": -11.716930389404297, "global_step": 277507, "epoch": 1651} {"train_loss": -11.834835052490234, "global_step": 277508, "epoch": 1651} {"train_loss": -12.029352188110352, "global_step": 277509, "epoch": 1651} {"train_loss": -12.244552612304688, "global_step": 277510, "epoch": 1651} {"train_loss": -11.91952133178711, "global_step": 277511, "epoch": 1651} {"train_loss": -11.781545639038086, "global_step": 277512, "epoch": 1651} {"train_loss": -11.889248847961426, "global_step": 277513, "epoch": 1651} {"train_loss": -11.948833465576172, "global_step": 277514, "epoch": 1651} {"train_loss": -11.665385246276855, "global_step": 277515, "epoch": 1651} {"train_loss": -11.847596168518066, "global_step": 277516, "epoch": 1651} {"train_loss": -11.854293823242188, "global_step": 277517, "epoch": 1651} {"train_loss": -12.060420989990234, "global_step": 277518, "epoch": 1651} {"train_loss": -12.013643264770508, "global_step": 277519, "epoch": 1651} {"train_loss": -12.194812774658203, "global_step": 277520, "epoch": 1651} {"train_loss": -12.252983093261719, "global_step": 277521, "epoch": 1651} {"train_loss": -12.044635772705078, "global_step": 277522, "epoch": 1651} {"train_loss": -11.862610816955566, "global_step": 277523, "epoch": 1651} {"train_loss": -12.075876235961914, "global_step": 277524, "epoch": 1651} {"train_loss": -12.006717681884766, "global_step": 277525, "epoch": 1651} {"train_loss": -11.971969604492188, "global_step": 277526, "epoch": 1651} {"train_loss": -11.720908164978027, "global_step": 277527, "epoch": 1651} {"train_loss": -12.432682037353516, "global_step": 277528, "epoch": 1651} {"train_loss": -11.936272621154785, "global_step": 277529, "epoch": 1651} {"train_loss": -11.691701889038086, "global_step": 277530, "epoch": 1651} {"train_loss": -12.230846405029297, "global_step": 277531, "epoch": 1651} {"train_loss": -12.284692764282227, "global_step": 277532, "epoch": 1651} {"train_loss": -11.871417999267578, "global_step": 277533, "epoch": 1651} {"train_loss": -10.967411041259766, "global_step": 277534, "epoch": 1651} {"train_loss": -11.412314102763222, "global_step": 277535, "epoch": 1651, "val_loss": 268228.65625} {"train_loss": -11.14769172668457, "global_step": 277536, "epoch": 1652} {"train_loss": -9.394489288330078, "global_step": 277537, "epoch": 1652} {"train_loss": -11.73099136352539, "global_step": 277538, "epoch": 1652} {"train_loss": -10.550796508789062, "global_step": 277539, "epoch": 1652} {"train_loss": -10.475133895874023, "global_step": 277540, "epoch": 1652} {"train_loss": -11.395256042480469, "global_step": 277541, "epoch": 1652} {"train_loss": -9.214920043945312, "global_step": 277542, "epoch": 1652} {"train_loss": -10.952888488769531, "global_step": 277543, "epoch": 1652} {"train_loss": -10.711462020874023, "global_step": 277544, "epoch": 1652} {"train_loss": -9.341072082519531, "global_step": 277545, "epoch": 1652} {"train_loss": -10.29002571105957, "global_step": 277546, "epoch": 1652} {"train_loss": -8.72491455078125, "global_step": 277547, "epoch": 1652} {"train_loss": -11.075135231018066, "global_step": 277548, "epoch": 1652} {"train_loss": -9.938331604003906, "global_step": 277549, "epoch": 1652} {"train_loss": -11.069784164428711, "global_step": 277550, "epoch": 1652} {"train_loss": -10.282812118530273, "global_step": 277551, "epoch": 1652} {"train_loss": -11.466065406799316, "global_step": 277552, "epoch": 1652} {"train_loss": -10.73245906829834, "global_step": 277553, "epoch": 1652} {"train_loss": -10.6226806640625, "global_step": 277554, "epoch": 1652} {"train_loss": -11.22958755493164, "global_step": 277555, "epoch": 1652} {"train_loss": -10.417402267456055, "global_step": 277556, "epoch": 1652} {"train_loss": -11.645201683044434, "global_step": 277557, "epoch": 1652} {"train_loss": -11.280601501464844, "global_step": 277558, "epoch": 1652} {"train_loss": -11.499092102050781, "global_step": 277559, "epoch": 1652} {"train_loss": -11.639656066894531, "global_step": 277560, "epoch": 1652} {"train_loss": -11.269695281982422, "global_step": 277561, "epoch": 1652} {"train_loss": -11.632303237915039, "global_step": 277562, "epoch": 1652} {"train_loss": -11.597977638244629, "global_step": 277563, "epoch": 1652} {"train_loss": -11.264833450317383, "global_step": 277564, "epoch": 1652} {"train_loss": -11.430883407592773, "global_step": 277565, "epoch": 1652} {"train_loss": -11.306026458740234, "global_step": 277566, "epoch": 1652} {"train_loss": -11.644012451171875, "global_step": 277567, "epoch": 1652} {"train_loss": -11.485554695129395, "global_step": 277568, "epoch": 1652} {"train_loss": -11.729337692260742, "global_step": 277569, "epoch": 1652} {"train_loss": -11.507919311523438, "global_step": 277570, "epoch": 1652} {"train_loss": -11.935998916625977, "global_step": 277571, "epoch": 1652} {"train_loss": -11.73419189453125, "global_step": 277572, "epoch": 1652} {"train_loss": -11.817463874816895, "global_step": 277573, "epoch": 1652} {"train_loss": -11.659310340881348, "global_step": 277574, "epoch": 1652} {"train_loss": -11.812625885009766, "global_step": 277575, "epoch": 1652} {"train_loss": -11.822040557861328, "global_step": 277576, "epoch": 1652} {"train_loss": -11.868450164794922, "global_step": 277577, "epoch": 1652} {"train_loss": -11.564485549926758, "global_step": 277578, "epoch": 1652} {"train_loss": -11.879244804382324, "global_step": 277579, "epoch": 1652} {"train_loss": -11.875312805175781, "global_step": 277580, "epoch": 1652} {"train_loss": -11.769952774047852, "global_step": 277581, "epoch": 1652} {"train_loss": -11.792816162109375, "global_step": 277582, "epoch": 1652} {"train_loss": -11.810192108154297, "global_step": 277583, "epoch": 1652} {"train_loss": -11.858062744140625, "global_step": 277584, "epoch": 1652} {"train_loss": -11.689981460571289, "global_step": 277585, "epoch": 1652} {"train_loss": -12.140119552612305, "global_step": 277586, "epoch": 1652} {"train_loss": -11.864476203918457, "global_step": 277587, "epoch": 1652} {"train_loss": -11.980650901794434, "global_step": 277588, "epoch": 1652} {"train_loss": -11.891107559204102, "global_step": 277589, "epoch": 1652} {"train_loss": -11.96347427368164, "global_step": 277590, "epoch": 1652} {"train_loss": -11.939958572387695, "global_step": 277591, "epoch": 1652} {"train_loss": -11.991999626159668, "global_step": 277592, "epoch": 1652} {"train_loss": -12.001596450805664, "global_step": 277593, "epoch": 1652} {"train_loss": -11.886940002441406, "global_step": 277594, "epoch": 1652} {"train_loss": -12.003778457641602, "global_step": 277595, "epoch": 1652} {"train_loss": -12.080785751342773, "global_step": 277596, "epoch": 1652} {"train_loss": -11.849857330322266, "global_step": 277597, "epoch": 1652} {"train_loss": -11.918359756469727, "global_step": 277598, "epoch": 1652} {"train_loss": -11.409490585327148, "global_step": 277599, "epoch": 1652} {"train_loss": -11.88490104675293, "global_step": 277600, "epoch": 1652} {"train_loss": -11.628068923950195, "global_step": 277601, "epoch": 1652} {"train_loss": -11.861074447631836, "global_step": 277602, "epoch": 1652} {"train_loss": -11.293806076049805, "global_step": 277603, "epoch": 1652} {"train_loss": -12.246841430664062, "global_step": 277604, "epoch": 1652} {"train_loss": -11.545397758483887, "global_step": 277605, "epoch": 1652} {"train_loss": -11.70645523071289, "global_step": 277606, "epoch": 1652} {"train_loss": -11.488298416137695, "global_step": 277607, "epoch": 1652} {"train_loss": -11.724517822265625, "global_step": 277608, "epoch": 1652} {"train_loss": -11.247358322143555, "global_step": 277609, "epoch": 1652} {"train_loss": -12.025040626525879, "global_step": 277610, "epoch": 1652} {"train_loss": -11.456463813781738, "global_step": 277611, "epoch": 1652} {"train_loss": -11.290487289428711, "global_step": 277612, "epoch": 1652} {"train_loss": -12.118208885192871, "global_step": 277613, "epoch": 1652} {"train_loss": -11.249221801757812, "global_step": 277614, "epoch": 1652} {"train_loss": -12.13308334350586, "global_step": 277615, "epoch": 1652} {"train_loss": -11.865270614624023, "global_step": 277616, "epoch": 1652} {"train_loss": -11.910390853881836, "global_step": 277617, "epoch": 1652} {"train_loss": -11.897368431091309, "global_step": 277618, "epoch": 1652} {"train_loss": -11.686614990234375, "global_step": 277619, "epoch": 1652} {"train_loss": -11.945459365844727, "global_step": 277620, "epoch": 1652} {"train_loss": -11.836747169494629, "global_step": 277621, "epoch": 1652} {"train_loss": -11.61994743347168, "global_step": 277622, "epoch": 1652} {"train_loss": -12.124847412109375, "global_step": 277623, "epoch": 1652} {"train_loss": -10.912397384643555, "global_step": 277624, "epoch": 1652} {"train_loss": -11.660896301269531, "global_step": 277625, "epoch": 1652} {"train_loss": -11.797748565673828, "global_step": 277626, "epoch": 1652} {"train_loss": -11.333137512207031, "global_step": 277627, "epoch": 1652} {"train_loss": -11.791492462158203, "global_step": 277628, "epoch": 1652} {"train_loss": -11.689239501953125, "global_step": 277629, "epoch": 1652} {"train_loss": -11.531225204467773, "global_step": 277630, "epoch": 1652} {"train_loss": -11.815393447875977, "global_step": 277631, "epoch": 1652} {"train_loss": -11.375764846801758, "global_step": 277632, "epoch": 1652} {"train_loss": -11.584463119506836, "global_step": 277633, "epoch": 1652} {"train_loss": -11.670024871826172, "global_step": 277634, "epoch": 1652} {"train_loss": -11.57118034362793, "global_step": 277635, "epoch": 1652} {"train_loss": -11.926326751708984, "global_step": 277636, "epoch": 1652} {"train_loss": -11.731082916259766, "global_step": 277637, "epoch": 1652} {"train_loss": -12.104052543640137, "global_step": 277638, "epoch": 1652} {"train_loss": -11.830257415771484, "global_step": 277639, "epoch": 1652} {"train_loss": -12.160602569580078, "global_step": 277640, "epoch": 1652} {"train_loss": -11.71181869506836, "global_step": 277641, "epoch": 1652} {"train_loss": -11.95895004272461, "global_step": 277642, "epoch": 1652} {"train_loss": -12.084651947021484, "global_step": 277643, "epoch": 1652} {"train_loss": -12.071910858154297, "global_step": 277644, "epoch": 1652} {"train_loss": -11.893331527709961, "global_step": 277645, "epoch": 1652} {"train_loss": -12.072259902954102, "global_step": 277646, "epoch": 1652} {"train_loss": -12.122198104858398, "global_step": 277647, "epoch": 1652} {"train_loss": -12.156103134155273, "global_step": 277648, "epoch": 1652} {"train_loss": -11.990242004394531, "global_step": 277649, "epoch": 1652} {"train_loss": -12.084417343139648, "global_step": 277650, "epoch": 1652} {"train_loss": -12.216728210449219, "global_step": 277651, "epoch": 1652} {"train_loss": -12.3306303024292, "global_step": 277652, "epoch": 1652} {"train_loss": -12.071307182312012, "global_step": 277653, "epoch": 1652} {"train_loss": -12.015905380249023, "global_step": 277654, "epoch": 1652} {"train_loss": -12.153768539428711, "global_step": 277655, "epoch": 1652} {"train_loss": -12.100741386413574, "global_step": 277656, "epoch": 1652} {"train_loss": -11.848560333251953, "global_step": 277657, "epoch": 1652} {"train_loss": -12.148078918457031, "global_step": 277658, "epoch": 1652} {"train_loss": -12.173805236816406, "global_step": 277659, "epoch": 1652} {"train_loss": -12.117324829101562, "global_step": 277660, "epoch": 1652} {"train_loss": -11.90427017211914, "global_step": 277661, "epoch": 1652} {"train_loss": -11.956625938415527, "global_step": 277662, "epoch": 1652} {"train_loss": -12.137603759765625, "global_step": 277663, "epoch": 1652} {"train_loss": -12.132670402526855, "global_step": 277664, "epoch": 1652} {"train_loss": -12.047815322875977, "global_step": 277665, "epoch": 1652} {"train_loss": -12.090356826782227, "global_step": 277666, "epoch": 1652} {"train_loss": -12.461429595947266, "global_step": 277667, "epoch": 1652} {"train_loss": -12.22062873840332, "global_step": 277668, "epoch": 1652} {"train_loss": -12.198997497558594, "global_step": 277669, "epoch": 1652} {"train_loss": -11.836456298828125, "global_step": 277670, "epoch": 1652} {"train_loss": -11.997984886169434, "global_step": 277671, "epoch": 1652} {"train_loss": -12.101303100585938, "global_step": 277672, "epoch": 1652} {"train_loss": -12.257232666015625, "global_step": 277673, "epoch": 1652} {"train_loss": -12.234333038330078, "global_step": 277674, "epoch": 1652} {"train_loss": -12.116637229919434, "global_step": 277675, "epoch": 1652} {"train_loss": -12.169841766357422, "global_step": 277676, "epoch": 1652} {"train_loss": -12.004670143127441, "global_step": 277677, "epoch": 1652} {"train_loss": -12.232519149780273, "global_step": 277678, "epoch": 1652} {"train_loss": -11.696151733398438, "global_step": 277679, "epoch": 1652} {"train_loss": -12.166162490844727, "global_step": 277680, "epoch": 1652} {"train_loss": -11.875833511352539, "global_step": 277681, "epoch": 1652} {"train_loss": -11.819450378417969, "global_step": 277682, "epoch": 1652} {"train_loss": -11.67407512664795, "global_step": 277683, "epoch": 1652} {"train_loss": -11.434856414794922, "global_step": 277684, "epoch": 1652} {"train_loss": -9.797935485839844, "global_step": 277685, "epoch": 1652} {"train_loss": -9.529744148254395, "global_step": 277686, "epoch": 1652} {"train_loss": -11.110626220703125, "global_step": 277687, "epoch": 1652} {"train_loss": -9.865219116210938, "global_step": 277688, "epoch": 1652} {"train_loss": -8.652578353881836, "global_step": 277689, "epoch": 1652} {"train_loss": -9.805986404418945, "global_step": 277690, "epoch": 1652} {"train_loss": -10.115133285522461, "global_step": 277691, "epoch": 1652} {"train_loss": -11.164045333862305, "global_step": 277692, "epoch": 1652} {"train_loss": -8.863519668579102, "global_step": 277693, "epoch": 1652} {"train_loss": -11.040915489196777, "global_step": 277694, "epoch": 1652} {"train_loss": -8.972736358642578, "global_step": 277695, "epoch": 1652} {"train_loss": -9.788296699523926, "global_step": 277696, "epoch": 1652} {"train_loss": -6.8707170486450195, "global_step": 277697, "epoch": 1652} {"train_loss": -7.059179782867432, "global_step": 277698, "epoch": 1652} {"train_loss": -6.339780807495117, "global_step": 277699, "epoch": 1652} {"train_loss": -6.0167236328125, "global_step": 277700, "epoch": 1652} {"train_loss": -5.954824447631836, "global_step": 277701, "epoch": 1652} {"train_loss": -5.769094467163086, "global_step": 277702, "epoch": 1652} {"train_loss": -11.301563262939453, "global_step": 277703, "epoch": 1652, "val_loss": 268522.53125} {"train_loss": -6.644220352172852, "global_step": 277704, "epoch": 1653} {"train_loss": -6.966529846191406, "global_step": 277705, "epoch": 1653} {"train_loss": -7.228949069976807, "global_step": 277706, "epoch": 1653} {"train_loss": -7.334834098815918, "global_step": 277707, "epoch": 1653} {"train_loss": -7.803685188293457, "global_step": 277708, "epoch": 1653} {"train_loss": -7.806861877441406, "global_step": 277709, "epoch": 1653} {"train_loss": -8.423437118530273, "global_step": 277710, "epoch": 1653} {"train_loss": -8.010480880737305, "global_step": 277711, "epoch": 1653} {"train_loss": -8.426427841186523, "global_step": 277712, "epoch": 1653} {"train_loss": -8.171010971069336, "global_step": 277713, "epoch": 1653} {"train_loss": -7.94450569152832, "global_step": 277714, "epoch": 1653} {"train_loss": -8.459035873413086, "global_step": 277715, "epoch": 1653} {"train_loss": -8.701253890991211, "global_step": 277716, "epoch": 1653} {"train_loss": -8.630487442016602, "global_step": 277717, "epoch": 1653} {"train_loss": -9.13595962524414, "global_step": 277718, "epoch": 1653} {"train_loss": -9.352174758911133, "global_step": 277719, "epoch": 1653} {"train_loss": -9.616579055786133, "global_step": 277720, "epoch": 1653} {"train_loss": -9.928400039672852, "global_step": 277721, "epoch": 1653} {"train_loss": -9.764073371887207, "global_step": 277722, "epoch": 1653} {"train_loss": -9.951163291931152, "global_step": 277723, "epoch": 1653} {"train_loss": -10.228584289550781, "global_step": 277724, "epoch": 1653} {"train_loss": -10.453096389770508, "global_step": 277725, "epoch": 1653} {"train_loss": -10.774846076965332, "global_step": 277726, "epoch": 1653} {"train_loss": -10.859722137451172, "global_step": 277727, "epoch": 1653} {"train_loss": -10.786113739013672, "global_step": 277728, "epoch": 1653} {"train_loss": -11.173600196838379, "global_step": 277729, "epoch": 1653} {"train_loss": -10.977453231811523, "global_step": 277730, "epoch": 1653} {"train_loss": -10.917928695678711, "global_step": 277731, "epoch": 1653} {"train_loss": -10.762889862060547, "global_step": 277732, "epoch": 1653} {"train_loss": -11.375897407531738, "global_step": 277733, "epoch": 1653} {"train_loss": -11.280351638793945, "global_step": 277734, "epoch": 1653} {"train_loss": -11.46841812133789, "global_step": 277735, "epoch": 1653} {"train_loss": -11.421809196472168, "global_step": 277736, "epoch": 1653} {"train_loss": -11.478690147399902, "global_step": 277737, "epoch": 1653} {"train_loss": -11.493764877319336, "global_step": 277738, "epoch": 1653} {"train_loss": -11.183923721313477, "global_step": 277739, "epoch": 1653} {"train_loss": -11.4161958694458, "global_step": 277740, "epoch": 1653} {"train_loss": -11.589299201965332, "global_step": 277741, "epoch": 1653} {"train_loss": -11.725324630737305, "global_step": 277742, "epoch": 1653} {"train_loss": -11.582880020141602, "global_step": 277743, "epoch": 1653} {"train_loss": -11.595589637756348, "global_step": 277744, "epoch": 1653} {"train_loss": -11.422966957092285, "global_step": 277745, "epoch": 1653} {"train_loss": -11.418572425842285, "global_step": 277746, "epoch": 1653} {"train_loss": -11.696229934692383, "global_step": 277747, "epoch": 1653} {"train_loss": -11.532632827758789, "global_step": 277748, "epoch": 1653} {"train_loss": -11.602178573608398, "global_step": 277749, "epoch": 1653} {"train_loss": -11.619868278503418, "global_step": 277750, "epoch": 1653} {"train_loss": -11.488512992858887, "global_step": 277751, "epoch": 1653} {"train_loss": -11.624187469482422, "global_step": 277752, "epoch": 1653} {"train_loss": -11.6815824508667, "global_step": 277753, "epoch": 1653} {"train_loss": -11.609062194824219, "global_step": 277754, "epoch": 1653} {"train_loss": -11.598249435424805, "global_step": 277755, "epoch": 1653} {"train_loss": -11.854427337646484, "global_step": 277756, "epoch": 1653} {"train_loss": -11.466451644897461, "global_step": 277757, "epoch": 1653} {"train_loss": -11.620309829711914, "global_step": 277758, "epoch": 1653} {"train_loss": -11.918450355529785, "global_step": 277759, "epoch": 1653} {"train_loss": -11.648996353149414, "global_step": 277760, "epoch": 1653} {"train_loss": -11.749872207641602, "global_step": 277761, "epoch": 1653} {"train_loss": -11.865551948547363, "global_step": 277762, "epoch": 1653} {"train_loss": -11.885417938232422, "global_step": 277763, "epoch": 1653} {"train_loss": -11.685452461242676, "global_step": 277764, "epoch": 1653} {"train_loss": -11.940217018127441, "global_step": 277765, "epoch": 1653} {"train_loss": -11.902777671813965, "global_step": 277766, "epoch": 1653} {"train_loss": -11.972057342529297, "global_step": 277767, "epoch": 1653} {"train_loss": -12.080488204956055, "global_step": 277768, "epoch": 1653} {"train_loss": -12.185426712036133, "global_step": 277769, "epoch": 1653} {"train_loss": -11.874637603759766, "global_step": 277770, "epoch": 1653} {"train_loss": -12.080326080322266, "global_step": 277771, "epoch": 1653} {"train_loss": -11.809614181518555, "global_step": 277772, "epoch": 1653} {"train_loss": -11.667268753051758, "global_step": 277773, "epoch": 1653} {"train_loss": -12.081864356994629, "global_step": 277774, "epoch": 1653} {"train_loss": -11.756669044494629, "global_step": 277775, "epoch": 1653} {"train_loss": -12.122894287109375, "global_step": 277776, "epoch": 1653} {"train_loss": -11.979965209960938, "global_step": 277777, "epoch": 1653} {"train_loss": -11.912278175354004, "global_step": 277778, "epoch": 1653} {"train_loss": -12.109652519226074, "global_step": 277779, "epoch": 1653} {"train_loss": -12.228105545043945, "global_step": 277780, "epoch": 1653} {"train_loss": -12.027430534362793, "global_step": 277781, "epoch": 1653} {"train_loss": -11.996733665466309, "global_step": 277782, "epoch": 1653} {"train_loss": -11.986273765563965, "global_step": 277783, "epoch": 1653} {"train_loss": -12.1182861328125, "global_step": 277784, "epoch": 1653} {"train_loss": -12.089818000793457, "global_step": 277785, "epoch": 1653} {"train_loss": -12.013585090637207, "global_step": 277786, "epoch": 1653} {"train_loss": -11.88222885131836, "global_step": 277787, "epoch": 1653} {"train_loss": -12.024543762207031, "global_step": 277788, "epoch": 1653} {"train_loss": -11.863869667053223, "global_step": 277789, "epoch": 1653} {"train_loss": -12.071223258972168, "global_step": 277790, "epoch": 1653} {"train_loss": -12.321490287780762, "global_step": 277791, "epoch": 1653} {"train_loss": -12.14879035949707, "global_step": 277792, "epoch": 1653} {"train_loss": -12.302921295166016, "global_step": 277793, "epoch": 1653} {"train_loss": -11.990891456604004, "global_step": 277794, "epoch": 1653} {"train_loss": -12.2103853225708, "global_step": 277795, "epoch": 1653} {"train_loss": -12.056596755981445, "global_step": 277796, "epoch": 1653} {"train_loss": -12.325349807739258, "global_step": 277797, "epoch": 1653} {"train_loss": -12.305755615234375, "global_step": 277798, "epoch": 1653} {"train_loss": -12.38288402557373, "global_step": 277799, "epoch": 1653} {"train_loss": -12.188882827758789, "global_step": 277800, "epoch": 1653} {"train_loss": -12.147647857666016, "global_step": 277801, "epoch": 1653} {"train_loss": -12.26596450805664, "global_step": 277802, "epoch": 1653} {"train_loss": -12.136640548706055, "global_step": 277803, "epoch": 1653} {"train_loss": -12.025315284729004, "global_step": 277804, "epoch": 1653} {"train_loss": -12.246442794799805, "global_step": 277805, "epoch": 1653} {"train_loss": -12.134836196899414, "global_step": 277806, "epoch": 1653} {"train_loss": -12.354413986206055, "global_step": 277807, "epoch": 1653} {"train_loss": -12.250967979431152, "global_step": 277808, "epoch": 1653} {"train_loss": -11.90317153930664, "global_step": 277809, "epoch": 1653} {"train_loss": -11.87232494354248, "global_step": 277810, "epoch": 1653} {"train_loss": -12.231191635131836, "global_step": 277811, "epoch": 1653} {"train_loss": -11.750455856323242, "global_step": 277812, "epoch": 1653} {"train_loss": -10.933660507202148, "global_step": 277813, "epoch": 1653} {"train_loss": -10.972162246704102, "global_step": 277814, "epoch": 1653} {"train_loss": -11.7863187789917, "global_step": 277815, "epoch": 1653} {"train_loss": -10.210142135620117, "global_step": 277816, "epoch": 1653} {"train_loss": -10.415114402770996, "global_step": 277817, "epoch": 1653} {"train_loss": -11.358685493469238, "global_step": 277818, "epoch": 1653} {"train_loss": -11.690837860107422, "global_step": 277819, "epoch": 1653} {"train_loss": -11.560115814208984, "global_step": 277820, "epoch": 1653} {"train_loss": -11.629067420959473, "global_step": 277821, "epoch": 1653} {"train_loss": -12.230268478393555, "global_step": 277822, "epoch": 1653} {"train_loss": -11.25273323059082, "global_step": 277823, "epoch": 1653} {"train_loss": -12.112113952636719, "global_step": 277824, "epoch": 1653} {"train_loss": -11.146278381347656, "global_step": 277825, "epoch": 1653} {"train_loss": -11.942838668823242, "global_step": 277826, "epoch": 1653} {"train_loss": -11.280328750610352, "global_step": 277827, "epoch": 1653} {"train_loss": -11.363659858703613, "global_step": 277828, "epoch": 1653} {"train_loss": -11.052160263061523, "global_step": 277829, "epoch": 1653} {"train_loss": -11.80622673034668, "global_step": 277830, "epoch": 1653} {"train_loss": -10.201272964477539, "global_step": 277831, "epoch": 1653} {"train_loss": -12.058012008666992, "global_step": 277832, "epoch": 1653} {"train_loss": -10.931934356689453, "global_step": 277833, "epoch": 1653} {"train_loss": -11.77741527557373, "global_step": 277834, "epoch": 1653} {"train_loss": -10.68368148803711, "global_step": 277835, "epoch": 1653} {"train_loss": -11.84477710723877, "global_step": 277836, "epoch": 1653} {"train_loss": -11.19064712524414, "global_step": 277837, "epoch": 1653} {"train_loss": -12.107684135437012, "global_step": 277838, "epoch": 1653} {"train_loss": -11.47075080871582, "global_step": 277839, "epoch": 1653} {"train_loss": -11.653411865234375, "global_step": 277840, "epoch": 1653} {"train_loss": -11.562467575073242, "global_step": 277841, "epoch": 1653} {"train_loss": -11.550670623779297, "global_step": 277842, "epoch": 1653} {"train_loss": -11.756990432739258, "global_step": 277843, "epoch": 1653} {"train_loss": -11.919893264770508, "global_step": 277844, "epoch": 1653} {"train_loss": -11.898892402648926, "global_step": 277845, "epoch": 1653} {"train_loss": -11.911819458007812, "global_step": 277846, "epoch": 1653} {"train_loss": -11.898794174194336, "global_step": 277847, "epoch": 1653} {"train_loss": -11.950942039489746, "global_step": 277848, "epoch": 1653} {"train_loss": -12.244501113891602, "global_step": 277849, "epoch": 1653} {"train_loss": -12.036300659179688, "global_step": 277850, "epoch": 1653} {"train_loss": -12.26333999633789, "global_step": 277851, "epoch": 1653} {"train_loss": -12.21131420135498, "global_step": 277852, "epoch": 1653} {"train_loss": -12.141021728515625, "global_step": 277853, "epoch": 1653} {"train_loss": -12.266809463500977, "global_step": 277854, "epoch": 1653} {"train_loss": -12.156349182128906, "global_step": 277855, "epoch": 1653} {"train_loss": -12.201122283935547, "global_step": 277856, "epoch": 1653} {"train_loss": -12.12087345123291, "global_step": 277857, "epoch": 1653} {"train_loss": -11.876514434814453, "global_step": 277858, "epoch": 1653} {"train_loss": -11.99241828918457, "global_step": 277859, "epoch": 1653} {"train_loss": -11.773507118225098, "global_step": 277860, "epoch": 1653} {"train_loss": -11.965109825134277, "global_step": 277861, "epoch": 1653} {"train_loss": -11.762229919433594, "global_step": 277862, "epoch": 1653} {"train_loss": -11.776898384094238, "global_step": 277863, "epoch": 1653} {"train_loss": -11.8635892868042, "global_step": 277864, "epoch": 1653} {"train_loss": -12.286641120910645, "global_step": 277865, "epoch": 1653} {"train_loss": -11.965312957763672, "global_step": 277866, "epoch": 1653} {"train_loss": -12.05371379852295, "global_step": 277867, "epoch": 1653} {"train_loss": -11.920015335083008, "global_step": 277868, "epoch": 1653} {"train_loss": -12.298425674438477, "global_step": 277869, "epoch": 1653} {"train_loss": -12.08292293548584, "global_step": 277870, "epoch": 1653} {"train_loss": -11.343042206196557, "global_step": 277871, "epoch": 1653, "val_loss": 274390.0} {"train_loss": -11.835190773010254, "global_step": 277872, "epoch": 1654} {"train_loss": -12.235054016113281, "global_step": 277873, "epoch": 1654} {"train_loss": -11.60841178894043, "global_step": 277874, "epoch": 1654} {"train_loss": -12.228326797485352, "global_step": 277875, "epoch": 1654} {"train_loss": -11.690184593200684, "global_step": 277876, "epoch": 1654} {"train_loss": -11.71691608428955, "global_step": 277877, "epoch": 1654} {"train_loss": -10.091741561889648, "global_step": 277878, "epoch": 1654} {"train_loss": -11.290440559387207, "global_step": 277879, "epoch": 1654} {"train_loss": -9.823497772216797, "global_step": 277880, "epoch": 1654} {"train_loss": -10.801847457885742, "global_step": 277881, "epoch": 1654} {"train_loss": -11.349302291870117, "global_step": 277882, "epoch": 1654} {"train_loss": -10.043142318725586, "global_step": 277883, "epoch": 1654} {"train_loss": -9.723252296447754, "global_step": 277884, "epoch": 1654} {"train_loss": -10.54951286315918, "global_step": 277885, "epoch": 1654} {"train_loss": -10.958837509155273, "global_step": 277886, "epoch": 1654} {"train_loss": -10.835607528686523, "global_step": 277887, "epoch": 1654} {"train_loss": -11.35363483428955, "global_step": 277888, "epoch": 1654} {"train_loss": -10.845941543579102, "global_step": 277889, "epoch": 1654} {"train_loss": -10.509136199951172, "global_step": 277890, "epoch": 1654} {"train_loss": -11.640579223632812, "global_step": 277891, "epoch": 1654} {"train_loss": -10.751884460449219, "global_step": 277892, "epoch": 1654} {"train_loss": -11.659303665161133, "global_step": 277893, "epoch": 1654} {"train_loss": -11.062588691711426, "global_step": 277894, "epoch": 1654} {"train_loss": -11.876638412475586, "global_step": 277895, "epoch": 1654} {"train_loss": -11.417613983154297, "global_step": 277896, "epoch": 1654} {"train_loss": -11.845988273620605, "global_step": 277897, "epoch": 1654} {"train_loss": -11.551301956176758, "global_step": 277898, "epoch": 1654} {"train_loss": -11.827448844909668, "global_step": 277899, "epoch": 1654} {"train_loss": -11.345867156982422, "global_step": 277900, "epoch": 1654} {"train_loss": -11.4346342086792, "global_step": 277901, "epoch": 1654} {"train_loss": -12.021207809448242, "global_step": 277902, "epoch": 1654} {"train_loss": -11.210973739624023, "global_step": 277903, "epoch": 1654} {"train_loss": -11.772235870361328, "global_step": 277904, "epoch": 1654} {"train_loss": -11.872625350952148, "global_step": 277905, "epoch": 1654} {"train_loss": -11.559995651245117, "global_step": 277906, "epoch": 1654} {"train_loss": -11.829422950744629, "global_step": 277907, "epoch": 1654} {"train_loss": -11.704662322998047, "global_step": 277908, "epoch": 1654} {"train_loss": -11.981379508972168, "global_step": 277909, "epoch": 1654} {"train_loss": -12.002954483032227, "global_step": 277910, "epoch": 1654} {"train_loss": -11.988029479980469, "global_step": 277911, "epoch": 1654} {"train_loss": -11.803438186645508, "global_step": 277912, "epoch": 1654} {"train_loss": -11.932621002197266, "global_step": 277913, "epoch": 1654} {"train_loss": -11.97781753540039, "global_step": 277914, "epoch": 1654} {"train_loss": -11.890190124511719, "global_step": 277915, "epoch": 1654} {"train_loss": -11.95113754272461, "global_step": 277916, "epoch": 1654} {"train_loss": -11.832071304321289, "global_step": 277917, "epoch": 1654} {"train_loss": -11.810371398925781, "global_step": 277918, "epoch": 1654} {"train_loss": -11.717246055603027, "global_step": 277919, "epoch": 1654} {"train_loss": -12.132144927978516, "global_step": 277920, "epoch": 1654} {"train_loss": -11.615410804748535, "global_step": 277921, "epoch": 1654} {"train_loss": -11.8759765625, "global_step": 277922, "epoch": 1654} {"train_loss": -12.123137474060059, "global_step": 277923, "epoch": 1654} {"train_loss": -11.579595565795898, "global_step": 277924, "epoch": 1654} {"train_loss": -12.020329475402832, "global_step": 277925, "epoch": 1654} {"train_loss": -11.729632377624512, "global_step": 277926, "epoch": 1654} {"train_loss": -12.000507354736328, "global_step": 277927, "epoch": 1654} {"train_loss": -12.046138763427734, "global_step": 277928, "epoch": 1654} {"train_loss": -12.37765121459961, "global_step": 277929, "epoch": 1654} {"train_loss": -12.172297477722168, "global_step": 277930, "epoch": 1654} {"train_loss": -12.141590118408203, "global_step": 277931, "epoch": 1654} {"train_loss": -11.870311737060547, "global_step": 277932, "epoch": 1654} {"train_loss": -12.132892608642578, "global_step": 277933, "epoch": 1654} {"train_loss": -12.039892196655273, "global_step": 277934, "epoch": 1654} {"train_loss": -12.04371166229248, "global_step": 277935, "epoch": 1654} {"train_loss": -12.084054946899414, "global_step": 277936, "epoch": 1654} {"train_loss": -12.113547325134277, "global_step": 277937, "epoch": 1654} {"train_loss": -11.82810115814209, "global_step": 277938, "epoch": 1654} {"train_loss": -12.007105827331543, "global_step": 277939, "epoch": 1654} {"train_loss": -12.118744850158691, "global_step": 277940, "epoch": 1654} {"train_loss": -12.09109115600586, "global_step": 277941, "epoch": 1654} {"train_loss": -11.981383323669434, "global_step": 277942, "epoch": 1654} {"train_loss": -12.132083892822266, "global_step": 277943, "epoch": 1654} {"train_loss": -12.143277168273926, "global_step": 277944, "epoch": 1654} {"train_loss": -12.249296188354492, "global_step": 277945, "epoch": 1654} {"train_loss": -12.218111038208008, "global_step": 277946, "epoch": 1654} {"train_loss": -12.003961563110352, "global_step": 277947, "epoch": 1654} {"train_loss": -11.97221565246582, "global_step": 277948, "epoch": 1654} {"train_loss": -11.98746109008789, "global_step": 277949, "epoch": 1654} {"train_loss": -12.04050350189209, "global_step": 277950, "epoch": 1654} {"train_loss": -11.806354522705078, "global_step": 277951, "epoch": 1654} {"train_loss": -12.27873706817627, "global_step": 277952, "epoch": 1654} {"train_loss": -11.923404693603516, "global_step": 277953, "epoch": 1654} {"train_loss": -11.84045124053955, "global_step": 277954, "epoch": 1654} {"train_loss": -10.978713989257812, "global_step": 277955, "epoch": 1654} {"train_loss": -11.962118148803711, "global_step": 277956, "epoch": 1654} {"train_loss": -11.678102493286133, "global_step": 277957, "epoch": 1654} {"train_loss": -11.058326721191406, "global_step": 277958, "epoch": 1654} {"train_loss": -10.023679733276367, "global_step": 277959, "epoch": 1654} {"train_loss": -11.77603530883789, "global_step": 277960, "epoch": 1654} {"train_loss": -9.427927017211914, "global_step": 277961, "epoch": 1654} {"train_loss": -9.31103515625, "global_step": 277962, "epoch": 1654} {"train_loss": -7.687893867492676, "global_step": 277963, "epoch": 1654} {"train_loss": -9.825187683105469, "global_step": 277964, "epoch": 1654} {"train_loss": -6.736758232116699, "global_step": 277965, "epoch": 1654} {"train_loss": -8.368473052978516, "global_step": 277966, "epoch": 1654} {"train_loss": -8.51005744934082, "global_step": 277967, "epoch": 1654} {"train_loss": -8.200607299804688, "global_step": 277968, "epoch": 1654} {"train_loss": -9.18420696258545, "global_step": 277969, "epoch": 1654} {"train_loss": -8.786640167236328, "global_step": 277970, "epoch": 1654} {"train_loss": -8.575702667236328, "global_step": 277971, "epoch": 1654} {"train_loss": -9.180573463439941, "global_step": 277972, "epoch": 1654} {"train_loss": -9.408445358276367, "global_step": 277973, "epoch": 1654} {"train_loss": -8.860916137695312, "global_step": 277974, "epoch": 1654} {"train_loss": -9.935367584228516, "global_step": 277975, "epoch": 1654} {"train_loss": -9.863716125488281, "global_step": 277976, "epoch": 1654} {"train_loss": -10.671904563903809, "global_step": 277977, "epoch": 1654} {"train_loss": -10.056046485900879, "global_step": 277978, "epoch": 1654} {"train_loss": -11.215252876281738, "global_step": 277979, "epoch": 1654} {"train_loss": -10.358525276184082, "global_step": 277980, "epoch": 1654} {"train_loss": -10.910249710083008, "global_step": 277981, "epoch": 1654} {"train_loss": -10.692391395568848, "global_step": 277982, "epoch": 1654} {"train_loss": -10.724441528320312, "global_step": 277983, "epoch": 1654} {"train_loss": -11.11739730834961, "global_step": 277984, "epoch": 1654} {"train_loss": -11.089942932128906, "global_step": 277985, "epoch": 1654} {"train_loss": -10.72012996673584, "global_step": 277986, "epoch": 1654} {"train_loss": -11.246480941772461, "global_step": 277987, "epoch": 1654} {"train_loss": -10.840141296386719, "global_step": 277988, "epoch": 1654} {"train_loss": -11.073391914367676, "global_step": 277989, "epoch": 1654} {"train_loss": -11.480703353881836, "global_step": 277990, "epoch": 1654} {"train_loss": -11.192802429199219, "global_step": 277991, "epoch": 1654} {"train_loss": -11.137517929077148, "global_step": 277992, "epoch": 1654} {"train_loss": -11.383091926574707, "global_step": 277993, "epoch": 1654} {"train_loss": -11.436616897583008, "global_step": 277994, "epoch": 1654} {"train_loss": -11.304405212402344, "global_step": 277995, "epoch": 1654} {"train_loss": -11.623891830444336, "global_step": 277996, "epoch": 1654} {"train_loss": -11.189887046813965, "global_step": 277997, "epoch": 1654} {"train_loss": -11.372579574584961, "global_step": 277998, "epoch": 1654} {"train_loss": -11.482965469360352, "global_step": 277999, "epoch": 1654} {"train_loss": -11.348434448242188, "global_step": 278000, "epoch": 1654} {"train_loss": -11.704553604125977, "global_step": 278001, "epoch": 1654} {"train_loss": -11.68017864227295, "global_step": 278002, "epoch": 1654} {"train_loss": -11.788761138916016, "global_step": 278003, "epoch": 1654} {"train_loss": -11.676871299743652, "global_step": 278004, "epoch": 1654} {"train_loss": -12.025045394897461, "global_step": 278005, "epoch": 1654} {"train_loss": -11.592154502868652, "global_step": 278006, "epoch": 1654} {"train_loss": -11.770669937133789, "global_step": 278007, "epoch": 1654} {"train_loss": -11.951532363891602, "global_step": 278008, "epoch": 1654} {"train_loss": -11.876897811889648, "global_step": 278009, "epoch": 1654} {"train_loss": -11.784952163696289, "global_step": 278010, "epoch": 1654} {"train_loss": -11.968871116638184, "global_step": 278011, "epoch": 1654} {"train_loss": -11.829607009887695, "global_step": 278012, "epoch": 1654} {"train_loss": -12.021352767944336, "global_step": 278013, "epoch": 1654} {"train_loss": -11.918760299682617, "global_step": 278014, "epoch": 1654} {"train_loss": -11.884171485900879, "global_step": 278015, "epoch": 1654} {"train_loss": -11.872644424438477, "global_step": 278016, "epoch": 1654} {"train_loss": -11.968762397766113, "global_step": 278017, "epoch": 1654} {"train_loss": -12.05280876159668, "global_step": 278018, "epoch": 1654} {"train_loss": -12.134489059448242, "global_step": 278019, "epoch": 1654} {"train_loss": -12.08881664276123, "global_step": 278020, "epoch": 1654} {"train_loss": -12.073362350463867, "global_step": 278021, "epoch": 1654} {"train_loss": -12.018072128295898, "global_step": 278022, "epoch": 1654} {"train_loss": -12.015449523925781, "global_step": 278023, "epoch": 1654} {"train_loss": -12.206799507141113, "global_step": 278024, "epoch": 1654} {"train_loss": -12.312731742858887, "global_step": 278025, "epoch": 1654} {"train_loss": -12.155895233154297, "global_step": 278026, "epoch": 1654} {"train_loss": -12.248329162597656, "global_step": 278027, "epoch": 1654} {"train_loss": -12.214147567749023, "global_step": 278028, "epoch": 1654} {"train_loss": -12.238675117492676, "global_step": 278029, "epoch": 1654} {"train_loss": -12.301488876342773, "global_step": 278030, "epoch": 1654} {"train_loss": -12.241368293762207, "global_step": 278031, "epoch": 1654} {"train_loss": -12.336006164550781, "global_step": 278032, "epoch": 1654} {"train_loss": -12.291540145874023, "global_step": 278033, "epoch": 1654} {"train_loss": -12.14826774597168, "global_step": 278034, "epoch": 1654} {"train_loss": -12.380748748779297, "global_step": 278035, "epoch": 1654} {"train_loss": -12.339462280273438, "global_step": 278036, "epoch": 1654} {"train_loss": -12.283062934875488, "global_step": 278037, "epoch": 1654} {"train_loss": -12.437684059143066, "global_step": 278038, "epoch": 1654} {"train_loss": -11.397464332126436, "global_step": 278039, "epoch": 1654, "val_loss": 269875.0} {"train_loss": -12.490163803100586, "global_step": 278040, "epoch": 1655} {"train_loss": -12.37332534790039, "global_step": 278041, "epoch": 1655} {"train_loss": -12.283923149108887, "global_step": 278042, "epoch": 1655} {"train_loss": -12.265196800231934, "global_step": 278043, "epoch": 1655} {"train_loss": -12.40643310546875, "global_step": 278044, "epoch": 1655} {"train_loss": -12.434497833251953, "global_step": 278045, "epoch": 1655} {"train_loss": -12.366536140441895, "global_step": 278046, "epoch": 1655} {"train_loss": -12.392997741699219, "global_step": 278047, "epoch": 1655} {"train_loss": -12.228950500488281, "global_step": 278048, "epoch": 1655} {"train_loss": -12.415929794311523, "global_step": 278049, "epoch": 1655} {"train_loss": -12.338289260864258, "global_step": 278050, "epoch": 1655} {"train_loss": -12.338761329650879, "global_step": 278051, "epoch": 1655} {"train_loss": -12.419024467468262, "global_step": 278052, "epoch": 1655} {"train_loss": -12.306374549865723, "global_step": 278053, "epoch": 1655} {"train_loss": -12.384824752807617, "global_step": 278054, "epoch": 1655} {"train_loss": -12.257524490356445, "global_step": 278055, "epoch": 1655} {"train_loss": -12.274182319641113, "global_step": 278056, "epoch": 1655} {"train_loss": -12.140124320983887, "global_step": 278057, "epoch": 1655} {"train_loss": -12.435154914855957, "global_step": 278058, "epoch": 1655} {"train_loss": -12.129846572875977, "global_step": 278059, "epoch": 1655} {"train_loss": -11.951713562011719, "global_step": 278060, "epoch": 1655} {"train_loss": -11.83082103729248, "global_step": 278061, "epoch": 1655} {"train_loss": -11.674616813659668, "global_step": 278062, "epoch": 1655} {"train_loss": -12.510469436645508, "global_step": 278063, "epoch": 1655} {"train_loss": -12.187315940856934, "global_step": 278064, "epoch": 1655} {"train_loss": -11.736810684204102, "global_step": 278065, "epoch": 1655} {"train_loss": -11.753789901733398, "global_step": 278066, "epoch": 1655} {"train_loss": -11.782394409179688, "global_step": 278067, "epoch": 1655} {"train_loss": -12.170357704162598, "global_step": 278068, "epoch": 1655} {"train_loss": -11.866621017456055, "global_step": 278069, "epoch": 1655} {"train_loss": -12.349603652954102, "global_step": 278070, "epoch": 1655} {"train_loss": -11.874410629272461, "global_step": 278071, "epoch": 1655} {"train_loss": -11.436622619628906, "global_step": 278072, "epoch": 1655} {"train_loss": -10.223247528076172, "global_step": 278073, "epoch": 1655} {"train_loss": -9.39759349822998, "global_step": 278074, "epoch": 1655} {"train_loss": -11.790180206298828, "global_step": 278075, "epoch": 1655} {"train_loss": -10.718313217163086, "global_step": 278076, "epoch": 1655} {"train_loss": -9.599019050598145, "global_step": 278077, "epoch": 1655} {"train_loss": -11.460896492004395, "global_step": 278078, "epoch": 1655} {"train_loss": -10.91065788269043, "global_step": 278079, "epoch": 1655} {"train_loss": -10.243700981140137, "global_step": 278080, "epoch": 1655} {"train_loss": -10.137533187866211, "global_step": 278081, "epoch": 1655} {"train_loss": -11.034198760986328, "global_step": 278082, "epoch": 1655} {"train_loss": -10.645601272583008, "global_step": 278083, "epoch": 1655} {"train_loss": -10.740731239318848, "global_step": 278084, "epoch": 1655} {"train_loss": -10.218048095703125, "global_step": 278085, "epoch": 1655} {"train_loss": -11.404762268066406, "global_step": 278086, "epoch": 1655} {"train_loss": -10.511550903320312, "global_step": 278087, "epoch": 1655} {"train_loss": -11.747480392456055, "global_step": 278088, "epoch": 1655} {"train_loss": -11.765575408935547, "global_step": 278089, "epoch": 1655} {"train_loss": -10.767351150512695, "global_step": 278090, "epoch": 1655} {"train_loss": -11.286465644836426, "global_step": 278091, "epoch": 1655} {"train_loss": -10.873848915100098, "global_step": 278092, "epoch": 1655} {"train_loss": -11.290231704711914, "global_step": 278093, "epoch": 1655} {"train_loss": -10.428606033325195, "global_step": 278094, "epoch": 1655} {"train_loss": -11.913224220275879, "global_step": 278095, "epoch": 1655} {"train_loss": -11.123289108276367, "global_step": 278096, "epoch": 1655} {"train_loss": -11.617754936218262, "global_step": 278097, "epoch": 1655} {"train_loss": -11.743834495544434, "global_step": 278098, "epoch": 1655} {"train_loss": -11.504152297973633, "global_step": 278099, "epoch": 1655} {"train_loss": -11.567593574523926, "global_step": 278100, "epoch": 1655} {"train_loss": -11.766773223876953, "global_step": 278101, "epoch": 1655} {"train_loss": -11.982734680175781, "global_step": 278102, "epoch": 1655} {"train_loss": -11.727436065673828, "global_step": 278103, "epoch": 1655} {"train_loss": -12.120500564575195, "global_step": 278104, "epoch": 1655} {"train_loss": -11.695960998535156, "global_step": 278105, "epoch": 1655} {"train_loss": -11.968091011047363, "global_step": 278106, "epoch": 1655} {"train_loss": -11.511478424072266, "global_step": 278107, "epoch": 1655} {"train_loss": -11.979446411132812, "global_step": 278108, "epoch": 1655} {"train_loss": -11.709115028381348, "global_step": 278109, "epoch": 1655} {"train_loss": -11.889537811279297, "global_step": 278110, "epoch": 1655} {"train_loss": -11.867134094238281, "global_step": 278111, "epoch": 1655} {"train_loss": -11.835821151733398, "global_step": 278112, "epoch": 1655} {"train_loss": -11.630709648132324, "global_step": 278113, "epoch": 1655} {"train_loss": -11.96040153503418, "global_step": 278114, "epoch": 1655} {"train_loss": -11.693748474121094, "global_step": 278115, "epoch": 1655} {"train_loss": -12.01077938079834, "global_step": 278116, "epoch": 1655} {"train_loss": -11.885536193847656, "global_step": 278117, "epoch": 1655} {"train_loss": -12.0198974609375, "global_step": 278118, "epoch": 1655} {"train_loss": -12.018051147460938, "global_step": 278119, "epoch": 1655} {"train_loss": -12.038881301879883, "global_step": 278120, "epoch": 1655} {"train_loss": -12.022090911865234, "global_step": 278121, "epoch": 1655} {"train_loss": -11.963171005249023, "global_step": 278122, "epoch": 1655} {"train_loss": -12.102180480957031, "global_step": 278123, "epoch": 1655} {"train_loss": -12.205087661743164, "global_step": 278124, "epoch": 1655} {"train_loss": -12.015819549560547, "global_step": 278125, "epoch": 1655} {"train_loss": -11.841344833374023, "global_step": 278126, "epoch": 1655} {"train_loss": -11.58840560913086, "global_step": 278127, "epoch": 1655} {"train_loss": -12.01371955871582, "global_step": 278128, "epoch": 1655} {"train_loss": -12.302759170532227, "global_step": 278129, "epoch": 1655} {"train_loss": -11.84680461883545, "global_step": 278130, "epoch": 1655} {"train_loss": -12.323776245117188, "global_step": 278131, "epoch": 1655} {"train_loss": -11.961344718933105, "global_step": 278132, "epoch": 1655} {"train_loss": -11.973445892333984, "global_step": 278133, "epoch": 1655} {"train_loss": -12.016667366027832, "global_step": 278134, "epoch": 1655} {"train_loss": -12.322620391845703, "global_step": 278135, "epoch": 1655} {"train_loss": -11.828383445739746, "global_step": 278136, "epoch": 1655} {"train_loss": -12.278022766113281, "global_step": 278137, "epoch": 1655} {"train_loss": -11.880440711975098, "global_step": 278138, "epoch": 1655} {"train_loss": -11.967177391052246, "global_step": 278139, "epoch": 1655} {"train_loss": -12.055383682250977, "global_step": 278140, "epoch": 1655} {"train_loss": -11.8688383102417, "global_step": 278141, "epoch": 1655} {"train_loss": -12.170086860656738, "global_step": 278142, "epoch": 1655} {"train_loss": -11.92190170288086, "global_step": 278143, "epoch": 1655} {"train_loss": -11.70107650756836, "global_step": 278144, "epoch": 1655} {"train_loss": -12.013030052185059, "global_step": 278145, "epoch": 1655} {"train_loss": -12.036334991455078, "global_step": 278146, "epoch": 1655} {"train_loss": -11.856754302978516, "global_step": 278147, "epoch": 1655} {"train_loss": -11.876564979553223, "global_step": 278148, "epoch": 1655} {"train_loss": -11.82867431640625, "global_step": 278149, "epoch": 1655} {"train_loss": -11.760859489440918, "global_step": 278150, "epoch": 1655} {"train_loss": -12.251269340515137, "global_step": 278151, "epoch": 1655} {"train_loss": -11.893539428710938, "global_step": 278152, "epoch": 1655} {"train_loss": -12.143207550048828, "global_step": 278153, "epoch": 1655} {"train_loss": -12.208430290222168, "global_step": 278154, "epoch": 1655} {"train_loss": -12.171455383300781, "global_step": 278155, "epoch": 1655} {"train_loss": -12.015803337097168, "global_step": 278156, "epoch": 1655} {"train_loss": -12.271926879882812, "global_step": 278157, "epoch": 1655} {"train_loss": -11.880058288574219, "global_step": 278158, "epoch": 1655} {"train_loss": -12.373010635375977, "global_step": 278159, "epoch": 1655} {"train_loss": -11.925640106201172, "global_step": 278160, "epoch": 1655} {"train_loss": -12.031026840209961, "global_step": 278161, "epoch": 1655} {"train_loss": -11.87203598022461, "global_step": 278162, "epoch": 1655} {"train_loss": -11.785605430603027, "global_step": 278163, "epoch": 1655} {"train_loss": -12.01169490814209, "global_step": 278164, "epoch": 1655} {"train_loss": -11.941082000732422, "global_step": 278165, "epoch": 1655} {"train_loss": -12.008275032043457, "global_step": 278166, "epoch": 1655} {"train_loss": -11.995075225830078, "global_step": 278167, "epoch": 1655} {"train_loss": -12.24761962890625, "global_step": 278168, "epoch": 1655} {"train_loss": -11.78550910949707, "global_step": 278169, "epoch": 1655} {"train_loss": -11.963516235351562, "global_step": 278170, "epoch": 1655} {"train_loss": -11.873618125915527, "global_step": 278171, "epoch": 1655} {"train_loss": -11.614706039428711, "global_step": 278172, "epoch": 1655} {"train_loss": -11.544390678405762, "global_step": 278173, "epoch": 1655} {"train_loss": -11.452596664428711, "global_step": 278174, "epoch": 1655} {"train_loss": -11.776280403137207, "global_step": 278175, "epoch": 1655} {"train_loss": -11.858774185180664, "global_step": 278176, "epoch": 1655} {"train_loss": -11.767549514770508, "global_step": 278177, "epoch": 1655} {"train_loss": -12.171052932739258, "global_step": 278178, "epoch": 1655} {"train_loss": -12.095996856689453, "global_step": 278179, "epoch": 1655} {"train_loss": -11.639389991760254, "global_step": 278180, "epoch": 1655} {"train_loss": -11.821818351745605, "global_step": 278181, "epoch": 1655} {"train_loss": -12.283052444458008, "global_step": 278182, "epoch": 1655} {"train_loss": -11.887670516967773, "global_step": 278183, "epoch": 1655} {"train_loss": -11.97688102722168, "global_step": 278184, "epoch": 1655} {"train_loss": -12.216641426086426, "global_step": 278185, "epoch": 1655} {"train_loss": -11.98103141784668, "global_step": 278186, "epoch": 1655} {"train_loss": -11.557414054870605, "global_step": 278187, "epoch": 1655} {"train_loss": -11.570699691772461, "global_step": 278188, "epoch": 1655} {"train_loss": -11.967218399047852, "global_step": 278189, "epoch": 1655} {"train_loss": -11.893301010131836, "global_step": 278190, "epoch": 1655} {"train_loss": -11.39024543762207, "global_step": 278191, "epoch": 1655} {"train_loss": -12.119558334350586, "global_step": 278192, "epoch": 1655} {"train_loss": -11.647764205932617, "global_step": 278193, "epoch": 1655} {"train_loss": -12.115324020385742, "global_step": 278194, "epoch": 1655} {"train_loss": -11.309831619262695, "global_step": 278195, "epoch": 1655} {"train_loss": -11.89583969116211, "global_step": 278196, "epoch": 1655} {"train_loss": -11.928449630737305, "global_step": 278197, "epoch": 1655} {"train_loss": -11.829673767089844, "global_step": 278198, "epoch": 1655} {"train_loss": -10.936332702636719, "global_step": 278199, "epoch": 1655} {"train_loss": -9.428306579589844, "global_step": 278200, "epoch": 1655} {"train_loss": -8.925077438354492, "global_step": 278201, "epoch": 1655} {"train_loss": -9.615091323852539, "global_step": 278202, "epoch": 1655} {"train_loss": -9.45889663696289, "global_step": 278203, "epoch": 1655} {"train_loss": -10.84988784790039, "global_step": 278204, "epoch": 1655} {"train_loss": -9.956987380981445, "global_step": 278205, "epoch": 1655} {"train_loss": -10.513320922851562, "global_step": 278206, "epoch": 1655} {"train_loss": -11.716091700962611, "global_step": 278207, "epoch": 1655, "val_loss": 269252.0625, "train_action_mse_error": 5.383930683135986} {"train_loss": -10.403009414672852, "global_step": 278208, "epoch": 1656} {"train_loss": -11.027219772338867, "global_step": 278209, "epoch": 1656} {"train_loss": -10.548786163330078, "global_step": 278210, "epoch": 1656} {"train_loss": -10.088281631469727, "global_step": 278211, "epoch": 1656} {"train_loss": -11.360003471374512, "global_step": 278212, "epoch": 1656} {"train_loss": -10.864421844482422, "global_step": 278213, "epoch": 1656} {"train_loss": -11.212862968444824, "global_step": 278214, "epoch": 1656} {"train_loss": -9.887296676635742, "global_step": 278215, "epoch": 1656} {"train_loss": -11.04665470123291, "global_step": 278216, "epoch": 1656} {"train_loss": -9.507613182067871, "global_step": 278217, "epoch": 1656} {"train_loss": -10.436948776245117, "global_step": 278218, "epoch": 1656} {"train_loss": -10.590557098388672, "global_step": 278219, "epoch": 1656} {"train_loss": -10.78342056274414, "global_step": 278220, "epoch": 1656} {"train_loss": -9.815153121948242, "global_step": 278221, "epoch": 1656} {"train_loss": -10.469038963317871, "global_step": 278222, "epoch": 1656} {"train_loss": -10.876771926879883, "global_step": 278223, "epoch": 1656} {"train_loss": -11.206851959228516, "global_step": 278224, "epoch": 1656} {"train_loss": -10.40999984741211, "global_step": 278225, "epoch": 1656} {"train_loss": -10.251945495605469, "global_step": 278226, "epoch": 1656} {"train_loss": -11.28628158569336, "global_step": 278227, "epoch": 1656} {"train_loss": -11.193408012390137, "global_step": 278228, "epoch": 1656} {"train_loss": -11.661506652832031, "global_step": 278229, "epoch": 1656} {"train_loss": -10.68826675415039, "global_step": 278230, "epoch": 1656} {"train_loss": -11.308748245239258, "global_step": 278231, "epoch": 1656} {"train_loss": -10.810234069824219, "global_step": 278232, "epoch": 1656} {"train_loss": -11.354924201965332, "global_step": 278233, "epoch": 1656} {"train_loss": -11.17014217376709, "global_step": 278234, "epoch": 1656} {"train_loss": -11.26491928100586, "global_step": 278235, "epoch": 1656} {"train_loss": -11.412254333496094, "global_step": 278236, "epoch": 1656} {"train_loss": -11.707213401794434, "global_step": 278237, "epoch": 1656} {"train_loss": -11.376070022583008, "global_step": 278238, "epoch": 1656} {"train_loss": -11.805309295654297, "global_step": 278239, "epoch": 1656} {"train_loss": -11.420980453491211, "global_step": 278240, "epoch": 1656} {"train_loss": -11.483844757080078, "global_step": 278241, "epoch": 1656} {"train_loss": -11.736210823059082, "global_step": 278242, "epoch": 1656} {"train_loss": -11.494775772094727, "global_step": 278243, "epoch": 1656} {"train_loss": -11.991952896118164, "global_step": 278244, "epoch": 1656} {"train_loss": -11.462047576904297, "global_step": 278245, "epoch": 1656} {"train_loss": -11.61392593383789, "global_step": 278246, "epoch": 1656} {"train_loss": -11.791994094848633, "global_step": 278247, "epoch": 1656} {"train_loss": -11.71622085571289, "global_step": 278248, "epoch": 1656} {"train_loss": -11.670818328857422, "global_step": 278249, "epoch": 1656} {"train_loss": -11.840431213378906, "global_step": 278250, "epoch": 1656} {"train_loss": -11.460922241210938, "global_step": 278251, "epoch": 1656} {"train_loss": -11.960217475891113, "global_step": 278252, "epoch": 1656} {"train_loss": -11.680485725402832, "global_step": 278253, "epoch": 1656} {"train_loss": -11.703189849853516, "global_step": 278254, "epoch": 1656} {"train_loss": -11.774239540100098, "global_step": 278255, "epoch": 1656} {"train_loss": -11.904228210449219, "global_step": 278256, "epoch": 1656} {"train_loss": -12.013976097106934, "global_step": 278257, "epoch": 1656} {"train_loss": -11.63431167602539, "global_step": 278258, "epoch": 1656} {"train_loss": -11.993192672729492, "global_step": 278259, "epoch": 1656} {"train_loss": -11.437349319458008, "global_step": 278260, "epoch": 1656} {"train_loss": -12.08693790435791, "global_step": 278261, "epoch": 1656} {"train_loss": -11.932440757751465, "global_step": 278262, "epoch": 1656} {"train_loss": -11.799732208251953, "global_step": 278263, "epoch": 1656} {"train_loss": -11.81638240814209, "global_step": 278264, "epoch": 1656} {"train_loss": -11.922242164611816, "global_step": 278265, "epoch": 1656} {"train_loss": -11.854236602783203, "global_step": 278266, "epoch": 1656} {"train_loss": -11.957101821899414, "global_step": 278267, "epoch": 1656} {"train_loss": -11.900186538696289, "global_step": 278268, "epoch": 1656} {"train_loss": -12.071842193603516, "global_step": 278269, "epoch": 1656} {"train_loss": -11.77674674987793, "global_step": 278270, "epoch": 1656} {"train_loss": -12.102210998535156, "global_step": 278271, "epoch": 1656} {"train_loss": -11.972505569458008, "global_step": 278272, "epoch": 1656} {"train_loss": -12.119266510009766, "global_step": 278273, "epoch": 1656} {"train_loss": -11.984909057617188, "global_step": 278274, "epoch": 1656} {"train_loss": -11.985550880432129, "global_step": 278275, "epoch": 1656} {"train_loss": -11.95798110961914, "global_step": 278276, "epoch": 1656} {"train_loss": -12.180388450622559, "global_step": 278277, "epoch": 1656} {"train_loss": -12.24676513671875, "global_step": 278278, "epoch": 1656} {"train_loss": -12.073122024536133, "global_step": 278279, "epoch": 1656} {"train_loss": -12.051252365112305, "global_step": 278280, "epoch": 1656} {"train_loss": -12.002311706542969, "global_step": 278281, "epoch": 1656} {"train_loss": -11.787002563476562, "global_step": 278282, "epoch": 1656} {"train_loss": -12.169073104858398, "global_step": 278283, "epoch": 1656} {"train_loss": -12.311524391174316, "global_step": 278284, "epoch": 1656} {"train_loss": -11.867584228515625, "global_step": 278285, "epoch": 1656} {"train_loss": -12.079429626464844, "global_step": 278286, "epoch": 1656} {"train_loss": -11.905689239501953, "global_step": 278287, "epoch": 1656} {"train_loss": -12.184968948364258, "global_step": 278288, "epoch": 1656} {"train_loss": -12.133369445800781, "global_step": 278289, "epoch": 1656} {"train_loss": -12.266292572021484, "global_step": 278290, "epoch": 1656} {"train_loss": -12.13194465637207, "global_step": 278291, "epoch": 1656} {"train_loss": -12.07370662689209, "global_step": 278292, "epoch": 1656} {"train_loss": -12.29149055480957, "global_step": 278293, "epoch": 1656} {"train_loss": -11.859370231628418, "global_step": 278294, "epoch": 1656} {"train_loss": -12.04703140258789, "global_step": 278295, "epoch": 1656} {"train_loss": -11.897998809814453, "global_step": 278296, "epoch": 1656} {"train_loss": -12.313679695129395, "global_step": 278297, "epoch": 1656} {"train_loss": -11.99140739440918, "global_step": 278298, "epoch": 1656} {"train_loss": -12.159479141235352, "global_step": 278299, "epoch": 1656} {"train_loss": -12.213483810424805, "global_step": 278300, "epoch": 1656} {"train_loss": -12.347223281860352, "global_step": 278301, "epoch": 1656} {"train_loss": -12.187835693359375, "global_step": 278302, "epoch": 1656} {"train_loss": -11.996065139770508, "global_step": 278303, "epoch": 1656} {"train_loss": -12.002068519592285, "global_step": 278304, "epoch": 1656} {"train_loss": -11.99238395690918, "global_step": 278305, "epoch": 1656} {"train_loss": -12.294269561767578, "global_step": 278306, "epoch": 1656} {"train_loss": -12.013471603393555, "global_step": 278307, "epoch": 1656} {"train_loss": -12.077005386352539, "global_step": 278308, "epoch": 1656} {"train_loss": -12.310820579528809, "global_step": 278309, "epoch": 1656} {"train_loss": -12.203384399414062, "global_step": 278310, "epoch": 1656} {"train_loss": -11.952065467834473, "global_step": 278311, "epoch": 1656} {"train_loss": -11.731207847595215, "global_step": 278312, "epoch": 1656} {"train_loss": -11.967605590820312, "global_step": 278313, "epoch": 1656} {"train_loss": -12.05843448638916, "global_step": 278314, "epoch": 1656} {"train_loss": -11.998292922973633, "global_step": 278315, "epoch": 1656} {"train_loss": -11.945454597473145, "global_step": 278316, "epoch": 1656} {"train_loss": -11.725198745727539, "global_step": 278317, "epoch": 1656} {"train_loss": -11.522615432739258, "global_step": 278318, "epoch": 1656} {"train_loss": -11.817753791809082, "global_step": 278319, "epoch": 1656} {"train_loss": -11.828176498413086, "global_step": 278320, "epoch": 1656} {"train_loss": -11.86842155456543, "global_step": 278321, "epoch": 1656} {"train_loss": -12.045467376708984, "global_step": 278322, "epoch": 1656} {"train_loss": -11.937039375305176, "global_step": 278323, "epoch": 1656} {"train_loss": -12.272537231445312, "global_step": 278324, "epoch": 1656} {"train_loss": -11.81995964050293, "global_step": 278325, "epoch": 1656} {"train_loss": -11.186243057250977, "global_step": 278326, "epoch": 1656} {"train_loss": -12.049846649169922, "global_step": 278327, "epoch": 1656} {"train_loss": -11.22755241394043, "global_step": 278328, "epoch": 1656} {"train_loss": -10.572647094726562, "global_step": 278329, "epoch": 1656} {"train_loss": -11.976381301879883, "global_step": 278330, "epoch": 1656} {"train_loss": -9.570572853088379, "global_step": 278331, "epoch": 1656} {"train_loss": -10.803487777709961, "global_step": 278332, "epoch": 1656} {"train_loss": -10.83384895324707, "global_step": 278333, "epoch": 1656} {"train_loss": -10.339113235473633, "global_step": 278334, "epoch": 1656} {"train_loss": -9.062626838684082, "global_step": 278335, "epoch": 1656} {"train_loss": -10.556002616882324, "global_step": 278336, "epoch": 1656} {"train_loss": -9.19559097290039, "global_step": 278337, "epoch": 1656} {"train_loss": -9.150895118713379, "global_step": 278338, "epoch": 1656} {"train_loss": -9.983985900878906, "global_step": 278339, "epoch": 1656} {"train_loss": -9.93311882019043, "global_step": 278340, "epoch": 1656} {"train_loss": -8.35439682006836, "global_step": 278341, "epoch": 1656} {"train_loss": -9.909835815429688, "global_step": 278342, "epoch": 1656} {"train_loss": -9.444177627563477, "global_step": 278343, "epoch": 1656} {"train_loss": -9.39755916595459, "global_step": 278344, "epoch": 1656} {"train_loss": -10.074262619018555, "global_step": 278345, "epoch": 1656} {"train_loss": -8.96261978149414, "global_step": 278346, "epoch": 1656} {"train_loss": -8.726932525634766, "global_step": 278347, "epoch": 1656} {"train_loss": -10.935176849365234, "global_step": 278348, "epoch": 1656} {"train_loss": -9.949828147888184, "global_step": 278349, "epoch": 1656} {"train_loss": -10.181941986083984, "global_step": 278350, "epoch": 1656} {"train_loss": -9.921531677246094, "global_step": 278351, "epoch": 1656} {"train_loss": -10.762381553649902, "global_step": 278352, "epoch": 1656} {"train_loss": -10.359731674194336, "global_step": 278353, "epoch": 1656} {"train_loss": -11.54486083984375, "global_step": 278354, "epoch": 1656} {"train_loss": -10.30925464630127, "global_step": 278355, "epoch": 1656} {"train_loss": -11.112361907958984, "global_step": 278356, "epoch": 1656} {"train_loss": -10.505395889282227, "global_step": 278357, "epoch": 1656} {"train_loss": -11.591935157775879, "global_step": 278358, "epoch": 1656} {"train_loss": -10.821084976196289, "global_step": 278359, "epoch": 1656} {"train_loss": -11.36074447631836, "global_step": 278360, "epoch": 1656} {"train_loss": -11.556524276733398, "global_step": 278361, "epoch": 1656} {"train_loss": -11.616928100585938, "global_step": 278362, "epoch": 1656} {"train_loss": -11.511452674865723, "global_step": 278363, "epoch": 1656} {"train_loss": -11.65009880065918, "global_step": 278364, "epoch": 1656} {"train_loss": -11.526861190795898, "global_step": 278365, "epoch": 1656} {"train_loss": -11.55593490600586, "global_step": 278366, "epoch": 1656} {"train_loss": -11.766128540039062, "global_step": 278367, "epoch": 1656} {"train_loss": -11.645208358764648, "global_step": 278368, "epoch": 1656} {"train_loss": -11.535811424255371, "global_step": 278369, "epoch": 1656} {"train_loss": -11.554443359375, "global_step": 278370, "epoch": 1656} {"train_loss": -11.70322036743164, "global_step": 278371, "epoch": 1656} {"train_loss": -11.715224266052246, "global_step": 278372, "epoch": 1656} {"train_loss": -11.650083541870117, "global_step": 278373, "epoch": 1656} {"train_loss": -11.790290832519531, "global_step": 278374, "epoch": 1656} {"train_loss": -11.368489231382098, "global_step": 278375, "epoch": 1656, "val_loss": 268089.21875} {"train_loss": -11.861746788024902, "global_step": 278376, "epoch": 1657} {"train_loss": -11.769668579101562, "global_step": 278377, "epoch": 1657} {"train_loss": -11.97410774230957, "global_step": 278378, "epoch": 1657} {"train_loss": -11.716897964477539, "global_step": 278379, "epoch": 1657} {"train_loss": -11.98210334777832, "global_step": 278380, "epoch": 1657} {"train_loss": -11.592803001403809, "global_step": 278381, "epoch": 1657} {"train_loss": -11.903560638427734, "global_step": 278382, "epoch": 1657} {"train_loss": -11.946828842163086, "global_step": 278383, "epoch": 1657} {"train_loss": -11.902366638183594, "global_step": 278384, "epoch": 1657} {"train_loss": -11.942441940307617, "global_step": 278385, "epoch": 1657} {"train_loss": -11.976598739624023, "global_step": 278386, "epoch": 1657} {"train_loss": -11.723764419555664, "global_step": 278387, "epoch": 1657} {"train_loss": -12.150057792663574, "global_step": 278388, "epoch": 1657} {"train_loss": -11.947479248046875, "global_step": 278389, "epoch": 1657} {"train_loss": -11.826889038085938, "global_step": 278390, "epoch": 1657} {"train_loss": -11.843218803405762, "global_step": 278391, "epoch": 1657} {"train_loss": -11.945785522460938, "global_step": 278392, "epoch": 1657} {"train_loss": -11.863565444946289, "global_step": 278393, "epoch": 1657} {"train_loss": -12.061857223510742, "global_step": 278394, "epoch": 1657} {"train_loss": -12.209067344665527, "global_step": 278395, "epoch": 1657} {"train_loss": -11.92817497253418, "global_step": 278396, "epoch": 1657} {"train_loss": -11.92779541015625, "global_step": 278397, "epoch": 1657} {"train_loss": -11.953191757202148, "global_step": 278398, "epoch": 1657} {"train_loss": -12.077962875366211, "global_step": 278399, "epoch": 1657} {"train_loss": -12.119668006896973, "global_step": 278400, "epoch": 1657} {"train_loss": -12.115720748901367, "global_step": 278401, "epoch": 1657} {"train_loss": -12.11331558227539, "global_step": 278402, "epoch": 1657} {"train_loss": -12.24997329711914, "global_step": 278403, "epoch": 1657} {"train_loss": -12.185357093811035, "global_step": 278404, "epoch": 1657} {"train_loss": -12.031737327575684, "global_step": 278405, "epoch": 1657} {"train_loss": -12.197935104370117, "global_step": 278406, "epoch": 1657} {"train_loss": -12.192548751831055, "global_step": 278407, "epoch": 1657} {"train_loss": -12.200682640075684, "global_step": 278408, "epoch": 1657} {"train_loss": -12.19918441772461, "global_step": 278409, "epoch": 1657} {"train_loss": -12.061363220214844, "global_step": 278410, "epoch": 1657} {"train_loss": -12.328251838684082, "global_step": 278411, "epoch": 1657} {"train_loss": -12.06662368774414, "global_step": 278412, "epoch": 1657} {"train_loss": -12.226739883422852, "global_step": 278413, "epoch": 1657} {"train_loss": -12.088074684143066, "global_step": 278414, "epoch": 1657} {"train_loss": -11.985499382019043, "global_step": 278415, "epoch": 1657} {"train_loss": -12.153685569763184, "global_step": 278416, "epoch": 1657} {"train_loss": -11.415427207946777, "global_step": 278417, "epoch": 1657} {"train_loss": -12.123172760009766, "global_step": 278418, "epoch": 1657} {"train_loss": -12.053665161132812, "global_step": 278419, "epoch": 1657} {"train_loss": -11.792547225952148, "global_step": 278420, "epoch": 1657} {"train_loss": -12.132532119750977, "global_step": 278421, "epoch": 1657} {"train_loss": -11.874574661254883, "global_step": 278422, "epoch": 1657} {"train_loss": -12.212996482849121, "global_step": 278423, "epoch": 1657} {"train_loss": -12.19747543334961, "global_step": 278424, "epoch": 1657} {"train_loss": -12.397050857543945, "global_step": 278425, "epoch": 1657} {"train_loss": -12.222301483154297, "global_step": 278426, "epoch": 1657} {"train_loss": -12.257014274597168, "global_step": 278427, "epoch": 1657} {"train_loss": -12.286589622497559, "global_step": 278428, "epoch": 1657} {"train_loss": -11.835916519165039, "global_step": 278429, "epoch": 1657} {"train_loss": -12.005642890930176, "global_step": 278430, "epoch": 1657} {"train_loss": -12.24930477142334, "global_step": 278431, "epoch": 1657} {"train_loss": -12.298652648925781, "global_step": 278432, "epoch": 1657} {"train_loss": -11.961458206176758, "global_step": 278433, "epoch": 1657} {"train_loss": -12.319318771362305, "global_step": 278434, "epoch": 1657} {"train_loss": -12.364168167114258, "global_step": 278435, "epoch": 1657} {"train_loss": -12.199397087097168, "global_step": 278436, "epoch": 1657} {"train_loss": -12.360607147216797, "global_step": 278437, "epoch": 1657} {"train_loss": -12.358758926391602, "global_step": 278438, "epoch": 1657} {"train_loss": -12.36525821685791, "global_step": 278439, "epoch": 1657} {"train_loss": -12.313291549682617, "global_step": 278440, "epoch": 1657} {"train_loss": -12.40534782409668, "global_step": 278441, "epoch": 1657} {"train_loss": -12.164229393005371, "global_step": 278442, "epoch": 1657} {"train_loss": -12.31234359741211, "global_step": 278443, "epoch": 1657} {"train_loss": -12.104070663452148, "global_step": 278444, "epoch": 1657} {"train_loss": -12.19594955444336, "global_step": 278445, "epoch": 1657} {"train_loss": -12.464399337768555, "global_step": 278446, "epoch": 1657} {"train_loss": -12.561179161071777, "global_step": 278447, "epoch": 1657} {"train_loss": -12.393963813781738, "global_step": 278448, "epoch": 1657} {"train_loss": -12.277854919433594, "global_step": 278449, "epoch": 1657} {"train_loss": -12.481151580810547, "global_step": 278450, "epoch": 1657} {"train_loss": -12.473538398742676, "global_step": 278451, "epoch": 1657} {"train_loss": -12.191987037658691, "global_step": 278452, "epoch": 1657} {"train_loss": -12.315549850463867, "global_step": 278453, "epoch": 1657} {"train_loss": -12.42756462097168, "global_step": 278454, "epoch": 1657} {"train_loss": -12.447568893432617, "global_step": 278455, "epoch": 1657} {"train_loss": -12.398295402526855, "global_step": 278456, "epoch": 1657} {"train_loss": -12.187919616699219, "global_step": 278457, "epoch": 1657} {"train_loss": -12.199708938598633, "global_step": 278458, "epoch": 1657} {"train_loss": -12.23857307434082, "global_step": 278459, "epoch": 1657} {"train_loss": -12.144043922424316, "global_step": 278460, "epoch": 1657} {"train_loss": -12.19009017944336, "global_step": 278461, "epoch": 1657} {"train_loss": -12.403255462646484, "global_step": 278462, "epoch": 1657} {"train_loss": -12.321099281311035, "global_step": 278463, "epoch": 1657} {"train_loss": -12.022665977478027, "global_step": 278464, "epoch": 1657} {"train_loss": -11.82302188873291, "global_step": 278465, "epoch": 1657} {"train_loss": -12.340376853942871, "global_step": 278466, "epoch": 1657} {"train_loss": -12.115610122680664, "global_step": 278467, "epoch": 1657} {"train_loss": -11.832876205444336, "global_step": 278468, "epoch": 1657} {"train_loss": -11.597695350646973, "global_step": 278469, "epoch": 1657} {"train_loss": -12.034293174743652, "global_step": 278470, "epoch": 1657} {"train_loss": -12.09952163696289, "global_step": 278471, "epoch": 1657} {"train_loss": -12.284082412719727, "global_step": 278472, "epoch": 1657} {"train_loss": -12.072380065917969, "global_step": 278473, "epoch": 1657} {"train_loss": -12.384410858154297, "global_step": 278474, "epoch": 1657} {"train_loss": -11.410832405090332, "global_step": 278475, "epoch": 1657} {"train_loss": -10.007814407348633, "global_step": 278476, "epoch": 1657} {"train_loss": -10.154013633728027, "global_step": 278477, "epoch": 1657} {"train_loss": -9.815279006958008, "global_step": 278478, "epoch": 1657} {"train_loss": -9.276588439941406, "global_step": 278479, "epoch": 1657} {"train_loss": -11.601970672607422, "global_step": 278480, "epoch": 1657} {"train_loss": -7.5602874755859375, "global_step": 278481, "epoch": 1657} {"train_loss": -9.511541366577148, "global_step": 278482, "epoch": 1657} {"train_loss": -8.62909984588623, "global_step": 278483, "epoch": 1657} {"train_loss": -8.749532699584961, "global_step": 278484, "epoch": 1657} {"train_loss": -6.892948150634766, "global_step": 278485, "epoch": 1657} {"train_loss": -6.5268707275390625, "global_step": 278486, "epoch": 1657} {"train_loss": -7.0338029861450195, "global_step": 278487, "epoch": 1657} {"train_loss": -7.307008743286133, "global_step": 278488, "epoch": 1657} {"train_loss": -8.356657028198242, "global_step": 278489, "epoch": 1657} {"train_loss": -7.274444580078125, "global_step": 278490, "epoch": 1657} {"train_loss": -7.648945331573486, "global_step": 278491, "epoch": 1657} {"train_loss": -7.165065765380859, "global_step": 278492, "epoch": 1657} {"train_loss": -7.0319671630859375, "global_step": 278493, "epoch": 1657} {"train_loss": -7.1466240882873535, "global_step": 278494, "epoch": 1657} {"train_loss": -7.248123645782471, "global_step": 278495, "epoch": 1657} {"train_loss": -7.948775291442871, "global_step": 278496, "epoch": 1657} {"train_loss": -7.861575126647949, "global_step": 278497, "epoch": 1657} {"train_loss": -7.2127790451049805, "global_step": 278498, "epoch": 1657} {"train_loss": -8.06272029876709, "global_step": 278499, "epoch": 1657} {"train_loss": -8.461511611938477, "global_step": 278500, "epoch": 1657} {"train_loss": -8.126614570617676, "global_step": 278501, "epoch": 1657} {"train_loss": -8.940848350524902, "global_step": 278502, "epoch": 1657} {"train_loss": -8.620162963867188, "global_step": 278503, "epoch": 1657} {"train_loss": -8.554325103759766, "global_step": 278504, "epoch": 1657} {"train_loss": -9.236452102661133, "global_step": 278505, "epoch": 1657} {"train_loss": -9.629438400268555, "global_step": 278506, "epoch": 1657} {"train_loss": -8.503795623779297, "global_step": 278507, "epoch": 1657} {"train_loss": -9.285957336425781, "global_step": 278508, "epoch": 1657} {"train_loss": -10.144697189331055, "global_step": 278509, "epoch": 1657} {"train_loss": -9.331790924072266, "global_step": 278510, "epoch": 1657} {"train_loss": -9.894659042358398, "global_step": 278511, "epoch": 1657} {"train_loss": -10.49404239654541, "global_step": 278512, "epoch": 1657} {"train_loss": -10.114641189575195, "global_step": 278513, "epoch": 1657} {"train_loss": -10.77046012878418, "global_step": 278514, "epoch": 1657} {"train_loss": -9.939935684204102, "global_step": 278515, "epoch": 1657} {"train_loss": -10.215353965759277, "global_step": 278516, "epoch": 1657} {"train_loss": -10.615163803100586, "global_step": 278517, "epoch": 1657} {"train_loss": -9.725726127624512, "global_step": 278518, "epoch": 1657} {"train_loss": -10.827816009521484, "global_step": 278519, "epoch": 1657} {"train_loss": -10.606978416442871, "global_step": 278520, "epoch": 1657} {"train_loss": -10.69301700592041, "global_step": 278521, "epoch": 1657} {"train_loss": -10.270960807800293, "global_step": 278522, "epoch": 1657} {"train_loss": -11.133563041687012, "global_step": 278523, "epoch": 1657} {"train_loss": -11.177316665649414, "global_step": 278524, "epoch": 1657} {"train_loss": -11.004042625427246, "global_step": 278525, "epoch": 1657} {"train_loss": -11.119656562805176, "global_step": 278526, "epoch": 1657} {"train_loss": -11.579804420471191, "global_step": 278527, "epoch": 1657} {"train_loss": -11.473990440368652, "global_step": 278528, "epoch": 1657} {"train_loss": -11.458253860473633, "global_step": 278529, "epoch": 1657} {"train_loss": -11.133539199829102, "global_step": 278530, "epoch": 1657} {"train_loss": -11.517599105834961, "global_step": 278531, "epoch": 1657} {"train_loss": -11.452752113342285, "global_step": 278532, "epoch": 1657} {"train_loss": -11.54350757598877, "global_step": 278533, "epoch": 1657} {"train_loss": -11.526960372924805, "global_step": 278534, "epoch": 1657} {"train_loss": -11.075218200683594, "global_step": 278535, "epoch": 1657} {"train_loss": -11.476110458374023, "global_step": 278536, "epoch": 1657} {"train_loss": -11.658636093139648, "global_step": 278537, "epoch": 1657} {"train_loss": -11.486288070678711, "global_step": 278538, "epoch": 1657} {"train_loss": -11.529058456420898, "global_step": 278539, "epoch": 1657} {"train_loss": -11.837475776672363, "global_step": 278540, "epoch": 1657} {"train_loss": -11.653593063354492, "global_step": 278541, "epoch": 1657} {"train_loss": -11.414300918579102, "global_step": 278542, "epoch": 1657} {"train_loss": -11.13228959980465, "global_step": 278543, "epoch": 1657, "val_loss": 276567.59375} {"train_loss": -11.752952575683594, "global_step": 278544, "epoch": 1658} {"train_loss": -11.56161880493164, "global_step": 278545, "epoch": 1658} {"train_loss": -11.644491195678711, "global_step": 278546, "epoch": 1658} {"train_loss": -11.655818939208984, "global_step": 278547, "epoch": 1658} {"train_loss": -11.689165115356445, "global_step": 278548, "epoch": 1658} {"train_loss": -11.881080627441406, "global_step": 278549, "epoch": 1658} {"train_loss": -11.646271705627441, "global_step": 278550, "epoch": 1658} {"train_loss": -11.750598907470703, "global_step": 278551, "epoch": 1658} {"train_loss": -11.623857498168945, "global_step": 278552, "epoch": 1658} {"train_loss": -11.850177764892578, "global_step": 278553, "epoch": 1658} {"train_loss": -11.780095100402832, "global_step": 278554, "epoch": 1658} {"train_loss": -11.634991645812988, "global_step": 278555, "epoch": 1658} {"train_loss": -11.828912734985352, "global_step": 278556, "epoch": 1658} {"train_loss": -11.76118278503418, "global_step": 278557, "epoch": 1658} {"train_loss": -11.95077896118164, "global_step": 278558, "epoch": 1658} {"train_loss": -11.930912017822266, "global_step": 278559, "epoch": 1658} {"train_loss": -11.779889106750488, "global_step": 278560, "epoch": 1658} {"train_loss": -11.881929397583008, "global_step": 278561, "epoch": 1658} {"train_loss": -11.933539390563965, "global_step": 278562, "epoch": 1658} {"train_loss": -11.830110549926758, "global_step": 278563, "epoch": 1658} {"train_loss": -11.998123168945312, "global_step": 278564, "epoch": 1658} {"train_loss": -11.862491607666016, "global_step": 278565, "epoch": 1658} {"train_loss": -11.996660232543945, "global_step": 278566, "epoch": 1658} {"train_loss": -11.923537254333496, "global_step": 278567, "epoch": 1658} {"train_loss": -12.020898818969727, "global_step": 278568, "epoch": 1658} {"train_loss": -12.06344223022461, "global_step": 278569, "epoch": 1658} {"train_loss": -11.939596176147461, "global_step": 278570, "epoch": 1658} {"train_loss": -11.761737823486328, "global_step": 278571, "epoch": 1658} {"train_loss": -12.11069107055664, "global_step": 278572, "epoch": 1658} {"train_loss": -11.847915649414062, "global_step": 278573, "epoch": 1658} {"train_loss": -12.005192756652832, "global_step": 278574, "epoch": 1658} {"train_loss": -11.870737075805664, "global_step": 278575, "epoch": 1658} {"train_loss": -12.084205627441406, "global_step": 278576, "epoch": 1658} {"train_loss": -12.012052536010742, "global_step": 278577, "epoch": 1658} {"train_loss": -12.14161491394043, "global_step": 278578, "epoch": 1658} {"train_loss": -11.742507934570312, "global_step": 278579, "epoch": 1658} {"train_loss": -12.202333450317383, "global_step": 278580, "epoch": 1658} {"train_loss": -11.870194435119629, "global_step": 278581, "epoch": 1658} {"train_loss": -12.137489318847656, "global_step": 278582, "epoch": 1658} {"train_loss": -12.030130386352539, "global_step": 278583, "epoch": 1658} {"train_loss": -12.185317993164062, "global_step": 278584, "epoch": 1658} {"train_loss": -12.1047945022583, "global_step": 278585, "epoch": 1658} {"train_loss": -12.26313591003418, "global_step": 278586, "epoch": 1658} {"train_loss": -12.253422737121582, "global_step": 278587, "epoch": 1658} {"train_loss": -12.35416316986084, "global_step": 278588, "epoch": 1658} {"train_loss": -12.136835098266602, "global_step": 278589, "epoch": 1658} {"train_loss": -12.07027530670166, "global_step": 278590, "epoch": 1658} {"train_loss": -12.305413246154785, "global_step": 278591, "epoch": 1658} {"train_loss": -12.157546997070312, "global_step": 278592, "epoch": 1658} {"train_loss": -11.972784042358398, "global_step": 278593, "epoch": 1658} {"train_loss": -12.133197784423828, "global_step": 278594, "epoch": 1658} {"train_loss": -12.112707138061523, "global_step": 278595, "epoch": 1658} {"train_loss": -11.746126174926758, "global_step": 278596, "epoch": 1658} {"train_loss": -11.883049964904785, "global_step": 278597, "epoch": 1658} {"train_loss": -11.743125915527344, "global_step": 278598, "epoch": 1658} {"train_loss": -11.632383346557617, "global_step": 278599, "epoch": 1658} {"train_loss": -10.757162094116211, "global_step": 278600, "epoch": 1658} {"train_loss": -11.385162353515625, "global_step": 278601, "epoch": 1658} {"train_loss": -11.29676342010498, "global_step": 278602, "epoch": 1658} {"train_loss": -11.950305938720703, "global_step": 278603, "epoch": 1658} {"train_loss": -11.040655136108398, "global_step": 278604, "epoch": 1658} {"train_loss": -10.721985816955566, "global_step": 278605, "epoch": 1658} {"train_loss": -10.838105201721191, "global_step": 278606, "epoch": 1658} {"train_loss": -8.40338134765625, "global_step": 278607, "epoch": 1658} {"train_loss": -10.540590286254883, "global_step": 278608, "epoch": 1658} {"train_loss": -7.706565856933594, "global_step": 278609, "epoch": 1658} {"train_loss": -10.438456535339355, "global_step": 278610, "epoch": 1658} {"train_loss": -9.4302339553833, "global_step": 278611, "epoch": 1658} {"train_loss": -10.054647445678711, "global_step": 278612, "epoch": 1658} {"train_loss": -9.954622268676758, "global_step": 278613, "epoch": 1658} {"train_loss": -11.665410041809082, "global_step": 278614, "epoch": 1658} {"train_loss": -9.820418357849121, "global_step": 278615, "epoch": 1658} {"train_loss": -10.1525297164917, "global_step": 278616, "epoch": 1658} {"train_loss": -9.918652534484863, "global_step": 278617, "epoch": 1658} {"train_loss": -9.431482315063477, "global_step": 278618, "epoch": 1658} {"train_loss": -10.465642929077148, "global_step": 278619, "epoch": 1658} {"train_loss": -9.232474327087402, "global_step": 278620, "epoch": 1658} {"train_loss": -10.719507217407227, "global_step": 278621, "epoch": 1658} {"train_loss": -10.032076835632324, "global_step": 278622, "epoch": 1658} {"train_loss": -9.675615310668945, "global_step": 278623, "epoch": 1658} {"train_loss": -11.056010246276855, "global_step": 278624, "epoch": 1658} {"train_loss": -11.002674102783203, "global_step": 278625, "epoch": 1658} {"train_loss": -11.502294540405273, "global_step": 278626, "epoch": 1658} {"train_loss": -11.639387130737305, "global_step": 278627, "epoch": 1658} {"train_loss": -11.21463394165039, "global_step": 278628, "epoch": 1658} {"train_loss": -10.733642578125, "global_step": 278629, "epoch": 1658} {"train_loss": -11.299283027648926, "global_step": 278630, "epoch": 1658} {"train_loss": -11.403581619262695, "global_step": 278631, "epoch": 1658} {"train_loss": -11.3612642288208, "global_step": 278632, "epoch": 1658} {"train_loss": -11.438301086425781, "global_step": 278633, "epoch": 1658} {"train_loss": -11.718317031860352, "global_step": 278634, "epoch": 1658} {"train_loss": -11.513280868530273, "global_step": 278635, "epoch": 1658} {"train_loss": -11.112528800964355, "global_step": 278636, "epoch": 1658} {"train_loss": -11.569072723388672, "global_step": 278637, "epoch": 1658} {"train_loss": -11.475868225097656, "global_step": 278638, "epoch": 1658} {"train_loss": -11.806241989135742, "global_step": 278639, "epoch": 1658} {"train_loss": -11.28271770477295, "global_step": 278640, "epoch": 1658} {"train_loss": -11.741548538208008, "global_step": 278641, "epoch": 1658} {"train_loss": -11.45868968963623, "global_step": 278642, "epoch": 1658} {"train_loss": -11.44278335571289, "global_step": 278643, "epoch": 1658} {"train_loss": -11.685038566589355, "global_step": 278644, "epoch": 1658} {"train_loss": -11.679986000061035, "global_step": 278645, "epoch": 1658} {"train_loss": -11.143856048583984, "global_step": 278646, "epoch": 1658} {"train_loss": -11.1878080368042, "global_step": 278647, "epoch": 1658} {"train_loss": -11.614303588867188, "global_step": 278648, "epoch": 1658} {"train_loss": -11.601879119873047, "global_step": 278649, "epoch": 1658} {"train_loss": -11.609762191772461, "global_step": 278650, "epoch": 1658} {"train_loss": -11.26249885559082, "global_step": 278651, "epoch": 1658} {"train_loss": -11.540898323059082, "global_step": 278652, "epoch": 1658} {"train_loss": -11.759160995483398, "global_step": 278653, "epoch": 1658} {"train_loss": -11.477136611938477, "global_step": 278654, "epoch": 1658} {"train_loss": -11.72657585144043, "global_step": 278655, "epoch": 1658} {"train_loss": -11.87578010559082, "global_step": 278656, "epoch": 1658} {"train_loss": -11.596324920654297, "global_step": 278657, "epoch": 1658} {"train_loss": -12.091716766357422, "global_step": 278658, "epoch": 1658} {"train_loss": -11.997541427612305, "global_step": 278659, "epoch": 1658} {"train_loss": -11.834986686706543, "global_step": 278660, "epoch": 1658} {"train_loss": -11.876615524291992, "global_step": 278661, "epoch": 1658} {"train_loss": -11.980245590209961, "global_step": 278662, "epoch": 1658} {"train_loss": -11.953941345214844, "global_step": 278663, "epoch": 1658} {"train_loss": -12.093756675720215, "global_step": 278664, "epoch": 1658} {"train_loss": -12.336603164672852, "global_step": 278665, "epoch": 1658} {"train_loss": -12.185359954833984, "global_step": 278666, "epoch": 1658} {"train_loss": -11.958476066589355, "global_step": 278667, "epoch": 1658} {"train_loss": -12.064687728881836, "global_step": 278668, "epoch": 1658} {"train_loss": -12.087392807006836, "global_step": 278669, "epoch": 1658} {"train_loss": -12.02750301361084, "global_step": 278670, "epoch": 1658} {"train_loss": -12.037090301513672, "global_step": 278671, "epoch": 1658} {"train_loss": -11.95570182800293, "global_step": 278672, "epoch": 1658} {"train_loss": -11.934957504272461, "global_step": 278673, "epoch": 1658} {"train_loss": -12.248638153076172, "global_step": 278674, "epoch": 1658} {"train_loss": -12.050107955932617, "global_step": 278675, "epoch": 1658} {"train_loss": -12.296051025390625, "global_step": 278676, "epoch": 1658} {"train_loss": -12.205205917358398, "global_step": 278677, "epoch": 1658} {"train_loss": -11.932641983032227, "global_step": 278678, "epoch": 1658} {"train_loss": -12.17161750793457, "global_step": 278679, "epoch": 1658} {"train_loss": -11.828705787658691, "global_step": 278680, "epoch": 1658} {"train_loss": -12.188318252563477, "global_step": 278681, "epoch": 1658} {"train_loss": -11.900989532470703, "global_step": 278682, "epoch": 1658} {"train_loss": -12.264596939086914, "global_step": 278683, "epoch": 1658} {"train_loss": -12.010221481323242, "global_step": 278684, "epoch": 1658} {"train_loss": -11.971512794494629, "global_step": 278685, "epoch": 1658} {"train_loss": -11.551011085510254, "global_step": 278686, "epoch": 1658} {"train_loss": -11.89603042602539, "global_step": 278687, "epoch": 1658} {"train_loss": -11.917252540588379, "global_step": 278688, "epoch": 1658} {"train_loss": -11.938629150390625, "global_step": 278689, "epoch": 1658} {"train_loss": -12.179479598999023, "global_step": 278690, "epoch": 1658} {"train_loss": -12.229972839355469, "global_step": 278691, "epoch": 1658} {"train_loss": -12.136270523071289, "global_step": 278692, "epoch": 1658} {"train_loss": -12.065702438354492, "global_step": 278693, "epoch": 1658} {"train_loss": -12.260038375854492, "global_step": 278694, "epoch": 1658} {"train_loss": -12.01882553100586, "global_step": 278695, "epoch": 1658} {"train_loss": -12.27883529663086, "global_step": 278696, "epoch": 1658} {"train_loss": -12.239541053771973, "global_step": 278697, "epoch": 1658} {"train_loss": -12.162178039550781, "global_step": 278698, "epoch": 1658} {"train_loss": -12.057615280151367, "global_step": 278699, "epoch": 1658} {"train_loss": -12.277374267578125, "global_step": 278700, "epoch": 1658} {"train_loss": -12.460990905761719, "global_step": 278701, "epoch": 1658} {"train_loss": -12.478731155395508, "global_step": 278702, "epoch": 1658} {"train_loss": -12.504989624023438, "global_step": 278703, "epoch": 1658} {"train_loss": -12.238302230834961, "global_step": 278704, "epoch": 1658} {"train_loss": -12.38791275024414, "global_step": 278705, "epoch": 1658} {"train_loss": -12.25732421875, "global_step": 278706, "epoch": 1658} {"train_loss": -12.220648765563965, "global_step": 278707, "epoch": 1658} {"train_loss": -12.048364639282227, "global_step": 278708, "epoch": 1658} {"train_loss": -12.30069351196289, "global_step": 278709, "epoch": 1658} {"train_loss": -12.387979507446289, "global_step": 278710, "epoch": 1658} {"train_loss": -11.652168342045375, "global_step": 278711, "epoch": 1658, "val_loss": 273748.15625} {"train_loss": -11.583150863647461, "global_step": 278712, "epoch": 1659} {"train_loss": -11.450782775878906, "global_step": 278713, "epoch": 1659} {"train_loss": -11.846555709838867, "global_step": 278714, "epoch": 1659} {"train_loss": -12.213309288024902, "global_step": 278715, "epoch": 1659} {"train_loss": -11.896093368530273, "global_step": 278716, "epoch": 1659} {"train_loss": -11.563811302185059, "global_step": 278717, "epoch": 1659} {"train_loss": -11.220462799072266, "global_step": 278718, "epoch": 1659} {"train_loss": -11.994251251220703, "global_step": 278719, "epoch": 1659} {"train_loss": -11.618158340454102, "global_step": 278720, "epoch": 1659} {"train_loss": -10.072678565979004, "global_step": 278721, "epoch": 1659} {"train_loss": -12.105026245117188, "global_step": 278722, "epoch": 1659} {"train_loss": -10.712568283081055, "global_step": 278723, "epoch": 1659} {"train_loss": -9.600271224975586, "global_step": 278724, "epoch": 1659} {"train_loss": -9.973455429077148, "global_step": 278725, "epoch": 1659} {"train_loss": -10.408777236938477, "global_step": 278726, "epoch": 1659} {"train_loss": -11.063161849975586, "global_step": 278727, "epoch": 1659} {"train_loss": -9.776330947875977, "global_step": 278728, "epoch": 1659} {"train_loss": -10.919817924499512, "global_step": 278729, "epoch": 1659} {"train_loss": -10.232975006103516, "global_step": 278730, "epoch": 1659} {"train_loss": -9.978394508361816, "global_step": 278731, "epoch": 1659} {"train_loss": -11.549065589904785, "global_step": 278732, "epoch": 1659} {"train_loss": -11.132797241210938, "global_step": 278733, "epoch": 1659} {"train_loss": -11.65793228149414, "global_step": 278734, "epoch": 1659} {"train_loss": -11.09425163269043, "global_step": 278735, "epoch": 1659} {"train_loss": -11.011733055114746, "global_step": 278736, "epoch": 1659} {"train_loss": -11.279605865478516, "global_step": 278737, "epoch": 1659} {"train_loss": -11.673948287963867, "global_step": 278738, "epoch": 1659} {"train_loss": -11.743831634521484, "global_step": 278739, "epoch": 1659} {"train_loss": -11.137369155883789, "global_step": 278740, "epoch": 1659} {"train_loss": -11.408495903015137, "global_step": 278741, "epoch": 1659} {"train_loss": -11.454587936401367, "global_step": 278742, "epoch": 1659} {"train_loss": -11.358070373535156, "global_step": 278743, "epoch": 1659} {"train_loss": -11.90956974029541, "global_step": 278744, "epoch": 1659} {"train_loss": -11.48721981048584, "global_step": 278745, "epoch": 1659} {"train_loss": -12.03656005859375, "global_step": 278746, "epoch": 1659} {"train_loss": -11.796216011047363, "global_step": 278747, "epoch": 1659} {"train_loss": -11.775654792785645, "global_step": 278748, "epoch": 1659} {"train_loss": -11.288177490234375, "global_step": 278749, "epoch": 1659} {"train_loss": -11.934511184692383, "global_step": 278750, "epoch": 1659} {"train_loss": -11.714634895324707, "global_step": 278751, "epoch": 1659} {"train_loss": -11.848481178283691, "global_step": 278752, "epoch": 1659} {"train_loss": -12.115413665771484, "global_step": 278753, "epoch": 1659} {"train_loss": -11.83643913269043, "global_step": 278754, "epoch": 1659} {"train_loss": -11.80607795715332, "global_step": 278755, "epoch": 1659} {"train_loss": -11.847782135009766, "global_step": 278756, "epoch": 1659} {"train_loss": -11.841700553894043, "global_step": 278757, "epoch": 1659} {"train_loss": -12.017536163330078, "global_step": 278758, "epoch": 1659} {"train_loss": -11.602534294128418, "global_step": 278759, "epoch": 1659} {"train_loss": -11.418106079101562, "global_step": 278760, "epoch": 1659} {"train_loss": -11.814154624938965, "global_step": 278761, "epoch": 1659} {"train_loss": -11.712554931640625, "global_step": 278762, "epoch": 1659} {"train_loss": -11.912276268005371, "global_step": 278763, "epoch": 1659} {"train_loss": -11.547051429748535, "global_step": 278764, "epoch": 1659} {"train_loss": -11.845266342163086, "global_step": 278765, "epoch": 1659} {"train_loss": -11.510089874267578, "global_step": 278766, "epoch": 1659} {"train_loss": -11.260019302368164, "global_step": 278767, "epoch": 1659} {"train_loss": -11.897891998291016, "global_step": 278768, "epoch": 1659} {"train_loss": -11.149020195007324, "global_step": 278769, "epoch": 1659} {"train_loss": -11.940545082092285, "global_step": 278770, "epoch": 1659} {"train_loss": -11.686735153198242, "global_step": 278771, "epoch": 1659} {"train_loss": -11.807059288024902, "global_step": 278772, "epoch": 1659} {"train_loss": -11.616218566894531, "global_step": 278773, "epoch": 1659} {"train_loss": -11.754533767700195, "global_step": 278774, "epoch": 1659} {"train_loss": -11.829291343688965, "global_step": 278775, "epoch": 1659} {"train_loss": -11.42916488647461, "global_step": 278776, "epoch": 1659} {"train_loss": -11.670942306518555, "global_step": 278777, "epoch": 1659} {"train_loss": -11.882427215576172, "global_step": 278778, "epoch": 1659} {"train_loss": -11.920080184936523, "global_step": 278779, "epoch": 1659} {"train_loss": -12.049943923950195, "global_step": 278780, "epoch": 1659} {"train_loss": -11.926409721374512, "global_step": 278781, "epoch": 1659} {"train_loss": -11.896864891052246, "global_step": 278782, "epoch": 1659} {"train_loss": -12.0205659866333, "global_step": 278783, "epoch": 1659} {"train_loss": -11.833893775939941, "global_step": 278784, "epoch": 1659} {"train_loss": -11.867389678955078, "global_step": 278785, "epoch": 1659} {"train_loss": -12.041221618652344, "global_step": 278786, "epoch": 1659} {"train_loss": -11.819419860839844, "global_step": 278787, "epoch": 1659} {"train_loss": -12.18262767791748, "global_step": 278788, "epoch": 1659} {"train_loss": -11.930867195129395, "global_step": 278789, "epoch": 1659} {"train_loss": -12.175348281860352, "global_step": 278790, "epoch": 1659} {"train_loss": -12.217613220214844, "global_step": 278791, "epoch": 1659} {"train_loss": -12.075708389282227, "global_step": 278792, "epoch": 1659} {"train_loss": -12.251747131347656, "global_step": 278793, "epoch": 1659} {"train_loss": -12.351959228515625, "global_step": 278794, "epoch": 1659} {"train_loss": -12.24228286743164, "global_step": 278795, "epoch": 1659} {"train_loss": -12.25259017944336, "global_step": 278796, "epoch": 1659} {"train_loss": -12.299985885620117, "global_step": 278797, "epoch": 1659} {"train_loss": -12.309879302978516, "global_step": 278798, "epoch": 1659} {"train_loss": -12.143798828125, "global_step": 278799, "epoch": 1659} {"train_loss": -11.973382949829102, "global_step": 278800, "epoch": 1659} {"train_loss": -12.222319602966309, "global_step": 278801, "epoch": 1659} {"train_loss": -12.004444122314453, "global_step": 278802, "epoch": 1659} {"train_loss": -12.1644868850708, "global_step": 278803, "epoch": 1659} {"train_loss": -12.16851806640625, "global_step": 278804, "epoch": 1659} {"train_loss": -11.971704483032227, "global_step": 278805, "epoch": 1659} {"train_loss": -11.290261268615723, "global_step": 278806, "epoch": 1659} {"train_loss": -11.709047317504883, "global_step": 278807, "epoch": 1659} {"train_loss": -11.948808670043945, "global_step": 278808, "epoch": 1659} {"train_loss": -10.984976768493652, "global_step": 278809, "epoch": 1659} {"train_loss": -10.781497955322266, "global_step": 278810, "epoch": 1659} {"train_loss": -12.127120971679688, "global_step": 278811, "epoch": 1659} {"train_loss": -11.85467529296875, "global_step": 278812, "epoch": 1659} {"train_loss": -12.075944900512695, "global_step": 278813, "epoch": 1659} {"train_loss": -11.573213577270508, "global_step": 278814, "epoch": 1659} {"train_loss": -12.105572700500488, "global_step": 278815, "epoch": 1659} {"train_loss": -11.73275089263916, "global_step": 278816, "epoch": 1659} {"train_loss": -12.005289077758789, "global_step": 278817, "epoch": 1659} {"train_loss": -11.722363471984863, "global_step": 278818, "epoch": 1659} {"train_loss": -12.041565895080566, "global_step": 278819, "epoch": 1659} {"train_loss": -11.88441276550293, "global_step": 278820, "epoch": 1659} {"train_loss": -12.023687362670898, "global_step": 278821, "epoch": 1659} {"train_loss": -11.729825973510742, "global_step": 278822, "epoch": 1659} {"train_loss": -11.955843925476074, "global_step": 278823, "epoch": 1659} {"train_loss": -11.675863265991211, "global_step": 278824, "epoch": 1659} {"train_loss": -11.961712837219238, "global_step": 278825, "epoch": 1659} {"train_loss": -11.457010269165039, "global_step": 278826, "epoch": 1659} {"train_loss": -11.85844612121582, "global_step": 278827, "epoch": 1659} {"train_loss": -12.009273529052734, "global_step": 278828, "epoch": 1659} {"train_loss": -12.082149505615234, "global_step": 278829, "epoch": 1659} {"train_loss": -11.951642990112305, "global_step": 278830, "epoch": 1659} {"train_loss": -11.815418243408203, "global_step": 278831, "epoch": 1659} {"train_loss": -11.64328384399414, "global_step": 278832, "epoch": 1659} {"train_loss": -11.972749710083008, "global_step": 278833, "epoch": 1659} {"train_loss": -11.963153839111328, "global_step": 278834, "epoch": 1659} {"train_loss": -12.1975736618042, "global_step": 278835, "epoch": 1659} {"train_loss": -11.911663055419922, "global_step": 278836, "epoch": 1659} {"train_loss": -12.09634780883789, "global_step": 278837, "epoch": 1659} {"train_loss": -12.105969429016113, "global_step": 278838, "epoch": 1659} {"train_loss": -11.977017402648926, "global_step": 278839, "epoch": 1659} {"train_loss": -12.008666038513184, "global_step": 278840, "epoch": 1659} {"train_loss": -12.064105033874512, "global_step": 278841, "epoch": 1659} {"train_loss": -12.058256149291992, "global_step": 278842, "epoch": 1659} {"train_loss": -12.227685928344727, "global_step": 278843, "epoch": 1659} {"train_loss": -12.140207290649414, "global_step": 278844, "epoch": 1659} {"train_loss": -11.828994750976562, "global_step": 278845, "epoch": 1659} {"train_loss": -12.176976203918457, "global_step": 278846, "epoch": 1659} {"train_loss": -11.97137451171875, "global_step": 278847, "epoch": 1659} {"train_loss": -12.26060676574707, "global_step": 278848, "epoch": 1659} {"train_loss": -11.943890571594238, "global_step": 278849, "epoch": 1659} {"train_loss": -12.087709426879883, "global_step": 278850, "epoch": 1659} {"train_loss": -11.936010360717773, "global_step": 278851, "epoch": 1659} {"train_loss": -11.34122085571289, "global_step": 278852, "epoch": 1659} {"train_loss": -11.425498008728027, "global_step": 278853, "epoch": 1659} {"train_loss": -11.717318534851074, "global_step": 278854, "epoch": 1659} {"train_loss": -11.445366859436035, "global_step": 278855, "epoch": 1659} {"train_loss": -11.144628524780273, "global_step": 278856, "epoch": 1659} {"train_loss": -11.353850364685059, "global_step": 278857, "epoch": 1659} {"train_loss": -11.76890754699707, "global_step": 278858, "epoch": 1659} {"train_loss": -11.965028762817383, "global_step": 278859, "epoch": 1659} {"train_loss": -11.50041675567627, "global_step": 278860, "epoch": 1659} {"train_loss": -10.747649192810059, "global_step": 278861, "epoch": 1659} {"train_loss": -10.225690841674805, "global_step": 278862, "epoch": 1659} {"train_loss": -9.505555152893066, "global_step": 278863, "epoch": 1659} {"train_loss": -9.678945541381836, "global_step": 278864, "epoch": 1659} {"train_loss": -10.490301132202148, "global_step": 278865, "epoch": 1659} {"train_loss": -8.682487487792969, "global_step": 278866, "epoch": 1659} {"train_loss": -8.305365562438965, "global_step": 278867, "epoch": 1659} {"train_loss": -9.72717571258545, "global_step": 278868, "epoch": 1659} {"train_loss": -10.752326965332031, "global_step": 278869, "epoch": 1659} {"train_loss": -9.78863525390625, "global_step": 278870, "epoch": 1659} {"train_loss": -10.55169677734375, "global_step": 278871, "epoch": 1659} {"train_loss": -8.209142684936523, "global_step": 278872, "epoch": 1659} {"train_loss": -8.641060829162598, "global_step": 278873, "epoch": 1659} {"train_loss": -10.143289566040039, "global_step": 278874, "epoch": 1659} {"train_loss": -7.179378986358643, "global_step": 278875, "epoch": 1659} {"train_loss": -10.091148376464844, "global_step": 278876, "epoch": 1659} {"train_loss": -6.96458625793457, "global_step": 278877, "epoch": 1659} {"train_loss": -8.752761840820312, "global_step": 278878, "epoch": 1659} {"train_loss": -11.434564712501707, "global_step": 278879, "epoch": 1659, "val_loss": 271954.40625} {"train_loss": -8.405546188354492, "global_step": 278880, "epoch": 1660} {"train_loss": -10.218871116638184, "global_step": 278881, "epoch": 1660} {"train_loss": -7.997814178466797, "global_step": 278882, "epoch": 1660} {"train_loss": -8.347223281860352, "global_step": 278883, "epoch": 1660} {"train_loss": -9.235443115234375, "global_step": 278884, "epoch": 1660} {"train_loss": -9.13044548034668, "global_step": 278885, "epoch": 1660} {"train_loss": -8.63073444366455, "global_step": 278886, "epoch": 1660} {"train_loss": -9.173429489135742, "global_step": 278887, "epoch": 1660} {"train_loss": -10.785072326660156, "global_step": 278888, "epoch": 1660} {"train_loss": -10.145209312438965, "global_step": 278889, "epoch": 1660} {"train_loss": -10.00252914428711, "global_step": 278890, "epoch": 1660} {"train_loss": -11.10944938659668, "global_step": 278891, "epoch": 1660} {"train_loss": -10.681156158447266, "global_step": 278892, "epoch": 1660} {"train_loss": -10.149361610412598, "global_step": 278893, "epoch": 1660} {"train_loss": -11.166485786437988, "global_step": 278894, "epoch": 1660} {"train_loss": -10.492376327514648, "global_step": 278895, "epoch": 1660} {"train_loss": -10.538875579833984, "global_step": 278896, "epoch": 1660} {"train_loss": -11.234838485717773, "global_step": 278897, "epoch": 1660} {"train_loss": -11.137341499328613, "global_step": 278898, "epoch": 1660} {"train_loss": -10.786663055419922, "global_step": 278899, "epoch": 1660} {"train_loss": -11.346874237060547, "global_step": 278900, "epoch": 1660} {"train_loss": -11.496479034423828, "global_step": 278901, "epoch": 1660} {"train_loss": -11.393033981323242, "global_step": 278902, "epoch": 1660} {"train_loss": -11.355844497680664, "global_step": 278903, "epoch": 1660} {"train_loss": -11.568841934204102, "global_step": 278904, "epoch": 1660} {"train_loss": -11.342819213867188, "global_step": 278905, "epoch": 1660} {"train_loss": -11.547734260559082, "global_step": 278906, "epoch": 1660} {"train_loss": -11.438868522644043, "global_step": 278907, "epoch": 1660} {"train_loss": -11.218158721923828, "global_step": 278908, "epoch": 1660} {"train_loss": -11.426469802856445, "global_step": 278909, "epoch": 1660} {"train_loss": -11.579882621765137, "global_step": 278910, "epoch": 1660} {"train_loss": -11.667856216430664, "global_step": 278911, "epoch": 1660} {"train_loss": -11.531560897827148, "global_step": 278912, "epoch": 1660} {"train_loss": -11.62544059753418, "global_step": 278913, "epoch": 1660} {"train_loss": -11.648384094238281, "global_step": 278914, "epoch": 1660} {"train_loss": -11.648820877075195, "global_step": 278915, "epoch": 1660} {"train_loss": -11.658823013305664, "global_step": 278916, "epoch": 1660} {"train_loss": -11.748167037963867, "global_step": 278917, "epoch": 1660} {"train_loss": -11.779650688171387, "global_step": 278918, "epoch": 1660} {"train_loss": -11.665556907653809, "global_step": 278919, "epoch": 1660} {"train_loss": -11.813047409057617, "global_step": 278920, "epoch": 1660} {"train_loss": -11.919853210449219, "global_step": 278921, "epoch": 1660} {"train_loss": -11.849544525146484, "global_step": 278922, "epoch": 1660} {"train_loss": -11.845630645751953, "global_step": 278923, "epoch": 1660} {"train_loss": -11.89486312866211, "global_step": 278924, "epoch": 1660} {"train_loss": -11.517338752746582, "global_step": 278925, "epoch": 1660} {"train_loss": -11.939680099487305, "global_step": 278926, "epoch": 1660} {"train_loss": -11.763216018676758, "global_step": 278927, "epoch": 1660} {"train_loss": -11.911828994750977, "global_step": 278928, "epoch": 1660} {"train_loss": -11.816910743713379, "global_step": 278929, "epoch": 1660} {"train_loss": -11.817419052124023, "global_step": 278930, "epoch": 1660} {"train_loss": -11.845175743103027, "global_step": 278931, "epoch": 1660} {"train_loss": -12.053717613220215, "global_step": 278932, "epoch": 1660} {"train_loss": -11.887166023254395, "global_step": 278933, "epoch": 1660} {"train_loss": -12.005876541137695, "global_step": 278934, "epoch": 1660} {"train_loss": -11.956216812133789, "global_step": 278935, "epoch": 1660} {"train_loss": -11.994503021240234, "global_step": 278936, "epoch": 1660} {"train_loss": -12.072212219238281, "global_step": 278937, "epoch": 1660} {"train_loss": -12.000926971435547, "global_step": 278938, "epoch": 1660} {"train_loss": -12.006340026855469, "global_step": 278939, "epoch": 1660} {"train_loss": -12.135939598083496, "global_step": 278940, "epoch": 1660} {"train_loss": -12.176141738891602, "global_step": 278941, "epoch": 1660} {"train_loss": -11.848409652709961, "global_step": 278942, "epoch": 1660} {"train_loss": -12.115558624267578, "global_step": 278943, "epoch": 1660} {"train_loss": -12.085115432739258, "global_step": 278944, "epoch": 1660} {"train_loss": -12.017242431640625, "global_step": 278945, "epoch": 1660} {"train_loss": -12.018875122070312, "global_step": 278946, "epoch": 1660} {"train_loss": -11.922693252563477, "global_step": 278947, "epoch": 1660} {"train_loss": -11.92738151550293, "global_step": 278948, "epoch": 1660} {"train_loss": -12.17696762084961, "global_step": 278949, "epoch": 1660} {"train_loss": -12.026979446411133, "global_step": 278950, "epoch": 1660} {"train_loss": -12.026344299316406, "global_step": 278951, "epoch": 1660} {"train_loss": -12.157848358154297, "global_step": 278952, "epoch": 1660} {"train_loss": -12.105332374572754, "global_step": 278953, "epoch": 1660} {"train_loss": -11.977198600769043, "global_step": 278954, "epoch": 1660} {"train_loss": -12.02223014831543, "global_step": 278955, "epoch": 1660} {"train_loss": -12.160104751586914, "global_step": 278956, "epoch": 1660} {"train_loss": -12.051345825195312, "global_step": 278957, "epoch": 1660} {"train_loss": -12.2891845703125, "global_step": 278958, "epoch": 1660} {"train_loss": -12.036346435546875, "global_step": 278959, "epoch": 1660} {"train_loss": -12.079139709472656, "global_step": 278960, "epoch": 1660} {"train_loss": -12.0624418258667, "global_step": 278961, "epoch": 1660} {"train_loss": -12.035375595092773, "global_step": 278962, "epoch": 1660} {"train_loss": -12.274240493774414, "global_step": 278963, "epoch": 1660} {"train_loss": -12.096064567565918, "global_step": 278964, "epoch": 1660} {"train_loss": -12.271204948425293, "global_step": 278965, "epoch": 1660} {"train_loss": -12.241440773010254, "global_step": 278966, "epoch": 1660} {"train_loss": -12.234310150146484, "global_step": 278967, "epoch": 1660} {"train_loss": -12.039533615112305, "global_step": 278968, "epoch": 1660} {"train_loss": -12.10342025756836, "global_step": 278969, "epoch": 1660} {"train_loss": -12.35245418548584, "global_step": 278970, "epoch": 1660} {"train_loss": -12.323440551757812, "global_step": 278971, "epoch": 1660} {"train_loss": -12.222627639770508, "global_step": 278972, "epoch": 1660} {"train_loss": -11.90450668334961, "global_step": 278973, "epoch": 1660} {"train_loss": -12.20012378692627, "global_step": 278974, "epoch": 1660} {"train_loss": -11.824736595153809, "global_step": 278975, "epoch": 1660} {"train_loss": -12.273061752319336, "global_step": 278976, "epoch": 1660} {"train_loss": -12.254016876220703, "global_step": 278977, "epoch": 1660} {"train_loss": -12.287696838378906, "global_step": 278978, "epoch": 1660} {"train_loss": -12.347192764282227, "global_step": 278979, "epoch": 1660} {"train_loss": -12.302755355834961, "global_step": 278980, "epoch": 1660} {"train_loss": -11.86050796508789, "global_step": 278981, "epoch": 1660} {"train_loss": -12.324769973754883, "global_step": 278982, "epoch": 1660} {"train_loss": -12.060626983642578, "global_step": 278983, "epoch": 1660} {"train_loss": -11.647830963134766, "global_step": 278984, "epoch": 1660} {"train_loss": -10.963777542114258, "global_step": 278985, "epoch": 1660} {"train_loss": -11.50019645690918, "global_step": 278986, "epoch": 1660} {"train_loss": -11.494518280029297, "global_step": 278987, "epoch": 1660} {"train_loss": -11.90412712097168, "global_step": 278988, "epoch": 1660} {"train_loss": -11.97314739227295, "global_step": 278989, "epoch": 1660} {"train_loss": -11.622121810913086, "global_step": 278990, "epoch": 1660} {"train_loss": -11.638596534729004, "global_step": 278991, "epoch": 1660} {"train_loss": -12.237064361572266, "global_step": 278992, "epoch": 1660} {"train_loss": -12.022660255432129, "global_step": 278993, "epoch": 1660} {"train_loss": -12.053483963012695, "global_step": 278994, "epoch": 1660} {"train_loss": -11.948467254638672, "global_step": 278995, "epoch": 1660} {"train_loss": -11.612905502319336, "global_step": 278996, "epoch": 1660} {"train_loss": -10.781379699707031, "global_step": 278997, "epoch": 1660} {"train_loss": -11.772753715515137, "global_step": 278998, "epoch": 1660} {"train_loss": -12.154610633850098, "global_step": 278999, "epoch": 1660} {"train_loss": -11.562533378601074, "global_step": 279000, "epoch": 1660} {"train_loss": -11.72262191772461, "global_step": 279001, "epoch": 1660} {"train_loss": -12.026108741760254, "global_step": 279002, "epoch": 1660} {"train_loss": -11.431068420410156, "global_step": 279003, "epoch": 1660} {"train_loss": -11.605249404907227, "global_step": 279004, "epoch": 1660} {"train_loss": -11.681753158569336, "global_step": 279005, "epoch": 1660} {"train_loss": -11.708231925964355, "global_step": 279006, "epoch": 1660} {"train_loss": -11.620094299316406, "global_step": 279007, "epoch": 1660} {"train_loss": -11.838934898376465, "global_step": 279008, "epoch": 1660} {"train_loss": -11.626157760620117, "global_step": 279009, "epoch": 1660} {"train_loss": -11.842101097106934, "global_step": 279010, "epoch": 1660} {"train_loss": -11.832584381103516, "global_step": 279011, "epoch": 1660} {"train_loss": -11.831949234008789, "global_step": 279012, "epoch": 1660} {"train_loss": -11.788980484008789, "global_step": 279013, "epoch": 1660} {"train_loss": -10.478814125061035, "global_step": 279014, "epoch": 1660} {"train_loss": -11.826869010925293, "global_step": 279015, "epoch": 1660} {"train_loss": -11.961416244506836, "global_step": 279016, "epoch": 1660} {"train_loss": -10.65829086303711, "global_step": 279017, "epoch": 1660} {"train_loss": -10.759588241577148, "global_step": 279018, "epoch": 1660} {"train_loss": -11.653402328491211, "global_step": 279019, "epoch": 1660} {"train_loss": -11.856618881225586, "global_step": 279020, "epoch": 1660} {"train_loss": -11.878446578979492, "global_step": 279021, "epoch": 1660} {"train_loss": -11.70700454711914, "global_step": 279022, "epoch": 1660} {"train_loss": -11.440892219543457, "global_step": 279023, "epoch": 1660} {"train_loss": -11.110124588012695, "global_step": 279024, "epoch": 1660} {"train_loss": -10.682551383972168, "global_step": 279025, "epoch": 1660} {"train_loss": -11.37722396850586, "global_step": 279026, "epoch": 1660} {"train_loss": -11.355883598327637, "global_step": 279027, "epoch": 1660} {"train_loss": -11.373604774475098, "global_step": 279028, "epoch": 1660} {"train_loss": -9.474634170532227, "global_step": 279029, "epoch": 1660} {"train_loss": -11.540655136108398, "global_step": 279030, "epoch": 1660} {"train_loss": -11.30408763885498, "global_step": 279031, "epoch": 1660} {"train_loss": -10.930425643920898, "global_step": 279032, "epoch": 1660} {"train_loss": -11.198299407958984, "global_step": 279033, "epoch": 1660} {"train_loss": -10.151433944702148, "global_step": 279034, "epoch": 1660} {"train_loss": -11.477721214294434, "global_step": 279035, "epoch": 1660} {"train_loss": -10.267669677734375, "global_step": 279036, "epoch": 1660} {"train_loss": -11.39948558807373, "global_step": 279037, "epoch": 1660} {"train_loss": -11.196273803710938, "global_step": 279038, "epoch": 1660} {"train_loss": -11.395066261291504, "global_step": 279039, "epoch": 1660} {"train_loss": -11.320297241210938, "global_step": 279040, "epoch": 1660} {"train_loss": -10.96267318725586, "global_step": 279041, "epoch": 1660} {"train_loss": -11.363871574401855, "global_step": 279042, "epoch": 1660} {"train_loss": -10.417770385742188, "global_step": 279043, "epoch": 1660} {"train_loss": -10.466310501098633, "global_step": 279044, "epoch": 1660} {"train_loss": -10.251557350158691, "global_step": 279045, "epoch": 1660} {"train_loss": -10.548910140991211, "global_step": 279046, "epoch": 1660} {"train_loss": -11.485758520307995, "global_step": 279047, "epoch": 1660, "val_loss": 277549.9375, "train_action_mse_error": 4.368386745452881} {"train_loss": -10.996955871582031, "global_step": 279048, "epoch": 1661} {"train_loss": -10.54626178741455, "global_step": 279049, "epoch": 1661} {"train_loss": -10.55865478515625, "global_step": 279050, "epoch": 1661} {"train_loss": -10.895467758178711, "global_step": 279051, "epoch": 1661} {"train_loss": -10.998510360717773, "global_step": 279052, "epoch": 1661} {"train_loss": -10.366636276245117, "global_step": 279053, "epoch": 1661} {"train_loss": -11.09837532043457, "global_step": 279054, "epoch": 1661} {"train_loss": -10.46618366241455, "global_step": 279055, "epoch": 1661} {"train_loss": -11.303962707519531, "global_step": 279056, "epoch": 1661} {"train_loss": -10.663761138916016, "global_step": 279057, "epoch": 1661} {"train_loss": -11.005220413208008, "global_step": 279058, "epoch": 1661} {"train_loss": -10.853590965270996, "global_step": 279059, "epoch": 1661} {"train_loss": -10.963468551635742, "global_step": 279060, "epoch": 1661} {"train_loss": -10.80445671081543, "global_step": 279061, "epoch": 1661} {"train_loss": -11.111215591430664, "global_step": 279062, "epoch": 1661} {"train_loss": -11.152915954589844, "global_step": 279063, "epoch": 1661} {"train_loss": -11.074689865112305, "global_step": 279064, "epoch": 1661} {"train_loss": -11.092205047607422, "global_step": 279065, "epoch": 1661} {"train_loss": -10.425137519836426, "global_step": 279066, "epoch": 1661} {"train_loss": -11.243897438049316, "global_step": 279067, "epoch": 1661} {"train_loss": -10.996079444885254, "global_step": 279068, "epoch": 1661} {"train_loss": -11.473573684692383, "global_step": 279069, "epoch": 1661} {"train_loss": -11.167598724365234, "global_step": 279070, "epoch": 1661} {"train_loss": -10.986810684204102, "global_step": 279071, "epoch": 1661} {"train_loss": -10.300634384155273, "global_step": 279072, "epoch": 1661} {"train_loss": -11.162501335144043, "global_step": 279073, "epoch": 1661} {"train_loss": -10.779393196105957, "global_step": 279074, "epoch": 1661} {"train_loss": -11.619144439697266, "global_step": 279075, "epoch": 1661} {"train_loss": -10.738988876342773, "global_step": 279076, "epoch": 1661} {"train_loss": -10.980941772460938, "global_step": 279077, "epoch": 1661} {"train_loss": -11.463687896728516, "global_step": 279078, "epoch": 1661} {"train_loss": -11.251810073852539, "global_step": 279079, "epoch": 1661} {"train_loss": -11.193046569824219, "global_step": 279080, "epoch": 1661} {"train_loss": -10.297727584838867, "global_step": 279081, "epoch": 1661} {"train_loss": -11.388762474060059, "global_step": 279082, "epoch": 1661} {"train_loss": -10.85300350189209, "global_step": 279083, "epoch": 1661} {"train_loss": -11.45535659790039, "global_step": 279084, "epoch": 1661} {"train_loss": -10.26034927368164, "global_step": 279085, "epoch": 1661} {"train_loss": -11.443059921264648, "global_step": 279086, "epoch": 1661} {"train_loss": -10.518290519714355, "global_step": 279087, "epoch": 1661} {"train_loss": -11.425968170166016, "global_step": 279088, "epoch": 1661} {"train_loss": -10.751166343688965, "global_step": 279089, "epoch": 1661} {"train_loss": -10.770445823669434, "global_step": 279090, "epoch": 1661} {"train_loss": -11.402424812316895, "global_step": 279091, "epoch": 1661} {"train_loss": -11.161294937133789, "global_step": 279092, "epoch": 1661} {"train_loss": -11.063702583312988, "global_step": 279093, "epoch": 1661} {"train_loss": -10.982295036315918, "global_step": 279094, "epoch": 1661} {"train_loss": -11.371179580688477, "global_step": 279095, "epoch": 1661} {"train_loss": -11.321318626403809, "global_step": 279096, "epoch": 1661} {"train_loss": -11.368156433105469, "global_step": 279097, "epoch": 1661} {"train_loss": -11.410805702209473, "global_step": 279098, "epoch": 1661} {"train_loss": -11.689645767211914, "global_step": 279099, "epoch": 1661} {"train_loss": -11.428936958312988, "global_step": 279100, "epoch": 1661} {"train_loss": -11.466985702514648, "global_step": 279101, "epoch": 1661} {"train_loss": -11.285776138305664, "global_step": 279102, "epoch": 1661} {"train_loss": -11.704297065734863, "global_step": 279103, "epoch": 1661} {"train_loss": -11.550032615661621, "global_step": 279104, "epoch": 1661} {"train_loss": -11.70728588104248, "global_step": 279105, "epoch": 1661} {"train_loss": -11.877741813659668, "global_step": 279106, "epoch": 1661} {"train_loss": -11.706010818481445, "global_step": 279107, "epoch": 1661} {"train_loss": -11.808042526245117, "global_step": 279108, "epoch": 1661} {"train_loss": -11.703907012939453, "global_step": 279109, "epoch": 1661} {"train_loss": -11.91238784790039, "global_step": 279110, "epoch": 1661} {"train_loss": -11.877431869506836, "global_step": 279111, "epoch": 1661} {"train_loss": -11.683448791503906, "global_step": 279112, "epoch": 1661} {"train_loss": -11.433137893676758, "global_step": 279113, "epoch": 1661} {"train_loss": -12.030342102050781, "global_step": 279114, "epoch": 1661} {"train_loss": -11.723960876464844, "global_step": 279115, "epoch": 1661} {"train_loss": -11.738119125366211, "global_step": 279116, "epoch": 1661} {"train_loss": -11.654293060302734, "global_step": 279117, "epoch": 1661} {"train_loss": -11.726973533630371, "global_step": 279118, "epoch": 1661} {"train_loss": -12.058598518371582, "global_step": 279119, "epoch": 1661} {"train_loss": -11.780282974243164, "global_step": 279120, "epoch": 1661} {"train_loss": -11.959269523620605, "global_step": 279121, "epoch": 1661} {"train_loss": -11.735898971557617, "global_step": 279122, "epoch": 1661} {"train_loss": -11.952817916870117, "global_step": 279123, "epoch": 1661} {"train_loss": -11.725183486938477, "global_step": 279124, "epoch": 1661} {"train_loss": -11.85099983215332, "global_step": 279125, "epoch": 1661} {"train_loss": -11.823122024536133, "global_step": 279126, "epoch": 1661} {"train_loss": -12.092317581176758, "global_step": 279127, "epoch": 1661} {"train_loss": -12.103754043579102, "global_step": 279128, "epoch": 1661} {"train_loss": -12.06295394897461, "global_step": 279129, "epoch": 1661} {"train_loss": -11.896655082702637, "global_step": 279130, "epoch": 1661} {"train_loss": -12.008316040039062, "global_step": 279131, "epoch": 1661} {"train_loss": -12.029184341430664, "global_step": 279132, "epoch": 1661} {"train_loss": -11.939517974853516, "global_step": 279133, "epoch": 1661} {"train_loss": -11.83444595336914, "global_step": 279134, "epoch": 1661} {"train_loss": -11.947598457336426, "global_step": 279135, "epoch": 1661} {"train_loss": -12.194931030273438, "global_step": 279136, "epoch": 1661} {"train_loss": -11.7322998046875, "global_step": 279137, "epoch": 1661} {"train_loss": -11.955865859985352, "global_step": 279138, "epoch": 1661} {"train_loss": -11.99512767791748, "global_step": 279139, "epoch": 1661} {"train_loss": -11.736472129821777, "global_step": 279140, "epoch": 1661} {"train_loss": -12.074968338012695, "global_step": 279141, "epoch": 1661} {"train_loss": -12.099529266357422, "global_step": 279142, "epoch": 1661} {"train_loss": -12.18657112121582, "global_step": 279143, "epoch": 1661} {"train_loss": -11.989349365234375, "global_step": 279144, "epoch": 1661} {"train_loss": -12.153372764587402, "global_step": 279145, "epoch": 1661} {"train_loss": -12.155596733093262, "global_step": 279146, "epoch": 1661} {"train_loss": -12.11410903930664, "global_step": 279147, "epoch": 1661} {"train_loss": -11.90179443359375, "global_step": 279148, "epoch": 1661} {"train_loss": -12.103586196899414, "global_step": 279149, "epoch": 1661} {"train_loss": -12.366270065307617, "global_step": 279150, "epoch": 1661} {"train_loss": -12.10572338104248, "global_step": 279151, "epoch": 1661} {"train_loss": -12.213032722473145, "global_step": 279152, "epoch": 1661} {"train_loss": -11.874394416809082, "global_step": 279153, "epoch": 1661} {"train_loss": -11.668272972106934, "global_step": 279154, "epoch": 1661} {"train_loss": -11.769246101379395, "global_step": 279155, "epoch": 1661} {"train_loss": -12.319093704223633, "global_step": 279156, "epoch": 1661} {"train_loss": -11.956708908081055, "global_step": 279157, "epoch": 1661} {"train_loss": -11.99966812133789, "global_step": 279158, "epoch": 1661} {"train_loss": -12.03158950805664, "global_step": 279159, "epoch": 1661} {"train_loss": -12.019826889038086, "global_step": 279160, "epoch": 1661} {"train_loss": -11.905176162719727, "global_step": 279161, "epoch": 1661} {"train_loss": -12.056713104248047, "global_step": 279162, "epoch": 1661} {"train_loss": -12.341489791870117, "global_step": 279163, "epoch": 1661} {"train_loss": -11.838401794433594, "global_step": 279164, "epoch": 1661} {"train_loss": -11.552443504333496, "global_step": 279165, "epoch": 1661} {"train_loss": -11.910993576049805, "global_step": 279166, "epoch": 1661} {"train_loss": -12.229072570800781, "global_step": 279167, "epoch": 1661} {"train_loss": -11.738224029541016, "global_step": 279168, "epoch": 1661} {"train_loss": -11.54401683807373, "global_step": 279169, "epoch": 1661} {"train_loss": -11.236472129821777, "global_step": 279170, "epoch": 1661} {"train_loss": -11.407699584960938, "global_step": 279171, "epoch": 1661} {"train_loss": -11.20509147644043, "global_step": 279172, "epoch": 1661} {"train_loss": -10.912065505981445, "global_step": 279173, "epoch": 1661} {"train_loss": -12.029190063476562, "global_step": 279174, "epoch": 1661} {"train_loss": -10.248394012451172, "global_step": 279175, "epoch": 1661} {"train_loss": -11.229002952575684, "global_step": 279176, "epoch": 1661} {"train_loss": -11.870594024658203, "global_step": 279177, "epoch": 1661} {"train_loss": -11.812488555908203, "global_step": 279178, "epoch": 1661} {"train_loss": -11.058633804321289, "global_step": 279179, "epoch": 1661} {"train_loss": -11.19056224822998, "global_step": 279180, "epoch": 1661} {"train_loss": -11.996871948242188, "global_step": 279181, "epoch": 1661} {"train_loss": -11.265801429748535, "global_step": 279182, "epoch": 1661} {"train_loss": -10.174039840698242, "global_step": 279183, "epoch": 1661} {"train_loss": -10.994041442871094, "global_step": 279184, "epoch": 1661} {"train_loss": -11.072751998901367, "global_step": 279185, "epoch": 1661} {"train_loss": -11.25515079498291, "global_step": 279186, "epoch": 1661} {"train_loss": -11.39284610748291, "global_step": 279187, "epoch": 1661} {"train_loss": -10.912522315979004, "global_step": 279188, "epoch": 1661} {"train_loss": -11.55413818359375, "global_step": 279189, "epoch": 1661} {"train_loss": -10.145044326782227, "global_step": 279190, "epoch": 1661} {"train_loss": -11.26230239868164, "global_step": 279191, "epoch": 1661} {"train_loss": -10.914320945739746, "global_step": 279192, "epoch": 1661} {"train_loss": -10.904068946838379, "global_step": 279193, "epoch": 1661} {"train_loss": -11.422823905944824, "global_step": 279194, "epoch": 1661} {"train_loss": -11.052937507629395, "global_step": 279195, "epoch": 1661} {"train_loss": -11.121203422546387, "global_step": 279196, "epoch": 1661} {"train_loss": -10.821786880493164, "global_step": 279197, "epoch": 1661} {"train_loss": -10.9817476272583, "global_step": 279198, "epoch": 1661} {"train_loss": -11.15206527709961, "global_step": 279199, "epoch": 1661} {"train_loss": -10.394674301147461, "global_step": 279200, "epoch": 1661} {"train_loss": -11.506473541259766, "global_step": 279201, "epoch": 1661} {"train_loss": -11.219539642333984, "global_step": 279202, "epoch": 1661} {"train_loss": -11.182680130004883, "global_step": 279203, "epoch": 1661} {"train_loss": -11.708642959594727, "global_step": 279204, "epoch": 1661} {"train_loss": -10.728288650512695, "global_step": 279205, "epoch": 1661} {"train_loss": -11.744475364685059, "global_step": 279206, "epoch": 1661} {"train_loss": -10.795768737792969, "global_step": 279207, "epoch": 1661} {"train_loss": -11.572212219238281, "global_step": 279208, "epoch": 1661} {"train_loss": -10.64144515991211, "global_step": 279209, "epoch": 1661} {"train_loss": -11.492581367492676, "global_step": 279210, "epoch": 1661} {"train_loss": -10.659173965454102, "global_step": 279211, "epoch": 1661} {"train_loss": -11.693241119384766, "global_step": 279212, "epoch": 1661} {"train_loss": -10.626968383789062, "global_step": 279213, "epoch": 1661} {"train_loss": -11.08968734741211, "global_step": 279214, "epoch": 1661} {"train_loss": -11.415035372688656, "global_step": 279215, "epoch": 1661, "val_loss": 277913.5} {"train_loss": -11.040507316589355, "global_step": 279216, "epoch": 1662} {"train_loss": -10.984769821166992, "global_step": 279217, "epoch": 1662} {"train_loss": -11.1264066696167, "global_step": 279218, "epoch": 1662} {"train_loss": -11.401850700378418, "global_step": 279219, "epoch": 1662} {"train_loss": -11.063282012939453, "global_step": 279220, "epoch": 1662} {"train_loss": -11.213147163391113, "global_step": 279221, "epoch": 1662} {"train_loss": -10.781341552734375, "global_step": 279222, "epoch": 1662} {"train_loss": -10.800495147705078, "global_step": 279223, "epoch": 1662} {"train_loss": -11.275179862976074, "global_step": 279224, "epoch": 1662} {"train_loss": -10.821433067321777, "global_step": 279225, "epoch": 1662} {"train_loss": -11.363718032836914, "global_step": 279226, "epoch": 1662} {"train_loss": -11.126031875610352, "global_step": 279227, "epoch": 1662} {"train_loss": -11.13000202178955, "global_step": 279228, "epoch": 1662} {"train_loss": -11.423454284667969, "global_step": 279229, "epoch": 1662} {"train_loss": -11.304656982421875, "global_step": 279230, "epoch": 1662} {"train_loss": -11.350775718688965, "global_step": 279231, "epoch": 1662} {"train_loss": -11.94886302947998, "global_step": 279232, "epoch": 1662} {"train_loss": -10.977582931518555, "global_step": 279233, "epoch": 1662} {"train_loss": -11.72836685180664, "global_step": 279234, "epoch": 1662} {"train_loss": -11.46723747253418, "global_step": 279235, "epoch": 1662} {"train_loss": -11.652265548706055, "global_step": 279236, "epoch": 1662} {"train_loss": -11.667439460754395, "global_step": 279237, "epoch": 1662} {"train_loss": -11.543268203735352, "global_step": 279238, "epoch": 1662} {"train_loss": -11.721315383911133, "global_step": 279239, "epoch": 1662} {"train_loss": -11.621570587158203, "global_step": 279240, "epoch": 1662} {"train_loss": -11.690832138061523, "global_step": 279241, "epoch": 1662} {"train_loss": -11.735533714294434, "global_step": 279242, "epoch": 1662} {"train_loss": -11.796897888183594, "global_step": 279243, "epoch": 1662} {"train_loss": -11.819742202758789, "global_step": 279244, "epoch": 1662} {"train_loss": -11.845117568969727, "global_step": 279245, "epoch": 1662} {"train_loss": -11.919877052307129, "global_step": 279246, "epoch": 1662} {"train_loss": -12.027961730957031, "global_step": 279247, "epoch": 1662} {"train_loss": -11.849562644958496, "global_step": 279248, "epoch": 1662} {"train_loss": -11.970697402954102, "global_step": 279249, "epoch": 1662} {"train_loss": -11.769454002380371, "global_step": 279250, "epoch": 1662} {"train_loss": -11.854125022888184, "global_step": 279251, "epoch": 1662} {"train_loss": -12.048882484436035, "global_step": 279252, "epoch": 1662} {"train_loss": -11.818675994873047, "global_step": 279253, "epoch": 1662} {"train_loss": -12.064687728881836, "global_step": 279254, "epoch": 1662} {"train_loss": -11.803543090820312, "global_step": 279255, "epoch": 1662} {"train_loss": -12.10108757019043, "global_step": 279256, "epoch": 1662} {"train_loss": -11.672323226928711, "global_step": 279257, "epoch": 1662} {"train_loss": -11.607210159301758, "global_step": 279258, "epoch": 1662} {"train_loss": -11.973943710327148, "global_step": 279259, "epoch": 1662} {"train_loss": -11.873021125793457, "global_step": 279260, "epoch": 1662} {"train_loss": -12.032333374023438, "global_step": 279261, "epoch": 1662} {"train_loss": -11.753493309020996, "global_step": 279262, "epoch": 1662} {"train_loss": -12.204338073730469, "global_step": 279263, "epoch": 1662} {"train_loss": -11.560234069824219, "global_step": 279264, "epoch": 1662} {"train_loss": -11.827363967895508, "global_step": 279265, "epoch": 1662} {"train_loss": -11.936028480529785, "global_step": 279266, "epoch": 1662} {"train_loss": -11.69087028503418, "global_step": 279267, "epoch": 1662} {"train_loss": -11.731857299804688, "global_step": 279268, "epoch": 1662} {"train_loss": -11.67216968536377, "global_step": 279269, "epoch": 1662} {"train_loss": -11.604308128356934, "global_step": 279270, "epoch": 1662} {"train_loss": -11.59115219116211, "global_step": 279271, "epoch": 1662} {"train_loss": -11.807943344116211, "global_step": 279272, "epoch": 1662} {"train_loss": -11.806346893310547, "global_step": 279273, "epoch": 1662} {"train_loss": -12.140266418457031, "global_step": 279274, "epoch": 1662} {"train_loss": -11.852602005004883, "global_step": 279275, "epoch": 1662} {"train_loss": -12.102306365966797, "global_step": 279276, "epoch": 1662} {"train_loss": -11.783706665039062, "global_step": 279277, "epoch": 1662} {"train_loss": -12.212738990783691, "global_step": 279278, "epoch": 1662} {"train_loss": -11.981689453125, "global_step": 279279, "epoch": 1662} {"train_loss": -12.19437026977539, "global_step": 279280, "epoch": 1662} {"train_loss": -12.174993515014648, "global_step": 279281, "epoch": 1662} {"train_loss": -12.08224105834961, "global_step": 279282, "epoch": 1662} {"train_loss": -12.009624481201172, "global_step": 279283, "epoch": 1662} {"train_loss": -12.219079971313477, "global_step": 279284, "epoch": 1662} {"train_loss": -12.069347381591797, "global_step": 279285, "epoch": 1662} {"train_loss": -12.262331008911133, "global_step": 279286, "epoch": 1662} {"train_loss": -12.387967109680176, "global_step": 279287, "epoch": 1662} {"train_loss": -12.300843238830566, "global_step": 279288, "epoch": 1662} {"train_loss": -12.137354850769043, "global_step": 279289, "epoch": 1662} {"train_loss": -12.351408004760742, "global_step": 279290, "epoch": 1662} {"train_loss": -12.174999237060547, "global_step": 279291, "epoch": 1662} {"train_loss": -12.0033597946167, "global_step": 279292, "epoch": 1662} {"train_loss": -12.027762413024902, "global_step": 279293, "epoch": 1662} {"train_loss": -12.384560585021973, "global_step": 279294, "epoch": 1662} {"train_loss": -11.906988143920898, "global_step": 279295, "epoch": 1662} {"train_loss": -11.952022552490234, "global_step": 279296, "epoch": 1662} {"train_loss": -11.880045890808105, "global_step": 279297, "epoch": 1662} {"train_loss": -12.235238075256348, "global_step": 279298, "epoch": 1662} {"train_loss": -12.121652603149414, "global_step": 279299, "epoch": 1662} {"train_loss": -11.130783081054688, "global_step": 279300, "epoch": 1662} {"train_loss": -12.297534942626953, "global_step": 279301, "epoch": 1662} {"train_loss": -11.805793762207031, "global_step": 279302, "epoch": 1662} {"train_loss": -11.908527374267578, "global_step": 279303, "epoch": 1662} {"train_loss": -11.689284324645996, "global_step": 279304, "epoch": 1662} {"train_loss": -12.154969215393066, "global_step": 279305, "epoch": 1662} {"train_loss": -11.607370376586914, "global_step": 279306, "epoch": 1662} {"train_loss": -11.992708206176758, "global_step": 279307, "epoch": 1662} {"train_loss": -11.863237380981445, "global_step": 279308, "epoch": 1662} {"train_loss": -12.029674530029297, "global_step": 279309, "epoch": 1662} {"train_loss": -12.113948822021484, "global_step": 279310, "epoch": 1662} {"train_loss": -12.380634307861328, "global_step": 279311, "epoch": 1662} {"train_loss": -11.864099502563477, "global_step": 279312, "epoch": 1662} {"train_loss": -12.021047592163086, "global_step": 279313, "epoch": 1662} {"train_loss": -12.307547569274902, "global_step": 279314, "epoch": 1662} {"train_loss": -12.37863826751709, "global_step": 279315, "epoch": 1662} {"train_loss": -12.187068939208984, "global_step": 279316, "epoch": 1662} {"train_loss": -12.184976577758789, "global_step": 279317, "epoch": 1662} {"train_loss": -12.309626579284668, "global_step": 279318, "epoch": 1662} {"train_loss": -12.261198997497559, "global_step": 279319, "epoch": 1662} {"train_loss": -12.239076614379883, "global_step": 279320, "epoch": 1662} {"train_loss": -12.263322830200195, "global_step": 279321, "epoch": 1662} {"train_loss": -11.826351165771484, "global_step": 279322, "epoch": 1662} {"train_loss": -12.177837371826172, "global_step": 279323, "epoch": 1662} {"train_loss": -12.170997619628906, "global_step": 279324, "epoch": 1662} {"train_loss": -12.47964859008789, "global_step": 279325, "epoch": 1662} {"train_loss": -12.292425155639648, "global_step": 279326, "epoch": 1662} {"train_loss": -12.214293479919434, "global_step": 279327, "epoch": 1662} {"train_loss": -12.283766746520996, "global_step": 279328, "epoch": 1662} {"train_loss": -12.287464141845703, "global_step": 279329, "epoch": 1662} {"train_loss": -12.347443580627441, "global_step": 279330, "epoch": 1662} {"train_loss": -12.364381790161133, "global_step": 279331, "epoch": 1662} {"train_loss": -11.765220642089844, "global_step": 279332, "epoch": 1662} {"train_loss": -12.426065444946289, "global_step": 279333, "epoch": 1662} {"train_loss": -11.997840881347656, "global_step": 279334, "epoch": 1662} {"train_loss": -12.239739418029785, "global_step": 279335, "epoch": 1662} {"train_loss": -11.879409790039062, "global_step": 279336, "epoch": 1662} {"train_loss": -11.890327453613281, "global_step": 279337, "epoch": 1662} {"train_loss": -11.61484432220459, "global_step": 279338, "epoch": 1662} {"train_loss": -12.216374397277832, "global_step": 279339, "epoch": 1662} {"train_loss": -11.901390075683594, "global_step": 279340, "epoch": 1662} {"train_loss": -11.922720909118652, "global_step": 279341, "epoch": 1662} {"train_loss": -11.457148551940918, "global_step": 279342, "epoch": 1662} {"train_loss": -10.904060363769531, "global_step": 279343, "epoch": 1662} {"train_loss": -11.757232666015625, "global_step": 279344, "epoch": 1662} {"train_loss": -11.116279602050781, "global_step": 279345, "epoch": 1662} {"train_loss": -11.594283103942871, "global_step": 279346, "epoch": 1662} {"train_loss": -10.714208602905273, "global_step": 279347, "epoch": 1662} {"train_loss": -11.887971878051758, "global_step": 279348, "epoch": 1662} {"train_loss": -11.053229331970215, "global_step": 279349, "epoch": 1662} {"train_loss": -12.110455513000488, "global_step": 279350, "epoch": 1662} {"train_loss": -11.676654815673828, "global_step": 279351, "epoch": 1662} {"train_loss": -11.347297668457031, "global_step": 279352, "epoch": 1662} {"train_loss": -11.12139892578125, "global_step": 279353, "epoch": 1662} {"train_loss": -11.753118515014648, "global_step": 279354, "epoch": 1662} {"train_loss": -10.996915817260742, "global_step": 279355, "epoch": 1662} {"train_loss": -11.70930004119873, "global_step": 279356, "epoch": 1662} {"train_loss": -11.118005752563477, "global_step": 279357, "epoch": 1662} {"train_loss": -11.399565696716309, "global_step": 279358, "epoch": 1662} {"train_loss": -10.883197784423828, "global_step": 279359, "epoch": 1662} {"train_loss": -11.913775444030762, "global_step": 279360, "epoch": 1662} {"train_loss": -11.294181823730469, "global_step": 279361, "epoch": 1662} {"train_loss": -11.233175277709961, "global_step": 279362, "epoch": 1662} {"train_loss": -11.384197235107422, "global_step": 279363, "epoch": 1662} {"train_loss": -11.250126838684082, "global_step": 279364, "epoch": 1662} {"train_loss": -10.94962215423584, "global_step": 279365, "epoch": 1662} {"train_loss": -11.165077209472656, "global_step": 279366, "epoch": 1662} {"train_loss": -11.339778900146484, "global_step": 279367, "epoch": 1662} {"train_loss": -10.878941535949707, "global_step": 279368, "epoch": 1662} {"train_loss": -11.897706031799316, "global_step": 279369, "epoch": 1662} {"train_loss": -11.429696083068848, "global_step": 279370, "epoch": 1662} {"train_loss": -11.483492851257324, "global_step": 279371, "epoch": 1662} {"train_loss": -11.72909927368164, "global_step": 279372, "epoch": 1662} {"train_loss": -11.998897552490234, "global_step": 279373, "epoch": 1662} {"train_loss": -11.644718170166016, "global_step": 279374, "epoch": 1662} {"train_loss": -11.62537670135498, "global_step": 279375, "epoch": 1662} {"train_loss": -11.54334545135498, "global_step": 279376, "epoch": 1662} {"train_loss": -11.58575439453125, "global_step": 279377, "epoch": 1662} {"train_loss": -11.293533325195312, "global_step": 279378, "epoch": 1662} {"train_loss": -11.569463729858398, "global_step": 279379, "epoch": 1662} {"train_loss": -11.62507438659668, "global_step": 279380, "epoch": 1662} {"train_loss": -11.503788948059082, "global_step": 279381, "epoch": 1662} {"train_loss": -11.454798698425293, "global_step": 279382, "epoch": 1662} {"train_loss": -11.758753487042018, "global_step": 279383, "epoch": 1662, "val_loss": 278316.09375} {"train_loss": -11.182870864868164, "global_step": 279384, "epoch": 1663} {"train_loss": -11.282455444335938, "global_step": 279385, "epoch": 1663} {"train_loss": -11.488181114196777, "global_step": 279386, "epoch": 1663} {"train_loss": -11.244241714477539, "global_step": 279387, "epoch": 1663} {"train_loss": -11.948343276977539, "global_step": 279388, "epoch": 1663} {"train_loss": -11.594709396362305, "global_step": 279389, "epoch": 1663} {"train_loss": -11.8212308883667, "global_step": 279390, "epoch": 1663} {"train_loss": -11.916468620300293, "global_step": 279391, "epoch": 1663} {"train_loss": -11.555479049682617, "global_step": 279392, "epoch": 1663} {"train_loss": -11.829126358032227, "global_step": 279393, "epoch": 1663} {"train_loss": -11.811692237854004, "global_step": 279394, "epoch": 1663} {"train_loss": -11.821657180786133, "global_step": 279395, "epoch": 1663} {"train_loss": -11.71441650390625, "global_step": 279396, "epoch": 1663} {"train_loss": -11.380542755126953, "global_step": 279397, "epoch": 1663} {"train_loss": -11.593454360961914, "global_step": 279398, "epoch": 1663} {"train_loss": -11.913604736328125, "global_step": 279399, "epoch": 1663} {"train_loss": -11.952083587646484, "global_step": 279400, "epoch": 1663} {"train_loss": -11.780238151550293, "global_step": 279401, "epoch": 1663} {"train_loss": -11.822509765625, "global_step": 279402, "epoch": 1663} {"train_loss": -12.113485336303711, "global_step": 279403, "epoch": 1663} {"train_loss": -11.87117862701416, "global_step": 279404, "epoch": 1663} {"train_loss": -11.894989967346191, "global_step": 279405, "epoch": 1663} {"train_loss": -11.899810791015625, "global_step": 279406, "epoch": 1663} {"train_loss": -11.517948150634766, "global_step": 279407, "epoch": 1663} {"train_loss": -12.25075912475586, "global_step": 279408, "epoch": 1663} {"train_loss": -11.965319633483887, "global_step": 279409, "epoch": 1663} {"train_loss": -11.948219299316406, "global_step": 279410, "epoch": 1663} {"train_loss": -12.127310752868652, "global_step": 279411, "epoch": 1663} {"train_loss": -11.997819900512695, "global_step": 279412, "epoch": 1663} {"train_loss": -11.927505493164062, "global_step": 279413, "epoch": 1663} {"train_loss": -11.967378616333008, "global_step": 279414, "epoch": 1663} {"train_loss": -12.039796829223633, "global_step": 279415, "epoch": 1663} {"train_loss": -12.210747718811035, "global_step": 279416, "epoch": 1663} {"train_loss": -12.20750904083252, "global_step": 279417, "epoch": 1663} {"train_loss": -12.114873886108398, "global_step": 279418, "epoch": 1663} {"train_loss": -12.09272575378418, "global_step": 279419, "epoch": 1663} {"train_loss": -11.990135192871094, "global_step": 279420, "epoch": 1663} {"train_loss": -12.131163597106934, "global_step": 279421, "epoch": 1663} {"train_loss": -11.64931869506836, "global_step": 279422, "epoch": 1663} {"train_loss": -12.175192832946777, "global_step": 279423, "epoch": 1663} {"train_loss": -11.769966125488281, "global_step": 279424, "epoch": 1663} {"train_loss": -11.882740020751953, "global_step": 279425, "epoch": 1663} {"train_loss": -12.03302001953125, "global_step": 279426, "epoch": 1663} {"train_loss": -11.862506866455078, "global_step": 279427, "epoch": 1663} {"train_loss": -11.933526039123535, "global_step": 279428, "epoch": 1663} {"train_loss": -11.76738166809082, "global_step": 279429, "epoch": 1663} {"train_loss": -11.747053146362305, "global_step": 279430, "epoch": 1663} {"train_loss": -12.138483047485352, "global_step": 279431, "epoch": 1663} {"train_loss": -11.658857345581055, "global_step": 279432, "epoch": 1663} {"train_loss": -11.501508712768555, "global_step": 279433, "epoch": 1663} {"train_loss": -11.957573890686035, "global_step": 279434, "epoch": 1663} {"train_loss": -11.94686222076416, "global_step": 279435, "epoch": 1663} {"train_loss": -11.006918907165527, "global_step": 279436, "epoch": 1663} {"train_loss": -12.26382827758789, "global_step": 279437, "epoch": 1663} {"train_loss": -11.647205352783203, "global_step": 279438, "epoch": 1663} {"train_loss": -11.96634578704834, "global_step": 279439, "epoch": 1663} {"train_loss": -11.709423065185547, "global_step": 279440, "epoch": 1663} {"train_loss": -11.886435508728027, "global_step": 279441, "epoch": 1663} {"train_loss": -11.52549934387207, "global_step": 279442, "epoch": 1663} {"train_loss": -11.890892028808594, "global_step": 279443, "epoch": 1663} {"train_loss": -11.622089385986328, "global_step": 279444, "epoch": 1663} {"train_loss": -11.798730850219727, "global_step": 279445, "epoch": 1663} {"train_loss": -11.845621109008789, "global_step": 279446, "epoch": 1663} {"train_loss": -12.15536117553711, "global_step": 279447, "epoch": 1663} {"train_loss": -11.961341857910156, "global_step": 279448, "epoch": 1663} {"train_loss": -12.248237609863281, "global_step": 279449, "epoch": 1663} {"train_loss": -12.14455795288086, "global_step": 279450, "epoch": 1663} {"train_loss": -11.891746520996094, "global_step": 279451, "epoch": 1663} {"train_loss": -12.179657936096191, "global_step": 279452, "epoch": 1663} {"train_loss": -11.956588745117188, "global_step": 279453, "epoch": 1663} {"train_loss": -11.45380973815918, "global_step": 279454, "epoch": 1663} {"train_loss": -11.177530288696289, "global_step": 279455, "epoch": 1663} {"train_loss": -11.369172096252441, "global_step": 279456, "epoch": 1663} {"train_loss": -9.919282913208008, "global_step": 279457, "epoch": 1663} {"train_loss": -11.232725143432617, "global_step": 279458, "epoch": 1663} {"train_loss": -11.410582542419434, "global_step": 279459, "epoch": 1663} {"train_loss": -10.42403507232666, "global_step": 279460, "epoch": 1663} {"train_loss": -11.697083473205566, "global_step": 279461, "epoch": 1663} {"train_loss": -10.432290077209473, "global_step": 279462, "epoch": 1663} {"train_loss": -10.653888702392578, "global_step": 279463, "epoch": 1663} {"train_loss": -11.376811981201172, "global_step": 279464, "epoch": 1663} {"train_loss": -10.484920501708984, "global_step": 279465, "epoch": 1663} {"train_loss": -10.868892669677734, "global_step": 279466, "epoch": 1663} {"train_loss": -12.017748832702637, "global_step": 279467, "epoch": 1663} {"train_loss": -10.481908798217773, "global_step": 279468, "epoch": 1663} {"train_loss": -12.050027847290039, "global_step": 279469, "epoch": 1663} {"train_loss": -9.818992614746094, "global_step": 279470, "epoch": 1663} {"train_loss": -11.678962707519531, "global_step": 279471, "epoch": 1663} {"train_loss": -10.160531044006348, "global_step": 279472, "epoch": 1663} {"train_loss": -11.256372451782227, "global_step": 279473, "epoch": 1663} {"train_loss": -10.739013671875, "global_step": 279474, "epoch": 1663} {"train_loss": -10.97551155090332, "global_step": 279475, "epoch": 1663} {"train_loss": -11.246331214904785, "global_step": 279476, "epoch": 1663} {"train_loss": -10.51834774017334, "global_step": 279477, "epoch": 1663} {"train_loss": -11.492237091064453, "global_step": 279478, "epoch": 1663} {"train_loss": -10.335994720458984, "global_step": 279479, "epoch": 1663} {"train_loss": -11.292440414428711, "global_step": 279480, "epoch": 1663} {"train_loss": -11.484277725219727, "global_step": 279481, "epoch": 1663} {"train_loss": -11.333303451538086, "global_step": 279482, "epoch": 1663} {"train_loss": -10.89200210571289, "global_step": 279483, "epoch": 1663} {"train_loss": -10.74487590789795, "global_step": 279484, "epoch": 1663} {"train_loss": -11.070272445678711, "global_step": 279485, "epoch": 1663} {"train_loss": -9.94343376159668, "global_step": 279486, "epoch": 1663} {"train_loss": -10.597440719604492, "global_step": 279487, "epoch": 1663} {"train_loss": -10.753743171691895, "global_step": 279488, "epoch": 1663} {"train_loss": -10.93753433227539, "global_step": 279489, "epoch": 1663} {"train_loss": -11.241952896118164, "global_step": 279490, "epoch": 1663} {"train_loss": -11.062633514404297, "global_step": 279491, "epoch": 1663} {"train_loss": -11.115340232849121, "global_step": 279492, "epoch": 1663} {"train_loss": -11.498123168945312, "global_step": 279493, "epoch": 1663} {"train_loss": -11.500505447387695, "global_step": 279494, "epoch": 1663} {"train_loss": -11.5086088180542, "global_step": 279495, "epoch": 1663} {"train_loss": -11.349370002746582, "global_step": 279496, "epoch": 1663} {"train_loss": -11.126380920410156, "global_step": 279497, "epoch": 1663} {"train_loss": -11.538415908813477, "global_step": 279498, "epoch": 1663} {"train_loss": -11.503828048706055, "global_step": 279499, "epoch": 1663} {"train_loss": -11.461959838867188, "global_step": 279500, "epoch": 1663} {"train_loss": -11.838624954223633, "global_step": 279501, "epoch": 1663} {"train_loss": -11.82078742980957, "global_step": 279502, "epoch": 1663} {"train_loss": -11.72400188446045, "global_step": 279503, "epoch": 1663} {"train_loss": -11.716991424560547, "global_step": 279504, "epoch": 1663} {"train_loss": -11.858173370361328, "global_step": 279505, "epoch": 1663} {"train_loss": -11.925979614257812, "global_step": 279506, "epoch": 1663} {"train_loss": -11.924701690673828, "global_step": 279507, "epoch": 1663} {"train_loss": -11.94692325592041, "global_step": 279508, "epoch": 1663} {"train_loss": -11.9872465133667, "global_step": 279509, "epoch": 1663} {"train_loss": -11.80105972290039, "global_step": 279510, "epoch": 1663} {"train_loss": -11.905298233032227, "global_step": 279511, "epoch": 1663} {"train_loss": -12.065826416015625, "global_step": 279512, "epoch": 1663} {"train_loss": -11.94610595703125, "global_step": 279513, "epoch": 1663} {"train_loss": -11.903030395507812, "global_step": 279514, "epoch": 1663} {"train_loss": -12.012168884277344, "global_step": 279515, "epoch": 1663} {"train_loss": -11.980071067810059, "global_step": 279516, "epoch": 1663} {"train_loss": -12.084086418151855, "global_step": 279517, "epoch": 1663} {"train_loss": -12.101164817810059, "global_step": 279518, "epoch": 1663} {"train_loss": -12.186599731445312, "global_step": 279519, "epoch": 1663} {"train_loss": -12.076562881469727, "global_step": 279520, "epoch": 1663} {"train_loss": -11.948229789733887, "global_step": 279521, "epoch": 1663} {"train_loss": -11.967766761779785, "global_step": 279522, "epoch": 1663} {"train_loss": -11.838314056396484, "global_step": 279523, "epoch": 1663} {"train_loss": -12.296005249023438, "global_step": 279524, "epoch": 1663} {"train_loss": -11.923798561096191, "global_step": 279525, "epoch": 1663} {"train_loss": -12.140872955322266, "global_step": 279526, "epoch": 1663} {"train_loss": -12.177465438842773, "global_step": 279527, "epoch": 1663} {"train_loss": -12.196403503417969, "global_step": 279528, "epoch": 1663} {"train_loss": -12.12553596496582, "global_step": 279529, "epoch": 1663} {"train_loss": -12.299385070800781, "global_step": 279530, "epoch": 1663} {"train_loss": -12.311911582946777, "global_step": 279531, "epoch": 1663} {"train_loss": -12.27316951751709, "global_step": 279532, "epoch": 1663} {"train_loss": -12.168707847595215, "global_step": 279533, "epoch": 1663} {"train_loss": -12.088336944580078, "global_step": 279534, "epoch": 1663} {"train_loss": -12.21347713470459, "global_step": 279535, "epoch": 1663} {"train_loss": -12.225542068481445, "global_step": 279536, "epoch": 1663} {"train_loss": -12.364337921142578, "global_step": 279537, "epoch": 1663} {"train_loss": -12.273422241210938, "global_step": 279538, "epoch": 1663} {"train_loss": -12.207121849060059, "global_step": 279539, "epoch": 1663} {"train_loss": -12.454532623291016, "global_step": 279540, "epoch": 1663} {"train_loss": -12.165937423706055, "global_step": 279541, "epoch": 1663} {"train_loss": -12.338142395019531, "global_step": 279542, "epoch": 1663} {"train_loss": -12.299352645874023, "global_step": 279543, "epoch": 1663} {"train_loss": -12.162626266479492, "global_step": 279544, "epoch": 1663} {"train_loss": -12.268938064575195, "global_step": 279545, "epoch": 1663} {"train_loss": -12.457435607910156, "global_step": 279546, "epoch": 1663} {"train_loss": -11.726503372192383, "global_step": 279547, "epoch": 1663} {"train_loss": -11.978515625, "global_step": 279548, "epoch": 1663} {"train_loss": -12.10824966430664, "global_step": 279549, "epoch": 1663} {"train_loss": -12.278697967529297, "global_step": 279550, "epoch": 1663} {"train_loss": -11.696844441550118, "global_step": 279551, "epoch": 1663, "val_loss": 276424.125} {"train_loss": -12.196495056152344, "global_step": 279552, "epoch": 1664} {"train_loss": -12.077278137207031, "global_step": 279553, "epoch": 1664} {"train_loss": -12.185628890991211, "global_step": 279554, "epoch": 1664} {"train_loss": -12.254777908325195, "global_step": 279555, "epoch": 1664} {"train_loss": -11.658382415771484, "global_step": 279556, "epoch": 1664} {"train_loss": -11.665868759155273, "global_step": 279557, "epoch": 1664} {"train_loss": -12.138733863830566, "global_step": 279558, "epoch": 1664} {"train_loss": -11.897727966308594, "global_step": 279559, "epoch": 1664} {"train_loss": -11.426471710205078, "global_step": 279560, "epoch": 1664} {"train_loss": -11.406536102294922, "global_step": 279561, "epoch": 1664} {"train_loss": -11.747392654418945, "global_step": 279562, "epoch": 1664} {"train_loss": -11.954858779907227, "global_step": 279563, "epoch": 1664} {"train_loss": -10.430837631225586, "global_step": 279564, "epoch": 1664} {"train_loss": -10.765459060668945, "global_step": 279565, "epoch": 1664} {"train_loss": -11.821290969848633, "global_step": 279566, "epoch": 1664} {"train_loss": -9.969313621520996, "global_step": 279567, "epoch": 1664} {"train_loss": -11.083444595336914, "global_step": 279568, "epoch": 1664} {"train_loss": -8.902986526489258, "global_step": 279569, "epoch": 1664} {"train_loss": -9.603202819824219, "global_step": 279570, "epoch": 1664} {"train_loss": -8.26963996887207, "global_step": 279571, "epoch": 1664} {"train_loss": -8.487747192382812, "global_step": 279572, "epoch": 1664} {"train_loss": -9.275375366210938, "global_step": 279573, "epoch": 1664} {"train_loss": -10.93649959564209, "global_step": 279574, "epoch": 1664} {"train_loss": -8.939091682434082, "global_step": 279575, "epoch": 1664} {"train_loss": -9.84605598449707, "global_step": 279576, "epoch": 1664} {"train_loss": -9.910734176635742, "global_step": 279577, "epoch": 1664} {"train_loss": -10.089197158813477, "global_step": 279578, "epoch": 1664} {"train_loss": -10.29292106628418, "global_step": 279579, "epoch": 1664} {"train_loss": -9.974160194396973, "global_step": 279580, "epoch": 1664} {"train_loss": -10.530106544494629, "global_step": 279581, "epoch": 1664} {"train_loss": -10.378937721252441, "global_step": 279582, "epoch": 1664} {"train_loss": -10.430604934692383, "global_step": 279583, "epoch": 1664} {"train_loss": -10.979028701782227, "global_step": 279584, "epoch": 1664} {"train_loss": -10.361326217651367, "global_step": 279585, "epoch": 1664} {"train_loss": -11.46446418762207, "global_step": 279586, "epoch": 1664} {"train_loss": -11.076658248901367, "global_step": 279587, "epoch": 1664} {"train_loss": -10.899290084838867, "global_step": 279588, "epoch": 1664} {"train_loss": -11.375936508178711, "global_step": 279589, "epoch": 1664} {"train_loss": -10.651273727416992, "global_step": 279590, "epoch": 1664} {"train_loss": -11.417394638061523, "global_step": 279591, "epoch": 1664} {"train_loss": -11.68175220489502, "global_step": 279592, "epoch": 1664} {"train_loss": -11.255280494689941, "global_step": 279593, "epoch": 1664} {"train_loss": -11.635043144226074, "global_step": 279594, "epoch": 1664} {"train_loss": -11.334636688232422, "global_step": 279595, "epoch": 1664} {"train_loss": -11.511736869812012, "global_step": 279596, "epoch": 1664} {"train_loss": -10.917288780212402, "global_step": 279597, "epoch": 1664} {"train_loss": -11.687252044677734, "global_step": 279598, "epoch": 1664} {"train_loss": -11.349655151367188, "global_step": 279599, "epoch": 1664} {"train_loss": -11.478063583374023, "global_step": 279600, "epoch": 1664} {"train_loss": -11.54544448852539, "global_step": 279601, "epoch": 1664} {"train_loss": -11.50918960571289, "global_step": 279602, "epoch": 1664} {"train_loss": -11.857556343078613, "global_step": 279603, "epoch": 1664} {"train_loss": -11.329033851623535, "global_step": 279604, "epoch": 1664} {"train_loss": -11.729381561279297, "global_step": 279605, "epoch": 1664} {"train_loss": -11.189584732055664, "global_step": 279606, "epoch": 1664} {"train_loss": -11.62269401550293, "global_step": 279607, "epoch": 1664} {"train_loss": -11.316070556640625, "global_step": 279608, "epoch": 1664} {"train_loss": -11.884603500366211, "global_step": 279609, "epoch": 1664} {"train_loss": -11.557998657226562, "global_step": 279610, "epoch": 1664} {"train_loss": -11.847785949707031, "global_step": 279611, "epoch": 1664} {"train_loss": -11.81717586517334, "global_step": 279612, "epoch": 1664} {"train_loss": -11.963676452636719, "global_step": 279613, "epoch": 1664} {"train_loss": -11.727579116821289, "global_step": 279614, "epoch": 1664} {"train_loss": -12.00531005859375, "global_step": 279615, "epoch": 1664} {"train_loss": -11.860248565673828, "global_step": 279616, "epoch": 1664} {"train_loss": -11.937976837158203, "global_step": 279617, "epoch": 1664} {"train_loss": -11.994163513183594, "global_step": 279618, "epoch": 1664} {"train_loss": -11.940165519714355, "global_step": 279619, "epoch": 1664} {"train_loss": -12.140079498291016, "global_step": 279620, "epoch": 1664} {"train_loss": -11.773181915283203, "global_step": 279621, "epoch": 1664} {"train_loss": -11.946285247802734, "global_step": 279622, "epoch": 1664} {"train_loss": -11.834190368652344, "global_step": 279623, "epoch": 1664} {"train_loss": -11.824041366577148, "global_step": 279624, "epoch": 1664} {"train_loss": -12.050642013549805, "global_step": 279625, "epoch": 1664} {"train_loss": -11.897989273071289, "global_step": 279626, "epoch": 1664} {"train_loss": -11.994424819946289, "global_step": 279627, "epoch": 1664} {"train_loss": -11.80929946899414, "global_step": 279628, "epoch": 1664} {"train_loss": -12.013931274414062, "global_step": 279629, "epoch": 1664} {"train_loss": -11.78520393371582, "global_step": 279630, "epoch": 1664} {"train_loss": -11.898079872131348, "global_step": 279631, "epoch": 1664} {"train_loss": -12.043449401855469, "global_step": 279632, "epoch": 1664} {"train_loss": -12.187034606933594, "global_step": 279633, "epoch": 1664} {"train_loss": -12.247346878051758, "global_step": 279634, "epoch": 1664} {"train_loss": -12.135274887084961, "global_step": 279635, "epoch": 1664} {"train_loss": -12.207748413085938, "global_step": 279636, "epoch": 1664} {"train_loss": -12.177897453308105, "global_step": 279637, "epoch": 1664} {"train_loss": -12.278404235839844, "global_step": 279638, "epoch": 1664} {"train_loss": -12.029162406921387, "global_step": 279639, "epoch": 1664} {"train_loss": -12.147333145141602, "global_step": 279640, "epoch": 1664} {"train_loss": -12.182083129882812, "global_step": 279641, "epoch": 1664} {"train_loss": -12.058143615722656, "global_step": 279642, "epoch": 1664} {"train_loss": -12.055042266845703, "global_step": 279643, "epoch": 1664} {"train_loss": -11.905476570129395, "global_step": 279644, "epoch": 1664} {"train_loss": -11.764867782592773, "global_step": 279645, "epoch": 1664} {"train_loss": -12.086026191711426, "global_step": 279646, "epoch": 1664} {"train_loss": -12.250452041625977, "global_step": 279647, "epoch": 1664} {"train_loss": -12.037738800048828, "global_step": 279648, "epoch": 1664} {"train_loss": -12.391813278198242, "global_step": 279649, "epoch": 1664} {"train_loss": -12.010666847229004, "global_step": 279650, "epoch": 1664} {"train_loss": -12.138766288757324, "global_step": 279651, "epoch": 1664} {"train_loss": -12.151029586791992, "global_step": 279652, "epoch": 1664} {"train_loss": -12.277137756347656, "global_step": 279653, "epoch": 1664} {"train_loss": -11.948637008666992, "global_step": 279654, "epoch": 1664} {"train_loss": -12.037802696228027, "global_step": 279655, "epoch": 1664} {"train_loss": -12.139777183532715, "global_step": 279656, "epoch": 1664} {"train_loss": -12.019901275634766, "global_step": 279657, "epoch": 1664} {"train_loss": -12.005718231201172, "global_step": 279658, "epoch": 1664} {"train_loss": -11.447250366210938, "global_step": 279659, "epoch": 1664} {"train_loss": -11.823468208312988, "global_step": 279660, "epoch": 1664} {"train_loss": -11.343620300292969, "global_step": 279661, "epoch": 1664} {"train_loss": -11.463685989379883, "global_step": 279662, "epoch": 1664} {"train_loss": -11.462711334228516, "global_step": 279663, "epoch": 1664} {"train_loss": -10.778373718261719, "global_step": 279664, "epoch": 1664} {"train_loss": -11.910003662109375, "global_step": 279665, "epoch": 1664} {"train_loss": -11.339744567871094, "global_step": 279666, "epoch": 1664} {"train_loss": -10.17609691619873, "global_step": 279667, "epoch": 1664} {"train_loss": -11.785284042358398, "global_step": 279668, "epoch": 1664} {"train_loss": -10.272384643554688, "global_step": 279669, "epoch": 1664} {"train_loss": -10.999250411987305, "global_step": 279670, "epoch": 1664} {"train_loss": -10.923135757446289, "global_step": 279671, "epoch": 1664} {"train_loss": -11.341470718383789, "global_step": 279672, "epoch": 1664} {"train_loss": -10.535228729248047, "global_step": 279673, "epoch": 1664} {"train_loss": -9.97245979309082, "global_step": 279674, "epoch": 1664} {"train_loss": -10.312435150146484, "global_step": 279675, "epoch": 1664} {"train_loss": -10.726927757263184, "global_step": 279676, "epoch": 1664} {"train_loss": -8.78774642944336, "global_step": 279677, "epoch": 1664} {"train_loss": -11.037192344665527, "global_step": 279678, "epoch": 1664} {"train_loss": -9.881786346435547, "global_step": 279679, "epoch": 1664} {"train_loss": -11.168331146240234, "global_step": 279680, "epoch": 1664} {"train_loss": -9.930277824401855, "global_step": 279681, "epoch": 1664} {"train_loss": -11.290202140808105, "global_step": 279682, "epoch": 1664} {"train_loss": -10.585264205932617, "global_step": 279683, "epoch": 1664} {"train_loss": -11.537162780761719, "global_step": 279684, "epoch": 1664} {"train_loss": -11.102577209472656, "global_step": 279685, "epoch": 1664} {"train_loss": -11.112306594848633, "global_step": 279686, "epoch": 1664} {"train_loss": -10.856977462768555, "global_step": 279687, "epoch": 1664} {"train_loss": -11.804203987121582, "global_step": 279688, "epoch": 1664} {"train_loss": -10.964698791503906, "global_step": 279689, "epoch": 1664} {"train_loss": -11.862466812133789, "global_step": 279690, "epoch": 1664} {"train_loss": -11.149421691894531, "global_step": 279691, "epoch": 1664} {"train_loss": -11.549816131591797, "global_step": 279692, "epoch": 1664} {"train_loss": -11.686443328857422, "global_step": 279693, "epoch": 1664} {"train_loss": -11.231767654418945, "global_step": 279694, "epoch": 1664} {"train_loss": -11.514577865600586, "global_step": 279695, "epoch": 1664} {"train_loss": -11.6460542678833, "global_step": 279696, "epoch": 1664} {"train_loss": -11.258655548095703, "global_step": 279697, "epoch": 1664} {"train_loss": -11.846813201904297, "global_step": 279698, "epoch": 1664} {"train_loss": -11.303916931152344, "global_step": 279699, "epoch": 1664} {"train_loss": -11.70403003692627, "global_step": 279700, "epoch": 1664} {"train_loss": -11.012317657470703, "global_step": 279701, "epoch": 1664} {"train_loss": -11.322061538696289, "global_step": 279702, "epoch": 1664} {"train_loss": -11.855241775512695, "global_step": 279703, "epoch": 1664} {"train_loss": -11.105106353759766, "global_step": 279704, "epoch": 1664} {"train_loss": -11.604791641235352, "global_step": 279705, "epoch": 1664} {"train_loss": -11.174819946289062, "global_step": 279706, "epoch": 1664} {"train_loss": -11.461366653442383, "global_step": 279707, "epoch": 1664} {"train_loss": -11.477741241455078, "global_step": 279708, "epoch": 1664} {"train_loss": -11.406405448913574, "global_step": 279709, "epoch": 1664} {"train_loss": -11.323497772216797, "global_step": 279710, "epoch": 1664} {"train_loss": -11.82602596282959, "global_step": 279711, "epoch": 1664} {"train_loss": -10.93895149230957, "global_step": 279712, "epoch": 1664} {"train_loss": -11.594718933105469, "global_step": 279713, "epoch": 1664} {"train_loss": -11.152358055114746, "global_step": 279714, "epoch": 1664} {"train_loss": -11.672433853149414, "global_step": 279715, "epoch": 1664} {"train_loss": -11.559885025024414, "global_step": 279716, "epoch": 1664} {"train_loss": -11.613181114196777, "global_step": 279717, "epoch": 1664} {"train_loss": -11.603276252746582, "global_step": 279718, "epoch": 1664} {"train_loss": -11.364183669998532, "global_step": 279719, "epoch": 1664, "val_loss": 276907.9375} {"train_loss": -11.913032531738281, "global_step": 279720, "epoch": 1665} {"train_loss": -11.729608535766602, "global_step": 279721, "epoch": 1665} {"train_loss": -12.0562744140625, "global_step": 279722, "epoch": 1665} {"train_loss": -11.827410697937012, "global_step": 279723, "epoch": 1665} {"train_loss": -11.973699569702148, "global_step": 279724, "epoch": 1665} {"train_loss": -12.05807876586914, "global_step": 279725, "epoch": 1665} {"train_loss": -11.943561553955078, "global_step": 279726, "epoch": 1665} {"train_loss": -12.026432037353516, "global_step": 279727, "epoch": 1665} {"train_loss": -11.872161865234375, "global_step": 279728, "epoch": 1665} {"train_loss": -12.069681167602539, "global_step": 279729, "epoch": 1665} {"train_loss": -11.969552993774414, "global_step": 279730, "epoch": 1665} {"train_loss": -11.940340995788574, "global_step": 279731, "epoch": 1665} {"train_loss": -12.134706497192383, "global_step": 279732, "epoch": 1665} {"train_loss": -12.030431747436523, "global_step": 279733, "epoch": 1665} {"train_loss": -12.064289093017578, "global_step": 279734, "epoch": 1665} {"train_loss": -12.064115524291992, "global_step": 279735, "epoch": 1665} {"train_loss": -12.009063720703125, "global_step": 279736, "epoch": 1665} {"train_loss": -11.915618896484375, "global_step": 279737, "epoch": 1665} {"train_loss": -12.292766571044922, "global_step": 279738, "epoch": 1665} {"train_loss": -12.109182357788086, "global_step": 279739, "epoch": 1665} {"train_loss": -12.079524993896484, "global_step": 279740, "epoch": 1665} {"train_loss": -12.212180137634277, "global_step": 279741, "epoch": 1665} {"train_loss": -11.978938102722168, "global_step": 279742, "epoch": 1665} {"train_loss": -12.400470733642578, "global_step": 279743, "epoch": 1665} {"train_loss": -12.083853721618652, "global_step": 279744, "epoch": 1665} {"train_loss": -12.320930480957031, "global_step": 279745, "epoch": 1665} {"train_loss": -11.951536178588867, "global_step": 279746, "epoch": 1665} {"train_loss": -12.22594165802002, "global_step": 279747, "epoch": 1665} {"train_loss": -12.074190139770508, "global_step": 279748, "epoch": 1665} {"train_loss": -12.019387245178223, "global_step": 279749, "epoch": 1665} {"train_loss": -11.920969009399414, "global_step": 279750, "epoch": 1665} {"train_loss": -12.205530166625977, "global_step": 279751, "epoch": 1665} {"train_loss": -11.961607933044434, "global_step": 279752, "epoch": 1665} {"train_loss": -12.308097839355469, "global_step": 279753, "epoch": 1665} {"train_loss": -12.050996780395508, "global_step": 279754, "epoch": 1665} {"train_loss": -12.10930061340332, "global_step": 279755, "epoch": 1665} {"train_loss": -11.855987548828125, "global_step": 279756, "epoch": 1665} {"train_loss": -11.719921112060547, "global_step": 279757, "epoch": 1665} {"train_loss": -12.013657569885254, "global_step": 279758, "epoch": 1665} {"train_loss": -11.92746639251709, "global_step": 279759, "epoch": 1665} {"train_loss": -11.710052490234375, "global_step": 279760, "epoch": 1665} {"train_loss": -12.095748901367188, "global_step": 279761, "epoch": 1665} {"train_loss": -11.991708755493164, "global_step": 279762, "epoch": 1665} {"train_loss": -11.611198425292969, "global_step": 279763, "epoch": 1665} {"train_loss": -11.561002731323242, "global_step": 279764, "epoch": 1665} {"train_loss": -11.782889366149902, "global_step": 279765, "epoch": 1665} {"train_loss": -11.756570816040039, "global_step": 279766, "epoch": 1665} {"train_loss": -11.776778221130371, "global_step": 279767, "epoch": 1665} {"train_loss": -11.56447696685791, "global_step": 279768, "epoch": 1665} {"train_loss": -11.83580493927002, "global_step": 279769, "epoch": 1665} {"train_loss": -10.680047035217285, "global_step": 279770, "epoch": 1665} {"train_loss": -11.70468521118164, "global_step": 279771, "epoch": 1665} {"train_loss": -11.549688339233398, "global_step": 279772, "epoch": 1665} {"train_loss": -11.112957000732422, "global_step": 279773, "epoch": 1665} {"train_loss": -11.813125610351562, "global_step": 279774, "epoch": 1665} {"train_loss": -11.59531021118164, "global_step": 279775, "epoch": 1665} {"train_loss": -11.252739906311035, "global_step": 279776, "epoch": 1665} {"train_loss": -11.89413833618164, "global_step": 279777, "epoch": 1665} {"train_loss": -10.993038177490234, "global_step": 279778, "epoch": 1665} {"train_loss": -11.916744232177734, "global_step": 279779, "epoch": 1665} {"train_loss": -10.937915802001953, "global_step": 279780, "epoch": 1665} {"train_loss": -11.552495956420898, "global_step": 279781, "epoch": 1665} {"train_loss": -10.242609024047852, "global_step": 279782, "epoch": 1665} {"train_loss": -11.347344398498535, "global_step": 279783, "epoch": 1665} {"train_loss": -11.188364028930664, "global_step": 279784, "epoch": 1665} {"train_loss": -10.552642822265625, "global_step": 279785, "epoch": 1665} {"train_loss": -10.75086784362793, "global_step": 279786, "epoch": 1665} {"train_loss": -10.651123046875, "global_step": 279787, "epoch": 1665} {"train_loss": -11.534406661987305, "global_step": 279788, "epoch": 1665} {"train_loss": -10.525341033935547, "global_step": 279789, "epoch": 1665} {"train_loss": -10.914271354675293, "global_step": 279790, "epoch": 1665} {"train_loss": -10.237203598022461, "global_step": 279791, "epoch": 1665} {"train_loss": -9.89297103881836, "global_step": 279792, "epoch": 1665} {"train_loss": -9.369415283203125, "global_step": 279793, "epoch": 1665} {"train_loss": -11.066287994384766, "global_step": 279794, "epoch": 1665} {"train_loss": -8.536966323852539, "global_step": 279795, "epoch": 1665} {"train_loss": -8.94717788696289, "global_step": 279796, "epoch": 1665} {"train_loss": -10.55369758605957, "global_step": 279797, "epoch": 1665} {"train_loss": -9.129152297973633, "global_step": 279798, "epoch": 1665} {"train_loss": -10.00332260131836, "global_step": 279799, "epoch": 1665} {"train_loss": -10.634246826171875, "global_step": 279800, "epoch": 1665} {"train_loss": -10.500608444213867, "global_step": 279801, "epoch": 1665} {"train_loss": -10.48099136352539, "global_step": 279802, "epoch": 1665} {"train_loss": -11.265377044677734, "global_step": 279803, "epoch": 1665} {"train_loss": -11.377836227416992, "global_step": 279804, "epoch": 1665} {"train_loss": -11.698088645935059, "global_step": 279805, "epoch": 1665} {"train_loss": -11.00262451171875, "global_step": 279806, "epoch": 1665} {"train_loss": -11.366617202758789, "global_step": 279807, "epoch": 1665} {"train_loss": -11.250856399536133, "global_step": 279808, "epoch": 1665} {"train_loss": -10.871749877929688, "global_step": 279809, "epoch": 1665} {"train_loss": -11.671346664428711, "global_step": 279810, "epoch": 1665} {"train_loss": -11.165191650390625, "global_step": 279811, "epoch": 1665} {"train_loss": -11.548744201660156, "global_step": 279812, "epoch": 1665} {"train_loss": -11.479324340820312, "global_step": 279813, "epoch": 1665} {"train_loss": -11.640506744384766, "global_step": 279814, "epoch": 1665} {"train_loss": -11.982059478759766, "global_step": 279815, "epoch": 1665} {"train_loss": -11.619607925415039, "global_step": 279816, "epoch": 1665} {"train_loss": -11.742049217224121, "global_step": 279817, "epoch": 1665} {"train_loss": -11.506959915161133, "global_step": 279818, "epoch": 1665} {"train_loss": -11.919219970703125, "global_step": 279819, "epoch": 1665} {"train_loss": -11.372842788696289, "global_step": 279820, "epoch": 1665} {"train_loss": -11.45318603515625, "global_step": 279821, "epoch": 1665} {"train_loss": -11.336181640625, "global_step": 279822, "epoch": 1665} {"train_loss": -11.705667495727539, "global_step": 279823, "epoch": 1665} {"train_loss": -11.794891357421875, "global_step": 279824, "epoch": 1665} {"train_loss": -11.525335311889648, "global_step": 279825, "epoch": 1665} {"train_loss": -11.654031753540039, "global_step": 279826, "epoch": 1665} {"train_loss": -11.530349731445312, "global_step": 279827, "epoch": 1665} {"train_loss": -11.326679229736328, "global_step": 279828, "epoch": 1665} {"train_loss": -11.642496109008789, "global_step": 279829, "epoch": 1665} {"train_loss": -11.69102668762207, "global_step": 279830, "epoch": 1665} {"train_loss": -11.855213165283203, "global_step": 279831, "epoch": 1665} {"train_loss": -11.899825096130371, "global_step": 279832, "epoch": 1665} {"train_loss": -11.454788208007812, "global_step": 279833, "epoch": 1665} {"train_loss": -11.930667877197266, "global_step": 279834, "epoch": 1665} {"train_loss": -11.96041488647461, "global_step": 279835, "epoch": 1665} {"train_loss": -11.869630813598633, "global_step": 279836, "epoch": 1665} {"train_loss": -12.097967147827148, "global_step": 279837, "epoch": 1665} {"train_loss": -11.784244537353516, "global_step": 279838, "epoch": 1665} {"train_loss": -12.079854965209961, "global_step": 279839, "epoch": 1665} {"train_loss": -12.16408920288086, "global_step": 279840, "epoch": 1665} {"train_loss": -11.965627670288086, "global_step": 279841, "epoch": 1665} {"train_loss": -12.159540176391602, "global_step": 279842, "epoch": 1665} {"train_loss": -11.883970260620117, "global_step": 279843, "epoch": 1665} {"train_loss": -12.096450805664062, "global_step": 279844, "epoch": 1665} {"train_loss": -11.962849617004395, "global_step": 279845, "epoch": 1665} {"train_loss": -11.777935028076172, "global_step": 279846, "epoch": 1665} {"train_loss": -11.920732498168945, "global_step": 279847, "epoch": 1665} {"train_loss": -11.919353485107422, "global_step": 279848, "epoch": 1665} {"train_loss": -12.093290328979492, "global_step": 279849, "epoch": 1665} {"train_loss": -12.159385681152344, "global_step": 279850, "epoch": 1665} {"train_loss": -11.84329605102539, "global_step": 279851, "epoch": 1665} {"train_loss": -11.865516662597656, "global_step": 279852, "epoch": 1665} {"train_loss": -12.088791847229004, "global_step": 279853, "epoch": 1665} {"train_loss": -12.233427047729492, "global_step": 279854, "epoch": 1665} {"train_loss": -12.18569564819336, "global_step": 279855, "epoch": 1665} {"train_loss": -12.010255813598633, "global_step": 279856, "epoch": 1665} {"train_loss": -12.182830810546875, "global_step": 279857, "epoch": 1665} {"train_loss": -12.155633926391602, "global_step": 279858, "epoch": 1665} {"train_loss": -12.184070587158203, "global_step": 279859, "epoch": 1665} {"train_loss": -11.91346549987793, "global_step": 279860, "epoch": 1665} {"train_loss": -12.302223205566406, "global_step": 279861, "epoch": 1665} {"train_loss": -12.10908317565918, "global_step": 279862, "epoch": 1665} {"train_loss": -11.986251831054688, "global_step": 279863, "epoch": 1665} {"train_loss": -12.077730178833008, "global_step": 279864, "epoch": 1665} {"train_loss": -12.201982498168945, "global_step": 279865, "epoch": 1665} {"train_loss": -11.814315795898438, "global_step": 279866, "epoch": 1665} {"train_loss": -12.11611270904541, "global_step": 279867, "epoch": 1665} {"train_loss": -11.865686416625977, "global_step": 279868, "epoch": 1665} {"train_loss": -11.666902542114258, "global_step": 279869, "epoch": 1665} {"train_loss": -12.431135177612305, "global_step": 279870, "epoch": 1665} {"train_loss": -11.745437622070312, "global_step": 279871, "epoch": 1665} {"train_loss": -12.043211936950684, "global_step": 279872, "epoch": 1665} {"train_loss": -11.976912498474121, "global_step": 279873, "epoch": 1665} {"train_loss": -12.033417701721191, "global_step": 279874, "epoch": 1665} {"train_loss": -11.716352462768555, "global_step": 279875, "epoch": 1665} {"train_loss": -12.210369110107422, "global_step": 279876, "epoch": 1665} {"train_loss": -12.000025749206543, "global_step": 279877, "epoch": 1665} {"train_loss": -12.037313461303711, "global_step": 279878, "epoch": 1665} {"train_loss": -12.067413330078125, "global_step": 279879, "epoch": 1665} {"train_loss": -11.895942687988281, "global_step": 279880, "epoch": 1665} {"train_loss": -12.005366325378418, "global_step": 279881, "epoch": 1665} {"train_loss": -12.04305648803711, "global_step": 279882, "epoch": 1665} {"train_loss": -12.335657119750977, "global_step": 279883, "epoch": 1665} {"train_loss": -11.605186462402344, "global_step": 279884, "epoch": 1665} {"train_loss": -11.527280807495117, "global_step": 279885, "epoch": 1665} {"train_loss": -11.920406341552734, "global_step": 279886, "epoch": 1665} {"train_loss": -11.652535149029323, "global_step": 279887, "epoch": 1665, "val_loss": 271758.875, "train_action_mse_error": 3.1481287479400635} {"train_loss": -10.720433235168457, "global_step": 279888, "epoch": 1666} {"train_loss": -11.494561195373535, "global_step": 279889, "epoch": 1666} {"train_loss": -10.41390609741211, "global_step": 279890, "epoch": 1666} {"train_loss": -10.847396850585938, "global_step": 279891, "epoch": 1666} {"train_loss": -11.461034774780273, "global_step": 279892, "epoch": 1666} {"train_loss": -10.034814834594727, "global_step": 279893, "epoch": 1666} {"train_loss": -9.519269943237305, "global_step": 279894, "epoch": 1666} {"train_loss": -10.2622709274292, "global_step": 279895, "epoch": 1666} {"train_loss": -10.475854873657227, "global_step": 279896, "epoch": 1666} {"train_loss": -10.641580581665039, "global_step": 279897, "epoch": 1666} {"train_loss": -9.138946533203125, "global_step": 279898, "epoch": 1666} {"train_loss": -9.710354804992676, "global_step": 279899, "epoch": 1666} {"train_loss": -7.37299919128418, "global_step": 279900, "epoch": 1666} {"train_loss": -8.199393272399902, "global_step": 279901, "epoch": 1666} {"train_loss": -10.64935302734375, "global_step": 279902, "epoch": 1666} {"train_loss": -9.662384033203125, "global_step": 279903, "epoch": 1666} {"train_loss": -10.099588394165039, "global_step": 279904, "epoch": 1666} {"train_loss": -9.988654136657715, "global_step": 279905, "epoch": 1666} {"train_loss": -10.507170677185059, "global_step": 279906, "epoch": 1666} {"train_loss": -10.124564170837402, "global_step": 279907, "epoch": 1666} {"train_loss": -11.440330505371094, "global_step": 279908, "epoch": 1666} {"train_loss": -10.545422554016113, "global_step": 279909, "epoch": 1666} {"train_loss": -11.529754638671875, "global_step": 279910, "epoch": 1666} {"train_loss": -10.52474594116211, "global_step": 279911, "epoch": 1666} {"train_loss": -10.71320915222168, "global_step": 279912, "epoch": 1666} {"train_loss": -11.076521873474121, "global_step": 279913, "epoch": 1666} {"train_loss": -11.081075668334961, "global_step": 279914, "epoch": 1666} {"train_loss": -11.731459617614746, "global_step": 279915, "epoch": 1666} {"train_loss": -11.627028465270996, "global_step": 279916, "epoch": 1666} {"train_loss": -11.30063533782959, "global_step": 279917, "epoch": 1666} {"train_loss": -11.577497482299805, "global_step": 279918, "epoch": 1666} {"train_loss": -11.333735466003418, "global_step": 279919, "epoch": 1666} {"train_loss": -11.25024700164795, "global_step": 279920, "epoch": 1666} {"train_loss": -11.902351379394531, "global_step": 279921, "epoch": 1666} {"train_loss": -11.519683837890625, "global_step": 279922, "epoch": 1666} {"train_loss": -11.711175918579102, "global_step": 279923, "epoch": 1666} {"train_loss": -11.478487968444824, "global_step": 279924, "epoch": 1666} {"train_loss": -11.553600311279297, "global_step": 279925, "epoch": 1666} {"train_loss": -11.575931549072266, "global_step": 279926, "epoch": 1666} {"train_loss": -11.816396713256836, "global_step": 279927, "epoch": 1666} {"train_loss": -11.942075729370117, "global_step": 279928, "epoch": 1666} {"train_loss": -11.677438735961914, "global_step": 279929, "epoch": 1666} {"train_loss": -12.064774513244629, "global_step": 279930, "epoch": 1666} {"train_loss": -11.583663940429688, "global_step": 279931, "epoch": 1666} {"train_loss": -11.825358390808105, "global_step": 279932, "epoch": 1666} {"train_loss": -11.995338439941406, "global_step": 279933, "epoch": 1666} {"train_loss": -12.077252388000488, "global_step": 279934, "epoch": 1666} {"train_loss": -11.943198204040527, "global_step": 279935, "epoch": 1666} {"train_loss": -12.01205062866211, "global_step": 279936, "epoch": 1666} {"train_loss": -11.854119300842285, "global_step": 279937, "epoch": 1666} {"train_loss": -12.003974914550781, "global_step": 279938, "epoch": 1666} {"train_loss": -12.125526428222656, "global_step": 279939, "epoch": 1666} {"train_loss": -11.899246215820312, "global_step": 279940, "epoch": 1666} {"train_loss": -11.995532035827637, "global_step": 279941, "epoch": 1666} {"train_loss": -11.899980545043945, "global_step": 279942, "epoch": 1666} {"train_loss": -11.999253273010254, "global_step": 279943, "epoch": 1666} {"train_loss": -11.949625015258789, "global_step": 279944, "epoch": 1666} {"train_loss": -11.743049621582031, "global_step": 279945, "epoch": 1666} {"train_loss": -12.09274959564209, "global_step": 279946, "epoch": 1666} {"train_loss": -12.016014099121094, "global_step": 279947, "epoch": 1666} {"train_loss": -11.775016784667969, "global_step": 279948, "epoch": 1666} {"train_loss": -12.179572105407715, "global_step": 279949, "epoch": 1666} {"train_loss": -11.999397277832031, "global_step": 279950, "epoch": 1666} {"train_loss": -12.255882263183594, "global_step": 279951, "epoch": 1666} {"train_loss": -12.05827522277832, "global_step": 279952, "epoch": 1666} {"train_loss": -12.28024959564209, "global_step": 279953, "epoch": 1666} {"train_loss": -12.081883430480957, "global_step": 279954, "epoch": 1666} {"train_loss": -12.138864517211914, "global_step": 279955, "epoch": 1666} {"train_loss": -12.050012588500977, "global_step": 279956, "epoch": 1666} {"train_loss": -12.11406421661377, "global_step": 279957, "epoch": 1666} {"train_loss": -11.88059139251709, "global_step": 279958, "epoch": 1666} {"train_loss": -12.271770477294922, "global_step": 279959, "epoch": 1666} {"train_loss": -11.990211486816406, "global_step": 279960, "epoch": 1666} {"train_loss": -12.19038200378418, "global_step": 279961, "epoch": 1666} {"train_loss": -11.963449478149414, "global_step": 279962, "epoch": 1666} {"train_loss": -12.148160934448242, "global_step": 279963, "epoch": 1666} {"train_loss": -12.358579635620117, "global_step": 279964, "epoch": 1666} {"train_loss": -12.327749252319336, "global_step": 279965, "epoch": 1666} {"train_loss": -12.198548316955566, "global_step": 279966, "epoch": 1666} {"train_loss": -12.167045593261719, "global_step": 279967, "epoch": 1666} {"train_loss": -12.380563735961914, "global_step": 279968, "epoch": 1666} {"train_loss": -12.242697715759277, "global_step": 279969, "epoch": 1666} {"train_loss": -12.330336570739746, "global_step": 279970, "epoch": 1666} {"train_loss": -12.083850860595703, "global_step": 279971, "epoch": 1666} {"train_loss": -12.338512420654297, "global_step": 279972, "epoch": 1666} {"train_loss": -12.395868301391602, "global_step": 279973, "epoch": 1666} {"train_loss": -12.262274742126465, "global_step": 279974, "epoch": 1666} {"train_loss": -12.490904808044434, "global_step": 279975, "epoch": 1666} {"train_loss": -12.366268157958984, "global_step": 279976, "epoch": 1666} {"train_loss": -12.222574234008789, "global_step": 279977, "epoch": 1666} {"train_loss": -12.307905197143555, "global_step": 279978, "epoch": 1666} {"train_loss": -12.363090515136719, "global_step": 279979, "epoch": 1666} {"train_loss": -12.171817779541016, "global_step": 279980, "epoch": 1666} {"train_loss": -12.245439529418945, "global_step": 279981, "epoch": 1666} {"train_loss": -12.619345664978027, "global_step": 279982, "epoch": 1666} {"train_loss": -12.214154243469238, "global_step": 279983, "epoch": 1666} {"train_loss": -12.289823532104492, "global_step": 279984, "epoch": 1666} {"train_loss": -11.881948471069336, "global_step": 279985, "epoch": 1666} {"train_loss": -11.418432235717773, "global_step": 279986, "epoch": 1666} {"train_loss": -11.103876113891602, "global_step": 279987, "epoch": 1666} {"train_loss": -11.65636920928955, "global_step": 279988, "epoch": 1666} {"train_loss": -12.244534492492676, "global_step": 279989, "epoch": 1666} {"train_loss": -11.360551834106445, "global_step": 279990, "epoch": 1666} {"train_loss": -11.118535995483398, "global_step": 279991, "epoch": 1666} {"train_loss": -10.592342376708984, "global_step": 279992, "epoch": 1666} {"train_loss": -11.68855094909668, "global_step": 279993, "epoch": 1666} {"train_loss": -11.907625198364258, "global_step": 279994, "epoch": 1666} {"train_loss": -10.102998733520508, "global_step": 279995, "epoch": 1666} {"train_loss": -12.005813598632812, "global_step": 279996, "epoch": 1666} {"train_loss": -11.771944046020508, "global_step": 279997, "epoch": 1666} {"train_loss": -11.923938751220703, "global_step": 279998, "epoch": 1666} {"train_loss": -11.516669273376465, "global_step": 279999, "epoch": 1666} {"train_loss": -10.683947563171387, "global_step": 280000, "epoch": 1666} {"train_loss": -11.721263885498047, "global_step": 280001, "epoch": 1666} {"train_loss": -11.101261138916016, "global_step": 280002, "epoch": 1666} {"train_loss": -11.766992568969727, "global_step": 280003, "epoch": 1666} {"train_loss": -10.72118854522705, "global_step": 280004, "epoch": 1666} {"train_loss": -11.416482925415039, "global_step": 280005, "epoch": 1666} {"train_loss": -8.403167724609375, "global_step": 280006, "epoch": 1666} {"train_loss": -9.929023742675781, "global_step": 280007, "epoch": 1666} {"train_loss": -9.893404006958008, "global_step": 280008, "epoch": 1666} {"train_loss": -11.022193908691406, "global_step": 280009, "epoch": 1666} {"train_loss": -11.418428421020508, "global_step": 280010, "epoch": 1666} {"train_loss": -10.172441482543945, "global_step": 280011, "epoch": 1666} {"train_loss": -10.259202003479004, "global_step": 280012, "epoch": 1666} {"train_loss": -12.082910537719727, "global_step": 280013, "epoch": 1666} {"train_loss": -10.887258529663086, "global_step": 280014, "epoch": 1666} {"train_loss": -11.31013011932373, "global_step": 280015, "epoch": 1666} {"train_loss": -11.650047302246094, "global_step": 280016, "epoch": 1666} {"train_loss": -11.371280670166016, "global_step": 280017, "epoch": 1666} {"train_loss": -11.46657657623291, "global_step": 280018, "epoch": 1666} {"train_loss": -11.207298278808594, "global_step": 280019, "epoch": 1666} {"train_loss": -11.220739364624023, "global_step": 280020, "epoch": 1666} {"train_loss": -11.708097457885742, "global_step": 280021, "epoch": 1666} {"train_loss": -11.716718673706055, "global_step": 280022, "epoch": 1666} {"train_loss": -11.738245964050293, "global_step": 280023, "epoch": 1666} {"train_loss": -11.950620651245117, "global_step": 280024, "epoch": 1666} {"train_loss": -11.214932441711426, "global_step": 280025, "epoch": 1666} {"train_loss": -12.017494201660156, "global_step": 280026, "epoch": 1666} {"train_loss": -11.911821365356445, "global_step": 280027, "epoch": 1666} {"train_loss": -11.612152099609375, "global_step": 280028, "epoch": 1666} {"train_loss": -11.889020919799805, "global_step": 280029, "epoch": 1666} {"train_loss": -11.509876251220703, "global_step": 280030, "epoch": 1666} {"train_loss": -11.78665828704834, "global_step": 280031, "epoch": 1666} {"train_loss": -11.225343704223633, "global_step": 280032, "epoch": 1666} {"train_loss": -11.594176292419434, "global_step": 280033, "epoch": 1666} {"train_loss": -11.695372581481934, "global_step": 280034, "epoch": 1666} {"train_loss": -11.15463638305664, "global_step": 280035, "epoch": 1666} {"train_loss": -11.491903305053711, "global_step": 280036, "epoch": 1666} {"train_loss": -11.604307174682617, "global_step": 280037, "epoch": 1666} {"train_loss": -11.395990371704102, "global_step": 280038, "epoch": 1666} {"train_loss": -11.927193641662598, "global_step": 280039, "epoch": 1666} {"train_loss": -11.641802787780762, "global_step": 280040, "epoch": 1666} {"train_loss": -11.703392028808594, "global_step": 280041, "epoch": 1666} {"train_loss": -11.213550567626953, "global_step": 280042, "epoch": 1666} {"train_loss": -11.207854270935059, "global_step": 280043, "epoch": 1666} {"train_loss": -11.285574913024902, "global_step": 280044, "epoch": 1666} {"train_loss": -11.243946075439453, "global_step": 280045, "epoch": 1666} {"train_loss": -11.558481216430664, "global_step": 280046, "epoch": 1666} {"train_loss": -11.356132507324219, "global_step": 280047, "epoch": 1666} {"train_loss": -12.04503345489502, "global_step": 280048, "epoch": 1666} {"train_loss": -11.407683372497559, "global_step": 280049, "epoch": 1666} {"train_loss": -11.693414688110352, "global_step": 280050, "epoch": 1666} {"train_loss": -11.655261993408203, "global_step": 280051, "epoch": 1666} {"train_loss": -11.633798599243164, "global_step": 280052, "epoch": 1666} {"train_loss": -11.617284774780273, "global_step": 280053, "epoch": 1666} {"train_loss": -11.887965202331543, "global_step": 280054, "epoch": 1666} {"train_loss": -11.471206568536305, "global_step": 280055, "epoch": 1666, "val_loss": 271057.71875} {"train_loss": -12.213071823120117, "global_step": 280056, "epoch": 1667} {"train_loss": -11.248428344726562, "global_step": 280057, "epoch": 1667} {"train_loss": -12.003555297851562, "global_step": 280058, "epoch": 1667} {"train_loss": -11.53744125366211, "global_step": 280059, "epoch": 1667} {"train_loss": -12.297855377197266, "global_step": 280060, "epoch": 1667} {"train_loss": -11.522455215454102, "global_step": 280061, "epoch": 1667} {"train_loss": -11.910102844238281, "global_step": 280062, "epoch": 1667} {"train_loss": -11.775160789489746, "global_step": 280063, "epoch": 1667} {"train_loss": -11.960719108581543, "global_step": 280064, "epoch": 1667} {"train_loss": -11.926756858825684, "global_step": 280065, "epoch": 1667} {"train_loss": -12.064918518066406, "global_step": 280066, "epoch": 1667} {"train_loss": -11.998903274536133, "global_step": 280067, "epoch": 1667} {"train_loss": -11.760538101196289, "global_step": 280068, "epoch": 1667} {"train_loss": -12.071880340576172, "global_step": 280069, "epoch": 1667} {"train_loss": -11.803094863891602, "global_step": 280070, "epoch": 1667} {"train_loss": -12.089456558227539, "global_step": 280071, "epoch": 1667} {"train_loss": -12.015336990356445, "global_step": 280072, "epoch": 1667} {"train_loss": -12.315671920776367, "global_step": 280073, "epoch": 1667} {"train_loss": -12.03075122833252, "global_step": 280074, "epoch": 1667} {"train_loss": -11.89596176147461, "global_step": 280075, "epoch": 1667} {"train_loss": -11.859304428100586, "global_step": 280076, "epoch": 1667} {"train_loss": -12.216093063354492, "global_step": 280077, "epoch": 1667} {"train_loss": -12.03500747680664, "global_step": 280078, "epoch": 1667} {"train_loss": -12.152298927307129, "global_step": 280079, "epoch": 1667} {"train_loss": -12.151885986328125, "global_step": 280080, "epoch": 1667} {"train_loss": -11.954830169677734, "global_step": 280081, "epoch": 1667} {"train_loss": -12.092154502868652, "global_step": 280082, "epoch": 1667} {"train_loss": -12.032583236694336, "global_step": 280083, "epoch": 1667} {"train_loss": -12.286343574523926, "global_step": 280084, "epoch": 1667} {"train_loss": -11.949551582336426, "global_step": 280085, "epoch": 1667} {"train_loss": -11.900079727172852, "global_step": 280086, "epoch": 1667} {"train_loss": -11.493511199951172, "global_step": 280087, "epoch": 1667} {"train_loss": -11.925776481628418, "global_step": 280088, "epoch": 1667} {"train_loss": -11.714975357055664, "global_step": 280089, "epoch": 1667} {"train_loss": -11.817805290222168, "global_step": 280090, "epoch": 1667} {"train_loss": -11.59326171875, "global_step": 280091, "epoch": 1667} {"train_loss": -11.792871475219727, "global_step": 280092, "epoch": 1667} {"train_loss": -10.984498023986816, "global_step": 280093, "epoch": 1667} {"train_loss": -11.028421401977539, "global_step": 280094, "epoch": 1667} {"train_loss": -11.825281143188477, "global_step": 280095, "epoch": 1667} {"train_loss": -11.678912162780762, "global_step": 280096, "epoch": 1667} {"train_loss": -11.56928825378418, "global_step": 280097, "epoch": 1667} {"train_loss": -11.593085289001465, "global_step": 280098, "epoch": 1667} {"train_loss": -11.950284004211426, "global_step": 280099, "epoch": 1667} {"train_loss": -11.51660442352295, "global_step": 280100, "epoch": 1667} {"train_loss": -12.000910758972168, "global_step": 280101, "epoch": 1667} {"train_loss": -11.531454086303711, "global_step": 280102, "epoch": 1667} {"train_loss": -12.167537689208984, "global_step": 280103, "epoch": 1667} {"train_loss": -12.162528038024902, "global_step": 280104, "epoch": 1667} {"train_loss": -11.886981010437012, "global_step": 280105, "epoch": 1667} {"train_loss": -12.222591400146484, "global_step": 280106, "epoch": 1667} {"train_loss": -11.150979995727539, "global_step": 280107, "epoch": 1667} {"train_loss": -11.860918045043945, "global_step": 280108, "epoch": 1667} {"train_loss": -11.821040153503418, "global_step": 280109, "epoch": 1667} {"train_loss": -11.73704719543457, "global_step": 280110, "epoch": 1667} {"train_loss": -11.505582809448242, "global_step": 280111, "epoch": 1667} {"train_loss": -11.955169677734375, "global_step": 280112, "epoch": 1667} {"train_loss": -11.920562744140625, "global_step": 280113, "epoch": 1667} {"train_loss": -11.745471954345703, "global_step": 280114, "epoch": 1667} {"train_loss": -12.253238677978516, "global_step": 280115, "epoch": 1667} {"train_loss": -11.518268585205078, "global_step": 280116, "epoch": 1667} {"train_loss": -11.925174713134766, "global_step": 280117, "epoch": 1667} {"train_loss": -11.399286270141602, "global_step": 280118, "epoch": 1667} {"train_loss": -11.83399486541748, "global_step": 280119, "epoch": 1667} {"train_loss": -11.516273498535156, "global_step": 280120, "epoch": 1667} {"train_loss": -11.525529861450195, "global_step": 280121, "epoch": 1667} {"train_loss": -11.50639820098877, "global_step": 280122, "epoch": 1667} {"train_loss": -12.31117057800293, "global_step": 280123, "epoch": 1667} {"train_loss": -11.507549285888672, "global_step": 280124, "epoch": 1667} {"train_loss": -11.889347076416016, "global_step": 280125, "epoch": 1667} {"train_loss": -11.827789306640625, "global_step": 280126, "epoch": 1667} {"train_loss": -11.636003494262695, "global_step": 280127, "epoch": 1667} {"train_loss": -11.960439682006836, "global_step": 280128, "epoch": 1667} {"train_loss": -11.745817184448242, "global_step": 280129, "epoch": 1667} {"train_loss": -12.2179536819458, "global_step": 280130, "epoch": 1667} {"train_loss": -11.36257553100586, "global_step": 280131, "epoch": 1667} {"train_loss": -11.510980606079102, "global_step": 280132, "epoch": 1667} {"train_loss": -11.511725425720215, "global_step": 280133, "epoch": 1667} {"train_loss": -11.703625679016113, "global_step": 280134, "epoch": 1667} {"train_loss": -11.186724662780762, "global_step": 280135, "epoch": 1667} {"train_loss": -11.659589767456055, "global_step": 280136, "epoch": 1667} {"train_loss": -10.967147827148438, "global_step": 280137, "epoch": 1667} {"train_loss": -10.418920516967773, "global_step": 280138, "epoch": 1667} {"train_loss": -11.370092391967773, "global_step": 280139, "epoch": 1667} {"train_loss": -8.758273124694824, "global_step": 280140, "epoch": 1667} {"train_loss": -11.006908416748047, "global_step": 280141, "epoch": 1667} {"train_loss": -9.348121643066406, "global_step": 280142, "epoch": 1667} {"train_loss": -9.529714584350586, "global_step": 280143, "epoch": 1667} {"train_loss": -9.603863716125488, "global_step": 280144, "epoch": 1667} {"train_loss": -9.481924057006836, "global_step": 280145, "epoch": 1667} {"train_loss": -9.85037612915039, "global_step": 280146, "epoch": 1667} {"train_loss": -10.845393180847168, "global_step": 280147, "epoch": 1667} {"train_loss": -10.893187522888184, "global_step": 280148, "epoch": 1667} {"train_loss": -10.690206527709961, "global_step": 280149, "epoch": 1667} {"train_loss": -11.246696472167969, "global_step": 280150, "epoch": 1667} {"train_loss": -10.312599182128906, "global_step": 280151, "epoch": 1667} {"train_loss": -10.832136154174805, "global_step": 280152, "epoch": 1667} {"train_loss": -10.396984100341797, "global_step": 280153, "epoch": 1667} {"train_loss": -10.609649658203125, "global_step": 280154, "epoch": 1667} {"train_loss": -11.480596542358398, "global_step": 280155, "epoch": 1667} {"train_loss": -10.692111015319824, "global_step": 280156, "epoch": 1667} {"train_loss": -10.938291549682617, "global_step": 280157, "epoch": 1667} {"train_loss": -11.616718292236328, "global_step": 280158, "epoch": 1667} {"train_loss": -10.342483520507812, "global_step": 280159, "epoch": 1667} {"train_loss": -11.333385467529297, "global_step": 280160, "epoch": 1667} {"train_loss": -10.643752098083496, "global_step": 280161, "epoch": 1667} {"train_loss": -10.42774772644043, "global_step": 280162, "epoch": 1667} {"train_loss": -11.644267082214355, "global_step": 280163, "epoch": 1667} {"train_loss": -10.959005355834961, "global_step": 280164, "epoch": 1667} {"train_loss": -11.181453704833984, "global_step": 280165, "epoch": 1667} {"train_loss": -11.112186431884766, "global_step": 280166, "epoch": 1667} {"train_loss": -11.343507766723633, "global_step": 280167, "epoch": 1667} {"train_loss": -11.104010581970215, "global_step": 280168, "epoch": 1667} {"train_loss": -11.63088607788086, "global_step": 280169, "epoch": 1667} {"train_loss": -11.536590576171875, "global_step": 280170, "epoch": 1667} {"train_loss": -11.355743408203125, "global_step": 280171, "epoch": 1667} {"train_loss": -11.637398719787598, "global_step": 280172, "epoch": 1667} {"train_loss": -11.520925521850586, "global_step": 280173, "epoch": 1667} {"train_loss": -11.499906539916992, "global_step": 280174, "epoch": 1667} {"train_loss": -11.433908462524414, "global_step": 280175, "epoch": 1667} {"train_loss": -11.736289978027344, "global_step": 280176, "epoch": 1667} {"train_loss": -11.328361511230469, "global_step": 280177, "epoch": 1667} {"train_loss": -11.6068696975708, "global_step": 280178, "epoch": 1667} {"train_loss": -11.202733039855957, "global_step": 280179, "epoch": 1667} {"train_loss": -11.56359577178955, "global_step": 280180, "epoch": 1667} {"train_loss": -11.380319595336914, "global_step": 280181, "epoch": 1667} {"train_loss": -11.429303169250488, "global_step": 280182, "epoch": 1667} {"train_loss": -11.4428071975708, "global_step": 280183, "epoch": 1667} {"train_loss": -11.61131477355957, "global_step": 280184, "epoch": 1667} {"train_loss": -11.337753295898438, "global_step": 280185, "epoch": 1667} {"train_loss": -11.785566329956055, "global_step": 280186, "epoch": 1667} {"train_loss": -11.645090103149414, "global_step": 280187, "epoch": 1667} {"train_loss": -11.393669128417969, "global_step": 280188, "epoch": 1667} {"train_loss": -11.742267608642578, "global_step": 280189, "epoch": 1667} {"train_loss": -11.42386245727539, "global_step": 280190, "epoch": 1667} {"train_loss": -11.50412368774414, "global_step": 280191, "epoch": 1667} {"train_loss": -11.396400451660156, "global_step": 280192, "epoch": 1667} {"train_loss": -11.71507740020752, "global_step": 280193, "epoch": 1667} {"train_loss": -11.852272033691406, "global_step": 280194, "epoch": 1667} {"train_loss": -11.553129196166992, "global_step": 280195, "epoch": 1667} {"train_loss": -11.654343605041504, "global_step": 280196, "epoch": 1667} {"train_loss": -11.494245529174805, "global_step": 280197, "epoch": 1667} {"train_loss": -11.852615356445312, "global_step": 280198, "epoch": 1667} {"train_loss": -11.636098861694336, "global_step": 280199, "epoch": 1667} {"train_loss": -11.622671127319336, "global_step": 280200, "epoch": 1667} {"train_loss": -11.738968849182129, "global_step": 280201, "epoch": 1667} {"train_loss": -11.548273086547852, "global_step": 280202, "epoch": 1667} {"train_loss": -11.820058822631836, "global_step": 280203, "epoch": 1667} {"train_loss": -11.468985557556152, "global_step": 280204, "epoch": 1667} {"train_loss": -11.602173805236816, "global_step": 280205, "epoch": 1667} {"train_loss": -11.771652221679688, "global_step": 280206, "epoch": 1667} {"train_loss": -11.773577690124512, "global_step": 280207, "epoch": 1667} {"train_loss": -11.855978012084961, "global_step": 280208, "epoch": 1667} {"train_loss": -11.243341445922852, "global_step": 280209, "epoch": 1667} {"train_loss": -11.329354286193848, "global_step": 280210, "epoch": 1667} {"train_loss": -11.232171058654785, "global_step": 280211, "epoch": 1667} {"train_loss": -11.542080879211426, "global_step": 280212, "epoch": 1667} {"train_loss": -10.90677261352539, "global_step": 280213, "epoch": 1667} {"train_loss": -11.727263450622559, "global_step": 280214, "epoch": 1667} {"train_loss": -11.223165512084961, "global_step": 280215, "epoch": 1667} {"train_loss": -11.333507537841797, "global_step": 280216, "epoch": 1667} {"train_loss": -11.531205177307129, "global_step": 280217, "epoch": 1667} {"train_loss": -11.283426284790039, "global_step": 280218, "epoch": 1667} {"train_loss": -11.520848274230957, "global_step": 280219, "epoch": 1667} {"train_loss": -11.680362701416016, "global_step": 280220, "epoch": 1667} {"train_loss": -11.256032943725586, "global_step": 280221, "epoch": 1667} {"train_loss": -11.94920539855957, "global_step": 280222, "epoch": 1667} {"train_loss": -11.500133877708798, "global_step": 280223, "epoch": 1667, "val_loss": 268345.25} {"train_loss": -11.931007385253906, "global_step": 280224, "epoch": 1668} {"train_loss": -11.811681747436523, "global_step": 280225, "epoch": 1668} {"train_loss": -11.887563705444336, "global_step": 280226, "epoch": 1668} {"train_loss": -12.0120267868042, "global_step": 280227, "epoch": 1668} {"train_loss": -11.929764747619629, "global_step": 280228, "epoch": 1668} {"train_loss": -11.732309341430664, "global_step": 280229, "epoch": 1668} {"train_loss": -11.775018692016602, "global_step": 280230, "epoch": 1668} {"train_loss": -11.999629974365234, "global_step": 280231, "epoch": 1668} {"train_loss": -11.869085311889648, "global_step": 280232, "epoch": 1668} {"train_loss": -12.128181457519531, "global_step": 280233, "epoch": 1668} {"train_loss": -11.732279777526855, "global_step": 280234, "epoch": 1668} {"train_loss": -12.063926696777344, "global_step": 280235, "epoch": 1668} {"train_loss": -11.784357070922852, "global_step": 280236, "epoch": 1668} {"train_loss": -11.91830062866211, "global_step": 280237, "epoch": 1668} {"train_loss": -11.843862533569336, "global_step": 280238, "epoch": 1668} {"train_loss": -12.042470932006836, "global_step": 280239, "epoch": 1668} {"train_loss": -12.165336608886719, "global_step": 280240, "epoch": 1668} {"train_loss": -11.990266799926758, "global_step": 280241, "epoch": 1668} {"train_loss": -12.217208862304688, "global_step": 280242, "epoch": 1668} {"train_loss": -11.755912780761719, "global_step": 280243, "epoch": 1668} {"train_loss": -12.153970718383789, "global_step": 280244, "epoch": 1668} {"train_loss": -12.07306957244873, "global_step": 280245, "epoch": 1668} {"train_loss": -12.211650848388672, "global_step": 280246, "epoch": 1668} {"train_loss": -11.879125595092773, "global_step": 280247, "epoch": 1668} {"train_loss": -11.825794219970703, "global_step": 280248, "epoch": 1668} {"train_loss": -12.243827819824219, "global_step": 280249, "epoch": 1668} {"train_loss": -11.802568435668945, "global_step": 280250, "epoch": 1668} {"train_loss": -12.138507843017578, "global_step": 280251, "epoch": 1668} {"train_loss": -11.862503051757812, "global_step": 280252, "epoch": 1668} {"train_loss": -11.926143646240234, "global_step": 280253, "epoch": 1668} {"train_loss": -12.218494415283203, "global_step": 280254, "epoch": 1668} {"train_loss": -11.80978012084961, "global_step": 280255, "epoch": 1668} {"train_loss": -12.215971946716309, "global_step": 280256, "epoch": 1668} {"train_loss": -11.954889297485352, "global_step": 280257, "epoch": 1668} {"train_loss": -11.780350685119629, "global_step": 280258, "epoch": 1668} {"train_loss": -12.317480087280273, "global_step": 280259, "epoch": 1668} {"train_loss": -11.92306900024414, "global_step": 280260, "epoch": 1668} {"train_loss": -12.043323516845703, "global_step": 280261, "epoch": 1668} {"train_loss": -12.216812133789062, "global_step": 280262, "epoch": 1668} {"train_loss": -11.74711799621582, "global_step": 280263, "epoch": 1668} {"train_loss": -12.225503921508789, "global_step": 280264, "epoch": 1668} {"train_loss": -12.249434471130371, "global_step": 280265, "epoch": 1668} {"train_loss": -12.030550956726074, "global_step": 280266, "epoch": 1668} {"train_loss": -12.159967422485352, "global_step": 280267, "epoch": 1668} {"train_loss": -12.142751693725586, "global_step": 280268, "epoch": 1668} {"train_loss": -11.985807418823242, "global_step": 280269, "epoch": 1668} {"train_loss": -12.151224136352539, "global_step": 280270, "epoch": 1668} {"train_loss": -11.930612564086914, "global_step": 280271, "epoch": 1668} {"train_loss": -12.174814224243164, "global_step": 280272, "epoch": 1668} {"train_loss": -12.052244186401367, "global_step": 280273, "epoch": 1668} {"train_loss": -12.2335205078125, "global_step": 280274, "epoch": 1668} {"train_loss": -11.990375518798828, "global_step": 280275, "epoch": 1668} {"train_loss": -12.184385299682617, "global_step": 280276, "epoch": 1668} {"train_loss": -12.294368743896484, "global_step": 280277, "epoch": 1668} {"train_loss": -12.213939666748047, "global_step": 280278, "epoch": 1668} {"train_loss": -12.199813842773438, "global_step": 280279, "epoch": 1668} {"train_loss": -12.252341270446777, "global_step": 280280, "epoch": 1668} {"train_loss": -12.109789848327637, "global_step": 280281, "epoch": 1668} {"train_loss": -12.390605926513672, "global_step": 280282, "epoch": 1668} {"train_loss": -12.483356475830078, "global_step": 280283, "epoch": 1668} {"train_loss": -12.291961669921875, "global_step": 280284, "epoch": 1668} {"train_loss": -11.841958999633789, "global_step": 280285, "epoch": 1668} {"train_loss": -11.524894714355469, "global_step": 280286, "epoch": 1668} {"train_loss": -12.343473434448242, "global_step": 280287, "epoch": 1668} {"train_loss": -11.247457504272461, "global_step": 280288, "epoch": 1668} {"train_loss": -11.751901626586914, "global_step": 280289, "epoch": 1668} {"train_loss": -12.087571144104004, "global_step": 280290, "epoch": 1668} {"train_loss": -11.95394515991211, "global_step": 280291, "epoch": 1668} {"train_loss": -11.28164291381836, "global_step": 280292, "epoch": 1668} {"train_loss": -11.308218955993652, "global_step": 280293, "epoch": 1668} {"train_loss": -11.928641319274902, "global_step": 280294, "epoch": 1668} {"train_loss": -11.085441589355469, "global_step": 280295, "epoch": 1668} {"train_loss": -11.718896865844727, "global_step": 280296, "epoch": 1668} {"train_loss": -10.912342071533203, "global_step": 280297, "epoch": 1668} {"train_loss": -9.11678695678711, "global_step": 280298, "epoch": 1668} {"train_loss": -11.884661674499512, "global_step": 280299, "epoch": 1668} {"train_loss": -10.711380004882812, "global_step": 280300, "epoch": 1668} {"train_loss": -10.841381072998047, "global_step": 280301, "epoch": 1668} {"train_loss": -12.047021865844727, "global_step": 280302, "epoch": 1668} {"train_loss": -10.566192626953125, "global_step": 280303, "epoch": 1668} {"train_loss": -11.956859588623047, "global_step": 280304, "epoch": 1668} {"train_loss": -10.617191314697266, "global_step": 280305, "epoch": 1668} {"train_loss": -10.89825439453125, "global_step": 280306, "epoch": 1668} {"train_loss": -12.08186149597168, "global_step": 280307, "epoch": 1668} {"train_loss": -10.77766227722168, "global_step": 280308, "epoch": 1668} {"train_loss": -11.85200309753418, "global_step": 280309, "epoch": 1668} {"train_loss": -10.62713623046875, "global_step": 280310, "epoch": 1668} {"train_loss": -11.08983039855957, "global_step": 280311, "epoch": 1668} {"train_loss": -11.60630989074707, "global_step": 280312, "epoch": 1668} {"train_loss": -10.304986000061035, "global_step": 280313, "epoch": 1668} {"train_loss": -12.038917541503906, "global_step": 280314, "epoch": 1668} {"train_loss": -11.057147026062012, "global_step": 280315, "epoch": 1668} {"train_loss": -11.13022232055664, "global_step": 280316, "epoch": 1668} {"train_loss": -11.794137001037598, "global_step": 280317, "epoch": 1668} {"train_loss": -11.298965454101562, "global_step": 280318, "epoch": 1668} {"train_loss": -11.768024444580078, "global_step": 280319, "epoch": 1668} {"train_loss": -11.458756446838379, "global_step": 280320, "epoch": 1668} {"train_loss": -11.782633781433105, "global_step": 280321, "epoch": 1668} {"train_loss": -11.492165565490723, "global_step": 280322, "epoch": 1668} {"train_loss": -11.481893539428711, "global_step": 280323, "epoch": 1668} {"train_loss": -11.755851745605469, "global_step": 280324, "epoch": 1668} {"train_loss": -11.952129364013672, "global_step": 280325, "epoch": 1668} {"train_loss": -11.513692855834961, "global_step": 280326, "epoch": 1668} {"train_loss": -12.187365531921387, "global_step": 280327, "epoch": 1668} {"train_loss": -11.745871543884277, "global_step": 280328, "epoch": 1668} {"train_loss": -12.056407928466797, "global_step": 280329, "epoch": 1668} {"train_loss": -11.868490219116211, "global_step": 280330, "epoch": 1668} {"train_loss": -12.04450511932373, "global_step": 280331, "epoch": 1668} {"train_loss": -12.015938758850098, "global_step": 280332, "epoch": 1668} {"train_loss": -11.99742317199707, "global_step": 280333, "epoch": 1668} {"train_loss": -12.086043357849121, "global_step": 280334, "epoch": 1668} {"train_loss": -11.900836944580078, "global_step": 280335, "epoch": 1668} {"train_loss": -11.913177490234375, "global_step": 280336, "epoch": 1668} {"train_loss": -11.984689712524414, "global_step": 280337, "epoch": 1668} {"train_loss": -12.12369155883789, "global_step": 280338, "epoch": 1668} {"train_loss": -11.947690963745117, "global_step": 280339, "epoch": 1668} {"train_loss": -11.636926651000977, "global_step": 280340, "epoch": 1668} {"train_loss": -12.085383415222168, "global_step": 280341, "epoch": 1668} {"train_loss": -11.963948249816895, "global_step": 280342, "epoch": 1668} {"train_loss": -12.182245254516602, "global_step": 280343, "epoch": 1668} {"train_loss": -12.206235885620117, "global_step": 280344, "epoch": 1668} {"train_loss": -12.145944595336914, "global_step": 280345, "epoch": 1668} {"train_loss": -12.321463584899902, "global_step": 280346, "epoch": 1668} {"train_loss": -12.244245529174805, "global_step": 280347, "epoch": 1668} {"train_loss": -12.311540603637695, "global_step": 280348, "epoch": 1668} {"train_loss": -12.165916442871094, "global_step": 280349, "epoch": 1668} {"train_loss": -12.167459487915039, "global_step": 280350, "epoch": 1668} {"train_loss": -12.206029891967773, "global_step": 280351, "epoch": 1668} {"train_loss": -12.00908374786377, "global_step": 280352, "epoch": 1668} {"train_loss": -12.065948486328125, "global_step": 280353, "epoch": 1668} {"train_loss": -12.200204849243164, "global_step": 280354, "epoch": 1668} {"train_loss": -11.845617294311523, "global_step": 280355, "epoch": 1668} {"train_loss": -11.971770286560059, "global_step": 280356, "epoch": 1668} {"train_loss": -12.215142250061035, "global_step": 280357, "epoch": 1668} {"train_loss": -11.736564636230469, "global_step": 280358, "epoch": 1668} {"train_loss": -11.71048355102539, "global_step": 280359, "epoch": 1668} {"train_loss": -11.773305892944336, "global_step": 280360, "epoch": 1668} {"train_loss": -11.925009727478027, "global_step": 280361, "epoch": 1668} {"train_loss": -11.785017013549805, "global_step": 280362, "epoch": 1668} {"train_loss": -11.780394554138184, "global_step": 280363, "epoch": 1668} {"train_loss": -11.850128173828125, "global_step": 280364, "epoch": 1668} {"train_loss": -11.696941375732422, "global_step": 280365, "epoch": 1668} {"train_loss": -11.513757705688477, "global_step": 280366, "epoch": 1668} {"train_loss": -12.26179313659668, "global_step": 280367, "epoch": 1668} {"train_loss": -12.0252103805542, "global_step": 280368, "epoch": 1668} {"train_loss": -12.080039978027344, "global_step": 280369, "epoch": 1668} {"train_loss": -11.966121673583984, "global_step": 280370, "epoch": 1668} {"train_loss": -11.861605644226074, "global_step": 280371, "epoch": 1668} {"train_loss": -11.863633155822754, "global_step": 280372, "epoch": 1668} {"train_loss": -12.035006523132324, "global_step": 280373, "epoch": 1668} {"train_loss": -11.886056900024414, "global_step": 280374, "epoch": 1668} {"train_loss": -11.783738136291504, "global_step": 280375, "epoch": 1668} {"train_loss": -11.805940628051758, "global_step": 280376, "epoch": 1668} {"train_loss": -11.865866661071777, "global_step": 280377, "epoch": 1668} {"train_loss": -11.781586647033691, "global_step": 280378, "epoch": 1668} {"train_loss": -10.167203903198242, "global_step": 280379, "epoch": 1668} {"train_loss": -11.55930233001709, "global_step": 280380, "epoch": 1668} {"train_loss": -11.11984634399414, "global_step": 280381, "epoch": 1668} {"train_loss": -10.54859733581543, "global_step": 280382, "epoch": 1668} {"train_loss": -10.493978500366211, "global_step": 280383, "epoch": 1668} {"train_loss": -11.279945373535156, "global_step": 280384, "epoch": 1668} {"train_loss": -10.835405349731445, "global_step": 280385, "epoch": 1668} {"train_loss": -11.441753387451172, "global_step": 280386, "epoch": 1668} {"train_loss": -11.471511840820312, "global_step": 280387, "epoch": 1668} {"train_loss": -11.133279800415039, "global_step": 280388, "epoch": 1668} {"train_loss": -11.248418807983398, "global_step": 280389, "epoch": 1668} {"train_loss": -11.629683494567871, "global_step": 280390, "epoch": 1668} {"train_loss": -11.786997624805995, "global_step": 280391, "epoch": 1668, "val_loss": 273244.5625} {"train_loss": -11.317268371582031, "global_step": 280392, "epoch": 1669} {"train_loss": -11.158028602600098, "global_step": 280393, "epoch": 1669} {"train_loss": -11.466299057006836, "global_step": 280394, "epoch": 1669} {"train_loss": -11.425817489624023, "global_step": 280395, "epoch": 1669} {"train_loss": -10.572355270385742, "global_step": 280396, "epoch": 1669} {"train_loss": -11.534910202026367, "global_step": 280397, "epoch": 1669} {"train_loss": -10.755455017089844, "global_step": 280398, "epoch": 1669} {"train_loss": -11.156412124633789, "global_step": 280399, "epoch": 1669} {"train_loss": -11.70966911315918, "global_step": 280400, "epoch": 1669} {"train_loss": -11.719736099243164, "global_step": 280401, "epoch": 1669} {"train_loss": -11.510979652404785, "global_step": 280402, "epoch": 1669} {"train_loss": -11.834641456604004, "global_step": 280403, "epoch": 1669} {"train_loss": -11.208561897277832, "global_step": 280404, "epoch": 1669} {"train_loss": -11.724557876586914, "global_step": 280405, "epoch": 1669} {"train_loss": -11.69087028503418, "global_step": 280406, "epoch": 1669} {"train_loss": -11.144622802734375, "global_step": 280407, "epoch": 1669} {"train_loss": -12.007827758789062, "global_step": 280408, "epoch": 1669} {"train_loss": -11.63282585144043, "global_step": 280409, "epoch": 1669} {"train_loss": -11.505416870117188, "global_step": 280410, "epoch": 1669} {"train_loss": -11.97732162475586, "global_step": 280411, "epoch": 1669} {"train_loss": -11.80301284790039, "global_step": 280412, "epoch": 1669} {"train_loss": -12.020597457885742, "global_step": 280413, "epoch": 1669} {"train_loss": -11.443137168884277, "global_step": 280414, "epoch": 1669} {"train_loss": -11.901501655578613, "global_step": 280415, "epoch": 1669} {"train_loss": -11.875622749328613, "global_step": 280416, "epoch": 1669} {"train_loss": -11.959625244140625, "global_step": 280417, "epoch": 1669} {"train_loss": -11.697486877441406, "global_step": 280418, "epoch": 1669} {"train_loss": -12.008233070373535, "global_step": 280419, "epoch": 1669} {"train_loss": -11.959196090698242, "global_step": 280420, "epoch": 1669} {"train_loss": -11.80570125579834, "global_step": 280421, "epoch": 1669} {"train_loss": -11.790910720825195, "global_step": 280422, "epoch": 1669} {"train_loss": -11.284980773925781, "global_step": 280423, "epoch": 1669} {"train_loss": -12.040822982788086, "global_step": 280424, "epoch": 1669} {"train_loss": -11.431482315063477, "global_step": 280425, "epoch": 1669} {"train_loss": -11.736260414123535, "global_step": 280426, "epoch": 1669} {"train_loss": -11.827718734741211, "global_step": 280427, "epoch": 1669} {"train_loss": -11.633339881896973, "global_step": 280428, "epoch": 1669} {"train_loss": -12.209175109863281, "global_step": 280429, "epoch": 1669} {"train_loss": -11.480438232421875, "global_step": 280430, "epoch": 1669} {"train_loss": -11.58098030090332, "global_step": 280431, "epoch": 1669} {"train_loss": -12.014145851135254, "global_step": 280432, "epoch": 1669} {"train_loss": -11.551752090454102, "global_step": 280433, "epoch": 1669} {"train_loss": -12.109151840209961, "global_step": 280434, "epoch": 1669} {"train_loss": -11.320693969726562, "global_step": 280435, "epoch": 1669} {"train_loss": -12.129399299621582, "global_step": 280436, "epoch": 1669} {"train_loss": -11.845542907714844, "global_step": 280437, "epoch": 1669} {"train_loss": -12.193218231201172, "global_step": 280438, "epoch": 1669} {"train_loss": -11.841629028320312, "global_step": 280439, "epoch": 1669} {"train_loss": -11.822681427001953, "global_step": 280440, "epoch": 1669} {"train_loss": -12.138391494750977, "global_step": 280441, "epoch": 1669} {"train_loss": -12.151211738586426, "global_step": 280442, "epoch": 1669} {"train_loss": -11.43679141998291, "global_step": 280443, "epoch": 1669} {"train_loss": -11.650960922241211, "global_step": 280444, "epoch": 1669} {"train_loss": -12.143758773803711, "global_step": 280445, "epoch": 1669} {"train_loss": -11.551207542419434, "global_step": 280446, "epoch": 1669} {"train_loss": -11.730337142944336, "global_step": 280447, "epoch": 1669} {"train_loss": -11.397394180297852, "global_step": 280448, "epoch": 1669} {"train_loss": -12.018556594848633, "global_step": 280449, "epoch": 1669} {"train_loss": -11.851548194885254, "global_step": 280450, "epoch": 1669} {"train_loss": -12.181406021118164, "global_step": 280451, "epoch": 1669} {"train_loss": -12.063087463378906, "global_step": 280452, "epoch": 1669} {"train_loss": -11.878700256347656, "global_step": 280453, "epoch": 1669} {"train_loss": -12.4073486328125, "global_step": 280454, "epoch": 1669} {"train_loss": -11.854165077209473, "global_step": 280455, "epoch": 1669} {"train_loss": -12.077268600463867, "global_step": 280456, "epoch": 1669} {"train_loss": -11.734901428222656, "global_step": 280457, "epoch": 1669} {"train_loss": -12.201372146606445, "global_step": 280458, "epoch": 1669} {"train_loss": -11.61709976196289, "global_step": 280459, "epoch": 1669} {"train_loss": -12.082599639892578, "global_step": 280460, "epoch": 1669} {"train_loss": -12.084367752075195, "global_step": 280461, "epoch": 1669} {"train_loss": -11.859477996826172, "global_step": 280462, "epoch": 1669} {"train_loss": -11.566360473632812, "global_step": 280463, "epoch": 1669} {"train_loss": -11.694040298461914, "global_step": 280464, "epoch": 1669} {"train_loss": -12.047173500061035, "global_step": 280465, "epoch": 1669} {"train_loss": -11.99876880645752, "global_step": 280466, "epoch": 1669} {"train_loss": -12.096050262451172, "global_step": 280467, "epoch": 1669} {"train_loss": -12.000358581542969, "global_step": 280468, "epoch": 1669} {"train_loss": -11.9924955368042, "global_step": 280469, "epoch": 1669} {"train_loss": -11.818615913391113, "global_step": 280470, "epoch": 1669} {"train_loss": -11.992592811584473, "global_step": 280471, "epoch": 1669} {"train_loss": -12.063953399658203, "global_step": 280472, "epoch": 1669} {"train_loss": -11.705101013183594, "global_step": 280473, "epoch": 1669} {"train_loss": -11.330070495605469, "global_step": 280474, "epoch": 1669} {"train_loss": -12.070684432983398, "global_step": 280475, "epoch": 1669} {"train_loss": -11.659854888916016, "global_step": 280476, "epoch": 1669} {"train_loss": -11.168682098388672, "global_step": 280477, "epoch": 1669} {"train_loss": -11.445974349975586, "global_step": 280478, "epoch": 1669} {"train_loss": -11.86905288696289, "global_step": 280479, "epoch": 1669} {"train_loss": -10.978114128112793, "global_step": 280480, "epoch": 1669} {"train_loss": -11.444091796875, "global_step": 280481, "epoch": 1669} {"train_loss": -12.04465389251709, "global_step": 280482, "epoch": 1669} {"train_loss": -9.961181640625, "global_step": 280483, "epoch": 1669} {"train_loss": -10.08414077758789, "global_step": 280484, "epoch": 1669} {"train_loss": -10.984589576721191, "global_step": 280485, "epoch": 1669} {"train_loss": -11.854082107543945, "global_step": 280486, "epoch": 1669} {"train_loss": -10.864299774169922, "global_step": 280487, "epoch": 1669} {"train_loss": -11.85042953491211, "global_step": 280488, "epoch": 1669} {"train_loss": -11.317941665649414, "global_step": 280489, "epoch": 1669} {"train_loss": -11.394721984863281, "global_step": 280490, "epoch": 1669} {"train_loss": -11.807164192199707, "global_step": 280491, "epoch": 1669} {"train_loss": -11.893669128417969, "global_step": 280492, "epoch": 1669} {"train_loss": -11.611370086669922, "global_step": 280493, "epoch": 1669} {"train_loss": -11.667330741882324, "global_step": 280494, "epoch": 1669} {"train_loss": -11.505879402160645, "global_step": 280495, "epoch": 1669} {"train_loss": -10.395072937011719, "global_step": 280496, "epoch": 1669} {"train_loss": -11.197232246398926, "global_step": 280497, "epoch": 1669} {"train_loss": -11.187263488769531, "global_step": 280498, "epoch": 1669} {"train_loss": -10.619739532470703, "global_step": 280499, "epoch": 1669} {"train_loss": -11.682001113891602, "global_step": 280500, "epoch": 1669} {"train_loss": -10.294551849365234, "global_step": 280501, "epoch": 1669} {"train_loss": -10.62749195098877, "global_step": 280502, "epoch": 1669} {"train_loss": -11.722373962402344, "global_step": 280503, "epoch": 1669} {"train_loss": -11.090435028076172, "global_step": 280504, "epoch": 1669} {"train_loss": -11.54312801361084, "global_step": 280505, "epoch": 1669} {"train_loss": -11.54686164855957, "global_step": 280506, "epoch": 1669} {"train_loss": -10.898130416870117, "global_step": 280507, "epoch": 1669} {"train_loss": -11.497358322143555, "global_step": 280508, "epoch": 1669} {"train_loss": -11.425514221191406, "global_step": 280509, "epoch": 1669} {"train_loss": -11.386577606201172, "global_step": 280510, "epoch": 1669} {"train_loss": -11.54471492767334, "global_step": 280511, "epoch": 1669} {"train_loss": -10.214561462402344, "global_step": 280512, "epoch": 1669} {"train_loss": -11.625965118408203, "global_step": 280513, "epoch": 1669} {"train_loss": -10.917625427246094, "global_step": 280514, "epoch": 1669} {"train_loss": -12.141685485839844, "global_step": 280515, "epoch": 1669} {"train_loss": -11.22385025024414, "global_step": 280516, "epoch": 1669} {"train_loss": -11.412161827087402, "global_step": 280517, "epoch": 1669} {"train_loss": -11.188036918640137, "global_step": 280518, "epoch": 1669} {"train_loss": -11.456253051757812, "global_step": 280519, "epoch": 1669} {"train_loss": -11.782387733459473, "global_step": 280520, "epoch": 1669} {"train_loss": -11.157624244689941, "global_step": 280521, "epoch": 1669} {"train_loss": -11.752791404724121, "global_step": 280522, "epoch": 1669} {"train_loss": -11.704080581665039, "global_step": 280523, "epoch": 1669} {"train_loss": -11.494476318359375, "global_step": 280524, "epoch": 1669} {"train_loss": -11.85566520690918, "global_step": 280525, "epoch": 1669} {"train_loss": -11.671002388000488, "global_step": 280526, "epoch": 1669} {"train_loss": -11.58631420135498, "global_step": 280527, "epoch": 1669} {"train_loss": -12.114995002746582, "global_step": 280528, "epoch": 1669} {"train_loss": -11.287087440490723, "global_step": 280529, "epoch": 1669} {"train_loss": -11.811196327209473, "global_step": 280530, "epoch": 1669} {"train_loss": -11.437681198120117, "global_step": 280531, "epoch": 1669} {"train_loss": -11.842809677124023, "global_step": 280532, "epoch": 1669} {"train_loss": -11.92617416381836, "global_step": 280533, "epoch": 1669} {"train_loss": -11.810251235961914, "global_step": 280534, "epoch": 1669} {"train_loss": -11.842363357543945, "global_step": 280535, "epoch": 1669} {"train_loss": -11.491353988647461, "global_step": 280536, "epoch": 1669} {"train_loss": -12.015897750854492, "global_step": 280537, "epoch": 1669} {"train_loss": -11.882351875305176, "global_step": 280538, "epoch": 1669} {"train_loss": -11.915779113769531, "global_step": 280539, "epoch": 1669} {"train_loss": -12.031454086303711, "global_step": 280540, "epoch": 1669} {"train_loss": -11.896554946899414, "global_step": 280541, "epoch": 1669} {"train_loss": -11.8763427734375, "global_step": 280542, "epoch": 1669} {"train_loss": -12.118118286132812, "global_step": 280543, "epoch": 1669} {"train_loss": -12.150991439819336, "global_step": 280544, "epoch": 1669} {"train_loss": -12.112386703491211, "global_step": 280545, "epoch": 1669} {"train_loss": -11.980497360229492, "global_step": 280546, "epoch": 1669} {"train_loss": -12.13567066192627, "global_step": 280547, "epoch": 1669} {"train_loss": -12.166385650634766, "global_step": 280548, "epoch": 1669} {"train_loss": -12.230286598205566, "global_step": 280549, "epoch": 1669} {"train_loss": -12.352965354919434, "global_step": 280550, "epoch": 1669} {"train_loss": -12.230241775512695, "global_step": 280551, "epoch": 1669} {"train_loss": -12.154253005981445, "global_step": 280552, "epoch": 1669} {"train_loss": -12.291158676147461, "global_step": 280553, "epoch": 1669} {"train_loss": -12.339194297790527, "global_step": 280554, "epoch": 1669} {"train_loss": -12.26827621459961, "global_step": 280555, "epoch": 1669} {"train_loss": -12.229684829711914, "global_step": 280556, "epoch": 1669} {"train_loss": -12.0546236038208, "global_step": 280557, "epoch": 1669} {"train_loss": -12.08633804321289, "global_step": 280558, "epoch": 1669} {"train_loss": -11.675165897323971, "global_step": 280559, "epoch": 1669, "val_loss": 274910.6875} {"train_loss": -12.217206954956055, "global_step": 280560, "epoch": 1670} {"train_loss": -12.345321655273438, "global_step": 280561, "epoch": 1670} {"train_loss": -12.271811485290527, "global_step": 280562, "epoch": 1670} {"train_loss": -12.13258171081543, "global_step": 280563, "epoch": 1670} {"train_loss": -11.988907814025879, "global_step": 280564, "epoch": 1670} {"train_loss": -12.313443183898926, "global_step": 280565, "epoch": 1670} {"train_loss": -12.327190399169922, "global_step": 280566, "epoch": 1670} {"train_loss": -11.962327003479004, "global_step": 280567, "epoch": 1670} {"train_loss": -11.755532264709473, "global_step": 280568, "epoch": 1670} {"train_loss": -12.226717948913574, "global_step": 280569, "epoch": 1670} {"train_loss": -11.525046348571777, "global_step": 280570, "epoch": 1670} {"train_loss": -10.319734573364258, "global_step": 280571, "epoch": 1670} {"train_loss": -11.569229125976562, "global_step": 280572, "epoch": 1670} {"train_loss": -12.106718063354492, "global_step": 280573, "epoch": 1670} {"train_loss": -11.677022933959961, "global_step": 280574, "epoch": 1670} {"train_loss": -11.687686920166016, "global_step": 280575, "epoch": 1670} {"train_loss": -11.848690032958984, "global_step": 280576, "epoch": 1670} {"train_loss": -11.340007781982422, "global_step": 280577, "epoch": 1670} {"train_loss": -11.1376953125, "global_step": 280578, "epoch": 1670} {"train_loss": -11.789734840393066, "global_step": 280579, "epoch": 1670} {"train_loss": -11.56905746459961, "global_step": 280580, "epoch": 1670} {"train_loss": -11.118643760681152, "global_step": 280581, "epoch": 1670} {"train_loss": -12.239049911499023, "global_step": 280582, "epoch": 1670} {"train_loss": -11.418649673461914, "global_step": 280583, "epoch": 1670} {"train_loss": -10.5950927734375, "global_step": 280584, "epoch": 1670} {"train_loss": -11.067731857299805, "global_step": 280585, "epoch": 1670} {"train_loss": -11.750585556030273, "global_step": 280586, "epoch": 1670} {"train_loss": -11.272642135620117, "global_step": 280587, "epoch": 1670} {"train_loss": -11.590973854064941, "global_step": 280588, "epoch": 1670} {"train_loss": -12.105769157409668, "global_step": 280589, "epoch": 1670} {"train_loss": -11.30984115600586, "global_step": 280590, "epoch": 1670} {"train_loss": -12.326196670532227, "global_step": 280591, "epoch": 1670} {"train_loss": -11.818732261657715, "global_step": 280592, "epoch": 1670} {"train_loss": -12.195688247680664, "global_step": 280593, "epoch": 1670} {"train_loss": -11.827674865722656, "global_step": 280594, "epoch": 1670} {"train_loss": -11.911145210266113, "global_step": 280595, "epoch": 1670} {"train_loss": -11.930688858032227, "global_step": 280596, "epoch": 1670} {"train_loss": -11.695514678955078, "global_step": 280597, "epoch": 1670} {"train_loss": -11.686373710632324, "global_step": 280598, "epoch": 1670} {"train_loss": -11.721210479736328, "global_step": 280599, "epoch": 1670} {"train_loss": -11.625654220581055, "global_step": 280600, "epoch": 1670} {"train_loss": -11.682740211486816, "global_step": 280601, "epoch": 1670} {"train_loss": -11.374645233154297, "global_step": 280602, "epoch": 1670} {"train_loss": -11.500529289245605, "global_step": 280603, "epoch": 1670} {"train_loss": -11.07248306274414, "global_step": 280604, "epoch": 1670} {"train_loss": -11.875335693359375, "global_step": 280605, "epoch": 1670} {"train_loss": -11.015594482421875, "global_step": 280606, "epoch": 1670} {"train_loss": -11.832368850708008, "global_step": 280607, "epoch": 1670} {"train_loss": -11.198188781738281, "global_step": 280608, "epoch": 1670} {"train_loss": -11.225024223327637, "global_step": 280609, "epoch": 1670} {"train_loss": -11.81373405456543, "global_step": 280610, "epoch": 1670} {"train_loss": -11.193255424499512, "global_step": 280611, "epoch": 1670} {"train_loss": -11.855655670166016, "global_step": 280612, "epoch": 1670} {"train_loss": -11.725048065185547, "global_step": 280613, "epoch": 1670} {"train_loss": -11.848321914672852, "global_step": 280614, "epoch": 1670} {"train_loss": -11.649517059326172, "global_step": 280615, "epoch": 1670} {"train_loss": -11.679014205932617, "global_step": 280616, "epoch": 1670} {"train_loss": -11.286866188049316, "global_step": 280617, "epoch": 1670} {"train_loss": -11.979443550109863, "global_step": 280618, "epoch": 1670} {"train_loss": -11.673757553100586, "global_step": 280619, "epoch": 1670} {"train_loss": -11.545890808105469, "global_step": 280620, "epoch": 1670} {"train_loss": -11.596263885498047, "global_step": 280621, "epoch": 1670} {"train_loss": -12.06233024597168, "global_step": 280622, "epoch": 1670} {"train_loss": -12.028034210205078, "global_step": 280623, "epoch": 1670} {"train_loss": -12.321608543395996, "global_step": 280624, "epoch": 1670} {"train_loss": -12.068045616149902, "global_step": 280625, "epoch": 1670} {"train_loss": -12.133590698242188, "global_step": 280626, "epoch": 1670} {"train_loss": -11.931047439575195, "global_step": 280627, "epoch": 1670} {"train_loss": -12.033775329589844, "global_step": 280628, "epoch": 1670} {"train_loss": -11.799853324890137, "global_step": 280629, "epoch": 1670} {"train_loss": -11.979436874389648, "global_step": 280630, "epoch": 1670} {"train_loss": -11.843141555786133, "global_step": 280631, "epoch": 1670} {"train_loss": -12.240452766418457, "global_step": 280632, "epoch": 1670} {"train_loss": -11.578502655029297, "global_step": 280633, "epoch": 1670} {"train_loss": -11.514429092407227, "global_step": 280634, "epoch": 1670} {"train_loss": -11.834929466247559, "global_step": 280635, "epoch": 1670} {"train_loss": -11.488479614257812, "global_step": 280636, "epoch": 1670} {"train_loss": -11.95772933959961, "global_step": 280637, "epoch": 1670} {"train_loss": -12.036369323730469, "global_step": 280638, "epoch": 1670} {"train_loss": -11.910285949707031, "global_step": 280639, "epoch": 1670} {"train_loss": -12.202951431274414, "global_step": 280640, "epoch": 1670} {"train_loss": -11.84300422668457, "global_step": 280641, "epoch": 1670} {"train_loss": -12.079011917114258, "global_step": 280642, "epoch": 1670} {"train_loss": -11.980951309204102, "global_step": 280643, "epoch": 1670} {"train_loss": -12.230100631713867, "global_step": 280644, "epoch": 1670} {"train_loss": -12.127042770385742, "global_step": 280645, "epoch": 1670} {"train_loss": -12.10515022277832, "global_step": 280646, "epoch": 1670} {"train_loss": -12.051824569702148, "global_step": 280647, "epoch": 1670} {"train_loss": -11.902175903320312, "global_step": 280648, "epoch": 1670} {"train_loss": -12.183173179626465, "global_step": 280649, "epoch": 1670} {"train_loss": -11.99854564666748, "global_step": 280650, "epoch": 1670} {"train_loss": -12.110088348388672, "global_step": 280651, "epoch": 1670} {"train_loss": -12.19969654083252, "global_step": 280652, "epoch": 1670} {"train_loss": -12.307290077209473, "global_step": 280653, "epoch": 1670} {"train_loss": -12.133952140808105, "global_step": 280654, "epoch": 1670} {"train_loss": -12.07542610168457, "global_step": 280655, "epoch": 1670} {"train_loss": -12.274149894714355, "global_step": 280656, "epoch": 1670} {"train_loss": -11.743958473205566, "global_step": 280657, "epoch": 1670} {"train_loss": -12.330489158630371, "global_step": 280658, "epoch": 1670} {"train_loss": -12.127985954284668, "global_step": 280659, "epoch": 1670} {"train_loss": -12.20290756225586, "global_step": 280660, "epoch": 1670} {"train_loss": -11.829834938049316, "global_step": 280661, "epoch": 1670} {"train_loss": -12.138301849365234, "global_step": 280662, "epoch": 1670} {"train_loss": -12.089605331420898, "global_step": 280663, "epoch": 1670} {"train_loss": -12.327929496765137, "global_step": 280664, "epoch": 1670} {"train_loss": -12.218437194824219, "global_step": 280665, "epoch": 1670} {"train_loss": -11.88673210144043, "global_step": 280666, "epoch": 1670} {"train_loss": -12.243725776672363, "global_step": 280667, "epoch": 1670} {"train_loss": -12.344027519226074, "global_step": 280668, "epoch": 1670} {"train_loss": -11.733177185058594, "global_step": 280669, "epoch": 1670} {"train_loss": -11.798673629760742, "global_step": 280670, "epoch": 1670} {"train_loss": -12.41364574432373, "global_step": 280671, "epoch": 1670} {"train_loss": -11.989778518676758, "global_step": 280672, "epoch": 1670} {"train_loss": -12.201025009155273, "global_step": 280673, "epoch": 1670} {"train_loss": -12.236449241638184, "global_step": 280674, "epoch": 1670} {"train_loss": -11.812360763549805, "global_step": 280675, "epoch": 1670} {"train_loss": -12.075299263000488, "global_step": 280676, "epoch": 1670} {"train_loss": -12.094206809997559, "global_step": 280677, "epoch": 1670} {"train_loss": -11.328221321105957, "global_step": 280678, "epoch": 1670} {"train_loss": -11.530677795410156, "global_step": 280679, "epoch": 1670} {"train_loss": -12.18856430053711, "global_step": 280680, "epoch": 1670} {"train_loss": -11.423542022705078, "global_step": 280681, "epoch": 1670} {"train_loss": -11.683648109436035, "global_step": 280682, "epoch": 1670} {"train_loss": -11.949660301208496, "global_step": 280683, "epoch": 1670} {"train_loss": -12.00570297241211, "global_step": 280684, "epoch": 1670} {"train_loss": -11.934310913085938, "global_step": 280685, "epoch": 1670} {"train_loss": -12.126945495605469, "global_step": 280686, "epoch": 1670} {"train_loss": -11.738151550292969, "global_step": 280687, "epoch": 1670} {"train_loss": -12.068378448486328, "global_step": 280688, "epoch": 1670} {"train_loss": -12.273953437805176, "global_step": 280689, "epoch": 1670} {"train_loss": -12.054557800292969, "global_step": 280690, "epoch": 1670} {"train_loss": -12.151887893676758, "global_step": 280691, "epoch": 1670} {"train_loss": -11.736640930175781, "global_step": 280692, "epoch": 1670} {"train_loss": -11.839574813842773, "global_step": 280693, "epoch": 1670} {"train_loss": -12.16047477722168, "global_step": 280694, "epoch": 1670} {"train_loss": -12.166574478149414, "global_step": 280695, "epoch": 1670} {"train_loss": -12.215584754943848, "global_step": 280696, "epoch": 1670} {"train_loss": -12.048273086547852, "global_step": 280697, "epoch": 1670} {"train_loss": -12.087231636047363, "global_step": 280698, "epoch": 1670} {"train_loss": -12.162379264831543, "global_step": 280699, "epoch": 1670} {"train_loss": -11.894439697265625, "global_step": 280700, "epoch": 1670} {"train_loss": -11.898752212524414, "global_step": 280701, "epoch": 1670} {"train_loss": -12.036846160888672, "global_step": 280702, "epoch": 1670} {"train_loss": -11.961462020874023, "global_step": 280703, "epoch": 1670} {"train_loss": -11.78931999206543, "global_step": 280704, "epoch": 1670} {"train_loss": -12.292047500610352, "global_step": 280705, "epoch": 1670} {"train_loss": -11.955893516540527, "global_step": 280706, "epoch": 1670} {"train_loss": -12.444734573364258, "global_step": 280707, "epoch": 1670} {"train_loss": -12.028903007507324, "global_step": 280708, "epoch": 1670} {"train_loss": -12.27505111694336, "global_step": 280709, "epoch": 1670} {"train_loss": -11.979061126708984, "global_step": 280710, "epoch": 1670} {"train_loss": -11.948318481445312, "global_step": 280711, "epoch": 1670} {"train_loss": -12.100224494934082, "global_step": 280712, "epoch": 1670} {"train_loss": -12.064521789550781, "global_step": 280713, "epoch": 1670} {"train_loss": -11.62440299987793, "global_step": 280714, "epoch": 1670} {"train_loss": -10.404632568359375, "global_step": 280715, "epoch": 1670} {"train_loss": -11.18912124633789, "global_step": 280716, "epoch": 1670} {"train_loss": -11.939556121826172, "global_step": 280717, "epoch": 1670} {"train_loss": -10.920853614807129, "global_step": 280718, "epoch": 1670} {"train_loss": -10.370349884033203, "global_step": 280719, "epoch": 1670} {"train_loss": -12.414030075073242, "global_step": 280720, "epoch": 1670} {"train_loss": -11.105358123779297, "global_step": 280721, "epoch": 1670} {"train_loss": -10.863395690917969, "global_step": 280722, "epoch": 1670} {"train_loss": -11.551675796508789, "global_step": 280723, "epoch": 1670} {"train_loss": -11.807079315185547, "global_step": 280724, "epoch": 1670} {"train_loss": -11.902278900146484, "global_step": 280725, "epoch": 1670} {"train_loss": -11.693610191345215, "global_step": 280726, "epoch": 1670} {"train_loss": -11.842588265736898, "global_step": 280727, "epoch": 1670, "val_loss": 273719.84375, "train_action_mse_error": 2.0103094577789307} {"train_loss": -11.813346862792969, "global_step": 280728, "epoch": 1671} {"train_loss": -11.32174301147461, "global_step": 280729, "epoch": 1671} {"train_loss": -11.832244873046875, "global_step": 280730, "epoch": 1671} {"train_loss": -11.509416580200195, "global_step": 280731, "epoch": 1671} {"train_loss": -11.622577667236328, "global_step": 280732, "epoch": 1671} {"train_loss": -12.27244758605957, "global_step": 280733, "epoch": 1671} {"train_loss": -11.610219955444336, "global_step": 280734, "epoch": 1671} {"train_loss": -11.409741401672363, "global_step": 280735, "epoch": 1671} {"train_loss": -11.830181121826172, "global_step": 280736, "epoch": 1671} {"train_loss": -10.993586540222168, "global_step": 280737, "epoch": 1671} {"train_loss": -11.92403793334961, "global_step": 280738, "epoch": 1671} {"train_loss": -11.01794147491455, "global_step": 280739, "epoch": 1671} {"train_loss": -11.498552322387695, "global_step": 280740, "epoch": 1671} {"train_loss": -11.694640159606934, "global_step": 280741, "epoch": 1671} {"train_loss": -10.251022338867188, "global_step": 280742, "epoch": 1671} {"train_loss": -11.030838966369629, "global_step": 280743, "epoch": 1671} {"train_loss": -11.96048355102539, "global_step": 280744, "epoch": 1671} {"train_loss": -10.92317008972168, "global_step": 280745, "epoch": 1671} {"train_loss": -10.834964752197266, "global_step": 280746, "epoch": 1671} {"train_loss": -11.237838745117188, "global_step": 280747, "epoch": 1671} {"train_loss": -11.730864524841309, "global_step": 280748, "epoch": 1671} {"train_loss": -11.433019638061523, "global_step": 280749, "epoch": 1671} {"train_loss": -11.72297191619873, "global_step": 280750, "epoch": 1671} {"train_loss": -11.976190567016602, "global_step": 280751, "epoch": 1671} {"train_loss": -11.507186889648438, "global_step": 280752, "epoch": 1671} {"train_loss": -11.589433670043945, "global_step": 280753, "epoch": 1671} {"train_loss": -11.911822319030762, "global_step": 280754, "epoch": 1671} {"train_loss": -11.87299919128418, "global_step": 280755, "epoch": 1671} {"train_loss": -11.682662010192871, "global_step": 280756, "epoch": 1671} {"train_loss": -11.955731391906738, "global_step": 280757, "epoch": 1671} {"train_loss": -11.844782829284668, "global_step": 280758, "epoch": 1671} {"train_loss": -12.045979499816895, "global_step": 280759, "epoch": 1671} {"train_loss": -11.997844696044922, "global_step": 280760, "epoch": 1671} {"train_loss": -11.840924263000488, "global_step": 280761, "epoch": 1671} {"train_loss": -11.934579849243164, "global_step": 280762, "epoch": 1671} {"train_loss": -11.913864135742188, "global_step": 280763, "epoch": 1671} {"train_loss": -11.691178321838379, "global_step": 280764, "epoch": 1671} {"train_loss": -11.957157135009766, "global_step": 280765, "epoch": 1671} {"train_loss": -12.130044937133789, "global_step": 280766, "epoch": 1671} {"train_loss": -12.210529327392578, "global_step": 280767, "epoch": 1671} {"train_loss": -11.974381446838379, "global_step": 280768, "epoch": 1671} {"train_loss": -12.130093574523926, "global_step": 280769, "epoch": 1671} {"train_loss": -12.065446853637695, "global_step": 280770, "epoch": 1671} {"train_loss": -11.826696395874023, "global_step": 280771, "epoch": 1671} {"train_loss": -12.208964347839355, "global_step": 280772, "epoch": 1671} {"train_loss": -11.990812301635742, "global_step": 280773, "epoch": 1671} {"train_loss": -12.20976734161377, "global_step": 280774, "epoch": 1671} {"train_loss": -12.050928115844727, "global_step": 280775, "epoch": 1671} {"train_loss": -11.887453079223633, "global_step": 280776, "epoch": 1671} {"train_loss": -12.165534019470215, "global_step": 280777, "epoch": 1671} {"train_loss": -12.165975570678711, "global_step": 280778, "epoch": 1671} {"train_loss": -11.957196235656738, "global_step": 280779, "epoch": 1671} {"train_loss": -12.373233795166016, "global_step": 280780, "epoch": 1671} {"train_loss": -12.098213195800781, "global_step": 280781, "epoch": 1671} {"train_loss": -12.370133399963379, "global_step": 280782, "epoch": 1671} {"train_loss": -12.328914642333984, "global_step": 280783, "epoch": 1671} {"train_loss": -12.196958541870117, "global_step": 280784, "epoch": 1671} {"train_loss": -12.174188613891602, "global_step": 280785, "epoch": 1671} {"train_loss": -12.10676383972168, "global_step": 280786, "epoch": 1671} {"train_loss": -12.185150146484375, "global_step": 280787, "epoch": 1671} {"train_loss": -12.396451950073242, "global_step": 280788, "epoch": 1671} {"train_loss": -11.75680923461914, "global_step": 280789, "epoch": 1671} {"train_loss": -11.156370162963867, "global_step": 280790, "epoch": 1671} {"train_loss": -11.629155158996582, "global_step": 280791, "epoch": 1671} {"train_loss": -11.999567031860352, "global_step": 280792, "epoch": 1671} {"train_loss": -11.3351411819458, "global_step": 280793, "epoch": 1671} {"train_loss": -10.867514610290527, "global_step": 280794, "epoch": 1671} {"train_loss": -11.688913345336914, "global_step": 280795, "epoch": 1671} {"train_loss": -12.229497909545898, "global_step": 280796, "epoch": 1671} {"train_loss": -12.21961784362793, "global_step": 280797, "epoch": 1671} {"train_loss": -11.86945915222168, "global_step": 280798, "epoch": 1671} {"train_loss": -12.235997200012207, "global_step": 280799, "epoch": 1671} {"train_loss": -12.056848526000977, "global_step": 280800, "epoch": 1671} {"train_loss": -12.07848072052002, "global_step": 280801, "epoch": 1671} {"train_loss": -12.349851608276367, "global_step": 280802, "epoch": 1671} {"train_loss": -12.281885147094727, "global_step": 280803, "epoch": 1671} {"train_loss": -12.351034164428711, "global_step": 280804, "epoch": 1671} {"train_loss": -12.370221138000488, "global_step": 280805, "epoch": 1671} {"train_loss": -12.3855562210083, "global_step": 280806, "epoch": 1671} {"train_loss": -12.184722900390625, "global_step": 280807, "epoch": 1671} {"train_loss": -12.199546813964844, "global_step": 280808, "epoch": 1671} {"train_loss": -11.446100234985352, "global_step": 280809, "epoch": 1671} {"train_loss": -10.730381965637207, "global_step": 280810, "epoch": 1671} {"train_loss": -10.823516845703125, "global_step": 280811, "epoch": 1671} {"train_loss": -11.924549102783203, "global_step": 280812, "epoch": 1671} {"train_loss": -9.60108470916748, "global_step": 280813, "epoch": 1671} {"train_loss": -10.505783081054688, "global_step": 280814, "epoch": 1671} {"train_loss": -11.723718643188477, "global_step": 280815, "epoch": 1671} {"train_loss": -9.58301067352295, "global_step": 280816, "epoch": 1671} {"train_loss": -11.44027328491211, "global_step": 280817, "epoch": 1671} {"train_loss": -10.926822662353516, "global_step": 280818, "epoch": 1671} {"train_loss": -10.282129287719727, "global_step": 280819, "epoch": 1671} {"train_loss": -11.036712646484375, "global_step": 280820, "epoch": 1671} {"train_loss": -10.392465591430664, "global_step": 280821, "epoch": 1671} {"train_loss": -9.931264877319336, "global_step": 280822, "epoch": 1671} {"train_loss": -11.150801658630371, "global_step": 280823, "epoch": 1671} {"train_loss": -10.65867805480957, "global_step": 280824, "epoch": 1671} {"train_loss": -11.233369827270508, "global_step": 280825, "epoch": 1671} {"train_loss": -10.508075714111328, "global_step": 280826, "epoch": 1671} {"train_loss": -10.736129760742188, "global_step": 280827, "epoch": 1671} {"train_loss": -10.183828353881836, "global_step": 280828, "epoch": 1671} {"train_loss": -10.773113250732422, "global_step": 280829, "epoch": 1671} {"train_loss": -10.107847213745117, "global_step": 280830, "epoch": 1671} {"train_loss": -10.432605743408203, "global_step": 280831, "epoch": 1671} {"train_loss": -10.915477752685547, "global_step": 280832, "epoch": 1671} {"train_loss": -11.178420066833496, "global_step": 280833, "epoch": 1671} {"train_loss": -10.941483497619629, "global_step": 280834, "epoch": 1671} {"train_loss": -10.984763145446777, "global_step": 280835, "epoch": 1671} {"train_loss": -10.82701301574707, "global_step": 280836, "epoch": 1671} {"train_loss": -10.906017303466797, "global_step": 280837, "epoch": 1671} {"train_loss": -10.694282531738281, "global_step": 280838, "epoch": 1671} {"train_loss": -10.405683517456055, "global_step": 280839, "epoch": 1671} {"train_loss": -10.839393615722656, "global_step": 280840, "epoch": 1671} {"train_loss": -11.171441078186035, "global_step": 280841, "epoch": 1671} {"train_loss": -10.511575698852539, "global_step": 280842, "epoch": 1671} {"train_loss": -11.158390998840332, "global_step": 280843, "epoch": 1671} {"train_loss": -10.911489486694336, "global_step": 280844, "epoch": 1671} {"train_loss": -11.242462158203125, "global_step": 280845, "epoch": 1671} {"train_loss": -11.58975887298584, "global_step": 280846, "epoch": 1671} {"train_loss": -11.419048309326172, "global_step": 280847, "epoch": 1671} {"train_loss": -11.682226181030273, "global_step": 280848, "epoch": 1671} {"train_loss": -11.583296775817871, "global_step": 280849, "epoch": 1671} {"train_loss": -11.5743408203125, "global_step": 280850, "epoch": 1671} {"train_loss": -11.545759201049805, "global_step": 280851, "epoch": 1671} {"train_loss": -11.302906036376953, "global_step": 280852, "epoch": 1671} {"train_loss": -11.90410041809082, "global_step": 280853, "epoch": 1671} {"train_loss": -11.1310396194458, "global_step": 280854, "epoch": 1671} {"train_loss": -11.540523529052734, "global_step": 280855, "epoch": 1671} {"train_loss": -11.46705436706543, "global_step": 280856, "epoch": 1671} {"train_loss": -11.437870025634766, "global_step": 280857, "epoch": 1671} {"train_loss": -11.710201263427734, "global_step": 280858, "epoch": 1671} {"train_loss": -11.794447898864746, "global_step": 280859, "epoch": 1671} {"train_loss": -11.899116516113281, "global_step": 280860, "epoch": 1671} {"train_loss": -11.833257675170898, "global_step": 280861, "epoch": 1671} {"train_loss": -11.856138229370117, "global_step": 280862, "epoch": 1671} {"train_loss": -11.782463073730469, "global_step": 280863, "epoch": 1671} {"train_loss": -11.898625373840332, "global_step": 280864, "epoch": 1671} {"train_loss": -11.822391510009766, "global_step": 280865, "epoch": 1671} {"train_loss": -11.723418235778809, "global_step": 280866, "epoch": 1671} {"train_loss": -11.924315452575684, "global_step": 280867, "epoch": 1671} {"train_loss": -11.749464988708496, "global_step": 280868, "epoch": 1671} {"train_loss": -11.77801513671875, "global_step": 280869, "epoch": 1671} {"train_loss": -11.771265029907227, "global_step": 280870, "epoch": 1671} {"train_loss": -11.898382186889648, "global_step": 280871, "epoch": 1671} {"train_loss": -11.741888999938965, "global_step": 280872, "epoch": 1671} {"train_loss": -12.039437294006348, "global_step": 280873, "epoch": 1671} {"train_loss": -11.98857593536377, "global_step": 280874, "epoch": 1671} {"train_loss": -11.944698333740234, "global_step": 280875, "epoch": 1671} {"train_loss": -12.04796314239502, "global_step": 280876, "epoch": 1671} {"train_loss": -11.82613754272461, "global_step": 280877, "epoch": 1671} {"train_loss": -12.059884071350098, "global_step": 280878, "epoch": 1671} {"train_loss": -11.884309768676758, "global_step": 280879, "epoch": 1671} {"train_loss": -11.877985000610352, "global_step": 280880, "epoch": 1671} {"train_loss": -12.044219970703125, "global_step": 280881, "epoch": 1671} {"train_loss": -12.24072265625, "global_step": 280882, "epoch": 1671} {"train_loss": -12.010980606079102, "global_step": 280883, "epoch": 1671} {"train_loss": -12.172983169555664, "global_step": 280884, "epoch": 1671} {"train_loss": -12.077764511108398, "global_step": 280885, "epoch": 1671} {"train_loss": -12.144170761108398, "global_step": 280886, "epoch": 1671} {"train_loss": -12.369342803955078, "global_step": 280887, "epoch": 1671} {"train_loss": -12.37594985961914, "global_step": 280888, "epoch": 1671} {"train_loss": -12.160871505737305, "global_step": 280889, "epoch": 1671} {"train_loss": -12.324576377868652, "global_step": 280890, "epoch": 1671} {"train_loss": -12.186515808105469, "global_step": 280891, "epoch": 1671} {"train_loss": -12.187112808227539, "global_step": 280892, "epoch": 1671} {"train_loss": -12.307101249694824, "global_step": 280893, "epoch": 1671} {"train_loss": -12.401935577392578, "global_step": 280894, "epoch": 1671} {"train_loss": -11.622200999941144, "global_step": 280895, "epoch": 1671, "val_loss": 277123.75} {"train_loss": -12.249619483947754, "global_step": 280896, "epoch": 1672} {"train_loss": -12.338617324829102, "global_step": 280897, "epoch": 1672} {"train_loss": -12.338085174560547, "global_step": 280898, "epoch": 1672} {"train_loss": -12.36583137512207, "global_step": 280899, "epoch": 1672} {"train_loss": -12.135376930236816, "global_step": 280900, "epoch": 1672} {"train_loss": -12.299291610717773, "global_step": 280901, "epoch": 1672} {"train_loss": -12.12881088256836, "global_step": 280902, "epoch": 1672} {"train_loss": -12.146992683410645, "global_step": 280903, "epoch": 1672} {"train_loss": -12.256693840026855, "global_step": 280904, "epoch": 1672} {"train_loss": -12.255855560302734, "global_step": 280905, "epoch": 1672} {"train_loss": -11.687812805175781, "global_step": 280906, "epoch": 1672} {"train_loss": -12.394248962402344, "global_step": 280907, "epoch": 1672} {"train_loss": -11.824915885925293, "global_step": 280908, "epoch": 1672} {"train_loss": -11.293706893920898, "global_step": 280909, "epoch": 1672} {"train_loss": -10.9127197265625, "global_step": 280910, "epoch": 1672} {"train_loss": -11.622745513916016, "global_step": 280911, "epoch": 1672} {"train_loss": -11.831910133361816, "global_step": 280912, "epoch": 1672} {"train_loss": -11.32181453704834, "global_step": 280913, "epoch": 1672} {"train_loss": -12.255908012390137, "global_step": 280914, "epoch": 1672} {"train_loss": -11.494670867919922, "global_step": 280915, "epoch": 1672} {"train_loss": -11.500692367553711, "global_step": 280916, "epoch": 1672} {"train_loss": -11.583840370178223, "global_step": 280917, "epoch": 1672} {"train_loss": -11.906514167785645, "global_step": 280918, "epoch": 1672} {"train_loss": -10.793058395385742, "global_step": 280919, "epoch": 1672} {"train_loss": -11.685617446899414, "global_step": 280920, "epoch": 1672} {"train_loss": -11.071420669555664, "global_step": 280921, "epoch": 1672} {"train_loss": -12.296884536743164, "global_step": 280922, "epoch": 1672} {"train_loss": -10.961764335632324, "global_step": 280923, "epoch": 1672} {"train_loss": -11.196601867675781, "global_step": 280924, "epoch": 1672} {"train_loss": -11.855735778808594, "global_step": 280925, "epoch": 1672} {"train_loss": -11.36439037322998, "global_step": 280926, "epoch": 1672} {"train_loss": -11.42625617980957, "global_step": 280927, "epoch": 1672} {"train_loss": -11.342510223388672, "global_step": 280928, "epoch": 1672} {"train_loss": -11.914714813232422, "global_step": 280929, "epoch": 1672} {"train_loss": -10.563612937927246, "global_step": 280930, "epoch": 1672} {"train_loss": -12.02723217010498, "global_step": 280931, "epoch": 1672} {"train_loss": -11.167631149291992, "global_step": 280932, "epoch": 1672} {"train_loss": -9.918625831604004, "global_step": 280933, "epoch": 1672} {"train_loss": -11.312698364257812, "global_step": 280934, "epoch": 1672} {"train_loss": -9.546659469604492, "global_step": 280935, "epoch": 1672} {"train_loss": -11.365388870239258, "global_step": 280936, "epoch": 1672} {"train_loss": -9.03489875793457, "global_step": 280937, "epoch": 1672} {"train_loss": -11.730070114135742, "global_step": 280938, "epoch": 1672} {"train_loss": -11.132248878479004, "global_step": 280939, "epoch": 1672} {"train_loss": -11.20245361328125, "global_step": 280940, "epoch": 1672} {"train_loss": -11.309537887573242, "global_step": 280941, "epoch": 1672} {"train_loss": -11.679757118225098, "global_step": 280942, "epoch": 1672} {"train_loss": -11.182339668273926, "global_step": 280943, "epoch": 1672} {"train_loss": -12.171128273010254, "global_step": 280944, "epoch": 1672} {"train_loss": -11.785667419433594, "global_step": 280945, "epoch": 1672} {"train_loss": -11.419210433959961, "global_step": 280946, "epoch": 1672} {"train_loss": -11.66787338256836, "global_step": 280947, "epoch": 1672} {"train_loss": -11.914064407348633, "global_step": 280948, "epoch": 1672} {"train_loss": -12.152694702148438, "global_step": 280949, "epoch": 1672} {"train_loss": -11.665918350219727, "global_step": 280950, "epoch": 1672} {"train_loss": -11.888541221618652, "global_step": 280951, "epoch": 1672} {"train_loss": -11.84743881225586, "global_step": 280952, "epoch": 1672} {"train_loss": -11.781307220458984, "global_step": 280953, "epoch": 1672} {"train_loss": -12.090085983276367, "global_step": 280954, "epoch": 1672} {"train_loss": -12.173397064208984, "global_step": 280955, "epoch": 1672} {"train_loss": -11.605487823486328, "global_step": 280956, "epoch": 1672} {"train_loss": -12.185287475585938, "global_step": 280957, "epoch": 1672} {"train_loss": -11.294351577758789, "global_step": 280958, "epoch": 1672} {"train_loss": -12.084785461425781, "global_step": 280959, "epoch": 1672} {"train_loss": -11.80976676940918, "global_step": 280960, "epoch": 1672} {"train_loss": -11.84233283996582, "global_step": 280961, "epoch": 1672} {"train_loss": -11.74958610534668, "global_step": 280962, "epoch": 1672} {"train_loss": -11.582080841064453, "global_step": 280963, "epoch": 1672} {"train_loss": -11.744215965270996, "global_step": 280964, "epoch": 1672} {"train_loss": -11.636262893676758, "global_step": 280965, "epoch": 1672} {"train_loss": -11.522010803222656, "global_step": 280966, "epoch": 1672} {"train_loss": -11.783817291259766, "global_step": 280967, "epoch": 1672} {"train_loss": -11.668375015258789, "global_step": 280968, "epoch": 1672} {"train_loss": -11.874100685119629, "global_step": 280969, "epoch": 1672} {"train_loss": -11.72058391571045, "global_step": 280970, "epoch": 1672} {"train_loss": -11.991741180419922, "global_step": 280971, "epoch": 1672} {"train_loss": -11.610267639160156, "global_step": 280972, "epoch": 1672} {"train_loss": -11.725688934326172, "global_step": 280973, "epoch": 1672} {"train_loss": -11.225004196166992, "global_step": 280974, "epoch": 1672} {"train_loss": -11.820152282714844, "global_step": 280975, "epoch": 1672} {"train_loss": -11.834588050842285, "global_step": 280976, "epoch": 1672} {"train_loss": -11.474008560180664, "global_step": 280977, "epoch": 1672} {"train_loss": -11.682329177856445, "global_step": 280978, "epoch": 1672} {"train_loss": -11.802492141723633, "global_step": 280979, "epoch": 1672} {"train_loss": -11.426782608032227, "global_step": 280980, "epoch": 1672} {"train_loss": -12.086090087890625, "global_step": 280981, "epoch": 1672} {"train_loss": -11.396653175354004, "global_step": 280982, "epoch": 1672} {"train_loss": -11.759167671203613, "global_step": 280983, "epoch": 1672} {"train_loss": -11.74791145324707, "global_step": 280984, "epoch": 1672} {"train_loss": -11.952608108520508, "global_step": 280985, "epoch": 1672} {"train_loss": -12.165779113769531, "global_step": 280986, "epoch": 1672} {"train_loss": -12.053670883178711, "global_step": 280987, "epoch": 1672} {"train_loss": -12.335423469543457, "global_step": 280988, "epoch": 1672} {"train_loss": -12.105476379394531, "global_step": 280989, "epoch": 1672} {"train_loss": -12.05416488647461, "global_step": 280990, "epoch": 1672} {"train_loss": -12.214797973632812, "global_step": 280991, "epoch": 1672} {"train_loss": -11.971823692321777, "global_step": 280992, "epoch": 1672} {"train_loss": -12.20368480682373, "global_step": 280993, "epoch": 1672} {"train_loss": -11.963932037353516, "global_step": 280994, "epoch": 1672} {"train_loss": -12.225412368774414, "global_step": 280995, "epoch": 1672} {"train_loss": -12.142648696899414, "global_step": 280996, "epoch": 1672} {"train_loss": -12.123348236083984, "global_step": 280997, "epoch": 1672} {"train_loss": -12.199604034423828, "global_step": 280998, "epoch": 1672} {"train_loss": -12.350149154663086, "global_step": 280999, "epoch": 1672} {"train_loss": -12.345695495605469, "global_step": 281000, "epoch": 1672} {"train_loss": -12.147441864013672, "global_step": 281001, "epoch": 1672} {"train_loss": -12.250935554504395, "global_step": 281002, "epoch": 1672} {"train_loss": -12.186795234680176, "global_step": 281003, "epoch": 1672} {"train_loss": -12.332893371582031, "global_step": 281004, "epoch": 1672} {"train_loss": -12.285884857177734, "global_step": 281005, "epoch": 1672} {"train_loss": -11.884425163269043, "global_step": 281006, "epoch": 1672} {"train_loss": -11.85556411743164, "global_step": 281007, "epoch": 1672} {"train_loss": -12.171034812927246, "global_step": 281008, "epoch": 1672} {"train_loss": -12.194581985473633, "global_step": 281009, "epoch": 1672} {"train_loss": -12.251299858093262, "global_step": 281010, "epoch": 1672} {"train_loss": -12.104961395263672, "global_step": 281011, "epoch": 1672} {"train_loss": -12.23931884765625, "global_step": 281012, "epoch": 1672} {"train_loss": -12.291071891784668, "global_step": 281013, "epoch": 1672} {"train_loss": -12.030435562133789, "global_step": 281014, "epoch": 1672} {"train_loss": -11.804110527038574, "global_step": 281015, "epoch": 1672} {"train_loss": -11.667104721069336, "global_step": 281016, "epoch": 1672} {"train_loss": -11.875500679016113, "global_step": 281017, "epoch": 1672} {"train_loss": -12.075491905212402, "global_step": 281018, "epoch": 1672} {"train_loss": -12.205184936523438, "global_step": 281019, "epoch": 1672} {"train_loss": -11.05257511138916, "global_step": 281020, "epoch": 1672} {"train_loss": -11.5662841796875, "global_step": 281021, "epoch": 1672} {"train_loss": -11.424932479858398, "global_step": 281022, "epoch": 1672} {"train_loss": -9.709345817565918, "global_step": 281023, "epoch": 1672} {"train_loss": -11.390997886657715, "global_step": 281024, "epoch": 1672} {"train_loss": -9.513318061828613, "global_step": 281025, "epoch": 1672} {"train_loss": -10.984363555908203, "global_step": 281026, "epoch": 1672} {"train_loss": -11.097723960876465, "global_step": 281027, "epoch": 1672} {"train_loss": -10.363751411437988, "global_step": 281028, "epoch": 1672} {"train_loss": -11.4367036819458, "global_step": 281029, "epoch": 1672} {"train_loss": -11.247238159179688, "global_step": 281030, "epoch": 1672} {"train_loss": -11.061720848083496, "global_step": 281031, "epoch": 1672} {"train_loss": -11.945823669433594, "global_step": 281032, "epoch": 1672} {"train_loss": -11.005691528320312, "global_step": 281033, "epoch": 1672} {"train_loss": -11.101207733154297, "global_step": 281034, "epoch": 1672} {"train_loss": -11.14621353149414, "global_step": 281035, "epoch": 1672} {"train_loss": -11.825098037719727, "global_step": 281036, "epoch": 1672} {"train_loss": -11.578300476074219, "global_step": 281037, "epoch": 1672} {"train_loss": -11.28267765045166, "global_step": 281038, "epoch": 1672} {"train_loss": -11.230218887329102, "global_step": 281039, "epoch": 1672} {"train_loss": -10.838357925415039, "global_step": 281040, "epoch": 1672} {"train_loss": -10.990764617919922, "global_step": 281041, "epoch": 1672} {"train_loss": -10.372196197509766, "global_step": 281042, "epoch": 1672} {"train_loss": -11.205915451049805, "global_step": 281043, "epoch": 1672} {"train_loss": -10.127409934997559, "global_step": 281044, "epoch": 1672} {"train_loss": -11.303821563720703, "global_step": 281045, "epoch": 1672} {"train_loss": -10.581302642822266, "global_step": 281046, "epoch": 1672} {"train_loss": -10.556421279907227, "global_step": 281047, "epoch": 1672} {"train_loss": -11.243715286254883, "global_step": 281048, "epoch": 1672} {"train_loss": -10.412137985229492, "global_step": 281049, "epoch": 1672} {"train_loss": -11.420506477355957, "global_step": 281050, "epoch": 1672} {"train_loss": -10.847137451171875, "global_step": 281051, "epoch": 1672} {"train_loss": -11.464800834655762, "global_step": 281052, "epoch": 1672} {"train_loss": -11.528888702392578, "global_step": 281053, "epoch": 1672} {"train_loss": -11.915717124938965, "global_step": 281054, "epoch": 1672} {"train_loss": -11.486759185791016, "global_step": 281055, "epoch": 1672} {"train_loss": -11.795024871826172, "global_step": 281056, "epoch": 1672} {"train_loss": -11.675300598144531, "global_step": 281057, "epoch": 1672} {"train_loss": -11.544079780578613, "global_step": 281058, "epoch": 1672} {"train_loss": -11.888236999511719, "global_step": 281059, "epoch": 1672} {"train_loss": -11.587757110595703, "global_step": 281060, "epoch": 1672} {"train_loss": -11.821952819824219, "global_step": 281061, "epoch": 1672} {"train_loss": -11.698690414428711, "global_step": 281062, "epoch": 1672} {"train_loss": -11.617213680630638, "global_step": 281063, "epoch": 1672, "val_loss": 276326.84375} {"train_loss": -11.703584671020508, "global_step": 281064, "epoch": 1673} {"train_loss": -11.716389656066895, "global_step": 281065, "epoch": 1673} {"train_loss": -11.598627090454102, "global_step": 281066, "epoch": 1673} {"train_loss": -11.816535949707031, "global_step": 281067, "epoch": 1673} {"train_loss": -11.067960739135742, "global_step": 281068, "epoch": 1673} {"train_loss": -11.729806900024414, "global_step": 281069, "epoch": 1673} {"train_loss": -11.28866195678711, "global_step": 281070, "epoch": 1673} {"train_loss": -11.57970142364502, "global_step": 281071, "epoch": 1673} {"train_loss": -11.58100414276123, "global_step": 281072, "epoch": 1673} {"train_loss": -11.571660995483398, "global_step": 281073, "epoch": 1673} {"train_loss": -11.814023971557617, "global_step": 281074, "epoch": 1673} {"train_loss": -11.482208251953125, "global_step": 281075, "epoch": 1673} {"train_loss": -11.571051597595215, "global_step": 281076, "epoch": 1673} {"train_loss": -11.70680046081543, "global_step": 281077, "epoch": 1673} {"train_loss": -11.78998851776123, "global_step": 281078, "epoch": 1673} {"train_loss": -12.057714462280273, "global_step": 281079, "epoch": 1673} {"train_loss": -11.739702224731445, "global_step": 281080, "epoch": 1673} {"train_loss": -12.054346084594727, "global_step": 281081, "epoch": 1673} {"train_loss": -12.109794616699219, "global_step": 281082, "epoch": 1673} {"train_loss": -12.188871383666992, "global_step": 281083, "epoch": 1673} {"train_loss": -11.992326736450195, "global_step": 281084, "epoch": 1673} {"train_loss": -12.254142761230469, "global_step": 281085, "epoch": 1673} {"train_loss": -12.264188766479492, "global_step": 281086, "epoch": 1673} {"train_loss": -11.895525932312012, "global_step": 281087, "epoch": 1673} {"train_loss": -12.136899948120117, "global_step": 281088, "epoch": 1673} {"train_loss": -12.131771087646484, "global_step": 281089, "epoch": 1673} {"train_loss": -11.992948532104492, "global_step": 281090, "epoch": 1673} {"train_loss": -11.966629028320312, "global_step": 281091, "epoch": 1673} {"train_loss": -12.056234359741211, "global_step": 281092, "epoch": 1673} {"train_loss": -12.137800216674805, "global_step": 281093, "epoch": 1673} {"train_loss": -12.032930374145508, "global_step": 281094, "epoch": 1673} {"train_loss": -12.176355361938477, "global_step": 281095, "epoch": 1673} {"train_loss": -12.331411361694336, "global_step": 281096, "epoch": 1673} {"train_loss": -12.21359920501709, "global_step": 281097, "epoch": 1673} {"train_loss": -12.392265319824219, "global_step": 281098, "epoch": 1673} {"train_loss": -12.104936599731445, "global_step": 281099, "epoch": 1673} {"train_loss": -12.082841873168945, "global_step": 281100, "epoch": 1673} {"train_loss": -12.248222351074219, "global_step": 281101, "epoch": 1673} {"train_loss": -12.409932136535645, "global_step": 281102, "epoch": 1673} {"train_loss": -12.372815132141113, "global_step": 281103, "epoch": 1673} {"train_loss": -12.17495346069336, "global_step": 281104, "epoch": 1673} {"train_loss": -12.275208473205566, "global_step": 281105, "epoch": 1673} {"train_loss": -12.42990493774414, "global_step": 281106, "epoch": 1673} {"train_loss": -12.33188247680664, "global_step": 281107, "epoch": 1673} {"train_loss": -12.194463729858398, "global_step": 281108, "epoch": 1673} {"train_loss": -12.398292541503906, "global_step": 281109, "epoch": 1673} {"train_loss": -12.545909881591797, "global_step": 281110, "epoch": 1673} {"train_loss": -12.533981323242188, "global_step": 281111, "epoch": 1673} {"train_loss": -12.211027145385742, "global_step": 281112, "epoch": 1673} {"train_loss": -12.447677612304688, "global_step": 281113, "epoch": 1673} {"train_loss": -12.307355880737305, "global_step": 281114, "epoch": 1673} {"train_loss": -12.22260570526123, "global_step": 281115, "epoch": 1673} {"train_loss": -12.435827255249023, "global_step": 281116, "epoch": 1673} {"train_loss": -12.185529708862305, "global_step": 281117, "epoch": 1673} {"train_loss": -12.27605152130127, "global_step": 281118, "epoch": 1673} {"train_loss": -12.152388572692871, "global_step": 281119, "epoch": 1673} {"train_loss": -12.176258087158203, "global_step": 281120, "epoch": 1673} {"train_loss": -12.342442512512207, "global_step": 281121, "epoch": 1673} {"train_loss": -12.152421951293945, "global_step": 281122, "epoch": 1673} {"train_loss": -11.905351638793945, "global_step": 281123, "epoch": 1673} {"train_loss": -11.891833305358887, "global_step": 281124, "epoch": 1673} {"train_loss": -12.29371166229248, "global_step": 281125, "epoch": 1673} {"train_loss": -11.928216934204102, "global_step": 281126, "epoch": 1673} {"train_loss": -12.217178344726562, "global_step": 281127, "epoch": 1673} {"train_loss": -11.855997085571289, "global_step": 281128, "epoch": 1673} {"train_loss": -11.582209587097168, "global_step": 281129, "epoch": 1673} {"train_loss": -11.831697463989258, "global_step": 281130, "epoch": 1673} {"train_loss": -12.061834335327148, "global_step": 281131, "epoch": 1673} {"train_loss": -12.017088890075684, "global_step": 281132, "epoch": 1673} {"train_loss": -11.854914665222168, "global_step": 281133, "epoch": 1673} {"train_loss": -11.691963195800781, "global_step": 281134, "epoch": 1673} {"train_loss": -11.975358963012695, "global_step": 281135, "epoch": 1673} {"train_loss": -12.232819557189941, "global_step": 281136, "epoch": 1673} {"train_loss": -11.797722816467285, "global_step": 281137, "epoch": 1673} {"train_loss": -11.300863265991211, "global_step": 281138, "epoch": 1673} {"train_loss": -11.96196174621582, "global_step": 281139, "epoch": 1673} {"train_loss": -12.202499389648438, "global_step": 281140, "epoch": 1673} {"train_loss": -11.87704849243164, "global_step": 281141, "epoch": 1673} {"train_loss": -11.748434066772461, "global_step": 281142, "epoch": 1673} {"train_loss": -11.674127578735352, "global_step": 281143, "epoch": 1673} {"train_loss": -12.081336975097656, "global_step": 281144, "epoch": 1673} {"train_loss": -11.996306419372559, "global_step": 281145, "epoch": 1673} {"train_loss": -11.997471809387207, "global_step": 281146, "epoch": 1673} {"train_loss": -11.748723983764648, "global_step": 281147, "epoch": 1673} {"train_loss": -11.630796432495117, "global_step": 281148, "epoch": 1673} {"train_loss": -11.183243751525879, "global_step": 281149, "epoch": 1673} {"train_loss": -11.043196678161621, "global_step": 281150, "epoch": 1673} {"train_loss": -11.572298049926758, "global_step": 281151, "epoch": 1673} {"train_loss": -11.242704391479492, "global_step": 281152, "epoch": 1673} {"train_loss": -10.646448135375977, "global_step": 281153, "epoch": 1673} {"train_loss": -11.162796020507812, "global_step": 281154, "epoch": 1673} {"train_loss": -11.32965087890625, "global_step": 281155, "epoch": 1673} {"train_loss": -10.327895164489746, "global_step": 281156, "epoch": 1673} {"train_loss": -11.808416366577148, "global_step": 281157, "epoch": 1673} {"train_loss": -10.755731582641602, "global_step": 281158, "epoch": 1673} {"train_loss": -10.892951965332031, "global_step": 281159, "epoch": 1673} {"train_loss": -11.539543151855469, "global_step": 281160, "epoch": 1673} {"train_loss": -11.174936294555664, "global_step": 281161, "epoch": 1673} {"train_loss": -11.887646675109863, "global_step": 281162, "epoch": 1673} {"train_loss": -11.136228561401367, "global_step": 281163, "epoch": 1673} {"train_loss": -11.639561653137207, "global_step": 281164, "epoch": 1673} {"train_loss": -11.460958480834961, "global_step": 281165, "epoch": 1673} {"train_loss": -11.195899963378906, "global_step": 281166, "epoch": 1673} {"train_loss": -11.565932273864746, "global_step": 281167, "epoch": 1673} {"train_loss": -10.890567779541016, "global_step": 281168, "epoch": 1673} {"train_loss": -11.613395690917969, "global_step": 281169, "epoch": 1673} {"train_loss": -11.01585578918457, "global_step": 281170, "epoch": 1673} {"train_loss": -10.983708381652832, "global_step": 281171, "epoch": 1673} {"train_loss": -11.38227653503418, "global_step": 281172, "epoch": 1673} {"train_loss": -11.465753555297852, "global_step": 281173, "epoch": 1673} {"train_loss": -10.89307975769043, "global_step": 281174, "epoch": 1673} {"train_loss": -11.319714546203613, "global_step": 281175, "epoch": 1673} {"train_loss": -10.436208724975586, "global_step": 281176, "epoch": 1673} {"train_loss": -10.261024475097656, "global_step": 281177, "epoch": 1673} {"train_loss": -9.24919319152832, "global_step": 281178, "epoch": 1673} {"train_loss": -9.715983390808105, "global_step": 281179, "epoch": 1673} {"train_loss": -8.915340423583984, "global_step": 281180, "epoch": 1673} {"train_loss": -11.25144100189209, "global_step": 281181, "epoch": 1673} {"train_loss": -9.910016059875488, "global_step": 281182, "epoch": 1673} {"train_loss": -9.389793395996094, "global_step": 281183, "epoch": 1673} {"train_loss": -11.554450035095215, "global_step": 281184, "epoch": 1673} {"train_loss": -9.534820556640625, "global_step": 281185, "epoch": 1673} {"train_loss": -11.089960098266602, "global_step": 281186, "epoch": 1673} {"train_loss": -11.213495254516602, "global_step": 281187, "epoch": 1673} {"train_loss": -10.811511039733887, "global_step": 281188, "epoch": 1673} {"train_loss": -11.584129333496094, "global_step": 281189, "epoch": 1673} {"train_loss": -10.572973251342773, "global_step": 281190, "epoch": 1673} {"train_loss": -10.899223327636719, "global_step": 281191, "epoch": 1673} {"train_loss": -11.470046043395996, "global_step": 281192, "epoch": 1673} {"train_loss": -10.910273551940918, "global_step": 281193, "epoch": 1673} {"train_loss": -11.232904434204102, "global_step": 281194, "epoch": 1673} {"train_loss": -10.934326171875, "global_step": 281195, "epoch": 1673} {"train_loss": -11.100048065185547, "global_step": 281196, "epoch": 1673} {"train_loss": -11.360191345214844, "global_step": 281197, "epoch": 1673} {"train_loss": -11.072219848632812, "global_step": 281198, "epoch": 1673} {"train_loss": -11.198909759521484, "global_step": 281199, "epoch": 1673} {"train_loss": -11.389472961425781, "global_step": 281200, "epoch": 1673} {"train_loss": -11.465900421142578, "global_step": 281201, "epoch": 1673} {"train_loss": -11.851058959960938, "global_step": 281202, "epoch": 1673} {"train_loss": -11.664020538330078, "global_step": 281203, "epoch": 1673} {"train_loss": -11.813043594360352, "global_step": 281204, "epoch": 1673} {"train_loss": -11.771821975708008, "global_step": 281205, "epoch": 1673} {"train_loss": -11.870887756347656, "global_step": 281206, "epoch": 1673} {"train_loss": -11.635187149047852, "global_step": 281207, "epoch": 1673} {"train_loss": -11.744138717651367, "global_step": 281208, "epoch": 1673} {"train_loss": -11.731762886047363, "global_step": 281209, "epoch": 1673} {"train_loss": -11.916732788085938, "global_step": 281210, "epoch": 1673} {"train_loss": -11.952743530273438, "global_step": 281211, "epoch": 1673} {"train_loss": -11.933952331542969, "global_step": 281212, "epoch": 1673} {"train_loss": -12.053953170776367, "global_step": 281213, "epoch": 1673} {"train_loss": -11.605001449584961, "global_step": 281214, "epoch": 1673} {"train_loss": -11.976442337036133, "global_step": 281215, "epoch": 1673} {"train_loss": -12.139270782470703, "global_step": 281216, "epoch": 1673} {"train_loss": -12.057973861694336, "global_step": 281217, "epoch": 1673} {"train_loss": -11.979815483093262, "global_step": 281218, "epoch": 1673} {"train_loss": -12.081829071044922, "global_step": 281219, "epoch": 1673} {"train_loss": -11.900121688842773, "global_step": 281220, "epoch": 1673} {"train_loss": -11.737622261047363, "global_step": 281221, "epoch": 1673} {"train_loss": -11.936811447143555, "global_step": 281222, "epoch": 1673} {"train_loss": -12.036845207214355, "global_step": 281223, "epoch": 1673} {"train_loss": -11.947486877441406, "global_step": 281224, "epoch": 1673} {"train_loss": -11.991719245910645, "global_step": 281225, "epoch": 1673} {"train_loss": -12.10614013671875, "global_step": 281226, "epoch": 1673} {"train_loss": -12.050239562988281, "global_step": 281227, "epoch": 1673} {"train_loss": -11.90872859954834, "global_step": 281228, "epoch": 1673} {"train_loss": -12.129840850830078, "global_step": 281229, "epoch": 1673} {"train_loss": -12.058698654174805, "global_step": 281230, "epoch": 1673} {"train_loss": -11.665783831051417, "global_step": 281231, "epoch": 1673, "val_loss": 273086.09375} {"train_loss": -12.244745254516602, "global_step": 281232, "epoch": 1674} {"train_loss": -11.928339004516602, "global_step": 281233, "epoch": 1674} {"train_loss": -12.151006698608398, "global_step": 281234, "epoch": 1674} {"train_loss": -12.019159317016602, "global_step": 281235, "epoch": 1674} {"train_loss": -12.233686447143555, "global_step": 281236, "epoch": 1674} {"train_loss": -12.160749435424805, "global_step": 281237, "epoch": 1674} {"train_loss": -12.222782135009766, "global_step": 281238, "epoch": 1674} {"train_loss": -12.146453857421875, "global_step": 281239, "epoch": 1674} {"train_loss": -12.4016752243042, "global_step": 281240, "epoch": 1674} {"train_loss": -12.239645957946777, "global_step": 281241, "epoch": 1674} {"train_loss": -12.21362590789795, "global_step": 281242, "epoch": 1674} {"train_loss": -12.342317581176758, "global_step": 281243, "epoch": 1674} {"train_loss": -12.398478507995605, "global_step": 281244, "epoch": 1674} {"train_loss": -12.386281967163086, "global_step": 281245, "epoch": 1674} {"train_loss": -12.104317665100098, "global_step": 281246, "epoch": 1674} {"train_loss": -12.323371887207031, "global_step": 281247, "epoch": 1674} {"train_loss": -12.146137237548828, "global_step": 281248, "epoch": 1674} {"train_loss": -12.33920669555664, "global_step": 281249, "epoch": 1674} {"train_loss": -12.293719291687012, "global_step": 281250, "epoch": 1674} {"train_loss": -12.338846206665039, "global_step": 281251, "epoch": 1674} {"train_loss": -12.142644882202148, "global_step": 281252, "epoch": 1674} {"train_loss": -12.418892860412598, "global_step": 281253, "epoch": 1674} {"train_loss": -12.316774368286133, "global_step": 281254, "epoch": 1674} {"train_loss": -12.347641944885254, "global_step": 281255, "epoch": 1674} {"train_loss": -11.959644317626953, "global_step": 281256, "epoch": 1674} {"train_loss": -12.412229537963867, "global_step": 281257, "epoch": 1674} {"train_loss": -12.189042091369629, "global_step": 281258, "epoch": 1674} {"train_loss": -12.293912887573242, "global_step": 281259, "epoch": 1674} {"train_loss": -12.4464693069458, "global_step": 281260, "epoch": 1674} {"train_loss": -12.101495742797852, "global_step": 281261, "epoch": 1674} {"train_loss": -12.08165168762207, "global_step": 281262, "epoch": 1674} {"train_loss": -12.198738098144531, "global_step": 281263, "epoch": 1674} {"train_loss": -12.168558120727539, "global_step": 281264, "epoch": 1674} {"train_loss": -12.069683074951172, "global_step": 281265, "epoch": 1674} {"train_loss": -12.375246047973633, "global_step": 281266, "epoch": 1674} {"train_loss": -11.985708236694336, "global_step": 281267, "epoch": 1674} {"train_loss": -12.35265064239502, "global_step": 281268, "epoch": 1674} {"train_loss": -12.319581031799316, "global_step": 281269, "epoch": 1674} {"train_loss": -12.10053825378418, "global_step": 281270, "epoch": 1674} {"train_loss": -11.358426094055176, "global_step": 281271, "epoch": 1674} {"train_loss": -11.476015090942383, "global_step": 281272, "epoch": 1674} {"train_loss": -11.905542373657227, "global_step": 281273, "epoch": 1674} {"train_loss": -11.719507217407227, "global_step": 281274, "epoch": 1674} {"train_loss": -10.282236099243164, "global_step": 281275, "epoch": 1674} {"train_loss": -11.358053207397461, "global_step": 281276, "epoch": 1674} {"train_loss": -12.160539627075195, "global_step": 281277, "epoch": 1674} {"train_loss": -11.945062637329102, "global_step": 281278, "epoch": 1674} {"train_loss": -11.8203706741333, "global_step": 281279, "epoch": 1674} {"train_loss": -11.545625686645508, "global_step": 281280, "epoch": 1674} {"train_loss": -11.518864631652832, "global_step": 281281, "epoch": 1674} {"train_loss": -11.637346267700195, "global_step": 281282, "epoch": 1674} {"train_loss": -11.985374450683594, "global_step": 281283, "epoch": 1674} {"train_loss": -11.568168640136719, "global_step": 281284, "epoch": 1674} {"train_loss": -11.946274757385254, "global_step": 281285, "epoch": 1674} {"train_loss": -11.998003005981445, "global_step": 281286, "epoch": 1674} {"train_loss": -10.439641952514648, "global_step": 281287, "epoch": 1674} {"train_loss": -11.346304893493652, "global_step": 281288, "epoch": 1674} {"train_loss": -11.235472679138184, "global_step": 281289, "epoch": 1674} {"train_loss": -10.815117835998535, "global_step": 281290, "epoch": 1674} {"train_loss": -11.675217628479004, "global_step": 281291, "epoch": 1674} {"train_loss": -11.671907424926758, "global_step": 281292, "epoch": 1674} {"train_loss": -10.961944580078125, "global_step": 281293, "epoch": 1674} {"train_loss": -11.550701141357422, "global_step": 281294, "epoch": 1674} {"train_loss": -11.618941307067871, "global_step": 281295, "epoch": 1674} {"train_loss": -11.41177749633789, "global_step": 281296, "epoch": 1674} {"train_loss": -11.889864921569824, "global_step": 281297, "epoch": 1674} {"train_loss": -11.49231243133545, "global_step": 281298, "epoch": 1674} {"train_loss": -11.704498291015625, "global_step": 281299, "epoch": 1674} {"train_loss": -12.080967903137207, "global_step": 281300, "epoch": 1674} {"train_loss": -11.601183891296387, "global_step": 281301, "epoch": 1674} {"train_loss": -12.174579620361328, "global_step": 281302, "epoch": 1674} {"train_loss": -11.99589729309082, "global_step": 281303, "epoch": 1674} {"train_loss": -11.894308090209961, "global_step": 281304, "epoch": 1674} {"train_loss": -11.765382766723633, "global_step": 281305, "epoch": 1674} {"train_loss": -11.842867851257324, "global_step": 281306, "epoch": 1674} {"train_loss": -11.40771198272705, "global_step": 281307, "epoch": 1674} {"train_loss": -11.751416206359863, "global_step": 281308, "epoch": 1674} {"train_loss": -11.226533889770508, "global_step": 281309, "epoch": 1674} {"train_loss": -11.459684371948242, "global_step": 281310, "epoch": 1674} {"train_loss": -12.13486099243164, "global_step": 281311, "epoch": 1674} {"train_loss": -12.128053665161133, "global_step": 281312, "epoch": 1674} {"train_loss": -12.234970092773438, "global_step": 281313, "epoch": 1674} {"train_loss": -12.036714553833008, "global_step": 281314, "epoch": 1674} {"train_loss": -11.921095848083496, "global_step": 281315, "epoch": 1674} {"train_loss": -12.097667694091797, "global_step": 281316, "epoch": 1674} {"train_loss": -11.782581329345703, "global_step": 281317, "epoch": 1674} {"train_loss": -11.9569673538208, "global_step": 281318, "epoch": 1674} {"train_loss": -11.798477172851562, "global_step": 281319, "epoch": 1674} {"train_loss": -11.965262413024902, "global_step": 281320, "epoch": 1674} {"train_loss": -11.940973281860352, "global_step": 281321, "epoch": 1674} {"train_loss": -11.85740852355957, "global_step": 281322, "epoch": 1674} {"train_loss": -11.777738571166992, "global_step": 281323, "epoch": 1674} {"train_loss": -12.089688301086426, "global_step": 281324, "epoch": 1674} {"train_loss": -11.981475830078125, "global_step": 281325, "epoch": 1674} {"train_loss": -11.966864585876465, "global_step": 281326, "epoch": 1674} {"train_loss": -12.090227127075195, "global_step": 281327, "epoch": 1674} {"train_loss": -11.510038375854492, "global_step": 281328, "epoch": 1674} {"train_loss": -11.067229270935059, "global_step": 281329, "epoch": 1674} {"train_loss": -12.013450622558594, "global_step": 281330, "epoch": 1674} {"train_loss": -11.403274536132812, "global_step": 281331, "epoch": 1674} {"train_loss": -11.863155364990234, "global_step": 281332, "epoch": 1674} {"train_loss": -11.848710060119629, "global_step": 281333, "epoch": 1674} {"train_loss": -11.530593872070312, "global_step": 281334, "epoch": 1674} {"train_loss": -11.717508316040039, "global_step": 281335, "epoch": 1674} {"train_loss": -12.132728576660156, "global_step": 281336, "epoch": 1674} {"train_loss": -11.8369722366333, "global_step": 281337, "epoch": 1674} {"train_loss": -11.394449234008789, "global_step": 281338, "epoch": 1674} {"train_loss": -12.214566230773926, "global_step": 281339, "epoch": 1674} {"train_loss": -11.722432136535645, "global_step": 281340, "epoch": 1674} {"train_loss": -11.777994155883789, "global_step": 281341, "epoch": 1674} {"train_loss": -11.660064697265625, "global_step": 281342, "epoch": 1674} {"train_loss": -10.427153587341309, "global_step": 281343, "epoch": 1674} {"train_loss": -10.849989891052246, "global_step": 281344, "epoch": 1674} {"train_loss": -11.046222686767578, "global_step": 281345, "epoch": 1674} {"train_loss": -9.520509719848633, "global_step": 281346, "epoch": 1674} {"train_loss": -11.576948165893555, "global_step": 281347, "epoch": 1674} {"train_loss": -9.776604652404785, "global_step": 281348, "epoch": 1674} {"train_loss": -10.91728401184082, "global_step": 281349, "epoch": 1674} {"train_loss": -10.029250144958496, "global_step": 281350, "epoch": 1674} {"train_loss": -9.880813598632812, "global_step": 281351, "epoch": 1674} {"train_loss": -10.790355682373047, "global_step": 281352, "epoch": 1674} {"train_loss": -8.23713207244873, "global_step": 281353, "epoch": 1674} {"train_loss": -7.909760475158691, "global_step": 281354, "epoch": 1674} {"train_loss": -8.326082229614258, "global_step": 281355, "epoch": 1674} {"train_loss": -8.58658218383789, "global_step": 281356, "epoch": 1674} {"train_loss": -9.956435203552246, "global_step": 281357, "epoch": 1674} {"train_loss": -8.868536949157715, "global_step": 281358, "epoch": 1674} {"train_loss": -8.232224464416504, "global_step": 281359, "epoch": 1674} {"train_loss": -7.855982303619385, "global_step": 281360, "epoch": 1674} {"train_loss": -9.179281234741211, "global_step": 281361, "epoch": 1674} {"train_loss": -10.328950881958008, "global_step": 281362, "epoch": 1674} {"train_loss": -10.635093688964844, "global_step": 281363, "epoch": 1674} {"train_loss": -9.774552345275879, "global_step": 281364, "epoch": 1674} {"train_loss": -10.414668083190918, "global_step": 281365, "epoch": 1674} {"train_loss": -10.334001541137695, "global_step": 281366, "epoch": 1674} {"train_loss": -10.960344314575195, "global_step": 281367, "epoch": 1674} {"train_loss": -11.208633422851562, "global_step": 281368, "epoch": 1674} {"train_loss": -11.229461669921875, "global_step": 281369, "epoch": 1674} {"train_loss": -11.167976379394531, "global_step": 281370, "epoch": 1674} {"train_loss": -11.005669593811035, "global_step": 281371, "epoch": 1674} {"train_loss": -11.537797927856445, "global_step": 281372, "epoch": 1674} {"train_loss": -11.205509185791016, "global_step": 281373, "epoch": 1674} {"train_loss": -11.45205020904541, "global_step": 281374, "epoch": 1674} {"train_loss": -11.738534927368164, "global_step": 281375, "epoch": 1674} {"train_loss": -11.499414443969727, "global_step": 281376, "epoch": 1674} {"train_loss": -11.460983276367188, "global_step": 281377, "epoch": 1674} {"train_loss": -11.446353912353516, "global_step": 281378, "epoch": 1674} {"train_loss": -11.492643356323242, "global_step": 281379, "epoch": 1674} {"train_loss": -11.458321571350098, "global_step": 281380, "epoch": 1674} {"train_loss": -11.809284210205078, "global_step": 281381, "epoch": 1674} {"train_loss": -11.741143226623535, "global_step": 281382, "epoch": 1674} {"train_loss": -11.540003776550293, "global_step": 281383, "epoch": 1674} {"train_loss": -11.577927589416504, "global_step": 281384, "epoch": 1674} {"train_loss": -11.480123519897461, "global_step": 281385, "epoch": 1674} {"train_loss": -11.216625213623047, "global_step": 281386, "epoch": 1674} {"train_loss": -11.349461555480957, "global_step": 281387, "epoch": 1674} {"train_loss": -11.280782699584961, "global_step": 281388, "epoch": 1674} {"train_loss": -11.454133987426758, "global_step": 281389, "epoch": 1674} {"train_loss": -11.699891090393066, "global_step": 281390, "epoch": 1674} {"train_loss": -11.89174747467041, "global_step": 281391, "epoch": 1674} {"train_loss": -11.684135437011719, "global_step": 281392, "epoch": 1674} {"train_loss": -11.956602096557617, "global_step": 281393, "epoch": 1674} {"train_loss": -11.619686126708984, "global_step": 281394, "epoch": 1674} {"train_loss": -11.654058456420898, "global_step": 281395, "epoch": 1674} {"train_loss": -11.94349479675293, "global_step": 281396, "epoch": 1674} {"train_loss": -11.5819730758667, "global_step": 281397, "epoch": 1674} {"train_loss": -11.789678573608398, "global_step": 281398, "epoch": 1674} {"train_loss": -11.505334016822633, "global_step": 281399, "epoch": 1674, "val_loss": 272781.96875} {"train_loss": -11.952492713928223, "global_step": 281400, "epoch": 1675} {"train_loss": -11.528047561645508, "global_step": 281401, "epoch": 1675} {"train_loss": -12.010181427001953, "global_step": 281402, "epoch": 1675} {"train_loss": -11.561068534851074, "global_step": 281403, "epoch": 1675} {"train_loss": -11.860673904418945, "global_step": 281404, "epoch": 1675} {"train_loss": -11.633447647094727, "global_step": 281405, "epoch": 1675} {"train_loss": -12.058008193969727, "global_step": 281406, "epoch": 1675} {"train_loss": -11.699031829833984, "global_step": 281407, "epoch": 1675} {"train_loss": -11.75086784362793, "global_step": 281408, "epoch": 1675} {"train_loss": -12.121252059936523, "global_step": 281409, "epoch": 1675} {"train_loss": -11.799534797668457, "global_step": 281410, "epoch": 1675} {"train_loss": -12.020149230957031, "global_step": 281411, "epoch": 1675} {"train_loss": -11.769096374511719, "global_step": 281412, "epoch": 1675} {"train_loss": -12.010635375976562, "global_step": 281413, "epoch": 1675} {"train_loss": -11.860309600830078, "global_step": 281414, "epoch": 1675} {"train_loss": -11.994671821594238, "global_step": 281415, "epoch": 1675} {"train_loss": -11.976739883422852, "global_step": 281416, "epoch": 1675} {"train_loss": -12.074928283691406, "global_step": 281417, "epoch": 1675} {"train_loss": -12.129610061645508, "global_step": 281418, "epoch": 1675} {"train_loss": -12.123008728027344, "global_step": 281419, "epoch": 1675} {"train_loss": -12.158466339111328, "global_step": 281420, "epoch": 1675} {"train_loss": -12.06425666809082, "global_step": 281421, "epoch": 1675} {"train_loss": -12.062261581420898, "global_step": 281422, "epoch": 1675} {"train_loss": -12.062265396118164, "global_step": 281423, "epoch": 1675} {"train_loss": -11.981990814208984, "global_step": 281424, "epoch": 1675} {"train_loss": -11.830998420715332, "global_step": 281425, "epoch": 1675} {"train_loss": -12.210432052612305, "global_step": 281426, "epoch": 1675} {"train_loss": -12.041221618652344, "global_step": 281427, "epoch": 1675} {"train_loss": -12.318033218383789, "global_step": 281428, "epoch": 1675} {"train_loss": -12.088314056396484, "global_step": 281429, "epoch": 1675} {"train_loss": -12.325791358947754, "global_step": 281430, "epoch": 1675} {"train_loss": -12.28450870513916, "global_step": 281431, "epoch": 1675} {"train_loss": -12.158918380737305, "global_step": 281432, "epoch": 1675} {"train_loss": -12.22702693939209, "global_step": 281433, "epoch": 1675} {"train_loss": -12.410746574401855, "global_step": 281434, "epoch": 1675} {"train_loss": -11.931854248046875, "global_step": 281435, "epoch": 1675} {"train_loss": -12.059455871582031, "global_step": 281436, "epoch": 1675} {"train_loss": -12.313413619995117, "global_step": 281437, "epoch": 1675} {"train_loss": -12.482673645019531, "global_step": 281438, "epoch": 1675} {"train_loss": -12.261588096618652, "global_step": 281439, "epoch": 1675} {"train_loss": -12.114624977111816, "global_step": 281440, "epoch": 1675} {"train_loss": -11.961885452270508, "global_step": 281441, "epoch": 1675} {"train_loss": -11.992666244506836, "global_step": 281442, "epoch": 1675} {"train_loss": -12.274481773376465, "global_step": 281443, "epoch": 1675} {"train_loss": -12.235279083251953, "global_step": 281444, "epoch": 1675} {"train_loss": -12.284297943115234, "global_step": 281445, "epoch": 1675} {"train_loss": -12.034088134765625, "global_step": 281446, "epoch": 1675} {"train_loss": -11.935322761535645, "global_step": 281447, "epoch": 1675} {"train_loss": -11.950681686401367, "global_step": 281448, "epoch": 1675} {"train_loss": -11.654317855834961, "global_step": 281449, "epoch": 1675} {"train_loss": -12.188769340515137, "global_step": 281450, "epoch": 1675} {"train_loss": -11.699875831604004, "global_step": 281451, "epoch": 1675} {"train_loss": -11.105676651000977, "global_step": 281452, "epoch": 1675} {"train_loss": -11.275415420532227, "global_step": 281453, "epoch": 1675} {"train_loss": -11.086785316467285, "global_step": 281454, "epoch": 1675} {"train_loss": -11.591965675354004, "global_step": 281455, "epoch": 1675} {"train_loss": -10.917253494262695, "global_step": 281456, "epoch": 1675} {"train_loss": -10.946313858032227, "global_step": 281457, "epoch": 1675} {"train_loss": -11.34333610534668, "global_step": 281458, "epoch": 1675} {"train_loss": -11.2479887008667, "global_step": 281459, "epoch": 1675} {"train_loss": -10.76158618927002, "global_step": 281460, "epoch": 1675} {"train_loss": -10.834672927856445, "global_step": 281461, "epoch": 1675} {"train_loss": -11.80246353149414, "global_step": 281462, "epoch": 1675} {"train_loss": -10.028116226196289, "global_step": 281463, "epoch": 1675} {"train_loss": -11.27219009399414, "global_step": 281464, "epoch": 1675} {"train_loss": -10.86522388458252, "global_step": 281465, "epoch": 1675} {"train_loss": -11.355525970458984, "global_step": 281466, "epoch": 1675} {"train_loss": -10.558905601501465, "global_step": 281467, "epoch": 1675} {"train_loss": -10.7593355178833, "global_step": 281468, "epoch": 1675} {"train_loss": -10.98556137084961, "global_step": 281469, "epoch": 1675} {"train_loss": -11.011837005615234, "global_step": 281470, "epoch": 1675} {"train_loss": -10.941425323486328, "global_step": 281471, "epoch": 1675} {"train_loss": -11.193387031555176, "global_step": 281472, "epoch": 1675} {"train_loss": -9.784228324890137, "global_step": 281473, "epoch": 1675} {"train_loss": -10.110067367553711, "global_step": 281474, "epoch": 1675} {"train_loss": -10.664287567138672, "global_step": 281475, "epoch": 1675} {"train_loss": -10.478433609008789, "global_step": 281476, "epoch": 1675} {"train_loss": -9.670541763305664, "global_step": 281477, "epoch": 1675} {"train_loss": -10.489740371704102, "global_step": 281478, "epoch": 1675} {"train_loss": -11.027029037475586, "global_step": 281479, "epoch": 1675} {"train_loss": -11.172497749328613, "global_step": 281480, "epoch": 1675} {"train_loss": -10.823091506958008, "global_step": 281481, "epoch": 1675} {"train_loss": -11.289429664611816, "global_step": 281482, "epoch": 1675} {"train_loss": -10.760900497436523, "global_step": 281483, "epoch": 1675} {"train_loss": -11.676469802856445, "global_step": 281484, "epoch": 1675} {"train_loss": -10.301101684570312, "global_step": 281485, "epoch": 1675} {"train_loss": -11.537591934204102, "global_step": 281486, "epoch": 1675} {"train_loss": -11.325552940368652, "global_step": 281487, "epoch": 1675} {"train_loss": -11.628427505493164, "global_step": 281488, "epoch": 1675} {"train_loss": -10.36153793334961, "global_step": 281489, "epoch": 1675} {"train_loss": -11.658820152282715, "global_step": 281490, "epoch": 1675} {"train_loss": -10.209413528442383, "global_step": 281491, "epoch": 1675} {"train_loss": -11.426639556884766, "global_step": 281492, "epoch": 1675} {"train_loss": -11.023314476013184, "global_step": 281493, "epoch": 1675} {"train_loss": -11.83338451385498, "global_step": 281494, "epoch": 1675} {"train_loss": -11.587471961975098, "global_step": 281495, "epoch": 1675} {"train_loss": -11.7583589553833, "global_step": 281496, "epoch": 1675} {"train_loss": -11.692181587219238, "global_step": 281497, "epoch": 1675} {"train_loss": -11.685554504394531, "global_step": 281498, "epoch": 1675} {"train_loss": -11.368402481079102, "global_step": 281499, "epoch": 1675} {"train_loss": -11.817291259765625, "global_step": 281500, "epoch": 1675} {"train_loss": -11.714481353759766, "global_step": 281501, "epoch": 1675} {"train_loss": -11.660927772521973, "global_step": 281502, "epoch": 1675} {"train_loss": -11.716043472290039, "global_step": 281503, "epoch": 1675} {"train_loss": -11.827098846435547, "global_step": 281504, "epoch": 1675} {"train_loss": -11.767687797546387, "global_step": 281505, "epoch": 1675} {"train_loss": -11.857433319091797, "global_step": 281506, "epoch": 1675} {"train_loss": -11.948692321777344, "global_step": 281507, "epoch": 1675} {"train_loss": -11.78127384185791, "global_step": 281508, "epoch": 1675} {"train_loss": -11.949825286865234, "global_step": 281509, "epoch": 1675} {"train_loss": -11.920165061950684, "global_step": 281510, "epoch": 1675} {"train_loss": -11.817089080810547, "global_step": 281511, "epoch": 1675} {"train_loss": -12.115669250488281, "global_step": 281512, "epoch": 1675} {"train_loss": -12.039904594421387, "global_step": 281513, "epoch": 1675} {"train_loss": -11.99283218383789, "global_step": 281514, "epoch": 1675} {"train_loss": -12.052604675292969, "global_step": 281515, "epoch": 1675} {"train_loss": -12.180048942565918, "global_step": 281516, "epoch": 1675} {"train_loss": -12.081893920898438, "global_step": 281517, "epoch": 1675} {"train_loss": -12.267879486083984, "global_step": 281518, "epoch": 1675} {"train_loss": -12.144383430480957, "global_step": 281519, "epoch": 1675} {"train_loss": -11.917196273803711, "global_step": 281520, "epoch": 1675} {"train_loss": -11.961372375488281, "global_step": 281521, "epoch": 1675} {"train_loss": -11.847129821777344, "global_step": 281522, "epoch": 1675} {"train_loss": -12.161706924438477, "global_step": 281523, "epoch": 1675} {"train_loss": -11.942306518554688, "global_step": 281524, "epoch": 1675} {"train_loss": -12.082982063293457, "global_step": 281525, "epoch": 1675} {"train_loss": -12.253345489501953, "global_step": 281526, "epoch": 1675} {"train_loss": -12.079938888549805, "global_step": 281527, "epoch": 1675} {"train_loss": -12.161117553710938, "global_step": 281528, "epoch": 1675} {"train_loss": -12.15236759185791, "global_step": 281529, "epoch": 1675} {"train_loss": -12.22225570678711, "global_step": 281530, "epoch": 1675} {"train_loss": -12.222366333007812, "global_step": 281531, "epoch": 1675} {"train_loss": -12.135354042053223, "global_step": 281532, "epoch": 1675} {"train_loss": -12.334893226623535, "global_step": 281533, "epoch": 1675} {"train_loss": -12.24542236328125, "global_step": 281534, "epoch": 1675} {"train_loss": -12.314390182495117, "global_step": 281535, "epoch": 1675} {"train_loss": -11.896657943725586, "global_step": 281536, "epoch": 1675} {"train_loss": -12.39596939086914, "global_step": 281537, "epoch": 1675} {"train_loss": -11.996931076049805, "global_step": 281538, "epoch": 1675} {"train_loss": -12.353569030761719, "global_step": 281539, "epoch": 1675} {"train_loss": -11.958358764648438, "global_step": 281540, "epoch": 1675} {"train_loss": -12.098011016845703, "global_step": 281541, "epoch": 1675} {"train_loss": -12.098616600036621, "global_step": 281542, "epoch": 1675} {"train_loss": -12.314062118530273, "global_step": 281543, "epoch": 1675} {"train_loss": -12.237114906311035, "global_step": 281544, "epoch": 1675} {"train_loss": -12.094870567321777, "global_step": 281545, "epoch": 1675} {"train_loss": -12.187841415405273, "global_step": 281546, "epoch": 1675} {"train_loss": -12.197351455688477, "global_step": 281547, "epoch": 1675} {"train_loss": -12.340184211730957, "global_step": 281548, "epoch": 1675} {"train_loss": -12.24326229095459, "global_step": 281549, "epoch": 1675} {"train_loss": -12.05002212524414, "global_step": 281550, "epoch": 1675} {"train_loss": -12.25313663482666, "global_step": 281551, "epoch": 1675} {"train_loss": -11.975227355957031, "global_step": 281552, "epoch": 1675} {"train_loss": -12.092845916748047, "global_step": 281553, "epoch": 1675} {"train_loss": -11.771400451660156, "global_step": 281554, "epoch": 1675} {"train_loss": -12.139459609985352, "global_step": 281555, "epoch": 1675} {"train_loss": -11.765068054199219, "global_step": 281556, "epoch": 1675} {"train_loss": -11.980566024780273, "global_step": 281557, "epoch": 1675} {"train_loss": -11.56029987335205, "global_step": 281558, "epoch": 1675} {"train_loss": -12.223134994506836, "global_step": 281559, "epoch": 1675} {"train_loss": -11.805633544921875, "global_step": 281560, "epoch": 1675} {"train_loss": -12.158285140991211, "global_step": 281561, "epoch": 1675} {"train_loss": -12.182635307312012, "global_step": 281562, "epoch": 1675} {"train_loss": -12.171148300170898, "global_step": 281563, "epoch": 1675} {"train_loss": -11.327932357788086, "global_step": 281564, "epoch": 1675} {"train_loss": -11.079004287719727, "global_step": 281565, "epoch": 1675} {"train_loss": -11.6870698928833, "global_step": 281566, "epoch": 1675} {"train_loss": -11.731107093039013, "global_step": 281567, "epoch": 1675, "val_loss": 277526.25, "train_action_mse_error": 4.318631172180176} {"train_loss": -8.1865816116333, "global_step": 281568, "epoch": 1676} {"train_loss": -10.885141372680664, "global_step": 281569, "epoch": 1676} {"train_loss": -10.505404472351074, "global_step": 281570, "epoch": 1676} {"train_loss": -11.434247970581055, "global_step": 281571, "epoch": 1676} {"train_loss": -10.833452224731445, "global_step": 281572, "epoch": 1676} {"train_loss": -11.136407852172852, "global_step": 281573, "epoch": 1676} {"train_loss": -11.893407821655273, "global_step": 281574, "epoch": 1676} {"train_loss": -10.669851303100586, "global_step": 281575, "epoch": 1676} {"train_loss": -11.06631851196289, "global_step": 281576, "epoch": 1676} {"train_loss": -11.803906440734863, "global_step": 281577, "epoch": 1676} {"train_loss": -11.34763240814209, "global_step": 281578, "epoch": 1676} {"train_loss": -11.435464859008789, "global_step": 281579, "epoch": 1676} {"train_loss": -11.557680130004883, "global_step": 281580, "epoch": 1676} {"train_loss": -11.195741653442383, "global_step": 281581, "epoch": 1676} {"train_loss": -11.534360885620117, "global_step": 281582, "epoch": 1676} {"train_loss": -11.523534774780273, "global_step": 281583, "epoch": 1676} {"train_loss": -11.211155891418457, "global_step": 281584, "epoch": 1676} {"train_loss": -10.912628173828125, "global_step": 281585, "epoch": 1676} {"train_loss": -12.018336296081543, "global_step": 281586, "epoch": 1676} {"train_loss": -11.355600357055664, "global_step": 281587, "epoch": 1676} {"train_loss": -12.03387451171875, "global_step": 281588, "epoch": 1676} {"train_loss": -11.44980239868164, "global_step": 281589, "epoch": 1676} {"train_loss": -11.841489791870117, "global_step": 281590, "epoch": 1676} {"train_loss": -11.613655090332031, "global_step": 281591, "epoch": 1676} {"train_loss": -11.72400188446045, "global_step": 281592, "epoch": 1676} {"train_loss": -11.744324684143066, "global_step": 281593, "epoch": 1676} {"train_loss": -11.798932075500488, "global_step": 281594, "epoch": 1676} {"train_loss": -11.705666542053223, "global_step": 281595, "epoch": 1676} {"train_loss": -11.553205490112305, "global_step": 281596, "epoch": 1676} {"train_loss": -12.088957786560059, "global_step": 281597, "epoch": 1676} {"train_loss": -11.641773223876953, "global_step": 281598, "epoch": 1676} {"train_loss": -12.01047134399414, "global_step": 281599, "epoch": 1676} {"train_loss": -11.534219741821289, "global_step": 281600, "epoch": 1676} {"train_loss": -11.291049003601074, "global_step": 281601, "epoch": 1676} {"train_loss": -12.075665473937988, "global_step": 281602, "epoch": 1676} {"train_loss": -11.668006896972656, "global_step": 281603, "epoch": 1676} {"train_loss": -11.847549438476562, "global_step": 281604, "epoch": 1676} {"train_loss": -11.640409469604492, "global_step": 281605, "epoch": 1676} {"train_loss": -12.019035339355469, "global_step": 281606, "epoch": 1676} {"train_loss": -11.956510543823242, "global_step": 281607, "epoch": 1676} {"train_loss": -11.941648483276367, "global_step": 281608, "epoch": 1676} {"train_loss": -11.95763111114502, "global_step": 281609, "epoch": 1676} {"train_loss": -11.392939567565918, "global_step": 281610, "epoch": 1676} {"train_loss": -12.161564826965332, "global_step": 281611, "epoch": 1676} {"train_loss": -11.760997772216797, "global_step": 281612, "epoch": 1676} {"train_loss": -11.942683219909668, "global_step": 281613, "epoch": 1676} {"train_loss": -11.753963470458984, "global_step": 281614, "epoch": 1676} {"train_loss": -11.847272872924805, "global_step": 281615, "epoch": 1676} {"train_loss": -11.981042861938477, "global_step": 281616, "epoch": 1676} {"train_loss": -12.340372085571289, "global_step": 281617, "epoch": 1676} {"train_loss": -12.10814094543457, "global_step": 281618, "epoch": 1676} {"train_loss": -11.969420433044434, "global_step": 281619, "epoch": 1676} {"train_loss": -11.667030334472656, "global_step": 281620, "epoch": 1676} {"train_loss": -12.011844635009766, "global_step": 281621, "epoch": 1676} {"train_loss": -11.973526000976562, "global_step": 281622, "epoch": 1676} {"train_loss": -12.141141891479492, "global_step": 281623, "epoch": 1676} {"train_loss": -12.044435501098633, "global_step": 281624, "epoch": 1676} {"train_loss": -11.788076400756836, "global_step": 281625, "epoch": 1676} {"train_loss": -12.352534294128418, "global_step": 281626, "epoch": 1676} {"train_loss": -12.133543968200684, "global_step": 281627, "epoch": 1676} {"train_loss": -12.120964050292969, "global_step": 281628, "epoch": 1676} {"train_loss": -11.892102241516113, "global_step": 281629, "epoch": 1676} {"train_loss": -12.44097900390625, "global_step": 281630, "epoch": 1676} {"train_loss": -11.95583724975586, "global_step": 281631, "epoch": 1676} {"train_loss": -12.198957443237305, "global_step": 281632, "epoch": 1676} {"train_loss": -11.98689079284668, "global_step": 281633, "epoch": 1676} {"train_loss": -11.986083030700684, "global_step": 281634, "epoch": 1676} {"train_loss": -12.100115776062012, "global_step": 281635, "epoch": 1676} {"train_loss": -11.844358444213867, "global_step": 281636, "epoch": 1676} {"train_loss": -12.309786796569824, "global_step": 281637, "epoch": 1676} {"train_loss": -11.810302734375, "global_step": 281638, "epoch": 1676} {"train_loss": -12.05054759979248, "global_step": 281639, "epoch": 1676} {"train_loss": -12.214729309082031, "global_step": 281640, "epoch": 1676} {"train_loss": -11.958029747009277, "global_step": 281641, "epoch": 1676} {"train_loss": -12.033388137817383, "global_step": 281642, "epoch": 1676} {"train_loss": -11.959965705871582, "global_step": 281643, "epoch": 1676} {"train_loss": -12.309496879577637, "global_step": 281644, "epoch": 1676} {"train_loss": -12.289058685302734, "global_step": 281645, "epoch": 1676} {"train_loss": -12.082355499267578, "global_step": 281646, "epoch": 1676} {"train_loss": -12.526996612548828, "global_step": 281647, "epoch": 1676} {"train_loss": -12.105915069580078, "global_step": 281648, "epoch": 1676} {"train_loss": -12.1848783493042, "global_step": 281649, "epoch": 1676} {"train_loss": -12.451108932495117, "global_step": 281650, "epoch": 1676} {"train_loss": -12.08963680267334, "global_step": 281651, "epoch": 1676} {"train_loss": -11.980116844177246, "global_step": 281652, "epoch": 1676} {"train_loss": -12.021364212036133, "global_step": 281653, "epoch": 1676} {"train_loss": -12.185158729553223, "global_step": 281654, "epoch": 1676} {"train_loss": -12.055435180664062, "global_step": 281655, "epoch": 1676} {"train_loss": -12.186079978942871, "global_step": 281656, "epoch": 1676} {"train_loss": -12.134870529174805, "global_step": 281657, "epoch": 1676} {"train_loss": -12.16758918762207, "global_step": 281658, "epoch": 1676} {"train_loss": -12.07656478881836, "global_step": 281659, "epoch": 1676} {"train_loss": -11.956130981445312, "global_step": 281660, "epoch": 1676} {"train_loss": -12.379737854003906, "global_step": 281661, "epoch": 1676} {"train_loss": -12.09471321105957, "global_step": 281662, "epoch": 1676} {"train_loss": -12.08859634399414, "global_step": 281663, "epoch": 1676} {"train_loss": -12.276704788208008, "global_step": 281664, "epoch": 1676} {"train_loss": -12.037729263305664, "global_step": 281665, "epoch": 1676} {"train_loss": -12.238523483276367, "global_step": 281666, "epoch": 1676} {"train_loss": -12.153254508972168, "global_step": 281667, "epoch": 1676} {"train_loss": -11.805233001708984, "global_step": 281668, "epoch": 1676} {"train_loss": -12.341876983642578, "global_step": 281669, "epoch": 1676} {"train_loss": -11.598639488220215, "global_step": 281670, "epoch": 1676} {"train_loss": -10.912225723266602, "global_step": 281671, "epoch": 1676} {"train_loss": -11.571269035339355, "global_step": 281672, "epoch": 1676} {"train_loss": -10.65170669555664, "global_step": 281673, "epoch": 1676} {"train_loss": -11.009068489074707, "global_step": 281674, "epoch": 1676} {"train_loss": -11.667010307312012, "global_step": 281675, "epoch": 1676} {"train_loss": -11.27784252166748, "global_step": 281676, "epoch": 1676} {"train_loss": -11.174821853637695, "global_step": 281677, "epoch": 1676} {"train_loss": -11.3698091506958, "global_step": 281678, "epoch": 1676} {"train_loss": -11.610286712646484, "global_step": 281679, "epoch": 1676} {"train_loss": -11.377628326416016, "global_step": 281680, "epoch": 1676} {"train_loss": -11.259204864501953, "global_step": 281681, "epoch": 1676} {"train_loss": -10.7117919921875, "global_step": 281682, "epoch": 1676} {"train_loss": -11.171629905700684, "global_step": 281683, "epoch": 1676} {"train_loss": -11.053509712219238, "global_step": 281684, "epoch": 1676} {"train_loss": -11.634581565856934, "global_step": 281685, "epoch": 1676} {"train_loss": -11.438332557678223, "global_step": 281686, "epoch": 1676} {"train_loss": -11.410921096801758, "global_step": 281687, "epoch": 1676} {"train_loss": -11.724294662475586, "global_step": 281688, "epoch": 1676} {"train_loss": -10.381147384643555, "global_step": 281689, "epoch": 1676} {"train_loss": -11.393741607666016, "global_step": 281690, "epoch": 1676} {"train_loss": -12.166504859924316, "global_step": 281691, "epoch": 1676} {"train_loss": -11.707295417785645, "global_step": 281692, "epoch": 1676} {"train_loss": -11.889245986938477, "global_step": 281693, "epoch": 1676} {"train_loss": -11.820711135864258, "global_step": 281694, "epoch": 1676} {"train_loss": -11.54191780090332, "global_step": 281695, "epoch": 1676} {"train_loss": -12.047880172729492, "global_step": 281696, "epoch": 1676} {"train_loss": -11.574614524841309, "global_step": 281697, "epoch": 1676} {"train_loss": -12.19874382019043, "global_step": 281698, "epoch": 1676} {"train_loss": -11.99452018737793, "global_step": 281699, "epoch": 1676} {"train_loss": -12.080865859985352, "global_step": 281700, "epoch": 1676} {"train_loss": -12.048097610473633, "global_step": 281701, "epoch": 1676} {"train_loss": -11.833976745605469, "global_step": 281702, "epoch": 1676} {"train_loss": -11.91030502319336, "global_step": 281703, "epoch": 1676} {"train_loss": -11.325521469116211, "global_step": 281704, "epoch": 1676} {"train_loss": -12.023576736450195, "global_step": 281705, "epoch": 1676} {"train_loss": -11.63975715637207, "global_step": 281706, "epoch": 1676} {"train_loss": -11.958173751831055, "global_step": 281707, "epoch": 1676} {"train_loss": -11.630472183227539, "global_step": 281708, "epoch": 1676} {"train_loss": -11.58132553100586, "global_step": 281709, "epoch": 1676} {"train_loss": -11.776248931884766, "global_step": 281710, "epoch": 1676} {"train_loss": -11.339942932128906, "global_step": 281711, "epoch": 1676} {"train_loss": -12.018447875976562, "global_step": 281712, "epoch": 1676} {"train_loss": -10.733283996582031, "global_step": 281713, "epoch": 1676} {"train_loss": -11.806544303894043, "global_step": 281714, "epoch": 1676} {"train_loss": -11.84122371673584, "global_step": 281715, "epoch": 1676} {"train_loss": -11.686530113220215, "global_step": 281716, "epoch": 1676} {"train_loss": -11.551856994628906, "global_step": 281717, "epoch": 1676} {"train_loss": -12.224181175231934, "global_step": 281718, "epoch": 1676} {"train_loss": -11.449365615844727, "global_step": 281719, "epoch": 1676} {"train_loss": -11.814017295837402, "global_step": 281720, "epoch": 1676} {"train_loss": -11.93901252746582, "global_step": 281721, "epoch": 1676} {"train_loss": -11.847648620605469, "global_step": 281722, "epoch": 1676} {"train_loss": -12.072755813598633, "global_step": 281723, "epoch": 1676} {"train_loss": -10.855817794799805, "global_step": 281724, "epoch": 1676} {"train_loss": -11.355817794799805, "global_step": 281725, "epoch": 1676} {"train_loss": -11.699800491333008, "global_step": 281726, "epoch": 1676} {"train_loss": -11.035493850708008, "global_step": 281727, "epoch": 1676} {"train_loss": -11.091508865356445, "global_step": 281728, "epoch": 1676} {"train_loss": -11.83447265625, "global_step": 281729, "epoch": 1676} {"train_loss": -10.894920349121094, "global_step": 281730, "epoch": 1676} {"train_loss": -11.402135848999023, "global_step": 281731, "epoch": 1676} {"train_loss": -11.578788757324219, "global_step": 281732, "epoch": 1676} {"train_loss": -11.525896072387695, "global_step": 281733, "epoch": 1676} {"train_loss": -11.722942352294922, "global_step": 281734, "epoch": 1676} {"train_loss": -11.712577030772255, "global_step": 281735, "epoch": 1676, "val_loss": 277591.875} {"train_loss": -11.527701377868652, "global_step": 281736, "epoch": 1677} {"train_loss": -11.644472122192383, "global_step": 281737, "epoch": 1677} {"train_loss": -11.842159271240234, "global_step": 281738, "epoch": 1677} {"train_loss": -11.369220733642578, "global_step": 281739, "epoch": 1677} {"train_loss": -11.383434295654297, "global_step": 281740, "epoch": 1677} {"train_loss": -12.04080867767334, "global_step": 281741, "epoch": 1677} {"train_loss": -11.756853103637695, "global_step": 281742, "epoch": 1677} {"train_loss": -11.671436309814453, "global_step": 281743, "epoch": 1677} {"train_loss": -11.73108196258545, "global_step": 281744, "epoch": 1677} {"train_loss": -11.367618560791016, "global_step": 281745, "epoch": 1677} {"train_loss": -11.744205474853516, "global_step": 281746, "epoch": 1677} {"train_loss": -11.399486541748047, "global_step": 281747, "epoch": 1677} {"train_loss": -10.893189430236816, "global_step": 281748, "epoch": 1677} {"train_loss": -11.542407989501953, "global_step": 281749, "epoch": 1677} {"train_loss": -11.41549301147461, "global_step": 281750, "epoch": 1677} {"train_loss": -11.716781616210938, "global_step": 281751, "epoch": 1677} {"train_loss": -11.720026969909668, "global_step": 281752, "epoch": 1677} {"train_loss": -11.556161880493164, "global_step": 281753, "epoch": 1677} {"train_loss": -11.699329376220703, "global_step": 281754, "epoch": 1677} {"train_loss": -11.622086524963379, "global_step": 281755, "epoch": 1677} {"train_loss": -11.951615333557129, "global_step": 281756, "epoch": 1677} {"train_loss": -11.55886173248291, "global_step": 281757, "epoch": 1677} {"train_loss": -12.107479095458984, "global_step": 281758, "epoch": 1677} {"train_loss": -11.819835662841797, "global_step": 281759, "epoch": 1677} {"train_loss": -12.225364685058594, "global_step": 281760, "epoch": 1677} {"train_loss": -11.87186050415039, "global_step": 281761, "epoch": 1677} {"train_loss": -12.358949661254883, "global_step": 281762, "epoch": 1677} {"train_loss": -11.763801574707031, "global_step": 281763, "epoch": 1677} {"train_loss": -12.313972473144531, "global_step": 281764, "epoch": 1677} {"train_loss": -12.118829727172852, "global_step": 281765, "epoch": 1677} {"train_loss": -12.019573211669922, "global_step": 281766, "epoch": 1677} {"train_loss": -12.318313598632812, "global_step": 281767, "epoch": 1677} {"train_loss": -12.231781005859375, "global_step": 281768, "epoch": 1677} {"train_loss": -12.366250038146973, "global_step": 281769, "epoch": 1677} {"train_loss": -12.154966354370117, "global_step": 281770, "epoch": 1677} {"train_loss": -12.083620071411133, "global_step": 281771, "epoch": 1677} {"train_loss": -11.909900665283203, "global_step": 281772, "epoch": 1677} {"train_loss": -12.2573881149292, "global_step": 281773, "epoch": 1677} {"train_loss": -12.101276397705078, "global_step": 281774, "epoch": 1677} {"train_loss": -12.12639045715332, "global_step": 281775, "epoch": 1677} {"train_loss": -12.318588256835938, "global_step": 281776, "epoch": 1677} {"train_loss": -12.119123458862305, "global_step": 281777, "epoch": 1677} {"train_loss": -12.26046085357666, "global_step": 281778, "epoch": 1677} {"train_loss": -11.97095775604248, "global_step": 281779, "epoch": 1677} {"train_loss": -12.053616523742676, "global_step": 281780, "epoch": 1677} {"train_loss": -11.839862823486328, "global_step": 281781, "epoch": 1677} {"train_loss": -12.041349411010742, "global_step": 281782, "epoch": 1677} {"train_loss": -12.33144760131836, "global_step": 281783, "epoch": 1677} {"train_loss": -12.035408973693848, "global_step": 281784, "epoch": 1677} {"train_loss": -12.112574577331543, "global_step": 281785, "epoch": 1677} {"train_loss": -12.086918830871582, "global_step": 281786, "epoch": 1677} {"train_loss": -11.570725440979004, "global_step": 281787, "epoch": 1677} {"train_loss": -11.780562400817871, "global_step": 281788, "epoch": 1677} {"train_loss": -12.20478630065918, "global_step": 281789, "epoch": 1677} {"train_loss": -11.660045623779297, "global_step": 281790, "epoch": 1677} {"train_loss": -11.541038513183594, "global_step": 281791, "epoch": 1677} {"train_loss": -11.893875122070312, "global_step": 281792, "epoch": 1677} {"train_loss": -11.97568130493164, "global_step": 281793, "epoch": 1677} {"train_loss": -11.551311492919922, "global_step": 281794, "epoch": 1677} {"train_loss": -12.263214111328125, "global_step": 281795, "epoch": 1677} {"train_loss": -12.253414154052734, "global_step": 281796, "epoch": 1677} {"train_loss": -12.215668678283691, "global_step": 281797, "epoch": 1677} {"train_loss": -12.307119369506836, "global_step": 281798, "epoch": 1677} {"train_loss": -12.424453735351562, "global_step": 281799, "epoch": 1677} {"train_loss": -12.139944076538086, "global_step": 281800, "epoch": 1677} {"train_loss": -12.249649047851562, "global_step": 281801, "epoch": 1677} {"train_loss": -12.292627334594727, "global_step": 281802, "epoch": 1677} {"train_loss": -11.804999351501465, "global_step": 281803, "epoch": 1677} {"train_loss": -12.275094985961914, "global_step": 281804, "epoch": 1677} {"train_loss": -12.013761520385742, "global_step": 281805, "epoch": 1677} {"train_loss": -12.275240898132324, "global_step": 281806, "epoch": 1677} {"train_loss": -12.086370468139648, "global_step": 281807, "epoch": 1677} {"train_loss": -12.266498565673828, "global_step": 281808, "epoch": 1677} {"train_loss": -11.72885799407959, "global_step": 281809, "epoch": 1677} {"train_loss": -12.411306381225586, "global_step": 281810, "epoch": 1677} {"train_loss": -12.005546569824219, "global_step": 281811, "epoch": 1677} {"train_loss": -11.6776123046875, "global_step": 281812, "epoch": 1677} {"train_loss": -11.806598663330078, "global_step": 281813, "epoch": 1677} {"train_loss": -12.262483596801758, "global_step": 281814, "epoch": 1677} {"train_loss": -11.122905731201172, "global_step": 281815, "epoch": 1677} {"train_loss": -10.969581604003906, "global_step": 281816, "epoch": 1677} {"train_loss": -12.108777046203613, "global_step": 281817, "epoch": 1677} {"train_loss": -11.264486312866211, "global_step": 281818, "epoch": 1677} {"train_loss": -12.087636947631836, "global_step": 281819, "epoch": 1677} {"train_loss": -11.882728576660156, "global_step": 281820, "epoch": 1677} {"train_loss": -12.162178039550781, "global_step": 281821, "epoch": 1677} {"train_loss": -11.676273345947266, "global_step": 281822, "epoch": 1677} {"train_loss": -12.157441139221191, "global_step": 281823, "epoch": 1677} {"train_loss": -11.900997161865234, "global_step": 281824, "epoch": 1677} {"train_loss": -12.311817169189453, "global_step": 281825, "epoch": 1677} {"train_loss": -12.108768463134766, "global_step": 281826, "epoch": 1677} {"train_loss": -11.911741256713867, "global_step": 281827, "epoch": 1677} {"train_loss": -11.598494529724121, "global_step": 281828, "epoch": 1677} {"train_loss": -11.599211692810059, "global_step": 281829, "epoch": 1677} {"train_loss": -11.443743705749512, "global_step": 281830, "epoch": 1677} {"train_loss": -12.101686477661133, "global_step": 281831, "epoch": 1677} {"train_loss": -11.565942764282227, "global_step": 281832, "epoch": 1677} {"train_loss": -11.876110076904297, "global_step": 281833, "epoch": 1677} {"train_loss": -11.571611404418945, "global_step": 281834, "epoch": 1677} {"train_loss": -10.93787956237793, "global_step": 281835, "epoch": 1677} {"train_loss": -11.978158950805664, "global_step": 281836, "epoch": 1677} {"train_loss": -10.805072784423828, "global_step": 281837, "epoch": 1677} {"train_loss": -11.095714569091797, "global_step": 281838, "epoch": 1677} {"train_loss": -11.902803421020508, "global_step": 281839, "epoch": 1677} {"train_loss": -11.021787643432617, "global_step": 281840, "epoch": 1677} {"train_loss": -10.881132125854492, "global_step": 281841, "epoch": 1677} {"train_loss": -12.2108154296875, "global_step": 281842, "epoch": 1677} {"train_loss": -11.62048625946045, "global_step": 281843, "epoch": 1677} {"train_loss": -11.876852035522461, "global_step": 281844, "epoch": 1677} {"train_loss": -11.699247360229492, "global_step": 281845, "epoch": 1677} {"train_loss": -11.700769424438477, "global_step": 281846, "epoch": 1677} {"train_loss": -11.496429443359375, "global_step": 281847, "epoch": 1677} {"train_loss": -11.272255897521973, "global_step": 281848, "epoch": 1677} {"train_loss": -11.555169105529785, "global_step": 281849, "epoch": 1677} {"train_loss": -10.957728385925293, "global_step": 281850, "epoch": 1677} {"train_loss": -10.245097160339355, "global_step": 281851, "epoch": 1677} {"train_loss": -10.036384582519531, "global_step": 281852, "epoch": 1677} {"train_loss": -10.507617950439453, "global_step": 281853, "epoch": 1677} {"train_loss": -10.200273513793945, "global_step": 281854, "epoch": 1677} {"train_loss": -9.84050178527832, "global_step": 281855, "epoch": 1677} {"train_loss": -11.275069236755371, "global_step": 281856, "epoch": 1677} {"train_loss": -10.923562049865723, "global_step": 281857, "epoch": 1677} {"train_loss": -11.51118278503418, "global_step": 281858, "epoch": 1677} {"train_loss": -10.80489444732666, "global_step": 281859, "epoch": 1677} {"train_loss": -11.632596969604492, "global_step": 281860, "epoch": 1677} {"train_loss": -11.391561508178711, "global_step": 281861, "epoch": 1677} {"train_loss": -11.948709487915039, "global_step": 281862, "epoch": 1677} {"train_loss": -10.751220703125, "global_step": 281863, "epoch": 1677} {"train_loss": -11.092355728149414, "global_step": 281864, "epoch": 1677} {"train_loss": -11.339529991149902, "global_step": 281865, "epoch": 1677} {"train_loss": -11.843541145324707, "global_step": 281866, "epoch": 1677} {"train_loss": -11.405628204345703, "global_step": 281867, "epoch": 1677} {"train_loss": -11.04892349243164, "global_step": 281868, "epoch": 1677} {"train_loss": -11.38926887512207, "global_step": 281869, "epoch": 1677} {"train_loss": -11.431357383728027, "global_step": 281870, "epoch": 1677} {"train_loss": -11.918787956237793, "global_step": 281871, "epoch": 1677} {"train_loss": -11.425214767456055, "global_step": 281872, "epoch": 1677} {"train_loss": -12.000415802001953, "global_step": 281873, "epoch": 1677} {"train_loss": -11.291231155395508, "global_step": 281874, "epoch": 1677} {"train_loss": -11.823699951171875, "global_step": 281875, "epoch": 1677} {"train_loss": -11.72679615020752, "global_step": 281876, "epoch": 1677} {"train_loss": -11.688959121704102, "global_step": 281877, "epoch": 1677} {"train_loss": -11.95279598236084, "global_step": 281878, "epoch": 1677} {"train_loss": -11.692119598388672, "global_step": 281879, "epoch": 1677} {"train_loss": -11.632671356201172, "global_step": 281880, "epoch": 1677} {"train_loss": -11.611161231994629, "global_step": 281881, "epoch": 1677} {"train_loss": -11.513566970825195, "global_step": 281882, "epoch": 1677} {"train_loss": -11.839523315429688, "global_step": 281883, "epoch": 1677} {"train_loss": -11.597479820251465, "global_step": 281884, "epoch": 1677} {"train_loss": -11.788650512695312, "global_step": 281885, "epoch": 1677} {"train_loss": -11.725614547729492, "global_step": 281886, "epoch": 1677} {"train_loss": -12.005359649658203, "global_step": 281887, "epoch": 1677} {"train_loss": -11.773365020751953, "global_step": 281888, "epoch": 1677} {"train_loss": -12.023263931274414, "global_step": 281889, "epoch": 1677} {"train_loss": -11.823832511901855, "global_step": 281890, "epoch": 1677} {"train_loss": -11.843509674072266, "global_step": 281891, "epoch": 1677} {"train_loss": -11.735485076904297, "global_step": 281892, "epoch": 1677} {"train_loss": -12.000706672668457, "global_step": 281893, "epoch": 1677} {"train_loss": -12.068408966064453, "global_step": 281894, "epoch": 1677} {"train_loss": -12.029211044311523, "global_step": 281895, "epoch": 1677} {"train_loss": -12.10883903503418, "global_step": 281896, "epoch": 1677} {"train_loss": -11.773704528808594, "global_step": 281897, "epoch": 1677} {"train_loss": -12.342445373535156, "global_step": 281898, "epoch": 1677} {"train_loss": -11.861209869384766, "global_step": 281899, "epoch": 1677} {"train_loss": -12.062819480895996, "global_step": 281900, "epoch": 1677} {"train_loss": -12.231744766235352, "global_step": 281901, "epoch": 1677} {"train_loss": -12.127067565917969, "global_step": 281902, "epoch": 1677} {"train_loss": -11.748535491171337, "global_step": 281903, "epoch": 1677, "val_loss": 277042.5} {"train_loss": -12.160387992858887, "global_step": 281904, "epoch": 1678} {"train_loss": -12.211366653442383, "global_step": 281905, "epoch": 1678} {"train_loss": -12.205927848815918, "global_step": 281906, "epoch": 1678} {"train_loss": -12.114785194396973, "global_step": 281907, "epoch": 1678} {"train_loss": -12.132951736450195, "global_step": 281908, "epoch": 1678} {"train_loss": -12.192035675048828, "global_step": 281909, "epoch": 1678} {"train_loss": -12.359832763671875, "global_step": 281910, "epoch": 1678} {"train_loss": -12.246591567993164, "global_step": 281911, "epoch": 1678} {"train_loss": -12.210758209228516, "global_step": 281912, "epoch": 1678} {"train_loss": -12.225391387939453, "global_step": 281913, "epoch": 1678} {"train_loss": -11.978934288024902, "global_step": 281914, "epoch": 1678} {"train_loss": -12.113411903381348, "global_step": 281915, "epoch": 1678} {"train_loss": -12.432323455810547, "global_step": 281916, "epoch": 1678} {"train_loss": -12.24245834350586, "global_step": 281917, "epoch": 1678} {"train_loss": -12.290349006652832, "global_step": 281918, "epoch": 1678} {"train_loss": -12.18023681640625, "global_step": 281919, "epoch": 1678} {"train_loss": -12.405251502990723, "global_step": 281920, "epoch": 1678} {"train_loss": -12.26901626586914, "global_step": 281921, "epoch": 1678} {"train_loss": -12.25326156616211, "global_step": 281922, "epoch": 1678} {"train_loss": -12.293883323669434, "global_step": 281923, "epoch": 1678} {"train_loss": -12.23942756652832, "global_step": 281924, "epoch": 1678} {"train_loss": -12.397140502929688, "global_step": 281925, "epoch": 1678} {"train_loss": -12.342967987060547, "global_step": 281926, "epoch": 1678} {"train_loss": -12.352075576782227, "global_step": 281927, "epoch": 1678} {"train_loss": -12.381893157958984, "global_step": 281928, "epoch": 1678} {"train_loss": -12.151360511779785, "global_step": 281929, "epoch": 1678} {"train_loss": -12.178726196289062, "global_step": 281930, "epoch": 1678} {"train_loss": -12.347480773925781, "global_step": 281931, "epoch": 1678} {"train_loss": -12.318414688110352, "global_step": 281932, "epoch": 1678} {"train_loss": -12.170500755310059, "global_step": 281933, "epoch": 1678} {"train_loss": -12.468263626098633, "global_step": 281934, "epoch": 1678} {"train_loss": -12.266014099121094, "global_step": 281935, "epoch": 1678} {"train_loss": -12.369014739990234, "global_step": 281936, "epoch": 1678} {"train_loss": -12.215619087219238, "global_step": 281937, "epoch": 1678} {"train_loss": -12.132712364196777, "global_step": 281938, "epoch": 1678} {"train_loss": -12.008031845092773, "global_step": 281939, "epoch": 1678} {"train_loss": -11.613543510437012, "global_step": 281940, "epoch": 1678} {"train_loss": -11.66175651550293, "global_step": 281941, "epoch": 1678} {"train_loss": -12.380655288696289, "global_step": 281942, "epoch": 1678} {"train_loss": -11.878887176513672, "global_step": 281943, "epoch": 1678} {"train_loss": -11.14996337890625, "global_step": 281944, "epoch": 1678} {"train_loss": -11.72279167175293, "global_step": 281945, "epoch": 1678} {"train_loss": -11.606966018676758, "global_step": 281946, "epoch": 1678} {"train_loss": -11.499943733215332, "global_step": 281947, "epoch": 1678} {"train_loss": -11.970905303955078, "global_step": 281948, "epoch": 1678} {"train_loss": -11.167341232299805, "global_step": 281949, "epoch": 1678} {"train_loss": -11.128172874450684, "global_step": 281950, "epoch": 1678} {"train_loss": -11.862005233764648, "global_step": 281951, "epoch": 1678} {"train_loss": -11.405675888061523, "global_step": 281952, "epoch": 1678} {"train_loss": -10.990581512451172, "global_step": 281953, "epoch": 1678} {"train_loss": -10.908668518066406, "global_step": 281954, "epoch": 1678} {"train_loss": -10.867887496948242, "global_step": 281955, "epoch": 1678} {"train_loss": -11.020587921142578, "global_step": 281956, "epoch": 1678} {"train_loss": -11.28281307220459, "global_step": 281957, "epoch": 1678} {"train_loss": -10.824552536010742, "global_step": 281958, "epoch": 1678} {"train_loss": -11.933218002319336, "global_step": 281959, "epoch": 1678} {"train_loss": -11.405586242675781, "global_step": 281960, "epoch": 1678} {"train_loss": -11.304407119750977, "global_step": 281961, "epoch": 1678} {"train_loss": -11.302620887756348, "global_step": 281962, "epoch": 1678} {"train_loss": -11.18923568725586, "global_step": 281963, "epoch": 1678} {"train_loss": -11.488175392150879, "global_step": 281964, "epoch": 1678} {"train_loss": -11.858026504516602, "global_step": 281965, "epoch": 1678} {"train_loss": -11.204517364501953, "global_step": 281966, "epoch": 1678} {"train_loss": -11.649663925170898, "global_step": 281967, "epoch": 1678} {"train_loss": -10.887313842773438, "global_step": 281968, "epoch": 1678} {"train_loss": -10.581295013427734, "global_step": 281969, "epoch": 1678} {"train_loss": -11.241888046264648, "global_step": 281970, "epoch": 1678} {"train_loss": -9.638683319091797, "global_step": 281971, "epoch": 1678} {"train_loss": -11.471717834472656, "global_step": 281972, "epoch": 1678} {"train_loss": -10.39969539642334, "global_step": 281973, "epoch": 1678} {"train_loss": -11.02958869934082, "global_step": 281974, "epoch": 1678} {"train_loss": -10.475776672363281, "global_step": 281975, "epoch": 1678} {"train_loss": -11.398494720458984, "global_step": 281976, "epoch": 1678} {"train_loss": -10.608898162841797, "global_step": 281977, "epoch": 1678} {"train_loss": -11.73499584197998, "global_step": 281978, "epoch": 1678} {"train_loss": -10.774129867553711, "global_step": 281979, "epoch": 1678} {"train_loss": -11.517302513122559, "global_step": 281980, "epoch": 1678} {"train_loss": -10.859824180603027, "global_step": 281981, "epoch": 1678} {"train_loss": -11.09217643737793, "global_step": 281982, "epoch": 1678} {"train_loss": -10.831001281738281, "global_step": 281983, "epoch": 1678} {"train_loss": -11.180830955505371, "global_step": 281984, "epoch": 1678} {"train_loss": -11.590789794921875, "global_step": 281985, "epoch": 1678} {"train_loss": -11.305215835571289, "global_step": 281986, "epoch": 1678} {"train_loss": -11.568224906921387, "global_step": 281987, "epoch": 1678} {"train_loss": -11.459177017211914, "global_step": 281988, "epoch": 1678} {"train_loss": -11.778390884399414, "global_step": 281989, "epoch": 1678} {"train_loss": -11.387859344482422, "global_step": 281990, "epoch": 1678} {"train_loss": -11.700281143188477, "global_step": 281991, "epoch": 1678} {"train_loss": -11.507027626037598, "global_step": 281992, "epoch": 1678} {"train_loss": -11.697186470031738, "global_step": 281993, "epoch": 1678} {"train_loss": -11.623552322387695, "global_step": 281994, "epoch": 1678} {"train_loss": -11.911703109741211, "global_step": 281995, "epoch": 1678} {"train_loss": -11.114516258239746, "global_step": 281996, "epoch": 1678} {"train_loss": -12.089082717895508, "global_step": 281997, "epoch": 1678} {"train_loss": -11.047941207885742, "global_step": 281998, "epoch": 1678} {"train_loss": -11.388900756835938, "global_step": 281999, "epoch": 1678} {"train_loss": -11.668088912963867, "global_step": 282000, "epoch": 1678} {"train_loss": -11.460502624511719, "global_step": 282001, "epoch": 1678} {"train_loss": -11.612115859985352, "global_step": 282002, "epoch": 1678} {"train_loss": -11.700996398925781, "global_step": 282003, "epoch": 1678} {"train_loss": -11.78819465637207, "global_step": 282004, "epoch": 1678} {"train_loss": -12.068384170532227, "global_step": 282005, "epoch": 1678} {"train_loss": -11.545772552490234, "global_step": 282006, "epoch": 1678} {"train_loss": -11.734428405761719, "global_step": 282007, "epoch": 1678} {"train_loss": -12.108107566833496, "global_step": 282008, "epoch": 1678} {"train_loss": -11.762510299682617, "global_step": 282009, "epoch": 1678} {"train_loss": -11.984062194824219, "global_step": 282010, "epoch": 1678} {"train_loss": -11.63960075378418, "global_step": 282011, "epoch": 1678} {"train_loss": -11.719070434570312, "global_step": 282012, "epoch": 1678} {"train_loss": -11.99686050415039, "global_step": 282013, "epoch": 1678} {"train_loss": -11.615987777709961, "global_step": 282014, "epoch": 1678} {"train_loss": -12.031184196472168, "global_step": 282015, "epoch": 1678} {"train_loss": -11.519039154052734, "global_step": 282016, "epoch": 1678} {"train_loss": -11.840902328491211, "global_step": 282017, "epoch": 1678} {"train_loss": -11.717925071716309, "global_step": 282018, "epoch": 1678} {"train_loss": -11.914234161376953, "global_step": 282019, "epoch": 1678} {"train_loss": -11.822998046875, "global_step": 282020, "epoch": 1678} {"train_loss": -11.730127334594727, "global_step": 282021, "epoch": 1678} {"train_loss": -11.932561874389648, "global_step": 282022, "epoch": 1678} {"train_loss": -11.812950134277344, "global_step": 282023, "epoch": 1678} {"train_loss": -12.040122985839844, "global_step": 282024, "epoch": 1678} {"train_loss": -11.724979400634766, "global_step": 282025, "epoch": 1678} {"train_loss": -11.274579048156738, "global_step": 282026, "epoch": 1678} {"train_loss": -11.95742130279541, "global_step": 282027, "epoch": 1678} {"train_loss": -11.402975082397461, "global_step": 282028, "epoch": 1678} {"train_loss": -11.557662963867188, "global_step": 282029, "epoch": 1678} {"train_loss": -11.546930313110352, "global_step": 282030, "epoch": 1678} {"train_loss": -10.646759033203125, "global_step": 282031, "epoch": 1678} {"train_loss": -11.929424285888672, "global_step": 282032, "epoch": 1678} {"train_loss": -11.329715728759766, "global_step": 282033, "epoch": 1678} {"train_loss": -11.954084396362305, "global_step": 282034, "epoch": 1678} {"train_loss": -11.782449722290039, "global_step": 282035, "epoch": 1678} {"train_loss": -11.629509925842285, "global_step": 282036, "epoch": 1678} {"train_loss": -12.046934127807617, "global_step": 282037, "epoch": 1678} {"train_loss": -11.462088584899902, "global_step": 282038, "epoch": 1678} {"train_loss": -12.225542068481445, "global_step": 282039, "epoch": 1678} {"train_loss": -11.32451343536377, "global_step": 282040, "epoch": 1678} {"train_loss": -10.897518157958984, "global_step": 282041, "epoch": 1678} {"train_loss": -11.737913131713867, "global_step": 282042, "epoch": 1678} {"train_loss": -10.735576629638672, "global_step": 282043, "epoch": 1678} {"train_loss": -11.766721725463867, "global_step": 282044, "epoch": 1678} {"train_loss": -11.431745529174805, "global_step": 282045, "epoch": 1678} {"train_loss": -11.782867431640625, "global_step": 282046, "epoch": 1678} {"train_loss": -11.937570571899414, "global_step": 282047, "epoch": 1678} {"train_loss": -11.772068977355957, "global_step": 282048, "epoch": 1678} {"train_loss": -12.206086158752441, "global_step": 282049, "epoch": 1678} {"train_loss": -11.176132202148438, "global_step": 282050, "epoch": 1678} {"train_loss": -11.73278522491455, "global_step": 282051, "epoch": 1678} {"train_loss": -11.871076583862305, "global_step": 282052, "epoch": 1678} {"train_loss": -11.539999008178711, "global_step": 282053, "epoch": 1678} {"train_loss": -11.906229019165039, "global_step": 282054, "epoch": 1678} {"train_loss": -11.822989463806152, "global_step": 282055, "epoch": 1678} {"train_loss": -12.034795761108398, "global_step": 282056, "epoch": 1678} {"train_loss": -11.797113418579102, "global_step": 282057, "epoch": 1678} {"train_loss": -11.86110782623291, "global_step": 282058, "epoch": 1678} {"train_loss": -12.229705810546875, "global_step": 282059, "epoch": 1678} {"train_loss": -12.123346328735352, "global_step": 282060, "epoch": 1678} {"train_loss": -11.921022415161133, "global_step": 282061, "epoch": 1678} {"train_loss": -11.959199905395508, "global_step": 282062, "epoch": 1678} {"train_loss": -12.334417343139648, "global_step": 282063, "epoch": 1678} {"train_loss": -11.868398666381836, "global_step": 282064, "epoch": 1678} {"train_loss": -12.22502326965332, "global_step": 282065, "epoch": 1678} {"train_loss": -12.253923416137695, "global_step": 282066, "epoch": 1678} {"train_loss": -12.117719650268555, "global_step": 282067, "epoch": 1678} {"train_loss": -11.921863555908203, "global_step": 282068, "epoch": 1678} {"train_loss": -12.139358520507812, "global_step": 282069, "epoch": 1678} {"train_loss": -12.13252067565918, "global_step": 282070, "epoch": 1678} {"train_loss": -11.714856584866842, "global_step": 282071, "epoch": 1678, "val_loss": 277816.40625} {"train_loss": -12.172160148620605, "global_step": 282072, "epoch": 1679} {"train_loss": -12.243700981140137, "global_step": 282073, "epoch": 1679} {"train_loss": -12.173954010009766, "global_step": 282074, "epoch": 1679} {"train_loss": -12.123307228088379, "global_step": 282075, "epoch": 1679} {"train_loss": -12.290075302124023, "global_step": 282076, "epoch": 1679} {"train_loss": -12.29751205444336, "global_step": 282077, "epoch": 1679} {"train_loss": -12.190485000610352, "global_step": 282078, "epoch": 1679} {"train_loss": -11.770793914794922, "global_step": 282079, "epoch": 1679} {"train_loss": -12.302624702453613, "global_step": 282080, "epoch": 1679} {"train_loss": -11.523942947387695, "global_step": 282081, "epoch": 1679} {"train_loss": -11.906874656677246, "global_step": 282082, "epoch": 1679} {"train_loss": -12.24471378326416, "global_step": 282083, "epoch": 1679} {"train_loss": -11.78122615814209, "global_step": 282084, "epoch": 1679} {"train_loss": -12.217222213745117, "global_step": 282085, "epoch": 1679} {"train_loss": -11.927678108215332, "global_step": 282086, "epoch": 1679} {"train_loss": -11.309704780578613, "global_step": 282087, "epoch": 1679} {"train_loss": -12.009082794189453, "global_step": 282088, "epoch": 1679} {"train_loss": -11.58441162109375, "global_step": 282089, "epoch": 1679} {"train_loss": -11.639341354370117, "global_step": 282090, "epoch": 1679} {"train_loss": -12.071542739868164, "global_step": 282091, "epoch": 1679} {"train_loss": -11.171011924743652, "global_step": 282092, "epoch": 1679} {"train_loss": -12.307886123657227, "global_step": 282093, "epoch": 1679} {"train_loss": -10.615985870361328, "global_step": 282094, "epoch": 1679} {"train_loss": -11.579378128051758, "global_step": 282095, "epoch": 1679} {"train_loss": -11.86384105682373, "global_step": 282096, "epoch": 1679} {"train_loss": -10.634294509887695, "global_step": 282097, "epoch": 1679} {"train_loss": -12.022499084472656, "global_step": 282098, "epoch": 1679} {"train_loss": -10.640787124633789, "global_step": 282099, "epoch": 1679} {"train_loss": -11.227804183959961, "global_step": 282100, "epoch": 1679} {"train_loss": -11.551393508911133, "global_step": 282101, "epoch": 1679} {"train_loss": -11.02125358581543, "global_step": 282102, "epoch": 1679} {"train_loss": -11.507220268249512, "global_step": 282103, "epoch": 1679} {"train_loss": -10.768219947814941, "global_step": 282104, "epoch": 1679} {"train_loss": -11.706327438354492, "global_step": 282105, "epoch": 1679} {"train_loss": -11.843714714050293, "global_step": 282106, "epoch": 1679} {"train_loss": -11.646629333496094, "global_step": 282107, "epoch": 1679} {"train_loss": -11.682243347167969, "global_step": 282108, "epoch": 1679} {"train_loss": -11.592877388000488, "global_step": 282109, "epoch": 1679} {"train_loss": -11.35655689239502, "global_step": 282110, "epoch": 1679} {"train_loss": -11.643716812133789, "global_step": 282111, "epoch": 1679} {"train_loss": -11.482610702514648, "global_step": 282112, "epoch": 1679} {"train_loss": -12.067276000976562, "global_step": 282113, "epoch": 1679} {"train_loss": -11.246450424194336, "global_step": 282114, "epoch": 1679} {"train_loss": -11.723509788513184, "global_step": 282115, "epoch": 1679} {"train_loss": -11.90428352355957, "global_step": 282116, "epoch": 1679} {"train_loss": -11.588285446166992, "global_step": 282117, "epoch": 1679} {"train_loss": -11.968055725097656, "global_step": 282118, "epoch": 1679} {"train_loss": -11.683891296386719, "global_step": 282119, "epoch": 1679} {"train_loss": -11.280489921569824, "global_step": 282120, "epoch": 1679} {"train_loss": -11.851760864257812, "global_step": 282121, "epoch": 1679} {"train_loss": -11.770633697509766, "global_step": 282122, "epoch": 1679} {"train_loss": -10.505311965942383, "global_step": 282123, "epoch": 1679} {"train_loss": -11.0908203125, "global_step": 282124, "epoch": 1679} {"train_loss": -10.666095733642578, "global_step": 282125, "epoch": 1679} {"train_loss": -11.345931053161621, "global_step": 282126, "epoch": 1679} {"train_loss": -10.925660133361816, "global_step": 282127, "epoch": 1679} {"train_loss": -11.12069034576416, "global_step": 282128, "epoch": 1679} {"train_loss": -11.212386131286621, "global_step": 282129, "epoch": 1679} {"train_loss": -11.315836906433105, "global_step": 282130, "epoch": 1679} {"train_loss": -11.331517219543457, "global_step": 282131, "epoch": 1679} {"train_loss": -11.334493637084961, "global_step": 282132, "epoch": 1679} {"train_loss": -11.658409118652344, "global_step": 282133, "epoch": 1679} {"train_loss": -11.32373332977295, "global_step": 282134, "epoch": 1679} {"train_loss": -10.857986450195312, "global_step": 282135, "epoch": 1679} {"train_loss": -10.90715503692627, "global_step": 282136, "epoch": 1679} {"train_loss": -10.621855735778809, "global_step": 282137, "epoch": 1679} {"train_loss": -11.571562767028809, "global_step": 282138, "epoch": 1679} {"train_loss": -11.210721969604492, "global_step": 282139, "epoch": 1679} {"train_loss": -11.826462745666504, "global_step": 282140, "epoch": 1679} {"train_loss": -11.729345321655273, "global_step": 282141, "epoch": 1679} {"train_loss": -11.43960189819336, "global_step": 282142, "epoch": 1679} {"train_loss": -11.438295364379883, "global_step": 282143, "epoch": 1679} {"train_loss": -11.267557144165039, "global_step": 282144, "epoch": 1679} {"train_loss": -11.292338371276855, "global_step": 282145, "epoch": 1679} {"train_loss": -11.597698211669922, "global_step": 282146, "epoch": 1679} {"train_loss": -11.235601425170898, "global_step": 282147, "epoch": 1679} {"train_loss": -11.52488899230957, "global_step": 282148, "epoch": 1679} {"train_loss": -11.132293701171875, "global_step": 282149, "epoch": 1679} {"train_loss": -11.584341049194336, "global_step": 282150, "epoch": 1679} {"train_loss": -11.412312507629395, "global_step": 282151, "epoch": 1679} {"train_loss": -12.004573822021484, "global_step": 282152, "epoch": 1679} {"train_loss": -11.7236328125, "global_step": 282153, "epoch": 1679} {"train_loss": -11.978371620178223, "global_step": 282154, "epoch": 1679} {"train_loss": -11.845829010009766, "global_step": 282155, "epoch": 1679} {"train_loss": -11.752056121826172, "global_step": 282156, "epoch": 1679} {"train_loss": -11.846818923950195, "global_step": 282157, "epoch": 1679} {"train_loss": -11.791736602783203, "global_step": 282158, "epoch": 1679} {"train_loss": -12.244222640991211, "global_step": 282159, "epoch": 1679} {"train_loss": -12.157613754272461, "global_step": 282160, "epoch": 1679} {"train_loss": -12.114656448364258, "global_step": 282161, "epoch": 1679} {"train_loss": -12.181379318237305, "global_step": 282162, "epoch": 1679} {"train_loss": -11.953923225402832, "global_step": 282163, "epoch": 1679} {"train_loss": -12.067296981811523, "global_step": 282164, "epoch": 1679} {"train_loss": -12.059402465820312, "global_step": 282165, "epoch": 1679} {"train_loss": -12.223758697509766, "global_step": 282166, "epoch": 1679} {"train_loss": -12.129045486450195, "global_step": 282167, "epoch": 1679} {"train_loss": -12.369030952453613, "global_step": 282168, "epoch": 1679} {"train_loss": -12.20283317565918, "global_step": 282169, "epoch": 1679} {"train_loss": -12.091329574584961, "global_step": 282170, "epoch": 1679} {"train_loss": -12.160928726196289, "global_step": 282171, "epoch": 1679} {"train_loss": -12.229692459106445, "global_step": 282172, "epoch": 1679} {"train_loss": -12.355447769165039, "global_step": 282173, "epoch": 1679} {"train_loss": -12.327330589294434, "global_step": 282174, "epoch": 1679} {"train_loss": -12.355804443359375, "global_step": 282175, "epoch": 1679} {"train_loss": -11.9715576171875, "global_step": 282176, "epoch": 1679} {"train_loss": -12.238227844238281, "global_step": 282177, "epoch": 1679} {"train_loss": -12.271519660949707, "global_step": 282178, "epoch": 1679} {"train_loss": -12.00460433959961, "global_step": 282179, "epoch": 1679} {"train_loss": -12.390188217163086, "global_step": 282180, "epoch": 1679} {"train_loss": -12.15243911743164, "global_step": 282181, "epoch": 1679} {"train_loss": -12.262853622436523, "global_step": 282182, "epoch": 1679} {"train_loss": -12.41034984588623, "global_step": 282183, "epoch": 1679} {"train_loss": -12.270547866821289, "global_step": 282184, "epoch": 1679} {"train_loss": -12.068592071533203, "global_step": 282185, "epoch": 1679} {"train_loss": -11.96618938446045, "global_step": 282186, "epoch": 1679} {"train_loss": -12.229866027832031, "global_step": 282187, "epoch": 1679} {"train_loss": -12.42000961303711, "global_step": 282188, "epoch": 1679} {"train_loss": -12.228303909301758, "global_step": 282189, "epoch": 1679} {"train_loss": -12.289710998535156, "global_step": 282190, "epoch": 1679} {"train_loss": -12.208457946777344, "global_step": 282191, "epoch": 1679} {"train_loss": -12.044258117675781, "global_step": 282192, "epoch": 1679} {"train_loss": -11.877241134643555, "global_step": 282193, "epoch": 1679} {"train_loss": -12.173040390014648, "global_step": 282194, "epoch": 1679} {"train_loss": -12.343973159790039, "global_step": 282195, "epoch": 1679} {"train_loss": -12.41440200805664, "global_step": 282196, "epoch": 1679} {"train_loss": -12.324411392211914, "global_step": 282197, "epoch": 1679} {"train_loss": -12.206685066223145, "global_step": 282198, "epoch": 1679} {"train_loss": -12.343595504760742, "global_step": 282199, "epoch": 1679} {"train_loss": -12.162198066711426, "global_step": 282200, "epoch": 1679} {"train_loss": -12.474971771240234, "global_step": 282201, "epoch": 1679} {"train_loss": -12.548786163330078, "global_step": 282202, "epoch": 1679} {"train_loss": -12.459370613098145, "global_step": 282203, "epoch": 1679} {"train_loss": -12.52027416229248, "global_step": 282204, "epoch": 1679} {"train_loss": -12.477399826049805, "global_step": 282205, "epoch": 1679} {"train_loss": -12.410407066345215, "global_step": 282206, "epoch": 1679} {"train_loss": -12.263525009155273, "global_step": 282207, "epoch": 1679} {"train_loss": -12.409212112426758, "global_step": 282208, "epoch": 1679} {"train_loss": -12.230560302734375, "global_step": 282209, "epoch": 1679} {"train_loss": -12.316583633422852, "global_step": 282210, "epoch": 1679} {"train_loss": -12.567222595214844, "global_step": 282211, "epoch": 1679} {"train_loss": -12.38661003112793, "global_step": 282212, "epoch": 1679} {"train_loss": -12.564277648925781, "global_step": 282213, "epoch": 1679} {"train_loss": -12.703910827636719, "global_step": 282214, "epoch": 1679} {"train_loss": -12.482025146484375, "global_step": 282215, "epoch": 1679} {"train_loss": -12.415285110473633, "global_step": 282216, "epoch": 1679} {"train_loss": -12.443800926208496, "global_step": 282217, "epoch": 1679} {"train_loss": -12.500517845153809, "global_step": 282218, "epoch": 1679} {"train_loss": -12.52203369140625, "global_step": 282219, "epoch": 1679} {"train_loss": -12.472625732421875, "global_step": 282220, "epoch": 1679} {"train_loss": -12.446236610412598, "global_step": 282221, "epoch": 1679} {"train_loss": -12.41649055480957, "global_step": 282222, "epoch": 1679} {"train_loss": -12.3798828125, "global_step": 282223, "epoch": 1679} {"train_loss": -12.285842895507812, "global_step": 282224, "epoch": 1679} {"train_loss": -12.384695053100586, "global_step": 282225, "epoch": 1679} {"train_loss": -12.462759017944336, "global_step": 282226, "epoch": 1679} {"train_loss": -12.358491897583008, "global_step": 282227, "epoch": 1679} {"train_loss": -12.285599708557129, "global_step": 282228, "epoch": 1679} {"train_loss": -12.391805648803711, "global_step": 282229, "epoch": 1679} {"train_loss": -12.172616958618164, "global_step": 282230, "epoch": 1679} {"train_loss": -12.191298484802246, "global_step": 282231, "epoch": 1679} {"train_loss": -11.85904312133789, "global_step": 282232, "epoch": 1679} {"train_loss": -10.68263053894043, "global_step": 282233, "epoch": 1679} {"train_loss": -10.321529388427734, "global_step": 282234, "epoch": 1679} {"train_loss": -11.647439956665039, "global_step": 282235, "epoch": 1679} {"train_loss": -12.154013633728027, "global_step": 282236, "epoch": 1679} {"train_loss": -10.086868286132812, "global_step": 282237, "epoch": 1679} {"train_loss": -7.508598327636719, "global_step": 282238, "epoch": 1679} {"train_loss": -11.820315562543415, "global_step": 282239, "epoch": 1679, "val_loss": 277966.625} {"train_loss": -7.285679817199707, "global_step": 282240, "epoch": 1680} {"train_loss": -7.558381080627441, "global_step": 282241, "epoch": 1680} {"train_loss": -8.85721206665039, "global_step": 282242, "epoch": 1680} {"train_loss": -7.445956230163574, "global_step": 282243, "epoch": 1680} {"train_loss": -7.211033821105957, "global_step": 282244, "epoch": 1680} {"train_loss": -6.793935775756836, "global_step": 282245, "epoch": 1680} {"train_loss": -7.633141994476318, "global_step": 282246, "epoch": 1680} {"train_loss": -9.405437469482422, "global_step": 282247, "epoch": 1680} {"train_loss": -7.931504249572754, "global_step": 282248, "epoch": 1680} {"train_loss": -7.609658241271973, "global_step": 282249, "epoch": 1680} {"train_loss": -7.84176778793335, "global_step": 282250, "epoch": 1680} {"train_loss": -8.81269645690918, "global_step": 282251, "epoch": 1680} {"train_loss": -9.596814155578613, "global_step": 282252, "epoch": 1680} {"train_loss": -9.473041534423828, "global_step": 282253, "epoch": 1680} {"train_loss": -9.804702758789062, "global_step": 282254, "epoch": 1680} {"train_loss": -10.789318084716797, "global_step": 282255, "epoch": 1680} {"train_loss": -10.033950805664062, "global_step": 282256, "epoch": 1680} {"train_loss": -10.30670166015625, "global_step": 282257, "epoch": 1680} {"train_loss": -10.580366134643555, "global_step": 282258, "epoch": 1680} {"train_loss": -10.817178726196289, "global_step": 282259, "epoch": 1680} {"train_loss": -10.18879508972168, "global_step": 282260, "epoch": 1680} {"train_loss": -10.788359642028809, "global_step": 282261, "epoch": 1680} {"train_loss": -10.730413436889648, "global_step": 282262, "epoch": 1680} {"train_loss": -11.406255722045898, "global_step": 282263, "epoch": 1680} {"train_loss": -11.148557662963867, "global_step": 282264, "epoch": 1680} {"train_loss": -10.981651306152344, "global_step": 282265, "epoch": 1680} {"train_loss": -10.587503433227539, "global_step": 282266, "epoch": 1680} {"train_loss": -11.223572731018066, "global_step": 282267, "epoch": 1680} {"train_loss": -10.97622013092041, "global_step": 282268, "epoch": 1680} {"train_loss": -11.273674011230469, "global_step": 282269, "epoch": 1680} {"train_loss": -10.805892944335938, "global_step": 282270, "epoch": 1680} {"train_loss": -10.802299499511719, "global_step": 282271, "epoch": 1680} {"train_loss": -11.131458282470703, "global_step": 282272, "epoch": 1680} {"train_loss": -10.680133819580078, "global_step": 282273, "epoch": 1680} {"train_loss": -10.591459274291992, "global_step": 282274, "epoch": 1680} {"train_loss": -11.045404434204102, "global_step": 282275, "epoch": 1680} {"train_loss": -10.504919052124023, "global_step": 282276, "epoch": 1680} {"train_loss": -11.149471282958984, "global_step": 282277, "epoch": 1680} {"train_loss": -10.956624031066895, "global_step": 282278, "epoch": 1680} {"train_loss": -11.215547561645508, "global_step": 282279, "epoch": 1680} {"train_loss": -10.68165397644043, "global_step": 282280, "epoch": 1680} {"train_loss": -11.543843269348145, "global_step": 282281, "epoch": 1680} {"train_loss": -10.820039749145508, "global_step": 282282, "epoch": 1680} {"train_loss": -11.462492942810059, "global_step": 282283, "epoch": 1680} {"train_loss": -10.71143913269043, "global_step": 282284, "epoch": 1680} {"train_loss": -11.444730758666992, "global_step": 282285, "epoch": 1680} {"train_loss": -11.262353897094727, "global_step": 282286, "epoch": 1680} {"train_loss": -11.587356567382812, "global_step": 282287, "epoch": 1680} {"train_loss": -11.44135570526123, "global_step": 282288, "epoch": 1680} {"train_loss": -11.540939331054688, "global_step": 282289, "epoch": 1680} {"train_loss": -11.415437698364258, "global_step": 282290, "epoch": 1680} {"train_loss": -11.339933395385742, "global_step": 282291, "epoch": 1680} {"train_loss": -11.636484146118164, "global_step": 282292, "epoch": 1680} {"train_loss": -11.732749938964844, "global_step": 282293, "epoch": 1680} {"train_loss": -11.567206382751465, "global_step": 282294, "epoch": 1680} {"train_loss": -11.537971496582031, "global_step": 282295, "epoch": 1680} {"train_loss": -11.527215957641602, "global_step": 282296, "epoch": 1680} {"train_loss": -11.664458274841309, "global_step": 282297, "epoch": 1680} {"train_loss": -11.634906768798828, "global_step": 282298, "epoch": 1680} {"train_loss": -11.79213809967041, "global_step": 282299, "epoch": 1680} {"train_loss": -11.692864418029785, "global_step": 282300, "epoch": 1680} {"train_loss": -11.899848937988281, "global_step": 282301, "epoch": 1680} {"train_loss": -11.738361358642578, "global_step": 282302, "epoch": 1680} {"train_loss": -11.598584175109863, "global_step": 282303, "epoch": 1680} {"train_loss": -11.604269027709961, "global_step": 282304, "epoch": 1680} {"train_loss": -11.992555618286133, "global_step": 282305, "epoch": 1680} {"train_loss": -11.612983703613281, "global_step": 282306, "epoch": 1680} {"train_loss": -11.918245315551758, "global_step": 282307, "epoch": 1680} {"train_loss": -11.631404876708984, "global_step": 282308, "epoch": 1680} {"train_loss": -11.897448539733887, "global_step": 282309, "epoch": 1680} {"train_loss": -11.945231437683105, "global_step": 282310, "epoch": 1680} {"train_loss": -11.533052444458008, "global_step": 282311, "epoch": 1680} {"train_loss": -11.938507080078125, "global_step": 282312, "epoch": 1680} {"train_loss": -11.854904174804688, "global_step": 282313, "epoch": 1680} {"train_loss": -12.041487693786621, "global_step": 282314, "epoch": 1680} {"train_loss": -12.009574890136719, "global_step": 282315, "epoch": 1680} {"train_loss": -11.888529777526855, "global_step": 282316, "epoch": 1680} {"train_loss": -11.915909767150879, "global_step": 282317, "epoch": 1680} {"train_loss": -12.013354301452637, "global_step": 282318, "epoch": 1680} {"train_loss": -11.826370239257812, "global_step": 282319, "epoch": 1680} {"train_loss": -11.810443878173828, "global_step": 282320, "epoch": 1680} {"train_loss": -11.420966148376465, "global_step": 282321, "epoch": 1680} {"train_loss": -11.771639823913574, "global_step": 282322, "epoch": 1680} {"train_loss": -12.142413139343262, "global_step": 282323, "epoch": 1680} {"train_loss": -11.536230087280273, "global_step": 282324, "epoch": 1680} {"train_loss": -11.951772689819336, "global_step": 282325, "epoch": 1680} {"train_loss": -12.149724006652832, "global_step": 282326, "epoch": 1680} {"train_loss": -12.067117691040039, "global_step": 282327, "epoch": 1680} {"train_loss": -12.034257888793945, "global_step": 282328, "epoch": 1680} {"train_loss": -11.752358436584473, "global_step": 282329, "epoch": 1680} {"train_loss": -12.05671501159668, "global_step": 282330, "epoch": 1680} {"train_loss": -12.089244842529297, "global_step": 282331, "epoch": 1680} {"train_loss": -12.001913070678711, "global_step": 282332, "epoch": 1680} {"train_loss": -12.215949058532715, "global_step": 282333, "epoch": 1680} {"train_loss": -11.89166259765625, "global_step": 282334, "epoch": 1680} {"train_loss": -12.142433166503906, "global_step": 282335, "epoch": 1680} {"train_loss": -11.87311840057373, "global_step": 282336, "epoch": 1680} {"train_loss": -12.16445541381836, "global_step": 282337, "epoch": 1680} {"train_loss": -12.083869934082031, "global_step": 282338, "epoch": 1680} {"train_loss": -12.202476501464844, "global_step": 282339, "epoch": 1680} {"train_loss": -11.893880844116211, "global_step": 282340, "epoch": 1680} {"train_loss": -11.887069702148438, "global_step": 282341, "epoch": 1680} {"train_loss": -12.138975143432617, "global_step": 282342, "epoch": 1680} {"train_loss": -11.975736618041992, "global_step": 282343, "epoch": 1680} {"train_loss": -12.28020191192627, "global_step": 282344, "epoch": 1680} {"train_loss": -11.917903900146484, "global_step": 282345, "epoch": 1680} {"train_loss": -12.210343360900879, "global_step": 282346, "epoch": 1680} {"train_loss": -12.181699752807617, "global_step": 282347, "epoch": 1680} {"train_loss": -12.14997673034668, "global_step": 282348, "epoch": 1680} {"train_loss": -12.273323059082031, "global_step": 282349, "epoch": 1680} {"train_loss": -12.249536514282227, "global_step": 282350, "epoch": 1680} {"train_loss": -12.308935165405273, "global_step": 282351, "epoch": 1680} {"train_loss": -11.891523361206055, "global_step": 282352, "epoch": 1680} {"train_loss": -12.167901992797852, "global_step": 282353, "epoch": 1680} {"train_loss": -12.17216968536377, "global_step": 282354, "epoch": 1680} {"train_loss": -12.313316345214844, "global_step": 282355, "epoch": 1680} {"train_loss": -12.31978988647461, "global_step": 282356, "epoch": 1680} {"train_loss": -11.96697998046875, "global_step": 282357, "epoch": 1680} {"train_loss": -12.126791000366211, "global_step": 282358, "epoch": 1680} {"train_loss": -12.26345443725586, "global_step": 282359, "epoch": 1680} {"train_loss": -12.282862663269043, "global_step": 282360, "epoch": 1680} {"train_loss": -12.263749122619629, "global_step": 282361, "epoch": 1680} {"train_loss": -12.17205810546875, "global_step": 282362, "epoch": 1680} {"train_loss": -12.008883476257324, "global_step": 282363, "epoch": 1680} {"train_loss": -11.978324890136719, "global_step": 282364, "epoch": 1680} {"train_loss": -12.217880249023438, "global_step": 282365, "epoch": 1680} {"train_loss": -12.069256782531738, "global_step": 282366, "epoch": 1680} {"train_loss": -12.197205543518066, "global_step": 282367, "epoch": 1680} {"train_loss": -11.926576614379883, "global_step": 282368, "epoch": 1680} {"train_loss": -12.259588241577148, "global_step": 282369, "epoch": 1680} {"train_loss": -12.068073272705078, "global_step": 282370, "epoch": 1680} {"train_loss": -11.93265151977539, "global_step": 282371, "epoch": 1680} {"train_loss": -11.686704635620117, "global_step": 282372, "epoch": 1680} {"train_loss": -11.754047393798828, "global_step": 282373, "epoch": 1680} {"train_loss": -10.91614818572998, "global_step": 282374, "epoch": 1680} {"train_loss": -10.906912803649902, "global_step": 282375, "epoch": 1680} {"train_loss": -11.416328430175781, "global_step": 282376, "epoch": 1680} {"train_loss": -11.898927688598633, "global_step": 282377, "epoch": 1680} {"train_loss": -11.327516555786133, "global_step": 282378, "epoch": 1680} {"train_loss": -10.099309921264648, "global_step": 282379, "epoch": 1680} {"train_loss": -10.09606647491455, "global_step": 282380, "epoch": 1680} {"train_loss": -11.498059272766113, "global_step": 282381, "epoch": 1680} {"train_loss": -10.235671997070312, "global_step": 282382, "epoch": 1680} {"train_loss": -12.069334030151367, "global_step": 282383, "epoch": 1680} {"train_loss": -11.03909969329834, "global_step": 282384, "epoch": 1680} {"train_loss": -11.291330337524414, "global_step": 282385, "epoch": 1680} {"train_loss": -11.637837409973145, "global_step": 282386, "epoch": 1680} {"train_loss": -11.948760986328125, "global_step": 282387, "epoch": 1680} {"train_loss": -11.294685363769531, "global_step": 282388, "epoch": 1680} {"train_loss": -11.510473251342773, "global_step": 282389, "epoch": 1680} {"train_loss": -11.670272827148438, "global_step": 282390, "epoch": 1680} {"train_loss": -11.359646797180176, "global_step": 282391, "epoch": 1680} {"train_loss": -11.451318740844727, "global_step": 282392, "epoch": 1680} {"train_loss": -11.905292510986328, "global_step": 282393, "epoch": 1680} {"train_loss": -11.642579078674316, "global_step": 282394, "epoch": 1680} {"train_loss": -11.189693450927734, "global_step": 282395, "epoch": 1680} {"train_loss": -11.627874374389648, "global_step": 282396, "epoch": 1680} {"train_loss": -11.910075187683105, "global_step": 282397, "epoch": 1680} {"train_loss": -11.542196273803711, "global_step": 282398, "epoch": 1680} {"train_loss": -11.999723434448242, "global_step": 282399, "epoch": 1680} {"train_loss": -11.620794296264648, "global_step": 282400, "epoch": 1680} {"train_loss": -10.766728401184082, "global_step": 282401, "epoch": 1680} {"train_loss": -11.455831527709961, "global_step": 282402, "epoch": 1680} {"train_loss": -11.254730224609375, "global_step": 282403, "epoch": 1680} {"train_loss": -10.32944107055664, "global_step": 282404, "epoch": 1680} {"train_loss": -11.749299049377441, "global_step": 282405, "epoch": 1680} {"train_loss": -11.131245613098145, "global_step": 282406, "epoch": 1680} {"train_loss": -11.281344669205803, "global_step": 282407, "epoch": 1680, "val_loss": 271582.28125, "train_action_mse_error": 1.9550777673721313} {"train_loss": -11.415708541870117, "global_step": 282408, "epoch": 1681} {"train_loss": -11.032999038696289, "global_step": 282409, "epoch": 1681} {"train_loss": -11.769246101379395, "global_step": 282410, "epoch": 1681} {"train_loss": -10.97252082824707, "global_step": 282411, "epoch": 1681} {"train_loss": -11.785356521606445, "global_step": 282412, "epoch": 1681} {"train_loss": -11.548274993896484, "global_step": 282413, "epoch": 1681} {"train_loss": -10.866026878356934, "global_step": 282414, "epoch": 1681} {"train_loss": -11.425104141235352, "global_step": 282415, "epoch": 1681} {"train_loss": -11.166954040527344, "global_step": 282416, "epoch": 1681} {"train_loss": -11.653945922851562, "global_step": 282417, "epoch": 1681} {"train_loss": -10.864474296569824, "global_step": 282418, "epoch": 1681} {"train_loss": -12.047203063964844, "global_step": 282419, "epoch": 1681} {"train_loss": -11.714241027832031, "global_step": 282420, "epoch": 1681} {"train_loss": -11.481695175170898, "global_step": 282421, "epoch": 1681} {"train_loss": -11.408796310424805, "global_step": 282422, "epoch": 1681} {"train_loss": -11.431538581848145, "global_step": 282423, "epoch": 1681} {"train_loss": -12.05698013305664, "global_step": 282424, "epoch": 1681} {"train_loss": -11.247167587280273, "global_step": 282425, "epoch": 1681} {"train_loss": -11.953217506408691, "global_step": 282426, "epoch": 1681} {"train_loss": -11.571660995483398, "global_step": 282427, "epoch": 1681} {"train_loss": -11.972463607788086, "global_step": 282428, "epoch": 1681} {"train_loss": -11.834619522094727, "global_step": 282429, "epoch": 1681} {"train_loss": -11.823614120483398, "global_step": 282430, "epoch": 1681} {"train_loss": -11.798257827758789, "global_step": 282431, "epoch": 1681} {"train_loss": -11.900985717773438, "global_step": 282432, "epoch": 1681} {"train_loss": -11.787506103515625, "global_step": 282433, "epoch": 1681} {"train_loss": -12.176156044006348, "global_step": 282434, "epoch": 1681} {"train_loss": -11.849204063415527, "global_step": 282435, "epoch": 1681} {"train_loss": -12.059127807617188, "global_step": 282436, "epoch": 1681} {"train_loss": -11.70569133758545, "global_step": 282437, "epoch": 1681} {"train_loss": -11.856706619262695, "global_step": 282438, "epoch": 1681} {"train_loss": -11.619729995727539, "global_step": 282439, "epoch": 1681} {"train_loss": -11.977962493896484, "global_step": 282440, "epoch": 1681} {"train_loss": -11.580726623535156, "global_step": 282441, "epoch": 1681} {"train_loss": -11.805120468139648, "global_step": 282442, "epoch": 1681} {"train_loss": -11.397928237915039, "global_step": 282443, "epoch": 1681} {"train_loss": -11.979978561401367, "global_step": 282444, "epoch": 1681} {"train_loss": -11.678458213806152, "global_step": 282445, "epoch": 1681} {"train_loss": -12.069226264953613, "global_step": 282446, "epoch": 1681} {"train_loss": -11.862956047058105, "global_step": 282447, "epoch": 1681} {"train_loss": -11.895506858825684, "global_step": 282448, "epoch": 1681} {"train_loss": -11.90782642364502, "global_step": 282449, "epoch": 1681} {"train_loss": -11.910306930541992, "global_step": 282450, "epoch": 1681} {"train_loss": -11.5366792678833, "global_step": 282451, "epoch": 1681} {"train_loss": -12.090740203857422, "global_step": 282452, "epoch": 1681} {"train_loss": -11.434343338012695, "global_step": 282453, "epoch": 1681} {"train_loss": -11.787254333496094, "global_step": 282454, "epoch": 1681} {"train_loss": -11.455594062805176, "global_step": 282455, "epoch": 1681} {"train_loss": -12.034189224243164, "global_step": 282456, "epoch": 1681} {"train_loss": -11.680530548095703, "global_step": 282457, "epoch": 1681} {"train_loss": -11.726583480834961, "global_step": 282458, "epoch": 1681} {"train_loss": -11.962383270263672, "global_step": 282459, "epoch": 1681} {"train_loss": -11.958794593811035, "global_step": 282460, "epoch": 1681} {"train_loss": -11.845087051391602, "global_step": 282461, "epoch": 1681} {"train_loss": -11.672399520874023, "global_step": 282462, "epoch": 1681} {"train_loss": -11.812040328979492, "global_step": 282463, "epoch": 1681} {"train_loss": -11.962617874145508, "global_step": 282464, "epoch": 1681} {"train_loss": -11.695982933044434, "global_step": 282465, "epoch": 1681} {"train_loss": -12.231300354003906, "global_step": 282466, "epoch": 1681} {"train_loss": -11.636228561401367, "global_step": 282467, "epoch": 1681} {"train_loss": -12.081367492675781, "global_step": 282468, "epoch": 1681} {"train_loss": -11.721776962280273, "global_step": 282469, "epoch": 1681} {"train_loss": -12.006567001342773, "global_step": 282470, "epoch": 1681} {"train_loss": -11.827184677124023, "global_step": 282471, "epoch": 1681} {"train_loss": -12.05896282196045, "global_step": 282472, "epoch": 1681} {"train_loss": -11.941171646118164, "global_step": 282473, "epoch": 1681} {"train_loss": -12.028860092163086, "global_step": 282474, "epoch": 1681} {"train_loss": -11.833179473876953, "global_step": 282475, "epoch": 1681} {"train_loss": -12.232876777648926, "global_step": 282476, "epoch": 1681} {"train_loss": -11.813211441040039, "global_step": 282477, "epoch": 1681} {"train_loss": -12.11007308959961, "global_step": 282478, "epoch": 1681} {"train_loss": -12.00917911529541, "global_step": 282479, "epoch": 1681} {"train_loss": -11.952787399291992, "global_step": 282480, "epoch": 1681} {"train_loss": -12.201541900634766, "global_step": 282481, "epoch": 1681} {"train_loss": -12.025087356567383, "global_step": 282482, "epoch": 1681} {"train_loss": -11.970159530639648, "global_step": 282483, "epoch": 1681} {"train_loss": -12.061677932739258, "global_step": 282484, "epoch": 1681} {"train_loss": -12.138930320739746, "global_step": 282485, "epoch": 1681} {"train_loss": -11.459088325500488, "global_step": 282486, "epoch": 1681} {"train_loss": -11.842996597290039, "global_step": 282487, "epoch": 1681} {"train_loss": -11.951192855834961, "global_step": 282488, "epoch": 1681} {"train_loss": -10.574028015136719, "global_step": 282489, "epoch": 1681} {"train_loss": -11.537272453308105, "global_step": 282490, "epoch": 1681} {"train_loss": -11.422754287719727, "global_step": 282491, "epoch": 1681} {"train_loss": -11.41235637664795, "global_step": 282492, "epoch": 1681} {"train_loss": -11.068272590637207, "global_step": 282493, "epoch": 1681} {"train_loss": -11.711084365844727, "global_step": 282494, "epoch": 1681} {"train_loss": -9.855182647705078, "global_step": 282495, "epoch": 1681} {"train_loss": -10.822534561157227, "global_step": 282496, "epoch": 1681} {"train_loss": -10.849233627319336, "global_step": 282497, "epoch": 1681} {"train_loss": -11.233972549438477, "global_step": 282498, "epoch": 1681} {"train_loss": -8.89316177368164, "global_step": 282499, "epoch": 1681} {"train_loss": -10.925739288330078, "global_step": 282500, "epoch": 1681} {"train_loss": -9.643486022949219, "global_step": 282501, "epoch": 1681} {"train_loss": -9.64057731628418, "global_step": 282502, "epoch": 1681} {"train_loss": -8.608488082885742, "global_step": 282503, "epoch": 1681} {"train_loss": -10.559118270874023, "global_step": 282504, "epoch": 1681} {"train_loss": -8.19035530090332, "global_step": 282505, "epoch": 1681} {"train_loss": -9.877334594726562, "global_step": 282506, "epoch": 1681} {"train_loss": -8.025043487548828, "global_step": 282507, "epoch": 1681} {"train_loss": -9.541606903076172, "global_step": 282508, "epoch": 1681} {"train_loss": -9.263952255249023, "global_step": 282509, "epoch": 1681} {"train_loss": -9.694297790527344, "global_step": 282510, "epoch": 1681} {"train_loss": -10.368263244628906, "global_step": 282511, "epoch": 1681} {"train_loss": -9.083833694458008, "global_step": 282512, "epoch": 1681} {"train_loss": -10.684826850891113, "global_step": 282513, "epoch": 1681} {"train_loss": -9.560771942138672, "global_step": 282514, "epoch": 1681} {"train_loss": -10.228532791137695, "global_step": 282515, "epoch": 1681} {"train_loss": -10.203325271606445, "global_step": 282516, "epoch": 1681} {"train_loss": -9.981603622436523, "global_step": 282517, "epoch": 1681} {"train_loss": -10.10489273071289, "global_step": 282518, "epoch": 1681} {"train_loss": -9.861126899719238, "global_step": 282519, "epoch": 1681} {"train_loss": -9.80627155303955, "global_step": 282520, "epoch": 1681} {"train_loss": -10.706344604492188, "global_step": 282521, "epoch": 1681} {"train_loss": -10.938188552856445, "global_step": 282522, "epoch": 1681} {"train_loss": -10.020795822143555, "global_step": 282523, "epoch": 1681} {"train_loss": -11.1541166305542, "global_step": 282524, "epoch": 1681} {"train_loss": -10.558969497680664, "global_step": 282525, "epoch": 1681} {"train_loss": -9.846983909606934, "global_step": 282526, "epoch": 1681} {"train_loss": -11.274516105651855, "global_step": 282527, "epoch": 1681} {"train_loss": -10.393223762512207, "global_step": 282528, "epoch": 1681} {"train_loss": -10.576749801635742, "global_step": 282529, "epoch": 1681} {"train_loss": -10.716997146606445, "global_step": 282530, "epoch": 1681} {"train_loss": -10.926880836486816, "global_step": 282531, "epoch": 1681} {"train_loss": -10.465911865234375, "global_step": 282532, "epoch": 1681} {"train_loss": -11.328388214111328, "global_step": 282533, "epoch": 1681} {"train_loss": -11.198010444641113, "global_step": 282534, "epoch": 1681} {"train_loss": -10.831621170043945, "global_step": 282535, "epoch": 1681} {"train_loss": -11.290056228637695, "global_step": 282536, "epoch": 1681} {"train_loss": -11.23117446899414, "global_step": 282537, "epoch": 1681} {"train_loss": -11.175637245178223, "global_step": 282538, "epoch": 1681} {"train_loss": -11.263318061828613, "global_step": 282539, "epoch": 1681} {"train_loss": -11.623336791992188, "global_step": 282540, "epoch": 1681} {"train_loss": -11.333868026733398, "global_step": 282541, "epoch": 1681} {"train_loss": -11.303359985351562, "global_step": 282542, "epoch": 1681} {"train_loss": -11.398904800415039, "global_step": 282543, "epoch": 1681} {"train_loss": -11.467061996459961, "global_step": 282544, "epoch": 1681} {"train_loss": -11.337897300720215, "global_step": 282545, "epoch": 1681} {"train_loss": -11.634795188903809, "global_step": 282546, "epoch": 1681} {"train_loss": -11.50632095336914, "global_step": 282547, "epoch": 1681} {"train_loss": -11.58572006225586, "global_step": 282548, "epoch": 1681} {"train_loss": -11.63823413848877, "global_step": 282549, "epoch": 1681} {"train_loss": -11.784833908081055, "global_step": 282550, "epoch": 1681} {"train_loss": -11.637778282165527, "global_step": 282551, "epoch": 1681} {"train_loss": -11.298988342285156, "global_step": 282552, "epoch": 1681} {"train_loss": -11.717231750488281, "global_step": 282553, "epoch": 1681} {"train_loss": -11.737159729003906, "global_step": 282554, "epoch": 1681} {"train_loss": -11.465819358825684, "global_step": 282555, "epoch": 1681} {"train_loss": -11.777830123901367, "global_step": 282556, "epoch": 1681} {"train_loss": -11.55583667755127, "global_step": 282557, "epoch": 1681} {"train_loss": -11.661797523498535, "global_step": 282558, "epoch": 1681} {"train_loss": -11.749133110046387, "global_step": 282559, "epoch": 1681} {"train_loss": -11.645559310913086, "global_step": 282560, "epoch": 1681} {"train_loss": -11.458955764770508, "global_step": 282561, "epoch": 1681} {"train_loss": -11.733380317687988, "global_step": 282562, "epoch": 1681} {"train_loss": -11.58879280090332, "global_step": 282563, "epoch": 1681} {"train_loss": -11.71678352355957, "global_step": 282564, "epoch": 1681} {"train_loss": -12.041547775268555, "global_step": 282565, "epoch": 1681} {"train_loss": -11.872234344482422, "global_step": 282566, "epoch": 1681} {"train_loss": -11.895259857177734, "global_step": 282567, "epoch": 1681} {"train_loss": -11.745853424072266, "global_step": 282568, "epoch": 1681} {"train_loss": -11.962133407592773, "global_step": 282569, "epoch": 1681} {"train_loss": -12.0245361328125, "global_step": 282570, "epoch": 1681} {"train_loss": -11.835512161254883, "global_step": 282571, "epoch": 1681} {"train_loss": -12.073514938354492, "global_step": 282572, "epoch": 1681} {"train_loss": -12.093420028686523, "global_step": 282573, "epoch": 1681} {"train_loss": -11.947698593139648, "global_step": 282574, "epoch": 1681} {"train_loss": -11.331873859677996, "global_step": 282575, "epoch": 1681, "val_loss": 266646.625} {"train_loss": -12.08119010925293, "global_step": 282576, "epoch": 1682} {"train_loss": -11.611923217773438, "global_step": 282577, "epoch": 1682} {"train_loss": -12.013527870178223, "global_step": 282578, "epoch": 1682} {"train_loss": -11.976882934570312, "global_step": 282579, "epoch": 1682} {"train_loss": -12.014115333557129, "global_step": 282580, "epoch": 1682} {"train_loss": -12.067789077758789, "global_step": 282581, "epoch": 1682} {"train_loss": -12.073280334472656, "global_step": 282582, "epoch": 1682} {"train_loss": -12.050018310546875, "global_step": 282583, "epoch": 1682} {"train_loss": -12.18886947631836, "global_step": 282584, "epoch": 1682} {"train_loss": -12.06153392791748, "global_step": 282585, "epoch": 1682} {"train_loss": -12.238261222839355, "global_step": 282586, "epoch": 1682} {"train_loss": -12.053062438964844, "global_step": 282587, "epoch": 1682} {"train_loss": -12.231979370117188, "global_step": 282588, "epoch": 1682} {"train_loss": -12.215072631835938, "global_step": 282589, "epoch": 1682} {"train_loss": -12.352429389953613, "global_step": 282590, "epoch": 1682} {"train_loss": -12.142500877380371, "global_step": 282591, "epoch": 1682} {"train_loss": -12.037666320800781, "global_step": 282592, "epoch": 1682} {"train_loss": -12.302797317504883, "global_step": 282593, "epoch": 1682} {"train_loss": -12.26889419555664, "global_step": 282594, "epoch": 1682} {"train_loss": -12.305909156799316, "global_step": 282595, "epoch": 1682} {"train_loss": -12.290767669677734, "global_step": 282596, "epoch": 1682} {"train_loss": -11.935379028320312, "global_step": 282597, "epoch": 1682} {"train_loss": -12.196840286254883, "global_step": 282598, "epoch": 1682} {"train_loss": -12.142601013183594, "global_step": 282599, "epoch": 1682} {"train_loss": -12.255313873291016, "global_step": 282600, "epoch": 1682} {"train_loss": -12.080509185791016, "global_step": 282601, "epoch": 1682} {"train_loss": -12.372444152832031, "global_step": 282602, "epoch": 1682} {"train_loss": -12.25347900390625, "global_step": 282603, "epoch": 1682} {"train_loss": -12.260825157165527, "global_step": 282604, "epoch": 1682} {"train_loss": -12.206792831420898, "global_step": 282605, "epoch": 1682} {"train_loss": -12.15017318725586, "global_step": 282606, "epoch": 1682} {"train_loss": -12.312223434448242, "global_step": 282607, "epoch": 1682} {"train_loss": -12.43071460723877, "global_step": 282608, "epoch": 1682} {"train_loss": -12.168743133544922, "global_step": 282609, "epoch": 1682} {"train_loss": -12.259663581848145, "global_step": 282610, "epoch": 1682} {"train_loss": -12.062509536743164, "global_step": 282611, "epoch": 1682} {"train_loss": -12.063743591308594, "global_step": 282612, "epoch": 1682} {"train_loss": -12.026838302612305, "global_step": 282613, "epoch": 1682} {"train_loss": -12.291753768920898, "global_step": 282614, "epoch": 1682} {"train_loss": -12.159815788269043, "global_step": 282615, "epoch": 1682} {"train_loss": -11.85378646850586, "global_step": 282616, "epoch": 1682} {"train_loss": -12.452234268188477, "global_step": 282617, "epoch": 1682} {"train_loss": -11.98093032836914, "global_step": 282618, "epoch": 1682} {"train_loss": -11.89552116394043, "global_step": 282619, "epoch": 1682} {"train_loss": -12.060449600219727, "global_step": 282620, "epoch": 1682} {"train_loss": -12.294148445129395, "global_step": 282621, "epoch": 1682} {"train_loss": -11.891427993774414, "global_step": 282622, "epoch": 1682} {"train_loss": -12.194448471069336, "global_step": 282623, "epoch": 1682} {"train_loss": -12.055768966674805, "global_step": 282624, "epoch": 1682} {"train_loss": -11.400035858154297, "global_step": 282625, "epoch": 1682} {"train_loss": -11.814483642578125, "global_step": 282626, "epoch": 1682} {"train_loss": -12.089661598205566, "global_step": 282627, "epoch": 1682} {"train_loss": -11.36607551574707, "global_step": 282628, "epoch": 1682} {"train_loss": -11.574508666992188, "global_step": 282629, "epoch": 1682} {"train_loss": -12.262861251831055, "global_step": 282630, "epoch": 1682} {"train_loss": -11.775997161865234, "global_step": 282631, "epoch": 1682} {"train_loss": -11.56794548034668, "global_step": 282632, "epoch": 1682} {"train_loss": -11.785897254943848, "global_step": 282633, "epoch": 1682} {"train_loss": -11.670357704162598, "global_step": 282634, "epoch": 1682} {"train_loss": -11.205062866210938, "global_step": 282635, "epoch": 1682} {"train_loss": -11.794219970703125, "global_step": 282636, "epoch": 1682} {"train_loss": -11.330803871154785, "global_step": 282637, "epoch": 1682} {"train_loss": -10.924381256103516, "global_step": 282638, "epoch": 1682} {"train_loss": -11.601780891418457, "global_step": 282639, "epoch": 1682} {"train_loss": -9.336797714233398, "global_step": 282640, "epoch": 1682} {"train_loss": -10.027206420898438, "global_step": 282641, "epoch": 1682} {"train_loss": -9.208627700805664, "global_step": 282642, "epoch": 1682} {"train_loss": -8.402458190917969, "global_step": 282643, "epoch": 1682} {"train_loss": -9.964485168457031, "global_step": 282644, "epoch": 1682} {"train_loss": -10.215065002441406, "global_step": 282645, "epoch": 1682} {"train_loss": -10.236064910888672, "global_step": 282646, "epoch": 1682} {"train_loss": -9.19247817993164, "global_step": 282647, "epoch": 1682} {"train_loss": -10.635468482971191, "global_step": 282648, "epoch": 1682} {"train_loss": -8.303873062133789, "global_step": 282649, "epoch": 1682} {"train_loss": -10.647228240966797, "global_step": 282650, "epoch": 1682} {"train_loss": -8.522802352905273, "global_step": 282651, "epoch": 1682} {"train_loss": -8.948172569274902, "global_step": 282652, "epoch": 1682} {"train_loss": -9.929869651794434, "global_step": 282653, "epoch": 1682} {"train_loss": -8.00202751159668, "global_step": 282654, "epoch": 1682} {"train_loss": -9.025086402893066, "global_step": 282655, "epoch": 1682} {"train_loss": -8.291585922241211, "global_step": 282656, "epoch": 1682} {"train_loss": -10.081031799316406, "global_step": 282657, "epoch": 1682} {"train_loss": -9.293834686279297, "global_step": 282658, "epoch": 1682} {"train_loss": -9.168680191040039, "global_step": 282659, "epoch": 1682} {"train_loss": -8.979164123535156, "global_step": 282660, "epoch": 1682} {"train_loss": -9.671597480773926, "global_step": 282661, "epoch": 1682} {"train_loss": -10.486889839172363, "global_step": 282662, "epoch": 1682} {"train_loss": -8.696682929992676, "global_step": 282663, "epoch": 1682} {"train_loss": -10.844890594482422, "global_step": 282664, "epoch": 1682} {"train_loss": -9.897762298583984, "global_step": 282665, "epoch": 1682} {"train_loss": -10.229896545410156, "global_step": 282666, "epoch": 1682} {"train_loss": -11.16104507446289, "global_step": 282667, "epoch": 1682} {"train_loss": -10.884908676147461, "global_step": 282668, "epoch": 1682} {"train_loss": -10.779928207397461, "global_step": 282669, "epoch": 1682} {"train_loss": -11.170450210571289, "global_step": 282670, "epoch": 1682} {"train_loss": -10.771356582641602, "global_step": 282671, "epoch": 1682} {"train_loss": -10.97247314453125, "global_step": 282672, "epoch": 1682} {"train_loss": -10.723583221435547, "global_step": 282673, "epoch": 1682} {"train_loss": -11.376365661621094, "global_step": 282674, "epoch": 1682} {"train_loss": -11.218119621276855, "global_step": 282675, "epoch": 1682} {"train_loss": -11.368621826171875, "global_step": 282676, "epoch": 1682} {"train_loss": -11.336305618286133, "global_step": 282677, "epoch": 1682} {"train_loss": -11.40750789642334, "global_step": 282678, "epoch": 1682} {"train_loss": -11.209108352661133, "global_step": 282679, "epoch": 1682} {"train_loss": -11.528882026672363, "global_step": 282680, "epoch": 1682} {"train_loss": -11.391280174255371, "global_step": 282681, "epoch": 1682} {"train_loss": -11.38630485534668, "global_step": 282682, "epoch": 1682} {"train_loss": -11.644149780273438, "global_step": 282683, "epoch": 1682} {"train_loss": -11.58459758758545, "global_step": 282684, "epoch": 1682} {"train_loss": -11.667840003967285, "global_step": 282685, "epoch": 1682} {"train_loss": -11.499281883239746, "global_step": 282686, "epoch": 1682} {"train_loss": -11.54224681854248, "global_step": 282687, "epoch": 1682} {"train_loss": -11.656240463256836, "global_step": 282688, "epoch": 1682} {"train_loss": -11.713191986083984, "global_step": 282689, "epoch": 1682} {"train_loss": -11.627735137939453, "global_step": 282690, "epoch": 1682} {"train_loss": -11.570113182067871, "global_step": 282691, "epoch": 1682} {"train_loss": -11.539794921875, "global_step": 282692, "epoch": 1682} {"train_loss": -11.729920387268066, "global_step": 282693, "epoch": 1682} {"train_loss": -11.719535827636719, "global_step": 282694, "epoch": 1682} {"train_loss": -11.743898391723633, "global_step": 282695, "epoch": 1682} {"train_loss": -11.7814302444458, "global_step": 282696, "epoch": 1682} {"train_loss": -11.74410629272461, "global_step": 282697, "epoch": 1682} {"train_loss": -11.855951309204102, "global_step": 282698, "epoch": 1682} {"train_loss": -11.664651870727539, "global_step": 282699, "epoch": 1682} {"train_loss": -11.968352317810059, "global_step": 282700, "epoch": 1682} {"train_loss": -11.684391975402832, "global_step": 282701, "epoch": 1682} {"train_loss": -11.684194564819336, "global_step": 282702, "epoch": 1682} {"train_loss": -11.936843872070312, "global_step": 282703, "epoch": 1682} {"train_loss": -11.99632453918457, "global_step": 282704, "epoch": 1682} {"train_loss": -11.934782981872559, "global_step": 282705, "epoch": 1682} {"train_loss": -11.907307624816895, "global_step": 282706, "epoch": 1682} {"train_loss": -11.913212776184082, "global_step": 282707, "epoch": 1682} {"train_loss": -11.83344841003418, "global_step": 282708, "epoch": 1682} {"train_loss": -11.773963928222656, "global_step": 282709, "epoch": 1682} {"train_loss": -12.123895645141602, "global_step": 282710, "epoch": 1682} {"train_loss": -11.862191200256348, "global_step": 282711, "epoch": 1682} {"train_loss": -11.77318000793457, "global_step": 282712, "epoch": 1682} {"train_loss": -11.925276756286621, "global_step": 282713, "epoch": 1682} {"train_loss": -11.929924011230469, "global_step": 282714, "epoch": 1682} {"train_loss": -12.119168281555176, "global_step": 282715, "epoch": 1682} {"train_loss": -11.897734642028809, "global_step": 282716, "epoch": 1682} {"train_loss": -11.997255325317383, "global_step": 282717, "epoch": 1682} {"train_loss": -11.985618591308594, "global_step": 282718, "epoch": 1682} {"train_loss": -11.846414566040039, "global_step": 282719, "epoch": 1682} {"train_loss": -12.001712799072266, "global_step": 282720, "epoch": 1682} {"train_loss": -11.963302612304688, "global_step": 282721, "epoch": 1682} {"train_loss": -12.023813247680664, "global_step": 282722, "epoch": 1682} {"train_loss": -12.14926528930664, "global_step": 282723, "epoch": 1682} {"train_loss": -12.0675048828125, "global_step": 282724, "epoch": 1682} {"train_loss": -12.193182945251465, "global_step": 282725, "epoch": 1682} {"train_loss": -11.999771118164062, "global_step": 282726, "epoch": 1682} {"train_loss": -12.00790786743164, "global_step": 282727, "epoch": 1682} {"train_loss": -12.028299331665039, "global_step": 282728, "epoch": 1682} {"train_loss": -12.101869583129883, "global_step": 282729, "epoch": 1682} {"train_loss": -12.058879852294922, "global_step": 282730, "epoch": 1682} {"train_loss": -12.132390975952148, "global_step": 282731, "epoch": 1682} {"train_loss": -11.940694808959961, "global_step": 282732, "epoch": 1682} {"train_loss": -12.084948539733887, "global_step": 282733, "epoch": 1682} {"train_loss": -12.192598342895508, "global_step": 282734, "epoch": 1682} {"train_loss": -11.92580795288086, "global_step": 282735, "epoch": 1682} {"train_loss": -12.021636962890625, "global_step": 282736, "epoch": 1682} {"train_loss": -12.011600494384766, "global_step": 282737, "epoch": 1682} {"train_loss": -12.098743438720703, "global_step": 282738, "epoch": 1682} {"train_loss": -12.019099235534668, "global_step": 282739, "epoch": 1682} {"train_loss": -11.941290855407715, "global_step": 282740, "epoch": 1682} {"train_loss": -12.134700775146484, "global_step": 282741, "epoch": 1682} {"train_loss": -12.194913864135742, "global_step": 282742, "epoch": 1682} {"train_loss": -11.485473087855748, "global_step": 282743, "epoch": 1682, "val_loss": 273658.46875} {"train_loss": -11.85233211517334, "global_step": 282744, "epoch": 1683} {"train_loss": -12.333642959594727, "global_step": 282745, "epoch": 1683} {"train_loss": -11.973698616027832, "global_step": 282746, "epoch": 1683} {"train_loss": -12.20626163482666, "global_step": 282747, "epoch": 1683} {"train_loss": -11.917262077331543, "global_step": 282748, "epoch": 1683} {"train_loss": -12.176887512207031, "global_step": 282749, "epoch": 1683} {"train_loss": -12.11696720123291, "global_step": 282750, "epoch": 1683} {"train_loss": -12.365819931030273, "global_step": 282751, "epoch": 1683} {"train_loss": -12.343414306640625, "global_step": 282752, "epoch": 1683} {"train_loss": -12.23015308380127, "global_step": 282753, "epoch": 1683} {"train_loss": -12.113995552062988, "global_step": 282754, "epoch": 1683} {"train_loss": -12.12269115447998, "global_step": 282755, "epoch": 1683} {"train_loss": -12.16475772857666, "global_step": 282756, "epoch": 1683} {"train_loss": -12.343826293945312, "global_step": 282757, "epoch": 1683} {"train_loss": -12.28535270690918, "global_step": 282758, "epoch": 1683} {"train_loss": -12.328463554382324, "global_step": 282759, "epoch": 1683} {"train_loss": -12.082807540893555, "global_step": 282760, "epoch": 1683} {"train_loss": -12.489982604980469, "global_step": 282761, "epoch": 1683} {"train_loss": -11.974322319030762, "global_step": 282762, "epoch": 1683} {"train_loss": -12.080489158630371, "global_step": 282763, "epoch": 1683} {"train_loss": -12.048904418945312, "global_step": 282764, "epoch": 1683} {"train_loss": -11.805248260498047, "global_step": 282765, "epoch": 1683} {"train_loss": -11.658843994140625, "global_step": 282766, "epoch": 1683} {"train_loss": -11.706863403320312, "global_step": 282767, "epoch": 1683} {"train_loss": -11.699003219604492, "global_step": 282768, "epoch": 1683} {"train_loss": -11.389999389648438, "global_step": 282769, "epoch": 1683} {"train_loss": -11.461272239685059, "global_step": 282770, "epoch": 1683} {"train_loss": -11.752276420593262, "global_step": 282771, "epoch": 1683} {"train_loss": -11.630413055419922, "global_step": 282772, "epoch": 1683} {"train_loss": -11.495447158813477, "global_step": 282773, "epoch": 1683} {"train_loss": -11.856986999511719, "global_step": 282774, "epoch": 1683} {"train_loss": -11.612995147705078, "global_step": 282775, "epoch": 1683} {"train_loss": -10.730496406555176, "global_step": 282776, "epoch": 1683} {"train_loss": -10.38692855834961, "global_step": 282777, "epoch": 1683} {"train_loss": -12.113201141357422, "global_step": 282778, "epoch": 1683} {"train_loss": -10.253194808959961, "global_step": 282779, "epoch": 1683} {"train_loss": -8.859166145324707, "global_step": 282780, "epoch": 1683} {"train_loss": -8.916996955871582, "global_step": 282781, "epoch": 1683} {"train_loss": -9.585147857666016, "global_step": 282782, "epoch": 1683} {"train_loss": -10.997459411621094, "global_step": 282783, "epoch": 1683} {"train_loss": -8.264442443847656, "global_step": 282784, "epoch": 1683} {"train_loss": -9.05572509765625, "global_step": 282785, "epoch": 1683} {"train_loss": -10.199763298034668, "global_step": 282786, "epoch": 1683} {"train_loss": -10.113723754882812, "global_step": 282787, "epoch": 1683} {"train_loss": -10.516037940979004, "global_step": 282788, "epoch": 1683} {"train_loss": -10.62930679321289, "global_step": 282789, "epoch": 1683} {"train_loss": -9.439284324645996, "global_step": 282790, "epoch": 1683} {"train_loss": -10.045944213867188, "global_step": 282791, "epoch": 1683} {"train_loss": -10.175043106079102, "global_step": 282792, "epoch": 1683} {"train_loss": -10.37846565246582, "global_step": 282793, "epoch": 1683} {"train_loss": -10.004444122314453, "global_step": 282794, "epoch": 1683} {"train_loss": -11.18659782409668, "global_step": 282795, "epoch": 1683} {"train_loss": -10.075469970703125, "global_step": 282796, "epoch": 1683} {"train_loss": -11.727774620056152, "global_step": 282797, "epoch": 1683} {"train_loss": -10.561105728149414, "global_step": 282798, "epoch": 1683} {"train_loss": -10.753166198730469, "global_step": 282799, "epoch": 1683} {"train_loss": -9.737893104553223, "global_step": 282800, "epoch": 1683} {"train_loss": -11.254949569702148, "global_step": 282801, "epoch": 1683} {"train_loss": -9.59697151184082, "global_step": 282802, "epoch": 1683} {"train_loss": -11.466793060302734, "global_step": 282803, "epoch": 1683} {"train_loss": -9.729751586914062, "global_step": 282804, "epoch": 1683} {"train_loss": -10.985928535461426, "global_step": 282805, "epoch": 1683} {"train_loss": -10.299651145935059, "global_step": 282806, "epoch": 1683} {"train_loss": -11.159370422363281, "global_step": 282807, "epoch": 1683} {"train_loss": -11.020030975341797, "global_step": 282808, "epoch": 1683} {"train_loss": -10.672834396362305, "global_step": 282809, "epoch": 1683} {"train_loss": -11.41021728515625, "global_step": 282810, "epoch": 1683} {"train_loss": -10.813737869262695, "global_step": 282811, "epoch": 1683} {"train_loss": -11.275934219360352, "global_step": 282812, "epoch": 1683} {"train_loss": -10.827713966369629, "global_step": 282813, "epoch": 1683} {"train_loss": -11.379926681518555, "global_step": 282814, "epoch": 1683} {"train_loss": -10.788743019104004, "global_step": 282815, "epoch": 1683} {"train_loss": -11.106670379638672, "global_step": 282816, "epoch": 1683} {"train_loss": -11.510995864868164, "global_step": 282817, "epoch": 1683} {"train_loss": -10.724359512329102, "global_step": 282818, "epoch": 1683} {"train_loss": -11.631963729858398, "global_step": 282819, "epoch": 1683} {"train_loss": -10.432036399841309, "global_step": 282820, "epoch": 1683} {"train_loss": -11.333475112915039, "global_step": 282821, "epoch": 1683} {"train_loss": -10.251559257507324, "global_step": 282822, "epoch": 1683} {"train_loss": -11.4638032913208, "global_step": 282823, "epoch": 1683} {"train_loss": -11.074545860290527, "global_step": 282824, "epoch": 1683} {"train_loss": -10.866842269897461, "global_step": 282825, "epoch": 1683} {"train_loss": -11.618457794189453, "global_step": 282826, "epoch": 1683} {"train_loss": -10.847702026367188, "global_step": 282827, "epoch": 1683} {"train_loss": -11.647547721862793, "global_step": 282828, "epoch": 1683} {"train_loss": -11.469097137451172, "global_step": 282829, "epoch": 1683} {"train_loss": -11.545109748840332, "global_step": 282830, "epoch": 1683} {"train_loss": -11.350318908691406, "global_step": 282831, "epoch": 1683} {"train_loss": -11.826022148132324, "global_step": 282832, "epoch": 1683} {"train_loss": -11.47391128540039, "global_step": 282833, "epoch": 1683} {"train_loss": -11.861893653869629, "global_step": 282834, "epoch": 1683} {"train_loss": -11.763946533203125, "global_step": 282835, "epoch": 1683} {"train_loss": -11.66037654876709, "global_step": 282836, "epoch": 1683} {"train_loss": -11.769916534423828, "global_step": 282837, "epoch": 1683} {"train_loss": -11.853667259216309, "global_step": 282838, "epoch": 1683} {"train_loss": -11.886167526245117, "global_step": 282839, "epoch": 1683} {"train_loss": -11.907323837280273, "global_step": 282840, "epoch": 1683} {"train_loss": -11.923131942749023, "global_step": 282841, "epoch": 1683} {"train_loss": -11.838088989257812, "global_step": 282842, "epoch": 1683} {"train_loss": -11.985407829284668, "global_step": 282843, "epoch": 1683} {"train_loss": -11.862947463989258, "global_step": 282844, "epoch": 1683} {"train_loss": -11.932777404785156, "global_step": 282845, "epoch": 1683} {"train_loss": -12.13453483581543, "global_step": 282846, "epoch": 1683} {"train_loss": -11.816120147705078, "global_step": 282847, "epoch": 1683} {"train_loss": -12.013616561889648, "global_step": 282848, "epoch": 1683} {"train_loss": -12.092204093933105, "global_step": 282849, "epoch": 1683} {"train_loss": -11.845149040222168, "global_step": 282850, "epoch": 1683} {"train_loss": -11.946147918701172, "global_step": 282851, "epoch": 1683} {"train_loss": -11.97903060913086, "global_step": 282852, "epoch": 1683} {"train_loss": -11.896744728088379, "global_step": 282853, "epoch": 1683} {"train_loss": -11.869626998901367, "global_step": 282854, "epoch": 1683} {"train_loss": -11.858478546142578, "global_step": 282855, "epoch": 1683} {"train_loss": -12.093835830688477, "global_step": 282856, "epoch": 1683} {"train_loss": -12.114407539367676, "global_step": 282857, "epoch": 1683} {"train_loss": -11.960603713989258, "global_step": 282858, "epoch": 1683} {"train_loss": -12.058326721191406, "global_step": 282859, "epoch": 1683} {"train_loss": -12.03885269165039, "global_step": 282860, "epoch": 1683} {"train_loss": -11.96902084350586, "global_step": 282861, "epoch": 1683} {"train_loss": -11.922958374023438, "global_step": 282862, "epoch": 1683} {"train_loss": -12.2122163772583, "global_step": 282863, "epoch": 1683} {"train_loss": -12.278082847595215, "global_step": 282864, "epoch": 1683} {"train_loss": -11.919084548950195, "global_step": 282865, "epoch": 1683} {"train_loss": -12.18452262878418, "global_step": 282866, "epoch": 1683} {"train_loss": -12.206315994262695, "global_step": 282867, "epoch": 1683} {"train_loss": -12.181873321533203, "global_step": 282868, "epoch": 1683} {"train_loss": -12.34300708770752, "global_step": 282869, "epoch": 1683} {"train_loss": -12.154500007629395, "global_step": 282870, "epoch": 1683} {"train_loss": -12.229218482971191, "global_step": 282871, "epoch": 1683} {"train_loss": -12.317167282104492, "global_step": 282872, "epoch": 1683} {"train_loss": -12.09813117980957, "global_step": 282873, "epoch": 1683} {"train_loss": -12.250353813171387, "global_step": 282874, "epoch": 1683} {"train_loss": -12.033395767211914, "global_step": 282875, "epoch": 1683} {"train_loss": -12.213136672973633, "global_step": 282876, "epoch": 1683} {"train_loss": -12.288022994995117, "global_step": 282877, "epoch": 1683} {"train_loss": -12.288747787475586, "global_step": 282878, "epoch": 1683} {"train_loss": -12.241447448730469, "global_step": 282879, "epoch": 1683} {"train_loss": -12.22697639465332, "global_step": 282880, "epoch": 1683} {"train_loss": -12.24348258972168, "global_step": 282881, "epoch": 1683} {"train_loss": -12.372138977050781, "global_step": 282882, "epoch": 1683} {"train_loss": -12.239896774291992, "global_step": 282883, "epoch": 1683} {"train_loss": -12.372825622558594, "global_step": 282884, "epoch": 1683} {"train_loss": -12.390369415283203, "global_step": 282885, "epoch": 1683} {"train_loss": -12.374671936035156, "global_step": 282886, "epoch": 1683} {"train_loss": -12.28769588470459, "global_step": 282887, "epoch": 1683} {"train_loss": -12.309768676757812, "global_step": 282888, "epoch": 1683} {"train_loss": -12.293627738952637, "global_step": 282889, "epoch": 1683} {"train_loss": -12.360085487365723, "global_step": 282890, "epoch": 1683} {"train_loss": -11.735757827758789, "global_step": 282891, "epoch": 1683} {"train_loss": -12.170073509216309, "global_step": 282892, "epoch": 1683} {"train_loss": -12.033681869506836, "global_step": 282893, "epoch": 1683} {"train_loss": -12.004175186157227, "global_step": 282894, "epoch": 1683} {"train_loss": -10.664056777954102, "global_step": 282895, "epoch": 1683} {"train_loss": -9.696683883666992, "global_step": 282896, "epoch": 1683} {"train_loss": -12.087095260620117, "global_step": 282897, "epoch": 1683} {"train_loss": -11.033245086669922, "global_step": 282898, "epoch": 1683} {"train_loss": -9.490568161010742, "global_step": 282899, "epoch": 1683} {"train_loss": -11.71884822845459, "global_step": 282900, "epoch": 1683} {"train_loss": -11.250107765197754, "global_step": 282901, "epoch": 1683} {"train_loss": -10.958318710327148, "global_step": 282902, "epoch": 1683} {"train_loss": -11.36066722869873, "global_step": 282903, "epoch": 1683} {"train_loss": -11.350606918334961, "global_step": 282904, "epoch": 1683} {"train_loss": -8.885578155517578, "global_step": 282905, "epoch": 1683} {"train_loss": -8.755661010742188, "global_step": 282906, "epoch": 1683} {"train_loss": -10.773797988891602, "global_step": 282907, "epoch": 1683} {"train_loss": -11.100034713745117, "global_step": 282908, "epoch": 1683} {"train_loss": -10.445969581604004, "global_step": 282909, "epoch": 1683} {"train_loss": -8.246692657470703, "global_step": 282910, "epoch": 1683} {"train_loss": -11.418402353922525, "global_step": 282911, "epoch": 1683, "val_loss": 273765.3125} {"train_loss": -11.635273933410645, "global_step": 282912, "epoch": 1684} {"train_loss": -9.867801666259766, "global_step": 282913, "epoch": 1684} {"train_loss": -10.645492553710938, "global_step": 282914, "epoch": 1684} {"train_loss": -10.951498985290527, "global_step": 282915, "epoch": 1684} {"train_loss": -9.923173904418945, "global_step": 282916, "epoch": 1684} {"train_loss": -10.747157096862793, "global_step": 282917, "epoch": 1684} {"train_loss": -10.12687873840332, "global_step": 282918, "epoch": 1684} {"train_loss": -10.959744453430176, "global_step": 282919, "epoch": 1684} {"train_loss": -11.133665084838867, "global_step": 282920, "epoch": 1684} {"train_loss": -10.62960147857666, "global_step": 282921, "epoch": 1684} {"train_loss": -11.265603065490723, "global_step": 282922, "epoch": 1684} {"train_loss": -10.054325103759766, "global_step": 282923, "epoch": 1684} {"train_loss": -10.911441802978516, "global_step": 282924, "epoch": 1684} {"train_loss": -9.955375671386719, "global_step": 282925, "epoch": 1684} {"train_loss": -10.902671813964844, "global_step": 282926, "epoch": 1684} {"train_loss": -10.51384449005127, "global_step": 282927, "epoch": 1684} {"train_loss": -10.52823257446289, "global_step": 282928, "epoch": 1684} {"train_loss": -10.413503646850586, "global_step": 282929, "epoch": 1684} {"train_loss": -10.45872974395752, "global_step": 282930, "epoch": 1684} {"train_loss": -10.386163711547852, "global_step": 282931, "epoch": 1684} {"train_loss": -11.34772777557373, "global_step": 282932, "epoch": 1684} {"train_loss": -10.738869667053223, "global_step": 282933, "epoch": 1684} {"train_loss": -10.569580078125, "global_step": 282934, "epoch": 1684} {"train_loss": -10.312414169311523, "global_step": 282935, "epoch": 1684} {"train_loss": -10.986852645874023, "global_step": 282936, "epoch": 1684} {"train_loss": -10.1802978515625, "global_step": 282937, "epoch": 1684} {"train_loss": -10.434816360473633, "global_step": 282938, "epoch": 1684} {"train_loss": -11.329471588134766, "global_step": 282939, "epoch": 1684} {"train_loss": -10.46566390991211, "global_step": 282940, "epoch": 1684} {"train_loss": -10.511730194091797, "global_step": 282941, "epoch": 1684} {"train_loss": -11.02658462524414, "global_step": 282942, "epoch": 1684} {"train_loss": -10.309391021728516, "global_step": 282943, "epoch": 1684} {"train_loss": -10.565921783447266, "global_step": 282944, "epoch": 1684} {"train_loss": -11.352582931518555, "global_step": 282945, "epoch": 1684} {"train_loss": -9.668744087219238, "global_step": 282946, "epoch": 1684} {"train_loss": -11.054374694824219, "global_step": 282947, "epoch": 1684} {"train_loss": -11.127832412719727, "global_step": 282948, "epoch": 1684} {"train_loss": -10.44035816192627, "global_step": 282949, "epoch": 1684} {"train_loss": -11.592741966247559, "global_step": 282950, "epoch": 1684} {"train_loss": -11.10548210144043, "global_step": 282951, "epoch": 1684} {"train_loss": -10.846415519714355, "global_step": 282952, "epoch": 1684} {"train_loss": -11.444457054138184, "global_step": 282953, "epoch": 1684} {"train_loss": -11.565229415893555, "global_step": 282954, "epoch": 1684} {"train_loss": -11.18666934967041, "global_step": 282955, "epoch": 1684} {"train_loss": -11.481727600097656, "global_step": 282956, "epoch": 1684} {"train_loss": -11.589128494262695, "global_step": 282957, "epoch": 1684} {"train_loss": -11.623085021972656, "global_step": 282958, "epoch": 1684} {"train_loss": -11.368526458740234, "global_step": 282959, "epoch": 1684} {"train_loss": -11.605377197265625, "global_step": 282960, "epoch": 1684} {"train_loss": -11.291391372680664, "global_step": 282961, "epoch": 1684} {"train_loss": -11.637555122375488, "global_step": 282962, "epoch": 1684} {"train_loss": -11.613029479980469, "global_step": 282963, "epoch": 1684} {"train_loss": -11.615521430969238, "global_step": 282964, "epoch": 1684} {"train_loss": -11.760875701904297, "global_step": 282965, "epoch": 1684} {"train_loss": -11.757292747497559, "global_step": 282966, "epoch": 1684} {"train_loss": -11.659749031066895, "global_step": 282967, "epoch": 1684} {"train_loss": -11.771122932434082, "global_step": 282968, "epoch": 1684} {"train_loss": -11.949031829833984, "global_step": 282969, "epoch": 1684} {"train_loss": -11.719071388244629, "global_step": 282970, "epoch": 1684} {"train_loss": -11.850135803222656, "global_step": 282971, "epoch": 1684} {"train_loss": -12.009170532226562, "global_step": 282972, "epoch": 1684} {"train_loss": -11.685113906860352, "global_step": 282973, "epoch": 1684} {"train_loss": -11.800507545471191, "global_step": 282974, "epoch": 1684} {"train_loss": -11.875948905944824, "global_step": 282975, "epoch": 1684} {"train_loss": -11.94844913482666, "global_step": 282976, "epoch": 1684} {"train_loss": -11.674786567687988, "global_step": 282977, "epoch": 1684} {"train_loss": -11.976282119750977, "global_step": 282978, "epoch": 1684} {"train_loss": -11.90144157409668, "global_step": 282979, "epoch": 1684} {"train_loss": -11.934687614440918, "global_step": 282980, "epoch": 1684} {"train_loss": -11.775321960449219, "global_step": 282981, "epoch": 1684} {"train_loss": -11.821493148803711, "global_step": 282982, "epoch": 1684} {"train_loss": -12.013172149658203, "global_step": 282983, "epoch": 1684} {"train_loss": -12.020124435424805, "global_step": 282984, "epoch": 1684} {"train_loss": -11.940021514892578, "global_step": 282985, "epoch": 1684} {"train_loss": -11.80815315246582, "global_step": 282986, "epoch": 1684} {"train_loss": -11.872808456420898, "global_step": 282987, "epoch": 1684} {"train_loss": -12.018411636352539, "global_step": 282988, "epoch": 1684} {"train_loss": -11.892631530761719, "global_step": 282989, "epoch": 1684} {"train_loss": -12.094284057617188, "global_step": 282990, "epoch": 1684} {"train_loss": -11.95356559753418, "global_step": 282991, "epoch": 1684} {"train_loss": -12.018253326416016, "global_step": 282992, "epoch": 1684} {"train_loss": -11.981843948364258, "global_step": 282993, "epoch": 1684} {"train_loss": -11.98491096496582, "global_step": 282994, "epoch": 1684} {"train_loss": -12.200396537780762, "global_step": 282995, "epoch": 1684} {"train_loss": -12.0770263671875, "global_step": 282996, "epoch": 1684} {"train_loss": -12.209732055664062, "global_step": 282997, "epoch": 1684} {"train_loss": -11.768017768859863, "global_step": 282998, "epoch": 1684} {"train_loss": -12.012369155883789, "global_step": 282999, "epoch": 1684} {"train_loss": -12.19548225402832, "global_step": 283000, "epoch": 1684} {"train_loss": -12.06648063659668, "global_step": 283001, "epoch": 1684} {"train_loss": -11.94980525970459, "global_step": 283002, "epoch": 1684} {"train_loss": -12.12561321258545, "global_step": 283003, "epoch": 1684} {"train_loss": -11.566621780395508, "global_step": 283004, "epoch": 1684} {"train_loss": -11.785608291625977, "global_step": 283005, "epoch": 1684} {"train_loss": -12.211776733398438, "global_step": 283006, "epoch": 1684} {"train_loss": -11.919883728027344, "global_step": 283007, "epoch": 1684} {"train_loss": -12.188362121582031, "global_step": 283008, "epoch": 1684} {"train_loss": -12.102287292480469, "global_step": 283009, "epoch": 1684} {"train_loss": -12.278484344482422, "global_step": 283010, "epoch": 1684} {"train_loss": -12.073650360107422, "global_step": 283011, "epoch": 1684} {"train_loss": -12.156311988830566, "global_step": 283012, "epoch": 1684} {"train_loss": -12.046571731567383, "global_step": 283013, "epoch": 1684} {"train_loss": -12.24618148803711, "global_step": 283014, "epoch": 1684} {"train_loss": -12.209817886352539, "global_step": 283015, "epoch": 1684} {"train_loss": -12.073579788208008, "global_step": 283016, "epoch": 1684} {"train_loss": -12.12563705444336, "global_step": 283017, "epoch": 1684} {"train_loss": -11.911707878112793, "global_step": 283018, "epoch": 1684} {"train_loss": -12.114105224609375, "global_step": 283019, "epoch": 1684} {"train_loss": -12.037860870361328, "global_step": 283020, "epoch": 1684} {"train_loss": -12.342183113098145, "global_step": 283021, "epoch": 1684} {"train_loss": -11.538444519042969, "global_step": 283022, "epoch": 1684} {"train_loss": -11.975927352905273, "global_step": 283023, "epoch": 1684} {"train_loss": -11.683395385742188, "global_step": 283024, "epoch": 1684} {"train_loss": -12.209829330444336, "global_step": 283025, "epoch": 1684} {"train_loss": -11.982400894165039, "global_step": 283026, "epoch": 1684} {"train_loss": -12.186695098876953, "global_step": 283027, "epoch": 1684} {"train_loss": -12.20030403137207, "global_step": 283028, "epoch": 1684} {"train_loss": -11.579071044921875, "global_step": 283029, "epoch": 1684} {"train_loss": -12.065818786621094, "global_step": 283030, "epoch": 1684} {"train_loss": -11.80771255493164, "global_step": 283031, "epoch": 1684} {"train_loss": -11.423734664916992, "global_step": 283032, "epoch": 1684} {"train_loss": -11.794611930847168, "global_step": 283033, "epoch": 1684} {"train_loss": -11.381317138671875, "global_step": 283034, "epoch": 1684} {"train_loss": -12.204713821411133, "global_step": 283035, "epoch": 1684} {"train_loss": -11.818817138671875, "global_step": 283036, "epoch": 1684} {"train_loss": -11.9569673538208, "global_step": 283037, "epoch": 1684} {"train_loss": -11.933425903320312, "global_step": 283038, "epoch": 1684} {"train_loss": -11.929436683654785, "global_step": 283039, "epoch": 1684} {"train_loss": -12.253320693969727, "global_step": 283040, "epoch": 1684} {"train_loss": -11.585393905639648, "global_step": 283041, "epoch": 1684} {"train_loss": -11.429670333862305, "global_step": 283042, "epoch": 1684} {"train_loss": -11.346263885498047, "global_step": 283043, "epoch": 1684} {"train_loss": -12.170927047729492, "global_step": 283044, "epoch": 1684} {"train_loss": -12.298589706420898, "global_step": 283045, "epoch": 1684} {"train_loss": -12.014806747436523, "global_step": 283046, "epoch": 1684} {"train_loss": -11.473258018493652, "global_step": 283047, "epoch": 1684} {"train_loss": -11.882489204406738, "global_step": 283048, "epoch": 1684} {"train_loss": -12.367080688476562, "global_step": 283049, "epoch": 1684} {"train_loss": -11.986552238464355, "global_step": 283050, "epoch": 1684} {"train_loss": -11.453333854675293, "global_step": 283051, "epoch": 1684} {"train_loss": -11.904001235961914, "global_step": 283052, "epoch": 1684} {"train_loss": -11.768926620483398, "global_step": 283053, "epoch": 1684} {"train_loss": -12.269031524658203, "global_step": 283054, "epoch": 1684} {"train_loss": -12.199419021606445, "global_step": 283055, "epoch": 1684} {"train_loss": -11.853378295898438, "global_step": 283056, "epoch": 1684} {"train_loss": -11.960212707519531, "global_step": 283057, "epoch": 1684} {"train_loss": -11.98037052154541, "global_step": 283058, "epoch": 1684} {"train_loss": -11.992856979370117, "global_step": 283059, "epoch": 1684} {"train_loss": -12.182446479797363, "global_step": 283060, "epoch": 1684} {"train_loss": -12.075136184692383, "global_step": 283061, "epoch": 1684} {"train_loss": -12.050453186035156, "global_step": 283062, "epoch": 1684} {"train_loss": -12.017210006713867, "global_step": 283063, "epoch": 1684} {"train_loss": -11.816015243530273, "global_step": 283064, "epoch": 1684} {"train_loss": -10.175682067871094, "global_step": 283065, "epoch": 1684} {"train_loss": -11.667444229125977, "global_step": 283066, "epoch": 1684} {"train_loss": -10.736392974853516, "global_step": 283067, "epoch": 1684} {"train_loss": -11.141709327697754, "global_step": 283068, "epoch": 1684} {"train_loss": -9.853906631469727, "global_step": 283069, "epoch": 1684} {"train_loss": -11.136544227600098, "global_step": 283070, "epoch": 1684} {"train_loss": -11.446009635925293, "global_step": 283071, "epoch": 1684} {"train_loss": -11.339371681213379, "global_step": 283072, "epoch": 1684} {"train_loss": -11.473003387451172, "global_step": 283073, "epoch": 1684} {"train_loss": -11.6051025390625, "global_step": 283074, "epoch": 1684} {"train_loss": -11.478111267089844, "global_step": 283075, "epoch": 1684} {"train_loss": -11.542459487915039, "global_step": 283076, "epoch": 1684} {"train_loss": -11.503573417663574, "global_step": 283077, "epoch": 1684} {"train_loss": -11.291120529174805, "global_step": 283078, "epoch": 1684} {"train_loss": -11.538893909681411, "global_step": 283079, "epoch": 1684, "val_loss": 273274.65625} {"train_loss": -11.122819900512695, "global_step": 283080, "epoch": 1685} {"train_loss": -11.041204452514648, "global_step": 283081, "epoch": 1685} {"train_loss": -10.254009246826172, "global_step": 283082, "epoch": 1685} {"train_loss": -10.70434856414795, "global_step": 283083, "epoch": 1685} {"train_loss": -11.121299743652344, "global_step": 283084, "epoch": 1685} {"train_loss": -9.973791122436523, "global_step": 283085, "epoch": 1685} {"train_loss": -10.87942123413086, "global_step": 283086, "epoch": 1685} {"train_loss": -8.807640075683594, "global_step": 283087, "epoch": 1685} {"train_loss": -8.218996047973633, "global_step": 283088, "epoch": 1685} {"train_loss": -10.671497344970703, "global_step": 283089, "epoch": 1685} {"train_loss": -8.729491233825684, "global_step": 283090, "epoch": 1685} {"train_loss": -8.54934310913086, "global_step": 283091, "epoch": 1685} {"train_loss": -7.944321632385254, "global_step": 283092, "epoch": 1685} {"train_loss": -8.728669166564941, "global_step": 283093, "epoch": 1685} {"train_loss": -9.563554763793945, "global_step": 283094, "epoch": 1685} {"train_loss": -8.699946403503418, "global_step": 283095, "epoch": 1685} {"train_loss": -9.871522903442383, "global_step": 283096, "epoch": 1685} {"train_loss": -10.881170272827148, "global_step": 283097, "epoch": 1685} {"train_loss": -10.472204208374023, "global_step": 283098, "epoch": 1685} {"train_loss": -10.636143684387207, "global_step": 283099, "epoch": 1685} {"train_loss": -10.335871696472168, "global_step": 283100, "epoch": 1685} {"train_loss": -10.273990631103516, "global_step": 283101, "epoch": 1685} {"train_loss": -11.543086051940918, "global_step": 283102, "epoch": 1685} {"train_loss": -9.939146995544434, "global_step": 283103, "epoch": 1685} {"train_loss": -11.281160354614258, "global_step": 283104, "epoch": 1685} {"train_loss": -11.29761028289795, "global_step": 283105, "epoch": 1685} {"train_loss": -10.535972595214844, "global_step": 283106, "epoch": 1685} {"train_loss": -11.375415802001953, "global_step": 283107, "epoch": 1685} {"train_loss": -10.815107345581055, "global_step": 283108, "epoch": 1685} {"train_loss": -11.12115478515625, "global_step": 283109, "epoch": 1685} {"train_loss": -11.102640151977539, "global_step": 283110, "epoch": 1685} {"train_loss": -11.430811882019043, "global_step": 283111, "epoch": 1685} {"train_loss": -11.270170211791992, "global_step": 283112, "epoch": 1685} {"train_loss": -11.543924331665039, "global_step": 283113, "epoch": 1685} {"train_loss": -11.322620391845703, "global_step": 283114, "epoch": 1685} {"train_loss": -11.50787353515625, "global_step": 283115, "epoch": 1685} {"train_loss": -11.71816635131836, "global_step": 283116, "epoch": 1685} {"train_loss": -11.61972427368164, "global_step": 283117, "epoch": 1685} {"train_loss": -11.573143005371094, "global_step": 283118, "epoch": 1685} {"train_loss": -11.612325668334961, "global_step": 283119, "epoch": 1685} {"train_loss": -11.712778091430664, "global_step": 283120, "epoch": 1685} {"train_loss": -11.599047660827637, "global_step": 283121, "epoch": 1685} {"train_loss": -11.859405517578125, "global_step": 283122, "epoch": 1685} {"train_loss": -11.855352401733398, "global_step": 283123, "epoch": 1685} {"train_loss": -11.613466262817383, "global_step": 283124, "epoch": 1685} {"train_loss": -11.861809730529785, "global_step": 283125, "epoch": 1685} {"train_loss": -11.744028091430664, "global_step": 283126, "epoch": 1685} {"train_loss": -12.08357048034668, "global_step": 283127, "epoch": 1685} {"train_loss": -11.842925071716309, "global_step": 283128, "epoch": 1685} {"train_loss": -11.882194519042969, "global_step": 283129, "epoch": 1685} {"train_loss": -11.842950820922852, "global_step": 283130, "epoch": 1685} {"train_loss": -12.236349105834961, "global_step": 283131, "epoch": 1685} {"train_loss": -11.687713623046875, "global_step": 283132, "epoch": 1685} {"train_loss": -12.059507369995117, "global_step": 283133, "epoch": 1685} {"train_loss": -11.909107208251953, "global_step": 283134, "epoch": 1685} {"train_loss": -11.960193634033203, "global_step": 283135, "epoch": 1685} {"train_loss": -11.906770706176758, "global_step": 283136, "epoch": 1685} {"train_loss": -11.88827896118164, "global_step": 283137, "epoch": 1685} {"train_loss": -12.176177978515625, "global_step": 283138, "epoch": 1685} {"train_loss": -11.965010643005371, "global_step": 283139, "epoch": 1685} {"train_loss": -12.081395149230957, "global_step": 283140, "epoch": 1685} {"train_loss": -12.023117065429688, "global_step": 283141, "epoch": 1685} {"train_loss": -11.863570213317871, "global_step": 283142, "epoch": 1685} {"train_loss": -12.011147499084473, "global_step": 283143, "epoch": 1685} {"train_loss": -11.720819473266602, "global_step": 283144, "epoch": 1685} {"train_loss": -12.158658981323242, "global_step": 283145, "epoch": 1685} {"train_loss": -11.865421295166016, "global_step": 283146, "epoch": 1685} {"train_loss": -11.956690788269043, "global_step": 283147, "epoch": 1685} {"train_loss": -12.117990493774414, "global_step": 283148, "epoch": 1685} {"train_loss": -12.105321884155273, "global_step": 283149, "epoch": 1685} {"train_loss": -12.10774040222168, "global_step": 283150, "epoch": 1685} {"train_loss": -11.945201873779297, "global_step": 283151, "epoch": 1685} {"train_loss": -12.165815353393555, "global_step": 283152, "epoch": 1685} {"train_loss": -12.364606857299805, "global_step": 283153, "epoch": 1685} {"train_loss": -12.120328903198242, "global_step": 283154, "epoch": 1685} {"train_loss": -12.275524139404297, "global_step": 283155, "epoch": 1685} {"train_loss": -12.145849227905273, "global_step": 283156, "epoch": 1685} {"train_loss": -12.271130561828613, "global_step": 283157, "epoch": 1685} {"train_loss": -12.269758224487305, "global_step": 283158, "epoch": 1685} {"train_loss": -12.261762619018555, "global_step": 283159, "epoch": 1685} {"train_loss": -12.342735290527344, "global_step": 283160, "epoch": 1685} {"train_loss": -12.10523796081543, "global_step": 283161, "epoch": 1685} {"train_loss": -12.390642166137695, "global_step": 283162, "epoch": 1685} {"train_loss": -12.392539978027344, "global_step": 283163, "epoch": 1685} {"train_loss": -12.233260154724121, "global_step": 283164, "epoch": 1685} {"train_loss": -12.391565322875977, "global_step": 283165, "epoch": 1685} {"train_loss": -12.342695236206055, "global_step": 283166, "epoch": 1685} {"train_loss": -12.239080429077148, "global_step": 283167, "epoch": 1685} {"train_loss": -12.426597595214844, "global_step": 283168, "epoch": 1685} {"train_loss": -12.017783164978027, "global_step": 283169, "epoch": 1685} {"train_loss": -12.00974178314209, "global_step": 283170, "epoch": 1685} {"train_loss": -12.273987770080566, "global_step": 283171, "epoch": 1685} {"train_loss": -12.390182495117188, "global_step": 283172, "epoch": 1685} {"train_loss": -12.361064910888672, "global_step": 283173, "epoch": 1685} {"train_loss": -12.31612777709961, "global_step": 283174, "epoch": 1685} {"train_loss": -12.243191719055176, "global_step": 283175, "epoch": 1685} {"train_loss": -12.177276611328125, "global_step": 283176, "epoch": 1685} {"train_loss": -11.93006420135498, "global_step": 283177, "epoch": 1685} {"train_loss": -12.384300231933594, "global_step": 283178, "epoch": 1685} {"train_loss": -11.910712242126465, "global_step": 283179, "epoch": 1685} {"train_loss": -12.1038236618042, "global_step": 283180, "epoch": 1685} {"train_loss": -11.483383178710938, "global_step": 283181, "epoch": 1685} {"train_loss": -12.05244255065918, "global_step": 283182, "epoch": 1685} {"train_loss": -11.268129348754883, "global_step": 283183, "epoch": 1685} {"train_loss": -10.37615966796875, "global_step": 283184, "epoch": 1685} {"train_loss": -10.457693099975586, "global_step": 283185, "epoch": 1685} {"train_loss": -11.0971097946167, "global_step": 283186, "epoch": 1685} {"train_loss": -11.977346420288086, "global_step": 283187, "epoch": 1685} {"train_loss": -11.451516151428223, "global_step": 283188, "epoch": 1685} {"train_loss": -11.857219696044922, "global_step": 283189, "epoch": 1685} {"train_loss": -11.522064208984375, "global_step": 283190, "epoch": 1685} {"train_loss": -11.607223510742188, "global_step": 283191, "epoch": 1685} {"train_loss": -11.320259094238281, "global_step": 283192, "epoch": 1685} {"train_loss": -11.521259307861328, "global_step": 283193, "epoch": 1685} {"train_loss": -11.815850257873535, "global_step": 283194, "epoch": 1685} {"train_loss": -11.501431465148926, "global_step": 283195, "epoch": 1685} {"train_loss": -11.743734359741211, "global_step": 283196, "epoch": 1685} {"train_loss": -11.144025802612305, "global_step": 283197, "epoch": 1685} {"train_loss": -10.771002769470215, "global_step": 283198, "epoch": 1685} {"train_loss": -10.825469017028809, "global_step": 283199, "epoch": 1685} {"train_loss": -10.339845657348633, "global_step": 283200, "epoch": 1685} {"train_loss": -11.615961074829102, "global_step": 283201, "epoch": 1685} {"train_loss": -10.581119537353516, "global_step": 283202, "epoch": 1685} {"train_loss": -10.972759246826172, "global_step": 283203, "epoch": 1685} {"train_loss": -11.394445419311523, "global_step": 283204, "epoch": 1685} {"train_loss": -10.891088485717773, "global_step": 283205, "epoch": 1685} {"train_loss": -11.09556770324707, "global_step": 283206, "epoch": 1685} {"train_loss": -11.789899826049805, "global_step": 283207, "epoch": 1685} {"train_loss": -11.712705612182617, "global_step": 283208, "epoch": 1685} {"train_loss": -11.920265197753906, "global_step": 283209, "epoch": 1685} {"train_loss": -11.618741989135742, "global_step": 283210, "epoch": 1685} {"train_loss": -11.917655944824219, "global_step": 283211, "epoch": 1685} {"train_loss": -11.72575569152832, "global_step": 283212, "epoch": 1685} {"train_loss": -11.920162200927734, "global_step": 283213, "epoch": 1685} {"train_loss": -11.808008193969727, "global_step": 283214, "epoch": 1685} {"train_loss": -11.889260292053223, "global_step": 283215, "epoch": 1685} {"train_loss": -11.957246780395508, "global_step": 283216, "epoch": 1685} {"train_loss": -12.017929077148438, "global_step": 283217, "epoch": 1685} {"train_loss": -11.905559539794922, "global_step": 283218, "epoch": 1685} {"train_loss": -11.947610855102539, "global_step": 283219, "epoch": 1685} {"train_loss": -12.228822708129883, "global_step": 283220, "epoch": 1685} {"train_loss": -11.993002891540527, "global_step": 283221, "epoch": 1685} {"train_loss": -12.30459976196289, "global_step": 283222, "epoch": 1685} {"train_loss": -11.918134689331055, "global_step": 283223, "epoch": 1685} {"train_loss": -12.01149845123291, "global_step": 283224, "epoch": 1685} {"train_loss": -12.167133331298828, "global_step": 283225, "epoch": 1685} {"train_loss": -11.866743087768555, "global_step": 283226, "epoch": 1685} {"train_loss": -11.93387222290039, "global_step": 283227, "epoch": 1685} {"train_loss": -11.83902359008789, "global_step": 283228, "epoch": 1685} {"train_loss": -12.026122093200684, "global_step": 283229, "epoch": 1685} {"train_loss": -11.443109512329102, "global_step": 283230, "epoch": 1685} {"train_loss": -12.209856033325195, "global_step": 283231, "epoch": 1685} {"train_loss": -11.448915481567383, "global_step": 283232, "epoch": 1685} {"train_loss": -12.07501220703125, "global_step": 283233, "epoch": 1685} {"train_loss": -11.876087188720703, "global_step": 283234, "epoch": 1685} {"train_loss": -11.765235900878906, "global_step": 283235, "epoch": 1685} {"train_loss": -11.999951362609863, "global_step": 283236, "epoch": 1685} {"train_loss": -11.420868873596191, "global_step": 283237, "epoch": 1685} {"train_loss": -12.026065826416016, "global_step": 283238, "epoch": 1685} {"train_loss": -11.962503433227539, "global_step": 283239, "epoch": 1685} {"train_loss": -11.992515563964844, "global_step": 283240, "epoch": 1685} {"train_loss": -12.038200378417969, "global_step": 283241, "epoch": 1685} {"train_loss": -11.943531036376953, "global_step": 283242, "epoch": 1685} {"train_loss": -11.997450828552246, "global_step": 283243, "epoch": 1685} {"train_loss": -11.992238998413086, "global_step": 283244, "epoch": 1685} {"train_loss": -11.328721046447754, "global_step": 283245, "epoch": 1685} {"train_loss": -12.233345031738281, "global_step": 283246, "epoch": 1685} {"train_loss": -11.527946182659694, "global_step": 283247, "epoch": 1685, "val_loss": 276836.71875, "train_action_mse_error": 0.6710467338562012} {"train_loss": -11.969017028808594, "global_step": 283248, "epoch": 1686} {"train_loss": -12.103522300720215, "global_step": 283249, "epoch": 1686} {"train_loss": -11.709589004516602, "global_step": 283250, "epoch": 1686} {"train_loss": -12.095388412475586, "global_step": 283251, "epoch": 1686} {"train_loss": -11.275300979614258, "global_step": 283252, "epoch": 1686} {"train_loss": -11.489801406860352, "global_step": 283253, "epoch": 1686} {"train_loss": -12.115006446838379, "global_step": 283254, "epoch": 1686} {"train_loss": -11.778802871704102, "global_step": 283255, "epoch": 1686} {"train_loss": -11.56047248840332, "global_step": 283256, "epoch": 1686} {"train_loss": -12.045019149780273, "global_step": 283257, "epoch": 1686} {"train_loss": -11.67922592163086, "global_step": 283258, "epoch": 1686} {"train_loss": -11.879999160766602, "global_step": 283259, "epoch": 1686} {"train_loss": -11.69640827178955, "global_step": 283260, "epoch": 1686} {"train_loss": -11.973002433776855, "global_step": 283261, "epoch": 1686} {"train_loss": -11.988201141357422, "global_step": 283262, "epoch": 1686} {"train_loss": -11.293810844421387, "global_step": 283263, "epoch": 1686} {"train_loss": -11.548824310302734, "global_step": 283264, "epoch": 1686} {"train_loss": -12.076475143432617, "global_step": 283265, "epoch": 1686} {"train_loss": -10.999427795410156, "global_step": 283266, "epoch": 1686} {"train_loss": -11.803277969360352, "global_step": 283267, "epoch": 1686} {"train_loss": -10.274322509765625, "global_step": 283268, "epoch": 1686} {"train_loss": -10.901877403259277, "global_step": 283269, "epoch": 1686} {"train_loss": -11.352643966674805, "global_step": 283270, "epoch": 1686} {"train_loss": -10.820212364196777, "global_step": 283271, "epoch": 1686} {"train_loss": -11.522171020507812, "global_step": 283272, "epoch": 1686} {"train_loss": -10.505889892578125, "global_step": 283273, "epoch": 1686} {"train_loss": -11.590995788574219, "global_step": 283274, "epoch": 1686} {"train_loss": -11.133807182312012, "global_step": 283275, "epoch": 1686} {"train_loss": -10.69798469543457, "global_step": 283276, "epoch": 1686} {"train_loss": -11.767629623413086, "global_step": 283277, "epoch": 1686} {"train_loss": -10.618237495422363, "global_step": 283278, "epoch": 1686} {"train_loss": -11.013758659362793, "global_step": 283279, "epoch": 1686} {"train_loss": -10.114008903503418, "global_step": 283280, "epoch": 1686} {"train_loss": -11.136819839477539, "global_step": 283281, "epoch": 1686} {"train_loss": -10.14689826965332, "global_step": 283282, "epoch": 1686} {"train_loss": -10.6756010055542, "global_step": 283283, "epoch": 1686} {"train_loss": -9.4649658203125, "global_step": 283284, "epoch": 1686} {"train_loss": -11.260787010192871, "global_step": 283285, "epoch": 1686} {"train_loss": -8.921259880065918, "global_step": 283286, "epoch": 1686} {"train_loss": -11.422168731689453, "global_step": 283287, "epoch": 1686} {"train_loss": -9.617986679077148, "global_step": 283288, "epoch": 1686} {"train_loss": -9.920531272888184, "global_step": 283289, "epoch": 1686} {"train_loss": -10.215333938598633, "global_step": 283290, "epoch": 1686} {"train_loss": -8.655364990234375, "global_step": 283291, "epoch": 1686} {"train_loss": -10.436563491821289, "global_step": 283292, "epoch": 1686} {"train_loss": -10.489520072937012, "global_step": 283293, "epoch": 1686} {"train_loss": -10.957935333251953, "global_step": 283294, "epoch": 1686} {"train_loss": -9.694191932678223, "global_step": 283295, "epoch": 1686} {"train_loss": -10.978742599487305, "global_step": 283296, "epoch": 1686} {"train_loss": -11.027719497680664, "global_step": 283297, "epoch": 1686} {"train_loss": -10.190740585327148, "global_step": 283298, "epoch": 1686} {"train_loss": -11.262505531311035, "global_step": 283299, "epoch": 1686} {"train_loss": -10.921162605285645, "global_step": 283300, "epoch": 1686} {"train_loss": -10.529047012329102, "global_step": 283301, "epoch": 1686} {"train_loss": -11.472835540771484, "global_step": 283302, "epoch": 1686} {"train_loss": -11.42994499206543, "global_step": 283303, "epoch": 1686} {"train_loss": -10.927509307861328, "global_step": 283304, "epoch": 1686} {"train_loss": -11.43419075012207, "global_step": 283305, "epoch": 1686} {"train_loss": -11.510461807250977, "global_step": 283306, "epoch": 1686} {"train_loss": -10.899879455566406, "global_step": 283307, "epoch": 1686} {"train_loss": -11.572175979614258, "global_step": 283308, "epoch": 1686} {"train_loss": -11.452544212341309, "global_step": 283309, "epoch": 1686} {"train_loss": -10.954854965209961, "global_step": 283310, "epoch": 1686} {"train_loss": -11.368391990661621, "global_step": 283311, "epoch": 1686} {"train_loss": -11.594404220581055, "global_step": 283312, "epoch": 1686} {"train_loss": -11.569766998291016, "global_step": 283313, "epoch": 1686} {"train_loss": -11.436790466308594, "global_step": 283314, "epoch": 1686} {"train_loss": -11.713438034057617, "global_step": 283315, "epoch": 1686} {"train_loss": -11.693987846374512, "global_step": 283316, "epoch": 1686} {"train_loss": -11.055234909057617, "global_step": 283317, "epoch": 1686} {"train_loss": -11.8923921585083, "global_step": 283318, "epoch": 1686} {"train_loss": -11.514808654785156, "global_step": 283319, "epoch": 1686} {"train_loss": -11.691530227661133, "global_step": 283320, "epoch": 1686} {"train_loss": -11.730698585510254, "global_step": 283321, "epoch": 1686} {"train_loss": -11.754241943359375, "global_step": 283322, "epoch": 1686} {"train_loss": -11.567707061767578, "global_step": 283323, "epoch": 1686} {"train_loss": -11.673344612121582, "global_step": 283324, "epoch": 1686} {"train_loss": -11.928478240966797, "global_step": 283325, "epoch": 1686} {"train_loss": -11.44736099243164, "global_step": 283326, "epoch": 1686} {"train_loss": -11.873566627502441, "global_step": 283327, "epoch": 1686} {"train_loss": -11.870783805847168, "global_step": 283328, "epoch": 1686} {"train_loss": -11.507786750793457, "global_step": 283329, "epoch": 1686} {"train_loss": -11.951881408691406, "global_step": 283330, "epoch": 1686} {"train_loss": -11.612393379211426, "global_step": 283331, "epoch": 1686} {"train_loss": -11.935236930847168, "global_step": 283332, "epoch": 1686} {"train_loss": -11.870857238769531, "global_step": 283333, "epoch": 1686} {"train_loss": -11.999076843261719, "global_step": 283334, "epoch": 1686} {"train_loss": -11.930782318115234, "global_step": 283335, "epoch": 1686} {"train_loss": -11.774272918701172, "global_step": 283336, "epoch": 1686} {"train_loss": -12.167064666748047, "global_step": 283337, "epoch": 1686} {"train_loss": -11.763445854187012, "global_step": 283338, "epoch": 1686} {"train_loss": -11.9376859664917, "global_step": 283339, "epoch": 1686} {"train_loss": -11.82815170288086, "global_step": 283340, "epoch": 1686} {"train_loss": -11.594671249389648, "global_step": 283341, "epoch": 1686} {"train_loss": -12.044713973999023, "global_step": 283342, "epoch": 1686} {"train_loss": -11.617326736450195, "global_step": 283343, "epoch": 1686} {"train_loss": -11.96578598022461, "global_step": 283344, "epoch": 1686} {"train_loss": -11.69674301147461, "global_step": 283345, "epoch": 1686} {"train_loss": -12.213181495666504, "global_step": 283346, "epoch": 1686} {"train_loss": -12.008076667785645, "global_step": 283347, "epoch": 1686} {"train_loss": -11.998723983764648, "global_step": 283348, "epoch": 1686} {"train_loss": -12.027750968933105, "global_step": 283349, "epoch": 1686} {"train_loss": -11.875041961669922, "global_step": 283350, "epoch": 1686} {"train_loss": -11.818985939025879, "global_step": 283351, "epoch": 1686} {"train_loss": -11.982420921325684, "global_step": 283352, "epoch": 1686} {"train_loss": -12.05001449584961, "global_step": 283353, "epoch": 1686} {"train_loss": -11.720239639282227, "global_step": 283354, "epoch": 1686} {"train_loss": -12.17287826538086, "global_step": 283355, "epoch": 1686} {"train_loss": -11.436077117919922, "global_step": 283356, "epoch": 1686} {"train_loss": -12.028068542480469, "global_step": 283357, "epoch": 1686} {"train_loss": -12.120599746704102, "global_step": 283358, "epoch": 1686} {"train_loss": -11.741193771362305, "global_step": 283359, "epoch": 1686} {"train_loss": -11.821765899658203, "global_step": 283360, "epoch": 1686} {"train_loss": -12.24953842163086, "global_step": 283361, "epoch": 1686} {"train_loss": -12.21853256225586, "global_step": 283362, "epoch": 1686} {"train_loss": -12.029869079589844, "global_step": 283363, "epoch": 1686} {"train_loss": -12.239914894104004, "global_step": 283364, "epoch": 1686} {"train_loss": -12.12834358215332, "global_step": 283365, "epoch": 1686} {"train_loss": -12.159709930419922, "global_step": 283366, "epoch": 1686} {"train_loss": -12.277178764343262, "global_step": 283367, "epoch": 1686} {"train_loss": -12.314998626708984, "global_step": 283368, "epoch": 1686} {"train_loss": -12.226655006408691, "global_step": 283369, "epoch": 1686} {"train_loss": -12.059776306152344, "global_step": 283370, "epoch": 1686} {"train_loss": -11.961607933044434, "global_step": 283371, "epoch": 1686} {"train_loss": -12.412853240966797, "global_step": 283372, "epoch": 1686} {"train_loss": -12.029064178466797, "global_step": 283373, "epoch": 1686} {"train_loss": -11.450902938842773, "global_step": 283374, "epoch": 1686} {"train_loss": -11.78165340423584, "global_step": 283375, "epoch": 1686} {"train_loss": -12.324746131896973, "global_step": 283376, "epoch": 1686} {"train_loss": -11.648120880126953, "global_step": 283377, "epoch": 1686} {"train_loss": -11.124472618103027, "global_step": 283378, "epoch": 1686} {"train_loss": -11.769935607910156, "global_step": 283379, "epoch": 1686} {"train_loss": -11.871883392333984, "global_step": 283380, "epoch": 1686} {"train_loss": -12.158382415771484, "global_step": 283381, "epoch": 1686} {"train_loss": -11.364694595336914, "global_step": 283382, "epoch": 1686} {"train_loss": -11.956110954284668, "global_step": 283383, "epoch": 1686} {"train_loss": -12.025402069091797, "global_step": 283384, "epoch": 1686} {"train_loss": -12.026840209960938, "global_step": 283385, "epoch": 1686} {"train_loss": -12.251948356628418, "global_step": 283386, "epoch": 1686} {"train_loss": -11.394537925720215, "global_step": 283387, "epoch": 1686} {"train_loss": -11.230173110961914, "global_step": 283388, "epoch": 1686} {"train_loss": -11.641576766967773, "global_step": 283389, "epoch": 1686} {"train_loss": -11.542388916015625, "global_step": 283390, "epoch": 1686} {"train_loss": -9.77043628692627, "global_step": 283391, "epoch": 1686} {"train_loss": -10.5348482131958, "global_step": 283392, "epoch": 1686} {"train_loss": -11.911407470703125, "global_step": 283393, "epoch": 1686} {"train_loss": -8.936433792114258, "global_step": 283394, "epoch": 1686} {"train_loss": -10.516399383544922, "global_step": 283395, "epoch": 1686} {"train_loss": -9.89017105102539, "global_step": 283396, "epoch": 1686} {"train_loss": -9.295087814331055, "global_step": 283397, "epoch": 1686} {"train_loss": -10.833234786987305, "global_step": 283398, "epoch": 1686} {"train_loss": -10.178096771240234, "global_step": 283399, "epoch": 1686} {"train_loss": -10.946083068847656, "global_step": 283400, "epoch": 1686} {"train_loss": -10.23948860168457, "global_step": 283401, "epoch": 1686} {"train_loss": -11.440818786621094, "global_step": 283402, "epoch": 1686} {"train_loss": -9.816243171691895, "global_step": 283403, "epoch": 1686} {"train_loss": -10.005680084228516, "global_step": 283404, "epoch": 1686} {"train_loss": -10.837337493896484, "global_step": 283405, "epoch": 1686} {"train_loss": -8.348197937011719, "global_step": 283406, "epoch": 1686} {"train_loss": -9.930072784423828, "global_step": 283407, "epoch": 1686} {"train_loss": -10.899938583374023, "global_step": 283408, "epoch": 1686} {"train_loss": -10.383901596069336, "global_step": 283409, "epoch": 1686} {"train_loss": -10.786364555358887, "global_step": 283410, "epoch": 1686} {"train_loss": -11.369888305664062, "global_step": 283411, "epoch": 1686} {"train_loss": -10.419172286987305, "global_step": 283412, "epoch": 1686} {"train_loss": -11.723631858825684, "global_step": 283413, "epoch": 1686} {"train_loss": -10.987679481506348, "global_step": 283414, "epoch": 1686} {"train_loss": -11.341108838717142, "global_step": 283415, "epoch": 1686, "val_loss": 278428.59375} {"train_loss": -11.141142845153809, "global_step": 283416, "epoch": 1687} {"train_loss": -10.866302490234375, "global_step": 283417, "epoch": 1687} {"train_loss": -11.597753524780273, "global_step": 283418, "epoch": 1687} {"train_loss": -11.038225173950195, "global_step": 283419, "epoch": 1687} {"train_loss": -11.110960006713867, "global_step": 283420, "epoch": 1687} {"train_loss": -10.98362922668457, "global_step": 283421, "epoch": 1687} {"train_loss": -11.216743469238281, "global_step": 283422, "epoch": 1687} {"train_loss": -10.765318870544434, "global_step": 283423, "epoch": 1687} {"train_loss": -11.751148223876953, "global_step": 283424, "epoch": 1687} {"train_loss": -10.586048126220703, "global_step": 283425, "epoch": 1687} {"train_loss": -11.688618659973145, "global_step": 283426, "epoch": 1687} {"train_loss": -10.996253967285156, "global_step": 283427, "epoch": 1687} {"train_loss": -11.80705451965332, "global_step": 283428, "epoch": 1687} {"train_loss": -11.263105392456055, "global_step": 283429, "epoch": 1687} {"train_loss": -11.573969841003418, "global_step": 283430, "epoch": 1687} {"train_loss": -11.257527351379395, "global_step": 283431, "epoch": 1687} {"train_loss": -11.571941375732422, "global_step": 283432, "epoch": 1687} {"train_loss": -11.59713363647461, "global_step": 283433, "epoch": 1687} {"train_loss": -11.810659408569336, "global_step": 283434, "epoch": 1687} {"train_loss": -11.710174560546875, "global_step": 283435, "epoch": 1687} {"train_loss": -11.847399711608887, "global_step": 283436, "epoch": 1687} {"train_loss": -11.772664070129395, "global_step": 283437, "epoch": 1687} {"train_loss": -11.728437423706055, "global_step": 283438, "epoch": 1687} {"train_loss": -11.667497634887695, "global_step": 283439, "epoch": 1687} {"train_loss": -11.846820831298828, "global_step": 283440, "epoch": 1687} {"train_loss": -11.529258728027344, "global_step": 283441, "epoch": 1687} {"train_loss": -11.746392250061035, "global_step": 283442, "epoch": 1687} {"train_loss": -11.744104385375977, "global_step": 283443, "epoch": 1687} {"train_loss": -11.915407180786133, "global_step": 283444, "epoch": 1687} {"train_loss": -11.58160400390625, "global_step": 283445, "epoch": 1687} {"train_loss": -12.037044525146484, "global_step": 283446, "epoch": 1687} {"train_loss": -11.772340774536133, "global_step": 283447, "epoch": 1687} {"train_loss": -12.090799331665039, "global_step": 283448, "epoch": 1687} {"train_loss": -11.914413452148438, "global_step": 283449, "epoch": 1687} {"train_loss": -11.932979583740234, "global_step": 283450, "epoch": 1687} {"train_loss": -12.010261535644531, "global_step": 283451, "epoch": 1687} {"train_loss": -11.804851531982422, "global_step": 283452, "epoch": 1687} {"train_loss": -11.8927583694458, "global_step": 283453, "epoch": 1687} {"train_loss": -11.943361282348633, "global_step": 283454, "epoch": 1687} {"train_loss": -12.073884010314941, "global_step": 283455, "epoch": 1687} {"train_loss": -12.121188163757324, "global_step": 283456, "epoch": 1687} {"train_loss": -11.949905395507812, "global_step": 283457, "epoch": 1687} {"train_loss": -11.998642921447754, "global_step": 283458, "epoch": 1687} {"train_loss": -11.83163070678711, "global_step": 283459, "epoch": 1687} {"train_loss": -12.129780769348145, "global_step": 283460, "epoch": 1687} {"train_loss": -12.070982933044434, "global_step": 283461, "epoch": 1687} {"train_loss": -12.109346389770508, "global_step": 283462, "epoch": 1687} {"train_loss": -12.093559265136719, "global_step": 283463, "epoch": 1687} {"train_loss": -12.23128890991211, "global_step": 283464, "epoch": 1687} {"train_loss": -12.082837104797363, "global_step": 283465, "epoch": 1687} {"train_loss": -12.025489807128906, "global_step": 283466, "epoch": 1687} {"train_loss": -12.066933631896973, "global_step": 283467, "epoch": 1687} {"train_loss": -12.335833549499512, "global_step": 283468, "epoch": 1687} {"train_loss": -12.181316375732422, "global_step": 283469, "epoch": 1687} {"train_loss": -12.218559265136719, "global_step": 283470, "epoch": 1687} {"train_loss": -12.277796745300293, "global_step": 283471, "epoch": 1687} {"train_loss": -12.050436019897461, "global_step": 283472, "epoch": 1687} {"train_loss": -12.303688049316406, "global_step": 283473, "epoch": 1687} {"train_loss": -12.306766510009766, "global_step": 283474, "epoch": 1687} {"train_loss": -12.199189186096191, "global_step": 283475, "epoch": 1687} {"train_loss": -12.183425903320312, "global_step": 283476, "epoch": 1687} {"train_loss": -12.298757553100586, "global_step": 283477, "epoch": 1687} {"train_loss": -12.278066635131836, "global_step": 283478, "epoch": 1687} {"train_loss": -12.155637741088867, "global_step": 283479, "epoch": 1687} {"train_loss": -12.356500625610352, "global_step": 283480, "epoch": 1687} {"train_loss": -12.156965255737305, "global_step": 283481, "epoch": 1687} {"train_loss": -12.043610572814941, "global_step": 283482, "epoch": 1687} {"train_loss": -12.337516784667969, "global_step": 283483, "epoch": 1687} {"train_loss": -12.245145797729492, "global_step": 283484, "epoch": 1687} {"train_loss": -11.938739776611328, "global_step": 283485, "epoch": 1687} {"train_loss": -12.427534103393555, "global_step": 283486, "epoch": 1687} {"train_loss": -12.021843910217285, "global_step": 283487, "epoch": 1687} {"train_loss": -12.326313018798828, "global_step": 283488, "epoch": 1687} {"train_loss": -12.000420570373535, "global_step": 283489, "epoch": 1687} {"train_loss": -11.968952178955078, "global_step": 283490, "epoch": 1687} {"train_loss": -12.076766967773438, "global_step": 283491, "epoch": 1687} {"train_loss": -12.352827072143555, "global_step": 283492, "epoch": 1687} {"train_loss": -12.404519081115723, "global_step": 283493, "epoch": 1687} {"train_loss": -12.400476455688477, "global_step": 283494, "epoch": 1687} {"train_loss": -12.237709045410156, "global_step": 283495, "epoch": 1687} {"train_loss": -12.416945457458496, "global_step": 283496, "epoch": 1687} {"train_loss": -12.323326110839844, "global_step": 283497, "epoch": 1687} {"train_loss": -12.149087905883789, "global_step": 283498, "epoch": 1687} {"train_loss": -12.329019546508789, "global_step": 283499, "epoch": 1687} {"train_loss": -12.366989135742188, "global_step": 283500, "epoch": 1687} {"train_loss": -12.294086456298828, "global_step": 283501, "epoch": 1687} {"train_loss": -12.329898834228516, "global_step": 283502, "epoch": 1687} {"train_loss": -12.357948303222656, "global_step": 283503, "epoch": 1687} {"train_loss": -12.19459056854248, "global_step": 283504, "epoch": 1687} {"train_loss": -12.270784378051758, "global_step": 283505, "epoch": 1687} {"train_loss": -12.353992462158203, "global_step": 283506, "epoch": 1687} {"train_loss": -12.104202270507812, "global_step": 283507, "epoch": 1687} {"train_loss": -12.311418533325195, "global_step": 283508, "epoch": 1687} {"train_loss": -12.108139038085938, "global_step": 283509, "epoch": 1687} {"train_loss": -12.537610054016113, "global_step": 283510, "epoch": 1687} {"train_loss": -12.060422897338867, "global_step": 283511, "epoch": 1687} {"train_loss": -12.427115440368652, "global_step": 283512, "epoch": 1687} {"train_loss": -12.214631080627441, "global_step": 283513, "epoch": 1687} {"train_loss": -12.231939315795898, "global_step": 283514, "epoch": 1687} {"train_loss": -11.574831008911133, "global_step": 283515, "epoch": 1687} {"train_loss": -11.955265045166016, "global_step": 283516, "epoch": 1687} {"train_loss": -12.155545234680176, "global_step": 283517, "epoch": 1687} {"train_loss": -11.585628509521484, "global_step": 283518, "epoch": 1687} {"train_loss": -11.590280532836914, "global_step": 283519, "epoch": 1687} {"train_loss": -11.228165626525879, "global_step": 283520, "epoch": 1687} {"train_loss": -10.765131950378418, "global_step": 283521, "epoch": 1687} {"train_loss": -12.055082321166992, "global_step": 283522, "epoch": 1687} {"train_loss": -10.084466934204102, "global_step": 283523, "epoch": 1687} {"train_loss": -10.955320358276367, "global_step": 283524, "epoch": 1687} {"train_loss": -11.608415603637695, "global_step": 283525, "epoch": 1687} {"train_loss": -10.50234317779541, "global_step": 283526, "epoch": 1687} {"train_loss": -10.091899871826172, "global_step": 283527, "epoch": 1687} {"train_loss": -11.847799301147461, "global_step": 283528, "epoch": 1687} {"train_loss": -10.452043533325195, "global_step": 283529, "epoch": 1687} {"train_loss": -9.42129135131836, "global_step": 283530, "epoch": 1687} {"train_loss": -10.309614181518555, "global_step": 283531, "epoch": 1687} {"train_loss": -11.110730171203613, "global_step": 283532, "epoch": 1687} {"train_loss": -9.87678050994873, "global_step": 283533, "epoch": 1687} {"train_loss": -10.047079086303711, "global_step": 283534, "epoch": 1687} {"train_loss": -11.461015701293945, "global_step": 283535, "epoch": 1687} {"train_loss": -10.784738540649414, "global_step": 283536, "epoch": 1687} {"train_loss": -11.37281322479248, "global_step": 283537, "epoch": 1687} {"train_loss": -9.904747009277344, "global_step": 283538, "epoch": 1687} {"train_loss": -9.226563453674316, "global_step": 283539, "epoch": 1687} {"train_loss": -10.254154205322266, "global_step": 283540, "epoch": 1687} {"train_loss": -10.248043060302734, "global_step": 283541, "epoch": 1687} {"train_loss": -10.692968368530273, "global_step": 283542, "epoch": 1687} {"train_loss": -10.349750518798828, "global_step": 283543, "epoch": 1687} {"train_loss": -11.029366493225098, "global_step": 283544, "epoch": 1687} {"train_loss": -10.668359756469727, "global_step": 283545, "epoch": 1687} {"train_loss": -11.36402702331543, "global_step": 283546, "epoch": 1687} {"train_loss": -10.947103500366211, "global_step": 283547, "epoch": 1687} {"train_loss": -11.503623962402344, "global_step": 283548, "epoch": 1687} {"train_loss": -10.923120498657227, "global_step": 283549, "epoch": 1687} {"train_loss": -11.128355026245117, "global_step": 283550, "epoch": 1687} {"train_loss": -10.964072227478027, "global_step": 283551, "epoch": 1687} {"train_loss": -11.626805305480957, "global_step": 283552, "epoch": 1687} {"train_loss": -11.09239387512207, "global_step": 283553, "epoch": 1687} {"train_loss": -11.159952163696289, "global_step": 283554, "epoch": 1687} {"train_loss": -11.027486801147461, "global_step": 283555, "epoch": 1687} {"train_loss": -11.291772842407227, "global_step": 283556, "epoch": 1687} {"train_loss": -10.930513381958008, "global_step": 283557, "epoch": 1687} {"train_loss": -11.507309913635254, "global_step": 283558, "epoch": 1687} {"train_loss": -11.310522079467773, "global_step": 283559, "epoch": 1687} {"train_loss": -11.648124694824219, "global_step": 283560, "epoch": 1687} {"train_loss": -11.33022403717041, "global_step": 283561, "epoch": 1687} {"train_loss": -11.467601776123047, "global_step": 283562, "epoch": 1687} {"train_loss": -11.485109329223633, "global_step": 283563, "epoch": 1687} {"train_loss": -11.844993591308594, "global_step": 283564, "epoch": 1687} {"train_loss": -11.620772361755371, "global_step": 283565, "epoch": 1687} {"train_loss": -11.876799583435059, "global_step": 283566, "epoch": 1687} {"train_loss": -11.491715431213379, "global_step": 283567, "epoch": 1687} {"train_loss": -11.515414237976074, "global_step": 283568, "epoch": 1687} {"train_loss": -11.61229419708252, "global_step": 283569, "epoch": 1687} {"train_loss": -11.296283721923828, "global_step": 283570, "epoch": 1687} {"train_loss": -11.737239837646484, "global_step": 283571, "epoch": 1687} {"train_loss": -11.458765983581543, "global_step": 283572, "epoch": 1687} {"train_loss": -11.91089153289795, "global_step": 283573, "epoch": 1687} {"train_loss": -11.619270324707031, "global_step": 283574, "epoch": 1687} {"train_loss": -12.060920715332031, "global_step": 283575, "epoch": 1687} {"train_loss": -11.681249618530273, "global_step": 283576, "epoch": 1687} {"train_loss": -11.479360580444336, "global_step": 283577, "epoch": 1687} {"train_loss": -11.523361206054688, "global_step": 283578, "epoch": 1687} {"train_loss": -11.320487976074219, "global_step": 283579, "epoch": 1687} {"train_loss": -11.359701156616211, "global_step": 283580, "epoch": 1687} {"train_loss": -11.864028930664062, "global_step": 283581, "epoch": 1687} {"train_loss": -11.498506546020508, "global_step": 283582, "epoch": 1687} {"train_loss": -11.628768818719047, "global_step": 283583, "epoch": 1687, "val_loss": 276195.53125} {"train_loss": -11.52580451965332, "global_step": 283584, "epoch": 1688} {"train_loss": -11.620807647705078, "global_step": 283585, "epoch": 1688} {"train_loss": -11.181024551391602, "global_step": 283586, "epoch": 1688} {"train_loss": -11.767369270324707, "global_step": 283587, "epoch": 1688} {"train_loss": -11.67031478881836, "global_step": 283588, "epoch": 1688} {"train_loss": -11.942750930786133, "global_step": 283589, "epoch": 1688} {"train_loss": -11.680259704589844, "global_step": 283590, "epoch": 1688} {"train_loss": -11.628517150878906, "global_step": 283591, "epoch": 1688} {"train_loss": -11.868282318115234, "global_step": 283592, "epoch": 1688} {"train_loss": -11.293289184570312, "global_step": 283593, "epoch": 1688} {"train_loss": -11.935563087463379, "global_step": 283594, "epoch": 1688} {"train_loss": -11.770377159118652, "global_step": 283595, "epoch": 1688} {"train_loss": -11.714370727539062, "global_step": 283596, "epoch": 1688} {"train_loss": -11.931300163269043, "global_step": 283597, "epoch": 1688} {"train_loss": -11.6892671585083, "global_step": 283598, "epoch": 1688} {"train_loss": -12.14431381225586, "global_step": 283599, "epoch": 1688} {"train_loss": -11.991243362426758, "global_step": 283600, "epoch": 1688} {"train_loss": -11.90924072265625, "global_step": 283601, "epoch": 1688} {"train_loss": -12.001677513122559, "global_step": 283602, "epoch": 1688} {"train_loss": -12.001893997192383, "global_step": 283603, "epoch": 1688} {"train_loss": -12.175257682800293, "global_step": 283604, "epoch": 1688} {"train_loss": -11.777993202209473, "global_step": 283605, "epoch": 1688} {"train_loss": -11.936521530151367, "global_step": 283606, "epoch": 1688} {"train_loss": -11.9066743850708, "global_step": 283607, "epoch": 1688} {"train_loss": -12.193838119506836, "global_step": 283608, "epoch": 1688} {"train_loss": -12.003122329711914, "global_step": 283609, "epoch": 1688} {"train_loss": -12.100713729858398, "global_step": 283610, "epoch": 1688} {"train_loss": -11.869672775268555, "global_step": 283611, "epoch": 1688} {"train_loss": -11.880691528320312, "global_step": 283612, "epoch": 1688} {"train_loss": -12.004972457885742, "global_step": 283613, "epoch": 1688} {"train_loss": -11.444890975952148, "global_step": 283614, "epoch": 1688} {"train_loss": -11.955179214477539, "global_step": 283615, "epoch": 1688} {"train_loss": -11.812021255493164, "global_step": 283616, "epoch": 1688} {"train_loss": -11.556732177734375, "global_step": 283617, "epoch": 1688} {"train_loss": -11.882657051086426, "global_step": 283618, "epoch": 1688} {"train_loss": -11.937901496887207, "global_step": 283619, "epoch": 1688} {"train_loss": -11.816751480102539, "global_step": 283620, "epoch": 1688} {"train_loss": -11.833197593688965, "global_step": 283621, "epoch": 1688} {"train_loss": -11.734573364257812, "global_step": 283622, "epoch": 1688} {"train_loss": -12.00745964050293, "global_step": 283623, "epoch": 1688} {"train_loss": -12.009612083435059, "global_step": 283624, "epoch": 1688} {"train_loss": -12.03614616394043, "global_step": 283625, "epoch": 1688} {"train_loss": -11.603214263916016, "global_step": 283626, "epoch": 1688} {"train_loss": -12.016641616821289, "global_step": 283627, "epoch": 1688} {"train_loss": -11.860407829284668, "global_step": 283628, "epoch": 1688} {"train_loss": -12.345817565917969, "global_step": 283629, "epoch": 1688} {"train_loss": -12.04364013671875, "global_step": 283630, "epoch": 1688} {"train_loss": -12.063711166381836, "global_step": 283631, "epoch": 1688} {"train_loss": -11.956304550170898, "global_step": 283632, "epoch": 1688} {"train_loss": -12.212108612060547, "global_step": 283633, "epoch": 1688} {"train_loss": -11.927303314208984, "global_step": 283634, "epoch": 1688} {"train_loss": -12.02248477935791, "global_step": 283635, "epoch": 1688} {"train_loss": -11.92611312866211, "global_step": 283636, "epoch": 1688} {"train_loss": -12.052953720092773, "global_step": 283637, "epoch": 1688} {"train_loss": -11.935405731201172, "global_step": 283638, "epoch": 1688} {"train_loss": -11.772411346435547, "global_step": 283639, "epoch": 1688} {"train_loss": -12.317253112792969, "global_step": 283640, "epoch": 1688} {"train_loss": -11.822107315063477, "global_step": 283641, "epoch": 1688} {"train_loss": -12.11552906036377, "global_step": 283642, "epoch": 1688} {"train_loss": -11.593118667602539, "global_step": 283643, "epoch": 1688} {"train_loss": -11.871501922607422, "global_step": 283644, "epoch": 1688} {"train_loss": -11.664661407470703, "global_step": 283645, "epoch": 1688} {"train_loss": -12.132311820983887, "global_step": 283646, "epoch": 1688} {"train_loss": -11.74941635131836, "global_step": 283647, "epoch": 1688} {"train_loss": -11.7306547164917, "global_step": 283648, "epoch": 1688} {"train_loss": -12.262048721313477, "global_step": 283649, "epoch": 1688} {"train_loss": -11.609612464904785, "global_step": 283650, "epoch": 1688} {"train_loss": -12.229026794433594, "global_step": 283651, "epoch": 1688} {"train_loss": -12.035682678222656, "global_step": 283652, "epoch": 1688} {"train_loss": -12.146598815917969, "global_step": 283653, "epoch": 1688} {"train_loss": -11.947663307189941, "global_step": 283654, "epoch": 1688} {"train_loss": -11.68303108215332, "global_step": 283655, "epoch": 1688} {"train_loss": -12.096124649047852, "global_step": 283656, "epoch": 1688} {"train_loss": -11.821752548217773, "global_step": 283657, "epoch": 1688} {"train_loss": -12.294696807861328, "global_step": 283658, "epoch": 1688} {"train_loss": -11.788429260253906, "global_step": 283659, "epoch": 1688} {"train_loss": -12.356969833374023, "global_step": 283660, "epoch": 1688} {"train_loss": -12.134133338928223, "global_step": 283661, "epoch": 1688} {"train_loss": -12.227453231811523, "global_step": 283662, "epoch": 1688} {"train_loss": -12.015013694763184, "global_step": 283663, "epoch": 1688} {"train_loss": -12.352521896362305, "global_step": 283664, "epoch": 1688} {"train_loss": -12.011323928833008, "global_step": 283665, "epoch": 1688} {"train_loss": -10.97445297241211, "global_step": 283666, "epoch": 1688} {"train_loss": -11.672060012817383, "global_step": 283667, "epoch": 1688} {"train_loss": -12.236961364746094, "global_step": 283668, "epoch": 1688} {"train_loss": -11.541519165039062, "global_step": 283669, "epoch": 1688} {"train_loss": -11.798908233642578, "global_step": 283670, "epoch": 1688} {"train_loss": -12.412817001342773, "global_step": 283671, "epoch": 1688} {"train_loss": -11.789815902709961, "global_step": 283672, "epoch": 1688} {"train_loss": -12.122373580932617, "global_step": 283673, "epoch": 1688} {"train_loss": -12.016263008117676, "global_step": 283674, "epoch": 1688} {"train_loss": -11.913043022155762, "global_step": 283675, "epoch": 1688} {"train_loss": -12.235000610351562, "global_step": 283676, "epoch": 1688} {"train_loss": -11.989870071411133, "global_step": 283677, "epoch": 1688} {"train_loss": -12.284191131591797, "global_step": 283678, "epoch": 1688} {"train_loss": -11.864163398742676, "global_step": 283679, "epoch": 1688} {"train_loss": -12.232808113098145, "global_step": 283680, "epoch": 1688} {"train_loss": -12.14193344116211, "global_step": 283681, "epoch": 1688} {"train_loss": -12.272871017456055, "global_step": 283682, "epoch": 1688} {"train_loss": -12.0324125289917, "global_step": 283683, "epoch": 1688} {"train_loss": -12.17600154876709, "global_step": 283684, "epoch": 1688} {"train_loss": -11.97024917602539, "global_step": 283685, "epoch": 1688} {"train_loss": -12.254240989685059, "global_step": 283686, "epoch": 1688} {"train_loss": -12.092256546020508, "global_step": 283687, "epoch": 1688} {"train_loss": -11.925765991210938, "global_step": 283688, "epoch": 1688} {"train_loss": -12.169214248657227, "global_step": 283689, "epoch": 1688} {"train_loss": -12.111249923706055, "global_step": 283690, "epoch": 1688} {"train_loss": -12.10175895690918, "global_step": 283691, "epoch": 1688} {"train_loss": -12.156204223632812, "global_step": 283692, "epoch": 1688} {"train_loss": -12.329317092895508, "global_step": 283693, "epoch": 1688} {"train_loss": -12.065107345581055, "global_step": 283694, "epoch": 1688} {"train_loss": -12.172800064086914, "global_step": 283695, "epoch": 1688} {"train_loss": -12.390103340148926, "global_step": 283696, "epoch": 1688} {"train_loss": -11.87864875793457, "global_step": 283697, "epoch": 1688} {"train_loss": -11.995830535888672, "global_step": 283698, "epoch": 1688} {"train_loss": -12.431455612182617, "global_step": 283699, "epoch": 1688} {"train_loss": -12.04678726196289, "global_step": 283700, "epoch": 1688} {"train_loss": -12.156562805175781, "global_step": 283701, "epoch": 1688} {"train_loss": -12.415497779846191, "global_step": 283702, "epoch": 1688} {"train_loss": -12.369060516357422, "global_step": 283703, "epoch": 1688} {"train_loss": -12.238662719726562, "global_step": 283704, "epoch": 1688} {"train_loss": -12.073806762695312, "global_step": 283705, "epoch": 1688} {"train_loss": -11.882978439331055, "global_step": 283706, "epoch": 1688} {"train_loss": -11.662059783935547, "global_step": 283707, "epoch": 1688} {"train_loss": -12.280746459960938, "global_step": 283708, "epoch": 1688} {"train_loss": -12.155860900878906, "global_step": 283709, "epoch": 1688} {"train_loss": -12.061942100524902, "global_step": 283710, "epoch": 1688} {"train_loss": -11.848718643188477, "global_step": 283711, "epoch": 1688} {"train_loss": -11.782069206237793, "global_step": 283712, "epoch": 1688} {"train_loss": -11.649286270141602, "global_step": 283713, "epoch": 1688} {"train_loss": -11.360095977783203, "global_step": 283714, "epoch": 1688} {"train_loss": -11.839597702026367, "global_step": 283715, "epoch": 1688} {"train_loss": -11.993921279907227, "global_step": 283716, "epoch": 1688} {"train_loss": -11.137434005737305, "global_step": 283717, "epoch": 1688} {"train_loss": -11.491081237792969, "global_step": 283718, "epoch": 1688} {"train_loss": -11.778125762939453, "global_step": 283719, "epoch": 1688} {"train_loss": -10.919657707214355, "global_step": 283720, "epoch": 1688} {"train_loss": -10.19111442565918, "global_step": 283721, "epoch": 1688} {"train_loss": -11.41970443725586, "global_step": 283722, "epoch": 1688} {"train_loss": -10.521415710449219, "global_step": 283723, "epoch": 1688} {"train_loss": -11.096517562866211, "global_step": 283724, "epoch": 1688} {"train_loss": -10.897979736328125, "global_step": 283725, "epoch": 1688} {"train_loss": -10.680816650390625, "global_step": 283726, "epoch": 1688} {"train_loss": -10.01382827758789, "global_step": 283727, "epoch": 1688} {"train_loss": -11.278308868408203, "global_step": 283728, "epoch": 1688} {"train_loss": -9.780206680297852, "global_step": 283729, "epoch": 1688} {"train_loss": -10.99748420715332, "global_step": 283730, "epoch": 1688} {"train_loss": -9.11902141571045, "global_step": 283731, "epoch": 1688} {"train_loss": -9.812349319458008, "global_step": 283732, "epoch": 1688} {"train_loss": -10.427513122558594, "global_step": 283733, "epoch": 1688} {"train_loss": -9.669622421264648, "global_step": 283734, "epoch": 1688} {"train_loss": -10.582269668579102, "global_step": 283735, "epoch": 1688} {"train_loss": -10.636003494262695, "global_step": 283736, "epoch": 1688} {"train_loss": -10.151642799377441, "global_step": 283737, "epoch": 1688} {"train_loss": -10.384283065795898, "global_step": 283738, "epoch": 1688} {"train_loss": -10.26743221282959, "global_step": 283739, "epoch": 1688} {"train_loss": -10.938382148742676, "global_step": 283740, "epoch": 1688} {"train_loss": -10.573650360107422, "global_step": 283741, "epoch": 1688} {"train_loss": -10.740217208862305, "global_step": 283742, "epoch": 1688} {"train_loss": -10.909133911132812, "global_step": 283743, "epoch": 1688} {"train_loss": -11.122836112976074, "global_step": 283744, "epoch": 1688} {"train_loss": -11.306727409362793, "global_step": 283745, "epoch": 1688} {"train_loss": -11.391975402832031, "global_step": 283746, "epoch": 1688} {"train_loss": -11.076166152954102, "global_step": 283747, "epoch": 1688} {"train_loss": -11.63845443725586, "global_step": 283748, "epoch": 1688} {"train_loss": -11.695562362670898, "global_step": 283749, "epoch": 1688} {"train_loss": -11.39328670501709, "global_step": 283750, "epoch": 1688} {"train_loss": -11.714450370697747, "global_step": 283751, "epoch": 1688, "val_loss": 273731.3125} {"train_loss": -11.286360740661621, "global_step": 283752, "epoch": 1689} {"train_loss": -11.754583358764648, "global_step": 283753, "epoch": 1689} {"train_loss": -11.584918022155762, "global_step": 283754, "epoch": 1689} {"train_loss": -11.767457962036133, "global_step": 283755, "epoch": 1689} {"train_loss": -11.499902725219727, "global_step": 283756, "epoch": 1689} {"train_loss": -11.403427124023438, "global_step": 283757, "epoch": 1689} {"train_loss": -11.997167587280273, "global_step": 283758, "epoch": 1689} {"train_loss": -11.378567695617676, "global_step": 283759, "epoch": 1689} {"train_loss": -11.898299217224121, "global_step": 283760, "epoch": 1689} {"train_loss": -11.586264610290527, "global_step": 283761, "epoch": 1689} {"train_loss": -11.669564247131348, "global_step": 283762, "epoch": 1689} {"train_loss": -11.639159202575684, "global_step": 283763, "epoch": 1689} {"train_loss": -11.467473983764648, "global_step": 283764, "epoch": 1689} {"train_loss": -11.491477012634277, "global_step": 283765, "epoch": 1689} {"train_loss": -11.883368492126465, "global_step": 283766, "epoch": 1689} {"train_loss": -11.028739929199219, "global_step": 283767, "epoch": 1689} {"train_loss": -11.606245040893555, "global_step": 283768, "epoch": 1689} {"train_loss": -11.277114868164062, "global_step": 283769, "epoch": 1689} {"train_loss": -11.42809009552002, "global_step": 283770, "epoch": 1689} {"train_loss": -11.576743125915527, "global_step": 283771, "epoch": 1689} {"train_loss": -11.189876556396484, "global_step": 283772, "epoch": 1689} {"train_loss": -11.324180603027344, "global_step": 283773, "epoch": 1689} {"train_loss": -11.234749794006348, "global_step": 283774, "epoch": 1689} {"train_loss": -11.695359230041504, "global_step": 283775, "epoch": 1689} {"train_loss": -10.829760551452637, "global_step": 283776, "epoch": 1689} {"train_loss": -11.77631950378418, "global_step": 283777, "epoch": 1689} {"train_loss": -10.996684074401855, "global_step": 283778, "epoch": 1689} {"train_loss": -11.850744247436523, "global_step": 283779, "epoch": 1689} {"train_loss": -11.446197509765625, "global_step": 283780, "epoch": 1689} {"train_loss": -11.170368194580078, "global_step": 283781, "epoch": 1689} {"train_loss": -11.784992218017578, "global_step": 283782, "epoch": 1689} {"train_loss": -11.207456588745117, "global_step": 283783, "epoch": 1689} {"train_loss": -11.552687644958496, "global_step": 283784, "epoch": 1689} {"train_loss": -10.903465270996094, "global_step": 283785, "epoch": 1689} {"train_loss": -10.428672790527344, "global_step": 283786, "epoch": 1689} {"train_loss": -11.364822387695312, "global_step": 283787, "epoch": 1689} {"train_loss": -10.972999572753906, "global_step": 283788, "epoch": 1689} {"train_loss": -11.126676559448242, "global_step": 283789, "epoch": 1689} {"train_loss": -11.145597457885742, "global_step": 283790, "epoch": 1689} {"train_loss": -10.638664245605469, "global_step": 283791, "epoch": 1689} {"train_loss": -11.661454200744629, "global_step": 283792, "epoch": 1689} {"train_loss": -10.747617721557617, "global_step": 283793, "epoch": 1689} {"train_loss": -11.88864517211914, "global_step": 283794, "epoch": 1689} {"train_loss": -11.2344331741333, "global_step": 283795, "epoch": 1689} {"train_loss": -11.895116806030273, "global_step": 283796, "epoch": 1689} {"train_loss": -11.507719039916992, "global_step": 283797, "epoch": 1689} {"train_loss": -11.522310256958008, "global_step": 283798, "epoch": 1689} {"train_loss": -11.629276275634766, "global_step": 283799, "epoch": 1689} {"train_loss": -11.746076583862305, "global_step": 283800, "epoch": 1689} {"train_loss": -11.815376281738281, "global_step": 283801, "epoch": 1689} {"train_loss": -11.627552032470703, "global_step": 283802, "epoch": 1689} {"train_loss": -11.83509635925293, "global_step": 283803, "epoch": 1689} {"train_loss": -11.880523681640625, "global_step": 283804, "epoch": 1689} {"train_loss": -11.744619369506836, "global_step": 283805, "epoch": 1689} {"train_loss": -11.658112525939941, "global_step": 283806, "epoch": 1689} {"train_loss": -11.600544929504395, "global_step": 283807, "epoch": 1689} {"train_loss": -11.635316848754883, "global_step": 283808, "epoch": 1689} {"train_loss": -11.943737030029297, "global_step": 283809, "epoch": 1689} {"train_loss": -11.787485122680664, "global_step": 283810, "epoch": 1689} {"train_loss": -11.930721282958984, "global_step": 283811, "epoch": 1689} {"train_loss": -11.932069778442383, "global_step": 283812, "epoch": 1689} {"train_loss": -12.0686616897583, "global_step": 283813, "epoch": 1689} {"train_loss": -11.670572280883789, "global_step": 283814, "epoch": 1689} {"train_loss": -12.05569076538086, "global_step": 283815, "epoch": 1689} {"train_loss": -11.82288932800293, "global_step": 283816, "epoch": 1689} {"train_loss": -11.964921951293945, "global_step": 283817, "epoch": 1689} {"train_loss": -11.675493240356445, "global_step": 283818, "epoch": 1689} {"train_loss": -11.982210159301758, "global_step": 283819, "epoch": 1689} {"train_loss": -11.879106521606445, "global_step": 283820, "epoch": 1689} {"train_loss": -11.923812866210938, "global_step": 283821, "epoch": 1689} {"train_loss": -12.059772491455078, "global_step": 283822, "epoch": 1689} {"train_loss": -11.911989212036133, "global_step": 283823, "epoch": 1689} {"train_loss": -11.790236473083496, "global_step": 283824, "epoch": 1689} {"train_loss": -12.140758514404297, "global_step": 283825, "epoch": 1689} {"train_loss": -12.179130554199219, "global_step": 283826, "epoch": 1689} {"train_loss": -12.033707618713379, "global_step": 283827, "epoch": 1689} {"train_loss": -12.070385932922363, "global_step": 283828, "epoch": 1689} {"train_loss": -12.238042831420898, "global_step": 283829, "epoch": 1689} {"train_loss": -11.961406707763672, "global_step": 283830, "epoch": 1689} {"train_loss": -12.340494155883789, "global_step": 283831, "epoch": 1689} {"train_loss": -12.284873962402344, "global_step": 283832, "epoch": 1689} {"train_loss": -11.956281661987305, "global_step": 283833, "epoch": 1689} {"train_loss": -12.396322250366211, "global_step": 283834, "epoch": 1689} {"train_loss": -12.280455589294434, "global_step": 283835, "epoch": 1689} {"train_loss": -12.121650695800781, "global_step": 283836, "epoch": 1689} {"train_loss": -12.109870910644531, "global_step": 283837, "epoch": 1689} {"train_loss": -12.189469337463379, "global_step": 283838, "epoch": 1689} {"train_loss": -12.118722915649414, "global_step": 283839, "epoch": 1689} {"train_loss": -12.27023696899414, "global_step": 283840, "epoch": 1689} {"train_loss": -11.986738204956055, "global_step": 283841, "epoch": 1689} {"train_loss": -12.254587173461914, "global_step": 283842, "epoch": 1689} {"train_loss": -12.16971492767334, "global_step": 283843, "epoch": 1689} {"train_loss": -12.16050910949707, "global_step": 283844, "epoch": 1689} {"train_loss": -12.327579498291016, "global_step": 283845, "epoch": 1689} {"train_loss": -12.093942642211914, "global_step": 283846, "epoch": 1689} {"train_loss": -12.274030685424805, "global_step": 283847, "epoch": 1689} {"train_loss": -12.363353729248047, "global_step": 283848, "epoch": 1689} {"train_loss": -12.07817268371582, "global_step": 283849, "epoch": 1689} {"train_loss": -12.145916938781738, "global_step": 283850, "epoch": 1689} {"train_loss": -12.066948890686035, "global_step": 283851, "epoch": 1689} {"train_loss": -12.48594856262207, "global_step": 283852, "epoch": 1689} {"train_loss": -12.355677604675293, "global_step": 283853, "epoch": 1689} {"train_loss": -12.489700317382812, "global_step": 283854, "epoch": 1689} {"train_loss": -12.35158920288086, "global_step": 283855, "epoch": 1689} {"train_loss": -12.162833213806152, "global_step": 283856, "epoch": 1689} {"train_loss": -12.305856704711914, "global_step": 283857, "epoch": 1689} {"train_loss": -12.34925651550293, "global_step": 283858, "epoch": 1689} {"train_loss": -12.329899787902832, "global_step": 283859, "epoch": 1689} {"train_loss": -12.541481018066406, "global_step": 283860, "epoch": 1689} {"train_loss": -12.377181053161621, "global_step": 283861, "epoch": 1689} {"train_loss": -11.951308250427246, "global_step": 283862, "epoch": 1689} {"train_loss": -12.332099914550781, "global_step": 283863, "epoch": 1689} {"train_loss": -12.267919540405273, "global_step": 283864, "epoch": 1689} {"train_loss": -12.454191207885742, "global_step": 283865, "epoch": 1689} {"train_loss": -12.48360824584961, "global_step": 283866, "epoch": 1689} {"train_loss": -12.3690767288208, "global_step": 283867, "epoch": 1689} {"train_loss": -12.478358268737793, "global_step": 283868, "epoch": 1689} {"train_loss": -12.34802532196045, "global_step": 283869, "epoch": 1689} {"train_loss": -12.436400413513184, "global_step": 283870, "epoch": 1689} {"train_loss": -12.455629348754883, "global_step": 283871, "epoch": 1689} {"train_loss": -12.392133712768555, "global_step": 283872, "epoch": 1689} {"train_loss": -12.150774955749512, "global_step": 283873, "epoch": 1689} {"train_loss": -12.579163551330566, "global_step": 283874, "epoch": 1689} {"train_loss": -12.544136047363281, "global_step": 283875, "epoch": 1689} {"train_loss": -12.495806694030762, "global_step": 283876, "epoch": 1689} {"train_loss": -11.9878568649292, "global_step": 283877, "epoch": 1689} {"train_loss": -12.218497276306152, "global_step": 283878, "epoch": 1689} {"train_loss": -11.583915710449219, "global_step": 283879, "epoch": 1689} {"train_loss": -11.091802597045898, "global_step": 283880, "epoch": 1689} {"train_loss": -11.896395683288574, "global_step": 283881, "epoch": 1689} {"train_loss": -11.5192232131958, "global_step": 283882, "epoch": 1689} {"train_loss": -11.324051856994629, "global_step": 283883, "epoch": 1689} {"train_loss": -10.300897598266602, "global_step": 283884, "epoch": 1689} {"train_loss": -11.464751243591309, "global_step": 283885, "epoch": 1689} {"train_loss": -10.450494766235352, "global_step": 283886, "epoch": 1689} {"train_loss": -9.42286205291748, "global_step": 283887, "epoch": 1689} {"train_loss": -10.839113235473633, "global_step": 283888, "epoch": 1689} {"train_loss": -10.380084991455078, "global_step": 283889, "epoch": 1689} {"train_loss": -11.689948081970215, "global_step": 283890, "epoch": 1689} {"train_loss": -9.889435768127441, "global_step": 283891, "epoch": 1689} {"train_loss": -11.385323524475098, "global_step": 283892, "epoch": 1689} {"train_loss": -11.228841781616211, "global_step": 283893, "epoch": 1689} {"train_loss": -10.832533836364746, "global_step": 283894, "epoch": 1689} {"train_loss": -10.552846908569336, "global_step": 283895, "epoch": 1689} {"train_loss": -11.771333694458008, "global_step": 283896, "epoch": 1689} {"train_loss": -10.26822280883789, "global_step": 283897, "epoch": 1689} {"train_loss": -10.343978881835938, "global_step": 283898, "epoch": 1689} {"train_loss": -11.53581428527832, "global_step": 283899, "epoch": 1689} {"train_loss": -10.739459991455078, "global_step": 283900, "epoch": 1689} {"train_loss": -10.164298057556152, "global_step": 283901, "epoch": 1689} {"train_loss": -10.97446346282959, "global_step": 283902, "epoch": 1689} {"train_loss": -11.259452819824219, "global_step": 283903, "epoch": 1689} {"train_loss": -10.819671630859375, "global_step": 283904, "epoch": 1689} {"train_loss": -11.708395004272461, "global_step": 283905, "epoch": 1689} {"train_loss": -11.167381286621094, "global_step": 283906, "epoch": 1689} {"train_loss": -11.037872314453125, "global_step": 283907, "epoch": 1689} {"train_loss": -11.436681747436523, "global_step": 283908, "epoch": 1689} {"train_loss": -10.867532730102539, "global_step": 283909, "epoch": 1689} {"train_loss": -10.934938430786133, "global_step": 283910, "epoch": 1689} {"train_loss": -10.819250106811523, "global_step": 283911, "epoch": 1689} {"train_loss": -10.782187461853027, "global_step": 283912, "epoch": 1689} {"train_loss": -11.096097946166992, "global_step": 283913, "epoch": 1689} {"train_loss": -10.8980073928833, "global_step": 283914, "epoch": 1689} {"train_loss": -11.41518783569336, "global_step": 283915, "epoch": 1689} {"train_loss": -11.072107315063477, "global_step": 283916, "epoch": 1689} {"train_loss": -11.273438453674316, "global_step": 283917, "epoch": 1689} {"train_loss": -11.222297668457031, "global_step": 283918, "epoch": 1689} {"train_loss": -11.645560537065778, "global_step": 283919, "epoch": 1689, "val_loss": 275919.65625} {"train_loss": -11.258960723876953, "global_step": 283920, "epoch": 1690} {"train_loss": -11.190044403076172, "global_step": 283921, "epoch": 1690} {"train_loss": -11.410146713256836, "global_step": 283922, "epoch": 1690} {"train_loss": -11.276437759399414, "global_step": 283923, "epoch": 1690} {"train_loss": -11.374238967895508, "global_step": 283924, "epoch": 1690} {"train_loss": -11.803651809692383, "global_step": 283925, "epoch": 1690} {"train_loss": -11.818710327148438, "global_step": 283926, "epoch": 1690} {"train_loss": -11.685096740722656, "global_step": 283927, "epoch": 1690} {"train_loss": -11.521392822265625, "global_step": 283928, "epoch": 1690} {"train_loss": -11.658629417419434, "global_step": 283929, "epoch": 1690} {"train_loss": -11.070241928100586, "global_step": 283930, "epoch": 1690} {"train_loss": -11.906654357910156, "global_step": 283931, "epoch": 1690} {"train_loss": -11.58726978302002, "global_step": 283932, "epoch": 1690} {"train_loss": -11.763093948364258, "global_step": 283933, "epoch": 1690} {"train_loss": -11.671464920043945, "global_step": 283934, "epoch": 1690} {"train_loss": -11.870784759521484, "global_step": 283935, "epoch": 1690} {"train_loss": -11.686906814575195, "global_step": 283936, "epoch": 1690} {"train_loss": -11.777480125427246, "global_step": 283937, "epoch": 1690} {"train_loss": -11.787094116210938, "global_step": 283938, "epoch": 1690} {"train_loss": -11.771319389343262, "global_step": 283939, "epoch": 1690} {"train_loss": -11.58543586730957, "global_step": 283940, "epoch": 1690} {"train_loss": -11.800989151000977, "global_step": 283941, "epoch": 1690} {"train_loss": -11.911800384521484, "global_step": 283942, "epoch": 1690} {"train_loss": -11.914423942565918, "global_step": 283943, "epoch": 1690} {"train_loss": -11.93497371673584, "global_step": 283944, "epoch": 1690} {"train_loss": -11.83449649810791, "global_step": 283945, "epoch": 1690} {"train_loss": -12.259428024291992, "global_step": 283946, "epoch": 1690} {"train_loss": -11.682540893554688, "global_step": 283947, "epoch": 1690} {"train_loss": -12.054512977600098, "global_step": 283948, "epoch": 1690} {"train_loss": -11.660245895385742, "global_step": 283949, "epoch": 1690} {"train_loss": -12.141075134277344, "global_step": 283950, "epoch": 1690} {"train_loss": -11.522056579589844, "global_step": 283951, "epoch": 1690} {"train_loss": -11.803552627563477, "global_step": 283952, "epoch": 1690} {"train_loss": -11.479684829711914, "global_step": 283953, "epoch": 1690} {"train_loss": -11.533059120178223, "global_step": 283954, "epoch": 1690} {"train_loss": -11.481802940368652, "global_step": 283955, "epoch": 1690} {"train_loss": -11.533191680908203, "global_step": 283956, "epoch": 1690} {"train_loss": -11.52027702331543, "global_step": 283957, "epoch": 1690} {"train_loss": -11.801307678222656, "global_step": 283958, "epoch": 1690} {"train_loss": -11.84577751159668, "global_step": 283959, "epoch": 1690} {"train_loss": -11.704172134399414, "global_step": 283960, "epoch": 1690} {"train_loss": -11.799858093261719, "global_step": 283961, "epoch": 1690} {"train_loss": -11.88764762878418, "global_step": 283962, "epoch": 1690} {"train_loss": -11.863080978393555, "global_step": 283963, "epoch": 1690} {"train_loss": -11.961528778076172, "global_step": 283964, "epoch": 1690} {"train_loss": -11.854623794555664, "global_step": 283965, "epoch": 1690} {"train_loss": -11.929939270019531, "global_step": 283966, "epoch": 1690} {"train_loss": -12.079389572143555, "global_step": 283967, "epoch": 1690} {"train_loss": -11.955035209655762, "global_step": 283968, "epoch": 1690} {"train_loss": -12.153827667236328, "global_step": 283969, "epoch": 1690} {"train_loss": -12.047966003417969, "global_step": 283970, "epoch": 1690} {"train_loss": -12.178666114807129, "global_step": 283971, "epoch": 1690} {"train_loss": -12.053647994995117, "global_step": 283972, "epoch": 1690} {"train_loss": -12.398504257202148, "global_step": 283973, "epoch": 1690} {"train_loss": -12.085845947265625, "global_step": 283974, "epoch": 1690} {"train_loss": -12.178022384643555, "global_step": 283975, "epoch": 1690} {"train_loss": -12.237747192382812, "global_step": 283976, "epoch": 1690} {"train_loss": -12.288276672363281, "global_step": 283977, "epoch": 1690} {"train_loss": -12.477981567382812, "global_step": 283978, "epoch": 1690} {"train_loss": -12.134340286254883, "global_step": 283979, "epoch": 1690} {"train_loss": -12.345855712890625, "global_step": 283980, "epoch": 1690} {"train_loss": -12.201112747192383, "global_step": 283981, "epoch": 1690} {"train_loss": -12.129528045654297, "global_step": 283982, "epoch": 1690} {"train_loss": -12.136970520019531, "global_step": 283983, "epoch": 1690} {"train_loss": -12.314067840576172, "global_step": 283984, "epoch": 1690} {"train_loss": -12.153671264648438, "global_step": 283985, "epoch": 1690} {"train_loss": -12.087442398071289, "global_step": 283986, "epoch": 1690} {"train_loss": -12.324387550354004, "global_step": 283987, "epoch": 1690} {"train_loss": -12.180322647094727, "global_step": 283988, "epoch": 1690} {"train_loss": -12.062124252319336, "global_step": 283989, "epoch": 1690} {"train_loss": -12.041645050048828, "global_step": 283990, "epoch": 1690} {"train_loss": -12.335397720336914, "global_step": 283991, "epoch": 1690} {"train_loss": -12.324252128601074, "global_step": 283992, "epoch": 1690} {"train_loss": -11.938637733459473, "global_step": 283993, "epoch": 1690} {"train_loss": -12.09584903717041, "global_step": 283994, "epoch": 1690} {"train_loss": -11.78541374206543, "global_step": 283995, "epoch": 1690} {"train_loss": -11.387385368347168, "global_step": 283996, "epoch": 1690} {"train_loss": -11.847116470336914, "global_step": 283997, "epoch": 1690} {"train_loss": -11.883007049560547, "global_step": 283998, "epoch": 1690} {"train_loss": -11.151095390319824, "global_step": 283999, "epoch": 1690} {"train_loss": -11.613414764404297, "global_step": 284000, "epoch": 1690} {"train_loss": -10.356725692749023, "global_step": 284001, "epoch": 1690} {"train_loss": -9.832207679748535, "global_step": 284002, "epoch": 1690} {"train_loss": -11.643521308898926, "global_step": 284003, "epoch": 1690} {"train_loss": -11.042566299438477, "global_step": 284004, "epoch": 1690} {"train_loss": -11.309974670410156, "global_step": 284005, "epoch": 1690} {"train_loss": -10.96530532836914, "global_step": 284006, "epoch": 1690} {"train_loss": -12.15261459350586, "global_step": 284007, "epoch": 1690} {"train_loss": -11.050480842590332, "global_step": 284008, "epoch": 1690} {"train_loss": -12.01783561706543, "global_step": 284009, "epoch": 1690} {"train_loss": -11.346256256103516, "global_step": 284010, "epoch": 1690} {"train_loss": -11.917291641235352, "global_step": 284011, "epoch": 1690} {"train_loss": -11.82862663269043, "global_step": 284012, "epoch": 1690} {"train_loss": -11.804778099060059, "global_step": 284013, "epoch": 1690} {"train_loss": -11.670486450195312, "global_step": 284014, "epoch": 1690} {"train_loss": -11.733200073242188, "global_step": 284015, "epoch": 1690} {"train_loss": -12.049860000610352, "global_step": 284016, "epoch": 1690} {"train_loss": -11.702723503112793, "global_step": 284017, "epoch": 1690} {"train_loss": -11.935813903808594, "global_step": 284018, "epoch": 1690} {"train_loss": -11.819927215576172, "global_step": 284019, "epoch": 1690} {"train_loss": -12.239522933959961, "global_step": 284020, "epoch": 1690} {"train_loss": -12.106697082519531, "global_step": 284021, "epoch": 1690} {"train_loss": -11.943670272827148, "global_step": 284022, "epoch": 1690} {"train_loss": -12.304479598999023, "global_step": 284023, "epoch": 1690} {"train_loss": -11.769811630249023, "global_step": 284024, "epoch": 1690} {"train_loss": -12.187665939331055, "global_step": 284025, "epoch": 1690} {"train_loss": -11.906944274902344, "global_step": 284026, "epoch": 1690} {"train_loss": -11.88505744934082, "global_step": 284027, "epoch": 1690} {"train_loss": -12.172201156616211, "global_step": 284028, "epoch": 1690} {"train_loss": -11.887307167053223, "global_step": 284029, "epoch": 1690} {"train_loss": -12.020120620727539, "global_step": 284030, "epoch": 1690} {"train_loss": -12.181111335754395, "global_step": 284031, "epoch": 1690} {"train_loss": -11.543951034545898, "global_step": 284032, "epoch": 1690} {"train_loss": -11.18783950805664, "global_step": 284033, "epoch": 1690} {"train_loss": -12.045522689819336, "global_step": 284034, "epoch": 1690} {"train_loss": -10.53618335723877, "global_step": 284035, "epoch": 1690} {"train_loss": -9.696621894836426, "global_step": 284036, "epoch": 1690} {"train_loss": -11.549189567565918, "global_step": 284037, "epoch": 1690} {"train_loss": -10.224588394165039, "global_step": 284038, "epoch": 1690} {"train_loss": -10.415275573730469, "global_step": 284039, "epoch": 1690} {"train_loss": -10.363653182983398, "global_step": 284040, "epoch": 1690} {"train_loss": -11.631528854370117, "global_step": 284041, "epoch": 1690} {"train_loss": -10.480157852172852, "global_step": 284042, "epoch": 1690} {"train_loss": -11.39808464050293, "global_step": 284043, "epoch": 1690} {"train_loss": -8.826354026794434, "global_step": 284044, "epoch": 1690} {"train_loss": -11.15938949584961, "global_step": 284045, "epoch": 1690} {"train_loss": -9.73758602142334, "global_step": 284046, "epoch": 1690} {"train_loss": -11.211885452270508, "global_step": 284047, "epoch": 1690} {"train_loss": -10.290669441223145, "global_step": 284048, "epoch": 1690} {"train_loss": -10.151802062988281, "global_step": 284049, "epoch": 1690} {"train_loss": -11.299569129943848, "global_step": 284050, "epoch": 1690} {"train_loss": -11.280911445617676, "global_step": 284051, "epoch": 1690} {"train_loss": -11.384286880493164, "global_step": 284052, "epoch": 1690} {"train_loss": -11.45734977722168, "global_step": 284053, "epoch": 1690} {"train_loss": -11.746572494506836, "global_step": 284054, "epoch": 1690} {"train_loss": -11.097108840942383, "global_step": 284055, "epoch": 1690} {"train_loss": -11.631359100341797, "global_step": 284056, "epoch": 1690} {"train_loss": -11.38105583190918, "global_step": 284057, "epoch": 1690} {"train_loss": -11.710420608520508, "global_step": 284058, "epoch": 1690} {"train_loss": -11.34378433227539, "global_step": 284059, "epoch": 1690} {"train_loss": -11.698925018310547, "global_step": 284060, "epoch": 1690} {"train_loss": -11.831933975219727, "global_step": 284061, "epoch": 1690} {"train_loss": -11.47750473022461, "global_step": 284062, "epoch": 1690} {"train_loss": -11.772178649902344, "global_step": 284063, "epoch": 1690} {"train_loss": -11.765628814697266, "global_step": 284064, "epoch": 1690} {"train_loss": -11.788318634033203, "global_step": 284065, "epoch": 1690} {"train_loss": -12.011722564697266, "global_step": 284066, "epoch": 1690} {"train_loss": -11.777603149414062, "global_step": 284067, "epoch": 1690} {"train_loss": -11.964288711547852, "global_step": 284068, "epoch": 1690} {"train_loss": -12.060098648071289, "global_step": 284069, "epoch": 1690} {"train_loss": -11.703927993774414, "global_step": 284070, "epoch": 1690} {"train_loss": -12.102654457092285, "global_step": 284071, "epoch": 1690} {"train_loss": -11.669307708740234, "global_step": 284072, "epoch": 1690} {"train_loss": -11.846567153930664, "global_step": 284073, "epoch": 1690} {"train_loss": -11.840049743652344, "global_step": 284074, "epoch": 1690} {"train_loss": -11.978851318359375, "global_step": 284075, "epoch": 1690} {"train_loss": -12.103522300720215, "global_step": 284076, "epoch": 1690} {"train_loss": -11.88688850402832, "global_step": 284077, "epoch": 1690} {"train_loss": -12.12011432647705, "global_step": 284078, "epoch": 1690} {"train_loss": -12.039815902709961, "global_step": 284079, "epoch": 1690} {"train_loss": -12.074872016906738, "global_step": 284080, "epoch": 1690} {"train_loss": -12.066232681274414, "global_step": 284081, "epoch": 1690} {"train_loss": -12.169370651245117, "global_step": 284082, "epoch": 1690} {"train_loss": -12.1071195602417, "global_step": 284083, "epoch": 1690} {"train_loss": -12.271173477172852, "global_step": 284084, "epoch": 1690} {"train_loss": -11.935736656188965, "global_step": 284085, "epoch": 1690} {"train_loss": -12.209766387939453, "global_step": 284086, "epoch": 1690} {"train_loss": -11.695920359520684, "global_step": 284087, "epoch": 1690, "val_loss": 276043.875, "train_action_mse_error": 2.256908416748047} {"train_loss": -12.157621383666992, "global_step": 284088, "epoch": 1691} {"train_loss": -12.116585731506348, "global_step": 284089, "epoch": 1691} {"train_loss": -12.135869979858398, "global_step": 284090, "epoch": 1691} {"train_loss": -12.24032974243164, "global_step": 284091, "epoch": 1691} {"train_loss": -12.214433670043945, "global_step": 284092, "epoch": 1691} {"train_loss": -12.121316909790039, "global_step": 284093, "epoch": 1691} {"train_loss": -12.309024810791016, "global_step": 284094, "epoch": 1691} {"train_loss": -11.971090316772461, "global_step": 284095, "epoch": 1691} {"train_loss": -12.340538024902344, "global_step": 284096, "epoch": 1691} {"train_loss": -12.075299263000488, "global_step": 284097, "epoch": 1691} {"train_loss": -12.18353271484375, "global_step": 284098, "epoch": 1691} {"train_loss": -12.161751747131348, "global_step": 284099, "epoch": 1691} {"train_loss": -12.067487716674805, "global_step": 284100, "epoch": 1691} {"train_loss": -12.353264808654785, "global_step": 284101, "epoch": 1691} {"train_loss": -12.213725090026855, "global_step": 284102, "epoch": 1691} {"train_loss": -12.248250961303711, "global_step": 284103, "epoch": 1691} {"train_loss": -12.266156196594238, "global_step": 284104, "epoch": 1691} {"train_loss": -12.111430168151855, "global_step": 284105, "epoch": 1691} {"train_loss": -12.166841506958008, "global_step": 284106, "epoch": 1691} {"train_loss": -12.19466495513916, "global_step": 284107, "epoch": 1691} {"train_loss": -12.249680519104004, "global_step": 284108, "epoch": 1691} {"train_loss": -12.044124603271484, "global_step": 284109, "epoch": 1691} {"train_loss": -12.363482475280762, "global_step": 284110, "epoch": 1691} {"train_loss": -12.332904815673828, "global_step": 284111, "epoch": 1691} {"train_loss": -12.400480270385742, "global_step": 284112, "epoch": 1691} {"train_loss": -12.250645637512207, "global_step": 284113, "epoch": 1691} {"train_loss": -12.366678237915039, "global_step": 284114, "epoch": 1691} {"train_loss": -12.077606201171875, "global_step": 284115, "epoch": 1691} {"train_loss": -12.459318161010742, "global_step": 284116, "epoch": 1691} {"train_loss": -12.496038436889648, "global_step": 284117, "epoch": 1691} {"train_loss": -12.347274780273438, "global_step": 284118, "epoch": 1691} {"train_loss": -12.23412799835205, "global_step": 284119, "epoch": 1691} {"train_loss": -12.262381553649902, "global_step": 284120, "epoch": 1691} {"train_loss": -12.493998527526855, "global_step": 284121, "epoch": 1691} {"train_loss": -12.23731803894043, "global_step": 284122, "epoch": 1691} {"train_loss": -12.512712478637695, "global_step": 284123, "epoch": 1691} {"train_loss": -12.315373420715332, "global_step": 284124, "epoch": 1691} {"train_loss": -12.140148162841797, "global_step": 284125, "epoch": 1691} {"train_loss": -12.236812591552734, "global_step": 284126, "epoch": 1691} {"train_loss": -12.473902702331543, "global_step": 284127, "epoch": 1691} {"train_loss": -12.15727710723877, "global_step": 284128, "epoch": 1691} {"train_loss": -12.376928329467773, "global_step": 284129, "epoch": 1691} {"train_loss": -12.574407577514648, "global_step": 284130, "epoch": 1691} {"train_loss": -12.300400733947754, "global_step": 284131, "epoch": 1691} {"train_loss": -12.19979476928711, "global_step": 284132, "epoch": 1691} {"train_loss": -12.245494842529297, "global_step": 284133, "epoch": 1691} {"train_loss": -12.495378494262695, "global_step": 284134, "epoch": 1691} {"train_loss": -12.498044967651367, "global_step": 284135, "epoch": 1691} {"train_loss": -12.548012733459473, "global_step": 284136, "epoch": 1691} {"train_loss": -12.34088134765625, "global_step": 284137, "epoch": 1691} {"train_loss": -12.336338996887207, "global_step": 284138, "epoch": 1691} {"train_loss": -12.20977783203125, "global_step": 284139, "epoch": 1691} {"train_loss": -12.36950397491455, "global_step": 284140, "epoch": 1691} {"train_loss": -12.367287635803223, "global_step": 284141, "epoch": 1691} {"train_loss": -11.89595890045166, "global_step": 284142, "epoch": 1691} {"train_loss": -12.06332015991211, "global_step": 284143, "epoch": 1691} {"train_loss": -12.115026473999023, "global_step": 284144, "epoch": 1691} {"train_loss": -11.894145965576172, "global_step": 284145, "epoch": 1691} {"train_loss": -11.746971130371094, "global_step": 284146, "epoch": 1691} {"train_loss": -11.976844787597656, "global_step": 284147, "epoch": 1691} {"train_loss": -12.101354598999023, "global_step": 284148, "epoch": 1691} {"train_loss": -11.58868408203125, "global_step": 284149, "epoch": 1691} {"train_loss": -10.247174263000488, "global_step": 284150, "epoch": 1691} {"train_loss": -9.630293846130371, "global_step": 284151, "epoch": 1691} {"train_loss": -11.29793643951416, "global_step": 284152, "epoch": 1691} {"train_loss": -10.513970375061035, "global_step": 284153, "epoch": 1691} {"train_loss": -9.326949119567871, "global_step": 284154, "epoch": 1691} {"train_loss": -9.84339714050293, "global_step": 284155, "epoch": 1691} {"train_loss": -10.64178466796875, "global_step": 284156, "epoch": 1691} {"train_loss": -11.756978988647461, "global_step": 284157, "epoch": 1691} {"train_loss": -10.185102462768555, "global_step": 284158, "epoch": 1691} {"train_loss": -11.548484802246094, "global_step": 284159, "epoch": 1691} {"train_loss": -10.509404182434082, "global_step": 284160, "epoch": 1691} {"train_loss": -10.735153198242188, "global_step": 284161, "epoch": 1691} {"train_loss": -10.320185661315918, "global_step": 284162, "epoch": 1691} {"train_loss": -10.666223526000977, "global_step": 284163, "epoch": 1691} {"train_loss": -10.621448516845703, "global_step": 284164, "epoch": 1691} {"train_loss": -10.409531593322754, "global_step": 284165, "epoch": 1691} {"train_loss": -11.500011444091797, "global_step": 284166, "epoch": 1691} {"train_loss": -10.67873764038086, "global_step": 284167, "epoch": 1691} {"train_loss": -10.680670738220215, "global_step": 284168, "epoch": 1691} {"train_loss": -11.436080932617188, "global_step": 284169, "epoch": 1691} {"train_loss": -10.477594375610352, "global_step": 284170, "epoch": 1691} {"train_loss": -9.97135066986084, "global_step": 284171, "epoch": 1691} {"train_loss": -10.836396217346191, "global_step": 284172, "epoch": 1691} {"train_loss": -10.294560432434082, "global_step": 284173, "epoch": 1691} {"train_loss": -11.170434951782227, "global_step": 284174, "epoch": 1691} {"train_loss": -11.484670639038086, "global_step": 284175, "epoch": 1691} {"train_loss": -11.107479095458984, "global_step": 284176, "epoch": 1691} {"train_loss": -11.627009391784668, "global_step": 284177, "epoch": 1691} {"train_loss": -11.157007217407227, "global_step": 284178, "epoch": 1691} {"train_loss": -11.742307662963867, "global_step": 284179, "epoch": 1691} {"train_loss": -10.873428344726562, "global_step": 284180, "epoch": 1691} {"train_loss": -11.026996612548828, "global_step": 284181, "epoch": 1691} {"train_loss": -11.447091102600098, "global_step": 284182, "epoch": 1691} {"train_loss": -11.136643409729004, "global_step": 284183, "epoch": 1691} {"train_loss": -11.157015800476074, "global_step": 284184, "epoch": 1691} {"train_loss": -11.334412574768066, "global_step": 284185, "epoch": 1691} {"train_loss": -11.226984977722168, "global_step": 284186, "epoch": 1691} {"train_loss": -11.743852615356445, "global_step": 284187, "epoch": 1691} {"train_loss": -11.207809448242188, "global_step": 284188, "epoch": 1691} {"train_loss": -11.781208992004395, "global_step": 284189, "epoch": 1691} {"train_loss": -11.626534461975098, "global_step": 284190, "epoch": 1691} {"train_loss": -11.691658973693848, "global_step": 284191, "epoch": 1691} {"train_loss": -11.666479110717773, "global_step": 284192, "epoch": 1691} {"train_loss": -11.509227752685547, "global_step": 284193, "epoch": 1691} {"train_loss": -11.49083137512207, "global_step": 284194, "epoch": 1691} {"train_loss": -11.714136123657227, "global_step": 284195, "epoch": 1691} {"train_loss": -11.28622055053711, "global_step": 284196, "epoch": 1691} {"train_loss": -11.815255165100098, "global_step": 284197, "epoch": 1691} {"train_loss": -11.445758819580078, "global_step": 284198, "epoch": 1691} {"train_loss": -12.010335922241211, "global_step": 284199, "epoch": 1691} {"train_loss": -12.195228576660156, "global_step": 284200, "epoch": 1691} {"train_loss": -11.73461627960205, "global_step": 284201, "epoch": 1691} {"train_loss": -11.548846244812012, "global_step": 284202, "epoch": 1691} {"train_loss": -11.94261360168457, "global_step": 284203, "epoch": 1691} {"train_loss": -12.062861442565918, "global_step": 284204, "epoch": 1691} {"train_loss": -12.129433631896973, "global_step": 284205, "epoch": 1691} {"train_loss": -12.071237564086914, "global_step": 284206, "epoch": 1691} {"train_loss": -12.016372680664062, "global_step": 284207, "epoch": 1691} {"train_loss": -12.250739097595215, "global_step": 284208, "epoch": 1691} {"train_loss": -12.067235946655273, "global_step": 284209, "epoch": 1691} {"train_loss": -11.980095863342285, "global_step": 284210, "epoch": 1691} {"train_loss": -12.130253791809082, "global_step": 284211, "epoch": 1691} {"train_loss": -12.111703872680664, "global_step": 284212, "epoch": 1691} {"train_loss": -12.064668655395508, "global_step": 284213, "epoch": 1691} {"train_loss": -12.148828506469727, "global_step": 284214, "epoch": 1691} {"train_loss": -12.337892532348633, "global_step": 284215, "epoch": 1691} {"train_loss": -12.049539566040039, "global_step": 284216, "epoch": 1691} {"train_loss": -12.064962387084961, "global_step": 284217, "epoch": 1691} {"train_loss": -11.963932037353516, "global_step": 284218, "epoch": 1691} {"train_loss": -12.119160652160645, "global_step": 284219, "epoch": 1691} {"train_loss": -12.320566177368164, "global_step": 284220, "epoch": 1691} {"train_loss": -12.134513854980469, "global_step": 284221, "epoch": 1691} {"train_loss": -12.268714904785156, "global_step": 284222, "epoch": 1691} {"train_loss": -11.924849510192871, "global_step": 284223, "epoch": 1691} {"train_loss": -12.258415222167969, "global_step": 284224, "epoch": 1691} {"train_loss": -12.1309232711792, "global_step": 284225, "epoch": 1691} {"train_loss": -12.225966453552246, "global_step": 284226, "epoch": 1691} {"train_loss": -12.030054092407227, "global_step": 284227, "epoch": 1691} {"train_loss": -12.140865325927734, "global_step": 284228, "epoch": 1691} {"train_loss": -12.068808555603027, "global_step": 284229, "epoch": 1691} {"train_loss": -12.464019775390625, "global_step": 284230, "epoch": 1691} {"train_loss": -12.326797485351562, "global_step": 284231, "epoch": 1691} {"train_loss": -12.149593353271484, "global_step": 284232, "epoch": 1691} {"train_loss": -12.171990394592285, "global_step": 284233, "epoch": 1691} {"train_loss": -12.357284545898438, "global_step": 284234, "epoch": 1691} {"train_loss": -11.884671211242676, "global_step": 284235, "epoch": 1691} {"train_loss": -11.93071174621582, "global_step": 284236, "epoch": 1691} {"train_loss": -11.9566650390625, "global_step": 284237, "epoch": 1691} {"train_loss": -11.906289100646973, "global_step": 284238, "epoch": 1691} {"train_loss": -12.073976516723633, "global_step": 284239, "epoch": 1691} {"train_loss": -12.003738403320312, "global_step": 284240, "epoch": 1691} {"train_loss": -12.067869186401367, "global_step": 284241, "epoch": 1691} {"train_loss": -12.249568939208984, "global_step": 284242, "epoch": 1691} {"train_loss": -12.012822151184082, "global_step": 284243, "epoch": 1691} {"train_loss": -11.93635368347168, "global_step": 284244, "epoch": 1691} {"train_loss": -12.187859535217285, "global_step": 284245, "epoch": 1691} {"train_loss": -11.266258239746094, "global_step": 284246, "epoch": 1691} {"train_loss": -12.292303085327148, "global_step": 284247, "epoch": 1691} {"train_loss": -11.8410005569458, "global_step": 284248, "epoch": 1691} {"train_loss": -12.009652137756348, "global_step": 284249, "epoch": 1691} {"train_loss": -11.648384094238281, "global_step": 284250, "epoch": 1691} {"train_loss": -11.683643341064453, "global_step": 284251, "epoch": 1691} {"train_loss": -11.988054275512695, "global_step": 284252, "epoch": 1691} {"train_loss": -11.91283893585205, "global_step": 284253, "epoch": 1691} {"train_loss": -11.71212387084961, "global_step": 284254, "epoch": 1691} {"train_loss": -11.810291829563322, "global_step": 284255, "epoch": 1691, "val_loss": 275618.6875} {"train_loss": -11.591506958007812, "global_step": 284256, "epoch": 1692} {"train_loss": -10.956603050231934, "global_step": 284257, "epoch": 1692} {"train_loss": -12.085692405700684, "global_step": 284258, "epoch": 1692} {"train_loss": -11.047083854675293, "global_step": 284259, "epoch": 1692} {"train_loss": -11.906861305236816, "global_step": 284260, "epoch": 1692} {"train_loss": -10.63128662109375, "global_step": 284261, "epoch": 1692} {"train_loss": -10.214378356933594, "global_step": 284262, "epoch": 1692} {"train_loss": -9.770830154418945, "global_step": 284263, "epoch": 1692} {"train_loss": -10.464237213134766, "global_step": 284264, "epoch": 1692} {"train_loss": -9.219796180725098, "global_step": 284265, "epoch": 1692} {"train_loss": -10.93173599243164, "global_step": 284266, "epoch": 1692} {"train_loss": -9.130366325378418, "global_step": 284267, "epoch": 1692} {"train_loss": -9.926661491394043, "global_step": 284268, "epoch": 1692} {"train_loss": -11.338050842285156, "global_step": 284269, "epoch": 1692} {"train_loss": -10.232465744018555, "global_step": 284270, "epoch": 1692} {"train_loss": -10.300682067871094, "global_step": 284271, "epoch": 1692} {"train_loss": -10.432071685791016, "global_step": 284272, "epoch": 1692} {"train_loss": -10.682040214538574, "global_step": 284273, "epoch": 1692} {"train_loss": -10.529329299926758, "global_step": 284274, "epoch": 1692} {"train_loss": -10.058666229248047, "global_step": 284275, "epoch": 1692} {"train_loss": -11.228330612182617, "global_step": 284276, "epoch": 1692} {"train_loss": -10.330622673034668, "global_step": 284277, "epoch": 1692} {"train_loss": -11.120777130126953, "global_step": 284278, "epoch": 1692} {"train_loss": -10.652627944946289, "global_step": 284279, "epoch": 1692} {"train_loss": -9.14417839050293, "global_step": 284280, "epoch": 1692} {"train_loss": -10.457773208618164, "global_step": 284281, "epoch": 1692} {"train_loss": -10.471076965332031, "global_step": 284282, "epoch": 1692} {"train_loss": -9.822275161743164, "global_step": 284283, "epoch": 1692} {"train_loss": -10.381170272827148, "global_step": 284284, "epoch": 1692} {"train_loss": -11.052799224853516, "global_step": 284285, "epoch": 1692} {"train_loss": -10.971242904663086, "global_step": 284286, "epoch": 1692} {"train_loss": -10.040542602539062, "global_step": 284287, "epoch": 1692} {"train_loss": -10.219486236572266, "global_step": 284288, "epoch": 1692} {"train_loss": -10.500904083251953, "global_step": 284289, "epoch": 1692} {"train_loss": -10.436094284057617, "global_step": 284290, "epoch": 1692} {"train_loss": -10.088855743408203, "global_step": 284291, "epoch": 1692} {"train_loss": -9.910101890563965, "global_step": 284292, "epoch": 1692} {"train_loss": -10.600664138793945, "global_step": 284293, "epoch": 1692} {"train_loss": -10.937159538269043, "global_step": 284294, "epoch": 1692} {"train_loss": -10.566944122314453, "global_step": 284295, "epoch": 1692} {"train_loss": -10.581693649291992, "global_step": 284296, "epoch": 1692} {"train_loss": -11.067193984985352, "global_step": 284297, "epoch": 1692} {"train_loss": -11.368995666503906, "global_step": 284298, "epoch": 1692} {"train_loss": -10.918329238891602, "global_step": 284299, "epoch": 1692} {"train_loss": -11.041385650634766, "global_step": 284300, "epoch": 1692} {"train_loss": -11.571178436279297, "global_step": 284301, "epoch": 1692} {"train_loss": -11.232358932495117, "global_step": 284302, "epoch": 1692} {"train_loss": -11.04448127746582, "global_step": 284303, "epoch": 1692} {"train_loss": -11.71603775024414, "global_step": 284304, "epoch": 1692} {"train_loss": -11.41236686706543, "global_step": 284305, "epoch": 1692} {"train_loss": -11.225196838378906, "global_step": 284306, "epoch": 1692} {"train_loss": -11.741629600524902, "global_step": 284307, "epoch": 1692} {"train_loss": -11.501652717590332, "global_step": 284308, "epoch": 1692} {"train_loss": -11.231197357177734, "global_step": 284309, "epoch": 1692} {"train_loss": -11.73928451538086, "global_step": 284310, "epoch": 1692} {"train_loss": -11.491471290588379, "global_step": 284311, "epoch": 1692} {"train_loss": -11.683551788330078, "global_step": 284312, "epoch": 1692} {"train_loss": -11.662757873535156, "global_step": 284313, "epoch": 1692} {"train_loss": -11.686095237731934, "global_step": 284314, "epoch": 1692} {"train_loss": -11.696962356567383, "global_step": 284315, "epoch": 1692} {"train_loss": -11.838518142700195, "global_step": 284316, "epoch": 1692} {"train_loss": -11.881452560424805, "global_step": 284317, "epoch": 1692} {"train_loss": -11.70431900024414, "global_step": 284318, "epoch": 1692} {"train_loss": -11.697031021118164, "global_step": 284319, "epoch": 1692} {"train_loss": -11.826536178588867, "global_step": 284320, "epoch": 1692} {"train_loss": -11.718097686767578, "global_step": 284321, "epoch": 1692} {"train_loss": -12.010610580444336, "global_step": 284322, "epoch": 1692} {"train_loss": -11.794218063354492, "global_step": 284323, "epoch": 1692} {"train_loss": -11.838785171508789, "global_step": 284324, "epoch": 1692} {"train_loss": -11.861238479614258, "global_step": 284325, "epoch": 1692} {"train_loss": -12.109963417053223, "global_step": 284326, "epoch": 1692} {"train_loss": -11.770421981811523, "global_step": 284327, "epoch": 1692} {"train_loss": -11.82773208618164, "global_step": 284328, "epoch": 1692} {"train_loss": -11.669615745544434, "global_step": 284329, "epoch": 1692} {"train_loss": -11.994977951049805, "global_step": 284330, "epoch": 1692} {"train_loss": -11.907642364501953, "global_step": 284331, "epoch": 1692} {"train_loss": -12.111553192138672, "global_step": 284332, "epoch": 1692} {"train_loss": -11.922635078430176, "global_step": 284333, "epoch": 1692} {"train_loss": -11.979406356811523, "global_step": 284334, "epoch": 1692} {"train_loss": -11.831742286682129, "global_step": 284335, "epoch": 1692} {"train_loss": -12.00391960144043, "global_step": 284336, "epoch": 1692} {"train_loss": -12.143014907836914, "global_step": 284337, "epoch": 1692} {"train_loss": -12.002103805541992, "global_step": 284338, "epoch": 1692} {"train_loss": -12.150259017944336, "global_step": 284339, "epoch": 1692} {"train_loss": -12.007555961608887, "global_step": 284340, "epoch": 1692} {"train_loss": -12.302013397216797, "global_step": 284341, "epoch": 1692} {"train_loss": -12.25014877319336, "global_step": 284342, "epoch": 1692} {"train_loss": -12.095344543457031, "global_step": 284343, "epoch": 1692} {"train_loss": -11.930387496948242, "global_step": 284344, "epoch": 1692} {"train_loss": -12.173995018005371, "global_step": 284345, "epoch": 1692} {"train_loss": -12.101097106933594, "global_step": 284346, "epoch": 1692} {"train_loss": -12.297615051269531, "global_step": 284347, "epoch": 1692} {"train_loss": -12.248268127441406, "global_step": 284348, "epoch": 1692} {"train_loss": -12.265129089355469, "global_step": 284349, "epoch": 1692} {"train_loss": -12.048056602478027, "global_step": 284350, "epoch": 1692} {"train_loss": -12.177385330200195, "global_step": 284351, "epoch": 1692} {"train_loss": -12.189249038696289, "global_step": 284352, "epoch": 1692} {"train_loss": -12.10911750793457, "global_step": 284353, "epoch": 1692} {"train_loss": -12.22523307800293, "global_step": 284354, "epoch": 1692} {"train_loss": -12.342806816101074, "global_step": 284355, "epoch": 1692} {"train_loss": -12.116429328918457, "global_step": 284356, "epoch": 1692} {"train_loss": -12.26534366607666, "global_step": 284357, "epoch": 1692} {"train_loss": -12.313087463378906, "global_step": 284358, "epoch": 1692} {"train_loss": -12.405067443847656, "global_step": 284359, "epoch": 1692} {"train_loss": -12.338756561279297, "global_step": 284360, "epoch": 1692} {"train_loss": -12.515592575073242, "global_step": 284361, "epoch": 1692} {"train_loss": -12.141785621643066, "global_step": 284362, "epoch": 1692} {"train_loss": -12.425346374511719, "global_step": 284363, "epoch": 1692} {"train_loss": -12.398113250732422, "global_step": 284364, "epoch": 1692} {"train_loss": -12.428420066833496, "global_step": 284365, "epoch": 1692} {"train_loss": -12.314533233642578, "global_step": 284366, "epoch": 1692} {"train_loss": -12.197540283203125, "global_step": 284367, "epoch": 1692} {"train_loss": -12.323553085327148, "global_step": 284368, "epoch": 1692} {"train_loss": -12.465635299682617, "global_step": 284369, "epoch": 1692} {"train_loss": -12.394318580627441, "global_step": 284370, "epoch": 1692} {"train_loss": -12.313217163085938, "global_step": 284371, "epoch": 1692} {"train_loss": -12.227415084838867, "global_step": 284372, "epoch": 1692} {"train_loss": -12.327079772949219, "global_step": 284373, "epoch": 1692} {"train_loss": -12.270824432373047, "global_step": 284374, "epoch": 1692} {"train_loss": -12.020296096801758, "global_step": 284375, "epoch": 1692} {"train_loss": -12.258459091186523, "global_step": 284376, "epoch": 1692} {"train_loss": -12.426657676696777, "global_step": 284377, "epoch": 1692} {"train_loss": -12.296318054199219, "global_step": 284378, "epoch": 1692} {"train_loss": -12.097532272338867, "global_step": 284379, "epoch": 1692} {"train_loss": -12.161524772644043, "global_step": 284380, "epoch": 1692} {"train_loss": -12.145071029663086, "global_step": 284381, "epoch": 1692} {"train_loss": -11.71973705291748, "global_step": 284382, "epoch": 1692} {"train_loss": -11.313273429870605, "global_step": 284383, "epoch": 1692} {"train_loss": -12.044021606445312, "global_step": 284384, "epoch": 1692} {"train_loss": -12.05935287475586, "global_step": 284385, "epoch": 1692} {"train_loss": -11.425193786621094, "global_step": 284386, "epoch": 1692} {"train_loss": -12.103425979614258, "global_step": 284387, "epoch": 1692} {"train_loss": -12.06908893585205, "global_step": 284388, "epoch": 1692} {"train_loss": -11.648021697998047, "global_step": 284389, "epoch": 1692} {"train_loss": -12.313393592834473, "global_step": 284390, "epoch": 1692} {"train_loss": -12.301521301269531, "global_step": 284391, "epoch": 1692} {"train_loss": -12.077173233032227, "global_step": 284392, "epoch": 1692} {"train_loss": -11.994309425354004, "global_step": 284393, "epoch": 1692} {"train_loss": -11.746228218078613, "global_step": 284394, "epoch": 1692} {"train_loss": -10.675597190856934, "global_step": 284395, "epoch": 1692} {"train_loss": -11.836341857910156, "global_step": 284396, "epoch": 1692} {"train_loss": -11.857696533203125, "global_step": 284397, "epoch": 1692} {"train_loss": -11.688573837280273, "global_step": 284398, "epoch": 1692} {"train_loss": -10.097049713134766, "global_step": 284399, "epoch": 1692} {"train_loss": -11.97944450378418, "global_step": 284400, "epoch": 1692} {"train_loss": -11.053226470947266, "global_step": 284401, "epoch": 1692} {"train_loss": -11.20625114440918, "global_step": 284402, "epoch": 1692} {"train_loss": -11.036111831665039, "global_step": 284403, "epoch": 1692} {"train_loss": -11.704870223999023, "global_step": 284404, "epoch": 1692} {"train_loss": -11.626167297363281, "global_step": 284405, "epoch": 1692} {"train_loss": -10.739204406738281, "global_step": 284406, "epoch": 1692} {"train_loss": -11.545818328857422, "global_step": 284407, "epoch": 1692} {"train_loss": -11.43852424621582, "global_step": 284408, "epoch": 1692} {"train_loss": -11.57183837890625, "global_step": 284409, "epoch": 1692} {"train_loss": -11.388528823852539, "global_step": 284410, "epoch": 1692} {"train_loss": -11.978798866271973, "global_step": 284411, "epoch": 1692} {"train_loss": -11.421442031860352, "global_step": 284412, "epoch": 1692} {"train_loss": -11.22663402557373, "global_step": 284413, "epoch": 1692} {"train_loss": -12.032316207885742, "global_step": 284414, "epoch": 1692} {"train_loss": -11.291793823242188, "global_step": 284415, "epoch": 1692} {"train_loss": -11.880098342895508, "global_step": 284416, "epoch": 1692} {"train_loss": -11.85673999786377, "global_step": 284417, "epoch": 1692} {"train_loss": -11.405313491821289, "global_step": 284418, "epoch": 1692} {"train_loss": -11.851591110229492, "global_step": 284419, "epoch": 1692} {"train_loss": -12.075023651123047, "global_step": 284420, "epoch": 1692} {"train_loss": -11.91115665435791, "global_step": 284421, "epoch": 1692} {"train_loss": -11.693901062011719, "global_step": 284422, "epoch": 1692} {"train_loss": -11.527465417271568, "global_step": 284423, "epoch": 1692, "val_loss": 276826.1875} {"train_loss": -11.917437553405762, "global_step": 284424, "epoch": 1693} {"train_loss": -11.548003196716309, "global_step": 284425, "epoch": 1693} {"train_loss": -12.039819717407227, "global_step": 284426, "epoch": 1693} {"train_loss": -11.656320571899414, "global_step": 284427, "epoch": 1693} {"train_loss": -11.488801956176758, "global_step": 284428, "epoch": 1693} {"train_loss": -11.76165771484375, "global_step": 284429, "epoch": 1693} {"train_loss": -11.799376487731934, "global_step": 284430, "epoch": 1693} {"train_loss": -11.120492935180664, "global_step": 284431, "epoch": 1693} {"train_loss": -11.412498474121094, "global_step": 284432, "epoch": 1693} {"train_loss": -11.163804054260254, "global_step": 284433, "epoch": 1693} {"train_loss": -11.313943862915039, "global_step": 284434, "epoch": 1693} {"train_loss": -11.767752647399902, "global_step": 284435, "epoch": 1693} {"train_loss": -10.046462059020996, "global_step": 284436, "epoch": 1693} {"train_loss": -11.140426635742188, "global_step": 284437, "epoch": 1693} {"train_loss": -11.119373321533203, "global_step": 284438, "epoch": 1693} {"train_loss": -11.62059211730957, "global_step": 284439, "epoch": 1693} {"train_loss": -11.892990112304688, "global_step": 284440, "epoch": 1693} {"train_loss": -11.546770095825195, "global_step": 284441, "epoch": 1693} {"train_loss": -11.533439636230469, "global_step": 284442, "epoch": 1693} {"train_loss": -11.715373039245605, "global_step": 284443, "epoch": 1693} {"train_loss": -11.998860359191895, "global_step": 284444, "epoch": 1693} {"train_loss": -10.753171920776367, "global_step": 284445, "epoch": 1693} {"train_loss": -11.97407054901123, "global_step": 284446, "epoch": 1693} {"train_loss": -11.272448539733887, "global_step": 284447, "epoch": 1693} {"train_loss": -11.806060791015625, "global_step": 284448, "epoch": 1693} {"train_loss": -11.883604049682617, "global_step": 284449, "epoch": 1693} {"train_loss": -11.135885238647461, "global_step": 284450, "epoch": 1693} {"train_loss": -12.14765453338623, "global_step": 284451, "epoch": 1693} {"train_loss": -11.437700271606445, "global_step": 284452, "epoch": 1693} {"train_loss": -12.066810607910156, "global_step": 284453, "epoch": 1693} {"train_loss": -11.627374649047852, "global_step": 284454, "epoch": 1693} {"train_loss": -11.724194526672363, "global_step": 284455, "epoch": 1693} {"train_loss": -11.956178665161133, "global_step": 284456, "epoch": 1693} {"train_loss": -11.496708869934082, "global_step": 284457, "epoch": 1693} {"train_loss": -11.91968059539795, "global_step": 284458, "epoch": 1693} {"train_loss": -12.060295104980469, "global_step": 284459, "epoch": 1693} {"train_loss": -11.83631420135498, "global_step": 284460, "epoch": 1693} {"train_loss": -12.21893310546875, "global_step": 284461, "epoch": 1693} {"train_loss": -11.611364364624023, "global_step": 284462, "epoch": 1693} {"train_loss": -12.076576232910156, "global_step": 284463, "epoch": 1693} {"train_loss": -11.998629570007324, "global_step": 284464, "epoch": 1693} {"train_loss": -11.890313148498535, "global_step": 284465, "epoch": 1693} {"train_loss": -12.271265029907227, "global_step": 284466, "epoch": 1693} {"train_loss": -11.525714874267578, "global_step": 284467, "epoch": 1693} {"train_loss": -11.965417861938477, "global_step": 284468, "epoch": 1693} {"train_loss": -11.62642765045166, "global_step": 284469, "epoch": 1693} {"train_loss": -10.913287162780762, "global_step": 284470, "epoch": 1693} {"train_loss": -12.035754203796387, "global_step": 284471, "epoch": 1693} {"train_loss": -10.254676818847656, "global_step": 284472, "epoch": 1693} {"train_loss": -12.26235580444336, "global_step": 284473, "epoch": 1693} {"train_loss": -10.554941177368164, "global_step": 284474, "epoch": 1693} {"train_loss": -11.100028991699219, "global_step": 284475, "epoch": 1693} {"train_loss": -12.220065116882324, "global_step": 284476, "epoch": 1693} {"train_loss": -11.125730514526367, "global_step": 284477, "epoch": 1693} {"train_loss": -11.84967041015625, "global_step": 284478, "epoch": 1693} {"train_loss": -11.625995635986328, "global_step": 284479, "epoch": 1693} {"train_loss": -11.740537643432617, "global_step": 284480, "epoch": 1693} {"train_loss": -11.771780967712402, "global_step": 284481, "epoch": 1693} {"train_loss": -11.186272621154785, "global_step": 284482, "epoch": 1693} {"train_loss": -11.924766540527344, "global_step": 284483, "epoch": 1693} {"train_loss": -11.275470733642578, "global_step": 284484, "epoch": 1693} {"train_loss": -11.287212371826172, "global_step": 284485, "epoch": 1693} {"train_loss": -11.757741928100586, "global_step": 284486, "epoch": 1693} {"train_loss": -10.384451866149902, "global_step": 284487, "epoch": 1693} {"train_loss": -11.978057861328125, "global_step": 284488, "epoch": 1693} {"train_loss": -10.62522029876709, "global_step": 284489, "epoch": 1693} {"train_loss": -11.751562118530273, "global_step": 284490, "epoch": 1693} {"train_loss": -11.549200057983398, "global_step": 284491, "epoch": 1693} {"train_loss": -10.55909538269043, "global_step": 284492, "epoch": 1693} {"train_loss": -11.789469718933105, "global_step": 284493, "epoch": 1693} {"train_loss": -10.942999839782715, "global_step": 284494, "epoch": 1693} {"train_loss": -11.915129661560059, "global_step": 284495, "epoch": 1693} {"train_loss": -11.156726837158203, "global_step": 284496, "epoch": 1693} {"train_loss": -12.094213485717773, "global_step": 284497, "epoch": 1693} {"train_loss": -11.085970878601074, "global_step": 284498, "epoch": 1693} {"train_loss": -11.841333389282227, "global_step": 284499, "epoch": 1693} {"train_loss": -11.815524101257324, "global_step": 284500, "epoch": 1693} {"train_loss": -11.759245872497559, "global_step": 284501, "epoch": 1693} {"train_loss": -11.92120361328125, "global_step": 284502, "epoch": 1693} {"train_loss": -11.61258316040039, "global_step": 284503, "epoch": 1693} {"train_loss": -11.618104934692383, "global_step": 284504, "epoch": 1693} {"train_loss": -11.874190330505371, "global_step": 284505, "epoch": 1693} {"train_loss": -11.995611190795898, "global_step": 284506, "epoch": 1693} {"train_loss": -11.960405349731445, "global_step": 284507, "epoch": 1693} {"train_loss": -11.864969253540039, "global_step": 284508, "epoch": 1693} {"train_loss": -12.05196762084961, "global_step": 284509, "epoch": 1693} {"train_loss": -12.115411758422852, "global_step": 284510, "epoch": 1693} {"train_loss": -11.778324127197266, "global_step": 284511, "epoch": 1693} {"train_loss": -12.102764129638672, "global_step": 284512, "epoch": 1693} {"train_loss": -11.972118377685547, "global_step": 284513, "epoch": 1693} {"train_loss": -11.799981117248535, "global_step": 284514, "epoch": 1693} {"train_loss": -12.088038444519043, "global_step": 284515, "epoch": 1693} {"train_loss": -12.002605438232422, "global_step": 284516, "epoch": 1693} {"train_loss": -12.29697036743164, "global_step": 284517, "epoch": 1693} {"train_loss": -12.109027862548828, "global_step": 284518, "epoch": 1693} {"train_loss": -12.195903778076172, "global_step": 284519, "epoch": 1693} {"train_loss": -11.949275970458984, "global_step": 284520, "epoch": 1693} {"train_loss": -12.17796516418457, "global_step": 284521, "epoch": 1693} {"train_loss": -12.109390258789062, "global_step": 284522, "epoch": 1693} {"train_loss": -12.235917091369629, "global_step": 284523, "epoch": 1693} {"train_loss": -12.088075637817383, "global_step": 284524, "epoch": 1693} {"train_loss": -12.160503387451172, "global_step": 284525, "epoch": 1693} {"train_loss": -12.249717712402344, "global_step": 284526, "epoch": 1693} {"train_loss": -11.922801971435547, "global_step": 284527, "epoch": 1693} {"train_loss": -12.171488761901855, "global_step": 284528, "epoch": 1693} {"train_loss": -12.236837387084961, "global_step": 284529, "epoch": 1693} {"train_loss": -12.03148078918457, "global_step": 284530, "epoch": 1693} {"train_loss": -12.183853149414062, "global_step": 284531, "epoch": 1693} {"train_loss": -12.141322135925293, "global_step": 284532, "epoch": 1693} {"train_loss": -12.13471794128418, "global_step": 284533, "epoch": 1693} {"train_loss": -12.157735824584961, "global_step": 284534, "epoch": 1693} {"train_loss": -12.53454875946045, "global_step": 284535, "epoch": 1693} {"train_loss": -12.126090049743652, "global_step": 284536, "epoch": 1693} {"train_loss": -12.278125762939453, "global_step": 284537, "epoch": 1693} {"train_loss": -12.172511100769043, "global_step": 284538, "epoch": 1693} {"train_loss": -11.975415229797363, "global_step": 284539, "epoch": 1693} {"train_loss": -12.284273147583008, "global_step": 284540, "epoch": 1693} {"train_loss": -12.06997299194336, "global_step": 284541, "epoch": 1693} {"train_loss": -12.33936882019043, "global_step": 284542, "epoch": 1693} {"train_loss": -12.296487808227539, "global_step": 284543, "epoch": 1693} {"train_loss": -12.345094680786133, "global_step": 284544, "epoch": 1693} {"train_loss": -12.248083114624023, "global_step": 284545, "epoch": 1693} {"train_loss": -12.281521797180176, "global_step": 284546, "epoch": 1693} {"train_loss": -12.233501434326172, "global_step": 284547, "epoch": 1693} {"train_loss": -12.134764671325684, "global_step": 284548, "epoch": 1693} {"train_loss": -12.13096809387207, "global_step": 284549, "epoch": 1693} {"train_loss": -12.43884563446045, "global_step": 284550, "epoch": 1693} {"train_loss": -12.273780822753906, "global_step": 284551, "epoch": 1693} {"train_loss": -12.090424537658691, "global_step": 284552, "epoch": 1693} {"train_loss": -12.151082992553711, "global_step": 284553, "epoch": 1693} {"train_loss": -12.341254234313965, "global_step": 284554, "epoch": 1693} {"train_loss": -11.988883972167969, "global_step": 284555, "epoch": 1693} {"train_loss": -12.052024841308594, "global_step": 284556, "epoch": 1693} {"train_loss": -11.930145263671875, "global_step": 284557, "epoch": 1693} {"train_loss": -11.941459655761719, "global_step": 284558, "epoch": 1693} {"train_loss": -11.778398513793945, "global_step": 284559, "epoch": 1693} {"train_loss": -12.432540893554688, "global_step": 284560, "epoch": 1693} {"train_loss": -12.247529029846191, "global_step": 284561, "epoch": 1693} {"train_loss": -11.898958206176758, "global_step": 284562, "epoch": 1693} {"train_loss": -11.779434204101562, "global_step": 284563, "epoch": 1693} {"train_loss": -11.849800109863281, "global_step": 284564, "epoch": 1693} {"train_loss": -11.595516204833984, "global_step": 284565, "epoch": 1693} {"train_loss": -11.008867263793945, "global_step": 284566, "epoch": 1693} {"train_loss": -12.195133209228516, "global_step": 284567, "epoch": 1693} {"train_loss": -11.930375099182129, "global_step": 284568, "epoch": 1693} {"train_loss": -10.852136611938477, "global_step": 284569, "epoch": 1693} {"train_loss": -11.278521537780762, "global_step": 284570, "epoch": 1693} {"train_loss": -12.188720703125, "global_step": 284571, "epoch": 1693} {"train_loss": -11.787790298461914, "global_step": 284572, "epoch": 1693} {"train_loss": -11.517117500305176, "global_step": 284573, "epoch": 1693} {"train_loss": -12.182535171508789, "global_step": 284574, "epoch": 1693} {"train_loss": -12.191612243652344, "global_step": 284575, "epoch": 1693} {"train_loss": -11.70147705078125, "global_step": 284576, "epoch": 1693} {"train_loss": -11.692092895507812, "global_step": 284577, "epoch": 1693} {"train_loss": -12.003307342529297, "global_step": 284578, "epoch": 1693} {"train_loss": -11.719467163085938, "global_step": 284579, "epoch": 1693} {"train_loss": -11.569601058959961, "global_step": 284580, "epoch": 1693} {"train_loss": -11.667778968811035, "global_step": 284581, "epoch": 1693} {"train_loss": -12.06810188293457, "global_step": 284582, "epoch": 1693} {"train_loss": -11.35136604309082, "global_step": 284583, "epoch": 1693} {"train_loss": -11.978559494018555, "global_step": 284584, "epoch": 1693} {"train_loss": -11.142424583435059, "global_step": 284585, "epoch": 1693} {"train_loss": -11.609664916992188, "global_step": 284586, "epoch": 1693} {"train_loss": -11.71851921081543, "global_step": 284587, "epoch": 1693} {"train_loss": -11.71729850769043, "global_step": 284588, "epoch": 1693} {"train_loss": -11.871038436889648, "global_step": 284589, "epoch": 1693} {"train_loss": -11.856206893920898, "global_step": 284590, "epoch": 1693} {"train_loss": -11.785340042341323, "global_step": 284591, "epoch": 1693, "val_loss": 276752.65625} {"train_loss": -11.918560028076172, "global_step": 284592, "epoch": 1694} {"train_loss": -11.745540618896484, "global_step": 284593, "epoch": 1694} {"train_loss": -12.039827346801758, "global_step": 284594, "epoch": 1694} {"train_loss": -11.822478294372559, "global_step": 284595, "epoch": 1694} {"train_loss": -11.452188491821289, "global_step": 284596, "epoch": 1694} {"train_loss": -12.079132080078125, "global_step": 284597, "epoch": 1694} {"train_loss": -11.680944442749023, "global_step": 284598, "epoch": 1694} {"train_loss": -12.001091957092285, "global_step": 284599, "epoch": 1694} {"train_loss": -11.756264686584473, "global_step": 284600, "epoch": 1694} {"train_loss": -11.835406303405762, "global_step": 284601, "epoch": 1694} {"train_loss": -11.902482986450195, "global_step": 284602, "epoch": 1694} {"train_loss": -11.916982650756836, "global_step": 284603, "epoch": 1694} {"train_loss": -11.66972827911377, "global_step": 284604, "epoch": 1694} {"train_loss": -12.033744812011719, "global_step": 284605, "epoch": 1694} {"train_loss": -12.049837112426758, "global_step": 284606, "epoch": 1694} {"train_loss": -11.93580436706543, "global_step": 284607, "epoch": 1694} {"train_loss": -11.913134574890137, "global_step": 284608, "epoch": 1694} {"train_loss": -11.939961433410645, "global_step": 284609, "epoch": 1694} {"train_loss": -11.855477333068848, "global_step": 284610, "epoch": 1694} {"train_loss": -11.627405166625977, "global_step": 284611, "epoch": 1694} {"train_loss": -12.093778610229492, "global_step": 284612, "epoch": 1694} {"train_loss": -11.348838806152344, "global_step": 284613, "epoch": 1694} {"train_loss": -11.882354736328125, "global_step": 284614, "epoch": 1694} {"train_loss": -11.404499053955078, "global_step": 284615, "epoch": 1694} {"train_loss": -11.769512176513672, "global_step": 284616, "epoch": 1694} {"train_loss": -11.854507446289062, "global_step": 284617, "epoch": 1694} {"train_loss": -11.483674049377441, "global_step": 284618, "epoch": 1694} {"train_loss": -11.89917278289795, "global_step": 284619, "epoch": 1694} {"train_loss": -11.875717163085938, "global_step": 284620, "epoch": 1694} {"train_loss": -11.773555755615234, "global_step": 284621, "epoch": 1694} {"train_loss": -12.123762130737305, "global_step": 284622, "epoch": 1694} {"train_loss": -11.887815475463867, "global_step": 284623, "epoch": 1694} {"train_loss": -12.127521514892578, "global_step": 284624, "epoch": 1694} {"train_loss": -11.88884162902832, "global_step": 284625, "epoch": 1694} {"train_loss": -12.180608749389648, "global_step": 284626, "epoch": 1694} {"train_loss": -11.839061737060547, "global_step": 284627, "epoch": 1694} {"train_loss": -11.96447467803955, "global_step": 284628, "epoch": 1694} {"train_loss": -12.09762191772461, "global_step": 284629, "epoch": 1694} {"train_loss": -11.914043426513672, "global_step": 284630, "epoch": 1694} {"train_loss": -12.009832382202148, "global_step": 284631, "epoch": 1694} {"train_loss": -11.824666976928711, "global_step": 284632, "epoch": 1694} {"train_loss": -11.874292373657227, "global_step": 284633, "epoch": 1694} {"train_loss": -12.196250915527344, "global_step": 284634, "epoch": 1694} {"train_loss": -11.96696662902832, "global_step": 284635, "epoch": 1694} {"train_loss": -11.107938766479492, "global_step": 284636, "epoch": 1694} {"train_loss": -11.687772750854492, "global_step": 284637, "epoch": 1694} {"train_loss": -11.487943649291992, "global_step": 284638, "epoch": 1694} {"train_loss": -11.877005577087402, "global_step": 284639, "epoch": 1694} {"train_loss": -11.843984603881836, "global_step": 284640, "epoch": 1694} {"train_loss": -11.627331733703613, "global_step": 284641, "epoch": 1694} {"train_loss": -12.01074504852295, "global_step": 284642, "epoch": 1694} {"train_loss": -11.857274055480957, "global_step": 284643, "epoch": 1694} {"train_loss": -12.133978843688965, "global_step": 284644, "epoch": 1694} {"train_loss": -11.914562225341797, "global_step": 284645, "epoch": 1694} {"train_loss": -11.79630184173584, "global_step": 284646, "epoch": 1694} {"train_loss": -11.955190658569336, "global_step": 284647, "epoch": 1694} {"train_loss": -12.092329025268555, "global_step": 284648, "epoch": 1694} {"train_loss": -11.867819786071777, "global_step": 284649, "epoch": 1694} {"train_loss": -11.788249015808105, "global_step": 284650, "epoch": 1694} {"train_loss": -12.105239868164062, "global_step": 284651, "epoch": 1694} {"train_loss": -11.417930603027344, "global_step": 284652, "epoch": 1694} {"train_loss": -11.892179489135742, "global_step": 284653, "epoch": 1694} {"train_loss": -11.919000625610352, "global_step": 284654, "epoch": 1694} {"train_loss": -11.671932220458984, "global_step": 284655, "epoch": 1694} {"train_loss": -12.011137962341309, "global_step": 284656, "epoch": 1694} {"train_loss": -12.016613006591797, "global_step": 284657, "epoch": 1694} {"train_loss": -11.007108688354492, "global_step": 284658, "epoch": 1694} {"train_loss": -11.607056617736816, "global_step": 284659, "epoch": 1694} {"train_loss": -11.81257438659668, "global_step": 284660, "epoch": 1694} {"train_loss": -10.986265182495117, "global_step": 284661, "epoch": 1694} {"train_loss": -11.438369750976562, "global_step": 284662, "epoch": 1694} {"train_loss": -11.715435028076172, "global_step": 284663, "epoch": 1694} {"train_loss": -11.557387351989746, "global_step": 284664, "epoch": 1694} {"train_loss": -10.523003578186035, "global_step": 284665, "epoch": 1694} {"train_loss": -11.631046295166016, "global_step": 284666, "epoch": 1694} {"train_loss": -11.08060073852539, "global_step": 284667, "epoch": 1694} {"train_loss": -11.01452350616455, "global_step": 284668, "epoch": 1694} {"train_loss": -11.220394134521484, "global_step": 284669, "epoch": 1694} {"train_loss": -11.191466331481934, "global_step": 284670, "epoch": 1694} {"train_loss": -12.069001197814941, "global_step": 284671, "epoch": 1694} {"train_loss": -11.307638168334961, "global_step": 284672, "epoch": 1694} {"train_loss": -12.144590377807617, "global_step": 284673, "epoch": 1694} {"train_loss": -11.25360107421875, "global_step": 284674, "epoch": 1694} {"train_loss": -11.90237808227539, "global_step": 284675, "epoch": 1694} {"train_loss": -11.011968612670898, "global_step": 284676, "epoch": 1694} {"train_loss": -11.696105003356934, "global_step": 284677, "epoch": 1694} {"train_loss": -11.314314842224121, "global_step": 284678, "epoch": 1694} {"train_loss": -11.645369529724121, "global_step": 284679, "epoch": 1694} {"train_loss": -11.821439743041992, "global_step": 284680, "epoch": 1694} {"train_loss": -11.403504371643066, "global_step": 284681, "epoch": 1694} {"train_loss": -11.393518447875977, "global_step": 284682, "epoch": 1694} {"train_loss": -11.96579647064209, "global_step": 284683, "epoch": 1694} {"train_loss": -11.66500186920166, "global_step": 284684, "epoch": 1694} {"train_loss": -11.939987182617188, "global_step": 284685, "epoch": 1694} {"train_loss": -11.680505752563477, "global_step": 284686, "epoch": 1694} {"train_loss": -11.737173080444336, "global_step": 284687, "epoch": 1694} {"train_loss": -11.693330764770508, "global_step": 284688, "epoch": 1694} {"train_loss": -11.610240936279297, "global_step": 284689, "epoch": 1694} {"train_loss": -11.667570114135742, "global_step": 284690, "epoch": 1694} {"train_loss": -11.704130172729492, "global_step": 284691, "epoch": 1694} {"train_loss": -11.705309867858887, "global_step": 284692, "epoch": 1694} {"train_loss": -11.577150344848633, "global_step": 284693, "epoch": 1694} {"train_loss": -12.005115509033203, "global_step": 284694, "epoch": 1694} {"train_loss": -11.50290584564209, "global_step": 284695, "epoch": 1694} {"train_loss": -12.037654876708984, "global_step": 284696, "epoch": 1694} {"train_loss": -11.657156944274902, "global_step": 284697, "epoch": 1694} {"train_loss": -11.890411376953125, "global_step": 284698, "epoch": 1694} {"train_loss": -11.600198745727539, "global_step": 284699, "epoch": 1694} {"train_loss": -11.744512557983398, "global_step": 284700, "epoch": 1694} {"train_loss": -11.227696418762207, "global_step": 284701, "epoch": 1694} {"train_loss": -11.862648963928223, "global_step": 284702, "epoch": 1694} {"train_loss": -11.538858413696289, "global_step": 284703, "epoch": 1694} {"train_loss": -11.483316421508789, "global_step": 284704, "epoch": 1694} {"train_loss": -11.719515800476074, "global_step": 284705, "epoch": 1694} {"train_loss": -11.997114181518555, "global_step": 284706, "epoch": 1694} {"train_loss": -11.631879806518555, "global_step": 284707, "epoch": 1694} {"train_loss": -12.037328720092773, "global_step": 284708, "epoch": 1694} {"train_loss": -11.502175331115723, "global_step": 284709, "epoch": 1694} {"train_loss": -11.7784423828125, "global_step": 284710, "epoch": 1694} {"train_loss": -11.71308708190918, "global_step": 284711, "epoch": 1694} {"train_loss": -12.14436149597168, "global_step": 284712, "epoch": 1694} {"train_loss": -11.699892044067383, "global_step": 284713, "epoch": 1694} {"train_loss": -11.438887596130371, "global_step": 284714, "epoch": 1694} {"train_loss": -11.98942756652832, "global_step": 284715, "epoch": 1694} {"train_loss": -12.073966026306152, "global_step": 284716, "epoch": 1694} {"train_loss": -11.734225273132324, "global_step": 284717, "epoch": 1694} {"train_loss": -12.03627872467041, "global_step": 284718, "epoch": 1694} {"train_loss": -11.752294540405273, "global_step": 284719, "epoch": 1694} {"train_loss": -11.844426155090332, "global_step": 284720, "epoch": 1694} {"train_loss": -12.134871482849121, "global_step": 284721, "epoch": 1694} {"train_loss": -12.014862060546875, "global_step": 284722, "epoch": 1694} {"train_loss": -11.767709732055664, "global_step": 284723, "epoch": 1694} {"train_loss": -11.906635284423828, "global_step": 284724, "epoch": 1694} {"train_loss": -11.47723388671875, "global_step": 284725, "epoch": 1694} {"train_loss": -11.745646476745605, "global_step": 284726, "epoch": 1694} {"train_loss": -11.867719650268555, "global_step": 284727, "epoch": 1694} {"train_loss": -10.749187469482422, "global_step": 284728, "epoch": 1694} {"train_loss": -11.72962760925293, "global_step": 284729, "epoch": 1694} {"train_loss": -11.76910400390625, "global_step": 284730, "epoch": 1694} {"train_loss": -11.932616233825684, "global_step": 284731, "epoch": 1694} {"train_loss": -11.842363357543945, "global_step": 284732, "epoch": 1694} {"train_loss": -11.8573637008667, "global_step": 284733, "epoch": 1694} {"train_loss": -12.142411231994629, "global_step": 284734, "epoch": 1694} {"train_loss": -11.36832332611084, "global_step": 284735, "epoch": 1694} {"train_loss": -11.96010971069336, "global_step": 284736, "epoch": 1694} {"train_loss": -11.811422348022461, "global_step": 284737, "epoch": 1694} {"train_loss": -11.43920612335205, "global_step": 284738, "epoch": 1694} {"train_loss": -11.894609451293945, "global_step": 284739, "epoch": 1694} {"train_loss": -11.387106895446777, "global_step": 284740, "epoch": 1694} {"train_loss": -11.818119049072266, "global_step": 284741, "epoch": 1694} {"train_loss": -11.495660781860352, "global_step": 284742, "epoch": 1694} {"train_loss": -11.444293975830078, "global_step": 284743, "epoch": 1694} {"train_loss": -10.952741622924805, "global_step": 284744, "epoch": 1694} {"train_loss": -12.011089324951172, "global_step": 284745, "epoch": 1694} {"train_loss": -11.139423370361328, "global_step": 284746, "epoch": 1694} {"train_loss": -11.479576110839844, "global_step": 284747, "epoch": 1694} {"train_loss": -11.088624954223633, "global_step": 284748, "epoch": 1694} {"train_loss": -11.91183853149414, "global_step": 284749, "epoch": 1694} {"train_loss": -11.025193214416504, "global_step": 284750, "epoch": 1694} {"train_loss": -10.843315124511719, "global_step": 284751, "epoch": 1694} {"train_loss": -10.833474159240723, "global_step": 284752, "epoch": 1694} {"train_loss": -10.870160102844238, "global_step": 284753, "epoch": 1694} {"train_loss": -12.014219284057617, "global_step": 284754, "epoch": 1694} {"train_loss": -11.120525360107422, "global_step": 284755, "epoch": 1694} {"train_loss": -11.635939598083496, "global_step": 284756, "epoch": 1694} {"train_loss": -11.429241180419922, "global_step": 284757, "epoch": 1694} {"train_loss": -11.161300659179688, "global_step": 284758, "epoch": 1694} {"train_loss": -11.692806487991696, "global_step": 284759, "epoch": 1694, "val_loss": 279307.34375} {"train_loss": -10.716146469116211, "global_step": 284760, "epoch": 1695} {"train_loss": -11.532098770141602, "global_step": 284761, "epoch": 1695} {"train_loss": -10.534900665283203, "global_step": 284762, "epoch": 1695} {"train_loss": -11.401338577270508, "global_step": 284763, "epoch": 1695} {"train_loss": -11.228129386901855, "global_step": 284764, "epoch": 1695} {"train_loss": -11.532060623168945, "global_step": 284765, "epoch": 1695} {"train_loss": -10.917545318603516, "global_step": 284766, "epoch": 1695} {"train_loss": -11.704289436340332, "global_step": 284767, "epoch": 1695} {"train_loss": -11.142909049987793, "global_step": 284768, "epoch": 1695} {"train_loss": -11.727104187011719, "global_step": 284769, "epoch": 1695} {"train_loss": -11.083035469055176, "global_step": 284770, "epoch": 1695} {"train_loss": -11.11121654510498, "global_step": 284771, "epoch": 1695} {"train_loss": -11.537252426147461, "global_step": 284772, "epoch": 1695} {"train_loss": -10.658343315124512, "global_step": 284773, "epoch": 1695} {"train_loss": -11.723483085632324, "global_step": 284774, "epoch": 1695} {"train_loss": -11.139565467834473, "global_step": 284775, "epoch": 1695} {"train_loss": -11.378774642944336, "global_step": 284776, "epoch": 1695} {"train_loss": -11.363075256347656, "global_step": 284777, "epoch": 1695} {"train_loss": -11.484430313110352, "global_step": 284778, "epoch": 1695} {"train_loss": -11.424861907958984, "global_step": 284779, "epoch": 1695} {"train_loss": -11.427047729492188, "global_step": 284780, "epoch": 1695} {"train_loss": -11.688875198364258, "global_step": 284781, "epoch": 1695} {"train_loss": -11.731229782104492, "global_step": 284782, "epoch": 1695} {"train_loss": -11.779243469238281, "global_step": 284783, "epoch": 1695} {"train_loss": -12.063882827758789, "global_step": 284784, "epoch": 1695} {"train_loss": -11.746833801269531, "global_step": 284785, "epoch": 1695} {"train_loss": -11.9238920211792, "global_step": 284786, "epoch": 1695} {"train_loss": -11.813179016113281, "global_step": 284787, "epoch": 1695} {"train_loss": -11.779556274414062, "global_step": 284788, "epoch": 1695} {"train_loss": -11.81925106048584, "global_step": 284789, "epoch": 1695} {"train_loss": -11.87066650390625, "global_step": 284790, "epoch": 1695} {"train_loss": -11.652785301208496, "global_step": 284791, "epoch": 1695} {"train_loss": -11.802582740783691, "global_step": 284792, "epoch": 1695} {"train_loss": -11.775754928588867, "global_step": 284793, "epoch": 1695} {"train_loss": -12.137168884277344, "global_step": 284794, "epoch": 1695} {"train_loss": -11.731878280639648, "global_step": 284795, "epoch": 1695} {"train_loss": -11.962514877319336, "global_step": 284796, "epoch": 1695} {"train_loss": -11.938547134399414, "global_step": 284797, "epoch": 1695} {"train_loss": -11.639001846313477, "global_step": 284798, "epoch": 1695} {"train_loss": -11.66301155090332, "global_step": 284799, "epoch": 1695} {"train_loss": -11.883052825927734, "global_step": 284800, "epoch": 1695} {"train_loss": -11.96358585357666, "global_step": 284801, "epoch": 1695} {"train_loss": -11.975982666015625, "global_step": 284802, "epoch": 1695} {"train_loss": -12.046884536743164, "global_step": 284803, "epoch": 1695} {"train_loss": -11.932611465454102, "global_step": 284804, "epoch": 1695} {"train_loss": -12.16343879699707, "global_step": 284805, "epoch": 1695} {"train_loss": -12.050661087036133, "global_step": 284806, "epoch": 1695} {"train_loss": -12.119009971618652, "global_step": 284807, "epoch": 1695} {"train_loss": -12.055556297302246, "global_step": 284808, "epoch": 1695} {"train_loss": -12.03476333618164, "global_step": 284809, "epoch": 1695} {"train_loss": -12.187238693237305, "global_step": 284810, "epoch": 1695} {"train_loss": -11.973567962646484, "global_step": 284811, "epoch": 1695} {"train_loss": -12.20711898803711, "global_step": 284812, "epoch": 1695} {"train_loss": -11.968870162963867, "global_step": 284813, "epoch": 1695} {"train_loss": -12.193929672241211, "global_step": 284814, "epoch": 1695} {"train_loss": -12.209760665893555, "global_step": 284815, "epoch": 1695} {"train_loss": -12.16246223449707, "global_step": 284816, "epoch": 1695} {"train_loss": -12.299833297729492, "global_step": 284817, "epoch": 1695} {"train_loss": -12.318181991577148, "global_step": 284818, "epoch": 1695} {"train_loss": -12.414556503295898, "global_step": 284819, "epoch": 1695} {"train_loss": -12.137462615966797, "global_step": 284820, "epoch": 1695} {"train_loss": -12.105533599853516, "global_step": 284821, "epoch": 1695} {"train_loss": -12.17657470703125, "global_step": 284822, "epoch": 1695} {"train_loss": -12.007135391235352, "global_step": 284823, "epoch": 1695} {"train_loss": -12.334446907043457, "global_step": 284824, "epoch": 1695} {"train_loss": -12.29621696472168, "global_step": 284825, "epoch": 1695} {"train_loss": -12.294576644897461, "global_step": 284826, "epoch": 1695} {"train_loss": -12.163200378417969, "global_step": 284827, "epoch": 1695} {"train_loss": -12.195061683654785, "global_step": 284828, "epoch": 1695} {"train_loss": -12.287436485290527, "global_step": 284829, "epoch": 1695} {"train_loss": -12.310708045959473, "global_step": 284830, "epoch": 1695} {"train_loss": -12.016098022460938, "global_step": 284831, "epoch": 1695} {"train_loss": -12.27098560333252, "global_step": 284832, "epoch": 1695} {"train_loss": -11.897359848022461, "global_step": 284833, "epoch": 1695} {"train_loss": -12.061336517333984, "global_step": 284834, "epoch": 1695} {"train_loss": -11.379825592041016, "global_step": 284835, "epoch": 1695} {"train_loss": -11.622828483581543, "global_step": 284836, "epoch": 1695} {"train_loss": -12.360363006591797, "global_step": 284837, "epoch": 1695} {"train_loss": -11.482126235961914, "global_step": 284838, "epoch": 1695} {"train_loss": -12.110986709594727, "global_step": 284839, "epoch": 1695} {"train_loss": -11.694551467895508, "global_step": 284840, "epoch": 1695} {"train_loss": -11.133125305175781, "global_step": 284841, "epoch": 1695} {"train_loss": -12.224052429199219, "global_step": 284842, "epoch": 1695} {"train_loss": -11.772899627685547, "global_step": 284843, "epoch": 1695} {"train_loss": -11.7640380859375, "global_step": 284844, "epoch": 1695} {"train_loss": -11.82443618774414, "global_step": 284845, "epoch": 1695} {"train_loss": -11.608551025390625, "global_step": 284846, "epoch": 1695} {"train_loss": -11.50288200378418, "global_step": 284847, "epoch": 1695} {"train_loss": -12.204626083374023, "global_step": 284848, "epoch": 1695} {"train_loss": -11.725286483764648, "global_step": 284849, "epoch": 1695} {"train_loss": -11.944425582885742, "global_step": 284850, "epoch": 1695} {"train_loss": -11.661520004272461, "global_step": 284851, "epoch": 1695} {"train_loss": -12.240789413452148, "global_step": 284852, "epoch": 1695} {"train_loss": -11.884572982788086, "global_step": 284853, "epoch": 1695} {"train_loss": -12.384235382080078, "global_step": 284854, "epoch": 1695} {"train_loss": -12.026895523071289, "global_step": 284855, "epoch": 1695} {"train_loss": -12.300415992736816, "global_step": 284856, "epoch": 1695} {"train_loss": -12.013309478759766, "global_step": 284857, "epoch": 1695} {"train_loss": -12.262933731079102, "global_step": 284858, "epoch": 1695} {"train_loss": -12.154464721679688, "global_step": 284859, "epoch": 1695} {"train_loss": -12.087835311889648, "global_step": 284860, "epoch": 1695} {"train_loss": -11.942477226257324, "global_step": 284861, "epoch": 1695} {"train_loss": -12.296335220336914, "global_step": 284862, "epoch": 1695} {"train_loss": -12.269367218017578, "global_step": 284863, "epoch": 1695} {"train_loss": -12.166675567626953, "global_step": 284864, "epoch": 1695} {"train_loss": -11.990045547485352, "global_step": 284865, "epoch": 1695} {"train_loss": -12.367853164672852, "global_step": 284866, "epoch": 1695} {"train_loss": -11.872803688049316, "global_step": 284867, "epoch": 1695} {"train_loss": -12.243457794189453, "global_step": 284868, "epoch": 1695} {"train_loss": -11.666793823242188, "global_step": 284869, "epoch": 1695} {"train_loss": -11.875514030456543, "global_step": 284870, "epoch": 1695} {"train_loss": -11.842267990112305, "global_step": 284871, "epoch": 1695} {"train_loss": -12.340372085571289, "global_step": 284872, "epoch": 1695} {"train_loss": -12.170502662658691, "global_step": 284873, "epoch": 1695} {"train_loss": -12.05274772644043, "global_step": 284874, "epoch": 1695} {"train_loss": -12.135391235351562, "global_step": 284875, "epoch": 1695} {"train_loss": -12.071380615234375, "global_step": 284876, "epoch": 1695} {"train_loss": -11.864706993103027, "global_step": 284877, "epoch": 1695} {"train_loss": -12.277374267578125, "global_step": 284878, "epoch": 1695} {"train_loss": -12.058016777038574, "global_step": 284879, "epoch": 1695} {"train_loss": -11.372184753417969, "global_step": 284880, "epoch": 1695} {"train_loss": -11.682363510131836, "global_step": 284881, "epoch": 1695} {"train_loss": -11.832603454589844, "global_step": 284882, "epoch": 1695} {"train_loss": -10.598724365234375, "global_step": 284883, "epoch": 1695} {"train_loss": -11.361988067626953, "global_step": 284884, "epoch": 1695} {"train_loss": -11.905111312866211, "global_step": 284885, "epoch": 1695} {"train_loss": -10.960881233215332, "global_step": 284886, "epoch": 1695} {"train_loss": -11.7264404296875, "global_step": 284887, "epoch": 1695} {"train_loss": -11.563024520874023, "global_step": 284888, "epoch": 1695} {"train_loss": -12.028595924377441, "global_step": 284889, "epoch": 1695} {"train_loss": -11.975360870361328, "global_step": 284890, "epoch": 1695} {"train_loss": -11.869271278381348, "global_step": 284891, "epoch": 1695} {"train_loss": -11.892141342163086, "global_step": 284892, "epoch": 1695} {"train_loss": -11.565288543701172, "global_step": 284893, "epoch": 1695} {"train_loss": -11.155635833740234, "global_step": 284894, "epoch": 1695} {"train_loss": -11.224971771240234, "global_step": 284895, "epoch": 1695} {"train_loss": -11.68404483795166, "global_step": 284896, "epoch": 1695} {"train_loss": -11.687667846679688, "global_step": 284897, "epoch": 1695} {"train_loss": -11.346169471740723, "global_step": 284898, "epoch": 1695} {"train_loss": -11.998273849487305, "global_step": 284899, "epoch": 1695} {"train_loss": -11.54779052734375, "global_step": 284900, "epoch": 1695} {"train_loss": -11.76606559753418, "global_step": 284901, "epoch": 1695} {"train_loss": -11.661523818969727, "global_step": 284902, "epoch": 1695} {"train_loss": -11.408121109008789, "global_step": 284903, "epoch": 1695} {"train_loss": -11.914957046508789, "global_step": 284904, "epoch": 1695} {"train_loss": -11.12060832977295, "global_step": 284905, "epoch": 1695} {"train_loss": -11.339583396911621, "global_step": 284906, "epoch": 1695} {"train_loss": -11.760986328125, "global_step": 284907, "epoch": 1695} {"train_loss": -11.507791519165039, "global_step": 284908, "epoch": 1695} {"train_loss": -11.815742492675781, "global_step": 284909, "epoch": 1695} {"train_loss": -11.820022583007812, "global_step": 284910, "epoch": 1695} {"train_loss": -10.648639678955078, "global_step": 284911, "epoch": 1695} {"train_loss": -12.003072738647461, "global_step": 284912, "epoch": 1695} {"train_loss": -11.176219940185547, "global_step": 284913, "epoch": 1695} {"train_loss": -11.459196090698242, "global_step": 284914, "epoch": 1695} {"train_loss": -11.429805755615234, "global_step": 284915, "epoch": 1695} {"train_loss": -11.69746208190918, "global_step": 284916, "epoch": 1695} {"train_loss": -11.726112365722656, "global_step": 284917, "epoch": 1695} {"train_loss": -11.55497932434082, "global_step": 284918, "epoch": 1695} {"train_loss": -11.34621810913086, "global_step": 284919, "epoch": 1695} {"train_loss": -11.229752540588379, "global_step": 284920, "epoch": 1695} {"train_loss": -11.295613288879395, "global_step": 284921, "epoch": 1695} {"train_loss": -11.365852355957031, "global_step": 284922, "epoch": 1695} {"train_loss": -11.008994102478027, "global_step": 284923, "epoch": 1695} {"train_loss": -11.763395309448242, "global_step": 284924, "epoch": 1695} {"train_loss": -10.640271186828613, "global_step": 284925, "epoch": 1695} {"train_loss": -11.187588691711426, "global_step": 284926, "epoch": 1695} {"train_loss": -11.764866931097847, "global_step": 284927, "epoch": 1695, "val_loss": 276769.1875, "train_action_mse_error": 0.9981558322906494} {"train_loss": -11.038403511047363, "global_step": 284928, "epoch": 1696} {"train_loss": -11.138832092285156, "global_step": 284929, "epoch": 1696} {"train_loss": -10.766193389892578, "global_step": 284930, "epoch": 1696} {"train_loss": -11.424615859985352, "global_step": 284931, "epoch": 1696} {"train_loss": -10.544858932495117, "global_step": 284932, "epoch": 1696} {"train_loss": -11.293283462524414, "global_step": 284933, "epoch": 1696} {"train_loss": -11.08094310760498, "global_step": 284934, "epoch": 1696} {"train_loss": -11.080108642578125, "global_step": 284935, "epoch": 1696} {"train_loss": -11.103364944458008, "global_step": 284936, "epoch": 1696} {"train_loss": -11.9915771484375, "global_step": 284937, "epoch": 1696} {"train_loss": -10.893592834472656, "global_step": 284938, "epoch": 1696} {"train_loss": -11.518827438354492, "global_step": 284939, "epoch": 1696} {"train_loss": -10.9810152053833, "global_step": 284940, "epoch": 1696} {"train_loss": -11.412236213684082, "global_step": 284941, "epoch": 1696} {"train_loss": -11.255622863769531, "global_step": 284942, "epoch": 1696} {"train_loss": -11.480677604675293, "global_step": 284943, "epoch": 1696} {"train_loss": -11.045841217041016, "global_step": 284944, "epoch": 1696} {"train_loss": -11.418333053588867, "global_step": 284945, "epoch": 1696} {"train_loss": -10.8153657913208, "global_step": 284946, "epoch": 1696} {"train_loss": -11.100065231323242, "global_step": 284947, "epoch": 1696} {"train_loss": -10.942353248596191, "global_step": 284948, "epoch": 1696} {"train_loss": -11.416070938110352, "global_step": 284949, "epoch": 1696} {"train_loss": -11.312849044799805, "global_step": 284950, "epoch": 1696} {"train_loss": -11.709693908691406, "global_step": 284951, "epoch": 1696} {"train_loss": -11.392166137695312, "global_step": 284952, "epoch": 1696} {"train_loss": -11.507262229919434, "global_step": 284953, "epoch": 1696} {"train_loss": -11.325927734375, "global_step": 284954, "epoch": 1696} {"train_loss": -11.619025230407715, "global_step": 284955, "epoch": 1696} {"train_loss": -11.45273494720459, "global_step": 284956, "epoch": 1696} {"train_loss": -11.494771003723145, "global_step": 284957, "epoch": 1696} {"train_loss": -11.504677772521973, "global_step": 284958, "epoch": 1696} {"train_loss": -11.56476879119873, "global_step": 284959, "epoch": 1696} {"train_loss": -11.502059936523438, "global_step": 284960, "epoch": 1696} {"train_loss": -11.713188171386719, "global_step": 284961, "epoch": 1696} {"train_loss": -11.958915710449219, "global_step": 284962, "epoch": 1696} {"train_loss": -11.502307891845703, "global_step": 284963, "epoch": 1696} {"train_loss": -11.89242935180664, "global_step": 284964, "epoch": 1696} {"train_loss": -11.500141143798828, "global_step": 284965, "epoch": 1696} {"train_loss": -11.985759735107422, "global_step": 284966, "epoch": 1696} {"train_loss": -11.336164474487305, "global_step": 284967, "epoch": 1696} {"train_loss": -11.691795349121094, "global_step": 284968, "epoch": 1696} {"train_loss": -11.89295768737793, "global_step": 284969, "epoch": 1696} {"train_loss": -11.73616886138916, "global_step": 284970, "epoch": 1696} {"train_loss": -11.702326774597168, "global_step": 284971, "epoch": 1696} {"train_loss": -11.795051574707031, "global_step": 284972, "epoch": 1696} {"train_loss": -11.902414321899414, "global_step": 284973, "epoch": 1696} {"train_loss": -11.667393684387207, "global_step": 284974, "epoch": 1696} {"train_loss": -12.087119102478027, "global_step": 284975, "epoch": 1696} {"train_loss": -11.828545570373535, "global_step": 284976, "epoch": 1696} {"train_loss": -12.039772987365723, "global_step": 284977, "epoch": 1696} {"train_loss": -11.967178344726562, "global_step": 284978, "epoch": 1696} {"train_loss": -12.184412956237793, "global_step": 284979, "epoch": 1696} {"train_loss": -12.015533447265625, "global_step": 284980, "epoch": 1696} {"train_loss": -12.038427352905273, "global_step": 284981, "epoch": 1696} {"train_loss": -12.032564163208008, "global_step": 284982, "epoch": 1696} {"train_loss": -12.078617095947266, "global_step": 284983, "epoch": 1696} {"train_loss": -11.96816635131836, "global_step": 284984, "epoch": 1696} {"train_loss": -12.114204406738281, "global_step": 284985, "epoch": 1696} {"train_loss": -11.838228225708008, "global_step": 284986, "epoch": 1696} {"train_loss": -12.063018798828125, "global_step": 284987, "epoch": 1696} {"train_loss": -12.212810516357422, "global_step": 284988, "epoch": 1696} {"train_loss": -12.029443740844727, "global_step": 284989, "epoch": 1696} {"train_loss": -12.076643943786621, "global_step": 284990, "epoch": 1696} {"train_loss": -11.956174850463867, "global_step": 284991, "epoch": 1696} {"train_loss": -11.998420715332031, "global_step": 284992, "epoch": 1696} {"train_loss": -12.063243865966797, "global_step": 284993, "epoch": 1696} {"train_loss": -12.165283203125, "global_step": 284994, "epoch": 1696} {"train_loss": -12.192632675170898, "global_step": 284995, "epoch": 1696} {"train_loss": -12.008386611938477, "global_step": 284996, "epoch": 1696} {"train_loss": -12.021987915039062, "global_step": 284997, "epoch": 1696} {"train_loss": -11.979546546936035, "global_step": 284998, "epoch": 1696} {"train_loss": -12.343267440795898, "global_step": 284999, "epoch": 1696} {"train_loss": -11.829235076904297, "global_step": 285000, "epoch": 1696} {"train_loss": -12.262866020202637, "global_step": 285001, "epoch": 1696} {"train_loss": -12.084074020385742, "global_step": 285002, "epoch": 1696} {"train_loss": -11.996212005615234, "global_step": 285003, "epoch": 1696} {"train_loss": -11.999861717224121, "global_step": 285004, "epoch": 1696} {"train_loss": -12.21293830871582, "global_step": 285005, "epoch": 1696} {"train_loss": -12.085262298583984, "global_step": 285006, "epoch": 1696} {"train_loss": -11.948525428771973, "global_step": 285007, "epoch": 1696} {"train_loss": -12.314146041870117, "global_step": 285008, "epoch": 1696} {"train_loss": -12.173704147338867, "global_step": 285009, "epoch": 1696} {"train_loss": -11.694769859313965, "global_step": 285010, "epoch": 1696} {"train_loss": -11.99401569366455, "global_step": 285011, "epoch": 1696} {"train_loss": -12.141059875488281, "global_step": 285012, "epoch": 1696} {"train_loss": -12.083487510681152, "global_step": 285013, "epoch": 1696} {"train_loss": -11.77418041229248, "global_step": 285014, "epoch": 1696} {"train_loss": -11.828193664550781, "global_step": 285015, "epoch": 1696} {"train_loss": -11.833931922912598, "global_step": 285016, "epoch": 1696} {"train_loss": -12.20419692993164, "global_step": 285017, "epoch": 1696} {"train_loss": -12.135960578918457, "global_step": 285018, "epoch": 1696} {"train_loss": -11.755067825317383, "global_step": 285019, "epoch": 1696} {"train_loss": -11.994952201843262, "global_step": 285020, "epoch": 1696} {"train_loss": -11.894048690795898, "global_step": 285021, "epoch": 1696} {"train_loss": -11.683094024658203, "global_step": 285022, "epoch": 1696} {"train_loss": -11.726905822753906, "global_step": 285023, "epoch": 1696} {"train_loss": -12.10287094116211, "global_step": 285024, "epoch": 1696} {"train_loss": -12.113332748413086, "global_step": 285025, "epoch": 1696} {"train_loss": -11.816141128540039, "global_step": 285026, "epoch": 1696} {"train_loss": -12.095417022705078, "global_step": 285027, "epoch": 1696} {"train_loss": -11.474523544311523, "global_step": 285028, "epoch": 1696} {"train_loss": -11.67171573638916, "global_step": 285029, "epoch": 1696} {"train_loss": -12.352621078491211, "global_step": 285030, "epoch": 1696} {"train_loss": -11.765523910522461, "global_step": 285031, "epoch": 1696} {"train_loss": -12.00645637512207, "global_step": 285032, "epoch": 1696} {"train_loss": -12.128093719482422, "global_step": 285033, "epoch": 1696} {"train_loss": -11.993570327758789, "global_step": 285034, "epoch": 1696} {"train_loss": -12.415924072265625, "global_step": 285035, "epoch": 1696} {"train_loss": -12.046224594116211, "global_step": 285036, "epoch": 1696} {"train_loss": -11.894669532775879, "global_step": 285037, "epoch": 1696} {"train_loss": -12.240946769714355, "global_step": 285038, "epoch": 1696} {"train_loss": -11.635149955749512, "global_step": 285039, "epoch": 1696} {"train_loss": -11.97046184539795, "global_step": 285040, "epoch": 1696} {"train_loss": -12.098518371582031, "global_step": 285041, "epoch": 1696} {"train_loss": -12.288045883178711, "global_step": 285042, "epoch": 1696} {"train_loss": -12.00403118133545, "global_step": 285043, "epoch": 1696} {"train_loss": -12.082050323486328, "global_step": 285044, "epoch": 1696} {"train_loss": -11.907291412353516, "global_step": 285045, "epoch": 1696} {"train_loss": -12.069486618041992, "global_step": 285046, "epoch": 1696} {"train_loss": -12.280094146728516, "global_step": 285047, "epoch": 1696} {"train_loss": -12.10030746459961, "global_step": 285048, "epoch": 1696} {"train_loss": -12.152482986450195, "global_step": 285049, "epoch": 1696} {"train_loss": -12.371600151062012, "global_step": 285050, "epoch": 1696} {"train_loss": -12.01565170288086, "global_step": 285051, "epoch": 1696} {"train_loss": -12.189281463623047, "global_step": 285052, "epoch": 1696} {"train_loss": -12.146480560302734, "global_step": 285053, "epoch": 1696} {"train_loss": -11.471696853637695, "global_step": 285054, "epoch": 1696} {"train_loss": -11.236383438110352, "global_step": 285055, "epoch": 1696} {"train_loss": -11.865747451782227, "global_step": 285056, "epoch": 1696} {"train_loss": -11.899630546569824, "global_step": 285057, "epoch": 1696} {"train_loss": -11.278335571289062, "global_step": 285058, "epoch": 1696} {"train_loss": -11.89864730834961, "global_step": 285059, "epoch": 1696} {"train_loss": -10.980049133300781, "global_step": 285060, "epoch": 1696} {"train_loss": -11.834699630737305, "global_step": 285061, "epoch": 1696} {"train_loss": -11.449856758117676, "global_step": 285062, "epoch": 1696} {"train_loss": -12.044734954833984, "global_step": 285063, "epoch": 1696} {"train_loss": -11.219013214111328, "global_step": 285064, "epoch": 1696} {"train_loss": -11.831825256347656, "global_step": 285065, "epoch": 1696} {"train_loss": -10.83001708984375, "global_step": 285066, "epoch": 1696} {"train_loss": -10.691282272338867, "global_step": 285067, "epoch": 1696} {"train_loss": -11.4071683883667, "global_step": 285068, "epoch": 1696} {"train_loss": -11.303325653076172, "global_step": 285069, "epoch": 1696} {"train_loss": -10.996052742004395, "global_step": 285070, "epoch": 1696} {"train_loss": -11.230789184570312, "global_step": 285071, "epoch": 1696} {"train_loss": -10.825316429138184, "global_step": 285072, "epoch": 1696} {"train_loss": -11.326332092285156, "global_step": 285073, "epoch": 1696} {"train_loss": -10.854682922363281, "global_step": 285074, "epoch": 1696} {"train_loss": -10.188629150390625, "global_step": 285075, "epoch": 1696} {"train_loss": -11.360326766967773, "global_step": 285076, "epoch": 1696} {"train_loss": -10.412100791931152, "global_step": 285077, "epoch": 1696} {"train_loss": -11.794565200805664, "global_step": 285078, "epoch": 1696} {"train_loss": -11.422826766967773, "global_step": 285079, "epoch": 1696} {"train_loss": -11.596589088439941, "global_step": 285080, "epoch": 1696} {"train_loss": -11.619810104370117, "global_step": 285081, "epoch": 1696} {"train_loss": -11.937542915344238, "global_step": 285082, "epoch": 1696} {"train_loss": -11.303316116333008, "global_step": 285083, "epoch": 1696} {"train_loss": -11.825672149658203, "global_step": 285084, "epoch": 1696} {"train_loss": -11.364297866821289, "global_step": 285085, "epoch": 1696} {"train_loss": -11.710878372192383, "global_step": 285086, "epoch": 1696} {"train_loss": -11.538488388061523, "global_step": 285087, "epoch": 1696} {"train_loss": -11.27894401550293, "global_step": 285088, "epoch": 1696} {"train_loss": -11.86831283569336, "global_step": 285089, "epoch": 1696} {"train_loss": -11.317974090576172, "global_step": 285090, "epoch": 1696} {"train_loss": -11.749104499816895, "global_step": 285091, "epoch": 1696} {"train_loss": -11.325111389160156, "global_step": 285092, "epoch": 1696} {"train_loss": -11.926912307739258, "global_step": 285093, "epoch": 1696} {"train_loss": -11.413891792297363, "global_step": 285094, "epoch": 1696} {"train_loss": -11.704258430571784, "global_step": 285095, "epoch": 1696, "val_loss": 277701.84375} {"train_loss": -11.918598175048828, "global_step": 285096, "epoch": 1697} {"train_loss": -11.691609382629395, "global_step": 285097, "epoch": 1697} {"train_loss": -11.844478607177734, "global_step": 285098, "epoch": 1697} {"train_loss": -11.828861236572266, "global_step": 285099, "epoch": 1697} {"train_loss": -11.920690536499023, "global_step": 285100, "epoch": 1697} {"train_loss": -11.831300735473633, "global_step": 285101, "epoch": 1697} {"train_loss": -11.767611503601074, "global_step": 285102, "epoch": 1697} {"train_loss": -11.653536796569824, "global_step": 285103, "epoch": 1697} {"train_loss": -12.095518112182617, "global_step": 285104, "epoch": 1697} {"train_loss": -11.613876342773438, "global_step": 285105, "epoch": 1697} {"train_loss": -12.122699737548828, "global_step": 285106, "epoch": 1697} {"train_loss": -11.71877670288086, "global_step": 285107, "epoch": 1697} {"train_loss": -11.771748542785645, "global_step": 285108, "epoch": 1697} {"train_loss": -11.680912017822266, "global_step": 285109, "epoch": 1697} {"train_loss": -11.543645858764648, "global_step": 285110, "epoch": 1697} {"train_loss": -11.482111930847168, "global_step": 285111, "epoch": 1697} {"train_loss": -11.147013664245605, "global_step": 285112, "epoch": 1697} {"train_loss": -12.117044448852539, "global_step": 285113, "epoch": 1697} {"train_loss": -11.65731430053711, "global_step": 285114, "epoch": 1697} {"train_loss": -12.065987586975098, "global_step": 285115, "epoch": 1697} {"train_loss": -11.790566444396973, "global_step": 285116, "epoch": 1697} {"train_loss": -11.699479103088379, "global_step": 285117, "epoch": 1697} {"train_loss": -12.129155158996582, "global_step": 285118, "epoch": 1697} {"train_loss": -11.679222106933594, "global_step": 285119, "epoch": 1697} {"train_loss": -12.122903823852539, "global_step": 285120, "epoch": 1697} {"train_loss": -11.99199390411377, "global_step": 285121, "epoch": 1697} {"train_loss": -11.41915512084961, "global_step": 285122, "epoch": 1697} {"train_loss": -11.905570030212402, "global_step": 285123, "epoch": 1697} {"train_loss": -11.405718803405762, "global_step": 285124, "epoch": 1697} {"train_loss": -10.971933364868164, "global_step": 285125, "epoch": 1697} {"train_loss": -10.789581298828125, "global_step": 285126, "epoch": 1697} {"train_loss": -10.405975341796875, "global_step": 285127, "epoch": 1697} {"train_loss": -11.652032852172852, "global_step": 285128, "epoch": 1697} {"train_loss": -11.008177757263184, "global_step": 285129, "epoch": 1697} {"train_loss": -11.17341136932373, "global_step": 285130, "epoch": 1697} {"train_loss": -11.790369987487793, "global_step": 285131, "epoch": 1697} {"train_loss": -11.173834800720215, "global_step": 285132, "epoch": 1697} {"train_loss": -11.669498443603516, "global_step": 285133, "epoch": 1697} {"train_loss": -11.630064010620117, "global_step": 285134, "epoch": 1697} {"train_loss": -11.783002853393555, "global_step": 285135, "epoch": 1697} {"train_loss": -11.669300079345703, "global_step": 285136, "epoch": 1697} {"train_loss": -11.694344520568848, "global_step": 285137, "epoch": 1697} {"train_loss": -11.542684555053711, "global_step": 285138, "epoch": 1697} {"train_loss": -11.999786376953125, "global_step": 285139, "epoch": 1697} {"train_loss": -11.99306869506836, "global_step": 285140, "epoch": 1697} {"train_loss": -11.859140396118164, "global_step": 285141, "epoch": 1697} {"train_loss": -12.026369094848633, "global_step": 285142, "epoch": 1697} {"train_loss": -12.110831260681152, "global_step": 285143, "epoch": 1697} {"train_loss": -12.279807090759277, "global_step": 285144, "epoch": 1697} {"train_loss": -12.22629165649414, "global_step": 285145, "epoch": 1697} {"train_loss": -12.123393058776855, "global_step": 285146, "epoch": 1697} {"train_loss": -12.265267372131348, "global_step": 285147, "epoch": 1697} {"train_loss": -11.928302764892578, "global_step": 285148, "epoch": 1697} {"train_loss": -12.155991554260254, "global_step": 285149, "epoch": 1697} {"train_loss": -12.175101280212402, "global_step": 285150, "epoch": 1697} {"train_loss": -12.280256271362305, "global_step": 285151, "epoch": 1697} {"train_loss": -12.288395881652832, "global_step": 285152, "epoch": 1697} {"train_loss": -12.2841796875, "global_step": 285153, "epoch": 1697} {"train_loss": -12.262544631958008, "global_step": 285154, "epoch": 1697} {"train_loss": -12.247480392456055, "global_step": 285155, "epoch": 1697} {"train_loss": -12.474695205688477, "global_step": 285156, "epoch": 1697} {"train_loss": -12.203316688537598, "global_step": 285157, "epoch": 1697} {"train_loss": -12.134368896484375, "global_step": 285158, "epoch": 1697} {"train_loss": -12.239376068115234, "global_step": 285159, "epoch": 1697} {"train_loss": -12.269027709960938, "global_step": 285160, "epoch": 1697} {"train_loss": -12.090362548828125, "global_step": 285161, "epoch": 1697} {"train_loss": -12.364269256591797, "global_step": 285162, "epoch": 1697} {"train_loss": -12.367034912109375, "global_step": 285163, "epoch": 1697} {"train_loss": -12.187782287597656, "global_step": 285164, "epoch": 1697} {"train_loss": -12.305289268493652, "global_step": 285165, "epoch": 1697} {"train_loss": -12.168588638305664, "global_step": 285166, "epoch": 1697} {"train_loss": -12.071765899658203, "global_step": 285167, "epoch": 1697} {"train_loss": -11.647666931152344, "global_step": 285168, "epoch": 1697} {"train_loss": -12.352079391479492, "global_step": 285169, "epoch": 1697} {"train_loss": -11.970071792602539, "global_step": 285170, "epoch": 1697} {"train_loss": -12.329795837402344, "global_step": 285171, "epoch": 1697} {"train_loss": -12.213217735290527, "global_step": 285172, "epoch": 1697} {"train_loss": -12.27734375, "global_step": 285173, "epoch": 1697} {"train_loss": -11.897443771362305, "global_step": 285174, "epoch": 1697} {"train_loss": -12.123348236083984, "global_step": 285175, "epoch": 1697} {"train_loss": -12.106809616088867, "global_step": 285176, "epoch": 1697} {"train_loss": -12.200576782226562, "global_step": 285177, "epoch": 1697} {"train_loss": -11.859240531921387, "global_step": 285178, "epoch": 1697} {"train_loss": -12.258699417114258, "global_step": 285179, "epoch": 1697} {"train_loss": -12.200077056884766, "global_step": 285180, "epoch": 1697} {"train_loss": -11.865238189697266, "global_step": 285181, "epoch": 1697} {"train_loss": -11.885982513427734, "global_step": 285182, "epoch": 1697} {"train_loss": -11.81622314453125, "global_step": 285183, "epoch": 1697} {"train_loss": -11.396720886230469, "global_step": 285184, "epoch": 1697} {"train_loss": -12.111241340637207, "global_step": 285185, "epoch": 1697} {"train_loss": -11.514366149902344, "global_step": 285186, "epoch": 1697} {"train_loss": -11.215082168579102, "global_step": 285187, "epoch": 1697} {"train_loss": -11.931488037109375, "global_step": 285188, "epoch": 1697} {"train_loss": -11.646648406982422, "global_step": 285189, "epoch": 1697} {"train_loss": -11.745922088623047, "global_step": 285190, "epoch": 1697} {"train_loss": -11.903738021850586, "global_step": 285191, "epoch": 1697} {"train_loss": -11.418248176574707, "global_step": 285192, "epoch": 1697} {"train_loss": -11.869296073913574, "global_step": 285193, "epoch": 1697} {"train_loss": -11.683414459228516, "global_step": 285194, "epoch": 1697} {"train_loss": -10.856552124023438, "global_step": 285195, "epoch": 1697} {"train_loss": -11.83364486694336, "global_step": 285196, "epoch": 1697} {"train_loss": -10.81541633605957, "global_step": 285197, "epoch": 1697} {"train_loss": -11.707762718200684, "global_step": 285198, "epoch": 1697} {"train_loss": -11.280763626098633, "global_step": 285199, "epoch": 1697} {"train_loss": -11.443400382995605, "global_step": 285200, "epoch": 1697} {"train_loss": -11.844383239746094, "global_step": 285201, "epoch": 1697} {"train_loss": -11.912946701049805, "global_step": 285202, "epoch": 1697} {"train_loss": -11.600776672363281, "global_step": 285203, "epoch": 1697} {"train_loss": -11.833243370056152, "global_step": 285204, "epoch": 1697} {"train_loss": -12.054665565490723, "global_step": 285205, "epoch": 1697} {"train_loss": -11.72964096069336, "global_step": 285206, "epoch": 1697} {"train_loss": -12.197484970092773, "global_step": 285207, "epoch": 1697} {"train_loss": -11.857463836669922, "global_step": 285208, "epoch": 1697} {"train_loss": -12.335285186767578, "global_step": 285209, "epoch": 1697} {"train_loss": -12.089315414428711, "global_step": 285210, "epoch": 1697} {"train_loss": -12.269177436828613, "global_step": 285211, "epoch": 1697} {"train_loss": -12.010900497436523, "global_step": 285212, "epoch": 1697} {"train_loss": -12.34561538696289, "global_step": 285213, "epoch": 1697} {"train_loss": -12.190560340881348, "global_step": 285214, "epoch": 1697} {"train_loss": -12.241691589355469, "global_step": 285215, "epoch": 1697} {"train_loss": -12.440119743347168, "global_step": 285216, "epoch": 1697} {"train_loss": -12.371803283691406, "global_step": 285217, "epoch": 1697} {"train_loss": -12.345069885253906, "global_step": 285218, "epoch": 1697} {"train_loss": -12.394434928894043, "global_step": 285219, "epoch": 1697} {"train_loss": -12.254522323608398, "global_step": 285220, "epoch": 1697} {"train_loss": -12.172712326049805, "global_step": 285221, "epoch": 1697} {"train_loss": -12.384766578674316, "global_step": 285222, "epoch": 1697} {"train_loss": -12.229911804199219, "global_step": 285223, "epoch": 1697} {"train_loss": -12.41878890991211, "global_step": 285224, "epoch": 1697} {"train_loss": -12.384765625, "global_step": 285225, "epoch": 1697} {"train_loss": -12.298919677734375, "global_step": 285226, "epoch": 1697} {"train_loss": -11.623326301574707, "global_step": 285227, "epoch": 1697} {"train_loss": -11.424314498901367, "global_step": 285228, "epoch": 1697} {"train_loss": -11.948976516723633, "global_step": 285229, "epoch": 1697} {"train_loss": -12.372613906860352, "global_step": 285230, "epoch": 1697} {"train_loss": -11.332706451416016, "global_step": 285231, "epoch": 1697} {"train_loss": -12.03346061706543, "global_step": 285232, "epoch": 1697} {"train_loss": -11.529025077819824, "global_step": 285233, "epoch": 1697} {"train_loss": -11.400945663452148, "global_step": 285234, "epoch": 1697} {"train_loss": -11.298181533813477, "global_step": 285235, "epoch": 1697} {"train_loss": -11.135847091674805, "global_step": 285236, "epoch": 1697} {"train_loss": -11.060005187988281, "global_step": 285237, "epoch": 1697} {"train_loss": -11.286794662475586, "global_step": 285238, "epoch": 1697} {"train_loss": -11.432969093322754, "global_step": 285239, "epoch": 1697} {"train_loss": -10.695194244384766, "global_step": 285240, "epoch": 1697} {"train_loss": -12.0308256149292, "global_step": 285241, "epoch": 1697} {"train_loss": -10.846782684326172, "global_step": 285242, "epoch": 1697} {"train_loss": -11.455221176147461, "global_step": 285243, "epoch": 1697} {"train_loss": -11.60360336303711, "global_step": 285244, "epoch": 1697} {"train_loss": -11.417670249938965, "global_step": 285245, "epoch": 1697} {"train_loss": -10.884845733642578, "global_step": 285246, "epoch": 1697} {"train_loss": -10.528556823730469, "global_step": 285247, "epoch": 1697} {"train_loss": -12.020546913146973, "global_step": 285248, "epoch": 1697} {"train_loss": -10.657676696777344, "global_step": 285249, "epoch": 1697} {"train_loss": -11.334747314453125, "global_step": 285250, "epoch": 1697} {"train_loss": -10.562843322753906, "global_step": 285251, "epoch": 1697} {"train_loss": -9.553118705749512, "global_step": 285252, "epoch": 1697} {"train_loss": -10.012288093566895, "global_step": 285253, "epoch": 1697} {"train_loss": -10.304950714111328, "global_step": 285254, "epoch": 1697} {"train_loss": -9.064329147338867, "global_step": 285255, "epoch": 1697} {"train_loss": -9.19073486328125, "global_step": 285256, "epoch": 1697} {"train_loss": -11.228761672973633, "global_step": 285257, "epoch": 1697} {"train_loss": -8.923624992370605, "global_step": 285258, "epoch": 1697} {"train_loss": -10.7884521484375, "global_step": 285259, "epoch": 1697} {"train_loss": -8.318451881408691, "global_step": 285260, "epoch": 1697} {"train_loss": -9.52912712097168, "global_step": 285261, "epoch": 1697} {"train_loss": -9.555074691772461, "global_step": 285262, "epoch": 1697} {"train_loss": -11.672102996281215, "global_step": 285263, "epoch": 1697, "val_loss": 276548.5625} {"train_loss": -9.52634048461914, "global_step": 285264, "epoch": 1698} {"train_loss": -10.17255687713623, "global_step": 285265, "epoch": 1698} {"train_loss": -10.790213584899902, "global_step": 285266, "epoch": 1698} {"train_loss": -10.100784301757812, "global_step": 285267, "epoch": 1698} {"train_loss": -11.286211013793945, "global_step": 285268, "epoch": 1698} {"train_loss": -10.123503684997559, "global_step": 285269, "epoch": 1698} {"train_loss": -11.10930061340332, "global_step": 285270, "epoch": 1698} {"train_loss": -10.927431106567383, "global_step": 285271, "epoch": 1698} {"train_loss": -11.540457725524902, "global_step": 285272, "epoch": 1698} {"train_loss": -11.016551971435547, "global_step": 285273, "epoch": 1698} {"train_loss": -11.434346199035645, "global_step": 285274, "epoch": 1698} {"train_loss": -11.124715805053711, "global_step": 285275, "epoch": 1698} {"train_loss": -11.418530464172363, "global_step": 285276, "epoch": 1698} {"train_loss": -11.167095184326172, "global_step": 285277, "epoch": 1698} {"train_loss": -11.495904922485352, "global_step": 285278, "epoch": 1698} {"train_loss": -11.556682586669922, "global_step": 285279, "epoch": 1698} {"train_loss": -11.149166107177734, "global_step": 285280, "epoch": 1698} {"train_loss": -11.477745056152344, "global_step": 285281, "epoch": 1698} {"train_loss": -11.537612915039062, "global_step": 285282, "epoch": 1698} {"train_loss": -11.568178176879883, "global_step": 285283, "epoch": 1698} {"train_loss": -11.632894515991211, "global_step": 285284, "epoch": 1698} {"train_loss": -11.682130813598633, "global_step": 285285, "epoch": 1698} {"train_loss": -11.557340621948242, "global_step": 285286, "epoch": 1698} {"train_loss": -11.382009506225586, "global_step": 285287, "epoch": 1698} {"train_loss": -11.864307403564453, "global_step": 285288, "epoch": 1698} {"train_loss": -11.098651885986328, "global_step": 285289, "epoch": 1698} {"train_loss": -11.829309463500977, "global_step": 285290, "epoch": 1698} {"train_loss": -11.50035572052002, "global_step": 285291, "epoch": 1698} {"train_loss": -11.562824249267578, "global_step": 285292, "epoch": 1698} {"train_loss": -11.462200164794922, "global_step": 285293, "epoch": 1698} {"train_loss": -11.651521682739258, "global_step": 285294, "epoch": 1698} {"train_loss": -11.638384819030762, "global_step": 285295, "epoch": 1698} {"train_loss": -11.77754020690918, "global_step": 285296, "epoch": 1698} {"train_loss": -11.819543838500977, "global_step": 285297, "epoch": 1698} {"train_loss": -11.835119247436523, "global_step": 285298, "epoch": 1698} {"train_loss": -12.024847984313965, "global_step": 285299, "epoch": 1698} {"train_loss": -11.917729377746582, "global_step": 285300, "epoch": 1698} {"train_loss": -12.07217788696289, "global_step": 285301, "epoch": 1698} {"train_loss": -12.058464050292969, "global_step": 285302, "epoch": 1698} {"train_loss": -12.136180877685547, "global_step": 285303, "epoch": 1698} {"train_loss": -11.93737506866455, "global_step": 285304, "epoch": 1698} {"train_loss": -12.132801055908203, "global_step": 285305, "epoch": 1698} {"train_loss": -12.009222030639648, "global_step": 285306, "epoch": 1698} {"train_loss": -11.968563079833984, "global_step": 285307, "epoch": 1698} {"train_loss": -12.130918502807617, "global_step": 285308, "epoch": 1698} {"train_loss": -12.020426750183105, "global_step": 285309, "epoch": 1698} {"train_loss": -12.190061569213867, "global_step": 285310, "epoch": 1698} {"train_loss": -11.991353988647461, "global_step": 285311, "epoch": 1698} {"train_loss": -12.160083770751953, "global_step": 285312, "epoch": 1698} {"train_loss": -12.205737113952637, "global_step": 285313, "epoch": 1698} {"train_loss": -12.33939266204834, "global_step": 285314, "epoch": 1698} {"train_loss": -12.106989860534668, "global_step": 285315, "epoch": 1698} {"train_loss": -12.149375915527344, "global_step": 285316, "epoch": 1698} {"train_loss": -12.067460060119629, "global_step": 285317, "epoch": 1698} {"train_loss": -12.200263977050781, "global_step": 285318, "epoch": 1698} {"train_loss": -12.126916885375977, "global_step": 285319, "epoch": 1698} {"train_loss": -12.322999954223633, "global_step": 285320, "epoch": 1698} {"train_loss": -12.310772895812988, "global_step": 285321, "epoch": 1698} {"train_loss": -12.288135528564453, "global_step": 285322, "epoch": 1698} {"train_loss": -12.17003059387207, "global_step": 285323, "epoch": 1698} {"train_loss": -12.20920181274414, "global_step": 285324, "epoch": 1698} {"train_loss": -12.33119010925293, "global_step": 285325, "epoch": 1698} {"train_loss": -12.262990951538086, "global_step": 285326, "epoch": 1698} {"train_loss": -12.362695693969727, "global_step": 285327, "epoch": 1698} {"train_loss": -12.194904327392578, "global_step": 285328, "epoch": 1698} {"train_loss": -12.299041748046875, "global_step": 285329, "epoch": 1698} {"train_loss": -12.253891944885254, "global_step": 285330, "epoch": 1698} {"train_loss": -12.349029541015625, "global_step": 285331, "epoch": 1698} {"train_loss": -12.271849632263184, "global_step": 285332, "epoch": 1698} {"train_loss": -12.319369316101074, "global_step": 285333, "epoch": 1698} {"train_loss": -12.269968032836914, "global_step": 285334, "epoch": 1698} {"train_loss": -12.146907806396484, "global_step": 285335, "epoch": 1698} {"train_loss": -12.581872940063477, "global_step": 285336, "epoch": 1698} {"train_loss": -12.410764694213867, "global_step": 285337, "epoch": 1698} {"train_loss": -12.254426956176758, "global_step": 285338, "epoch": 1698} {"train_loss": -12.298489570617676, "global_step": 285339, "epoch": 1698} {"train_loss": -12.16754150390625, "global_step": 285340, "epoch": 1698} {"train_loss": -12.602173805236816, "global_step": 285341, "epoch": 1698} {"train_loss": -12.397676467895508, "global_step": 285342, "epoch": 1698} {"train_loss": -12.309516906738281, "global_step": 285343, "epoch": 1698} {"train_loss": -12.498039245605469, "global_step": 285344, "epoch": 1698} {"train_loss": -12.29246711730957, "global_step": 285345, "epoch": 1698} {"train_loss": -12.311671257019043, "global_step": 285346, "epoch": 1698} {"train_loss": -12.330511093139648, "global_step": 285347, "epoch": 1698} {"train_loss": -12.260293960571289, "global_step": 285348, "epoch": 1698} {"train_loss": -12.295112609863281, "global_step": 285349, "epoch": 1698} {"train_loss": -12.306154251098633, "global_step": 285350, "epoch": 1698} {"train_loss": -12.557748794555664, "global_step": 285351, "epoch": 1698} {"train_loss": -12.302659034729004, "global_step": 285352, "epoch": 1698} {"train_loss": -12.515558242797852, "global_step": 285353, "epoch": 1698} {"train_loss": -12.45286750793457, "global_step": 285354, "epoch": 1698} {"train_loss": -12.333331108093262, "global_step": 285355, "epoch": 1698} {"train_loss": -12.28034782409668, "global_step": 285356, "epoch": 1698} {"train_loss": -12.17323112487793, "global_step": 285357, "epoch": 1698} {"train_loss": -12.393755912780762, "global_step": 285358, "epoch": 1698} {"train_loss": -12.38278579711914, "global_step": 285359, "epoch": 1698} {"train_loss": -12.239904403686523, "global_step": 285360, "epoch": 1698} {"train_loss": -12.249004364013672, "global_step": 285361, "epoch": 1698} {"train_loss": -12.344637870788574, "global_step": 285362, "epoch": 1698} {"train_loss": -12.235331535339355, "global_step": 285363, "epoch": 1698} {"train_loss": -12.39043140411377, "global_step": 285364, "epoch": 1698} {"train_loss": -12.360149383544922, "global_step": 285365, "epoch": 1698} {"train_loss": -12.426668167114258, "global_step": 285366, "epoch": 1698} {"train_loss": -12.057340621948242, "global_step": 285367, "epoch": 1698} {"train_loss": -11.847307205200195, "global_step": 285368, "epoch": 1698} {"train_loss": -11.893610000610352, "global_step": 285369, "epoch": 1698} {"train_loss": -12.241835594177246, "global_step": 285370, "epoch": 1698} {"train_loss": -11.92366886138916, "global_step": 285371, "epoch": 1698} {"train_loss": -12.118654251098633, "global_step": 285372, "epoch": 1698} {"train_loss": -11.3297758102417, "global_step": 285373, "epoch": 1698} {"train_loss": -12.412933349609375, "global_step": 285374, "epoch": 1698} {"train_loss": -11.129888534545898, "global_step": 285375, "epoch": 1698} {"train_loss": -11.196653366088867, "global_step": 285376, "epoch": 1698} {"train_loss": -10.69737720489502, "global_step": 285377, "epoch": 1698} {"train_loss": -11.7716646194458, "global_step": 285378, "epoch": 1698} {"train_loss": -10.667837142944336, "global_step": 285379, "epoch": 1698} {"train_loss": -11.508882522583008, "global_step": 285380, "epoch": 1698} {"train_loss": -11.345390319824219, "global_step": 285381, "epoch": 1698} {"train_loss": -9.107675552368164, "global_step": 285382, "epoch": 1698} {"train_loss": -10.498083114624023, "global_step": 285383, "epoch": 1698} {"train_loss": -9.465141296386719, "global_step": 285384, "epoch": 1698} {"train_loss": -10.24327278137207, "global_step": 285385, "epoch": 1698} {"train_loss": -11.397997856140137, "global_step": 285386, "epoch": 1698} {"train_loss": -8.278478622436523, "global_step": 285387, "epoch": 1698} {"train_loss": -10.336923599243164, "global_step": 285388, "epoch": 1698} {"train_loss": -8.736156463623047, "global_step": 285389, "epoch": 1698} {"train_loss": -7.751698017120361, "global_step": 285390, "epoch": 1698} {"train_loss": -7.252870559692383, "global_step": 285391, "epoch": 1698} {"train_loss": -6.827858924865723, "global_step": 285392, "epoch": 1698} {"train_loss": -8.290428161621094, "global_step": 285393, "epoch": 1698} {"train_loss": -6.915463447570801, "global_step": 285394, "epoch": 1698} {"train_loss": -7.987064838409424, "global_step": 285395, "epoch": 1698} {"train_loss": -8.250753402709961, "global_step": 285396, "epoch": 1698} {"train_loss": -8.150647163391113, "global_step": 285397, "epoch": 1698} {"train_loss": -8.24472427368164, "global_step": 285398, "epoch": 1698} {"train_loss": -8.595284461975098, "global_step": 285399, "epoch": 1698} {"train_loss": -9.30293083190918, "global_step": 285400, "epoch": 1698} {"train_loss": -8.783437728881836, "global_step": 285401, "epoch": 1698} {"train_loss": -10.2446928024292, "global_step": 285402, "epoch": 1698} {"train_loss": -10.652105331420898, "global_step": 285403, "epoch": 1698} {"train_loss": -8.957941055297852, "global_step": 285404, "epoch": 1698} {"train_loss": -10.232065200805664, "global_step": 285405, "epoch": 1698} {"train_loss": -10.004467964172363, "global_step": 285406, "epoch": 1698} {"train_loss": -9.710596084594727, "global_step": 285407, "epoch": 1698} {"train_loss": -10.483826637268066, "global_step": 285408, "epoch": 1698} {"train_loss": -10.79722785949707, "global_step": 285409, "epoch": 1698} {"train_loss": -10.319808006286621, "global_step": 285410, "epoch": 1698} {"train_loss": -10.39577865600586, "global_step": 285411, "epoch": 1698} {"train_loss": -10.474000930786133, "global_step": 285412, "epoch": 1698} {"train_loss": -11.149432182312012, "global_step": 285413, "epoch": 1698} {"train_loss": -10.669439315795898, "global_step": 285414, "epoch": 1698} {"train_loss": -10.672429084777832, "global_step": 285415, "epoch": 1698} {"train_loss": -11.229939460754395, "global_step": 285416, "epoch": 1698} {"train_loss": -10.792699813842773, "global_step": 285417, "epoch": 1698} {"train_loss": -11.174867630004883, "global_step": 285418, "epoch": 1698} {"train_loss": -10.606491088867188, "global_step": 285419, "epoch": 1698} {"train_loss": -11.167378425598145, "global_step": 285420, "epoch": 1698} {"train_loss": -10.812090873718262, "global_step": 285421, "epoch": 1698} {"train_loss": -11.060287475585938, "global_step": 285422, "epoch": 1698} {"train_loss": -11.137290954589844, "global_step": 285423, "epoch": 1698} {"train_loss": -11.107985496520996, "global_step": 285424, "epoch": 1698} {"train_loss": -11.285415649414062, "global_step": 285425, "epoch": 1698} {"train_loss": -11.033040046691895, "global_step": 285426, "epoch": 1698} {"train_loss": -10.947941780090332, "global_step": 285427, "epoch": 1698} {"train_loss": -11.513736724853516, "global_step": 285428, "epoch": 1698} {"train_loss": -11.154447555541992, "global_step": 285429, "epoch": 1698} {"train_loss": -11.302652359008789, "global_step": 285430, "epoch": 1698} {"train_loss": -11.303401890255156, "global_step": 285431, "epoch": 1698, "val_loss": 257149.25} {"train_loss": -11.1143798828125, "global_step": 285432, "epoch": 1699} {"train_loss": -11.712262153625488, "global_step": 285433, "epoch": 1699} {"train_loss": -11.00345230102539, "global_step": 285434, "epoch": 1699} {"train_loss": -11.359552383422852, "global_step": 285435, "epoch": 1699} {"train_loss": -11.382966041564941, "global_step": 285436, "epoch": 1699} {"train_loss": -11.269193649291992, "global_step": 285437, "epoch": 1699} {"train_loss": -11.538103103637695, "global_step": 285438, "epoch": 1699} {"train_loss": -11.57175064086914, "global_step": 285439, "epoch": 1699} {"train_loss": -11.257464408874512, "global_step": 285440, "epoch": 1699} {"train_loss": -11.627713203430176, "global_step": 285441, "epoch": 1699} {"train_loss": -11.666557312011719, "global_step": 285442, "epoch": 1699} {"train_loss": -11.962352752685547, "global_step": 285443, "epoch": 1699} {"train_loss": -11.651891708374023, "global_step": 285444, "epoch": 1699} {"train_loss": -11.690793991088867, "global_step": 285445, "epoch": 1699} {"train_loss": -11.841917991638184, "global_step": 285446, "epoch": 1699} {"train_loss": -11.737564086914062, "global_step": 285447, "epoch": 1699} {"train_loss": -11.69684886932373, "global_step": 285448, "epoch": 1699} {"train_loss": -11.454333305358887, "global_step": 285449, "epoch": 1699} {"train_loss": -11.52564811706543, "global_step": 285450, "epoch": 1699} {"train_loss": -11.80176830291748, "global_step": 285451, "epoch": 1699} {"train_loss": -11.729079246520996, "global_step": 285452, "epoch": 1699} {"train_loss": -11.458297729492188, "global_step": 285453, "epoch": 1699} {"train_loss": -11.884218215942383, "global_step": 285454, "epoch": 1699} {"train_loss": -11.609084129333496, "global_step": 285455, "epoch": 1699} {"train_loss": -11.85600471496582, "global_step": 285456, "epoch": 1699} {"train_loss": -11.798267364501953, "global_step": 285457, "epoch": 1699} {"train_loss": -11.68832015991211, "global_step": 285458, "epoch": 1699} {"train_loss": -11.906534194946289, "global_step": 285459, "epoch": 1699} {"train_loss": -11.771097183227539, "global_step": 285460, "epoch": 1699} {"train_loss": -11.657440185546875, "global_step": 285461, "epoch": 1699} {"train_loss": -11.566091537475586, "global_step": 285462, "epoch": 1699} {"train_loss": -11.410463333129883, "global_step": 285463, "epoch": 1699} {"train_loss": -11.61190414428711, "global_step": 285464, "epoch": 1699} {"train_loss": -11.626310348510742, "global_step": 285465, "epoch": 1699} {"train_loss": -11.681375503540039, "global_step": 285466, "epoch": 1699} {"train_loss": -11.319266319274902, "global_step": 285467, "epoch": 1699} {"train_loss": -11.953545570373535, "global_step": 285468, "epoch": 1699} {"train_loss": -11.734642028808594, "global_step": 285469, "epoch": 1699} {"train_loss": -11.687882423400879, "global_step": 285470, "epoch": 1699} {"train_loss": -11.784258842468262, "global_step": 285471, "epoch": 1699} {"train_loss": -11.630846977233887, "global_step": 285472, "epoch": 1699} {"train_loss": -11.61684799194336, "global_step": 285473, "epoch": 1699} {"train_loss": -11.800220489501953, "global_step": 285474, "epoch": 1699} {"train_loss": -11.628636360168457, "global_step": 285475, "epoch": 1699} {"train_loss": -11.933924674987793, "global_step": 285476, "epoch": 1699} {"train_loss": -11.754323959350586, "global_step": 285477, "epoch": 1699} {"train_loss": -11.546433448791504, "global_step": 285478, "epoch": 1699} {"train_loss": -12.114009857177734, "global_step": 285479, "epoch": 1699} {"train_loss": -11.666247367858887, "global_step": 285480, "epoch": 1699} {"train_loss": -11.949029922485352, "global_step": 285481, "epoch": 1699} {"train_loss": -11.84410285949707, "global_step": 285482, "epoch": 1699} {"train_loss": -12.147887229919434, "global_step": 285483, "epoch": 1699} {"train_loss": -12.099370956420898, "global_step": 285484, "epoch": 1699} {"train_loss": -12.088638305664062, "global_step": 285485, "epoch": 1699} {"train_loss": -12.031730651855469, "global_step": 285486, "epoch": 1699} {"train_loss": -11.707975387573242, "global_step": 285487, "epoch": 1699} {"train_loss": -12.019208908081055, "global_step": 285488, "epoch": 1699} {"train_loss": -11.975096702575684, "global_step": 285489, "epoch": 1699} {"train_loss": -12.14990520477295, "global_step": 285490, "epoch": 1699} {"train_loss": -12.02552318572998, "global_step": 285491, "epoch": 1699} {"train_loss": -12.159419059753418, "global_step": 285492, "epoch": 1699} {"train_loss": -12.056279182434082, "global_step": 285493, "epoch": 1699} {"train_loss": -12.170963287353516, "global_step": 285494, "epoch": 1699} {"train_loss": -11.856281280517578, "global_step": 285495, "epoch": 1699} {"train_loss": -12.025800704956055, "global_step": 285496, "epoch": 1699} {"train_loss": -12.177345275878906, "global_step": 285497, "epoch": 1699} {"train_loss": -11.877947807312012, "global_step": 285498, "epoch": 1699} {"train_loss": -12.306632995605469, "global_step": 285499, "epoch": 1699} {"train_loss": -12.142488479614258, "global_step": 285500, "epoch": 1699} {"train_loss": -12.383899688720703, "global_step": 285501, "epoch": 1699} {"train_loss": -12.168309211730957, "global_step": 285502, "epoch": 1699} {"train_loss": -12.156597137451172, "global_step": 285503, "epoch": 1699} {"train_loss": -12.171438217163086, "global_step": 285504, "epoch": 1699} {"train_loss": -12.25118637084961, "global_step": 285505, "epoch": 1699} {"train_loss": -12.320262908935547, "global_step": 285506, "epoch": 1699} {"train_loss": -12.248029708862305, "global_step": 285507, "epoch": 1699} {"train_loss": -12.151779174804688, "global_step": 285508, "epoch": 1699} {"train_loss": -12.213138580322266, "global_step": 285509, "epoch": 1699} {"train_loss": -12.251911163330078, "global_step": 285510, "epoch": 1699} {"train_loss": -11.875264167785645, "global_step": 285511, "epoch": 1699} {"train_loss": -12.375481605529785, "global_step": 285512, "epoch": 1699} {"train_loss": -12.240896224975586, "global_step": 285513, "epoch": 1699} {"train_loss": -12.203285217285156, "global_step": 285514, "epoch": 1699} {"train_loss": -12.167342185974121, "global_step": 285515, "epoch": 1699} {"train_loss": -12.079704284667969, "global_step": 285516, "epoch": 1699} {"train_loss": -12.153246879577637, "global_step": 285517, "epoch": 1699} {"train_loss": -12.279422760009766, "global_step": 285518, "epoch": 1699} {"train_loss": -11.96579647064209, "global_step": 285519, "epoch": 1699} {"train_loss": -12.186312675476074, "global_step": 285520, "epoch": 1699} {"train_loss": -12.144354820251465, "global_step": 285521, "epoch": 1699} {"train_loss": -11.903076171875, "global_step": 285522, "epoch": 1699} {"train_loss": -12.074018478393555, "global_step": 285523, "epoch": 1699} {"train_loss": -11.90716552734375, "global_step": 285524, "epoch": 1699} {"train_loss": -12.281344413757324, "global_step": 285525, "epoch": 1699} {"train_loss": -12.146413803100586, "global_step": 285526, "epoch": 1699} {"train_loss": -12.14106273651123, "global_step": 285527, "epoch": 1699} {"train_loss": -12.350553512573242, "global_step": 285528, "epoch": 1699} {"train_loss": -12.244714736938477, "global_step": 285529, "epoch": 1699} {"train_loss": -12.255257606506348, "global_step": 285530, "epoch": 1699} {"train_loss": -12.16995620727539, "global_step": 285531, "epoch": 1699} {"train_loss": -12.201165199279785, "global_step": 285532, "epoch": 1699} {"train_loss": -12.064289093017578, "global_step": 285533, "epoch": 1699} {"train_loss": -12.196089744567871, "global_step": 285534, "epoch": 1699} {"train_loss": -12.076545715332031, "global_step": 285535, "epoch": 1699} {"train_loss": -12.46545124053955, "global_step": 285536, "epoch": 1699} {"train_loss": -12.083620071411133, "global_step": 285537, "epoch": 1699} {"train_loss": -12.198101043701172, "global_step": 285538, "epoch": 1699} {"train_loss": -12.319642066955566, "global_step": 285539, "epoch": 1699} {"train_loss": -12.050239562988281, "global_step": 285540, "epoch": 1699} {"train_loss": -11.900915145874023, "global_step": 285541, "epoch": 1699} {"train_loss": -11.798048973083496, "global_step": 285542, "epoch": 1699} {"train_loss": -11.970179557800293, "global_step": 285543, "epoch": 1699} {"train_loss": -11.333671569824219, "global_step": 285544, "epoch": 1699} {"train_loss": -12.062477111816406, "global_step": 285545, "epoch": 1699} {"train_loss": -11.364992141723633, "global_step": 285546, "epoch": 1699} {"train_loss": -11.829322814941406, "global_step": 285547, "epoch": 1699} {"train_loss": -11.593400955200195, "global_step": 285548, "epoch": 1699} {"train_loss": -10.996708869934082, "global_step": 285549, "epoch": 1699} {"train_loss": -11.116046905517578, "global_step": 285550, "epoch": 1699} {"train_loss": -11.398818016052246, "global_step": 285551, "epoch": 1699} {"train_loss": -10.074710845947266, "global_step": 285552, "epoch": 1699} {"train_loss": -11.222272872924805, "global_step": 285553, "epoch": 1699} {"train_loss": -10.931955337524414, "global_step": 285554, "epoch": 1699} {"train_loss": -11.07834529876709, "global_step": 285555, "epoch": 1699} {"train_loss": -10.193674087524414, "global_step": 285556, "epoch": 1699} {"train_loss": -11.28368091583252, "global_step": 285557, "epoch": 1699} {"train_loss": -10.554037094116211, "global_step": 285558, "epoch": 1699} {"train_loss": -11.002784729003906, "global_step": 285559, "epoch": 1699} {"train_loss": -10.452924728393555, "global_step": 285560, "epoch": 1699} {"train_loss": -11.139657974243164, "global_step": 285561, "epoch": 1699} {"train_loss": -9.717150688171387, "global_step": 285562, "epoch": 1699} {"train_loss": -10.877305030822754, "global_step": 285563, "epoch": 1699} {"train_loss": -11.471933364868164, "global_step": 285564, "epoch": 1699} {"train_loss": -10.403142929077148, "global_step": 285565, "epoch": 1699} {"train_loss": -11.812629699707031, "global_step": 285566, "epoch": 1699} {"train_loss": -11.047784805297852, "global_step": 285567, "epoch": 1699} {"train_loss": -11.112427711486816, "global_step": 285568, "epoch": 1699} {"train_loss": -11.30270004272461, "global_step": 285569, "epoch": 1699} {"train_loss": -11.44156265258789, "global_step": 285570, "epoch": 1699} {"train_loss": -11.139355659484863, "global_step": 285571, "epoch": 1699} {"train_loss": -11.851581573486328, "global_step": 285572, "epoch": 1699} {"train_loss": -11.358063697814941, "global_step": 285573, "epoch": 1699} {"train_loss": -11.509713172912598, "global_step": 285574, "epoch": 1699} {"train_loss": -11.50728702545166, "global_step": 285575, "epoch": 1699} {"train_loss": -11.327413558959961, "global_step": 285576, "epoch": 1699} {"train_loss": -11.600456237792969, "global_step": 285577, "epoch": 1699} {"train_loss": -11.156648635864258, "global_step": 285578, "epoch": 1699} {"train_loss": -11.468297004699707, "global_step": 285579, "epoch": 1699} {"train_loss": -11.278656005859375, "global_step": 285580, "epoch": 1699} {"train_loss": -11.366320610046387, "global_step": 285581, "epoch": 1699} {"train_loss": -11.49118423461914, "global_step": 285582, "epoch": 1699} {"train_loss": -11.520967483520508, "global_step": 285583, "epoch": 1699} {"train_loss": -11.929910659790039, "global_step": 285584, "epoch": 1699} {"train_loss": -11.728531837463379, "global_step": 285585, "epoch": 1699} {"train_loss": -11.622488021850586, "global_step": 285586, "epoch": 1699} {"train_loss": -11.471356391906738, "global_step": 285587, "epoch": 1699} {"train_loss": -11.813704490661621, "global_step": 285588, "epoch": 1699} {"train_loss": -11.860888481140137, "global_step": 285589, "epoch": 1699} {"train_loss": -11.834468841552734, "global_step": 285590, "epoch": 1699} {"train_loss": -11.63536262512207, "global_step": 285591, "epoch": 1699} {"train_loss": -11.795151710510254, "global_step": 285592, "epoch": 1699} {"train_loss": -11.841897964477539, "global_step": 285593, "epoch": 1699} {"train_loss": -12.054494857788086, "global_step": 285594, "epoch": 1699} {"train_loss": -11.582962036132812, "global_step": 285595, "epoch": 1699} {"train_loss": -11.783918380737305, "global_step": 285596, "epoch": 1699} {"train_loss": -11.899740219116211, "global_step": 285597, "epoch": 1699} {"train_loss": -12.012624740600586, "global_step": 285598, "epoch": 1699} {"train_loss": -11.725834528605143, "global_step": 285599, "epoch": 1699, "val_loss": 263336.15625} {"train_loss": -11.903307914733887, "global_step": 285600, "epoch": 1700} {"train_loss": -11.627533912658691, "global_step": 285601, "epoch": 1700} {"train_loss": -11.493666648864746, "global_step": 285602, "epoch": 1700} {"train_loss": -11.714153289794922, "global_step": 285603, "epoch": 1700} {"train_loss": -11.730521202087402, "global_step": 285604, "epoch": 1700} {"train_loss": -11.794809341430664, "global_step": 285605, "epoch": 1700} {"train_loss": -11.668195724487305, "global_step": 285606, "epoch": 1700} {"train_loss": -11.288911819458008, "global_step": 285607, "epoch": 1700} {"train_loss": -11.997218132019043, "global_step": 285608, "epoch": 1700} {"train_loss": -11.540275573730469, "global_step": 285609, "epoch": 1700} {"train_loss": -12.066713333129883, "global_step": 285610, "epoch": 1700} {"train_loss": -11.609824180603027, "global_step": 285611, "epoch": 1700} {"train_loss": -11.727413177490234, "global_step": 285612, "epoch": 1700} {"train_loss": -11.70309829711914, "global_step": 285613, "epoch": 1700} {"train_loss": -11.339704513549805, "global_step": 285614, "epoch": 1700} {"train_loss": -11.815820693969727, "global_step": 285615, "epoch": 1700} {"train_loss": -11.694116592407227, "global_step": 285616, "epoch": 1700} {"train_loss": -12.120001792907715, "global_step": 285617, "epoch": 1700} {"train_loss": -11.6148042678833, "global_step": 285618, "epoch": 1700} {"train_loss": -11.495285034179688, "global_step": 285619, "epoch": 1700} {"train_loss": -11.663650512695312, "global_step": 285620, "epoch": 1700} {"train_loss": -11.920880317687988, "global_step": 285621, "epoch": 1700} {"train_loss": -10.842212677001953, "global_step": 285622, "epoch": 1700} {"train_loss": -11.567567825317383, "global_step": 285623, "epoch": 1700} {"train_loss": -11.266489028930664, "global_step": 285624, "epoch": 1700} {"train_loss": -11.427976608276367, "global_step": 285625, "epoch": 1700} {"train_loss": -11.370431900024414, "global_step": 285626, "epoch": 1700} {"train_loss": -11.956720352172852, "global_step": 285627, "epoch": 1700} {"train_loss": -11.333864212036133, "global_step": 285628, "epoch": 1700} {"train_loss": -12.209912300109863, "global_step": 285629, "epoch": 1700} {"train_loss": -11.500835418701172, "global_step": 285630, "epoch": 1700} {"train_loss": -11.631942749023438, "global_step": 285631, "epoch": 1700} {"train_loss": -11.661286354064941, "global_step": 285632, "epoch": 1700} {"train_loss": -11.431793212890625, "global_step": 285633, "epoch": 1700} {"train_loss": -12.15139389038086, "global_step": 285634, "epoch": 1700} {"train_loss": -11.330215454101562, "global_step": 285635, "epoch": 1700} {"train_loss": -11.61889934539795, "global_step": 285636, "epoch": 1700} {"train_loss": -11.150697708129883, "global_step": 285637, "epoch": 1700} {"train_loss": -11.3003511428833, "global_step": 285638, "epoch": 1700} {"train_loss": -11.53465461730957, "global_step": 285639, "epoch": 1700} {"train_loss": -11.651565551757812, "global_step": 285640, "epoch": 1700} {"train_loss": -11.649527549743652, "global_step": 285641, "epoch": 1700} {"train_loss": -11.750227928161621, "global_step": 285642, "epoch": 1700} {"train_loss": -10.971189498901367, "global_step": 285643, "epoch": 1700} {"train_loss": -11.538816452026367, "global_step": 285644, "epoch": 1700} {"train_loss": -11.840561866760254, "global_step": 285645, "epoch": 1700} {"train_loss": -10.885149002075195, "global_step": 285646, "epoch": 1700} {"train_loss": -11.752840042114258, "global_step": 285647, "epoch": 1700} {"train_loss": -10.877227783203125, "global_step": 285648, "epoch": 1700} {"train_loss": -11.252185821533203, "global_step": 285649, "epoch": 1700} {"train_loss": -11.685869216918945, "global_step": 285650, "epoch": 1700} {"train_loss": -10.900060653686523, "global_step": 285651, "epoch": 1700} {"train_loss": -11.76695728302002, "global_step": 285652, "epoch": 1700} {"train_loss": -10.76997184753418, "global_step": 285653, "epoch": 1700} {"train_loss": -11.94377613067627, "global_step": 285654, "epoch": 1700} {"train_loss": -11.710285186767578, "global_step": 285655, "epoch": 1700} {"train_loss": -11.708488464355469, "global_step": 285656, "epoch": 1700} {"train_loss": -11.980186462402344, "global_step": 285657, "epoch": 1700} {"train_loss": -11.195648193359375, "global_step": 285658, "epoch": 1700} {"train_loss": -12.179895401000977, "global_step": 285659, "epoch": 1700} {"train_loss": -11.21136474609375, "global_step": 285660, "epoch": 1700} {"train_loss": -12.145180702209473, "global_step": 285661, "epoch": 1700} {"train_loss": -11.414434432983398, "global_step": 285662, "epoch": 1700} {"train_loss": -11.929790496826172, "global_step": 285663, "epoch": 1700} {"train_loss": -11.209312438964844, "global_step": 285664, "epoch": 1700} {"train_loss": -11.682527542114258, "global_step": 285665, "epoch": 1700} {"train_loss": -11.018150329589844, "global_step": 285666, "epoch": 1700} {"train_loss": -10.5206298828125, "global_step": 285667, "epoch": 1700} {"train_loss": -11.043943405151367, "global_step": 285668, "epoch": 1700} {"train_loss": -11.141634941101074, "global_step": 285669, "epoch": 1700} {"train_loss": -11.886781692504883, "global_step": 285670, "epoch": 1700} {"train_loss": -11.17160701751709, "global_step": 285671, "epoch": 1700} {"train_loss": -11.818885803222656, "global_step": 285672, "epoch": 1700} {"train_loss": -11.270561218261719, "global_step": 285673, "epoch": 1700} {"train_loss": -12.012401580810547, "global_step": 285674, "epoch": 1700} {"train_loss": -11.096237182617188, "global_step": 285675, "epoch": 1700} {"train_loss": -11.617597579956055, "global_step": 285676, "epoch": 1700} {"train_loss": -11.088537216186523, "global_step": 285677, "epoch": 1700} {"train_loss": -11.90805721282959, "global_step": 285678, "epoch": 1700} {"train_loss": -10.790283203125, "global_step": 285679, "epoch": 1700} {"train_loss": -12.200248718261719, "global_step": 285680, "epoch": 1700} {"train_loss": -10.965486526489258, "global_step": 285681, "epoch": 1700} {"train_loss": -11.816683769226074, "global_step": 285682, "epoch": 1700} {"train_loss": -10.93659496307373, "global_step": 285683, "epoch": 1700} {"train_loss": -11.983818054199219, "global_step": 285684, "epoch": 1700} {"train_loss": -10.765647888183594, "global_step": 285685, "epoch": 1700} {"train_loss": -12.031639099121094, "global_step": 285686, "epoch": 1700} {"train_loss": -10.606433868408203, "global_step": 285687, "epoch": 1700} {"train_loss": -11.948908805847168, "global_step": 285688, "epoch": 1700} {"train_loss": -10.605459213256836, "global_step": 285689, "epoch": 1700} {"train_loss": -11.94527816772461, "global_step": 285690, "epoch": 1700} {"train_loss": -11.116783142089844, "global_step": 285691, "epoch": 1700} {"train_loss": -11.711505889892578, "global_step": 285692, "epoch": 1700} {"train_loss": -11.62476634979248, "global_step": 285693, "epoch": 1700} {"train_loss": -11.526437759399414, "global_step": 285694, "epoch": 1700} {"train_loss": -11.804842948913574, "global_step": 285695, "epoch": 1700} {"train_loss": -12.070676803588867, "global_step": 285696, "epoch": 1700} {"train_loss": -11.630173683166504, "global_step": 285697, "epoch": 1700} {"train_loss": -12.192764282226562, "global_step": 285698, "epoch": 1700} {"train_loss": -11.792730331420898, "global_step": 285699, "epoch": 1700} {"train_loss": -12.051980018615723, "global_step": 285700, "epoch": 1700} {"train_loss": -11.866880416870117, "global_step": 285701, "epoch": 1700} {"train_loss": -11.89185619354248, "global_step": 285702, "epoch": 1700} {"train_loss": -12.048849105834961, "global_step": 285703, "epoch": 1700} {"train_loss": -11.872288703918457, "global_step": 285704, "epoch": 1700} {"train_loss": -11.929645538330078, "global_step": 285705, "epoch": 1700} {"train_loss": -12.014726638793945, "global_step": 285706, "epoch": 1700} {"train_loss": -12.195252418518066, "global_step": 285707, "epoch": 1700} {"train_loss": -12.052452087402344, "global_step": 285708, "epoch": 1700} {"train_loss": -11.967281341552734, "global_step": 285709, "epoch": 1700} {"train_loss": -11.879379272460938, "global_step": 285710, "epoch": 1700} {"train_loss": -12.067237854003906, "global_step": 285711, "epoch": 1700} {"train_loss": -12.01327133178711, "global_step": 285712, "epoch": 1700} {"train_loss": -12.117281913757324, "global_step": 285713, "epoch": 1700} {"train_loss": -11.958670616149902, "global_step": 285714, "epoch": 1700} {"train_loss": -12.123706817626953, "global_step": 285715, "epoch": 1700} {"train_loss": -12.029022216796875, "global_step": 285716, "epoch": 1700} {"train_loss": -11.939445495605469, "global_step": 285717, "epoch": 1700} {"train_loss": -12.159049987792969, "global_step": 285718, "epoch": 1700} {"train_loss": -12.03582763671875, "global_step": 285719, "epoch": 1700} {"train_loss": -12.031487464904785, "global_step": 285720, "epoch": 1700} {"train_loss": -11.996685028076172, "global_step": 285721, "epoch": 1700} {"train_loss": -12.204792022705078, "global_step": 285722, "epoch": 1700} {"train_loss": -12.301119804382324, "global_step": 285723, "epoch": 1700} {"train_loss": -12.084787368774414, "global_step": 285724, "epoch": 1700} {"train_loss": -12.158467292785645, "global_step": 285725, "epoch": 1700} {"train_loss": -12.003917694091797, "global_step": 285726, "epoch": 1700} {"train_loss": -12.075273513793945, "global_step": 285727, "epoch": 1700} {"train_loss": -11.927751541137695, "global_step": 285728, "epoch": 1700} {"train_loss": -12.207283973693848, "global_step": 285729, "epoch": 1700} {"train_loss": -11.842121124267578, "global_step": 285730, "epoch": 1700} {"train_loss": -11.97783088684082, "global_step": 285731, "epoch": 1700} {"train_loss": -11.865643501281738, "global_step": 285732, "epoch": 1700} {"train_loss": -12.255170822143555, "global_step": 285733, "epoch": 1700} {"train_loss": -11.861845016479492, "global_step": 285734, "epoch": 1700} {"train_loss": -11.930316925048828, "global_step": 285735, "epoch": 1700} {"train_loss": -11.922121047973633, "global_step": 285736, "epoch": 1700} {"train_loss": -12.180658340454102, "global_step": 285737, "epoch": 1700} {"train_loss": -12.210728645324707, "global_step": 285738, "epoch": 1700} {"train_loss": -11.817339897155762, "global_step": 285739, "epoch": 1700} {"train_loss": -12.250432968139648, "global_step": 285740, "epoch": 1700} {"train_loss": -12.02932357788086, "global_step": 285741, "epoch": 1700} {"train_loss": -12.05125617980957, "global_step": 285742, "epoch": 1700} {"train_loss": -12.09494400024414, "global_step": 285743, "epoch": 1700} {"train_loss": -11.528142929077148, "global_step": 285744, "epoch": 1700} {"train_loss": -11.673481941223145, "global_step": 285745, "epoch": 1700} {"train_loss": -12.128263473510742, "global_step": 285746, "epoch": 1700} {"train_loss": -12.151456832885742, "global_step": 285747, "epoch": 1700} {"train_loss": -11.875724792480469, "global_step": 285748, "epoch": 1700} {"train_loss": -12.12197208404541, "global_step": 285749, "epoch": 1700} {"train_loss": -11.9953031539917, "global_step": 285750, "epoch": 1700} {"train_loss": -12.200094223022461, "global_step": 285751, "epoch": 1700} {"train_loss": -11.944592475891113, "global_step": 285752, "epoch": 1700} {"train_loss": -12.087066650390625, "global_step": 285753, "epoch": 1700} {"train_loss": -11.846755981445312, "global_step": 285754, "epoch": 1700} {"train_loss": -12.344730377197266, "global_step": 285755, "epoch": 1700} {"train_loss": -12.306146621704102, "global_step": 285756, "epoch": 1700} {"train_loss": -12.098201751708984, "global_step": 285757, "epoch": 1700} {"train_loss": -12.383967399597168, "global_step": 285758, "epoch": 1700} {"train_loss": -12.331557273864746, "global_step": 285759, "epoch": 1700} {"train_loss": -11.625396728515625, "global_step": 285760, "epoch": 1700} {"train_loss": -11.735343933105469, "global_step": 285761, "epoch": 1700} {"train_loss": -12.174083709716797, "global_step": 285762, "epoch": 1700} {"train_loss": -11.054706573486328, "global_step": 285763, "epoch": 1700} {"train_loss": -10.98947811126709, "global_step": 285764, "epoch": 1700} {"train_loss": -12.301714897155762, "global_step": 285765, "epoch": 1700} {"train_loss": -11.827173233032227, "global_step": 285766, "epoch": 1700} {"train_loss": -11.725912264415197, "global_step": 285767, "epoch": 1700, "train/sim_max_reward_0": 0.5855178719852211, "train/sim_max_reward_1": 0.9967184017224114, "train/sim_max_reward_2": 0.00143070686615398, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.9453450163344363, "train/sim_max_reward_5": 0.5084093847505514, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.39273004947263046, "test/sim_max_reward_4400002": 0.44355132088263766, "test/sim_max_reward_4400003": 0.9901430599532085, "test/sim_max_reward_4400004": 0.4086012800016136, "test/sim_max_reward_4400005": 0.980490329659816, "test/sim_max_reward_4400006": 0.2774302642260835, "test/sim_max_reward_4400007": 0.5095333325352951, "test/sim_max_reward_4400008": 0.6303983850448657, "test/sim_max_reward_4400009": 0.028134675564313268, "test/sim_max_reward_4400010": 0.9579187470466315, "test/sim_max_reward_4400011": 0.2753987659421291, "test/sim_max_reward_4400012": 0.9656858639475236, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.5274195718387613, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 0.1709711299158335, "test/sim_max_reward_4400020": 0.35828098829415667, "test/sim_max_reward_4400021": 1.0, "test/sim_max_reward_4400022": 0.9901496627105082, "test/sim_max_reward_4400023": 0.12158993776529237, "test/sim_max_reward_4400024": 0.9238787186169491, "test/sim_max_reward_4400025": 0.5381112640007822, "test/sim_max_reward_4400026": 0.6179686333698379, "test/sim_max_reward_4400027": 0.17817054762895138, "test/sim_max_reward_4400028": 1.0, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9395190031365737, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.38884105723491297, "test/sim_max_reward_4400034": 0.9967405654494619, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.36209580725803603, "test/sim_max_reward_4400037": 0.9440344819211143, "test/sim_max_reward_4400038": 0.9669689017567589, "test/sim_max_reward_4400039": 0.41162798979943527, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9660522349468649, "test/sim_max_reward_4400042": 0.6132229043767692, "test/sim_max_reward_4400043": 0.12635994352507865, "test/sim_max_reward_4400044": 0.2763874896508356, "test/sim_max_reward_4400045": 0.9700160192390276, "test/sim_max_reward_4400046": 0.007607413321685858, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6729035636097959, "test/mean_score": 0.550807118488128, "val_loss": 267651.5625, "train_action_mse_error": 3.1086058616638184} {"train_loss": -12.199278831481934, "global_step": 285768, "epoch": 1701} {"train_loss": -11.676636695861816, "global_step": 285769, "epoch": 1701} {"train_loss": -11.423847198486328, "global_step": 285770, "epoch": 1701} {"train_loss": -11.991161346435547, "global_step": 285771, "epoch": 1701} {"train_loss": -11.976327896118164, "global_step": 285772, "epoch": 1701} {"train_loss": -11.478311538696289, "global_step": 285773, "epoch": 1701} {"train_loss": -11.893024444580078, "global_step": 285774, "epoch": 1701} {"train_loss": -11.779169082641602, "global_step": 285775, "epoch": 1701} {"train_loss": -11.71784496307373, "global_step": 285776, "epoch": 1701} {"train_loss": -12.236074447631836, "global_step": 285777, "epoch": 1701} {"train_loss": -12.033473014831543, "global_step": 285778, "epoch": 1701} {"train_loss": -11.080024719238281, "global_step": 285779, "epoch": 1701} {"train_loss": -11.725849151611328, "global_step": 285780, "epoch": 1701} {"train_loss": -11.646099090576172, "global_step": 285781, "epoch": 1701} {"train_loss": -11.092085838317871, "global_step": 285782, "epoch": 1701} {"train_loss": -11.904397964477539, "global_step": 285783, "epoch": 1701} {"train_loss": -11.972282409667969, "global_step": 285784, "epoch": 1701} {"train_loss": -11.805122375488281, "global_step": 285785, "epoch": 1701} {"train_loss": -11.981010437011719, "global_step": 285786, "epoch": 1701} {"train_loss": -11.87234115600586, "global_step": 285787, "epoch": 1701} {"train_loss": -11.553079605102539, "global_step": 285788, "epoch": 1701} {"train_loss": -11.683796882629395, "global_step": 285789, "epoch": 1701} {"train_loss": -12.01777458190918, "global_step": 285790, "epoch": 1701} {"train_loss": -11.603755950927734, "global_step": 285791, "epoch": 1701} {"train_loss": -11.860281944274902, "global_step": 285792, "epoch": 1701} {"train_loss": -11.699411392211914, "global_step": 285793, "epoch": 1701} {"train_loss": -12.083598136901855, "global_step": 285794, "epoch": 1701} {"train_loss": -12.006613731384277, "global_step": 285795, "epoch": 1701} {"train_loss": -11.885394096374512, "global_step": 285796, "epoch": 1701} {"train_loss": -12.054971694946289, "global_step": 285797, "epoch": 1701} {"train_loss": -11.71206283569336, "global_step": 285798, "epoch": 1701} {"train_loss": -11.882926940917969, "global_step": 285799, "epoch": 1701} {"train_loss": -11.636953353881836, "global_step": 285800, "epoch": 1701} {"train_loss": -12.111527442932129, "global_step": 285801, "epoch": 1701} {"train_loss": -11.191600799560547, "global_step": 285802, "epoch": 1701} {"train_loss": -12.03167724609375, "global_step": 285803, "epoch": 1701} {"train_loss": -10.893978118896484, "global_step": 285804, "epoch": 1701} {"train_loss": -11.239791870117188, "global_step": 285805, "epoch": 1701} {"train_loss": -10.745058059692383, "global_step": 285806, "epoch": 1701} {"train_loss": -11.23431396484375, "global_step": 285807, "epoch": 1701} {"train_loss": -11.149556159973145, "global_step": 285808, "epoch": 1701} {"train_loss": -11.192117691040039, "global_step": 285809, "epoch": 1701} {"train_loss": -9.68997573852539, "global_step": 285810, "epoch": 1701} {"train_loss": -9.621404647827148, "global_step": 285811, "epoch": 1701} {"train_loss": -11.414257049560547, "global_step": 285812, "epoch": 1701} {"train_loss": -9.771841049194336, "global_step": 285813, "epoch": 1701} {"train_loss": -11.361461639404297, "global_step": 285814, "epoch": 1701} {"train_loss": -11.521524429321289, "global_step": 285815, "epoch": 1701} {"train_loss": -10.502533912658691, "global_step": 285816, "epoch": 1701} {"train_loss": -11.530450820922852, "global_step": 285817, "epoch": 1701} {"train_loss": -11.296113967895508, "global_step": 285818, "epoch": 1701} {"train_loss": -11.430965423583984, "global_step": 285819, "epoch": 1701} {"train_loss": -11.257369995117188, "global_step": 285820, "epoch": 1701} {"train_loss": -11.063272476196289, "global_step": 285821, "epoch": 1701} {"train_loss": -11.33758544921875, "global_step": 285822, "epoch": 1701} {"train_loss": -11.493892669677734, "global_step": 285823, "epoch": 1701} {"train_loss": -11.382644653320312, "global_step": 285824, "epoch": 1701} {"train_loss": -11.86709213256836, "global_step": 285825, "epoch": 1701} {"train_loss": -10.988153457641602, "global_step": 285826, "epoch": 1701} {"train_loss": -11.771793365478516, "global_step": 285827, "epoch": 1701} {"train_loss": -11.572287559509277, "global_step": 285828, "epoch": 1701} {"train_loss": -11.796050071716309, "global_step": 285829, "epoch": 1701} {"train_loss": -11.72378921508789, "global_step": 285830, "epoch": 1701} {"train_loss": -11.626123428344727, "global_step": 285831, "epoch": 1701} {"train_loss": -11.786314964294434, "global_step": 285832, "epoch": 1701} {"train_loss": -11.360694885253906, "global_step": 285833, "epoch": 1701} {"train_loss": -11.29610538482666, "global_step": 285834, "epoch": 1701} {"train_loss": -11.759391784667969, "global_step": 285835, "epoch": 1701} {"train_loss": -11.321295738220215, "global_step": 285836, "epoch": 1701} {"train_loss": -11.948861122131348, "global_step": 285837, "epoch": 1701} {"train_loss": -11.704194068908691, "global_step": 285838, "epoch": 1701} {"train_loss": -11.781670570373535, "global_step": 285839, "epoch": 1701} {"train_loss": -11.905291557312012, "global_step": 285840, "epoch": 1701} {"train_loss": -11.732452392578125, "global_step": 285841, "epoch": 1701} {"train_loss": -11.831127166748047, "global_step": 285842, "epoch": 1701} {"train_loss": -11.757305145263672, "global_step": 285843, "epoch": 1701} {"train_loss": -11.81316089630127, "global_step": 285844, "epoch": 1701} {"train_loss": -11.524870872497559, "global_step": 285845, "epoch": 1701} {"train_loss": -11.842055320739746, "global_step": 285846, "epoch": 1701} {"train_loss": -11.702873229980469, "global_step": 285847, "epoch": 1701} {"train_loss": -12.106782913208008, "global_step": 285848, "epoch": 1701} {"train_loss": -11.744478225708008, "global_step": 285849, "epoch": 1701} {"train_loss": -11.868715286254883, "global_step": 285850, "epoch": 1701} {"train_loss": -12.102518081665039, "global_step": 285851, "epoch": 1701} {"train_loss": -12.01188850402832, "global_step": 285852, "epoch": 1701} {"train_loss": -11.752446174621582, "global_step": 285853, "epoch": 1701} {"train_loss": -12.032888412475586, "global_step": 285854, "epoch": 1701} {"train_loss": -12.120590209960938, "global_step": 285855, "epoch": 1701} {"train_loss": -11.824075698852539, "global_step": 285856, "epoch": 1701} {"train_loss": -12.220056533813477, "global_step": 285857, "epoch": 1701} {"train_loss": -11.802242279052734, "global_step": 285858, "epoch": 1701} {"train_loss": -12.161109924316406, "global_step": 285859, "epoch": 1701} {"train_loss": -12.017073631286621, "global_step": 285860, "epoch": 1701} {"train_loss": -11.757514953613281, "global_step": 285861, "epoch": 1701} {"train_loss": -11.90868854522705, "global_step": 285862, "epoch": 1701} {"train_loss": -11.867203712463379, "global_step": 285863, "epoch": 1701} {"train_loss": -11.687037467956543, "global_step": 285864, "epoch": 1701} {"train_loss": -12.226780891418457, "global_step": 285865, "epoch": 1701} {"train_loss": -12.17711067199707, "global_step": 285866, "epoch": 1701} {"train_loss": -11.98109245300293, "global_step": 285867, "epoch": 1701} {"train_loss": -11.984031677246094, "global_step": 285868, "epoch": 1701} {"train_loss": -12.09537124633789, "global_step": 285869, "epoch": 1701} {"train_loss": -12.170284271240234, "global_step": 285870, "epoch": 1701} {"train_loss": -12.103132247924805, "global_step": 285871, "epoch": 1701} {"train_loss": -12.144445419311523, "global_step": 285872, "epoch": 1701} {"train_loss": -12.121865272521973, "global_step": 285873, "epoch": 1701} {"train_loss": -12.263635635375977, "global_step": 285874, "epoch": 1701} {"train_loss": -12.313228607177734, "global_step": 285875, "epoch": 1701} {"train_loss": -12.326571464538574, "global_step": 285876, "epoch": 1701} {"train_loss": -12.300268173217773, "global_step": 285877, "epoch": 1701} {"train_loss": -12.266300201416016, "global_step": 285878, "epoch": 1701} {"train_loss": -12.476531028747559, "global_step": 285879, "epoch": 1701} {"train_loss": -12.220179557800293, "global_step": 285880, "epoch": 1701} {"train_loss": -12.057050704956055, "global_step": 285881, "epoch": 1701} {"train_loss": -12.148445129394531, "global_step": 285882, "epoch": 1701} {"train_loss": -12.059746742248535, "global_step": 285883, "epoch": 1701} {"train_loss": -11.956243515014648, "global_step": 285884, "epoch": 1701} {"train_loss": -12.036988258361816, "global_step": 285885, "epoch": 1701} {"train_loss": -11.893386840820312, "global_step": 285886, "epoch": 1701} {"train_loss": -11.923580169677734, "global_step": 285887, "epoch": 1701} {"train_loss": -12.291933059692383, "global_step": 285888, "epoch": 1701} {"train_loss": -12.216400146484375, "global_step": 285889, "epoch": 1701} {"train_loss": -11.903966903686523, "global_step": 285890, "epoch": 1701} {"train_loss": -12.105292320251465, "global_step": 285891, "epoch": 1701} {"train_loss": -12.319438934326172, "global_step": 285892, "epoch": 1701} {"train_loss": -12.192182540893555, "global_step": 285893, "epoch": 1701} {"train_loss": -12.126075744628906, "global_step": 285894, "epoch": 1701} {"train_loss": -12.369109153747559, "global_step": 285895, "epoch": 1701} {"train_loss": -11.562941551208496, "global_step": 285896, "epoch": 1701} {"train_loss": -11.726543426513672, "global_step": 285897, "epoch": 1701} {"train_loss": -11.893858909606934, "global_step": 285898, "epoch": 1701} {"train_loss": -12.155543327331543, "global_step": 285899, "epoch": 1701} {"train_loss": -12.073619842529297, "global_step": 285900, "epoch": 1701} {"train_loss": -12.211939811706543, "global_step": 285901, "epoch": 1701} {"train_loss": -12.268716812133789, "global_step": 285902, "epoch": 1701} {"train_loss": -12.101770401000977, "global_step": 285903, "epoch": 1701} {"train_loss": -12.105371475219727, "global_step": 285904, "epoch": 1701} {"train_loss": -12.069857597351074, "global_step": 285905, "epoch": 1701} {"train_loss": -12.20320987701416, "global_step": 285906, "epoch": 1701} {"train_loss": -12.136072158813477, "global_step": 285907, "epoch": 1701} {"train_loss": -12.391505241394043, "global_step": 285908, "epoch": 1701} {"train_loss": -12.354753494262695, "global_step": 285909, "epoch": 1701} {"train_loss": -12.24360466003418, "global_step": 285910, "epoch": 1701} {"train_loss": -11.980337142944336, "global_step": 285911, "epoch": 1701} {"train_loss": -11.725500106811523, "global_step": 285912, "epoch": 1701} {"train_loss": -11.586637496948242, "global_step": 285913, "epoch": 1701} {"train_loss": -12.155633926391602, "global_step": 285914, "epoch": 1701} {"train_loss": -11.982481002807617, "global_step": 285915, "epoch": 1701} {"train_loss": -11.470698356628418, "global_step": 285916, "epoch": 1701} {"train_loss": -11.564483642578125, "global_step": 285917, "epoch": 1701} {"train_loss": -11.909750938415527, "global_step": 285918, "epoch": 1701} {"train_loss": -12.188135147094727, "global_step": 285919, "epoch": 1701} {"train_loss": -12.231441497802734, "global_step": 285920, "epoch": 1701} {"train_loss": -12.244861602783203, "global_step": 285921, "epoch": 1701} {"train_loss": -11.91530990600586, "global_step": 285922, "epoch": 1701} {"train_loss": -12.16440200805664, "global_step": 285923, "epoch": 1701} {"train_loss": -12.42509651184082, "global_step": 285924, "epoch": 1701} {"train_loss": -11.601552963256836, "global_step": 285925, "epoch": 1701} {"train_loss": -11.125272750854492, "global_step": 285926, "epoch": 1701} {"train_loss": -10.481587409973145, "global_step": 285927, "epoch": 1701} {"train_loss": -11.845848083496094, "global_step": 285928, "epoch": 1701} {"train_loss": -10.068674087524414, "global_step": 285929, "epoch": 1701} {"train_loss": -11.756322860717773, "global_step": 285930, "epoch": 1701} {"train_loss": -11.860426902770996, "global_step": 285931, "epoch": 1701} {"train_loss": -10.935047149658203, "global_step": 285932, "epoch": 1701} {"train_loss": -11.205543518066406, "global_step": 285933, "epoch": 1701} {"train_loss": -11.480514526367188, "global_step": 285934, "epoch": 1701} {"train_loss": -11.766285300254822, "global_step": 285935, "epoch": 1701, "val_loss": 268069.0625} {"train_loss": -10.628450393676758, "global_step": 285936, "epoch": 1702} {"train_loss": -11.09870433807373, "global_step": 285937, "epoch": 1702} {"train_loss": -11.013816833496094, "global_step": 285938, "epoch": 1702} {"train_loss": -11.323482513427734, "global_step": 285939, "epoch": 1702} {"train_loss": -10.754837989807129, "global_step": 285940, "epoch": 1702} {"train_loss": -11.290084838867188, "global_step": 285941, "epoch": 1702} {"train_loss": -10.867433547973633, "global_step": 285942, "epoch": 1702} {"train_loss": -10.552285194396973, "global_step": 285943, "epoch": 1702} {"train_loss": -11.339179992675781, "global_step": 285944, "epoch": 1702} {"train_loss": -11.453702926635742, "global_step": 285945, "epoch": 1702} {"train_loss": -11.180014610290527, "global_step": 285946, "epoch": 1702} {"train_loss": -12.054401397705078, "global_step": 285947, "epoch": 1702} {"train_loss": -11.449676513671875, "global_step": 285948, "epoch": 1702} {"train_loss": -11.145739555358887, "global_step": 285949, "epoch": 1702} {"train_loss": -11.778675079345703, "global_step": 285950, "epoch": 1702} {"train_loss": -10.947786331176758, "global_step": 285951, "epoch": 1702} {"train_loss": -11.976944923400879, "global_step": 285952, "epoch": 1702} {"train_loss": -11.545158386230469, "global_step": 285953, "epoch": 1702} {"train_loss": -11.790586471557617, "global_step": 285954, "epoch": 1702} {"train_loss": -11.355205535888672, "global_step": 285955, "epoch": 1702} {"train_loss": -11.831121444702148, "global_step": 285956, "epoch": 1702} {"train_loss": -11.210391998291016, "global_step": 285957, "epoch": 1702} {"train_loss": -11.947654724121094, "global_step": 285958, "epoch": 1702} {"train_loss": -11.666202545166016, "global_step": 285959, "epoch": 1702} {"train_loss": -11.642471313476562, "global_step": 285960, "epoch": 1702} {"train_loss": -11.811256408691406, "global_step": 285961, "epoch": 1702} {"train_loss": -11.77765941619873, "global_step": 285962, "epoch": 1702} {"train_loss": -12.149900436401367, "global_step": 285963, "epoch": 1702} {"train_loss": -11.838323593139648, "global_step": 285964, "epoch": 1702} {"train_loss": -12.063197135925293, "global_step": 285965, "epoch": 1702} {"train_loss": -12.27629280090332, "global_step": 285966, "epoch": 1702} {"train_loss": -12.260899543762207, "global_step": 285967, "epoch": 1702} {"train_loss": -12.073394775390625, "global_step": 285968, "epoch": 1702} {"train_loss": -12.188068389892578, "global_step": 285969, "epoch": 1702} {"train_loss": -11.87131118774414, "global_step": 285970, "epoch": 1702} {"train_loss": -11.879971504211426, "global_step": 285971, "epoch": 1702} {"train_loss": -11.917093276977539, "global_step": 285972, "epoch": 1702} {"train_loss": -12.074968338012695, "global_step": 285973, "epoch": 1702} {"train_loss": -12.30495548248291, "global_step": 285974, "epoch": 1702} {"train_loss": -12.244138717651367, "global_step": 285975, "epoch": 1702} {"train_loss": -12.260627746582031, "global_step": 285976, "epoch": 1702} {"train_loss": -11.992790222167969, "global_step": 285977, "epoch": 1702} {"train_loss": -12.371576309204102, "global_step": 285978, "epoch": 1702} {"train_loss": -12.193487167358398, "global_step": 285979, "epoch": 1702} {"train_loss": -12.044007301330566, "global_step": 285980, "epoch": 1702} {"train_loss": -12.14043140411377, "global_step": 285981, "epoch": 1702} {"train_loss": -11.805257797241211, "global_step": 285982, "epoch": 1702} {"train_loss": -11.790162086486816, "global_step": 285983, "epoch": 1702} {"train_loss": -12.208329200744629, "global_step": 285984, "epoch": 1702} {"train_loss": -11.845300674438477, "global_step": 285985, "epoch": 1702} {"train_loss": -11.974079132080078, "global_step": 285986, "epoch": 1702} {"train_loss": -12.100643157958984, "global_step": 285987, "epoch": 1702} {"train_loss": -12.205986022949219, "global_step": 285988, "epoch": 1702} {"train_loss": -12.102055549621582, "global_step": 285989, "epoch": 1702} {"train_loss": -12.119743347167969, "global_step": 285990, "epoch": 1702} {"train_loss": -12.218143463134766, "global_step": 285991, "epoch": 1702} {"train_loss": -12.073086738586426, "global_step": 285992, "epoch": 1702} {"train_loss": -12.316879272460938, "global_step": 285993, "epoch": 1702} {"train_loss": -12.202132225036621, "global_step": 285994, "epoch": 1702} {"train_loss": -11.993684768676758, "global_step": 285995, "epoch": 1702} {"train_loss": -11.823404312133789, "global_step": 285996, "epoch": 1702} {"train_loss": -11.455554008483887, "global_step": 285997, "epoch": 1702} {"train_loss": -12.199506759643555, "global_step": 285998, "epoch": 1702} {"train_loss": -11.356206893920898, "global_step": 285999, "epoch": 1702} {"train_loss": -11.739652633666992, "global_step": 286000, "epoch": 1702} {"train_loss": -12.133214950561523, "global_step": 286001, "epoch": 1702} {"train_loss": -11.257217407226562, "global_step": 286002, "epoch": 1702} {"train_loss": -11.839420318603516, "global_step": 286003, "epoch": 1702} {"train_loss": -12.057249069213867, "global_step": 286004, "epoch": 1702} {"train_loss": -12.09931468963623, "global_step": 286005, "epoch": 1702} {"train_loss": -12.230525970458984, "global_step": 286006, "epoch": 1702} {"train_loss": -12.305170059204102, "global_step": 286007, "epoch": 1702} {"train_loss": -12.067370414733887, "global_step": 286008, "epoch": 1702} {"train_loss": -12.065372467041016, "global_step": 286009, "epoch": 1702} {"train_loss": -12.050943374633789, "global_step": 286010, "epoch": 1702} {"train_loss": -11.39603328704834, "global_step": 286011, "epoch": 1702} {"train_loss": -12.303497314453125, "global_step": 286012, "epoch": 1702} {"train_loss": -11.713010787963867, "global_step": 286013, "epoch": 1702} {"train_loss": -12.196516036987305, "global_step": 286014, "epoch": 1702} {"train_loss": -11.983606338500977, "global_step": 286015, "epoch": 1702} {"train_loss": -11.736846923828125, "global_step": 286016, "epoch": 1702} {"train_loss": -12.066071510314941, "global_step": 286017, "epoch": 1702} {"train_loss": -11.159626007080078, "global_step": 286018, "epoch": 1702} {"train_loss": -11.92509651184082, "global_step": 286019, "epoch": 1702} {"train_loss": -11.032861709594727, "global_step": 286020, "epoch": 1702} {"train_loss": -12.15125560760498, "global_step": 286021, "epoch": 1702} {"train_loss": -11.525810241699219, "global_step": 286022, "epoch": 1702} {"train_loss": -11.842144966125488, "global_step": 286023, "epoch": 1702} {"train_loss": -12.304986953735352, "global_step": 286024, "epoch": 1702} {"train_loss": -11.739604949951172, "global_step": 286025, "epoch": 1702} {"train_loss": -11.556095123291016, "global_step": 286026, "epoch": 1702} {"train_loss": -11.97806453704834, "global_step": 286027, "epoch": 1702} {"train_loss": -11.608481407165527, "global_step": 286028, "epoch": 1702} {"train_loss": -11.81236457824707, "global_step": 286029, "epoch": 1702} {"train_loss": -11.606584548950195, "global_step": 286030, "epoch": 1702} {"train_loss": -11.779685974121094, "global_step": 286031, "epoch": 1702} {"train_loss": -11.235316276550293, "global_step": 286032, "epoch": 1702} {"train_loss": -11.338061332702637, "global_step": 286033, "epoch": 1702} {"train_loss": -11.695022583007812, "global_step": 286034, "epoch": 1702} {"train_loss": -11.89858627319336, "global_step": 286035, "epoch": 1702} {"train_loss": -11.182939529418945, "global_step": 286036, "epoch": 1702} {"train_loss": -11.337425231933594, "global_step": 286037, "epoch": 1702} {"train_loss": -11.432708740234375, "global_step": 286038, "epoch": 1702} {"train_loss": -11.76620101928711, "global_step": 286039, "epoch": 1702} {"train_loss": -11.757716178894043, "global_step": 286040, "epoch": 1702} {"train_loss": -11.453392028808594, "global_step": 286041, "epoch": 1702} {"train_loss": -11.553657531738281, "global_step": 286042, "epoch": 1702} {"train_loss": -11.834171295166016, "global_step": 286043, "epoch": 1702} {"train_loss": -11.502880096435547, "global_step": 286044, "epoch": 1702} {"train_loss": -11.375066757202148, "global_step": 286045, "epoch": 1702} {"train_loss": -11.736010551452637, "global_step": 286046, "epoch": 1702} {"train_loss": -11.928197860717773, "global_step": 286047, "epoch": 1702} {"train_loss": -11.902443885803223, "global_step": 286048, "epoch": 1702} {"train_loss": -12.009332656860352, "global_step": 286049, "epoch": 1702} {"train_loss": -11.928889274597168, "global_step": 286050, "epoch": 1702} {"train_loss": -11.419988632202148, "global_step": 286051, "epoch": 1702} {"train_loss": -12.414844512939453, "global_step": 286052, "epoch": 1702} {"train_loss": -11.645340919494629, "global_step": 286053, "epoch": 1702} {"train_loss": -11.714583396911621, "global_step": 286054, "epoch": 1702} {"train_loss": -11.953079223632812, "global_step": 286055, "epoch": 1702} {"train_loss": -11.958345413208008, "global_step": 286056, "epoch": 1702} {"train_loss": -12.240135192871094, "global_step": 286057, "epoch": 1702} {"train_loss": -12.143733978271484, "global_step": 286058, "epoch": 1702} {"train_loss": -12.372819900512695, "global_step": 286059, "epoch": 1702} {"train_loss": -11.843587875366211, "global_step": 286060, "epoch": 1702} {"train_loss": -12.189119338989258, "global_step": 286061, "epoch": 1702} {"train_loss": -11.759885787963867, "global_step": 286062, "epoch": 1702} {"train_loss": -11.42253303527832, "global_step": 286063, "epoch": 1702} {"train_loss": -11.175891876220703, "global_step": 286064, "epoch": 1702} {"train_loss": -11.860978126525879, "global_step": 286065, "epoch": 1702} {"train_loss": -11.289824485778809, "global_step": 286066, "epoch": 1702} {"train_loss": -11.315319061279297, "global_step": 286067, "epoch": 1702} {"train_loss": -11.595376968383789, "global_step": 286068, "epoch": 1702} {"train_loss": -11.36015510559082, "global_step": 286069, "epoch": 1702} {"train_loss": -11.283690452575684, "global_step": 286070, "epoch": 1702} {"train_loss": -11.474900245666504, "global_step": 286071, "epoch": 1702} {"train_loss": -10.032013893127441, "global_step": 286072, "epoch": 1702} {"train_loss": -11.1730375289917, "global_step": 286073, "epoch": 1702} {"train_loss": -9.813322067260742, "global_step": 286074, "epoch": 1702} {"train_loss": -10.53738784790039, "global_step": 286075, "epoch": 1702} {"train_loss": -10.56326675415039, "global_step": 286076, "epoch": 1702} {"train_loss": -9.65848159790039, "global_step": 286077, "epoch": 1702} {"train_loss": -10.424034118652344, "global_step": 286078, "epoch": 1702} {"train_loss": -9.421260833740234, "global_step": 286079, "epoch": 1702} {"train_loss": -11.211040496826172, "global_step": 286080, "epoch": 1702} {"train_loss": -9.752681732177734, "global_step": 286081, "epoch": 1702} {"train_loss": -10.934635162353516, "global_step": 286082, "epoch": 1702} {"train_loss": -10.695837020874023, "global_step": 286083, "epoch": 1702} {"train_loss": -11.372602462768555, "global_step": 286084, "epoch": 1702} {"train_loss": -10.956320762634277, "global_step": 286085, "epoch": 1702} {"train_loss": -11.17009449005127, "global_step": 286086, "epoch": 1702} {"train_loss": -10.80077838897705, "global_step": 286087, "epoch": 1702} {"train_loss": -11.33804702758789, "global_step": 286088, "epoch": 1702} {"train_loss": -11.428386688232422, "global_step": 286089, "epoch": 1702} {"train_loss": -11.590505599975586, "global_step": 286090, "epoch": 1702} {"train_loss": -11.521937370300293, "global_step": 286091, "epoch": 1702} {"train_loss": -11.700571060180664, "global_step": 286092, "epoch": 1702} {"train_loss": -11.18708610534668, "global_step": 286093, "epoch": 1702} {"train_loss": -12.007081985473633, "global_step": 286094, "epoch": 1702} {"train_loss": -11.114431381225586, "global_step": 286095, "epoch": 1702} {"train_loss": -11.895244598388672, "global_step": 286096, "epoch": 1702} {"train_loss": -11.529458999633789, "global_step": 286097, "epoch": 1702} {"train_loss": -12.092439651489258, "global_step": 286098, "epoch": 1702} {"train_loss": -11.772181510925293, "global_step": 286099, "epoch": 1702} {"train_loss": -11.686347961425781, "global_step": 286100, "epoch": 1702} {"train_loss": -11.735246658325195, "global_step": 286101, "epoch": 1702} {"train_loss": -11.88801383972168, "global_step": 286102, "epoch": 1702} {"train_loss": -11.636084408987136, "global_step": 286103, "epoch": 1702, "val_loss": 275209.84375} {"train_loss": -11.957680702209473, "global_step": 286104, "epoch": 1703} {"train_loss": -11.786771774291992, "global_step": 286105, "epoch": 1703} {"train_loss": -11.880417823791504, "global_step": 286106, "epoch": 1703} {"train_loss": -12.067634582519531, "global_step": 286107, "epoch": 1703} {"train_loss": -12.180231094360352, "global_step": 286108, "epoch": 1703} {"train_loss": -11.728583335876465, "global_step": 286109, "epoch": 1703} {"train_loss": -11.890652656555176, "global_step": 286110, "epoch": 1703} {"train_loss": -11.78756332397461, "global_step": 286111, "epoch": 1703} {"train_loss": -11.976613998413086, "global_step": 286112, "epoch": 1703} {"train_loss": -11.834512710571289, "global_step": 286113, "epoch": 1703} {"train_loss": -12.224735260009766, "global_step": 286114, "epoch": 1703} {"train_loss": -11.82634162902832, "global_step": 286115, "epoch": 1703} {"train_loss": -12.196962356567383, "global_step": 286116, "epoch": 1703} {"train_loss": -11.895421981811523, "global_step": 286117, "epoch": 1703} {"train_loss": -11.983766555786133, "global_step": 286118, "epoch": 1703} {"train_loss": -12.200136184692383, "global_step": 286119, "epoch": 1703} {"train_loss": -12.06544303894043, "global_step": 286120, "epoch": 1703} {"train_loss": -12.02495002746582, "global_step": 286121, "epoch": 1703} {"train_loss": -12.0518798828125, "global_step": 286122, "epoch": 1703} {"train_loss": -11.904275894165039, "global_step": 286123, "epoch": 1703} {"train_loss": -12.107303619384766, "global_step": 286124, "epoch": 1703} {"train_loss": -12.252912521362305, "global_step": 286125, "epoch": 1703} {"train_loss": -12.18720817565918, "global_step": 286126, "epoch": 1703} {"train_loss": -12.06776237487793, "global_step": 286127, "epoch": 1703} {"train_loss": -12.294950485229492, "global_step": 286128, "epoch": 1703} {"train_loss": -12.089994430541992, "global_step": 286129, "epoch": 1703} {"train_loss": -12.289445877075195, "global_step": 286130, "epoch": 1703} {"train_loss": -12.176448822021484, "global_step": 286131, "epoch": 1703} {"train_loss": -12.153726577758789, "global_step": 286132, "epoch": 1703} {"train_loss": -12.111490249633789, "global_step": 286133, "epoch": 1703} {"train_loss": -12.220730781555176, "global_step": 286134, "epoch": 1703} {"train_loss": -11.980561256408691, "global_step": 286135, "epoch": 1703} {"train_loss": -12.047600746154785, "global_step": 286136, "epoch": 1703} {"train_loss": -12.123286247253418, "global_step": 286137, "epoch": 1703} {"train_loss": -12.101383209228516, "global_step": 286138, "epoch": 1703} {"train_loss": -12.297966003417969, "global_step": 286139, "epoch": 1703} {"train_loss": -12.356544494628906, "global_step": 286140, "epoch": 1703} {"train_loss": -12.40079402923584, "global_step": 286141, "epoch": 1703} {"train_loss": -12.276233673095703, "global_step": 286142, "epoch": 1703} {"train_loss": -12.388566970825195, "global_step": 286143, "epoch": 1703} {"train_loss": -12.329473495483398, "global_step": 286144, "epoch": 1703} {"train_loss": -12.19382095336914, "global_step": 286145, "epoch": 1703} {"train_loss": -12.237009048461914, "global_step": 286146, "epoch": 1703} {"train_loss": -11.930618286132812, "global_step": 286147, "epoch": 1703} {"train_loss": -12.419451713562012, "global_step": 286148, "epoch": 1703} {"train_loss": -12.296222686767578, "global_step": 286149, "epoch": 1703} {"train_loss": -12.224591255187988, "global_step": 286150, "epoch": 1703} {"train_loss": -12.30333423614502, "global_step": 286151, "epoch": 1703} {"train_loss": -12.191816329956055, "global_step": 286152, "epoch": 1703} {"train_loss": -12.320865631103516, "global_step": 286153, "epoch": 1703} {"train_loss": -12.43569278717041, "global_step": 286154, "epoch": 1703} {"train_loss": -12.24955940246582, "global_step": 286155, "epoch": 1703} {"train_loss": -12.37260627746582, "global_step": 286156, "epoch": 1703} {"train_loss": -12.344768524169922, "global_step": 286157, "epoch": 1703} {"train_loss": -12.24641227722168, "global_step": 286158, "epoch": 1703} {"train_loss": -12.361005783081055, "global_step": 286159, "epoch": 1703} {"train_loss": -12.405496597290039, "global_step": 286160, "epoch": 1703} {"train_loss": -12.581904411315918, "global_step": 286161, "epoch": 1703} {"train_loss": -12.438139915466309, "global_step": 286162, "epoch": 1703} {"train_loss": -12.374711990356445, "global_step": 286163, "epoch": 1703} {"train_loss": -12.52042007446289, "global_step": 286164, "epoch": 1703} {"train_loss": -12.014518737792969, "global_step": 286165, "epoch": 1703} {"train_loss": -12.645244598388672, "global_step": 286166, "epoch": 1703} {"train_loss": -12.336697578430176, "global_step": 286167, "epoch": 1703} {"train_loss": -12.402082443237305, "global_step": 286168, "epoch": 1703} {"train_loss": -12.213428497314453, "global_step": 286169, "epoch": 1703} {"train_loss": -12.485994338989258, "global_step": 286170, "epoch": 1703} {"train_loss": -12.325307846069336, "global_step": 286171, "epoch": 1703} {"train_loss": -12.469451904296875, "global_step": 286172, "epoch": 1703} {"train_loss": -12.107115745544434, "global_step": 286173, "epoch": 1703} {"train_loss": -12.098762512207031, "global_step": 286174, "epoch": 1703} {"train_loss": -12.460015296936035, "global_step": 286175, "epoch": 1703} {"train_loss": -12.321450233459473, "global_step": 286176, "epoch": 1703} {"train_loss": -12.566902160644531, "global_step": 286177, "epoch": 1703} {"train_loss": -12.466303825378418, "global_step": 286178, "epoch": 1703} {"train_loss": -12.435503005981445, "global_step": 286179, "epoch": 1703} {"train_loss": -12.481622695922852, "global_step": 286180, "epoch": 1703} {"train_loss": -12.063783645629883, "global_step": 286181, "epoch": 1703} {"train_loss": -11.809591293334961, "global_step": 286182, "epoch": 1703} {"train_loss": -10.86868953704834, "global_step": 286183, "epoch": 1703} {"train_loss": -11.950865745544434, "global_step": 286184, "epoch": 1703} {"train_loss": -12.445985794067383, "global_step": 286185, "epoch": 1703} {"train_loss": -12.364395141601562, "global_step": 286186, "epoch": 1703} {"train_loss": -11.9034423828125, "global_step": 286187, "epoch": 1703} {"train_loss": -11.53929328918457, "global_step": 286188, "epoch": 1703} {"train_loss": -10.794651985168457, "global_step": 286189, "epoch": 1703} {"train_loss": -10.061205863952637, "global_step": 286190, "epoch": 1703} {"train_loss": -11.268869400024414, "global_step": 286191, "epoch": 1703} {"train_loss": -12.097900390625, "global_step": 286192, "epoch": 1703} {"train_loss": -11.738858222961426, "global_step": 286193, "epoch": 1703} {"train_loss": -11.900639533996582, "global_step": 286194, "epoch": 1703} {"train_loss": -11.800911903381348, "global_step": 286195, "epoch": 1703} {"train_loss": -11.962681770324707, "global_step": 286196, "epoch": 1703} {"train_loss": -11.990842819213867, "global_step": 286197, "epoch": 1703} {"train_loss": -11.897102355957031, "global_step": 286198, "epoch": 1703} {"train_loss": -11.800640106201172, "global_step": 286199, "epoch": 1703} {"train_loss": -11.186139106750488, "global_step": 286200, "epoch": 1703} {"train_loss": -11.418115615844727, "global_step": 286201, "epoch": 1703} {"train_loss": -11.913135528564453, "global_step": 286202, "epoch": 1703} {"train_loss": -11.964746475219727, "global_step": 286203, "epoch": 1703} {"train_loss": -11.875268936157227, "global_step": 286204, "epoch": 1703} {"train_loss": -11.613340377807617, "global_step": 286205, "epoch": 1703} {"train_loss": -11.370098114013672, "global_step": 286206, "epoch": 1703} {"train_loss": -11.701225280761719, "global_step": 286207, "epoch": 1703} {"train_loss": -11.84052562713623, "global_step": 286208, "epoch": 1703} {"train_loss": -12.213891983032227, "global_step": 286209, "epoch": 1703} {"train_loss": -11.669312477111816, "global_step": 286210, "epoch": 1703} {"train_loss": -12.222945213317871, "global_step": 286211, "epoch": 1703} {"train_loss": -11.527836799621582, "global_step": 286212, "epoch": 1703} {"train_loss": -11.483636856079102, "global_step": 286213, "epoch": 1703} {"train_loss": -12.042245864868164, "global_step": 286214, "epoch": 1703} {"train_loss": -11.947738647460938, "global_step": 286215, "epoch": 1703} {"train_loss": -12.241928100585938, "global_step": 286216, "epoch": 1703} {"train_loss": -11.634000778198242, "global_step": 286217, "epoch": 1703} {"train_loss": -12.078475952148438, "global_step": 286218, "epoch": 1703} {"train_loss": -11.336941719055176, "global_step": 286219, "epoch": 1703} {"train_loss": -10.985458374023438, "global_step": 286220, "epoch": 1703} {"train_loss": -11.13960075378418, "global_step": 286221, "epoch": 1703} {"train_loss": -11.717061996459961, "global_step": 286222, "epoch": 1703} {"train_loss": -11.372781753540039, "global_step": 286223, "epoch": 1703} {"train_loss": -11.512919425964355, "global_step": 286224, "epoch": 1703} {"train_loss": -12.251443862915039, "global_step": 286225, "epoch": 1703} {"train_loss": -11.465511322021484, "global_step": 286226, "epoch": 1703} {"train_loss": -12.241364479064941, "global_step": 286227, "epoch": 1703} {"train_loss": -11.645544052124023, "global_step": 286228, "epoch": 1703} {"train_loss": -11.724332809448242, "global_step": 286229, "epoch": 1703} {"train_loss": -11.004960060119629, "global_step": 286230, "epoch": 1703} {"train_loss": -12.076303482055664, "global_step": 286231, "epoch": 1703} {"train_loss": -11.524152755737305, "global_step": 286232, "epoch": 1703} {"train_loss": -11.77855396270752, "global_step": 286233, "epoch": 1703} {"train_loss": -11.234362602233887, "global_step": 286234, "epoch": 1703} {"train_loss": -10.994178771972656, "global_step": 286235, "epoch": 1703} {"train_loss": -11.645767211914062, "global_step": 286236, "epoch": 1703} {"train_loss": -11.163090705871582, "global_step": 286237, "epoch": 1703} {"train_loss": -11.315303802490234, "global_step": 286238, "epoch": 1703} {"train_loss": -10.686351776123047, "global_step": 286239, "epoch": 1703} {"train_loss": -9.881272315979004, "global_step": 286240, "epoch": 1703} {"train_loss": -11.778848648071289, "global_step": 286241, "epoch": 1703} {"train_loss": -10.603681564331055, "global_step": 286242, "epoch": 1703} {"train_loss": -11.64858627319336, "global_step": 286243, "epoch": 1703} {"train_loss": -11.053644180297852, "global_step": 286244, "epoch": 1703} {"train_loss": -11.487895965576172, "global_step": 286245, "epoch": 1703} {"train_loss": -11.602201461791992, "global_step": 286246, "epoch": 1703} {"train_loss": -11.867938995361328, "global_step": 286247, "epoch": 1703} {"train_loss": -11.968650817871094, "global_step": 286248, "epoch": 1703} {"train_loss": -12.057050704956055, "global_step": 286249, "epoch": 1703} {"train_loss": -11.80910873413086, "global_step": 286250, "epoch": 1703} {"train_loss": -11.719709396362305, "global_step": 286251, "epoch": 1703} {"train_loss": -11.720222473144531, "global_step": 286252, "epoch": 1703} {"train_loss": -11.83924674987793, "global_step": 286253, "epoch": 1703} {"train_loss": -11.987106323242188, "global_step": 286254, "epoch": 1703} {"train_loss": -11.728153228759766, "global_step": 286255, "epoch": 1703} {"train_loss": -12.068925857543945, "global_step": 286256, "epoch": 1703} {"train_loss": -11.406518936157227, "global_step": 286257, "epoch": 1703} {"train_loss": -12.035650253295898, "global_step": 286258, "epoch": 1703} {"train_loss": -11.701414108276367, "global_step": 286259, "epoch": 1703} {"train_loss": -12.228923797607422, "global_step": 286260, "epoch": 1703} {"train_loss": -11.768260955810547, "global_step": 286261, "epoch": 1703} {"train_loss": -12.158981323242188, "global_step": 286262, "epoch": 1703} {"train_loss": -11.86178970336914, "global_step": 286263, "epoch": 1703} {"train_loss": -12.39638900756836, "global_step": 286264, "epoch": 1703} {"train_loss": -12.147459030151367, "global_step": 286265, "epoch": 1703} {"train_loss": -11.804500579833984, "global_step": 286266, "epoch": 1703} {"train_loss": -12.052019119262695, "global_step": 286267, "epoch": 1703} {"train_loss": -11.696670532226562, "global_step": 286268, "epoch": 1703} {"train_loss": -11.908398628234863, "global_step": 286269, "epoch": 1703} {"train_loss": -11.827251434326172, "global_step": 286270, "epoch": 1703} {"train_loss": -11.921427278291612, "global_step": 286271, "epoch": 1703, "val_loss": 273887.15625} {"train_loss": -11.953630447387695, "global_step": 286272, "epoch": 1704} {"train_loss": -11.638812065124512, "global_step": 286273, "epoch": 1704} {"train_loss": -11.781729698181152, "global_step": 286274, "epoch": 1704} {"train_loss": -11.92918872833252, "global_step": 286275, "epoch": 1704} {"train_loss": -11.77194595336914, "global_step": 286276, "epoch": 1704} {"train_loss": -11.823516845703125, "global_step": 286277, "epoch": 1704} {"train_loss": -11.698434829711914, "global_step": 286278, "epoch": 1704} {"train_loss": -11.966706275939941, "global_step": 286279, "epoch": 1704} {"train_loss": -12.061180114746094, "global_step": 286280, "epoch": 1704} {"train_loss": -11.501293182373047, "global_step": 286281, "epoch": 1704} {"train_loss": -11.295997619628906, "global_step": 286282, "epoch": 1704} {"train_loss": -11.629040718078613, "global_step": 286283, "epoch": 1704} {"train_loss": -11.470720291137695, "global_step": 286284, "epoch": 1704} {"train_loss": -11.66270923614502, "global_step": 286285, "epoch": 1704} {"train_loss": -11.916293144226074, "global_step": 286286, "epoch": 1704} {"train_loss": -11.12930965423584, "global_step": 286287, "epoch": 1704} {"train_loss": -11.983635902404785, "global_step": 286288, "epoch": 1704} {"train_loss": -10.486119270324707, "global_step": 286289, "epoch": 1704} {"train_loss": -12.192009925842285, "global_step": 286290, "epoch": 1704} {"train_loss": -11.477556228637695, "global_step": 286291, "epoch": 1704} {"train_loss": -11.202369689941406, "global_step": 286292, "epoch": 1704} {"train_loss": -12.034197807312012, "global_step": 286293, "epoch": 1704} {"train_loss": -10.916662216186523, "global_step": 286294, "epoch": 1704} {"train_loss": -12.234097480773926, "global_step": 286295, "epoch": 1704} {"train_loss": -11.617792129516602, "global_step": 286296, "epoch": 1704} {"train_loss": -11.83578109741211, "global_step": 286297, "epoch": 1704} {"train_loss": -11.819000244140625, "global_step": 286298, "epoch": 1704} {"train_loss": -11.884725570678711, "global_step": 286299, "epoch": 1704} {"train_loss": -11.59674072265625, "global_step": 286300, "epoch": 1704} {"train_loss": -11.867019653320312, "global_step": 286301, "epoch": 1704} {"train_loss": -11.553425788879395, "global_step": 286302, "epoch": 1704} {"train_loss": -11.973938941955566, "global_step": 286303, "epoch": 1704} {"train_loss": -11.743294715881348, "global_step": 286304, "epoch": 1704} {"train_loss": -11.68699836730957, "global_step": 286305, "epoch": 1704} {"train_loss": -11.806282043457031, "global_step": 286306, "epoch": 1704} {"train_loss": -11.507020950317383, "global_step": 286307, "epoch": 1704} {"train_loss": -11.419918060302734, "global_step": 286308, "epoch": 1704} {"train_loss": -11.909623146057129, "global_step": 286309, "epoch": 1704} {"train_loss": -11.434223175048828, "global_step": 286310, "epoch": 1704} {"train_loss": -11.254520416259766, "global_step": 286311, "epoch": 1704} {"train_loss": -11.95509147644043, "global_step": 286312, "epoch": 1704} {"train_loss": -11.157686233520508, "global_step": 286313, "epoch": 1704} {"train_loss": -11.771427154541016, "global_step": 286314, "epoch": 1704} {"train_loss": -11.492232322692871, "global_step": 286315, "epoch": 1704} {"train_loss": -11.85948371887207, "global_step": 286316, "epoch": 1704} {"train_loss": -11.840105056762695, "global_step": 286317, "epoch": 1704} {"train_loss": -11.41598129272461, "global_step": 286318, "epoch": 1704} {"train_loss": -11.982637405395508, "global_step": 286319, "epoch": 1704} {"train_loss": -11.5938720703125, "global_step": 286320, "epoch": 1704} {"train_loss": -11.767190933227539, "global_step": 286321, "epoch": 1704} {"train_loss": -11.857702255249023, "global_step": 286322, "epoch": 1704} {"train_loss": -11.848783493041992, "global_step": 286323, "epoch": 1704} {"train_loss": -11.525550842285156, "global_step": 286324, "epoch": 1704} {"train_loss": -11.630949974060059, "global_step": 286325, "epoch": 1704} {"train_loss": -11.773452758789062, "global_step": 286326, "epoch": 1704} {"train_loss": -11.942296981811523, "global_step": 286327, "epoch": 1704} {"train_loss": -11.774785995483398, "global_step": 286328, "epoch": 1704} {"train_loss": -11.915291786193848, "global_step": 286329, "epoch": 1704} {"train_loss": -12.011075973510742, "global_step": 286330, "epoch": 1704} {"train_loss": -11.388772010803223, "global_step": 286331, "epoch": 1704} {"train_loss": -11.247934341430664, "global_step": 286332, "epoch": 1704} {"train_loss": -11.382564544677734, "global_step": 286333, "epoch": 1704} {"train_loss": -12.048194885253906, "global_step": 286334, "epoch": 1704} {"train_loss": -11.212028503417969, "global_step": 286335, "epoch": 1704} {"train_loss": -11.530387878417969, "global_step": 286336, "epoch": 1704} {"train_loss": -11.622469902038574, "global_step": 286337, "epoch": 1704} {"train_loss": -11.37582015991211, "global_step": 286338, "epoch": 1704} {"train_loss": -12.096596717834473, "global_step": 286339, "epoch": 1704} {"train_loss": -11.68239974975586, "global_step": 286340, "epoch": 1704} {"train_loss": -11.600940704345703, "global_step": 286341, "epoch": 1704} {"train_loss": -11.776947021484375, "global_step": 286342, "epoch": 1704} {"train_loss": -11.154125213623047, "global_step": 286343, "epoch": 1704} {"train_loss": -11.858070373535156, "global_step": 286344, "epoch": 1704} {"train_loss": -11.561437606811523, "global_step": 286345, "epoch": 1704} {"train_loss": -11.996142387390137, "global_step": 286346, "epoch": 1704} {"train_loss": -11.356598854064941, "global_step": 286347, "epoch": 1704} {"train_loss": -11.809477806091309, "global_step": 286348, "epoch": 1704} {"train_loss": -11.649948120117188, "global_step": 286349, "epoch": 1704} {"train_loss": -11.650379180908203, "global_step": 286350, "epoch": 1704} {"train_loss": -11.73794937133789, "global_step": 286351, "epoch": 1704} {"train_loss": -11.471664428710938, "global_step": 286352, "epoch": 1704} {"train_loss": -11.414594650268555, "global_step": 286353, "epoch": 1704} {"train_loss": -11.582529067993164, "global_step": 286354, "epoch": 1704} {"train_loss": -11.761375427246094, "global_step": 286355, "epoch": 1704} {"train_loss": -10.91737174987793, "global_step": 286356, "epoch": 1704} {"train_loss": -9.783226013183594, "global_step": 286357, "epoch": 1704} {"train_loss": -11.833725929260254, "global_step": 286358, "epoch": 1704} {"train_loss": -11.114039421081543, "global_step": 286359, "epoch": 1704} {"train_loss": -10.829693794250488, "global_step": 286360, "epoch": 1704} {"train_loss": -10.76140308380127, "global_step": 286361, "epoch": 1704} {"train_loss": -10.39591121673584, "global_step": 286362, "epoch": 1704} {"train_loss": -10.828190803527832, "global_step": 286363, "epoch": 1704} {"train_loss": -10.995444297790527, "global_step": 286364, "epoch": 1704} {"train_loss": -10.49465560913086, "global_step": 286365, "epoch": 1704} {"train_loss": -10.316246032714844, "global_step": 286366, "epoch": 1704} {"train_loss": -10.060201644897461, "global_step": 286367, "epoch": 1704} {"train_loss": -10.388258934020996, "global_step": 286368, "epoch": 1704} {"train_loss": -11.59903335571289, "global_step": 286369, "epoch": 1704} {"train_loss": -10.245189666748047, "global_step": 286370, "epoch": 1704} {"train_loss": -11.705229759216309, "global_step": 286371, "epoch": 1704} {"train_loss": -10.60529613494873, "global_step": 286372, "epoch": 1704} {"train_loss": -11.544830322265625, "global_step": 286373, "epoch": 1704} {"train_loss": -11.098630905151367, "global_step": 286374, "epoch": 1704} {"train_loss": -11.401115417480469, "global_step": 286375, "epoch": 1704} {"train_loss": -11.473930358886719, "global_step": 286376, "epoch": 1704} {"train_loss": -11.627643585205078, "global_step": 286377, "epoch": 1704} {"train_loss": -11.12471866607666, "global_step": 286378, "epoch": 1704} {"train_loss": -11.752543449401855, "global_step": 286379, "epoch": 1704} {"train_loss": -11.715824127197266, "global_step": 286380, "epoch": 1704} {"train_loss": -11.776527404785156, "global_step": 286381, "epoch": 1704} {"train_loss": -11.723188400268555, "global_step": 286382, "epoch": 1704} {"train_loss": -11.814302444458008, "global_step": 286383, "epoch": 1704} {"train_loss": -11.591943740844727, "global_step": 286384, "epoch": 1704} {"train_loss": -11.913129806518555, "global_step": 286385, "epoch": 1704} {"train_loss": -11.80009651184082, "global_step": 286386, "epoch": 1704} {"train_loss": -11.901871681213379, "global_step": 286387, "epoch": 1704} {"train_loss": -11.843351364135742, "global_step": 286388, "epoch": 1704} {"train_loss": -11.796223640441895, "global_step": 286389, "epoch": 1704} {"train_loss": -11.845802307128906, "global_step": 286390, "epoch": 1704} {"train_loss": -12.014154434204102, "global_step": 286391, "epoch": 1704} {"train_loss": -11.72828483581543, "global_step": 286392, "epoch": 1704} {"train_loss": -12.12374496459961, "global_step": 286393, "epoch": 1704} {"train_loss": -11.728132247924805, "global_step": 286394, "epoch": 1704} {"train_loss": -11.842917442321777, "global_step": 286395, "epoch": 1704} {"train_loss": -11.96473217010498, "global_step": 286396, "epoch": 1704} {"train_loss": -12.04462718963623, "global_step": 286397, "epoch": 1704} {"train_loss": -11.946426391601562, "global_step": 286398, "epoch": 1704} {"train_loss": -12.072447776794434, "global_step": 286399, "epoch": 1704} {"train_loss": -12.101811408996582, "global_step": 286400, "epoch": 1704} {"train_loss": -12.127408981323242, "global_step": 286401, "epoch": 1704} {"train_loss": -12.09451675415039, "global_step": 286402, "epoch": 1704} {"train_loss": -12.11418628692627, "global_step": 286403, "epoch": 1704} {"train_loss": -12.280183792114258, "global_step": 286404, "epoch": 1704} {"train_loss": -12.044379234313965, "global_step": 286405, "epoch": 1704} {"train_loss": -12.10262393951416, "global_step": 286406, "epoch": 1704} {"train_loss": -12.217592239379883, "global_step": 286407, "epoch": 1704} {"train_loss": -12.032661437988281, "global_step": 286408, "epoch": 1704} {"train_loss": -12.192615509033203, "global_step": 286409, "epoch": 1704} {"train_loss": -12.290862083435059, "global_step": 286410, "epoch": 1704} {"train_loss": -12.019023895263672, "global_step": 286411, "epoch": 1704} {"train_loss": -12.123046875, "global_step": 286412, "epoch": 1704} {"train_loss": -12.168539047241211, "global_step": 286413, "epoch": 1704} {"train_loss": -12.306319236755371, "global_step": 286414, "epoch": 1704} {"train_loss": -12.103363037109375, "global_step": 286415, "epoch": 1704} {"train_loss": -12.234066009521484, "global_step": 286416, "epoch": 1704} {"train_loss": -12.061466217041016, "global_step": 286417, "epoch": 1704} {"train_loss": -12.330436706542969, "global_step": 286418, "epoch": 1704} {"train_loss": -12.331442832946777, "global_step": 286419, "epoch": 1704} {"train_loss": -12.352739334106445, "global_step": 286420, "epoch": 1704} {"train_loss": -12.184012413024902, "global_step": 286421, "epoch": 1704} {"train_loss": -12.36920166015625, "global_step": 286422, "epoch": 1704} {"train_loss": -11.983098983764648, "global_step": 286423, "epoch": 1704} {"train_loss": -12.062435150146484, "global_step": 286424, "epoch": 1704} {"train_loss": -12.339981079101562, "global_step": 286425, "epoch": 1704} {"train_loss": -12.165735244750977, "global_step": 286426, "epoch": 1704} {"train_loss": -12.32270336151123, "global_step": 286427, "epoch": 1704} {"train_loss": -12.181577682495117, "global_step": 286428, "epoch": 1704} {"train_loss": -12.308666229248047, "global_step": 286429, "epoch": 1704} {"train_loss": -12.23157787322998, "global_step": 286430, "epoch": 1704} {"train_loss": -12.284611701965332, "global_step": 286431, "epoch": 1704} {"train_loss": -12.410058975219727, "global_step": 286432, "epoch": 1704} {"train_loss": -12.397716522216797, "global_step": 286433, "epoch": 1704} {"train_loss": -12.410745620727539, "global_step": 286434, "epoch": 1704} {"train_loss": -12.357854843139648, "global_step": 286435, "epoch": 1704} {"train_loss": -12.575559616088867, "global_step": 286436, "epoch": 1704} {"train_loss": -12.310832977294922, "global_step": 286437, "epoch": 1704} {"train_loss": -12.338895797729492, "global_step": 286438, "epoch": 1704} {"train_loss": -11.720198483694167, "global_step": 286439, "epoch": 1704, "val_loss": 275291.625} {"train_loss": -12.36237907409668, "global_step": 286440, "epoch": 1705} {"train_loss": -12.326984405517578, "global_step": 286441, "epoch": 1705} {"train_loss": -12.148463249206543, "global_step": 286442, "epoch": 1705} {"train_loss": -12.489582061767578, "global_step": 286443, "epoch": 1705} {"train_loss": -12.422009468078613, "global_step": 286444, "epoch": 1705} {"train_loss": -12.338220596313477, "global_step": 286445, "epoch": 1705} {"train_loss": -12.407953262329102, "global_step": 286446, "epoch": 1705} {"train_loss": -12.24363899230957, "global_step": 286447, "epoch": 1705} {"train_loss": -12.481342315673828, "global_step": 286448, "epoch": 1705} {"train_loss": -12.211950302124023, "global_step": 286449, "epoch": 1705} {"train_loss": -11.741703987121582, "global_step": 286450, "epoch": 1705} {"train_loss": -12.121627807617188, "global_step": 286451, "epoch": 1705} {"train_loss": -12.127189636230469, "global_step": 286452, "epoch": 1705} {"train_loss": -12.128677368164062, "global_step": 286453, "epoch": 1705} {"train_loss": -12.050081253051758, "global_step": 286454, "epoch": 1705} {"train_loss": -12.207208633422852, "global_step": 286455, "epoch": 1705} {"train_loss": -11.85404109954834, "global_step": 286456, "epoch": 1705} {"train_loss": -11.099298477172852, "global_step": 286457, "epoch": 1705} {"train_loss": -12.201351165771484, "global_step": 286458, "epoch": 1705} {"train_loss": -11.828349113464355, "global_step": 286459, "epoch": 1705} {"train_loss": -12.004777908325195, "global_step": 286460, "epoch": 1705} {"train_loss": -11.617647171020508, "global_step": 286461, "epoch": 1705} {"train_loss": -11.897451400756836, "global_step": 286462, "epoch": 1705} {"train_loss": -11.887065887451172, "global_step": 286463, "epoch": 1705} {"train_loss": -11.441839218139648, "global_step": 286464, "epoch": 1705} {"train_loss": -12.263189315795898, "global_step": 286465, "epoch": 1705} {"train_loss": -12.101237297058105, "global_step": 286466, "epoch": 1705} {"train_loss": -12.165655136108398, "global_step": 286467, "epoch": 1705} {"train_loss": -10.320685386657715, "global_step": 286468, "epoch": 1705} {"train_loss": -10.739788055419922, "global_step": 286469, "epoch": 1705} {"train_loss": -11.776424407958984, "global_step": 286470, "epoch": 1705} {"train_loss": -11.818864822387695, "global_step": 286471, "epoch": 1705} {"train_loss": -10.658540725708008, "global_step": 286472, "epoch": 1705} {"train_loss": -11.167869567871094, "global_step": 286473, "epoch": 1705} {"train_loss": -11.611204147338867, "global_step": 286474, "epoch": 1705} {"train_loss": -10.724562644958496, "global_step": 286475, "epoch": 1705} {"train_loss": -11.698518753051758, "global_step": 286476, "epoch": 1705} {"train_loss": -11.410481452941895, "global_step": 286477, "epoch": 1705} {"train_loss": -11.571867942810059, "global_step": 286478, "epoch": 1705} {"train_loss": -11.539899826049805, "global_step": 286479, "epoch": 1705} {"train_loss": -11.424581527709961, "global_step": 286480, "epoch": 1705} {"train_loss": -11.280757904052734, "global_step": 286481, "epoch": 1705} {"train_loss": -11.110773086547852, "global_step": 286482, "epoch": 1705} {"train_loss": -11.595613479614258, "global_step": 286483, "epoch": 1705} {"train_loss": -11.172435760498047, "global_step": 286484, "epoch": 1705} {"train_loss": -10.725395202636719, "global_step": 286485, "epoch": 1705} {"train_loss": -10.301830291748047, "global_step": 286486, "epoch": 1705} {"train_loss": -11.684438705444336, "global_step": 286487, "epoch": 1705} {"train_loss": -10.712350845336914, "global_step": 286488, "epoch": 1705} {"train_loss": -11.271509170532227, "global_step": 286489, "epoch": 1705} {"train_loss": -11.430943489074707, "global_step": 286490, "epoch": 1705} {"train_loss": -10.947608947753906, "global_step": 286491, "epoch": 1705} {"train_loss": -11.18223762512207, "global_step": 286492, "epoch": 1705} {"train_loss": -9.86077880859375, "global_step": 286493, "epoch": 1705} {"train_loss": -11.804389953613281, "global_step": 286494, "epoch": 1705} {"train_loss": -9.947845458984375, "global_step": 286495, "epoch": 1705} {"train_loss": -11.609487533569336, "global_step": 286496, "epoch": 1705} {"train_loss": -10.439879417419434, "global_step": 286497, "epoch": 1705} {"train_loss": -10.652742385864258, "global_step": 286498, "epoch": 1705} {"train_loss": -10.608633995056152, "global_step": 286499, "epoch": 1705} {"train_loss": -10.803594589233398, "global_step": 286500, "epoch": 1705} {"train_loss": -11.448507308959961, "global_step": 286501, "epoch": 1705} {"train_loss": -11.171175003051758, "global_step": 286502, "epoch": 1705} {"train_loss": -9.79544448852539, "global_step": 286503, "epoch": 1705} {"train_loss": -10.351799011230469, "global_step": 286504, "epoch": 1705} {"train_loss": -10.558378219604492, "global_step": 286505, "epoch": 1705} {"train_loss": -10.078986167907715, "global_step": 286506, "epoch": 1705} {"train_loss": -11.175971984863281, "global_step": 286507, "epoch": 1705} {"train_loss": -10.358028411865234, "global_step": 286508, "epoch": 1705} {"train_loss": -10.485973358154297, "global_step": 286509, "epoch": 1705} {"train_loss": -10.98570442199707, "global_step": 286510, "epoch": 1705} {"train_loss": -10.388258934020996, "global_step": 286511, "epoch": 1705} {"train_loss": -11.265280723571777, "global_step": 286512, "epoch": 1705} {"train_loss": -10.36148452758789, "global_step": 286513, "epoch": 1705} {"train_loss": -11.54841423034668, "global_step": 286514, "epoch": 1705} {"train_loss": -10.856664657592773, "global_step": 286515, "epoch": 1705} {"train_loss": -11.146967887878418, "global_step": 286516, "epoch": 1705} {"train_loss": -10.682723045349121, "global_step": 286517, "epoch": 1705} {"train_loss": -11.361531257629395, "global_step": 286518, "epoch": 1705} {"train_loss": -10.722412109375, "global_step": 286519, "epoch": 1705} {"train_loss": -11.641392707824707, "global_step": 286520, "epoch": 1705} {"train_loss": -11.512961387634277, "global_step": 286521, "epoch": 1705} {"train_loss": -11.106185913085938, "global_step": 286522, "epoch": 1705} {"train_loss": -11.415755271911621, "global_step": 286523, "epoch": 1705} {"train_loss": -11.472108840942383, "global_step": 286524, "epoch": 1705} {"train_loss": -11.68756103515625, "global_step": 286525, "epoch": 1705} {"train_loss": -11.164831161499023, "global_step": 286526, "epoch": 1705} {"train_loss": -11.72095775604248, "global_step": 286527, "epoch": 1705} {"train_loss": -11.484607696533203, "global_step": 286528, "epoch": 1705} {"train_loss": -11.453540802001953, "global_step": 286529, "epoch": 1705} {"train_loss": -11.701274871826172, "global_step": 286530, "epoch": 1705} {"train_loss": -11.323330879211426, "global_step": 286531, "epoch": 1705} {"train_loss": -11.456598281860352, "global_step": 286532, "epoch": 1705} {"train_loss": -11.602973937988281, "global_step": 286533, "epoch": 1705} {"train_loss": -11.971244812011719, "global_step": 286534, "epoch": 1705} {"train_loss": -11.586660385131836, "global_step": 286535, "epoch": 1705} {"train_loss": -11.789227485656738, "global_step": 286536, "epoch": 1705} {"train_loss": -11.829789161682129, "global_step": 286537, "epoch": 1705} {"train_loss": -11.739631652832031, "global_step": 286538, "epoch": 1705} {"train_loss": -11.872794151306152, "global_step": 286539, "epoch": 1705} {"train_loss": -12.14028549194336, "global_step": 286540, "epoch": 1705} {"train_loss": -11.819534301757812, "global_step": 286541, "epoch": 1705} {"train_loss": -11.808050155639648, "global_step": 286542, "epoch": 1705} {"train_loss": -11.949689865112305, "global_step": 286543, "epoch": 1705} {"train_loss": -12.036420822143555, "global_step": 286544, "epoch": 1705} {"train_loss": -11.8642578125, "global_step": 286545, "epoch": 1705} {"train_loss": -11.667715072631836, "global_step": 286546, "epoch": 1705} {"train_loss": -11.997631072998047, "global_step": 286547, "epoch": 1705} {"train_loss": -11.901249885559082, "global_step": 286548, "epoch": 1705} {"train_loss": -12.006908416748047, "global_step": 286549, "epoch": 1705} {"train_loss": -11.916135787963867, "global_step": 286550, "epoch": 1705} {"train_loss": -12.042281150817871, "global_step": 286551, "epoch": 1705} {"train_loss": -12.182483673095703, "global_step": 286552, "epoch": 1705} {"train_loss": -11.879660606384277, "global_step": 286553, "epoch": 1705} {"train_loss": -12.196215629577637, "global_step": 286554, "epoch": 1705} {"train_loss": -11.99860954284668, "global_step": 286555, "epoch": 1705} {"train_loss": -12.035051345825195, "global_step": 286556, "epoch": 1705} {"train_loss": -12.091167449951172, "global_step": 286557, "epoch": 1705} {"train_loss": -11.804443359375, "global_step": 286558, "epoch": 1705} {"train_loss": -11.994375228881836, "global_step": 286559, "epoch": 1705} {"train_loss": -12.141437530517578, "global_step": 286560, "epoch": 1705} {"train_loss": -12.212174415588379, "global_step": 286561, "epoch": 1705} {"train_loss": -11.99944019317627, "global_step": 286562, "epoch": 1705} {"train_loss": -12.084750175476074, "global_step": 286563, "epoch": 1705} {"train_loss": -12.258731842041016, "global_step": 286564, "epoch": 1705} {"train_loss": -12.003817558288574, "global_step": 286565, "epoch": 1705} {"train_loss": -12.269972801208496, "global_step": 286566, "epoch": 1705} {"train_loss": -12.178504943847656, "global_step": 286567, "epoch": 1705} {"train_loss": -12.195987701416016, "global_step": 286568, "epoch": 1705} {"train_loss": -12.166080474853516, "global_step": 286569, "epoch": 1705} {"train_loss": -12.165385246276855, "global_step": 286570, "epoch": 1705} {"train_loss": -12.158388137817383, "global_step": 286571, "epoch": 1705} {"train_loss": -12.263535499572754, "global_step": 286572, "epoch": 1705} {"train_loss": -11.868402481079102, "global_step": 286573, "epoch": 1705} {"train_loss": -12.250447273254395, "global_step": 286574, "epoch": 1705} {"train_loss": -11.738664627075195, "global_step": 286575, "epoch": 1705} {"train_loss": -12.072835922241211, "global_step": 286576, "epoch": 1705} {"train_loss": -12.135826110839844, "global_step": 286577, "epoch": 1705} {"train_loss": -12.054719924926758, "global_step": 286578, "epoch": 1705} {"train_loss": -11.612871170043945, "global_step": 286579, "epoch": 1705} {"train_loss": -12.286823272705078, "global_step": 286580, "epoch": 1705} {"train_loss": -11.413869857788086, "global_step": 286581, "epoch": 1705} {"train_loss": -11.82741928100586, "global_step": 286582, "epoch": 1705} {"train_loss": -11.951581954956055, "global_step": 286583, "epoch": 1705} {"train_loss": -11.868982315063477, "global_step": 286584, "epoch": 1705} {"train_loss": -11.992317199707031, "global_step": 286585, "epoch": 1705} {"train_loss": -12.14560317993164, "global_step": 286586, "epoch": 1705} {"train_loss": -11.7811918258667, "global_step": 286587, "epoch": 1705} {"train_loss": -11.515911102294922, "global_step": 286588, "epoch": 1705} {"train_loss": -12.06124210357666, "global_step": 286589, "epoch": 1705} {"train_loss": -12.031340599060059, "global_step": 286590, "epoch": 1705} {"train_loss": -11.696743965148926, "global_step": 286591, "epoch": 1705} {"train_loss": -12.106892585754395, "global_step": 286592, "epoch": 1705} {"train_loss": -11.77518081665039, "global_step": 286593, "epoch": 1705} {"train_loss": -11.255831718444824, "global_step": 286594, "epoch": 1705} {"train_loss": -10.590998649597168, "global_step": 286595, "epoch": 1705} {"train_loss": -12.301593780517578, "global_step": 286596, "epoch": 1705} {"train_loss": -11.555010795593262, "global_step": 286597, "epoch": 1705} {"train_loss": -11.974015235900879, "global_step": 286598, "epoch": 1705} {"train_loss": -12.10551643371582, "global_step": 286599, "epoch": 1705} {"train_loss": -11.844522476196289, "global_step": 286600, "epoch": 1705} {"train_loss": -11.372265815734863, "global_step": 286601, "epoch": 1705} {"train_loss": -11.798197746276855, "global_step": 286602, "epoch": 1705} {"train_loss": -11.8361234664917, "global_step": 286603, "epoch": 1705} {"train_loss": -11.210904121398926, "global_step": 286604, "epoch": 1705} {"train_loss": -11.006584167480469, "global_step": 286605, "epoch": 1705} {"train_loss": -10.774162292480469, "global_step": 286606, "epoch": 1705} {"train_loss": -11.598854524748665, "global_step": 286607, "epoch": 1705, "val_loss": 276034.625, "train_action_mse_error": 0.7092276811599731} {"train_loss": -10.24882698059082, "global_step": 286608, "epoch": 1706} {"train_loss": -10.686320304870605, "global_step": 286609, "epoch": 1706} {"train_loss": -11.34577751159668, "global_step": 286610, "epoch": 1706} {"train_loss": -10.412138938903809, "global_step": 286611, "epoch": 1706} {"train_loss": -11.554733276367188, "global_step": 286612, "epoch": 1706} {"train_loss": -10.724709510803223, "global_step": 286613, "epoch": 1706} {"train_loss": -11.630352020263672, "global_step": 286614, "epoch": 1706} {"train_loss": -10.447339057922363, "global_step": 286615, "epoch": 1706} {"train_loss": -10.888534545898438, "global_step": 286616, "epoch": 1706} {"train_loss": -11.729005813598633, "global_step": 286617, "epoch": 1706} {"train_loss": -10.331871032714844, "global_step": 286618, "epoch": 1706} {"train_loss": -11.558099746704102, "global_step": 286619, "epoch": 1706} {"train_loss": -11.232332229614258, "global_step": 286620, "epoch": 1706} {"train_loss": -11.556477546691895, "global_step": 286621, "epoch": 1706} {"train_loss": -10.828640937805176, "global_step": 286622, "epoch": 1706} {"train_loss": -10.99852466583252, "global_step": 286623, "epoch": 1706} {"train_loss": -11.360245704650879, "global_step": 286624, "epoch": 1706} {"train_loss": -10.947344779968262, "global_step": 286625, "epoch": 1706} {"train_loss": -11.76589298248291, "global_step": 286626, "epoch": 1706} {"train_loss": -11.55328369140625, "global_step": 286627, "epoch": 1706} {"train_loss": -10.71854019165039, "global_step": 286628, "epoch": 1706} {"train_loss": -11.227279663085938, "global_step": 286629, "epoch": 1706} {"train_loss": -11.383495330810547, "global_step": 286630, "epoch": 1706} {"train_loss": -10.401365280151367, "global_step": 286631, "epoch": 1706} {"train_loss": -11.981222152709961, "global_step": 286632, "epoch": 1706} {"train_loss": -10.374164581298828, "global_step": 286633, "epoch": 1706} {"train_loss": -11.342147827148438, "global_step": 286634, "epoch": 1706} {"train_loss": -11.607402801513672, "global_step": 286635, "epoch": 1706} {"train_loss": -11.205940246582031, "global_step": 286636, "epoch": 1706} {"train_loss": -11.6092529296875, "global_step": 286637, "epoch": 1706} {"train_loss": -11.376762390136719, "global_step": 286638, "epoch": 1706} {"train_loss": -11.27786636352539, "global_step": 286639, "epoch": 1706} {"train_loss": -11.282867431640625, "global_step": 286640, "epoch": 1706} {"train_loss": -11.604934692382812, "global_step": 286641, "epoch": 1706} {"train_loss": -11.843425750732422, "global_step": 286642, "epoch": 1706} {"train_loss": -11.6465425491333, "global_step": 286643, "epoch": 1706} {"train_loss": -12.029048919677734, "global_step": 286644, "epoch": 1706} {"train_loss": -11.743349075317383, "global_step": 286645, "epoch": 1706} {"train_loss": -11.834765434265137, "global_step": 286646, "epoch": 1706} {"train_loss": -12.117236137390137, "global_step": 286647, "epoch": 1706} {"train_loss": -12.013306617736816, "global_step": 286648, "epoch": 1706} {"train_loss": -11.774964332580566, "global_step": 286649, "epoch": 1706} {"train_loss": -11.86614990234375, "global_step": 286650, "epoch": 1706} {"train_loss": -11.975407600402832, "global_step": 286651, "epoch": 1706} {"train_loss": -11.937385559082031, "global_step": 286652, "epoch": 1706} {"train_loss": -11.92190170288086, "global_step": 286653, "epoch": 1706} {"train_loss": -12.1259126663208, "global_step": 286654, "epoch": 1706} {"train_loss": -11.982572555541992, "global_step": 286655, "epoch": 1706} {"train_loss": -12.02818489074707, "global_step": 286656, "epoch": 1706} {"train_loss": -11.811258316040039, "global_step": 286657, "epoch": 1706} {"train_loss": -12.001226425170898, "global_step": 286658, "epoch": 1706} {"train_loss": -12.090229034423828, "global_step": 286659, "epoch": 1706} {"train_loss": -12.2197265625, "global_step": 286660, "epoch": 1706} {"train_loss": -11.673188209533691, "global_step": 286661, "epoch": 1706} {"train_loss": -11.962943077087402, "global_step": 286662, "epoch": 1706} {"train_loss": -11.192644119262695, "global_step": 286663, "epoch": 1706} {"train_loss": -11.79223346710205, "global_step": 286664, "epoch": 1706} {"train_loss": -11.817296981811523, "global_step": 286665, "epoch": 1706} {"train_loss": -11.751028060913086, "global_step": 286666, "epoch": 1706} {"train_loss": -11.926935195922852, "global_step": 286667, "epoch": 1706} {"train_loss": -11.856266021728516, "global_step": 286668, "epoch": 1706} {"train_loss": -11.998945236206055, "global_step": 286669, "epoch": 1706} {"train_loss": -11.99165153503418, "global_step": 286670, "epoch": 1706} {"train_loss": -12.18275260925293, "global_step": 286671, "epoch": 1706} {"train_loss": -12.196731567382812, "global_step": 286672, "epoch": 1706} {"train_loss": -12.2413330078125, "global_step": 286673, "epoch": 1706} {"train_loss": -12.150846481323242, "global_step": 286674, "epoch": 1706} {"train_loss": -12.261180877685547, "global_step": 286675, "epoch": 1706} {"train_loss": -12.310827255249023, "global_step": 286676, "epoch": 1706} {"train_loss": -12.183089256286621, "global_step": 286677, "epoch": 1706} {"train_loss": -12.131265640258789, "global_step": 286678, "epoch": 1706} {"train_loss": -12.374175071716309, "global_step": 286679, "epoch": 1706} {"train_loss": -11.991911888122559, "global_step": 286680, "epoch": 1706} {"train_loss": -12.13784408569336, "global_step": 286681, "epoch": 1706} {"train_loss": -12.322481155395508, "global_step": 286682, "epoch": 1706} {"train_loss": -12.337272644042969, "global_step": 286683, "epoch": 1706} {"train_loss": -12.330894470214844, "global_step": 286684, "epoch": 1706} {"train_loss": -12.41661262512207, "global_step": 286685, "epoch": 1706} {"train_loss": -12.198049545288086, "global_step": 286686, "epoch": 1706} {"train_loss": -12.253658294677734, "global_step": 286687, "epoch": 1706} {"train_loss": -12.304449081420898, "global_step": 286688, "epoch": 1706} {"train_loss": -12.28215503692627, "global_step": 286689, "epoch": 1706} {"train_loss": -12.386734962463379, "global_step": 286690, "epoch": 1706} {"train_loss": -12.353374481201172, "global_step": 286691, "epoch": 1706} {"train_loss": -12.475082397460938, "global_step": 286692, "epoch": 1706} {"train_loss": -12.443382263183594, "global_step": 286693, "epoch": 1706} {"train_loss": -12.494074821472168, "global_step": 286694, "epoch": 1706} {"train_loss": -12.557438850402832, "global_step": 286695, "epoch": 1706} {"train_loss": -12.39263916015625, "global_step": 286696, "epoch": 1706} {"train_loss": -12.302724838256836, "global_step": 286697, "epoch": 1706} {"train_loss": -12.477933883666992, "global_step": 286698, "epoch": 1706} {"train_loss": -12.333118438720703, "global_step": 286699, "epoch": 1706} {"train_loss": -12.292267799377441, "global_step": 286700, "epoch": 1706} {"train_loss": -12.409557342529297, "global_step": 286701, "epoch": 1706} {"train_loss": -12.315864562988281, "global_step": 286702, "epoch": 1706} {"train_loss": -12.504301071166992, "global_step": 286703, "epoch": 1706} {"train_loss": -12.132823944091797, "global_step": 286704, "epoch": 1706} {"train_loss": -12.49898910522461, "global_step": 286705, "epoch": 1706} {"train_loss": -12.386689186096191, "global_step": 286706, "epoch": 1706} {"train_loss": -12.322983741760254, "global_step": 286707, "epoch": 1706} {"train_loss": -11.528402328491211, "global_step": 286708, "epoch": 1706} {"train_loss": -11.139257431030273, "global_step": 286709, "epoch": 1706} {"train_loss": -11.963343620300293, "global_step": 286710, "epoch": 1706} {"train_loss": -12.45550537109375, "global_step": 286711, "epoch": 1706} {"train_loss": -11.930023193359375, "global_step": 286712, "epoch": 1706} {"train_loss": -11.570947647094727, "global_step": 286713, "epoch": 1706} {"train_loss": -11.613250732421875, "global_step": 286714, "epoch": 1706} {"train_loss": -12.549049377441406, "global_step": 286715, "epoch": 1706} {"train_loss": -11.401459693908691, "global_step": 286716, "epoch": 1706} {"train_loss": -11.818060874938965, "global_step": 286717, "epoch": 1706} {"train_loss": -12.056062698364258, "global_step": 286718, "epoch": 1706} {"train_loss": -11.889032363891602, "global_step": 286719, "epoch": 1706} {"train_loss": -11.913984298706055, "global_step": 286720, "epoch": 1706} {"train_loss": -12.376561164855957, "global_step": 286721, "epoch": 1706} {"train_loss": -11.910099029541016, "global_step": 286722, "epoch": 1706} {"train_loss": -11.948688507080078, "global_step": 286723, "epoch": 1706} {"train_loss": -11.865240097045898, "global_step": 286724, "epoch": 1706} {"train_loss": -12.336921691894531, "global_step": 286725, "epoch": 1706} {"train_loss": -11.78944206237793, "global_step": 286726, "epoch": 1706} {"train_loss": -11.610309600830078, "global_step": 286727, "epoch": 1706} {"train_loss": -11.874024391174316, "global_step": 286728, "epoch": 1706} {"train_loss": -11.666450500488281, "global_step": 286729, "epoch": 1706} {"train_loss": -12.512828826904297, "global_step": 286730, "epoch": 1706} {"train_loss": -12.198348999023438, "global_step": 286731, "epoch": 1706} {"train_loss": -12.016990661621094, "global_step": 286732, "epoch": 1706} {"train_loss": -11.791290283203125, "global_step": 286733, "epoch": 1706} {"train_loss": -12.256799697875977, "global_step": 286734, "epoch": 1706} {"train_loss": -11.561480522155762, "global_step": 286735, "epoch": 1706} {"train_loss": -11.879847526550293, "global_step": 286736, "epoch": 1706} {"train_loss": -11.80244255065918, "global_step": 286737, "epoch": 1706} {"train_loss": -12.28786849975586, "global_step": 286738, "epoch": 1706} {"train_loss": -11.899747848510742, "global_step": 286739, "epoch": 1706} {"train_loss": -11.321704864501953, "global_step": 286740, "epoch": 1706} {"train_loss": -12.215396881103516, "global_step": 286741, "epoch": 1706} {"train_loss": -12.049301147460938, "global_step": 286742, "epoch": 1706} {"train_loss": -10.982020378112793, "global_step": 286743, "epoch": 1706} {"train_loss": -11.826630592346191, "global_step": 286744, "epoch": 1706} {"train_loss": -11.489339828491211, "global_step": 286745, "epoch": 1706} {"train_loss": -10.297922134399414, "global_step": 286746, "epoch": 1706} {"train_loss": -11.917825698852539, "global_step": 286747, "epoch": 1706} {"train_loss": -11.397867202758789, "global_step": 286748, "epoch": 1706} {"train_loss": -10.947604179382324, "global_step": 286749, "epoch": 1706} {"train_loss": -12.011898040771484, "global_step": 286750, "epoch": 1706} {"train_loss": -11.459749221801758, "global_step": 286751, "epoch": 1706} {"train_loss": -10.750255584716797, "global_step": 286752, "epoch": 1706} {"train_loss": -12.075061798095703, "global_step": 286753, "epoch": 1706} {"train_loss": -10.235158920288086, "global_step": 286754, "epoch": 1706} {"train_loss": -9.838682174682617, "global_step": 286755, "epoch": 1706} {"train_loss": -11.537160873413086, "global_step": 286756, "epoch": 1706} {"train_loss": -10.41921329498291, "global_step": 286757, "epoch": 1706} {"train_loss": -11.231459617614746, "global_step": 286758, "epoch": 1706} {"train_loss": -11.424959182739258, "global_step": 286759, "epoch": 1706} {"train_loss": -11.508584976196289, "global_step": 286760, "epoch": 1706} {"train_loss": -11.923206329345703, "global_step": 286761, "epoch": 1706} {"train_loss": -11.086736679077148, "global_step": 286762, "epoch": 1706} {"train_loss": -12.257763862609863, "global_step": 286763, "epoch": 1706} {"train_loss": -11.524271011352539, "global_step": 286764, "epoch": 1706} {"train_loss": -11.359212875366211, "global_step": 286765, "epoch": 1706} {"train_loss": -11.482110023498535, "global_step": 286766, "epoch": 1706} {"train_loss": -11.611042976379395, "global_step": 286767, "epoch": 1706} {"train_loss": -11.94818115234375, "global_step": 286768, "epoch": 1706} {"train_loss": -11.565327644348145, "global_step": 286769, "epoch": 1706} {"train_loss": -11.617826461791992, "global_step": 286770, "epoch": 1706} {"train_loss": -11.705509185791016, "global_step": 286771, "epoch": 1706} {"train_loss": -11.775714874267578, "global_step": 286772, "epoch": 1706} {"train_loss": -12.063596725463867, "global_step": 286773, "epoch": 1706} {"train_loss": -11.491771697998047, "global_step": 286774, "epoch": 1706} {"train_loss": -11.743510603904724, "global_step": 286775, "epoch": 1706, "val_loss": 275733.375} {"train_loss": -11.851107597351074, "global_step": 286776, "epoch": 1707} {"train_loss": -11.50869083404541, "global_step": 286777, "epoch": 1707} {"train_loss": -11.59046745300293, "global_step": 286778, "epoch": 1707} {"train_loss": -11.086606979370117, "global_step": 286779, "epoch": 1707} {"train_loss": -11.943445205688477, "global_step": 286780, "epoch": 1707} {"train_loss": -10.924114227294922, "global_step": 286781, "epoch": 1707} {"train_loss": -11.741231918334961, "global_step": 286782, "epoch": 1707} {"train_loss": -11.340781211853027, "global_step": 286783, "epoch": 1707} {"train_loss": -11.682985305786133, "global_step": 286784, "epoch": 1707} {"train_loss": -11.396736145019531, "global_step": 286785, "epoch": 1707} {"train_loss": -11.83278751373291, "global_step": 286786, "epoch": 1707} {"train_loss": -11.839054107666016, "global_step": 286787, "epoch": 1707} {"train_loss": -11.864191055297852, "global_step": 286788, "epoch": 1707} {"train_loss": -12.255525588989258, "global_step": 286789, "epoch": 1707} {"train_loss": -11.775054931640625, "global_step": 286790, "epoch": 1707} {"train_loss": -11.965311050415039, "global_step": 286791, "epoch": 1707} {"train_loss": -11.877405166625977, "global_step": 286792, "epoch": 1707} {"train_loss": -11.992229461669922, "global_step": 286793, "epoch": 1707} {"train_loss": -12.09521770477295, "global_step": 286794, "epoch": 1707} {"train_loss": -11.982812881469727, "global_step": 286795, "epoch": 1707} {"train_loss": -11.997010231018066, "global_step": 286796, "epoch": 1707} {"train_loss": -12.143613815307617, "global_step": 286797, "epoch": 1707} {"train_loss": -12.023417472839355, "global_step": 286798, "epoch": 1707} {"train_loss": -11.799921035766602, "global_step": 286799, "epoch": 1707} {"train_loss": -12.047438621520996, "global_step": 286800, "epoch": 1707} {"train_loss": -12.09994888305664, "global_step": 286801, "epoch": 1707} {"train_loss": -12.16152572631836, "global_step": 286802, "epoch": 1707} {"train_loss": -12.061367988586426, "global_step": 286803, "epoch": 1707} {"train_loss": -12.109797477722168, "global_step": 286804, "epoch": 1707} {"train_loss": -12.217215538024902, "global_step": 286805, "epoch": 1707} {"train_loss": -12.089964866638184, "global_step": 286806, "epoch": 1707} {"train_loss": -12.281778335571289, "global_step": 286807, "epoch": 1707} {"train_loss": -11.998503684997559, "global_step": 286808, "epoch": 1707} {"train_loss": -12.229406356811523, "global_step": 286809, "epoch": 1707} {"train_loss": -12.07827091217041, "global_step": 286810, "epoch": 1707} {"train_loss": -12.36067008972168, "global_step": 286811, "epoch": 1707} {"train_loss": -12.104635238647461, "global_step": 286812, "epoch": 1707} {"train_loss": -12.192696571350098, "global_step": 286813, "epoch": 1707} {"train_loss": -12.135387420654297, "global_step": 286814, "epoch": 1707} {"train_loss": -12.13306999206543, "global_step": 286815, "epoch": 1707} {"train_loss": -12.177421569824219, "global_step": 286816, "epoch": 1707} {"train_loss": -12.373154640197754, "global_step": 286817, "epoch": 1707} {"train_loss": -12.244922637939453, "global_step": 286818, "epoch": 1707} {"train_loss": -12.396289825439453, "global_step": 286819, "epoch": 1707} {"train_loss": -12.436178207397461, "global_step": 286820, "epoch": 1707} {"train_loss": -11.934562683105469, "global_step": 286821, "epoch": 1707} {"train_loss": -11.836424827575684, "global_step": 286822, "epoch": 1707} {"train_loss": -12.249068260192871, "global_step": 286823, "epoch": 1707} {"train_loss": -12.353776931762695, "global_step": 286824, "epoch": 1707} {"train_loss": -12.089012145996094, "global_step": 286825, "epoch": 1707} {"train_loss": -12.28731918334961, "global_step": 286826, "epoch": 1707} {"train_loss": -12.019381523132324, "global_step": 286827, "epoch": 1707} {"train_loss": -11.802019119262695, "global_step": 286828, "epoch": 1707} {"train_loss": -11.581995010375977, "global_step": 286829, "epoch": 1707} {"train_loss": -12.333502769470215, "global_step": 286830, "epoch": 1707} {"train_loss": -11.614765167236328, "global_step": 286831, "epoch": 1707} {"train_loss": -11.905115127563477, "global_step": 286832, "epoch": 1707} {"train_loss": -12.142314910888672, "global_step": 286833, "epoch": 1707} {"train_loss": -11.494546890258789, "global_step": 286834, "epoch": 1707} {"train_loss": -10.346480369567871, "global_step": 286835, "epoch": 1707} {"train_loss": -11.77437973022461, "global_step": 286836, "epoch": 1707} {"train_loss": -11.957826614379883, "global_step": 286837, "epoch": 1707} {"train_loss": -10.970121383666992, "global_step": 286838, "epoch": 1707} {"train_loss": -10.953250885009766, "global_step": 286839, "epoch": 1707} {"train_loss": -11.376276016235352, "global_step": 286840, "epoch": 1707} {"train_loss": -10.517873764038086, "global_step": 286841, "epoch": 1707} {"train_loss": -11.520349502563477, "global_step": 286842, "epoch": 1707} {"train_loss": -11.194068908691406, "global_step": 286843, "epoch": 1707} {"train_loss": -10.4457426071167, "global_step": 286844, "epoch": 1707} {"train_loss": -10.5186128616333, "global_step": 286845, "epoch": 1707} {"train_loss": -11.727781295776367, "global_step": 286846, "epoch": 1707} {"train_loss": -10.717561721801758, "global_step": 286847, "epoch": 1707} {"train_loss": -11.646763801574707, "global_step": 286848, "epoch": 1707} {"train_loss": -11.277111053466797, "global_step": 286849, "epoch": 1707} {"train_loss": -11.857124328613281, "global_step": 286850, "epoch": 1707} {"train_loss": -10.988349914550781, "global_step": 286851, "epoch": 1707} {"train_loss": -11.7118558883667, "global_step": 286852, "epoch": 1707} {"train_loss": -11.398274421691895, "global_step": 286853, "epoch": 1707} {"train_loss": -11.831697463989258, "global_step": 286854, "epoch": 1707} {"train_loss": -11.782387733459473, "global_step": 286855, "epoch": 1707} {"train_loss": -12.060423851013184, "global_step": 286856, "epoch": 1707} {"train_loss": -11.690495491027832, "global_step": 286857, "epoch": 1707} {"train_loss": -11.441648483276367, "global_step": 286858, "epoch": 1707} {"train_loss": -11.669569969177246, "global_step": 286859, "epoch": 1707} {"train_loss": -11.935049057006836, "global_step": 286860, "epoch": 1707} {"train_loss": -11.961559295654297, "global_step": 286861, "epoch": 1707} {"train_loss": -11.779333114624023, "global_step": 286862, "epoch": 1707} {"train_loss": -11.813928604125977, "global_step": 286863, "epoch": 1707} {"train_loss": -11.487283706665039, "global_step": 286864, "epoch": 1707} {"train_loss": -11.847738265991211, "global_step": 286865, "epoch": 1707} {"train_loss": -11.44378662109375, "global_step": 286866, "epoch": 1707} {"train_loss": -12.096271514892578, "global_step": 286867, "epoch": 1707} {"train_loss": -11.317005157470703, "global_step": 286868, "epoch": 1707} {"train_loss": -11.987561225891113, "global_step": 286869, "epoch": 1707} {"train_loss": -11.513385772705078, "global_step": 286870, "epoch": 1707} {"train_loss": -12.072675704956055, "global_step": 286871, "epoch": 1707} {"train_loss": -11.795340538024902, "global_step": 286872, "epoch": 1707} {"train_loss": -12.149271011352539, "global_step": 286873, "epoch": 1707} {"train_loss": -11.774213790893555, "global_step": 286874, "epoch": 1707} {"train_loss": -11.850744247436523, "global_step": 286875, "epoch": 1707} {"train_loss": -12.229705810546875, "global_step": 286876, "epoch": 1707} {"train_loss": -11.758295059204102, "global_step": 286877, "epoch": 1707} {"train_loss": -12.19494915008545, "global_step": 286878, "epoch": 1707} {"train_loss": -11.810271263122559, "global_step": 286879, "epoch": 1707} {"train_loss": -12.095231056213379, "global_step": 286880, "epoch": 1707} {"train_loss": -12.006741523742676, "global_step": 286881, "epoch": 1707} {"train_loss": -11.834968566894531, "global_step": 286882, "epoch": 1707} {"train_loss": -12.18830394744873, "global_step": 286883, "epoch": 1707} {"train_loss": -12.041078567504883, "global_step": 286884, "epoch": 1707} {"train_loss": -12.244956016540527, "global_step": 286885, "epoch": 1707} {"train_loss": -12.214010238647461, "global_step": 286886, "epoch": 1707} {"train_loss": -12.198261260986328, "global_step": 286887, "epoch": 1707} {"train_loss": -12.188706398010254, "global_step": 286888, "epoch": 1707} {"train_loss": -12.213865280151367, "global_step": 286889, "epoch": 1707} {"train_loss": -12.142106056213379, "global_step": 286890, "epoch": 1707} {"train_loss": -12.306565284729004, "global_step": 286891, "epoch": 1707} {"train_loss": -12.039237022399902, "global_step": 286892, "epoch": 1707} {"train_loss": -12.28746509552002, "global_step": 286893, "epoch": 1707} {"train_loss": -11.874747276306152, "global_step": 286894, "epoch": 1707} {"train_loss": -12.140108108520508, "global_step": 286895, "epoch": 1707} {"train_loss": -12.205196380615234, "global_step": 286896, "epoch": 1707} {"train_loss": -12.07109546661377, "global_step": 286897, "epoch": 1707} {"train_loss": -12.254382133483887, "global_step": 286898, "epoch": 1707} {"train_loss": -12.333603858947754, "global_step": 286899, "epoch": 1707} {"train_loss": -12.343183517456055, "global_step": 286900, "epoch": 1707} {"train_loss": -12.056503295898438, "global_step": 286901, "epoch": 1707} {"train_loss": -12.404500007629395, "global_step": 286902, "epoch": 1707} {"train_loss": -12.351293563842773, "global_step": 286903, "epoch": 1707} {"train_loss": -12.315502166748047, "global_step": 286904, "epoch": 1707} {"train_loss": -12.240554809570312, "global_step": 286905, "epoch": 1707} {"train_loss": -12.206235885620117, "global_step": 286906, "epoch": 1707} {"train_loss": -12.10481071472168, "global_step": 286907, "epoch": 1707} {"train_loss": -12.224302291870117, "global_step": 286908, "epoch": 1707} {"train_loss": -12.199572563171387, "global_step": 286909, "epoch": 1707} {"train_loss": -12.373918533325195, "global_step": 286910, "epoch": 1707} {"train_loss": -12.572986602783203, "global_step": 286911, "epoch": 1707} {"train_loss": -12.351170539855957, "global_step": 286912, "epoch": 1707} {"train_loss": -12.455621719360352, "global_step": 286913, "epoch": 1707} {"train_loss": -12.130434036254883, "global_step": 286914, "epoch": 1707} {"train_loss": -12.191792488098145, "global_step": 286915, "epoch": 1707} {"train_loss": -11.936105728149414, "global_step": 286916, "epoch": 1707} {"train_loss": -11.625092506408691, "global_step": 286917, "epoch": 1707} {"train_loss": -11.66327953338623, "global_step": 286918, "epoch": 1707} {"train_loss": -12.217533111572266, "global_step": 286919, "epoch": 1707} {"train_loss": -11.97265911102295, "global_step": 286920, "epoch": 1707} {"train_loss": -11.943437576293945, "global_step": 286921, "epoch": 1707} {"train_loss": -11.784231185913086, "global_step": 286922, "epoch": 1707} {"train_loss": -12.142127990722656, "global_step": 286923, "epoch": 1707} {"train_loss": -11.847175598144531, "global_step": 286924, "epoch": 1707} {"train_loss": -11.60466194152832, "global_step": 286925, "epoch": 1707} {"train_loss": -12.129793167114258, "global_step": 286926, "epoch": 1707} {"train_loss": -11.714029312133789, "global_step": 286927, "epoch": 1707} {"train_loss": -11.863590240478516, "global_step": 286928, "epoch": 1707} {"train_loss": -12.031009674072266, "global_step": 286929, "epoch": 1707} {"train_loss": -12.06990909576416, "global_step": 286930, "epoch": 1707} {"train_loss": -11.711739540100098, "global_step": 286931, "epoch": 1707} {"train_loss": -11.473052978515625, "global_step": 286932, "epoch": 1707} {"train_loss": -11.563392639160156, "global_step": 286933, "epoch": 1707} {"train_loss": -12.02333927154541, "global_step": 286934, "epoch": 1707} {"train_loss": -10.73098087310791, "global_step": 286935, "epoch": 1707} {"train_loss": -11.544780731201172, "global_step": 286936, "epoch": 1707} {"train_loss": -11.70870590209961, "global_step": 286937, "epoch": 1707} {"train_loss": -11.748950958251953, "global_step": 286938, "epoch": 1707} {"train_loss": -11.691457748413086, "global_step": 286939, "epoch": 1707} {"train_loss": -11.981396675109863, "global_step": 286940, "epoch": 1707} {"train_loss": -11.56790542602539, "global_step": 286941, "epoch": 1707} {"train_loss": -11.872968673706055, "global_step": 286942, "epoch": 1707} {"train_loss": -11.88051848752158, "global_step": 286943, "epoch": 1707, "val_loss": 277488.65625} {"train_loss": -11.263826370239258, "global_step": 286944, "epoch": 1708} {"train_loss": -12.155169486999512, "global_step": 286945, "epoch": 1708} {"train_loss": -11.045475006103516, "global_step": 286946, "epoch": 1708} {"train_loss": -10.877851486206055, "global_step": 286947, "epoch": 1708} {"train_loss": -11.795634269714355, "global_step": 286948, "epoch": 1708} {"train_loss": -10.505468368530273, "global_step": 286949, "epoch": 1708} {"train_loss": -11.92034912109375, "global_step": 286950, "epoch": 1708} {"train_loss": -10.85877513885498, "global_step": 286951, "epoch": 1708} {"train_loss": -11.27554702758789, "global_step": 286952, "epoch": 1708} {"train_loss": -11.68449592590332, "global_step": 286953, "epoch": 1708} {"train_loss": -10.998014450073242, "global_step": 286954, "epoch": 1708} {"train_loss": -11.376832962036133, "global_step": 286955, "epoch": 1708} {"train_loss": -11.027310371398926, "global_step": 286956, "epoch": 1708} {"train_loss": -11.683427810668945, "global_step": 286957, "epoch": 1708} {"train_loss": -11.554315567016602, "global_step": 286958, "epoch": 1708} {"train_loss": -11.050832748413086, "global_step": 286959, "epoch": 1708} {"train_loss": -11.71533203125, "global_step": 286960, "epoch": 1708} {"train_loss": -11.148700714111328, "global_step": 286961, "epoch": 1708} {"train_loss": -11.944616317749023, "global_step": 286962, "epoch": 1708} {"train_loss": -10.95803451538086, "global_step": 286963, "epoch": 1708} {"train_loss": -11.921358108520508, "global_step": 286964, "epoch": 1708} {"train_loss": -11.428913116455078, "global_step": 286965, "epoch": 1708} {"train_loss": -11.545696258544922, "global_step": 286966, "epoch": 1708} {"train_loss": -11.34708023071289, "global_step": 286967, "epoch": 1708} {"train_loss": -11.320206642150879, "global_step": 286968, "epoch": 1708} {"train_loss": -11.68904972076416, "global_step": 286969, "epoch": 1708} {"train_loss": -11.395597457885742, "global_step": 286970, "epoch": 1708} {"train_loss": -11.471427917480469, "global_step": 286971, "epoch": 1708} {"train_loss": -11.813834190368652, "global_step": 286972, "epoch": 1708} {"train_loss": -10.762371063232422, "global_step": 286973, "epoch": 1708} {"train_loss": -11.593181610107422, "global_step": 286974, "epoch": 1708} {"train_loss": -11.202301025390625, "global_step": 286975, "epoch": 1708} {"train_loss": -11.796772003173828, "global_step": 286976, "epoch": 1708} {"train_loss": -11.192117691040039, "global_step": 286977, "epoch": 1708} {"train_loss": -11.578563690185547, "global_step": 286978, "epoch": 1708} {"train_loss": -11.705716133117676, "global_step": 286979, "epoch": 1708} {"train_loss": -11.62876033782959, "global_step": 286980, "epoch": 1708} {"train_loss": -12.029990196228027, "global_step": 286981, "epoch": 1708} {"train_loss": -11.88730239868164, "global_step": 286982, "epoch": 1708} {"train_loss": -11.539453506469727, "global_step": 286983, "epoch": 1708} {"train_loss": -11.925559997558594, "global_step": 286984, "epoch": 1708} {"train_loss": -11.595996856689453, "global_step": 286985, "epoch": 1708} {"train_loss": -11.862533569335938, "global_step": 286986, "epoch": 1708} {"train_loss": -11.793460845947266, "global_step": 286987, "epoch": 1708} {"train_loss": -11.515575408935547, "global_step": 286988, "epoch": 1708} {"train_loss": -11.883020401000977, "global_step": 286989, "epoch": 1708} {"train_loss": -11.364584922790527, "global_step": 286990, "epoch": 1708} {"train_loss": -11.983633041381836, "global_step": 286991, "epoch": 1708} {"train_loss": -11.8773832321167, "global_step": 286992, "epoch": 1708} {"train_loss": -11.999092102050781, "global_step": 286993, "epoch": 1708} {"train_loss": -11.9552640914917, "global_step": 286994, "epoch": 1708} {"train_loss": -12.037816047668457, "global_step": 286995, "epoch": 1708} {"train_loss": -11.939634323120117, "global_step": 286996, "epoch": 1708} {"train_loss": -11.921157836914062, "global_step": 286997, "epoch": 1708} {"train_loss": -12.181143760681152, "global_step": 286998, "epoch": 1708} {"train_loss": -11.888626098632812, "global_step": 286999, "epoch": 1708} {"train_loss": -12.353324890136719, "global_step": 287000, "epoch": 1708} {"train_loss": -12.110477447509766, "global_step": 287001, "epoch": 1708} {"train_loss": -12.062332153320312, "global_step": 287002, "epoch": 1708} {"train_loss": -11.787903785705566, "global_step": 287003, "epoch": 1708} {"train_loss": -12.244619369506836, "global_step": 287004, "epoch": 1708} {"train_loss": -11.84195327758789, "global_step": 287005, "epoch": 1708} {"train_loss": -11.762163162231445, "global_step": 287006, "epoch": 1708} {"train_loss": -12.1454439163208, "global_step": 287007, "epoch": 1708} {"train_loss": -11.733263969421387, "global_step": 287008, "epoch": 1708} {"train_loss": -12.153136253356934, "global_step": 287009, "epoch": 1708} {"train_loss": -12.143698692321777, "global_step": 287010, "epoch": 1708} {"train_loss": -11.778517723083496, "global_step": 287011, "epoch": 1708} {"train_loss": -11.695859909057617, "global_step": 287012, "epoch": 1708} {"train_loss": -12.241569519042969, "global_step": 287013, "epoch": 1708} {"train_loss": -11.744155883789062, "global_step": 287014, "epoch": 1708} {"train_loss": -11.848423957824707, "global_step": 287015, "epoch": 1708} {"train_loss": -12.369575500488281, "global_step": 287016, "epoch": 1708} {"train_loss": -11.948805809020996, "global_step": 287017, "epoch": 1708} {"train_loss": -12.05277156829834, "global_step": 287018, "epoch": 1708} {"train_loss": -12.379472732543945, "global_step": 287019, "epoch": 1708} {"train_loss": -11.94078254699707, "global_step": 287020, "epoch": 1708} {"train_loss": -12.098779678344727, "global_step": 287021, "epoch": 1708} {"train_loss": -12.399042129516602, "global_step": 287022, "epoch": 1708} {"train_loss": -12.089066505432129, "global_step": 287023, "epoch": 1708} {"train_loss": -12.427974700927734, "global_step": 287024, "epoch": 1708} {"train_loss": -12.126021385192871, "global_step": 287025, "epoch": 1708} {"train_loss": -12.319099426269531, "global_step": 287026, "epoch": 1708} {"train_loss": -12.285850524902344, "global_step": 287027, "epoch": 1708} {"train_loss": -12.406148910522461, "global_step": 287028, "epoch": 1708} {"train_loss": -12.380168914794922, "global_step": 287029, "epoch": 1708} {"train_loss": -12.388931274414062, "global_step": 287030, "epoch": 1708} {"train_loss": -12.426576614379883, "global_step": 287031, "epoch": 1708} {"train_loss": -12.446727752685547, "global_step": 287032, "epoch": 1708} {"train_loss": -12.451519966125488, "global_step": 287033, "epoch": 1708} {"train_loss": -12.41496753692627, "global_step": 287034, "epoch": 1708} {"train_loss": -12.165014266967773, "global_step": 287035, "epoch": 1708} {"train_loss": -12.327278137207031, "global_step": 287036, "epoch": 1708} {"train_loss": -12.211756706237793, "global_step": 287037, "epoch": 1708} {"train_loss": -12.244721412658691, "global_step": 287038, "epoch": 1708} {"train_loss": -11.872859954833984, "global_step": 287039, "epoch": 1708} {"train_loss": -12.175703048706055, "global_step": 287040, "epoch": 1708} {"train_loss": -11.840447425842285, "global_step": 287041, "epoch": 1708} {"train_loss": -12.350616455078125, "global_step": 287042, "epoch": 1708} {"train_loss": -11.839818954467773, "global_step": 287043, "epoch": 1708} {"train_loss": -12.322046279907227, "global_step": 287044, "epoch": 1708} {"train_loss": -12.210380554199219, "global_step": 287045, "epoch": 1708} {"train_loss": -12.336864471435547, "global_step": 287046, "epoch": 1708} {"train_loss": -12.267232894897461, "global_step": 287047, "epoch": 1708} {"train_loss": -12.300068855285645, "global_step": 287048, "epoch": 1708} {"train_loss": -12.52293586730957, "global_step": 287049, "epoch": 1708} {"train_loss": -12.279708862304688, "global_step": 287050, "epoch": 1708} {"train_loss": -12.335709571838379, "global_step": 287051, "epoch": 1708} {"train_loss": -11.971563339233398, "global_step": 287052, "epoch": 1708} {"train_loss": -12.034560203552246, "global_step": 287053, "epoch": 1708} {"train_loss": -12.032051086425781, "global_step": 287054, "epoch": 1708} {"train_loss": -12.085455894470215, "global_step": 287055, "epoch": 1708} {"train_loss": -11.916352272033691, "global_step": 287056, "epoch": 1708} {"train_loss": -10.716924667358398, "global_step": 287057, "epoch": 1708} {"train_loss": -11.75699234008789, "global_step": 287058, "epoch": 1708} {"train_loss": -10.567938804626465, "global_step": 287059, "epoch": 1708} {"train_loss": -10.103095054626465, "global_step": 287060, "epoch": 1708} {"train_loss": -11.01616096496582, "global_step": 287061, "epoch": 1708} {"train_loss": -11.489733695983887, "global_step": 287062, "epoch": 1708} {"train_loss": -9.140401840209961, "global_step": 287063, "epoch": 1708} {"train_loss": -10.79296875, "global_step": 287064, "epoch": 1708} {"train_loss": -11.1503267288208, "global_step": 287065, "epoch": 1708} {"train_loss": -9.464859962463379, "global_step": 287066, "epoch": 1708} {"train_loss": -9.73733139038086, "global_step": 287067, "epoch": 1708} {"train_loss": -11.61281967163086, "global_step": 287068, "epoch": 1708} {"train_loss": -10.070194244384766, "global_step": 287069, "epoch": 1708} {"train_loss": -11.133241653442383, "global_step": 287070, "epoch": 1708} {"train_loss": -11.111927032470703, "global_step": 287071, "epoch": 1708} {"train_loss": -9.462173461914062, "global_step": 287072, "epoch": 1708} {"train_loss": -11.403234481811523, "global_step": 287073, "epoch": 1708} {"train_loss": -9.837230682373047, "global_step": 287074, "epoch": 1708} {"train_loss": -11.11915111541748, "global_step": 287075, "epoch": 1708} {"train_loss": -10.424087524414062, "global_step": 287076, "epoch": 1708} {"train_loss": -9.83344841003418, "global_step": 287077, "epoch": 1708} {"train_loss": -11.54664134979248, "global_step": 287078, "epoch": 1708} {"train_loss": -9.424736976623535, "global_step": 287079, "epoch": 1708} {"train_loss": -11.571090698242188, "global_step": 287080, "epoch": 1708} {"train_loss": -9.537675857543945, "global_step": 287081, "epoch": 1708} {"train_loss": -11.080265045166016, "global_step": 287082, "epoch": 1708} {"train_loss": -9.801441192626953, "global_step": 287083, "epoch": 1708} {"train_loss": -11.122132301330566, "global_step": 287084, "epoch": 1708} {"train_loss": -11.262779235839844, "global_step": 287085, "epoch": 1708} {"train_loss": -11.280881881713867, "global_step": 287086, "epoch": 1708} {"train_loss": -11.19888973236084, "global_step": 287087, "epoch": 1708} {"train_loss": -11.137039184570312, "global_step": 287088, "epoch": 1708} {"train_loss": -11.186330795288086, "global_step": 287089, "epoch": 1708} {"train_loss": -11.312456130981445, "global_step": 287090, "epoch": 1708} {"train_loss": -11.499736785888672, "global_step": 287091, "epoch": 1708} {"train_loss": -11.287975311279297, "global_step": 287092, "epoch": 1708} {"train_loss": -11.352428436279297, "global_step": 287093, "epoch": 1708} {"train_loss": -11.570598602294922, "global_step": 287094, "epoch": 1708} {"train_loss": -11.5458345413208, "global_step": 287095, "epoch": 1708} {"train_loss": -11.205352783203125, "global_step": 287096, "epoch": 1708} {"train_loss": -11.823188781738281, "global_step": 287097, "epoch": 1708} {"train_loss": -11.35493278503418, "global_step": 287098, "epoch": 1708} {"train_loss": -11.869884490966797, "global_step": 287099, "epoch": 1708} {"train_loss": -11.48328971862793, "global_step": 287100, "epoch": 1708} {"train_loss": -11.504414558410645, "global_step": 287101, "epoch": 1708} {"train_loss": -11.665628433227539, "global_step": 287102, "epoch": 1708} {"train_loss": -11.259456634521484, "global_step": 287103, "epoch": 1708} {"train_loss": -11.617766380310059, "global_step": 287104, "epoch": 1708} {"train_loss": -11.72262954711914, "global_step": 287105, "epoch": 1708} {"train_loss": -11.456422805786133, "global_step": 287106, "epoch": 1708} {"train_loss": -11.84227180480957, "global_step": 287107, "epoch": 1708} {"train_loss": -11.436561584472656, "global_step": 287108, "epoch": 1708} {"train_loss": -11.733955383300781, "global_step": 287109, "epoch": 1708} {"train_loss": -12.050626754760742, "global_step": 287110, "epoch": 1708} {"train_loss": -11.586923962547665, "global_step": 287111, "epoch": 1708, "val_loss": 266930.53125} {"train_loss": -11.885000228881836, "global_step": 287112, "epoch": 1709} {"train_loss": -11.93593978881836, "global_step": 287113, "epoch": 1709} {"train_loss": -11.759506225585938, "global_step": 287114, "epoch": 1709} {"train_loss": -11.795395851135254, "global_step": 287115, "epoch": 1709} {"train_loss": -12.107620239257812, "global_step": 287116, "epoch": 1709} {"train_loss": -12.152250289916992, "global_step": 287117, "epoch": 1709} {"train_loss": -12.242120742797852, "global_step": 287118, "epoch": 1709} {"train_loss": -12.266180038452148, "global_step": 287119, "epoch": 1709} {"train_loss": -12.06808853149414, "global_step": 287120, "epoch": 1709} {"train_loss": -12.03369140625, "global_step": 287121, "epoch": 1709} {"train_loss": -11.839134216308594, "global_step": 287122, "epoch": 1709} {"train_loss": -12.187280654907227, "global_step": 287123, "epoch": 1709} {"train_loss": -11.901860237121582, "global_step": 287124, "epoch": 1709} {"train_loss": -12.21635913848877, "global_step": 287125, "epoch": 1709} {"train_loss": -11.878805160522461, "global_step": 287126, "epoch": 1709} {"train_loss": -12.064288139343262, "global_step": 287127, "epoch": 1709} {"train_loss": -12.022552490234375, "global_step": 287128, "epoch": 1709} {"train_loss": -11.78964614868164, "global_step": 287129, "epoch": 1709} {"train_loss": -12.248719215393066, "global_step": 287130, "epoch": 1709} {"train_loss": -11.967987060546875, "global_step": 287131, "epoch": 1709} {"train_loss": -12.15632438659668, "global_step": 287132, "epoch": 1709} {"train_loss": -12.015237808227539, "global_step": 287133, "epoch": 1709} {"train_loss": -12.165811538696289, "global_step": 287134, "epoch": 1709} {"train_loss": -11.955940246582031, "global_step": 287135, "epoch": 1709} {"train_loss": -11.960807800292969, "global_step": 287136, "epoch": 1709} {"train_loss": -12.04963493347168, "global_step": 287137, "epoch": 1709} {"train_loss": -12.184429168701172, "global_step": 287138, "epoch": 1709} {"train_loss": -12.272479057312012, "global_step": 287139, "epoch": 1709} {"train_loss": -12.07269287109375, "global_step": 287140, "epoch": 1709} {"train_loss": -12.273602485656738, "global_step": 287141, "epoch": 1709} {"train_loss": -11.987424850463867, "global_step": 287142, "epoch": 1709} {"train_loss": -12.21690559387207, "global_step": 287143, "epoch": 1709} {"train_loss": -12.023811340332031, "global_step": 287144, "epoch": 1709} {"train_loss": -12.232759475708008, "global_step": 287145, "epoch": 1709} {"train_loss": -11.79588508605957, "global_step": 287146, "epoch": 1709} {"train_loss": -12.473812103271484, "global_step": 287147, "epoch": 1709} {"train_loss": -12.204324722290039, "global_step": 287148, "epoch": 1709} {"train_loss": -12.290294647216797, "global_step": 287149, "epoch": 1709} {"train_loss": -12.296107292175293, "global_step": 287150, "epoch": 1709} {"train_loss": -12.25190544128418, "global_step": 287151, "epoch": 1709} {"train_loss": -12.422433853149414, "global_step": 287152, "epoch": 1709} {"train_loss": -12.417169570922852, "global_step": 287153, "epoch": 1709} {"train_loss": -12.222028732299805, "global_step": 287154, "epoch": 1709} {"train_loss": -12.010554313659668, "global_step": 287155, "epoch": 1709} {"train_loss": -12.18910026550293, "global_step": 287156, "epoch": 1709} {"train_loss": -11.598222732543945, "global_step": 287157, "epoch": 1709} {"train_loss": -12.024906158447266, "global_step": 287158, "epoch": 1709} {"train_loss": -12.200763702392578, "global_step": 287159, "epoch": 1709} {"train_loss": -11.846809387207031, "global_step": 287160, "epoch": 1709} {"train_loss": -12.1276273727417, "global_step": 287161, "epoch": 1709} {"train_loss": -12.206242561340332, "global_step": 287162, "epoch": 1709} {"train_loss": -12.12618637084961, "global_step": 287163, "epoch": 1709} {"train_loss": -12.120122909545898, "global_step": 287164, "epoch": 1709} {"train_loss": -10.97407341003418, "global_step": 287165, "epoch": 1709} {"train_loss": -12.459051132202148, "global_step": 287166, "epoch": 1709} {"train_loss": -11.673297882080078, "global_step": 287167, "epoch": 1709} {"train_loss": -11.711587905883789, "global_step": 287168, "epoch": 1709} {"train_loss": -12.228373527526855, "global_step": 287169, "epoch": 1709} {"train_loss": -12.130762100219727, "global_step": 287170, "epoch": 1709} {"train_loss": -11.603619575500488, "global_step": 287171, "epoch": 1709} {"train_loss": -12.176538467407227, "global_step": 287172, "epoch": 1709} {"train_loss": -12.15113353729248, "global_step": 287173, "epoch": 1709} {"train_loss": -11.853303909301758, "global_step": 287174, "epoch": 1709} {"train_loss": -11.974838256835938, "global_step": 287175, "epoch": 1709} {"train_loss": -12.153217315673828, "global_step": 287176, "epoch": 1709} {"train_loss": -11.77336311340332, "global_step": 287177, "epoch": 1709} {"train_loss": -12.191959381103516, "global_step": 287178, "epoch": 1709} {"train_loss": -12.098812103271484, "global_step": 287179, "epoch": 1709} {"train_loss": -12.16806411743164, "global_step": 287180, "epoch": 1709} {"train_loss": -11.990119934082031, "global_step": 287181, "epoch": 1709} {"train_loss": -12.355218887329102, "global_step": 287182, "epoch": 1709} {"train_loss": -12.406291961669922, "global_step": 287183, "epoch": 1709} {"train_loss": -12.34202766418457, "global_step": 287184, "epoch": 1709} {"train_loss": -12.106677055358887, "global_step": 287185, "epoch": 1709} {"train_loss": -12.344646453857422, "global_step": 287186, "epoch": 1709} {"train_loss": -11.976694107055664, "global_step": 287187, "epoch": 1709} {"train_loss": -11.957855224609375, "global_step": 287188, "epoch": 1709} {"train_loss": -12.25584602355957, "global_step": 287189, "epoch": 1709} {"train_loss": -11.812646865844727, "global_step": 287190, "epoch": 1709} {"train_loss": -11.791179656982422, "global_step": 287191, "epoch": 1709} {"train_loss": -12.32163143157959, "global_step": 287192, "epoch": 1709} {"train_loss": -12.067117691040039, "global_step": 287193, "epoch": 1709} {"train_loss": -12.204460144042969, "global_step": 287194, "epoch": 1709} {"train_loss": -12.177169799804688, "global_step": 287195, "epoch": 1709} {"train_loss": -12.427964210510254, "global_step": 287196, "epoch": 1709} {"train_loss": -11.901262283325195, "global_step": 287197, "epoch": 1709} {"train_loss": -12.470020294189453, "global_step": 287198, "epoch": 1709} {"train_loss": -12.438461303710938, "global_step": 287199, "epoch": 1709} {"train_loss": -12.223876953125, "global_step": 287200, "epoch": 1709} {"train_loss": -12.376020431518555, "global_step": 287201, "epoch": 1709} {"train_loss": -12.289440155029297, "global_step": 287202, "epoch": 1709} {"train_loss": -12.467069625854492, "global_step": 287203, "epoch": 1709} {"train_loss": -12.251346588134766, "global_step": 287204, "epoch": 1709} {"train_loss": -12.125961303710938, "global_step": 287205, "epoch": 1709} {"train_loss": -12.25748062133789, "global_step": 287206, "epoch": 1709} {"train_loss": -12.07425308227539, "global_step": 287207, "epoch": 1709} {"train_loss": -12.416534423828125, "global_step": 287208, "epoch": 1709} {"train_loss": -12.28856372833252, "global_step": 287209, "epoch": 1709} {"train_loss": -12.181131362915039, "global_step": 287210, "epoch": 1709} {"train_loss": -11.678516387939453, "global_step": 287211, "epoch": 1709} {"train_loss": -11.811652183532715, "global_step": 287212, "epoch": 1709} {"train_loss": -11.95718002319336, "global_step": 287213, "epoch": 1709} {"train_loss": -12.34775161743164, "global_step": 287214, "epoch": 1709} {"train_loss": -11.88315486907959, "global_step": 287215, "epoch": 1709} {"train_loss": -11.612844467163086, "global_step": 287216, "epoch": 1709} {"train_loss": -12.304089546203613, "global_step": 287217, "epoch": 1709} {"train_loss": -11.942022323608398, "global_step": 287218, "epoch": 1709} {"train_loss": -11.202256202697754, "global_step": 287219, "epoch": 1709} {"train_loss": -11.931360244750977, "global_step": 287220, "epoch": 1709} {"train_loss": -10.745265007019043, "global_step": 287221, "epoch": 1709} {"train_loss": -9.259382247924805, "global_step": 287222, "epoch": 1709} {"train_loss": -11.46645736694336, "global_step": 287223, "epoch": 1709} {"train_loss": -8.862947463989258, "global_step": 287224, "epoch": 1709} {"train_loss": -8.738973617553711, "global_step": 287225, "epoch": 1709} {"train_loss": -11.622461318969727, "global_step": 287226, "epoch": 1709} {"train_loss": -8.514680862426758, "global_step": 287227, "epoch": 1709} {"train_loss": -8.621726989746094, "global_step": 287228, "epoch": 1709} {"train_loss": -8.295467376708984, "global_step": 287229, "epoch": 1709} {"train_loss": -9.444432258605957, "global_step": 287230, "epoch": 1709} {"train_loss": -7.241855621337891, "global_step": 287231, "epoch": 1709} {"train_loss": -9.29547119140625, "global_step": 287232, "epoch": 1709} {"train_loss": -8.49844741821289, "global_step": 287233, "epoch": 1709} {"train_loss": -7.933539867401123, "global_step": 287234, "epoch": 1709} {"train_loss": -9.81971549987793, "global_step": 287235, "epoch": 1709} {"train_loss": -8.627477645874023, "global_step": 287236, "epoch": 1709} {"train_loss": -10.167718887329102, "global_step": 287237, "epoch": 1709} {"train_loss": -8.639004707336426, "global_step": 287238, "epoch": 1709} {"train_loss": -9.695213317871094, "global_step": 287239, "epoch": 1709} {"train_loss": -9.448409080505371, "global_step": 287240, "epoch": 1709} {"train_loss": -9.818761825561523, "global_step": 287241, "epoch": 1709} {"train_loss": -9.544534683227539, "global_step": 287242, "epoch": 1709} {"train_loss": -9.097406387329102, "global_step": 287243, "epoch": 1709} {"train_loss": -10.467172622680664, "global_step": 287244, "epoch": 1709} {"train_loss": -10.057229995727539, "global_step": 287245, "epoch": 1709} {"train_loss": -9.29519271850586, "global_step": 287246, "epoch": 1709} {"train_loss": -10.842044830322266, "global_step": 287247, "epoch": 1709} {"train_loss": -9.870440483093262, "global_step": 287248, "epoch": 1709} {"train_loss": -10.739571571350098, "global_step": 287249, "epoch": 1709} {"train_loss": -10.509800910949707, "global_step": 287250, "epoch": 1709} {"train_loss": -11.035614013671875, "global_step": 287251, "epoch": 1709} {"train_loss": -10.639927864074707, "global_step": 287252, "epoch": 1709} {"train_loss": -10.801198959350586, "global_step": 287253, "epoch": 1709} {"train_loss": -10.784082412719727, "global_step": 287254, "epoch": 1709} {"train_loss": -10.322427749633789, "global_step": 287255, "epoch": 1709} {"train_loss": -11.33913803100586, "global_step": 287256, "epoch": 1709} {"train_loss": -10.357349395751953, "global_step": 287257, "epoch": 1709} {"train_loss": -10.747129440307617, "global_step": 287258, "epoch": 1709} {"train_loss": -10.907670974731445, "global_step": 287259, "epoch": 1709} {"train_loss": -10.490164756774902, "global_step": 287260, "epoch": 1709} {"train_loss": -10.842048645019531, "global_step": 287261, "epoch": 1709} {"train_loss": -10.322837829589844, "global_step": 287262, "epoch": 1709} {"train_loss": -10.791126251220703, "global_step": 287263, "epoch": 1709} {"train_loss": -11.075437545776367, "global_step": 287264, "epoch": 1709} {"train_loss": -10.287220001220703, "global_step": 287265, "epoch": 1709} {"train_loss": -10.932915687561035, "global_step": 287266, "epoch": 1709} {"train_loss": -10.975622177124023, "global_step": 287267, "epoch": 1709} {"train_loss": -10.7152099609375, "global_step": 287268, "epoch": 1709} {"train_loss": -10.948986053466797, "global_step": 287269, "epoch": 1709} {"train_loss": -10.724446296691895, "global_step": 287270, "epoch": 1709} {"train_loss": -11.421829223632812, "global_step": 287271, "epoch": 1709} {"train_loss": -11.102916717529297, "global_step": 287272, "epoch": 1709} {"train_loss": -10.970186233520508, "global_step": 287273, "epoch": 1709} {"train_loss": -11.780684471130371, "global_step": 287274, "epoch": 1709} {"train_loss": -10.940649032592773, "global_step": 287275, "epoch": 1709} {"train_loss": -11.376300811767578, "global_step": 287276, "epoch": 1709} {"train_loss": -11.542191505432129, "global_step": 287277, "epoch": 1709} {"train_loss": -11.32751750946045, "global_step": 287278, "epoch": 1709} {"train_loss": -11.423844294888633, "global_step": 287279, "epoch": 1709, "val_loss": 272604.03125} {"train_loss": -11.564074516296387, "global_step": 287280, "epoch": 1710} {"train_loss": -11.483318328857422, "global_step": 287281, "epoch": 1710} {"train_loss": -11.699348449707031, "global_step": 287282, "epoch": 1710} {"train_loss": -11.739643096923828, "global_step": 287283, "epoch": 1710} {"train_loss": -11.63410472869873, "global_step": 287284, "epoch": 1710} {"train_loss": -11.424201965332031, "global_step": 287285, "epoch": 1710} {"train_loss": -11.580429077148438, "global_step": 287286, "epoch": 1710} {"train_loss": -11.678857803344727, "global_step": 287287, "epoch": 1710} {"train_loss": -11.907681465148926, "global_step": 287288, "epoch": 1710} {"train_loss": -11.861202239990234, "global_step": 287289, "epoch": 1710} {"train_loss": -11.759062767028809, "global_step": 287290, "epoch": 1710} {"train_loss": -11.643808364868164, "global_step": 287291, "epoch": 1710} {"train_loss": -11.783849716186523, "global_step": 287292, "epoch": 1710} {"train_loss": -11.728022575378418, "global_step": 287293, "epoch": 1710} {"train_loss": -11.64033031463623, "global_step": 287294, "epoch": 1710} {"train_loss": -11.741643905639648, "global_step": 287295, "epoch": 1710} {"train_loss": -11.799924850463867, "global_step": 287296, "epoch": 1710} {"train_loss": -11.758523941040039, "global_step": 287297, "epoch": 1710} {"train_loss": -11.843744277954102, "global_step": 287298, "epoch": 1710} {"train_loss": -11.87923526763916, "global_step": 287299, "epoch": 1710} {"train_loss": -11.94403076171875, "global_step": 287300, "epoch": 1710} {"train_loss": -11.9862642288208, "global_step": 287301, "epoch": 1710} {"train_loss": -11.775162696838379, "global_step": 287302, "epoch": 1710} {"train_loss": -12.002599716186523, "global_step": 287303, "epoch": 1710} {"train_loss": -11.942183494567871, "global_step": 287304, "epoch": 1710} {"train_loss": -12.063835144042969, "global_step": 287305, "epoch": 1710} {"train_loss": -11.99964427947998, "global_step": 287306, "epoch": 1710} {"train_loss": -11.731414794921875, "global_step": 287307, "epoch": 1710} {"train_loss": -12.027576446533203, "global_step": 287308, "epoch": 1710} {"train_loss": -11.959444046020508, "global_step": 287309, "epoch": 1710} {"train_loss": -12.04216194152832, "global_step": 287310, "epoch": 1710} {"train_loss": -12.032392501831055, "global_step": 287311, "epoch": 1710} {"train_loss": -12.086409568786621, "global_step": 287312, "epoch": 1710} {"train_loss": -12.075300216674805, "global_step": 287313, "epoch": 1710} {"train_loss": -12.201681137084961, "global_step": 287314, "epoch": 1710} {"train_loss": -12.119584083557129, "global_step": 287315, "epoch": 1710} {"train_loss": -12.016166687011719, "global_step": 287316, "epoch": 1710} {"train_loss": -12.201362609863281, "global_step": 287317, "epoch": 1710} {"train_loss": -12.015990257263184, "global_step": 287318, "epoch": 1710} {"train_loss": -12.266643524169922, "global_step": 287319, "epoch": 1710} {"train_loss": -12.074965476989746, "global_step": 287320, "epoch": 1710} {"train_loss": -12.237859725952148, "global_step": 287321, "epoch": 1710} {"train_loss": -12.063919067382812, "global_step": 287322, "epoch": 1710} {"train_loss": -12.182519912719727, "global_step": 287323, "epoch": 1710} {"train_loss": -12.143598556518555, "global_step": 287324, "epoch": 1710} {"train_loss": -12.340787887573242, "global_step": 287325, "epoch": 1710} {"train_loss": -12.167158126831055, "global_step": 287326, "epoch": 1710} {"train_loss": -12.149611473083496, "global_step": 287327, "epoch": 1710} {"train_loss": -12.350748062133789, "global_step": 287328, "epoch": 1710} {"train_loss": -12.258251190185547, "global_step": 287329, "epoch": 1710} {"train_loss": -12.160117149353027, "global_step": 287330, "epoch": 1710} {"train_loss": -12.445905685424805, "global_step": 287331, "epoch": 1710} {"train_loss": -12.234991073608398, "global_step": 287332, "epoch": 1710} {"train_loss": -12.347855567932129, "global_step": 287333, "epoch": 1710} {"train_loss": -12.360321044921875, "global_step": 287334, "epoch": 1710} {"train_loss": -12.427831649780273, "global_step": 287335, "epoch": 1710} {"train_loss": -12.322137832641602, "global_step": 287336, "epoch": 1710} {"train_loss": -12.370233535766602, "global_step": 287337, "epoch": 1710} {"train_loss": -12.452518463134766, "global_step": 287338, "epoch": 1710} {"train_loss": -12.144638061523438, "global_step": 287339, "epoch": 1710} {"train_loss": -12.261868476867676, "global_step": 287340, "epoch": 1710} {"train_loss": -12.351428985595703, "global_step": 287341, "epoch": 1710} {"train_loss": -12.30398941040039, "global_step": 287342, "epoch": 1710} {"train_loss": -12.560966491699219, "global_step": 287343, "epoch": 1710} {"train_loss": -12.409441947937012, "global_step": 287344, "epoch": 1710} {"train_loss": -12.372669219970703, "global_step": 287345, "epoch": 1710} {"train_loss": -12.583754539489746, "global_step": 287346, "epoch": 1710} {"train_loss": -12.310325622558594, "global_step": 287347, "epoch": 1710} {"train_loss": -12.467552185058594, "global_step": 287348, "epoch": 1710} {"train_loss": -12.549842834472656, "global_step": 287349, "epoch": 1710} {"train_loss": -12.30109977722168, "global_step": 287350, "epoch": 1710} {"train_loss": -12.462602615356445, "global_step": 287351, "epoch": 1710} {"train_loss": -12.459342956542969, "global_step": 287352, "epoch": 1710} {"train_loss": -12.314233779907227, "global_step": 287353, "epoch": 1710} {"train_loss": -12.143047332763672, "global_step": 287354, "epoch": 1710} {"train_loss": -12.374034881591797, "global_step": 287355, "epoch": 1710} {"train_loss": -12.526887893676758, "global_step": 287356, "epoch": 1710} {"train_loss": -12.235769271850586, "global_step": 287357, "epoch": 1710} {"train_loss": -12.426244735717773, "global_step": 287358, "epoch": 1710} {"train_loss": -12.515270233154297, "global_step": 287359, "epoch": 1710} {"train_loss": -12.328161239624023, "global_step": 287360, "epoch": 1710} {"train_loss": -12.256917953491211, "global_step": 287361, "epoch": 1710} {"train_loss": -12.173698425292969, "global_step": 287362, "epoch": 1710} {"train_loss": -12.363058090209961, "global_step": 287363, "epoch": 1710} {"train_loss": -12.434995651245117, "global_step": 287364, "epoch": 1710} {"train_loss": -12.351676940917969, "global_step": 287365, "epoch": 1710} {"train_loss": -12.40878963470459, "global_step": 287366, "epoch": 1710} {"train_loss": -12.228975296020508, "global_step": 287367, "epoch": 1710} {"train_loss": -12.346174240112305, "global_step": 287368, "epoch": 1710} {"train_loss": -12.35893440246582, "global_step": 287369, "epoch": 1710} {"train_loss": -12.182985305786133, "global_step": 287370, "epoch": 1710} {"train_loss": -11.303106307983398, "global_step": 287371, "epoch": 1710} {"train_loss": -10.9584379196167, "global_step": 287372, "epoch": 1710} {"train_loss": -12.10953140258789, "global_step": 287373, "epoch": 1710} {"train_loss": -11.326781272888184, "global_step": 287374, "epoch": 1710} {"train_loss": -10.848905563354492, "global_step": 287375, "epoch": 1710} {"train_loss": -10.580663681030273, "global_step": 287376, "epoch": 1710} {"train_loss": -9.915203094482422, "global_step": 287377, "epoch": 1710} {"train_loss": -11.496623992919922, "global_step": 287378, "epoch": 1710} {"train_loss": -8.882051467895508, "global_step": 287379, "epoch": 1710} {"train_loss": -7.8842620849609375, "global_step": 287380, "epoch": 1710} {"train_loss": -8.757335662841797, "global_step": 287381, "epoch": 1710} {"train_loss": -10.26209545135498, "global_step": 287382, "epoch": 1710} {"train_loss": -9.183479309082031, "global_step": 287383, "epoch": 1710} {"train_loss": -10.05740737915039, "global_step": 287384, "epoch": 1710} {"train_loss": -10.758363723754883, "global_step": 287385, "epoch": 1710} {"train_loss": -9.254018783569336, "global_step": 287386, "epoch": 1710} {"train_loss": -11.579216003417969, "global_step": 287387, "epoch": 1710} {"train_loss": -9.089410781860352, "global_step": 287388, "epoch": 1710} {"train_loss": -10.847705841064453, "global_step": 287389, "epoch": 1710} {"train_loss": -9.389959335327148, "global_step": 287390, "epoch": 1710} {"train_loss": -9.539104461669922, "global_step": 287391, "epoch": 1710} {"train_loss": -10.859902381896973, "global_step": 287392, "epoch": 1710} {"train_loss": -7.854187488555908, "global_step": 287393, "epoch": 1710} {"train_loss": -11.543207168579102, "global_step": 287394, "epoch": 1710} {"train_loss": -8.897001266479492, "global_step": 287395, "epoch": 1710} {"train_loss": -11.084717750549316, "global_step": 287396, "epoch": 1710} {"train_loss": -9.783978462219238, "global_step": 287397, "epoch": 1710} {"train_loss": -10.219087600708008, "global_step": 287398, "epoch": 1710} {"train_loss": -10.463715553283691, "global_step": 287399, "epoch": 1710} {"train_loss": -11.173580169677734, "global_step": 287400, "epoch": 1710} {"train_loss": -10.897104263305664, "global_step": 287401, "epoch": 1710} {"train_loss": -11.322351455688477, "global_step": 287402, "epoch": 1710} {"train_loss": -11.05116081237793, "global_step": 287403, "epoch": 1710} {"train_loss": -11.158534049987793, "global_step": 287404, "epoch": 1710} {"train_loss": -11.117471694946289, "global_step": 287405, "epoch": 1710} {"train_loss": -11.341644287109375, "global_step": 287406, "epoch": 1710} {"train_loss": -10.825533866882324, "global_step": 287407, "epoch": 1710} {"train_loss": -11.741218566894531, "global_step": 287408, "epoch": 1710} {"train_loss": -11.084182739257812, "global_step": 287409, "epoch": 1710} {"train_loss": -11.727474212646484, "global_step": 287410, "epoch": 1710} {"train_loss": -11.387990951538086, "global_step": 287411, "epoch": 1710} {"train_loss": -11.465986251831055, "global_step": 287412, "epoch": 1710} {"train_loss": -11.380048751831055, "global_step": 287413, "epoch": 1710} {"train_loss": -11.532487869262695, "global_step": 287414, "epoch": 1710} {"train_loss": -11.658626556396484, "global_step": 287415, "epoch": 1710} {"train_loss": -11.524261474609375, "global_step": 287416, "epoch": 1710} {"train_loss": -11.801013946533203, "global_step": 287417, "epoch": 1710} {"train_loss": -11.716177940368652, "global_step": 287418, "epoch": 1710} {"train_loss": -11.748160362243652, "global_step": 287419, "epoch": 1710} {"train_loss": -12.007275581359863, "global_step": 287420, "epoch": 1710} {"train_loss": -11.693815231323242, "global_step": 287421, "epoch": 1710} {"train_loss": -11.864742279052734, "global_step": 287422, "epoch": 1710} {"train_loss": -11.870341300964355, "global_step": 287423, "epoch": 1710} {"train_loss": -11.896255493164062, "global_step": 287424, "epoch": 1710} {"train_loss": -11.907793045043945, "global_step": 287425, "epoch": 1710} {"train_loss": -11.955734252929688, "global_step": 287426, "epoch": 1710} {"train_loss": -12.07879638671875, "global_step": 287427, "epoch": 1710} {"train_loss": -11.877017974853516, "global_step": 287428, "epoch": 1710} {"train_loss": -11.741188049316406, "global_step": 287429, "epoch": 1710} {"train_loss": -11.971770286560059, "global_step": 287430, "epoch": 1710} {"train_loss": -12.00384521484375, "global_step": 287431, "epoch": 1710} {"train_loss": -11.831315040588379, "global_step": 287432, "epoch": 1710} {"train_loss": -11.958114624023438, "global_step": 287433, "epoch": 1710} {"train_loss": -12.017426490783691, "global_step": 287434, "epoch": 1710} {"train_loss": -12.050765037536621, "global_step": 287435, "epoch": 1710} {"train_loss": -11.910894393920898, "global_step": 287436, "epoch": 1710} {"train_loss": -12.133889198303223, "global_step": 287437, "epoch": 1710} {"train_loss": -12.18140983581543, "global_step": 287438, "epoch": 1710} {"train_loss": -11.826606750488281, "global_step": 287439, "epoch": 1710} {"train_loss": -12.30771255493164, "global_step": 287440, "epoch": 1710} {"train_loss": -12.206323623657227, "global_step": 287441, "epoch": 1710} {"train_loss": -12.340679168701172, "global_step": 287442, "epoch": 1710} {"train_loss": -12.096842765808105, "global_step": 287443, "epoch": 1710} {"train_loss": -11.976198196411133, "global_step": 287444, "epoch": 1710} {"train_loss": -11.989426612854004, "global_step": 287445, "epoch": 1710} {"train_loss": -12.154455184936523, "global_step": 287446, "epoch": 1710} {"train_loss": -11.677122811476389, "global_step": 287447, "epoch": 1710, "val_loss": 275281.1875, "train_action_mse_error": 4.074514389038086} {"train_loss": -12.01194953918457, "global_step": 287448, "epoch": 1711} {"train_loss": -12.374044418334961, "global_step": 287449, "epoch": 1711} {"train_loss": -12.052887916564941, "global_step": 287450, "epoch": 1711} {"train_loss": -12.093023300170898, "global_step": 287451, "epoch": 1711} {"train_loss": -12.263221740722656, "global_step": 287452, "epoch": 1711} {"train_loss": -12.281257629394531, "global_step": 287453, "epoch": 1711} {"train_loss": -12.318232536315918, "global_step": 287454, "epoch": 1711} {"train_loss": -12.021184921264648, "global_step": 287455, "epoch": 1711} {"train_loss": -11.934688568115234, "global_step": 287456, "epoch": 1711} {"train_loss": -12.311220169067383, "global_step": 287457, "epoch": 1711} {"train_loss": -12.381025314331055, "global_step": 287458, "epoch": 1711} {"train_loss": -12.159168243408203, "global_step": 287459, "epoch": 1711} {"train_loss": -12.253488540649414, "global_step": 287460, "epoch": 1711} {"train_loss": -12.171491622924805, "global_step": 287461, "epoch": 1711} {"train_loss": -12.149322509765625, "global_step": 287462, "epoch": 1711} {"train_loss": -12.245940208435059, "global_step": 287463, "epoch": 1711} {"train_loss": -12.295193672180176, "global_step": 287464, "epoch": 1711} {"train_loss": -12.11729621887207, "global_step": 287465, "epoch": 1711} {"train_loss": -12.273801803588867, "global_step": 287466, "epoch": 1711} {"train_loss": -12.258329391479492, "global_step": 287467, "epoch": 1711} {"train_loss": -12.15627670288086, "global_step": 287468, "epoch": 1711} {"train_loss": -12.426848411560059, "global_step": 287469, "epoch": 1711} {"train_loss": -12.382047653198242, "global_step": 287470, "epoch": 1711} {"train_loss": -12.252923965454102, "global_step": 287471, "epoch": 1711} {"train_loss": -12.344955444335938, "global_step": 287472, "epoch": 1711} {"train_loss": -12.449569702148438, "global_step": 287473, "epoch": 1711} {"train_loss": -12.271427154541016, "global_step": 287474, "epoch": 1711} {"train_loss": -12.272918701171875, "global_step": 287475, "epoch": 1711} {"train_loss": -12.239047050476074, "global_step": 287476, "epoch": 1711} {"train_loss": -12.593435287475586, "global_step": 287477, "epoch": 1711} {"train_loss": -12.38765811920166, "global_step": 287478, "epoch": 1711} {"train_loss": -12.41390609741211, "global_step": 287479, "epoch": 1711} {"train_loss": -12.449216842651367, "global_step": 287480, "epoch": 1711} {"train_loss": -12.363622665405273, "global_step": 287481, "epoch": 1711} {"train_loss": -12.303363800048828, "global_step": 287482, "epoch": 1711} {"train_loss": -12.456707000732422, "global_step": 287483, "epoch": 1711} {"train_loss": -12.449430465698242, "global_step": 287484, "epoch": 1711} {"train_loss": -12.496990203857422, "global_step": 287485, "epoch": 1711} {"train_loss": -12.468966484069824, "global_step": 287486, "epoch": 1711} {"train_loss": -12.298179626464844, "global_step": 287487, "epoch": 1711} {"train_loss": -12.224780082702637, "global_step": 287488, "epoch": 1711} {"train_loss": -12.327834129333496, "global_step": 287489, "epoch": 1711} {"train_loss": -12.435907363891602, "global_step": 287490, "epoch": 1711} {"train_loss": -12.176362991333008, "global_step": 287491, "epoch": 1711} {"train_loss": -12.37745475769043, "global_step": 287492, "epoch": 1711} {"train_loss": -11.987783432006836, "global_step": 287493, "epoch": 1711} {"train_loss": -10.586418151855469, "global_step": 287494, "epoch": 1711} {"train_loss": -11.528589248657227, "global_step": 287495, "epoch": 1711} {"train_loss": -12.295512199401855, "global_step": 287496, "epoch": 1711} {"train_loss": -11.905688285827637, "global_step": 287497, "epoch": 1711} {"train_loss": -11.427610397338867, "global_step": 287498, "epoch": 1711} {"train_loss": -12.275796890258789, "global_step": 287499, "epoch": 1711} {"train_loss": -12.230146408081055, "global_step": 287500, "epoch": 1711} {"train_loss": -11.155915260314941, "global_step": 287501, "epoch": 1711} {"train_loss": -11.833329200744629, "global_step": 287502, "epoch": 1711} {"train_loss": -11.878434181213379, "global_step": 287503, "epoch": 1711} {"train_loss": -11.850944519042969, "global_step": 287504, "epoch": 1711} {"train_loss": -11.495645523071289, "global_step": 287505, "epoch": 1711} {"train_loss": -11.874600410461426, "global_step": 287506, "epoch": 1711} {"train_loss": -12.070415496826172, "global_step": 287507, "epoch": 1711} {"train_loss": -11.639120101928711, "global_step": 287508, "epoch": 1711} {"train_loss": -12.219612121582031, "global_step": 287509, "epoch": 1711} {"train_loss": -11.578939437866211, "global_step": 287510, "epoch": 1711} {"train_loss": -11.335641860961914, "global_step": 287511, "epoch": 1711} {"train_loss": -11.812553405761719, "global_step": 287512, "epoch": 1711} {"train_loss": -12.042524337768555, "global_step": 287513, "epoch": 1711} {"train_loss": -10.909732818603516, "global_step": 287514, "epoch": 1711} {"train_loss": -12.217330932617188, "global_step": 287515, "epoch": 1711} {"train_loss": -11.886701583862305, "global_step": 287516, "epoch": 1711} {"train_loss": -11.236881256103516, "global_step": 287517, "epoch": 1711} {"train_loss": -11.267471313476562, "global_step": 287518, "epoch": 1711} {"train_loss": -12.093685150146484, "global_step": 287519, "epoch": 1711} {"train_loss": -10.478302001953125, "global_step": 287520, "epoch": 1711} {"train_loss": -11.151270866394043, "global_step": 287521, "epoch": 1711} {"train_loss": -11.767757415771484, "global_step": 287522, "epoch": 1711} {"train_loss": -10.826618194580078, "global_step": 287523, "epoch": 1711} {"train_loss": -11.275280952453613, "global_step": 287524, "epoch": 1711} {"train_loss": -11.088820457458496, "global_step": 287525, "epoch": 1711} {"train_loss": -9.417734146118164, "global_step": 287526, "epoch": 1711} {"train_loss": -10.435722351074219, "global_step": 287527, "epoch": 1711} {"train_loss": -9.620269775390625, "global_step": 287528, "epoch": 1711} {"train_loss": -11.256756782531738, "global_step": 287529, "epoch": 1711} {"train_loss": -10.13457202911377, "global_step": 287530, "epoch": 1711} {"train_loss": -9.480971336364746, "global_step": 287531, "epoch": 1711} {"train_loss": -10.764087677001953, "global_step": 287532, "epoch": 1711} {"train_loss": -10.970484733581543, "global_step": 287533, "epoch": 1711} {"train_loss": -9.960210800170898, "global_step": 287534, "epoch": 1711} {"train_loss": -11.725288391113281, "global_step": 287535, "epoch": 1711} {"train_loss": -10.901278495788574, "global_step": 287536, "epoch": 1711} {"train_loss": -11.808860778808594, "global_step": 287537, "epoch": 1711} {"train_loss": -11.46451187133789, "global_step": 287538, "epoch": 1711} {"train_loss": -10.734480857849121, "global_step": 287539, "epoch": 1711} {"train_loss": -12.05395221710205, "global_step": 287540, "epoch": 1711} {"train_loss": -11.038712501525879, "global_step": 287541, "epoch": 1711} {"train_loss": -11.713109970092773, "global_step": 287542, "epoch": 1711} {"train_loss": -11.603165626525879, "global_step": 287543, "epoch": 1711} {"train_loss": -11.457047462463379, "global_step": 287544, "epoch": 1711} {"train_loss": -11.686335563659668, "global_step": 287545, "epoch": 1711} {"train_loss": -11.56135368347168, "global_step": 287546, "epoch": 1711} {"train_loss": -11.74178695678711, "global_step": 287547, "epoch": 1711} {"train_loss": -11.919069290161133, "global_step": 287548, "epoch": 1711} {"train_loss": -11.7526216506958, "global_step": 287549, "epoch": 1711} {"train_loss": -11.648926734924316, "global_step": 287550, "epoch": 1711} {"train_loss": -11.57391357421875, "global_step": 287551, "epoch": 1711} {"train_loss": -11.542076110839844, "global_step": 287552, "epoch": 1711} {"train_loss": -11.620126724243164, "global_step": 287553, "epoch": 1711} {"train_loss": -11.79714298248291, "global_step": 287554, "epoch": 1711} {"train_loss": -11.739083290100098, "global_step": 287555, "epoch": 1711} {"train_loss": -11.494400024414062, "global_step": 287556, "epoch": 1711} {"train_loss": -11.84351634979248, "global_step": 287557, "epoch": 1711} {"train_loss": -12.123980522155762, "global_step": 287558, "epoch": 1711} {"train_loss": -11.821864128112793, "global_step": 287559, "epoch": 1711} {"train_loss": -11.868354797363281, "global_step": 287560, "epoch": 1711} {"train_loss": -11.89157485961914, "global_step": 287561, "epoch": 1711} {"train_loss": -11.874605178833008, "global_step": 287562, "epoch": 1711} {"train_loss": -12.093792915344238, "global_step": 287563, "epoch": 1711} {"train_loss": -12.096500396728516, "global_step": 287564, "epoch": 1711} {"train_loss": -11.968109130859375, "global_step": 287565, "epoch": 1711} {"train_loss": -12.129724502563477, "global_step": 287566, "epoch": 1711} {"train_loss": -11.940876960754395, "global_step": 287567, "epoch": 1711} {"train_loss": -11.922962188720703, "global_step": 287568, "epoch": 1711} {"train_loss": -12.14356803894043, "global_step": 287569, "epoch": 1711} {"train_loss": -12.316146850585938, "global_step": 287570, "epoch": 1711} {"train_loss": -12.246434211730957, "global_step": 287571, "epoch": 1711} {"train_loss": -12.202735900878906, "global_step": 287572, "epoch": 1711} {"train_loss": -12.062225341796875, "global_step": 287573, "epoch": 1711} {"train_loss": -12.163801193237305, "global_step": 287574, "epoch": 1711} {"train_loss": -12.110913276672363, "global_step": 287575, "epoch": 1711} {"train_loss": -12.026262283325195, "global_step": 287576, "epoch": 1711} {"train_loss": -12.076578140258789, "global_step": 287577, "epoch": 1711} {"train_loss": -12.242761611938477, "global_step": 287578, "epoch": 1711} {"train_loss": -11.937833786010742, "global_step": 287579, "epoch": 1711} {"train_loss": -11.894767761230469, "global_step": 287580, "epoch": 1711} {"train_loss": -11.948498725891113, "global_step": 287581, "epoch": 1711} {"train_loss": -12.38104248046875, "global_step": 287582, "epoch": 1711} {"train_loss": -11.90581226348877, "global_step": 287583, "epoch": 1711} {"train_loss": -12.229700088500977, "global_step": 287584, "epoch": 1711} {"train_loss": -11.851438522338867, "global_step": 287585, "epoch": 1711} {"train_loss": -11.563497543334961, "global_step": 287586, "epoch": 1711} {"train_loss": -12.132885932922363, "global_step": 287587, "epoch": 1711} {"train_loss": -11.636672019958496, "global_step": 287588, "epoch": 1711} {"train_loss": -11.924662590026855, "global_step": 287589, "epoch": 1711} {"train_loss": -12.213500022888184, "global_step": 287590, "epoch": 1711} {"train_loss": -11.82801342010498, "global_step": 287591, "epoch": 1711} {"train_loss": -11.99787425994873, "global_step": 287592, "epoch": 1711} {"train_loss": -12.175609588623047, "global_step": 287593, "epoch": 1711} {"train_loss": -12.172967910766602, "global_step": 287594, "epoch": 1711} {"train_loss": -11.938623428344727, "global_step": 287595, "epoch": 1711} {"train_loss": -11.83736515045166, "global_step": 287596, "epoch": 1711} {"train_loss": -11.791980743408203, "global_step": 287597, "epoch": 1711} {"train_loss": -12.11086368560791, "global_step": 287598, "epoch": 1711} {"train_loss": -12.334895133972168, "global_step": 287599, "epoch": 1711} {"train_loss": -11.847208023071289, "global_step": 287600, "epoch": 1711} {"train_loss": -12.231947898864746, "global_step": 287601, "epoch": 1711} {"train_loss": -12.051137924194336, "global_step": 287602, "epoch": 1711} {"train_loss": -11.969013214111328, "global_step": 287603, "epoch": 1711} {"train_loss": -12.127420425415039, "global_step": 287604, "epoch": 1711} {"train_loss": -12.227043151855469, "global_step": 287605, "epoch": 1711} {"train_loss": -12.291353225708008, "global_step": 287606, "epoch": 1711} {"train_loss": -12.058923721313477, "global_step": 287607, "epoch": 1711} {"train_loss": -12.16900634765625, "global_step": 287608, "epoch": 1711} {"train_loss": -12.2242431640625, "global_step": 287609, "epoch": 1711} {"train_loss": -12.009407997131348, "global_step": 287610, "epoch": 1711} {"train_loss": -12.414192199707031, "global_step": 287611, "epoch": 1711} {"train_loss": -12.169092178344727, "global_step": 287612, "epoch": 1711} {"train_loss": -12.348663330078125, "global_step": 287613, "epoch": 1711} {"train_loss": -12.316374778747559, "global_step": 287614, "epoch": 1711} {"train_loss": -11.872716398466201, "global_step": 287615, "epoch": 1711, "val_loss": 275361.1875} {"train_loss": -11.952116012573242, "global_step": 287616, "epoch": 1712} {"train_loss": -12.238994598388672, "global_step": 287617, "epoch": 1712} {"train_loss": -12.243457794189453, "global_step": 287618, "epoch": 1712} {"train_loss": -12.362764358520508, "global_step": 287619, "epoch": 1712} {"train_loss": -12.27376937866211, "global_step": 287620, "epoch": 1712} {"train_loss": -11.992390632629395, "global_step": 287621, "epoch": 1712} {"train_loss": -12.416509628295898, "global_step": 287622, "epoch": 1712} {"train_loss": -12.225805282592773, "global_step": 287623, "epoch": 1712} {"train_loss": -12.367986679077148, "global_step": 287624, "epoch": 1712} {"train_loss": -12.21503734588623, "global_step": 287625, "epoch": 1712} {"train_loss": -11.815814971923828, "global_step": 287626, "epoch": 1712} {"train_loss": -12.375310897827148, "global_step": 287627, "epoch": 1712} {"train_loss": -12.300479888916016, "global_step": 287628, "epoch": 1712} {"train_loss": -12.013565063476562, "global_step": 287629, "epoch": 1712} {"train_loss": -11.79887580871582, "global_step": 287630, "epoch": 1712} {"train_loss": -12.06538200378418, "global_step": 287631, "epoch": 1712} {"train_loss": -12.331850051879883, "global_step": 287632, "epoch": 1712} {"train_loss": -11.795700073242188, "global_step": 287633, "epoch": 1712} {"train_loss": -12.518767356872559, "global_step": 287634, "epoch": 1712} {"train_loss": -12.356971740722656, "global_step": 287635, "epoch": 1712} {"train_loss": -12.359254837036133, "global_step": 287636, "epoch": 1712} {"train_loss": -11.550468444824219, "global_step": 287637, "epoch": 1712} {"train_loss": -11.918313980102539, "global_step": 287638, "epoch": 1712} {"train_loss": -12.22256088256836, "global_step": 287639, "epoch": 1712} {"train_loss": -12.27012825012207, "global_step": 287640, "epoch": 1712} {"train_loss": -12.333695411682129, "global_step": 287641, "epoch": 1712} {"train_loss": -12.37424373626709, "global_step": 287642, "epoch": 1712} {"train_loss": -12.433738708496094, "global_step": 287643, "epoch": 1712} {"train_loss": -12.12872314453125, "global_step": 287644, "epoch": 1712} {"train_loss": -12.328035354614258, "global_step": 287645, "epoch": 1712} {"train_loss": -12.149225234985352, "global_step": 287646, "epoch": 1712} {"train_loss": -12.270280838012695, "global_step": 287647, "epoch": 1712} {"train_loss": -12.296721458435059, "global_step": 287648, "epoch": 1712} {"train_loss": -12.264066696166992, "global_step": 287649, "epoch": 1712} {"train_loss": -12.136425018310547, "global_step": 287650, "epoch": 1712} {"train_loss": -11.824671745300293, "global_step": 287651, "epoch": 1712} {"train_loss": -12.37989616394043, "global_step": 287652, "epoch": 1712} {"train_loss": -11.680179595947266, "global_step": 287653, "epoch": 1712} {"train_loss": -11.731355667114258, "global_step": 287654, "epoch": 1712} {"train_loss": -11.531387329101562, "global_step": 287655, "epoch": 1712} {"train_loss": -10.773823738098145, "global_step": 287656, "epoch": 1712} {"train_loss": -11.036453247070312, "global_step": 287657, "epoch": 1712} {"train_loss": -10.375205993652344, "global_step": 287658, "epoch": 1712} {"train_loss": -11.833224296569824, "global_step": 287659, "epoch": 1712} {"train_loss": -11.807023048400879, "global_step": 287660, "epoch": 1712} {"train_loss": -11.975664138793945, "global_step": 287661, "epoch": 1712} {"train_loss": -11.26296615600586, "global_step": 287662, "epoch": 1712} {"train_loss": -11.239259719848633, "global_step": 287663, "epoch": 1712} {"train_loss": -11.514965057373047, "global_step": 287664, "epoch": 1712} {"train_loss": -12.244556427001953, "global_step": 287665, "epoch": 1712} {"train_loss": -11.192764282226562, "global_step": 287666, "epoch": 1712} {"train_loss": -11.478296279907227, "global_step": 287667, "epoch": 1712} {"train_loss": -11.649332046508789, "global_step": 287668, "epoch": 1712} {"train_loss": -11.692426681518555, "global_step": 287669, "epoch": 1712} {"train_loss": -11.074868202209473, "global_step": 287670, "epoch": 1712} {"train_loss": -11.370996475219727, "global_step": 287671, "epoch": 1712} {"train_loss": -12.082319259643555, "global_step": 287672, "epoch": 1712} {"train_loss": -11.765928268432617, "global_step": 287673, "epoch": 1712} {"train_loss": -11.944976806640625, "global_step": 287674, "epoch": 1712} {"train_loss": -12.245678901672363, "global_step": 287675, "epoch": 1712} {"train_loss": -12.126998901367188, "global_step": 287676, "epoch": 1712} {"train_loss": -12.199928283691406, "global_step": 287677, "epoch": 1712} {"train_loss": -12.013826370239258, "global_step": 287678, "epoch": 1712} {"train_loss": -11.632144927978516, "global_step": 287679, "epoch": 1712} {"train_loss": -12.201732635498047, "global_step": 287680, "epoch": 1712} {"train_loss": -12.130149841308594, "global_step": 287681, "epoch": 1712} {"train_loss": -11.93363094329834, "global_step": 287682, "epoch": 1712} {"train_loss": -11.98002815246582, "global_step": 287683, "epoch": 1712} {"train_loss": -12.153961181640625, "global_step": 287684, "epoch": 1712} {"train_loss": -12.293998718261719, "global_step": 287685, "epoch": 1712} {"train_loss": -12.04200553894043, "global_step": 287686, "epoch": 1712} {"train_loss": -11.985695838928223, "global_step": 287687, "epoch": 1712} {"train_loss": -12.030950546264648, "global_step": 287688, "epoch": 1712} {"train_loss": -12.203255653381348, "global_step": 287689, "epoch": 1712} {"train_loss": -12.040670394897461, "global_step": 287690, "epoch": 1712} {"train_loss": -12.143512725830078, "global_step": 287691, "epoch": 1712} {"train_loss": -12.253826141357422, "global_step": 287692, "epoch": 1712} {"train_loss": -11.891425132751465, "global_step": 287693, "epoch": 1712} {"train_loss": -11.957530975341797, "global_step": 287694, "epoch": 1712} {"train_loss": -11.724037170410156, "global_step": 287695, "epoch": 1712} {"train_loss": -12.001839637756348, "global_step": 287696, "epoch": 1712} {"train_loss": -11.659454345703125, "global_step": 287697, "epoch": 1712} {"train_loss": -12.094266891479492, "global_step": 287698, "epoch": 1712} {"train_loss": -11.322717666625977, "global_step": 287699, "epoch": 1712} {"train_loss": -11.688492774963379, "global_step": 287700, "epoch": 1712} {"train_loss": -11.407893180847168, "global_step": 287701, "epoch": 1712} {"train_loss": -11.891875267028809, "global_step": 287702, "epoch": 1712} {"train_loss": -11.551368713378906, "global_step": 287703, "epoch": 1712} {"train_loss": -12.046146392822266, "global_step": 287704, "epoch": 1712} {"train_loss": -11.780792236328125, "global_step": 287705, "epoch": 1712} {"train_loss": -11.859973907470703, "global_step": 287706, "epoch": 1712} {"train_loss": -11.34681510925293, "global_step": 287707, "epoch": 1712} {"train_loss": -10.948269844055176, "global_step": 287708, "epoch": 1712} {"train_loss": -11.680768966674805, "global_step": 287709, "epoch": 1712} {"train_loss": -12.289302825927734, "global_step": 287710, "epoch": 1712} {"train_loss": -10.862711906433105, "global_step": 287711, "epoch": 1712} {"train_loss": -11.498014450073242, "global_step": 287712, "epoch": 1712} {"train_loss": -11.146538734436035, "global_step": 287713, "epoch": 1712} {"train_loss": -11.4506196975708, "global_step": 287714, "epoch": 1712} {"train_loss": -10.624300956726074, "global_step": 287715, "epoch": 1712} {"train_loss": -12.006485939025879, "global_step": 287716, "epoch": 1712} {"train_loss": -10.699104309082031, "global_step": 287717, "epoch": 1712} {"train_loss": -11.314364433288574, "global_step": 287718, "epoch": 1712} {"train_loss": -11.701801300048828, "global_step": 287719, "epoch": 1712} {"train_loss": -10.942005157470703, "global_step": 287720, "epoch": 1712} {"train_loss": -11.059869766235352, "global_step": 287721, "epoch": 1712} {"train_loss": -11.931520462036133, "global_step": 287722, "epoch": 1712} {"train_loss": -11.25268840789795, "global_step": 287723, "epoch": 1712} {"train_loss": -11.418242454528809, "global_step": 287724, "epoch": 1712} {"train_loss": -11.744245529174805, "global_step": 287725, "epoch": 1712} {"train_loss": -11.601900100708008, "global_step": 287726, "epoch": 1712} {"train_loss": -11.76835823059082, "global_step": 287727, "epoch": 1712} {"train_loss": -11.679338455200195, "global_step": 287728, "epoch": 1712} {"train_loss": -11.41697883605957, "global_step": 287729, "epoch": 1712} {"train_loss": -12.029443740844727, "global_step": 287730, "epoch": 1712} {"train_loss": -11.926326751708984, "global_step": 287731, "epoch": 1712} {"train_loss": -11.251391410827637, "global_step": 287732, "epoch": 1712} {"train_loss": -11.71293830871582, "global_step": 287733, "epoch": 1712} {"train_loss": -12.09998893737793, "global_step": 287734, "epoch": 1712} {"train_loss": -11.481863975524902, "global_step": 287735, "epoch": 1712} {"train_loss": -11.959875106811523, "global_step": 287736, "epoch": 1712} {"train_loss": -11.446112632751465, "global_step": 287737, "epoch": 1712} {"train_loss": -11.93350601196289, "global_step": 287738, "epoch": 1712} {"train_loss": -11.627922058105469, "global_step": 287739, "epoch": 1712} {"train_loss": -11.767127990722656, "global_step": 287740, "epoch": 1712} {"train_loss": -11.568761825561523, "global_step": 287741, "epoch": 1712} {"train_loss": -11.609380722045898, "global_step": 287742, "epoch": 1712} {"train_loss": -11.443439483642578, "global_step": 287743, "epoch": 1712} {"train_loss": -11.617438316345215, "global_step": 287744, "epoch": 1712} {"train_loss": -11.666053771972656, "global_step": 287745, "epoch": 1712} {"train_loss": -11.306962966918945, "global_step": 287746, "epoch": 1712} {"train_loss": -12.111119270324707, "global_step": 287747, "epoch": 1712} {"train_loss": -11.403704643249512, "global_step": 287748, "epoch": 1712} {"train_loss": -11.560304641723633, "global_step": 287749, "epoch": 1712} {"train_loss": -11.627449989318848, "global_step": 287750, "epoch": 1712} {"train_loss": -11.921154975891113, "global_step": 287751, "epoch": 1712} {"train_loss": -11.837568283081055, "global_step": 287752, "epoch": 1712} {"train_loss": -11.907432556152344, "global_step": 287753, "epoch": 1712} {"train_loss": -11.886202812194824, "global_step": 287754, "epoch": 1712} {"train_loss": -12.125710487365723, "global_step": 287755, "epoch": 1712} {"train_loss": -12.172213554382324, "global_step": 287756, "epoch": 1712} {"train_loss": -12.073579788208008, "global_step": 287757, "epoch": 1712} {"train_loss": -11.823132514953613, "global_step": 287758, "epoch": 1712} {"train_loss": -12.020549774169922, "global_step": 287759, "epoch": 1712} {"train_loss": -11.94726848602295, "global_step": 287760, "epoch": 1712} {"train_loss": -11.985054969787598, "global_step": 287761, "epoch": 1712} {"train_loss": -11.757144927978516, "global_step": 287762, "epoch": 1712} {"train_loss": -11.728095054626465, "global_step": 287763, "epoch": 1712} {"train_loss": -11.664912223815918, "global_step": 287764, "epoch": 1712} {"train_loss": -11.992965698242188, "global_step": 287765, "epoch": 1712} {"train_loss": -12.233091354370117, "global_step": 287766, "epoch": 1712} {"train_loss": -11.904446601867676, "global_step": 287767, "epoch": 1712} {"train_loss": -11.935637474060059, "global_step": 287768, "epoch": 1712} {"train_loss": -12.102965354919434, "global_step": 287769, "epoch": 1712} {"train_loss": -11.83880615234375, "global_step": 287770, "epoch": 1712} {"train_loss": -11.897639274597168, "global_step": 287771, "epoch": 1712} {"train_loss": -11.777950286865234, "global_step": 287772, "epoch": 1712} {"train_loss": -11.716437339782715, "global_step": 287773, "epoch": 1712} {"train_loss": -11.953710556030273, "global_step": 287774, "epoch": 1712} {"train_loss": -12.013494491577148, "global_step": 287775, "epoch": 1712} {"train_loss": -11.876476287841797, "global_step": 287776, "epoch": 1712} {"train_loss": -12.17279052734375, "global_step": 287777, "epoch": 1712} {"train_loss": -11.861627578735352, "global_step": 287778, "epoch": 1712} {"train_loss": -11.754373550415039, "global_step": 287779, "epoch": 1712} {"train_loss": -12.020415306091309, "global_step": 287780, "epoch": 1712} {"train_loss": -12.02014446258545, "global_step": 287781, "epoch": 1712} {"train_loss": -12.116589546203613, "global_step": 287782, "epoch": 1712} {"train_loss": -11.834604439281282, "global_step": 287783, "epoch": 1712, "val_loss": 279081.5} {"train_loss": -11.877030372619629, "global_step": 287784, "epoch": 1713} {"train_loss": -12.20248794555664, "global_step": 287785, "epoch": 1713} {"train_loss": -12.228727340698242, "global_step": 287786, "epoch": 1713} {"train_loss": -12.370699882507324, "global_step": 287787, "epoch": 1713} {"train_loss": -12.182280540466309, "global_step": 287788, "epoch": 1713} {"train_loss": -12.108952522277832, "global_step": 287789, "epoch": 1713} {"train_loss": -12.0606689453125, "global_step": 287790, "epoch": 1713} {"train_loss": -12.282106399536133, "global_step": 287791, "epoch": 1713} {"train_loss": -12.364213943481445, "global_step": 287792, "epoch": 1713} {"train_loss": -12.160703659057617, "global_step": 287793, "epoch": 1713} {"train_loss": -12.371474266052246, "global_step": 287794, "epoch": 1713} {"train_loss": -12.389991760253906, "global_step": 287795, "epoch": 1713} {"train_loss": -12.460975646972656, "global_step": 287796, "epoch": 1713} {"train_loss": -12.263627052307129, "global_step": 287797, "epoch": 1713} {"train_loss": -12.197528839111328, "global_step": 287798, "epoch": 1713} {"train_loss": -12.197599411010742, "global_step": 287799, "epoch": 1713} {"train_loss": -12.059650421142578, "global_step": 287800, "epoch": 1713} {"train_loss": -12.111372947692871, "global_step": 287801, "epoch": 1713} {"train_loss": -12.45688533782959, "global_step": 287802, "epoch": 1713} {"train_loss": -12.295567512512207, "global_step": 287803, "epoch": 1713} {"train_loss": -12.362641334533691, "global_step": 287804, "epoch": 1713} {"train_loss": -12.336841583251953, "global_step": 287805, "epoch": 1713} {"train_loss": -12.402326583862305, "global_step": 287806, "epoch": 1713} {"train_loss": -12.255619049072266, "global_step": 287807, "epoch": 1713} {"train_loss": -12.123767852783203, "global_step": 287808, "epoch": 1713} {"train_loss": -12.497398376464844, "global_step": 287809, "epoch": 1713} {"train_loss": -12.327917098999023, "global_step": 287810, "epoch": 1713} {"train_loss": -12.069723129272461, "global_step": 287811, "epoch": 1713} {"train_loss": -12.506980895996094, "global_step": 287812, "epoch": 1713} {"train_loss": -12.552518844604492, "global_step": 287813, "epoch": 1713} {"train_loss": -11.994022369384766, "global_step": 287814, "epoch": 1713} {"train_loss": -12.288484573364258, "global_step": 287815, "epoch": 1713} {"train_loss": -12.397552490234375, "global_step": 287816, "epoch": 1713} {"train_loss": -12.524600982666016, "global_step": 287817, "epoch": 1713} {"train_loss": -12.18415641784668, "global_step": 287818, "epoch": 1713} {"train_loss": -12.458152770996094, "global_step": 287819, "epoch": 1713} {"train_loss": -12.227500915527344, "global_step": 287820, "epoch": 1713} {"train_loss": -12.209552764892578, "global_step": 287821, "epoch": 1713} {"train_loss": -12.379533767700195, "global_step": 287822, "epoch": 1713} {"train_loss": -12.343914031982422, "global_step": 287823, "epoch": 1713} {"train_loss": -12.452205657958984, "global_step": 287824, "epoch": 1713} {"train_loss": -12.537206649780273, "global_step": 287825, "epoch": 1713} {"train_loss": -12.207825660705566, "global_step": 287826, "epoch": 1713} {"train_loss": -11.94866943359375, "global_step": 287827, "epoch": 1713} {"train_loss": -12.267911911010742, "global_step": 287828, "epoch": 1713} {"train_loss": -12.260942459106445, "global_step": 287829, "epoch": 1713} {"train_loss": -11.590898513793945, "global_step": 287830, "epoch": 1713} {"train_loss": -10.493383407592773, "global_step": 287831, "epoch": 1713} {"train_loss": -11.092784881591797, "global_step": 287832, "epoch": 1713} {"train_loss": -11.536245346069336, "global_step": 287833, "epoch": 1713} {"train_loss": -10.52725601196289, "global_step": 287834, "epoch": 1713} {"train_loss": -9.29667854309082, "global_step": 287835, "epoch": 1713} {"train_loss": -10.96174430847168, "global_step": 287836, "epoch": 1713} {"train_loss": -8.498340606689453, "global_step": 287837, "epoch": 1713} {"train_loss": -9.122692108154297, "global_step": 287838, "epoch": 1713} {"train_loss": -7.740673065185547, "global_step": 287839, "epoch": 1713} {"train_loss": -8.98021411895752, "global_step": 287840, "epoch": 1713} {"train_loss": -8.093267440795898, "global_step": 287841, "epoch": 1713} {"train_loss": -7.927674770355225, "global_step": 287842, "epoch": 1713} {"train_loss": -10.508883476257324, "global_step": 287843, "epoch": 1713} {"train_loss": -9.708342552185059, "global_step": 287844, "epoch": 1713} {"train_loss": -9.949063301086426, "global_step": 287845, "epoch": 1713} {"train_loss": -9.472254753112793, "global_step": 287846, "epoch": 1713} {"train_loss": -11.15030288696289, "global_step": 287847, "epoch": 1713} {"train_loss": -9.952534675598145, "global_step": 287848, "epoch": 1713} {"train_loss": -11.251852035522461, "global_step": 287849, "epoch": 1713} {"train_loss": -10.495771408081055, "global_step": 287850, "epoch": 1713} {"train_loss": -10.107501029968262, "global_step": 287851, "epoch": 1713} {"train_loss": -11.129276275634766, "global_step": 287852, "epoch": 1713} {"train_loss": -10.512445449829102, "global_step": 287853, "epoch": 1713} {"train_loss": -10.483227729797363, "global_step": 287854, "epoch": 1713} {"train_loss": -10.6065034866333, "global_step": 287855, "epoch": 1713} {"train_loss": -10.3441162109375, "global_step": 287856, "epoch": 1713} {"train_loss": -11.020195007324219, "global_step": 287857, "epoch": 1713} {"train_loss": -11.145418167114258, "global_step": 287858, "epoch": 1713} {"train_loss": -10.980192184448242, "global_step": 287859, "epoch": 1713} {"train_loss": -11.51784610748291, "global_step": 287860, "epoch": 1713} {"train_loss": -11.130792617797852, "global_step": 287861, "epoch": 1713} {"train_loss": -11.285761833190918, "global_step": 287862, "epoch": 1713} {"train_loss": -11.385016441345215, "global_step": 287863, "epoch": 1713} {"train_loss": -11.541757583618164, "global_step": 287864, "epoch": 1713} {"train_loss": -11.71390151977539, "global_step": 287865, "epoch": 1713} {"train_loss": -11.612798690795898, "global_step": 287866, "epoch": 1713} {"train_loss": -11.645515441894531, "global_step": 287867, "epoch": 1713} {"train_loss": -11.819100379943848, "global_step": 287868, "epoch": 1713} {"train_loss": -11.381677627563477, "global_step": 287869, "epoch": 1713} {"train_loss": -11.445233345031738, "global_step": 287870, "epoch": 1713} {"train_loss": -11.372316360473633, "global_step": 287871, "epoch": 1713} {"train_loss": -11.722094535827637, "global_step": 287872, "epoch": 1713} {"train_loss": -11.648740768432617, "global_step": 287873, "epoch": 1713} {"train_loss": -11.701536178588867, "global_step": 287874, "epoch": 1713} {"train_loss": -11.650533676147461, "global_step": 287875, "epoch": 1713} {"train_loss": -11.582700729370117, "global_step": 287876, "epoch": 1713} {"train_loss": -11.99584674835205, "global_step": 287877, "epoch": 1713} {"train_loss": -11.866357803344727, "global_step": 287878, "epoch": 1713} {"train_loss": -11.727883338928223, "global_step": 287879, "epoch": 1713} {"train_loss": -11.994749069213867, "global_step": 287880, "epoch": 1713} {"train_loss": -11.891829490661621, "global_step": 287881, "epoch": 1713} {"train_loss": -11.77504825592041, "global_step": 287882, "epoch": 1713} {"train_loss": -11.863927841186523, "global_step": 287883, "epoch": 1713} {"train_loss": -11.7119722366333, "global_step": 287884, "epoch": 1713} {"train_loss": -12.058388710021973, "global_step": 287885, "epoch": 1713} {"train_loss": -11.75440788269043, "global_step": 287886, "epoch": 1713} {"train_loss": -11.924018859863281, "global_step": 287887, "epoch": 1713} {"train_loss": -11.776655197143555, "global_step": 287888, "epoch": 1713} {"train_loss": -11.876102447509766, "global_step": 287889, "epoch": 1713} {"train_loss": -12.04174518585205, "global_step": 287890, "epoch": 1713} {"train_loss": -12.168697357177734, "global_step": 287891, "epoch": 1713} {"train_loss": -12.023670196533203, "global_step": 287892, "epoch": 1713} {"train_loss": -12.201652526855469, "global_step": 287893, "epoch": 1713} {"train_loss": -12.30314826965332, "global_step": 287894, "epoch": 1713} {"train_loss": -12.006591796875, "global_step": 287895, "epoch": 1713} {"train_loss": -11.94735050201416, "global_step": 287896, "epoch": 1713} {"train_loss": -12.05087661743164, "global_step": 287897, "epoch": 1713} {"train_loss": -12.219413757324219, "global_step": 287898, "epoch": 1713} {"train_loss": -12.131654739379883, "global_step": 287899, "epoch": 1713} {"train_loss": -12.174971580505371, "global_step": 287900, "epoch": 1713} {"train_loss": -12.10512924194336, "global_step": 287901, "epoch": 1713} {"train_loss": -12.10696029663086, "global_step": 287902, "epoch": 1713} {"train_loss": -12.188713073730469, "global_step": 287903, "epoch": 1713} {"train_loss": -12.211228370666504, "global_step": 287904, "epoch": 1713} {"train_loss": -12.208951950073242, "global_step": 287905, "epoch": 1713} {"train_loss": -12.239325523376465, "global_step": 287906, "epoch": 1713} {"train_loss": -12.425477981567383, "global_step": 287907, "epoch": 1713} {"train_loss": -12.198866844177246, "global_step": 287908, "epoch": 1713} {"train_loss": -12.131694793701172, "global_step": 287909, "epoch": 1713} {"train_loss": -12.215960502624512, "global_step": 287910, "epoch": 1713} {"train_loss": -12.156843185424805, "global_step": 287911, "epoch": 1713} {"train_loss": -12.281222343444824, "global_step": 287912, "epoch": 1713} {"train_loss": -12.086397171020508, "global_step": 287913, "epoch": 1713} {"train_loss": -12.2472562789917, "global_step": 287914, "epoch": 1713} {"train_loss": -12.265715599060059, "global_step": 287915, "epoch": 1713} {"train_loss": -12.109487533569336, "global_step": 287916, "epoch": 1713} {"train_loss": -12.118955612182617, "global_step": 287917, "epoch": 1713} {"train_loss": -12.446088790893555, "global_step": 287918, "epoch": 1713} {"train_loss": -12.229043006896973, "global_step": 287919, "epoch": 1713} {"train_loss": -12.51141357421875, "global_step": 287920, "epoch": 1713} {"train_loss": -12.37952995300293, "global_step": 287921, "epoch": 1713} {"train_loss": -12.183656692504883, "global_step": 287922, "epoch": 1713} {"train_loss": -12.35029411315918, "global_step": 287923, "epoch": 1713} {"train_loss": -12.423850059509277, "global_step": 287924, "epoch": 1713} {"train_loss": -12.52139949798584, "global_step": 287925, "epoch": 1713} {"train_loss": -12.486989974975586, "global_step": 287926, "epoch": 1713} {"train_loss": -12.43747329711914, "global_step": 287927, "epoch": 1713} {"train_loss": -12.566022872924805, "global_step": 287928, "epoch": 1713} {"train_loss": -12.323246002197266, "global_step": 287929, "epoch": 1713} {"train_loss": -12.546427726745605, "global_step": 287930, "epoch": 1713} {"train_loss": -11.907510757446289, "global_step": 287931, "epoch": 1713} {"train_loss": -12.564191818237305, "global_step": 287932, "epoch": 1713} {"train_loss": -12.22818660736084, "global_step": 287933, "epoch": 1713} {"train_loss": -12.491190910339355, "global_step": 287934, "epoch": 1713} {"train_loss": -12.394235610961914, "global_step": 287935, "epoch": 1713} {"train_loss": -12.359210968017578, "global_step": 287936, "epoch": 1713} {"train_loss": -12.3702974319458, "global_step": 287937, "epoch": 1713} {"train_loss": -12.217460632324219, "global_step": 287938, "epoch": 1713} {"train_loss": -11.906660079956055, "global_step": 287939, "epoch": 1713} {"train_loss": -11.78270149230957, "global_step": 287940, "epoch": 1713} {"train_loss": -11.576640129089355, "global_step": 287941, "epoch": 1713} {"train_loss": -12.000693321228027, "global_step": 287942, "epoch": 1713} {"train_loss": -11.33808708190918, "global_step": 287943, "epoch": 1713} {"train_loss": -11.349559783935547, "global_step": 287944, "epoch": 1713} {"train_loss": -11.986520767211914, "global_step": 287945, "epoch": 1713} {"train_loss": -11.790363311767578, "global_step": 287946, "epoch": 1713} {"train_loss": -11.649045944213867, "global_step": 287947, "epoch": 1713} {"train_loss": -11.529274940490723, "global_step": 287948, "epoch": 1713} {"train_loss": -11.54746150970459, "global_step": 287949, "epoch": 1713} {"train_loss": -11.504371643066406, "global_step": 287950, "epoch": 1713} {"train_loss": -11.738975964841389, "global_step": 287951, "epoch": 1713, "val_loss": 276491.03125} {"train_loss": -11.751789093017578, "global_step": 287952, "epoch": 1714} {"train_loss": -10.868804931640625, "global_step": 287953, "epoch": 1714} {"train_loss": -8.66109848022461, "global_step": 287954, "epoch": 1714} {"train_loss": -9.468280792236328, "global_step": 287955, "epoch": 1714} {"train_loss": -8.921026229858398, "global_step": 287956, "epoch": 1714} {"train_loss": -11.18455696105957, "global_step": 287957, "epoch": 1714} {"train_loss": -7.673541069030762, "global_step": 287958, "epoch": 1714} {"train_loss": -9.776914596557617, "global_step": 287959, "epoch": 1714} {"train_loss": -5.628307342529297, "global_step": 287960, "epoch": 1714} {"train_loss": -7.604844093322754, "global_step": 287961, "epoch": 1714} {"train_loss": -6.21959114074707, "global_step": 287962, "epoch": 1714} {"train_loss": -6.319736957550049, "global_step": 287963, "epoch": 1714} {"train_loss": -6.839605808258057, "global_step": 287964, "epoch": 1714} {"train_loss": -8.170957565307617, "global_step": 287965, "epoch": 1714} {"train_loss": -8.322967529296875, "global_step": 287966, "epoch": 1714} {"train_loss": -8.010187149047852, "global_step": 287967, "epoch": 1714} {"train_loss": -7.66180944442749, "global_step": 287968, "epoch": 1714} {"train_loss": -7.6358184814453125, "global_step": 287969, "epoch": 1714} {"train_loss": -8.641284942626953, "global_step": 287970, "epoch": 1714} {"train_loss": -9.46227741241455, "global_step": 287971, "epoch": 1714} {"train_loss": -8.897810935974121, "global_step": 287972, "epoch": 1714} {"train_loss": -9.183098793029785, "global_step": 287973, "epoch": 1714} {"train_loss": -10.074649810791016, "global_step": 287974, "epoch": 1714} {"train_loss": -10.13451862335205, "global_step": 287975, "epoch": 1714} {"train_loss": -10.610179901123047, "global_step": 287976, "epoch": 1714} {"train_loss": -10.59829330444336, "global_step": 287977, "epoch": 1714} {"train_loss": -11.093421936035156, "global_step": 287978, "epoch": 1714} {"train_loss": -9.738819122314453, "global_step": 287979, "epoch": 1714} {"train_loss": -10.565021514892578, "global_step": 287980, "epoch": 1714} {"train_loss": -9.933737754821777, "global_step": 287981, "epoch": 1714} {"train_loss": -9.933859825134277, "global_step": 287982, "epoch": 1714} {"train_loss": -11.005561828613281, "global_step": 287983, "epoch": 1714} {"train_loss": -10.560770034790039, "global_step": 287984, "epoch": 1714} {"train_loss": -11.056413650512695, "global_step": 287985, "epoch": 1714} {"train_loss": -11.404159545898438, "global_step": 287986, "epoch": 1714} {"train_loss": -11.236856460571289, "global_step": 287987, "epoch": 1714} {"train_loss": -11.385466575622559, "global_step": 287988, "epoch": 1714} {"train_loss": -11.205511093139648, "global_step": 287989, "epoch": 1714} {"train_loss": -11.647689819335938, "global_step": 287990, "epoch": 1714} {"train_loss": -11.433683395385742, "global_step": 287991, "epoch": 1714} {"train_loss": -11.614384651184082, "global_step": 287992, "epoch": 1714} {"train_loss": -11.570594787597656, "global_step": 287993, "epoch": 1714} {"train_loss": -11.291370391845703, "global_step": 287994, "epoch": 1714} {"train_loss": -11.809183120727539, "global_step": 287995, "epoch": 1714} {"train_loss": -11.592527389526367, "global_step": 287996, "epoch": 1714} {"train_loss": -11.417095184326172, "global_step": 287997, "epoch": 1714} {"train_loss": -11.817404747009277, "global_step": 287998, "epoch": 1714} {"train_loss": -11.730630874633789, "global_step": 287999, "epoch": 1714} {"train_loss": -11.648416519165039, "global_step": 288000, "epoch": 1714} {"train_loss": -11.726125717163086, "global_step": 288001, "epoch": 1714} {"train_loss": -11.6453218460083, "global_step": 288002, "epoch": 1714} {"train_loss": -11.924009323120117, "global_step": 288003, "epoch": 1714} {"train_loss": -11.868389129638672, "global_step": 288004, "epoch": 1714} {"train_loss": -11.818986892700195, "global_step": 288005, "epoch": 1714} {"train_loss": -11.639753341674805, "global_step": 288006, "epoch": 1714} {"train_loss": -11.946737289428711, "global_step": 288007, "epoch": 1714} {"train_loss": -11.893529891967773, "global_step": 288008, "epoch": 1714} {"train_loss": -11.90984058380127, "global_step": 288009, "epoch": 1714} {"train_loss": -11.570813179016113, "global_step": 288010, "epoch": 1714} {"train_loss": -11.92772388458252, "global_step": 288011, "epoch": 1714} {"train_loss": -11.826651573181152, "global_step": 288012, "epoch": 1714} {"train_loss": -11.863381385803223, "global_step": 288013, "epoch": 1714} {"train_loss": -11.89318561553955, "global_step": 288014, "epoch": 1714} {"train_loss": -12.011204719543457, "global_step": 288015, "epoch": 1714} {"train_loss": -12.03915023803711, "global_step": 288016, "epoch": 1714} {"train_loss": -11.90362548828125, "global_step": 288017, "epoch": 1714} {"train_loss": -12.089738845825195, "global_step": 288018, "epoch": 1714} {"train_loss": -11.857257843017578, "global_step": 288019, "epoch": 1714} {"train_loss": -11.850427627563477, "global_step": 288020, "epoch": 1714} {"train_loss": -12.04395866394043, "global_step": 288021, "epoch": 1714} {"train_loss": -11.836694717407227, "global_step": 288022, "epoch": 1714} {"train_loss": -11.760457992553711, "global_step": 288023, "epoch": 1714} {"train_loss": -11.791179656982422, "global_step": 288024, "epoch": 1714} {"train_loss": -11.805477142333984, "global_step": 288025, "epoch": 1714} {"train_loss": -12.098440170288086, "global_step": 288026, "epoch": 1714} {"train_loss": -11.692371368408203, "global_step": 288027, "epoch": 1714} {"train_loss": -12.213005065917969, "global_step": 288028, "epoch": 1714} {"train_loss": -11.71839714050293, "global_step": 288029, "epoch": 1714} {"train_loss": -12.043537139892578, "global_step": 288030, "epoch": 1714} {"train_loss": -12.036255836486816, "global_step": 288031, "epoch": 1714} {"train_loss": -11.951437950134277, "global_step": 288032, "epoch": 1714} {"train_loss": -11.875059127807617, "global_step": 288033, "epoch": 1714} {"train_loss": -12.23428726196289, "global_step": 288034, "epoch": 1714} {"train_loss": -12.090078353881836, "global_step": 288035, "epoch": 1714} {"train_loss": -11.892799377441406, "global_step": 288036, "epoch": 1714} {"train_loss": -12.053400993347168, "global_step": 288037, "epoch": 1714} {"train_loss": -11.853891372680664, "global_step": 288038, "epoch": 1714} {"train_loss": -12.124979019165039, "global_step": 288039, "epoch": 1714} {"train_loss": -12.288873672485352, "global_step": 288040, "epoch": 1714} {"train_loss": -12.074462890625, "global_step": 288041, "epoch": 1714} {"train_loss": -12.170713424682617, "global_step": 288042, "epoch": 1714} {"train_loss": -12.038412094116211, "global_step": 288043, "epoch": 1714} {"train_loss": -12.128573417663574, "global_step": 288044, "epoch": 1714} {"train_loss": -11.868658065795898, "global_step": 288045, "epoch": 1714} {"train_loss": -11.901948928833008, "global_step": 288046, "epoch": 1714} {"train_loss": -11.756940841674805, "global_step": 288047, "epoch": 1714} {"train_loss": -12.244945526123047, "global_step": 288048, "epoch": 1714} {"train_loss": -11.49483585357666, "global_step": 288049, "epoch": 1714} {"train_loss": -12.174083709716797, "global_step": 288050, "epoch": 1714} {"train_loss": -11.77657699584961, "global_step": 288051, "epoch": 1714} {"train_loss": -12.150129318237305, "global_step": 288052, "epoch": 1714} {"train_loss": -11.789212226867676, "global_step": 288053, "epoch": 1714} {"train_loss": -12.091930389404297, "global_step": 288054, "epoch": 1714} {"train_loss": -12.082511901855469, "global_step": 288055, "epoch": 1714} {"train_loss": -11.988327026367188, "global_step": 288056, "epoch": 1714} {"train_loss": -11.703048706054688, "global_step": 288057, "epoch": 1714} {"train_loss": -12.14189338684082, "global_step": 288058, "epoch": 1714} {"train_loss": -11.821342468261719, "global_step": 288059, "epoch": 1714} {"train_loss": -11.888229370117188, "global_step": 288060, "epoch": 1714} {"train_loss": -11.958107948303223, "global_step": 288061, "epoch": 1714} {"train_loss": -11.968751907348633, "global_step": 288062, "epoch": 1714} {"train_loss": -12.0706787109375, "global_step": 288063, "epoch": 1714} {"train_loss": -11.611970901489258, "global_step": 288064, "epoch": 1714} {"train_loss": -12.185112953186035, "global_step": 288065, "epoch": 1714} {"train_loss": -11.782520294189453, "global_step": 288066, "epoch": 1714} {"train_loss": -11.80398941040039, "global_step": 288067, "epoch": 1714} {"train_loss": -11.897537231445312, "global_step": 288068, "epoch": 1714} {"train_loss": -11.47767448425293, "global_step": 288069, "epoch": 1714} {"train_loss": -10.578678131103516, "global_step": 288070, "epoch": 1714} {"train_loss": -11.79834270477295, "global_step": 288071, "epoch": 1714} {"train_loss": -11.03466796875, "global_step": 288072, "epoch": 1714} {"train_loss": -10.576786994934082, "global_step": 288073, "epoch": 1714} {"train_loss": -10.577703475952148, "global_step": 288074, "epoch": 1714} {"train_loss": -11.235637664794922, "global_step": 288075, "epoch": 1714} {"train_loss": -10.862802505493164, "global_step": 288076, "epoch": 1714} {"train_loss": -10.519765853881836, "global_step": 288077, "epoch": 1714} {"train_loss": -10.094486236572266, "global_step": 288078, "epoch": 1714} {"train_loss": -11.493446350097656, "global_step": 288079, "epoch": 1714} {"train_loss": -10.046142578125, "global_step": 288080, "epoch": 1714} {"train_loss": -11.147274017333984, "global_step": 288081, "epoch": 1714} {"train_loss": -10.257092475891113, "global_step": 288082, "epoch": 1714} {"train_loss": -10.054132461547852, "global_step": 288083, "epoch": 1714} {"train_loss": -11.648584365844727, "global_step": 288084, "epoch": 1714} {"train_loss": -10.131336212158203, "global_step": 288085, "epoch": 1714} {"train_loss": -10.850980758666992, "global_step": 288086, "epoch": 1714} {"train_loss": -10.22372055053711, "global_step": 288087, "epoch": 1714} {"train_loss": -10.740035057067871, "global_step": 288088, "epoch": 1714} {"train_loss": -11.311120986938477, "global_step": 288089, "epoch": 1714} {"train_loss": -10.74139404296875, "global_step": 288090, "epoch": 1714} {"train_loss": -10.409064292907715, "global_step": 288091, "epoch": 1714} {"train_loss": -11.354284286499023, "global_step": 288092, "epoch": 1714} {"train_loss": -10.68542766571045, "global_step": 288093, "epoch": 1714} {"train_loss": -10.98593521118164, "global_step": 288094, "epoch": 1714} {"train_loss": -11.453059196472168, "global_step": 288095, "epoch": 1714} {"train_loss": -10.095854759216309, "global_step": 288096, "epoch": 1714} {"train_loss": -11.45050048828125, "global_step": 288097, "epoch": 1714} {"train_loss": -11.125962257385254, "global_step": 288098, "epoch": 1714} {"train_loss": -10.849462509155273, "global_step": 288099, "epoch": 1714} {"train_loss": -11.186487197875977, "global_step": 288100, "epoch": 1714} {"train_loss": -10.923261642456055, "global_step": 288101, "epoch": 1714} {"train_loss": -10.28071403503418, "global_step": 288102, "epoch": 1714} {"train_loss": -11.032360076904297, "global_step": 288103, "epoch": 1714} {"train_loss": -10.301234245300293, "global_step": 288104, "epoch": 1714} {"train_loss": -11.109987258911133, "global_step": 288105, "epoch": 1714} {"train_loss": -10.817646026611328, "global_step": 288106, "epoch": 1714} {"train_loss": -11.045636177062988, "global_step": 288107, "epoch": 1714} {"train_loss": -11.229545593261719, "global_step": 288108, "epoch": 1714} {"train_loss": -10.656790733337402, "global_step": 288109, "epoch": 1714} {"train_loss": -11.269942283630371, "global_step": 288110, "epoch": 1714} {"train_loss": -11.026315689086914, "global_step": 288111, "epoch": 1714} {"train_loss": -10.983924865722656, "global_step": 288112, "epoch": 1714} {"train_loss": -11.49199104309082, "global_step": 288113, "epoch": 1714} {"train_loss": -11.450220108032227, "global_step": 288114, "epoch": 1714} {"train_loss": -11.148967742919922, "global_step": 288115, "epoch": 1714} {"train_loss": -11.503095626831055, "global_step": 288116, "epoch": 1714} {"train_loss": -11.037789344787598, "global_step": 288117, "epoch": 1714} {"train_loss": -11.184213638305664, "global_step": 288118, "epoch": 1714} {"train_loss": -11.030539560885657, "global_step": 288119, "epoch": 1714, "val_loss": 277939.28125} {"train_loss": -11.330497741699219, "global_step": 288120, "epoch": 1715} {"train_loss": -11.45762825012207, "global_step": 288121, "epoch": 1715} {"train_loss": -11.706625938415527, "global_step": 288122, "epoch": 1715} {"train_loss": -11.436667442321777, "global_step": 288123, "epoch": 1715} {"train_loss": -11.517963409423828, "global_step": 288124, "epoch": 1715} {"train_loss": -11.682149887084961, "global_step": 288125, "epoch": 1715} {"train_loss": -11.242340087890625, "global_step": 288126, "epoch": 1715} {"train_loss": -11.692859649658203, "global_step": 288127, "epoch": 1715} {"train_loss": -11.147103309631348, "global_step": 288128, "epoch": 1715} {"train_loss": -11.754716873168945, "global_step": 288129, "epoch": 1715} {"train_loss": -11.424545288085938, "global_step": 288130, "epoch": 1715} {"train_loss": -11.797122955322266, "global_step": 288131, "epoch": 1715} {"train_loss": -11.885541915893555, "global_step": 288132, "epoch": 1715} {"train_loss": -11.823836326599121, "global_step": 288133, "epoch": 1715} {"train_loss": -11.67042064666748, "global_step": 288134, "epoch": 1715} {"train_loss": -11.889302253723145, "global_step": 288135, "epoch": 1715} {"train_loss": -11.803893089294434, "global_step": 288136, "epoch": 1715} {"train_loss": -11.693089485168457, "global_step": 288137, "epoch": 1715} {"train_loss": -11.957439422607422, "global_step": 288138, "epoch": 1715} {"train_loss": -11.90138053894043, "global_step": 288139, "epoch": 1715} {"train_loss": -12.012587547302246, "global_step": 288140, "epoch": 1715} {"train_loss": -11.759571075439453, "global_step": 288141, "epoch": 1715} {"train_loss": -11.991086959838867, "global_step": 288142, "epoch": 1715} {"train_loss": -11.537732124328613, "global_step": 288143, "epoch": 1715} {"train_loss": -12.065112113952637, "global_step": 288144, "epoch": 1715} {"train_loss": -11.751399040222168, "global_step": 288145, "epoch": 1715} {"train_loss": -12.117653846740723, "global_step": 288146, "epoch": 1715} {"train_loss": -11.702786445617676, "global_step": 288147, "epoch": 1715} {"train_loss": -11.964643478393555, "global_step": 288148, "epoch": 1715} {"train_loss": -11.713237762451172, "global_step": 288149, "epoch": 1715} {"train_loss": -11.81823444366455, "global_step": 288150, "epoch": 1715} {"train_loss": -11.512189865112305, "global_step": 288151, "epoch": 1715} {"train_loss": -11.733457565307617, "global_step": 288152, "epoch": 1715} {"train_loss": -11.601273536682129, "global_step": 288153, "epoch": 1715} {"train_loss": -11.988954544067383, "global_step": 288154, "epoch": 1715} {"train_loss": -11.485919952392578, "global_step": 288155, "epoch": 1715} {"train_loss": -11.984015464782715, "global_step": 288156, "epoch": 1715} {"train_loss": -11.907968521118164, "global_step": 288157, "epoch": 1715} {"train_loss": -11.922218322753906, "global_step": 288158, "epoch": 1715} {"train_loss": -11.972423553466797, "global_step": 288159, "epoch": 1715} {"train_loss": -11.762567520141602, "global_step": 288160, "epoch": 1715} {"train_loss": -11.78923511505127, "global_step": 288161, "epoch": 1715} {"train_loss": -11.92538070678711, "global_step": 288162, "epoch": 1715} {"train_loss": -11.601566314697266, "global_step": 288163, "epoch": 1715} {"train_loss": -11.957345962524414, "global_step": 288164, "epoch": 1715} {"train_loss": -11.815396308898926, "global_step": 288165, "epoch": 1715} {"train_loss": -11.59874153137207, "global_step": 288166, "epoch": 1715} {"train_loss": -11.807127952575684, "global_step": 288167, "epoch": 1715} {"train_loss": -11.427897453308105, "global_step": 288168, "epoch": 1715} {"train_loss": -11.78885269165039, "global_step": 288169, "epoch": 1715} {"train_loss": -11.423360824584961, "global_step": 288170, "epoch": 1715} {"train_loss": -11.969573974609375, "global_step": 288171, "epoch": 1715} {"train_loss": -12.081573486328125, "global_step": 288172, "epoch": 1715} {"train_loss": -11.619434356689453, "global_step": 288173, "epoch": 1715} {"train_loss": -12.202327728271484, "global_step": 288174, "epoch": 1715} {"train_loss": -11.77627182006836, "global_step": 288175, "epoch": 1715} {"train_loss": -11.85058307647705, "global_step": 288176, "epoch": 1715} {"train_loss": -11.82032585144043, "global_step": 288177, "epoch": 1715} {"train_loss": -11.677370071411133, "global_step": 288178, "epoch": 1715} {"train_loss": -11.741674423217773, "global_step": 288179, "epoch": 1715} {"train_loss": -11.96971321105957, "global_step": 288180, "epoch": 1715} {"train_loss": -11.689970016479492, "global_step": 288181, "epoch": 1715} {"train_loss": -11.795340538024902, "global_step": 288182, "epoch": 1715} {"train_loss": -11.778238296508789, "global_step": 288183, "epoch": 1715} {"train_loss": -11.540589332580566, "global_step": 288184, "epoch": 1715} {"train_loss": -11.908275604248047, "global_step": 288185, "epoch": 1715} {"train_loss": -11.446834564208984, "global_step": 288186, "epoch": 1715} {"train_loss": -11.784856796264648, "global_step": 288187, "epoch": 1715} {"train_loss": -11.226251602172852, "global_step": 288188, "epoch": 1715} {"train_loss": -11.83387565612793, "global_step": 288189, "epoch": 1715} {"train_loss": -11.721295356750488, "global_step": 288190, "epoch": 1715} {"train_loss": -11.961780548095703, "global_step": 288191, "epoch": 1715} {"train_loss": -11.93404769897461, "global_step": 288192, "epoch": 1715} {"train_loss": -11.965530395507812, "global_step": 288193, "epoch": 1715} {"train_loss": -12.242883682250977, "global_step": 288194, "epoch": 1715} {"train_loss": -11.934617042541504, "global_step": 288195, "epoch": 1715} {"train_loss": -12.095714569091797, "global_step": 288196, "epoch": 1715} {"train_loss": -11.782877922058105, "global_step": 288197, "epoch": 1715} {"train_loss": -12.20151138305664, "global_step": 288198, "epoch": 1715} {"train_loss": -11.810270309448242, "global_step": 288199, "epoch": 1715} {"train_loss": -12.244760513305664, "global_step": 288200, "epoch": 1715} {"train_loss": -12.098281860351562, "global_step": 288201, "epoch": 1715} {"train_loss": -12.01885986328125, "global_step": 288202, "epoch": 1715} {"train_loss": -11.987165451049805, "global_step": 288203, "epoch": 1715} {"train_loss": -11.626686096191406, "global_step": 288204, "epoch": 1715} {"train_loss": -12.44930648803711, "global_step": 288205, "epoch": 1715} {"train_loss": -11.921140670776367, "global_step": 288206, "epoch": 1715} {"train_loss": -12.279403686523438, "global_step": 288207, "epoch": 1715} {"train_loss": -11.682424545288086, "global_step": 288208, "epoch": 1715} {"train_loss": -12.202327728271484, "global_step": 288209, "epoch": 1715} {"train_loss": -12.225061416625977, "global_step": 288210, "epoch": 1715} {"train_loss": -12.114153861999512, "global_step": 288211, "epoch": 1715} {"train_loss": -12.30220890045166, "global_step": 288212, "epoch": 1715} {"train_loss": -12.506830215454102, "global_step": 288213, "epoch": 1715} {"train_loss": -12.282149314880371, "global_step": 288214, "epoch": 1715} {"train_loss": -12.26577377319336, "global_step": 288215, "epoch": 1715} {"train_loss": -12.366397857666016, "global_step": 288216, "epoch": 1715} {"train_loss": -12.453059196472168, "global_step": 288217, "epoch": 1715} {"train_loss": -12.212242126464844, "global_step": 288218, "epoch": 1715} {"train_loss": -12.244844436645508, "global_step": 288219, "epoch": 1715} {"train_loss": -12.34709644317627, "global_step": 288220, "epoch": 1715} {"train_loss": -12.548141479492188, "global_step": 288221, "epoch": 1715} {"train_loss": -12.487939834594727, "global_step": 288222, "epoch": 1715} {"train_loss": -12.496228218078613, "global_step": 288223, "epoch": 1715} {"train_loss": -12.61015510559082, "global_step": 288224, "epoch": 1715} {"train_loss": -12.32913589477539, "global_step": 288225, "epoch": 1715} {"train_loss": -12.414407730102539, "global_step": 288226, "epoch": 1715} {"train_loss": -12.413646697998047, "global_step": 288227, "epoch": 1715} {"train_loss": -12.204193115234375, "global_step": 288228, "epoch": 1715} {"train_loss": -12.403823852539062, "global_step": 288229, "epoch": 1715} {"train_loss": -12.327836990356445, "global_step": 288230, "epoch": 1715} {"train_loss": -12.576556205749512, "global_step": 288231, "epoch": 1715} {"train_loss": -12.365228652954102, "global_step": 288232, "epoch": 1715} {"train_loss": -12.22340202331543, "global_step": 288233, "epoch": 1715} {"train_loss": -12.304839134216309, "global_step": 288234, "epoch": 1715} {"train_loss": -12.185158729553223, "global_step": 288235, "epoch": 1715} {"train_loss": -12.301261901855469, "global_step": 288236, "epoch": 1715} {"train_loss": -12.479585647583008, "global_step": 288237, "epoch": 1715} {"train_loss": -11.891620635986328, "global_step": 288238, "epoch": 1715} {"train_loss": -11.19041633605957, "global_step": 288239, "epoch": 1715} {"train_loss": -11.357789993286133, "global_step": 288240, "epoch": 1715} {"train_loss": -12.025310516357422, "global_step": 288241, "epoch": 1715} {"train_loss": -11.893959045410156, "global_step": 288242, "epoch": 1715} {"train_loss": -11.998517990112305, "global_step": 288243, "epoch": 1715} {"train_loss": -11.005637168884277, "global_step": 288244, "epoch": 1715} {"train_loss": -11.08690071105957, "global_step": 288245, "epoch": 1715} {"train_loss": -11.569496154785156, "global_step": 288246, "epoch": 1715} {"train_loss": -10.496748924255371, "global_step": 288247, "epoch": 1715} {"train_loss": -10.647176742553711, "global_step": 288248, "epoch": 1715} {"train_loss": -12.09063720703125, "global_step": 288249, "epoch": 1715} {"train_loss": -11.186677932739258, "global_step": 288250, "epoch": 1715} {"train_loss": -10.969432830810547, "global_step": 288251, "epoch": 1715} {"train_loss": -11.138609886169434, "global_step": 288252, "epoch": 1715} {"train_loss": -12.020262718200684, "global_step": 288253, "epoch": 1715} {"train_loss": -11.58116626739502, "global_step": 288254, "epoch": 1715} {"train_loss": -12.164868354797363, "global_step": 288255, "epoch": 1715} {"train_loss": -11.31597900390625, "global_step": 288256, "epoch": 1715} {"train_loss": -11.735681533813477, "global_step": 288257, "epoch": 1715} {"train_loss": -10.335521697998047, "global_step": 288258, "epoch": 1715} {"train_loss": -11.374540328979492, "global_step": 288259, "epoch": 1715} {"train_loss": -11.441566467285156, "global_step": 288260, "epoch": 1715} {"train_loss": -11.297416687011719, "global_step": 288261, "epoch": 1715} {"train_loss": -11.349630355834961, "global_step": 288262, "epoch": 1715} {"train_loss": -10.714229583740234, "global_step": 288263, "epoch": 1715} {"train_loss": -10.671164512634277, "global_step": 288264, "epoch": 1715} {"train_loss": -11.988327980041504, "global_step": 288265, "epoch": 1715} {"train_loss": -11.399895668029785, "global_step": 288266, "epoch": 1715} {"train_loss": -12.179207801818848, "global_step": 288267, "epoch": 1715} {"train_loss": -11.508623123168945, "global_step": 288268, "epoch": 1715} {"train_loss": -11.864276885986328, "global_step": 288269, "epoch": 1715} {"train_loss": -11.980295181274414, "global_step": 288270, "epoch": 1715} {"train_loss": -11.913409233093262, "global_step": 288271, "epoch": 1715} {"train_loss": -11.792611122131348, "global_step": 288272, "epoch": 1715} {"train_loss": -12.23531723022461, "global_step": 288273, "epoch": 1715} {"train_loss": -12.158279418945312, "global_step": 288274, "epoch": 1715} {"train_loss": -11.940731048583984, "global_step": 288275, "epoch": 1715} {"train_loss": -11.573965072631836, "global_step": 288276, "epoch": 1715} {"train_loss": -12.122859954833984, "global_step": 288277, "epoch": 1715} {"train_loss": -11.782930374145508, "global_step": 288278, "epoch": 1715} {"train_loss": -11.936737060546875, "global_step": 288279, "epoch": 1715} {"train_loss": -12.109240531921387, "global_step": 288280, "epoch": 1715} {"train_loss": -11.861175537109375, "global_step": 288281, "epoch": 1715} {"train_loss": -11.919778823852539, "global_step": 288282, "epoch": 1715} {"train_loss": -12.076336860656738, "global_step": 288283, "epoch": 1715} {"train_loss": -12.259408950805664, "global_step": 288284, "epoch": 1715} {"train_loss": -12.27353286743164, "global_step": 288285, "epoch": 1715} {"train_loss": -12.191215515136719, "global_step": 288286, "epoch": 1715} {"train_loss": -11.842525243759155, "global_step": 288287, "epoch": 1715, "val_loss": 276487.9375, "train_action_mse_error": 2.230868339538574} {"train_loss": -12.020505905151367, "global_step": 288288, "epoch": 1716} {"train_loss": -11.81833267211914, "global_step": 288289, "epoch": 1716} {"train_loss": -11.891565322875977, "global_step": 288290, "epoch": 1716} {"train_loss": -11.838338851928711, "global_step": 288291, "epoch": 1716} {"train_loss": -12.040270805358887, "global_step": 288292, "epoch": 1716} {"train_loss": -10.98973274230957, "global_step": 288293, "epoch": 1716} {"train_loss": -11.894149780273438, "global_step": 288294, "epoch": 1716} {"train_loss": -11.290685653686523, "global_step": 288295, "epoch": 1716} {"train_loss": -11.844888687133789, "global_step": 288296, "epoch": 1716} {"train_loss": -11.656096458435059, "global_step": 288297, "epoch": 1716} {"train_loss": -12.083614349365234, "global_step": 288298, "epoch": 1716} {"train_loss": -11.582571029663086, "global_step": 288299, "epoch": 1716} {"train_loss": -11.48833179473877, "global_step": 288300, "epoch": 1716} {"train_loss": -11.047638893127441, "global_step": 288301, "epoch": 1716} {"train_loss": -11.47401237487793, "global_step": 288302, "epoch": 1716} {"train_loss": -10.88736343383789, "global_step": 288303, "epoch": 1716} {"train_loss": -10.640470504760742, "global_step": 288304, "epoch": 1716} {"train_loss": -10.845314979553223, "global_step": 288305, "epoch": 1716} {"train_loss": -10.306877136230469, "global_step": 288306, "epoch": 1716} {"train_loss": -11.419803619384766, "global_step": 288307, "epoch": 1716} {"train_loss": -10.202033996582031, "global_step": 288308, "epoch": 1716} {"train_loss": -11.208446502685547, "global_step": 288309, "epoch": 1716} {"train_loss": -10.89859676361084, "global_step": 288310, "epoch": 1716} {"train_loss": -11.657038688659668, "global_step": 288311, "epoch": 1716} {"train_loss": -11.28314208984375, "global_step": 288312, "epoch": 1716} {"train_loss": -11.399362564086914, "global_step": 288313, "epoch": 1716} {"train_loss": -11.315885543823242, "global_step": 288314, "epoch": 1716} {"train_loss": -11.684930801391602, "global_step": 288315, "epoch": 1716} {"train_loss": -11.210821151733398, "global_step": 288316, "epoch": 1716} {"train_loss": -11.126663208007812, "global_step": 288317, "epoch": 1716} {"train_loss": -11.538305282592773, "global_step": 288318, "epoch": 1716} {"train_loss": -11.401601791381836, "global_step": 288319, "epoch": 1716} {"train_loss": -11.896867752075195, "global_step": 288320, "epoch": 1716} {"train_loss": -11.39211654663086, "global_step": 288321, "epoch": 1716} {"train_loss": -11.731786727905273, "global_step": 288322, "epoch": 1716} {"train_loss": -11.627328872680664, "global_step": 288323, "epoch": 1716} {"train_loss": -10.983428955078125, "global_step": 288324, "epoch": 1716} {"train_loss": -11.616109848022461, "global_step": 288325, "epoch": 1716} {"train_loss": -11.41151237487793, "global_step": 288326, "epoch": 1716} {"train_loss": -11.232038497924805, "global_step": 288327, "epoch": 1716} {"train_loss": -11.347651481628418, "global_step": 288328, "epoch": 1716} {"train_loss": -11.225343704223633, "global_step": 288329, "epoch": 1716} {"train_loss": -11.73763656616211, "global_step": 288330, "epoch": 1716} {"train_loss": -11.240594863891602, "global_step": 288331, "epoch": 1716} {"train_loss": -10.789093017578125, "global_step": 288332, "epoch": 1716} {"train_loss": -11.856395721435547, "global_step": 288333, "epoch": 1716} {"train_loss": -10.68592643737793, "global_step": 288334, "epoch": 1716} {"train_loss": -11.965312957763672, "global_step": 288335, "epoch": 1716} {"train_loss": -11.556373596191406, "global_step": 288336, "epoch": 1716} {"train_loss": -11.654158592224121, "global_step": 288337, "epoch": 1716} {"train_loss": -11.740617752075195, "global_step": 288338, "epoch": 1716} {"train_loss": -11.280807495117188, "global_step": 288339, "epoch": 1716} {"train_loss": -11.92790412902832, "global_step": 288340, "epoch": 1716} {"train_loss": -11.882331848144531, "global_step": 288341, "epoch": 1716} {"train_loss": -11.809041023254395, "global_step": 288342, "epoch": 1716} {"train_loss": -12.011902809143066, "global_step": 288343, "epoch": 1716} {"train_loss": -11.916069984436035, "global_step": 288344, "epoch": 1716} {"train_loss": -11.802417755126953, "global_step": 288345, "epoch": 1716} {"train_loss": -11.615815162658691, "global_step": 288346, "epoch": 1716} {"train_loss": -11.910057067871094, "global_step": 288347, "epoch": 1716} {"train_loss": -11.547452926635742, "global_step": 288348, "epoch": 1716} {"train_loss": -11.89944839477539, "global_step": 288349, "epoch": 1716} {"train_loss": -11.586722373962402, "global_step": 288350, "epoch": 1716} {"train_loss": -12.140592575073242, "global_step": 288351, "epoch": 1716} {"train_loss": -11.65158462524414, "global_step": 288352, "epoch": 1716} {"train_loss": -11.730030059814453, "global_step": 288353, "epoch": 1716} {"train_loss": -11.95329475402832, "global_step": 288354, "epoch": 1716} {"train_loss": -11.966691970825195, "global_step": 288355, "epoch": 1716} {"train_loss": -12.147193908691406, "global_step": 288356, "epoch": 1716} {"train_loss": -12.134270668029785, "global_step": 288357, "epoch": 1716} {"train_loss": -11.962121963500977, "global_step": 288358, "epoch": 1716} {"train_loss": -11.805047988891602, "global_step": 288359, "epoch": 1716} {"train_loss": -12.06286334991455, "global_step": 288360, "epoch": 1716} {"train_loss": -11.710172653198242, "global_step": 288361, "epoch": 1716} {"train_loss": -12.106785774230957, "global_step": 288362, "epoch": 1716} {"train_loss": -11.69766902923584, "global_step": 288363, "epoch": 1716} {"train_loss": -11.537514686584473, "global_step": 288364, "epoch": 1716} {"train_loss": -11.8764066696167, "global_step": 288365, "epoch": 1716} {"train_loss": -11.182520866394043, "global_step": 288366, "epoch": 1716} {"train_loss": -12.160051345825195, "global_step": 288367, "epoch": 1716} {"train_loss": -11.639928817749023, "global_step": 288368, "epoch": 1716} {"train_loss": -11.96042251586914, "global_step": 288369, "epoch": 1716} {"train_loss": -11.939669609069824, "global_step": 288370, "epoch": 1716} {"train_loss": -11.830462455749512, "global_step": 288371, "epoch": 1716} {"train_loss": -11.98233413696289, "global_step": 288372, "epoch": 1716} {"train_loss": -11.743389129638672, "global_step": 288373, "epoch": 1716} {"train_loss": -12.073896408081055, "global_step": 288374, "epoch": 1716} {"train_loss": -12.120747566223145, "global_step": 288375, "epoch": 1716} {"train_loss": -12.093587875366211, "global_step": 288376, "epoch": 1716} {"train_loss": -12.084026336669922, "global_step": 288377, "epoch": 1716} {"train_loss": -12.007872581481934, "global_step": 288378, "epoch": 1716} {"train_loss": -11.78581428527832, "global_step": 288379, "epoch": 1716} {"train_loss": -12.128114700317383, "global_step": 288380, "epoch": 1716} {"train_loss": -12.090948104858398, "global_step": 288381, "epoch": 1716} {"train_loss": -12.263632774353027, "global_step": 288382, "epoch": 1716} {"train_loss": -12.271167755126953, "global_step": 288383, "epoch": 1716} {"train_loss": -12.161396026611328, "global_step": 288384, "epoch": 1716} {"train_loss": -12.291622161865234, "global_step": 288385, "epoch": 1716} {"train_loss": -12.040705680847168, "global_step": 288386, "epoch": 1716} {"train_loss": -12.232061386108398, "global_step": 288387, "epoch": 1716} {"train_loss": -12.313253402709961, "global_step": 288388, "epoch": 1716} {"train_loss": -12.037164688110352, "global_step": 288389, "epoch": 1716} {"train_loss": -12.059871673583984, "global_step": 288390, "epoch": 1716} {"train_loss": -12.05975341796875, "global_step": 288391, "epoch": 1716} {"train_loss": -12.190585136413574, "global_step": 288392, "epoch": 1716} {"train_loss": -12.188009262084961, "global_step": 288393, "epoch": 1716} {"train_loss": -12.26303768157959, "global_step": 288394, "epoch": 1716} {"train_loss": -12.34671401977539, "global_step": 288395, "epoch": 1716} {"train_loss": -11.950416564941406, "global_step": 288396, "epoch": 1716} {"train_loss": -12.2362060546875, "global_step": 288397, "epoch": 1716} {"train_loss": -12.376453399658203, "global_step": 288398, "epoch": 1716} {"train_loss": -12.187750816345215, "global_step": 288399, "epoch": 1716} {"train_loss": -12.326265335083008, "global_step": 288400, "epoch": 1716} {"train_loss": -12.35551643371582, "global_step": 288401, "epoch": 1716} {"train_loss": -12.319565773010254, "global_step": 288402, "epoch": 1716} {"train_loss": -12.372057914733887, "global_step": 288403, "epoch": 1716} {"train_loss": -12.325397491455078, "global_step": 288404, "epoch": 1716} {"train_loss": -12.261116981506348, "global_step": 288405, "epoch": 1716} {"train_loss": -12.504395484924316, "global_step": 288406, "epoch": 1716} {"train_loss": -12.405223846435547, "global_step": 288407, "epoch": 1716} {"train_loss": -12.258832931518555, "global_step": 288408, "epoch": 1716} {"train_loss": -12.383750915527344, "global_step": 288409, "epoch": 1716} {"train_loss": -12.233051300048828, "global_step": 288410, "epoch": 1716} {"train_loss": -12.254456520080566, "global_step": 288411, "epoch": 1716} {"train_loss": -12.120621681213379, "global_step": 288412, "epoch": 1716} {"train_loss": -12.24789810180664, "global_step": 288413, "epoch": 1716} {"train_loss": -12.41128921508789, "global_step": 288414, "epoch": 1716} {"train_loss": -12.262094497680664, "global_step": 288415, "epoch": 1716} {"train_loss": -12.063344955444336, "global_step": 288416, "epoch": 1716} {"train_loss": -12.382577896118164, "global_step": 288417, "epoch": 1716} {"train_loss": -12.227972984313965, "global_step": 288418, "epoch": 1716} {"train_loss": -12.082216262817383, "global_step": 288419, "epoch": 1716} {"train_loss": -12.352714538574219, "global_step": 288420, "epoch": 1716} {"train_loss": -12.23291301727295, "global_step": 288421, "epoch": 1716} {"train_loss": -12.013957023620605, "global_step": 288422, "epoch": 1716} {"train_loss": -12.225431442260742, "global_step": 288423, "epoch": 1716} {"train_loss": -12.109100341796875, "global_step": 288424, "epoch": 1716} {"train_loss": -11.871219635009766, "global_step": 288425, "epoch": 1716} {"train_loss": -11.819703102111816, "global_step": 288426, "epoch": 1716} {"train_loss": -11.985433578491211, "global_step": 288427, "epoch": 1716} {"train_loss": -11.679555892944336, "global_step": 288428, "epoch": 1716} {"train_loss": -11.71667766571045, "global_step": 288429, "epoch": 1716} {"train_loss": -11.851805686950684, "global_step": 288430, "epoch": 1716} {"train_loss": -11.754911422729492, "global_step": 288431, "epoch": 1716} {"train_loss": -11.059789657592773, "global_step": 288432, "epoch": 1716} {"train_loss": -11.962152481079102, "global_step": 288433, "epoch": 1716} {"train_loss": -10.098710060119629, "global_step": 288434, "epoch": 1716} {"train_loss": -11.687126159667969, "global_step": 288435, "epoch": 1716} {"train_loss": -9.744207382202148, "global_step": 288436, "epoch": 1716} {"train_loss": -11.825557708740234, "global_step": 288437, "epoch": 1716} {"train_loss": -10.389408111572266, "global_step": 288438, "epoch": 1716} {"train_loss": -11.546392440795898, "global_step": 288439, "epoch": 1716} {"train_loss": -11.692171096801758, "global_step": 288440, "epoch": 1716} {"train_loss": -11.022560119628906, "global_step": 288441, "epoch": 1716} {"train_loss": -10.828557968139648, "global_step": 288442, "epoch": 1716} {"train_loss": -10.197858810424805, "global_step": 288443, "epoch": 1716} {"train_loss": -11.971362113952637, "global_step": 288444, "epoch": 1716} {"train_loss": -10.21378231048584, "global_step": 288445, "epoch": 1716} {"train_loss": -11.086797714233398, "global_step": 288446, "epoch": 1716} {"train_loss": -10.629179000854492, "global_step": 288447, "epoch": 1716} {"train_loss": -10.839493751525879, "global_step": 288448, "epoch": 1716} {"train_loss": -11.754196166992188, "global_step": 288449, "epoch": 1716} {"train_loss": -10.391117095947266, "global_step": 288450, "epoch": 1716} {"train_loss": -10.114875793457031, "global_step": 288451, "epoch": 1716} {"train_loss": -11.16085433959961, "global_step": 288452, "epoch": 1716} {"train_loss": -10.790000915527344, "global_step": 288453, "epoch": 1716} {"train_loss": -11.691141128540039, "global_step": 288454, "epoch": 1716} {"train_loss": -11.697154527618771, "global_step": 288455, "epoch": 1716, "val_loss": 278572.84375} {"train_loss": -11.51215934753418, "global_step": 288456, "epoch": 1717} {"train_loss": -11.338228225708008, "global_step": 288457, "epoch": 1717} {"train_loss": -11.816061019897461, "global_step": 288458, "epoch": 1717} {"train_loss": -11.512617111206055, "global_step": 288459, "epoch": 1717} {"train_loss": -11.907185554504395, "global_step": 288460, "epoch": 1717} {"train_loss": -11.492148399353027, "global_step": 288461, "epoch": 1717} {"train_loss": -11.909823417663574, "global_step": 288462, "epoch": 1717} {"train_loss": -11.983736038208008, "global_step": 288463, "epoch": 1717} {"train_loss": -11.441692352294922, "global_step": 288464, "epoch": 1717} {"train_loss": -11.651689529418945, "global_step": 288465, "epoch": 1717} {"train_loss": -11.933636665344238, "global_step": 288466, "epoch": 1717} {"train_loss": -11.460628509521484, "global_step": 288467, "epoch": 1717} {"train_loss": -11.63375473022461, "global_step": 288468, "epoch": 1717} {"train_loss": -11.74643611907959, "global_step": 288469, "epoch": 1717} {"train_loss": -11.560083389282227, "global_step": 288470, "epoch": 1717} {"train_loss": -11.75772762298584, "global_step": 288471, "epoch": 1717} {"train_loss": -11.900156021118164, "global_step": 288472, "epoch": 1717} {"train_loss": -12.00132942199707, "global_step": 288473, "epoch": 1717} {"train_loss": -11.939083099365234, "global_step": 288474, "epoch": 1717} {"train_loss": -12.128561019897461, "global_step": 288475, "epoch": 1717} {"train_loss": -11.97285270690918, "global_step": 288476, "epoch": 1717} {"train_loss": -11.96323013305664, "global_step": 288477, "epoch": 1717} {"train_loss": -11.827309608459473, "global_step": 288478, "epoch": 1717} {"train_loss": -11.958391189575195, "global_step": 288479, "epoch": 1717} {"train_loss": -12.046395301818848, "global_step": 288480, "epoch": 1717} {"train_loss": -11.908601760864258, "global_step": 288481, "epoch": 1717} {"train_loss": -12.158197402954102, "global_step": 288482, "epoch": 1717} {"train_loss": -11.917244911193848, "global_step": 288483, "epoch": 1717} {"train_loss": -11.754413604736328, "global_step": 288484, "epoch": 1717} {"train_loss": -12.105859756469727, "global_step": 288485, "epoch": 1717} {"train_loss": -11.798595428466797, "global_step": 288486, "epoch": 1717} {"train_loss": -11.886576652526855, "global_step": 288487, "epoch": 1717} {"train_loss": -12.088722229003906, "global_step": 288488, "epoch": 1717} {"train_loss": -11.863670349121094, "global_step": 288489, "epoch": 1717} {"train_loss": -11.88238525390625, "global_step": 288490, "epoch": 1717} {"train_loss": -11.997163772583008, "global_step": 288491, "epoch": 1717} {"train_loss": -11.988649368286133, "global_step": 288492, "epoch": 1717} {"train_loss": -11.807771682739258, "global_step": 288493, "epoch": 1717} {"train_loss": -11.936786651611328, "global_step": 288494, "epoch": 1717} {"train_loss": -11.544732093811035, "global_step": 288495, "epoch": 1717} {"train_loss": -12.033435821533203, "global_step": 288496, "epoch": 1717} {"train_loss": -12.168731689453125, "global_step": 288497, "epoch": 1717} {"train_loss": -11.918878555297852, "global_step": 288498, "epoch": 1717} {"train_loss": -12.17412281036377, "global_step": 288499, "epoch": 1717} {"train_loss": -11.994443893432617, "global_step": 288500, "epoch": 1717} {"train_loss": -11.819549560546875, "global_step": 288501, "epoch": 1717} {"train_loss": -12.077407836914062, "global_step": 288502, "epoch": 1717} {"train_loss": -11.926569938659668, "global_step": 288503, "epoch": 1717} {"train_loss": -11.866432189941406, "global_step": 288504, "epoch": 1717} {"train_loss": -11.95657730102539, "global_step": 288505, "epoch": 1717} {"train_loss": -11.481986045837402, "global_step": 288506, "epoch": 1717} {"train_loss": -11.90896987915039, "global_step": 288507, "epoch": 1717} {"train_loss": -11.974323272705078, "global_step": 288508, "epoch": 1717} {"train_loss": -11.40826416015625, "global_step": 288509, "epoch": 1717} {"train_loss": -11.838488578796387, "global_step": 288510, "epoch": 1717} {"train_loss": -11.807857513427734, "global_step": 288511, "epoch": 1717} {"train_loss": -12.029669761657715, "global_step": 288512, "epoch": 1717} {"train_loss": -12.046184539794922, "global_step": 288513, "epoch": 1717} {"train_loss": -11.46827220916748, "global_step": 288514, "epoch": 1717} {"train_loss": -12.188167572021484, "global_step": 288515, "epoch": 1717} {"train_loss": -11.903059005737305, "global_step": 288516, "epoch": 1717} {"train_loss": -12.11254596710205, "global_step": 288517, "epoch": 1717} {"train_loss": -12.15312671661377, "global_step": 288518, "epoch": 1717} {"train_loss": -12.02891731262207, "global_step": 288519, "epoch": 1717} {"train_loss": -11.84794807434082, "global_step": 288520, "epoch": 1717} {"train_loss": -11.97793197631836, "global_step": 288521, "epoch": 1717} {"train_loss": -11.832889556884766, "global_step": 288522, "epoch": 1717} {"train_loss": -12.186196327209473, "global_step": 288523, "epoch": 1717} {"train_loss": -11.76048755645752, "global_step": 288524, "epoch": 1717} {"train_loss": -12.335149765014648, "global_step": 288525, "epoch": 1717} {"train_loss": -12.040704727172852, "global_step": 288526, "epoch": 1717} {"train_loss": -11.909690856933594, "global_step": 288527, "epoch": 1717} {"train_loss": -12.18526554107666, "global_step": 288528, "epoch": 1717} {"train_loss": -12.365755081176758, "global_step": 288529, "epoch": 1717} {"train_loss": -12.166084289550781, "global_step": 288530, "epoch": 1717} {"train_loss": -12.404869079589844, "global_step": 288531, "epoch": 1717} {"train_loss": -12.10411262512207, "global_step": 288532, "epoch": 1717} {"train_loss": -11.924848556518555, "global_step": 288533, "epoch": 1717} {"train_loss": -12.161176681518555, "global_step": 288534, "epoch": 1717} {"train_loss": -12.110128402709961, "global_step": 288535, "epoch": 1717} {"train_loss": -11.927396774291992, "global_step": 288536, "epoch": 1717} {"train_loss": -12.065323829650879, "global_step": 288537, "epoch": 1717} {"train_loss": -12.111103057861328, "global_step": 288538, "epoch": 1717} {"train_loss": -12.094709396362305, "global_step": 288539, "epoch": 1717} {"train_loss": -12.10305404663086, "global_step": 288540, "epoch": 1717} {"train_loss": -12.163747787475586, "global_step": 288541, "epoch": 1717} {"train_loss": -12.278423309326172, "global_step": 288542, "epoch": 1717} {"train_loss": -12.145594596862793, "global_step": 288543, "epoch": 1717} {"train_loss": -12.126779556274414, "global_step": 288544, "epoch": 1717} {"train_loss": -12.12520980834961, "global_step": 288545, "epoch": 1717} {"train_loss": -12.078996658325195, "global_step": 288546, "epoch": 1717} {"train_loss": -11.97231388092041, "global_step": 288547, "epoch": 1717} {"train_loss": -12.100065231323242, "global_step": 288548, "epoch": 1717} {"train_loss": -11.893304824829102, "global_step": 288549, "epoch": 1717} {"train_loss": -12.31980037689209, "global_step": 288550, "epoch": 1717} {"train_loss": -11.666122436523438, "global_step": 288551, "epoch": 1717} {"train_loss": -11.88986873626709, "global_step": 288552, "epoch": 1717} {"train_loss": -12.29559326171875, "global_step": 288553, "epoch": 1717} {"train_loss": -11.933572769165039, "global_step": 288554, "epoch": 1717} {"train_loss": -11.763296127319336, "global_step": 288555, "epoch": 1717} {"train_loss": -12.442825317382812, "global_step": 288556, "epoch": 1717} {"train_loss": -12.374140739440918, "global_step": 288557, "epoch": 1717} {"train_loss": -12.172521591186523, "global_step": 288558, "epoch": 1717} {"train_loss": -12.262809753417969, "global_step": 288559, "epoch": 1717} {"train_loss": -11.868524551391602, "global_step": 288560, "epoch": 1717} {"train_loss": -12.432148933410645, "global_step": 288561, "epoch": 1717} {"train_loss": -11.904844284057617, "global_step": 288562, "epoch": 1717} {"train_loss": -12.103821754455566, "global_step": 288563, "epoch": 1717} {"train_loss": -12.114253997802734, "global_step": 288564, "epoch": 1717} {"train_loss": -11.858020782470703, "global_step": 288565, "epoch": 1717} {"train_loss": -12.540033340454102, "global_step": 288566, "epoch": 1717} {"train_loss": -11.773833274841309, "global_step": 288567, "epoch": 1717} {"train_loss": -10.78510570526123, "global_step": 288568, "epoch": 1717} {"train_loss": -12.103368759155273, "global_step": 288569, "epoch": 1717} {"train_loss": -11.34536361694336, "global_step": 288570, "epoch": 1717} {"train_loss": -10.567010879516602, "global_step": 288571, "epoch": 1717} {"train_loss": -11.622152328491211, "global_step": 288572, "epoch": 1717} {"train_loss": -11.662083625793457, "global_step": 288573, "epoch": 1717} {"train_loss": -10.778238296508789, "global_step": 288574, "epoch": 1717} {"train_loss": -11.936312675476074, "global_step": 288575, "epoch": 1717} {"train_loss": -11.330307006835938, "global_step": 288576, "epoch": 1717} {"train_loss": -10.841371536254883, "global_step": 288577, "epoch": 1717} {"train_loss": -11.600931167602539, "global_step": 288578, "epoch": 1717} {"train_loss": -10.78022575378418, "global_step": 288579, "epoch": 1717} {"train_loss": -11.773962020874023, "global_step": 288580, "epoch": 1717} {"train_loss": -11.199337005615234, "global_step": 288581, "epoch": 1717} {"train_loss": -9.588146209716797, "global_step": 288582, "epoch": 1717} {"train_loss": -11.811553955078125, "global_step": 288583, "epoch": 1717} {"train_loss": -9.83684253692627, "global_step": 288584, "epoch": 1717} {"train_loss": -10.875041007995605, "global_step": 288585, "epoch": 1717} {"train_loss": -10.798127174377441, "global_step": 288586, "epoch": 1717} {"train_loss": -11.242701530456543, "global_step": 288587, "epoch": 1717} {"train_loss": -11.389044761657715, "global_step": 288588, "epoch": 1717} {"train_loss": -11.564470291137695, "global_step": 288589, "epoch": 1717} {"train_loss": -12.033926010131836, "global_step": 288590, "epoch": 1717} {"train_loss": -11.50522232055664, "global_step": 288591, "epoch": 1717} {"train_loss": -11.961885452270508, "global_step": 288592, "epoch": 1717} {"train_loss": -11.480978012084961, "global_step": 288593, "epoch": 1717} {"train_loss": -11.898969650268555, "global_step": 288594, "epoch": 1717} {"train_loss": -12.031042098999023, "global_step": 288595, "epoch": 1717} {"train_loss": -12.035395622253418, "global_step": 288596, "epoch": 1717} {"train_loss": -11.835285186767578, "global_step": 288597, "epoch": 1717} {"train_loss": -11.905699729919434, "global_step": 288598, "epoch": 1717} {"train_loss": -11.836441040039062, "global_step": 288599, "epoch": 1717} {"train_loss": -11.606801986694336, "global_step": 288600, "epoch": 1717} {"train_loss": -11.835896492004395, "global_step": 288601, "epoch": 1717} {"train_loss": -11.94289779663086, "global_step": 288602, "epoch": 1717} {"train_loss": -11.793357849121094, "global_step": 288603, "epoch": 1717} {"train_loss": -11.578144073486328, "global_step": 288604, "epoch": 1717} {"train_loss": -11.305646896362305, "global_step": 288605, "epoch": 1717} {"train_loss": -11.859674453735352, "global_step": 288606, "epoch": 1717} {"train_loss": -11.585542678833008, "global_step": 288607, "epoch": 1717} {"train_loss": -11.764806747436523, "global_step": 288608, "epoch": 1717} {"train_loss": -11.896196365356445, "global_step": 288609, "epoch": 1717} {"train_loss": -12.228982925415039, "global_step": 288610, "epoch": 1717} {"train_loss": -11.808446884155273, "global_step": 288611, "epoch": 1717} {"train_loss": -12.024789810180664, "global_step": 288612, "epoch": 1717} {"train_loss": -11.999210357666016, "global_step": 288613, "epoch": 1717} {"train_loss": -12.191617965698242, "global_step": 288614, "epoch": 1717} {"train_loss": -12.1468505859375, "global_step": 288615, "epoch": 1717} {"train_loss": -12.170987129211426, "global_step": 288616, "epoch": 1717} {"train_loss": -12.004547119140625, "global_step": 288617, "epoch": 1717} {"train_loss": -12.193824768066406, "global_step": 288618, "epoch": 1717} {"train_loss": -12.01992416381836, "global_step": 288619, "epoch": 1717} {"train_loss": -12.079829216003418, "global_step": 288620, "epoch": 1717} {"train_loss": -11.93969440460205, "global_step": 288621, "epoch": 1717} {"train_loss": -12.075576782226562, "global_step": 288622, "epoch": 1717} {"train_loss": -11.842743442172097, "global_step": 288623, "epoch": 1717, "val_loss": 278030.71875} {"train_loss": -11.997514724731445, "global_step": 288624, "epoch": 1718} {"train_loss": -11.865800857543945, "global_step": 288625, "epoch": 1718} {"train_loss": -12.116832733154297, "global_step": 288626, "epoch": 1718} {"train_loss": -12.121740341186523, "global_step": 288627, "epoch": 1718} {"train_loss": -11.88813591003418, "global_step": 288628, "epoch": 1718} {"train_loss": -12.14738655090332, "global_step": 288629, "epoch": 1718} {"train_loss": -12.024417877197266, "global_step": 288630, "epoch": 1718} {"train_loss": -12.171834945678711, "global_step": 288631, "epoch": 1718} {"train_loss": -12.296717643737793, "global_step": 288632, "epoch": 1718} {"train_loss": -12.162513732910156, "global_step": 288633, "epoch": 1718} {"train_loss": -12.305712699890137, "global_step": 288634, "epoch": 1718} {"train_loss": -12.287115097045898, "global_step": 288635, "epoch": 1718} {"train_loss": -12.253254890441895, "global_step": 288636, "epoch": 1718} {"train_loss": -12.10585880279541, "global_step": 288637, "epoch": 1718} {"train_loss": -12.269299507141113, "global_step": 288638, "epoch": 1718} {"train_loss": -12.2823486328125, "global_step": 288639, "epoch": 1718} {"train_loss": -12.23396110534668, "global_step": 288640, "epoch": 1718} {"train_loss": -12.216814041137695, "global_step": 288641, "epoch": 1718} {"train_loss": -12.104182243347168, "global_step": 288642, "epoch": 1718} {"train_loss": -12.283487319946289, "global_step": 288643, "epoch": 1718} {"train_loss": -12.323387145996094, "global_step": 288644, "epoch": 1718} {"train_loss": -12.164588928222656, "global_step": 288645, "epoch": 1718} {"train_loss": -12.29220962524414, "global_step": 288646, "epoch": 1718} {"train_loss": -12.286913871765137, "global_step": 288647, "epoch": 1718} {"train_loss": -12.407085418701172, "global_step": 288648, "epoch": 1718} {"train_loss": -12.250967025756836, "global_step": 288649, "epoch": 1718} {"train_loss": -12.260971069335938, "global_step": 288650, "epoch": 1718} {"train_loss": -12.46547794342041, "global_step": 288651, "epoch": 1718} {"train_loss": -12.126141548156738, "global_step": 288652, "epoch": 1718} {"train_loss": -12.503440856933594, "global_step": 288653, "epoch": 1718} {"train_loss": -12.35976791381836, "global_step": 288654, "epoch": 1718} {"train_loss": -12.243465423583984, "global_step": 288655, "epoch": 1718} {"train_loss": -12.430486679077148, "global_step": 288656, "epoch": 1718} {"train_loss": -12.566511154174805, "global_step": 288657, "epoch": 1718} {"train_loss": -12.372876167297363, "global_step": 288658, "epoch": 1718} {"train_loss": -12.299615859985352, "global_step": 288659, "epoch": 1718} {"train_loss": -12.228815078735352, "global_step": 288660, "epoch": 1718} {"train_loss": -12.354808807373047, "global_step": 288661, "epoch": 1718} {"train_loss": -12.14598274230957, "global_step": 288662, "epoch": 1718} {"train_loss": -12.22402572631836, "global_step": 288663, "epoch": 1718} {"train_loss": -12.13433837890625, "global_step": 288664, "epoch": 1718} {"train_loss": -12.035487174987793, "global_step": 288665, "epoch": 1718} {"train_loss": -12.346550941467285, "global_step": 288666, "epoch": 1718} {"train_loss": -11.83551025390625, "global_step": 288667, "epoch": 1718} {"train_loss": -10.724943161010742, "global_step": 288668, "epoch": 1718} {"train_loss": -11.088898658752441, "global_step": 288669, "epoch": 1718} {"train_loss": -11.842934608459473, "global_step": 288670, "epoch": 1718} {"train_loss": -12.116130828857422, "global_step": 288671, "epoch": 1718} {"train_loss": -12.121171951293945, "global_step": 288672, "epoch": 1718} {"train_loss": -11.717761993408203, "global_step": 288673, "epoch": 1718} {"train_loss": -11.528602600097656, "global_step": 288674, "epoch": 1718} {"train_loss": -12.094159126281738, "global_step": 288675, "epoch": 1718} {"train_loss": -11.686097145080566, "global_step": 288676, "epoch": 1718} {"train_loss": -11.5187406539917, "global_step": 288677, "epoch": 1718} {"train_loss": -12.038030624389648, "global_step": 288678, "epoch": 1718} {"train_loss": -11.31441879272461, "global_step": 288679, "epoch": 1718} {"train_loss": -10.423072814941406, "global_step": 288680, "epoch": 1718} {"train_loss": -11.271004676818848, "global_step": 288681, "epoch": 1718} {"train_loss": -9.869711875915527, "global_step": 288682, "epoch": 1718} {"train_loss": -9.758218765258789, "global_step": 288683, "epoch": 1718} {"train_loss": -11.37049388885498, "global_step": 288684, "epoch": 1718} {"train_loss": -11.737129211425781, "global_step": 288685, "epoch": 1718} {"train_loss": -11.480303764343262, "global_step": 288686, "epoch": 1718} {"train_loss": -11.599252700805664, "global_step": 288687, "epoch": 1718} {"train_loss": -11.926246643066406, "global_step": 288688, "epoch": 1718} {"train_loss": -11.107126235961914, "global_step": 288689, "epoch": 1718} {"train_loss": -11.027636528015137, "global_step": 288690, "epoch": 1718} {"train_loss": -11.045225143432617, "global_step": 288691, "epoch": 1718} {"train_loss": -11.55505657196045, "global_step": 288692, "epoch": 1718} {"train_loss": -11.115011215209961, "global_step": 288693, "epoch": 1718} {"train_loss": -12.078347206115723, "global_step": 288694, "epoch": 1718} {"train_loss": -9.92011833190918, "global_step": 288695, "epoch": 1718} {"train_loss": -11.325477600097656, "global_step": 288696, "epoch": 1718} {"train_loss": -10.633783340454102, "global_step": 288697, "epoch": 1718} {"train_loss": -9.607547760009766, "global_step": 288698, "epoch": 1718} {"train_loss": -11.596966743469238, "global_step": 288699, "epoch": 1718} {"train_loss": -9.210367202758789, "global_step": 288700, "epoch": 1718} {"train_loss": -11.217856407165527, "global_step": 288701, "epoch": 1718} {"train_loss": -10.726799011230469, "global_step": 288702, "epoch": 1718} {"train_loss": -9.683189392089844, "global_step": 288703, "epoch": 1718} {"train_loss": -9.074461936950684, "global_step": 288704, "epoch": 1718} {"train_loss": -11.163399696350098, "global_step": 288705, "epoch": 1718} {"train_loss": -8.969139099121094, "global_step": 288706, "epoch": 1718} {"train_loss": -10.989453315734863, "global_step": 288707, "epoch": 1718} {"train_loss": -9.340187072753906, "global_step": 288708, "epoch": 1718} {"train_loss": -10.778390884399414, "global_step": 288709, "epoch": 1718} {"train_loss": -8.612783432006836, "global_step": 288710, "epoch": 1718} {"train_loss": -11.462034225463867, "global_step": 288711, "epoch": 1718} {"train_loss": -8.672933578491211, "global_step": 288712, "epoch": 1718} {"train_loss": -11.106693267822266, "global_step": 288713, "epoch": 1718} {"train_loss": -8.98475456237793, "global_step": 288714, "epoch": 1718} {"train_loss": -10.110407829284668, "global_step": 288715, "epoch": 1718} {"train_loss": -9.011752128601074, "global_step": 288716, "epoch": 1718} {"train_loss": -9.09318733215332, "global_step": 288717, "epoch": 1718} {"train_loss": -10.158893585205078, "global_step": 288718, "epoch": 1718} {"train_loss": -8.197443962097168, "global_step": 288719, "epoch": 1718} {"train_loss": -11.096478462219238, "global_step": 288720, "epoch": 1718} {"train_loss": -8.936423301696777, "global_step": 288721, "epoch": 1718} {"train_loss": -9.874813079833984, "global_step": 288722, "epoch": 1718} {"train_loss": -10.400871276855469, "global_step": 288723, "epoch": 1718} {"train_loss": -10.04054069519043, "global_step": 288724, "epoch": 1718} {"train_loss": -11.155120849609375, "global_step": 288725, "epoch": 1718} {"train_loss": -9.557405471801758, "global_step": 288726, "epoch": 1718} {"train_loss": -10.815549850463867, "global_step": 288727, "epoch": 1718} {"train_loss": -11.100555419921875, "global_step": 288728, "epoch": 1718} {"train_loss": -10.081645965576172, "global_step": 288729, "epoch": 1718} {"train_loss": -11.878562927246094, "global_step": 288730, "epoch": 1718} {"train_loss": -9.798395156860352, "global_step": 288731, "epoch": 1718} {"train_loss": -10.262499809265137, "global_step": 288732, "epoch": 1718} {"train_loss": -11.231491088867188, "global_step": 288733, "epoch": 1718} {"train_loss": -10.47652816772461, "global_step": 288734, "epoch": 1718} {"train_loss": -11.240974426269531, "global_step": 288735, "epoch": 1718} {"train_loss": -11.385236740112305, "global_step": 288736, "epoch": 1718} {"train_loss": -11.119796752929688, "global_step": 288737, "epoch": 1718} {"train_loss": -11.230432510375977, "global_step": 288738, "epoch": 1718} {"train_loss": -11.140432357788086, "global_step": 288739, "epoch": 1718} {"train_loss": -11.055519104003906, "global_step": 288740, "epoch": 1718} {"train_loss": -11.24932861328125, "global_step": 288741, "epoch": 1718} {"train_loss": -10.916259765625, "global_step": 288742, "epoch": 1718} {"train_loss": -11.355448722839355, "global_step": 288743, "epoch": 1718} {"train_loss": -11.587615966796875, "global_step": 288744, "epoch": 1718} {"train_loss": -11.508733749389648, "global_step": 288745, "epoch": 1718} {"train_loss": -11.644368171691895, "global_step": 288746, "epoch": 1718} {"train_loss": -11.599367141723633, "global_step": 288747, "epoch": 1718} {"train_loss": -11.743029594421387, "global_step": 288748, "epoch": 1718} {"train_loss": -11.498705863952637, "global_step": 288749, "epoch": 1718} {"train_loss": -11.766836166381836, "global_step": 288750, "epoch": 1718} {"train_loss": -11.553123474121094, "global_step": 288751, "epoch": 1718} {"train_loss": -11.664992332458496, "global_step": 288752, "epoch": 1718} {"train_loss": -11.682901382446289, "global_step": 288753, "epoch": 1718} {"train_loss": -11.563457489013672, "global_step": 288754, "epoch": 1718} {"train_loss": -11.808639526367188, "global_step": 288755, "epoch": 1718} {"train_loss": -11.85903549194336, "global_step": 288756, "epoch": 1718} {"train_loss": -11.52798080444336, "global_step": 288757, "epoch": 1718} {"train_loss": -11.765170097351074, "global_step": 288758, "epoch": 1718} {"train_loss": -11.72199535369873, "global_step": 288759, "epoch": 1718} {"train_loss": -11.646965026855469, "global_step": 288760, "epoch": 1718} {"train_loss": -11.839310646057129, "global_step": 288761, "epoch": 1718} {"train_loss": -11.761253356933594, "global_step": 288762, "epoch": 1718} {"train_loss": -11.75912857055664, "global_step": 288763, "epoch": 1718} {"train_loss": -11.861984252929688, "global_step": 288764, "epoch": 1718} {"train_loss": -11.901092529296875, "global_step": 288765, "epoch": 1718} {"train_loss": -11.960744857788086, "global_step": 288766, "epoch": 1718} {"train_loss": -11.889347076416016, "global_step": 288767, "epoch": 1718} {"train_loss": -11.781444549560547, "global_step": 288768, "epoch": 1718} {"train_loss": -11.858080863952637, "global_step": 288769, "epoch": 1718} {"train_loss": -11.750761032104492, "global_step": 288770, "epoch": 1718} {"train_loss": -11.856681823730469, "global_step": 288771, "epoch": 1718} {"train_loss": -12.057587623596191, "global_step": 288772, "epoch": 1718} {"train_loss": -11.893049240112305, "global_step": 288773, "epoch": 1718} {"train_loss": -12.097471237182617, "global_step": 288774, "epoch": 1718} {"train_loss": -12.038424491882324, "global_step": 288775, "epoch": 1718} {"train_loss": -12.098950386047363, "global_step": 288776, "epoch": 1718} {"train_loss": -12.1971435546875, "global_step": 288777, "epoch": 1718} {"train_loss": -12.024333953857422, "global_step": 288778, "epoch": 1718} {"train_loss": -12.02771282196045, "global_step": 288779, "epoch": 1718} {"train_loss": -12.136370658874512, "global_step": 288780, "epoch": 1718} {"train_loss": -12.058679580688477, "global_step": 288781, "epoch": 1718} {"train_loss": -12.265382766723633, "global_step": 288782, "epoch": 1718} {"train_loss": -12.095860481262207, "global_step": 288783, "epoch": 1718} {"train_loss": -12.182699203491211, "global_step": 288784, "epoch": 1718} {"train_loss": -12.22626781463623, "global_step": 288785, "epoch": 1718} {"train_loss": -12.198907852172852, "global_step": 288786, "epoch": 1718} {"train_loss": -12.34360122680664, "global_step": 288787, "epoch": 1718} {"train_loss": -12.400379180908203, "global_step": 288788, "epoch": 1718} {"train_loss": -12.1785888671875, "global_step": 288789, "epoch": 1718} {"train_loss": -12.266578674316406, "global_step": 288790, "epoch": 1718} {"train_loss": -11.448836400395347, "global_step": 288791, "epoch": 1718, "val_loss": 278385.96875} {"train_loss": -12.333259582519531, "global_step": 288792, "epoch": 1719} {"train_loss": -12.269192695617676, "global_step": 288793, "epoch": 1719} {"train_loss": -12.183338165283203, "global_step": 288794, "epoch": 1719} {"train_loss": -12.360950469970703, "global_step": 288795, "epoch": 1719} {"train_loss": -12.226781845092773, "global_step": 288796, "epoch": 1719} {"train_loss": -12.271379470825195, "global_step": 288797, "epoch": 1719} {"train_loss": -12.31299114227295, "global_step": 288798, "epoch": 1719} {"train_loss": -12.282169342041016, "global_step": 288799, "epoch": 1719} {"train_loss": -12.399576187133789, "global_step": 288800, "epoch": 1719} {"train_loss": -12.232871055603027, "global_step": 288801, "epoch": 1719} {"train_loss": -12.151626586914062, "global_step": 288802, "epoch": 1719} {"train_loss": -12.254814147949219, "global_step": 288803, "epoch": 1719} {"train_loss": -12.211359977722168, "global_step": 288804, "epoch": 1719} {"train_loss": -12.35074234008789, "global_step": 288805, "epoch": 1719} {"train_loss": -12.213138580322266, "global_step": 288806, "epoch": 1719} {"train_loss": -12.243160247802734, "global_step": 288807, "epoch": 1719} {"train_loss": -12.233396530151367, "global_step": 288808, "epoch": 1719} {"train_loss": -12.205703735351562, "global_step": 288809, "epoch": 1719} {"train_loss": -12.300085067749023, "global_step": 288810, "epoch": 1719} {"train_loss": -12.172369003295898, "global_step": 288811, "epoch": 1719} {"train_loss": -12.279363632202148, "global_step": 288812, "epoch": 1719} {"train_loss": -12.195475578308105, "global_step": 288813, "epoch": 1719} {"train_loss": -12.273905754089355, "global_step": 288814, "epoch": 1719} {"train_loss": -12.498111724853516, "global_step": 288815, "epoch": 1719} {"train_loss": -12.335399627685547, "global_step": 288816, "epoch": 1719} {"train_loss": -12.154598236083984, "global_step": 288817, "epoch": 1719} {"train_loss": -12.194721221923828, "global_step": 288818, "epoch": 1719} {"train_loss": -12.116473197937012, "global_step": 288819, "epoch": 1719} {"train_loss": -12.047506332397461, "global_step": 288820, "epoch": 1719} {"train_loss": -12.2835693359375, "global_step": 288821, "epoch": 1719} {"train_loss": -11.617673873901367, "global_step": 288822, "epoch": 1719} {"train_loss": -11.733802795410156, "global_step": 288823, "epoch": 1719} {"train_loss": -12.217508316040039, "global_step": 288824, "epoch": 1719} {"train_loss": -12.295092582702637, "global_step": 288825, "epoch": 1719} {"train_loss": -11.291942596435547, "global_step": 288826, "epoch": 1719} {"train_loss": -11.182500839233398, "global_step": 288827, "epoch": 1719} {"train_loss": -11.609651565551758, "global_step": 288828, "epoch": 1719} {"train_loss": -12.13267707824707, "global_step": 288829, "epoch": 1719} {"train_loss": -11.36988353729248, "global_step": 288830, "epoch": 1719} {"train_loss": -11.992603302001953, "global_step": 288831, "epoch": 1719} {"train_loss": -11.803503036499023, "global_step": 288832, "epoch": 1719} {"train_loss": -11.948237419128418, "global_step": 288833, "epoch": 1719} {"train_loss": -11.727743148803711, "global_step": 288834, "epoch": 1719} {"train_loss": -11.976186752319336, "global_step": 288835, "epoch": 1719} {"train_loss": -11.507847785949707, "global_step": 288836, "epoch": 1719} {"train_loss": -11.260112762451172, "global_step": 288837, "epoch": 1719} {"train_loss": -12.012357711791992, "global_step": 288838, "epoch": 1719} {"train_loss": -11.923789978027344, "global_step": 288839, "epoch": 1719} {"train_loss": -11.940618515014648, "global_step": 288840, "epoch": 1719} {"train_loss": -11.398442268371582, "global_step": 288841, "epoch": 1719} {"train_loss": -12.083643913269043, "global_step": 288842, "epoch": 1719} {"train_loss": -11.700533866882324, "global_step": 288843, "epoch": 1719} {"train_loss": -11.961505889892578, "global_step": 288844, "epoch": 1719} {"train_loss": -12.11845874786377, "global_step": 288845, "epoch": 1719} {"train_loss": -12.250577926635742, "global_step": 288846, "epoch": 1719} {"train_loss": -11.812769889831543, "global_step": 288847, "epoch": 1719} {"train_loss": -12.127918243408203, "global_step": 288848, "epoch": 1719} {"train_loss": -12.148347854614258, "global_step": 288849, "epoch": 1719} {"train_loss": -12.016938209533691, "global_step": 288850, "epoch": 1719} {"train_loss": -11.867086410522461, "global_step": 288851, "epoch": 1719} {"train_loss": -11.484785079956055, "global_step": 288852, "epoch": 1719} {"train_loss": -12.082626342773438, "global_step": 288853, "epoch": 1719} {"train_loss": -11.951970100402832, "global_step": 288854, "epoch": 1719} {"train_loss": -11.996535301208496, "global_step": 288855, "epoch": 1719} {"train_loss": -11.96009635925293, "global_step": 288856, "epoch": 1719} {"train_loss": -11.942577362060547, "global_step": 288857, "epoch": 1719} {"train_loss": -11.940637588500977, "global_step": 288858, "epoch": 1719} {"train_loss": -11.470939636230469, "global_step": 288859, "epoch": 1719} {"train_loss": -11.429513931274414, "global_step": 288860, "epoch": 1719} {"train_loss": -11.301965713500977, "global_step": 288861, "epoch": 1719} {"train_loss": -12.078563690185547, "global_step": 288862, "epoch": 1719} {"train_loss": -11.813461303710938, "global_step": 288863, "epoch": 1719} {"train_loss": -12.03872299194336, "global_step": 288864, "epoch": 1719} {"train_loss": -11.987972259521484, "global_step": 288865, "epoch": 1719} {"train_loss": -12.097146987915039, "global_step": 288866, "epoch": 1719} {"train_loss": -12.081074714660645, "global_step": 288867, "epoch": 1719} {"train_loss": -12.189521789550781, "global_step": 288868, "epoch": 1719} {"train_loss": -11.659270286560059, "global_step": 288869, "epoch": 1719} {"train_loss": -11.96617317199707, "global_step": 288870, "epoch": 1719} {"train_loss": -12.001812934875488, "global_step": 288871, "epoch": 1719} {"train_loss": -12.001859664916992, "global_step": 288872, "epoch": 1719} {"train_loss": -12.01531982421875, "global_step": 288873, "epoch": 1719} {"train_loss": -12.23558521270752, "global_step": 288874, "epoch": 1719} {"train_loss": -12.113941192626953, "global_step": 288875, "epoch": 1719} {"train_loss": -12.323253631591797, "global_step": 288876, "epoch": 1719} {"train_loss": -11.796212196350098, "global_step": 288877, "epoch": 1719} {"train_loss": -12.03929615020752, "global_step": 288878, "epoch": 1719} {"train_loss": -12.228196144104004, "global_step": 288879, "epoch": 1719} {"train_loss": -12.369861602783203, "global_step": 288880, "epoch": 1719} {"train_loss": -11.546480178833008, "global_step": 288881, "epoch": 1719} {"train_loss": -12.104783058166504, "global_step": 288882, "epoch": 1719} {"train_loss": -11.88656997680664, "global_step": 288883, "epoch": 1719} {"train_loss": -11.836365699768066, "global_step": 288884, "epoch": 1719} {"train_loss": -11.858436584472656, "global_step": 288885, "epoch": 1719} {"train_loss": -11.914264678955078, "global_step": 288886, "epoch": 1719} {"train_loss": -12.088972091674805, "global_step": 288887, "epoch": 1719} {"train_loss": -11.954265594482422, "global_step": 288888, "epoch": 1719} {"train_loss": -11.903648376464844, "global_step": 288889, "epoch": 1719} {"train_loss": -12.009973526000977, "global_step": 288890, "epoch": 1719} {"train_loss": -11.365769386291504, "global_step": 288891, "epoch": 1719} {"train_loss": -11.00437068939209, "global_step": 288892, "epoch": 1719} {"train_loss": -11.801437377929688, "global_step": 288893, "epoch": 1719} {"train_loss": -11.83498764038086, "global_step": 288894, "epoch": 1719} {"train_loss": -11.72557258605957, "global_step": 288895, "epoch": 1719} {"train_loss": -11.21337604522705, "global_step": 288896, "epoch": 1719} {"train_loss": -11.95132827758789, "global_step": 288897, "epoch": 1719} {"train_loss": -11.648905754089355, "global_step": 288898, "epoch": 1719} {"train_loss": -11.210729598999023, "global_step": 288899, "epoch": 1719} {"train_loss": -11.300149917602539, "global_step": 288900, "epoch": 1719} {"train_loss": -11.749052047729492, "global_step": 288901, "epoch": 1719} {"train_loss": -11.517439842224121, "global_step": 288902, "epoch": 1719} {"train_loss": -10.827203750610352, "global_step": 288903, "epoch": 1719} {"train_loss": -11.161468505859375, "global_step": 288904, "epoch": 1719} {"train_loss": -11.739105224609375, "global_step": 288905, "epoch": 1719} {"train_loss": -10.411966323852539, "global_step": 288906, "epoch": 1719} {"train_loss": -11.828742027282715, "global_step": 288907, "epoch": 1719} {"train_loss": -11.437369346618652, "global_step": 288908, "epoch": 1719} {"train_loss": -11.24656867980957, "global_step": 288909, "epoch": 1719} {"train_loss": -11.083931922912598, "global_step": 288910, "epoch": 1719} {"train_loss": -11.24953842163086, "global_step": 288911, "epoch": 1719} {"train_loss": -10.14487361907959, "global_step": 288912, "epoch": 1719} {"train_loss": -11.755791664123535, "global_step": 288913, "epoch": 1719} {"train_loss": -10.356254577636719, "global_step": 288914, "epoch": 1719} {"train_loss": -9.698230743408203, "global_step": 288915, "epoch": 1719} {"train_loss": -11.384703636169434, "global_step": 288916, "epoch": 1719} {"train_loss": -9.804645538330078, "global_step": 288917, "epoch": 1719} {"train_loss": -9.503543853759766, "global_step": 288918, "epoch": 1719} {"train_loss": -11.368996620178223, "global_step": 288919, "epoch": 1719} {"train_loss": -9.175529479980469, "global_step": 288920, "epoch": 1719} {"train_loss": -10.741819381713867, "global_step": 288921, "epoch": 1719} {"train_loss": -9.936725616455078, "global_step": 288922, "epoch": 1719} {"train_loss": -9.967100143432617, "global_step": 288923, "epoch": 1719} {"train_loss": -10.57246208190918, "global_step": 288924, "epoch": 1719} {"train_loss": -10.24276351928711, "global_step": 288925, "epoch": 1719} {"train_loss": -10.169022560119629, "global_step": 288926, "epoch": 1719} {"train_loss": -10.809914588928223, "global_step": 288927, "epoch": 1719} {"train_loss": -10.650653839111328, "global_step": 288928, "epoch": 1719} {"train_loss": -11.047438621520996, "global_step": 288929, "epoch": 1719} {"train_loss": -11.177835464477539, "global_step": 288930, "epoch": 1719} {"train_loss": -10.984402656555176, "global_step": 288931, "epoch": 1719} {"train_loss": -11.645894050598145, "global_step": 288932, "epoch": 1719} {"train_loss": -10.804532051086426, "global_step": 288933, "epoch": 1719} {"train_loss": -11.364105224609375, "global_step": 288934, "epoch": 1719} {"train_loss": -11.552595138549805, "global_step": 288935, "epoch": 1719} {"train_loss": -11.664164543151855, "global_step": 288936, "epoch": 1719} {"train_loss": -11.551603317260742, "global_step": 288937, "epoch": 1719} {"train_loss": -11.702051162719727, "global_step": 288938, "epoch": 1719} {"train_loss": -11.730886459350586, "global_step": 288939, "epoch": 1719} {"train_loss": -12.035536766052246, "global_step": 288940, "epoch": 1719} {"train_loss": -11.980222702026367, "global_step": 288941, "epoch": 1719} {"train_loss": -11.84756851196289, "global_step": 288942, "epoch": 1719} {"train_loss": -11.724311828613281, "global_step": 288943, "epoch": 1719} {"train_loss": -11.91910171508789, "global_step": 288944, "epoch": 1719} {"train_loss": -11.966078758239746, "global_step": 288945, "epoch": 1719} {"train_loss": -12.056276321411133, "global_step": 288946, "epoch": 1719} {"train_loss": -11.856002807617188, "global_step": 288947, "epoch": 1719} {"train_loss": -11.940662384033203, "global_step": 288948, "epoch": 1719} {"train_loss": -12.070446014404297, "global_step": 288949, "epoch": 1719} {"train_loss": -11.93106460571289, "global_step": 288950, "epoch": 1719} {"train_loss": -12.079336166381836, "global_step": 288951, "epoch": 1719} {"train_loss": -12.029899597167969, "global_step": 288952, "epoch": 1719} {"train_loss": -12.132698059082031, "global_step": 288953, "epoch": 1719} {"train_loss": -12.024171829223633, "global_step": 288954, "epoch": 1719} {"train_loss": -12.022382736206055, "global_step": 288955, "epoch": 1719} {"train_loss": -12.220011711120605, "global_step": 288956, "epoch": 1719} {"train_loss": -12.100844383239746, "global_step": 288957, "epoch": 1719} {"train_loss": -12.117400169372559, "global_step": 288958, "epoch": 1719} {"train_loss": -11.723353437014989, "global_step": 288959, "epoch": 1719, "val_loss": 277835.40625} {"train_loss": -12.180435180664062, "global_step": 288960, "epoch": 1720} {"train_loss": -12.288331031799316, "global_step": 288961, "epoch": 1720} {"train_loss": -12.258552551269531, "global_step": 288962, "epoch": 1720} {"train_loss": -12.096185684204102, "global_step": 288963, "epoch": 1720} {"train_loss": -12.32087230682373, "global_step": 288964, "epoch": 1720} {"train_loss": -12.125819206237793, "global_step": 288965, "epoch": 1720} {"train_loss": -12.046012878417969, "global_step": 288966, "epoch": 1720} {"train_loss": -12.196809768676758, "global_step": 288967, "epoch": 1720} {"train_loss": -12.077703475952148, "global_step": 288968, "epoch": 1720} {"train_loss": -12.0034818649292, "global_step": 288969, "epoch": 1720} {"train_loss": -12.293573379516602, "global_step": 288970, "epoch": 1720} {"train_loss": -11.974201202392578, "global_step": 288971, "epoch": 1720} {"train_loss": -12.409261703491211, "global_step": 288972, "epoch": 1720} {"train_loss": -12.015632629394531, "global_step": 288973, "epoch": 1720} {"train_loss": -12.188932418823242, "global_step": 288974, "epoch": 1720} {"train_loss": -12.236566543579102, "global_step": 288975, "epoch": 1720} {"train_loss": -12.091485977172852, "global_step": 288976, "epoch": 1720} {"train_loss": -12.266615867614746, "global_step": 288977, "epoch": 1720} {"train_loss": -12.193593978881836, "global_step": 288978, "epoch": 1720} {"train_loss": -12.258811950683594, "global_step": 288979, "epoch": 1720} {"train_loss": -11.929344177246094, "global_step": 288980, "epoch": 1720} {"train_loss": -12.258429527282715, "global_step": 288981, "epoch": 1720} {"train_loss": -11.97452163696289, "global_step": 288982, "epoch": 1720} {"train_loss": -12.320765495300293, "global_step": 288983, "epoch": 1720} {"train_loss": -12.334964752197266, "global_step": 288984, "epoch": 1720} {"train_loss": -12.062484741210938, "global_step": 288985, "epoch": 1720} {"train_loss": -12.264792442321777, "global_step": 288986, "epoch": 1720} {"train_loss": -12.114191055297852, "global_step": 288987, "epoch": 1720} {"train_loss": -12.35153865814209, "global_step": 288988, "epoch": 1720} {"train_loss": -12.538591384887695, "global_step": 288989, "epoch": 1720} {"train_loss": -12.474374771118164, "global_step": 288990, "epoch": 1720} {"train_loss": -12.160123825073242, "global_step": 288991, "epoch": 1720} {"train_loss": -12.514154434204102, "global_step": 288992, "epoch": 1720} {"train_loss": -12.288009643554688, "global_step": 288993, "epoch": 1720} {"train_loss": -12.431181907653809, "global_step": 288994, "epoch": 1720} {"train_loss": -12.570012092590332, "global_step": 288995, "epoch": 1720} {"train_loss": -12.303590774536133, "global_step": 288996, "epoch": 1720} {"train_loss": -12.580269813537598, "global_step": 288997, "epoch": 1720} {"train_loss": -11.984769821166992, "global_step": 288998, "epoch": 1720} {"train_loss": -12.101541519165039, "global_step": 288999, "epoch": 1720} {"train_loss": -12.519109725952148, "global_step": 289000, "epoch": 1720} {"train_loss": -12.277854919433594, "global_step": 289001, "epoch": 1720} {"train_loss": -12.328367233276367, "global_step": 289002, "epoch": 1720} {"train_loss": -12.41335678100586, "global_step": 289003, "epoch": 1720} {"train_loss": -12.564536094665527, "global_step": 289004, "epoch": 1720} {"train_loss": -12.37668228149414, "global_step": 289005, "epoch": 1720} {"train_loss": -12.580841064453125, "global_step": 289006, "epoch": 1720} {"train_loss": -12.413362503051758, "global_step": 289007, "epoch": 1720} {"train_loss": -12.623979568481445, "global_step": 289008, "epoch": 1720} {"train_loss": -12.360267639160156, "global_step": 289009, "epoch": 1720} {"train_loss": -12.481643676757812, "global_step": 289010, "epoch": 1720} {"train_loss": -12.408845901489258, "global_step": 289011, "epoch": 1720} {"train_loss": -12.565906524658203, "global_step": 289012, "epoch": 1720} {"train_loss": -12.520956993103027, "global_step": 289013, "epoch": 1720} {"train_loss": -12.415599822998047, "global_step": 289014, "epoch": 1720} {"train_loss": -12.440053939819336, "global_step": 289015, "epoch": 1720} {"train_loss": -12.164612770080566, "global_step": 289016, "epoch": 1720} {"train_loss": -12.226482391357422, "global_step": 289017, "epoch": 1720} {"train_loss": -11.674722671508789, "global_step": 289018, "epoch": 1720} {"train_loss": -11.119430541992188, "global_step": 289019, "epoch": 1720} {"train_loss": -11.619643211364746, "global_step": 289020, "epoch": 1720} {"train_loss": -11.46147346496582, "global_step": 289021, "epoch": 1720} {"train_loss": -11.981649398803711, "global_step": 289022, "epoch": 1720} {"train_loss": -12.24502944946289, "global_step": 289023, "epoch": 1720} {"train_loss": -12.288167953491211, "global_step": 289024, "epoch": 1720} {"train_loss": -11.144186973571777, "global_step": 289025, "epoch": 1720} {"train_loss": -11.83856201171875, "global_step": 289026, "epoch": 1720} {"train_loss": -11.731790542602539, "global_step": 289027, "epoch": 1720} {"train_loss": -11.658651351928711, "global_step": 289028, "epoch": 1720} {"train_loss": -11.169910430908203, "global_step": 289029, "epoch": 1720} {"train_loss": -11.57206916809082, "global_step": 289030, "epoch": 1720} {"train_loss": -11.970573425292969, "global_step": 289031, "epoch": 1720} {"train_loss": -12.13587760925293, "global_step": 289032, "epoch": 1720} {"train_loss": -11.472574234008789, "global_step": 289033, "epoch": 1720} {"train_loss": -10.739948272705078, "global_step": 289034, "epoch": 1720} {"train_loss": -10.37730884552002, "global_step": 289035, "epoch": 1720} {"train_loss": -11.548038482666016, "global_step": 289036, "epoch": 1720} {"train_loss": -10.348331451416016, "global_step": 289037, "epoch": 1720} {"train_loss": -11.38870620727539, "global_step": 289038, "epoch": 1720} {"train_loss": -11.12225341796875, "global_step": 289039, "epoch": 1720} {"train_loss": -11.272674560546875, "global_step": 289040, "epoch": 1720} {"train_loss": -11.785820007324219, "global_step": 289041, "epoch": 1720} {"train_loss": -11.972369194030762, "global_step": 289042, "epoch": 1720} {"train_loss": -11.440388679504395, "global_step": 289043, "epoch": 1720} {"train_loss": -11.163710594177246, "global_step": 289044, "epoch": 1720} {"train_loss": -11.414746284484863, "global_step": 289045, "epoch": 1720} {"train_loss": -11.386523246765137, "global_step": 289046, "epoch": 1720} {"train_loss": -11.523195266723633, "global_step": 289047, "epoch": 1720} {"train_loss": -11.425359725952148, "global_step": 289048, "epoch": 1720} {"train_loss": -11.775289535522461, "global_step": 289049, "epoch": 1720} {"train_loss": -11.419550895690918, "global_step": 289050, "epoch": 1720} {"train_loss": -11.426125526428223, "global_step": 289051, "epoch": 1720} {"train_loss": -11.024145126342773, "global_step": 289052, "epoch": 1720} {"train_loss": -11.986939430236816, "global_step": 289053, "epoch": 1720} {"train_loss": -10.539739608764648, "global_step": 289054, "epoch": 1720} {"train_loss": -11.784549713134766, "global_step": 289055, "epoch": 1720} {"train_loss": -11.049072265625, "global_step": 289056, "epoch": 1720} {"train_loss": -11.246650695800781, "global_step": 289057, "epoch": 1720} {"train_loss": -11.636186599731445, "global_step": 289058, "epoch": 1720} {"train_loss": -11.77572250366211, "global_step": 289059, "epoch": 1720} {"train_loss": -11.633739471435547, "global_step": 289060, "epoch": 1720} {"train_loss": -11.687196731567383, "global_step": 289061, "epoch": 1720} {"train_loss": -11.96029281616211, "global_step": 289062, "epoch": 1720} {"train_loss": -11.87967586517334, "global_step": 289063, "epoch": 1720} {"train_loss": -11.629806518554688, "global_step": 289064, "epoch": 1720} {"train_loss": -12.038661003112793, "global_step": 289065, "epoch": 1720} {"train_loss": -11.5748291015625, "global_step": 289066, "epoch": 1720} {"train_loss": -11.451183319091797, "global_step": 289067, "epoch": 1720} {"train_loss": -11.660096168518066, "global_step": 289068, "epoch": 1720} {"train_loss": -11.8125581741333, "global_step": 289069, "epoch": 1720} {"train_loss": -11.11553955078125, "global_step": 289070, "epoch": 1720} {"train_loss": -11.101583480834961, "global_step": 289071, "epoch": 1720} {"train_loss": -11.950662612915039, "global_step": 289072, "epoch": 1720} {"train_loss": -11.309537887573242, "global_step": 289073, "epoch": 1720} {"train_loss": -12.385963439941406, "global_step": 289074, "epoch": 1720} {"train_loss": -11.811159133911133, "global_step": 289075, "epoch": 1720} {"train_loss": -12.29539680480957, "global_step": 289076, "epoch": 1720} {"train_loss": -12.016756057739258, "global_step": 289077, "epoch": 1720} {"train_loss": -11.966318130493164, "global_step": 289078, "epoch": 1720} {"train_loss": -11.948701858520508, "global_step": 289079, "epoch": 1720} {"train_loss": -11.853034973144531, "global_step": 289080, "epoch": 1720} {"train_loss": -12.291391372680664, "global_step": 289081, "epoch": 1720} {"train_loss": -11.699283599853516, "global_step": 289082, "epoch": 1720} {"train_loss": -11.884857177734375, "global_step": 289083, "epoch": 1720} {"train_loss": -11.615407943725586, "global_step": 289084, "epoch": 1720} {"train_loss": -12.145757675170898, "global_step": 289085, "epoch": 1720} {"train_loss": -12.001175880432129, "global_step": 289086, "epoch": 1720} {"train_loss": -11.949681282043457, "global_step": 289087, "epoch": 1720} {"train_loss": -12.09906005859375, "global_step": 289088, "epoch": 1720} {"train_loss": -11.923511505126953, "global_step": 289089, "epoch": 1720} {"train_loss": -11.919988632202148, "global_step": 289090, "epoch": 1720} {"train_loss": -11.926212310791016, "global_step": 289091, "epoch": 1720} {"train_loss": -11.853412628173828, "global_step": 289092, "epoch": 1720} {"train_loss": -11.299267768859863, "global_step": 289093, "epoch": 1720} {"train_loss": -12.340089797973633, "global_step": 289094, "epoch": 1720} {"train_loss": -11.461201667785645, "global_step": 289095, "epoch": 1720} {"train_loss": -12.113429069519043, "global_step": 289096, "epoch": 1720} {"train_loss": -11.679207801818848, "global_step": 289097, "epoch": 1720} {"train_loss": -11.792604446411133, "global_step": 289098, "epoch": 1720} {"train_loss": -11.879302978515625, "global_step": 289099, "epoch": 1720} {"train_loss": -12.124310493469238, "global_step": 289100, "epoch": 1720} {"train_loss": -11.703978538513184, "global_step": 289101, "epoch": 1720} {"train_loss": -12.262206077575684, "global_step": 289102, "epoch": 1720} {"train_loss": -12.18993091583252, "global_step": 289103, "epoch": 1720} {"train_loss": -11.867476463317871, "global_step": 289104, "epoch": 1720} {"train_loss": -12.090129852294922, "global_step": 289105, "epoch": 1720} {"train_loss": -12.151902198791504, "global_step": 289106, "epoch": 1720} {"train_loss": -12.139763832092285, "global_step": 289107, "epoch": 1720} {"train_loss": -12.113068580627441, "global_step": 289108, "epoch": 1720} {"train_loss": -12.277680397033691, "global_step": 289109, "epoch": 1720} {"train_loss": -12.231048583984375, "global_step": 289110, "epoch": 1720} {"train_loss": -12.038737297058105, "global_step": 289111, "epoch": 1720} {"train_loss": -12.377124786376953, "global_step": 289112, "epoch": 1720} {"train_loss": -11.901540756225586, "global_step": 289113, "epoch": 1720} {"train_loss": -12.05750846862793, "global_step": 289114, "epoch": 1720} {"train_loss": -12.034364700317383, "global_step": 289115, "epoch": 1720} {"train_loss": -11.760733604431152, "global_step": 289116, "epoch": 1720} {"train_loss": -11.959277153015137, "global_step": 289117, "epoch": 1720} {"train_loss": -11.606411933898926, "global_step": 289118, "epoch": 1720} {"train_loss": -11.014923095703125, "global_step": 289119, "epoch": 1720} {"train_loss": -11.90861701965332, "global_step": 289120, "epoch": 1720} {"train_loss": -11.070700645446777, "global_step": 289121, "epoch": 1720} {"train_loss": -10.957871437072754, "global_step": 289122, "epoch": 1720} {"train_loss": -11.37398910522461, "global_step": 289123, "epoch": 1720} {"train_loss": -11.035009384155273, "global_step": 289124, "epoch": 1720} {"train_loss": -11.040578842163086, "global_step": 289125, "epoch": 1720} {"train_loss": -11.694731712341309, "global_step": 289126, "epoch": 1720} {"train_loss": -11.891901470365978, "global_step": 289127, "epoch": 1720, "val_loss": 275964.65625, "train_action_mse_error": 3.2317686080932617} {"train_loss": -11.770267486572266, "global_step": 289128, "epoch": 1721} {"train_loss": -11.517990112304688, "global_step": 289129, "epoch": 1721} {"train_loss": -11.76608657836914, "global_step": 289130, "epoch": 1721} {"train_loss": -10.941221237182617, "global_step": 289131, "epoch": 1721} {"train_loss": -12.175582885742188, "global_step": 289132, "epoch": 1721} {"train_loss": -10.939266204833984, "global_step": 289133, "epoch": 1721} {"train_loss": -11.928832054138184, "global_step": 289134, "epoch": 1721} {"train_loss": -11.064299583435059, "global_step": 289135, "epoch": 1721} {"train_loss": -11.344610214233398, "global_step": 289136, "epoch": 1721} {"train_loss": -11.496685028076172, "global_step": 289137, "epoch": 1721} {"train_loss": -11.733625411987305, "global_step": 289138, "epoch": 1721} {"train_loss": -11.598758697509766, "global_step": 289139, "epoch": 1721} {"train_loss": -11.81922721862793, "global_step": 289140, "epoch": 1721} {"train_loss": -11.933624267578125, "global_step": 289141, "epoch": 1721} {"train_loss": -11.59810733795166, "global_step": 289142, "epoch": 1721} {"train_loss": -11.661080360412598, "global_step": 289143, "epoch": 1721} {"train_loss": -11.51828384399414, "global_step": 289144, "epoch": 1721} {"train_loss": -12.001441955566406, "global_step": 289145, "epoch": 1721} {"train_loss": -11.988204956054688, "global_step": 289146, "epoch": 1721} {"train_loss": -12.306900024414062, "global_step": 289147, "epoch": 1721} {"train_loss": -12.033434867858887, "global_step": 289148, "epoch": 1721} {"train_loss": -12.017477989196777, "global_step": 289149, "epoch": 1721} {"train_loss": -11.897343635559082, "global_step": 289150, "epoch": 1721} {"train_loss": -12.089463233947754, "global_step": 289151, "epoch": 1721} {"train_loss": -11.906399726867676, "global_step": 289152, "epoch": 1721} {"train_loss": -12.229694366455078, "global_step": 289153, "epoch": 1721} {"train_loss": -11.98989486694336, "global_step": 289154, "epoch": 1721} {"train_loss": -12.176513671875, "global_step": 289155, "epoch": 1721} {"train_loss": -12.16541862487793, "global_step": 289156, "epoch": 1721} {"train_loss": -11.972143173217773, "global_step": 289157, "epoch": 1721} {"train_loss": -12.103418350219727, "global_step": 289158, "epoch": 1721} {"train_loss": -12.34054183959961, "global_step": 289159, "epoch": 1721} {"train_loss": -11.934333801269531, "global_step": 289160, "epoch": 1721} {"train_loss": -11.338737487792969, "global_step": 289161, "epoch": 1721} {"train_loss": -12.308053970336914, "global_step": 289162, "epoch": 1721} {"train_loss": -11.517318725585938, "global_step": 289163, "epoch": 1721} {"train_loss": -11.644293785095215, "global_step": 289164, "epoch": 1721} {"train_loss": -11.878179550170898, "global_step": 289165, "epoch": 1721} {"train_loss": -12.045366287231445, "global_step": 289166, "epoch": 1721} {"train_loss": -11.687115669250488, "global_step": 289167, "epoch": 1721} {"train_loss": -11.83273696899414, "global_step": 289168, "epoch": 1721} {"train_loss": -11.340932846069336, "global_step": 289169, "epoch": 1721} {"train_loss": -11.44888687133789, "global_step": 289170, "epoch": 1721} {"train_loss": -10.774128913879395, "global_step": 289171, "epoch": 1721} {"train_loss": -10.56943130493164, "global_step": 289172, "epoch": 1721} {"train_loss": -11.094961166381836, "global_step": 289173, "epoch": 1721} {"train_loss": -11.037595748901367, "global_step": 289174, "epoch": 1721} {"train_loss": -11.258129119873047, "global_step": 289175, "epoch": 1721} {"train_loss": -10.046838760375977, "global_step": 289176, "epoch": 1721} {"train_loss": -11.358043670654297, "global_step": 289177, "epoch": 1721} {"train_loss": -11.033862113952637, "global_step": 289178, "epoch": 1721} {"train_loss": -11.230120658874512, "global_step": 289179, "epoch": 1721} {"train_loss": -11.843208312988281, "global_step": 289180, "epoch": 1721} {"train_loss": -11.148704528808594, "global_step": 289181, "epoch": 1721} {"train_loss": -11.45099925994873, "global_step": 289182, "epoch": 1721} {"train_loss": -11.540863990783691, "global_step": 289183, "epoch": 1721} {"train_loss": -12.030831336975098, "global_step": 289184, "epoch": 1721} {"train_loss": -11.549619674682617, "global_step": 289185, "epoch": 1721} {"train_loss": -11.820267677307129, "global_step": 289186, "epoch": 1721} {"train_loss": -11.97533130645752, "global_step": 289187, "epoch": 1721} {"train_loss": -11.99963665008545, "global_step": 289188, "epoch": 1721} {"train_loss": -12.063189506530762, "global_step": 289189, "epoch": 1721} {"train_loss": -12.155413627624512, "global_step": 289190, "epoch": 1721} {"train_loss": -12.019109725952148, "global_step": 289191, "epoch": 1721} {"train_loss": -12.011083602905273, "global_step": 289192, "epoch": 1721} {"train_loss": -12.260734558105469, "global_step": 289193, "epoch": 1721} {"train_loss": -12.048870086669922, "global_step": 289194, "epoch": 1721} {"train_loss": -12.149003982543945, "global_step": 289195, "epoch": 1721} {"train_loss": -12.096586227416992, "global_step": 289196, "epoch": 1721} {"train_loss": -12.273250579833984, "global_step": 289197, "epoch": 1721} {"train_loss": -12.17402458190918, "global_step": 289198, "epoch": 1721} {"train_loss": -12.222105026245117, "global_step": 289199, "epoch": 1721} {"train_loss": -12.107078552246094, "global_step": 289200, "epoch": 1721} {"train_loss": -12.136459350585938, "global_step": 289201, "epoch": 1721} {"train_loss": -12.044296264648438, "global_step": 289202, "epoch": 1721} {"train_loss": -12.186637878417969, "global_step": 289203, "epoch": 1721} {"train_loss": -12.124773025512695, "global_step": 289204, "epoch": 1721} {"train_loss": -12.109506607055664, "global_step": 289205, "epoch": 1721} {"train_loss": -12.192972183227539, "global_step": 289206, "epoch": 1721} {"train_loss": -12.110267639160156, "global_step": 289207, "epoch": 1721} {"train_loss": -12.166778564453125, "global_step": 289208, "epoch": 1721} {"train_loss": -11.902990341186523, "global_step": 289209, "epoch": 1721} {"train_loss": -12.042789459228516, "global_step": 289210, "epoch": 1721} {"train_loss": -12.183162689208984, "global_step": 289211, "epoch": 1721} {"train_loss": -12.120119094848633, "global_step": 289212, "epoch": 1721} {"train_loss": -11.864324569702148, "global_step": 289213, "epoch": 1721} {"train_loss": -12.08610725402832, "global_step": 289214, "epoch": 1721} {"train_loss": -12.220365524291992, "global_step": 289215, "epoch": 1721} {"train_loss": -12.238497734069824, "global_step": 289216, "epoch": 1721} {"train_loss": -11.909046173095703, "global_step": 289217, "epoch": 1721} {"train_loss": -12.119990348815918, "global_step": 289218, "epoch": 1721} {"train_loss": -12.002938270568848, "global_step": 289219, "epoch": 1721} {"train_loss": -12.114641189575195, "global_step": 289220, "epoch": 1721} {"train_loss": -12.222768783569336, "global_step": 289221, "epoch": 1721} {"train_loss": -11.883472442626953, "global_step": 289222, "epoch": 1721} {"train_loss": -12.139902114868164, "global_step": 289223, "epoch": 1721} {"train_loss": -12.0509614944458, "global_step": 289224, "epoch": 1721} {"train_loss": -11.998828887939453, "global_step": 289225, "epoch": 1721} {"train_loss": -12.331066131591797, "global_step": 289226, "epoch": 1721} {"train_loss": -12.045284271240234, "global_step": 289227, "epoch": 1721} {"train_loss": -11.530965805053711, "global_step": 289228, "epoch": 1721} {"train_loss": -11.94504165649414, "global_step": 289229, "epoch": 1721} {"train_loss": -11.622005462646484, "global_step": 289230, "epoch": 1721} {"train_loss": -11.329312324523926, "global_step": 289231, "epoch": 1721} {"train_loss": -10.909588813781738, "global_step": 289232, "epoch": 1721} {"train_loss": -12.008964538574219, "global_step": 289233, "epoch": 1721} {"train_loss": -10.871635437011719, "global_step": 289234, "epoch": 1721} {"train_loss": -11.334935188293457, "global_step": 289235, "epoch": 1721} {"train_loss": -11.824291229248047, "global_step": 289236, "epoch": 1721} {"train_loss": -10.819323539733887, "global_step": 289237, "epoch": 1721} {"train_loss": -12.055768013000488, "global_step": 289238, "epoch": 1721} {"train_loss": -11.209718704223633, "global_step": 289239, "epoch": 1721} {"train_loss": -10.766098976135254, "global_step": 289240, "epoch": 1721} {"train_loss": -11.776012420654297, "global_step": 289241, "epoch": 1721} {"train_loss": -11.371746063232422, "global_step": 289242, "epoch": 1721} {"train_loss": -12.194235801696777, "global_step": 289243, "epoch": 1721} {"train_loss": -11.563886642456055, "global_step": 289244, "epoch": 1721} {"train_loss": -11.633405685424805, "global_step": 289245, "epoch": 1721} {"train_loss": -11.806299209594727, "global_step": 289246, "epoch": 1721} {"train_loss": -11.75840950012207, "global_step": 289247, "epoch": 1721} {"train_loss": -11.969189643859863, "global_step": 289248, "epoch": 1721} {"train_loss": -11.977296829223633, "global_step": 289249, "epoch": 1721} {"train_loss": -12.084203720092773, "global_step": 289250, "epoch": 1721} {"train_loss": -11.836910247802734, "global_step": 289251, "epoch": 1721} {"train_loss": -11.746254920959473, "global_step": 289252, "epoch": 1721} {"train_loss": -11.881954193115234, "global_step": 289253, "epoch": 1721} {"train_loss": -11.941413879394531, "global_step": 289254, "epoch": 1721} {"train_loss": -11.069087982177734, "global_step": 289255, "epoch": 1721} {"train_loss": -11.737194061279297, "global_step": 289256, "epoch": 1721} {"train_loss": -11.161032676696777, "global_step": 289257, "epoch": 1721} {"train_loss": -10.11993408203125, "global_step": 289258, "epoch": 1721} {"train_loss": -11.844860076904297, "global_step": 289259, "epoch": 1721} {"train_loss": -10.488715171813965, "global_step": 289260, "epoch": 1721} {"train_loss": -10.749356269836426, "global_step": 289261, "epoch": 1721} {"train_loss": -10.006840705871582, "global_step": 289262, "epoch": 1721} {"train_loss": -9.787511825561523, "global_step": 289263, "epoch": 1721} {"train_loss": -10.602174758911133, "global_step": 289264, "epoch": 1721} {"train_loss": -10.592870712280273, "global_step": 289265, "epoch": 1721} {"train_loss": -9.868904113769531, "global_step": 289266, "epoch": 1721} {"train_loss": -10.206914901733398, "global_step": 289267, "epoch": 1721} {"train_loss": -9.889497756958008, "global_step": 289268, "epoch": 1721} {"train_loss": -11.217828750610352, "global_step": 289269, "epoch": 1721} {"train_loss": -9.723681449890137, "global_step": 289270, "epoch": 1721} {"train_loss": -10.231093406677246, "global_step": 289271, "epoch": 1721} {"train_loss": -10.865945816040039, "global_step": 289272, "epoch": 1721} {"train_loss": -10.195919036865234, "global_step": 289273, "epoch": 1721} {"train_loss": -10.621997833251953, "global_step": 289274, "epoch": 1721} {"train_loss": -10.855193138122559, "global_step": 289275, "epoch": 1721} {"train_loss": -10.131591796875, "global_step": 289276, "epoch": 1721} {"train_loss": -10.102592468261719, "global_step": 289277, "epoch": 1721} {"train_loss": -11.509675979614258, "global_step": 289278, "epoch": 1721} {"train_loss": -10.304058074951172, "global_step": 289279, "epoch": 1721} {"train_loss": -11.197612762451172, "global_step": 289280, "epoch": 1721} {"train_loss": -11.053765296936035, "global_step": 289281, "epoch": 1721} {"train_loss": -10.58245849609375, "global_step": 289282, "epoch": 1721} {"train_loss": -11.360860824584961, "global_step": 289283, "epoch": 1721} {"train_loss": -11.125009536743164, "global_step": 289284, "epoch": 1721} {"train_loss": -11.387665748596191, "global_step": 289285, "epoch": 1721} {"train_loss": -11.414186477661133, "global_step": 289286, "epoch": 1721} {"train_loss": -11.476807594299316, "global_step": 289287, "epoch": 1721} {"train_loss": -11.370894432067871, "global_step": 289288, "epoch": 1721} {"train_loss": -11.828567504882812, "global_step": 289289, "epoch": 1721} {"train_loss": -11.714412689208984, "global_step": 289290, "epoch": 1721} {"train_loss": -11.620503425598145, "global_step": 289291, "epoch": 1721} {"train_loss": -11.598491668701172, "global_step": 289292, "epoch": 1721} {"train_loss": -11.718412399291992, "global_step": 289293, "epoch": 1721} {"train_loss": -11.743091583251953, "global_step": 289294, "epoch": 1721} {"train_loss": -11.56728971004486, "global_step": 289295, "epoch": 1721, "val_loss": 275248.8125} {"train_loss": -11.495007514953613, "global_step": 289296, "epoch": 1722} {"train_loss": -11.892176628112793, "global_step": 289297, "epoch": 1722} {"train_loss": -11.457962989807129, "global_step": 289298, "epoch": 1722} {"train_loss": -11.84490966796875, "global_step": 289299, "epoch": 1722} {"train_loss": -11.705879211425781, "global_step": 289300, "epoch": 1722} {"train_loss": -11.777993202209473, "global_step": 289301, "epoch": 1722} {"train_loss": -11.894264221191406, "global_step": 289302, "epoch": 1722} {"train_loss": -11.696006774902344, "global_step": 289303, "epoch": 1722} {"train_loss": -11.88454532623291, "global_step": 289304, "epoch": 1722} {"train_loss": -11.979684829711914, "global_step": 289305, "epoch": 1722} {"train_loss": -12.06817626953125, "global_step": 289306, "epoch": 1722} {"train_loss": -12.007989883422852, "global_step": 289307, "epoch": 1722} {"train_loss": -12.286458969116211, "global_step": 289308, "epoch": 1722} {"train_loss": -11.87651252746582, "global_step": 289309, "epoch": 1722} {"train_loss": -11.986947059631348, "global_step": 289310, "epoch": 1722} {"train_loss": -12.010396957397461, "global_step": 289311, "epoch": 1722} {"train_loss": -11.936948776245117, "global_step": 289312, "epoch": 1722} {"train_loss": -12.197135925292969, "global_step": 289313, "epoch": 1722} {"train_loss": -12.176549911499023, "global_step": 289314, "epoch": 1722} {"train_loss": -12.00313663482666, "global_step": 289315, "epoch": 1722} {"train_loss": -12.175479888916016, "global_step": 289316, "epoch": 1722} {"train_loss": -12.194764137268066, "global_step": 289317, "epoch": 1722} {"train_loss": -12.233407974243164, "global_step": 289318, "epoch": 1722} {"train_loss": -11.875351905822754, "global_step": 289319, "epoch": 1722} {"train_loss": -12.15048599243164, "global_step": 289320, "epoch": 1722} {"train_loss": -11.979408264160156, "global_step": 289321, "epoch": 1722} {"train_loss": -12.257741928100586, "global_step": 289322, "epoch": 1722} {"train_loss": -12.163468360900879, "global_step": 289323, "epoch": 1722} {"train_loss": -12.201715469360352, "global_step": 289324, "epoch": 1722} {"train_loss": -11.88579273223877, "global_step": 289325, "epoch": 1722} {"train_loss": -12.18339729309082, "global_step": 289326, "epoch": 1722} {"train_loss": -12.117766380310059, "global_step": 289327, "epoch": 1722} {"train_loss": -12.083627700805664, "global_step": 289328, "epoch": 1722} {"train_loss": -12.101858139038086, "global_step": 289329, "epoch": 1722} {"train_loss": -12.273193359375, "global_step": 289330, "epoch": 1722} {"train_loss": -12.149293899536133, "global_step": 289331, "epoch": 1722} {"train_loss": -11.939772605895996, "global_step": 289332, "epoch": 1722} {"train_loss": -11.849072456359863, "global_step": 289333, "epoch": 1722} {"train_loss": -12.008625030517578, "global_step": 289334, "epoch": 1722} {"train_loss": -12.048462867736816, "global_step": 289335, "epoch": 1722} {"train_loss": -12.178412437438965, "global_step": 289336, "epoch": 1722} {"train_loss": -11.94939136505127, "global_step": 289337, "epoch": 1722} {"train_loss": -12.352641105651855, "global_step": 289338, "epoch": 1722} {"train_loss": -12.010008811950684, "global_step": 289339, "epoch": 1722} {"train_loss": -11.609066009521484, "global_step": 289340, "epoch": 1722} {"train_loss": -12.268950462341309, "global_step": 289341, "epoch": 1722} {"train_loss": -11.599042892456055, "global_step": 289342, "epoch": 1722} {"train_loss": -12.307024002075195, "global_step": 289343, "epoch": 1722} {"train_loss": -11.625846862792969, "global_step": 289344, "epoch": 1722} {"train_loss": -12.21406078338623, "global_step": 289345, "epoch": 1722} {"train_loss": -11.725967407226562, "global_step": 289346, "epoch": 1722} {"train_loss": -11.867927551269531, "global_step": 289347, "epoch": 1722} {"train_loss": -11.942951202392578, "global_step": 289348, "epoch": 1722} {"train_loss": -11.976837158203125, "global_step": 289349, "epoch": 1722} {"train_loss": -12.093507766723633, "global_step": 289350, "epoch": 1722} {"train_loss": -12.029199600219727, "global_step": 289351, "epoch": 1722} {"train_loss": -11.855033874511719, "global_step": 289352, "epoch": 1722} {"train_loss": -12.323423385620117, "global_step": 289353, "epoch": 1722} {"train_loss": -12.39290714263916, "global_step": 289354, "epoch": 1722} {"train_loss": -11.89445686340332, "global_step": 289355, "epoch": 1722} {"train_loss": -12.132477760314941, "global_step": 289356, "epoch": 1722} {"train_loss": -12.238349914550781, "global_step": 289357, "epoch": 1722} {"train_loss": -11.937522888183594, "global_step": 289358, "epoch": 1722} {"train_loss": -11.88667106628418, "global_step": 289359, "epoch": 1722} {"train_loss": -11.966730117797852, "global_step": 289360, "epoch": 1722} {"train_loss": -12.11280632019043, "global_step": 289361, "epoch": 1722} {"train_loss": -11.595314979553223, "global_step": 289362, "epoch": 1722} {"train_loss": -11.710868835449219, "global_step": 289363, "epoch": 1722} {"train_loss": -12.073308944702148, "global_step": 289364, "epoch": 1722} {"train_loss": -11.893779754638672, "global_step": 289365, "epoch": 1722} {"train_loss": -11.597162246704102, "global_step": 289366, "epoch": 1722} {"train_loss": -11.351005554199219, "global_step": 289367, "epoch": 1722} {"train_loss": -11.701801300048828, "global_step": 289368, "epoch": 1722} {"train_loss": -11.829109191894531, "global_step": 289369, "epoch": 1722} {"train_loss": -11.629262924194336, "global_step": 289370, "epoch": 1722} {"train_loss": -12.025899887084961, "global_step": 289371, "epoch": 1722} {"train_loss": -11.865543365478516, "global_step": 289372, "epoch": 1722} {"train_loss": -12.157129287719727, "global_step": 289373, "epoch": 1722} {"train_loss": -12.259567260742188, "global_step": 289374, "epoch": 1722} {"train_loss": -11.997940063476562, "global_step": 289375, "epoch": 1722} {"train_loss": -11.899759292602539, "global_step": 289376, "epoch": 1722} {"train_loss": -11.949971199035645, "global_step": 289377, "epoch": 1722} {"train_loss": -12.344989776611328, "global_step": 289378, "epoch": 1722} {"train_loss": -12.04934310913086, "global_step": 289379, "epoch": 1722} {"train_loss": -11.8687744140625, "global_step": 289380, "epoch": 1722} {"train_loss": -11.938238143920898, "global_step": 289381, "epoch": 1722} {"train_loss": -11.39675235748291, "global_step": 289382, "epoch": 1722} {"train_loss": -11.220684051513672, "global_step": 289383, "epoch": 1722} {"train_loss": -11.70002555847168, "global_step": 289384, "epoch": 1722} {"train_loss": -10.723553657531738, "global_step": 289385, "epoch": 1722} {"train_loss": -11.320724487304688, "global_step": 289386, "epoch": 1722} {"train_loss": -11.600244522094727, "global_step": 289387, "epoch": 1722} {"train_loss": -11.57650089263916, "global_step": 289388, "epoch": 1722} {"train_loss": -10.937934875488281, "global_step": 289389, "epoch": 1722} {"train_loss": -11.708532333374023, "global_step": 289390, "epoch": 1722} {"train_loss": -11.521780014038086, "global_step": 289391, "epoch": 1722} {"train_loss": -11.249374389648438, "global_step": 289392, "epoch": 1722} {"train_loss": -11.333741188049316, "global_step": 289393, "epoch": 1722} {"train_loss": -11.77330493927002, "global_step": 289394, "epoch": 1722} {"train_loss": -11.712961196899414, "global_step": 289395, "epoch": 1722} {"train_loss": -11.96937370300293, "global_step": 289396, "epoch": 1722} {"train_loss": -11.711851119995117, "global_step": 289397, "epoch": 1722} {"train_loss": -11.601661682128906, "global_step": 289398, "epoch": 1722} {"train_loss": -11.591861724853516, "global_step": 289399, "epoch": 1722} {"train_loss": -11.811996459960938, "global_step": 289400, "epoch": 1722} {"train_loss": -11.71403694152832, "global_step": 289401, "epoch": 1722} {"train_loss": -11.885690689086914, "global_step": 289402, "epoch": 1722} {"train_loss": -11.693197250366211, "global_step": 289403, "epoch": 1722} {"train_loss": -11.739255905151367, "global_step": 289404, "epoch": 1722} {"train_loss": -11.710026741027832, "global_step": 289405, "epoch": 1722} {"train_loss": -12.059617042541504, "global_step": 289406, "epoch": 1722} {"train_loss": -11.67497444152832, "global_step": 289407, "epoch": 1722} {"train_loss": -11.891189575195312, "global_step": 289408, "epoch": 1722} {"train_loss": -12.146093368530273, "global_step": 289409, "epoch": 1722} {"train_loss": -11.998319625854492, "global_step": 289410, "epoch": 1722} {"train_loss": -12.368924140930176, "global_step": 289411, "epoch": 1722} {"train_loss": -11.708959579467773, "global_step": 289412, "epoch": 1722} {"train_loss": -11.888113975524902, "global_step": 289413, "epoch": 1722} {"train_loss": -11.979668617248535, "global_step": 289414, "epoch": 1722} {"train_loss": -11.824219703674316, "global_step": 289415, "epoch": 1722} {"train_loss": -11.99014949798584, "global_step": 289416, "epoch": 1722} {"train_loss": -12.104313850402832, "global_step": 289417, "epoch": 1722} {"train_loss": -11.87967300415039, "global_step": 289418, "epoch": 1722} {"train_loss": -11.96232795715332, "global_step": 289419, "epoch": 1722} {"train_loss": -12.084314346313477, "global_step": 289420, "epoch": 1722} {"train_loss": -11.883140563964844, "global_step": 289421, "epoch": 1722} {"train_loss": -12.269298553466797, "global_step": 289422, "epoch": 1722} {"train_loss": -11.925994873046875, "global_step": 289423, "epoch": 1722} {"train_loss": -11.993500709533691, "global_step": 289424, "epoch": 1722} {"train_loss": -11.883828163146973, "global_step": 289425, "epoch": 1722} {"train_loss": -12.36754322052002, "global_step": 289426, "epoch": 1722} {"train_loss": -11.982208251953125, "global_step": 289427, "epoch": 1722} {"train_loss": -12.389796257019043, "global_step": 289428, "epoch": 1722} {"train_loss": -12.180168151855469, "global_step": 289429, "epoch": 1722} {"train_loss": -12.355895042419434, "global_step": 289430, "epoch": 1722} {"train_loss": -11.858680725097656, "global_step": 289431, "epoch": 1722} {"train_loss": -12.246543884277344, "global_step": 289432, "epoch": 1722} {"train_loss": -11.824384689331055, "global_step": 289433, "epoch": 1722} {"train_loss": -12.09034252166748, "global_step": 289434, "epoch": 1722} {"train_loss": -12.163043022155762, "global_step": 289435, "epoch": 1722} {"train_loss": -12.019879341125488, "global_step": 289436, "epoch": 1722} {"train_loss": -11.914302825927734, "global_step": 289437, "epoch": 1722} {"train_loss": -12.42678165435791, "global_step": 289438, "epoch": 1722} {"train_loss": -12.090400695800781, "global_step": 289439, "epoch": 1722} {"train_loss": -11.97513484954834, "global_step": 289440, "epoch": 1722} {"train_loss": -11.863683700561523, "global_step": 289441, "epoch": 1722} {"train_loss": -12.275598526000977, "global_step": 289442, "epoch": 1722} {"train_loss": -12.286569595336914, "global_step": 289443, "epoch": 1722} {"train_loss": -12.108458518981934, "global_step": 289444, "epoch": 1722} {"train_loss": -12.192280769348145, "global_step": 289445, "epoch": 1722} {"train_loss": -12.186503410339355, "global_step": 289446, "epoch": 1722} {"train_loss": -12.263575553894043, "global_step": 289447, "epoch": 1722} {"train_loss": -11.31761646270752, "global_step": 289448, "epoch": 1722} {"train_loss": -12.368415832519531, "global_step": 289449, "epoch": 1722} {"train_loss": -11.300737380981445, "global_step": 289450, "epoch": 1722} {"train_loss": -11.672786712646484, "global_step": 289451, "epoch": 1722} {"train_loss": -10.998671531677246, "global_step": 289452, "epoch": 1722} {"train_loss": -12.015464782714844, "global_step": 289453, "epoch": 1722} {"train_loss": -11.522628784179688, "global_step": 289454, "epoch": 1722} {"train_loss": -11.406526565551758, "global_step": 289455, "epoch": 1722} {"train_loss": -11.922563552856445, "global_step": 289456, "epoch": 1722} {"train_loss": -11.366601943969727, "global_step": 289457, "epoch": 1722} {"train_loss": -11.216400146484375, "global_step": 289458, "epoch": 1722} {"train_loss": -11.060138702392578, "global_step": 289459, "epoch": 1722} {"train_loss": -12.238668441772461, "global_step": 289460, "epoch": 1722} {"train_loss": -11.171887397766113, "global_step": 289461, "epoch": 1722} {"train_loss": -11.417112350463867, "global_step": 289462, "epoch": 1722} {"train_loss": -11.89702072030022, "global_step": 289463, "epoch": 1722, "val_loss": 278812.3125} {"train_loss": -11.56203842163086, "global_step": 289464, "epoch": 1723} {"train_loss": -11.815321922302246, "global_step": 289465, "epoch": 1723} {"train_loss": -11.735901832580566, "global_step": 289466, "epoch": 1723} {"train_loss": -11.628274917602539, "global_step": 289467, "epoch": 1723} {"train_loss": -11.854629516601562, "global_step": 289468, "epoch": 1723} {"train_loss": -11.730432510375977, "global_step": 289469, "epoch": 1723} {"train_loss": -12.53548526763916, "global_step": 289470, "epoch": 1723} {"train_loss": -11.788433074951172, "global_step": 289471, "epoch": 1723} {"train_loss": -11.878168106079102, "global_step": 289472, "epoch": 1723} {"train_loss": -11.746788024902344, "global_step": 289473, "epoch": 1723} {"train_loss": -11.904996871948242, "global_step": 289474, "epoch": 1723} {"train_loss": -12.22616958618164, "global_step": 289475, "epoch": 1723} {"train_loss": -11.374273300170898, "global_step": 289476, "epoch": 1723} {"train_loss": -12.244548797607422, "global_step": 289477, "epoch": 1723} {"train_loss": -11.982040405273438, "global_step": 289478, "epoch": 1723} {"train_loss": -12.016487121582031, "global_step": 289479, "epoch": 1723} {"train_loss": -11.599959373474121, "global_step": 289480, "epoch": 1723} {"train_loss": -11.946186065673828, "global_step": 289481, "epoch": 1723} {"train_loss": -11.543593406677246, "global_step": 289482, "epoch": 1723} {"train_loss": -11.942949295043945, "global_step": 289483, "epoch": 1723} {"train_loss": -12.31421947479248, "global_step": 289484, "epoch": 1723} {"train_loss": -11.775522232055664, "global_step": 289485, "epoch": 1723} {"train_loss": -12.393769264221191, "global_step": 289486, "epoch": 1723} {"train_loss": -11.753329277038574, "global_step": 289487, "epoch": 1723} {"train_loss": -12.047733306884766, "global_step": 289488, "epoch": 1723} {"train_loss": -12.028564453125, "global_step": 289489, "epoch": 1723} {"train_loss": -12.062849998474121, "global_step": 289490, "epoch": 1723} {"train_loss": -11.924105644226074, "global_step": 289491, "epoch": 1723} {"train_loss": -11.986818313598633, "global_step": 289492, "epoch": 1723} {"train_loss": -12.053980827331543, "global_step": 289493, "epoch": 1723} {"train_loss": -12.099248886108398, "global_step": 289494, "epoch": 1723} {"train_loss": -11.8759765625, "global_step": 289495, "epoch": 1723} {"train_loss": -11.54175090789795, "global_step": 289496, "epoch": 1723} {"train_loss": -12.299236297607422, "global_step": 289497, "epoch": 1723} {"train_loss": -11.902349472045898, "global_step": 289498, "epoch": 1723} {"train_loss": -12.196986198425293, "global_step": 289499, "epoch": 1723} {"train_loss": -11.856618881225586, "global_step": 289500, "epoch": 1723} {"train_loss": -12.109376907348633, "global_step": 289501, "epoch": 1723} {"train_loss": -11.748971939086914, "global_step": 289502, "epoch": 1723} {"train_loss": -11.895435333251953, "global_step": 289503, "epoch": 1723} {"train_loss": -12.213313102722168, "global_step": 289504, "epoch": 1723} {"train_loss": -11.984739303588867, "global_step": 289505, "epoch": 1723} {"train_loss": -11.85488224029541, "global_step": 289506, "epoch": 1723} {"train_loss": -11.365410804748535, "global_step": 289507, "epoch": 1723} {"train_loss": -12.086028099060059, "global_step": 289508, "epoch": 1723} {"train_loss": -11.446067810058594, "global_step": 289509, "epoch": 1723} {"train_loss": -12.097227096557617, "global_step": 289510, "epoch": 1723} {"train_loss": -11.756397247314453, "global_step": 289511, "epoch": 1723} {"train_loss": -12.281783103942871, "global_step": 289512, "epoch": 1723} {"train_loss": -11.560201644897461, "global_step": 289513, "epoch": 1723} {"train_loss": -12.33228874206543, "global_step": 289514, "epoch": 1723} {"train_loss": -11.804433822631836, "global_step": 289515, "epoch": 1723} {"train_loss": -12.230262756347656, "global_step": 289516, "epoch": 1723} {"train_loss": -11.975446701049805, "global_step": 289517, "epoch": 1723} {"train_loss": -11.809015274047852, "global_step": 289518, "epoch": 1723} {"train_loss": -11.632101058959961, "global_step": 289519, "epoch": 1723} {"train_loss": -11.858477592468262, "global_step": 289520, "epoch": 1723} {"train_loss": -11.742110252380371, "global_step": 289521, "epoch": 1723} {"train_loss": -11.312947273254395, "global_step": 289522, "epoch": 1723} {"train_loss": -10.807369232177734, "global_step": 289523, "epoch": 1723} {"train_loss": -11.513166427612305, "global_step": 289524, "epoch": 1723} {"train_loss": -12.069364547729492, "global_step": 289525, "epoch": 1723} {"train_loss": -11.06541919708252, "global_step": 289526, "epoch": 1723} {"train_loss": -11.783763885498047, "global_step": 289527, "epoch": 1723} {"train_loss": -11.706501007080078, "global_step": 289528, "epoch": 1723} {"train_loss": -11.604317665100098, "global_step": 289529, "epoch": 1723} {"train_loss": -10.555801391601562, "global_step": 289530, "epoch": 1723} {"train_loss": -11.096565246582031, "global_step": 289531, "epoch": 1723} {"train_loss": -12.071067810058594, "global_step": 289532, "epoch": 1723} {"train_loss": -10.659107208251953, "global_step": 289533, "epoch": 1723} {"train_loss": -11.251834869384766, "global_step": 289534, "epoch": 1723} {"train_loss": -11.092677116394043, "global_step": 289535, "epoch": 1723} {"train_loss": -8.58895492553711, "global_step": 289536, "epoch": 1723} {"train_loss": -10.945570945739746, "global_step": 289537, "epoch": 1723} {"train_loss": -9.261516571044922, "global_step": 289538, "epoch": 1723} {"train_loss": -9.8887357711792, "global_step": 289539, "epoch": 1723} {"train_loss": -10.770256042480469, "global_step": 289540, "epoch": 1723} {"train_loss": -8.32602310180664, "global_step": 289541, "epoch": 1723} {"train_loss": -10.03471565246582, "global_step": 289542, "epoch": 1723} {"train_loss": -9.927020072937012, "global_step": 289543, "epoch": 1723} {"train_loss": -10.102644920349121, "global_step": 289544, "epoch": 1723} {"train_loss": -10.701225280761719, "global_step": 289545, "epoch": 1723} {"train_loss": -10.923088073730469, "global_step": 289546, "epoch": 1723} {"train_loss": -10.781448364257812, "global_step": 289547, "epoch": 1723} {"train_loss": -10.5966796875, "global_step": 289548, "epoch": 1723} {"train_loss": -10.828203201293945, "global_step": 289549, "epoch": 1723} {"train_loss": -10.65316390991211, "global_step": 289550, "epoch": 1723} {"train_loss": -10.675298690795898, "global_step": 289551, "epoch": 1723} {"train_loss": -11.081268310546875, "global_step": 289552, "epoch": 1723} {"train_loss": -11.290971755981445, "global_step": 289553, "epoch": 1723} {"train_loss": -10.98825454711914, "global_step": 289554, "epoch": 1723} {"train_loss": -11.146448135375977, "global_step": 289555, "epoch": 1723} {"train_loss": -10.952369689941406, "global_step": 289556, "epoch": 1723} {"train_loss": -11.52255630493164, "global_step": 289557, "epoch": 1723} {"train_loss": -11.188665390014648, "global_step": 289558, "epoch": 1723} {"train_loss": -10.912399291992188, "global_step": 289559, "epoch": 1723} {"train_loss": -11.615463256835938, "global_step": 289560, "epoch": 1723} {"train_loss": -11.074803352355957, "global_step": 289561, "epoch": 1723} {"train_loss": -11.4539794921875, "global_step": 289562, "epoch": 1723} {"train_loss": -11.089921951293945, "global_step": 289563, "epoch": 1723} {"train_loss": -11.399563789367676, "global_step": 289564, "epoch": 1723} {"train_loss": -11.017115592956543, "global_step": 289565, "epoch": 1723} {"train_loss": -11.384225845336914, "global_step": 289566, "epoch": 1723} {"train_loss": -11.117362976074219, "global_step": 289567, "epoch": 1723} {"train_loss": -11.247613906860352, "global_step": 289568, "epoch": 1723} {"train_loss": -11.501683235168457, "global_step": 289569, "epoch": 1723} {"train_loss": -11.19111442565918, "global_step": 289570, "epoch": 1723} {"train_loss": -11.499711990356445, "global_step": 289571, "epoch": 1723} {"train_loss": -11.33357048034668, "global_step": 289572, "epoch": 1723} {"train_loss": -11.53880500793457, "global_step": 289573, "epoch": 1723} {"train_loss": -11.452775955200195, "global_step": 289574, "epoch": 1723} {"train_loss": -11.470545768737793, "global_step": 289575, "epoch": 1723} {"train_loss": -11.455992698669434, "global_step": 289576, "epoch": 1723} {"train_loss": -11.819913864135742, "global_step": 289577, "epoch": 1723} {"train_loss": -11.847284317016602, "global_step": 289578, "epoch": 1723} {"train_loss": -11.674251556396484, "global_step": 289579, "epoch": 1723} {"train_loss": -11.857917785644531, "global_step": 289580, "epoch": 1723} {"train_loss": -11.89023494720459, "global_step": 289581, "epoch": 1723} {"train_loss": -11.794821739196777, "global_step": 289582, "epoch": 1723} {"train_loss": -11.830608367919922, "global_step": 289583, "epoch": 1723} {"train_loss": -11.987190246582031, "global_step": 289584, "epoch": 1723} {"train_loss": -12.088144302368164, "global_step": 289585, "epoch": 1723} {"train_loss": -11.92970085144043, "global_step": 289586, "epoch": 1723} {"train_loss": -11.594325065612793, "global_step": 289587, "epoch": 1723} {"train_loss": -11.889657974243164, "global_step": 289588, "epoch": 1723} {"train_loss": -11.860954284667969, "global_step": 289589, "epoch": 1723} {"train_loss": -12.129461288452148, "global_step": 289590, "epoch": 1723} {"train_loss": -11.836301803588867, "global_step": 289591, "epoch": 1723} {"train_loss": -12.108513832092285, "global_step": 289592, "epoch": 1723} {"train_loss": -12.02535343170166, "global_step": 289593, "epoch": 1723} {"train_loss": -12.080421447753906, "global_step": 289594, "epoch": 1723} {"train_loss": -12.084185600280762, "global_step": 289595, "epoch": 1723} {"train_loss": -11.951847076416016, "global_step": 289596, "epoch": 1723} {"train_loss": -11.825162887573242, "global_step": 289597, "epoch": 1723} {"train_loss": -11.894923210144043, "global_step": 289598, "epoch": 1723} {"train_loss": -11.89578628540039, "global_step": 289599, "epoch": 1723} {"train_loss": -11.89896297454834, "global_step": 289600, "epoch": 1723} {"train_loss": -11.958964347839355, "global_step": 289601, "epoch": 1723} {"train_loss": -12.186075210571289, "global_step": 289602, "epoch": 1723} {"train_loss": -12.000495910644531, "global_step": 289603, "epoch": 1723} {"train_loss": -12.188272476196289, "global_step": 289604, "epoch": 1723} {"train_loss": -12.168514251708984, "global_step": 289605, "epoch": 1723} {"train_loss": -12.24704360961914, "global_step": 289606, "epoch": 1723} {"train_loss": -12.210248947143555, "global_step": 289607, "epoch": 1723} {"train_loss": -12.300420761108398, "global_step": 289608, "epoch": 1723} {"train_loss": -12.1882963180542, "global_step": 289609, "epoch": 1723} {"train_loss": -12.261601448059082, "global_step": 289610, "epoch": 1723} {"train_loss": -12.345224380493164, "global_step": 289611, "epoch": 1723} {"train_loss": -12.142355918884277, "global_step": 289612, "epoch": 1723} {"train_loss": -12.29959487915039, "global_step": 289613, "epoch": 1723} {"train_loss": -12.278022766113281, "global_step": 289614, "epoch": 1723} {"train_loss": -12.360275268554688, "global_step": 289615, "epoch": 1723} {"train_loss": -12.15194320678711, "global_step": 289616, "epoch": 1723} {"train_loss": -12.47703742980957, "global_step": 289617, "epoch": 1723} {"train_loss": -12.500056266784668, "global_step": 289618, "epoch": 1723} {"train_loss": -12.432211875915527, "global_step": 289619, "epoch": 1723} {"train_loss": -12.500092506408691, "global_step": 289620, "epoch": 1723} {"train_loss": -12.461446762084961, "global_step": 289621, "epoch": 1723} {"train_loss": -12.366731643676758, "global_step": 289622, "epoch": 1723} {"train_loss": -12.448322296142578, "global_step": 289623, "epoch": 1723} {"train_loss": -12.359103202819824, "global_step": 289624, "epoch": 1723} {"train_loss": -12.467316627502441, "global_step": 289625, "epoch": 1723} {"train_loss": -12.419112205505371, "global_step": 289626, "epoch": 1723} {"train_loss": -12.355783462524414, "global_step": 289627, "epoch": 1723} {"train_loss": -12.503388404846191, "global_step": 289628, "epoch": 1723} {"train_loss": -12.424440383911133, "global_step": 289629, "epoch": 1723} {"train_loss": -12.294302940368652, "global_step": 289630, "epoch": 1723} {"train_loss": -11.678685846782866, "global_step": 289631, "epoch": 1723, "val_loss": 278594.90625} {"train_loss": -12.437718391418457, "global_step": 289632, "epoch": 1724} {"train_loss": -12.166566848754883, "global_step": 289633, "epoch": 1724} {"train_loss": -12.46360969543457, "global_step": 289634, "epoch": 1724} {"train_loss": -12.449833869934082, "global_step": 289635, "epoch": 1724} {"train_loss": -12.292972564697266, "global_step": 289636, "epoch": 1724} {"train_loss": -11.784025192260742, "global_step": 289637, "epoch": 1724} {"train_loss": -12.400168418884277, "global_step": 289638, "epoch": 1724} {"train_loss": -12.393512725830078, "global_step": 289639, "epoch": 1724} {"train_loss": -12.282920837402344, "global_step": 289640, "epoch": 1724} {"train_loss": -12.451616287231445, "global_step": 289641, "epoch": 1724} {"train_loss": -12.37506103515625, "global_step": 289642, "epoch": 1724} {"train_loss": -12.440074920654297, "global_step": 289643, "epoch": 1724} {"train_loss": -12.277837753295898, "global_step": 289644, "epoch": 1724} {"train_loss": -12.233634948730469, "global_step": 289645, "epoch": 1724} {"train_loss": -12.260993957519531, "global_step": 289646, "epoch": 1724} {"train_loss": -12.607710838317871, "global_step": 289647, "epoch": 1724} {"train_loss": -12.331342697143555, "global_step": 289648, "epoch": 1724} {"train_loss": -12.564189910888672, "global_step": 289649, "epoch": 1724} {"train_loss": -12.332170486450195, "global_step": 289650, "epoch": 1724} {"train_loss": -12.259220123291016, "global_step": 289651, "epoch": 1724} {"train_loss": -12.353414535522461, "global_step": 289652, "epoch": 1724} {"train_loss": -12.593029022216797, "global_step": 289653, "epoch": 1724} {"train_loss": -12.164021492004395, "global_step": 289654, "epoch": 1724} {"train_loss": -11.506484985351562, "global_step": 289655, "epoch": 1724} {"train_loss": -11.097716331481934, "global_step": 289656, "epoch": 1724} {"train_loss": -12.24608039855957, "global_step": 289657, "epoch": 1724} {"train_loss": -12.268962860107422, "global_step": 289658, "epoch": 1724} {"train_loss": -12.30469799041748, "global_step": 289659, "epoch": 1724} {"train_loss": -11.815671920776367, "global_step": 289660, "epoch": 1724} {"train_loss": -11.990262031555176, "global_step": 289661, "epoch": 1724} {"train_loss": -11.60651969909668, "global_step": 289662, "epoch": 1724} {"train_loss": -12.004631042480469, "global_step": 289663, "epoch": 1724} {"train_loss": -12.008255958557129, "global_step": 289664, "epoch": 1724} {"train_loss": -11.571051597595215, "global_step": 289665, "epoch": 1724} {"train_loss": -10.353662490844727, "global_step": 289666, "epoch": 1724} {"train_loss": -12.245943069458008, "global_step": 289667, "epoch": 1724} {"train_loss": -10.065481185913086, "global_step": 289668, "epoch": 1724} {"train_loss": -10.745953559875488, "global_step": 289669, "epoch": 1724} {"train_loss": -10.62395191192627, "global_step": 289670, "epoch": 1724} {"train_loss": -9.421903610229492, "global_step": 289671, "epoch": 1724} {"train_loss": -9.326945304870605, "global_step": 289672, "epoch": 1724} {"train_loss": -11.44978141784668, "global_step": 289673, "epoch": 1724} {"train_loss": -8.626730918884277, "global_step": 289674, "epoch": 1724} {"train_loss": -11.853739738464355, "global_step": 289675, "epoch": 1724} {"train_loss": -11.187226295471191, "global_step": 289676, "epoch": 1724} {"train_loss": -9.927423477172852, "global_step": 289677, "epoch": 1724} {"train_loss": -11.644575119018555, "global_step": 289678, "epoch": 1724} {"train_loss": -9.509981155395508, "global_step": 289679, "epoch": 1724} {"train_loss": -11.228652954101562, "global_step": 289680, "epoch": 1724} {"train_loss": -9.130703926086426, "global_step": 289681, "epoch": 1724} {"train_loss": -10.737825393676758, "global_step": 289682, "epoch": 1724} {"train_loss": -11.02261734008789, "global_step": 289683, "epoch": 1724} {"train_loss": -9.6182279586792, "global_step": 289684, "epoch": 1724} {"train_loss": -9.278373718261719, "global_step": 289685, "epoch": 1724} {"train_loss": -8.83049201965332, "global_step": 289686, "epoch": 1724} {"train_loss": -9.484407424926758, "global_step": 289687, "epoch": 1724} {"train_loss": -10.76342487335205, "global_step": 289688, "epoch": 1724} {"train_loss": -10.120098114013672, "global_step": 289689, "epoch": 1724} {"train_loss": -9.27886962890625, "global_step": 289690, "epoch": 1724} {"train_loss": -9.416406631469727, "global_step": 289691, "epoch": 1724} {"train_loss": -10.08320140838623, "global_step": 289692, "epoch": 1724} {"train_loss": -10.87215805053711, "global_step": 289693, "epoch": 1724} {"train_loss": -9.25673770904541, "global_step": 289694, "epoch": 1724} {"train_loss": -10.779546737670898, "global_step": 289695, "epoch": 1724} {"train_loss": -10.519035339355469, "global_step": 289696, "epoch": 1724} {"train_loss": -10.450183868408203, "global_step": 289697, "epoch": 1724} {"train_loss": -11.479639053344727, "global_step": 289698, "epoch": 1724} {"train_loss": -10.997025489807129, "global_step": 289699, "epoch": 1724} {"train_loss": -11.18044376373291, "global_step": 289700, "epoch": 1724} {"train_loss": -11.530301094055176, "global_step": 289701, "epoch": 1724} {"train_loss": -10.673592567443848, "global_step": 289702, "epoch": 1724} {"train_loss": -11.264915466308594, "global_step": 289703, "epoch": 1724} {"train_loss": -11.66385555267334, "global_step": 289704, "epoch": 1724} {"train_loss": -11.40289306640625, "global_step": 289705, "epoch": 1724} {"train_loss": -11.86397647857666, "global_step": 289706, "epoch": 1724} {"train_loss": -11.287018775939941, "global_step": 289707, "epoch": 1724} {"train_loss": -11.308292388916016, "global_step": 289708, "epoch": 1724} {"train_loss": -11.544670104980469, "global_step": 289709, "epoch": 1724} {"train_loss": -11.454292297363281, "global_step": 289710, "epoch": 1724} {"train_loss": -11.614035606384277, "global_step": 289711, "epoch": 1724} {"train_loss": -11.865488052368164, "global_step": 289712, "epoch": 1724} {"train_loss": -11.484384536743164, "global_step": 289713, "epoch": 1724} {"train_loss": -11.62529182434082, "global_step": 289714, "epoch": 1724} {"train_loss": -11.595840454101562, "global_step": 289715, "epoch": 1724} {"train_loss": -11.446660995483398, "global_step": 289716, "epoch": 1724} {"train_loss": -11.471512794494629, "global_step": 289717, "epoch": 1724} {"train_loss": -11.59288215637207, "global_step": 289718, "epoch": 1724} {"train_loss": -11.592422485351562, "global_step": 289719, "epoch": 1724} {"train_loss": -11.826278686523438, "global_step": 289720, "epoch": 1724} {"train_loss": -11.665092468261719, "global_step": 289721, "epoch": 1724} {"train_loss": -12.051151275634766, "global_step": 289722, "epoch": 1724} {"train_loss": -11.393587112426758, "global_step": 289723, "epoch": 1724} {"train_loss": -11.583358764648438, "global_step": 289724, "epoch": 1724} {"train_loss": -11.907466888427734, "global_step": 289725, "epoch": 1724} {"train_loss": -11.690665245056152, "global_step": 289726, "epoch": 1724} {"train_loss": -11.91835880279541, "global_step": 289727, "epoch": 1724} {"train_loss": -11.71603012084961, "global_step": 289728, "epoch": 1724} {"train_loss": -11.847397804260254, "global_step": 289729, "epoch": 1724} {"train_loss": -11.920373916625977, "global_step": 289730, "epoch": 1724} {"train_loss": -11.661928176879883, "global_step": 289731, "epoch": 1724} {"train_loss": -11.89692497253418, "global_step": 289732, "epoch": 1724} {"train_loss": -11.749581336975098, "global_step": 289733, "epoch": 1724} {"train_loss": -11.808307647705078, "global_step": 289734, "epoch": 1724} {"train_loss": -12.042560577392578, "global_step": 289735, "epoch": 1724} {"train_loss": -11.468881607055664, "global_step": 289736, "epoch": 1724} {"train_loss": -11.97185230255127, "global_step": 289737, "epoch": 1724} {"train_loss": -11.787803649902344, "global_step": 289738, "epoch": 1724} {"train_loss": -11.877418518066406, "global_step": 289739, "epoch": 1724} {"train_loss": -12.038532257080078, "global_step": 289740, "epoch": 1724} {"train_loss": -11.857026100158691, "global_step": 289741, "epoch": 1724} {"train_loss": -11.926530838012695, "global_step": 289742, "epoch": 1724} {"train_loss": -11.961614608764648, "global_step": 289743, "epoch": 1724} {"train_loss": -12.2596435546875, "global_step": 289744, "epoch": 1724} {"train_loss": -11.826506614685059, "global_step": 289745, "epoch": 1724} {"train_loss": -12.078550338745117, "global_step": 289746, "epoch": 1724} {"train_loss": -11.87195873260498, "global_step": 289747, "epoch": 1724} {"train_loss": -12.14669132232666, "global_step": 289748, "epoch": 1724} {"train_loss": -12.126953125, "global_step": 289749, "epoch": 1724} {"train_loss": -12.03015422821045, "global_step": 289750, "epoch": 1724} {"train_loss": -12.229183197021484, "global_step": 289751, "epoch": 1724} {"train_loss": -12.189199447631836, "global_step": 289752, "epoch": 1724} {"train_loss": -12.237205505371094, "global_step": 289753, "epoch": 1724} {"train_loss": -12.081781387329102, "global_step": 289754, "epoch": 1724} {"train_loss": -12.25864315032959, "global_step": 289755, "epoch": 1724} {"train_loss": -12.145223617553711, "global_step": 289756, "epoch": 1724} {"train_loss": -12.144939422607422, "global_step": 289757, "epoch": 1724} {"train_loss": -12.001200675964355, "global_step": 289758, "epoch": 1724} {"train_loss": -12.225193977355957, "global_step": 289759, "epoch": 1724} {"train_loss": -11.996700286865234, "global_step": 289760, "epoch": 1724} {"train_loss": -12.133539199829102, "global_step": 289761, "epoch": 1724} {"train_loss": -11.863851547241211, "global_step": 289762, "epoch": 1724} {"train_loss": -12.361199378967285, "global_step": 289763, "epoch": 1724} {"train_loss": -12.174962997436523, "global_step": 289764, "epoch": 1724} {"train_loss": -12.165191650390625, "global_step": 289765, "epoch": 1724} {"train_loss": -12.072601318359375, "global_step": 289766, "epoch": 1724} {"train_loss": -12.34833812713623, "global_step": 289767, "epoch": 1724} {"train_loss": -11.917405128479004, "global_step": 289768, "epoch": 1724} {"train_loss": -12.211708068847656, "global_step": 289769, "epoch": 1724} {"train_loss": -12.19806957244873, "global_step": 289770, "epoch": 1724} {"train_loss": -12.208771705627441, "global_step": 289771, "epoch": 1724} {"train_loss": -12.11623764038086, "global_step": 289772, "epoch": 1724} {"train_loss": -12.266439437866211, "global_step": 289773, "epoch": 1724} {"train_loss": -12.396718978881836, "global_step": 289774, "epoch": 1724} {"train_loss": -12.148271560668945, "global_step": 289775, "epoch": 1724} {"train_loss": -12.372231483459473, "global_step": 289776, "epoch": 1724} {"train_loss": -12.089609146118164, "global_step": 289777, "epoch": 1724} {"train_loss": -12.401742935180664, "global_step": 289778, "epoch": 1724} {"train_loss": -12.301560401916504, "global_step": 289779, "epoch": 1724} {"train_loss": -12.328784942626953, "global_step": 289780, "epoch": 1724} {"train_loss": -12.511585235595703, "global_step": 289781, "epoch": 1724} {"train_loss": -12.267847061157227, "global_step": 289782, "epoch": 1724} {"train_loss": -12.450183868408203, "global_step": 289783, "epoch": 1724} {"train_loss": -12.370990753173828, "global_step": 289784, "epoch": 1724} {"train_loss": -12.381695747375488, "global_step": 289785, "epoch": 1724} {"train_loss": -12.47569465637207, "global_step": 289786, "epoch": 1724} {"train_loss": -12.264152526855469, "global_step": 289787, "epoch": 1724} {"train_loss": -12.39828872680664, "global_step": 289788, "epoch": 1724} {"train_loss": -12.474390029907227, "global_step": 289789, "epoch": 1724} {"train_loss": -12.338752746582031, "global_step": 289790, "epoch": 1724} {"train_loss": -12.547107696533203, "global_step": 289791, "epoch": 1724} {"train_loss": -12.358304977416992, "global_step": 289792, "epoch": 1724} {"train_loss": -12.430950164794922, "global_step": 289793, "epoch": 1724} {"train_loss": -12.317132949829102, "global_step": 289794, "epoch": 1724} {"train_loss": -12.095653533935547, "global_step": 289795, "epoch": 1724} {"train_loss": -12.465177536010742, "global_step": 289796, "epoch": 1724} {"train_loss": -12.032588005065918, "global_step": 289797, "epoch": 1724} {"train_loss": -11.028791427612305, "global_step": 289798, "epoch": 1724} {"train_loss": -11.670053975922722, "global_step": 289799, "epoch": 1724, "val_loss": 279135.40625} {"train_loss": -11.717903137207031, "global_step": 289800, "epoch": 1725} {"train_loss": -11.972944259643555, "global_step": 289801, "epoch": 1725} {"train_loss": -11.649321556091309, "global_step": 289802, "epoch": 1725} {"train_loss": -11.772971153259277, "global_step": 289803, "epoch": 1725} {"train_loss": -12.039127349853516, "global_step": 289804, "epoch": 1725} {"train_loss": -10.94830322265625, "global_step": 289805, "epoch": 1725} {"train_loss": -12.053523063659668, "global_step": 289806, "epoch": 1725} {"train_loss": -11.335039138793945, "global_step": 289807, "epoch": 1725} {"train_loss": -11.707388877868652, "global_step": 289808, "epoch": 1725} {"train_loss": -11.132817268371582, "global_step": 289809, "epoch": 1725} {"train_loss": -12.011977195739746, "global_step": 289810, "epoch": 1725} {"train_loss": -11.73405647277832, "global_step": 289811, "epoch": 1725} {"train_loss": -12.24321460723877, "global_step": 289812, "epoch": 1725} {"train_loss": -11.866180419921875, "global_step": 289813, "epoch": 1725} {"train_loss": -12.21542739868164, "global_step": 289814, "epoch": 1725} {"train_loss": -11.764524459838867, "global_step": 289815, "epoch": 1725} {"train_loss": -11.996456146240234, "global_step": 289816, "epoch": 1725} {"train_loss": -11.618057250976562, "global_step": 289817, "epoch": 1725} {"train_loss": -11.83035659790039, "global_step": 289818, "epoch": 1725} {"train_loss": -11.803447723388672, "global_step": 289819, "epoch": 1725} {"train_loss": -12.341766357421875, "global_step": 289820, "epoch": 1725} {"train_loss": -11.801422119140625, "global_step": 289821, "epoch": 1725} {"train_loss": -12.18816089630127, "global_step": 289822, "epoch": 1725} {"train_loss": -11.74795913696289, "global_step": 289823, "epoch": 1725} {"train_loss": -12.120504379272461, "global_step": 289824, "epoch": 1725} {"train_loss": -11.601202964782715, "global_step": 289825, "epoch": 1725} {"train_loss": -11.727893829345703, "global_step": 289826, "epoch": 1725} {"train_loss": -12.122117042541504, "global_step": 289827, "epoch": 1725} {"train_loss": -11.764608383178711, "global_step": 289828, "epoch": 1725} {"train_loss": -11.067588806152344, "global_step": 289829, "epoch": 1725} {"train_loss": -11.227437973022461, "global_step": 289830, "epoch": 1725} {"train_loss": -11.869190216064453, "global_step": 289831, "epoch": 1725} {"train_loss": -11.274408340454102, "global_step": 289832, "epoch": 1725} {"train_loss": -9.769198417663574, "global_step": 289833, "epoch": 1725} {"train_loss": -11.721809387207031, "global_step": 289834, "epoch": 1725} {"train_loss": -10.957533836364746, "global_step": 289835, "epoch": 1725} {"train_loss": -7.4339399337768555, "global_step": 289836, "epoch": 1725} {"train_loss": -10.682753562927246, "global_step": 289837, "epoch": 1725} {"train_loss": -10.016950607299805, "global_step": 289838, "epoch": 1725} {"train_loss": -9.18516731262207, "global_step": 289839, "epoch": 1725} {"train_loss": -9.5617094039917, "global_step": 289840, "epoch": 1725} {"train_loss": -10.135138511657715, "global_step": 289841, "epoch": 1725} {"train_loss": -10.339374542236328, "global_step": 289842, "epoch": 1725} {"train_loss": -9.508639335632324, "global_step": 289843, "epoch": 1725} {"train_loss": -8.227422714233398, "global_step": 289844, "epoch": 1725} {"train_loss": -10.318449020385742, "global_step": 289845, "epoch": 1725} {"train_loss": -10.643411636352539, "global_step": 289846, "epoch": 1725} {"train_loss": -9.488651275634766, "global_step": 289847, "epoch": 1725} {"train_loss": -10.779436111450195, "global_step": 289848, "epoch": 1725} {"train_loss": -11.431071281433105, "global_step": 289849, "epoch": 1725} {"train_loss": -9.998565673828125, "global_step": 289850, "epoch": 1725} {"train_loss": -11.01487922668457, "global_step": 289851, "epoch": 1725} {"train_loss": -9.781806945800781, "global_step": 289852, "epoch": 1725} {"train_loss": -10.163619995117188, "global_step": 289853, "epoch": 1725} {"train_loss": -10.467263221740723, "global_step": 289854, "epoch": 1725} {"train_loss": -9.889924049377441, "global_step": 289855, "epoch": 1725} {"train_loss": -10.5086088180542, "global_step": 289856, "epoch": 1725} {"train_loss": -11.23883056640625, "global_step": 289857, "epoch": 1725} {"train_loss": -10.13973331451416, "global_step": 289858, "epoch": 1725} {"train_loss": -11.082979202270508, "global_step": 289859, "epoch": 1725} {"train_loss": -11.17564868927002, "global_step": 289860, "epoch": 1725} {"train_loss": -10.786601066589355, "global_step": 289861, "epoch": 1725} {"train_loss": -11.116701126098633, "global_step": 289862, "epoch": 1725} {"train_loss": -11.08588981628418, "global_step": 289863, "epoch": 1725} {"train_loss": -10.906915664672852, "global_step": 289864, "epoch": 1725} {"train_loss": -11.16830825805664, "global_step": 289865, "epoch": 1725} {"train_loss": -11.101179122924805, "global_step": 289866, "epoch": 1725} {"train_loss": -11.617386817932129, "global_step": 289867, "epoch": 1725} {"train_loss": -11.213142395019531, "global_step": 289868, "epoch": 1725} {"train_loss": -11.36021900177002, "global_step": 289869, "epoch": 1725} {"train_loss": -11.371007919311523, "global_step": 289870, "epoch": 1725} {"train_loss": -11.368537902832031, "global_step": 289871, "epoch": 1725} {"train_loss": -11.307123184204102, "global_step": 289872, "epoch": 1725} {"train_loss": -11.389015197753906, "global_step": 289873, "epoch": 1725} {"train_loss": -11.11894702911377, "global_step": 289874, "epoch": 1725} {"train_loss": -11.318916320800781, "global_step": 289875, "epoch": 1725} {"train_loss": -11.668318748474121, "global_step": 289876, "epoch": 1725} {"train_loss": -11.237789154052734, "global_step": 289877, "epoch": 1725} {"train_loss": -11.74963665008545, "global_step": 289878, "epoch": 1725} {"train_loss": -11.446502685546875, "global_step": 289879, "epoch": 1725} {"train_loss": -11.653362274169922, "global_step": 289880, "epoch": 1725} {"train_loss": -11.48471450805664, "global_step": 289881, "epoch": 1725} {"train_loss": -11.515106201171875, "global_step": 289882, "epoch": 1725} {"train_loss": -11.569910049438477, "global_step": 289883, "epoch": 1725} {"train_loss": -11.401630401611328, "global_step": 289884, "epoch": 1725} {"train_loss": -11.464322090148926, "global_step": 289885, "epoch": 1725} {"train_loss": -11.84660530090332, "global_step": 289886, "epoch": 1725} {"train_loss": -11.832176208496094, "global_step": 289887, "epoch": 1725} {"train_loss": -11.799578666687012, "global_step": 289888, "epoch": 1725} {"train_loss": -11.825383186340332, "global_step": 289889, "epoch": 1725} {"train_loss": -11.721590042114258, "global_step": 289890, "epoch": 1725} {"train_loss": -11.683037757873535, "global_step": 289891, "epoch": 1725} {"train_loss": -11.927995681762695, "global_step": 289892, "epoch": 1725} {"train_loss": -11.723766326904297, "global_step": 289893, "epoch": 1725} {"train_loss": -11.806401252746582, "global_step": 289894, "epoch": 1725} {"train_loss": -11.875349044799805, "global_step": 289895, "epoch": 1725} {"train_loss": -11.414907455444336, "global_step": 289896, "epoch": 1725} {"train_loss": -11.881746292114258, "global_step": 289897, "epoch": 1725} {"train_loss": -11.759054183959961, "global_step": 289898, "epoch": 1725} {"train_loss": -11.888790130615234, "global_step": 289899, "epoch": 1725} {"train_loss": -11.947482109069824, "global_step": 289900, "epoch": 1725} {"train_loss": -11.775127410888672, "global_step": 289901, "epoch": 1725} {"train_loss": -11.856094360351562, "global_step": 289902, "epoch": 1725} {"train_loss": -11.942360877990723, "global_step": 289903, "epoch": 1725} {"train_loss": -12.106550216674805, "global_step": 289904, "epoch": 1725} {"train_loss": -11.893309593200684, "global_step": 289905, "epoch": 1725} {"train_loss": -11.989681243896484, "global_step": 289906, "epoch": 1725} {"train_loss": -12.126243591308594, "global_step": 289907, "epoch": 1725} {"train_loss": -12.004373550415039, "global_step": 289908, "epoch": 1725} {"train_loss": -11.95262336730957, "global_step": 289909, "epoch": 1725} {"train_loss": -12.251163482666016, "global_step": 289910, "epoch": 1725} {"train_loss": -11.940235137939453, "global_step": 289911, "epoch": 1725} {"train_loss": -12.005355834960938, "global_step": 289912, "epoch": 1725} {"train_loss": -11.952886581420898, "global_step": 289913, "epoch": 1725} {"train_loss": -12.254816055297852, "global_step": 289914, "epoch": 1725} {"train_loss": -11.924068450927734, "global_step": 289915, "epoch": 1725} {"train_loss": -11.994012832641602, "global_step": 289916, "epoch": 1725} {"train_loss": -12.115752220153809, "global_step": 289917, "epoch": 1725} {"train_loss": -11.984455108642578, "global_step": 289918, "epoch": 1725} {"train_loss": -12.176517486572266, "global_step": 289919, "epoch": 1725} {"train_loss": -12.13981819152832, "global_step": 289920, "epoch": 1725} {"train_loss": -11.873210906982422, "global_step": 289921, "epoch": 1725} {"train_loss": -12.100014686584473, "global_step": 289922, "epoch": 1725} {"train_loss": -11.858065605163574, "global_step": 289923, "epoch": 1725} {"train_loss": -12.040656089782715, "global_step": 289924, "epoch": 1725} {"train_loss": -11.840353012084961, "global_step": 289925, "epoch": 1725} {"train_loss": -12.200188636779785, "global_step": 289926, "epoch": 1725} {"train_loss": -11.773274421691895, "global_step": 289927, "epoch": 1725} {"train_loss": -11.847280502319336, "global_step": 289928, "epoch": 1725} {"train_loss": -12.082344055175781, "global_step": 289929, "epoch": 1725} {"train_loss": -12.030466079711914, "global_step": 289930, "epoch": 1725} {"train_loss": -12.016602516174316, "global_step": 289931, "epoch": 1725} {"train_loss": -12.197518348693848, "global_step": 289932, "epoch": 1725} {"train_loss": -11.828304290771484, "global_step": 289933, "epoch": 1725} {"train_loss": -12.02972412109375, "global_step": 289934, "epoch": 1725} {"train_loss": -11.919235229492188, "global_step": 289935, "epoch": 1725} {"train_loss": -11.783084869384766, "global_step": 289936, "epoch": 1725} {"train_loss": -11.953695297241211, "global_step": 289937, "epoch": 1725} {"train_loss": -11.935802459716797, "global_step": 289938, "epoch": 1725} {"train_loss": -12.109271049499512, "global_step": 289939, "epoch": 1725} {"train_loss": -11.890664100646973, "global_step": 289940, "epoch": 1725} {"train_loss": -12.05166244506836, "global_step": 289941, "epoch": 1725} {"train_loss": -12.179388046264648, "global_step": 289942, "epoch": 1725} {"train_loss": -11.827520370483398, "global_step": 289943, "epoch": 1725} {"train_loss": -12.003484725952148, "global_step": 289944, "epoch": 1725} {"train_loss": -12.189064025878906, "global_step": 289945, "epoch": 1725} {"train_loss": -12.151100158691406, "global_step": 289946, "epoch": 1725} {"train_loss": -11.971881866455078, "global_step": 289947, "epoch": 1725} {"train_loss": -11.632537841796875, "global_step": 289948, "epoch": 1725} {"train_loss": -11.912703514099121, "global_step": 289949, "epoch": 1725} {"train_loss": -12.097051620483398, "global_step": 289950, "epoch": 1725} {"train_loss": -11.855220794677734, "global_step": 289951, "epoch": 1725} {"train_loss": -12.144075393676758, "global_step": 289952, "epoch": 1725} {"train_loss": -12.264474868774414, "global_step": 289953, "epoch": 1725} {"train_loss": -11.835680961608887, "global_step": 289954, "epoch": 1725} {"train_loss": -12.227800369262695, "global_step": 289955, "epoch": 1725} {"train_loss": -12.353902816772461, "global_step": 289956, "epoch": 1725} {"train_loss": -12.240826606750488, "global_step": 289957, "epoch": 1725} {"train_loss": -12.00575065612793, "global_step": 289958, "epoch": 1725} {"train_loss": -11.992256164550781, "global_step": 289959, "epoch": 1725} {"train_loss": -12.150676727294922, "global_step": 289960, "epoch": 1725} {"train_loss": -12.188620567321777, "global_step": 289961, "epoch": 1725} {"train_loss": -12.265174865722656, "global_step": 289962, "epoch": 1725} {"train_loss": -11.999879837036133, "global_step": 289963, "epoch": 1725} {"train_loss": -12.230746269226074, "global_step": 289964, "epoch": 1725} {"train_loss": -12.111666679382324, "global_step": 289965, "epoch": 1725} {"train_loss": -12.02621841430664, "global_step": 289966, "epoch": 1725} {"train_loss": -11.546980205036345, "global_step": 289967, "epoch": 1725, "val_loss": 274679.1875, "train_action_mse_error": 3.297973155975342} {"train_loss": -11.97822380065918, "global_step": 289968, "epoch": 1726} {"train_loss": -12.083158493041992, "global_step": 289969, "epoch": 1726} {"train_loss": -11.994122505187988, "global_step": 289970, "epoch": 1726} {"train_loss": -11.539121627807617, "global_step": 289971, "epoch": 1726} {"train_loss": -11.774911880493164, "global_step": 289972, "epoch": 1726} {"train_loss": -12.014241218566895, "global_step": 289973, "epoch": 1726} {"train_loss": -12.21963119506836, "global_step": 289974, "epoch": 1726} {"train_loss": -11.755505561828613, "global_step": 289975, "epoch": 1726} {"train_loss": -12.056831359863281, "global_step": 289976, "epoch": 1726} {"train_loss": -12.276561737060547, "global_step": 289977, "epoch": 1726} {"train_loss": -11.956010818481445, "global_step": 289978, "epoch": 1726} {"train_loss": -11.951236724853516, "global_step": 289979, "epoch": 1726} {"train_loss": -11.838595390319824, "global_step": 289980, "epoch": 1726} {"train_loss": -11.597368240356445, "global_step": 289981, "epoch": 1726} {"train_loss": -12.32009506225586, "global_step": 289982, "epoch": 1726} {"train_loss": -11.269405364990234, "global_step": 289983, "epoch": 1726} {"train_loss": -12.221833229064941, "global_step": 289984, "epoch": 1726} {"train_loss": -11.632525444030762, "global_step": 289985, "epoch": 1726} {"train_loss": -11.914485931396484, "global_step": 289986, "epoch": 1726} {"train_loss": -11.834617614746094, "global_step": 289987, "epoch": 1726} {"train_loss": -11.973993301391602, "global_step": 289988, "epoch": 1726} {"train_loss": -11.764700889587402, "global_step": 289989, "epoch": 1726} {"train_loss": -12.219612121582031, "global_step": 289990, "epoch": 1726} {"train_loss": -11.976961135864258, "global_step": 289991, "epoch": 1726} {"train_loss": -12.11508560180664, "global_step": 289992, "epoch": 1726} {"train_loss": -11.669569969177246, "global_step": 289993, "epoch": 1726} {"train_loss": -12.133306503295898, "global_step": 289994, "epoch": 1726} {"train_loss": -12.133411407470703, "global_step": 289995, "epoch": 1726} {"train_loss": -12.280298233032227, "global_step": 289996, "epoch": 1726} {"train_loss": -12.045785903930664, "global_step": 289997, "epoch": 1726} {"train_loss": -12.010229110717773, "global_step": 289998, "epoch": 1726} {"train_loss": -12.274089813232422, "global_step": 289999, "epoch": 1726} {"train_loss": -12.331792831420898, "global_step": 290000, "epoch": 1726} {"train_loss": -11.741554260253906, "global_step": 290001, "epoch": 1726} {"train_loss": -11.912256240844727, "global_step": 290002, "epoch": 1726} {"train_loss": -12.214983940124512, "global_step": 290003, "epoch": 1726} {"train_loss": -12.436235427856445, "global_step": 290004, "epoch": 1726} {"train_loss": -12.013882637023926, "global_step": 290005, "epoch": 1726} {"train_loss": -11.824751853942871, "global_step": 290006, "epoch": 1726} {"train_loss": -11.614426612854004, "global_step": 290007, "epoch": 1726} {"train_loss": -12.201387405395508, "global_step": 290008, "epoch": 1726} {"train_loss": -11.021270751953125, "global_step": 290009, "epoch": 1726} {"train_loss": -11.946060180664062, "global_step": 290010, "epoch": 1726} {"train_loss": -11.568035125732422, "global_step": 290011, "epoch": 1726} {"train_loss": -11.709977149963379, "global_step": 290012, "epoch": 1726} {"train_loss": -10.520591735839844, "global_step": 290013, "epoch": 1726} {"train_loss": -10.606130599975586, "global_step": 290014, "epoch": 1726} {"train_loss": -10.756969451904297, "global_step": 290015, "epoch": 1726} {"train_loss": -10.090534210205078, "global_step": 290016, "epoch": 1726} {"train_loss": -8.744542121887207, "global_step": 290017, "epoch": 1726} {"train_loss": -9.672075271606445, "global_step": 290018, "epoch": 1726} {"train_loss": -8.546022415161133, "global_step": 290019, "epoch": 1726} {"train_loss": -7.159151554107666, "global_step": 290020, "epoch": 1726} {"train_loss": -8.182527542114258, "global_step": 290021, "epoch": 1726} {"train_loss": -8.982553482055664, "global_step": 290022, "epoch": 1726} {"train_loss": -8.263031005859375, "global_step": 290023, "epoch": 1726} {"train_loss": -7.820363998413086, "global_step": 290024, "epoch": 1726} {"train_loss": -7.64743709564209, "global_step": 290025, "epoch": 1726} {"train_loss": -7.407303810119629, "global_step": 290026, "epoch": 1726} {"train_loss": -9.235678672790527, "global_step": 290027, "epoch": 1726} {"train_loss": -9.317750930786133, "global_step": 290028, "epoch": 1726} {"train_loss": -9.610067367553711, "global_step": 290029, "epoch": 1726} {"train_loss": -9.28408432006836, "global_step": 290030, "epoch": 1726} {"train_loss": -8.8501615524292, "global_step": 290031, "epoch": 1726} {"train_loss": -9.23741340637207, "global_step": 290032, "epoch": 1726} {"train_loss": -10.406482696533203, "global_step": 290033, "epoch": 1726} {"train_loss": -10.60629653930664, "global_step": 290034, "epoch": 1726} {"train_loss": -10.302574157714844, "global_step": 290035, "epoch": 1726} {"train_loss": -10.201922416687012, "global_step": 290036, "epoch": 1726} {"train_loss": -10.638145446777344, "global_step": 290037, "epoch": 1726} {"train_loss": -10.579216003417969, "global_step": 290038, "epoch": 1726} {"train_loss": -11.133676528930664, "global_step": 290039, "epoch": 1726} {"train_loss": -10.504759788513184, "global_step": 290040, "epoch": 1726} {"train_loss": -11.123153686523438, "global_step": 290041, "epoch": 1726} {"train_loss": -10.956539154052734, "global_step": 290042, "epoch": 1726} {"train_loss": -10.992008209228516, "global_step": 290043, "epoch": 1726} {"train_loss": -11.275214195251465, "global_step": 290044, "epoch": 1726} {"train_loss": -11.335334777832031, "global_step": 290045, "epoch": 1726} {"train_loss": -11.378480911254883, "global_step": 290046, "epoch": 1726} {"train_loss": -11.454627990722656, "global_step": 290047, "epoch": 1726} {"train_loss": -11.425575256347656, "global_step": 290048, "epoch": 1726} {"train_loss": -11.74411392211914, "global_step": 290049, "epoch": 1726} {"train_loss": -11.363079071044922, "global_step": 290050, "epoch": 1726} {"train_loss": -11.494203567504883, "global_step": 290051, "epoch": 1726} {"train_loss": -11.495680809020996, "global_step": 290052, "epoch": 1726} {"train_loss": -11.611125946044922, "global_step": 290053, "epoch": 1726} {"train_loss": -11.377809524536133, "global_step": 290054, "epoch": 1726} {"train_loss": -11.659788131713867, "global_step": 290055, "epoch": 1726} {"train_loss": -11.549124717712402, "global_step": 290056, "epoch": 1726} {"train_loss": -11.652334213256836, "global_step": 290057, "epoch": 1726} {"train_loss": -11.728395462036133, "global_step": 290058, "epoch": 1726} {"train_loss": -11.76823616027832, "global_step": 290059, "epoch": 1726} {"train_loss": -11.720229148864746, "global_step": 290060, "epoch": 1726} {"train_loss": -11.862337112426758, "global_step": 290061, "epoch": 1726} {"train_loss": -11.627836227416992, "global_step": 290062, "epoch": 1726} {"train_loss": -11.771034240722656, "global_step": 290063, "epoch": 1726} {"train_loss": -11.769050598144531, "global_step": 290064, "epoch": 1726} {"train_loss": -11.738746643066406, "global_step": 290065, "epoch": 1726} {"train_loss": -11.861990928649902, "global_step": 290066, "epoch": 1726} {"train_loss": -11.913444519042969, "global_step": 290067, "epoch": 1726} {"train_loss": -11.902233123779297, "global_step": 290068, "epoch": 1726} {"train_loss": -12.000783920288086, "global_step": 290069, "epoch": 1726} {"train_loss": -11.741870880126953, "global_step": 290070, "epoch": 1726} {"train_loss": -11.981813430786133, "global_step": 290071, "epoch": 1726} {"train_loss": -12.147253036499023, "global_step": 290072, "epoch": 1726} {"train_loss": -11.92650032043457, "global_step": 290073, "epoch": 1726} {"train_loss": -11.980583190917969, "global_step": 290074, "epoch": 1726} {"train_loss": -12.240029335021973, "global_step": 290075, "epoch": 1726} {"train_loss": -11.98255443572998, "global_step": 290076, "epoch": 1726} {"train_loss": -12.206684112548828, "global_step": 290077, "epoch": 1726} {"train_loss": -12.016261100769043, "global_step": 290078, "epoch": 1726} {"train_loss": -12.078474998474121, "global_step": 290079, "epoch": 1726} {"train_loss": -12.109685897827148, "global_step": 290080, "epoch": 1726} {"train_loss": -11.917867660522461, "global_step": 290081, "epoch": 1726} {"train_loss": -12.075923919677734, "global_step": 290082, "epoch": 1726} {"train_loss": -11.945511817932129, "global_step": 290083, "epoch": 1726} {"train_loss": -12.023305892944336, "global_step": 290084, "epoch": 1726} {"train_loss": -11.920858383178711, "global_step": 290085, "epoch": 1726} {"train_loss": -12.00129222869873, "global_step": 290086, "epoch": 1726} {"train_loss": -12.048458099365234, "global_step": 290087, "epoch": 1726} {"train_loss": -12.041982650756836, "global_step": 290088, "epoch": 1726} {"train_loss": -11.974637985229492, "global_step": 290089, "epoch": 1726} {"train_loss": -12.09614372253418, "global_step": 290090, "epoch": 1726} {"train_loss": -12.256400108337402, "global_step": 290091, "epoch": 1726} {"train_loss": -12.181984901428223, "global_step": 290092, "epoch": 1726} {"train_loss": -12.032944679260254, "global_step": 290093, "epoch": 1726} {"train_loss": -12.241063117980957, "global_step": 290094, "epoch": 1726} {"train_loss": -12.222902297973633, "global_step": 290095, "epoch": 1726} {"train_loss": -12.064082145690918, "global_step": 290096, "epoch": 1726} {"train_loss": -12.165596008300781, "global_step": 290097, "epoch": 1726} {"train_loss": -12.300195693969727, "global_step": 290098, "epoch": 1726} {"train_loss": -12.163421630859375, "global_step": 290099, "epoch": 1726} {"train_loss": -12.22400951385498, "global_step": 290100, "epoch": 1726} {"train_loss": -12.340262413024902, "global_step": 290101, "epoch": 1726} {"train_loss": -12.298542022705078, "global_step": 290102, "epoch": 1726} {"train_loss": -12.33975887298584, "global_step": 290103, "epoch": 1726} {"train_loss": -12.425241470336914, "global_step": 290104, "epoch": 1726} {"train_loss": -12.144086837768555, "global_step": 290105, "epoch": 1726} {"train_loss": -12.427602767944336, "global_step": 290106, "epoch": 1726} {"train_loss": -12.146859169006348, "global_step": 290107, "epoch": 1726} {"train_loss": -12.320512771606445, "global_step": 290108, "epoch": 1726} {"train_loss": -12.132942199707031, "global_step": 290109, "epoch": 1726} {"train_loss": -12.337251663208008, "global_step": 290110, "epoch": 1726} {"train_loss": -12.424219131469727, "global_step": 290111, "epoch": 1726} {"train_loss": -12.22115421295166, "global_step": 290112, "epoch": 1726} {"train_loss": -12.341894149780273, "global_step": 290113, "epoch": 1726} {"train_loss": -12.212632179260254, "global_step": 290114, "epoch": 1726} {"train_loss": -12.302168846130371, "global_step": 290115, "epoch": 1726} {"train_loss": -12.323183059692383, "global_step": 290116, "epoch": 1726} {"train_loss": -12.389522552490234, "global_step": 290117, "epoch": 1726} {"train_loss": -12.25350570678711, "global_step": 290118, "epoch": 1726} {"train_loss": -12.244041442871094, "global_step": 290119, "epoch": 1726} {"train_loss": -12.390707969665527, "global_step": 290120, "epoch": 1726} {"train_loss": -12.118478775024414, "global_step": 290121, "epoch": 1726} {"train_loss": -12.03469467163086, "global_step": 290122, "epoch": 1726} {"train_loss": -11.70065689086914, "global_step": 290123, "epoch": 1726} {"train_loss": -12.030738830566406, "global_step": 290124, "epoch": 1726} {"train_loss": -12.199127197265625, "global_step": 290125, "epoch": 1726} {"train_loss": -12.205323219299316, "global_step": 290126, "epoch": 1726} {"train_loss": -12.248762130737305, "global_step": 290127, "epoch": 1726} {"train_loss": -12.244743347167969, "global_step": 290128, "epoch": 1726} {"train_loss": -12.312740325927734, "global_step": 290129, "epoch": 1726} {"train_loss": -11.999412536621094, "global_step": 290130, "epoch": 1726} {"train_loss": -12.279380798339844, "global_step": 290131, "epoch": 1726} {"train_loss": -12.477871894836426, "global_step": 290132, "epoch": 1726} {"train_loss": -12.321958541870117, "global_step": 290133, "epoch": 1726} {"train_loss": -12.478978157043457, "global_step": 290134, "epoch": 1726} {"train_loss": -11.547983132657551, "global_step": 290135, "epoch": 1726, "val_loss": 274278.53125} {"train_loss": -12.267452239990234, "global_step": 290136, "epoch": 1727} {"train_loss": -11.388446807861328, "global_step": 290137, "epoch": 1727} {"train_loss": -11.783106803894043, "global_step": 290138, "epoch": 1727} {"train_loss": -11.20163345336914, "global_step": 290139, "epoch": 1727} {"train_loss": -11.69328498840332, "global_step": 290140, "epoch": 1727} {"train_loss": -11.511516571044922, "global_step": 290141, "epoch": 1727} {"train_loss": -11.80029582977295, "global_step": 290142, "epoch": 1727} {"train_loss": -11.13762092590332, "global_step": 290143, "epoch": 1727} {"train_loss": -10.965555191040039, "global_step": 290144, "epoch": 1727} {"train_loss": -9.066585540771484, "global_step": 290145, "epoch": 1727} {"train_loss": -10.335655212402344, "global_step": 290146, "epoch": 1727} {"train_loss": -8.475549697875977, "global_step": 290147, "epoch": 1727} {"train_loss": -8.628275871276855, "global_step": 290148, "epoch": 1727} {"train_loss": -8.325247764587402, "global_step": 290149, "epoch": 1727} {"train_loss": -9.110377311706543, "global_step": 290150, "epoch": 1727} {"train_loss": -10.031050682067871, "global_step": 290151, "epoch": 1727} {"train_loss": -9.625391960144043, "global_step": 290152, "epoch": 1727} {"train_loss": -9.311376571655273, "global_step": 290153, "epoch": 1727} {"train_loss": -9.95914077758789, "global_step": 290154, "epoch": 1727} {"train_loss": -11.066488265991211, "global_step": 290155, "epoch": 1727} {"train_loss": -11.518638610839844, "global_step": 290156, "epoch": 1727} {"train_loss": -11.292854309082031, "global_step": 290157, "epoch": 1727} {"train_loss": -10.047945022583008, "global_step": 290158, "epoch": 1727} {"train_loss": -10.219096183776855, "global_step": 290159, "epoch": 1727} {"train_loss": -10.669940948486328, "global_step": 290160, "epoch": 1727} {"train_loss": -10.687172889709473, "global_step": 290161, "epoch": 1727} {"train_loss": -10.875551223754883, "global_step": 290162, "epoch": 1727} {"train_loss": -11.088787078857422, "global_step": 290163, "epoch": 1727} {"train_loss": -11.081160545349121, "global_step": 290164, "epoch": 1727} {"train_loss": -10.841301918029785, "global_step": 290165, "epoch": 1727} {"train_loss": -11.186532974243164, "global_step": 290166, "epoch": 1727} {"train_loss": -10.221633911132812, "global_step": 290167, "epoch": 1727} {"train_loss": -10.847373962402344, "global_step": 290168, "epoch": 1727} {"train_loss": -10.854724884033203, "global_step": 290169, "epoch": 1727} {"train_loss": -11.268041610717773, "global_step": 290170, "epoch": 1727} {"train_loss": -10.46261215209961, "global_step": 290171, "epoch": 1727} {"train_loss": -10.81846809387207, "global_step": 290172, "epoch": 1727} {"train_loss": -10.620719909667969, "global_step": 290173, "epoch": 1727} {"train_loss": -11.07525634765625, "global_step": 290174, "epoch": 1727} {"train_loss": -10.816903114318848, "global_step": 290175, "epoch": 1727} {"train_loss": -10.569988250732422, "global_step": 290176, "epoch": 1727} {"train_loss": -11.53610897064209, "global_step": 290177, "epoch": 1727} {"train_loss": -10.73748779296875, "global_step": 290178, "epoch": 1727} {"train_loss": -11.148396492004395, "global_step": 290179, "epoch": 1727} {"train_loss": -11.027193069458008, "global_step": 290180, "epoch": 1727} {"train_loss": -10.613984107971191, "global_step": 290181, "epoch": 1727} {"train_loss": -11.221076965332031, "global_step": 290182, "epoch": 1727} {"train_loss": -11.233012199401855, "global_step": 290183, "epoch": 1727} {"train_loss": -11.491559028625488, "global_step": 290184, "epoch": 1727} {"train_loss": -11.14680004119873, "global_step": 290185, "epoch": 1727} {"train_loss": -11.530501365661621, "global_step": 290186, "epoch": 1727} {"train_loss": -11.532873153686523, "global_step": 290187, "epoch": 1727} {"train_loss": -11.146705627441406, "global_step": 290188, "epoch": 1727} {"train_loss": -10.899559020996094, "global_step": 290189, "epoch": 1727} {"train_loss": -11.59572982788086, "global_step": 290190, "epoch": 1727} {"train_loss": -11.283717155456543, "global_step": 290191, "epoch": 1727} {"train_loss": -11.724519729614258, "global_step": 290192, "epoch": 1727} {"train_loss": -11.451362609863281, "global_step": 290193, "epoch": 1727} {"train_loss": -11.308181762695312, "global_step": 290194, "epoch": 1727} {"train_loss": -11.59848403930664, "global_step": 290195, "epoch": 1727} {"train_loss": -11.705471992492676, "global_step": 290196, "epoch": 1727} {"train_loss": -11.553586959838867, "global_step": 290197, "epoch": 1727} {"train_loss": -11.652016639709473, "global_step": 290198, "epoch": 1727} {"train_loss": -11.70585823059082, "global_step": 290199, "epoch": 1727} {"train_loss": -11.655163764953613, "global_step": 290200, "epoch": 1727} {"train_loss": -11.91453742980957, "global_step": 290201, "epoch": 1727} {"train_loss": -11.868626594543457, "global_step": 290202, "epoch": 1727} {"train_loss": -11.664525032043457, "global_step": 290203, "epoch": 1727} {"train_loss": -11.616981506347656, "global_step": 290204, "epoch": 1727} {"train_loss": -11.673507690429688, "global_step": 290205, "epoch": 1727} {"train_loss": -11.532697677612305, "global_step": 290206, "epoch": 1727} {"train_loss": -11.770576477050781, "global_step": 290207, "epoch": 1727} {"train_loss": -11.605541229248047, "global_step": 290208, "epoch": 1727} {"train_loss": -11.664011001586914, "global_step": 290209, "epoch": 1727} {"train_loss": -11.731437683105469, "global_step": 290210, "epoch": 1727} {"train_loss": -11.622725486755371, "global_step": 290211, "epoch": 1727} {"train_loss": -11.922466278076172, "global_step": 290212, "epoch": 1727} {"train_loss": -11.818129539489746, "global_step": 290213, "epoch": 1727} {"train_loss": -11.788314819335938, "global_step": 290214, "epoch": 1727} {"train_loss": -11.763496398925781, "global_step": 290215, "epoch": 1727} {"train_loss": -11.618459701538086, "global_step": 290216, "epoch": 1727} {"train_loss": -11.768375396728516, "global_step": 290217, "epoch": 1727} {"train_loss": -11.770584106445312, "global_step": 290218, "epoch": 1727} {"train_loss": -11.654651641845703, "global_step": 290219, "epoch": 1727} {"train_loss": -11.932750701904297, "global_step": 290220, "epoch": 1727} {"train_loss": -11.739355087280273, "global_step": 290221, "epoch": 1727} {"train_loss": -12.062298774719238, "global_step": 290222, "epoch": 1727} {"train_loss": -11.71161937713623, "global_step": 290223, "epoch": 1727} {"train_loss": -11.760409355163574, "global_step": 290224, "epoch": 1727} {"train_loss": -12.086276054382324, "global_step": 290225, "epoch": 1727} {"train_loss": -11.553634643554688, "global_step": 290226, "epoch": 1727} {"train_loss": -12.194830894470215, "global_step": 290227, "epoch": 1727} {"train_loss": -11.635601043701172, "global_step": 290228, "epoch": 1727} {"train_loss": -12.046340942382812, "global_step": 290229, "epoch": 1727} {"train_loss": -11.938912391662598, "global_step": 290230, "epoch": 1727} {"train_loss": -11.85238265991211, "global_step": 290231, "epoch": 1727} {"train_loss": -11.849550247192383, "global_step": 290232, "epoch": 1727} {"train_loss": -11.855022430419922, "global_step": 290233, "epoch": 1727} {"train_loss": -12.046377182006836, "global_step": 290234, "epoch": 1727} {"train_loss": -11.756518363952637, "global_step": 290235, "epoch": 1727} {"train_loss": -12.141691207885742, "global_step": 290236, "epoch": 1727} {"train_loss": -11.928451538085938, "global_step": 290237, "epoch": 1727} {"train_loss": -12.009632110595703, "global_step": 290238, "epoch": 1727} {"train_loss": -11.887333869934082, "global_step": 290239, "epoch": 1727} {"train_loss": -12.05015754699707, "global_step": 290240, "epoch": 1727} {"train_loss": -11.82601547241211, "global_step": 290241, "epoch": 1727} {"train_loss": -11.97125244140625, "global_step": 290242, "epoch": 1727} {"train_loss": -12.142529487609863, "global_step": 290243, "epoch": 1727} {"train_loss": -11.959997177124023, "global_step": 290244, "epoch": 1727} {"train_loss": -11.976879119873047, "global_step": 290245, "epoch": 1727} {"train_loss": -11.995491027832031, "global_step": 290246, "epoch": 1727} {"train_loss": -11.94255256652832, "global_step": 290247, "epoch": 1727} {"train_loss": -11.995131492614746, "global_step": 290248, "epoch": 1727} {"train_loss": -11.55354118347168, "global_step": 290249, "epoch": 1727} {"train_loss": -11.861900329589844, "global_step": 290250, "epoch": 1727} {"train_loss": -11.758913040161133, "global_step": 290251, "epoch": 1727} {"train_loss": -11.527017593383789, "global_step": 290252, "epoch": 1727} {"train_loss": -12.0203275680542, "global_step": 290253, "epoch": 1727} {"train_loss": -11.438892364501953, "global_step": 290254, "epoch": 1727} {"train_loss": -11.506881713867188, "global_step": 290255, "epoch": 1727} {"train_loss": -10.320454597473145, "global_step": 290256, "epoch": 1727} {"train_loss": -11.346162796020508, "global_step": 290257, "epoch": 1727} {"train_loss": -11.251993179321289, "global_step": 290258, "epoch": 1727} {"train_loss": -11.01750373840332, "global_step": 290259, "epoch": 1727} {"train_loss": -11.839008331298828, "global_step": 290260, "epoch": 1727} {"train_loss": -10.102575302124023, "global_step": 290261, "epoch": 1727} {"train_loss": -11.639922142028809, "global_step": 290262, "epoch": 1727} {"train_loss": -10.835750579833984, "global_step": 290263, "epoch": 1727} {"train_loss": -11.353160858154297, "global_step": 290264, "epoch": 1727} {"train_loss": -11.473913192749023, "global_step": 290265, "epoch": 1727} {"train_loss": -11.503616333007812, "global_step": 290266, "epoch": 1727} {"train_loss": -11.072322845458984, "global_step": 290267, "epoch": 1727} {"train_loss": -11.056690216064453, "global_step": 290268, "epoch": 1727} {"train_loss": -11.558305740356445, "global_step": 290269, "epoch": 1727} {"train_loss": -9.922319412231445, "global_step": 290270, "epoch": 1727} {"train_loss": -11.718414306640625, "global_step": 290271, "epoch": 1727} {"train_loss": -10.798439979553223, "global_step": 290272, "epoch": 1727} {"train_loss": -11.512529373168945, "global_step": 290273, "epoch": 1727} {"train_loss": -11.700759887695312, "global_step": 290274, "epoch": 1727} {"train_loss": -11.472646713256836, "global_step": 290275, "epoch": 1727} {"train_loss": -11.95301342010498, "global_step": 290276, "epoch": 1727} {"train_loss": -11.741376876831055, "global_step": 290277, "epoch": 1727} {"train_loss": -12.026144027709961, "global_step": 290278, "epoch": 1727} {"train_loss": -11.992741584777832, "global_step": 290279, "epoch": 1727} {"train_loss": -12.018301010131836, "global_step": 290280, "epoch": 1727} {"train_loss": -12.215047836303711, "global_step": 290281, "epoch": 1727} {"train_loss": -12.18645191192627, "global_step": 290282, "epoch": 1727} {"train_loss": -12.089115142822266, "global_step": 290283, "epoch": 1727} {"train_loss": -11.791962623596191, "global_step": 290284, "epoch": 1727} {"train_loss": -11.94568920135498, "global_step": 290285, "epoch": 1727} {"train_loss": -11.972311019897461, "global_step": 290286, "epoch": 1727} {"train_loss": -11.933626174926758, "global_step": 290287, "epoch": 1727} {"train_loss": -12.129485130310059, "global_step": 290288, "epoch": 1727} {"train_loss": -12.049383163452148, "global_step": 290289, "epoch": 1727} {"train_loss": -12.1748046875, "global_step": 290290, "epoch": 1727} {"train_loss": -12.065399169921875, "global_step": 290291, "epoch": 1727} {"train_loss": -12.282129287719727, "global_step": 290292, "epoch": 1727} {"train_loss": -12.289549827575684, "global_step": 290293, "epoch": 1727} {"train_loss": -12.160574913024902, "global_step": 290294, "epoch": 1727} {"train_loss": -11.978851318359375, "global_step": 290295, "epoch": 1727} {"train_loss": -12.17379379272461, "global_step": 290296, "epoch": 1727} {"train_loss": -12.321186065673828, "global_step": 290297, "epoch": 1727} {"train_loss": -12.196303367614746, "global_step": 290298, "epoch": 1727} {"train_loss": -12.146303176879883, "global_step": 290299, "epoch": 1727} {"train_loss": -12.212640762329102, "global_step": 290300, "epoch": 1727} {"train_loss": -12.180268287658691, "global_step": 290301, "epoch": 1727} {"train_loss": -12.190969467163086, "global_step": 290302, "epoch": 1727} {"train_loss": -11.427221786408197, "global_step": 290303, "epoch": 1727, "val_loss": 271884.1875} {"train_loss": -12.174392700195312, "global_step": 290304, "epoch": 1728} {"train_loss": -12.297210693359375, "global_step": 290305, "epoch": 1728} {"train_loss": -12.160627365112305, "global_step": 290306, "epoch": 1728} {"train_loss": -12.272987365722656, "global_step": 290307, "epoch": 1728} {"train_loss": -12.02182388305664, "global_step": 290308, "epoch": 1728} {"train_loss": -12.257426261901855, "global_step": 290309, "epoch": 1728} {"train_loss": -12.125673294067383, "global_step": 290310, "epoch": 1728} {"train_loss": -12.332992553710938, "global_step": 290311, "epoch": 1728} {"train_loss": -11.98725700378418, "global_step": 290312, "epoch": 1728} {"train_loss": -12.218955993652344, "global_step": 290313, "epoch": 1728} {"train_loss": -12.038385391235352, "global_step": 290314, "epoch": 1728} {"train_loss": -12.131099700927734, "global_step": 290315, "epoch": 1728} {"train_loss": -12.062918663024902, "global_step": 290316, "epoch": 1728} {"train_loss": -12.21615219116211, "global_step": 290317, "epoch": 1728} {"train_loss": -11.918891906738281, "global_step": 290318, "epoch": 1728} {"train_loss": -12.094189643859863, "global_step": 290319, "epoch": 1728} {"train_loss": -11.68514633178711, "global_step": 290320, "epoch": 1728} {"train_loss": -11.357908248901367, "global_step": 290321, "epoch": 1728} {"train_loss": -12.133532524108887, "global_step": 290322, "epoch": 1728} {"train_loss": -11.276374816894531, "global_step": 290323, "epoch": 1728} {"train_loss": -11.477386474609375, "global_step": 290324, "epoch": 1728} {"train_loss": -11.982112884521484, "global_step": 290325, "epoch": 1728} {"train_loss": -11.196609497070312, "global_step": 290326, "epoch": 1728} {"train_loss": -11.637588500976562, "global_step": 290327, "epoch": 1728} {"train_loss": -11.12016773223877, "global_step": 290328, "epoch": 1728} {"train_loss": -12.198508262634277, "global_step": 290329, "epoch": 1728} {"train_loss": -10.575811386108398, "global_step": 290330, "epoch": 1728} {"train_loss": -11.492664337158203, "global_step": 290331, "epoch": 1728} {"train_loss": -11.876114845275879, "global_step": 290332, "epoch": 1728} {"train_loss": -11.640239715576172, "global_step": 290333, "epoch": 1728} {"train_loss": -11.771153450012207, "global_step": 290334, "epoch": 1728} {"train_loss": -11.580642700195312, "global_step": 290335, "epoch": 1728} {"train_loss": -11.189888000488281, "global_step": 290336, "epoch": 1728} {"train_loss": -10.560380935668945, "global_step": 290337, "epoch": 1728} {"train_loss": -11.558516502380371, "global_step": 290338, "epoch": 1728} {"train_loss": -10.953413009643555, "global_step": 290339, "epoch": 1728} {"train_loss": -8.967656135559082, "global_step": 290340, "epoch": 1728} {"train_loss": -9.947665214538574, "global_step": 290341, "epoch": 1728} {"train_loss": -7.76406192779541, "global_step": 290342, "epoch": 1728} {"train_loss": -7.486822128295898, "global_step": 290343, "epoch": 1728} {"train_loss": -8.746447563171387, "global_step": 290344, "epoch": 1728} {"train_loss": -8.663202285766602, "global_step": 290345, "epoch": 1728} {"train_loss": -9.965861320495605, "global_step": 290346, "epoch": 1728} {"train_loss": -9.567691802978516, "global_step": 290347, "epoch": 1728} {"train_loss": -8.182731628417969, "global_step": 290348, "epoch": 1728} {"train_loss": -9.32756519317627, "global_step": 290349, "epoch": 1728} {"train_loss": -10.109635353088379, "global_step": 290350, "epoch": 1728} {"train_loss": -10.398859977722168, "global_step": 290351, "epoch": 1728} {"train_loss": -10.43222427368164, "global_step": 290352, "epoch": 1728} {"train_loss": -10.800516128540039, "global_step": 290353, "epoch": 1728} {"train_loss": -10.38801097869873, "global_step": 290354, "epoch": 1728} {"train_loss": -10.783182144165039, "global_step": 290355, "epoch": 1728} {"train_loss": -10.615501403808594, "global_step": 290356, "epoch": 1728} {"train_loss": -10.661022186279297, "global_step": 290357, "epoch": 1728} {"train_loss": -11.075836181640625, "global_step": 290358, "epoch": 1728} {"train_loss": -11.022367477416992, "global_step": 290359, "epoch": 1728} {"train_loss": -11.169057846069336, "global_step": 290360, "epoch": 1728} {"train_loss": -10.459656715393066, "global_step": 290361, "epoch": 1728} {"train_loss": -10.969762802124023, "global_step": 290362, "epoch": 1728} {"train_loss": -11.319162368774414, "global_step": 290363, "epoch": 1728} {"train_loss": -11.055679321289062, "global_step": 290364, "epoch": 1728} {"train_loss": -10.696913719177246, "global_step": 290365, "epoch": 1728} {"train_loss": -10.980466842651367, "global_step": 290366, "epoch": 1728} {"train_loss": -11.123062133789062, "global_step": 290367, "epoch": 1728} {"train_loss": -11.373560905456543, "global_step": 290368, "epoch": 1728} {"train_loss": -11.489425659179688, "global_step": 290369, "epoch": 1728} {"train_loss": -11.609322547912598, "global_step": 290370, "epoch": 1728} {"train_loss": -11.440903663635254, "global_step": 290371, "epoch": 1728} {"train_loss": -11.868196487426758, "global_step": 290372, "epoch": 1728} {"train_loss": -11.338357925415039, "global_step": 290373, "epoch": 1728} {"train_loss": -11.630020141601562, "global_step": 290374, "epoch": 1728} {"train_loss": -11.578917503356934, "global_step": 290375, "epoch": 1728} {"train_loss": -11.80746078491211, "global_step": 290376, "epoch": 1728} {"train_loss": -11.419609069824219, "global_step": 290377, "epoch": 1728} {"train_loss": -12.008855819702148, "global_step": 290378, "epoch": 1728} {"train_loss": -11.660845756530762, "global_step": 290379, "epoch": 1728} {"train_loss": -11.675399780273438, "global_step": 290380, "epoch": 1728} {"train_loss": -11.792057037353516, "global_step": 290381, "epoch": 1728} {"train_loss": -11.62832260131836, "global_step": 290382, "epoch": 1728} {"train_loss": -11.970735549926758, "global_step": 290383, "epoch": 1728} {"train_loss": -11.69163990020752, "global_step": 290384, "epoch": 1728} {"train_loss": -11.618769645690918, "global_step": 290385, "epoch": 1728} {"train_loss": -11.704252243041992, "global_step": 290386, "epoch": 1728} {"train_loss": -11.928346633911133, "global_step": 290387, "epoch": 1728} {"train_loss": -11.8990478515625, "global_step": 290388, "epoch": 1728} {"train_loss": -11.825772285461426, "global_step": 290389, "epoch": 1728} {"train_loss": -12.03731918334961, "global_step": 290390, "epoch": 1728} {"train_loss": -11.74699878692627, "global_step": 290391, "epoch": 1728} {"train_loss": -11.769577026367188, "global_step": 290392, "epoch": 1728} {"train_loss": -12.1472806930542, "global_step": 290393, "epoch": 1728} {"train_loss": -11.92391300201416, "global_step": 290394, "epoch": 1728} {"train_loss": -12.0745849609375, "global_step": 290395, "epoch": 1728} {"train_loss": -11.945064544677734, "global_step": 290396, "epoch": 1728} {"train_loss": -11.869658470153809, "global_step": 290397, "epoch": 1728} {"train_loss": -11.720863342285156, "global_step": 290398, "epoch": 1728} {"train_loss": -11.997198104858398, "global_step": 290399, "epoch": 1728} {"train_loss": -11.991411209106445, "global_step": 290400, "epoch": 1728} {"train_loss": -11.90139389038086, "global_step": 290401, "epoch": 1728} {"train_loss": -11.993545532226562, "global_step": 290402, "epoch": 1728} {"train_loss": -11.934588432312012, "global_step": 290403, "epoch": 1728} {"train_loss": -11.954412460327148, "global_step": 290404, "epoch": 1728} {"train_loss": -12.106115341186523, "global_step": 290405, "epoch": 1728} {"train_loss": -11.96956729888916, "global_step": 290406, "epoch": 1728} {"train_loss": -11.96216106414795, "global_step": 290407, "epoch": 1728} {"train_loss": -12.073183059692383, "global_step": 290408, "epoch": 1728} {"train_loss": -12.118512153625488, "global_step": 290409, "epoch": 1728} {"train_loss": -12.166680335998535, "global_step": 290410, "epoch": 1728} {"train_loss": -12.139148712158203, "global_step": 290411, "epoch": 1728} {"train_loss": -12.043830871582031, "global_step": 290412, "epoch": 1728} {"train_loss": -12.138262748718262, "global_step": 290413, "epoch": 1728} {"train_loss": -12.17845344543457, "global_step": 290414, "epoch": 1728} {"train_loss": -12.087108612060547, "global_step": 290415, "epoch": 1728} {"train_loss": -12.182559967041016, "global_step": 290416, "epoch": 1728} {"train_loss": -12.181926727294922, "global_step": 290417, "epoch": 1728} {"train_loss": -12.34237289428711, "global_step": 290418, "epoch": 1728} {"train_loss": -12.21285343170166, "global_step": 290419, "epoch": 1728} {"train_loss": -12.168216705322266, "global_step": 290420, "epoch": 1728} {"train_loss": -12.400701522827148, "global_step": 290421, "epoch": 1728} {"train_loss": -12.023271560668945, "global_step": 290422, "epoch": 1728} {"train_loss": -12.238231658935547, "global_step": 290423, "epoch": 1728} {"train_loss": -12.226441383361816, "global_step": 290424, "epoch": 1728} {"train_loss": -12.384149551391602, "global_step": 290425, "epoch": 1728} {"train_loss": -12.139592170715332, "global_step": 290426, "epoch": 1728} {"train_loss": -12.110246658325195, "global_step": 290427, "epoch": 1728} {"train_loss": -11.99478816986084, "global_step": 290428, "epoch": 1728} {"train_loss": -12.149545669555664, "global_step": 290429, "epoch": 1728} {"train_loss": -11.810652732849121, "global_step": 290430, "epoch": 1728} {"train_loss": -12.250944137573242, "global_step": 290431, "epoch": 1728} {"train_loss": -11.8076753616333, "global_step": 290432, "epoch": 1728} {"train_loss": -11.854263305664062, "global_step": 290433, "epoch": 1728} {"train_loss": -12.087151527404785, "global_step": 290434, "epoch": 1728} {"train_loss": -11.831310272216797, "global_step": 290435, "epoch": 1728} {"train_loss": -12.209022521972656, "global_step": 290436, "epoch": 1728} {"train_loss": -12.022237777709961, "global_step": 290437, "epoch": 1728} {"train_loss": -12.34351921081543, "global_step": 290438, "epoch": 1728} {"train_loss": -12.034366607666016, "global_step": 290439, "epoch": 1728} {"train_loss": -11.973583221435547, "global_step": 290440, "epoch": 1728} {"train_loss": -11.757539749145508, "global_step": 290441, "epoch": 1728} {"train_loss": -11.851165771484375, "global_step": 290442, "epoch": 1728} {"train_loss": -12.183950424194336, "global_step": 290443, "epoch": 1728} {"train_loss": -11.734292030334473, "global_step": 290444, "epoch": 1728} {"train_loss": -12.435478210449219, "global_step": 290445, "epoch": 1728} {"train_loss": -12.071571350097656, "global_step": 290446, "epoch": 1728} {"train_loss": -11.924400329589844, "global_step": 290447, "epoch": 1728} {"train_loss": -12.157912254333496, "global_step": 290448, "epoch": 1728} {"train_loss": -11.821462631225586, "global_step": 290449, "epoch": 1728} {"train_loss": -12.412763595581055, "global_step": 290450, "epoch": 1728} {"train_loss": -11.89910888671875, "global_step": 290451, "epoch": 1728} {"train_loss": -12.058241844177246, "global_step": 290452, "epoch": 1728} {"train_loss": -11.811970710754395, "global_step": 290453, "epoch": 1728} {"train_loss": -11.999517440795898, "global_step": 290454, "epoch": 1728} {"train_loss": -11.955694198608398, "global_step": 290455, "epoch": 1728} {"train_loss": -12.214406967163086, "global_step": 290456, "epoch": 1728} {"train_loss": -11.995929718017578, "global_step": 290457, "epoch": 1728} {"train_loss": -12.353325843811035, "global_step": 290458, "epoch": 1728} {"train_loss": -11.89875602722168, "global_step": 290459, "epoch": 1728} {"train_loss": -11.50240707397461, "global_step": 290460, "epoch": 1728} {"train_loss": -11.333250999450684, "global_step": 290461, "epoch": 1728} {"train_loss": -12.311208724975586, "global_step": 290462, "epoch": 1728} {"train_loss": -11.441940307617188, "global_step": 290463, "epoch": 1728} {"train_loss": -10.575937271118164, "global_step": 290464, "epoch": 1728} {"train_loss": -11.367032051086426, "global_step": 290465, "epoch": 1728} {"train_loss": -12.164361953735352, "global_step": 290466, "epoch": 1728} {"train_loss": -11.68021011352539, "global_step": 290467, "epoch": 1728} {"train_loss": -11.525940895080566, "global_step": 290468, "epoch": 1728} {"train_loss": -11.35098648071289, "global_step": 290469, "epoch": 1728} {"train_loss": -11.218942642211914, "global_step": 290470, "epoch": 1728} {"train_loss": -11.56159092131115, "global_step": 290471, "epoch": 1728, "val_loss": 274456.9375} {"train_loss": -11.002222061157227, "global_step": 290472, "epoch": 1729} {"train_loss": -8.822367668151855, "global_step": 290473, "epoch": 1729} {"train_loss": -9.356793403625488, "global_step": 290474, "epoch": 1729} {"train_loss": -9.952213287353516, "global_step": 290475, "epoch": 1729} {"train_loss": -8.760284423828125, "global_step": 290476, "epoch": 1729} {"train_loss": -8.971944808959961, "global_step": 290477, "epoch": 1729} {"train_loss": -10.184122085571289, "global_step": 290478, "epoch": 1729} {"train_loss": -10.211875915527344, "global_step": 290479, "epoch": 1729} {"train_loss": -10.208702087402344, "global_step": 290480, "epoch": 1729} {"train_loss": -9.776521682739258, "global_step": 290481, "epoch": 1729} {"train_loss": -10.390771865844727, "global_step": 290482, "epoch": 1729} {"train_loss": -10.039508819580078, "global_step": 290483, "epoch": 1729} {"train_loss": -10.573864936828613, "global_step": 290484, "epoch": 1729} {"train_loss": -10.816425323486328, "global_step": 290485, "epoch": 1729} {"train_loss": -11.329763412475586, "global_step": 290486, "epoch": 1729} {"train_loss": -10.993846893310547, "global_step": 290487, "epoch": 1729} {"train_loss": -11.576019287109375, "global_step": 290488, "epoch": 1729} {"train_loss": -10.973760604858398, "global_step": 290489, "epoch": 1729} {"train_loss": -11.451608657836914, "global_step": 290490, "epoch": 1729} {"train_loss": -11.263065338134766, "global_step": 290491, "epoch": 1729} {"train_loss": -10.756315231323242, "global_step": 290492, "epoch": 1729} {"train_loss": -11.62765884399414, "global_step": 290493, "epoch": 1729} {"train_loss": -10.713254928588867, "global_step": 290494, "epoch": 1729} {"train_loss": -11.727089881896973, "global_step": 290495, "epoch": 1729} {"train_loss": -10.963767051696777, "global_step": 290496, "epoch": 1729} {"train_loss": -11.528250694274902, "global_step": 290497, "epoch": 1729} {"train_loss": -11.703948974609375, "global_step": 290498, "epoch": 1729} {"train_loss": -11.53448486328125, "global_step": 290499, "epoch": 1729} {"train_loss": -11.630304336547852, "global_step": 290500, "epoch": 1729} {"train_loss": -11.692657470703125, "global_step": 290501, "epoch": 1729} {"train_loss": -11.648910522460938, "global_step": 290502, "epoch": 1729} {"train_loss": -11.846099853515625, "global_step": 290503, "epoch": 1729} {"train_loss": -11.553242683410645, "global_step": 290504, "epoch": 1729} {"train_loss": -11.790620803833008, "global_step": 290505, "epoch": 1729} {"train_loss": -11.854419708251953, "global_step": 290506, "epoch": 1729} {"train_loss": -11.907663345336914, "global_step": 290507, "epoch": 1729} {"train_loss": -11.9782133102417, "global_step": 290508, "epoch": 1729} {"train_loss": -11.803176879882812, "global_step": 290509, "epoch": 1729} {"train_loss": -11.726680755615234, "global_step": 290510, "epoch": 1729} {"train_loss": -11.708794593811035, "global_step": 290511, "epoch": 1729} {"train_loss": -11.582489013671875, "global_step": 290512, "epoch": 1729} {"train_loss": -12.1217041015625, "global_step": 290513, "epoch": 1729} {"train_loss": -11.84934139251709, "global_step": 290514, "epoch": 1729} {"train_loss": -12.130062103271484, "global_step": 290515, "epoch": 1729} {"train_loss": -11.957148551940918, "global_step": 290516, "epoch": 1729} {"train_loss": -11.844077110290527, "global_step": 290517, "epoch": 1729} {"train_loss": -12.151884078979492, "global_step": 290518, "epoch": 1729} {"train_loss": -11.898551940917969, "global_step": 290519, "epoch": 1729} {"train_loss": -12.0201416015625, "global_step": 290520, "epoch": 1729} {"train_loss": -12.23390007019043, "global_step": 290521, "epoch": 1729} {"train_loss": -12.224105834960938, "global_step": 290522, "epoch": 1729} {"train_loss": -12.274590492248535, "global_step": 290523, "epoch": 1729} {"train_loss": -12.285734176635742, "global_step": 290524, "epoch": 1729} {"train_loss": -12.174263000488281, "global_step": 290525, "epoch": 1729} {"train_loss": -12.07884407043457, "global_step": 290526, "epoch": 1729} {"train_loss": -12.25051212310791, "global_step": 290527, "epoch": 1729} {"train_loss": -12.181863784790039, "global_step": 290528, "epoch": 1729} {"train_loss": -11.949113845825195, "global_step": 290529, "epoch": 1729} {"train_loss": -12.296141624450684, "global_step": 290530, "epoch": 1729} {"train_loss": -12.125357627868652, "global_step": 290531, "epoch": 1729} {"train_loss": -12.188810348510742, "global_step": 290532, "epoch": 1729} {"train_loss": -12.370597839355469, "global_step": 290533, "epoch": 1729} {"train_loss": -12.27934455871582, "global_step": 290534, "epoch": 1729} {"train_loss": -12.288816452026367, "global_step": 290535, "epoch": 1729} {"train_loss": -12.020774841308594, "global_step": 290536, "epoch": 1729} {"train_loss": -12.235587120056152, "global_step": 290537, "epoch": 1729} {"train_loss": -12.188746452331543, "global_step": 290538, "epoch": 1729} {"train_loss": -12.023967742919922, "global_step": 290539, "epoch": 1729} {"train_loss": -12.241469383239746, "global_step": 290540, "epoch": 1729} {"train_loss": -12.207231521606445, "global_step": 290541, "epoch": 1729} {"train_loss": -12.042095184326172, "global_step": 290542, "epoch": 1729} {"train_loss": -12.298280715942383, "global_step": 290543, "epoch": 1729} {"train_loss": -11.779145240783691, "global_step": 290544, "epoch": 1729} {"train_loss": -12.249130249023438, "global_step": 290545, "epoch": 1729} {"train_loss": -12.065704345703125, "global_step": 290546, "epoch": 1729} {"train_loss": -12.036543846130371, "global_step": 290547, "epoch": 1729} {"train_loss": -12.16880989074707, "global_step": 290548, "epoch": 1729} {"train_loss": -11.833795547485352, "global_step": 290549, "epoch": 1729} {"train_loss": -12.373594284057617, "global_step": 290550, "epoch": 1729} {"train_loss": -11.801820755004883, "global_step": 290551, "epoch": 1729} {"train_loss": -12.071976661682129, "global_step": 290552, "epoch": 1729} {"train_loss": -12.207636833190918, "global_step": 290553, "epoch": 1729} {"train_loss": -11.854978561401367, "global_step": 290554, "epoch": 1729} {"train_loss": -12.511305809020996, "global_step": 290555, "epoch": 1729} {"train_loss": -11.869943618774414, "global_step": 290556, "epoch": 1729} {"train_loss": -12.206798553466797, "global_step": 290557, "epoch": 1729} {"train_loss": -12.33206558227539, "global_step": 290558, "epoch": 1729} {"train_loss": -12.325899124145508, "global_step": 290559, "epoch": 1729} {"train_loss": -12.185174942016602, "global_step": 290560, "epoch": 1729} {"train_loss": -12.305197715759277, "global_step": 290561, "epoch": 1729} {"train_loss": -11.817588806152344, "global_step": 290562, "epoch": 1729} {"train_loss": -12.18240737915039, "global_step": 290563, "epoch": 1729} {"train_loss": -12.257001876831055, "global_step": 290564, "epoch": 1729} {"train_loss": -11.656373977661133, "global_step": 290565, "epoch": 1729} {"train_loss": -11.848621368408203, "global_step": 290566, "epoch": 1729} {"train_loss": -12.305006980895996, "global_step": 290567, "epoch": 1729} {"train_loss": -11.609992027282715, "global_step": 290568, "epoch": 1729} {"train_loss": -12.178960800170898, "global_step": 290569, "epoch": 1729} {"train_loss": -11.563469886779785, "global_step": 290570, "epoch": 1729} {"train_loss": -10.921375274658203, "global_step": 290571, "epoch": 1729} {"train_loss": -12.084096908569336, "global_step": 290572, "epoch": 1729} {"train_loss": -11.311376571655273, "global_step": 290573, "epoch": 1729} {"train_loss": -11.058487892150879, "global_step": 290574, "epoch": 1729} {"train_loss": -11.744340896606445, "global_step": 290575, "epoch": 1729} {"train_loss": -11.62412166595459, "global_step": 290576, "epoch": 1729} {"train_loss": -12.087606430053711, "global_step": 290577, "epoch": 1729} {"train_loss": -11.889469146728516, "global_step": 290578, "epoch": 1729} {"train_loss": -11.60426139831543, "global_step": 290579, "epoch": 1729} {"train_loss": -12.034317016601562, "global_step": 290580, "epoch": 1729} {"train_loss": -11.770158767700195, "global_step": 290581, "epoch": 1729} {"train_loss": -12.08301830291748, "global_step": 290582, "epoch": 1729} {"train_loss": -12.04442024230957, "global_step": 290583, "epoch": 1729} {"train_loss": -11.762174606323242, "global_step": 290584, "epoch": 1729} {"train_loss": -11.770279884338379, "global_step": 290585, "epoch": 1729} {"train_loss": -11.839790344238281, "global_step": 290586, "epoch": 1729} {"train_loss": -12.014156341552734, "global_step": 290587, "epoch": 1729} {"train_loss": -12.044561386108398, "global_step": 290588, "epoch": 1729} {"train_loss": -11.714105606079102, "global_step": 290589, "epoch": 1729} {"train_loss": -12.356765747070312, "global_step": 290590, "epoch": 1729} {"train_loss": -12.128504753112793, "global_step": 290591, "epoch": 1729} {"train_loss": -12.099334716796875, "global_step": 290592, "epoch": 1729} {"train_loss": -12.228350639343262, "global_step": 290593, "epoch": 1729} {"train_loss": -11.670635223388672, "global_step": 290594, "epoch": 1729} {"train_loss": -12.319398880004883, "global_step": 290595, "epoch": 1729} {"train_loss": -12.270181655883789, "global_step": 290596, "epoch": 1729} {"train_loss": -11.949999809265137, "global_step": 290597, "epoch": 1729} {"train_loss": -11.988677978515625, "global_step": 290598, "epoch": 1729} {"train_loss": -11.818660736083984, "global_step": 290599, "epoch": 1729} {"train_loss": -11.90552806854248, "global_step": 290600, "epoch": 1729} {"train_loss": -11.681242942810059, "global_step": 290601, "epoch": 1729} {"train_loss": -11.357962608337402, "global_step": 290602, "epoch": 1729} {"train_loss": -11.633157730102539, "global_step": 290603, "epoch": 1729} {"train_loss": -11.687176704406738, "global_step": 290604, "epoch": 1729} {"train_loss": -11.502948760986328, "global_step": 290605, "epoch": 1729} {"train_loss": -11.986382484436035, "global_step": 290606, "epoch": 1729} {"train_loss": -11.604718208312988, "global_step": 290607, "epoch": 1729} {"train_loss": -11.752519607543945, "global_step": 290608, "epoch": 1729} {"train_loss": -11.541221618652344, "global_step": 290609, "epoch": 1729} {"train_loss": -11.320308685302734, "global_step": 290610, "epoch": 1729} {"train_loss": -11.723600387573242, "global_step": 290611, "epoch": 1729} {"train_loss": -11.631099700927734, "global_step": 290612, "epoch": 1729} {"train_loss": -11.469193458557129, "global_step": 290613, "epoch": 1729} {"train_loss": -11.901077270507812, "global_step": 290614, "epoch": 1729} {"train_loss": -11.685052871704102, "global_step": 290615, "epoch": 1729} {"train_loss": -11.738992691040039, "global_step": 290616, "epoch": 1729} {"train_loss": -11.730810165405273, "global_step": 290617, "epoch": 1729} {"train_loss": -11.649538040161133, "global_step": 290618, "epoch": 1729} {"train_loss": -11.776122093200684, "global_step": 290619, "epoch": 1729} {"train_loss": -11.916374206542969, "global_step": 290620, "epoch": 1729} {"train_loss": -11.675292015075684, "global_step": 290621, "epoch": 1729} {"train_loss": -12.20118522644043, "global_step": 290622, "epoch": 1729} {"train_loss": -11.404989242553711, "global_step": 290623, "epoch": 1729} {"train_loss": -11.735333442687988, "global_step": 290624, "epoch": 1729} {"train_loss": -11.160003662109375, "global_step": 290625, "epoch": 1729} {"train_loss": -11.611804962158203, "global_step": 290626, "epoch": 1729} {"train_loss": -10.345331192016602, "global_step": 290627, "epoch": 1729} {"train_loss": -10.856853485107422, "global_step": 290628, "epoch": 1729} {"train_loss": -11.78403091430664, "global_step": 290629, "epoch": 1729} {"train_loss": -10.834755897521973, "global_step": 290630, "epoch": 1729} {"train_loss": -12.138984680175781, "global_step": 290631, "epoch": 1729} {"train_loss": -10.597282409667969, "global_step": 290632, "epoch": 1729} {"train_loss": -11.2003755569458, "global_step": 290633, "epoch": 1729} {"train_loss": -11.014325141906738, "global_step": 290634, "epoch": 1729} {"train_loss": -11.787541389465332, "global_step": 290635, "epoch": 1729} {"train_loss": -10.739706039428711, "global_step": 290636, "epoch": 1729} {"train_loss": -11.378357887268066, "global_step": 290637, "epoch": 1729} {"train_loss": -12.112946510314941, "global_step": 290638, "epoch": 1729} {"train_loss": -11.647609239532834, "global_step": 290639, "epoch": 1729, "val_loss": 277695.21875} {"train_loss": -11.9280424118042, "global_step": 290640, "epoch": 1730} {"train_loss": -11.543834686279297, "global_step": 290641, "epoch": 1730} {"train_loss": -12.118633270263672, "global_step": 290642, "epoch": 1730} {"train_loss": -11.785430908203125, "global_step": 290643, "epoch": 1730} {"train_loss": -11.844682693481445, "global_step": 290644, "epoch": 1730} {"train_loss": -11.337830543518066, "global_step": 290645, "epoch": 1730} {"train_loss": -11.942087173461914, "global_step": 290646, "epoch": 1730} {"train_loss": -11.38498306274414, "global_step": 290647, "epoch": 1730} {"train_loss": -11.193843841552734, "global_step": 290648, "epoch": 1730} {"train_loss": -11.968863487243652, "global_step": 290649, "epoch": 1730} {"train_loss": -11.072839736938477, "global_step": 290650, "epoch": 1730} {"train_loss": -11.844270706176758, "global_step": 290651, "epoch": 1730} {"train_loss": -10.45903205871582, "global_step": 290652, "epoch": 1730} {"train_loss": -11.355918884277344, "global_step": 290653, "epoch": 1730} {"train_loss": -11.518940925598145, "global_step": 290654, "epoch": 1730} {"train_loss": -10.917993545532227, "global_step": 290655, "epoch": 1730} {"train_loss": -11.037694931030273, "global_step": 290656, "epoch": 1730} {"train_loss": -11.261697769165039, "global_step": 290657, "epoch": 1730} {"train_loss": -10.452499389648438, "global_step": 290658, "epoch": 1730} {"train_loss": -10.359966278076172, "global_step": 290659, "epoch": 1730} {"train_loss": -11.76416301727295, "global_step": 290660, "epoch": 1730} {"train_loss": -10.23558521270752, "global_step": 290661, "epoch": 1730} {"train_loss": -11.856882095336914, "global_step": 290662, "epoch": 1730} {"train_loss": -10.654592514038086, "global_step": 290663, "epoch": 1730} {"train_loss": -11.64341926574707, "global_step": 290664, "epoch": 1730} {"train_loss": -11.731459617614746, "global_step": 290665, "epoch": 1730} {"train_loss": -11.653411865234375, "global_step": 290666, "epoch": 1730} {"train_loss": -11.937141418457031, "global_step": 290667, "epoch": 1730} {"train_loss": -11.797165870666504, "global_step": 290668, "epoch": 1730} {"train_loss": -11.044038772583008, "global_step": 290669, "epoch": 1730} {"train_loss": -11.81491470336914, "global_step": 290670, "epoch": 1730} {"train_loss": -11.653959274291992, "global_step": 290671, "epoch": 1730} {"train_loss": -11.075075149536133, "global_step": 290672, "epoch": 1730} {"train_loss": -11.63517951965332, "global_step": 290673, "epoch": 1730} {"train_loss": -11.59761905670166, "global_step": 290674, "epoch": 1730} {"train_loss": -10.710692405700684, "global_step": 290675, "epoch": 1730} {"train_loss": -11.993572235107422, "global_step": 290676, "epoch": 1730} {"train_loss": -11.300623893737793, "global_step": 290677, "epoch": 1730} {"train_loss": -11.540287017822266, "global_step": 290678, "epoch": 1730} {"train_loss": -11.667747497558594, "global_step": 290679, "epoch": 1730} {"train_loss": -11.0098876953125, "global_step": 290680, "epoch": 1730} {"train_loss": -11.506058692932129, "global_step": 290681, "epoch": 1730} {"train_loss": -11.647710800170898, "global_step": 290682, "epoch": 1730} {"train_loss": -10.882884979248047, "global_step": 290683, "epoch": 1730} {"train_loss": -11.798547744750977, "global_step": 290684, "epoch": 1730} {"train_loss": -11.80380630493164, "global_step": 290685, "epoch": 1730} {"train_loss": -11.218052864074707, "global_step": 290686, "epoch": 1730} {"train_loss": -11.742012977600098, "global_step": 290687, "epoch": 1730} {"train_loss": -11.751984596252441, "global_step": 290688, "epoch": 1730} {"train_loss": -11.550041198730469, "global_step": 290689, "epoch": 1730} {"train_loss": -12.199002265930176, "global_step": 290690, "epoch": 1730} {"train_loss": -11.842072486877441, "global_step": 290691, "epoch": 1730} {"train_loss": -11.83647346496582, "global_step": 290692, "epoch": 1730} {"train_loss": -12.02138900756836, "global_step": 290693, "epoch": 1730} {"train_loss": -11.895450592041016, "global_step": 290694, "epoch": 1730} {"train_loss": -11.852834701538086, "global_step": 290695, "epoch": 1730} {"train_loss": -12.043195724487305, "global_step": 290696, "epoch": 1730} {"train_loss": -11.720802307128906, "global_step": 290697, "epoch": 1730} {"train_loss": -12.008970260620117, "global_step": 290698, "epoch": 1730} {"train_loss": -11.880249977111816, "global_step": 290699, "epoch": 1730} {"train_loss": -12.095015525817871, "global_step": 290700, "epoch": 1730} {"train_loss": -11.967445373535156, "global_step": 290701, "epoch": 1730} {"train_loss": -11.976339340209961, "global_step": 290702, "epoch": 1730} {"train_loss": -12.167898178100586, "global_step": 290703, "epoch": 1730} {"train_loss": -12.077095031738281, "global_step": 290704, "epoch": 1730} {"train_loss": -12.135704040527344, "global_step": 290705, "epoch": 1730} {"train_loss": -12.05008316040039, "global_step": 290706, "epoch": 1730} {"train_loss": -12.226222038269043, "global_step": 290707, "epoch": 1730} {"train_loss": -12.09128189086914, "global_step": 290708, "epoch": 1730} {"train_loss": -12.212860107421875, "global_step": 290709, "epoch": 1730} {"train_loss": -12.039143562316895, "global_step": 290710, "epoch": 1730} {"train_loss": -12.201263427734375, "global_step": 290711, "epoch": 1730} {"train_loss": -12.198651313781738, "global_step": 290712, "epoch": 1730} {"train_loss": -12.160812377929688, "global_step": 290713, "epoch": 1730} {"train_loss": -12.324685096740723, "global_step": 290714, "epoch": 1730} {"train_loss": -12.04201889038086, "global_step": 290715, "epoch": 1730} {"train_loss": -12.26925277709961, "global_step": 290716, "epoch": 1730} {"train_loss": -12.252107620239258, "global_step": 290717, "epoch": 1730} {"train_loss": -12.202280044555664, "global_step": 290718, "epoch": 1730} {"train_loss": -12.182184219360352, "global_step": 290719, "epoch": 1730} {"train_loss": -12.12660026550293, "global_step": 290720, "epoch": 1730} {"train_loss": -12.228567123413086, "global_step": 290721, "epoch": 1730} {"train_loss": -12.269283294677734, "global_step": 290722, "epoch": 1730} {"train_loss": -12.307048797607422, "global_step": 290723, "epoch": 1730} {"train_loss": -12.285524368286133, "global_step": 290724, "epoch": 1730} {"train_loss": -12.222811698913574, "global_step": 290725, "epoch": 1730} {"train_loss": -12.41944694519043, "global_step": 290726, "epoch": 1730} {"train_loss": -12.485755920410156, "global_step": 290727, "epoch": 1730} {"train_loss": -12.379018783569336, "global_step": 290728, "epoch": 1730} {"train_loss": -12.366933822631836, "global_step": 290729, "epoch": 1730} {"train_loss": -12.283381462097168, "global_step": 290730, "epoch": 1730} {"train_loss": -12.140504837036133, "global_step": 290731, "epoch": 1730} {"train_loss": -12.115612030029297, "global_step": 290732, "epoch": 1730} {"train_loss": -12.198997497558594, "global_step": 290733, "epoch": 1730} {"train_loss": -11.758172035217285, "global_step": 290734, "epoch": 1730} {"train_loss": -11.748692512512207, "global_step": 290735, "epoch": 1730} {"train_loss": -11.878799438476562, "global_step": 290736, "epoch": 1730} {"train_loss": -11.921253204345703, "global_step": 290737, "epoch": 1730} {"train_loss": -12.361078262329102, "global_step": 290738, "epoch": 1730} {"train_loss": -11.81810474395752, "global_step": 290739, "epoch": 1730} {"train_loss": -12.164069175720215, "global_step": 290740, "epoch": 1730} {"train_loss": -12.38421630859375, "global_step": 290741, "epoch": 1730} {"train_loss": -12.349716186523438, "global_step": 290742, "epoch": 1730} {"train_loss": -12.032369613647461, "global_step": 290743, "epoch": 1730} {"train_loss": -11.406774520874023, "global_step": 290744, "epoch": 1730} {"train_loss": -9.966514587402344, "global_step": 290745, "epoch": 1730} {"train_loss": -10.6798095703125, "global_step": 290746, "epoch": 1730} {"train_loss": -11.667364120483398, "global_step": 290747, "epoch": 1730} {"train_loss": -11.645590782165527, "global_step": 290748, "epoch": 1730} {"train_loss": -10.042859077453613, "global_step": 290749, "epoch": 1730} {"train_loss": -11.239806175231934, "global_step": 290750, "epoch": 1730} {"train_loss": -11.965370178222656, "global_step": 290751, "epoch": 1730} {"train_loss": -11.617707252502441, "global_step": 290752, "epoch": 1730} {"train_loss": -11.790864944458008, "global_step": 290753, "epoch": 1730} {"train_loss": -10.948875427246094, "global_step": 290754, "epoch": 1730} {"train_loss": -10.455497741699219, "global_step": 290755, "epoch": 1730} {"train_loss": -10.638154983520508, "global_step": 290756, "epoch": 1730} {"train_loss": -8.677327156066895, "global_step": 290757, "epoch": 1730} {"train_loss": -9.36170768737793, "global_step": 290758, "epoch": 1730} {"train_loss": -9.318511962890625, "global_step": 290759, "epoch": 1730} {"train_loss": -10.951969146728516, "global_step": 290760, "epoch": 1730} {"train_loss": -8.71403694152832, "global_step": 290761, "epoch": 1730} {"train_loss": -7.705817222595215, "global_step": 290762, "epoch": 1730} {"train_loss": -8.656211853027344, "global_step": 290763, "epoch": 1730} {"train_loss": -8.893705368041992, "global_step": 290764, "epoch": 1730} {"train_loss": -9.789615631103516, "global_step": 290765, "epoch": 1730} {"train_loss": -9.604082107543945, "global_step": 290766, "epoch": 1730} {"train_loss": -8.893402099609375, "global_step": 290767, "epoch": 1730} {"train_loss": -8.574430465698242, "global_step": 290768, "epoch": 1730} {"train_loss": -10.076720237731934, "global_step": 290769, "epoch": 1730} {"train_loss": -10.378952026367188, "global_step": 290770, "epoch": 1730} {"train_loss": -9.182968139648438, "global_step": 290771, "epoch": 1730} {"train_loss": -9.32744026184082, "global_step": 290772, "epoch": 1730} {"train_loss": -11.37175178527832, "global_step": 290773, "epoch": 1730} {"train_loss": -9.280027389526367, "global_step": 290774, "epoch": 1730} {"train_loss": -9.567832946777344, "global_step": 290775, "epoch": 1730} {"train_loss": -9.962053298950195, "global_step": 290776, "epoch": 1730} {"train_loss": -10.096304893493652, "global_step": 290777, "epoch": 1730} {"train_loss": -9.429895401000977, "global_step": 290778, "epoch": 1730} {"train_loss": -9.856914520263672, "global_step": 290779, "epoch": 1730} {"train_loss": -10.503091812133789, "global_step": 290780, "epoch": 1730} {"train_loss": -10.487397193908691, "global_step": 290781, "epoch": 1730} {"train_loss": -10.394536972045898, "global_step": 290782, "epoch": 1730} {"train_loss": -10.970268249511719, "global_step": 290783, "epoch": 1730} {"train_loss": -11.007268905639648, "global_step": 290784, "epoch": 1730} {"train_loss": -10.636186599731445, "global_step": 290785, "epoch": 1730} {"train_loss": -11.093737602233887, "global_step": 290786, "epoch": 1730} {"train_loss": -10.656871795654297, "global_step": 290787, "epoch": 1730} {"train_loss": -10.928681373596191, "global_step": 290788, "epoch": 1730} {"train_loss": -11.200756072998047, "global_step": 290789, "epoch": 1730} {"train_loss": -11.118839263916016, "global_step": 290790, "epoch": 1730} {"train_loss": -11.067154884338379, "global_step": 290791, "epoch": 1730} {"train_loss": -11.410390853881836, "global_step": 290792, "epoch": 1730} {"train_loss": -11.350577354431152, "global_step": 290793, "epoch": 1730} {"train_loss": -11.504700660705566, "global_step": 290794, "epoch": 1730} {"train_loss": -11.669330596923828, "global_step": 290795, "epoch": 1730} {"train_loss": -11.460379600524902, "global_step": 290796, "epoch": 1730} {"train_loss": -11.411964416503906, "global_step": 290797, "epoch": 1730} {"train_loss": -11.64869499206543, "global_step": 290798, "epoch": 1730} {"train_loss": -11.815881729125977, "global_step": 290799, "epoch": 1730} {"train_loss": -11.616680145263672, "global_step": 290800, "epoch": 1730} {"train_loss": -11.692327499389648, "global_step": 290801, "epoch": 1730} {"train_loss": -11.566499710083008, "global_step": 290802, "epoch": 1730} {"train_loss": -11.756689071655273, "global_step": 290803, "epoch": 1730} {"train_loss": -11.595809936523438, "global_step": 290804, "epoch": 1730} {"train_loss": -11.636539459228516, "global_step": 290805, "epoch": 1730} {"train_loss": -11.532126426696777, "global_step": 290806, "epoch": 1730} {"train_loss": -11.328848929632278, "global_step": 290807, "epoch": 1730, "val_loss": 274037.625, "train_action_mse_error": 1.9047653675079346} {"train_loss": -11.453058242797852, "global_step": 290808, "epoch": 1731} {"train_loss": -11.702075958251953, "global_step": 290809, "epoch": 1731} {"train_loss": -11.570599555969238, "global_step": 290810, "epoch": 1731} {"train_loss": -11.529669761657715, "global_step": 290811, "epoch": 1731} {"train_loss": -11.690448760986328, "global_step": 290812, "epoch": 1731} {"train_loss": -11.752396583557129, "global_step": 290813, "epoch": 1731} {"train_loss": -11.972038269042969, "global_step": 290814, "epoch": 1731} {"train_loss": -11.862433433532715, "global_step": 290815, "epoch": 1731} {"train_loss": -11.966601371765137, "global_step": 290816, "epoch": 1731} {"train_loss": -12.040928840637207, "global_step": 290817, "epoch": 1731} {"train_loss": -11.86803913116455, "global_step": 290818, "epoch": 1731} {"train_loss": -12.146409034729004, "global_step": 290819, "epoch": 1731} {"train_loss": -11.961094856262207, "global_step": 290820, "epoch": 1731} {"train_loss": -11.895588874816895, "global_step": 290821, "epoch": 1731} {"train_loss": -12.095332145690918, "global_step": 290822, "epoch": 1731} {"train_loss": -11.88898754119873, "global_step": 290823, "epoch": 1731} {"train_loss": -11.861282348632812, "global_step": 290824, "epoch": 1731} {"train_loss": -12.075349807739258, "global_step": 290825, "epoch": 1731} {"train_loss": -12.214000701904297, "global_step": 290826, "epoch": 1731} {"train_loss": -12.339620590209961, "global_step": 290827, "epoch": 1731} {"train_loss": -12.052573204040527, "global_step": 290828, "epoch": 1731} {"train_loss": -12.318244934082031, "global_step": 290829, "epoch": 1731} {"train_loss": -12.102836608886719, "global_step": 290830, "epoch": 1731} {"train_loss": -12.209781646728516, "global_step": 290831, "epoch": 1731} {"train_loss": -12.217998504638672, "global_step": 290832, "epoch": 1731} {"train_loss": -12.25691032409668, "global_step": 290833, "epoch": 1731} {"train_loss": -12.194587707519531, "global_step": 290834, "epoch": 1731} {"train_loss": -12.15478801727295, "global_step": 290835, "epoch": 1731} {"train_loss": -12.234357833862305, "global_step": 290836, "epoch": 1731} {"train_loss": -12.290603637695312, "global_step": 290837, "epoch": 1731} {"train_loss": -12.225371360778809, "global_step": 290838, "epoch": 1731} {"train_loss": -12.236825942993164, "global_step": 290839, "epoch": 1731} {"train_loss": -12.214324951171875, "global_step": 290840, "epoch": 1731} {"train_loss": -12.1588134765625, "global_step": 290841, "epoch": 1731} {"train_loss": -12.20566177368164, "global_step": 290842, "epoch": 1731} {"train_loss": -12.217781066894531, "global_step": 290843, "epoch": 1731} {"train_loss": -11.939590454101562, "global_step": 290844, "epoch": 1731} {"train_loss": -12.369293212890625, "global_step": 290845, "epoch": 1731} {"train_loss": -12.26057243347168, "global_step": 290846, "epoch": 1731} {"train_loss": -12.260476112365723, "global_step": 290847, "epoch": 1731} {"train_loss": -12.509946823120117, "global_step": 290848, "epoch": 1731} {"train_loss": -11.951894760131836, "global_step": 290849, "epoch": 1731} {"train_loss": -12.461492538452148, "global_step": 290850, "epoch": 1731} {"train_loss": -12.342939376831055, "global_step": 290851, "epoch": 1731} {"train_loss": -12.31052017211914, "global_step": 290852, "epoch": 1731} {"train_loss": -12.272634506225586, "global_step": 290853, "epoch": 1731} {"train_loss": -12.12975788116455, "global_step": 290854, "epoch": 1731} {"train_loss": -12.13429069519043, "global_step": 290855, "epoch": 1731} {"train_loss": -12.421581268310547, "global_step": 290856, "epoch": 1731} {"train_loss": -12.377958297729492, "global_step": 290857, "epoch": 1731} {"train_loss": -12.349580764770508, "global_step": 290858, "epoch": 1731} {"train_loss": -12.33404541015625, "global_step": 290859, "epoch": 1731} {"train_loss": -12.17527961730957, "global_step": 290860, "epoch": 1731} {"train_loss": -12.35752010345459, "global_step": 290861, "epoch": 1731} {"train_loss": -12.491859436035156, "global_step": 290862, "epoch": 1731} {"train_loss": -12.29802131652832, "global_step": 290863, "epoch": 1731} {"train_loss": -12.17047119140625, "global_step": 290864, "epoch": 1731} {"train_loss": -11.65994644165039, "global_step": 290865, "epoch": 1731} {"train_loss": -12.192551612854004, "global_step": 290866, "epoch": 1731} {"train_loss": -11.479536056518555, "global_step": 290867, "epoch": 1731} {"train_loss": -11.571413040161133, "global_step": 290868, "epoch": 1731} {"train_loss": -11.730826377868652, "global_step": 290869, "epoch": 1731} {"train_loss": -12.061112403869629, "global_step": 290870, "epoch": 1731} {"train_loss": -12.23485279083252, "global_step": 290871, "epoch": 1731} {"train_loss": -11.894868850708008, "global_step": 290872, "epoch": 1731} {"train_loss": -11.968815803527832, "global_step": 290873, "epoch": 1731} {"train_loss": -10.866799354553223, "global_step": 290874, "epoch": 1731} {"train_loss": -10.538091659545898, "global_step": 290875, "epoch": 1731} {"train_loss": -11.594995498657227, "global_step": 290876, "epoch": 1731} {"train_loss": -11.86391830444336, "global_step": 290877, "epoch": 1731} {"train_loss": -12.120645523071289, "global_step": 290878, "epoch": 1731} {"train_loss": -11.227651596069336, "global_step": 290879, "epoch": 1731} {"train_loss": -11.660528182983398, "global_step": 290880, "epoch": 1731} {"train_loss": -11.691812515258789, "global_step": 290881, "epoch": 1731} {"train_loss": -11.331578254699707, "global_step": 290882, "epoch": 1731} {"train_loss": -11.015491485595703, "global_step": 290883, "epoch": 1731} {"train_loss": -11.975545883178711, "global_step": 290884, "epoch": 1731} {"train_loss": -11.696993827819824, "global_step": 290885, "epoch": 1731} {"train_loss": -10.288309097290039, "global_step": 290886, "epoch": 1731} {"train_loss": -10.29792594909668, "global_step": 290887, "epoch": 1731} {"train_loss": -11.682476043701172, "global_step": 290888, "epoch": 1731} {"train_loss": -11.096770286560059, "global_step": 290889, "epoch": 1731} {"train_loss": -10.584541320800781, "global_step": 290890, "epoch": 1731} {"train_loss": -11.512969017028809, "global_step": 290891, "epoch": 1731} {"train_loss": -10.983633041381836, "global_step": 290892, "epoch": 1731} {"train_loss": -11.572246551513672, "global_step": 290893, "epoch": 1731} {"train_loss": -11.424759864807129, "global_step": 290894, "epoch": 1731} {"train_loss": -11.507293701171875, "global_step": 290895, "epoch": 1731} {"train_loss": -11.436382293701172, "global_step": 290896, "epoch": 1731} {"train_loss": -11.530221939086914, "global_step": 290897, "epoch": 1731} {"train_loss": -11.664344787597656, "global_step": 290898, "epoch": 1731} {"train_loss": -11.621907234191895, "global_step": 290899, "epoch": 1731} {"train_loss": -11.840057373046875, "global_step": 290900, "epoch": 1731} {"train_loss": -11.911787986755371, "global_step": 290901, "epoch": 1731} {"train_loss": -11.480499267578125, "global_step": 290902, "epoch": 1731} {"train_loss": -11.750882148742676, "global_step": 290903, "epoch": 1731} {"train_loss": -11.690391540527344, "global_step": 290904, "epoch": 1731} {"train_loss": -11.907485961914062, "global_step": 290905, "epoch": 1731} {"train_loss": -11.775689125061035, "global_step": 290906, "epoch": 1731} {"train_loss": -11.604715347290039, "global_step": 290907, "epoch": 1731} {"train_loss": -11.805383682250977, "global_step": 290908, "epoch": 1731} {"train_loss": -11.74493408203125, "global_step": 290909, "epoch": 1731} {"train_loss": -11.806167602539062, "global_step": 290910, "epoch": 1731} {"train_loss": -11.550687789916992, "global_step": 290911, "epoch": 1731} {"train_loss": -11.903131484985352, "global_step": 290912, "epoch": 1731} {"train_loss": -11.322641372680664, "global_step": 290913, "epoch": 1731} {"train_loss": -11.706355094909668, "global_step": 290914, "epoch": 1731} {"train_loss": -11.871379852294922, "global_step": 290915, "epoch": 1731} {"train_loss": -11.592884063720703, "global_step": 290916, "epoch": 1731} {"train_loss": -11.929004669189453, "global_step": 290917, "epoch": 1731} {"train_loss": -11.564294815063477, "global_step": 290918, "epoch": 1731} {"train_loss": -12.055757522583008, "global_step": 290919, "epoch": 1731} {"train_loss": -11.689022064208984, "global_step": 290920, "epoch": 1731} {"train_loss": -11.846464157104492, "global_step": 290921, "epoch": 1731} {"train_loss": -11.848846435546875, "global_step": 290922, "epoch": 1731} {"train_loss": -11.910747528076172, "global_step": 290923, "epoch": 1731} {"train_loss": -11.670259475708008, "global_step": 290924, "epoch": 1731} {"train_loss": -11.985950469970703, "global_step": 290925, "epoch": 1731} {"train_loss": -11.76885986328125, "global_step": 290926, "epoch": 1731} {"train_loss": -11.568052291870117, "global_step": 290927, "epoch": 1731} {"train_loss": -11.270204544067383, "global_step": 290928, "epoch": 1731} {"train_loss": -12.053655624389648, "global_step": 290929, "epoch": 1731} {"train_loss": -11.693910598754883, "global_step": 290930, "epoch": 1731} {"train_loss": -12.010679244995117, "global_step": 290931, "epoch": 1731} {"train_loss": -11.92658805847168, "global_step": 290932, "epoch": 1731} {"train_loss": -11.98735237121582, "global_step": 290933, "epoch": 1731} {"train_loss": -12.24186897277832, "global_step": 290934, "epoch": 1731} {"train_loss": -12.02619743347168, "global_step": 290935, "epoch": 1731} {"train_loss": -12.209787368774414, "global_step": 290936, "epoch": 1731} {"train_loss": -11.833767890930176, "global_step": 290937, "epoch": 1731} {"train_loss": -12.190644264221191, "global_step": 290938, "epoch": 1731} {"train_loss": -11.987783432006836, "global_step": 290939, "epoch": 1731} {"train_loss": -12.05677318572998, "global_step": 290940, "epoch": 1731} {"train_loss": -11.924156188964844, "global_step": 290941, "epoch": 1731} {"train_loss": -12.077811241149902, "global_step": 290942, "epoch": 1731} {"train_loss": -12.264845848083496, "global_step": 290943, "epoch": 1731} {"train_loss": -12.043596267700195, "global_step": 290944, "epoch": 1731} {"train_loss": -11.867008209228516, "global_step": 290945, "epoch": 1731} {"train_loss": -11.916671752929688, "global_step": 290946, "epoch": 1731} {"train_loss": -12.03405475616455, "global_step": 290947, "epoch": 1731} {"train_loss": -11.880099296569824, "global_step": 290948, "epoch": 1731} {"train_loss": -12.467767715454102, "global_step": 290949, "epoch": 1731} {"train_loss": -11.991754531860352, "global_step": 290950, "epoch": 1731} {"train_loss": -11.966805458068848, "global_step": 290951, "epoch": 1731} {"train_loss": -12.358186721801758, "global_step": 290952, "epoch": 1731} {"train_loss": -12.172398567199707, "global_step": 290953, "epoch": 1731} {"train_loss": -12.277576446533203, "global_step": 290954, "epoch": 1731} {"train_loss": -12.15880012512207, "global_step": 290955, "epoch": 1731} {"train_loss": -12.373113632202148, "global_step": 290956, "epoch": 1731} {"train_loss": -12.237728118896484, "global_step": 290957, "epoch": 1731} {"train_loss": -11.971248626708984, "global_step": 290958, "epoch": 1731} {"train_loss": -12.246818542480469, "global_step": 290959, "epoch": 1731} {"train_loss": -11.988479614257812, "global_step": 290960, "epoch": 1731} {"train_loss": -12.204977989196777, "global_step": 290961, "epoch": 1731} {"train_loss": -12.217828750610352, "global_step": 290962, "epoch": 1731} {"train_loss": -12.062424659729004, "global_step": 290963, "epoch": 1731} {"train_loss": -12.269599914550781, "global_step": 290964, "epoch": 1731} {"train_loss": -11.602758407592773, "global_step": 290965, "epoch": 1731} {"train_loss": -12.01336669921875, "global_step": 290966, "epoch": 1731} {"train_loss": -12.215289115905762, "global_step": 290967, "epoch": 1731} {"train_loss": -12.220075607299805, "global_step": 290968, "epoch": 1731} {"train_loss": -12.19497013092041, "global_step": 290969, "epoch": 1731} {"train_loss": -12.197334289550781, "global_step": 290970, "epoch": 1731} {"train_loss": -11.754476547241211, "global_step": 290971, "epoch": 1731} {"train_loss": -11.808667182922363, "global_step": 290972, "epoch": 1731} {"train_loss": -11.915197372436523, "global_step": 290973, "epoch": 1731} {"train_loss": -11.508719444274902, "global_step": 290974, "epoch": 1731} {"train_loss": -11.89611754530952, "global_step": 290975, "epoch": 1731, "val_loss": 281989.625} {"train_loss": -11.225208282470703, "global_step": 290976, "epoch": 1732} {"train_loss": -11.954557418823242, "global_step": 290977, "epoch": 1732} {"train_loss": -11.408466339111328, "global_step": 290978, "epoch": 1732} {"train_loss": -11.892770767211914, "global_step": 290979, "epoch": 1732} {"train_loss": -11.961047172546387, "global_step": 290980, "epoch": 1732} {"train_loss": -11.235859870910645, "global_step": 290981, "epoch": 1732} {"train_loss": -11.311280250549316, "global_step": 290982, "epoch": 1732} {"train_loss": -10.325481414794922, "global_step": 290983, "epoch": 1732} {"train_loss": -11.056939125061035, "global_step": 290984, "epoch": 1732} {"train_loss": -9.88748836517334, "global_step": 290985, "epoch": 1732} {"train_loss": -10.873287200927734, "global_step": 290986, "epoch": 1732} {"train_loss": -10.495391845703125, "global_step": 290987, "epoch": 1732} {"train_loss": -11.478157043457031, "global_step": 290988, "epoch": 1732} {"train_loss": -10.37331771850586, "global_step": 290989, "epoch": 1732} {"train_loss": -9.067666053771973, "global_step": 290990, "epoch": 1732} {"train_loss": -9.518815040588379, "global_step": 290991, "epoch": 1732} {"train_loss": -9.836803436279297, "global_step": 290992, "epoch": 1732} {"train_loss": -8.965337753295898, "global_step": 290993, "epoch": 1732} {"train_loss": -8.108728408813477, "global_step": 290994, "epoch": 1732} {"train_loss": -10.952005386352539, "global_step": 290995, "epoch": 1732} {"train_loss": -8.58245849609375, "global_step": 290996, "epoch": 1732} {"train_loss": -9.825851440429688, "global_step": 290997, "epoch": 1732} {"train_loss": -10.09012222290039, "global_step": 290998, "epoch": 1732} {"train_loss": -10.390151977539062, "global_step": 290999, "epoch": 1732} {"train_loss": -10.235635757446289, "global_step": 291000, "epoch": 1732} {"train_loss": -10.122300148010254, "global_step": 291001, "epoch": 1732} {"train_loss": -10.599382400512695, "global_step": 291002, "epoch": 1732} {"train_loss": -10.026679992675781, "global_step": 291003, "epoch": 1732} {"train_loss": -10.584043502807617, "global_step": 291004, "epoch": 1732} {"train_loss": -11.272056579589844, "global_step": 291005, "epoch": 1732} {"train_loss": -11.185874938964844, "global_step": 291006, "epoch": 1732} {"train_loss": -10.773038864135742, "global_step": 291007, "epoch": 1732} {"train_loss": -11.255584716796875, "global_step": 291008, "epoch": 1732} {"train_loss": -11.210049629211426, "global_step": 291009, "epoch": 1732} {"train_loss": -11.298086166381836, "global_step": 291010, "epoch": 1732} {"train_loss": -10.999903678894043, "global_step": 291011, "epoch": 1732} {"train_loss": -11.656408309936523, "global_step": 291012, "epoch": 1732} {"train_loss": -11.016258239746094, "global_step": 291013, "epoch": 1732} {"train_loss": -11.610809326171875, "global_step": 291014, "epoch": 1732} {"train_loss": -11.100831985473633, "global_step": 291015, "epoch": 1732} {"train_loss": -11.55916976928711, "global_step": 291016, "epoch": 1732} {"train_loss": -11.285045623779297, "global_step": 291017, "epoch": 1732} {"train_loss": -11.808067321777344, "global_step": 291018, "epoch": 1732} {"train_loss": -11.388029098510742, "global_step": 291019, "epoch": 1732} {"train_loss": -11.574705123901367, "global_step": 291020, "epoch": 1732} {"train_loss": -11.233370780944824, "global_step": 291021, "epoch": 1732} {"train_loss": -11.477561950683594, "global_step": 291022, "epoch": 1732} {"train_loss": -11.559825897216797, "global_step": 291023, "epoch": 1732} {"train_loss": -11.247293472290039, "global_step": 291024, "epoch": 1732} {"train_loss": -11.496953010559082, "global_step": 291025, "epoch": 1732} {"train_loss": -10.863076210021973, "global_step": 291026, "epoch": 1732} {"train_loss": -11.38116455078125, "global_step": 291027, "epoch": 1732} {"train_loss": -10.681178092956543, "global_step": 291028, "epoch": 1732} {"train_loss": -11.715015411376953, "global_step": 291029, "epoch": 1732} {"train_loss": -11.384605407714844, "global_step": 291030, "epoch": 1732} {"train_loss": -11.845823287963867, "global_step": 291031, "epoch": 1732} {"train_loss": -11.565178871154785, "global_step": 291032, "epoch": 1732} {"train_loss": -11.55309009552002, "global_step": 291033, "epoch": 1732} {"train_loss": -11.713107109069824, "global_step": 291034, "epoch": 1732} {"train_loss": -11.663366317749023, "global_step": 291035, "epoch": 1732} {"train_loss": -11.67891788482666, "global_step": 291036, "epoch": 1732} {"train_loss": -11.864530563354492, "global_step": 291037, "epoch": 1732} {"train_loss": -11.753583908081055, "global_step": 291038, "epoch": 1732} {"train_loss": -11.888070106506348, "global_step": 291039, "epoch": 1732} {"train_loss": -11.868270874023438, "global_step": 291040, "epoch": 1732} {"train_loss": -11.840742111206055, "global_step": 291041, "epoch": 1732} {"train_loss": -11.90514087677002, "global_step": 291042, "epoch": 1732} {"train_loss": -11.912096977233887, "global_step": 291043, "epoch": 1732} {"train_loss": -11.881080627441406, "global_step": 291044, "epoch": 1732} {"train_loss": -11.884086608886719, "global_step": 291045, "epoch": 1732} {"train_loss": -11.930612564086914, "global_step": 291046, "epoch": 1732} {"train_loss": -12.011723518371582, "global_step": 291047, "epoch": 1732} {"train_loss": -12.120452880859375, "global_step": 291048, "epoch": 1732} {"train_loss": -11.945306777954102, "global_step": 291049, "epoch": 1732} {"train_loss": -12.127176284790039, "global_step": 291050, "epoch": 1732} {"train_loss": -11.937569618225098, "global_step": 291051, "epoch": 1732} {"train_loss": -12.093928337097168, "global_step": 291052, "epoch": 1732} {"train_loss": -12.150707244873047, "global_step": 291053, "epoch": 1732} {"train_loss": -12.038851737976074, "global_step": 291054, "epoch": 1732} {"train_loss": -12.260305404663086, "global_step": 291055, "epoch": 1732} {"train_loss": -11.972009658813477, "global_step": 291056, "epoch": 1732} {"train_loss": -12.218404769897461, "global_step": 291057, "epoch": 1732} {"train_loss": -12.159247398376465, "global_step": 291058, "epoch": 1732} {"train_loss": -12.099931716918945, "global_step": 291059, "epoch": 1732} {"train_loss": -11.97049331665039, "global_step": 291060, "epoch": 1732} {"train_loss": -12.072213172912598, "global_step": 291061, "epoch": 1732} {"train_loss": -12.092536926269531, "global_step": 291062, "epoch": 1732} {"train_loss": -11.982471466064453, "global_step": 291063, "epoch": 1732} {"train_loss": -12.168225288391113, "global_step": 291064, "epoch": 1732} {"train_loss": -12.3326416015625, "global_step": 291065, "epoch": 1732} {"train_loss": -12.155418395996094, "global_step": 291066, "epoch": 1732} {"train_loss": -12.281562805175781, "global_step": 291067, "epoch": 1732} {"train_loss": -12.036787033081055, "global_step": 291068, "epoch": 1732} {"train_loss": -12.24747085571289, "global_step": 291069, "epoch": 1732} {"train_loss": -12.201502799987793, "global_step": 291070, "epoch": 1732} {"train_loss": -12.192739486694336, "global_step": 291071, "epoch": 1732} {"train_loss": -12.2109956741333, "global_step": 291072, "epoch": 1732} {"train_loss": -12.334394454956055, "global_step": 291073, "epoch": 1732} {"train_loss": -12.064716339111328, "global_step": 291074, "epoch": 1732} {"train_loss": -12.284835815429688, "global_step": 291075, "epoch": 1732} {"train_loss": -12.031744003295898, "global_step": 291076, "epoch": 1732} {"train_loss": -11.830198287963867, "global_step": 291077, "epoch": 1732} {"train_loss": -11.363163948059082, "global_step": 291078, "epoch": 1732} {"train_loss": -11.904949188232422, "global_step": 291079, "epoch": 1732} {"train_loss": -12.302040100097656, "global_step": 291080, "epoch": 1732} {"train_loss": -11.167598724365234, "global_step": 291081, "epoch": 1732} {"train_loss": -11.039521217346191, "global_step": 291082, "epoch": 1732} {"train_loss": -12.216976165771484, "global_step": 291083, "epoch": 1732} {"train_loss": -11.461311340332031, "global_step": 291084, "epoch": 1732} {"train_loss": -11.689338684082031, "global_step": 291085, "epoch": 1732} {"train_loss": -11.98373031616211, "global_step": 291086, "epoch": 1732} {"train_loss": -10.587141036987305, "global_step": 291087, "epoch": 1732} {"train_loss": -11.569480895996094, "global_step": 291088, "epoch": 1732} {"train_loss": -11.515617370605469, "global_step": 291089, "epoch": 1732} {"train_loss": -10.646533012390137, "global_step": 291090, "epoch": 1732} {"train_loss": -12.03306770324707, "global_step": 291091, "epoch": 1732} {"train_loss": -11.726703643798828, "global_step": 291092, "epoch": 1732} {"train_loss": -11.059760093688965, "global_step": 291093, "epoch": 1732} {"train_loss": -11.879621505737305, "global_step": 291094, "epoch": 1732} {"train_loss": -10.982776641845703, "global_step": 291095, "epoch": 1732} {"train_loss": -10.236763000488281, "global_step": 291096, "epoch": 1732} {"train_loss": -11.68895149230957, "global_step": 291097, "epoch": 1732} {"train_loss": -11.300254821777344, "global_step": 291098, "epoch": 1732} {"train_loss": -11.150690078735352, "global_step": 291099, "epoch": 1732} {"train_loss": -11.176630020141602, "global_step": 291100, "epoch": 1732} {"train_loss": -10.848123550415039, "global_step": 291101, "epoch": 1732} {"train_loss": -11.420896530151367, "global_step": 291102, "epoch": 1732} {"train_loss": -10.763456344604492, "global_step": 291103, "epoch": 1732} {"train_loss": -11.764501571655273, "global_step": 291104, "epoch": 1732} {"train_loss": -11.427927017211914, "global_step": 291105, "epoch": 1732} {"train_loss": -11.83285140991211, "global_step": 291106, "epoch": 1732} {"train_loss": -11.799911499023438, "global_step": 291107, "epoch": 1732} {"train_loss": -11.898580551147461, "global_step": 291108, "epoch": 1732} {"train_loss": -11.921501159667969, "global_step": 291109, "epoch": 1732} {"train_loss": -11.840076446533203, "global_step": 291110, "epoch": 1732} {"train_loss": -12.10861587524414, "global_step": 291111, "epoch": 1732} {"train_loss": -11.882086753845215, "global_step": 291112, "epoch": 1732} {"train_loss": -11.837875366210938, "global_step": 291113, "epoch": 1732} {"train_loss": -12.135323524475098, "global_step": 291114, "epoch": 1732} {"train_loss": -11.982051849365234, "global_step": 291115, "epoch": 1732} {"train_loss": -12.172292709350586, "global_step": 291116, "epoch": 1732} {"train_loss": -12.022262573242188, "global_step": 291117, "epoch": 1732} {"train_loss": -11.987308502197266, "global_step": 291118, "epoch": 1732} {"train_loss": -12.058422088623047, "global_step": 291119, "epoch": 1732} {"train_loss": -11.95189094543457, "global_step": 291120, "epoch": 1732} {"train_loss": -11.96539306640625, "global_step": 291121, "epoch": 1732} {"train_loss": -12.006063461303711, "global_step": 291122, "epoch": 1732} {"train_loss": -11.951355934143066, "global_step": 291123, "epoch": 1732} {"train_loss": -11.826054573059082, "global_step": 291124, "epoch": 1732} {"train_loss": -12.220430374145508, "global_step": 291125, "epoch": 1732} {"train_loss": -12.330620765686035, "global_step": 291126, "epoch": 1732} {"train_loss": -12.0138578414917, "global_step": 291127, "epoch": 1732} {"train_loss": -12.134765625, "global_step": 291128, "epoch": 1732} {"train_loss": -12.113348007202148, "global_step": 291129, "epoch": 1732} {"train_loss": -12.157774925231934, "global_step": 291130, "epoch": 1732} {"train_loss": -12.123760223388672, "global_step": 291131, "epoch": 1732} {"train_loss": -12.103660583496094, "global_step": 291132, "epoch": 1732} {"train_loss": -12.251466751098633, "global_step": 291133, "epoch": 1732} {"train_loss": -12.367725372314453, "global_step": 291134, "epoch": 1732} {"train_loss": -12.10387134552002, "global_step": 291135, "epoch": 1732} {"train_loss": -11.933465957641602, "global_step": 291136, "epoch": 1732} {"train_loss": -12.199348449707031, "global_step": 291137, "epoch": 1732} {"train_loss": -12.27667236328125, "global_step": 291138, "epoch": 1732} {"train_loss": -12.335993766784668, "global_step": 291139, "epoch": 1732} {"train_loss": -12.350481033325195, "global_step": 291140, "epoch": 1732} {"train_loss": -12.319639205932617, "global_step": 291141, "epoch": 1732} {"train_loss": -12.238569259643555, "global_step": 291142, "epoch": 1732} {"train_loss": -11.540907649766831, "global_step": 291143, "epoch": 1732, "val_loss": 280566.96875} {"train_loss": -12.036089897155762, "global_step": 291144, "epoch": 1733} {"train_loss": -12.220046997070312, "global_step": 291145, "epoch": 1733} {"train_loss": -11.919486999511719, "global_step": 291146, "epoch": 1733} {"train_loss": -12.249358177185059, "global_step": 291147, "epoch": 1733} {"train_loss": -12.046087265014648, "global_step": 291148, "epoch": 1733} {"train_loss": -12.017111778259277, "global_step": 291149, "epoch": 1733} {"train_loss": -12.033143997192383, "global_step": 291150, "epoch": 1733} {"train_loss": -12.173604965209961, "global_step": 291151, "epoch": 1733} {"train_loss": -11.899933815002441, "global_step": 291152, "epoch": 1733} {"train_loss": -12.293607711791992, "global_step": 291153, "epoch": 1733} {"train_loss": -11.359180450439453, "global_step": 291154, "epoch": 1733} {"train_loss": -10.688529968261719, "global_step": 291155, "epoch": 1733} {"train_loss": -12.085973739624023, "global_step": 291156, "epoch": 1733} {"train_loss": -11.250600814819336, "global_step": 291157, "epoch": 1733} {"train_loss": -10.304515838623047, "global_step": 291158, "epoch": 1733} {"train_loss": -11.872027397155762, "global_step": 291159, "epoch": 1733} {"train_loss": -10.778194427490234, "global_step": 291160, "epoch": 1733} {"train_loss": -11.528711318969727, "global_step": 291161, "epoch": 1733} {"train_loss": -11.114395141601562, "global_step": 291162, "epoch": 1733} {"train_loss": -10.848416328430176, "global_step": 291163, "epoch": 1733} {"train_loss": -11.559255599975586, "global_step": 291164, "epoch": 1733} {"train_loss": -11.362545013427734, "global_step": 291165, "epoch": 1733} {"train_loss": -10.909770965576172, "global_step": 291166, "epoch": 1733} {"train_loss": -11.568220138549805, "global_step": 291167, "epoch": 1733} {"train_loss": -10.006860733032227, "global_step": 291168, "epoch": 1733} {"train_loss": -11.212759017944336, "global_step": 291169, "epoch": 1733} {"train_loss": -11.382863998413086, "global_step": 291170, "epoch": 1733} {"train_loss": -11.44185733795166, "global_step": 291171, "epoch": 1733} {"train_loss": -11.670533180236816, "global_step": 291172, "epoch": 1733} {"train_loss": -10.673677444458008, "global_step": 291173, "epoch": 1733} {"train_loss": -11.104103088378906, "global_step": 291174, "epoch": 1733} {"train_loss": -11.005843162536621, "global_step": 291175, "epoch": 1733} {"train_loss": -11.496910095214844, "global_step": 291176, "epoch": 1733} {"train_loss": -11.287528038024902, "global_step": 291177, "epoch": 1733} {"train_loss": -11.821359634399414, "global_step": 291178, "epoch": 1733} {"train_loss": -10.544943809509277, "global_step": 291179, "epoch": 1733} {"train_loss": -11.579219818115234, "global_step": 291180, "epoch": 1733} {"train_loss": -11.191598892211914, "global_step": 291181, "epoch": 1733} {"train_loss": -10.856494903564453, "global_step": 291182, "epoch": 1733} {"train_loss": -10.980817794799805, "global_step": 291183, "epoch": 1733} {"train_loss": -11.52309799194336, "global_step": 291184, "epoch": 1733} {"train_loss": -11.719505310058594, "global_step": 291185, "epoch": 1733} {"train_loss": -11.307577133178711, "global_step": 291186, "epoch": 1733} {"train_loss": -12.006072998046875, "global_step": 291187, "epoch": 1733} {"train_loss": -11.508820533752441, "global_step": 291188, "epoch": 1733} {"train_loss": -11.660087585449219, "global_step": 291189, "epoch": 1733} {"train_loss": -11.243515968322754, "global_step": 291190, "epoch": 1733} {"train_loss": -11.643531799316406, "global_step": 291191, "epoch": 1733} {"train_loss": -11.817142486572266, "global_step": 291192, "epoch": 1733} {"train_loss": -11.831424713134766, "global_step": 291193, "epoch": 1733} {"train_loss": -11.87864875793457, "global_step": 291194, "epoch": 1733} {"train_loss": -11.64491081237793, "global_step": 291195, "epoch": 1733} {"train_loss": -11.879669189453125, "global_step": 291196, "epoch": 1733} {"train_loss": -11.837157249450684, "global_step": 291197, "epoch": 1733} {"train_loss": -11.953134536743164, "global_step": 291198, "epoch": 1733} {"train_loss": -11.99250602722168, "global_step": 291199, "epoch": 1733} {"train_loss": -11.912973403930664, "global_step": 291200, "epoch": 1733} {"train_loss": -12.173446655273438, "global_step": 291201, "epoch": 1733} {"train_loss": -11.865352630615234, "global_step": 291202, "epoch": 1733} {"train_loss": -11.886597633361816, "global_step": 291203, "epoch": 1733} {"train_loss": -12.034647941589355, "global_step": 291204, "epoch": 1733} {"train_loss": -11.688133239746094, "global_step": 291205, "epoch": 1733} {"train_loss": -11.81631851196289, "global_step": 291206, "epoch": 1733} {"train_loss": -11.833407402038574, "global_step": 291207, "epoch": 1733} {"train_loss": -11.76679801940918, "global_step": 291208, "epoch": 1733} {"train_loss": -11.777889251708984, "global_step": 291209, "epoch": 1733} {"train_loss": -11.913482666015625, "global_step": 291210, "epoch": 1733} {"train_loss": -11.623222351074219, "global_step": 291211, "epoch": 1733} {"train_loss": -12.17026424407959, "global_step": 291212, "epoch": 1733} {"train_loss": -11.653443336486816, "global_step": 291213, "epoch": 1733} {"train_loss": -12.010744094848633, "global_step": 291214, "epoch": 1733} {"train_loss": -11.585567474365234, "global_step": 291215, "epoch": 1733} {"train_loss": -11.822856903076172, "global_step": 291216, "epoch": 1733} {"train_loss": -11.800846099853516, "global_step": 291217, "epoch": 1733} {"train_loss": -11.27787971496582, "global_step": 291218, "epoch": 1733} {"train_loss": -11.884991645812988, "global_step": 291219, "epoch": 1733} {"train_loss": -11.387651443481445, "global_step": 291220, "epoch": 1733} {"train_loss": -11.96278190612793, "global_step": 291221, "epoch": 1733} {"train_loss": -11.438814163208008, "global_step": 291222, "epoch": 1733} {"train_loss": -10.99179744720459, "global_step": 291223, "epoch": 1733} {"train_loss": -11.855361938476562, "global_step": 291224, "epoch": 1733} {"train_loss": -11.40512752532959, "global_step": 291225, "epoch": 1733} {"train_loss": -11.766716003417969, "global_step": 291226, "epoch": 1733} {"train_loss": -11.461569786071777, "global_step": 291227, "epoch": 1733} {"train_loss": -12.111913681030273, "global_step": 291228, "epoch": 1733} {"train_loss": -11.493269920349121, "global_step": 291229, "epoch": 1733} {"train_loss": -11.847715377807617, "global_step": 291230, "epoch": 1733} {"train_loss": -11.957428932189941, "global_step": 291231, "epoch": 1733} {"train_loss": -11.715048789978027, "global_step": 291232, "epoch": 1733} {"train_loss": -12.212028503417969, "global_step": 291233, "epoch": 1733} {"train_loss": -11.918600082397461, "global_step": 291234, "epoch": 1733} {"train_loss": -12.032855987548828, "global_step": 291235, "epoch": 1733} {"train_loss": -11.97865104675293, "global_step": 291236, "epoch": 1733} {"train_loss": -12.013455390930176, "global_step": 291237, "epoch": 1733} {"train_loss": -12.294307708740234, "global_step": 291238, "epoch": 1733} {"train_loss": -11.850225448608398, "global_step": 291239, "epoch": 1733} {"train_loss": -12.290282249450684, "global_step": 291240, "epoch": 1733} {"train_loss": -11.832843780517578, "global_step": 291241, "epoch": 1733} {"train_loss": -11.946076393127441, "global_step": 291242, "epoch": 1733} {"train_loss": -11.402581214904785, "global_step": 291243, "epoch": 1733} {"train_loss": -11.90485954284668, "global_step": 291244, "epoch": 1733} {"train_loss": -11.793789863586426, "global_step": 291245, "epoch": 1733} {"train_loss": -11.887022972106934, "global_step": 291246, "epoch": 1733} {"train_loss": -11.780803680419922, "global_step": 291247, "epoch": 1733} {"train_loss": -11.892574310302734, "global_step": 291248, "epoch": 1733} {"train_loss": -12.168865203857422, "global_step": 291249, "epoch": 1733} {"train_loss": -11.726462364196777, "global_step": 291250, "epoch": 1733} {"train_loss": -12.087240219116211, "global_step": 291251, "epoch": 1733} {"train_loss": -11.726038932800293, "global_step": 291252, "epoch": 1733} {"train_loss": -12.077629089355469, "global_step": 291253, "epoch": 1733} {"train_loss": -12.028938293457031, "global_step": 291254, "epoch": 1733} {"train_loss": -11.27121353149414, "global_step": 291255, "epoch": 1733} {"train_loss": -12.019351959228516, "global_step": 291256, "epoch": 1733} {"train_loss": -11.864725112915039, "global_step": 291257, "epoch": 1733} {"train_loss": -11.919793128967285, "global_step": 291258, "epoch": 1733} {"train_loss": -11.965018272399902, "global_step": 291259, "epoch": 1733} {"train_loss": -12.064205169677734, "global_step": 291260, "epoch": 1733} {"train_loss": -12.248132705688477, "global_step": 291261, "epoch": 1733} {"train_loss": -11.977025985717773, "global_step": 291262, "epoch": 1733} {"train_loss": -11.97911548614502, "global_step": 291263, "epoch": 1733} {"train_loss": -11.792346000671387, "global_step": 291264, "epoch": 1733} {"train_loss": -12.303621292114258, "global_step": 291265, "epoch": 1733} {"train_loss": -11.768620491027832, "global_step": 291266, "epoch": 1733} {"train_loss": -12.034605026245117, "global_step": 291267, "epoch": 1733} {"train_loss": -11.840831756591797, "global_step": 291268, "epoch": 1733} {"train_loss": -11.884477615356445, "global_step": 291269, "epoch": 1733} {"train_loss": -12.282629013061523, "global_step": 291270, "epoch": 1733} {"train_loss": -11.956268310546875, "global_step": 291271, "epoch": 1733} {"train_loss": -12.097421646118164, "global_step": 291272, "epoch": 1733} {"train_loss": -12.109960556030273, "global_step": 291273, "epoch": 1733} {"train_loss": -12.102300643920898, "global_step": 291274, "epoch": 1733} {"train_loss": -12.370477676391602, "global_step": 291275, "epoch": 1733} {"train_loss": -12.156673431396484, "global_step": 291276, "epoch": 1733} {"train_loss": -12.053548812866211, "global_step": 291277, "epoch": 1733} {"train_loss": -12.272140502929688, "global_step": 291278, "epoch": 1733} {"train_loss": -12.38873291015625, "global_step": 291279, "epoch": 1733} {"train_loss": -12.236515045166016, "global_step": 291280, "epoch": 1733} {"train_loss": -12.264059066772461, "global_step": 291281, "epoch": 1733} {"train_loss": -12.182862281799316, "global_step": 291282, "epoch": 1733} {"train_loss": -12.332045555114746, "global_step": 291283, "epoch": 1733} {"train_loss": -12.142932891845703, "global_step": 291284, "epoch": 1733} {"train_loss": -12.334370613098145, "global_step": 291285, "epoch": 1733} {"train_loss": -12.49017333984375, "global_step": 291286, "epoch": 1733} {"train_loss": -12.202524185180664, "global_step": 291287, "epoch": 1733} {"train_loss": -12.30237865447998, "global_step": 291288, "epoch": 1733} {"train_loss": -12.322732925415039, "global_step": 291289, "epoch": 1733} {"train_loss": -12.338889122009277, "global_step": 291290, "epoch": 1733} {"train_loss": -12.352672576904297, "global_step": 291291, "epoch": 1733} {"train_loss": -12.148746490478516, "global_step": 291292, "epoch": 1733} {"train_loss": -11.850975036621094, "global_step": 291293, "epoch": 1733} {"train_loss": -12.331489562988281, "global_step": 291294, "epoch": 1733} {"train_loss": -11.954005241394043, "global_step": 291295, "epoch": 1733} {"train_loss": -12.249652862548828, "global_step": 291296, "epoch": 1733} {"train_loss": -11.70909595489502, "global_step": 291297, "epoch": 1733} {"train_loss": -12.189432144165039, "global_step": 291298, "epoch": 1733} {"train_loss": -12.190857887268066, "global_step": 291299, "epoch": 1733} {"train_loss": -12.101970672607422, "global_step": 291300, "epoch": 1733} {"train_loss": -12.067211151123047, "global_step": 291301, "epoch": 1733} {"train_loss": -12.02754020690918, "global_step": 291302, "epoch": 1733} {"train_loss": -12.47164249420166, "global_step": 291303, "epoch": 1733} {"train_loss": -12.403202056884766, "global_step": 291304, "epoch": 1733} {"train_loss": -12.350370407104492, "global_step": 291305, "epoch": 1733} {"train_loss": -11.947002410888672, "global_step": 291306, "epoch": 1733} {"train_loss": -11.318965911865234, "global_step": 291307, "epoch": 1733} {"train_loss": -12.04262924194336, "global_step": 291308, "epoch": 1733} {"train_loss": -12.246040344238281, "global_step": 291309, "epoch": 1733} {"train_loss": -12.414799690246582, "global_step": 291310, "epoch": 1733} {"train_loss": -11.813177699134464, "global_step": 291311, "epoch": 1733, "val_loss": 278304.375} {"train_loss": -12.010823249816895, "global_step": 291312, "epoch": 1734} {"train_loss": -12.268404006958008, "global_step": 291313, "epoch": 1734} {"train_loss": -12.304559707641602, "global_step": 291314, "epoch": 1734} {"train_loss": -12.496910095214844, "global_step": 291315, "epoch": 1734} {"train_loss": -12.215764999389648, "global_step": 291316, "epoch": 1734} {"train_loss": -11.770946502685547, "global_step": 291317, "epoch": 1734} {"train_loss": -11.046137809753418, "global_step": 291318, "epoch": 1734} {"train_loss": -11.226354598999023, "global_step": 291319, "epoch": 1734} {"train_loss": -10.048931121826172, "global_step": 291320, "epoch": 1734} {"train_loss": -11.94613265991211, "global_step": 291321, "epoch": 1734} {"train_loss": -11.225126266479492, "global_step": 291322, "epoch": 1734} {"train_loss": -10.479293823242188, "global_step": 291323, "epoch": 1734} {"train_loss": -11.281759262084961, "global_step": 291324, "epoch": 1734} {"train_loss": -12.003674507141113, "global_step": 291325, "epoch": 1734} {"train_loss": -9.9258451461792, "global_step": 291326, "epoch": 1734} {"train_loss": -12.110292434692383, "global_step": 291327, "epoch": 1734} {"train_loss": -10.069937705993652, "global_step": 291328, "epoch": 1734} {"train_loss": -10.14749813079834, "global_step": 291329, "epoch": 1734} {"train_loss": -10.881773948669434, "global_step": 291330, "epoch": 1734} {"train_loss": -10.492413520812988, "global_step": 291331, "epoch": 1734} {"train_loss": -11.60936164855957, "global_step": 291332, "epoch": 1734} {"train_loss": -11.49334716796875, "global_step": 291333, "epoch": 1734} {"train_loss": -9.683727264404297, "global_step": 291334, "epoch": 1734} {"train_loss": -9.84286117553711, "global_step": 291335, "epoch": 1734} {"train_loss": -11.999811172485352, "global_step": 291336, "epoch": 1734} {"train_loss": -9.976114273071289, "global_step": 291337, "epoch": 1734} {"train_loss": -11.168435096740723, "global_step": 291338, "epoch": 1734} {"train_loss": -11.370758056640625, "global_step": 291339, "epoch": 1734} {"train_loss": -10.070507049560547, "global_step": 291340, "epoch": 1734} {"train_loss": -11.988869667053223, "global_step": 291341, "epoch": 1734} {"train_loss": -10.941446304321289, "global_step": 291342, "epoch": 1734} {"train_loss": -11.451452255249023, "global_step": 291343, "epoch": 1734} {"train_loss": -11.481513977050781, "global_step": 291344, "epoch": 1734} {"train_loss": -10.924331665039062, "global_step": 291345, "epoch": 1734} {"train_loss": -11.737735748291016, "global_step": 291346, "epoch": 1734} {"train_loss": -11.514352798461914, "global_step": 291347, "epoch": 1734} {"train_loss": -12.01556396484375, "global_step": 291348, "epoch": 1734} {"train_loss": -11.564363479614258, "global_step": 291349, "epoch": 1734} {"train_loss": -11.866708755493164, "global_step": 291350, "epoch": 1734} {"train_loss": -11.618383407592773, "global_step": 291351, "epoch": 1734} {"train_loss": -11.282861709594727, "global_step": 291352, "epoch": 1734} {"train_loss": -11.515796661376953, "global_step": 291353, "epoch": 1734} {"train_loss": -11.538341522216797, "global_step": 291354, "epoch": 1734} {"train_loss": -11.802997589111328, "global_step": 291355, "epoch": 1734} {"train_loss": -11.707477569580078, "global_step": 291356, "epoch": 1734} {"train_loss": -11.373065948486328, "global_step": 291357, "epoch": 1734} {"train_loss": -11.877311706542969, "global_step": 291358, "epoch": 1734} {"train_loss": -10.863033294677734, "global_step": 291359, "epoch": 1734} {"train_loss": -12.011322975158691, "global_step": 291360, "epoch": 1734} {"train_loss": -11.405345916748047, "global_step": 291361, "epoch": 1734} {"train_loss": -11.851578712463379, "global_step": 291362, "epoch": 1734} {"train_loss": -11.648344039916992, "global_step": 291363, "epoch": 1734} {"train_loss": -11.219926834106445, "global_step": 291364, "epoch": 1734} {"train_loss": -11.84532356262207, "global_step": 291365, "epoch": 1734} {"train_loss": -11.743444442749023, "global_step": 291366, "epoch": 1734} {"train_loss": -11.787399291992188, "global_step": 291367, "epoch": 1734} {"train_loss": -11.918657302856445, "global_step": 291368, "epoch": 1734} {"train_loss": -11.526820182800293, "global_step": 291369, "epoch": 1734} {"train_loss": -12.079076766967773, "global_step": 291370, "epoch": 1734} {"train_loss": -11.925533294677734, "global_step": 291371, "epoch": 1734} {"train_loss": -11.964599609375, "global_step": 291372, "epoch": 1734} {"train_loss": -11.938919067382812, "global_step": 291373, "epoch": 1734} {"train_loss": -12.032533645629883, "global_step": 291374, "epoch": 1734} {"train_loss": -11.932003021240234, "global_step": 291375, "epoch": 1734} {"train_loss": -11.888093948364258, "global_step": 291376, "epoch": 1734} {"train_loss": -11.64013671875, "global_step": 291377, "epoch": 1734} {"train_loss": -11.49323844909668, "global_step": 291378, "epoch": 1734} {"train_loss": -12.020111083984375, "global_step": 291379, "epoch": 1734} {"train_loss": -12.01275634765625, "global_step": 291380, "epoch": 1734} {"train_loss": -11.769652366638184, "global_step": 291381, "epoch": 1734} {"train_loss": -11.951431274414062, "global_step": 291382, "epoch": 1734} {"train_loss": -12.09853458404541, "global_step": 291383, "epoch": 1734} {"train_loss": -11.945152282714844, "global_step": 291384, "epoch": 1734} {"train_loss": -12.121423721313477, "global_step": 291385, "epoch": 1734} {"train_loss": -12.058088302612305, "global_step": 291386, "epoch": 1734} {"train_loss": -11.836817741394043, "global_step": 291387, "epoch": 1734} {"train_loss": -12.276777267456055, "global_step": 291388, "epoch": 1734} {"train_loss": -11.902565002441406, "global_step": 291389, "epoch": 1734} {"train_loss": -12.139938354492188, "global_step": 291390, "epoch": 1734} {"train_loss": -12.28835678100586, "global_step": 291391, "epoch": 1734} {"train_loss": -12.099602699279785, "global_step": 291392, "epoch": 1734} {"train_loss": -12.102950096130371, "global_step": 291393, "epoch": 1734} {"train_loss": -12.142786979675293, "global_step": 291394, "epoch": 1734} {"train_loss": -11.932649612426758, "global_step": 291395, "epoch": 1734} {"train_loss": -12.137041091918945, "global_step": 291396, "epoch": 1734} {"train_loss": -12.223108291625977, "global_step": 291397, "epoch": 1734} {"train_loss": -12.438610076904297, "global_step": 291398, "epoch": 1734} {"train_loss": -12.108061790466309, "global_step": 291399, "epoch": 1734} {"train_loss": -12.287529945373535, "global_step": 291400, "epoch": 1734} {"train_loss": -12.339374542236328, "global_step": 291401, "epoch": 1734} {"train_loss": -12.313090324401855, "global_step": 291402, "epoch": 1734} {"train_loss": -12.327183723449707, "global_step": 291403, "epoch": 1734} {"train_loss": -12.426907539367676, "global_step": 291404, "epoch": 1734} {"train_loss": -12.082748413085938, "global_step": 291405, "epoch": 1734} {"train_loss": -11.958490371704102, "global_step": 291406, "epoch": 1734} {"train_loss": -12.298145294189453, "global_step": 291407, "epoch": 1734} {"train_loss": -11.990123748779297, "global_step": 291408, "epoch": 1734} {"train_loss": -12.285906791687012, "global_step": 291409, "epoch": 1734} {"train_loss": -12.350252151489258, "global_step": 291410, "epoch": 1734} {"train_loss": -12.417072296142578, "global_step": 291411, "epoch": 1734} {"train_loss": -11.781113624572754, "global_step": 291412, "epoch": 1734} {"train_loss": -11.998868942260742, "global_step": 291413, "epoch": 1734} {"train_loss": -12.072991371154785, "global_step": 291414, "epoch": 1734} {"train_loss": -12.427064895629883, "global_step": 291415, "epoch": 1734} {"train_loss": -11.736601829528809, "global_step": 291416, "epoch": 1734} {"train_loss": -11.785825729370117, "global_step": 291417, "epoch": 1734} {"train_loss": -12.032574653625488, "global_step": 291418, "epoch": 1734} {"train_loss": -12.442329406738281, "global_step": 291419, "epoch": 1734} {"train_loss": -11.741800308227539, "global_step": 291420, "epoch": 1734} {"train_loss": -12.051176071166992, "global_step": 291421, "epoch": 1734} {"train_loss": -12.366666793823242, "global_step": 291422, "epoch": 1734} {"train_loss": -12.263092041015625, "global_step": 291423, "epoch": 1734} {"train_loss": -11.709619522094727, "global_step": 291424, "epoch": 1734} {"train_loss": -10.658773422241211, "global_step": 291425, "epoch": 1734} {"train_loss": -11.47689437866211, "global_step": 291426, "epoch": 1734} {"train_loss": -12.076085090637207, "global_step": 291427, "epoch": 1734} {"train_loss": -10.533557891845703, "global_step": 291428, "epoch": 1734} {"train_loss": -10.351659774780273, "global_step": 291429, "epoch": 1734} {"train_loss": -11.941193580627441, "global_step": 291430, "epoch": 1734} {"train_loss": -11.664457321166992, "global_step": 291431, "epoch": 1734} {"train_loss": -11.099769592285156, "global_step": 291432, "epoch": 1734} {"train_loss": -11.855769157409668, "global_step": 291433, "epoch": 1734} {"train_loss": -11.837797164916992, "global_step": 291434, "epoch": 1734} {"train_loss": -10.824636459350586, "global_step": 291435, "epoch": 1734} {"train_loss": -11.495790481567383, "global_step": 291436, "epoch": 1734} {"train_loss": -12.043785095214844, "global_step": 291437, "epoch": 1734} {"train_loss": -11.12937068939209, "global_step": 291438, "epoch": 1734} {"train_loss": -11.863947868347168, "global_step": 291439, "epoch": 1734} {"train_loss": -11.211938858032227, "global_step": 291440, "epoch": 1734} {"train_loss": -11.075945854187012, "global_step": 291441, "epoch": 1734} {"train_loss": -12.02406120300293, "global_step": 291442, "epoch": 1734} {"train_loss": -11.796514511108398, "global_step": 291443, "epoch": 1734} {"train_loss": -11.470932006835938, "global_step": 291444, "epoch": 1734} {"train_loss": -11.52801513671875, "global_step": 291445, "epoch": 1734} {"train_loss": -11.472576141357422, "global_step": 291446, "epoch": 1734} {"train_loss": -11.927633285522461, "global_step": 291447, "epoch": 1734} {"train_loss": -11.164301872253418, "global_step": 291448, "epoch": 1734} {"train_loss": -11.848255157470703, "global_step": 291449, "epoch": 1734} {"train_loss": -11.614864349365234, "global_step": 291450, "epoch": 1734} {"train_loss": -11.977202415466309, "global_step": 291451, "epoch": 1734} {"train_loss": -11.942815780639648, "global_step": 291452, "epoch": 1734} {"train_loss": -11.798317909240723, "global_step": 291453, "epoch": 1734} {"train_loss": -11.972929000854492, "global_step": 291454, "epoch": 1734} {"train_loss": -11.757043838500977, "global_step": 291455, "epoch": 1734} {"train_loss": -11.96041488647461, "global_step": 291456, "epoch": 1734} {"train_loss": -11.447949409484863, "global_step": 291457, "epoch": 1734} {"train_loss": -11.924266815185547, "global_step": 291458, "epoch": 1734} {"train_loss": -11.013847351074219, "global_step": 291459, "epoch": 1734} {"train_loss": -12.161392211914062, "global_step": 291460, "epoch": 1734} {"train_loss": -11.280760765075684, "global_step": 291461, "epoch": 1734} {"train_loss": -11.762532234191895, "global_step": 291462, "epoch": 1734} {"train_loss": -11.853569030761719, "global_step": 291463, "epoch": 1734} {"train_loss": -11.250055313110352, "global_step": 291464, "epoch": 1734} {"train_loss": -12.105463027954102, "global_step": 291465, "epoch": 1734} {"train_loss": -10.397808074951172, "global_step": 291466, "epoch": 1734} {"train_loss": -10.454216003417969, "global_step": 291467, "epoch": 1734} {"train_loss": -10.991979598999023, "global_step": 291468, "epoch": 1734} {"train_loss": -10.401707649230957, "global_step": 291469, "epoch": 1734} {"train_loss": -11.68113899230957, "global_step": 291470, "epoch": 1734} {"train_loss": -11.408120155334473, "global_step": 291471, "epoch": 1734} {"train_loss": -10.877243041992188, "global_step": 291472, "epoch": 1734} {"train_loss": -11.687885284423828, "global_step": 291473, "epoch": 1734} {"train_loss": -10.405378341674805, "global_step": 291474, "epoch": 1734} {"train_loss": -11.947126388549805, "global_step": 291475, "epoch": 1734} {"train_loss": -11.24692153930664, "global_step": 291476, "epoch": 1734} {"train_loss": -10.573147773742676, "global_step": 291477, "epoch": 1734} {"train_loss": -11.191444396972656, "global_step": 291478, "epoch": 1734} {"train_loss": -11.615336940402077, "global_step": 291479, "epoch": 1734, "val_loss": 279141.71875} {"train_loss": -10.379995346069336, "global_step": 291480, "epoch": 1735} {"train_loss": -11.633071899414062, "global_step": 291481, "epoch": 1735} {"train_loss": -10.475488662719727, "global_step": 291482, "epoch": 1735} {"train_loss": -11.047172546386719, "global_step": 291483, "epoch": 1735} {"train_loss": -10.736248970031738, "global_step": 291484, "epoch": 1735} {"train_loss": -11.32187557220459, "global_step": 291485, "epoch": 1735} {"train_loss": -11.495380401611328, "global_step": 291486, "epoch": 1735} {"train_loss": -11.777303695678711, "global_step": 291487, "epoch": 1735} {"train_loss": -11.247689247131348, "global_step": 291488, "epoch": 1735} {"train_loss": -11.417314529418945, "global_step": 291489, "epoch": 1735} {"train_loss": -11.548794746398926, "global_step": 291490, "epoch": 1735} {"train_loss": -12.028116226196289, "global_step": 291491, "epoch": 1735} {"train_loss": -11.722052574157715, "global_step": 291492, "epoch": 1735} {"train_loss": -11.830290794372559, "global_step": 291493, "epoch": 1735} {"train_loss": -11.594016075134277, "global_step": 291494, "epoch": 1735} {"train_loss": -12.013392448425293, "global_step": 291495, "epoch": 1735} {"train_loss": -11.885761260986328, "global_step": 291496, "epoch": 1735} {"train_loss": -11.883795738220215, "global_step": 291497, "epoch": 1735} {"train_loss": -11.714622497558594, "global_step": 291498, "epoch": 1735} {"train_loss": -11.67995834350586, "global_step": 291499, "epoch": 1735} {"train_loss": -11.422082901000977, "global_step": 291500, "epoch": 1735} {"train_loss": -12.19621753692627, "global_step": 291501, "epoch": 1735} {"train_loss": -11.387749671936035, "global_step": 291502, "epoch": 1735} {"train_loss": -11.999350547790527, "global_step": 291503, "epoch": 1735} {"train_loss": -11.705042839050293, "global_step": 291504, "epoch": 1735} {"train_loss": -12.140829086303711, "global_step": 291505, "epoch": 1735} {"train_loss": -11.808944702148438, "global_step": 291506, "epoch": 1735} {"train_loss": -12.088176727294922, "global_step": 291507, "epoch": 1735} {"train_loss": -12.03873062133789, "global_step": 291508, "epoch": 1735} {"train_loss": -12.111146926879883, "global_step": 291509, "epoch": 1735} {"train_loss": -11.978352546691895, "global_step": 291510, "epoch": 1735} {"train_loss": -12.196271896362305, "global_step": 291511, "epoch": 1735} {"train_loss": -11.889039039611816, "global_step": 291512, "epoch": 1735} {"train_loss": -11.895024299621582, "global_step": 291513, "epoch": 1735} {"train_loss": -11.71548843383789, "global_step": 291514, "epoch": 1735} {"train_loss": -12.101156234741211, "global_step": 291515, "epoch": 1735} {"train_loss": -11.994607925415039, "global_step": 291516, "epoch": 1735} {"train_loss": -11.933144569396973, "global_step": 291517, "epoch": 1735} {"train_loss": -12.149993896484375, "global_step": 291518, "epoch": 1735} {"train_loss": -11.980175018310547, "global_step": 291519, "epoch": 1735} {"train_loss": -12.173704147338867, "global_step": 291520, "epoch": 1735} {"train_loss": -12.161362648010254, "global_step": 291521, "epoch": 1735} {"train_loss": -12.214792251586914, "global_step": 291522, "epoch": 1735} {"train_loss": -12.19906234741211, "global_step": 291523, "epoch": 1735} {"train_loss": -12.506088256835938, "global_step": 291524, "epoch": 1735} {"train_loss": -12.268726348876953, "global_step": 291525, "epoch": 1735} {"train_loss": -12.219547271728516, "global_step": 291526, "epoch": 1735} {"train_loss": -12.168180465698242, "global_step": 291527, "epoch": 1735} {"train_loss": -12.17823314666748, "global_step": 291528, "epoch": 1735} {"train_loss": -12.259075164794922, "global_step": 291529, "epoch": 1735} {"train_loss": -12.249723434448242, "global_step": 291530, "epoch": 1735} {"train_loss": -12.049644470214844, "global_step": 291531, "epoch": 1735} {"train_loss": -12.280158996582031, "global_step": 291532, "epoch": 1735} {"train_loss": -12.205053329467773, "global_step": 291533, "epoch": 1735} {"train_loss": -12.406587600708008, "global_step": 291534, "epoch": 1735} {"train_loss": -11.949219703674316, "global_step": 291535, "epoch": 1735} {"train_loss": -12.23434829711914, "global_step": 291536, "epoch": 1735} {"train_loss": -12.295964241027832, "global_step": 291537, "epoch": 1735} {"train_loss": -12.32260799407959, "global_step": 291538, "epoch": 1735} {"train_loss": -12.181156158447266, "global_step": 291539, "epoch": 1735} {"train_loss": -12.21951675415039, "global_step": 291540, "epoch": 1735} {"train_loss": -11.748647689819336, "global_step": 291541, "epoch": 1735} {"train_loss": -11.708383560180664, "global_step": 291542, "epoch": 1735} {"train_loss": -11.442315101623535, "global_step": 291543, "epoch": 1735} {"train_loss": -11.293548583984375, "global_step": 291544, "epoch": 1735} {"train_loss": -11.400672912597656, "global_step": 291545, "epoch": 1735} {"train_loss": -11.413017272949219, "global_step": 291546, "epoch": 1735} {"train_loss": -10.448858261108398, "global_step": 291547, "epoch": 1735} {"train_loss": -10.533954620361328, "global_step": 291548, "epoch": 1735} {"train_loss": -11.628418922424316, "global_step": 291549, "epoch": 1735} {"train_loss": -11.165786743164062, "global_step": 291550, "epoch": 1735} {"train_loss": -11.32813835144043, "global_step": 291551, "epoch": 1735} {"train_loss": -9.348936080932617, "global_step": 291552, "epoch": 1735} {"train_loss": -10.482561111450195, "global_step": 291553, "epoch": 1735} {"train_loss": -10.275875091552734, "global_step": 291554, "epoch": 1735} {"train_loss": -10.452850341796875, "global_step": 291555, "epoch": 1735} {"train_loss": -9.885565757751465, "global_step": 291556, "epoch": 1735} {"train_loss": -10.028947830200195, "global_step": 291557, "epoch": 1735} {"train_loss": -9.805400848388672, "global_step": 291558, "epoch": 1735} {"train_loss": -10.344438552856445, "global_step": 291559, "epoch": 1735} {"train_loss": -10.494745254516602, "global_step": 291560, "epoch": 1735} {"train_loss": -10.231609344482422, "global_step": 291561, "epoch": 1735} {"train_loss": -11.19094467163086, "global_step": 291562, "epoch": 1735} {"train_loss": -10.93826675415039, "global_step": 291563, "epoch": 1735} {"train_loss": -11.23771858215332, "global_step": 291564, "epoch": 1735} {"train_loss": -11.392056465148926, "global_step": 291565, "epoch": 1735} {"train_loss": -11.55154037475586, "global_step": 291566, "epoch": 1735} {"train_loss": -10.799196243286133, "global_step": 291567, "epoch": 1735} {"train_loss": -10.880260467529297, "global_step": 291568, "epoch": 1735} {"train_loss": -10.978233337402344, "global_step": 291569, "epoch": 1735} {"train_loss": -11.037622451782227, "global_step": 291570, "epoch": 1735} {"train_loss": -10.977489471435547, "global_step": 291571, "epoch": 1735} {"train_loss": -11.308332443237305, "global_step": 291572, "epoch": 1735} {"train_loss": -11.104649543762207, "global_step": 291573, "epoch": 1735} {"train_loss": -11.711835861206055, "global_step": 291574, "epoch": 1735} {"train_loss": -11.075048446655273, "global_step": 291575, "epoch": 1735} {"train_loss": -11.365998268127441, "global_step": 291576, "epoch": 1735} {"train_loss": -11.69029712677002, "global_step": 291577, "epoch": 1735} {"train_loss": -11.17049789428711, "global_step": 291578, "epoch": 1735} {"train_loss": -11.59682846069336, "global_step": 291579, "epoch": 1735} {"train_loss": -11.52501106262207, "global_step": 291580, "epoch": 1735} {"train_loss": -11.235219955444336, "global_step": 291581, "epoch": 1735} {"train_loss": -11.601905822753906, "global_step": 291582, "epoch": 1735} {"train_loss": -11.130809783935547, "global_step": 291583, "epoch": 1735} {"train_loss": -11.656866073608398, "global_step": 291584, "epoch": 1735} {"train_loss": -11.636009216308594, "global_step": 291585, "epoch": 1735} {"train_loss": -11.539701461791992, "global_step": 291586, "epoch": 1735} {"train_loss": -11.83895492553711, "global_step": 291587, "epoch": 1735} {"train_loss": -11.849266052246094, "global_step": 291588, "epoch": 1735} {"train_loss": -11.651039123535156, "global_step": 291589, "epoch": 1735} {"train_loss": -11.685359954833984, "global_step": 291590, "epoch": 1735} {"train_loss": -11.937118530273438, "global_step": 291591, "epoch": 1735} {"train_loss": -11.086978912353516, "global_step": 291592, "epoch": 1735} {"train_loss": -12.02604866027832, "global_step": 291593, "epoch": 1735} {"train_loss": -11.386239051818848, "global_step": 291594, "epoch": 1735} {"train_loss": -12.112652778625488, "global_step": 291595, "epoch": 1735} {"train_loss": -11.714889526367188, "global_step": 291596, "epoch": 1735} {"train_loss": -11.892677307128906, "global_step": 291597, "epoch": 1735} {"train_loss": -11.899728775024414, "global_step": 291598, "epoch": 1735} {"train_loss": -11.655902862548828, "global_step": 291599, "epoch": 1735} {"train_loss": -11.703840255737305, "global_step": 291600, "epoch": 1735} {"train_loss": -11.9286470413208, "global_step": 291601, "epoch": 1735} {"train_loss": -11.67120361328125, "global_step": 291602, "epoch": 1735} {"train_loss": -11.987972259521484, "global_step": 291603, "epoch": 1735} {"train_loss": -11.90031623840332, "global_step": 291604, "epoch": 1735} {"train_loss": -11.91046142578125, "global_step": 291605, "epoch": 1735} {"train_loss": -12.296656608581543, "global_step": 291606, "epoch": 1735} {"train_loss": -11.815568923950195, "global_step": 291607, "epoch": 1735} {"train_loss": -12.275672912597656, "global_step": 291608, "epoch": 1735} {"train_loss": -11.722049713134766, "global_step": 291609, "epoch": 1735} {"train_loss": -12.035665512084961, "global_step": 291610, "epoch": 1735} {"train_loss": -11.847814559936523, "global_step": 291611, "epoch": 1735} {"train_loss": -11.86978816986084, "global_step": 291612, "epoch": 1735} {"train_loss": -11.65649127960205, "global_step": 291613, "epoch": 1735} {"train_loss": -11.921823501586914, "global_step": 291614, "epoch": 1735} {"train_loss": -11.827491760253906, "global_step": 291615, "epoch": 1735} {"train_loss": -11.887168884277344, "global_step": 291616, "epoch": 1735} {"train_loss": -11.712398529052734, "global_step": 291617, "epoch": 1735} {"train_loss": -11.912511825561523, "global_step": 291618, "epoch": 1735} {"train_loss": -11.655523300170898, "global_step": 291619, "epoch": 1735} {"train_loss": -11.559934616088867, "global_step": 291620, "epoch": 1735} {"train_loss": -11.676210403442383, "global_step": 291621, "epoch": 1735} {"train_loss": -11.79961109161377, "global_step": 291622, "epoch": 1735} {"train_loss": -11.58670425415039, "global_step": 291623, "epoch": 1735} {"train_loss": -11.753442764282227, "global_step": 291624, "epoch": 1735} {"train_loss": -11.579866409301758, "global_step": 291625, "epoch": 1735} {"train_loss": -12.000190734863281, "global_step": 291626, "epoch": 1735} {"train_loss": -11.78192138671875, "global_step": 291627, "epoch": 1735} {"train_loss": -11.675581932067871, "global_step": 291628, "epoch": 1735} {"train_loss": -11.931943893432617, "global_step": 291629, "epoch": 1735} {"train_loss": -11.765640258789062, "global_step": 291630, "epoch": 1735} {"train_loss": -11.950460433959961, "global_step": 291631, "epoch": 1735} {"train_loss": -11.918012619018555, "global_step": 291632, "epoch": 1735} {"train_loss": -11.978952407836914, "global_step": 291633, "epoch": 1735} {"train_loss": -12.276065826416016, "global_step": 291634, "epoch": 1735} {"train_loss": -11.986997604370117, "global_step": 291635, "epoch": 1735} {"train_loss": -11.993587493896484, "global_step": 291636, "epoch": 1735} {"train_loss": -12.359258651733398, "global_step": 291637, "epoch": 1735} {"train_loss": -11.972902297973633, "global_step": 291638, "epoch": 1735} {"train_loss": -11.772098541259766, "global_step": 291639, "epoch": 1735} {"train_loss": -12.322206497192383, "global_step": 291640, "epoch": 1735} {"train_loss": -11.947664260864258, "global_step": 291641, "epoch": 1735} {"train_loss": -11.892667770385742, "global_step": 291642, "epoch": 1735} {"train_loss": -12.339459419250488, "global_step": 291643, "epoch": 1735} {"train_loss": -12.064956665039062, "global_step": 291644, "epoch": 1735} {"train_loss": -12.353530883789062, "global_step": 291645, "epoch": 1735} {"train_loss": -12.170951843261719, "global_step": 291646, "epoch": 1735} {"train_loss": -11.652405148460751, "global_step": 291647, "epoch": 1735, "val_loss": 277287.96875, "train_action_mse_error": 2.914964437484741} {"train_loss": -12.105843544006348, "global_step": 291648, "epoch": 1736} {"train_loss": -12.075153350830078, "global_step": 291649, "epoch": 1736} {"train_loss": -12.259358406066895, "global_step": 291650, "epoch": 1736} {"train_loss": -11.912596702575684, "global_step": 291651, "epoch": 1736} {"train_loss": -11.920524597167969, "global_step": 291652, "epoch": 1736} {"train_loss": -11.968008041381836, "global_step": 291653, "epoch": 1736} {"train_loss": -12.017486572265625, "global_step": 291654, "epoch": 1736} {"train_loss": -11.656166076660156, "global_step": 291655, "epoch": 1736} {"train_loss": -12.070869445800781, "global_step": 291656, "epoch": 1736} {"train_loss": -11.521587371826172, "global_step": 291657, "epoch": 1736} {"train_loss": -12.121210098266602, "global_step": 291658, "epoch": 1736} {"train_loss": -11.942872047424316, "global_step": 291659, "epoch": 1736} {"train_loss": -11.707832336425781, "global_step": 291660, "epoch": 1736} {"train_loss": -11.924652099609375, "global_step": 291661, "epoch": 1736} {"train_loss": -11.938558578491211, "global_step": 291662, "epoch": 1736} {"train_loss": -11.618988037109375, "global_step": 291663, "epoch": 1736} {"train_loss": -12.16018009185791, "global_step": 291664, "epoch": 1736} {"train_loss": -12.191842079162598, "global_step": 291665, "epoch": 1736} {"train_loss": -11.75483512878418, "global_step": 291666, "epoch": 1736} {"train_loss": -12.116082191467285, "global_step": 291667, "epoch": 1736} {"train_loss": -12.052289962768555, "global_step": 291668, "epoch": 1736} {"train_loss": -12.419610977172852, "global_step": 291669, "epoch": 1736} {"train_loss": -12.184806823730469, "global_step": 291670, "epoch": 1736} {"train_loss": -12.090763092041016, "global_step": 291671, "epoch": 1736} {"train_loss": -12.166709899902344, "global_step": 291672, "epoch": 1736} {"train_loss": -12.398155212402344, "global_step": 291673, "epoch": 1736} {"train_loss": -12.264633178710938, "global_step": 291674, "epoch": 1736} {"train_loss": -12.258211135864258, "global_step": 291675, "epoch": 1736} {"train_loss": -11.7694091796875, "global_step": 291676, "epoch": 1736} {"train_loss": -12.415399551391602, "global_step": 291677, "epoch": 1736} {"train_loss": -11.938032150268555, "global_step": 291678, "epoch": 1736} {"train_loss": -12.23276424407959, "global_step": 291679, "epoch": 1736} {"train_loss": -11.970006942749023, "global_step": 291680, "epoch": 1736} {"train_loss": -12.105772972106934, "global_step": 291681, "epoch": 1736} {"train_loss": -11.192777633666992, "global_step": 291682, "epoch": 1736} {"train_loss": -12.153474807739258, "global_step": 291683, "epoch": 1736} {"train_loss": -11.604789733886719, "global_step": 291684, "epoch": 1736} {"train_loss": -12.013781547546387, "global_step": 291685, "epoch": 1736} {"train_loss": -11.97170352935791, "global_step": 291686, "epoch": 1736} {"train_loss": -11.748809814453125, "global_step": 291687, "epoch": 1736} {"train_loss": -11.416542053222656, "global_step": 291688, "epoch": 1736} {"train_loss": -10.8637113571167, "global_step": 291689, "epoch": 1736} {"train_loss": -12.267696380615234, "global_step": 291690, "epoch": 1736} {"train_loss": -10.544919967651367, "global_step": 291691, "epoch": 1736} {"train_loss": -10.654289245605469, "global_step": 291692, "epoch": 1736} {"train_loss": -11.860579490661621, "global_step": 291693, "epoch": 1736} {"train_loss": -11.34039306640625, "global_step": 291694, "epoch": 1736} {"train_loss": -8.85312271118164, "global_step": 291695, "epoch": 1736} {"train_loss": -11.00681209564209, "global_step": 291696, "epoch": 1736} {"train_loss": -10.22159481048584, "global_step": 291697, "epoch": 1736} {"train_loss": -11.30837345123291, "global_step": 291698, "epoch": 1736} {"train_loss": -11.597333908081055, "global_step": 291699, "epoch": 1736} {"train_loss": -11.457860946655273, "global_step": 291700, "epoch": 1736} {"train_loss": -10.90573787689209, "global_step": 291701, "epoch": 1736} {"train_loss": -11.68754768371582, "global_step": 291702, "epoch": 1736} {"train_loss": -11.19303035736084, "global_step": 291703, "epoch": 1736} {"train_loss": -11.165460586547852, "global_step": 291704, "epoch": 1736} {"train_loss": -11.71401596069336, "global_step": 291705, "epoch": 1736} {"train_loss": -11.001609802246094, "global_step": 291706, "epoch": 1736} {"train_loss": -10.800971984863281, "global_step": 291707, "epoch": 1736} {"train_loss": -10.7173490524292, "global_step": 291708, "epoch": 1736} {"train_loss": -10.800250053405762, "global_step": 291709, "epoch": 1736} {"train_loss": -10.845354080200195, "global_step": 291710, "epoch": 1736} {"train_loss": -11.674285888671875, "global_step": 291711, "epoch": 1736} {"train_loss": -11.210055351257324, "global_step": 291712, "epoch": 1736} {"train_loss": -11.523499488830566, "global_step": 291713, "epoch": 1736} {"train_loss": -11.03753662109375, "global_step": 291714, "epoch": 1736} {"train_loss": -11.345292091369629, "global_step": 291715, "epoch": 1736} {"train_loss": -11.457916259765625, "global_step": 291716, "epoch": 1736} {"train_loss": -11.743440628051758, "global_step": 291717, "epoch": 1736} {"train_loss": -11.705339431762695, "global_step": 291718, "epoch": 1736} {"train_loss": -11.154292106628418, "global_step": 291719, "epoch": 1736} {"train_loss": -11.567044258117676, "global_step": 291720, "epoch": 1736} {"train_loss": -11.126432418823242, "global_step": 291721, "epoch": 1736} {"train_loss": -11.453407287597656, "global_step": 291722, "epoch": 1736} {"train_loss": -11.627685546875, "global_step": 291723, "epoch": 1736} {"train_loss": -11.531590461730957, "global_step": 291724, "epoch": 1736} {"train_loss": -11.678010940551758, "global_step": 291725, "epoch": 1736} {"train_loss": -11.733491897583008, "global_step": 291726, "epoch": 1736} {"train_loss": -11.538185119628906, "global_step": 291727, "epoch": 1736} {"train_loss": -11.73175048828125, "global_step": 291728, "epoch": 1736} {"train_loss": -11.374268531799316, "global_step": 291729, "epoch": 1736} {"train_loss": -11.497366905212402, "global_step": 291730, "epoch": 1736} {"train_loss": -11.749524116516113, "global_step": 291731, "epoch": 1736} {"train_loss": -11.876148223876953, "global_step": 291732, "epoch": 1736} {"train_loss": -11.245001792907715, "global_step": 291733, "epoch": 1736} {"train_loss": -11.74766731262207, "global_step": 291734, "epoch": 1736} {"train_loss": -11.377315521240234, "global_step": 291735, "epoch": 1736} {"train_loss": -11.963361740112305, "global_step": 291736, "epoch": 1736} {"train_loss": -11.837556838989258, "global_step": 291737, "epoch": 1736} {"train_loss": -11.70089340209961, "global_step": 291738, "epoch": 1736} {"train_loss": -11.821240425109863, "global_step": 291739, "epoch": 1736} {"train_loss": -11.867368698120117, "global_step": 291740, "epoch": 1736} {"train_loss": -11.659703254699707, "global_step": 291741, "epoch": 1736} {"train_loss": -11.78381061553955, "global_step": 291742, "epoch": 1736} {"train_loss": -11.68674373626709, "global_step": 291743, "epoch": 1736} {"train_loss": -11.61324691772461, "global_step": 291744, "epoch": 1736} {"train_loss": -11.895404815673828, "global_step": 291745, "epoch": 1736} {"train_loss": -11.895846366882324, "global_step": 291746, "epoch": 1736} {"train_loss": -11.613805770874023, "global_step": 291747, "epoch": 1736} {"train_loss": -11.841691970825195, "global_step": 291748, "epoch": 1736} {"train_loss": -11.373733520507812, "global_step": 291749, "epoch": 1736} {"train_loss": -11.280315399169922, "global_step": 291750, "epoch": 1736} {"train_loss": -11.126483917236328, "global_step": 291751, "epoch": 1736} {"train_loss": -11.744794845581055, "global_step": 291752, "epoch": 1736} {"train_loss": -11.46496868133545, "global_step": 291753, "epoch": 1736} {"train_loss": -11.705044746398926, "global_step": 291754, "epoch": 1736} {"train_loss": -11.725400924682617, "global_step": 291755, "epoch": 1736} {"train_loss": -11.814616203308105, "global_step": 291756, "epoch": 1736} {"train_loss": -12.028279304504395, "global_step": 291757, "epoch": 1736} {"train_loss": -12.141083717346191, "global_step": 291758, "epoch": 1736} {"train_loss": -11.945899963378906, "global_step": 291759, "epoch": 1736} {"train_loss": -11.97745132446289, "global_step": 291760, "epoch": 1736} {"train_loss": -11.927245140075684, "global_step": 291761, "epoch": 1736} {"train_loss": -12.088848114013672, "global_step": 291762, "epoch": 1736} {"train_loss": -12.157526016235352, "global_step": 291763, "epoch": 1736} {"train_loss": -11.909969329833984, "global_step": 291764, "epoch": 1736} {"train_loss": -12.229524612426758, "global_step": 291765, "epoch": 1736} {"train_loss": -12.031452178955078, "global_step": 291766, "epoch": 1736} {"train_loss": -12.182384490966797, "global_step": 291767, "epoch": 1736} {"train_loss": -12.386253356933594, "global_step": 291768, "epoch": 1736} {"train_loss": -12.010879516601562, "global_step": 291769, "epoch": 1736} {"train_loss": -12.370437622070312, "global_step": 291770, "epoch": 1736} {"train_loss": -12.349742889404297, "global_step": 291771, "epoch": 1736} {"train_loss": -12.13358211517334, "global_step": 291772, "epoch": 1736} {"train_loss": -12.223306655883789, "global_step": 291773, "epoch": 1736} {"train_loss": -12.12942123413086, "global_step": 291774, "epoch": 1736} {"train_loss": -12.228145599365234, "global_step": 291775, "epoch": 1736} {"train_loss": -12.269275665283203, "global_step": 291776, "epoch": 1736} {"train_loss": -11.99102783203125, "global_step": 291777, "epoch": 1736} {"train_loss": -12.246716499328613, "global_step": 291778, "epoch": 1736} {"train_loss": -11.936939239501953, "global_step": 291779, "epoch": 1736} {"train_loss": -11.91093635559082, "global_step": 291780, "epoch": 1736} {"train_loss": -11.85163688659668, "global_step": 291781, "epoch": 1736} {"train_loss": -11.437103271484375, "global_step": 291782, "epoch": 1736} {"train_loss": -12.134764671325684, "global_step": 291783, "epoch": 1736} {"train_loss": -11.510986328125, "global_step": 291784, "epoch": 1736} {"train_loss": -11.914430618286133, "global_step": 291785, "epoch": 1736} {"train_loss": -11.829962730407715, "global_step": 291786, "epoch": 1736} {"train_loss": -12.018418312072754, "global_step": 291787, "epoch": 1736} {"train_loss": -11.07461929321289, "global_step": 291788, "epoch": 1736} {"train_loss": -12.118692398071289, "global_step": 291789, "epoch": 1736} {"train_loss": -11.328573226928711, "global_step": 291790, "epoch": 1736} {"train_loss": -12.116255760192871, "global_step": 291791, "epoch": 1736} {"train_loss": -11.570777893066406, "global_step": 291792, "epoch": 1736} {"train_loss": -11.885879516601562, "global_step": 291793, "epoch": 1736} {"train_loss": -11.842960357666016, "global_step": 291794, "epoch": 1736} {"train_loss": -11.780686378479004, "global_step": 291795, "epoch": 1736} {"train_loss": -12.010186195373535, "global_step": 291796, "epoch": 1736} {"train_loss": -11.81010627746582, "global_step": 291797, "epoch": 1736} {"train_loss": -11.699905395507812, "global_step": 291798, "epoch": 1736} {"train_loss": -10.9447021484375, "global_step": 291799, "epoch": 1736} {"train_loss": -12.182351112365723, "global_step": 291800, "epoch": 1736} {"train_loss": -11.606689453125, "global_step": 291801, "epoch": 1736} {"train_loss": -11.580157279968262, "global_step": 291802, "epoch": 1736} {"train_loss": -12.314244270324707, "global_step": 291803, "epoch": 1736} {"train_loss": -11.948720932006836, "global_step": 291804, "epoch": 1736} {"train_loss": -11.568426132202148, "global_step": 291805, "epoch": 1736} {"train_loss": -12.399735450744629, "global_step": 291806, "epoch": 1736} {"train_loss": -12.088717460632324, "global_step": 291807, "epoch": 1736} {"train_loss": -11.708571434020996, "global_step": 291808, "epoch": 1736} {"train_loss": -11.917764663696289, "global_step": 291809, "epoch": 1736} {"train_loss": -11.673372268676758, "global_step": 291810, "epoch": 1736} {"train_loss": -12.293596267700195, "global_step": 291811, "epoch": 1736} {"train_loss": -11.6951265335083, "global_step": 291812, "epoch": 1736} {"train_loss": -12.18238639831543, "global_step": 291813, "epoch": 1736} {"train_loss": -12.151573181152344, "global_step": 291814, "epoch": 1736} {"train_loss": -11.738415224211556, "global_step": 291815, "epoch": 1736, "val_loss": 279743.53125} {"train_loss": -11.736053466796875, "global_step": 291816, "epoch": 1737} {"train_loss": -11.908417701721191, "global_step": 291817, "epoch": 1737} {"train_loss": -11.633726119995117, "global_step": 291818, "epoch": 1737} {"train_loss": -11.63786506652832, "global_step": 291819, "epoch": 1737} {"train_loss": -12.070003509521484, "global_step": 291820, "epoch": 1737} {"train_loss": -11.658729553222656, "global_step": 291821, "epoch": 1737} {"train_loss": -11.825922012329102, "global_step": 291822, "epoch": 1737} {"train_loss": -11.658008575439453, "global_step": 291823, "epoch": 1737} {"train_loss": -12.07489013671875, "global_step": 291824, "epoch": 1737} {"train_loss": -12.071252822875977, "global_step": 291825, "epoch": 1737} {"train_loss": -12.054141998291016, "global_step": 291826, "epoch": 1737} {"train_loss": -12.301729202270508, "global_step": 291827, "epoch": 1737} {"train_loss": -12.04090690612793, "global_step": 291828, "epoch": 1737} {"train_loss": -11.62541389465332, "global_step": 291829, "epoch": 1737} {"train_loss": -11.879137992858887, "global_step": 291830, "epoch": 1737} {"train_loss": -12.339048385620117, "global_step": 291831, "epoch": 1737} {"train_loss": -11.781257629394531, "global_step": 291832, "epoch": 1737} {"train_loss": -12.161831855773926, "global_step": 291833, "epoch": 1737} {"train_loss": -12.100500106811523, "global_step": 291834, "epoch": 1737} {"train_loss": -11.55198860168457, "global_step": 291835, "epoch": 1737} {"train_loss": -11.981204986572266, "global_step": 291836, "epoch": 1737} {"train_loss": -11.92170524597168, "global_step": 291837, "epoch": 1737} {"train_loss": -11.619482040405273, "global_step": 291838, "epoch": 1737} {"train_loss": -12.274080276489258, "global_step": 291839, "epoch": 1737} {"train_loss": -11.786600112915039, "global_step": 291840, "epoch": 1737} {"train_loss": -12.039447784423828, "global_step": 291841, "epoch": 1737} {"train_loss": -12.154129028320312, "global_step": 291842, "epoch": 1737} {"train_loss": -11.300905227661133, "global_step": 291843, "epoch": 1737} {"train_loss": -11.600191116333008, "global_step": 291844, "epoch": 1737} {"train_loss": -12.125153541564941, "global_step": 291845, "epoch": 1737} {"train_loss": -11.399876594543457, "global_step": 291846, "epoch": 1737} {"train_loss": -12.297714233398438, "global_step": 291847, "epoch": 1737} {"train_loss": -11.81778335571289, "global_step": 291848, "epoch": 1737} {"train_loss": -12.588825225830078, "global_step": 291849, "epoch": 1737} {"train_loss": -11.198092460632324, "global_step": 291850, "epoch": 1737} {"train_loss": -12.336606979370117, "global_step": 291851, "epoch": 1737} {"train_loss": -11.701805114746094, "global_step": 291852, "epoch": 1737} {"train_loss": -12.038787841796875, "global_step": 291853, "epoch": 1737} {"train_loss": -11.965139389038086, "global_step": 291854, "epoch": 1737} {"train_loss": -12.060623168945312, "global_step": 291855, "epoch": 1737} {"train_loss": -11.704023361206055, "global_step": 291856, "epoch": 1737} {"train_loss": -11.362263679504395, "global_step": 291857, "epoch": 1737} {"train_loss": -11.244457244873047, "global_step": 291858, "epoch": 1737} {"train_loss": -11.285627365112305, "global_step": 291859, "epoch": 1737} {"train_loss": -12.05361557006836, "global_step": 291860, "epoch": 1737} {"train_loss": -11.269245147705078, "global_step": 291861, "epoch": 1737} {"train_loss": -11.223278045654297, "global_step": 291862, "epoch": 1737} {"train_loss": -11.289915084838867, "global_step": 291863, "epoch": 1737} {"train_loss": -12.000303268432617, "global_step": 291864, "epoch": 1737} {"train_loss": -11.596275329589844, "global_step": 291865, "epoch": 1737} {"train_loss": -11.446712493896484, "global_step": 291866, "epoch": 1737} {"train_loss": -11.88545036315918, "global_step": 291867, "epoch": 1737} {"train_loss": -10.716062545776367, "global_step": 291868, "epoch": 1737} {"train_loss": -12.151132583618164, "global_step": 291869, "epoch": 1737} {"train_loss": -10.584964752197266, "global_step": 291870, "epoch": 1737} {"train_loss": -11.897199630737305, "global_step": 291871, "epoch": 1737} {"train_loss": -11.65626335144043, "global_step": 291872, "epoch": 1737} {"train_loss": -11.554450035095215, "global_step": 291873, "epoch": 1737} {"train_loss": -12.042333602905273, "global_step": 291874, "epoch": 1737} {"train_loss": -11.335054397583008, "global_step": 291875, "epoch": 1737} {"train_loss": -11.935966491699219, "global_step": 291876, "epoch": 1737} {"train_loss": -11.343578338623047, "global_step": 291877, "epoch": 1737} {"train_loss": -11.821151733398438, "global_step": 291878, "epoch": 1737} {"train_loss": -11.670955657958984, "global_step": 291879, "epoch": 1737} {"train_loss": -11.660804748535156, "global_step": 291880, "epoch": 1737} {"train_loss": -11.489465713500977, "global_step": 291881, "epoch": 1737} {"train_loss": -11.394062042236328, "global_step": 291882, "epoch": 1737} {"train_loss": -11.985213279724121, "global_step": 291883, "epoch": 1737} {"train_loss": -11.648675918579102, "global_step": 291884, "epoch": 1737} {"train_loss": -11.833831787109375, "global_step": 291885, "epoch": 1737} {"train_loss": -11.349678039550781, "global_step": 291886, "epoch": 1737} {"train_loss": -12.116829872131348, "global_step": 291887, "epoch": 1737} {"train_loss": -11.844636917114258, "global_step": 291888, "epoch": 1737} {"train_loss": -11.470706939697266, "global_step": 291889, "epoch": 1737} {"train_loss": -11.686580657958984, "global_step": 291890, "epoch": 1737} {"train_loss": -11.708602905273438, "global_step": 291891, "epoch": 1737} {"train_loss": -12.089929580688477, "global_step": 291892, "epoch": 1737} {"train_loss": -11.54018783569336, "global_step": 291893, "epoch": 1737} {"train_loss": -11.663148880004883, "global_step": 291894, "epoch": 1737} {"train_loss": -11.798149108886719, "global_step": 291895, "epoch": 1737} {"train_loss": -11.189563751220703, "global_step": 291896, "epoch": 1737} {"train_loss": -12.082822799682617, "global_step": 291897, "epoch": 1737} {"train_loss": -11.697028160095215, "global_step": 291898, "epoch": 1737} {"train_loss": -11.898083686828613, "global_step": 291899, "epoch": 1737} {"train_loss": -11.642887115478516, "global_step": 291900, "epoch": 1737} {"train_loss": -11.78806209564209, "global_step": 291901, "epoch": 1737} {"train_loss": -12.101593017578125, "global_step": 291902, "epoch": 1737} {"train_loss": -12.134315490722656, "global_step": 291903, "epoch": 1737} {"train_loss": -11.971746444702148, "global_step": 291904, "epoch": 1737} {"train_loss": -11.579192161560059, "global_step": 291905, "epoch": 1737} {"train_loss": -11.926596641540527, "global_step": 291906, "epoch": 1737} {"train_loss": -12.187300682067871, "global_step": 291907, "epoch": 1737} {"train_loss": -11.63909912109375, "global_step": 291908, "epoch": 1737} {"train_loss": -12.103401184082031, "global_step": 291909, "epoch": 1737} {"train_loss": -11.61480712890625, "global_step": 291910, "epoch": 1737} {"train_loss": -11.899130821228027, "global_step": 291911, "epoch": 1737} {"train_loss": -12.051445007324219, "global_step": 291912, "epoch": 1737} {"train_loss": -11.963565826416016, "global_step": 291913, "epoch": 1737} {"train_loss": -11.928417205810547, "global_step": 291914, "epoch": 1737} {"train_loss": -12.241568565368652, "global_step": 291915, "epoch": 1737} {"train_loss": -12.12741470336914, "global_step": 291916, "epoch": 1737} {"train_loss": -11.762489318847656, "global_step": 291917, "epoch": 1737} {"train_loss": -12.004377365112305, "global_step": 291918, "epoch": 1737} {"train_loss": -12.034449577331543, "global_step": 291919, "epoch": 1737} {"train_loss": -11.987167358398438, "global_step": 291920, "epoch": 1737} {"train_loss": -12.003620147705078, "global_step": 291921, "epoch": 1737} {"train_loss": -12.145685195922852, "global_step": 291922, "epoch": 1737} {"train_loss": -12.091785430908203, "global_step": 291923, "epoch": 1737} {"train_loss": -12.201898574829102, "global_step": 291924, "epoch": 1737} {"train_loss": -12.180374145507812, "global_step": 291925, "epoch": 1737} {"train_loss": -12.145764350891113, "global_step": 291926, "epoch": 1737} {"train_loss": -12.30087661743164, "global_step": 291927, "epoch": 1737} {"train_loss": -11.79496955871582, "global_step": 291928, "epoch": 1737} {"train_loss": -12.327112197875977, "global_step": 291929, "epoch": 1737} {"train_loss": -12.0967435836792, "global_step": 291930, "epoch": 1737} {"train_loss": -12.331011772155762, "global_step": 291931, "epoch": 1737} {"train_loss": -12.046753883361816, "global_step": 291932, "epoch": 1737} {"train_loss": -12.291726112365723, "global_step": 291933, "epoch": 1737} {"train_loss": -12.053043365478516, "global_step": 291934, "epoch": 1737} {"train_loss": -12.165271759033203, "global_step": 291935, "epoch": 1737} {"train_loss": -12.243744850158691, "global_step": 291936, "epoch": 1737} {"train_loss": -12.024486541748047, "global_step": 291937, "epoch": 1737} {"train_loss": -12.347559928894043, "global_step": 291938, "epoch": 1737} {"train_loss": -12.234490394592285, "global_step": 291939, "epoch": 1737} {"train_loss": -12.04423999786377, "global_step": 291940, "epoch": 1737} {"train_loss": -12.12331771850586, "global_step": 291941, "epoch": 1737} {"train_loss": -12.306243896484375, "global_step": 291942, "epoch": 1737} {"train_loss": -12.145906448364258, "global_step": 291943, "epoch": 1737} {"train_loss": -12.046655654907227, "global_step": 291944, "epoch": 1737} {"train_loss": -12.164305686950684, "global_step": 291945, "epoch": 1737} {"train_loss": -12.139997482299805, "global_step": 291946, "epoch": 1737} {"train_loss": -12.014548301696777, "global_step": 291947, "epoch": 1737} {"train_loss": -11.748529434204102, "global_step": 291948, "epoch": 1737} {"train_loss": -11.983592987060547, "global_step": 291949, "epoch": 1737} {"train_loss": -12.181943893432617, "global_step": 291950, "epoch": 1737} {"train_loss": -12.321538925170898, "global_step": 291951, "epoch": 1737} {"train_loss": -12.336040496826172, "global_step": 291952, "epoch": 1737} {"train_loss": -12.172541618347168, "global_step": 291953, "epoch": 1737} {"train_loss": -12.095832824707031, "global_step": 291954, "epoch": 1737} {"train_loss": -12.143808364868164, "global_step": 291955, "epoch": 1737} {"train_loss": -12.282960891723633, "global_step": 291956, "epoch": 1737} {"train_loss": -12.299409866333008, "global_step": 291957, "epoch": 1737} {"train_loss": -12.312957763671875, "global_step": 291958, "epoch": 1737} {"train_loss": -11.657381057739258, "global_step": 291959, "epoch": 1737} {"train_loss": -10.628618240356445, "global_step": 291960, "epoch": 1737} {"train_loss": -10.356027603149414, "global_step": 291961, "epoch": 1737} {"train_loss": -12.518024444580078, "global_step": 291962, "epoch": 1737} {"train_loss": -10.003643035888672, "global_step": 291963, "epoch": 1737} {"train_loss": -11.20821475982666, "global_step": 291964, "epoch": 1737} {"train_loss": -11.560320854187012, "global_step": 291965, "epoch": 1737} {"train_loss": -10.51572036743164, "global_step": 291966, "epoch": 1737} {"train_loss": -10.118280410766602, "global_step": 291967, "epoch": 1737} {"train_loss": -12.056500434875488, "global_step": 291968, "epoch": 1737} {"train_loss": -11.095285415649414, "global_step": 291969, "epoch": 1737} {"train_loss": -10.842446327209473, "global_step": 291970, "epoch": 1737} {"train_loss": -11.702627182006836, "global_step": 291971, "epoch": 1737} {"train_loss": -11.205604553222656, "global_step": 291972, "epoch": 1737} {"train_loss": -11.412322998046875, "global_step": 291973, "epoch": 1737} {"train_loss": -11.75823974609375, "global_step": 291974, "epoch": 1737} {"train_loss": -10.937690734863281, "global_step": 291975, "epoch": 1737} {"train_loss": -11.881868362426758, "global_step": 291976, "epoch": 1737} {"train_loss": -10.96313190460205, "global_step": 291977, "epoch": 1737} {"train_loss": -11.063861846923828, "global_step": 291978, "epoch": 1737} {"train_loss": -11.946517944335938, "global_step": 291979, "epoch": 1737} {"train_loss": -11.485276222229004, "global_step": 291980, "epoch": 1737} {"train_loss": -11.458118438720703, "global_step": 291981, "epoch": 1737} {"train_loss": -11.815173149108887, "global_step": 291982, "epoch": 1737} {"train_loss": -11.797228852907816, "global_step": 291983, "epoch": 1737, "val_loss": 281316.0} {"train_loss": -11.59812068939209, "global_step": 291984, "epoch": 1738} {"train_loss": -11.68039321899414, "global_step": 291985, "epoch": 1738} {"train_loss": -11.410913467407227, "global_step": 291986, "epoch": 1738} {"train_loss": -11.189411163330078, "global_step": 291987, "epoch": 1738} {"train_loss": -11.631889343261719, "global_step": 291988, "epoch": 1738} {"train_loss": -11.696439743041992, "global_step": 291989, "epoch": 1738} {"train_loss": -12.107430458068848, "global_step": 291990, "epoch": 1738} {"train_loss": -11.896288871765137, "global_step": 291991, "epoch": 1738} {"train_loss": -11.353276252746582, "global_step": 291992, "epoch": 1738} {"train_loss": -11.840845108032227, "global_step": 291993, "epoch": 1738} {"train_loss": -11.931941986083984, "global_step": 291994, "epoch": 1738} {"train_loss": -11.8016996383667, "global_step": 291995, "epoch": 1738} {"train_loss": -11.895145416259766, "global_step": 291996, "epoch": 1738} {"train_loss": -11.514437675476074, "global_step": 291997, "epoch": 1738} {"train_loss": -11.74771499633789, "global_step": 291998, "epoch": 1738} {"train_loss": -11.74618911743164, "global_step": 291999, "epoch": 1738} {"train_loss": -11.752649307250977, "global_step": 292000, "epoch": 1738} {"train_loss": -12.111278533935547, "global_step": 292001, "epoch": 1738} {"train_loss": -11.820305824279785, "global_step": 292002, "epoch": 1738} {"train_loss": -11.908743858337402, "global_step": 292003, "epoch": 1738} {"train_loss": -12.048141479492188, "global_step": 292004, "epoch": 1738} {"train_loss": -12.153926849365234, "global_step": 292005, "epoch": 1738} {"train_loss": -11.905263900756836, "global_step": 292006, "epoch": 1738} {"train_loss": -12.15200424194336, "global_step": 292007, "epoch": 1738} {"train_loss": -12.161409378051758, "global_step": 292008, "epoch": 1738} {"train_loss": -12.132692337036133, "global_step": 292009, "epoch": 1738} {"train_loss": -12.126016616821289, "global_step": 292010, "epoch": 1738} {"train_loss": -12.073875427246094, "global_step": 292011, "epoch": 1738} {"train_loss": -12.331857681274414, "global_step": 292012, "epoch": 1738} {"train_loss": -12.12326431274414, "global_step": 292013, "epoch": 1738} {"train_loss": -12.061509132385254, "global_step": 292014, "epoch": 1738} {"train_loss": -11.946928024291992, "global_step": 292015, "epoch": 1738} {"train_loss": -12.13532829284668, "global_step": 292016, "epoch": 1738} {"train_loss": -12.133609771728516, "global_step": 292017, "epoch": 1738} {"train_loss": -12.176076889038086, "global_step": 292018, "epoch": 1738} {"train_loss": -12.49300765991211, "global_step": 292019, "epoch": 1738} {"train_loss": -12.061237335205078, "global_step": 292020, "epoch": 1738} {"train_loss": -12.306449890136719, "global_step": 292021, "epoch": 1738} {"train_loss": -12.179977416992188, "global_step": 292022, "epoch": 1738} {"train_loss": -12.284358978271484, "global_step": 292023, "epoch": 1738} {"train_loss": -12.499154090881348, "global_step": 292024, "epoch": 1738} {"train_loss": -12.221647262573242, "global_step": 292025, "epoch": 1738} {"train_loss": -12.441875457763672, "global_step": 292026, "epoch": 1738} {"train_loss": -12.396500587463379, "global_step": 292027, "epoch": 1738} {"train_loss": -12.314754486083984, "global_step": 292028, "epoch": 1738} {"train_loss": -12.304067611694336, "global_step": 292029, "epoch": 1738} {"train_loss": -12.452895164489746, "global_step": 292030, "epoch": 1738} {"train_loss": -12.305978775024414, "global_step": 292031, "epoch": 1738} {"train_loss": -12.216403007507324, "global_step": 292032, "epoch": 1738} {"train_loss": -11.893952369689941, "global_step": 292033, "epoch": 1738} {"train_loss": -11.62452507019043, "global_step": 292034, "epoch": 1738} {"train_loss": -12.03973388671875, "global_step": 292035, "epoch": 1738} {"train_loss": -12.013092041015625, "global_step": 292036, "epoch": 1738} {"train_loss": -12.161388397216797, "global_step": 292037, "epoch": 1738} {"train_loss": -12.126016616821289, "global_step": 292038, "epoch": 1738} {"train_loss": -12.337320327758789, "global_step": 292039, "epoch": 1738} {"train_loss": -12.428646087646484, "global_step": 292040, "epoch": 1738} {"train_loss": -12.436792373657227, "global_step": 292041, "epoch": 1738} {"train_loss": -12.080424308776855, "global_step": 292042, "epoch": 1738} {"train_loss": -12.203723907470703, "global_step": 292043, "epoch": 1738} {"train_loss": -12.162894248962402, "global_step": 292044, "epoch": 1738} {"train_loss": -12.02243423461914, "global_step": 292045, "epoch": 1738} {"train_loss": -12.189329147338867, "global_step": 292046, "epoch": 1738} {"train_loss": -12.031719207763672, "global_step": 292047, "epoch": 1738} {"train_loss": -12.095067977905273, "global_step": 292048, "epoch": 1738} {"train_loss": -11.687067031860352, "global_step": 292049, "epoch": 1738} {"train_loss": -11.967052459716797, "global_step": 292050, "epoch": 1738} {"train_loss": -12.197484016418457, "global_step": 292051, "epoch": 1738} {"train_loss": -11.93545150756836, "global_step": 292052, "epoch": 1738} {"train_loss": -12.016921997070312, "global_step": 292053, "epoch": 1738} {"train_loss": -11.966482162475586, "global_step": 292054, "epoch": 1738} {"train_loss": -12.044140815734863, "global_step": 292055, "epoch": 1738} {"train_loss": -11.880081176757812, "global_step": 292056, "epoch": 1738} {"train_loss": -11.97693920135498, "global_step": 292057, "epoch": 1738} {"train_loss": -11.407712936401367, "global_step": 292058, "epoch": 1738} {"train_loss": -11.821293830871582, "global_step": 292059, "epoch": 1738} {"train_loss": -11.647918701171875, "global_step": 292060, "epoch": 1738} {"train_loss": -11.942483901977539, "global_step": 292061, "epoch": 1738} {"train_loss": -11.741425514221191, "global_step": 292062, "epoch": 1738} {"train_loss": -12.099605560302734, "global_step": 292063, "epoch": 1738} {"train_loss": -11.696889877319336, "global_step": 292064, "epoch": 1738} {"train_loss": -11.604300498962402, "global_step": 292065, "epoch": 1738} {"train_loss": -11.609376907348633, "global_step": 292066, "epoch": 1738} {"train_loss": -11.684226989746094, "global_step": 292067, "epoch": 1738} {"train_loss": -11.87442684173584, "global_step": 292068, "epoch": 1738} {"train_loss": -10.793645858764648, "global_step": 292069, "epoch": 1738} {"train_loss": -12.011699676513672, "global_step": 292070, "epoch": 1738} {"train_loss": -10.843164443969727, "global_step": 292071, "epoch": 1738} {"train_loss": -11.981935501098633, "global_step": 292072, "epoch": 1738} {"train_loss": -11.543388366699219, "global_step": 292073, "epoch": 1738} {"train_loss": -11.967279434204102, "global_step": 292074, "epoch": 1738} {"train_loss": -11.826924324035645, "global_step": 292075, "epoch": 1738} {"train_loss": -11.803237915039062, "global_step": 292076, "epoch": 1738} {"train_loss": -11.474142074584961, "global_step": 292077, "epoch": 1738} {"train_loss": -11.999710083007812, "global_step": 292078, "epoch": 1738} {"train_loss": -11.955474853515625, "global_step": 292079, "epoch": 1738} {"train_loss": -12.162286758422852, "global_step": 292080, "epoch": 1738} {"train_loss": -12.026134490966797, "global_step": 292081, "epoch": 1738} {"train_loss": -12.212800025939941, "global_step": 292082, "epoch": 1738} {"train_loss": -11.971094131469727, "global_step": 292083, "epoch": 1738} {"train_loss": -11.683347702026367, "global_step": 292084, "epoch": 1738} {"train_loss": -11.70254898071289, "global_step": 292085, "epoch": 1738} {"train_loss": -11.96483325958252, "global_step": 292086, "epoch": 1738} {"train_loss": -11.903635025024414, "global_step": 292087, "epoch": 1738} {"train_loss": -11.543278694152832, "global_step": 292088, "epoch": 1738} {"train_loss": -11.404311180114746, "global_step": 292089, "epoch": 1738} {"train_loss": -11.854047775268555, "global_step": 292090, "epoch": 1738} {"train_loss": -11.225213050842285, "global_step": 292091, "epoch": 1738} {"train_loss": -12.060136795043945, "global_step": 292092, "epoch": 1738} {"train_loss": -11.320720672607422, "global_step": 292093, "epoch": 1738} {"train_loss": -12.249844551086426, "global_step": 292094, "epoch": 1738} {"train_loss": -11.370040893554688, "global_step": 292095, "epoch": 1738} {"train_loss": -11.811914443969727, "global_step": 292096, "epoch": 1738} {"train_loss": -11.491933822631836, "global_step": 292097, "epoch": 1738} {"train_loss": -11.198558807373047, "global_step": 292098, "epoch": 1738} {"train_loss": -10.940201759338379, "global_step": 292099, "epoch": 1738} {"train_loss": -10.12314224243164, "global_step": 292100, "epoch": 1738} {"train_loss": -11.09031867980957, "global_step": 292101, "epoch": 1738} {"train_loss": -9.508329391479492, "global_step": 292102, "epoch": 1738} {"train_loss": -11.198687553405762, "global_step": 292103, "epoch": 1738} {"train_loss": -9.961647033691406, "global_step": 292104, "epoch": 1738} {"train_loss": -9.41172981262207, "global_step": 292105, "epoch": 1738} {"train_loss": -9.69119644165039, "global_step": 292106, "epoch": 1738} {"train_loss": -9.92117691040039, "global_step": 292107, "epoch": 1738} {"train_loss": -8.472548484802246, "global_step": 292108, "epoch": 1738} {"train_loss": -9.453756332397461, "global_step": 292109, "epoch": 1738} {"train_loss": -10.063089370727539, "global_step": 292110, "epoch": 1738} {"train_loss": -9.676370620727539, "global_step": 292111, "epoch": 1738} {"train_loss": -10.719752311706543, "global_step": 292112, "epoch": 1738} {"train_loss": -10.261213302612305, "global_step": 292113, "epoch": 1738} {"train_loss": -10.49101448059082, "global_step": 292114, "epoch": 1738} {"train_loss": -10.762386322021484, "global_step": 292115, "epoch": 1738} {"train_loss": -10.899992942810059, "global_step": 292116, "epoch": 1738} {"train_loss": -11.237207412719727, "global_step": 292117, "epoch": 1738} {"train_loss": -10.09885025024414, "global_step": 292118, "epoch": 1738} {"train_loss": -10.364856719970703, "global_step": 292119, "epoch": 1738} {"train_loss": -11.081658363342285, "global_step": 292120, "epoch": 1738} {"train_loss": -10.390898704528809, "global_step": 292121, "epoch": 1738} {"train_loss": -11.153484344482422, "global_step": 292122, "epoch": 1738} {"train_loss": -11.008294105529785, "global_step": 292123, "epoch": 1738} {"train_loss": -11.190683364868164, "global_step": 292124, "epoch": 1738} {"train_loss": -11.06134033203125, "global_step": 292125, "epoch": 1738} {"train_loss": -11.012150764465332, "global_step": 292126, "epoch": 1738} {"train_loss": -11.588079452514648, "global_step": 292127, "epoch": 1738} {"train_loss": -11.507593154907227, "global_step": 292128, "epoch": 1738} {"train_loss": -11.474945068359375, "global_step": 292129, "epoch": 1738} {"train_loss": -11.554110527038574, "global_step": 292130, "epoch": 1738} {"train_loss": -11.259927749633789, "global_step": 292131, "epoch": 1738} {"train_loss": -11.24813461303711, "global_step": 292132, "epoch": 1738} {"train_loss": -11.296524047851562, "global_step": 292133, "epoch": 1738} {"train_loss": -11.346979141235352, "global_step": 292134, "epoch": 1738} {"train_loss": -11.507524490356445, "global_step": 292135, "epoch": 1738} {"train_loss": -11.440706253051758, "global_step": 292136, "epoch": 1738} {"train_loss": -11.770410537719727, "global_step": 292137, "epoch": 1738} {"train_loss": -11.53281021118164, "global_step": 292138, "epoch": 1738} {"train_loss": -11.592767715454102, "global_step": 292139, "epoch": 1738} {"train_loss": -11.999896049499512, "global_step": 292140, "epoch": 1738} {"train_loss": -11.809082984924316, "global_step": 292141, "epoch": 1738} {"train_loss": -11.701385498046875, "global_step": 292142, "epoch": 1738} {"train_loss": -11.718241691589355, "global_step": 292143, "epoch": 1738} {"train_loss": -11.845343589782715, "global_step": 292144, "epoch": 1738} {"train_loss": -11.874533653259277, "global_step": 292145, "epoch": 1738} {"train_loss": -11.785314559936523, "global_step": 292146, "epoch": 1738} {"train_loss": -11.735761642456055, "global_step": 292147, "epoch": 1738} {"train_loss": -11.684619903564453, "global_step": 292148, "epoch": 1738} {"train_loss": -11.972393035888672, "global_step": 292149, "epoch": 1738} {"train_loss": -11.836322784423828, "global_step": 292150, "epoch": 1738} {"train_loss": -11.626372047833033, "global_step": 292151, "epoch": 1738, "val_loss": 279985.5625} {"train_loss": -11.713045120239258, "global_step": 292152, "epoch": 1739} {"train_loss": -12.000368118286133, "global_step": 292153, "epoch": 1739} {"train_loss": -12.008001327514648, "global_step": 292154, "epoch": 1739} {"train_loss": -12.077756881713867, "global_step": 292155, "epoch": 1739} {"train_loss": -11.971945762634277, "global_step": 292156, "epoch": 1739} {"train_loss": -11.95555305480957, "global_step": 292157, "epoch": 1739} {"train_loss": -11.857335090637207, "global_step": 292158, "epoch": 1739} {"train_loss": -11.947713851928711, "global_step": 292159, "epoch": 1739} {"train_loss": -12.013026237487793, "global_step": 292160, "epoch": 1739} {"train_loss": -11.911325454711914, "global_step": 292161, "epoch": 1739} {"train_loss": -11.974835395812988, "global_step": 292162, "epoch": 1739} {"train_loss": -11.986329078674316, "global_step": 292163, "epoch": 1739} {"train_loss": -11.822442054748535, "global_step": 292164, "epoch": 1739} {"train_loss": -11.813121795654297, "global_step": 292165, "epoch": 1739} {"train_loss": -11.985280990600586, "global_step": 292166, "epoch": 1739} {"train_loss": -12.161163330078125, "global_step": 292167, "epoch": 1739} {"train_loss": -11.965705871582031, "global_step": 292168, "epoch": 1739} {"train_loss": -12.17000675201416, "global_step": 292169, "epoch": 1739} {"train_loss": -11.867693901062012, "global_step": 292170, "epoch": 1739} {"train_loss": -12.343621253967285, "global_step": 292171, "epoch": 1739} {"train_loss": -11.835681915283203, "global_step": 292172, "epoch": 1739} {"train_loss": -12.246761322021484, "global_step": 292173, "epoch": 1739} {"train_loss": -11.882033348083496, "global_step": 292174, "epoch": 1739} {"train_loss": -11.97789192199707, "global_step": 292175, "epoch": 1739} {"train_loss": -11.709188461303711, "global_step": 292176, "epoch": 1739} {"train_loss": -12.405759811401367, "global_step": 292177, "epoch": 1739} {"train_loss": -11.79399299621582, "global_step": 292178, "epoch": 1739} {"train_loss": -12.275026321411133, "global_step": 292179, "epoch": 1739} {"train_loss": -12.164445877075195, "global_step": 292180, "epoch": 1739} {"train_loss": -12.038113594055176, "global_step": 292181, "epoch": 1739} {"train_loss": -12.15038776397705, "global_step": 292182, "epoch": 1739} {"train_loss": -12.061260223388672, "global_step": 292183, "epoch": 1739} {"train_loss": -11.899004936218262, "global_step": 292184, "epoch": 1739} {"train_loss": -12.07557487487793, "global_step": 292185, "epoch": 1739} {"train_loss": -12.291997909545898, "global_step": 292186, "epoch": 1739} {"train_loss": -12.160120010375977, "global_step": 292187, "epoch": 1739} {"train_loss": -12.179516792297363, "global_step": 292188, "epoch": 1739} {"train_loss": -12.173561096191406, "global_step": 292189, "epoch": 1739} {"train_loss": -12.257242202758789, "global_step": 292190, "epoch": 1739} {"train_loss": -12.154563903808594, "global_step": 292191, "epoch": 1739} {"train_loss": -12.260660171508789, "global_step": 292192, "epoch": 1739} {"train_loss": -12.148882865905762, "global_step": 292193, "epoch": 1739} {"train_loss": -12.193777084350586, "global_step": 292194, "epoch": 1739} {"train_loss": -12.3079833984375, "global_step": 292195, "epoch": 1739} {"train_loss": -12.129908561706543, "global_step": 292196, "epoch": 1739} {"train_loss": -12.316667556762695, "global_step": 292197, "epoch": 1739} {"train_loss": -12.157718658447266, "global_step": 292198, "epoch": 1739} {"train_loss": -12.09272575378418, "global_step": 292199, "epoch": 1739} {"train_loss": -12.32866382598877, "global_step": 292200, "epoch": 1739} {"train_loss": -12.052306175231934, "global_step": 292201, "epoch": 1739} {"train_loss": -12.179271697998047, "global_step": 292202, "epoch": 1739} {"train_loss": -12.22677230834961, "global_step": 292203, "epoch": 1739} {"train_loss": -12.146940231323242, "global_step": 292204, "epoch": 1739} {"train_loss": -12.203731536865234, "global_step": 292205, "epoch": 1739} {"train_loss": -12.122068405151367, "global_step": 292206, "epoch": 1739} {"train_loss": -12.0760498046875, "global_step": 292207, "epoch": 1739} {"train_loss": -12.20004940032959, "global_step": 292208, "epoch": 1739} {"train_loss": -12.009424209594727, "global_step": 292209, "epoch": 1739} {"train_loss": -11.945684432983398, "global_step": 292210, "epoch": 1739} {"train_loss": -12.119264602661133, "global_step": 292211, "epoch": 1739} {"train_loss": -12.215434074401855, "global_step": 292212, "epoch": 1739} {"train_loss": -12.144404411315918, "global_step": 292213, "epoch": 1739} {"train_loss": -12.188636779785156, "global_step": 292214, "epoch": 1739} {"train_loss": -12.172795295715332, "global_step": 292215, "epoch": 1739} {"train_loss": -12.052129745483398, "global_step": 292216, "epoch": 1739} {"train_loss": -11.937043190002441, "global_step": 292217, "epoch": 1739} {"train_loss": -12.025840759277344, "global_step": 292218, "epoch": 1739} {"train_loss": -12.308801651000977, "global_step": 292219, "epoch": 1739} {"train_loss": -12.156047821044922, "global_step": 292220, "epoch": 1739} {"train_loss": -11.913460731506348, "global_step": 292221, "epoch": 1739} {"train_loss": -11.890681266784668, "global_step": 292222, "epoch": 1739} {"train_loss": -11.991580963134766, "global_step": 292223, "epoch": 1739} {"train_loss": -12.188565254211426, "global_step": 292224, "epoch": 1739} {"train_loss": -12.252983093261719, "global_step": 292225, "epoch": 1739} {"train_loss": -12.21584701538086, "global_step": 292226, "epoch": 1739} {"train_loss": -11.782137870788574, "global_step": 292227, "epoch": 1739} {"train_loss": -11.924173355102539, "global_step": 292228, "epoch": 1739} {"train_loss": -12.279659271240234, "global_step": 292229, "epoch": 1739} {"train_loss": -12.121206283569336, "global_step": 292230, "epoch": 1739} {"train_loss": -11.139749526977539, "global_step": 292231, "epoch": 1739} {"train_loss": -11.989882469177246, "global_step": 292232, "epoch": 1739} {"train_loss": -12.114053726196289, "global_step": 292233, "epoch": 1739} {"train_loss": -11.675326347351074, "global_step": 292234, "epoch": 1739} {"train_loss": -11.87843132019043, "global_step": 292235, "epoch": 1739} {"train_loss": -12.24443244934082, "global_step": 292236, "epoch": 1739} {"train_loss": -12.146995544433594, "global_step": 292237, "epoch": 1739} {"train_loss": -11.549044609069824, "global_step": 292238, "epoch": 1739} {"train_loss": -12.167112350463867, "global_step": 292239, "epoch": 1739} {"train_loss": -12.35743522644043, "global_step": 292240, "epoch": 1739} {"train_loss": -11.67976188659668, "global_step": 292241, "epoch": 1739} {"train_loss": -12.12582015991211, "global_step": 292242, "epoch": 1739} {"train_loss": -12.245497703552246, "global_step": 292243, "epoch": 1739} {"train_loss": -11.598222732543945, "global_step": 292244, "epoch": 1739} {"train_loss": -12.305791854858398, "global_step": 292245, "epoch": 1739} {"train_loss": -12.062416076660156, "global_step": 292246, "epoch": 1739} {"train_loss": -11.949392318725586, "global_step": 292247, "epoch": 1739} {"train_loss": -11.807291984558105, "global_step": 292248, "epoch": 1739} {"train_loss": -12.176128387451172, "global_step": 292249, "epoch": 1739} {"train_loss": -11.267852783203125, "global_step": 292250, "epoch": 1739} {"train_loss": -11.603422164916992, "global_step": 292251, "epoch": 1739} {"train_loss": -12.088851928710938, "global_step": 292252, "epoch": 1739} {"train_loss": -10.89578628540039, "global_step": 292253, "epoch": 1739} {"train_loss": -10.379497528076172, "global_step": 292254, "epoch": 1739} {"train_loss": -11.762079238891602, "global_step": 292255, "epoch": 1739} {"train_loss": -10.132524490356445, "global_step": 292256, "epoch": 1739} {"train_loss": -9.84732723236084, "global_step": 292257, "epoch": 1739} {"train_loss": -11.94121265411377, "global_step": 292258, "epoch": 1739} {"train_loss": -10.978450775146484, "global_step": 292259, "epoch": 1739} {"train_loss": -10.347297668457031, "global_step": 292260, "epoch": 1739} {"train_loss": -11.926033020019531, "global_step": 292261, "epoch": 1739} {"train_loss": -9.467988967895508, "global_step": 292262, "epoch": 1739} {"train_loss": -10.648138046264648, "global_step": 292263, "epoch": 1739} {"train_loss": -9.618782997131348, "global_step": 292264, "epoch": 1739} {"train_loss": -9.967188835144043, "global_step": 292265, "epoch": 1739} {"train_loss": -11.464763641357422, "global_step": 292266, "epoch": 1739} {"train_loss": -10.381804466247559, "global_step": 292267, "epoch": 1739} {"train_loss": -11.45986270904541, "global_step": 292268, "epoch": 1739} {"train_loss": -11.237001419067383, "global_step": 292269, "epoch": 1739} {"train_loss": -11.294160842895508, "global_step": 292270, "epoch": 1739} {"train_loss": -10.989052772521973, "global_step": 292271, "epoch": 1739} {"train_loss": -11.906527519226074, "global_step": 292272, "epoch": 1739} {"train_loss": -11.494991302490234, "global_step": 292273, "epoch": 1739} {"train_loss": -11.767950057983398, "global_step": 292274, "epoch": 1739} {"train_loss": -11.635283470153809, "global_step": 292275, "epoch": 1739} {"train_loss": -11.636100769042969, "global_step": 292276, "epoch": 1739} {"train_loss": -11.60097885131836, "global_step": 292277, "epoch": 1739} {"train_loss": -11.646581649780273, "global_step": 292278, "epoch": 1739} {"train_loss": -11.931421279907227, "global_step": 292279, "epoch": 1739} {"train_loss": -11.774177551269531, "global_step": 292280, "epoch": 1739} {"train_loss": -11.860776901245117, "global_step": 292281, "epoch": 1739} {"train_loss": -11.827957153320312, "global_step": 292282, "epoch": 1739} {"train_loss": -12.130802154541016, "global_step": 292283, "epoch": 1739} {"train_loss": -11.957467079162598, "global_step": 292284, "epoch": 1739} {"train_loss": -11.93133544921875, "global_step": 292285, "epoch": 1739} {"train_loss": -12.091803550720215, "global_step": 292286, "epoch": 1739} {"train_loss": -11.984130859375, "global_step": 292287, "epoch": 1739} {"train_loss": -11.86477279663086, "global_step": 292288, "epoch": 1739} {"train_loss": -12.182491302490234, "global_step": 292289, "epoch": 1739} {"train_loss": -12.064959526062012, "global_step": 292290, "epoch": 1739} {"train_loss": -12.123537063598633, "global_step": 292291, "epoch": 1739} {"train_loss": -11.808357238769531, "global_step": 292292, "epoch": 1739} {"train_loss": -12.258241653442383, "global_step": 292293, "epoch": 1739} {"train_loss": -11.75992202758789, "global_step": 292294, "epoch": 1739} {"train_loss": -11.9774169921875, "global_step": 292295, "epoch": 1739} {"train_loss": -12.333430290222168, "global_step": 292296, "epoch": 1739} {"train_loss": -11.957456588745117, "global_step": 292297, "epoch": 1739} {"train_loss": -12.18945026397705, "global_step": 292298, "epoch": 1739} {"train_loss": -11.846278190612793, "global_step": 292299, "epoch": 1739} {"train_loss": -12.05790901184082, "global_step": 292300, "epoch": 1739} {"train_loss": -12.222827911376953, "global_step": 292301, "epoch": 1739} {"train_loss": -12.403861999511719, "global_step": 292302, "epoch": 1739} {"train_loss": -11.975444793701172, "global_step": 292303, "epoch": 1739} {"train_loss": -12.171989440917969, "global_step": 292304, "epoch": 1739} {"train_loss": -12.309638023376465, "global_step": 292305, "epoch": 1739} {"train_loss": -12.191991806030273, "global_step": 292306, "epoch": 1739} {"train_loss": -12.219134330749512, "global_step": 292307, "epoch": 1739} {"train_loss": -12.217212677001953, "global_step": 292308, "epoch": 1739} {"train_loss": -12.32677936553955, "global_step": 292309, "epoch": 1739} {"train_loss": -11.926483154296875, "global_step": 292310, "epoch": 1739} {"train_loss": -11.915854454040527, "global_step": 292311, "epoch": 1739} {"train_loss": -11.97940444946289, "global_step": 292312, "epoch": 1739} {"train_loss": -12.349609375, "global_step": 292313, "epoch": 1739} {"train_loss": -12.048864364624023, "global_step": 292314, "epoch": 1739} {"train_loss": -12.430509567260742, "global_step": 292315, "epoch": 1739} {"train_loss": -12.181077003479004, "global_step": 292316, "epoch": 1739} {"train_loss": -12.107625961303711, "global_step": 292317, "epoch": 1739} {"train_loss": -12.11616325378418, "global_step": 292318, "epoch": 1739} {"train_loss": -11.895013133684794, "global_step": 292319, "epoch": 1739, "val_loss": 276793.40625} {"train_loss": -12.186004638671875, "global_step": 292320, "epoch": 1740} {"train_loss": -12.154924392700195, "global_step": 292321, "epoch": 1740} {"train_loss": -12.143326759338379, "global_step": 292322, "epoch": 1740} {"train_loss": -12.480932235717773, "global_step": 292323, "epoch": 1740} {"train_loss": -12.215448379516602, "global_step": 292324, "epoch": 1740} {"train_loss": -12.240571022033691, "global_step": 292325, "epoch": 1740} {"train_loss": -12.084988594055176, "global_step": 292326, "epoch": 1740} {"train_loss": -12.145040512084961, "global_step": 292327, "epoch": 1740} {"train_loss": -12.269746780395508, "global_step": 292328, "epoch": 1740} {"train_loss": -12.458916664123535, "global_step": 292329, "epoch": 1740} {"train_loss": -12.372111320495605, "global_step": 292330, "epoch": 1740} {"train_loss": -12.101337432861328, "global_step": 292331, "epoch": 1740} {"train_loss": -12.12067985534668, "global_step": 292332, "epoch": 1740} {"train_loss": -12.163142204284668, "global_step": 292333, "epoch": 1740} {"train_loss": -12.152765274047852, "global_step": 292334, "epoch": 1740} {"train_loss": -12.263309478759766, "global_step": 292335, "epoch": 1740} {"train_loss": -11.789825439453125, "global_step": 292336, "epoch": 1740} {"train_loss": -12.108756065368652, "global_step": 292337, "epoch": 1740} {"train_loss": -11.960993766784668, "global_step": 292338, "epoch": 1740} {"train_loss": -11.471861839294434, "global_step": 292339, "epoch": 1740} {"train_loss": -11.843887329101562, "global_step": 292340, "epoch": 1740} {"train_loss": -12.171664237976074, "global_step": 292341, "epoch": 1740} {"train_loss": -12.255331993103027, "global_step": 292342, "epoch": 1740} {"train_loss": -10.93992805480957, "global_step": 292343, "epoch": 1740} {"train_loss": -10.395334243774414, "global_step": 292344, "epoch": 1740} {"train_loss": -12.21303653717041, "global_step": 292345, "epoch": 1740} {"train_loss": -11.276689529418945, "global_step": 292346, "epoch": 1740} {"train_loss": -10.968782424926758, "global_step": 292347, "epoch": 1740} {"train_loss": -11.936717987060547, "global_step": 292348, "epoch": 1740} {"train_loss": -11.732215881347656, "global_step": 292349, "epoch": 1740} {"train_loss": -12.03512954711914, "global_step": 292350, "epoch": 1740} {"train_loss": -11.975035667419434, "global_step": 292351, "epoch": 1740} {"train_loss": -12.10719108581543, "global_step": 292352, "epoch": 1740} {"train_loss": -11.968907356262207, "global_step": 292353, "epoch": 1740} {"train_loss": -12.15630054473877, "global_step": 292354, "epoch": 1740} {"train_loss": -11.733002662658691, "global_step": 292355, "epoch": 1740} {"train_loss": -12.081537246704102, "global_step": 292356, "epoch": 1740} {"train_loss": -11.460039138793945, "global_step": 292357, "epoch": 1740} {"train_loss": -11.620811462402344, "global_step": 292358, "epoch": 1740} {"train_loss": -11.905202865600586, "global_step": 292359, "epoch": 1740} {"train_loss": -11.608404159545898, "global_step": 292360, "epoch": 1740} {"train_loss": -11.561894416809082, "global_step": 292361, "epoch": 1740} {"train_loss": -11.994105339050293, "global_step": 292362, "epoch": 1740} {"train_loss": -11.83901596069336, "global_step": 292363, "epoch": 1740} {"train_loss": -12.203079223632812, "global_step": 292364, "epoch": 1740} {"train_loss": -11.883439064025879, "global_step": 292365, "epoch": 1740} {"train_loss": -11.8759126663208, "global_step": 292366, "epoch": 1740} {"train_loss": -12.076473236083984, "global_step": 292367, "epoch": 1740} {"train_loss": -11.919279098510742, "global_step": 292368, "epoch": 1740} {"train_loss": -11.625368118286133, "global_step": 292369, "epoch": 1740} {"train_loss": -11.642230987548828, "global_step": 292370, "epoch": 1740} {"train_loss": -11.91784954071045, "global_step": 292371, "epoch": 1740} {"train_loss": -11.719161987304688, "global_step": 292372, "epoch": 1740} {"train_loss": -11.758660316467285, "global_step": 292373, "epoch": 1740} {"train_loss": -11.805244445800781, "global_step": 292374, "epoch": 1740} {"train_loss": -11.895506858825684, "global_step": 292375, "epoch": 1740} {"train_loss": -11.30583667755127, "global_step": 292376, "epoch": 1740} {"train_loss": -10.807962417602539, "global_step": 292377, "epoch": 1740} {"train_loss": -10.936702728271484, "global_step": 292378, "epoch": 1740} {"train_loss": -11.003759384155273, "global_step": 292379, "epoch": 1740} {"train_loss": -11.771650314331055, "global_step": 292380, "epoch": 1740} {"train_loss": -9.577640533447266, "global_step": 292381, "epoch": 1740} {"train_loss": -11.405333518981934, "global_step": 292382, "epoch": 1740} {"train_loss": -11.283073425292969, "global_step": 292383, "epoch": 1740} {"train_loss": -10.508769035339355, "global_step": 292384, "epoch": 1740} {"train_loss": -10.450630187988281, "global_step": 292385, "epoch": 1740} {"train_loss": -11.461753845214844, "global_step": 292386, "epoch": 1740} {"train_loss": -10.116336822509766, "global_step": 292387, "epoch": 1740} {"train_loss": -10.731527328491211, "global_step": 292388, "epoch": 1740} {"train_loss": -11.070858001708984, "global_step": 292389, "epoch": 1740} {"train_loss": -10.13310432434082, "global_step": 292390, "epoch": 1740} {"train_loss": -10.024194717407227, "global_step": 292391, "epoch": 1740} {"train_loss": -10.755029678344727, "global_step": 292392, "epoch": 1740} {"train_loss": -10.96609878540039, "global_step": 292393, "epoch": 1740} {"train_loss": -9.816694259643555, "global_step": 292394, "epoch": 1740} {"train_loss": -10.543717384338379, "global_step": 292395, "epoch": 1740} {"train_loss": -10.555782318115234, "global_step": 292396, "epoch": 1740} {"train_loss": -9.974615097045898, "global_step": 292397, "epoch": 1740} {"train_loss": -9.96031379699707, "global_step": 292398, "epoch": 1740} {"train_loss": -11.39650821685791, "global_step": 292399, "epoch": 1740} {"train_loss": -10.263277053833008, "global_step": 292400, "epoch": 1740} {"train_loss": -10.0779390335083, "global_step": 292401, "epoch": 1740} {"train_loss": -11.214864730834961, "global_step": 292402, "epoch": 1740} {"train_loss": -10.603249549865723, "global_step": 292403, "epoch": 1740} {"train_loss": -10.934073448181152, "global_step": 292404, "epoch": 1740} {"train_loss": -11.306659698486328, "global_step": 292405, "epoch": 1740} {"train_loss": -11.393980026245117, "global_step": 292406, "epoch": 1740} {"train_loss": -10.951557159423828, "global_step": 292407, "epoch": 1740} {"train_loss": -11.485483169555664, "global_step": 292408, "epoch": 1740} {"train_loss": -11.18608283996582, "global_step": 292409, "epoch": 1740} {"train_loss": -11.844322204589844, "global_step": 292410, "epoch": 1740} {"train_loss": -11.117040634155273, "global_step": 292411, "epoch": 1740} {"train_loss": -11.657953262329102, "global_step": 292412, "epoch": 1740} {"train_loss": -11.296310424804688, "global_step": 292413, "epoch": 1740} {"train_loss": -11.605777740478516, "global_step": 292414, "epoch": 1740} {"train_loss": -11.766389846801758, "global_step": 292415, "epoch": 1740} {"train_loss": -11.458395957946777, "global_step": 292416, "epoch": 1740} {"train_loss": -11.527023315429688, "global_step": 292417, "epoch": 1740} {"train_loss": -11.61894416809082, "global_step": 292418, "epoch": 1740} {"train_loss": -11.238227844238281, "global_step": 292419, "epoch": 1740} {"train_loss": -11.519713401794434, "global_step": 292420, "epoch": 1740} {"train_loss": -11.565829277038574, "global_step": 292421, "epoch": 1740} {"train_loss": -11.606107711791992, "global_step": 292422, "epoch": 1740} {"train_loss": -11.615387916564941, "global_step": 292423, "epoch": 1740} {"train_loss": -11.839767456054688, "global_step": 292424, "epoch": 1740} {"train_loss": -11.89026165008545, "global_step": 292425, "epoch": 1740} {"train_loss": -11.660133361816406, "global_step": 292426, "epoch": 1740} {"train_loss": -11.723258972167969, "global_step": 292427, "epoch": 1740} {"train_loss": -11.803720474243164, "global_step": 292428, "epoch": 1740} {"train_loss": -11.894895553588867, "global_step": 292429, "epoch": 1740} {"train_loss": -11.931722640991211, "global_step": 292430, "epoch": 1740} {"train_loss": -11.716532707214355, "global_step": 292431, "epoch": 1740} {"train_loss": -12.045857429504395, "global_step": 292432, "epoch": 1740} {"train_loss": -11.673612594604492, "global_step": 292433, "epoch": 1740} {"train_loss": -12.123668670654297, "global_step": 292434, "epoch": 1740} {"train_loss": -12.068296432495117, "global_step": 292435, "epoch": 1740} {"train_loss": -12.108784675598145, "global_step": 292436, "epoch": 1740} {"train_loss": -12.071222305297852, "global_step": 292437, "epoch": 1740} {"train_loss": -12.213829040527344, "global_step": 292438, "epoch": 1740} {"train_loss": -12.043994903564453, "global_step": 292439, "epoch": 1740} {"train_loss": -12.215723037719727, "global_step": 292440, "epoch": 1740} {"train_loss": -12.109302520751953, "global_step": 292441, "epoch": 1740} {"train_loss": -12.352741241455078, "global_step": 292442, "epoch": 1740} {"train_loss": -12.08537769317627, "global_step": 292443, "epoch": 1740} {"train_loss": -12.155790328979492, "global_step": 292444, "epoch": 1740} {"train_loss": -12.262843132019043, "global_step": 292445, "epoch": 1740} {"train_loss": -12.13758373260498, "global_step": 292446, "epoch": 1740} {"train_loss": -11.999777793884277, "global_step": 292447, "epoch": 1740} {"train_loss": -12.130799293518066, "global_step": 292448, "epoch": 1740} {"train_loss": -12.152268409729004, "global_step": 292449, "epoch": 1740} {"train_loss": -12.080986022949219, "global_step": 292450, "epoch": 1740} {"train_loss": -12.120504379272461, "global_step": 292451, "epoch": 1740} {"train_loss": -12.126667976379395, "global_step": 292452, "epoch": 1740} {"train_loss": -12.140108108520508, "global_step": 292453, "epoch": 1740} {"train_loss": -12.20096206665039, "global_step": 292454, "epoch": 1740} {"train_loss": -12.13926887512207, "global_step": 292455, "epoch": 1740} {"train_loss": -12.236312866210938, "global_step": 292456, "epoch": 1740} {"train_loss": -12.257354736328125, "global_step": 292457, "epoch": 1740} {"train_loss": -12.364492416381836, "global_step": 292458, "epoch": 1740} {"train_loss": -12.394417762756348, "global_step": 292459, "epoch": 1740} {"train_loss": -12.020445823669434, "global_step": 292460, "epoch": 1740} {"train_loss": -12.454065322875977, "global_step": 292461, "epoch": 1740} {"train_loss": -12.296417236328125, "global_step": 292462, "epoch": 1740} {"train_loss": -12.231087684631348, "global_step": 292463, "epoch": 1740} {"train_loss": -12.355454444885254, "global_step": 292464, "epoch": 1740} {"train_loss": -12.190237045288086, "global_step": 292465, "epoch": 1740} {"train_loss": -12.192556381225586, "global_step": 292466, "epoch": 1740} {"train_loss": -12.095894813537598, "global_step": 292467, "epoch": 1740} {"train_loss": -12.295652389526367, "global_step": 292468, "epoch": 1740} {"train_loss": -12.418057441711426, "global_step": 292469, "epoch": 1740} {"train_loss": -12.164104461669922, "global_step": 292470, "epoch": 1740} {"train_loss": -12.292552947998047, "global_step": 292471, "epoch": 1740} {"train_loss": -12.270561218261719, "global_step": 292472, "epoch": 1740} {"train_loss": -12.420825958251953, "global_step": 292473, "epoch": 1740} {"train_loss": -12.190591812133789, "global_step": 292474, "epoch": 1740} {"train_loss": -12.483609199523926, "global_step": 292475, "epoch": 1740} {"train_loss": -12.639549255371094, "global_step": 292476, "epoch": 1740} {"train_loss": -12.306097030639648, "global_step": 292477, "epoch": 1740} {"train_loss": -12.523695945739746, "global_step": 292478, "epoch": 1740} {"train_loss": -12.40408992767334, "global_step": 292479, "epoch": 1740} {"train_loss": -12.293560028076172, "global_step": 292480, "epoch": 1740} {"train_loss": -12.552083969116211, "global_step": 292481, "epoch": 1740} {"train_loss": -12.241216659545898, "global_step": 292482, "epoch": 1740} {"train_loss": -12.063088417053223, "global_step": 292483, "epoch": 1740} {"train_loss": -12.054096221923828, "global_step": 292484, "epoch": 1740} {"train_loss": -12.098845481872559, "global_step": 292485, "epoch": 1740} {"train_loss": -11.7555513381958, "global_step": 292486, "epoch": 1740} {"train_loss": -11.737188339233398, "global_step": 292487, "epoch": 1740, "val_loss": 277801.3125, "train_action_mse_error": 3.7559897899627686} {"train_loss": -12.495685577392578, "global_step": 292488, "epoch": 1741} {"train_loss": -11.69600772857666, "global_step": 292489, "epoch": 1741} {"train_loss": -11.433490753173828, "global_step": 292490, "epoch": 1741} {"train_loss": -11.85428237915039, "global_step": 292491, "epoch": 1741} {"train_loss": -11.98519515991211, "global_step": 292492, "epoch": 1741} {"train_loss": -11.2532958984375, "global_step": 292493, "epoch": 1741} {"train_loss": -11.489404678344727, "global_step": 292494, "epoch": 1741} {"train_loss": -11.285367965698242, "global_step": 292495, "epoch": 1741} {"train_loss": -11.031177520751953, "global_step": 292496, "epoch": 1741} {"train_loss": -11.077120780944824, "global_step": 292497, "epoch": 1741} {"train_loss": -11.863370895385742, "global_step": 292498, "epoch": 1741} {"train_loss": -11.481328964233398, "global_step": 292499, "epoch": 1741} {"train_loss": -11.469761848449707, "global_step": 292500, "epoch": 1741} {"train_loss": -11.387308120727539, "global_step": 292501, "epoch": 1741} {"train_loss": -9.98588752746582, "global_step": 292502, "epoch": 1741} {"train_loss": -11.410324096679688, "global_step": 292503, "epoch": 1741} {"train_loss": -10.30508041381836, "global_step": 292504, "epoch": 1741} {"train_loss": -9.557150840759277, "global_step": 292505, "epoch": 1741} {"train_loss": -10.524333953857422, "global_step": 292506, "epoch": 1741} {"train_loss": -11.004369735717773, "global_step": 292507, "epoch": 1741} {"train_loss": -10.392913818359375, "global_step": 292508, "epoch": 1741} {"train_loss": -11.680889129638672, "global_step": 292509, "epoch": 1741} {"train_loss": -10.820869445800781, "global_step": 292510, "epoch": 1741} {"train_loss": -11.505128860473633, "global_step": 292511, "epoch": 1741} {"train_loss": -11.422706604003906, "global_step": 292512, "epoch": 1741} {"train_loss": -10.990840911865234, "global_step": 292513, "epoch": 1741} {"train_loss": -11.46292781829834, "global_step": 292514, "epoch": 1741} {"train_loss": -11.430776596069336, "global_step": 292515, "epoch": 1741} {"train_loss": -11.578240394592285, "global_step": 292516, "epoch": 1741} {"train_loss": -11.287141799926758, "global_step": 292517, "epoch": 1741} {"train_loss": -11.363729476928711, "global_step": 292518, "epoch": 1741} {"train_loss": -11.713586807250977, "global_step": 292519, "epoch": 1741} {"train_loss": -11.547409057617188, "global_step": 292520, "epoch": 1741} {"train_loss": -11.56571102142334, "global_step": 292521, "epoch": 1741} {"train_loss": -11.556394577026367, "global_step": 292522, "epoch": 1741} {"train_loss": -11.110336303710938, "global_step": 292523, "epoch": 1741} {"train_loss": -11.866035461425781, "global_step": 292524, "epoch": 1741} {"train_loss": -11.488017082214355, "global_step": 292525, "epoch": 1741} {"train_loss": -11.466277122497559, "global_step": 292526, "epoch": 1741} {"train_loss": -11.894908905029297, "global_step": 292527, "epoch": 1741} {"train_loss": -11.476829528808594, "global_step": 292528, "epoch": 1741} {"train_loss": -11.609504699707031, "global_step": 292529, "epoch": 1741} {"train_loss": -11.382120132446289, "global_step": 292530, "epoch": 1741} {"train_loss": -11.361347198486328, "global_step": 292531, "epoch": 1741} {"train_loss": -11.783291816711426, "global_step": 292532, "epoch": 1741} {"train_loss": -11.556976318359375, "global_step": 292533, "epoch": 1741} {"train_loss": -11.82382583618164, "global_step": 292534, "epoch": 1741} {"train_loss": -11.653221130371094, "global_step": 292535, "epoch": 1741} {"train_loss": -12.064067840576172, "global_step": 292536, "epoch": 1741} {"train_loss": -11.607980728149414, "global_step": 292537, "epoch": 1741} {"train_loss": -11.884424209594727, "global_step": 292538, "epoch": 1741} {"train_loss": -11.913246154785156, "global_step": 292539, "epoch": 1741} {"train_loss": -11.799442291259766, "global_step": 292540, "epoch": 1741} {"train_loss": -12.09726333618164, "global_step": 292541, "epoch": 1741} {"train_loss": -11.818893432617188, "global_step": 292542, "epoch": 1741} {"train_loss": -12.039636611938477, "global_step": 292543, "epoch": 1741} {"train_loss": -11.905183792114258, "global_step": 292544, "epoch": 1741} {"train_loss": -12.275209426879883, "global_step": 292545, "epoch": 1741} {"train_loss": -11.996208190917969, "global_step": 292546, "epoch": 1741} {"train_loss": -11.941085815429688, "global_step": 292547, "epoch": 1741} {"train_loss": -11.844610214233398, "global_step": 292548, "epoch": 1741} {"train_loss": -11.699599266052246, "global_step": 292549, "epoch": 1741} {"train_loss": -12.037397384643555, "global_step": 292550, "epoch": 1741} {"train_loss": -12.023414611816406, "global_step": 292551, "epoch": 1741} {"train_loss": -12.056885719299316, "global_step": 292552, "epoch": 1741} {"train_loss": -12.133393287658691, "global_step": 292553, "epoch": 1741} {"train_loss": -12.051386833190918, "global_step": 292554, "epoch": 1741} {"train_loss": -12.028590202331543, "global_step": 292555, "epoch": 1741} {"train_loss": -12.102001190185547, "global_step": 292556, "epoch": 1741} {"train_loss": -12.308795928955078, "global_step": 292557, "epoch": 1741} {"train_loss": -12.308130264282227, "global_step": 292558, "epoch": 1741} {"train_loss": -12.09763240814209, "global_step": 292559, "epoch": 1741} {"train_loss": -12.313726425170898, "global_step": 292560, "epoch": 1741} {"train_loss": -12.140091896057129, "global_step": 292561, "epoch": 1741} {"train_loss": -12.130335807800293, "global_step": 292562, "epoch": 1741} {"train_loss": -12.296834945678711, "global_step": 292563, "epoch": 1741} {"train_loss": -12.252020835876465, "global_step": 292564, "epoch": 1741} {"train_loss": -12.26801872253418, "global_step": 292565, "epoch": 1741} {"train_loss": -12.306257247924805, "global_step": 292566, "epoch": 1741} {"train_loss": -12.427679061889648, "global_step": 292567, "epoch": 1741} {"train_loss": -12.233436584472656, "global_step": 292568, "epoch": 1741} {"train_loss": -11.84642219543457, "global_step": 292569, "epoch": 1741} {"train_loss": -12.177306175231934, "global_step": 292570, "epoch": 1741} {"train_loss": -11.953747749328613, "global_step": 292571, "epoch": 1741} {"train_loss": -11.939231872558594, "global_step": 292572, "epoch": 1741} {"train_loss": -12.184036254882812, "global_step": 292573, "epoch": 1741} {"train_loss": -12.102270126342773, "global_step": 292574, "epoch": 1741} {"train_loss": -12.039900779724121, "global_step": 292575, "epoch": 1741} {"train_loss": -12.238473892211914, "global_step": 292576, "epoch": 1741} {"train_loss": -12.059101104736328, "global_step": 292577, "epoch": 1741} {"train_loss": -12.538932800292969, "global_step": 292578, "epoch": 1741} {"train_loss": -12.199810981750488, "global_step": 292579, "epoch": 1741} {"train_loss": -12.237595558166504, "global_step": 292580, "epoch": 1741} {"train_loss": -12.27884292602539, "global_step": 292581, "epoch": 1741} {"train_loss": -12.390298843383789, "global_step": 292582, "epoch": 1741} {"train_loss": -12.575735092163086, "global_step": 292583, "epoch": 1741} {"train_loss": -12.142794609069824, "global_step": 292584, "epoch": 1741} {"train_loss": -12.051056861877441, "global_step": 292585, "epoch": 1741} {"train_loss": -12.284502029418945, "global_step": 292586, "epoch": 1741} {"train_loss": -11.981417655944824, "global_step": 292587, "epoch": 1741} {"train_loss": -12.281692504882812, "global_step": 292588, "epoch": 1741} {"train_loss": -12.040766716003418, "global_step": 292589, "epoch": 1741} {"train_loss": -12.032777786254883, "global_step": 292590, "epoch": 1741} {"train_loss": -12.239062309265137, "global_step": 292591, "epoch": 1741} {"train_loss": -11.810434341430664, "global_step": 292592, "epoch": 1741} {"train_loss": -12.28494930267334, "global_step": 292593, "epoch": 1741} {"train_loss": -12.182281494140625, "global_step": 292594, "epoch": 1741} {"train_loss": -12.230098724365234, "global_step": 292595, "epoch": 1741} {"train_loss": -11.997255325317383, "global_step": 292596, "epoch": 1741} {"train_loss": -12.226663589477539, "global_step": 292597, "epoch": 1741} {"train_loss": -12.216724395751953, "global_step": 292598, "epoch": 1741} {"train_loss": -12.058005332946777, "global_step": 292599, "epoch": 1741} {"train_loss": -12.450382232666016, "global_step": 292600, "epoch": 1741} {"train_loss": -12.585795402526855, "global_step": 292601, "epoch": 1741} {"train_loss": -12.213708877563477, "global_step": 292602, "epoch": 1741} {"train_loss": -12.489058494567871, "global_step": 292603, "epoch": 1741} {"train_loss": -12.2722749710083, "global_step": 292604, "epoch": 1741} {"train_loss": -12.294920921325684, "global_step": 292605, "epoch": 1741} {"train_loss": -12.275169372558594, "global_step": 292606, "epoch": 1741} {"train_loss": -12.259159088134766, "global_step": 292607, "epoch": 1741} {"train_loss": -12.100052833557129, "global_step": 292608, "epoch": 1741} {"train_loss": -12.229682922363281, "global_step": 292609, "epoch": 1741} {"train_loss": -12.288455963134766, "global_step": 292610, "epoch": 1741} {"train_loss": -12.278440475463867, "global_step": 292611, "epoch": 1741} {"train_loss": -12.440105438232422, "global_step": 292612, "epoch": 1741} {"train_loss": -12.280786514282227, "global_step": 292613, "epoch": 1741} {"train_loss": -11.947611808776855, "global_step": 292614, "epoch": 1741} {"train_loss": -12.183332443237305, "global_step": 292615, "epoch": 1741} {"train_loss": -12.230862617492676, "global_step": 292616, "epoch": 1741} {"train_loss": -11.443279266357422, "global_step": 292617, "epoch": 1741} {"train_loss": -10.384078025817871, "global_step": 292618, "epoch": 1741} {"train_loss": -10.600056648254395, "global_step": 292619, "epoch": 1741} {"train_loss": -11.235340118408203, "global_step": 292620, "epoch": 1741} {"train_loss": -10.405583381652832, "global_step": 292621, "epoch": 1741} {"train_loss": -9.685606956481934, "global_step": 292622, "epoch": 1741} {"train_loss": -8.647659301757812, "global_step": 292623, "epoch": 1741} {"train_loss": -9.998462677001953, "global_step": 292624, "epoch": 1741} {"train_loss": -9.750532150268555, "global_step": 292625, "epoch": 1741} {"train_loss": -9.725625038146973, "global_step": 292626, "epoch": 1741} {"train_loss": -10.127301216125488, "global_step": 292627, "epoch": 1741} {"train_loss": -6.63041353225708, "global_step": 292628, "epoch": 1741} {"train_loss": -6.16507625579834, "global_step": 292629, "epoch": 1741} {"train_loss": -5.591041088104248, "global_step": 292630, "epoch": 1741} {"train_loss": -5.487470626831055, "global_step": 292631, "epoch": 1741} {"train_loss": -6.3185882568359375, "global_step": 292632, "epoch": 1741} {"train_loss": -6.317124366760254, "global_step": 292633, "epoch": 1741} {"train_loss": -6.057432174682617, "global_step": 292634, "epoch": 1741} {"train_loss": -7.494790077209473, "global_step": 292635, "epoch": 1741} {"train_loss": -9.013373374938965, "global_step": 292636, "epoch": 1741} {"train_loss": -8.31003189086914, "global_step": 292637, "epoch": 1741} {"train_loss": -8.234870910644531, "global_step": 292638, "epoch": 1741} {"train_loss": -8.644685745239258, "global_step": 292639, "epoch": 1741} {"train_loss": -9.560680389404297, "global_step": 292640, "epoch": 1741} {"train_loss": -10.108142852783203, "global_step": 292641, "epoch": 1741} {"train_loss": -9.975162506103516, "global_step": 292642, "epoch": 1741} {"train_loss": -9.686330795288086, "global_step": 292643, "epoch": 1741} {"train_loss": -10.442218780517578, "global_step": 292644, "epoch": 1741} {"train_loss": -9.023509979248047, "global_step": 292645, "epoch": 1741} {"train_loss": -9.503610610961914, "global_step": 292646, "epoch": 1741} {"train_loss": -9.953315734863281, "global_step": 292647, "epoch": 1741} {"train_loss": -10.741273880004883, "global_step": 292648, "epoch": 1741} {"train_loss": -10.366117477416992, "global_step": 292649, "epoch": 1741} {"train_loss": -10.698802947998047, "global_step": 292650, "epoch": 1741} {"train_loss": -10.8180513381958, "global_step": 292651, "epoch": 1741} {"train_loss": -10.75364875793457, "global_step": 292652, "epoch": 1741} {"train_loss": -11.034969329833984, "global_step": 292653, "epoch": 1741} {"train_loss": -10.81905460357666, "global_step": 292654, "epoch": 1741} {"train_loss": -11.25066249711173, "global_step": 292655, "epoch": 1741, "val_loss": 269836.4375} {"train_loss": -11.23481559753418, "global_step": 292656, "epoch": 1742} {"train_loss": -10.88382339477539, "global_step": 292657, "epoch": 1742} {"train_loss": -11.156463623046875, "global_step": 292658, "epoch": 1742} {"train_loss": -11.339780807495117, "global_step": 292659, "epoch": 1742} {"train_loss": -10.943435668945312, "global_step": 292660, "epoch": 1742} {"train_loss": -11.540674209594727, "global_step": 292661, "epoch": 1742} {"train_loss": -11.427993774414062, "global_step": 292662, "epoch": 1742} {"train_loss": -11.364446640014648, "global_step": 292663, "epoch": 1742} {"train_loss": -11.734451293945312, "global_step": 292664, "epoch": 1742} {"train_loss": -11.326332092285156, "global_step": 292665, "epoch": 1742} {"train_loss": -11.354329109191895, "global_step": 292666, "epoch": 1742} {"train_loss": -11.443626403808594, "global_step": 292667, "epoch": 1742} {"train_loss": -11.38582992553711, "global_step": 292668, "epoch": 1742} {"train_loss": -11.532583236694336, "global_step": 292669, "epoch": 1742} {"train_loss": -11.66958999633789, "global_step": 292670, "epoch": 1742} {"train_loss": -11.50912857055664, "global_step": 292671, "epoch": 1742} {"train_loss": -11.787948608398438, "global_step": 292672, "epoch": 1742} {"train_loss": -11.630317687988281, "global_step": 292673, "epoch": 1742} {"train_loss": -11.558266639709473, "global_step": 292674, "epoch": 1742} {"train_loss": -11.905152320861816, "global_step": 292675, "epoch": 1742} {"train_loss": -11.58653736114502, "global_step": 292676, "epoch": 1742} {"train_loss": -11.824708938598633, "global_step": 292677, "epoch": 1742} {"train_loss": -11.904376983642578, "global_step": 292678, "epoch": 1742} {"train_loss": -12.093557357788086, "global_step": 292679, "epoch": 1742} {"train_loss": -11.701375007629395, "global_step": 292680, "epoch": 1742} {"train_loss": -12.025644302368164, "global_step": 292681, "epoch": 1742} {"train_loss": -12.05904769897461, "global_step": 292682, "epoch": 1742} {"train_loss": -11.85886001586914, "global_step": 292683, "epoch": 1742} {"train_loss": -12.120607376098633, "global_step": 292684, "epoch": 1742} {"train_loss": -11.847051620483398, "global_step": 292685, "epoch": 1742} {"train_loss": -12.069452285766602, "global_step": 292686, "epoch": 1742} {"train_loss": -11.889873504638672, "global_step": 292687, "epoch": 1742} {"train_loss": -12.069831848144531, "global_step": 292688, "epoch": 1742} {"train_loss": -11.85174560546875, "global_step": 292689, "epoch": 1742} {"train_loss": -11.970449447631836, "global_step": 292690, "epoch": 1742} {"train_loss": -11.982748031616211, "global_step": 292691, "epoch": 1742} {"train_loss": -12.264876365661621, "global_step": 292692, "epoch": 1742} {"train_loss": -12.124907493591309, "global_step": 292693, "epoch": 1742} {"train_loss": -12.23609733581543, "global_step": 292694, "epoch": 1742} {"train_loss": -12.012702941894531, "global_step": 292695, "epoch": 1742} {"train_loss": -12.301511764526367, "global_step": 292696, "epoch": 1742} {"train_loss": -12.187749862670898, "global_step": 292697, "epoch": 1742} {"train_loss": -12.20295524597168, "global_step": 292698, "epoch": 1742} {"train_loss": -12.147583961486816, "global_step": 292699, "epoch": 1742} {"train_loss": -12.074127197265625, "global_step": 292700, "epoch": 1742} {"train_loss": -12.222715377807617, "global_step": 292701, "epoch": 1742} {"train_loss": -12.405741691589355, "global_step": 292702, "epoch": 1742} {"train_loss": -12.185816764831543, "global_step": 292703, "epoch": 1742} {"train_loss": -12.171967506408691, "global_step": 292704, "epoch": 1742} {"train_loss": -12.302125930786133, "global_step": 292705, "epoch": 1742} {"train_loss": -12.119810104370117, "global_step": 292706, "epoch": 1742} {"train_loss": -12.352168083190918, "global_step": 292707, "epoch": 1742} {"train_loss": -12.353822708129883, "global_step": 292708, "epoch": 1742} {"train_loss": -12.229369163513184, "global_step": 292709, "epoch": 1742} {"train_loss": -12.41508674621582, "global_step": 292710, "epoch": 1742} {"train_loss": -12.285238265991211, "global_step": 292711, "epoch": 1742} {"train_loss": -12.318558692932129, "global_step": 292712, "epoch": 1742} {"train_loss": -12.34195327758789, "global_step": 292713, "epoch": 1742} {"train_loss": -12.11800479888916, "global_step": 292714, "epoch": 1742} {"train_loss": -12.27931022644043, "global_step": 292715, "epoch": 1742} {"train_loss": -12.166330337524414, "global_step": 292716, "epoch": 1742} {"train_loss": -12.43448257446289, "global_step": 292717, "epoch": 1742} {"train_loss": -12.394638061523438, "global_step": 292718, "epoch": 1742} {"train_loss": -12.525474548339844, "global_step": 292719, "epoch": 1742} {"train_loss": -12.299561500549316, "global_step": 292720, "epoch": 1742} {"train_loss": -12.194803237915039, "global_step": 292721, "epoch": 1742} {"train_loss": -12.317740440368652, "global_step": 292722, "epoch": 1742} {"train_loss": -12.374879837036133, "global_step": 292723, "epoch": 1742} {"train_loss": -12.291783332824707, "global_step": 292724, "epoch": 1742} {"train_loss": -12.458808898925781, "global_step": 292725, "epoch": 1742} {"train_loss": -12.318681716918945, "global_step": 292726, "epoch": 1742} {"train_loss": -12.507532119750977, "global_step": 292727, "epoch": 1742} {"train_loss": -12.270014762878418, "global_step": 292728, "epoch": 1742} {"train_loss": -12.310869216918945, "global_step": 292729, "epoch": 1742} {"train_loss": -12.180177688598633, "global_step": 292730, "epoch": 1742} {"train_loss": -12.397135734558105, "global_step": 292731, "epoch": 1742} {"train_loss": -12.284300804138184, "global_step": 292732, "epoch": 1742} {"train_loss": -12.412086486816406, "global_step": 292733, "epoch": 1742} {"train_loss": -12.357294082641602, "global_step": 292734, "epoch": 1742} {"train_loss": -12.162580490112305, "global_step": 292735, "epoch": 1742} {"train_loss": -12.382792472839355, "global_step": 292736, "epoch": 1742} {"train_loss": -12.441237449645996, "global_step": 292737, "epoch": 1742} {"train_loss": -12.095651626586914, "global_step": 292738, "epoch": 1742} {"train_loss": -12.448646545410156, "global_step": 292739, "epoch": 1742} {"train_loss": -12.522127151489258, "global_step": 292740, "epoch": 1742} {"train_loss": -12.181641578674316, "global_step": 292741, "epoch": 1742} {"train_loss": -12.241859436035156, "global_step": 292742, "epoch": 1742} {"train_loss": -12.449281692504883, "global_step": 292743, "epoch": 1742} {"train_loss": -12.226099014282227, "global_step": 292744, "epoch": 1742} {"train_loss": -12.188371658325195, "global_step": 292745, "epoch": 1742} {"train_loss": -12.422060012817383, "global_step": 292746, "epoch": 1742} {"train_loss": -12.234906196594238, "global_step": 292747, "epoch": 1742} {"train_loss": -12.557571411132812, "global_step": 292748, "epoch": 1742} {"train_loss": -12.481192588806152, "global_step": 292749, "epoch": 1742} {"train_loss": -12.320377349853516, "global_step": 292750, "epoch": 1742} {"train_loss": -12.035011291503906, "global_step": 292751, "epoch": 1742} {"train_loss": -12.387303352355957, "global_step": 292752, "epoch": 1742} {"train_loss": -12.325952529907227, "global_step": 292753, "epoch": 1742} {"train_loss": -11.55303955078125, "global_step": 292754, "epoch": 1742} {"train_loss": -11.961889266967773, "global_step": 292755, "epoch": 1742} {"train_loss": -11.870065689086914, "global_step": 292756, "epoch": 1742} {"train_loss": -11.634984970092773, "global_step": 292757, "epoch": 1742} {"train_loss": -12.12909984588623, "global_step": 292758, "epoch": 1742} {"train_loss": -11.844009399414062, "global_step": 292759, "epoch": 1742} {"train_loss": -12.213033676147461, "global_step": 292760, "epoch": 1742} {"train_loss": -12.080822944641113, "global_step": 292761, "epoch": 1742} {"train_loss": -12.205503463745117, "global_step": 292762, "epoch": 1742} {"train_loss": -10.82545280456543, "global_step": 292763, "epoch": 1742} {"train_loss": -7.59845495223999, "global_step": 292764, "epoch": 1742} {"train_loss": -10.881372451782227, "global_step": 292765, "epoch": 1742} {"train_loss": -6.093868732452393, "global_step": 292766, "epoch": 1742} {"train_loss": -7.04622745513916, "global_step": 292767, "epoch": 1742} {"train_loss": -6.855217933654785, "global_step": 292768, "epoch": 1742} {"train_loss": -7.545026779174805, "global_step": 292769, "epoch": 1742} {"train_loss": -7.148101806640625, "global_step": 292770, "epoch": 1742} {"train_loss": -8.253003120422363, "global_step": 292771, "epoch": 1742} {"train_loss": -7.903005599975586, "global_step": 292772, "epoch": 1742} {"train_loss": -5.999235153198242, "global_step": 292773, "epoch": 1742} {"train_loss": -8.645784378051758, "global_step": 292774, "epoch": 1742} {"train_loss": -8.748029708862305, "global_step": 292775, "epoch": 1742} {"train_loss": -8.795408248901367, "global_step": 292776, "epoch": 1742} {"train_loss": -8.406222343444824, "global_step": 292777, "epoch": 1742} {"train_loss": -7.976127624511719, "global_step": 292778, "epoch": 1742} {"train_loss": -9.840209007263184, "global_step": 292779, "epoch": 1742} {"train_loss": -10.410560607910156, "global_step": 292780, "epoch": 1742} {"train_loss": -9.675395965576172, "global_step": 292781, "epoch": 1742} {"train_loss": -9.609107971191406, "global_step": 292782, "epoch": 1742} {"train_loss": -10.669330596923828, "global_step": 292783, "epoch": 1742} {"train_loss": -10.121488571166992, "global_step": 292784, "epoch": 1742} {"train_loss": -9.929769515991211, "global_step": 292785, "epoch": 1742} {"train_loss": -11.319334030151367, "global_step": 292786, "epoch": 1742} {"train_loss": -9.756662368774414, "global_step": 292787, "epoch": 1742} {"train_loss": -10.922845840454102, "global_step": 292788, "epoch": 1742} {"train_loss": -10.510042190551758, "global_step": 292789, "epoch": 1742} {"train_loss": -10.476574897766113, "global_step": 292790, "epoch": 1742} {"train_loss": -10.550235748291016, "global_step": 292791, "epoch": 1742} {"train_loss": -11.32309341430664, "global_step": 292792, "epoch": 1742} {"train_loss": -10.753669738769531, "global_step": 292793, "epoch": 1742} {"train_loss": -11.212679862976074, "global_step": 292794, "epoch": 1742} {"train_loss": -11.43978214263916, "global_step": 292795, "epoch": 1742} {"train_loss": -11.3912353515625, "global_step": 292796, "epoch": 1742} {"train_loss": -11.247934341430664, "global_step": 292797, "epoch": 1742} {"train_loss": -11.45671272277832, "global_step": 292798, "epoch": 1742} {"train_loss": -11.065849304199219, "global_step": 292799, "epoch": 1742} {"train_loss": -11.553998947143555, "global_step": 292800, "epoch": 1742} {"train_loss": -11.550819396972656, "global_step": 292801, "epoch": 1742} {"train_loss": -11.5548734664917, "global_step": 292802, "epoch": 1742} {"train_loss": -11.522598266601562, "global_step": 292803, "epoch": 1742} {"train_loss": -11.8505220413208, "global_step": 292804, "epoch": 1742} {"train_loss": -11.829244613647461, "global_step": 292805, "epoch": 1742} {"train_loss": -12.033814430236816, "global_step": 292806, "epoch": 1742} {"train_loss": -11.911294937133789, "global_step": 292807, "epoch": 1742} {"train_loss": -11.605791091918945, "global_step": 292808, "epoch": 1742} {"train_loss": -11.863595008850098, "global_step": 292809, "epoch": 1742} {"train_loss": -11.747364044189453, "global_step": 292810, "epoch": 1742} {"train_loss": -11.754339218139648, "global_step": 292811, "epoch": 1742} {"train_loss": -12.073451042175293, "global_step": 292812, "epoch": 1742} {"train_loss": -11.678971290588379, "global_step": 292813, "epoch": 1742} {"train_loss": -11.777322769165039, "global_step": 292814, "epoch": 1742} {"train_loss": -11.614496231079102, "global_step": 292815, "epoch": 1742} {"train_loss": -11.80191707611084, "global_step": 292816, "epoch": 1742} {"train_loss": -12.054759979248047, "global_step": 292817, "epoch": 1742} {"train_loss": -12.079479217529297, "global_step": 292818, "epoch": 1742} {"train_loss": -12.097123146057129, "global_step": 292819, "epoch": 1742} {"train_loss": -11.92674446105957, "global_step": 292820, "epoch": 1742} {"train_loss": -12.107810020446777, "global_step": 292821, "epoch": 1742} {"train_loss": -11.861223220825195, "global_step": 292822, "epoch": 1742} {"train_loss": -11.462241098994301, "global_step": 292823, "epoch": 1742, "val_loss": 276164.5} {"train_loss": -12.015434265136719, "global_step": 292824, "epoch": 1743} {"train_loss": -11.964239120483398, "global_step": 292825, "epoch": 1743} {"train_loss": -12.096802711486816, "global_step": 292826, "epoch": 1743} {"train_loss": -11.836092948913574, "global_step": 292827, "epoch": 1743} {"train_loss": -12.14723014831543, "global_step": 292828, "epoch": 1743} {"train_loss": -12.232854843139648, "global_step": 292829, "epoch": 1743} {"train_loss": -12.082452774047852, "global_step": 292830, "epoch": 1743} {"train_loss": -12.275632858276367, "global_step": 292831, "epoch": 1743} {"train_loss": -12.188623428344727, "global_step": 292832, "epoch": 1743} {"train_loss": -12.212921142578125, "global_step": 292833, "epoch": 1743} {"train_loss": -11.944281578063965, "global_step": 292834, "epoch": 1743} {"train_loss": -12.159555435180664, "global_step": 292835, "epoch": 1743} {"train_loss": -12.33624267578125, "global_step": 292836, "epoch": 1743} {"train_loss": -12.079644203186035, "global_step": 292837, "epoch": 1743} {"train_loss": -12.298803329467773, "global_step": 292838, "epoch": 1743} {"train_loss": -12.078607559204102, "global_step": 292839, "epoch": 1743} {"train_loss": -12.17006778717041, "global_step": 292840, "epoch": 1743} {"train_loss": -12.208776473999023, "global_step": 292841, "epoch": 1743} {"train_loss": -12.034412384033203, "global_step": 292842, "epoch": 1743} {"train_loss": -12.319202423095703, "global_step": 292843, "epoch": 1743} {"train_loss": -12.176513671875, "global_step": 292844, "epoch": 1743} {"train_loss": -12.313523292541504, "global_step": 292845, "epoch": 1743} {"train_loss": -12.131937026977539, "global_step": 292846, "epoch": 1743} {"train_loss": -12.322421073913574, "global_step": 292847, "epoch": 1743} {"train_loss": -12.255382537841797, "global_step": 292848, "epoch": 1743} {"train_loss": -12.211309432983398, "global_step": 292849, "epoch": 1743} {"train_loss": -12.283199310302734, "global_step": 292850, "epoch": 1743} {"train_loss": -12.310303688049316, "global_step": 292851, "epoch": 1743} {"train_loss": -12.302265167236328, "global_step": 292852, "epoch": 1743} {"train_loss": -12.260828018188477, "global_step": 292853, "epoch": 1743} {"train_loss": -12.292937278747559, "global_step": 292854, "epoch": 1743} {"train_loss": -12.343151092529297, "global_step": 292855, "epoch": 1743} {"train_loss": -12.286381721496582, "global_step": 292856, "epoch": 1743} {"train_loss": -12.354493141174316, "global_step": 292857, "epoch": 1743} {"train_loss": -12.2778902053833, "global_step": 292858, "epoch": 1743} {"train_loss": -12.532041549682617, "global_step": 292859, "epoch": 1743} {"train_loss": -12.194622039794922, "global_step": 292860, "epoch": 1743} {"train_loss": -12.23188591003418, "global_step": 292861, "epoch": 1743} {"train_loss": -12.180976867675781, "global_step": 292862, "epoch": 1743} {"train_loss": -12.182731628417969, "global_step": 292863, "epoch": 1743} {"train_loss": -12.140806198120117, "global_step": 292864, "epoch": 1743} {"train_loss": -12.057960510253906, "global_step": 292865, "epoch": 1743} {"train_loss": -12.355965614318848, "global_step": 292866, "epoch": 1743} {"train_loss": -12.293012619018555, "global_step": 292867, "epoch": 1743} {"train_loss": -12.22935676574707, "global_step": 292868, "epoch": 1743} {"train_loss": -11.233752250671387, "global_step": 292869, "epoch": 1743} {"train_loss": -10.96229076385498, "global_step": 292870, "epoch": 1743} {"train_loss": -11.623992919921875, "global_step": 292871, "epoch": 1743} {"train_loss": -12.002206802368164, "global_step": 292872, "epoch": 1743} {"train_loss": -11.15013313293457, "global_step": 292873, "epoch": 1743} {"train_loss": -10.201019287109375, "global_step": 292874, "epoch": 1743} {"train_loss": -11.024989128112793, "global_step": 292875, "epoch": 1743} {"train_loss": -10.120899200439453, "global_step": 292876, "epoch": 1743} {"train_loss": -11.477283477783203, "global_step": 292877, "epoch": 1743} {"train_loss": -11.066490173339844, "global_step": 292878, "epoch": 1743} {"train_loss": -11.193438529968262, "global_step": 292879, "epoch": 1743} {"train_loss": -11.695892333984375, "global_step": 292880, "epoch": 1743} {"train_loss": -11.571966171264648, "global_step": 292881, "epoch": 1743} {"train_loss": -11.421948432922363, "global_step": 292882, "epoch": 1743} {"train_loss": -11.84268856048584, "global_step": 292883, "epoch": 1743} {"train_loss": -11.847427368164062, "global_step": 292884, "epoch": 1743} {"train_loss": -12.019684791564941, "global_step": 292885, "epoch": 1743} {"train_loss": -12.002854347229004, "global_step": 292886, "epoch": 1743} {"train_loss": -11.884315490722656, "global_step": 292887, "epoch": 1743} {"train_loss": -11.831148147583008, "global_step": 292888, "epoch": 1743} {"train_loss": -11.861763000488281, "global_step": 292889, "epoch": 1743} {"train_loss": -11.964231491088867, "global_step": 292890, "epoch": 1743} {"train_loss": -11.547369003295898, "global_step": 292891, "epoch": 1743} {"train_loss": -12.085892677307129, "global_step": 292892, "epoch": 1743} {"train_loss": -11.395009994506836, "global_step": 292893, "epoch": 1743} {"train_loss": -12.036280632019043, "global_step": 292894, "epoch": 1743} {"train_loss": -11.202621459960938, "global_step": 292895, "epoch": 1743} {"train_loss": -11.935378074645996, "global_step": 292896, "epoch": 1743} {"train_loss": -11.470553398132324, "global_step": 292897, "epoch": 1743} {"train_loss": -12.04407024383545, "global_step": 292898, "epoch": 1743} {"train_loss": -11.399534225463867, "global_step": 292899, "epoch": 1743} {"train_loss": -12.19144058227539, "global_step": 292900, "epoch": 1743} {"train_loss": -11.316778182983398, "global_step": 292901, "epoch": 1743} {"train_loss": -12.208540916442871, "global_step": 292902, "epoch": 1743} {"train_loss": -11.544988632202148, "global_step": 292903, "epoch": 1743} {"train_loss": -11.744033813476562, "global_step": 292904, "epoch": 1743} {"train_loss": -11.358756065368652, "global_step": 292905, "epoch": 1743} {"train_loss": -11.83326244354248, "global_step": 292906, "epoch": 1743} {"train_loss": -12.299806594848633, "global_step": 292907, "epoch": 1743} {"train_loss": -12.062826156616211, "global_step": 292908, "epoch": 1743} {"train_loss": -12.004688262939453, "global_step": 292909, "epoch": 1743} {"train_loss": -12.251049995422363, "global_step": 292910, "epoch": 1743} {"train_loss": -12.0410795211792, "global_step": 292911, "epoch": 1743} {"train_loss": -11.974159240722656, "global_step": 292912, "epoch": 1743} {"train_loss": -12.343439102172852, "global_step": 292913, "epoch": 1743} {"train_loss": -11.906156539916992, "global_step": 292914, "epoch": 1743} {"train_loss": -11.80678939819336, "global_step": 292915, "epoch": 1743} {"train_loss": -12.240293502807617, "global_step": 292916, "epoch": 1743} {"train_loss": -11.928874969482422, "global_step": 292917, "epoch": 1743} {"train_loss": -11.637446403503418, "global_step": 292918, "epoch": 1743} {"train_loss": -12.048378944396973, "global_step": 292919, "epoch": 1743} {"train_loss": -11.482367515563965, "global_step": 292920, "epoch": 1743} {"train_loss": -11.909645080566406, "global_step": 292921, "epoch": 1743} {"train_loss": -12.123907089233398, "global_step": 292922, "epoch": 1743} {"train_loss": -11.751630783081055, "global_step": 292923, "epoch": 1743} {"train_loss": -12.336774826049805, "global_step": 292924, "epoch": 1743} {"train_loss": -11.639549255371094, "global_step": 292925, "epoch": 1743} {"train_loss": -11.95966911315918, "global_step": 292926, "epoch": 1743} {"train_loss": -11.73007583618164, "global_step": 292927, "epoch": 1743} {"train_loss": -11.973917961120605, "global_step": 292928, "epoch": 1743} {"train_loss": -12.16882610321045, "global_step": 292929, "epoch": 1743} {"train_loss": -11.907942771911621, "global_step": 292930, "epoch": 1743} {"train_loss": -12.1742582321167, "global_step": 292931, "epoch": 1743} {"train_loss": -11.974860191345215, "global_step": 292932, "epoch": 1743} {"train_loss": -12.257040023803711, "global_step": 292933, "epoch": 1743} {"train_loss": -11.81912612915039, "global_step": 292934, "epoch": 1743} {"train_loss": -12.11533260345459, "global_step": 292935, "epoch": 1743} {"train_loss": -12.026248931884766, "global_step": 292936, "epoch": 1743} {"train_loss": -12.389930725097656, "global_step": 292937, "epoch": 1743} {"train_loss": -12.120336532592773, "global_step": 292938, "epoch": 1743} {"train_loss": -12.178576469421387, "global_step": 292939, "epoch": 1743} {"train_loss": -12.13182258605957, "global_step": 292940, "epoch": 1743} {"train_loss": -12.063958168029785, "global_step": 292941, "epoch": 1743} {"train_loss": -12.093709945678711, "global_step": 292942, "epoch": 1743} {"train_loss": -12.385021209716797, "global_step": 292943, "epoch": 1743} {"train_loss": -12.031685829162598, "global_step": 292944, "epoch": 1743} {"train_loss": -12.102033615112305, "global_step": 292945, "epoch": 1743} {"train_loss": -12.148917198181152, "global_step": 292946, "epoch": 1743} {"train_loss": -12.173707962036133, "global_step": 292947, "epoch": 1743} {"train_loss": -11.930499076843262, "global_step": 292948, "epoch": 1743} {"train_loss": -12.006503105163574, "global_step": 292949, "epoch": 1743} {"train_loss": -12.370404243469238, "global_step": 292950, "epoch": 1743} {"train_loss": -12.186304092407227, "global_step": 292951, "epoch": 1743} {"train_loss": -12.25600528717041, "global_step": 292952, "epoch": 1743} {"train_loss": -11.892091751098633, "global_step": 292953, "epoch": 1743} {"train_loss": -11.914194107055664, "global_step": 292954, "epoch": 1743} {"train_loss": -12.303451538085938, "global_step": 292955, "epoch": 1743} {"train_loss": -12.199628829956055, "global_step": 292956, "epoch": 1743} {"train_loss": -12.093294143676758, "global_step": 292957, "epoch": 1743} {"train_loss": -12.32392692565918, "global_step": 292958, "epoch": 1743} {"train_loss": -12.117521286010742, "global_step": 292959, "epoch": 1743} {"train_loss": -12.146830558776855, "global_step": 292960, "epoch": 1743} {"train_loss": -12.24661636352539, "global_step": 292961, "epoch": 1743} {"train_loss": -12.147884368896484, "global_step": 292962, "epoch": 1743} {"train_loss": -12.02103328704834, "global_step": 292963, "epoch": 1743} {"train_loss": -11.921815872192383, "global_step": 292964, "epoch": 1743} {"train_loss": -11.865455627441406, "global_step": 292965, "epoch": 1743} {"train_loss": -11.743327140808105, "global_step": 292966, "epoch": 1743} {"train_loss": -12.346542358398438, "global_step": 292967, "epoch": 1743} {"train_loss": -11.871208190917969, "global_step": 292968, "epoch": 1743} {"train_loss": -12.106454849243164, "global_step": 292969, "epoch": 1743} {"train_loss": -11.839699745178223, "global_step": 292970, "epoch": 1743} {"train_loss": -11.559711456298828, "global_step": 292971, "epoch": 1743} {"train_loss": -11.591176986694336, "global_step": 292972, "epoch": 1743} {"train_loss": -11.955207824707031, "global_step": 292973, "epoch": 1743} {"train_loss": -12.040597915649414, "global_step": 292974, "epoch": 1743} {"train_loss": -11.406761169433594, "global_step": 292975, "epoch": 1743} {"train_loss": -11.527345657348633, "global_step": 292976, "epoch": 1743} {"train_loss": -11.56474494934082, "global_step": 292977, "epoch": 1743} {"train_loss": -10.631763458251953, "global_step": 292978, "epoch": 1743} {"train_loss": -10.305315017700195, "global_step": 292979, "epoch": 1743} {"train_loss": -11.719666481018066, "global_step": 292980, "epoch": 1743} {"train_loss": -10.968696594238281, "global_step": 292981, "epoch": 1743} {"train_loss": -10.890199661254883, "global_step": 292982, "epoch": 1743} {"train_loss": -11.707526206970215, "global_step": 292983, "epoch": 1743} {"train_loss": -11.572724342346191, "global_step": 292984, "epoch": 1743} {"train_loss": -11.611066818237305, "global_step": 292985, "epoch": 1743} {"train_loss": -11.807806015014648, "global_step": 292986, "epoch": 1743} {"train_loss": -11.527315139770508, "global_step": 292987, "epoch": 1743} {"train_loss": -11.878595352172852, "global_step": 292988, "epoch": 1743} {"train_loss": -11.478883743286133, "global_step": 292989, "epoch": 1743} {"train_loss": -10.827604293823242, "global_step": 292990, "epoch": 1743} {"train_loss": -11.907831118220376, "global_step": 292991, "epoch": 1743, "val_loss": 278468.21875} {"train_loss": -10.930122375488281, "global_step": 292992, "epoch": 1744} {"train_loss": -10.526752471923828, "global_step": 292993, "epoch": 1744} {"train_loss": -11.825101852416992, "global_step": 292994, "epoch": 1744} {"train_loss": -9.277166366577148, "global_step": 292995, "epoch": 1744} {"train_loss": -11.11755084991455, "global_step": 292996, "epoch": 1744} {"train_loss": -9.189323425292969, "global_step": 292997, "epoch": 1744} {"train_loss": -11.091815948486328, "global_step": 292998, "epoch": 1744} {"train_loss": -9.100410461425781, "global_step": 292999, "epoch": 1744} {"train_loss": -11.788415908813477, "global_step": 293000, "epoch": 1744} {"train_loss": -8.74946117401123, "global_step": 293001, "epoch": 1744} {"train_loss": -10.650215148925781, "global_step": 293002, "epoch": 1744} {"train_loss": -11.030803680419922, "global_step": 293003, "epoch": 1744} {"train_loss": -10.18686294555664, "global_step": 293004, "epoch": 1744} {"train_loss": -11.012724876403809, "global_step": 293005, "epoch": 1744} {"train_loss": -9.747537612915039, "global_step": 293006, "epoch": 1744} {"train_loss": -11.261710166931152, "global_step": 293007, "epoch": 1744} {"train_loss": -10.941303253173828, "global_step": 293008, "epoch": 1744} {"train_loss": -11.103534698486328, "global_step": 293009, "epoch": 1744} {"train_loss": -10.996724128723145, "global_step": 293010, "epoch": 1744} {"train_loss": -11.616286277770996, "global_step": 293011, "epoch": 1744} {"train_loss": -11.1961030960083, "global_step": 293012, "epoch": 1744} {"train_loss": -11.465106964111328, "global_step": 293013, "epoch": 1744} {"train_loss": -11.631235122680664, "global_step": 293014, "epoch": 1744} {"train_loss": -11.454997062683105, "global_step": 293015, "epoch": 1744} {"train_loss": -11.33944034576416, "global_step": 293016, "epoch": 1744} {"train_loss": -11.67313003540039, "global_step": 293017, "epoch": 1744} {"train_loss": -11.346468925476074, "global_step": 293018, "epoch": 1744} {"train_loss": -11.873291015625, "global_step": 293019, "epoch": 1744} {"train_loss": -11.804065704345703, "global_step": 293020, "epoch": 1744} {"train_loss": -11.45634651184082, "global_step": 293021, "epoch": 1744} {"train_loss": -11.83249282836914, "global_step": 293022, "epoch": 1744} {"train_loss": -11.262510299682617, "global_step": 293023, "epoch": 1744} {"train_loss": -11.95046615600586, "global_step": 293024, "epoch": 1744} {"train_loss": -11.633129119873047, "global_step": 293025, "epoch": 1744} {"train_loss": -12.045520782470703, "global_step": 293026, "epoch": 1744} {"train_loss": -11.32457447052002, "global_step": 293027, "epoch": 1744} {"train_loss": -11.823701858520508, "global_step": 293028, "epoch": 1744} {"train_loss": -11.491537094116211, "global_step": 293029, "epoch": 1744} {"train_loss": -12.197964668273926, "global_step": 293030, "epoch": 1744} {"train_loss": -11.495893478393555, "global_step": 293031, "epoch": 1744} {"train_loss": -11.798837661743164, "global_step": 293032, "epoch": 1744} {"train_loss": -11.693193435668945, "global_step": 293033, "epoch": 1744} {"train_loss": -11.914663314819336, "global_step": 293034, "epoch": 1744} {"train_loss": -11.893487930297852, "global_step": 293035, "epoch": 1744} {"train_loss": -11.937666893005371, "global_step": 293036, "epoch": 1744} {"train_loss": -12.109240531921387, "global_step": 293037, "epoch": 1744} {"train_loss": -11.860568046569824, "global_step": 293038, "epoch": 1744} {"train_loss": -12.080670356750488, "global_step": 293039, "epoch": 1744} {"train_loss": -12.13798999786377, "global_step": 293040, "epoch": 1744} {"train_loss": -11.874629020690918, "global_step": 293041, "epoch": 1744} {"train_loss": -12.052005767822266, "global_step": 293042, "epoch": 1744} {"train_loss": -12.013311386108398, "global_step": 293043, "epoch": 1744} {"train_loss": -12.039861679077148, "global_step": 293044, "epoch": 1744} {"train_loss": -12.146533966064453, "global_step": 293045, "epoch": 1744} {"train_loss": -12.018281936645508, "global_step": 293046, "epoch": 1744} {"train_loss": -12.220824241638184, "global_step": 293047, "epoch": 1744} {"train_loss": -12.19908618927002, "global_step": 293048, "epoch": 1744} {"train_loss": -12.187573432922363, "global_step": 293049, "epoch": 1744} {"train_loss": -12.293722152709961, "global_step": 293050, "epoch": 1744} {"train_loss": -12.066755294799805, "global_step": 293051, "epoch": 1744} {"train_loss": -12.477701187133789, "global_step": 293052, "epoch": 1744} {"train_loss": -12.38286018371582, "global_step": 293053, "epoch": 1744} {"train_loss": -12.421270370483398, "global_step": 293054, "epoch": 1744} {"train_loss": -12.26763916015625, "global_step": 293055, "epoch": 1744} {"train_loss": -12.128496170043945, "global_step": 293056, "epoch": 1744} {"train_loss": -12.241920471191406, "global_step": 293057, "epoch": 1744} {"train_loss": -12.205101013183594, "global_step": 293058, "epoch": 1744} {"train_loss": -12.161391258239746, "global_step": 293059, "epoch": 1744} {"train_loss": -12.460041046142578, "global_step": 293060, "epoch": 1744} {"train_loss": -12.215601921081543, "global_step": 293061, "epoch": 1744} {"train_loss": -12.288382530212402, "global_step": 293062, "epoch": 1744} {"train_loss": -12.29750919342041, "global_step": 293063, "epoch": 1744} {"train_loss": -12.447880744934082, "global_step": 293064, "epoch": 1744} {"train_loss": -12.44765853881836, "global_step": 293065, "epoch": 1744} {"train_loss": -12.372727394104004, "global_step": 293066, "epoch": 1744} {"train_loss": -12.42849063873291, "global_step": 293067, "epoch": 1744} {"train_loss": -12.402772903442383, "global_step": 293068, "epoch": 1744} {"train_loss": -12.311578750610352, "global_step": 293069, "epoch": 1744} {"train_loss": -12.42582893371582, "global_step": 293070, "epoch": 1744} {"train_loss": -12.340827941894531, "global_step": 293071, "epoch": 1744} {"train_loss": -12.373261451721191, "global_step": 293072, "epoch": 1744} {"train_loss": -12.524320602416992, "global_step": 293073, "epoch": 1744} {"train_loss": -12.450655937194824, "global_step": 293074, "epoch": 1744} {"train_loss": -12.561382293701172, "global_step": 293075, "epoch": 1744} {"train_loss": -12.500394821166992, "global_step": 293076, "epoch": 1744} {"train_loss": -12.588754653930664, "global_step": 293077, "epoch": 1744} {"train_loss": -12.180413246154785, "global_step": 293078, "epoch": 1744} {"train_loss": -12.488906860351562, "global_step": 293079, "epoch": 1744} {"train_loss": -12.27801513671875, "global_step": 293080, "epoch": 1744} {"train_loss": -12.196533203125, "global_step": 293081, "epoch": 1744} {"train_loss": -12.369643211364746, "global_step": 293082, "epoch": 1744} {"train_loss": -12.346094131469727, "global_step": 293083, "epoch": 1744} {"train_loss": -12.01126480102539, "global_step": 293084, "epoch": 1744} {"train_loss": -12.103829383850098, "global_step": 293085, "epoch": 1744} {"train_loss": -12.395099639892578, "global_step": 293086, "epoch": 1744} {"train_loss": -12.105157852172852, "global_step": 293087, "epoch": 1744} {"train_loss": -11.58551025390625, "global_step": 293088, "epoch": 1744} {"train_loss": -11.011643409729004, "global_step": 293089, "epoch": 1744} {"train_loss": -9.73638916015625, "global_step": 293090, "epoch": 1744} {"train_loss": -10.355448722839355, "global_step": 293091, "epoch": 1744} {"train_loss": -8.208938598632812, "global_step": 293092, "epoch": 1744} {"train_loss": -8.200631141662598, "global_step": 293093, "epoch": 1744} {"train_loss": -9.104620933532715, "global_step": 293094, "epoch": 1744} {"train_loss": -9.197474479675293, "global_step": 293095, "epoch": 1744} {"train_loss": -9.796549797058105, "global_step": 293096, "epoch": 1744} {"train_loss": -9.052765846252441, "global_step": 293097, "epoch": 1744} {"train_loss": -8.154869079589844, "global_step": 293098, "epoch": 1744} {"train_loss": -9.442374229431152, "global_step": 293099, "epoch": 1744} {"train_loss": -7.824213981628418, "global_step": 293100, "epoch": 1744} {"train_loss": -8.886734962463379, "global_step": 293101, "epoch": 1744} {"train_loss": -7.323674201965332, "global_step": 293102, "epoch": 1744} {"train_loss": -8.840381622314453, "global_step": 293103, "epoch": 1744} {"train_loss": -9.366450309753418, "global_step": 293104, "epoch": 1744} {"train_loss": -9.727372169494629, "global_step": 293105, "epoch": 1744} {"train_loss": -8.406878471374512, "global_step": 293106, "epoch": 1744} {"train_loss": -9.690381050109863, "global_step": 293107, "epoch": 1744} {"train_loss": -9.807097434997559, "global_step": 293108, "epoch": 1744} {"train_loss": -9.046195983886719, "global_step": 293109, "epoch": 1744} {"train_loss": -9.449031829833984, "global_step": 293110, "epoch": 1744} {"train_loss": -8.816364288330078, "global_step": 293111, "epoch": 1744} {"train_loss": -9.869516372680664, "global_step": 293112, "epoch": 1744} {"train_loss": -9.161466598510742, "global_step": 293113, "epoch": 1744} {"train_loss": -9.55392074584961, "global_step": 293114, "epoch": 1744} {"train_loss": -10.491674423217773, "global_step": 293115, "epoch": 1744} {"train_loss": -9.957491874694824, "global_step": 293116, "epoch": 1744} {"train_loss": -10.22833251953125, "global_step": 293117, "epoch": 1744} {"train_loss": -10.875116348266602, "global_step": 293118, "epoch": 1744} {"train_loss": -10.815784454345703, "global_step": 293119, "epoch": 1744} {"train_loss": -10.37020492553711, "global_step": 293120, "epoch": 1744} {"train_loss": -11.42154598236084, "global_step": 293121, "epoch": 1744} {"train_loss": -10.823918342590332, "global_step": 293122, "epoch": 1744} {"train_loss": -10.539506912231445, "global_step": 293123, "epoch": 1744} {"train_loss": -11.417850494384766, "global_step": 293124, "epoch": 1744} {"train_loss": -10.861167907714844, "global_step": 293125, "epoch": 1744} {"train_loss": -10.801788330078125, "global_step": 293126, "epoch": 1744} {"train_loss": -11.335649490356445, "global_step": 293127, "epoch": 1744} {"train_loss": -11.06356430053711, "global_step": 293128, "epoch": 1744} {"train_loss": -11.210023880004883, "global_step": 293129, "epoch": 1744} {"train_loss": -11.370070457458496, "global_step": 293130, "epoch": 1744} {"train_loss": -11.207382202148438, "global_step": 293131, "epoch": 1744} {"train_loss": -11.436178207397461, "global_step": 293132, "epoch": 1744} {"train_loss": -11.675745010375977, "global_step": 293133, "epoch": 1744} {"train_loss": -11.201417922973633, "global_step": 293134, "epoch": 1744} {"train_loss": -11.630989074707031, "global_step": 293135, "epoch": 1744} {"train_loss": -11.493936538696289, "global_step": 293136, "epoch": 1744} {"train_loss": -11.517087936401367, "global_step": 293137, "epoch": 1744} {"train_loss": -11.426142692565918, "global_step": 293138, "epoch": 1744} {"train_loss": -11.850288391113281, "global_step": 293139, "epoch": 1744} {"train_loss": -11.576587677001953, "global_step": 293140, "epoch": 1744} {"train_loss": -11.50429916381836, "global_step": 293141, "epoch": 1744} {"train_loss": -11.743576049804688, "global_step": 293142, "epoch": 1744} {"train_loss": -11.780366897583008, "global_step": 293143, "epoch": 1744} {"train_loss": -11.616015434265137, "global_step": 293144, "epoch": 1744} {"train_loss": -11.70329475402832, "global_step": 293145, "epoch": 1744} {"train_loss": -11.590738296508789, "global_step": 293146, "epoch": 1744} {"train_loss": -11.66349983215332, "global_step": 293147, "epoch": 1744} {"train_loss": -11.928102493286133, "global_step": 293148, "epoch": 1744} {"train_loss": -11.821985244750977, "global_step": 293149, "epoch": 1744} {"train_loss": -11.707239151000977, "global_step": 293150, "epoch": 1744} {"train_loss": -11.831266403198242, "global_step": 293151, "epoch": 1744} {"train_loss": -11.933122634887695, "global_step": 293152, "epoch": 1744} {"train_loss": -11.753012657165527, "global_step": 293153, "epoch": 1744} {"train_loss": -11.90377140045166, "global_step": 293154, "epoch": 1744} {"train_loss": -12.022453308105469, "global_step": 293155, "epoch": 1744} {"train_loss": -11.797880172729492, "global_step": 293156, "epoch": 1744} {"train_loss": -12.187699317932129, "global_step": 293157, "epoch": 1744} {"train_loss": -12.106566429138184, "global_step": 293158, "epoch": 1744} {"train_loss": -11.260653490111942, "global_step": 293159, "epoch": 1744, "val_loss": 278284.75} {"train_loss": -11.986324310302734, "global_step": 293160, "epoch": 1745} {"train_loss": -11.877254486083984, "global_step": 293161, "epoch": 1745} {"train_loss": -11.763086318969727, "global_step": 293162, "epoch": 1745} {"train_loss": -11.833759307861328, "global_step": 293163, "epoch": 1745} {"train_loss": -12.118402481079102, "global_step": 293164, "epoch": 1745} {"train_loss": -12.085806846618652, "global_step": 293165, "epoch": 1745} {"train_loss": -11.924522399902344, "global_step": 293166, "epoch": 1745} {"train_loss": -12.11731243133545, "global_step": 293167, "epoch": 1745} {"train_loss": -12.158456802368164, "global_step": 293168, "epoch": 1745} {"train_loss": -12.0894775390625, "global_step": 293169, "epoch": 1745} {"train_loss": -12.035837173461914, "global_step": 293170, "epoch": 1745} {"train_loss": -11.827964782714844, "global_step": 293171, "epoch": 1745} {"train_loss": -11.965686798095703, "global_step": 293172, "epoch": 1745} {"train_loss": -12.053861618041992, "global_step": 293173, "epoch": 1745} {"train_loss": -11.845402717590332, "global_step": 293174, "epoch": 1745} {"train_loss": -12.177865982055664, "global_step": 293175, "epoch": 1745} {"train_loss": -11.914960861206055, "global_step": 293176, "epoch": 1745} {"train_loss": -12.244518280029297, "global_step": 293177, "epoch": 1745} {"train_loss": -12.177576065063477, "global_step": 293178, "epoch": 1745} {"train_loss": -11.935409545898438, "global_step": 293179, "epoch": 1745} {"train_loss": -11.9634428024292, "global_step": 293180, "epoch": 1745} {"train_loss": -11.91305923461914, "global_step": 293181, "epoch": 1745} {"train_loss": -12.285110473632812, "global_step": 293182, "epoch": 1745} {"train_loss": -12.059947967529297, "global_step": 293183, "epoch": 1745} {"train_loss": -12.300958633422852, "global_step": 293184, "epoch": 1745} {"train_loss": -11.822463989257812, "global_step": 293185, "epoch": 1745} {"train_loss": -12.110014915466309, "global_step": 293186, "epoch": 1745} {"train_loss": -12.11404800415039, "global_step": 293187, "epoch": 1745} {"train_loss": -12.11429500579834, "global_step": 293188, "epoch": 1745} {"train_loss": -12.088579177856445, "global_step": 293189, "epoch": 1745} {"train_loss": -12.073314666748047, "global_step": 293190, "epoch": 1745} {"train_loss": -12.118387222290039, "global_step": 293191, "epoch": 1745} {"train_loss": -12.41006088256836, "global_step": 293192, "epoch": 1745} {"train_loss": -12.17640495300293, "global_step": 293193, "epoch": 1745} {"train_loss": -11.994495391845703, "global_step": 293194, "epoch": 1745} {"train_loss": -12.303346633911133, "global_step": 293195, "epoch": 1745} {"train_loss": -12.069311141967773, "global_step": 293196, "epoch": 1745} {"train_loss": -12.20763111114502, "global_step": 293197, "epoch": 1745} {"train_loss": -12.417101860046387, "global_step": 293198, "epoch": 1745} {"train_loss": -12.014460563659668, "global_step": 293199, "epoch": 1745} {"train_loss": -12.390254974365234, "global_step": 293200, "epoch": 1745} {"train_loss": -12.318672180175781, "global_step": 293201, "epoch": 1745} {"train_loss": -12.164599418640137, "global_step": 293202, "epoch": 1745} {"train_loss": -12.284589767456055, "global_step": 293203, "epoch": 1745} {"train_loss": -12.015649795532227, "global_step": 293204, "epoch": 1745} {"train_loss": -12.317887306213379, "global_step": 293205, "epoch": 1745} {"train_loss": -12.528644561767578, "global_step": 293206, "epoch": 1745} {"train_loss": -11.964031219482422, "global_step": 293207, "epoch": 1745} {"train_loss": -12.363907814025879, "global_step": 293208, "epoch": 1745} {"train_loss": -12.3145751953125, "global_step": 293209, "epoch": 1745} {"train_loss": -12.275951385498047, "global_step": 293210, "epoch": 1745} {"train_loss": -12.124889373779297, "global_step": 293211, "epoch": 1745} {"train_loss": -12.084365844726562, "global_step": 293212, "epoch": 1745} {"train_loss": -12.388310432434082, "global_step": 293213, "epoch": 1745} {"train_loss": -12.102395057678223, "global_step": 293214, "epoch": 1745} {"train_loss": -12.087209701538086, "global_step": 293215, "epoch": 1745} {"train_loss": -12.57828426361084, "global_step": 293216, "epoch": 1745} {"train_loss": -11.901166915893555, "global_step": 293217, "epoch": 1745} {"train_loss": -12.258196830749512, "global_step": 293218, "epoch": 1745} {"train_loss": -12.414281845092773, "global_step": 293219, "epoch": 1745} {"train_loss": -11.902519226074219, "global_step": 293220, "epoch": 1745} {"train_loss": -12.450115203857422, "global_step": 293221, "epoch": 1745} {"train_loss": -12.044588088989258, "global_step": 293222, "epoch": 1745} {"train_loss": -12.465163230895996, "global_step": 293223, "epoch": 1745} {"train_loss": -11.776603698730469, "global_step": 293224, "epoch": 1745} {"train_loss": -12.424781799316406, "global_step": 293225, "epoch": 1745} {"train_loss": -12.19563102722168, "global_step": 293226, "epoch": 1745} {"train_loss": -12.40810775756836, "global_step": 293227, "epoch": 1745} {"train_loss": -12.134031295776367, "global_step": 293228, "epoch": 1745} {"train_loss": -11.908266067504883, "global_step": 293229, "epoch": 1745} {"train_loss": -12.056140899658203, "global_step": 293230, "epoch": 1745} {"train_loss": -12.449417114257812, "global_step": 293231, "epoch": 1745} {"train_loss": -12.41494369506836, "global_step": 293232, "epoch": 1745} {"train_loss": -12.407983779907227, "global_step": 293233, "epoch": 1745} {"train_loss": -12.132281303405762, "global_step": 293234, "epoch": 1745} {"train_loss": -12.182279586791992, "global_step": 293235, "epoch": 1745} {"train_loss": -12.001384735107422, "global_step": 293236, "epoch": 1745} {"train_loss": -12.067434310913086, "global_step": 293237, "epoch": 1745} {"train_loss": -12.473299980163574, "global_step": 293238, "epoch": 1745} {"train_loss": -12.18856430053711, "global_step": 293239, "epoch": 1745} {"train_loss": -11.950315475463867, "global_step": 293240, "epoch": 1745} {"train_loss": -11.86335277557373, "global_step": 293241, "epoch": 1745} {"train_loss": -11.274574279785156, "global_step": 293242, "epoch": 1745} {"train_loss": -12.136085510253906, "global_step": 293243, "epoch": 1745} {"train_loss": -12.226740837097168, "global_step": 293244, "epoch": 1745} {"train_loss": -11.480705261230469, "global_step": 293245, "epoch": 1745} {"train_loss": -11.943010330200195, "global_step": 293246, "epoch": 1745} {"train_loss": -11.87588119506836, "global_step": 293247, "epoch": 1745} {"train_loss": -11.218233108520508, "global_step": 293248, "epoch": 1745} {"train_loss": -10.995221138000488, "global_step": 293249, "epoch": 1745} {"train_loss": -11.501811981201172, "global_step": 293250, "epoch": 1745} {"train_loss": -8.848020553588867, "global_step": 293251, "epoch": 1745} {"train_loss": -11.61719799041748, "global_step": 293252, "epoch": 1745} {"train_loss": -10.047367095947266, "global_step": 293253, "epoch": 1745} {"train_loss": -9.950860977172852, "global_step": 293254, "epoch": 1745} {"train_loss": -8.210701942443848, "global_step": 293255, "epoch": 1745} {"train_loss": -11.043460845947266, "global_step": 293256, "epoch": 1745} {"train_loss": -9.174201965332031, "global_step": 293257, "epoch": 1745} {"train_loss": -9.705484390258789, "global_step": 293258, "epoch": 1745} {"train_loss": -9.749666213989258, "global_step": 293259, "epoch": 1745} {"train_loss": -10.030342102050781, "global_step": 293260, "epoch": 1745} {"train_loss": -9.996496200561523, "global_step": 293261, "epoch": 1745} {"train_loss": -10.931478500366211, "global_step": 293262, "epoch": 1745} {"train_loss": -8.912818908691406, "global_step": 293263, "epoch": 1745} {"train_loss": -8.297794342041016, "global_step": 293264, "epoch": 1745} {"train_loss": -10.932999610900879, "global_step": 293265, "epoch": 1745} {"train_loss": -8.440211296081543, "global_step": 293266, "epoch": 1745} {"train_loss": -10.22610092163086, "global_step": 293267, "epoch": 1745} {"train_loss": -8.759407043457031, "global_step": 293268, "epoch": 1745} {"train_loss": -9.708247184753418, "global_step": 293269, "epoch": 1745} {"train_loss": -9.836578369140625, "global_step": 293270, "epoch": 1745} {"train_loss": -9.310768127441406, "global_step": 293271, "epoch": 1745} {"train_loss": -9.423200607299805, "global_step": 293272, "epoch": 1745} {"train_loss": -10.510372161865234, "global_step": 293273, "epoch": 1745} {"train_loss": -11.24367904663086, "global_step": 293274, "epoch": 1745} {"train_loss": -9.884469985961914, "global_step": 293275, "epoch": 1745} {"train_loss": -11.054542541503906, "global_step": 293276, "epoch": 1745} {"train_loss": -10.492073059082031, "global_step": 293277, "epoch": 1745} {"train_loss": -10.146158218383789, "global_step": 293278, "epoch": 1745} {"train_loss": -10.584218978881836, "global_step": 293279, "epoch": 1745} {"train_loss": -10.666826248168945, "global_step": 293280, "epoch": 1745} {"train_loss": -10.48175048828125, "global_step": 293281, "epoch": 1745} {"train_loss": -10.798337936401367, "global_step": 293282, "epoch": 1745} {"train_loss": -10.779647827148438, "global_step": 293283, "epoch": 1745} {"train_loss": -10.642190933227539, "global_step": 293284, "epoch": 1745} {"train_loss": -11.01637077331543, "global_step": 293285, "epoch": 1745} {"train_loss": -11.022977828979492, "global_step": 293286, "epoch": 1745} {"train_loss": -10.731443405151367, "global_step": 293287, "epoch": 1745} {"train_loss": -11.24380111694336, "global_step": 293288, "epoch": 1745} {"train_loss": -11.367918014526367, "global_step": 293289, "epoch": 1745} {"train_loss": -10.859565734863281, "global_step": 293290, "epoch": 1745} {"train_loss": -11.710573196411133, "global_step": 293291, "epoch": 1745} {"train_loss": -11.050249099731445, "global_step": 293292, "epoch": 1745} {"train_loss": -11.040245056152344, "global_step": 293293, "epoch": 1745} {"train_loss": -11.776705741882324, "global_step": 293294, "epoch": 1745} {"train_loss": -11.18635368347168, "global_step": 293295, "epoch": 1745} {"train_loss": -11.296621322631836, "global_step": 293296, "epoch": 1745} {"train_loss": -11.40388298034668, "global_step": 293297, "epoch": 1745} {"train_loss": -11.43539810180664, "global_step": 293298, "epoch": 1745} {"train_loss": -11.808982849121094, "global_step": 293299, "epoch": 1745} {"train_loss": -11.466211318969727, "global_step": 293300, "epoch": 1745} {"train_loss": -11.561607360839844, "global_step": 293301, "epoch": 1745} {"train_loss": -11.793018341064453, "global_step": 293302, "epoch": 1745} {"train_loss": -11.880638122558594, "global_step": 293303, "epoch": 1745} {"train_loss": -11.588197708129883, "global_step": 293304, "epoch": 1745} {"train_loss": -11.625955581665039, "global_step": 293305, "epoch": 1745} {"train_loss": -11.725025177001953, "global_step": 293306, "epoch": 1745} {"train_loss": -11.917600631713867, "global_step": 293307, "epoch": 1745} {"train_loss": -11.902217864990234, "global_step": 293308, "epoch": 1745} {"train_loss": -11.680042266845703, "global_step": 293309, "epoch": 1745} {"train_loss": -11.829719543457031, "global_step": 293310, "epoch": 1745} {"train_loss": -12.053461074829102, "global_step": 293311, "epoch": 1745} {"train_loss": -11.791418075561523, "global_step": 293312, "epoch": 1745} {"train_loss": -11.95065689086914, "global_step": 293313, "epoch": 1745} {"train_loss": -12.073160171508789, "global_step": 293314, "epoch": 1745} {"train_loss": -11.942098617553711, "global_step": 293315, "epoch": 1745} {"train_loss": -12.018998146057129, "global_step": 293316, "epoch": 1745} {"train_loss": -11.966972351074219, "global_step": 293317, "epoch": 1745} {"train_loss": -11.969217300415039, "global_step": 293318, "epoch": 1745} {"train_loss": -11.830902099609375, "global_step": 293319, "epoch": 1745} {"train_loss": -12.023391723632812, "global_step": 293320, "epoch": 1745} {"train_loss": -11.978108406066895, "global_step": 293321, "epoch": 1745} {"train_loss": -12.034430503845215, "global_step": 293322, "epoch": 1745} {"train_loss": -12.095800399780273, "global_step": 293323, "epoch": 1745} {"train_loss": -12.214229583740234, "global_step": 293324, "epoch": 1745} {"train_loss": -12.179027557373047, "global_step": 293325, "epoch": 1745} {"train_loss": -12.146844863891602, "global_step": 293326, "epoch": 1745} {"train_loss": -11.564637462298075, "global_step": 293327, "epoch": 1745, "val_loss": 275042.375, "train_action_mse_error": 2.0057287216186523} {"train_loss": -12.34107780456543, "global_step": 293328, "epoch": 1746} {"train_loss": -12.273971557617188, "global_step": 293329, "epoch": 1746} {"train_loss": -12.050328254699707, "global_step": 293330, "epoch": 1746} {"train_loss": -12.248680114746094, "global_step": 293331, "epoch": 1746} {"train_loss": -12.14200496673584, "global_step": 293332, "epoch": 1746} {"train_loss": -12.297170639038086, "global_step": 293333, "epoch": 1746} {"train_loss": -12.043180465698242, "global_step": 293334, "epoch": 1746} {"train_loss": -12.307311058044434, "global_step": 293335, "epoch": 1746} {"train_loss": -12.23611068725586, "global_step": 293336, "epoch": 1746} {"train_loss": -12.19456672668457, "global_step": 293337, "epoch": 1746} {"train_loss": -12.170004844665527, "global_step": 293338, "epoch": 1746} {"train_loss": -11.949983596801758, "global_step": 293339, "epoch": 1746} {"train_loss": -11.896764755249023, "global_step": 293340, "epoch": 1746} {"train_loss": -12.00859546661377, "global_step": 293341, "epoch": 1746} {"train_loss": -10.429693222045898, "global_step": 293342, "epoch": 1746} {"train_loss": -11.663795471191406, "global_step": 293343, "epoch": 1746} {"train_loss": -12.101876258850098, "global_step": 293344, "epoch": 1746} {"train_loss": -11.550847053527832, "global_step": 293345, "epoch": 1746} {"train_loss": -11.294485092163086, "global_step": 293346, "epoch": 1746} {"train_loss": -11.69964599609375, "global_step": 293347, "epoch": 1746} {"train_loss": -12.054014205932617, "global_step": 293348, "epoch": 1746} {"train_loss": -11.20284652709961, "global_step": 293349, "epoch": 1746} {"train_loss": -10.997283935546875, "global_step": 293350, "epoch": 1746} {"train_loss": -12.07925796508789, "global_step": 293351, "epoch": 1746} {"train_loss": -11.7382173538208, "global_step": 293352, "epoch": 1746} {"train_loss": -11.585638046264648, "global_step": 293353, "epoch": 1746} {"train_loss": -12.074259757995605, "global_step": 293354, "epoch": 1746} {"train_loss": -11.637664794921875, "global_step": 293355, "epoch": 1746} {"train_loss": -11.540319442749023, "global_step": 293356, "epoch": 1746} {"train_loss": -12.187379837036133, "global_step": 293357, "epoch": 1746} {"train_loss": -11.989128112792969, "global_step": 293358, "epoch": 1746} {"train_loss": -11.673128128051758, "global_step": 293359, "epoch": 1746} {"train_loss": -11.92905330657959, "global_step": 293360, "epoch": 1746} {"train_loss": -11.993589401245117, "global_step": 293361, "epoch": 1746} {"train_loss": -11.855331420898438, "global_step": 293362, "epoch": 1746} {"train_loss": -12.086617469787598, "global_step": 293363, "epoch": 1746} {"train_loss": -12.116168975830078, "global_step": 293364, "epoch": 1746} {"train_loss": -11.894499778747559, "global_step": 293365, "epoch": 1746} {"train_loss": -12.125168800354004, "global_step": 293366, "epoch": 1746} {"train_loss": -12.08958625793457, "global_step": 293367, "epoch": 1746} {"train_loss": -12.126466751098633, "global_step": 293368, "epoch": 1746} {"train_loss": -11.75502872467041, "global_step": 293369, "epoch": 1746} {"train_loss": -11.387954711914062, "global_step": 293370, "epoch": 1746} {"train_loss": -11.840679168701172, "global_step": 293371, "epoch": 1746} {"train_loss": -12.10159683227539, "global_step": 293372, "epoch": 1746} {"train_loss": -11.760002136230469, "global_step": 293373, "epoch": 1746} {"train_loss": -11.798870086669922, "global_step": 293374, "epoch": 1746} {"train_loss": -11.937616348266602, "global_step": 293375, "epoch": 1746} {"train_loss": -11.660663604736328, "global_step": 293376, "epoch": 1746} {"train_loss": -12.140539169311523, "global_step": 293377, "epoch": 1746} {"train_loss": -11.71705436706543, "global_step": 293378, "epoch": 1746} {"train_loss": -12.28584098815918, "global_step": 293379, "epoch": 1746} {"train_loss": -12.121091842651367, "global_step": 293380, "epoch": 1746} {"train_loss": -12.295318603515625, "global_step": 293381, "epoch": 1746} {"train_loss": -11.892974853515625, "global_step": 293382, "epoch": 1746} {"train_loss": -12.242162704467773, "global_step": 293383, "epoch": 1746} {"train_loss": -11.167618751525879, "global_step": 293384, "epoch": 1746} {"train_loss": -11.062484741210938, "global_step": 293385, "epoch": 1746} {"train_loss": -11.720117568969727, "global_step": 293386, "epoch": 1746} {"train_loss": -12.165685653686523, "global_step": 293387, "epoch": 1746} {"train_loss": -11.788877487182617, "global_step": 293388, "epoch": 1746} {"train_loss": -12.268436431884766, "global_step": 293389, "epoch": 1746} {"train_loss": -12.026263236999512, "global_step": 293390, "epoch": 1746} {"train_loss": -11.913445472717285, "global_step": 293391, "epoch": 1746} {"train_loss": -11.717460632324219, "global_step": 293392, "epoch": 1746} {"train_loss": -12.530525207519531, "global_step": 293393, "epoch": 1746} {"train_loss": -11.541369438171387, "global_step": 293394, "epoch": 1746} {"train_loss": -11.048203468322754, "global_step": 293395, "epoch": 1746} {"train_loss": -11.838866233825684, "global_step": 293396, "epoch": 1746} {"train_loss": -12.099931716918945, "global_step": 293397, "epoch": 1746} {"train_loss": -11.56282901763916, "global_step": 293398, "epoch": 1746} {"train_loss": -11.887365341186523, "global_step": 293399, "epoch": 1746} {"train_loss": -11.515226364135742, "global_step": 293400, "epoch": 1746} {"train_loss": -10.99553108215332, "global_step": 293401, "epoch": 1746} {"train_loss": -11.910784721374512, "global_step": 293402, "epoch": 1746} {"train_loss": -10.445854187011719, "global_step": 293403, "epoch": 1746} {"train_loss": -10.165836334228516, "global_step": 293404, "epoch": 1746} {"train_loss": -10.435796737670898, "global_step": 293405, "epoch": 1746} {"train_loss": -8.495382308959961, "global_step": 293406, "epoch": 1746} {"train_loss": -9.105599403381348, "global_step": 293407, "epoch": 1746} {"train_loss": -9.951589584350586, "global_step": 293408, "epoch": 1746} {"train_loss": -9.478754043579102, "global_step": 293409, "epoch": 1746} {"train_loss": -9.967856407165527, "global_step": 293410, "epoch": 1746} {"train_loss": -9.5830078125, "global_step": 293411, "epoch": 1746} {"train_loss": -9.952354431152344, "global_step": 293412, "epoch": 1746} {"train_loss": -10.501441955566406, "global_step": 293413, "epoch": 1746} {"train_loss": -11.0101900100708, "global_step": 293414, "epoch": 1746} {"train_loss": -9.992359161376953, "global_step": 293415, "epoch": 1746} {"train_loss": -10.434761047363281, "global_step": 293416, "epoch": 1746} {"train_loss": -11.033706665039062, "global_step": 293417, "epoch": 1746} {"train_loss": -10.503767013549805, "global_step": 293418, "epoch": 1746} {"train_loss": -10.268260955810547, "global_step": 293419, "epoch": 1746} {"train_loss": -10.807193756103516, "global_step": 293420, "epoch": 1746} {"train_loss": -9.886910438537598, "global_step": 293421, "epoch": 1746} {"train_loss": -11.291683197021484, "global_step": 293422, "epoch": 1746} {"train_loss": -9.264999389648438, "global_step": 293423, "epoch": 1746} {"train_loss": -10.992940902709961, "global_step": 293424, "epoch": 1746} {"train_loss": -10.384532928466797, "global_step": 293425, "epoch": 1746} {"train_loss": -10.807527542114258, "global_step": 293426, "epoch": 1746} {"train_loss": -10.5330810546875, "global_step": 293427, "epoch": 1746} {"train_loss": -10.799883842468262, "global_step": 293428, "epoch": 1746} {"train_loss": -10.624773025512695, "global_step": 293429, "epoch": 1746} {"train_loss": -11.340194702148438, "global_step": 293430, "epoch": 1746} {"train_loss": -9.89349365234375, "global_step": 293431, "epoch": 1746} {"train_loss": -11.45016860961914, "global_step": 293432, "epoch": 1746} {"train_loss": -11.534062385559082, "global_step": 293433, "epoch": 1746} {"train_loss": -10.65608024597168, "global_step": 293434, "epoch": 1746} {"train_loss": -11.540068626403809, "global_step": 293435, "epoch": 1746} {"train_loss": -11.335575103759766, "global_step": 293436, "epoch": 1746} {"train_loss": -11.324509620666504, "global_step": 293437, "epoch": 1746} {"train_loss": -11.799513816833496, "global_step": 293438, "epoch": 1746} {"train_loss": -11.089365005493164, "global_step": 293439, "epoch": 1746} {"train_loss": -11.4196138381958, "global_step": 293440, "epoch": 1746} {"train_loss": -11.677125930786133, "global_step": 293441, "epoch": 1746} {"train_loss": -11.523900032043457, "global_step": 293442, "epoch": 1746} {"train_loss": -11.835553169250488, "global_step": 293443, "epoch": 1746} {"train_loss": -11.817544937133789, "global_step": 293444, "epoch": 1746} {"train_loss": -11.628196716308594, "global_step": 293445, "epoch": 1746} {"train_loss": -11.904937744140625, "global_step": 293446, "epoch": 1746} {"train_loss": -11.622774124145508, "global_step": 293447, "epoch": 1746} {"train_loss": -11.865306854248047, "global_step": 293448, "epoch": 1746} {"train_loss": -11.718986511230469, "global_step": 293449, "epoch": 1746} {"train_loss": -11.769432067871094, "global_step": 293450, "epoch": 1746} {"train_loss": -11.562460899353027, "global_step": 293451, "epoch": 1746} {"train_loss": -11.923234939575195, "global_step": 293452, "epoch": 1746} {"train_loss": -11.966446876525879, "global_step": 293453, "epoch": 1746} {"train_loss": -11.872762680053711, "global_step": 293454, "epoch": 1746} {"train_loss": -11.770626068115234, "global_step": 293455, "epoch": 1746} {"train_loss": -11.787269592285156, "global_step": 293456, "epoch": 1746} {"train_loss": -11.916383743286133, "global_step": 293457, "epoch": 1746} {"train_loss": -11.904037475585938, "global_step": 293458, "epoch": 1746} {"train_loss": -11.947263717651367, "global_step": 293459, "epoch": 1746} {"train_loss": -11.885974884033203, "global_step": 293460, "epoch": 1746} {"train_loss": -11.964319229125977, "global_step": 293461, "epoch": 1746} {"train_loss": -11.839986801147461, "global_step": 293462, "epoch": 1746} {"train_loss": -11.821861267089844, "global_step": 293463, "epoch": 1746} {"train_loss": -11.876136779785156, "global_step": 293464, "epoch": 1746} {"train_loss": -11.950580596923828, "global_step": 293465, "epoch": 1746} {"train_loss": -12.132951736450195, "global_step": 293466, "epoch": 1746} {"train_loss": -12.098437309265137, "global_step": 293467, "epoch": 1746} {"train_loss": -11.977563858032227, "global_step": 293468, "epoch": 1746} {"train_loss": -12.170797348022461, "global_step": 293469, "epoch": 1746} {"train_loss": -12.106472969055176, "global_step": 293470, "epoch": 1746} {"train_loss": -12.086617469787598, "global_step": 293471, "epoch": 1746} {"train_loss": -12.202407836914062, "global_step": 293472, "epoch": 1746} {"train_loss": -12.22117805480957, "global_step": 293473, "epoch": 1746} {"train_loss": -12.191997528076172, "global_step": 293474, "epoch": 1746} {"train_loss": -12.07252311706543, "global_step": 293475, "epoch": 1746} {"train_loss": -12.132269859313965, "global_step": 293476, "epoch": 1746} {"train_loss": -12.039192199707031, "global_step": 293477, "epoch": 1746} {"train_loss": -12.011614799499512, "global_step": 293478, "epoch": 1746} {"train_loss": -12.331522941589355, "global_step": 293479, "epoch": 1746} {"train_loss": -11.903075218200684, "global_step": 293480, "epoch": 1746} {"train_loss": -12.097611427307129, "global_step": 293481, "epoch": 1746} {"train_loss": -11.866456985473633, "global_step": 293482, "epoch": 1746} {"train_loss": -12.270975112915039, "global_step": 293483, "epoch": 1746} {"train_loss": -12.201837539672852, "global_step": 293484, "epoch": 1746} {"train_loss": -12.27569580078125, "global_step": 293485, "epoch": 1746} {"train_loss": -12.463448524475098, "global_step": 293486, "epoch": 1746} {"train_loss": -12.448152542114258, "global_step": 293487, "epoch": 1746} {"train_loss": -12.06197738647461, "global_step": 293488, "epoch": 1746} {"train_loss": -12.1954345703125, "global_step": 293489, "epoch": 1746} {"train_loss": -11.934155464172363, "global_step": 293490, "epoch": 1746} {"train_loss": -12.218690872192383, "global_step": 293491, "epoch": 1746} {"train_loss": -12.094989776611328, "global_step": 293492, "epoch": 1746} {"train_loss": -12.211874008178711, "global_step": 293493, "epoch": 1746} {"train_loss": -12.338716506958008, "global_step": 293494, "epoch": 1746} {"train_loss": -11.605132750102452, "global_step": 293495, "epoch": 1746, "val_loss": 271464.75} {"train_loss": -12.299089431762695, "global_step": 293496, "epoch": 1747} {"train_loss": -12.466776847839355, "global_step": 293497, "epoch": 1747} {"train_loss": -12.448402404785156, "global_step": 293498, "epoch": 1747} {"train_loss": -12.280656814575195, "global_step": 293499, "epoch": 1747} {"train_loss": -12.284990310668945, "global_step": 293500, "epoch": 1747} {"train_loss": -12.480978012084961, "global_step": 293501, "epoch": 1747} {"train_loss": -12.202820777893066, "global_step": 293502, "epoch": 1747} {"train_loss": -12.353179931640625, "global_step": 293503, "epoch": 1747} {"train_loss": -12.341022491455078, "global_step": 293504, "epoch": 1747} {"train_loss": -12.047152519226074, "global_step": 293505, "epoch": 1747} {"train_loss": -12.14549446105957, "global_step": 293506, "epoch": 1747} {"train_loss": -11.969720840454102, "global_step": 293507, "epoch": 1747} {"train_loss": -11.9180269241333, "global_step": 293508, "epoch": 1747} {"train_loss": -12.1981201171875, "global_step": 293509, "epoch": 1747} {"train_loss": -12.05239486694336, "global_step": 293510, "epoch": 1747} {"train_loss": -11.89206314086914, "global_step": 293511, "epoch": 1747} {"train_loss": -12.13922119140625, "global_step": 293512, "epoch": 1747} {"train_loss": -11.98668384552002, "global_step": 293513, "epoch": 1747} {"train_loss": -12.535468101501465, "global_step": 293514, "epoch": 1747} {"train_loss": -11.675621032714844, "global_step": 293515, "epoch": 1747} {"train_loss": -12.084760665893555, "global_step": 293516, "epoch": 1747} {"train_loss": -11.928388595581055, "global_step": 293517, "epoch": 1747} {"train_loss": -11.923158645629883, "global_step": 293518, "epoch": 1747} {"train_loss": -12.503506660461426, "global_step": 293519, "epoch": 1747} {"train_loss": -11.706656455993652, "global_step": 293520, "epoch": 1747} {"train_loss": -12.660652160644531, "global_step": 293521, "epoch": 1747} {"train_loss": -11.46474838256836, "global_step": 293522, "epoch": 1747} {"train_loss": -11.65658187866211, "global_step": 293523, "epoch": 1747} {"train_loss": -11.805046081542969, "global_step": 293524, "epoch": 1747} {"train_loss": -11.813796043395996, "global_step": 293525, "epoch": 1747} {"train_loss": -12.381607055664062, "global_step": 293526, "epoch": 1747} {"train_loss": -11.946208000183105, "global_step": 293527, "epoch": 1747} {"train_loss": -10.352089881896973, "global_step": 293528, "epoch": 1747} {"train_loss": -10.203866958618164, "global_step": 293529, "epoch": 1747} {"train_loss": -11.44153881072998, "global_step": 293530, "epoch": 1747} {"train_loss": -11.652800559997559, "global_step": 293531, "epoch": 1747} {"train_loss": -10.323429107666016, "global_step": 293532, "epoch": 1747} {"train_loss": -10.867947578430176, "global_step": 293533, "epoch": 1747} {"train_loss": -11.32689094543457, "global_step": 293534, "epoch": 1747} {"train_loss": -11.737140655517578, "global_step": 293535, "epoch": 1747} {"train_loss": -11.170625686645508, "global_step": 293536, "epoch": 1747} {"train_loss": -11.885650634765625, "global_step": 293537, "epoch": 1747} {"train_loss": -11.520606994628906, "global_step": 293538, "epoch": 1747} {"train_loss": -11.433974266052246, "global_step": 293539, "epoch": 1747} {"train_loss": -11.846956253051758, "global_step": 293540, "epoch": 1747} {"train_loss": -10.908658027648926, "global_step": 293541, "epoch": 1747} {"train_loss": -11.744306564331055, "global_step": 293542, "epoch": 1747} {"train_loss": -11.228571891784668, "global_step": 293543, "epoch": 1747} {"train_loss": -11.502103805541992, "global_step": 293544, "epoch": 1747} {"train_loss": -11.125893592834473, "global_step": 293545, "epoch": 1747} {"train_loss": -11.42393684387207, "global_step": 293546, "epoch": 1747} {"train_loss": -11.48038101196289, "global_step": 293547, "epoch": 1747} {"train_loss": -10.437750816345215, "global_step": 293548, "epoch": 1747} {"train_loss": -11.360832214355469, "global_step": 293549, "epoch": 1747} {"train_loss": -11.263043403625488, "global_step": 293550, "epoch": 1747} {"train_loss": -11.46957015991211, "global_step": 293551, "epoch": 1747} {"train_loss": -11.522232055664062, "global_step": 293552, "epoch": 1747} {"train_loss": -11.553752899169922, "global_step": 293553, "epoch": 1747} {"train_loss": -11.617012023925781, "global_step": 293554, "epoch": 1747} {"train_loss": -11.598950386047363, "global_step": 293555, "epoch": 1747} {"train_loss": -11.69061279296875, "global_step": 293556, "epoch": 1747} {"train_loss": -11.350831031799316, "global_step": 293557, "epoch": 1747} {"train_loss": -11.917118072509766, "global_step": 293558, "epoch": 1747} {"train_loss": -11.159303665161133, "global_step": 293559, "epoch": 1747} {"train_loss": -11.599710464477539, "global_step": 293560, "epoch": 1747} {"train_loss": -11.492965698242188, "global_step": 293561, "epoch": 1747} {"train_loss": -11.189464569091797, "global_step": 293562, "epoch": 1747} {"train_loss": -11.94528579711914, "global_step": 293563, "epoch": 1747} {"train_loss": -11.05714225769043, "global_step": 293564, "epoch": 1747} {"train_loss": -11.57303237915039, "global_step": 293565, "epoch": 1747} {"train_loss": -11.695760726928711, "global_step": 293566, "epoch": 1747} {"train_loss": -11.482404708862305, "global_step": 293567, "epoch": 1747} {"train_loss": -11.885747909545898, "global_step": 293568, "epoch": 1747} {"train_loss": -11.578144073486328, "global_step": 293569, "epoch": 1747} {"train_loss": -11.860587120056152, "global_step": 293570, "epoch": 1747} {"train_loss": -11.559091567993164, "global_step": 293571, "epoch": 1747} {"train_loss": -12.009981155395508, "global_step": 293572, "epoch": 1747} {"train_loss": -11.660888671875, "global_step": 293573, "epoch": 1747} {"train_loss": -12.008858680725098, "global_step": 293574, "epoch": 1747} {"train_loss": -11.96568489074707, "global_step": 293575, "epoch": 1747} {"train_loss": -11.633639335632324, "global_step": 293576, "epoch": 1747} {"train_loss": -11.242368698120117, "global_step": 293577, "epoch": 1747} {"train_loss": -11.829383850097656, "global_step": 293578, "epoch": 1747} {"train_loss": -11.446554183959961, "global_step": 293579, "epoch": 1747} {"train_loss": -11.696560859680176, "global_step": 293580, "epoch": 1747} {"train_loss": -11.325568199157715, "global_step": 293581, "epoch": 1747} {"train_loss": -11.673595428466797, "global_step": 293582, "epoch": 1747} {"train_loss": -11.551812171936035, "global_step": 293583, "epoch": 1747} {"train_loss": -11.057180404663086, "global_step": 293584, "epoch": 1747} {"train_loss": -11.895482063293457, "global_step": 293585, "epoch": 1747} {"train_loss": -11.502242088317871, "global_step": 293586, "epoch": 1747} {"train_loss": -11.943506240844727, "global_step": 293587, "epoch": 1747} {"train_loss": -11.855682373046875, "global_step": 293588, "epoch": 1747} {"train_loss": -11.852112770080566, "global_step": 293589, "epoch": 1747} {"train_loss": -11.718286514282227, "global_step": 293590, "epoch": 1747} {"train_loss": -11.957442283630371, "global_step": 293591, "epoch": 1747} {"train_loss": -11.69521713256836, "global_step": 293592, "epoch": 1747} {"train_loss": -11.875, "global_step": 293593, "epoch": 1747} {"train_loss": -11.894964218139648, "global_step": 293594, "epoch": 1747} {"train_loss": -11.518192291259766, "global_step": 293595, "epoch": 1747} {"train_loss": -12.19522476196289, "global_step": 293596, "epoch": 1747} {"train_loss": -11.796733856201172, "global_step": 293597, "epoch": 1747} {"train_loss": -12.098681449890137, "global_step": 293598, "epoch": 1747} {"train_loss": -11.682861328125, "global_step": 293599, "epoch": 1747} {"train_loss": -12.131356239318848, "global_step": 293600, "epoch": 1747} {"train_loss": -11.615619659423828, "global_step": 293601, "epoch": 1747} {"train_loss": -11.687139511108398, "global_step": 293602, "epoch": 1747} {"train_loss": -11.628053665161133, "global_step": 293603, "epoch": 1747} {"train_loss": -11.532875061035156, "global_step": 293604, "epoch": 1747} {"train_loss": -11.848297119140625, "global_step": 293605, "epoch": 1747} {"train_loss": -12.015583038330078, "global_step": 293606, "epoch": 1747} {"train_loss": -11.366832733154297, "global_step": 293607, "epoch": 1747} {"train_loss": -12.160058975219727, "global_step": 293608, "epoch": 1747} {"train_loss": -11.205124855041504, "global_step": 293609, "epoch": 1747} {"train_loss": -11.912517547607422, "global_step": 293610, "epoch": 1747} {"train_loss": -11.95005989074707, "global_step": 293611, "epoch": 1747} {"train_loss": -12.057849884033203, "global_step": 293612, "epoch": 1747} {"train_loss": -11.991968154907227, "global_step": 293613, "epoch": 1747} {"train_loss": -11.775569915771484, "global_step": 293614, "epoch": 1747} {"train_loss": -11.860589981079102, "global_step": 293615, "epoch": 1747} {"train_loss": -11.962764739990234, "global_step": 293616, "epoch": 1747} {"train_loss": -11.699613571166992, "global_step": 293617, "epoch": 1747} {"train_loss": -12.078017234802246, "global_step": 293618, "epoch": 1747} {"train_loss": -11.598081588745117, "global_step": 293619, "epoch": 1747} {"train_loss": -11.812594413757324, "global_step": 293620, "epoch": 1747} {"train_loss": -12.015298843383789, "global_step": 293621, "epoch": 1747} {"train_loss": -11.57426929473877, "global_step": 293622, "epoch": 1747} {"train_loss": -11.684732437133789, "global_step": 293623, "epoch": 1747} {"train_loss": -12.128466606140137, "global_step": 293624, "epoch": 1747} {"train_loss": -11.955950736999512, "global_step": 293625, "epoch": 1747} {"train_loss": -12.05667781829834, "global_step": 293626, "epoch": 1747} {"train_loss": -11.976251602172852, "global_step": 293627, "epoch": 1747} {"train_loss": -12.433700561523438, "global_step": 293628, "epoch": 1747} {"train_loss": -12.199881553649902, "global_step": 293629, "epoch": 1747} {"train_loss": -12.06295394897461, "global_step": 293630, "epoch": 1747} {"train_loss": -12.168352127075195, "global_step": 293631, "epoch": 1747} {"train_loss": -12.339029312133789, "global_step": 293632, "epoch": 1747} {"train_loss": -12.021053314208984, "global_step": 293633, "epoch": 1747} {"train_loss": -12.229467391967773, "global_step": 293634, "epoch": 1747} {"train_loss": -12.31100845336914, "global_step": 293635, "epoch": 1747} {"train_loss": -12.182112693786621, "global_step": 293636, "epoch": 1747} {"train_loss": -12.09396743774414, "global_step": 293637, "epoch": 1747} {"train_loss": -12.32115364074707, "global_step": 293638, "epoch": 1747} {"train_loss": -12.1242036819458, "global_step": 293639, "epoch": 1747} {"train_loss": -12.328316688537598, "global_step": 293640, "epoch": 1747} {"train_loss": -12.471370697021484, "global_step": 293641, "epoch": 1747} {"train_loss": -12.074764251708984, "global_step": 293642, "epoch": 1747} {"train_loss": -12.347597122192383, "global_step": 293643, "epoch": 1747} {"train_loss": -12.368330001831055, "global_step": 293644, "epoch": 1747} {"train_loss": -12.07108211517334, "global_step": 293645, "epoch": 1747} {"train_loss": -12.372056007385254, "global_step": 293646, "epoch": 1747} {"train_loss": -12.069208145141602, "global_step": 293647, "epoch": 1747} {"train_loss": -11.980426788330078, "global_step": 293648, "epoch": 1747} {"train_loss": -12.023744583129883, "global_step": 293649, "epoch": 1747} {"train_loss": -11.949481964111328, "global_step": 293650, "epoch": 1747} {"train_loss": -11.861869812011719, "global_step": 293651, "epoch": 1747} {"train_loss": -12.03737735748291, "global_step": 293652, "epoch": 1747} {"train_loss": -11.852895736694336, "global_step": 293653, "epoch": 1747} {"train_loss": -12.253335952758789, "global_step": 293654, "epoch": 1747} {"train_loss": -12.193326950073242, "global_step": 293655, "epoch": 1747} {"train_loss": -11.935028076171875, "global_step": 293656, "epoch": 1747} {"train_loss": -11.883779525756836, "global_step": 293657, "epoch": 1747} {"train_loss": -12.02542495727539, "global_step": 293658, "epoch": 1747} {"train_loss": -11.419465065002441, "global_step": 293659, "epoch": 1747} {"train_loss": -12.392373085021973, "global_step": 293660, "epoch": 1747} {"train_loss": -11.866926193237305, "global_step": 293661, "epoch": 1747} {"train_loss": -12.343345642089844, "global_step": 293662, "epoch": 1747} {"train_loss": -11.815159905524482, "global_step": 293663, "epoch": 1747, "val_loss": 276653.46875} {"train_loss": -12.093673706054688, "global_step": 293664, "epoch": 1748} {"train_loss": -11.313332557678223, "global_step": 293665, "epoch": 1748} {"train_loss": -11.70689582824707, "global_step": 293666, "epoch": 1748} {"train_loss": -11.541986465454102, "global_step": 293667, "epoch": 1748} {"train_loss": -11.640523910522461, "global_step": 293668, "epoch": 1748} {"train_loss": -11.766580581665039, "global_step": 293669, "epoch": 1748} {"train_loss": -11.545246124267578, "global_step": 293670, "epoch": 1748} {"train_loss": -11.20623779296875, "global_step": 293671, "epoch": 1748} {"train_loss": -11.541748046875, "global_step": 293672, "epoch": 1748} {"train_loss": -11.379195213317871, "global_step": 293673, "epoch": 1748} {"train_loss": -11.642526626586914, "global_step": 293674, "epoch": 1748} {"train_loss": -11.432416915893555, "global_step": 293675, "epoch": 1748} {"train_loss": -11.826029777526855, "global_step": 293676, "epoch": 1748} {"train_loss": -11.560338020324707, "global_step": 293677, "epoch": 1748} {"train_loss": -12.08888053894043, "global_step": 293678, "epoch": 1748} {"train_loss": -11.784950256347656, "global_step": 293679, "epoch": 1748} {"train_loss": -11.399971961975098, "global_step": 293680, "epoch": 1748} {"train_loss": -11.728282928466797, "global_step": 293681, "epoch": 1748} {"train_loss": -11.157379150390625, "global_step": 293682, "epoch": 1748} {"train_loss": -11.390853881835938, "global_step": 293683, "epoch": 1748} {"train_loss": -11.451139450073242, "global_step": 293684, "epoch": 1748} {"train_loss": -11.066217422485352, "global_step": 293685, "epoch": 1748} {"train_loss": -10.892345428466797, "global_step": 293686, "epoch": 1748} {"train_loss": -11.619194030761719, "global_step": 293687, "epoch": 1748} {"train_loss": -11.592039108276367, "global_step": 293688, "epoch": 1748} {"train_loss": -11.747047424316406, "global_step": 293689, "epoch": 1748} {"train_loss": -11.786977767944336, "global_step": 293690, "epoch": 1748} {"train_loss": -11.22419548034668, "global_step": 293691, "epoch": 1748} {"train_loss": -12.181842803955078, "global_step": 293692, "epoch": 1748} {"train_loss": -10.742498397827148, "global_step": 293693, "epoch": 1748} {"train_loss": -11.126352310180664, "global_step": 293694, "epoch": 1748} {"train_loss": -11.594768524169922, "global_step": 293695, "epoch": 1748} {"train_loss": -11.504936218261719, "global_step": 293696, "epoch": 1748} {"train_loss": -11.124815940856934, "global_step": 293697, "epoch": 1748} {"train_loss": -11.765548706054688, "global_step": 293698, "epoch": 1748} {"train_loss": -11.555069923400879, "global_step": 293699, "epoch": 1748} {"train_loss": -11.90011978149414, "global_step": 293700, "epoch": 1748} {"train_loss": -11.91987419128418, "global_step": 293701, "epoch": 1748} {"train_loss": -11.572637557983398, "global_step": 293702, "epoch": 1748} {"train_loss": -11.640350341796875, "global_step": 293703, "epoch": 1748} {"train_loss": -11.449199676513672, "global_step": 293704, "epoch": 1748} {"train_loss": -12.006783485412598, "global_step": 293705, "epoch": 1748} {"train_loss": -11.541372299194336, "global_step": 293706, "epoch": 1748} {"train_loss": -11.731548309326172, "global_step": 293707, "epoch": 1748} {"train_loss": -11.997591972351074, "global_step": 293708, "epoch": 1748} {"train_loss": -11.881372451782227, "global_step": 293709, "epoch": 1748} {"train_loss": -12.166436195373535, "global_step": 293710, "epoch": 1748} {"train_loss": -12.156494140625, "global_step": 293711, "epoch": 1748} {"train_loss": -11.790964126586914, "global_step": 293712, "epoch": 1748} {"train_loss": -12.02243423461914, "global_step": 293713, "epoch": 1748} {"train_loss": -11.976885795593262, "global_step": 293714, "epoch": 1748} {"train_loss": -12.136216163635254, "global_step": 293715, "epoch": 1748} {"train_loss": -11.938179969787598, "global_step": 293716, "epoch": 1748} {"train_loss": -12.264122009277344, "global_step": 293717, "epoch": 1748} {"train_loss": -12.141841888427734, "global_step": 293718, "epoch": 1748} {"train_loss": -12.23431396484375, "global_step": 293719, "epoch": 1748} {"train_loss": -12.165298461914062, "global_step": 293720, "epoch": 1748} {"train_loss": -12.183212280273438, "global_step": 293721, "epoch": 1748} {"train_loss": -11.951981544494629, "global_step": 293722, "epoch": 1748} {"train_loss": -12.046363830566406, "global_step": 293723, "epoch": 1748} {"train_loss": -11.998380661010742, "global_step": 293724, "epoch": 1748} {"train_loss": -11.990440368652344, "global_step": 293725, "epoch": 1748} {"train_loss": -11.919607162475586, "global_step": 293726, "epoch": 1748} {"train_loss": -11.851259231567383, "global_step": 293727, "epoch": 1748} {"train_loss": -11.75029182434082, "global_step": 293728, "epoch": 1748} {"train_loss": -12.326827049255371, "global_step": 293729, "epoch": 1748} {"train_loss": -12.08668041229248, "global_step": 293730, "epoch": 1748} {"train_loss": -12.282072067260742, "global_step": 293731, "epoch": 1748} {"train_loss": -12.147659301757812, "global_step": 293732, "epoch": 1748} {"train_loss": -12.072649002075195, "global_step": 293733, "epoch": 1748} {"train_loss": -12.204666137695312, "global_step": 293734, "epoch": 1748} {"train_loss": -12.159514427185059, "global_step": 293735, "epoch": 1748} {"train_loss": -12.241134643554688, "global_step": 293736, "epoch": 1748} {"train_loss": -11.984173774719238, "global_step": 293737, "epoch": 1748} {"train_loss": -12.266669273376465, "global_step": 293738, "epoch": 1748} {"train_loss": -12.151275634765625, "global_step": 293739, "epoch": 1748} {"train_loss": -12.30842399597168, "global_step": 293740, "epoch": 1748} {"train_loss": -12.028975486755371, "global_step": 293741, "epoch": 1748} {"train_loss": -11.747564315795898, "global_step": 293742, "epoch": 1748} {"train_loss": -11.63519287109375, "global_step": 293743, "epoch": 1748} {"train_loss": -11.9412841796875, "global_step": 293744, "epoch": 1748} {"train_loss": -11.855267524719238, "global_step": 293745, "epoch": 1748} {"train_loss": -12.147441864013672, "global_step": 293746, "epoch": 1748} {"train_loss": -12.224114418029785, "global_step": 293747, "epoch": 1748} {"train_loss": -12.293137550354004, "global_step": 293748, "epoch": 1748} {"train_loss": -12.102241516113281, "global_step": 293749, "epoch": 1748} {"train_loss": -12.076400756835938, "global_step": 293750, "epoch": 1748} {"train_loss": -12.170049667358398, "global_step": 293751, "epoch": 1748} {"train_loss": -12.43835735321045, "global_step": 293752, "epoch": 1748} {"train_loss": -11.998285293579102, "global_step": 293753, "epoch": 1748} {"train_loss": -12.518064498901367, "global_step": 293754, "epoch": 1748} {"train_loss": -12.078032493591309, "global_step": 293755, "epoch": 1748} {"train_loss": -12.260976791381836, "global_step": 293756, "epoch": 1748} {"train_loss": -12.378305435180664, "global_step": 293757, "epoch": 1748} {"train_loss": -12.227588653564453, "global_step": 293758, "epoch": 1748} {"train_loss": -12.497086524963379, "global_step": 293759, "epoch": 1748} {"train_loss": -12.049795150756836, "global_step": 293760, "epoch": 1748} {"train_loss": -12.205694198608398, "global_step": 293761, "epoch": 1748} {"train_loss": -11.890625, "global_step": 293762, "epoch": 1748} {"train_loss": -12.480711936950684, "global_step": 293763, "epoch": 1748} {"train_loss": -12.426688194274902, "global_step": 293764, "epoch": 1748} {"train_loss": -12.246580123901367, "global_step": 293765, "epoch": 1748} {"train_loss": -11.96165657043457, "global_step": 293766, "epoch": 1748} {"train_loss": -11.6412992477417, "global_step": 293767, "epoch": 1748} {"train_loss": -11.808334350585938, "global_step": 293768, "epoch": 1748} {"train_loss": -12.04011344909668, "global_step": 293769, "epoch": 1748} {"train_loss": -11.871758460998535, "global_step": 293770, "epoch": 1748} {"train_loss": -11.189102172851562, "global_step": 293771, "epoch": 1748} {"train_loss": -10.663962364196777, "global_step": 293772, "epoch": 1748} {"train_loss": -12.118703842163086, "global_step": 293773, "epoch": 1748} {"train_loss": -10.299334526062012, "global_step": 293774, "epoch": 1748} {"train_loss": -9.671703338623047, "global_step": 293775, "epoch": 1748} {"train_loss": -10.636329650878906, "global_step": 293776, "epoch": 1748} {"train_loss": -7.59282112121582, "global_step": 293777, "epoch": 1748} {"train_loss": -7.871253967285156, "global_step": 293778, "epoch": 1748} {"train_loss": -7.548011302947998, "global_step": 293779, "epoch": 1748} {"train_loss": -8.61910343170166, "global_step": 293780, "epoch": 1748} {"train_loss": -9.177875518798828, "global_step": 293781, "epoch": 1748} {"train_loss": -8.047294616699219, "global_step": 293782, "epoch": 1748} {"train_loss": -8.031856536865234, "global_step": 293783, "epoch": 1748} {"train_loss": -9.113856315612793, "global_step": 293784, "epoch": 1748} {"train_loss": -8.865006446838379, "global_step": 293785, "epoch": 1748} {"train_loss": -7.170042991638184, "global_step": 293786, "epoch": 1748} {"train_loss": -9.21220588684082, "global_step": 293787, "epoch": 1748} {"train_loss": -9.079277992248535, "global_step": 293788, "epoch": 1748} {"train_loss": -8.694360733032227, "global_step": 293789, "epoch": 1748} {"train_loss": -10.079782485961914, "global_step": 293790, "epoch": 1748} {"train_loss": -8.897754669189453, "global_step": 293791, "epoch": 1748} {"train_loss": -9.225204467773438, "global_step": 293792, "epoch": 1748} {"train_loss": -10.231501579284668, "global_step": 293793, "epoch": 1748} {"train_loss": -9.671475410461426, "global_step": 293794, "epoch": 1748} {"train_loss": -9.303665161132812, "global_step": 293795, "epoch": 1748} {"train_loss": -9.299614906311035, "global_step": 293796, "epoch": 1748} {"train_loss": -8.593940734863281, "global_step": 293797, "epoch": 1748} {"train_loss": -10.15774917602539, "global_step": 293798, "epoch": 1748} {"train_loss": -10.407247543334961, "global_step": 293799, "epoch": 1748} {"train_loss": -10.44744873046875, "global_step": 293800, "epoch": 1748} {"train_loss": -10.988204956054688, "global_step": 293801, "epoch": 1748} {"train_loss": -10.71557331085205, "global_step": 293802, "epoch": 1748} {"train_loss": -10.48691463470459, "global_step": 293803, "epoch": 1748} {"train_loss": -10.97864818572998, "global_step": 293804, "epoch": 1748} {"train_loss": -10.921550750732422, "global_step": 293805, "epoch": 1748} {"train_loss": -11.211322784423828, "global_step": 293806, "epoch": 1748} {"train_loss": -10.709891319274902, "global_step": 293807, "epoch": 1748} {"train_loss": -11.176864624023438, "global_step": 293808, "epoch": 1748} {"train_loss": -11.075620651245117, "global_step": 293809, "epoch": 1748} {"train_loss": -11.11401081085205, "global_step": 293810, "epoch": 1748} {"train_loss": -11.433164596557617, "global_step": 293811, "epoch": 1748} {"train_loss": -11.024900436401367, "global_step": 293812, "epoch": 1748} {"train_loss": -11.768635749816895, "global_step": 293813, "epoch": 1748} {"train_loss": -11.432680130004883, "global_step": 293814, "epoch": 1748} {"train_loss": -11.445728302001953, "global_step": 293815, "epoch": 1748} {"train_loss": -11.596525192260742, "global_step": 293816, "epoch": 1748} {"train_loss": -11.803451538085938, "global_step": 293817, "epoch": 1748} {"train_loss": -11.444419860839844, "global_step": 293818, "epoch": 1748} {"train_loss": -11.758843421936035, "global_step": 293819, "epoch": 1748} {"train_loss": -11.582921981811523, "global_step": 293820, "epoch": 1748} {"train_loss": -11.416044235229492, "global_step": 293821, "epoch": 1748} {"train_loss": -11.742291450500488, "global_step": 293822, "epoch": 1748} {"train_loss": -11.647706031799316, "global_step": 293823, "epoch": 1748} {"train_loss": -11.783882141113281, "global_step": 293824, "epoch": 1748} {"train_loss": -11.750107765197754, "global_step": 293825, "epoch": 1748} {"train_loss": -11.65045166015625, "global_step": 293826, "epoch": 1748} {"train_loss": -11.65783977508545, "global_step": 293827, "epoch": 1748} {"train_loss": -11.867349624633789, "global_step": 293828, "epoch": 1748} {"train_loss": -11.641679763793945, "global_step": 293829, "epoch": 1748} {"train_loss": -11.619124412536621, "global_step": 293830, "epoch": 1748} {"train_loss": -11.330849247319358, "global_step": 293831, "epoch": 1748, "val_loss": 279249.53125} {"train_loss": -11.979554176330566, "global_step": 293832, "epoch": 1749} {"train_loss": -11.663314819335938, "global_step": 293833, "epoch": 1749} {"train_loss": -11.61188793182373, "global_step": 293834, "epoch": 1749} {"train_loss": -11.741243362426758, "global_step": 293835, "epoch": 1749} {"train_loss": -12.055288314819336, "global_step": 293836, "epoch": 1749} {"train_loss": -11.889581680297852, "global_step": 293837, "epoch": 1749} {"train_loss": -11.541110038757324, "global_step": 293838, "epoch": 1749} {"train_loss": -12.052314758300781, "global_step": 293839, "epoch": 1749} {"train_loss": -11.916278839111328, "global_step": 293840, "epoch": 1749} {"train_loss": -12.054159164428711, "global_step": 293841, "epoch": 1749} {"train_loss": -11.76488208770752, "global_step": 293842, "epoch": 1749} {"train_loss": -11.732986450195312, "global_step": 293843, "epoch": 1749} {"train_loss": -11.897459983825684, "global_step": 293844, "epoch": 1749} {"train_loss": -11.979486465454102, "global_step": 293845, "epoch": 1749} {"train_loss": -11.995131492614746, "global_step": 293846, "epoch": 1749} {"train_loss": -11.959939956665039, "global_step": 293847, "epoch": 1749} {"train_loss": -12.154701232910156, "global_step": 293848, "epoch": 1749} {"train_loss": -12.033103942871094, "global_step": 293849, "epoch": 1749} {"train_loss": -12.15014362335205, "global_step": 293850, "epoch": 1749} {"train_loss": -12.145227432250977, "global_step": 293851, "epoch": 1749} {"train_loss": -12.019567489624023, "global_step": 293852, "epoch": 1749} {"train_loss": -12.09155559539795, "global_step": 293853, "epoch": 1749} {"train_loss": -12.258875846862793, "global_step": 293854, "epoch": 1749} {"train_loss": -12.213363647460938, "global_step": 293855, "epoch": 1749} {"train_loss": -12.222846984863281, "global_step": 293856, "epoch": 1749} {"train_loss": -12.22927474975586, "global_step": 293857, "epoch": 1749} {"train_loss": -12.250385284423828, "global_step": 293858, "epoch": 1749} {"train_loss": -12.029314041137695, "global_step": 293859, "epoch": 1749} {"train_loss": -12.202875137329102, "global_step": 293860, "epoch": 1749} {"train_loss": -12.059746742248535, "global_step": 293861, "epoch": 1749} {"train_loss": -12.185063362121582, "global_step": 293862, "epoch": 1749} {"train_loss": -12.004003524780273, "global_step": 293863, "epoch": 1749} {"train_loss": -12.135298728942871, "global_step": 293864, "epoch": 1749} {"train_loss": -12.007634162902832, "global_step": 293865, "epoch": 1749} {"train_loss": -12.316757202148438, "global_step": 293866, "epoch": 1749} {"train_loss": -12.072047233581543, "global_step": 293867, "epoch": 1749} {"train_loss": -12.25838851928711, "global_step": 293868, "epoch": 1749} {"train_loss": -12.202112197875977, "global_step": 293869, "epoch": 1749} {"train_loss": -12.207662582397461, "global_step": 293870, "epoch": 1749} {"train_loss": -11.956844329833984, "global_step": 293871, "epoch": 1749} {"train_loss": -12.120494842529297, "global_step": 293872, "epoch": 1749} {"train_loss": -11.869828224182129, "global_step": 293873, "epoch": 1749} {"train_loss": -11.685527801513672, "global_step": 293874, "epoch": 1749} {"train_loss": -11.702929496765137, "global_step": 293875, "epoch": 1749} {"train_loss": -12.287971496582031, "global_step": 293876, "epoch": 1749} {"train_loss": -11.71280288696289, "global_step": 293877, "epoch": 1749} {"train_loss": -11.684040069580078, "global_step": 293878, "epoch": 1749} {"train_loss": -12.41994857788086, "global_step": 293879, "epoch": 1749} {"train_loss": -11.735417366027832, "global_step": 293880, "epoch": 1749} {"train_loss": -11.772991180419922, "global_step": 293881, "epoch": 1749} {"train_loss": -12.272359848022461, "global_step": 293882, "epoch": 1749} {"train_loss": -11.939234733581543, "global_step": 293883, "epoch": 1749} {"train_loss": -12.215133666992188, "global_step": 293884, "epoch": 1749} {"train_loss": -11.843868255615234, "global_step": 293885, "epoch": 1749} {"train_loss": -11.872489929199219, "global_step": 293886, "epoch": 1749} {"train_loss": -11.266168594360352, "global_step": 293887, "epoch": 1749} {"train_loss": -11.433253288269043, "global_step": 293888, "epoch": 1749} {"train_loss": -12.226419448852539, "global_step": 293889, "epoch": 1749} {"train_loss": -11.321609497070312, "global_step": 293890, "epoch": 1749} {"train_loss": -10.456084251403809, "global_step": 293891, "epoch": 1749} {"train_loss": -11.289010047912598, "global_step": 293892, "epoch": 1749} {"train_loss": -11.888962745666504, "global_step": 293893, "epoch": 1749} {"train_loss": -10.460697174072266, "global_step": 293894, "epoch": 1749} {"train_loss": -10.712581634521484, "global_step": 293895, "epoch": 1749} {"train_loss": -10.651491165161133, "global_step": 293896, "epoch": 1749} {"train_loss": -9.338849067687988, "global_step": 293897, "epoch": 1749} {"train_loss": -8.995808601379395, "global_step": 293898, "epoch": 1749} {"train_loss": -11.024372100830078, "global_step": 293899, "epoch": 1749} {"train_loss": -10.249092102050781, "global_step": 293900, "epoch": 1749} {"train_loss": -9.228853225708008, "global_step": 293901, "epoch": 1749} {"train_loss": -9.960399627685547, "global_step": 293902, "epoch": 1749} {"train_loss": -10.416582107543945, "global_step": 293903, "epoch": 1749} {"train_loss": -10.765216827392578, "global_step": 293904, "epoch": 1749} {"train_loss": -11.502344131469727, "global_step": 293905, "epoch": 1749} {"train_loss": -11.182138442993164, "global_step": 293906, "epoch": 1749} {"train_loss": -11.455907821655273, "global_step": 293907, "epoch": 1749} {"train_loss": -11.452890396118164, "global_step": 293908, "epoch": 1749} {"train_loss": -11.215474128723145, "global_step": 293909, "epoch": 1749} {"train_loss": -11.565169334411621, "global_step": 293910, "epoch": 1749} {"train_loss": -10.925716400146484, "global_step": 293911, "epoch": 1749} {"train_loss": -11.655613899230957, "global_step": 293912, "epoch": 1749} {"train_loss": -11.073213577270508, "global_step": 293913, "epoch": 1749} {"train_loss": -11.944485664367676, "global_step": 293914, "epoch": 1749} {"train_loss": -10.633285522460938, "global_step": 293915, "epoch": 1749} {"train_loss": -11.8343505859375, "global_step": 293916, "epoch": 1749} {"train_loss": -11.296385765075684, "global_step": 293917, "epoch": 1749} {"train_loss": -11.458195686340332, "global_step": 293918, "epoch": 1749} {"train_loss": -11.663288116455078, "global_step": 293919, "epoch": 1749} {"train_loss": -11.246397972106934, "global_step": 293920, "epoch": 1749} {"train_loss": -11.852519035339355, "global_step": 293921, "epoch": 1749} {"train_loss": -11.70218276977539, "global_step": 293922, "epoch": 1749} {"train_loss": -11.600634574890137, "global_step": 293923, "epoch": 1749} {"train_loss": -11.739774703979492, "global_step": 293924, "epoch": 1749} {"train_loss": -12.101024627685547, "global_step": 293925, "epoch": 1749} {"train_loss": -11.707365036010742, "global_step": 293926, "epoch": 1749} {"train_loss": -11.929574966430664, "global_step": 293927, "epoch": 1749} {"train_loss": -11.917853355407715, "global_step": 293928, "epoch": 1749} {"train_loss": -12.06362533569336, "global_step": 293929, "epoch": 1749} {"train_loss": -11.896940231323242, "global_step": 293930, "epoch": 1749} {"train_loss": -12.039899826049805, "global_step": 293931, "epoch": 1749} {"train_loss": -12.209068298339844, "global_step": 293932, "epoch": 1749} {"train_loss": -11.944740295410156, "global_step": 293933, "epoch": 1749} {"train_loss": -12.153640747070312, "global_step": 293934, "epoch": 1749} {"train_loss": -11.965322494506836, "global_step": 293935, "epoch": 1749} {"train_loss": -11.90096664428711, "global_step": 293936, "epoch": 1749} {"train_loss": -12.121310234069824, "global_step": 293937, "epoch": 1749} {"train_loss": -11.960561752319336, "global_step": 293938, "epoch": 1749} {"train_loss": -12.133779525756836, "global_step": 293939, "epoch": 1749} {"train_loss": -11.968801498413086, "global_step": 293940, "epoch": 1749} {"train_loss": -12.305809020996094, "global_step": 293941, "epoch": 1749} {"train_loss": -11.979089736938477, "global_step": 293942, "epoch": 1749} {"train_loss": -11.957008361816406, "global_step": 293943, "epoch": 1749} {"train_loss": -12.019099235534668, "global_step": 293944, "epoch": 1749} {"train_loss": -11.9986572265625, "global_step": 293945, "epoch": 1749} {"train_loss": -11.824356079101562, "global_step": 293946, "epoch": 1749} {"train_loss": -12.411837577819824, "global_step": 293947, "epoch": 1749} {"train_loss": -11.714338302612305, "global_step": 293948, "epoch": 1749} {"train_loss": -12.297069549560547, "global_step": 293949, "epoch": 1749} {"train_loss": -11.997905731201172, "global_step": 293950, "epoch": 1749} {"train_loss": -12.00900650024414, "global_step": 293951, "epoch": 1749} {"train_loss": -12.301395416259766, "global_step": 293952, "epoch": 1749} {"train_loss": -12.25941276550293, "global_step": 293953, "epoch": 1749} {"train_loss": -12.190839767456055, "global_step": 293954, "epoch": 1749} {"train_loss": -11.982829093933105, "global_step": 293955, "epoch": 1749} {"train_loss": -12.017254829406738, "global_step": 293956, "epoch": 1749} {"train_loss": -12.42763900756836, "global_step": 293957, "epoch": 1749} {"train_loss": -12.304167747497559, "global_step": 293958, "epoch": 1749} {"train_loss": -12.165882110595703, "global_step": 293959, "epoch": 1749} {"train_loss": -12.334622383117676, "global_step": 293960, "epoch": 1749} {"train_loss": -12.148112297058105, "global_step": 293961, "epoch": 1749} {"train_loss": -12.265900611877441, "global_step": 293962, "epoch": 1749} {"train_loss": -12.388824462890625, "global_step": 293963, "epoch": 1749} {"train_loss": -12.144025802612305, "global_step": 293964, "epoch": 1749} {"train_loss": -12.12672233581543, "global_step": 293965, "epoch": 1749} {"train_loss": -12.26199722290039, "global_step": 293966, "epoch": 1749} {"train_loss": -12.297266960144043, "global_step": 293967, "epoch": 1749} {"train_loss": -12.40501880645752, "global_step": 293968, "epoch": 1749} {"train_loss": -12.091320037841797, "global_step": 293969, "epoch": 1749} {"train_loss": -12.515932083129883, "global_step": 293970, "epoch": 1749} {"train_loss": -12.14289665222168, "global_step": 293971, "epoch": 1749} {"train_loss": -12.45432186126709, "global_step": 293972, "epoch": 1749} {"train_loss": -12.213321685791016, "global_step": 293973, "epoch": 1749} {"train_loss": -12.354406356811523, "global_step": 293974, "epoch": 1749} {"train_loss": -12.128825187683105, "global_step": 293975, "epoch": 1749} {"train_loss": -12.394686698913574, "global_step": 293976, "epoch": 1749} {"train_loss": -12.308124542236328, "global_step": 293977, "epoch": 1749} {"train_loss": -12.027339935302734, "global_step": 293978, "epoch": 1749} {"train_loss": -12.2228364944458, "global_step": 293979, "epoch": 1749} {"train_loss": -12.408096313476562, "global_step": 293980, "epoch": 1749} {"train_loss": -12.346116065979004, "global_step": 293981, "epoch": 1749} {"train_loss": -12.14959716796875, "global_step": 293982, "epoch": 1749} {"train_loss": -12.15938949584961, "global_step": 293983, "epoch": 1749} {"train_loss": -12.14657211303711, "global_step": 293984, "epoch": 1749} {"train_loss": -11.55514907836914, "global_step": 293985, "epoch": 1749} {"train_loss": -11.187448501586914, "global_step": 293986, "epoch": 1749} {"train_loss": -12.039685249328613, "global_step": 293987, "epoch": 1749} {"train_loss": -11.518354415893555, "global_step": 293988, "epoch": 1749} {"train_loss": -10.267292022705078, "global_step": 293989, "epoch": 1749} {"train_loss": -10.746026992797852, "global_step": 293990, "epoch": 1749} {"train_loss": -9.103788375854492, "global_step": 293991, "epoch": 1749} {"train_loss": -9.710906028747559, "global_step": 293992, "epoch": 1749} {"train_loss": -10.212238311767578, "global_step": 293993, "epoch": 1749} {"train_loss": -8.934011459350586, "global_step": 293994, "epoch": 1749} {"train_loss": -10.839899063110352, "global_step": 293995, "epoch": 1749} {"train_loss": -8.316182136535645, "global_step": 293996, "epoch": 1749} {"train_loss": -9.696638107299805, "global_step": 293997, "epoch": 1749} {"train_loss": -10.828737258911133, "global_step": 293998, "epoch": 1749} {"train_loss": -11.690563116754804, "global_step": 293999, "epoch": 1749, "val_loss": 277882.46875} {"train_loss": -10.911848068237305, "global_step": 294000, "epoch": 1750} {"train_loss": -10.372222900390625, "global_step": 294001, "epoch": 1750} {"train_loss": -9.337738037109375, "global_step": 294002, "epoch": 1750} {"train_loss": -11.172344207763672, "global_step": 294003, "epoch": 1750} {"train_loss": -8.131175994873047, "global_step": 294004, "epoch": 1750} {"train_loss": -9.04714584350586, "global_step": 294005, "epoch": 1750} {"train_loss": -9.14867877960205, "global_step": 294006, "epoch": 1750} {"train_loss": -10.395930290222168, "global_step": 294007, "epoch": 1750} {"train_loss": -8.187405586242676, "global_step": 294008, "epoch": 1750} {"train_loss": -9.945859909057617, "global_step": 294009, "epoch": 1750} {"train_loss": -8.721551895141602, "global_step": 294010, "epoch": 1750} {"train_loss": -10.236412048339844, "global_step": 294011, "epoch": 1750} {"train_loss": -9.662581443786621, "global_step": 294012, "epoch": 1750} {"train_loss": -9.63371467590332, "global_step": 294013, "epoch": 1750} {"train_loss": -10.720418930053711, "global_step": 294014, "epoch": 1750} {"train_loss": -9.953386306762695, "global_step": 294015, "epoch": 1750} {"train_loss": -10.989794731140137, "global_step": 294016, "epoch": 1750} {"train_loss": -10.69381332397461, "global_step": 294017, "epoch": 1750} {"train_loss": -10.6202392578125, "global_step": 294018, "epoch": 1750} {"train_loss": -10.748035430908203, "global_step": 294019, "epoch": 1750} {"train_loss": -10.772533416748047, "global_step": 294020, "epoch": 1750} {"train_loss": -10.127288818359375, "global_step": 294021, "epoch": 1750} {"train_loss": -11.15118408203125, "global_step": 294022, "epoch": 1750} {"train_loss": -10.580262184143066, "global_step": 294023, "epoch": 1750} {"train_loss": -11.256906509399414, "global_step": 294024, "epoch": 1750} {"train_loss": -11.094791412353516, "global_step": 294025, "epoch": 1750} {"train_loss": -11.15970230102539, "global_step": 294026, "epoch": 1750} {"train_loss": -10.878061294555664, "global_step": 294027, "epoch": 1750} {"train_loss": -11.190938949584961, "global_step": 294028, "epoch": 1750} {"train_loss": -11.484073638916016, "global_step": 294029, "epoch": 1750} {"train_loss": -11.17033576965332, "global_step": 294030, "epoch": 1750} {"train_loss": -11.445539474487305, "global_step": 294031, "epoch": 1750} {"train_loss": -11.537296295166016, "global_step": 294032, "epoch": 1750} {"train_loss": -11.465575218200684, "global_step": 294033, "epoch": 1750} {"train_loss": -11.560275077819824, "global_step": 294034, "epoch": 1750} {"train_loss": -11.49756908416748, "global_step": 294035, "epoch": 1750} {"train_loss": -11.640693664550781, "global_step": 294036, "epoch": 1750} {"train_loss": -11.606840133666992, "global_step": 294037, "epoch": 1750} {"train_loss": -11.522703170776367, "global_step": 294038, "epoch": 1750} {"train_loss": -11.631492614746094, "global_step": 294039, "epoch": 1750} {"train_loss": -11.516427993774414, "global_step": 294040, "epoch": 1750} {"train_loss": -11.590304374694824, "global_step": 294041, "epoch": 1750} {"train_loss": -11.716765403747559, "global_step": 294042, "epoch": 1750} {"train_loss": -11.69758129119873, "global_step": 294043, "epoch": 1750} {"train_loss": -11.765581130981445, "global_step": 294044, "epoch": 1750} {"train_loss": -11.81355094909668, "global_step": 294045, "epoch": 1750} {"train_loss": -11.596037864685059, "global_step": 294046, "epoch": 1750} {"train_loss": -11.847696304321289, "global_step": 294047, "epoch": 1750} {"train_loss": -11.744478225708008, "global_step": 294048, "epoch": 1750} {"train_loss": -11.859426498413086, "global_step": 294049, "epoch": 1750} {"train_loss": -11.769618034362793, "global_step": 294050, "epoch": 1750} {"train_loss": -11.942581176757812, "global_step": 294051, "epoch": 1750} {"train_loss": -11.831977844238281, "global_step": 294052, "epoch": 1750} {"train_loss": -11.956539154052734, "global_step": 294053, "epoch": 1750} {"train_loss": -12.021284103393555, "global_step": 294054, "epoch": 1750} {"train_loss": -11.871158599853516, "global_step": 294055, "epoch": 1750} {"train_loss": -11.943324089050293, "global_step": 294056, "epoch": 1750} {"train_loss": -12.00023078918457, "global_step": 294057, "epoch": 1750} {"train_loss": -12.020317077636719, "global_step": 294058, "epoch": 1750} {"train_loss": -11.92049789428711, "global_step": 294059, "epoch": 1750} {"train_loss": -11.916321754455566, "global_step": 294060, "epoch": 1750} {"train_loss": -12.023015975952148, "global_step": 294061, "epoch": 1750} {"train_loss": -12.128124237060547, "global_step": 294062, "epoch": 1750} {"train_loss": -12.183509826660156, "global_step": 294063, "epoch": 1750} {"train_loss": -12.12248420715332, "global_step": 294064, "epoch": 1750} {"train_loss": -12.104448318481445, "global_step": 294065, "epoch": 1750} {"train_loss": -12.053544998168945, "global_step": 294066, "epoch": 1750} {"train_loss": -11.963024139404297, "global_step": 294067, "epoch": 1750} {"train_loss": -12.205665588378906, "global_step": 294068, "epoch": 1750} {"train_loss": -12.237582206726074, "global_step": 294069, "epoch": 1750} {"train_loss": -12.141059875488281, "global_step": 294070, "epoch": 1750} {"train_loss": -12.169172286987305, "global_step": 294071, "epoch": 1750} {"train_loss": -12.264677047729492, "global_step": 294072, "epoch": 1750} {"train_loss": -12.092668533325195, "global_step": 294073, "epoch": 1750} {"train_loss": -12.330924987792969, "global_step": 294074, "epoch": 1750} {"train_loss": -12.10515022277832, "global_step": 294075, "epoch": 1750} {"train_loss": -12.390233993530273, "global_step": 294076, "epoch": 1750} {"train_loss": -12.110321044921875, "global_step": 294077, "epoch": 1750} {"train_loss": -11.988187789916992, "global_step": 294078, "epoch": 1750} {"train_loss": -12.24464225769043, "global_step": 294079, "epoch": 1750} {"train_loss": -12.417670249938965, "global_step": 294080, "epoch": 1750} {"train_loss": -12.219894409179688, "global_step": 294081, "epoch": 1750} {"train_loss": -12.138622283935547, "global_step": 294082, "epoch": 1750} {"train_loss": -12.244194030761719, "global_step": 294083, "epoch": 1750} {"train_loss": -12.084404945373535, "global_step": 294084, "epoch": 1750} {"train_loss": -12.258484840393066, "global_step": 294085, "epoch": 1750} {"train_loss": -12.161640167236328, "global_step": 294086, "epoch": 1750} {"train_loss": -12.21362018585205, "global_step": 294087, "epoch": 1750} {"train_loss": -12.285884857177734, "global_step": 294088, "epoch": 1750} {"train_loss": -12.192648887634277, "global_step": 294089, "epoch": 1750} {"train_loss": -12.362686157226562, "global_step": 294090, "epoch": 1750} {"train_loss": -12.128369331359863, "global_step": 294091, "epoch": 1750} {"train_loss": -12.306636810302734, "global_step": 294092, "epoch": 1750} {"train_loss": -12.288585662841797, "global_step": 294093, "epoch": 1750} {"train_loss": -12.405163764953613, "global_step": 294094, "epoch": 1750} {"train_loss": -12.405399322509766, "global_step": 294095, "epoch": 1750} {"train_loss": -12.266876220703125, "global_step": 294096, "epoch": 1750} {"train_loss": -12.285360336303711, "global_step": 294097, "epoch": 1750} {"train_loss": -12.492025375366211, "global_step": 294098, "epoch": 1750} {"train_loss": -12.346217155456543, "global_step": 294099, "epoch": 1750} {"train_loss": -12.252006530761719, "global_step": 294100, "epoch": 1750} {"train_loss": -12.153458595275879, "global_step": 294101, "epoch": 1750} {"train_loss": -12.37629222869873, "global_step": 294102, "epoch": 1750} {"train_loss": -12.078287124633789, "global_step": 294103, "epoch": 1750} {"train_loss": -12.276535034179688, "global_step": 294104, "epoch": 1750} {"train_loss": -12.177900314331055, "global_step": 294105, "epoch": 1750} {"train_loss": -12.328086853027344, "global_step": 294106, "epoch": 1750} {"train_loss": -12.277166366577148, "global_step": 294107, "epoch": 1750} {"train_loss": -12.002812385559082, "global_step": 294108, "epoch": 1750} {"train_loss": -12.111549377441406, "global_step": 294109, "epoch": 1750} {"train_loss": -12.290213584899902, "global_step": 294110, "epoch": 1750} {"train_loss": -12.370820999145508, "global_step": 294111, "epoch": 1750} {"train_loss": -12.120874404907227, "global_step": 294112, "epoch": 1750} {"train_loss": -11.844030380249023, "global_step": 294113, "epoch": 1750} {"train_loss": -11.124890327453613, "global_step": 294114, "epoch": 1750} {"train_loss": -12.086954116821289, "global_step": 294115, "epoch": 1750} {"train_loss": -11.57126235961914, "global_step": 294116, "epoch": 1750} {"train_loss": -11.145491600036621, "global_step": 294117, "epoch": 1750} {"train_loss": -11.33864688873291, "global_step": 294118, "epoch": 1750} {"train_loss": -11.657405853271484, "global_step": 294119, "epoch": 1750} {"train_loss": -10.706315994262695, "global_step": 294120, "epoch": 1750} {"train_loss": -10.73482894897461, "global_step": 294121, "epoch": 1750} {"train_loss": -10.804296493530273, "global_step": 294122, "epoch": 1750} {"train_loss": -9.672624588012695, "global_step": 294123, "epoch": 1750} {"train_loss": -9.297567367553711, "global_step": 294124, "epoch": 1750} {"train_loss": -10.770756721496582, "global_step": 294125, "epoch": 1750} {"train_loss": -9.45832633972168, "global_step": 294126, "epoch": 1750} {"train_loss": -10.402206420898438, "global_step": 294127, "epoch": 1750} {"train_loss": -9.548323631286621, "global_step": 294128, "epoch": 1750} {"train_loss": -11.213415145874023, "global_step": 294129, "epoch": 1750} {"train_loss": -9.938464164733887, "global_step": 294130, "epoch": 1750} {"train_loss": -10.970235824584961, "global_step": 294131, "epoch": 1750} {"train_loss": -10.464345932006836, "global_step": 294132, "epoch": 1750} {"train_loss": -10.926151275634766, "global_step": 294133, "epoch": 1750} {"train_loss": -11.492328643798828, "global_step": 294134, "epoch": 1750} {"train_loss": -10.688918113708496, "global_step": 294135, "epoch": 1750} {"train_loss": -11.656447410583496, "global_step": 294136, "epoch": 1750} {"train_loss": -10.256929397583008, "global_step": 294137, "epoch": 1750} {"train_loss": -11.828933715820312, "global_step": 294138, "epoch": 1750} {"train_loss": -11.05955982208252, "global_step": 294139, "epoch": 1750} {"train_loss": -11.431294441223145, "global_step": 294140, "epoch": 1750} {"train_loss": -10.898740768432617, "global_step": 294141, "epoch": 1750} {"train_loss": -11.688713073730469, "global_step": 294142, "epoch": 1750} {"train_loss": -11.642967224121094, "global_step": 294143, "epoch": 1750} {"train_loss": -11.238798141479492, "global_step": 294144, "epoch": 1750} {"train_loss": -11.743846893310547, "global_step": 294145, "epoch": 1750} {"train_loss": -11.773016929626465, "global_step": 294146, "epoch": 1750} {"train_loss": -11.715972900390625, "global_step": 294147, "epoch": 1750} {"train_loss": -11.749587059020996, "global_step": 294148, "epoch": 1750} {"train_loss": -11.707536697387695, "global_step": 294149, "epoch": 1750} {"train_loss": -11.70421028137207, "global_step": 294150, "epoch": 1750} {"train_loss": -11.872063636779785, "global_step": 294151, "epoch": 1750} {"train_loss": -11.804988861083984, "global_step": 294152, "epoch": 1750} {"train_loss": -11.981388092041016, "global_step": 294153, "epoch": 1750} {"train_loss": -11.800949096679688, "global_step": 294154, "epoch": 1750} {"train_loss": -11.848217010498047, "global_step": 294155, "epoch": 1750} {"train_loss": -12.097923278808594, "global_step": 294156, "epoch": 1750} {"train_loss": -11.72679615020752, "global_step": 294157, "epoch": 1750} {"train_loss": -12.217767715454102, "global_step": 294158, "epoch": 1750} {"train_loss": -11.885150909423828, "global_step": 294159, "epoch": 1750} {"train_loss": -11.870237350463867, "global_step": 294160, "epoch": 1750} {"train_loss": -11.70377254486084, "global_step": 294161, "epoch": 1750} {"train_loss": -11.950407028198242, "global_step": 294162, "epoch": 1750} {"train_loss": -11.766719818115234, "global_step": 294163, "epoch": 1750} {"train_loss": -11.633369445800781, "global_step": 294164, "epoch": 1750} {"train_loss": -11.75614070892334, "global_step": 294165, "epoch": 1750} {"train_loss": -11.282573699951172, "global_step": 294166, "epoch": 1750} {"train_loss": -11.475127146357583, "global_step": 294167, "epoch": 1750, "train/sim_max_reward_0": 0.5219651096546657, "train/sim_max_reward_1": 0.9274592147350219, "train/sim_max_reward_2": 0.008617882511292183, "train/sim_max_reward_3": 0.9991670935219824, "train/sim_max_reward_4": 0.9967135911955936, "train/sim_max_reward_5": 0.9356570159541737, "test/sim_max_reward_4400000": 0.9123097008356058, "test/sim_max_reward_4400001": 0.3749614513388594, "test/sim_max_reward_4400002": 0.15284285717614643, "test/sim_max_reward_4400003": 0.001507481594727359, "test/sim_max_reward_4400004": 0.6398962329489004, "test/sim_max_reward_4400005": 0.9351177849624925, "test/sim_max_reward_4400006": 0.6760018062862775, "test/sim_max_reward_4400007": 0.5689756882637457, "test/sim_max_reward_4400008": 0.6604552475668369, "test/sim_max_reward_4400009": 0.027674051460205205, "test/sim_max_reward_4400010": 0.9954411877032137, "test/sim_max_reward_4400011": 0.9866779776207542, "test/sim_max_reward_4400012": 0.9975021442743972, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.591758117393621, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 0.9905865374745405, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.681533135335832, "test/sim_max_reward_4400022": 0.9493706949310725, "test/sim_max_reward_4400023": 0.19639037722856018, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6106832317568183, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.6778755369092625, "test/sim_max_reward_4400028": 0.7119484800109713, "test/sim_max_reward_4400029": 1.0, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.9507329229821243, "test/sim_max_reward_4400033": 0.6590741617472977, "test/sim_max_reward_4400034": 0.4784358067140684, "test/sim_max_reward_4400035": 0.9768974329034257, "test/sim_max_reward_4400036": 0.37476596307033877, "test/sim_max_reward_4400037": 0.9836870343362322, "test/sim_max_reward_4400038": 0.2900610367317126, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.16590677504843962, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.34845389663514137, "test/sim_max_reward_4400044": 0.9629667206224475, "test/sim_max_reward_4400045": 0.3932296013236084, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 0.9761122774257558, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.7315966512621216, "test/mean_score": 0.5681936847536562, "val_loss": 280996.15625, "train_action_mse_error": 5.050374507904053} {"train_loss": -12.03068733215332, "global_step": 294168, "epoch": 1751} {"train_loss": -11.993871688842773, "global_step": 294169, "epoch": 1751} {"train_loss": -11.901968002319336, "global_step": 294170, "epoch": 1751} {"train_loss": -12.143263816833496, "global_step": 294171, "epoch": 1751} {"train_loss": -12.209266662597656, "global_step": 294172, "epoch": 1751} {"train_loss": -11.877699851989746, "global_step": 294173, "epoch": 1751} {"train_loss": -11.946725845336914, "global_step": 294174, "epoch": 1751} {"train_loss": -12.167080879211426, "global_step": 294175, "epoch": 1751} {"train_loss": -12.146907806396484, "global_step": 294176, "epoch": 1751} {"train_loss": -12.14518928527832, "global_step": 294177, "epoch": 1751} {"train_loss": -11.881071090698242, "global_step": 294178, "epoch": 1751} {"train_loss": -12.052827835083008, "global_step": 294179, "epoch": 1751} {"train_loss": -12.01327133178711, "global_step": 294180, "epoch": 1751} {"train_loss": -12.001598358154297, "global_step": 294181, "epoch": 1751} {"train_loss": -11.959169387817383, "global_step": 294182, "epoch": 1751} {"train_loss": -11.972557067871094, "global_step": 294183, "epoch": 1751} {"train_loss": -12.241050720214844, "global_step": 294184, "epoch": 1751} {"train_loss": -11.573005676269531, "global_step": 294185, "epoch": 1751} {"train_loss": -11.775651931762695, "global_step": 294186, "epoch": 1751} {"train_loss": -12.070219039916992, "global_step": 294187, "epoch": 1751} {"train_loss": -11.816879272460938, "global_step": 294188, "epoch": 1751} {"train_loss": -12.277336120605469, "global_step": 294189, "epoch": 1751} {"train_loss": -11.584671020507812, "global_step": 294190, "epoch": 1751} {"train_loss": -11.77927017211914, "global_step": 294191, "epoch": 1751} {"train_loss": -12.082377433776855, "global_step": 294192, "epoch": 1751} {"train_loss": -11.726932525634766, "global_step": 294193, "epoch": 1751} {"train_loss": -11.805652618408203, "global_step": 294194, "epoch": 1751} {"train_loss": -11.842084884643555, "global_step": 294195, "epoch": 1751} {"train_loss": -11.867433547973633, "global_step": 294196, "epoch": 1751} {"train_loss": -12.045409202575684, "global_step": 294197, "epoch": 1751} {"train_loss": -11.889689445495605, "global_step": 294198, "epoch": 1751} {"train_loss": -11.893546104431152, "global_step": 294199, "epoch": 1751} {"train_loss": -12.234166145324707, "global_step": 294200, "epoch": 1751} {"train_loss": -11.912555694580078, "global_step": 294201, "epoch": 1751} {"train_loss": -12.092275619506836, "global_step": 294202, "epoch": 1751} {"train_loss": -12.002994537353516, "global_step": 294203, "epoch": 1751} {"train_loss": -11.66364574432373, "global_step": 294204, "epoch": 1751} {"train_loss": -11.854228973388672, "global_step": 294205, "epoch": 1751} {"train_loss": -12.039600372314453, "global_step": 294206, "epoch": 1751} {"train_loss": -12.126543045043945, "global_step": 294207, "epoch": 1751} {"train_loss": -12.056130409240723, "global_step": 294208, "epoch": 1751} {"train_loss": -11.79359245300293, "global_step": 294209, "epoch": 1751} {"train_loss": -12.137351989746094, "global_step": 294210, "epoch": 1751} {"train_loss": -12.264904022216797, "global_step": 294211, "epoch": 1751} {"train_loss": -12.072920799255371, "global_step": 294212, "epoch": 1751} {"train_loss": -12.27865982055664, "global_step": 294213, "epoch": 1751} {"train_loss": -12.332437515258789, "global_step": 294214, "epoch": 1751} {"train_loss": -12.341775894165039, "global_step": 294215, "epoch": 1751} {"train_loss": -12.299181938171387, "global_step": 294216, "epoch": 1751} {"train_loss": -12.181811332702637, "global_step": 294217, "epoch": 1751} {"train_loss": -12.225626945495605, "global_step": 294218, "epoch": 1751} {"train_loss": -12.07736587524414, "global_step": 294219, "epoch": 1751} {"train_loss": -12.250692367553711, "global_step": 294220, "epoch": 1751} {"train_loss": -11.962068557739258, "global_step": 294221, "epoch": 1751} {"train_loss": -12.278026580810547, "global_step": 294222, "epoch": 1751} {"train_loss": -12.133434295654297, "global_step": 294223, "epoch": 1751} {"train_loss": -11.947136878967285, "global_step": 294224, "epoch": 1751} {"train_loss": -12.095443725585938, "global_step": 294225, "epoch": 1751} {"train_loss": -12.381720542907715, "global_step": 294226, "epoch": 1751} {"train_loss": -12.46030330657959, "global_step": 294227, "epoch": 1751} {"train_loss": -12.288812637329102, "global_step": 294228, "epoch": 1751} {"train_loss": -12.048986434936523, "global_step": 294229, "epoch": 1751} {"train_loss": -12.209492683410645, "global_step": 294230, "epoch": 1751} {"train_loss": -11.926643371582031, "global_step": 294231, "epoch": 1751} {"train_loss": -12.411861419677734, "global_step": 294232, "epoch": 1751} {"train_loss": -11.975521087646484, "global_step": 294233, "epoch": 1751} {"train_loss": -12.001581192016602, "global_step": 294234, "epoch": 1751} {"train_loss": -12.064347267150879, "global_step": 294235, "epoch": 1751} {"train_loss": -11.802885055541992, "global_step": 294236, "epoch": 1751} {"train_loss": -11.740104675292969, "global_step": 294237, "epoch": 1751} {"train_loss": -12.160558700561523, "global_step": 294238, "epoch": 1751} {"train_loss": -11.991751670837402, "global_step": 294239, "epoch": 1751} {"train_loss": -11.83491325378418, "global_step": 294240, "epoch": 1751} {"train_loss": -12.125885009765625, "global_step": 294241, "epoch": 1751} {"train_loss": -11.859762191772461, "global_step": 294242, "epoch": 1751} {"train_loss": -11.898442268371582, "global_step": 294243, "epoch": 1751} {"train_loss": -12.367889404296875, "global_step": 294244, "epoch": 1751} {"train_loss": -12.270736694335938, "global_step": 294245, "epoch": 1751} {"train_loss": -11.923571586608887, "global_step": 294246, "epoch": 1751} {"train_loss": -12.278420448303223, "global_step": 294247, "epoch": 1751} {"train_loss": -11.876368522644043, "global_step": 294248, "epoch": 1751} {"train_loss": -11.01280689239502, "global_step": 294249, "epoch": 1751} {"train_loss": -11.932685852050781, "global_step": 294250, "epoch": 1751} {"train_loss": -11.599611282348633, "global_step": 294251, "epoch": 1751} {"train_loss": -10.036890029907227, "global_step": 294252, "epoch": 1751} {"train_loss": -10.432376861572266, "global_step": 294253, "epoch": 1751} {"train_loss": -11.390449523925781, "global_step": 294254, "epoch": 1751} {"train_loss": -10.701607704162598, "global_step": 294255, "epoch": 1751} {"train_loss": -10.827336311340332, "global_step": 294256, "epoch": 1751} {"train_loss": -9.736412048339844, "global_step": 294257, "epoch": 1751} {"train_loss": -10.897093772888184, "global_step": 294258, "epoch": 1751} {"train_loss": -11.059759140014648, "global_step": 294259, "epoch": 1751} {"train_loss": -9.899209022521973, "global_step": 294260, "epoch": 1751} {"train_loss": -9.573995590209961, "global_step": 294261, "epoch": 1751} {"train_loss": -10.434943199157715, "global_step": 294262, "epoch": 1751} {"train_loss": -11.039257049560547, "global_step": 294263, "epoch": 1751} {"train_loss": -10.032571792602539, "global_step": 294264, "epoch": 1751} {"train_loss": -11.165891647338867, "global_step": 294265, "epoch": 1751} {"train_loss": -10.529460906982422, "global_step": 294266, "epoch": 1751} {"train_loss": -9.827722549438477, "global_step": 294267, "epoch": 1751} {"train_loss": -11.433963775634766, "global_step": 294268, "epoch": 1751} {"train_loss": -10.069226264953613, "global_step": 294269, "epoch": 1751} {"train_loss": -10.450789451599121, "global_step": 294270, "epoch": 1751} {"train_loss": -11.164772033691406, "global_step": 294271, "epoch": 1751} {"train_loss": -10.515981674194336, "global_step": 294272, "epoch": 1751} {"train_loss": -11.069267272949219, "global_step": 294273, "epoch": 1751} {"train_loss": -10.483970642089844, "global_step": 294274, "epoch": 1751} {"train_loss": -11.325620651245117, "global_step": 294275, "epoch": 1751} {"train_loss": -9.961960792541504, "global_step": 294276, "epoch": 1751} {"train_loss": -11.455851554870605, "global_step": 294277, "epoch": 1751} {"train_loss": -10.589113235473633, "global_step": 294278, "epoch": 1751} {"train_loss": -10.988840103149414, "global_step": 294279, "epoch": 1751} {"train_loss": -10.623392105102539, "global_step": 294280, "epoch": 1751} {"train_loss": -10.604423522949219, "global_step": 294281, "epoch": 1751} {"train_loss": -11.347591400146484, "global_step": 294282, "epoch": 1751} {"train_loss": -10.879663467407227, "global_step": 294283, "epoch": 1751} {"train_loss": -11.275875091552734, "global_step": 294284, "epoch": 1751} {"train_loss": -11.540487289428711, "global_step": 294285, "epoch": 1751} {"train_loss": -11.471290588378906, "global_step": 294286, "epoch": 1751} {"train_loss": -11.408472061157227, "global_step": 294287, "epoch": 1751} {"train_loss": -11.585611343383789, "global_step": 294288, "epoch": 1751} {"train_loss": -11.518994331359863, "global_step": 294289, "epoch": 1751} {"train_loss": -11.732306480407715, "global_step": 294290, "epoch": 1751} {"train_loss": -11.716609954833984, "global_step": 294291, "epoch": 1751} {"train_loss": -11.840291023254395, "global_step": 294292, "epoch": 1751} {"train_loss": -11.905959129333496, "global_step": 294293, "epoch": 1751} {"train_loss": -11.607349395751953, "global_step": 294294, "epoch": 1751} {"train_loss": -11.839853286743164, "global_step": 294295, "epoch": 1751} {"train_loss": -12.001777648925781, "global_step": 294296, "epoch": 1751} {"train_loss": -11.5880126953125, "global_step": 294297, "epoch": 1751} {"train_loss": -11.591707229614258, "global_step": 294298, "epoch": 1751} {"train_loss": -11.92538070678711, "global_step": 294299, "epoch": 1751} {"train_loss": -11.746028900146484, "global_step": 294300, "epoch": 1751} {"train_loss": -12.070917129516602, "global_step": 294301, "epoch": 1751} {"train_loss": -11.9002685546875, "global_step": 294302, "epoch": 1751} {"train_loss": -12.106203079223633, "global_step": 294303, "epoch": 1751} {"train_loss": -11.879501342773438, "global_step": 294304, "epoch": 1751} {"train_loss": -12.024391174316406, "global_step": 294305, "epoch": 1751} {"train_loss": -11.943575859069824, "global_step": 294306, "epoch": 1751} {"train_loss": -11.988433837890625, "global_step": 294307, "epoch": 1751} {"train_loss": -12.133137702941895, "global_step": 294308, "epoch": 1751} {"train_loss": -12.083885192871094, "global_step": 294309, "epoch": 1751} {"train_loss": -12.068875312805176, "global_step": 294310, "epoch": 1751} {"train_loss": -11.87485122680664, "global_step": 294311, "epoch": 1751} {"train_loss": -12.005069732666016, "global_step": 294312, "epoch": 1751} {"train_loss": -11.999445915222168, "global_step": 294313, "epoch": 1751} {"train_loss": -12.044390678405762, "global_step": 294314, "epoch": 1751} {"train_loss": -12.137445449829102, "global_step": 294315, "epoch": 1751} {"train_loss": -12.10196590423584, "global_step": 294316, "epoch": 1751} {"train_loss": -12.079113006591797, "global_step": 294317, "epoch": 1751} {"train_loss": -11.939053535461426, "global_step": 294318, "epoch": 1751} {"train_loss": -12.049983978271484, "global_step": 294319, "epoch": 1751} {"train_loss": -11.993000984191895, "global_step": 294320, "epoch": 1751} {"train_loss": -12.258834838867188, "global_step": 294321, "epoch": 1751} {"train_loss": -12.004035949707031, "global_step": 294322, "epoch": 1751} {"train_loss": -12.255271911621094, "global_step": 294323, "epoch": 1751} {"train_loss": -12.11129093170166, "global_step": 294324, "epoch": 1751} {"train_loss": -12.308755874633789, "global_step": 294325, "epoch": 1751} {"train_loss": -12.269397735595703, "global_step": 294326, "epoch": 1751} {"train_loss": -12.116194725036621, "global_step": 294327, "epoch": 1751} {"train_loss": -12.100239753723145, "global_step": 294328, "epoch": 1751} {"train_loss": -12.08405876159668, "global_step": 294329, "epoch": 1751} {"train_loss": -12.117477416992188, "global_step": 294330, "epoch": 1751} {"train_loss": -11.524112701416016, "global_step": 294331, "epoch": 1751} {"train_loss": -12.166671752929688, "global_step": 294332, "epoch": 1751} {"train_loss": -11.744363784790039, "global_step": 294333, "epoch": 1751} {"train_loss": -12.174055099487305, "global_step": 294334, "epoch": 1751} {"train_loss": -11.726780045600165, "global_step": 294335, "epoch": 1751, "val_loss": 277465.3125} {"train_loss": -12.182851791381836, "global_step": 294336, "epoch": 1752} {"train_loss": -11.675596237182617, "global_step": 294337, "epoch": 1752} {"train_loss": -12.114517211914062, "global_step": 294338, "epoch": 1752} {"train_loss": -11.885441780090332, "global_step": 294339, "epoch": 1752} {"train_loss": -12.149764060974121, "global_step": 294340, "epoch": 1752} {"train_loss": -12.089020729064941, "global_step": 294341, "epoch": 1752} {"train_loss": -11.864288330078125, "global_step": 294342, "epoch": 1752} {"train_loss": -12.34039306640625, "global_step": 294343, "epoch": 1752} {"train_loss": -12.037552833557129, "global_step": 294344, "epoch": 1752} {"train_loss": -11.931696891784668, "global_step": 294345, "epoch": 1752} {"train_loss": -11.85659408569336, "global_step": 294346, "epoch": 1752} {"train_loss": -12.100553512573242, "global_step": 294347, "epoch": 1752} {"train_loss": -12.189753532409668, "global_step": 294348, "epoch": 1752} {"train_loss": -11.853654861450195, "global_step": 294349, "epoch": 1752} {"train_loss": -11.995278358459473, "global_step": 294350, "epoch": 1752} {"train_loss": -12.229500770568848, "global_step": 294351, "epoch": 1752} {"train_loss": -11.932795524597168, "global_step": 294352, "epoch": 1752} {"train_loss": -11.580877304077148, "global_step": 294353, "epoch": 1752} {"train_loss": -12.34663200378418, "global_step": 294354, "epoch": 1752} {"train_loss": -11.351669311523438, "global_step": 294355, "epoch": 1752} {"train_loss": -10.712392807006836, "global_step": 294356, "epoch": 1752} {"train_loss": -11.701746940612793, "global_step": 294357, "epoch": 1752} {"train_loss": -11.978296279907227, "global_step": 294358, "epoch": 1752} {"train_loss": -11.247575759887695, "global_step": 294359, "epoch": 1752} {"train_loss": -11.361513137817383, "global_step": 294360, "epoch": 1752} {"train_loss": -11.395804405212402, "global_step": 294361, "epoch": 1752} {"train_loss": -11.168394088745117, "global_step": 294362, "epoch": 1752} {"train_loss": -10.933982849121094, "global_step": 294363, "epoch": 1752} {"train_loss": -12.04905891418457, "global_step": 294364, "epoch": 1752} {"train_loss": -11.924489974975586, "global_step": 294365, "epoch": 1752} {"train_loss": -11.276595115661621, "global_step": 294366, "epoch": 1752} {"train_loss": -12.091039657592773, "global_step": 294367, "epoch": 1752} {"train_loss": -11.735483169555664, "global_step": 294368, "epoch": 1752} {"train_loss": -11.546466827392578, "global_step": 294369, "epoch": 1752} {"train_loss": -11.491865158081055, "global_step": 294370, "epoch": 1752} {"train_loss": -11.889490127563477, "global_step": 294371, "epoch": 1752} {"train_loss": -11.33069133758545, "global_step": 294372, "epoch": 1752} {"train_loss": -11.777456283569336, "global_step": 294373, "epoch": 1752} {"train_loss": -11.269047737121582, "global_step": 294374, "epoch": 1752} {"train_loss": -11.449738502502441, "global_step": 294375, "epoch": 1752} {"train_loss": -11.500951766967773, "global_step": 294376, "epoch": 1752} {"train_loss": -11.144132614135742, "global_step": 294377, "epoch": 1752} {"train_loss": -11.55544662475586, "global_step": 294378, "epoch": 1752} {"train_loss": -10.674593925476074, "global_step": 294379, "epoch": 1752} {"train_loss": -11.179378509521484, "global_step": 294380, "epoch": 1752} {"train_loss": -11.47217845916748, "global_step": 294381, "epoch": 1752} {"train_loss": -10.830657005310059, "global_step": 294382, "epoch": 1752} {"train_loss": -11.653501510620117, "global_step": 294383, "epoch": 1752} {"train_loss": -11.021129608154297, "global_step": 294384, "epoch": 1752} {"train_loss": -11.944561004638672, "global_step": 294385, "epoch": 1752} {"train_loss": -11.024877548217773, "global_step": 294386, "epoch": 1752} {"train_loss": -11.667644500732422, "global_step": 294387, "epoch": 1752} {"train_loss": -11.399652481079102, "global_step": 294388, "epoch": 1752} {"train_loss": -11.489760398864746, "global_step": 294389, "epoch": 1752} {"train_loss": -11.579501152038574, "global_step": 294390, "epoch": 1752} {"train_loss": -11.836219787597656, "global_step": 294391, "epoch": 1752} {"train_loss": -11.654952049255371, "global_step": 294392, "epoch": 1752} {"train_loss": -11.926889419555664, "global_step": 294393, "epoch": 1752} {"train_loss": -11.738973617553711, "global_step": 294394, "epoch": 1752} {"train_loss": -11.798069953918457, "global_step": 294395, "epoch": 1752} {"train_loss": -12.155130386352539, "global_step": 294396, "epoch": 1752} {"train_loss": -11.562729835510254, "global_step": 294397, "epoch": 1752} {"train_loss": -11.943927764892578, "global_step": 294398, "epoch": 1752} {"train_loss": -11.785676956176758, "global_step": 294399, "epoch": 1752} {"train_loss": -12.259514808654785, "global_step": 294400, "epoch": 1752} {"train_loss": -11.967055320739746, "global_step": 294401, "epoch": 1752} {"train_loss": -12.064620971679688, "global_step": 294402, "epoch": 1752} {"train_loss": -12.051713943481445, "global_step": 294403, "epoch": 1752} {"train_loss": -11.926741600036621, "global_step": 294404, "epoch": 1752} {"train_loss": -11.993659019470215, "global_step": 294405, "epoch": 1752} {"train_loss": -11.913223266601562, "global_step": 294406, "epoch": 1752} {"train_loss": -12.264151573181152, "global_step": 294407, "epoch": 1752} {"train_loss": -11.803422927856445, "global_step": 294408, "epoch": 1752} {"train_loss": -12.04013729095459, "global_step": 294409, "epoch": 1752} {"train_loss": -12.022369384765625, "global_step": 294410, "epoch": 1752} {"train_loss": -12.008062362670898, "global_step": 294411, "epoch": 1752} {"train_loss": -12.084108352661133, "global_step": 294412, "epoch": 1752} {"train_loss": -12.174705505371094, "global_step": 294413, "epoch": 1752} {"train_loss": -12.315558433532715, "global_step": 294414, "epoch": 1752} {"train_loss": -12.120895385742188, "global_step": 294415, "epoch": 1752} {"train_loss": -12.128753662109375, "global_step": 294416, "epoch": 1752} {"train_loss": -12.249622344970703, "global_step": 294417, "epoch": 1752} {"train_loss": -12.262487411499023, "global_step": 294418, "epoch": 1752} {"train_loss": -12.381433486938477, "global_step": 294419, "epoch": 1752} {"train_loss": -12.19703483581543, "global_step": 294420, "epoch": 1752} {"train_loss": -12.112424850463867, "global_step": 294421, "epoch": 1752} {"train_loss": -12.27673625946045, "global_step": 294422, "epoch": 1752} {"train_loss": -12.380376815795898, "global_step": 294423, "epoch": 1752} {"train_loss": -12.024173736572266, "global_step": 294424, "epoch": 1752} {"train_loss": -12.248226165771484, "global_step": 294425, "epoch": 1752} {"train_loss": -11.594289779663086, "global_step": 294426, "epoch": 1752} {"train_loss": -12.352272033691406, "global_step": 294427, "epoch": 1752} {"train_loss": -11.758880615234375, "global_step": 294428, "epoch": 1752} {"train_loss": -11.169891357421875, "global_step": 294429, "epoch": 1752} {"train_loss": -11.939188003540039, "global_step": 294430, "epoch": 1752} {"train_loss": -12.301782608032227, "global_step": 294431, "epoch": 1752} {"train_loss": -11.958402633666992, "global_step": 294432, "epoch": 1752} {"train_loss": -12.077716827392578, "global_step": 294433, "epoch": 1752} {"train_loss": -11.973382949829102, "global_step": 294434, "epoch": 1752} {"train_loss": -11.855001449584961, "global_step": 294435, "epoch": 1752} {"train_loss": -11.83941650390625, "global_step": 294436, "epoch": 1752} {"train_loss": -12.454516410827637, "global_step": 294437, "epoch": 1752} {"train_loss": -11.910584449768066, "global_step": 294438, "epoch": 1752} {"train_loss": -11.859664916992188, "global_step": 294439, "epoch": 1752} {"train_loss": -12.310589790344238, "global_step": 294440, "epoch": 1752} {"train_loss": -12.023519515991211, "global_step": 294441, "epoch": 1752} {"train_loss": -12.335264205932617, "global_step": 294442, "epoch": 1752} {"train_loss": -12.20176887512207, "global_step": 294443, "epoch": 1752} {"train_loss": -12.359858512878418, "global_step": 294444, "epoch": 1752} {"train_loss": -12.317821502685547, "global_step": 294445, "epoch": 1752} {"train_loss": -12.185375213623047, "global_step": 294446, "epoch": 1752} {"train_loss": -12.218799591064453, "global_step": 294447, "epoch": 1752} {"train_loss": -12.575042724609375, "global_step": 294448, "epoch": 1752} {"train_loss": -12.274150848388672, "global_step": 294449, "epoch": 1752} {"train_loss": -12.337005615234375, "global_step": 294450, "epoch": 1752} {"train_loss": -12.420951843261719, "global_step": 294451, "epoch": 1752} {"train_loss": -12.198070526123047, "global_step": 294452, "epoch": 1752} {"train_loss": -12.033304214477539, "global_step": 294453, "epoch": 1752} {"train_loss": -12.313368797302246, "global_step": 294454, "epoch": 1752} {"train_loss": -12.04011344909668, "global_step": 294455, "epoch": 1752} {"train_loss": -11.873446464538574, "global_step": 294456, "epoch": 1752} {"train_loss": -12.319892883300781, "global_step": 294457, "epoch": 1752} {"train_loss": -12.140241622924805, "global_step": 294458, "epoch": 1752} {"train_loss": -12.56762981414795, "global_step": 294459, "epoch": 1752} {"train_loss": -12.292625427246094, "global_step": 294460, "epoch": 1752} {"train_loss": -12.131179809570312, "global_step": 294461, "epoch": 1752} {"train_loss": -12.136005401611328, "global_step": 294462, "epoch": 1752} {"train_loss": -12.373162269592285, "global_step": 294463, "epoch": 1752} {"train_loss": -12.034318923950195, "global_step": 294464, "epoch": 1752} {"train_loss": -11.974030494689941, "global_step": 294465, "epoch": 1752} {"train_loss": -12.228963851928711, "global_step": 294466, "epoch": 1752} {"train_loss": -12.512458801269531, "global_step": 294467, "epoch": 1752} {"train_loss": -12.100942611694336, "global_step": 294468, "epoch": 1752} {"train_loss": -12.438133239746094, "global_step": 294469, "epoch": 1752} {"train_loss": -11.823204040527344, "global_step": 294470, "epoch": 1752} {"train_loss": -11.407878875732422, "global_step": 294471, "epoch": 1752} {"train_loss": -11.43824577331543, "global_step": 294472, "epoch": 1752} {"train_loss": -11.894455909729004, "global_step": 294473, "epoch": 1752} {"train_loss": -11.833013534545898, "global_step": 294474, "epoch": 1752} {"train_loss": -11.489704132080078, "global_step": 294475, "epoch": 1752} {"train_loss": -12.215442657470703, "global_step": 294476, "epoch": 1752} {"train_loss": -11.88045883178711, "global_step": 294477, "epoch": 1752} {"train_loss": -12.000933647155762, "global_step": 294478, "epoch": 1752} {"train_loss": -12.035440444946289, "global_step": 294479, "epoch": 1752} {"train_loss": -11.788566589355469, "global_step": 294480, "epoch": 1752} {"train_loss": -10.589369773864746, "global_step": 294481, "epoch": 1752} {"train_loss": -12.083555221557617, "global_step": 294482, "epoch": 1752} {"train_loss": -10.755453109741211, "global_step": 294483, "epoch": 1752} {"train_loss": -10.330649375915527, "global_step": 294484, "epoch": 1752} {"train_loss": -11.77292537689209, "global_step": 294485, "epoch": 1752} {"train_loss": -10.623706817626953, "global_step": 294486, "epoch": 1752} {"train_loss": -11.689840316772461, "global_step": 294487, "epoch": 1752} {"train_loss": -11.827695846557617, "global_step": 294488, "epoch": 1752} {"train_loss": -11.137805938720703, "global_step": 294489, "epoch": 1752} {"train_loss": -11.978935241699219, "global_step": 294490, "epoch": 1752} {"train_loss": -11.711694717407227, "global_step": 294491, "epoch": 1752} {"train_loss": -11.00719928741455, "global_step": 294492, "epoch": 1752} {"train_loss": -11.408485412597656, "global_step": 294493, "epoch": 1752} {"train_loss": -11.976911544799805, "global_step": 294494, "epoch": 1752} {"train_loss": -11.753995895385742, "global_step": 294495, "epoch": 1752} {"train_loss": -11.821252822875977, "global_step": 294496, "epoch": 1752} {"train_loss": -11.37231731414795, "global_step": 294497, "epoch": 1752} {"train_loss": -11.964465141296387, "global_step": 294498, "epoch": 1752} {"train_loss": -12.205978393554688, "global_step": 294499, "epoch": 1752} {"train_loss": -11.923887252807617, "global_step": 294500, "epoch": 1752} {"train_loss": -12.205326080322266, "global_step": 294501, "epoch": 1752} {"train_loss": -11.984737396240234, "global_step": 294502, "epoch": 1752} {"train_loss": -11.857223612921578, "global_step": 294503, "epoch": 1752, "val_loss": 282042.40625} {"train_loss": -11.83528995513916, "global_step": 294504, "epoch": 1753} {"train_loss": -11.99874496459961, "global_step": 294505, "epoch": 1753} {"train_loss": -11.992280960083008, "global_step": 294506, "epoch": 1753} {"train_loss": -12.228567123413086, "global_step": 294507, "epoch": 1753} {"train_loss": -12.169412612915039, "global_step": 294508, "epoch": 1753} {"train_loss": -12.053909301757812, "global_step": 294509, "epoch": 1753} {"train_loss": -12.218819618225098, "global_step": 294510, "epoch": 1753} {"train_loss": -12.101917266845703, "global_step": 294511, "epoch": 1753} {"train_loss": -12.228832244873047, "global_step": 294512, "epoch": 1753} {"train_loss": -12.177164077758789, "global_step": 294513, "epoch": 1753} {"train_loss": -12.19759464263916, "global_step": 294514, "epoch": 1753} {"train_loss": -12.21237564086914, "global_step": 294515, "epoch": 1753} {"train_loss": -12.0494384765625, "global_step": 294516, "epoch": 1753} {"train_loss": -12.378811836242676, "global_step": 294517, "epoch": 1753} {"train_loss": -12.401754379272461, "global_step": 294518, "epoch": 1753} {"train_loss": -12.347850799560547, "global_step": 294519, "epoch": 1753} {"train_loss": -12.254659652709961, "global_step": 294520, "epoch": 1753} {"train_loss": -12.402786254882812, "global_step": 294521, "epoch": 1753} {"train_loss": -12.129142761230469, "global_step": 294522, "epoch": 1753} {"train_loss": -12.380001068115234, "global_step": 294523, "epoch": 1753} {"train_loss": -12.247791290283203, "global_step": 294524, "epoch": 1753} {"train_loss": -12.243087768554688, "global_step": 294525, "epoch": 1753} {"train_loss": -12.422447204589844, "global_step": 294526, "epoch": 1753} {"train_loss": -12.067219734191895, "global_step": 294527, "epoch": 1753} {"train_loss": -12.235798835754395, "global_step": 294528, "epoch": 1753} {"train_loss": -12.250317573547363, "global_step": 294529, "epoch": 1753} {"train_loss": -11.950041770935059, "global_step": 294530, "epoch": 1753} {"train_loss": -12.146042823791504, "global_step": 294531, "epoch": 1753} {"train_loss": -12.363401412963867, "global_step": 294532, "epoch": 1753} {"train_loss": -11.990281105041504, "global_step": 294533, "epoch": 1753} {"train_loss": -12.108747482299805, "global_step": 294534, "epoch": 1753} {"train_loss": -12.426246643066406, "global_step": 294535, "epoch": 1753} {"train_loss": -11.904693603515625, "global_step": 294536, "epoch": 1753} {"train_loss": -12.282539367675781, "global_step": 294537, "epoch": 1753} {"train_loss": -12.04106330871582, "global_step": 294538, "epoch": 1753} {"train_loss": -11.356852531433105, "global_step": 294539, "epoch": 1753} {"train_loss": -11.584857940673828, "global_step": 294540, "epoch": 1753} {"train_loss": -11.721940994262695, "global_step": 294541, "epoch": 1753} {"train_loss": -12.00209903717041, "global_step": 294542, "epoch": 1753} {"train_loss": -11.651538848876953, "global_step": 294543, "epoch": 1753} {"train_loss": -11.443142890930176, "global_step": 294544, "epoch": 1753} {"train_loss": -10.728180885314941, "global_step": 294545, "epoch": 1753} {"train_loss": -11.52967643737793, "global_step": 294546, "epoch": 1753} {"train_loss": -11.931402206420898, "global_step": 294547, "epoch": 1753} {"train_loss": -11.782543182373047, "global_step": 294548, "epoch": 1753} {"train_loss": -11.569316864013672, "global_step": 294549, "epoch": 1753} {"train_loss": -11.529867172241211, "global_step": 294550, "epoch": 1753} {"train_loss": -11.397640228271484, "global_step": 294551, "epoch": 1753} {"train_loss": -11.72465991973877, "global_step": 294552, "epoch": 1753} {"train_loss": -11.865334510803223, "global_step": 294553, "epoch": 1753} {"train_loss": -11.285791397094727, "global_step": 294554, "epoch": 1753} {"train_loss": -11.42599868774414, "global_step": 294555, "epoch": 1753} {"train_loss": -11.829593658447266, "global_step": 294556, "epoch": 1753} {"train_loss": -10.9400634765625, "global_step": 294557, "epoch": 1753} {"train_loss": -11.746970176696777, "global_step": 294558, "epoch": 1753} {"train_loss": -10.702254295349121, "global_step": 294559, "epoch": 1753} {"train_loss": -11.763267517089844, "global_step": 294560, "epoch": 1753} {"train_loss": -9.868258476257324, "global_step": 294561, "epoch": 1753} {"train_loss": -12.050128936767578, "global_step": 294562, "epoch": 1753} {"train_loss": -10.698294639587402, "global_step": 294563, "epoch": 1753} {"train_loss": -11.096027374267578, "global_step": 294564, "epoch": 1753} {"train_loss": -11.682788848876953, "global_step": 294565, "epoch": 1753} {"train_loss": -10.904370307922363, "global_step": 294566, "epoch": 1753} {"train_loss": -11.989862442016602, "global_step": 294567, "epoch": 1753} {"train_loss": -11.264902114868164, "global_step": 294568, "epoch": 1753} {"train_loss": -11.414217948913574, "global_step": 294569, "epoch": 1753} {"train_loss": -11.82705020904541, "global_step": 294570, "epoch": 1753} {"train_loss": -11.320629119873047, "global_step": 294571, "epoch": 1753} {"train_loss": -11.608423233032227, "global_step": 294572, "epoch": 1753} {"train_loss": -11.57032585144043, "global_step": 294573, "epoch": 1753} {"train_loss": -11.935586929321289, "global_step": 294574, "epoch": 1753} {"train_loss": -11.472179412841797, "global_step": 294575, "epoch": 1753} {"train_loss": -11.56336784362793, "global_step": 294576, "epoch": 1753} {"train_loss": -11.610154151916504, "global_step": 294577, "epoch": 1753} {"train_loss": -11.768959045410156, "global_step": 294578, "epoch": 1753} {"train_loss": -11.686439514160156, "global_step": 294579, "epoch": 1753} {"train_loss": -11.6647367477417, "global_step": 294580, "epoch": 1753} {"train_loss": -11.37162971496582, "global_step": 294581, "epoch": 1753} {"train_loss": -11.846222877502441, "global_step": 294582, "epoch": 1753} {"train_loss": -11.730636596679688, "global_step": 294583, "epoch": 1753} {"train_loss": -11.647292137145996, "global_step": 294584, "epoch": 1753} {"train_loss": -11.566069602966309, "global_step": 294585, "epoch": 1753} {"train_loss": -12.004671096801758, "global_step": 294586, "epoch": 1753} {"train_loss": -11.767635345458984, "global_step": 294587, "epoch": 1753} {"train_loss": -11.458137512207031, "global_step": 294588, "epoch": 1753} {"train_loss": -12.064535140991211, "global_step": 294589, "epoch": 1753} {"train_loss": -11.655474662780762, "global_step": 294590, "epoch": 1753} {"train_loss": -11.718729019165039, "global_step": 294591, "epoch": 1753} {"train_loss": -11.593765258789062, "global_step": 294592, "epoch": 1753} {"train_loss": -11.790042877197266, "global_step": 294593, "epoch": 1753} {"train_loss": -11.79261589050293, "global_step": 294594, "epoch": 1753} {"train_loss": -11.839591979980469, "global_step": 294595, "epoch": 1753} {"train_loss": -11.826284408569336, "global_step": 294596, "epoch": 1753} {"train_loss": -11.595069885253906, "global_step": 294597, "epoch": 1753} {"train_loss": -12.171342849731445, "global_step": 294598, "epoch": 1753} {"train_loss": -11.931209564208984, "global_step": 294599, "epoch": 1753} {"train_loss": -11.42223834991455, "global_step": 294600, "epoch": 1753} {"train_loss": -11.662681579589844, "global_step": 294601, "epoch": 1753} {"train_loss": -11.726417541503906, "global_step": 294602, "epoch": 1753} {"train_loss": -11.192453384399414, "global_step": 294603, "epoch": 1753} {"train_loss": -11.531852722167969, "global_step": 294604, "epoch": 1753} {"train_loss": -11.017560005187988, "global_step": 294605, "epoch": 1753} {"train_loss": -11.093040466308594, "global_step": 294606, "epoch": 1753} {"train_loss": -11.60660171508789, "global_step": 294607, "epoch": 1753} {"train_loss": -11.514404296875, "global_step": 294608, "epoch": 1753} {"train_loss": -11.658974647521973, "global_step": 294609, "epoch": 1753} {"train_loss": -11.777913093566895, "global_step": 294610, "epoch": 1753} {"train_loss": -11.931408882141113, "global_step": 294611, "epoch": 1753} {"train_loss": -11.811701774597168, "global_step": 294612, "epoch": 1753} {"train_loss": -11.748987197875977, "global_step": 294613, "epoch": 1753} {"train_loss": -11.792963981628418, "global_step": 294614, "epoch": 1753} {"train_loss": -11.513785362243652, "global_step": 294615, "epoch": 1753} {"train_loss": -11.993566513061523, "global_step": 294616, "epoch": 1753} {"train_loss": -12.030282020568848, "global_step": 294617, "epoch": 1753} {"train_loss": -12.118558883666992, "global_step": 294618, "epoch": 1753} {"train_loss": -11.97048568725586, "global_step": 294619, "epoch": 1753} {"train_loss": -11.972654342651367, "global_step": 294620, "epoch": 1753} {"train_loss": -12.184380531311035, "global_step": 294621, "epoch": 1753} {"train_loss": -11.942113876342773, "global_step": 294622, "epoch": 1753} {"train_loss": -11.994656562805176, "global_step": 294623, "epoch": 1753} {"train_loss": -12.089601516723633, "global_step": 294624, "epoch": 1753} {"train_loss": -12.06159496307373, "global_step": 294625, "epoch": 1753} {"train_loss": -12.332293510437012, "global_step": 294626, "epoch": 1753} {"train_loss": -12.129697799682617, "global_step": 294627, "epoch": 1753} {"train_loss": -12.241870880126953, "global_step": 294628, "epoch": 1753} {"train_loss": -12.214109420776367, "global_step": 294629, "epoch": 1753} {"train_loss": -12.210591316223145, "global_step": 294630, "epoch": 1753} {"train_loss": -12.34931755065918, "global_step": 294631, "epoch": 1753} {"train_loss": -11.98983383178711, "global_step": 294632, "epoch": 1753} {"train_loss": -12.240253448486328, "global_step": 294633, "epoch": 1753} {"train_loss": -12.145241737365723, "global_step": 294634, "epoch": 1753} {"train_loss": -12.15864086151123, "global_step": 294635, "epoch": 1753} {"train_loss": -12.223243713378906, "global_step": 294636, "epoch": 1753} {"train_loss": -12.26711654663086, "global_step": 294637, "epoch": 1753} {"train_loss": -12.356412887573242, "global_step": 294638, "epoch": 1753} {"train_loss": -12.207725524902344, "global_step": 294639, "epoch": 1753} {"train_loss": -12.180977821350098, "global_step": 294640, "epoch": 1753} {"train_loss": -12.04018497467041, "global_step": 294641, "epoch": 1753} {"train_loss": -12.171207427978516, "global_step": 294642, "epoch": 1753} {"train_loss": -11.974689483642578, "global_step": 294643, "epoch": 1753} {"train_loss": -12.156800270080566, "global_step": 294644, "epoch": 1753} {"train_loss": -12.177932739257812, "global_step": 294645, "epoch": 1753} {"train_loss": -12.061238288879395, "global_step": 294646, "epoch": 1753} {"train_loss": -12.2027587890625, "global_step": 294647, "epoch": 1753} {"train_loss": -12.060033798217773, "global_step": 294648, "epoch": 1753} {"train_loss": -12.00029468536377, "global_step": 294649, "epoch": 1753} {"train_loss": -12.395679473876953, "global_step": 294650, "epoch": 1753} {"train_loss": -11.979759216308594, "global_step": 294651, "epoch": 1753} {"train_loss": -11.94763469696045, "global_step": 294652, "epoch": 1753} {"train_loss": -12.132710456848145, "global_step": 294653, "epoch": 1753} {"train_loss": -12.083343505859375, "global_step": 294654, "epoch": 1753} {"train_loss": -12.109880447387695, "global_step": 294655, "epoch": 1753} {"train_loss": -12.170449256896973, "global_step": 294656, "epoch": 1753} {"train_loss": -12.303010940551758, "global_step": 294657, "epoch": 1753} {"train_loss": -12.344574928283691, "global_step": 294658, "epoch": 1753} {"train_loss": -12.088896751403809, "global_step": 294659, "epoch": 1753} {"train_loss": -12.490382194519043, "global_step": 294660, "epoch": 1753} {"train_loss": -12.285099029541016, "global_step": 294661, "epoch": 1753} {"train_loss": -12.407598495483398, "global_step": 294662, "epoch": 1753} {"train_loss": -12.404890060424805, "global_step": 294663, "epoch": 1753} {"train_loss": -12.394680976867676, "global_step": 294664, "epoch": 1753} {"train_loss": -12.374727249145508, "global_step": 294665, "epoch": 1753} {"train_loss": -12.384574890136719, "global_step": 294666, "epoch": 1753} {"train_loss": -12.174980163574219, "global_step": 294667, "epoch": 1753} {"train_loss": -11.905172348022461, "global_step": 294668, "epoch": 1753} {"train_loss": -11.874177932739258, "global_step": 294669, "epoch": 1753} {"train_loss": -12.115080833435059, "global_step": 294670, "epoch": 1753} {"train_loss": -11.894079191344124, "global_step": 294671, "epoch": 1753, "val_loss": 280257.15625} {"train_loss": -11.435407638549805, "global_step": 294672, "epoch": 1754} {"train_loss": -10.441954612731934, "global_step": 294673, "epoch": 1754} {"train_loss": -11.654574394226074, "global_step": 294674, "epoch": 1754} {"train_loss": -11.14002513885498, "global_step": 294675, "epoch": 1754} {"train_loss": -8.744579315185547, "global_step": 294676, "epoch": 1754} {"train_loss": -11.459129333496094, "global_step": 294677, "epoch": 1754} {"train_loss": -9.918542861938477, "global_step": 294678, "epoch": 1754} {"train_loss": -9.746938705444336, "global_step": 294679, "epoch": 1754} {"train_loss": -10.463693618774414, "global_step": 294680, "epoch": 1754} {"train_loss": -9.325566291809082, "global_step": 294681, "epoch": 1754} {"train_loss": -9.770310401916504, "global_step": 294682, "epoch": 1754} {"train_loss": -9.196075439453125, "global_step": 294683, "epoch": 1754} {"train_loss": -9.82621955871582, "global_step": 294684, "epoch": 1754} {"train_loss": -8.291690826416016, "global_step": 294685, "epoch": 1754} {"train_loss": -9.626550674438477, "global_step": 294686, "epoch": 1754} {"train_loss": -9.534467697143555, "global_step": 294687, "epoch": 1754} {"train_loss": -9.870452880859375, "global_step": 294688, "epoch": 1754} {"train_loss": -10.096059799194336, "global_step": 294689, "epoch": 1754} {"train_loss": -10.428692817687988, "global_step": 294690, "epoch": 1754} {"train_loss": -10.851402282714844, "global_step": 294691, "epoch": 1754} {"train_loss": -10.227829933166504, "global_step": 294692, "epoch": 1754} {"train_loss": -10.080343246459961, "global_step": 294693, "epoch": 1754} {"train_loss": -10.1047945022583, "global_step": 294694, "epoch": 1754} {"train_loss": -10.73829460144043, "global_step": 294695, "epoch": 1754} {"train_loss": -10.012678146362305, "global_step": 294696, "epoch": 1754} {"train_loss": -9.946252822875977, "global_step": 294697, "epoch": 1754} {"train_loss": -10.526407241821289, "global_step": 294698, "epoch": 1754} {"train_loss": -10.107826232910156, "global_step": 294699, "epoch": 1754} {"train_loss": -9.512367248535156, "global_step": 294700, "epoch": 1754} {"train_loss": -11.701595306396484, "global_step": 294701, "epoch": 1754} {"train_loss": -9.55051326751709, "global_step": 294702, "epoch": 1754} {"train_loss": -10.5956449508667, "global_step": 294703, "epoch": 1754} {"train_loss": -9.717178344726562, "global_step": 294704, "epoch": 1754} {"train_loss": -10.458380699157715, "global_step": 294705, "epoch": 1754} {"train_loss": -10.739140510559082, "global_step": 294706, "epoch": 1754} {"train_loss": -10.688008308410645, "global_step": 294707, "epoch": 1754} {"train_loss": -10.721574783325195, "global_step": 294708, "epoch": 1754} {"train_loss": -9.899664878845215, "global_step": 294709, "epoch": 1754} {"train_loss": -11.043940544128418, "global_step": 294710, "epoch": 1754} {"train_loss": -10.631258010864258, "global_step": 294711, "epoch": 1754} {"train_loss": -10.1328125, "global_step": 294712, "epoch": 1754} {"train_loss": -11.283287048339844, "global_step": 294713, "epoch": 1754} {"train_loss": -11.062110900878906, "global_step": 294714, "epoch": 1754} {"train_loss": -10.783629417419434, "global_step": 294715, "epoch": 1754} {"train_loss": -10.992673873901367, "global_step": 294716, "epoch": 1754} {"train_loss": -11.530611038208008, "global_step": 294717, "epoch": 1754} {"train_loss": -11.259498596191406, "global_step": 294718, "epoch": 1754} {"train_loss": -11.42886734008789, "global_step": 294719, "epoch": 1754} {"train_loss": -11.80698299407959, "global_step": 294720, "epoch": 1754} {"train_loss": -11.61897087097168, "global_step": 294721, "epoch": 1754} {"train_loss": -11.756545066833496, "global_step": 294722, "epoch": 1754} {"train_loss": -11.546217918395996, "global_step": 294723, "epoch": 1754} {"train_loss": -11.662639617919922, "global_step": 294724, "epoch": 1754} {"train_loss": -11.580307006835938, "global_step": 294725, "epoch": 1754} {"train_loss": -11.70071029663086, "global_step": 294726, "epoch": 1754} {"train_loss": -11.603877067565918, "global_step": 294727, "epoch": 1754} {"train_loss": -11.649627685546875, "global_step": 294728, "epoch": 1754} {"train_loss": -11.8013334274292, "global_step": 294729, "epoch": 1754} {"train_loss": -11.674110412597656, "global_step": 294730, "epoch": 1754} {"train_loss": -11.458979606628418, "global_step": 294731, "epoch": 1754} {"train_loss": -11.818986892700195, "global_step": 294732, "epoch": 1754} {"train_loss": -11.719087600708008, "global_step": 294733, "epoch": 1754} {"train_loss": -11.472063064575195, "global_step": 294734, "epoch": 1754} {"train_loss": -11.761480331420898, "global_step": 294735, "epoch": 1754} {"train_loss": -11.495528221130371, "global_step": 294736, "epoch": 1754} {"train_loss": -11.723670959472656, "global_step": 294737, "epoch": 1754} {"train_loss": -11.675040245056152, "global_step": 294738, "epoch": 1754} {"train_loss": -11.939203262329102, "global_step": 294739, "epoch": 1754} {"train_loss": -11.573771476745605, "global_step": 294740, "epoch": 1754} {"train_loss": -12.070049285888672, "global_step": 294741, "epoch": 1754} {"train_loss": -11.997859954833984, "global_step": 294742, "epoch": 1754} {"train_loss": -11.87626838684082, "global_step": 294743, "epoch": 1754} {"train_loss": -12.019327163696289, "global_step": 294744, "epoch": 1754} {"train_loss": -11.807056427001953, "global_step": 294745, "epoch": 1754} {"train_loss": -11.940507888793945, "global_step": 294746, "epoch": 1754} {"train_loss": -11.995039939880371, "global_step": 294747, "epoch": 1754} {"train_loss": -11.979532241821289, "global_step": 294748, "epoch": 1754} {"train_loss": -12.165833473205566, "global_step": 294749, "epoch": 1754} {"train_loss": -12.013738632202148, "global_step": 294750, "epoch": 1754} {"train_loss": -12.254209518432617, "global_step": 294751, "epoch": 1754} {"train_loss": -12.112202644348145, "global_step": 294752, "epoch": 1754} {"train_loss": -11.878371238708496, "global_step": 294753, "epoch": 1754} {"train_loss": -12.116515159606934, "global_step": 294754, "epoch": 1754} {"train_loss": -11.966835975646973, "global_step": 294755, "epoch": 1754} {"train_loss": -12.081111907958984, "global_step": 294756, "epoch": 1754} {"train_loss": -12.052196502685547, "global_step": 294757, "epoch": 1754} {"train_loss": -11.986799240112305, "global_step": 294758, "epoch": 1754} {"train_loss": -12.077625274658203, "global_step": 294759, "epoch": 1754} {"train_loss": -12.189298629760742, "global_step": 294760, "epoch": 1754} {"train_loss": -12.065884590148926, "global_step": 294761, "epoch": 1754} {"train_loss": -12.147605895996094, "global_step": 294762, "epoch": 1754} {"train_loss": -12.267218589782715, "global_step": 294763, "epoch": 1754} {"train_loss": -12.199201583862305, "global_step": 294764, "epoch": 1754} {"train_loss": -12.155149459838867, "global_step": 294765, "epoch": 1754} {"train_loss": -12.281498908996582, "global_step": 294766, "epoch": 1754} {"train_loss": -12.354029655456543, "global_step": 294767, "epoch": 1754} {"train_loss": -11.96811580657959, "global_step": 294768, "epoch": 1754} {"train_loss": -12.383688926696777, "global_step": 294769, "epoch": 1754} {"train_loss": -12.1574125289917, "global_step": 294770, "epoch": 1754} {"train_loss": -12.262187957763672, "global_step": 294771, "epoch": 1754} {"train_loss": -12.200944900512695, "global_step": 294772, "epoch": 1754} {"train_loss": -12.318378448486328, "global_step": 294773, "epoch": 1754} {"train_loss": -12.274940490722656, "global_step": 294774, "epoch": 1754} {"train_loss": -12.35563850402832, "global_step": 294775, "epoch": 1754} {"train_loss": -12.210288047790527, "global_step": 294776, "epoch": 1754} {"train_loss": -12.43388557434082, "global_step": 294777, "epoch": 1754} {"train_loss": -12.333165168762207, "global_step": 294778, "epoch": 1754} {"train_loss": -12.355921745300293, "global_step": 294779, "epoch": 1754} {"train_loss": -12.343095779418945, "global_step": 294780, "epoch": 1754} {"train_loss": -12.284417152404785, "global_step": 294781, "epoch": 1754} {"train_loss": -12.328422546386719, "global_step": 294782, "epoch": 1754} {"train_loss": -12.595224380493164, "global_step": 294783, "epoch": 1754} {"train_loss": -12.278579711914062, "global_step": 294784, "epoch": 1754} {"train_loss": -12.373083114624023, "global_step": 294785, "epoch": 1754} {"train_loss": -12.61430549621582, "global_step": 294786, "epoch": 1754} {"train_loss": -12.249088287353516, "global_step": 294787, "epoch": 1754} {"train_loss": -12.340047836303711, "global_step": 294788, "epoch": 1754} {"train_loss": -12.366058349609375, "global_step": 294789, "epoch": 1754} {"train_loss": -12.239842414855957, "global_step": 294790, "epoch": 1754} {"train_loss": -12.34737777709961, "global_step": 294791, "epoch": 1754} {"train_loss": -12.534655570983887, "global_step": 294792, "epoch": 1754} {"train_loss": -12.218228340148926, "global_step": 294793, "epoch": 1754} {"train_loss": -12.210221290588379, "global_step": 294794, "epoch": 1754} {"train_loss": -12.185157775878906, "global_step": 294795, "epoch": 1754} {"train_loss": -12.13513469696045, "global_step": 294796, "epoch": 1754} {"train_loss": -11.492685317993164, "global_step": 294797, "epoch": 1754} {"train_loss": -11.983787536621094, "global_step": 294798, "epoch": 1754} {"train_loss": -11.75977897644043, "global_step": 294799, "epoch": 1754} {"train_loss": -12.239643096923828, "global_step": 294800, "epoch": 1754} {"train_loss": -11.608081817626953, "global_step": 294801, "epoch": 1754} {"train_loss": -11.713157653808594, "global_step": 294802, "epoch": 1754} {"train_loss": -12.100930213928223, "global_step": 294803, "epoch": 1754} {"train_loss": -10.681672096252441, "global_step": 294804, "epoch": 1754} {"train_loss": -11.367074966430664, "global_step": 294805, "epoch": 1754} {"train_loss": -10.482355117797852, "global_step": 294806, "epoch": 1754} {"train_loss": -10.853870391845703, "global_step": 294807, "epoch": 1754} {"train_loss": -11.435227394104004, "global_step": 294808, "epoch": 1754} {"train_loss": -10.619885444641113, "global_step": 294809, "epoch": 1754} {"train_loss": -10.407573699951172, "global_step": 294810, "epoch": 1754} {"train_loss": -10.723087310791016, "global_step": 294811, "epoch": 1754} {"train_loss": -10.444965362548828, "global_step": 294812, "epoch": 1754} {"train_loss": -9.977642059326172, "global_step": 294813, "epoch": 1754} {"train_loss": -10.641799926757812, "global_step": 294814, "epoch": 1754} {"train_loss": -11.59228801727295, "global_step": 294815, "epoch": 1754} {"train_loss": -10.169427871704102, "global_step": 294816, "epoch": 1754} {"train_loss": -9.45682144165039, "global_step": 294817, "epoch": 1754} {"train_loss": -8.785036087036133, "global_step": 294818, "epoch": 1754} {"train_loss": -11.14481258392334, "global_step": 294819, "epoch": 1754} {"train_loss": -8.972509384155273, "global_step": 294820, "epoch": 1754} {"train_loss": -8.42975902557373, "global_step": 294821, "epoch": 1754} {"train_loss": -8.839423179626465, "global_step": 294822, "epoch": 1754} {"train_loss": -9.882304191589355, "global_step": 294823, "epoch": 1754} {"train_loss": -7.899550914764404, "global_step": 294824, "epoch": 1754} {"train_loss": -9.510772705078125, "global_step": 294825, "epoch": 1754} {"train_loss": -10.085638999938965, "global_step": 294826, "epoch": 1754} {"train_loss": -9.880712509155273, "global_step": 294827, "epoch": 1754} {"train_loss": -9.780527114868164, "global_step": 294828, "epoch": 1754} {"train_loss": -10.227975845336914, "global_step": 294829, "epoch": 1754} {"train_loss": -10.155352592468262, "global_step": 294830, "epoch": 1754} {"train_loss": -9.721094131469727, "global_step": 294831, "epoch": 1754} {"train_loss": -10.801519393920898, "global_step": 294832, "epoch": 1754} {"train_loss": -9.792665481567383, "global_step": 294833, "epoch": 1754} {"train_loss": -10.091336250305176, "global_step": 294834, "epoch": 1754} {"train_loss": -11.250738143920898, "global_step": 294835, "epoch": 1754} {"train_loss": -9.864519119262695, "global_step": 294836, "epoch": 1754} {"train_loss": -10.25004768371582, "global_step": 294837, "epoch": 1754} {"train_loss": -10.76795768737793, "global_step": 294838, "epoch": 1754} {"train_loss": -11.148405316330138, "global_step": 294839, "epoch": 1754, "val_loss": 281819.0625} {"train_loss": -10.462348937988281, "global_step": 294840, "epoch": 1755} {"train_loss": -10.261588096618652, "global_step": 294841, "epoch": 1755} {"train_loss": -9.974506378173828, "global_step": 294842, "epoch": 1755} {"train_loss": -8.866684913635254, "global_step": 294843, "epoch": 1755} {"train_loss": -11.458989143371582, "global_step": 294844, "epoch": 1755} {"train_loss": -10.665465354919434, "global_step": 294845, "epoch": 1755} {"train_loss": -10.062516212463379, "global_step": 294846, "epoch": 1755} {"train_loss": -10.968122482299805, "global_step": 294847, "epoch": 1755} {"train_loss": -10.501413345336914, "global_step": 294848, "epoch": 1755} {"train_loss": -10.806465148925781, "global_step": 294849, "epoch": 1755} {"train_loss": -10.410260200500488, "global_step": 294850, "epoch": 1755} {"train_loss": -10.835874557495117, "global_step": 294851, "epoch": 1755} {"train_loss": -10.752330780029297, "global_step": 294852, "epoch": 1755} {"train_loss": -10.726102828979492, "global_step": 294853, "epoch": 1755} {"train_loss": -11.595890045166016, "global_step": 294854, "epoch": 1755} {"train_loss": -10.693828582763672, "global_step": 294855, "epoch": 1755} {"train_loss": -11.321081161499023, "global_step": 294856, "epoch": 1755} {"train_loss": -11.386274337768555, "global_step": 294857, "epoch": 1755} {"train_loss": -11.298582077026367, "global_step": 294858, "epoch": 1755} {"train_loss": -11.390532493591309, "global_step": 294859, "epoch": 1755} {"train_loss": -11.589344024658203, "global_step": 294860, "epoch": 1755} {"train_loss": -11.632570266723633, "global_step": 294861, "epoch": 1755} {"train_loss": -11.18454360961914, "global_step": 294862, "epoch": 1755} {"train_loss": -11.386884689331055, "global_step": 294863, "epoch": 1755} {"train_loss": -11.426810264587402, "global_step": 294864, "epoch": 1755} {"train_loss": -11.409310340881348, "global_step": 294865, "epoch": 1755} {"train_loss": -11.667837142944336, "global_step": 294866, "epoch": 1755} {"train_loss": -11.80946159362793, "global_step": 294867, "epoch": 1755} {"train_loss": -11.671822547912598, "global_step": 294868, "epoch": 1755} {"train_loss": -11.593414306640625, "global_step": 294869, "epoch": 1755} {"train_loss": -11.899225234985352, "global_step": 294870, "epoch": 1755} {"train_loss": -11.552399635314941, "global_step": 294871, "epoch": 1755} {"train_loss": -11.691734313964844, "global_step": 294872, "epoch": 1755} {"train_loss": -11.800516128540039, "global_step": 294873, "epoch": 1755} {"train_loss": -11.602932929992676, "global_step": 294874, "epoch": 1755} {"train_loss": -11.830499649047852, "global_step": 294875, "epoch": 1755} {"train_loss": -11.851554870605469, "global_step": 294876, "epoch": 1755} {"train_loss": -11.93641471862793, "global_step": 294877, "epoch": 1755} {"train_loss": -11.99816608428955, "global_step": 294878, "epoch": 1755} {"train_loss": -11.880550384521484, "global_step": 294879, "epoch": 1755} {"train_loss": -11.908143997192383, "global_step": 294880, "epoch": 1755} {"train_loss": -11.902318954467773, "global_step": 294881, "epoch": 1755} {"train_loss": -11.896379470825195, "global_step": 294882, "epoch": 1755} {"train_loss": -11.892158508300781, "global_step": 294883, "epoch": 1755} {"train_loss": -11.829524993896484, "global_step": 294884, "epoch": 1755} {"train_loss": -11.923002243041992, "global_step": 294885, "epoch": 1755} {"train_loss": -11.912792205810547, "global_step": 294886, "epoch": 1755} {"train_loss": -12.022245407104492, "global_step": 294887, "epoch": 1755} {"train_loss": -11.946366310119629, "global_step": 294888, "epoch": 1755} {"train_loss": -11.9098539352417, "global_step": 294889, "epoch": 1755} {"train_loss": -12.093292236328125, "global_step": 294890, "epoch": 1755} {"train_loss": -12.021732330322266, "global_step": 294891, "epoch": 1755} {"train_loss": -12.192636489868164, "global_step": 294892, "epoch": 1755} {"train_loss": -12.063512802124023, "global_step": 294893, "epoch": 1755} {"train_loss": -12.033175468444824, "global_step": 294894, "epoch": 1755} {"train_loss": -12.130505561828613, "global_step": 294895, "epoch": 1755} {"train_loss": -12.173639297485352, "global_step": 294896, "epoch": 1755} {"train_loss": -12.127248764038086, "global_step": 294897, "epoch": 1755} {"train_loss": -11.939157485961914, "global_step": 294898, "epoch": 1755} {"train_loss": -12.240692138671875, "global_step": 294899, "epoch": 1755} {"train_loss": -12.073541641235352, "global_step": 294900, "epoch": 1755} {"train_loss": -12.188695907592773, "global_step": 294901, "epoch": 1755} {"train_loss": -12.035146713256836, "global_step": 294902, "epoch": 1755} {"train_loss": -11.896541595458984, "global_step": 294903, "epoch": 1755} {"train_loss": -12.214883804321289, "global_step": 294904, "epoch": 1755} {"train_loss": -12.337385177612305, "global_step": 294905, "epoch": 1755} {"train_loss": -12.33532428741455, "global_step": 294906, "epoch": 1755} {"train_loss": -12.04199504852295, "global_step": 294907, "epoch": 1755} {"train_loss": -12.219542503356934, "global_step": 294908, "epoch": 1755} {"train_loss": -12.246169090270996, "global_step": 294909, "epoch": 1755} {"train_loss": -12.364255905151367, "global_step": 294910, "epoch": 1755} {"train_loss": -12.302207946777344, "global_step": 294911, "epoch": 1755} {"train_loss": -12.253063201904297, "global_step": 294912, "epoch": 1755} {"train_loss": -12.072511672973633, "global_step": 294913, "epoch": 1755} {"train_loss": -12.325185775756836, "global_step": 294914, "epoch": 1755} {"train_loss": -12.148969650268555, "global_step": 294915, "epoch": 1755} {"train_loss": -12.348677635192871, "global_step": 294916, "epoch": 1755} {"train_loss": -12.329978942871094, "global_step": 294917, "epoch": 1755} {"train_loss": -12.185516357421875, "global_step": 294918, "epoch": 1755} {"train_loss": -12.39337158203125, "global_step": 294919, "epoch": 1755} {"train_loss": -12.268268585205078, "global_step": 294920, "epoch": 1755} {"train_loss": -12.334726333618164, "global_step": 294921, "epoch": 1755} {"train_loss": -12.303070068359375, "global_step": 294922, "epoch": 1755} {"train_loss": -12.406532287597656, "global_step": 294923, "epoch": 1755} {"train_loss": -12.285367965698242, "global_step": 294924, "epoch": 1755} {"train_loss": -12.589004516601562, "global_step": 294925, "epoch": 1755} {"train_loss": -12.36483383178711, "global_step": 294926, "epoch": 1755} {"train_loss": -12.33340072631836, "global_step": 294927, "epoch": 1755} {"train_loss": -12.309085845947266, "global_step": 294928, "epoch": 1755} {"train_loss": -12.242569923400879, "global_step": 294929, "epoch": 1755} {"train_loss": -12.507013320922852, "global_step": 294930, "epoch": 1755} {"train_loss": -12.526018142700195, "global_step": 294931, "epoch": 1755} {"train_loss": -12.23862075805664, "global_step": 294932, "epoch": 1755} {"train_loss": -12.282917976379395, "global_step": 294933, "epoch": 1755} {"train_loss": -12.5283203125, "global_step": 294934, "epoch": 1755} {"train_loss": -12.38049030303955, "global_step": 294935, "epoch": 1755} {"train_loss": -12.234119415283203, "global_step": 294936, "epoch": 1755} {"train_loss": -12.472599029541016, "global_step": 294937, "epoch": 1755} {"train_loss": -12.219979286193848, "global_step": 294938, "epoch": 1755} {"train_loss": -12.548773765563965, "global_step": 294939, "epoch": 1755} {"train_loss": -12.188905715942383, "global_step": 294940, "epoch": 1755} {"train_loss": -12.506209373474121, "global_step": 294941, "epoch": 1755} {"train_loss": -12.406665802001953, "global_step": 294942, "epoch": 1755} {"train_loss": -12.248188018798828, "global_step": 294943, "epoch": 1755} {"train_loss": -12.224738121032715, "global_step": 294944, "epoch": 1755} {"train_loss": -12.127674102783203, "global_step": 294945, "epoch": 1755} {"train_loss": -12.207975387573242, "global_step": 294946, "epoch": 1755} {"train_loss": -12.569147109985352, "global_step": 294947, "epoch": 1755} {"train_loss": -12.279764175415039, "global_step": 294948, "epoch": 1755} {"train_loss": -12.402788162231445, "global_step": 294949, "epoch": 1755} {"train_loss": -12.256953239440918, "global_step": 294950, "epoch": 1755} {"train_loss": -12.353519439697266, "global_step": 294951, "epoch": 1755} {"train_loss": -12.524419784545898, "global_step": 294952, "epoch": 1755} {"train_loss": -12.362215042114258, "global_step": 294953, "epoch": 1755} {"train_loss": -12.500635147094727, "global_step": 294954, "epoch": 1755} {"train_loss": -12.405567169189453, "global_step": 294955, "epoch": 1755} {"train_loss": -12.374170303344727, "global_step": 294956, "epoch": 1755} {"train_loss": -12.55605411529541, "global_step": 294957, "epoch": 1755} {"train_loss": -12.187183380126953, "global_step": 294958, "epoch": 1755} {"train_loss": -11.948043823242188, "global_step": 294959, "epoch": 1755} {"train_loss": -11.026095390319824, "global_step": 294960, "epoch": 1755} {"train_loss": -9.083566665649414, "global_step": 294961, "epoch": 1755} {"train_loss": -9.92540454864502, "global_step": 294962, "epoch": 1755} {"train_loss": -10.027413368225098, "global_step": 294963, "epoch": 1755} {"train_loss": -9.917465209960938, "global_step": 294964, "epoch": 1755} {"train_loss": -9.681621551513672, "global_step": 294965, "epoch": 1755} {"train_loss": -10.564762115478516, "global_step": 294966, "epoch": 1755} {"train_loss": -11.06527328491211, "global_step": 294967, "epoch": 1755} {"train_loss": -9.850053787231445, "global_step": 294968, "epoch": 1755} {"train_loss": -10.670154571533203, "global_step": 294969, "epoch": 1755} {"train_loss": -9.650957107543945, "global_step": 294970, "epoch": 1755} {"train_loss": -10.275968551635742, "global_step": 294971, "epoch": 1755} {"train_loss": -10.967345237731934, "global_step": 294972, "epoch": 1755} {"train_loss": -11.0494966506958, "global_step": 294973, "epoch": 1755} {"train_loss": -10.098827362060547, "global_step": 294974, "epoch": 1755} {"train_loss": -11.697809219360352, "global_step": 294975, "epoch": 1755} {"train_loss": -10.700948715209961, "global_step": 294976, "epoch": 1755} {"train_loss": -10.272565841674805, "global_step": 294977, "epoch": 1755} {"train_loss": -10.99433422088623, "global_step": 294978, "epoch": 1755} {"train_loss": -11.42982006072998, "global_step": 294979, "epoch": 1755} {"train_loss": -10.755607604980469, "global_step": 294980, "epoch": 1755} {"train_loss": -11.891851425170898, "global_step": 294981, "epoch": 1755} {"train_loss": -11.185958862304688, "global_step": 294982, "epoch": 1755} {"train_loss": -11.547806739807129, "global_step": 294983, "epoch": 1755} {"train_loss": -11.424423217773438, "global_step": 294984, "epoch": 1755} {"train_loss": -11.037726402282715, "global_step": 294985, "epoch": 1755} {"train_loss": -11.552980422973633, "global_step": 294986, "epoch": 1755} {"train_loss": -11.07759952545166, "global_step": 294987, "epoch": 1755} {"train_loss": -11.744504928588867, "global_step": 294988, "epoch": 1755} {"train_loss": -11.569744110107422, "global_step": 294989, "epoch": 1755} {"train_loss": -11.525744438171387, "global_step": 294990, "epoch": 1755} {"train_loss": -11.421026229858398, "global_step": 294991, "epoch": 1755} {"train_loss": -11.834413528442383, "global_step": 294992, "epoch": 1755} {"train_loss": -11.668176651000977, "global_step": 294993, "epoch": 1755} {"train_loss": -10.910881042480469, "global_step": 294994, "epoch": 1755} {"train_loss": -11.877767562866211, "global_step": 294995, "epoch": 1755} {"train_loss": -11.291662216186523, "global_step": 294996, "epoch": 1755} {"train_loss": -12.117618560791016, "global_step": 294997, "epoch": 1755} {"train_loss": -11.187434196472168, "global_step": 294998, "epoch": 1755} {"train_loss": -11.576224327087402, "global_step": 294999, "epoch": 1755} {"train_loss": -11.363077163696289, "global_step": 295000, "epoch": 1755} {"train_loss": -11.324566841125488, "global_step": 295001, "epoch": 1755} {"train_loss": -11.607044219970703, "global_step": 295002, "epoch": 1755} {"train_loss": -11.154373168945312, "global_step": 295003, "epoch": 1755} {"train_loss": -11.645584106445312, "global_step": 295004, "epoch": 1755} {"train_loss": -11.426290512084961, "global_step": 295005, "epoch": 1755} {"train_loss": -11.814546585083008, "global_step": 295006, "epoch": 1755} {"train_loss": -11.64012460481553, "global_step": 295007, "epoch": 1755, "val_loss": 274980.59375, "train_action_mse_error": 2.9514822959899902} {"train_loss": -11.106487274169922, "global_step": 295008, "epoch": 1756} {"train_loss": -10.655098915100098, "global_step": 295009, "epoch": 1756} {"train_loss": -11.563093185424805, "global_step": 295010, "epoch": 1756} {"train_loss": -11.270944595336914, "global_step": 295011, "epoch": 1756} {"train_loss": -11.896734237670898, "global_step": 295012, "epoch": 1756} {"train_loss": -11.231002807617188, "global_step": 295013, "epoch": 1756} {"train_loss": -11.465495109558105, "global_step": 295014, "epoch": 1756} {"train_loss": -11.648078918457031, "global_step": 295015, "epoch": 1756} {"train_loss": -11.741134643554688, "global_step": 295016, "epoch": 1756} {"train_loss": -11.939887046813965, "global_step": 295017, "epoch": 1756} {"train_loss": -11.445363998413086, "global_step": 295018, "epoch": 1756} {"train_loss": -12.057548522949219, "global_step": 295019, "epoch": 1756} {"train_loss": -11.833755493164062, "global_step": 295020, "epoch": 1756} {"train_loss": -11.96633243560791, "global_step": 295021, "epoch": 1756} {"train_loss": -11.775604248046875, "global_step": 295022, "epoch": 1756} {"train_loss": -11.971969604492188, "global_step": 295023, "epoch": 1756} {"train_loss": -12.051615715026855, "global_step": 295024, "epoch": 1756} {"train_loss": -11.970141410827637, "global_step": 295025, "epoch": 1756} {"train_loss": -11.924613952636719, "global_step": 295026, "epoch": 1756} {"train_loss": -11.849464416503906, "global_step": 295027, "epoch": 1756} {"train_loss": -11.884597778320312, "global_step": 295028, "epoch": 1756} {"train_loss": -12.075639724731445, "global_step": 295029, "epoch": 1756} {"train_loss": -11.485189437866211, "global_step": 295030, "epoch": 1756} {"train_loss": -12.12894058227539, "global_step": 295031, "epoch": 1756} {"train_loss": -11.928897857666016, "global_step": 295032, "epoch": 1756} {"train_loss": -11.848869323730469, "global_step": 295033, "epoch": 1756} {"train_loss": -12.27174186706543, "global_step": 295034, "epoch": 1756} {"train_loss": -11.465278625488281, "global_step": 295035, "epoch": 1756} {"train_loss": -12.029991149902344, "global_step": 295036, "epoch": 1756} {"train_loss": -11.803311347961426, "global_step": 295037, "epoch": 1756} {"train_loss": -11.580753326416016, "global_step": 295038, "epoch": 1756} {"train_loss": -11.987122535705566, "global_step": 295039, "epoch": 1756} {"train_loss": -11.904108047485352, "global_step": 295040, "epoch": 1756} {"train_loss": -11.914712905883789, "global_step": 295041, "epoch": 1756} {"train_loss": -11.70701789855957, "global_step": 295042, "epoch": 1756} {"train_loss": -12.104927062988281, "global_step": 295043, "epoch": 1756} {"train_loss": -11.944867134094238, "global_step": 295044, "epoch": 1756} {"train_loss": -11.174484252929688, "global_step": 295045, "epoch": 1756} {"train_loss": -11.923860549926758, "global_step": 295046, "epoch": 1756} {"train_loss": -11.864835739135742, "global_step": 295047, "epoch": 1756} {"train_loss": -11.232572555541992, "global_step": 295048, "epoch": 1756} {"train_loss": -12.222711563110352, "global_step": 295049, "epoch": 1756} {"train_loss": -11.863633155822754, "global_step": 295050, "epoch": 1756} {"train_loss": -12.277629852294922, "global_step": 295051, "epoch": 1756} {"train_loss": -11.898731231689453, "global_step": 295052, "epoch": 1756} {"train_loss": -11.967257499694824, "global_step": 295053, "epoch": 1756} {"train_loss": -12.181943893432617, "global_step": 295054, "epoch": 1756} {"train_loss": -12.132935523986816, "global_step": 295055, "epoch": 1756} {"train_loss": -12.039953231811523, "global_step": 295056, "epoch": 1756} {"train_loss": -11.990285873413086, "global_step": 295057, "epoch": 1756} {"train_loss": -12.011590957641602, "global_step": 295058, "epoch": 1756} {"train_loss": -12.073545455932617, "global_step": 295059, "epoch": 1756} {"train_loss": -12.0769624710083, "global_step": 295060, "epoch": 1756} {"train_loss": -12.11290454864502, "global_step": 295061, "epoch": 1756} {"train_loss": -12.094732284545898, "global_step": 295062, "epoch": 1756} {"train_loss": -12.001296043395996, "global_step": 295063, "epoch": 1756} {"train_loss": -12.249293327331543, "global_step": 295064, "epoch": 1756} {"train_loss": -12.238122940063477, "global_step": 295065, "epoch": 1756} {"train_loss": -12.083090782165527, "global_step": 295066, "epoch": 1756} {"train_loss": -12.404669761657715, "global_step": 295067, "epoch": 1756} {"train_loss": -12.16594409942627, "global_step": 295068, "epoch": 1756} {"train_loss": -11.815065383911133, "global_step": 295069, "epoch": 1756} {"train_loss": -12.236981391906738, "global_step": 295070, "epoch": 1756} {"train_loss": -12.151544570922852, "global_step": 295071, "epoch": 1756} {"train_loss": -11.956512451171875, "global_step": 295072, "epoch": 1756} {"train_loss": -12.276376724243164, "global_step": 295073, "epoch": 1756} {"train_loss": -11.982683181762695, "global_step": 295074, "epoch": 1756} {"train_loss": -12.196624755859375, "global_step": 295075, "epoch": 1756} {"train_loss": -12.264151573181152, "global_step": 295076, "epoch": 1756} {"train_loss": -12.17032241821289, "global_step": 295077, "epoch": 1756} {"train_loss": -12.237100601196289, "global_step": 295078, "epoch": 1756} {"train_loss": -12.168598175048828, "global_step": 295079, "epoch": 1756} {"train_loss": -12.361150741577148, "global_step": 295080, "epoch": 1756} {"train_loss": -11.757172584533691, "global_step": 295081, "epoch": 1756} {"train_loss": -12.177821159362793, "global_step": 295082, "epoch": 1756} {"train_loss": -12.304948806762695, "global_step": 295083, "epoch": 1756} {"train_loss": -12.064580917358398, "global_step": 295084, "epoch": 1756} {"train_loss": -12.204363822937012, "global_step": 295085, "epoch": 1756} {"train_loss": -12.32126235961914, "global_step": 295086, "epoch": 1756} {"train_loss": -12.389483451843262, "global_step": 295087, "epoch": 1756} {"train_loss": -12.290273666381836, "global_step": 295088, "epoch": 1756} {"train_loss": -12.10949993133545, "global_step": 295089, "epoch": 1756} {"train_loss": -11.795337677001953, "global_step": 295090, "epoch": 1756} {"train_loss": -11.515655517578125, "global_step": 295091, "epoch": 1756} {"train_loss": -12.250911712646484, "global_step": 295092, "epoch": 1756} {"train_loss": -11.66140365600586, "global_step": 295093, "epoch": 1756} {"train_loss": -11.488924980163574, "global_step": 295094, "epoch": 1756} {"train_loss": -12.043773651123047, "global_step": 295095, "epoch": 1756} {"train_loss": -12.019784927368164, "global_step": 295096, "epoch": 1756} {"train_loss": -11.767084121704102, "global_step": 295097, "epoch": 1756} {"train_loss": -12.161685943603516, "global_step": 295098, "epoch": 1756} {"train_loss": -12.037660598754883, "global_step": 295099, "epoch": 1756} {"train_loss": -11.859238624572754, "global_step": 295100, "epoch": 1756} {"train_loss": -12.207311630249023, "global_step": 295101, "epoch": 1756} {"train_loss": -12.089881896972656, "global_step": 295102, "epoch": 1756} {"train_loss": -11.96853256225586, "global_step": 295103, "epoch": 1756} {"train_loss": -12.287010192871094, "global_step": 295104, "epoch": 1756} {"train_loss": -11.82258415222168, "global_step": 295105, "epoch": 1756} {"train_loss": -11.91198444366455, "global_step": 295106, "epoch": 1756} {"train_loss": -12.300260543823242, "global_step": 295107, "epoch": 1756} {"train_loss": -12.252147674560547, "global_step": 295108, "epoch": 1756} {"train_loss": -12.059652328491211, "global_step": 295109, "epoch": 1756} {"train_loss": -12.155745506286621, "global_step": 295110, "epoch": 1756} {"train_loss": -11.890807151794434, "global_step": 295111, "epoch": 1756} {"train_loss": -11.785257339477539, "global_step": 295112, "epoch": 1756} {"train_loss": -12.060911178588867, "global_step": 295113, "epoch": 1756} {"train_loss": -12.287069320678711, "global_step": 295114, "epoch": 1756} {"train_loss": -11.964794158935547, "global_step": 295115, "epoch": 1756} {"train_loss": -12.150039672851562, "global_step": 295116, "epoch": 1756} {"train_loss": -11.753767013549805, "global_step": 295117, "epoch": 1756} {"train_loss": -12.332206726074219, "global_step": 295118, "epoch": 1756} {"train_loss": -11.73666000366211, "global_step": 295119, "epoch": 1756} {"train_loss": -12.068796157836914, "global_step": 295120, "epoch": 1756} {"train_loss": -12.113212585449219, "global_step": 295121, "epoch": 1756} {"train_loss": -12.258198738098145, "global_step": 295122, "epoch": 1756} {"train_loss": -11.582624435424805, "global_step": 295123, "epoch": 1756} {"train_loss": -11.760123252868652, "global_step": 295124, "epoch": 1756} {"train_loss": -11.859769821166992, "global_step": 295125, "epoch": 1756} {"train_loss": -12.019009590148926, "global_step": 295126, "epoch": 1756} {"train_loss": -11.932046890258789, "global_step": 295127, "epoch": 1756} {"train_loss": -11.865867614746094, "global_step": 295128, "epoch": 1756} {"train_loss": -12.176166534423828, "global_step": 295129, "epoch": 1756} {"train_loss": -11.82809829711914, "global_step": 295130, "epoch": 1756} {"train_loss": -11.708642959594727, "global_step": 295131, "epoch": 1756} {"train_loss": -11.420581817626953, "global_step": 295132, "epoch": 1756} {"train_loss": -11.15553092956543, "global_step": 295133, "epoch": 1756} {"train_loss": -12.154129028320312, "global_step": 295134, "epoch": 1756} {"train_loss": -11.365577697753906, "global_step": 295135, "epoch": 1756} {"train_loss": -12.015262603759766, "global_step": 295136, "epoch": 1756} {"train_loss": -11.604893684387207, "global_step": 295137, "epoch": 1756} {"train_loss": -11.951483726501465, "global_step": 295138, "epoch": 1756} {"train_loss": -12.384954452514648, "global_step": 295139, "epoch": 1756} {"train_loss": -11.782516479492188, "global_step": 295140, "epoch": 1756} {"train_loss": -11.857305526733398, "global_step": 295141, "epoch": 1756} {"train_loss": -12.168120384216309, "global_step": 295142, "epoch": 1756} {"train_loss": -10.734186172485352, "global_step": 295143, "epoch": 1756} {"train_loss": -10.408248901367188, "global_step": 295144, "epoch": 1756} {"train_loss": -11.052213668823242, "global_step": 295145, "epoch": 1756} {"train_loss": -11.984884262084961, "global_step": 295146, "epoch": 1756} {"train_loss": -11.693944931030273, "global_step": 295147, "epoch": 1756} {"train_loss": -11.37429141998291, "global_step": 295148, "epoch": 1756} {"train_loss": -11.588863372802734, "global_step": 295149, "epoch": 1756} {"train_loss": -10.137811660766602, "global_step": 295150, "epoch": 1756} {"train_loss": -11.91677474975586, "global_step": 295151, "epoch": 1756} {"train_loss": -10.382247924804688, "global_step": 295152, "epoch": 1756} {"train_loss": -11.244476318359375, "global_step": 295153, "epoch": 1756} {"train_loss": -10.49586296081543, "global_step": 295154, "epoch": 1756} {"train_loss": -10.843317985534668, "global_step": 295155, "epoch": 1756} {"train_loss": -11.616524696350098, "global_step": 295156, "epoch": 1756} {"train_loss": -10.591529846191406, "global_step": 295157, "epoch": 1756} {"train_loss": -10.828869819641113, "global_step": 295158, "epoch": 1756} {"train_loss": -10.527007102966309, "global_step": 295159, "epoch": 1756} {"train_loss": -11.807516098022461, "global_step": 295160, "epoch": 1756} {"train_loss": -10.755242347717285, "global_step": 295161, "epoch": 1756} {"train_loss": -10.986547470092773, "global_step": 295162, "epoch": 1756} {"train_loss": -10.95833683013916, "global_step": 295163, "epoch": 1756} {"train_loss": -10.93309497833252, "global_step": 295164, "epoch": 1756} {"train_loss": -10.837851524353027, "global_step": 295165, "epoch": 1756} {"train_loss": -10.533321380615234, "global_step": 295166, "epoch": 1756} {"train_loss": -11.70359992980957, "global_step": 295167, "epoch": 1756} {"train_loss": -10.110637664794922, "global_step": 295168, "epoch": 1756} {"train_loss": -11.177766799926758, "global_step": 295169, "epoch": 1756} {"train_loss": -11.171845436096191, "global_step": 295170, "epoch": 1756} {"train_loss": -11.252307891845703, "global_step": 295171, "epoch": 1756} {"train_loss": -11.866329193115234, "global_step": 295172, "epoch": 1756} {"train_loss": -11.204378128051758, "global_step": 295173, "epoch": 1756} {"train_loss": -11.704014778137207, "global_step": 295174, "epoch": 1756} {"train_loss": -11.769614764622279, "global_step": 295175, "epoch": 1756, "val_loss": 281838.46875} {"train_loss": -10.930347442626953, "global_step": 295176, "epoch": 1757} {"train_loss": -11.632768630981445, "global_step": 295177, "epoch": 1757} {"train_loss": -10.56693172454834, "global_step": 295178, "epoch": 1757} {"train_loss": -11.946486473083496, "global_step": 295179, "epoch": 1757} {"train_loss": -10.600156784057617, "global_step": 295180, "epoch": 1757} {"train_loss": -11.818437576293945, "global_step": 295181, "epoch": 1757} {"train_loss": -11.140728950500488, "global_step": 295182, "epoch": 1757} {"train_loss": -11.775971412658691, "global_step": 295183, "epoch": 1757} {"train_loss": -11.12535285949707, "global_step": 295184, "epoch": 1757} {"train_loss": -11.564793586730957, "global_step": 295185, "epoch": 1757} {"train_loss": -11.190055847167969, "global_step": 295186, "epoch": 1757} {"train_loss": -11.81607437133789, "global_step": 295187, "epoch": 1757} {"train_loss": -10.76717758178711, "global_step": 295188, "epoch": 1757} {"train_loss": -11.825292587280273, "global_step": 295189, "epoch": 1757} {"train_loss": -10.98194694519043, "global_step": 295190, "epoch": 1757} {"train_loss": -11.587576866149902, "global_step": 295191, "epoch": 1757} {"train_loss": -11.264191627502441, "global_step": 295192, "epoch": 1757} {"train_loss": -11.707368850708008, "global_step": 295193, "epoch": 1757} {"train_loss": -11.6680908203125, "global_step": 295194, "epoch": 1757} {"train_loss": -11.907683372497559, "global_step": 295195, "epoch": 1757} {"train_loss": -11.654739379882812, "global_step": 295196, "epoch": 1757} {"train_loss": -11.585041046142578, "global_step": 295197, "epoch": 1757} {"train_loss": -11.668521881103516, "global_step": 295198, "epoch": 1757} {"train_loss": -11.877671241760254, "global_step": 295199, "epoch": 1757} {"train_loss": -11.911828994750977, "global_step": 295200, "epoch": 1757} {"train_loss": -11.934257507324219, "global_step": 295201, "epoch": 1757} {"train_loss": -11.766501426696777, "global_step": 295202, "epoch": 1757} {"train_loss": -12.034948348999023, "global_step": 295203, "epoch": 1757} {"train_loss": -11.885361671447754, "global_step": 295204, "epoch": 1757} {"train_loss": -11.88286304473877, "global_step": 295205, "epoch": 1757} {"train_loss": -12.081830978393555, "global_step": 295206, "epoch": 1757} {"train_loss": -11.849660873413086, "global_step": 295207, "epoch": 1757} {"train_loss": -12.141220092773438, "global_step": 295208, "epoch": 1757} {"train_loss": -11.809017181396484, "global_step": 295209, "epoch": 1757} {"train_loss": -12.127466201782227, "global_step": 295210, "epoch": 1757} {"train_loss": -11.93925666809082, "global_step": 295211, "epoch": 1757} {"train_loss": -12.134471893310547, "global_step": 295212, "epoch": 1757} {"train_loss": -12.158702850341797, "global_step": 295213, "epoch": 1757} {"train_loss": -12.133376121520996, "global_step": 295214, "epoch": 1757} {"train_loss": -11.895051956176758, "global_step": 295215, "epoch": 1757} {"train_loss": -11.942534446716309, "global_step": 295216, "epoch": 1757} {"train_loss": -12.235307693481445, "global_step": 295217, "epoch": 1757} {"train_loss": -11.978278160095215, "global_step": 295218, "epoch": 1757} {"train_loss": -11.834728240966797, "global_step": 295219, "epoch": 1757} {"train_loss": -12.07847785949707, "global_step": 295220, "epoch": 1757} {"train_loss": -12.232696533203125, "global_step": 295221, "epoch": 1757} {"train_loss": -12.003325462341309, "global_step": 295222, "epoch": 1757} {"train_loss": -12.113582611083984, "global_step": 295223, "epoch": 1757} {"train_loss": -12.116703033447266, "global_step": 295224, "epoch": 1757} {"train_loss": -11.884540557861328, "global_step": 295225, "epoch": 1757} {"train_loss": -12.204888343811035, "global_step": 295226, "epoch": 1757} {"train_loss": -12.391741752624512, "global_step": 295227, "epoch": 1757} {"train_loss": -11.982101440429688, "global_step": 295228, "epoch": 1757} {"train_loss": -12.250753402709961, "global_step": 295229, "epoch": 1757} {"train_loss": -12.289424896240234, "global_step": 295230, "epoch": 1757} {"train_loss": -12.437743186950684, "global_step": 295231, "epoch": 1757} {"train_loss": -12.254183769226074, "global_step": 295232, "epoch": 1757} {"train_loss": -12.138235092163086, "global_step": 295233, "epoch": 1757} {"train_loss": -12.23080825805664, "global_step": 295234, "epoch": 1757} {"train_loss": -12.270005226135254, "global_step": 295235, "epoch": 1757} {"train_loss": -11.898091316223145, "global_step": 295236, "epoch": 1757} {"train_loss": -12.187965393066406, "global_step": 295237, "epoch": 1757} {"train_loss": -12.160194396972656, "global_step": 295238, "epoch": 1757} {"train_loss": -12.37314510345459, "global_step": 295239, "epoch": 1757} {"train_loss": -11.9091796875, "global_step": 295240, "epoch": 1757} {"train_loss": -12.261321067810059, "global_step": 295241, "epoch": 1757} {"train_loss": -12.166831016540527, "global_step": 295242, "epoch": 1757} {"train_loss": -11.85513687133789, "global_step": 295243, "epoch": 1757} {"train_loss": -11.840134620666504, "global_step": 295244, "epoch": 1757} {"train_loss": -12.158052444458008, "global_step": 295245, "epoch": 1757} {"train_loss": -11.843019485473633, "global_step": 295246, "epoch": 1757} {"train_loss": -12.15730094909668, "global_step": 295247, "epoch": 1757} {"train_loss": -11.958477020263672, "global_step": 295248, "epoch": 1757} {"train_loss": -11.873724937438965, "global_step": 295249, "epoch": 1757} {"train_loss": -12.375832557678223, "global_step": 295250, "epoch": 1757} {"train_loss": -12.407586097717285, "global_step": 295251, "epoch": 1757} {"train_loss": -12.303117752075195, "global_step": 295252, "epoch": 1757} {"train_loss": -12.246492385864258, "global_step": 295253, "epoch": 1757} {"train_loss": -12.236810684204102, "global_step": 295254, "epoch": 1757} {"train_loss": -12.25836181640625, "global_step": 295255, "epoch": 1757} {"train_loss": -12.141050338745117, "global_step": 295256, "epoch": 1757} {"train_loss": -12.350179672241211, "global_step": 295257, "epoch": 1757} {"train_loss": -12.448482513427734, "global_step": 295258, "epoch": 1757} {"train_loss": -12.294809341430664, "global_step": 295259, "epoch": 1757} {"train_loss": -12.280529975891113, "global_step": 295260, "epoch": 1757} {"train_loss": -12.522422790527344, "global_step": 295261, "epoch": 1757} {"train_loss": -12.329256057739258, "global_step": 295262, "epoch": 1757} {"train_loss": -12.5132417678833, "global_step": 295263, "epoch": 1757} {"train_loss": -12.36227798461914, "global_step": 295264, "epoch": 1757} {"train_loss": -12.238298416137695, "global_step": 295265, "epoch": 1757} {"train_loss": -12.383020401000977, "global_step": 295266, "epoch": 1757} {"train_loss": -12.154094696044922, "global_step": 295267, "epoch": 1757} {"train_loss": -12.405707359313965, "global_step": 295268, "epoch": 1757} {"train_loss": -12.277573585510254, "global_step": 295269, "epoch": 1757} {"train_loss": -12.28223991394043, "global_step": 295270, "epoch": 1757} {"train_loss": -12.66421890258789, "global_step": 295271, "epoch": 1757} {"train_loss": -12.518205642700195, "global_step": 295272, "epoch": 1757} {"train_loss": -12.385004997253418, "global_step": 295273, "epoch": 1757} {"train_loss": -12.611910820007324, "global_step": 295274, "epoch": 1757} {"train_loss": -12.418654441833496, "global_step": 295275, "epoch": 1757} {"train_loss": -12.460195541381836, "global_step": 295276, "epoch": 1757} {"train_loss": -12.401651382446289, "global_step": 295277, "epoch": 1757} {"train_loss": -12.273853302001953, "global_step": 295278, "epoch": 1757} {"train_loss": -12.472641944885254, "global_step": 295279, "epoch": 1757} {"train_loss": -12.498952865600586, "global_step": 295280, "epoch": 1757} {"train_loss": -12.339310646057129, "global_step": 295281, "epoch": 1757} {"train_loss": -12.555656433105469, "global_step": 295282, "epoch": 1757} {"train_loss": -12.066465377807617, "global_step": 295283, "epoch": 1757} {"train_loss": -12.012519836425781, "global_step": 295284, "epoch": 1757} {"train_loss": -12.077476501464844, "global_step": 295285, "epoch": 1757} {"train_loss": -12.15542221069336, "global_step": 295286, "epoch": 1757} {"train_loss": -12.226909637451172, "global_step": 295287, "epoch": 1757} {"train_loss": -11.784688949584961, "global_step": 295288, "epoch": 1757} {"train_loss": -12.129310607910156, "global_step": 295289, "epoch": 1757} {"train_loss": -11.654212951660156, "global_step": 295290, "epoch": 1757} {"train_loss": -11.57225227355957, "global_step": 295291, "epoch": 1757} {"train_loss": -11.732149124145508, "global_step": 295292, "epoch": 1757} {"train_loss": -12.258471488952637, "global_step": 295293, "epoch": 1757} {"train_loss": -12.037452697753906, "global_step": 295294, "epoch": 1757} {"train_loss": -11.447772979736328, "global_step": 295295, "epoch": 1757} {"train_loss": -8.843334197998047, "global_step": 295296, "epoch": 1757} {"train_loss": -9.596832275390625, "global_step": 295297, "epoch": 1757} {"train_loss": -11.560640335083008, "global_step": 295298, "epoch": 1757} {"train_loss": -9.281692504882812, "global_step": 295299, "epoch": 1757} {"train_loss": -10.423494338989258, "global_step": 295300, "epoch": 1757} {"train_loss": -10.371850967407227, "global_step": 295301, "epoch": 1757} {"train_loss": -7.865818023681641, "global_step": 295302, "epoch": 1757} {"train_loss": -9.041181564331055, "global_step": 295303, "epoch": 1757} {"train_loss": -9.292922019958496, "global_step": 295304, "epoch": 1757} {"train_loss": -7.479702949523926, "global_step": 295305, "epoch": 1757} {"train_loss": -8.943338394165039, "global_step": 295306, "epoch": 1757} {"train_loss": -8.310583114624023, "global_step": 295307, "epoch": 1757} {"train_loss": -10.359294891357422, "global_step": 295308, "epoch": 1757} {"train_loss": -10.303452491760254, "global_step": 295309, "epoch": 1757} {"train_loss": -8.60664176940918, "global_step": 295310, "epoch": 1757} {"train_loss": -9.184894561767578, "global_step": 295311, "epoch": 1757} {"train_loss": -9.428390502929688, "global_step": 295312, "epoch": 1757} {"train_loss": -11.024840354919434, "global_step": 295313, "epoch": 1757} {"train_loss": -10.306355476379395, "global_step": 295314, "epoch": 1757} {"train_loss": -10.880938529968262, "global_step": 295315, "epoch": 1757} {"train_loss": -10.550792694091797, "global_step": 295316, "epoch": 1757} {"train_loss": -11.327494621276855, "global_step": 295317, "epoch": 1757} {"train_loss": -10.076190948486328, "global_step": 295318, "epoch": 1757} {"train_loss": -11.280665397644043, "global_step": 295319, "epoch": 1757} {"train_loss": -10.270217895507812, "global_step": 295320, "epoch": 1757} {"train_loss": -11.606573104858398, "global_step": 295321, "epoch": 1757} {"train_loss": -9.907938003540039, "global_step": 295322, "epoch": 1757} {"train_loss": -11.297029495239258, "global_step": 295323, "epoch": 1757} {"train_loss": -10.2706880569458, "global_step": 295324, "epoch": 1757} {"train_loss": -11.643804550170898, "global_step": 295325, "epoch": 1757} {"train_loss": -10.327417373657227, "global_step": 295326, "epoch": 1757} {"train_loss": -11.096378326416016, "global_step": 295327, "epoch": 1757} {"train_loss": -10.401113510131836, "global_step": 295328, "epoch": 1757} {"train_loss": -11.011958122253418, "global_step": 295329, "epoch": 1757} {"train_loss": -11.129118919372559, "global_step": 295330, "epoch": 1757} {"train_loss": -11.231531143188477, "global_step": 295331, "epoch": 1757} {"train_loss": -10.795537948608398, "global_step": 295332, "epoch": 1757} {"train_loss": -11.398618698120117, "global_step": 295333, "epoch": 1757} {"train_loss": -11.045234680175781, "global_step": 295334, "epoch": 1757} {"train_loss": -11.50314712524414, "global_step": 295335, "epoch": 1757} {"train_loss": -11.568437576293945, "global_step": 295336, "epoch": 1757} {"train_loss": -11.699689865112305, "global_step": 295337, "epoch": 1757} {"train_loss": -11.541648864746094, "global_step": 295338, "epoch": 1757} {"train_loss": -11.746623992919922, "global_step": 295339, "epoch": 1757} {"train_loss": -11.297821998596191, "global_step": 295340, "epoch": 1757} {"train_loss": -11.553038597106934, "global_step": 295341, "epoch": 1757} {"train_loss": -11.634273529052734, "global_step": 295342, "epoch": 1757} {"train_loss": -11.56618393035162, "global_step": 295343, "epoch": 1757, "val_loss": 279919.53125} {"train_loss": -11.810934066772461, "global_step": 295344, "epoch": 1758} {"train_loss": -11.474459648132324, "global_step": 295345, "epoch": 1758} {"train_loss": -12.055635452270508, "global_step": 295346, "epoch": 1758} {"train_loss": -11.524152755737305, "global_step": 295347, "epoch": 1758} {"train_loss": -11.548507690429688, "global_step": 295348, "epoch": 1758} {"train_loss": -11.292110443115234, "global_step": 295349, "epoch": 1758} {"train_loss": -11.695842742919922, "global_step": 295350, "epoch": 1758} {"train_loss": -11.436960220336914, "global_step": 295351, "epoch": 1758} {"train_loss": -11.742183685302734, "global_step": 295352, "epoch": 1758} {"train_loss": -11.714285850524902, "global_step": 295353, "epoch": 1758} {"train_loss": -11.372529029846191, "global_step": 295354, "epoch": 1758} {"train_loss": -11.930081367492676, "global_step": 295355, "epoch": 1758} {"train_loss": -11.545368194580078, "global_step": 295356, "epoch": 1758} {"train_loss": -11.655457496643066, "global_step": 295357, "epoch": 1758} {"train_loss": -11.928546905517578, "global_step": 295358, "epoch": 1758} {"train_loss": -11.633201599121094, "global_step": 295359, "epoch": 1758} {"train_loss": -11.804719924926758, "global_step": 295360, "epoch": 1758} {"train_loss": -11.673928260803223, "global_step": 295361, "epoch": 1758} {"train_loss": -11.893564224243164, "global_step": 295362, "epoch": 1758} {"train_loss": -11.982597351074219, "global_step": 295363, "epoch": 1758} {"train_loss": -11.806087493896484, "global_step": 295364, "epoch": 1758} {"train_loss": -11.943148612976074, "global_step": 295365, "epoch": 1758} {"train_loss": -11.770533561706543, "global_step": 295366, "epoch": 1758} {"train_loss": -12.099783897399902, "global_step": 295367, "epoch": 1758} {"train_loss": -11.726724624633789, "global_step": 295368, "epoch": 1758} {"train_loss": -11.943562507629395, "global_step": 295369, "epoch": 1758} {"train_loss": -11.948394775390625, "global_step": 295370, "epoch": 1758} {"train_loss": -12.230481147766113, "global_step": 295371, "epoch": 1758} {"train_loss": -12.029550552368164, "global_step": 295372, "epoch": 1758} {"train_loss": -11.867427825927734, "global_step": 295373, "epoch": 1758} {"train_loss": -12.30430793762207, "global_step": 295374, "epoch": 1758} {"train_loss": -11.959402084350586, "global_step": 295375, "epoch": 1758} {"train_loss": -12.095315933227539, "global_step": 295376, "epoch": 1758} {"train_loss": -11.855537414550781, "global_step": 295377, "epoch": 1758} {"train_loss": -11.82162094116211, "global_step": 295378, "epoch": 1758} {"train_loss": -12.12938117980957, "global_step": 295379, "epoch": 1758} {"train_loss": -11.799938201904297, "global_step": 295380, "epoch": 1758} {"train_loss": -12.012945175170898, "global_step": 295381, "epoch": 1758} {"train_loss": -12.104833602905273, "global_step": 295382, "epoch": 1758} {"train_loss": -12.000739097595215, "global_step": 295383, "epoch": 1758} {"train_loss": -12.021464347839355, "global_step": 295384, "epoch": 1758} {"train_loss": -12.010171890258789, "global_step": 295385, "epoch": 1758} {"train_loss": -12.00054931640625, "global_step": 295386, "epoch": 1758} {"train_loss": -12.17695426940918, "global_step": 295387, "epoch": 1758} {"train_loss": -12.20172119140625, "global_step": 295388, "epoch": 1758} {"train_loss": -12.179632186889648, "global_step": 295389, "epoch": 1758} {"train_loss": -12.027660369873047, "global_step": 295390, "epoch": 1758} {"train_loss": -12.052396774291992, "global_step": 295391, "epoch": 1758} {"train_loss": -12.334423065185547, "global_step": 295392, "epoch": 1758} {"train_loss": -11.919816970825195, "global_step": 295393, "epoch": 1758} {"train_loss": -11.981586456298828, "global_step": 295394, "epoch": 1758} {"train_loss": -12.07620620727539, "global_step": 295395, "epoch": 1758} {"train_loss": -12.061264991760254, "global_step": 295396, "epoch": 1758} {"train_loss": -12.012018203735352, "global_step": 295397, "epoch": 1758} {"train_loss": -12.325111389160156, "global_step": 295398, "epoch": 1758} {"train_loss": -12.004158020019531, "global_step": 295399, "epoch": 1758} {"train_loss": -12.064201354980469, "global_step": 295400, "epoch": 1758} {"train_loss": -12.19620418548584, "global_step": 295401, "epoch": 1758} {"train_loss": -12.022714614868164, "global_step": 295402, "epoch": 1758} {"train_loss": -12.246767044067383, "global_step": 295403, "epoch": 1758} {"train_loss": -12.17129898071289, "global_step": 295404, "epoch": 1758} {"train_loss": -11.87080192565918, "global_step": 295405, "epoch": 1758} {"train_loss": -11.693267822265625, "global_step": 295406, "epoch": 1758} {"train_loss": -10.211943626403809, "global_step": 295407, "epoch": 1758} {"train_loss": -11.388711929321289, "global_step": 295408, "epoch": 1758} {"train_loss": -11.460342407226562, "global_step": 295409, "epoch": 1758} {"train_loss": -11.601181030273438, "global_step": 295410, "epoch": 1758} {"train_loss": -10.932877540588379, "global_step": 295411, "epoch": 1758} {"train_loss": -11.926061630249023, "global_step": 295412, "epoch": 1758} {"train_loss": -10.770227432250977, "global_step": 295413, "epoch": 1758} {"train_loss": -11.190088272094727, "global_step": 295414, "epoch": 1758} {"train_loss": -11.871180534362793, "global_step": 295415, "epoch": 1758} {"train_loss": -11.869897842407227, "global_step": 295416, "epoch": 1758} {"train_loss": -10.692977905273438, "global_step": 295417, "epoch": 1758} {"train_loss": -11.591434478759766, "global_step": 295418, "epoch": 1758} {"train_loss": -11.842304229736328, "global_step": 295419, "epoch": 1758} {"train_loss": -10.508291244506836, "global_step": 295420, "epoch": 1758} {"train_loss": -11.453411102294922, "global_step": 295421, "epoch": 1758} {"train_loss": -11.348217010498047, "global_step": 295422, "epoch": 1758} {"train_loss": -10.595963478088379, "global_step": 295423, "epoch": 1758} {"train_loss": -11.924711227416992, "global_step": 295424, "epoch": 1758} {"train_loss": -11.042322158813477, "global_step": 295425, "epoch": 1758} {"train_loss": -11.04493522644043, "global_step": 295426, "epoch": 1758} {"train_loss": -11.047643661499023, "global_step": 295427, "epoch": 1758} {"train_loss": -10.662094116210938, "global_step": 295428, "epoch": 1758} {"train_loss": -11.877023696899414, "global_step": 295429, "epoch": 1758} {"train_loss": -11.016359329223633, "global_step": 295430, "epoch": 1758} {"train_loss": -10.67617130279541, "global_step": 295431, "epoch": 1758} {"train_loss": -11.64401626586914, "global_step": 295432, "epoch": 1758} {"train_loss": -11.000033378601074, "global_step": 295433, "epoch": 1758} {"train_loss": -11.580568313598633, "global_step": 295434, "epoch": 1758} {"train_loss": -10.811975479125977, "global_step": 295435, "epoch": 1758} {"train_loss": -11.87513542175293, "global_step": 295436, "epoch": 1758} {"train_loss": -11.547113418579102, "global_step": 295437, "epoch": 1758} {"train_loss": -11.318132400512695, "global_step": 295438, "epoch": 1758} {"train_loss": -11.345185279846191, "global_step": 295439, "epoch": 1758} {"train_loss": -11.026676177978516, "global_step": 295440, "epoch": 1758} {"train_loss": -11.723177909851074, "global_step": 295441, "epoch": 1758} {"train_loss": -11.530590057373047, "global_step": 295442, "epoch": 1758} {"train_loss": -11.653839111328125, "global_step": 295443, "epoch": 1758} {"train_loss": -11.843545913696289, "global_step": 295444, "epoch": 1758} {"train_loss": -11.901817321777344, "global_step": 295445, "epoch": 1758} {"train_loss": -11.870147705078125, "global_step": 295446, "epoch": 1758} {"train_loss": -12.012441635131836, "global_step": 295447, "epoch": 1758} {"train_loss": -12.010414123535156, "global_step": 295448, "epoch": 1758} {"train_loss": -11.827913284301758, "global_step": 295449, "epoch": 1758} {"train_loss": -12.199851989746094, "global_step": 295450, "epoch": 1758} {"train_loss": -12.097153663635254, "global_step": 295451, "epoch": 1758} {"train_loss": -12.054335594177246, "global_step": 295452, "epoch": 1758} {"train_loss": -11.953798294067383, "global_step": 295453, "epoch": 1758} {"train_loss": -12.103384017944336, "global_step": 295454, "epoch": 1758} {"train_loss": -11.854156494140625, "global_step": 295455, "epoch": 1758} {"train_loss": -12.062681198120117, "global_step": 295456, "epoch": 1758} {"train_loss": -12.15929126739502, "global_step": 295457, "epoch": 1758} {"train_loss": -12.195627212524414, "global_step": 295458, "epoch": 1758} {"train_loss": -12.08201789855957, "global_step": 295459, "epoch": 1758} {"train_loss": -12.080232620239258, "global_step": 295460, "epoch": 1758} {"train_loss": -11.921987533569336, "global_step": 295461, "epoch": 1758} {"train_loss": -12.215473175048828, "global_step": 295462, "epoch": 1758} {"train_loss": -12.258594512939453, "global_step": 295463, "epoch": 1758} {"train_loss": -12.058645248413086, "global_step": 295464, "epoch": 1758} {"train_loss": -12.139114379882812, "global_step": 295465, "epoch": 1758} {"train_loss": -11.821844100952148, "global_step": 295466, "epoch": 1758} {"train_loss": -12.291257858276367, "global_step": 295467, "epoch": 1758} {"train_loss": -11.981790542602539, "global_step": 295468, "epoch": 1758} {"train_loss": -11.906137466430664, "global_step": 295469, "epoch": 1758} {"train_loss": -12.13616943359375, "global_step": 295470, "epoch": 1758} {"train_loss": -12.146541595458984, "global_step": 295471, "epoch": 1758} {"train_loss": -12.138912200927734, "global_step": 295472, "epoch": 1758} {"train_loss": -12.047743797302246, "global_step": 295473, "epoch": 1758} {"train_loss": -12.159496307373047, "global_step": 295474, "epoch": 1758} {"train_loss": -12.189205169677734, "global_step": 295475, "epoch": 1758} {"train_loss": -12.125885963439941, "global_step": 295476, "epoch": 1758} {"train_loss": -12.049687385559082, "global_step": 295477, "epoch": 1758} {"train_loss": -12.055728912353516, "global_step": 295478, "epoch": 1758} {"train_loss": -12.032889366149902, "global_step": 295479, "epoch": 1758} {"train_loss": -12.131351470947266, "global_step": 295480, "epoch": 1758} {"train_loss": -12.131714820861816, "global_step": 295481, "epoch": 1758} {"train_loss": -12.182828903198242, "global_step": 295482, "epoch": 1758} {"train_loss": -12.061912536621094, "global_step": 295483, "epoch": 1758} {"train_loss": -12.114337921142578, "global_step": 295484, "epoch": 1758} {"train_loss": -12.271839141845703, "global_step": 295485, "epoch": 1758} {"train_loss": -12.042739868164062, "global_step": 295486, "epoch": 1758} {"train_loss": -12.262921333312988, "global_step": 295487, "epoch": 1758} {"train_loss": -12.378124237060547, "global_step": 295488, "epoch": 1758} {"train_loss": -12.174454689025879, "global_step": 295489, "epoch": 1758} {"train_loss": -11.979764938354492, "global_step": 295490, "epoch": 1758} {"train_loss": -12.376436233520508, "global_step": 295491, "epoch": 1758} {"train_loss": -12.267030715942383, "global_step": 295492, "epoch": 1758} {"train_loss": -12.337413787841797, "global_step": 295493, "epoch": 1758} {"train_loss": -12.009149551391602, "global_step": 295494, "epoch": 1758} {"train_loss": -12.482197761535645, "global_step": 295495, "epoch": 1758} {"train_loss": -12.366369247436523, "global_step": 295496, "epoch": 1758} {"train_loss": -12.255514144897461, "global_step": 295497, "epoch": 1758} {"train_loss": -12.445056915283203, "global_step": 295498, "epoch": 1758} {"train_loss": -12.4243803024292, "global_step": 295499, "epoch": 1758} {"train_loss": -11.61742115020752, "global_step": 295500, "epoch": 1758} {"train_loss": -12.33676528930664, "global_step": 295501, "epoch": 1758} {"train_loss": -12.032403945922852, "global_step": 295502, "epoch": 1758} {"train_loss": -12.158303260803223, "global_step": 295503, "epoch": 1758} {"train_loss": -12.227935791015625, "global_step": 295504, "epoch": 1758} {"train_loss": -11.3047456741333, "global_step": 295505, "epoch": 1758} {"train_loss": -11.586715698242188, "global_step": 295506, "epoch": 1758} {"train_loss": -12.45345687866211, "global_step": 295507, "epoch": 1758} {"train_loss": -11.975556373596191, "global_step": 295508, "epoch": 1758} {"train_loss": -11.843177795410156, "global_step": 295509, "epoch": 1758} {"train_loss": -12.353343963623047, "global_step": 295510, "epoch": 1758} {"train_loss": -11.850492108435859, "global_step": 295511, "epoch": 1758, "val_loss": 281245.28125} {"train_loss": -11.73869514465332, "global_step": 295512, "epoch": 1759} {"train_loss": -12.286357879638672, "global_step": 295513, "epoch": 1759} {"train_loss": -11.492722511291504, "global_step": 295514, "epoch": 1759} {"train_loss": -11.473252296447754, "global_step": 295515, "epoch": 1759} {"train_loss": -12.011449813842773, "global_step": 295516, "epoch": 1759} {"train_loss": -9.547830581665039, "global_step": 295517, "epoch": 1759} {"train_loss": -9.626436233520508, "global_step": 295518, "epoch": 1759} {"train_loss": -9.121110916137695, "global_step": 295519, "epoch": 1759} {"train_loss": -11.054826736450195, "global_step": 295520, "epoch": 1759} {"train_loss": -9.635607719421387, "global_step": 295521, "epoch": 1759} {"train_loss": -9.684957504272461, "global_step": 295522, "epoch": 1759} {"train_loss": -9.296100616455078, "global_step": 295523, "epoch": 1759} {"train_loss": -8.563546180725098, "global_step": 295524, "epoch": 1759} {"train_loss": -6.771096229553223, "global_step": 295525, "epoch": 1759} {"train_loss": -8.99666690826416, "global_step": 295526, "epoch": 1759} {"train_loss": -9.022018432617188, "global_step": 295527, "epoch": 1759} {"train_loss": -9.20991325378418, "global_step": 295528, "epoch": 1759} {"train_loss": -9.29700756072998, "global_step": 295529, "epoch": 1759} {"train_loss": -7.821969985961914, "global_step": 295530, "epoch": 1759} {"train_loss": -9.766489028930664, "global_step": 295531, "epoch": 1759} {"train_loss": -10.415684700012207, "global_step": 295532, "epoch": 1759} {"train_loss": -10.389780044555664, "global_step": 295533, "epoch": 1759} {"train_loss": -10.621706008911133, "global_step": 295534, "epoch": 1759} {"train_loss": -10.968299865722656, "global_step": 295535, "epoch": 1759} {"train_loss": -10.699175834655762, "global_step": 295536, "epoch": 1759} {"train_loss": -11.712308883666992, "global_step": 295537, "epoch": 1759} {"train_loss": -10.50863265991211, "global_step": 295538, "epoch": 1759} {"train_loss": -11.31159782409668, "global_step": 295539, "epoch": 1759} {"train_loss": -11.122146606445312, "global_step": 295540, "epoch": 1759} {"train_loss": -11.377908706665039, "global_step": 295541, "epoch": 1759} {"train_loss": -11.176261901855469, "global_step": 295542, "epoch": 1759} {"train_loss": -11.242008209228516, "global_step": 295543, "epoch": 1759} {"train_loss": -11.392093658447266, "global_step": 295544, "epoch": 1759} {"train_loss": -11.368062019348145, "global_step": 295545, "epoch": 1759} {"train_loss": -11.645332336425781, "global_step": 295546, "epoch": 1759} {"train_loss": -11.2315673828125, "global_step": 295547, "epoch": 1759} {"train_loss": -11.274711608886719, "global_step": 295548, "epoch": 1759} {"train_loss": -11.479132652282715, "global_step": 295549, "epoch": 1759} {"train_loss": -11.205185890197754, "global_step": 295550, "epoch": 1759} {"train_loss": -11.602895736694336, "global_step": 295551, "epoch": 1759} {"train_loss": -11.53463363647461, "global_step": 295552, "epoch": 1759} {"train_loss": -11.617413520812988, "global_step": 295553, "epoch": 1759} {"train_loss": -11.58482837677002, "global_step": 295554, "epoch": 1759} {"train_loss": -11.629135131835938, "global_step": 295555, "epoch": 1759} {"train_loss": -11.416069030761719, "global_step": 295556, "epoch": 1759} {"train_loss": -11.728772163391113, "global_step": 295557, "epoch": 1759} {"train_loss": -11.796085357666016, "global_step": 295558, "epoch": 1759} {"train_loss": -11.718663215637207, "global_step": 295559, "epoch": 1759} {"train_loss": -11.50670051574707, "global_step": 295560, "epoch": 1759} {"train_loss": -11.825817108154297, "global_step": 295561, "epoch": 1759} {"train_loss": -11.659280776977539, "global_step": 295562, "epoch": 1759} {"train_loss": -11.86699104309082, "global_step": 295563, "epoch": 1759} {"train_loss": -11.59608268737793, "global_step": 295564, "epoch": 1759} {"train_loss": -11.766934394836426, "global_step": 295565, "epoch": 1759} {"train_loss": -11.895841598510742, "global_step": 295566, "epoch": 1759} {"train_loss": -11.961483001708984, "global_step": 295567, "epoch": 1759} {"train_loss": -11.939847946166992, "global_step": 295568, "epoch": 1759} {"train_loss": -11.796178817749023, "global_step": 295569, "epoch": 1759} {"train_loss": -12.11130142211914, "global_step": 295570, "epoch": 1759} {"train_loss": -11.989387512207031, "global_step": 295571, "epoch": 1759} {"train_loss": -11.704965591430664, "global_step": 295572, "epoch": 1759} {"train_loss": -12.00465202331543, "global_step": 295573, "epoch": 1759} {"train_loss": -11.857222557067871, "global_step": 295574, "epoch": 1759} {"train_loss": -12.055292129516602, "global_step": 295575, "epoch": 1759} {"train_loss": -11.562084197998047, "global_step": 295576, "epoch": 1759} {"train_loss": -11.941637992858887, "global_step": 295577, "epoch": 1759} {"train_loss": -11.725909233093262, "global_step": 295578, "epoch": 1759} {"train_loss": -11.76573371887207, "global_step": 295579, "epoch": 1759} {"train_loss": -11.708860397338867, "global_step": 295580, "epoch": 1759} {"train_loss": -11.8662748336792, "global_step": 295581, "epoch": 1759} {"train_loss": -11.010943412780762, "global_step": 295582, "epoch": 1759} {"train_loss": -11.819305419921875, "global_step": 295583, "epoch": 1759} {"train_loss": -11.135098457336426, "global_step": 295584, "epoch": 1759} {"train_loss": -11.336639404296875, "global_step": 295585, "epoch": 1759} {"train_loss": -11.534943580627441, "global_step": 295586, "epoch": 1759} {"train_loss": -11.563926696777344, "global_step": 295587, "epoch": 1759} {"train_loss": -11.979372024536133, "global_step": 295588, "epoch": 1759} {"train_loss": -11.441442489624023, "global_step": 295589, "epoch": 1759} {"train_loss": -12.352933883666992, "global_step": 295590, "epoch": 1759} {"train_loss": -11.431428909301758, "global_step": 295591, "epoch": 1759} {"train_loss": -11.477399826049805, "global_step": 295592, "epoch": 1759} {"train_loss": -12.06764030456543, "global_step": 295593, "epoch": 1759} {"train_loss": -11.680564880371094, "global_step": 295594, "epoch": 1759} {"train_loss": -12.067901611328125, "global_step": 295595, "epoch": 1759} {"train_loss": -11.765528678894043, "global_step": 295596, "epoch": 1759} {"train_loss": -11.636150360107422, "global_step": 295597, "epoch": 1759} {"train_loss": -11.855725288391113, "global_step": 295598, "epoch": 1759} {"train_loss": -11.771608352661133, "global_step": 295599, "epoch": 1759} {"train_loss": -11.514261245727539, "global_step": 295600, "epoch": 1759} {"train_loss": -11.910318374633789, "global_step": 295601, "epoch": 1759} {"train_loss": -11.174034118652344, "global_step": 295602, "epoch": 1759} {"train_loss": -12.047653198242188, "global_step": 295603, "epoch": 1759} {"train_loss": -11.428006172180176, "global_step": 295604, "epoch": 1759} {"train_loss": -11.723560333251953, "global_step": 295605, "epoch": 1759} {"train_loss": -12.171281814575195, "global_step": 295606, "epoch": 1759} {"train_loss": -11.753730773925781, "global_step": 295607, "epoch": 1759} {"train_loss": -11.89550495147705, "global_step": 295608, "epoch": 1759} {"train_loss": -11.892425537109375, "global_step": 295609, "epoch": 1759} {"train_loss": -12.110570907592773, "global_step": 295610, "epoch": 1759} {"train_loss": -12.033392906188965, "global_step": 295611, "epoch": 1759} {"train_loss": -12.104476928710938, "global_step": 295612, "epoch": 1759} {"train_loss": -12.03514289855957, "global_step": 295613, "epoch": 1759} {"train_loss": -11.89657211303711, "global_step": 295614, "epoch": 1759} {"train_loss": -12.120477676391602, "global_step": 295615, "epoch": 1759} {"train_loss": -12.058984756469727, "global_step": 295616, "epoch": 1759} {"train_loss": -12.134075164794922, "global_step": 295617, "epoch": 1759} {"train_loss": -12.01535415649414, "global_step": 295618, "epoch": 1759} {"train_loss": -11.998727798461914, "global_step": 295619, "epoch": 1759} {"train_loss": -12.175037384033203, "global_step": 295620, "epoch": 1759} {"train_loss": -12.125024795532227, "global_step": 295621, "epoch": 1759} {"train_loss": -11.814008712768555, "global_step": 295622, "epoch": 1759} {"train_loss": -12.220702171325684, "global_step": 295623, "epoch": 1759} {"train_loss": -11.797374725341797, "global_step": 295624, "epoch": 1759} {"train_loss": -12.382179260253906, "global_step": 295625, "epoch": 1759} {"train_loss": -12.008207321166992, "global_step": 295626, "epoch": 1759} {"train_loss": -12.023242950439453, "global_step": 295627, "epoch": 1759} {"train_loss": -12.178886413574219, "global_step": 295628, "epoch": 1759} {"train_loss": -12.088279724121094, "global_step": 295629, "epoch": 1759} {"train_loss": -12.066118240356445, "global_step": 295630, "epoch": 1759} {"train_loss": -12.203079223632812, "global_step": 295631, "epoch": 1759} {"train_loss": -12.189774513244629, "global_step": 295632, "epoch": 1759} {"train_loss": -12.099212646484375, "global_step": 295633, "epoch": 1759} {"train_loss": -12.305855751037598, "global_step": 295634, "epoch": 1759} {"train_loss": -11.906181335449219, "global_step": 295635, "epoch": 1759} {"train_loss": -12.135054588317871, "global_step": 295636, "epoch": 1759} {"train_loss": -12.068578720092773, "global_step": 295637, "epoch": 1759} {"train_loss": -12.124632835388184, "global_step": 295638, "epoch": 1759} {"train_loss": -12.235416412353516, "global_step": 295639, "epoch": 1759} {"train_loss": -12.004769325256348, "global_step": 295640, "epoch": 1759} {"train_loss": -12.282319068908691, "global_step": 295641, "epoch": 1759} {"train_loss": -11.967950820922852, "global_step": 295642, "epoch": 1759} {"train_loss": -12.252283096313477, "global_step": 295643, "epoch": 1759} {"train_loss": -12.027241706848145, "global_step": 295644, "epoch": 1759} {"train_loss": -12.347685813903809, "global_step": 295645, "epoch": 1759} {"train_loss": -11.836594581604004, "global_step": 295646, "epoch": 1759} {"train_loss": -11.84353256225586, "global_step": 295647, "epoch": 1759} {"train_loss": -12.292156219482422, "global_step": 295648, "epoch": 1759} {"train_loss": -12.04101276397705, "global_step": 295649, "epoch": 1759} {"train_loss": -11.956616401672363, "global_step": 295650, "epoch": 1759} {"train_loss": -12.07007122039795, "global_step": 295651, "epoch": 1759} {"train_loss": -11.988137245178223, "global_step": 295652, "epoch": 1759} {"train_loss": -11.812135696411133, "global_step": 295653, "epoch": 1759} {"train_loss": -11.67074203491211, "global_step": 295654, "epoch": 1759} {"train_loss": -11.442256927490234, "global_step": 295655, "epoch": 1759} {"train_loss": -11.91645622253418, "global_step": 295656, "epoch": 1759} {"train_loss": -11.925894737243652, "global_step": 295657, "epoch": 1759} {"train_loss": -11.169198989868164, "global_step": 295658, "epoch": 1759} {"train_loss": -11.801162719726562, "global_step": 295659, "epoch": 1759} {"train_loss": -11.239580154418945, "global_step": 295660, "epoch": 1759} {"train_loss": -12.040627479553223, "global_step": 295661, "epoch": 1759} {"train_loss": -10.77338695526123, "global_step": 295662, "epoch": 1759} {"train_loss": -11.513973236083984, "global_step": 295663, "epoch": 1759} {"train_loss": -10.882965087890625, "global_step": 295664, "epoch": 1759} {"train_loss": -10.167680740356445, "global_step": 295665, "epoch": 1759} {"train_loss": -9.442644119262695, "global_step": 295666, "epoch": 1759} {"train_loss": -10.76048469543457, "global_step": 295667, "epoch": 1759} {"train_loss": -10.33726692199707, "global_step": 295668, "epoch": 1759} {"train_loss": -8.641189575195312, "global_step": 295669, "epoch": 1759} {"train_loss": -9.69991683959961, "global_step": 295670, "epoch": 1759} {"train_loss": -10.916055679321289, "global_step": 295671, "epoch": 1759} {"train_loss": -9.649133682250977, "global_step": 295672, "epoch": 1759} {"train_loss": -11.195841789245605, "global_step": 295673, "epoch": 1759} {"train_loss": -10.614161491394043, "global_step": 295674, "epoch": 1759} {"train_loss": -10.49509048461914, "global_step": 295675, "epoch": 1759} {"train_loss": -11.122777938842773, "global_step": 295676, "epoch": 1759} {"train_loss": -10.273969650268555, "global_step": 295677, "epoch": 1759} {"train_loss": -10.51321792602539, "global_step": 295678, "epoch": 1759} {"train_loss": -11.379666952859788, "global_step": 295679, "epoch": 1759, "val_loss": 269757.375} {"train_loss": -9.062549591064453, "global_step": 295680, "epoch": 1760} {"train_loss": -10.782440185546875, "global_step": 295681, "epoch": 1760} {"train_loss": -9.990947723388672, "global_step": 295682, "epoch": 1760} {"train_loss": -10.263580322265625, "global_step": 295683, "epoch": 1760} {"train_loss": -10.226486206054688, "global_step": 295684, "epoch": 1760} {"train_loss": -10.185813903808594, "global_step": 295685, "epoch": 1760} {"train_loss": -10.718399047851562, "global_step": 295686, "epoch": 1760} {"train_loss": -11.618959426879883, "global_step": 295687, "epoch": 1760} {"train_loss": -10.949332237243652, "global_step": 295688, "epoch": 1760} {"train_loss": -10.913963317871094, "global_step": 295689, "epoch": 1760} {"train_loss": -11.48194694519043, "global_step": 295690, "epoch": 1760} {"train_loss": -11.110669136047363, "global_step": 295691, "epoch": 1760} {"train_loss": -11.10067081451416, "global_step": 295692, "epoch": 1760} {"train_loss": -11.47627067565918, "global_step": 295693, "epoch": 1760} {"train_loss": -11.001501083374023, "global_step": 295694, "epoch": 1760} {"train_loss": -11.622899055480957, "global_step": 295695, "epoch": 1760} {"train_loss": -11.85241413116455, "global_step": 295696, "epoch": 1760} {"train_loss": -11.29306411743164, "global_step": 295697, "epoch": 1760} {"train_loss": -11.487014770507812, "global_step": 295698, "epoch": 1760} {"train_loss": -11.548391342163086, "global_step": 295699, "epoch": 1760} {"train_loss": -11.452985763549805, "global_step": 295700, "epoch": 1760} {"train_loss": -11.848346710205078, "global_step": 295701, "epoch": 1760} {"train_loss": -11.787226676940918, "global_step": 295702, "epoch": 1760} {"train_loss": -11.682427406311035, "global_step": 295703, "epoch": 1760} {"train_loss": -11.783428192138672, "global_step": 295704, "epoch": 1760} {"train_loss": -11.622703552246094, "global_step": 295705, "epoch": 1760} {"train_loss": -11.938325881958008, "global_step": 295706, "epoch": 1760} {"train_loss": -11.531768798828125, "global_step": 295707, "epoch": 1760} {"train_loss": -11.92768383026123, "global_step": 295708, "epoch": 1760} {"train_loss": -11.721052169799805, "global_step": 295709, "epoch": 1760} {"train_loss": -11.929802894592285, "global_step": 295710, "epoch": 1760} {"train_loss": -11.912500381469727, "global_step": 295711, "epoch": 1760} {"train_loss": -11.861482620239258, "global_step": 295712, "epoch": 1760} {"train_loss": -11.857112884521484, "global_step": 295713, "epoch": 1760} {"train_loss": -12.148402214050293, "global_step": 295714, "epoch": 1760} {"train_loss": -11.963241577148438, "global_step": 295715, "epoch": 1760} {"train_loss": -12.121838569641113, "global_step": 295716, "epoch": 1760} {"train_loss": -11.785109519958496, "global_step": 295717, "epoch": 1760} {"train_loss": -11.980730056762695, "global_step": 295718, "epoch": 1760} {"train_loss": -11.874449729919434, "global_step": 295719, "epoch": 1760} {"train_loss": -12.005200386047363, "global_step": 295720, "epoch": 1760} {"train_loss": -12.002206802368164, "global_step": 295721, "epoch": 1760} {"train_loss": -11.934890747070312, "global_step": 295722, "epoch": 1760} {"train_loss": -12.103084564208984, "global_step": 295723, "epoch": 1760} {"train_loss": -12.034059524536133, "global_step": 295724, "epoch": 1760} {"train_loss": -12.216064453125, "global_step": 295725, "epoch": 1760} {"train_loss": -11.89621639251709, "global_step": 295726, "epoch": 1760} {"train_loss": -12.049951553344727, "global_step": 295727, "epoch": 1760} {"train_loss": -11.990478515625, "global_step": 295728, "epoch": 1760} {"train_loss": -12.104471206665039, "global_step": 295729, "epoch": 1760} {"train_loss": -12.144024848937988, "global_step": 295730, "epoch": 1760} {"train_loss": -11.953568458557129, "global_step": 295731, "epoch": 1760} {"train_loss": -12.120646476745605, "global_step": 295732, "epoch": 1760} {"train_loss": -12.05673885345459, "global_step": 295733, "epoch": 1760} {"train_loss": -12.212579727172852, "global_step": 295734, "epoch": 1760} {"train_loss": -12.157624244689941, "global_step": 295735, "epoch": 1760} {"train_loss": -12.046455383300781, "global_step": 295736, "epoch": 1760} {"train_loss": -12.200077056884766, "global_step": 295737, "epoch": 1760} {"train_loss": -11.962153434753418, "global_step": 295738, "epoch": 1760} {"train_loss": -12.338113784790039, "global_step": 295739, "epoch": 1760} {"train_loss": -12.155906677246094, "global_step": 295740, "epoch": 1760} {"train_loss": -12.091686248779297, "global_step": 295741, "epoch": 1760} {"train_loss": -11.824731826782227, "global_step": 295742, "epoch": 1760} {"train_loss": -11.640069961547852, "global_step": 295743, "epoch": 1760} {"train_loss": -12.193517684936523, "global_step": 295744, "epoch": 1760} {"train_loss": -11.968897819519043, "global_step": 295745, "epoch": 1760} {"train_loss": -11.981706619262695, "global_step": 295746, "epoch": 1760} {"train_loss": -12.219308853149414, "global_step": 295747, "epoch": 1760} {"train_loss": -11.815436363220215, "global_step": 295748, "epoch": 1760} {"train_loss": -12.059003829956055, "global_step": 295749, "epoch": 1760} {"train_loss": -12.046570777893066, "global_step": 295750, "epoch": 1760} {"train_loss": -11.851905822753906, "global_step": 295751, "epoch": 1760} {"train_loss": -12.067561149597168, "global_step": 295752, "epoch": 1760} {"train_loss": -12.288248062133789, "global_step": 295753, "epoch": 1760} {"train_loss": -11.836484909057617, "global_step": 295754, "epoch": 1760} {"train_loss": -12.243369102478027, "global_step": 295755, "epoch": 1760} {"train_loss": -11.81344223022461, "global_step": 295756, "epoch": 1760} {"train_loss": -11.964178085327148, "global_step": 295757, "epoch": 1760} {"train_loss": -11.67636775970459, "global_step": 295758, "epoch": 1760} {"train_loss": -11.93362045288086, "global_step": 295759, "epoch": 1760} {"train_loss": -11.419733047485352, "global_step": 295760, "epoch": 1760} {"train_loss": -12.025619506835938, "global_step": 295761, "epoch": 1760} {"train_loss": -12.069376945495605, "global_step": 295762, "epoch": 1760} {"train_loss": -11.883663177490234, "global_step": 295763, "epoch": 1760} {"train_loss": -11.903767585754395, "global_step": 295764, "epoch": 1760} {"train_loss": -12.130016326904297, "global_step": 295765, "epoch": 1760} {"train_loss": -12.07492446899414, "global_step": 295766, "epoch": 1760} {"train_loss": -11.744324684143066, "global_step": 295767, "epoch": 1760} {"train_loss": -12.167959213256836, "global_step": 295768, "epoch": 1760} {"train_loss": -11.737157821655273, "global_step": 295769, "epoch": 1760} {"train_loss": -12.05738639831543, "global_step": 295770, "epoch": 1760} {"train_loss": -12.104745864868164, "global_step": 295771, "epoch": 1760} {"train_loss": -11.78221607208252, "global_step": 295772, "epoch": 1760} {"train_loss": -12.135311126708984, "global_step": 295773, "epoch": 1760} {"train_loss": -11.75739574432373, "global_step": 295774, "epoch": 1760} {"train_loss": -12.164886474609375, "global_step": 295775, "epoch": 1760} {"train_loss": -11.706781387329102, "global_step": 295776, "epoch": 1760} {"train_loss": -11.698110580444336, "global_step": 295777, "epoch": 1760} {"train_loss": -11.847532272338867, "global_step": 295778, "epoch": 1760} {"train_loss": -11.642621994018555, "global_step": 295779, "epoch": 1760} {"train_loss": -11.08387565612793, "global_step": 295780, "epoch": 1760} {"train_loss": -11.810552597045898, "global_step": 295781, "epoch": 1760} {"train_loss": -11.621686935424805, "global_step": 295782, "epoch": 1760} {"train_loss": -11.765655517578125, "global_step": 295783, "epoch": 1760} {"train_loss": -11.985299110412598, "global_step": 295784, "epoch": 1760} {"train_loss": -11.378095626831055, "global_step": 295785, "epoch": 1760} {"train_loss": -11.928133010864258, "global_step": 295786, "epoch": 1760} {"train_loss": -11.409161567687988, "global_step": 295787, "epoch": 1760} {"train_loss": -10.979093551635742, "global_step": 295788, "epoch": 1760} {"train_loss": -11.095247268676758, "global_step": 295789, "epoch": 1760} {"train_loss": -11.812213897705078, "global_step": 295790, "epoch": 1760} {"train_loss": -10.381452560424805, "global_step": 295791, "epoch": 1760} {"train_loss": -11.963534355163574, "global_step": 295792, "epoch": 1760} {"train_loss": -11.021415710449219, "global_step": 295793, "epoch": 1760} {"train_loss": -11.303886413574219, "global_step": 295794, "epoch": 1760} {"train_loss": -11.66929817199707, "global_step": 295795, "epoch": 1760} {"train_loss": -10.883115768432617, "global_step": 295796, "epoch": 1760} {"train_loss": -12.168682098388672, "global_step": 295797, "epoch": 1760} {"train_loss": -10.930898666381836, "global_step": 295798, "epoch": 1760} {"train_loss": -11.786138534545898, "global_step": 295799, "epoch": 1760} {"train_loss": -11.538432121276855, "global_step": 295800, "epoch": 1760} {"train_loss": -11.27135181427002, "global_step": 295801, "epoch": 1760} {"train_loss": -11.723783493041992, "global_step": 295802, "epoch": 1760} {"train_loss": -11.733758926391602, "global_step": 295803, "epoch": 1760} {"train_loss": -11.805956840515137, "global_step": 295804, "epoch": 1760} {"train_loss": -11.94637680053711, "global_step": 295805, "epoch": 1760} {"train_loss": -11.951691627502441, "global_step": 295806, "epoch": 1760} {"train_loss": -11.794910430908203, "global_step": 295807, "epoch": 1760} {"train_loss": -12.038948059082031, "global_step": 295808, "epoch": 1760} {"train_loss": -11.801856994628906, "global_step": 295809, "epoch": 1760} {"train_loss": -11.483207702636719, "global_step": 295810, "epoch": 1760} {"train_loss": -11.38878059387207, "global_step": 295811, "epoch": 1760} {"train_loss": -11.78245735168457, "global_step": 295812, "epoch": 1760} {"train_loss": -11.7213134765625, "global_step": 295813, "epoch": 1760} {"train_loss": -11.050250053405762, "global_step": 295814, "epoch": 1760} {"train_loss": -10.08337688446045, "global_step": 295815, "epoch": 1760} {"train_loss": -11.330982208251953, "global_step": 295816, "epoch": 1760} {"train_loss": -10.226536750793457, "global_step": 295817, "epoch": 1760} {"train_loss": -11.403027534484863, "global_step": 295818, "epoch": 1760} {"train_loss": -11.045225143432617, "global_step": 295819, "epoch": 1760} {"train_loss": -11.653590202331543, "global_step": 295820, "epoch": 1760} {"train_loss": -11.347407341003418, "global_step": 295821, "epoch": 1760} {"train_loss": -11.968600273132324, "global_step": 295822, "epoch": 1760} {"train_loss": -11.458425521850586, "global_step": 295823, "epoch": 1760} {"train_loss": -11.865337371826172, "global_step": 295824, "epoch": 1760} {"train_loss": -11.696949005126953, "global_step": 295825, "epoch": 1760} {"train_loss": -11.421310424804688, "global_step": 295826, "epoch": 1760} {"train_loss": -12.065281867980957, "global_step": 295827, "epoch": 1760} {"train_loss": -11.580824851989746, "global_step": 295828, "epoch": 1760} {"train_loss": -11.645816802978516, "global_step": 295829, "epoch": 1760} {"train_loss": -12.017765045166016, "global_step": 295830, "epoch": 1760} {"train_loss": -11.829936027526855, "global_step": 295831, "epoch": 1760} {"train_loss": -12.07565689086914, "global_step": 295832, "epoch": 1760} {"train_loss": -11.98154354095459, "global_step": 295833, "epoch": 1760} {"train_loss": -12.052974700927734, "global_step": 295834, "epoch": 1760} {"train_loss": -11.987624168395996, "global_step": 295835, "epoch": 1760} {"train_loss": -12.300117492675781, "global_step": 295836, "epoch": 1760} {"train_loss": -12.049434661865234, "global_step": 295837, "epoch": 1760} {"train_loss": -11.868417739868164, "global_step": 295838, "epoch": 1760} {"train_loss": -12.099339485168457, "global_step": 295839, "epoch": 1760} {"train_loss": -12.05428695678711, "global_step": 295840, "epoch": 1760} {"train_loss": -12.266460418701172, "global_step": 295841, "epoch": 1760} {"train_loss": -12.148138999938965, "global_step": 295842, "epoch": 1760} {"train_loss": -12.095340728759766, "global_step": 295843, "epoch": 1760} {"train_loss": -12.142692565917969, "global_step": 295844, "epoch": 1760} {"train_loss": -12.310903549194336, "global_step": 295845, "epoch": 1760} {"train_loss": -12.218988418579102, "global_step": 295846, "epoch": 1760} {"train_loss": -11.705949885504586, "global_step": 295847, "epoch": 1760, "val_loss": 280114.3125, "train_action_mse_error": 4.365351676940918} {"train_loss": -12.317684173583984, "global_step": 295848, "epoch": 1761} {"train_loss": -11.911401748657227, "global_step": 295849, "epoch": 1761} {"train_loss": -11.93055534362793, "global_step": 295850, "epoch": 1761} {"train_loss": -12.232626914978027, "global_step": 295851, "epoch": 1761} {"train_loss": -11.904413223266602, "global_step": 295852, "epoch": 1761} {"train_loss": -12.078890800476074, "global_step": 295853, "epoch": 1761} {"train_loss": -12.21310806274414, "global_step": 295854, "epoch": 1761} {"train_loss": -11.658931732177734, "global_step": 295855, "epoch": 1761} {"train_loss": -12.045235633850098, "global_step": 295856, "epoch": 1761} {"train_loss": -12.058148384094238, "global_step": 295857, "epoch": 1761} {"train_loss": -11.866052627563477, "global_step": 295858, "epoch": 1761} {"train_loss": -11.828022003173828, "global_step": 295859, "epoch": 1761} {"train_loss": -12.189088821411133, "global_step": 295860, "epoch": 1761} {"train_loss": -11.835216522216797, "global_step": 295861, "epoch": 1761} {"train_loss": -11.844541549682617, "global_step": 295862, "epoch": 1761} {"train_loss": -12.309526443481445, "global_step": 295863, "epoch": 1761} {"train_loss": -12.280512809753418, "global_step": 295864, "epoch": 1761} {"train_loss": -11.938362121582031, "global_step": 295865, "epoch": 1761} {"train_loss": -11.983220100402832, "global_step": 295866, "epoch": 1761} {"train_loss": -12.059450149536133, "global_step": 295867, "epoch": 1761} {"train_loss": -12.172908782958984, "global_step": 295868, "epoch": 1761} {"train_loss": -11.497533798217773, "global_step": 295869, "epoch": 1761} {"train_loss": -12.276935577392578, "global_step": 295870, "epoch": 1761} {"train_loss": -11.534873008728027, "global_step": 295871, "epoch": 1761} {"train_loss": -12.133716583251953, "global_step": 295872, "epoch": 1761} {"train_loss": -11.956000328063965, "global_step": 295873, "epoch": 1761} {"train_loss": -12.126090049743652, "global_step": 295874, "epoch": 1761} {"train_loss": -11.53677749633789, "global_step": 295875, "epoch": 1761} {"train_loss": -11.996875762939453, "global_step": 295876, "epoch": 1761} {"train_loss": -11.118263244628906, "global_step": 295877, "epoch": 1761} {"train_loss": -12.25432014465332, "global_step": 295878, "epoch": 1761} {"train_loss": -11.879104614257812, "global_step": 295879, "epoch": 1761} {"train_loss": -11.074980735778809, "global_step": 295880, "epoch": 1761} {"train_loss": -11.58175277709961, "global_step": 295881, "epoch": 1761} {"train_loss": -12.15828800201416, "global_step": 295882, "epoch": 1761} {"train_loss": -11.211567878723145, "global_step": 295883, "epoch": 1761} {"train_loss": -11.506217002868652, "global_step": 295884, "epoch": 1761} {"train_loss": -12.06866455078125, "global_step": 295885, "epoch": 1761} {"train_loss": -11.897878646850586, "global_step": 295886, "epoch": 1761} {"train_loss": -12.394525527954102, "global_step": 295887, "epoch": 1761} {"train_loss": -11.936347961425781, "global_step": 295888, "epoch": 1761} {"train_loss": -11.672216415405273, "global_step": 295889, "epoch": 1761} {"train_loss": -12.268189430236816, "global_step": 295890, "epoch": 1761} {"train_loss": -12.022571563720703, "global_step": 295891, "epoch": 1761} {"train_loss": -11.894251823425293, "global_step": 295892, "epoch": 1761} {"train_loss": -12.386567115783691, "global_step": 295893, "epoch": 1761} {"train_loss": -11.55983829498291, "global_step": 295894, "epoch": 1761} {"train_loss": -11.28217601776123, "global_step": 295895, "epoch": 1761} {"train_loss": -12.220317840576172, "global_step": 295896, "epoch": 1761} {"train_loss": -11.223020553588867, "global_step": 295897, "epoch": 1761} {"train_loss": -11.745814323425293, "global_step": 295898, "epoch": 1761} {"train_loss": -11.775029182434082, "global_step": 295899, "epoch": 1761} {"train_loss": -11.0427827835083, "global_step": 295900, "epoch": 1761} {"train_loss": -11.447866439819336, "global_step": 295901, "epoch": 1761} {"train_loss": -10.76715087890625, "global_step": 295902, "epoch": 1761} {"train_loss": -11.184661865234375, "global_step": 295903, "epoch": 1761} {"train_loss": -11.219644546508789, "global_step": 295904, "epoch": 1761} {"train_loss": -10.146994590759277, "global_step": 295905, "epoch": 1761} {"train_loss": -11.973477363586426, "global_step": 295906, "epoch": 1761} {"train_loss": -10.86231517791748, "global_step": 295907, "epoch": 1761} {"train_loss": -11.40391731262207, "global_step": 295908, "epoch": 1761} {"train_loss": -10.523399353027344, "global_step": 295909, "epoch": 1761} {"train_loss": -10.78808879852295, "global_step": 295910, "epoch": 1761} {"train_loss": -11.060876846313477, "global_step": 295911, "epoch": 1761} {"train_loss": -10.620725631713867, "global_step": 295912, "epoch": 1761} {"train_loss": -10.669637680053711, "global_step": 295913, "epoch": 1761} {"train_loss": -11.154720306396484, "global_step": 295914, "epoch": 1761} {"train_loss": -11.156742095947266, "global_step": 295915, "epoch": 1761} {"train_loss": -11.890494346618652, "global_step": 295916, "epoch": 1761} {"train_loss": -10.5203218460083, "global_step": 295917, "epoch": 1761} {"train_loss": -10.783683776855469, "global_step": 295918, "epoch": 1761} {"train_loss": -11.410686492919922, "global_step": 295919, "epoch": 1761} {"train_loss": -10.590866088867188, "global_step": 295920, "epoch": 1761} {"train_loss": -11.83148193359375, "global_step": 295921, "epoch": 1761} {"train_loss": -11.816974639892578, "global_step": 295922, "epoch": 1761} {"train_loss": -11.752058029174805, "global_step": 295923, "epoch": 1761} {"train_loss": -11.797759056091309, "global_step": 295924, "epoch": 1761} {"train_loss": -11.628039360046387, "global_step": 295925, "epoch": 1761} {"train_loss": -11.878674507141113, "global_step": 295926, "epoch": 1761} {"train_loss": -11.66264533996582, "global_step": 295927, "epoch": 1761} {"train_loss": -11.592628479003906, "global_step": 295928, "epoch": 1761} {"train_loss": -11.91590404510498, "global_step": 295929, "epoch": 1761} {"train_loss": -11.809942245483398, "global_step": 295930, "epoch": 1761} {"train_loss": -11.715757369995117, "global_step": 295931, "epoch": 1761} {"train_loss": -11.303842544555664, "global_step": 295932, "epoch": 1761} {"train_loss": -11.593757629394531, "global_step": 295933, "epoch": 1761} {"train_loss": -11.915184020996094, "global_step": 295934, "epoch": 1761} {"train_loss": -11.49111557006836, "global_step": 295935, "epoch": 1761} {"train_loss": -12.021913528442383, "global_step": 295936, "epoch": 1761} {"train_loss": -11.703293800354004, "global_step": 295937, "epoch": 1761} {"train_loss": -11.788071632385254, "global_step": 295938, "epoch": 1761} {"train_loss": -11.963663101196289, "global_step": 295939, "epoch": 1761} {"train_loss": -11.651360511779785, "global_step": 295940, "epoch": 1761} {"train_loss": -11.904142379760742, "global_step": 295941, "epoch": 1761} {"train_loss": -11.461660385131836, "global_step": 295942, "epoch": 1761} {"train_loss": -11.87307071685791, "global_step": 295943, "epoch": 1761} {"train_loss": -11.943578720092773, "global_step": 295944, "epoch": 1761} {"train_loss": -11.835517883300781, "global_step": 295945, "epoch": 1761} {"train_loss": -12.081096649169922, "global_step": 295946, "epoch": 1761} {"train_loss": -12.05569076538086, "global_step": 295947, "epoch": 1761} {"train_loss": -11.869220733642578, "global_step": 295948, "epoch": 1761} {"train_loss": -11.863525390625, "global_step": 295949, "epoch": 1761} {"train_loss": -11.745388984680176, "global_step": 295950, "epoch": 1761} {"train_loss": -12.07046127319336, "global_step": 295951, "epoch": 1761} {"train_loss": -12.196599960327148, "global_step": 295952, "epoch": 1761} {"train_loss": -12.179154396057129, "global_step": 295953, "epoch": 1761} {"train_loss": -12.002617835998535, "global_step": 295954, "epoch": 1761} {"train_loss": -12.185710906982422, "global_step": 295955, "epoch": 1761} {"train_loss": -12.249982833862305, "global_step": 295956, "epoch": 1761} {"train_loss": -12.105911254882812, "global_step": 295957, "epoch": 1761} {"train_loss": -11.933359146118164, "global_step": 295958, "epoch": 1761} {"train_loss": -11.833776473999023, "global_step": 295959, "epoch": 1761} {"train_loss": -11.904561042785645, "global_step": 295960, "epoch": 1761} {"train_loss": -12.094940185546875, "global_step": 295961, "epoch": 1761} {"train_loss": -11.732889175415039, "global_step": 295962, "epoch": 1761} {"train_loss": -11.736955642700195, "global_step": 295963, "epoch": 1761} {"train_loss": -12.067207336425781, "global_step": 295964, "epoch": 1761} {"train_loss": -12.019126892089844, "global_step": 295965, "epoch": 1761} {"train_loss": -11.829376220703125, "global_step": 295966, "epoch": 1761} {"train_loss": -12.07282829284668, "global_step": 295967, "epoch": 1761} {"train_loss": -11.732942581176758, "global_step": 295968, "epoch": 1761} {"train_loss": -11.460681915283203, "global_step": 295969, "epoch": 1761} {"train_loss": -12.207479476928711, "global_step": 295970, "epoch": 1761} {"train_loss": -11.73024845123291, "global_step": 295971, "epoch": 1761} {"train_loss": -12.01253604888916, "global_step": 295972, "epoch": 1761} {"train_loss": -11.845650672912598, "global_step": 295973, "epoch": 1761} {"train_loss": -11.406621932983398, "global_step": 295974, "epoch": 1761} {"train_loss": -12.208564758300781, "global_step": 295975, "epoch": 1761} {"train_loss": -11.165596008300781, "global_step": 295976, "epoch": 1761} {"train_loss": -10.193483352661133, "global_step": 295977, "epoch": 1761} {"train_loss": -12.261054992675781, "global_step": 295978, "epoch": 1761} {"train_loss": -10.626809120178223, "global_step": 295979, "epoch": 1761} {"train_loss": -10.794548988342285, "global_step": 295980, "epoch": 1761} {"train_loss": -11.838080406188965, "global_step": 295981, "epoch": 1761} {"train_loss": -8.311885833740234, "global_step": 295982, "epoch": 1761} {"train_loss": -9.469987869262695, "global_step": 295983, "epoch": 1761} {"train_loss": -10.822124481201172, "global_step": 295984, "epoch": 1761} {"train_loss": -10.990745544433594, "global_step": 295985, "epoch": 1761} {"train_loss": -9.890815734863281, "global_step": 295986, "epoch": 1761} {"train_loss": -11.402071952819824, "global_step": 295987, "epoch": 1761} {"train_loss": -9.059389114379883, "global_step": 295988, "epoch": 1761} {"train_loss": -11.393417358398438, "global_step": 295989, "epoch": 1761} {"train_loss": -9.517305374145508, "global_step": 295990, "epoch": 1761} {"train_loss": -11.162168502807617, "global_step": 295991, "epoch": 1761} {"train_loss": -10.245077133178711, "global_step": 295992, "epoch": 1761} {"train_loss": -11.230619430541992, "global_step": 295993, "epoch": 1761} {"train_loss": -10.085851669311523, "global_step": 295994, "epoch": 1761} {"train_loss": -11.66439437866211, "global_step": 295995, "epoch": 1761} {"train_loss": -10.44908618927002, "global_step": 295996, "epoch": 1761} {"train_loss": -11.203330993652344, "global_step": 295997, "epoch": 1761} {"train_loss": -11.44763469696045, "global_step": 295998, "epoch": 1761} {"train_loss": -11.2202787399292, "global_step": 295999, "epoch": 1761} {"train_loss": -11.755422592163086, "global_step": 296000, "epoch": 1761} {"train_loss": -11.323229789733887, "global_step": 296001, "epoch": 1761} {"train_loss": -11.610913276672363, "global_step": 296002, "epoch": 1761} {"train_loss": -11.195442199707031, "global_step": 296003, "epoch": 1761} {"train_loss": -11.734323501586914, "global_step": 296004, "epoch": 1761} {"train_loss": -11.374470710754395, "global_step": 296005, "epoch": 1761} {"train_loss": -11.661642074584961, "global_step": 296006, "epoch": 1761} {"train_loss": -11.335933685302734, "global_step": 296007, "epoch": 1761} {"train_loss": -11.83997917175293, "global_step": 296008, "epoch": 1761} {"train_loss": -11.895087242126465, "global_step": 296009, "epoch": 1761} {"train_loss": -11.938821792602539, "global_step": 296010, "epoch": 1761} {"train_loss": -11.924686431884766, "global_step": 296011, "epoch": 1761} {"train_loss": -11.923398971557617, "global_step": 296012, "epoch": 1761} {"train_loss": -11.689298629760742, "global_step": 296013, "epoch": 1761} {"train_loss": -12.121137619018555, "global_step": 296014, "epoch": 1761} {"train_loss": -11.583519305501666, "global_step": 296015, "epoch": 1761, "val_loss": 273659.78125} {"train_loss": -11.81121826171875, "global_step": 296016, "epoch": 1762} {"train_loss": -12.068775177001953, "global_step": 296017, "epoch": 1762} {"train_loss": -11.633491516113281, "global_step": 296018, "epoch": 1762} {"train_loss": -12.11505126953125, "global_step": 296019, "epoch": 1762} {"train_loss": -11.77299690246582, "global_step": 296020, "epoch": 1762} {"train_loss": -11.836803436279297, "global_step": 296021, "epoch": 1762} {"train_loss": -11.901531219482422, "global_step": 296022, "epoch": 1762} {"train_loss": -11.741369247436523, "global_step": 296023, "epoch": 1762} {"train_loss": -11.598257064819336, "global_step": 296024, "epoch": 1762} {"train_loss": -11.889604568481445, "global_step": 296025, "epoch": 1762} {"train_loss": -11.483428001403809, "global_step": 296026, "epoch": 1762} {"train_loss": -11.886434555053711, "global_step": 296027, "epoch": 1762} {"train_loss": -11.585481643676758, "global_step": 296028, "epoch": 1762} {"train_loss": -12.09376335144043, "global_step": 296029, "epoch": 1762} {"train_loss": -11.361230850219727, "global_step": 296030, "epoch": 1762} {"train_loss": -11.569883346557617, "global_step": 296031, "epoch": 1762} {"train_loss": -11.020931243896484, "global_step": 296032, "epoch": 1762} {"train_loss": -11.659770965576172, "global_step": 296033, "epoch": 1762} {"train_loss": -11.150411605834961, "global_step": 296034, "epoch": 1762} {"train_loss": -12.005681991577148, "global_step": 296035, "epoch": 1762} {"train_loss": -11.559379577636719, "global_step": 296036, "epoch": 1762} {"train_loss": -11.647184371948242, "global_step": 296037, "epoch": 1762} {"train_loss": -11.871813774108887, "global_step": 296038, "epoch": 1762} {"train_loss": -11.227310180664062, "global_step": 296039, "epoch": 1762} {"train_loss": -11.862967491149902, "global_step": 296040, "epoch": 1762} {"train_loss": -10.988122940063477, "global_step": 296041, "epoch": 1762} {"train_loss": -12.009156227111816, "global_step": 296042, "epoch": 1762} {"train_loss": -11.544977188110352, "global_step": 296043, "epoch": 1762} {"train_loss": -11.726753234863281, "global_step": 296044, "epoch": 1762} {"train_loss": -11.85838508605957, "global_step": 296045, "epoch": 1762} {"train_loss": -11.745368003845215, "global_step": 296046, "epoch": 1762} {"train_loss": -11.76379108428955, "global_step": 296047, "epoch": 1762} {"train_loss": -11.680484771728516, "global_step": 296048, "epoch": 1762} {"train_loss": -11.747808456420898, "global_step": 296049, "epoch": 1762} {"train_loss": -11.785144805908203, "global_step": 296050, "epoch": 1762} {"train_loss": -11.430612564086914, "global_step": 296051, "epoch": 1762} {"train_loss": -12.02739143371582, "global_step": 296052, "epoch": 1762} {"train_loss": -11.596672058105469, "global_step": 296053, "epoch": 1762} {"train_loss": -11.994039535522461, "global_step": 296054, "epoch": 1762} {"train_loss": -11.700567245483398, "global_step": 296055, "epoch": 1762} {"train_loss": -11.864029884338379, "global_step": 296056, "epoch": 1762} {"train_loss": -11.951607704162598, "global_step": 296057, "epoch": 1762} {"train_loss": -12.040899276733398, "global_step": 296058, "epoch": 1762} {"train_loss": -11.914456367492676, "global_step": 296059, "epoch": 1762} {"train_loss": -12.019688606262207, "global_step": 296060, "epoch": 1762} {"train_loss": -12.039369583129883, "global_step": 296061, "epoch": 1762} {"train_loss": -12.192808151245117, "global_step": 296062, "epoch": 1762} {"train_loss": -12.18425178527832, "global_step": 296063, "epoch": 1762} {"train_loss": -12.215970993041992, "global_step": 296064, "epoch": 1762} {"train_loss": -12.249122619628906, "global_step": 296065, "epoch": 1762} {"train_loss": -12.152687072753906, "global_step": 296066, "epoch": 1762} {"train_loss": -11.7076416015625, "global_step": 296067, "epoch": 1762} {"train_loss": -11.901808738708496, "global_step": 296068, "epoch": 1762} {"train_loss": -11.9359712600708, "global_step": 296069, "epoch": 1762} {"train_loss": -12.310871124267578, "global_step": 296070, "epoch": 1762} {"train_loss": -11.907737731933594, "global_step": 296071, "epoch": 1762} {"train_loss": -12.225019454956055, "global_step": 296072, "epoch": 1762} {"train_loss": -11.852621078491211, "global_step": 296073, "epoch": 1762} {"train_loss": -12.000433921813965, "global_step": 296074, "epoch": 1762} {"train_loss": -11.798288345336914, "global_step": 296075, "epoch": 1762} {"train_loss": -11.929449081420898, "global_step": 296076, "epoch": 1762} {"train_loss": -11.950057983398438, "global_step": 296077, "epoch": 1762} {"train_loss": -12.000258445739746, "global_step": 296078, "epoch": 1762} {"train_loss": -12.181583404541016, "global_step": 296079, "epoch": 1762} {"train_loss": -11.892541885375977, "global_step": 296080, "epoch": 1762} {"train_loss": -12.250240325927734, "global_step": 296081, "epoch": 1762} {"train_loss": -11.900395393371582, "global_step": 296082, "epoch": 1762} {"train_loss": -11.95902156829834, "global_step": 296083, "epoch": 1762} {"train_loss": -11.67166519165039, "global_step": 296084, "epoch": 1762} {"train_loss": -12.482694625854492, "global_step": 296085, "epoch": 1762} {"train_loss": -11.582754135131836, "global_step": 296086, "epoch": 1762} {"train_loss": -12.241230010986328, "global_step": 296087, "epoch": 1762} {"train_loss": -11.95321273803711, "global_step": 296088, "epoch": 1762} {"train_loss": -12.093034744262695, "global_step": 296089, "epoch": 1762} {"train_loss": -12.408065795898438, "global_step": 296090, "epoch": 1762} {"train_loss": -12.045075416564941, "global_step": 296091, "epoch": 1762} {"train_loss": -12.08787727355957, "global_step": 296092, "epoch": 1762} {"train_loss": -12.07565689086914, "global_step": 296093, "epoch": 1762} {"train_loss": -12.250883102416992, "global_step": 296094, "epoch": 1762} {"train_loss": -12.007824897766113, "global_step": 296095, "epoch": 1762} {"train_loss": -12.459105491638184, "global_step": 296096, "epoch": 1762} {"train_loss": -11.852937698364258, "global_step": 296097, "epoch": 1762} {"train_loss": -12.214096069335938, "global_step": 296098, "epoch": 1762} {"train_loss": -12.150568008422852, "global_step": 296099, "epoch": 1762} {"train_loss": -11.799407005310059, "global_step": 296100, "epoch": 1762} {"train_loss": -12.063996315002441, "global_step": 296101, "epoch": 1762} {"train_loss": -11.806595802307129, "global_step": 296102, "epoch": 1762} {"train_loss": -11.914390563964844, "global_step": 296103, "epoch": 1762} {"train_loss": -11.942604064941406, "global_step": 296104, "epoch": 1762} {"train_loss": -12.276741027832031, "global_step": 296105, "epoch": 1762} {"train_loss": -11.572771072387695, "global_step": 296106, "epoch": 1762} {"train_loss": -11.907855033874512, "global_step": 296107, "epoch": 1762} {"train_loss": -11.762937545776367, "global_step": 296108, "epoch": 1762} {"train_loss": -11.799403190612793, "global_step": 296109, "epoch": 1762} {"train_loss": -12.035433769226074, "global_step": 296110, "epoch": 1762} {"train_loss": -11.695501327514648, "global_step": 296111, "epoch": 1762} {"train_loss": -11.934833526611328, "global_step": 296112, "epoch": 1762} {"train_loss": -11.893203735351562, "global_step": 296113, "epoch": 1762} {"train_loss": -12.261083602905273, "global_step": 296114, "epoch": 1762} {"train_loss": -11.872753143310547, "global_step": 296115, "epoch": 1762} {"train_loss": -12.379349708557129, "global_step": 296116, "epoch": 1762} {"train_loss": -11.509366989135742, "global_step": 296117, "epoch": 1762} {"train_loss": -12.050265312194824, "global_step": 296118, "epoch": 1762} {"train_loss": -11.750224113464355, "global_step": 296119, "epoch": 1762} {"train_loss": -11.72069263458252, "global_step": 296120, "epoch": 1762} {"train_loss": -11.606658935546875, "global_step": 296121, "epoch": 1762} {"train_loss": -11.838240623474121, "global_step": 296122, "epoch": 1762} {"train_loss": -12.031744003295898, "global_step": 296123, "epoch": 1762} {"train_loss": -12.058300018310547, "global_step": 296124, "epoch": 1762} {"train_loss": -12.248324394226074, "global_step": 296125, "epoch": 1762} {"train_loss": -12.040760040283203, "global_step": 296126, "epoch": 1762} {"train_loss": -12.310532569885254, "global_step": 296127, "epoch": 1762} {"train_loss": -12.23621654510498, "global_step": 296128, "epoch": 1762} {"train_loss": -12.056005477905273, "global_step": 296129, "epoch": 1762} {"train_loss": -12.134504318237305, "global_step": 296130, "epoch": 1762} {"train_loss": -12.136465072631836, "global_step": 296131, "epoch": 1762} {"train_loss": -12.042852401733398, "global_step": 296132, "epoch": 1762} {"train_loss": -12.117876052856445, "global_step": 296133, "epoch": 1762} {"train_loss": -12.328843116760254, "global_step": 296134, "epoch": 1762} {"train_loss": -11.864826202392578, "global_step": 296135, "epoch": 1762} {"train_loss": -12.232475280761719, "global_step": 296136, "epoch": 1762} {"train_loss": -12.271635055541992, "global_step": 296137, "epoch": 1762} {"train_loss": -11.82199764251709, "global_step": 296138, "epoch": 1762} {"train_loss": -12.07731819152832, "global_step": 296139, "epoch": 1762} {"train_loss": -12.236271858215332, "global_step": 296140, "epoch": 1762} {"train_loss": -12.067453384399414, "global_step": 296141, "epoch": 1762} {"train_loss": -12.006954193115234, "global_step": 296142, "epoch": 1762} {"train_loss": -11.729496955871582, "global_step": 296143, "epoch": 1762} {"train_loss": -12.045232772827148, "global_step": 296144, "epoch": 1762} {"train_loss": -11.413130760192871, "global_step": 296145, "epoch": 1762} {"train_loss": -12.44020938873291, "global_step": 296146, "epoch": 1762} {"train_loss": -11.853766441345215, "global_step": 296147, "epoch": 1762} {"train_loss": -11.566604614257812, "global_step": 296148, "epoch": 1762} {"train_loss": -11.519953727722168, "global_step": 296149, "epoch": 1762} {"train_loss": -12.020028114318848, "global_step": 296150, "epoch": 1762} {"train_loss": -11.412505149841309, "global_step": 296151, "epoch": 1762} {"train_loss": -11.763616561889648, "global_step": 296152, "epoch": 1762} {"train_loss": -11.721536636352539, "global_step": 296153, "epoch": 1762} {"train_loss": -11.219789505004883, "global_step": 296154, "epoch": 1762} {"train_loss": -11.574630737304688, "global_step": 296155, "epoch": 1762} {"train_loss": -11.771583557128906, "global_step": 296156, "epoch": 1762} {"train_loss": -11.218547821044922, "global_step": 296157, "epoch": 1762} {"train_loss": -11.175853729248047, "global_step": 296158, "epoch": 1762} {"train_loss": -11.750789642333984, "global_step": 296159, "epoch": 1762} {"train_loss": -10.25615406036377, "global_step": 296160, "epoch": 1762} {"train_loss": -11.8844575881958, "global_step": 296161, "epoch": 1762} {"train_loss": -9.842767715454102, "global_step": 296162, "epoch": 1762} {"train_loss": -10.597654342651367, "global_step": 296163, "epoch": 1762} {"train_loss": -10.855083465576172, "global_step": 296164, "epoch": 1762} {"train_loss": -10.51837158203125, "global_step": 296165, "epoch": 1762} {"train_loss": -11.10395622253418, "global_step": 296166, "epoch": 1762} {"train_loss": -9.854721069335938, "global_step": 296167, "epoch": 1762} {"train_loss": -11.277351379394531, "global_step": 296168, "epoch": 1762} {"train_loss": -9.915449142456055, "global_step": 296169, "epoch": 1762} {"train_loss": -10.705428123474121, "global_step": 296170, "epoch": 1762} {"train_loss": -10.193866729736328, "global_step": 296171, "epoch": 1762} {"train_loss": -9.831216812133789, "global_step": 296172, "epoch": 1762} {"train_loss": -11.444878578186035, "global_step": 296173, "epoch": 1762} {"train_loss": -10.626676559448242, "global_step": 296174, "epoch": 1762} {"train_loss": -11.084951400756836, "global_step": 296175, "epoch": 1762} {"train_loss": -11.407655715942383, "global_step": 296176, "epoch": 1762} {"train_loss": -10.477029800415039, "global_step": 296177, "epoch": 1762} {"train_loss": -11.896575927734375, "global_step": 296178, "epoch": 1762} {"train_loss": -10.961215019226074, "global_step": 296179, "epoch": 1762} {"train_loss": -11.603708267211914, "global_step": 296180, "epoch": 1762} {"train_loss": -11.491647720336914, "global_step": 296181, "epoch": 1762} {"train_loss": -11.216693878173828, "global_step": 296182, "epoch": 1762} {"train_loss": -11.742025017738342, "global_step": 296183, "epoch": 1762, "val_loss": 276268.28125} {"train_loss": -11.645191192626953, "global_step": 296184, "epoch": 1763} {"train_loss": -11.573464393615723, "global_step": 296185, "epoch": 1763} {"train_loss": -11.925931930541992, "global_step": 296186, "epoch": 1763} {"train_loss": -11.515009880065918, "global_step": 296187, "epoch": 1763} {"train_loss": -11.948732376098633, "global_step": 296188, "epoch": 1763} {"train_loss": -11.637823104858398, "global_step": 296189, "epoch": 1763} {"train_loss": -11.895538330078125, "global_step": 296190, "epoch": 1763} {"train_loss": -11.962418556213379, "global_step": 296191, "epoch": 1763} {"train_loss": -11.802867889404297, "global_step": 296192, "epoch": 1763} {"train_loss": -11.625539779663086, "global_step": 296193, "epoch": 1763} {"train_loss": -11.953792572021484, "global_step": 296194, "epoch": 1763} {"train_loss": -11.794734001159668, "global_step": 296195, "epoch": 1763} {"train_loss": -11.956315994262695, "global_step": 296196, "epoch": 1763} {"train_loss": -11.746256828308105, "global_step": 296197, "epoch": 1763} {"train_loss": -11.856820106506348, "global_step": 296198, "epoch": 1763} {"train_loss": -11.926213264465332, "global_step": 296199, "epoch": 1763} {"train_loss": -11.901786804199219, "global_step": 296200, "epoch": 1763} {"train_loss": -12.03072738647461, "global_step": 296201, "epoch": 1763} {"train_loss": -11.900999069213867, "global_step": 296202, "epoch": 1763} {"train_loss": -12.194377899169922, "global_step": 296203, "epoch": 1763} {"train_loss": -12.139877319335938, "global_step": 296204, "epoch": 1763} {"train_loss": -12.200431823730469, "global_step": 296205, "epoch": 1763} {"train_loss": -12.016868591308594, "global_step": 296206, "epoch": 1763} {"train_loss": -11.97952651977539, "global_step": 296207, "epoch": 1763} {"train_loss": -11.928094863891602, "global_step": 296208, "epoch": 1763} {"train_loss": -12.169221878051758, "global_step": 296209, "epoch": 1763} {"train_loss": -11.946723937988281, "global_step": 296210, "epoch": 1763} {"train_loss": -12.272034645080566, "global_step": 296211, "epoch": 1763} {"train_loss": -11.946690559387207, "global_step": 296212, "epoch": 1763} {"train_loss": -12.116167068481445, "global_step": 296213, "epoch": 1763} {"train_loss": -12.176959991455078, "global_step": 296214, "epoch": 1763} {"train_loss": -12.047106742858887, "global_step": 296215, "epoch": 1763} {"train_loss": -11.9691162109375, "global_step": 296216, "epoch": 1763} {"train_loss": -12.292308807373047, "global_step": 296217, "epoch": 1763} {"train_loss": -11.921582221984863, "global_step": 296218, "epoch": 1763} {"train_loss": -12.205336570739746, "global_step": 296219, "epoch": 1763} {"train_loss": -12.252359390258789, "global_step": 296220, "epoch": 1763} {"train_loss": -12.122835159301758, "global_step": 296221, "epoch": 1763} {"train_loss": -12.197563171386719, "global_step": 296222, "epoch": 1763} {"train_loss": -12.155149459838867, "global_step": 296223, "epoch": 1763} {"train_loss": -12.221354484558105, "global_step": 296224, "epoch": 1763} {"train_loss": -11.98409366607666, "global_step": 296225, "epoch": 1763} {"train_loss": -12.42273998260498, "global_step": 296226, "epoch": 1763} {"train_loss": -12.300325393676758, "global_step": 296227, "epoch": 1763} {"train_loss": -11.908894538879395, "global_step": 296228, "epoch": 1763} {"train_loss": -12.397937774658203, "global_step": 296229, "epoch": 1763} {"train_loss": -12.10954475402832, "global_step": 296230, "epoch": 1763} {"train_loss": -12.18707275390625, "global_step": 296231, "epoch": 1763} {"train_loss": -12.224609375, "global_step": 296232, "epoch": 1763} {"train_loss": -12.112981796264648, "global_step": 296233, "epoch": 1763} {"train_loss": -12.08852767944336, "global_step": 296234, "epoch": 1763} {"train_loss": -11.964195251464844, "global_step": 296235, "epoch": 1763} {"train_loss": -12.064302444458008, "global_step": 296236, "epoch": 1763} {"train_loss": -12.093518257141113, "global_step": 296237, "epoch": 1763} {"train_loss": -12.090219497680664, "global_step": 296238, "epoch": 1763} {"train_loss": -12.20040512084961, "global_step": 296239, "epoch": 1763} {"train_loss": -12.00446891784668, "global_step": 296240, "epoch": 1763} {"train_loss": -11.640759468078613, "global_step": 296241, "epoch": 1763} {"train_loss": -11.110797882080078, "global_step": 296242, "epoch": 1763} {"train_loss": -11.677343368530273, "global_step": 296243, "epoch": 1763} {"train_loss": -11.348136901855469, "global_step": 296244, "epoch": 1763} {"train_loss": -11.637470245361328, "global_step": 296245, "epoch": 1763} {"train_loss": -10.92864990234375, "global_step": 296246, "epoch": 1763} {"train_loss": -11.899513244628906, "global_step": 296247, "epoch": 1763} {"train_loss": -10.791773796081543, "global_step": 296248, "epoch": 1763} {"train_loss": -10.43596076965332, "global_step": 296249, "epoch": 1763} {"train_loss": -12.060136795043945, "global_step": 296250, "epoch": 1763} {"train_loss": -10.89393424987793, "global_step": 296251, "epoch": 1763} {"train_loss": -11.973142623901367, "global_step": 296252, "epoch": 1763} {"train_loss": -11.917254447937012, "global_step": 296253, "epoch": 1763} {"train_loss": -11.803131103515625, "global_step": 296254, "epoch": 1763} {"train_loss": -12.045047760009766, "global_step": 296255, "epoch": 1763} {"train_loss": -11.500286102294922, "global_step": 296256, "epoch": 1763} {"train_loss": -11.896775245666504, "global_step": 296257, "epoch": 1763} {"train_loss": -12.269206047058105, "global_step": 296258, "epoch": 1763} {"train_loss": -11.930933952331543, "global_step": 296259, "epoch": 1763} {"train_loss": -11.972177505493164, "global_step": 296260, "epoch": 1763} {"train_loss": -11.918067932128906, "global_step": 296261, "epoch": 1763} {"train_loss": -12.115474700927734, "global_step": 296262, "epoch": 1763} {"train_loss": -11.940220832824707, "global_step": 296263, "epoch": 1763} {"train_loss": -12.208361625671387, "global_step": 296264, "epoch": 1763} {"train_loss": -11.786529541015625, "global_step": 296265, "epoch": 1763} {"train_loss": -12.177084922790527, "global_step": 296266, "epoch": 1763} {"train_loss": -11.726945877075195, "global_step": 296267, "epoch": 1763} {"train_loss": -11.841446876525879, "global_step": 296268, "epoch": 1763} {"train_loss": -12.040796279907227, "global_step": 296269, "epoch": 1763} {"train_loss": -12.11899471282959, "global_step": 296270, "epoch": 1763} {"train_loss": -11.786981582641602, "global_step": 296271, "epoch": 1763} {"train_loss": -12.118842124938965, "global_step": 296272, "epoch": 1763} {"train_loss": -12.052513122558594, "global_step": 296273, "epoch": 1763} {"train_loss": -12.261484146118164, "global_step": 296274, "epoch": 1763} {"train_loss": -12.099563598632812, "global_step": 296275, "epoch": 1763} {"train_loss": -12.250673294067383, "global_step": 296276, "epoch": 1763} {"train_loss": -12.227291107177734, "global_step": 296277, "epoch": 1763} {"train_loss": -12.290241241455078, "global_step": 296278, "epoch": 1763} {"train_loss": -12.13653564453125, "global_step": 296279, "epoch": 1763} {"train_loss": -12.169981956481934, "global_step": 296280, "epoch": 1763} {"train_loss": -12.268634796142578, "global_step": 296281, "epoch": 1763} {"train_loss": -12.231822967529297, "global_step": 296282, "epoch": 1763} {"train_loss": -12.413166046142578, "global_step": 296283, "epoch": 1763} {"train_loss": -12.225931167602539, "global_step": 296284, "epoch": 1763} {"train_loss": -12.44781494140625, "global_step": 296285, "epoch": 1763} {"train_loss": -12.008771896362305, "global_step": 296286, "epoch": 1763} {"train_loss": -12.224959373474121, "global_step": 296287, "epoch": 1763} {"train_loss": -12.025492668151855, "global_step": 296288, "epoch": 1763} {"train_loss": -12.309322357177734, "global_step": 296289, "epoch": 1763} {"train_loss": -11.952949523925781, "global_step": 296290, "epoch": 1763} {"train_loss": -12.323834419250488, "global_step": 296291, "epoch": 1763} {"train_loss": -12.276227951049805, "global_step": 296292, "epoch": 1763} {"train_loss": -12.424247741699219, "global_step": 296293, "epoch": 1763} {"train_loss": -12.201204299926758, "global_step": 296294, "epoch": 1763} {"train_loss": -12.247785568237305, "global_step": 296295, "epoch": 1763} {"train_loss": -12.274404525756836, "global_step": 296296, "epoch": 1763} {"train_loss": -12.183431625366211, "global_step": 296297, "epoch": 1763} {"train_loss": -11.704252243041992, "global_step": 296298, "epoch": 1763} {"train_loss": -12.163885116577148, "global_step": 296299, "epoch": 1763} {"train_loss": -11.763927459716797, "global_step": 296300, "epoch": 1763} {"train_loss": -12.010517120361328, "global_step": 296301, "epoch": 1763} {"train_loss": -11.593225479125977, "global_step": 296302, "epoch": 1763} {"train_loss": -11.432354927062988, "global_step": 296303, "epoch": 1763} {"train_loss": -12.269784927368164, "global_step": 296304, "epoch": 1763} {"train_loss": -12.121591567993164, "global_step": 296305, "epoch": 1763} {"train_loss": -12.091455459594727, "global_step": 296306, "epoch": 1763} {"train_loss": -12.346695899963379, "global_step": 296307, "epoch": 1763} {"train_loss": -12.35512924194336, "global_step": 296308, "epoch": 1763} {"train_loss": -12.459335327148438, "global_step": 296309, "epoch": 1763} {"train_loss": -12.186042785644531, "global_step": 296310, "epoch": 1763} {"train_loss": -12.419539451599121, "global_step": 296311, "epoch": 1763} {"train_loss": -11.855213165283203, "global_step": 296312, "epoch": 1763} {"train_loss": -11.737384796142578, "global_step": 296313, "epoch": 1763} {"train_loss": -11.418144226074219, "global_step": 296314, "epoch": 1763} {"train_loss": -11.909242630004883, "global_step": 296315, "epoch": 1763} {"train_loss": -11.742740631103516, "global_step": 296316, "epoch": 1763} {"train_loss": -12.102142333984375, "global_step": 296317, "epoch": 1763} {"train_loss": -11.846952438354492, "global_step": 296318, "epoch": 1763} {"train_loss": -11.733869552612305, "global_step": 296319, "epoch": 1763} {"train_loss": -11.406393051147461, "global_step": 296320, "epoch": 1763} {"train_loss": -11.009328842163086, "global_step": 296321, "epoch": 1763} {"train_loss": -11.724955558776855, "global_step": 296322, "epoch": 1763} {"train_loss": -11.505674362182617, "global_step": 296323, "epoch": 1763} {"train_loss": -11.203639030456543, "global_step": 296324, "epoch": 1763} {"train_loss": -10.353376388549805, "global_step": 296325, "epoch": 1763} {"train_loss": -11.428555488586426, "global_step": 296326, "epoch": 1763} {"train_loss": -11.217667579650879, "global_step": 296327, "epoch": 1763} {"train_loss": -11.146429061889648, "global_step": 296328, "epoch": 1763} {"train_loss": -11.475400924682617, "global_step": 296329, "epoch": 1763} {"train_loss": -11.874709129333496, "global_step": 296330, "epoch": 1763} {"train_loss": -11.777469635009766, "global_step": 296331, "epoch": 1763} {"train_loss": -11.890800476074219, "global_step": 296332, "epoch": 1763} {"train_loss": -11.74679183959961, "global_step": 296333, "epoch": 1763} {"train_loss": -11.664874076843262, "global_step": 296334, "epoch": 1763} {"train_loss": -11.572023391723633, "global_step": 296335, "epoch": 1763} {"train_loss": -11.66455078125, "global_step": 296336, "epoch": 1763} {"train_loss": -12.170881271362305, "global_step": 296337, "epoch": 1763} {"train_loss": -11.65338134765625, "global_step": 296338, "epoch": 1763} {"train_loss": -11.838912963867188, "global_step": 296339, "epoch": 1763} {"train_loss": -11.904622077941895, "global_step": 296340, "epoch": 1763} {"train_loss": -12.036148071289062, "global_step": 296341, "epoch": 1763} {"train_loss": -12.010883331298828, "global_step": 296342, "epoch": 1763} {"train_loss": -11.523375511169434, "global_step": 296343, "epoch": 1763} {"train_loss": -12.007420539855957, "global_step": 296344, "epoch": 1763} {"train_loss": -11.975550651550293, "global_step": 296345, "epoch": 1763} {"train_loss": -11.472930908203125, "global_step": 296346, "epoch": 1763} {"train_loss": -11.810382843017578, "global_step": 296347, "epoch": 1763} {"train_loss": -11.601889610290527, "global_step": 296348, "epoch": 1763} {"train_loss": -11.321823120117188, "global_step": 296349, "epoch": 1763} {"train_loss": -11.979897499084473, "global_step": 296350, "epoch": 1763} {"train_loss": -11.908210357030233, "global_step": 296351, "epoch": 1763, "val_loss": 276584.59375} {"train_loss": -11.10713005065918, "global_step": 296352, "epoch": 1764} {"train_loss": -11.765875816345215, "global_step": 296353, "epoch": 1764} {"train_loss": -11.225905418395996, "global_step": 296354, "epoch": 1764} {"train_loss": -11.878973960876465, "global_step": 296355, "epoch": 1764} {"train_loss": -11.716582298278809, "global_step": 296356, "epoch": 1764} {"train_loss": -11.527626037597656, "global_step": 296357, "epoch": 1764} {"train_loss": -11.420465469360352, "global_step": 296358, "epoch": 1764} {"train_loss": -12.2208833694458, "global_step": 296359, "epoch": 1764} {"train_loss": -11.487964630126953, "global_step": 296360, "epoch": 1764} {"train_loss": -12.042964935302734, "global_step": 296361, "epoch": 1764} {"train_loss": -11.731206893920898, "global_step": 296362, "epoch": 1764} {"train_loss": -11.314855575561523, "global_step": 296363, "epoch": 1764} {"train_loss": -12.244022369384766, "global_step": 296364, "epoch": 1764} {"train_loss": -11.473546981811523, "global_step": 296365, "epoch": 1764} {"train_loss": -11.772083282470703, "global_step": 296366, "epoch": 1764} {"train_loss": -11.815722465515137, "global_step": 296367, "epoch": 1764} {"train_loss": -11.407350540161133, "global_step": 296368, "epoch": 1764} {"train_loss": -12.019376754760742, "global_step": 296369, "epoch": 1764} {"train_loss": -11.147924423217773, "global_step": 296370, "epoch": 1764} {"train_loss": -11.757221221923828, "global_step": 296371, "epoch": 1764} {"train_loss": -11.922082901000977, "global_step": 296372, "epoch": 1764} {"train_loss": -11.324600219726562, "global_step": 296373, "epoch": 1764} {"train_loss": -12.08061408996582, "global_step": 296374, "epoch": 1764} {"train_loss": -11.756656646728516, "global_step": 296375, "epoch": 1764} {"train_loss": -12.105752944946289, "global_step": 296376, "epoch": 1764} {"train_loss": -11.946069717407227, "global_step": 296377, "epoch": 1764} {"train_loss": -11.851861000061035, "global_step": 296378, "epoch": 1764} {"train_loss": -11.9653902053833, "global_step": 296379, "epoch": 1764} {"train_loss": -11.920271873474121, "global_step": 296380, "epoch": 1764} {"train_loss": -12.039623260498047, "global_step": 296381, "epoch": 1764} {"train_loss": -11.79200553894043, "global_step": 296382, "epoch": 1764} {"train_loss": -11.928842544555664, "global_step": 296383, "epoch": 1764} {"train_loss": -12.067291259765625, "global_step": 296384, "epoch": 1764} {"train_loss": -12.06306266784668, "global_step": 296385, "epoch": 1764} {"train_loss": -12.151897430419922, "global_step": 296386, "epoch": 1764} {"train_loss": -12.106185913085938, "global_step": 296387, "epoch": 1764} {"train_loss": -12.163545608520508, "global_step": 296388, "epoch": 1764} {"train_loss": -12.023283958435059, "global_step": 296389, "epoch": 1764} {"train_loss": -12.156694412231445, "global_step": 296390, "epoch": 1764} {"train_loss": -12.217954635620117, "global_step": 296391, "epoch": 1764} {"train_loss": -12.345935821533203, "global_step": 296392, "epoch": 1764} {"train_loss": -12.279958724975586, "global_step": 296393, "epoch": 1764} {"train_loss": -12.319538116455078, "global_step": 296394, "epoch": 1764} {"train_loss": -12.34669303894043, "global_step": 296395, "epoch": 1764} {"train_loss": -11.886541366577148, "global_step": 296396, "epoch": 1764} {"train_loss": -12.34420394897461, "global_step": 296397, "epoch": 1764} {"train_loss": -12.169975280761719, "global_step": 296398, "epoch": 1764} {"train_loss": -12.350591659545898, "global_step": 296399, "epoch": 1764} {"train_loss": -11.984599113464355, "global_step": 296400, "epoch": 1764} {"train_loss": -12.225865364074707, "global_step": 296401, "epoch": 1764} {"train_loss": -11.961676597595215, "global_step": 296402, "epoch": 1764} {"train_loss": -12.047491073608398, "global_step": 296403, "epoch": 1764} {"train_loss": -12.131607055664062, "global_step": 296404, "epoch": 1764} {"train_loss": -12.208284378051758, "global_step": 296405, "epoch": 1764} {"train_loss": -12.101011276245117, "global_step": 296406, "epoch": 1764} {"train_loss": -11.85966682434082, "global_step": 296407, "epoch": 1764} {"train_loss": -11.901363372802734, "global_step": 296408, "epoch": 1764} {"train_loss": -12.09251594543457, "global_step": 296409, "epoch": 1764} {"train_loss": -11.937114715576172, "global_step": 296410, "epoch": 1764} {"train_loss": -11.723129272460938, "global_step": 296411, "epoch": 1764} {"train_loss": -12.111063957214355, "global_step": 296412, "epoch": 1764} {"train_loss": -11.708983421325684, "global_step": 296413, "epoch": 1764} {"train_loss": -12.047372817993164, "global_step": 296414, "epoch": 1764} {"train_loss": -11.504692077636719, "global_step": 296415, "epoch": 1764} {"train_loss": -11.756292343139648, "global_step": 296416, "epoch": 1764} {"train_loss": -12.239969253540039, "global_step": 296417, "epoch": 1764} {"train_loss": -11.754246711730957, "global_step": 296418, "epoch": 1764} {"train_loss": -11.642559051513672, "global_step": 296419, "epoch": 1764} {"train_loss": -11.921356201171875, "global_step": 296420, "epoch": 1764} {"train_loss": -12.224567413330078, "global_step": 296421, "epoch": 1764} {"train_loss": -11.861364364624023, "global_step": 296422, "epoch": 1764} {"train_loss": -12.202535629272461, "global_step": 296423, "epoch": 1764} {"train_loss": -11.741779327392578, "global_step": 296424, "epoch": 1764} {"train_loss": -11.630945205688477, "global_step": 296425, "epoch": 1764} {"train_loss": -11.840398788452148, "global_step": 296426, "epoch": 1764} {"train_loss": -12.053911209106445, "global_step": 296427, "epoch": 1764} {"train_loss": -11.686175346374512, "global_step": 296428, "epoch": 1764} {"train_loss": -12.028858184814453, "global_step": 296429, "epoch": 1764} {"train_loss": -11.839802742004395, "global_step": 296430, "epoch": 1764} {"train_loss": -11.788052558898926, "global_step": 296431, "epoch": 1764} {"train_loss": -11.950979232788086, "global_step": 296432, "epoch": 1764} {"train_loss": -12.24945068359375, "global_step": 296433, "epoch": 1764} {"train_loss": -12.22349739074707, "global_step": 296434, "epoch": 1764} {"train_loss": -12.347172737121582, "global_step": 296435, "epoch": 1764} {"train_loss": -12.020330429077148, "global_step": 296436, "epoch": 1764} {"train_loss": -12.133621215820312, "global_step": 296437, "epoch": 1764} {"train_loss": -12.120336532592773, "global_step": 296438, "epoch": 1764} {"train_loss": -12.272212982177734, "global_step": 296439, "epoch": 1764} {"train_loss": -12.323596954345703, "global_step": 296440, "epoch": 1764} {"train_loss": -12.252643585205078, "global_step": 296441, "epoch": 1764} {"train_loss": -12.317275047302246, "global_step": 296442, "epoch": 1764} {"train_loss": -12.273236274719238, "global_step": 296443, "epoch": 1764} {"train_loss": -12.018819808959961, "global_step": 296444, "epoch": 1764} {"train_loss": -12.366056442260742, "global_step": 296445, "epoch": 1764} {"train_loss": -12.17502498626709, "global_step": 296446, "epoch": 1764} {"train_loss": -11.432275772094727, "global_step": 296447, "epoch": 1764} {"train_loss": -11.510334968566895, "global_step": 296448, "epoch": 1764} {"train_loss": -11.709161758422852, "global_step": 296449, "epoch": 1764} {"train_loss": -11.444061279296875, "global_step": 296450, "epoch": 1764} {"train_loss": -9.436464309692383, "global_step": 296451, "epoch": 1764} {"train_loss": -12.07210636138916, "global_step": 296452, "epoch": 1764} {"train_loss": -10.184944152832031, "global_step": 296453, "epoch": 1764} {"train_loss": -11.272909164428711, "global_step": 296454, "epoch": 1764} {"train_loss": -11.289566040039062, "global_step": 296455, "epoch": 1764} {"train_loss": -8.443005561828613, "global_step": 296456, "epoch": 1764} {"train_loss": -11.635027885437012, "global_step": 296457, "epoch": 1764} {"train_loss": -10.898215293884277, "global_step": 296458, "epoch": 1764} {"train_loss": -9.284725189208984, "global_step": 296459, "epoch": 1764} {"train_loss": -10.391691207885742, "global_step": 296460, "epoch": 1764} {"train_loss": -11.370285987854004, "global_step": 296461, "epoch": 1764} {"train_loss": -9.44781494140625, "global_step": 296462, "epoch": 1764} {"train_loss": -10.68940544128418, "global_step": 296463, "epoch": 1764} {"train_loss": -9.197627067565918, "global_step": 296464, "epoch": 1764} {"train_loss": -9.762177467346191, "global_step": 296465, "epoch": 1764} {"train_loss": -10.764941215515137, "global_step": 296466, "epoch": 1764} {"train_loss": -9.324912071228027, "global_step": 296467, "epoch": 1764} {"train_loss": -9.720444679260254, "global_step": 296468, "epoch": 1764} {"train_loss": -10.874456405639648, "global_step": 296469, "epoch": 1764} {"train_loss": -10.025275230407715, "global_step": 296470, "epoch": 1764} {"train_loss": -10.411911964416504, "global_step": 296471, "epoch": 1764} {"train_loss": -10.526750564575195, "global_step": 296472, "epoch": 1764} {"train_loss": -10.662508010864258, "global_step": 296473, "epoch": 1764} {"train_loss": -10.769098281860352, "global_step": 296474, "epoch": 1764} {"train_loss": -10.278955459594727, "global_step": 296475, "epoch": 1764} {"train_loss": -10.313858032226562, "global_step": 296476, "epoch": 1764} {"train_loss": -10.298669815063477, "global_step": 296477, "epoch": 1764} {"train_loss": -10.791984558105469, "global_step": 296478, "epoch": 1764} {"train_loss": -10.451581954956055, "global_step": 296479, "epoch": 1764} {"train_loss": -10.87257194519043, "global_step": 296480, "epoch": 1764} {"train_loss": -10.43971061706543, "global_step": 296481, "epoch": 1764} {"train_loss": -11.548165321350098, "global_step": 296482, "epoch": 1764} {"train_loss": -10.127257347106934, "global_step": 296483, "epoch": 1764} {"train_loss": -11.621145248413086, "global_step": 296484, "epoch": 1764} {"train_loss": -10.641271591186523, "global_step": 296485, "epoch": 1764} {"train_loss": -11.651310920715332, "global_step": 296486, "epoch": 1764} {"train_loss": -10.494261741638184, "global_step": 296487, "epoch": 1764} {"train_loss": -11.505084991455078, "global_step": 296488, "epoch": 1764} {"train_loss": -11.036796569824219, "global_step": 296489, "epoch": 1764} {"train_loss": -11.621962547302246, "global_step": 296490, "epoch": 1764} {"train_loss": -11.039735794067383, "global_step": 296491, "epoch": 1764} {"train_loss": -11.586366653442383, "global_step": 296492, "epoch": 1764} {"train_loss": -11.422042846679688, "global_step": 296493, "epoch": 1764} {"train_loss": -11.718372344970703, "global_step": 296494, "epoch": 1764} {"train_loss": -11.585830688476562, "global_step": 296495, "epoch": 1764} {"train_loss": -11.874080657958984, "global_step": 296496, "epoch": 1764} {"train_loss": -11.647726058959961, "global_step": 296497, "epoch": 1764} {"train_loss": -11.974626541137695, "global_step": 296498, "epoch": 1764} {"train_loss": -11.81265640258789, "global_step": 296499, "epoch": 1764} {"train_loss": -11.721115112304688, "global_step": 296500, "epoch": 1764} {"train_loss": -11.836784362792969, "global_step": 296501, "epoch": 1764} {"train_loss": -11.70744514465332, "global_step": 296502, "epoch": 1764} {"train_loss": -11.931215286254883, "global_step": 296503, "epoch": 1764} {"train_loss": -12.016060829162598, "global_step": 296504, "epoch": 1764} {"train_loss": -12.007190704345703, "global_step": 296505, "epoch": 1764} {"train_loss": -11.957256317138672, "global_step": 296506, "epoch": 1764} {"train_loss": -11.894231796264648, "global_step": 296507, "epoch": 1764} {"train_loss": -12.200563430786133, "global_step": 296508, "epoch": 1764} {"train_loss": -11.941425323486328, "global_step": 296509, "epoch": 1764} {"train_loss": -11.964934349060059, "global_step": 296510, "epoch": 1764} {"train_loss": -11.984068870544434, "global_step": 296511, "epoch": 1764} {"train_loss": -12.234572410583496, "global_step": 296512, "epoch": 1764} {"train_loss": -12.129571914672852, "global_step": 296513, "epoch": 1764} {"train_loss": -12.110248565673828, "global_step": 296514, "epoch": 1764} {"train_loss": -12.153189659118652, "global_step": 296515, "epoch": 1764} {"train_loss": -12.0903902053833, "global_step": 296516, "epoch": 1764} {"train_loss": -12.094712257385254, "global_step": 296517, "epoch": 1764} {"train_loss": -12.239324569702148, "global_step": 296518, "epoch": 1764} {"train_loss": -11.599348493984767, "global_step": 296519, "epoch": 1764, "val_loss": 280239.53125} {"train_loss": -11.839767456054688, "global_step": 296520, "epoch": 1765} {"train_loss": -12.213197708129883, "global_step": 296521, "epoch": 1765} {"train_loss": -12.133030891418457, "global_step": 296522, "epoch": 1765} {"train_loss": -12.19668960571289, "global_step": 296523, "epoch": 1765} {"train_loss": -12.135525703430176, "global_step": 296524, "epoch": 1765} {"train_loss": -12.08195686340332, "global_step": 296525, "epoch": 1765} {"train_loss": -12.190326690673828, "global_step": 296526, "epoch": 1765} {"train_loss": -12.151373863220215, "global_step": 296527, "epoch": 1765} {"train_loss": -12.212468147277832, "global_step": 296528, "epoch": 1765} {"train_loss": -12.088748931884766, "global_step": 296529, "epoch": 1765} {"train_loss": -12.302840232849121, "global_step": 296530, "epoch": 1765} {"train_loss": -11.940832138061523, "global_step": 296531, "epoch": 1765} {"train_loss": -12.290763854980469, "global_step": 296532, "epoch": 1765} {"train_loss": -12.017868041992188, "global_step": 296533, "epoch": 1765} {"train_loss": -12.28021240234375, "global_step": 296534, "epoch": 1765} {"train_loss": -12.078367233276367, "global_step": 296535, "epoch": 1765} {"train_loss": -12.302364349365234, "global_step": 296536, "epoch": 1765} {"train_loss": -12.110564231872559, "global_step": 296537, "epoch": 1765} {"train_loss": -12.35222053527832, "global_step": 296538, "epoch": 1765} {"train_loss": -12.379117965698242, "global_step": 296539, "epoch": 1765} {"train_loss": -12.067983627319336, "global_step": 296540, "epoch": 1765} {"train_loss": -12.444665908813477, "global_step": 296541, "epoch": 1765} {"train_loss": -12.42093276977539, "global_step": 296542, "epoch": 1765} {"train_loss": -12.45608901977539, "global_step": 296543, "epoch": 1765} {"train_loss": -12.353882789611816, "global_step": 296544, "epoch": 1765} {"train_loss": -12.054102897644043, "global_step": 296545, "epoch": 1765} {"train_loss": -12.424612045288086, "global_step": 296546, "epoch": 1765} {"train_loss": -12.44093132019043, "global_step": 296547, "epoch": 1765} {"train_loss": -12.389330863952637, "global_step": 296548, "epoch": 1765} {"train_loss": -12.477713584899902, "global_step": 296549, "epoch": 1765} {"train_loss": -12.380443572998047, "global_step": 296550, "epoch": 1765} {"train_loss": -12.200966835021973, "global_step": 296551, "epoch": 1765} {"train_loss": -12.516674041748047, "global_step": 296552, "epoch": 1765} {"train_loss": -12.352592468261719, "global_step": 296553, "epoch": 1765} {"train_loss": -12.42778205871582, "global_step": 296554, "epoch": 1765} {"train_loss": -12.390256881713867, "global_step": 296555, "epoch": 1765} {"train_loss": -12.389123916625977, "global_step": 296556, "epoch": 1765} {"train_loss": -12.457815170288086, "global_step": 296557, "epoch": 1765} {"train_loss": -12.380409240722656, "global_step": 296558, "epoch": 1765} {"train_loss": -12.650230407714844, "global_step": 296559, "epoch": 1765} {"train_loss": -12.575507164001465, "global_step": 296560, "epoch": 1765} {"train_loss": -12.17483901977539, "global_step": 296561, "epoch": 1765} {"train_loss": -12.468228340148926, "global_step": 296562, "epoch": 1765} {"train_loss": -12.317778587341309, "global_step": 296563, "epoch": 1765} {"train_loss": -11.745354652404785, "global_step": 296564, "epoch": 1765} {"train_loss": -12.159814834594727, "global_step": 296565, "epoch": 1765} {"train_loss": -12.416534423828125, "global_step": 296566, "epoch": 1765} {"train_loss": -12.062963485717773, "global_step": 296567, "epoch": 1765} {"train_loss": -12.637168884277344, "global_step": 296568, "epoch": 1765} {"train_loss": -12.132065773010254, "global_step": 296569, "epoch": 1765} {"train_loss": -11.95860481262207, "global_step": 296570, "epoch": 1765} {"train_loss": -11.984317779541016, "global_step": 296571, "epoch": 1765} {"train_loss": -12.553519248962402, "global_step": 296572, "epoch": 1765} {"train_loss": -12.317556381225586, "global_step": 296573, "epoch": 1765} {"train_loss": -12.331878662109375, "global_step": 296574, "epoch": 1765} {"train_loss": -12.259170532226562, "global_step": 296575, "epoch": 1765} {"train_loss": -12.474271774291992, "global_step": 296576, "epoch": 1765} {"train_loss": -12.451537132263184, "global_step": 296577, "epoch": 1765} {"train_loss": -12.21839427947998, "global_step": 296578, "epoch": 1765} {"train_loss": -12.016790390014648, "global_step": 296579, "epoch": 1765} {"train_loss": -11.416532516479492, "global_step": 296580, "epoch": 1765} {"train_loss": -11.868341445922852, "global_step": 296581, "epoch": 1765} {"train_loss": -11.621162414550781, "global_step": 296582, "epoch": 1765} {"train_loss": -10.002429008483887, "global_step": 296583, "epoch": 1765} {"train_loss": -10.411108016967773, "global_step": 296584, "epoch": 1765} {"train_loss": -9.569363594055176, "global_step": 296585, "epoch": 1765} {"train_loss": -8.223002433776855, "global_step": 296586, "epoch": 1765} {"train_loss": -8.316604614257812, "global_step": 296587, "epoch": 1765} {"train_loss": -10.7681303024292, "global_step": 296588, "epoch": 1765} {"train_loss": -7.984586238861084, "global_step": 296589, "epoch": 1765} {"train_loss": -8.128622055053711, "global_step": 296590, "epoch": 1765} {"train_loss": -8.401959419250488, "global_step": 296591, "epoch": 1765} {"train_loss": -8.5133638381958, "global_step": 296592, "epoch": 1765} {"train_loss": -9.35795783996582, "global_step": 296593, "epoch": 1765} {"train_loss": -9.481369018554688, "global_step": 296594, "epoch": 1765} {"train_loss": -9.776029586791992, "global_step": 296595, "epoch": 1765} {"train_loss": -9.867486953735352, "global_step": 296596, "epoch": 1765} {"train_loss": -9.763211250305176, "global_step": 296597, "epoch": 1765} {"train_loss": -9.442486763000488, "global_step": 296598, "epoch": 1765} {"train_loss": -10.011795043945312, "global_step": 296599, "epoch": 1765} {"train_loss": -10.557687759399414, "global_step": 296600, "epoch": 1765} {"train_loss": -9.353363037109375, "global_step": 296601, "epoch": 1765} {"train_loss": -10.40114688873291, "global_step": 296602, "epoch": 1765} {"train_loss": -9.994180679321289, "global_step": 296603, "epoch": 1765} {"train_loss": -8.200281143188477, "global_step": 296604, "epoch": 1765} {"train_loss": -8.088719367980957, "global_step": 296605, "epoch": 1765} {"train_loss": -8.087203025817871, "global_step": 296606, "epoch": 1765} {"train_loss": -9.487131118774414, "global_step": 296607, "epoch": 1765} {"train_loss": -10.301422119140625, "global_step": 296608, "epoch": 1765} {"train_loss": -9.401851654052734, "global_step": 296609, "epoch": 1765} {"train_loss": -10.474934577941895, "global_step": 296610, "epoch": 1765} {"train_loss": -10.602956771850586, "global_step": 296611, "epoch": 1765} {"train_loss": -10.698007583618164, "global_step": 296612, "epoch": 1765} {"train_loss": -10.759531021118164, "global_step": 296613, "epoch": 1765} {"train_loss": -10.855499267578125, "global_step": 296614, "epoch": 1765} {"train_loss": -10.818227767944336, "global_step": 296615, "epoch": 1765} {"train_loss": -11.160416603088379, "global_step": 296616, "epoch": 1765} {"train_loss": -10.33609390258789, "global_step": 296617, "epoch": 1765} {"train_loss": -11.361371040344238, "global_step": 296618, "epoch": 1765} {"train_loss": -11.043769836425781, "global_step": 296619, "epoch": 1765} {"train_loss": -10.568748474121094, "global_step": 296620, "epoch": 1765} {"train_loss": -11.359004020690918, "global_step": 296621, "epoch": 1765} {"train_loss": -11.197417259216309, "global_step": 296622, "epoch": 1765} {"train_loss": -11.429701805114746, "global_step": 296623, "epoch": 1765} {"train_loss": -11.516045570373535, "global_step": 296624, "epoch": 1765} {"train_loss": -11.73099136352539, "global_step": 296625, "epoch": 1765} {"train_loss": -11.615686416625977, "global_step": 296626, "epoch": 1765} {"train_loss": -11.446977615356445, "global_step": 296627, "epoch": 1765} {"train_loss": -11.547743797302246, "global_step": 296628, "epoch": 1765} {"train_loss": -11.779090881347656, "global_step": 296629, "epoch": 1765} {"train_loss": -11.79850959777832, "global_step": 296630, "epoch": 1765} {"train_loss": -11.562545776367188, "global_step": 296631, "epoch": 1765} {"train_loss": -11.751558303833008, "global_step": 296632, "epoch": 1765} {"train_loss": -11.698606491088867, "global_step": 296633, "epoch": 1765} {"train_loss": -11.47375202178955, "global_step": 296634, "epoch": 1765} {"train_loss": -11.861226081848145, "global_step": 296635, "epoch": 1765} {"train_loss": -11.761430740356445, "global_step": 296636, "epoch": 1765} {"train_loss": -11.871160507202148, "global_step": 296637, "epoch": 1765} {"train_loss": -11.71609115600586, "global_step": 296638, "epoch": 1765} {"train_loss": -12.01618766784668, "global_step": 296639, "epoch": 1765} {"train_loss": -11.873678207397461, "global_step": 296640, "epoch": 1765} {"train_loss": -12.003378868103027, "global_step": 296641, "epoch": 1765} {"train_loss": -12.067974090576172, "global_step": 296642, "epoch": 1765} {"train_loss": -12.031352996826172, "global_step": 296643, "epoch": 1765} {"train_loss": -11.956238746643066, "global_step": 296644, "epoch": 1765} {"train_loss": -11.91049575805664, "global_step": 296645, "epoch": 1765} {"train_loss": -11.884937286376953, "global_step": 296646, "epoch": 1765} {"train_loss": -11.818025588989258, "global_step": 296647, "epoch": 1765} {"train_loss": -11.995936393737793, "global_step": 296648, "epoch": 1765} {"train_loss": -11.744668960571289, "global_step": 296649, "epoch": 1765} {"train_loss": -12.229934692382812, "global_step": 296650, "epoch": 1765} {"train_loss": -11.86036491394043, "global_step": 296651, "epoch": 1765} {"train_loss": -11.997940063476562, "global_step": 296652, "epoch": 1765} {"train_loss": -11.862059593200684, "global_step": 296653, "epoch": 1765} {"train_loss": -12.13470458984375, "global_step": 296654, "epoch": 1765} {"train_loss": -11.991180419921875, "global_step": 296655, "epoch": 1765} {"train_loss": -12.012752532958984, "global_step": 296656, "epoch": 1765} {"train_loss": -11.96335506439209, "global_step": 296657, "epoch": 1765} {"train_loss": -11.903347969055176, "global_step": 296658, "epoch": 1765} {"train_loss": -12.170156478881836, "global_step": 296659, "epoch": 1765} {"train_loss": -12.031314849853516, "global_step": 296660, "epoch": 1765} {"train_loss": -12.127449035644531, "global_step": 296661, "epoch": 1765} {"train_loss": -11.941423416137695, "global_step": 296662, "epoch": 1765} {"train_loss": -12.142659187316895, "global_step": 296663, "epoch": 1765} {"train_loss": -11.960277557373047, "global_step": 296664, "epoch": 1765} {"train_loss": -12.034255027770996, "global_step": 296665, "epoch": 1765} {"train_loss": -12.097777366638184, "global_step": 296666, "epoch": 1765} {"train_loss": -12.198175430297852, "global_step": 296667, "epoch": 1765} {"train_loss": -11.81587028503418, "global_step": 296668, "epoch": 1765} {"train_loss": -11.977951049804688, "global_step": 296669, "epoch": 1765} {"train_loss": -11.66061019897461, "global_step": 296670, "epoch": 1765} {"train_loss": -11.642044067382812, "global_step": 296671, "epoch": 1765} {"train_loss": -11.847222328186035, "global_step": 296672, "epoch": 1765} {"train_loss": -10.371063232421875, "global_step": 296673, "epoch": 1765} {"train_loss": -11.921598434448242, "global_step": 296674, "epoch": 1765} {"train_loss": -10.543760299682617, "global_step": 296675, "epoch": 1765} {"train_loss": -11.664327621459961, "global_step": 296676, "epoch": 1765} {"train_loss": -11.434236526489258, "global_step": 296677, "epoch": 1765} {"train_loss": -11.56739616394043, "global_step": 296678, "epoch": 1765} {"train_loss": -11.970104217529297, "global_step": 296679, "epoch": 1765} {"train_loss": -11.588054656982422, "global_step": 296680, "epoch": 1765} {"train_loss": -11.995040893554688, "global_step": 296681, "epoch": 1765} {"train_loss": -11.190174102783203, "global_step": 296682, "epoch": 1765} {"train_loss": -11.081825256347656, "global_step": 296683, "epoch": 1765} {"train_loss": -11.856694221496582, "global_step": 296684, "epoch": 1765} {"train_loss": -12.134292602539062, "global_step": 296685, "epoch": 1765} {"train_loss": -11.87629222869873, "global_step": 296686, "epoch": 1765} {"train_loss": -11.493127280757541, "global_step": 296687, "epoch": 1765, "val_loss": 275720.40625, "train_action_mse_error": 2.128370523452759} {"train_loss": -11.394296646118164, "global_step": 296688, "epoch": 1766} {"train_loss": -11.886411666870117, "global_step": 296689, "epoch": 1766} {"train_loss": -11.882284164428711, "global_step": 296690, "epoch": 1766} {"train_loss": -12.110539436340332, "global_step": 296691, "epoch": 1766} {"train_loss": -12.10818862915039, "global_step": 296692, "epoch": 1766} {"train_loss": -12.208662033081055, "global_step": 296693, "epoch": 1766} {"train_loss": -12.023435592651367, "global_step": 296694, "epoch": 1766} {"train_loss": -12.084949493408203, "global_step": 296695, "epoch": 1766} {"train_loss": -12.01266098022461, "global_step": 296696, "epoch": 1766} {"train_loss": -12.041651725769043, "global_step": 296697, "epoch": 1766} {"train_loss": -12.219496726989746, "global_step": 296698, "epoch": 1766} {"train_loss": -12.10395622253418, "global_step": 296699, "epoch": 1766} {"train_loss": -12.236429214477539, "global_step": 296700, "epoch": 1766} {"train_loss": -12.101290702819824, "global_step": 296701, "epoch": 1766} {"train_loss": -12.385025024414062, "global_step": 296702, "epoch": 1766} {"train_loss": -12.195028305053711, "global_step": 296703, "epoch": 1766} {"train_loss": -12.100981712341309, "global_step": 296704, "epoch": 1766} {"train_loss": -12.450838088989258, "global_step": 296705, "epoch": 1766} {"train_loss": -12.117780685424805, "global_step": 296706, "epoch": 1766} {"train_loss": -12.251426696777344, "global_step": 296707, "epoch": 1766} {"train_loss": -12.378814697265625, "global_step": 296708, "epoch": 1766} {"train_loss": -12.359530448913574, "global_step": 296709, "epoch": 1766} {"train_loss": -12.243840217590332, "global_step": 296710, "epoch": 1766} {"train_loss": -12.156723022460938, "global_step": 296711, "epoch": 1766} {"train_loss": -12.297680854797363, "global_step": 296712, "epoch": 1766} {"train_loss": -12.195234298706055, "global_step": 296713, "epoch": 1766} {"train_loss": -12.325254440307617, "global_step": 296714, "epoch": 1766} {"train_loss": -12.06961441040039, "global_step": 296715, "epoch": 1766} {"train_loss": -12.344793319702148, "global_step": 296716, "epoch": 1766} {"train_loss": -11.991250991821289, "global_step": 296717, "epoch": 1766} {"train_loss": -12.22648811340332, "global_step": 296718, "epoch": 1766} {"train_loss": -12.33837604522705, "global_step": 296719, "epoch": 1766} {"train_loss": -12.313583374023438, "global_step": 296720, "epoch": 1766} {"train_loss": -12.354732513427734, "global_step": 296721, "epoch": 1766} {"train_loss": -12.095531463623047, "global_step": 296722, "epoch": 1766} {"train_loss": -11.811458587646484, "global_step": 296723, "epoch": 1766} {"train_loss": -12.306510925292969, "global_step": 296724, "epoch": 1766} {"train_loss": -11.985067367553711, "global_step": 296725, "epoch": 1766} {"train_loss": -12.136764526367188, "global_step": 296726, "epoch": 1766} {"train_loss": -12.18044662475586, "global_step": 296727, "epoch": 1766} {"train_loss": -12.386087417602539, "global_step": 296728, "epoch": 1766} {"train_loss": -12.236625671386719, "global_step": 296729, "epoch": 1766} {"train_loss": -12.502687454223633, "global_step": 296730, "epoch": 1766} {"train_loss": -12.321882247924805, "global_step": 296731, "epoch": 1766} {"train_loss": -12.522089004516602, "global_step": 296732, "epoch": 1766} {"train_loss": -11.923005104064941, "global_step": 296733, "epoch": 1766} {"train_loss": -12.361349105834961, "global_step": 296734, "epoch": 1766} {"train_loss": -12.378889083862305, "global_step": 296735, "epoch": 1766} {"train_loss": -12.142354965209961, "global_step": 296736, "epoch": 1766} {"train_loss": -12.34676742553711, "global_step": 296737, "epoch": 1766} {"train_loss": -12.055546760559082, "global_step": 296738, "epoch": 1766} {"train_loss": -12.185567855834961, "global_step": 296739, "epoch": 1766} {"train_loss": -12.31922435760498, "global_step": 296740, "epoch": 1766} {"train_loss": -12.51968002319336, "global_step": 296741, "epoch": 1766} {"train_loss": -12.288515090942383, "global_step": 296742, "epoch": 1766} {"train_loss": -12.322050094604492, "global_step": 296743, "epoch": 1766} {"train_loss": -12.2713623046875, "global_step": 296744, "epoch": 1766} {"train_loss": -12.275912284851074, "global_step": 296745, "epoch": 1766} {"train_loss": -12.374382019042969, "global_step": 296746, "epoch": 1766} {"train_loss": -12.061113357543945, "global_step": 296747, "epoch": 1766} {"train_loss": -12.539078712463379, "global_step": 296748, "epoch": 1766} {"train_loss": -12.144740104675293, "global_step": 296749, "epoch": 1766} {"train_loss": -12.227616310119629, "global_step": 296750, "epoch": 1766} {"train_loss": -12.118663787841797, "global_step": 296751, "epoch": 1766} {"train_loss": -12.376020431518555, "global_step": 296752, "epoch": 1766} {"train_loss": -11.981099128723145, "global_step": 296753, "epoch": 1766} {"train_loss": -11.417320251464844, "global_step": 296754, "epoch": 1766} {"train_loss": -11.78636646270752, "global_step": 296755, "epoch": 1766} {"train_loss": -10.776103973388672, "global_step": 296756, "epoch": 1766} {"train_loss": -11.2031888961792, "global_step": 296757, "epoch": 1766} {"train_loss": -8.991891860961914, "global_step": 296758, "epoch": 1766} {"train_loss": -8.625442504882812, "global_step": 296759, "epoch": 1766} {"train_loss": -8.969831466674805, "global_step": 296760, "epoch": 1766} {"train_loss": -10.491000175476074, "global_step": 296761, "epoch": 1766} {"train_loss": -10.799650192260742, "global_step": 296762, "epoch": 1766} {"train_loss": -9.34244155883789, "global_step": 296763, "epoch": 1766} {"train_loss": -10.880298614501953, "global_step": 296764, "epoch": 1766} {"train_loss": -9.899452209472656, "global_step": 296765, "epoch": 1766} {"train_loss": -9.130520820617676, "global_step": 296766, "epoch": 1766} {"train_loss": -7.688076019287109, "global_step": 296767, "epoch": 1766} {"train_loss": -11.362007141113281, "global_step": 296768, "epoch": 1766} {"train_loss": -8.041281700134277, "global_step": 296769, "epoch": 1766} {"train_loss": -10.183890342712402, "global_step": 296770, "epoch": 1766} {"train_loss": -6.767911911010742, "global_step": 296771, "epoch": 1766} {"train_loss": -7.874894618988037, "global_step": 296772, "epoch": 1766} {"train_loss": -9.060401916503906, "global_step": 296773, "epoch": 1766} {"train_loss": -7.575390815734863, "global_step": 296774, "epoch": 1766} {"train_loss": -9.587396621704102, "global_step": 296775, "epoch": 1766} {"train_loss": -8.402950286865234, "global_step": 296776, "epoch": 1766} {"train_loss": -9.783794403076172, "global_step": 296777, "epoch": 1766} {"train_loss": -8.901077270507812, "global_step": 296778, "epoch": 1766} {"train_loss": -8.762773513793945, "global_step": 296779, "epoch": 1766} {"train_loss": -9.037830352783203, "global_step": 296780, "epoch": 1766} {"train_loss": -10.14371109008789, "global_step": 296781, "epoch": 1766} {"train_loss": -8.90231704711914, "global_step": 296782, "epoch": 1766} {"train_loss": -7.549612522125244, "global_step": 296783, "epoch": 1766} {"train_loss": -9.554141998291016, "global_step": 296784, "epoch": 1766} {"train_loss": -9.08465576171875, "global_step": 296785, "epoch": 1766} {"train_loss": -9.53463077545166, "global_step": 296786, "epoch": 1766} {"train_loss": -9.692520141601562, "global_step": 296787, "epoch": 1766} {"train_loss": -10.646902084350586, "global_step": 296788, "epoch": 1766} {"train_loss": -10.451634407043457, "global_step": 296789, "epoch": 1766} {"train_loss": -9.87835693359375, "global_step": 296790, "epoch": 1766} {"train_loss": -10.086235046386719, "global_step": 296791, "epoch": 1766} {"train_loss": -10.962883949279785, "global_step": 296792, "epoch": 1766} {"train_loss": -9.811552047729492, "global_step": 296793, "epoch": 1766} {"train_loss": -10.344897270202637, "global_step": 296794, "epoch": 1766} {"train_loss": -11.292474746704102, "global_step": 296795, "epoch": 1766} {"train_loss": -10.71024227142334, "global_step": 296796, "epoch": 1766} {"train_loss": -10.762870788574219, "global_step": 296797, "epoch": 1766} {"train_loss": -11.19709300994873, "global_step": 296798, "epoch": 1766} {"train_loss": -10.962124824523926, "global_step": 296799, "epoch": 1766} {"train_loss": -10.648370742797852, "global_step": 296800, "epoch": 1766} {"train_loss": -11.080648422241211, "global_step": 296801, "epoch": 1766} {"train_loss": -11.492608070373535, "global_step": 296802, "epoch": 1766} {"train_loss": -10.83465576171875, "global_step": 296803, "epoch": 1766} {"train_loss": -11.265287399291992, "global_step": 296804, "epoch": 1766} {"train_loss": -11.487834930419922, "global_step": 296805, "epoch": 1766} {"train_loss": -11.198677062988281, "global_step": 296806, "epoch": 1766} {"train_loss": -11.386130332946777, "global_step": 296807, "epoch": 1766} {"train_loss": -11.730463027954102, "global_step": 296808, "epoch": 1766} {"train_loss": -11.505447387695312, "global_step": 296809, "epoch": 1766} {"train_loss": -11.171920776367188, "global_step": 296810, "epoch": 1766} {"train_loss": -11.735440254211426, "global_step": 296811, "epoch": 1766} {"train_loss": -11.788966178894043, "global_step": 296812, "epoch": 1766} {"train_loss": -11.546207427978516, "global_step": 296813, "epoch": 1766} {"train_loss": -11.400266647338867, "global_step": 296814, "epoch": 1766} {"train_loss": -11.862642288208008, "global_step": 296815, "epoch": 1766} {"train_loss": -11.427452087402344, "global_step": 296816, "epoch": 1766} {"train_loss": -11.734171867370605, "global_step": 296817, "epoch": 1766} {"train_loss": -11.78138256072998, "global_step": 296818, "epoch": 1766} {"train_loss": -11.559059143066406, "global_step": 296819, "epoch": 1766} {"train_loss": -11.79489803314209, "global_step": 296820, "epoch": 1766} {"train_loss": -11.749933242797852, "global_step": 296821, "epoch": 1766} {"train_loss": -11.796173095703125, "global_step": 296822, "epoch": 1766} {"train_loss": -11.972721099853516, "global_step": 296823, "epoch": 1766} {"train_loss": -11.734186172485352, "global_step": 296824, "epoch": 1766} {"train_loss": -11.750123977661133, "global_step": 296825, "epoch": 1766} {"train_loss": -11.852628707885742, "global_step": 296826, "epoch": 1766} {"train_loss": -11.757684707641602, "global_step": 296827, "epoch": 1766} {"train_loss": -12.080484390258789, "global_step": 296828, "epoch": 1766} {"train_loss": -11.91280460357666, "global_step": 296829, "epoch": 1766} {"train_loss": -11.716728210449219, "global_step": 296830, "epoch": 1766} {"train_loss": -11.943410873413086, "global_step": 296831, "epoch": 1766} {"train_loss": -11.612569808959961, "global_step": 296832, "epoch": 1766} {"train_loss": -11.977193832397461, "global_step": 296833, "epoch": 1766} {"train_loss": -12.047727584838867, "global_step": 296834, "epoch": 1766} {"train_loss": -11.76815414428711, "global_step": 296835, "epoch": 1766} {"train_loss": -11.95048999786377, "global_step": 296836, "epoch": 1766} {"train_loss": -12.081121444702148, "global_step": 296837, "epoch": 1766} {"train_loss": -12.102594375610352, "global_step": 296838, "epoch": 1766} {"train_loss": -11.977943420410156, "global_step": 296839, "epoch": 1766} {"train_loss": -12.062910079956055, "global_step": 296840, "epoch": 1766} {"train_loss": -12.047897338867188, "global_step": 296841, "epoch": 1766} {"train_loss": -11.842232704162598, "global_step": 296842, "epoch": 1766} {"train_loss": -12.170510292053223, "global_step": 296843, "epoch": 1766} {"train_loss": -11.96432113647461, "global_step": 296844, "epoch": 1766} {"train_loss": -12.020698547363281, "global_step": 296845, "epoch": 1766} {"train_loss": -11.964351654052734, "global_step": 296846, "epoch": 1766} {"train_loss": -12.037863731384277, "global_step": 296847, "epoch": 1766} {"train_loss": -12.082663536071777, "global_step": 296848, "epoch": 1766} {"train_loss": -11.864051818847656, "global_step": 296849, "epoch": 1766} {"train_loss": -11.923028945922852, "global_step": 296850, "epoch": 1766} {"train_loss": -11.90683364868164, "global_step": 296851, "epoch": 1766} {"train_loss": -11.920808792114258, "global_step": 296852, "epoch": 1766} {"train_loss": -11.976346015930176, "global_step": 296853, "epoch": 1766} {"train_loss": -11.77864933013916, "global_step": 296854, "epoch": 1766} {"train_loss": -11.368985159056527, "global_step": 296855, "epoch": 1766, "val_loss": 275165.21875} {"train_loss": -11.847467422485352, "global_step": 296856, "epoch": 1767} {"train_loss": -12.157613754272461, "global_step": 296857, "epoch": 1767} {"train_loss": -12.150167465209961, "global_step": 296858, "epoch": 1767} {"train_loss": -12.169046401977539, "global_step": 296859, "epoch": 1767} {"train_loss": -12.15433120727539, "global_step": 296860, "epoch": 1767} {"train_loss": -12.250812530517578, "global_step": 296861, "epoch": 1767} {"train_loss": -12.02787971496582, "global_step": 296862, "epoch": 1767} {"train_loss": -12.19833755493164, "global_step": 296863, "epoch": 1767} {"train_loss": -11.784143447875977, "global_step": 296864, "epoch": 1767} {"train_loss": -12.096709251403809, "global_step": 296865, "epoch": 1767} {"train_loss": -12.293329238891602, "global_step": 296866, "epoch": 1767} {"train_loss": -11.959430694580078, "global_step": 296867, "epoch": 1767} {"train_loss": -11.733633041381836, "global_step": 296868, "epoch": 1767} {"train_loss": -12.227712631225586, "global_step": 296869, "epoch": 1767} {"train_loss": -12.093195915222168, "global_step": 296870, "epoch": 1767} {"train_loss": -12.369231224060059, "global_step": 296871, "epoch": 1767} {"train_loss": -12.271018981933594, "global_step": 296872, "epoch": 1767} {"train_loss": -12.350749969482422, "global_step": 296873, "epoch": 1767} {"train_loss": -12.41338062286377, "global_step": 296874, "epoch": 1767} {"train_loss": -12.254297256469727, "global_step": 296875, "epoch": 1767} {"train_loss": -12.397136688232422, "global_step": 296876, "epoch": 1767} {"train_loss": -12.421783447265625, "global_step": 296877, "epoch": 1767} {"train_loss": -12.077312469482422, "global_step": 296878, "epoch": 1767} {"train_loss": -12.395574569702148, "global_step": 296879, "epoch": 1767} {"train_loss": -12.325383186340332, "global_step": 296880, "epoch": 1767} {"train_loss": -12.359527587890625, "global_step": 296881, "epoch": 1767} {"train_loss": -12.438179016113281, "global_step": 296882, "epoch": 1767} {"train_loss": -12.374601364135742, "global_step": 296883, "epoch": 1767} {"train_loss": -12.518789291381836, "global_step": 296884, "epoch": 1767} {"train_loss": -12.399097442626953, "global_step": 296885, "epoch": 1767} {"train_loss": -12.546283721923828, "global_step": 296886, "epoch": 1767} {"train_loss": -12.248981475830078, "global_step": 296887, "epoch": 1767} {"train_loss": -12.452919006347656, "global_step": 296888, "epoch": 1767} {"train_loss": -12.29167366027832, "global_step": 296889, "epoch": 1767} {"train_loss": -12.398809432983398, "global_step": 296890, "epoch": 1767} {"train_loss": -12.278093338012695, "global_step": 296891, "epoch": 1767} {"train_loss": -12.552347183227539, "global_step": 296892, "epoch": 1767} {"train_loss": -12.39854621887207, "global_step": 296893, "epoch": 1767} {"train_loss": -12.592039108276367, "global_step": 296894, "epoch": 1767} {"train_loss": -12.48137092590332, "global_step": 296895, "epoch": 1767} {"train_loss": -12.435771942138672, "global_step": 296896, "epoch": 1767} {"train_loss": -12.467816352844238, "global_step": 296897, "epoch": 1767} {"train_loss": -12.325363159179688, "global_step": 296898, "epoch": 1767} {"train_loss": -12.450254440307617, "global_step": 296899, "epoch": 1767} {"train_loss": -12.318065643310547, "global_step": 296900, "epoch": 1767} {"train_loss": -12.4461669921875, "global_step": 296901, "epoch": 1767} {"train_loss": -12.232356071472168, "global_step": 296902, "epoch": 1767} {"train_loss": -12.405158996582031, "global_step": 296903, "epoch": 1767} {"train_loss": -12.37641429901123, "global_step": 296904, "epoch": 1767} {"train_loss": -12.49550724029541, "global_step": 296905, "epoch": 1767} {"train_loss": -12.31714916229248, "global_step": 296906, "epoch": 1767} {"train_loss": -12.539840698242188, "global_step": 296907, "epoch": 1767} {"train_loss": -12.064431190490723, "global_step": 296908, "epoch": 1767} {"train_loss": -12.155803680419922, "global_step": 296909, "epoch": 1767} {"train_loss": -12.385774612426758, "global_step": 296910, "epoch": 1767} {"train_loss": -12.39128303527832, "global_step": 296911, "epoch": 1767} {"train_loss": -12.217412948608398, "global_step": 296912, "epoch": 1767} {"train_loss": -11.70438289642334, "global_step": 296913, "epoch": 1767} {"train_loss": -10.783241271972656, "global_step": 296914, "epoch": 1767} {"train_loss": -11.526839256286621, "global_step": 296915, "epoch": 1767} {"train_loss": -11.360932350158691, "global_step": 296916, "epoch": 1767} {"train_loss": -12.317769050598145, "global_step": 296917, "epoch": 1767} {"train_loss": -11.126721382141113, "global_step": 296918, "epoch": 1767} {"train_loss": -12.16463565826416, "global_step": 296919, "epoch": 1767} {"train_loss": -10.42425537109375, "global_step": 296920, "epoch": 1767} {"train_loss": -11.106161117553711, "global_step": 296921, "epoch": 1767} {"train_loss": -10.398197174072266, "global_step": 296922, "epoch": 1767} {"train_loss": -12.133803367614746, "global_step": 296923, "epoch": 1767} {"train_loss": -9.472553253173828, "global_step": 296924, "epoch": 1767} {"train_loss": -9.01625919342041, "global_step": 296925, "epoch": 1767} {"train_loss": -11.28930377960205, "global_step": 296926, "epoch": 1767} {"train_loss": -11.350881576538086, "global_step": 296927, "epoch": 1767} {"train_loss": -9.788590431213379, "global_step": 296928, "epoch": 1767} {"train_loss": -10.877660751342773, "global_step": 296929, "epoch": 1767} {"train_loss": -9.647266387939453, "global_step": 296930, "epoch": 1767} {"train_loss": -10.13510513305664, "global_step": 296931, "epoch": 1767} {"train_loss": -10.867820739746094, "global_step": 296932, "epoch": 1767} {"train_loss": -7.9279022216796875, "global_step": 296933, "epoch": 1767} {"train_loss": -6.737672805786133, "global_step": 296934, "epoch": 1767} {"train_loss": -7.176090717315674, "global_step": 296935, "epoch": 1767} {"train_loss": -7.437290191650391, "global_step": 296936, "epoch": 1767} {"train_loss": -7.835768699645996, "global_step": 296937, "epoch": 1767} {"train_loss": -8.564567565917969, "global_step": 296938, "epoch": 1767} {"train_loss": -7.332415580749512, "global_step": 296939, "epoch": 1767} {"train_loss": -8.20159912109375, "global_step": 296940, "epoch": 1767} {"train_loss": -8.331565856933594, "global_step": 296941, "epoch": 1767} {"train_loss": -7.6812849044799805, "global_step": 296942, "epoch": 1767} {"train_loss": -8.113617897033691, "global_step": 296943, "epoch": 1767} {"train_loss": -8.663483619689941, "global_step": 296944, "epoch": 1767} {"train_loss": -9.328153610229492, "global_step": 296945, "epoch": 1767} {"train_loss": -9.427501678466797, "global_step": 296946, "epoch": 1767} {"train_loss": -9.423873901367188, "global_step": 296947, "epoch": 1767} {"train_loss": -10.074604034423828, "global_step": 296948, "epoch": 1767} {"train_loss": -9.485365867614746, "global_step": 296949, "epoch": 1767} {"train_loss": -10.156858444213867, "global_step": 296950, "epoch": 1767} {"train_loss": -10.346159934997559, "global_step": 296951, "epoch": 1767} {"train_loss": -10.103403091430664, "global_step": 296952, "epoch": 1767} {"train_loss": -9.3171968460083, "global_step": 296953, "epoch": 1767} {"train_loss": -10.349483489990234, "global_step": 296954, "epoch": 1767} {"train_loss": -10.25663948059082, "global_step": 296955, "epoch": 1767} {"train_loss": -9.622295379638672, "global_step": 296956, "epoch": 1767} {"train_loss": -11.024211883544922, "global_step": 296957, "epoch": 1767} {"train_loss": -10.705375671386719, "global_step": 296958, "epoch": 1767} {"train_loss": -10.420052528381348, "global_step": 296959, "epoch": 1767} {"train_loss": -10.631952285766602, "global_step": 296960, "epoch": 1767} {"train_loss": -11.094860076904297, "global_step": 296961, "epoch": 1767} {"train_loss": -10.581262588500977, "global_step": 296962, "epoch": 1767} {"train_loss": -11.289047241210938, "global_step": 296963, "epoch": 1767} {"train_loss": -11.143278121948242, "global_step": 296964, "epoch": 1767} {"train_loss": -11.15829849243164, "global_step": 296965, "epoch": 1767} {"train_loss": -11.21525764465332, "global_step": 296966, "epoch": 1767} {"train_loss": -11.365240097045898, "global_step": 296967, "epoch": 1767} {"train_loss": -11.399967193603516, "global_step": 296968, "epoch": 1767} {"train_loss": -11.325051307678223, "global_step": 296969, "epoch": 1767} {"train_loss": -11.448660850524902, "global_step": 296970, "epoch": 1767} {"train_loss": -11.117177963256836, "global_step": 296971, "epoch": 1767} {"train_loss": -11.065065383911133, "global_step": 296972, "epoch": 1767} {"train_loss": -11.417762756347656, "global_step": 296973, "epoch": 1767} {"train_loss": -11.283077239990234, "global_step": 296974, "epoch": 1767} {"train_loss": -11.449674606323242, "global_step": 296975, "epoch": 1767} {"train_loss": -11.50692081451416, "global_step": 296976, "epoch": 1767} {"train_loss": -11.251958847045898, "global_step": 296977, "epoch": 1767} {"train_loss": -11.409698486328125, "global_step": 296978, "epoch": 1767} {"train_loss": -11.506354331970215, "global_step": 296979, "epoch": 1767} {"train_loss": -11.372228622436523, "global_step": 296980, "epoch": 1767} {"train_loss": -11.365612030029297, "global_step": 296981, "epoch": 1767} {"train_loss": -10.95953369140625, "global_step": 296982, "epoch": 1767} {"train_loss": -11.916956901550293, "global_step": 296983, "epoch": 1767} {"train_loss": -11.000144958496094, "global_step": 296984, "epoch": 1767} {"train_loss": -12.083433151245117, "global_step": 296985, "epoch": 1767} {"train_loss": -11.306922912597656, "global_step": 296986, "epoch": 1767} {"train_loss": -11.864540100097656, "global_step": 296987, "epoch": 1767} {"train_loss": -11.589484214782715, "global_step": 296988, "epoch": 1767} {"train_loss": -11.871261596679688, "global_step": 296989, "epoch": 1767} {"train_loss": -11.181938171386719, "global_step": 296990, "epoch": 1767} {"train_loss": -11.834266662597656, "global_step": 296991, "epoch": 1767} {"train_loss": -11.52841854095459, "global_step": 296992, "epoch": 1767} {"train_loss": -11.87940788269043, "global_step": 296993, "epoch": 1767} {"train_loss": -11.809679985046387, "global_step": 296994, "epoch": 1767} {"train_loss": -11.761917114257812, "global_step": 296995, "epoch": 1767} {"train_loss": -11.891448974609375, "global_step": 296996, "epoch": 1767} {"train_loss": -12.022480010986328, "global_step": 296997, "epoch": 1767} {"train_loss": -11.627464294433594, "global_step": 296998, "epoch": 1767} {"train_loss": -11.95795726776123, "global_step": 296999, "epoch": 1767} {"train_loss": -12.036630630493164, "global_step": 297000, "epoch": 1767} {"train_loss": -12.07291030883789, "global_step": 297001, "epoch": 1767} {"train_loss": -11.76146411895752, "global_step": 297002, "epoch": 1767} {"train_loss": -11.822799682617188, "global_step": 297003, "epoch": 1767} {"train_loss": -11.70980167388916, "global_step": 297004, "epoch": 1767} {"train_loss": -12.057328224182129, "global_step": 297005, "epoch": 1767} {"train_loss": -11.82770824432373, "global_step": 297006, "epoch": 1767} {"train_loss": -11.948034286499023, "global_step": 297007, "epoch": 1767} {"train_loss": -12.100265502929688, "global_step": 297008, "epoch": 1767} {"train_loss": -12.151690483093262, "global_step": 297009, "epoch": 1767} {"train_loss": -11.700047492980957, "global_step": 297010, "epoch": 1767} {"train_loss": -12.069278717041016, "global_step": 297011, "epoch": 1767} {"train_loss": -12.1351318359375, "global_step": 297012, "epoch": 1767} {"train_loss": -12.01387882232666, "global_step": 297013, "epoch": 1767} {"train_loss": -12.234319686889648, "global_step": 297014, "epoch": 1767} {"train_loss": -12.085225105285645, "global_step": 297015, "epoch": 1767} {"train_loss": -11.939650535583496, "global_step": 297016, "epoch": 1767} {"train_loss": -12.196783065795898, "global_step": 297017, "epoch": 1767} {"train_loss": -11.91705322265625, "global_step": 297018, "epoch": 1767} {"train_loss": -12.134050369262695, "global_step": 297019, "epoch": 1767} {"train_loss": -12.14661693572998, "global_step": 297020, "epoch": 1767} {"train_loss": -12.085010528564453, "global_step": 297021, "epoch": 1767} {"train_loss": -12.365192413330078, "global_step": 297022, "epoch": 1767} {"train_loss": -11.359444831098829, "global_step": 297023, "epoch": 1767, "val_loss": 276399.9375} {"train_loss": -12.152176856994629, "global_step": 297024, "epoch": 1768} {"train_loss": -11.96455192565918, "global_step": 297025, "epoch": 1768} {"train_loss": -12.234436988830566, "global_step": 297026, "epoch": 1768} {"train_loss": -12.423468589782715, "global_step": 297027, "epoch": 1768} {"train_loss": -12.192827224731445, "global_step": 297028, "epoch": 1768} {"train_loss": -12.362728118896484, "global_step": 297029, "epoch": 1768} {"train_loss": -12.190183639526367, "global_step": 297030, "epoch": 1768} {"train_loss": -12.278605461120605, "global_step": 297031, "epoch": 1768} {"train_loss": -12.319507598876953, "global_step": 297032, "epoch": 1768} {"train_loss": -12.28887939453125, "global_step": 297033, "epoch": 1768} {"train_loss": -12.057947158813477, "global_step": 297034, "epoch": 1768} {"train_loss": -12.264890670776367, "global_step": 297035, "epoch": 1768} {"train_loss": -12.336100578308105, "global_step": 297036, "epoch": 1768} {"train_loss": -12.12243938446045, "global_step": 297037, "epoch": 1768} {"train_loss": -12.298027038574219, "global_step": 297038, "epoch": 1768} {"train_loss": -12.183282852172852, "global_step": 297039, "epoch": 1768} {"train_loss": -12.135787010192871, "global_step": 297040, "epoch": 1768} {"train_loss": -12.420859336853027, "global_step": 297041, "epoch": 1768} {"train_loss": -12.251447677612305, "global_step": 297042, "epoch": 1768} {"train_loss": -12.481380462646484, "global_step": 297043, "epoch": 1768} {"train_loss": -12.506061553955078, "global_step": 297044, "epoch": 1768} {"train_loss": -12.13262939453125, "global_step": 297045, "epoch": 1768} {"train_loss": -12.073841094970703, "global_step": 297046, "epoch": 1768} {"train_loss": -12.5191650390625, "global_step": 297047, "epoch": 1768} {"train_loss": -12.082321166992188, "global_step": 297048, "epoch": 1768} {"train_loss": -12.2032470703125, "global_step": 297049, "epoch": 1768} {"train_loss": -12.246270179748535, "global_step": 297050, "epoch": 1768} {"train_loss": -12.025904655456543, "global_step": 297051, "epoch": 1768} {"train_loss": -11.904759407043457, "global_step": 297052, "epoch": 1768} {"train_loss": -12.241315841674805, "global_step": 297053, "epoch": 1768} {"train_loss": -12.436689376831055, "global_step": 297054, "epoch": 1768} {"train_loss": -12.190047264099121, "global_step": 297055, "epoch": 1768} {"train_loss": -12.47170639038086, "global_step": 297056, "epoch": 1768} {"train_loss": -12.290382385253906, "global_step": 297057, "epoch": 1768} {"train_loss": -12.356850624084473, "global_step": 297058, "epoch": 1768} {"train_loss": -12.455552101135254, "global_step": 297059, "epoch": 1768} {"train_loss": -11.973584175109863, "global_step": 297060, "epoch": 1768} {"train_loss": -12.43847942352295, "global_step": 297061, "epoch": 1768} {"train_loss": -12.355047225952148, "global_step": 297062, "epoch": 1768} {"train_loss": -12.300826072692871, "global_step": 297063, "epoch": 1768} {"train_loss": -12.334257125854492, "global_step": 297064, "epoch": 1768} {"train_loss": -12.17043685913086, "global_step": 297065, "epoch": 1768} {"train_loss": -12.387306213378906, "global_step": 297066, "epoch": 1768} {"train_loss": -12.464643478393555, "global_step": 297067, "epoch": 1768} {"train_loss": -12.076200485229492, "global_step": 297068, "epoch": 1768} {"train_loss": -12.167622566223145, "global_step": 297069, "epoch": 1768} {"train_loss": -11.79842758178711, "global_step": 297070, "epoch": 1768} {"train_loss": -12.530914306640625, "global_step": 297071, "epoch": 1768} {"train_loss": -12.34307861328125, "global_step": 297072, "epoch": 1768} {"train_loss": -12.287813186645508, "global_step": 297073, "epoch": 1768} {"train_loss": -12.52249526977539, "global_step": 297074, "epoch": 1768} {"train_loss": -12.277162551879883, "global_step": 297075, "epoch": 1768} {"train_loss": -12.55245590209961, "global_step": 297076, "epoch": 1768} {"train_loss": -12.265105247497559, "global_step": 297077, "epoch": 1768} {"train_loss": -12.023534774780273, "global_step": 297078, "epoch": 1768} {"train_loss": -11.045072555541992, "global_step": 297079, "epoch": 1768} {"train_loss": -11.212590217590332, "global_step": 297080, "epoch": 1768} {"train_loss": -12.253263473510742, "global_step": 297081, "epoch": 1768} {"train_loss": -9.496772766113281, "global_step": 297082, "epoch": 1768} {"train_loss": -10.561281204223633, "global_step": 297083, "epoch": 1768} {"train_loss": -10.897783279418945, "global_step": 297084, "epoch": 1768} {"train_loss": -11.63649845123291, "global_step": 297085, "epoch": 1768} {"train_loss": -11.456153869628906, "global_step": 297086, "epoch": 1768} {"train_loss": -11.644609451293945, "global_step": 297087, "epoch": 1768} {"train_loss": -11.51229476928711, "global_step": 297088, "epoch": 1768} {"train_loss": -10.602922439575195, "global_step": 297089, "epoch": 1768} {"train_loss": -11.55026912689209, "global_step": 297090, "epoch": 1768} {"train_loss": -10.469335556030273, "global_step": 297091, "epoch": 1768} {"train_loss": -11.667411804199219, "global_step": 297092, "epoch": 1768} {"train_loss": -10.210430145263672, "global_step": 297093, "epoch": 1768} {"train_loss": -9.947121620178223, "global_step": 297094, "epoch": 1768} {"train_loss": -12.086434364318848, "global_step": 297095, "epoch": 1768} {"train_loss": -9.873086929321289, "global_step": 297096, "epoch": 1768} {"train_loss": -10.275640487670898, "global_step": 297097, "epoch": 1768} {"train_loss": -10.582021713256836, "global_step": 297098, "epoch": 1768} {"train_loss": -11.077994346618652, "global_step": 297099, "epoch": 1768} {"train_loss": -11.614737510681152, "global_step": 297100, "epoch": 1768} {"train_loss": -10.980062484741211, "global_step": 297101, "epoch": 1768} {"train_loss": -11.627127647399902, "global_step": 297102, "epoch": 1768} {"train_loss": -10.942924499511719, "global_step": 297103, "epoch": 1768} {"train_loss": -11.572708129882812, "global_step": 297104, "epoch": 1768} {"train_loss": -11.767913818359375, "global_step": 297105, "epoch": 1768} {"train_loss": -10.522558212280273, "global_step": 297106, "epoch": 1768} {"train_loss": -10.690302848815918, "global_step": 297107, "epoch": 1768} {"train_loss": -10.543679237365723, "global_step": 297108, "epoch": 1768} {"train_loss": -10.662626266479492, "global_step": 297109, "epoch": 1768} {"train_loss": -11.245396614074707, "global_step": 297110, "epoch": 1768} {"train_loss": -10.798456192016602, "global_step": 297111, "epoch": 1768} {"train_loss": -10.633228302001953, "global_step": 297112, "epoch": 1768} {"train_loss": -11.236518859863281, "global_step": 297113, "epoch": 1768} {"train_loss": -10.858627319335938, "global_step": 297114, "epoch": 1768} {"train_loss": -11.01666259765625, "global_step": 297115, "epoch": 1768} {"train_loss": -10.366777420043945, "global_step": 297116, "epoch": 1768} {"train_loss": -10.927146911621094, "global_step": 297117, "epoch": 1768} {"train_loss": -11.354543685913086, "global_step": 297118, "epoch": 1768} {"train_loss": -10.653112411499023, "global_step": 297119, "epoch": 1768} {"train_loss": -11.450822830200195, "global_step": 297120, "epoch": 1768} {"train_loss": -10.654204368591309, "global_step": 297121, "epoch": 1768} {"train_loss": -10.665653228759766, "global_step": 297122, "epoch": 1768} {"train_loss": -10.741934776306152, "global_step": 297123, "epoch": 1768} {"train_loss": -11.559426307678223, "global_step": 297124, "epoch": 1768} {"train_loss": -10.23080825805664, "global_step": 297125, "epoch": 1768} {"train_loss": -11.547243118286133, "global_step": 297126, "epoch": 1768} {"train_loss": -10.897075653076172, "global_step": 297127, "epoch": 1768} {"train_loss": -11.41672134399414, "global_step": 297128, "epoch": 1768} {"train_loss": -11.166584014892578, "global_step": 297129, "epoch": 1768} {"train_loss": -11.042540550231934, "global_step": 297130, "epoch": 1768} {"train_loss": -11.357186317443848, "global_step": 297131, "epoch": 1768} {"train_loss": -11.478960990905762, "global_step": 297132, "epoch": 1768} {"train_loss": -10.855233192443848, "global_step": 297133, "epoch": 1768} {"train_loss": -11.781854629516602, "global_step": 297134, "epoch": 1768} {"train_loss": -11.45346736907959, "global_step": 297135, "epoch": 1768} {"train_loss": -11.63066291809082, "global_step": 297136, "epoch": 1768} {"train_loss": -11.765342712402344, "global_step": 297137, "epoch": 1768} {"train_loss": -11.652657508850098, "global_step": 297138, "epoch": 1768} {"train_loss": -11.746784210205078, "global_step": 297139, "epoch": 1768} {"train_loss": -11.725419998168945, "global_step": 297140, "epoch": 1768} {"train_loss": -11.732809066772461, "global_step": 297141, "epoch": 1768} {"train_loss": -11.888437271118164, "global_step": 297142, "epoch": 1768} {"train_loss": -11.437739372253418, "global_step": 297143, "epoch": 1768} {"train_loss": -12.016904830932617, "global_step": 297144, "epoch": 1768} {"train_loss": -11.777536392211914, "global_step": 297145, "epoch": 1768} {"train_loss": -11.73986530303955, "global_step": 297146, "epoch": 1768} {"train_loss": -11.864295959472656, "global_step": 297147, "epoch": 1768} {"train_loss": -11.584342956542969, "global_step": 297148, "epoch": 1768} {"train_loss": -11.861373901367188, "global_step": 297149, "epoch": 1768} {"train_loss": -11.785052299499512, "global_step": 297150, "epoch": 1768} {"train_loss": -11.575157165527344, "global_step": 297151, "epoch": 1768} {"train_loss": -11.78622055053711, "global_step": 297152, "epoch": 1768} {"train_loss": -11.70119857788086, "global_step": 297153, "epoch": 1768} {"train_loss": -11.940183639526367, "global_step": 297154, "epoch": 1768} {"train_loss": -11.851789474487305, "global_step": 297155, "epoch": 1768} {"train_loss": -11.76844596862793, "global_step": 297156, "epoch": 1768} {"train_loss": -11.968860626220703, "global_step": 297157, "epoch": 1768} {"train_loss": -11.737593650817871, "global_step": 297158, "epoch": 1768} {"train_loss": -11.954233169555664, "global_step": 297159, "epoch": 1768} {"train_loss": -11.99813461303711, "global_step": 297160, "epoch": 1768} {"train_loss": -12.158897399902344, "global_step": 297161, "epoch": 1768} {"train_loss": -12.062928199768066, "global_step": 297162, "epoch": 1768} {"train_loss": -12.27260971069336, "global_step": 297163, "epoch": 1768} {"train_loss": -11.954024314880371, "global_step": 297164, "epoch": 1768} {"train_loss": -12.119115829467773, "global_step": 297165, "epoch": 1768} {"train_loss": -11.614243507385254, "global_step": 297166, "epoch": 1768} {"train_loss": -12.034972190856934, "global_step": 297167, "epoch": 1768} {"train_loss": -12.01386833190918, "global_step": 297168, "epoch": 1768} {"train_loss": -12.128345489501953, "global_step": 297169, "epoch": 1768} {"train_loss": -12.084174156188965, "global_step": 297170, "epoch": 1768} {"train_loss": -12.106639862060547, "global_step": 297171, "epoch": 1768} {"train_loss": -12.08676528930664, "global_step": 297172, "epoch": 1768} {"train_loss": -11.955122947692871, "global_step": 297173, "epoch": 1768} {"train_loss": -11.891243934631348, "global_step": 297174, "epoch": 1768} {"train_loss": -11.971527099609375, "global_step": 297175, "epoch": 1768} {"train_loss": -11.746545791625977, "global_step": 297176, "epoch": 1768} {"train_loss": -12.003255844116211, "global_step": 297177, "epoch": 1768} {"train_loss": -11.980186462402344, "global_step": 297178, "epoch": 1768} {"train_loss": -12.047882080078125, "global_step": 297179, "epoch": 1768} {"train_loss": -12.08143138885498, "global_step": 297180, "epoch": 1768} {"train_loss": -12.135272979736328, "global_step": 297181, "epoch": 1768} {"train_loss": -11.901540756225586, "global_step": 297182, "epoch": 1768} {"train_loss": -11.784029960632324, "global_step": 297183, "epoch": 1768} {"train_loss": -12.085190773010254, "global_step": 297184, "epoch": 1768} {"train_loss": -11.589128494262695, "global_step": 297185, "epoch": 1768} {"train_loss": -11.959476470947266, "global_step": 297186, "epoch": 1768} {"train_loss": -12.01361083984375, "global_step": 297187, "epoch": 1768} {"train_loss": -11.92761516571045, "global_step": 297188, "epoch": 1768} {"train_loss": -12.223767280578613, "global_step": 297189, "epoch": 1768} {"train_loss": -11.302814483642578, "global_step": 297190, "epoch": 1768} {"train_loss": -11.718998409452892, "global_step": 297191, "epoch": 1768, "val_loss": 279668.78125} {"train_loss": -11.145872116088867, "global_step": 297192, "epoch": 1769} {"train_loss": -11.837190628051758, "global_step": 297193, "epoch": 1769} {"train_loss": -11.708929061889648, "global_step": 297194, "epoch": 1769} {"train_loss": -11.293107032775879, "global_step": 297195, "epoch": 1769} {"train_loss": -12.224905014038086, "global_step": 297196, "epoch": 1769} {"train_loss": -11.57075309753418, "global_step": 297197, "epoch": 1769} {"train_loss": -12.21288013458252, "global_step": 297198, "epoch": 1769} {"train_loss": -11.30370044708252, "global_step": 297199, "epoch": 1769} {"train_loss": -11.51953411102295, "global_step": 297200, "epoch": 1769} {"train_loss": -11.817809104919434, "global_step": 297201, "epoch": 1769} {"train_loss": -11.579269409179688, "global_step": 297202, "epoch": 1769} {"train_loss": -11.839719772338867, "global_step": 297203, "epoch": 1769} {"train_loss": -11.296096801757812, "global_step": 297204, "epoch": 1769} {"train_loss": -11.69204044342041, "global_step": 297205, "epoch": 1769} {"train_loss": -12.102705001831055, "global_step": 297206, "epoch": 1769} {"train_loss": -11.888933181762695, "global_step": 297207, "epoch": 1769} {"train_loss": -11.688612937927246, "global_step": 297208, "epoch": 1769} {"train_loss": -11.772994995117188, "global_step": 297209, "epoch": 1769} {"train_loss": -11.566200256347656, "global_step": 297210, "epoch": 1769} {"train_loss": -11.770018577575684, "global_step": 297211, "epoch": 1769} {"train_loss": -11.689489364624023, "global_step": 297212, "epoch": 1769} {"train_loss": -11.805126190185547, "global_step": 297213, "epoch": 1769} {"train_loss": -11.857234001159668, "global_step": 297214, "epoch": 1769} {"train_loss": -11.613717079162598, "global_step": 297215, "epoch": 1769} {"train_loss": -11.850751876831055, "global_step": 297216, "epoch": 1769} {"train_loss": -11.806018829345703, "global_step": 297217, "epoch": 1769} {"train_loss": -11.759868621826172, "global_step": 297218, "epoch": 1769} {"train_loss": -11.586302757263184, "global_step": 297219, "epoch": 1769} {"train_loss": -11.776037216186523, "global_step": 297220, "epoch": 1769} {"train_loss": -11.975364685058594, "global_step": 297221, "epoch": 1769} {"train_loss": -12.101682662963867, "global_step": 297222, "epoch": 1769} {"train_loss": -11.984628677368164, "global_step": 297223, "epoch": 1769} {"train_loss": -11.966400146484375, "global_step": 297224, "epoch": 1769} {"train_loss": -12.138607025146484, "global_step": 297225, "epoch": 1769} {"train_loss": -12.04263687133789, "global_step": 297226, "epoch": 1769} {"train_loss": -12.286767959594727, "global_step": 297227, "epoch": 1769} {"train_loss": -12.233756065368652, "global_step": 297228, "epoch": 1769} {"train_loss": -12.258052825927734, "global_step": 297229, "epoch": 1769} {"train_loss": -12.249747276306152, "global_step": 297230, "epoch": 1769} {"train_loss": -12.143559455871582, "global_step": 297231, "epoch": 1769} {"train_loss": -12.273199081420898, "global_step": 297232, "epoch": 1769} {"train_loss": -12.14651870727539, "global_step": 297233, "epoch": 1769} {"train_loss": -11.981800079345703, "global_step": 297234, "epoch": 1769} {"train_loss": -11.660491943359375, "global_step": 297235, "epoch": 1769} {"train_loss": -12.273005485534668, "global_step": 297236, "epoch": 1769} {"train_loss": -12.083436012268066, "global_step": 297237, "epoch": 1769} {"train_loss": -11.682214736938477, "global_step": 297238, "epoch": 1769} {"train_loss": -11.116508483886719, "global_step": 297239, "epoch": 1769} {"train_loss": -11.759906768798828, "global_step": 297240, "epoch": 1769} {"train_loss": -11.218820571899414, "global_step": 297241, "epoch": 1769} {"train_loss": -11.554197311401367, "global_step": 297242, "epoch": 1769} {"train_loss": -12.188268661499023, "global_step": 297243, "epoch": 1769} {"train_loss": -11.969097137451172, "global_step": 297244, "epoch": 1769} {"train_loss": -11.88705825805664, "global_step": 297245, "epoch": 1769} {"train_loss": -12.045804023742676, "global_step": 297246, "epoch": 1769} {"train_loss": -11.740302085876465, "global_step": 297247, "epoch": 1769} {"train_loss": -12.20169448852539, "global_step": 297248, "epoch": 1769} {"train_loss": -11.192337989807129, "global_step": 297249, "epoch": 1769} {"train_loss": -11.89067268371582, "global_step": 297250, "epoch": 1769} {"train_loss": -11.744577407836914, "global_step": 297251, "epoch": 1769} {"train_loss": -11.927990913391113, "global_step": 297252, "epoch": 1769} {"train_loss": -11.835878372192383, "global_step": 297253, "epoch": 1769} {"train_loss": -11.755712509155273, "global_step": 297254, "epoch": 1769} {"train_loss": -12.225611686706543, "global_step": 297255, "epoch": 1769} {"train_loss": -11.681869506835938, "global_step": 297256, "epoch": 1769} {"train_loss": -11.837933540344238, "global_step": 297257, "epoch": 1769} {"train_loss": -12.053309440612793, "global_step": 297258, "epoch": 1769} {"train_loss": -11.772811889648438, "global_step": 297259, "epoch": 1769} {"train_loss": -12.112401962280273, "global_step": 297260, "epoch": 1769} {"train_loss": -11.44578742980957, "global_step": 297261, "epoch": 1769} {"train_loss": -11.780258178710938, "global_step": 297262, "epoch": 1769} {"train_loss": -11.924734115600586, "global_step": 297263, "epoch": 1769} {"train_loss": -11.389999389648438, "global_step": 297264, "epoch": 1769} {"train_loss": -11.60782241821289, "global_step": 297265, "epoch": 1769} {"train_loss": -10.99751091003418, "global_step": 297266, "epoch": 1769} {"train_loss": -11.720605850219727, "global_step": 297267, "epoch": 1769} {"train_loss": -11.222512245178223, "global_step": 297268, "epoch": 1769} {"train_loss": -11.246757507324219, "global_step": 297269, "epoch": 1769} {"train_loss": -11.984796524047852, "global_step": 297270, "epoch": 1769} {"train_loss": -11.24850845336914, "global_step": 297271, "epoch": 1769} {"train_loss": -12.09602165222168, "global_step": 297272, "epoch": 1769} {"train_loss": -11.26797103881836, "global_step": 297273, "epoch": 1769} {"train_loss": -11.90843391418457, "global_step": 297274, "epoch": 1769} {"train_loss": -11.04214096069336, "global_step": 297275, "epoch": 1769} {"train_loss": -11.672296524047852, "global_step": 297276, "epoch": 1769} {"train_loss": -11.475689888000488, "global_step": 297277, "epoch": 1769} {"train_loss": -10.757247924804688, "global_step": 297278, "epoch": 1769} {"train_loss": -11.592886924743652, "global_step": 297279, "epoch": 1769} {"train_loss": -11.303627967834473, "global_step": 297280, "epoch": 1769} {"train_loss": -10.923476219177246, "global_step": 297281, "epoch": 1769} {"train_loss": -12.052398681640625, "global_step": 297282, "epoch": 1769} {"train_loss": -11.056159973144531, "global_step": 297283, "epoch": 1769} {"train_loss": -11.792633056640625, "global_step": 297284, "epoch": 1769} {"train_loss": -11.79492473602295, "global_step": 297285, "epoch": 1769} {"train_loss": -11.703511238098145, "global_step": 297286, "epoch": 1769} {"train_loss": -11.994821548461914, "global_step": 297287, "epoch": 1769} {"train_loss": -11.494409561157227, "global_step": 297288, "epoch": 1769} {"train_loss": -11.873922348022461, "global_step": 297289, "epoch": 1769} {"train_loss": -12.135576248168945, "global_step": 297290, "epoch": 1769} {"train_loss": -11.80128002166748, "global_step": 297291, "epoch": 1769} {"train_loss": -12.02001953125, "global_step": 297292, "epoch": 1769} {"train_loss": -12.224437713623047, "global_step": 297293, "epoch": 1769} {"train_loss": -11.938722610473633, "global_step": 297294, "epoch": 1769} {"train_loss": -12.237736701965332, "global_step": 297295, "epoch": 1769} {"train_loss": -12.036849975585938, "global_step": 297296, "epoch": 1769} {"train_loss": -11.883723258972168, "global_step": 297297, "epoch": 1769} {"train_loss": -12.091291427612305, "global_step": 297298, "epoch": 1769} {"train_loss": -11.73893928527832, "global_step": 297299, "epoch": 1769} {"train_loss": -12.202122688293457, "global_step": 297300, "epoch": 1769} {"train_loss": -11.877365112304688, "global_step": 297301, "epoch": 1769} {"train_loss": -12.137935638427734, "global_step": 297302, "epoch": 1769} {"train_loss": -12.063159942626953, "global_step": 297303, "epoch": 1769} {"train_loss": -12.061531066894531, "global_step": 297304, "epoch": 1769} {"train_loss": -12.058513641357422, "global_step": 297305, "epoch": 1769} {"train_loss": -12.036505699157715, "global_step": 297306, "epoch": 1769} {"train_loss": -12.0999174118042, "global_step": 297307, "epoch": 1769} {"train_loss": -12.069310188293457, "global_step": 297308, "epoch": 1769} {"train_loss": -12.343705177307129, "global_step": 297309, "epoch": 1769} {"train_loss": -12.052787780761719, "global_step": 297310, "epoch": 1769} {"train_loss": -12.338543891906738, "global_step": 297311, "epoch": 1769} {"train_loss": -12.381930351257324, "global_step": 297312, "epoch": 1769} {"train_loss": -12.284826278686523, "global_step": 297313, "epoch": 1769} {"train_loss": -12.321053504943848, "global_step": 297314, "epoch": 1769} {"train_loss": -12.2433500289917, "global_step": 297315, "epoch": 1769} {"train_loss": -12.35577392578125, "global_step": 297316, "epoch": 1769} {"train_loss": -12.105108261108398, "global_step": 297317, "epoch": 1769} {"train_loss": -12.447978973388672, "global_step": 297318, "epoch": 1769} {"train_loss": -12.273028373718262, "global_step": 297319, "epoch": 1769} {"train_loss": -12.228672981262207, "global_step": 297320, "epoch": 1769} {"train_loss": -12.358264923095703, "global_step": 297321, "epoch": 1769} {"train_loss": -12.179052352905273, "global_step": 297322, "epoch": 1769} {"train_loss": -12.186914443969727, "global_step": 297323, "epoch": 1769} {"train_loss": -12.396777153015137, "global_step": 297324, "epoch": 1769} {"train_loss": -12.225571632385254, "global_step": 297325, "epoch": 1769} {"train_loss": -11.840107917785645, "global_step": 297326, "epoch": 1769} {"train_loss": -12.165338516235352, "global_step": 297327, "epoch": 1769} {"train_loss": -12.097677230834961, "global_step": 297328, "epoch": 1769} {"train_loss": -12.039543151855469, "global_step": 297329, "epoch": 1769} {"train_loss": -11.569714546203613, "global_step": 297330, "epoch": 1769} {"train_loss": -11.335336685180664, "global_step": 297331, "epoch": 1769} {"train_loss": -10.903112411499023, "global_step": 297332, "epoch": 1769} {"train_loss": -11.536422729492188, "global_step": 297333, "epoch": 1769} {"train_loss": -11.730425834655762, "global_step": 297334, "epoch": 1769} {"train_loss": -11.85762882232666, "global_step": 297335, "epoch": 1769} {"train_loss": -11.538556098937988, "global_step": 297336, "epoch": 1769} {"train_loss": -11.598051071166992, "global_step": 297337, "epoch": 1769} {"train_loss": -12.116859436035156, "global_step": 297338, "epoch": 1769} {"train_loss": -11.854612350463867, "global_step": 297339, "epoch": 1769} {"train_loss": -11.85410213470459, "global_step": 297340, "epoch": 1769} {"train_loss": -12.319731712341309, "global_step": 297341, "epoch": 1769} {"train_loss": -12.173946380615234, "global_step": 297342, "epoch": 1769} {"train_loss": -11.806835174560547, "global_step": 297343, "epoch": 1769} {"train_loss": -11.749424934387207, "global_step": 297344, "epoch": 1769} {"train_loss": -12.061997413635254, "global_step": 297345, "epoch": 1769} {"train_loss": -12.09545612335205, "global_step": 297346, "epoch": 1769} {"train_loss": -12.080011367797852, "global_step": 297347, "epoch": 1769} {"train_loss": -11.895788192749023, "global_step": 297348, "epoch": 1769} {"train_loss": -11.879415512084961, "global_step": 297349, "epoch": 1769} {"train_loss": -12.137816429138184, "global_step": 297350, "epoch": 1769} {"train_loss": -12.074188232421875, "global_step": 297351, "epoch": 1769} {"train_loss": -12.40703010559082, "global_step": 297352, "epoch": 1769} {"train_loss": -11.950334548950195, "global_step": 297353, "epoch": 1769} {"train_loss": -12.092549324035645, "global_step": 297354, "epoch": 1769} {"train_loss": -11.992066383361816, "global_step": 297355, "epoch": 1769} {"train_loss": -12.261771202087402, "global_step": 297356, "epoch": 1769} {"train_loss": -12.01063346862793, "global_step": 297357, "epoch": 1769} {"train_loss": -12.255072593688965, "global_step": 297358, "epoch": 1769} {"train_loss": -11.868541115806217, "global_step": 297359, "epoch": 1769, "val_loss": 281162.46875} {"train_loss": -11.854058265686035, "global_step": 297360, "epoch": 1770} {"train_loss": -11.584741592407227, "global_step": 297361, "epoch": 1770} {"train_loss": -12.233150482177734, "global_step": 297362, "epoch": 1770} {"train_loss": -11.869869232177734, "global_step": 297363, "epoch": 1770} {"train_loss": -11.623991012573242, "global_step": 297364, "epoch": 1770} {"train_loss": -11.808247566223145, "global_step": 297365, "epoch": 1770} {"train_loss": -11.820364952087402, "global_step": 297366, "epoch": 1770} {"train_loss": -12.353392601013184, "global_step": 297367, "epoch": 1770} {"train_loss": -12.136329650878906, "global_step": 297368, "epoch": 1770} {"train_loss": -11.962021827697754, "global_step": 297369, "epoch": 1770} {"train_loss": -11.627605438232422, "global_step": 297370, "epoch": 1770} {"train_loss": -11.399284362792969, "global_step": 297371, "epoch": 1770} {"train_loss": -12.068565368652344, "global_step": 297372, "epoch": 1770} {"train_loss": -11.618882179260254, "global_step": 297373, "epoch": 1770} {"train_loss": -12.188173294067383, "global_step": 297374, "epoch": 1770} {"train_loss": -11.301977157592773, "global_step": 297375, "epoch": 1770} {"train_loss": -11.968658447265625, "global_step": 297376, "epoch": 1770} {"train_loss": -11.375787734985352, "global_step": 297377, "epoch": 1770} {"train_loss": -11.810181617736816, "global_step": 297378, "epoch": 1770} {"train_loss": -11.296018600463867, "global_step": 297379, "epoch": 1770} {"train_loss": -11.802297592163086, "global_step": 297380, "epoch": 1770} {"train_loss": -11.59203815460205, "global_step": 297381, "epoch": 1770} {"train_loss": -10.896907806396484, "global_step": 297382, "epoch": 1770} {"train_loss": -11.37806510925293, "global_step": 297383, "epoch": 1770} {"train_loss": -11.584177017211914, "global_step": 297384, "epoch": 1770} {"train_loss": -11.970786094665527, "global_step": 297385, "epoch": 1770} {"train_loss": -10.5377836227417, "global_step": 297386, "epoch": 1770} {"train_loss": -11.93021011352539, "global_step": 297387, "epoch": 1770} {"train_loss": -10.440866470336914, "global_step": 297388, "epoch": 1770} {"train_loss": -11.432849884033203, "global_step": 297389, "epoch": 1770} {"train_loss": -10.791728019714355, "global_step": 297390, "epoch": 1770} {"train_loss": -11.179145812988281, "global_step": 297391, "epoch": 1770} {"train_loss": -10.599710464477539, "global_step": 297392, "epoch": 1770} {"train_loss": -11.909632682800293, "global_step": 297393, "epoch": 1770} {"train_loss": -11.33102798461914, "global_step": 297394, "epoch": 1770} {"train_loss": -11.762297630310059, "global_step": 297395, "epoch": 1770} {"train_loss": -11.445955276489258, "global_step": 297396, "epoch": 1770} {"train_loss": -12.257200241088867, "global_step": 297397, "epoch": 1770} {"train_loss": -11.809272766113281, "global_step": 297398, "epoch": 1770} {"train_loss": -11.942870140075684, "global_step": 297399, "epoch": 1770} {"train_loss": -11.990376472473145, "global_step": 297400, "epoch": 1770} {"train_loss": -11.95832633972168, "global_step": 297401, "epoch": 1770} {"train_loss": -12.02616024017334, "global_step": 297402, "epoch": 1770} {"train_loss": -11.985557556152344, "global_step": 297403, "epoch": 1770} {"train_loss": -11.815933227539062, "global_step": 297404, "epoch": 1770} {"train_loss": -11.910516738891602, "global_step": 297405, "epoch": 1770} {"train_loss": -12.027234077453613, "global_step": 297406, "epoch": 1770} {"train_loss": -12.083450317382812, "global_step": 297407, "epoch": 1770} {"train_loss": -12.158853530883789, "global_step": 297408, "epoch": 1770} {"train_loss": -12.209203720092773, "global_step": 297409, "epoch": 1770} {"train_loss": -12.221168518066406, "global_step": 297410, "epoch": 1770} {"train_loss": -12.245306968688965, "global_step": 297411, "epoch": 1770} {"train_loss": -12.057489395141602, "global_step": 297412, "epoch": 1770} {"train_loss": -12.136902809143066, "global_step": 297413, "epoch": 1770} {"train_loss": -12.270315170288086, "global_step": 297414, "epoch": 1770} {"train_loss": -11.86414623260498, "global_step": 297415, "epoch": 1770} {"train_loss": -12.292581558227539, "global_step": 297416, "epoch": 1770} {"train_loss": -12.067197799682617, "global_step": 297417, "epoch": 1770} {"train_loss": -12.043781280517578, "global_step": 297418, "epoch": 1770} {"train_loss": -11.979523658752441, "global_step": 297419, "epoch": 1770} {"train_loss": -11.84975814819336, "global_step": 297420, "epoch": 1770} {"train_loss": -12.232638359069824, "global_step": 297421, "epoch": 1770} {"train_loss": -11.46476936340332, "global_step": 297422, "epoch": 1770} {"train_loss": -12.126927375793457, "global_step": 297423, "epoch": 1770} {"train_loss": -11.917549133300781, "global_step": 297424, "epoch": 1770} {"train_loss": -11.760064125061035, "global_step": 297425, "epoch": 1770} {"train_loss": -12.501801490783691, "global_step": 297426, "epoch": 1770} {"train_loss": -11.680891036987305, "global_step": 297427, "epoch": 1770} {"train_loss": -11.891946792602539, "global_step": 297428, "epoch": 1770} {"train_loss": -12.000785827636719, "global_step": 297429, "epoch": 1770} {"train_loss": -11.643875122070312, "global_step": 297430, "epoch": 1770} {"train_loss": -11.769450187683105, "global_step": 297431, "epoch": 1770} {"train_loss": -12.169373512268066, "global_step": 297432, "epoch": 1770} {"train_loss": -12.03223991394043, "global_step": 297433, "epoch": 1770} {"train_loss": -12.442428588867188, "global_step": 297434, "epoch": 1770} {"train_loss": -11.459962844848633, "global_step": 297435, "epoch": 1770} {"train_loss": -12.137392044067383, "global_step": 297436, "epoch": 1770} {"train_loss": -11.764665603637695, "global_step": 297437, "epoch": 1770} {"train_loss": -11.758268356323242, "global_step": 297438, "epoch": 1770} {"train_loss": -12.222345352172852, "global_step": 297439, "epoch": 1770} {"train_loss": -11.89487361907959, "global_step": 297440, "epoch": 1770} {"train_loss": -11.910228729248047, "global_step": 297441, "epoch": 1770} {"train_loss": -12.047948837280273, "global_step": 297442, "epoch": 1770} {"train_loss": -11.782430648803711, "global_step": 297443, "epoch": 1770} {"train_loss": -11.870701789855957, "global_step": 297444, "epoch": 1770} {"train_loss": -12.365653038024902, "global_step": 297445, "epoch": 1770} {"train_loss": -11.984729766845703, "global_step": 297446, "epoch": 1770} {"train_loss": -12.31501293182373, "global_step": 297447, "epoch": 1770} {"train_loss": -12.135281562805176, "global_step": 297448, "epoch": 1770} {"train_loss": -12.402464866638184, "global_step": 297449, "epoch": 1770} {"train_loss": -12.322534561157227, "global_step": 297450, "epoch": 1770} {"train_loss": -12.062809944152832, "global_step": 297451, "epoch": 1770} {"train_loss": -12.251327514648438, "global_step": 297452, "epoch": 1770} {"train_loss": -11.914651870727539, "global_step": 297453, "epoch": 1770} {"train_loss": -12.052023887634277, "global_step": 297454, "epoch": 1770} {"train_loss": -12.195764541625977, "global_step": 297455, "epoch": 1770} {"train_loss": -12.097312927246094, "global_step": 297456, "epoch": 1770} {"train_loss": -12.003169059753418, "global_step": 297457, "epoch": 1770} {"train_loss": -12.29552936553955, "global_step": 297458, "epoch": 1770} {"train_loss": -11.901314735412598, "global_step": 297459, "epoch": 1770} {"train_loss": -12.350441932678223, "global_step": 297460, "epoch": 1770} {"train_loss": -12.407318115234375, "global_step": 297461, "epoch": 1770} {"train_loss": -12.108238220214844, "global_step": 297462, "epoch": 1770} {"train_loss": -12.293256759643555, "global_step": 297463, "epoch": 1770} {"train_loss": -11.632843017578125, "global_step": 297464, "epoch": 1770} {"train_loss": -12.362190246582031, "global_step": 297465, "epoch": 1770} {"train_loss": -12.385647773742676, "global_step": 297466, "epoch": 1770} {"train_loss": -12.028216361999512, "global_step": 297467, "epoch": 1770} {"train_loss": -12.137571334838867, "global_step": 297468, "epoch": 1770} {"train_loss": -12.339472770690918, "global_step": 297469, "epoch": 1770} {"train_loss": -12.248015403747559, "global_step": 297470, "epoch": 1770} {"train_loss": -11.985711097717285, "global_step": 297471, "epoch": 1770} {"train_loss": -12.137948036193848, "global_step": 297472, "epoch": 1770} {"train_loss": -12.114027976989746, "global_step": 297473, "epoch": 1770} {"train_loss": -12.037057876586914, "global_step": 297474, "epoch": 1770} {"train_loss": -11.807500839233398, "global_step": 297475, "epoch": 1770} {"train_loss": -11.829874038696289, "global_step": 297476, "epoch": 1770} {"train_loss": -12.012531280517578, "global_step": 297477, "epoch": 1770} {"train_loss": -10.881914138793945, "global_step": 297478, "epoch": 1770} {"train_loss": -11.787738800048828, "global_step": 297479, "epoch": 1770} {"train_loss": -11.256092071533203, "global_step": 297480, "epoch": 1770} {"train_loss": -10.934745788574219, "global_step": 297481, "epoch": 1770} {"train_loss": -10.7523193359375, "global_step": 297482, "epoch": 1770} {"train_loss": -11.933905601501465, "global_step": 297483, "epoch": 1770} {"train_loss": -11.740391731262207, "global_step": 297484, "epoch": 1770} {"train_loss": -12.029449462890625, "global_step": 297485, "epoch": 1770} {"train_loss": -11.809470176696777, "global_step": 297486, "epoch": 1770} {"train_loss": -11.826713562011719, "global_step": 297487, "epoch": 1770} {"train_loss": -12.071701049804688, "global_step": 297488, "epoch": 1770} {"train_loss": -12.09697151184082, "global_step": 297489, "epoch": 1770} {"train_loss": -11.883040428161621, "global_step": 297490, "epoch": 1770} {"train_loss": -11.925207138061523, "global_step": 297491, "epoch": 1770} {"train_loss": -11.761826515197754, "global_step": 297492, "epoch": 1770} {"train_loss": -12.063180923461914, "global_step": 297493, "epoch": 1770} {"train_loss": -12.185916900634766, "global_step": 297494, "epoch": 1770} {"train_loss": -12.177992820739746, "global_step": 297495, "epoch": 1770} {"train_loss": -12.106006622314453, "global_step": 297496, "epoch": 1770} {"train_loss": -11.72128677368164, "global_step": 297497, "epoch": 1770} {"train_loss": -11.585498809814453, "global_step": 297498, "epoch": 1770} {"train_loss": -11.918794631958008, "global_step": 297499, "epoch": 1770} {"train_loss": -11.88308334350586, "global_step": 297500, "epoch": 1770} {"train_loss": -11.36058235168457, "global_step": 297501, "epoch": 1770} {"train_loss": -11.434171676635742, "global_step": 297502, "epoch": 1770} {"train_loss": -11.916860580444336, "global_step": 297503, "epoch": 1770} {"train_loss": -11.954010009765625, "global_step": 297504, "epoch": 1770} {"train_loss": -11.736282348632812, "global_step": 297505, "epoch": 1770} {"train_loss": -11.424242973327637, "global_step": 297506, "epoch": 1770} {"train_loss": -11.756391525268555, "global_step": 297507, "epoch": 1770} {"train_loss": -11.253142356872559, "global_step": 297508, "epoch": 1770} {"train_loss": -11.843170166015625, "global_step": 297509, "epoch": 1770} {"train_loss": -11.229070663452148, "global_step": 297510, "epoch": 1770} {"train_loss": -11.472524642944336, "global_step": 297511, "epoch": 1770} {"train_loss": -10.961273193359375, "global_step": 297512, "epoch": 1770} {"train_loss": -12.124181747436523, "global_step": 297513, "epoch": 1770} {"train_loss": -10.624555587768555, "global_step": 297514, "epoch": 1770} {"train_loss": -11.920366287231445, "global_step": 297515, "epoch": 1770} {"train_loss": -11.08049201965332, "global_step": 297516, "epoch": 1770} {"train_loss": -11.935276985168457, "global_step": 297517, "epoch": 1770} {"train_loss": -11.595757484436035, "global_step": 297518, "epoch": 1770} {"train_loss": -11.936929702758789, "global_step": 297519, "epoch": 1770} {"train_loss": -11.863129615783691, "global_step": 297520, "epoch": 1770} {"train_loss": -11.997825622558594, "global_step": 297521, "epoch": 1770} {"train_loss": -11.885251998901367, "global_step": 297522, "epoch": 1770} {"train_loss": -12.136861801147461, "global_step": 297523, "epoch": 1770} {"train_loss": -11.713772773742676, "global_step": 297524, "epoch": 1770} {"train_loss": -12.1292724609375, "global_step": 297525, "epoch": 1770} {"train_loss": -11.700233459472656, "global_step": 297526, "epoch": 1770} {"train_loss": -11.846181648118156, "global_step": 297527, "epoch": 1770, "val_loss": 281234.0, "train_action_mse_error": 1.0985057353973389} {"train_loss": -12.20817756652832, "global_step": 297528, "epoch": 1771} {"train_loss": -11.796140670776367, "global_step": 297529, "epoch": 1771} {"train_loss": -12.129995346069336, "global_step": 297530, "epoch": 1771} {"train_loss": -12.310855865478516, "global_step": 297531, "epoch": 1771} {"train_loss": -12.390939712524414, "global_step": 297532, "epoch": 1771} {"train_loss": -12.258668899536133, "global_step": 297533, "epoch": 1771} {"train_loss": -12.391851425170898, "global_step": 297534, "epoch": 1771} {"train_loss": -12.294767379760742, "global_step": 297535, "epoch": 1771} {"train_loss": -12.224067687988281, "global_step": 297536, "epoch": 1771} {"train_loss": -12.098978042602539, "global_step": 297537, "epoch": 1771} {"train_loss": -12.206295013427734, "global_step": 297538, "epoch": 1771} {"train_loss": -12.058831214904785, "global_step": 297539, "epoch": 1771} {"train_loss": -12.125697135925293, "global_step": 297540, "epoch": 1771} {"train_loss": -12.12156867980957, "global_step": 297541, "epoch": 1771} {"train_loss": -12.03399658203125, "global_step": 297542, "epoch": 1771} {"train_loss": -11.866338729858398, "global_step": 297543, "epoch": 1771} {"train_loss": -12.403326034545898, "global_step": 297544, "epoch": 1771} {"train_loss": -11.99638557434082, "global_step": 297545, "epoch": 1771} {"train_loss": -12.05003547668457, "global_step": 297546, "epoch": 1771} {"train_loss": -11.803206443786621, "global_step": 297547, "epoch": 1771} {"train_loss": -12.138326644897461, "global_step": 297548, "epoch": 1771} {"train_loss": -11.870290756225586, "global_step": 297549, "epoch": 1771} {"train_loss": -11.745158195495605, "global_step": 297550, "epoch": 1771} {"train_loss": -10.752338409423828, "global_step": 297551, "epoch": 1771} {"train_loss": -11.873306274414062, "global_step": 297552, "epoch": 1771} {"train_loss": -11.952296257019043, "global_step": 297553, "epoch": 1771} {"train_loss": -11.16435432434082, "global_step": 297554, "epoch": 1771} {"train_loss": -11.426290512084961, "global_step": 297555, "epoch": 1771} {"train_loss": -12.146219253540039, "global_step": 297556, "epoch": 1771} {"train_loss": -11.542137145996094, "global_step": 297557, "epoch": 1771} {"train_loss": -11.687248229980469, "global_step": 297558, "epoch": 1771} {"train_loss": -11.573171615600586, "global_step": 297559, "epoch": 1771} {"train_loss": -11.166923522949219, "global_step": 297560, "epoch": 1771} {"train_loss": -11.058624267578125, "global_step": 297561, "epoch": 1771} {"train_loss": -11.70096206665039, "global_step": 297562, "epoch": 1771} {"train_loss": -11.133783340454102, "global_step": 297563, "epoch": 1771} {"train_loss": -11.434585571289062, "global_step": 297564, "epoch": 1771} {"train_loss": -10.129968643188477, "global_step": 297565, "epoch": 1771} {"train_loss": -11.324289321899414, "global_step": 297566, "epoch": 1771} {"train_loss": -10.053107261657715, "global_step": 297567, "epoch": 1771} {"train_loss": -11.001790046691895, "global_step": 297568, "epoch": 1771} {"train_loss": -10.181617736816406, "global_step": 297569, "epoch": 1771} {"train_loss": -10.392303466796875, "global_step": 297570, "epoch": 1771} {"train_loss": -10.226097106933594, "global_step": 297571, "epoch": 1771} {"train_loss": -11.008005142211914, "global_step": 297572, "epoch": 1771} {"train_loss": -10.373191833496094, "global_step": 297573, "epoch": 1771} {"train_loss": -10.607170104980469, "global_step": 297574, "epoch": 1771} {"train_loss": -10.279874801635742, "global_step": 297575, "epoch": 1771} {"train_loss": -11.682076454162598, "global_step": 297576, "epoch": 1771} {"train_loss": -10.590978622436523, "global_step": 297577, "epoch": 1771} {"train_loss": -12.044031143188477, "global_step": 297578, "epoch": 1771} {"train_loss": -10.729820251464844, "global_step": 297579, "epoch": 1771} {"train_loss": -11.80119514465332, "global_step": 297580, "epoch": 1771} {"train_loss": -11.274210929870605, "global_step": 297581, "epoch": 1771} {"train_loss": -11.48544692993164, "global_step": 297582, "epoch": 1771} {"train_loss": -11.494409561157227, "global_step": 297583, "epoch": 1771} {"train_loss": -10.975214004516602, "global_step": 297584, "epoch": 1771} {"train_loss": -11.772781372070312, "global_step": 297585, "epoch": 1771} {"train_loss": -11.63212776184082, "global_step": 297586, "epoch": 1771} {"train_loss": -11.527015686035156, "global_step": 297587, "epoch": 1771} {"train_loss": -11.851863861083984, "global_step": 297588, "epoch": 1771} {"train_loss": -11.721967697143555, "global_step": 297589, "epoch": 1771} {"train_loss": -12.222518920898438, "global_step": 297590, "epoch": 1771} {"train_loss": -11.795669555664062, "global_step": 297591, "epoch": 1771} {"train_loss": -12.035934448242188, "global_step": 297592, "epoch": 1771} {"train_loss": -11.77231502532959, "global_step": 297593, "epoch": 1771} {"train_loss": -11.815035820007324, "global_step": 297594, "epoch": 1771} {"train_loss": -12.013612747192383, "global_step": 297595, "epoch": 1771} {"train_loss": -11.626788139343262, "global_step": 297596, "epoch": 1771} {"train_loss": -11.985189437866211, "global_step": 297597, "epoch": 1771} {"train_loss": -11.939081192016602, "global_step": 297598, "epoch": 1771} {"train_loss": -11.82955551147461, "global_step": 297599, "epoch": 1771} {"train_loss": -11.806774139404297, "global_step": 297600, "epoch": 1771} {"train_loss": -11.970714569091797, "global_step": 297601, "epoch": 1771} {"train_loss": -11.779499053955078, "global_step": 297602, "epoch": 1771} {"train_loss": -11.993404388427734, "global_step": 297603, "epoch": 1771} {"train_loss": -12.059864044189453, "global_step": 297604, "epoch": 1771} {"train_loss": -11.92473316192627, "global_step": 297605, "epoch": 1771} {"train_loss": -12.07346248626709, "global_step": 297606, "epoch": 1771} {"train_loss": -12.046185493469238, "global_step": 297607, "epoch": 1771} {"train_loss": -11.865046501159668, "global_step": 297608, "epoch": 1771} {"train_loss": -12.099105834960938, "global_step": 297609, "epoch": 1771} {"train_loss": -12.144706726074219, "global_step": 297610, "epoch": 1771} {"train_loss": -12.098443031311035, "global_step": 297611, "epoch": 1771} {"train_loss": -12.255109786987305, "global_step": 297612, "epoch": 1771} {"train_loss": -11.94318675994873, "global_step": 297613, "epoch": 1771} {"train_loss": -12.008395195007324, "global_step": 297614, "epoch": 1771} {"train_loss": -12.212160110473633, "global_step": 297615, "epoch": 1771} {"train_loss": -12.186966896057129, "global_step": 297616, "epoch": 1771} {"train_loss": -12.275474548339844, "global_step": 297617, "epoch": 1771} {"train_loss": -12.28868293762207, "global_step": 297618, "epoch": 1771} {"train_loss": -12.247005462646484, "global_step": 297619, "epoch": 1771} {"train_loss": -12.1160306930542, "global_step": 297620, "epoch": 1771} {"train_loss": -12.112281799316406, "global_step": 297621, "epoch": 1771} {"train_loss": -12.163143157958984, "global_step": 297622, "epoch": 1771} {"train_loss": -11.93836784362793, "global_step": 297623, "epoch": 1771} {"train_loss": -12.391485214233398, "global_step": 297624, "epoch": 1771} {"train_loss": -11.82246208190918, "global_step": 297625, "epoch": 1771} {"train_loss": -11.85529613494873, "global_step": 297626, "epoch": 1771} {"train_loss": -11.942916870117188, "global_step": 297627, "epoch": 1771} {"train_loss": -11.507368087768555, "global_step": 297628, "epoch": 1771} {"train_loss": -12.044702529907227, "global_step": 297629, "epoch": 1771} {"train_loss": -12.015018463134766, "global_step": 297630, "epoch": 1771} {"train_loss": -12.291242599487305, "global_step": 297631, "epoch": 1771} {"train_loss": -11.020112991333008, "global_step": 297632, "epoch": 1771} {"train_loss": -12.203951835632324, "global_step": 297633, "epoch": 1771} {"train_loss": -11.52463436126709, "global_step": 297634, "epoch": 1771} {"train_loss": -11.867451667785645, "global_step": 297635, "epoch": 1771} {"train_loss": -11.650705337524414, "global_step": 297636, "epoch": 1771} {"train_loss": -12.095996856689453, "global_step": 297637, "epoch": 1771} {"train_loss": -11.845746040344238, "global_step": 297638, "epoch": 1771} {"train_loss": -11.964967727661133, "global_step": 297639, "epoch": 1771} {"train_loss": -11.517457962036133, "global_step": 297640, "epoch": 1771} {"train_loss": -11.727313041687012, "global_step": 297641, "epoch": 1771} {"train_loss": -11.12767219543457, "global_step": 297642, "epoch": 1771} {"train_loss": -11.589444160461426, "global_step": 297643, "epoch": 1771} {"train_loss": -11.938526153564453, "global_step": 297644, "epoch": 1771} {"train_loss": -11.190414428710938, "global_step": 297645, "epoch": 1771} {"train_loss": -12.062705039978027, "global_step": 297646, "epoch": 1771} {"train_loss": -11.503375053405762, "global_step": 297647, "epoch": 1771} {"train_loss": -10.365188598632812, "global_step": 297648, "epoch": 1771} {"train_loss": -11.554277420043945, "global_step": 297649, "epoch": 1771} {"train_loss": -11.442167282104492, "global_step": 297650, "epoch": 1771} {"train_loss": -9.21086597442627, "global_step": 297651, "epoch": 1771} {"train_loss": -10.98985481262207, "global_step": 297652, "epoch": 1771} {"train_loss": -11.724148750305176, "global_step": 297653, "epoch": 1771} {"train_loss": -10.26535415649414, "global_step": 297654, "epoch": 1771} {"train_loss": -11.79709529876709, "global_step": 297655, "epoch": 1771} {"train_loss": -10.029682159423828, "global_step": 297656, "epoch": 1771} {"train_loss": -11.602033615112305, "global_step": 297657, "epoch": 1771} {"train_loss": -10.402713775634766, "global_step": 297658, "epoch": 1771} {"train_loss": -10.998848915100098, "global_step": 297659, "epoch": 1771} {"train_loss": -10.512592315673828, "global_step": 297660, "epoch": 1771} {"train_loss": -11.64898681640625, "global_step": 297661, "epoch": 1771} {"train_loss": -10.99798583984375, "global_step": 297662, "epoch": 1771} {"train_loss": -11.917205810546875, "global_step": 297663, "epoch": 1771} {"train_loss": -11.22335433959961, "global_step": 297664, "epoch": 1771} {"train_loss": -11.447427749633789, "global_step": 297665, "epoch": 1771} {"train_loss": -11.868240356445312, "global_step": 297666, "epoch": 1771} {"train_loss": -11.287853240966797, "global_step": 297667, "epoch": 1771} {"train_loss": -11.738948822021484, "global_step": 297668, "epoch": 1771} {"train_loss": -11.388823509216309, "global_step": 297669, "epoch": 1771} {"train_loss": -12.000110626220703, "global_step": 297670, "epoch": 1771} {"train_loss": -11.710070610046387, "global_step": 297671, "epoch": 1771} {"train_loss": -11.42392349243164, "global_step": 297672, "epoch": 1771} {"train_loss": -11.771484375, "global_step": 297673, "epoch": 1771} {"train_loss": -11.172061920166016, "global_step": 297674, "epoch": 1771} {"train_loss": -11.970588684082031, "global_step": 297675, "epoch": 1771} {"train_loss": -11.191658973693848, "global_step": 297676, "epoch": 1771} {"train_loss": -12.035541534423828, "global_step": 297677, "epoch": 1771} {"train_loss": -11.409900665283203, "global_step": 297678, "epoch": 1771} {"train_loss": -12.221567153930664, "global_step": 297679, "epoch": 1771} {"train_loss": -11.612818717956543, "global_step": 297680, "epoch": 1771} {"train_loss": -12.036226272583008, "global_step": 297681, "epoch": 1771} {"train_loss": -11.51544189453125, "global_step": 297682, "epoch": 1771} {"train_loss": -11.815729141235352, "global_step": 297683, "epoch": 1771} {"train_loss": -11.41012191772461, "global_step": 297684, "epoch": 1771} {"train_loss": -11.668455123901367, "global_step": 297685, "epoch": 1771} {"train_loss": -11.316852569580078, "global_step": 297686, "epoch": 1771} {"train_loss": -11.367206573486328, "global_step": 297687, "epoch": 1771} {"train_loss": -11.725509643554688, "global_step": 297688, "epoch": 1771} {"train_loss": -11.867827415466309, "global_step": 297689, "epoch": 1771} {"train_loss": -11.808626174926758, "global_step": 297690, "epoch": 1771} {"train_loss": -12.010777473449707, "global_step": 297691, "epoch": 1771} {"train_loss": -11.889944076538086, "global_step": 297692, "epoch": 1771} {"train_loss": -11.939330101013184, "global_step": 297693, "epoch": 1771} {"train_loss": -11.784202575683594, "global_step": 297694, "epoch": 1771} {"train_loss": -11.640941347394671, "global_step": 297695, "epoch": 1771, "val_loss": 280798.15625} {"train_loss": -11.81959342956543, "global_step": 297696, "epoch": 1772} {"train_loss": -12.067285537719727, "global_step": 297697, "epoch": 1772} {"train_loss": -11.912498474121094, "global_step": 297698, "epoch": 1772} {"train_loss": -11.988191604614258, "global_step": 297699, "epoch": 1772} {"train_loss": -12.245609283447266, "global_step": 297700, "epoch": 1772} {"train_loss": -11.99229621887207, "global_step": 297701, "epoch": 1772} {"train_loss": -12.238081932067871, "global_step": 297702, "epoch": 1772} {"train_loss": -12.150880813598633, "global_step": 297703, "epoch": 1772} {"train_loss": -12.302873611450195, "global_step": 297704, "epoch": 1772} {"train_loss": -12.323596954345703, "global_step": 297705, "epoch": 1772} {"train_loss": -12.21261215209961, "global_step": 297706, "epoch": 1772} {"train_loss": -11.92425537109375, "global_step": 297707, "epoch": 1772} {"train_loss": -12.255681037902832, "global_step": 297708, "epoch": 1772} {"train_loss": -12.214322090148926, "global_step": 297709, "epoch": 1772} {"train_loss": -12.381082534790039, "global_step": 297710, "epoch": 1772} {"train_loss": -12.255901336669922, "global_step": 297711, "epoch": 1772} {"train_loss": -12.350547790527344, "global_step": 297712, "epoch": 1772} {"train_loss": -12.298745155334473, "global_step": 297713, "epoch": 1772} {"train_loss": -12.33816146850586, "global_step": 297714, "epoch": 1772} {"train_loss": -12.257085800170898, "global_step": 297715, "epoch": 1772} {"train_loss": -12.307648658752441, "global_step": 297716, "epoch": 1772} {"train_loss": -12.262552261352539, "global_step": 297717, "epoch": 1772} {"train_loss": -12.187926292419434, "global_step": 297718, "epoch": 1772} {"train_loss": -12.131251335144043, "global_step": 297719, "epoch": 1772} {"train_loss": -12.46048355102539, "global_step": 297720, "epoch": 1772} {"train_loss": -12.17445182800293, "global_step": 297721, "epoch": 1772} {"train_loss": -12.301919937133789, "global_step": 297722, "epoch": 1772} {"train_loss": -12.223155975341797, "global_step": 297723, "epoch": 1772} {"train_loss": -11.893758773803711, "global_step": 297724, "epoch": 1772} {"train_loss": -12.421854019165039, "global_step": 297725, "epoch": 1772} {"train_loss": -12.129035949707031, "global_step": 297726, "epoch": 1772} {"train_loss": -12.419320106506348, "global_step": 297727, "epoch": 1772} {"train_loss": -12.423733711242676, "global_step": 297728, "epoch": 1772} {"train_loss": -12.217049598693848, "global_step": 297729, "epoch": 1772} {"train_loss": -12.491653442382812, "global_step": 297730, "epoch": 1772} {"train_loss": -12.372152328491211, "global_step": 297731, "epoch": 1772} {"train_loss": -12.372551918029785, "global_step": 297732, "epoch": 1772} {"train_loss": -12.256811141967773, "global_step": 297733, "epoch": 1772} {"train_loss": -12.30455207824707, "global_step": 297734, "epoch": 1772} {"train_loss": -12.311932563781738, "global_step": 297735, "epoch": 1772} {"train_loss": -12.479774475097656, "global_step": 297736, "epoch": 1772} {"train_loss": -12.160018920898438, "global_step": 297737, "epoch": 1772} {"train_loss": -12.217195510864258, "global_step": 297738, "epoch": 1772} {"train_loss": -12.506184577941895, "global_step": 297739, "epoch": 1772} {"train_loss": -12.499394416809082, "global_step": 297740, "epoch": 1772} {"train_loss": -12.08675765991211, "global_step": 297741, "epoch": 1772} {"train_loss": -12.35750675201416, "global_step": 297742, "epoch": 1772} {"train_loss": -12.296588897705078, "global_step": 297743, "epoch": 1772} {"train_loss": -12.333854675292969, "global_step": 297744, "epoch": 1772} {"train_loss": -12.223382949829102, "global_step": 297745, "epoch": 1772} {"train_loss": -12.277179718017578, "global_step": 297746, "epoch": 1772} {"train_loss": -12.51829719543457, "global_step": 297747, "epoch": 1772} {"train_loss": -12.287765502929688, "global_step": 297748, "epoch": 1772} {"train_loss": -12.324647903442383, "global_step": 297749, "epoch": 1772} {"train_loss": -12.27006721496582, "global_step": 297750, "epoch": 1772} {"train_loss": -12.245962142944336, "global_step": 297751, "epoch": 1772} {"train_loss": -12.070369720458984, "global_step": 297752, "epoch": 1772} {"train_loss": -11.902559280395508, "global_step": 297753, "epoch": 1772} {"train_loss": -11.892121315002441, "global_step": 297754, "epoch": 1772} {"train_loss": -12.523314476013184, "global_step": 297755, "epoch": 1772} {"train_loss": -12.015589714050293, "global_step": 297756, "epoch": 1772} {"train_loss": -12.100639343261719, "global_step": 297757, "epoch": 1772} {"train_loss": -12.349037170410156, "global_step": 297758, "epoch": 1772} {"train_loss": -12.023628234863281, "global_step": 297759, "epoch": 1772} {"train_loss": -12.592023849487305, "global_step": 297760, "epoch": 1772} {"train_loss": -11.811720848083496, "global_step": 297761, "epoch": 1772} {"train_loss": -12.126124382019043, "global_step": 297762, "epoch": 1772} {"train_loss": -12.046038627624512, "global_step": 297763, "epoch": 1772} {"train_loss": -12.375293731689453, "global_step": 297764, "epoch": 1772} {"train_loss": -11.943413734436035, "global_step": 297765, "epoch": 1772} {"train_loss": -12.340673446655273, "global_step": 297766, "epoch": 1772} {"train_loss": -12.312288284301758, "global_step": 297767, "epoch": 1772} {"train_loss": -12.469718933105469, "global_step": 297768, "epoch": 1772} {"train_loss": -12.09543228149414, "global_step": 297769, "epoch": 1772} {"train_loss": -11.659859657287598, "global_step": 297770, "epoch": 1772} {"train_loss": -11.669906616210938, "global_step": 297771, "epoch": 1772} {"train_loss": -11.935908317565918, "global_step": 297772, "epoch": 1772} {"train_loss": -11.929512023925781, "global_step": 297773, "epoch": 1772} {"train_loss": -11.970870971679688, "global_step": 297774, "epoch": 1772} {"train_loss": -11.891462326049805, "global_step": 297775, "epoch": 1772} {"train_loss": -11.46394157409668, "global_step": 297776, "epoch": 1772} {"train_loss": -12.410465240478516, "global_step": 297777, "epoch": 1772} {"train_loss": -11.889337539672852, "global_step": 297778, "epoch": 1772} {"train_loss": -12.298381805419922, "global_step": 297779, "epoch": 1772} {"train_loss": -12.172323226928711, "global_step": 297780, "epoch": 1772} {"train_loss": -12.054303169250488, "global_step": 297781, "epoch": 1772} {"train_loss": -11.583873748779297, "global_step": 297782, "epoch": 1772} {"train_loss": -12.208524703979492, "global_step": 297783, "epoch": 1772} {"train_loss": -11.899859428405762, "global_step": 297784, "epoch": 1772} {"train_loss": -11.254822731018066, "global_step": 297785, "epoch": 1772} {"train_loss": -11.510591506958008, "global_step": 297786, "epoch": 1772} {"train_loss": -12.098033905029297, "global_step": 297787, "epoch": 1772} {"train_loss": -11.976890563964844, "global_step": 297788, "epoch": 1772} {"train_loss": -11.684030532836914, "global_step": 297789, "epoch": 1772} {"train_loss": -12.075109481811523, "global_step": 297790, "epoch": 1772} {"train_loss": -12.08202075958252, "global_step": 297791, "epoch": 1772} {"train_loss": -11.258991241455078, "global_step": 297792, "epoch": 1772} {"train_loss": -11.615495681762695, "global_step": 297793, "epoch": 1772} {"train_loss": -11.404982566833496, "global_step": 297794, "epoch": 1772} {"train_loss": -11.407045364379883, "global_step": 297795, "epoch": 1772} {"train_loss": -11.261335372924805, "global_step": 297796, "epoch": 1772} {"train_loss": -12.345709800720215, "global_step": 297797, "epoch": 1772} {"train_loss": -11.208908081054688, "global_step": 297798, "epoch": 1772} {"train_loss": -10.97958755493164, "global_step": 297799, "epoch": 1772} {"train_loss": -11.376409530639648, "global_step": 297800, "epoch": 1772} {"train_loss": -11.339343070983887, "global_step": 297801, "epoch": 1772} {"train_loss": -10.138289451599121, "global_step": 297802, "epoch": 1772} {"train_loss": -10.99182415008545, "global_step": 297803, "epoch": 1772} {"train_loss": -10.111557006835938, "global_step": 297804, "epoch": 1772} {"train_loss": -10.048674583435059, "global_step": 297805, "epoch": 1772} {"train_loss": -10.685834884643555, "global_step": 297806, "epoch": 1772} {"train_loss": -10.594066619873047, "global_step": 297807, "epoch": 1772} {"train_loss": -9.864309310913086, "global_step": 297808, "epoch": 1772} {"train_loss": -10.972339630126953, "global_step": 297809, "epoch": 1772} {"train_loss": -10.38724136352539, "global_step": 297810, "epoch": 1772} {"train_loss": -9.142969131469727, "global_step": 297811, "epoch": 1772} {"train_loss": -11.213762283325195, "global_step": 297812, "epoch": 1772} {"train_loss": -9.381882667541504, "global_step": 297813, "epoch": 1772} {"train_loss": -10.58991813659668, "global_step": 297814, "epoch": 1772} {"train_loss": -9.876220703125, "global_step": 297815, "epoch": 1772} {"train_loss": -11.019086837768555, "global_step": 297816, "epoch": 1772} {"train_loss": -10.14937973022461, "global_step": 297817, "epoch": 1772} {"train_loss": -11.351524353027344, "global_step": 297818, "epoch": 1772} {"train_loss": -8.806068420410156, "global_step": 297819, "epoch": 1772} {"train_loss": -11.006972312927246, "global_step": 297820, "epoch": 1772} {"train_loss": -9.508001327514648, "global_step": 297821, "epoch": 1772} {"train_loss": -10.636297225952148, "global_step": 297822, "epoch": 1772} {"train_loss": -10.459396362304688, "global_step": 297823, "epoch": 1772} {"train_loss": -10.963119506835938, "global_step": 297824, "epoch": 1772} {"train_loss": -10.352334976196289, "global_step": 297825, "epoch": 1772} {"train_loss": -11.224112510681152, "global_step": 297826, "epoch": 1772} {"train_loss": -11.049388885498047, "global_step": 297827, "epoch": 1772} {"train_loss": -10.970657348632812, "global_step": 297828, "epoch": 1772} {"train_loss": -11.421038627624512, "global_step": 297829, "epoch": 1772} {"train_loss": -11.161934852600098, "global_step": 297830, "epoch": 1772} {"train_loss": -11.706830978393555, "global_step": 297831, "epoch": 1772} {"train_loss": -11.552501678466797, "global_step": 297832, "epoch": 1772} {"train_loss": -11.50217056274414, "global_step": 297833, "epoch": 1772} {"train_loss": -11.56159782409668, "global_step": 297834, "epoch": 1772} {"train_loss": -11.558161735534668, "global_step": 297835, "epoch": 1772} {"train_loss": -11.628355026245117, "global_step": 297836, "epoch": 1772} {"train_loss": -11.62220573425293, "global_step": 297837, "epoch": 1772} {"train_loss": -11.629737854003906, "global_step": 297838, "epoch": 1772} {"train_loss": -11.95592212677002, "global_step": 297839, "epoch": 1772} {"train_loss": -11.603643417358398, "global_step": 297840, "epoch": 1772} {"train_loss": -11.70777416229248, "global_step": 297841, "epoch": 1772} {"train_loss": -11.686247825622559, "global_step": 297842, "epoch": 1772} {"train_loss": -11.817764282226562, "global_step": 297843, "epoch": 1772} {"train_loss": -11.851783752441406, "global_step": 297844, "epoch": 1772} {"train_loss": -12.086158752441406, "global_step": 297845, "epoch": 1772} {"train_loss": -11.913209915161133, "global_step": 297846, "epoch": 1772} {"train_loss": -12.100654602050781, "global_step": 297847, "epoch": 1772} {"train_loss": -12.058622360229492, "global_step": 297848, "epoch": 1772} {"train_loss": -11.784675598144531, "global_step": 297849, "epoch": 1772} {"train_loss": -11.929319381713867, "global_step": 297850, "epoch": 1772} {"train_loss": -11.757640838623047, "global_step": 297851, "epoch": 1772} {"train_loss": -12.042905807495117, "global_step": 297852, "epoch": 1772} {"train_loss": -11.993616104125977, "global_step": 297853, "epoch": 1772} {"train_loss": -11.943889617919922, "global_step": 297854, "epoch": 1772} {"train_loss": -11.803271293640137, "global_step": 297855, "epoch": 1772} {"train_loss": -12.089977264404297, "global_step": 297856, "epoch": 1772} {"train_loss": -11.79815673828125, "global_step": 297857, "epoch": 1772} {"train_loss": -11.890475273132324, "global_step": 297858, "epoch": 1772} {"train_loss": -11.831565856933594, "global_step": 297859, "epoch": 1772} {"train_loss": -11.777536392211914, "global_step": 297860, "epoch": 1772} {"train_loss": -12.024495124816895, "global_step": 297861, "epoch": 1772} {"train_loss": -12.257314682006836, "global_step": 297862, "epoch": 1772} {"train_loss": -11.761067208789644, "global_step": 297863, "epoch": 1772, "val_loss": 283546.25} {"train_loss": -12.045461654663086, "global_step": 297864, "epoch": 1773} {"train_loss": -12.182472229003906, "global_step": 297865, "epoch": 1773} {"train_loss": -11.80834674835205, "global_step": 297866, "epoch": 1773} {"train_loss": -11.994924545288086, "global_step": 297867, "epoch": 1773} {"train_loss": -12.17242431640625, "global_step": 297868, "epoch": 1773} {"train_loss": -12.077632904052734, "global_step": 297869, "epoch": 1773} {"train_loss": -12.194623947143555, "global_step": 297870, "epoch": 1773} {"train_loss": -12.059173583984375, "global_step": 297871, "epoch": 1773} {"train_loss": -12.301876068115234, "global_step": 297872, "epoch": 1773} {"train_loss": -12.089478492736816, "global_step": 297873, "epoch": 1773} {"train_loss": -12.416498184204102, "global_step": 297874, "epoch": 1773} {"train_loss": -12.220853805541992, "global_step": 297875, "epoch": 1773} {"train_loss": -12.27342700958252, "global_step": 297876, "epoch": 1773} {"train_loss": -12.218099594116211, "global_step": 297877, "epoch": 1773} {"train_loss": -12.21968936920166, "global_step": 297878, "epoch": 1773} {"train_loss": -12.21899700164795, "global_step": 297879, "epoch": 1773} {"train_loss": -12.283638000488281, "global_step": 297880, "epoch": 1773} {"train_loss": -12.165626525878906, "global_step": 297881, "epoch": 1773} {"train_loss": -12.483716011047363, "global_step": 297882, "epoch": 1773} {"train_loss": -12.198427200317383, "global_step": 297883, "epoch": 1773} {"train_loss": -12.246479034423828, "global_step": 297884, "epoch": 1773} {"train_loss": -12.286677360534668, "global_step": 297885, "epoch": 1773} {"train_loss": -11.891862869262695, "global_step": 297886, "epoch": 1773} {"train_loss": -12.478164672851562, "global_step": 297887, "epoch": 1773} {"train_loss": -12.351554870605469, "global_step": 297888, "epoch": 1773} {"train_loss": -12.395776748657227, "global_step": 297889, "epoch": 1773} {"train_loss": -12.426183700561523, "global_step": 297890, "epoch": 1773} {"train_loss": -12.437499046325684, "global_step": 297891, "epoch": 1773} {"train_loss": -12.452398300170898, "global_step": 297892, "epoch": 1773} {"train_loss": -12.341707229614258, "global_step": 297893, "epoch": 1773} {"train_loss": -12.417698860168457, "global_step": 297894, "epoch": 1773} {"train_loss": -12.493392944335938, "global_step": 297895, "epoch": 1773} {"train_loss": -12.444854736328125, "global_step": 297896, "epoch": 1773} {"train_loss": -12.488407135009766, "global_step": 297897, "epoch": 1773} {"train_loss": -12.122154235839844, "global_step": 297898, "epoch": 1773} {"train_loss": -12.220414161682129, "global_step": 297899, "epoch": 1773} {"train_loss": -12.440887451171875, "global_step": 297900, "epoch": 1773} {"train_loss": -12.448307037353516, "global_step": 297901, "epoch": 1773} {"train_loss": -12.103622436523438, "global_step": 297902, "epoch": 1773} {"train_loss": -12.34131908416748, "global_step": 297903, "epoch": 1773} {"train_loss": -12.316106796264648, "global_step": 297904, "epoch": 1773} {"train_loss": -11.993407249450684, "global_step": 297905, "epoch": 1773} {"train_loss": -12.358301162719727, "global_step": 297906, "epoch": 1773} {"train_loss": -11.908696174621582, "global_step": 297907, "epoch": 1773} {"train_loss": -12.282842636108398, "global_step": 297908, "epoch": 1773} {"train_loss": -11.452858924865723, "global_step": 297909, "epoch": 1773} {"train_loss": -11.476378440856934, "global_step": 297910, "epoch": 1773} {"train_loss": -11.344884872436523, "global_step": 297911, "epoch": 1773} {"train_loss": -11.667232513427734, "global_step": 297912, "epoch": 1773} {"train_loss": -11.30632209777832, "global_step": 297913, "epoch": 1773} {"train_loss": -11.715719223022461, "global_step": 297914, "epoch": 1773} {"train_loss": -11.495574951171875, "global_step": 297915, "epoch": 1773} {"train_loss": -12.28521728515625, "global_step": 297916, "epoch": 1773} {"train_loss": -11.773590087890625, "global_step": 297917, "epoch": 1773} {"train_loss": -11.286846160888672, "global_step": 297918, "epoch": 1773} {"train_loss": -11.243413925170898, "global_step": 297919, "epoch": 1773} {"train_loss": -11.829312324523926, "global_step": 297920, "epoch": 1773} {"train_loss": -11.948114395141602, "global_step": 297921, "epoch": 1773} {"train_loss": -12.003515243530273, "global_step": 297922, "epoch": 1773} {"train_loss": -11.959610939025879, "global_step": 297923, "epoch": 1773} {"train_loss": -11.752148628234863, "global_step": 297924, "epoch": 1773} {"train_loss": -11.937853813171387, "global_step": 297925, "epoch": 1773} {"train_loss": -12.147632598876953, "global_step": 297926, "epoch": 1773} {"train_loss": -11.991273880004883, "global_step": 297927, "epoch": 1773} {"train_loss": -11.818342208862305, "global_step": 297928, "epoch": 1773} {"train_loss": -11.808015823364258, "global_step": 297929, "epoch": 1773} {"train_loss": -11.894037246704102, "global_step": 297930, "epoch": 1773} {"train_loss": -12.033692359924316, "global_step": 297931, "epoch": 1773} {"train_loss": -12.037416458129883, "global_step": 297932, "epoch": 1773} {"train_loss": -11.666168212890625, "global_step": 297933, "epoch": 1773} {"train_loss": -11.567638397216797, "global_step": 297934, "epoch": 1773} {"train_loss": -12.00652027130127, "global_step": 297935, "epoch": 1773} {"train_loss": -10.908836364746094, "global_step": 297936, "epoch": 1773} {"train_loss": -11.772798538208008, "global_step": 297937, "epoch": 1773} {"train_loss": -11.141265869140625, "global_step": 297938, "epoch": 1773} {"train_loss": -11.379372596740723, "global_step": 297939, "epoch": 1773} {"train_loss": -11.937040328979492, "global_step": 297940, "epoch": 1773} {"train_loss": -11.682195663452148, "global_step": 297941, "epoch": 1773} {"train_loss": -11.764325141906738, "global_step": 297942, "epoch": 1773} {"train_loss": -11.028746604919434, "global_step": 297943, "epoch": 1773} {"train_loss": -11.158016204833984, "global_step": 297944, "epoch": 1773} {"train_loss": -10.707804679870605, "global_step": 297945, "epoch": 1773} {"train_loss": -11.018024444580078, "global_step": 297946, "epoch": 1773} {"train_loss": -10.920775413513184, "global_step": 297947, "epoch": 1773} {"train_loss": -9.969947814941406, "global_step": 297948, "epoch": 1773} {"train_loss": -10.9838285446167, "global_step": 297949, "epoch": 1773} {"train_loss": -10.021454811096191, "global_step": 297950, "epoch": 1773} {"train_loss": -11.729480743408203, "global_step": 297951, "epoch": 1773} {"train_loss": -9.828688621520996, "global_step": 297952, "epoch": 1773} {"train_loss": -11.799064636230469, "global_step": 297953, "epoch": 1773} {"train_loss": -11.13305377960205, "global_step": 297954, "epoch": 1773} {"train_loss": -11.361119270324707, "global_step": 297955, "epoch": 1773} {"train_loss": -11.145511627197266, "global_step": 297956, "epoch": 1773} {"train_loss": -11.144662857055664, "global_step": 297957, "epoch": 1773} {"train_loss": -11.353979110717773, "global_step": 297958, "epoch": 1773} {"train_loss": -11.67910385131836, "global_step": 297959, "epoch": 1773} {"train_loss": -11.428701400756836, "global_step": 297960, "epoch": 1773} {"train_loss": -11.231284141540527, "global_step": 297961, "epoch": 1773} {"train_loss": -11.505928993225098, "global_step": 297962, "epoch": 1773} {"train_loss": -11.676448822021484, "global_step": 297963, "epoch": 1773} {"train_loss": -11.545845031738281, "global_step": 297964, "epoch": 1773} {"train_loss": -11.433415412902832, "global_step": 297965, "epoch": 1773} {"train_loss": -11.597293853759766, "global_step": 297966, "epoch": 1773} {"train_loss": -11.425498962402344, "global_step": 297967, "epoch": 1773} {"train_loss": -12.107561111450195, "global_step": 297968, "epoch": 1773} {"train_loss": -11.839841842651367, "global_step": 297969, "epoch": 1773} {"train_loss": -11.678730010986328, "global_step": 297970, "epoch": 1773} {"train_loss": -11.895726203918457, "global_step": 297971, "epoch": 1773} {"train_loss": -11.76395320892334, "global_step": 297972, "epoch": 1773} {"train_loss": -11.823357582092285, "global_step": 297973, "epoch": 1773} {"train_loss": -12.06881046295166, "global_step": 297974, "epoch": 1773} {"train_loss": -11.631363868713379, "global_step": 297975, "epoch": 1773} {"train_loss": -12.000603675842285, "global_step": 297976, "epoch": 1773} {"train_loss": -11.708538055419922, "global_step": 297977, "epoch": 1773} {"train_loss": -12.110225677490234, "global_step": 297978, "epoch": 1773} {"train_loss": -11.854606628417969, "global_step": 297979, "epoch": 1773} {"train_loss": -12.040313720703125, "global_step": 297980, "epoch": 1773} {"train_loss": -11.898975372314453, "global_step": 297981, "epoch": 1773} {"train_loss": -12.201876640319824, "global_step": 297982, "epoch": 1773} {"train_loss": -11.76820182800293, "global_step": 297983, "epoch": 1773} {"train_loss": -11.923442840576172, "global_step": 297984, "epoch": 1773} {"train_loss": -12.080207824707031, "global_step": 297985, "epoch": 1773} {"train_loss": -11.94643783569336, "global_step": 297986, "epoch": 1773} {"train_loss": -11.95302963256836, "global_step": 297987, "epoch": 1773} {"train_loss": -12.234733581542969, "global_step": 297988, "epoch": 1773} {"train_loss": -12.247276306152344, "global_step": 297989, "epoch": 1773} {"train_loss": -11.717710494995117, "global_step": 297990, "epoch": 1773} {"train_loss": -12.255416870117188, "global_step": 297991, "epoch": 1773} {"train_loss": -12.043131828308105, "global_step": 297992, "epoch": 1773} {"train_loss": -12.302773475646973, "global_step": 297993, "epoch": 1773} {"train_loss": -12.026912689208984, "global_step": 297994, "epoch": 1773} {"train_loss": -12.225717544555664, "global_step": 297995, "epoch": 1773} {"train_loss": -12.199572563171387, "global_step": 297996, "epoch": 1773} {"train_loss": -12.296150207519531, "global_step": 297997, "epoch": 1773} {"train_loss": -12.26242733001709, "global_step": 297998, "epoch": 1773} {"train_loss": -12.350497245788574, "global_step": 297999, "epoch": 1773} {"train_loss": -12.179594039916992, "global_step": 298000, "epoch": 1773} {"train_loss": -11.976543426513672, "global_step": 298001, "epoch": 1773} {"train_loss": -12.209321975708008, "global_step": 298002, "epoch": 1773} {"train_loss": -12.090493202209473, "global_step": 298003, "epoch": 1773} {"train_loss": -12.110811233520508, "global_step": 298004, "epoch": 1773} {"train_loss": -12.314140319824219, "global_step": 298005, "epoch": 1773} {"train_loss": -12.178476333618164, "global_step": 298006, "epoch": 1773} {"train_loss": -12.168438911437988, "global_step": 298007, "epoch": 1773} {"train_loss": -12.408182144165039, "global_step": 298008, "epoch": 1773} {"train_loss": -12.026887893676758, "global_step": 298009, "epoch": 1773} {"train_loss": -12.257246017456055, "global_step": 298010, "epoch": 1773} {"train_loss": -11.614959716796875, "global_step": 298011, "epoch": 1773} {"train_loss": -12.141172409057617, "global_step": 298012, "epoch": 1773} {"train_loss": -12.091796875, "global_step": 298013, "epoch": 1773} {"train_loss": -11.21176528930664, "global_step": 298014, "epoch": 1773} {"train_loss": -10.81441593170166, "global_step": 298015, "epoch": 1773} {"train_loss": -12.2636079788208, "global_step": 298016, "epoch": 1773} {"train_loss": -11.388525009155273, "global_step": 298017, "epoch": 1773} {"train_loss": -11.682317733764648, "global_step": 298018, "epoch": 1773} {"train_loss": -11.655723571777344, "global_step": 298019, "epoch": 1773} {"train_loss": -12.123481750488281, "global_step": 298020, "epoch": 1773} {"train_loss": -11.88123893737793, "global_step": 298021, "epoch": 1773} {"train_loss": -11.18878173828125, "global_step": 298022, "epoch": 1773} {"train_loss": -11.988716125488281, "global_step": 298023, "epoch": 1773} {"train_loss": -11.51333999633789, "global_step": 298024, "epoch": 1773} {"train_loss": -11.67825984954834, "global_step": 298025, "epoch": 1773} {"train_loss": -11.891982078552246, "global_step": 298026, "epoch": 1773} {"train_loss": -11.371732711791992, "global_step": 298027, "epoch": 1773} {"train_loss": -11.978960990905762, "global_step": 298028, "epoch": 1773} {"train_loss": -11.73775863647461, "global_step": 298029, "epoch": 1773} {"train_loss": -12.23647689819336, "global_step": 298030, "epoch": 1773} {"train_loss": -11.862059400195168, "global_step": 298031, "epoch": 1773, "val_loss": 280617.25} {"train_loss": -11.670594215393066, "global_step": 298032, "epoch": 1774} {"train_loss": -11.671716690063477, "global_step": 298033, "epoch": 1774} {"train_loss": -11.900111198425293, "global_step": 298034, "epoch": 1774} {"train_loss": -11.98647689819336, "global_step": 298035, "epoch": 1774} {"train_loss": -11.666236877441406, "global_step": 298036, "epoch": 1774} {"train_loss": -11.924954414367676, "global_step": 298037, "epoch": 1774} {"train_loss": -11.631817817687988, "global_step": 298038, "epoch": 1774} {"train_loss": -11.646851539611816, "global_step": 298039, "epoch": 1774} {"train_loss": -11.859594345092773, "global_step": 298040, "epoch": 1774} {"train_loss": -11.851184844970703, "global_step": 298041, "epoch": 1774} {"train_loss": -12.139358520507812, "global_step": 298042, "epoch": 1774} {"train_loss": -11.77381706237793, "global_step": 298043, "epoch": 1774} {"train_loss": -11.7674560546875, "global_step": 298044, "epoch": 1774} {"train_loss": -11.544095039367676, "global_step": 298045, "epoch": 1774} {"train_loss": -11.889640808105469, "global_step": 298046, "epoch": 1774} {"train_loss": -11.518770217895508, "global_step": 298047, "epoch": 1774} {"train_loss": -11.564172744750977, "global_step": 298048, "epoch": 1774} {"train_loss": -11.804071426391602, "global_step": 298049, "epoch": 1774} {"train_loss": -11.542757034301758, "global_step": 298050, "epoch": 1774} {"train_loss": -11.16991901397705, "global_step": 298051, "epoch": 1774} {"train_loss": -11.961812973022461, "global_step": 298052, "epoch": 1774} {"train_loss": -11.230483055114746, "global_step": 298053, "epoch": 1774} {"train_loss": -12.041801452636719, "global_step": 298054, "epoch": 1774} {"train_loss": -11.909439086914062, "global_step": 298055, "epoch": 1774} {"train_loss": -11.751852035522461, "global_step": 298056, "epoch": 1774} {"train_loss": -12.089868545532227, "global_step": 298057, "epoch": 1774} {"train_loss": -11.870049476623535, "global_step": 298058, "epoch": 1774} {"train_loss": -12.423807144165039, "global_step": 298059, "epoch": 1774} {"train_loss": -11.824705123901367, "global_step": 298060, "epoch": 1774} {"train_loss": -12.009021759033203, "global_step": 298061, "epoch": 1774} {"train_loss": -11.8079833984375, "global_step": 298062, "epoch": 1774} {"train_loss": -11.999814987182617, "global_step": 298063, "epoch": 1774} {"train_loss": -11.919349670410156, "global_step": 298064, "epoch": 1774} {"train_loss": -12.200163841247559, "global_step": 298065, "epoch": 1774} {"train_loss": -11.938751220703125, "global_step": 298066, "epoch": 1774} {"train_loss": -12.032888412475586, "global_step": 298067, "epoch": 1774} {"train_loss": -11.928655624389648, "global_step": 298068, "epoch": 1774} {"train_loss": -12.111367225646973, "global_step": 298069, "epoch": 1774} {"train_loss": -11.854288101196289, "global_step": 298070, "epoch": 1774} {"train_loss": -11.801261901855469, "global_step": 298071, "epoch": 1774} {"train_loss": -11.60478401184082, "global_step": 298072, "epoch": 1774} {"train_loss": -12.119367599487305, "global_step": 298073, "epoch": 1774} {"train_loss": -11.927253723144531, "global_step": 298074, "epoch": 1774} {"train_loss": -11.887622833251953, "global_step": 298075, "epoch": 1774} {"train_loss": -12.309843063354492, "global_step": 298076, "epoch": 1774} {"train_loss": -11.627737045288086, "global_step": 298077, "epoch": 1774} {"train_loss": -12.110218048095703, "global_step": 298078, "epoch": 1774} {"train_loss": -12.05075454711914, "global_step": 298079, "epoch": 1774} {"train_loss": -11.14107894897461, "global_step": 298080, "epoch": 1774} {"train_loss": -11.225284576416016, "global_step": 298081, "epoch": 1774} {"train_loss": -11.87774658203125, "global_step": 298082, "epoch": 1774} {"train_loss": -11.657377243041992, "global_step": 298083, "epoch": 1774} {"train_loss": -11.827820777893066, "global_step": 298084, "epoch": 1774} {"train_loss": -11.515081405639648, "global_step": 298085, "epoch": 1774} {"train_loss": -12.189558982849121, "global_step": 298086, "epoch": 1774} {"train_loss": -11.834981918334961, "global_step": 298087, "epoch": 1774} {"train_loss": -11.586332321166992, "global_step": 298088, "epoch": 1774} {"train_loss": -11.461296081542969, "global_step": 298089, "epoch": 1774} {"train_loss": -11.957456588745117, "global_step": 298090, "epoch": 1774} {"train_loss": -11.724092483520508, "global_step": 298091, "epoch": 1774} {"train_loss": -11.910423278808594, "global_step": 298092, "epoch": 1774} {"train_loss": -11.995382308959961, "global_step": 298093, "epoch": 1774} {"train_loss": -11.844463348388672, "global_step": 298094, "epoch": 1774} {"train_loss": -11.47608470916748, "global_step": 298095, "epoch": 1774} {"train_loss": -11.436704635620117, "global_step": 298096, "epoch": 1774} {"train_loss": -12.117936134338379, "global_step": 298097, "epoch": 1774} {"train_loss": -11.796769142150879, "global_step": 298098, "epoch": 1774} {"train_loss": -12.067874908447266, "global_step": 298099, "epoch": 1774} {"train_loss": -11.843290328979492, "global_step": 298100, "epoch": 1774} {"train_loss": -12.058124542236328, "global_step": 298101, "epoch": 1774} {"train_loss": -11.711640357971191, "global_step": 298102, "epoch": 1774} {"train_loss": -11.936111450195312, "global_step": 298103, "epoch": 1774} {"train_loss": -12.159523010253906, "global_step": 298104, "epoch": 1774} {"train_loss": -11.764913558959961, "global_step": 298105, "epoch": 1774} {"train_loss": -12.111000061035156, "global_step": 298106, "epoch": 1774} {"train_loss": -11.919755935668945, "global_step": 298107, "epoch": 1774} {"train_loss": -11.933966636657715, "global_step": 298108, "epoch": 1774} {"train_loss": -11.767206192016602, "global_step": 298109, "epoch": 1774} {"train_loss": -12.060397148132324, "global_step": 298110, "epoch": 1774} {"train_loss": -11.99738597869873, "global_step": 298111, "epoch": 1774} {"train_loss": -12.002008438110352, "global_step": 298112, "epoch": 1774} {"train_loss": -11.978801727294922, "global_step": 298113, "epoch": 1774} {"train_loss": -12.018016815185547, "global_step": 298114, "epoch": 1774} {"train_loss": -12.306447982788086, "global_step": 298115, "epoch": 1774} {"train_loss": -12.156465530395508, "global_step": 298116, "epoch": 1774} {"train_loss": -12.024352073669434, "global_step": 298117, "epoch": 1774} {"train_loss": -12.163490295410156, "global_step": 298118, "epoch": 1774} {"train_loss": -12.221061706542969, "global_step": 298119, "epoch": 1774} {"train_loss": -11.742899894714355, "global_step": 298120, "epoch": 1774} {"train_loss": -12.242782592773438, "global_step": 298121, "epoch": 1774} {"train_loss": -12.27530288696289, "global_step": 298122, "epoch": 1774} {"train_loss": -12.284299850463867, "global_step": 298123, "epoch": 1774} {"train_loss": -12.040448188781738, "global_step": 298124, "epoch": 1774} {"train_loss": -12.173510551452637, "global_step": 298125, "epoch": 1774} {"train_loss": -12.293008804321289, "global_step": 298126, "epoch": 1774} {"train_loss": -12.311147689819336, "global_step": 298127, "epoch": 1774} {"train_loss": -12.218287467956543, "global_step": 298128, "epoch": 1774} {"train_loss": -12.358335494995117, "global_step": 298129, "epoch": 1774} {"train_loss": -12.281879425048828, "global_step": 298130, "epoch": 1774} {"train_loss": -12.516500473022461, "global_step": 298131, "epoch": 1774} {"train_loss": -12.191017150878906, "global_step": 298132, "epoch": 1774} {"train_loss": -12.249046325683594, "global_step": 298133, "epoch": 1774} {"train_loss": -12.540609359741211, "global_step": 298134, "epoch": 1774} {"train_loss": -12.045164108276367, "global_step": 298135, "epoch": 1774} {"train_loss": -12.559558868408203, "global_step": 298136, "epoch": 1774} {"train_loss": -12.265267372131348, "global_step": 298137, "epoch": 1774} {"train_loss": -12.400629043579102, "global_step": 298138, "epoch": 1774} {"train_loss": -12.41604232788086, "global_step": 298139, "epoch": 1774} {"train_loss": -12.144760131835938, "global_step": 298140, "epoch": 1774} {"train_loss": -12.442230224609375, "global_step": 298141, "epoch": 1774} {"train_loss": -12.287701606750488, "global_step": 298142, "epoch": 1774} {"train_loss": -12.309106826782227, "global_step": 298143, "epoch": 1774} {"train_loss": -12.131346702575684, "global_step": 298144, "epoch": 1774} {"train_loss": -12.357759475708008, "global_step": 298145, "epoch": 1774} {"train_loss": -12.45093059539795, "global_step": 298146, "epoch": 1774} {"train_loss": -12.413671493530273, "global_step": 298147, "epoch": 1774} {"train_loss": -12.52342414855957, "global_step": 298148, "epoch": 1774} {"train_loss": -12.30238151550293, "global_step": 298149, "epoch": 1774} {"train_loss": -12.232385635375977, "global_step": 298150, "epoch": 1774} {"train_loss": -12.47938346862793, "global_step": 298151, "epoch": 1774} {"train_loss": -12.3339204788208, "global_step": 298152, "epoch": 1774} {"train_loss": -12.50644588470459, "global_step": 298153, "epoch": 1774} {"train_loss": -12.224379539489746, "global_step": 298154, "epoch": 1774} {"train_loss": -12.32991886138916, "global_step": 298155, "epoch": 1774} {"train_loss": -12.289525985717773, "global_step": 298156, "epoch": 1774} {"train_loss": -11.94102954864502, "global_step": 298157, "epoch": 1774} {"train_loss": -11.421823501586914, "global_step": 298158, "epoch": 1774} {"train_loss": -11.489255905151367, "global_step": 298159, "epoch": 1774} {"train_loss": -11.782503128051758, "global_step": 298160, "epoch": 1774} {"train_loss": -12.473868370056152, "global_step": 298161, "epoch": 1774} {"train_loss": -11.417224884033203, "global_step": 298162, "epoch": 1774} {"train_loss": -10.638191223144531, "global_step": 298163, "epoch": 1774} {"train_loss": -12.019918441772461, "global_step": 298164, "epoch": 1774} {"train_loss": -9.668290138244629, "global_step": 298165, "epoch": 1774} {"train_loss": -10.803092956542969, "global_step": 298166, "epoch": 1774} {"train_loss": -10.553199768066406, "global_step": 298167, "epoch": 1774} {"train_loss": -9.564833641052246, "global_step": 298168, "epoch": 1774} {"train_loss": -10.827728271484375, "global_step": 298169, "epoch": 1774} {"train_loss": -7.5029401779174805, "global_step": 298170, "epoch": 1774} {"train_loss": -8.02033805847168, "global_step": 298171, "epoch": 1774} {"train_loss": -9.300165176391602, "global_step": 298172, "epoch": 1774} {"train_loss": -10.57474136352539, "global_step": 298173, "epoch": 1774} {"train_loss": -10.398797988891602, "global_step": 298174, "epoch": 1774} {"train_loss": -9.401424407958984, "global_step": 298175, "epoch": 1774} {"train_loss": -9.532463073730469, "global_step": 298176, "epoch": 1774} {"train_loss": -10.679767608642578, "global_step": 298177, "epoch": 1774} {"train_loss": -9.488525390625, "global_step": 298178, "epoch": 1774} {"train_loss": -9.806778907775879, "global_step": 298179, "epoch": 1774} {"train_loss": -11.43461799621582, "global_step": 298180, "epoch": 1774} {"train_loss": -10.277826309204102, "global_step": 298181, "epoch": 1774} {"train_loss": -11.101984024047852, "global_step": 298182, "epoch": 1774} {"train_loss": -10.160911560058594, "global_step": 298183, "epoch": 1774} {"train_loss": -11.497323989868164, "global_step": 298184, "epoch": 1774} {"train_loss": -9.822698593139648, "global_step": 298185, "epoch": 1774} {"train_loss": -11.170257568359375, "global_step": 298186, "epoch": 1774} {"train_loss": -10.482807159423828, "global_step": 298187, "epoch": 1774} {"train_loss": -11.02250862121582, "global_step": 298188, "epoch": 1774} {"train_loss": -11.153334617614746, "global_step": 298189, "epoch": 1774} {"train_loss": -10.98033332824707, "global_step": 298190, "epoch": 1774} {"train_loss": -11.531760215759277, "global_step": 298191, "epoch": 1774} {"train_loss": -11.160404205322266, "global_step": 298192, "epoch": 1774} {"train_loss": -11.150481224060059, "global_step": 298193, "epoch": 1774} {"train_loss": -10.576452255249023, "global_step": 298194, "epoch": 1774} {"train_loss": -11.978084564208984, "global_step": 298195, "epoch": 1774} {"train_loss": -11.313902854919434, "global_step": 298196, "epoch": 1774} {"train_loss": -11.771269798278809, "global_step": 298197, "epoch": 1774} {"train_loss": -11.401497840881348, "global_step": 298198, "epoch": 1774} {"train_loss": -11.66249852521079, "global_step": 298199, "epoch": 1774, "val_loss": 280337.15625} {"train_loss": -11.758508682250977, "global_step": 298200, "epoch": 1775} {"train_loss": -11.460986137390137, "global_step": 298201, "epoch": 1775} {"train_loss": -11.663370132446289, "global_step": 298202, "epoch": 1775} {"train_loss": -11.861321449279785, "global_step": 298203, "epoch": 1775} {"train_loss": -11.790806770324707, "global_step": 298204, "epoch": 1775} {"train_loss": -11.646793365478516, "global_step": 298205, "epoch": 1775} {"train_loss": -11.519865036010742, "global_step": 298206, "epoch": 1775} {"train_loss": -12.01303768157959, "global_step": 298207, "epoch": 1775} {"train_loss": -11.525178909301758, "global_step": 298208, "epoch": 1775} {"train_loss": -11.915939331054688, "global_step": 298209, "epoch": 1775} {"train_loss": -11.777798652648926, "global_step": 298210, "epoch": 1775} {"train_loss": -11.693106651306152, "global_step": 298211, "epoch": 1775} {"train_loss": -12.122806549072266, "global_step": 298212, "epoch": 1775} {"train_loss": -11.883001327514648, "global_step": 298213, "epoch": 1775} {"train_loss": -12.136384963989258, "global_step": 298214, "epoch": 1775} {"train_loss": -11.962021827697754, "global_step": 298215, "epoch": 1775} {"train_loss": -11.891217231750488, "global_step": 298216, "epoch": 1775} {"train_loss": -11.945710182189941, "global_step": 298217, "epoch": 1775} {"train_loss": -11.978208541870117, "global_step": 298218, "epoch": 1775} {"train_loss": -11.919240951538086, "global_step": 298219, "epoch": 1775} {"train_loss": -11.954768180847168, "global_step": 298220, "epoch": 1775} {"train_loss": -12.09046459197998, "global_step": 298221, "epoch": 1775} {"train_loss": -11.96845817565918, "global_step": 298222, "epoch": 1775} {"train_loss": -12.080121994018555, "global_step": 298223, "epoch": 1775} {"train_loss": -12.038185119628906, "global_step": 298224, "epoch": 1775} {"train_loss": -11.729881286621094, "global_step": 298225, "epoch": 1775} {"train_loss": -12.091324806213379, "global_step": 298226, "epoch": 1775} {"train_loss": -11.97653579711914, "global_step": 298227, "epoch": 1775} {"train_loss": -12.123733520507812, "global_step": 298228, "epoch": 1775} {"train_loss": -11.959348678588867, "global_step": 298229, "epoch": 1775} {"train_loss": -11.970804214477539, "global_step": 298230, "epoch": 1775} {"train_loss": -12.311431884765625, "global_step": 298231, "epoch": 1775} {"train_loss": -11.878965377807617, "global_step": 298232, "epoch": 1775} {"train_loss": -12.129301071166992, "global_step": 298233, "epoch": 1775} {"train_loss": -12.018289566040039, "global_step": 298234, "epoch": 1775} {"train_loss": -12.096589088439941, "global_step": 298235, "epoch": 1775} {"train_loss": -12.118321418762207, "global_step": 298236, "epoch": 1775} {"train_loss": -11.888341903686523, "global_step": 298237, "epoch": 1775} {"train_loss": -12.205334663391113, "global_step": 298238, "epoch": 1775} {"train_loss": -11.827194213867188, "global_step": 298239, "epoch": 1775} {"train_loss": -12.047698974609375, "global_step": 298240, "epoch": 1775} {"train_loss": -11.86700439453125, "global_step": 298241, "epoch": 1775} {"train_loss": -12.238182067871094, "global_step": 298242, "epoch": 1775} {"train_loss": -11.999024391174316, "global_step": 298243, "epoch": 1775} {"train_loss": -11.841997146606445, "global_step": 298244, "epoch": 1775} {"train_loss": -11.676460266113281, "global_step": 298245, "epoch": 1775} {"train_loss": -12.274555206298828, "global_step": 298246, "epoch": 1775} {"train_loss": -12.142861366271973, "global_step": 298247, "epoch": 1775} {"train_loss": -12.24726676940918, "global_step": 298248, "epoch": 1775} {"train_loss": -11.875142097473145, "global_step": 298249, "epoch": 1775} {"train_loss": -12.04941177368164, "global_step": 298250, "epoch": 1775} {"train_loss": -12.042391777038574, "global_step": 298251, "epoch": 1775} {"train_loss": -12.020858764648438, "global_step": 298252, "epoch": 1775} {"train_loss": -12.138364791870117, "global_step": 298253, "epoch": 1775} {"train_loss": -12.125265121459961, "global_step": 298254, "epoch": 1775} {"train_loss": -12.143918991088867, "global_step": 298255, "epoch": 1775} {"train_loss": -11.768016815185547, "global_step": 298256, "epoch": 1775} {"train_loss": -12.35840892791748, "global_step": 298257, "epoch": 1775} {"train_loss": -11.826506614685059, "global_step": 298258, "epoch": 1775} {"train_loss": -12.011885643005371, "global_step": 298259, "epoch": 1775} {"train_loss": -11.729763984680176, "global_step": 298260, "epoch": 1775} {"train_loss": -11.725667953491211, "global_step": 298261, "epoch": 1775} {"train_loss": -12.156463623046875, "global_step": 298262, "epoch": 1775} {"train_loss": -12.289176940917969, "global_step": 298263, "epoch": 1775} {"train_loss": -12.353216171264648, "global_step": 298264, "epoch": 1775} {"train_loss": -12.146380424499512, "global_step": 298265, "epoch": 1775} {"train_loss": -12.234024047851562, "global_step": 298266, "epoch": 1775} {"train_loss": -12.049581527709961, "global_step": 298267, "epoch": 1775} {"train_loss": -12.468706130981445, "global_step": 298268, "epoch": 1775} {"train_loss": -12.267836570739746, "global_step": 298269, "epoch": 1775} {"train_loss": -12.337308883666992, "global_step": 298270, "epoch": 1775} {"train_loss": -12.054059982299805, "global_step": 298271, "epoch": 1775} {"train_loss": -12.199708938598633, "global_step": 298272, "epoch": 1775} {"train_loss": -12.183213233947754, "global_step": 298273, "epoch": 1775} {"train_loss": -12.449148178100586, "global_step": 298274, "epoch": 1775} {"train_loss": -12.354496002197266, "global_step": 298275, "epoch": 1775} {"train_loss": -12.420846939086914, "global_step": 298276, "epoch": 1775} {"train_loss": -12.366228103637695, "global_step": 298277, "epoch": 1775} {"train_loss": -12.174251556396484, "global_step": 298278, "epoch": 1775} {"train_loss": -12.029656410217285, "global_step": 298279, "epoch": 1775} {"train_loss": -12.326744079589844, "global_step": 298280, "epoch": 1775} {"train_loss": -12.38621711730957, "global_step": 298281, "epoch": 1775} {"train_loss": -11.638336181640625, "global_step": 298282, "epoch": 1775} {"train_loss": -12.40576171875, "global_step": 298283, "epoch": 1775} {"train_loss": -12.192838668823242, "global_step": 298284, "epoch": 1775} {"train_loss": -11.776725769042969, "global_step": 298285, "epoch": 1775} {"train_loss": -12.13469409942627, "global_step": 298286, "epoch": 1775} {"train_loss": -12.252341270446777, "global_step": 298287, "epoch": 1775} {"train_loss": -11.935306549072266, "global_step": 298288, "epoch": 1775} {"train_loss": -12.213194847106934, "global_step": 298289, "epoch": 1775} {"train_loss": -11.9075345993042, "global_step": 298290, "epoch": 1775} {"train_loss": -11.862567901611328, "global_step": 298291, "epoch": 1775} {"train_loss": -11.419817924499512, "global_step": 298292, "epoch": 1775} {"train_loss": -11.920658111572266, "global_step": 298293, "epoch": 1775} {"train_loss": -11.952849388122559, "global_step": 298294, "epoch": 1775} {"train_loss": -11.593620300292969, "global_step": 298295, "epoch": 1775} {"train_loss": -11.467655181884766, "global_step": 298296, "epoch": 1775} {"train_loss": -11.737159729003906, "global_step": 298297, "epoch": 1775} {"train_loss": -10.564855575561523, "global_step": 298298, "epoch": 1775} {"train_loss": -11.082633972167969, "global_step": 298299, "epoch": 1775} {"train_loss": -10.011914253234863, "global_step": 298300, "epoch": 1775} {"train_loss": -11.026617050170898, "global_step": 298301, "epoch": 1775} {"train_loss": -10.551228523254395, "global_step": 298302, "epoch": 1775} {"train_loss": -8.9060640335083, "global_step": 298303, "epoch": 1775} {"train_loss": -9.305089950561523, "global_step": 298304, "epoch": 1775} {"train_loss": -10.430429458618164, "global_step": 298305, "epoch": 1775} {"train_loss": -10.614147186279297, "global_step": 298306, "epoch": 1775} {"train_loss": -10.45183277130127, "global_step": 298307, "epoch": 1775} {"train_loss": -11.147690773010254, "global_step": 298308, "epoch": 1775} {"train_loss": -9.536039352416992, "global_step": 298309, "epoch": 1775} {"train_loss": -11.585491180419922, "global_step": 298310, "epoch": 1775} {"train_loss": -10.779043197631836, "global_step": 298311, "epoch": 1775} {"train_loss": -11.292505264282227, "global_step": 298312, "epoch": 1775} {"train_loss": -11.201763153076172, "global_step": 298313, "epoch": 1775} {"train_loss": -11.426615715026855, "global_step": 298314, "epoch": 1775} {"train_loss": -11.557761192321777, "global_step": 298315, "epoch": 1775} {"train_loss": -11.851163864135742, "global_step": 298316, "epoch": 1775} {"train_loss": -11.581806182861328, "global_step": 298317, "epoch": 1775} {"train_loss": -11.86735725402832, "global_step": 298318, "epoch": 1775} {"train_loss": -11.675117492675781, "global_step": 298319, "epoch": 1775} {"train_loss": -12.211380004882812, "global_step": 298320, "epoch": 1775} {"train_loss": -11.472397804260254, "global_step": 298321, "epoch": 1775} {"train_loss": -11.896514892578125, "global_step": 298322, "epoch": 1775} {"train_loss": -11.82715892791748, "global_step": 298323, "epoch": 1775} {"train_loss": -11.555732727050781, "global_step": 298324, "epoch": 1775} {"train_loss": -11.779391288757324, "global_step": 298325, "epoch": 1775} {"train_loss": -12.089563369750977, "global_step": 298326, "epoch": 1775} {"train_loss": -12.03873062133789, "global_step": 298327, "epoch": 1775} {"train_loss": -12.09266185760498, "global_step": 298328, "epoch": 1775} {"train_loss": -11.8961181640625, "global_step": 298329, "epoch": 1775} {"train_loss": -12.131656646728516, "global_step": 298330, "epoch": 1775} {"train_loss": -11.906231880187988, "global_step": 298331, "epoch": 1775} {"train_loss": -12.207176208496094, "global_step": 298332, "epoch": 1775} {"train_loss": -12.181471824645996, "global_step": 298333, "epoch": 1775} {"train_loss": -11.671130180358887, "global_step": 298334, "epoch": 1775} {"train_loss": -12.05312442779541, "global_step": 298335, "epoch": 1775} {"train_loss": -11.755270004272461, "global_step": 298336, "epoch": 1775} {"train_loss": -11.623871803283691, "global_step": 298337, "epoch": 1775} {"train_loss": -12.011117935180664, "global_step": 298338, "epoch": 1775} {"train_loss": -12.08283805847168, "global_step": 298339, "epoch": 1775} {"train_loss": -12.109760284423828, "global_step": 298340, "epoch": 1775} {"train_loss": -12.239602088928223, "global_step": 298341, "epoch": 1775} {"train_loss": -11.708105087280273, "global_step": 298342, "epoch": 1775} {"train_loss": -12.210823059082031, "global_step": 298343, "epoch": 1775} {"train_loss": -11.81892204284668, "global_step": 298344, "epoch": 1775} {"train_loss": -12.347179412841797, "global_step": 298345, "epoch": 1775} {"train_loss": -12.350245475769043, "global_step": 298346, "epoch": 1775} {"train_loss": -12.050337791442871, "global_step": 298347, "epoch": 1775} {"train_loss": -12.140569686889648, "global_step": 298348, "epoch": 1775} {"train_loss": -12.13534164428711, "global_step": 298349, "epoch": 1775} {"train_loss": -11.995039939880371, "global_step": 298350, "epoch": 1775} {"train_loss": -12.086518287658691, "global_step": 298351, "epoch": 1775} {"train_loss": -11.907258033752441, "global_step": 298352, "epoch": 1775} {"train_loss": -12.036087036132812, "global_step": 298353, "epoch": 1775} {"train_loss": -12.394176483154297, "global_step": 298354, "epoch": 1775} {"train_loss": -12.101000785827637, "global_step": 298355, "epoch": 1775} {"train_loss": -12.015251159667969, "global_step": 298356, "epoch": 1775} {"train_loss": -12.263577461242676, "global_step": 298357, "epoch": 1775} {"train_loss": -12.00130844116211, "global_step": 298358, "epoch": 1775} {"train_loss": -12.171247482299805, "global_step": 298359, "epoch": 1775} {"train_loss": -12.447303771972656, "global_step": 298360, "epoch": 1775} {"train_loss": -11.949873924255371, "global_step": 298361, "epoch": 1775} {"train_loss": -12.130958557128906, "global_step": 298362, "epoch": 1775} {"train_loss": -12.253291130065918, "global_step": 298363, "epoch": 1775} {"train_loss": -11.954835891723633, "global_step": 298364, "epoch": 1775} {"train_loss": -11.635306358337402, "global_step": 298365, "epoch": 1775} {"train_loss": -12.346359252929688, "global_step": 298366, "epoch": 1775} {"train_loss": -11.857679616837274, "global_step": 298367, "epoch": 1775, "val_loss": 276452.40625, "train_action_mse_error": 1.7070462703704834} {"train_loss": -10.8580322265625, "global_step": 298368, "epoch": 1776} {"train_loss": -12.131416320800781, "global_step": 298369, "epoch": 1776} {"train_loss": -11.483419418334961, "global_step": 298370, "epoch": 1776} {"train_loss": -10.897457122802734, "global_step": 298371, "epoch": 1776} {"train_loss": -11.164817810058594, "global_step": 298372, "epoch": 1776} {"train_loss": -11.713712692260742, "global_step": 298373, "epoch": 1776} {"train_loss": -10.390731811523438, "global_step": 298374, "epoch": 1776} {"train_loss": -11.516155242919922, "global_step": 298375, "epoch": 1776} {"train_loss": -10.929815292358398, "global_step": 298376, "epoch": 1776} {"train_loss": -10.705284118652344, "global_step": 298377, "epoch": 1776} {"train_loss": -11.213006019592285, "global_step": 298378, "epoch": 1776} {"train_loss": -10.046042442321777, "global_step": 298379, "epoch": 1776} {"train_loss": -10.816914558410645, "global_step": 298380, "epoch": 1776} {"train_loss": -11.540182113647461, "global_step": 298381, "epoch": 1776} {"train_loss": -9.848329544067383, "global_step": 298382, "epoch": 1776} {"train_loss": -11.217633247375488, "global_step": 298383, "epoch": 1776} {"train_loss": -9.331354141235352, "global_step": 298384, "epoch": 1776} {"train_loss": -8.7803955078125, "global_step": 298385, "epoch": 1776} {"train_loss": -9.531631469726562, "global_step": 298386, "epoch": 1776} {"train_loss": -9.841606140136719, "global_step": 298387, "epoch": 1776} {"train_loss": -9.148443222045898, "global_step": 298388, "epoch": 1776} {"train_loss": -9.5664644241333, "global_step": 298389, "epoch": 1776} {"train_loss": -9.803609848022461, "global_step": 298390, "epoch": 1776} {"train_loss": -9.57841682434082, "global_step": 298391, "epoch": 1776} {"train_loss": -10.416220664978027, "global_step": 298392, "epoch": 1776} {"train_loss": -10.598628997802734, "global_step": 298393, "epoch": 1776} {"train_loss": -11.152139663696289, "global_step": 298394, "epoch": 1776} {"train_loss": -11.538008689880371, "global_step": 298395, "epoch": 1776} {"train_loss": -11.423015594482422, "global_step": 298396, "epoch": 1776} {"train_loss": -10.900190353393555, "global_step": 298397, "epoch": 1776} {"train_loss": -10.752761840820312, "global_step": 298398, "epoch": 1776} {"train_loss": -10.298131942749023, "global_step": 298399, "epoch": 1776} {"train_loss": -10.927789688110352, "global_step": 298400, "epoch": 1776} {"train_loss": -11.270421981811523, "global_step": 298401, "epoch": 1776} {"train_loss": -11.457965850830078, "global_step": 298402, "epoch": 1776} {"train_loss": -11.417076110839844, "global_step": 298403, "epoch": 1776} {"train_loss": -11.573312759399414, "global_step": 298404, "epoch": 1776} {"train_loss": -11.074411392211914, "global_step": 298405, "epoch": 1776} {"train_loss": -11.554014205932617, "global_step": 298406, "epoch": 1776} {"train_loss": -10.747262954711914, "global_step": 298407, "epoch": 1776} {"train_loss": -11.2147798538208, "global_step": 298408, "epoch": 1776} {"train_loss": -10.759519577026367, "global_step": 298409, "epoch": 1776} {"train_loss": -11.835968017578125, "global_step": 298410, "epoch": 1776} {"train_loss": -11.092385292053223, "global_step": 298411, "epoch": 1776} {"train_loss": -11.951616287231445, "global_step": 298412, "epoch": 1776} {"train_loss": -11.112873077392578, "global_step": 298413, "epoch": 1776} {"train_loss": -11.690597534179688, "global_step": 298414, "epoch": 1776} {"train_loss": -11.543313980102539, "global_step": 298415, "epoch": 1776} {"train_loss": -11.805286407470703, "global_step": 298416, "epoch": 1776} {"train_loss": -11.796618461608887, "global_step": 298417, "epoch": 1776} {"train_loss": -11.704008102416992, "global_step": 298418, "epoch": 1776} {"train_loss": -11.883096694946289, "global_step": 298419, "epoch": 1776} {"train_loss": -11.820900917053223, "global_step": 298420, "epoch": 1776} {"train_loss": -11.756412506103516, "global_step": 298421, "epoch": 1776} {"train_loss": -11.942476272583008, "global_step": 298422, "epoch": 1776} {"train_loss": -11.67997932434082, "global_step": 298423, "epoch": 1776} {"train_loss": -11.887513160705566, "global_step": 298424, "epoch": 1776} {"train_loss": -12.036169052124023, "global_step": 298425, "epoch": 1776} {"train_loss": -12.00104808807373, "global_step": 298426, "epoch": 1776} {"train_loss": -12.072124481201172, "global_step": 298427, "epoch": 1776} {"train_loss": -11.929975509643555, "global_step": 298428, "epoch": 1776} {"train_loss": -11.844648361206055, "global_step": 298429, "epoch": 1776} {"train_loss": -11.895195007324219, "global_step": 298430, "epoch": 1776} {"train_loss": -12.002406120300293, "global_step": 298431, "epoch": 1776} {"train_loss": -11.985786437988281, "global_step": 298432, "epoch": 1776} {"train_loss": -11.926179885864258, "global_step": 298433, "epoch": 1776} {"train_loss": -12.122562408447266, "global_step": 298434, "epoch": 1776} {"train_loss": -12.009893417358398, "global_step": 298435, "epoch": 1776} {"train_loss": -12.226456642150879, "global_step": 298436, "epoch": 1776} {"train_loss": -12.217523574829102, "global_step": 298437, "epoch": 1776} {"train_loss": -12.0176420211792, "global_step": 298438, "epoch": 1776} {"train_loss": -12.323012351989746, "global_step": 298439, "epoch": 1776} {"train_loss": -11.8615083694458, "global_step": 298440, "epoch": 1776} {"train_loss": -11.986649513244629, "global_step": 298441, "epoch": 1776} {"train_loss": -12.061363220214844, "global_step": 298442, "epoch": 1776} {"train_loss": -12.167404174804688, "global_step": 298443, "epoch": 1776} {"train_loss": -12.346212387084961, "global_step": 298444, "epoch": 1776} {"train_loss": -12.199081420898438, "global_step": 298445, "epoch": 1776} {"train_loss": -11.995504379272461, "global_step": 298446, "epoch": 1776} {"train_loss": -12.129695892333984, "global_step": 298447, "epoch": 1776} {"train_loss": -12.095041275024414, "global_step": 298448, "epoch": 1776} {"train_loss": -12.097105979919434, "global_step": 298449, "epoch": 1776} {"train_loss": -12.335477828979492, "global_step": 298450, "epoch": 1776} {"train_loss": -12.0523681640625, "global_step": 298451, "epoch": 1776} {"train_loss": -12.169153213500977, "global_step": 298452, "epoch": 1776} {"train_loss": -12.145824432373047, "global_step": 298453, "epoch": 1776} {"train_loss": -12.034646987915039, "global_step": 298454, "epoch": 1776} {"train_loss": -12.327875137329102, "global_step": 298455, "epoch": 1776} {"train_loss": -12.389530181884766, "global_step": 298456, "epoch": 1776} {"train_loss": -12.462373733520508, "global_step": 298457, "epoch": 1776} {"train_loss": -12.300990104675293, "global_step": 298458, "epoch": 1776} {"train_loss": -12.210552215576172, "global_step": 298459, "epoch": 1776} {"train_loss": -12.190764427185059, "global_step": 298460, "epoch": 1776} {"train_loss": -12.305593490600586, "global_step": 298461, "epoch": 1776} {"train_loss": -12.263102531433105, "global_step": 298462, "epoch": 1776} {"train_loss": -12.426478385925293, "global_step": 298463, "epoch": 1776} {"train_loss": -12.384178161621094, "global_step": 298464, "epoch": 1776} {"train_loss": -12.406932830810547, "global_step": 298465, "epoch": 1776} {"train_loss": -12.437530517578125, "global_step": 298466, "epoch": 1776} {"train_loss": -12.653556823730469, "global_step": 298467, "epoch": 1776} {"train_loss": -12.393789291381836, "global_step": 298468, "epoch": 1776} {"train_loss": -12.016036987304688, "global_step": 298469, "epoch": 1776} {"train_loss": -12.529172897338867, "global_step": 298470, "epoch": 1776} {"train_loss": -12.437806129455566, "global_step": 298471, "epoch": 1776} {"train_loss": -12.4345064163208, "global_step": 298472, "epoch": 1776} {"train_loss": -12.3429536819458, "global_step": 298473, "epoch": 1776} {"train_loss": -12.501941680908203, "global_step": 298474, "epoch": 1776} {"train_loss": -12.220726013183594, "global_step": 298475, "epoch": 1776} {"train_loss": -12.111175537109375, "global_step": 298476, "epoch": 1776} {"train_loss": -12.417520523071289, "global_step": 298477, "epoch": 1776} {"train_loss": -12.182708740234375, "global_step": 298478, "epoch": 1776} {"train_loss": -12.286999702453613, "global_step": 298479, "epoch": 1776} {"train_loss": -12.397600173950195, "global_step": 298480, "epoch": 1776} {"train_loss": -12.247591018676758, "global_step": 298481, "epoch": 1776} {"train_loss": -12.469708442687988, "global_step": 298482, "epoch": 1776} {"train_loss": -11.998810768127441, "global_step": 298483, "epoch": 1776} {"train_loss": -11.447160720825195, "global_step": 298484, "epoch": 1776} {"train_loss": -11.248042106628418, "global_step": 298485, "epoch": 1776} {"train_loss": -12.272224426269531, "global_step": 298486, "epoch": 1776} {"train_loss": -11.642718315124512, "global_step": 298487, "epoch": 1776} {"train_loss": -11.951578140258789, "global_step": 298488, "epoch": 1776} {"train_loss": -11.924222946166992, "global_step": 298489, "epoch": 1776} {"train_loss": -12.123674392700195, "global_step": 298490, "epoch": 1776} {"train_loss": -11.944673538208008, "global_step": 298491, "epoch": 1776} {"train_loss": -11.202070236206055, "global_step": 298492, "epoch": 1776} {"train_loss": -12.173258781433105, "global_step": 298493, "epoch": 1776} {"train_loss": -11.833301544189453, "global_step": 298494, "epoch": 1776} {"train_loss": -11.454404830932617, "global_step": 298495, "epoch": 1776} {"train_loss": -10.611166000366211, "global_step": 298496, "epoch": 1776} {"train_loss": -12.140249252319336, "global_step": 298497, "epoch": 1776} {"train_loss": -10.147750854492188, "global_step": 298498, "epoch": 1776} {"train_loss": -10.714583396911621, "global_step": 298499, "epoch": 1776} {"train_loss": -11.162481307983398, "global_step": 298500, "epoch": 1776} {"train_loss": -11.317977905273438, "global_step": 298501, "epoch": 1776} {"train_loss": -11.080096244812012, "global_step": 298502, "epoch": 1776} {"train_loss": -11.130666732788086, "global_step": 298503, "epoch": 1776} {"train_loss": -9.811574935913086, "global_step": 298504, "epoch": 1776} {"train_loss": -11.948091506958008, "global_step": 298505, "epoch": 1776} {"train_loss": -11.171822547912598, "global_step": 298506, "epoch": 1776} {"train_loss": -11.770832061767578, "global_step": 298507, "epoch": 1776} {"train_loss": -11.650733947753906, "global_step": 298508, "epoch": 1776} {"train_loss": -11.684106826782227, "global_step": 298509, "epoch": 1776} {"train_loss": -11.308162689208984, "global_step": 298510, "epoch": 1776} {"train_loss": -11.992733001708984, "global_step": 298511, "epoch": 1776} {"train_loss": -11.562140464782715, "global_step": 298512, "epoch": 1776} {"train_loss": -12.039165496826172, "global_step": 298513, "epoch": 1776} {"train_loss": -11.594793319702148, "global_step": 298514, "epoch": 1776} {"train_loss": -11.904289245605469, "global_step": 298515, "epoch": 1776} {"train_loss": -11.28506851196289, "global_step": 298516, "epoch": 1776} {"train_loss": -12.124098777770996, "global_step": 298517, "epoch": 1776} {"train_loss": -11.437259674072266, "global_step": 298518, "epoch": 1776} {"train_loss": -11.74394702911377, "global_step": 298519, "epoch": 1776} {"train_loss": -11.350428581237793, "global_step": 298520, "epoch": 1776} {"train_loss": -10.281450271606445, "global_step": 298521, "epoch": 1776} {"train_loss": -11.775439262390137, "global_step": 298522, "epoch": 1776} {"train_loss": -10.454242706298828, "global_step": 298523, "epoch": 1776} {"train_loss": -11.88772201538086, "global_step": 298524, "epoch": 1776} {"train_loss": -10.954119682312012, "global_step": 298525, "epoch": 1776} {"train_loss": -11.776222229003906, "global_step": 298526, "epoch": 1776} {"train_loss": -11.295835494995117, "global_step": 298527, "epoch": 1776} {"train_loss": -11.42976188659668, "global_step": 298528, "epoch": 1776} {"train_loss": -11.565793991088867, "global_step": 298529, "epoch": 1776} {"train_loss": -11.296924591064453, "global_step": 298530, "epoch": 1776} {"train_loss": -11.932836532592773, "global_step": 298531, "epoch": 1776} {"train_loss": -11.619734764099121, "global_step": 298532, "epoch": 1776} {"train_loss": -11.983843803405762, "global_step": 298533, "epoch": 1776} {"train_loss": -12.045965194702148, "global_step": 298534, "epoch": 1776} {"train_loss": -11.572904893330165, "global_step": 298535, "epoch": 1776, "val_loss": 276875.75} {"train_loss": -11.855358123779297, "global_step": 298536, "epoch": 1777} {"train_loss": -11.716221809387207, "global_step": 298537, "epoch": 1777} {"train_loss": -11.760191917419434, "global_step": 298538, "epoch": 1777} {"train_loss": -11.743545532226562, "global_step": 298539, "epoch": 1777} {"train_loss": -12.124860763549805, "global_step": 298540, "epoch": 1777} {"train_loss": -11.87777328491211, "global_step": 298541, "epoch": 1777} {"train_loss": -11.658138275146484, "global_step": 298542, "epoch": 1777} {"train_loss": -11.960280418395996, "global_step": 298543, "epoch": 1777} {"train_loss": -11.270526885986328, "global_step": 298544, "epoch": 1777} {"train_loss": -12.093422889709473, "global_step": 298545, "epoch": 1777} {"train_loss": -11.666038513183594, "global_step": 298546, "epoch": 1777} {"train_loss": -12.066524505615234, "global_step": 298547, "epoch": 1777} {"train_loss": -11.548410415649414, "global_step": 298548, "epoch": 1777} {"train_loss": -12.096075057983398, "global_step": 298549, "epoch": 1777} {"train_loss": -11.735657691955566, "global_step": 298550, "epoch": 1777} {"train_loss": -11.310513496398926, "global_step": 298551, "epoch": 1777} {"train_loss": -11.692618370056152, "global_step": 298552, "epoch": 1777} {"train_loss": -11.546171188354492, "global_step": 298553, "epoch": 1777} {"train_loss": -11.25980281829834, "global_step": 298554, "epoch": 1777} {"train_loss": -11.950101852416992, "global_step": 298555, "epoch": 1777} {"train_loss": -11.35726547241211, "global_step": 298556, "epoch": 1777} {"train_loss": -12.018006324768066, "global_step": 298557, "epoch": 1777} {"train_loss": -11.199344635009766, "global_step": 298558, "epoch": 1777} {"train_loss": -11.857283592224121, "global_step": 298559, "epoch": 1777} {"train_loss": -11.619083404541016, "global_step": 298560, "epoch": 1777} {"train_loss": -11.880105018615723, "global_step": 298561, "epoch": 1777} {"train_loss": -11.075494766235352, "global_step": 298562, "epoch": 1777} {"train_loss": -11.848466873168945, "global_step": 298563, "epoch": 1777} {"train_loss": -11.440359115600586, "global_step": 298564, "epoch": 1777} {"train_loss": -11.931815147399902, "global_step": 298565, "epoch": 1777} {"train_loss": -11.532421112060547, "global_step": 298566, "epoch": 1777} {"train_loss": -11.735663414001465, "global_step": 298567, "epoch": 1777} {"train_loss": -11.818340301513672, "global_step": 298568, "epoch": 1777} {"train_loss": -12.081594467163086, "global_step": 298569, "epoch": 1777} {"train_loss": -11.950885772705078, "global_step": 298570, "epoch": 1777} {"train_loss": -12.017217636108398, "global_step": 298571, "epoch": 1777} {"train_loss": -11.848825454711914, "global_step": 298572, "epoch": 1777} {"train_loss": -11.841516494750977, "global_step": 298573, "epoch": 1777} {"train_loss": -12.195292472839355, "global_step": 298574, "epoch": 1777} {"train_loss": -12.15510368347168, "global_step": 298575, "epoch": 1777} {"train_loss": -12.046875, "global_step": 298576, "epoch": 1777} {"train_loss": -11.901660919189453, "global_step": 298577, "epoch": 1777} {"train_loss": -11.797852516174316, "global_step": 298578, "epoch": 1777} {"train_loss": -11.997087478637695, "global_step": 298579, "epoch": 1777} {"train_loss": -11.890281677246094, "global_step": 298580, "epoch": 1777} {"train_loss": -12.144218444824219, "global_step": 298581, "epoch": 1777} {"train_loss": -11.915305137634277, "global_step": 298582, "epoch": 1777} {"train_loss": -12.038806915283203, "global_step": 298583, "epoch": 1777} {"train_loss": -12.157424926757812, "global_step": 298584, "epoch": 1777} {"train_loss": -12.276975631713867, "global_step": 298585, "epoch": 1777} {"train_loss": -12.078936576843262, "global_step": 298586, "epoch": 1777} {"train_loss": -11.326604843139648, "global_step": 298587, "epoch": 1777} {"train_loss": -11.879042625427246, "global_step": 298588, "epoch": 1777} {"train_loss": -11.783710479736328, "global_step": 298589, "epoch": 1777} {"train_loss": -11.745254516601562, "global_step": 298590, "epoch": 1777} {"train_loss": -12.104728698730469, "global_step": 298591, "epoch": 1777} {"train_loss": -11.423995971679688, "global_step": 298592, "epoch": 1777} {"train_loss": -12.290351867675781, "global_step": 298593, "epoch": 1777} {"train_loss": -11.947380065917969, "global_step": 298594, "epoch": 1777} {"train_loss": -11.674311637878418, "global_step": 298595, "epoch": 1777} {"train_loss": -12.160640716552734, "global_step": 298596, "epoch": 1777} {"train_loss": -10.760088920593262, "global_step": 298597, "epoch": 1777} {"train_loss": -11.860499382019043, "global_step": 298598, "epoch": 1777} {"train_loss": -11.889148712158203, "global_step": 298599, "epoch": 1777} {"train_loss": -11.569894790649414, "global_step": 298600, "epoch": 1777} {"train_loss": -10.972085952758789, "global_step": 298601, "epoch": 1777} {"train_loss": -10.641592025756836, "global_step": 298602, "epoch": 1777} {"train_loss": -10.805608749389648, "global_step": 298603, "epoch": 1777} {"train_loss": -11.624898910522461, "global_step": 298604, "epoch": 1777} {"train_loss": -9.809268951416016, "global_step": 298605, "epoch": 1777} {"train_loss": -10.323741912841797, "global_step": 298606, "epoch": 1777} {"train_loss": -11.728267669677734, "global_step": 298607, "epoch": 1777} {"train_loss": -9.540592193603516, "global_step": 298608, "epoch": 1777} {"train_loss": -10.642316818237305, "global_step": 298609, "epoch": 1777} {"train_loss": -10.182012557983398, "global_step": 298610, "epoch": 1777} {"train_loss": -10.521227836608887, "global_step": 298611, "epoch": 1777} {"train_loss": -10.246194839477539, "global_step": 298612, "epoch": 1777} {"train_loss": -10.892786026000977, "global_step": 298613, "epoch": 1777} {"train_loss": -10.649223327636719, "global_step": 298614, "epoch": 1777} {"train_loss": -11.996062278747559, "global_step": 298615, "epoch": 1777} {"train_loss": -11.247848510742188, "global_step": 298616, "epoch": 1777} {"train_loss": -11.60476016998291, "global_step": 298617, "epoch": 1777} {"train_loss": -11.48679256439209, "global_step": 298618, "epoch": 1777} {"train_loss": -11.436210632324219, "global_step": 298619, "epoch": 1777} {"train_loss": -11.72563362121582, "global_step": 298620, "epoch": 1777} {"train_loss": -11.575292587280273, "global_step": 298621, "epoch": 1777} {"train_loss": -11.266969680786133, "global_step": 298622, "epoch": 1777} {"train_loss": -11.70795726776123, "global_step": 298623, "epoch": 1777} {"train_loss": -11.827299118041992, "global_step": 298624, "epoch": 1777} {"train_loss": -11.70461654663086, "global_step": 298625, "epoch": 1777} {"train_loss": -11.467561721801758, "global_step": 298626, "epoch": 1777} {"train_loss": -11.837133407592773, "global_step": 298627, "epoch": 1777} {"train_loss": -11.828838348388672, "global_step": 298628, "epoch": 1777} {"train_loss": -11.536054611206055, "global_step": 298629, "epoch": 1777} {"train_loss": -11.886789321899414, "global_step": 298630, "epoch": 1777} {"train_loss": -11.460289001464844, "global_step": 298631, "epoch": 1777} {"train_loss": -12.215014457702637, "global_step": 298632, "epoch": 1777} {"train_loss": -11.625362396240234, "global_step": 298633, "epoch": 1777} {"train_loss": -12.209811210632324, "global_step": 298634, "epoch": 1777} {"train_loss": -11.791746139526367, "global_step": 298635, "epoch": 1777} {"train_loss": -12.139052391052246, "global_step": 298636, "epoch": 1777} {"train_loss": -11.338957786560059, "global_step": 298637, "epoch": 1777} {"train_loss": -12.058773040771484, "global_step": 298638, "epoch": 1777} {"train_loss": -11.275253295898438, "global_step": 298639, "epoch": 1777} {"train_loss": -12.148260116577148, "global_step": 298640, "epoch": 1777} {"train_loss": -11.810617446899414, "global_step": 298641, "epoch": 1777} {"train_loss": -11.651420593261719, "global_step": 298642, "epoch": 1777} {"train_loss": -11.790361404418945, "global_step": 298643, "epoch": 1777} {"train_loss": -12.184497833251953, "global_step": 298644, "epoch": 1777} {"train_loss": -11.945356369018555, "global_step": 298645, "epoch": 1777} {"train_loss": -12.146653175354004, "global_step": 298646, "epoch": 1777} {"train_loss": -11.527620315551758, "global_step": 298647, "epoch": 1777} {"train_loss": -12.00386905670166, "global_step": 298648, "epoch": 1777} {"train_loss": -11.688730239868164, "global_step": 298649, "epoch": 1777} {"train_loss": -11.67341423034668, "global_step": 298650, "epoch": 1777} {"train_loss": -11.482592582702637, "global_step": 298651, "epoch": 1777} {"train_loss": -12.005066871643066, "global_step": 298652, "epoch": 1777} {"train_loss": -11.835190773010254, "global_step": 298653, "epoch": 1777} {"train_loss": -11.78872299194336, "global_step": 298654, "epoch": 1777} {"train_loss": -11.774051666259766, "global_step": 298655, "epoch": 1777} {"train_loss": -12.142292022705078, "global_step": 298656, "epoch": 1777} {"train_loss": -12.199766159057617, "global_step": 298657, "epoch": 1777} {"train_loss": -12.030691146850586, "global_step": 298658, "epoch": 1777} {"train_loss": -12.067413330078125, "global_step": 298659, "epoch": 1777} {"train_loss": -12.233718872070312, "global_step": 298660, "epoch": 1777} {"train_loss": -12.128870010375977, "global_step": 298661, "epoch": 1777} {"train_loss": -11.867456436157227, "global_step": 298662, "epoch": 1777} {"train_loss": -12.384111404418945, "global_step": 298663, "epoch": 1777} {"train_loss": -11.870443344116211, "global_step": 298664, "epoch": 1777} {"train_loss": -12.224711418151855, "global_step": 298665, "epoch": 1777} {"train_loss": -12.227231979370117, "global_step": 298666, "epoch": 1777} {"train_loss": -11.771394729614258, "global_step": 298667, "epoch": 1777} {"train_loss": -11.911412239074707, "global_step": 298668, "epoch": 1777} {"train_loss": -12.183950424194336, "global_step": 298669, "epoch": 1777} {"train_loss": -11.860200881958008, "global_step": 298670, "epoch": 1777} {"train_loss": -12.232719421386719, "global_step": 298671, "epoch": 1777} {"train_loss": -11.91069221496582, "global_step": 298672, "epoch": 1777} {"train_loss": -11.76076889038086, "global_step": 298673, "epoch": 1777} {"train_loss": -11.9496488571167, "global_step": 298674, "epoch": 1777} {"train_loss": -12.169414520263672, "global_step": 298675, "epoch": 1777} {"train_loss": -11.851768493652344, "global_step": 298676, "epoch": 1777} {"train_loss": -11.563946723937988, "global_step": 298677, "epoch": 1777} {"train_loss": -11.729594230651855, "global_step": 298678, "epoch": 1777} {"train_loss": -12.096687316894531, "global_step": 298679, "epoch": 1777} {"train_loss": -11.38248348236084, "global_step": 298680, "epoch": 1777} {"train_loss": -11.81161880493164, "global_step": 298681, "epoch": 1777} {"train_loss": -11.835525512695312, "global_step": 298682, "epoch": 1777} {"train_loss": -11.833057403564453, "global_step": 298683, "epoch": 1777} {"train_loss": -12.107799530029297, "global_step": 298684, "epoch": 1777} {"train_loss": -11.843389511108398, "global_step": 298685, "epoch": 1777} {"train_loss": -12.29513168334961, "global_step": 298686, "epoch": 1777} {"train_loss": -11.889469146728516, "global_step": 298687, "epoch": 1777} {"train_loss": -12.123869895935059, "global_step": 298688, "epoch": 1777} {"train_loss": -12.195759773254395, "global_step": 298689, "epoch": 1777} {"train_loss": -11.999446868896484, "global_step": 298690, "epoch": 1777} {"train_loss": -12.333794593811035, "global_step": 298691, "epoch": 1777} {"train_loss": -12.17786693572998, "global_step": 298692, "epoch": 1777} {"train_loss": -12.364848136901855, "global_step": 298693, "epoch": 1777} {"train_loss": -12.292183876037598, "global_step": 298694, "epoch": 1777} {"train_loss": -12.35604476928711, "global_step": 298695, "epoch": 1777} {"train_loss": -12.378263473510742, "global_step": 298696, "epoch": 1777} {"train_loss": -12.43056583404541, "global_step": 298697, "epoch": 1777} {"train_loss": -12.43578052520752, "global_step": 298698, "epoch": 1777} {"train_loss": -12.239354133605957, "global_step": 298699, "epoch": 1777} {"train_loss": -12.268417358398438, "global_step": 298700, "epoch": 1777} {"train_loss": -12.265813827514648, "global_step": 298701, "epoch": 1777} {"train_loss": -12.568984985351562, "global_step": 298702, "epoch": 1777} {"train_loss": -11.77090763478052, "global_step": 298703, "epoch": 1777, "val_loss": 281932.21875} {"train_loss": -12.295125961303711, "global_step": 298704, "epoch": 1778} {"train_loss": -12.327630996704102, "global_step": 298705, "epoch": 1778} {"train_loss": -12.200431823730469, "global_step": 298706, "epoch": 1778} {"train_loss": -12.136887550354004, "global_step": 298707, "epoch": 1778} {"train_loss": -12.069541931152344, "global_step": 298708, "epoch": 1778} {"train_loss": -12.179086685180664, "global_step": 298709, "epoch": 1778} {"train_loss": -12.203553199768066, "global_step": 298710, "epoch": 1778} {"train_loss": -12.177168846130371, "global_step": 298711, "epoch": 1778} {"train_loss": -12.239984512329102, "global_step": 298712, "epoch": 1778} {"train_loss": -12.484453201293945, "global_step": 298713, "epoch": 1778} {"train_loss": -12.026705741882324, "global_step": 298714, "epoch": 1778} {"train_loss": -11.940616607666016, "global_step": 298715, "epoch": 1778} {"train_loss": -11.903087615966797, "global_step": 298716, "epoch": 1778} {"train_loss": -12.184301376342773, "global_step": 298717, "epoch": 1778} {"train_loss": -12.117733001708984, "global_step": 298718, "epoch": 1778} {"train_loss": -12.326898574829102, "global_step": 298719, "epoch": 1778} {"train_loss": -12.288756370544434, "global_step": 298720, "epoch": 1778} {"train_loss": -11.901408195495605, "global_step": 298721, "epoch": 1778} {"train_loss": -12.004658699035645, "global_step": 298722, "epoch": 1778} {"train_loss": -12.151569366455078, "global_step": 298723, "epoch": 1778} {"train_loss": -11.949129104614258, "global_step": 298724, "epoch": 1778} {"train_loss": -12.383509635925293, "global_step": 298725, "epoch": 1778} {"train_loss": -12.058935165405273, "global_step": 298726, "epoch": 1778} {"train_loss": -12.268394470214844, "global_step": 298727, "epoch": 1778} {"train_loss": -11.995625495910645, "global_step": 298728, "epoch": 1778} {"train_loss": -11.725175857543945, "global_step": 298729, "epoch": 1778} {"train_loss": -11.254013061523438, "global_step": 298730, "epoch": 1778} {"train_loss": -11.79906177520752, "global_step": 298731, "epoch": 1778} {"train_loss": -12.197442054748535, "global_step": 298732, "epoch": 1778} {"train_loss": -12.014110565185547, "global_step": 298733, "epoch": 1778} {"train_loss": -12.18962287902832, "global_step": 298734, "epoch": 1778} {"train_loss": -12.06683349609375, "global_step": 298735, "epoch": 1778} {"train_loss": -11.989243507385254, "global_step": 298736, "epoch": 1778} {"train_loss": -12.346426010131836, "global_step": 298737, "epoch": 1778} {"train_loss": -12.085514068603516, "global_step": 298738, "epoch": 1778} {"train_loss": -11.91379165649414, "global_step": 298739, "epoch": 1778} {"train_loss": -12.30547046661377, "global_step": 298740, "epoch": 1778} {"train_loss": -12.141561508178711, "global_step": 298741, "epoch": 1778} {"train_loss": -12.309358596801758, "global_step": 298742, "epoch": 1778} {"train_loss": -12.04124927520752, "global_step": 298743, "epoch": 1778} {"train_loss": -12.374275207519531, "global_step": 298744, "epoch": 1778} {"train_loss": -12.386228561401367, "global_step": 298745, "epoch": 1778} {"train_loss": -12.15340805053711, "global_step": 298746, "epoch": 1778} {"train_loss": -11.825064659118652, "global_step": 298747, "epoch": 1778} {"train_loss": -12.049701690673828, "global_step": 298748, "epoch": 1778} {"train_loss": -11.495168685913086, "global_step": 298749, "epoch": 1778} {"train_loss": -11.460623741149902, "global_step": 298750, "epoch": 1778} {"train_loss": -12.144577980041504, "global_step": 298751, "epoch": 1778} {"train_loss": -10.66659164428711, "global_step": 298752, "epoch": 1778} {"train_loss": -9.222288131713867, "global_step": 298753, "epoch": 1778} {"train_loss": -10.799543380737305, "global_step": 298754, "epoch": 1778} {"train_loss": -8.35046672821045, "global_step": 298755, "epoch": 1778} {"train_loss": -10.997274398803711, "global_step": 298756, "epoch": 1778} {"train_loss": -9.014066696166992, "global_step": 298757, "epoch": 1778} {"train_loss": -10.322790145874023, "global_step": 298758, "epoch": 1778} {"train_loss": -9.672966003417969, "global_step": 298759, "epoch": 1778} {"train_loss": -10.670519828796387, "global_step": 298760, "epoch": 1778} {"train_loss": -9.317425727844238, "global_step": 298761, "epoch": 1778} {"train_loss": -9.787912368774414, "global_step": 298762, "epoch": 1778} {"train_loss": -9.214018821716309, "global_step": 298763, "epoch": 1778} {"train_loss": -9.292978286743164, "global_step": 298764, "epoch": 1778} {"train_loss": -9.119382858276367, "global_step": 298765, "epoch": 1778} {"train_loss": -10.092620849609375, "global_step": 298766, "epoch": 1778} {"train_loss": -10.375328063964844, "global_step": 298767, "epoch": 1778} {"train_loss": -10.6945161819458, "global_step": 298768, "epoch": 1778} {"train_loss": -11.023237228393555, "global_step": 298769, "epoch": 1778} {"train_loss": -10.995575904846191, "global_step": 298770, "epoch": 1778} {"train_loss": -11.16093635559082, "global_step": 298771, "epoch": 1778} {"train_loss": -10.571272850036621, "global_step": 298772, "epoch": 1778} {"train_loss": -10.956006050109863, "global_step": 298773, "epoch": 1778} {"train_loss": -10.867401123046875, "global_step": 298774, "epoch": 1778} {"train_loss": -11.155196189880371, "global_step": 298775, "epoch": 1778} {"train_loss": -11.257368087768555, "global_step": 298776, "epoch": 1778} {"train_loss": -11.109087944030762, "global_step": 298777, "epoch": 1778} {"train_loss": -11.311225891113281, "global_step": 298778, "epoch": 1778} {"train_loss": -11.177791595458984, "global_step": 298779, "epoch": 1778} {"train_loss": -11.555059432983398, "global_step": 298780, "epoch": 1778} {"train_loss": -10.840959548950195, "global_step": 298781, "epoch": 1778} {"train_loss": -11.725570678710938, "global_step": 298782, "epoch": 1778} {"train_loss": -11.25224781036377, "global_step": 298783, "epoch": 1778} {"train_loss": -11.53310775756836, "global_step": 298784, "epoch": 1778} {"train_loss": -11.955252647399902, "global_step": 298785, "epoch": 1778} {"train_loss": -11.661812782287598, "global_step": 298786, "epoch": 1778} {"train_loss": -11.9122314453125, "global_step": 298787, "epoch": 1778} {"train_loss": -11.902542114257812, "global_step": 298788, "epoch": 1778} {"train_loss": -11.922259330749512, "global_step": 298789, "epoch": 1778} {"train_loss": -11.547773361206055, "global_step": 298790, "epoch": 1778} {"train_loss": -11.856513977050781, "global_step": 298791, "epoch": 1778} {"train_loss": -11.921653747558594, "global_step": 298792, "epoch": 1778} {"train_loss": -11.702369689941406, "global_step": 298793, "epoch": 1778} {"train_loss": -11.900273323059082, "global_step": 298794, "epoch": 1778} {"train_loss": -11.854005813598633, "global_step": 298795, "epoch": 1778} {"train_loss": -11.903666496276855, "global_step": 298796, "epoch": 1778} {"train_loss": -11.947088241577148, "global_step": 298797, "epoch": 1778} {"train_loss": -12.086071014404297, "global_step": 298798, "epoch": 1778} {"train_loss": -11.892337799072266, "global_step": 298799, "epoch": 1778} {"train_loss": -12.070131301879883, "global_step": 298800, "epoch": 1778} {"train_loss": -11.900500297546387, "global_step": 298801, "epoch": 1778} {"train_loss": -12.22593879699707, "global_step": 298802, "epoch": 1778} {"train_loss": -12.031137466430664, "global_step": 298803, "epoch": 1778} {"train_loss": -12.177833557128906, "global_step": 298804, "epoch": 1778} {"train_loss": -11.998416900634766, "global_step": 298805, "epoch": 1778} {"train_loss": -11.903992652893066, "global_step": 298806, "epoch": 1778} {"train_loss": -12.056770324707031, "global_step": 298807, "epoch": 1778} {"train_loss": -12.086453437805176, "global_step": 298808, "epoch": 1778} {"train_loss": -11.853096008300781, "global_step": 298809, "epoch": 1778} {"train_loss": -12.171825408935547, "global_step": 298810, "epoch": 1778} {"train_loss": -11.761884689331055, "global_step": 298811, "epoch": 1778} {"train_loss": -11.840901374816895, "global_step": 298812, "epoch": 1778} {"train_loss": -11.77244758605957, "global_step": 298813, "epoch": 1778} {"train_loss": -11.718022346496582, "global_step": 298814, "epoch": 1778} {"train_loss": -12.196435928344727, "global_step": 298815, "epoch": 1778} {"train_loss": -11.898273468017578, "global_step": 298816, "epoch": 1778} {"train_loss": -12.04191780090332, "global_step": 298817, "epoch": 1778} {"train_loss": -11.989827156066895, "global_step": 298818, "epoch": 1778} {"train_loss": -12.087757110595703, "global_step": 298819, "epoch": 1778} {"train_loss": -12.231241226196289, "global_step": 298820, "epoch": 1778} {"train_loss": -12.356124877929688, "global_step": 298821, "epoch": 1778} {"train_loss": -12.16316032409668, "global_step": 298822, "epoch": 1778} {"train_loss": -12.455997467041016, "global_step": 298823, "epoch": 1778} {"train_loss": -11.947917938232422, "global_step": 298824, "epoch": 1778} {"train_loss": -12.169461250305176, "global_step": 298825, "epoch": 1778} {"train_loss": -12.45698356628418, "global_step": 298826, "epoch": 1778} {"train_loss": -12.371173858642578, "global_step": 298827, "epoch": 1778} {"train_loss": -12.4683837890625, "global_step": 298828, "epoch": 1778} {"train_loss": -12.31389045715332, "global_step": 298829, "epoch": 1778} {"train_loss": -11.956223487854004, "global_step": 298830, "epoch": 1778} {"train_loss": -12.24316120147705, "global_step": 298831, "epoch": 1778} {"train_loss": -12.247247695922852, "global_step": 298832, "epoch": 1778} {"train_loss": -12.25472640991211, "global_step": 298833, "epoch": 1778} {"train_loss": -12.299476623535156, "global_step": 298834, "epoch": 1778} {"train_loss": -12.202272415161133, "global_step": 298835, "epoch": 1778} {"train_loss": -12.559852600097656, "global_step": 298836, "epoch": 1778} {"train_loss": -12.466785430908203, "global_step": 298837, "epoch": 1778} {"train_loss": -12.503707885742188, "global_step": 298838, "epoch": 1778} {"train_loss": -12.422567367553711, "global_step": 298839, "epoch": 1778} {"train_loss": -12.187199592590332, "global_step": 298840, "epoch": 1778} {"train_loss": -12.446292877197266, "global_step": 298841, "epoch": 1778} {"train_loss": -12.361766815185547, "global_step": 298842, "epoch": 1778} {"train_loss": -12.304342269897461, "global_step": 298843, "epoch": 1778} {"train_loss": -12.174072265625, "global_step": 298844, "epoch": 1778} {"train_loss": -12.474973678588867, "global_step": 298845, "epoch": 1778} {"train_loss": -12.2940673828125, "global_step": 298846, "epoch": 1778} {"train_loss": -12.196735382080078, "global_step": 298847, "epoch": 1778} {"train_loss": -12.175745964050293, "global_step": 298848, "epoch": 1778} {"train_loss": -11.74572467803955, "global_step": 298849, "epoch": 1778} {"train_loss": -12.10891342163086, "global_step": 298850, "epoch": 1778} {"train_loss": -12.121686935424805, "global_step": 298851, "epoch": 1778} {"train_loss": -12.03493881225586, "global_step": 298852, "epoch": 1778} {"train_loss": -11.881149291992188, "global_step": 298853, "epoch": 1778} {"train_loss": -12.524084091186523, "global_step": 298854, "epoch": 1778} {"train_loss": -12.237905502319336, "global_step": 298855, "epoch": 1778} {"train_loss": -12.102764129638672, "global_step": 298856, "epoch": 1778} {"train_loss": -12.191487312316895, "global_step": 298857, "epoch": 1778} {"train_loss": -12.040216445922852, "global_step": 298858, "epoch": 1778} {"train_loss": -12.517623901367188, "global_step": 298859, "epoch": 1778} {"train_loss": -12.134725570678711, "global_step": 298860, "epoch": 1778} {"train_loss": -12.372262954711914, "global_step": 298861, "epoch": 1778} {"train_loss": -12.23597240447998, "global_step": 298862, "epoch": 1778} {"train_loss": -12.111974716186523, "global_step": 298863, "epoch": 1778} {"train_loss": -12.169133186340332, "global_step": 298864, "epoch": 1778} {"train_loss": -12.571418762207031, "global_step": 298865, "epoch": 1778} {"train_loss": -12.145149230957031, "global_step": 298866, "epoch": 1778} {"train_loss": -12.37747859954834, "global_step": 298867, "epoch": 1778} {"train_loss": -12.38875961303711, "global_step": 298868, "epoch": 1778} {"train_loss": -11.780391693115234, "global_step": 298869, "epoch": 1778} {"train_loss": -11.619955062866211, "global_step": 298870, "epoch": 1778} {"train_loss": -11.789621540478297, "global_step": 298871, "epoch": 1778, "val_loss": 281430.3125} {"train_loss": -12.195713996887207, "global_step": 298872, "epoch": 1779} {"train_loss": -12.316499710083008, "global_step": 298873, "epoch": 1779} {"train_loss": -12.028417587280273, "global_step": 298874, "epoch": 1779} {"train_loss": -12.321172714233398, "global_step": 298875, "epoch": 1779} {"train_loss": -12.260730743408203, "global_step": 298876, "epoch": 1779} {"train_loss": -12.278343200683594, "global_step": 298877, "epoch": 1779} {"train_loss": -11.736989974975586, "global_step": 298878, "epoch": 1779} {"train_loss": -12.343571662902832, "global_step": 298879, "epoch": 1779} {"train_loss": -11.70711898803711, "global_step": 298880, "epoch": 1779} {"train_loss": -10.372762680053711, "global_step": 298881, "epoch": 1779} {"train_loss": -11.54608154296875, "global_step": 298882, "epoch": 1779} {"train_loss": -11.732734680175781, "global_step": 298883, "epoch": 1779} {"train_loss": -11.968695640563965, "global_step": 298884, "epoch": 1779} {"train_loss": -11.795272827148438, "global_step": 298885, "epoch": 1779} {"train_loss": -11.203222274780273, "global_step": 298886, "epoch": 1779} {"train_loss": -11.511482238769531, "global_step": 298887, "epoch": 1779} {"train_loss": -12.020795822143555, "global_step": 298888, "epoch": 1779} {"train_loss": -12.257987976074219, "global_step": 298889, "epoch": 1779} {"train_loss": -12.230828285217285, "global_step": 298890, "epoch": 1779} {"train_loss": -11.569921493530273, "global_step": 298891, "epoch": 1779} {"train_loss": -11.776050567626953, "global_step": 298892, "epoch": 1779} {"train_loss": -11.958988189697266, "global_step": 298893, "epoch": 1779} {"train_loss": -12.200582504272461, "global_step": 298894, "epoch": 1779} {"train_loss": -10.799019813537598, "global_step": 298895, "epoch": 1779} {"train_loss": -11.538322448730469, "global_step": 298896, "epoch": 1779} {"train_loss": -11.878368377685547, "global_step": 298897, "epoch": 1779} {"train_loss": -11.098467826843262, "global_step": 298898, "epoch": 1779} {"train_loss": -11.488285064697266, "global_step": 298899, "epoch": 1779} {"train_loss": -11.854375839233398, "global_step": 298900, "epoch": 1779} {"train_loss": -12.272255897521973, "global_step": 298901, "epoch": 1779} {"train_loss": -11.624274253845215, "global_step": 298902, "epoch": 1779} {"train_loss": -12.035815238952637, "global_step": 298903, "epoch": 1779} {"train_loss": -11.506942749023438, "global_step": 298904, "epoch": 1779} {"train_loss": -12.350387573242188, "global_step": 298905, "epoch": 1779} {"train_loss": -11.884849548339844, "global_step": 298906, "epoch": 1779} {"train_loss": -11.846975326538086, "global_step": 298907, "epoch": 1779} {"train_loss": -12.02915096282959, "global_step": 298908, "epoch": 1779} {"train_loss": -11.746833801269531, "global_step": 298909, "epoch": 1779} {"train_loss": -12.01019287109375, "global_step": 298910, "epoch": 1779} {"train_loss": -11.69810676574707, "global_step": 298911, "epoch": 1779} {"train_loss": -11.521537780761719, "global_step": 298912, "epoch": 1779} {"train_loss": -11.570770263671875, "global_step": 298913, "epoch": 1779} {"train_loss": -11.933229446411133, "global_step": 298914, "epoch": 1779} {"train_loss": -11.762055397033691, "global_step": 298915, "epoch": 1779} {"train_loss": -11.823371887207031, "global_step": 298916, "epoch": 1779} {"train_loss": -11.891654014587402, "global_step": 298917, "epoch": 1779} {"train_loss": -12.140626907348633, "global_step": 298918, "epoch": 1779} {"train_loss": -11.837531089782715, "global_step": 298919, "epoch": 1779} {"train_loss": -11.880577087402344, "global_step": 298920, "epoch": 1779} {"train_loss": -11.269750595092773, "global_step": 298921, "epoch": 1779} {"train_loss": -12.163715362548828, "global_step": 298922, "epoch": 1779} {"train_loss": -11.908269882202148, "global_step": 298923, "epoch": 1779} {"train_loss": -11.640645027160645, "global_step": 298924, "epoch": 1779} {"train_loss": -12.149085998535156, "global_step": 298925, "epoch": 1779} {"train_loss": -11.605730056762695, "global_step": 298926, "epoch": 1779} {"train_loss": -11.015419006347656, "global_step": 298927, "epoch": 1779} {"train_loss": -12.046442031860352, "global_step": 298928, "epoch": 1779} {"train_loss": -10.691010475158691, "global_step": 298929, "epoch": 1779} {"train_loss": -10.842597961425781, "global_step": 298930, "epoch": 1779} {"train_loss": -11.768793106079102, "global_step": 298931, "epoch": 1779} {"train_loss": -9.235871315002441, "global_step": 298932, "epoch": 1779} {"train_loss": -11.191370010375977, "global_step": 298933, "epoch": 1779} {"train_loss": -10.942825317382812, "global_step": 298934, "epoch": 1779} {"train_loss": -9.80615234375, "global_step": 298935, "epoch": 1779} {"train_loss": -11.820816993713379, "global_step": 298936, "epoch": 1779} {"train_loss": -9.408193588256836, "global_step": 298937, "epoch": 1779} {"train_loss": -11.821170806884766, "global_step": 298938, "epoch": 1779} {"train_loss": -9.929754257202148, "global_step": 298939, "epoch": 1779} {"train_loss": -10.919805526733398, "global_step": 298940, "epoch": 1779} {"train_loss": -10.202033996582031, "global_step": 298941, "epoch": 1779} {"train_loss": -11.08713150024414, "global_step": 298942, "epoch": 1779} {"train_loss": -10.353673934936523, "global_step": 298943, "epoch": 1779} {"train_loss": -10.292470932006836, "global_step": 298944, "epoch": 1779} {"train_loss": -9.906240463256836, "global_step": 298945, "epoch": 1779} {"train_loss": -11.114166259765625, "global_step": 298946, "epoch": 1779} {"train_loss": -10.063356399536133, "global_step": 298947, "epoch": 1779} {"train_loss": -10.03782844543457, "global_step": 298948, "epoch": 1779} {"train_loss": -8.94642448425293, "global_step": 298949, "epoch": 1779} {"train_loss": -10.93821907043457, "global_step": 298950, "epoch": 1779} {"train_loss": -9.910261154174805, "global_step": 298951, "epoch": 1779} {"train_loss": -11.207395553588867, "global_step": 298952, "epoch": 1779} {"train_loss": -10.463895797729492, "global_step": 298953, "epoch": 1779} {"train_loss": -11.534499168395996, "global_step": 298954, "epoch": 1779} {"train_loss": -10.779027938842773, "global_step": 298955, "epoch": 1779} {"train_loss": -10.943903923034668, "global_step": 298956, "epoch": 1779} {"train_loss": -11.291828155517578, "global_step": 298957, "epoch": 1779} {"train_loss": -11.1038818359375, "global_step": 298958, "epoch": 1779} {"train_loss": -11.772582054138184, "global_step": 298959, "epoch": 1779} {"train_loss": -11.598074913024902, "global_step": 298960, "epoch": 1779} {"train_loss": -11.545312881469727, "global_step": 298961, "epoch": 1779} {"train_loss": -11.84193229675293, "global_step": 298962, "epoch": 1779} {"train_loss": -11.40614128112793, "global_step": 298963, "epoch": 1779} {"train_loss": -11.828248977661133, "global_step": 298964, "epoch": 1779} {"train_loss": -11.501340866088867, "global_step": 298965, "epoch": 1779} {"train_loss": -11.64277458190918, "global_step": 298966, "epoch": 1779} {"train_loss": -11.283293724060059, "global_step": 298967, "epoch": 1779} {"train_loss": -11.96389389038086, "global_step": 298968, "epoch": 1779} {"train_loss": -11.737348556518555, "global_step": 298969, "epoch": 1779} {"train_loss": -11.868431091308594, "global_step": 298970, "epoch": 1779} {"train_loss": -11.900487899780273, "global_step": 298971, "epoch": 1779} {"train_loss": -11.76596736907959, "global_step": 298972, "epoch": 1779} {"train_loss": -12.00268840789795, "global_step": 298973, "epoch": 1779} {"train_loss": -11.939757347106934, "global_step": 298974, "epoch": 1779} {"train_loss": -11.992269515991211, "global_step": 298975, "epoch": 1779} {"train_loss": -11.908798217773438, "global_step": 298976, "epoch": 1779} {"train_loss": -11.915319442749023, "global_step": 298977, "epoch": 1779} {"train_loss": -11.846959114074707, "global_step": 298978, "epoch": 1779} {"train_loss": -11.831096649169922, "global_step": 298979, "epoch": 1779} {"train_loss": -11.962800979614258, "global_step": 298980, "epoch": 1779} {"train_loss": -12.130630493164062, "global_step": 298981, "epoch": 1779} {"train_loss": -11.934322357177734, "global_step": 298982, "epoch": 1779} {"train_loss": -12.107772827148438, "global_step": 298983, "epoch": 1779} {"train_loss": -11.959518432617188, "global_step": 298984, "epoch": 1779} {"train_loss": -12.068798065185547, "global_step": 298985, "epoch": 1779} {"train_loss": -12.279034614562988, "global_step": 298986, "epoch": 1779} {"train_loss": -12.002089500427246, "global_step": 298987, "epoch": 1779} {"train_loss": -12.100486755371094, "global_step": 298988, "epoch": 1779} {"train_loss": -12.261554718017578, "global_step": 298989, "epoch": 1779} {"train_loss": -12.212368965148926, "global_step": 298990, "epoch": 1779} {"train_loss": -12.19939136505127, "global_step": 298991, "epoch": 1779} {"train_loss": -12.29629898071289, "global_step": 298992, "epoch": 1779} {"train_loss": -12.286432266235352, "global_step": 298993, "epoch": 1779} {"train_loss": -12.355415344238281, "global_step": 298994, "epoch": 1779} {"train_loss": -12.256518363952637, "global_step": 298995, "epoch": 1779} {"train_loss": -12.505350112915039, "global_step": 298996, "epoch": 1779} {"train_loss": -12.302444458007812, "global_step": 298997, "epoch": 1779} {"train_loss": -12.292618751525879, "global_step": 298998, "epoch": 1779} {"train_loss": -12.402965545654297, "global_step": 298999, "epoch": 1779} {"train_loss": -12.388138771057129, "global_step": 299000, "epoch": 1779} {"train_loss": -12.034486770629883, "global_step": 299001, "epoch": 1779} {"train_loss": -12.241000175476074, "global_step": 299002, "epoch": 1779} {"train_loss": -12.216659545898438, "global_step": 299003, "epoch": 1779} {"train_loss": -12.185356140136719, "global_step": 299004, "epoch": 1779} {"train_loss": -12.41977596282959, "global_step": 299005, "epoch": 1779} {"train_loss": -12.246700286865234, "global_step": 299006, "epoch": 1779} {"train_loss": -12.401827812194824, "global_step": 299007, "epoch": 1779} {"train_loss": -12.079421997070312, "global_step": 299008, "epoch": 1779} {"train_loss": -12.287313461303711, "global_step": 299009, "epoch": 1779} {"train_loss": -12.280364990234375, "global_step": 299010, "epoch": 1779} {"train_loss": -12.362689018249512, "global_step": 299011, "epoch": 1779} {"train_loss": -12.282028198242188, "global_step": 299012, "epoch": 1779} {"train_loss": -12.23707389831543, "global_step": 299013, "epoch": 1779} {"train_loss": -12.297918319702148, "global_step": 299014, "epoch": 1779} {"train_loss": -12.095605850219727, "global_step": 299015, "epoch": 1779} {"train_loss": -11.975318908691406, "global_step": 299016, "epoch": 1779} {"train_loss": -12.306156158447266, "global_step": 299017, "epoch": 1779} {"train_loss": -12.350198745727539, "global_step": 299018, "epoch": 1779} {"train_loss": -12.063108444213867, "global_step": 299019, "epoch": 1779} {"train_loss": -12.404312133789062, "global_step": 299020, "epoch": 1779} {"train_loss": -12.281684875488281, "global_step": 299021, "epoch": 1779} {"train_loss": -12.4339017868042, "global_step": 299022, "epoch": 1779} {"train_loss": -12.509346008300781, "global_step": 299023, "epoch": 1779} {"train_loss": -12.356056213378906, "global_step": 299024, "epoch": 1779} {"train_loss": -12.441377639770508, "global_step": 299025, "epoch": 1779} {"train_loss": -12.290716171264648, "global_step": 299026, "epoch": 1779} {"train_loss": -12.333351135253906, "global_step": 299027, "epoch": 1779} {"train_loss": -12.442960739135742, "global_step": 299028, "epoch": 1779} {"train_loss": -12.59422492980957, "global_step": 299029, "epoch": 1779} {"train_loss": -12.113700866699219, "global_step": 299030, "epoch": 1779} {"train_loss": -12.574518203735352, "global_step": 299031, "epoch": 1779} {"train_loss": -12.153532028198242, "global_step": 299032, "epoch": 1779} {"train_loss": -12.105705261230469, "global_step": 299033, "epoch": 1779} {"train_loss": -12.293046951293945, "global_step": 299034, "epoch": 1779} {"train_loss": -11.908520698547363, "global_step": 299035, "epoch": 1779} {"train_loss": -12.222526550292969, "global_step": 299036, "epoch": 1779} {"train_loss": -12.305329322814941, "global_step": 299037, "epoch": 1779} {"train_loss": -11.968807220458984, "global_step": 299038, "epoch": 1779} {"train_loss": -11.746562287920998, "global_step": 299039, "epoch": 1779, "val_loss": 281787.25} {"train_loss": -12.2125244140625, "global_step": 299040, "epoch": 1780} {"train_loss": -11.621635437011719, "global_step": 299041, "epoch": 1780} {"train_loss": -11.112284660339355, "global_step": 299042, "epoch": 1780} {"train_loss": -12.026363372802734, "global_step": 299043, "epoch": 1780} {"train_loss": -11.421773910522461, "global_step": 299044, "epoch": 1780} {"train_loss": -11.459126472473145, "global_step": 299045, "epoch": 1780} {"train_loss": -11.685678482055664, "global_step": 299046, "epoch": 1780} {"train_loss": -11.900833129882812, "global_step": 299047, "epoch": 1780} {"train_loss": -11.689776420593262, "global_step": 299048, "epoch": 1780} {"train_loss": -11.851041793823242, "global_step": 299049, "epoch": 1780} {"train_loss": -11.77889633178711, "global_step": 299050, "epoch": 1780} {"train_loss": -10.378411293029785, "global_step": 299051, "epoch": 1780} {"train_loss": -11.876848220825195, "global_step": 299052, "epoch": 1780} {"train_loss": -9.886821746826172, "global_step": 299053, "epoch": 1780} {"train_loss": -10.551566123962402, "global_step": 299054, "epoch": 1780} {"train_loss": -10.735187530517578, "global_step": 299055, "epoch": 1780} {"train_loss": -9.272313117980957, "global_step": 299056, "epoch": 1780} {"train_loss": -7.244105339050293, "global_step": 299057, "epoch": 1780} {"train_loss": -8.768799781799316, "global_step": 299058, "epoch": 1780} {"train_loss": -8.152007102966309, "global_step": 299059, "epoch": 1780} {"train_loss": -9.500938415527344, "global_step": 299060, "epoch": 1780} {"train_loss": -10.173609733581543, "global_step": 299061, "epoch": 1780} {"train_loss": -9.574787139892578, "global_step": 299062, "epoch": 1780} {"train_loss": -11.37100601196289, "global_step": 299063, "epoch": 1780} {"train_loss": -10.330232620239258, "global_step": 299064, "epoch": 1780} {"train_loss": -11.099868774414062, "global_step": 299065, "epoch": 1780} {"train_loss": -10.845341682434082, "global_step": 299066, "epoch": 1780} {"train_loss": -11.037412643432617, "global_step": 299067, "epoch": 1780} {"train_loss": -11.037357330322266, "global_step": 299068, "epoch": 1780} {"train_loss": -10.732386589050293, "global_step": 299069, "epoch": 1780} {"train_loss": -11.196817398071289, "global_step": 299070, "epoch": 1780} {"train_loss": -10.577702522277832, "global_step": 299071, "epoch": 1780} {"train_loss": -11.675628662109375, "global_step": 299072, "epoch": 1780} {"train_loss": -11.471428871154785, "global_step": 299073, "epoch": 1780} {"train_loss": -10.65422248840332, "global_step": 299074, "epoch": 1780} {"train_loss": -11.366048812866211, "global_step": 299075, "epoch": 1780} {"train_loss": -11.21064281463623, "global_step": 299076, "epoch": 1780} {"train_loss": -11.781583786010742, "global_step": 299077, "epoch": 1780} {"train_loss": -11.489925384521484, "global_step": 299078, "epoch": 1780} {"train_loss": -11.453642845153809, "global_step": 299079, "epoch": 1780} {"train_loss": -11.6668701171875, "global_step": 299080, "epoch": 1780} {"train_loss": -11.431001663208008, "global_step": 299081, "epoch": 1780} {"train_loss": -10.594045639038086, "global_step": 299082, "epoch": 1780} {"train_loss": -11.552431106567383, "global_step": 299083, "epoch": 1780} {"train_loss": -10.402376174926758, "global_step": 299084, "epoch": 1780} {"train_loss": -11.352436065673828, "global_step": 299085, "epoch": 1780} {"train_loss": -11.131485939025879, "global_step": 299086, "epoch": 1780} {"train_loss": -11.525673866271973, "global_step": 299087, "epoch": 1780} {"train_loss": -11.197781562805176, "global_step": 299088, "epoch": 1780} {"train_loss": -11.335708618164062, "global_step": 299089, "epoch": 1780} {"train_loss": -11.17409896850586, "global_step": 299090, "epoch": 1780} {"train_loss": -11.409870147705078, "global_step": 299091, "epoch": 1780} {"train_loss": -10.667074203491211, "global_step": 299092, "epoch": 1780} {"train_loss": -11.246711730957031, "global_step": 299093, "epoch": 1780} {"train_loss": -10.412243843078613, "global_step": 299094, "epoch": 1780} {"train_loss": -11.634078979492188, "global_step": 299095, "epoch": 1780} {"train_loss": -10.529475212097168, "global_step": 299096, "epoch": 1780} {"train_loss": -11.372400283813477, "global_step": 299097, "epoch": 1780} {"train_loss": -11.509052276611328, "global_step": 299098, "epoch": 1780} {"train_loss": -11.456426620483398, "global_step": 299099, "epoch": 1780} {"train_loss": -11.888406753540039, "global_step": 299100, "epoch": 1780} {"train_loss": -11.854262351989746, "global_step": 299101, "epoch": 1780} {"train_loss": -11.846474647521973, "global_step": 299102, "epoch": 1780} {"train_loss": -11.744422912597656, "global_step": 299103, "epoch": 1780} {"train_loss": -11.524818420410156, "global_step": 299104, "epoch": 1780} {"train_loss": -11.646160125732422, "global_step": 299105, "epoch": 1780} {"train_loss": -11.640291213989258, "global_step": 299106, "epoch": 1780} {"train_loss": -11.438796997070312, "global_step": 299107, "epoch": 1780} {"train_loss": -12.031494140625, "global_step": 299108, "epoch": 1780} {"train_loss": -11.530023574829102, "global_step": 299109, "epoch": 1780} {"train_loss": -11.687837600708008, "global_step": 299110, "epoch": 1780} {"train_loss": -12.063127517700195, "global_step": 299111, "epoch": 1780} {"train_loss": -11.37507438659668, "global_step": 299112, "epoch": 1780} {"train_loss": -12.14875316619873, "global_step": 299113, "epoch": 1780} {"train_loss": -11.586747169494629, "global_step": 299114, "epoch": 1780} {"train_loss": -11.433401107788086, "global_step": 299115, "epoch": 1780} {"train_loss": -12.221437454223633, "global_step": 299116, "epoch": 1780} {"train_loss": -11.88585090637207, "global_step": 299117, "epoch": 1780} {"train_loss": -11.675603866577148, "global_step": 299118, "epoch": 1780} {"train_loss": -11.939289093017578, "global_step": 299119, "epoch": 1780} {"train_loss": -11.303565979003906, "global_step": 299120, "epoch": 1780} {"train_loss": -11.860222816467285, "global_step": 299121, "epoch": 1780} {"train_loss": -11.65511417388916, "global_step": 299122, "epoch": 1780} {"train_loss": -11.893531799316406, "global_step": 299123, "epoch": 1780} {"train_loss": -12.26668930053711, "global_step": 299124, "epoch": 1780} {"train_loss": -11.815254211425781, "global_step": 299125, "epoch": 1780} {"train_loss": -11.911943435668945, "global_step": 299126, "epoch": 1780} {"train_loss": -12.141321182250977, "global_step": 299127, "epoch": 1780} {"train_loss": -11.687104225158691, "global_step": 299128, "epoch": 1780} {"train_loss": -12.21922492980957, "global_step": 299129, "epoch": 1780} {"train_loss": -12.157486915588379, "global_step": 299130, "epoch": 1780} {"train_loss": -11.999591827392578, "global_step": 299131, "epoch": 1780} {"train_loss": -12.237374305725098, "global_step": 299132, "epoch": 1780} {"train_loss": -11.867900848388672, "global_step": 299133, "epoch": 1780} {"train_loss": -12.033717155456543, "global_step": 299134, "epoch": 1780} {"train_loss": -12.136411666870117, "global_step": 299135, "epoch": 1780} {"train_loss": -11.622613906860352, "global_step": 299136, "epoch": 1780} {"train_loss": -12.209449768066406, "global_step": 299137, "epoch": 1780} {"train_loss": -12.13296890258789, "global_step": 299138, "epoch": 1780} {"train_loss": -12.263143539428711, "global_step": 299139, "epoch": 1780} {"train_loss": -12.112083435058594, "global_step": 299140, "epoch": 1780} {"train_loss": -12.165082931518555, "global_step": 299141, "epoch": 1780} {"train_loss": -12.026522636413574, "global_step": 299142, "epoch": 1780} {"train_loss": -12.106134414672852, "global_step": 299143, "epoch": 1780} {"train_loss": -11.965721130371094, "global_step": 299144, "epoch": 1780} {"train_loss": -12.324005126953125, "global_step": 299145, "epoch": 1780} {"train_loss": -12.265148162841797, "global_step": 299146, "epoch": 1780} {"train_loss": -11.834810256958008, "global_step": 299147, "epoch": 1780} {"train_loss": -12.006349563598633, "global_step": 299148, "epoch": 1780} {"train_loss": -12.17125129699707, "global_step": 299149, "epoch": 1780} {"train_loss": -11.899706840515137, "global_step": 299150, "epoch": 1780} {"train_loss": -11.552652359008789, "global_step": 299151, "epoch": 1780} {"train_loss": -11.753281593322754, "global_step": 299152, "epoch": 1780} {"train_loss": -11.330667495727539, "global_step": 299153, "epoch": 1780} {"train_loss": -9.206789016723633, "global_step": 299154, "epoch": 1780} {"train_loss": -11.695746421813965, "global_step": 299155, "epoch": 1780} {"train_loss": -11.075250625610352, "global_step": 299156, "epoch": 1780} {"train_loss": -11.268186569213867, "global_step": 299157, "epoch": 1780} {"train_loss": -11.569490432739258, "global_step": 299158, "epoch": 1780} {"train_loss": -10.59377384185791, "global_step": 299159, "epoch": 1780} {"train_loss": -10.50169563293457, "global_step": 299160, "epoch": 1780} {"train_loss": -6.979884147644043, "global_step": 299161, "epoch": 1780} {"train_loss": -8.356096267700195, "global_step": 299162, "epoch": 1780} {"train_loss": -7.830360412597656, "global_step": 299163, "epoch": 1780} {"train_loss": -7.356083869934082, "global_step": 299164, "epoch": 1780} {"train_loss": -8.627635955810547, "global_step": 299165, "epoch": 1780} {"train_loss": -10.266986846923828, "global_step": 299166, "epoch": 1780} {"train_loss": -7.93755578994751, "global_step": 299167, "epoch": 1780} {"train_loss": -8.815038681030273, "global_step": 299168, "epoch": 1780} {"train_loss": -9.553348541259766, "global_step": 299169, "epoch": 1780} {"train_loss": -10.89327621459961, "global_step": 299170, "epoch": 1780} {"train_loss": -10.147512435913086, "global_step": 299171, "epoch": 1780} {"train_loss": -10.145695686340332, "global_step": 299172, "epoch": 1780} {"train_loss": -11.281692504882812, "global_step": 299173, "epoch": 1780} {"train_loss": -10.745819091796875, "global_step": 299174, "epoch": 1780} {"train_loss": -10.635812759399414, "global_step": 299175, "epoch": 1780} {"train_loss": -10.618608474731445, "global_step": 299176, "epoch": 1780} {"train_loss": -9.830495834350586, "global_step": 299177, "epoch": 1780} {"train_loss": -10.231019020080566, "global_step": 299178, "epoch": 1780} {"train_loss": -9.645364761352539, "global_step": 299179, "epoch": 1780} {"train_loss": -11.572282791137695, "global_step": 299180, "epoch": 1780} {"train_loss": -10.482831954956055, "global_step": 299181, "epoch": 1780} {"train_loss": -10.259617805480957, "global_step": 299182, "epoch": 1780} {"train_loss": -11.306159019470215, "global_step": 299183, "epoch": 1780} {"train_loss": -9.347003936767578, "global_step": 299184, "epoch": 1780} {"train_loss": -10.999176979064941, "global_step": 299185, "epoch": 1780} {"train_loss": -11.324357986450195, "global_step": 299186, "epoch": 1780} {"train_loss": -10.712884902954102, "global_step": 299187, "epoch": 1780} {"train_loss": -10.987077713012695, "global_step": 299188, "epoch": 1780} {"train_loss": -11.088066101074219, "global_step": 299189, "epoch": 1780} {"train_loss": -10.413766860961914, "global_step": 299190, "epoch": 1780} {"train_loss": -11.224725723266602, "global_step": 299191, "epoch": 1780} {"train_loss": -11.105019569396973, "global_step": 299192, "epoch": 1780} {"train_loss": -10.831153869628906, "global_step": 299193, "epoch": 1780} {"train_loss": -11.51310920715332, "global_step": 299194, "epoch": 1780} {"train_loss": -11.270854949951172, "global_step": 299195, "epoch": 1780} {"train_loss": -11.609983444213867, "global_step": 299196, "epoch": 1780} {"train_loss": -11.49952507019043, "global_step": 299197, "epoch": 1780} {"train_loss": -11.558863639831543, "global_step": 299198, "epoch": 1780} {"train_loss": -11.529678344726562, "global_step": 299199, "epoch": 1780} {"train_loss": -11.47337532043457, "global_step": 299200, "epoch": 1780} {"train_loss": -11.649479866027832, "global_step": 299201, "epoch": 1780} {"train_loss": -11.642736434936523, "global_step": 299202, "epoch": 1780} {"train_loss": -11.744294166564941, "global_step": 299203, "epoch": 1780} {"train_loss": -11.567626953125, "global_step": 299204, "epoch": 1780} {"train_loss": -11.684696197509766, "global_step": 299205, "epoch": 1780} {"train_loss": -11.526659965515137, "global_step": 299206, "epoch": 1780} {"train_loss": -11.126984655857086, "global_step": 299207, "epoch": 1780, "val_loss": 268304.78125, "train_action_mse_error": 3.4874017238616943} {"train_loss": -11.678314208984375, "global_step": 299208, "epoch": 1781} {"train_loss": -11.901252746582031, "global_step": 299209, "epoch": 1781} {"train_loss": -11.869237899780273, "global_step": 299210, "epoch": 1781} {"train_loss": -11.953913688659668, "global_step": 299211, "epoch": 1781} {"train_loss": -11.957342147827148, "global_step": 299212, "epoch": 1781} {"train_loss": -11.919758796691895, "global_step": 299213, "epoch": 1781} {"train_loss": -12.066771507263184, "global_step": 299214, "epoch": 1781} {"train_loss": -12.046299934387207, "global_step": 299215, "epoch": 1781} {"train_loss": -11.772354125976562, "global_step": 299216, "epoch": 1781} {"train_loss": -11.989994049072266, "global_step": 299217, "epoch": 1781} {"train_loss": -12.088268280029297, "global_step": 299218, "epoch": 1781} {"train_loss": -11.902800559997559, "global_step": 299219, "epoch": 1781} {"train_loss": -12.024734497070312, "global_step": 299220, "epoch": 1781} {"train_loss": -11.871377944946289, "global_step": 299221, "epoch": 1781} {"train_loss": -12.109375953674316, "global_step": 299222, "epoch": 1781} {"train_loss": -12.187300682067871, "global_step": 299223, "epoch": 1781} {"train_loss": -11.885851860046387, "global_step": 299224, "epoch": 1781} {"train_loss": -12.071191787719727, "global_step": 299225, "epoch": 1781} {"train_loss": -11.935583114624023, "global_step": 299226, "epoch": 1781} {"train_loss": -11.902482986450195, "global_step": 299227, "epoch": 1781} {"train_loss": -12.029909133911133, "global_step": 299228, "epoch": 1781} {"train_loss": -11.987747192382812, "global_step": 299229, "epoch": 1781} {"train_loss": -11.921309471130371, "global_step": 299230, "epoch": 1781} {"train_loss": -12.158295631408691, "global_step": 299231, "epoch": 1781} {"train_loss": -11.954509735107422, "global_step": 299232, "epoch": 1781} {"train_loss": -11.840799331665039, "global_step": 299233, "epoch": 1781} {"train_loss": -12.040404319763184, "global_step": 299234, "epoch": 1781} {"train_loss": -11.95262336730957, "global_step": 299235, "epoch": 1781} {"train_loss": -11.96998405456543, "global_step": 299236, "epoch": 1781} {"train_loss": -11.94399642944336, "global_step": 299237, "epoch": 1781} {"train_loss": -12.134589195251465, "global_step": 299238, "epoch": 1781} {"train_loss": -12.065047264099121, "global_step": 299239, "epoch": 1781} {"train_loss": -12.150566101074219, "global_step": 299240, "epoch": 1781} {"train_loss": -12.213653564453125, "global_step": 299241, "epoch": 1781} {"train_loss": -12.354979515075684, "global_step": 299242, "epoch": 1781} {"train_loss": -11.924982070922852, "global_step": 299243, "epoch": 1781} {"train_loss": -11.945801734924316, "global_step": 299244, "epoch": 1781} {"train_loss": -12.115180969238281, "global_step": 299245, "epoch": 1781} {"train_loss": -11.944257736206055, "global_step": 299246, "epoch": 1781} {"train_loss": -12.186359405517578, "global_step": 299247, "epoch": 1781} {"train_loss": -12.160433769226074, "global_step": 299248, "epoch": 1781} {"train_loss": -12.369287490844727, "global_step": 299249, "epoch": 1781} {"train_loss": -12.14044189453125, "global_step": 299250, "epoch": 1781} {"train_loss": -12.287400245666504, "global_step": 299251, "epoch": 1781} {"train_loss": -12.165979385375977, "global_step": 299252, "epoch": 1781} {"train_loss": -12.17690658569336, "global_step": 299253, "epoch": 1781} {"train_loss": -12.2474365234375, "global_step": 299254, "epoch": 1781} {"train_loss": -12.17262077331543, "global_step": 299255, "epoch": 1781} {"train_loss": -12.2899808883667, "global_step": 299256, "epoch": 1781} {"train_loss": -12.227568626403809, "global_step": 299257, "epoch": 1781} {"train_loss": -12.024737358093262, "global_step": 299258, "epoch": 1781} {"train_loss": -12.18553352355957, "global_step": 299259, "epoch": 1781} {"train_loss": -12.360157012939453, "global_step": 299260, "epoch": 1781} {"train_loss": -12.361262321472168, "global_step": 299261, "epoch": 1781} {"train_loss": -12.316813468933105, "global_step": 299262, "epoch": 1781} {"train_loss": -12.208219528198242, "global_step": 299263, "epoch": 1781} {"train_loss": -12.201814651489258, "global_step": 299264, "epoch": 1781} {"train_loss": -12.233991622924805, "global_step": 299265, "epoch": 1781} {"train_loss": -12.321320533752441, "global_step": 299266, "epoch": 1781} {"train_loss": -12.39614486694336, "global_step": 299267, "epoch": 1781} {"train_loss": -12.525299072265625, "global_step": 299268, "epoch": 1781} {"train_loss": -12.386062622070312, "global_step": 299269, "epoch": 1781} {"train_loss": -12.282997131347656, "global_step": 299270, "epoch": 1781} {"train_loss": -12.068902969360352, "global_step": 299271, "epoch": 1781} {"train_loss": -12.014686584472656, "global_step": 299272, "epoch": 1781} {"train_loss": -11.698424339294434, "global_step": 299273, "epoch": 1781} {"train_loss": -12.267511367797852, "global_step": 299274, "epoch": 1781} {"train_loss": -12.179593086242676, "global_step": 299275, "epoch": 1781} {"train_loss": -12.022953033447266, "global_step": 299276, "epoch": 1781} {"train_loss": -12.390003204345703, "global_step": 299277, "epoch": 1781} {"train_loss": -11.872455596923828, "global_step": 299278, "epoch": 1781} {"train_loss": -11.779613494873047, "global_step": 299279, "epoch": 1781} {"train_loss": -12.339700698852539, "global_step": 299280, "epoch": 1781} {"train_loss": -11.926140785217285, "global_step": 299281, "epoch": 1781} {"train_loss": -12.332908630371094, "global_step": 299282, "epoch": 1781} {"train_loss": -11.607950210571289, "global_step": 299283, "epoch": 1781} {"train_loss": -11.978643417358398, "global_step": 299284, "epoch": 1781} {"train_loss": -12.022595405578613, "global_step": 299285, "epoch": 1781} {"train_loss": -11.26891803741455, "global_step": 299286, "epoch": 1781} {"train_loss": -10.615840911865234, "global_step": 299287, "epoch": 1781} {"train_loss": -12.03605842590332, "global_step": 299288, "epoch": 1781} {"train_loss": -9.481348037719727, "global_step": 299289, "epoch": 1781} {"train_loss": -10.513967514038086, "global_step": 299290, "epoch": 1781} {"train_loss": -11.242364883422852, "global_step": 299291, "epoch": 1781} {"train_loss": -8.136700630187988, "global_step": 299292, "epoch": 1781} {"train_loss": -12.238822937011719, "global_step": 299293, "epoch": 1781} {"train_loss": -10.021942138671875, "global_step": 299294, "epoch": 1781} {"train_loss": -10.910940170288086, "global_step": 299295, "epoch": 1781} {"train_loss": -11.939512252807617, "global_step": 299296, "epoch": 1781} {"train_loss": -10.709421157836914, "global_step": 299297, "epoch": 1781} {"train_loss": -12.049243927001953, "global_step": 299298, "epoch": 1781} {"train_loss": -11.299806594848633, "global_step": 299299, "epoch": 1781} {"train_loss": -11.937347412109375, "global_step": 299300, "epoch": 1781} {"train_loss": -11.971245765686035, "global_step": 299301, "epoch": 1781} {"train_loss": -11.802569389343262, "global_step": 299302, "epoch": 1781} {"train_loss": -12.047065734863281, "global_step": 299303, "epoch": 1781} {"train_loss": -11.86854076385498, "global_step": 299304, "epoch": 1781} {"train_loss": -12.103982925415039, "global_step": 299305, "epoch": 1781} {"train_loss": -11.774885177612305, "global_step": 299306, "epoch": 1781} {"train_loss": -12.071524620056152, "global_step": 299307, "epoch": 1781} {"train_loss": -12.160687446594238, "global_step": 299308, "epoch": 1781} {"train_loss": -11.59736156463623, "global_step": 299309, "epoch": 1781} {"train_loss": -12.167216300964355, "global_step": 299310, "epoch": 1781} {"train_loss": -11.975992202758789, "global_step": 299311, "epoch": 1781} {"train_loss": -12.124054908752441, "global_step": 299312, "epoch": 1781} {"train_loss": -11.990741729736328, "global_step": 299313, "epoch": 1781} {"train_loss": -11.663747787475586, "global_step": 299314, "epoch": 1781} {"train_loss": -12.043733596801758, "global_step": 299315, "epoch": 1781} {"train_loss": -12.022722244262695, "global_step": 299316, "epoch": 1781} {"train_loss": -12.161067008972168, "global_step": 299317, "epoch": 1781} {"train_loss": -11.936346054077148, "global_step": 299318, "epoch": 1781} {"train_loss": -12.336483001708984, "global_step": 299319, "epoch": 1781} {"train_loss": -12.118274688720703, "global_step": 299320, "epoch": 1781} {"train_loss": -12.235976219177246, "global_step": 299321, "epoch": 1781} {"train_loss": -12.053220748901367, "global_step": 299322, "epoch": 1781} {"train_loss": -12.053332328796387, "global_step": 299323, "epoch": 1781} {"train_loss": -11.650447845458984, "global_step": 299324, "epoch": 1781} {"train_loss": -12.31202220916748, "global_step": 299325, "epoch": 1781} {"train_loss": -12.015897750854492, "global_step": 299326, "epoch": 1781} {"train_loss": -12.318678855895996, "global_step": 299327, "epoch": 1781} {"train_loss": -12.054561614990234, "global_step": 299328, "epoch": 1781} {"train_loss": -12.296747207641602, "global_step": 299329, "epoch": 1781} {"train_loss": -12.43006706237793, "global_step": 299330, "epoch": 1781} {"train_loss": -12.023822784423828, "global_step": 299331, "epoch": 1781} {"train_loss": -12.350873947143555, "global_step": 299332, "epoch": 1781} {"train_loss": -12.109701156616211, "global_step": 299333, "epoch": 1781} {"train_loss": -12.384939193725586, "global_step": 299334, "epoch": 1781} {"train_loss": -12.09530258178711, "global_step": 299335, "epoch": 1781} {"train_loss": -12.364421844482422, "global_step": 299336, "epoch": 1781} {"train_loss": -12.127007484436035, "global_step": 299337, "epoch": 1781} {"train_loss": -12.113216400146484, "global_step": 299338, "epoch": 1781} {"train_loss": -12.257486343383789, "global_step": 299339, "epoch": 1781} {"train_loss": -11.854933738708496, "global_step": 299340, "epoch": 1781} {"train_loss": -12.127546310424805, "global_step": 299341, "epoch": 1781} {"train_loss": -11.488621711730957, "global_step": 299342, "epoch": 1781} {"train_loss": -11.765140533447266, "global_step": 299343, "epoch": 1781} {"train_loss": -11.874536514282227, "global_step": 299344, "epoch": 1781} {"train_loss": -11.327884674072266, "global_step": 299345, "epoch": 1781} {"train_loss": -11.381112098693848, "global_step": 299346, "epoch": 1781} {"train_loss": -11.764236450195312, "global_step": 299347, "epoch": 1781} {"train_loss": -12.155961036682129, "global_step": 299348, "epoch": 1781} {"train_loss": -11.628823280334473, "global_step": 299349, "epoch": 1781} {"train_loss": -11.448195457458496, "global_step": 299350, "epoch": 1781} {"train_loss": -11.9327974319458, "global_step": 299351, "epoch": 1781} {"train_loss": -11.41201400756836, "global_step": 299352, "epoch": 1781} {"train_loss": -11.40540599822998, "global_step": 299353, "epoch": 1781} {"train_loss": -11.769426345825195, "global_step": 299354, "epoch": 1781} {"train_loss": -11.226377487182617, "global_step": 299355, "epoch": 1781} {"train_loss": -11.066385269165039, "global_step": 299356, "epoch": 1781} {"train_loss": -11.630378723144531, "global_step": 299357, "epoch": 1781} {"train_loss": -10.534448623657227, "global_step": 299358, "epoch": 1781} {"train_loss": -11.754782676696777, "global_step": 299359, "epoch": 1781} {"train_loss": -10.509428977966309, "global_step": 299360, "epoch": 1781} {"train_loss": -11.932695388793945, "global_step": 299361, "epoch": 1781} {"train_loss": -10.918111801147461, "global_step": 299362, "epoch": 1781} {"train_loss": -11.88582992553711, "global_step": 299363, "epoch": 1781} {"train_loss": -11.291004180908203, "global_step": 299364, "epoch": 1781} {"train_loss": -11.93305778503418, "global_step": 299365, "epoch": 1781} {"train_loss": -11.09177017211914, "global_step": 299366, "epoch": 1781} {"train_loss": -12.183345794677734, "global_step": 299367, "epoch": 1781} {"train_loss": -11.365476608276367, "global_step": 299368, "epoch": 1781} {"train_loss": -11.82113265991211, "global_step": 299369, "epoch": 1781} {"train_loss": -11.643394470214844, "global_step": 299370, "epoch": 1781} {"train_loss": -12.137474060058594, "global_step": 299371, "epoch": 1781} {"train_loss": -12.00783634185791, "global_step": 299372, "epoch": 1781} {"train_loss": -12.148351669311523, "global_step": 299373, "epoch": 1781} {"train_loss": -12.071914672851562, "global_step": 299374, "epoch": 1781} {"train_loss": -11.884670002119881, "global_step": 299375, "epoch": 1781, "val_loss": 276100.15625} {"train_loss": -11.983518600463867, "global_step": 299376, "epoch": 1782} {"train_loss": -11.761219024658203, "global_step": 299377, "epoch": 1782} {"train_loss": -12.168268203735352, "global_step": 299378, "epoch": 1782} {"train_loss": -12.144264221191406, "global_step": 299379, "epoch": 1782} {"train_loss": -12.154748916625977, "global_step": 299380, "epoch": 1782} {"train_loss": -12.070345878601074, "global_step": 299381, "epoch": 1782} {"train_loss": -11.970170974731445, "global_step": 299382, "epoch": 1782} {"train_loss": -12.017483711242676, "global_step": 299383, "epoch": 1782} {"train_loss": -12.044784545898438, "global_step": 299384, "epoch": 1782} {"train_loss": -12.059284210205078, "global_step": 299385, "epoch": 1782} {"train_loss": -11.946741104125977, "global_step": 299386, "epoch": 1782} {"train_loss": -12.051937103271484, "global_step": 299387, "epoch": 1782} {"train_loss": -11.85774040222168, "global_step": 299388, "epoch": 1782} {"train_loss": -12.116852760314941, "global_step": 299389, "epoch": 1782} {"train_loss": -12.10882568359375, "global_step": 299390, "epoch": 1782} {"train_loss": -11.401394844055176, "global_step": 299391, "epoch": 1782} {"train_loss": -12.091269493103027, "global_step": 299392, "epoch": 1782} {"train_loss": -11.70166015625, "global_step": 299393, "epoch": 1782} {"train_loss": -11.72336196899414, "global_step": 299394, "epoch": 1782} {"train_loss": -11.718961715698242, "global_step": 299395, "epoch": 1782} {"train_loss": -11.363094329833984, "global_step": 299396, "epoch": 1782} {"train_loss": -11.030035018920898, "global_step": 299397, "epoch": 1782} {"train_loss": -11.87364387512207, "global_step": 299398, "epoch": 1782} {"train_loss": -11.702881813049316, "global_step": 299399, "epoch": 1782} {"train_loss": -10.814785957336426, "global_step": 299400, "epoch": 1782} {"train_loss": -11.706089973449707, "global_step": 299401, "epoch": 1782} {"train_loss": -11.795321464538574, "global_step": 299402, "epoch": 1782} {"train_loss": -11.956588745117188, "global_step": 299403, "epoch": 1782} {"train_loss": -12.230134963989258, "global_step": 299404, "epoch": 1782} {"train_loss": -11.836870193481445, "global_step": 299405, "epoch": 1782} {"train_loss": -12.063648223876953, "global_step": 299406, "epoch": 1782} {"train_loss": -11.930788040161133, "global_step": 299407, "epoch": 1782} {"train_loss": -12.091085433959961, "global_step": 299408, "epoch": 1782} {"train_loss": -11.749250411987305, "global_step": 299409, "epoch": 1782} {"train_loss": -12.147391319274902, "global_step": 299410, "epoch": 1782} {"train_loss": -11.679463386535645, "global_step": 299411, "epoch": 1782} {"train_loss": -11.87806510925293, "global_step": 299412, "epoch": 1782} {"train_loss": -11.189128875732422, "global_step": 299413, "epoch": 1782} {"train_loss": -11.909018516540527, "global_step": 299414, "epoch": 1782} {"train_loss": -11.771915435791016, "global_step": 299415, "epoch": 1782} {"train_loss": -11.98634147644043, "global_step": 299416, "epoch": 1782} {"train_loss": -11.904165267944336, "global_step": 299417, "epoch": 1782} {"train_loss": -12.033675193786621, "global_step": 299418, "epoch": 1782} {"train_loss": -11.989997863769531, "global_step": 299419, "epoch": 1782} {"train_loss": -11.903230667114258, "global_step": 299420, "epoch": 1782} {"train_loss": -12.209148406982422, "global_step": 299421, "epoch": 1782} {"train_loss": -11.91160774230957, "global_step": 299422, "epoch": 1782} {"train_loss": -12.172856330871582, "global_step": 299423, "epoch": 1782} {"train_loss": -12.29778003692627, "global_step": 299424, "epoch": 1782} {"train_loss": -11.85453987121582, "global_step": 299425, "epoch": 1782} {"train_loss": -11.409856796264648, "global_step": 299426, "epoch": 1782} {"train_loss": -12.280614852905273, "global_step": 299427, "epoch": 1782} {"train_loss": -12.179718971252441, "global_step": 299428, "epoch": 1782} {"train_loss": -12.083600997924805, "global_step": 299429, "epoch": 1782} {"train_loss": -11.922247886657715, "global_step": 299430, "epoch": 1782} {"train_loss": -12.165279388427734, "global_step": 299431, "epoch": 1782} {"train_loss": -12.053693771362305, "global_step": 299432, "epoch": 1782} {"train_loss": -12.117326736450195, "global_step": 299433, "epoch": 1782} {"train_loss": -12.14150619506836, "global_step": 299434, "epoch": 1782} {"train_loss": -12.217857360839844, "global_step": 299435, "epoch": 1782} {"train_loss": -11.903518676757812, "global_step": 299436, "epoch": 1782} {"train_loss": -11.945626258850098, "global_step": 299437, "epoch": 1782} {"train_loss": -12.089799880981445, "global_step": 299438, "epoch": 1782} {"train_loss": -11.781698226928711, "global_step": 299439, "epoch": 1782} {"train_loss": -11.189483642578125, "global_step": 299440, "epoch": 1782} {"train_loss": -11.908834457397461, "global_step": 299441, "epoch": 1782} {"train_loss": -11.791559219360352, "global_step": 299442, "epoch": 1782} {"train_loss": -11.844197273254395, "global_step": 299443, "epoch": 1782} {"train_loss": -12.070241928100586, "global_step": 299444, "epoch": 1782} {"train_loss": -11.953254699707031, "global_step": 299445, "epoch": 1782} {"train_loss": -11.114767074584961, "global_step": 299446, "epoch": 1782} {"train_loss": -11.694535255432129, "global_step": 299447, "epoch": 1782} {"train_loss": -12.103955268859863, "global_step": 299448, "epoch": 1782} {"train_loss": -11.117483139038086, "global_step": 299449, "epoch": 1782} {"train_loss": -11.839213371276855, "global_step": 299450, "epoch": 1782} {"train_loss": -11.4743070602417, "global_step": 299451, "epoch": 1782} {"train_loss": -12.078862190246582, "global_step": 299452, "epoch": 1782} {"train_loss": -11.724807739257812, "global_step": 299453, "epoch": 1782} {"train_loss": -11.672388076782227, "global_step": 299454, "epoch": 1782} {"train_loss": -11.030789375305176, "global_step": 299455, "epoch": 1782} {"train_loss": -11.626402854919434, "global_step": 299456, "epoch": 1782} {"train_loss": -11.226112365722656, "global_step": 299457, "epoch": 1782} {"train_loss": -11.501456260681152, "global_step": 299458, "epoch": 1782} {"train_loss": -11.978813171386719, "global_step": 299459, "epoch": 1782} {"train_loss": -11.287747383117676, "global_step": 299460, "epoch": 1782} {"train_loss": -11.670083999633789, "global_step": 299461, "epoch": 1782} {"train_loss": -11.822660446166992, "global_step": 299462, "epoch": 1782} {"train_loss": -11.028190612792969, "global_step": 299463, "epoch": 1782} {"train_loss": -11.457111358642578, "global_step": 299464, "epoch": 1782} {"train_loss": -11.173990249633789, "global_step": 299465, "epoch": 1782} {"train_loss": -11.518936157226562, "global_step": 299466, "epoch": 1782} {"train_loss": -10.645273208618164, "global_step": 299467, "epoch": 1782} {"train_loss": -11.866174697875977, "global_step": 299468, "epoch": 1782} {"train_loss": -10.79621696472168, "global_step": 299469, "epoch": 1782} {"train_loss": -11.125069618225098, "global_step": 299470, "epoch": 1782} {"train_loss": -11.938907623291016, "global_step": 299471, "epoch": 1782} {"train_loss": -11.189264297485352, "global_step": 299472, "epoch": 1782} {"train_loss": -11.828847885131836, "global_step": 299473, "epoch": 1782} {"train_loss": -11.39578628540039, "global_step": 299474, "epoch": 1782} {"train_loss": -11.563468933105469, "global_step": 299475, "epoch": 1782} {"train_loss": -11.960060119628906, "global_step": 299476, "epoch": 1782} {"train_loss": -11.61864185333252, "global_step": 299477, "epoch": 1782} {"train_loss": -11.742201805114746, "global_step": 299478, "epoch": 1782} {"train_loss": -11.514147758483887, "global_step": 299479, "epoch": 1782} {"train_loss": -11.683263778686523, "global_step": 299480, "epoch": 1782} {"train_loss": -11.954473495483398, "global_step": 299481, "epoch": 1782} {"train_loss": -11.858636856079102, "global_step": 299482, "epoch": 1782} {"train_loss": -11.937707901000977, "global_step": 299483, "epoch": 1782} {"train_loss": -11.583897590637207, "global_step": 299484, "epoch": 1782} {"train_loss": -12.009440422058105, "global_step": 299485, "epoch": 1782} {"train_loss": -11.93441104888916, "global_step": 299486, "epoch": 1782} {"train_loss": -11.601883888244629, "global_step": 299487, "epoch": 1782} {"train_loss": -12.398782730102539, "global_step": 299488, "epoch": 1782} {"train_loss": -11.847251892089844, "global_step": 299489, "epoch": 1782} {"train_loss": -11.842998504638672, "global_step": 299490, "epoch": 1782} {"train_loss": -11.809425354003906, "global_step": 299491, "epoch": 1782} {"train_loss": -12.144510269165039, "global_step": 299492, "epoch": 1782} {"train_loss": -11.520671844482422, "global_step": 299493, "epoch": 1782} {"train_loss": -11.958480834960938, "global_step": 299494, "epoch": 1782} {"train_loss": -12.142112731933594, "global_step": 299495, "epoch": 1782} {"train_loss": -11.566291809082031, "global_step": 299496, "epoch": 1782} {"train_loss": -12.098989486694336, "global_step": 299497, "epoch": 1782} {"train_loss": -12.223021507263184, "global_step": 299498, "epoch": 1782} {"train_loss": -11.642826080322266, "global_step": 299499, "epoch": 1782} {"train_loss": -12.142549514770508, "global_step": 299500, "epoch": 1782} {"train_loss": -11.981609344482422, "global_step": 299501, "epoch": 1782} {"train_loss": -12.187080383300781, "global_step": 299502, "epoch": 1782} {"train_loss": -12.024060249328613, "global_step": 299503, "epoch": 1782} {"train_loss": -12.118246078491211, "global_step": 299504, "epoch": 1782} {"train_loss": -12.14149284362793, "global_step": 299505, "epoch": 1782} {"train_loss": -12.190462112426758, "global_step": 299506, "epoch": 1782} {"train_loss": -12.272809982299805, "global_step": 299507, "epoch": 1782} {"train_loss": -12.027241706848145, "global_step": 299508, "epoch": 1782} {"train_loss": -12.1715087890625, "global_step": 299509, "epoch": 1782} {"train_loss": -12.30040454864502, "global_step": 299510, "epoch": 1782} {"train_loss": -12.261374473571777, "global_step": 299511, "epoch": 1782} {"train_loss": -12.231231689453125, "global_step": 299512, "epoch": 1782} {"train_loss": -12.137214660644531, "global_step": 299513, "epoch": 1782} {"train_loss": -12.085172653198242, "global_step": 299514, "epoch": 1782} {"train_loss": -12.161321640014648, "global_step": 299515, "epoch": 1782} {"train_loss": -12.15576171875, "global_step": 299516, "epoch": 1782} {"train_loss": -12.400432586669922, "global_step": 299517, "epoch": 1782} {"train_loss": -12.361237525939941, "global_step": 299518, "epoch": 1782} {"train_loss": -12.133687019348145, "global_step": 299519, "epoch": 1782} {"train_loss": -12.227386474609375, "global_step": 299520, "epoch": 1782} {"train_loss": -12.187419891357422, "global_step": 299521, "epoch": 1782} {"train_loss": -12.164159774780273, "global_step": 299522, "epoch": 1782} {"train_loss": -12.228109359741211, "global_step": 299523, "epoch": 1782} {"train_loss": -12.013110160827637, "global_step": 299524, "epoch": 1782} {"train_loss": -11.982416152954102, "global_step": 299525, "epoch": 1782} {"train_loss": -12.211954116821289, "global_step": 299526, "epoch": 1782} {"train_loss": -11.810810089111328, "global_step": 299527, "epoch": 1782} {"train_loss": -12.420415878295898, "global_step": 299528, "epoch": 1782} {"train_loss": -11.486576080322266, "global_step": 299529, "epoch": 1782} {"train_loss": -12.063851356506348, "global_step": 299530, "epoch": 1782} {"train_loss": -12.163299560546875, "global_step": 299531, "epoch": 1782} {"train_loss": -12.352251052856445, "global_step": 299532, "epoch": 1782} {"train_loss": -12.027718544006348, "global_step": 299533, "epoch": 1782} {"train_loss": -11.891026496887207, "global_step": 299534, "epoch": 1782} {"train_loss": -12.275581359863281, "global_step": 299535, "epoch": 1782} {"train_loss": -12.25243854522705, "global_step": 299536, "epoch": 1782} {"train_loss": -12.391559600830078, "global_step": 299537, "epoch": 1782} {"train_loss": -12.138240814208984, "global_step": 299538, "epoch": 1782} {"train_loss": -11.944598197937012, "global_step": 299539, "epoch": 1782} {"train_loss": -12.101396560668945, "global_step": 299540, "epoch": 1782} {"train_loss": -11.706010818481445, "global_step": 299541, "epoch": 1782} {"train_loss": -11.952098846435547, "global_step": 299542, "epoch": 1782} {"train_loss": -11.879958816937037, "global_step": 299543, "epoch": 1782, "val_loss": 276100.65625} {"train_loss": -11.905998229980469, "global_step": 299544, "epoch": 1783} {"train_loss": -12.23046875, "global_step": 299545, "epoch": 1783} {"train_loss": -12.215436935424805, "global_step": 299546, "epoch": 1783} {"train_loss": -11.98127269744873, "global_step": 299547, "epoch": 1783} {"train_loss": -12.269176483154297, "global_step": 299548, "epoch": 1783} {"train_loss": -11.910242080688477, "global_step": 299549, "epoch": 1783} {"train_loss": -12.221593856811523, "global_step": 299550, "epoch": 1783} {"train_loss": -12.091833114624023, "global_step": 299551, "epoch": 1783} {"train_loss": -12.115392684936523, "global_step": 299552, "epoch": 1783} {"train_loss": -12.086891174316406, "global_step": 299553, "epoch": 1783} {"train_loss": -12.075291633605957, "global_step": 299554, "epoch": 1783} {"train_loss": -10.893477439880371, "global_step": 299555, "epoch": 1783} {"train_loss": -10.874587059020996, "global_step": 299556, "epoch": 1783} {"train_loss": -11.669767379760742, "global_step": 299557, "epoch": 1783} {"train_loss": -11.607179641723633, "global_step": 299558, "epoch": 1783} {"train_loss": -11.155999183654785, "global_step": 299559, "epoch": 1783} {"train_loss": -10.04447078704834, "global_step": 299560, "epoch": 1783} {"train_loss": -12.015494346618652, "global_step": 299561, "epoch": 1783} {"train_loss": -10.59409236907959, "global_step": 299562, "epoch": 1783} {"train_loss": -10.22540283203125, "global_step": 299563, "epoch": 1783} {"train_loss": -11.881875991821289, "global_step": 299564, "epoch": 1783} {"train_loss": -11.222142219543457, "global_step": 299565, "epoch": 1783} {"train_loss": -10.594852447509766, "global_step": 299566, "epoch": 1783} {"train_loss": -11.497800827026367, "global_step": 299567, "epoch": 1783} {"train_loss": -11.231316566467285, "global_step": 299568, "epoch": 1783} {"train_loss": -11.138473510742188, "global_step": 299569, "epoch": 1783} {"train_loss": -11.778952598571777, "global_step": 299570, "epoch": 1783} {"train_loss": -11.621604919433594, "global_step": 299571, "epoch": 1783} {"train_loss": -11.744071960449219, "global_step": 299572, "epoch": 1783} {"train_loss": -11.911039352416992, "global_step": 299573, "epoch": 1783} {"train_loss": -11.971394538879395, "global_step": 299574, "epoch": 1783} {"train_loss": -12.120185852050781, "global_step": 299575, "epoch": 1783} {"train_loss": -11.973197937011719, "global_step": 299576, "epoch": 1783} {"train_loss": -11.97185230255127, "global_step": 299577, "epoch": 1783} {"train_loss": -11.591902732849121, "global_step": 299578, "epoch": 1783} {"train_loss": -11.81419563293457, "global_step": 299579, "epoch": 1783} {"train_loss": -11.721346855163574, "global_step": 299580, "epoch": 1783} {"train_loss": -12.066900253295898, "global_step": 299581, "epoch": 1783} {"train_loss": -11.703763961791992, "global_step": 299582, "epoch": 1783} {"train_loss": -11.962627410888672, "global_step": 299583, "epoch": 1783} {"train_loss": -11.906789779663086, "global_step": 299584, "epoch": 1783} {"train_loss": -11.831305503845215, "global_step": 299585, "epoch": 1783} {"train_loss": -11.780206680297852, "global_step": 299586, "epoch": 1783} {"train_loss": -11.869497299194336, "global_step": 299587, "epoch": 1783} {"train_loss": -11.864084243774414, "global_step": 299588, "epoch": 1783} {"train_loss": -11.839381217956543, "global_step": 299589, "epoch": 1783} {"train_loss": -12.189254760742188, "global_step": 299590, "epoch": 1783} {"train_loss": -11.722636222839355, "global_step": 299591, "epoch": 1783} {"train_loss": -11.567663192749023, "global_step": 299592, "epoch": 1783} {"train_loss": -11.46494197845459, "global_step": 299593, "epoch": 1783} {"train_loss": -12.199258804321289, "global_step": 299594, "epoch": 1783} {"train_loss": -11.431288719177246, "global_step": 299595, "epoch": 1783} {"train_loss": -11.9937744140625, "global_step": 299596, "epoch": 1783} {"train_loss": -11.761545181274414, "global_step": 299597, "epoch": 1783} {"train_loss": -11.381656646728516, "global_step": 299598, "epoch": 1783} {"train_loss": -11.843341827392578, "global_step": 299599, "epoch": 1783} {"train_loss": -10.55112075805664, "global_step": 299600, "epoch": 1783} {"train_loss": -11.42991828918457, "global_step": 299601, "epoch": 1783} {"train_loss": -11.454521179199219, "global_step": 299602, "epoch": 1783} {"train_loss": -10.465997695922852, "global_step": 299603, "epoch": 1783} {"train_loss": -11.786750793457031, "global_step": 299604, "epoch": 1783} {"train_loss": -9.880125045776367, "global_step": 299605, "epoch": 1783} {"train_loss": -11.235054016113281, "global_step": 299606, "epoch": 1783} {"train_loss": -11.255952835083008, "global_step": 299607, "epoch": 1783} {"train_loss": -10.980951309204102, "global_step": 299608, "epoch": 1783} {"train_loss": -11.44035530090332, "global_step": 299609, "epoch": 1783} {"train_loss": -10.856942176818848, "global_step": 299610, "epoch": 1783} {"train_loss": -11.470743179321289, "global_step": 299611, "epoch": 1783} {"train_loss": -11.573587417602539, "global_step": 299612, "epoch": 1783} {"train_loss": -11.14980697631836, "global_step": 299613, "epoch": 1783} {"train_loss": -11.153219223022461, "global_step": 299614, "epoch": 1783} {"train_loss": -11.03261947631836, "global_step": 299615, "epoch": 1783} {"train_loss": -11.874074935913086, "global_step": 299616, "epoch": 1783} {"train_loss": -11.458378791809082, "global_step": 299617, "epoch": 1783} {"train_loss": -11.542144775390625, "global_step": 299618, "epoch": 1783} {"train_loss": -11.841976165771484, "global_step": 299619, "epoch": 1783} {"train_loss": -11.577192306518555, "global_step": 299620, "epoch": 1783} {"train_loss": -11.89638900756836, "global_step": 299621, "epoch": 1783} {"train_loss": -11.761042594909668, "global_step": 299622, "epoch": 1783} {"train_loss": -12.072443008422852, "global_step": 299623, "epoch": 1783} {"train_loss": -12.004565238952637, "global_step": 299624, "epoch": 1783} {"train_loss": -11.735515594482422, "global_step": 299625, "epoch": 1783} {"train_loss": -11.879404067993164, "global_step": 299626, "epoch": 1783} {"train_loss": -11.905006408691406, "global_step": 299627, "epoch": 1783} {"train_loss": -12.0408935546875, "global_step": 299628, "epoch": 1783} {"train_loss": -12.166031837463379, "global_step": 299629, "epoch": 1783} {"train_loss": -11.801324844360352, "global_step": 299630, "epoch": 1783} {"train_loss": -12.163089752197266, "global_step": 299631, "epoch": 1783} {"train_loss": -11.905620574951172, "global_step": 299632, "epoch": 1783} {"train_loss": -12.10017204284668, "global_step": 299633, "epoch": 1783} {"train_loss": -11.82420539855957, "global_step": 299634, "epoch": 1783} {"train_loss": -11.756054878234863, "global_step": 299635, "epoch": 1783} {"train_loss": -11.942237854003906, "global_step": 299636, "epoch": 1783} {"train_loss": -11.610986709594727, "global_step": 299637, "epoch": 1783} {"train_loss": -12.05636215209961, "global_step": 299638, "epoch": 1783} {"train_loss": -12.229863166809082, "global_step": 299639, "epoch": 1783} {"train_loss": -11.939602851867676, "global_step": 299640, "epoch": 1783} {"train_loss": -11.911577224731445, "global_step": 299641, "epoch": 1783} {"train_loss": -12.068264961242676, "global_step": 299642, "epoch": 1783} {"train_loss": -11.862520217895508, "global_step": 299643, "epoch": 1783} {"train_loss": -12.12899112701416, "global_step": 299644, "epoch": 1783} {"train_loss": -11.842573165893555, "global_step": 299645, "epoch": 1783} {"train_loss": -12.239033699035645, "global_step": 299646, "epoch": 1783} {"train_loss": -12.02352523803711, "global_step": 299647, "epoch": 1783} {"train_loss": -12.268856048583984, "global_step": 299648, "epoch": 1783} {"train_loss": -12.23287582397461, "global_step": 299649, "epoch": 1783} {"train_loss": -12.312047958374023, "global_step": 299650, "epoch": 1783} {"train_loss": -12.291788101196289, "global_step": 299651, "epoch": 1783} {"train_loss": -12.445198059082031, "global_step": 299652, "epoch": 1783} {"train_loss": -12.126300811767578, "global_step": 299653, "epoch": 1783} {"train_loss": -12.157096862792969, "global_step": 299654, "epoch": 1783} {"train_loss": -12.398788452148438, "global_step": 299655, "epoch": 1783} {"train_loss": -12.390357971191406, "global_step": 299656, "epoch": 1783} {"train_loss": -12.21371078491211, "global_step": 299657, "epoch": 1783} {"train_loss": -12.331863403320312, "global_step": 299658, "epoch": 1783} {"train_loss": -12.327690124511719, "global_step": 299659, "epoch": 1783} {"train_loss": -12.352214813232422, "global_step": 299660, "epoch": 1783} {"train_loss": -12.237545013427734, "global_step": 299661, "epoch": 1783} {"train_loss": -12.281332969665527, "global_step": 299662, "epoch": 1783} {"train_loss": -12.527717590332031, "global_step": 299663, "epoch": 1783} {"train_loss": -12.379035949707031, "global_step": 299664, "epoch": 1783} {"train_loss": -12.298613548278809, "global_step": 299665, "epoch": 1783} {"train_loss": -12.608838081359863, "global_step": 299666, "epoch": 1783} {"train_loss": -12.180252075195312, "global_step": 299667, "epoch": 1783} {"train_loss": -12.151899337768555, "global_step": 299668, "epoch": 1783} {"train_loss": -12.543268203735352, "global_step": 299669, "epoch": 1783} {"train_loss": -12.305233001708984, "global_step": 299670, "epoch": 1783} {"train_loss": -11.75097942352295, "global_step": 299671, "epoch": 1783} {"train_loss": -11.27661418914795, "global_step": 299672, "epoch": 1783} {"train_loss": -11.80868148803711, "global_step": 299673, "epoch": 1783} {"train_loss": -12.211087226867676, "global_step": 299674, "epoch": 1783} {"train_loss": -12.192855834960938, "global_step": 299675, "epoch": 1783} {"train_loss": -12.054689407348633, "global_step": 299676, "epoch": 1783} {"train_loss": -12.207961082458496, "global_step": 299677, "epoch": 1783} {"train_loss": -11.52427864074707, "global_step": 299678, "epoch": 1783} {"train_loss": -10.35551643371582, "global_step": 299679, "epoch": 1783} {"train_loss": -11.825897216796875, "global_step": 299680, "epoch": 1783} {"train_loss": -10.949878692626953, "global_step": 299681, "epoch": 1783} {"train_loss": -10.737105369567871, "global_step": 299682, "epoch": 1783} {"train_loss": -12.219470977783203, "global_step": 299683, "epoch": 1783} {"train_loss": -11.072465896606445, "global_step": 299684, "epoch": 1783} {"train_loss": -10.335805892944336, "global_step": 299685, "epoch": 1783} {"train_loss": -11.50613784790039, "global_step": 299686, "epoch": 1783} {"train_loss": -10.697778701782227, "global_step": 299687, "epoch": 1783} {"train_loss": -9.913152694702148, "global_step": 299688, "epoch": 1783} {"train_loss": -11.854945182800293, "global_step": 299689, "epoch": 1783} {"train_loss": -10.862695693969727, "global_step": 299690, "epoch": 1783} {"train_loss": -10.593271255493164, "global_step": 299691, "epoch": 1783} {"train_loss": -11.908378601074219, "global_step": 299692, "epoch": 1783} {"train_loss": -10.590153694152832, "global_step": 299693, "epoch": 1783} {"train_loss": -11.972892761230469, "global_step": 299694, "epoch": 1783} {"train_loss": -11.041089057922363, "global_step": 299695, "epoch": 1783} {"train_loss": -11.152872085571289, "global_step": 299696, "epoch": 1783} {"train_loss": -12.189760208129883, "global_step": 299697, "epoch": 1783} {"train_loss": -11.68493366241455, "global_step": 299698, "epoch": 1783} {"train_loss": -11.77436637878418, "global_step": 299699, "epoch": 1783} {"train_loss": -11.853654861450195, "global_step": 299700, "epoch": 1783} {"train_loss": -11.421773910522461, "global_step": 299701, "epoch": 1783} {"train_loss": -11.999860763549805, "global_step": 299702, "epoch": 1783} {"train_loss": -11.772052764892578, "global_step": 299703, "epoch": 1783} {"train_loss": -11.953530311584473, "global_step": 299704, "epoch": 1783} {"train_loss": -11.921727180480957, "global_step": 299705, "epoch": 1783} {"train_loss": -11.545894622802734, "global_step": 299706, "epoch": 1783} {"train_loss": -11.902843475341797, "global_step": 299707, "epoch": 1783} {"train_loss": -11.741043090820312, "global_step": 299708, "epoch": 1783} {"train_loss": -11.722967147827148, "global_step": 299709, "epoch": 1783} {"train_loss": -11.993032455444336, "global_step": 299710, "epoch": 1783} {"train_loss": -11.716462680271693, "global_step": 299711, "epoch": 1783, "val_loss": 280037.0625} {"train_loss": -11.502250671386719, "global_step": 299712, "epoch": 1784} {"train_loss": -11.68079948425293, "global_step": 299713, "epoch": 1784} {"train_loss": -11.67304801940918, "global_step": 299714, "epoch": 1784} {"train_loss": -11.718155860900879, "global_step": 299715, "epoch": 1784} {"train_loss": -11.116988182067871, "global_step": 299716, "epoch": 1784} {"train_loss": -11.024214744567871, "global_step": 299717, "epoch": 1784} {"train_loss": -11.464302062988281, "global_step": 299718, "epoch": 1784} {"train_loss": -11.429508209228516, "global_step": 299719, "epoch": 1784} {"train_loss": -11.40261459350586, "global_step": 299720, "epoch": 1784} {"train_loss": -11.766289710998535, "global_step": 299721, "epoch": 1784} {"train_loss": -11.233099937438965, "global_step": 299722, "epoch": 1784} {"train_loss": -11.884150505065918, "global_step": 299723, "epoch": 1784} {"train_loss": -11.467766761779785, "global_step": 299724, "epoch": 1784} {"train_loss": -11.51510238647461, "global_step": 299725, "epoch": 1784} {"train_loss": -11.658269882202148, "global_step": 299726, "epoch": 1784} {"train_loss": -11.910188674926758, "global_step": 299727, "epoch": 1784} {"train_loss": -11.636507034301758, "global_step": 299728, "epoch": 1784} {"train_loss": -12.134378433227539, "global_step": 299729, "epoch": 1784} {"train_loss": -11.861015319824219, "global_step": 299730, "epoch": 1784} {"train_loss": -12.045581817626953, "global_step": 299731, "epoch": 1784} {"train_loss": -11.759600639343262, "global_step": 299732, "epoch": 1784} {"train_loss": -11.991426467895508, "global_step": 299733, "epoch": 1784} {"train_loss": -11.89251708984375, "global_step": 299734, "epoch": 1784} {"train_loss": -12.044240951538086, "global_step": 299735, "epoch": 1784} {"train_loss": -12.12222671508789, "global_step": 299736, "epoch": 1784} {"train_loss": -11.821781158447266, "global_step": 299737, "epoch": 1784} {"train_loss": -12.246978759765625, "global_step": 299738, "epoch": 1784} {"train_loss": -11.830355644226074, "global_step": 299739, "epoch": 1784} {"train_loss": -12.075322151184082, "global_step": 299740, "epoch": 1784} {"train_loss": -11.950586318969727, "global_step": 299741, "epoch": 1784} {"train_loss": -11.915040016174316, "global_step": 299742, "epoch": 1784} {"train_loss": -11.912237167358398, "global_step": 299743, "epoch": 1784} {"train_loss": -11.71830940246582, "global_step": 299744, "epoch": 1784} {"train_loss": -12.134393692016602, "global_step": 299745, "epoch": 1784} {"train_loss": -12.001350402832031, "global_step": 299746, "epoch": 1784} {"train_loss": -12.100951194763184, "global_step": 299747, "epoch": 1784} {"train_loss": -11.977712631225586, "global_step": 299748, "epoch": 1784} {"train_loss": -11.863216400146484, "global_step": 299749, "epoch": 1784} {"train_loss": -12.114437103271484, "global_step": 299750, "epoch": 1784} {"train_loss": -11.928437232971191, "global_step": 299751, "epoch": 1784} {"train_loss": -12.366474151611328, "global_step": 299752, "epoch": 1784} {"train_loss": -11.952667236328125, "global_step": 299753, "epoch": 1784} {"train_loss": -11.99525260925293, "global_step": 299754, "epoch": 1784} {"train_loss": -11.727727890014648, "global_step": 299755, "epoch": 1784} {"train_loss": -11.633797645568848, "global_step": 299756, "epoch": 1784} {"train_loss": -11.74539852142334, "global_step": 299757, "epoch": 1784} {"train_loss": -11.636683464050293, "global_step": 299758, "epoch": 1784} {"train_loss": -11.890426635742188, "global_step": 299759, "epoch": 1784} {"train_loss": -11.592765808105469, "global_step": 299760, "epoch": 1784} {"train_loss": -12.023292541503906, "global_step": 299761, "epoch": 1784} {"train_loss": -11.629450798034668, "global_step": 299762, "epoch": 1784} {"train_loss": -12.02839469909668, "global_step": 299763, "epoch": 1784} {"train_loss": -11.648193359375, "global_step": 299764, "epoch": 1784} {"train_loss": -11.95913314819336, "global_step": 299765, "epoch": 1784} {"train_loss": -11.904426574707031, "global_step": 299766, "epoch": 1784} {"train_loss": -11.479720115661621, "global_step": 299767, "epoch": 1784} {"train_loss": -12.22930908203125, "global_step": 299768, "epoch": 1784} {"train_loss": -11.459660530090332, "global_step": 299769, "epoch": 1784} {"train_loss": -11.918027877807617, "global_step": 299770, "epoch": 1784} {"train_loss": -11.984142303466797, "global_step": 299771, "epoch": 1784} {"train_loss": -11.870748519897461, "global_step": 299772, "epoch": 1784} {"train_loss": -12.08027458190918, "global_step": 299773, "epoch": 1784} {"train_loss": -11.751326560974121, "global_step": 299774, "epoch": 1784} {"train_loss": -11.883641242980957, "global_step": 299775, "epoch": 1784} {"train_loss": -12.2483491897583, "global_step": 299776, "epoch": 1784} {"train_loss": -12.025983810424805, "global_step": 299777, "epoch": 1784} {"train_loss": -11.807219505310059, "global_step": 299778, "epoch": 1784} {"train_loss": -12.2244234085083, "global_step": 299779, "epoch": 1784} {"train_loss": -11.599152565002441, "global_step": 299780, "epoch": 1784} {"train_loss": -12.340763092041016, "global_step": 299781, "epoch": 1784} {"train_loss": -11.87993049621582, "global_step": 299782, "epoch": 1784} {"train_loss": -12.085658073425293, "global_step": 299783, "epoch": 1784} {"train_loss": -12.00426197052002, "global_step": 299784, "epoch": 1784} {"train_loss": -11.642340660095215, "global_step": 299785, "epoch": 1784} {"train_loss": -12.155460357666016, "global_step": 299786, "epoch": 1784} {"train_loss": -11.584548950195312, "global_step": 299787, "epoch": 1784} {"train_loss": -12.457913398742676, "global_step": 299788, "epoch": 1784} {"train_loss": -11.47873306274414, "global_step": 299789, "epoch": 1784} {"train_loss": -12.359594345092773, "global_step": 299790, "epoch": 1784} {"train_loss": -11.627067565917969, "global_step": 299791, "epoch": 1784} {"train_loss": -12.322761535644531, "global_step": 299792, "epoch": 1784} {"train_loss": -12.055716514587402, "global_step": 299793, "epoch": 1784} {"train_loss": -12.244985580444336, "global_step": 299794, "epoch": 1784} {"train_loss": -12.413108825683594, "global_step": 299795, "epoch": 1784} {"train_loss": -12.251276969909668, "global_step": 299796, "epoch": 1784} {"train_loss": -12.362396240234375, "global_step": 299797, "epoch": 1784} {"train_loss": -11.688384056091309, "global_step": 299798, "epoch": 1784} {"train_loss": -12.044475555419922, "global_step": 299799, "epoch": 1784} {"train_loss": -12.269567489624023, "global_step": 299800, "epoch": 1784} {"train_loss": -12.101348876953125, "global_step": 299801, "epoch": 1784} {"train_loss": -12.25792407989502, "global_step": 299802, "epoch": 1784} {"train_loss": -12.57024097442627, "global_step": 299803, "epoch": 1784} {"train_loss": -12.390151977539062, "global_step": 299804, "epoch": 1784} {"train_loss": -12.349971771240234, "global_step": 299805, "epoch": 1784} {"train_loss": -12.330572128295898, "global_step": 299806, "epoch": 1784} {"train_loss": -12.3905668258667, "global_step": 299807, "epoch": 1784} {"train_loss": -12.41381549835205, "global_step": 299808, "epoch": 1784} {"train_loss": -12.439955711364746, "global_step": 299809, "epoch": 1784} {"train_loss": -12.176823616027832, "global_step": 299810, "epoch": 1784} {"train_loss": -12.518915176391602, "global_step": 299811, "epoch": 1784} {"train_loss": -11.910589218139648, "global_step": 299812, "epoch": 1784} {"train_loss": -11.928987503051758, "global_step": 299813, "epoch": 1784} {"train_loss": -12.44117546081543, "global_step": 299814, "epoch": 1784} {"train_loss": -11.803098678588867, "global_step": 299815, "epoch": 1784} {"train_loss": -12.06458854675293, "global_step": 299816, "epoch": 1784} {"train_loss": -12.194900512695312, "global_step": 299817, "epoch": 1784} {"train_loss": -12.197651863098145, "global_step": 299818, "epoch": 1784} {"train_loss": -12.06158447265625, "global_step": 299819, "epoch": 1784} {"train_loss": -12.331295013427734, "global_step": 299820, "epoch": 1784} {"train_loss": -12.191927909851074, "global_step": 299821, "epoch": 1784} {"train_loss": -12.246996879577637, "global_step": 299822, "epoch": 1784} {"train_loss": -12.35069751739502, "global_step": 299823, "epoch": 1784} {"train_loss": -12.192583084106445, "global_step": 299824, "epoch": 1784} {"train_loss": -12.461284637451172, "global_step": 299825, "epoch": 1784} {"train_loss": -12.280295372009277, "global_step": 299826, "epoch": 1784} {"train_loss": -11.808553695678711, "global_step": 299827, "epoch": 1784} {"train_loss": -12.416303634643555, "global_step": 299828, "epoch": 1784} {"train_loss": -12.384425163269043, "global_step": 299829, "epoch": 1784} {"train_loss": -11.950447082519531, "global_step": 299830, "epoch": 1784} {"train_loss": -11.668514251708984, "global_step": 299831, "epoch": 1784} {"train_loss": -12.285676956176758, "global_step": 299832, "epoch": 1784} {"train_loss": -11.684562683105469, "global_step": 299833, "epoch": 1784} {"train_loss": -12.304281234741211, "global_step": 299834, "epoch": 1784} {"train_loss": -11.958112716674805, "global_step": 299835, "epoch": 1784} {"train_loss": -11.847220420837402, "global_step": 299836, "epoch": 1784} {"train_loss": -12.20541000366211, "global_step": 299837, "epoch": 1784} {"train_loss": -11.844810485839844, "global_step": 299838, "epoch": 1784} {"train_loss": -12.274170875549316, "global_step": 299839, "epoch": 1784} {"train_loss": -11.482158660888672, "global_step": 299840, "epoch": 1784} {"train_loss": -12.452859878540039, "global_step": 299841, "epoch": 1784} {"train_loss": -11.136016845703125, "global_step": 299842, "epoch": 1784} {"train_loss": -11.015739440917969, "global_step": 299843, "epoch": 1784} {"train_loss": -11.539711952209473, "global_step": 299844, "epoch": 1784} {"train_loss": -11.397936820983887, "global_step": 299845, "epoch": 1784} {"train_loss": -8.61406135559082, "global_step": 299846, "epoch": 1784} {"train_loss": -8.947063446044922, "global_step": 299847, "epoch": 1784} {"train_loss": -10.259931564331055, "global_step": 299848, "epoch": 1784} {"train_loss": -9.86412239074707, "global_step": 299849, "epoch": 1784} {"train_loss": -9.177934646606445, "global_step": 299850, "epoch": 1784} {"train_loss": -9.874825477600098, "global_step": 299851, "epoch": 1784} {"train_loss": -10.071712493896484, "global_step": 299852, "epoch": 1784} {"train_loss": -9.734530448913574, "global_step": 299853, "epoch": 1784} {"train_loss": -10.256593704223633, "global_step": 299854, "epoch": 1784} {"train_loss": -10.211709976196289, "global_step": 299855, "epoch": 1784} {"train_loss": -10.298548698425293, "global_step": 299856, "epoch": 1784} {"train_loss": -11.388277053833008, "global_step": 299857, "epoch": 1784} {"train_loss": -10.769750595092773, "global_step": 299858, "epoch": 1784} {"train_loss": -10.517417907714844, "global_step": 299859, "epoch": 1784} {"train_loss": -11.054396629333496, "global_step": 299860, "epoch": 1784} {"train_loss": -10.882234573364258, "global_step": 299861, "epoch": 1784} {"train_loss": -11.679070472717285, "global_step": 299862, "epoch": 1784} {"train_loss": -11.277692794799805, "global_step": 299863, "epoch": 1784} {"train_loss": -11.368572235107422, "global_step": 299864, "epoch": 1784} {"train_loss": -11.46743392944336, "global_step": 299865, "epoch": 1784} {"train_loss": -10.041638374328613, "global_step": 299866, "epoch": 1784} {"train_loss": -11.067300796508789, "global_step": 299867, "epoch": 1784} {"train_loss": -11.12959098815918, "global_step": 299868, "epoch": 1784} {"train_loss": -10.761566162109375, "global_step": 299869, "epoch": 1784} {"train_loss": -11.515256881713867, "global_step": 299870, "epoch": 1784} {"train_loss": -11.298397064208984, "global_step": 299871, "epoch": 1784} {"train_loss": -11.138240814208984, "global_step": 299872, "epoch": 1784} {"train_loss": -11.317129135131836, "global_step": 299873, "epoch": 1784} {"train_loss": -11.45439624786377, "global_step": 299874, "epoch": 1784} {"train_loss": -11.794933319091797, "global_step": 299875, "epoch": 1784} {"train_loss": -11.96397590637207, "global_step": 299876, "epoch": 1784} {"train_loss": -11.617518424987793, "global_step": 299877, "epoch": 1784} {"train_loss": -11.871183395385742, "global_step": 299878, "epoch": 1784} {"train_loss": -11.713057398796082, "global_step": 299879, "epoch": 1784, "val_loss": 278857.0} {"train_loss": -11.549802780151367, "global_step": 299880, "epoch": 1785} {"train_loss": -11.79612922668457, "global_step": 299881, "epoch": 1785} {"train_loss": -11.770180702209473, "global_step": 299882, "epoch": 1785} {"train_loss": -11.754252433776855, "global_step": 299883, "epoch": 1785} {"train_loss": -11.68554401397705, "global_step": 299884, "epoch": 1785} {"train_loss": -11.860321998596191, "global_step": 299885, "epoch": 1785} {"train_loss": -12.025716781616211, "global_step": 299886, "epoch": 1785} {"train_loss": -11.851128578186035, "global_step": 299887, "epoch": 1785} {"train_loss": -11.755209922790527, "global_step": 299888, "epoch": 1785} {"train_loss": -11.990446090698242, "global_step": 299889, "epoch": 1785} {"train_loss": -11.896771430969238, "global_step": 299890, "epoch": 1785} {"train_loss": -11.88912582397461, "global_step": 299891, "epoch": 1785} {"train_loss": -12.041765213012695, "global_step": 299892, "epoch": 1785} {"train_loss": -12.063095092773438, "global_step": 299893, "epoch": 1785} {"train_loss": -11.863558769226074, "global_step": 299894, "epoch": 1785} {"train_loss": -11.976421356201172, "global_step": 299895, "epoch": 1785} {"train_loss": -12.105042457580566, "global_step": 299896, "epoch": 1785} {"train_loss": -11.90090274810791, "global_step": 299897, "epoch": 1785} {"train_loss": -12.030130386352539, "global_step": 299898, "epoch": 1785} {"train_loss": -12.296902656555176, "global_step": 299899, "epoch": 1785} {"train_loss": -12.025188446044922, "global_step": 299900, "epoch": 1785} {"train_loss": -12.307418823242188, "global_step": 299901, "epoch": 1785} {"train_loss": -12.270506858825684, "global_step": 299902, "epoch": 1785} {"train_loss": -12.172338485717773, "global_step": 299903, "epoch": 1785} {"train_loss": -12.2099027633667, "global_step": 299904, "epoch": 1785} {"train_loss": -12.401735305786133, "global_step": 299905, "epoch": 1785} {"train_loss": -12.240447998046875, "global_step": 299906, "epoch": 1785} {"train_loss": -12.31209659576416, "global_step": 299907, "epoch": 1785} {"train_loss": -12.284348487854004, "global_step": 299908, "epoch": 1785} {"train_loss": -12.321770668029785, "global_step": 299909, "epoch": 1785} {"train_loss": -12.202085494995117, "global_step": 299910, "epoch": 1785} {"train_loss": -12.321687698364258, "global_step": 299911, "epoch": 1785} {"train_loss": -12.390012741088867, "global_step": 299912, "epoch": 1785} {"train_loss": -12.135875701904297, "global_step": 299913, "epoch": 1785} {"train_loss": -12.308858871459961, "global_step": 299914, "epoch": 1785} {"train_loss": -12.251590728759766, "global_step": 299915, "epoch": 1785} {"train_loss": -12.085460662841797, "global_step": 299916, "epoch": 1785} {"train_loss": -12.065071105957031, "global_step": 299917, "epoch": 1785} {"train_loss": -12.058759689331055, "global_step": 299918, "epoch": 1785} {"train_loss": -12.153216361999512, "global_step": 299919, "epoch": 1785} {"train_loss": -11.946714401245117, "global_step": 299920, "epoch": 1785} {"train_loss": -12.246227264404297, "global_step": 299921, "epoch": 1785} {"train_loss": -12.23941421508789, "global_step": 299922, "epoch": 1785} {"train_loss": -12.157281875610352, "global_step": 299923, "epoch": 1785} {"train_loss": -12.15654182434082, "global_step": 299924, "epoch": 1785} {"train_loss": -12.501749992370605, "global_step": 299925, "epoch": 1785} {"train_loss": -12.262913703918457, "global_step": 299926, "epoch": 1785} {"train_loss": -12.036873817443848, "global_step": 299927, "epoch": 1785} {"train_loss": -12.204137802124023, "global_step": 299928, "epoch": 1785} {"train_loss": -11.827474594116211, "global_step": 299929, "epoch": 1785} {"train_loss": -11.681488037109375, "global_step": 299930, "epoch": 1785} {"train_loss": -12.280158996582031, "global_step": 299931, "epoch": 1785} {"train_loss": -11.644964218139648, "global_step": 299932, "epoch": 1785} {"train_loss": -10.84769344329834, "global_step": 299933, "epoch": 1785} {"train_loss": -12.131999969482422, "global_step": 299934, "epoch": 1785} {"train_loss": -11.78750991821289, "global_step": 299935, "epoch": 1785} {"train_loss": -11.192943572998047, "global_step": 299936, "epoch": 1785} {"train_loss": -11.314386367797852, "global_step": 299937, "epoch": 1785} {"train_loss": -11.313276290893555, "global_step": 299938, "epoch": 1785} {"train_loss": -9.313680648803711, "global_step": 299939, "epoch": 1785} {"train_loss": -11.171682357788086, "global_step": 299940, "epoch": 1785} {"train_loss": -10.216899871826172, "global_step": 299941, "epoch": 1785} {"train_loss": -10.71504020690918, "global_step": 299942, "epoch": 1785} {"train_loss": -11.118621826171875, "global_step": 299943, "epoch": 1785} {"train_loss": -9.739362716674805, "global_step": 299944, "epoch": 1785} {"train_loss": -11.99335765838623, "global_step": 299945, "epoch": 1785} {"train_loss": -10.61823844909668, "global_step": 299946, "epoch": 1785} {"train_loss": -10.566218376159668, "global_step": 299947, "epoch": 1785} {"train_loss": -11.38392448425293, "global_step": 299948, "epoch": 1785} {"train_loss": -11.020120620727539, "global_step": 299949, "epoch": 1785} {"train_loss": -10.585683822631836, "global_step": 299950, "epoch": 1785} {"train_loss": -11.005294799804688, "global_step": 299951, "epoch": 1785} {"train_loss": -11.060094833374023, "global_step": 299952, "epoch": 1785} {"train_loss": -11.801414489746094, "global_step": 299953, "epoch": 1785} {"train_loss": -11.543741226196289, "global_step": 299954, "epoch": 1785} {"train_loss": -11.986246109008789, "global_step": 299955, "epoch": 1785} {"train_loss": -11.539567947387695, "global_step": 299956, "epoch": 1785} {"train_loss": -11.48154067993164, "global_step": 299957, "epoch": 1785} {"train_loss": -11.730857849121094, "global_step": 299958, "epoch": 1785} {"train_loss": -11.334615707397461, "global_step": 299959, "epoch": 1785} {"train_loss": -11.84520435333252, "global_step": 299960, "epoch": 1785} {"train_loss": -11.043885231018066, "global_step": 299961, "epoch": 1785} {"train_loss": -11.536317825317383, "global_step": 299962, "epoch": 1785} {"train_loss": -11.148086547851562, "global_step": 299963, "epoch": 1785} {"train_loss": -11.73310375213623, "global_step": 299964, "epoch": 1785} {"train_loss": -11.441803932189941, "global_step": 299965, "epoch": 1785} {"train_loss": -11.070758819580078, "global_step": 299966, "epoch": 1785} {"train_loss": -12.092077255249023, "global_step": 299967, "epoch": 1785} {"train_loss": -11.028308868408203, "global_step": 299968, "epoch": 1785} {"train_loss": -11.89568042755127, "global_step": 299969, "epoch": 1785} {"train_loss": -11.0109281539917, "global_step": 299970, "epoch": 1785} {"train_loss": -11.999317169189453, "global_step": 299971, "epoch": 1785} {"train_loss": -11.189990997314453, "global_step": 299972, "epoch": 1785} {"train_loss": -12.065194129943848, "global_step": 299973, "epoch": 1785} {"train_loss": -11.666196823120117, "global_step": 299974, "epoch": 1785} {"train_loss": -12.160919189453125, "global_step": 299975, "epoch": 1785} {"train_loss": -11.312349319458008, "global_step": 299976, "epoch": 1785} {"train_loss": -11.822826385498047, "global_step": 299977, "epoch": 1785} {"train_loss": -11.550935745239258, "global_step": 299978, "epoch": 1785} {"train_loss": -12.075010299682617, "global_step": 299979, "epoch": 1785} {"train_loss": -11.807104110717773, "global_step": 299980, "epoch": 1785} {"train_loss": -12.2772798538208, "global_step": 299981, "epoch": 1785} {"train_loss": -12.136157989501953, "global_step": 299982, "epoch": 1785} {"train_loss": -12.171258926391602, "global_step": 299983, "epoch": 1785} {"train_loss": -11.868032455444336, "global_step": 299984, "epoch": 1785} {"train_loss": -12.056396484375, "global_step": 299985, "epoch": 1785} {"train_loss": -11.809446334838867, "global_step": 299986, "epoch": 1785} {"train_loss": -12.07176399230957, "global_step": 299987, "epoch": 1785} {"train_loss": -11.984756469726562, "global_step": 299988, "epoch": 1785} {"train_loss": -12.005565643310547, "global_step": 299989, "epoch": 1785} {"train_loss": -12.123109817504883, "global_step": 299990, "epoch": 1785} {"train_loss": -12.090429306030273, "global_step": 299991, "epoch": 1785} {"train_loss": -12.189065933227539, "global_step": 299992, "epoch": 1785} {"train_loss": -11.73184585571289, "global_step": 299993, "epoch": 1785} {"train_loss": -12.262279510498047, "global_step": 299994, "epoch": 1785} {"train_loss": -12.081035614013672, "global_step": 299995, "epoch": 1785} {"train_loss": -12.03053092956543, "global_step": 299996, "epoch": 1785} {"train_loss": -12.119657516479492, "global_step": 299997, "epoch": 1785} {"train_loss": -11.982447624206543, "global_step": 299998, "epoch": 1785} {"train_loss": -12.062446594238281, "global_step": 299999, "epoch": 1785} {"train_loss": -12.12356185913086, "global_step": 300000, "epoch": 1785} {"train_loss": -11.961366653442383, "global_step": 300001, "epoch": 1785} {"train_loss": -12.349567413330078, "global_step": 300002, "epoch": 1785} {"train_loss": -12.02528190612793, "global_step": 300003, "epoch": 1785} {"train_loss": -12.16591739654541, "global_step": 300004, "epoch": 1785} {"train_loss": -11.831995964050293, "global_step": 300005, "epoch": 1785} {"train_loss": -12.286827087402344, "global_step": 300006, "epoch": 1785} {"train_loss": -12.014019012451172, "global_step": 300007, "epoch": 1785} {"train_loss": -12.194669723510742, "global_step": 300008, "epoch": 1785} {"train_loss": -12.057991027832031, "global_step": 300009, "epoch": 1785} {"train_loss": -12.034286499023438, "global_step": 300010, "epoch": 1785} {"train_loss": -12.052071571350098, "global_step": 300011, "epoch": 1785} {"train_loss": -12.15064811706543, "global_step": 300012, "epoch": 1785} {"train_loss": -12.296228408813477, "global_step": 300013, "epoch": 1785} {"train_loss": -12.017129898071289, "global_step": 300014, "epoch": 1785} {"train_loss": -12.074495315551758, "global_step": 300015, "epoch": 1785} {"train_loss": -12.05868911743164, "global_step": 300016, "epoch": 1785} {"train_loss": -12.253625869750977, "global_step": 300017, "epoch": 1785} {"train_loss": -12.265777587890625, "global_step": 300018, "epoch": 1785} {"train_loss": -11.699451446533203, "global_step": 300019, "epoch": 1785} {"train_loss": -12.033620834350586, "global_step": 300020, "epoch": 1785} {"train_loss": -12.08884048461914, "global_step": 300021, "epoch": 1785} {"train_loss": -12.009354591369629, "global_step": 300022, "epoch": 1785} {"train_loss": -12.146209716796875, "global_step": 300023, "epoch": 1785} {"train_loss": -12.285645484924316, "global_step": 300024, "epoch": 1785} {"train_loss": -11.955547332763672, "global_step": 300025, "epoch": 1785} {"train_loss": -12.200101852416992, "global_step": 300026, "epoch": 1785} {"train_loss": -12.290451049804688, "global_step": 300027, "epoch": 1785} {"train_loss": -12.094141960144043, "global_step": 300028, "epoch": 1785} {"train_loss": -12.15371322631836, "global_step": 300029, "epoch": 1785} {"train_loss": -12.263672828674316, "global_step": 300030, "epoch": 1785} {"train_loss": -11.85215950012207, "global_step": 300031, "epoch": 1785} {"train_loss": -11.965008735656738, "global_step": 300032, "epoch": 1785} {"train_loss": -11.867568016052246, "global_step": 300033, "epoch": 1785} {"train_loss": -11.992740631103516, "global_step": 300034, "epoch": 1785} {"train_loss": -12.343610763549805, "global_step": 300035, "epoch": 1785} {"train_loss": -12.094658851623535, "global_step": 300036, "epoch": 1785} {"train_loss": -12.188703536987305, "global_step": 300037, "epoch": 1785} {"train_loss": -12.078022003173828, "global_step": 300038, "epoch": 1785} {"train_loss": -12.047247886657715, "global_step": 300039, "epoch": 1785} {"train_loss": -12.321573257446289, "global_step": 300040, "epoch": 1785} {"train_loss": -12.25999927520752, "global_step": 300041, "epoch": 1785} {"train_loss": -12.12581729888916, "global_step": 300042, "epoch": 1785} {"train_loss": -12.146517753601074, "global_step": 300043, "epoch": 1785} {"train_loss": -12.107536315917969, "global_step": 300044, "epoch": 1785} {"train_loss": -11.964906692504883, "global_step": 300045, "epoch": 1785} {"train_loss": -12.429903984069824, "global_step": 300046, "epoch": 1785} {"train_loss": -11.866947327341352, "global_step": 300047, "epoch": 1785, "val_loss": 280066.28125, "train_action_mse_error": 1.7929282188415527} {"train_loss": -12.178132057189941, "global_step": 300048, "epoch": 1786} {"train_loss": -11.726515769958496, "global_step": 300049, "epoch": 1786} {"train_loss": -12.13359260559082, "global_step": 300050, "epoch": 1786} {"train_loss": -11.60845947265625, "global_step": 300051, "epoch": 1786} {"train_loss": -12.027068138122559, "global_step": 300052, "epoch": 1786} {"train_loss": -11.83295726776123, "global_step": 300053, "epoch": 1786} {"train_loss": -12.34276008605957, "global_step": 300054, "epoch": 1786} {"train_loss": -11.45315170288086, "global_step": 300055, "epoch": 1786} {"train_loss": -11.97661304473877, "global_step": 300056, "epoch": 1786} {"train_loss": -12.099000930786133, "global_step": 300057, "epoch": 1786} {"train_loss": -12.055432319641113, "global_step": 300058, "epoch": 1786} {"train_loss": -12.40093994140625, "global_step": 300059, "epoch": 1786} {"train_loss": -12.475226402282715, "global_step": 300060, "epoch": 1786} {"train_loss": -12.054433822631836, "global_step": 300061, "epoch": 1786} {"train_loss": -12.299208641052246, "global_step": 300062, "epoch": 1786} {"train_loss": -12.020057678222656, "global_step": 300063, "epoch": 1786} {"train_loss": -12.321624755859375, "global_step": 300064, "epoch": 1786} {"train_loss": -12.295236587524414, "global_step": 300065, "epoch": 1786} {"train_loss": -12.032888412475586, "global_step": 300066, "epoch": 1786} {"train_loss": -12.092131614685059, "global_step": 300067, "epoch": 1786} {"train_loss": -12.100408554077148, "global_step": 300068, "epoch": 1786} {"train_loss": -12.25050163269043, "global_step": 300069, "epoch": 1786} {"train_loss": -11.785194396972656, "global_step": 300070, "epoch": 1786} {"train_loss": -11.98548698425293, "global_step": 300071, "epoch": 1786} {"train_loss": -11.818598747253418, "global_step": 300072, "epoch": 1786} {"train_loss": -10.760022163391113, "global_step": 300073, "epoch": 1786} {"train_loss": -10.899429321289062, "global_step": 300074, "epoch": 1786} {"train_loss": -11.369497299194336, "global_step": 300075, "epoch": 1786} {"train_loss": -10.764019966125488, "global_step": 300076, "epoch": 1786} {"train_loss": -10.385510444641113, "global_step": 300077, "epoch": 1786} {"train_loss": -10.742518424987793, "global_step": 300078, "epoch": 1786} {"train_loss": -11.34969711303711, "global_step": 300079, "epoch": 1786} {"train_loss": -11.237260818481445, "global_step": 300080, "epoch": 1786} {"train_loss": -11.270947456359863, "global_step": 300081, "epoch": 1786} {"train_loss": -11.26511001586914, "global_step": 300082, "epoch": 1786} {"train_loss": -10.981239318847656, "global_step": 300083, "epoch": 1786} {"train_loss": -11.425674438476562, "global_step": 300084, "epoch": 1786} {"train_loss": -10.3121337890625, "global_step": 300085, "epoch": 1786} {"train_loss": -11.581307411193848, "global_step": 300086, "epoch": 1786} {"train_loss": -10.510951042175293, "global_step": 300087, "epoch": 1786} {"train_loss": -11.706822395324707, "global_step": 300088, "epoch": 1786} {"train_loss": -10.133129119873047, "global_step": 300089, "epoch": 1786} {"train_loss": -9.647478103637695, "global_step": 300090, "epoch": 1786} {"train_loss": -11.117809295654297, "global_step": 300091, "epoch": 1786} {"train_loss": -10.191001892089844, "global_step": 300092, "epoch": 1786} {"train_loss": -10.516240119934082, "global_step": 300093, "epoch": 1786} {"train_loss": -10.917631149291992, "global_step": 300094, "epoch": 1786} {"train_loss": -10.808815002441406, "global_step": 300095, "epoch": 1786} {"train_loss": -11.285539627075195, "global_step": 300096, "epoch": 1786} {"train_loss": -10.619370460510254, "global_step": 300097, "epoch": 1786} {"train_loss": -10.48987865447998, "global_step": 300098, "epoch": 1786} {"train_loss": -10.841764450073242, "global_step": 300099, "epoch": 1786} {"train_loss": -10.756673812866211, "global_step": 300100, "epoch": 1786} {"train_loss": -10.641584396362305, "global_step": 300101, "epoch": 1786} {"train_loss": -11.455090522766113, "global_step": 300102, "epoch": 1786} {"train_loss": -10.879730224609375, "global_step": 300103, "epoch": 1786} {"train_loss": -11.680164337158203, "global_step": 300104, "epoch": 1786} {"train_loss": -11.145644187927246, "global_step": 300105, "epoch": 1786} {"train_loss": -11.738311767578125, "global_step": 300106, "epoch": 1786} {"train_loss": -11.162575721740723, "global_step": 300107, "epoch": 1786} {"train_loss": -11.686741828918457, "global_step": 300108, "epoch": 1786} {"train_loss": -11.513240814208984, "global_step": 300109, "epoch": 1786} {"train_loss": -11.77385139465332, "global_step": 300110, "epoch": 1786} {"train_loss": -11.33933162689209, "global_step": 300111, "epoch": 1786} {"train_loss": -11.861494064331055, "global_step": 300112, "epoch": 1786} {"train_loss": -11.223325729370117, "global_step": 300113, "epoch": 1786} {"train_loss": -11.722370147705078, "global_step": 300114, "epoch": 1786} {"train_loss": -11.471872329711914, "global_step": 300115, "epoch": 1786} {"train_loss": -11.78182315826416, "global_step": 300116, "epoch": 1786} {"train_loss": -11.79041862487793, "global_step": 300117, "epoch": 1786} {"train_loss": -11.527215003967285, "global_step": 300118, "epoch": 1786} {"train_loss": -11.69638442993164, "global_step": 300119, "epoch": 1786} {"train_loss": -11.888007164001465, "global_step": 300120, "epoch": 1786} {"train_loss": -11.747367858886719, "global_step": 300121, "epoch": 1786} {"train_loss": -11.941500663757324, "global_step": 300122, "epoch": 1786} {"train_loss": -11.846094131469727, "global_step": 300123, "epoch": 1786} {"train_loss": -11.645991325378418, "global_step": 300124, "epoch": 1786} {"train_loss": -11.751218795776367, "global_step": 300125, "epoch": 1786} {"train_loss": -11.874120712280273, "global_step": 300126, "epoch": 1786} {"train_loss": -11.942490577697754, "global_step": 300127, "epoch": 1786} {"train_loss": -11.692790031433105, "global_step": 300128, "epoch": 1786} {"train_loss": -11.968530654907227, "global_step": 300129, "epoch": 1786} {"train_loss": -11.992880821228027, "global_step": 300130, "epoch": 1786} {"train_loss": -11.999164581298828, "global_step": 300131, "epoch": 1786} {"train_loss": -11.943028450012207, "global_step": 300132, "epoch": 1786} {"train_loss": -11.863943099975586, "global_step": 300133, "epoch": 1786} {"train_loss": -11.55659008026123, "global_step": 300134, "epoch": 1786} {"train_loss": -11.510007858276367, "global_step": 300135, "epoch": 1786} {"train_loss": -11.56589126586914, "global_step": 300136, "epoch": 1786} {"train_loss": -12.09406852722168, "global_step": 300137, "epoch": 1786} {"train_loss": -11.601777076721191, "global_step": 300138, "epoch": 1786} {"train_loss": -11.921019554138184, "global_step": 300139, "epoch": 1786} {"train_loss": -11.763904571533203, "global_step": 300140, "epoch": 1786} {"train_loss": -11.819986343383789, "global_step": 300141, "epoch": 1786} {"train_loss": -12.084587097167969, "global_step": 300142, "epoch": 1786} {"train_loss": -11.642888069152832, "global_step": 300143, "epoch": 1786} {"train_loss": -12.139165878295898, "global_step": 300144, "epoch": 1786} {"train_loss": -11.725479125976562, "global_step": 300145, "epoch": 1786} {"train_loss": -12.105203628540039, "global_step": 300146, "epoch": 1786} {"train_loss": -12.148490905761719, "global_step": 300147, "epoch": 1786} {"train_loss": -12.056647300720215, "global_step": 300148, "epoch": 1786} {"train_loss": -12.172651290893555, "global_step": 300149, "epoch": 1786} {"train_loss": -11.988821983337402, "global_step": 300150, "epoch": 1786} {"train_loss": -12.240982055664062, "global_step": 300151, "epoch": 1786} {"train_loss": -12.403907775878906, "global_step": 300152, "epoch": 1786} {"train_loss": -12.066164016723633, "global_step": 300153, "epoch": 1786} {"train_loss": -12.227036476135254, "global_step": 300154, "epoch": 1786} {"train_loss": -12.124072074890137, "global_step": 300155, "epoch": 1786} {"train_loss": -12.239750862121582, "global_step": 300156, "epoch": 1786} {"train_loss": -12.255531311035156, "global_step": 300157, "epoch": 1786} {"train_loss": -12.049836158752441, "global_step": 300158, "epoch": 1786} {"train_loss": -12.12730598449707, "global_step": 300159, "epoch": 1786} {"train_loss": -12.055868148803711, "global_step": 300160, "epoch": 1786} {"train_loss": -12.309455871582031, "global_step": 300161, "epoch": 1786} {"train_loss": -12.187284469604492, "global_step": 300162, "epoch": 1786} {"train_loss": -12.128128051757812, "global_step": 300163, "epoch": 1786} {"train_loss": -12.23218059539795, "global_step": 300164, "epoch": 1786} {"train_loss": -12.076128005981445, "global_step": 300165, "epoch": 1786} {"train_loss": -12.155041694641113, "global_step": 300166, "epoch": 1786} {"train_loss": -12.242286682128906, "global_step": 300167, "epoch": 1786} {"train_loss": -12.211185455322266, "global_step": 300168, "epoch": 1786} {"train_loss": -12.087100982666016, "global_step": 300169, "epoch": 1786} {"train_loss": -12.07182502746582, "global_step": 300170, "epoch": 1786} {"train_loss": -12.546035766601562, "global_step": 300171, "epoch": 1786} {"train_loss": -12.085737228393555, "global_step": 300172, "epoch": 1786} {"train_loss": -12.066296577453613, "global_step": 300173, "epoch": 1786} {"train_loss": -12.430895805358887, "global_step": 300174, "epoch": 1786} {"train_loss": -12.369955062866211, "global_step": 300175, "epoch": 1786} {"train_loss": -12.52743911743164, "global_step": 300176, "epoch": 1786} {"train_loss": -12.443748474121094, "global_step": 300177, "epoch": 1786} {"train_loss": -12.37388801574707, "global_step": 300178, "epoch": 1786} {"train_loss": -12.450305938720703, "global_step": 300179, "epoch": 1786} {"train_loss": -12.456645965576172, "global_step": 300180, "epoch": 1786} {"train_loss": -12.393198013305664, "global_step": 300181, "epoch": 1786} {"train_loss": -12.503416061401367, "global_step": 300182, "epoch": 1786} {"train_loss": -11.972550392150879, "global_step": 300183, "epoch": 1786} {"train_loss": -12.19826602935791, "global_step": 300184, "epoch": 1786} {"train_loss": -12.531099319458008, "global_step": 300185, "epoch": 1786} {"train_loss": -12.296693801879883, "global_step": 300186, "epoch": 1786} {"train_loss": -12.04521369934082, "global_step": 300187, "epoch": 1786} {"train_loss": -12.378238677978516, "global_step": 300188, "epoch": 1786} {"train_loss": -12.202430725097656, "global_step": 300189, "epoch": 1786} {"train_loss": -12.522619247436523, "global_step": 300190, "epoch": 1786} {"train_loss": -12.354608535766602, "global_step": 300191, "epoch": 1786} {"train_loss": -12.483304977416992, "global_step": 300192, "epoch": 1786} {"train_loss": -12.317638397216797, "global_step": 300193, "epoch": 1786} {"train_loss": -12.356340408325195, "global_step": 300194, "epoch": 1786} {"train_loss": -12.380965232849121, "global_step": 300195, "epoch": 1786} {"train_loss": -12.486749649047852, "global_step": 300196, "epoch": 1786} {"train_loss": -12.200796127319336, "global_step": 300197, "epoch": 1786} {"train_loss": -12.151798248291016, "global_step": 300198, "epoch": 1786} {"train_loss": -12.258241653442383, "global_step": 300199, "epoch": 1786} {"train_loss": -12.376993179321289, "global_step": 300200, "epoch": 1786} {"train_loss": -12.133874893188477, "global_step": 300201, "epoch": 1786} {"train_loss": -12.663782119750977, "global_step": 300202, "epoch": 1786} {"train_loss": -12.521766662597656, "global_step": 300203, "epoch": 1786} {"train_loss": -12.120050430297852, "global_step": 300204, "epoch": 1786} {"train_loss": -11.853097915649414, "global_step": 300205, "epoch": 1786} {"train_loss": -11.810872077941895, "global_step": 300206, "epoch": 1786} {"train_loss": -12.270858764648438, "global_step": 300207, "epoch": 1786} {"train_loss": -12.231464385986328, "global_step": 300208, "epoch": 1786} {"train_loss": -10.924911499023438, "global_step": 300209, "epoch": 1786} {"train_loss": -10.025193214416504, "global_step": 300210, "epoch": 1786} {"train_loss": -11.456085205078125, "global_step": 300211, "epoch": 1786} {"train_loss": -11.940420150756836, "global_step": 300212, "epoch": 1786} {"train_loss": -11.554237365722656, "global_step": 300213, "epoch": 1786} {"train_loss": -11.587709426879883, "global_step": 300214, "epoch": 1786} {"train_loss": -11.799250983056568, "global_step": 300215, "epoch": 1786, "val_loss": 278749.03125} {"train_loss": -12.186179161071777, "global_step": 300216, "epoch": 1787} {"train_loss": -11.057777404785156, "global_step": 300217, "epoch": 1787} {"train_loss": -11.48328971862793, "global_step": 300218, "epoch": 1787} {"train_loss": -12.087888717651367, "global_step": 300219, "epoch": 1787} {"train_loss": -11.297903060913086, "global_step": 300220, "epoch": 1787} {"train_loss": -12.295989990234375, "global_step": 300221, "epoch": 1787} {"train_loss": -10.985627174377441, "global_step": 300222, "epoch": 1787} {"train_loss": -10.89773178100586, "global_step": 300223, "epoch": 1787} {"train_loss": -10.695900917053223, "global_step": 300224, "epoch": 1787} {"train_loss": -11.432519912719727, "global_step": 300225, "epoch": 1787} {"train_loss": -10.631368637084961, "global_step": 300226, "epoch": 1787} {"train_loss": -11.39747142791748, "global_step": 300227, "epoch": 1787} {"train_loss": -10.400896072387695, "global_step": 300228, "epoch": 1787} {"train_loss": -10.832006454467773, "global_step": 300229, "epoch": 1787} {"train_loss": -11.617441177368164, "global_step": 300230, "epoch": 1787} {"train_loss": -9.742063522338867, "global_step": 300231, "epoch": 1787} {"train_loss": -10.471637725830078, "global_step": 300232, "epoch": 1787} {"train_loss": -10.874045372009277, "global_step": 300233, "epoch": 1787} {"train_loss": -9.24317741394043, "global_step": 300234, "epoch": 1787} {"train_loss": -11.170844078063965, "global_step": 300235, "epoch": 1787} {"train_loss": -10.744882583618164, "global_step": 300236, "epoch": 1787} {"train_loss": -10.871360778808594, "global_step": 300237, "epoch": 1787} {"train_loss": -11.53681755065918, "global_step": 300238, "epoch": 1787} {"train_loss": -10.980669021606445, "global_step": 300239, "epoch": 1787} {"train_loss": -11.42368221282959, "global_step": 300240, "epoch": 1787} {"train_loss": -11.074528694152832, "global_step": 300241, "epoch": 1787} {"train_loss": -11.146738052368164, "global_step": 300242, "epoch": 1787} {"train_loss": -10.321844100952148, "global_step": 300243, "epoch": 1787} {"train_loss": -10.197978973388672, "global_step": 300244, "epoch": 1787} {"train_loss": -10.284032821655273, "global_step": 300245, "epoch": 1787} {"train_loss": -11.159669876098633, "global_step": 300246, "epoch": 1787} {"train_loss": -10.069318771362305, "global_step": 300247, "epoch": 1787} {"train_loss": -11.193487167358398, "global_step": 300248, "epoch": 1787} {"train_loss": -9.408370971679688, "global_step": 300249, "epoch": 1787} {"train_loss": -11.000792503356934, "global_step": 300250, "epoch": 1787} {"train_loss": -10.987112998962402, "global_step": 300251, "epoch": 1787} {"train_loss": -10.296466827392578, "global_step": 300252, "epoch": 1787} {"train_loss": -11.543449401855469, "global_step": 300253, "epoch": 1787} {"train_loss": -10.416589736938477, "global_step": 300254, "epoch": 1787} {"train_loss": -10.812664031982422, "global_step": 300255, "epoch": 1787} {"train_loss": -11.352048873901367, "global_step": 300256, "epoch": 1787} {"train_loss": -10.822345733642578, "global_step": 300257, "epoch": 1787} {"train_loss": -11.682855606079102, "global_step": 300258, "epoch": 1787} {"train_loss": -11.515202522277832, "global_step": 300259, "epoch": 1787} {"train_loss": -10.795339584350586, "global_step": 300260, "epoch": 1787} {"train_loss": -11.776144027709961, "global_step": 300261, "epoch": 1787} {"train_loss": -10.661663055419922, "global_step": 300262, "epoch": 1787} {"train_loss": -10.718358993530273, "global_step": 300263, "epoch": 1787} {"train_loss": -11.487895965576172, "global_step": 300264, "epoch": 1787} {"train_loss": -10.277776718139648, "global_step": 300265, "epoch": 1787} {"train_loss": -11.416178703308105, "global_step": 300266, "epoch": 1787} {"train_loss": -11.425277709960938, "global_step": 300267, "epoch": 1787} {"train_loss": -10.830133438110352, "global_step": 300268, "epoch": 1787} {"train_loss": -11.773438453674316, "global_step": 300269, "epoch": 1787} {"train_loss": -11.238924026489258, "global_step": 300270, "epoch": 1787} {"train_loss": -11.407207489013672, "global_step": 300271, "epoch": 1787} {"train_loss": -11.932870864868164, "global_step": 300272, "epoch": 1787} {"train_loss": -11.566661834716797, "global_step": 300273, "epoch": 1787} {"train_loss": -11.563947677612305, "global_step": 300274, "epoch": 1787} {"train_loss": -11.7689208984375, "global_step": 300275, "epoch": 1787} {"train_loss": -11.533218383789062, "global_step": 300276, "epoch": 1787} {"train_loss": -11.918438911437988, "global_step": 300277, "epoch": 1787} {"train_loss": -11.716039657592773, "global_step": 300278, "epoch": 1787} {"train_loss": -11.68727970123291, "global_step": 300279, "epoch": 1787} {"train_loss": -11.788206100463867, "global_step": 300280, "epoch": 1787} {"train_loss": -11.471476554870605, "global_step": 300281, "epoch": 1787} {"train_loss": -11.721502304077148, "global_step": 300282, "epoch": 1787} {"train_loss": -11.570256233215332, "global_step": 300283, "epoch": 1787} {"train_loss": -11.738462448120117, "global_step": 300284, "epoch": 1787} {"train_loss": -11.74390697479248, "global_step": 300285, "epoch": 1787} {"train_loss": -11.60879135131836, "global_step": 300286, "epoch": 1787} {"train_loss": -11.853471755981445, "global_step": 300287, "epoch": 1787} {"train_loss": -11.743629455566406, "global_step": 300288, "epoch": 1787} {"train_loss": -11.912282943725586, "global_step": 300289, "epoch": 1787} {"train_loss": -11.952329635620117, "global_step": 300290, "epoch": 1787} {"train_loss": -11.677831649780273, "global_step": 300291, "epoch": 1787} {"train_loss": -12.04246997833252, "global_step": 300292, "epoch": 1787} {"train_loss": -11.91036319732666, "global_step": 300293, "epoch": 1787} {"train_loss": -11.752143859863281, "global_step": 300294, "epoch": 1787} {"train_loss": -12.170351028442383, "global_step": 300295, "epoch": 1787} {"train_loss": -11.97068977355957, "global_step": 300296, "epoch": 1787} {"train_loss": -11.943208694458008, "global_step": 300297, "epoch": 1787} {"train_loss": -12.037965774536133, "global_step": 300298, "epoch": 1787} {"train_loss": -11.865787506103516, "global_step": 300299, "epoch": 1787} {"train_loss": -12.040107727050781, "global_step": 300300, "epoch": 1787} {"train_loss": -12.234613418579102, "global_step": 300301, "epoch": 1787} {"train_loss": -12.171302795410156, "global_step": 300302, "epoch": 1787} {"train_loss": -12.170032501220703, "global_step": 300303, "epoch": 1787} {"train_loss": -12.134697914123535, "global_step": 300304, "epoch": 1787} {"train_loss": -12.069707870483398, "global_step": 300305, "epoch": 1787} {"train_loss": -12.197013854980469, "global_step": 300306, "epoch": 1787} {"train_loss": -12.265632629394531, "global_step": 300307, "epoch": 1787} {"train_loss": -12.351160049438477, "global_step": 300308, "epoch": 1787} {"train_loss": -12.099403381347656, "global_step": 300309, "epoch": 1787} {"train_loss": -12.188467979431152, "global_step": 300310, "epoch": 1787} {"train_loss": -12.194527626037598, "global_step": 300311, "epoch": 1787} {"train_loss": -12.106842994689941, "global_step": 300312, "epoch": 1787} {"train_loss": -12.104107856750488, "global_step": 300313, "epoch": 1787} {"train_loss": -12.27868366241455, "global_step": 300314, "epoch": 1787} {"train_loss": -12.305005073547363, "global_step": 300315, "epoch": 1787} {"train_loss": -12.105809211730957, "global_step": 300316, "epoch": 1787} {"train_loss": -12.210441589355469, "global_step": 300317, "epoch": 1787} {"train_loss": -11.997568130493164, "global_step": 300318, "epoch": 1787} {"train_loss": -12.252998352050781, "global_step": 300319, "epoch": 1787} {"train_loss": -12.00046443939209, "global_step": 300320, "epoch": 1787} {"train_loss": -12.212364196777344, "global_step": 300321, "epoch": 1787} {"train_loss": -11.964498519897461, "global_step": 300322, "epoch": 1787} {"train_loss": -11.84402847290039, "global_step": 300323, "epoch": 1787} {"train_loss": -12.213211059570312, "global_step": 300324, "epoch": 1787} {"train_loss": -12.138638496398926, "global_step": 300325, "epoch": 1787} {"train_loss": -12.192907333374023, "global_step": 300326, "epoch": 1787} {"train_loss": -12.239958763122559, "global_step": 300327, "epoch": 1787} {"train_loss": -12.358667373657227, "global_step": 300328, "epoch": 1787} {"train_loss": -12.404574394226074, "global_step": 300329, "epoch": 1787} {"train_loss": -12.290624618530273, "global_step": 300330, "epoch": 1787} {"train_loss": -12.330842971801758, "global_step": 300331, "epoch": 1787} {"train_loss": -12.390832901000977, "global_step": 300332, "epoch": 1787} {"train_loss": -12.201543807983398, "global_step": 300333, "epoch": 1787} {"train_loss": -12.351652145385742, "global_step": 300334, "epoch": 1787} {"train_loss": -12.453857421875, "global_step": 300335, "epoch": 1787} {"train_loss": -12.443696022033691, "global_step": 300336, "epoch": 1787} {"train_loss": -12.619270324707031, "global_step": 300337, "epoch": 1787} {"train_loss": -12.492019653320312, "global_step": 300338, "epoch": 1787} {"train_loss": -12.27183723449707, "global_step": 300339, "epoch": 1787} {"train_loss": -12.239566802978516, "global_step": 300340, "epoch": 1787} {"train_loss": -12.321313858032227, "global_step": 300341, "epoch": 1787} {"train_loss": -12.54530143737793, "global_step": 300342, "epoch": 1787} {"train_loss": -12.127784729003906, "global_step": 300343, "epoch": 1787} {"train_loss": -12.273324012756348, "global_step": 300344, "epoch": 1787} {"train_loss": -12.122416496276855, "global_step": 300345, "epoch": 1787} {"train_loss": -11.931230545043945, "global_step": 300346, "epoch": 1787} {"train_loss": -11.40254020690918, "global_step": 300347, "epoch": 1787} {"train_loss": -12.3626708984375, "global_step": 300348, "epoch": 1787} {"train_loss": -12.317707061767578, "global_step": 300349, "epoch": 1787} {"train_loss": -11.501739501953125, "global_step": 300350, "epoch": 1787} {"train_loss": -11.42669677734375, "global_step": 300351, "epoch": 1787} {"train_loss": -11.91195297241211, "global_step": 300352, "epoch": 1787} {"train_loss": -11.241178512573242, "global_step": 300353, "epoch": 1787} {"train_loss": -9.740669250488281, "global_step": 300354, "epoch": 1787} {"train_loss": -11.606499671936035, "global_step": 300355, "epoch": 1787} {"train_loss": -9.27885913848877, "global_step": 300356, "epoch": 1787} {"train_loss": -10.225749015808105, "global_step": 300357, "epoch": 1787} {"train_loss": -10.22504997253418, "global_step": 300358, "epoch": 1787} {"train_loss": -10.786944389343262, "global_step": 300359, "epoch": 1787} {"train_loss": -9.75045108795166, "global_step": 300360, "epoch": 1787} {"train_loss": -10.256000518798828, "global_step": 300361, "epoch": 1787} {"train_loss": -11.499235153198242, "global_step": 300362, "epoch": 1787} {"train_loss": -10.001236915588379, "global_step": 300363, "epoch": 1787} {"train_loss": -10.802776336669922, "global_step": 300364, "epoch": 1787} {"train_loss": -9.628299713134766, "global_step": 300365, "epoch": 1787} {"train_loss": -11.271413803100586, "global_step": 300366, "epoch": 1787} {"train_loss": -11.30472183227539, "global_step": 300367, "epoch": 1787} {"train_loss": -11.012025833129883, "global_step": 300368, "epoch": 1787} {"train_loss": -10.322418212890625, "global_step": 300369, "epoch": 1787} {"train_loss": -10.312657356262207, "global_step": 300370, "epoch": 1787} {"train_loss": -9.807965278625488, "global_step": 300371, "epoch": 1787} {"train_loss": -8.478971481323242, "global_step": 300372, "epoch": 1787} {"train_loss": -10.978875160217285, "global_step": 300373, "epoch": 1787} {"train_loss": -9.022014617919922, "global_step": 300374, "epoch": 1787} {"train_loss": -9.992035865783691, "global_step": 300375, "epoch": 1787} {"train_loss": -10.078107833862305, "global_step": 300376, "epoch": 1787} {"train_loss": -11.06584358215332, "global_step": 300377, "epoch": 1787} {"train_loss": -10.301206588745117, "global_step": 300378, "epoch": 1787} {"train_loss": -10.985554695129395, "global_step": 300379, "epoch": 1787} {"train_loss": -11.035785675048828, "global_step": 300380, "epoch": 1787} {"train_loss": -11.33602237701416, "global_step": 300381, "epoch": 1787} {"train_loss": -11.545435905456543, "global_step": 300382, "epoch": 1787} {"train_loss": -11.403426465534029, "global_step": 300383, "epoch": 1787, "val_loss": 276179.875} {"train_loss": -11.322998046875, "global_step": 300384, "epoch": 1788} {"train_loss": -11.842975616455078, "global_step": 300385, "epoch": 1788} {"train_loss": -11.571406364440918, "global_step": 300386, "epoch": 1788} {"train_loss": -11.873899459838867, "global_step": 300387, "epoch": 1788} {"train_loss": -11.857662200927734, "global_step": 300388, "epoch": 1788} {"train_loss": -11.516386985778809, "global_step": 300389, "epoch": 1788} {"train_loss": -11.705879211425781, "global_step": 300390, "epoch": 1788} {"train_loss": -11.726079940795898, "global_step": 300391, "epoch": 1788} {"train_loss": -11.919355392456055, "global_step": 300392, "epoch": 1788} {"train_loss": -11.807958602905273, "global_step": 300393, "epoch": 1788} {"train_loss": -12.04023551940918, "global_step": 300394, "epoch": 1788} {"train_loss": -11.860353469848633, "global_step": 300395, "epoch": 1788} {"train_loss": -11.930102348327637, "global_step": 300396, "epoch": 1788} {"train_loss": -11.78870964050293, "global_step": 300397, "epoch": 1788} {"train_loss": -11.717456817626953, "global_step": 300398, "epoch": 1788} {"train_loss": -12.125986099243164, "global_step": 300399, "epoch": 1788} {"train_loss": -11.868510246276855, "global_step": 300400, "epoch": 1788} {"train_loss": -11.819439888000488, "global_step": 300401, "epoch": 1788} {"train_loss": -12.080469131469727, "global_step": 300402, "epoch": 1788} {"train_loss": -11.933586120605469, "global_step": 300403, "epoch": 1788} {"train_loss": -12.120855331420898, "global_step": 300404, "epoch": 1788} {"train_loss": -12.060251235961914, "global_step": 300405, "epoch": 1788} {"train_loss": -11.979339599609375, "global_step": 300406, "epoch": 1788} {"train_loss": -12.135953903198242, "global_step": 300407, "epoch": 1788} {"train_loss": -11.97011947631836, "global_step": 300408, "epoch": 1788} {"train_loss": -12.082609176635742, "global_step": 300409, "epoch": 1788} {"train_loss": -11.873435974121094, "global_step": 300410, "epoch": 1788} {"train_loss": -12.002504348754883, "global_step": 300411, "epoch": 1788} {"train_loss": -11.946130752563477, "global_step": 300412, "epoch": 1788} {"train_loss": -12.102670669555664, "global_step": 300413, "epoch": 1788} {"train_loss": -11.799736976623535, "global_step": 300414, "epoch": 1788} {"train_loss": -12.229257583618164, "global_step": 300415, "epoch": 1788} {"train_loss": -12.120996475219727, "global_step": 300416, "epoch": 1788} {"train_loss": -12.251104354858398, "global_step": 300417, "epoch": 1788} {"train_loss": -12.062920570373535, "global_step": 300418, "epoch": 1788} {"train_loss": -12.004507064819336, "global_step": 300419, "epoch": 1788} {"train_loss": -12.150064468383789, "global_step": 300420, "epoch": 1788} {"train_loss": -11.96153450012207, "global_step": 300421, "epoch": 1788} {"train_loss": -12.042709350585938, "global_step": 300422, "epoch": 1788} {"train_loss": -12.113359451293945, "global_step": 300423, "epoch": 1788} {"train_loss": -12.405799865722656, "global_step": 300424, "epoch": 1788} {"train_loss": -12.116592407226562, "global_step": 300425, "epoch": 1788} {"train_loss": -12.022686958312988, "global_step": 300426, "epoch": 1788} {"train_loss": -12.239974975585938, "global_step": 300427, "epoch": 1788} {"train_loss": -12.128130912780762, "global_step": 300428, "epoch": 1788} {"train_loss": -12.123550415039062, "global_step": 300429, "epoch": 1788} {"train_loss": -12.313735961914062, "global_step": 300430, "epoch": 1788} {"train_loss": -12.18127155303955, "global_step": 300431, "epoch": 1788} {"train_loss": -12.273879051208496, "global_step": 300432, "epoch": 1788} {"train_loss": -12.205900192260742, "global_step": 300433, "epoch": 1788} {"train_loss": -12.29879093170166, "global_step": 300434, "epoch": 1788} {"train_loss": -12.272045135498047, "global_step": 300435, "epoch": 1788} {"train_loss": -12.377798080444336, "global_step": 300436, "epoch": 1788} {"train_loss": -12.087360382080078, "global_step": 300437, "epoch": 1788} {"train_loss": -12.157073974609375, "global_step": 300438, "epoch": 1788} {"train_loss": -12.119688034057617, "global_step": 300439, "epoch": 1788} {"train_loss": -12.09864330291748, "global_step": 300440, "epoch": 1788} {"train_loss": -12.334210395812988, "global_step": 300441, "epoch": 1788} {"train_loss": -12.024343490600586, "global_step": 300442, "epoch": 1788} {"train_loss": -12.312576293945312, "global_step": 300443, "epoch": 1788} {"train_loss": -11.970671653747559, "global_step": 300444, "epoch": 1788} {"train_loss": -12.279526710510254, "global_step": 300445, "epoch": 1788} {"train_loss": -12.23775863647461, "global_step": 300446, "epoch": 1788} {"train_loss": -12.22347640991211, "global_step": 300447, "epoch": 1788} {"train_loss": -12.501314163208008, "global_step": 300448, "epoch": 1788} {"train_loss": -12.181364059448242, "global_step": 300449, "epoch": 1788} {"train_loss": -12.138786315917969, "global_step": 300450, "epoch": 1788} {"train_loss": -12.321145057678223, "global_step": 300451, "epoch": 1788} {"train_loss": -12.206218719482422, "global_step": 300452, "epoch": 1788} {"train_loss": -12.210285186767578, "global_step": 300453, "epoch": 1788} {"train_loss": -12.155266761779785, "global_step": 300454, "epoch": 1788} {"train_loss": -12.391260147094727, "global_step": 300455, "epoch": 1788} {"train_loss": -12.244550704956055, "global_step": 300456, "epoch": 1788} {"train_loss": -12.211223602294922, "global_step": 300457, "epoch": 1788} {"train_loss": -12.671597480773926, "global_step": 300458, "epoch": 1788} {"train_loss": -12.003497123718262, "global_step": 300459, "epoch": 1788} {"train_loss": -12.37092399597168, "global_step": 300460, "epoch": 1788} {"train_loss": -12.441385269165039, "global_step": 300461, "epoch": 1788} {"train_loss": -12.322629928588867, "global_step": 300462, "epoch": 1788} {"train_loss": -12.146232604980469, "global_step": 300463, "epoch": 1788} {"train_loss": -12.198604583740234, "global_step": 300464, "epoch": 1788} {"train_loss": -11.97485065460205, "global_step": 300465, "epoch": 1788} {"train_loss": -12.157236099243164, "global_step": 300466, "epoch": 1788} {"train_loss": -11.69277286529541, "global_step": 300467, "epoch": 1788} {"train_loss": -11.772332191467285, "global_step": 300468, "epoch": 1788} {"train_loss": -11.613547325134277, "global_step": 300469, "epoch": 1788} {"train_loss": -11.484806060791016, "global_step": 300470, "epoch": 1788} {"train_loss": -11.72828483581543, "global_step": 300471, "epoch": 1788} {"train_loss": -10.928255081176758, "global_step": 300472, "epoch": 1788} {"train_loss": -10.938793182373047, "global_step": 300473, "epoch": 1788} {"train_loss": -10.580329895019531, "global_step": 300474, "epoch": 1788} {"train_loss": -11.333273887634277, "global_step": 300475, "epoch": 1788} {"train_loss": -11.39453125, "global_step": 300476, "epoch": 1788} {"train_loss": -12.003010749816895, "global_step": 300477, "epoch": 1788} {"train_loss": -11.012859344482422, "global_step": 300478, "epoch": 1788} {"train_loss": -11.852654457092285, "global_step": 300479, "epoch": 1788} {"train_loss": -11.940694808959961, "global_step": 300480, "epoch": 1788} {"train_loss": -12.060932159423828, "global_step": 300481, "epoch": 1788} {"train_loss": -11.169143676757812, "global_step": 300482, "epoch": 1788} {"train_loss": -11.925539016723633, "global_step": 300483, "epoch": 1788} {"train_loss": -11.671351432800293, "global_step": 300484, "epoch": 1788} {"train_loss": -11.242118835449219, "global_step": 300485, "epoch": 1788} {"train_loss": -11.547741889953613, "global_step": 300486, "epoch": 1788} {"train_loss": -11.454855918884277, "global_step": 300487, "epoch": 1788} {"train_loss": -11.169408798217773, "global_step": 300488, "epoch": 1788} {"train_loss": -11.556610107421875, "global_step": 300489, "epoch": 1788} {"train_loss": -11.775717735290527, "global_step": 300490, "epoch": 1788} {"train_loss": -11.378847122192383, "global_step": 300491, "epoch": 1788} {"train_loss": -11.504735946655273, "global_step": 300492, "epoch": 1788} {"train_loss": -11.597074508666992, "global_step": 300493, "epoch": 1788} {"train_loss": -10.037158012390137, "global_step": 300494, "epoch": 1788} {"train_loss": -11.177919387817383, "global_step": 300495, "epoch": 1788} {"train_loss": -11.214705467224121, "global_step": 300496, "epoch": 1788} {"train_loss": -11.477741241455078, "global_step": 300497, "epoch": 1788} {"train_loss": -11.269054412841797, "global_step": 300498, "epoch": 1788} {"train_loss": -12.161638259887695, "global_step": 300499, "epoch": 1788} {"train_loss": -11.735783576965332, "global_step": 300500, "epoch": 1788} {"train_loss": -11.997108459472656, "global_step": 300501, "epoch": 1788} {"train_loss": -11.56163501739502, "global_step": 300502, "epoch": 1788} {"train_loss": -11.96151065826416, "global_step": 300503, "epoch": 1788} {"train_loss": -11.935565948486328, "global_step": 300504, "epoch": 1788} {"train_loss": -12.066749572753906, "global_step": 300505, "epoch": 1788} {"train_loss": -11.903027534484863, "global_step": 300506, "epoch": 1788} {"train_loss": -11.88237190246582, "global_step": 300507, "epoch": 1788} {"train_loss": -11.973883628845215, "global_step": 300508, "epoch": 1788} {"train_loss": -12.016597747802734, "global_step": 300509, "epoch": 1788} {"train_loss": -12.085897445678711, "global_step": 300510, "epoch": 1788} {"train_loss": -12.010229110717773, "global_step": 300511, "epoch": 1788} {"train_loss": -11.769088745117188, "global_step": 300512, "epoch": 1788} {"train_loss": -12.024497985839844, "global_step": 300513, "epoch": 1788} {"train_loss": -12.025832176208496, "global_step": 300514, "epoch": 1788} {"train_loss": -12.035619735717773, "global_step": 300515, "epoch": 1788} {"train_loss": -11.93368148803711, "global_step": 300516, "epoch": 1788} {"train_loss": -12.065102577209473, "global_step": 300517, "epoch": 1788} {"train_loss": -11.979677200317383, "global_step": 300518, "epoch": 1788} {"train_loss": -12.051069259643555, "global_step": 300519, "epoch": 1788} {"train_loss": -12.133458137512207, "global_step": 300520, "epoch": 1788} {"train_loss": -12.081037521362305, "global_step": 300521, "epoch": 1788} {"train_loss": -12.179872512817383, "global_step": 300522, "epoch": 1788} {"train_loss": -12.149900436401367, "global_step": 300523, "epoch": 1788} {"train_loss": -12.30345344543457, "global_step": 300524, "epoch": 1788} {"train_loss": -11.83859634399414, "global_step": 300525, "epoch": 1788} {"train_loss": -12.420086860656738, "global_step": 300526, "epoch": 1788} {"train_loss": -12.14027214050293, "global_step": 300527, "epoch": 1788} {"train_loss": -12.197137832641602, "global_step": 300528, "epoch": 1788} {"train_loss": -12.093755722045898, "global_step": 300529, "epoch": 1788} {"train_loss": -11.929298400878906, "global_step": 300530, "epoch": 1788} {"train_loss": -11.975000381469727, "global_step": 300531, "epoch": 1788} {"train_loss": -12.345949172973633, "global_step": 300532, "epoch": 1788} {"train_loss": -12.075494766235352, "global_step": 300533, "epoch": 1788} {"train_loss": -12.183958053588867, "global_step": 300534, "epoch": 1788} {"train_loss": -12.216614723205566, "global_step": 300535, "epoch": 1788} {"train_loss": -12.223384857177734, "global_step": 300536, "epoch": 1788} {"train_loss": -12.441057205200195, "global_step": 300537, "epoch": 1788} {"train_loss": -12.37488079071045, "global_step": 300538, "epoch": 1788} {"train_loss": -11.992568016052246, "global_step": 300539, "epoch": 1788} {"train_loss": -12.157964706420898, "global_step": 300540, "epoch": 1788} {"train_loss": -12.438599586486816, "global_step": 300541, "epoch": 1788} {"train_loss": -12.30883502960205, "global_step": 300542, "epoch": 1788} {"train_loss": -12.035677909851074, "global_step": 300543, "epoch": 1788} {"train_loss": -12.256383895874023, "global_step": 300544, "epoch": 1788} {"train_loss": -12.282085418701172, "global_step": 300545, "epoch": 1788} {"train_loss": -12.409271240234375, "global_step": 300546, "epoch": 1788} {"train_loss": -12.587160110473633, "global_step": 300547, "epoch": 1788} {"train_loss": -12.38371467590332, "global_step": 300548, "epoch": 1788} {"train_loss": -12.458770751953125, "global_step": 300549, "epoch": 1788} {"train_loss": -12.346847534179688, "global_step": 300550, "epoch": 1788} {"train_loss": -11.970801205862136, "global_step": 300551, "epoch": 1788, "val_loss": 281532.0625} {"train_loss": -12.41130256652832, "global_step": 300552, "epoch": 1789} {"train_loss": -12.521796226501465, "global_step": 300553, "epoch": 1789} {"train_loss": -12.404534339904785, "global_step": 300554, "epoch": 1789} {"train_loss": -12.529293060302734, "global_step": 300555, "epoch": 1789} {"train_loss": -12.35360336303711, "global_step": 300556, "epoch": 1789} {"train_loss": -12.294544219970703, "global_step": 300557, "epoch": 1789} {"train_loss": -12.465991973876953, "global_step": 300558, "epoch": 1789} {"train_loss": -12.405013084411621, "global_step": 300559, "epoch": 1789} {"train_loss": -12.15163803100586, "global_step": 300560, "epoch": 1789} {"train_loss": -12.592819213867188, "global_step": 300561, "epoch": 1789} {"train_loss": -12.30848503112793, "global_step": 300562, "epoch": 1789} {"train_loss": -12.334358215332031, "global_step": 300563, "epoch": 1789} {"train_loss": -12.404756546020508, "global_step": 300564, "epoch": 1789} {"train_loss": -12.187620162963867, "global_step": 300565, "epoch": 1789} {"train_loss": -12.058317184448242, "global_step": 300566, "epoch": 1789} {"train_loss": -12.28995132446289, "global_step": 300567, "epoch": 1789} {"train_loss": -12.440454483032227, "global_step": 300568, "epoch": 1789} {"train_loss": -11.994072914123535, "global_step": 300569, "epoch": 1789} {"train_loss": -12.30198860168457, "global_step": 300570, "epoch": 1789} {"train_loss": -12.18934154510498, "global_step": 300571, "epoch": 1789} {"train_loss": -12.068838119506836, "global_step": 300572, "epoch": 1789} {"train_loss": -11.960996627807617, "global_step": 300573, "epoch": 1789} {"train_loss": -11.763826370239258, "global_step": 300574, "epoch": 1789} {"train_loss": -11.387325286865234, "global_step": 300575, "epoch": 1789} {"train_loss": -11.939519882202148, "global_step": 300576, "epoch": 1789} {"train_loss": -11.964462280273438, "global_step": 300577, "epoch": 1789} {"train_loss": -11.714654922485352, "global_step": 300578, "epoch": 1789} {"train_loss": -11.659952163696289, "global_step": 300579, "epoch": 1789} {"train_loss": -11.193453788757324, "global_step": 300580, "epoch": 1789} {"train_loss": -12.098628997802734, "global_step": 300581, "epoch": 1789} {"train_loss": -11.424539566040039, "global_step": 300582, "epoch": 1789} {"train_loss": -11.84022045135498, "global_step": 300583, "epoch": 1789} {"train_loss": -11.547362327575684, "global_step": 300584, "epoch": 1789} {"train_loss": -11.933927536010742, "global_step": 300585, "epoch": 1789} {"train_loss": -12.274831771850586, "global_step": 300586, "epoch": 1789} {"train_loss": -11.907690048217773, "global_step": 300587, "epoch": 1789} {"train_loss": -11.478515625, "global_step": 300588, "epoch": 1789} {"train_loss": -11.433304786682129, "global_step": 300589, "epoch": 1789} {"train_loss": -12.128073692321777, "global_step": 300590, "epoch": 1789} {"train_loss": -11.535422325134277, "global_step": 300591, "epoch": 1789} {"train_loss": -10.826854705810547, "global_step": 300592, "epoch": 1789} {"train_loss": -11.6022310256958, "global_step": 300593, "epoch": 1789} {"train_loss": -12.012044906616211, "global_step": 300594, "epoch": 1789} {"train_loss": -10.736120223999023, "global_step": 300595, "epoch": 1789} {"train_loss": -11.404890060424805, "global_step": 300596, "epoch": 1789} {"train_loss": -11.155708312988281, "global_step": 300597, "epoch": 1789} {"train_loss": -10.643759727478027, "global_step": 300598, "epoch": 1789} {"train_loss": -11.719779014587402, "global_step": 300599, "epoch": 1789} {"train_loss": -12.07619857788086, "global_step": 300600, "epoch": 1789} {"train_loss": -11.589570999145508, "global_step": 300601, "epoch": 1789} {"train_loss": -11.880435943603516, "global_step": 300602, "epoch": 1789} {"train_loss": -11.769281387329102, "global_step": 300603, "epoch": 1789} {"train_loss": -11.664721488952637, "global_step": 300604, "epoch": 1789} {"train_loss": -11.105154037475586, "global_step": 300605, "epoch": 1789} {"train_loss": -11.375997543334961, "global_step": 300606, "epoch": 1789} {"train_loss": -11.950002670288086, "global_step": 300607, "epoch": 1789} {"train_loss": -12.005918502807617, "global_step": 300608, "epoch": 1789} {"train_loss": -11.899632453918457, "global_step": 300609, "epoch": 1789} {"train_loss": -11.698328018188477, "global_step": 300610, "epoch": 1789} {"train_loss": -11.982519149780273, "global_step": 300611, "epoch": 1789} {"train_loss": -11.182024002075195, "global_step": 300612, "epoch": 1789} {"train_loss": -12.214031219482422, "global_step": 300613, "epoch": 1789} {"train_loss": -11.010457038879395, "global_step": 300614, "epoch": 1789} {"train_loss": -12.163326263427734, "global_step": 300615, "epoch": 1789} {"train_loss": -10.754961013793945, "global_step": 300616, "epoch": 1789} {"train_loss": -12.173027038574219, "global_step": 300617, "epoch": 1789} {"train_loss": -11.683403968811035, "global_step": 300618, "epoch": 1789} {"train_loss": -11.921647071838379, "global_step": 300619, "epoch": 1789} {"train_loss": -11.481046676635742, "global_step": 300620, "epoch": 1789} {"train_loss": -11.812034606933594, "global_step": 300621, "epoch": 1789} {"train_loss": -11.872417449951172, "global_step": 300622, "epoch": 1789} {"train_loss": -11.54680061340332, "global_step": 300623, "epoch": 1789} {"train_loss": -11.491620063781738, "global_step": 300624, "epoch": 1789} {"train_loss": -11.801355361938477, "global_step": 300625, "epoch": 1789} {"train_loss": -11.544407844543457, "global_step": 300626, "epoch": 1789} {"train_loss": -11.567251205444336, "global_step": 300627, "epoch": 1789} {"train_loss": -11.441381454467773, "global_step": 300628, "epoch": 1789} {"train_loss": -11.251564025878906, "global_step": 300629, "epoch": 1789} {"train_loss": -11.945524215698242, "global_step": 300630, "epoch": 1789} {"train_loss": -11.793670654296875, "global_step": 300631, "epoch": 1789} {"train_loss": -11.930621147155762, "global_step": 300632, "epoch": 1789} {"train_loss": -11.741358757019043, "global_step": 300633, "epoch": 1789} {"train_loss": -12.052124977111816, "global_step": 300634, "epoch": 1789} {"train_loss": -11.885639190673828, "global_step": 300635, "epoch": 1789} {"train_loss": -12.103524208068848, "global_step": 300636, "epoch": 1789} {"train_loss": -11.718522071838379, "global_step": 300637, "epoch": 1789} {"train_loss": -12.182611465454102, "global_step": 300638, "epoch": 1789} {"train_loss": -11.444148063659668, "global_step": 300639, "epoch": 1789} {"train_loss": -11.912257194519043, "global_step": 300640, "epoch": 1789} {"train_loss": -11.916655540466309, "global_step": 300641, "epoch": 1789} {"train_loss": -11.457643508911133, "global_step": 300642, "epoch": 1789} {"train_loss": -12.098064422607422, "global_step": 300643, "epoch": 1789} {"train_loss": -10.709098815917969, "global_step": 300644, "epoch": 1789} {"train_loss": -12.142620086669922, "global_step": 300645, "epoch": 1789} {"train_loss": -10.867149353027344, "global_step": 300646, "epoch": 1789} {"train_loss": -11.682657241821289, "global_step": 300647, "epoch": 1789} {"train_loss": -11.865459442138672, "global_step": 300648, "epoch": 1789} {"train_loss": -11.4105863571167, "global_step": 300649, "epoch": 1789} {"train_loss": -11.899872779846191, "global_step": 300650, "epoch": 1789} {"train_loss": -10.689125061035156, "global_step": 300651, "epoch": 1789} {"train_loss": -12.425569534301758, "global_step": 300652, "epoch": 1789} {"train_loss": -10.622645378112793, "global_step": 300653, "epoch": 1789} {"train_loss": -11.927309036254883, "global_step": 300654, "epoch": 1789} {"train_loss": -11.083381652832031, "global_step": 300655, "epoch": 1789} {"train_loss": -11.646584510803223, "global_step": 300656, "epoch": 1789} {"train_loss": -11.439149856567383, "global_step": 300657, "epoch": 1789} {"train_loss": -11.792818069458008, "global_step": 300658, "epoch": 1789} {"train_loss": -11.820405006408691, "global_step": 300659, "epoch": 1789} {"train_loss": -11.520524978637695, "global_step": 300660, "epoch": 1789} {"train_loss": -12.002006530761719, "global_step": 300661, "epoch": 1789} {"train_loss": -11.82116413116455, "global_step": 300662, "epoch": 1789} {"train_loss": -11.684799194335938, "global_step": 300663, "epoch": 1789} {"train_loss": -11.772483825683594, "global_step": 300664, "epoch": 1789} {"train_loss": -11.814775466918945, "global_step": 300665, "epoch": 1789} {"train_loss": -11.91217041015625, "global_step": 300666, "epoch": 1789} {"train_loss": -11.861871719360352, "global_step": 300667, "epoch": 1789} {"train_loss": -11.95462417602539, "global_step": 300668, "epoch": 1789} {"train_loss": -11.757519721984863, "global_step": 300669, "epoch": 1789} {"train_loss": -12.091300964355469, "global_step": 300670, "epoch": 1789} {"train_loss": -11.47365951538086, "global_step": 300671, "epoch": 1789} {"train_loss": -11.674202919006348, "global_step": 300672, "epoch": 1789} {"train_loss": -10.520269393920898, "global_step": 300673, "epoch": 1789} {"train_loss": -12.114554405212402, "global_step": 300674, "epoch": 1789} {"train_loss": -11.662724494934082, "global_step": 300675, "epoch": 1789} {"train_loss": -11.035179138183594, "global_step": 300676, "epoch": 1789} {"train_loss": -11.638575553894043, "global_step": 300677, "epoch": 1789} {"train_loss": -11.723970413208008, "global_step": 300678, "epoch": 1789} {"train_loss": -10.873991012573242, "global_step": 300679, "epoch": 1789} {"train_loss": -11.413127899169922, "global_step": 300680, "epoch": 1789} {"train_loss": -11.435916900634766, "global_step": 300681, "epoch": 1789} {"train_loss": -11.72782039642334, "global_step": 300682, "epoch": 1789} {"train_loss": -11.134425163269043, "global_step": 300683, "epoch": 1789} {"train_loss": -11.818857192993164, "global_step": 300684, "epoch": 1789} {"train_loss": -11.364182472229004, "global_step": 300685, "epoch": 1789} {"train_loss": -11.66677474975586, "global_step": 300686, "epoch": 1789} {"train_loss": -12.23403549194336, "global_step": 300687, "epoch": 1789} {"train_loss": -11.582975387573242, "global_step": 300688, "epoch": 1789} {"train_loss": -12.020170211791992, "global_step": 300689, "epoch": 1789} {"train_loss": -11.775318145751953, "global_step": 300690, "epoch": 1789} {"train_loss": -11.690442085266113, "global_step": 300691, "epoch": 1789} {"train_loss": -11.731729507446289, "global_step": 300692, "epoch": 1789} {"train_loss": -12.077345848083496, "global_step": 300693, "epoch": 1789} {"train_loss": -11.83464241027832, "global_step": 300694, "epoch": 1789} {"train_loss": -11.96213150024414, "global_step": 300695, "epoch": 1789} {"train_loss": -11.960433959960938, "global_step": 300696, "epoch": 1789} {"train_loss": -11.856406211853027, "global_step": 300697, "epoch": 1789} {"train_loss": -12.054773330688477, "global_step": 300698, "epoch": 1789} {"train_loss": -12.031660079956055, "global_step": 300699, "epoch": 1789} {"train_loss": -12.099862098693848, "global_step": 300700, "epoch": 1789} {"train_loss": -12.207954406738281, "global_step": 300701, "epoch": 1789} {"train_loss": -12.030618667602539, "global_step": 300702, "epoch": 1789} {"train_loss": -11.962808609008789, "global_step": 300703, "epoch": 1789} {"train_loss": -12.342340469360352, "global_step": 300704, "epoch": 1789} {"train_loss": -12.089134216308594, "global_step": 300705, "epoch": 1789} {"train_loss": -12.038640975952148, "global_step": 300706, "epoch": 1789} {"train_loss": -12.172673225402832, "global_step": 300707, "epoch": 1789} {"train_loss": -12.069028854370117, "global_step": 300708, "epoch": 1789} {"train_loss": -12.144601821899414, "global_step": 300709, "epoch": 1789} {"train_loss": -12.15559196472168, "global_step": 300710, "epoch": 1789} {"train_loss": -12.037310600280762, "global_step": 300711, "epoch": 1789} {"train_loss": -12.175539016723633, "global_step": 300712, "epoch": 1789} {"train_loss": -12.09685230255127, "global_step": 300713, "epoch": 1789} {"train_loss": -11.78265380859375, "global_step": 300714, "epoch": 1789} {"train_loss": -11.789617538452148, "global_step": 300715, "epoch": 1789} {"train_loss": -12.30501651763916, "global_step": 300716, "epoch": 1789} {"train_loss": -11.798389434814453, "global_step": 300717, "epoch": 1789} {"train_loss": -12.183507919311523, "global_step": 300718, "epoch": 1789} {"train_loss": -11.797083741142636, "global_step": 300719, "epoch": 1789, "val_loss": 279807.0625} {"train_loss": -12.060829162597656, "global_step": 300720, "epoch": 1790} {"train_loss": -12.277203559875488, "global_step": 300721, "epoch": 1790} {"train_loss": -12.203399658203125, "global_step": 300722, "epoch": 1790} {"train_loss": -12.120755195617676, "global_step": 300723, "epoch": 1790} {"train_loss": -12.344176292419434, "global_step": 300724, "epoch": 1790} {"train_loss": -12.44414234161377, "global_step": 300725, "epoch": 1790} {"train_loss": -12.401832580566406, "global_step": 300726, "epoch": 1790} {"train_loss": -12.27322006225586, "global_step": 300727, "epoch": 1790} {"train_loss": -12.02029037475586, "global_step": 300728, "epoch": 1790} {"train_loss": -12.245429039001465, "global_step": 300729, "epoch": 1790} {"train_loss": -12.410033226013184, "global_step": 300730, "epoch": 1790} {"train_loss": -12.390264511108398, "global_step": 300731, "epoch": 1790} {"train_loss": -12.18280029296875, "global_step": 300732, "epoch": 1790} {"train_loss": -12.378754615783691, "global_step": 300733, "epoch": 1790} {"train_loss": -12.105586051940918, "global_step": 300734, "epoch": 1790} {"train_loss": -12.174797058105469, "global_step": 300735, "epoch": 1790} {"train_loss": -12.118897438049316, "global_step": 300736, "epoch": 1790} {"train_loss": -12.134744644165039, "global_step": 300737, "epoch": 1790} {"train_loss": -11.630033493041992, "global_step": 300738, "epoch": 1790} {"train_loss": -12.210857391357422, "global_step": 300739, "epoch": 1790} {"train_loss": -12.088126182556152, "global_step": 300740, "epoch": 1790} {"train_loss": -11.374704360961914, "global_step": 300741, "epoch": 1790} {"train_loss": -11.907584190368652, "global_step": 300742, "epoch": 1790} {"train_loss": -11.859050750732422, "global_step": 300743, "epoch": 1790} {"train_loss": -11.594736099243164, "global_step": 300744, "epoch": 1790} {"train_loss": -12.054595947265625, "global_step": 300745, "epoch": 1790} {"train_loss": -11.793150901794434, "global_step": 300746, "epoch": 1790} {"train_loss": -11.957155227661133, "global_step": 300747, "epoch": 1790} {"train_loss": -11.832443237304688, "global_step": 300748, "epoch": 1790} {"train_loss": -11.994184494018555, "global_step": 300749, "epoch": 1790} {"train_loss": -11.918033599853516, "global_step": 300750, "epoch": 1790} {"train_loss": -11.278980255126953, "global_step": 300751, "epoch": 1790} {"train_loss": -11.37077522277832, "global_step": 300752, "epoch": 1790} {"train_loss": -11.176523208618164, "global_step": 300753, "epoch": 1790} {"train_loss": -11.240234375, "global_step": 300754, "epoch": 1790} {"train_loss": -11.49799633026123, "global_step": 300755, "epoch": 1790} {"train_loss": -10.931471824645996, "global_step": 300756, "epoch": 1790} {"train_loss": -11.135226249694824, "global_step": 300757, "epoch": 1790} {"train_loss": -11.427943229675293, "global_step": 300758, "epoch": 1790} {"train_loss": -11.295215606689453, "global_step": 300759, "epoch": 1790} {"train_loss": -11.713431358337402, "global_step": 300760, "epoch": 1790} {"train_loss": -10.729816436767578, "global_step": 300761, "epoch": 1790} {"train_loss": -11.60864543914795, "global_step": 300762, "epoch": 1790} {"train_loss": -11.561342239379883, "global_step": 300763, "epoch": 1790} {"train_loss": -10.645417213439941, "global_step": 300764, "epoch": 1790} {"train_loss": -11.529937744140625, "global_step": 300765, "epoch": 1790} {"train_loss": -11.646297454833984, "global_step": 300766, "epoch": 1790} {"train_loss": -11.824394226074219, "global_step": 300767, "epoch": 1790} {"train_loss": -11.735635757446289, "global_step": 300768, "epoch": 1790} {"train_loss": -11.912128448486328, "global_step": 300769, "epoch": 1790} {"train_loss": -11.154077529907227, "global_step": 300770, "epoch": 1790} {"train_loss": -12.38557243347168, "global_step": 300771, "epoch": 1790} {"train_loss": -11.135364532470703, "global_step": 300772, "epoch": 1790} {"train_loss": -11.186480522155762, "global_step": 300773, "epoch": 1790} {"train_loss": -11.992610931396484, "global_step": 300774, "epoch": 1790} {"train_loss": -11.154911041259766, "global_step": 300775, "epoch": 1790} {"train_loss": -11.805928230285645, "global_step": 300776, "epoch": 1790} {"train_loss": -11.634672164916992, "global_step": 300777, "epoch": 1790} {"train_loss": -12.135438919067383, "global_step": 300778, "epoch": 1790} {"train_loss": -11.680793762207031, "global_step": 300779, "epoch": 1790} {"train_loss": -11.70806884765625, "global_step": 300780, "epoch": 1790} {"train_loss": -11.967306137084961, "global_step": 300781, "epoch": 1790} {"train_loss": -11.881450653076172, "global_step": 300782, "epoch": 1790} {"train_loss": -11.946321487426758, "global_step": 300783, "epoch": 1790} {"train_loss": -12.107829093933105, "global_step": 300784, "epoch": 1790} {"train_loss": -11.432938575744629, "global_step": 300785, "epoch": 1790} {"train_loss": -11.974781036376953, "global_step": 300786, "epoch": 1790} {"train_loss": -11.7062406539917, "global_step": 300787, "epoch": 1790} {"train_loss": -12.049201011657715, "global_step": 300788, "epoch": 1790} {"train_loss": -11.907415390014648, "global_step": 300789, "epoch": 1790} {"train_loss": -12.144710540771484, "global_step": 300790, "epoch": 1790} {"train_loss": -11.931260108947754, "global_step": 300791, "epoch": 1790} {"train_loss": -11.939953804016113, "global_step": 300792, "epoch": 1790} {"train_loss": -12.117388725280762, "global_step": 300793, "epoch": 1790} {"train_loss": -11.993890762329102, "global_step": 300794, "epoch": 1790} {"train_loss": -12.114612579345703, "global_step": 300795, "epoch": 1790} {"train_loss": -11.481059074401855, "global_step": 300796, "epoch": 1790} {"train_loss": -11.234574317932129, "global_step": 300797, "epoch": 1790} {"train_loss": -12.185724258422852, "global_step": 300798, "epoch": 1790} {"train_loss": -11.908590316772461, "global_step": 300799, "epoch": 1790} {"train_loss": -11.859704971313477, "global_step": 300800, "epoch": 1790} {"train_loss": -12.199272155761719, "global_step": 300801, "epoch": 1790} {"train_loss": -11.83774185180664, "global_step": 300802, "epoch": 1790} {"train_loss": -12.154293060302734, "global_step": 300803, "epoch": 1790} {"train_loss": -12.059144020080566, "global_step": 300804, "epoch": 1790} {"train_loss": -12.076406478881836, "global_step": 300805, "epoch": 1790} {"train_loss": -11.858755111694336, "global_step": 300806, "epoch": 1790} {"train_loss": -11.656630516052246, "global_step": 300807, "epoch": 1790} {"train_loss": -12.194751739501953, "global_step": 300808, "epoch": 1790} {"train_loss": -11.950826644897461, "global_step": 300809, "epoch": 1790} {"train_loss": -12.11033821105957, "global_step": 300810, "epoch": 1790} {"train_loss": -12.191230773925781, "global_step": 300811, "epoch": 1790} {"train_loss": -12.055147171020508, "global_step": 300812, "epoch": 1790} {"train_loss": -12.076183319091797, "global_step": 300813, "epoch": 1790} {"train_loss": -12.195022583007812, "global_step": 300814, "epoch": 1790} {"train_loss": -11.950386047363281, "global_step": 300815, "epoch": 1790} {"train_loss": -11.770917892456055, "global_step": 300816, "epoch": 1790} {"train_loss": -12.375221252441406, "global_step": 300817, "epoch": 1790} {"train_loss": -11.93801498413086, "global_step": 300818, "epoch": 1790} {"train_loss": -12.197296142578125, "global_step": 300819, "epoch": 1790} {"train_loss": -12.077460289001465, "global_step": 300820, "epoch": 1790} {"train_loss": -12.113668441772461, "global_step": 300821, "epoch": 1790} {"train_loss": -12.098993301391602, "global_step": 300822, "epoch": 1790} {"train_loss": -12.149856567382812, "global_step": 300823, "epoch": 1790} {"train_loss": -12.417762756347656, "global_step": 300824, "epoch": 1790} {"train_loss": -11.890875816345215, "global_step": 300825, "epoch": 1790} {"train_loss": -12.247004508972168, "global_step": 300826, "epoch": 1790} {"train_loss": -12.2106351852417, "global_step": 300827, "epoch": 1790} {"train_loss": -12.18266487121582, "global_step": 300828, "epoch": 1790} {"train_loss": -11.856060028076172, "global_step": 300829, "epoch": 1790} {"train_loss": -12.325319290161133, "global_step": 300830, "epoch": 1790} {"train_loss": -12.070311546325684, "global_step": 300831, "epoch": 1790} {"train_loss": -11.748706817626953, "global_step": 300832, "epoch": 1790} {"train_loss": -12.236462593078613, "global_step": 300833, "epoch": 1790} {"train_loss": -11.926565170288086, "global_step": 300834, "epoch": 1790} {"train_loss": -12.129378318786621, "global_step": 300835, "epoch": 1790} {"train_loss": -12.018604278564453, "global_step": 300836, "epoch": 1790} {"train_loss": -12.001815795898438, "global_step": 300837, "epoch": 1790} {"train_loss": -11.278369903564453, "global_step": 300838, "epoch": 1790} {"train_loss": -10.9317626953125, "global_step": 300839, "epoch": 1790} {"train_loss": -11.311850547790527, "global_step": 300840, "epoch": 1790} {"train_loss": -12.160137176513672, "global_step": 300841, "epoch": 1790} {"train_loss": -10.673585891723633, "global_step": 300842, "epoch": 1790} {"train_loss": -12.014095306396484, "global_step": 300843, "epoch": 1790} {"train_loss": -11.653712272644043, "global_step": 300844, "epoch": 1790} {"train_loss": -11.700942993164062, "global_step": 300845, "epoch": 1790} {"train_loss": -11.91916275024414, "global_step": 300846, "epoch": 1790} {"train_loss": -11.767362594604492, "global_step": 300847, "epoch": 1790} {"train_loss": -11.475397109985352, "global_step": 300848, "epoch": 1790} {"train_loss": -12.070056915283203, "global_step": 300849, "epoch": 1790} {"train_loss": -11.444829940795898, "global_step": 300850, "epoch": 1790} {"train_loss": -12.229202270507812, "global_step": 300851, "epoch": 1790} {"train_loss": -11.549816131591797, "global_step": 300852, "epoch": 1790} {"train_loss": -11.51952838897705, "global_step": 300853, "epoch": 1790} {"train_loss": -11.589515686035156, "global_step": 300854, "epoch": 1790} {"train_loss": -11.512929916381836, "global_step": 300855, "epoch": 1790} {"train_loss": -12.27676773071289, "global_step": 300856, "epoch": 1790} {"train_loss": -11.524295806884766, "global_step": 300857, "epoch": 1790} {"train_loss": -11.836427688598633, "global_step": 300858, "epoch": 1790} {"train_loss": -11.985581398010254, "global_step": 300859, "epoch": 1790} {"train_loss": -11.71717643737793, "global_step": 300860, "epoch": 1790} {"train_loss": -12.08201789855957, "global_step": 300861, "epoch": 1790} {"train_loss": -11.55723762512207, "global_step": 300862, "epoch": 1790} {"train_loss": -11.484594345092773, "global_step": 300863, "epoch": 1790} {"train_loss": -11.826851844787598, "global_step": 300864, "epoch": 1790} {"train_loss": -11.326123237609863, "global_step": 300865, "epoch": 1790} {"train_loss": -11.97906494140625, "global_step": 300866, "epoch": 1790} {"train_loss": -11.62593936920166, "global_step": 300867, "epoch": 1790} {"train_loss": -11.982470512390137, "global_step": 300868, "epoch": 1790} {"train_loss": -11.3388671875, "global_step": 300869, "epoch": 1790} {"train_loss": -12.169107437133789, "global_step": 300870, "epoch": 1790} {"train_loss": -11.231061935424805, "global_step": 300871, "epoch": 1790} {"train_loss": -11.801794052124023, "global_step": 300872, "epoch": 1790} {"train_loss": -11.473630905151367, "global_step": 300873, "epoch": 1790} {"train_loss": -11.362314224243164, "global_step": 300874, "epoch": 1790} {"train_loss": -11.25643539428711, "global_step": 300875, "epoch": 1790} {"train_loss": -11.778995513916016, "global_step": 300876, "epoch": 1790} {"train_loss": -11.692506790161133, "global_step": 300877, "epoch": 1790} {"train_loss": -11.801692962646484, "global_step": 300878, "epoch": 1790} {"train_loss": -11.911253929138184, "global_step": 300879, "epoch": 1790} {"train_loss": -11.95656967163086, "global_step": 300880, "epoch": 1790} {"train_loss": -11.46066951751709, "global_step": 300881, "epoch": 1790} {"train_loss": -12.240320205688477, "global_step": 300882, "epoch": 1790} {"train_loss": -11.681694030761719, "global_step": 300883, "epoch": 1790} {"train_loss": -12.03795051574707, "global_step": 300884, "epoch": 1790} {"train_loss": -12.066442489624023, "global_step": 300885, "epoch": 1790} {"train_loss": -11.820539474487305, "global_step": 300886, "epoch": 1790} {"train_loss": -11.836673770632062, "global_step": 300887, "epoch": 1790, "val_loss": 283011.03125, "train_action_mse_error": 6.483133316040039} {"train_loss": -11.814865112304688, "global_step": 300888, "epoch": 1791} {"train_loss": -12.074607849121094, "global_step": 300889, "epoch": 1791} {"train_loss": -12.304962158203125, "global_step": 300890, "epoch": 1791} {"train_loss": -12.016490936279297, "global_step": 300891, "epoch": 1791} {"train_loss": -12.189645767211914, "global_step": 300892, "epoch": 1791} {"train_loss": -11.972511291503906, "global_step": 300893, "epoch": 1791} {"train_loss": -11.077531814575195, "global_step": 300894, "epoch": 1791} {"train_loss": -12.026697158813477, "global_step": 300895, "epoch": 1791} {"train_loss": -11.7611083984375, "global_step": 300896, "epoch": 1791} {"train_loss": -11.396614074707031, "global_step": 300897, "epoch": 1791} {"train_loss": -11.731819152832031, "global_step": 300898, "epoch": 1791} {"train_loss": -11.205385208129883, "global_step": 300899, "epoch": 1791} {"train_loss": -11.77808952331543, "global_step": 300900, "epoch": 1791} {"train_loss": -9.99653148651123, "global_step": 300901, "epoch": 1791} {"train_loss": -12.059269905090332, "global_step": 300902, "epoch": 1791} {"train_loss": -10.80604362487793, "global_step": 300903, "epoch": 1791} {"train_loss": -11.379629135131836, "global_step": 300904, "epoch": 1791} {"train_loss": -11.605859756469727, "global_step": 300905, "epoch": 1791} {"train_loss": -11.445951461791992, "global_step": 300906, "epoch": 1791} {"train_loss": -11.724328994750977, "global_step": 300907, "epoch": 1791} {"train_loss": -10.774942398071289, "global_step": 300908, "epoch": 1791} {"train_loss": -11.89931869506836, "global_step": 300909, "epoch": 1791} {"train_loss": -11.749303817749023, "global_step": 300910, "epoch": 1791} {"train_loss": -11.308822631835938, "global_step": 300911, "epoch": 1791} {"train_loss": -11.470176696777344, "global_step": 300912, "epoch": 1791} {"train_loss": -11.340827941894531, "global_step": 300913, "epoch": 1791} {"train_loss": -11.850086212158203, "global_step": 300914, "epoch": 1791} {"train_loss": -11.630674362182617, "global_step": 300915, "epoch": 1791} {"train_loss": -11.193458557128906, "global_step": 300916, "epoch": 1791} {"train_loss": -11.824851989746094, "global_step": 300917, "epoch": 1791} {"train_loss": -11.596867561340332, "global_step": 300918, "epoch": 1791} {"train_loss": -11.564428329467773, "global_step": 300919, "epoch": 1791} {"train_loss": -11.452634811401367, "global_step": 300920, "epoch": 1791} {"train_loss": -11.602571487426758, "global_step": 300921, "epoch": 1791} {"train_loss": -11.706503868103027, "global_step": 300922, "epoch": 1791} {"train_loss": -11.877764701843262, "global_step": 300923, "epoch": 1791} {"train_loss": -12.071919441223145, "global_step": 300924, "epoch": 1791} {"train_loss": -11.78829288482666, "global_step": 300925, "epoch": 1791} {"train_loss": -12.009531021118164, "global_step": 300926, "epoch": 1791} {"train_loss": -11.83763313293457, "global_step": 300927, "epoch": 1791} {"train_loss": -11.620229721069336, "global_step": 300928, "epoch": 1791} {"train_loss": -11.834840774536133, "global_step": 300929, "epoch": 1791} {"train_loss": -11.520357131958008, "global_step": 300930, "epoch": 1791} {"train_loss": -11.859712600708008, "global_step": 300931, "epoch": 1791} {"train_loss": -11.69266414642334, "global_step": 300932, "epoch": 1791} {"train_loss": -11.856343269348145, "global_step": 300933, "epoch": 1791} {"train_loss": -12.010284423828125, "global_step": 300934, "epoch": 1791} {"train_loss": -11.887407302856445, "global_step": 300935, "epoch": 1791} {"train_loss": -11.805506706237793, "global_step": 300936, "epoch": 1791} {"train_loss": -12.11115837097168, "global_step": 300937, "epoch": 1791} {"train_loss": -11.998601913452148, "global_step": 300938, "epoch": 1791} {"train_loss": -12.030715942382812, "global_step": 300939, "epoch": 1791} {"train_loss": -12.009477615356445, "global_step": 300940, "epoch": 1791} {"train_loss": -12.012475967407227, "global_step": 300941, "epoch": 1791} {"train_loss": -11.912055969238281, "global_step": 300942, "epoch": 1791} {"train_loss": -11.890069961547852, "global_step": 300943, "epoch": 1791} {"train_loss": -12.295366287231445, "global_step": 300944, "epoch": 1791} {"train_loss": -12.03493595123291, "global_step": 300945, "epoch": 1791} {"train_loss": -12.234793663024902, "global_step": 300946, "epoch": 1791} {"train_loss": -11.604423522949219, "global_step": 300947, "epoch": 1791} {"train_loss": -12.166168212890625, "global_step": 300948, "epoch": 1791} {"train_loss": -12.188312530517578, "global_step": 300949, "epoch": 1791} {"train_loss": -11.864693641662598, "global_step": 300950, "epoch": 1791} {"train_loss": -11.879059791564941, "global_step": 300951, "epoch": 1791} {"train_loss": -11.79146957397461, "global_step": 300952, "epoch": 1791} {"train_loss": -12.201845169067383, "global_step": 300953, "epoch": 1791} {"train_loss": -11.802947998046875, "global_step": 300954, "epoch": 1791} {"train_loss": -12.171427726745605, "global_step": 300955, "epoch": 1791} {"train_loss": -11.97283935546875, "global_step": 300956, "epoch": 1791} {"train_loss": -12.177282333374023, "global_step": 300957, "epoch": 1791} {"train_loss": -12.513452529907227, "global_step": 300958, "epoch": 1791} {"train_loss": -12.266101837158203, "global_step": 300959, "epoch": 1791} {"train_loss": -12.296329498291016, "global_step": 300960, "epoch": 1791} {"train_loss": -11.91338062286377, "global_step": 300961, "epoch": 1791} {"train_loss": -12.394775390625, "global_step": 300962, "epoch": 1791} {"train_loss": -11.88553524017334, "global_step": 300963, "epoch": 1791} {"train_loss": -12.332202911376953, "global_step": 300964, "epoch": 1791} {"train_loss": -11.906011581420898, "global_step": 300965, "epoch": 1791} {"train_loss": -12.26960563659668, "global_step": 300966, "epoch": 1791} {"train_loss": -12.138307571411133, "global_step": 300967, "epoch": 1791} {"train_loss": -12.060701370239258, "global_step": 300968, "epoch": 1791} {"train_loss": -11.806979179382324, "global_step": 300969, "epoch": 1791} {"train_loss": -11.817902565002441, "global_step": 300970, "epoch": 1791} {"train_loss": -12.03672981262207, "global_step": 300971, "epoch": 1791} {"train_loss": -12.299914360046387, "global_step": 300972, "epoch": 1791} {"train_loss": -11.69468879699707, "global_step": 300973, "epoch": 1791} {"train_loss": -12.258463859558105, "global_step": 300974, "epoch": 1791} {"train_loss": -11.331570625305176, "global_step": 300975, "epoch": 1791} {"train_loss": -12.022457122802734, "global_step": 300976, "epoch": 1791} {"train_loss": -11.637616157531738, "global_step": 300977, "epoch": 1791} {"train_loss": -11.833503723144531, "global_step": 300978, "epoch": 1791} {"train_loss": -11.887954711914062, "global_step": 300979, "epoch": 1791} {"train_loss": -11.74077320098877, "global_step": 300980, "epoch": 1791} {"train_loss": -12.025327682495117, "global_step": 300981, "epoch": 1791} {"train_loss": -12.20599365234375, "global_step": 300982, "epoch": 1791} {"train_loss": -11.894445419311523, "global_step": 300983, "epoch": 1791} {"train_loss": -12.263318061828613, "global_step": 300984, "epoch": 1791} {"train_loss": -11.596517562866211, "global_step": 300985, "epoch": 1791} {"train_loss": -11.963451385498047, "global_step": 300986, "epoch": 1791} {"train_loss": -11.6123046875, "global_step": 300987, "epoch": 1791} {"train_loss": -11.78825569152832, "global_step": 300988, "epoch": 1791} {"train_loss": -12.417841911315918, "global_step": 300989, "epoch": 1791} {"train_loss": -12.07829475402832, "global_step": 300990, "epoch": 1791} {"train_loss": -12.233007431030273, "global_step": 300991, "epoch": 1791} {"train_loss": -12.078969955444336, "global_step": 300992, "epoch": 1791} {"train_loss": -12.304291725158691, "global_step": 300993, "epoch": 1791} {"train_loss": -12.297283172607422, "global_step": 300994, "epoch": 1791} {"train_loss": -12.198087692260742, "global_step": 300995, "epoch": 1791} {"train_loss": -12.235698699951172, "global_step": 300996, "epoch": 1791} {"train_loss": -12.083968162536621, "global_step": 300997, "epoch": 1791} {"train_loss": -11.858945846557617, "global_step": 300998, "epoch": 1791} {"train_loss": -12.399561882019043, "global_step": 300999, "epoch": 1791} {"train_loss": -11.411145210266113, "global_step": 301000, "epoch": 1791} {"train_loss": -12.228515625, "global_step": 301001, "epoch": 1791} {"train_loss": -12.111660957336426, "global_step": 301002, "epoch": 1791} {"train_loss": -12.295927047729492, "global_step": 301003, "epoch": 1791} {"train_loss": -12.092151641845703, "global_step": 301004, "epoch": 1791} {"train_loss": -12.342506408691406, "global_step": 301005, "epoch": 1791} {"train_loss": -12.169639587402344, "global_step": 301006, "epoch": 1791} {"train_loss": -12.330047607421875, "global_step": 301007, "epoch": 1791} {"train_loss": -12.103555679321289, "global_step": 301008, "epoch": 1791} {"train_loss": -12.222930908203125, "global_step": 301009, "epoch": 1791} {"train_loss": -12.53451919555664, "global_step": 301010, "epoch": 1791} {"train_loss": -12.052604675292969, "global_step": 301011, "epoch": 1791} {"train_loss": -12.067275047302246, "global_step": 301012, "epoch": 1791} {"train_loss": -12.395149230957031, "global_step": 301013, "epoch": 1791} {"train_loss": -12.028249740600586, "global_step": 301014, "epoch": 1791} {"train_loss": -12.253061294555664, "global_step": 301015, "epoch": 1791} {"train_loss": -12.190101623535156, "global_step": 301016, "epoch": 1791} {"train_loss": -11.699235916137695, "global_step": 301017, "epoch": 1791} {"train_loss": -12.236845016479492, "global_step": 301018, "epoch": 1791} {"train_loss": -11.232524871826172, "global_step": 301019, "epoch": 1791} {"train_loss": -11.906846046447754, "global_step": 301020, "epoch": 1791} {"train_loss": -11.141168594360352, "global_step": 301021, "epoch": 1791} {"train_loss": -12.201766967773438, "global_step": 301022, "epoch": 1791} {"train_loss": -10.620742797851562, "global_step": 301023, "epoch": 1791} {"train_loss": -11.844898223876953, "global_step": 301024, "epoch": 1791} {"train_loss": -11.531015396118164, "global_step": 301025, "epoch": 1791} {"train_loss": -10.984851837158203, "global_step": 301026, "epoch": 1791} {"train_loss": -10.367599487304688, "global_step": 301027, "epoch": 1791} {"train_loss": -11.904980659484863, "global_step": 301028, "epoch": 1791} {"train_loss": -10.636370658874512, "global_step": 301029, "epoch": 1791} {"train_loss": -10.735862731933594, "global_step": 301030, "epoch": 1791} {"train_loss": -11.113611221313477, "global_step": 301031, "epoch": 1791} {"train_loss": -11.160614967346191, "global_step": 301032, "epoch": 1791} {"train_loss": -10.47420597076416, "global_step": 301033, "epoch": 1791} {"train_loss": -11.789939880371094, "global_step": 301034, "epoch": 1791} {"train_loss": -11.370386123657227, "global_step": 301035, "epoch": 1791} {"train_loss": -11.136972427368164, "global_step": 301036, "epoch": 1791} {"train_loss": -11.413738250732422, "global_step": 301037, "epoch": 1791} {"train_loss": -11.446794509887695, "global_step": 301038, "epoch": 1791} {"train_loss": -11.867734909057617, "global_step": 301039, "epoch": 1791} {"train_loss": -11.712630271911621, "global_step": 301040, "epoch": 1791} {"train_loss": -12.050821304321289, "global_step": 301041, "epoch": 1791} {"train_loss": -11.43566608428955, "global_step": 301042, "epoch": 1791} {"train_loss": -12.382369995117188, "global_step": 301043, "epoch": 1791} {"train_loss": -11.780925750732422, "global_step": 301044, "epoch": 1791} {"train_loss": -11.963628768920898, "global_step": 301045, "epoch": 1791} {"train_loss": -11.951775550842285, "global_step": 301046, "epoch": 1791} {"train_loss": -11.712956428527832, "global_step": 301047, "epoch": 1791} {"train_loss": -11.602373123168945, "global_step": 301048, "epoch": 1791} {"train_loss": -11.042068481445312, "global_step": 301049, "epoch": 1791} {"train_loss": -11.878835678100586, "global_step": 301050, "epoch": 1791} {"train_loss": -11.954086303710938, "global_step": 301051, "epoch": 1791} {"train_loss": -11.54380989074707, "global_step": 301052, "epoch": 1791} {"train_loss": -11.458112716674805, "global_step": 301053, "epoch": 1791} {"train_loss": -11.231653213500977, "global_step": 301054, "epoch": 1791} {"train_loss": -11.813136793318249, "global_step": 301055, "epoch": 1791, "val_loss": 279063.0625} {"train_loss": -11.992531776428223, "global_step": 301056, "epoch": 1792} {"train_loss": -11.968154907226562, "global_step": 301057, "epoch": 1792} {"train_loss": -11.970685005187988, "global_step": 301058, "epoch": 1792} {"train_loss": -11.955408096313477, "global_step": 301059, "epoch": 1792} {"train_loss": -12.075864791870117, "global_step": 301060, "epoch": 1792} {"train_loss": -12.172403335571289, "global_step": 301061, "epoch": 1792} {"train_loss": -12.114785194396973, "global_step": 301062, "epoch": 1792} {"train_loss": -12.12350845336914, "global_step": 301063, "epoch": 1792} {"train_loss": -12.113715171813965, "global_step": 301064, "epoch": 1792} {"train_loss": -12.166130065917969, "global_step": 301065, "epoch": 1792} {"train_loss": -12.422916412353516, "global_step": 301066, "epoch": 1792} {"train_loss": -11.965513229370117, "global_step": 301067, "epoch": 1792} {"train_loss": -12.070441246032715, "global_step": 301068, "epoch": 1792} {"train_loss": -12.257750511169434, "global_step": 301069, "epoch": 1792} {"train_loss": -11.839240074157715, "global_step": 301070, "epoch": 1792} {"train_loss": -12.115171432495117, "global_step": 301071, "epoch": 1792} {"train_loss": -11.801424026489258, "global_step": 301072, "epoch": 1792} {"train_loss": -12.140443801879883, "global_step": 301073, "epoch": 1792} {"train_loss": -12.231247901916504, "global_step": 301074, "epoch": 1792} {"train_loss": -11.855995178222656, "global_step": 301075, "epoch": 1792} {"train_loss": -12.205037117004395, "global_step": 301076, "epoch": 1792} {"train_loss": -11.962549209594727, "global_step": 301077, "epoch": 1792} {"train_loss": -12.118905067443848, "global_step": 301078, "epoch": 1792} {"train_loss": -12.142348289489746, "global_step": 301079, "epoch": 1792} {"train_loss": -12.06131362915039, "global_step": 301080, "epoch": 1792} {"train_loss": -12.335386276245117, "global_step": 301081, "epoch": 1792} {"train_loss": -12.134013175964355, "global_step": 301082, "epoch": 1792} {"train_loss": -12.031393051147461, "global_step": 301083, "epoch": 1792} {"train_loss": -12.023429870605469, "global_step": 301084, "epoch": 1792} {"train_loss": -12.08907699584961, "global_step": 301085, "epoch": 1792} {"train_loss": -12.000116348266602, "global_step": 301086, "epoch": 1792} {"train_loss": -11.955978393554688, "global_step": 301087, "epoch": 1792} {"train_loss": -12.264606475830078, "global_step": 301088, "epoch": 1792} {"train_loss": -12.20046615600586, "global_step": 301089, "epoch": 1792} {"train_loss": -12.388847351074219, "global_step": 301090, "epoch": 1792} {"train_loss": -12.03349494934082, "global_step": 301091, "epoch": 1792} {"train_loss": -12.257065773010254, "global_step": 301092, "epoch": 1792} {"train_loss": -12.252388000488281, "global_step": 301093, "epoch": 1792} {"train_loss": -12.265335083007812, "global_step": 301094, "epoch": 1792} {"train_loss": -12.259121894836426, "global_step": 301095, "epoch": 1792} {"train_loss": -12.059191703796387, "global_step": 301096, "epoch": 1792} {"train_loss": -12.079790115356445, "global_step": 301097, "epoch": 1792} {"train_loss": -11.790700912475586, "global_step": 301098, "epoch": 1792} {"train_loss": -11.274606704711914, "global_step": 301099, "epoch": 1792} {"train_loss": -12.192843437194824, "global_step": 301100, "epoch": 1792} {"train_loss": -11.478887557983398, "global_step": 301101, "epoch": 1792} {"train_loss": -11.958157539367676, "global_step": 301102, "epoch": 1792} {"train_loss": -11.868968963623047, "global_step": 301103, "epoch": 1792} {"train_loss": -12.12678337097168, "global_step": 301104, "epoch": 1792} {"train_loss": -11.88924789428711, "global_step": 301105, "epoch": 1792} {"train_loss": -11.823052406311035, "global_step": 301106, "epoch": 1792} {"train_loss": -12.02133560180664, "global_step": 301107, "epoch": 1792} {"train_loss": -12.271141052246094, "global_step": 301108, "epoch": 1792} {"train_loss": -12.050451278686523, "global_step": 301109, "epoch": 1792} {"train_loss": -12.288291931152344, "global_step": 301110, "epoch": 1792} {"train_loss": -12.320396423339844, "global_step": 301111, "epoch": 1792} {"train_loss": -11.555987358093262, "global_step": 301112, "epoch": 1792} {"train_loss": -12.106417655944824, "global_step": 301113, "epoch": 1792} {"train_loss": -12.017877578735352, "global_step": 301114, "epoch": 1792} {"train_loss": -11.673624038696289, "global_step": 301115, "epoch": 1792} {"train_loss": -11.708788871765137, "global_step": 301116, "epoch": 1792} {"train_loss": -11.440722465515137, "global_step": 301117, "epoch": 1792} {"train_loss": -12.117786407470703, "global_step": 301118, "epoch": 1792} {"train_loss": -10.758199691772461, "global_step": 301119, "epoch": 1792} {"train_loss": -11.223716735839844, "global_step": 301120, "epoch": 1792} {"train_loss": -11.73129940032959, "global_step": 301121, "epoch": 1792} {"train_loss": -12.04112720489502, "global_step": 301122, "epoch": 1792} {"train_loss": -11.45655632019043, "global_step": 301123, "epoch": 1792} {"train_loss": -11.731470108032227, "global_step": 301124, "epoch": 1792} {"train_loss": -11.515656471252441, "global_step": 301125, "epoch": 1792} {"train_loss": -12.235513687133789, "global_step": 301126, "epoch": 1792} {"train_loss": -12.282501220703125, "global_step": 301127, "epoch": 1792} {"train_loss": -11.871450424194336, "global_step": 301128, "epoch": 1792} {"train_loss": -12.238606452941895, "global_step": 301129, "epoch": 1792} {"train_loss": -12.276615142822266, "global_step": 301130, "epoch": 1792} {"train_loss": -12.267057418823242, "global_step": 301131, "epoch": 1792} {"train_loss": -12.335091590881348, "global_step": 301132, "epoch": 1792} {"train_loss": -12.300517082214355, "global_step": 301133, "epoch": 1792} {"train_loss": -12.487168312072754, "global_step": 301134, "epoch": 1792} {"train_loss": -11.951749801635742, "global_step": 301135, "epoch": 1792} {"train_loss": -12.516927719116211, "global_step": 301136, "epoch": 1792} {"train_loss": -12.489385604858398, "global_step": 301137, "epoch": 1792} {"train_loss": -12.165761947631836, "global_step": 301138, "epoch": 1792} {"train_loss": -12.420470237731934, "global_step": 301139, "epoch": 1792} {"train_loss": -12.413473129272461, "global_step": 301140, "epoch": 1792} {"train_loss": -12.436666488647461, "global_step": 301141, "epoch": 1792} {"train_loss": -12.29792594909668, "global_step": 301142, "epoch": 1792} {"train_loss": -12.376805305480957, "global_step": 301143, "epoch": 1792} {"train_loss": -12.222991943359375, "global_step": 301144, "epoch": 1792} {"train_loss": -11.752729415893555, "global_step": 301145, "epoch": 1792} {"train_loss": -11.675813674926758, "global_step": 301146, "epoch": 1792} {"train_loss": -11.890257835388184, "global_step": 301147, "epoch": 1792} {"train_loss": -12.162220001220703, "global_step": 301148, "epoch": 1792} {"train_loss": -11.645631790161133, "global_step": 301149, "epoch": 1792} {"train_loss": -11.911623001098633, "global_step": 301150, "epoch": 1792} {"train_loss": -12.032087326049805, "global_step": 301151, "epoch": 1792} {"train_loss": -11.579057693481445, "global_step": 301152, "epoch": 1792} {"train_loss": -10.44819450378418, "global_step": 301153, "epoch": 1792} {"train_loss": -11.790180206298828, "global_step": 301154, "epoch": 1792} {"train_loss": -11.57767105102539, "global_step": 301155, "epoch": 1792} {"train_loss": -11.687566757202148, "global_step": 301156, "epoch": 1792} {"train_loss": -11.331747055053711, "global_step": 301157, "epoch": 1792} {"train_loss": -11.505627632141113, "global_step": 301158, "epoch": 1792} {"train_loss": -11.590252876281738, "global_step": 301159, "epoch": 1792} {"train_loss": -11.95416259765625, "global_step": 301160, "epoch": 1792} {"train_loss": -11.23069953918457, "global_step": 301161, "epoch": 1792} {"train_loss": -11.452899932861328, "global_step": 301162, "epoch": 1792} {"train_loss": -11.724620819091797, "global_step": 301163, "epoch": 1792} {"train_loss": -11.026764869689941, "global_step": 301164, "epoch": 1792} {"train_loss": -11.719856262207031, "global_step": 301165, "epoch": 1792} {"train_loss": -11.53370189666748, "global_step": 301166, "epoch": 1792} {"train_loss": -9.855302810668945, "global_step": 301167, "epoch": 1792} {"train_loss": -10.82986831665039, "global_step": 301168, "epoch": 1792} {"train_loss": -10.412827491760254, "global_step": 301169, "epoch": 1792} {"train_loss": -11.301847457885742, "global_step": 301170, "epoch": 1792} {"train_loss": -11.203686714172363, "global_step": 301171, "epoch": 1792} {"train_loss": -10.039438247680664, "global_step": 301172, "epoch": 1792} {"train_loss": -11.531438827514648, "global_step": 301173, "epoch": 1792} {"train_loss": -11.386518478393555, "global_step": 301174, "epoch": 1792} {"train_loss": -11.779452323913574, "global_step": 301175, "epoch": 1792} {"train_loss": -10.969502449035645, "global_step": 301176, "epoch": 1792} {"train_loss": -11.286905288696289, "global_step": 301177, "epoch": 1792} {"train_loss": -11.630195617675781, "global_step": 301178, "epoch": 1792} {"train_loss": -11.005882263183594, "global_step": 301179, "epoch": 1792} {"train_loss": -11.822196960449219, "global_step": 301180, "epoch": 1792} {"train_loss": -10.930094718933105, "global_step": 301181, "epoch": 1792} {"train_loss": -11.43106746673584, "global_step": 301182, "epoch": 1792} {"train_loss": -10.924394607543945, "global_step": 301183, "epoch": 1792} {"train_loss": -9.506793975830078, "global_step": 301184, "epoch": 1792} {"train_loss": -10.342537879943848, "global_step": 301185, "epoch": 1792} {"train_loss": -11.405162811279297, "global_step": 301186, "epoch": 1792} {"train_loss": -10.481039047241211, "global_step": 301187, "epoch": 1792} {"train_loss": -10.81412124633789, "global_step": 301188, "epoch": 1792} {"train_loss": -10.724943161010742, "global_step": 301189, "epoch": 1792} {"train_loss": -10.093306541442871, "global_step": 301190, "epoch": 1792} {"train_loss": -11.252396583557129, "global_step": 301191, "epoch": 1792} {"train_loss": -10.5579252243042, "global_step": 301192, "epoch": 1792} {"train_loss": -10.252849578857422, "global_step": 301193, "epoch": 1792} {"train_loss": -10.295906066894531, "global_step": 301194, "epoch": 1792} {"train_loss": -10.52275276184082, "global_step": 301195, "epoch": 1792} {"train_loss": -9.946301460266113, "global_step": 301196, "epoch": 1792} {"train_loss": -9.967660903930664, "global_step": 301197, "epoch": 1792} {"train_loss": -10.48508071899414, "global_step": 301198, "epoch": 1792} {"train_loss": -10.49346923828125, "global_step": 301199, "epoch": 1792} {"train_loss": -10.79404067993164, "global_step": 301200, "epoch": 1792} {"train_loss": -10.138139724731445, "global_step": 301201, "epoch": 1792} {"train_loss": -10.001338958740234, "global_step": 301202, "epoch": 1792} {"train_loss": -10.90971851348877, "global_step": 301203, "epoch": 1792} {"train_loss": -11.06033706665039, "global_step": 301204, "epoch": 1792} {"train_loss": -9.861312866210938, "global_step": 301205, "epoch": 1792} {"train_loss": -11.471370697021484, "global_step": 301206, "epoch": 1792} {"train_loss": -10.33410358428955, "global_step": 301207, "epoch": 1792} {"train_loss": -11.203271865844727, "global_step": 301208, "epoch": 1792} {"train_loss": -10.723516464233398, "global_step": 301209, "epoch": 1792} {"train_loss": -10.428525924682617, "global_step": 301210, "epoch": 1792} {"train_loss": -11.51819896697998, "global_step": 301211, "epoch": 1792} {"train_loss": -10.958453178405762, "global_step": 301212, "epoch": 1792} {"train_loss": -10.815152168273926, "global_step": 301213, "epoch": 1792} {"train_loss": -11.237044334411621, "global_step": 301214, "epoch": 1792} {"train_loss": -11.12565803527832, "global_step": 301215, "epoch": 1792} {"train_loss": -11.068899154663086, "global_step": 301216, "epoch": 1792} {"train_loss": -11.95459270477295, "global_step": 301217, "epoch": 1792} {"train_loss": -11.226617813110352, "global_step": 301218, "epoch": 1792} {"train_loss": -11.740692138671875, "global_step": 301219, "epoch": 1792} {"train_loss": -11.862192153930664, "global_step": 301220, "epoch": 1792} {"train_loss": -11.44284725189209, "global_step": 301221, "epoch": 1792} {"train_loss": -11.811345100402832, "global_step": 301222, "epoch": 1792} {"train_loss": -11.599224533353533, "global_step": 301223, "epoch": 1792, "val_loss": 281768.0} {"train_loss": -11.700518608093262, "global_step": 301224, "epoch": 1793} {"train_loss": -11.748199462890625, "global_step": 301225, "epoch": 1793} {"train_loss": -11.737048149108887, "global_step": 301226, "epoch": 1793} {"train_loss": -11.460254669189453, "global_step": 301227, "epoch": 1793} {"train_loss": -11.712957382202148, "global_step": 301228, "epoch": 1793} {"train_loss": -11.860418319702148, "global_step": 301229, "epoch": 1793} {"train_loss": -11.499905586242676, "global_step": 301230, "epoch": 1793} {"train_loss": -11.632062911987305, "global_step": 301231, "epoch": 1793} {"train_loss": -11.930158615112305, "global_step": 301232, "epoch": 1793} {"train_loss": -11.655340194702148, "global_step": 301233, "epoch": 1793} {"train_loss": -11.95128059387207, "global_step": 301234, "epoch": 1793} {"train_loss": -11.690947532653809, "global_step": 301235, "epoch": 1793} {"train_loss": -11.742378234863281, "global_step": 301236, "epoch": 1793} {"train_loss": -11.853609085083008, "global_step": 301237, "epoch": 1793} {"train_loss": -11.947704315185547, "global_step": 301238, "epoch": 1793} {"train_loss": -11.459696769714355, "global_step": 301239, "epoch": 1793} {"train_loss": -12.002795219421387, "global_step": 301240, "epoch": 1793} {"train_loss": -11.8915433883667, "global_step": 301241, "epoch": 1793} {"train_loss": -11.922141075134277, "global_step": 301242, "epoch": 1793} {"train_loss": -11.937030792236328, "global_step": 301243, "epoch": 1793} {"train_loss": -11.917461395263672, "global_step": 301244, "epoch": 1793} {"train_loss": -11.967351913452148, "global_step": 301245, "epoch": 1793} {"train_loss": -11.908825874328613, "global_step": 301246, "epoch": 1793} {"train_loss": -11.874394416809082, "global_step": 301247, "epoch": 1793} {"train_loss": -11.987359046936035, "global_step": 301248, "epoch": 1793} {"train_loss": -12.06786060333252, "global_step": 301249, "epoch": 1793} {"train_loss": -12.248414993286133, "global_step": 301250, "epoch": 1793} {"train_loss": -12.181788444519043, "global_step": 301251, "epoch": 1793} {"train_loss": -11.938680648803711, "global_step": 301252, "epoch": 1793} {"train_loss": -11.928595542907715, "global_step": 301253, "epoch": 1793} {"train_loss": -11.918523788452148, "global_step": 301254, "epoch": 1793} {"train_loss": -12.12346076965332, "global_step": 301255, "epoch": 1793} {"train_loss": -11.987743377685547, "global_step": 301256, "epoch": 1793} {"train_loss": -12.017850875854492, "global_step": 301257, "epoch": 1793} {"train_loss": -12.203104019165039, "global_step": 301258, "epoch": 1793} {"train_loss": -12.105255126953125, "global_step": 301259, "epoch": 1793} {"train_loss": -12.17386531829834, "global_step": 301260, "epoch": 1793} {"train_loss": -12.133758544921875, "global_step": 301261, "epoch": 1793} {"train_loss": -12.237447738647461, "global_step": 301262, "epoch": 1793} {"train_loss": -12.327118873596191, "global_step": 301263, "epoch": 1793} {"train_loss": -12.333064079284668, "global_step": 301264, "epoch": 1793} {"train_loss": -12.224254608154297, "global_step": 301265, "epoch": 1793} {"train_loss": -12.29151725769043, "global_step": 301266, "epoch": 1793} {"train_loss": -12.312910079956055, "global_step": 301267, "epoch": 1793} {"train_loss": -12.209168434143066, "global_step": 301268, "epoch": 1793} {"train_loss": -12.3177490234375, "global_step": 301269, "epoch": 1793} {"train_loss": -12.275693893432617, "global_step": 301270, "epoch": 1793} {"train_loss": -12.252872467041016, "global_step": 301271, "epoch": 1793} {"train_loss": -12.331442832946777, "global_step": 301272, "epoch": 1793} {"train_loss": -12.461325645446777, "global_step": 301273, "epoch": 1793} {"train_loss": -12.116451263427734, "global_step": 301274, "epoch": 1793} {"train_loss": -12.408571243286133, "global_step": 301275, "epoch": 1793} {"train_loss": -12.330921173095703, "global_step": 301276, "epoch": 1793} {"train_loss": -12.370152473449707, "global_step": 301277, "epoch": 1793} {"train_loss": -12.372394561767578, "global_step": 301278, "epoch": 1793} {"train_loss": -12.175861358642578, "global_step": 301279, "epoch": 1793} {"train_loss": -12.535568237304688, "global_step": 301280, "epoch": 1793} {"train_loss": -12.490748405456543, "global_step": 301281, "epoch": 1793} {"train_loss": -12.283968925476074, "global_step": 301282, "epoch": 1793} {"train_loss": -12.463253021240234, "global_step": 301283, "epoch": 1793} {"train_loss": -12.495885848999023, "global_step": 301284, "epoch": 1793} {"train_loss": -12.600515365600586, "global_step": 301285, "epoch": 1793} {"train_loss": -12.493499755859375, "global_step": 301286, "epoch": 1793} {"train_loss": -12.318058967590332, "global_step": 301287, "epoch": 1793} {"train_loss": -12.281766891479492, "global_step": 301288, "epoch": 1793} {"train_loss": -12.510420799255371, "global_step": 301289, "epoch": 1793} {"train_loss": -12.537525177001953, "global_step": 301290, "epoch": 1793} {"train_loss": -12.485170364379883, "global_step": 301291, "epoch": 1793} {"train_loss": -12.656516075134277, "global_step": 301292, "epoch": 1793} {"train_loss": -12.472908973693848, "global_step": 301293, "epoch": 1793} {"train_loss": -12.51885986328125, "global_step": 301294, "epoch": 1793} {"train_loss": -12.511917114257812, "global_step": 301295, "epoch": 1793} {"train_loss": -12.544891357421875, "global_step": 301296, "epoch": 1793} {"train_loss": -12.453741073608398, "global_step": 301297, "epoch": 1793} {"train_loss": -12.160505294799805, "global_step": 301298, "epoch": 1793} {"train_loss": -12.142066955566406, "global_step": 301299, "epoch": 1793} {"train_loss": -12.532264709472656, "global_step": 301300, "epoch": 1793} {"train_loss": -12.516886711120605, "global_step": 301301, "epoch": 1793} {"train_loss": -12.550801277160645, "global_step": 301302, "epoch": 1793} {"train_loss": -12.234893798828125, "global_step": 301303, "epoch": 1793} {"train_loss": -12.407910346984863, "global_step": 301304, "epoch": 1793} {"train_loss": -12.576065063476562, "global_step": 301305, "epoch": 1793} {"train_loss": -12.15623950958252, "global_step": 301306, "epoch": 1793} {"train_loss": -11.958436965942383, "global_step": 301307, "epoch": 1793} {"train_loss": -11.624370574951172, "global_step": 301308, "epoch": 1793} {"train_loss": -11.661550521850586, "global_step": 301309, "epoch": 1793} {"train_loss": -12.077503204345703, "global_step": 301310, "epoch": 1793} {"train_loss": -12.445417404174805, "global_step": 301311, "epoch": 1793} {"train_loss": -12.079488754272461, "global_step": 301312, "epoch": 1793} {"train_loss": -12.16673469543457, "global_step": 301313, "epoch": 1793} {"train_loss": -12.553600311279297, "global_step": 301314, "epoch": 1793} {"train_loss": -11.516233444213867, "global_step": 301315, "epoch": 1793} {"train_loss": -8.71917724609375, "global_step": 301316, "epoch": 1793} {"train_loss": -11.754762649536133, "global_step": 301317, "epoch": 1793} {"train_loss": -8.737197875976562, "global_step": 301318, "epoch": 1793} {"train_loss": -9.68821907043457, "global_step": 301319, "epoch": 1793} {"train_loss": -7.320960998535156, "global_step": 301320, "epoch": 1793} {"train_loss": -7.6426777839660645, "global_step": 301321, "epoch": 1793} {"train_loss": -7.0176544189453125, "global_step": 301322, "epoch": 1793} {"train_loss": -6.47589111328125, "global_step": 301323, "epoch": 1793} {"train_loss": -6.9798784255981445, "global_step": 301324, "epoch": 1793} {"train_loss": -7.461617469787598, "global_step": 301325, "epoch": 1793} {"train_loss": -7.462717056274414, "global_step": 301326, "epoch": 1793} {"train_loss": -7.431407451629639, "global_step": 301327, "epoch": 1793} {"train_loss": -7.365708827972412, "global_step": 301328, "epoch": 1793} {"train_loss": -7.899342060089111, "global_step": 301329, "epoch": 1793} {"train_loss": -7.334677696228027, "global_step": 301330, "epoch": 1793} {"train_loss": -8.31673812866211, "global_step": 301331, "epoch": 1793} {"train_loss": -8.608867645263672, "global_step": 301332, "epoch": 1793} {"train_loss": -8.70094108581543, "global_step": 301333, "epoch": 1793} {"train_loss": -9.688446998596191, "global_step": 301334, "epoch": 1793} {"train_loss": -10.163808822631836, "global_step": 301335, "epoch": 1793} {"train_loss": -10.255392074584961, "global_step": 301336, "epoch": 1793} {"train_loss": -10.828886032104492, "global_step": 301337, "epoch": 1793} {"train_loss": -9.811731338500977, "global_step": 301338, "epoch": 1793} {"train_loss": -10.451910018920898, "global_step": 301339, "epoch": 1793} {"train_loss": -9.275923728942871, "global_step": 301340, "epoch": 1793} {"train_loss": -10.244913101196289, "global_step": 301341, "epoch": 1793} {"train_loss": -10.031646728515625, "global_step": 301342, "epoch": 1793} {"train_loss": -11.016792297363281, "global_step": 301343, "epoch": 1793} {"train_loss": -10.936196327209473, "global_step": 301344, "epoch": 1793} {"train_loss": -11.266766548156738, "global_step": 301345, "epoch": 1793} {"train_loss": -10.956512451171875, "global_step": 301346, "epoch": 1793} {"train_loss": -10.70413875579834, "global_step": 301347, "epoch": 1793} {"train_loss": -11.009318351745605, "global_step": 301348, "epoch": 1793} {"train_loss": -11.212261199951172, "global_step": 301349, "epoch": 1793} {"train_loss": -11.264883995056152, "global_step": 301350, "epoch": 1793} {"train_loss": -11.570655822753906, "global_step": 301351, "epoch": 1793} {"train_loss": -11.639266014099121, "global_step": 301352, "epoch": 1793} {"train_loss": -11.412890434265137, "global_step": 301353, "epoch": 1793} {"train_loss": -11.591623306274414, "global_step": 301354, "epoch": 1793} {"train_loss": -11.495420455932617, "global_step": 301355, "epoch": 1793} {"train_loss": -11.542475700378418, "global_step": 301356, "epoch": 1793} {"train_loss": -11.579549789428711, "global_step": 301357, "epoch": 1793} {"train_loss": -11.550148010253906, "global_step": 301358, "epoch": 1793} {"train_loss": -11.293749809265137, "global_step": 301359, "epoch": 1793} {"train_loss": -11.921463012695312, "global_step": 301360, "epoch": 1793} {"train_loss": -11.781906127929688, "global_step": 301361, "epoch": 1793} {"train_loss": -11.360773086547852, "global_step": 301362, "epoch": 1793} {"train_loss": -11.747967720031738, "global_step": 301363, "epoch": 1793} {"train_loss": -11.563470840454102, "global_step": 301364, "epoch": 1793} {"train_loss": -11.86900520324707, "global_step": 301365, "epoch": 1793} {"train_loss": -11.740662574768066, "global_step": 301366, "epoch": 1793} {"train_loss": -11.652183532714844, "global_step": 301367, "epoch": 1793} {"train_loss": -11.92639446258545, "global_step": 301368, "epoch": 1793} {"train_loss": -11.643054962158203, "global_step": 301369, "epoch": 1793} {"train_loss": -11.96972370147705, "global_step": 301370, "epoch": 1793} {"train_loss": -12.095183372497559, "global_step": 301371, "epoch": 1793} {"train_loss": -11.869028091430664, "global_step": 301372, "epoch": 1793} {"train_loss": -11.835296630859375, "global_step": 301373, "epoch": 1793} {"train_loss": -11.937522888183594, "global_step": 301374, "epoch": 1793} {"train_loss": -12.097705841064453, "global_step": 301375, "epoch": 1793} {"train_loss": -11.963089942932129, "global_step": 301376, "epoch": 1793} {"train_loss": -11.993614196777344, "global_step": 301377, "epoch": 1793} {"train_loss": -12.06326961517334, "global_step": 301378, "epoch": 1793} {"train_loss": -12.084190368652344, "global_step": 301379, "epoch": 1793} {"train_loss": -11.755836486816406, "global_step": 301380, "epoch": 1793} {"train_loss": -12.090498924255371, "global_step": 301381, "epoch": 1793} {"train_loss": -11.533280372619629, "global_step": 301382, "epoch": 1793} {"train_loss": -11.81773567199707, "global_step": 301383, "epoch": 1793} {"train_loss": -12.1835355758667, "global_step": 301384, "epoch": 1793} {"train_loss": -12.151576042175293, "global_step": 301385, "epoch": 1793} {"train_loss": -12.022220611572266, "global_step": 301386, "epoch": 1793} {"train_loss": -12.264627456665039, "global_step": 301387, "epoch": 1793} {"train_loss": -12.039276123046875, "global_step": 301388, "epoch": 1793} {"train_loss": -12.191347122192383, "global_step": 301389, "epoch": 1793} {"train_loss": -12.272225379943848, "global_step": 301390, "epoch": 1793} {"train_loss": -11.469457524163383, "global_step": 301391, "epoch": 1793, "val_loss": 276951.25} {"train_loss": -12.32952880859375, "global_step": 301392, "epoch": 1794} {"train_loss": -12.181490898132324, "global_step": 301393, "epoch": 1794} {"train_loss": -12.311189651489258, "global_step": 301394, "epoch": 1794} {"train_loss": -12.343441009521484, "global_step": 301395, "epoch": 1794} {"train_loss": -12.217309951782227, "global_step": 301396, "epoch": 1794} {"train_loss": -12.475839614868164, "global_step": 301397, "epoch": 1794} {"train_loss": -11.957759857177734, "global_step": 301398, "epoch": 1794} {"train_loss": -12.309982299804688, "global_step": 301399, "epoch": 1794} {"train_loss": -12.41023063659668, "global_step": 301400, "epoch": 1794} {"train_loss": -12.250141143798828, "global_step": 301401, "epoch": 1794} {"train_loss": -12.260046005249023, "global_step": 301402, "epoch": 1794} {"train_loss": -12.253312110900879, "global_step": 301403, "epoch": 1794} {"train_loss": -12.19826889038086, "global_step": 301404, "epoch": 1794} {"train_loss": -12.294280052185059, "global_step": 301405, "epoch": 1794} {"train_loss": -12.36402702331543, "global_step": 301406, "epoch": 1794} {"train_loss": -12.339808464050293, "global_step": 301407, "epoch": 1794} {"train_loss": -12.458051681518555, "global_step": 301408, "epoch": 1794} {"train_loss": -12.295360565185547, "global_step": 301409, "epoch": 1794} {"train_loss": -12.29326057434082, "global_step": 301410, "epoch": 1794} {"train_loss": -12.314936637878418, "global_step": 301411, "epoch": 1794} {"train_loss": -12.433053970336914, "global_step": 301412, "epoch": 1794} {"train_loss": -12.25955581665039, "global_step": 301413, "epoch": 1794} {"train_loss": -12.413537979125977, "global_step": 301414, "epoch": 1794} {"train_loss": -12.501346588134766, "global_step": 301415, "epoch": 1794} {"train_loss": -12.505071640014648, "global_step": 301416, "epoch": 1794} {"train_loss": -12.420661926269531, "global_step": 301417, "epoch": 1794} {"train_loss": -12.48359203338623, "global_step": 301418, "epoch": 1794} {"train_loss": -12.397789001464844, "global_step": 301419, "epoch": 1794} {"train_loss": -12.224690437316895, "global_step": 301420, "epoch": 1794} {"train_loss": -12.492870330810547, "global_step": 301421, "epoch": 1794} {"train_loss": -12.630367279052734, "global_step": 301422, "epoch": 1794} {"train_loss": -12.263227462768555, "global_step": 301423, "epoch": 1794} {"train_loss": -12.258408546447754, "global_step": 301424, "epoch": 1794} {"train_loss": -12.21426773071289, "global_step": 301425, "epoch": 1794} {"train_loss": -12.495728492736816, "global_step": 301426, "epoch": 1794} {"train_loss": -12.176472663879395, "global_step": 301427, "epoch": 1794} {"train_loss": -12.19375991821289, "global_step": 301428, "epoch": 1794} {"train_loss": -12.359842300415039, "global_step": 301429, "epoch": 1794} {"train_loss": -12.283561706542969, "global_step": 301430, "epoch": 1794} {"train_loss": -12.539412498474121, "global_step": 301431, "epoch": 1794} {"train_loss": -12.451324462890625, "global_step": 301432, "epoch": 1794} {"train_loss": -12.440142631530762, "global_step": 301433, "epoch": 1794} {"train_loss": -12.443246841430664, "global_step": 301434, "epoch": 1794} {"train_loss": -12.341405868530273, "global_step": 301435, "epoch": 1794} {"train_loss": -12.387439727783203, "global_step": 301436, "epoch": 1794} {"train_loss": -11.787702560424805, "global_step": 301437, "epoch": 1794} {"train_loss": -10.70277214050293, "global_step": 301438, "epoch": 1794} {"train_loss": -12.243417739868164, "global_step": 301439, "epoch": 1794} {"train_loss": -12.014728546142578, "global_step": 301440, "epoch": 1794} {"train_loss": -11.266386985778809, "global_step": 301441, "epoch": 1794} {"train_loss": -10.539627075195312, "global_step": 301442, "epoch": 1794} {"train_loss": -8.897380828857422, "global_step": 301443, "epoch": 1794} {"train_loss": -11.52570915222168, "global_step": 301444, "epoch": 1794} {"train_loss": -8.79302978515625, "global_step": 301445, "epoch": 1794} {"train_loss": -10.790538787841797, "global_step": 301446, "epoch": 1794} {"train_loss": -8.416994094848633, "global_step": 301447, "epoch": 1794} {"train_loss": -8.770807266235352, "global_step": 301448, "epoch": 1794} {"train_loss": -9.95844841003418, "global_step": 301449, "epoch": 1794} {"train_loss": -8.364886283874512, "global_step": 301450, "epoch": 1794} {"train_loss": -8.903280258178711, "global_step": 301451, "epoch": 1794} {"train_loss": -9.899799346923828, "global_step": 301452, "epoch": 1794} {"train_loss": -11.193784713745117, "global_step": 301453, "epoch": 1794} {"train_loss": -10.46703052520752, "global_step": 301454, "epoch": 1794} {"train_loss": -10.354612350463867, "global_step": 301455, "epoch": 1794} {"train_loss": -10.807004928588867, "global_step": 301456, "epoch": 1794} {"train_loss": -10.897163391113281, "global_step": 301457, "epoch": 1794} {"train_loss": -10.044868469238281, "global_step": 301458, "epoch": 1794} {"train_loss": -10.737863540649414, "global_step": 301459, "epoch": 1794} {"train_loss": -10.200798988342285, "global_step": 301460, "epoch": 1794} {"train_loss": -11.015802383422852, "global_step": 301461, "epoch": 1794} {"train_loss": -9.054301261901855, "global_step": 301462, "epoch": 1794} {"train_loss": -10.439998626708984, "global_step": 301463, "epoch": 1794} {"train_loss": -10.273386001586914, "global_step": 301464, "epoch": 1794} {"train_loss": -10.347511291503906, "global_step": 301465, "epoch": 1794} {"train_loss": -11.383405685424805, "global_step": 301466, "epoch": 1794} {"train_loss": -11.006353378295898, "global_step": 301467, "epoch": 1794} {"train_loss": -11.328374862670898, "global_step": 301468, "epoch": 1794} {"train_loss": -11.676172256469727, "global_step": 301469, "epoch": 1794} {"train_loss": -11.508816719055176, "global_step": 301470, "epoch": 1794} {"train_loss": -11.824919700622559, "global_step": 301471, "epoch": 1794} {"train_loss": -11.52861213684082, "global_step": 301472, "epoch": 1794} {"train_loss": -11.626701354980469, "global_step": 301473, "epoch": 1794} {"train_loss": -11.598016738891602, "global_step": 301474, "epoch": 1794} {"train_loss": -11.510833740234375, "global_step": 301475, "epoch": 1794} {"train_loss": -11.773338317871094, "global_step": 301476, "epoch": 1794} {"train_loss": -11.861998558044434, "global_step": 301477, "epoch": 1794} {"train_loss": -11.201410293579102, "global_step": 301478, "epoch": 1794} {"train_loss": -11.711297035217285, "global_step": 301479, "epoch": 1794} {"train_loss": -11.605820655822754, "global_step": 301480, "epoch": 1794} {"train_loss": -11.633138656616211, "global_step": 301481, "epoch": 1794} {"train_loss": -12.004230499267578, "global_step": 301482, "epoch": 1794} {"train_loss": -11.660392761230469, "global_step": 301483, "epoch": 1794} {"train_loss": -11.754877090454102, "global_step": 301484, "epoch": 1794} {"train_loss": -11.806756973266602, "global_step": 301485, "epoch": 1794} {"train_loss": -11.350686073303223, "global_step": 301486, "epoch": 1794} {"train_loss": -11.747278213500977, "global_step": 301487, "epoch": 1794} {"train_loss": -11.38802433013916, "global_step": 301488, "epoch": 1794} {"train_loss": -11.698005676269531, "global_step": 301489, "epoch": 1794} {"train_loss": -12.06053352355957, "global_step": 301490, "epoch": 1794} {"train_loss": -11.365530014038086, "global_step": 301491, "epoch": 1794} {"train_loss": -11.677377700805664, "global_step": 301492, "epoch": 1794} {"train_loss": -11.609780311584473, "global_step": 301493, "epoch": 1794} {"train_loss": -11.947332382202148, "global_step": 301494, "epoch": 1794} {"train_loss": -11.534607887268066, "global_step": 301495, "epoch": 1794} {"train_loss": -11.509069442749023, "global_step": 301496, "epoch": 1794} {"train_loss": -11.669981002807617, "global_step": 301497, "epoch": 1794} {"train_loss": -11.415708541870117, "global_step": 301498, "epoch": 1794} {"train_loss": -11.79862117767334, "global_step": 301499, "epoch": 1794} {"train_loss": -11.559494972229004, "global_step": 301500, "epoch": 1794} {"train_loss": -11.816326141357422, "global_step": 301501, "epoch": 1794} {"train_loss": -11.517986297607422, "global_step": 301502, "epoch": 1794} {"train_loss": -11.913969993591309, "global_step": 301503, "epoch": 1794} {"train_loss": -11.717270851135254, "global_step": 301504, "epoch": 1794} {"train_loss": -11.631816864013672, "global_step": 301505, "epoch": 1794} {"train_loss": -11.929737091064453, "global_step": 301506, "epoch": 1794} {"train_loss": -11.63352108001709, "global_step": 301507, "epoch": 1794} {"train_loss": -12.002923011779785, "global_step": 301508, "epoch": 1794} {"train_loss": -11.598431587219238, "global_step": 301509, "epoch": 1794} {"train_loss": -11.990655899047852, "global_step": 301510, "epoch": 1794} {"train_loss": -11.704490661621094, "global_step": 301511, "epoch": 1794} {"train_loss": -12.17275333404541, "global_step": 301512, "epoch": 1794} {"train_loss": -11.803236961364746, "global_step": 301513, "epoch": 1794} {"train_loss": -11.959049224853516, "global_step": 301514, "epoch": 1794} {"train_loss": -12.005398750305176, "global_step": 301515, "epoch": 1794} {"train_loss": -11.849815368652344, "global_step": 301516, "epoch": 1794} {"train_loss": -12.164921760559082, "global_step": 301517, "epoch": 1794} {"train_loss": -11.842243194580078, "global_step": 301518, "epoch": 1794} {"train_loss": -12.014001846313477, "global_step": 301519, "epoch": 1794} {"train_loss": -12.072224617004395, "global_step": 301520, "epoch": 1794} {"train_loss": -12.105103492736816, "global_step": 301521, "epoch": 1794} {"train_loss": -12.272031784057617, "global_step": 301522, "epoch": 1794} {"train_loss": -12.034643173217773, "global_step": 301523, "epoch": 1794} {"train_loss": -12.342280387878418, "global_step": 301524, "epoch": 1794} {"train_loss": -12.07619857788086, "global_step": 301525, "epoch": 1794} {"train_loss": -12.30717945098877, "global_step": 301526, "epoch": 1794} {"train_loss": -12.312673568725586, "global_step": 301527, "epoch": 1794} {"train_loss": -12.365255355834961, "global_step": 301528, "epoch": 1794} {"train_loss": -12.362224578857422, "global_step": 301529, "epoch": 1794} {"train_loss": -12.357108116149902, "global_step": 301530, "epoch": 1794} {"train_loss": -12.219413757324219, "global_step": 301531, "epoch": 1794} {"train_loss": -12.245373725891113, "global_step": 301532, "epoch": 1794} {"train_loss": -12.328699111938477, "global_step": 301533, "epoch": 1794} {"train_loss": -11.975032806396484, "global_step": 301534, "epoch": 1794} {"train_loss": -12.321475982666016, "global_step": 301535, "epoch": 1794} {"train_loss": -12.352715492248535, "global_step": 301536, "epoch": 1794} {"train_loss": -12.293142318725586, "global_step": 301537, "epoch": 1794} {"train_loss": -12.409568786621094, "global_step": 301538, "epoch": 1794} {"train_loss": -12.393600463867188, "global_step": 301539, "epoch": 1794} {"train_loss": -12.371192932128906, "global_step": 301540, "epoch": 1794} {"train_loss": -12.398813247680664, "global_step": 301541, "epoch": 1794} {"train_loss": -12.290340423583984, "global_step": 301542, "epoch": 1794} {"train_loss": -12.363773345947266, "global_step": 301543, "epoch": 1794} {"train_loss": -12.330862045288086, "global_step": 301544, "epoch": 1794} {"train_loss": -12.317693710327148, "global_step": 301545, "epoch": 1794} {"train_loss": -12.304559707641602, "global_step": 301546, "epoch": 1794} {"train_loss": -12.568557739257812, "global_step": 301547, "epoch": 1794} {"train_loss": -12.34819221496582, "global_step": 301548, "epoch": 1794} {"train_loss": -12.320344924926758, "global_step": 301549, "epoch": 1794} {"train_loss": -12.286673545837402, "global_step": 301550, "epoch": 1794} {"train_loss": -12.173803329467773, "global_step": 301551, "epoch": 1794} {"train_loss": -12.295787811279297, "global_step": 301552, "epoch": 1794} {"train_loss": -12.378952026367188, "global_step": 301553, "epoch": 1794} {"train_loss": -12.396601676940918, "global_step": 301554, "epoch": 1794} {"train_loss": -11.912879943847656, "global_step": 301555, "epoch": 1794} {"train_loss": -12.480642318725586, "global_step": 301556, "epoch": 1794} {"train_loss": -11.582332611083984, "global_step": 301557, "epoch": 1794} {"train_loss": -11.236494064331055, "global_step": 301558, "epoch": 1794} {"train_loss": -11.758739681470962, "global_step": 301559, "epoch": 1794, "val_loss": 280800.09375} {"train_loss": -12.519123077392578, "global_step": 301560, "epoch": 1795} {"train_loss": -11.839639663696289, "global_step": 301561, "epoch": 1795} {"train_loss": -11.875572204589844, "global_step": 301562, "epoch": 1795} {"train_loss": -12.577627182006836, "global_step": 301563, "epoch": 1795} {"train_loss": -11.777826309204102, "global_step": 301564, "epoch": 1795} {"train_loss": -11.121892929077148, "global_step": 301565, "epoch": 1795} {"train_loss": -11.749425888061523, "global_step": 301566, "epoch": 1795} {"train_loss": -9.63737678527832, "global_step": 301567, "epoch": 1795} {"train_loss": -11.160608291625977, "global_step": 301568, "epoch": 1795} {"train_loss": -11.130404472351074, "global_step": 301569, "epoch": 1795} {"train_loss": -10.244519233703613, "global_step": 301570, "epoch": 1795} {"train_loss": -9.94149112701416, "global_step": 301571, "epoch": 1795} {"train_loss": -10.908976554870605, "global_step": 301572, "epoch": 1795} {"train_loss": -9.355094909667969, "global_step": 301573, "epoch": 1795} {"train_loss": -11.225757598876953, "global_step": 301574, "epoch": 1795} {"train_loss": -10.113731384277344, "global_step": 301575, "epoch": 1795} {"train_loss": -10.868682861328125, "global_step": 301576, "epoch": 1795} {"train_loss": -11.024673461914062, "global_step": 301577, "epoch": 1795} {"train_loss": -10.402406692504883, "global_step": 301578, "epoch": 1795} {"train_loss": -11.544462203979492, "global_step": 301579, "epoch": 1795} {"train_loss": -10.465278625488281, "global_step": 301580, "epoch": 1795} {"train_loss": -11.410543441772461, "global_step": 301581, "epoch": 1795} {"train_loss": -11.337260246276855, "global_step": 301582, "epoch": 1795} {"train_loss": -11.015230178833008, "global_step": 301583, "epoch": 1795} {"train_loss": -10.95438003540039, "global_step": 301584, "epoch": 1795} {"train_loss": -10.767889976501465, "global_step": 301585, "epoch": 1795} {"train_loss": -11.415201187133789, "global_step": 301586, "epoch": 1795} {"train_loss": -9.598299980163574, "global_step": 301587, "epoch": 1795} {"train_loss": -11.905572891235352, "global_step": 301588, "epoch": 1795} {"train_loss": -11.057403564453125, "global_step": 301589, "epoch": 1795} {"train_loss": -11.339131355285645, "global_step": 301590, "epoch": 1795} {"train_loss": -10.709519386291504, "global_step": 301591, "epoch": 1795} {"train_loss": -10.985261917114258, "global_step": 301592, "epoch": 1795} {"train_loss": -11.479679107666016, "global_step": 301593, "epoch": 1795} {"train_loss": -11.409462928771973, "global_step": 301594, "epoch": 1795} {"train_loss": -11.04196548461914, "global_step": 301595, "epoch": 1795} {"train_loss": -11.775495529174805, "global_step": 301596, "epoch": 1795} {"train_loss": -10.810491561889648, "global_step": 301597, "epoch": 1795} {"train_loss": -11.761974334716797, "global_step": 301598, "epoch": 1795} {"train_loss": -11.383359909057617, "global_step": 301599, "epoch": 1795} {"train_loss": -11.455562591552734, "global_step": 301600, "epoch": 1795} {"train_loss": -11.545846939086914, "global_step": 301601, "epoch": 1795} {"train_loss": -11.45283031463623, "global_step": 301602, "epoch": 1795} {"train_loss": -11.410079956054688, "global_step": 301603, "epoch": 1795} {"train_loss": -11.644400596618652, "global_step": 301604, "epoch": 1795} {"train_loss": -10.487918853759766, "global_step": 301605, "epoch": 1795} {"train_loss": -11.908461570739746, "global_step": 301606, "epoch": 1795} {"train_loss": -10.992572784423828, "global_step": 301607, "epoch": 1795} {"train_loss": -11.788092613220215, "global_step": 301608, "epoch": 1795} {"train_loss": -11.75352668762207, "global_step": 301609, "epoch": 1795} {"train_loss": -11.164077758789062, "global_step": 301610, "epoch": 1795} {"train_loss": -11.78919792175293, "global_step": 301611, "epoch": 1795} {"train_loss": -11.835466384887695, "global_step": 301612, "epoch": 1795} {"train_loss": -11.569534301757812, "global_step": 301613, "epoch": 1795} {"train_loss": -12.163488388061523, "global_step": 301614, "epoch": 1795} {"train_loss": -11.400496482849121, "global_step": 301615, "epoch": 1795} {"train_loss": -12.139839172363281, "global_step": 301616, "epoch": 1795} {"train_loss": -11.760579109191895, "global_step": 301617, "epoch": 1795} {"train_loss": -11.806127548217773, "global_step": 301618, "epoch": 1795} {"train_loss": -12.075692176818848, "global_step": 301619, "epoch": 1795} {"train_loss": -11.471612930297852, "global_step": 301620, "epoch": 1795} {"train_loss": -11.948968887329102, "global_step": 301621, "epoch": 1795} {"train_loss": -11.725353240966797, "global_step": 301622, "epoch": 1795} {"train_loss": -11.986028671264648, "global_step": 301623, "epoch": 1795} {"train_loss": -12.06131649017334, "global_step": 301624, "epoch": 1795} {"train_loss": -11.907955169677734, "global_step": 301625, "epoch": 1795} {"train_loss": -12.132822036743164, "global_step": 301626, "epoch": 1795} {"train_loss": -11.928857803344727, "global_step": 301627, "epoch": 1795} {"train_loss": -12.057734489440918, "global_step": 301628, "epoch": 1795} {"train_loss": -12.18498706817627, "global_step": 301629, "epoch": 1795} {"train_loss": -12.078865051269531, "global_step": 301630, "epoch": 1795} {"train_loss": -12.087642669677734, "global_step": 301631, "epoch": 1795} {"train_loss": -12.069210052490234, "global_step": 301632, "epoch": 1795} {"train_loss": -11.749000549316406, "global_step": 301633, "epoch": 1795} {"train_loss": -12.133331298828125, "global_step": 301634, "epoch": 1795} {"train_loss": -12.130517959594727, "global_step": 301635, "epoch": 1795} {"train_loss": -12.291817665100098, "global_step": 301636, "epoch": 1795} {"train_loss": -12.061687469482422, "global_step": 301637, "epoch": 1795} {"train_loss": -12.403800964355469, "global_step": 301638, "epoch": 1795} {"train_loss": -12.267155647277832, "global_step": 301639, "epoch": 1795} {"train_loss": -12.173494338989258, "global_step": 301640, "epoch": 1795} {"train_loss": -12.165355682373047, "global_step": 301641, "epoch": 1795} {"train_loss": -12.188876152038574, "global_step": 301642, "epoch": 1795} {"train_loss": -12.256561279296875, "global_step": 301643, "epoch": 1795} {"train_loss": -12.256582260131836, "global_step": 301644, "epoch": 1795} {"train_loss": -12.092735290527344, "global_step": 301645, "epoch": 1795} {"train_loss": -12.284651756286621, "global_step": 301646, "epoch": 1795} {"train_loss": -12.231000900268555, "global_step": 301647, "epoch": 1795} {"train_loss": -12.32866096496582, "global_step": 301648, "epoch": 1795} {"train_loss": -12.416200637817383, "global_step": 301649, "epoch": 1795} {"train_loss": -12.044147491455078, "global_step": 301650, "epoch": 1795} {"train_loss": -12.391849517822266, "global_step": 301651, "epoch": 1795} {"train_loss": -12.278829574584961, "global_step": 301652, "epoch": 1795} {"train_loss": -12.161691665649414, "global_step": 301653, "epoch": 1795} {"train_loss": -12.197957038879395, "global_step": 301654, "epoch": 1795} {"train_loss": -12.13522720336914, "global_step": 301655, "epoch": 1795} {"train_loss": -12.349847793579102, "global_step": 301656, "epoch": 1795} {"train_loss": -12.386796951293945, "global_step": 301657, "epoch": 1795} {"train_loss": -12.261341094970703, "global_step": 301658, "epoch": 1795} {"train_loss": -12.448263168334961, "global_step": 301659, "epoch": 1795} {"train_loss": -12.256406784057617, "global_step": 301660, "epoch": 1795} {"train_loss": -12.247961044311523, "global_step": 301661, "epoch": 1795} {"train_loss": -12.323122024536133, "global_step": 301662, "epoch": 1795} {"train_loss": -12.110507011413574, "global_step": 301663, "epoch": 1795} {"train_loss": -12.250896453857422, "global_step": 301664, "epoch": 1795} {"train_loss": -12.155420303344727, "global_step": 301665, "epoch": 1795} {"train_loss": -12.258404731750488, "global_step": 301666, "epoch": 1795} {"train_loss": -11.792327880859375, "global_step": 301667, "epoch": 1795} {"train_loss": -12.096261978149414, "global_step": 301668, "epoch": 1795} {"train_loss": -12.395668983459473, "global_step": 301669, "epoch": 1795} {"train_loss": -12.287851333618164, "global_step": 301670, "epoch": 1795} {"train_loss": -12.099056243896484, "global_step": 301671, "epoch": 1795} {"train_loss": -11.818800926208496, "global_step": 301672, "epoch": 1795} {"train_loss": -12.448568344116211, "global_step": 301673, "epoch": 1795} {"train_loss": -12.239916801452637, "global_step": 301674, "epoch": 1795} {"train_loss": -12.205328941345215, "global_step": 301675, "epoch": 1795} {"train_loss": -12.185403823852539, "global_step": 301676, "epoch": 1795} {"train_loss": -12.26723861694336, "global_step": 301677, "epoch": 1795} {"train_loss": -12.21558666229248, "global_step": 301678, "epoch": 1795} {"train_loss": -12.329449653625488, "global_step": 301679, "epoch": 1795} {"train_loss": -12.095691680908203, "global_step": 301680, "epoch": 1795} {"train_loss": -12.553319931030273, "global_step": 301681, "epoch": 1795} {"train_loss": -11.986366271972656, "global_step": 301682, "epoch": 1795} {"train_loss": -12.152758598327637, "global_step": 301683, "epoch": 1795} {"train_loss": -12.381088256835938, "global_step": 301684, "epoch": 1795} {"train_loss": -12.354894638061523, "global_step": 301685, "epoch": 1795} {"train_loss": -12.13151741027832, "global_step": 301686, "epoch": 1795} {"train_loss": -12.513431549072266, "global_step": 301687, "epoch": 1795} {"train_loss": -12.257619857788086, "global_step": 301688, "epoch": 1795} {"train_loss": -12.24075698852539, "global_step": 301689, "epoch": 1795} {"train_loss": -12.479110717773438, "global_step": 301690, "epoch": 1795} {"train_loss": -11.940301895141602, "global_step": 301691, "epoch": 1795} {"train_loss": -11.689702033996582, "global_step": 301692, "epoch": 1795} {"train_loss": -12.299420356750488, "global_step": 301693, "epoch": 1795} {"train_loss": -12.215572357177734, "global_step": 301694, "epoch": 1795} {"train_loss": -11.572296142578125, "global_step": 301695, "epoch": 1795} {"train_loss": -11.890722274780273, "global_step": 301696, "epoch": 1795} {"train_loss": -11.716445922851562, "global_step": 301697, "epoch": 1795} {"train_loss": -12.560644149780273, "global_step": 301698, "epoch": 1795} {"train_loss": -11.358938217163086, "global_step": 301699, "epoch": 1795} {"train_loss": -11.308685302734375, "global_step": 301700, "epoch": 1795} {"train_loss": -12.266654014587402, "global_step": 301701, "epoch": 1795} {"train_loss": -11.839632034301758, "global_step": 301702, "epoch": 1795} {"train_loss": -12.047881126403809, "global_step": 301703, "epoch": 1795} {"train_loss": -12.080121040344238, "global_step": 301704, "epoch": 1795} {"train_loss": -11.856847763061523, "global_step": 301705, "epoch": 1795} {"train_loss": -11.825641632080078, "global_step": 301706, "epoch": 1795} {"train_loss": -11.977631568908691, "global_step": 301707, "epoch": 1795} {"train_loss": -11.05735969543457, "global_step": 301708, "epoch": 1795} {"train_loss": -11.83427619934082, "global_step": 301709, "epoch": 1795} {"train_loss": -11.498100280761719, "global_step": 301710, "epoch": 1795} {"train_loss": -11.89120864868164, "global_step": 301711, "epoch": 1795} {"train_loss": -10.233736038208008, "global_step": 301712, "epoch": 1795} {"train_loss": -11.709449768066406, "global_step": 301713, "epoch": 1795} {"train_loss": -11.174413681030273, "global_step": 301714, "epoch": 1795} {"train_loss": -10.397904396057129, "global_step": 301715, "epoch": 1795} {"train_loss": -9.879095077514648, "global_step": 301716, "epoch": 1795} {"train_loss": -10.245301246643066, "global_step": 301717, "epoch": 1795} {"train_loss": -10.90662670135498, "global_step": 301718, "epoch": 1795} {"train_loss": -9.700897216796875, "global_step": 301719, "epoch": 1795} {"train_loss": -11.715300559997559, "global_step": 301720, "epoch": 1795} {"train_loss": -10.358924865722656, "global_step": 301721, "epoch": 1795} {"train_loss": -9.807547569274902, "global_step": 301722, "epoch": 1795} {"train_loss": -10.56509780883789, "global_step": 301723, "epoch": 1795} {"train_loss": -8.456052780151367, "global_step": 301724, "epoch": 1795} {"train_loss": -8.169595718383789, "global_step": 301725, "epoch": 1795} {"train_loss": -9.413455963134766, "global_step": 301726, "epoch": 1795} {"train_loss": -11.615602538699196, "global_step": 301727, "epoch": 1795, "val_loss": 281215.78125, "train_action_mse_error": 4.501954078674316} {"train_loss": -9.223993301391602, "global_step": 301728, "epoch": 1796} {"train_loss": -8.342430114746094, "global_step": 301729, "epoch": 1796} {"train_loss": -9.363277435302734, "global_step": 301730, "epoch": 1796} {"train_loss": -8.157611846923828, "global_step": 301731, "epoch": 1796} {"train_loss": -8.850384712219238, "global_step": 301732, "epoch": 1796} {"train_loss": -10.849111557006836, "global_step": 301733, "epoch": 1796} {"train_loss": -8.877848625183105, "global_step": 301734, "epoch": 1796} {"train_loss": -7.667346000671387, "global_step": 301735, "epoch": 1796} {"train_loss": -8.53742790222168, "global_step": 301736, "epoch": 1796} {"train_loss": -8.758556365966797, "global_step": 301737, "epoch": 1796} {"train_loss": -9.322187423706055, "global_step": 301738, "epoch": 1796} {"train_loss": -10.284034729003906, "global_step": 301739, "epoch": 1796} {"train_loss": -9.916086196899414, "global_step": 301740, "epoch": 1796} {"train_loss": -8.921024322509766, "global_step": 301741, "epoch": 1796} {"train_loss": -10.554464340209961, "global_step": 301742, "epoch": 1796} {"train_loss": -10.448681831359863, "global_step": 301743, "epoch": 1796} {"train_loss": -9.761122703552246, "global_step": 301744, "epoch": 1796} {"train_loss": -10.014135360717773, "global_step": 301745, "epoch": 1796} {"train_loss": -10.510323524475098, "global_step": 301746, "epoch": 1796} {"train_loss": -10.214753150939941, "global_step": 301747, "epoch": 1796} {"train_loss": -10.736296653747559, "global_step": 301748, "epoch": 1796} {"train_loss": -11.59117603302002, "global_step": 301749, "epoch": 1796} {"train_loss": -11.274456977844238, "global_step": 301750, "epoch": 1796} {"train_loss": -11.444122314453125, "global_step": 301751, "epoch": 1796} {"train_loss": -11.397944450378418, "global_step": 301752, "epoch": 1796} {"train_loss": -11.356143951416016, "global_step": 301753, "epoch": 1796} {"train_loss": -11.254926681518555, "global_step": 301754, "epoch": 1796} {"train_loss": -11.613289833068848, "global_step": 301755, "epoch": 1796} {"train_loss": -11.254129409790039, "global_step": 301756, "epoch": 1796} {"train_loss": -11.236326217651367, "global_step": 301757, "epoch": 1796} {"train_loss": -11.606903076171875, "global_step": 301758, "epoch": 1796} {"train_loss": -11.47604751586914, "global_step": 301759, "epoch": 1796} {"train_loss": -11.739703178405762, "global_step": 301760, "epoch": 1796} {"train_loss": -11.69410514831543, "global_step": 301761, "epoch": 1796} {"train_loss": -11.728841781616211, "global_step": 301762, "epoch": 1796} {"train_loss": -11.729562759399414, "global_step": 301763, "epoch": 1796} {"train_loss": -11.96440315246582, "global_step": 301764, "epoch": 1796} {"train_loss": -11.792569160461426, "global_step": 301765, "epoch": 1796} {"train_loss": -11.869327545166016, "global_step": 301766, "epoch": 1796} {"train_loss": -11.960596084594727, "global_step": 301767, "epoch": 1796} {"train_loss": -11.854646682739258, "global_step": 301768, "epoch": 1796} {"train_loss": -11.845442771911621, "global_step": 301769, "epoch": 1796} {"train_loss": -11.785409927368164, "global_step": 301770, "epoch": 1796} {"train_loss": -11.688471794128418, "global_step": 301771, "epoch": 1796} {"train_loss": -11.865883827209473, "global_step": 301772, "epoch": 1796} {"train_loss": -11.732234954833984, "global_step": 301773, "epoch": 1796} {"train_loss": -11.81644058227539, "global_step": 301774, "epoch": 1796} {"train_loss": -11.945554733276367, "global_step": 301775, "epoch": 1796} {"train_loss": -11.926486015319824, "global_step": 301776, "epoch": 1796} {"train_loss": -11.977442741394043, "global_step": 301777, "epoch": 1796} {"train_loss": -12.01083755493164, "global_step": 301778, "epoch": 1796} {"train_loss": -11.745969772338867, "global_step": 301779, "epoch": 1796} {"train_loss": -12.078025817871094, "global_step": 301780, "epoch": 1796} {"train_loss": -12.09931755065918, "global_step": 301781, "epoch": 1796} {"train_loss": -12.03675651550293, "global_step": 301782, "epoch": 1796} {"train_loss": -12.081274032592773, "global_step": 301783, "epoch": 1796} {"train_loss": -12.094837188720703, "global_step": 301784, "epoch": 1796} {"train_loss": -11.937482833862305, "global_step": 301785, "epoch": 1796} {"train_loss": -12.12446403503418, "global_step": 301786, "epoch": 1796} {"train_loss": -11.872030258178711, "global_step": 301787, "epoch": 1796} {"train_loss": -12.0794095993042, "global_step": 301788, "epoch": 1796} {"train_loss": -12.103864669799805, "global_step": 301789, "epoch": 1796} {"train_loss": -12.092700958251953, "global_step": 301790, "epoch": 1796} {"train_loss": -12.166463851928711, "global_step": 301791, "epoch": 1796} {"train_loss": -11.81716537475586, "global_step": 301792, "epoch": 1796} {"train_loss": -11.943954467773438, "global_step": 301793, "epoch": 1796} {"train_loss": -12.01565170288086, "global_step": 301794, "epoch": 1796} {"train_loss": -12.067157745361328, "global_step": 301795, "epoch": 1796} {"train_loss": -12.318574905395508, "global_step": 301796, "epoch": 1796} {"train_loss": -12.103424072265625, "global_step": 301797, "epoch": 1796} {"train_loss": -12.054618835449219, "global_step": 301798, "epoch": 1796} {"train_loss": -12.17518424987793, "global_step": 301799, "epoch": 1796} {"train_loss": -12.10975456237793, "global_step": 301800, "epoch": 1796} {"train_loss": -11.750345230102539, "global_step": 301801, "epoch": 1796} {"train_loss": -12.425674438476562, "global_step": 301802, "epoch": 1796} {"train_loss": -11.830961227416992, "global_step": 301803, "epoch": 1796} {"train_loss": -11.667828559875488, "global_step": 301804, "epoch": 1796} {"train_loss": -12.232407569885254, "global_step": 301805, "epoch": 1796} {"train_loss": -11.649801254272461, "global_step": 301806, "epoch": 1796} {"train_loss": -11.958619117736816, "global_step": 301807, "epoch": 1796} {"train_loss": -12.092761993408203, "global_step": 301808, "epoch": 1796} {"train_loss": -11.189842224121094, "global_step": 301809, "epoch": 1796} {"train_loss": -11.993318557739258, "global_step": 301810, "epoch": 1796} {"train_loss": -11.813039779663086, "global_step": 301811, "epoch": 1796} {"train_loss": -11.353167533874512, "global_step": 301812, "epoch": 1796} {"train_loss": -12.142139434814453, "global_step": 301813, "epoch": 1796} {"train_loss": -11.579866409301758, "global_step": 301814, "epoch": 1796} {"train_loss": -11.479524612426758, "global_step": 301815, "epoch": 1796} {"train_loss": -11.997797012329102, "global_step": 301816, "epoch": 1796} {"train_loss": -12.07872486114502, "global_step": 301817, "epoch": 1796} {"train_loss": -12.028033256530762, "global_step": 301818, "epoch": 1796} {"train_loss": -12.076955795288086, "global_step": 301819, "epoch": 1796} {"train_loss": -12.050213813781738, "global_step": 301820, "epoch": 1796} {"train_loss": -10.765063285827637, "global_step": 301821, "epoch": 1796} {"train_loss": -12.316539764404297, "global_step": 301822, "epoch": 1796} {"train_loss": -11.146297454833984, "global_step": 301823, "epoch": 1796} {"train_loss": -12.088438987731934, "global_step": 301824, "epoch": 1796} {"train_loss": -11.785360336303711, "global_step": 301825, "epoch": 1796} {"train_loss": -11.25387954711914, "global_step": 301826, "epoch": 1796} {"train_loss": -11.387263298034668, "global_step": 301827, "epoch": 1796} {"train_loss": -10.602123260498047, "global_step": 301828, "epoch": 1796} {"train_loss": -9.399073600769043, "global_step": 301829, "epoch": 1796} {"train_loss": -10.088485717773438, "global_step": 301830, "epoch": 1796} {"train_loss": -9.960397720336914, "global_step": 301831, "epoch": 1796} {"train_loss": -10.359564781188965, "global_step": 301832, "epoch": 1796} {"train_loss": -10.512065887451172, "global_step": 301833, "epoch": 1796} {"train_loss": -9.872864723205566, "global_step": 301834, "epoch": 1796} {"train_loss": -10.835975646972656, "global_step": 301835, "epoch": 1796} {"train_loss": -10.9044189453125, "global_step": 301836, "epoch": 1796} {"train_loss": -10.546302795410156, "global_step": 301837, "epoch": 1796} {"train_loss": -11.303157806396484, "global_step": 301838, "epoch": 1796} {"train_loss": -10.39059829711914, "global_step": 301839, "epoch": 1796} {"train_loss": -11.871325492858887, "global_step": 301840, "epoch": 1796} {"train_loss": -10.395792007446289, "global_step": 301841, "epoch": 1796} {"train_loss": -11.83894157409668, "global_step": 301842, "epoch": 1796} {"train_loss": -9.31947135925293, "global_step": 301843, "epoch": 1796} {"train_loss": -11.963909149169922, "global_step": 301844, "epoch": 1796} {"train_loss": -9.964578628540039, "global_step": 301845, "epoch": 1796} {"train_loss": -11.60777473449707, "global_step": 301846, "epoch": 1796} {"train_loss": -10.719593048095703, "global_step": 301847, "epoch": 1796} {"train_loss": -11.668038368225098, "global_step": 301848, "epoch": 1796} {"train_loss": -10.937555313110352, "global_step": 301849, "epoch": 1796} {"train_loss": -11.893444061279297, "global_step": 301850, "epoch": 1796} {"train_loss": -11.485664367675781, "global_step": 301851, "epoch": 1796} {"train_loss": -11.915220260620117, "global_step": 301852, "epoch": 1796} {"train_loss": -11.707306861877441, "global_step": 301853, "epoch": 1796} {"train_loss": -11.884654998779297, "global_step": 301854, "epoch": 1796} {"train_loss": -12.051639556884766, "global_step": 301855, "epoch": 1796} {"train_loss": -11.56399154663086, "global_step": 301856, "epoch": 1796} {"train_loss": -11.990242004394531, "global_step": 301857, "epoch": 1796} {"train_loss": -11.846569061279297, "global_step": 301858, "epoch": 1796} {"train_loss": -11.888750076293945, "global_step": 301859, "epoch": 1796} {"train_loss": -12.005906105041504, "global_step": 301860, "epoch": 1796} {"train_loss": -11.747753143310547, "global_step": 301861, "epoch": 1796} {"train_loss": -11.882255554199219, "global_step": 301862, "epoch": 1796} {"train_loss": -12.03082275390625, "global_step": 301863, "epoch": 1796} {"train_loss": -11.831849098205566, "global_step": 301864, "epoch": 1796} {"train_loss": -11.983227729797363, "global_step": 301865, "epoch": 1796} {"train_loss": -12.165514945983887, "global_step": 301866, "epoch": 1796} {"train_loss": -11.941492080688477, "global_step": 301867, "epoch": 1796} {"train_loss": -12.245776176452637, "global_step": 301868, "epoch": 1796} {"train_loss": -12.056533813476562, "global_step": 301869, "epoch": 1796} {"train_loss": -11.73582935333252, "global_step": 301870, "epoch": 1796} {"train_loss": -12.060394287109375, "global_step": 301871, "epoch": 1796} {"train_loss": -12.129597663879395, "global_step": 301872, "epoch": 1796} {"train_loss": -12.10306167602539, "global_step": 301873, "epoch": 1796} {"train_loss": -12.200143814086914, "global_step": 301874, "epoch": 1796} {"train_loss": -12.166054725646973, "global_step": 301875, "epoch": 1796} {"train_loss": -12.309225082397461, "global_step": 301876, "epoch": 1796} {"train_loss": -12.105966567993164, "global_step": 301877, "epoch": 1796} {"train_loss": -12.133598327636719, "global_step": 301878, "epoch": 1796} {"train_loss": -12.227629661560059, "global_step": 301879, "epoch": 1796} {"train_loss": -12.234954833984375, "global_step": 301880, "epoch": 1796} {"train_loss": -11.850217819213867, "global_step": 301881, "epoch": 1796} {"train_loss": -12.059830665588379, "global_step": 301882, "epoch": 1796} {"train_loss": -12.312324523925781, "global_step": 301883, "epoch": 1796} {"train_loss": -12.226452827453613, "global_step": 301884, "epoch": 1796} {"train_loss": -12.360058784484863, "global_step": 301885, "epoch": 1796} {"train_loss": -12.24131965637207, "global_step": 301886, "epoch": 1796} {"train_loss": -12.065092086791992, "global_step": 301887, "epoch": 1796} {"train_loss": -12.195533752441406, "global_step": 301888, "epoch": 1796} {"train_loss": -12.235292434692383, "global_step": 301889, "epoch": 1796} {"train_loss": -12.143978118896484, "global_step": 301890, "epoch": 1796} {"train_loss": -12.458290100097656, "global_step": 301891, "epoch": 1796} {"train_loss": -12.424358367919922, "global_step": 301892, "epoch": 1796} {"train_loss": -12.205495834350586, "global_step": 301893, "epoch": 1796} {"train_loss": -12.105241775512695, "global_step": 301894, "epoch": 1796} {"train_loss": -11.444987416267395, "global_step": 301895, "epoch": 1796, "val_loss": 284718.03125} {"train_loss": -12.448822975158691, "global_step": 301896, "epoch": 1797} {"train_loss": -12.351021766662598, "global_step": 301897, "epoch": 1797} {"train_loss": -12.261417388916016, "global_step": 301898, "epoch": 1797} {"train_loss": -12.376668930053711, "global_step": 301899, "epoch": 1797} {"train_loss": -12.37558650970459, "global_step": 301900, "epoch": 1797} {"train_loss": -12.02164077758789, "global_step": 301901, "epoch": 1797} {"train_loss": -12.002660751342773, "global_step": 301902, "epoch": 1797} {"train_loss": -12.197288513183594, "global_step": 301903, "epoch": 1797} {"train_loss": -11.820829391479492, "global_step": 301904, "epoch": 1797} {"train_loss": -11.820322036743164, "global_step": 301905, "epoch": 1797} {"train_loss": -11.716368675231934, "global_step": 301906, "epoch": 1797} {"train_loss": -11.583373069763184, "global_step": 301907, "epoch": 1797} {"train_loss": -11.756797790527344, "global_step": 301908, "epoch": 1797} {"train_loss": -11.509331703186035, "global_step": 301909, "epoch": 1797} {"train_loss": -11.806472778320312, "global_step": 301910, "epoch": 1797} {"train_loss": -11.470830917358398, "global_step": 301911, "epoch": 1797} {"train_loss": -11.884469985961914, "global_step": 301912, "epoch": 1797} {"train_loss": -10.801916122436523, "global_step": 301913, "epoch": 1797} {"train_loss": -11.715215682983398, "global_step": 301914, "epoch": 1797} {"train_loss": -11.299919128417969, "global_step": 301915, "epoch": 1797} {"train_loss": -11.911376953125, "global_step": 301916, "epoch": 1797} {"train_loss": -11.256998062133789, "global_step": 301917, "epoch": 1797} {"train_loss": -12.136627197265625, "global_step": 301918, "epoch": 1797} {"train_loss": -11.666839599609375, "global_step": 301919, "epoch": 1797} {"train_loss": -11.89818286895752, "global_step": 301920, "epoch": 1797} {"train_loss": -11.896214485168457, "global_step": 301921, "epoch": 1797} {"train_loss": -12.28925609588623, "global_step": 301922, "epoch": 1797} {"train_loss": -11.82122802734375, "global_step": 301923, "epoch": 1797} {"train_loss": -11.719058990478516, "global_step": 301924, "epoch": 1797} {"train_loss": -12.109047889709473, "global_step": 301925, "epoch": 1797} {"train_loss": -11.534220695495605, "global_step": 301926, "epoch": 1797} {"train_loss": -12.099501609802246, "global_step": 301927, "epoch": 1797} {"train_loss": -10.994477272033691, "global_step": 301928, "epoch": 1797} {"train_loss": -12.129776000976562, "global_step": 301929, "epoch": 1797} {"train_loss": -10.880315780639648, "global_step": 301930, "epoch": 1797} {"train_loss": -12.032028198242188, "global_step": 301931, "epoch": 1797} {"train_loss": -11.158232688903809, "global_step": 301932, "epoch": 1797} {"train_loss": -12.199813842773438, "global_step": 301933, "epoch": 1797} {"train_loss": -11.856363296508789, "global_step": 301934, "epoch": 1797} {"train_loss": -11.962353706359863, "global_step": 301935, "epoch": 1797} {"train_loss": -11.941010475158691, "global_step": 301936, "epoch": 1797} {"train_loss": -12.020784378051758, "global_step": 301937, "epoch": 1797} {"train_loss": -12.127561569213867, "global_step": 301938, "epoch": 1797} {"train_loss": -11.98691177368164, "global_step": 301939, "epoch": 1797} {"train_loss": -12.036343574523926, "global_step": 301940, "epoch": 1797} {"train_loss": -11.724422454833984, "global_step": 301941, "epoch": 1797} {"train_loss": -12.123059272766113, "global_step": 301942, "epoch": 1797} {"train_loss": -12.062461853027344, "global_step": 301943, "epoch": 1797} {"train_loss": -12.166339874267578, "global_step": 301944, "epoch": 1797} {"train_loss": -12.084586143493652, "global_step": 301945, "epoch": 1797} {"train_loss": -11.785024642944336, "global_step": 301946, "epoch": 1797} {"train_loss": -11.5349702835083, "global_step": 301947, "epoch": 1797} {"train_loss": -11.87453842163086, "global_step": 301948, "epoch": 1797} {"train_loss": -11.933228492736816, "global_step": 301949, "epoch": 1797} {"train_loss": -12.003154754638672, "global_step": 301950, "epoch": 1797} {"train_loss": -12.101114273071289, "global_step": 301951, "epoch": 1797} {"train_loss": -11.336711883544922, "global_step": 301952, "epoch": 1797} {"train_loss": -11.827858924865723, "global_step": 301953, "epoch": 1797} {"train_loss": -11.680754661560059, "global_step": 301954, "epoch": 1797} {"train_loss": -11.619699478149414, "global_step": 301955, "epoch": 1797} {"train_loss": -11.9940185546875, "global_step": 301956, "epoch": 1797} {"train_loss": -11.719722747802734, "global_step": 301957, "epoch": 1797} {"train_loss": -12.159265518188477, "global_step": 301958, "epoch": 1797} {"train_loss": -11.856562614440918, "global_step": 301959, "epoch": 1797} {"train_loss": -12.199048042297363, "global_step": 301960, "epoch": 1797} {"train_loss": -11.713542938232422, "global_step": 301961, "epoch": 1797} {"train_loss": -11.872116088867188, "global_step": 301962, "epoch": 1797} {"train_loss": -11.646100997924805, "global_step": 301963, "epoch": 1797} {"train_loss": -11.579060554504395, "global_step": 301964, "epoch": 1797} {"train_loss": -12.09661865234375, "global_step": 301965, "epoch": 1797} {"train_loss": -11.666116714477539, "global_step": 301966, "epoch": 1797} {"train_loss": -11.841706275939941, "global_step": 301967, "epoch": 1797} {"train_loss": -12.256681442260742, "global_step": 301968, "epoch": 1797} {"train_loss": -11.62489128112793, "global_step": 301969, "epoch": 1797} {"train_loss": -11.782127380371094, "global_step": 301970, "epoch": 1797} {"train_loss": -12.236653327941895, "global_step": 301971, "epoch": 1797} {"train_loss": -11.745179176330566, "global_step": 301972, "epoch": 1797} {"train_loss": -11.935931205749512, "global_step": 301973, "epoch": 1797} {"train_loss": -11.90381145477295, "global_step": 301974, "epoch": 1797} {"train_loss": -11.83536148071289, "global_step": 301975, "epoch": 1797} {"train_loss": -11.763315200805664, "global_step": 301976, "epoch": 1797} {"train_loss": -12.093767166137695, "global_step": 301977, "epoch": 1797} {"train_loss": -11.595478057861328, "global_step": 301978, "epoch": 1797} {"train_loss": -12.071165084838867, "global_step": 301979, "epoch": 1797} {"train_loss": -11.692184448242188, "global_step": 301980, "epoch": 1797} {"train_loss": -11.996709823608398, "global_step": 301981, "epoch": 1797} {"train_loss": -12.054726600646973, "global_step": 301982, "epoch": 1797} {"train_loss": -12.03982925415039, "global_step": 301983, "epoch": 1797} {"train_loss": -12.19562816619873, "global_step": 301984, "epoch": 1797} {"train_loss": -12.151693344116211, "global_step": 301985, "epoch": 1797} {"train_loss": -11.670061111450195, "global_step": 301986, "epoch": 1797} {"train_loss": -11.994118690490723, "global_step": 301987, "epoch": 1797} {"train_loss": -11.941040992736816, "global_step": 301988, "epoch": 1797} {"train_loss": -11.938451766967773, "global_step": 301989, "epoch": 1797} {"train_loss": -11.920633316040039, "global_step": 301990, "epoch": 1797} {"train_loss": -12.224135398864746, "global_step": 301991, "epoch": 1797} {"train_loss": -12.099017143249512, "global_step": 301992, "epoch": 1797} {"train_loss": -11.994510650634766, "global_step": 301993, "epoch": 1797} {"train_loss": -11.949495315551758, "global_step": 301994, "epoch": 1797} {"train_loss": -11.806707382202148, "global_step": 301995, "epoch": 1797} {"train_loss": -12.15534496307373, "global_step": 301996, "epoch": 1797} {"train_loss": -11.804479598999023, "global_step": 301997, "epoch": 1797} {"train_loss": -11.700096130371094, "global_step": 301998, "epoch": 1797} {"train_loss": -12.059450149536133, "global_step": 301999, "epoch": 1797} {"train_loss": -11.726231575012207, "global_step": 302000, "epoch": 1797} {"train_loss": -11.484167098999023, "global_step": 302001, "epoch": 1797} {"train_loss": -12.143611907958984, "global_step": 302002, "epoch": 1797} {"train_loss": -11.107904434204102, "global_step": 302003, "epoch": 1797} {"train_loss": -11.545489311218262, "global_step": 302004, "epoch": 1797} {"train_loss": -11.613078117370605, "global_step": 302005, "epoch": 1797} {"train_loss": -11.91856575012207, "global_step": 302006, "epoch": 1797} {"train_loss": -11.131342887878418, "global_step": 302007, "epoch": 1797} {"train_loss": -11.03265380859375, "global_step": 302008, "epoch": 1797} {"train_loss": -11.523541450500488, "global_step": 302009, "epoch": 1797} {"train_loss": -10.66891860961914, "global_step": 302010, "epoch": 1797} {"train_loss": -10.942476272583008, "global_step": 302011, "epoch": 1797} {"train_loss": -10.41505241394043, "global_step": 302012, "epoch": 1797} {"train_loss": -10.314350128173828, "global_step": 302013, "epoch": 1797} {"train_loss": -11.2324857711792, "global_step": 302014, "epoch": 1797} {"train_loss": -10.599726676940918, "global_step": 302015, "epoch": 1797} {"train_loss": -10.415855407714844, "global_step": 302016, "epoch": 1797} {"train_loss": -11.474376678466797, "global_step": 302017, "epoch": 1797} {"train_loss": -10.247011184692383, "global_step": 302018, "epoch": 1797} {"train_loss": -11.935319900512695, "global_step": 302019, "epoch": 1797} {"train_loss": -11.146397590637207, "global_step": 302020, "epoch": 1797} {"train_loss": -11.339422225952148, "global_step": 302021, "epoch": 1797} {"train_loss": -11.31183910369873, "global_step": 302022, "epoch": 1797} {"train_loss": -11.319839477539062, "global_step": 302023, "epoch": 1797} {"train_loss": -11.280509948730469, "global_step": 302024, "epoch": 1797} {"train_loss": -11.540046691894531, "global_step": 302025, "epoch": 1797} {"train_loss": -11.748495101928711, "global_step": 302026, "epoch": 1797} {"train_loss": -11.933279991149902, "global_step": 302027, "epoch": 1797} {"train_loss": -11.895210266113281, "global_step": 302028, "epoch": 1797} {"train_loss": -12.025784492492676, "global_step": 302029, "epoch": 1797} {"train_loss": -11.715845108032227, "global_step": 302030, "epoch": 1797} {"train_loss": -11.568997383117676, "global_step": 302031, "epoch": 1797} {"train_loss": -12.033113479614258, "global_step": 302032, "epoch": 1797} {"train_loss": -11.686749458312988, "global_step": 302033, "epoch": 1797} {"train_loss": -12.054902076721191, "global_step": 302034, "epoch": 1797} {"train_loss": -11.899177551269531, "global_step": 302035, "epoch": 1797} {"train_loss": -11.703681945800781, "global_step": 302036, "epoch": 1797} {"train_loss": -11.753589630126953, "global_step": 302037, "epoch": 1797} {"train_loss": -12.14114761352539, "global_step": 302038, "epoch": 1797} {"train_loss": -11.819669723510742, "global_step": 302039, "epoch": 1797} {"train_loss": -12.001924514770508, "global_step": 302040, "epoch": 1797} {"train_loss": -11.887896537780762, "global_step": 302041, "epoch": 1797} {"train_loss": -12.027440071105957, "global_step": 302042, "epoch": 1797} {"train_loss": -12.106437683105469, "global_step": 302043, "epoch": 1797} {"train_loss": -12.00322151184082, "global_step": 302044, "epoch": 1797} {"train_loss": -11.87308120727539, "global_step": 302045, "epoch": 1797} {"train_loss": -11.928443908691406, "global_step": 302046, "epoch": 1797} {"train_loss": -11.832559585571289, "global_step": 302047, "epoch": 1797} {"train_loss": -12.194456100463867, "global_step": 302048, "epoch": 1797} {"train_loss": -11.823387145996094, "global_step": 302049, "epoch": 1797} {"train_loss": -11.810629844665527, "global_step": 302050, "epoch": 1797} {"train_loss": -12.172066688537598, "global_step": 302051, "epoch": 1797} {"train_loss": -11.91262149810791, "global_step": 302052, "epoch": 1797} {"train_loss": -11.958089828491211, "global_step": 302053, "epoch": 1797} {"train_loss": -11.895284652709961, "global_step": 302054, "epoch": 1797} {"train_loss": -12.186573028564453, "global_step": 302055, "epoch": 1797} {"train_loss": -12.012225151062012, "global_step": 302056, "epoch": 1797} {"train_loss": -11.989635467529297, "global_step": 302057, "epoch": 1797} {"train_loss": -11.868638038635254, "global_step": 302058, "epoch": 1797} {"train_loss": -12.353530883789062, "global_step": 302059, "epoch": 1797} {"train_loss": -12.050005912780762, "global_step": 302060, "epoch": 1797} {"train_loss": -12.143239974975586, "global_step": 302061, "epoch": 1797} {"train_loss": -12.15416431427002, "global_step": 302062, "epoch": 1797} {"train_loss": -11.793233655747914, "global_step": 302063, "epoch": 1797, "val_loss": 282544.65625} {"train_loss": -12.13304328918457, "global_step": 302064, "epoch": 1798} {"train_loss": -12.107908248901367, "global_step": 302065, "epoch": 1798} {"train_loss": -12.14263916015625, "global_step": 302066, "epoch": 1798} {"train_loss": -12.126437187194824, "global_step": 302067, "epoch": 1798} {"train_loss": -12.116744995117188, "global_step": 302068, "epoch": 1798} {"train_loss": -12.398114204406738, "global_step": 302069, "epoch": 1798} {"train_loss": -12.081260681152344, "global_step": 302070, "epoch": 1798} {"train_loss": -12.055529594421387, "global_step": 302071, "epoch": 1798} {"train_loss": -12.08064079284668, "global_step": 302072, "epoch": 1798} {"train_loss": -11.8646240234375, "global_step": 302073, "epoch": 1798} {"train_loss": -12.344470977783203, "global_step": 302074, "epoch": 1798} {"train_loss": -11.610279083251953, "global_step": 302075, "epoch": 1798} {"train_loss": -11.43692684173584, "global_step": 302076, "epoch": 1798} {"train_loss": -12.09716796875, "global_step": 302077, "epoch": 1798} {"train_loss": -12.239181518554688, "global_step": 302078, "epoch": 1798} {"train_loss": -11.726659774780273, "global_step": 302079, "epoch": 1798} {"train_loss": -12.070549964904785, "global_step": 302080, "epoch": 1798} {"train_loss": -11.532806396484375, "global_step": 302081, "epoch": 1798} {"train_loss": -11.202753067016602, "global_step": 302082, "epoch": 1798} {"train_loss": -11.616933822631836, "global_step": 302083, "epoch": 1798} {"train_loss": -10.55291748046875, "global_step": 302084, "epoch": 1798} {"train_loss": -10.843986511230469, "global_step": 302085, "epoch": 1798} {"train_loss": -11.551206588745117, "global_step": 302086, "epoch": 1798} {"train_loss": -11.02562427520752, "global_step": 302087, "epoch": 1798} {"train_loss": -11.013174057006836, "global_step": 302088, "epoch": 1798} {"train_loss": -10.007646560668945, "global_step": 302089, "epoch": 1798} {"train_loss": -11.080720901489258, "global_step": 302090, "epoch": 1798} {"train_loss": -10.889347076416016, "global_step": 302091, "epoch": 1798} {"train_loss": -11.2232666015625, "global_step": 302092, "epoch": 1798} {"train_loss": -11.598869323730469, "global_step": 302093, "epoch": 1798} {"train_loss": -11.732268333435059, "global_step": 302094, "epoch": 1798} {"train_loss": -11.71238899230957, "global_step": 302095, "epoch": 1798} {"train_loss": -11.894061088562012, "global_step": 302096, "epoch": 1798} {"train_loss": -11.94630241394043, "global_step": 302097, "epoch": 1798} {"train_loss": -11.835264205932617, "global_step": 302098, "epoch": 1798} {"train_loss": -11.56092357635498, "global_step": 302099, "epoch": 1798} {"train_loss": -11.2743501663208, "global_step": 302100, "epoch": 1798} {"train_loss": -11.120691299438477, "global_step": 302101, "epoch": 1798} {"train_loss": -11.478874206542969, "global_step": 302102, "epoch": 1798} {"train_loss": -11.842229843139648, "global_step": 302103, "epoch": 1798} {"train_loss": -11.797348022460938, "global_step": 302104, "epoch": 1798} {"train_loss": -11.772016525268555, "global_step": 302105, "epoch": 1798} {"train_loss": -11.952280044555664, "global_step": 302106, "epoch": 1798} {"train_loss": -11.85836124420166, "global_step": 302107, "epoch": 1798} {"train_loss": -11.53777027130127, "global_step": 302108, "epoch": 1798} {"train_loss": -12.259773254394531, "global_step": 302109, "epoch": 1798} {"train_loss": -11.603874206542969, "global_step": 302110, "epoch": 1798} {"train_loss": -12.025522232055664, "global_step": 302111, "epoch": 1798} {"train_loss": -11.850364685058594, "global_step": 302112, "epoch": 1798} {"train_loss": -11.488998413085938, "global_step": 302113, "epoch": 1798} {"train_loss": -11.848740577697754, "global_step": 302114, "epoch": 1798} {"train_loss": -11.802398681640625, "global_step": 302115, "epoch": 1798} {"train_loss": -11.640411376953125, "global_step": 302116, "epoch": 1798} {"train_loss": -11.856746673583984, "global_step": 302117, "epoch": 1798} {"train_loss": -11.390670776367188, "global_step": 302118, "epoch": 1798} {"train_loss": -11.819324493408203, "global_step": 302119, "epoch": 1798} {"train_loss": -11.98529052734375, "global_step": 302120, "epoch": 1798} {"train_loss": -11.904184341430664, "global_step": 302121, "epoch": 1798} {"train_loss": -11.894647598266602, "global_step": 302122, "epoch": 1798} {"train_loss": -12.037558555603027, "global_step": 302123, "epoch": 1798} {"train_loss": -11.786502838134766, "global_step": 302124, "epoch": 1798} {"train_loss": -11.908401489257812, "global_step": 302125, "epoch": 1798} {"train_loss": -11.755043029785156, "global_step": 302126, "epoch": 1798} {"train_loss": -12.004852294921875, "global_step": 302127, "epoch": 1798} {"train_loss": -11.685964584350586, "global_step": 302128, "epoch": 1798} {"train_loss": -12.134092330932617, "global_step": 302129, "epoch": 1798} {"train_loss": -11.661238670349121, "global_step": 302130, "epoch": 1798} {"train_loss": -11.908336639404297, "global_step": 302131, "epoch": 1798} {"train_loss": -12.176639556884766, "global_step": 302132, "epoch": 1798} {"train_loss": -11.712202072143555, "global_step": 302133, "epoch": 1798} {"train_loss": -11.932644844055176, "global_step": 302134, "epoch": 1798} {"train_loss": -11.720364570617676, "global_step": 302135, "epoch": 1798} {"train_loss": -11.531171798706055, "global_step": 302136, "epoch": 1798} {"train_loss": -11.89818000793457, "global_step": 302137, "epoch": 1798} {"train_loss": -11.555416107177734, "global_step": 302138, "epoch": 1798} {"train_loss": -11.708818435668945, "global_step": 302139, "epoch": 1798} {"train_loss": -11.698601722717285, "global_step": 302140, "epoch": 1798} {"train_loss": -11.827936172485352, "global_step": 302141, "epoch": 1798} {"train_loss": -12.098559379577637, "global_step": 302142, "epoch": 1798} {"train_loss": -12.022849082946777, "global_step": 302143, "epoch": 1798} {"train_loss": -12.146942138671875, "global_step": 302144, "epoch": 1798} {"train_loss": -11.961376190185547, "global_step": 302145, "epoch": 1798} {"train_loss": -12.196259498596191, "global_step": 302146, "epoch": 1798} {"train_loss": -12.111507415771484, "global_step": 302147, "epoch": 1798} {"train_loss": -12.108072280883789, "global_step": 302148, "epoch": 1798} {"train_loss": -12.069835662841797, "global_step": 302149, "epoch": 1798} {"train_loss": -11.950963973999023, "global_step": 302150, "epoch": 1798} {"train_loss": -12.243965148925781, "global_step": 302151, "epoch": 1798} {"train_loss": -12.195721626281738, "global_step": 302152, "epoch": 1798} {"train_loss": -11.88662338256836, "global_step": 302153, "epoch": 1798} {"train_loss": -12.247526168823242, "global_step": 302154, "epoch": 1798} {"train_loss": -12.104242324829102, "global_step": 302155, "epoch": 1798} {"train_loss": -12.292776107788086, "global_step": 302156, "epoch": 1798} {"train_loss": -12.318934440612793, "global_step": 302157, "epoch": 1798} {"train_loss": -12.09337329864502, "global_step": 302158, "epoch": 1798} {"train_loss": -12.14976692199707, "global_step": 302159, "epoch": 1798} {"train_loss": -12.206802368164062, "global_step": 302160, "epoch": 1798} {"train_loss": -12.315349578857422, "global_step": 302161, "epoch": 1798} {"train_loss": -12.440130233764648, "global_step": 302162, "epoch": 1798} {"train_loss": -12.369058609008789, "global_step": 302163, "epoch": 1798} {"train_loss": -12.275619506835938, "global_step": 302164, "epoch": 1798} {"train_loss": -12.226184844970703, "global_step": 302165, "epoch": 1798} {"train_loss": -12.306133270263672, "global_step": 302166, "epoch": 1798} {"train_loss": -11.867700576782227, "global_step": 302167, "epoch": 1798} {"train_loss": -11.986835479736328, "global_step": 302168, "epoch": 1798} {"train_loss": -12.165660858154297, "global_step": 302169, "epoch": 1798} {"train_loss": -12.197797775268555, "global_step": 302170, "epoch": 1798} {"train_loss": -11.847450256347656, "global_step": 302171, "epoch": 1798} {"train_loss": -12.173818588256836, "global_step": 302172, "epoch": 1798} {"train_loss": -11.73466682434082, "global_step": 302173, "epoch": 1798} {"train_loss": -11.980018615722656, "global_step": 302174, "epoch": 1798} {"train_loss": -12.214099884033203, "global_step": 302175, "epoch": 1798} {"train_loss": -11.6529541015625, "global_step": 302176, "epoch": 1798} {"train_loss": -12.344396591186523, "global_step": 302177, "epoch": 1798} {"train_loss": -12.406671524047852, "global_step": 302178, "epoch": 1798} {"train_loss": -11.949060440063477, "global_step": 302179, "epoch": 1798} {"train_loss": -12.089298248291016, "global_step": 302180, "epoch": 1798} {"train_loss": -11.313365936279297, "global_step": 302181, "epoch": 1798} {"train_loss": -12.03810977935791, "global_step": 302182, "epoch": 1798} {"train_loss": -11.534051895141602, "global_step": 302183, "epoch": 1798} {"train_loss": -11.601401329040527, "global_step": 302184, "epoch": 1798} {"train_loss": -10.91142463684082, "global_step": 302185, "epoch": 1798} {"train_loss": -11.543947219848633, "global_step": 302186, "epoch": 1798} {"train_loss": -11.536609649658203, "global_step": 302187, "epoch": 1798} {"train_loss": -11.035745620727539, "global_step": 302188, "epoch": 1798} {"train_loss": -11.82809066772461, "global_step": 302189, "epoch": 1798} {"train_loss": -11.803211212158203, "global_step": 302190, "epoch": 1798} {"train_loss": -11.373589515686035, "global_step": 302191, "epoch": 1798} {"train_loss": -11.13402271270752, "global_step": 302192, "epoch": 1798} {"train_loss": -11.768896102905273, "global_step": 302193, "epoch": 1798} {"train_loss": -11.096105575561523, "global_step": 302194, "epoch": 1798} {"train_loss": -10.799176216125488, "global_step": 302195, "epoch": 1798} {"train_loss": -10.837592124938965, "global_step": 302196, "epoch": 1798} {"train_loss": -10.140092849731445, "global_step": 302197, "epoch": 1798} {"train_loss": -10.399714469909668, "global_step": 302198, "epoch": 1798} {"train_loss": -10.432411193847656, "global_step": 302199, "epoch": 1798} {"train_loss": -11.002120971679688, "global_step": 302200, "epoch": 1798} {"train_loss": -10.348637580871582, "global_step": 302201, "epoch": 1798} {"train_loss": -11.043615341186523, "global_step": 302202, "epoch": 1798} {"train_loss": -10.179489135742188, "global_step": 302203, "epoch": 1798} {"train_loss": -11.014906883239746, "global_step": 302204, "epoch": 1798} {"train_loss": -10.624853134155273, "global_step": 302205, "epoch": 1798} {"train_loss": -9.952048301696777, "global_step": 302206, "epoch": 1798} {"train_loss": -10.992874145507812, "global_step": 302207, "epoch": 1798} {"train_loss": -10.195756912231445, "global_step": 302208, "epoch": 1798} {"train_loss": -10.444280624389648, "global_step": 302209, "epoch": 1798} {"train_loss": -11.808032035827637, "global_step": 302210, "epoch": 1798} {"train_loss": -11.199155807495117, "global_step": 302211, "epoch": 1798} {"train_loss": -11.549516677856445, "global_step": 302212, "epoch": 1798} {"train_loss": -10.86868953704834, "global_step": 302213, "epoch": 1798} {"train_loss": -10.909696578979492, "global_step": 302214, "epoch": 1798} {"train_loss": -11.519405364990234, "global_step": 302215, "epoch": 1798} {"train_loss": -10.9662446975708, "global_step": 302216, "epoch": 1798} {"train_loss": -11.496417999267578, "global_step": 302217, "epoch": 1798} {"train_loss": -11.31517219543457, "global_step": 302218, "epoch": 1798} {"train_loss": -11.176292419433594, "global_step": 302219, "epoch": 1798} {"train_loss": -11.814016342163086, "global_step": 302220, "epoch": 1798} {"train_loss": -11.246637344360352, "global_step": 302221, "epoch": 1798} {"train_loss": -11.1577787399292, "global_step": 302222, "epoch": 1798} {"train_loss": -11.75063419342041, "global_step": 302223, "epoch": 1798} {"train_loss": -10.950112342834473, "global_step": 302224, "epoch": 1798} {"train_loss": -11.763279914855957, "global_step": 302225, "epoch": 1798} {"train_loss": -11.58905029296875, "global_step": 302226, "epoch": 1798} {"train_loss": -11.648821830749512, "global_step": 302227, "epoch": 1798} {"train_loss": -11.685981750488281, "global_step": 302228, "epoch": 1798} {"train_loss": -11.722000122070312, "global_step": 302229, "epoch": 1798} {"train_loss": -11.591841697692871, "global_step": 302230, "epoch": 1798} {"train_loss": -11.650449099994841, "global_step": 302231, "epoch": 1798, "val_loss": 281224.78125} {"train_loss": -11.649391174316406, "global_step": 302232, "epoch": 1799} {"train_loss": -12.012495994567871, "global_step": 302233, "epoch": 1799} {"train_loss": -11.497384071350098, "global_step": 302234, "epoch": 1799} {"train_loss": -12.047048568725586, "global_step": 302235, "epoch": 1799} {"train_loss": -11.912698745727539, "global_step": 302236, "epoch": 1799} {"train_loss": -11.907764434814453, "global_step": 302237, "epoch": 1799} {"train_loss": -12.145671844482422, "global_step": 302238, "epoch": 1799} {"train_loss": -11.994186401367188, "global_step": 302239, "epoch": 1799} {"train_loss": -11.990726470947266, "global_step": 302240, "epoch": 1799} {"train_loss": -12.124910354614258, "global_step": 302241, "epoch": 1799} {"train_loss": -11.95378303527832, "global_step": 302242, "epoch": 1799} {"train_loss": -12.020211219787598, "global_step": 302243, "epoch": 1799} {"train_loss": -12.09107780456543, "global_step": 302244, "epoch": 1799} {"train_loss": -11.820623397827148, "global_step": 302245, "epoch": 1799} {"train_loss": -12.154147148132324, "global_step": 302246, "epoch": 1799} {"train_loss": -12.124683380126953, "global_step": 302247, "epoch": 1799} {"train_loss": -12.208516120910645, "global_step": 302248, "epoch": 1799} {"train_loss": -12.189897537231445, "global_step": 302249, "epoch": 1799} {"train_loss": -12.159971237182617, "global_step": 302250, "epoch": 1799} {"train_loss": -12.304550170898438, "global_step": 302251, "epoch": 1799} {"train_loss": -12.011837005615234, "global_step": 302252, "epoch": 1799} {"train_loss": -12.093505859375, "global_step": 302253, "epoch": 1799} {"train_loss": -11.878332138061523, "global_step": 302254, "epoch": 1799} {"train_loss": -12.314793586730957, "global_step": 302255, "epoch": 1799} {"train_loss": -12.142047882080078, "global_step": 302256, "epoch": 1799} {"train_loss": -12.157381057739258, "global_step": 302257, "epoch": 1799} {"train_loss": -11.956001281738281, "global_step": 302258, "epoch": 1799} {"train_loss": -12.325174331665039, "global_step": 302259, "epoch": 1799} {"train_loss": -12.337183952331543, "global_step": 302260, "epoch": 1799} {"train_loss": -12.303242683410645, "global_step": 302261, "epoch": 1799} {"train_loss": -12.307923316955566, "global_step": 302262, "epoch": 1799} {"train_loss": -12.122753143310547, "global_step": 302263, "epoch": 1799} {"train_loss": -12.039359092712402, "global_step": 302264, "epoch": 1799} {"train_loss": -12.02273941040039, "global_step": 302265, "epoch": 1799} {"train_loss": -12.272421836853027, "global_step": 302266, "epoch": 1799} {"train_loss": -11.94588565826416, "global_step": 302267, "epoch": 1799} {"train_loss": -12.303638458251953, "global_step": 302268, "epoch": 1799} {"train_loss": -12.010101318359375, "global_step": 302269, "epoch": 1799} {"train_loss": -12.173469543457031, "global_step": 302270, "epoch": 1799} {"train_loss": -11.913408279418945, "global_step": 302271, "epoch": 1799} {"train_loss": -12.204423904418945, "global_step": 302272, "epoch": 1799} {"train_loss": -11.92148208618164, "global_step": 302273, "epoch": 1799} {"train_loss": -12.08203125, "global_step": 302274, "epoch": 1799} {"train_loss": -11.92835807800293, "global_step": 302275, "epoch": 1799} {"train_loss": -12.503355026245117, "global_step": 302276, "epoch": 1799} {"train_loss": -11.645369529724121, "global_step": 302277, "epoch": 1799} {"train_loss": -12.356091499328613, "global_step": 302278, "epoch": 1799} {"train_loss": -11.901864051818848, "global_step": 302279, "epoch": 1799} {"train_loss": -12.16842269897461, "global_step": 302280, "epoch": 1799} {"train_loss": -11.894975662231445, "global_step": 302281, "epoch": 1799} {"train_loss": -12.060945510864258, "global_step": 302282, "epoch": 1799} {"train_loss": -12.317380905151367, "global_step": 302283, "epoch": 1799} {"train_loss": -12.291215896606445, "global_step": 302284, "epoch": 1799} {"train_loss": -12.27763557434082, "global_step": 302285, "epoch": 1799} {"train_loss": -12.424155235290527, "global_step": 302286, "epoch": 1799} {"train_loss": -12.203479766845703, "global_step": 302287, "epoch": 1799} {"train_loss": -11.822985649108887, "global_step": 302288, "epoch": 1799} {"train_loss": -12.222872734069824, "global_step": 302289, "epoch": 1799} {"train_loss": -11.975679397583008, "global_step": 302290, "epoch": 1799} {"train_loss": -12.091609954833984, "global_step": 302291, "epoch": 1799} {"train_loss": -12.038253784179688, "global_step": 302292, "epoch": 1799} {"train_loss": -11.108378410339355, "global_step": 302293, "epoch": 1799} {"train_loss": -11.497238159179688, "global_step": 302294, "epoch": 1799} {"train_loss": -12.033414840698242, "global_step": 302295, "epoch": 1799} {"train_loss": -11.475265502929688, "global_step": 302296, "epoch": 1799} {"train_loss": -10.800508499145508, "global_step": 302297, "epoch": 1799} {"train_loss": -12.292021751403809, "global_step": 302298, "epoch": 1799} {"train_loss": -10.893426895141602, "global_step": 302299, "epoch": 1799} {"train_loss": -10.457727432250977, "global_step": 302300, "epoch": 1799} {"train_loss": -11.883968353271484, "global_step": 302301, "epoch": 1799} {"train_loss": -11.288263320922852, "global_step": 302302, "epoch": 1799} {"train_loss": -11.287895202636719, "global_step": 302303, "epoch": 1799} {"train_loss": -11.875020027160645, "global_step": 302304, "epoch": 1799} {"train_loss": -11.599845886230469, "global_step": 302305, "epoch": 1799} {"train_loss": -11.482311248779297, "global_step": 302306, "epoch": 1799} {"train_loss": -11.85959529876709, "global_step": 302307, "epoch": 1799} {"train_loss": -10.583784103393555, "global_step": 302308, "epoch": 1799} {"train_loss": -11.690828323364258, "global_step": 302309, "epoch": 1799} {"train_loss": -11.033479690551758, "global_step": 302310, "epoch": 1799} {"train_loss": -11.406453132629395, "global_step": 302311, "epoch": 1799} {"train_loss": -11.032721519470215, "global_step": 302312, "epoch": 1799} {"train_loss": -11.267623901367188, "global_step": 302313, "epoch": 1799} {"train_loss": -11.78779411315918, "global_step": 302314, "epoch": 1799} {"train_loss": -10.686100006103516, "global_step": 302315, "epoch": 1799} {"train_loss": -11.482917785644531, "global_step": 302316, "epoch": 1799} {"train_loss": -10.686637878417969, "global_step": 302317, "epoch": 1799} {"train_loss": -9.9314603805542, "global_step": 302318, "epoch": 1799} {"train_loss": -11.014163970947266, "global_step": 302319, "epoch": 1799} {"train_loss": -10.18208122253418, "global_step": 302320, "epoch": 1799} {"train_loss": -10.690591812133789, "global_step": 302321, "epoch": 1799} {"train_loss": -11.352851867675781, "global_step": 302322, "epoch": 1799} {"train_loss": -10.349411964416504, "global_step": 302323, "epoch": 1799} {"train_loss": -11.476219177246094, "global_step": 302324, "epoch": 1799} {"train_loss": -10.179285049438477, "global_step": 302325, "epoch": 1799} {"train_loss": -10.819923400878906, "global_step": 302326, "epoch": 1799} {"train_loss": -10.384542465209961, "global_step": 302327, "epoch": 1799} {"train_loss": -9.911910057067871, "global_step": 302328, "epoch": 1799} {"train_loss": -9.820072174072266, "global_step": 302329, "epoch": 1799} {"train_loss": -10.707040786743164, "global_step": 302330, "epoch": 1799} {"train_loss": -10.61573600769043, "global_step": 302331, "epoch": 1799} {"train_loss": -10.714676856994629, "global_step": 302332, "epoch": 1799} {"train_loss": -10.068584442138672, "global_step": 302333, "epoch": 1799} {"train_loss": -10.98944091796875, "global_step": 302334, "epoch": 1799} {"train_loss": -10.38444709777832, "global_step": 302335, "epoch": 1799} {"train_loss": -11.022258758544922, "global_step": 302336, "epoch": 1799} {"train_loss": -10.232927322387695, "global_step": 302337, "epoch": 1799} {"train_loss": -10.86525821685791, "global_step": 302338, "epoch": 1799} {"train_loss": -10.90767765045166, "global_step": 302339, "epoch": 1799} {"train_loss": -11.033529281616211, "global_step": 302340, "epoch": 1799} {"train_loss": -11.025358200073242, "global_step": 302341, "epoch": 1799} {"train_loss": -11.546546936035156, "global_step": 302342, "epoch": 1799} {"train_loss": -11.297598838806152, "global_step": 302343, "epoch": 1799} {"train_loss": -11.300128936767578, "global_step": 302344, "epoch": 1799} {"train_loss": -11.601066589355469, "global_step": 302345, "epoch": 1799} {"train_loss": -11.321008682250977, "global_step": 302346, "epoch": 1799} {"train_loss": -12.005175590515137, "global_step": 302347, "epoch": 1799} {"train_loss": -11.647248268127441, "global_step": 302348, "epoch": 1799} {"train_loss": -11.767009735107422, "global_step": 302349, "epoch": 1799} {"train_loss": -11.9422607421875, "global_step": 302350, "epoch": 1799} {"train_loss": -11.733043670654297, "global_step": 302351, "epoch": 1799} {"train_loss": -11.557550430297852, "global_step": 302352, "epoch": 1799} {"train_loss": -11.83619213104248, "global_step": 302353, "epoch": 1799} {"train_loss": -11.752041816711426, "global_step": 302354, "epoch": 1799} {"train_loss": -11.97205924987793, "global_step": 302355, "epoch": 1799} {"train_loss": -11.839929580688477, "global_step": 302356, "epoch": 1799} {"train_loss": -12.120588302612305, "global_step": 302357, "epoch": 1799} {"train_loss": -11.99398422241211, "global_step": 302358, "epoch": 1799} {"train_loss": -11.704221725463867, "global_step": 302359, "epoch": 1799} {"train_loss": -12.055469512939453, "global_step": 302360, "epoch": 1799} {"train_loss": -11.919498443603516, "global_step": 302361, "epoch": 1799} {"train_loss": -11.819782257080078, "global_step": 302362, "epoch": 1799} {"train_loss": -11.83622932434082, "global_step": 302363, "epoch": 1799} {"train_loss": -11.787158966064453, "global_step": 302364, "epoch": 1799} {"train_loss": -11.987363815307617, "global_step": 302365, "epoch": 1799} {"train_loss": -11.987380981445312, "global_step": 302366, "epoch": 1799} {"train_loss": -11.831378936767578, "global_step": 302367, "epoch": 1799} {"train_loss": -12.01101016998291, "global_step": 302368, "epoch": 1799} {"train_loss": -11.871942520141602, "global_step": 302369, "epoch": 1799} {"train_loss": -12.10482120513916, "global_step": 302370, "epoch": 1799} {"train_loss": -12.23295783996582, "global_step": 302371, "epoch": 1799} {"train_loss": -11.930843353271484, "global_step": 302372, "epoch": 1799} {"train_loss": -11.998565673828125, "global_step": 302373, "epoch": 1799} {"train_loss": -12.01276969909668, "global_step": 302374, "epoch": 1799} {"train_loss": -12.067325592041016, "global_step": 302375, "epoch": 1799} {"train_loss": -12.136245727539062, "global_step": 302376, "epoch": 1799} {"train_loss": -12.002113342285156, "global_step": 302377, "epoch": 1799} {"train_loss": -12.114286422729492, "global_step": 302378, "epoch": 1799} {"train_loss": -11.963628768920898, "global_step": 302379, "epoch": 1799} {"train_loss": -12.129722595214844, "global_step": 302380, "epoch": 1799} {"train_loss": -12.102193832397461, "global_step": 302381, "epoch": 1799} {"train_loss": -11.88117790222168, "global_step": 302382, "epoch": 1799} {"train_loss": -12.075037956237793, "global_step": 302383, "epoch": 1799} {"train_loss": -11.920816421508789, "global_step": 302384, "epoch": 1799} {"train_loss": -12.083372116088867, "global_step": 302385, "epoch": 1799} {"train_loss": -11.64769458770752, "global_step": 302386, "epoch": 1799} {"train_loss": -12.074084281921387, "global_step": 302387, "epoch": 1799} {"train_loss": -12.042036056518555, "global_step": 302388, "epoch": 1799} {"train_loss": -12.112546920776367, "global_step": 302389, "epoch": 1799} {"train_loss": -12.273360252380371, "global_step": 302390, "epoch": 1799} {"train_loss": -12.156298637390137, "global_step": 302391, "epoch": 1799} {"train_loss": -12.075249671936035, "global_step": 302392, "epoch": 1799} {"train_loss": -12.29886245727539, "global_step": 302393, "epoch": 1799} {"train_loss": -12.120063781738281, "global_step": 302394, "epoch": 1799} {"train_loss": -12.340331077575684, "global_step": 302395, "epoch": 1799} {"train_loss": -12.03348159790039, "global_step": 302396, "epoch": 1799} {"train_loss": -12.090335845947266, "global_step": 302397, "epoch": 1799} {"train_loss": -11.788604736328125, "global_step": 302398, "epoch": 1799} {"train_loss": -11.711031828607831, "global_step": 302399, "epoch": 1799, "val_loss": 281560.53125} {"train_loss": -11.970319747924805, "global_step": 302400, "epoch": 1800} {"train_loss": -12.23741340637207, "global_step": 302401, "epoch": 1800} {"train_loss": -12.331640243530273, "global_step": 302402, "epoch": 1800} {"train_loss": -12.293519973754883, "global_step": 302403, "epoch": 1800} {"train_loss": -12.277645111083984, "global_step": 302404, "epoch": 1800} {"train_loss": -11.990602493286133, "global_step": 302405, "epoch": 1800} {"train_loss": -12.193171501159668, "global_step": 302406, "epoch": 1800} {"train_loss": -12.257955551147461, "global_step": 302407, "epoch": 1800} {"train_loss": -12.183751106262207, "global_step": 302408, "epoch": 1800} {"train_loss": -12.339320182800293, "global_step": 302409, "epoch": 1800} {"train_loss": -12.402729034423828, "global_step": 302410, "epoch": 1800} {"train_loss": -11.848836898803711, "global_step": 302411, "epoch": 1800} {"train_loss": -12.0449800491333, "global_step": 302412, "epoch": 1800} {"train_loss": -12.201571464538574, "global_step": 302413, "epoch": 1800} {"train_loss": -11.916984558105469, "global_step": 302414, "epoch": 1800} {"train_loss": -11.936283111572266, "global_step": 302415, "epoch": 1800} {"train_loss": -12.28653335571289, "global_step": 302416, "epoch": 1800} {"train_loss": -11.843252182006836, "global_step": 302417, "epoch": 1800} {"train_loss": -12.300570487976074, "global_step": 302418, "epoch": 1800} {"train_loss": -12.084832191467285, "global_step": 302419, "epoch": 1800} {"train_loss": -12.471990585327148, "global_step": 302420, "epoch": 1800} {"train_loss": -12.36289119720459, "global_step": 302421, "epoch": 1800} {"train_loss": -12.296638488769531, "global_step": 302422, "epoch": 1800} {"train_loss": -12.32206916809082, "global_step": 302423, "epoch": 1800} {"train_loss": -12.38394546508789, "global_step": 302424, "epoch": 1800} {"train_loss": -12.41695785522461, "global_step": 302425, "epoch": 1800} {"train_loss": -12.447935104370117, "global_step": 302426, "epoch": 1800} {"train_loss": -12.295355796813965, "global_step": 302427, "epoch": 1800} {"train_loss": -12.310155868530273, "global_step": 302428, "epoch": 1800} {"train_loss": -12.245758056640625, "global_step": 302429, "epoch": 1800} {"train_loss": -12.280905723571777, "global_step": 302430, "epoch": 1800} {"train_loss": -12.346612930297852, "global_step": 302431, "epoch": 1800} {"train_loss": -12.385324478149414, "global_step": 302432, "epoch": 1800} {"train_loss": -11.848658561706543, "global_step": 302433, "epoch": 1800} {"train_loss": -12.01363754272461, "global_step": 302434, "epoch": 1800} {"train_loss": -11.702676773071289, "global_step": 302435, "epoch": 1800} {"train_loss": -12.332889556884766, "global_step": 302436, "epoch": 1800} {"train_loss": -11.533756256103516, "global_step": 302437, "epoch": 1800} {"train_loss": -12.166580200195312, "global_step": 302438, "epoch": 1800} {"train_loss": -11.575593948364258, "global_step": 302439, "epoch": 1800} {"train_loss": -12.10527229309082, "global_step": 302440, "epoch": 1800} {"train_loss": -11.538456916809082, "global_step": 302441, "epoch": 1800} {"train_loss": -12.311484336853027, "global_step": 302442, "epoch": 1800} {"train_loss": -11.595956802368164, "global_step": 302443, "epoch": 1800} {"train_loss": -12.098642349243164, "global_step": 302444, "epoch": 1800} {"train_loss": -10.77288818359375, "global_step": 302445, "epoch": 1800} {"train_loss": -12.015509605407715, "global_step": 302446, "epoch": 1800} {"train_loss": -11.189126014709473, "global_step": 302447, "epoch": 1800} {"train_loss": -10.640180587768555, "global_step": 302448, "epoch": 1800} {"train_loss": -11.617157936096191, "global_step": 302449, "epoch": 1800} {"train_loss": -11.189090728759766, "global_step": 302450, "epoch": 1800} {"train_loss": -11.283823013305664, "global_step": 302451, "epoch": 1800} {"train_loss": -11.754151344299316, "global_step": 302452, "epoch": 1800} {"train_loss": -11.293388366699219, "global_step": 302453, "epoch": 1800} {"train_loss": -11.549371719360352, "global_step": 302454, "epoch": 1800} {"train_loss": -11.746528625488281, "global_step": 302455, "epoch": 1800} {"train_loss": -11.62869930267334, "global_step": 302456, "epoch": 1800} {"train_loss": -11.502077102661133, "global_step": 302457, "epoch": 1800} {"train_loss": -11.65787124633789, "global_step": 302458, "epoch": 1800} {"train_loss": -11.802780151367188, "global_step": 302459, "epoch": 1800} {"train_loss": -11.273109436035156, "global_step": 302460, "epoch": 1800} {"train_loss": -11.639751434326172, "global_step": 302461, "epoch": 1800} {"train_loss": -11.188151359558105, "global_step": 302462, "epoch": 1800} {"train_loss": -10.541484832763672, "global_step": 302463, "epoch": 1800} {"train_loss": -11.631345748901367, "global_step": 302464, "epoch": 1800} {"train_loss": -11.475571632385254, "global_step": 302465, "epoch": 1800} {"train_loss": -11.515274047851562, "global_step": 302466, "epoch": 1800} {"train_loss": -10.779563903808594, "global_step": 302467, "epoch": 1800} {"train_loss": -12.32961368560791, "global_step": 302468, "epoch": 1800} {"train_loss": -11.125711441040039, "global_step": 302469, "epoch": 1800} {"train_loss": -12.249859809875488, "global_step": 302470, "epoch": 1800} {"train_loss": -11.097476959228516, "global_step": 302471, "epoch": 1800} {"train_loss": -11.720486640930176, "global_step": 302472, "epoch": 1800} {"train_loss": -11.656145095825195, "global_step": 302473, "epoch": 1800} {"train_loss": -11.110397338867188, "global_step": 302474, "epoch": 1800} {"train_loss": -11.530977249145508, "global_step": 302475, "epoch": 1800} {"train_loss": -11.29180908203125, "global_step": 302476, "epoch": 1800} {"train_loss": -11.764921188354492, "global_step": 302477, "epoch": 1800} {"train_loss": -11.190292358398438, "global_step": 302478, "epoch": 1800} {"train_loss": -12.303316116333008, "global_step": 302479, "epoch": 1800} {"train_loss": -11.675158500671387, "global_step": 302480, "epoch": 1800} {"train_loss": -11.67012882232666, "global_step": 302481, "epoch": 1800} {"train_loss": -11.962857246398926, "global_step": 302482, "epoch": 1800} {"train_loss": -11.99975299835205, "global_step": 302483, "epoch": 1800} {"train_loss": -11.918935775756836, "global_step": 302484, "epoch": 1800} {"train_loss": -11.849916458129883, "global_step": 302485, "epoch": 1800} {"train_loss": -12.121000289916992, "global_step": 302486, "epoch": 1800} {"train_loss": -11.87930679321289, "global_step": 302487, "epoch": 1800} {"train_loss": -12.190559387207031, "global_step": 302488, "epoch": 1800} {"train_loss": -12.008894920349121, "global_step": 302489, "epoch": 1800} {"train_loss": -12.189486503601074, "global_step": 302490, "epoch": 1800} {"train_loss": -12.07701587677002, "global_step": 302491, "epoch": 1800} {"train_loss": -12.309464454650879, "global_step": 302492, "epoch": 1800} {"train_loss": -12.113247871398926, "global_step": 302493, "epoch": 1800} {"train_loss": -12.248916625976562, "global_step": 302494, "epoch": 1800} {"train_loss": -12.059624671936035, "global_step": 302495, "epoch": 1800} {"train_loss": -12.259913444519043, "global_step": 302496, "epoch": 1800} {"train_loss": -12.109890937805176, "global_step": 302497, "epoch": 1800} {"train_loss": -12.135528564453125, "global_step": 302498, "epoch": 1800} {"train_loss": -11.93478012084961, "global_step": 302499, "epoch": 1800} {"train_loss": -12.238667488098145, "global_step": 302500, "epoch": 1800} {"train_loss": -12.094348907470703, "global_step": 302501, "epoch": 1800} {"train_loss": -12.090354919433594, "global_step": 302502, "epoch": 1800} {"train_loss": -12.15703010559082, "global_step": 302503, "epoch": 1800} {"train_loss": -11.722992897033691, "global_step": 302504, "epoch": 1800} {"train_loss": -11.751500129699707, "global_step": 302505, "epoch": 1800} {"train_loss": -12.43199634552002, "global_step": 302506, "epoch": 1800} {"train_loss": -11.769691467285156, "global_step": 302507, "epoch": 1800} {"train_loss": -11.979653358459473, "global_step": 302508, "epoch": 1800} {"train_loss": -12.266016960144043, "global_step": 302509, "epoch": 1800} {"train_loss": -12.294747352600098, "global_step": 302510, "epoch": 1800} {"train_loss": -11.432750701904297, "global_step": 302511, "epoch": 1800} {"train_loss": -12.082956314086914, "global_step": 302512, "epoch": 1800} {"train_loss": -12.075925827026367, "global_step": 302513, "epoch": 1800} {"train_loss": -11.403657913208008, "global_step": 302514, "epoch": 1800} {"train_loss": -11.984620094299316, "global_step": 302515, "epoch": 1800} {"train_loss": -12.324186325073242, "global_step": 302516, "epoch": 1800} {"train_loss": -12.055710792541504, "global_step": 302517, "epoch": 1800} {"train_loss": -12.020745277404785, "global_step": 302518, "epoch": 1800} {"train_loss": -11.951530456542969, "global_step": 302519, "epoch": 1800} {"train_loss": -12.316749572753906, "global_step": 302520, "epoch": 1800} {"train_loss": -12.109748840332031, "global_step": 302521, "epoch": 1800} {"train_loss": -12.277252197265625, "global_step": 302522, "epoch": 1800} {"train_loss": -12.207255363464355, "global_step": 302523, "epoch": 1800} {"train_loss": -12.061598777770996, "global_step": 302524, "epoch": 1800} {"train_loss": -12.016324996948242, "global_step": 302525, "epoch": 1800} {"train_loss": -12.333714485168457, "global_step": 302526, "epoch": 1800} {"train_loss": -11.714994430541992, "global_step": 302527, "epoch": 1800} {"train_loss": -12.210077285766602, "global_step": 302528, "epoch": 1800} {"train_loss": -12.084405899047852, "global_step": 302529, "epoch": 1800} {"train_loss": -12.129632949829102, "global_step": 302530, "epoch": 1800} {"train_loss": -12.413593292236328, "global_step": 302531, "epoch": 1800} {"train_loss": -11.900141716003418, "global_step": 302532, "epoch": 1800} {"train_loss": -12.317130088806152, "global_step": 302533, "epoch": 1800} {"train_loss": -12.074897766113281, "global_step": 302534, "epoch": 1800} {"train_loss": -11.96651554107666, "global_step": 302535, "epoch": 1800} {"train_loss": -12.410924911499023, "global_step": 302536, "epoch": 1800} {"train_loss": -12.17469310760498, "global_step": 302537, "epoch": 1800} {"train_loss": -12.254030227661133, "global_step": 302538, "epoch": 1800} {"train_loss": -12.13087272644043, "global_step": 302539, "epoch": 1800} {"train_loss": -12.347169876098633, "global_step": 302540, "epoch": 1800} {"train_loss": -12.066783905029297, "global_step": 302541, "epoch": 1800} {"train_loss": -12.597537994384766, "global_step": 302542, "epoch": 1800} {"train_loss": -11.952771186828613, "global_step": 302543, "epoch": 1800} {"train_loss": -12.490907669067383, "global_step": 302544, "epoch": 1800} {"train_loss": -11.786526679992676, "global_step": 302545, "epoch": 1800} {"train_loss": -11.865758895874023, "global_step": 302546, "epoch": 1800} {"train_loss": -12.164037704467773, "global_step": 302547, "epoch": 1800} {"train_loss": -11.858522415161133, "global_step": 302548, "epoch": 1800} {"train_loss": -11.815686225891113, "global_step": 302549, "epoch": 1800} {"train_loss": -11.541777610778809, "global_step": 302550, "epoch": 1800} {"train_loss": -12.018366813659668, "global_step": 302551, "epoch": 1800} {"train_loss": -11.811806678771973, "global_step": 302552, "epoch": 1800} {"train_loss": -11.972615242004395, "global_step": 302553, "epoch": 1800} {"train_loss": -11.923774719238281, "global_step": 302554, "epoch": 1800} {"train_loss": -11.450716018676758, "global_step": 302555, "epoch": 1800} {"train_loss": -11.639339447021484, "global_step": 302556, "epoch": 1800} {"train_loss": -11.740361213684082, "global_step": 302557, "epoch": 1800} {"train_loss": -11.221419334411621, "global_step": 302558, "epoch": 1800} {"train_loss": -11.92992115020752, "global_step": 302559, "epoch": 1800} {"train_loss": -11.789973258972168, "global_step": 302560, "epoch": 1800} {"train_loss": -11.46548080444336, "global_step": 302561, "epoch": 1800} {"train_loss": -11.999576568603516, "global_step": 302562, "epoch": 1800} {"train_loss": -11.367506980895996, "global_step": 302563, "epoch": 1800} {"train_loss": -11.402793884277344, "global_step": 302564, "epoch": 1800} {"train_loss": -11.485943794250488, "global_step": 302565, "epoch": 1800} {"train_loss": -12.077486038208008, "global_step": 302566, "epoch": 1800} {"train_loss": -11.92070384252639, "global_step": 302567, "epoch": 1800, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 0.9703854542075998, "train/sim_max_reward_2": 0.00017223234184533736, "train/sim_max_reward_3": 0.8604205683217678, "train/sim_max_reward_4": 0.40858781503611874, "train/sim_max_reward_5": 0.5855578185159271, "test/sim_max_reward_4400000": 0.9608455836019111, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 0.06123617791975391, "test/sim_max_reward_4400003": 0.9581594158393302, "test/sim_max_reward_4400004": 0.5736892397435087, "test/sim_max_reward_4400005": 0.03078422314434117, "test/sim_max_reward_4400006": 0.9605791664164343, "test/sim_max_reward_4400007": 0.532442236430727, "test/sim_max_reward_4400008": 0.6784291457687017, "test/sim_max_reward_4400009": 0.03180737828800997, "test/sim_max_reward_4400010": 0.9399281628814968, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 0.4038209523938719, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 0.6215260645571362, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9810593827490922, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00015914492010484432, "test/sim_max_reward_4400021": 0.9784658739845814, "test/sim_max_reward_4400022": 0.9972776338631503, "test/sim_max_reward_4400023": 0.15917628138282716, "test/sim_max_reward_4400024": 0.9926088681875971, "test/sim_max_reward_4400025": 0.5155949291053162, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.43326989353624284, "test/sim_max_reward_4400028": 0.9663617243889859, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9871036367531763, "test/sim_max_reward_4400031": 0.9888988756015872, "test/sim_max_reward_4400032": 0.06706444118643672, "test/sim_max_reward_4400033": 0.659820344535201, "test/sim_max_reward_4400034": 0.45330929846888907, "test/sim_max_reward_4400035": 0.28544898983581934, "test/sim_max_reward_4400036": 0.7397333664545208, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.29939873018771973, "test/sim_max_reward_4400039": 0.4116314669060675, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9712724987636331, "test/sim_max_reward_4400042": 0.03670929894426338, "test/sim_max_reward_4400043": 0.855550939261492, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.47275197409995867, "test/sim_max_reward_4400046": 0.3357145392238469, "test/sim_max_reward_4400047": 0.950572065965463, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.7250709156580237, "train/mean_score": 0.6375206480705432, "test/mean_score": 0.5603454572189844, "val_loss": 280312.0, "train_action_mse_error": 2.7217326164245605} {"train_loss": -11.121131896972656, "global_step": 302568, "epoch": 1801} {"train_loss": -10.534368515014648, "global_step": 302569, "epoch": 1801} {"train_loss": -11.483718872070312, "global_step": 302570, "epoch": 1801} {"train_loss": -10.752705574035645, "global_step": 302571, "epoch": 1801} {"train_loss": -10.44974136352539, "global_step": 302572, "epoch": 1801} {"train_loss": -11.563885688781738, "global_step": 302573, "epoch": 1801} {"train_loss": -10.604434967041016, "global_step": 302574, "epoch": 1801} {"train_loss": -10.8008451461792, "global_step": 302575, "epoch": 1801} {"train_loss": -11.42480754852295, "global_step": 302576, "epoch": 1801} {"train_loss": -11.294076919555664, "global_step": 302577, "epoch": 1801} {"train_loss": -10.759284973144531, "global_step": 302578, "epoch": 1801} {"train_loss": -11.45034122467041, "global_step": 302579, "epoch": 1801} {"train_loss": -10.395584106445312, "global_step": 302580, "epoch": 1801} {"train_loss": -11.82640552520752, "global_step": 302581, "epoch": 1801} {"train_loss": -11.670461654663086, "global_step": 302582, "epoch": 1801} {"train_loss": -11.334066390991211, "global_step": 302583, "epoch": 1801} {"train_loss": -12.076461791992188, "global_step": 302584, "epoch": 1801} {"train_loss": -10.954377174377441, "global_step": 302585, "epoch": 1801} {"train_loss": -11.620416641235352, "global_step": 302586, "epoch": 1801} {"train_loss": -11.608378410339355, "global_step": 302587, "epoch": 1801} {"train_loss": -10.892058372497559, "global_step": 302588, "epoch": 1801} {"train_loss": -11.82304859161377, "global_step": 302589, "epoch": 1801} {"train_loss": -10.933944702148438, "global_step": 302590, "epoch": 1801} {"train_loss": -11.897977828979492, "global_step": 302591, "epoch": 1801} {"train_loss": -11.45196533203125, "global_step": 302592, "epoch": 1801} {"train_loss": -11.435134887695312, "global_step": 302593, "epoch": 1801} {"train_loss": -11.578948974609375, "global_step": 302594, "epoch": 1801} {"train_loss": -11.380962371826172, "global_step": 302595, "epoch": 1801} {"train_loss": -11.429035186767578, "global_step": 302596, "epoch": 1801} {"train_loss": -12.12450122833252, "global_step": 302597, "epoch": 1801} {"train_loss": -11.538217544555664, "global_step": 302598, "epoch": 1801} {"train_loss": -12.158170700073242, "global_step": 302599, "epoch": 1801} {"train_loss": -11.559990882873535, "global_step": 302600, "epoch": 1801} {"train_loss": -11.7867431640625, "global_step": 302601, "epoch": 1801} {"train_loss": -11.693720817565918, "global_step": 302602, "epoch": 1801} {"train_loss": -11.621344566345215, "global_step": 302603, "epoch": 1801} {"train_loss": -11.97134780883789, "global_step": 302604, "epoch": 1801} {"train_loss": -11.222989082336426, "global_step": 302605, "epoch": 1801} {"train_loss": -11.780427932739258, "global_step": 302606, "epoch": 1801} {"train_loss": -11.742981910705566, "global_step": 302607, "epoch": 1801} {"train_loss": -11.437175750732422, "global_step": 302608, "epoch": 1801} {"train_loss": -11.692972183227539, "global_step": 302609, "epoch": 1801} {"train_loss": -11.559264183044434, "global_step": 302610, "epoch": 1801} {"train_loss": -11.986255645751953, "global_step": 302611, "epoch": 1801} {"train_loss": -11.559005737304688, "global_step": 302612, "epoch": 1801} {"train_loss": -11.590041160583496, "global_step": 302613, "epoch": 1801} {"train_loss": -11.820565223693848, "global_step": 302614, "epoch": 1801} {"train_loss": -11.771326065063477, "global_step": 302615, "epoch": 1801} {"train_loss": -12.067487716674805, "global_step": 302616, "epoch": 1801} {"train_loss": -11.384513854980469, "global_step": 302617, "epoch": 1801} {"train_loss": -11.941827774047852, "global_step": 302618, "epoch": 1801} {"train_loss": -11.754768371582031, "global_step": 302619, "epoch": 1801} {"train_loss": -11.898061752319336, "global_step": 302620, "epoch": 1801} {"train_loss": -11.670089721679688, "global_step": 302621, "epoch": 1801} {"train_loss": -10.957006454467773, "global_step": 302622, "epoch": 1801} {"train_loss": -11.853303909301758, "global_step": 302623, "epoch": 1801} {"train_loss": -11.844483375549316, "global_step": 302624, "epoch": 1801} {"train_loss": -11.83080005645752, "global_step": 302625, "epoch": 1801} {"train_loss": -11.902101516723633, "global_step": 302626, "epoch": 1801} {"train_loss": -11.769001007080078, "global_step": 302627, "epoch": 1801} {"train_loss": -11.92552375793457, "global_step": 302628, "epoch": 1801} {"train_loss": -11.766006469726562, "global_step": 302629, "epoch": 1801} {"train_loss": -12.040221214294434, "global_step": 302630, "epoch": 1801} {"train_loss": -11.981011390686035, "global_step": 302631, "epoch": 1801} {"train_loss": -11.516382217407227, "global_step": 302632, "epoch": 1801} {"train_loss": -12.064271926879883, "global_step": 302633, "epoch": 1801} {"train_loss": -11.780336380004883, "global_step": 302634, "epoch": 1801} {"train_loss": -12.06602954864502, "global_step": 302635, "epoch": 1801} {"train_loss": -11.699178695678711, "global_step": 302636, "epoch": 1801} {"train_loss": -11.926460266113281, "global_step": 302637, "epoch": 1801} {"train_loss": -11.745061874389648, "global_step": 302638, "epoch": 1801} {"train_loss": -12.164403915405273, "global_step": 302639, "epoch": 1801} {"train_loss": -11.931024551391602, "global_step": 302640, "epoch": 1801} {"train_loss": -12.058826446533203, "global_step": 302641, "epoch": 1801} {"train_loss": -12.075454711914062, "global_step": 302642, "epoch": 1801} {"train_loss": -12.05868148803711, "global_step": 302643, "epoch": 1801} {"train_loss": -12.35359001159668, "global_step": 302644, "epoch": 1801} {"train_loss": -12.245210647583008, "global_step": 302645, "epoch": 1801} {"train_loss": -12.20328426361084, "global_step": 302646, "epoch": 1801} {"train_loss": -12.265111923217773, "global_step": 302647, "epoch": 1801} {"train_loss": -12.245936393737793, "global_step": 302648, "epoch": 1801} {"train_loss": -12.292792320251465, "global_step": 302649, "epoch": 1801} {"train_loss": -12.22396469116211, "global_step": 302650, "epoch": 1801} {"train_loss": -12.363969802856445, "global_step": 302651, "epoch": 1801} {"train_loss": -12.204082489013672, "global_step": 302652, "epoch": 1801} {"train_loss": -12.320708274841309, "global_step": 302653, "epoch": 1801} {"train_loss": -12.349255561828613, "global_step": 302654, "epoch": 1801} {"train_loss": -12.190878868103027, "global_step": 302655, "epoch": 1801} {"train_loss": -12.067024230957031, "global_step": 302656, "epoch": 1801} {"train_loss": -12.21590805053711, "global_step": 302657, "epoch": 1801} {"train_loss": -11.997687339782715, "global_step": 302658, "epoch": 1801} {"train_loss": -12.277457237243652, "global_step": 302659, "epoch": 1801} {"train_loss": -12.353334426879883, "global_step": 302660, "epoch": 1801} {"train_loss": -12.296670913696289, "global_step": 302661, "epoch": 1801} {"train_loss": -12.38662338256836, "global_step": 302662, "epoch": 1801} {"train_loss": -12.273164749145508, "global_step": 302663, "epoch": 1801} {"train_loss": -12.302497863769531, "global_step": 302664, "epoch": 1801} {"train_loss": -12.280741691589355, "global_step": 302665, "epoch": 1801} {"train_loss": -12.174320220947266, "global_step": 302666, "epoch": 1801} {"train_loss": -11.841851234436035, "global_step": 302667, "epoch": 1801} {"train_loss": -11.997882843017578, "global_step": 302668, "epoch": 1801} {"train_loss": -11.685467720031738, "global_step": 302669, "epoch": 1801} {"train_loss": -11.427059173583984, "global_step": 302670, "epoch": 1801} {"train_loss": -11.252508163452148, "global_step": 302671, "epoch": 1801} {"train_loss": -11.489233016967773, "global_step": 302672, "epoch": 1801} {"train_loss": -11.886348724365234, "global_step": 302673, "epoch": 1801} {"train_loss": -11.389310836791992, "global_step": 302674, "epoch": 1801} {"train_loss": -11.893686294555664, "global_step": 302675, "epoch": 1801} {"train_loss": -12.000909805297852, "global_step": 302676, "epoch": 1801} {"train_loss": -11.450706481933594, "global_step": 302677, "epoch": 1801} {"train_loss": -11.573530197143555, "global_step": 302678, "epoch": 1801} {"train_loss": -11.885467529296875, "global_step": 302679, "epoch": 1801} {"train_loss": -12.147274017333984, "global_step": 302680, "epoch": 1801} {"train_loss": -11.283617973327637, "global_step": 302681, "epoch": 1801} {"train_loss": -12.141685485839844, "global_step": 302682, "epoch": 1801} {"train_loss": -11.153616905212402, "global_step": 302683, "epoch": 1801} {"train_loss": -12.10909652709961, "global_step": 302684, "epoch": 1801} {"train_loss": -11.735980987548828, "global_step": 302685, "epoch": 1801} {"train_loss": -11.655132293701172, "global_step": 302686, "epoch": 1801} {"train_loss": -11.759744644165039, "global_step": 302687, "epoch": 1801} {"train_loss": -11.093412399291992, "global_step": 302688, "epoch": 1801} {"train_loss": -11.862144470214844, "global_step": 302689, "epoch": 1801} {"train_loss": -11.240307807922363, "global_step": 302690, "epoch": 1801} {"train_loss": -11.5794677734375, "global_step": 302691, "epoch": 1801} {"train_loss": -11.613431930541992, "global_step": 302692, "epoch": 1801} {"train_loss": -11.497167587280273, "global_step": 302693, "epoch": 1801} {"train_loss": -11.35477066040039, "global_step": 302694, "epoch": 1801} {"train_loss": -11.389033317565918, "global_step": 302695, "epoch": 1801} {"train_loss": -9.998607635498047, "global_step": 302696, "epoch": 1801} {"train_loss": -11.571966171264648, "global_step": 302697, "epoch": 1801} {"train_loss": -11.076069831848145, "global_step": 302698, "epoch": 1801} {"train_loss": -11.584957122802734, "global_step": 302699, "epoch": 1801} {"train_loss": -11.433855056762695, "global_step": 302700, "epoch": 1801} {"train_loss": -10.770920753479004, "global_step": 302701, "epoch": 1801} {"train_loss": -11.299636840820312, "global_step": 302702, "epoch": 1801} {"train_loss": -11.26801872253418, "global_step": 302703, "epoch": 1801} {"train_loss": -11.373065948486328, "global_step": 302704, "epoch": 1801} {"train_loss": -10.898733139038086, "global_step": 302705, "epoch": 1801} {"train_loss": -12.089300155639648, "global_step": 302706, "epoch": 1801} {"train_loss": -11.1751708984375, "global_step": 302707, "epoch": 1801} {"train_loss": -11.381946563720703, "global_step": 302708, "epoch": 1801} {"train_loss": -11.686232566833496, "global_step": 302709, "epoch": 1801} {"train_loss": -11.909185409545898, "global_step": 302710, "epoch": 1801} {"train_loss": -10.887741088867188, "global_step": 302711, "epoch": 1801} {"train_loss": -11.872173309326172, "global_step": 302712, "epoch": 1801} {"train_loss": -10.86142635345459, "global_step": 302713, "epoch": 1801} {"train_loss": -11.673249244689941, "global_step": 302714, "epoch": 1801} {"train_loss": -11.602222442626953, "global_step": 302715, "epoch": 1801} {"train_loss": -11.479514122009277, "global_step": 302716, "epoch": 1801} {"train_loss": -12.016355514526367, "global_step": 302717, "epoch": 1801} {"train_loss": -11.491927146911621, "global_step": 302718, "epoch": 1801} {"train_loss": -12.07270336151123, "global_step": 302719, "epoch": 1801} {"train_loss": -11.379251480102539, "global_step": 302720, "epoch": 1801} {"train_loss": -11.575053215026855, "global_step": 302721, "epoch": 1801} {"train_loss": -11.95702838897705, "global_step": 302722, "epoch": 1801} {"train_loss": -11.704708099365234, "global_step": 302723, "epoch": 1801} {"train_loss": -11.848695755004883, "global_step": 302724, "epoch": 1801} {"train_loss": -12.131230354309082, "global_step": 302725, "epoch": 1801} {"train_loss": -11.913076400756836, "global_step": 302726, "epoch": 1801} {"train_loss": -11.961414337158203, "global_step": 302727, "epoch": 1801} {"train_loss": -11.931161880493164, "global_step": 302728, "epoch": 1801} {"train_loss": -11.82879638671875, "global_step": 302729, "epoch": 1801} {"train_loss": -11.904451370239258, "global_step": 302730, "epoch": 1801} {"train_loss": -12.206283569335938, "global_step": 302731, "epoch": 1801} {"train_loss": -12.055395126342773, "global_step": 302732, "epoch": 1801} {"train_loss": -12.326583862304688, "global_step": 302733, "epoch": 1801} {"train_loss": -12.249707221984863, "global_step": 302734, "epoch": 1801} {"train_loss": -11.695951643444243, "global_step": 302735, "epoch": 1801, "val_loss": 282395.3125} {"train_loss": -12.154353141784668, "global_step": 302736, "epoch": 1802} {"train_loss": -12.131329536437988, "global_step": 302737, "epoch": 1802} {"train_loss": -12.259950637817383, "global_step": 302738, "epoch": 1802} {"train_loss": -12.362871170043945, "global_step": 302739, "epoch": 1802} {"train_loss": -12.329813957214355, "global_step": 302740, "epoch": 1802} {"train_loss": -12.264690399169922, "global_step": 302741, "epoch": 1802} {"train_loss": -12.364171981811523, "global_step": 302742, "epoch": 1802} {"train_loss": -12.207971572875977, "global_step": 302743, "epoch": 1802} {"train_loss": -12.294677734375, "global_step": 302744, "epoch": 1802} {"train_loss": -12.160909652709961, "global_step": 302745, "epoch": 1802} {"train_loss": -12.132932662963867, "global_step": 302746, "epoch": 1802} {"train_loss": -12.188616752624512, "global_step": 302747, "epoch": 1802} {"train_loss": -12.256024360656738, "global_step": 302748, "epoch": 1802} {"train_loss": -12.304985046386719, "global_step": 302749, "epoch": 1802} {"train_loss": -12.219270706176758, "global_step": 302750, "epoch": 1802} {"train_loss": -12.539566993713379, "global_step": 302751, "epoch": 1802} {"train_loss": -12.441039085388184, "global_step": 302752, "epoch": 1802} {"train_loss": -12.187355041503906, "global_step": 302753, "epoch": 1802} {"train_loss": -12.449499130249023, "global_step": 302754, "epoch": 1802} {"train_loss": -12.475871086120605, "global_step": 302755, "epoch": 1802} {"train_loss": -12.555197715759277, "global_step": 302756, "epoch": 1802} {"train_loss": -12.298974990844727, "global_step": 302757, "epoch": 1802} {"train_loss": -12.268536567687988, "global_step": 302758, "epoch": 1802} {"train_loss": -12.400531768798828, "global_step": 302759, "epoch": 1802} {"train_loss": -12.542165756225586, "global_step": 302760, "epoch": 1802} {"train_loss": -12.26707649230957, "global_step": 302761, "epoch": 1802} {"train_loss": -12.335060119628906, "global_step": 302762, "epoch": 1802} {"train_loss": -12.292987823486328, "global_step": 302763, "epoch": 1802} {"train_loss": -12.463109970092773, "global_step": 302764, "epoch": 1802} {"train_loss": -12.544493675231934, "global_step": 302765, "epoch": 1802} {"train_loss": -12.229043960571289, "global_step": 302766, "epoch": 1802} {"train_loss": -12.656682014465332, "global_step": 302767, "epoch": 1802} {"train_loss": -12.482446670532227, "global_step": 302768, "epoch": 1802} {"train_loss": -12.55052661895752, "global_step": 302769, "epoch": 1802} {"train_loss": -12.476967811584473, "global_step": 302770, "epoch": 1802} {"train_loss": -12.400070190429688, "global_step": 302771, "epoch": 1802} {"train_loss": -12.497539520263672, "global_step": 302772, "epoch": 1802} {"train_loss": -12.355245590209961, "global_step": 302773, "epoch": 1802} {"train_loss": -12.431400299072266, "global_step": 302774, "epoch": 1802} {"train_loss": -12.422861099243164, "global_step": 302775, "epoch": 1802} {"train_loss": -12.34243392944336, "global_step": 302776, "epoch": 1802} {"train_loss": -12.199902534484863, "global_step": 302777, "epoch": 1802} {"train_loss": -12.022420883178711, "global_step": 302778, "epoch": 1802} {"train_loss": -12.461498260498047, "global_step": 302779, "epoch": 1802} {"train_loss": -12.048872947692871, "global_step": 302780, "epoch": 1802} {"train_loss": -12.410411834716797, "global_step": 302781, "epoch": 1802} {"train_loss": -11.741222381591797, "global_step": 302782, "epoch": 1802} {"train_loss": -11.99249267578125, "global_step": 302783, "epoch": 1802} {"train_loss": -12.11739444732666, "global_step": 302784, "epoch": 1802} {"train_loss": -12.007545471191406, "global_step": 302785, "epoch": 1802} {"train_loss": -11.810637474060059, "global_step": 302786, "epoch": 1802} {"train_loss": -11.847978591918945, "global_step": 302787, "epoch": 1802} {"train_loss": -10.945137023925781, "global_step": 302788, "epoch": 1802} {"train_loss": -11.18234634399414, "global_step": 302789, "epoch": 1802} {"train_loss": -11.590275764465332, "global_step": 302790, "epoch": 1802} {"train_loss": -9.394664764404297, "global_step": 302791, "epoch": 1802} {"train_loss": -11.272034645080566, "global_step": 302792, "epoch": 1802} {"train_loss": -10.325305938720703, "global_step": 302793, "epoch": 1802} {"train_loss": -9.975452423095703, "global_step": 302794, "epoch": 1802} {"train_loss": -11.98408031463623, "global_step": 302795, "epoch": 1802} {"train_loss": -10.439719200134277, "global_step": 302796, "epoch": 1802} {"train_loss": -11.747678756713867, "global_step": 302797, "epoch": 1802} {"train_loss": -11.125818252563477, "global_step": 302798, "epoch": 1802} {"train_loss": -10.808571815490723, "global_step": 302799, "epoch": 1802} {"train_loss": -11.130547523498535, "global_step": 302800, "epoch": 1802} {"train_loss": -11.363055229187012, "global_step": 302801, "epoch": 1802} {"train_loss": -11.212743759155273, "global_step": 302802, "epoch": 1802} {"train_loss": -11.702333450317383, "global_step": 302803, "epoch": 1802} {"train_loss": -10.497526168823242, "global_step": 302804, "epoch": 1802} {"train_loss": -11.62330150604248, "global_step": 302805, "epoch": 1802} {"train_loss": -11.617513656616211, "global_step": 302806, "epoch": 1802} {"train_loss": -10.631635665893555, "global_step": 302807, "epoch": 1802} {"train_loss": -10.234172821044922, "global_step": 302808, "epoch": 1802} {"train_loss": -10.031213760375977, "global_step": 302809, "epoch": 1802} {"train_loss": -11.276309967041016, "global_step": 302810, "epoch": 1802} {"train_loss": -10.281627655029297, "global_step": 302811, "epoch": 1802} {"train_loss": -11.836830139160156, "global_step": 302812, "epoch": 1802} {"train_loss": -10.80521011352539, "global_step": 302813, "epoch": 1802} {"train_loss": -11.049257278442383, "global_step": 302814, "epoch": 1802} {"train_loss": -11.621231079101562, "global_step": 302815, "epoch": 1802} {"train_loss": -11.073038101196289, "global_step": 302816, "epoch": 1802} {"train_loss": -11.660879135131836, "global_step": 302817, "epoch": 1802} {"train_loss": -10.638845443725586, "global_step": 302818, "epoch": 1802} {"train_loss": -11.772380828857422, "global_step": 302819, "epoch": 1802} {"train_loss": -11.043115615844727, "global_step": 302820, "epoch": 1802} {"train_loss": -11.712284088134766, "global_step": 302821, "epoch": 1802} {"train_loss": -10.959842681884766, "global_step": 302822, "epoch": 1802} {"train_loss": -11.861551284790039, "global_step": 302823, "epoch": 1802} {"train_loss": -11.606502532958984, "global_step": 302824, "epoch": 1802} {"train_loss": -11.500602722167969, "global_step": 302825, "epoch": 1802} {"train_loss": -11.809090614318848, "global_step": 302826, "epoch": 1802} {"train_loss": -11.320905685424805, "global_step": 302827, "epoch": 1802} {"train_loss": -11.53223991394043, "global_step": 302828, "epoch": 1802} {"train_loss": -11.872904777526855, "global_step": 302829, "epoch": 1802} {"train_loss": -11.764854431152344, "global_step": 302830, "epoch": 1802} {"train_loss": -11.204839706420898, "global_step": 302831, "epoch": 1802} {"train_loss": -11.879526138305664, "global_step": 302832, "epoch": 1802} {"train_loss": -11.432756423950195, "global_step": 302833, "epoch": 1802} {"train_loss": -12.100701332092285, "global_step": 302834, "epoch": 1802} {"train_loss": -11.527039527893066, "global_step": 302835, "epoch": 1802} {"train_loss": -11.822961807250977, "global_step": 302836, "epoch": 1802} {"train_loss": -11.837047576904297, "global_step": 302837, "epoch": 1802} {"train_loss": -11.723580360412598, "global_step": 302838, "epoch": 1802} {"train_loss": -11.782184600830078, "global_step": 302839, "epoch": 1802} {"train_loss": -11.81921100616455, "global_step": 302840, "epoch": 1802} {"train_loss": -11.854846954345703, "global_step": 302841, "epoch": 1802} {"train_loss": -11.453268051147461, "global_step": 302842, "epoch": 1802} {"train_loss": -12.131438255310059, "global_step": 302843, "epoch": 1802} {"train_loss": -11.000160217285156, "global_step": 302844, "epoch": 1802} {"train_loss": -12.112046241760254, "global_step": 302845, "epoch": 1802} {"train_loss": -11.537689208984375, "global_step": 302846, "epoch": 1802} {"train_loss": -11.826608657836914, "global_step": 302847, "epoch": 1802} {"train_loss": -11.671192169189453, "global_step": 302848, "epoch": 1802} {"train_loss": -11.603940963745117, "global_step": 302849, "epoch": 1802} {"train_loss": -10.889759063720703, "global_step": 302850, "epoch": 1802} {"train_loss": -12.082218170166016, "global_step": 302851, "epoch": 1802} {"train_loss": -11.568376541137695, "global_step": 302852, "epoch": 1802} {"train_loss": -11.959553718566895, "global_step": 302853, "epoch": 1802} {"train_loss": -11.741250038146973, "global_step": 302854, "epoch": 1802} {"train_loss": -11.756570816040039, "global_step": 302855, "epoch": 1802} {"train_loss": -12.077047348022461, "global_step": 302856, "epoch": 1802} {"train_loss": -11.77601432800293, "global_step": 302857, "epoch": 1802} {"train_loss": -11.809553146362305, "global_step": 302858, "epoch": 1802} {"train_loss": -11.728005409240723, "global_step": 302859, "epoch": 1802} {"train_loss": -11.601780891418457, "global_step": 302860, "epoch": 1802} {"train_loss": -11.996191024780273, "global_step": 302861, "epoch": 1802} {"train_loss": -11.054498672485352, "global_step": 302862, "epoch": 1802} {"train_loss": -12.242172241210938, "global_step": 302863, "epoch": 1802} {"train_loss": -11.324946403503418, "global_step": 302864, "epoch": 1802} {"train_loss": -11.59981918334961, "global_step": 302865, "epoch": 1802} {"train_loss": -11.601310729980469, "global_step": 302866, "epoch": 1802} {"train_loss": -11.845446586608887, "global_step": 302867, "epoch": 1802} {"train_loss": -11.757034301757812, "global_step": 302868, "epoch": 1802} {"train_loss": -12.109830856323242, "global_step": 302869, "epoch": 1802} {"train_loss": -11.623281478881836, "global_step": 302870, "epoch": 1802} {"train_loss": -12.264455795288086, "global_step": 302871, "epoch": 1802} {"train_loss": -11.716476440429688, "global_step": 302872, "epoch": 1802} {"train_loss": -12.373228073120117, "global_step": 302873, "epoch": 1802} {"train_loss": -11.898025512695312, "global_step": 302874, "epoch": 1802} {"train_loss": -11.948925018310547, "global_step": 302875, "epoch": 1802} {"train_loss": -11.784113883972168, "global_step": 302876, "epoch": 1802} {"train_loss": -11.754932403564453, "global_step": 302877, "epoch": 1802} {"train_loss": -11.934657096862793, "global_step": 302878, "epoch": 1802} {"train_loss": -11.898311614990234, "global_step": 302879, "epoch": 1802} {"train_loss": -12.00279712677002, "global_step": 302880, "epoch": 1802} {"train_loss": -11.94459342956543, "global_step": 302881, "epoch": 1802} {"train_loss": -11.873130798339844, "global_step": 302882, "epoch": 1802} {"train_loss": -12.150131225585938, "global_step": 302883, "epoch": 1802} {"train_loss": -12.068109512329102, "global_step": 302884, "epoch": 1802} {"train_loss": -11.911407470703125, "global_step": 302885, "epoch": 1802} {"train_loss": -12.10219955444336, "global_step": 302886, "epoch": 1802} {"train_loss": -11.792501449584961, "global_step": 302887, "epoch": 1802} {"train_loss": -12.229598045349121, "global_step": 302888, "epoch": 1802} {"train_loss": -12.288331985473633, "global_step": 302889, "epoch": 1802} {"train_loss": -12.08433723449707, "global_step": 302890, "epoch": 1802} {"train_loss": -12.054686546325684, "global_step": 302891, "epoch": 1802} {"train_loss": -11.955878257751465, "global_step": 302892, "epoch": 1802} {"train_loss": -12.260709762573242, "global_step": 302893, "epoch": 1802} {"train_loss": -11.927525520324707, "global_step": 302894, "epoch": 1802} {"train_loss": -12.287590026855469, "global_step": 302895, "epoch": 1802} {"train_loss": -11.96075439453125, "global_step": 302896, "epoch": 1802} {"train_loss": -12.194327354431152, "global_step": 302897, "epoch": 1802} {"train_loss": -12.306144714355469, "global_step": 302898, "epoch": 1802} {"train_loss": -12.37669849395752, "global_step": 302899, "epoch": 1802} {"train_loss": -12.104363441467285, "global_step": 302900, "epoch": 1802} {"train_loss": -12.263311386108398, "global_step": 302901, "epoch": 1802} {"train_loss": -12.386251449584961, "global_step": 302902, "epoch": 1802} {"train_loss": -11.819013396898905, "global_step": 302903, "epoch": 1802, "val_loss": 283682.28125} {"train_loss": -12.311910629272461, "global_step": 302904, "epoch": 1803} {"train_loss": -12.108904838562012, "global_step": 302905, "epoch": 1803} {"train_loss": -12.153881072998047, "global_step": 302906, "epoch": 1803} {"train_loss": -12.283750534057617, "global_step": 302907, "epoch": 1803} {"train_loss": -12.147624969482422, "global_step": 302908, "epoch": 1803} {"train_loss": -12.39462661743164, "global_step": 302909, "epoch": 1803} {"train_loss": -12.253265380859375, "global_step": 302910, "epoch": 1803} {"train_loss": -12.528007507324219, "global_step": 302911, "epoch": 1803} {"train_loss": -12.24752426147461, "global_step": 302912, "epoch": 1803} {"train_loss": -12.202290534973145, "global_step": 302913, "epoch": 1803} {"train_loss": -12.489291191101074, "global_step": 302914, "epoch": 1803} {"train_loss": -12.177531242370605, "global_step": 302915, "epoch": 1803} {"train_loss": -12.439321517944336, "global_step": 302916, "epoch": 1803} {"train_loss": -12.312216758728027, "global_step": 302917, "epoch": 1803} {"train_loss": -12.288372039794922, "global_step": 302918, "epoch": 1803} {"train_loss": -12.35360050201416, "global_step": 302919, "epoch": 1803} {"train_loss": -12.44843864440918, "global_step": 302920, "epoch": 1803} {"train_loss": -12.30075740814209, "global_step": 302921, "epoch": 1803} {"train_loss": -12.475130081176758, "global_step": 302922, "epoch": 1803} {"train_loss": -12.410242080688477, "global_step": 302923, "epoch": 1803} {"train_loss": -12.354223251342773, "global_step": 302924, "epoch": 1803} {"train_loss": -12.35708999633789, "global_step": 302925, "epoch": 1803} {"train_loss": -12.330228805541992, "global_step": 302926, "epoch": 1803} {"train_loss": -12.213420867919922, "global_step": 302927, "epoch": 1803} {"train_loss": -12.422368049621582, "global_step": 302928, "epoch": 1803} {"train_loss": -12.334674835205078, "global_step": 302929, "epoch": 1803} {"train_loss": -12.474908828735352, "global_step": 302930, "epoch": 1803} {"train_loss": -12.2446928024292, "global_step": 302931, "epoch": 1803} {"train_loss": -12.204648971557617, "global_step": 302932, "epoch": 1803} {"train_loss": -12.111764907836914, "global_step": 302933, "epoch": 1803} {"train_loss": -12.101255416870117, "global_step": 302934, "epoch": 1803} {"train_loss": -12.222419738769531, "global_step": 302935, "epoch": 1803} {"train_loss": -12.069758415222168, "global_step": 302936, "epoch": 1803} {"train_loss": -12.33407974243164, "global_step": 302937, "epoch": 1803} {"train_loss": -12.396279335021973, "global_step": 302938, "epoch": 1803} {"train_loss": -11.773611068725586, "global_step": 302939, "epoch": 1803} {"train_loss": -11.783597946166992, "global_step": 302940, "epoch": 1803} {"train_loss": -11.97372817993164, "global_step": 302941, "epoch": 1803} {"train_loss": -11.848442077636719, "global_step": 302942, "epoch": 1803} {"train_loss": -12.222017288208008, "global_step": 302943, "epoch": 1803} {"train_loss": -11.854471206665039, "global_step": 302944, "epoch": 1803} {"train_loss": -12.256171226501465, "global_step": 302945, "epoch": 1803} {"train_loss": -11.554740905761719, "global_step": 302946, "epoch": 1803} {"train_loss": -12.215659141540527, "global_step": 302947, "epoch": 1803} {"train_loss": -11.713377952575684, "global_step": 302948, "epoch": 1803} {"train_loss": -11.933747291564941, "global_step": 302949, "epoch": 1803} {"train_loss": -12.053853034973145, "global_step": 302950, "epoch": 1803} {"train_loss": -11.754318237304688, "global_step": 302951, "epoch": 1803} {"train_loss": -12.215906143188477, "global_step": 302952, "epoch": 1803} {"train_loss": -11.674298286437988, "global_step": 302953, "epoch": 1803} {"train_loss": -12.117231369018555, "global_step": 302954, "epoch": 1803} {"train_loss": -11.886042594909668, "global_step": 302955, "epoch": 1803} {"train_loss": -12.093242645263672, "global_step": 302956, "epoch": 1803} {"train_loss": -12.049570083618164, "global_step": 302957, "epoch": 1803} {"train_loss": -12.242444038391113, "global_step": 302958, "epoch": 1803} {"train_loss": -11.572652816772461, "global_step": 302959, "epoch": 1803} {"train_loss": -11.968077659606934, "global_step": 302960, "epoch": 1803} {"train_loss": -11.567584991455078, "global_step": 302961, "epoch": 1803} {"train_loss": -12.203112602233887, "global_step": 302962, "epoch": 1803} {"train_loss": -11.299245834350586, "global_step": 302963, "epoch": 1803} {"train_loss": -11.78756332397461, "global_step": 302964, "epoch": 1803} {"train_loss": -11.867965698242188, "global_step": 302965, "epoch": 1803} {"train_loss": -11.582076072692871, "global_step": 302966, "epoch": 1803} {"train_loss": -11.05899429321289, "global_step": 302967, "epoch": 1803} {"train_loss": -11.384941101074219, "global_step": 302968, "epoch": 1803} {"train_loss": -10.540838241577148, "global_step": 302969, "epoch": 1803} {"train_loss": -11.226072311401367, "global_step": 302970, "epoch": 1803} {"train_loss": -10.753564834594727, "global_step": 302971, "epoch": 1803} {"train_loss": -11.774984359741211, "global_step": 302972, "epoch": 1803} {"train_loss": -11.01360034942627, "global_step": 302973, "epoch": 1803} {"train_loss": -11.326915740966797, "global_step": 302974, "epoch": 1803} {"train_loss": -11.542367935180664, "global_step": 302975, "epoch": 1803} {"train_loss": -10.955936431884766, "global_step": 302976, "epoch": 1803} {"train_loss": -11.765497207641602, "global_step": 302977, "epoch": 1803} {"train_loss": -10.254171371459961, "global_step": 302978, "epoch": 1803} {"train_loss": -11.082841873168945, "global_step": 302979, "epoch": 1803} {"train_loss": -10.732112884521484, "global_step": 302980, "epoch": 1803} {"train_loss": -11.504106521606445, "global_step": 302981, "epoch": 1803} {"train_loss": -11.466413497924805, "global_step": 302982, "epoch": 1803} {"train_loss": -11.648458480834961, "global_step": 302983, "epoch": 1803} {"train_loss": -11.731475830078125, "global_step": 302984, "epoch": 1803} {"train_loss": -11.680051803588867, "global_step": 302985, "epoch": 1803} {"train_loss": -11.626428604125977, "global_step": 302986, "epoch": 1803} {"train_loss": -12.06196117401123, "global_step": 302987, "epoch": 1803} {"train_loss": -11.732620239257812, "global_step": 302988, "epoch": 1803} {"train_loss": -11.984304428100586, "global_step": 302989, "epoch": 1803} {"train_loss": -11.608587265014648, "global_step": 302990, "epoch": 1803} {"train_loss": -12.096599578857422, "global_step": 302991, "epoch": 1803} {"train_loss": -11.78200912475586, "global_step": 302992, "epoch": 1803} {"train_loss": -12.072610855102539, "global_step": 302993, "epoch": 1803} {"train_loss": -12.133359909057617, "global_step": 302994, "epoch": 1803} {"train_loss": -11.606236457824707, "global_step": 302995, "epoch": 1803} {"train_loss": -11.95388412475586, "global_step": 302996, "epoch": 1803} {"train_loss": -11.57811164855957, "global_step": 302997, "epoch": 1803} {"train_loss": -11.602741241455078, "global_step": 302998, "epoch": 1803} {"train_loss": -12.123218536376953, "global_step": 302999, "epoch": 1803} {"train_loss": -11.346590042114258, "global_step": 303000, "epoch": 1803} {"train_loss": -11.6777982711792, "global_step": 303001, "epoch": 1803} {"train_loss": -11.827560424804688, "global_step": 303002, "epoch": 1803} {"train_loss": -11.452594757080078, "global_step": 303003, "epoch": 1803} {"train_loss": -10.563995361328125, "global_step": 303004, "epoch": 1803} {"train_loss": -12.324274063110352, "global_step": 303005, "epoch": 1803} {"train_loss": -11.560916900634766, "global_step": 303006, "epoch": 1803} {"train_loss": -11.914464950561523, "global_step": 303007, "epoch": 1803} {"train_loss": -11.011968612670898, "global_step": 303008, "epoch": 1803} {"train_loss": -11.772562980651855, "global_step": 303009, "epoch": 1803} {"train_loss": -11.76785659790039, "global_step": 303010, "epoch": 1803} {"train_loss": -11.625760078430176, "global_step": 303011, "epoch": 1803} {"train_loss": -11.926112174987793, "global_step": 303012, "epoch": 1803} {"train_loss": -12.096834182739258, "global_step": 303013, "epoch": 1803} {"train_loss": -11.472850799560547, "global_step": 303014, "epoch": 1803} {"train_loss": -11.900693893432617, "global_step": 303015, "epoch": 1803} {"train_loss": -11.87330436706543, "global_step": 303016, "epoch": 1803} {"train_loss": -11.725713729858398, "global_step": 303017, "epoch": 1803} {"train_loss": -12.206632614135742, "global_step": 303018, "epoch": 1803} {"train_loss": -11.691417694091797, "global_step": 303019, "epoch": 1803} {"train_loss": -12.104372024536133, "global_step": 303020, "epoch": 1803} {"train_loss": -11.840507507324219, "global_step": 303021, "epoch": 1803} {"train_loss": -12.022209167480469, "global_step": 303022, "epoch": 1803} {"train_loss": -11.939902305603027, "global_step": 303023, "epoch": 1803} {"train_loss": -11.895100593566895, "global_step": 303024, "epoch": 1803} {"train_loss": -12.161778450012207, "global_step": 303025, "epoch": 1803} {"train_loss": -11.972633361816406, "global_step": 303026, "epoch": 1803} {"train_loss": -12.054183959960938, "global_step": 303027, "epoch": 1803} {"train_loss": -12.232248306274414, "global_step": 303028, "epoch": 1803} {"train_loss": -11.916542053222656, "global_step": 303029, "epoch": 1803} {"train_loss": -11.88055419921875, "global_step": 303030, "epoch": 1803} {"train_loss": -12.351757049560547, "global_step": 303031, "epoch": 1803} {"train_loss": -11.746546745300293, "global_step": 303032, "epoch": 1803} {"train_loss": -12.016523361206055, "global_step": 303033, "epoch": 1803} {"train_loss": -11.898509979248047, "global_step": 303034, "epoch": 1803} {"train_loss": -12.162078857421875, "global_step": 303035, "epoch": 1803} {"train_loss": -11.69730281829834, "global_step": 303036, "epoch": 1803} {"train_loss": -12.181201934814453, "global_step": 303037, "epoch": 1803} {"train_loss": -11.998919486999512, "global_step": 303038, "epoch": 1803} {"train_loss": -12.153775215148926, "global_step": 303039, "epoch": 1803} {"train_loss": -12.059700012207031, "global_step": 303040, "epoch": 1803} {"train_loss": -12.030210494995117, "global_step": 303041, "epoch": 1803} {"train_loss": -11.794012069702148, "global_step": 303042, "epoch": 1803} {"train_loss": -12.117715835571289, "global_step": 303043, "epoch": 1803} {"train_loss": -11.971578598022461, "global_step": 303044, "epoch": 1803} {"train_loss": -12.04987907409668, "global_step": 303045, "epoch": 1803} {"train_loss": -11.861669540405273, "global_step": 303046, "epoch": 1803} {"train_loss": -12.010951042175293, "global_step": 303047, "epoch": 1803} {"train_loss": -12.271827697753906, "global_step": 303048, "epoch": 1803} {"train_loss": -11.866766929626465, "global_step": 303049, "epoch": 1803} {"train_loss": -12.171000480651855, "global_step": 303050, "epoch": 1803} {"train_loss": -12.07931137084961, "global_step": 303051, "epoch": 1803} {"train_loss": -11.419363975524902, "global_step": 303052, "epoch": 1803} {"train_loss": -12.023716926574707, "global_step": 303053, "epoch": 1803} {"train_loss": -11.96815299987793, "global_step": 303054, "epoch": 1803} {"train_loss": -11.737297058105469, "global_step": 303055, "epoch": 1803} {"train_loss": -12.161813735961914, "global_step": 303056, "epoch": 1803} {"train_loss": -12.219772338867188, "global_step": 303057, "epoch": 1803} {"train_loss": -11.782444953918457, "global_step": 303058, "epoch": 1803} {"train_loss": -12.176025390625, "global_step": 303059, "epoch": 1803} {"train_loss": -11.836954116821289, "global_step": 303060, "epoch": 1803} {"train_loss": -12.404489517211914, "global_step": 303061, "epoch": 1803} {"train_loss": -12.024347305297852, "global_step": 303062, "epoch": 1803} {"train_loss": -12.110601425170898, "global_step": 303063, "epoch": 1803} {"train_loss": -12.385677337646484, "global_step": 303064, "epoch": 1803} {"train_loss": -12.164241790771484, "global_step": 303065, "epoch": 1803} {"train_loss": -12.323575973510742, "global_step": 303066, "epoch": 1803} {"train_loss": -12.237765312194824, "global_step": 303067, "epoch": 1803} {"train_loss": -12.143739700317383, "global_step": 303068, "epoch": 1803} {"train_loss": -12.23084545135498, "global_step": 303069, "epoch": 1803} {"train_loss": -12.526823043823242, "global_step": 303070, "epoch": 1803} {"train_loss": -11.92603550070808, "global_step": 303071, "epoch": 1803, "val_loss": 282334.46875} {"train_loss": -11.938673973083496, "global_step": 303072, "epoch": 1804} {"train_loss": -12.0261869430542, "global_step": 303073, "epoch": 1804} {"train_loss": -12.137453079223633, "global_step": 303074, "epoch": 1804} {"train_loss": -11.963813781738281, "global_step": 303075, "epoch": 1804} {"train_loss": -11.907732009887695, "global_step": 303076, "epoch": 1804} {"train_loss": -12.122934341430664, "global_step": 303077, "epoch": 1804} {"train_loss": -12.07999038696289, "global_step": 303078, "epoch": 1804} {"train_loss": -11.955526351928711, "global_step": 303079, "epoch": 1804} {"train_loss": -12.199809074401855, "global_step": 303080, "epoch": 1804} {"train_loss": -11.678211212158203, "global_step": 303081, "epoch": 1804} {"train_loss": -12.097192764282227, "global_step": 303082, "epoch": 1804} {"train_loss": -11.839773178100586, "global_step": 303083, "epoch": 1804} {"train_loss": -12.153594970703125, "global_step": 303084, "epoch": 1804} {"train_loss": -11.879304885864258, "global_step": 303085, "epoch": 1804} {"train_loss": -12.21613597869873, "global_step": 303086, "epoch": 1804} {"train_loss": -12.384249687194824, "global_step": 303087, "epoch": 1804} {"train_loss": -12.110095977783203, "global_step": 303088, "epoch": 1804} {"train_loss": -12.43728256225586, "global_step": 303089, "epoch": 1804} {"train_loss": -12.37700366973877, "global_step": 303090, "epoch": 1804} {"train_loss": -12.422103881835938, "global_step": 303091, "epoch": 1804} {"train_loss": -12.211039543151855, "global_step": 303092, "epoch": 1804} {"train_loss": -12.217588424682617, "global_step": 303093, "epoch": 1804} {"train_loss": -12.005197525024414, "global_step": 303094, "epoch": 1804} {"train_loss": -12.401432037353516, "global_step": 303095, "epoch": 1804} {"train_loss": -12.245129585266113, "global_step": 303096, "epoch": 1804} {"train_loss": -12.327241897583008, "global_step": 303097, "epoch": 1804} {"train_loss": -12.021430969238281, "global_step": 303098, "epoch": 1804} {"train_loss": -12.24627685546875, "global_step": 303099, "epoch": 1804} {"train_loss": -12.11503791809082, "global_step": 303100, "epoch": 1804} {"train_loss": -12.000844955444336, "global_step": 303101, "epoch": 1804} {"train_loss": -11.74664306640625, "global_step": 303102, "epoch": 1804} {"train_loss": -12.507847785949707, "global_step": 303103, "epoch": 1804} {"train_loss": -12.458902359008789, "global_step": 303104, "epoch": 1804} {"train_loss": -12.008454322814941, "global_step": 303105, "epoch": 1804} {"train_loss": -11.958436965942383, "global_step": 303106, "epoch": 1804} {"train_loss": -11.968951225280762, "global_step": 303107, "epoch": 1804} {"train_loss": -12.173839569091797, "global_step": 303108, "epoch": 1804} {"train_loss": -12.043584823608398, "global_step": 303109, "epoch": 1804} {"train_loss": -11.978643417358398, "global_step": 303110, "epoch": 1804} {"train_loss": -12.288406372070312, "global_step": 303111, "epoch": 1804} {"train_loss": -12.64163875579834, "global_step": 303112, "epoch": 1804} {"train_loss": -12.289422988891602, "global_step": 303113, "epoch": 1804} {"train_loss": -12.071532249450684, "global_step": 303114, "epoch": 1804} {"train_loss": -12.030608177185059, "global_step": 303115, "epoch": 1804} {"train_loss": -12.515069007873535, "global_step": 303116, "epoch": 1804} {"train_loss": -11.976335525512695, "global_step": 303117, "epoch": 1804} {"train_loss": -11.9835205078125, "global_step": 303118, "epoch": 1804} {"train_loss": -12.003456115722656, "global_step": 303119, "epoch": 1804} {"train_loss": -11.59074592590332, "global_step": 303120, "epoch": 1804} {"train_loss": -11.454170227050781, "global_step": 303121, "epoch": 1804} {"train_loss": -12.026968002319336, "global_step": 303122, "epoch": 1804} {"train_loss": -11.884244918823242, "global_step": 303123, "epoch": 1804} {"train_loss": -10.942768096923828, "global_step": 303124, "epoch": 1804} {"train_loss": -11.668827056884766, "global_step": 303125, "epoch": 1804} {"train_loss": -11.121389389038086, "global_step": 303126, "epoch": 1804} {"train_loss": -10.924538612365723, "global_step": 303127, "epoch": 1804} {"train_loss": -11.628767013549805, "global_step": 303128, "epoch": 1804} {"train_loss": -11.603803634643555, "global_step": 303129, "epoch": 1804} {"train_loss": -11.570341110229492, "global_step": 303130, "epoch": 1804} {"train_loss": -12.083396911621094, "global_step": 303131, "epoch": 1804} {"train_loss": -11.485346794128418, "global_step": 303132, "epoch": 1804} {"train_loss": -11.226442337036133, "global_step": 303133, "epoch": 1804} {"train_loss": -11.70811939239502, "global_step": 303134, "epoch": 1804} {"train_loss": -11.732633590698242, "global_step": 303135, "epoch": 1804} {"train_loss": -11.836309432983398, "global_step": 303136, "epoch": 1804} {"train_loss": -11.507425308227539, "global_step": 303137, "epoch": 1804} {"train_loss": -12.192523956298828, "global_step": 303138, "epoch": 1804} {"train_loss": -12.171594619750977, "global_step": 303139, "epoch": 1804} {"train_loss": -11.720529556274414, "global_step": 303140, "epoch": 1804} {"train_loss": -11.840937614440918, "global_step": 303141, "epoch": 1804} {"train_loss": -11.930166244506836, "global_step": 303142, "epoch": 1804} {"train_loss": -12.133127212524414, "global_step": 303143, "epoch": 1804} {"train_loss": -12.059673309326172, "global_step": 303144, "epoch": 1804} {"train_loss": -11.670513153076172, "global_step": 303145, "epoch": 1804} {"train_loss": -12.091123580932617, "global_step": 303146, "epoch": 1804} {"train_loss": -12.284579277038574, "global_step": 303147, "epoch": 1804} {"train_loss": -11.803136825561523, "global_step": 303148, "epoch": 1804} {"train_loss": -11.870003700256348, "global_step": 303149, "epoch": 1804} {"train_loss": -12.23511791229248, "global_step": 303150, "epoch": 1804} {"train_loss": -11.880510330200195, "global_step": 303151, "epoch": 1804} {"train_loss": -12.22738265991211, "global_step": 303152, "epoch": 1804} {"train_loss": -12.106151580810547, "global_step": 303153, "epoch": 1804} {"train_loss": -12.12319564819336, "global_step": 303154, "epoch": 1804} {"train_loss": -12.183308601379395, "global_step": 303155, "epoch": 1804} {"train_loss": -12.101068496704102, "global_step": 303156, "epoch": 1804} {"train_loss": -12.15794563293457, "global_step": 303157, "epoch": 1804} {"train_loss": -11.624195098876953, "global_step": 303158, "epoch": 1804} {"train_loss": -11.79771900177002, "global_step": 303159, "epoch": 1804} {"train_loss": -11.464652061462402, "global_step": 303160, "epoch": 1804} {"train_loss": -10.628971099853516, "global_step": 303161, "epoch": 1804} {"train_loss": -11.546775817871094, "global_step": 303162, "epoch": 1804} {"train_loss": -11.004226684570312, "global_step": 303163, "epoch": 1804} {"train_loss": -11.91452407836914, "global_step": 303164, "epoch": 1804} {"train_loss": -10.598414421081543, "global_step": 303165, "epoch": 1804} {"train_loss": -11.594404220581055, "global_step": 303166, "epoch": 1804} {"train_loss": -10.750141143798828, "global_step": 303167, "epoch": 1804} {"train_loss": -11.109554290771484, "global_step": 303168, "epoch": 1804} {"train_loss": -11.824615478515625, "global_step": 303169, "epoch": 1804} {"train_loss": -10.68350601196289, "global_step": 303170, "epoch": 1804} {"train_loss": -12.126977920532227, "global_step": 303171, "epoch": 1804} {"train_loss": -10.841470718383789, "global_step": 303172, "epoch": 1804} {"train_loss": -11.511101722717285, "global_step": 303173, "epoch": 1804} {"train_loss": -11.881030082702637, "global_step": 303174, "epoch": 1804} {"train_loss": -11.154489517211914, "global_step": 303175, "epoch": 1804} {"train_loss": -12.216015815734863, "global_step": 303176, "epoch": 1804} {"train_loss": -11.171664237976074, "global_step": 303177, "epoch": 1804} {"train_loss": -11.617230415344238, "global_step": 303178, "epoch": 1804} {"train_loss": -11.942177772521973, "global_step": 303179, "epoch": 1804} {"train_loss": -11.713644027709961, "global_step": 303180, "epoch": 1804} {"train_loss": -11.673831939697266, "global_step": 303181, "epoch": 1804} {"train_loss": -11.044662475585938, "global_step": 303182, "epoch": 1804} {"train_loss": -11.927618026733398, "global_step": 303183, "epoch": 1804} {"train_loss": -10.97430419921875, "global_step": 303184, "epoch": 1804} {"train_loss": -12.058076858520508, "global_step": 303185, "epoch": 1804} {"train_loss": -11.308048248291016, "global_step": 303186, "epoch": 1804} {"train_loss": -11.580333709716797, "global_step": 303187, "epoch": 1804} {"train_loss": -11.249446868896484, "global_step": 303188, "epoch": 1804} {"train_loss": -11.140892028808594, "global_step": 303189, "epoch": 1804} {"train_loss": -10.980045318603516, "global_step": 303190, "epoch": 1804} {"train_loss": -11.567904472351074, "global_step": 303191, "epoch": 1804} {"train_loss": -10.755529403686523, "global_step": 303192, "epoch": 1804} {"train_loss": -11.314781188964844, "global_step": 303193, "epoch": 1804} {"train_loss": -10.26705551147461, "global_step": 303194, "epoch": 1804} {"train_loss": -11.63123893737793, "global_step": 303195, "epoch": 1804} {"train_loss": -10.683843612670898, "global_step": 303196, "epoch": 1804} {"train_loss": -11.537676811218262, "global_step": 303197, "epoch": 1804} {"train_loss": -11.1868896484375, "global_step": 303198, "epoch": 1804} {"train_loss": -11.395713806152344, "global_step": 303199, "epoch": 1804} {"train_loss": -11.168731689453125, "global_step": 303200, "epoch": 1804} {"train_loss": -12.07158088684082, "global_step": 303201, "epoch": 1804} {"train_loss": -10.613557815551758, "global_step": 303202, "epoch": 1804} {"train_loss": -11.769437789916992, "global_step": 303203, "epoch": 1804} {"train_loss": -11.617262840270996, "global_step": 303204, "epoch": 1804} {"train_loss": -11.387192726135254, "global_step": 303205, "epoch": 1804} {"train_loss": -11.926546096801758, "global_step": 303206, "epoch": 1804} {"train_loss": -11.374150276184082, "global_step": 303207, "epoch": 1804} {"train_loss": -11.416646957397461, "global_step": 303208, "epoch": 1804} {"train_loss": -12.135368347167969, "global_step": 303209, "epoch": 1804} {"train_loss": -11.457128524780273, "global_step": 303210, "epoch": 1804} {"train_loss": -11.899231910705566, "global_step": 303211, "epoch": 1804} {"train_loss": -11.76734447479248, "global_step": 303212, "epoch": 1804} {"train_loss": -11.854644775390625, "global_step": 303213, "epoch": 1804} {"train_loss": -11.986238479614258, "global_step": 303214, "epoch": 1804} {"train_loss": -11.771201133728027, "global_step": 303215, "epoch": 1804} {"train_loss": -12.077707290649414, "global_step": 303216, "epoch": 1804} {"train_loss": -12.017085075378418, "global_step": 303217, "epoch": 1804} {"train_loss": -11.999053955078125, "global_step": 303218, "epoch": 1804} {"train_loss": -11.929609298706055, "global_step": 303219, "epoch": 1804} {"train_loss": -11.954835891723633, "global_step": 303220, "epoch": 1804} {"train_loss": -12.102388381958008, "global_step": 303221, "epoch": 1804} {"train_loss": -12.424612045288086, "global_step": 303222, "epoch": 1804} {"train_loss": -12.11068344116211, "global_step": 303223, "epoch": 1804} {"train_loss": -12.143918991088867, "global_step": 303224, "epoch": 1804} {"train_loss": -12.058719635009766, "global_step": 303225, "epoch": 1804} {"train_loss": -12.158808708190918, "global_step": 303226, "epoch": 1804} {"train_loss": -12.202230453491211, "global_step": 303227, "epoch": 1804} {"train_loss": -12.160080909729004, "global_step": 303228, "epoch": 1804} {"train_loss": -12.126087188720703, "global_step": 303229, "epoch": 1804} {"train_loss": -12.298561096191406, "global_step": 303230, "epoch": 1804} {"train_loss": -12.018749237060547, "global_step": 303231, "epoch": 1804} {"train_loss": -12.150605201721191, "global_step": 303232, "epoch": 1804} {"train_loss": -12.062255859375, "global_step": 303233, "epoch": 1804} {"train_loss": -12.149421691894531, "global_step": 303234, "epoch": 1804} {"train_loss": -12.19904899597168, "global_step": 303235, "epoch": 1804} {"train_loss": -12.264789581298828, "global_step": 303236, "epoch": 1804} {"train_loss": -12.040465354919434, "global_step": 303237, "epoch": 1804} {"train_loss": -12.362457275390625, "global_step": 303238, "epoch": 1804} {"train_loss": -11.817219790958223, "global_step": 303239, "epoch": 1804, "val_loss": 280708.78125} {"train_loss": -12.151012420654297, "global_step": 303240, "epoch": 1805} {"train_loss": -12.068359375, "global_step": 303241, "epoch": 1805} {"train_loss": -12.310319900512695, "global_step": 303242, "epoch": 1805} {"train_loss": -12.391925811767578, "global_step": 303243, "epoch": 1805} {"train_loss": -12.003523826599121, "global_step": 303244, "epoch": 1805} {"train_loss": -12.446562767028809, "global_step": 303245, "epoch": 1805} {"train_loss": -12.263982772827148, "global_step": 303246, "epoch": 1805} {"train_loss": -12.298049926757812, "global_step": 303247, "epoch": 1805} {"train_loss": -12.554201126098633, "global_step": 303248, "epoch": 1805} {"train_loss": -12.211511611938477, "global_step": 303249, "epoch": 1805} {"train_loss": -12.405227661132812, "global_step": 303250, "epoch": 1805} {"train_loss": -12.244682312011719, "global_step": 303251, "epoch": 1805} {"train_loss": -12.331766128540039, "global_step": 303252, "epoch": 1805} {"train_loss": -12.236932754516602, "global_step": 303253, "epoch": 1805} {"train_loss": -12.583212852478027, "global_step": 303254, "epoch": 1805} {"train_loss": -12.316139221191406, "global_step": 303255, "epoch": 1805} {"train_loss": -12.2432222366333, "global_step": 303256, "epoch": 1805} {"train_loss": -11.784490585327148, "global_step": 303257, "epoch": 1805} {"train_loss": -11.79692554473877, "global_step": 303258, "epoch": 1805} {"train_loss": -12.297859191894531, "global_step": 303259, "epoch": 1805} {"train_loss": -11.968292236328125, "global_step": 303260, "epoch": 1805} {"train_loss": -12.344206809997559, "global_step": 303261, "epoch": 1805} {"train_loss": -12.047830581665039, "global_step": 303262, "epoch": 1805} {"train_loss": -12.341175079345703, "global_step": 303263, "epoch": 1805} {"train_loss": -12.297996520996094, "global_step": 303264, "epoch": 1805} {"train_loss": -12.331586837768555, "global_step": 303265, "epoch": 1805} {"train_loss": -12.065855979919434, "global_step": 303266, "epoch": 1805} {"train_loss": -11.841802597045898, "global_step": 303267, "epoch": 1805} {"train_loss": -11.984248161315918, "global_step": 303268, "epoch": 1805} {"train_loss": -11.605892181396484, "global_step": 303269, "epoch": 1805} {"train_loss": -12.436670303344727, "global_step": 303270, "epoch": 1805} {"train_loss": -12.076902389526367, "global_step": 303271, "epoch": 1805} {"train_loss": -11.733816146850586, "global_step": 303272, "epoch": 1805} {"train_loss": -12.208142280578613, "global_step": 303273, "epoch": 1805} {"train_loss": -11.70375919342041, "global_step": 303274, "epoch": 1805} {"train_loss": -12.113231658935547, "global_step": 303275, "epoch": 1805} {"train_loss": -11.695821762084961, "global_step": 303276, "epoch": 1805} {"train_loss": -11.84467887878418, "global_step": 303277, "epoch": 1805} {"train_loss": -11.916330337524414, "global_step": 303278, "epoch": 1805} {"train_loss": -11.986379623413086, "global_step": 303279, "epoch": 1805} {"train_loss": -11.577871322631836, "global_step": 303280, "epoch": 1805} {"train_loss": -11.815596580505371, "global_step": 303281, "epoch": 1805} {"train_loss": -11.717941284179688, "global_step": 303282, "epoch": 1805} {"train_loss": -11.514134407043457, "global_step": 303283, "epoch": 1805} {"train_loss": -11.718002319335938, "global_step": 303284, "epoch": 1805} {"train_loss": -12.058785438537598, "global_step": 303285, "epoch": 1805} {"train_loss": -10.322845458984375, "global_step": 303286, "epoch": 1805} {"train_loss": -11.684977531433105, "global_step": 303287, "epoch": 1805} {"train_loss": -10.373014450073242, "global_step": 303288, "epoch": 1805} {"train_loss": -11.057459831237793, "global_step": 303289, "epoch": 1805} {"train_loss": -11.32931137084961, "global_step": 303290, "epoch": 1805} {"train_loss": -11.879015922546387, "global_step": 303291, "epoch": 1805} {"train_loss": -10.957401275634766, "global_step": 303292, "epoch": 1805} {"train_loss": -11.274974822998047, "global_step": 303293, "epoch": 1805} {"train_loss": -11.479355812072754, "global_step": 303294, "epoch": 1805} {"train_loss": -11.496898651123047, "global_step": 303295, "epoch": 1805} {"train_loss": -11.856130599975586, "global_step": 303296, "epoch": 1805} {"train_loss": -11.421642303466797, "global_step": 303297, "epoch": 1805} {"train_loss": -11.428516387939453, "global_step": 303298, "epoch": 1805} {"train_loss": -11.594324111938477, "global_step": 303299, "epoch": 1805} {"train_loss": -10.874741554260254, "global_step": 303300, "epoch": 1805} {"train_loss": -11.371515274047852, "global_step": 303301, "epoch": 1805} {"train_loss": -11.530163764953613, "global_step": 303302, "epoch": 1805} {"train_loss": -10.96900463104248, "global_step": 303303, "epoch": 1805} {"train_loss": -11.296566009521484, "global_step": 303304, "epoch": 1805} {"train_loss": -11.952274322509766, "global_step": 303305, "epoch": 1805} {"train_loss": -10.768314361572266, "global_step": 303306, "epoch": 1805} {"train_loss": -11.150117874145508, "global_step": 303307, "epoch": 1805} {"train_loss": -12.019318580627441, "global_step": 303308, "epoch": 1805} {"train_loss": -11.014425277709961, "global_step": 303309, "epoch": 1805} {"train_loss": -11.884941101074219, "global_step": 303310, "epoch": 1805} {"train_loss": -11.84089183807373, "global_step": 303311, "epoch": 1805} {"train_loss": -11.381807327270508, "global_step": 303312, "epoch": 1805} {"train_loss": -11.623859405517578, "global_step": 303313, "epoch": 1805} {"train_loss": -11.812712669372559, "global_step": 303314, "epoch": 1805} {"train_loss": -11.89460277557373, "global_step": 303315, "epoch": 1805} {"train_loss": -11.76826286315918, "global_step": 303316, "epoch": 1805} {"train_loss": -11.83067798614502, "global_step": 303317, "epoch": 1805} {"train_loss": -11.589813232421875, "global_step": 303318, "epoch": 1805} {"train_loss": -12.294116973876953, "global_step": 303319, "epoch": 1805} {"train_loss": -12.09840202331543, "global_step": 303320, "epoch": 1805} {"train_loss": -11.995044708251953, "global_step": 303321, "epoch": 1805} {"train_loss": -11.76596736907959, "global_step": 303322, "epoch": 1805} {"train_loss": -11.688722610473633, "global_step": 303323, "epoch": 1805} {"train_loss": -11.938318252563477, "global_step": 303324, "epoch": 1805} {"train_loss": -11.959074020385742, "global_step": 303325, "epoch": 1805} {"train_loss": -11.518959045410156, "global_step": 303326, "epoch": 1805} {"train_loss": -12.31314468383789, "global_step": 303327, "epoch": 1805} {"train_loss": -11.886956214904785, "global_step": 303328, "epoch": 1805} {"train_loss": -12.260828018188477, "global_step": 303329, "epoch": 1805} {"train_loss": -12.168149948120117, "global_step": 303330, "epoch": 1805} {"train_loss": -11.877108573913574, "global_step": 303331, "epoch": 1805} {"train_loss": -12.049036026000977, "global_step": 303332, "epoch": 1805} {"train_loss": -12.053425788879395, "global_step": 303333, "epoch": 1805} {"train_loss": -11.788450241088867, "global_step": 303334, "epoch": 1805} {"train_loss": -11.894262313842773, "global_step": 303335, "epoch": 1805} {"train_loss": -11.487236022949219, "global_step": 303336, "epoch": 1805} {"train_loss": -10.732619285583496, "global_step": 303337, "epoch": 1805} {"train_loss": -11.665180206298828, "global_step": 303338, "epoch": 1805} {"train_loss": -10.747452735900879, "global_step": 303339, "epoch": 1805} {"train_loss": -10.310078620910645, "global_step": 303340, "epoch": 1805} {"train_loss": -10.508069038391113, "global_step": 303341, "epoch": 1805} {"train_loss": -10.39741325378418, "global_step": 303342, "epoch": 1805} {"train_loss": -12.000926971435547, "global_step": 303343, "epoch": 1805} {"train_loss": -10.569273948669434, "global_step": 303344, "epoch": 1805} {"train_loss": -11.727849960327148, "global_step": 303345, "epoch": 1805} {"train_loss": -11.734458923339844, "global_step": 303346, "epoch": 1805} {"train_loss": -11.395149230957031, "global_step": 303347, "epoch": 1805} {"train_loss": -11.82740592956543, "global_step": 303348, "epoch": 1805} {"train_loss": -11.80742073059082, "global_step": 303349, "epoch": 1805} {"train_loss": -12.12037467956543, "global_step": 303350, "epoch": 1805} {"train_loss": -11.723583221435547, "global_step": 303351, "epoch": 1805} {"train_loss": -12.296960830688477, "global_step": 303352, "epoch": 1805} {"train_loss": -11.745898246765137, "global_step": 303353, "epoch": 1805} {"train_loss": -12.350038528442383, "global_step": 303354, "epoch": 1805} {"train_loss": -12.019161224365234, "global_step": 303355, "epoch": 1805} {"train_loss": -12.012304306030273, "global_step": 303356, "epoch": 1805} {"train_loss": -12.044079780578613, "global_step": 303357, "epoch": 1805} {"train_loss": -12.179612159729004, "global_step": 303358, "epoch": 1805} {"train_loss": -11.82171630859375, "global_step": 303359, "epoch": 1805} {"train_loss": -12.0687894821167, "global_step": 303360, "epoch": 1805} {"train_loss": -12.280255317687988, "global_step": 303361, "epoch": 1805} {"train_loss": -12.339805603027344, "global_step": 303362, "epoch": 1805} {"train_loss": -12.180824279785156, "global_step": 303363, "epoch": 1805} {"train_loss": -12.116172790527344, "global_step": 303364, "epoch": 1805} {"train_loss": -12.128190994262695, "global_step": 303365, "epoch": 1805} {"train_loss": -12.414039611816406, "global_step": 303366, "epoch": 1805} {"train_loss": -12.132380485534668, "global_step": 303367, "epoch": 1805} {"train_loss": -12.111557006835938, "global_step": 303368, "epoch": 1805} {"train_loss": -12.397607803344727, "global_step": 303369, "epoch": 1805} {"train_loss": -12.193852424621582, "global_step": 303370, "epoch": 1805} {"train_loss": -12.37259578704834, "global_step": 303371, "epoch": 1805} {"train_loss": -12.130693435668945, "global_step": 303372, "epoch": 1805} {"train_loss": -12.294527053833008, "global_step": 303373, "epoch": 1805} {"train_loss": -11.988160133361816, "global_step": 303374, "epoch": 1805} {"train_loss": -12.141761779785156, "global_step": 303375, "epoch": 1805} {"train_loss": -12.332435607910156, "global_step": 303376, "epoch": 1805} {"train_loss": -12.271230697631836, "global_step": 303377, "epoch": 1805} {"train_loss": -12.342672348022461, "global_step": 303378, "epoch": 1805} {"train_loss": -12.33575439453125, "global_step": 303379, "epoch": 1805} {"train_loss": -12.144556045532227, "global_step": 303380, "epoch": 1805} {"train_loss": -12.587007522583008, "global_step": 303381, "epoch": 1805} {"train_loss": -12.582315444946289, "global_step": 303382, "epoch": 1805} {"train_loss": -12.338911056518555, "global_step": 303383, "epoch": 1805} {"train_loss": -12.431852340698242, "global_step": 303384, "epoch": 1805} {"train_loss": -12.146657943725586, "global_step": 303385, "epoch": 1805} {"train_loss": -12.147175788879395, "global_step": 303386, "epoch": 1805} {"train_loss": -12.569564819335938, "global_step": 303387, "epoch": 1805} {"train_loss": -12.39418888092041, "global_step": 303388, "epoch": 1805} {"train_loss": -12.279611587524414, "global_step": 303389, "epoch": 1805} {"train_loss": -12.25444221496582, "global_step": 303390, "epoch": 1805} {"train_loss": -12.3419189453125, "global_step": 303391, "epoch": 1805} {"train_loss": -11.716344833374023, "global_step": 303392, "epoch": 1805} {"train_loss": -12.001524925231934, "global_step": 303393, "epoch": 1805} {"train_loss": -12.140039443969727, "global_step": 303394, "epoch": 1805} {"train_loss": -11.279773712158203, "global_step": 303395, "epoch": 1805} {"train_loss": -12.566673278808594, "global_step": 303396, "epoch": 1805} {"train_loss": -11.431466102600098, "global_step": 303397, "epoch": 1805} {"train_loss": -11.77531623840332, "global_step": 303398, "epoch": 1805} {"train_loss": -11.882621765136719, "global_step": 303399, "epoch": 1805} {"train_loss": -12.175159454345703, "global_step": 303400, "epoch": 1805} {"train_loss": -11.316000938415527, "global_step": 303401, "epoch": 1805} {"train_loss": -12.24003791809082, "global_step": 303402, "epoch": 1805} {"train_loss": -11.731304168701172, "global_step": 303403, "epoch": 1805} {"train_loss": -12.1783447265625, "global_step": 303404, "epoch": 1805} {"train_loss": -11.28803539276123, "global_step": 303405, "epoch": 1805} {"train_loss": -11.281018257141113, "global_step": 303406, "epoch": 1805} {"train_loss": -11.874386248134432, "global_step": 303407, "epoch": 1805, "val_loss": 280379.09375, "train_action_mse_error": 2.669476270675659} {"train_loss": -11.664325714111328, "global_step": 303408, "epoch": 1806} {"train_loss": -11.493169784545898, "global_step": 303409, "epoch": 1806} {"train_loss": -11.551094055175781, "global_step": 303410, "epoch": 1806} {"train_loss": -11.679349899291992, "global_step": 303411, "epoch": 1806} {"train_loss": -12.033561706542969, "global_step": 303412, "epoch": 1806} {"train_loss": -11.598243713378906, "global_step": 303413, "epoch": 1806} {"train_loss": -11.542731285095215, "global_step": 303414, "epoch": 1806} {"train_loss": -11.60559368133545, "global_step": 303415, "epoch": 1806} {"train_loss": -12.127616882324219, "global_step": 303416, "epoch": 1806} {"train_loss": -11.579294204711914, "global_step": 303417, "epoch": 1806} {"train_loss": -11.945707321166992, "global_step": 303418, "epoch": 1806} {"train_loss": -11.908930778503418, "global_step": 303419, "epoch": 1806} {"train_loss": -11.904809951782227, "global_step": 303420, "epoch": 1806} {"train_loss": -12.149181365966797, "global_step": 303421, "epoch": 1806} {"train_loss": -11.982223510742188, "global_step": 303422, "epoch": 1806} {"train_loss": -12.11622428894043, "global_step": 303423, "epoch": 1806} {"train_loss": -11.899078369140625, "global_step": 303424, "epoch": 1806} {"train_loss": -12.211041450500488, "global_step": 303425, "epoch": 1806} {"train_loss": -11.687250137329102, "global_step": 303426, "epoch": 1806} {"train_loss": -12.309989929199219, "global_step": 303427, "epoch": 1806} {"train_loss": -11.798541069030762, "global_step": 303428, "epoch": 1806} {"train_loss": -11.93027114868164, "global_step": 303429, "epoch": 1806} {"train_loss": -11.932194709777832, "global_step": 303430, "epoch": 1806} {"train_loss": -12.21214771270752, "global_step": 303431, "epoch": 1806} {"train_loss": -12.030174255371094, "global_step": 303432, "epoch": 1806} {"train_loss": -11.848278045654297, "global_step": 303433, "epoch": 1806} {"train_loss": -12.072458267211914, "global_step": 303434, "epoch": 1806} {"train_loss": -11.635662078857422, "global_step": 303435, "epoch": 1806} {"train_loss": -12.28695297241211, "global_step": 303436, "epoch": 1806} {"train_loss": -11.73945140838623, "global_step": 303437, "epoch": 1806} {"train_loss": -11.943400382995605, "global_step": 303438, "epoch": 1806} {"train_loss": -11.387554168701172, "global_step": 303439, "epoch": 1806} {"train_loss": -12.069473266601562, "global_step": 303440, "epoch": 1806} {"train_loss": -11.797801971435547, "global_step": 303441, "epoch": 1806} {"train_loss": -11.947847366333008, "global_step": 303442, "epoch": 1806} {"train_loss": -12.229743003845215, "global_step": 303443, "epoch": 1806} {"train_loss": -12.01983642578125, "global_step": 303444, "epoch": 1806} {"train_loss": -11.936914443969727, "global_step": 303445, "epoch": 1806} {"train_loss": -12.340984344482422, "global_step": 303446, "epoch": 1806} {"train_loss": -12.252668380737305, "global_step": 303447, "epoch": 1806} {"train_loss": -12.33348560333252, "global_step": 303448, "epoch": 1806} {"train_loss": -12.130427360534668, "global_step": 303449, "epoch": 1806} {"train_loss": -12.304427146911621, "global_step": 303450, "epoch": 1806} {"train_loss": -11.5618257522583, "global_step": 303451, "epoch": 1806} {"train_loss": -12.223538398742676, "global_step": 303452, "epoch": 1806} {"train_loss": -11.770184516906738, "global_step": 303453, "epoch": 1806} {"train_loss": -12.173280715942383, "global_step": 303454, "epoch": 1806} {"train_loss": -12.165679931640625, "global_step": 303455, "epoch": 1806} {"train_loss": -12.031815528869629, "global_step": 303456, "epoch": 1806} {"train_loss": -11.995511054992676, "global_step": 303457, "epoch": 1806} {"train_loss": -12.149621963500977, "global_step": 303458, "epoch": 1806} {"train_loss": -11.928550720214844, "global_step": 303459, "epoch": 1806} {"train_loss": -12.158273696899414, "global_step": 303460, "epoch": 1806} {"train_loss": -12.437291145324707, "global_step": 303461, "epoch": 1806} {"train_loss": -12.173521041870117, "global_step": 303462, "epoch": 1806} {"train_loss": -12.131994247436523, "global_step": 303463, "epoch": 1806} {"train_loss": -11.90440845489502, "global_step": 303464, "epoch": 1806} {"train_loss": -12.299039840698242, "global_step": 303465, "epoch": 1806} {"train_loss": -12.2322359085083, "global_step": 303466, "epoch": 1806} {"train_loss": -12.352251052856445, "global_step": 303467, "epoch": 1806} {"train_loss": -12.36990737915039, "global_step": 303468, "epoch": 1806} {"train_loss": -12.357078552246094, "global_step": 303469, "epoch": 1806} {"train_loss": -12.27481460571289, "global_step": 303470, "epoch": 1806} {"train_loss": -12.344615936279297, "global_step": 303471, "epoch": 1806} {"train_loss": -12.31173324584961, "global_step": 303472, "epoch": 1806} {"train_loss": -11.891874313354492, "global_step": 303473, "epoch": 1806} {"train_loss": -12.130634307861328, "global_step": 303474, "epoch": 1806} {"train_loss": -12.186068534851074, "global_step": 303475, "epoch": 1806} {"train_loss": -11.893089294433594, "global_step": 303476, "epoch": 1806} {"train_loss": -11.84554672241211, "global_step": 303477, "epoch": 1806} {"train_loss": -12.346342086791992, "global_step": 303478, "epoch": 1806} {"train_loss": -12.24579906463623, "global_step": 303479, "epoch": 1806} {"train_loss": -12.237348556518555, "global_step": 303480, "epoch": 1806} {"train_loss": -12.215837478637695, "global_step": 303481, "epoch": 1806} {"train_loss": -12.379456520080566, "global_step": 303482, "epoch": 1806} {"train_loss": -12.217622756958008, "global_step": 303483, "epoch": 1806} {"train_loss": -12.352165222167969, "global_step": 303484, "epoch": 1806} {"train_loss": -12.205055236816406, "global_step": 303485, "epoch": 1806} {"train_loss": -12.117799758911133, "global_step": 303486, "epoch": 1806} {"train_loss": -12.221231460571289, "global_step": 303487, "epoch": 1806} {"train_loss": -12.551788330078125, "global_step": 303488, "epoch": 1806} {"train_loss": -11.580331802368164, "global_step": 303489, "epoch": 1806} {"train_loss": -11.025283813476562, "global_step": 303490, "epoch": 1806} {"train_loss": -11.72892951965332, "global_step": 303491, "epoch": 1806} {"train_loss": -11.373228073120117, "global_step": 303492, "epoch": 1806} {"train_loss": -12.476179122924805, "global_step": 303493, "epoch": 1806} {"train_loss": -11.798105239868164, "global_step": 303494, "epoch": 1806} {"train_loss": -12.069952011108398, "global_step": 303495, "epoch": 1806} {"train_loss": -11.981801986694336, "global_step": 303496, "epoch": 1806} {"train_loss": -12.187871932983398, "global_step": 303497, "epoch": 1806} {"train_loss": -11.582623481750488, "global_step": 303498, "epoch": 1806} {"train_loss": -12.351272583007812, "global_step": 303499, "epoch": 1806} {"train_loss": -11.913273811340332, "global_step": 303500, "epoch": 1806} {"train_loss": -11.756048202514648, "global_step": 303501, "epoch": 1806} {"train_loss": -11.748835563659668, "global_step": 303502, "epoch": 1806} {"train_loss": -11.842288970947266, "global_step": 303503, "epoch": 1806} {"train_loss": -12.25560188293457, "global_step": 303504, "epoch": 1806} {"train_loss": -11.714926719665527, "global_step": 303505, "epoch": 1806} {"train_loss": -10.105535507202148, "global_step": 303506, "epoch": 1806} {"train_loss": -10.829377174377441, "global_step": 303507, "epoch": 1806} {"train_loss": -11.83215618133545, "global_step": 303508, "epoch": 1806} {"train_loss": -11.277158737182617, "global_step": 303509, "epoch": 1806} {"train_loss": -10.64663028717041, "global_step": 303510, "epoch": 1806} {"train_loss": -11.699153900146484, "global_step": 303511, "epoch": 1806} {"train_loss": -10.821063995361328, "global_step": 303512, "epoch": 1806} {"train_loss": -10.389471054077148, "global_step": 303513, "epoch": 1806} {"train_loss": -11.784387588500977, "global_step": 303514, "epoch": 1806} {"train_loss": -9.989517211914062, "global_step": 303515, "epoch": 1806} {"train_loss": -11.652469635009766, "global_step": 303516, "epoch": 1806} {"train_loss": -11.098313331604004, "global_step": 303517, "epoch": 1806} {"train_loss": -10.518227577209473, "global_step": 303518, "epoch": 1806} {"train_loss": -12.074182510375977, "global_step": 303519, "epoch": 1806} {"train_loss": -9.539514541625977, "global_step": 303520, "epoch": 1806} {"train_loss": -10.86053466796875, "global_step": 303521, "epoch": 1806} {"train_loss": -11.566093444824219, "global_step": 303522, "epoch": 1806} {"train_loss": -11.357071876525879, "global_step": 303523, "epoch": 1806} {"train_loss": -11.441017150878906, "global_step": 303524, "epoch": 1806} {"train_loss": -10.956167221069336, "global_step": 303525, "epoch": 1806} {"train_loss": -10.761493682861328, "global_step": 303526, "epoch": 1806} {"train_loss": -12.097692489624023, "global_step": 303527, "epoch": 1806} {"train_loss": -11.723159790039062, "global_step": 303528, "epoch": 1806} {"train_loss": -11.506999969482422, "global_step": 303529, "epoch": 1806} {"train_loss": -10.880317687988281, "global_step": 303530, "epoch": 1806} {"train_loss": -10.790224075317383, "global_step": 303531, "epoch": 1806} {"train_loss": -10.78756046295166, "global_step": 303532, "epoch": 1806} {"train_loss": -11.118366241455078, "global_step": 303533, "epoch": 1806} {"train_loss": -11.575204849243164, "global_step": 303534, "epoch": 1806} {"train_loss": -11.294353485107422, "global_step": 303535, "epoch": 1806} {"train_loss": -11.508325576782227, "global_step": 303536, "epoch": 1806} {"train_loss": -11.417176246643066, "global_step": 303537, "epoch": 1806} {"train_loss": -11.631311416625977, "global_step": 303538, "epoch": 1806} {"train_loss": -11.423022270202637, "global_step": 303539, "epoch": 1806} {"train_loss": -11.758794784545898, "global_step": 303540, "epoch": 1806} {"train_loss": -11.229267120361328, "global_step": 303541, "epoch": 1806} {"train_loss": -11.707788467407227, "global_step": 303542, "epoch": 1806} {"train_loss": -11.523056030273438, "global_step": 303543, "epoch": 1806} {"train_loss": -11.717513084411621, "global_step": 303544, "epoch": 1806} {"train_loss": -11.628518104553223, "global_step": 303545, "epoch": 1806} {"train_loss": -11.809684753417969, "global_step": 303546, "epoch": 1806} {"train_loss": -11.74653434753418, "global_step": 303547, "epoch": 1806} {"train_loss": -11.671448707580566, "global_step": 303548, "epoch": 1806} {"train_loss": -11.885684967041016, "global_step": 303549, "epoch": 1806} {"train_loss": -11.958773612976074, "global_step": 303550, "epoch": 1806} {"train_loss": -12.067938804626465, "global_step": 303551, "epoch": 1806} {"train_loss": -11.871855735778809, "global_step": 303552, "epoch": 1806} {"train_loss": -11.911067962646484, "global_step": 303553, "epoch": 1806} {"train_loss": -12.136404037475586, "global_step": 303554, "epoch": 1806} {"train_loss": -11.916656494140625, "global_step": 303555, "epoch": 1806} {"train_loss": -11.915582656860352, "global_step": 303556, "epoch": 1806} {"train_loss": -11.82113265991211, "global_step": 303557, "epoch": 1806} {"train_loss": -11.733488082885742, "global_step": 303558, "epoch": 1806} {"train_loss": -11.883220672607422, "global_step": 303559, "epoch": 1806} {"train_loss": -11.629046440124512, "global_step": 303560, "epoch": 1806} {"train_loss": -11.906320571899414, "global_step": 303561, "epoch": 1806} {"train_loss": -11.504323959350586, "global_step": 303562, "epoch": 1806} {"train_loss": -12.012161254882812, "global_step": 303563, "epoch": 1806} {"train_loss": -12.189071655273438, "global_step": 303564, "epoch": 1806} {"train_loss": -11.840291976928711, "global_step": 303565, "epoch": 1806} {"train_loss": -12.162168502807617, "global_step": 303566, "epoch": 1806} {"train_loss": -11.737772941589355, "global_step": 303567, "epoch": 1806} {"train_loss": -12.136674880981445, "global_step": 303568, "epoch": 1806} {"train_loss": -11.868529319763184, "global_step": 303569, "epoch": 1806} {"train_loss": -12.180256843566895, "global_step": 303570, "epoch": 1806} {"train_loss": -11.824430465698242, "global_step": 303571, "epoch": 1806} {"train_loss": -12.209238052368164, "global_step": 303572, "epoch": 1806} {"train_loss": -11.915294647216797, "global_step": 303573, "epoch": 1806} {"train_loss": -11.802000045776367, "global_step": 303574, "epoch": 1806} {"train_loss": -11.800736637342544, "global_step": 303575, "epoch": 1806, "val_loss": 284133.0} {"train_loss": -11.927207946777344, "global_step": 303576, "epoch": 1807} {"train_loss": -11.680147171020508, "global_step": 303577, "epoch": 1807} {"train_loss": -11.57876205444336, "global_step": 303578, "epoch": 1807} {"train_loss": -11.872415542602539, "global_step": 303579, "epoch": 1807} {"train_loss": -11.638328552246094, "global_step": 303580, "epoch": 1807} {"train_loss": -11.527068138122559, "global_step": 303581, "epoch": 1807} {"train_loss": -11.497190475463867, "global_step": 303582, "epoch": 1807} {"train_loss": -12.137443542480469, "global_step": 303583, "epoch": 1807} {"train_loss": -11.463323593139648, "global_step": 303584, "epoch": 1807} {"train_loss": -11.920522689819336, "global_step": 303585, "epoch": 1807} {"train_loss": -11.655431747436523, "global_step": 303586, "epoch": 1807} {"train_loss": -11.881746292114258, "global_step": 303587, "epoch": 1807} {"train_loss": -12.043659210205078, "global_step": 303588, "epoch": 1807} {"train_loss": -11.006479263305664, "global_step": 303589, "epoch": 1807} {"train_loss": -12.23238754272461, "global_step": 303590, "epoch": 1807} {"train_loss": -11.281896591186523, "global_step": 303591, "epoch": 1807} {"train_loss": -12.029565811157227, "global_step": 303592, "epoch": 1807} {"train_loss": -11.725872039794922, "global_step": 303593, "epoch": 1807} {"train_loss": -12.19904899597168, "global_step": 303594, "epoch": 1807} {"train_loss": -11.887672424316406, "global_step": 303595, "epoch": 1807} {"train_loss": -11.608440399169922, "global_step": 303596, "epoch": 1807} {"train_loss": -11.872330665588379, "global_step": 303597, "epoch": 1807} {"train_loss": -11.69473648071289, "global_step": 303598, "epoch": 1807} {"train_loss": -12.007474899291992, "global_step": 303599, "epoch": 1807} {"train_loss": -11.898120880126953, "global_step": 303600, "epoch": 1807} {"train_loss": -11.902196884155273, "global_step": 303601, "epoch": 1807} {"train_loss": -11.90760612487793, "global_step": 303602, "epoch": 1807} {"train_loss": -11.910430908203125, "global_step": 303603, "epoch": 1807} {"train_loss": -12.024187088012695, "global_step": 303604, "epoch": 1807} {"train_loss": -11.64973258972168, "global_step": 303605, "epoch": 1807} {"train_loss": -12.029078483581543, "global_step": 303606, "epoch": 1807} {"train_loss": -11.854247093200684, "global_step": 303607, "epoch": 1807} {"train_loss": -12.30170726776123, "global_step": 303608, "epoch": 1807} {"train_loss": -11.463252067565918, "global_step": 303609, "epoch": 1807} {"train_loss": -12.290740966796875, "global_step": 303610, "epoch": 1807} {"train_loss": -11.804622650146484, "global_step": 303611, "epoch": 1807} {"train_loss": -12.227521896362305, "global_step": 303612, "epoch": 1807} {"train_loss": -12.232337951660156, "global_step": 303613, "epoch": 1807} {"train_loss": -12.118646621704102, "global_step": 303614, "epoch": 1807} {"train_loss": -12.184457778930664, "global_step": 303615, "epoch": 1807} {"train_loss": -11.903936386108398, "global_step": 303616, "epoch": 1807} {"train_loss": -12.325542449951172, "global_step": 303617, "epoch": 1807} {"train_loss": -11.728052139282227, "global_step": 303618, "epoch": 1807} {"train_loss": -12.306553840637207, "global_step": 303619, "epoch": 1807} {"train_loss": -11.852007865905762, "global_step": 303620, "epoch": 1807} {"train_loss": -12.391439437866211, "global_step": 303621, "epoch": 1807} {"train_loss": -12.168741226196289, "global_step": 303622, "epoch": 1807} {"train_loss": -12.146157264709473, "global_step": 303623, "epoch": 1807} {"train_loss": -12.120916366577148, "global_step": 303624, "epoch": 1807} {"train_loss": -12.364480018615723, "global_step": 303625, "epoch": 1807} {"train_loss": -12.323238372802734, "global_step": 303626, "epoch": 1807} {"train_loss": -12.494026184082031, "global_step": 303627, "epoch": 1807} {"train_loss": -12.190207481384277, "global_step": 303628, "epoch": 1807} {"train_loss": -12.30419921875, "global_step": 303629, "epoch": 1807} {"train_loss": -12.214844703674316, "global_step": 303630, "epoch": 1807} {"train_loss": -12.400520324707031, "global_step": 303631, "epoch": 1807} {"train_loss": -12.377510070800781, "global_step": 303632, "epoch": 1807} {"train_loss": -12.510725021362305, "global_step": 303633, "epoch": 1807} {"train_loss": -12.674188613891602, "global_step": 303634, "epoch": 1807} {"train_loss": -12.31110954284668, "global_step": 303635, "epoch": 1807} {"train_loss": -12.461823463439941, "global_step": 303636, "epoch": 1807} {"train_loss": -12.58189868927002, "global_step": 303637, "epoch": 1807} {"train_loss": -12.482921600341797, "global_step": 303638, "epoch": 1807} {"train_loss": -12.383163452148438, "global_step": 303639, "epoch": 1807} {"train_loss": -12.494380950927734, "global_step": 303640, "epoch": 1807} {"train_loss": -12.529884338378906, "global_step": 303641, "epoch": 1807} {"train_loss": -12.326493263244629, "global_step": 303642, "epoch": 1807} {"train_loss": -12.635332107543945, "global_step": 303643, "epoch": 1807} {"train_loss": -12.471153259277344, "global_step": 303644, "epoch": 1807} {"train_loss": -12.16403579711914, "global_step": 303645, "epoch": 1807} {"train_loss": -12.365923881530762, "global_step": 303646, "epoch": 1807} {"train_loss": -12.459075927734375, "global_step": 303647, "epoch": 1807} {"train_loss": -12.220858573913574, "global_step": 303648, "epoch": 1807} {"train_loss": -12.537010192871094, "global_step": 303649, "epoch": 1807} {"train_loss": -12.332728385925293, "global_step": 303650, "epoch": 1807} {"train_loss": -12.433412551879883, "global_step": 303651, "epoch": 1807} {"train_loss": -12.669361114501953, "global_step": 303652, "epoch": 1807} {"train_loss": -12.365304946899414, "global_step": 303653, "epoch": 1807} {"train_loss": -12.45811653137207, "global_step": 303654, "epoch": 1807} {"train_loss": -12.431604385375977, "global_step": 303655, "epoch": 1807} {"train_loss": -11.971654891967773, "global_step": 303656, "epoch": 1807} {"train_loss": -12.483521461486816, "global_step": 303657, "epoch": 1807} {"train_loss": -11.833932876586914, "global_step": 303658, "epoch": 1807} {"train_loss": -11.827720642089844, "global_step": 303659, "epoch": 1807} {"train_loss": -12.436807632446289, "global_step": 303660, "epoch": 1807} {"train_loss": -12.399124145507812, "global_step": 303661, "epoch": 1807} {"train_loss": -12.248971939086914, "global_step": 303662, "epoch": 1807} {"train_loss": -12.2261962890625, "global_step": 303663, "epoch": 1807} {"train_loss": -11.493659019470215, "global_step": 303664, "epoch": 1807} {"train_loss": -11.36787223815918, "global_step": 303665, "epoch": 1807} {"train_loss": -12.020134925842285, "global_step": 303666, "epoch": 1807} {"train_loss": -11.796327590942383, "global_step": 303667, "epoch": 1807} {"train_loss": -12.069740295410156, "global_step": 303668, "epoch": 1807} {"train_loss": -11.974199295043945, "global_step": 303669, "epoch": 1807} {"train_loss": -12.04007339477539, "global_step": 303670, "epoch": 1807} {"train_loss": -10.92048454284668, "global_step": 303671, "epoch": 1807} {"train_loss": -11.772344589233398, "global_step": 303672, "epoch": 1807} {"train_loss": -11.366783142089844, "global_step": 303673, "epoch": 1807} {"train_loss": -11.19679069519043, "global_step": 303674, "epoch": 1807} {"train_loss": -11.309686660766602, "global_step": 303675, "epoch": 1807} {"train_loss": -11.56203842163086, "global_step": 303676, "epoch": 1807} {"train_loss": -9.866812705993652, "global_step": 303677, "epoch": 1807} {"train_loss": -11.656549453735352, "global_step": 303678, "epoch": 1807} {"train_loss": -9.83137321472168, "global_step": 303679, "epoch": 1807} {"train_loss": -10.535799026489258, "global_step": 303680, "epoch": 1807} {"train_loss": -10.410737991333008, "global_step": 303681, "epoch": 1807} {"train_loss": -10.323308944702148, "global_step": 303682, "epoch": 1807} {"train_loss": -10.640114784240723, "global_step": 303683, "epoch": 1807} {"train_loss": -10.846136093139648, "global_step": 303684, "epoch": 1807} {"train_loss": -11.132303237915039, "global_step": 303685, "epoch": 1807} {"train_loss": -11.156732559204102, "global_step": 303686, "epoch": 1807} {"train_loss": -10.834199905395508, "global_step": 303687, "epoch": 1807} {"train_loss": -10.465667724609375, "global_step": 303688, "epoch": 1807} {"train_loss": -10.54731559753418, "global_step": 303689, "epoch": 1807} {"train_loss": -11.913265228271484, "global_step": 303690, "epoch": 1807} {"train_loss": -11.54686164855957, "global_step": 303691, "epoch": 1807} {"train_loss": -11.770370483398438, "global_step": 303692, "epoch": 1807} {"train_loss": -11.901676177978516, "global_step": 303693, "epoch": 1807} {"train_loss": -11.905861854553223, "global_step": 303694, "epoch": 1807} {"train_loss": -12.153829574584961, "global_step": 303695, "epoch": 1807} {"train_loss": -12.160799026489258, "global_step": 303696, "epoch": 1807} {"train_loss": -12.099061965942383, "global_step": 303697, "epoch": 1807} {"train_loss": -12.0565824508667, "global_step": 303698, "epoch": 1807} {"train_loss": -12.120979309082031, "global_step": 303699, "epoch": 1807} {"train_loss": -11.677507400512695, "global_step": 303700, "epoch": 1807} {"train_loss": -12.063797950744629, "global_step": 303701, "epoch": 1807} {"train_loss": -12.120832443237305, "global_step": 303702, "epoch": 1807} {"train_loss": -12.065610885620117, "global_step": 303703, "epoch": 1807} {"train_loss": -12.154964447021484, "global_step": 303704, "epoch": 1807} {"train_loss": -11.939453125, "global_step": 303705, "epoch": 1807} {"train_loss": -11.976003646850586, "global_step": 303706, "epoch": 1807} {"train_loss": -11.937691688537598, "global_step": 303707, "epoch": 1807} {"train_loss": -12.26040267944336, "global_step": 303708, "epoch": 1807} {"train_loss": -12.259243965148926, "global_step": 303709, "epoch": 1807} {"train_loss": -12.167052268981934, "global_step": 303710, "epoch": 1807} {"train_loss": -12.124029159545898, "global_step": 303711, "epoch": 1807} {"train_loss": -12.00424575805664, "global_step": 303712, "epoch": 1807} {"train_loss": -11.906343460083008, "global_step": 303713, "epoch": 1807} {"train_loss": -12.232951164245605, "global_step": 303714, "epoch": 1807} {"train_loss": -12.422769546508789, "global_step": 303715, "epoch": 1807} {"train_loss": -12.164398193359375, "global_step": 303716, "epoch": 1807} {"train_loss": -12.02592658996582, "global_step": 303717, "epoch": 1807} {"train_loss": -12.109785079956055, "global_step": 303718, "epoch": 1807} {"train_loss": -12.137155532836914, "global_step": 303719, "epoch": 1807} {"train_loss": -12.066242218017578, "global_step": 303720, "epoch": 1807} {"train_loss": -12.113157272338867, "global_step": 303721, "epoch": 1807} {"train_loss": -12.210836410522461, "global_step": 303722, "epoch": 1807} {"train_loss": -12.342565536499023, "global_step": 303723, "epoch": 1807} {"train_loss": -12.055373191833496, "global_step": 303724, "epoch": 1807} {"train_loss": -12.503392219543457, "global_step": 303725, "epoch": 1807} {"train_loss": -12.194906234741211, "global_step": 303726, "epoch": 1807} {"train_loss": -12.264167785644531, "global_step": 303727, "epoch": 1807} {"train_loss": -11.992210388183594, "global_step": 303728, "epoch": 1807} {"train_loss": -12.202744483947754, "global_step": 303729, "epoch": 1807} {"train_loss": -11.901521682739258, "global_step": 303730, "epoch": 1807} {"train_loss": -12.019366264343262, "global_step": 303731, "epoch": 1807} {"train_loss": -12.048040390014648, "global_step": 303732, "epoch": 1807} {"train_loss": -11.895350456237793, "global_step": 303733, "epoch": 1807} {"train_loss": -11.855119705200195, "global_step": 303734, "epoch": 1807} {"train_loss": -12.262123107910156, "global_step": 303735, "epoch": 1807} {"train_loss": -11.590139389038086, "global_step": 303736, "epoch": 1807} {"train_loss": -11.874593734741211, "global_step": 303737, "epoch": 1807} {"train_loss": -12.3930082321167, "global_step": 303738, "epoch": 1807} {"train_loss": -11.853504180908203, "global_step": 303739, "epoch": 1807} {"train_loss": -11.860706329345703, "global_step": 303740, "epoch": 1807} {"train_loss": -11.765799522399902, "global_step": 303741, "epoch": 1807} {"train_loss": -11.069032669067383, "global_step": 303742, "epoch": 1807} {"train_loss": -11.931330913589115, "global_step": 303743, "epoch": 1807, "val_loss": 277839.9375} {"train_loss": -11.449539184570312, "global_step": 303744, "epoch": 1808} {"train_loss": -11.738362312316895, "global_step": 303745, "epoch": 1808} {"train_loss": -12.096907615661621, "global_step": 303746, "epoch": 1808} {"train_loss": -11.656562805175781, "global_step": 303747, "epoch": 1808} {"train_loss": -11.904626846313477, "global_step": 303748, "epoch": 1808} {"train_loss": -11.954450607299805, "global_step": 303749, "epoch": 1808} {"train_loss": -11.981487274169922, "global_step": 303750, "epoch": 1808} {"train_loss": -12.075033187866211, "global_step": 303751, "epoch": 1808} {"train_loss": -12.022981643676758, "global_step": 303752, "epoch": 1808} {"train_loss": -12.010383605957031, "global_step": 303753, "epoch": 1808} {"train_loss": -12.13629150390625, "global_step": 303754, "epoch": 1808} {"train_loss": -11.571911811828613, "global_step": 303755, "epoch": 1808} {"train_loss": -11.788654327392578, "global_step": 303756, "epoch": 1808} {"train_loss": -12.00457763671875, "global_step": 303757, "epoch": 1808} {"train_loss": -10.534222602844238, "global_step": 303758, "epoch": 1808} {"train_loss": -11.754327774047852, "global_step": 303759, "epoch": 1808} {"train_loss": -11.491395950317383, "global_step": 303760, "epoch": 1808} {"train_loss": -11.930482864379883, "global_step": 303761, "epoch": 1808} {"train_loss": -11.997600555419922, "global_step": 303762, "epoch": 1808} {"train_loss": -11.645194053649902, "global_step": 303763, "epoch": 1808} {"train_loss": -11.708234786987305, "global_step": 303764, "epoch": 1808} {"train_loss": -12.167208671569824, "global_step": 303765, "epoch": 1808} {"train_loss": -11.962061882019043, "global_step": 303766, "epoch": 1808} {"train_loss": -11.765145301818848, "global_step": 303767, "epoch": 1808} {"train_loss": -11.530939102172852, "global_step": 303768, "epoch": 1808} {"train_loss": -11.456167221069336, "global_step": 303769, "epoch": 1808} {"train_loss": -11.670772552490234, "global_step": 303770, "epoch": 1808} {"train_loss": -11.896773338317871, "global_step": 303771, "epoch": 1808} {"train_loss": -11.512434005737305, "global_step": 303772, "epoch": 1808} {"train_loss": -11.644903182983398, "global_step": 303773, "epoch": 1808} {"train_loss": -10.694711685180664, "global_step": 303774, "epoch": 1808} {"train_loss": -11.669652938842773, "global_step": 303775, "epoch": 1808} {"train_loss": -10.69516372680664, "global_step": 303776, "epoch": 1808} {"train_loss": -11.451395034790039, "global_step": 303777, "epoch": 1808} {"train_loss": -11.169626235961914, "global_step": 303778, "epoch": 1808} {"train_loss": -11.318803787231445, "global_step": 303779, "epoch": 1808} {"train_loss": -11.017595291137695, "global_step": 303780, "epoch": 1808} {"train_loss": -11.76937484741211, "global_step": 303781, "epoch": 1808} {"train_loss": -10.599981307983398, "global_step": 303782, "epoch": 1808} {"train_loss": -11.249605178833008, "global_step": 303783, "epoch": 1808} {"train_loss": -10.836671829223633, "global_step": 303784, "epoch": 1808} {"train_loss": -10.856932640075684, "global_step": 303785, "epoch": 1808} {"train_loss": -11.653581619262695, "global_step": 303786, "epoch": 1808} {"train_loss": -10.217576026916504, "global_step": 303787, "epoch": 1808} {"train_loss": -11.481743812561035, "global_step": 303788, "epoch": 1808} {"train_loss": -10.692829132080078, "global_step": 303789, "epoch": 1808} {"train_loss": -11.509706497192383, "global_step": 303790, "epoch": 1808} {"train_loss": -10.710436820983887, "global_step": 303791, "epoch": 1808} {"train_loss": -11.439613342285156, "global_step": 303792, "epoch": 1808} {"train_loss": -11.066104888916016, "global_step": 303793, "epoch": 1808} {"train_loss": -11.719364166259766, "global_step": 303794, "epoch": 1808} {"train_loss": -10.68472957611084, "global_step": 303795, "epoch": 1808} {"train_loss": -11.845748901367188, "global_step": 303796, "epoch": 1808} {"train_loss": -10.963329315185547, "global_step": 303797, "epoch": 1808} {"train_loss": -11.570756912231445, "global_step": 303798, "epoch": 1808} {"train_loss": -11.247492790222168, "global_step": 303799, "epoch": 1808} {"train_loss": -11.386711120605469, "global_step": 303800, "epoch": 1808} {"train_loss": -11.049976348876953, "global_step": 303801, "epoch": 1808} {"train_loss": -11.450874328613281, "global_step": 303802, "epoch": 1808} {"train_loss": -11.989896774291992, "global_step": 303803, "epoch": 1808} {"train_loss": -10.961509704589844, "global_step": 303804, "epoch": 1808} {"train_loss": -11.27175235748291, "global_step": 303805, "epoch": 1808} {"train_loss": -12.054952621459961, "global_step": 303806, "epoch": 1808} {"train_loss": -11.426284790039062, "global_step": 303807, "epoch": 1808} {"train_loss": -11.669862747192383, "global_step": 303808, "epoch": 1808} {"train_loss": -11.905496597290039, "global_step": 303809, "epoch": 1808} {"train_loss": -11.350691795349121, "global_step": 303810, "epoch": 1808} {"train_loss": -12.071904182434082, "global_step": 303811, "epoch": 1808} {"train_loss": -11.490301132202148, "global_step": 303812, "epoch": 1808} {"train_loss": -11.584847450256348, "global_step": 303813, "epoch": 1808} {"train_loss": -11.525625228881836, "global_step": 303814, "epoch": 1808} {"train_loss": -12.100212097167969, "global_step": 303815, "epoch": 1808} {"train_loss": -11.83774185180664, "global_step": 303816, "epoch": 1808} {"train_loss": -11.983083724975586, "global_step": 303817, "epoch": 1808} {"train_loss": -11.910484313964844, "global_step": 303818, "epoch": 1808} {"train_loss": -11.787710189819336, "global_step": 303819, "epoch": 1808} {"train_loss": -11.74990463256836, "global_step": 303820, "epoch": 1808} {"train_loss": -11.55722427368164, "global_step": 303821, "epoch": 1808} {"train_loss": -12.085275650024414, "global_step": 303822, "epoch": 1808} {"train_loss": -11.820850372314453, "global_step": 303823, "epoch": 1808} {"train_loss": -12.214469909667969, "global_step": 303824, "epoch": 1808} {"train_loss": -11.643513679504395, "global_step": 303825, "epoch": 1808} {"train_loss": -12.09478759765625, "global_step": 303826, "epoch": 1808} {"train_loss": -11.751668930053711, "global_step": 303827, "epoch": 1808} {"train_loss": -12.147634506225586, "global_step": 303828, "epoch": 1808} {"train_loss": -12.159311294555664, "global_step": 303829, "epoch": 1808} {"train_loss": -11.826931953430176, "global_step": 303830, "epoch": 1808} {"train_loss": -12.096667289733887, "global_step": 303831, "epoch": 1808} {"train_loss": -11.703861236572266, "global_step": 303832, "epoch": 1808} {"train_loss": -12.16671371459961, "global_step": 303833, "epoch": 1808} {"train_loss": -11.885431289672852, "global_step": 303834, "epoch": 1808} {"train_loss": -11.793755531311035, "global_step": 303835, "epoch": 1808} {"train_loss": -11.654512405395508, "global_step": 303836, "epoch": 1808} {"train_loss": -11.883363723754883, "global_step": 303837, "epoch": 1808} {"train_loss": -11.432438850402832, "global_step": 303838, "epoch": 1808} {"train_loss": -11.928359985351562, "global_step": 303839, "epoch": 1808} {"train_loss": -11.579870223999023, "global_step": 303840, "epoch": 1808} {"train_loss": -11.377495765686035, "global_step": 303841, "epoch": 1808} {"train_loss": -11.74138355255127, "global_step": 303842, "epoch": 1808} {"train_loss": -12.18453598022461, "global_step": 303843, "epoch": 1808} {"train_loss": -11.723526000976562, "global_step": 303844, "epoch": 1808} {"train_loss": -11.947305679321289, "global_step": 303845, "epoch": 1808} {"train_loss": -11.724900245666504, "global_step": 303846, "epoch": 1808} {"train_loss": -11.719442367553711, "global_step": 303847, "epoch": 1808} {"train_loss": -11.74504280090332, "global_step": 303848, "epoch": 1808} {"train_loss": -11.896358489990234, "global_step": 303849, "epoch": 1808} {"train_loss": -11.802263259887695, "global_step": 303850, "epoch": 1808} {"train_loss": -11.608760833740234, "global_step": 303851, "epoch": 1808} {"train_loss": -12.11235523223877, "global_step": 303852, "epoch": 1808} {"train_loss": -11.553590774536133, "global_step": 303853, "epoch": 1808} {"train_loss": -12.178314208984375, "global_step": 303854, "epoch": 1808} {"train_loss": -11.696279525756836, "global_step": 303855, "epoch": 1808} {"train_loss": -12.06761646270752, "global_step": 303856, "epoch": 1808} {"train_loss": -12.091100692749023, "global_step": 303857, "epoch": 1808} {"train_loss": -11.913888931274414, "global_step": 303858, "epoch": 1808} {"train_loss": -11.934362411499023, "global_step": 303859, "epoch": 1808} {"train_loss": -12.164443969726562, "global_step": 303860, "epoch": 1808} {"train_loss": -11.95046615600586, "global_step": 303861, "epoch": 1808} {"train_loss": -12.02194595336914, "global_step": 303862, "epoch": 1808} {"train_loss": -11.448629379272461, "global_step": 303863, "epoch": 1808} {"train_loss": -12.213703155517578, "global_step": 303864, "epoch": 1808} {"train_loss": -11.631282806396484, "global_step": 303865, "epoch": 1808} {"train_loss": -11.724319458007812, "global_step": 303866, "epoch": 1808} {"train_loss": -12.306697845458984, "global_step": 303867, "epoch": 1808} {"train_loss": -11.69683837890625, "global_step": 303868, "epoch": 1808} {"train_loss": -12.389610290527344, "global_step": 303869, "epoch": 1808} {"train_loss": -12.01539421081543, "global_step": 303870, "epoch": 1808} {"train_loss": -11.847235679626465, "global_step": 303871, "epoch": 1808} {"train_loss": -12.228118896484375, "global_step": 303872, "epoch": 1808} {"train_loss": -11.881071090698242, "global_step": 303873, "epoch": 1808} {"train_loss": -11.832512855529785, "global_step": 303874, "epoch": 1808} {"train_loss": -12.340152740478516, "global_step": 303875, "epoch": 1808} {"train_loss": -11.616111755371094, "global_step": 303876, "epoch": 1808} {"train_loss": -11.325494766235352, "global_step": 303877, "epoch": 1808} {"train_loss": -12.124055862426758, "global_step": 303878, "epoch": 1808} {"train_loss": -11.556509017944336, "global_step": 303879, "epoch": 1808} {"train_loss": -11.631247520446777, "global_step": 303880, "epoch": 1808} {"train_loss": -11.653785705566406, "global_step": 303881, "epoch": 1808} {"train_loss": -11.504939079284668, "global_step": 303882, "epoch": 1808} {"train_loss": -11.843132019042969, "global_step": 303883, "epoch": 1808} {"train_loss": -12.008522033691406, "global_step": 303884, "epoch": 1808} {"train_loss": -11.267026901245117, "global_step": 303885, "epoch": 1808} {"train_loss": -12.12568473815918, "global_step": 303886, "epoch": 1808} {"train_loss": -11.248722076416016, "global_step": 303887, "epoch": 1808} {"train_loss": -11.919242858886719, "global_step": 303888, "epoch": 1808} {"train_loss": -11.752853393554688, "global_step": 303889, "epoch": 1808} {"train_loss": -12.414619445800781, "global_step": 303890, "epoch": 1808} {"train_loss": -11.802271842956543, "global_step": 303891, "epoch": 1808} {"train_loss": -12.07606315612793, "global_step": 303892, "epoch": 1808} {"train_loss": -11.821014404296875, "global_step": 303893, "epoch": 1808} {"train_loss": -12.054332733154297, "global_step": 303894, "epoch": 1808} {"train_loss": -11.859066009521484, "global_step": 303895, "epoch": 1808} {"train_loss": -12.317691802978516, "global_step": 303896, "epoch": 1808} {"train_loss": -11.89974594116211, "global_step": 303897, "epoch": 1808} {"train_loss": -12.225434303283691, "global_step": 303898, "epoch": 1808} {"train_loss": -12.073163986206055, "global_step": 303899, "epoch": 1808} {"train_loss": -12.363675117492676, "global_step": 303900, "epoch": 1808} {"train_loss": -12.024009704589844, "global_step": 303901, "epoch": 1808} {"train_loss": -12.246172904968262, "global_step": 303902, "epoch": 1808} {"train_loss": -12.223824501037598, "global_step": 303903, "epoch": 1808} {"train_loss": -12.118509292602539, "global_step": 303904, "epoch": 1808} {"train_loss": -12.07930850982666, "global_step": 303905, "epoch": 1808} {"train_loss": -12.454805374145508, "global_step": 303906, "epoch": 1808} {"train_loss": -12.273609161376953, "global_step": 303907, "epoch": 1808} {"train_loss": -12.301996231079102, "global_step": 303908, "epoch": 1808} {"train_loss": -12.400952339172363, "global_step": 303909, "epoch": 1808} {"train_loss": -12.203018188476562, "global_step": 303910, "epoch": 1808} {"train_loss": -11.745169809886388, "global_step": 303911, "epoch": 1808, "val_loss": 282257.28125} {"train_loss": -11.964998245239258, "global_step": 303912, "epoch": 1809} {"train_loss": -11.702781677246094, "global_step": 303913, "epoch": 1809} {"train_loss": -12.174627304077148, "global_step": 303914, "epoch": 1809} {"train_loss": -12.341970443725586, "global_step": 303915, "epoch": 1809} {"train_loss": -12.329814910888672, "global_step": 303916, "epoch": 1809} {"train_loss": -12.260207176208496, "global_step": 303917, "epoch": 1809} {"train_loss": -12.494587898254395, "global_step": 303918, "epoch": 1809} {"train_loss": -12.34345531463623, "global_step": 303919, "epoch": 1809} {"train_loss": -12.328065872192383, "global_step": 303920, "epoch": 1809} {"train_loss": -12.408137321472168, "global_step": 303921, "epoch": 1809} {"train_loss": -12.454326629638672, "global_step": 303922, "epoch": 1809} {"train_loss": -12.633892059326172, "global_step": 303923, "epoch": 1809} {"train_loss": -12.238081932067871, "global_step": 303924, "epoch": 1809} {"train_loss": -12.39394760131836, "global_step": 303925, "epoch": 1809} {"train_loss": -12.298099517822266, "global_step": 303926, "epoch": 1809} {"train_loss": -12.534319877624512, "global_step": 303927, "epoch": 1809} {"train_loss": -12.594873428344727, "global_step": 303928, "epoch": 1809} {"train_loss": -12.461162567138672, "global_step": 303929, "epoch": 1809} {"train_loss": -12.2022066116333, "global_step": 303930, "epoch": 1809} {"train_loss": -12.376132011413574, "global_step": 303931, "epoch": 1809} {"train_loss": -12.271672248840332, "global_step": 303932, "epoch": 1809} {"train_loss": -12.403681755065918, "global_step": 303933, "epoch": 1809} {"train_loss": -11.868135452270508, "global_step": 303934, "epoch": 1809} {"train_loss": -12.16048812866211, "global_step": 303935, "epoch": 1809} {"train_loss": -11.856450080871582, "global_step": 303936, "epoch": 1809} {"train_loss": -11.63099479675293, "global_step": 303937, "epoch": 1809} {"train_loss": -11.393564224243164, "global_step": 303938, "epoch": 1809} {"train_loss": -11.128473281860352, "global_step": 303939, "epoch": 1809} {"train_loss": -9.955818176269531, "global_step": 303940, "epoch": 1809} {"train_loss": -10.029218673706055, "global_step": 303941, "epoch": 1809} {"train_loss": -11.425710678100586, "global_step": 303942, "epoch": 1809} {"train_loss": -9.332406997680664, "global_step": 303943, "epoch": 1809} {"train_loss": -10.381120681762695, "global_step": 303944, "epoch": 1809} {"train_loss": -8.921606063842773, "global_step": 303945, "epoch": 1809} {"train_loss": -10.122032165527344, "global_step": 303946, "epoch": 1809} {"train_loss": -10.871683120727539, "global_step": 303947, "epoch": 1809} {"train_loss": -9.566487312316895, "global_step": 303948, "epoch": 1809} {"train_loss": -10.409043312072754, "global_step": 303949, "epoch": 1809} {"train_loss": -10.754058837890625, "global_step": 303950, "epoch": 1809} {"train_loss": -10.653491973876953, "global_step": 303951, "epoch": 1809} {"train_loss": -10.634382247924805, "global_step": 303952, "epoch": 1809} {"train_loss": -11.435857772827148, "global_step": 303953, "epoch": 1809} {"train_loss": -10.559898376464844, "global_step": 303954, "epoch": 1809} {"train_loss": -11.118112564086914, "global_step": 303955, "epoch": 1809} {"train_loss": -11.710491180419922, "global_step": 303956, "epoch": 1809} {"train_loss": -11.075525283813477, "global_step": 303957, "epoch": 1809} {"train_loss": -11.607572555541992, "global_step": 303958, "epoch": 1809} {"train_loss": -10.741578102111816, "global_step": 303959, "epoch": 1809} {"train_loss": -11.939363479614258, "global_step": 303960, "epoch": 1809} {"train_loss": -11.259434700012207, "global_step": 303961, "epoch": 1809} {"train_loss": -10.91032886505127, "global_step": 303962, "epoch": 1809} {"train_loss": -11.968667984008789, "global_step": 303963, "epoch": 1809} {"train_loss": -11.147624969482422, "global_step": 303964, "epoch": 1809} {"train_loss": -11.391075134277344, "global_step": 303965, "epoch": 1809} {"train_loss": -11.670233726501465, "global_step": 303966, "epoch": 1809} {"train_loss": -11.678467750549316, "global_step": 303967, "epoch": 1809} {"train_loss": -11.38194465637207, "global_step": 303968, "epoch": 1809} {"train_loss": -11.401302337646484, "global_step": 303969, "epoch": 1809} {"train_loss": -11.664620399475098, "global_step": 303970, "epoch": 1809} {"train_loss": -12.018084526062012, "global_step": 303971, "epoch": 1809} {"train_loss": -11.879871368408203, "global_step": 303972, "epoch": 1809} {"train_loss": -12.002716064453125, "global_step": 303973, "epoch": 1809} {"train_loss": -11.796642303466797, "global_step": 303974, "epoch": 1809} {"train_loss": -11.730476379394531, "global_step": 303975, "epoch": 1809} {"train_loss": -12.038970947265625, "global_step": 303976, "epoch": 1809} {"train_loss": -11.371844291687012, "global_step": 303977, "epoch": 1809} {"train_loss": -11.68686294555664, "global_step": 303978, "epoch": 1809} {"train_loss": -11.75394058227539, "global_step": 303979, "epoch": 1809} {"train_loss": -11.785419464111328, "global_step": 303980, "epoch": 1809} {"train_loss": -11.930129051208496, "global_step": 303981, "epoch": 1809} {"train_loss": -12.072975158691406, "global_step": 303982, "epoch": 1809} {"train_loss": -11.858969688415527, "global_step": 303983, "epoch": 1809} {"train_loss": -12.030044555664062, "global_step": 303984, "epoch": 1809} {"train_loss": -12.025777816772461, "global_step": 303985, "epoch": 1809} {"train_loss": -12.096853256225586, "global_step": 303986, "epoch": 1809} {"train_loss": -11.847637176513672, "global_step": 303987, "epoch": 1809} {"train_loss": -12.030034065246582, "global_step": 303988, "epoch": 1809} {"train_loss": -12.090963363647461, "global_step": 303989, "epoch": 1809} {"train_loss": -11.907899856567383, "global_step": 303990, "epoch": 1809} {"train_loss": -12.002181053161621, "global_step": 303991, "epoch": 1809} {"train_loss": -11.966180801391602, "global_step": 303992, "epoch": 1809} {"train_loss": -11.951009750366211, "global_step": 303993, "epoch": 1809} {"train_loss": -12.291304588317871, "global_step": 303994, "epoch": 1809} {"train_loss": -12.272086143493652, "global_step": 303995, "epoch": 1809} {"train_loss": -12.395493507385254, "global_step": 303996, "epoch": 1809} {"train_loss": -12.16408920288086, "global_step": 303997, "epoch": 1809} {"train_loss": -12.16723346710205, "global_step": 303998, "epoch": 1809} {"train_loss": -12.14963150024414, "global_step": 303999, "epoch": 1809} {"train_loss": -12.182647705078125, "global_step": 304000, "epoch": 1809} {"train_loss": -12.367448806762695, "global_step": 304001, "epoch": 1809} {"train_loss": -12.503402709960938, "global_step": 304002, "epoch": 1809} {"train_loss": -12.307918548583984, "global_step": 304003, "epoch": 1809} {"train_loss": -12.356252670288086, "global_step": 304004, "epoch": 1809} {"train_loss": -12.487445831298828, "global_step": 304005, "epoch": 1809} {"train_loss": -12.40550422668457, "global_step": 304006, "epoch": 1809} {"train_loss": -12.138773918151855, "global_step": 304007, "epoch": 1809} {"train_loss": -12.337479591369629, "global_step": 304008, "epoch": 1809} {"train_loss": -12.388099670410156, "global_step": 304009, "epoch": 1809} {"train_loss": -12.342101097106934, "global_step": 304010, "epoch": 1809} {"train_loss": -12.488064765930176, "global_step": 304011, "epoch": 1809} {"train_loss": -12.505900382995605, "global_step": 304012, "epoch": 1809} {"train_loss": -12.500479698181152, "global_step": 304013, "epoch": 1809} {"train_loss": -12.510658264160156, "global_step": 304014, "epoch": 1809} {"train_loss": -12.577332496643066, "global_step": 304015, "epoch": 1809} {"train_loss": -12.234794616699219, "global_step": 304016, "epoch": 1809} {"train_loss": -12.40570068359375, "global_step": 304017, "epoch": 1809} {"train_loss": -12.417999267578125, "global_step": 304018, "epoch": 1809} {"train_loss": -12.512969017028809, "global_step": 304019, "epoch": 1809} {"train_loss": -12.534931182861328, "global_step": 304020, "epoch": 1809} {"train_loss": -12.430265426635742, "global_step": 304021, "epoch": 1809} {"train_loss": -12.516331672668457, "global_step": 304022, "epoch": 1809} {"train_loss": -12.671640396118164, "global_step": 304023, "epoch": 1809} {"train_loss": -12.428062438964844, "global_step": 304024, "epoch": 1809} {"train_loss": -12.549850463867188, "global_step": 304025, "epoch": 1809} {"train_loss": -12.55125617980957, "global_step": 304026, "epoch": 1809} {"train_loss": -12.614768981933594, "global_step": 304027, "epoch": 1809} {"train_loss": -12.627694129943848, "global_step": 304028, "epoch": 1809} {"train_loss": -12.682329177856445, "global_step": 304029, "epoch": 1809} {"train_loss": -12.263522148132324, "global_step": 304030, "epoch": 1809} {"train_loss": -12.598020553588867, "global_step": 304031, "epoch": 1809} {"train_loss": -12.141825675964355, "global_step": 304032, "epoch": 1809} {"train_loss": -12.364009857177734, "global_step": 304033, "epoch": 1809} {"train_loss": -12.580801963806152, "global_step": 304034, "epoch": 1809} {"train_loss": -12.397817611694336, "global_step": 304035, "epoch": 1809} {"train_loss": -12.166109085083008, "global_step": 304036, "epoch": 1809} {"train_loss": -11.946515083312988, "global_step": 304037, "epoch": 1809} {"train_loss": -11.496194839477539, "global_step": 304038, "epoch": 1809} {"train_loss": -11.332436561584473, "global_step": 304039, "epoch": 1809} {"train_loss": -12.256378173828125, "global_step": 304040, "epoch": 1809} {"train_loss": -12.236307144165039, "global_step": 304041, "epoch": 1809} {"train_loss": -12.160118103027344, "global_step": 304042, "epoch": 1809} {"train_loss": -11.944509506225586, "global_step": 304043, "epoch": 1809} {"train_loss": -12.074665069580078, "global_step": 304044, "epoch": 1809} {"train_loss": -11.832036972045898, "global_step": 304045, "epoch": 1809} {"train_loss": -12.144246101379395, "global_step": 304046, "epoch": 1809} {"train_loss": -12.157387733459473, "global_step": 304047, "epoch": 1809} {"train_loss": -11.48604965209961, "global_step": 304048, "epoch": 1809} {"train_loss": -11.923168182373047, "global_step": 304049, "epoch": 1809} {"train_loss": -12.432559967041016, "global_step": 304050, "epoch": 1809} {"train_loss": -12.163565635681152, "global_step": 304051, "epoch": 1809} {"train_loss": -12.175858497619629, "global_step": 304052, "epoch": 1809} {"train_loss": -12.203722953796387, "global_step": 304053, "epoch": 1809} {"train_loss": -12.136013984680176, "global_step": 304054, "epoch": 1809} {"train_loss": -12.163881301879883, "global_step": 304055, "epoch": 1809} {"train_loss": -11.919941902160645, "global_step": 304056, "epoch": 1809} {"train_loss": -11.08728313446045, "global_step": 304057, "epoch": 1809} {"train_loss": -11.228683471679688, "global_step": 304058, "epoch": 1809} {"train_loss": -12.04473876953125, "global_step": 304059, "epoch": 1809} {"train_loss": -11.621969223022461, "global_step": 304060, "epoch": 1809} {"train_loss": -11.229297637939453, "global_step": 304061, "epoch": 1809} {"train_loss": -11.879485130310059, "global_step": 304062, "epoch": 1809} {"train_loss": -11.699033737182617, "global_step": 304063, "epoch": 1809} {"train_loss": -11.234288215637207, "global_step": 304064, "epoch": 1809} {"train_loss": -10.462540626525879, "global_step": 304065, "epoch": 1809} {"train_loss": -11.310922622680664, "global_step": 304066, "epoch": 1809} {"train_loss": -11.806575775146484, "global_step": 304067, "epoch": 1809} {"train_loss": -10.129167556762695, "global_step": 304068, "epoch": 1809} {"train_loss": -10.171398162841797, "global_step": 304069, "epoch": 1809} {"train_loss": -11.277830123901367, "global_step": 304070, "epoch": 1809} {"train_loss": -11.661737442016602, "global_step": 304071, "epoch": 1809} {"train_loss": -10.376479148864746, "global_step": 304072, "epoch": 1809} {"train_loss": -10.841014862060547, "global_step": 304073, "epoch": 1809} {"train_loss": -11.542062759399414, "global_step": 304074, "epoch": 1809} {"train_loss": -11.36831283569336, "global_step": 304075, "epoch": 1809} {"train_loss": -11.112982749938965, "global_step": 304076, "epoch": 1809} {"train_loss": -12.182415008544922, "global_step": 304077, "epoch": 1809} {"train_loss": -11.55947208404541, "global_step": 304078, "epoch": 1809} {"train_loss": -11.820967447190057, "global_step": 304079, "epoch": 1809, "val_loss": 279410.46875} {"train_loss": -11.388204574584961, "global_step": 304080, "epoch": 1810} {"train_loss": -11.955471992492676, "global_step": 304081, "epoch": 1810} {"train_loss": -11.623912811279297, "global_step": 304082, "epoch": 1810} {"train_loss": -10.859184265136719, "global_step": 304083, "epoch": 1810} {"train_loss": -11.401922225952148, "global_step": 304084, "epoch": 1810} {"train_loss": -11.443501472473145, "global_step": 304085, "epoch": 1810} {"train_loss": -10.694158554077148, "global_step": 304086, "epoch": 1810} {"train_loss": -11.622413635253906, "global_step": 304087, "epoch": 1810} {"train_loss": -10.713562965393066, "global_step": 304088, "epoch": 1810} {"train_loss": -11.247097969055176, "global_step": 304089, "epoch": 1810} {"train_loss": -10.749185562133789, "global_step": 304090, "epoch": 1810} {"train_loss": -11.665523529052734, "global_step": 304091, "epoch": 1810} {"train_loss": -10.750541687011719, "global_step": 304092, "epoch": 1810} {"train_loss": -11.837071418762207, "global_step": 304093, "epoch": 1810} {"train_loss": -10.824945449829102, "global_step": 304094, "epoch": 1810} {"train_loss": -11.271312713623047, "global_step": 304095, "epoch": 1810} {"train_loss": -11.307526588439941, "global_step": 304096, "epoch": 1810} {"train_loss": -11.164555549621582, "global_step": 304097, "epoch": 1810} {"train_loss": -11.31797981262207, "global_step": 304098, "epoch": 1810} {"train_loss": -10.745436668395996, "global_step": 304099, "epoch": 1810} {"train_loss": -11.557449340820312, "global_step": 304100, "epoch": 1810} {"train_loss": -10.970111846923828, "global_step": 304101, "epoch": 1810} {"train_loss": -11.842544555664062, "global_step": 304102, "epoch": 1810} {"train_loss": -11.120636940002441, "global_step": 304103, "epoch": 1810} {"train_loss": -12.10413932800293, "global_step": 304104, "epoch": 1810} {"train_loss": -11.497021675109863, "global_step": 304105, "epoch": 1810} {"train_loss": -11.678659439086914, "global_step": 304106, "epoch": 1810} {"train_loss": -11.78505802154541, "global_step": 304107, "epoch": 1810} {"train_loss": -11.59555435180664, "global_step": 304108, "epoch": 1810} {"train_loss": -11.464019775390625, "global_step": 304109, "epoch": 1810} {"train_loss": -11.414044380187988, "global_step": 304110, "epoch": 1810} {"train_loss": -11.568059921264648, "global_step": 304111, "epoch": 1810} {"train_loss": -11.61081314086914, "global_step": 304112, "epoch": 1810} {"train_loss": -11.617864608764648, "global_step": 304113, "epoch": 1810} {"train_loss": -12.046598434448242, "global_step": 304114, "epoch": 1810} {"train_loss": -12.002830505371094, "global_step": 304115, "epoch": 1810} {"train_loss": -12.164533615112305, "global_step": 304116, "epoch": 1810} {"train_loss": -11.690023422241211, "global_step": 304117, "epoch": 1810} {"train_loss": -12.008255004882812, "global_step": 304118, "epoch": 1810} {"train_loss": -12.227492332458496, "global_step": 304119, "epoch": 1810} {"train_loss": -11.74278736114502, "global_step": 304120, "epoch": 1810} {"train_loss": -11.232131958007812, "global_step": 304121, "epoch": 1810} {"train_loss": -11.681077003479004, "global_step": 304122, "epoch": 1810} {"train_loss": -12.02324104309082, "global_step": 304123, "epoch": 1810} {"train_loss": -11.679832458496094, "global_step": 304124, "epoch": 1810} {"train_loss": -11.769262313842773, "global_step": 304125, "epoch": 1810} {"train_loss": -11.997819900512695, "global_step": 304126, "epoch": 1810} {"train_loss": -11.59742546081543, "global_step": 304127, "epoch": 1810} {"train_loss": -11.943873405456543, "global_step": 304128, "epoch": 1810} {"train_loss": -12.131441116333008, "global_step": 304129, "epoch": 1810} {"train_loss": -11.720200538635254, "global_step": 304130, "epoch": 1810} {"train_loss": -12.250616073608398, "global_step": 304131, "epoch": 1810} {"train_loss": -11.558323860168457, "global_step": 304132, "epoch": 1810} {"train_loss": -11.745319366455078, "global_step": 304133, "epoch": 1810} {"train_loss": -12.103939056396484, "global_step": 304134, "epoch": 1810} {"train_loss": -11.649606704711914, "global_step": 304135, "epoch": 1810} {"train_loss": -12.047796249389648, "global_step": 304136, "epoch": 1810} {"train_loss": -11.862024307250977, "global_step": 304137, "epoch": 1810} {"train_loss": -11.725204467773438, "global_step": 304138, "epoch": 1810} {"train_loss": -11.947233200073242, "global_step": 304139, "epoch": 1810} {"train_loss": -12.058303833007812, "global_step": 304140, "epoch": 1810} {"train_loss": -12.16530704498291, "global_step": 304141, "epoch": 1810} {"train_loss": -12.367779731750488, "global_step": 304142, "epoch": 1810} {"train_loss": -12.139299392700195, "global_step": 304143, "epoch": 1810} {"train_loss": -12.230347633361816, "global_step": 304144, "epoch": 1810} {"train_loss": -12.069318771362305, "global_step": 304145, "epoch": 1810} {"train_loss": -12.182352066040039, "global_step": 304146, "epoch": 1810} {"train_loss": -12.230984687805176, "global_step": 304147, "epoch": 1810} {"train_loss": -12.112676620483398, "global_step": 304148, "epoch": 1810} {"train_loss": -12.161321640014648, "global_step": 304149, "epoch": 1810} {"train_loss": -12.26334285736084, "global_step": 304150, "epoch": 1810} {"train_loss": -12.245179176330566, "global_step": 304151, "epoch": 1810} {"train_loss": -12.357587814331055, "global_step": 304152, "epoch": 1810} {"train_loss": -12.213915824890137, "global_step": 304153, "epoch": 1810} {"train_loss": -12.31037712097168, "global_step": 304154, "epoch": 1810} {"train_loss": -12.070956230163574, "global_step": 304155, "epoch": 1810} {"train_loss": -12.028045654296875, "global_step": 304156, "epoch": 1810} {"train_loss": -12.278360366821289, "global_step": 304157, "epoch": 1810} {"train_loss": -11.95083236694336, "global_step": 304158, "epoch": 1810} {"train_loss": -12.015748977661133, "global_step": 304159, "epoch": 1810} {"train_loss": -12.326574325561523, "global_step": 304160, "epoch": 1810} {"train_loss": -11.996506690979004, "global_step": 304161, "epoch": 1810} {"train_loss": -12.121236801147461, "global_step": 304162, "epoch": 1810} {"train_loss": -12.046133995056152, "global_step": 304163, "epoch": 1810} {"train_loss": -12.028368949890137, "global_step": 304164, "epoch": 1810} {"train_loss": -12.18297004699707, "global_step": 304165, "epoch": 1810} {"train_loss": -12.15812873840332, "global_step": 304166, "epoch": 1810} {"train_loss": -12.131082534790039, "global_step": 304167, "epoch": 1810} {"train_loss": -11.982780456542969, "global_step": 304168, "epoch": 1810} {"train_loss": -12.008598327636719, "global_step": 304169, "epoch": 1810} {"train_loss": -12.518314361572266, "global_step": 304170, "epoch": 1810} {"train_loss": -12.20435905456543, "global_step": 304171, "epoch": 1810} {"train_loss": -12.276822090148926, "global_step": 304172, "epoch": 1810} {"train_loss": -11.84384536743164, "global_step": 304173, "epoch": 1810} {"train_loss": -12.156320571899414, "global_step": 304174, "epoch": 1810} {"train_loss": -12.027435302734375, "global_step": 304175, "epoch": 1810} {"train_loss": -11.982694625854492, "global_step": 304176, "epoch": 1810} {"train_loss": -11.724712371826172, "global_step": 304177, "epoch": 1810} {"train_loss": -12.217924118041992, "global_step": 304178, "epoch": 1810} {"train_loss": -11.658082008361816, "global_step": 304179, "epoch": 1810} {"train_loss": -11.667033195495605, "global_step": 304180, "epoch": 1810} {"train_loss": -11.53399658203125, "global_step": 304181, "epoch": 1810} {"train_loss": -11.897867202758789, "global_step": 304182, "epoch": 1810} {"train_loss": -12.04234790802002, "global_step": 304183, "epoch": 1810} {"train_loss": -11.548032760620117, "global_step": 304184, "epoch": 1810} {"train_loss": -12.424720764160156, "global_step": 304185, "epoch": 1810} {"train_loss": -12.34096908569336, "global_step": 304186, "epoch": 1810} {"train_loss": -12.090049743652344, "global_step": 304187, "epoch": 1810} {"train_loss": -11.913354873657227, "global_step": 304188, "epoch": 1810} {"train_loss": -12.261236190795898, "global_step": 304189, "epoch": 1810} {"train_loss": -11.683499336242676, "global_step": 304190, "epoch": 1810} {"train_loss": -11.772652626037598, "global_step": 304191, "epoch": 1810} {"train_loss": -11.929829597473145, "global_step": 304192, "epoch": 1810} {"train_loss": -11.655657768249512, "global_step": 304193, "epoch": 1810} {"train_loss": -11.962089538574219, "global_step": 304194, "epoch": 1810} {"train_loss": -11.759601593017578, "global_step": 304195, "epoch": 1810} {"train_loss": -11.827737808227539, "global_step": 304196, "epoch": 1810} {"train_loss": -11.050546646118164, "global_step": 304197, "epoch": 1810} {"train_loss": -11.66585636138916, "global_step": 304198, "epoch": 1810} {"train_loss": -12.20124626159668, "global_step": 304199, "epoch": 1810} {"train_loss": -11.868377685546875, "global_step": 304200, "epoch": 1810} {"train_loss": -12.060523986816406, "global_step": 304201, "epoch": 1810} {"train_loss": -12.235930442810059, "global_step": 304202, "epoch": 1810} {"train_loss": -11.8117036819458, "global_step": 304203, "epoch": 1810} {"train_loss": -12.376456260681152, "global_step": 304204, "epoch": 1810} {"train_loss": -11.703116416931152, "global_step": 304205, "epoch": 1810} {"train_loss": -12.075626373291016, "global_step": 304206, "epoch": 1810} {"train_loss": -11.956100463867188, "global_step": 304207, "epoch": 1810} {"train_loss": -12.246528625488281, "global_step": 304208, "epoch": 1810} {"train_loss": -12.248235702514648, "global_step": 304209, "epoch": 1810} {"train_loss": -12.001443862915039, "global_step": 304210, "epoch": 1810} {"train_loss": -11.64042854309082, "global_step": 304211, "epoch": 1810} {"train_loss": -12.160548210144043, "global_step": 304212, "epoch": 1810} {"train_loss": -12.196542739868164, "global_step": 304213, "epoch": 1810} {"train_loss": -11.506690979003906, "global_step": 304214, "epoch": 1810} {"train_loss": -12.187178611755371, "global_step": 304215, "epoch": 1810} {"train_loss": -11.941904067993164, "global_step": 304216, "epoch": 1810} {"train_loss": -11.883340835571289, "global_step": 304217, "epoch": 1810} {"train_loss": -11.843622207641602, "global_step": 304218, "epoch": 1810} {"train_loss": -12.079237937927246, "global_step": 304219, "epoch": 1810} {"train_loss": -11.771200180053711, "global_step": 304220, "epoch": 1810} {"train_loss": -11.927900314331055, "global_step": 304221, "epoch": 1810} {"train_loss": -12.21302604675293, "global_step": 304222, "epoch": 1810} {"train_loss": -11.79653549194336, "global_step": 304223, "epoch": 1810} {"train_loss": -11.910083770751953, "global_step": 304224, "epoch": 1810} {"train_loss": -11.737557411193848, "global_step": 304225, "epoch": 1810} {"train_loss": -10.288145065307617, "global_step": 304226, "epoch": 1810} {"train_loss": -11.632829666137695, "global_step": 304227, "epoch": 1810} {"train_loss": -11.8326997756958, "global_step": 304228, "epoch": 1810} {"train_loss": -11.75674057006836, "global_step": 304229, "epoch": 1810} {"train_loss": -12.016827583312988, "global_step": 304230, "epoch": 1810} {"train_loss": -11.710780143737793, "global_step": 304231, "epoch": 1810} {"train_loss": -11.937811851501465, "global_step": 304232, "epoch": 1810} {"train_loss": -11.828689575195312, "global_step": 304233, "epoch": 1810} {"train_loss": -11.277588844299316, "global_step": 304234, "epoch": 1810} {"train_loss": -11.09550666809082, "global_step": 304235, "epoch": 1810} {"train_loss": -12.271842956542969, "global_step": 304236, "epoch": 1810} {"train_loss": -10.81041145324707, "global_step": 304237, "epoch": 1810} {"train_loss": -10.472148895263672, "global_step": 304238, "epoch": 1810} {"train_loss": -11.450398445129395, "global_step": 304239, "epoch": 1810} {"train_loss": -11.10796070098877, "global_step": 304240, "epoch": 1810} {"train_loss": -11.280458450317383, "global_step": 304241, "epoch": 1810} {"train_loss": -11.519014358520508, "global_step": 304242, "epoch": 1810} {"train_loss": -11.059739112854004, "global_step": 304243, "epoch": 1810} {"train_loss": -10.850497245788574, "global_step": 304244, "epoch": 1810} {"train_loss": -10.426276206970215, "global_step": 304245, "epoch": 1810} {"train_loss": -10.036590576171875, "global_step": 304246, "epoch": 1810} {"train_loss": -11.76821946530115, "global_step": 304247, "epoch": 1810, "val_loss": 280107.75, "train_action_mse_error": 1.1640483140945435} {"train_loss": -11.371175765991211, "global_step": 304248, "epoch": 1811} {"train_loss": -11.134668350219727, "global_step": 304249, "epoch": 1811} {"train_loss": -11.082313537597656, "global_step": 304250, "epoch": 1811} {"train_loss": -10.557934761047363, "global_step": 304251, "epoch": 1811} {"train_loss": -11.600651741027832, "global_step": 304252, "epoch": 1811} {"train_loss": -10.968059539794922, "global_step": 304253, "epoch": 1811} {"train_loss": -11.26020336151123, "global_step": 304254, "epoch": 1811} {"train_loss": -10.813936233520508, "global_step": 304255, "epoch": 1811} {"train_loss": -11.828621864318848, "global_step": 304256, "epoch": 1811} {"train_loss": -11.47027587890625, "global_step": 304257, "epoch": 1811} {"train_loss": -11.90948486328125, "global_step": 304258, "epoch": 1811} {"train_loss": -11.722105979919434, "global_step": 304259, "epoch": 1811} {"train_loss": -11.592923164367676, "global_step": 304260, "epoch": 1811} {"train_loss": -11.948866844177246, "global_step": 304261, "epoch": 1811} {"train_loss": -12.016648292541504, "global_step": 304262, "epoch": 1811} {"train_loss": -12.147062301635742, "global_step": 304263, "epoch": 1811} {"train_loss": -12.126693725585938, "global_step": 304264, "epoch": 1811} {"train_loss": -12.079460144042969, "global_step": 304265, "epoch": 1811} {"train_loss": -11.934271812438965, "global_step": 304266, "epoch": 1811} {"train_loss": -11.885692596435547, "global_step": 304267, "epoch": 1811} {"train_loss": -12.195253372192383, "global_step": 304268, "epoch": 1811} {"train_loss": -11.77358341217041, "global_step": 304269, "epoch": 1811} {"train_loss": -12.095426559448242, "global_step": 304270, "epoch": 1811} {"train_loss": -11.938642501831055, "global_step": 304271, "epoch": 1811} {"train_loss": -12.028345108032227, "global_step": 304272, "epoch": 1811} {"train_loss": -12.031389236450195, "global_step": 304273, "epoch": 1811} {"train_loss": -12.29820442199707, "global_step": 304274, "epoch": 1811} {"train_loss": -12.038494110107422, "global_step": 304275, "epoch": 1811} {"train_loss": -11.922035217285156, "global_step": 304276, "epoch": 1811} {"train_loss": -11.84475040435791, "global_step": 304277, "epoch": 1811} {"train_loss": -12.248013496398926, "global_step": 304278, "epoch": 1811} {"train_loss": -12.397317886352539, "global_step": 304279, "epoch": 1811} {"train_loss": -12.076972961425781, "global_step": 304280, "epoch": 1811} {"train_loss": -12.467575073242188, "global_step": 304281, "epoch": 1811} {"train_loss": -11.916467666625977, "global_step": 304282, "epoch": 1811} {"train_loss": -12.285917282104492, "global_step": 304283, "epoch": 1811} {"train_loss": -12.102880477905273, "global_step": 304284, "epoch": 1811} {"train_loss": -12.284780502319336, "global_step": 304285, "epoch": 1811} {"train_loss": -12.465757369995117, "global_step": 304286, "epoch": 1811} {"train_loss": -11.986845016479492, "global_step": 304287, "epoch": 1811} {"train_loss": -12.254117965698242, "global_step": 304288, "epoch": 1811} {"train_loss": -12.557512283325195, "global_step": 304289, "epoch": 1811} {"train_loss": -12.299065589904785, "global_step": 304290, "epoch": 1811} {"train_loss": -12.405479431152344, "global_step": 304291, "epoch": 1811} {"train_loss": -12.353827476501465, "global_step": 304292, "epoch": 1811} {"train_loss": -12.320929527282715, "global_step": 304293, "epoch": 1811} {"train_loss": -12.247188568115234, "global_step": 304294, "epoch": 1811} {"train_loss": -12.070212364196777, "global_step": 304295, "epoch": 1811} {"train_loss": -12.326345443725586, "global_step": 304296, "epoch": 1811} {"train_loss": -12.39877700805664, "global_step": 304297, "epoch": 1811} {"train_loss": -12.364683151245117, "global_step": 304298, "epoch": 1811} {"train_loss": -12.392751693725586, "global_step": 304299, "epoch": 1811} {"train_loss": -12.422361373901367, "global_step": 304300, "epoch": 1811} {"train_loss": -12.501546859741211, "global_step": 304301, "epoch": 1811} {"train_loss": -12.045943260192871, "global_step": 304302, "epoch": 1811} {"train_loss": -12.439754486083984, "global_step": 304303, "epoch": 1811} {"train_loss": -12.457931518554688, "global_step": 304304, "epoch": 1811} {"train_loss": -12.317678451538086, "global_step": 304305, "epoch": 1811} {"train_loss": -12.64155387878418, "global_step": 304306, "epoch": 1811} {"train_loss": -12.392207145690918, "global_step": 304307, "epoch": 1811} {"train_loss": -12.332637786865234, "global_step": 304308, "epoch": 1811} {"train_loss": -12.534168243408203, "global_step": 304309, "epoch": 1811} {"train_loss": -12.487312316894531, "global_step": 304310, "epoch": 1811} {"train_loss": -12.251814842224121, "global_step": 304311, "epoch": 1811} {"train_loss": -12.153509140014648, "global_step": 304312, "epoch": 1811} {"train_loss": -12.432821273803711, "global_step": 304313, "epoch": 1811} {"train_loss": -12.305347442626953, "global_step": 304314, "epoch": 1811} {"train_loss": -12.164774894714355, "global_step": 304315, "epoch": 1811} {"train_loss": -12.272542953491211, "global_step": 304316, "epoch": 1811} {"train_loss": -12.332209587097168, "global_step": 304317, "epoch": 1811} {"train_loss": -12.4156494140625, "global_step": 304318, "epoch": 1811} {"train_loss": -12.352614402770996, "global_step": 304319, "epoch": 1811} {"train_loss": -12.38206672668457, "global_step": 304320, "epoch": 1811} {"train_loss": -12.705768585205078, "global_step": 304321, "epoch": 1811} {"train_loss": -12.331530570983887, "global_step": 304322, "epoch": 1811} {"train_loss": -12.607705116271973, "global_step": 304323, "epoch": 1811} {"train_loss": -12.575555801391602, "global_step": 304324, "epoch": 1811} {"train_loss": -12.595563888549805, "global_step": 304325, "epoch": 1811} {"train_loss": -12.371576309204102, "global_step": 304326, "epoch": 1811} {"train_loss": -12.036125183105469, "global_step": 304327, "epoch": 1811} {"train_loss": -12.062699317932129, "global_step": 304328, "epoch": 1811} {"train_loss": -12.104253768920898, "global_step": 304329, "epoch": 1811} {"train_loss": -12.246826171875, "global_step": 304330, "epoch": 1811} {"train_loss": -11.905527114868164, "global_step": 304331, "epoch": 1811} {"train_loss": -12.428888320922852, "global_step": 304332, "epoch": 1811} {"train_loss": -11.985311508178711, "global_step": 304333, "epoch": 1811} {"train_loss": -11.284751892089844, "global_step": 304334, "epoch": 1811} {"train_loss": -10.869050025939941, "global_step": 304335, "epoch": 1811} {"train_loss": -12.220447540283203, "global_step": 304336, "epoch": 1811} {"train_loss": -11.598896980285645, "global_step": 304337, "epoch": 1811} {"train_loss": -10.631807327270508, "global_step": 304338, "epoch": 1811} {"train_loss": -11.18005084991455, "global_step": 304339, "epoch": 1811} {"train_loss": -10.805244445800781, "global_step": 304340, "epoch": 1811} {"train_loss": -10.653623580932617, "global_step": 304341, "epoch": 1811} {"train_loss": -11.397111892700195, "global_step": 304342, "epoch": 1811} {"train_loss": -11.638972282409668, "global_step": 304343, "epoch": 1811} {"train_loss": -11.702217102050781, "global_step": 304344, "epoch": 1811} {"train_loss": -12.07540225982666, "global_step": 304345, "epoch": 1811} {"train_loss": -10.684016227722168, "global_step": 304346, "epoch": 1811} {"train_loss": -10.395797729492188, "global_step": 304347, "epoch": 1811} {"train_loss": -11.32772445678711, "global_step": 304348, "epoch": 1811} {"train_loss": -8.57676887512207, "global_step": 304349, "epoch": 1811} {"train_loss": -10.33698844909668, "global_step": 304350, "epoch": 1811} {"train_loss": -11.03689193725586, "global_step": 304351, "epoch": 1811} {"train_loss": -10.89857292175293, "global_step": 304352, "epoch": 1811} {"train_loss": -11.15794563293457, "global_step": 304353, "epoch": 1811} {"train_loss": -10.663861274719238, "global_step": 304354, "epoch": 1811} {"train_loss": -11.61451244354248, "global_step": 304355, "epoch": 1811} {"train_loss": -10.689603805541992, "global_step": 304356, "epoch": 1811} {"train_loss": -11.045389175415039, "global_step": 304357, "epoch": 1811} {"train_loss": -11.281563758850098, "global_step": 304358, "epoch": 1811} {"train_loss": -9.601003646850586, "global_step": 304359, "epoch": 1811} {"train_loss": -10.738969802856445, "global_step": 304360, "epoch": 1811} {"train_loss": -10.257492065429688, "global_step": 304361, "epoch": 1811} {"train_loss": -9.510496139526367, "global_step": 304362, "epoch": 1811} {"train_loss": -10.019182205200195, "global_step": 304363, "epoch": 1811} {"train_loss": -10.751312255859375, "global_step": 304364, "epoch": 1811} {"train_loss": -9.721699714660645, "global_step": 304365, "epoch": 1811} {"train_loss": -11.270795822143555, "global_step": 304366, "epoch": 1811} {"train_loss": -11.080436706542969, "global_step": 304367, "epoch": 1811} {"train_loss": -11.028812408447266, "global_step": 304368, "epoch": 1811} {"train_loss": -11.333404541015625, "global_step": 304369, "epoch": 1811} {"train_loss": -10.947031021118164, "global_step": 304370, "epoch": 1811} {"train_loss": -11.725345611572266, "global_step": 304371, "epoch": 1811} {"train_loss": -10.795208930969238, "global_step": 304372, "epoch": 1811} {"train_loss": -11.736886978149414, "global_step": 304373, "epoch": 1811} {"train_loss": -10.822174072265625, "global_step": 304374, "epoch": 1811} {"train_loss": -10.963807106018066, "global_step": 304375, "epoch": 1811} {"train_loss": -11.35204029083252, "global_step": 304376, "epoch": 1811} {"train_loss": -10.421026229858398, "global_step": 304377, "epoch": 1811} {"train_loss": -10.975590705871582, "global_step": 304378, "epoch": 1811} {"train_loss": -11.532153129577637, "global_step": 304379, "epoch": 1811} {"train_loss": -11.145196914672852, "global_step": 304380, "epoch": 1811} {"train_loss": -11.63170051574707, "global_step": 304381, "epoch": 1811} {"train_loss": -11.787887573242188, "global_step": 304382, "epoch": 1811} {"train_loss": -11.008651733398438, "global_step": 304383, "epoch": 1811} {"train_loss": -11.586118698120117, "global_step": 304384, "epoch": 1811} {"train_loss": -11.605561256408691, "global_step": 304385, "epoch": 1811} {"train_loss": -11.351064682006836, "global_step": 304386, "epoch": 1811} {"train_loss": -11.412151336669922, "global_step": 304387, "epoch": 1811} {"train_loss": -11.96273136138916, "global_step": 304388, "epoch": 1811} {"train_loss": -11.767717361450195, "global_step": 304389, "epoch": 1811} {"train_loss": -11.8245849609375, "global_step": 304390, "epoch": 1811} {"train_loss": -11.931644439697266, "global_step": 304391, "epoch": 1811} {"train_loss": -11.85012435913086, "global_step": 304392, "epoch": 1811} {"train_loss": -11.847536087036133, "global_step": 304393, "epoch": 1811} {"train_loss": -11.984121322631836, "global_step": 304394, "epoch": 1811} {"train_loss": -11.937829971313477, "global_step": 304395, "epoch": 1811} {"train_loss": -12.082149505615234, "global_step": 304396, "epoch": 1811} {"train_loss": -11.95252513885498, "global_step": 304397, "epoch": 1811} {"train_loss": -11.785443305969238, "global_step": 304398, "epoch": 1811} {"train_loss": -12.217443466186523, "global_step": 304399, "epoch": 1811} {"train_loss": -11.837793350219727, "global_step": 304400, "epoch": 1811} {"train_loss": -11.960267066955566, "global_step": 304401, "epoch": 1811} {"train_loss": -11.668869018554688, "global_step": 304402, "epoch": 1811} {"train_loss": -11.771519660949707, "global_step": 304403, "epoch": 1811} {"train_loss": -11.85595989227295, "global_step": 304404, "epoch": 1811} {"train_loss": -12.004648208618164, "global_step": 304405, "epoch": 1811} {"train_loss": -11.998186111450195, "global_step": 304406, "epoch": 1811} {"train_loss": -12.106013298034668, "global_step": 304407, "epoch": 1811} {"train_loss": -11.896074295043945, "global_step": 304408, "epoch": 1811} {"train_loss": -12.194910049438477, "global_step": 304409, "epoch": 1811} {"train_loss": -11.951604843139648, "global_step": 304410, "epoch": 1811} {"train_loss": -12.233123779296875, "global_step": 304411, "epoch": 1811} {"train_loss": -11.959218978881836, "global_step": 304412, "epoch": 1811} {"train_loss": -12.206356048583984, "global_step": 304413, "epoch": 1811} {"train_loss": -12.002132415771484, "global_step": 304414, "epoch": 1811} {"train_loss": -11.728140882083348, "global_step": 304415, "epoch": 1811, "val_loss": 279962.1875} {"train_loss": -11.798700332641602, "global_step": 304416, "epoch": 1812} {"train_loss": -12.283187866210938, "global_step": 304417, "epoch": 1812} {"train_loss": -12.040696144104004, "global_step": 304418, "epoch": 1812} {"train_loss": -12.242815971374512, "global_step": 304419, "epoch": 1812} {"train_loss": -12.273321151733398, "global_step": 304420, "epoch": 1812} {"train_loss": -12.387207984924316, "global_step": 304421, "epoch": 1812} {"train_loss": -12.090753555297852, "global_step": 304422, "epoch": 1812} {"train_loss": -12.317604064941406, "global_step": 304423, "epoch": 1812} {"train_loss": -12.07634162902832, "global_step": 304424, "epoch": 1812} {"train_loss": -11.907814025878906, "global_step": 304425, "epoch": 1812} {"train_loss": -12.013534545898438, "global_step": 304426, "epoch": 1812} {"train_loss": -12.23543930053711, "global_step": 304427, "epoch": 1812} {"train_loss": -11.756360054016113, "global_step": 304428, "epoch": 1812} {"train_loss": -12.187328338623047, "global_step": 304429, "epoch": 1812} {"train_loss": -11.653047561645508, "global_step": 304430, "epoch": 1812} {"train_loss": -12.013833045959473, "global_step": 304431, "epoch": 1812} {"train_loss": -11.725610733032227, "global_step": 304432, "epoch": 1812} {"train_loss": -12.037071228027344, "global_step": 304433, "epoch": 1812} {"train_loss": -11.393548965454102, "global_step": 304434, "epoch": 1812} {"train_loss": -12.10110855102539, "global_step": 304435, "epoch": 1812} {"train_loss": -11.863744735717773, "global_step": 304436, "epoch": 1812} {"train_loss": -11.812726974487305, "global_step": 304437, "epoch": 1812} {"train_loss": -12.103813171386719, "global_step": 304438, "epoch": 1812} {"train_loss": -12.000890731811523, "global_step": 304439, "epoch": 1812} {"train_loss": -12.137636184692383, "global_step": 304440, "epoch": 1812} {"train_loss": -11.99693489074707, "global_step": 304441, "epoch": 1812} {"train_loss": -11.994034767150879, "global_step": 304442, "epoch": 1812} {"train_loss": -12.070579528808594, "global_step": 304443, "epoch": 1812} {"train_loss": -12.209632873535156, "global_step": 304444, "epoch": 1812} {"train_loss": -12.176351547241211, "global_step": 304445, "epoch": 1812} {"train_loss": -12.173782348632812, "global_step": 304446, "epoch": 1812} {"train_loss": -12.30015754699707, "global_step": 304447, "epoch": 1812} {"train_loss": -12.274003982543945, "global_step": 304448, "epoch": 1812} {"train_loss": -12.112041473388672, "global_step": 304449, "epoch": 1812} {"train_loss": -12.264898300170898, "global_step": 304450, "epoch": 1812} {"train_loss": -12.434927940368652, "global_step": 304451, "epoch": 1812} {"train_loss": -11.813705444335938, "global_step": 304452, "epoch": 1812} {"train_loss": -11.869690895080566, "global_step": 304453, "epoch": 1812} {"train_loss": -11.842182159423828, "global_step": 304454, "epoch": 1812} {"train_loss": -12.217233657836914, "global_step": 304455, "epoch": 1812} {"train_loss": -11.60887336730957, "global_step": 304456, "epoch": 1812} {"train_loss": -11.641721725463867, "global_step": 304457, "epoch": 1812} {"train_loss": -11.82198429107666, "global_step": 304458, "epoch": 1812} {"train_loss": -12.295427322387695, "global_step": 304459, "epoch": 1812} {"train_loss": -12.186153411865234, "global_step": 304460, "epoch": 1812} {"train_loss": -11.67349624633789, "global_step": 304461, "epoch": 1812} {"train_loss": -12.378927230834961, "global_step": 304462, "epoch": 1812} {"train_loss": -11.936076164245605, "global_step": 304463, "epoch": 1812} {"train_loss": -11.520556449890137, "global_step": 304464, "epoch": 1812} {"train_loss": -11.868252754211426, "global_step": 304465, "epoch": 1812} {"train_loss": -12.089254379272461, "global_step": 304466, "epoch": 1812} {"train_loss": -11.8460111618042, "global_step": 304467, "epoch": 1812} {"train_loss": -11.832375526428223, "global_step": 304468, "epoch": 1812} {"train_loss": -11.700021743774414, "global_step": 304469, "epoch": 1812} {"train_loss": -10.766393661499023, "global_step": 304470, "epoch": 1812} {"train_loss": -12.033565521240234, "global_step": 304471, "epoch": 1812} {"train_loss": -11.074039459228516, "global_step": 304472, "epoch": 1812} {"train_loss": -11.362396240234375, "global_step": 304473, "epoch": 1812} {"train_loss": -11.981874465942383, "global_step": 304474, "epoch": 1812} {"train_loss": -11.240280151367188, "global_step": 304475, "epoch": 1812} {"train_loss": -11.83941650390625, "global_step": 304476, "epoch": 1812} {"train_loss": -10.749048233032227, "global_step": 304477, "epoch": 1812} {"train_loss": -11.312944412231445, "global_step": 304478, "epoch": 1812} {"train_loss": -11.314619064331055, "global_step": 304479, "epoch": 1812} {"train_loss": -10.418476104736328, "global_step": 304480, "epoch": 1812} {"train_loss": -12.01716423034668, "global_step": 304481, "epoch": 1812} {"train_loss": -10.35527229309082, "global_step": 304482, "epoch": 1812} {"train_loss": -11.564066886901855, "global_step": 304483, "epoch": 1812} {"train_loss": -11.73933219909668, "global_step": 304484, "epoch": 1812} {"train_loss": -11.248291969299316, "global_step": 304485, "epoch": 1812} {"train_loss": -12.003072738647461, "global_step": 304486, "epoch": 1812} {"train_loss": -10.837024688720703, "global_step": 304487, "epoch": 1812} {"train_loss": -11.652376174926758, "global_step": 304488, "epoch": 1812} {"train_loss": -11.669415473937988, "global_step": 304489, "epoch": 1812} {"train_loss": -11.343174934387207, "global_step": 304490, "epoch": 1812} {"train_loss": -11.730317115783691, "global_step": 304491, "epoch": 1812} {"train_loss": -11.746875762939453, "global_step": 304492, "epoch": 1812} {"train_loss": -11.378011703491211, "global_step": 304493, "epoch": 1812} {"train_loss": -11.948134422302246, "global_step": 304494, "epoch": 1812} {"train_loss": -11.896173477172852, "global_step": 304495, "epoch": 1812} {"train_loss": -11.901808738708496, "global_step": 304496, "epoch": 1812} {"train_loss": -12.177124977111816, "global_step": 304497, "epoch": 1812} {"train_loss": -11.651628494262695, "global_step": 304498, "epoch": 1812} {"train_loss": -12.13231086730957, "global_step": 304499, "epoch": 1812} {"train_loss": -11.83984375, "global_step": 304500, "epoch": 1812} {"train_loss": -11.868523597717285, "global_step": 304501, "epoch": 1812} {"train_loss": -12.16847038269043, "global_step": 304502, "epoch": 1812} {"train_loss": -11.849262237548828, "global_step": 304503, "epoch": 1812} {"train_loss": -11.834718704223633, "global_step": 304504, "epoch": 1812} {"train_loss": -11.96395206451416, "global_step": 304505, "epoch": 1812} {"train_loss": -12.060583114624023, "global_step": 304506, "epoch": 1812} {"train_loss": -11.887581825256348, "global_step": 304507, "epoch": 1812} {"train_loss": -12.19978141784668, "global_step": 304508, "epoch": 1812} {"train_loss": -12.253935813903809, "global_step": 304509, "epoch": 1812} {"train_loss": -12.240999221801758, "global_step": 304510, "epoch": 1812} {"train_loss": -12.177107810974121, "global_step": 304511, "epoch": 1812} {"train_loss": -12.251825332641602, "global_step": 304512, "epoch": 1812} {"train_loss": -12.258878707885742, "global_step": 304513, "epoch": 1812} {"train_loss": -12.307594299316406, "global_step": 304514, "epoch": 1812} {"train_loss": -12.2255277633667, "global_step": 304515, "epoch": 1812} {"train_loss": -12.315528869628906, "global_step": 304516, "epoch": 1812} {"train_loss": -12.281295776367188, "global_step": 304517, "epoch": 1812} {"train_loss": -12.253254890441895, "global_step": 304518, "epoch": 1812} {"train_loss": -12.319684028625488, "global_step": 304519, "epoch": 1812} {"train_loss": -12.173248291015625, "global_step": 304520, "epoch": 1812} {"train_loss": -12.269462585449219, "global_step": 304521, "epoch": 1812} {"train_loss": -12.06293773651123, "global_step": 304522, "epoch": 1812} {"train_loss": -12.255777359008789, "global_step": 304523, "epoch": 1812} {"train_loss": -11.905353546142578, "global_step": 304524, "epoch": 1812} {"train_loss": -11.635757446289062, "global_step": 304525, "epoch": 1812} {"train_loss": -12.16065502166748, "global_step": 304526, "epoch": 1812} {"train_loss": -12.376679420471191, "global_step": 304527, "epoch": 1812} {"train_loss": -11.992595672607422, "global_step": 304528, "epoch": 1812} {"train_loss": -12.547276496887207, "global_step": 304529, "epoch": 1812} {"train_loss": -12.188457489013672, "global_step": 304530, "epoch": 1812} {"train_loss": -12.246152877807617, "global_step": 304531, "epoch": 1812} {"train_loss": -12.365471839904785, "global_step": 304532, "epoch": 1812} {"train_loss": -11.879636764526367, "global_step": 304533, "epoch": 1812} {"train_loss": -12.401529312133789, "global_step": 304534, "epoch": 1812} {"train_loss": -11.42535400390625, "global_step": 304535, "epoch": 1812} {"train_loss": -11.442100524902344, "global_step": 304536, "epoch": 1812} {"train_loss": -12.182355880737305, "global_step": 304537, "epoch": 1812} {"train_loss": -11.994084358215332, "global_step": 304538, "epoch": 1812} {"train_loss": -11.071922302246094, "global_step": 304539, "epoch": 1812} {"train_loss": -12.210331916809082, "global_step": 304540, "epoch": 1812} {"train_loss": -10.354276657104492, "global_step": 304541, "epoch": 1812} {"train_loss": -12.018267631530762, "global_step": 304542, "epoch": 1812} {"train_loss": -10.762725830078125, "global_step": 304543, "epoch": 1812} {"train_loss": -11.270000457763672, "global_step": 304544, "epoch": 1812} {"train_loss": -12.06272029876709, "global_step": 304545, "epoch": 1812} {"train_loss": -10.817520141601562, "global_step": 304546, "epoch": 1812} {"train_loss": -11.434131622314453, "global_step": 304547, "epoch": 1812} {"train_loss": -11.495418548583984, "global_step": 304548, "epoch": 1812} {"train_loss": -10.373259544372559, "global_step": 304549, "epoch": 1812} {"train_loss": -10.676742553710938, "global_step": 304550, "epoch": 1812} {"train_loss": -10.905980110168457, "global_step": 304551, "epoch": 1812} {"train_loss": -11.757615089416504, "global_step": 304552, "epoch": 1812} {"train_loss": -10.480182647705078, "global_step": 304553, "epoch": 1812} {"train_loss": -10.955324172973633, "global_step": 304554, "epoch": 1812} {"train_loss": -9.807781219482422, "global_step": 304555, "epoch": 1812} {"train_loss": -10.224274635314941, "global_step": 304556, "epoch": 1812} {"train_loss": -11.577136993408203, "global_step": 304557, "epoch": 1812} {"train_loss": -11.411001205444336, "global_step": 304558, "epoch": 1812} {"train_loss": -11.476381301879883, "global_step": 304559, "epoch": 1812} {"train_loss": -11.604509353637695, "global_step": 304560, "epoch": 1812} {"train_loss": -11.121535301208496, "global_step": 304561, "epoch": 1812} {"train_loss": -11.139900207519531, "global_step": 304562, "epoch": 1812} {"train_loss": -12.018198013305664, "global_step": 304563, "epoch": 1812} {"train_loss": -11.36613655090332, "global_step": 304564, "epoch": 1812} {"train_loss": -11.518548965454102, "global_step": 304565, "epoch": 1812} {"train_loss": -11.641510009765625, "global_step": 304566, "epoch": 1812} {"train_loss": -11.697776794433594, "global_step": 304567, "epoch": 1812} {"train_loss": -11.409177780151367, "global_step": 304568, "epoch": 1812} {"train_loss": -11.759330749511719, "global_step": 304569, "epoch": 1812} {"train_loss": -11.429498672485352, "global_step": 304570, "epoch": 1812} {"train_loss": -11.868504524230957, "global_step": 304571, "epoch": 1812} {"train_loss": -11.729240417480469, "global_step": 304572, "epoch": 1812} {"train_loss": -11.854752540588379, "global_step": 304573, "epoch": 1812} {"train_loss": -11.843196868896484, "global_step": 304574, "epoch": 1812} {"train_loss": -11.472169876098633, "global_step": 304575, "epoch": 1812} {"train_loss": -12.058311462402344, "global_step": 304576, "epoch": 1812} {"train_loss": -11.663300514221191, "global_step": 304577, "epoch": 1812} {"train_loss": -12.098882675170898, "global_step": 304578, "epoch": 1812} {"train_loss": -11.895807266235352, "global_step": 304579, "epoch": 1812} {"train_loss": -11.995725631713867, "global_step": 304580, "epoch": 1812} {"train_loss": -12.117305755615234, "global_step": 304581, "epoch": 1812} {"train_loss": -12.112184524536133, "global_step": 304582, "epoch": 1812} {"train_loss": -11.78939275514512, "global_step": 304583, "epoch": 1812, "val_loss": 282990.34375} {"train_loss": -12.040485382080078, "global_step": 304584, "epoch": 1813} {"train_loss": -11.996984481811523, "global_step": 304585, "epoch": 1813} {"train_loss": -12.264732360839844, "global_step": 304586, "epoch": 1813} {"train_loss": -12.232315063476562, "global_step": 304587, "epoch": 1813} {"train_loss": -12.137889862060547, "global_step": 304588, "epoch": 1813} {"train_loss": -12.405649185180664, "global_step": 304589, "epoch": 1813} {"train_loss": -12.11611270904541, "global_step": 304590, "epoch": 1813} {"train_loss": -12.436476707458496, "global_step": 304591, "epoch": 1813} {"train_loss": -12.487970352172852, "global_step": 304592, "epoch": 1813} {"train_loss": -12.392509460449219, "global_step": 304593, "epoch": 1813} {"train_loss": -12.199275970458984, "global_step": 304594, "epoch": 1813} {"train_loss": -12.464607238769531, "global_step": 304595, "epoch": 1813} {"train_loss": -12.231460571289062, "global_step": 304596, "epoch": 1813} {"train_loss": -12.283882141113281, "global_step": 304597, "epoch": 1813} {"train_loss": -12.557811737060547, "global_step": 304598, "epoch": 1813} {"train_loss": -12.396981239318848, "global_step": 304599, "epoch": 1813} {"train_loss": -12.376968383789062, "global_step": 304600, "epoch": 1813} {"train_loss": -12.333902359008789, "global_step": 304601, "epoch": 1813} {"train_loss": -12.138824462890625, "global_step": 304602, "epoch": 1813} {"train_loss": -12.431018829345703, "global_step": 304603, "epoch": 1813} {"train_loss": -12.085437774658203, "global_step": 304604, "epoch": 1813} {"train_loss": -12.114582061767578, "global_step": 304605, "epoch": 1813} {"train_loss": -12.317134857177734, "global_step": 304606, "epoch": 1813} {"train_loss": -12.345125198364258, "global_step": 304607, "epoch": 1813} {"train_loss": -12.150819778442383, "global_step": 304608, "epoch": 1813} {"train_loss": -12.202982902526855, "global_step": 304609, "epoch": 1813} {"train_loss": -12.405926704406738, "global_step": 304610, "epoch": 1813} {"train_loss": -11.567142486572266, "global_step": 304611, "epoch": 1813} {"train_loss": -12.01761531829834, "global_step": 304612, "epoch": 1813} {"train_loss": -12.077643394470215, "global_step": 304613, "epoch": 1813} {"train_loss": -11.761053085327148, "global_step": 304614, "epoch": 1813} {"train_loss": -11.815103530883789, "global_step": 304615, "epoch": 1813} {"train_loss": -12.222024917602539, "global_step": 304616, "epoch": 1813} {"train_loss": -11.71871566772461, "global_step": 304617, "epoch": 1813} {"train_loss": -11.131646156311035, "global_step": 304618, "epoch": 1813} {"train_loss": -12.086324691772461, "global_step": 304619, "epoch": 1813} {"train_loss": -12.173540115356445, "global_step": 304620, "epoch": 1813} {"train_loss": -11.906007766723633, "global_step": 304621, "epoch": 1813} {"train_loss": -12.464174270629883, "global_step": 304622, "epoch": 1813} {"train_loss": -12.33751106262207, "global_step": 304623, "epoch": 1813} {"train_loss": -11.942380905151367, "global_step": 304624, "epoch": 1813} {"train_loss": -12.022139549255371, "global_step": 304625, "epoch": 1813} {"train_loss": -12.014309883117676, "global_step": 304626, "epoch": 1813} {"train_loss": -11.51473617553711, "global_step": 304627, "epoch": 1813} {"train_loss": -12.309785842895508, "global_step": 304628, "epoch": 1813} {"train_loss": -12.253049850463867, "global_step": 304629, "epoch": 1813} {"train_loss": -12.333869934082031, "global_step": 304630, "epoch": 1813} {"train_loss": -12.069840431213379, "global_step": 304631, "epoch": 1813} {"train_loss": -12.131686210632324, "global_step": 304632, "epoch": 1813} {"train_loss": -12.143739700317383, "global_step": 304633, "epoch": 1813} {"train_loss": -12.469730377197266, "global_step": 304634, "epoch": 1813} {"train_loss": -11.92945671081543, "global_step": 304635, "epoch": 1813} {"train_loss": -12.102571487426758, "global_step": 304636, "epoch": 1813} {"train_loss": -11.93602180480957, "global_step": 304637, "epoch": 1813} {"train_loss": -12.070367813110352, "global_step": 304638, "epoch": 1813} {"train_loss": -11.980384826660156, "global_step": 304639, "epoch": 1813} {"train_loss": -12.15928840637207, "global_step": 304640, "epoch": 1813} {"train_loss": -12.28176212310791, "global_step": 304641, "epoch": 1813} {"train_loss": -12.312549591064453, "global_step": 304642, "epoch": 1813} {"train_loss": -12.152382850646973, "global_step": 304643, "epoch": 1813} {"train_loss": -12.142997741699219, "global_step": 304644, "epoch": 1813} {"train_loss": -12.358489036560059, "global_step": 304645, "epoch": 1813} {"train_loss": -12.319070816040039, "global_step": 304646, "epoch": 1813} {"train_loss": -12.293691635131836, "global_step": 304647, "epoch": 1813} {"train_loss": -11.845455169677734, "global_step": 304648, "epoch": 1813} {"train_loss": -12.070813179016113, "global_step": 304649, "epoch": 1813} {"train_loss": -10.663028717041016, "global_step": 304650, "epoch": 1813} {"train_loss": -10.369720458984375, "global_step": 304651, "epoch": 1813} {"train_loss": -12.305797576904297, "global_step": 304652, "epoch": 1813} {"train_loss": -11.396637916564941, "global_step": 304653, "epoch": 1813} {"train_loss": -11.629692077636719, "global_step": 304654, "epoch": 1813} {"train_loss": -12.003166198730469, "global_step": 304655, "epoch": 1813} {"train_loss": -11.302936553955078, "global_step": 304656, "epoch": 1813} {"train_loss": -11.607044219970703, "global_step": 304657, "epoch": 1813} {"train_loss": -11.714155197143555, "global_step": 304658, "epoch": 1813} {"train_loss": -11.69729995727539, "global_step": 304659, "epoch": 1813} {"train_loss": -12.15834903717041, "global_step": 304660, "epoch": 1813} {"train_loss": -11.275171279907227, "global_step": 304661, "epoch": 1813} {"train_loss": -10.763959884643555, "global_step": 304662, "epoch": 1813} {"train_loss": -11.925504684448242, "global_step": 304663, "epoch": 1813} {"train_loss": -10.661775588989258, "global_step": 304664, "epoch": 1813} {"train_loss": -11.913206100463867, "global_step": 304665, "epoch": 1813} {"train_loss": -11.404033660888672, "global_step": 304666, "epoch": 1813} {"train_loss": -11.321743965148926, "global_step": 304667, "epoch": 1813} {"train_loss": -12.331337928771973, "global_step": 304668, "epoch": 1813} {"train_loss": -11.610749244689941, "global_step": 304669, "epoch": 1813} {"train_loss": -11.617753982543945, "global_step": 304670, "epoch": 1813} {"train_loss": -12.153873443603516, "global_step": 304671, "epoch": 1813} {"train_loss": -11.599671363830566, "global_step": 304672, "epoch": 1813} {"train_loss": -11.682395935058594, "global_step": 304673, "epoch": 1813} {"train_loss": -12.456384658813477, "global_step": 304674, "epoch": 1813} {"train_loss": -12.196955680847168, "global_step": 304675, "epoch": 1813} {"train_loss": -11.936612129211426, "global_step": 304676, "epoch": 1813} {"train_loss": -12.1743745803833, "global_step": 304677, "epoch": 1813} {"train_loss": -11.819180488586426, "global_step": 304678, "epoch": 1813} {"train_loss": -12.211846351623535, "global_step": 304679, "epoch": 1813} {"train_loss": -12.028177261352539, "global_step": 304680, "epoch": 1813} {"train_loss": -12.0344820022583, "global_step": 304681, "epoch": 1813} {"train_loss": -12.32593059539795, "global_step": 304682, "epoch": 1813} {"train_loss": -12.156414985656738, "global_step": 304683, "epoch": 1813} {"train_loss": -12.012591361999512, "global_step": 304684, "epoch": 1813} {"train_loss": -12.312127113342285, "global_step": 304685, "epoch": 1813} {"train_loss": -12.249814987182617, "global_step": 304686, "epoch": 1813} {"train_loss": -11.8436861038208, "global_step": 304687, "epoch": 1813} {"train_loss": -12.341514587402344, "global_step": 304688, "epoch": 1813} {"train_loss": -11.682455062866211, "global_step": 304689, "epoch": 1813} {"train_loss": -11.300329208374023, "global_step": 304690, "epoch": 1813} {"train_loss": -12.220770835876465, "global_step": 304691, "epoch": 1813} {"train_loss": -11.245925903320312, "global_step": 304692, "epoch": 1813} {"train_loss": -11.744526863098145, "global_step": 304693, "epoch": 1813} {"train_loss": -12.167902946472168, "global_step": 304694, "epoch": 1813} {"train_loss": -11.97973346710205, "global_step": 304695, "epoch": 1813} {"train_loss": -11.708885192871094, "global_step": 304696, "epoch": 1813} {"train_loss": -12.129170417785645, "global_step": 304697, "epoch": 1813} {"train_loss": -12.01120376586914, "global_step": 304698, "epoch": 1813} {"train_loss": -11.793588638305664, "global_step": 304699, "epoch": 1813} {"train_loss": -12.237554550170898, "global_step": 304700, "epoch": 1813} {"train_loss": -12.026655197143555, "global_step": 304701, "epoch": 1813} {"train_loss": -11.854690551757812, "global_step": 304702, "epoch": 1813} {"train_loss": -12.095329284667969, "global_step": 304703, "epoch": 1813} {"train_loss": -11.85473918914795, "global_step": 304704, "epoch": 1813} {"train_loss": -12.273569107055664, "global_step": 304705, "epoch": 1813} {"train_loss": -12.165477752685547, "global_step": 304706, "epoch": 1813} {"train_loss": -12.194822311401367, "global_step": 304707, "epoch": 1813} {"train_loss": -12.163894653320312, "global_step": 304708, "epoch": 1813} {"train_loss": -12.221818923950195, "global_step": 304709, "epoch": 1813} {"train_loss": -11.850008010864258, "global_step": 304710, "epoch": 1813} {"train_loss": -12.289066314697266, "global_step": 304711, "epoch": 1813} {"train_loss": -12.166459083557129, "global_step": 304712, "epoch": 1813} {"train_loss": -12.166038513183594, "global_step": 304713, "epoch": 1813} {"train_loss": -12.452168464660645, "global_step": 304714, "epoch": 1813} {"train_loss": -12.093480110168457, "global_step": 304715, "epoch": 1813} {"train_loss": -12.366912841796875, "global_step": 304716, "epoch": 1813} {"train_loss": -12.293621063232422, "global_step": 304717, "epoch": 1813} {"train_loss": -12.211913108825684, "global_step": 304718, "epoch": 1813} {"train_loss": -12.142123222351074, "global_step": 304719, "epoch": 1813} {"train_loss": -11.686588287353516, "global_step": 304720, "epoch": 1813} {"train_loss": -12.075825691223145, "global_step": 304721, "epoch": 1813} {"train_loss": -11.878769874572754, "global_step": 304722, "epoch": 1813} {"train_loss": -10.896512031555176, "global_step": 304723, "epoch": 1813} {"train_loss": -12.497518539428711, "global_step": 304724, "epoch": 1813} {"train_loss": -10.678668022155762, "global_step": 304725, "epoch": 1813} {"train_loss": -12.031288146972656, "global_step": 304726, "epoch": 1813} {"train_loss": -11.441610336303711, "global_step": 304727, "epoch": 1813} {"train_loss": -11.520438194274902, "global_step": 304728, "epoch": 1813} {"train_loss": -11.61172103881836, "global_step": 304729, "epoch": 1813} {"train_loss": -11.5817289352417, "global_step": 304730, "epoch": 1813} {"train_loss": -11.658015251159668, "global_step": 304731, "epoch": 1813} {"train_loss": -11.327844619750977, "global_step": 304732, "epoch": 1813} {"train_loss": -11.70810604095459, "global_step": 304733, "epoch": 1813} {"train_loss": -11.262582778930664, "global_step": 304734, "epoch": 1813} {"train_loss": -11.22422981262207, "global_step": 304735, "epoch": 1813} {"train_loss": -11.174224853515625, "global_step": 304736, "epoch": 1813} {"train_loss": -11.683149337768555, "global_step": 304737, "epoch": 1813} {"train_loss": -10.894205093383789, "global_step": 304738, "epoch": 1813} {"train_loss": -11.29779052734375, "global_step": 304739, "epoch": 1813} {"train_loss": -11.777811050415039, "global_step": 304740, "epoch": 1813} {"train_loss": -10.706991195678711, "global_step": 304741, "epoch": 1813} {"train_loss": -11.47948169708252, "global_step": 304742, "epoch": 1813} {"train_loss": -11.3067626953125, "global_step": 304743, "epoch": 1813} {"train_loss": -10.877378463745117, "global_step": 304744, "epoch": 1813} {"train_loss": -11.819860458374023, "global_step": 304745, "epoch": 1813} {"train_loss": -11.32347297668457, "global_step": 304746, "epoch": 1813} {"train_loss": -11.790163040161133, "global_step": 304747, "epoch": 1813} {"train_loss": -11.310969352722168, "global_step": 304748, "epoch": 1813} {"train_loss": -10.890146255493164, "global_step": 304749, "epoch": 1813} {"train_loss": -11.729864120483398, "global_step": 304750, "epoch": 1813} {"train_loss": -11.912554973647708, "global_step": 304751, "epoch": 1813, "val_loss": 284620.0625} {"train_loss": -11.803862571716309, "global_step": 304752, "epoch": 1814} {"train_loss": -12.078643798828125, "global_step": 304753, "epoch": 1814} {"train_loss": -11.4278564453125, "global_step": 304754, "epoch": 1814} {"train_loss": -11.357588768005371, "global_step": 304755, "epoch": 1814} {"train_loss": -11.730645179748535, "global_step": 304756, "epoch": 1814} {"train_loss": -11.493072509765625, "global_step": 304757, "epoch": 1814} {"train_loss": -11.611970901489258, "global_step": 304758, "epoch": 1814} {"train_loss": -11.799942016601562, "global_step": 304759, "epoch": 1814} {"train_loss": -11.844345092773438, "global_step": 304760, "epoch": 1814} {"train_loss": -11.554084777832031, "global_step": 304761, "epoch": 1814} {"train_loss": -11.940637588500977, "global_step": 304762, "epoch": 1814} {"train_loss": -11.696538925170898, "global_step": 304763, "epoch": 1814} {"train_loss": -11.857231140136719, "global_step": 304764, "epoch": 1814} {"train_loss": -11.832112312316895, "global_step": 304765, "epoch": 1814} {"train_loss": -11.739200592041016, "global_step": 304766, "epoch": 1814} {"train_loss": -11.856977462768555, "global_step": 304767, "epoch": 1814} {"train_loss": -11.646754264831543, "global_step": 304768, "epoch": 1814} {"train_loss": -12.239012718200684, "global_step": 304769, "epoch": 1814} {"train_loss": -11.658464431762695, "global_step": 304770, "epoch": 1814} {"train_loss": -12.227066993713379, "global_step": 304771, "epoch": 1814} {"train_loss": -11.927288055419922, "global_step": 304772, "epoch": 1814} {"train_loss": -11.996149063110352, "global_step": 304773, "epoch": 1814} {"train_loss": -12.076683044433594, "global_step": 304774, "epoch": 1814} {"train_loss": -12.02020263671875, "global_step": 304775, "epoch": 1814} {"train_loss": -11.898929595947266, "global_step": 304776, "epoch": 1814} {"train_loss": -11.814332962036133, "global_step": 304777, "epoch": 1814} {"train_loss": -12.085768699645996, "global_step": 304778, "epoch": 1814} {"train_loss": -12.014842987060547, "global_step": 304779, "epoch": 1814} {"train_loss": -12.146589279174805, "global_step": 304780, "epoch": 1814} {"train_loss": -11.838448524475098, "global_step": 304781, "epoch": 1814} {"train_loss": -11.903947830200195, "global_step": 304782, "epoch": 1814} {"train_loss": -12.229340553283691, "global_step": 304783, "epoch": 1814} {"train_loss": -12.188226699829102, "global_step": 304784, "epoch": 1814} {"train_loss": -12.150310516357422, "global_step": 304785, "epoch": 1814} {"train_loss": -11.893051147460938, "global_step": 304786, "epoch": 1814} {"train_loss": -12.033966064453125, "global_step": 304787, "epoch": 1814} {"train_loss": -12.001500129699707, "global_step": 304788, "epoch": 1814} {"train_loss": -12.214864730834961, "global_step": 304789, "epoch": 1814} {"train_loss": -12.171415328979492, "global_step": 304790, "epoch": 1814} {"train_loss": -12.119719505310059, "global_step": 304791, "epoch": 1814} {"train_loss": -11.972234725952148, "global_step": 304792, "epoch": 1814} {"train_loss": -11.709532737731934, "global_step": 304793, "epoch": 1814} {"train_loss": -12.07728385925293, "global_step": 304794, "epoch": 1814} {"train_loss": -11.76006031036377, "global_step": 304795, "epoch": 1814} {"train_loss": -11.985974311828613, "global_step": 304796, "epoch": 1814} {"train_loss": -11.940256118774414, "global_step": 304797, "epoch": 1814} {"train_loss": -12.331033706665039, "global_step": 304798, "epoch": 1814} {"train_loss": -11.779417037963867, "global_step": 304799, "epoch": 1814} {"train_loss": -12.250027656555176, "global_step": 304800, "epoch": 1814} {"train_loss": -11.781814575195312, "global_step": 304801, "epoch": 1814} {"train_loss": -12.149967193603516, "global_step": 304802, "epoch": 1814} {"train_loss": -11.784505844116211, "global_step": 304803, "epoch": 1814} {"train_loss": -12.180370330810547, "global_step": 304804, "epoch": 1814} {"train_loss": -12.346948623657227, "global_step": 304805, "epoch": 1814} {"train_loss": -12.017921447753906, "global_step": 304806, "epoch": 1814} {"train_loss": -12.397367477416992, "global_step": 304807, "epoch": 1814} {"train_loss": -12.143951416015625, "global_step": 304808, "epoch": 1814} {"train_loss": -12.193063735961914, "global_step": 304809, "epoch": 1814} {"train_loss": -11.895332336425781, "global_step": 304810, "epoch": 1814} {"train_loss": -11.658393859863281, "global_step": 304811, "epoch": 1814} {"train_loss": -11.672508239746094, "global_step": 304812, "epoch": 1814} {"train_loss": -12.040390968322754, "global_step": 304813, "epoch": 1814} {"train_loss": -11.593610763549805, "global_step": 304814, "epoch": 1814} {"train_loss": -11.807907104492188, "global_step": 304815, "epoch": 1814} {"train_loss": -12.333093643188477, "global_step": 304816, "epoch": 1814} {"train_loss": -11.677492141723633, "global_step": 304817, "epoch": 1814} {"train_loss": -11.68907642364502, "global_step": 304818, "epoch": 1814} {"train_loss": -11.962112426757812, "global_step": 304819, "epoch": 1814} {"train_loss": -12.071905136108398, "global_step": 304820, "epoch": 1814} {"train_loss": -12.06064224243164, "global_step": 304821, "epoch": 1814} {"train_loss": -12.506185531616211, "global_step": 304822, "epoch": 1814} {"train_loss": -11.900184631347656, "global_step": 304823, "epoch": 1814} {"train_loss": -12.319599151611328, "global_step": 304824, "epoch": 1814} {"train_loss": -11.83876895904541, "global_step": 304825, "epoch": 1814} {"train_loss": -12.034872055053711, "global_step": 304826, "epoch": 1814} {"train_loss": -12.283632278442383, "global_step": 304827, "epoch": 1814} {"train_loss": -12.219783782958984, "global_step": 304828, "epoch": 1814} {"train_loss": -12.059134483337402, "global_step": 304829, "epoch": 1814} {"train_loss": -12.142866134643555, "global_step": 304830, "epoch": 1814} {"train_loss": -11.439254760742188, "global_step": 304831, "epoch": 1814} {"train_loss": -12.12260627746582, "global_step": 304832, "epoch": 1814} {"train_loss": -10.865368843078613, "global_step": 304833, "epoch": 1814} {"train_loss": -11.2932767868042, "global_step": 304834, "epoch": 1814} {"train_loss": -11.617328643798828, "global_step": 304835, "epoch": 1814} {"train_loss": -10.996532440185547, "global_step": 304836, "epoch": 1814} {"train_loss": -11.964242935180664, "global_step": 304837, "epoch": 1814} {"train_loss": -10.987432479858398, "global_step": 304838, "epoch": 1814} {"train_loss": -11.561201095581055, "global_step": 304839, "epoch": 1814} {"train_loss": -11.299339294433594, "global_step": 304840, "epoch": 1814} {"train_loss": -11.620494842529297, "global_step": 304841, "epoch": 1814} {"train_loss": -11.915962219238281, "global_step": 304842, "epoch": 1814} {"train_loss": -11.55058765411377, "global_step": 304843, "epoch": 1814} {"train_loss": -11.841184616088867, "global_step": 304844, "epoch": 1814} {"train_loss": -11.671579360961914, "global_step": 304845, "epoch": 1814} {"train_loss": -11.242402076721191, "global_step": 304846, "epoch": 1814} {"train_loss": -12.238064765930176, "global_step": 304847, "epoch": 1814} {"train_loss": -11.668481826782227, "global_step": 304848, "epoch": 1814} {"train_loss": -11.694308280944824, "global_step": 304849, "epoch": 1814} {"train_loss": -11.098333358764648, "global_step": 304850, "epoch": 1814} {"train_loss": -10.804927825927734, "global_step": 304851, "epoch": 1814} {"train_loss": -11.640544891357422, "global_step": 304852, "epoch": 1814} {"train_loss": -10.136445999145508, "global_step": 304853, "epoch": 1814} {"train_loss": -11.284605026245117, "global_step": 304854, "epoch": 1814} {"train_loss": -10.85659408569336, "global_step": 304855, "epoch": 1814} {"train_loss": -10.296202659606934, "global_step": 304856, "epoch": 1814} {"train_loss": -10.278223037719727, "global_step": 304857, "epoch": 1814} {"train_loss": -10.061676025390625, "global_step": 304858, "epoch": 1814} {"train_loss": -11.071751594543457, "global_step": 304859, "epoch": 1814} {"train_loss": -11.044811248779297, "global_step": 304860, "epoch": 1814} {"train_loss": -11.324034690856934, "global_step": 304861, "epoch": 1814} {"train_loss": -10.944286346435547, "global_step": 304862, "epoch": 1814} {"train_loss": -11.699348449707031, "global_step": 304863, "epoch": 1814} {"train_loss": -11.59334945678711, "global_step": 304864, "epoch": 1814} {"train_loss": -11.9300537109375, "global_step": 304865, "epoch": 1814} {"train_loss": -11.279952049255371, "global_step": 304866, "epoch": 1814} {"train_loss": -12.042253494262695, "global_step": 304867, "epoch": 1814} {"train_loss": -11.701189041137695, "global_step": 304868, "epoch": 1814} {"train_loss": -12.092052459716797, "global_step": 304869, "epoch": 1814} {"train_loss": -11.675930976867676, "global_step": 304870, "epoch": 1814} {"train_loss": -11.823976516723633, "global_step": 304871, "epoch": 1814} {"train_loss": -11.783212661743164, "global_step": 304872, "epoch": 1814} {"train_loss": -12.008663177490234, "global_step": 304873, "epoch": 1814} {"train_loss": -11.736824035644531, "global_step": 304874, "epoch": 1814} {"train_loss": -12.118171691894531, "global_step": 304875, "epoch": 1814} {"train_loss": -12.070588111877441, "global_step": 304876, "epoch": 1814} {"train_loss": -11.880735397338867, "global_step": 304877, "epoch": 1814} {"train_loss": -11.956972122192383, "global_step": 304878, "epoch": 1814} {"train_loss": -11.641681671142578, "global_step": 304879, "epoch": 1814} {"train_loss": -12.110957145690918, "global_step": 304880, "epoch": 1814} {"train_loss": -11.831774711608887, "global_step": 304881, "epoch": 1814} {"train_loss": -11.888516426086426, "global_step": 304882, "epoch": 1814} {"train_loss": -11.780733108520508, "global_step": 304883, "epoch": 1814} {"train_loss": -11.154250144958496, "global_step": 304884, "epoch": 1814} {"train_loss": -11.790618896484375, "global_step": 304885, "epoch": 1814} {"train_loss": -11.680659294128418, "global_step": 304886, "epoch": 1814} {"train_loss": -11.476607322692871, "global_step": 304887, "epoch": 1814} {"train_loss": -10.93625259399414, "global_step": 304888, "epoch": 1814} {"train_loss": -11.04703426361084, "global_step": 304889, "epoch": 1814} {"train_loss": -11.856313705444336, "global_step": 304890, "epoch": 1814} {"train_loss": -11.569334030151367, "global_step": 304891, "epoch": 1814} {"train_loss": -11.946378707885742, "global_step": 304892, "epoch": 1814} {"train_loss": -11.396268844604492, "global_step": 304893, "epoch": 1814} {"train_loss": -11.691693305969238, "global_step": 304894, "epoch": 1814} {"train_loss": -10.966041564941406, "global_step": 304895, "epoch": 1814} {"train_loss": -11.866374969482422, "global_step": 304896, "epoch": 1814} {"train_loss": -11.086389541625977, "global_step": 304897, "epoch": 1814} {"train_loss": -10.666265487670898, "global_step": 304898, "epoch": 1814} {"train_loss": -11.402738571166992, "global_step": 304899, "epoch": 1814} {"train_loss": -10.78622817993164, "global_step": 304900, "epoch": 1814} {"train_loss": -11.35439395904541, "global_step": 304901, "epoch": 1814} {"train_loss": -11.353336334228516, "global_step": 304902, "epoch": 1814} {"train_loss": -11.830890655517578, "global_step": 304903, "epoch": 1814} {"train_loss": -11.115263938903809, "global_step": 304904, "epoch": 1814} {"train_loss": -11.39438247680664, "global_step": 304905, "epoch": 1814} {"train_loss": -11.295473098754883, "global_step": 304906, "epoch": 1814} {"train_loss": -11.300689697265625, "global_step": 304907, "epoch": 1814} {"train_loss": -11.479421615600586, "global_step": 304908, "epoch": 1814} {"train_loss": -11.894205093383789, "global_step": 304909, "epoch": 1814} {"train_loss": -11.363048553466797, "global_step": 304910, "epoch": 1814} {"train_loss": -11.766862869262695, "global_step": 304911, "epoch": 1814} {"train_loss": -11.932519912719727, "global_step": 304912, "epoch": 1814} {"train_loss": -11.879083633422852, "global_step": 304913, "epoch": 1814} {"train_loss": -11.572805404663086, "global_step": 304914, "epoch": 1814} {"train_loss": -12.077983856201172, "global_step": 304915, "epoch": 1814} {"train_loss": -11.596128463745117, "global_step": 304916, "epoch": 1814} {"train_loss": -11.586809158325195, "global_step": 304917, "epoch": 1814} {"train_loss": -11.456977844238281, "global_step": 304918, "epoch": 1814} {"train_loss": -11.70361145905086, "global_step": 304919, "epoch": 1814, "val_loss": 281148.84375} {"train_loss": -12.05279541015625, "global_step": 304920, "epoch": 1815} {"train_loss": -11.519452095031738, "global_step": 304921, "epoch": 1815} {"train_loss": -12.048255920410156, "global_step": 304922, "epoch": 1815} {"train_loss": -11.534651756286621, "global_step": 304923, "epoch": 1815} {"train_loss": -12.076359748840332, "global_step": 304924, "epoch": 1815} {"train_loss": -11.399114608764648, "global_step": 304925, "epoch": 1815} {"train_loss": -12.078527450561523, "global_step": 304926, "epoch": 1815} {"train_loss": -11.628211975097656, "global_step": 304927, "epoch": 1815} {"train_loss": -11.951149940490723, "global_step": 304928, "epoch": 1815} {"train_loss": -11.80681037902832, "global_step": 304929, "epoch": 1815} {"train_loss": -12.104073524475098, "global_step": 304930, "epoch": 1815} {"train_loss": -11.763526916503906, "global_step": 304931, "epoch": 1815} {"train_loss": -11.802046775817871, "global_step": 304932, "epoch": 1815} {"train_loss": -12.213981628417969, "global_step": 304933, "epoch": 1815} {"train_loss": -11.877334594726562, "global_step": 304934, "epoch": 1815} {"train_loss": -11.972209930419922, "global_step": 304935, "epoch": 1815} {"train_loss": -11.888460159301758, "global_step": 304936, "epoch": 1815} {"train_loss": -11.669828414916992, "global_step": 304937, "epoch": 1815} {"train_loss": -11.667088508605957, "global_step": 304938, "epoch": 1815} {"train_loss": -11.930047988891602, "global_step": 304939, "epoch": 1815} {"train_loss": -11.987052917480469, "global_step": 304940, "epoch": 1815} {"train_loss": -12.113655090332031, "global_step": 304941, "epoch": 1815} {"train_loss": -11.799810409545898, "global_step": 304942, "epoch": 1815} {"train_loss": -12.089895248413086, "global_step": 304943, "epoch": 1815} {"train_loss": -11.972744941711426, "global_step": 304944, "epoch": 1815} {"train_loss": -11.84953498840332, "global_step": 304945, "epoch": 1815} {"train_loss": -12.244466781616211, "global_step": 304946, "epoch": 1815} {"train_loss": -11.432576179504395, "global_step": 304947, "epoch": 1815} {"train_loss": -12.150245666503906, "global_step": 304948, "epoch": 1815} {"train_loss": -11.775060653686523, "global_step": 304949, "epoch": 1815} {"train_loss": -11.70269775390625, "global_step": 304950, "epoch": 1815} {"train_loss": -12.211929321289062, "global_step": 304951, "epoch": 1815} {"train_loss": -11.59457778930664, "global_step": 304952, "epoch": 1815} {"train_loss": -12.166889190673828, "global_step": 304953, "epoch": 1815} {"train_loss": -11.9310302734375, "global_step": 304954, "epoch": 1815} {"train_loss": -11.798477172851562, "global_step": 304955, "epoch": 1815} {"train_loss": -11.661113739013672, "global_step": 304956, "epoch": 1815} {"train_loss": -12.062145233154297, "global_step": 304957, "epoch": 1815} {"train_loss": -11.800710678100586, "global_step": 304958, "epoch": 1815} {"train_loss": -12.109081268310547, "global_step": 304959, "epoch": 1815} {"train_loss": -12.064075469970703, "global_step": 304960, "epoch": 1815} {"train_loss": -11.538329124450684, "global_step": 304961, "epoch": 1815} {"train_loss": -12.136964797973633, "global_step": 304962, "epoch": 1815} {"train_loss": -11.757659912109375, "global_step": 304963, "epoch": 1815} {"train_loss": -12.264408111572266, "global_step": 304964, "epoch": 1815} {"train_loss": -11.859766006469727, "global_step": 304965, "epoch": 1815} {"train_loss": -11.601224899291992, "global_step": 304966, "epoch": 1815} {"train_loss": -12.1585693359375, "global_step": 304967, "epoch": 1815} {"train_loss": -11.881258010864258, "global_step": 304968, "epoch": 1815} {"train_loss": -12.271900177001953, "global_step": 304969, "epoch": 1815} {"train_loss": -11.880879402160645, "global_step": 304970, "epoch": 1815} {"train_loss": -12.058329582214355, "global_step": 304971, "epoch": 1815} {"train_loss": -11.884029388427734, "global_step": 304972, "epoch": 1815} {"train_loss": -11.701231956481934, "global_step": 304973, "epoch": 1815} {"train_loss": -11.884243965148926, "global_step": 304974, "epoch": 1815} {"train_loss": -11.826583862304688, "global_step": 304975, "epoch": 1815} {"train_loss": -12.186528205871582, "global_step": 304976, "epoch": 1815} {"train_loss": -11.86037826538086, "global_step": 304977, "epoch": 1815} {"train_loss": -12.043380737304688, "global_step": 304978, "epoch": 1815} {"train_loss": -11.966526985168457, "global_step": 304979, "epoch": 1815} {"train_loss": -12.263080596923828, "global_step": 304980, "epoch": 1815} {"train_loss": -12.304471015930176, "global_step": 304981, "epoch": 1815} {"train_loss": -12.005470275878906, "global_step": 304982, "epoch": 1815} {"train_loss": -12.334845542907715, "global_step": 304983, "epoch": 1815} {"train_loss": -12.483105659484863, "global_step": 304984, "epoch": 1815} {"train_loss": -12.110301971435547, "global_step": 304985, "epoch": 1815} {"train_loss": -12.326141357421875, "global_step": 304986, "epoch": 1815} {"train_loss": -12.13387393951416, "global_step": 304987, "epoch": 1815} {"train_loss": -12.24233341217041, "global_step": 304988, "epoch": 1815} {"train_loss": -12.340335845947266, "global_step": 304989, "epoch": 1815} {"train_loss": -12.209712982177734, "global_step": 304990, "epoch": 1815} {"train_loss": -12.422884941101074, "global_step": 304991, "epoch": 1815} {"train_loss": -12.211424827575684, "global_step": 304992, "epoch": 1815} {"train_loss": -12.469112396240234, "global_step": 304993, "epoch": 1815} {"train_loss": -12.309850692749023, "global_step": 304994, "epoch": 1815} {"train_loss": -12.272605895996094, "global_step": 304995, "epoch": 1815} {"train_loss": -12.410501480102539, "global_step": 304996, "epoch": 1815} {"train_loss": -12.534101486206055, "global_step": 304997, "epoch": 1815} {"train_loss": -12.406371116638184, "global_step": 304998, "epoch": 1815} {"train_loss": -12.3295316696167, "global_step": 304999, "epoch": 1815} {"train_loss": -12.479145050048828, "global_step": 305000, "epoch": 1815} {"train_loss": -12.493871688842773, "global_step": 305001, "epoch": 1815} {"train_loss": -12.565052032470703, "global_step": 305002, "epoch": 1815} {"train_loss": -12.395505905151367, "global_step": 305003, "epoch": 1815} {"train_loss": -12.641402244567871, "global_step": 305004, "epoch": 1815} {"train_loss": -12.408557891845703, "global_step": 305005, "epoch": 1815} {"train_loss": -12.575216293334961, "global_step": 305006, "epoch": 1815} {"train_loss": -12.412460327148438, "global_step": 305007, "epoch": 1815} {"train_loss": -12.45880126953125, "global_step": 305008, "epoch": 1815} {"train_loss": -12.551406860351562, "global_step": 305009, "epoch": 1815} {"train_loss": -12.28136157989502, "global_step": 305010, "epoch": 1815} {"train_loss": -12.331846237182617, "global_step": 305011, "epoch": 1815} {"train_loss": -12.404027938842773, "global_step": 305012, "epoch": 1815} {"train_loss": -12.645296096801758, "global_step": 305013, "epoch": 1815} {"train_loss": -12.066689491271973, "global_step": 305014, "epoch": 1815} {"train_loss": -11.662673950195312, "global_step": 305015, "epoch": 1815} {"train_loss": -12.030803680419922, "global_step": 305016, "epoch": 1815} {"train_loss": -12.478047370910645, "global_step": 305017, "epoch": 1815} {"train_loss": -11.659478187561035, "global_step": 305018, "epoch": 1815} {"train_loss": -11.898884773254395, "global_step": 305019, "epoch": 1815} {"train_loss": -12.139562606811523, "global_step": 305020, "epoch": 1815} {"train_loss": -12.225110054016113, "global_step": 305021, "epoch": 1815} {"train_loss": -12.291315078735352, "global_step": 305022, "epoch": 1815} {"train_loss": -12.371221542358398, "global_step": 305023, "epoch": 1815} {"train_loss": -12.0865478515625, "global_step": 305024, "epoch": 1815} {"train_loss": -12.195858001708984, "global_step": 305025, "epoch": 1815} {"train_loss": -12.15898323059082, "global_step": 305026, "epoch": 1815} {"train_loss": -11.370452880859375, "global_step": 305027, "epoch": 1815} {"train_loss": -11.859354972839355, "global_step": 305028, "epoch": 1815} {"train_loss": -12.09493637084961, "global_step": 305029, "epoch": 1815} {"train_loss": -12.0552396774292, "global_step": 305030, "epoch": 1815} {"train_loss": -12.032474517822266, "global_step": 305031, "epoch": 1815} {"train_loss": -11.617876052856445, "global_step": 305032, "epoch": 1815} {"train_loss": -11.77743911743164, "global_step": 305033, "epoch": 1815} {"train_loss": -11.813053131103516, "global_step": 305034, "epoch": 1815} {"train_loss": -12.17078971862793, "global_step": 305035, "epoch": 1815} {"train_loss": -11.771173477172852, "global_step": 305036, "epoch": 1815} {"train_loss": -11.9617919921875, "global_step": 305037, "epoch": 1815} {"train_loss": -12.292346000671387, "global_step": 305038, "epoch": 1815} {"train_loss": -12.239770889282227, "global_step": 305039, "epoch": 1815} {"train_loss": -12.03470230102539, "global_step": 305040, "epoch": 1815} {"train_loss": -12.146001815795898, "global_step": 305041, "epoch": 1815} {"train_loss": -12.151206970214844, "global_step": 305042, "epoch": 1815} {"train_loss": -11.837666511535645, "global_step": 305043, "epoch": 1815} {"train_loss": -12.389019012451172, "global_step": 305044, "epoch": 1815} {"train_loss": -12.382950782775879, "global_step": 305045, "epoch": 1815} {"train_loss": -12.202127456665039, "global_step": 305046, "epoch": 1815} {"train_loss": -12.337696075439453, "global_step": 305047, "epoch": 1815} {"train_loss": -12.204895973205566, "global_step": 305048, "epoch": 1815} {"train_loss": -12.056900978088379, "global_step": 305049, "epoch": 1815} {"train_loss": -11.638474464416504, "global_step": 305050, "epoch": 1815} {"train_loss": -11.930316925048828, "global_step": 305051, "epoch": 1815} {"train_loss": -12.36011028289795, "global_step": 305052, "epoch": 1815} {"train_loss": -11.75019359588623, "global_step": 305053, "epoch": 1815} {"train_loss": -11.427734375, "global_step": 305054, "epoch": 1815} {"train_loss": -11.641290664672852, "global_step": 305055, "epoch": 1815} {"train_loss": -12.078006744384766, "global_step": 305056, "epoch": 1815} {"train_loss": -11.64769458770752, "global_step": 305057, "epoch": 1815} {"train_loss": -11.145572662353516, "global_step": 305058, "epoch": 1815} {"train_loss": -12.22288703918457, "global_step": 305059, "epoch": 1815} {"train_loss": -11.738336563110352, "global_step": 305060, "epoch": 1815} {"train_loss": -10.797491073608398, "global_step": 305061, "epoch": 1815} {"train_loss": -12.043588638305664, "global_step": 305062, "epoch": 1815} {"train_loss": -11.996358871459961, "global_step": 305063, "epoch": 1815} {"train_loss": -11.498832702636719, "global_step": 305064, "epoch": 1815} {"train_loss": -11.30286693572998, "global_step": 305065, "epoch": 1815} {"train_loss": -12.194311141967773, "global_step": 305066, "epoch": 1815} {"train_loss": -11.358720779418945, "global_step": 305067, "epoch": 1815} {"train_loss": -11.313934326171875, "global_step": 305068, "epoch": 1815} {"train_loss": -11.602514266967773, "global_step": 305069, "epoch": 1815} {"train_loss": -12.145734786987305, "global_step": 305070, "epoch": 1815} {"train_loss": -11.400745391845703, "global_step": 305071, "epoch": 1815} {"train_loss": -11.893159866333008, "global_step": 305072, "epoch": 1815} {"train_loss": -11.41986083984375, "global_step": 305073, "epoch": 1815} {"train_loss": -12.014595985412598, "global_step": 305074, "epoch": 1815} {"train_loss": -11.874792098999023, "global_step": 305075, "epoch": 1815} {"train_loss": -11.564716339111328, "global_step": 305076, "epoch": 1815} {"train_loss": -10.975550651550293, "global_step": 305077, "epoch": 1815} {"train_loss": -11.502429008483887, "global_step": 305078, "epoch": 1815} {"train_loss": -11.052048683166504, "global_step": 305079, "epoch": 1815} {"train_loss": -11.15760612487793, "global_step": 305080, "epoch": 1815} {"train_loss": -10.945940017700195, "global_step": 305081, "epoch": 1815} {"train_loss": -11.513145446777344, "global_step": 305082, "epoch": 1815} {"train_loss": -10.833333969116211, "global_step": 305083, "epoch": 1815} {"train_loss": -11.009452819824219, "global_step": 305084, "epoch": 1815} {"train_loss": -11.153118133544922, "global_step": 305085, "epoch": 1815} {"train_loss": -11.222548484802246, "global_step": 305086, "epoch": 1815} {"train_loss": -11.948087363016038, "global_step": 305087, "epoch": 1815, "val_loss": 281959.0, "train_action_mse_error": 1.6824268102645874} {"train_loss": -11.771514892578125, "global_step": 305088, "epoch": 1816} {"train_loss": -10.60183334350586, "global_step": 305089, "epoch": 1816} {"train_loss": -11.141928672790527, "global_step": 305090, "epoch": 1816} {"train_loss": -10.260492324829102, "global_step": 305091, "epoch": 1816} {"train_loss": -8.743487358093262, "global_step": 305092, "epoch": 1816} {"train_loss": -10.925188064575195, "global_step": 305093, "epoch": 1816} {"train_loss": -9.469186782836914, "global_step": 305094, "epoch": 1816} {"train_loss": -11.137434005737305, "global_step": 305095, "epoch": 1816} {"train_loss": -9.501045227050781, "global_step": 305096, "epoch": 1816} {"train_loss": -11.674500465393066, "global_step": 305097, "epoch": 1816} {"train_loss": -9.951881408691406, "global_step": 305098, "epoch": 1816} {"train_loss": -11.506176948547363, "global_step": 305099, "epoch": 1816} {"train_loss": -9.803037643432617, "global_step": 305100, "epoch": 1816} {"train_loss": -11.899741172790527, "global_step": 305101, "epoch": 1816} {"train_loss": -10.120842933654785, "global_step": 305102, "epoch": 1816} {"train_loss": -11.698291778564453, "global_step": 305103, "epoch": 1816} {"train_loss": -10.60086727142334, "global_step": 305104, "epoch": 1816} {"train_loss": -11.649105072021484, "global_step": 305105, "epoch": 1816} {"train_loss": -10.469367027282715, "global_step": 305106, "epoch": 1816} {"train_loss": -11.534396171569824, "global_step": 305107, "epoch": 1816} {"train_loss": -10.814920425415039, "global_step": 305108, "epoch": 1816} {"train_loss": -11.77059268951416, "global_step": 305109, "epoch": 1816} {"train_loss": -10.977924346923828, "global_step": 305110, "epoch": 1816} {"train_loss": -11.437591552734375, "global_step": 305111, "epoch": 1816} {"train_loss": -11.698230743408203, "global_step": 305112, "epoch": 1816} {"train_loss": -11.526848793029785, "global_step": 305113, "epoch": 1816} {"train_loss": -11.368404388427734, "global_step": 305114, "epoch": 1816} {"train_loss": -11.253607749938965, "global_step": 305115, "epoch": 1816} {"train_loss": -11.602361679077148, "global_step": 305116, "epoch": 1816} {"train_loss": -11.727474212646484, "global_step": 305117, "epoch": 1816} {"train_loss": -12.065123558044434, "global_step": 305118, "epoch": 1816} {"train_loss": -11.586167335510254, "global_step": 305119, "epoch": 1816} {"train_loss": -11.800174713134766, "global_step": 305120, "epoch": 1816} {"train_loss": -11.726755142211914, "global_step": 305121, "epoch": 1816} {"train_loss": -11.600179672241211, "global_step": 305122, "epoch": 1816} {"train_loss": -11.786837577819824, "global_step": 305123, "epoch": 1816} {"train_loss": -11.739150047302246, "global_step": 305124, "epoch": 1816} {"train_loss": -11.909646034240723, "global_step": 305125, "epoch": 1816} {"train_loss": -11.758264541625977, "global_step": 305126, "epoch": 1816} {"train_loss": -11.850122451782227, "global_step": 305127, "epoch": 1816} {"train_loss": -11.755300521850586, "global_step": 305128, "epoch": 1816} {"train_loss": -12.09661865234375, "global_step": 305129, "epoch": 1816} {"train_loss": -12.041193008422852, "global_step": 305130, "epoch": 1816} {"train_loss": -12.266153335571289, "global_step": 305131, "epoch": 1816} {"train_loss": -12.216928482055664, "global_step": 305132, "epoch": 1816} {"train_loss": -11.906082153320312, "global_step": 305133, "epoch": 1816} {"train_loss": -12.14437484741211, "global_step": 305134, "epoch": 1816} {"train_loss": -12.129700660705566, "global_step": 305135, "epoch": 1816} {"train_loss": -12.080469131469727, "global_step": 305136, "epoch": 1816} {"train_loss": -12.153839111328125, "global_step": 305137, "epoch": 1816} {"train_loss": -12.185578346252441, "global_step": 305138, "epoch": 1816} {"train_loss": -12.217842102050781, "global_step": 305139, "epoch": 1816} {"train_loss": -11.917863845825195, "global_step": 305140, "epoch": 1816} {"train_loss": -12.382341384887695, "global_step": 305141, "epoch": 1816} {"train_loss": -12.248176574707031, "global_step": 305142, "epoch": 1816} {"train_loss": -12.251060485839844, "global_step": 305143, "epoch": 1816} {"train_loss": -12.011249542236328, "global_step": 305144, "epoch": 1816} {"train_loss": -12.185575485229492, "global_step": 305145, "epoch": 1816} {"train_loss": -12.31201457977295, "global_step": 305146, "epoch": 1816} {"train_loss": -12.228373527526855, "global_step": 305147, "epoch": 1816} {"train_loss": -12.368030548095703, "global_step": 305148, "epoch": 1816} {"train_loss": -12.205523490905762, "global_step": 305149, "epoch": 1816} {"train_loss": -12.362152099609375, "global_step": 305150, "epoch": 1816} {"train_loss": -12.394190788269043, "global_step": 305151, "epoch": 1816} {"train_loss": -12.271605491638184, "global_step": 305152, "epoch": 1816} {"train_loss": -12.451356887817383, "global_step": 305153, "epoch": 1816} {"train_loss": -12.293478012084961, "global_step": 305154, "epoch": 1816} {"train_loss": -12.390829086303711, "global_step": 305155, "epoch": 1816} {"train_loss": -12.367847442626953, "global_step": 305156, "epoch": 1816} {"train_loss": -12.086071014404297, "global_step": 305157, "epoch": 1816} {"train_loss": -12.416394233703613, "global_step": 305158, "epoch": 1816} {"train_loss": -12.424505233764648, "global_step": 305159, "epoch": 1816} {"train_loss": -12.30961799621582, "global_step": 305160, "epoch": 1816} {"train_loss": -12.262683868408203, "global_step": 305161, "epoch": 1816} {"train_loss": -12.336511611938477, "global_step": 305162, "epoch": 1816} {"train_loss": -12.23846435546875, "global_step": 305163, "epoch": 1816} {"train_loss": -12.188478469848633, "global_step": 305164, "epoch": 1816} {"train_loss": -12.449331283569336, "global_step": 305165, "epoch": 1816} {"train_loss": -12.380239486694336, "global_step": 305166, "epoch": 1816} {"train_loss": -12.38772201538086, "global_step": 305167, "epoch": 1816} {"train_loss": -12.485981941223145, "global_step": 305168, "epoch": 1816} {"train_loss": -12.444762229919434, "global_step": 305169, "epoch": 1816} {"train_loss": -12.515811920166016, "global_step": 305170, "epoch": 1816} {"train_loss": -12.532401084899902, "global_step": 305171, "epoch": 1816} {"train_loss": -12.421659469604492, "global_step": 305172, "epoch": 1816} {"train_loss": -12.421711921691895, "global_step": 305173, "epoch": 1816} {"train_loss": -12.537336349487305, "global_step": 305174, "epoch": 1816} {"train_loss": -12.460151672363281, "global_step": 305175, "epoch": 1816} {"train_loss": -12.357519149780273, "global_step": 305176, "epoch": 1816} {"train_loss": -12.134660720825195, "global_step": 305177, "epoch": 1816} {"train_loss": -12.548507690429688, "global_step": 305178, "epoch": 1816} {"train_loss": -12.536336898803711, "global_step": 305179, "epoch": 1816} {"train_loss": -12.642570495605469, "global_step": 305180, "epoch": 1816} {"train_loss": -12.448354721069336, "global_step": 305181, "epoch": 1816} {"train_loss": -12.546219825744629, "global_step": 305182, "epoch": 1816} {"train_loss": -12.436586380004883, "global_step": 305183, "epoch": 1816} {"train_loss": -12.228483200073242, "global_step": 305184, "epoch": 1816} {"train_loss": -12.126561164855957, "global_step": 305185, "epoch": 1816} {"train_loss": -12.411104202270508, "global_step": 305186, "epoch": 1816} {"train_loss": -12.303491592407227, "global_step": 305187, "epoch": 1816} {"train_loss": -12.134122848510742, "global_step": 305188, "epoch": 1816} {"train_loss": -12.357810974121094, "global_step": 305189, "epoch": 1816} {"train_loss": -12.30510425567627, "global_step": 305190, "epoch": 1816} {"train_loss": -12.373344421386719, "global_step": 305191, "epoch": 1816} {"train_loss": -12.65557861328125, "global_step": 305192, "epoch": 1816} {"train_loss": -12.159958839416504, "global_step": 305193, "epoch": 1816} {"train_loss": -12.335262298583984, "global_step": 305194, "epoch": 1816} {"train_loss": -12.27491569519043, "global_step": 305195, "epoch": 1816} {"train_loss": -12.600790023803711, "global_step": 305196, "epoch": 1816} {"train_loss": -12.385749816894531, "global_step": 305197, "epoch": 1816} {"train_loss": -12.616708755493164, "global_step": 305198, "epoch": 1816} {"train_loss": -12.343317985534668, "global_step": 305199, "epoch": 1816} {"train_loss": -12.145090103149414, "global_step": 305200, "epoch": 1816} {"train_loss": -12.422765731811523, "global_step": 305201, "epoch": 1816} {"train_loss": -12.379705429077148, "global_step": 305202, "epoch": 1816} {"train_loss": -12.147945404052734, "global_step": 305203, "epoch": 1816} {"train_loss": -11.93482780456543, "global_step": 305204, "epoch": 1816} {"train_loss": -11.754314422607422, "global_step": 305205, "epoch": 1816} {"train_loss": -12.127094268798828, "global_step": 305206, "epoch": 1816} {"train_loss": -11.97464370727539, "global_step": 305207, "epoch": 1816} {"train_loss": -12.042433738708496, "global_step": 305208, "epoch": 1816} {"train_loss": -12.121805191040039, "global_step": 305209, "epoch": 1816} {"train_loss": -12.28376293182373, "global_step": 305210, "epoch": 1816} {"train_loss": -11.806267738342285, "global_step": 305211, "epoch": 1816} {"train_loss": -12.352602005004883, "global_step": 305212, "epoch": 1816} {"train_loss": -12.478583335876465, "global_step": 305213, "epoch": 1816} {"train_loss": -11.974607467651367, "global_step": 305214, "epoch": 1816} {"train_loss": -12.426558494567871, "global_step": 305215, "epoch": 1816} {"train_loss": -12.29593276977539, "global_step": 305216, "epoch": 1816} {"train_loss": -12.410872459411621, "global_step": 305217, "epoch": 1816} {"train_loss": -12.327568054199219, "global_step": 305218, "epoch": 1816} {"train_loss": -11.731199264526367, "global_step": 305219, "epoch": 1816} {"train_loss": -11.479907035827637, "global_step": 305220, "epoch": 1816} {"train_loss": -12.028637886047363, "global_step": 305221, "epoch": 1816} {"train_loss": -11.22195816040039, "global_step": 305222, "epoch": 1816} {"train_loss": -11.020928382873535, "global_step": 305223, "epoch": 1816} {"train_loss": -11.500557899475098, "global_step": 305224, "epoch": 1816} {"train_loss": -10.747337341308594, "global_step": 305225, "epoch": 1816} {"train_loss": -10.498973846435547, "global_step": 305226, "epoch": 1816} {"train_loss": -10.747207641601562, "global_step": 305227, "epoch": 1816} {"train_loss": -11.960928916931152, "global_step": 305228, "epoch": 1816} {"train_loss": -11.472631454467773, "global_step": 305229, "epoch": 1816} {"train_loss": -11.599784851074219, "global_step": 305230, "epoch": 1816} {"train_loss": -11.718963623046875, "global_step": 305231, "epoch": 1816} {"train_loss": -11.321907043457031, "global_step": 305232, "epoch": 1816} {"train_loss": -11.167351722717285, "global_step": 305233, "epoch": 1816} {"train_loss": -11.202534675598145, "global_step": 305234, "epoch": 1816} {"train_loss": -10.876370429992676, "global_step": 305235, "epoch": 1816} {"train_loss": -9.45115852355957, "global_step": 305236, "epoch": 1816} {"train_loss": -11.09253215789795, "global_step": 305237, "epoch": 1816} {"train_loss": -11.601107597351074, "global_step": 305238, "epoch": 1816} {"train_loss": -9.315389633178711, "global_step": 305239, "epoch": 1816} {"train_loss": -11.842905044555664, "global_step": 305240, "epoch": 1816} {"train_loss": -10.277448654174805, "global_step": 305241, "epoch": 1816} {"train_loss": -9.655527114868164, "global_step": 305242, "epoch": 1816} {"train_loss": -11.653289794921875, "global_step": 305243, "epoch": 1816} {"train_loss": -9.932098388671875, "global_step": 305244, "epoch": 1816} {"train_loss": -11.485918045043945, "global_step": 305245, "epoch": 1816} {"train_loss": -11.53001594543457, "global_step": 305246, "epoch": 1816} {"train_loss": -11.197649002075195, "global_step": 305247, "epoch": 1816} {"train_loss": -11.78895092010498, "global_step": 305248, "epoch": 1816} {"train_loss": -11.100374221801758, "global_step": 305249, "epoch": 1816} {"train_loss": -11.086713790893555, "global_step": 305250, "epoch": 1816} {"train_loss": -11.403253555297852, "global_step": 305251, "epoch": 1816} {"train_loss": -10.748589515686035, "global_step": 305252, "epoch": 1816} {"train_loss": -11.190813064575195, "global_step": 305253, "epoch": 1816} {"train_loss": -10.629194259643555, "global_step": 305254, "epoch": 1816} {"train_loss": -11.756212018785023, "global_step": 305255, "epoch": 1816, "val_loss": 274536.59375} {"train_loss": -10.307319641113281, "global_step": 305256, "epoch": 1817} {"train_loss": -11.612899780273438, "global_step": 305257, "epoch": 1817} {"train_loss": -10.61170768737793, "global_step": 305258, "epoch": 1817} {"train_loss": -10.878691673278809, "global_step": 305259, "epoch": 1817} {"train_loss": -11.087091445922852, "global_step": 305260, "epoch": 1817} {"train_loss": -10.993368148803711, "global_step": 305261, "epoch": 1817} {"train_loss": -11.602202415466309, "global_step": 305262, "epoch": 1817} {"train_loss": -11.000932693481445, "global_step": 305263, "epoch": 1817} {"train_loss": -11.790054321289062, "global_step": 305264, "epoch": 1817} {"train_loss": -10.60415267944336, "global_step": 305265, "epoch": 1817} {"train_loss": -11.516266822814941, "global_step": 305266, "epoch": 1817} {"train_loss": -10.352373123168945, "global_step": 305267, "epoch": 1817} {"train_loss": -11.980184555053711, "global_step": 305268, "epoch": 1817} {"train_loss": -10.765467643737793, "global_step": 305269, "epoch": 1817} {"train_loss": -11.658150672912598, "global_step": 305270, "epoch": 1817} {"train_loss": -11.34620475769043, "global_step": 305271, "epoch": 1817} {"train_loss": -11.710882186889648, "global_step": 305272, "epoch": 1817} {"train_loss": -11.621847152709961, "global_step": 305273, "epoch": 1817} {"train_loss": -11.637871742248535, "global_step": 305274, "epoch": 1817} {"train_loss": -11.55968952178955, "global_step": 305275, "epoch": 1817} {"train_loss": -11.100635528564453, "global_step": 305276, "epoch": 1817} {"train_loss": -11.690824508666992, "global_step": 305277, "epoch": 1817} {"train_loss": -11.927385330200195, "global_step": 305278, "epoch": 1817} {"train_loss": -11.237822532653809, "global_step": 305279, "epoch": 1817} {"train_loss": -11.819072723388672, "global_step": 305280, "epoch": 1817} {"train_loss": -11.482794761657715, "global_step": 305281, "epoch": 1817} {"train_loss": -11.500919342041016, "global_step": 305282, "epoch": 1817} {"train_loss": -11.905084609985352, "global_step": 305283, "epoch": 1817} {"train_loss": -11.858687400817871, "global_step": 305284, "epoch": 1817} {"train_loss": -11.776128768920898, "global_step": 305285, "epoch": 1817} {"train_loss": -11.971325874328613, "global_step": 305286, "epoch": 1817} {"train_loss": -11.845117568969727, "global_step": 305287, "epoch": 1817} {"train_loss": -11.91943645477295, "global_step": 305288, "epoch": 1817} {"train_loss": -11.920934677124023, "global_step": 305289, "epoch": 1817} {"train_loss": -11.87476921081543, "global_step": 305290, "epoch": 1817} {"train_loss": -11.93025016784668, "global_step": 305291, "epoch": 1817} {"train_loss": -11.913057327270508, "global_step": 305292, "epoch": 1817} {"train_loss": -11.921679496765137, "global_step": 305293, "epoch": 1817} {"train_loss": -11.984807014465332, "global_step": 305294, "epoch": 1817} {"train_loss": -11.943145751953125, "global_step": 305295, "epoch": 1817} {"train_loss": -12.027666091918945, "global_step": 305296, "epoch": 1817} {"train_loss": -12.14219856262207, "global_step": 305297, "epoch": 1817} {"train_loss": -12.022598266601562, "global_step": 305298, "epoch": 1817} {"train_loss": -12.252973556518555, "global_step": 305299, "epoch": 1817} {"train_loss": -12.243672370910645, "global_step": 305300, "epoch": 1817} {"train_loss": -11.793209075927734, "global_step": 305301, "epoch": 1817} {"train_loss": -12.04772663116455, "global_step": 305302, "epoch": 1817} {"train_loss": -12.139687538146973, "global_step": 305303, "epoch": 1817} {"train_loss": -12.115999221801758, "global_step": 305304, "epoch": 1817} {"train_loss": -12.199990272521973, "global_step": 305305, "epoch": 1817} {"train_loss": -12.295653343200684, "global_step": 305306, "epoch": 1817} {"train_loss": -12.174354553222656, "global_step": 305307, "epoch": 1817} {"train_loss": -12.24671459197998, "global_step": 305308, "epoch": 1817} {"train_loss": -12.236881256103516, "global_step": 305309, "epoch": 1817} {"train_loss": -12.217573165893555, "global_step": 305310, "epoch": 1817} {"train_loss": -12.249940872192383, "global_step": 305311, "epoch": 1817} {"train_loss": -12.158415794372559, "global_step": 305312, "epoch": 1817} {"train_loss": -12.289693832397461, "global_step": 305313, "epoch": 1817} {"train_loss": -12.46449089050293, "global_step": 305314, "epoch": 1817} {"train_loss": -12.278820037841797, "global_step": 305315, "epoch": 1817} {"train_loss": -12.322354316711426, "global_step": 305316, "epoch": 1817} {"train_loss": -12.451606750488281, "global_step": 305317, "epoch": 1817} {"train_loss": -12.487039566040039, "global_step": 305318, "epoch": 1817} {"train_loss": -12.491719245910645, "global_step": 305319, "epoch": 1817} {"train_loss": -12.418281555175781, "global_step": 305320, "epoch": 1817} {"train_loss": -12.168231010437012, "global_step": 305321, "epoch": 1817} {"train_loss": -12.471870422363281, "global_step": 305322, "epoch": 1817} {"train_loss": -12.385027885437012, "global_step": 305323, "epoch": 1817} {"train_loss": -12.480901718139648, "global_step": 305324, "epoch": 1817} {"train_loss": -12.425896644592285, "global_step": 305325, "epoch": 1817} {"train_loss": -12.450037002563477, "global_step": 305326, "epoch": 1817} {"train_loss": -12.440071105957031, "global_step": 305327, "epoch": 1817} {"train_loss": -12.489916801452637, "global_step": 305328, "epoch": 1817} {"train_loss": -12.195047378540039, "global_step": 305329, "epoch": 1817} {"train_loss": -12.590948104858398, "global_step": 305330, "epoch": 1817} {"train_loss": -12.46649169921875, "global_step": 305331, "epoch": 1817} {"train_loss": -12.423412322998047, "global_step": 305332, "epoch": 1817} {"train_loss": -12.423718452453613, "global_step": 305333, "epoch": 1817} {"train_loss": -12.104164123535156, "global_step": 305334, "epoch": 1817} {"train_loss": -12.367451667785645, "global_step": 305335, "epoch": 1817} {"train_loss": -12.40992546081543, "global_step": 305336, "epoch": 1817} {"train_loss": -12.291515350341797, "global_step": 305337, "epoch": 1817} {"train_loss": -12.49189567565918, "global_step": 305338, "epoch": 1817} {"train_loss": -12.224691390991211, "global_step": 305339, "epoch": 1817} {"train_loss": -12.479816436767578, "global_step": 305340, "epoch": 1817} {"train_loss": -12.389020919799805, "global_step": 305341, "epoch": 1817} {"train_loss": -11.897275924682617, "global_step": 305342, "epoch": 1817} {"train_loss": -12.069141387939453, "global_step": 305343, "epoch": 1817} {"train_loss": -12.348114013671875, "global_step": 305344, "epoch": 1817} {"train_loss": -11.97259521484375, "global_step": 305345, "epoch": 1817} {"train_loss": -12.068901062011719, "global_step": 305346, "epoch": 1817} {"train_loss": -12.434730529785156, "global_step": 305347, "epoch": 1817} {"train_loss": -12.330802917480469, "global_step": 305348, "epoch": 1817} {"train_loss": -12.408334732055664, "global_step": 305349, "epoch": 1817} {"train_loss": -12.467484474182129, "global_step": 305350, "epoch": 1817} {"train_loss": -12.24354076385498, "global_step": 305351, "epoch": 1817} {"train_loss": -11.766166687011719, "global_step": 305352, "epoch": 1817} {"train_loss": -12.027235984802246, "global_step": 305353, "epoch": 1817} {"train_loss": -12.294692039489746, "global_step": 305354, "epoch": 1817} {"train_loss": -12.150178909301758, "global_step": 305355, "epoch": 1817} {"train_loss": -11.260303497314453, "global_step": 305356, "epoch": 1817} {"train_loss": -11.117181777954102, "global_step": 305357, "epoch": 1817} {"train_loss": -11.953052520751953, "global_step": 305358, "epoch": 1817} {"train_loss": -10.131987571716309, "global_step": 305359, "epoch": 1817} {"train_loss": -11.218047142028809, "global_step": 305360, "epoch": 1817} {"train_loss": -9.362552642822266, "global_step": 305361, "epoch": 1817} {"train_loss": -10.390474319458008, "global_step": 305362, "epoch": 1817} {"train_loss": -10.808073043823242, "global_step": 305363, "epoch": 1817} {"train_loss": -11.2001953125, "global_step": 305364, "epoch": 1817} {"train_loss": -11.087440490722656, "global_step": 305365, "epoch": 1817} {"train_loss": -10.794651985168457, "global_step": 305366, "epoch": 1817} {"train_loss": -11.274320602416992, "global_step": 305367, "epoch": 1817} {"train_loss": -10.7861328125, "global_step": 305368, "epoch": 1817} {"train_loss": -11.60757064819336, "global_step": 305369, "epoch": 1817} {"train_loss": -11.20322322845459, "global_step": 305370, "epoch": 1817} {"train_loss": -11.780323028564453, "global_step": 305371, "epoch": 1817} {"train_loss": -11.487449645996094, "global_step": 305372, "epoch": 1817} {"train_loss": -11.864217758178711, "global_step": 305373, "epoch": 1817} {"train_loss": -11.703425407409668, "global_step": 305374, "epoch": 1817} {"train_loss": -11.65385627746582, "global_step": 305375, "epoch": 1817} {"train_loss": -11.97851276397705, "global_step": 305376, "epoch": 1817} {"train_loss": -11.70331859588623, "global_step": 305377, "epoch": 1817} {"train_loss": -11.755694389343262, "global_step": 305378, "epoch": 1817} {"train_loss": -11.948528289794922, "global_step": 305379, "epoch": 1817} {"train_loss": -11.854623794555664, "global_step": 305380, "epoch": 1817} {"train_loss": -11.397953033447266, "global_step": 305381, "epoch": 1817} {"train_loss": -11.451193809509277, "global_step": 305382, "epoch": 1817} {"train_loss": -10.911964416503906, "global_step": 305383, "epoch": 1817} {"train_loss": -11.901461601257324, "global_step": 305384, "epoch": 1817} {"train_loss": -11.819931030273438, "global_step": 305385, "epoch": 1817} {"train_loss": -11.780403137207031, "global_step": 305386, "epoch": 1817} {"train_loss": -11.930828094482422, "global_step": 305387, "epoch": 1817} {"train_loss": -11.766079902648926, "global_step": 305388, "epoch": 1817} {"train_loss": -11.766084671020508, "global_step": 305389, "epoch": 1817} {"train_loss": -11.36233901977539, "global_step": 305390, "epoch": 1817} {"train_loss": -11.869832992553711, "global_step": 305391, "epoch": 1817} {"train_loss": -11.382251739501953, "global_step": 305392, "epoch": 1817} {"train_loss": -11.414199829101562, "global_step": 305393, "epoch": 1817} {"train_loss": -11.523527145385742, "global_step": 305394, "epoch": 1817} {"train_loss": -11.707085609436035, "global_step": 305395, "epoch": 1817} {"train_loss": -12.244661331176758, "global_step": 305396, "epoch": 1817} {"train_loss": -11.353361129760742, "global_step": 305397, "epoch": 1817} {"train_loss": -11.406506538391113, "global_step": 305398, "epoch": 1817} {"train_loss": -11.626062393188477, "global_step": 305399, "epoch": 1817} {"train_loss": -11.699235916137695, "global_step": 305400, "epoch": 1817} {"train_loss": -11.67841625213623, "global_step": 305401, "epoch": 1817} {"train_loss": -11.869878768920898, "global_step": 305402, "epoch": 1817} {"train_loss": -11.986637115478516, "global_step": 305403, "epoch": 1817} {"train_loss": -11.822056770324707, "global_step": 305404, "epoch": 1817} {"train_loss": -11.923360824584961, "global_step": 305405, "epoch": 1817} {"train_loss": -11.762835502624512, "global_step": 305406, "epoch": 1817} {"train_loss": -12.20240592956543, "global_step": 305407, "epoch": 1817} {"train_loss": -11.785627365112305, "global_step": 305408, "epoch": 1817} {"train_loss": -12.189444541931152, "global_step": 305409, "epoch": 1817} {"train_loss": -11.834352493286133, "global_step": 305410, "epoch": 1817} {"train_loss": -12.356470108032227, "global_step": 305411, "epoch": 1817} {"train_loss": -12.103818893432617, "global_step": 305412, "epoch": 1817} {"train_loss": -12.239450454711914, "global_step": 305413, "epoch": 1817} {"train_loss": -12.06326961517334, "global_step": 305414, "epoch": 1817} {"train_loss": -12.218210220336914, "global_step": 305415, "epoch": 1817} {"train_loss": -12.185944557189941, "global_step": 305416, "epoch": 1817} {"train_loss": -12.048398971557617, "global_step": 305417, "epoch": 1817} {"train_loss": -12.299081802368164, "global_step": 305418, "epoch": 1817} {"train_loss": -12.270172119140625, "global_step": 305419, "epoch": 1817} {"train_loss": -12.258880615234375, "global_step": 305420, "epoch": 1817} {"train_loss": -12.467580795288086, "global_step": 305421, "epoch": 1817} {"train_loss": -12.283703804016113, "global_step": 305422, "epoch": 1817} {"train_loss": -11.837923901421684, "global_step": 305423, "epoch": 1817, "val_loss": 278772.65625} {"train_loss": -12.184020042419434, "global_step": 305424, "epoch": 1818} {"train_loss": -12.250530242919922, "global_step": 305425, "epoch": 1818} {"train_loss": -12.284122467041016, "global_step": 305426, "epoch": 1818} {"train_loss": -11.821096420288086, "global_step": 305427, "epoch": 1818} {"train_loss": -11.370842933654785, "global_step": 305428, "epoch": 1818} {"train_loss": -12.453182220458984, "global_step": 305429, "epoch": 1818} {"train_loss": -11.345388412475586, "global_step": 305430, "epoch": 1818} {"train_loss": -10.410433769226074, "global_step": 305431, "epoch": 1818} {"train_loss": -11.110870361328125, "global_step": 305432, "epoch": 1818} {"train_loss": -10.29206371307373, "global_step": 305433, "epoch": 1818} {"train_loss": -10.42015552520752, "global_step": 305434, "epoch": 1818} {"train_loss": -10.284110069274902, "global_step": 305435, "epoch": 1818} {"train_loss": -9.19503402709961, "global_step": 305436, "epoch": 1818} {"train_loss": -11.523329734802246, "global_step": 305437, "epoch": 1818} {"train_loss": -9.283121109008789, "global_step": 305438, "epoch": 1818} {"train_loss": -12.084153175354004, "global_step": 305439, "epoch": 1818} {"train_loss": -10.3889799118042, "global_step": 305440, "epoch": 1818} {"train_loss": -11.265154838562012, "global_step": 305441, "epoch": 1818} {"train_loss": -10.132365226745605, "global_step": 305442, "epoch": 1818} {"train_loss": -10.445406913757324, "global_step": 305443, "epoch": 1818} {"train_loss": -11.682441711425781, "global_step": 305444, "epoch": 1818} {"train_loss": -9.404501914978027, "global_step": 305445, "epoch": 1818} {"train_loss": -11.786568641662598, "global_step": 305446, "epoch": 1818} {"train_loss": -10.999345779418945, "global_step": 305447, "epoch": 1818} {"train_loss": -11.308197021484375, "global_step": 305448, "epoch": 1818} {"train_loss": -11.61371898651123, "global_step": 305449, "epoch": 1818} {"train_loss": -11.379463195800781, "global_step": 305450, "epoch": 1818} {"train_loss": -11.855720520019531, "global_step": 305451, "epoch": 1818} {"train_loss": -11.32473087310791, "global_step": 305452, "epoch": 1818} {"train_loss": -11.759799003601074, "global_step": 305453, "epoch": 1818} {"train_loss": -11.082417488098145, "global_step": 305454, "epoch": 1818} {"train_loss": -12.024818420410156, "global_step": 305455, "epoch": 1818} {"train_loss": -11.2774076461792, "global_step": 305456, "epoch": 1818} {"train_loss": -11.65312385559082, "global_step": 305457, "epoch": 1818} {"train_loss": -11.539632797241211, "global_step": 305458, "epoch": 1818} {"train_loss": -11.8472900390625, "global_step": 305459, "epoch": 1818} {"train_loss": -11.503349304199219, "global_step": 305460, "epoch": 1818} {"train_loss": -11.69696044921875, "global_step": 305461, "epoch": 1818} {"train_loss": -11.486701965332031, "global_step": 305462, "epoch": 1818} {"train_loss": -11.957620620727539, "global_step": 305463, "epoch": 1818} {"train_loss": -11.602128982543945, "global_step": 305464, "epoch": 1818} {"train_loss": -11.817789077758789, "global_step": 305465, "epoch": 1818} {"train_loss": -11.788145065307617, "global_step": 305466, "epoch": 1818} {"train_loss": -11.634452819824219, "global_step": 305467, "epoch": 1818} {"train_loss": -12.095582962036133, "global_step": 305468, "epoch": 1818} {"train_loss": -11.812816619873047, "global_step": 305469, "epoch": 1818} {"train_loss": -11.902807235717773, "global_step": 305470, "epoch": 1818} {"train_loss": -11.870262145996094, "global_step": 305471, "epoch": 1818} {"train_loss": -11.78024673461914, "global_step": 305472, "epoch": 1818} {"train_loss": -12.00718879699707, "global_step": 305473, "epoch": 1818} {"train_loss": -11.490734100341797, "global_step": 305474, "epoch": 1818} {"train_loss": -11.58082103729248, "global_step": 305475, "epoch": 1818} {"train_loss": -11.729252815246582, "global_step": 305476, "epoch": 1818} {"train_loss": -11.74057674407959, "global_step": 305477, "epoch": 1818} {"train_loss": -12.06096363067627, "global_step": 305478, "epoch": 1818} {"train_loss": -11.952627182006836, "global_step": 305479, "epoch": 1818} {"train_loss": -11.97462272644043, "global_step": 305480, "epoch": 1818} {"train_loss": -11.871904373168945, "global_step": 305481, "epoch": 1818} {"train_loss": -12.01848316192627, "global_step": 305482, "epoch": 1818} {"train_loss": -12.02995491027832, "global_step": 305483, "epoch": 1818} {"train_loss": -11.690996170043945, "global_step": 305484, "epoch": 1818} {"train_loss": -12.048297882080078, "global_step": 305485, "epoch": 1818} {"train_loss": -12.109834671020508, "global_step": 305486, "epoch": 1818} {"train_loss": -12.086320877075195, "global_step": 305487, "epoch": 1818} {"train_loss": -11.826164245605469, "global_step": 305488, "epoch": 1818} {"train_loss": -12.165390014648438, "global_step": 305489, "epoch": 1818} {"train_loss": -11.912660598754883, "global_step": 305490, "epoch": 1818} {"train_loss": -12.214073181152344, "global_step": 305491, "epoch": 1818} {"train_loss": -12.007630348205566, "global_step": 305492, "epoch": 1818} {"train_loss": -12.398271560668945, "global_step": 305493, "epoch": 1818} {"train_loss": -11.991903305053711, "global_step": 305494, "epoch": 1818} {"train_loss": -12.195558547973633, "global_step": 305495, "epoch": 1818} {"train_loss": -12.150646209716797, "global_step": 305496, "epoch": 1818} {"train_loss": -12.318523406982422, "global_step": 305497, "epoch": 1818} {"train_loss": -12.110762596130371, "global_step": 305498, "epoch": 1818} {"train_loss": -12.047197341918945, "global_step": 305499, "epoch": 1818} {"train_loss": -12.087143898010254, "global_step": 305500, "epoch": 1818} {"train_loss": -12.24676513671875, "global_step": 305501, "epoch": 1818} {"train_loss": -12.304848670959473, "global_step": 305502, "epoch": 1818} {"train_loss": -12.35774040222168, "global_step": 305503, "epoch": 1818} {"train_loss": -12.108991622924805, "global_step": 305504, "epoch": 1818} {"train_loss": -12.042990684509277, "global_step": 305505, "epoch": 1818} {"train_loss": -12.330167770385742, "global_step": 305506, "epoch": 1818} {"train_loss": -11.866409301757812, "global_step": 305507, "epoch": 1818} {"train_loss": -12.235857009887695, "global_step": 305508, "epoch": 1818} {"train_loss": -12.111167907714844, "global_step": 305509, "epoch": 1818} {"train_loss": -12.325143814086914, "global_step": 305510, "epoch": 1818} {"train_loss": -12.285446166992188, "global_step": 305511, "epoch": 1818} {"train_loss": -12.40044116973877, "global_step": 305512, "epoch": 1818} {"train_loss": -12.122870445251465, "global_step": 305513, "epoch": 1818} {"train_loss": -12.471975326538086, "global_step": 305514, "epoch": 1818} {"train_loss": -12.258379936218262, "global_step": 305515, "epoch": 1818} {"train_loss": -12.399262428283691, "global_step": 305516, "epoch": 1818} {"train_loss": -12.046693801879883, "global_step": 305517, "epoch": 1818} {"train_loss": -12.127344131469727, "global_step": 305518, "epoch": 1818} {"train_loss": -12.034931182861328, "global_step": 305519, "epoch": 1818} {"train_loss": -11.970623016357422, "global_step": 305520, "epoch": 1818} {"train_loss": -12.114572525024414, "global_step": 305521, "epoch": 1818} {"train_loss": -12.087369918823242, "global_step": 305522, "epoch": 1818} {"train_loss": -12.167757987976074, "global_step": 305523, "epoch": 1818} {"train_loss": -12.078781127929688, "global_step": 305524, "epoch": 1818} {"train_loss": -12.105947494506836, "global_step": 305525, "epoch": 1818} {"train_loss": -12.06058120727539, "global_step": 305526, "epoch": 1818} {"train_loss": -12.317377090454102, "global_step": 305527, "epoch": 1818} {"train_loss": -12.519163131713867, "global_step": 305528, "epoch": 1818} {"train_loss": -12.334564208984375, "global_step": 305529, "epoch": 1818} {"train_loss": -12.284707069396973, "global_step": 305530, "epoch": 1818} {"train_loss": -12.250139236450195, "global_step": 305531, "epoch": 1818} {"train_loss": -12.274627685546875, "global_step": 305532, "epoch": 1818} {"train_loss": -12.238637924194336, "global_step": 305533, "epoch": 1818} {"train_loss": -12.486474990844727, "global_step": 305534, "epoch": 1818} {"train_loss": -12.52380657196045, "global_step": 305535, "epoch": 1818} {"train_loss": -12.272758483886719, "global_step": 305536, "epoch": 1818} {"train_loss": -12.414603233337402, "global_step": 305537, "epoch": 1818} {"train_loss": -12.51010799407959, "global_step": 305538, "epoch": 1818} {"train_loss": -12.37028694152832, "global_step": 305539, "epoch": 1818} {"train_loss": -12.505704879760742, "global_step": 305540, "epoch": 1818} {"train_loss": -12.585445404052734, "global_step": 305541, "epoch": 1818} {"train_loss": -12.531898498535156, "global_step": 305542, "epoch": 1818} {"train_loss": -12.515460968017578, "global_step": 305543, "epoch": 1818} {"train_loss": -12.348755836486816, "global_step": 305544, "epoch": 1818} {"train_loss": -12.573554039001465, "global_step": 305545, "epoch": 1818} {"train_loss": -12.277280807495117, "global_step": 305546, "epoch": 1818} {"train_loss": -12.098888397216797, "global_step": 305547, "epoch": 1818} {"train_loss": -12.13111686706543, "global_step": 305548, "epoch": 1818} {"train_loss": -11.770214080810547, "global_step": 305549, "epoch": 1818} {"train_loss": -11.952043533325195, "global_step": 305550, "epoch": 1818} {"train_loss": -11.661843299865723, "global_step": 305551, "epoch": 1818} {"train_loss": -11.980552673339844, "global_step": 305552, "epoch": 1818} {"train_loss": -11.894402503967285, "global_step": 305553, "epoch": 1818} {"train_loss": -11.955867767333984, "global_step": 305554, "epoch": 1818} {"train_loss": -10.682692527770996, "global_step": 305555, "epoch": 1818} {"train_loss": -10.561795234680176, "global_step": 305556, "epoch": 1818} {"train_loss": -11.494731903076172, "global_step": 305557, "epoch": 1818} {"train_loss": -11.58804988861084, "global_step": 305558, "epoch": 1818} {"train_loss": -10.071603775024414, "global_step": 305559, "epoch": 1818} {"train_loss": -11.706462860107422, "global_step": 305560, "epoch": 1818} {"train_loss": -10.90733814239502, "global_step": 305561, "epoch": 1818} {"train_loss": -11.675836563110352, "global_step": 305562, "epoch": 1818} {"train_loss": -11.140690803527832, "global_step": 305563, "epoch": 1818} {"train_loss": -11.31878662109375, "global_step": 305564, "epoch": 1818} {"train_loss": -11.591554641723633, "global_step": 305565, "epoch": 1818} {"train_loss": -11.524645805358887, "global_step": 305566, "epoch": 1818} {"train_loss": -11.731616020202637, "global_step": 305567, "epoch": 1818} {"train_loss": -11.0301513671875, "global_step": 305568, "epoch": 1818} {"train_loss": -11.447715759277344, "global_step": 305569, "epoch": 1818} {"train_loss": -10.643842697143555, "global_step": 305570, "epoch": 1818} {"train_loss": -11.726387023925781, "global_step": 305571, "epoch": 1818} {"train_loss": -10.86617374420166, "global_step": 305572, "epoch": 1818} {"train_loss": -11.620965957641602, "global_step": 305573, "epoch": 1818} {"train_loss": -11.339019775390625, "global_step": 305574, "epoch": 1818} {"train_loss": -11.393468856811523, "global_step": 305575, "epoch": 1818} {"train_loss": -11.857398986816406, "global_step": 305576, "epoch": 1818} {"train_loss": -11.234813690185547, "global_step": 305577, "epoch": 1818} {"train_loss": -12.303348541259766, "global_step": 305578, "epoch": 1818} {"train_loss": -11.113582611083984, "global_step": 305579, "epoch": 1818} {"train_loss": -11.977766036987305, "global_step": 305580, "epoch": 1818} {"train_loss": -11.6976318359375, "global_step": 305581, "epoch": 1818} {"train_loss": -11.735757827758789, "global_step": 305582, "epoch": 1818} {"train_loss": -11.770780563354492, "global_step": 305583, "epoch": 1818} {"train_loss": -11.334162712097168, "global_step": 305584, "epoch": 1818} {"train_loss": -12.097803115844727, "global_step": 305585, "epoch": 1818} {"train_loss": -11.736885070800781, "global_step": 305586, "epoch": 1818} {"train_loss": -12.134037017822266, "global_step": 305587, "epoch": 1818} {"train_loss": -11.56608772277832, "global_step": 305588, "epoch": 1818} {"train_loss": -12.018613815307617, "global_step": 305589, "epoch": 1818} {"train_loss": -12.108257293701172, "global_step": 305590, "epoch": 1818} {"train_loss": -11.765535036722818, "global_step": 305591, "epoch": 1818, "val_loss": 278812.84375} {"train_loss": -11.782394409179688, "global_step": 305592, "epoch": 1819} {"train_loss": -12.039692878723145, "global_step": 305593, "epoch": 1819} {"train_loss": -11.743614196777344, "global_step": 305594, "epoch": 1819} {"train_loss": -11.828149795532227, "global_step": 305595, "epoch": 1819} {"train_loss": -11.515682220458984, "global_step": 305596, "epoch": 1819} {"train_loss": -12.058000564575195, "global_step": 305597, "epoch": 1819} {"train_loss": -11.679945945739746, "global_step": 305598, "epoch": 1819} {"train_loss": -12.15190601348877, "global_step": 305599, "epoch": 1819} {"train_loss": -11.588178634643555, "global_step": 305600, "epoch": 1819} {"train_loss": -12.10877799987793, "global_step": 305601, "epoch": 1819} {"train_loss": -11.671646118164062, "global_step": 305602, "epoch": 1819} {"train_loss": -12.24424934387207, "global_step": 305603, "epoch": 1819} {"train_loss": -11.699451446533203, "global_step": 305604, "epoch": 1819} {"train_loss": -11.81352424621582, "global_step": 305605, "epoch": 1819} {"train_loss": -11.881528854370117, "global_step": 305606, "epoch": 1819} {"train_loss": -12.056486129760742, "global_step": 305607, "epoch": 1819} {"train_loss": -12.054673194885254, "global_step": 305608, "epoch": 1819} {"train_loss": -12.018774032592773, "global_step": 305609, "epoch": 1819} {"train_loss": -11.636899948120117, "global_step": 305610, "epoch": 1819} {"train_loss": -11.84799575805664, "global_step": 305611, "epoch": 1819} {"train_loss": -11.760812759399414, "global_step": 305612, "epoch": 1819} {"train_loss": -11.963607788085938, "global_step": 305613, "epoch": 1819} {"train_loss": -12.038639068603516, "global_step": 305614, "epoch": 1819} {"train_loss": -12.124236106872559, "global_step": 305615, "epoch": 1819} {"train_loss": -12.118572235107422, "global_step": 305616, "epoch": 1819} {"train_loss": -11.993354797363281, "global_step": 305617, "epoch": 1819} {"train_loss": -12.030440330505371, "global_step": 305618, "epoch": 1819} {"train_loss": -11.943391799926758, "global_step": 305619, "epoch": 1819} {"train_loss": -12.041282653808594, "global_step": 305620, "epoch": 1819} {"train_loss": -12.336156845092773, "global_step": 305621, "epoch": 1819} {"train_loss": -11.926236152648926, "global_step": 305622, "epoch": 1819} {"train_loss": -11.853740692138672, "global_step": 305623, "epoch": 1819} {"train_loss": -12.394947052001953, "global_step": 305624, "epoch": 1819} {"train_loss": -11.856377601623535, "global_step": 305625, "epoch": 1819} {"train_loss": -12.450296401977539, "global_step": 305626, "epoch": 1819} {"train_loss": -12.183024406433105, "global_step": 305627, "epoch": 1819} {"train_loss": -12.144858360290527, "global_step": 305628, "epoch": 1819} {"train_loss": -11.901887893676758, "global_step": 305629, "epoch": 1819} {"train_loss": -12.34840202331543, "global_step": 305630, "epoch": 1819} {"train_loss": -12.228055953979492, "global_step": 305631, "epoch": 1819} {"train_loss": -11.9747953414917, "global_step": 305632, "epoch": 1819} {"train_loss": -12.225861549377441, "global_step": 305633, "epoch": 1819} {"train_loss": -12.027822494506836, "global_step": 305634, "epoch": 1819} {"train_loss": -12.040603637695312, "global_step": 305635, "epoch": 1819} {"train_loss": -12.317819595336914, "global_step": 305636, "epoch": 1819} {"train_loss": -11.461634635925293, "global_step": 305637, "epoch": 1819} {"train_loss": -11.574483871459961, "global_step": 305638, "epoch": 1819} {"train_loss": -11.977286338806152, "global_step": 305639, "epoch": 1819} {"train_loss": -11.853999137878418, "global_step": 305640, "epoch": 1819} {"train_loss": -11.291570663452148, "global_step": 305641, "epoch": 1819} {"train_loss": -11.67677116394043, "global_step": 305642, "epoch": 1819} {"train_loss": -12.16464614868164, "global_step": 305643, "epoch": 1819} {"train_loss": -11.194186210632324, "global_step": 305644, "epoch": 1819} {"train_loss": -11.488985061645508, "global_step": 305645, "epoch": 1819} {"train_loss": -11.653816223144531, "global_step": 305646, "epoch": 1819} {"train_loss": -11.675512313842773, "global_step": 305647, "epoch": 1819} {"train_loss": -12.336758613586426, "global_step": 305648, "epoch": 1819} {"train_loss": -11.98891830444336, "global_step": 305649, "epoch": 1819} {"train_loss": -12.010873794555664, "global_step": 305650, "epoch": 1819} {"train_loss": -12.358753204345703, "global_step": 305651, "epoch": 1819} {"train_loss": -12.314739227294922, "global_step": 305652, "epoch": 1819} {"train_loss": -12.226272583007812, "global_step": 305653, "epoch": 1819} {"train_loss": -12.346635818481445, "global_step": 305654, "epoch": 1819} {"train_loss": -12.23617935180664, "global_step": 305655, "epoch": 1819} {"train_loss": -12.391290664672852, "global_step": 305656, "epoch": 1819} {"train_loss": -12.073418617248535, "global_step": 305657, "epoch": 1819} {"train_loss": -12.31915283203125, "global_step": 305658, "epoch": 1819} {"train_loss": -12.103191375732422, "global_step": 305659, "epoch": 1819} {"train_loss": -12.652877807617188, "global_step": 305660, "epoch": 1819} {"train_loss": -12.252264976501465, "global_step": 305661, "epoch": 1819} {"train_loss": -12.237065315246582, "global_step": 305662, "epoch": 1819} {"train_loss": -12.027557373046875, "global_step": 305663, "epoch": 1819} {"train_loss": -12.327342987060547, "global_step": 305664, "epoch": 1819} {"train_loss": -12.08288860321045, "global_step": 305665, "epoch": 1819} {"train_loss": -12.235750198364258, "global_step": 305666, "epoch": 1819} {"train_loss": -12.339370727539062, "global_step": 305667, "epoch": 1819} {"train_loss": -12.248977661132812, "global_step": 305668, "epoch": 1819} {"train_loss": -12.318135261535645, "global_step": 305669, "epoch": 1819} {"train_loss": -12.214666366577148, "global_step": 305670, "epoch": 1819} {"train_loss": -12.346940994262695, "global_step": 305671, "epoch": 1819} {"train_loss": -11.91595458984375, "global_step": 305672, "epoch": 1819} {"train_loss": -11.68968391418457, "global_step": 305673, "epoch": 1819} {"train_loss": -12.086637496948242, "global_step": 305674, "epoch": 1819} {"train_loss": -12.259126663208008, "global_step": 305675, "epoch": 1819} {"train_loss": -12.005130767822266, "global_step": 305676, "epoch": 1819} {"train_loss": -12.344446182250977, "global_step": 305677, "epoch": 1819} {"train_loss": -11.996992111206055, "global_step": 305678, "epoch": 1819} {"train_loss": -12.250746726989746, "global_step": 305679, "epoch": 1819} {"train_loss": -11.617517471313477, "global_step": 305680, "epoch": 1819} {"train_loss": -12.382301330566406, "global_step": 305681, "epoch": 1819} {"train_loss": -12.15999984741211, "global_step": 305682, "epoch": 1819} {"train_loss": -12.065879821777344, "global_step": 305683, "epoch": 1819} {"train_loss": -12.134527206420898, "global_step": 305684, "epoch": 1819} {"train_loss": -12.30435848236084, "global_step": 305685, "epoch": 1819} {"train_loss": -11.576449394226074, "global_step": 305686, "epoch": 1819} {"train_loss": -12.135231018066406, "global_step": 305687, "epoch": 1819} {"train_loss": -11.314346313476562, "global_step": 305688, "epoch": 1819} {"train_loss": -11.581474304199219, "global_step": 305689, "epoch": 1819} {"train_loss": -12.03848934173584, "global_step": 305690, "epoch": 1819} {"train_loss": -11.9229097366333, "global_step": 305691, "epoch": 1819} {"train_loss": -10.95882797241211, "global_step": 305692, "epoch": 1819} {"train_loss": -11.971502304077148, "global_step": 305693, "epoch": 1819} {"train_loss": -11.558351516723633, "global_step": 305694, "epoch": 1819} {"train_loss": -11.730640411376953, "global_step": 305695, "epoch": 1819} {"train_loss": -11.974868774414062, "global_step": 305696, "epoch": 1819} {"train_loss": -11.825395584106445, "global_step": 305697, "epoch": 1819} {"train_loss": -11.575240135192871, "global_step": 305698, "epoch": 1819} {"train_loss": -11.331582069396973, "global_step": 305699, "epoch": 1819} {"train_loss": -11.472196578979492, "global_step": 305700, "epoch": 1819} {"train_loss": -11.206572532653809, "global_step": 305701, "epoch": 1819} {"train_loss": -11.181755065917969, "global_step": 305702, "epoch": 1819} {"train_loss": -11.066339492797852, "global_step": 305703, "epoch": 1819} {"train_loss": -11.0000581741333, "global_step": 305704, "epoch": 1819} {"train_loss": -11.337644577026367, "global_step": 305705, "epoch": 1819} {"train_loss": -10.36056900024414, "global_step": 305706, "epoch": 1819} {"train_loss": -12.056380271911621, "global_step": 305707, "epoch": 1819} {"train_loss": -10.637523651123047, "global_step": 305708, "epoch": 1819} {"train_loss": -10.973036766052246, "global_step": 305709, "epoch": 1819} {"train_loss": -11.315052032470703, "global_step": 305710, "epoch": 1819} {"train_loss": -11.363425254821777, "global_step": 305711, "epoch": 1819} {"train_loss": -11.936525344848633, "global_step": 305712, "epoch": 1819} {"train_loss": -10.426129341125488, "global_step": 305713, "epoch": 1819} {"train_loss": -10.951927185058594, "global_step": 305714, "epoch": 1819} {"train_loss": -11.037212371826172, "global_step": 305715, "epoch": 1819} {"train_loss": -9.591066360473633, "global_step": 305716, "epoch": 1819} {"train_loss": -10.93747329711914, "global_step": 305717, "epoch": 1819} {"train_loss": -11.338151931762695, "global_step": 305718, "epoch": 1819} {"train_loss": -11.148481369018555, "global_step": 305719, "epoch": 1819} {"train_loss": -11.479090690612793, "global_step": 305720, "epoch": 1819} {"train_loss": -10.31857681274414, "global_step": 305721, "epoch": 1819} {"train_loss": -11.265242576599121, "global_step": 305722, "epoch": 1819} {"train_loss": -10.603485107421875, "global_step": 305723, "epoch": 1819} {"train_loss": -11.672082901000977, "global_step": 305724, "epoch": 1819} {"train_loss": -11.116706848144531, "global_step": 305725, "epoch": 1819} {"train_loss": -11.682512283325195, "global_step": 305726, "epoch": 1819} {"train_loss": -11.322036743164062, "global_step": 305727, "epoch": 1819} {"train_loss": -11.704347610473633, "global_step": 305728, "epoch": 1819} {"train_loss": -11.03675651550293, "global_step": 305729, "epoch": 1819} {"train_loss": -11.899152755737305, "global_step": 305730, "epoch": 1819} {"train_loss": -11.248855590820312, "global_step": 305731, "epoch": 1819} {"train_loss": -12.02564525604248, "global_step": 305732, "epoch": 1819} {"train_loss": -10.98812484741211, "global_step": 305733, "epoch": 1819} {"train_loss": -11.389087677001953, "global_step": 305734, "epoch": 1819} {"train_loss": -11.729951858520508, "global_step": 305735, "epoch": 1819} {"train_loss": -11.113898277282715, "global_step": 305736, "epoch": 1819} {"train_loss": -11.910799026489258, "global_step": 305737, "epoch": 1819} {"train_loss": -11.4863862991333, "global_step": 305738, "epoch": 1819} {"train_loss": -11.800010681152344, "global_step": 305739, "epoch": 1819} {"train_loss": -11.897211074829102, "global_step": 305740, "epoch": 1819} {"train_loss": -11.633670806884766, "global_step": 305741, "epoch": 1819} {"train_loss": -11.68459701538086, "global_step": 305742, "epoch": 1819} {"train_loss": -11.939117431640625, "global_step": 305743, "epoch": 1819} {"train_loss": -11.721709251403809, "global_step": 305744, "epoch": 1819} {"train_loss": -11.955403327941895, "global_step": 305745, "epoch": 1819} {"train_loss": -11.791961669921875, "global_step": 305746, "epoch": 1819} {"train_loss": -11.920476913452148, "global_step": 305747, "epoch": 1819} {"train_loss": -12.126625061035156, "global_step": 305748, "epoch": 1819} {"train_loss": -12.112488746643066, "global_step": 305749, "epoch": 1819} {"train_loss": -11.734217643737793, "global_step": 305750, "epoch": 1819} {"train_loss": -12.277316093444824, "global_step": 305751, "epoch": 1819} {"train_loss": -11.891986846923828, "global_step": 305752, "epoch": 1819} {"train_loss": -12.254518508911133, "global_step": 305753, "epoch": 1819} {"train_loss": -12.258186340332031, "global_step": 305754, "epoch": 1819} {"train_loss": -11.81733512878418, "global_step": 305755, "epoch": 1819} {"train_loss": -12.090614318847656, "global_step": 305756, "epoch": 1819} {"train_loss": -12.023713111877441, "global_step": 305757, "epoch": 1819} {"train_loss": -12.153940200805664, "global_step": 305758, "epoch": 1819} {"train_loss": -11.803723346619378, "global_step": 305759, "epoch": 1819, "val_loss": 271095.6875} {"train_loss": -11.998148918151855, "global_step": 305760, "epoch": 1820} {"train_loss": -12.217203140258789, "global_step": 305761, "epoch": 1820} {"train_loss": -12.183704376220703, "global_step": 305762, "epoch": 1820} {"train_loss": -11.93294906616211, "global_step": 305763, "epoch": 1820} {"train_loss": -11.971552848815918, "global_step": 305764, "epoch": 1820} {"train_loss": -12.170726776123047, "global_step": 305765, "epoch": 1820} {"train_loss": -12.396991729736328, "global_step": 305766, "epoch": 1820} {"train_loss": -12.41250991821289, "global_step": 305767, "epoch": 1820} {"train_loss": -12.112810134887695, "global_step": 305768, "epoch": 1820} {"train_loss": -12.273300170898438, "global_step": 305769, "epoch": 1820} {"train_loss": -12.351003646850586, "global_step": 305770, "epoch": 1820} {"train_loss": -12.358590126037598, "global_step": 305771, "epoch": 1820} {"train_loss": -12.131498336791992, "global_step": 305772, "epoch": 1820} {"train_loss": -12.321290016174316, "global_step": 305773, "epoch": 1820} {"train_loss": -11.904254913330078, "global_step": 305774, "epoch": 1820} {"train_loss": -12.261423110961914, "global_step": 305775, "epoch": 1820} {"train_loss": -12.348983764648438, "global_step": 305776, "epoch": 1820} {"train_loss": -11.676197052001953, "global_step": 305777, "epoch": 1820} {"train_loss": -12.27299690246582, "global_step": 305778, "epoch": 1820} {"train_loss": -11.602456092834473, "global_step": 305779, "epoch": 1820} {"train_loss": -10.86495590209961, "global_step": 305780, "epoch": 1820} {"train_loss": -11.948270797729492, "global_step": 305781, "epoch": 1820} {"train_loss": -11.273944854736328, "global_step": 305782, "epoch": 1820} {"train_loss": -10.402059555053711, "global_step": 305783, "epoch": 1820} {"train_loss": -11.961240768432617, "global_step": 305784, "epoch": 1820} {"train_loss": -9.502933502197266, "global_step": 305785, "epoch": 1820} {"train_loss": -11.747237205505371, "global_step": 305786, "epoch": 1820} {"train_loss": -11.120506286621094, "global_step": 305787, "epoch": 1820} {"train_loss": -9.86088752746582, "global_step": 305788, "epoch": 1820} {"train_loss": -11.861372947692871, "global_step": 305789, "epoch": 1820} {"train_loss": -10.77762222290039, "global_step": 305790, "epoch": 1820} {"train_loss": -10.663126945495605, "global_step": 305791, "epoch": 1820} {"train_loss": -11.82773208618164, "global_step": 305792, "epoch": 1820} {"train_loss": -9.975152969360352, "global_step": 305793, "epoch": 1820} {"train_loss": -11.961406707763672, "global_step": 305794, "epoch": 1820} {"train_loss": -11.159591674804688, "global_step": 305795, "epoch": 1820} {"train_loss": -10.734441757202148, "global_step": 305796, "epoch": 1820} {"train_loss": -11.85274887084961, "global_step": 305797, "epoch": 1820} {"train_loss": -10.834161758422852, "global_step": 305798, "epoch": 1820} {"train_loss": -12.185310363769531, "global_step": 305799, "epoch": 1820} {"train_loss": -11.278615951538086, "global_step": 305800, "epoch": 1820} {"train_loss": -11.988788604736328, "global_step": 305801, "epoch": 1820} {"train_loss": -11.487436294555664, "global_step": 305802, "epoch": 1820} {"train_loss": -11.88717269897461, "global_step": 305803, "epoch": 1820} {"train_loss": -12.041803359985352, "global_step": 305804, "epoch": 1820} {"train_loss": -11.550565719604492, "global_step": 305805, "epoch": 1820} {"train_loss": -12.005905151367188, "global_step": 305806, "epoch": 1820} {"train_loss": -11.818756103515625, "global_step": 305807, "epoch": 1820} {"train_loss": -12.066568374633789, "global_step": 305808, "epoch": 1820} {"train_loss": -12.140457153320312, "global_step": 305809, "epoch": 1820} {"train_loss": -11.919919967651367, "global_step": 305810, "epoch": 1820} {"train_loss": -11.886856079101562, "global_step": 305811, "epoch": 1820} {"train_loss": -12.159953117370605, "global_step": 305812, "epoch": 1820} {"train_loss": -12.11830997467041, "global_step": 305813, "epoch": 1820} {"train_loss": -12.139421463012695, "global_step": 305814, "epoch": 1820} {"train_loss": -11.806315422058105, "global_step": 305815, "epoch": 1820} {"train_loss": -12.371702194213867, "global_step": 305816, "epoch": 1820} {"train_loss": -12.006136894226074, "global_step": 305817, "epoch": 1820} {"train_loss": -12.100678443908691, "global_step": 305818, "epoch": 1820} {"train_loss": -12.308679580688477, "global_step": 305819, "epoch": 1820} {"train_loss": -12.079883575439453, "global_step": 305820, "epoch": 1820} {"train_loss": -12.310012817382812, "global_step": 305821, "epoch": 1820} {"train_loss": -12.135879516601562, "global_step": 305822, "epoch": 1820} {"train_loss": -12.298591613769531, "global_step": 305823, "epoch": 1820} {"train_loss": -12.254789352416992, "global_step": 305824, "epoch": 1820} {"train_loss": -12.31344985961914, "global_step": 305825, "epoch": 1820} {"train_loss": -12.296924591064453, "global_step": 305826, "epoch": 1820} {"train_loss": -12.202122688293457, "global_step": 305827, "epoch": 1820} {"train_loss": -12.432551383972168, "global_step": 305828, "epoch": 1820} {"train_loss": -12.018505096435547, "global_step": 305829, "epoch": 1820} {"train_loss": -12.349414825439453, "global_step": 305830, "epoch": 1820} {"train_loss": -12.383337020874023, "global_step": 305831, "epoch": 1820} {"train_loss": -12.286827087402344, "global_step": 305832, "epoch": 1820} {"train_loss": -12.348936080932617, "global_step": 305833, "epoch": 1820} {"train_loss": -12.433209419250488, "global_step": 305834, "epoch": 1820} {"train_loss": -12.44826602935791, "global_step": 305835, "epoch": 1820} {"train_loss": -12.36014175415039, "global_step": 305836, "epoch": 1820} {"train_loss": -12.497672080993652, "global_step": 305837, "epoch": 1820} {"train_loss": -12.288152694702148, "global_step": 305838, "epoch": 1820} {"train_loss": -12.441658020019531, "global_step": 305839, "epoch": 1820} {"train_loss": -12.539339065551758, "global_step": 305840, "epoch": 1820} {"train_loss": -12.538912773132324, "global_step": 305841, "epoch": 1820} {"train_loss": -12.378629684448242, "global_step": 305842, "epoch": 1820} {"train_loss": -12.519357681274414, "global_step": 305843, "epoch": 1820} {"train_loss": -12.499863624572754, "global_step": 305844, "epoch": 1820} {"train_loss": -12.255428314208984, "global_step": 305845, "epoch": 1820} {"train_loss": -12.357468605041504, "global_step": 305846, "epoch": 1820} {"train_loss": -12.322299003601074, "global_step": 305847, "epoch": 1820} {"train_loss": -12.12604808807373, "global_step": 305848, "epoch": 1820} {"train_loss": -12.239078521728516, "global_step": 305849, "epoch": 1820} {"train_loss": -12.2576265335083, "global_step": 305850, "epoch": 1820} {"train_loss": -12.487960815429688, "global_step": 305851, "epoch": 1820} {"train_loss": -12.125341415405273, "global_step": 305852, "epoch": 1820} {"train_loss": -12.521080017089844, "global_step": 305853, "epoch": 1820} {"train_loss": -12.192501068115234, "global_step": 305854, "epoch": 1820} {"train_loss": -12.137301445007324, "global_step": 305855, "epoch": 1820} {"train_loss": -12.224181175231934, "global_step": 305856, "epoch": 1820} {"train_loss": -12.385091781616211, "global_step": 305857, "epoch": 1820} {"train_loss": -12.44186019897461, "global_step": 305858, "epoch": 1820} {"train_loss": -12.324087142944336, "global_step": 305859, "epoch": 1820} {"train_loss": -12.399114608764648, "global_step": 305860, "epoch": 1820} {"train_loss": -12.373520851135254, "global_step": 305861, "epoch": 1820} {"train_loss": -12.649065017700195, "global_step": 305862, "epoch": 1820} {"train_loss": -12.234518051147461, "global_step": 305863, "epoch": 1820} {"train_loss": -12.470344543457031, "global_step": 305864, "epoch": 1820} {"train_loss": -12.2093505859375, "global_step": 305865, "epoch": 1820} {"train_loss": -12.191909790039062, "global_step": 305866, "epoch": 1820} {"train_loss": -12.482379913330078, "global_step": 305867, "epoch": 1820} {"train_loss": -12.259317398071289, "global_step": 305868, "epoch": 1820} {"train_loss": -12.434816360473633, "global_step": 305869, "epoch": 1820} {"train_loss": -12.584612846374512, "global_step": 305870, "epoch": 1820} {"train_loss": -12.63878059387207, "global_step": 305871, "epoch": 1820} {"train_loss": -12.285670280456543, "global_step": 305872, "epoch": 1820} {"train_loss": -12.567428588867188, "global_step": 305873, "epoch": 1820} {"train_loss": -12.33279800415039, "global_step": 305874, "epoch": 1820} {"train_loss": -12.46570110321045, "global_step": 305875, "epoch": 1820} {"train_loss": -12.47311019897461, "global_step": 305876, "epoch": 1820} {"train_loss": -12.296564102172852, "global_step": 305877, "epoch": 1820} {"train_loss": -12.060267448425293, "global_step": 305878, "epoch": 1820} {"train_loss": -12.39181900024414, "global_step": 305879, "epoch": 1820} {"train_loss": -12.199402809143066, "global_step": 305880, "epoch": 1820} {"train_loss": -12.47245979309082, "global_step": 305881, "epoch": 1820} {"train_loss": -12.683113098144531, "global_step": 305882, "epoch": 1820} {"train_loss": -12.451459884643555, "global_step": 305883, "epoch": 1820} {"train_loss": -12.61719799041748, "global_step": 305884, "epoch": 1820} {"train_loss": -12.51970386505127, "global_step": 305885, "epoch": 1820} {"train_loss": -12.297778129577637, "global_step": 305886, "epoch": 1820} {"train_loss": -12.361379623413086, "global_step": 305887, "epoch": 1820} {"train_loss": -12.402534484863281, "global_step": 305888, "epoch": 1820} {"train_loss": -12.268499374389648, "global_step": 305889, "epoch": 1820} {"train_loss": -11.645883560180664, "global_step": 305890, "epoch": 1820} {"train_loss": -11.589215278625488, "global_step": 305891, "epoch": 1820} {"train_loss": -10.395662307739258, "global_step": 305892, "epoch": 1820} {"train_loss": -10.42837905883789, "global_step": 305893, "epoch": 1820} {"train_loss": -11.309101104736328, "global_step": 305894, "epoch": 1820} {"train_loss": -10.851499557495117, "global_step": 305895, "epoch": 1820} {"train_loss": -9.861222267150879, "global_step": 305896, "epoch": 1820} {"train_loss": -10.856566429138184, "global_step": 305897, "epoch": 1820} {"train_loss": -11.34061050415039, "global_step": 305898, "epoch": 1820} {"train_loss": -10.717313766479492, "global_step": 305899, "epoch": 1820} {"train_loss": -9.173285484313965, "global_step": 305900, "epoch": 1820} {"train_loss": -11.49966049194336, "global_step": 305901, "epoch": 1820} {"train_loss": -8.44841480255127, "global_step": 305902, "epoch": 1820} {"train_loss": -10.365431785583496, "global_step": 305903, "epoch": 1820} {"train_loss": -10.792951583862305, "global_step": 305904, "epoch": 1820} {"train_loss": -9.962400436401367, "global_step": 305905, "epoch": 1820} {"train_loss": -11.84713077545166, "global_step": 305906, "epoch": 1820} {"train_loss": -10.258216857910156, "global_step": 305907, "epoch": 1820} {"train_loss": -11.032902717590332, "global_step": 305908, "epoch": 1820} {"train_loss": -11.333518981933594, "global_step": 305909, "epoch": 1820} {"train_loss": -10.873376846313477, "global_step": 305910, "epoch": 1820} {"train_loss": -11.671531677246094, "global_step": 305911, "epoch": 1820} {"train_loss": -11.337848663330078, "global_step": 305912, "epoch": 1820} {"train_loss": -11.342466354370117, "global_step": 305913, "epoch": 1820} {"train_loss": -11.25361442565918, "global_step": 305914, "epoch": 1820} {"train_loss": -11.33853530883789, "global_step": 305915, "epoch": 1820} {"train_loss": -10.847969055175781, "global_step": 305916, "epoch": 1820} {"train_loss": -11.619808197021484, "global_step": 305917, "epoch": 1820} {"train_loss": -10.878290176391602, "global_step": 305918, "epoch": 1820} {"train_loss": -11.665987014770508, "global_step": 305919, "epoch": 1820} {"train_loss": -11.202905654907227, "global_step": 305920, "epoch": 1820} {"train_loss": -10.991668701171875, "global_step": 305921, "epoch": 1820} {"train_loss": -11.404391288757324, "global_step": 305922, "epoch": 1820} {"train_loss": -11.383978843688965, "global_step": 305923, "epoch": 1820} {"train_loss": -11.238052368164062, "global_step": 305924, "epoch": 1820} {"train_loss": -11.29620361328125, "global_step": 305925, "epoch": 1820} {"train_loss": -11.363277435302734, "global_step": 305926, "epoch": 1820} {"train_loss": -11.826937402997698, "global_step": 305927, "epoch": 1820, "val_loss": 278885.625, "train_action_mse_error": 1.8541316986083984} {"train_loss": -11.596315383911133, "global_step": 305928, "epoch": 1821} {"train_loss": -11.919805526733398, "global_step": 305929, "epoch": 1821} {"train_loss": -11.595355033874512, "global_step": 305930, "epoch": 1821} {"train_loss": -11.63648796081543, "global_step": 305931, "epoch": 1821} {"train_loss": -11.706910133361816, "global_step": 305932, "epoch": 1821} {"train_loss": -11.605863571166992, "global_step": 305933, "epoch": 1821} {"train_loss": -11.976705551147461, "global_step": 305934, "epoch": 1821} {"train_loss": -11.462264060974121, "global_step": 305935, "epoch": 1821} {"train_loss": -11.970403671264648, "global_step": 305936, "epoch": 1821} {"train_loss": -11.775280952453613, "global_step": 305937, "epoch": 1821} {"train_loss": -11.899962425231934, "global_step": 305938, "epoch": 1821} {"train_loss": -11.522987365722656, "global_step": 305939, "epoch": 1821} {"train_loss": -11.728031158447266, "global_step": 305940, "epoch": 1821} {"train_loss": -11.986912727355957, "global_step": 305941, "epoch": 1821} {"train_loss": -11.337747573852539, "global_step": 305942, "epoch": 1821} {"train_loss": -12.054956436157227, "global_step": 305943, "epoch": 1821} {"train_loss": -11.360254287719727, "global_step": 305944, "epoch": 1821} {"train_loss": -11.740694999694824, "global_step": 305945, "epoch": 1821} {"train_loss": -11.693130493164062, "global_step": 305946, "epoch": 1821} {"train_loss": -11.55033016204834, "global_step": 305947, "epoch": 1821} {"train_loss": -11.590729713439941, "global_step": 305948, "epoch": 1821} {"train_loss": -11.666414260864258, "global_step": 305949, "epoch": 1821} {"train_loss": -11.780725479125977, "global_step": 305950, "epoch": 1821} {"train_loss": -12.038084030151367, "global_step": 305951, "epoch": 1821} {"train_loss": -11.466106414794922, "global_step": 305952, "epoch": 1821} {"train_loss": -12.055484771728516, "global_step": 305953, "epoch": 1821} {"train_loss": -11.85910701751709, "global_step": 305954, "epoch": 1821} {"train_loss": -11.580354690551758, "global_step": 305955, "epoch": 1821} {"train_loss": -11.898681640625, "global_step": 305956, "epoch": 1821} {"train_loss": -11.122655868530273, "global_step": 305957, "epoch": 1821} {"train_loss": -11.986421585083008, "global_step": 305958, "epoch": 1821} {"train_loss": -11.512967109680176, "global_step": 305959, "epoch": 1821} {"train_loss": -11.878589630126953, "global_step": 305960, "epoch": 1821} {"train_loss": -12.116548538208008, "global_step": 305961, "epoch": 1821} {"train_loss": -11.63051986694336, "global_step": 305962, "epoch": 1821} {"train_loss": -11.895133018493652, "global_step": 305963, "epoch": 1821} {"train_loss": -11.705255508422852, "global_step": 305964, "epoch": 1821} {"train_loss": -12.227156639099121, "global_step": 305965, "epoch": 1821} {"train_loss": -11.598522186279297, "global_step": 305966, "epoch": 1821} {"train_loss": -12.078116416931152, "global_step": 305967, "epoch": 1821} {"train_loss": -11.603155136108398, "global_step": 305968, "epoch": 1821} {"train_loss": -11.964223861694336, "global_step": 305969, "epoch": 1821} {"train_loss": -11.990493774414062, "global_step": 305970, "epoch": 1821} {"train_loss": -11.958979606628418, "global_step": 305971, "epoch": 1821} {"train_loss": -12.288091659545898, "global_step": 305972, "epoch": 1821} {"train_loss": -12.010335922241211, "global_step": 305973, "epoch": 1821} {"train_loss": -12.069562911987305, "global_step": 305974, "epoch": 1821} {"train_loss": -11.931055068969727, "global_step": 305975, "epoch": 1821} {"train_loss": -12.126150131225586, "global_step": 305976, "epoch": 1821} {"train_loss": -12.116106986999512, "global_step": 305977, "epoch": 1821} {"train_loss": -11.982810974121094, "global_step": 305978, "epoch": 1821} {"train_loss": -12.205093383789062, "global_step": 305979, "epoch": 1821} {"train_loss": -11.984064102172852, "global_step": 305980, "epoch": 1821} {"train_loss": -11.59181022644043, "global_step": 305981, "epoch": 1821} {"train_loss": -11.866607666015625, "global_step": 305982, "epoch": 1821} {"train_loss": -11.384893417358398, "global_step": 305983, "epoch": 1821} {"train_loss": -11.599750518798828, "global_step": 305984, "epoch": 1821} {"train_loss": -11.818151473999023, "global_step": 305985, "epoch": 1821} {"train_loss": -11.154394149780273, "global_step": 305986, "epoch": 1821} {"train_loss": -11.89460563659668, "global_step": 305987, "epoch": 1821} {"train_loss": -11.384613990783691, "global_step": 305988, "epoch": 1821} {"train_loss": -11.597602844238281, "global_step": 305989, "epoch": 1821} {"train_loss": -11.865509033203125, "global_step": 305990, "epoch": 1821} {"train_loss": -11.646454811096191, "global_step": 305991, "epoch": 1821} {"train_loss": -11.753172874450684, "global_step": 305992, "epoch": 1821} {"train_loss": -11.682412147521973, "global_step": 305993, "epoch": 1821} {"train_loss": -12.228891372680664, "global_step": 305994, "epoch": 1821} {"train_loss": -11.435674667358398, "global_step": 305995, "epoch": 1821} {"train_loss": -12.07960033416748, "global_step": 305996, "epoch": 1821} {"train_loss": -11.565790176391602, "global_step": 305997, "epoch": 1821} {"train_loss": -11.960553169250488, "global_step": 305998, "epoch": 1821} {"train_loss": -11.408538818359375, "global_step": 305999, "epoch": 1821} {"train_loss": -11.868829727172852, "global_step": 306000, "epoch": 1821} {"train_loss": -11.926146507263184, "global_step": 306001, "epoch": 1821} {"train_loss": -11.981184005737305, "global_step": 306002, "epoch": 1821} {"train_loss": -12.00058364868164, "global_step": 306003, "epoch": 1821} {"train_loss": -12.253053665161133, "global_step": 306004, "epoch": 1821} {"train_loss": -11.740150451660156, "global_step": 306005, "epoch": 1821} {"train_loss": -12.185072898864746, "global_step": 306006, "epoch": 1821} {"train_loss": -11.415444374084473, "global_step": 306007, "epoch": 1821} {"train_loss": -12.153249740600586, "global_step": 306008, "epoch": 1821} {"train_loss": -11.712943077087402, "global_step": 306009, "epoch": 1821} {"train_loss": -11.811624526977539, "global_step": 306010, "epoch": 1821} {"train_loss": -12.001203536987305, "global_step": 306011, "epoch": 1821} {"train_loss": -11.782873153686523, "global_step": 306012, "epoch": 1821} {"train_loss": -11.922813415527344, "global_step": 306013, "epoch": 1821} {"train_loss": -11.995224952697754, "global_step": 306014, "epoch": 1821} {"train_loss": -12.14112663269043, "global_step": 306015, "epoch": 1821} {"train_loss": -12.020488739013672, "global_step": 306016, "epoch": 1821} {"train_loss": -12.048652648925781, "global_step": 306017, "epoch": 1821} {"train_loss": -12.35653305053711, "global_step": 306018, "epoch": 1821} {"train_loss": -12.23093032836914, "global_step": 306019, "epoch": 1821} {"train_loss": -12.29527473449707, "global_step": 306020, "epoch": 1821} {"train_loss": -12.232799530029297, "global_step": 306021, "epoch": 1821} {"train_loss": -12.208057403564453, "global_step": 306022, "epoch": 1821} {"train_loss": -12.327858924865723, "global_step": 306023, "epoch": 1821} {"train_loss": -11.899908065795898, "global_step": 306024, "epoch": 1821} {"train_loss": -12.171663284301758, "global_step": 306025, "epoch": 1821} {"train_loss": -12.392200469970703, "global_step": 306026, "epoch": 1821} {"train_loss": -12.004684448242188, "global_step": 306027, "epoch": 1821} {"train_loss": -12.329911231994629, "global_step": 306028, "epoch": 1821} {"train_loss": -12.143685340881348, "global_step": 306029, "epoch": 1821} {"train_loss": -12.422017097473145, "global_step": 306030, "epoch": 1821} {"train_loss": -11.996553421020508, "global_step": 306031, "epoch": 1821} {"train_loss": -12.269002914428711, "global_step": 306032, "epoch": 1821} {"train_loss": -12.429309844970703, "global_step": 306033, "epoch": 1821} {"train_loss": -12.480430603027344, "global_step": 306034, "epoch": 1821} {"train_loss": -12.538640975952148, "global_step": 306035, "epoch": 1821} {"train_loss": -12.40068244934082, "global_step": 306036, "epoch": 1821} {"train_loss": -12.171323776245117, "global_step": 306037, "epoch": 1821} {"train_loss": -12.403352737426758, "global_step": 306038, "epoch": 1821} {"train_loss": -12.33247184753418, "global_step": 306039, "epoch": 1821} {"train_loss": -12.35417366027832, "global_step": 306040, "epoch": 1821} {"train_loss": -12.536934852600098, "global_step": 306041, "epoch": 1821} {"train_loss": -12.607215881347656, "global_step": 306042, "epoch": 1821} {"train_loss": -12.466073989868164, "global_step": 306043, "epoch": 1821} {"train_loss": -12.227882385253906, "global_step": 306044, "epoch": 1821} {"train_loss": -12.560647964477539, "global_step": 306045, "epoch": 1821} {"train_loss": -12.461775779724121, "global_step": 306046, "epoch": 1821} {"train_loss": -12.660677909851074, "global_step": 306047, "epoch": 1821} {"train_loss": -12.663701057434082, "global_step": 306048, "epoch": 1821} {"train_loss": -12.463130950927734, "global_step": 306049, "epoch": 1821} {"train_loss": -12.56867504119873, "global_step": 306050, "epoch": 1821} {"train_loss": -12.571111679077148, "global_step": 306051, "epoch": 1821} {"train_loss": -12.638002395629883, "global_step": 306052, "epoch": 1821} {"train_loss": -12.508527755737305, "global_step": 306053, "epoch": 1821} {"train_loss": -12.592673301696777, "global_step": 306054, "epoch": 1821} {"train_loss": -12.627387046813965, "global_step": 306055, "epoch": 1821} {"train_loss": -12.403749465942383, "global_step": 306056, "epoch": 1821} {"train_loss": -12.380098342895508, "global_step": 306057, "epoch": 1821} {"train_loss": -12.688730239868164, "global_step": 306058, "epoch": 1821} {"train_loss": -12.281981468200684, "global_step": 306059, "epoch": 1821} {"train_loss": -12.277246475219727, "global_step": 306060, "epoch": 1821} {"train_loss": -12.525298118591309, "global_step": 306061, "epoch": 1821} {"train_loss": -11.987689971923828, "global_step": 306062, "epoch": 1821} {"train_loss": -12.036094665527344, "global_step": 306063, "epoch": 1821} {"train_loss": -12.289626121520996, "global_step": 306064, "epoch": 1821} {"train_loss": -12.282217979431152, "global_step": 306065, "epoch": 1821} {"train_loss": -11.974302291870117, "global_step": 306066, "epoch": 1821} {"train_loss": -12.274202346801758, "global_step": 306067, "epoch": 1821} {"train_loss": -12.019787788391113, "global_step": 306068, "epoch": 1821} {"train_loss": -12.26213264465332, "global_step": 306069, "epoch": 1821} {"train_loss": -11.11895751953125, "global_step": 306070, "epoch": 1821} {"train_loss": -11.564197540283203, "global_step": 306071, "epoch": 1821} {"train_loss": -12.14045238494873, "global_step": 306072, "epoch": 1821} {"train_loss": -12.182044982910156, "global_step": 306073, "epoch": 1821} {"train_loss": -11.76243782043457, "global_step": 306074, "epoch": 1821} {"train_loss": -12.230597496032715, "global_step": 306075, "epoch": 1821} {"train_loss": -12.228429794311523, "global_step": 306076, "epoch": 1821} {"train_loss": -11.60389518737793, "global_step": 306077, "epoch": 1821} {"train_loss": -10.857477188110352, "global_step": 306078, "epoch": 1821} {"train_loss": -11.74173355102539, "global_step": 306079, "epoch": 1821} {"train_loss": -12.296894073486328, "global_step": 306080, "epoch": 1821} {"train_loss": -11.77570915222168, "global_step": 306081, "epoch": 1821} {"train_loss": -12.175755500793457, "global_step": 306082, "epoch": 1821} {"train_loss": -11.539453506469727, "global_step": 306083, "epoch": 1821} {"train_loss": -11.811717987060547, "global_step": 306084, "epoch": 1821} {"train_loss": -12.454718589782715, "global_step": 306085, "epoch": 1821} {"train_loss": -11.618517875671387, "global_step": 306086, "epoch": 1821} {"train_loss": -11.395578384399414, "global_step": 306087, "epoch": 1821} {"train_loss": -12.011228561401367, "global_step": 306088, "epoch": 1821} {"train_loss": -12.172395706176758, "global_step": 306089, "epoch": 1821} {"train_loss": -11.656400680541992, "global_step": 306090, "epoch": 1821} {"train_loss": -11.79870319366455, "global_step": 306091, "epoch": 1821} {"train_loss": -12.169357299804688, "global_step": 306092, "epoch": 1821} {"train_loss": -12.393896102905273, "global_step": 306093, "epoch": 1821} {"train_loss": -12.25983715057373, "global_step": 306094, "epoch": 1821} {"train_loss": -11.989560751687913, "global_step": 306095, "epoch": 1821, "val_loss": 281645.15625} {"train_loss": -12.447430610656738, "global_step": 306096, "epoch": 1822} {"train_loss": -12.18502140045166, "global_step": 306097, "epoch": 1822} {"train_loss": -12.478984832763672, "global_step": 306098, "epoch": 1822} {"train_loss": -12.054840087890625, "global_step": 306099, "epoch": 1822} {"train_loss": -11.86403751373291, "global_step": 306100, "epoch": 1822} {"train_loss": -11.881752967834473, "global_step": 306101, "epoch": 1822} {"train_loss": -11.961851119995117, "global_step": 306102, "epoch": 1822} {"train_loss": -11.918403625488281, "global_step": 306103, "epoch": 1822} {"train_loss": -12.303168296813965, "global_step": 306104, "epoch": 1822} {"train_loss": -11.643486976623535, "global_step": 306105, "epoch": 1822} {"train_loss": -12.435080528259277, "global_step": 306106, "epoch": 1822} {"train_loss": -11.493412017822266, "global_step": 306107, "epoch": 1822} {"train_loss": -12.22859001159668, "global_step": 306108, "epoch": 1822} {"train_loss": -12.101775169372559, "global_step": 306109, "epoch": 1822} {"train_loss": -12.338024139404297, "global_step": 306110, "epoch": 1822} {"train_loss": -11.878013610839844, "global_step": 306111, "epoch": 1822} {"train_loss": -12.203484535217285, "global_step": 306112, "epoch": 1822} {"train_loss": -11.981527328491211, "global_step": 306113, "epoch": 1822} {"train_loss": -12.301547050476074, "global_step": 306114, "epoch": 1822} {"train_loss": -12.153529167175293, "global_step": 306115, "epoch": 1822} {"train_loss": -12.249483108520508, "global_step": 306116, "epoch": 1822} {"train_loss": -11.86273193359375, "global_step": 306117, "epoch": 1822} {"train_loss": -11.224252700805664, "global_step": 306118, "epoch": 1822} {"train_loss": -12.257553100585938, "global_step": 306119, "epoch": 1822} {"train_loss": -11.375265121459961, "global_step": 306120, "epoch": 1822} {"train_loss": -11.977684020996094, "global_step": 306121, "epoch": 1822} {"train_loss": -11.934425354003906, "global_step": 306122, "epoch": 1822} {"train_loss": -11.728048324584961, "global_step": 306123, "epoch": 1822} {"train_loss": -11.589859962463379, "global_step": 306124, "epoch": 1822} {"train_loss": -11.829475402832031, "global_step": 306125, "epoch": 1822} {"train_loss": -11.551298141479492, "global_step": 306126, "epoch": 1822} {"train_loss": -10.179157257080078, "global_step": 306127, "epoch": 1822} {"train_loss": -12.120685577392578, "global_step": 306128, "epoch": 1822} {"train_loss": -10.214765548706055, "global_step": 306129, "epoch": 1822} {"train_loss": -11.536042213439941, "global_step": 306130, "epoch": 1822} {"train_loss": -10.648794174194336, "global_step": 306131, "epoch": 1822} {"train_loss": -11.59487533569336, "global_step": 306132, "epoch": 1822} {"train_loss": -11.396836280822754, "global_step": 306133, "epoch": 1822} {"train_loss": -11.884137153625488, "global_step": 306134, "epoch": 1822} {"train_loss": -11.178220748901367, "global_step": 306135, "epoch": 1822} {"train_loss": -12.316167831420898, "global_step": 306136, "epoch": 1822} {"train_loss": -11.91016960144043, "global_step": 306137, "epoch": 1822} {"train_loss": -12.164285659790039, "global_step": 306138, "epoch": 1822} {"train_loss": -11.521665573120117, "global_step": 306139, "epoch": 1822} {"train_loss": -12.01816463470459, "global_step": 306140, "epoch": 1822} {"train_loss": -11.984548568725586, "global_step": 306141, "epoch": 1822} {"train_loss": -11.953144073486328, "global_step": 306142, "epoch": 1822} {"train_loss": -11.675029754638672, "global_step": 306143, "epoch": 1822} {"train_loss": -12.129304885864258, "global_step": 306144, "epoch": 1822} {"train_loss": -11.855317115783691, "global_step": 306145, "epoch": 1822} {"train_loss": -12.094414710998535, "global_step": 306146, "epoch": 1822} {"train_loss": -11.932158470153809, "global_step": 306147, "epoch": 1822} {"train_loss": -12.258308410644531, "global_step": 306148, "epoch": 1822} {"train_loss": -12.116117477416992, "global_step": 306149, "epoch": 1822} {"train_loss": -12.245794296264648, "global_step": 306150, "epoch": 1822} {"train_loss": -12.035011291503906, "global_step": 306151, "epoch": 1822} {"train_loss": -12.245503425598145, "global_step": 306152, "epoch": 1822} {"train_loss": -12.06304931640625, "global_step": 306153, "epoch": 1822} {"train_loss": -12.302862167358398, "global_step": 306154, "epoch": 1822} {"train_loss": -12.208768844604492, "global_step": 306155, "epoch": 1822} {"train_loss": -12.069429397583008, "global_step": 306156, "epoch": 1822} {"train_loss": -12.295022964477539, "global_step": 306157, "epoch": 1822} {"train_loss": -12.402769088745117, "global_step": 306158, "epoch": 1822} {"train_loss": -12.138130187988281, "global_step": 306159, "epoch": 1822} {"train_loss": -12.403919219970703, "global_step": 306160, "epoch": 1822} {"train_loss": -12.180814743041992, "global_step": 306161, "epoch": 1822} {"train_loss": -12.3038330078125, "global_step": 306162, "epoch": 1822} {"train_loss": -12.369832992553711, "global_step": 306163, "epoch": 1822} {"train_loss": -12.155216217041016, "global_step": 306164, "epoch": 1822} {"train_loss": -12.274287223815918, "global_step": 306165, "epoch": 1822} {"train_loss": -12.325606346130371, "global_step": 306166, "epoch": 1822} {"train_loss": -12.510808944702148, "global_step": 306167, "epoch": 1822} {"train_loss": -12.199670791625977, "global_step": 306168, "epoch": 1822} {"train_loss": -12.182045936584473, "global_step": 306169, "epoch": 1822} {"train_loss": -12.429146766662598, "global_step": 306170, "epoch": 1822} {"train_loss": -12.254350662231445, "global_step": 306171, "epoch": 1822} {"train_loss": -12.11555290222168, "global_step": 306172, "epoch": 1822} {"train_loss": -12.433406829833984, "global_step": 306173, "epoch": 1822} {"train_loss": -12.3173828125, "global_step": 306174, "epoch": 1822} {"train_loss": -11.90142822265625, "global_step": 306175, "epoch": 1822} {"train_loss": -12.257110595703125, "global_step": 306176, "epoch": 1822} {"train_loss": -12.42388916015625, "global_step": 306177, "epoch": 1822} {"train_loss": -12.259010314941406, "global_step": 306178, "epoch": 1822} {"train_loss": -11.655058860778809, "global_step": 306179, "epoch": 1822} {"train_loss": -12.100433349609375, "global_step": 306180, "epoch": 1822} {"train_loss": -12.612312316894531, "global_step": 306181, "epoch": 1822} {"train_loss": -11.948777198791504, "global_step": 306182, "epoch": 1822} {"train_loss": -11.358882904052734, "global_step": 306183, "epoch": 1822} {"train_loss": -12.454793930053711, "global_step": 306184, "epoch": 1822} {"train_loss": -12.199316024780273, "global_step": 306185, "epoch": 1822} {"train_loss": -11.53581428527832, "global_step": 306186, "epoch": 1822} {"train_loss": -11.844051361083984, "global_step": 306187, "epoch": 1822} {"train_loss": -11.921487808227539, "global_step": 306188, "epoch": 1822} {"train_loss": -12.17238712310791, "global_step": 306189, "epoch": 1822} {"train_loss": -11.781839370727539, "global_step": 306190, "epoch": 1822} {"train_loss": -12.032793045043945, "global_step": 306191, "epoch": 1822} {"train_loss": -12.135550498962402, "global_step": 306192, "epoch": 1822} {"train_loss": -12.253908157348633, "global_step": 306193, "epoch": 1822} {"train_loss": -11.670455932617188, "global_step": 306194, "epoch": 1822} {"train_loss": -11.862871170043945, "global_step": 306195, "epoch": 1822} {"train_loss": -12.026987075805664, "global_step": 306196, "epoch": 1822} {"train_loss": -11.8369779586792, "global_step": 306197, "epoch": 1822} {"train_loss": -10.919934272766113, "global_step": 306198, "epoch": 1822} {"train_loss": -11.936802864074707, "global_step": 306199, "epoch": 1822} {"train_loss": -11.303197860717773, "global_step": 306200, "epoch": 1822} {"train_loss": -10.874153137207031, "global_step": 306201, "epoch": 1822} {"train_loss": -11.348418235778809, "global_step": 306202, "epoch": 1822} {"train_loss": -11.624835968017578, "global_step": 306203, "epoch": 1822} {"train_loss": -9.978747367858887, "global_step": 306204, "epoch": 1822} {"train_loss": -12.023844718933105, "global_step": 306205, "epoch": 1822} {"train_loss": -11.601243019104004, "global_step": 306206, "epoch": 1822} {"train_loss": -10.551687240600586, "global_step": 306207, "epoch": 1822} {"train_loss": -12.10070514678955, "global_step": 306208, "epoch": 1822} {"train_loss": -10.165643692016602, "global_step": 306209, "epoch": 1822} {"train_loss": -11.421004295349121, "global_step": 306210, "epoch": 1822} {"train_loss": -11.289754867553711, "global_step": 306211, "epoch": 1822} {"train_loss": -10.958356857299805, "global_step": 306212, "epoch": 1822} {"train_loss": -11.529352188110352, "global_step": 306213, "epoch": 1822} {"train_loss": -10.87118148803711, "global_step": 306214, "epoch": 1822} {"train_loss": -11.554755210876465, "global_step": 306215, "epoch": 1822} {"train_loss": -10.74368953704834, "global_step": 306216, "epoch": 1822} {"train_loss": -11.771282196044922, "global_step": 306217, "epoch": 1822} {"train_loss": -11.489065170288086, "global_step": 306218, "epoch": 1822} {"train_loss": -11.61734676361084, "global_step": 306219, "epoch": 1822} {"train_loss": -11.442906379699707, "global_step": 306220, "epoch": 1822} {"train_loss": -11.755587577819824, "global_step": 306221, "epoch": 1822} {"train_loss": -11.757291793823242, "global_step": 306222, "epoch": 1822} {"train_loss": -11.581108093261719, "global_step": 306223, "epoch": 1822} {"train_loss": -12.237756729125977, "global_step": 306224, "epoch": 1822} {"train_loss": -11.820807456970215, "global_step": 306225, "epoch": 1822} {"train_loss": -12.266901969909668, "global_step": 306226, "epoch": 1822} {"train_loss": -11.684444427490234, "global_step": 306227, "epoch": 1822} {"train_loss": -12.136598587036133, "global_step": 306228, "epoch": 1822} {"train_loss": -12.284663200378418, "global_step": 306229, "epoch": 1822} {"train_loss": -11.743729591369629, "global_step": 306230, "epoch": 1822} {"train_loss": -12.198393821716309, "global_step": 306231, "epoch": 1822} {"train_loss": -11.878887176513672, "global_step": 306232, "epoch": 1822} {"train_loss": -11.903531074523926, "global_step": 306233, "epoch": 1822} {"train_loss": -12.259353637695312, "global_step": 306234, "epoch": 1822} {"train_loss": -12.029182434082031, "global_step": 306235, "epoch": 1822} {"train_loss": -12.212034225463867, "global_step": 306236, "epoch": 1822} {"train_loss": -12.189170837402344, "global_step": 306237, "epoch": 1822} {"train_loss": -12.215408325195312, "global_step": 306238, "epoch": 1822} {"train_loss": -12.161599159240723, "global_step": 306239, "epoch": 1822} {"train_loss": -12.156009674072266, "global_step": 306240, "epoch": 1822} {"train_loss": -12.120113372802734, "global_step": 306241, "epoch": 1822} {"train_loss": -12.343423843383789, "global_step": 306242, "epoch": 1822} {"train_loss": -12.224200248718262, "global_step": 306243, "epoch": 1822} {"train_loss": -12.062976837158203, "global_step": 306244, "epoch": 1822} {"train_loss": -12.201408386230469, "global_step": 306245, "epoch": 1822} {"train_loss": -12.080804824829102, "global_step": 306246, "epoch": 1822} {"train_loss": -11.97030258178711, "global_step": 306247, "epoch": 1822} {"train_loss": -12.289220809936523, "global_step": 306248, "epoch": 1822} {"train_loss": -12.026875495910645, "global_step": 306249, "epoch": 1822} {"train_loss": -11.488119125366211, "global_step": 306250, "epoch": 1822} {"train_loss": -12.245065689086914, "global_step": 306251, "epoch": 1822} {"train_loss": -11.776382446289062, "global_step": 306252, "epoch": 1822} {"train_loss": -11.609338760375977, "global_step": 306253, "epoch": 1822} {"train_loss": -12.223655700683594, "global_step": 306254, "epoch": 1822} {"train_loss": -11.577887535095215, "global_step": 306255, "epoch": 1822} {"train_loss": -11.809823989868164, "global_step": 306256, "epoch": 1822} {"train_loss": -11.774432182312012, "global_step": 306257, "epoch": 1822} {"train_loss": -10.686768531799316, "global_step": 306258, "epoch": 1822} {"train_loss": -11.528644561767578, "global_step": 306259, "epoch": 1822} {"train_loss": -10.611773490905762, "global_step": 306260, "epoch": 1822} {"train_loss": -10.71212100982666, "global_step": 306261, "epoch": 1822} {"train_loss": -11.161273956298828, "global_step": 306262, "epoch": 1822} {"train_loss": -11.8535125823248, "global_step": 306263, "epoch": 1822, "val_loss": 282860.40625} {"train_loss": -10.76756477355957, "global_step": 306264, "epoch": 1823} {"train_loss": -8.66031551361084, "global_step": 306265, "epoch": 1823} {"train_loss": -7.18098258972168, "global_step": 306266, "epoch": 1823} {"train_loss": -7.185247421264648, "global_step": 306267, "epoch": 1823} {"train_loss": -8.394512176513672, "global_step": 306268, "epoch": 1823} {"train_loss": -8.381160736083984, "global_step": 306269, "epoch": 1823} {"train_loss": -9.025009155273438, "global_step": 306270, "epoch": 1823} {"train_loss": -8.323049545288086, "global_step": 306271, "epoch": 1823} {"train_loss": -8.144596099853516, "global_step": 306272, "epoch": 1823} {"train_loss": -8.523062705993652, "global_step": 306273, "epoch": 1823} {"train_loss": -9.202986717224121, "global_step": 306274, "epoch": 1823} {"train_loss": -9.505462646484375, "global_step": 306275, "epoch": 1823} {"train_loss": -10.022679328918457, "global_step": 306276, "epoch": 1823} {"train_loss": -9.40353775024414, "global_step": 306277, "epoch": 1823} {"train_loss": -10.712724685668945, "global_step": 306278, "epoch": 1823} {"train_loss": -9.954861640930176, "global_step": 306279, "epoch": 1823} {"train_loss": -9.501773834228516, "global_step": 306280, "epoch": 1823} {"train_loss": -10.244832992553711, "global_step": 306281, "epoch": 1823} {"train_loss": -9.678754806518555, "global_step": 306282, "epoch": 1823} {"train_loss": -9.15888500213623, "global_step": 306283, "epoch": 1823} {"train_loss": -10.82309341430664, "global_step": 306284, "epoch": 1823} {"train_loss": -10.43764877319336, "global_step": 306285, "epoch": 1823} {"train_loss": -10.529285430908203, "global_step": 306286, "epoch": 1823} {"train_loss": -10.889694213867188, "global_step": 306287, "epoch": 1823} {"train_loss": -11.034120559692383, "global_step": 306288, "epoch": 1823} {"train_loss": -10.55500602722168, "global_step": 306289, "epoch": 1823} {"train_loss": -10.578487396240234, "global_step": 306290, "epoch": 1823} {"train_loss": -11.058439254760742, "global_step": 306291, "epoch": 1823} {"train_loss": -10.036155700683594, "global_step": 306292, "epoch": 1823} {"train_loss": -11.418954849243164, "global_step": 306293, "epoch": 1823} {"train_loss": -10.791200637817383, "global_step": 306294, "epoch": 1823} {"train_loss": -11.579345703125, "global_step": 306295, "epoch": 1823} {"train_loss": -11.334096908569336, "global_step": 306296, "epoch": 1823} {"train_loss": -11.159831047058105, "global_step": 306297, "epoch": 1823} {"train_loss": -11.257474899291992, "global_step": 306298, "epoch": 1823} {"train_loss": -11.029926300048828, "global_step": 306299, "epoch": 1823} {"train_loss": -11.30343246459961, "global_step": 306300, "epoch": 1823} {"train_loss": -11.105035781860352, "global_step": 306301, "epoch": 1823} {"train_loss": -11.44652271270752, "global_step": 306302, "epoch": 1823} {"train_loss": -11.415661811828613, "global_step": 306303, "epoch": 1823} {"train_loss": -11.45524787902832, "global_step": 306304, "epoch": 1823} {"train_loss": -11.143318176269531, "global_step": 306305, "epoch": 1823} {"train_loss": -11.400423049926758, "global_step": 306306, "epoch": 1823} {"train_loss": -11.64412784576416, "global_step": 306307, "epoch": 1823} {"train_loss": -10.876583099365234, "global_step": 306308, "epoch": 1823} {"train_loss": -11.480292320251465, "global_step": 306309, "epoch": 1823} {"train_loss": -11.005921363830566, "global_step": 306310, "epoch": 1823} {"train_loss": -11.438060760498047, "global_step": 306311, "epoch": 1823} {"train_loss": -11.438440322875977, "global_step": 306312, "epoch": 1823} {"train_loss": -11.365850448608398, "global_step": 306313, "epoch": 1823} {"train_loss": -11.667129516601562, "global_step": 306314, "epoch": 1823} {"train_loss": -11.258871078491211, "global_step": 306315, "epoch": 1823} {"train_loss": -11.723379135131836, "global_step": 306316, "epoch": 1823} {"train_loss": -11.803593635559082, "global_step": 306317, "epoch": 1823} {"train_loss": -11.30943489074707, "global_step": 306318, "epoch": 1823} {"train_loss": -11.89108943939209, "global_step": 306319, "epoch": 1823} {"train_loss": -11.778806686401367, "global_step": 306320, "epoch": 1823} {"train_loss": -11.31100845336914, "global_step": 306321, "epoch": 1823} {"train_loss": -11.96304702758789, "global_step": 306322, "epoch": 1823} {"train_loss": -11.601856231689453, "global_step": 306323, "epoch": 1823} {"train_loss": -11.79255485534668, "global_step": 306324, "epoch": 1823} {"train_loss": -11.83919906616211, "global_step": 306325, "epoch": 1823} {"train_loss": -11.677827835083008, "global_step": 306326, "epoch": 1823} {"train_loss": -11.884466171264648, "global_step": 306327, "epoch": 1823} {"train_loss": -11.663878440856934, "global_step": 306328, "epoch": 1823} {"train_loss": -11.960260391235352, "global_step": 306329, "epoch": 1823} {"train_loss": -12.027645111083984, "global_step": 306330, "epoch": 1823} {"train_loss": -11.88550090789795, "global_step": 306331, "epoch": 1823} {"train_loss": -11.965337753295898, "global_step": 306332, "epoch": 1823} {"train_loss": -11.703832626342773, "global_step": 306333, "epoch": 1823} {"train_loss": -11.899502754211426, "global_step": 306334, "epoch": 1823} {"train_loss": -11.903949737548828, "global_step": 306335, "epoch": 1823} {"train_loss": -11.811063766479492, "global_step": 306336, "epoch": 1823} {"train_loss": -11.82309341430664, "global_step": 306337, "epoch": 1823} {"train_loss": -11.788930892944336, "global_step": 306338, "epoch": 1823} {"train_loss": -11.939119338989258, "global_step": 306339, "epoch": 1823} {"train_loss": -11.941344261169434, "global_step": 306340, "epoch": 1823} {"train_loss": -12.107568740844727, "global_step": 306341, "epoch": 1823} {"train_loss": -11.88836669921875, "global_step": 306342, "epoch": 1823} {"train_loss": -12.049232482910156, "global_step": 306343, "epoch": 1823} {"train_loss": -12.0941162109375, "global_step": 306344, "epoch": 1823} {"train_loss": -12.046960830688477, "global_step": 306345, "epoch": 1823} {"train_loss": -12.081457138061523, "global_step": 306346, "epoch": 1823} {"train_loss": -11.995113372802734, "global_step": 306347, "epoch": 1823} {"train_loss": -12.158580780029297, "global_step": 306348, "epoch": 1823} {"train_loss": -12.159223556518555, "global_step": 306349, "epoch": 1823} {"train_loss": -12.203194618225098, "global_step": 306350, "epoch": 1823} {"train_loss": -12.12041187286377, "global_step": 306351, "epoch": 1823} {"train_loss": -12.365564346313477, "global_step": 306352, "epoch": 1823} {"train_loss": -12.069156646728516, "global_step": 306353, "epoch": 1823} {"train_loss": -11.996441841125488, "global_step": 306354, "epoch": 1823} {"train_loss": -12.304991722106934, "global_step": 306355, "epoch": 1823} {"train_loss": -12.233192443847656, "global_step": 306356, "epoch": 1823} {"train_loss": -11.944095611572266, "global_step": 306357, "epoch": 1823} {"train_loss": -12.148515701293945, "global_step": 306358, "epoch": 1823} {"train_loss": -11.723896980285645, "global_step": 306359, "epoch": 1823} {"train_loss": -12.160443305969238, "global_step": 306360, "epoch": 1823} {"train_loss": -12.189239501953125, "global_step": 306361, "epoch": 1823} {"train_loss": -12.035107612609863, "global_step": 306362, "epoch": 1823} {"train_loss": -12.426724433898926, "global_step": 306363, "epoch": 1823} {"train_loss": -12.167418479919434, "global_step": 306364, "epoch": 1823} {"train_loss": -12.265237808227539, "global_step": 306365, "epoch": 1823} {"train_loss": -12.217098236083984, "global_step": 306366, "epoch": 1823} {"train_loss": -12.266851425170898, "global_step": 306367, "epoch": 1823} {"train_loss": -12.17193603515625, "global_step": 306368, "epoch": 1823} {"train_loss": -12.148859024047852, "global_step": 306369, "epoch": 1823} {"train_loss": -12.180908203125, "global_step": 306370, "epoch": 1823} {"train_loss": -12.138237953186035, "global_step": 306371, "epoch": 1823} {"train_loss": -12.268701553344727, "global_step": 306372, "epoch": 1823} {"train_loss": -12.368634223937988, "global_step": 306373, "epoch": 1823} {"train_loss": -11.800450325012207, "global_step": 306374, "epoch": 1823} {"train_loss": -12.358823776245117, "global_step": 306375, "epoch": 1823} {"train_loss": -12.08944320678711, "global_step": 306376, "epoch": 1823} {"train_loss": -11.86674690246582, "global_step": 306377, "epoch": 1823} {"train_loss": -12.113323211669922, "global_step": 306378, "epoch": 1823} {"train_loss": -12.041799545288086, "global_step": 306379, "epoch": 1823} {"train_loss": -12.4090576171875, "global_step": 306380, "epoch": 1823} {"train_loss": -12.278902053833008, "global_step": 306381, "epoch": 1823} {"train_loss": -12.253018379211426, "global_step": 306382, "epoch": 1823} {"train_loss": -12.184162139892578, "global_step": 306383, "epoch": 1823} {"train_loss": -12.310965538024902, "global_step": 306384, "epoch": 1823} {"train_loss": -12.023884773254395, "global_step": 306385, "epoch": 1823} {"train_loss": -12.435667037963867, "global_step": 306386, "epoch": 1823} {"train_loss": -12.170951843261719, "global_step": 306387, "epoch": 1823} {"train_loss": -11.989381790161133, "global_step": 306388, "epoch": 1823} {"train_loss": -12.078902244567871, "global_step": 306389, "epoch": 1823} {"train_loss": -11.98853874206543, "global_step": 306390, "epoch": 1823} {"train_loss": -12.192094802856445, "global_step": 306391, "epoch": 1823} {"train_loss": -12.248805046081543, "global_step": 306392, "epoch": 1823} {"train_loss": -12.443981170654297, "global_step": 306393, "epoch": 1823} {"train_loss": -12.234373092651367, "global_step": 306394, "epoch": 1823} {"train_loss": -12.258338928222656, "global_step": 306395, "epoch": 1823} {"train_loss": -12.151361465454102, "global_step": 306396, "epoch": 1823} {"train_loss": -11.804946899414062, "global_step": 306397, "epoch": 1823} {"train_loss": -11.780399322509766, "global_step": 306398, "epoch": 1823} {"train_loss": -12.298519134521484, "global_step": 306399, "epoch": 1823} {"train_loss": -12.065281867980957, "global_step": 306400, "epoch": 1823} {"train_loss": -11.929462432861328, "global_step": 306401, "epoch": 1823} {"train_loss": -11.962576866149902, "global_step": 306402, "epoch": 1823} {"train_loss": -12.034695625305176, "global_step": 306403, "epoch": 1823} {"train_loss": -11.937840461730957, "global_step": 306404, "epoch": 1823} {"train_loss": -11.903926849365234, "global_step": 306405, "epoch": 1823} {"train_loss": -12.136338233947754, "global_step": 306406, "epoch": 1823} {"train_loss": -12.104279518127441, "global_step": 306407, "epoch": 1823} {"train_loss": -12.075809478759766, "global_step": 306408, "epoch": 1823} {"train_loss": -11.834909439086914, "global_step": 306409, "epoch": 1823} {"train_loss": -12.01121997833252, "global_step": 306410, "epoch": 1823} {"train_loss": -12.233919143676758, "global_step": 306411, "epoch": 1823} {"train_loss": -12.21839714050293, "global_step": 306412, "epoch": 1823} {"train_loss": -12.293852806091309, "global_step": 306413, "epoch": 1823} {"train_loss": -12.347789764404297, "global_step": 306414, "epoch": 1823} {"train_loss": -12.344834327697754, "global_step": 306415, "epoch": 1823} {"train_loss": -12.123064994812012, "global_step": 306416, "epoch": 1823} {"train_loss": -12.24505615234375, "global_step": 306417, "epoch": 1823} {"train_loss": -12.302156448364258, "global_step": 306418, "epoch": 1823} {"train_loss": -12.124246597290039, "global_step": 306419, "epoch": 1823} {"train_loss": -12.021978378295898, "global_step": 306420, "epoch": 1823} {"train_loss": -12.313733100891113, "global_step": 306421, "epoch": 1823} {"train_loss": -12.21335220336914, "global_step": 306422, "epoch": 1823} {"train_loss": -12.369199752807617, "global_step": 306423, "epoch": 1823} {"train_loss": -12.394279479980469, "global_step": 306424, "epoch": 1823} {"train_loss": -12.242643356323242, "global_step": 306425, "epoch": 1823} {"train_loss": -12.45543098449707, "global_step": 306426, "epoch": 1823} {"train_loss": -12.036864280700684, "global_step": 306427, "epoch": 1823} {"train_loss": -12.447969436645508, "global_step": 306428, "epoch": 1823} {"train_loss": -11.963777542114258, "global_step": 306429, "epoch": 1823} {"train_loss": -12.240428924560547, "global_step": 306430, "epoch": 1823} {"train_loss": -11.53726651555016, "global_step": 306431, "epoch": 1823, "val_loss": 281303.25} {"train_loss": -11.863986015319824, "global_step": 306432, "epoch": 1824} {"train_loss": -12.08023452758789, "global_step": 306433, "epoch": 1824} {"train_loss": -12.260444641113281, "global_step": 306434, "epoch": 1824} {"train_loss": -12.46656608581543, "global_step": 306435, "epoch": 1824} {"train_loss": -12.156975746154785, "global_step": 306436, "epoch": 1824} {"train_loss": -11.953824996948242, "global_step": 306437, "epoch": 1824} {"train_loss": -12.057079315185547, "global_step": 306438, "epoch": 1824} {"train_loss": -11.420209884643555, "global_step": 306439, "epoch": 1824} {"train_loss": -11.309530258178711, "global_step": 306440, "epoch": 1824} {"train_loss": -12.351306915283203, "global_step": 306441, "epoch": 1824} {"train_loss": -11.423261642456055, "global_step": 306442, "epoch": 1824} {"train_loss": -10.935808181762695, "global_step": 306443, "epoch": 1824} {"train_loss": -11.264225006103516, "global_step": 306444, "epoch": 1824} {"train_loss": -11.604740142822266, "global_step": 306445, "epoch": 1824} {"train_loss": -10.97457504272461, "global_step": 306446, "epoch": 1824} {"train_loss": -10.359407424926758, "global_step": 306447, "epoch": 1824} {"train_loss": -10.454352378845215, "global_step": 306448, "epoch": 1824} {"train_loss": -11.6614990234375, "global_step": 306449, "epoch": 1824} {"train_loss": -11.32377815246582, "global_step": 306450, "epoch": 1824} {"train_loss": -11.935523986816406, "global_step": 306451, "epoch": 1824} {"train_loss": -11.314547538757324, "global_step": 306452, "epoch": 1824} {"train_loss": -11.216976165771484, "global_step": 306453, "epoch": 1824} {"train_loss": -11.269813537597656, "global_step": 306454, "epoch": 1824} {"train_loss": -11.820798873901367, "global_step": 306455, "epoch": 1824} {"train_loss": -11.945074081420898, "global_step": 306456, "epoch": 1824} {"train_loss": -11.803367614746094, "global_step": 306457, "epoch": 1824} {"train_loss": -12.06320858001709, "global_step": 306458, "epoch": 1824} {"train_loss": -11.887775421142578, "global_step": 306459, "epoch": 1824} {"train_loss": -11.766168594360352, "global_step": 306460, "epoch": 1824} {"train_loss": -12.022290229797363, "global_step": 306461, "epoch": 1824} {"train_loss": -11.664079666137695, "global_step": 306462, "epoch": 1824} {"train_loss": -11.708654403686523, "global_step": 306463, "epoch": 1824} {"train_loss": -11.785409927368164, "global_step": 306464, "epoch": 1824} {"train_loss": -11.812471389770508, "global_step": 306465, "epoch": 1824} {"train_loss": -11.826488494873047, "global_step": 306466, "epoch": 1824} {"train_loss": -12.103955268859863, "global_step": 306467, "epoch": 1824} {"train_loss": -11.886098861694336, "global_step": 306468, "epoch": 1824} {"train_loss": -12.050758361816406, "global_step": 306469, "epoch": 1824} {"train_loss": -12.202287673950195, "global_step": 306470, "epoch": 1824} {"train_loss": -12.027900695800781, "global_step": 306471, "epoch": 1824} {"train_loss": -12.277816772460938, "global_step": 306472, "epoch": 1824} {"train_loss": -12.186028480529785, "global_step": 306473, "epoch": 1824} {"train_loss": -12.20826530456543, "global_step": 306474, "epoch": 1824} {"train_loss": -12.077262878417969, "global_step": 306475, "epoch": 1824} {"train_loss": -12.201469421386719, "global_step": 306476, "epoch": 1824} {"train_loss": -12.261411666870117, "global_step": 306477, "epoch": 1824} {"train_loss": -12.314846992492676, "global_step": 306478, "epoch": 1824} {"train_loss": -12.184179306030273, "global_step": 306479, "epoch": 1824} {"train_loss": -12.58343505859375, "global_step": 306480, "epoch": 1824} {"train_loss": -12.00179672241211, "global_step": 306481, "epoch": 1824} {"train_loss": -12.134005546569824, "global_step": 306482, "epoch": 1824} {"train_loss": -12.339791297912598, "global_step": 306483, "epoch": 1824} {"train_loss": -12.159516334533691, "global_step": 306484, "epoch": 1824} {"train_loss": -12.149364471435547, "global_step": 306485, "epoch": 1824} {"train_loss": -12.368085861206055, "global_step": 306486, "epoch": 1824} {"train_loss": -12.039403915405273, "global_step": 306487, "epoch": 1824} {"train_loss": -11.976181983947754, "global_step": 306488, "epoch": 1824} {"train_loss": -12.27680492401123, "global_step": 306489, "epoch": 1824} {"train_loss": -12.166723251342773, "global_step": 306490, "epoch": 1824} {"train_loss": -12.23637866973877, "global_step": 306491, "epoch": 1824} {"train_loss": -11.962056159973145, "global_step": 306492, "epoch": 1824} {"train_loss": -12.25286865234375, "global_step": 306493, "epoch": 1824} {"train_loss": -12.422468185424805, "global_step": 306494, "epoch": 1824} {"train_loss": -11.971517562866211, "global_step": 306495, "epoch": 1824} {"train_loss": -12.262975692749023, "global_step": 306496, "epoch": 1824} {"train_loss": -12.266571998596191, "global_step": 306497, "epoch": 1824} {"train_loss": -12.36250114440918, "global_step": 306498, "epoch": 1824} {"train_loss": -12.318445205688477, "global_step": 306499, "epoch": 1824} {"train_loss": -12.465618133544922, "global_step": 306500, "epoch": 1824} {"train_loss": -12.156194686889648, "global_step": 306501, "epoch": 1824} {"train_loss": -12.468435287475586, "global_step": 306502, "epoch": 1824} {"train_loss": -12.345260620117188, "global_step": 306503, "epoch": 1824} {"train_loss": -12.440581321716309, "global_step": 306504, "epoch": 1824} {"train_loss": -12.355400085449219, "global_step": 306505, "epoch": 1824} {"train_loss": -12.002359390258789, "global_step": 306506, "epoch": 1824} {"train_loss": -12.350750923156738, "global_step": 306507, "epoch": 1824} {"train_loss": -12.23543930053711, "global_step": 306508, "epoch": 1824} {"train_loss": -12.334115982055664, "global_step": 306509, "epoch": 1824} {"train_loss": -12.128056526184082, "global_step": 306510, "epoch": 1824} {"train_loss": -12.066176414489746, "global_step": 306511, "epoch": 1824} {"train_loss": -12.163426399230957, "global_step": 306512, "epoch": 1824} {"train_loss": -12.17245101928711, "global_step": 306513, "epoch": 1824} {"train_loss": -11.700647354125977, "global_step": 306514, "epoch": 1824} {"train_loss": -11.599241256713867, "global_step": 306515, "epoch": 1824} {"train_loss": -12.179560661315918, "global_step": 306516, "epoch": 1824} {"train_loss": -11.832686424255371, "global_step": 306517, "epoch": 1824} {"train_loss": -11.207499504089355, "global_step": 306518, "epoch": 1824} {"train_loss": -10.460441589355469, "global_step": 306519, "epoch": 1824} {"train_loss": -11.835006713867188, "global_step": 306520, "epoch": 1824} {"train_loss": -11.561809539794922, "global_step": 306521, "epoch": 1824} {"train_loss": -11.400396347045898, "global_step": 306522, "epoch": 1824} {"train_loss": -11.345184326171875, "global_step": 306523, "epoch": 1824} {"train_loss": -12.508779525756836, "global_step": 306524, "epoch": 1824} {"train_loss": -11.332027435302734, "global_step": 306525, "epoch": 1824} {"train_loss": -10.620304107666016, "global_step": 306526, "epoch": 1824} {"train_loss": -11.671842575073242, "global_step": 306527, "epoch": 1824} {"train_loss": -11.551156044006348, "global_step": 306528, "epoch": 1824} {"train_loss": -10.231861114501953, "global_step": 306529, "epoch": 1824} {"train_loss": -9.834860801696777, "global_step": 306530, "epoch": 1824} {"train_loss": -11.64112663269043, "global_step": 306531, "epoch": 1824} {"train_loss": -8.848257064819336, "global_step": 306532, "epoch": 1824} {"train_loss": -10.31590461730957, "global_step": 306533, "epoch": 1824} {"train_loss": -10.562368392944336, "global_step": 306534, "epoch": 1824} {"train_loss": -10.97807502746582, "global_step": 306535, "epoch": 1824} {"train_loss": -9.711350440979004, "global_step": 306536, "epoch": 1824} {"train_loss": -11.076622009277344, "global_step": 306537, "epoch": 1824} {"train_loss": -10.47303581237793, "global_step": 306538, "epoch": 1824} {"train_loss": -10.504021644592285, "global_step": 306539, "epoch": 1824} {"train_loss": -11.646585464477539, "global_step": 306540, "epoch": 1824} {"train_loss": -11.305306434631348, "global_step": 306541, "epoch": 1824} {"train_loss": -11.328439712524414, "global_step": 306542, "epoch": 1824} {"train_loss": -11.39870548248291, "global_step": 306543, "epoch": 1824} {"train_loss": -11.047462463378906, "global_step": 306544, "epoch": 1824} {"train_loss": -11.735795974731445, "global_step": 306545, "epoch": 1824} {"train_loss": -11.563621520996094, "global_step": 306546, "epoch": 1824} {"train_loss": -11.514739990234375, "global_step": 306547, "epoch": 1824} {"train_loss": -11.391300201416016, "global_step": 306548, "epoch": 1824} {"train_loss": -11.673198699951172, "global_step": 306549, "epoch": 1824} {"train_loss": -11.482112884521484, "global_step": 306550, "epoch": 1824} {"train_loss": -11.689348220825195, "global_step": 306551, "epoch": 1824} {"train_loss": -11.917325019836426, "global_step": 306552, "epoch": 1824} {"train_loss": -11.494558334350586, "global_step": 306553, "epoch": 1824} {"train_loss": -11.954689025878906, "global_step": 306554, "epoch": 1824} {"train_loss": -11.396608352661133, "global_step": 306555, "epoch": 1824} {"train_loss": -11.728158950805664, "global_step": 306556, "epoch": 1824} {"train_loss": -11.926799774169922, "global_step": 306557, "epoch": 1824} {"train_loss": -12.1029691696167, "global_step": 306558, "epoch": 1824} {"train_loss": -11.934626579284668, "global_step": 306559, "epoch": 1824} {"train_loss": -11.737910270690918, "global_step": 306560, "epoch": 1824} {"train_loss": -11.866613388061523, "global_step": 306561, "epoch": 1824} {"train_loss": -12.007713317871094, "global_step": 306562, "epoch": 1824} {"train_loss": -12.249906539916992, "global_step": 306563, "epoch": 1824} {"train_loss": -12.223525047302246, "global_step": 306564, "epoch": 1824} {"train_loss": -11.890708923339844, "global_step": 306565, "epoch": 1824} {"train_loss": -12.379623413085938, "global_step": 306566, "epoch": 1824} {"train_loss": -12.219919204711914, "global_step": 306567, "epoch": 1824} {"train_loss": -12.082908630371094, "global_step": 306568, "epoch": 1824} {"train_loss": -11.974309921264648, "global_step": 306569, "epoch": 1824} {"train_loss": -11.813444137573242, "global_step": 306570, "epoch": 1824} {"train_loss": -12.246971130371094, "global_step": 306571, "epoch": 1824} {"train_loss": -11.96514892578125, "global_step": 306572, "epoch": 1824} {"train_loss": -12.301761627197266, "global_step": 306573, "epoch": 1824} {"train_loss": -12.054630279541016, "global_step": 306574, "epoch": 1824} {"train_loss": -11.926534652709961, "global_step": 306575, "epoch": 1824} {"train_loss": -12.351993560791016, "global_step": 306576, "epoch": 1824} {"train_loss": -12.156023025512695, "global_step": 306577, "epoch": 1824} {"train_loss": -12.29100227355957, "global_step": 306578, "epoch": 1824} {"train_loss": -12.135892868041992, "global_step": 306579, "epoch": 1824} {"train_loss": -12.285642623901367, "global_step": 306580, "epoch": 1824} {"train_loss": -11.831632614135742, "global_step": 306581, "epoch": 1824} {"train_loss": -12.218928337097168, "global_step": 306582, "epoch": 1824} {"train_loss": -12.156601905822754, "global_step": 306583, "epoch": 1824} {"train_loss": -12.228680610656738, "global_step": 306584, "epoch": 1824} {"train_loss": -12.231861114501953, "global_step": 306585, "epoch": 1824} {"train_loss": -12.338336944580078, "global_step": 306586, "epoch": 1824} {"train_loss": -12.404594421386719, "global_step": 306587, "epoch": 1824} {"train_loss": -12.196477890014648, "global_step": 306588, "epoch": 1824} {"train_loss": -12.150710105895996, "global_step": 306589, "epoch": 1824} {"train_loss": -12.266295433044434, "global_step": 306590, "epoch": 1824} {"train_loss": -12.278358459472656, "global_step": 306591, "epoch": 1824} {"train_loss": -12.548027992248535, "global_step": 306592, "epoch": 1824} {"train_loss": -12.221816062927246, "global_step": 306593, "epoch": 1824} {"train_loss": -12.393933296203613, "global_step": 306594, "epoch": 1824} {"train_loss": -12.384563446044922, "global_step": 306595, "epoch": 1824} {"train_loss": -12.143566131591797, "global_step": 306596, "epoch": 1824} {"train_loss": -12.37629222869873, "global_step": 306597, "epoch": 1824} {"train_loss": -12.313285827636719, "global_step": 306598, "epoch": 1824} {"train_loss": -11.834010487511044, "global_step": 306599, "epoch": 1824, "val_loss": 281194.6875} {"train_loss": -11.841068267822266, "global_step": 306600, "epoch": 1825} {"train_loss": -12.367189407348633, "global_step": 306601, "epoch": 1825} {"train_loss": -11.990920066833496, "global_step": 306602, "epoch": 1825} {"train_loss": -12.349700927734375, "global_step": 306603, "epoch": 1825} {"train_loss": -11.812291145324707, "global_step": 306604, "epoch": 1825} {"train_loss": -12.272945404052734, "global_step": 306605, "epoch": 1825} {"train_loss": -11.459784507751465, "global_step": 306606, "epoch": 1825} {"train_loss": -12.271139144897461, "global_step": 306607, "epoch": 1825} {"train_loss": -12.114618301391602, "global_step": 306608, "epoch": 1825} {"train_loss": -11.859888076782227, "global_step": 306609, "epoch": 1825} {"train_loss": -12.003376960754395, "global_step": 306610, "epoch": 1825} {"train_loss": -11.478574752807617, "global_step": 306611, "epoch": 1825} {"train_loss": -11.972187042236328, "global_step": 306612, "epoch": 1825} {"train_loss": -11.976089477539062, "global_step": 306613, "epoch": 1825} {"train_loss": -12.204536437988281, "global_step": 306614, "epoch": 1825} {"train_loss": -12.061418533325195, "global_step": 306615, "epoch": 1825} {"train_loss": -12.279871940612793, "global_step": 306616, "epoch": 1825} {"train_loss": -12.297002792358398, "global_step": 306617, "epoch": 1825} {"train_loss": -11.883550643920898, "global_step": 306618, "epoch": 1825} {"train_loss": -12.298053741455078, "global_step": 306619, "epoch": 1825} {"train_loss": -12.010368347167969, "global_step": 306620, "epoch": 1825} {"train_loss": -12.199454307556152, "global_step": 306621, "epoch": 1825} {"train_loss": -12.48360824584961, "global_step": 306622, "epoch": 1825} {"train_loss": -12.068778991699219, "global_step": 306623, "epoch": 1825} {"train_loss": -11.734247207641602, "global_step": 306624, "epoch": 1825} {"train_loss": -12.694642066955566, "global_step": 306625, "epoch": 1825} {"train_loss": -11.872946739196777, "global_step": 306626, "epoch": 1825} {"train_loss": -11.46473503112793, "global_step": 306627, "epoch": 1825} {"train_loss": -11.522452354431152, "global_step": 306628, "epoch": 1825} {"train_loss": -12.402899742126465, "global_step": 306629, "epoch": 1825} {"train_loss": -11.980094909667969, "global_step": 306630, "epoch": 1825} {"train_loss": -12.41905403137207, "global_step": 306631, "epoch": 1825} {"train_loss": -11.794487953186035, "global_step": 306632, "epoch": 1825} {"train_loss": -11.752163887023926, "global_step": 306633, "epoch": 1825} {"train_loss": -12.104299545288086, "global_step": 306634, "epoch": 1825} {"train_loss": -12.022732734680176, "global_step": 306635, "epoch": 1825} {"train_loss": -12.195474624633789, "global_step": 306636, "epoch": 1825} {"train_loss": -12.172794342041016, "global_step": 306637, "epoch": 1825} {"train_loss": -12.208684921264648, "global_step": 306638, "epoch": 1825} {"train_loss": -12.37547492980957, "global_step": 306639, "epoch": 1825} {"train_loss": -12.22386360168457, "global_step": 306640, "epoch": 1825} {"train_loss": -12.494484901428223, "global_step": 306641, "epoch": 1825} {"train_loss": -12.224334716796875, "global_step": 306642, "epoch": 1825} {"train_loss": -12.491717338562012, "global_step": 306643, "epoch": 1825} {"train_loss": -12.188216209411621, "global_step": 306644, "epoch": 1825} {"train_loss": -12.149775505065918, "global_step": 306645, "epoch": 1825} {"train_loss": -12.260724067687988, "global_step": 306646, "epoch": 1825} {"train_loss": -12.522014617919922, "global_step": 306647, "epoch": 1825} {"train_loss": -12.230177879333496, "global_step": 306648, "epoch": 1825} {"train_loss": -12.410120010375977, "global_step": 306649, "epoch": 1825} {"train_loss": -12.13851547241211, "global_step": 306650, "epoch": 1825} {"train_loss": -12.505733489990234, "global_step": 306651, "epoch": 1825} {"train_loss": -12.403074264526367, "global_step": 306652, "epoch": 1825} {"train_loss": -12.216466903686523, "global_step": 306653, "epoch": 1825} {"train_loss": -12.56425666809082, "global_step": 306654, "epoch": 1825} {"train_loss": -12.444753646850586, "global_step": 306655, "epoch": 1825} {"train_loss": -12.554399490356445, "global_step": 306656, "epoch": 1825} {"train_loss": -12.2736177444458, "global_step": 306657, "epoch": 1825} {"train_loss": -12.496397018432617, "global_step": 306658, "epoch": 1825} {"train_loss": -12.415966033935547, "global_step": 306659, "epoch": 1825} {"train_loss": -12.32890796661377, "global_step": 306660, "epoch": 1825} {"train_loss": -12.471122741699219, "global_step": 306661, "epoch": 1825} {"train_loss": -12.25468635559082, "global_step": 306662, "epoch": 1825} {"train_loss": -12.405277252197266, "global_step": 306663, "epoch": 1825} {"train_loss": -12.435248374938965, "global_step": 306664, "epoch": 1825} {"train_loss": -12.437211036682129, "global_step": 306665, "epoch": 1825} {"train_loss": -12.158515930175781, "global_step": 306666, "epoch": 1825} {"train_loss": -12.4180908203125, "global_step": 306667, "epoch": 1825} {"train_loss": -11.509183883666992, "global_step": 306668, "epoch": 1825} {"train_loss": -11.932751655578613, "global_step": 306669, "epoch": 1825} {"train_loss": -11.943427085876465, "global_step": 306670, "epoch": 1825} {"train_loss": -12.454182624816895, "global_step": 306671, "epoch": 1825} {"train_loss": -12.109556198120117, "global_step": 306672, "epoch": 1825} {"train_loss": -12.320399284362793, "global_step": 306673, "epoch": 1825} {"train_loss": -11.82482624053955, "global_step": 306674, "epoch": 1825} {"train_loss": -12.4466552734375, "global_step": 306675, "epoch": 1825} {"train_loss": -12.044058799743652, "global_step": 306676, "epoch": 1825} {"train_loss": -12.199575424194336, "global_step": 306677, "epoch": 1825} {"train_loss": -11.891796112060547, "global_step": 306678, "epoch": 1825} {"train_loss": -12.290580749511719, "global_step": 306679, "epoch": 1825} {"train_loss": -11.306966781616211, "global_step": 306680, "epoch": 1825} {"train_loss": -11.214261054992676, "global_step": 306681, "epoch": 1825} {"train_loss": -12.170395851135254, "global_step": 306682, "epoch": 1825} {"train_loss": -9.82232666015625, "global_step": 306683, "epoch": 1825} {"train_loss": -10.413040161132812, "global_step": 306684, "epoch": 1825} {"train_loss": -7.60967493057251, "global_step": 306685, "epoch": 1825} {"train_loss": -7.63943338394165, "global_step": 306686, "epoch": 1825} {"train_loss": -6.9656901359558105, "global_step": 306687, "epoch": 1825} {"train_loss": -6.256660461425781, "global_step": 306688, "epoch": 1825} {"train_loss": -6.4920854568481445, "global_step": 306689, "epoch": 1825} {"train_loss": -7.440732002258301, "global_step": 306690, "epoch": 1825} {"train_loss": -7.006979465484619, "global_step": 306691, "epoch": 1825} {"train_loss": -7.137308120727539, "global_step": 306692, "epoch": 1825} {"train_loss": -8.065145492553711, "global_step": 306693, "epoch": 1825} {"train_loss": -7.975715160369873, "global_step": 306694, "epoch": 1825} {"train_loss": -8.148567199707031, "global_step": 306695, "epoch": 1825} {"train_loss": -7.574288368225098, "global_step": 306696, "epoch": 1825} {"train_loss": -8.09986400604248, "global_step": 306697, "epoch": 1825} {"train_loss": -8.017183303833008, "global_step": 306698, "epoch": 1825} {"train_loss": -8.190539360046387, "global_step": 306699, "epoch": 1825} {"train_loss": -8.932440757751465, "global_step": 306700, "epoch": 1825} {"train_loss": -8.59401798248291, "global_step": 306701, "epoch": 1825} {"train_loss": -9.184734344482422, "global_step": 306702, "epoch": 1825} {"train_loss": -9.040594100952148, "global_step": 306703, "epoch": 1825} {"train_loss": -9.203363418579102, "global_step": 306704, "epoch": 1825} {"train_loss": -9.887659072875977, "global_step": 306705, "epoch": 1825} {"train_loss": -9.92816162109375, "global_step": 306706, "epoch": 1825} {"train_loss": -10.388097763061523, "global_step": 306707, "epoch": 1825} {"train_loss": -10.358253479003906, "global_step": 306708, "epoch": 1825} {"train_loss": -10.712093353271484, "global_step": 306709, "epoch": 1825} {"train_loss": -10.068511009216309, "global_step": 306710, "epoch": 1825} {"train_loss": -10.565349578857422, "global_step": 306711, "epoch": 1825} {"train_loss": -9.052397727966309, "global_step": 306712, "epoch": 1825} {"train_loss": -9.88378620147705, "global_step": 306713, "epoch": 1825} {"train_loss": -9.956850051879883, "global_step": 306714, "epoch": 1825} {"train_loss": -9.599461555480957, "global_step": 306715, "epoch": 1825} {"train_loss": -9.626115798950195, "global_step": 306716, "epoch": 1825} {"train_loss": -10.711294174194336, "global_step": 306717, "epoch": 1825} {"train_loss": -10.398035049438477, "global_step": 306718, "epoch": 1825} {"train_loss": -10.346879005432129, "global_step": 306719, "epoch": 1825} {"train_loss": -10.870948791503906, "global_step": 306720, "epoch": 1825} {"train_loss": -10.83411693572998, "global_step": 306721, "epoch": 1825} {"train_loss": -11.141717910766602, "global_step": 306722, "epoch": 1825} {"train_loss": -10.64985466003418, "global_step": 306723, "epoch": 1825} {"train_loss": -11.689126968383789, "global_step": 306724, "epoch": 1825} {"train_loss": -11.330301284790039, "global_step": 306725, "epoch": 1825} {"train_loss": -11.318756103515625, "global_step": 306726, "epoch": 1825} {"train_loss": -11.434937477111816, "global_step": 306727, "epoch": 1825} {"train_loss": -11.56410026550293, "global_step": 306728, "epoch": 1825} {"train_loss": -11.713504791259766, "global_step": 306729, "epoch": 1825} {"train_loss": -11.762712478637695, "global_step": 306730, "epoch": 1825} {"train_loss": -11.447683334350586, "global_step": 306731, "epoch": 1825} {"train_loss": -11.866201400756836, "global_step": 306732, "epoch": 1825} {"train_loss": -11.805741310119629, "global_step": 306733, "epoch": 1825} {"train_loss": -11.708993911743164, "global_step": 306734, "epoch": 1825} {"train_loss": -11.531821250915527, "global_step": 306735, "epoch": 1825} {"train_loss": -11.759990692138672, "global_step": 306736, "epoch": 1825} {"train_loss": -11.834708213806152, "global_step": 306737, "epoch": 1825} {"train_loss": -11.70585823059082, "global_step": 306738, "epoch": 1825} {"train_loss": -11.731964111328125, "global_step": 306739, "epoch": 1825} {"train_loss": -11.63047981262207, "global_step": 306740, "epoch": 1825} {"train_loss": -11.826456069946289, "global_step": 306741, "epoch": 1825} {"train_loss": -11.850377082824707, "global_step": 306742, "epoch": 1825} {"train_loss": -11.768935203552246, "global_step": 306743, "epoch": 1825} {"train_loss": -11.878687858581543, "global_step": 306744, "epoch": 1825} {"train_loss": -11.765960693359375, "global_step": 306745, "epoch": 1825} {"train_loss": -12.042577743530273, "global_step": 306746, "epoch": 1825} {"train_loss": -11.758715629577637, "global_step": 306747, "epoch": 1825} {"train_loss": -11.969841957092285, "global_step": 306748, "epoch": 1825} {"train_loss": -11.960173606872559, "global_step": 306749, "epoch": 1825} {"train_loss": -12.105688095092773, "global_step": 306750, "epoch": 1825} {"train_loss": -12.23331069946289, "global_step": 306751, "epoch": 1825} {"train_loss": -12.089744567871094, "global_step": 306752, "epoch": 1825} {"train_loss": -12.109195709228516, "global_step": 306753, "epoch": 1825} {"train_loss": -12.0368013381958, "global_step": 306754, "epoch": 1825} {"train_loss": -12.247809410095215, "global_step": 306755, "epoch": 1825} {"train_loss": -12.086992263793945, "global_step": 306756, "epoch": 1825} {"train_loss": -12.146530151367188, "global_step": 306757, "epoch": 1825} {"train_loss": -11.824323654174805, "global_step": 306758, "epoch": 1825} {"train_loss": -12.139240264892578, "global_step": 306759, "epoch": 1825} {"train_loss": -12.026253700256348, "global_step": 306760, "epoch": 1825} {"train_loss": -12.03721809387207, "global_step": 306761, "epoch": 1825} {"train_loss": -12.143786430358887, "global_step": 306762, "epoch": 1825} {"train_loss": -12.265353202819824, "global_step": 306763, "epoch": 1825} {"train_loss": -12.223115921020508, "global_step": 306764, "epoch": 1825} {"train_loss": -12.272392272949219, "global_step": 306765, "epoch": 1825} {"train_loss": -12.102226257324219, "global_step": 306766, "epoch": 1825} {"train_loss": -11.332585672537485, "global_step": 306767, "epoch": 1825, "val_loss": 280590.78125, "train_action_mse_error": 3.4881012439727783} {"train_loss": -12.085733413696289, "global_step": 306768, "epoch": 1826} {"train_loss": -12.112953186035156, "global_step": 306769, "epoch": 1826} {"train_loss": -11.989883422851562, "global_step": 306770, "epoch": 1826} {"train_loss": -12.279830932617188, "global_step": 306771, "epoch": 1826} {"train_loss": -12.165724754333496, "global_step": 306772, "epoch": 1826} {"train_loss": -12.257975578308105, "global_step": 306773, "epoch": 1826} {"train_loss": -12.09619426727295, "global_step": 306774, "epoch": 1826} {"train_loss": -12.30021858215332, "global_step": 306775, "epoch": 1826} {"train_loss": -12.282812118530273, "global_step": 306776, "epoch": 1826} {"train_loss": -12.451692581176758, "global_step": 306777, "epoch": 1826} {"train_loss": -12.22674560546875, "global_step": 306778, "epoch": 1826} {"train_loss": -12.39361572265625, "global_step": 306779, "epoch": 1826} {"train_loss": -12.495712280273438, "global_step": 306780, "epoch": 1826} {"train_loss": -12.209122657775879, "global_step": 306781, "epoch": 1826} {"train_loss": -12.428972244262695, "global_step": 306782, "epoch": 1826} {"train_loss": -12.274476051330566, "global_step": 306783, "epoch": 1826} {"train_loss": -12.395822525024414, "global_step": 306784, "epoch": 1826} {"train_loss": -12.336017608642578, "global_step": 306785, "epoch": 1826} {"train_loss": -12.081977844238281, "global_step": 306786, "epoch": 1826} {"train_loss": -12.389955520629883, "global_step": 306787, "epoch": 1826} {"train_loss": -12.374238967895508, "global_step": 306788, "epoch": 1826} {"train_loss": -12.100135803222656, "global_step": 306789, "epoch": 1826} {"train_loss": -12.500761985778809, "global_step": 306790, "epoch": 1826} {"train_loss": -12.336624145507812, "global_step": 306791, "epoch": 1826} {"train_loss": -12.327287673950195, "global_step": 306792, "epoch": 1826} {"train_loss": -12.336264610290527, "global_step": 306793, "epoch": 1826} {"train_loss": -12.41081428527832, "global_step": 306794, "epoch": 1826} {"train_loss": -12.259784698486328, "global_step": 306795, "epoch": 1826} {"train_loss": -12.235746383666992, "global_step": 306796, "epoch": 1826} {"train_loss": -12.293619155883789, "global_step": 306797, "epoch": 1826} {"train_loss": -12.309820175170898, "global_step": 306798, "epoch": 1826} {"train_loss": -12.287700653076172, "global_step": 306799, "epoch": 1826} {"train_loss": -12.3248291015625, "global_step": 306800, "epoch": 1826} {"train_loss": -12.21290111541748, "global_step": 306801, "epoch": 1826} {"train_loss": -12.302568435668945, "global_step": 306802, "epoch": 1826} {"train_loss": -12.251605987548828, "global_step": 306803, "epoch": 1826} {"train_loss": -12.396072387695312, "global_step": 306804, "epoch": 1826} {"train_loss": -12.327908515930176, "global_step": 306805, "epoch": 1826} {"train_loss": -12.12943172454834, "global_step": 306806, "epoch": 1826} {"train_loss": -11.255314826965332, "global_step": 306807, "epoch": 1826} {"train_loss": -12.001375198364258, "global_step": 306808, "epoch": 1826} {"train_loss": -12.079580307006836, "global_step": 306809, "epoch": 1826} {"train_loss": -11.297924041748047, "global_step": 306810, "epoch": 1826} {"train_loss": -10.709615707397461, "global_step": 306811, "epoch": 1826} {"train_loss": -12.296611785888672, "global_step": 306812, "epoch": 1826} {"train_loss": -11.794090270996094, "global_step": 306813, "epoch": 1826} {"train_loss": -11.607975959777832, "global_step": 306814, "epoch": 1826} {"train_loss": -11.596086502075195, "global_step": 306815, "epoch": 1826} {"train_loss": -11.55603313446045, "global_step": 306816, "epoch": 1826} {"train_loss": -11.806295394897461, "global_step": 306817, "epoch": 1826} {"train_loss": -12.146966934204102, "global_step": 306818, "epoch": 1826} {"train_loss": -11.61379337310791, "global_step": 306819, "epoch": 1826} {"train_loss": -11.650065422058105, "global_step": 306820, "epoch": 1826} {"train_loss": -12.304250717163086, "global_step": 306821, "epoch": 1826} {"train_loss": -12.19228744506836, "global_step": 306822, "epoch": 1826} {"train_loss": -12.004219055175781, "global_step": 306823, "epoch": 1826} {"train_loss": -12.30319595336914, "global_step": 306824, "epoch": 1826} {"train_loss": -12.051538467407227, "global_step": 306825, "epoch": 1826} {"train_loss": -12.204883575439453, "global_step": 306826, "epoch": 1826} {"train_loss": -12.288070678710938, "global_step": 306827, "epoch": 1826} {"train_loss": -12.260626792907715, "global_step": 306828, "epoch": 1826} {"train_loss": -12.307557106018066, "global_step": 306829, "epoch": 1826} {"train_loss": -12.225109100341797, "global_step": 306830, "epoch": 1826} {"train_loss": -12.308344841003418, "global_step": 306831, "epoch": 1826} {"train_loss": -12.367469787597656, "global_step": 306832, "epoch": 1826} {"train_loss": -12.155055046081543, "global_step": 306833, "epoch": 1826} {"train_loss": -12.543739318847656, "global_step": 306834, "epoch": 1826} {"train_loss": -12.494163513183594, "global_step": 306835, "epoch": 1826} {"train_loss": -12.424997329711914, "global_step": 306836, "epoch": 1826} {"train_loss": -12.324897766113281, "global_step": 306837, "epoch": 1826} {"train_loss": -12.353752136230469, "global_step": 306838, "epoch": 1826} {"train_loss": -12.233966827392578, "global_step": 306839, "epoch": 1826} {"train_loss": -12.029184341430664, "global_step": 306840, "epoch": 1826} {"train_loss": -12.145769119262695, "global_step": 306841, "epoch": 1826} {"train_loss": -12.420897483825684, "global_step": 306842, "epoch": 1826} {"train_loss": -12.279991149902344, "global_step": 306843, "epoch": 1826} {"train_loss": -12.062211990356445, "global_step": 306844, "epoch": 1826} {"train_loss": -12.104761123657227, "global_step": 306845, "epoch": 1826} {"train_loss": -12.355365753173828, "global_step": 306846, "epoch": 1826} {"train_loss": -12.200691223144531, "global_step": 306847, "epoch": 1826} {"train_loss": -11.936348915100098, "global_step": 306848, "epoch": 1826} {"train_loss": -12.336344718933105, "global_step": 306849, "epoch": 1826} {"train_loss": -12.167582511901855, "global_step": 306850, "epoch": 1826} {"train_loss": -12.371482849121094, "global_step": 306851, "epoch": 1826} {"train_loss": -11.382226943969727, "global_step": 306852, "epoch": 1826} {"train_loss": -12.013331413269043, "global_step": 306853, "epoch": 1826} {"train_loss": -12.41610050201416, "global_step": 306854, "epoch": 1826} {"train_loss": -12.254104614257812, "global_step": 306855, "epoch": 1826} {"train_loss": -12.001842498779297, "global_step": 306856, "epoch": 1826} {"train_loss": -11.985416412353516, "global_step": 306857, "epoch": 1826} {"train_loss": -11.911742210388184, "global_step": 306858, "epoch": 1826} {"train_loss": -12.031208038330078, "global_step": 306859, "epoch": 1826} {"train_loss": -12.094892501831055, "global_step": 306860, "epoch": 1826} {"train_loss": -12.095405578613281, "global_step": 306861, "epoch": 1826} {"train_loss": -11.936908721923828, "global_step": 306862, "epoch": 1826} {"train_loss": -12.4086332321167, "global_step": 306863, "epoch": 1826} {"train_loss": -11.749563217163086, "global_step": 306864, "epoch": 1826} {"train_loss": -11.67161750793457, "global_step": 306865, "epoch": 1826} {"train_loss": -11.249425888061523, "global_step": 306866, "epoch": 1826} {"train_loss": -12.032684326171875, "global_step": 306867, "epoch": 1826} {"train_loss": -10.845073699951172, "global_step": 306868, "epoch": 1826} {"train_loss": -11.809581756591797, "global_step": 306869, "epoch": 1826} {"train_loss": -11.726478576660156, "global_step": 306870, "epoch": 1826} {"train_loss": -11.117588996887207, "global_step": 306871, "epoch": 1826} {"train_loss": -11.258673667907715, "global_step": 306872, "epoch": 1826} {"train_loss": -12.04627799987793, "global_step": 306873, "epoch": 1826} {"train_loss": -11.076371192932129, "global_step": 306874, "epoch": 1826} {"train_loss": -11.592024803161621, "global_step": 306875, "epoch": 1826} {"train_loss": -11.269410133361816, "global_step": 306876, "epoch": 1826} {"train_loss": -11.098408699035645, "global_step": 306877, "epoch": 1826} {"train_loss": -11.979698181152344, "global_step": 306878, "epoch": 1826} {"train_loss": -10.651945114135742, "global_step": 306879, "epoch": 1826} {"train_loss": -10.259382247924805, "global_step": 306880, "epoch": 1826} {"train_loss": -11.601846694946289, "global_step": 306881, "epoch": 1826} {"train_loss": -11.493122100830078, "global_step": 306882, "epoch": 1826} {"train_loss": -11.009943008422852, "global_step": 306883, "epoch": 1826} {"train_loss": -11.412816047668457, "global_step": 306884, "epoch": 1826} {"train_loss": -11.865378379821777, "global_step": 306885, "epoch": 1826} {"train_loss": -11.65237808227539, "global_step": 306886, "epoch": 1826} {"train_loss": -11.533703804016113, "global_step": 306887, "epoch": 1826} {"train_loss": -11.7718505859375, "global_step": 306888, "epoch": 1826} {"train_loss": -11.157669067382812, "global_step": 306889, "epoch": 1826} {"train_loss": -11.499435424804688, "global_step": 306890, "epoch": 1826} {"train_loss": -10.641995429992676, "global_step": 306891, "epoch": 1826} {"train_loss": -11.002161026000977, "global_step": 306892, "epoch": 1826} {"train_loss": -10.882471084594727, "global_step": 306893, "epoch": 1826} {"train_loss": -10.692167282104492, "global_step": 306894, "epoch": 1826} {"train_loss": -10.973492622375488, "global_step": 306895, "epoch": 1826} {"train_loss": -10.632026672363281, "global_step": 306896, "epoch": 1826} {"train_loss": -11.277847290039062, "global_step": 306897, "epoch": 1826} {"train_loss": -10.936980247497559, "global_step": 306898, "epoch": 1826} {"train_loss": -11.166068077087402, "global_step": 306899, "epoch": 1826} {"train_loss": -9.507144927978516, "global_step": 306900, "epoch": 1826} {"train_loss": -10.609572410583496, "global_step": 306901, "epoch": 1826} {"train_loss": -10.736980438232422, "global_step": 306902, "epoch": 1826} {"train_loss": -10.934772491455078, "global_step": 306903, "epoch": 1826} {"train_loss": -10.29887580871582, "global_step": 306904, "epoch": 1826} {"train_loss": -11.504838943481445, "global_step": 306905, "epoch": 1826} {"train_loss": -10.805044174194336, "global_step": 306906, "epoch": 1826} {"train_loss": -11.706356048583984, "global_step": 306907, "epoch": 1826} {"train_loss": -11.319303512573242, "global_step": 306908, "epoch": 1826} {"train_loss": -11.797453880310059, "global_step": 306909, "epoch": 1826} {"train_loss": -11.257781982421875, "global_step": 306910, "epoch": 1826} {"train_loss": -11.813549041748047, "global_step": 306911, "epoch": 1826} {"train_loss": -11.695051193237305, "global_step": 306912, "epoch": 1826} {"train_loss": -11.942042350769043, "global_step": 306913, "epoch": 1826} {"train_loss": -11.468595504760742, "global_step": 306914, "epoch": 1826} {"train_loss": -12.055728912353516, "global_step": 306915, "epoch": 1826} {"train_loss": -11.61739730834961, "global_step": 306916, "epoch": 1826} {"train_loss": -12.072782516479492, "global_step": 306917, "epoch": 1826} {"train_loss": -12.049860000610352, "global_step": 306918, "epoch": 1826} {"train_loss": -12.089609146118164, "global_step": 306919, "epoch": 1826} {"train_loss": -11.95408821105957, "global_step": 306920, "epoch": 1826} {"train_loss": -12.112081527709961, "global_step": 306921, "epoch": 1826} {"train_loss": -12.077954292297363, "global_step": 306922, "epoch": 1826} {"train_loss": -12.137346267700195, "global_step": 306923, "epoch": 1826} {"train_loss": -12.145201683044434, "global_step": 306924, "epoch": 1826} {"train_loss": -11.975112915039062, "global_step": 306925, "epoch": 1826} {"train_loss": -12.238907814025879, "global_step": 306926, "epoch": 1826} {"train_loss": -11.796390533447266, "global_step": 306927, "epoch": 1826} {"train_loss": -12.132293701171875, "global_step": 306928, "epoch": 1826} {"train_loss": -12.170312881469727, "global_step": 306929, "epoch": 1826} {"train_loss": -12.091680526733398, "global_step": 306930, "epoch": 1826} {"train_loss": -12.19729232788086, "global_step": 306931, "epoch": 1826} {"train_loss": -12.009246826171875, "global_step": 306932, "epoch": 1826} {"train_loss": -12.281572341918945, "global_step": 306933, "epoch": 1826} {"train_loss": -12.263086318969727, "global_step": 306934, "epoch": 1826} {"train_loss": -11.871541153816949, "global_step": 306935, "epoch": 1826, "val_loss": 279863.34375} {"train_loss": -12.283138275146484, "global_step": 306936, "epoch": 1827} {"train_loss": -11.945497512817383, "global_step": 306937, "epoch": 1827} {"train_loss": -12.343518257141113, "global_step": 306938, "epoch": 1827} {"train_loss": -12.082023620605469, "global_step": 306939, "epoch": 1827} {"train_loss": -12.547536849975586, "global_step": 306940, "epoch": 1827} {"train_loss": -11.957576751708984, "global_step": 306941, "epoch": 1827} {"train_loss": -12.31466007232666, "global_step": 306942, "epoch": 1827} {"train_loss": -12.357915878295898, "global_step": 306943, "epoch": 1827} {"train_loss": -11.991843223571777, "global_step": 306944, "epoch": 1827} {"train_loss": -12.262898445129395, "global_step": 306945, "epoch": 1827} {"train_loss": -11.925118446350098, "global_step": 306946, "epoch": 1827} {"train_loss": -12.127277374267578, "global_step": 306947, "epoch": 1827} {"train_loss": -12.490419387817383, "global_step": 306948, "epoch": 1827} {"train_loss": -12.289081573486328, "global_step": 306949, "epoch": 1827} {"train_loss": -12.149147033691406, "global_step": 306950, "epoch": 1827} {"train_loss": -12.26368522644043, "global_step": 306951, "epoch": 1827} {"train_loss": -12.20280647277832, "global_step": 306952, "epoch": 1827} {"train_loss": -12.389822006225586, "global_step": 306953, "epoch": 1827} {"train_loss": -12.303476333618164, "global_step": 306954, "epoch": 1827} {"train_loss": -12.22925090789795, "global_step": 306955, "epoch": 1827} {"train_loss": -12.367743492126465, "global_step": 306956, "epoch": 1827} {"train_loss": -12.071815490722656, "global_step": 306957, "epoch": 1827} {"train_loss": -12.41850471496582, "global_step": 306958, "epoch": 1827} {"train_loss": -12.552763938903809, "global_step": 306959, "epoch": 1827} {"train_loss": -12.299559593200684, "global_step": 306960, "epoch": 1827} {"train_loss": -12.323251724243164, "global_step": 306961, "epoch": 1827} {"train_loss": -12.437070846557617, "global_step": 306962, "epoch": 1827} {"train_loss": -12.332979202270508, "global_step": 306963, "epoch": 1827} {"train_loss": -12.392183303833008, "global_step": 306964, "epoch": 1827} {"train_loss": -12.362749099731445, "global_step": 306965, "epoch": 1827} {"train_loss": -12.377846717834473, "global_step": 306966, "epoch": 1827} {"train_loss": -12.194129943847656, "global_step": 306967, "epoch": 1827} {"train_loss": -12.52271556854248, "global_step": 306968, "epoch": 1827} {"train_loss": -12.350255966186523, "global_step": 306969, "epoch": 1827} {"train_loss": -12.15719985961914, "global_step": 306970, "epoch": 1827} {"train_loss": -12.428390502929688, "global_step": 306971, "epoch": 1827} {"train_loss": -12.64846134185791, "global_step": 306972, "epoch": 1827} {"train_loss": -12.308002471923828, "global_step": 306973, "epoch": 1827} {"train_loss": -12.468635559082031, "global_step": 306974, "epoch": 1827} {"train_loss": -12.263273239135742, "global_step": 306975, "epoch": 1827} {"train_loss": -12.566640853881836, "global_step": 306976, "epoch": 1827} {"train_loss": -12.366035461425781, "global_step": 306977, "epoch": 1827} {"train_loss": -12.573893547058105, "global_step": 306978, "epoch": 1827} {"train_loss": -12.009259223937988, "global_step": 306979, "epoch": 1827} {"train_loss": -12.376471519470215, "global_step": 306980, "epoch": 1827} {"train_loss": -12.303431510925293, "global_step": 306981, "epoch": 1827} {"train_loss": -12.296205520629883, "global_step": 306982, "epoch": 1827} {"train_loss": -12.390928268432617, "global_step": 306983, "epoch": 1827} {"train_loss": -12.645912170410156, "global_step": 306984, "epoch": 1827} {"train_loss": -12.682828903198242, "global_step": 306985, "epoch": 1827} {"train_loss": -12.585098266601562, "global_step": 306986, "epoch": 1827} {"train_loss": -12.355589866638184, "global_step": 306987, "epoch": 1827} {"train_loss": -12.500996589660645, "global_step": 306988, "epoch": 1827} {"train_loss": -12.40442943572998, "global_step": 306989, "epoch": 1827} {"train_loss": -11.829626083374023, "global_step": 306990, "epoch": 1827} {"train_loss": -11.387285232543945, "global_step": 306991, "epoch": 1827} {"train_loss": -11.628546714782715, "global_step": 306992, "epoch": 1827} {"train_loss": -11.948472023010254, "global_step": 306993, "epoch": 1827} {"train_loss": -11.899343490600586, "global_step": 306994, "epoch": 1827} {"train_loss": -11.93362808227539, "global_step": 306995, "epoch": 1827} {"train_loss": -12.402066230773926, "global_step": 306996, "epoch": 1827} {"train_loss": -11.463485717773438, "global_step": 306997, "epoch": 1827} {"train_loss": -11.884347915649414, "global_step": 306998, "epoch": 1827} {"train_loss": -11.701659202575684, "global_step": 306999, "epoch": 1827} {"train_loss": -10.537680625915527, "global_step": 307000, "epoch": 1827} {"train_loss": -10.479874610900879, "global_step": 307001, "epoch": 1827} {"train_loss": -11.59095573425293, "global_step": 307002, "epoch": 1827} {"train_loss": -9.791723251342773, "global_step": 307003, "epoch": 1827} {"train_loss": -10.405332565307617, "global_step": 307004, "epoch": 1827} {"train_loss": -11.861089706420898, "global_step": 307005, "epoch": 1827} {"train_loss": -10.314840316772461, "global_step": 307006, "epoch": 1827} {"train_loss": -11.564218521118164, "global_step": 307007, "epoch": 1827} {"train_loss": -10.377412796020508, "global_step": 307008, "epoch": 1827} {"train_loss": -11.838568687438965, "global_step": 307009, "epoch": 1827} {"train_loss": -10.4609375, "global_step": 307010, "epoch": 1827} {"train_loss": -12.264391899108887, "global_step": 307011, "epoch": 1827} {"train_loss": -11.381880760192871, "global_step": 307012, "epoch": 1827} {"train_loss": -12.012500762939453, "global_step": 307013, "epoch": 1827} {"train_loss": -11.469283103942871, "global_step": 307014, "epoch": 1827} {"train_loss": -11.770499229431152, "global_step": 307015, "epoch": 1827} {"train_loss": -10.387372970581055, "global_step": 307016, "epoch": 1827} {"train_loss": -11.236089706420898, "global_step": 307017, "epoch": 1827} {"train_loss": -10.864676475524902, "global_step": 307018, "epoch": 1827} {"train_loss": -11.705158233642578, "global_step": 307019, "epoch": 1827} {"train_loss": -11.623348236083984, "global_step": 307020, "epoch": 1827} {"train_loss": -11.353157043457031, "global_step": 307021, "epoch": 1827} {"train_loss": -11.45042610168457, "global_step": 307022, "epoch": 1827} {"train_loss": -11.789384841918945, "global_step": 307023, "epoch": 1827} {"train_loss": -11.915180206298828, "global_step": 307024, "epoch": 1827} {"train_loss": -11.412745475769043, "global_step": 307025, "epoch": 1827} {"train_loss": -11.770478248596191, "global_step": 307026, "epoch": 1827} {"train_loss": -11.751699447631836, "global_step": 307027, "epoch": 1827} {"train_loss": -11.914209365844727, "global_step": 307028, "epoch": 1827} {"train_loss": -11.646729469299316, "global_step": 307029, "epoch": 1827} {"train_loss": -11.498239517211914, "global_step": 307030, "epoch": 1827} {"train_loss": -11.792912483215332, "global_step": 307031, "epoch": 1827} {"train_loss": -11.532861709594727, "global_step": 307032, "epoch": 1827} {"train_loss": -11.51058578491211, "global_step": 307033, "epoch": 1827} {"train_loss": -11.547348976135254, "global_step": 307034, "epoch": 1827} {"train_loss": -11.301531791687012, "global_step": 307035, "epoch": 1827} {"train_loss": -12.0880126953125, "global_step": 307036, "epoch": 1827} {"train_loss": -11.467615127563477, "global_step": 307037, "epoch": 1827} {"train_loss": -11.917652130126953, "global_step": 307038, "epoch": 1827} {"train_loss": -11.929033279418945, "global_step": 307039, "epoch": 1827} {"train_loss": -11.556400299072266, "global_step": 307040, "epoch": 1827} {"train_loss": -12.182186126708984, "global_step": 307041, "epoch": 1827} {"train_loss": -11.846088409423828, "global_step": 307042, "epoch": 1827} {"train_loss": -11.492959976196289, "global_step": 307043, "epoch": 1827} {"train_loss": -12.238462448120117, "global_step": 307044, "epoch": 1827} {"train_loss": -11.204431533813477, "global_step": 307045, "epoch": 1827} {"train_loss": -12.370512008666992, "global_step": 307046, "epoch": 1827} {"train_loss": -11.592329978942871, "global_step": 307047, "epoch": 1827} {"train_loss": -11.85955810546875, "global_step": 307048, "epoch": 1827} {"train_loss": -11.93255615234375, "global_step": 307049, "epoch": 1827} {"train_loss": -11.62527084350586, "global_step": 307050, "epoch": 1827} {"train_loss": -12.084151268005371, "global_step": 307051, "epoch": 1827} {"train_loss": -11.655929565429688, "global_step": 307052, "epoch": 1827} {"train_loss": -12.090828895568848, "global_step": 307053, "epoch": 1827} {"train_loss": -11.900324821472168, "global_step": 307054, "epoch": 1827} {"train_loss": -11.879194259643555, "global_step": 307055, "epoch": 1827} {"train_loss": -11.849067687988281, "global_step": 307056, "epoch": 1827} {"train_loss": -11.19198989868164, "global_step": 307057, "epoch": 1827} {"train_loss": -10.988912582397461, "global_step": 307058, "epoch": 1827} {"train_loss": -11.599615097045898, "global_step": 307059, "epoch": 1827} {"train_loss": -11.30224323272705, "global_step": 307060, "epoch": 1827} {"train_loss": -10.848505020141602, "global_step": 307061, "epoch": 1827} {"train_loss": -12.210700988769531, "global_step": 307062, "epoch": 1827} {"train_loss": -11.02846908569336, "global_step": 307063, "epoch": 1827} {"train_loss": -10.799467086791992, "global_step": 307064, "epoch": 1827} {"train_loss": -11.773118019104004, "global_step": 307065, "epoch": 1827} {"train_loss": -10.529535293579102, "global_step": 307066, "epoch": 1827} {"train_loss": -12.105911254882812, "global_step": 307067, "epoch": 1827} {"train_loss": -10.71045207977295, "global_step": 307068, "epoch": 1827} {"train_loss": -11.452495574951172, "global_step": 307069, "epoch": 1827} {"train_loss": -10.624785423278809, "global_step": 307070, "epoch": 1827} {"train_loss": -10.263720512390137, "global_step": 307071, "epoch": 1827} {"train_loss": -10.396484375, "global_step": 307072, "epoch": 1827} {"train_loss": -11.263809204101562, "global_step": 307073, "epoch": 1827} {"train_loss": -9.519749641418457, "global_step": 307074, "epoch": 1827} {"train_loss": -11.668012619018555, "global_step": 307075, "epoch": 1827} {"train_loss": -10.680923461914062, "global_step": 307076, "epoch": 1827} {"train_loss": -10.726466178894043, "global_step": 307077, "epoch": 1827} {"train_loss": -11.556406021118164, "global_step": 307078, "epoch": 1827} {"train_loss": -9.678338050842285, "global_step": 307079, "epoch": 1827} {"train_loss": -11.368497848510742, "global_step": 307080, "epoch": 1827} {"train_loss": -10.376764297485352, "global_step": 307081, "epoch": 1827} {"train_loss": -11.080178260803223, "global_step": 307082, "epoch": 1827} {"train_loss": -11.031554222106934, "global_step": 307083, "epoch": 1827} {"train_loss": -11.43979263305664, "global_step": 307084, "epoch": 1827} {"train_loss": -11.671894073486328, "global_step": 307085, "epoch": 1827} {"train_loss": -11.696846008300781, "global_step": 307086, "epoch": 1827} {"train_loss": -11.508600234985352, "global_step": 307087, "epoch": 1827} {"train_loss": -11.5114107131958, "global_step": 307088, "epoch": 1827} {"train_loss": -11.69675350189209, "global_step": 307089, "epoch": 1827} {"train_loss": -11.482198715209961, "global_step": 307090, "epoch": 1827} {"train_loss": -11.535257339477539, "global_step": 307091, "epoch": 1827} {"train_loss": -11.9157133102417, "global_step": 307092, "epoch": 1827} {"train_loss": -11.679766654968262, "global_step": 307093, "epoch": 1827} {"train_loss": -11.814910888671875, "global_step": 307094, "epoch": 1827} {"train_loss": -12.054101943969727, "global_step": 307095, "epoch": 1827} {"train_loss": -11.752616882324219, "global_step": 307096, "epoch": 1827} {"train_loss": -12.059664726257324, "global_step": 307097, "epoch": 1827} {"train_loss": -11.819128036499023, "global_step": 307098, "epoch": 1827} {"train_loss": -11.996709823608398, "global_step": 307099, "epoch": 1827} {"train_loss": -11.88366985321045, "global_step": 307100, "epoch": 1827} {"train_loss": -12.050668716430664, "global_step": 307101, "epoch": 1827} {"train_loss": -11.912193298339844, "global_step": 307102, "epoch": 1827} {"train_loss": -11.744457562764486, "global_step": 307103, "epoch": 1827, "val_loss": 279978.625} {"train_loss": -12.100379943847656, "global_step": 307104, "epoch": 1828} {"train_loss": -11.813730239868164, "global_step": 307105, "epoch": 1828} {"train_loss": -11.950438499450684, "global_step": 307106, "epoch": 1828} {"train_loss": -12.123294830322266, "global_step": 307107, "epoch": 1828} {"train_loss": -12.006025314331055, "global_step": 307108, "epoch": 1828} {"train_loss": -11.83552074432373, "global_step": 307109, "epoch": 1828} {"train_loss": -12.127466201782227, "global_step": 307110, "epoch": 1828} {"train_loss": -12.07625675201416, "global_step": 307111, "epoch": 1828} {"train_loss": -12.012741088867188, "global_step": 307112, "epoch": 1828} {"train_loss": -12.21175765991211, "global_step": 307113, "epoch": 1828} {"train_loss": -12.00086784362793, "global_step": 307114, "epoch": 1828} {"train_loss": -12.202486038208008, "global_step": 307115, "epoch": 1828} {"train_loss": -12.227148056030273, "global_step": 307116, "epoch": 1828} {"train_loss": -12.025850296020508, "global_step": 307117, "epoch": 1828} {"train_loss": -12.236642837524414, "global_step": 307118, "epoch": 1828} {"train_loss": -12.068351745605469, "global_step": 307119, "epoch": 1828} {"train_loss": -12.07785415649414, "global_step": 307120, "epoch": 1828} {"train_loss": -12.149474143981934, "global_step": 307121, "epoch": 1828} {"train_loss": -12.076408386230469, "global_step": 307122, "epoch": 1828} {"train_loss": -12.157721519470215, "global_step": 307123, "epoch": 1828} {"train_loss": -12.064906120300293, "global_step": 307124, "epoch": 1828} {"train_loss": -12.09880542755127, "global_step": 307125, "epoch": 1828} {"train_loss": -12.13813591003418, "global_step": 307126, "epoch": 1828} {"train_loss": -12.160528182983398, "global_step": 307127, "epoch": 1828} {"train_loss": -12.039777755737305, "global_step": 307128, "epoch": 1828} {"train_loss": -12.199907302856445, "global_step": 307129, "epoch": 1828} {"train_loss": -12.159492492675781, "global_step": 307130, "epoch": 1828} {"train_loss": -12.132990837097168, "global_step": 307131, "epoch": 1828} {"train_loss": -12.263550758361816, "global_step": 307132, "epoch": 1828} {"train_loss": -11.799098014831543, "global_step": 307133, "epoch": 1828} {"train_loss": -11.620485305786133, "global_step": 307134, "epoch": 1828} {"train_loss": -12.247108459472656, "global_step": 307135, "epoch": 1828} {"train_loss": -11.619656562805176, "global_step": 307136, "epoch": 1828} {"train_loss": -12.205358505249023, "global_step": 307137, "epoch": 1828} {"train_loss": -12.00326919555664, "global_step": 307138, "epoch": 1828} {"train_loss": -11.704111099243164, "global_step": 307139, "epoch": 1828} {"train_loss": -12.200718879699707, "global_step": 307140, "epoch": 1828} {"train_loss": -11.822461128234863, "global_step": 307141, "epoch": 1828} {"train_loss": -12.154167175292969, "global_step": 307142, "epoch": 1828} {"train_loss": -12.083452224731445, "global_step": 307143, "epoch": 1828} {"train_loss": -11.449527740478516, "global_step": 307144, "epoch": 1828} {"train_loss": -12.143871307373047, "global_step": 307145, "epoch": 1828} {"train_loss": -12.048818588256836, "global_step": 307146, "epoch": 1828} {"train_loss": -12.093221664428711, "global_step": 307147, "epoch": 1828} {"train_loss": -11.951446533203125, "global_step": 307148, "epoch": 1828} {"train_loss": -11.166315078735352, "global_step": 307149, "epoch": 1828} {"train_loss": -11.326252937316895, "global_step": 307150, "epoch": 1828} {"train_loss": -12.052404403686523, "global_step": 307151, "epoch": 1828} {"train_loss": -10.18023681640625, "global_step": 307152, "epoch": 1828} {"train_loss": -11.047113418579102, "global_step": 307153, "epoch": 1828} {"train_loss": -10.788385391235352, "global_step": 307154, "epoch": 1828} {"train_loss": -11.995826721191406, "global_step": 307155, "epoch": 1828} {"train_loss": -11.335367202758789, "global_step": 307156, "epoch": 1828} {"train_loss": -12.056243896484375, "global_step": 307157, "epoch": 1828} {"train_loss": -11.866615295410156, "global_step": 307158, "epoch": 1828} {"train_loss": -11.368353843688965, "global_step": 307159, "epoch": 1828} {"train_loss": -11.642011642456055, "global_step": 307160, "epoch": 1828} {"train_loss": -11.29574203491211, "global_step": 307161, "epoch": 1828} {"train_loss": -11.826899528503418, "global_step": 307162, "epoch": 1828} {"train_loss": -12.01119613647461, "global_step": 307163, "epoch": 1828} {"train_loss": -12.191474914550781, "global_step": 307164, "epoch": 1828} {"train_loss": -11.19863510131836, "global_step": 307165, "epoch": 1828} {"train_loss": -12.043547630310059, "global_step": 307166, "epoch": 1828} {"train_loss": -11.536781311035156, "global_step": 307167, "epoch": 1828} {"train_loss": -12.138571739196777, "global_step": 307168, "epoch": 1828} {"train_loss": -11.930034637451172, "global_step": 307169, "epoch": 1828} {"train_loss": -12.18082046508789, "global_step": 307170, "epoch": 1828} {"train_loss": -11.39126968383789, "global_step": 307171, "epoch": 1828} {"train_loss": -12.291786193847656, "global_step": 307172, "epoch": 1828} {"train_loss": -11.832199096679688, "global_step": 307173, "epoch": 1828} {"train_loss": -12.07158088684082, "global_step": 307174, "epoch": 1828} {"train_loss": -11.732203483581543, "global_step": 307175, "epoch": 1828} {"train_loss": -12.221305847167969, "global_step": 307176, "epoch": 1828} {"train_loss": -12.07900619506836, "global_step": 307177, "epoch": 1828} {"train_loss": -12.04183578491211, "global_step": 307178, "epoch": 1828} {"train_loss": -12.462425231933594, "global_step": 307179, "epoch": 1828} {"train_loss": -12.084424018859863, "global_step": 307180, "epoch": 1828} {"train_loss": -11.967338562011719, "global_step": 307181, "epoch": 1828} {"train_loss": -12.303801536560059, "global_step": 307182, "epoch": 1828} {"train_loss": -12.271010398864746, "global_step": 307183, "epoch": 1828} {"train_loss": -12.446706771850586, "global_step": 307184, "epoch": 1828} {"train_loss": -12.20937442779541, "global_step": 307185, "epoch": 1828} {"train_loss": -12.261222839355469, "global_step": 307186, "epoch": 1828} {"train_loss": -12.430810928344727, "global_step": 307187, "epoch": 1828} {"train_loss": -12.345645904541016, "global_step": 307188, "epoch": 1828} {"train_loss": -12.142282485961914, "global_step": 307189, "epoch": 1828} {"train_loss": -12.361555099487305, "global_step": 307190, "epoch": 1828} {"train_loss": -12.262117385864258, "global_step": 307191, "epoch": 1828} {"train_loss": -12.053584098815918, "global_step": 307192, "epoch": 1828} {"train_loss": -12.053818702697754, "global_step": 307193, "epoch": 1828} {"train_loss": -12.342828750610352, "global_step": 307194, "epoch": 1828} {"train_loss": -11.802382469177246, "global_step": 307195, "epoch": 1828} {"train_loss": -12.142526626586914, "global_step": 307196, "epoch": 1828} {"train_loss": -12.371187210083008, "global_step": 307197, "epoch": 1828} {"train_loss": -12.279489517211914, "global_step": 307198, "epoch": 1828} {"train_loss": -12.281621932983398, "global_step": 307199, "epoch": 1828} {"train_loss": -12.423225402832031, "global_step": 307200, "epoch": 1828} {"train_loss": -12.34404182434082, "global_step": 307201, "epoch": 1828} {"train_loss": -12.308183670043945, "global_step": 307202, "epoch": 1828} {"train_loss": -12.483802795410156, "global_step": 307203, "epoch": 1828} {"train_loss": -12.19331169128418, "global_step": 307204, "epoch": 1828} {"train_loss": -12.191564559936523, "global_step": 307205, "epoch": 1828} {"train_loss": -12.476897239685059, "global_step": 307206, "epoch": 1828} {"train_loss": -11.942909240722656, "global_step": 307207, "epoch": 1828} {"train_loss": -12.097925186157227, "global_step": 307208, "epoch": 1828} {"train_loss": -11.79047966003418, "global_step": 307209, "epoch": 1828} {"train_loss": -11.907472610473633, "global_step": 307210, "epoch": 1828} {"train_loss": -12.143732070922852, "global_step": 307211, "epoch": 1828} {"train_loss": -11.979368209838867, "global_step": 307212, "epoch": 1828} {"train_loss": -11.91738510131836, "global_step": 307213, "epoch": 1828} {"train_loss": -11.879232406616211, "global_step": 307214, "epoch": 1828} {"train_loss": -12.266481399536133, "global_step": 307215, "epoch": 1828} {"train_loss": -12.332452774047852, "global_step": 307216, "epoch": 1828} {"train_loss": -12.234060287475586, "global_step": 307217, "epoch": 1828} {"train_loss": -12.439227104187012, "global_step": 307218, "epoch": 1828} {"train_loss": -12.43568229675293, "global_step": 307219, "epoch": 1828} {"train_loss": -12.510324478149414, "global_step": 307220, "epoch": 1828} {"train_loss": -12.408010482788086, "global_step": 307221, "epoch": 1828} {"train_loss": -12.344156265258789, "global_step": 307222, "epoch": 1828} {"train_loss": -12.475364685058594, "global_step": 307223, "epoch": 1828} {"train_loss": -12.280807495117188, "global_step": 307224, "epoch": 1828} {"train_loss": -12.138660430908203, "global_step": 307225, "epoch": 1828} {"train_loss": -12.275259017944336, "global_step": 307226, "epoch": 1828} {"train_loss": -12.211771965026855, "global_step": 307227, "epoch": 1828} {"train_loss": -11.55053424835205, "global_step": 307228, "epoch": 1828} {"train_loss": -11.805731773376465, "global_step": 307229, "epoch": 1828} {"train_loss": -12.374741554260254, "global_step": 307230, "epoch": 1828} {"train_loss": -12.110502243041992, "global_step": 307231, "epoch": 1828} {"train_loss": -11.378060340881348, "global_step": 307232, "epoch": 1828} {"train_loss": -11.895120620727539, "global_step": 307233, "epoch": 1828} {"train_loss": -12.19249439239502, "global_step": 307234, "epoch": 1828} {"train_loss": -12.128129959106445, "global_step": 307235, "epoch": 1828} {"train_loss": -11.897721290588379, "global_step": 307236, "epoch": 1828} {"train_loss": -12.492830276489258, "global_step": 307237, "epoch": 1828} {"train_loss": -11.866554260253906, "global_step": 307238, "epoch": 1828} {"train_loss": -11.512993812561035, "global_step": 307239, "epoch": 1828} {"train_loss": -12.05203914642334, "global_step": 307240, "epoch": 1828} {"train_loss": -12.195646286010742, "global_step": 307241, "epoch": 1828} {"train_loss": -11.890355110168457, "global_step": 307242, "epoch": 1828} {"train_loss": -12.212629318237305, "global_step": 307243, "epoch": 1828} {"train_loss": -11.90798568725586, "global_step": 307244, "epoch": 1828} {"train_loss": -11.188440322875977, "global_step": 307245, "epoch": 1828} {"train_loss": -11.783538818359375, "global_step": 307246, "epoch": 1828} {"train_loss": -11.327322006225586, "global_step": 307247, "epoch": 1828} {"train_loss": -12.06698226928711, "global_step": 307248, "epoch": 1828} {"train_loss": -11.459941864013672, "global_step": 307249, "epoch": 1828} {"train_loss": -11.636306762695312, "global_step": 307250, "epoch": 1828} {"train_loss": -11.886199951171875, "global_step": 307251, "epoch": 1828} {"train_loss": -11.19773006439209, "global_step": 307252, "epoch": 1828} {"train_loss": -11.135300636291504, "global_step": 307253, "epoch": 1828} {"train_loss": -10.574028968811035, "global_step": 307254, "epoch": 1828} {"train_loss": -10.927153587341309, "global_step": 307255, "epoch": 1828} {"train_loss": -8.772987365722656, "global_step": 307256, "epoch": 1828} {"train_loss": -8.451095581054688, "global_step": 307257, "epoch": 1828} {"train_loss": -8.75121021270752, "global_step": 307258, "epoch": 1828} {"train_loss": -9.079028129577637, "global_step": 307259, "epoch": 1828} {"train_loss": -9.220613479614258, "global_step": 307260, "epoch": 1828} {"train_loss": -8.498177528381348, "global_step": 307261, "epoch": 1828} {"train_loss": -8.353870391845703, "global_step": 307262, "epoch": 1828} {"train_loss": -8.916388511657715, "global_step": 307263, "epoch": 1828} {"train_loss": -6.921905994415283, "global_step": 307264, "epoch": 1828} {"train_loss": -8.11758804321289, "global_step": 307265, "epoch": 1828} {"train_loss": -10.466075897216797, "global_step": 307266, "epoch": 1828} {"train_loss": -9.492240905761719, "global_step": 307267, "epoch": 1828} {"train_loss": -9.479257583618164, "global_step": 307268, "epoch": 1828} {"train_loss": -9.90852165222168, "global_step": 307269, "epoch": 1828} {"train_loss": -9.735708236694336, "global_step": 307270, "epoch": 1828} {"train_loss": -11.696795046329498, "global_step": 307271, "epoch": 1828, "val_loss": 279168.4375} {"train_loss": -10.742652893066406, "global_step": 307272, "epoch": 1829} {"train_loss": -10.45401382446289, "global_step": 307273, "epoch": 1829} {"train_loss": -10.475054740905762, "global_step": 307274, "epoch": 1829} {"train_loss": -11.043781280517578, "global_step": 307275, "epoch": 1829} {"train_loss": -10.892908096313477, "global_step": 307276, "epoch": 1829} {"train_loss": -11.033581733703613, "global_step": 307277, "epoch": 1829} {"train_loss": -11.553718566894531, "global_step": 307278, "epoch": 1829} {"train_loss": -10.09775161743164, "global_step": 307279, "epoch": 1829} {"train_loss": -11.43040657043457, "global_step": 307280, "epoch": 1829} {"train_loss": -10.551521301269531, "global_step": 307281, "epoch": 1829} {"train_loss": -11.824287414550781, "global_step": 307282, "epoch": 1829} {"train_loss": -10.926718711853027, "global_step": 307283, "epoch": 1829} {"train_loss": -10.959365844726562, "global_step": 307284, "epoch": 1829} {"train_loss": -11.093365669250488, "global_step": 307285, "epoch": 1829} {"train_loss": -11.463102340698242, "global_step": 307286, "epoch": 1829} {"train_loss": -10.691431045532227, "global_step": 307287, "epoch": 1829} {"train_loss": -11.369446754455566, "global_step": 307288, "epoch": 1829} {"train_loss": -10.562915802001953, "global_step": 307289, "epoch": 1829} {"train_loss": -11.453680038452148, "global_step": 307290, "epoch": 1829} {"train_loss": -10.872161865234375, "global_step": 307291, "epoch": 1829} {"train_loss": -11.176733016967773, "global_step": 307292, "epoch": 1829} {"train_loss": -11.238373756408691, "global_step": 307293, "epoch": 1829} {"train_loss": -11.47542667388916, "global_step": 307294, "epoch": 1829} {"train_loss": -11.319003105163574, "global_step": 307295, "epoch": 1829} {"train_loss": -11.207430839538574, "global_step": 307296, "epoch": 1829} {"train_loss": -11.599222183227539, "global_step": 307297, "epoch": 1829} {"train_loss": -11.361867904663086, "global_step": 307298, "epoch": 1829} {"train_loss": -11.817657470703125, "global_step": 307299, "epoch": 1829} {"train_loss": -11.349145889282227, "global_step": 307300, "epoch": 1829} {"train_loss": -11.812578201293945, "global_step": 307301, "epoch": 1829} {"train_loss": -11.502473831176758, "global_step": 307302, "epoch": 1829} {"train_loss": -11.820773124694824, "global_step": 307303, "epoch": 1829} {"train_loss": -11.573726654052734, "global_step": 307304, "epoch": 1829} {"train_loss": -11.943544387817383, "global_step": 307305, "epoch": 1829} {"train_loss": -11.582396507263184, "global_step": 307306, "epoch": 1829} {"train_loss": -11.770956039428711, "global_step": 307307, "epoch": 1829} {"train_loss": -11.529667854309082, "global_step": 307308, "epoch": 1829} {"train_loss": -11.843771934509277, "global_step": 307309, "epoch": 1829} {"train_loss": -11.330368041992188, "global_step": 307310, "epoch": 1829} {"train_loss": -11.889156341552734, "global_step": 307311, "epoch": 1829} {"train_loss": -11.474750518798828, "global_step": 307312, "epoch": 1829} {"train_loss": -11.949749946594238, "global_step": 307313, "epoch": 1829} {"train_loss": -11.521575927734375, "global_step": 307314, "epoch": 1829} {"train_loss": -11.529756546020508, "global_step": 307315, "epoch": 1829} {"train_loss": -11.936423301696777, "global_step": 307316, "epoch": 1829} {"train_loss": -11.581872940063477, "global_step": 307317, "epoch": 1829} {"train_loss": -11.583986282348633, "global_step": 307318, "epoch": 1829} {"train_loss": -11.781805038452148, "global_step": 307319, "epoch": 1829} {"train_loss": -11.646026611328125, "global_step": 307320, "epoch": 1829} {"train_loss": -11.335457801818848, "global_step": 307321, "epoch": 1829} {"train_loss": -11.720806121826172, "global_step": 307322, "epoch": 1829} {"train_loss": -11.488723754882812, "global_step": 307323, "epoch": 1829} {"train_loss": -11.681341171264648, "global_step": 307324, "epoch": 1829} {"train_loss": -11.460997581481934, "global_step": 307325, "epoch": 1829} {"train_loss": -11.980504035949707, "global_step": 307326, "epoch": 1829} {"train_loss": -11.828405380249023, "global_step": 307327, "epoch": 1829} {"train_loss": -12.017613410949707, "global_step": 307328, "epoch": 1829} {"train_loss": -11.73228645324707, "global_step": 307329, "epoch": 1829} {"train_loss": -11.607821464538574, "global_step": 307330, "epoch": 1829} {"train_loss": -11.813837051391602, "global_step": 307331, "epoch": 1829} {"train_loss": -12.065187454223633, "global_step": 307332, "epoch": 1829} {"train_loss": -11.457033157348633, "global_step": 307333, "epoch": 1829} {"train_loss": -12.242476463317871, "global_step": 307334, "epoch": 1829} {"train_loss": -11.467293739318848, "global_step": 307335, "epoch": 1829} {"train_loss": -12.116393089294434, "global_step": 307336, "epoch": 1829} {"train_loss": -11.998302459716797, "global_step": 307337, "epoch": 1829} {"train_loss": -11.914514541625977, "global_step": 307338, "epoch": 1829} {"train_loss": -12.020153045654297, "global_step": 307339, "epoch": 1829} {"train_loss": -12.02351188659668, "global_step": 307340, "epoch": 1829} {"train_loss": -11.83993148803711, "global_step": 307341, "epoch": 1829} {"train_loss": -12.252510070800781, "global_step": 307342, "epoch": 1829} {"train_loss": -11.730165481567383, "global_step": 307343, "epoch": 1829} {"train_loss": -12.233163833618164, "global_step": 307344, "epoch": 1829} {"train_loss": -11.873987197875977, "global_step": 307345, "epoch": 1829} {"train_loss": -12.072698593139648, "global_step": 307346, "epoch": 1829} {"train_loss": -12.014969825744629, "global_step": 307347, "epoch": 1829} {"train_loss": -11.7219820022583, "global_step": 307348, "epoch": 1829} {"train_loss": -12.183703422546387, "global_step": 307349, "epoch": 1829} {"train_loss": -11.863990783691406, "global_step": 307350, "epoch": 1829} {"train_loss": -12.085939407348633, "global_step": 307351, "epoch": 1829} {"train_loss": -11.852741241455078, "global_step": 307352, "epoch": 1829} {"train_loss": -11.708508491516113, "global_step": 307353, "epoch": 1829} {"train_loss": -12.294780731201172, "global_step": 307354, "epoch": 1829} {"train_loss": -11.9943265914917, "global_step": 307355, "epoch": 1829} {"train_loss": -12.212657928466797, "global_step": 307356, "epoch": 1829} {"train_loss": -12.159406661987305, "global_step": 307357, "epoch": 1829} {"train_loss": -12.348946571350098, "global_step": 307358, "epoch": 1829} {"train_loss": -12.292068481445312, "global_step": 307359, "epoch": 1829} {"train_loss": -12.18902587890625, "global_step": 307360, "epoch": 1829} {"train_loss": -12.280633926391602, "global_step": 307361, "epoch": 1829} {"train_loss": -12.340544700622559, "global_step": 307362, "epoch": 1829} {"train_loss": -12.254722595214844, "global_step": 307363, "epoch": 1829} {"train_loss": -12.184869766235352, "global_step": 307364, "epoch": 1829} {"train_loss": -12.472322463989258, "global_step": 307365, "epoch": 1829} {"train_loss": -12.002693176269531, "global_step": 307366, "epoch": 1829} {"train_loss": -12.396220207214355, "global_step": 307367, "epoch": 1829} {"train_loss": -12.34536361694336, "global_step": 307368, "epoch": 1829} {"train_loss": -12.242208480834961, "global_step": 307369, "epoch": 1829} {"train_loss": -12.42602825164795, "global_step": 307370, "epoch": 1829} {"train_loss": -12.270757675170898, "global_step": 307371, "epoch": 1829} {"train_loss": -12.22856330871582, "global_step": 307372, "epoch": 1829} {"train_loss": -12.310663223266602, "global_step": 307373, "epoch": 1829} {"train_loss": -12.273405075073242, "global_step": 307374, "epoch": 1829} {"train_loss": -12.260498046875, "global_step": 307375, "epoch": 1829} {"train_loss": -12.396089553833008, "global_step": 307376, "epoch": 1829} {"train_loss": -12.455182075500488, "global_step": 307377, "epoch": 1829} {"train_loss": -12.232035636901855, "global_step": 307378, "epoch": 1829} {"train_loss": -11.912155151367188, "global_step": 307379, "epoch": 1829} {"train_loss": -12.158773422241211, "global_step": 307380, "epoch": 1829} {"train_loss": -12.142191886901855, "global_step": 307381, "epoch": 1829} {"train_loss": -11.840290069580078, "global_step": 307382, "epoch": 1829} {"train_loss": -12.387723922729492, "global_step": 307383, "epoch": 1829} {"train_loss": -11.989086151123047, "global_step": 307384, "epoch": 1829} {"train_loss": -12.598918914794922, "global_step": 307385, "epoch": 1829} {"train_loss": -11.791496276855469, "global_step": 307386, "epoch": 1829} {"train_loss": -11.976036071777344, "global_step": 307387, "epoch": 1829} {"train_loss": -12.036224365234375, "global_step": 307388, "epoch": 1829} {"train_loss": -11.652606964111328, "global_step": 307389, "epoch": 1829} {"train_loss": -12.036173820495605, "global_step": 307390, "epoch": 1829} {"train_loss": -12.17359447479248, "global_step": 307391, "epoch": 1829} {"train_loss": -11.71462631225586, "global_step": 307392, "epoch": 1829} {"train_loss": -12.684814453125, "global_step": 307393, "epoch": 1829} {"train_loss": -11.952278137207031, "global_step": 307394, "epoch": 1829} {"train_loss": -12.368073463439941, "global_step": 307395, "epoch": 1829} {"train_loss": -12.474077224731445, "global_step": 307396, "epoch": 1829} {"train_loss": -11.833955764770508, "global_step": 307397, "epoch": 1829} {"train_loss": -12.211977005004883, "global_step": 307398, "epoch": 1829} {"train_loss": -11.86916446685791, "global_step": 307399, "epoch": 1829} {"train_loss": -12.202922821044922, "global_step": 307400, "epoch": 1829} {"train_loss": -11.901054382324219, "global_step": 307401, "epoch": 1829} {"train_loss": -11.656006813049316, "global_step": 307402, "epoch": 1829} {"train_loss": -12.150217056274414, "global_step": 307403, "epoch": 1829} {"train_loss": -11.766243934631348, "global_step": 307404, "epoch": 1829} {"train_loss": -11.498716354370117, "global_step": 307405, "epoch": 1829} {"train_loss": -12.20622730255127, "global_step": 307406, "epoch": 1829} {"train_loss": -12.198305130004883, "global_step": 307407, "epoch": 1829} {"train_loss": -12.192403793334961, "global_step": 307408, "epoch": 1829} {"train_loss": -12.221599578857422, "global_step": 307409, "epoch": 1829} {"train_loss": -12.271818161010742, "global_step": 307410, "epoch": 1829} {"train_loss": -12.239856719970703, "global_step": 307411, "epoch": 1829} {"train_loss": -12.312347412109375, "global_step": 307412, "epoch": 1829} {"train_loss": -12.24868392944336, "global_step": 307413, "epoch": 1829} {"train_loss": -12.165743827819824, "global_step": 307414, "epoch": 1829} {"train_loss": -11.735885620117188, "global_step": 307415, "epoch": 1829} {"train_loss": -12.039570808410645, "global_step": 307416, "epoch": 1829} {"train_loss": -12.163959503173828, "global_step": 307417, "epoch": 1829} {"train_loss": -12.064979553222656, "global_step": 307418, "epoch": 1829} {"train_loss": -11.64112377166748, "global_step": 307419, "epoch": 1829} {"train_loss": -12.309078216552734, "global_step": 307420, "epoch": 1829} {"train_loss": -11.57249641418457, "global_step": 307421, "epoch": 1829} {"train_loss": -12.062522888183594, "global_step": 307422, "epoch": 1829} {"train_loss": -11.962539672851562, "global_step": 307423, "epoch": 1829} {"train_loss": -12.421910285949707, "global_step": 307424, "epoch": 1829} {"train_loss": -11.812479019165039, "global_step": 307425, "epoch": 1829} {"train_loss": -12.065835952758789, "global_step": 307426, "epoch": 1829} {"train_loss": -11.885025024414062, "global_step": 307427, "epoch": 1829} {"train_loss": -11.982358932495117, "global_step": 307428, "epoch": 1829} {"train_loss": -11.89045524597168, "global_step": 307429, "epoch": 1829} {"train_loss": -12.142936706542969, "global_step": 307430, "epoch": 1829} {"train_loss": -10.992945671081543, "global_step": 307431, "epoch": 1829} {"train_loss": -11.648950576782227, "global_step": 307432, "epoch": 1829} {"train_loss": -11.894933700561523, "global_step": 307433, "epoch": 1829} {"train_loss": -11.19105339050293, "global_step": 307434, "epoch": 1829} {"train_loss": -10.709053993225098, "global_step": 307435, "epoch": 1829} {"train_loss": -12.012725830078125, "global_step": 307436, "epoch": 1829} {"train_loss": -10.125978469848633, "global_step": 307437, "epoch": 1829} {"train_loss": -10.366127014160156, "global_step": 307438, "epoch": 1829} {"train_loss": -11.78573100907462, "global_step": 307439, "epoch": 1829, "val_loss": 280780.59375} {"train_loss": -11.004874229431152, "global_step": 307440, "epoch": 1830} {"train_loss": -10.489747047424316, "global_step": 307441, "epoch": 1830} {"train_loss": -10.876859664916992, "global_step": 307442, "epoch": 1830} {"train_loss": -9.442465782165527, "global_step": 307443, "epoch": 1830} {"train_loss": -10.284648895263672, "global_step": 307444, "epoch": 1830} {"train_loss": -10.5359525680542, "global_step": 307445, "epoch": 1830} {"train_loss": -10.1886625289917, "global_step": 307446, "epoch": 1830} {"train_loss": -10.391924858093262, "global_step": 307447, "epoch": 1830} {"train_loss": -10.221982955932617, "global_step": 307448, "epoch": 1830} {"train_loss": -10.436421394348145, "global_step": 307449, "epoch": 1830} {"train_loss": -10.664531707763672, "global_step": 307450, "epoch": 1830} {"train_loss": -10.583781242370605, "global_step": 307451, "epoch": 1830} {"train_loss": -9.937870979309082, "global_step": 307452, "epoch": 1830} {"train_loss": -10.571443557739258, "global_step": 307453, "epoch": 1830} {"train_loss": -10.887426376342773, "global_step": 307454, "epoch": 1830} {"train_loss": -11.539363861083984, "global_step": 307455, "epoch": 1830} {"train_loss": -11.27852725982666, "global_step": 307456, "epoch": 1830} {"train_loss": -11.368680953979492, "global_step": 307457, "epoch": 1830} {"train_loss": -10.717567443847656, "global_step": 307458, "epoch": 1830} {"train_loss": -10.515180587768555, "global_step": 307459, "epoch": 1830} {"train_loss": -10.656940460205078, "global_step": 307460, "epoch": 1830} {"train_loss": -11.52585506439209, "global_step": 307461, "epoch": 1830} {"train_loss": -10.067741394042969, "global_step": 307462, "epoch": 1830} {"train_loss": -11.356616973876953, "global_step": 307463, "epoch": 1830} {"train_loss": -10.741600036621094, "global_step": 307464, "epoch": 1830} {"train_loss": -11.018486976623535, "global_step": 307465, "epoch": 1830} {"train_loss": -10.022619247436523, "global_step": 307466, "epoch": 1830} {"train_loss": -11.519540786743164, "global_step": 307467, "epoch": 1830} {"train_loss": -10.15071964263916, "global_step": 307468, "epoch": 1830} {"train_loss": -11.269026756286621, "global_step": 307469, "epoch": 1830} {"train_loss": -11.152996063232422, "global_step": 307470, "epoch": 1830} {"train_loss": -11.935280799865723, "global_step": 307471, "epoch": 1830} {"train_loss": -11.263948440551758, "global_step": 307472, "epoch": 1830} {"train_loss": -11.682574272155762, "global_step": 307473, "epoch": 1830} {"train_loss": -11.60958194732666, "global_step": 307474, "epoch": 1830} {"train_loss": -11.193300247192383, "global_step": 307475, "epoch": 1830} {"train_loss": -11.592205047607422, "global_step": 307476, "epoch": 1830} {"train_loss": -11.824531555175781, "global_step": 307477, "epoch": 1830} {"train_loss": -11.868040084838867, "global_step": 307478, "epoch": 1830} {"train_loss": -11.871429443359375, "global_step": 307479, "epoch": 1830} {"train_loss": -11.75450611114502, "global_step": 307480, "epoch": 1830} {"train_loss": -11.642192840576172, "global_step": 307481, "epoch": 1830} {"train_loss": -11.914240837097168, "global_step": 307482, "epoch": 1830} {"train_loss": -11.735428810119629, "global_step": 307483, "epoch": 1830} {"train_loss": -11.913729667663574, "global_step": 307484, "epoch": 1830} {"train_loss": -12.04825210571289, "global_step": 307485, "epoch": 1830} {"train_loss": -12.051666259765625, "global_step": 307486, "epoch": 1830} {"train_loss": -11.70987319946289, "global_step": 307487, "epoch": 1830} {"train_loss": -11.929106712341309, "global_step": 307488, "epoch": 1830} {"train_loss": -11.871379852294922, "global_step": 307489, "epoch": 1830} {"train_loss": -11.981569290161133, "global_step": 307490, "epoch": 1830} {"train_loss": -12.154644012451172, "global_step": 307491, "epoch": 1830} {"train_loss": -11.822616577148438, "global_step": 307492, "epoch": 1830} {"train_loss": -11.969944953918457, "global_step": 307493, "epoch": 1830} {"train_loss": -12.30194091796875, "global_step": 307494, "epoch": 1830} {"train_loss": -11.938043594360352, "global_step": 307495, "epoch": 1830} {"train_loss": -12.060646057128906, "global_step": 307496, "epoch": 1830} {"train_loss": -12.18316650390625, "global_step": 307497, "epoch": 1830} {"train_loss": -12.217636108398438, "global_step": 307498, "epoch": 1830} {"train_loss": -12.18825912475586, "global_step": 307499, "epoch": 1830} {"train_loss": -12.206327438354492, "global_step": 307500, "epoch": 1830} {"train_loss": -12.173208236694336, "global_step": 307501, "epoch": 1830} {"train_loss": -12.175179481506348, "global_step": 307502, "epoch": 1830} {"train_loss": -11.915457725524902, "global_step": 307503, "epoch": 1830} {"train_loss": -12.367799758911133, "global_step": 307504, "epoch": 1830} {"train_loss": -12.279861450195312, "global_step": 307505, "epoch": 1830} {"train_loss": -12.380533218383789, "global_step": 307506, "epoch": 1830} {"train_loss": -12.236804962158203, "global_step": 307507, "epoch": 1830} {"train_loss": -12.51033878326416, "global_step": 307508, "epoch": 1830} {"train_loss": -12.167655944824219, "global_step": 307509, "epoch": 1830} {"train_loss": -12.338882446289062, "global_step": 307510, "epoch": 1830} {"train_loss": -12.377969741821289, "global_step": 307511, "epoch": 1830} {"train_loss": -12.341114044189453, "global_step": 307512, "epoch": 1830} {"train_loss": -12.194507598876953, "global_step": 307513, "epoch": 1830} {"train_loss": -12.3869047164917, "global_step": 307514, "epoch": 1830} {"train_loss": -12.336524963378906, "global_step": 307515, "epoch": 1830} {"train_loss": -12.284912109375, "global_step": 307516, "epoch": 1830} {"train_loss": -12.379207611083984, "global_step": 307517, "epoch": 1830} {"train_loss": -12.372992515563965, "global_step": 307518, "epoch": 1830} {"train_loss": -12.39199161529541, "global_step": 307519, "epoch": 1830} {"train_loss": -12.316801071166992, "global_step": 307520, "epoch": 1830} {"train_loss": -12.186636924743652, "global_step": 307521, "epoch": 1830} {"train_loss": -12.225086212158203, "global_step": 307522, "epoch": 1830} {"train_loss": -12.069849967956543, "global_step": 307523, "epoch": 1830} {"train_loss": -12.187702178955078, "global_step": 307524, "epoch": 1830} {"train_loss": -12.158132553100586, "global_step": 307525, "epoch": 1830} {"train_loss": -12.133851051330566, "global_step": 307526, "epoch": 1830} {"train_loss": -12.472309112548828, "global_step": 307527, "epoch": 1830} {"train_loss": -12.182077407836914, "global_step": 307528, "epoch": 1830} {"train_loss": -12.221790313720703, "global_step": 307529, "epoch": 1830} {"train_loss": -12.310308456420898, "global_step": 307530, "epoch": 1830} {"train_loss": -12.254581451416016, "global_step": 307531, "epoch": 1830} {"train_loss": -11.869306564331055, "global_step": 307532, "epoch": 1830} {"train_loss": -12.237092971801758, "global_step": 307533, "epoch": 1830} {"train_loss": -12.155759811401367, "global_step": 307534, "epoch": 1830} {"train_loss": -12.538511276245117, "global_step": 307535, "epoch": 1830} {"train_loss": -12.373235702514648, "global_step": 307536, "epoch": 1830} {"train_loss": -12.184947967529297, "global_step": 307537, "epoch": 1830} {"train_loss": -12.07947063446045, "global_step": 307538, "epoch": 1830} {"train_loss": -12.123856544494629, "global_step": 307539, "epoch": 1830} {"train_loss": -11.592754364013672, "global_step": 307540, "epoch": 1830} {"train_loss": -12.008803367614746, "global_step": 307541, "epoch": 1830} {"train_loss": -12.255979537963867, "global_step": 307542, "epoch": 1830} {"train_loss": -12.253118515014648, "global_step": 307543, "epoch": 1830} {"train_loss": -11.641159057617188, "global_step": 307544, "epoch": 1830} {"train_loss": -12.347060203552246, "global_step": 307545, "epoch": 1830} {"train_loss": -11.84714412689209, "global_step": 307546, "epoch": 1830} {"train_loss": -12.342533111572266, "global_step": 307547, "epoch": 1830} {"train_loss": -11.69576644897461, "global_step": 307548, "epoch": 1830} {"train_loss": -12.302865982055664, "global_step": 307549, "epoch": 1830} {"train_loss": -12.079729080200195, "global_step": 307550, "epoch": 1830} {"train_loss": -11.901655197143555, "global_step": 307551, "epoch": 1830} {"train_loss": -11.957016944885254, "global_step": 307552, "epoch": 1830} {"train_loss": -11.836555480957031, "global_step": 307553, "epoch": 1830} {"train_loss": -11.317316055297852, "global_step": 307554, "epoch": 1830} {"train_loss": -10.238578796386719, "global_step": 307555, "epoch": 1830} {"train_loss": -12.117213249206543, "global_step": 307556, "epoch": 1830} {"train_loss": -10.803001403808594, "global_step": 307557, "epoch": 1830} {"train_loss": -11.25023365020752, "global_step": 307558, "epoch": 1830} {"train_loss": -10.793400764465332, "global_step": 307559, "epoch": 1830} {"train_loss": -9.812186241149902, "global_step": 307560, "epoch": 1830} {"train_loss": -11.254541397094727, "global_step": 307561, "epoch": 1830} {"train_loss": -11.087159156799316, "global_step": 307562, "epoch": 1830} {"train_loss": -9.909200668334961, "global_step": 307563, "epoch": 1830} {"train_loss": -11.278128623962402, "global_step": 307564, "epoch": 1830} {"train_loss": -8.214725494384766, "global_step": 307565, "epoch": 1830} {"train_loss": -8.894978523254395, "global_step": 307566, "epoch": 1830} {"train_loss": -10.161231994628906, "global_step": 307567, "epoch": 1830} {"train_loss": -8.55600357055664, "global_step": 307568, "epoch": 1830} {"train_loss": -9.777726173400879, "global_step": 307569, "epoch": 1830} {"train_loss": -8.331502914428711, "global_step": 307570, "epoch": 1830} {"train_loss": -9.81019401550293, "global_step": 307571, "epoch": 1830} {"train_loss": -9.256511688232422, "global_step": 307572, "epoch": 1830} {"train_loss": -7.747430324554443, "global_step": 307573, "epoch": 1830} {"train_loss": -10.320449829101562, "global_step": 307574, "epoch": 1830} {"train_loss": -9.791345596313477, "global_step": 307575, "epoch": 1830} {"train_loss": -8.837004661560059, "global_step": 307576, "epoch": 1830} {"train_loss": -9.53338623046875, "global_step": 307577, "epoch": 1830} {"train_loss": -10.981358528137207, "global_step": 307578, "epoch": 1830} {"train_loss": -9.768726348876953, "global_step": 307579, "epoch": 1830} {"train_loss": -10.40722942352295, "global_step": 307580, "epoch": 1830} {"train_loss": -10.858407974243164, "global_step": 307581, "epoch": 1830} {"train_loss": -9.299642562866211, "global_step": 307582, "epoch": 1830} {"train_loss": -10.020345687866211, "global_step": 307583, "epoch": 1830} {"train_loss": -11.059042930603027, "global_step": 307584, "epoch": 1830} {"train_loss": -10.882652282714844, "global_step": 307585, "epoch": 1830} {"train_loss": -11.208901405334473, "global_step": 307586, "epoch": 1830} {"train_loss": -10.508825302124023, "global_step": 307587, "epoch": 1830} {"train_loss": -10.701095581054688, "global_step": 307588, "epoch": 1830} {"train_loss": -11.148517608642578, "global_step": 307589, "epoch": 1830} {"train_loss": -11.279088973999023, "global_step": 307590, "epoch": 1830} {"train_loss": -10.957572937011719, "global_step": 307591, "epoch": 1830} {"train_loss": -11.530582427978516, "global_step": 307592, "epoch": 1830} {"train_loss": -11.596232414245605, "global_step": 307593, "epoch": 1830} {"train_loss": -11.34299087524414, "global_step": 307594, "epoch": 1830} {"train_loss": -11.386112213134766, "global_step": 307595, "epoch": 1830} {"train_loss": -11.463722229003906, "global_step": 307596, "epoch": 1830} {"train_loss": -11.236715316772461, "global_step": 307597, "epoch": 1830} {"train_loss": -11.594484329223633, "global_step": 307598, "epoch": 1830} {"train_loss": -11.019378662109375, "global_step": 307599, "epoch": 1830} {"train_loss": -11.19783878326416, "global_step": 307600, "epoch": 1830} {"train_loss": -11.08266830444336, "global_step": 307601, "epoch": 1830} {"train_loss": -11.382003784179688, "global_step": 307602, "epoch": 1830} {"train_loss": -11.77609634399414, "global_step": 307603, "epoch": 1830} {"train_loss": -11.2398099899292, "global_step": 307604, "epoch": 1830} {"train_loss": -11.345582008361816, "global_step": 307605, "epoch": 1830} {"train_loss": -11.584970474243164, "global_step": 307606, "epoch": 1830} {"train_loss": -11.335048820291247, "global_step": 307607, "epoch": 1830, "val_loss": 273310.71875, "train_action_mse_error": 5.208158493041992} {"train_loss": -11.652442932128906, "global_step": 307608, "epoch": 1831} {"train_loss": -11.878633499145508, "global_step": 307609, "epoch": 1831} {"train_loss": -11.76771354675293, "global_step": 307610, "epoch": 1831} {"train_loss": -11.578611373901367, "global_step": 307611, "epoch": 1831} {"train_loss": -11.785953521728516, "global_step": 307612, "epoch": 1831} {"train_loss": -11.784233093261719, "global_step": 307613, "epoch": 1831} {"train_loss": -11.559112548828125, "global_step": 307614, "epoch": 1831} {"train_loss": -11.834168434143066, "global_step": 307615, "epoch": 1831} {"train_loss": -11.719406127929688, "global_step": 307616, "epoch": 1831} {"train_loss": -11.695093154907227, "global_step": 307617, "epoch": 1831} {"train_loss": -11.508651733398438, "global_step": 307618, "epoch": 1831} {"train_loss": -11.576810836791992, "global_step": 307619, "epoch": 1831} {"train_loss": -11.912792205810547, "global_step": 307620, "epoch": 1831} {"train_loss": -11.726043701171875, "global_step": 307621, "epoch": 1831} {"train_loss": -11.733125686645508, "global_step": 307622, "epoch": 1831} {"train_loss": -11.945782661437988, "global_step": 307623, "epoch": 1831} {"train_loss": -11.901355743408203, "global_step": 307624, "epoch": 1831} {"train_loss": -11.936471939086914, "global_step": 307625, "epoch": 1831} {"train_loss": -11.73042106628418, "global_step": 307626, "epoch": 1831} {"train_loss": -12.032134056091309, "global_step": 307627, "epoch": 1831} {"train_loss": -11.796331405639648, "global_step": 307628, "epoch": 1831} {"train_loss": -11.934211730957031, "global_step": 307629, "epoch": 1831} {"train_loss": -11.835230827331543, "global_step": 307630, "epoch": 1831} {"train_loss": -12.15546989440918, "global_step": 307631, "epoch": 1831} {"train_loss": -12.038695335388184, "global_step": 307632, "epoch": 1831} {"train_loss": -12.153632164001465, "global_step": 307633, "epoch": 1831} {"train_loss": -12.10673713684082, "global_step": 307634, "epoch": 1831} {"train_loss": -12.026725769042969, "global_step": 307635, "epoch": 1831} {"train_loss": -11.884197235107422, "global_step": 307636, "epoch": 1831} {"train_loss": -12.23495864868164, "global_step": 307637, "epoch": 1831} {"train_loss": -12.329427719116211, "global_step": 307638, "epoch": 1831} {"train_loss": -12.081375122070312, "global_step": 307639, "epoch": 1831} {"train_loss": -12.187990188598633, "global_step": 307640, "epoch": 1831} {"train_loss": -12.10527229309082, "global_step": 307641, "epoch": 1831} {"train_loss": -12.248269081115723, "global_step": 307642, "epoch": 1831} {"train_loss": -12.063411712646484, "global_step": 307643, "epoch": 1831} {"train_loss": -12.127607345581055, "global_step": 307644, "epoch": 1831} {"train_loss": -12.183773040771484, "global_step": 307645, "epoch": 1831} {"train_loss": -12.446466445922852, "global_step": 307646, "epoch": 1831} {"train_loss": -12.162103652954102, "global_step": 307647, "epoch": 1831} {"train_loss": -12.192144393920898, "global_step": 307648, "epoch": 1831} {"train_loss": -12.281758308410645, "global_step": 307649, "epoch": 1831} {"train_loss": -12.18856143951416, "global_step": 307650, "epoch": 1831} {"train_loss": -12.261109352111816, "global_step": 307651, "epoch": 1831} {"train_loss": -12.327356338500977, "global_step": 307652, "epoch": 1831} {"train_loss": -12.068817138671875, "global_step": 307653, "epoch": 1831} {"train_loss": -12.280586242675781, "global_step": 307654, "epoch": 1831} {"train_loss": -12.177297592163086, "global_step": 307655, "epoch": 1831} {"train_loss": -12.231119155883789, "global_step": 307656, "epoch": 1831} {"train_loss": -12.10377311706543, "global_step": 307657, "epoch": 1831} {"train_loss": -12.015243530273438, "global_step": 307658, "epoch": 1831} {"train_loss": -12.21216869354248, "global_step": 307659, "epoch": 1831} {"train_loss": -12.485597610473633, "global_step": 307660, "epoch": 1831} {"train_loss": -12.148043632507324, "global_step": 307661, "epoch": 1831} {"train_loss": -12.261272430419922, "global_step": 307662, "epoch": 1831} {"train_loss": -12.167074203491211, "global_step": 307663, "epoch": 1831} {"train_loss": -12.049320220947266, "global_step": 307664, "epoch": 1831} {"train_loss": -12.26718521118164, "global_step": 307665, "epoch": 1831} {"train_loss": -12.348482131958008, "global_step": 307666, "epoch": 1831} {"train_loss": -12.158058166503906, "global_step": 307667, "epoch": 1831} {"train_loss": -12.194076538085938, "global_step": 307668, "epoch": 1831} {"train_loss": -12.447834014892578, "global_step": 307669, "epoch": 1831} {"train_loss": -12.092466354370117, "global_step": 307670, "epoch": 1831} {"train_loss": -12.369325637817383, "global_step": 307671, "epoch": 1831} {"train_loss": -12.337272644042969, "global_step": 307672, "epoch": 1831} {"train_loss": -12.099897384643555, "global_step": 307673, "epoch": 1831} {"train_loss": -11.925896644592285, "global_step": 307674, "epoch": 1831} {"train_loss": -12.623798370361328, "global_step": 307675, "epoch": 1831} {"train_loss": -11.985020637512207, "global_step": 307676, "epoch": 1831} {"train_loss": -12.422883987426758, "global_step": 307677, "epoch": 1831} {"train_loss": -12.208717346191406, "global_step": 307678, "epoch": 1831} {"train_loss": -12.521284103393555, "global_step": 307679, "epoch": 1831} {"train_loss": -12.309860229492188, "global_step": 307680, "epoch": 1831} {"train_loss": -12.46884536743164, "global_step": 307681, "epoch": 1831} {"train_loss": -12.158835411071777, "global_step": 307682, "epoch": 1831} {"train_loss": -12.316261291503906, "global_step": 307683, "epoch": 1831} {"train_loss": -12.356082916259766, "global_step": 307684, "epoch": 1831} {"train_loss": -12.103711128234863, "global_step": 307685, "epoch": 1831} {"train_loss": -12.553077697753906, "global_step": 307686, "epoch": 1831} {"train_loss": -12.34878158569336, "global_step": 307687, "epoch": 1831} {"train_loss": -11.972620964050293, "global_step": 307688, "epoch": 1831} {"train_loss": -12.38062858581543, "global_step": 307689, "epoch": 1831} {"train_loss": -12.095878601074219, "global_step": 307690, "epoch": 1831} {"train_loss": -11.807840347290039, "global_step": 307691, "epoch": 1831} {"train_loss": -12.227664947509766, "global_step": 307692, "epoch": 1831} {"train_loss": -12.279987335205078, "global_step": 307693, "epoch": 1831} {"train_loss": -11.642046928405762, "global_step": 307694, "epoch": 1831} {"train_loss": -12.302577018737793, "global_step": 307695, "epoch": 1831} {"train_loss": -12.229124069213867, "global_step": 307696, "epoch": 1831} {"train_loss": -12.069820404052734, "global_step": 307697, "epoch": 1831} {"train_loss": -12.166851043701172, "global_step": 307698, "epoch": 1831} {"train_loss": -12.159217834472656, "global_step": 307699, "epoch": 1831} {"train_loss": -11.647174835205078, "global_step": 307700, "epoch": 1831} {"train_loss": -12.360307693481445, "global_step": 307701, "epoch": 1831} {"train_loss": -11.750170707702637, "global_step": 307702, "epoch": 1831} {"train_loss": -11.880356788635254, "global_step": 307703, "epoch": 1831} {"train_loss": -12.286165237426758, "global_step": 307704, "epoch": 1831} {"train_loss": -12.437759399414062, "global_step": 307705, "epoch": 1831} {"train_loss": -12.051704406738281, "global_step": 307706, "epoch": 1831} {"train_loss": -12.085884094238281, "global_step": 307707, "epoch": 1831} {"train_loss": -12.225671768188477, "global_step": 307708, "epoch": 1831} {"train_loss": -12.037689208984375, "global_step": 307709, "epoch": 1831} {"train_loss": -12.220975875854492, "global_step": 307710, "epoch": 1831} {"train_loss": -12.251532554626465, "global_step": 307711, "epoch": 1831} {"train_loss": -11.706653594970703, "global_step": 307712, "epoch": 1831} {"train_loss": -11.69812297821045, "global_step": 307713, "epoch": 1831} {"train_loss": -12.2120361328125, "global_step": 307714, "epoch": 1831} {"train_loss": -11.803699493408203, "global_step": 307715, "epoch": 1831} {"train_loss": -11.60439682006836, "global_step": 307716, "epoch": 1831} {"train_loss": -12.023187637329102, "global_step": 307717, "epoch": 1831} {"train_loss": -11.542213439941406, "global_step": 307718, "epoch": 1831} {"train_loss": -12.01340103149414, "global_step": 307719, "epoch": 1831} {"train_loss": -10.924263000488281, "global_step": 307720, "epoch": 1831} {"train_loss": -9.589531898498535, "global_step": 307721, "epoch": 1831} {"train_loss": -10.134361267089844, "global_step": 307722, "epoch": 1831} {"train_loss": -8.640083312988281, "global_step": 307723, "epoch": 1831} {"train_loss": -8.190924644470215, "global_step": 307724, "epoch": 1831} {"train_loss": -7.598892688751221, "global_step": 307725, "epoch": 1831} {"train_loss": -8.704703330993652, "global_step": 307726, "epoch": 1831} {"train_loss": -9.516292572021484, "global_step": 307727, "epoch": 1831} {"train_loss": -8.978599548339844, "global_step": 307728, "epoch": 1831} {"train_loss": -8.416848182678223, "global_step": 307729, "epoch": 1831} {"train_loss": -9.760137557983398, "global_step": 307730, "epoch": 1831} {"train_loss": -9.223033905029297, "global_step": 307731, "epoch": 1831} {"train_loss": -10.492000579833984, "global_step": 307732, "epoch": 1831} {"train_loss": -8.265838623046875, "global_step": 307733, "epoch": 1831} {"train_loss": -9.224699020385742, "global_step": 307734, "epoch": 1831} {"train_loss": -9.120630264282227, "global_step": 307735, "epoch": 1831} {"train_loss": -8.487823486328125, "global_step": 307736, "epoch": 1831} {"train_loss": -9.489670753479004, "global_step": 307737, "epoch": 1831} {"train_loss": -9.196748733520508, "global_step": 307738, "epoch": 1831} {"train_loss": -7.860010623931885, "global_step": 307739, "epoch": 1831} {"train_loss": -8.77983570098877, "global_step": 307740, "epoch": 1831} {"train_loss": -9.433341979980469, "global_step": 307741, "epoch": 1831} {"train_loss": -9.514472961425781, "global_step": 307742, "epoch": 1831} {"train_loss": -9.911378860473633, "global_step": 307743, "epoch": 1831} {"train_loss": -9.817354202270508, "global_step": 307744, "epoch": 1831} {"train_loss": -9.666824340820312, "global_step": 307745, "epoch": 1831} {"train_loss": -10.019636154174805, "global_step": 307746, "epoch": 1831} {"train_loss": -10.236995697021484, "global_step": 307747, "epoch": 1831} {"train_loss": -10.226153373718262, "global_step": 307748, "epoch": 1831} {"train_loss": -11.160799026489258, "global_step": 307749, "epoch": 1831} {"train_loss": -9.995711326599121, "global_step": 307750, "epoch": 1831} {"train_loss": -11.06883716583252, "global_step": 307751, "epoch": 1831} {"train_loss": -10.367914199829102, "global_step": 307752, "epoch": 1831} {"train_loss": -10.989593505859375, "global_step": 307753, "epoch": 1831} {"train_loss": -10.720101356506348, "global_step": 307754, "epoch": 1831} {"train_loss": -10.745366096496582, "global_step": 307755, "epoch": 1831} {"train_loss": -10.742768287658691, "global_step": 307756, "epoch": 1831} {"train_loss": -10.58210277557373, "global_step": 307757, "epoch": 1831} {"train_loss": -10.721441268920898, "global_step": 307758, "epoch": 1831} {"train_loss": -11.22340202331543, "global_step": 307759, "epoch": 1831} {"train_loss": -10.981937408447266, "global_step": 307760, "epoch": 1831} {"train_loss": -11.257232666015625, "global_step": 307761, "epoch": 1831} {"train_loss": -10.997880935668945, "global_step": 307762, "epoch": 1831} {"train_loss": -11.26984977722168, "global_step": 307763, "epoch": 1831} {"train_loss": -11.239923477172852, "global_step": 307764, "epoch": 1831} {"train_loss": -11.062257766723633, "global_step": 307765, "epoch": 1831} {"train_loss": -11.482063293457031, "global_step": 307766, "epoch": 1831} {"train_loss": -11.399654388427734, "global_step": 307767, "epoch": 1831} {"train_loss": -11.582599639892578, "global_step": 307768, "epoch": 1831} {"train_loss": -10.898357391357422, "global_step": 307769, "epoch": 1831} {"train_loss": -11.450969696044922, "global_step": 307770, "epoch": 1831} {"train_loss": -11.172508239746094, "global_step": 307771, "epoch": 1831} {"train_loss": -11.63022518157959, "global_step": 307772, "epoch": 1831} {"train_loss": -11.599833488464355, "global_step": 307773, "epoch": 1831} {"train_loss": -11.505208969116211, "global_step": 307774, "epoch": 1831} {"train_loss": -11.438980931327457, "global_step": 307775, "epoch": 1831, "val_loss": 272896.53125} {"train_loss": -11.244750022888184, "global_step": 307776, "epoch": 1832} {"train_loss": -11.648765563964844, "global_step": 307777, "epoch": 1832} {"train_loss": -11.596635818481445, "global_step": 307778, "epoch": 1832} {"train_loss": -11.680755615234375, "global_step": 307779, "epoch": 1832} {"train_loss": -11.72642707824707, "global_step": 307780, "epoch": 1832} {"train_loss": -11.6944580078125, "global_step": 307781, "epoch": 1832} {"train_loss": -11.584705352783203, "global_step": 307782, "epoch": 1832} {"train_loss": -11.429489135742188, "global_step": 307783, "epoch": 1832} {"train_loss": -11.738130569458008, "global_step": 307784, "epoch": 1832} {"train_loss": -11.73647403717041, "global_step": 307785, "epoch": 1832} {"train_loss": -11.808030128479004, "global_step": 307786, "epoch": 1832} {"train_loss": -11.855379104614258, "global_step": 307787, "epoch": 1832} {"train_loss": -11.805116653442383, "global_step": 307788, "epoch": 1832} {"train_loss": -12.003898620605469, "global_step": 307789, "epoch": 1832} {"train_loss": -11.98589038848877, "global_step": 307790, "epoch": 1832} {"train_loss": -11.912416458129883, "global_step": 307791, "epoch": 1832} {"train_loss": -12.033159255981445, "global_step": 307792, "epoch": 1832} {"train_loss": -11.863890647888184, "global_step": 307793, "epoch": 1832} {"train_loss": -12.107341766357422, "global_step": 307794, "epoch": 1832} {"train_loss": -11.830204010009766, "global_step": 307795, "epoch": 1832} {"train_loss": -11.886371612548828, "global_step": 307796, "epoch": 1832} {"train_loss": -12.060163497924805, "global_step": 307797, "epoch": 1832} {"train_loss": -12.056413650512695, "global_step": 307798, "epoch": 1832} {"train_loss": -12.132692337036133, "global_step": 307799, "epoch": 1832} {"train_loss": -11.724432945251465, "global_step": 307800, "epoch": 1832} {"train_loss": -11.813800811767578, "global_step": 307801, "epoch": 1832} {"train_loss": -12.223109245300293, "global_step": 307802, "epoch": 1832} {"train_loss": -11.895721435546875, "global_step": 307803, "epoch": 1832} {"train_loss": -11.927968978881836, "global_step": 307804, "epoch": 1832} {"train_loss": -11.958499908447266, "global_step": 307805, "epoch": 1832} {"train_loss": -12.092862129211426, "global_step": 307806, "epoch": 1832} {"train_loss": -12.035987854003906, "global_step": 307807, "epoch": 1832} {"train_loss": -12.031024932861328, "global_step": 307808, "epoch": 1832} {"train_loss": -12.056527137756348, "global_step": 307809, "epoch": 1832} {"train_loss": -11.874872207641602, "global_step": 307810, "epoch": 1832} {"train_loss": -12.031572341918945, "global_step": 307811, "epoch": 1832} {"train_loss": -12.069734573364258, "global_step": 307812, "epoch": 1832} {"train_loss": -12.119308471679688, "global_step": 307813, "epoch": 1832} {"train_loss": -12.249041557312012, "global_step": 307814, "epoch": 1832} {"train_loss": -12.090535163879395, "global_step": 307815, "epoch": 1832} {"train_loss": -12.312840461730957, "global_step": 307816, "epoch": 1832} {"train_loss": -12.179269790649414, "global_step": 307817, "epoch": 1832} {"train_loss": -12.269394874572754, "global_step": 307818, "epoch": 1832} {"train_loss": -12.213188171386719, "global_step": 307819, "epoch": 1832} {"train_loss": -12.248384475708008, "global_step": 307820, "epoch": 1832} {"train_loss": -12.052082061767578, "global_step": 307821, "epoch": 1832} {"train_loss": -12.209973335266113, "global_step": 307822, "epoch": 1832} {"train_loss": -12.225549697875977, "global_step": 307823, "epoch": 1832} {"train_loss": -12.161101341247559, "global_step": 307824, "epoch": 1832} {"train_loss": -12.225481033325195, "global_step": 307825, "epoch": 1832} {"train_loss": -12.440250396728516, "global_step": 307826, "epoch": 1832} {"train_loss": -12.19389533996582, "global_step": 307827, "epoch": 1832} {"train_loss": -12.22641372680664, "global_step": 307828, "epoch": 1832} {"train_loss": -12.294994354248047, "global_step": 307829, "epoch": 1832} {"train_loss": -12.41218090057373, "global_step": 307830, "epoch": 1832} {"train_loss": -12.370302200317383, "global_step": 307831, "epoch": 1832} {"train_loss": -12.24268627166748, "global_step": 307832, "epoch": 1832} {"train_loss": -12.397662162780762, "global_step": 307833, "epoch": 1832} {"train_loss": -12.46384048461914, "global_step": 307834, "epoch": 1832} {"train_loss": -12.352779388427734, "global_step": 307835, "epoch": 1832} {"train_loss": -12.526422500610352, "global_step": 307836, "epoch": 1832} {"train_loss": -12.287483215332031, "global_step": 307837, "epoch": 1832} {"train_loss": -12.473533630371094, "global_step": 307838, "epoch": 1832} {"train_loss": -12.44126033782959, "global_step": 307839, "epoch": 1832} {"train_loss": -12.429771423339844, "global_step": 307840, "epoch": 1832} {"train_loss": -12.37983512878418, "global_step": 307841, "epoch": 1832} {"train_loss": -12.478492736816406, "global_step": 307842, "epoch": 1832} {"train_loss": -12.520172119140625, "global_step": 307843, "epoch": 1832} {"train_loss": -12.390512466430664, "global_step": 307844, "epoch": 1832} {"train_loss": -12.347957611083984, "global_step": 307845, "epoch": 1832} {"train_loss": -12.542383193969727, "global_step": 307846, "epoch": 1832} {"train_loss": -12.187291145324707, "global_step": 307847, "epoch": 1832} {"train_loss": -12.276437759399414, "global_step": 307848, "epoch": 1832} {"train_loss": -12.029026985168457, "global_step": 307849, "epoch": 1832} {"train_loss": -12.076168060302734, "global_step": 307850, "epoch": 1832} {"train_loss": -12.122259140014648, "global_step": 307851, "epoch": 1832} {"train_loss": -12.393547058105469, "global_step": 307852, "epoch": 1832} {"train_loss": -11.634157180786133, "global_step": 307853, "epoch": 1832} {"train_loss": -12.543073654174805, "global_step": 307854, "epoch": 1832} {"train_loss": -11.735611915588379, "global_step": 307855, "epoch": 1832} {"train_loss": -12.141721725463867, "global_step": 307856, "epoch": 1832} {"train_loss": -11.511297225952148, "global_step": 307857, "epoch": 1832} {"train_loss": -12.290579795837402, "global_step": 307858, "epoch": 1832} {"train_loss": -11.790695190429688, "global_step": 307859, "epoch": 1832} {"train_loss": -12.086119651794434, "global_step": 307860, "epoch": 1832} {"train_loss": -11.217458724975586, "global_step": 307861, "epoch": 1832} {"train_loss": -11.276308059692383, "global_step": 307862, "epoch": 1832} {"train_loss": -11.406803131103516, "global_step": 307863, "epoch": 1832} {"train_loss": -9.516241073608398, "global_step": 307864, "epoch": 1832} {"train_loss": -9.488868713378906, "global_step": 307865, "epoch": 1832} {"train_loss": -10.562699317932129, "global_step": 307866, "epoch": 1832} {"train_loss": -7.654826641082764, "global_step": 307867, "epoch": 1832} {"train_loss": -8.146551132202148, "global_step": 307868, "epoch": 1832} {"train_loss": -8.392693519592285, "global_step": 307869, "epoch": 1832} {"train_loss": -9.162835121154785, "global_step": 307870, "epoch": 1832} {"train_loss": -9.43740463256836, "global_step": 307871, "epoch": 1832} {"train_loss": -9.701271057128906, "global_step": 307872, "epoch": 1832} {"train_loss": -9.499838829040527, "global_step": 307873, "epoch": 1832} {"train_loss": -10.153165817260742, "global_step": 307874, "epoch": 1832} {"train_loss": -10.770092010498047, "global_step": 307875, "epoch": 1832} {"train_loss": -10.732686042785645, "global_step": 307876, "epoch": 1832} {"train_loss": -11.419771194458008, "global_step": 307877, "epoch": 1832} {"train_loss": -11.094791412353516, "global_step": 307878, "epoch": 1832} {"train_loss": -10.840818405151367, "global_step": 307879, "epoch": 1832} {"train_loss": -10.843840599060059, "global_step": 307880, "epoch": 1832} {"train_loss": -10.893216133117676, "global_step": 307881, "epoch": 1832} {"train_loss": -10.82455062866211, "global_step": 307882, "epoch": 1832} {"train_loss": -11.054435729980469, "global_step": 307883, "epoch": 1832} {"train_loss": -11.03504467010498, "global_step": 307884, "epoch": 1832} {"train_loss": -11.306547164916992, "global_step": 307885, "epoch": 1832} {"train_loss": -10.990874290466309, "global_step": 307886, "epoch": 1832} {"train_loss": -11.118729591369629, "global_step": 307887, "epoch": 1832} {"train_loss": -10.334624290466309, "global_step": 307888, "epoch": 1832} {"train_loss": -10.560413360595703, "global_step": 307889, "epoch": 1832} {"train_loss": -11.567407608032227, "global_step": 307890, "epoch": 1832} {"train_loss": -10.668525695800781, "global_step": 307891, "epoch": 1832} {"train_loss": -11.612112045288086, "global_step": 307892, "epoch": 1832} {"train_loss": -10.82932186126709, "global_step": 307893, "epoch": 1832} {"train_loss": -10.930268287658691, "global_step": 307894, "epoch": 1832} {"train_loss": -10.896886825561523, "global_step": 307895, "epoch": 1832} {"train_loss": -11.318756103515625, "global_step": 307896, "epoch": 1832} {"train_loss": -10.80458927154541, "global_step": 307897, "epoch": 1832} {"train_loss": -10.997655868530273, "global_step": 307898, "epoch": 1832} {"train_loss": -11.327287673950195, "global_step": 307899, "epoch": 1832} {"train_loss": -11.156305313110352, "global_step": 307900, "epoch": 1832} {"train_loss": -11.793447494506836, "global_step": 307901, "epoch": 1832} {"train_loss": -10.568923950195312, "global_step": 307902, "epoch": 1832} {"train_loss": -11.244966506958008, "global_step": 307903, "epoch": 1832} {"train_loss": -10.884882926940918, "global_step": 307904, "epoch": 1832} {"train_loss": -11.43281078338623, "global_step": 307905, "epoch": 1832} {"train_loss": -10.910520553588867, "global_step": 307906, "epoch": 1832} {"train_loss": -11.257989883422852, "global_step": 307907, "epoch": 1832} {"train_loss": -11.09061336517334, "global_step": 307908, "epoch": 1832} {"train_loss": -11.301361083984375, "global_step": 307909, "epoch": 1832} {"train_loss": -11.348917007446289, "global_step": 307910, "epoch": 1832} {"train_loss": -11.062097549438477, "global_step": 307911, "epoch": 1832} {"train_loss": -11.410222053527832, "global_step": 307912, "epoch": 1832} {"train_loss": -11.026358604431152, "global_step": 307913, "epoch": 1832} {"train_loss": -11.46320915222168, "global_step": 307914, "epoch": 1832} {"train_loss": -11.0712890625, "global_step": 307915, "epoch": 1832} {"train_loss": -11.321402549743652, "global_step": 307916, "epoch": 1832} {"train_loss": -11.492420196533203, "global_step": 307917, "epoch": 1832} {"train_loss": -10.995716094970703, "global_step": 307918, "epoch": 1832} {"train_loss": -11.6212739944458, "global_step": 307919, "epoch": 1832} {"train_loss": -11.353683471679688, "global_step": 307920, "epoch": 1832} {"train_loss": -11.380398750305176, "global_step": 307921, "epoch": 1832} {"train_loss": -11.688490867614746, "global_step": 307922, "epoch": 1832} {"train_loss": -11.340354919433594, "global_step": 307923, "epoch": 1832} {"train_loss": -11.755607604980469, "global_step": 307924, "epoch": 1832} {"train_loss": -11.87557601928711, "global_step": 307925, "epoch": 1832} {"train_loss": -11.514759063720703, "global_step": 307926, "epoch": 1832} {"train_loss": -11.925021171569824, "global_step": 307927, "epoch": 1832} {"train_loss": -11.912908554077148, "global_step": 307928, "epoch": 1832} {"train_loss": -11.739858627319336, "global_step": 307929, "epoch": 1832} {"train_loss": -11.937843322753906, "global_step": 307930, "epoch": 1832} {"train_loss": -11.895862579345703, "global_step": 307931, "epoch": 1832} {"train_loss": -11.598196029663086, "global_step": 307932, "epoch": 1832} {"train_loss": -12.007604598999023, "global_step": 307933, "epoch": 1832} {"train_loss": -12.023972511291504, "global_step": 307934, "epoch": 1832} {"train_loss": -12.01896858215332, "global_step": 307935, "epoch": 1832} {"train_loss": -12.029520988464355, "global_step": 307936, "epoch": 1832} {"train_loss": -11.7560453414917, "global_step": 307937, "epoch": 1832} {"train_loss": -11.880533218383789, "global_step": 307938, "epoch": 1832} {"train_loss": -11.963683128356934, "global_step": 307939, "epoch": 1832} {"train_loss": -11.861856460571289, "global_step": 307940, "epoch": 1832} {"train_loss": -11.632987976074219, "global_step": 307941, "epoch": 1832} {"train_loss": -11.975992202758789, "global_step": 307942, "epoch": 1832} {"train_loss": -11.575076599915823, "global_step": 307943, "epoch": 1832, "val_loss": 282342.53125} {"train_loss": -11.930337905883789, "global_step": 307944, "epoch": 1833} {"train_loss": -12.241314888000488, "global_step": 307945, "epoch": 1833} {"train_loss": -11.96254825592041, "global_step": 307946, "epoch": 1833} {"train_loss": -11.94825553894043, "global_step": 307947, "epoch": 1833} {"train_loss": -12.316472053527832, "global_step": 307948, "epoch": 1833} {"train_loss": -12.011781692504883, "global_step": 307949, "epoch": 1833} {"train_loss": -12.132000923156738, "global_step": 307950, "epoch": 1833} {"train_loss": -12.283525466918945, "global_step": 307951, "epoch": 1833} {"train_loss": -12.004870414733887, "global_step": 307952, "epoch": 1833} {"train_loss": -12.280412673950195, "global_step": 307953, "epoch": 1833} {"train_loss": -11.912094116210938, "global_step": 307954, "epoch": 1833} {"train_loss": -12.367084503173828, "global_step": 307955, "epoch": 1833} {"train_loss": -12.025812149047852, "global_step": 307956, "epoch": 1833} {"train_loss": -12.231128692626953, "global_step": 307957, "epoch": 1833} {"train_loss": -12.234869003295898, "global_step": 307958, "epoch": 1833} {"train_loss": -11.931517601013184, "global_step": 307959, "epoch": 1833} {"train_loss": -12.277261734008789, "global_step": 307960, "epoch": 1833} {"train_loss": -12.105802536010742, "global_step": 307961, "epoch": 1833} {"train_loss": -12.394712448120117, "global_step": 307962, "epoch": 1833} {"train_loss": -12.117188453674316, "global_step": 307963, "epoch": 1833} {"train_loss": -12.280501365661621, "global_step": 307964, "epoch": 1833} {"train_loss": -12.066081047058105, "global_step": 307965, "epoch": 1833} {"train_loss": -12.415607452392578, "global_step": 307966, "epoch": 1833} {"train_loss": -12.327885627746582, "global_step": 307967, "epoch": 1833} {"train_loss": -12.388640403747559, "global_step": 307968, "epoch": 1833} {"train_loss": -12.267655372619629, "global_step": 307969, "epoch": 1833} {"train_loss": -12.396269798278809, "global_step": 307970, "epoch": 1833} {"train_loss": -12.30364990234375, "global_step": 307971, "epoch": 1833} {"train_loss": -12.440370559692383, "global_step": 307972, "epoch": 1833} {"train_loss": -12.488372802734375, "global_step": 307973, "epoch": 1833} {"train_loss": -12.425270080566406, "global_step": 307974, "epoch": 1833} {"train_loss": -12.426464080810547, "global_step": 307975, "epoch": 1833} {"train_loss": -12.46072006225586, "global_step": 307976, "epoch": 1833} {"train_loss": -12.38711929321289, "global_step": 307977, "epoch": 1833} {"train_loss": -12.434440612792969, "global_step": 307978, "epoch": 1833} {"train_loss": -12.416711807250977, "global_step": 307979, "epoch": 1833} {"train_loss": -12.31080436706543, "global_step": 307980, "epoch": 1833} {"train_loss": -12.109696388244629, "global_step": 307981, "epoch": 1833} {"train_loss": -12.527960777282715, "global_step": 307982, "epoch": 1833} {"train_loss": -12.047223091125488, "global_step": 307983, "epoch": 1833} {"train_loss": -12.410839080810547, "global_step": 307984, "epoch": 1833} {"train_loss": -12.40886116027832, "global_step": 307985, "epoch": 1833} {"train_loss": -11.984978675842285, "global_step": 307986, "epoch": 1833} {"train_loss": -12.190262794494629, "global_step": 307987, "epoch": 1833} {"train_loss": -12.122472763061523, "global_step": 307988, "epoch": 1833} {"train_loss": -11.993471145629883, "global_step": 307989, "epoch": 1833} {"train_loss": -12.226644515991211, "global_step": 307990, "epoch": 1833} {"train_loss": -11.782419204711914, "global_step": 307991, "epoch": 1833} {"train_loss": -12.305598258972168, "global_step": 307992, "epoch": 1833} {"train_loss": -12.393853187561035, "global_step": 307993, "epoch": 1833} {"train_loss": -12.023296356201172, "global_step": 307994, "epoch": 1833} {"train_loss": -11.384943962097168, "global_step": 307995, "epoch": 1833} {"train_loss": -12.29590129852295, "global_step": 307996, "epoch": 1833} {"train_loss": -12.072755813598633, "global_step": 307997, "epoch": 1833} {"train_loss": -11.335314750671387, "global_step": 307998, "epoch": 1833} {"train_loss": -12.42611312866211, "global_step": 307999, "epoch": 1833} {"train_loss": -11.089885711669922, "global_step": 308000, "epoch": 1833} {"train_loss": -12.0574951171875, "global_step": 308001, "epoch": 1833} {"train_loss": -11.809732437133789, "global_step": 308002, "epoch": 1833} {"train_loss": -11.833904266357422, "global_step": 308003, "epoch": 1833} {"train_loss": -12.327532768249512, "global_step": 308004, "epoch": 1833} {"train_loss": -11.76244068145752, "global_step": 308005, "epoch": 1833} {"train_loss": -12.24382209777832, "global_step": 308006, "epoch": 1833} {"train_loss": -12.205211639404297, "global_step": 308007, "epoch": 1833} {"train_loss": -11.97531795501709, "global_step": 308008, "epoch": 1833} {"train_loss": -12.179119110107422, "global_step": 308009, "epoch": 1833} {"train_loss": -12.237064361572266, "global_step": 308010, "epoch": 1833} {"train_loss": -12.046590805053711, "global_step": 308011, "epoch": 1833} {"train_loss": -12.366432189941406, "global_step": 308012, "epoch": 1833} {"train_loss": -12.33072280883789, "global_step": 308013, "epoch": 1833} {"train_loss": -12.28321647644043, "global_step": 308014, "epoch": 1833} {"train_loss": -12.435944557189941, "global_step": 308015, "epoch": 1833} {"train_loss": -12.479118347167969, "global_step": 308016, "epoch": 1833} {"train_loss": -12.15921401977539, "global_step": 308017, "epoch": 1833} {"train_loss": -12.213859558105469, "global_step": 308018, "epoch": 1833} {"train_loss": -12.1109619140625, "global_step": 308019, "epoch": 1833} {"train_loss": -12.220247268676758, "global_step": 308020, "epoch": 1833} {"train_loss": -12.046331405639648, "global_step": 308021, "epoch": 1833} {"train_loss": -12.350025177001953, "global_step": 308022, "epoch": 1833} {"train_loss": -12.288118362426758, "global_step": 308023, "epoch": 1833} {"train_loss": -12.271254539489746, "global_step": 308024, "epoch": 1833} {"train_loss": -12.209243774414062, "global_step": 308025, "epoch": 1833} {"train_loss": -12.670568466186523, "global_step": 308026, "epoch": 1833} {"train_loss": -12.401470184326172, "global_step": 308027, "epoch": 1833} {"train_loss": -12.282097816467285, "global_step": 308028, "epoch": 1833} {"train_loss": -12.165763854980469, "global_step": 308029, "epoch": 1833} {"train_loss": -12.275103569030762, "global_step": 308030, "epoch": 1833} {"train_loss": -11.799602508544922, "global_step": 308031, "epoch": 1833} {"train_loss": -12.130739212036133, "global_step": 308032, "epoch": 1833} {"train_loss": -12.342900276184082, "global_step": 308033, "epoch": 1833} {"train_loss": -11.278207778930664, "global_step": 308034, "epoch": 1833} {"train_loss": -10.946966171264648, "global_step": 308035, "epoch": 1833} {"train_loss": -12.372827529907227, "global_step": 308036, "epoch": 1833} {"train_loss": -11.776222229003906, "global_step": 308037, "epoch": 1833} {"train_loss": -11.060821533203125, "global_step": 308038, "epoch": 1833} {"train_loss": -12.256671905517578, "global_step": 308039, "epoch": 1833} {"train_loss": -10.750049591064453, "global_step": 308040, "epoch": 1833} {"train_loss": -10.353282928466797, "global_step": 308041, "epoch": 1833} {"train_loss": -11.748159408569336, "global_step": 308042, "epoch": 1833} {"train_loss": -11.825525283813477, "global_step": 308043, "epoch": 1833} {"train_loss": -10.905845642089844, "global_step": 308044, "epoch": 1833} {"train_loss": -10.98680305480957, "global_step": 308045, "epoch": 1833} {"train_loss": -11.860250473022461, "global_step": 308046, "epoch": 1833} {"train_loss": -11.039213180541992, "global_step": 308047, "epoch": 1833} {"train_loss": -11.144462585449219, "global_step": 308048, "epoch": 1833} {"train_loss": -11.32176685333252, "global_step": 308049, "epoch": 1833} {"train_loss": -11.773345947265625, "global_step": 308050, "epoch": 1833} {"train_loss": -10.728171348571777, "global_step": 308051, "epoch": 1833} {"train_loss": -12.104930877685547, "global_step": 308052, "epoch": 1833} {"train_loss": -11.182743072509766, "global_step": 308053, "epoch": 1833} {"train_loss": -11.589818000793457, "global_step": 308054, "epoch": 1833} {"train_loss": -11.422466278076172, "global_step": 308055, "epoch": 1833} {"train_loss": -10.307218551635742, "global_step": 308056, "epoch": 1833} {"train_loss": -12.171382904052734, "global_step": 308057, "epoch": 1833} {"train_loss": -10.119683265686035, "global_step": 308058, "epoch": 1833} {"train_loss": -12.226795196533203, "global_step": 308059, "epoch": 1833} {"train_loss": -10.021444320678711, "global_step": 308060, "epoch": 1833} {"train_loss": -11.406688690185547, "global_step": 308061, "epoch": 1833} {"train_loss": -10.92466926574707, "global_step": 308062, "epoch": 1833} {"train_loss": -10.661338806152344, "global_step": 308063, "epoch": 1833} {"train_loss": -11.362571716308594, "global_step": 308064, "epoch": 1833} {"train_loss": -10.728796005249023, "global_step": 308065, "epoch": 1833} {"train_loss": -11.181276321411133, "global_step": 308066, "epoch": 1833} {"train_loss": -11.253310203552246, "global_step": 308067, "epoch": 1833} {"train_loss": -11.827103614807129, "global_step": 308068, "epoch": 1833} {"train_loss": -11.41057014465332, "global_step": 308069, "epoch": 1833} {"train_loss": -11.782925605773926, "global_step": 308070, "epoch": 1833} {"train_loss": -11.281976699829102, "global_step": 308071, "epoch": 1833} {"train_loss": -11.291812896728516, "global_step": 308072, "epoch": 1833} {"train_loss": -11.352703094482422, "global_step": 308073, "epoch": 1833} {"train_loss": -11.389196395874023, "global_step": 308074, "epoch": 1833} {"train_loss": -11.933001518249512, "global_step": 308075, "epoch": 1833} {"train_loss": -11.360868453979492, "global_step": 308076, "epoch": 1833} {"train_loss": -11.90084457397461, "global_step": 308077, "epoch": 1833} {"train_loss": -11.376458168029785, "global_step": 308078, "epoch": 1833} {"train_loss": -11.656393051147461, "global_step": 308079, "epoch": 1833} {"train_loss": -11.144523620605469, "global_step": 308080, "epoch": 1833} {"train_loss": -11.616632461547852, "global_step": 308081, "epoch": 1833} {"train_loss": -11.489439010620117, "global_step": 308082, "epoch": 1833} {"train_loss": -11.8399019241333, "global_step": 308083, "epoch": 1833} {"train_loss": -11.525171279907227, "global_step": 308084, "epoch": 1833} {"train_loss": -11.279600143432617, "global_step": 308085, "epoch": 1833} {"train_loss": -11.915018081665039, "global_step": 308086, "epoch": 1833} {"train_loss": -11.497320175170898, "global_step": 308087, "epoch": 1833} {"train_loss": -11.830839157104492, "global_step": 308088, "epoch": 1833} {"train_loss": -11.890705108642578, "global_step": 308089, "epoch": 1833} {"train_loss": -11.723276138305664, "global_step": 308090, "epoch": 1833} {"train_loss": -11.897089958190918, "global_step": 308091, "epoch": 1833} {"train_loss": -11.800838470458984, "global_step": 308092, "epoch": 1833} {"train_loss": -11.666478157043457, "global_step": 308093, "epoch": 1833} {"train_loss": -11.673545837402344, "global_step": 308094, "epoch": 1833} {"train_loss": -11.89434814453125, "global_step": 308095, "epoch": 1833} {"train_loss": -12.009353637695312, "global_step": 308096, "epoch": 1833} {"train_loss": -11.83346939086914, "global_step": 308097, "epoch": 1833} {"train_loss": -12.17271614074707, "global_step": 308098, "epoch": 1833} {"train_loss": -11.969676971435547, "global_step": 308099, "epoch": 1833} {"train_loss": -12.128570556640625, "global_step": 308100, "epoch": 1833} {"train_loss": -11.995399475097656, "global_step": 308101, "epoch": 1833} {"train_loss": -12.09771728515625, "global_step": 308102, "epoch": 1833} {"train_loss": -11.83115005493164, "global_step": 308103, "epoch": 1833} {"train_loss": -12.140169143676758, "global_step": 308104, "epoch": 1833} {"train_loss": -12.058935165405273, "global_step": 308105, "epoch": 1833} {"train_loss": -12.101449966430664, "global_step": 308106, "epoch": 1833} {"train_loss": -12.185098648071289, "global_step": 308107, "epoch": 1833} {"train_loss": -11.912861824035645, "global_step": 308108, "epoch": 1833} {"train_loss": -12.04880142211914, "global_step": 308109, "epoch": 1833} {"train_loss": -12.262724876403809, "global_step": 308110, "epoch": 1833} {"train_loss": -11.890448553221566, "global_step": 308111, "epoch": 1833, "val_loss": 281979.28125} {"train_loss": -12.16896915435791, "global_step": 308112, "epoch": 1834} {"train_loss": -12.313766479492188, "global_step": 308113, "epoch": 1834} {"train_loss": -12.160375595092773, "global_step": 308114, "epoch": 1834} {"train_loss": -12.405715942382812, "global_step": 308115, "epoch": 1834} {"train_loss": -12.332769393920898, "global_step": 308116, "epoch": 1834} {"train_loss": -12.063023567199707, "global_step": 308117, "epoch": 1834} {"train_loss": -12.2619047164917, "global_step": 308118, "epoch": 1834} {"train_loss": -12.265167236328125, "global_step": 308119, "epoch": 1834} {"train_loss": -12.434846878051758, "global_step": 308120, "epoch": 1834} {"train_loss": -12.257736206054688, "global_step": 308121, "epoch": 1834} {"train_loss": -12.18380355834961, "global_step": 308122, "epoch": 1834} {"train_loss": -12.255781173706055, "global_step": 308123, "epoch": 1834} {"train_loss": -12.406498908996582, "global_step": 308124, "epoch": 1834} {"train_loss": -12.061251640319824, "global_step": 308125, "epoch": 1834} {"train_loss": -12.364505767822266, "global_step": 308126, "epoch": 1834} {"train_loss": -11.879562377929688, "global_step": 308127, "epoch": 1834} {"train_loss": -12.353219985961914, "global_step": 308128, "epoch": 1834} {"train_loss": -12.350203514099121, "global_step": 308129, "epoch": 1834} {"train_loss": -12.41972541809082, "global_step": 308130, "epoch": 1834} {"train_loss": -12.037957191467285, "global_step": 308131, "epoch": 1834} {"train_loss": -12.021883964538574, "global_step": 308132, "epoch": 1834} {"train_loss": -12.475822448730469, "global_step": 308133, "epoch": 1834} {"train_loss": -11.953969955444336, "global_step": 308134, "epoch": 1834} {"train_loss": -11.522135734558105, "global_step": 308135, "epoch": 1834} {"train_loss": -11.118938446044922, "global_step": 308136, "epoch": 1834} {"train_loss": -12.055032730102539, "global_step": 308137, "epoch": 1834} {"train_loss": -10.665491104125977, "global_step": 308138, "epoch": 1834} {"train_loss": -10.834753036499023, "global_step": 308139, "epoch": 1834} {"train_loss": -12.307917594909668, "global_step": 308140, "epoch": 1834} {"train_loss": -11.874493598937988, "global_step": 308141, "epoch": 1834} {"train_loss": -11.492720603942871, "global_step": 308142, "epoch": 1834} {"train_loss": -11.911590576171875, "global_step": 308143, "epoch": 1834} {"train_loss": -11.883501052856445, "global_step": 308144, "epoch": 1834} {"train_loss": -11.667654037475586, "global_step": 308145, "epoch": 1834} {"train_loss": -12.319501876831055, "global_step": 308146, "epoch": 1834} {"train_loss": -11.987829208374023, "global_step": 308147, "epoch": 1834} {"train_loss": -12.052603721618652, "global_step": 308148, "epoch": 1834} {"train_loss": -12.251676559448242, "global_step": 308149, "epoch": 1834} {"train_loss": -12.196342468261719, "global_step": 308150, "epoch": 1834} {"train_loss": -12.03007698059082, "global_step": 308151, "epoch": 1834} {"train_loss": -12.497579574584961, "global_step": 308152, "epoch": 1834} {"train_loss": -11.991395950317383, "global_step": 308153, "epoch": 1834} {"train_loss": -12.079362869262695, "global_step": 308154, "epoch": 1834} {"train_loss": -11.932589530944824, "global_step": 308155, "epoch": 1834} {"train_loss": -12.419731140136719, "global_step": 308156, "epoch": 1834} {"train_loss": -11.990432739257812, "global_step": 308157, "epoch": 1834} {"train_loss": -12.470653533935547, "global_step": 308158, "epoch": 1834} {"train_loss": -11.992523193359375, "global_step": 308159, "epoch": 1834} {"train_loss": -12.312528610229492, "global_step": 308160, "epoch": 1834} {"train_loss": -12.117990493774414, "global_step": 308161, "epoch": 1834} {"train_loss": -12.421995162963867, "global_step": 308162, "epoch": 1834} {"train_loss": -11.849689483642578, "global_step": 308163, "epoch": 1834} {"train_loss": -12.168435096740723, "global_step": 308164, "epoch": 1834} {"train_loss": -12.228893280029297, "global_step": 308165, "epoch": 1834} {"train_loss": -12.126045227050781, "global_step": 308166, "epoch": 1834} {"train_loss": -12.175384521484375, "global_step": 308167, "epoch": 1834} {"train_loss": -12.275146484375, "global_step": 308168, "epoch": 1834} {"train_loss": -12.299501419067383, "global_step": 308169, "epoch": 1834} {"train_loss": -12.31988525390625, "global_step": 308170, "epoch": 1834} {"train_loss": -12.307243347167969, "global_step": 308171, "epoch": 1834} {"train_loss": -12.262269973754883, "global_step": 308172, "epoch": 1834} {"train_loss": -12.432231903076172, "global_step": 308173, "epoch": 1834} {"train_loss": -12.476070404052734, "global_step": 308174, "epoch": 1834} {"train_loss": -12.330350875854492, "global_step": 308175, "epoch": 1834} {"train_loss": -12.364230155944824, "global_step": 308176, "epoch": 1834} {"train_loss": -12.548568725585938, "global_step": 308177, "epoch": 1834} {"train_loss": -12.386497497558594, "global_step": 308178, "epoch": 1834} {"train_loss": -12.448633193969727, "global_step": 308179, "epoch": 1834} {"train_loss": -12.40802001953125, "global_step": 308180, "epoch": 1834} {"train_loss": -12.61102294921875, "global_step": 308181, "epoch": 1834} {"train_loss": -12.251974105834961, "global_step": 308182, "epoch": 1834} {"train_loss": -12.313405990600586, "global_step": 308183, "epoch": 1834} {"train_loss": -12.201440811157227, "global_step": 308184, "epoch": 1834} {"train_loss": -12.300350189208984, "global_step": 308185, "epoch": 1834} {"train_loss": -12.259366989135742, "global_step": 308186, "epoch": 1834} {"train_loss": -11.90163516998291, "global_step": 308187, "epoch": 1834} {"train_loss": -11.989755630493164, "global_step": 308188, "epoch": 1834} {"train_loss": -12.52175235748291, "global_step": 308189, "epoch": 1834} {"train_loss": -12.252474784851074, "global_step": 308190, "epoch": 1834} {"train_loss": -12.239112854003906, "global_step": 308191, "epoch": 1834} {"train_loss": -12.487346649169922, "global_step": 308192, "epoch": 1834} {"train_loss": -11.720890045166016, "global_step": 308193, "epoch": 1834} {"train_loss": -11.544124603271484, "global_step": 308194, "epoch": 1834} {"train_loss": -12.127181053161621, "global_step": 308195, "epoch": 1834} {"train_loss": -11.044649124145508, "global_step": 308196, "epoch": 1834} {"train_loss": -10.59222412109375, "global_step": 308197, "epoch": 1834} {"train_loss": -11.979296684265137, "global_step": 308198, "epoch": 1834} {"train_loss": -11.813314437866211, "global_step": 308199, "epoch": 1834} {"train_loss": -10.709007263183594, "global_step": 308200, "epoch": 1834} {"train_loss": -11.252650260925293, "global_step": 308201, "epoch": 1834} {"train_loss": -12.326345443725586, "global_step": 308202, "epoch": 1834} {"train_loss": -11.66054916381836, "global_step": 308203, "epoch": 1834} {"train_loss": -11.805506706237793, "global_step": 308204, "epoch": 1834} {"train_loss": -11.75697135925293, "global_step": 308205, "epoch": 1834} {"train_loss": -11.149004936218262, "global_step": 308206, "epoch": 1834} {"train_loss": -12.09347152709961, "global_step": 308207, "epoch": 1834} {"train_loss": -11.877725601196289, "global_step": 308208, "epoch": 1834} {"train_loss": -11.410951614379883, "global_step": 308209, "epoch": 1834} {"train_loss": -12.014304161071777, "global_step": 308210, "epoch": 1834} {"train_loss": -11.319581985473633, "global_step": 308211, "epoch": 1834} {"train_loss": -12.194522857666016, "global_step": 308212, "epoch": 1834} {"train_loss": -11.574844360351562, "global_step": 308213, "epoch": 1834} {"train_loss": -11.938273429870605, "global_step": 308214, "epoch": 1834} {"train_loss": -11.30366325378418, "global_step": 308215, "epoch": 1834} {"train_loss": -11.040190696716309, "global_step": 308216, "epoch": 1834} {"train_loss": -10.197332382202148, "global_step": 308217, "epoch": 1834} {"train_loss": -10.798625946044922, "global_step": 308218, "epoch": 1834} {"train_loss": -11.378969192504883, "global_step": 308219, "epoch": 1834} {"train_loss": -10.761387825012207, "global_step": 308220, "epoch": 1834} {"train_loss": -11.264652252197266, "global_step": 308221, "epoch": 1834} {"train_loss": -11.326254844665527, "global_step": 308222, "epoch": 1834} {"train_loss": -11.252832412719727, "global_step": 308223, "epoch": 1834} {"train_loss": -11.212003707885742, "global_step": 308224, "epoch": 1834} {"train_loss": -10.490303039550781, "global_step": 308225, "epoch": 1834} {"train_loss": -10.760080337524414, "global_step": 308226, "epoch": 1834} {"train_loss": -11.123540878295898, "global_step": 308227, "epoch": 1834} {"train_loss": -10.93525505065918, "global_step": 308228, "epoch": 1834} {"train_loss": -9.991557121276855, "global_step": 308229, "epoch": 1834} {"train_loss": -11.218482971191406, "global_step": 308230, "epoch": 1834} {"train_loss": -10.528909683227539, "global_step": 308231, "epoch": 1834} {"train_loss": -9.683794021606445, "global_step": 308232, "epoch": 1834} {"train_loss": -11.017253875732422, "global_step": 308233, "epoch": 1834} {"train_loss": -11.17243480682373, "global_step": 308234, "epoch": 1834} {"train_loss": -10.925670623779297, "global_step": 308235, "epoch": 1834} {"train_loss": -11.336368560791016, "global_step": 308236, "epoch": 1834} {"train_loss": -10.835655212402344, "global_step": 308237, "epoch": 1834} {"train_loss": -10.874013900756836, "global_step": 308238, "epoch": 1834} {"train_loss": -10.980528831481934, "global_step": 308239, "epoch": 1834} {"train_loss": -11.31197738647461, "global_step": 308240, "epoch": 1834} {"train_loss": -10.678060531616211, "global_step": 308241, "epoch": 1834} {"train_loss": -11.049623489379883, "global_step": 308242, "epoch": 1834} {"train_loss": -10.713945388793945, "global_step": 308243, "epoch": 1834} {"train_loss": -10.708467483520508, "global_step": 308244, "epoch": 1834} {"train_loss": -10.772212982177734, "global_step": 308245, "epoch": 1834} {"train_loss": -11.803611755371094, "global_step": 308246, "epoch": 1834} {"train_loss": -10.78260612487793, "global_step": 308247, "epoch": 1834} {"train_loss": -11.702109336853027, "global_step": 308248, "epoch": 1834} {"train_loss": -10.420936584472656, "global_step": 308249, "epoch": 1834} {"train_loss": -11.50798511505127, "global_step": 308250, "epoch": 1834} {"train_loss": -11.192668914794922, "global_step": 308251, "epoch": 1834} {"train_loss": -11.840699195861816, "global_step": 308252, "epoch": 1834} {"train_loss": -10.975530624389648, "global_step": 308253, "epoch": 1834} {"train_loss": -11.625670433044434, "global_step": 308254, "epoch": 1834} {"train_loss": -10.733479499816895, "global_step": 308255, "epoch": 1834} {"train_loss": -11.768041610717773, "global_step": 308256, "epoch": 1834} {"train_loss": -11.610834121704102, "global_step": 308257, "epoch": 1834} {"train_loss": -11.356618881225586, "global_step": 308258, "epoch": 1834} {"train_loss": -11.732852935791016, "global_step": 308259, "epoch": 1834} {"train_loss": -12.099905967712402, "global_step": 308260, "epoch": 1834} {"train_loss": -11.584070205688477, "global_step": 308261, "epoch": 1834} {"train_loss": -12.015213012695312, "global_step": 308262, "epoch": 1834} {"train_loss": -11.575094223022461, "global_step": 308263, "epoch": 1834} {"train_loss": -11.837370872497559, "global_step": 308264, "epoch": 1834} {"train_loss": -11.586145401000977, "global_step": 308265, "epoch": 1834} {"train_loss": -11.662213325500488, "global_step": 308266, "epoch": 1834} {"train_loss": -11.784669876098633, "global_step": 308267, "epoch": 1834} {"train_loss": -11.965021133422852, "global_step": 308268, "epoch": 1834} {"train_loss": -11.988360404968262, "global_step": 308269, "epoch": 1834} {"train_loss": -11.94713306427002, "global_step": 308270, "epoch": 1834} {"train_loss": -11.78070068359375, "global_step": 308271, "epoch": 1834} {"train_loss": -12.047423362731934, "global_step": 308272, "epoch": 1834} {"train_loss": -11.702447891235352, "global_step": 308273, "epoch": 1834} {"train_loss": -12.287771224975586, "global_step": 308274, "epoch": 1834} {"train_loss": -11.603405952453613, "global_step": 308275, "epoch": 1834} {"train_loss": -12.113199234008789, "global_step": 308276, "epoch": 1834} {"train_loss": -12.12151050567627, "global_step": 308277, "epoch": 1834} {"train_loss": -12.132400512695312, "global_step": 308278, "epoch": 1834} {"train_loss": -11.756354735011147, "global_step": 308279, "epoch": 1834, "val_loss": 282307.875} {"train_loss": -12.206151008605957, "global_step": 308280, "epoch": 1835} {"train_loss": -11.935663223266602, "global_step": 308281, "epoch": 1835} {"train_loss": -12.168312072753906, "global_step": 308282, "epoch": 1835} {"train_loss": -12.180726051330566, "global_step": 308283, "epoch": 1835} {"train_loss": -12.039371490478516, "global_step": 308284, "epoch": 1835} {"train_loss": -12.186071395874023, "global_step": 308285, "epoch": 1835} {"train_loss": -12.153826713562012, "global_step": 308286, "epoch": 1835} {"train_loss": -12.294942855834961, "global_step": 308287, "epoch": 1835} {"train_loss": -12.060955047607422, "global_step": 308288, "epoch": 1835} {"train_loss": -11.817516326904297, "global_step": 308289, "epoch": 1835} {"train_loss": -12.113720893859863, "global_step": 308290, "epoch": 1835} {"train_loss": -12.218494415283203, "global_step": 308291, "epoch": 1835} {"train_loss": -12.28335952758789, "global_step": 308292, "epoch": 1835} {"train_loss": -12.057839393615723, "global_step": 308293, "epoch": 1835} {"train_loss": -12.227449417114258, "global_step": 308294, "epoch": 1835} {"train_loss": -12.030668258666992, "global_step": 308295, "epoch": 1835} {"train_loss": -12.147558212280273, "global_step": 308296, "epoch": 1835} {"train_loss": -12.24639892578125, "global_step": 308297, "epoch": 1835} {"train_loss": -12.282862663269043, "global_step": 308298, "epoch": 1835} {"train_loss": -12.058429718017578, "global_step": 308299, "epoch": 1835} {"train_loss": -12.214534759521484, "global_step": 308300, "epoch": 1835} {"train_loss": -11.99244499206543, "global_step": 308301, "epoch": 1835} {"train_loss": -12.194684982299805, "global_step": 308302, "epoch": 1835} {"train_loss": -12.151013374328613, "global_step": 308303, "epoch": 1835} {"train_loss": -12.229256629943848, "global_step": 308304, "epoch": 1835} {"train_loss": -12.179254531860352, "global_step": 308305, "epoch": 1835} {"train_loss": -12.191843032836914, "global_step": 308306, "epoch": 1835} {"train_loss": -12.27379035949707, "global_step": 308307, "epoch": 1835} {"train_loss": -12.316895484924316, "global_step": 308308, "epoch": 1835} {"train_loss": -12.468582153320312, "global_step": 308309, "epoch": 1835} {"train_loss": -12.48807144165039, "global_step": 308310, "epoch": 1835} {"train_loss": -12.3064546585083, "global_step": 308311, "epoch": 1835} {"train_loss": -12.544443130493164, "global_step": 308312, "epoch": 1835} {"train_loss": -12.383010864257812, "global_step": 308313, "epoch": 1835} {"train_loss": -12.25999641418457, "global_step": 308314, "epoch": 1835} {"train_loss": -12.62773323059082, "global_step": 308315, "epoch": 1835} {"train_loss": -12.33868408203125, "global_step": 308316, "epoch": 1835} {"train_loss": -12.360370635986328, "global_step": 308317, "epoch": 1835} {"train_loss": -12.451026916503906, "global_step": 308318, "epoch": 1835} {"train_loss": -12.52609920501709, "global_step": 308319, "epoch": 1835} {"train_loss": -12.242911338806152, "global_step": 308320, "epoch": 1835} {"train_loss": -12.533233642578125, "global_step": 308321, "epoch": 1835} {"train_loss": -12.40694522857666, "global_step": 308322, "epoch": 1835} {"train_loss": -12.128353118896484, "global_step": 308323, "epoch": 1835} {"train_loss": -12.358453750610352, "global_step": 308324, "epoch": 1835} {"train_loss": -12.568321228027344, "global_step": 308325, "epoch": 1835} {"train_loss": -12.39144515991211, "global_step": 308326, "epoch": 1835} {"train_loss": -12.19992446899414, "global_step": 308327, "epoch": 1835} {"train_loss": -12.366458892822266, "global_step": 308328, "epoch": 1835} {"train_loss": -12.428893089294434, "global_step": 308329, "epoch": 1835} {"train_loss": -12.29062557220459, "global_step": 308330, "epoch": 1835} {"train_loss": -12.466185569763184, "global_step": 308331, "epoch": 1835} {"train_loss": -12.356278419494629, "global_step": 308332, "epoch": 1835} {"train_loss": -12.118392944335938, "global_step": 308333, "epoch": 1835} {"train_loss": -12.368693351745605, "global_step": 308334, "epoch": 1835} {"train_loss": -12.39659309387207, "global_step": 308335, "epoch": 1835} {"train_loss": -12.541004180908203, "global_step": 308336, "epoch": 1835} {"train_loss": -12.431709289550781, "global_step": 308337, "epoch": 1835} {"train_loss": -12.356355667114258, "global_step": 308338, "epoch": 1835} {"train_loss": -12.649539947509766, "global_step": 308339, "epoch": 1835} {"train_loss": -12.340400695800781, "global_step": 308340, "epoch": 1835} {"train_loss": -12.126358032226562, "global_step": 308341, "epoch": 1835} {"train_loss": -12.53387451171875, "global_step": 308342, "epoch": 1835} {"train_loss": -12.104572296142578, "global_step": 308343, "epoch": 1835} {"train_loss": -12.479900360107422, "global_step": 308344, "epoch": 1835} {"train_loss": -12.223698616027832, "global_step": 308345, "epoch": 1835} {"train_loss": -12.484569549560547, "global_step": 308346, "epoch": 1835} {"train_loss": -12.311113357543945, "global_step": 308347, "epoch": 1835} {"train_loss": -12.107427597045898, "global_step": 308348, "epoch": 1835} {"train_loss": -12.08404541015625, "global_step": 308349, "epoch": 1835} {"train_loss": -12.354307174682617, "global_step": 308350, "epoch": 1835} {"train_loss": -12.339767456054688, "global_step": 308351, "epoch": 1835} {"train_loss": -12.237054824829102, "global_step": 308352, "epoch": 1835} {"train_loss": -12.305076599121094, "global_step": 308353, "epoch": 1835} {"train_loss": -12.239019393920898, "global_step": 308354, "epoch": 1835} {"train_loss": -12.120763778686523, "global_step": 308355, "epoch": 1835} {"train_loss": -12.209190368652344, "global_step": 308356, "epoch": 1835} {"train_loss": -12.049064636230469, "global_step": 308357, "epoch": 1835} {"train_loss": -12.301295280456543, "global_step": 308358, "epoch": 1835} {"train_loss": -12.264739990234375, "global_step": 308359, "epoch": 1835} {"train_loss": -12.546213150024414, "global_step": 308360, "epoch": 1835} {"train_loss": -12.186226844787598, "global_step": 308361, "epoch": 1835} {"train_loss": -12.085408210754395, "global_step": 308362, "epoch": 1835} {"train_loss": -12.186372756958008, "global_step": 308363, "epoch": 1835} {"train_loss": -11.83991813659668, "global_step": 308364, "epoch": 1835} {"train_loss": -11.628775596618652, "global_step": 308365, "epoch": 1835} {"train_loss": -10.706063270568848, "global_step": 308366, "epoch": 1835} {"train_loss": -10.424468040466309, "global_step": 308367, "epoch": 1835} {"train_loss": -11.842991828918457, "global_step": 308368, "epoch": 1835} {"train_loss": -10.135843276977539, "global_step": 308369, "epoch": 1835} {"train_loss": -9.95217227935791, "global_step": 308370, "epoch": 1835} {"train_loss": -10.72917366027832, "global_step": 308371, "epoch": 1835} {"train_loss": -8.380118370056152, "global_step": 308372, "epoch": 1835} {"train_loss": -7.588212013244629, "global_step": 308373, "epoch": 1835} {"train_loss": -10.169154167175293, "global_step": 308374, "epoch": 1835} {"train_loss": -5.864386558532715, "global_step": 308375, "epoch": 1835} {"train_loss": -6.248412132263184, "global_step": 308376, "epoch": 1835} {"train_loss": -5.376540184020996, "global_step": 308377, "epoch": 1835} {"train_loss": -5.126603126525879, "global_step": 308378, "epoch": 1835} {"train_loss": -5.389447212219238, "global_step": 308379, "epoch": 1835} {"train_loss": -5.907666206359863, "global_step": 308380, "epoch": 1835} {"train_loss": -6.194225311279297, "global_step": 308381, "epoch": 1835} {"train_loss": -5.5449934005737305, "global_step": 308382, "epoch": 1835} {"train_loss": -6.248408317565918, "global_step": 308383, "epoch": 1835} {"train_loss": -7.17426061630249, "global_step": 308384, "epoch": 1835} {"train_loss": -6.909940719604492, "global_step": 308385, "epoch": 1835} {"train_loss": -6.831474781036377, "global_step": 308386, "epoch": 1835} {"train_loss": -6.707816123962402, "global_step": 308387, "epoch": 1835} {"train_loss": -7.222177028656006, "global_step": 308388, "epoch": 1835} {"train_loss": -6.860594749450684, "global_step": 308389, "epoch": 1835} {"train_loss": -7.214313507080078, "global_step": 308390, "epoch": 1835} {"train_loss": -8.129612922668457, "global_step": 308391, "epoch": 1835} {"train_loss": -8.084651947021484, "global_step": 308392, "epoch": 1835} {"train_loss": -7.580548286437988, "global_step": 308393, "epoch": 1835} {"train_loss": -8.168388366699219, "global_step": 308394, "epoch": 1835} {"train_loss": -8.728755950927734, "global_step": 308395, "epoch": 1835} {"train_loss": -7.83054256439209, "global_step": 308396, "epoch": 1835} {"train_loss": -8.855948448181152, "global_step": 308397, "epoch": 1835} {"train_loss": -8.33973503112793, "global_step": 308398, "epoch": 1835} {"train_loss": -8.580883026123047, "global_step": 308399, "epoch": 1835} {"train_loss": -9.818363189697266, "global_step": 308400, "epoch": 1835} {"train_loss": -9.562152862548828, "global_step": 308401, "epoch": 1835} {"train_loss": -10.091545104980469, "global_step": 308402, "epoch": 1835} {"train_loss": -10.209342956542969, "global_step": 308403, "epoch": 1835} {"train_loss": -9.942765235900879, "global_step": 308404, "epoch": 1835} {"train_loss": -10.854787826538086, "global_step": 308405, "epoch": 1835} {"train_loss": -10.37887954711914, "global_step": 308406, "epoch": 1835} {"train_loss": -11.118040084838867, "global_step": 308407, "epoch": 1835} {"train_loss": -10.473502159118652, "global_step": 308408, "epoch": 1835} {"train_loss": -10.597067832946777, "global_step": 308409, "epoch": 1835} {"train_loss": -10.946853637695312, "global_step": 308410, "epoch": 1835} {"train_loss": -10.9930419921875, "global_step": 308411, "epoch": 1835} {"train_loss": -10.558547973632812, "global_step": 308412, "epoch": 1835} {"train_loss": -11.04040241241455, "global_step": 308413, "epoch": 1835} {"train_loss": -11.305667877197266, "global_step": 308414, "epoch": 1835} {"train_loss": -10.91154670715332, "global_step": 308415, "epoch": 1835} {"train_loss": -11.503101348876953, "global_step": 308416, "epoch": 1835} {"train_loss": -10.52042007446289, "global_step": 308417, "epoch": 1835} {"train_loss": -11.376914024353027, "global_step": 308418, "epoch": 1835} {"train_loss": -11.324714660644531, "global_step": 308419, "epoch": 1835} {"train_loss": -11.573654174804688, "global_step": 308420, "epoch": 1835} {"train_loss": -11.24705982208252, "global_step": 308421, "epoch": 1835} {"train_loss": -11.58020305633545, "global_step": 308422, "epoch": 1835} {"train_loss": -11.424793243408203, "global_step": 308423, "epoch": 1835} {"train_loss": -11.584409713745117, "global_step": 308424, "epoch": 1835} {"train_loss": -11.472678184509277, "global_step": 308425, "epoch": 1835} {"train_loss": -11.673933029174805, "global_step": 308426, "epoch": 1835} {"train_loss": -11.429547309875488, "global_step": 308427, "epoch": 1835} {"train_loss": -11.832897186279297, "global_step": 308428, "epoch": 1835} {"train_loss": -11.603178024291992, "global_step": 308429, "epoch": 1835} {"train_loss": -11.81665325164795, "global_step": 308430, "epoch": 1835} {"train_loss": -11.735403060913086, "global_step": 308431, "epoch": 1835} {"train_loss": -11.932991027832031, "global_step": 308432, "epoch": 1835} {"train_loss": -11.747058868408203, "global_step": 308433, "epoch": 1835} {"train_loss": -11.739057540893555, "global_step": 308434, "epoch": 1835} {"train_loss": -11.740615844726562, "global_step": 308435, "epoch": 1835} {"train_loss": -11.833273887634277, "global_step": 308436, "epoch": 1835} {"train_loss": -11.998294830322266, "global_step": 308437, "epoch": 1835} {"train_loss": -12.04096794128418, "global_step": 308438, "epoch": 1835} {"train_loss": -11.803786277770996, "global_step": 308439, "epoch": 1835} {"train_loss": -12.095200538635254, "global_step": 308440, "epoch": 1835} {"train_loss": -11.944389343261719, "global_step": 308441, "epoch": 1835} {"train_loss": -12.118754386901855, "global_step": 308442, "epoch": 1835} {"train_loss": -11.913167953491211, "global_step": 308443, "epoch": 1835} {"train_loss": -12.233600616455078, "global_step": 308444, "epoch": 1835} {"train_loss": -12.004755020141602, "global_step": 308445, "epoch": 1835} {"train_loss": -11.925278663635254, "global_step": 308446, "epoch": 1835} {"train_loss": -11.090322202160245, "global_step": 308447, "epoch": 1835, "val_loss": 276014.59375, "train_action_mse_error": 0.7292912006378174} {"train_loss": -11.984073638916016, "global_step": 308448, "epoch": 1836} {"train_loss": -12.061964988708496, "global_step": 308449, "epoch": 1836} {"train_loss": -12.218099594116211, "global_step": 308450, "epoch": 1836} {"train_loss": -11.904569625854492, "global_step": 308451, "epoch": 1836} {"train_loss": -11.956561088562012, "global_step": 308452, "epoch": 1836} {"train_loss": -12.228654861450195, "global_step": 308453, "epoch": 1836} {"train_loss": -12.034446716308594, "global_step": 308454, "epoch": 1836} {"train_loss": -12.162124633789062, "global_step": 308455, "epoch": 1836} {"train_loss": -12.12955093383789, "global_step": 308456, "epoch": 1836} {"train_loss": -12.084117889404297, "global_step": 308457, "epoch": 1836} {"train_loss": -11.984884262084961, "global_step": 308458, "epoch": 1836} {"train_loss": -12.056169509887695, "global_step": 308459, "epoch": 1836} {"train_loss": -12.036216735839844, "global_step": 308460, "epoch": 1836} {"train_loss": -11.911565780639648, "global_step": 308461, "epoch": 1836} {"train_loss": -12.249212265014648, "global_step": 308462, "epoch": 1836} {"train_loss": -12.125078201293945, "global_step": 308463, "epoch": 1836} {"train_loss": -12.192070960998535, "global_step": 308464, "epoch": 1836} {"train_loss": -12.219686508178711, "global_step": 308465, "epoch": 1836} {"train_loss": -12.300396919250488, "global_step": 308466, "epoch": 1836} {"train_loss": -12.241841316223145, "global_step": 308467, "epoch": 1836} {"train_loss": -12.213178634643555, "global_step": 308468, "epoch": 1836} {"train_loss": -12.133487701416016, "global_step": 308469, "epoch": 1836} {"train_loss": -12.244491577148438, "global_step": 308470, "epoch": 1836} {"train_loss": -12.10308837890625, "global_step": 308471, "epoch": 1836} {"train_loss": -12.014211654663086, "global_step": 308472, "epoch": 1836} {"train_loss": -12.410985946655273, "global_step": 308473, "epoch": 1836} {"train_loss": -12.18720817565918, "global_step": 308474, "epoch": 1836} {"train_loss": -12.234609603881836, "global_step": 308475, "epoch": 1836} {"train_loss": -12.263980865478516, "global_step": 308476, "epoch": 1836} {"train_loss": -12.155238151550293, "global_step": 308477, "epoch": 1836} {"train_loss": -12.212974548339844, "global_step": 308478, "epoch": 1836} {"train_loss": -12.209558486938477, "global_step": 308479, "epoch": 1836} {"train_loss": -11.93443775177002, "global_step": 308480, "epoch": 1836} {"train_loss": -11.916666984558105, "global_step": 308481, "epoch": 1836} {"train_loss": -11.081939697265625, "global_step": 308482, "epoch": 1836} {"train_loss": -11.981203079223633, "global_step": 308483, "epoch": 1836} {"train_loss": -11.656517028808594, "global_step": 308484, "epoch": 1836} {"train_loss": -11.596122741699219, "global_step": 308485, "epoch": 1836} {"train_loss": -10.667078971862793, "global_step": 308486, "epoch": 1836} {"train_loss": -11.502408981323242, "global_step": 308487, "epoch": 1836} {"train_loss": -11.11424732208252, "global_step": 308488, "epoch": 1836} {"train_loss": -11.094157218933105, "global_step": 308489, "epoch": 1836} {"train_loss": -11.208541870117188, "global_step": 308490, "epoch": 1836} {"train_loss": -11.448078155517578, "global_step": 308491, "epoch": 1836} {"train_loss": -11.152621269226074, "global_step": 308492, "epoch": 1836} {"train_loss": -11.887713432312012, "global_step": 308493, "epoch": 1836} {"train_loss": -11.675819396972656, "global_step": 308494, "epoch": 1836} {"train_loss": -11.524747848510742, "global_step": 308495, "epoch": 1836} {"train_loss": -11.93317699432373, "global_step": 308496, "epoch": 1836} {"train_loss": -11.524173736572266, "global_step": 308497, "epoch": 1836} {"train_loss": -12.024511337280273, "global_step": 308498, "epoch": 1836} {"train_loss": -11.498819351196289, "global_step": 308499, "epoch": 1836} {"train_loss": -11.433141708374023, "global_step": 308500, "epoch": 1836} {"train_loss": -11.135509490966797, "global_step": 308501, "epoch": 1836} {"train_loss": -11.506902694702148, "global_step": 308502, "epoch": 1836} {"train_loss": -10.908623695373535, "global_step": 308503, "epoch": 1836} {"train_loss": -11.636282920837402, "global_step": 308504, "epoch": 1836} {"train_loss": -11.38134765625, "global_step": 308505, "epoch": 1836} {"train_loss": -11.89416217803955, "global_step": 308506, "epoch": 1836} {"train_loss": -11.816874504089355, "global_step": 308507, "epoch": 1836} {"train_loss": -11.712262153625488, "global_step": 308508, "epoch": 1836} {"train_loss": -11.669376373291016, "global_step": 308509, "epoch": 1836} {"train_loss": -11.498403549194336, "global_step": 308510, "epoch": 1836} {"train_loss": -11.779472351074219, "global_step": 308511, "epoch": 1836} {"train_loss": -11.258201599121094, "global_step": 308512, "epoch": 1836} {"train_loss": -12.079919815063477, "global_step": 308513, "epoch": 1836} {"train_loss": -11.810867309570312, "global_step": 308514, "epoch": 1836} {"train_loss": -12.061113357543945, "global_step": 308515, "epoch": 1836} {"train_loss": -11.963168144226074, "global_step": 308516, "epoch": 1836} {"train_loss": -11.667797088623047, "global_step": 308517, "epoch": 1836} {"train_loss": -11.895706176757812, "global_step": 308518, "epoch": 1836} {"train_loss": -11.769081115722656, "global_step": 308519, "epoch": 1836} {"train_loss": -11.955280303955078, "global_step": 308520, "epoch": 1836} {"train_loss": -12.0518217086792, "global_step": 308521, "epoch": 1836} {"train_loss": -11.777168273925781, "global_step": 308522, "epoch": 1836} {"train_loss": -12.042158126831055, "global_step": 308523, "epoch": 1836} {"train_loss": -11.580757141113281, "global_step": 308524, "epoch": 1836} {"train_loss": -12.176755905151367, "global_step": 308525, "epoch": 1836} {"train_loss": -11.89194393157959, "global_step": 308526, "epoch": 1836} {"train_loss": -11.794151306152344, "global_step": 308527, "epoch": 1836} {"train_loss": -12.133142471313477, "global_step": 308528, "epoch": 1836} {"train_loss": -12.080439567565918, "global_step": 308529, "epoch": 1836} {"train_loss": -12.316886901855469, "global_step": 308530, "epoch": 1836} {"train_loss": -12.040091514587402, "global_step": 308531, "epoch": 1836} {"train_loss": -11.948583602905273, "global_step": 308532, "epoch": 1836} {"train_loss": -12.316032409667969, "global_step": 308533, "epoch": 1836} {"train_loss": -11.724217414855957, "global_step": 308534, "epoch": 1836} {"train_loss": -11.776189804077148, "global_step": 308535, "epoch": 1836} {"train_loss": -12.05282974243164, "global_step": 308536, "epoch": 1836} {"train_loss": -12.146734237670898, "global_step": 308537, "epoch": 1836} {"train_loss": -11.906086921691895, "global_step": 308538, "epoch": 1836} {"train_loss": -11.76813793182373, "global_step": 308539, "epoch": 1836} {"train_loss": -12.249916076660156, "global_step": 308540, "epoch": 1836} {"train_loss": -12.08331298828125, "global_step": 308541, "epoch": 1836} {"train_loss": -11.960838317871094, "global_step": 308542, "epoch": 1836} {"train_loss": -12.007055282592773, "global_step": 308543, "epoch": 1836} {"train_loss": -12.130550384521484, "global_step": 308544, "epoch": 1836} {"train_loss": -12.362653732299805, "global_step": 308545, "epoch": 1836} {"train_loss": -11.689702033996582, "global_step": 308546, "epoch": 1836} {"train_loss": -12.123294830322266, "global_step": 308547, "epoch": 1836} {"train_loss": -12.36375617980957, "global_step": 308548, "epoch": 1836} {"train_loss": -11.790008544921875, "global_step": 308549, "epoch": 1836} {"train_loss": -11.08242130279541, "global_step": 308550, "epoch": 1836} {"train_loss": -11.87521743774414, "global_step": 308551, "epoch": 1836} {"train_loss": -12.060150146484375, "global_step": 308552, "epoch": 1836} {"train_loss": -12.021928787231445, "global_step": 308553, "epoch": 1836} {"train_loss": -11.846059799194336, "global_step": 308554, "epoch": 1836} {"train_loss": -12.253751754760742, "global_step": 308555, "epoch": 1836} {"train_loss": -11.95055103302002, "global_step": 308556, "epoch": 1836} {"train_loss": -12.384511947631836, "global_step": 308557, "epoch": 1836} {"train_loss": -11.907794952392578, "global_step": 308558, "epoch": 1836} {"train_loss": -11.940528869628906, "global_step": 308559, "epoch": 1836} {"train_loss": -11.75920581817627, "global_step": 308560, "epoch": 1836} {"train_loss": -12.069917678833008, "global_step": 308561, "epoch": 1836} {"train_loss": -12.475177764892578, "global_step": 308562, "epoch": 1836} {"train_loss": -12.359537124633789, "global_step": 308563, "epoch": 1836} {"train_loss": -12.317239761352539, "global_step": 308564, "epoch": 1836} {"train_loss": -12.415189743041992, "global_step": 308565, "epoch": 1836} {"train_loss": -12.316211700439453, "global_step": 308566, "epoch": 1836} {"train_loss": -12.428313255310059, "global_step": 308567, "epoch": 1836} {"train_loss": -12.266735076904297, "global_step": 308568, "epoch": 1836} {"train_loss": -12.259979248046875, "global_step": 308569, "epoch": 1836} {"train_loss": -12.189157485961914, "global_step": 308570, "epoch": 1836} {"train_loss": -12.130167961120605, "global_step": 308571, "epoch": 1836} {"train_loss": -12.182046890258789, "global_step": 308572, "epoch": 1836} {"train_loss": -12.437786102294922, "global_step": 308573, "epoch": 1836} {"train_loss": -11.943687438964844, "global_step": 308574, "epoch": 1836} {"train_loss": -11.514311790466309, "global_step": 308575, "epoch": 1836} {"train_loss": -11.879863739013672, "global_step": 308576, "epoch": 1836} {"train_loss": -12.514595031738281, "global_step": 308577, "epoch": 1836} {"train_loss": -11.73176383972168, "global_step": 308578, "epoch": 1836} {"train_loss": -10.606584548950195, "global_step": 308579, "epoch": 1836} {"train_loss": -12.651383399963379, "global_step": 308580, "epoch": 1836} {"train_loss": -10.502298355102539, "global_step": 308581, "epoch": 1836} {"train_loss": -9.08304214477539, "global_step": 308582, "epoch": 1836} {"train_loss": -10.886899948120117, "global_step": 308583, "epoch": 1836} {"train_loss": -9.139915466308594, "global_step": 308584, "epoch": 1836} {"train_loss": -9.77122688293457, "global_step": 308585, "epoch": 1836} {"train_loss": -8.112196922302246, "global_step": 308586, "epoch": 1836} {"train_loss": -9.9812650680542, "global_step": 308587, "epoch": 1836} {"train_loss": -10.93964958190918, "global_step": 308588, "epoch": 1836} {"train_loss": -9.707727432250977, "global_step": 308589, "epoch": 1836} {"train_loss": -9.434534072875977, "global_step": 308590, "epoch": 1836} {"train_loss": -11.465923309326172, "global_step": 308591, "epoch": 1836} {"train_loss": -10.782271385192871, "global_step": 308592, "epoch": 1836} {"train_loss": -11.016066551208496, "global_step": 308593, "epoch": 1836} {"train_loss": -11.250663757324219, "global_step": 308594, "epoch": 1836} {"train_loss": -9.339874267578125, "global_step": 308595, "epoch": 1836} {"train_loss": -11.678504943847656, "global_step": 308596, "epoch": 1836} {"train_loss": -9.401582717895508, "global_step": 308597, "epoch": 1836} {"train_loss": -11.242084503173828, "global_step": 308598, "epoch": 1836} {"train_loss": -11.587638854980469, "global_step": 308599, "epoch": 1836} {"train_loss": -11.213600158691406, "global_step": 308600, "epoch": 1836} {"train_loss": -11.190485954284668, "global_step": 308601, "epoch": 1836} {"train_loss": -10.405532836914062, "global_step": 308602, "epoch": 1836} {"train_loss": -11.196979522705078, "global_step": 308603, "epoch": 1836} {"train_loss": -10.385900497436523, "global_step": 308604, "epoch": 1836} {"train_loss": -10.98930549621582, "global_step": 308605, "epoch": 1836} {"train_loss": -11.182063102722168, "global_step": 308606, "epoch": 1836} {"train_loss": -11.781526565551758, "global_step": 308607, "epoch": 1836} {"train_loss": -11.233839988708496, "global_step": 308608, "epoch": 1836} {"train_loss": -11.76077651977539, "global_step": 308609, "epoch": 1836} {"train_loss": -11.221843719482422, "global_step": 308610, "epoch": 1836} {"train_loss": -11.674178123474121, "global_step": 308611, "epoch": 1836} {"train_loss": -11.554793357849121, "global_step": 308612, "epoch": 1836} {"train_loss": -11.212301254272461, "global_step": 308613, "epoch": 1836} {"train_loss": -11.369121551513672, "global_step": 308614, "epoch": 1836} {"train_loss": -11.672328023683457, "global_step": 308615, "epoch": 1836, "val_loss": 272994.46875} {"train_loss": -11.814017295837402, "global_step": 308616, "epoch": 1837} {"train_loss": -11.704935073852539, "global_step": 308617, "epoch": 1837} {"train_loss": -11.484696388244629, "global_step": 308618, "epoch": 1837} {"train_loss": -11.400874137878418, "global_step": 308619, "epoch": 1837} {"train_loss": -11.847679138183594, "global_step": 308620, "epoch": 1837} {"train_loss": -11.567377090454102, "global_step": 308621, "epoch": 1837} {"train_loss": -11.811077117919922, "global_step": 308622, "epoch": 1837} {"train_loss": -11.811105728149414, "global_step": 308623, "epoch": 1837} {"train_loss": -11.955144882202148, "global_step": 308624, "epoch": 1837} {"train_loss": -12.059915542602539, "global_step": 308625, "epoch": 1837} {"train_loss": -11.840190887451172, "global_step": 308626, "epoch": 1837} {"train_loss": -11.892085075378418, "global_step": 308627, "epoch": 1837} {"train_loss": -11.925670623779297, "global_step": 308628, "epoch": 1837} {"train_loss": -12.109945297241211, "global_step": 308629, "epoch": 1837} {"train_loss": -12.027667999267578, "global_step": 308630, "epoch": 1837} {"train_loss": -12.121746063232422, "global_step": 308631, "epoch": 1837} {"train_loss": -12.154775619506836, "global_step": 308632, "epoch": 1837} {"train_loss": -11.590251922607422, "global_step": 308633, "epoch": 1837} {"train_loss": -12.114617347717285, "global_step": 308634, "epoch": 1837} {"train_loss": -12.084013938903809, "global_step": 308635, "epoch": 1837} {"train_loss": -12.07846450805664, "global_step": 308636, "epoch": 1837} {"train_loss": -11.980292320251465, "global_step": 308637, "epoch": 1837} {"train_loss": -11.945799827575684, "global_step": 308638, "epoch": 1837} {"train_loss": -11.993265151977539, "global_step": 308639, "epoch": 1837} {"train_loss": -11.856640815734863, "global_step": 308640, "epoch": 1837} {"train_loss": -12.068805694580078, "global_step": 308641, "epoch": 1837} {"train_loss": -11.89957332611084, "global_step": 308642, "epoch": 1837} {"train_loss": -11.728265762329102, "global_step": 308643, "epoch": 1837} {"train_loss": -12.336488723754883, "global_step": 308644, "epoch": 1837} {"train_loss": -11.904987335205078, "global_step": 308645, "epoch": 1837} {"train_loss": -11.955533981323242, "global_step": 308646, "epoch": 1837} {"train_loss": -12.19949722290039, "global_step": 308647, "epoch": 1837} {"train_loss": -11.920391082763672, "global_step": 308648, "epoch": 1837} {"train_loss": -12.021921157836914, "global_step": 308649, "epoch": 1837} {"train_loss": -11.378288269042969, "global_step": 308650, "epoch": 1837} {"train_loss": -11.791335105895996, "global_step": 308651, "epoch": 1837} {"train_loss": -11.628944396972656, "global_step": 308652, "epoch": 1837} {"train_loss": -12.167254447937012, "global_step": 308653, "epoch": 1837} {"train_loss": -11.960770606994629, "global_step": 308654, "epoch": 1837} {"train_loss": -12.02553939819336, "global_step": 308655, "epoch": 1837} {"train_loss": -11.823951721191406, "global_step": 308656, "epoch": 1837} {"train_loss": -11.947351455688477, "global_step": 308657, "epoch": 1837} {"train_loss": -11.86593246459961, "global_step": 308658, "epoch": 1837} {"train_loss": -11.870132446289062, "global_step": 308659, "epoch": 1837} {"train_loss": -12.203779220581055, "global_step": 308660, "epoch": 1837} {"train_loss": -11.604646682739258, "global_step": 308661, "epoch": 1837} {"train_loss": -12.305801391601562, "global_step": 308662, "epoch": 1837} {"train_loss": -11.905982971191406, "global_step": 308663, "epoch": 1837} {"train_loss": -11.766683578491211, "global_step": 308664, "epoch": 1837} {"train_loss": -12.151724815368652, "global_step": 308665, "epoch": 1837} {"train_loss": -11.666452407836914, "global_step": 308666, "epoch": 1837} {"train_loss": -12.128898620605469, "global_step": 308667, "epoch": 1837} {"train_loss": -11.823593139648438, "global_step": 308668, "epoch": 1837} {"train_loss": -11.585044860839844, "global_step": 308669, "epoch": 1837} {"train_loss": -11.987154006958008, "global_step": 308670, "epoch": 1837} {"train_loss": -11.621248245239258, "global_step": 308671, "epoch": 1837} {"train_loss": -11.868947982788086, "global_step": 308672, "epoch": 1837} {"train_loss": -11.596603393554688, "global_step": 308673, "epoch": 1837} {"train_loss": -11.937272071838379, "global_step": 308674, "epoch": 1837} {"train_loss": -11.44094181060791, "global_step": 308675, "epoch": 1837} {"train_loss": -12.15868091583252, "global_step": 308676, "epoch": 1837} {"train_loss": -11.788935661315918, "global_step": 308677, "epoch": 1837} {"train_loss": -11.869426727294922, "global_step": 308678, "epoch": 1837} {"train_loss": -11.747133255004883, "global_step": 308679, "epoch": 1837} {"train_loss": -11.878811836242676, "global_step": 308680, "epoch": 1837} {"train_loss": -11.457566261291504, "global_step": 308681, "epoch": 1837} {"train_loss": -11.861942291259766, "global_step": 308682, "epoch": 1837} {"train_loss": -11.103963851928711, "global_step": 308683, "epoch": 1837} {"train_loss": -12.247615814208984, "global_step": 308684, "epoch": 1837} {"train_loss": -11.514703750610352, "global_step": 308685, "epoch": 1837} {"train_loss": -12.174659729003906, "global_step": 308686, "epoch": 1837} {"train_loss": -11.449684143066406, "global_step": 308687, "epoch": 1837} {"train_loss": -12.302926063537598, "global_step": 308688, "epoch": 1837} {"train_loss": -11.692001342773438, "global_step": 308689, "epoch": 1837} {"train_loss": -11.844188690185547, "global_step": 308690, "epoch": 1837} {"train_loss": -11.813003540039062, "global_step": 308691, "epoch": 1837} {"train_loss": -12.084718704223633, "global_step": 308692, "epoch": 1837} {"train_loss": -12.245424270629883, "global_step": 308693, "epoch": 1837} {"train_loss": -12.019948959350586, "global_step": 308694, "epoch": 1837} {"train_loss": -12.31712818145752, "global_step": 308695, "epoch": 1837} {"train_loss": -12.206823348999023, "global_step": 308696, "epoch": 1837} {"train_loss": -12.22512149810791, "global_step": 308697, "epoch": 1837} {"train_loss": -12.098579406738281, "global_step": 308698, "epoch": 1837} {"train_loss": -12.333358764648438, "global_step": 308699, "epoch": 1837} {"train_loss": -12.52397346496582, "global_step": 308700, "epoch": 1837} {"train_loss": -12.32459831237793, "global_step": 308701, "epoch": 1837} {"train_loss": -12.123475074768066, "global_step": 308702, "epoch": 1837} {"train_loss": -12.351486206054688, "global_step": 308703, "epoch": 1837} {"train_loss": -12.283119201660156, "global_step": 308704, "epoch": 1837} {"train_loss": -12.344727516174316, "global_step": 308705, "epoch": 1837} {"train_loss": -12.241621017456055, "global_step": 308706, "epoch": 1837} {"train_loss": -12.273957252502441, "global_step": 308707, "epoch": 1837} {"train_loss": -12.329171180725098, "global_step": 308708, "epoch": 1837} {"train_loss": -12.327651023864746, "global_step": 308709, "epoch": 1837} {"train_loss": -12.199217796325684, "global_step": 308710, "epoch": 1837} {"train_loss": -12.333414077758789, "global_step": 308711, "epoch": 1837} {"train_loss": -12.209169387817383, "global_step": 308712, "epoch": 1837} {"train_loss": -12.063300132751465, "global_step": 308713, "epoch": 1837} {"train_loss": -12.317913055419922, "global_step": 308714, "epoch": 1837} {"train_loss": -12.068758964538574, "global_step": 308715, "epoch": 1837} {"train_loss": -12.373125076293945, "global_step": 308716, "epoch": 1837} {"train_loss": -12.187870025634766, "global_step": 308717, "epoch": 1837} {"train_loss": -11.893526077270508, "global_step": 308718, "epoch": 1837} {"train_loss": -12.318638801574707, "global_step": 308719, "epoch": 1837} {"train_loss": -11.79606819152832, "global_step": 308720, "epoch": 1837} {"train_loss": -12.024459838867188, "global_step": 308721, "epoch": 1837} {"train_loss": -12.338570594787598, "global_step": 308722, "epoch": 1837} {"train_loss": -12.194084167480469, "global_step": 308723, "epoch": 1837} {"train_loss": -12.449447631835938, "global_step": 308724, "epoch": 1837} {"train_loss": -12.308911323547363, "global_step": 308725, "epoch": 1837} {"train_loss": -12.17210578918457, "global_step": 308726, "epoch": 1837} {"train_loss": -12.433611869812012, "global_step": 308727, "epoch": 1837} {"train_loss": -12.280641555786133, "global_step": 308728, "epoch": 1837} {"train_loss": -11.892601013183594, "global_step": 308729, "epoch": 1837} {"train_loss": -12.102916717529297, "global_step": 308730, "epoch": 1837} {"train_loss": -12.27815055847168, "global_step": 308731, "epoch": 1837} {"train_loss": -12.378204345703125, "global_step": 308732, "epoch": 1837} {"train_loss": -12.352704048156738, "global_step": 308733, "epoch": 1837} {"train_loss": -11.664958000183105, "global_step": 308734, "epoch": 1837} {"train_loss": -12.084487915039062, "global_step": 308735, "epoch": 1837} {"train_loss": -11.966550827026367, "global_step": 308736, "epoch": 1837} {"train_loss": -12.221899032592773, "global_step": 308737, "epoch": 1837} {"train_loss": -11.881389617919922, "global_step": 308738, "epoch": 1837} {"train_loss": -11.840105056762695, "global_step": 308739, "epoch": 1837} {"train_loss": -11.461799621582031, "global_step": 308740, "epoch": 1837} {"train_loss": -12.136868476867676, "global_step": 308741, "epoch": 1837} {"train_loss": -12.151060104370117, "global_step": 308742, "epoch": 1837} {"train_loss": -11.833454132080078, "global_step": 308743, "epoch": 1837} {"train_loss": -11.636764526367188, "global_step": 308744, "epoch": 1837} {"train_loss": -12.209989547729492, "global_step": 308745, "epoch": 1837} {"train_loss": -11.308185577392578, "global_step": 308746, "epoch": 1837} {"train_loss": -11.311354637145996, "global_step": 308747, "epoch": 1837} {"train_loss": -11.759506225585938, "global_step": 308748, "epoch": 1837} {"train_loss": -10.565878868103027, "global_step": 308749, "epoch": 1837} {"train_loss": -9.583503723144531, "global_step": 308750, "epoch": 1837} {"train_loss": -11.550310134887695, "global_step": 308751, "epoch": 1837} {"train_loss": -11.889175415039062, "global_step": 308752, "epoch": 1837} {"train_loss": -9.449472427368164, "global_step": 308753, "epoch": 1837} {"train_loss": -11.513057708740234, "global_step": 308754, "epoch": 1837} {"train_loss": -11.764780044555664, "global_step": 308755, "epoch": 1837} {"train_loss": -11.30087661743164, "global_step": 308756, "epoch": 1837} {"train_loss": -11.823447227478027, "global_step": 308757, "epoch": 1837} {"train_loss": -11.1307373046875, "global_step": 308758, "epoch": 1837} {"train_loss": -11.433494567871094, "global_step": 308759, "epoch": 1837} {"train_loss": -11.379874229431152, "global_step": 308760, "epoch": 1837} {"train_loss": -11.461151123046875, "global_step": 308761, "epoch": 1837} {"train_loss": -11.414724349975586, "global_step": 308762, "epoch": 1837} {"train_loss": -11.66706657409668, "global_step": 308763, "epoch": 1837} {"train_loss": -11.411252975463867, "global_step": 308764, "epoch": 1837} {"train_loss": -11.787469863891602, "global_step": 308765, "epoch": 1837} {"train_loss": -11.792594909667969, "global_step": 308766, "epoch": 1837} {"train_loss": -11.842741012573242, "global_step": 308767, "epoch": 1837} {"train_loss": -11.645797729492188, "global_step": 308768, "epoch": 1837} {"train_loss": -11.837484359741211, "global_step": 308769, "epoch": 1837} {"train_loss": -11.77645206451416, "global_step": 308770, "epoch": 1837} {"train_loss": -11.866342544555664, "global_step": 308771, "epoch": 1837} {"train_loss": -11.730734825134277, "global_step": 308772, "epoch": 1837} {"train_loss": -12.093429565429688, "global_step": 308773, "epoch": 1837} {"train_loss": -11.234466552734375, "global_step": 308774, "epoch": 1837} {"train_loss": -11.44663143157959, "global_step": 308775, "epoch": 1837} {"train_loss": -11.861194610595703, "global_step": 308776, "epoch": 1837} {"train_loss": -11.726053237915039, "global_step": 308777, "epoch": 1837} {"train_loss": -11.685622215270996, "global_step": 308778, "epoch": 1837} {"train_loss": -12.11923885345459, "global_step": 308779, "epoch": 1837} {"train_loss": -11.948454856872559, "global_step": 308780, "epoch": 1837} {"train_loss": -11.918879508972168, "global_step": 308781, "epoch": 1837} {"train_loss": -11.892860412597656, "global_step": 308782, "epoch": 1837} {"train_loss": -11.885362619445438, "global_step": 308783, "epoch": 1837, "val_loss": 277069.34375} {"train_loss": -11.97439193725586, "global_step": 308784, "epoch": 1838} {"train_loss": -11.75900936126709, "global_step": 308785, "epoch": 1838} {"train_loss": -12.263751983642578, "global_step": 308786, "epoch": 1838} {"train_loss": -12.284994125366211, "global_step": 308787, "epoch": 1838} {"train_loss": -12.185525894165039, "global_step": 308788, "epoch": 1838} {"train_loss": -11.855552673339844, "global_step": 308789, "epoch": 1838} {"train_loss": -11.977017402648926, "global_step": 308790, "epoch": 1838} {"train_loss": -11.943929672241211, "global_step": 308791, "epoch": 1838} {"train_loss": -11.951692581176758, "global_step": 308792, "epoch": 1838} {"train_loss": -12.224088668823242, "global_step": 308793, "epoch": 1838} {"train_loss": -11.947749137878418, "global_step": 308794, "epoch": 1838} {"train_loss": -12.203709602355957, "global_step": 308795, "epoch": 1838} {"train_loss": -11.934601783752441, "global_step": 308796, "epoch": 1838} {"train_loss": -11.63111686706543, "global_step": 308797, "epoch": 1838} {"train_loss": -11.91571044921875, "global_step": 308798, "epoch": 1838} {"train_loss": -11.939523696899414, "global_step": 308799, "epoch": 1838} {"train_loss": -11.88603401184082, "global_step": 308800, "epoch": 1838} {"train_loss": -11.855491638183594, "global_step": 308801, "epoch": 1838} {"train_loss": -11.964120864868164, "global_step": 308802, "epoch": 1838} {"train_loss": -11.513622283935547, "global_step": 308803, "epoch": 1838} {"train_loss": -12.078411102294922, "global_step": 308804, "epoch": 1838} {"train_loss": -11.65011978149414, "global_step": 308805, "epoch": 1838} {"train_loss": -12.060303688049316, "global_step": 308806, "epoch": 1838} {"train_loss": -11.933023452758789, "global_step": 308807, "epoch": 1838} {"train_loss": -12.159139633178711, "global_step": 308808, "epoch": 1838} {"train_loss": -11.201050758361816, "global_step": 308809, "epoch": 1838} {"train_loss": -11.917318344116211, "global_step": 308810, "epoch": 1838} {"train_loss": -11.486587524414062, "global_step": 308811, "epoch": 1838} {"train_loss": -11.437267303466797, "global_step": 308812, "epoch": 1838} {"train_loss": -12.233685493469238, "global_step": 308813, "epoch": 1838} {"train_loss": -11.8019380569458, "global_step": 308814, "epoch": 1838} {"train_loss": -11.714374542236328, "global_step": 308815, "epoch": 1838} {"train_loss": -11.850286483764648, "global_step": 308816, "epoch": 1838} {"train_loss": -11.830663681030273, "global_step": 308817, "epoch": 1838} {"train_loss": -11.785726547241211, "global_step": 308818, "epoch": 1838} {"train_loss": -12.149192810058594, "global_step": 308819, "epoch": 1838} {"train_loss": -12.06769847869873, "global_step": 308820, "epoch": 1838} {"train_loss": -12.020198822021484, "global_step": 308821, "epoch": 1838} {"train_loss": -12.270214080810547, "global_step": 308822, "epoch": 1838} {"train_loss": -11.829410552978516, "global_step": 308823, "epoch": 1838} {"train_loss": -12.085870742797852, "global_step": 308824, "epoch": 1838} {"train_loss": -11.691017150878906, "global_step": 308825, "epoch": 1838} {"train_loss": -11.880965232849121, "global_step": 308826, "epoch": 1838} {"train_loss": -11.407060623168945, "global_step": 308827, "epoch": 1838} {"train_loss": -12.115763664245605, "global_step": 308828, "epoch": 1838} {"train_loss": -11.425865173339844, "global_step": 308829, "epoch": 1838} {"train_loss": -12.185622215270996, "global_step": 308830, "epoch": 1838} {"train_loss": -12.017951011657715, "global_step": 308831, "epoch": 1838} {"train_loss": -11.444851875305176, "global_step": 308832, "epoch": 1838} {"train_loss": -11.466714859008789, "global_step": 308833, "epoch": 1838} {"train_loss": -11.03547191619873, "global_step": 308834, "epoch": 1838} {"train_loss": -11.248821258544922, "global_step": 308835, "epoch": 1838} {"train_loss": -11.095161437988281, "global_step": 308836, "epoch": 1838} {"train_loss": -11.567878723144531, "global_step": 308837, "epoch": 1838} {"train_loss": -11.373233795166016, "global_step": 308838, "epoch": 1838} {"train_loss": -12.097728729248047, "global_step": 308839, "epoch": 1838} {"train_loss": -11.4768705368042, "global_step": 308840, "epoch": 1838} {"train_loss": -12.00468635559082, "global_step": 308841, "epoch": 1838} {"train_loss": -12.062230110168457, "global_step": 308842, "epoch": 1838} {"train_loss": -11.680998802185059, "global_step": 308843, "epoch": 1838} {"train_loss": -12.095809936523438, "global_step": 308844, "epoch": 1838} {"train_loss": -11.51778793334961, "global_step": 308845, "epoch": 1838} {"train_loss": -11.703380584716797, "global_step": 308846, "epoch": 1838} {"train_loss": -11.73801040649414, "global_step": 308847, "epoch": 1838} {"train_loss": -11.534123420715332, "global_step": 308848, "epoch": 1838} {"train_loss": -10.909818649291992, "global_step": 308849, "epoch": 1838} {"train_loss": -12.081989288330078, "global_step": 308850, "epoch": 1838} {"train_loss": -11.150792121887207, "global_step": 308851, "epoch": 1838} {"train_loss": -12.054960250854492, "global_step": 308852, "epoch": 1838} {"train_loss": -11.754642486572266, "global_step": 308853, "epoch": 1838} {"train_loss": -11.626687049865723, "global_step": 308854, "epoch": 1838} {"train_loss": -11.814334869384766, "global_step": 308855, "epoch": 1838} {"train_loss": -11.777048110961914, "global_step": 308856, "epoch": 1838} {"train_loss": -11.87491226196289, "global_step": 308857, "epoch": 1838} {"train_loss": -11.728090286254883, "global_step": 308858, "epoch": 1838} {"train_loss": -11.680331230163574, "global_step": 308859, "epoch": 1838} {"train_loss": -12.04210090637207, "global_step": 308860, "epoch": 1838} {"train_loss": -12.241203308105469, "global_step": 308861, "epoch": 1838} {"train_loss": -12.044260025024414, "global_step": 308862, "epoch": 1838} {"train_loss": -11.510342597961426, "global_step": 308863, "epoch": 1838} {"train_loss": -12.212831497192383, "global_step": 308864, "epoch": 1838} {"train_loss": -11.351722717285156, "global_step": 308865, "epoch": 1838} {"train_loss": -12.240360260009766, "global_step": 308866, "epoch": 1838} {"train_loss": -11.746109008789062, "global_step": 308867, "epoch": 1838} {"train_loss": -11.955106735229492, "global_step": 308868, "epoch": 1838} {"train_loss": -11.92741584777832, "global_step": 308869, "epoch": 1838} {"train_loss": -11.912671089172363, "global_step": 308870, "epoch": 1838} {"train_loss": -12.097634315490723, "global_step": 308871, "epoch": 1838} {"train_loss": -11.99802017211914, "global_step": 308872, "epoch": 1838} {"train_loss": -12.21117877960205, "global_step": 308873, "epoch": 1838} {"train_loss": -11.71469497680664, "global_step": 308874, "epoch": 1838} {"train_loss": -11.65863037109375, "global_step": 308875, "epoch": 1838} {"train_loss": -11.741006851196289, "global_step": 308876, "epoch": 1838} {"train_loss": -11.734282493591309, "global_step": 308877, "epoch": 1838} {"train_loss": -11.792349815368652, "global_step": 308878, "epoch": 1838} {"train_loss": -11.135648727416992, "global_step": 308879, "epoch": 1838} {"train_loss": -12.092364311218262, "global_step": 308880, "epoch": 1838} {"train_loss": -11.738155364990234, "global_step": 308881, "epoch": 1838} {"train_loss": -11.662195205688477, "global_step": 308882, "epoch": 1838} {"train_loss": -12.044748306274414, "global_step": 308883, "epoch": 1838} {"train_loss": -11.536636352539062, "global_step": 308884, "epoch": 1838} {"train_loss": -11.92431926727295, "global_step": 308885, "epoch": 1838} {"train_loss": -11.895097732543945, "global_step": 308886, "epoch": 1838} {"train_loss": -11.560073852539062, "global_step": 308887, "epoch": 1838} {"train_loss": -12.222152709960938, "global_step": 308888, "epoch": 1838} {"train_loss": -11.160215377807617, "global_step": 308889, "epoch": 1838} {"train_loss": -11.486459732055664, "global_step": 308890, "epoch": 1838} {"train_loss": -12.002723693847656, "global_step": 308891, "epoch": 1838} {"train_loss": -11.38406753540039, "global_step": 308892, "epoch": 1838} {"train_loss": -11.920522689819336, "global_step": 308893, "epoch": 1838} {"train_loss": -11.248915672302246, "global_step": 308894, "epoch": 1838} {"train_loss": -11.638699531555176, "global_step": 308895, "epoch": 1838} {"train_loss": -11.979430198669434, "global_step": 308896, "epoch": 1838} {"train_loss": -11.449407577514648, "global_step": 308897, "epoch": 1838} {"train_loss": -11.98824405670166, "global_step": 308898, "epoch": 1838} {"train_loss": -11.375435829162598, "global_step": 308899, "epoch": 1838} {"train_loss": -11.925628662109375, "global_step": 308900, "epoch": 1838} {"train_loss": -11.563697814941406, "global_step": 308901, "epoch": 1838} {"train_loss": -11.700138092041016, "global_step": 308902, "epoch": 1838} {"train_loss": -12.338783264160156, "global_step": 308903, "epoch": 1838} {"train_loss": -11.604681968688965, "global_step": 308904, "epoch": 1838} {"train_loss": -12.007980346679688, "global_step": 308905, "epoch": 1838} {"train_loss": -11.922468185424805, "global_step": 308906, "epoch": 1838} {"train_loss": -12.123785018920898, "global_step": 308907, "epoch": 1838} {"train_loss": -11.863383293151855, "global_step": 308908, "epoch": 1838} {"train_loss": -11.934181213378906, "global_step": 308909, "epoch": 1838} {"train_loss": -12.109161376953125, "global_step": 308910, "epoch": 1838} {"train_loss": -11.78687572479248, "global_step": 308911, "epoch": 1838} {"train_loss": -12.005796432495117, "global_step": 308912, "epoch": 1838} {"train_loss": -11.926202774047852, "global_step": 308913, "epoch": 1838} {"train_loss": -12.320965766906738, "global_step": 308914, "epoch": 1838} {"train_loss": -11.918641090393066, "global_step": 308915, "epoch": 1838} {"train_loss": -11.960859298706055, "global_step": 308916, "epoch": 1838} {"train_loss": -12.226838111877441, "global_step": 308917, "epoch": 1838} {"train_loss": -11.782729148864746, "global_step": 308918, "epoch": 1838} {"train_loss": -12.333024978637695, "global_step": 308919, "epoch": 1838} {"train_loss": -12.197351455688477, "global_step": 308920, "epoch": 1838} {"train_loss": -12.02968978881836, "global_step": 308921, "epoch": 1838} {"train_loss": -12.389701843261719, "global_step": 308922, "epoch": 1838} {"train_loss": -12.067273139953613, "global_step": 308923, "epoch": 1838} {"train_loss": -11.937408447265625, "global_step": 308924, "epoch": 1838} {"train_loss": -12.38812255859375, "global_step": 308925, "epoch": 1838} {"train_loss": -11.825998306274414, "global_step": 308926, "epoch": 1838} {"train_loss": -12.25881576538086, "global_step": 308927, "epoch": 1838} {"train_loss": -12.333049774169922, "global_step": 308928, "epoch": 1838} {"train_loss": -12.22724723815918, "global_step": 308929, "epoch": 1838} {"train_loss": -12.271444320678711, "global_step": 308930, "epoch": 1838} {"train_loss": -11.809700965881348, "global_step": 308931, "epoch": 1838} {"train_loss": -12.30754280090332, "global_step": 308932, "epoch": 1838} {"train_loss": -12.086376190185547, "global_step": 308933, "epoch": 1838} {"train_loss": -11.503204345703125, "global_step": 308934, "epoch": 1838} {"train_loss": -11.815362930297852, "global_step": 308935, "epoch": 1838} {"train_loss": -12.353155136108398, "global_step": 308936, "epoch": 1838} {"train_loss": -11.972769737243652, "global_step": 308937, "epoch": 1838} {"train_loss": -12.073326110839844, "global_step": 308938, "epoch": 1838} {"train_loss": -11.92033576965332, "global_step": 308939, "epoch": 1838} {"train_loss": -12.183591842651367, "global_step": 308940, "epoch": 1838} {"train_loss": -11.829938888549805, "global_step": 308941, "epoch": 1838} {"train_loss": -11.983561515808105, "global_step": 308942, "epoch": 1838} {"train_loss": -11.832186698913574, "global_step": 308943, "epoch": 1838} {"train_loss": -11.439355850219727, "global_step": 308944, "epoch": 1838} {"train_loss": -12.06915283203125, "global_step": 308945, "epoch": 1838} {"train_loss": -11.378805160522461, "global_step": 308946, "epoch": 1838} {"train_loss": -11.920063018798828, "global_step": 308947, "epoch": 1838} {"train_loss": -11.857080459594727, "global_step": 308948, "epoch": 1838} {"train_loss": -11.958368301391602, "global_step": 308949, "epoch": 1838} {"train_loss": -12.0558500289917, "global_step": 308950, "epoch": 1838} {"train_loss": -11.859363022304716, "global_step": 308951, "epoch": 1838, "val_loss": 279362.84375} {"train_loss": -12.246225357055664, "global_step": 308952, "epoch": 1839} {"train_loss": -11.706316947937012, "global_step": 308953, "epoch": 1839} {"train_loss": -11.959779739379883, "global_step": 308954, "epoch": 1839} {"train_loss": -12.033868789672852, "global_step": 308955, "epoch": 1839} {"train_loss": -12.257041931152344, "global_step": 308956, "epoch": 1839} {"train_loss": -11.669516563415527, "global_step": 308957, "epoch": 1839} {"train_loss": -11.80125617980957, "global_step": 308958, "epoch": 1839} {"train_loss": -11.997148513793945, "global_step": 308959, "epoch": 1839} {"train_loss": -11.58303451538086, "global_step": 308960, "epoch": 1839} {"train_loss": -11.5020751953125, "global_step": 308961, "epoch": 1839} {"train_loss": -12.194723129272461, "global_step": 308962, "epoch": 1839} {"train_loss": -11.734994888305664, "global_step": 308963, "epoch": 1839} {"train_loss": -11.48907470703125, "global_step": 308964, "epoch": 1839} {"train_loss": -11.481986045837402, "global_step": 308965, "epoch": 1839} {"train_loss": -10.969270706176758, "global_step": 308966, "epoch": 1839} {"train_loss": -11.650697708129883, "global_step": 308967, "epoch": 1839} {"train_loss": -11.676959991455078, "global_step": 308968, "epoch": 1839} {"train_loss": -11.544148445129395, "global_step": 308969, "epoch": 1839} {"train_loss": -11.454742431640625, "global_step": 308970, "epoch": 1839} {"train_loss": -11.61620807647705, "global_step": 308971, "epoch": 1839} {"train_loss": -11.992416381835938, "global_step": 308972, "epoch": 1839} {"train_loss": -11.51687240600586, "global_step": 308973, "epoch": 1839} {"train_loss": -10.783020973205566, "global_step": 308974, "epoch": 1839} {"train_loss": -12.285578727722168, "global_step": 308975, "epoch": 1839} {"train_loss": -11.395875930786133, "global_step": 308976, "epoch": 1839} {"train_loss": -10.541671752929688, "global_step": 308977, "epoch": 1839} {"train_loss": -11.89553165435791, "global_step": 308978, "epoch": 1839} {"train_loss": -10.8504056930542, "global_step": 308979, "epoch": 1839} {"train_loss": -9.346808433532715, "global_step": 308980, "epoch": 1839} {"train_loss": -11.25661849975586, "global_step": 308981, "epoch": 1839} {"train_loss": -8.75486946105957, "global_step": 308982, "epoch": 1839} {"train_loss": -11.448774337768555, "global_step": 308983, "epoch": 1839} {"train_loss": -7.628314971923828, "global_step": 308984, "epoch": 1839} {"train_loss": -7.6389312744140625, "global_step": 308985, "epoch": 1839} {"train_loss": -7.999330997467041, "global_step": 308986, "epoch": 1839} {"train_loss": -7.533816814422607, "global_step": 308987, "epoch": 1839} {"train_loss": -8.591899871826172, "global_step": 308988, "epoch": 1839} {"train_loss": -8.358823776245117, "global_step": 308989, "epoch": 1839} {"train_loss": -8.798120498657227, "global_step": 308990, "epoch": 1839} {"train_loss": -9.11141586303711, "global_step": 308991, "epoch": 1839} {"train_loss": -7.440622806549072, "global_step": 308992, "epoch": 1839} {"train_loss": -8.926384925842285, "global_step": 308993, "epoch": 1839} {"train_loss": -9.827046394348145, "global_step": 308994, "epoch": 1839} {"train_loss": -9.694887161254883, "global_step": 308995, "epoch": 1839} {"train_loss": -10.74653434753418, "global_step": 308996, "epoch": 1839} {"train_loss": -9.843503952026367, "global_step": 308997, "epoch": 1839} {"train_loss": -11.19215202331543, "global_step": 308998, "epoch": 1839} {"train_loss": -10.001408576965332, "global_step": 308999, "epoch": 1839} {"train_loss": -10.76303482055664, "global_step": 309000, "epoch": 1839} {"train_loss": -10.195940017700195, "global_step": 309001, "epoch": 1839} {"train_loss": -10.130838394165039, "global_step": 309002, "epoch": 1839} {"train_loss": -10.832486152648926, "global_step": 309003, "epoch": 1839} {"train_loss": -11.15745735168457, "global_step": 309004, "epoch": 1839} {"train_loss": -10.935855865478516, "global_step": 309005, "epoch": 1839} {"train_loss": -11.442798614501953, "global_step": 309006, "epoch": 1839} {"train_loss": -11.439428329467773, "global_step": 309007, "epoch": 1839} {"train_loss": -11.382345199584961, "global_step": 309008, "epoch": 1839} {"train_loss": -11.450087547302246, "global_step": 309009, "epoch": 1839} {"train_loss": -11.11293888092041, "global_step": 309010, "epoch": 1839} {"train_loss": -11.559378623962402, "global_step": 309011, "epoch": 1839} {"train_loss": -11.345541000366211, "global_step": 309012, "epoch": 1839} {"train_loss": -11.519010543823242, "global_step": 309013, "epoch": 1839} {"train_loss": -11.61054515838623, "global_step": 309014, "epoch": 1839} {"train_loss": -11.776026725769043, "global_step": 309015, "epoch": 1839} {"train_loss": -11.725295066833496, "global_step": 309016, "epoch": 1839} {"train_loss": -11.424272537231445, "global_step": 309017, "epoch": 1839} {"train_loss": -11.94310474395752, "global_step": 309018, "epoch": 1839} {"train_loss": -11.927855491638184, "global_step": 309019, "epoch": 1839} {"train_loss": -11.665905952453613, "global_step": 309020, "epoch": 1839} {"train_loss": -11.873588562011719, "global_step": 309021, "epoch": 1839} {"train_loss": -11.861270904541016, "global_step": 309022, "epoch": 1839} {"train_loss": -11.992897033691406, "global_step": 309023, "epoch": 1839} {"train_loss": -11.952860832214355, "global_step": 309024, "epoch": 1839} {"train_loss": -11.809174537658691, "global_step": 309025, "epoch": 1839} {"train_loss": -11.820154190063477, "global_step": 309026, "epoch": 1839} {"train_loss": -12.046195030212402, "global_step": 309027, "epoch": 1839} {"train_loss": -11.787199020385742, "global_step": 309028, "epoch": 1839} {"train_loss": -12.014829635620117, "global_step": 309029, "epoch": 1839} {"train_loss": -12.046915054321289, "global_step": 309030, "epoch": 1839} {"train_loss": -12.064567565917969, "global_step": 309031, "epoch": 1839} {"train_loss": -11.90407657623291, "global_step": 309032, "epoch": 1839} {"train_loss": -12.140012741088867, "global_step": 309033, "epoch": 1839} {"train_loss": -11.727678298950195, "global_step": 309034, "epoch": 1839} {"train_loss": -11.934104919433594, "global_step": 309035, "epoch": 1839} {"train_loss": -12.003793716430664, "global_step": 309036, "epoch": 1839} {"train_loss": -11.886311531066895, "global_step": 309037, "epoch": 1839} {"train_loss": -12.056010246276855, "global_step": 309038, "epoch": 1839} {"train_loss": -12.105072021484375, "global_step": 309039, "epoch": 1839} {"train_loss": -12.091577529907227, "global_step": 309040, "epoch": 1839} {"train_loss": -12.138381958007812, "global_step": 309041, "epoch": 1839} {"train_loss": -12.262594223022461, "global_step": 309042, "epoch": 1839} {"train_loss": -12.214954376220703, "global_step": 309043, "epoch": 1839} {"train_loss": -12.12182331085205, "global_step": 309044, "epoch": 1839} {"train_loss": -12.163307189941406, "global_step": 309045, "epoch": 1839} {"train_loss": -12.186393737792969, "global_step": 309046, "epoch": 1839} {"train_loss": -12.14079475402832, "global_step": 309047, "epoch": 1839} {"train_loss": -12.24256420135498, "global_step": 309048, "epoch": 1839} {"train_loss": -12.227790832519531, "global_step": 309049, "epoch": 1839} {"train_loss": -12.238204956054688, "global_step": 309050, "epoch": 1839} {"train_loss": -12.466602325439453, "global_step": 309051, "epoch": 1839} {"train_loss": -12.4413423538208, "global_step": 309052, "epoch": 1839} {"train_loss": -12.302511215209961, "global_step": 309053, "epoch": 1839} {"train_loss": -12.192102432250977, "global_step": 309054, "epoch": 1839} {"train_loss": -12.433588027954102, "global_step": 309055, "epoch": 1839} {"train_loss": -12.35600471496582, "global_step": 309056, "epoch": 1839} {"train_loss": -12.295341491699219, "global_step": 309057, "epoch": 1839} {"train_loss": -12.24854850769043, "global_step": 309058, "epoch": 1839} {"train_loss": -12.074739456176758, "global_step": 309059, "epoch": 1839} {"train_loss": -12.334097862243652, "global_step": 309060, "epoch": 1839} {"train_loss": -12.210426330566406, "global_step": 309061, "epoch": 1839} {"train_loss": -12.107503890991211, "global_step": 309062, "epoch": 1839} {"train_loss": -12.277056694030762, "global_step": 309063, "epoch": 1839} {"train_loss": -12.1846284866333, "global_step": 309064, "epoch": 1839} {"train_loss": -11.938562393188477, "global_step": 309065, "epoch": 1839} {"train_loss": -12.384483337402344, "global_step": 309066, "epoch": 1839} {"train_loss": -12.401098251342773, "global_step": 309067, "epoch": 1839} {"train_loss": -12.0615816116333, "global_step": 309068, "epoch": 1839} {"train_loss": -11.959264755249023, "global_step": 309069, "epoch": 1839} {"train_loss": -12.420171737670898, "global_step": 309070, "epoch": 1839} {"train_loss": -12.329085350036621, "global_step": 309071, "epoch": 1839} {"train_loss": -12.243518829345703, "global_step": 309072, "epoch": 1839} {"train_loss": -12.572826385498047, "global_step": 309073, "epoch": 1839} {"train_loss": -12.401612281799316, "global_step": 309074, "epoch": 1839} {"train_loss": -12.235787391662598, "global_step": 309075, "epoch": 1839} {"train_loss": -12.334890365600586, "global_step": 309076, "epoch": 1839} {"train_loss": -12.351469993591309, "global_step": 309077, "epoch": 1839} {"train_loss": -12.205137252807617, "global_step": 309078, "epoch": 1839} {"train_loss": -12.280804634094238, "global_step": 309079, "epoch": 1839} {"train_loss": -12.484006881713867, "global_step": 309080, "epoch": 1839} {"train_loss": -12.324405670166016, "global_step": 309081, "epoch": 1839} {"train_loss": -12.62096118927002, "global_step": 309082, "epoch": 1839} {"train_loss": -12.157660484313965, "global_step": 309083, "epoch": 1839} {"train_loss": -11.935144424438477, "global_step": 309084, "epoch": 1839} {"train_loss": -12.520870208740234, "global_step": 309085, "epoch": 1839} {"train_loss": -12.478607177734375, "global_step": 309086, "epoch": 1839} {"train_loss": -12.548372268676758, "global_step": 309087, "epoch": 1839} {"train_loss": -12.378623008728027, "global_step": 309088, "epoch": 1839} {"train_loss": -12.312445640563965, "global_step": 309089, "epoch": 1839} {"train_loss": -12.58018684387207, "global_step": 309090, "epoch": 1839} {"train_loss": -12.465181350708008, "global_step": 309091, "epoch": 1839} {"train_loss": -12.387819290161133, "global_step": 309092, "epoch": 1839} {"train_loss": -12.522043228149414, "global_step": 309093, "epoch": 1839} {"train_loss": -12.40216064453125, "global_step": 309094, "epoch": 1839} {"train_loss": -12.570159912109375, "global_step": 309095, "epoch": 1839} {"train_loss": -12.425893783569336, "global_step": 309096, "epoch": 1839} {"train_loss": -12.436180114746094, "global_step": 309097, "epoch": 1839} {"train_loss": -12.590285301208496, "global_step": 309098, "epoch": 1839} {"train_loss": -12.713472366333008, "global_step": 309099, "epoch": 1839} {"train_loss": -12.66893196105957, "global_step": 309100, "epoch": 1839} {"train_loss": -12.665950775146484, "global_step": 309101, "epoch": 1839} {"train_loss": -12.517759323120117, "global_step": 309102, "epoch": 1839} {"train_loss": -11.98109245300293, "global_step": 309103, "epoch": 1839} {"train_loss": -12.65958023071289, "global_step": 309104, "epoch": 1839} {"train_loss": -12.229323387145996, "global_step": 309105, "epoch": 1839} {"train_loss": -12.34858512878418, "global_step": 309106, "epoch": 1839} {"train_loss": -11.228309631347656, "global_step": 309107, "epoch": 1839} {"train_loss": -11.637755393981934, "global_step": 309108, "epoch": 1839} {"train_loss": -12.316841125488281, "global_step": 309109, "epoch": 1839} {"train_loss": -11.361766815185547, "global_step": 309110, "epoch": 1839} {"train_loss": -10.965518951416016, "global_step": 309111, "epoch": 1839} {"train_loss": -10.539475440979004, "global_step": 309112, "epoch": 1839} {"train_loss": -9.515501022338867, "global_step": 309113, "epoch": 1839} {"train_loss": -10.756051063537598, "global_step": 309114, "epoch": 1839} {"train_loss": -9.844050407409668, "global_step": 309115, "epoch": 1839} {"train_loss": -9.038808822631836, "global_step": 309116, "epoch": 1839} {"train_loss": -8.967029571533203, "global_step": 309117, "epoch": 1839} {"train_loss": -9.325937271118164, "global_step": 309118, "epoch": 1839} {"train_loss": -11.520022332668304, "global_step": 309119, "epoch": 1839, "val_loss": 279743.5625} {"train_loss": -8.334970474243164, "global_step": 309120, "epoch": 1840} {"train_loss": -8.437958717346191, "global_step": 309121, "epoch": 1840} {"train_loss": -8.28056812286377, "global_step": 309122, "epoch": 1840} {"train_loss": -8.302781105041504, "global_step": 309123, "epoch": 1840} {"train_loss": -8.695236206054688, "global_step": 309124, "epoch": 1840} {"train_loss": -9.045112609863281, "global_step": 309125, "epoch": 1840} {"train_loss": -9.417974472045898, "global_step": 309126, "epoch": 1840} {"train_loss": -9.300220489501953, "global_step": 309127, "epoch": 1840} {"train_loss": -11.189062118530273, "global_step": 309128, "epoch": 1840} {"train_loss": -9.870214462280273, "global_step": 309129, "epoch": 1840} {"train_loss": -10.031536102294922, "global_step": 309130, "epoch": 1840} {"train_loss": -11.056503295898438, "global_step": 309131, "epoch": 1840} {"train_loss": -9.897577285766602, "global_step": 309132, "epoch": 1840} {"train_loss": -10.518399238586426, "global_step": 309133, "epoch": 1840} {"train_loss": -9.455041885375977, "global_step": 309134, "epoch": 1840} {"train_loss": -10.228815078735352, "global_step": 309135, "epoch": 1840} {"train_loss": -9.787601470947266, "global_step": 309136, "epoch": 1840} {"train_loss": -10.250314712524414, "global_step": 309137, "epoch": 1840} {"train_loss": -10.729534149169922, "global_step": 309138, "epoch": 1840} {"train_loss": -10.520744323730469, "global_step": 309139, "epoch": 1840} {"train_loss": -10.09021282196045, "global_step": 309140, "epoch": 1840} {"train_loss": -11.386232376098633, "global_step": 309141, "epoch": 1840} {"train_loss": -9.953191757202148, "global_step": 309142, "epoch": 1840} {"train_loss": -10.924834251403809, "global_step": 309143, "epoch": 1840} {"train_loss": -10.922323226928711, "global_step": 309144, "epoch": 1840} {"train_loss": -10.382177352905273, "global_step": 309145, "epoch": 1840} {"train_loss": -10.836732864379883, "global_step": 309146, "epoch": 1840} {"train_loss": -11.12603759765625, "global_step": 309147, "epoch": 1840} {"train_loss": -11.028000831604004, "global_step": 309148, "epoch": 1840} {"train_loss": -11.049474716186523, "global_step": 309149, "epoch": 1840} {"train_loss": -10.979385375976562, "global_step": 309150, "epoch": 1840} {"train_loss": -11.169210433959961, "global_step": 309151, "epoch": 1840} {"train_loss": -11.73759651184082, "global_step": 309152, "epoch": 1840} {"train_loss": -11.21275520324707, "global_step": 309153, "epoch": 1840} {"train_loss": -11.67580795288086, "global_step": 309154, "epoch": 1840} {"train_loss": -11.427812576293945, "global_step": 309155, "epoch": 1840} {"train_loss": -11.573817253112793, "global_step": 309156, "epoch": 1840} {"train_loss": -11.477380752563477, "global_step": 309157, "epoch": 1840} {"train_loss": -11.586477279663086, "global_step": 309158, "epoch": 1840} {"train_loss": -11.54043960571289, "global_step": 309159, "epoch": 1840} {"train_loss": -11.947162628173828, "global_step": 309160, "epoch": 1840} {"train_loss": -11.444022178649902, "global_step": 309161, "epoch": 1840} {"train_loss": -11.896262168884277, "global_step": 309162, "epoch": 1840} {"train_loss": -11.612272262573242, "global_step": 309163, "epoch": 1840} {"train_loss": -12.118047714233398, "global_step": 309164, "epoch": 1840} {"train_loss": -11.673571586608887, "global_step": 309165, "epoch": 1840} {"train_loss": -11.910036087036133, "global_step": 309166, "epoch": 1840} {"train_loss": -11.813191413879395, "global_step": 309167, "epoch": 1840} {"train_loss": -12.052990913391113, "global_step": 309168, "epoch": 1840} {"train_loss": -12.053060531616211, "global_step": 309169, "epoch": 1840} {"train_loss": -12.084789276123047, "global_step": 309170, "epoch": 1840} {"train_loss": -11.890219688415527, "global_step": 309171, "epoch": 1840} {"train_loss": -12.152061462402344, "global_step": 309172, "epoch": 1840} {"train_loss": -11.92457389831543, "global_step": 309173, "epoch": 1840} {"train_loss": -12.219240188598633, "global_step": 309174, "epoch": 1840} {"train_loss": -12.114582061767578, "global_step": 309175, "epoch": 1840} {"train_loss": -12.069489479064941, "global_step": 309176, "epoch": 1840} {"train_loss": -12.26638412475586, "global_step": 309177, "epoch": 1840} {"train_loss": -12.176058769226074, "global_step": 309178, "epoch": 1840} {"train_loss": -12.078550338745117, "global_step": 309179, "epoch": 1840} {"train_loss": -12.135533332824707, "global_step": 309180, "epoch": 1840} {"train_loss": -12.138107299804688, "global_step": 309181, "epoch": 1840} {"train_loss": -12.080976486206055, "global_step": 309182, "epoch": 1840} {"train_loss": -12.00407886505127, "global_step": 309183, "epoch": 1840} {"train_loss": -12.041633605957031, "global_step": 309184, "epoch": 1840} {"train_loss": -12.125151634216309, "global_step": 309185, "epoch": 1840} {"train_loss": -12.340047836303711, "global_step": 309186, "epoch": 1840} {"train_loss": -12.175283432006836, "global_step": 309187, "epoch": 1840} {"train_loss": -12.30917739868164, "global_step": 309188, "epoch": 1840} {"train_loss": -12.259395599365234, "global_step": 309189, "epoch": 1840} {"train_loss": -12.292051315307617, "global_step": 309190, "epoch": 1840} {"train_loss": -12.281631469726562, "global_step": 309191, "epoch": 1840} {"train_loss": -12.067598342895508, "global_step": 309192, "epoch": 1840} {"train_loss": -12.210177421569824, "global_step": 309193, "epoch": 1840} {"train_loss": -12.028858184814453, "global_step": 309194, "epoch": 1840} {"train_loss": -12.184798240661621, "global_step": 309195, "epoch": 1840} {"train_loss": -12.209928512573242, "global_step": 309196, "epoch": 1840} {"train_loss": -12.579580307006836, "global_step": 309197, "epoch": 1840} {"train_loss": -12.124410629272461, "global_step": 309198, "epoch": 1840} {"train_loss": -12.203554153442383, "global_step": 309199, "epoch": 1840} {"train_loss": -12.34970474243164, "global_step": 309200, "epoch": 1840} {"train_loss": -11.931739807128906, "global_step": 309201, "epoch": 1840} {"train_loss": -12.571853637695312, "global_step": 309202, "epoch": 1840} {"train_loss": -12.140047073364258, "global_step": 309203, "epoch": 1840} {"train_loss": -12.393396377563477, "global_step": 309204, "epoch": 1840} {"train_loss": -12.064370155334473, "global_step": 309205, "epoch": 1840} {"train_loss": -12.274137496948242, "global_step": 309206, "epoch": 1840} {"train_loss": -12.419336318969727, "global_step": 309207, "epoch": 1840} {"train_loss": -12.173152923583984, "global_step": 309208, "epoch": 1840} {"train_loss": -12.28314208984375, "global_step": 309209, "epoch": 1840} {"train_loss": -12.429974555969238, "global_step": 309210, "epoch": 1840} {"train_loss": -12.26650333404541, "global_step": 309211, "epoch": 1840} {"train_loss": -12.173791885375977, "global_step": 309212, "epoch": 1840} {"train_loss": -12.01108169555664, "global_step": 309213, "epoch": 1840} {"train_loss": -12.10158920288086, "global_step": 309214, "epoch": 1840} {"train_loss": -12.176101684570312, "global_step": 309215, "epoch": 1840} {"train_loss": -11.84776496887207, "global_step": 309216, "epoch": 1840} {"train_loss": -12.258686065673828, "global_step": 309217, "epoch": 1840} {"train_loss": -12.357912063598633, "global_step": 309218, "epoch": 1840} {"train_loss": -12.290264129638672, "global_step": 309219, "epoch": 1840} {"train_loss": -12.019118309020996, "global_step": 309220, "epoch": 1840} {"train_loss": -12.36447811126709, "global_step": 309221, "epoch": 1840} {"train_loss": -12.354393005371094, "global_step": 309222, "epoch": 1840} {"train_loss": -12.201005935668945, "global_step": 309223, "epoch": 1840} {"train_loss": -11.896492004394531, "global_step": 309224, "epoch": 1840} {"train_loss": -11.684142112731934, "global_step": 309225, "epoch": 1840} {"train_loss": -11.742898941040039, "global_step": 309226, "epoch": 1840} {"train_loss": -11.981966018676758, "global_step": 309227, "epoch": 1840} {"train_loss": -12.438600540161133, "global_step": 309228, "epoch": 1840} {"train_loss": -12.270030975341797, "global_step": 309229, "epoch": 1840} {"train_loss": -12.455013275146484, "global_step": 309230, "epoch": 1840} {"train_loss": -12.212934494018555, "global_step": 309231, "epoch": 1840} {"train_loss": -12.502537727355957, "global_step": 309232, "epoch": 1840} {"train_loss": -12.194355010986328, "global_step": 309233, "epoch": 1840} {"train_loss": -12.606148719787598, "global_step": 309234, "epoch": 1840} {"train_loss": -12.215468406677246, "global_step": 309235, "epoch": 1840} {"train_loss": -12.219749450683594, "global_step": 309236, "epoch": 1840} {"train_loss": -12.146227836608887, "global_step": 309237, "epoch": 1840} {"train_loss": -12.472790718078613, "global_step": 309238, "epoch": 1840} {"train_loss": -12.505847930908203, "global_step": 309239, "epoch": 1840} {"train_loss": -12.311368942260742, "global_step": 309240, "epoch": 1840} {"train_loss": -12.15468978881836, "global_step": 309241, "epoch": 1840} {"train_loss": -12.540485382080078, "global_step": 309242, "epoch": 1840} {"train_loss": -12.347393989562988, "global_step": 309243, "epoch": 1840} {"train_loss": -12.138771057128906, "global_step": 309244, "epoch": 1840} {"train_loss": -11.983036041259766, "global_step": 309245, "epoch": 1840} {"train_loss": -12.456425666809082, "global_step": 309246, "epoch": 1840} {"train_loss": -12.19984245300293, "global_step": 309247, "epoch": 1840} {"train_loss": -11.774879455566406, "global_step": 309248, "epoch": 1840} {"train_loss": -11.916767120361328, "global_step": 309249, "epoch": 1840} {"train_loss": -12.461183547973633, "global_step": 309250, "epoch": 1840} {"train_loss": -12.48868179321289, "global_step": 309251, "epoch": 1840} {"train_loss": -11.671988487243652, "global_step": 309252, "epoch": 1840} {"train_loss": -11.416110038757324, "global_step": 309253, "epoch": 1840} {"train_loss": -12.275728225708008, "global_step": 309254, "epoch": 1840} {"train_loss": -12.132288932800293, "global_step": 309255, "epoch": 1840} {"train_loss": -11.958314895629883, "global_step": 309256, "epoch": 1840} {"train_loss": -12.476919174194336, "global_step": 309257, "epoch": 1840} {"train_loss": -12.41697883605957, "global_step": 309258, "epoch": 1840} {"train_loss": -12.16602611541748, "global_step": 309259, "epoch": 1840} {"train_loss": -12.042797088623047, "global_step": 309260, "epoch": 1840} {"train_loss": -11.548576354980469, "global_step": 309261, "epoch": 1840} {"train_loss": -12.185098648071289, "global_step": 309262, "epoch": 1840} {"train_loss": -12.168183326721191, "global_step": 309263, "epoch": 1840} {"train_loss": -11.143265724182129, "global_step": 309264, "epoch": 1840} {"train_loss": -11.446798324584961, "global_step": 309265, "epoch": 1840} {"train_loss": -11.73443603515625, "global_step": 309266, "epoch": 1840} {"train_loss": -11.949024200439453, "global_step": 309267, "epoch": 1840} {"train_loss": -12.141632080078125, "global_step": 309268, "epoch": 1840} {"train_loss": -11.887519836425781, "global_step": 309269, "epoch": 1840} {"train_loss": -11.867578506469727, "global_step": 309270, "epoch": 1840} {"train_loss": -11.924816131591797, "global_step": 309271, "epoch": 1840} {"train_loss": -12.327957153320312, "global_step": 309272, "epoch": 1840} {"train_loss": -11.056131362915039, "global_step": 309273, "epoch": 1840} {"train_loss": -9.913511276245117, "global_step": 309274, "epoch": 1840} {"train_loss": -10.699651718139648, "global_step": 309275, "epoch": 1840} {"train_loss": -11.836381912231445, "global_step": 309276, "epoch": 1840} {"train_loss": -9.285731315612793, "global_step": 309277, "epoch": 1840} {"train_loss": -11.264374732971191, "global_step": 309278, "epoch": 1840} {"train_loss": -10.461020469665527, "global_step": 309279, "epoch": 1840} {"train_loss": -10.556390762329102, "global_step": 309280, "epoch": 1840} {"train_loss": -10.686601638793945, "global_step": 309281, "epoch": 1840} {"train_loss": -10.724729537963867, "global_step": 309282, "epoch": 1840} {"train_loss": -10.17138385772705, "global_step": 309283, "epoch": 1840} {"train_loss": -10.907204627990723, "global_step": 309284, "epoch": 1840} {"train_loss": -10.207976341247559, "global_step": 309285, "epoch": 1840} {"train_loss": -10.996179580688477, "global_step": 309286, "epoch": 1840} {"train_loss": -11.58314531757718, "global_step": 309287, "epoch": 1840, "val_loss": 285620.59375, "train_action_mse_error": 1.6939021348953247} {"train_loss": -10.49151611328125, "global_step": 309288, "epoch": 1841} {"train_loss": -10.973426818847656, "global_step": 309289, "epoch": 1841} {"train_loss": -11.169886589050293, "global_step": 309290, "epoch": 1841} {"train_loss": -9.842887878417969, "global_step": 309291, "epoch": 1841} {"train_loss": -11.627035140991211, "global_step": 309292, "epoch": 1841} {"train_loss": -10.87382698059082, "global_step": 309293, "epoch": 1841} {"train_loss": -11.189186096191406, "global_step": 309294, "epoch": 1841} {"train_loss": -11.213682174682617, "global_step": 309295, "epoch": 1841} {"train_loss": -11.235923767089844, "global_step": 309296, "epoch": 1841} {"train_loss": -11.639444351196289, "global_step": 309297, "epoch": 1841} {"train_loss": -11.345040321350098, "global_step": 309298, "epoch": 1841} {"train_loss": -11.287103652954102, "global_step": 309299, "epoch": 1841} {"train_loss": -10.793808937072754, "global_step": 309300, "epoch": 1841} {"train_loss": -11.658464431762695, "global_step": 309301, "epoch": 1841} {"train_loss": -9.496624946594238, "global_step": 309302, "epoch": 1841} {"train_loss": -11.699278831481934, "global_step": 309303, "epoch": 1841} {"train_loss": -10.548894882202148, "global_step": 309304, "epoch": 1841} {"train_loss": -11.346821784973145, "global_step": 309305, "epoch": 1841} {"train_loss": -10.423836708068848, "global_step": 309306, "epoch": 1841} {"train_loss": -11.548738479614258, "global_step": 309307, "epoch": 1841} {"train_loss": -10.574807167053223, "global_step": 309308, "epoch": 1841} {"train_loss": -11.834296226501465, "global_step": 309309, "epoch": 1841} {"train_loss": -10.863991737365723, "global_step": 309310, "epoch": 1841} {"train_loss": -11.58349609375, "global_step": 309311, "epoch": 1841} {"train_loss": -11.111300468444824, "global_step": 309312, "epoch": 1841} {"train_loss": -11.253654479980469, "global_step": 309313, "epoch": 1841} {"train_loss": -11.367155075073242, "global_step": 309314, "epoch": 1841} {"train_loss": -11.43301010131836, "global_step": 309315, "epoch": 1841} {"train_loss": -11.176637649536133, "global_step": 309316, "epoch": 1841} {"train_loss": -11.666938781738281, "global_step": 309317, "epoch": 1841} {"train_loss": -11.555675506591797, "global_step": 309318, "epoch": 1841} {"train_loss": -11.532491683959961, "global_step": 309319, "epoch": 1841} {"train_loss": -11.536561965942383, "global_step": 309320, "epoch": 1841} {"train_loss": -11.637123107910156, "global_step": 309321, "epoch": 1841} {"train_loss": -11.9451904296875, "global_step": 309322, "epoch": 1841} {"train_loss": -11.858366012573242, "global_step": 309323, "epoch": 1841} {"train_loss": -11.76450252532959, "global_step": 309324, "epoch": 1841} {"train_loss": -11.728581428527832, "global_step": 309325, "epoch": 1841} {"train_loss": -11.491384506225586, "global_step": 309326, "epoch": 1841} {"train_loss": -11.767597198486328, "global_step": 309327, "epoch": 1841} {"train_loss": -11.76217269897461, "global_step": 309328, "epoch": 1841} {"train_loss": -11.743353843688965, "global_step": 309329, "epoch": 1841} {"train_loss": -11.947282791137695, "global_step": 309330, "epoch": 1841} {"train_loss": -11.674952507019043, "global_step": 309331, "epoch": 1841} {"train_loss": -12.229281425476074, "global_step": 309332, "epoch": 1841} {"train_loss": -11.774898529052734, "global_step": 309333, "epoch": 1841} {"train_loss": -12.144760131835938, "global_step": 309334, "epoch": 1841} {"train_loss": -11.766464233398438, "global_step": 309335, "epoch": 1841} {"train_loss": -12.234121322631836, "global_step": 309336, "epoch": 1841} {"train_loss": -11.93739128112793, "global_step": 309337, "epoch": 1841} {"train_loss": -12.217880249023438, "global_step": 309338, "epoch": 1841} {"train_loss": -11.809770584106445, "global_step": 309339, "epoch": 1841} {"train_loss": -11.964971542358398, "global_step": 309340, "epoch": 1841} {"train_loss": -12.01863956451416, "global_step": 309341, "epoch": 1841} {"train_loss": -12.161317825317383, "global_step": 309342, "epoch": 1841} {"train_loss": -12.226195335388184, "global_step": 309343, "epoch": 1841} {"train_loss": -12.05883502960205, "global_step": 309344, "epoch": 1841} {"train_loss": -12.094232559204102, "global_step": 309345, "epoch": 1841} {"train_loss": -12.287187576293945, "global_step": 309346, "epoch": 1841} {"train_loss": -12.140453338623047, "global_step": 309347, "epoch": 1841} {"train_loss": -12.249256134033203, "global_step": 309348, "epoch": 1841} {"train_loss": -11.992240905761719, "global_step": 309349, "epoch": 1841} {"train_loss": -12.156962394714355, "global_step": 309350, "epoch": 1841} {"train_loss": -12.052019119262695, "global_step": 309351, "epoch": 1841} {"train_loss": -12.148225784301758, "global_step": 309352, "epoch": 1841} {"train_loss": -12.066041946411133, "global_step": 309353, "epoch": 1841} {"train_loss": -11.906952857971191, "global_step": 309354, "epoch": 1841} {"train_loss": -12.114076614379883, "global_step": 309355, "epoch": 1841} {"train_loss": -12.092582702636719, "global_step": 309356, "epoch": 1841} {"train_loss": -12.391609191894531, "global_step": 309357, "epoch": 1841} {"train_loss": -12.028072357177734, "global_step": 309358, "epoch": 1841} {"train_loss": -12.165318489074707, "global_step": 309359, "epoch": 1841} {"train_loss": -12.507996559143066, "global_step": 309360, "epoch": 1841} {"train_loss": -12.358007431030273, "global_step": 309361, "epoch": 1841} {"train_loss": -12.395187377929688, "global_step": 309362, "epoch": 1841} {"train_loss": -12.384551048278809, "global_step": 309363, "epoch": 1841} {"train_loss": -12.313809394836426, "global_step": 309364, "epoch": 1841} {"train_loss": -12.222628593444824, "global_step": 309365, "epoch": 1841} {"train_loss": -12.337395668029785, "global_step": 309366, "epoch": 1841} {"train_loss": -12.395339012145996, "global_step": 309367, "epoch": 1841} {"train_loss": -12.341850280761719, "global_step": 309368, "epoch": 1841} {"train_loss": -12.221941947937012, "global_step": 309369, "epoch": 1841} {"train_loss": -12.330110549926758, "global_step": 309370, "epoch": 1841} {"train_loss": -12.365473747253418, "global_step": 309371, "epoch": 1841} {"train_loss": -12.4854736328125, "global_step": 309372, "epoch": 1841} {"train_loss": -11.961954116821289, "global_step": 309373, "epoch": 1841} {"train_loss": -12.524502754211426, "global_step": 309374, "epoch": 1841} {"train_loss": -11.737613677978516, "global_step": 309375, "epoch": 1841} {"train_loss": -12.12635612487793, "global_step": 309376, "epoch": 1841} {"train_loss": -12.065667152404785, "global_step": 309377, "epoch": 1841} {"train_loss": -11.787593841552734, "global_step": 309378, "epoch": 1841} {"train_loss": -11.65831184387207, "global_step": 309379, "epoch": 1841} {"train_loss": -11.98417854309082, "global_step": 309380, "epoch": 1841} {"train_loss": -12.450763702392578, "global_step": 309381, "epoch": 1841} {"train_loss": -12.038618087768555, "global_step": 309382, "epoch": 1841} {"train_loss": -12.125067710876465, "global_step": 309383, "epoch": 1841} {"train_loss": -12.533843994140625, "global_step": 309384, "epoch": 1841} {"train_loss": -12.36697006225586, "global_step": 309385, "epoch": 1841} {"train_loss": -12.45728874206543, "global_step": 309386, "epoch": 1841} {"train_loss": -12.265974044799805, "global_step": 309387, "epoch": 1841} {"train_loss": -12.156579971313477, "global_step": 309388, "epoch": 1841} {"train_loss": -12.076360702514648, "global_step": 309389, "epoch": 1841} {"train_loss": -11.214682579040527, "global_step": 309390, "epoch": 1841} {"train_loss": -11.959925651550293, "global_step": 309391, "epoch": 1841} {"train_loss": -12.294906616210938, "global_step": 309392, "epoch": 1841} {"train_loss": -12.182008743286133, "global_step": 309393, "epoch": 1841} {"train_loss": -12.12576675415039, "global_step": 309394, "epoch": 1841} {"train_loss": -12.430158615112305, "global_step": 309395, "epoch": 1841} {"train_loss": -12.093917846679688, "global_step": 309396, "epoch": 1841} {"train_loss": -11.56320571899414, "global_step": 309397, "epoch": 1841} {"train_loss": -12.028276443481445, "global_step": 309398, "epoch": 1841} {"train_loss": -12.460943222045898, "global_step": 309399, "epoch": 1841} {"train_loss": -11.790417671203613, "global_step": 309400, "epoch": 1841} {"train_loss": -11.108108520507812, "global_step": 309401, "epoch": 1841} {"train_loss": -12.122867584228516, "global_step": 309402, "epoch": 1841} {"train_loss": -12.067974090576172, "global_step": 309403, "epoch": 1841} {"train_loss": -11.046834945678711, "global_step": 309404, "epoch": 1841} {"train_loss": -11.103802680969238, "global_step": 309405, "epoch": 1841} {"train_loss": -11.966360092163086, "global_step": 309406, "epoch": 1841} {"train_loss": -12.437908172607422, "global_step": 309407, "epoch": 1841} {"train_loss": -11.400379180908203, "global_step": 309408, "epoch": 1841} {"train_loss": -10.813870429992676, "global_step": 309409, "epoch": 1841} {"train_loss": -12.278238296508789, "global_step": 309410, "epoch": 1841} {"train_loss": -10.767983436584473, "global_step": 309411, "epoch": 1841} {"train_loss": -11.262696266174316, "global_step": 309412, "epoch": 1841} {"train_loss": -11.895386695861816, "global_step": 309413, "epoch": 1841} {"train_loss": -11.915216445922852, "global_step": 309414, "epoch": 1841} {"train_loss": -11.380983352661133, "global_step": 309415, "epoch": 1841} {"train_loss": -11.802982330322266, "global_step": 309416, "epoch": 1841} {"train_loss": -11.997900009155273, "global_step": 309417, "epoch": 1841} {"train_loss": -11.717245101928711, "global_step": 309418, "epoch": 1841} {"train_loss": -11.691131591796875, "global_step": 309419, "epoch": 1841} {"train_loss": -11.495226860046387, "global_step": 309420, "epoch": 1841} {"train_loss": -11.64315128326416, "global_step": 309421, "epoch": 1841} {"train_loss": -11.992818832397461, "global_step": 309422, "epoch": 1841} {"train_loss": -11.323177337646484, "global_step": 309423, "epoch": 1841} {"train_loss": -11.825884819030762, "global_step": 309424, "epoch": 1841} {"train_loss": -11.480405807495117, "global_step": 309425, "epoch": 1841} {"train_loss": -12.259425163269043, "global_step": 309426, "epoch": 1841} {"train_loss": -11.453232765197754, "global_step": 309427, "epoch": 1841} {"train_loss": -12.029951095581055, "global_step": 309428, "epoch": 1841} {"train_loss": -11.751691818237305, "global_step": 309429, "epoch": 1841} {"train_loss": -11.877323150634766, "global_step": 309430, "epoch": 1841} {"train_loss": -11.993114471435547, "global_step": 309431, "epoch": 1841} {"train_loss": -11.918495178222656, "global_step": 309432, "epoch": 1841} {"train_loss": -12.178021430969238, "global_step": 309433, "epoch": 1841} {"train_loss": -11.859952926635742, "global_step": 309434, "epoch": 1841} {"train_loss": -11.829330444335938, "global_step": 309435, "epoch": 1841} {"train_loss": -11.940431594848633, "global_step": 309436, "epoch": 1841} {"train_loss": -11.502054214477539, "global_step": 309437, "epoch": 1841} {"train_loss": -12.159223556518555, "global_step": 309438, "epoch": 1841} {"train_loss": -11.915616035461426, "global_step": 309439, "epoch": 1841} {"train_loss": -11.535873413085938, "global_step": 309440, "epoch": 1841} {"train_loss": -12.223118782043457, "global_step": 309441, "epoch": 1841} {"train_loss": -11.602776527404785, "global_step": 309442, "epoch": 1841} {"train_loss": -11.85125732421875, "global_step": 309443, "epoch": 1841} {"train_loss": -12.252384185791016, "global_step": 309444, "epoch": 1841} {"train_loss": -12.043862342834473, "global_step": 309445, "epoch": 1841} {"train_loss": -11.989765167236328, "global_step": 309446, "epoch": 1841} {"train_loss": -11.854768753051758, "global_step": 309447, "epoch": 1841} {"train_loss": -11.778526306152344, "global_step": 309448, "epoch": 1841} {"train_loss": -12.125223159790039, "global_step": 309449, "epoch": 1841} {"train_loss": -11.930135726928711, "global_step": 309450, "epoch": 1841} {"train_loss": -11.84527587890625, "global_step": 309451, "epoch": 1841} {"train_loss": -12.081233978271484, "global_step": 309452, "epoch": 1841} {"train_loss": -11.311781883239746, "global_step": 309453, "epoch": 1841} {"train_loss": -12.337240219116211, "global_step": 309454, "epoch": 1841} {"train_loss": -11.799504251707168, "global_step": 309455, "epoch": 1841, "val_loss": 283635.96875} {"train_loss": -12.092357635498047, "global_step": 309456, "epoch": 1842} {"train_loss": -12.083471298217773, "global_step": 309457, "epoch": 1842} {"train_loss": -12.01971435546875, "global_step": 309458, "epoch": 1842} {"train_loss": -12.095902442932129, "global_step": 309459, "epoch": 1842} {"train_loss": -12.254029273986816, "global_step": 309460, "epoch": 1842} {"train_loss": -12.258687973022461, "global_step": 309461, "epoch": 1842} {"train_loss": -11.83910846710205, "global_step": 309462, "epoch": 1842} {"train_loss": -11.773681640625, "global_step": 309463, "epoch": 1842} {"train_loss": -11.853132247924805, "global_step": 309464, "epoch": 1842} {"train_loss": -11.997535705566406, "global_step": 309465, "epoch": 1842} {"train_loss": -11.868224143981934, "global_step": 309466, "epoch": 1842} {"train_loss": -12.161888122558594, "global_step": 309467, "epoch": 1842} {"train_loss": -11.850542068481445, "global_step": 309468, "epoch": 1842} {"train_loss": -12.091836929321289, "global_step": 309469, "epoch": 1842} {"train_loss": -11.966803550720215, "global_step": 309470, "epoch": 1842} {"train_loss": -12.014074325561523, "global_step": 309471, "epoch": 1842} {"train_loss": -12.365619659423828, "global_step": 309472, "epoch": 1842} {"train_loss": -11.867810249328613, "global_step": 309473, "epoch": 1842} {"train_loss": -12.427593231201172, "global_step": 309474, "epoch": 1842} {"train_loss": -12.018509864807129, "global_step": 309475, "epoch": 1842} {"train_loss": -12.580794334411621, "global_step": 309476, "epoch": 1842} {"train_loss": -12.062599182128906, "global_step": 309477, "epoch": 1842} {"train_loss": -12.11788272857666, "global_step": 309478, "epoch": 1842} {"train_loss": -12.232665061950684, "global_step": 309479, "epoch": 1842} {"train_loss": -11.783329010009766, "global_step": 309480, "epoch": 1842} {"train_loss": -12.04367733001709, "global_step": 309481, "epoch": 1842} {"train_loss": -11.804577827453613, "global_step": 309482, "epoch": 1842} {"train_loss": -10.30306339263916, "global_step": 309483, "epoch": 1842} {"train_loss": -11.213003158569336, "global_step": 309484, "epoch": 1842} {"train_loss": -11.524599075317383, "global_step": 309485, "epoch": 1842} {"train_loss": -10.797525405883789, "global_step": 309486, "epoch": 1842} {"train_loss": -11.81520938873291, "global_step": 309487, "epoch": 1842} {"train_loss": -11.19133186340332, "global_step": 309488, "epoch": 1842} {"train_loss": -10.494178771972656, "global_step": 309489, "epoch": 1842} {"train_loss": -10.714269638061523, "global_step": 309490, "epoch": 1842} {"train_loss": -11.166206359863281, "global_step": 309491, "epoch": 1842} {"train_loss": -9.888628005981445, "global_step": 309492, "epoch": 1842} {"train_loss": -10.110629081726074, "global_step": 309493, "epoch": 1842} {"train_loss": -11.253971099853516, "global_step": 309494, "epoch": 1842} {"train_loss": -8.90896987915039, "global_step": 309495, "epoch": 1842} {"train_loss": -10.564386367797852, "global_step": 309496, "epoch": 1842} {"train_loss": -11.49953842163086, "global_step": 309497, "epoch": 1842} {"train_loss": -11.11305046081543, "global_step": 309498, "epoch": 1842} {"train_loss": -10.691211700439453, "global_step": 309499, "epoch": 1842} {"train_loss": -12.124214172363281, "global_step": 309500, "epoch": 1842} {"train_loss": -10.444612503051758, "global_step": 309501, "epoch": 1842} {"train_loss": -11.92642879486084, "global_step": 309502, "epoch": 1842} {"train_loss": -10.73006820678711, "global_step": 309503, "epoch": 1842} {"train_loss": -11.59144401550293, "global_step": 309504, "epoch": 1842} {"train_loss": -11.834095001220703, "global_step": 309505, "epoch": 1842} {"train_loss": -11.029722213745117, "global_step": 309506, "epoch": 1842} {"train_loss": -11.859844207763672, "global_step": 309507, "epoch": 1842} {"train_loss": -10.862434387207031, "global_step": 309508, "epoch": 1842} {"train_loss": -12.09370231628418, "global_step": 309509, "epoch": 1842} {"train_loss": -11.440279006958008, "global_step": 309510, "epoch": 1842} {"train_loss": -11.864095687866211, "global_step": 309511, "epoch": 1842} {"train_loss": -11.64944076538086, "global_step": 309512, "epoch": 1842} {"train_loss": -11.72804069519043, "global_step": 309513, "epoch": 1842} {"train_loss": -11.943258285522461, "global_step": 309514, "epoch": 1842} {"train_loss": -11.808530807495117, "global_step": 309515, "epoch": 1842} {"train_loss": -11.994906425476074, "global_step": 309516, "epoch": 1842} {"train_loss": -11.726468086242676, "global_step": 309517, "epoch": 1842} {"train_loss": -11.842158317565918, "global_step": 309518, "epoch": 1842} {"train_loss": -11.87907886505127, "global_step": 309519, "epoch": 1842} {"train_loss": -11.997081756591797, "global_step": 309520, "epoch": 1842} {"train_loss": -12.077285766601562, "global_step": 309521, "epoch": 1842} {"train_loss": -12.128284454345703, "global_step": 309522, "epoch": 1842} {"train_loss": -11.98160171508789, "global_step": 309523, "epoch": 1842} {"train_loss": -11.761894226074219, "global_step": 309524, "epoch": 1842} {"train_loss": -12.20383358001709, "global_step": 309525, "epoch": 1842} {"train_loss": -11.86841106414795, "global_step": 309526, "epoch": 1842} {"train_loss": -12.1263427734375, "global_step": 309527, "epoch": 1842} {"train_loss": -11.856945037841797, "global_step": 309528, "epoch": 1842} {"train_loss": -12.215818405151367, "global_step": 309529, "epoch": 1842} {"train_loss": -11.9932279586792, "global_step": 309530, "epoch": 1842} {"train_loss": -12.062482833862305, "global_step": 309531, "epoch": 1842} {"train_loss": -11.828083038330078, "global_step": 309532, "epoch": 1842} {"train_loss": -12.423395156860352, "global_step": 309533, "epoch": 1842} {"train_loss": -12.155481338500977, "global_step": 309534, "epoch": 1842} {"train_loss": -12.218328475952148, "global_step": 309535, "epoch": 1842} {"train_loss": -12.174846649169922, "global_step": 309536, "epoch": 1842} {"train_loss": -12.264528274536133, "global_step": 309537, "epoch": 1842} {"train_loss": -12.14451789855957, "global_step": 309538, "epoch": 1842} {"train_loss": -12.323016166687012, "global_step": 309539, "epoch": 1842} {"train_loss": -12.169825553894043, "global_step": 309540, "epoch": 1842} {"train_loss": -12.14699935913086, "global_step": 309541, "epoch": 1842} {"train_loss": -12.177358627319336, "global_step": 309542, "epoch": 1842} {"train_loss": -12.587602615356445, "global_step": 309543, "epoch": 1842} {"train_loss": -12.392148971557617, "global_step": 309544, "epoch": 1842} {"train_loss": -12.357234954833984, "global_step": 309545, "epoch": 1842} {"train_loss": -12.485916137695312, "global_step": 309546, "epoch": 1842} {"train_loss": -12.350598335266113, "global_step": 309547, "epoch": 1842} {"train_loss": -12.293964385986328, "global_step": 309548, "epoch": 1842} {"train_loss": -12.369958877563477, "global_step": 309549, "epoch": 1842} {"train_loss": -12.517874717712402, "global_step": 309550, "epoch": 1842} {"train_loss": -12.195150375366211, "global_step": 309551, "epoch": 1842} {"train_loss": -12.328776359558105, "global_step": 309552, "epoch": 1842} {"train_loss": -12.382518768310547, "global_step": 309553, "epoch": 1842} {"train_loss": -12.419561386108398, "global_step": 309554, "epoch": 1842} {"train_loss": -12.329916000366211, "global_step": 309555, "epoch": 1842} {"train_loss": -12.393052101135254, "global_step": 309556, "epoch": 1842} {"train_loss": -12.62750244140625, "global_step": 309557, "epoch": 1842} {"train_loss": -12.394603729248047, "global_step": 309558, "epoch": 1842} {"train_loss": -12.390542984008789, "global_step": 309559, "epoch": 1842} {"train_loss": -12.45318603515625, "global_step": 309560, "epoch": 1842} {"train_loss": -12.390087127685547, "global_step": 309561, "epoch": 1842} {"train_loss": -12.51279067993164, "global_step": 309562, "epoch": 1842} {"train_loss": -12.459997177124023, "global_step": 309563, "epoch": 1842} {"train_loss": -12.433412551879883, "global_step": 309564, "epoch": 1842} {"train_loss": -12.569124221801758, "global_step": 309565, "epoch": 1842} {"train_loss": -12.472071647644043, "global_step": 309566, "epoch": 1842} {"train_loss": -12.551580429077148, "global_step": 309567, "epoch": 1842} {"train_loss": -12.144932746887207, "global_step": 309568, "epoch": 1842} {"train_loss": -12.37669849395752, "global_step": 309569, "epoch": 1842} {"train_loss": -12.38354206085205, "global_step": 309570, "epoch": 1842} {"train_loss": -12.031691551208496, "global_step": 309571, "epoch": 1842} {"train_loss": -12.300363540649414, "global_step": 309572, "epoch": 1842} {"train_loss": -12.659187316894531, "global_step": 309573, "epoch": 1842} {"train_loss": -12.248294830322266, "global_step": 309574, "epoch": 1842} {"train_loss": -12.370624542236328, "global_step": 309575, "epoch": 1842} {"train_loss": -12.35243034362793, "global_step": 309576, "epoch": 1842} {"train_loss": -12.132673263549805, "global_step": 309577, "epoch": 1842} {"train_loss": -12.170610427856445, "global_step": 309578, "epoch": 1842} {"train_loss": -12.267179489135742, "global_step": 309579, "epoch": 1842} {"train_loss": -12.232851028442383, "global_step": 309580, "epoch": 1842} {"train_loss": -11.84796142578125, "global_step": 309581, "epoch": 1842} {"train_loss": -12.423629760742188, "global_step": 309582, "epoch": 1842} {"train_loss": -12.03136920928955, "global_step": 309583, "epoch": 1842} {"train_loss": -12.177680969238281, "global_step": 309584, "epoch": 1842} {"train_loss": -11.27529525756836, "global_step": 309585, "epoch": 1842} {"train_loss": -11.91166877746582, "global_step": 309586, "epoch": 1842} {"train_loss": -11.408014297485352, "global_step": 309587, "epoch": 1842} {"train_loss": -11.825078964233398, "global_step": 309588, "epoch": 1842} {"train_loss": -10.809098243713379, "global_step": 309589, "epoch": 1842} {"train_loss": -11.664076805114746, "global_step": 309590, "epoch": 1842} {"train_loss": -11.444610595703125, "global_step": 309591, "epoch": 1842} {"train_loss": -11.808351516723633, "global_step": 309592, "epoch": 1842} {"train_loss": -10.956782341003418, "global_step": 309593, "epoch": 1842} {"train_loss": -11.284782409667969, "global_step": 309594, "epoch": 1842} {"train_loss": -11.992971420288086, "global_step": 309595, "epoch": 1842} {"train_loss": -11.45469856262207, "global_step": 309596, "epoch": 1842} {"train_loss": -11.122573852539062, "global_step": 309597, "epoch": 1842} {"train_loss": -12.275142669677734, "global_step": 309598, "epoch": 1842} {"train_loss": -11.203675270080566, "global_step": 309599, "epoch": 1842} {"train_loss": -12.472143173217773, "global_step": 309600, "epoch": 1842} {"train_loss": -11.350691795349121, "global_step": 309601, "epoch": 1842} {"train_loss": -11.90060806274414, "global_step": 309602, "epoch": 1842} {"train_loss": -11.805782318115234, "global_step": 309603, "epoch": 1842} {"train_loss": -11.732913970947266, "global_step": 309604, "epoch": 1842} {"train_loss": -11.421871185302734, "global_step": 309605, "epoch": 1842} {"train_loss": -11.932943344116211, "global_step": 309606, "epoch": 1842} {"train_loss": -11.183609008789062, "global_step": 309607, "epoch": 1842} {"train_loss": -11.79183578491211, "global_step": 309608, "epoch": 1842} {"train_loss": -11.636275291442871, "global_step": 309609, "epoch": 1842} {"train_loss": -11.530832290649414, "global_step": 309610, "epoch": 1842} {"train_loss": -11.822105407714844, "global_step": 309611, "epoch": 1842} {"train_loss": -12.032062530517578, "global_step": 309612, "epoch": 1842} {"train_loss": -10.79505729675293, "global_step": 309613, "epoch": 1842} {"train_loss": -11.706474304199219, "global_step": 309614, "epoch": 1842} {"train_loss": -11.867250442504883, "global_step": 309615, "epoch": 1842} {"train_loss": -11.51494026184082, "global_step": 309616, "epoch": 1842} {"train_loss": -10.928108215332031, "global_step": 309617, "epoch": 1842} {"train_loss": -11.022214889526367, "global_step": 309618, "epoch": 1842} {"train_loss": -11.175132751464844, "global_step": 309619, "epoch": 1842} {"train_loss": -10.227092742919922, "global_step": 309620, "epoch": 1842} {"train_loss": -11.24331283569336, "global_step": 309621, "epoch": 1842} {"train_loss": -10.92434024810791, "global_step": 309622, "epoch": 1842} {"train_loss": -11.819071894600278, "global_step": 309623, "epoch": 1842, "val_loss": 287609.9375} {"train_loss": -10.349493026733398, "global_step": 309624, "epoch": 1843} {"train_loss": -11.403159141540527, "global_step": 309625, "epoch": 1843} {"train_loss": -10.803841590881348, "global_step": 309626, "epoch": 1843} {"train_loss": -11.195653915405273, "global_step": 309627, "epoch": 1843} {"train_loss": -10.481542587280273, "global_step": 309628, "epoch": 1843} {"train_loss": -11.300025939941406, "global_step": 309629, "epoch": 1843} {"train_loss": -9.332788467407227, "global_step": 309630, "epoch": 1843} {"train_loss": -10.312505722045898, "global_step": 309631, "epoch": 1843} {"train_loss": -9.950516700744629, "global_step": 309632, "epoch": 1843} {"train_loss": -11.133844375610352, "global_step": 309633, "epoch": 1843} {"train_loss": -10.616218566894531, "global_step": 309634, "epoch": 1843} {"train_loss": -10.822032928466797, "global_step": 309635, "epoch": 1843} {"train_loss": -11.332059860229492, "global_step": 309636, "epoch": 1843} {"train_loss": -10.96946907043457, "global_step": 309637, "epoch": 1843} {"train_loss": -10.853496551513672, "global_step": 309638, "epoch": 1843} {"train_loss": -10.90685749053955, "global_step": 309639, "epoch": 1843} {"train_loss": -11.155340194702148, "global_step": 309640, "epoch": 1843} {"train_loss": -11.329574584960938, "global_step": 309641, "epoch": 1843} {"train_loss": -11.048408508300781, "global_step": 309642, "epoch": 1843} {"train_loss": -11.260082244873047, "global_step": 309643, "epoch": 1843} {"train_loss": -11.061481475830078, "global_step": 309644, "epoch": 1843} {"train_loss": -11.372486114501953, "global_step": 309645, "epoch": 1843} {"train_loss": -11.964547157287598, "global_step": 309646, "epoch": 1843} {"train_loss": -10.916784286499023, "global_step": 309647, "epoch": 1843} {"train_loss": -11.473341941833496, "global_step": 309648, "epoch": 1843} {"train_loss": -11.525947570800781, "global_step": 309649, "epoch": 1843} {"train_loss": -11.385000228881836, "global_step": 309650, "epoch": 1843} {"train_loss": -11.350605964660645, "global_step": 309651, "epoch": 1843} {"train_loss": -11.752650260925293, "global_step": 309652, "epoch": 1843} {"train_loss": -11.313314437866211, "global_step": 309653, "epoch": 1843} {"train_loss": -11.972115516662598, "global_step": 309654, "epoch": 1843} {"train_loss": -11.380849838256836, "global_step": 309655, "epoch": 1843} {"train_loss": -11.816946029663086, "global_step": 309656, "epoch": 1843} {"train_loss": -11.621639251708984, "global_step": 309657, "epoch": 1843} {"train_loss": -11.523937225341797, "global_step": 309658, "epoch": 1843} {"train_loss": -11.642871856689453, "global_step": 309659, "epoch": 1843} {"train_loss": -11.398727416992188, "global_step": 309660, "epoch": 1843} {"train_loss": -11.69295883178711, "global_step": 309661, "epoch": 1843} {"train_loss": -11.584085464477539, "global_step": 309662, "epoch": 1843} {"train_loss": -11.536121368408203, "global_step": 309663, "epoch": 1843} {"train_loss": -11.831880569458008, "global_step": 309664, "epoch": 1843} {"train_loss": -11.731420516967773, "global_step": 309665, "epoch": 1843} {"train_loss": -11.477560043334961, "global_step": 309666, "epoch": 1843} {"train_loss": -11.599047660827637, "global_step": 309667, "epoch": 1843} {"train_loss": -11.853034973144531, "global_step": 309668, "epoch": 1843} {"train_loss": -11.858739852905273, "global_step": 309669, "epoch": 1843} {"train_loss": -11.925105094909668, "global_step": 309670, "epoch": 1843} {"train_loss": -12.01199722290039, "global_step": 309671, "epoch": 1843} {"train_loss": -12.00673770904541, "global_step": 309672, "epoch": 1843} {"train_loss": -11.815239906311035, "global_step": 309673, "epoch": 1843} {"train_loss": -11.94942855834961, "global_step": 309674, "epoch": 1843} {"train_loss": -12.030418395996094, "global_step": 309675, "epoch": 1843} {"train_loss": -12.149282455444336, "global_step": 309676, "epoch": 1843} {"train_loss": -11.976097106933594, "global_step": 309677, "epoch": 1843} {"train_loss": -12.208224296569824, "global_step": 309678, "epoch": 1843} {"train_loss": -12.242267608642578, "global_step": 309679, "epoch": 1843} {"train_loss": -12.039676666259766, "global_step": 309680, "epoch": 1843} {"train_loss": -12.167335510253906, "global_step": 309681, "epoch": 1843} {"train_loss": -12.189826011657715, "global_step": 309682, "epoch": 1843} {"train_loss": -12.27822208404541, "global_step": 309683, "epoch": 1843} {"train_loss": -12.262594223022461, "global_step": 309684, "epoch": 1843} {"train_loss": -11.961970329284668, "global_step": 309685, "epoch": 1843} {"train_loss": -12.212514877319336, "global_step": 309686, "epoch": 1843} {"train_loss": -12.175053596496582, "global_step": 309687, "epoch": 1843} {"train_loss": -12.171347618103027, "global_step": 309688, "epoch": 1843} {"train_loss": -11.705780029296875, "global_step": 309689, "epoch": 1843} {"train_loss": -12.29142951965332, "global_step": 309690, "epoch": 1843} {"train_loss": -12.055536270141602, "global_step": 309691, "epoch": 1843} {"train_loss": -12.403313636779785, "global_step": 309692, "epoch": 1843} {"train_loss": -12.210714340209961, "global_step": 309693, "epoch": 1843} {"train_loss": -12.247539520263672, "global_step": 309694, "epoch": 1843} {"train_loss": -12.39790153503418, "global_step": 309695, "epoch": 1843} {"train_loss": -12.197656631469727, "global_step": 309696, "epoch": 1843} {"train_loss": -12.350213050842285, "global_step": 309697, "epoch": 1843} {"train_loss": -12.223920822143555, "global_step": 309698, "epoch": 1843} {"train_loss": -12.373714447021484, "global_step": 309699, "epoch": 1843} {"train_loss": -12.25692367553711, "global_step": 309700, "epoch": 1843} {"train_loss": -12.247295379638672, "global_step": 309701, "epoch": 1843} {"train_loss": -11.895682334899902, "global_step": 309702, "epoch": 1843} {"train_loss": -12.292632102966309, "global_step": 309703, "epoch": 1843} {"train_loss": -12.406270980834961, "global_step": 309704, "epoch": 1843} {"train_loss": -12.052376747131348, "global_step": 309705, "epoch": 1843} {"train_loss": -12.526620864868164, "global_step": 309706, "epoch": 1843} {"train_loss": -12.217412948608398, "global_step": 309707, "epoch": 1843} {"train_loss": -12.395452499389648, "global_step": 309708, "epoch": 1843} {"train_loss": -12.38546085357666, "global_step": 309709, "epoch": 1843} {"train_loss": -12.40787124633789, "global_step": 309710, "epoch": 1843} {"train_loss": -12.369245529174805, "global_step": 309711, "epoch": 1843} {"train_loss": -12.2164945602417, "global_step": 309712, "epoch": 1843} {"train_loss": -12.157508850097656, "global_step": 309713, "epoch": 1843} {"train_loss": -12.384808540344238, "global_step": 309714, "epoch": 1843} {"train_loss": -12.356491088867188, "global_step": 309715, "epoch": 1843} {"train_loss": -12.500009536743164, "global_step": 309716, "epoch": 1843} {"train_loss": -12.617233276367188, "global_step": 309717, "epoch": 1843} {"train_loss": -12.47620677947998, "global_step": 309718, "epoch": 1843} {"train_loss": -12.722136497497559, "global_step": 309719, "epoch": 1843} {"train_loss": -12.494819641113281, "global_step": 309720, "epoch": 1843} {"train_loss": -12.421550750732422, "global_step": 309721, "epoch": 1843} {"train_loss": -12.558213233947754, "global_step": 309722, "epoch": 1843} {"train_loss": -12.431167602539062, "global_step": 309723, "epoch": 1843} {"train_loss": -12.49608039855957, "global_step": 309724, "epoch": 1843} {"train_loss": -12.456201553344727, "global_step": 309725, "epoch": 1843} {"train_loss": -12.525304794311523, "global_step": 309726, "epoch": 1843} {"train_loss": -12.343982696533203, "global_step": 309727, "epoch": 1843} {"train_loss": -12.481867790222168, "global_step": 309728, "epoch": 1843} {"train_loss": -12.241230964660645, "global_step": 309729, "epoch": 1843} {"train_loss": -12.25631332397461, "global_step": 309730, "epoch": 1843} {"train_loss": -11.914942741394043, "global_step": 309731, "epoch": 1843} {"train_loss": -12.312435150146484, "global_step": 309732, "epoch": 1843} {"train_loss": -12.419083595275879, "global_step": 309733, "epoch": 1843} {"train_loss": -12.207342147827148, "global_step": 309734, "epoch": 1843} {"train_loss": -11.963668823242188, "global_step": 309735, "epoch": 1843} {"train_loss": -12.194478988647461, "global_step": 309736, "epoch": 1843} {"train_loss": -12.00369644165039, "global_step": 309737, "epoch": 1843} {"train_loss": -12.357710838317871, "global_step": 309738, "epoch": 1843} {"train_loss": -12.559186935424805, "global_step": 309739, "epoch": 1843} {"train_loss": -12.250847816467285, "global_step": 309740, "epoch": 1843} {"train_loss": -11.9677734375, "global_step": 309741, "epoch": 1843} {"train_loss": -11.95228099822998, "global_step": 309742, "epoch": 1843} {"train_loss": -12.300858497619629, "global_step": 309743, "epoch": 1843} {"train_loss": -12.506281852722168, "global_step": 309744, "epoch": 1843} {"train_loss": -12.544778823852539, "global_step": 309745, "epoch": 1843} {"train_loss": -12.548179626464844, "global_step": 309746, "epoch": 1843} {"train_loss": -12.454472541809082, "global_step": 309747, "epoch": 1843} {"train_loss": -12.339841842651367, "global_step": 309748, "epoch": 1843} {"train_loss": -12.347270965576172, "global_step": 309749, "epoch": 1843} {"train_loss": -12.107658386230469, "global_step": 309750, "epoch": 1843} {"train_loss": -12.14441967010498, "global_step": 309751, "epoch": 1843} {"train_loss": -12.524555206298828, "global_step": 309752, "epoch": 1843} {"train_loss": -12.51060676574707, "global_step": 309753, "epoch": 1843} {"train_loss": -12.441987991333008, "global_step": 309754, "epoch": 1843} {"train_loss": -12.17281436920166, "global_step": 309755, "epoch": 1843} {"train_loss": -12.347206115722656, "global_step": 309756, "epoch": 1843} {"train_loss": -12.393905639648438, "global_step": 309757, "epoch": 1843} {"train_loss": -12.382421493530273, "global_step": 309758, "epoch": 1843} {"train_loss": -11.784300804138184, "global_step": 309759, "epoch": 1843} {"train_loss": -12.317415237426758, "global_step": 309760, "epoch": 1843} {"train_loss": -12.08621883392334, "global_step": 309761, "epoch": 1843} {"train_loss": -12.304914474487305, "global_step": 309762, "epoch": 1843} {"train_loss": -11.903724670410156, "global_step": 309763, "epoch": 1843} {"train_loss": -12.10523509979248, "global_step": 309764, "epoch": 1843} {"train_loss": -12.297754287719727, "global_step": 309765, "epoch": 1843} {"train_loss": -11.982852935791016, "global_step": 309766, "epoch": 1843} {"train_loss": -11.857307434082031, "global_step": 309767, "epoch": 1843} {"train_loss": -11.616074562072754, "global_step": 309768, "epoch": 1843} {"train_loss": -11.503702163696289, "global_step": 309769, "epoch": 1843} {"train_loss": -11.19832706451416, "global_step": 309770, "epoch": 1843} {"train_loss": -12.058439254760742, "global_step": 309771, "epoch": 1843} {"train_loss": -11.180575370788574, "global_step": 309772, "epoch": 1843} {"train_loss": -11.40926742553711, "global_step": 309773, "epoch": 1843} {"train_loss": -10.72834587097168, "global_step": 309774, "epoch": 1843} {"train_loss": -12.01365852355957, "global_step": 309775, "epoch": 1843} {"train_loss": -11.054649353027344, "global_step": 309776, "epoch": 1843} {"train_loss": -9.918366432189941, "global_step": 309777, "epoch": 1843} {"train_loss": -10.789628982543945, "global_step": 309778, "epoch": 1843} {"train_loss": -10.100226402282715, "global_step": 309779, "epoch": 1843} {"train_loss": -9.478022575378418, "global_step": 309780, "epoch": 1843} {"train_loss": -10.12037181854248, "global_step": 309781, "epoch": 1843} {"train_loss": -9.71159553527832, "global_step": 309782, "epoch": 1843} {"train_loss": -9.590616226196289, "global_step": 309783, "epoch": 1843} {"train_loss": -9.506759643554688, "global_step": 309784, "epoch": 1843} {"train_loss": -8.909308433532715, "global_step": 309785, "epoch": 1843} {"train_loss": -11.044036865234375, "global_step": 309786, "epoch": 1843} {"train_loss": -9.184099197387695, "global_step": 309787, "epoch": 1843} {"train_loss": -10.708724021911621, "global_step": 309788, "epoch": 1843} {"train_loss": -10.219273567199707, "global_step": 309789, "epoch": 1843} {"train_loss": -9.803572654724121, "global_step": 309790, "epoch": 1843} {"train_loss": -11.728078410738991, "global_step": 309791, "epoch": 1843, "val_loss": 278919.5} {"train_loss": -9.314628601074219, "global_step": 309792, "epoch": 1844} {"train_loss": -9.541900634765625, "global_step": 309793, "epoch": 1844} {"train_loss": -9.74018669128418, "global_step": 309794, "epoch": 1844} {"train_loss": -10.245469093322754, "global_step": 309795, "epoch": 1844} {"train_loss": -9.172450065612793, "global_step": 309796, "epoch": 1844} {"train_loss": -9.85234260559082, "global_step": 309797, "epoch": 1844} {"train_loss": -10.56026554107666, "global_step": 309798, "epoch": 1844} {"train_loss": -10.377896308898926, "global_step": 309799, "epoch": 1844} {"train_loss": -11.020259857177734, "global_step": 309800, "epoch": 1844} {"train_loss": -10.386899948120117, "global_step": 309801, "epoch": 1844} {"train_loss": -10.630531311035156, "global_step": 309802, "epoch": 1844} {"train_loss": -11.02058219909668, "global_step": 309803, "epoch": 1844} {"train_loss": -10.969910621643066, "global_step": 309804, "epoch": 1844} {"train_loss": -10.733348846435547, "global_step": 309805, "epoch": 1844} {"train_loss": -11.62154483795166, "global_step": 309806, "epoch": 1844} {"train_loss": -11.0237398147583, "global_step": 309807, "epoch": 1844} {"train_loss": -11.15025520324707, "global_step": 309808, "epoch": 1844} {"train_loss": -11.344969749450684, "global_step": 309809, "epoch": 1844} {"train_loss": -11.279401779174805, "global_step": 309810, "epoch": 1844} {"train_loss": -11.462310791015625, "global_step": 309811, "epoch": 1844} {"train_loss": -11.522315979003906, "global_step": 309812, "epoch": 1844} {"train_loss": -11.855137825012207, "global_step": 309813, "epoch": 1844} {"train_loss": -11.511913299560547, "global_step": 309814, "epoch": 1844} {"train_loss": -11.675854682922363, "global_step": 309815, "epoch": 1844} {"train_loss": -11.80848503112793, "global_step": 309816, "epoch": 1844} {"train_loss": -11.571657180786133, "global_step": 309817, "epoch": 1844} {"train_loss": -11.710774421691895, "global_step": 309818, "epoch": 1844} {"train_loss": -11.60428237915039, "global_step": 309819, "epoch": 1844} {"train_loss": -11.621023178100586, "global_step": 309820, "epoch": 1844} {"train_loss": -11.497756958007812, "global_step": 309821, "epoch": 1844} {"train_loss": -11.892535209655762, "global_step": 309822, "epoch": 1844} {"train_loss": -12.073691368103027, "global_step": 309823, "epoch": 1844} {"train_loss": -11.567047119140625, "global_step": 309824, "epoch": 1844} {"train_loss": -12.1565523147583, "global_step": 309825, "epoch": 1844} {"train_loss": -11.72332763671875, "global_step": 309826, "epoch": 1844} {"train_loss": -11.887483596801758, "global_step": 309827, "epoch": 1844} {"train_loss": -11.996814727783203, "global_step": 309828, "epoch": 1844} {"train_loss": -11.830284118652344, "global_step": 309829, "epoch": 1844} {"train_loss": -12.277536392211914, "global_step": 309830, "epoch": 1844} {"train_loss": -12.07611083984375, "global_step": 309831, "epoch": 1844} {"train_loss": -12.003639221191406, "global_step": 309832, "epoch": 1844} {"train_loss": -12.145113945007324, "global_step": 309833, "epoch": 1844} {"train_loss": -11.856040954589844, "global_step": 309834, "epoch": 1844} {"train_loss": -12.117509841918945, "global_step": 309835, "epoch": 1844} {"train_loss": -12.14910888671875, "global_step": 309836, "epoch": 1844} {"train_loss": -12.01713752746582, "global_step": 309837, "epoch": 1844} {"train_loss": -12.312549591064453, "global_step": 309838, "epoch": 1844} {"train_loss": -12.07205581665039, "global_step": 309839, "epoch": 1844} {"train_loss": -12.348407745361328, "global_step": 309840, "epoch": 1844} {"train_loss": -12.089180946350098, "global_step": 309841, "epoch": 1844} {"train_loss": -12.121301651000977, "global_step": 309842, "epoch": 1844} {"train_loss": -12.159318923950195, "global_step": 309843, "epoch": 1844} {"train_loss": -12.14804744720459, "global_step": 309844, "epoch": 1844} {"train_loss": -11.804632186889648, "global_step": 309845, "epoch": 1844} {"train_loss": -12.31187915802002, "global_step": 309846, "epoch": 1844} {"train_loss": -12.156875610351562, "global_step": 309847, "epoch": 1844} {"train_loss": -12.261417388916016, "global_step": 309848, "epoch": 1844} {"train_loss": -12.194599151611328, "global_step": 309849, "epoch": 1844} {"train_loss": -11.917137145996094, "global_step": 309850, "epoch": 1844} {"train_loss": -12.187382698059082, "global_step": 309851, "epoch": 1844} {"train_loss": -12.219375610351562, "global_step": 309852, "epoch": 1844} {"train_loss": -12.228992462158203, "global_step": 309853, "epoch": 1844} {"train_loss": -12.19943618774414, "global_step": 309854, "epoch": 1844} {"train_loss": -12.186193466186523, "global_step": 309855, "epoch": 1844} {"train_loss": -12.361967086791992, "global_step": 309856, "epoch": 1844} {"train_loss": -12.308067321777344, "global_step": 309857, "epoch": 1844} {"train_loss": -12.466436386108398, "global_step": 309858, "epoch": 1844} {"train_loss": -12.35099983215332, "global_step": 309859, "epoch": 1844} {"train_loss": -12.372932434082031, "global_step": 309860, "epoch": 1844} {"train_loss": -12.297897338867188, "global_step": 309861, "epoch": 1844} {"train_loss": -12.320087432861328, "global_step": 309862, "epoch": 1844} {"train_loss": -12.469310760498047, "global_step": 309863, "epoch": 1844} {"train_loss": -12.30711555480957, "global_step": 309864, "epoch": 1844} {"train_loss": -12.471959114074707, "global_step": 309865, "epoch": 1844} {"train_loss": -12.316915512084961, "global_step": 309866, "epoch": 1844} {"train_loss": -12.28853988647461, "global_step": 309867, "epoch": 1844} {"train_loss": -12.410680770874023, "global_step": 309868, "epoch": 1844} {"train_loss": -12.540384292602539, "global_step": 309869, "epoch": 1844} {"train_loss": -12.219636917114258, "global_step": 309870, "epoch": 1844} {"train_loss": -12.441305160522461, "global_step": 309871, "epoch": 1844} {"train_loss": -12.02844524383545, "global_step": 309872, "epoch": 1844} {"train_loss": -12.039647102355957, "global_step": 309873, "epoch": 1844} {"train_loss": -12.17821216583252, "global_step": 309874, "epoch": 1844} {"train_loss": -12.30557632446289, "global_step": 309875, "epoch": 1844} {"train_loss": -11.984176635742188, "global_step": 309876, "epoch": 1844} {"train_loss": -11.817270278930664, "global_step": 309877, "epoch": 1844} {"train_loss": -12.309185028076172, "global_step": 309878, "epoch": 1844} {"train_loss": -11.738241195678711, "global_step": 309879, "epoch": 1844} {"train_loss": -11.785308837890625, "global_step": 309880, "epoch": 1844} {"train_loss": -11.888843536376953, "global_step": 309881, "epoch": 1844} {"train_loss": -11.668686866760254, "global_step": 309882, "epoch": 1844} {"train_loss": -10.63292121887207, "global_step": 309883, "epoch": 1844} {"train_loss": -10.73233413696289, "global_step": 309884, "epoch": 1844} {"train_loss": -11.053394317626953, "global_step": 309885, "epoch": 1844} {"train_loss": -10.718481063842773, "global_step": 309886, "epoch": 1844} {"train_loss": -11.267828941345215, "global_step": 309887, "epoch": 1844} {"train_loss": -10.873319625854492, "global_step": 309888, "epoch": 1844} {"train_loss": -10.399112701416016, "global_step": 309889, "epoch": 1844} {"train_loss": -10.583142280578613, "global_step": 309890, "epoch": 1844} {"train_loss": -10.353992462158203, "global_step": 309891, "epoch": 1844} {"train_loss": -10.013333320617676, "global_step": 309892, "epoch": 1844} {"train_loss": -11.549870491027832, "global_step": 309893, "epoch": 1844} {"train_loss": -10.057403564453125, "global_step": 309894, "epoch": 1844} {"train_loss": -10.690786361694336, "global_step": 309895, "epoch": 1844} {"train_loss": -9.56779670715332, "global_step": 309896, "epoch": 1844} {"train_loss": -9.391400337219238, "global_step": 309897, "epoch": 1844} {"train_loss": -9.643815994262695, "global_step": 309898, "epoch": 1844} {"train_loss": -11.19588851928711, "global_step": 309899, "epoch": 1844} {"train_loss": -10.281230926513672, "global_step": 309900, "epoch": 1844} {"train_loss": -10.272090911865234, "global_step": 309901, "epoch": 1844} {"train_loss": -11.408317565917969, "global_step": 309902, "epoch": 1844} {"train_loss": -11.272970199584961, "global_step": 309903, "epoch": 1844} {"train_loss": -11.156784057617188, "global_step": 309904, "epoch": 1844} {"train_loss": -10.997345924377441, "global_step": 309905, "epoch": 1844} {"train_loss": -10.402538299560547, "global_step": 309906, "epoch": 1844} {"train_loss": -11.012869834899902, "global_step": 309907, "epoch": 1844} {"train_loss": -11.410568237304688, "global_step": 309908, "epoch": 1844} {"train_loss": -10.498811721801758, "global_step": 309909, "epoch": 1844} {"train_loss": -11.058148384094238, "global_step": 309910, "epoch": 1844} {"train_loss": -10.631109237670898, "global_step": 309911, "epoch": 1844} {"train_loss": -11.598325729370117, "global_step": 309912, "epoch": 1844} {"train_loss": -11.519652366638184, "global_step": 309913, "epoch": 1844} {"train_loss": -11.495631217956543, "global_step": 309914, "epoch": 1844} {"train_loss": -11.43198299407959, "global_step": 309915, "epoch": 1844} {"train_loss": -11.408246040344238, "global_step": 309916, "epoch": 1844} {"train_loss": -11.044224739074707, "global_step": 309917, "epoch": 1844} {"train_loss": -11.257976531982422, "global_step": 309918, "epoch": 1844} {"train_loss": -11.364033699035645, "global_step": 309919, "epoch": 1844} {"train_loss": -11.269651412963867, "global_step": 309920, "epoch": 1844} {"train_loss": -11.600468635559082, "global_step": 309921, "epoch": 1844} {"train_loss": -11.21894645690918, "global_step": 309922, "epoch": 1844} {"train_loss": -11.57303237915039, "global_step": 309923, "epoch": 1844} {"train_loss": -11.034463882446289, "global_step": 309924, "epoch": 1844} {"train_loss": -11.334061622619629, "global_step": 309925, "epoch": 1844} {"train_loss": -11.51959228515625, "global_step": 309926, "epoch": 1844} {"train_loss": -11.211883544921875, "global_step": 309927, "epoch": 1844} {"train_loss": -11.962274551391602, "global_step": 309928, "epoch": 1844} {"train_loss": -11.019866943359375, "global_step": 309929, "epoch": 1844} {"train_loss": -11.62409782409668, "global_step": 309930, "epoch": 1844} {"train_loss": -11.839515686035156, "global_step": 309931, "epoch": 1844} {"train_loss": -11.71169376373291, "global_step": 309932, "epoch": 1844} {"train_loss": -11.825862884521484, "global_step": 309933, "epoch": 1844} {"train_loss": -11.860496520996094, "global_step": 309934, "epoch": 1844} {"train_loss": -11.795358657836914, "global_step": 309935, "epoch": 1844} {"train_loss": -12.039453506469727, "global_step": 309936, "epoch": 1844} {"train_loss": -11.829042434692383, "global_step": 309937, "epoch": 1844} {"train_loss": -11.630470275878906, "global_step": 309938, "epoch": 1844} {"train_loss": -11.997581481933594, "global_step": 309939, "epoch": 1844} {"train_loss": -11.790757179260254, "global_step": 309940, "epoch": 1844} {"train_loss": -11.950326919555664, "global_step": 309941, "epoch": 1844} {"train_loss": -12.033975601196289, "global_step": 309942, "epoch": 1844} {"train_loss": -11.794857025146484, "global_step": 309943, "epoch": 1844} {"train_loss": -11.950827598571777, "global_step": 309944, "epoch": 1844} {"train_loss": -11.84665298461914, "global_step": 309945, "epoch": 1844} {"train_loss": -12.211209297180176, "global_step": 309946, "epoch": 1844} {"train_loss": -11.936525344848633, "global_step": 309947, "epoch": 1844} {"train_loss": -12.143014907836914, "global_step": 309948, "epoch": 1844} {"train_loss": -11.99747085571289, "global_step": 309949, "epoch": 1844} {"train_loss": -12.089690208435059, "global_step": 309950, "epoch": 1844} {"train_loss": -11.934183120727539, "global_step": 309951, "epoch": 1844} {"train_loss": -12.116361618041992, "global_step": 309952, "epoch": 1844} {"train_loss": -12.35308837890625, "global_step": 309953, "epoch": 1844} {"train_loss": -12.202765464782715, "global_step": 309954, "epoch": 1844} {"train_loss": -12.0930814743042, "global_step": 309955, "epoch": 1844} {"train_loss": -12.336862564086914, "global_step": 309956, "epoch": 1844} {"train_loss": -12.344648361206055, "global_step": 309957, "epoch": 1844} {"train_loss": -12.229867935180664, "global_step": 309958, "epoch": 1844} {"train_loss": -11.559859820774623, "global_step": 309959, "epoch": 1844, "val_loss": 283508.90625} {"train_loss": -12.2747802734375, "global_step": 309960, "epoch": 1845} {"train_loss": -12.442975044250488, "global_step": 309961, "epoch": 1845} {"train_loss": -12.209478378295898, "global_step": 309962, "epoch": 1845} {"train_loss": -12.393765449523926, "global_step": 309963, "epoch": 1845} {"train_loss": -12.531791687011719, "global_step": 309964, "epoch": 1845} {"train_loss": -12.516483306884766, "global_step": 309965, "epoch": 1845} {"train_loss": -12.46322250366211, "global_step": 309966, "epoch": 1845} {"train_loss": -12.49239444732666, "global_step": 309967, "epoch": 1845} {"train_loss": -12.453924179077148, "global_step": 309968, "epoch": 1845} {"train_loss": -12.322219848632812, "global_step": 309969, "epoch": 1845} {"train_loss": -12.380924224853516, "global_step": 309970, "epoch": 1845} {"train_loss": -12.160964965820312, "global_step": 309971, "epoch": 1845} {"train_loss": -12.457765579223633, "global_step": 309972, "epoch": 1845} {"train_loss": -12.463533401489258, "global_step": 309973, "epoch": 1845} {"train_loss": -12.458471298217773, "global_step": 309974, "epoch": 1845} {"train_loss": -12.442500114440918, "global_step": 309975, "epoch": 1845} {"train_loss": -12.252681732177734, "global_step": 309976, "epoch": 1845} {"train_loss": -12.388250350952148, "global_step": 309977, "epoch": 1845} {"train_loss": -12.56675910949707, "global_step": 309978, "epoch": 1845} {"train_loss": -12.516085624694824, "global_step": 309979, "epoch": 1845} {"train_loss": -12.65031909942627, "global_step": 309980, "epoch": 1845} {"train_loss": -12.53446102142334, "global_step": 309981, "epoch": 1845} {"train_loss": -12.623488426208496, "global_step": 309982, "epoch": 1845} {"train_loss": -12.399755477905273, "global_step": 309983, "epoch": 1845} {"train_loss": -12.443737030029297, "global_step": 309984, "epoch": 1845} {"train_loss": -12.671504020690918, "global_step": 309985, "epoch": 1845} {"train_loss": -12.513409614562988, "global_step": 309986, "epoch": 1845} {"train_loss": -12.546744346618652, "global_step": 309987, "epoch": 1845} {"train_loss": -12.493169784545898, "global_step": 309988, "epoch": 1845} {"train_loss": -12.565330505371094, "global_step": 309989, "epoch": 1845} {"train_loss": -12.500812530517578, "global_step": 309990, "epoch": 1845} {"train_loss": -12.592790603637695, "global_step": 309991, "epoch": 1845} {"train_loss": -12.622430801391602, "global_step": 309992, "epoch": 1845} {"train_loss": -12.528379440307617, "global_step": 309993, "epoch": 1845} {"train_loss": -12.265951156616211, "global_step": 309994, "epoch": 1845} {"train_loss": -12.557723999023438, "global_step": 309995, "epoch": 1845} {"train_loss": -12.560606002807617, "global_step": 309996, "epoch": 1845} {"train_loss": -12.274295806884766, "global_step": 309997, "epoch": 1845} {"train_loss": -12.539555549621582, "global_step": 309998, "epoch": 1845} {"train_loss": -12.444775581359863, "global_step": 309999, "epoch": 1845} {"train_loss": -12.154178619384766, "global_step": 310000, "epoch": 1845} {"train_loss": -12.317184448242188, "global_step": 310001, "epoch": 1845} {"train_loss": -12.374523162841797, "global_step": 310002, "epoch": 1845} {"train_loss": -11.873777389526367, "global_step": 310003, "epoch": 1845} {"train_loss": -11.818286895751953, "global_step": 310004, "epoch": 1845} {"train_loss": -12.311426162719727, "global_step": 310005, "epoch": 1845} {"train_loss": -12.131961822509766, "global_step": 310006, "epoch": 1845} {"train_loss": -11.85617446899414, "global_step": 310007, "epoch": 1845} {"train_loss": -11.857137680053711, "global_step": 310008, "epoch": 1845} {"train_loss": -11.868795394897461, "global_step": 310009, "epoch": 1845} {"train_loss": -11.677787780761719, "global_step": 310010, "epoch": 1845} {"train_loss": -11.89113998413086, "global_step": 310011, "epoch": 1845} {"train_loss": -12.102350234985352, "global_step": 310012, "epoch": 1845} {"train_loss": -11.459678649902344, "global_step": 310013, "epoch": 1845} {"train_loss": -11.76684284210205, "global_step": 310014, "epoch": 1845} {"train_loss": -11.745622634887695, "global_step": 310015, "epoch": 1845} {"train_loss": -11.553232192993164, "global_step": 310016, "epoch": 1845} {"train_loss": -11.568284034729004, "global_step": 310017, "epoch": 1845} {"train_loss": -12.1670560836792, "global_step": 310018, "epoch": 1845} {"train_loss": -11.013077735900879, "global_step": 310019, "epoch": 1845} {"train_loss": -11.703763008117676, "global_step": 310020, "epoch": 1845} {"train_loss": -11.826745986938477, "global_step": 310021, "epoch": 1845} {"train_loss": -11.43089771270752, "global_step": 310022, "epoch": 1845} {"train_loss": -12.061042785644531, "global_step": 310023, "epoch": 1845} {"train_loss": -10.875025749206543, "global_step": 310024, "epoch": 1845} {"train_loss": -11.717429161071777, "global_step": 310025, "epoch": 1845} {"train_loss": -12.016347885131836, "global_step": 310026, "epoch": 1845} {"train_loss": -11.403223037719727, "global_step": 310027, "epoch": 1845} {"train_loss": -11.59744644165039, "global_step": 310028, "epoch": 1845} {"train_loss": -11.95560073852539, "global_step": 310029, "epoch": 1845} {"train_loss": -11.357738494873047, "global_step": 310030, "epoch": 1845} {"train_loss": -11.525007247924805, "global_step": 310031, "epoch": 1845} {"train_loss": -11.648879051208496, "global_step": 310032, "epoch": 1845} {"train_loss": -11.002918243408203, "global_step": 310033, "epoch": 1845} {"train_loss": -11.529903411865234, "global_step": 310034, "epoch": 1845} {"train_loss": -11.771160125732422, "global_step": 310035, "epoch": 1845} {"train_loss": -11.093953132629395, "global_step": 310036, "epoch": 1845} {"train_loss": -12.131277084350586, "global_step": 310037, "epoch": 1845} {"train_loss": -11.556608200073242, "global_step": 310038, "epoch": 1845} {"train_loss": -11.764811515808105, "global_step": 310039, "epoch": 1845} {"train_loss": -12.050268173217773, "global_step": 310040, "epoch": 1845} {"train_loss": -12.00822639465332, "global_step": 310041, "epoch": 1845} {"train_loss": -11.9549560546875, "global_step": 310042, "epoch": 1845} {"train_loss": -11.779300689697266, "global_step": 310043, "epoch": 1845} {"train_loss": -11.484695434570312, "global_step": 310044, "epoch": 1845} {"train_loss": -11.08773422241211, "global_step": 310045, "epoch": 1845} {"train_loss": -11.59237289428711, "global_step": 310046, "epoch": 1845} {"train_loss": -11.378867149353027, "global_step": 310047, "epoch": 1845} {"train_loss": -10.98270034790039, "global_step": 310048, "epoch": 1845} {"train_loss": -12.06974983215332, "global_step": 310049, "epoch": 1845} {"train_loss": -11.446805953979492, "global_step": 310050, "epoch": 1845} {"train_loss": -11.866795539855957, "global_step": 310051, "epoch": 1845} {"train_loss": -11.773117065429688, "global_step": 310052, "epoch": 1845} {"train_loss": -12.051586151123047, "global_step": 310053, "epoch": 1845} {"train_loss": -11.981330871582031, "global_step": 310054, "epoch": 1845} {"train_loss": -11.854696273803711, "global_step": 310055, "epoch": 1845} {"train_loss": -12.234384536743164, "global_step": 310056, "epoch": 1845} {"train_loss": -12.019577026367188, "global_step": 310057, "epoch": 1845} {"train_loss": -12.160953521728516, "global_step": 310058, "epoch": 1845} {"train_loss": -11.794065475463867, "global_step": 310059, "epoch": 1845} {"train_loss": -11.98742961883545, "global_step": 310060, "epoch": 1845} {"train_loss": -11.995302200317383, "global_step": 310061, "epoch": 1845} {"train_loss": -11.804752349853516, "global_step": 310062, "epoch": 1845} {"train_loss": -12.344261169433594, "global_step": 310063, "epoch": 1845} {"train_loss": -11.791581153869629, "global_step": 310064, "epoch": 1845} {"train_loss": -12.181662559509277, "global_step": 310065, "epoch": 1845} {"train_loss": -12.048309326171875, "global_step": 310066, "epoch": 1845} {"train_loss": -12.092338562011719, "global_step": 310067, "epoch": 1845} {"train_loss": -12.209845542907715, "global_step": 310068, "epoch": 1845} {"train_loss": -11.347558975219727, "global_step": 310069, "epoch": 1845} {"train_loss": -11.531471252441406, "global_step": 310070, "epoch": 1845} {"train_loss": -11.647846221923828, "global_step": 310071, "epoch": 1845} {"train_loss": -12.148313522338867, "global_step": 310072, "epoch": 1845} {"train_loss": -11.816703796386719, "global_step": 310073, "epoch": 1845} {"train_loss": -12.215292930603027, "global_step": 310074, "epoch": 1845} {"train_loss": -11.897823333740234, "global_step": 310075, "epoch": 1845} {"train_loss": -12.447803497314453, "global_step": 310076, "epoch": 1845} {"train_loss": -11.759258270263672, "global_step": 310077, "epoch": 1845} {"train_loss": -12.063071250915527, "global_step": 310078, "epoch": 1845} {"train_loss": -11.76312255859375, "global_step": 310079, "epoch": 1845} {"train_loss": -12.094508171081543, "global_step": 310080, "epoch": 1845} {"train_loss": -12.034614562988281, "global_step": 310081, "epoch": 1845} {"train_loss": -12.009941101074219, "global_step": 310082, "epoch": 1845} {"train_loss": -11.976913452148438, "global_step": 310083, "epoch": 1845} {"train_loss": -11.706559181213379, "global_step": 310084, "epoch": 1845} {"train_loss": -11.488656997680664, "global_step": 310085, "epoch": 1845} {"train_loss": -12.098142623901367, "global_step": 310086, "epoch": 1845} {"train_loss": -11.876811981201172, "global_step": 310087, "epoch": 1845} {"train_loss": -12.11270809173584, "global_step": 310088, "epoch": 1845} {"train_loss": -11.64570426940918, "global_step": 310089, "epoch": 1845} {"train_loss": -12.092508316040039, "global_step": 310090, "epoch": 1845} {"train_loss": -12.095098495483398, "global_step": 310091, "epoch": 1845} {"train_loss": -12.396265029907227, "global_step": 310092, "epoch": 1845} {"train_loss": -11.994037628173828, "global_step": 310093, "epoch": 1845} {"train_loss": -12.389848709106445, "global_step": 310094, "epoch": 1845} {"train_loss": -12.156708717346191, "global_step": 310095, "epoch": 1845} {"train_loss": -12.256957054138184, "global_step": 310096, "epoch": 1845} {"train_loss": -12.37146282196045, "global_step": 310097, "epoch": 1845} {"train_loss": -12.193840026855469, "global_step": 310098, "epoch": 1845} {"train_loss": -12.303934097290039, "global_step": 310099, "epoch": 1845} {"train_loss": -12.291226387023926, "global_step": 310100, "epoch": 1845} {"train_loss": -11.792739868164062, "global_step": 310101, "epoch": 1845} {"train_loss": -12.537721633911133, "global_step": 310102, "epoch": 1845} {"train_loss": -11.734888076782227, "global_step": 310103, "epoch": 1845} {"train_loss": -12.106162071228027, "global_step": 310104, "epoch": 1845} {"train_loss": -11.910921096801758, "global_step": 310105, "epoch": 1845} {"train_loss": -11.074195861816406, "global_step": 310106, "epoch": 1845} {"train_loss": -10.245954513549805, "global_step": 310107, "epoch": 1845} {"train_loss": -10.845870018005371, "global_step": 310108, "epoch": 1845} {"train_loss": -10.779134750366211, "global_step": 310109, "epoch": 1845} {"train_loss": -10.654556274414062, "global_step": 310110, "epoch": 1845} {"train_loss": -11.538190841674805, "global_step": 310111, "epoch": 1845} {"train_loss": -9.708754539489746, "global_step": 310112, "epoch": 1845} {"train_loss": -11.226340293884277, "global_step": 310113, "epoch": 1845} {"train_loss": -10.577921867370605, "global_step": 310114, "epoch": 1845} {"train_loss": -10.285593032836914, "global_step": 310115, "epoch": 1845} {"train_loss": -11.196456909179688, "global_step": 310116, "epoch": 1845} {"train_loss": -10.605393409729004, "global_step": 310117, "epoch": 1845} {"train_loss": -11.283405303955078, "global_step": 310118, "epoch": 1845} {"train_loss": -10.966389656066895, "global_step": 310119, "epoch": 1845} {"train_loss": -10.700563430786133, "global_step": 310120, "epoch": 1845} {"train_loss": -10.539737701416016, "global_step": 310121, "epoch": 1845} {"train_loss": -10.661792755126953, "global_step": 310122, "epoch": 1845} {"train_loss": -10.897960662841797, "global_step": 310123, "epoch": 1845} {"train_loss": -11.452564239501953, "global_step": 310124, "epoch": 1845} {"train_loss": -10.069316864013672, "global_step": 310125, "epoch": 1845} {"train_loss": -11.47555160522461, "global_step": 310126, "epoch": 1845} {"train_loss": -11.865698820068722, "global_step": 310127, "epoch": 1845, "val_loss": 281638.78125, "train_action_mse_error": 0.9711997509002686} {"train_loss": -11.026352882385254, "global_step": 310128, "epoch": 1846} {"train_loss": -10.76901626586914, "global_step": 310129, "epoch": 1846} {"train_loss": -10.644471168518066, "global_step": 310130, "epoch": 1846} {"train_loss": -10.546098709106445, "global_step": 310131, "epoch": 1846} {"train_loss": -10.853816986083984, "global_step": 310132, "epoch": 1846} {"train_loss": -11.423271179199219, "global_step": 310133, "epoch": 1846} {"train_loss": -10.529083251953125, "global_step": 310134, "epoch": 1846} {"train_loss": -11.642309188842773, "global_step": 310135, "epoch": 1846} {"train_loss": -11.563405990600586, "global_step": 310136, "epoch": 1846} {"train_loss": -11.35645866394043, "global_step": 310137, "epoch": 1846} {"train_loss": -12.036948204040527, "global_step": 310138, "epoch": 1846} {"train_loss": -11.338279724121094, "global_step": 310139, "epoch": 1846} {"train_loss": -11.725773811340332, "global_step": 310140, "epoch": 1846} {"train_loss": -11.847423553466797, "global_step": 310141, "epoch": 1846} {"train_loss": -11.622326850891113, "global_step": 310142, "epoch": 1846} {"train_loss": -12.23670482635498, "global_step": 310143, "epoch": 1846} {"train_loss": -12.046570777893066, "global_step": 310144, "epoch": 1846} {"train_loss": -11.965621948242188, "global_step": 310145, "epoch": 1846} {"train_loss": -12.174148559570312, "global_step": 310146, "epoch": 1846} {"train_loss": -11.810492515563965, "global_step": 310147, "epoch": 1846} {"train_loss": -12.134376525878906, "global_step": 310148, "epoch": 1846} {"train_loss": -11.621565818786621, "global_step": 310149, "epoch": 1846} {"train_loss": -12.039726257324219, "global_step": 310150, "epoch": 1846} {"train_loss": -12.069843292236328, "global_step": 310151, "epoch": 1846} {"train_loss": -11.965072631835938, "global_step": 310152, "epoch": 1846} {"train_loss": -12.06256103515625, "global_step": 310153, "epoch": 1846} {"train_loss": -12.276890754699707, "global_step": 310154, "epoch": 1846} {"train_loss": -12.12969970703125, "global_step": 310155, "epoch": 1846} {"train_loss": -12.316755294799805, "global_step": 310156, "epoch": 1846} {"train_loss": -12.08540153503418, "global_step": 310157, "epoch": 1846} {"train_loss": -11.981082916259766, "global_step": 310158, "epoch": 1846} {"train_loss": -12.02315616607666, "global_step": 310159, "epoch": 1846} {"train_loss": -12.19918441772461, "global_step": 310160, "epoch": 1846} {"train_loss": -12.261674880981445, "global_step": 310161, "epoch": 1846} {"train_loss": -12.115232467651367, "global_step": 310162, "epoch": 1846} {"train_loss": -12.059957504272461, "global_step": 310163, "epoch": 1846} {"train_loss": -12.173179626464844, "global_step": 310164, "epoch": 1846} {"train_loss": -12.328754425048828, "global_step": 310165, "epoch": 1846} {"train_loss": -12.074455261230469, "global_step": 310166, "epoch": 1846} {"train_loss": -12.263266563415527, "global_step": 310167, "epoch": 1846} {"train_loss": -12.218120574951172, "global_step": 310168, "epoch": 1846} {"train_loss": -12.098946571350098, "global_step": 310169, "epoch": 1846} {"train_loss": -12.019205093383789, "global_step": 310170, "epoch": 1846} {"train_loss": -12.327619552612305, "global_step": 310171, "epoch": 1846} {"train_loss": -12.17929458618164, "global_step": 310172, "epoch": 1846} {"train_loss": -12.288339614868164, "global_step": 310173, "epoch": 1846} {"train_loss": -12.210556983947754, "global_step": 310174, "epoch": 1846} {"train_loss": -12.348365783691406, "global_step": 310175, "epoch": 1846} {"train_loss": -12.276334762573242, "global_step": 310176, "epoch": 1846} {"train_loss": -12.15633773803711, "global_step": 310177, "epoch": 1846} {"train_loss": -12.599862098693848, "global_step": 310178, "epoch": 1846} {"train_loss": -11.876803398132324, "global_step": 310179, "epoch": 1846} {"train_loss": -12.419349670410156, "global_step": 310180, "epoch": 1846} {"train_loss": -12.278162956237793, "global_step": 310181, "epoch": 1846} {"train_loss": -12.416711807250977, "global_step": 310182, "epoch": 1846} {"train_loss": -12.29429817199707, "global_step": 310183, "epoch": 1846} {"train_loss": -12.245023727416992, "global_step": 310184, "epoch": 1846} {"train_loss": -12.033687591552734, "global_step": 310185, "epoch": 1846} {"train_loss": -12.462871551513672, "global_step": 310186, "epoch": 1846} {"train_loss": -12.139215469360352, "global_step": 310187, "epoch": 1846} {"train_loss": -12.51300048828125, "global_step": 310188, "epoch": 1846} {"train_loss": -12.31043815612793, "global_step": 310189, "epoch": 1846} {"train_loss": -11.627384185791016, "global_step": 310190, "epoch": 1846} {"train_loss": -12.169864654541016, "global_step": 310191, "epoch": 1846} {"train_loss": -12.237895965576172, "global_step": 310192, "epoch": 1846} {"train_loss": -11.779390335083008, "global_step": 310193, "epoch": 1846} {"train_loss": -12.247150421142578, "global_step": 310194, "epoch": 1846} {"train_loss": -11.36944580078125, "global_step": 310195, "epoch": 1846} {"train_loss": -12.170772552490234, "global_step": 310196, "epoch": 1846} {"train_loss": -11.898676872253418, "global_step": 310197, "epoch": 1846} {"train_loss": -11.350696563720703, "global_step": 310198, "epoch": 1846} {"train_loss": -12.371216773986816, "global_step": 310199, "epoch": 1846} {"train_loss": -10.585171699523926, "global_step": 310200, "epoch": 1846} {"train_loss": -11.738086700439453, "global_step": 310201, "epoch": 1846} {"train_loss": -11.929831504821777, "global_step": 310202, "epoch": 1846} {"train_loss": -10.865460395812988, "global_step": 310203, "epoch": 1846} {"train_loss": -11.580971717834473, "global_step": 310204, "epoch": 1846} {"train_loss": -12.093099594116211, "global_step": 310205, "epoch": 1846} {"train_loss": -10.944543838500977, "global_step": 310206, "epoch": 1846} {"train_loss": -11.539205551147461, "global_step": 310207, "epoch": 1846} {"train_loss": -11.422672271728516, "global_step": 310208, "epoch": 1846} {"train_loss": -12.003357887268066, "global_step": 310209, "epoch": 1846} {"train_loss": -11.901914596557617, "global_step": 310210, "epoch": 1846} {"train_loss": -11.493086814880371, "global_step": 310211, "epoch": 1846} {"train_loss": -12.251816749572754, "global_step": 310212, "epoch": 1846} {"train_loss": -11.622108459472656, "global_step": 310213, "epoch": 1846} {"train_loss": -12.313739776611328, "global_step": 310214, "epoch": 1846} {"train_loss": -11.79769515991211, "global_step": 310215, "epoch": 1846} {"train_loss": -11.851066589355469, "global_step": 310216, "epoch": 1846} {"train_loss": -12.159923553466797, "global_step": 310217, "epoch": 1846} {"train_loss": -11.666422843933105, "global_step": 310218, "epoch": 1846} {"train_loss": -11.994625091552734, "global_step": 310219, "epoch": 1846} {"train_loss": -11.724393844604492, "global_step": 310220, "epoch": 1846} {"train_loss": -12.270882606506348, "global_step": 310221, "epoch": 1846} {"train_loss": -11.723478317260742, "global_step": 310222, "epoch": 1846} {"train_loss": -12.04792594909668, "global_step": 310223, "epoch": 1846} {"train_loss": -12.347896575927734, "global_step": 310224, "epoch": 1846} {"train_loss": -12.240556716918945, "global_step": 310225, "epoch": 1846} {"train_loss": -12.362178802490234, "global_step": 310226, "epoch": 1846} {"train_loss": -12.11158561706543, "global_step": 310227, "epoch": 1846} {"train_loss": -12.188852310180664, "global_step": 310228, "epoch": 1846} {"train_loss": -12.170293807983398, "global_step": 310229, "epoch": 1846} {"train_loss": -12.041461944580078, "global_step": 310230, "epoch": 1846} {"train_loss": -12.030981063842773, "global_step": 310231, "epoch": 1846} {"train_loss": -12.2252779006958, "global_step": 310232, "epoch": 1846} {"train_loss": -11.565692901611328, "global_step": 310233, "epoch": 1846} {"train_loss": -11.950422286987305, "global_step": 310234, "epoch": 1846} {"train_loss": -11.476461410522461, "global_step": 310235, "epoch": 1846} {"train_loss": -11.452817916870117, "global_step": 310236, "epoch": 1846} {"train_loss": -10.662485122680664, "global_step": 310237, "epoch": 1846} {"train_loss": -11.529644012451172, "global_step": 310238, "epoch": 1846} {"train_loss": -10.844525337219238, "global_step": 310239, "epoch": 1846} {"train_loss": -11.444263458251953, "global_step": 310240, "epoch": 1846} {"train_loss": -11.60522174835205, "global_step": 310241, "epoch": 1846} {"train_loss": -11.299199104309082, "global_step": 310242, "epoch": 1846} {"train_loss": -11.155342102050781, "global_step": 310243, "epoch": 1846} {"train_loss": -11.96688461303711, "global_step": 310244, "epoch": 1846} {"train_loss": -11.406511306762695, "global_step": 310245, "epoch": 1846} {"train_loss": -12.14616870880127, "global_step": 310246, "epoch": 1846} {"train_loss": -11.865348815917969, "global_step": 310247, "epoch": 1846} {"train_loss": -11.689409255981445, "global_step": 310248, "epoch": 1846} {"train_loss": -12.151105880737305, "global_step": 310249, "epoch": 1846} {"train_loss": -12.044004440307617, "global_step": 310250, "epoch": 1846} {"train_loss": -12.071728706359863, "global_step": 310251, "epoch": 1846} {"train_loss": -11.955561637878418, "global_step": 310252, "epoch": 1846} {"train_loss": -11.915128707885742, "global_step": 310253, "epoch": 1846} {"train_loss": -12.200287818908691, "global_step": 310254, "epoch": 1846} {"train_loss": -12.07872486114502, "global_step": 310255, "epoch": 1846} {"train_loss": -11.97429084777832, "global_step": 310256, "epoch": 1846} {"train_loss": -12.270151138305664, "global_step": 310257, "epoch": 1846} {"train_loss": -12.055676460266113, "global_step": 310258, "epoch": 1846} {"train_loss": -12.282590866088867, "global_step": 310259, "epoch": 1846} {"train_loss": -12.089988708496094, "global_step": 310260, "epoch": 1846} {"train_loss": -11.84829044342041, "global_step": 310261, "epoch": 1846} {"train_loss": -11.904354095458984, "global_step": 310262, "epoch": 1846} {"train_loss": -12.370412826538086, "global_step": 310263, "epoch": 1846} {"train_loss": -12.097818374633789, "global_step": 310264, "epoch": 1846} {"train_loss": -12.465551376342773, "global_step": 310265, "epoch": 1846} {"train_loss": -12.16982650756836, "global_step": 310266, "epoch": 1846} {"train_loss": -12.14195728302002, "global_step": 310267, "epoch": 1846} {"train_loss": -12.11107349395752, "global_step": 310268, "epoch": 1846} {"train_loss": -11.952683448791504, "global_step": 310269, "epoch": 1846} {"train_loss": -12.15397834777832, "global_step": 310270, "epoch": 1846} {"train_loss": -11.821662902832031, "global_step": 310271, "epoch": 1846} {"train_loss": -11.4697265625, "global_step": 310272, "epoch": 1846} {"train_loss": -11.80602741241455, "global_step": 310273, "epoch": 1846} {"train_loss": -11.441766738891602, "global_step": 310274, "epoch": 1846} {"train_loss": -11.264739990234375, "global_step": 310275, "epoch": 1846} {"train_loss": -11.754638671875, "global_step": 310276, "epoch": 1846} {"train_loss": -10.450069427490234, "global_step": 310277, "epoch": 1846} {"train_loss": -11.776152610778809, "global_step": 310278, "epoch": 1846} {"train_loss": -11.502289772033691, "global_step": 310279, "epoch": 1846} {"train_loss": -11.531168937683105, "global_step": 310280, "epoch": 1846} {"train_loss": -11.869723320007324, "global_step": 310281, "epoch": 1846} {"train_loss": -11.431596755981445, "global_step": 310282, "epoch": 1846} {"train_loss": -10.974424362182617, "global_step": 310283, "epoch": 1846} {"train_loss": -11.975198745727539, "global_step": 310284, "epoch": 1846} {"train_loss": -11.411043167114258, "global_step": 310285, "epoch": 1846} {"train_loss": -11.47023868560791, "global_step": 310286, "epoch": 1846} {"train_loss": -11.9346342086792, "global_step": 310287, "epoch": 1846} {"train_loss": -11.40726375579834, "global_step": 310288, "epoch": 1846} {"train_loss": -12.221883773803711, "global_step": 310289, "epoch": 1846} {"train_loss": -11.725204467773438, "global_step": 310290, "epoch": 1846} {"train_loss": -11.812593460083008, "global_step": 310291, "epoch": 1846} {"train_loss": -11.38158130645752, "global_step": 310292, "epoch": 1846} {"train_loss": -11.669419288635254, "global_step": 310293, "epoch": 1846} {"train_loss": -11.689839363098145, "global_step": 310294, "epoch": 1846} {"train_loss": -11.854159752527872, "global_step": 310295, "epoch": 1846, "val_loss": 284280.0} {"train_loss": -10.710248947143555, "global_step": 310296, "epoch": 1847} {"train_loss": -11.777933120727539, "global_step": 310297, "epoch": 1847} {"train_loss": -11.093634605407715, "global_step": 310298, "epoch": 1847} {"train_loss": -11.175243377685547, "global_step": 310299, "epoch": 1847} {"train_loss": -11.589909553527832, "global_step": 310300, "epoch": 1847} {"train_loss": -11.122536659240723, "global_step": 310301, "epoch": 1847} {"train_loss": -11.992340087890625, "global_step": 310302, "epoch": 1847} {"train_loss": -11.406944274902344, "global_step": 310303, "epoch": 1847} {"train_loss": -12.114526748657227, "global_step": 310304, "epoch": 1847} {"train_loss": -11.501700401306152, "global_step": 310305, "epoch": 1847} {"train_loss": -11.981876373291016, "global_step": 310306, "epoch": 1847} {"train_loss": -11.885501861572266, "global_step": 310307, "epoch": 1847} {"train_loss": -12.000452041625977, "global_step": 310308, "epoch": 1847} {"train_loss": -12.041900634765625, "global_step": 310309, "epoch": 1847} {"train_loss": -12.044236183166504, "global_step": 310310, "epoch": 1847} {"train_loss": -11.98743724822998, "global_step": 310311, "epoch": 1847} {"train_loss": -12.019268989562988, "global_step": 310312, "epoch": 1847} {"train_loss": -11.979301452636719, "global_step": 310313, "epoch": 1847} {"train_loss": -12.022991180419922, "global_step": 310314, "epoch": 1847} {"train_loss": -12.057000160217285, "global_step": 310315, "epoch": 1847} {"train_loss": -12.175529479980469, "global_step": 310316, "epoch": 1847} {"train_loss": -12.128138542175293, "global_step": 310317, "epoch": 1847} {"train_loss": -11.998506546020508, "global_step": 310318, "epoch": 1847} {"train_loss": -12.201211929321289, "global_step": 310319, "epoch": 1847} {"train_loss": -12.004414558410645, "global_step": 310320, "epoch": 1847} {"train_loss": -12.130343437194824, "global_step": 310321, "epoch": 1847} {"train_loss": -12.204580307006836, "global_step": 310322, "epoch": 1847} {"train_loss": -12.29116153717041, "global_step": 310323, "epoch": 1847} {"train_loss": -12.379782676696777, "global_step": 310324, "epoch": 1847} {"train_loss": -12.164285659790039, "global_step": 310325, "epoch": 1847} {"train_loss": -11.790895462036133, "global_step": 310326, "epoch": 1847} {"train_loss": -12.38770580291748, "global_step": 310327, "epoch": 1847} {"train_loss": -12.090986251831055, "global_step": 310328, "epoch": 1847} {"train_loss": -12.387340545654297, "global_step": 310329, "epoch": 1847} {"train_loss": -12.361515045166016, "global_step": 310330, "epoch": 1847} {"train_loss": -12.272272109985352, "global_step": 310331, "epoch": 1847} {"train_loss": -12.295822143554688, "global_step": 310332, "epoch": 1847} {"train_loss": -12.124983787536621, "global_step": 310333, "epoch": 1847} {"train_loss": -12.151659965515137, "global_step": 310334, "epoch": 1847} {"train_loss": -12.234795570373535, "global_step": 310335, "epoch": 1847} {"train_loss": -12.19774341583252, "global_step": 310336, "epoch": 1847} {"train_loss": -12.255189895629883, "global_step": 310337, "epoch": 1847} {"train_loss": -12.25935173034668, "global_step": 310338, "epoch": 1847} {"train_loss": -12.273788452148438, "global_step": 310339, "epoch": 1847} {"train_loss": -12.020952224731445, "global_step": 310340, "epoch": 1847} {"train_loss": -12.167181968688965, "global_step": 310341, "epoch": 1847} {"train_loss": -12.181437492370605, "global_step": 310342, "epoch": 1847} {"train_loss": -12.290879249572754, "global_step": 310343, "epoch": 1847} {"train_loss": -12.396775245666504, "global_step": 310344, "epoch": 1847} {"train_loss": -12.582996368408203, "global_step": 310345, "epoch": 1847} {"train_loss": -12.245606422424316, "global_step": 310346, "epoch": 1847} {"train_loss": -12.523712158203125, "global_step": 310347, "epoch": 1847} {"train_loss": -12.398492813110352, "global_step": 310348, "epoch": 1847} {"train_loss": -12.366077423095703, "global_step": 310349, "epoch": 1847} {"train_loss": -12.320354461669922, "global_step": 310350, "epoch": 1847} {"train_loss": -12.372539520263672, "global_step": 310351, "epoch": 1847} {"train_loss": -12.439648628234863, "global_step": 310352, "epoch": 1847} {"train_loss": -12.539106369018555, "global_step": 310353, "epoch": 1847} {"train_loss": -12.351236343383789, "global_step": 310354, "epoch": 1847} {"train_loss": -12.314913749694824, "global_step": 310355, "epoch": 1847} {"train_loss": -12.522969245910645, "global_step": 310356, "epoch": 1847} {"train_loss": -12.237852096557617, "global_step": 310357, "epoch": 1847} {"train_loss": -12.175077438354492, "global_step": 310358, "epoch": 1847} {"train_loss": -12.428245544433594, "global_step": 310359, "epoch": 1847} {"train_loss": -12.281698226928711, "global_step": 310360, "epoch": 1847} {"train_loss": -12.00560188293457, "global_step": 310361, "epoch": 1847} {"train_loss": -12.078258514404297, "global_step": 310362, "epoch": 1847} {"train_loss": -12.123799324035645, "global_step": 310363, "epoch": 1847} {"train_loss": -11.337729454040527, "global_step": 310364, "epoch": 1847} {"train_loss": -12.2766752243042, "global_step": 310365, "epoch": 1847} {"train_loss": -12.107054710388184, "global_step": 310366, "epoch": 1847} {"train_loss": -10.579867362976074, "global_step": 310367, "epoch": 1847} {"train_loss": -12.212438583374023, "global_step": 310368, "epoch": 1847} {"train_loss": -11.242193222045898, "global_step": 310369, "epoch": 1847} {"train_loss": -10.311708450317383, "global_step": 310370, "epoch": 1847} {"train_loss": -11.61189079284668, "global_step": 310371, "epoch": 1847} {"train_loss": -9.275491714477539, "global_step": 310372, "epoch": 1847} {"train_loss": -9.205310821533203, "global_step": 310373, "epoch": 1847} {"train_loss": -8.256847381591797, "global_step": 310374, "epoch": 1847} {"train_loss": -8.990723609924316, "global_step": 310375, "epoch": 1847} {"train_loss": -9.898128509521484, "global_step": 310376, "epoch": 1847} {"train_loss": -10.842613220214844, "global_step": 310377, "epoch": 1847} {"train_loss": -9.057558059692383, "global_step": 310378, "epoch": 1847} {"train_loss": -10.258111953735352, "global_step": 310379, "epoch": 1847} {"train_loss": -10.91556167602539, "global_step": 310380, "epoch": 1847} {"train_loss": -10.227864265441895, "global_step": 310381, "epoch": 1847} {"train_loss": -10.615306854248047, "global_step": 310382, "epoch": 1847} {"train_loss": -11.484639167785645, "global_step": 310383, "epoch": 1847} {"train_loss": -10.241684913635254, "global_step": 310384, "epoch": 1847} {"train_loss": -9.855988502502441, "global_step": 310385, "epoch": 1847} {"train_loss": -10.450611114501953, "global_step": 310386, "epoch": 1847} {"train_loss": -10.547000885009766, "global_step": 310387, "epoch": 1847} {"train_loss": -9.559810638427734, "global_step": 310388, "epoch": 1847} {"train_loss": -9.841777801513672, "global_step": 310389, "epoch": 1847} {"train_loss": -9.498042106628418, "global_step": 310390, "epoch": 1847} {"train_loss": -10.978902816772461, "global_step": 310391, "epoch": 1847} {"train_loss": -9.444745063781738, "global_step": 310392, "epoch": 1847} {"train_loss": -10.044113159179688, "global_step": 310393, "epoch": 1847} {"train_loss": -10.900206565856934, "global_step": 310394, "epoch": 1847} {"train_loss": -10.766838073730469, "global_step": 310395, "epoch": 1847} {"train_loss": -10.674485206604004, "global_step": 310396, "epoch": 1847} {"train_loss": -10.757062911987305, "global_step": 310397, "epoch": 1847} {"train_loss": -10.545424461364746, "global_step": 310398, "epoch": 1847} {"train_loss": -10.631452560424805, "global_step": 310399, "epoch": 1847} {"train_loss": -10.655393600463867, "global_step": 310400, "epoch": 1847} {"train_loss": -10.926146507263184, "global_step": 310401, "epoch": 1847} {"train_loss": -11.381863594055176, "global_step": 310402, "epoch": 1847} {"train_loss": -10.895610809326172, "global_step": 310403, "epoch": 1847} {"train_loss": -11.275331497192383, "global_step": 310404, "epoch": 1847} {"train_loss": -11.429654121398926, "global_step": 310405, "epoch": 1847} {"train_loss": -11.58796501159668, "global_step": 310406, "epoch": 1847} {"train_loss": -10.93314266204834, "global_step": 310407, "epoch": 1847} {"train_loss": -11.534261703491211, "global_step": 310408, "epoch": 1847} {"train_loss": -11.14157485961914, "global_step": 310409, "epoch": 1847} {"train_loss": -11.702424049377441, "global_step": 310410, "epoch": 1847} {"train_loss": -11.124349594116211, "global_step": 310411, "epoch": 1847} {"train_loss": -11.526819229125977, "global_step": 310412, "epoch": 1847} {"train_loss": -11.55935001373291, "global_step": 310413, "epoch": 1847} {"train_loss": -11.521939277648926, "global_step": 310414, "epoch": 1847} {"train_loss": -11.591047286987305, "global_step": 310415, "epoch": 1847} {"train_loss": -11.659619331359863, "global_step": 310416, "epoch": 1847} {"train_loss": -11.256263732910156, "global_step": 310417, "epoch": 1847} {"train_loss": -11.212833404541016, "global_step": 310418, "epoch": 1847} {"train_loss": -11.581098556518555, "global_step": 310419, "epoch": 1847} {"train_loss": -11.092580795288086, "global_step": 310420, "epoch": 1847} {"train_loss": -11.625631332397461, "global_step": 310421, "epoch": 1847} {"train_loss": -11.291338920593262, "global_step": 310422, "epoch": 1847} {"train_loss": -11.663432121276855, "global_step": 310423, "epoch": 1847} {"train_loss": -11.34937858581543, "global_step": 310424, "epoch": 1847} {"train_loss": -11.631217956542969, "global_step": 310425, "epoch": 1847} {"train_loss": -11.818952560424805, "global_step": 310426, "epoch": 1847} {"train_loss": -11.474992752075195, "global_step": 310427, "epoch": 1847} {"train_loss": -11.345972061157227, "global_step": 310428, "epoch": 1847} {"train_loss": -11.912020683288574, "global_step": 310429, "epoch": 1847} {"train_loss": -11.464778900146484, "global_step": 310430, "epoch": 1847} {"train_loss": -11.629609107971191, "global_step": 310431, "epoch": 1847} {"train_loss": -11.659059524536133, "global_step": 310432, "epoch": 1847} {"train_loss": -11.66650390625, "global_step": 310433, "epoch": 1847} {"train_loss": -11.526329040527344, "global_step": 310434, "epoch": 1847} {"train_loss": -11.493282318115234, "global_step": 310435, "epoch": 1847} {"train_loss": -11.93283462524414, "global_step": 310436, "epoch": 1847} {"train_loss": -11.375059127807617, "global_step": 310437, "epoch": 1847} {"train_loss": -12.130866050720215, "global_step": 310438, "epoch": 1847} {"train_loss": -11.761819839477539, "global_step": 310439, "epoch": 1847} {"train_loss": -11.220003128051758, "global_step": 310440, "epoch": 1847} {"train_loss": -11.999711036682129, "global_step": 310441, "epoch": 1847} {"train_loss": -11.214555740356445, "global_step": 310442, "epoch": 1847} {"train_loss": -11.588241577148438, "global_step": 310443, "epoch": 1847} {"train_loss": -11.8812255859375, "global_step": 310444, "epoch": 1847} {"train_loss": -11.200697898864746, "global_step": 310445, "epoch": 1847} {"train_loss": -11.492773056030273, "global_step": 310446, "epoch": 1847} {"train_loss": -11.970155715942383, "global_step": 310447, "epoch": 1847} {"train_loss": -11.668706893920898, "global_step": 310448, "epoch": 1847} {"train_loss": -12.009119033813477, "global_step": 310449, "epoch": 1847} {"train_loss": -11.907930374145508, "global_step": 310450, "epoch": 1847} {"train_loss": -11.38429069519043, "global_step": 310451, "epoch": 1847} {"train_loss": -12.014944076538086, "global_step": 310452, "epoch": 1847} {"train_loss": -11.854755401611328, "global_step": 310453, "epoch": 1847} {"train_loss": -11.85203742980957, "global_step": 310454, "epoch": 1847} {"train_loss": -11.922259330749512, "global_step": 310455, "epoch": 1847} {"train_loss": -12.07735824584961, "global_step": 310456, "epoch": 1847} {"train_loss": -12.020781517028809, "global_step": 310457, "epoch": 1847} {"train_loss": -11.907353401184082, "global_step": 310458, "epoch": 1847} {"train_loss": -12.188650131225586, "global_step": 310459, "epoch": 1847} {"train_loss": -11.99691390991211, "global_step": 310460, "epoch": 1847} {"train_loss": -12.19739818572998, "global_step": 310461, "epoch": 1847} {"train_loss": -12.092551231384277, "global_step": 310462, "epoch": 1847} {"train_loss": -11.548794723692394, "global_step": 310463, "epoch": 1847, "val_loss": 279649.46875} {"train_loss": -12.13491153717041, "global_step": 310464, "epoch": 1848} {"train_loss": -12.37930679321289, "global_step": 310465, "epoch": 1848} {"train_loss": -12.260533332824707, "global_step": 310466, "epoch": 1848} {"train_loss": -12.13750171661377, "global_step": 310467, "epoch": 1848} {"train_loss": -12.226663589477539, "global_step": 310468, "epoch": 1848} {"train_loss": -12.164351463317871, "global_step": 310469, "epoch": 1848} {"train_loss": -12.299139976501465, "global_step": 310470, "epoch": 1848} {"train_loss": -11.964677810668945, "global_step": 310471, "epoch": 1848} {"train_loss": -12.13326644897461, "global_step": 310472, "epoch": 1848} {"train_loss": -12.215456008911133, "global_step": 310473, "epoch": 1848} {"train_loss": -12.292856216430664, "global_step": 310474, "epoch": 1848} {"train_loss": -11.922289848327637, "global_step": 310475, "epoch": 1848} {"train_loss": -12.17856502532959, "global_step": 310476, "epoch": 1848} {"train_loss": -12.194580078125, "global_step": 310477, "epoch": 1848} {"train_loss": -12.17823314666748, "global_step": 310478, "epoch": 1848} {"train_loss": -12.537410736083984, "global_step": 310479, "epoch": 1848} {"train_loss": -12.020358085632324, "global_step": 310480, "epoch": 1848} {"train_loss": -12.192415237426758, "global_step": 310481, "epoch": 1848} {"train_loss": -12.213996887207031, "global_step": 310482, "epoch": 1848} {"train_loss": -12.025644302368164, "global_step": 310483, "epoch": 1848} {"train_loss": -12.218990325927734, "global_step": 310484, "epoch": 1848} {"train_loss": -11.80343246459961, "global_step": 310485, "epoch": 1848} {"train_loss": -12.027936935424805, "global_step": 310486, "epoch": 1848} {"train_loss": -11.905173301696777, "global_step": 310487, "epoch": 1848} {"train_loss": -12.139068603515625, "global_step": 310488, "epoch": 1848} {"train_loss": -11.611061096191406, "global_step": 310489, "epoch": 1848} {"train_loss": -11.877485275268555, "global_step": 310490, "epoch": 1848} {"train_loss": -12.387811660766602, "global_step": 310491, "epoch": 1848} {"train_loss": -11.913434982299805, "global_step": 310492, "epoch": 1848} {"train_loss": -12.02421760559082, "global_step": 310493, "epoch": 1848} {"train_loss": -12.071067810058594, "global_step": 310494, "epoch": 1848} {"train_loss": -12.313116073608398, "global_step": 310495, "epoch": 1848} {"train_loss": -12.159727096557617, "global_step": 310496, "epoch": 1848} {"train_loss": -12.29986572265625, "global_step": 310497, "epoch": 1848} {"train_loss": -12.427706718444824, "global_step": 310498, "epoch": 1848} {"train_loss": -12.07122802734375, "global_step": 310499, "epoch": 1848} {"train_loss": -12.355026245117188, "global_step": 310500, "epoch": 1848} {"train_loss": -12.279561996459961, "global_step": 310501, "epoch": 1848} {"train_loss": -12.464038848876953, "global_step": 310502, "epoch": 1848} {"train_loss": -12.33741569519043, "global_step": 310503, "epoch": 1848} {"train_loss": -12.196144104003906, "global_step": 310504, "epoch": 1848} {"train_loss": -12.223371505737305, "global_step": 310505, "epoch": 1848} {"train_loss": -12.453937530517578, "global_step": 310506, "epoch": 1848} {"train_loss": -12.530691146850586, "global_step": 310507, "epoch": 1848} {"train_loss": -12.421307563781738, "global_step": 310508, "epoch": 1848} {"train_loss": -12.386375427246094, "global_step": 310509, "epoch": 1848} {"train_loss": -12.415199279785156, "global_step": 310510, "epoch": 1848} {"train_loss": -12.461380004882812, "global_step": 310511, "epoch": 1848} {"train_loss": -12.38257122039795, "global_step": 310512, "epoch": 1848} {"train_loss": -12.504741668701172, "global_step": 310513, "epoch": 1848} {"train_loss": -12.438932418823242, "global_step": 310514, "epoch": 1848} {"train_loss": -12.653881072998047, "global_step": 310515, "epoch": 1848} {"train_loss": -12.289787292480469, "global_step": 310516, "epoch": 1848} {"train_loss": -12.43759822845459, "global_step": 310517, "epoch": 1848} {"train_loss": -12.366089820861816, "global_step": 310518, "epoch": 1848} {"train_loss": -12.492582321166992, "global_step": 310519, "epoch": 1848} {"train_loss": -12.460750579833984, "global_step": 310520, "epoch": 1848} {"train_loss": -12.288778305053711, "global_step": 310521, "epoch": 1848} {"train_loss": -11.951620101928711, "global_step": 310522, "epoch": 1848} {"train_loss": -12.006939888000488, "global_step": 310523, "epoch": 1848} {"train_loss": -12.370011329650879, "global_step": 310524, "epoch": 1848} {"train_loss": -12.316511154174805, "global_step": 310525, "epoch": 1848} {"train_loss": -11.578575134277344, "global_step": 310526, "epoch": 1848} {"train_loss": -10.718082427978516, "global_step": 310527, "epoch": 1848} {"train_loss": -9.676513671875, "global_step": 310528, "epoch": 1848} {"train_loss": -11.626359939575195, "global_step": 310529, "epoch": 1848} {"train_loss": -8.720330238342285, "global_step": 310530, "epoch": 1848} {"train_loss": -10.489837646484375, "global_step": 310531, "epoch": 1848} {"train_loss": -9.059549331665039, "global_step": 310532, "epoch": 1848} {"train_loss": -11.459896087646484, "global_step": 310533, "epoch": 1848} {"train_loss": -10.874828338623047, "global_step": 310534, "epoch": 1848} {"train_loss": -9.806142807006836, "global_step": 310535, "epoch": 1848} {"train_loss": -11.862241744995117, "global_step": 310536, "epoch": 1848} {"train_loss": -11.408975601196289, "global_step": 310537, "epoch": 1848} {"train_loss": -10.642304420471191, "global_step": 310538, "epoch": 1848} {"train_loss": -10.679313659667969, "global_step": 310539, "epoch": 1848} {"train_loss": -11.783013343811035, "global_step": 310540, "epoch": 1848} {"train_loss": -9.997196197509766, "global_step": 310541, "epoch": 1848} {"train_loss": -11.07534408569336, "global_step": 310542, "epoch": 1848} {"train_loss": -9.543290138244629, "global_step": 310543, "epoch": 1848} {"train_loss": -11.09370231628418, "global_step": 310544, "epoch": 1848} {"train_loss": -9.718913078308105, "global_step": 310545, "epoch": 1848} {"train_loss": -10.29709529876709, "global_step": 310546, "epoch": 1848} {"train_loss": -10.16236686706543, "global_step": 310547, "epoch": 1848} {"train_loss": -9.774123191833496, "global_step": 310548, "epoch": 1848} {"train_loss": -8.7584228515625, "global_step": 310549, "epoch": 1848} {"train_loss": -9.275972366333008, "global_step": 310550, "epoch": 1848} {"train_loss": -10.969158172607422, "global_step": 310551, "epoch": 1848} {"train_loss": -8.88224983215332, "global_step": 310552, "epoch": 1848} {"train_loss": -7.381037712097168, "global_step": 310553, "epoch": 1848} {"train_loss": -10.111506462097168, "global_step": 310554, "epoch": 1848} {"train_loss": -9.381088256835938, "global_step": 310555, "epoch": 1848} {"train_loss": -9.714736938476562, "global_step": 310556, "epoch": 1848} {"train_loss": -8.811984062194824, "global_step": 310557, "epoch": 1848} {"train_loss": -10.696496963500977, "global_step": 310558, "epoch": 1848} {"train_loss": -8.84292984008789, "global_step": 310559, "epoch": 1848} {"train_loss": -9.1756591796875, "global_step": 310560, "epoch": 1848} {"train_loss": -11.055295944213867, "global_step": 310561, "epoch": 1848} {"train_loss": -9.805648803710938, "global_step": 310562, "epoch": 1848} {"train_loss": -10.481795310974121, "global_step": 310563, "epoch": 1848} {"train_loss": -10.708056449890137, "global_step": 310564, "epoch": 1848} {"train_loss": -10.357168197631836, "global_step": 310565, "epoch": 1848} {"train_loss": -11.441091537475586, "global_step": 310566, "epoch": 1848} {"train_loss": -10.415863037109375, "global_step": 310567, "epoch": 1848} {"train_loss": -10.897115707397461, "global_step": 310568, "epoch": 1848} {"train_loss": -10.87693977355957, "global_step": 310569, "epoch": 1848} {"train_loss": -10.962728500366211, "global_step": 310570, "epoch": 1848} {"train_loss": -11.038265228271484, "global_step": 310571, "epoch": 1848} {"train_loss": -11.327007293701172, "global_step": 310572, "epoch": 1848} {"train_loss": -11.518787384033203, "global_step": 310573, "epoch": 1848} {"train_loss": -11.078344345092773, "global_step": 310574, "epoch": 1848} {"train_loss": -11.460886001586914, "global_step": 310575, "epoch": 1848} {"train_loss": -11.443544387817383, "global_step": 310576, "epoch": 1848} {"train_loss": -11.43648910522461, "global_step": 310577, "epoch": 1848} {"train_loss": -11.954062461853027, "global_step": 310578, "epoch": 1848} {"train_loss": -11.621366500854492, "global_step": 310579, "epoch": 1848} {"train_loss": -11.646617889404297, "global_step": 310580, "epoch": 1848} {"train_loss": -12.05204963684082, "global_step": 310581, "epoch": 1848} {"train_loss": -11.62563419342041, "global_step": 310582, "epoch": 1848} {"train_loss": -11.996301651000977, "global_step": 310583, "epoch": 1848} {"train_loss": -11.686370849609375, "global_step": 310584, "epoch": 1848} {"train_loss": -11.69257926940918, "global_step": 310585, "epoch": 1848} {"train_loss": -11.564208984375, "global_step": 310586, "epoch": 1848} {"train_loss": -12.007654190063477, "global_step": 310587, "epoch": 1848} {"train_loss": -11.761369705200195, "global_step": 310588, "epoch": 1848} {"train_loss": -11.778498649597168, "global_step": 310589, "epoch": 1848} {"train_loss": -11.838391304016113, "global_step": 310590, "epoch": 1848} {"train_loss": -11.97432804107666, "global_step": 310591, "epoch": 1848} {"train_loss": -12.13723373413086, "global_step": 310592, "epoch": 1848} {"train_loss": -11.908366203308105, "global_step": 310593, "epoch": 1848} {"train_loss": -12.068771362304688, "global_step": 310594, "epoch": 1848} {"train_loss": -12.082887649536133, "global_step": 310595, "epoch": 1848} {"train_loss": -11.981032371520996, "global_step": 310596, "epoch": 1848} {"train_loss": -12.064842224121094, "global_step": 310597, "epoch": 1848} {"train_loss": -12.058172225952148, "global_step": 310598, "epoch": 1848} {"train_loss": -11.982874870300293, "global_step": 310599, "epoch": 1848} {"train_loss": -12.026969909667969, "global_step": 310600, "epoch": 1848} {"train_loss": -11.964822769165039, "global_step": 310601, "epoch": 1848} {"train_loss": -11.958471298217773, "global_step": 310602, "epoch": 1848} {"train_loss": -12.062541007995605, "global_step": 310603, "epoch": 1848} {"train_loss": -12.184280395507812, "global_step": 310604, "epoch": 1848} {"train_loss": -12.031736373901367, "global_step": 310605, "epoch": 1848} {"train_loss": -12.086406707763672, "global_step": 310606, "epoch": 1848} {"train_loss": -12.122008323669434, "global_step": 310607, "epoch": 1848} {"train_loss": -12.288591384887695, "global_step": 310608, "epoch": 1848} {"train_loss": -12.30893325805664, "global_step": 310609, "epoch": 1848} {"train_loss": -12.08541202545166, "global_step": 310610, "epoch": 1848} {"train_loss": -12.112075805664062, "global_step": 310611, "epoch": 1848} {"train_loss": -12.43138313293457, "global_step": 310612, "epoch": 1848} {"train_loss": -12.313277244567871, "global_step": 310613, "epoch": 1848} {"train_loss": -12.389250755310059, "global_step": 310614, "epoch": 1848} {"train_loss": -12.253150939941406, "global_step": 310615, "epoch": 1848} {"train_loss": -12.149259567260742, "global_step": 310616, "epoch": 1848} {"train_loss": -12.047285079956055, "global_step": 310617, "epoch": 1848} {"train_loss": -12.322031021118164, "global_step": 310618, "epoch": 1848} {"train_loss": -11.875617980957031, "global_step": 310619, "epoch": 1848} {"train_loss": -12.05169677734375, "global_step": 310620, "epoch": 1848} {"train_loss": -12.166815757751465, "global_step": 310621, "epoch": 1848} {"train_loss": -12.333024978637695, "global_step": 310622, "epoch": 1848} {"train_loss": -12.135852813720703, "global_step": 310623, "epoch": 1848} {"train_loss": -12.027542114257812, "global_step": 310624, "epoch": 1848} {"train_loss": -11.948248863220215, "global_step": 310625, "epoch": 1848} {"train_loss": -12.307147979736328, "global_step": 310626, "epoch": 1848} {"train_loss": -11.837362289428711, "global_step": 310627, "epoch": 1848} {"train_loss": -12.103097915649414, "global_step": 310628, "epoch": 1848} {"train_loss": -12.205639839172363, "global_step": 310629, "epoch": 1848} {"train_loss": -12.173489570617676, "global_step": 310630, "epoch": 1848} {"train_loss": -11.596399278867812, "global_step": 310631, "epoch": 1848, "val_loss": 279666.40625} {"train_loss": -12.22486686706543, "global_step": 310632, "epoch": 1849} {"train_loss": -11.96449089050293, "global_step": 310633, "epoch": 1849} {"train_loss": -12.38178825378418, "global_step": 310634, "epoch": 1849} {"train_loss": -12.265155792236328, "global_step": 310635, "epoch": 1849} {"train_loss": -12.200077056884766, "global_step": 310636, "epoch": 1849} {"train_loss": -11.928888320922852, "global_step": 310637, "epoch": 1849} {"train_loss": -12.444818496704102, "global_step": 310638, "epoch": 1849} {"train_loss": -11.602925300598145, "global_step": 310639, "epoch": 1849} {"train_loss": -11.855615615844727, "global_step": 310640, "epoch": 1849} {"train_loss": -11.744865417480469, "global_step": 310641, "epoch": 1849} {"train_loss": -11.905865669250488, "global_step": 310642, "epoch": 1849} {"train_loss": -12.10537338256836, "global_step": 310643, "epoch": 1849} {"train_loss": -12.009546279907227, "global_step": 310644, "epoch": 1849} {"train_loss": -12.103230476379395, "global_step": 310645, "epoch": 1849} {"train_loss": -12.227038383483887, "global_step": 310646, "epoch": 1849} {"train_loss": -12.10430908203125, "global_step": 310647, "epoch": 1849} {"train_loss": -12.100170135498047, "global_step": 310648, "epoch": 1849} {"train_loss": -11.91804027557373, "global_step": 310649, "epoch": 1849} {"train_loss": -12.25220775604248, "global_step": 310650, "epoch": 1849} {"train_loss": -11.959611892700195, "global_step": 310651, "epoch": 1849} {"train_loss": -12.287253379821777, "global_step": 310652, "epoch": 1849} {"train_loss": -11.852278709411621, "global_step": 310653, "epoch": 1849} {"train_loss": -11.967206954956055, "global_step": 310654, "epoch": 1849} {"train_loss": -12.064298629760742, "global_step": 310655, "epoch": 1849} {"train_loss": -11.624807357788086, "global_step": 310656, "epoch": 1849} {"train_loss": -12.512267112731934, "global_step": 310657, "epoch": 1849} {"train_loss": -11.976900100708008, "global_step": 310658, "epoch": 1849} {"train_loss": -12.264344215393066, "global_step": 310659, "epoch": 1849} {"train_loss": -12.154394149780273, "global_step": 310660, "epoch": 1849} {"train_loss": -12.316274642944336, "global_step": 310661, "epoch": 1849} {"train_loss": -12.368851661682129, "global_step": 310662, "epoch": 1849} {"train_loss": -12.250505447387695, "global_step": 310663, "epoch": 1849} {"train_loss": -12.155841827392578, "global_step": 310664, "epoch": 1849} {"train_loss": -12.07152271270752, "global_step": 310665, "epoch": 1849} {"train_loss": -12.384908676147461, "global_step": 310666, "epoch": 1849} {"train_loss": -12.158917427062988, "global_step": 310667, "epoch": 1849} {"train_loss": -12.124077796936035, "global_step": 310668, "epoch": 1849} {"train_loss": -11.746819496154785, "global_step": 310669, "epoch": 1849} {"train_loss": -11.234987258911133, "global_step": 310670, "epoch": 1849} {"train_loss": -9.13290023803711, "global_step": 310671, "epoch": 1849} {"train_loss": -11.095317840576172, "global_step": 310672, "epoch": 1849} {"train_loss": -8.64217758178711, "global_step": 310673, "epoch": 1849} {"train_loss": -9.04508113861084, "global_step": 310674, "epoch": 1849} {"train_loss": -7.773292064666748, "global_step": 310675, "epoch": 1849} {"train_loss": -10.20376968383789, "global_step": 310676, "epoch": 1849} {"train_loss": -8.643478393554688, "global_step": 310677, "epoch": 1849} {"train_loss": -9.439252853393555, "global_step": 310678, "epoch": 1849} {"train_loss": -6.354925632476807, "global_step": 310679, "epoch": 1849} {"train_loss": -6.390405654907227, "global_step": 310680, "epoch": 1849} {"train_loss": -7.017171859741211, "global_step": 310681, "epoch": 1849} {"train_loss": -7.839577674865723, "global_step": 310682, "epoch": 1849} {"train_loss": -7.252796173095703, "global_step": 310683, "epoch": 1849} {"train_loss": -8.046865463256836, "global_step": 310684, "epoch": 1849} {"train_loss": -8.585208892822266, "global_step": 310685, "epoch": 1849} {"train_loss": -9.100354194641113, "global_step": 310686, "epoch": 1849} {"train_loss": -6.995602130889893, "global_step": 310687, "epoch": 1849} {"train_loss": -8.49428939819336, "global_step": 310688, "epoch": 1849} {"train_loss": -7.473694801330566, "global_step": 310689, "epoch": 1849} {"train_loss": -8.580924987792969, "global_step": 310690, "epoch": 1849} {"train_loss": -8.928877830505371, "global_step": 310691, "epoch": 1849} {"train_loss": -9.052753448486328, "global_step": 310692, "epoch": 1849} {"train_loss": -9.55406665802002, "global_step": 310693, "epoch": 1849} {"train_loss": -9.806561470031738, "global_step": 310694, "epoch": 1849} {"train_loss": -10.40178108215332, "global_step": 310695, "epoch": 1849} {"train_loss": -10.063531875610352, "global_step": 310696, "epoch": 1849} {"train_loss": -9.67367172241211, "global_step": 310697, "epoch": 1849} {"train_loss": -10.30649185180664, "global_step": 310698, "epoch": 1849} {"train_loss": -10.43090534210205, "global_step": 310699, "epoch": 1849} {"train_loss": -10.099846839904785, "global_step": 310700, "epoch": 1849} {"train_loss": -10.689308166503906, "global_step": 310701, "epoch": 1849} {"train_loss": -10.734048843383789, "global_step": 310702, "epoch": 1849} {"train_loss": -10.896982192993164, "global_step": 310703, "epoch": 1849} {"train_loss": -11.167137145996094, "global_step": 310704, "epoch": 1849} {"train_loss": -11.034387588500977, "global_step": 310705, "epoch": 1849} {"train_loss": -11.070241928100586, "global_step": 310706, "epoch": 1849} {"train_loss": -11.350259780883789, "global_step": 310707, "epoch": 1849} {"train_loss": -11.044487953186035, "global_step": 310708, "epoch": 1849} {"train_loss": -11.14013671875, "global_step": 310709, "epoch": 1849} {"train_loss": -11.159900665283203, "global_step": 310710, "epoch": 1849} {"train_loss": -11.219383239746094, "global_step": 310711, "epoch": 1849} {"train_loss": -11.035901069641113, "global_step": 310712, "epoch": 1849} {"train_loss": -11.308160781860352, "global_step": 310713, "epoch": 1849} {"train_loss": -11.188819885253906, "global_step": 310714, "epoch": 1849} {"train_loss": -11.386853218078613, "global_step": 310715, "epoch": 1849} {"train_loss": -11.353392601013184, "global_step": 310716, "epoch": 1849} {"train_loss": -11.333685874938965, "global_step": 310717, "epoch": 1849} {"train_loss": -10.909886360168457, "global_step": 310718, "epoch": 1849} {"train_loss": -10.7389554977417, "global_step": 310719, "epoch": 1849} {"train_loss": -11.527212142944336, "global_step": 310720, "epoch": 1849} {"train_loss": -11.60313606262207, "global_step": 310721, "epoch": 1849} {"train_loss": -11.465164184570312, "global_step": 310722, "epoch": 1849} {"train_loss": -11.430831909179688, "global_step": 310723, "epoch": 1849} {"train_loss": -11.663032531738281, "global_step": 310724, "epoch": 1849} {"train_loss": -11.403068542480469, "global_step": 310725, "epoch": 1849} {"train_loss": -11.95367431640625, "global_step": 310726, "epoch": 1849} {"train_loss": -11.49532699584961, "global_step": 310727, "epoch": 1849} {"train_loss": -11.673807144165039, "global_step": 310728, "epoch": 1849} {"train_loss": -11.840415000915527, "global_step": 310729, "epoch": 1849} {"train_loss": -11.636688232421875, "global_step": 310730, "epoch": 1849} {"train_loss": -11.924674034118652, "global_step": 310731, "epoch": 1849} {"train_loss": -11.720579147338867, "global_step": 310732, "epoch": 1849} {"train_loss": -12.021531105041504, "global_step": 310733, "epoch": 1849} {"train_loss": -11.789738655090332, "global_step": 310734, "epoch": 1849} {"train_loss": -11.808298110961914, "global_step": 310735, "epoch": 1849} {"train_loss": -11.913862228393555, "global_step": 310736, "epoch": 1849} {"train_loss": -11.52672290802002, "global_step": 310737, "epoch": 1849} {"train_loss": -11.89037036895752, "global_step": 310738, "epoch": 1849} {"train_loss": -11.962335586547852, "global_step": 310739, "epoch": 1849} {"train_loss": -11.970159530639648, "global_step": 310740, "epoch": 1849} {"train_loss": -12.015305519104004, "global_step": 310741, "epoch": 1849} {"train_loss": -12.048883438110352, "global_step": 310742, "epoch": 1849} {"train_loss": -12.035475730895996, "global_step": 310743, "epoch": 1849} {"train_loss": -11.929930686950684, "global_step": 310744, "epoch": 1849} {"train_loss": -12.060171127319336, "global_step": 310745, "epoch": 1849} {"train_loss": -11.69608211517334, "global_step": 310746, "epoch": 1849} {"train_loss": -11.848686218261719, "global_step": 310747, "epoch": 1849} {"train_loss": -11.86967658996582, "global_step": 310748, "epoch": 1849} {"train_loss": -11.999444007873535, "global_step": 310749, "epoch": 1849} {"train_loss": -12.134050369262695, "global_step": 310750, "epoch": 1849} {"train_loss": -12.050140380859375, "global_step": 310751, "epoch": 1849} {"train_loss": -12.08759593963623, "global_step": 310752, "epoch": 1849} {"train_loss": -12.160948753356934, "global_step": 310753, "epoch": 1849} {"train_loss": -11.941892623901367, "global_step": 310754, "epoch": 1849} {"train_loss": -11.952165603637695, "global_step": 310755, "epoch": 1849} {"train_loss": -11.893802642822266, "global_step": 310756, "epoch": 1849} {"train_loss": -12.000054359436035, "global_step": 310757, "epoch": 1849} {"train_loss": -12.014572143554688, "global_step": 310758, "epoch": 1849} {"train_loss": -11.862529754638672, "global_step": 310759, "epoch": 1849} {"train_loss": -12.294901847839355, "global_step": 310760, "epoch": 1849} {"train_loss": -12.283061981201172, "global_step": 310761, "epoch": 1849} {"train_loss": -12.220235824584961, "global_step": 310762, "epoch": 1849} {"train_loss": -12.163941383361816, "global_step": 310763, "epoch": 1849} {"train_loss": -12.11717414855957, "global_step": 310764, "epoch": 1849} {"train_loss": -12.313761711120605, "global_step": 310765, "epoch": 1849} {"train_loss": -12.264280319213867, "global_step": 310766, "epoch": 1849} {"train_loss": -12.196037292480469, "global_step": 310767, "epoch": 1849} {"train_loss": -12.22035026550293, "global_step": 310768, "epoch": 1849} {"train_loss": -12.345621109008789, "global_step": 310769, "epoch": 1849} {"train_loss": -12.078277587890625, "global_step": 310770, "epoch": 1849} {"train_loss": -12.473442077636719, "global_step": 310771, "epoch": 1849} {"train_loss": -12.228109359741211, "global_step": 310772, "epoch": 1849} {"train_loss": -12.270660400390625, "global_step": 310773, "epoch": 1849} {"train_loss": -12.343957901000977, "global_step": 310774, "epoch": 1849} {"train_loss": -12.075087547302246, "global_step": 310775, "epoch": 1849} {"train_loss": -12.288331031799316, "global_step": 310776, "epoch": 1849} {"train_loss": -11.980486869812012, "global_step": 310777, "epoch": 1849} {"train_loss": -11.829233169555664, "global_step": 310778, "epoch": 1849} {"train_loss": -11.882560729980469, "global_step": 310779, "epoch": 1849} {"train_loss": -11.710857391357422, "global_step": 310780, "epoch": 1849} {"train_loss": -12.515445709228516, "global_step": 310781, "epoch": 1849} {"train_loss": -11.886346817016602, "global_step": 310782, "epoch": 1849} {"train_loss": -11.792840003967285, "global_step": 310783, "epoch": 1849} {"train_loss": -12.201969146728516, "global_step": 310784, "epoch": 1849} {"train_loss": -11.306720733642578, "global_step": 310785, "epoch": 1849} {"train_loss": -12.210811614990234, "global_step": 310786, "epoch": 1849} {"train_loss": -11.886258125305176, "global_step": 310787, "epoch": 1849} {"train_loss": -11.984586715698242, "global_step": 310788, "epoch": 1849} {"train_loss": -12.306941986083984, "global_step": 310789, "epoch": 1849} {"train_loss": -11.915645599365234, "global_step": 310790, "epoch": 1849} {"train_loss": -12.234861373901367, "global_step": 310791, "epoch": 1849} {"train_loss": -11.934104919433594, "global_step": 310792, "epoch": 1849} {"train_loss": -11.740161895751953, "global_step": 310793, "epoch": 1849} {"train_loss": -12.30411434173584, "global_step": 310794, "epoch": 1849} {"train_loss": -11.631609916687012, "global_step": 310795, "epoch": 1849} {"train_loss": -12.207605361938477, "global_step": 310796, "epoch": 1849} {"train_loss": -11.914909362792969, "global_step": 310797, "epoch": 1849} {"train_loss": -12.366188049316406, "global_step": 310798, "epoch": 1849} {"train_loss": -11.332451902684712, "global_step": 310799, "epoch": 1849, "val_loss": 276737.21875} {"train_loss": -12.145319938659668, "global_step": 310800, "epoch": 1850} {"train_loss": -12.361549377441406, "global_step": 310801, "epoch": 1850} {"train_loss": -12.030573844909668, "global_step": 310802, "epoch": 1850} {"train_loss": -11.937071800231934, "global_step": 310803, "epoch": 1850} {"train_loss": -12.184179306030273, "global_step": 310804, "epoch": 1850} {"train_loss": -12.03964614868164, "global_step": 310805, "epoch": 1850} {"train_loss": -11.435752868652344, "global_step": 310806, "epoch": 1850} {"train_loss": -11.966285705566406, "global_step": 310807, "epoch": 1850} {"train_loss": -11.726791381835938, "global_step": 310808, "epoch": 1850} {"train_loss": -11.095258712768555, "global_step": 310809, "epoch": 1850} {"train_loss": -11.955991744995117, "global_step": 310810, "epoch": 1850} {"train_loss": -11.677337646484375, "global_step": 310811, "epoch": 1850} {"train_loss": -11.078218460083008, "global_step": 310812, "epoch": 1850} {"train_loss": -11.48432731628418, "global_step": 310813, "epoch": 1850} {"train_loss": -11.343497276306152, "global_step": 310814, "epoch": 1850} {"train_loss": -11.895212173461914, "global_step": 310815, "epoch": 1850} {"train_loss": -11.890883445739746, "global_step": 310816, "epoch": 1850} {"train_loss": -11.186317443847656, "global_step": 310817, "epoch": 1850} {"train_loss": -11.581612586975098, "global_step": 310818, "epoch": 1850} {"train_loss": -11.709467887878418, "global_step": 310819, "epoch": 1850} {"train_loss": -11.791606903076172, "global_step": 310820, "epoch": 1850} {"train_loss": -11.291102409362793, "global_step": 310821, "epoch": 1850} {"train_loss": -9.911901473999023, "global_step": 310822, "epoch": 1850} {"train_loss": -9.816741943359375, "global_step": 310823, "epoch": 1850} {"train_loss": -10.795759201049805, "global_step": 310824, "epoch": 1850} {"train_loss": -10.551572799682617, "global_step": 310825, "epoch": 1850} {"train_loss": -10.619436264038086, "global_step": 310826, "epoch": 1850} {"train_loss": -9.864720344543457, "global_step": 310827, "epoch": 1850} {"train_loss": -11.459166526794434, "global_step": 310828, "epoch": 1850} {"train_loss": -9.882356643676758, "global_step": 310829, "epoch": 1850} {"train_loss": -10.01327896118164, "global_step": 310830, "epoch": 1850} {"train_loss": -11.130088806152344, "global_step": 310831, "epoch": 1850} {"train_loss": -10.592216491699219, "global_step": 310832, "epoch": 1850} {"train_loss": -11.213578224182129, "global_step": 310833, "epoch": 1850} {"train_loss": -11.085119247436523, "global_step": 310834, "epoch": 1850} {"train_loss": -10.894974708557129, "global_step": 310835, "epoch": 1850} {"train_loss": -11.03822135925293, "global_step": 310836, "epoch": 1850} {"train_loss": -11.494192123413086, "global_step": 310837, "epoch": 1850} {"train_loss": -10.210956573486328, "global_step": 310838, "epoch": 1850} {"train_loss": -11.339529037475586, "global_step": 310839, "epoch": 1850} {"train_loss": -10.5174560546875, "global_step": 310840, "epoch": 1850} {"train_loss": -11.38322639465332, "global_step": 310841, "epoch": 1850} {"train_loss": -10.490509033203125, "global_step": 310842, "epoch": 1850} {"train_loss": -11.422785758972168, "global_step": 310843, "epoch": 1850} {"train_loss": -11.142048835754395, "global_step": 310844, "epoch": 1850} {"train_loss": -11.00347900390625, "global_step": 310845, "epoch": 1850} {"train_loss": -11.597291946411133, "global_step": 310846, "epoch": 1850} {"train_loss": -10.853426933288574, "global_step": 310847, "epoch": 1850} {"train_loss": -11.64558219909668, "global_step": 310848, "epoch": 1850} {"train_loss": -10.437541961669922, "global_step": 310849, "epoch": 1850} {"train_loss": -11.752044677734375, "global_step": 310850, "epoch": 1850} {"train_loss": -11.057767868041992, "global_step": 310851, "epoch": 1850} {"train_loss": -11.670384407043457, "global_step": 310852, "epoch": 1850} {"train_loss": -11.048843383789062, "global_step": 310853, "epoch": 1850} {"train_loss": -11.311535835266113, "global_step": 310854, "epoch": 1850} {"train_loss": -10.783726692199707, "global_step": 310855, "epoch": 1850} {"train_loss": -11.292869567871094, "global_step": 310856, "epoch": 1850} {"train_loss": -10.802324295043945, "global_step": 310857, "epoch": 1850} {"train_loss": -11.570640563964844, "global_step": 310858, "epoch": 1850} {"train_loss": -10.996163368225098, "global_step": 310859, "epoch": 1850} {"train_loss": -11.30525016784668, "global_step": 310860, "epoch": 1850} {"train_loss": -10.731237411499023, "global_step": 310861, "epoch": 1850} {"train_loss": -10.82684326171875, "global_step": 310862, "epoch": 1850} {"train_loss": -11.21953010559082, "global_step": 310863, "epoch": 1850} {"train_loss": -11.434442520141602, "global_step": 310864, "epoch": 1850} {"train_loss": -11.163983345031738, "global_step": 310865, "epoch": 1850} {"train_loss": -11.089969635009766, "global_step": 310866, "epoch": 1850} {"train_loss": -11.532352447509766, "global_step": 310867, "epoch": 1850} {"train_loss": -11.410940170288086, "global_step": 310868, "epoch": 1850} {"train_loss": -11.609014511108398, "global_step": 310869, "epoch": 1850} {"train_loss": -11.577007293701172, "global_step": 310870, "epoch": 1850} {"train_loss": -11.553345680236816, "global_step": 310871, "epoch": 1850} {"train_loss": -11.704851150512695, "global_step": 310872, "epoch": 1850} {"train_loss": -11.788402557373047, "global_step": 310873, "epoch": 1850} {"train_loss": -11.50101089477539, "global_step": 310874, "epoch": 1850} {"train_loss": -11.638513565063477, "global_step": 310875, "epoch": 1850} {"train_loss": -11.587911605834961, "global_step": 310876, "epoch": 1850} {"train_loss": -11.815704345703125, "global_step": 310877, "epoch": 1850} {"train_loss": -11.91098403930664, "global_step": 310878, "epoch": 1850} {"train_loss": -11.857837677001953, "global_step": 310879, "epoch": 1850} {"train_loss": -11.878823280334473, "global_step": 310880, "epoch": 1850} {"train_loss": -12.023269653320312, "global_step": 310881, "epoch": 1850} {"train_loss": -11.716885566711426, "global_step": 310882, "epoch": 1850} {"train_loss": -11.973247528076172, "global_step": 310883, "epoch": 1850} {"train_loss": -12.121265411376953, "global_step": 310884, "epoch": 1850} {"train_loss": -12.08615779876709, "global_step": 310885, "epoch": 1850} {"train_loss": -12.060738563537598, "global_step": 310886, "epoch": 1850} {"train_loss": -12.12720775604248, "global_step": 310887, "epoch": 1850} {"train_loss": -11.735764503479004, "global_step": 310888, "epoch": 1850} {"train_loss": -11.969230651855469, "global_step": 310889, "epoch": 1850} {"train_loss": -11.930892944335938, "global_step": 310890, "epoch": 1850} {"train_loss": -12.107806205749512, "global_step": 310891, "epoch": 1850} {"train_loss": -12.162849426269531, "global_step": 310892, "epoch": 1850} {"train_loss": -11.794962882995605, "global_step": 310893, "epoch": 1850} {"train_loss": -12.075450897216797, "global_step": 310894, "epoch": 1850} {"train_loss": -12.237171173095703, "global_step": 310895, "epoch": 1850} {"train_loss": -12.250883102416992, "global_step": 310896, "epoch": 1850} {"train_loss": -12.203372955322266, "global_step": 310897, "epoch": 1850} {"train_loss": -12.177999496459961, "global_step": 310898, "epoch": 1850} {"train_loss": -12.080232620239258, "global_step": 310899, "epoch": 1850} {"train_loss": -12.21742057800293, "global_step": 310900, "epoch": 1850} {"train_loss": -12.252302169799805, "global_step": 310901, "epoch": 1850} {"train_loss": -12.207157135009766, "global_step": 310902, "epoch": 1850} {"train_loss": -12.032564163208008, "global_step": 310903, "epoch": 1850} {"train_loss": -12.146690368652344, "global_step": 310904, "epoch": 1850} {"train_loss": -12.180245399475098, "global_step": 310905, "epoch": 1850} {"train_loss": -12.361934661865234, "global_step": 310906, "epoch": 1850} {"train_loss": -12.259465217590332, "global_step": 310907, "epoch": 1850} {"train_loss": -12.201435089111328, "global_step": 310908, "epoch": 1850} {"train_loss": -12.283098220825195, "global_step": 310909, "epoch": 1850} {"train_loss": -12.188908576965332, "global_step": 310910, "epoch": 1850} {"train_loss": -12.345579147338867, "global_step": 310911, "epoch": 1850} {"train_loss": -12.216217041015625, "global_step": 310912, "epoch": 1850} {"train_loss": -12.179903030395508, "global_step": 310913, "epoch": 1850} {"train_loss": -12.206869125366211, "global_step": 310914, "epoch": 1850} {"train_loss": -12.272076606750488, "global_step": 310915, "epoch": 1850} {"train_loss": -12.397616386413574, "global_step": 310916, "epoch": 1850} {"train_loss": -12.025524139404297, "global_step": 310917, "epoch": 1850} {"train_loss": -12.298118591308594, "global_step": 310918, "epoch": 1850} {"train_loss": -12.147590637207031, "global_step": 310919, "epoch": 1850} {"train_loss": -12.455848693847656, "global_step": 310920, "epoch": 1850} {"train_loss": -12.3317232131958, "global_step": 310921, "epoch": 1850} {"train_loss": -12.501214027404785, "global_step": 310922, "epoch": 1850} {"train_loss": -12.391738891601562, "global_step": 310923, "epoch": 1850} {"train_loss": -12.154369354248047, "global_step": 310924, "epoch": 1850} {"train_loss": -12.188294410705566, "global_step": 310925, "epoch": 1850} {"train_loss": -12.51361083984375, "global_step": 310926, "epoch": 1850} {"train_loss": -12.400657653808594, "global_step": 310927, "epoch": 1850} {"train_loss": -12.461211204528809, "global_step": 310928, "epoch": 1850} {"train_loss": -12.421770095825195, "global_step": 310929, "epoch": 1850} {"train_loss": -12.4578857421875, "global_step": 310930, "epoch": 1850} {"train_loss": -12.231170654296875, "global_step": 310931, "epoch": 1850} {"train_loss": -12.471563339233398, "global_step": 310932, "epoch": 1850} {"train_loss": -12.386308670043945, "global_step": 310933, "epoch": 1850} {"train_loss": -12.438997268676758, "global_step": 310934, "epoch": 1850} {"train_loss": -12.309869766235352, "global_step": 310935, "epoch": 1850} {"train_loss": -12.396926879882812, "global_step": 310936, "epoch": 1850} {"train_loss": -12.332362174987793, "global_step": 310937, "epoch": 1850} {"train_loss": -12.370792388916016, "global_step": 310938, "epoch": 1850} {"train_loss": -12.186454772949219, "global_step": 310939, "epoch": 1850} {"train_loss": -12.461824417114258, "global_step": 310940, "epoch": 1850} {"train_loss": -12.26452922821045, "global_step": 310941, "epoch": 1850} {"train_loss": -12.153440475463867, "global_step": 310942, "epoch": 1850} {"train_loss": -12.020120620727539, "global_step": 310943, "epoch": 1850} {"train_loss": -12.177630424499512, "global_step": 310944, "epoch": 1850} {"train_loss": -12.314859390258789, "global_step": 310945, "epoch": 1850} {"train_loss": -12.298849105834961, "global_step": 310946, "epoch": 1850} {"train_loss": -12.220349311828613, "global_step": 310947, "epoch": 1850} {"train_loss": -11.71079158782959, "global_step": 310948, "epoch": 1850} {"train_loss": -11.014374732971191, "global_step": 310949, "epoch": 1850} {"train_loss": -11.261285781860352, "global_step": 310950, "epoch": 1850} {"train_loss": -12.141058921813965, "global_step": 310951, "epoch": 1850} {"train_loss": -11.683774948120117, "global_step": 310952, "epoch": 1850} {"train_loss": -12.154243469238281, "global_step": 310953, "epoch": 1850} {"train_loss": -11.738990783691406, "global_step": 310954, "epoch": 1850} {"train_loss": -12.257518768310547, "global_step": 310955, "epoch": 1850} {"train_loss": -11.719856262207031, "global_step": 310956, "epoch": 1850} {"train_loss": -11.543692588806152, "global_step": 310957, "epoch": 1850} {"train_loss": -11.325407981872559, "global_step": 310958, "epoch": 1850} {"train_loss": -10.995124816894531, "global_step": 310959, "epoch": 1850} {"train_loss": -11.726627349853516, "global_step": 310960, "epoch": 1850} {"train_loss": -11.543121337890625, "global_step": 310961, "epoch": 1850} {"train_loss": -11.964935302734375, "global_step": 310962, "epoch": 1850} {"train_loss": -11.957489013671875, "global_step": 310963, "epoch": 1850} {"train_loss": -11.87550163269043, "global_step": 310964, "epoch": 1850} {"train_loss": -11.833053588867188, "global_step": 310965, "epoch": 1850} {"train_loss": -11.716872215270996, "global_step": 310966, "epoch": 1850} {"train_loss": -11.70321402095613, "global_step": 310967, "epoch": 1850, "train/sim_max_reward_0": 0.5509494960518223, "train/sim_max_reward_1": 0.983593718294306, "train/sim_max_reward_2": 0.00667194960286843, "train/sim_max_reward_3": 0.30027961676303394, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.7246044936284646, "test/sim_max_reward_4400000": 0.9753321157373068, "test/sim_max_reward_4400001": 0.42640684636923043, "test/sim_max_reward_4400002": 0.9925204102445616, "test/sim_max_reward_4400003": 0.07871374581788795, "test/sim_max_reward_4400004": 0.5909918715841277, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 0.9603475720877283, "test/sim_max_reward_4400007": 0.983687899584717, "test/sim_max_reward_4400008": 0.5843266611643847, "test/sim_max_reward_4400009": 0.448833156700655, "test/sim_max_reward_4400010": 0.9660444554366294, "test/sim_max_reward_4400011": 0.9909540224798741, "test/sim_max_reward_4400012": 0.9515283680160802, "test/sim_max_reward_4400013": 0.9485939497150417, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 0.9902174424101706, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.1192029135656554, "test/sim_max_reward_4400018": 0.9628328125541529, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.6979766509796717, "test/sim_max_reward_4400022": 0.9666563787050862, "test/sim_max_reward_4400023": 0.13876733800905225, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.703766190179998, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.17142414629354574, "test/sim_max_reward_4400028": 1.0, "test/sim_max_reward_4400029": 0.4077095486749391, "test/sim_max_reward_4400030": 0.9943640772461774, "test/sim_max_reward_4400031": 0.9649982115555988, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.5471620501077582, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.9787276885849191, "test/sim_max_reward_4400036": 0.3733477565670756, "test/sim_max_reward_4400037": 0.9695436772526459, "test/sim_max_reward_4400038": 0.31261384191462116, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.14460901111289867, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.9639382106899561, "test/sim_max_reward_4400044": 0.5782914938473734, "test/sim_max_reward_4400045": 0.4479713637605107, "test/sim_max_reward_4400046": 1.0, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.5943498790567492, "test/mean_score": 0.5768492637925146, "val_loss": 282420.1875, "train_action_mse_error": 1.5812366008758545} {"train_loss": -10.839319229125977, "global_step": 310968, "epoch": 1851} {"train_loss": -11.835232734680176, "global_step": 310969, "epoch": 1851} {"train_loss": -10.936624526977539, "global_step": 310970, "epoch": 1851} {"train_loss": -11.74793529510498, "global_step": 310971, "epoch": 1851} {"train_loss": -11.277711868286133, "global_step": 310972, "epoch": 1851} {"train_loss": -11.959290504455566, "global_step": 310973, "epoch": 1851} {"train_loss": -11.372007369995117, "global_step": 310974, "epoch": 1851} {"train_loss": -11.814220428466797, "global_step": 310975, "epoch": 1851} {"train_loss": -11.400157928466797, "global_step": 310976, "epoch": 1851} {"train_loss": -11.575603485107422, "global_step": 310977, "epoch": 1851} {"train_loss": -11.13758659362793, "global_step": 310978, "epoch": 1851} {"train_loss": -11.595032691955566, "global_step": 310979, "epoch": 1851} {"train_loss": -11.788484573364258, "global_step": 310980, "epoch": 1851} {"train_loss": -11.312682151794434, "global_step": 310981, "epoch": 1851} {"train_loss": -11.709232330322266, "global_step": 310982, "epoch": 1851} {"train_loss": -10.626999855041504, "global_step": 310983, "epoch": 1851} {"train_loss": -11.191030502319336, "global_step": 310984, "epoch": 1851} {"train_loss": -10.700408935546875, "global_step": 310985, "epoch": 1851} {"train_loss": -11.63447093963623, "global_step": 310986, "epoch": 1851} {"train_loss": -11.20786190032959, "global_step": 310987, "epoch": 1851} {"train_loss": -11.617122650146484, "global_step": 310988, "epoch": 1851} {"train_loss": -11.51002311706543, "global_step": 310989, "epoch": 1851} {"train_loss": -11.477283477783203, "global_step": 310990, "epoch": 1851} {"train_loss": -12.091514587402344, "global_step": 310991, "epoch": 1851} {"train_loss": -11.607059478759766, "global_step": 310992, "epoch": 1851} {"train_loss": -11.664834022521973, "global_step": 310993, "epoch": 1851} {"train_loss": -11.247703552246094, "global_step": 310994, "epoch": 1851} {"train_loss": -11.030342102050781, "global_step": 310995, "epoch": 1851} {"train_loss": -11.06413745880127, "global_step": 310996, "epoch": 1851} {"train_loss": -11.030069351196289, "global_step": 310997, "epoch": 1851} {"train_loss": -11.256860733032227, "global_step": 310998, "epoch": 1851} {"train_loss": -11.562395095825195, "global_step": 310999, "epoch": 1851} {"train_loss": -10.762112617492676, "global_step": 311000, "epoch": 1851} {"train_loss": -10.673219680786133, "global_step": 311001, "epoch": 1851} {"train_loss": -10.571739196777344, "global_step": 311002, "epoch": 1851} {"train_loss": -9.706249237060547, "global_step": 311003, "epoch": 1851} {"train_loss": -11.639127731323242, "global_step": 311004, "epoch": 1851} {"train_loss": -9.4564208984375, "global_step": 311005, "epoch": 1851} {"train_loss": -10.942508697509766, "global_step": 311006, "epoch": 1851} {"train_loss": -11.146408081054688, "global_step": 311007, "epoch": 1851} {"train_loss": -10.688833236694336, "global_step": 311008, "epoch": 1851} {"train_loss": -10.795633316040039, "global_step": 311009, "epoch": 1851} {"train_loss": -11.778416633605957, "global_step": 311010, "epoch": 1851} {"train_loss": -10.555639266967773, "global_step": 311011, "epoch": 1851} {"train_loss": -11.231588363647461, "global_step": 311012, "epoch": 1851} {"train_loss": -10.57710075378418, "global_step": 311013, "epoch": 1851} {"train_loss": -11.203838348388672, "global_step": 311014, "epoch": 1851} {"train_loss": -11.375263214111328, "global_step": 311015, "epoch": 1851} {"train_loss": -11.463626861572266, "global_step": 311016, "epoch": 1851} {"train_loss": -10.76268196105957, "global_step": 311017, "epoch": 1851} {"train_loss": -12.007570266723633, "global_step": 311018, "epoch": 1851} {"train_loss": -11.32581615447998, "global_step": 311019, "epoch": 1851} {"train_loss": -11.7633638381958, "global_step": 311020, "epoch": 1851} {"train_loss": -11.34586238861084, "global_step": 311021, "epoch": 1851} {"train_loss": -11.849571228027344, "global_step": 311022, "epoch": 1851} {"train_loss": -11.617165565490723, "global_step": 311023, "epoch": 1851} {"train_loss": -11.909219741821289, "global_step": 311024, "epoch": 1851} {"train_loss": -11.932459831237793, "global_step": 311025, "epoch": 1851} {"train_loss": -11.787406921386719, "global_step": 311026, "epoch": 1851} {"train_loss": -12.045318603515625, "global_step": 311027, "epoch": 1851} {"train_loss": -12.004596710205078, "global_step": 311028, "epoch": 1851} {"train_loss": -11.989557266235352, "global_step": 311029, "epoch": 1851} {"train_loss": -12.044536590576172, "global_step": 311030, "epoch": 1851} {"train_loss": -12.007087707519531, "global_step": 311031, "epoch": 1851} {"train_loss": -12.108438491821289, "global_step": 311032, "epoch": 1851} {"train_loss": -11.866525650024414, "global_step": 311033, "epoch": 1851} {"train_loss": -11.680097579956055, "global_step": 311034, "epoch": 1851} {"train_loss": -11.914350509643555, "global_step": 311035, "epoch": 1851} {"train_loss": -11.87450122833252, "global_step": 311036, "epoch": 1851} {"train_loss": -11.94294261932373, "global_step": 311037, "epoch": 1851} {"train_loss": -11.71007251739502, "global_step": 311038, "epoch": 1851} {"train_loss": -11.814727783203125, "global_step": 311039, "epoch": 1851} {"train_loss": -12.077155113220215, "global_step": 311040, "epoch": 1851} {"train_loss": -11.692447662353516, "global_step": 311041, "epoch": 1851} {"train_loss": -12.091314315795898, "global_step": 311042, "epoch": 1851} {"train_loss": -11.85793685913086, "global_step": 311043, "epoch": 1851} {"train_loss": -12.253623962402344, "global_step": 311044, "epoch": 1851} {"train_loss": -12.08336067199707, "global_step": 311045, "epoch": 1851} {"train_loss": -12.028160095214844, "global_step": 311046, "epoch": 1851} {"train_loss": -12.1934814453125, "global_step": 311047, "epoch": 1851} {"train_loss": -11.999445915222168, "global_step": 311048, "epoch": 1851} {"train_loss": -11.792978286743164, "global_step": 311049, "epoch": 1851} {"train_loss": -11.899039268493652, "global_step": 311050, "epoch": 1851} {"train_loss": -12.113740921020508, "global_step": 311051, "epoch": 1851} {"train_loss": -11.809270858764648, "global_step": 311052, "epoch": 1851} {"train_loss": -12.361010551452637, "global_step": 311053, "epoch": 1851} {"train_loss": -11.53265380859375, "global_step": 311054, "epoch": 1851} {"train_loss": -12.194683074951172, "global_step": 311055, "epoch": 1851} {"train_loss": -11.676000595092773, "global_step": 311056, "epoch": 1851} {"train_loss": -12.191225051879883, "global_step": 311057, "epoch": 1851} {"train_loss": -11.907641410827637, "global_step": 311058, "epoch": 1851} {"train_loss": -12.113256454467773, "global_step": 311059, "epoch": 1851} {"train_loss": -12.160176277160645, "global_step": 311060, "epoch": 1851} {"train_loss": -12.008223533630371, "global_step": 311061, "epoch": 1851} {"train_loss": -12.339432716369629, "global_step": 311062, "epoch": 1851} {"train_loss": -11.809687614440918, "global_step": 311063, "epoch": 1851} {"train_loss": -12.382854461669922, "global_step": 311064, "epoch": 1851} {"train_loss": -11.959293365478516, "global_step": 311065, "epoch": 1851} {"train_loss": -12.261874198913574, "global_step": 311066, "epoch": 1851} {"train_loss": -12.334482192993164, "global_step": 311067, "epoch": 1851} {"train_loss": -12.329647064208984, "global_step": 311068, "epoch": 1851} {"train_loss": -12.389873504638672, "global_step": 311069, "epoch": 1851} {"train_loss": -12.251346588134766, "global_step": 311070, "epoch": 1851} {"train_loss": -12.092437744140625, "global_step": 311071, "epoch": 1851} {"train_loss": -12.339299201965332, "global_step": 311072, "epoch": 1851} {"train_loss": -12.146722793579102, "global_step": 311073, "epoch": 1851} {"train_loss": -12.093019485473633, "global_step": 311074, "epoch": 1851} {"train_loss": -12.363290786743164, "global_step": 311075, "epoch": 1851} {"train_loss": -12.261962890625, "global_step": 311076, "epoch": 1851} {"train_loss": -12.303750991821289, "global_step": 311077, "epoch": 1851} {"train_loss": -12.19784164428711, "global_step": 311078, "epoch": 1851} {"train_loss": -12.311318397521973, "global_step": 311079, "epoch": 1851} {"train_loss": -12.400344848632812, "global_step": 311080, "epoch": 1851} {"train_loss": -12.502923965454102, "global_step": 311081, "epoch": 1851} {"train_loss": -12.27726936340332, "global_step": 311082, "epoch": 1851} {"train_loss": -12.338785171508789, "global_step": 311083, "epoch": 1851} {"train_loss": -12.436676025390625, "global_step": 311084, "epoch": 1851} {"train_loss": -12.290910720825195, "global_step": 311085, "epoch": 1851} {"train_loss": -12.247659683227539, "global_step": 311086, "epoch": 1851} {"train_loss": -11.872297286987305, "global_step": 311087, "epoch": 1851} {"train_loss": -12.189638137817383, "global_step": 311088, "epoch": 1851} {"train_loss": -12.346025466918945, "global_step": 311089, "epoch": 1851} {"train_loss": -12.41954231262207, "global_step": 311090, "epoch": 1851} {"train_loss": -12.152389526367188, "global_step": 311091, "epoch": 1851} {"train_loss": -12.4693021774292, "global_step": 311092, "epoch": 1851} {"train_loss": -12.060007095336914, "global_step": 311093, "epoch": 1851} {"train_loss": -12.256425857543945, "global_step": 311094, "epoch": 1851} {"train_loss": -12.336183547973633, "global_step": 311095, "epoch": 1851} {"train_loss": -12.052934646606445, "global_step": 311096, "epoch": 1851} {"train_loss": -12.51016616821289, "global_step": 311097, "epoch": 1851} {"train_loss": -11.455020904541016, "global_step": 311098, "epoch": 1851} {"train_loss": -12.192054748535156, "global_step": 311099, "epoch": 1851} {"train_loss": -12.316597938537598, "global_step": 311100, "epoch": 1851} {"train_loss": -12.076684951782227, "global_step": 311101, "epoch": 1851} {"train_loss": -12.231364250183105, "global_step": 311102, "epoch": 1851} {"train_loss": -12.176507949829102, "global_step": 311103, "epoch": 1851} {"train_loss": -11.724536895751953, "global_step": 311104, "epoch": 1851} {"train_loss": -12.326364517211914, "global_step": 311105, "epoch": 1851} {"train_loss": -12.049753189086914, "global_step": 311106, "epoch": 1851} {"train_loss": -11.966533660888672, "global_step": 311107, "epoch": 1851} {"train_loss": -12.494392395019531, "global_step": 311108, "epoch": 1851} {"train_loss": -12.040534019470215, "global_step": 311109, "epoch": 1851} {"train_loss": -12.159761428833008, "global_step": 311110, "epoch": 1851} {"train_loss": -12.071718215942383, "global_step": 311111, "epoch": 1851} {"train_loss": -12.342252731323242, "global_step": 311112, "epoch": 1851} {"train_loss": -12.089679718017578, "global_step": 311113, "epoch": 1851} {"train_loss": -12.25478744506836, "global_step": 311114, "epoch": 1851} {"train_loss": -11.786062240600586, "global_step": 311115, "epoch": 1851} {"train_loss": -12.309562683105469, "global_step": 311116, "epoch": 1851} {"train_loss": -12.306009292602539, "global_step": 311117, "epoch": 1851} {"train_loss": -12.194564819335938, "global_step": 311118, "epoch": 1851} {"train_loss": -11.907137870788574, "global_step": 311119, "epoch": 1851} {"train_loss": -11.941057205200195, "global_step": 311120, "epoch": 1851} {"train_loss": -11.499930381774902, "global_step": 311121, "epoch": 1851} {"train_loss": -11.868146896362305, "global_step": 311122, "epoch": 1851} {"train_loss": -12.220009803771973, "global_step": 311123, "epoch": 1851} {"train_loss": -11.64960765838623, "global_step": 311124, "epoch": 1851} {"train_loss": -12.098487854003906, "global_step": 311125, "epoch": 1851} {"train_loss": -12.126346588134766, "global_step": 311126, "epoch": 1851} {"train_loss": -11.557424545288086, "global_step": 311127, "epoch": 1851} {"train_loss": -11.726829528808594, "global_step": 311128, "epoch": 1851} {"train_loss": -11.884260177612305, "global_step": 311129, "epoch": 1851} {"train_loss": -11.695016860961914, "global_step": 311130, "epoch": 1851} {"train_loss": -11.48598861694336, "global_step": 311131, "epoch": 1851} {"train_loss": -12.170980453491211, "global_step": 311132, "epoch": 1851} {"train_loss": -11.681007385253906, "global_step": 311133, "epoch": 1851} {"train_loss": -11.60920524597168, "global_step": 311134, "epoch": 1851} {"train_loss": -11.79450283731733, "global_step": 311135, "epoch": 1851, "val_loss": 283397.90625} {"train_loss": -11.137887954711914, "global_step": 311136, "epoch": 1852} {"train_loss": -11.955039978027344, "global_step": 311137, "epoch": 1852} {"train_loss": -11.688483238220215, "global_step": 311138, "epoch": 1852} {"train_loss": -12.023887634277344, "global_step": 311139, "epoch": 1852} {"train_loss": -11.799728393554688, "global_step": 311140, "epoch": 1852} {"train_loss": -11.620344161987305, "global_step": 311141, "epoch": 1852} {"train_loss": -11.93072509765625, "global_step": 311142, "epoch": 1852} {"train_loss": -11.621047973632812, "global_step": 311143, "epoch": 1852} {"train_loss": -10.237771987915039, "global_step": 311144, "epoch": 1852} {"train_loss": -11.49399471282959, "global_step": 311145, "epoch": 1852} {"train_loss": -10.673053741455078, "global_step": 311146, "epoch": 1852} {"train_loss": -11.734376907348633, "global_step": 311147, "epoch": 1852} {"train_loss": -10.763940811157227, "global_step": 311148, "epoch": 1852} {"train_loss": -10.639656066894531, "global_step": 311149, "epoch": 1852} {"train_loss": -10.878384590148926, "global_step": 311150, "epoch": 1852} {"train_loss": -10.3499174118042, "global_step": 311151, "epoch": 1852} {"train_loss": -10.835573196411133, "global_step": 311152, "epoch": 1852} {"train_loss": -10.224344253540039, "global_step": 311153, "epoch": 1852} {"train_loss": -10.842092514038086, "global_step": 311154, "epoch": 1852} {"train_loss": -9.692659378051758, "global_step": 311155, "epoch": 1852} {"train_loss": -9.999061584472656, "global_step": 311156, "epoch": 1852} {"train_loss": -10.5256929397583, "global_step": 311157, "epoch": 1852} {"train_loss": -10.52740478515625, "global_step": 311158, "epoch": 1852} {"train_loss": -10.609848022460938, "global_step": 311159, "epoch": 1852} {"train_loss": -10.316848754882812, "global_step": 311160, "epoch": 1852} {"train_loss": -10.105308532714844, "global_step": 311161, "epoch": 1852} {"train_loss": -11.553079605102539, "global_step": 311162, "epoch": 1852} {"train_loss": -9.69485855102539, "global_step": 311163, "epoch": 1852} {"train_loss": -10.667094230651855, "global_step": 311164, "epoch": 1852} {"train_loss": -10.403929710388184, "global_step": 311165, "epoch": 1852} {"train_loss": -10.062297821044922, "global_step": 311166, "epoch": 1852} {"train_loss": -10.527472496032715, "global_step": 311167, "epoch": 1852} {"train_loss": -9.679766654968262, "global_step": 311168, "epoch": 1852} {"train_loss": -10.10771369934082, "global_step": 311169, "epoch": 1852} {"train_loss": -9.70559310913086, "global_step": 311170, "epoch": 1852} {"train_loss": -9.350992202758789, "global_step": 311171, "epoch": 1852} {"train_loss": -10.530902862548828, "global_step": 311172, "epoch": 1852} {"train_loss": -10.1055908203125, "global_step": 311173, "epoch": 1852} {"train_loss": -10.114889144897461, "global_step": 311174, "epoch": 1852} {"train_loss": -11.027708053588867, "global_step": 311175, "epoch": 1852} {"train_loss": -10.72791576385498, "global_step": 311176, "epoch": 1852} {"train_loss": -11.354475021362305, "global_step": 311177, "epoch": 1852} {"train_loss": -11.219996452331543, "global_step": 311178, "epoch": 1852} {"train_loss": -10.68614387512207, "global_step": 311179, "epoch": 1852} {"train_loss": -11.687320709228516, "global_step": 311180, "epoch": 1852} {"train_loss": -10.691484451293945, "global_step": 311181, "epoch": 1852} {"train_loss": -11.675140380859375, "global_step": 311182, "epoch": 1852} {"train_loss": -11.036380767822266, "global_step": 311183, "epoch": 1852} {"train_loss": -11.52094554901123, "global_step": 311184, "epoch": 1852} {"train_loss": -11.27455997467041, "global_step": 311185, "epoch": 1852} {"train_loss": -11.11872673034668, "global_step": 311186, "epoch": 1852} {"train_loss": -11.92921257019043, "global_step": 311187, "epoch": 1852} {"train_loss": -11.457111358642578, "global_step": 311188, "epoch": 1852} {"train_loss": -11.255285263061523, "global_step": 311189, "epoch": 1852} {"train_loss": -11.802940368652344, "global_step": 311190, "epoch": 1852} {"train_loss": -11.11589241027832, "global_step": 311191, "epoch": 1852} {"train_loss": -11.654153823852539, "global_step": 311192, "epoch": 1852} {"train_loss": -11.468023300170898, "global_step": 311193, "epoch": 1852} {"train_loss": -11.731578826904297, "global_step": 311194, "epoch": 1852} {"train_loss": -11.723965644836426, "global_step": 311195, "epoch": 1852} {"train_loss": -11.39352035522461, "global_step": 311196, "epoch": 1852} {"train_loss": -11.503772735595703, "global_step": 311197, "epoch": 1852} {"train_loss": -11.67365837097168, "global_step": 311198, "epoch": 1852} {"train_loss": -11.58840560913086, "global_step": 311199, "epoch": 1852} {"train_loss": -11.90119743347168, "global_step": 311200, "epoch": 1852} {"train_loss": -11.539809226989746, "global_step": 311201, "epoch": 1852} {"train_loss": -12.005135536193848, "global_step": 311202, "epoch": 1852} {"train_loss": -11.856056213378906, "global_step": 311203, "epoch": 1852} {"train_loss": -11.79573917388916, "global_step": 311204, "epoch": 1852} {"train_loss": -11.95276927947998, "global_step": 311205, "epoch": 1852} {"train_loss": -11.938112258911133, "global_step": 311206, "epoch": 1852} {"train_loss": -12.016475677490234, "global_step": 311207, "epoch": 1852} {"train_loss": -12.057913780212402, "global_step": 311208, "epoch": 1852} {"train_loss": -11.995745658874512, "global_step": 311209, "epoch": 1852} {"train_loss": -12.202412605285645, "global_step": 311210, "epoch": 1852} {"train_loss": -12.164234161376953, "global_step": 311211, "epoch": 1852} {"train_loss": -12.02411937713623, "global_step": 311212, "epoch": 1852} {"train_loss": -12.0023193359375, "global_step": 311213, "epoch": 1852} {"train_loss": -12.03804874420166, "global_step": 311214, "epoch": 1852} {"train_loss": -11.999127388000488, "global_step": 311215, "epoch": 1852} {"train_loss": -12.1641263961792, "global_step": 311216, "epoch": 1852} {"train_loss": -12.196182250976562, "global_step": 311217, "epoch": 1852} {"train_loss": -12.01700210571289, "global_step": 311218, "epoch": 1852} {"train_loss": -12.117879867553711, "global_step": 311219, "epoch": 1852} {"train_loss": -12.045766830444336, "global_step": 311220, "epoch": 1852} {"train_loss": -12.22559928894043, "global_step": 311221, "epoch": 1852} {"train_loss": -12.225255012512207, "global_step": 311222, "epoch": 1852} {"train_loss": -12.216215133666992, "global_step": 311223, "epoch": 1852} {"train_loss": -12.26674747467041, "global_step": 311224, "epoch": 1852} {"train_loss": -11.878219604492188, "global_step": 311225, "epoch": 1852} {"train_loss": -12.251810073852539, "global_step": 311226, "epoch": 1852} {"train_loss": -12.368461608886719, "global_step": 311227, "epoch": 1852} {"train_loss": -12.154104232788086, "global_step": 311228, "epoch": 1852} {"train_loss": -12.272903442382812, "global_step": 311229, "epoch": 1852} {"train_loss": -11.934333801269531, "global_step": 311230, "epoch": 1852} {"train_loss": -12.315848350524902, "global_step": 311231, "epoch": 1852} {"train_loss": -12.096123695373535, "global_step": 311232, "epoch": 1852} {"train_loss": -12.126382827758789, "global_step": 311233, "epoch": 1852} {"train_loss": -11.907866477966309, "global_step": 311234, "epoch": 1852} {"train_loss": -12.017069816589355, "global_step": 311235, "epoch": 1852} {"train_loss": -12.26704216003418, "global_step": 311236, "epoch": 1852} {"train_loss": -12.201427459716797, "global_step": 311237, "epoch": 1852} {"train_loss": -12.209857940673828, "global_step": 311238, "epoch": 1852} {"train_loss": -12.053512573242188, "global_step": 311239, "epoch": 1852} {"train_loss": -12.329060554504395, "global_step": 311240, "epoch": 1852} {"train_loss": -12.332318305969238, "global_step": 311241, "epoch": 1852} {"train_loss": -12.284485816955566, "global_step": 311242, "epoch": 1852} {"train_loss": -12.29045581817627, "global_step": 311243, "epoch": 1852} {"train_loss": -12.322216033935547, "global_step": 311244, "epoch": 1852} {"train_loss": -12.357799530029297, "global_step": 311245, "epoch": 1852} {"train_loss": -12.33361530303955, "global_step": 311246, "epoch": 1852} {"train_loss": -12.018013000488281, "global_step": 311247, "epoch": 1852} {"train_loss": -12.379987716674805, "global_step": 311248, "epoch": 1852} {"train_loss": -12.345407485961914, "global_step": 311249, "epoch": 1852} {"train_loss": -12.51882553100586, "global_step": 311250, "epoch": 1852} {"train_loss": -12.403373718261719, "global_step": 311251, "epoch": 1852} {"train_loss": -12.19881820678711, "global_step": 311252, "epoch": 1852} {"train_loss": -12.461591720581055, "global_step": 311253, "epoch": 1852} {"train_loss": -12.152751922607422, "global_step": 311254, "epoch": 1852} {"train_loss": -12.449651718139648, "global_step": 311255, "epoch": 1852} {"train_loss": -12.262990951538086, "global_step": 311256, "epoch": 1852} {"train_loss": -12.298785209655762, "global_step": 311257, "epoch": 1852} {"train_loss": -12.557687759399414, "global_step": 311258, "epoch": 1852} {"train_loss": -12.394672393798828, "global_step": 311259, "epoch": 1852} {"train_loss": -12.391239166259766, "global_step": 311260, "epoch": 1852} {"train_loss": -12.405641555786133, "global_step": 311261, "epoch": 1852} {"train_loss": -12.376376152038574, "global_step": 311262, "epoch": 1852} {"train_loss": -12.266304016113281, "global_step": 311263, "epoch": 1852} {"train_loss": -12.366320610046387, "global_step": 311264, "epoch": 1852} {"train_loss": -12.402759552001953, "global_step": 311265, "epoch": 1852} {"train_loss": -12.405305862426758, "global_step": 311266, "epoch": 1852} {"train_loss": -12.449644088745117, "global_step": 311267, "epoch": 1852} {"train_loss": -12.561859130859375, "global_step": 311268, "epoch": 1852} {"train_loss": -12.491846084594727, "global_step": 311269, "epoch": 1852} {"train_loss": -12.485037803649902, "global_step": 311270, "epoch": 1852} {"train_loss": -12.333297729492188, "global_step": 311271, "epoch": 1852} {"train_loss": -12.530757904052734, "global_step": 311272, "epoch": 1852} {"train_loss": -12.58206558227539, "global_step": 311273, "epoch": 1852} {"train_loss": -12.623861312866211, "global_step": 311274, "epoch": 1852} {"train_loss": -12.622293472290039, "global_step": 311275, "epoch": 1852} {"train_loss": -12.662395477294922, "global_step": 311276, "epoch": 1852} {"train_loss": -12.619856834411621, "global_step": 311277, "epoch": 1852} {"train_loss": -12.678836822509766, "global_step": 311278, "epoch": 1852} {"train_loss": -12.560861587524414, "global_step": 311279, "epoch": 1852} {"train_loss": -12.639904975891113, "global_step": 311280, "epoch": 1852} {"train_loss": -12.528142929077148, "global_step": 311281, "epoch": 1852} {"train_loss": -12.586225509643555, "global_step": 311282, "epoch": 1852} {"train_loss": -12.824857711791992, "global_step": 311283, "epoch": 1852} {"train_loss": -12.740492820739746, "global_step": 311284, "epoch": 1852} {"train_loss": -12.421478271484375, "global_step": 311285, "epoch": 1852} {"train_loss": -12.40652084350586, "global_step": 311286, "epoch": 1852} {"train_loss": -12.698397636413574, "global_step": 311287, "epoch": 1852} {"train_loss": -12.630830764770508, "global_step": 311288, "epoch": 1852} {"train_loss": -12.489068031311035, "global_step": 311289, "epoch": 1852} {"train_loss": -11.827975273132324, "global_step": 311290, "epoch": 1852} {"train_loss": -11.82286262512207, "global_step": 311291, "epoch": 1852} {"train_loss": -11.263199806213379, "global_step": 311292, "epoch": 1852} {"train_loss": -12.651895523071289, "global_step": 311293, "epoch": 1852} {"train_loss": -10.650967597961426, "global_step": 311294, "epoch": 1852} {"train_loss": -11.544954299926758, "global_step": 311295, "epoch": 1852} {"train_loss": -11.847092628479004, "global_step": 311296, "epoch": 1852} {"train_loss": -11.032075881958008, "global_step": 311297, "epoch": 1852} {"train_loss": -10.852920532226562, "global_step": 311298, "epoch": 1852} {"train_loss": -9.920273780822754, "global_step": 311299, "epoch": 1852} {"train_loss": -11.803970336914062, "global_step": 311300, "epoch": 1852} {"train_loss": -12.014816284179688, "global_step": 311301, "epoch": 1852} {"train_loss": -10.675747871398926, "global_step": 311302, "epoch": 1852} {"train_loss": -11.70055475689116, "global_step": 311303, "epoch": 1852, "val_loss": 286252.6875} {"train_loss": -11.04892635345459, "global_step": 311304, "epoch": 1853} {"train_loss": -11.841470718383789, "global_step": 311305, "epoch": 1853} {"train_loss": -11.590234756469727, "global_step": 311306, "epoch": 1853} {"train_loss": -11.603551864624023, "global_step": 311307, "epoch": 1853} {"train_loss": -11.478713035583496, "global_step": 311308, "epoch": 1853} {"train_loss": -10.705333709716797, "global_step": 311309, "epoch": 1853} {"train_loss": -10.429287910461426, "global_step": 311310, "epoch": 1853} {"train_loss": -11.555394172668457, "global_step": 311311, "epoch": 1853} {"train_loss": -10.27669906616211, "global_step": 311312, "epoch": 1853} {"train_loss": -11.381952285766602, "global_step": 311313, "epoch": 1853} {"train_loss": -11.408411026000977, "global_step": 311314, "epoch": 1853} {"train_loss": -10.842059135437012, "global_step": 311315, "epoch": 1853} {"train_loss": -11.207171440124512, "global_step": 311316, "epoch": 1853} {"train_loss": -11.175707817077637, "global_step": 311317, "epoch": 1853} {"train_loss": -11.4175443649292, "global_step": 311318, "epoch": 1853} {"train_loss": -10.670766830444336, "global_step": 311319, "epoch": 1853} {"train_loss": -11.706622123718262, "global_step": 311320, "epoch": 1853} {"train_loss": -11.427865028381348, "global_step": 311321, "epoch": 1853} {"train_loss": -11.55201530456543, "global_step": 311322, "epoch": 1853} {"train_loss": -11.343337059020996, "global_step": 311323, "epoch": 1853} {"train_loss": -11.624288558959961, "global_step": 311324, "epoch": 1853} {"train_loss": -11.250797271728516, "global_step": 311325, "epoch": 1853} {"train_loss": -11.61376667022705, "global_step": 311326, "epoch": 1853} {"train_loss": -10.851137161254883, "global_step": 311327, "epoch": 1853} {"train_loss": -11.227226257324219, "global_step": 311328, "epoch": 1853} {"train_loss": -11.670307159423828, "global_step": 311329, "epoch": 1853} {"train_loss": -10.518826484680176, "global_step": 311330, "epoch": 1853} {"train_loss": -11.621367454528809, "global_step": 311331, "epoch": 1853} {"train_loss": -10.876477241516113, "global_step": 311332, "epoch": 1853} {"train_loss": -11.859893798828125, "global_step": 311333, "epoch": 1853} {"train_loss": -10.834080696105957, "global_step": 311334, "epoch": 1853} {"train_loss": -11.68127155303955, "global_step": 311335, "epoch": 1853} {"train_loss": -11.305290222167969, "global_step": 311336, "epoch": 1853} {"train_loss": -11.810401916503906, "global_step": 311337, "epoch": 1853} {"train_loss": -11.71422290802002, "global_step": 311338, "epoch": 1853} {"train_loss": -11.403778076171875, "global_step": 311339, "epoch": 1853} {"train_loss": -12.00561237335205, "global_step": 311340, "epoch": 1853} {"train_loss": -10.979070663452148, "global_step": 311341, "epoch": 1853} {"train_loss": -11.91601848602295, "global_step": 311342, "epoch": 1853} {"train_loss": -11.445917129516602, "global_step": 311343, "epoch": 1853} {"train_loss": -11.685005187988281, "global_step": 311344, "epoch": 1853} {"train_loss": -11.370150566101074, "global_step": 311345, "epoch": 1853} {"train_loss": -11.813709259033203, "global_step": 311346, "epoch": 1853} {"train_loss": -11.603160858154297, "global_step": 311347, "epoch": 1853} {"train_loss": -11.642183303833008, "global_step": 311348, "epoch": 1853} {"train_loss": -11.749663352966309, "global_step": 311349, "epoch": 1853} {"train_loss": -11.458953857421875, "global_step": 311350, "epoch": 1853} {"train_loss": -11.940919876098633, "global_step": 311351, "epoch": 1853} {"train_loss": -11.558062553405762, "global_step": 311352, "epoch": 1853} {"train_loss": -11.640758514404297, "global_step": 311353, "epoch": 1853} {"train_loss": -11.499797821044922, "global_step": 311354, "epoch": 1853} {"train_loss": -11.706087112426758, "global_step": 311355, "epoch": 1853} {"train_loss": -11.738140106201172, "global_step": 311356, "epoch": 1853} {"train_loss": -11.65744400024414, "global_step": 311357, "epoch": 1853} {"train_loss": -11.916478157043457, "global_step": 311358, "epoch": 1853} {"train_loss": -11.256292343139648, "global_step": 311359, "epoch": 1853} {"train_loss": -11.890192031860352, "global_step": 311360, "epoch": 1853} {"train_loss": -11.590810775756836, "global_step": 311361, "epoch": 1853} {"train_loss": -11.817411422729492, "global_step": 311362, "epoch": 1853} {"train_loss": -11.349445343017578, "global_step": 311363, "epoch": 1853} {"train_loss": -11.981077194213867, "global_step": 311364, "epoch": 1853} {"train_loss": -11.080755233764648, "global_step": 311365, "epoch": 1853} {"train_loss": -11.459498405456543, "global_step": 311366, "epoch": 1853} {"train_loss": -11.015848159790039, "global_step": 311367, "epoch": 1853} {"train_loss": -10.960336685180664, "global_step": 311368, "epoch": 1853} {"train_loss": -12.07314682006836, "global_step": 311369, "epoch": 1853} {"train_loss": -11.187541961669922, "global_step": 311370, "epoch": 1853} {"train_loss": -11.792762756347656, "global_step": 311371, "epoch": 1853} {"train_loss": -11.438488960266113, "global_step": 311372, "epoch": 1853} {"train_loss": -11.740790367126465, "global_step": 311373, "epoch": 1853} {"train_loss": -11.679916381835938, "global_step": 311374, "epoch": 1853} {"train_loss": -11.559267044067383, "global_step": 311375, "epoch": 1853} {"train_loss": -11.293745040893555, "global_step": 311376, "epoch": 1853} {"train_loss": -11.9862060546875, "global_step": 311377, "epoch": 1853} {"train_loss": -11.776334762573242, "global_step": 311378, "epoch": 1853} {"train_loss": -11.85653305053711, "global_step": 311379, "epoch": 1853} {"train_loss": -11.723508834838867, "global_step": 311380, "epoch": 1853} {"train_loss": -10.964746475219727, "global_step": 311381, "epoch": 1853} {"train_loss": -11.597921371459961, "global_step": 311382, "epoch": 1853} {"train_loss": -11.052578926086426, "global_step": 311383, "epoch": 1853} {"train_loss": -11.207481384277344, "global_step": 311384, "epoch": 1853} {"train_loss": -11.4271240234375, "global_step": 311385, "epoch": 1853} {"train_loss": -11.24557876586914, "global_step": 311386, "epoch": 1853} {"train_loss": -11.496236801147461, "global_step": 311387, "epoch": 1853} {"train_loss": -11.422282218933105, "global_step": 311388, "epoch": 1853} {"train_loss": -11.534826278686523, "global_step": 311389, "epoch": 1853} {"train_loss": -11.620319366455078, "global_step": 311390, "epoch": 1853} {"train_loss": -11.514602661132812, "global_step": 311391, "epoch": 1853} {"train_loss": -11.345172882080078, "global_step": 311392, "epoch": 1853} {"train_loss": -11.96608829498291, "global_step": 311393, "epoch": 1853} {"train_loss": -11.150362014770508, "global_step": 311394, "epoch": 1853} {"train_loss": -12.225604057312012, "global_step": 311395, "epoch": 1853} {"train_loss": -11.438636779785156, "global_step": 311396, "epoch": 1853} {"train_loss": -11.794642448425293, "global_step": 311397, "epoch": 1853} {"train_loss": -12.050760269165039, "global_step": 311398, "epoch": 1853} {"train_loss": -11.720821380615234, "global_step": 311399, "epoch": 1853} {"train_loss": -12.202733993530273, "global_step": 311400, "epoch": 1853} {"train_loss": -11.794815063476562, "global_step": 311401, "epoch": 1853} {"train_loss": -12.163002014160156, "global_step": 311402, "epoch": 1853} {"train_loss": -11.830028533935547, "global_step": 311403, "epoch": 1853} {"train_loss": -11.898947715759277, "global_step": 311404, "epoch": 1853} {"train_loss": -12.003665924072266, "global_step": 311405, "epoch": 1853} {"train_loss": -12.133570671081543, "global_step": 311406, "epoch": 1853} {"train_loss": -11.553165435791016, "global_step": 311407, "epoch": 1853} {"train_loss": -12.08485221862793, "global_step": 311408, "epoch": 1853} {"train_loss": -11.71745777130127, "global_step": 311409, "epoch": 1853} {"train_loss": -12.085948944091797, "global_step": 311410, "epoch": 1853} {"train_loss": -11.968436241149902, "global_step": 311411, "epoch": 1853} {"train_loss": -11.865937232971191, "global_step": 311412, "epoch": 1853} {"train_loss": -12.30061149597168, "global_step": 311413, "epoch": 1853} {"train_loss": -11.863798141479492, "global_step": 311414, "epoch": 1853} {"train_loss": -12.265373229980469, "global_step": 311415, "epoch": 1853} {"train_loss": -11.839832305908203, "global_step": 311416, "epoch": 1853} {"train_loss": -12.129454612731934, "global_step": 311417, "epoch": 1853} {"train_loss": -12.081466674804688, "global_step": 311418, "epoch": 1853} {"train_loss": -12.029699325561523, "global_step": 311419, "epoch": 1853} {"train_loss": -12.188383102416992, "global_step": 311420, "epoch": 1853} {"train_loss": -12.16618537902832, "global_step": 311421, "epoch": 1853} {"train_loss": -12.297466278076172, "global_step": 311422, "epoch": 1853} {"train_loss": -12.280866622924805, "global_step": 311423, "epoch": 1853} {"train_loss": -12.261804580688477, "global_step": 311424, "epoch": 1853} {"train_loss": -12.243943214416504, "global_step": 311425, "epoch": 1853} {"train_loss": -12.261716842651367, "global_step": 311426, "epoch": 1853} {"train_loss": -12.324399948120117, "global_step": 311427, "epoch": 1853} {"train_loss": -12.20943832397461, "global_step": 311428, "epoch": 1853} {"train_loss": -12.359844207763672, "global_step": 311429, "epoch": 1853} {"train_loss": -12.183987617492676, "global_step": 311430, "epoch": 1853} {"train_loss": -12.403656005859375, "global_step": 311431, "epoch": 1853} {"train_loss": -12.395120620727539, "global_step": 311432, "epoch": 1853} {"train_loss": -12.471084594726562, "global_step": 311433, "epoch": 1853} {"train_loss": -12.4711332321167, "global_step": 311434, "epoch": 1853} {"train_loss": -12.402448654174805, "global_step": 311435, "epoch": 1853} {"train_loss": -12.532596588134766, "global_step": 311436, "epoch": 1853} {"train_loss": -12.66411304473877, "global_step": 311437, "epoch": 1853} {"train_loss": -12.555170059204102, "global_step": 311438, "epoch": 1853} {"train_loss": -12.392587661743164, "global_step": 311439, "epoch": 1853} {"train_loss": -12.583610534667969, "global_step": 311440, "epoch": 1853} {"train_loss": -12.561376571655273, "global_step": 311441, "epoch": 1853} {"train_loss": -12.52255630493164, "global_step": 311442, "epoch": 1853} {"train_loss": -12.369640350341797, "global_step": 311443, "epoch": 1853} {"train_loss": -12.591306686401367, "global_step": 311444, "epoch": 1853} {"train_loss": -12.576319694519043, "global_step": 311445, "epoch": 1853} {"train_loss": -12.393552780151367, "global_step": 311446, "epoch": 1853} {"train_loss": -12.350769996643066, "global_step": 311447, "epoch": 1853} {"train_loss": -12.490629196166992, "global_step": 311448, "epoch": 1853} {"train_loss": -12.366653442382812, "global_step": 311449, "epoch": 1853} {"train_loss": -12.269535064697266, "global_step": 311450, "epoch": 1853} {"train_loss": -12.575014114379883, "global_step": 311451, "epoch": 1853} {"train_loss": -12.613091468811035, "global_step": 311452, "epoch": 1853} {"train_loss": -12.217657089233398, "global_step": 311453, "epoch": 1853} {"train_loss": -12.217490196228027, "global_step": 311454, "epoch": 1853} {"train_loss": -12.52528190612793, "global_step": 311455, "epoch": 1853} {"train_loss": -12.373900413513184, "global_step": 311456, "epoch": 1853} {"train_loss": -12.331280708312988, "global_step": 311457, "epoch": 1853} {"train_loss": -12.129501342773438, "global_step": 311458, "epoch": 1853} {"train_loss": -12.58901596069336, "global_step": 311459, "epoch": 1853} {"train_loss": -12.565275192260742, "global_step": 311460, "epoch": 1853} {"train_loss": -12.582530975341797, "global_step": 311461, "epoch": 1853} {"train_loss": -12.535501480102539, "global_step": 311462, "epoch": 1853} {"train_loss": -12.669918060302734, "global_step": 311463, "epoch": 1853} {"train_loss": -12.437748908996582, "global_step": 311464, "epoch": 1853} {"train_loss": -12.478231430053711, "global_step": 311465, "epoch": 1853} {"train_loss": -12.430488586425781, "global_step": 311466, "epoch": 1853} {"train_loss": -12.628486633300781, "global_step": 311467, "epoch": 1853} {"train_loss": -12.447532653808594, "global_step": 311468, "epoch": 1853} {"train_loss": -12.296918869018555, "global_step": 311469, "epoch": 1853} {"train_loss": -12.68737506866455, "global_step": 311470, "epoch": 1853} {"train_loss": -11.825352067039127, "global_step": 311471, "epoch": 1853, "val_loss": 284574.78125} {"train_loss": -12.303878784179688, "global_step": 311472, "epoch": 1854} {"train_loss": -12.01543140411377, "global_step": 311473, "epoch": 1854} {"train_loss": -12.27578353881836, "global_step": 311474, "epoch": 1854} {"train_loss": -11.751548767089844, "global_step": 311475, "epoch": 1854} {"train_loss": -12.083616256713867, "global_step": 311476, "epoch": 1854} {"train_loss": -11.20070743560791, "global_step": 311477, "epoch": 1854} {"train_loss": -11.204898834228516, "global_step": 311478, "epoch": 1854} {"train_loss": -11.444387435913086, "global_step": 311479, "epoch": 1854} {"train_loss": -11.825716972351074, "global_step": 311480, "epoch": 1854} {"train_loss": -12.425304412841797, "global_step": 311481, "epoch": 1854} {"train_loss": -11.608024597167969, "global_step": 311482, "epoch": 1854} {"train_loss": -11.761114120483398, "global_step": 311483, "epoch": 1854} {"train_loss": -10.989587783813477, "global_step": 311484, "epoch": 1854} {"train_loss": -11.758543014526367, "global_step": 311485, "epoch": 1854} {"train_loss": -11.766117095947266, "global_step": 311486, "epoch": 1854} {"train_loss": -11.991259574890137, "global_step": 311487, "epoch": 1854} {"train_loss": -11.541790008544922, "global_step": 311488, "epoch": 1854} {"train_loss": -12.204526901245117, "global_step": 311489, "epoch": 1854} {"train_loss": -11.96931266784668, "global_step": 311490, "epoch": 1854} {"train_loss": -12.14012336730957, "global_step": 311491, "epoch": 1854} {"train_loss": -11.673215866088867, "global_step": 311492, "epoch": 1854} {"train_loss": -11.98130989074707, "global_step": 311493, "epoch": 1854} {"train_loss": -12.198433876037598, "global_step": 311494, "epoch": 1854} {"train_loss": -12.063575744628906, "global_step": 311495, "epoch": 1854} {"train_loss": -12.292745590209961, "global_step": 311496, "epoch": 1854} {"train_loss": -11.422351837158203, "global_step": 311497, "epoch": 1854} {"train_loss": -11.298752784729004, "global_step": 311498, "epoch": 1854} {"train_loss": -11.79897689819336, "global_step": 311499, "epoch": 1854} {"train_loss": -8.914546966552734, "global_step": 311500, "epoch": 1854} {"train_loss": -9.507301330566406, "global_step": 311501, "epoch": 1854} {"train_loss": -10.023467063903809, "global_step": 311502, "epoch": 1854} {"train_loss": -9.54974365234375, "global_step": 311503, "epoch": 1854} {"train_loss": -8.547433853149414, "global_step": 311504, "epoch": 1854} {"train_loss": -8.695131301879883, "global_step": 311505, "epoch": 1854} {"train_loss": -10.482536315917969, "global_step": 311506, "epoch": 1854} {"train_loss": -10.212356567382812, "global_step": 311507, "epoch": 1854} {"train_loss": -9.272772789001465, "global_step": 311508, "epoch": 1854} {"train_loss": -8.278404235839844, "global_step": 311509, "epoch": 1854} {"train_loss": -10.760501861572266, "global_step": 311510, "epoch": 1854} {"train_loss": -10.058804512023926, "global_step": 311511, "epoch": 1854} {"train_loss": -11.51959228515625, "global_step": 311512, "epoch": 1854} {"train_loss": -10.491714477539062, "global_step": 311513, "epoch": 1854} {"train_loss": -11.526262283325195, "global_step": 311514, "epoch": 1854} {"train_loss": -10.730854034423828, "global_step": 311515, "epoch": 1854} {"train_loss": -11.665163040161133, "global_step": 311516, "epoch": 1854} {"train_loss": -10.924517631530762, "global_step": 311517, "epoch": 1854} {"train_loss": -11.093165397644043, "global_step": 311518, "epoch": 1854} {"train_loss": -11.461173057556152, "global_step": 311519, "epoch": 1854} {"train_loss": -11.113130569458008, "global_step": 311520, "epoch": 1854} {"train_loss": -11.932514190673828, "global_step": 311521, "epoch": 1854} {"train_loss": -11.418563842773438, "global_step": 311522, "epoch": 1854} {"train_loss": -12.034175872802734, "global_step": 311523, "epoch": 1854} {"train_loss": -11.647613525390625, "global_step": 311524, "epoch": 1854} {"train_loss": -12.074677467346191, "global_step": 311525, "epoch": 1854} {"train_loss": -11.831963539123535, "global_step": 311526, "epoch": 1854} {"train_loss": -12.037843704223633, "global_step": 311527, "epoch": 1854} {"train_loss": -11.837976455688477, "global_step": 311528, "epoch": 1854} {"train_loss": -12.046710968017578, "global_step": 311529, "epoch": 1854} {"train_loss": -12.091752052307129, "global_step": 311530, "epoch": 1854} {"train_loss": -12.02726936340332, "global_step": 311531, "epoch": 1854} {"train_loss": -12.091026306152344, "global_step": 311532, "epoch": 1854} {"train_loss": -11.91139030456543, "global_step": 311533, "epoch": 1854} {"train_loss": -12.164898872375488, "global_step": 311534, "epoch": 1854} {"train_loss": -12.307708740234375, "global_step": 311535, "epoch": 1854} {"train_loss": -12.128803253173828, "global_step": 311536, "epoch": 1854} {"train_loss": -11.656397819519043, "global_step": 311537, "epoch": 1854} {"train_loss": -12.192001342773438, "global_step": 311538, "epoch": 1854} {"train_loss": -11.725500106811523, "global_step": 311539, "epoch": 1854} {"train_loss": -11.858011245727539, "global_step": 311540, "epoch": 1854} {"train_loss": -11.951973915100098, "global_step": 311541, "epoch": 1854} {"train_loss": -11.656623840332031, "global_step": 311542, "epoch": 1854} {"train_loss": -12.066031455993652, "global_step": 311543, "epoch": 1854} {"train_loss": -11.676948547363281, "global_step": 311544, "epoch": 1854} {"train_loss": -11.913518905639648, "global_step": 311545, "epoch": 1854} {"train_loss": -11.860300064086914, "global_step": 311546, "epoch": 1854} {"train_loss": -11.942239761352539, "global_step": 311547, "epoch": 1854} {"train_loss": -12.01625919342041, "global_step": 311548, "epoch": 1854} {"train_loss": -12.013659477233887, "global_step": 311549, "epoch": 1854} {"train_loss": -12.277606964111328, "global_step": 311550, "epoch": 1854} {"train_loss": -11.766151428222656, "global_step": 311551, "epoch": 1854} {"train_loss": -12.293442726135254, "global_step": 311552, "epoch": 1854} {"train_loss": -11.944619178771973, "global_step": 311553, "epoch": 1854} {"train_loss": -12.435185432434082, "global_step": 311554, "epoch": 1854} {"train_loss": -11.932808876037598, "global_step": 311555, "epoch": 1854} {"train_loss": -12.292545318603516, "global_step": 311556, "epoch": 1854} {"train_loss": -11.986038208007812, "global_step": 311557, "epoch": 1854} {"train_loss": -12.157755851745605, "global_step": 311558, "epoch": 1854} {"train_loss": -12.48204231262207, "global_step": 311559, "epoch": 1854} {"train_loss": -12.139439582824707, "global_step": 311560, "epoch": 1854} {"train_loss": -12.217777252197266, "global_step": 311561, "epoch": 1854} {"train_loss": -12.17473030090332, "global_step": 311562, "epoch": 1854} {"train_loss": -12.34371280670166, "global_step": 311563, "epoch": 1854} {"train_loss": -12.086278915405273, "global_step": 311564, "epoch": 1854} {"train_loss": -12.11688232421875, "global_step": 311565, "epoch": 1854} {"train_loss": -12.187932968139648, "global_step": 311566, "epoch": 1854} {"train_loss": -12.138654708862305, "global_step": 311567, "epoch": 1854} {"train_loss": -11.98996353149414, "global_step": 311568, "epoch": 1854} {"train_loss": -12.160066604614258, "global_step": 311569, "epoch": 1854} {"train_loss": -12.287283897399902, "global_step": 311570, "epoch": 1854} {"train_loss": -11.999736785888672, "global_step": 311571, "epoch": 1854} {"train_loss": -12.251585960388184, "global_step": 311572, "epoch": 1854} {"train_loss": -12.042476654052734, "global_step": 311573, "epoch": 1854} {"train_loss": -11.905939102172852, "global_step": 311574, "epoch": 1854} {"train_loss": -12.256096839904785, "global_step": 311575, "epoch": 1854} {"train_loss": -11.629154205322266, "global_step": 311576, "epoch": 1854} {"train_loss": -12.46231746673584, "global_step": 311577, "epoch": 1854} {"train_loss": -12.313074111938477, "global_step": 311578, "epoch": 1854} {"train_loss": -12.622136116027832, "global_step": 311579, "epoch": 1854} {"train_loss": -12.213464736938477, "global_step": 311580, "epoch": 1854} {"train_loss": -12.354339599609375, "global_step": 311581, "epoch": 1854} {"train_loss": -12.293710708618164, "global_step": 311582, "epoch": 1854} {"train_loss": -12.496862411499023, "global_step": 311583, "epoch": 1854} {"train_loss": -12.355611801147461, "global_step": 311584, "epoch": 1854} {"train_loss": -12.386823654174805, "global_step": 311585, "epoch": 1854} {"train_loss": -12.472606658935547, "global_step": 311586, "epoch": 1854} {"train_loss": -12.272082328796387, "global_step": 311587, "epoch": 1854} {"train_loss": -12.307516098022461, "global_step": 311588, "epoch": 1854} {"train_loss": -12.071077346801758, "global_step": 311589, "epoch": 1854} {"train_loss": -12.080509185791016, "global_step": 311590, "epoch": 1854} {"train_loss": -12.302919387817383, "global_step": 311591, "epoch": 1854} {"train_loss": -12.184369087219238, "global_step": 311592, "epoch": 1854} {"train_loss": -12.256747245788574, "global_step": 311593, "epoch": 1854} {"train_loss": -12.38541030883789, "global_step": 311594, "epoch": 1854} {"train_loss": -12.340879440307617, "global_step": 311595, "epoch": 1854} {"train_loss": -12.490859985351562, "global_step": 311596, "epoch": 1854} {"train_loss": -12.368379592895508, "global_step": 311597, "epoch": 1854} {"train_loss": -12.318500518798828, "global_step": 311598, "epoch": 1854} {"train_loss": -12.031599044799805, "global_step": 311599, "epoch": 1854} {"train_loss": -11.717569351196289, "global_step": 311600, "epoch": 1854} {"train_loss": -11.990641593933105, "global_step": 311601, "epoch": 1854} {"train_loss": -12.213199615478516, "global_step": 311602, "epoch": 1854} {"train_loss": -12.230724334716797, "global_step": 311603, "epoch": 1854} {"train_loss": -11.690552711486816, "global_step": 311604, "epoch": 1854} {"train_loss": -11.196788787841797, "global_step": 311605, "epoch": 1854} {"train_loss": -11.14240550994873, "global_step": 311606, "epoch": 1854} {"train_loss": -12.006582260131836, "global_step": 311607, "epoch": 1854} {"train_loss": -12.00088119506836, "global_step": 311608, "epoch": 1854} {"train_loss": -10.56877326965332, "global_step": 311609, "epoch": 1854} {"train_loss": -11.728900909423828, "global_step": 311610, "epoch": 1854} {"train_loss": -12.121173858642578, "global_step": 311611, "epoch": 1854} {"train_loss": -10.662374496459961, "global_step": 311612, "epoch": 1854} {"train_loss": -10.136054992675781, "global_step": 311613, "epoch": 1854} {"train_loss": -12.152074813842773, "global_step": 311614, "epoch": 1854} {"train_loss": -11.268831253051758, "global_step": 311615, "epoch": 1854} {"train_loss": -9.729331016540527, "global_step": 311616, "epoch": 1854} {"train_loss": -11.140758514404297, "global_step": 311617, "epoch": 1854} {"train_loss": -10.87968921661377, "global_step": 311618, "epoch": 1854} {"train_loss": -9.58414077758789, "global_step": 311619, "epoch": 1854} {"train_loss": -11.592037200927734, "global_step": 311620, "epoch": 1854} {"train_loss": -9.168930053710938, "global_step": 311621, "epoch": 1854} {"train_loss": -10.532856941223145, "global_step": 311622, "epoch": 1854} {"train_loss": -9.380426406860352, "global_step": 311623, "epoch": 1854} {"train_loss": -10.463807106018066, "global_step": 311624, "epoch": 1854} {"train_loss": -10.691644668579102, "global_step": 311625, "epoch": 1854} {"train_loss": -10.09895133972168, "global_step": 311626, "epoch": 1854} {"train_loss": -11.608814239501953, "global_step": 311627, "epoch": 1854} {"train_loss": -10.675559997558594, "global_step": 311628, "epoch": 1854} {"train_loss": -11.508932113647461, "global_step": 311629, "epoch": 1854} {"train_loss": -10.716903686523438, "global_step": 311630, "epoch": 1854} {"train_loss": -11.56181526184082, "global_step": 311631, "epoch": 1854} {"train_loss": -10.758907318115234, "global_step": 311632, "epoch": 1854} {"train_loss": -12.018406867980957, "global_step": 311633, "epoch": 1854} {"train_loss": -11.00640869140625, "global_step": 311634, "epoch": 1854} {"train_loss": -11.87508487701416, "global_step": 311635, "epoch": 1854} {"train_loss": -11.166029930114746, "global_step": 311636, "epoch": 1854} {"train_loss": -11.706451416015625, "global_step": 311637, "epoch": 1854} {"train_loss": -11.47804069519043, "global_step": 311638, "epoch": 1854} {"train_loss": -11.598187492007302, "global_step": 311639, "epoch": 1854, "val_loss": 279867.15625} {"train_loss": -10.817750930786133, "global_step": 311640, "epoch": 1855} {"train_loss": -11.662075996398926, "global_step": 311641, "epoch": 1855} {"train_loss": -11.191829681396484, "global_step": 311642, "epoch": 1855} {"train_loss": -11.660905838012695, "global_step": 311643, "epoch": 1855} {"train_loss": -11.600153923034668, "global_step": 311644, "epoch": 1855} {"train_loss": -11.793521881103516, "global_step": 311645, "epoch": 1855} {"train_loss": -11.81828498840332, "global_step": 311646, "epoch": 1855} {"train_loss": -11.96093463897705, "global_step": 311647, "epoch": 1855} {"train_loss": -11.617156982421875, "global_step": 311648, "epoch": 1855} {"train_loss": -11.899234771728516, "global_step": 311649, "epoch": 1855} {"train_loss": -11.738945007324219, "global_step": 311650, "epoch": 1855} {"train_loss": -11.821340560913086, "global_step": 311651, "epoch": 1855} {"train_loss": -11.852374076843262, "global_step": 311652, "epoch": 1855} {"train_loss": -12.074800491333008, "global_step": 311653, "epoch": 1855} {"train_loss": -12.1271333694458, "global_step": 311654, "epoch": 1855} {"train_loss": -11.833847999572754, "global_step": 311655, "epoch": 1855} {"train_loss": -11.949248313903809, "global_step": 311656, "epoch": 1855} {"train_loss": -11.894319534301758, "global_step": 311657, "epoch": 1855} {"train_loss": -12.124131202697754, "global_step": 311658, "epoch": 1855} {"train_loss": -11.94044303894043, "global_step": 311659, "epoch": 1855} {"train_loss": -12.096324920654297, "global_step": 311660, "epoch": 1855} {"train_loss": -12.155618667602539, "global_step": 311661, "epoch": 1855} {"train_loss": -12.064626693725586, "global_step": 311662, "epoch": 1855} {"train_loss": -12.13609504699707, "global_step": 311663, "epoch": 1855} {"train_loss": -12.05627155303955, "global_step": 311664, "epoch": 1855} {"train_loss": -12.24654769897461, "global_step": 311665, "epoch": 1855} {"train_loss": -12.176666259765625, "global_step": 311666, "epoch": 1855} {"train_loss": -12.120532989501953, "global_step": 311667, "epoch": 1855} {"train_loss": -12.345907211303711, "global_step": 311668, "epoch": 1855} {"train_loss": -12.136085510253906, "global_step": 311669, "epoch": 1855} {"train_loss": -12.30075740814209, "global_step": 311670, "epoch": 1855} {"train_loss": -12.006071090698242, "global_step": 311671, "epoch": 1855} {"train_loss": -12.412675857543945, "global_step": 311672, "epoch": 1855} {"train_loss": -12.291701316833496, "global_step": 311673, "epoch": 1855} {"train_loss": -12.142267227172852, "global_step": 311674, "epoch": 1855} {"train_loss": -12.323393821716309, "global_step": 311675, "epoch": 1855} {"train_loss": -12.32225227355957, "global_step": 311676, "epoch": 1855} {"train_loss": -12.441878318786621, "global_step": 311677, "epoch": 1855} {"train_loss": -12.13337516784668, "global_step": 311678, "epoch": 1855} {"train_loss": -12.34631061553955, "global_step": 311679, "epoch": 1855} {"train_loss": -12.078850746154785, "global_step": 311680, "epoch": 1855} {"train_loss": -12.129932403564453, "global_step": 311681, "epoch": 1855} {"train_loss": -12.217122077941895, "global_step": 311682, "epoch": 1855} {"train_loss": -12.184171676635742, "global_step": 311683, "epoch": 1855} {"train_loss": -12.443750381469727, "global_step": 311684, "epoch": 1855} {"train_loss": -12.487444877624512, "global_step": 311685, "epoch": 1855} {"train_loss": -12.156698226928711, "global_step": 311686, "epoch": 1855} {"train_loss": -12.327927589416504, "global_step": 311687, "epoch": 1855} {"train_loss": -12.544443130493164, "global_step": 311688, "epoch": 1855} {"train_loss": -12.4722261428833, "global_step": 311689, "epoch": 1855} {"train_loss": -12.329565048217773, "global_step": 311690, "epoch": 1855} {"train_loss": -12.401834487915039, "global_step": 311691, "epoch": 1855} {"train_loss": -12.377497673034668, "global_step": 311692, "epoch": 1855} {"train_loss": -12.239316940307617, "global_step": 311693, "epoch": 1855} {"train_loss": -12.626142501831055, "global_step": 311694, "epoch": 1855} {"train_loss": -12.293408393859863, "global_step": 311695, "epoch": 1855} {"train_loss": -12.640351295471191, "global_step": 311696, "epoch": 1855} {"train_loss": -12.166833877563477, "global_step": 311697, "epoch": 1855} {"train_loss": -12.398361206054688, "global_step": 311698, "epoch": 1855} {"train_loss": -12.306575775146484, "global_step": 311699, "epoch": 1855} {"train_loss": -12.277183532714844, "global_step": 311700, "epoch": 1855} {"train_loss": -12.646323204040527, "global_step": 311701, "epoch": 1855} {"train_loss": -12.379154205322266, "global_step": 311702, "epoch": 1855} {"train_loss": -12.487059593200684, "global_step": 311703, "epoch": 1855} {"train_loss": -12.353382110595703, "global_step": 311704, "epoch": 1855} {"train_loss": -12.239140510559082, "global_step": 311705, "epoch": 1855} {"train_loss": -12.115362167358398, "global_step": 311706, "epoch": 1855} {"train_loss": -12.447416305541992, "global_step": 311707, "epoch": 1855} {"train_loss": -12.149633407592773, "global_step": 311708, "epoch": 1855} {"train_loss": -12.576417922973633, "global_step": 311709, "epoch": 1855} {"train_loss": -12.213720321655273, "global_step": 311710, "epoch": 1855} {"train_loss": -11.872306823730469, "global_step": 311711, "epoch": 1855} {"train_loss": -11.876627922058105, "global_step": 311712, "epoch": 1855} {"train_loss": -11.347918510437012, "global_step": 311713, "epoch": 1855} {"train_loss": -12.300965309143066, "global_step": 311714, "epoch": 1855} {"train_loss": -11.972504615783691, "global_step": 311715, "epoch": 1855} {"train_loss": -11.951029777526855, "global_step": 311716, "epoch": 1855} {"train_loss": -12.064539909362793, "global_step": 311717, "epoch": 1855} {"train_loss": -11.595233917236328, "global_step": 311718, "epoch": 1855} {"train_loss": -11.729194641113281, "global_step": 311719, "epoch": 1855} {"train_loss": -12.186433792114258, "global_step": 311720, "epoch": 1855} {"train_loss": -10.403319358825684, "global_step": 311721, "epoch": 1855} {"train_loss": -12.111180305480957, "global_step": 311722, "epoch": 1855} {"train_loss": -10.656742095947266, "global_step": 311723, "epoch": 1855} {"train_loss": -11.77374267578125, "global_step": 311724, "epoch": 1855} {"train_loss": -11.676813125610352, "global_step": 311725, "epoch": 1855} {"train_loss": -10.860026359558105, "global_step": 311726, "epoch": 1855} {"train_loss": -11.264222145080566, "global_step": 311727, "epoch": 1855} {"train_loss": -12.05544376373291, "global_step": 311728, "epoch": 1855} {"train_loss": -11.0185546875, "global_step": 311729, "epoch": 1855} {"train_loss": -10.500001907348633, "global_step": 311730, "epoch": 1855} {"train_loss": -11.751167297363281, "global_step": 311731, "epoch": 1855} {"train_loss": -11.305780410766602, "global_step": 311732, "epoch": 1855} {"train_loss": -10.84908390045166, "global_step": 311733, "epoch": 1855} {"train_loss": -11.552197456359863, "global_step": 311734, "epoch": 1855} {"train_loss": -11.544776916503906, "global_step": 311735, "epoch": 1855} {"train_loss": -11.835655212402344, "global_step": 311736, "epoch": 1855} {"train_loss": -11.528680801391602, "global_step": 311737, "epoch": 1855} {"train_loss": -11.77823257446289, "global_step": 311738, "epoch": 1855} {"train_loss": -11.67777156829834, "global_step": 311739, "epoch": 1855} {"train_loss": -11.605802536010742, "global_step": 311740, "epoch": 1855} {"train_loss": -11.996162414550781, "global_step": 311741, "epoch": 1855} {"train_loss": -11.1359224319458, "global_step": 311742, "epoch": 1855} {"train_loss": -11.887272834777832, "global_step": 311743, "epoch": 1855} {"train_loss": -11.249224662780762, "global_step": 311744, "epoch": 1855} {"train_loss": -10.303955078125, "global_step": 311745, "epoch": 1855} {"train_loss": -11.328245162963867, "global_step": 311746, "epoch": 1855} {"train_loss": -10.957554817199707, "global_step": 311747, "epoch": 1855} {"train_loss": -11.672222137451172, "global_step": 311748, "epoch": 1855} {"train_loss": -11.230299949645996, "global_step": 311749, "epoch": 1855} {"train_loss": -11.642622947692871, "global_step": 311750, "epoch": 1855} {"train_loss": -12.124372482299805, "global_step": 311751, "epoch": 1855} {"train_loss": -11.787660598754883, "global_step": 311752, "epoch": 1855} {"train_loss": -11.87813949584961, "global_step": 311753, "epoch": 1855} {"train_loss": -12.010293960571289, "global_step": 311754, "epoch": 1855} {"train_loss": -12.128091812133789, "global_step": 311755, "epoch": 1855} {"train_loss": -11.757481575012207, "global_step": 311756, "epoch": 1855} {"train_loss": -11.969793319702148, "global_step": 311757, "epoch": 1855} {"train_loss": -12.14840316772461, "global_step": 311758, "epoch": 1855} {"train_loss": -12.013467788696289, "global_step": 311759, "epoch": 1855} {"train_loss": -11.949365615844727, "global_step": 311760, "epoch": 1855} {"train_loss": -11.960281372070312, "global_step": 311761, "epoch": 1855} {"train_loss": -12.023092269897461, "global_step": 311762, "epoch": 1855} {"train_loss": -12.13306999206543, "global_step": 311763, "epoch": 1855} {"train_loss": -11.946199417114258, "global_step": 311764, "epoch": 1855} {"train_loss": -12.191815376281738, "global_step": 311765, "epoch": 1855} {"train_loss": -12.276104927062988, "global_step": 311766, "epoch": 1855} {"train_loss": -11.969560623168945, "global_step": 311767, "epoch": 1855} {"train_loss": -12.44825553894043, "global_step": 311768, "epoch": 1855} {"train_loss": -12.05941104888916, "global_step": 311769, "epoch": 1855} {"train_loss": -12.212328910827637, "global_step": 311770, "epoch": 1855} {"train_loss": -12.034523963928223, "global_step": 311771, "epoch": 1855} {"train_loss": -12.018133163452148, "global_step": 311772, "epoch": 1855} {"train_loss": -12.358299255371094, "global_step": 311773, "epoch": 1855} {"train_loss": -12.021854400634766, "global_step": 311774, "epoch": 1855} {"train_loss": -12.16867446899414, "global_step": 311775, "epoch": 1855} {"train_loss": -11.966158866882324, "global_step": 311776, "epoch": 1855} {"train_loss": -12.081365585327148, "global_step": 311777, "epoch": 1855} {"train_loss": -12.229681968688965, "global_step": 311778, "epoch": 1855} {"train_loss": -11.844002723693848, "global_step": 311779, "epoch": 1855} {"train_loss": -12.382728576660156, "global_step": 311780, "epoch": 1855} {"train_loss": -11.796778678894043, "global_step": 311781, "epoch": 1855} {"train_loss": -12.463516235351562, "global_step": 311782, "epoch": 1855} {"train_loss": -12.169794082641602, "global_step": 311783, "epoch": 1855} {"train_loss": -12.263228416442871, "global_step": 311784, "epoch": 1855} {"train_loss": -12.174339294433594, "global_step": 311785, "epoch": 1855} {"train_loss": -12.167524337768555, "global_step": 311786, "epoch": 1855} {"train_loss": -12.276658058166504, "global_step": 311787, "epoch": 1855} {"train_loss": -12.282020568847656, "global_step": 311788, "epoch": 1855} {"train_loss": -12.594003677368164, "global_step": 311789, "epoch": 1855} {"train_loss": -12.394664764404297, "global_step": 311790, "epoch": 1855} {"train_loss": -12.428995132446289, "global_step": 311791, "epoch": 1855} {"train_loss": -12.378087043762207, "global_step": 311792, "epoch": 1855} {"train_loss": -12.36343002319336, "global_step": 311793, "epoch": 1855} {"train_loss": -12.150849342346191, "global_step": 311794, "epoch": 1855} {"train_loss": -12.083664894104004, "global_step": 311795, "epoch": 1855} {"train_loss": -12.465221405029297, "global_step": 311796, "epoch": 1855} {"train_loss": -12.241552352905273, "global_step": 311797, "epoch": 1855} {"train_loss": -12.261194229125977, "global_step": 311798, "epoch": 1855} {"train_loss": -12.478063583374023, "global_step": 311799, "epoch": 1855} {"train_loss": -11.928953170776367, "global_step": 311800, "epoch": 1855} {"train_loss": -12.202877044677734, "global_step": 311801, "epoch": 1855} {"train_loss": -12.282785415649414, "global_step": 311802, "epoch": 1855} {"train_loss": -12.084707260131836, "global_step": 311803, "epoch": 1855} {"train_loss": -12.061605453491211, "global_step": 311804, "epoch": 1855} {"train_loss": -12.133143424987793, "global_step": 311805, "epoch": 1855} {"train_loss": -12.383267402648926, "global_step": 311806, "epoch": 1855} {"train_loss": -11.996456049737477, "global_step": 311807, "epoch": 1855, "val_loss": 282441.0, "train_action_mse_error": 1.5360931158065796} {"train_loss": -12.455016136169434, "global_step": 311808, "epoch": 1856} {"train_loss": -12.40829086303711, "global_step": 311809, "epoch": 1856} {"train_loss": -12.359681129455566, "global_step": 311810, "epoch": 1856} {"train_loss": -12.49221420288086, "global_step": 311811, "epoch": 1856} {"train_loss": -12.12085247039795, "global_step": 311812, "epoch": 1856} {"train_loss": -12.021387100219727, "global_step": 311813, "epoch": 1856} {"train_loss": -12.24526596069336, "global_step": 311814, "epoch": 1856} {"train_loss": -12.222817420959473, "global_step": 311815, "epoch": 1856} {"train_loss": -12.276426315307617, "global_step": 311816, "epoch": 1856} {"train_loss": -12.45285415649414, "global_step": 311817, "epoch": 1856} {"train_loss": -11.977779388427734, "global_step": 311818, "epoch": 1856} {"train_loss": -12.153564453125, "global_step": 311819, "epoch": 1856} {"train_loss": -12.315197944641113, "global_step": 311820, "epoch": 1856} {"train_loss": -12.198248863220215, "global_step": 311821, "epoch": 1856} {"train_loss": -11.641883850097656, "global_step": 311822, "epoch": 1856} {"train_loss": -11.519542694091797, "global_step": 311823, "epoch": 1856} {"train_loss": -11.883268356323242, "global_step": 311824, "epoch": 1856} {"train_loss": -12.171920776367188, "global_step": 311825, "epoch": 1856} {"train_loss": -11.74543285369873, "global_step": 311826, "epoch": 1856} {"train_loss": -12.358135223388672, "global_step": 311827, "epoch": 1856} {"train_loss": -12.034852981567383, "global_step": 311828, "epoch": 1856} {"train_loss": -12.574721336364746, "global_step": 311829, "epoch": 1856} {"train_loss": -12.370577812194824, "global_step": 311830, "epoch": 1856} {"train_loss": -12.079931259155273, "global_step": 311831, "epoch": 1856} {"train_loss": -11.272869110107422, "global_step": 311832, "epoch": 1856} {"train_loss": -11.339740753173828, "global_step": 311833, "epoch": 1856} {"train_loss": -11.514267921447754, "global_step": 311834, "epoch": 1856} {"train_loss": -11.413946151733398, "global_step": 311835, "epoch": 1856} {"train_loss": -12.293769836425781, "global_step": 311836, "epoch": 1856} {"train_loss": -12.516624450683594, "global_step": 311837, "epoch": 1856} {"train_loss": -12.187509536743164, "global_step": 311838, "epoch": 1856} {"train_loss": -11.984088897705078, "global_step": 311839, "epoch": 1856} {"train_loss": -12.20710563659668, "global_step": 311840, "epoch": 1856} {"train_loss": -12.028824806213379, "global_step": 311841, "epoch": 1856} {"train_loss": -12.337175369262695, "global_step": 311842, "epoch": 1856} {"train_loss": -12.3611421585083, "global_step": 311843, "epoch": 1856} {"train_loss": -12.185492515563965, "global_step": 311844, "epoch": 1856} {"train_loss": -12.277722358703613, "global_step": 311845, "epoch": 1856} {"train_loss": -12.402088165283203, "global_step": 311846, "epoch": 1856} {"train_loss": -12.41354751586914, "global_step": 311847, "epoch": 1856} {"train_loss": -12.278839111328125, "global_step": 311848, "epoch": 1856} {"train_loss": -12.22630786895752, "global_step": 311849, "epoch": 1856} {"train_loss": -12.34451675415039, "global_step": 311850, "epoch": 1856} {"train_loss": -12.692344665527344, "global_step": 311851, "epoch": 1856} {"train_loss": -12.526870727539062, "global_step": 311852, "epoch": 1856} {"train_loss": -12.242047309875488, "global_step": 311853, "epoch": 1856} {"train_loss": -12.555303573608398, "global_step": 311854, "epoch": 1856} {"train_loss": -11.776467323303223, "global_step": 311855, "epoch": 1856} {"train_loss": -11.730323791503906, "global_step": 311856, "epoch": 1856} {"train_loss": -12.106807708740234, "global_step": 311857, "epoch": 1856} {"train_loss": -11.555742263793945, "global_step": 311858, "epoch": 1856} {"train_loss": -12.177433013916016, "global_step": 311859, "epoch": 1856} {"train_loss": -11.579834938049316, "global_step": 311860, "epoch": 1856} {"train_loss": -11.770105361938477, "global_step": 311861, "epoch": 1856} {"train_loss": -11.9976167678833, "global_step": 311862, "epoch": 1856} {"train_loss": -11.109824180603027, "global_step": 311863, "epoch": 1856} {"train_loss": -11.501945495605469, "global_step": 311864, "epoch": 1856} {"train_loss": -11.139286041259766, "global_step": 311865, "epoch": 1856} {"train_loss": -9.652544975280762, "global_step": 311866, "epoch": 1856} {"train_loss": -11.309361457824707, "global_step": 311867, "epoch": 1856} {"train_loss": -10.284527778625488, "global_step": 311868, "epoch": 1856} {"train_loss": -9.601593017578125, "global_step": 311869, "epoch": 1856} {"train_loss": -11.857460021972656, "global_step": 311870, "epoch": 1856} {"train_loss": -9.760852813720703, "global_step": 311871, "epoch": 1856} {"train_loss": -11.96072769165039, "global_step": 311872, "epoch": 1856} {"train_loss": -10.735136985778809, "global_step": 311873, "epoch": 1856} {"train_loss": -9.207132339477539, "global_step": 311874, "epoch": 1856} {"train_loss": -9.369991302490234, "global_step": 311875, "epoch": 1856} {"train_loss": -10.988349914550781, "global_step": 311876, "epoch": 1856} {"train_loss": -9.87935733795166, "global_step": 311877, "epoch": 1856} {"train_loss": -9.824518203735352, "global_step": 311878, "epoch": 1856} {"train_loss": -12.041411399841309, "global_step": 311879, "epoch": 1856} {"train_loss": -10.88629150390625, "global_step": 311880, "epoch": 1856} {"train_loss": -10.664194107055664, "global_step": 311881, "epoch": 1856} {"train_loss": -10.77878475189209, "global_step": 311882, "epoch": 1856} {"train_loss": -10.156482696533203, "global_step": 311883, "epoch": 1856} {"train_loss": -10.487350463867188, "global_step": 311884, "epoch": 1856} {"train_loss": -9.421544075012207, "global_step": 311885, "epoch": 1856} {"train_loss": -11.235408782958984, "global_step": 311886, "epoch": 1856} {"train_loss": -9.789219856262207, "global_step": 311887, "epoch": 1856} {"train_loss": -9.495594024658203, "global_step": 311888, "epoch": 1856} {"train_loss": -10.122369766235352, "global_step": 311889, "epoch": 1856} {"train_loss": -11.445840835571289, "global_step": 311890, "epoch": 1856} {"train_loss": -9.409360885620117, "global_step": 311891, "epoch": 1856} {"train_loss": -10.312835693359375, "global_step": 311892, "epoch": 1856} {"train_loss": -11.038150787353516, "global_step": 311893, "epoch": 1856} {"train_loss": -9.498268127441406, "global_step": 311894, "epoch": 1856} {"train_loss": -10.906328201293945, "global_step": 311895, "epoch": 1856} {"train_loss": -10.613079071044922, "global_step": 311896, "epoch": 1856} {"train_loss": -9.203184127807617, "global_step": 311897, "epoch": 1856} {"train_loss": -11.317974090576172, "global_step": 311898, "epoch": 1856} {"train_loss": -11.130884170532227, "global_step": 311899, "epoch": 1856} {"train_loss": -9.933042526245117, "global_step": 311900, "epoch": 1856} {"train_loss": -11.764827728271484, "global_step": 311901, "epoch": 1856} {"train_loss": -10.757722854614258, "global_step": 311902, "epoch": 1856} {"train_loss": -10.997468948364258, "global_step": 311903, "epoch": 1856} {"train_loss": -11.934966087341309, "global_step": 311904, "epoch": 1856} {"train_loss": -11.069082260131836, "global_step": 311905, "epoch": 1856} {"train_loss": -11.606913566589355, "global_step": 311906, "epoch": 1856} {"train_loss": -11.835841178894043, "global_step": 311907, "epoch": 1856} {"train_loss": -11.38270092010498, "global_step": 311908, "epoch": 1856} {"train_loss": -11.748538970947266, "global_step": 311909, "epoch": 1856} {"train_loss": -11.976133346557617, "global_step": 311910, "epoch": 1856} {"train_loss": -11.727724075317383, "global_step": 311911, "epoch": 1856} {"train_loss": -11.959066390991211, "global_step": 311912, "epoch": 1856} {"train_loss": -11.805814743041992, "global_step": 311913, "epoch": 1856} {"train_loss": -12.017885208129883, "global_step": 311914, "epoch": 1856} {"train_loss": -11.826641082763672, "global_step": 311915, "epoch": 1856} {"train_loss": -11.792512893676758, "global_step": 311916, "epoch": 1856} {"train_loss": -11.998249053955078, "global_step": 311917, "epoch": 1856} {"train_loss": -11.688425064086914, "global_step": 311918, "epoch": 1856} {"train_loss": -11.783199310302734, "global_step": 311919, "epoch": 1856} {"train_loss": -12.09110164642334, "global_step": 311920, "epoch": 1856} {"train_loss": -11.656610488891602, "global_step": 311921, "epoch": 1856} {"train_loss": -11.855870246887207, "global_step": 311922, "epoch": 1856} {"train_loss": -12.151041030883789, "global_step": 311923, "epoch": 1856} {"train_loss": -11.697652816772461, "global_step": 311924, "epoch": 1856} {"train_loss": -12.186134338378906, "global_step": 311925, "epoch": 1856} {"train_loss": -11.94261646270752, "global_step": 311926, "epoch": 1856} {"train_loss": -11.969522476196289, "global_step": 311927, "epoch": 1856} {"train_loss": -12.085542678833008, "global_step": 311928, "epoch": 1856} {"train_loss": -12.143847465515137, "global_step": 311929, "epoch": 1856} {"train_loss": -12.096227645874023, "global_step": 311930, "epoch": 1856} {"train_loss": -12.213775634765625, "global_step": 311931, "epoch": 1856} {"train_loss": -12.036751747131348, "global_step": 311932, "epoch": 1856} {"train_loss": -11.931611061096191, "global_step": 311933, "epoch": 1856} {"train_loss": -12.14956283569336, "global_step": 311934, "epoch": 1856} {"train_loss": -12.151243209838867, "global_step": 311935, "epoch": 1856} {"train_loss": -12.045308113098145, "global_step": 311936, "epoch": 1856} {"train_loss": -11.9812650680542, "global_step": 311937, "epoch": 1856} {"train_loss": -11.995072364807129, "global_step": 311938, "epoch": 1856} {"train_loss": -12.159263610839844, "global_step": 311939, "epoch": 1856} {"train_loss": -12.248122215270996, "global_step": 311940, "epoch": 1856} {"train_loss": -12.312137603759766, "global_step": 311941, "epoch": 1856} {"train_loss": -12.129343032836914, "global_step": 311942, "epoch": 1856} {"train_loss": -11.940818786621094, "global_step": 311943, "epoch": 1856} {"train_loss": -12.158988952636719, "global_step": 311944, "epoch": 1856} {"train_loss": -12.242681503295898, "global_step": 311945, "epoch": 1856} {"train_loss": -12.015996932983398, "global_step": 311946, "epoch": 1856} {"train_loss": -12.20692253112793, "global_step": 311947, "epoch": 1856} {"train_loss": -12.253500938415527, "global_step": 311948, "epoch": 1856} {"train_loss": -12.006364822387695, "global_step": 311949, "epoch": 1856} {"train_loss": -12.099740982055664, "global_step": 311950, "epoch": 1856} {"train_loss": -12.25044059753418, "global_step": 311951, "epoch": 1856} {"train_loss": -12.143449783325195, "global_step": 311952, "epoch": 1856} {"train_loss": -12.399045944213867, "global_step": 311953, "epoch": 1856} {"train_loss": -12.368341445922852, "global_step": 311954, "epoch": 1856} {"train_loss": -12.294166564941406, "global_step": 311955, "epoch": 1856} {"train_loss": -12.182619094848633, "global_step": 311956, "epoch": 1856} {"train_loss": -12.01095962524414, "global_step": 311957, "epoch": 1856} {"train_loss": -12.307170867919922, "global_step": 311958, "epoch": 1856} {"train_loss": -12.229949951171875, "global_step": 311959, "epoch": 1856} {"train_loss": -12.367011070251465, "global_step": 311960, "epoch": 1856} {"train_loss": -12.154938697814941, "global_step": 311961, "epoch": 1856} {"train_loss": -12.376691818237305, "global_step": 311962, "epoch": 1856} {"train_loss": -12.273279190063477, "global_step": 311963, "epoch": 1856} {"train_loss": -12.17251968383789, "global_step": 311964, "epoch": 1856} {"train_loss": -12.378799438476562, "global_step": 311965, "epoch": 1856} {"train_loss": -12.115164756774902, "global_step": 311966, "epoch": 1856} {"train_loss": -12.426295280456543, "global_step": 311967, "epoch": 1856} {"train_loss": -12.039762496948242, "global_step": 311968, "epoch": 1856} {"train_loss": -12.491352081298828, "global_step": 311969, "epoch": 1856} {"train_loss": -12.136923789978027, "global_step": 311970, "epoch": 1856} {"train_loss": -12.341097831726074, "global_step": 311971, "epoch": 1856} {"train_loss": -12.133220672607422, "global_step": 311972, "epoch": 1856} {"train_loss": -12.201250076293945, "global_step": 311973, "epoch": 1856} {"train_loss": -12.295215606689453, "global_step": 311974, "epoch": 1856} {"train_loss": -11.705214812642051, "global_step": 311975, "epoch": 1856, "val_loss": 283595.40625} {"train_loss": -12.249622344970703, "global_step": 311976, "epoch": 1857} {"train_loss": -11.818492889404297, "global_step": 311977, "epoch": 1857} {"train_loss": -12.142435073852539, "global_step": 311978, "epoch": 1857} {"train_loss": -12.332779884338379, "global_step": 311979, "epoch": 1857} {"train_loss": -12.469440460205078, "global_step": 311980, "epoch": 1857} {"train_loss": -12.382022857666016, "global_step": 311981, "epoch": 1857} {"train_loss": -12.151527404785156, "global_step": 311982, "epoch": 1857} {"train_loss": -12.117677688598633, "global_step": 311983, "epoch": 1857} {"train_loss": -12.304487228393555, "global_step": 311984, "epoch": 1857} {"train_loss": -12.005514144897461, "global_step": 311985, "epoch": 1857} {"train_loss": -12.117874145507812, "global_step": 311986, "epoch": 1857} {"train_loss": -12.310724258422852, "global_step": 311987, "epoch": 1857} {"train_loss": -11.94588851928711, "global_step": 311988, "epoch": 1857} {"train_loss": -12.179988861083984, "global_step": 311989, "epoch": 1857} {"train_loss": -12.347331047058105, "global_step": 311990, "epoch": 1857} {"train_loss": -12.303230285644531, "global_step": 311991, "epoch": 1857} {"train_loss": -12.281574249267578, "global_step": 311992, "epoch": 1857} {"train_loss": -12.452985763549805, "global_step": 311993, "epoch": 1857} {"train_loss": -12.385648727416992, "global_step": 311994, "epoch": 1857} {"train_loss": -12.427596092224121, "global_step": 311995, "epoch": 1857} {"train_loss": -12.437772750854492, "global_step": 311996, "epoch": 1857} {"train_loss": -12.295134544372559, "global_step": 311997, "epoch": 1857} {"train_loss": -12.482132911682129, "global_step": 311998, "epoch": 1857} {"train_loss": -12.333372116088867, "global_step": 311999, "epoch": 1857} {"train_loss": -12.522439956665039, "global_step": 312000, "epoch": 1857} {"train_loss": -12.490106582641602, "global_step": 312001, "epoch": 1857} {"train_loss": -12.606914520263672, "global_step": 312002, "epoch": 1857} {"train_loss": -12.250772476196289, "global_step": 312003, "epoch": 1857} {"train_loss": -12.54733657836914, "global_step": 312004, "epoch": 1857} {"train_loss": -12.469067573547363, "global_step": 312005, "epoch": 1857} {"train_loss": -12.438013076782227, "global_step": 312006, "epoch": 1857} {"train_loss": -12.405746459960938, "global_step": 312007, "epoch": 1857} {"train_loss": -12.668366432189941, "global_step": 312008, "epoch": 1857} {"train_loss": -12.47592544555664, "global_step": 312009, "epoch": 1857} {"train_loss": -11.957038879394531, "global_step": 312010, "epoch": 1857} {"train_loss": -11.434061050415039, "global_step": 312011, "epoch": 1857} {"train_loss": -11.77060317993164, "global_step": 312012, "epoch": 1857} {"train_loss": -11.738174438476562, "global_step": 312013, "epoch": 1857} {"train_loss": -12.08103084564209, "global_step": 312014, "epoch": 1857} {"train_loss": -12.018421173095703, "global_step": 312015, "epoch": 1857} {"train_loss": -12.13547134399414, "global_step": 312016, "epoch": 1857} {"train_loss": -12.068986892700195, "global_step": 312017, "epoch": 1857} {"train_loss": -11.919073104858398, "global_step": 312018, "epoch": 1857} {"train_loss": -12.459644317626953, "global_step": 312019, "epoch": 1857} {"train_loss": -12.127096176147461, "global_step": 312020, "epoch": 1857} {"train_loss": -11.660877227783203, "global_step": 312021, "epoch": 1857} {"train_loss": -11.726215362548828, "global_step": 312022, "epoch": 1857} {"train_loss": -12.320537567138672, "global_step": 312023, "epoch": 1857} {"train_loss": -12.053674697875977, "global_step": 312024, "epoch": 1857} {"train_loss": -11.119510650634766, "global_step": 312025, "epoch": 1857} {"train_loss": -10.867435455322266, "global_step": 312026, "epoch": 1857} {"train_loss": -11.711594581604004, "global_step": 312027, "epoch": 1857} {"train_loss": -11.773819923400879, "global_step": 312028, "epoch": 1857} {"train_loss": -10.881998062133789, "global_step": 312029, "epoch": 1857} {"train_loss": -11.029138565063477, "global_step": 312030, "epoch": 1857} {"train_loss": -11.51756477355957, "global_step": 312031, "epoch": 1857} {"train_loss": -9.892009735107422, "global_step": 312032, "epoch": 1857} {"train_loss": -11.213085174560547, "global_step": 312033, "epoch": 1857} {"train_loss": -9.097028732299805, "global_step": 312034, "epoch": 1857} {"train_loss": -11.269088745117188, "global_step": 312035, "epoch": 1857} {"train_loss": -9.818878173828125, "global_step": 312036, "epoch": 1857} {"train_loss": -11.099641799926758, "global_step": 312037, "epoch": 1857} {"train_loss": -9.229551315307617, "global_step": 312038, "epoch": 1857} {"train_loss": -9.135528564453125, "global_step": 312039, "epoch": 1857} {"train_loss": -9.97770881652832, "global_step": 312040, "epoch": 1857} {"train_loss": -10.904536247253418, "global_step": 312041, "epoch": 1857} {"train_loss": -9.884265899658203, "global_step": 312042, "epoch": 1857} {"train_loss": -9.554743766784668, "global_step": 312043, "epoch": 1857} {"train_loss": -10.538871765136719, "global_step": 312044, "epoch": 1857} {"train_loss": -8.853941917419434, "global_step": 312045, "epoch": 1857} {"train_loss": -9.570886611938477, "global_step": 312046, "epoch": 1857} {"train_loss": -8.823384284973145, "global_step": 312047, "epoch": 1857} {"train_loss": -9.282413482666016, "global_step": 312048, "epoch": 1857} {"train_loss": -8.857973098754883, "global_step": 312049, "epoch": 1857} {"train_loss": -9.895730972290039, "global_step": 312050, "epoch": 1857} {"train_loss": -9.969137191772461, "global_step": 312051, "epoch": 1857} {"train_loss": -9.291543960571289, "global_step": 312052, "epoch": 1857} {"train_loss": -9.566314697265625, "global_step": 312053, "epoch": 1857} {"train_loss": -10.785053253173828, "global_step": 312054, "epoch": 1857} {"train_loss": -10.352585792541504, "global_step": 312055, "epoch": 1857} {"train_loss": -9.522382736206055, "global_step": 312056, "epoch": 1857} {"train_loss": -10.471582412719727, "global_step": 312057, "epoch": 1857} {"train_loss": -10.779224395751953, "global_step": 312058, "epoch": 1857} {"train_loss": -9.944717407226562, "global_step": 312059, "epoch": 1857} {"train_loss": -11.342631340026855, "global_step": 312060, "epoch": 1857} {"train_loss": -11.030256271362305, "global_step": 312061, "epoch": 1857} {"train_loss": -11.287269592285156, "global_step": 312062, "epoch": 1857} {"train_loss": -11.713354110717773, "global_step": 312063, "epoch": 1857} {"train_loss": -11.193463325500488, "global_step": 312064, "epoch": 1857} {"train_loss": -11.422300338745117, "global_step": 312065, "epoch": 1857} {"train_loss": -11.262672424316406, "global_step": 312066, "epoch": 1857} {"train_loss": -11.365436553955078, "global_step": 312067, "epoch": 1857} {"train_loss": -11.896967887878418, "global_step": 312068, "epoch": 1857} {"train_loss": -11.172239303588867, "global_step": 312069, "epoch": 1857} {"train_loss": -11.656745910644531, "global_step": 312070, "epoch": 1857} {"train_loss": -11.487890243530273, "global_step": 312071, "epoch": 1857} {"train_loss": -11.715624809265137, "global_step": 312072, "epoch": 1857} {"train_loss": -11.470266342163086, "global_step": 312073, "epoch": 1857} {"train_loss": -11.237349510192871, "global_step": 312074, "epoch": 1857} {"train_loss": -11.86968994140625, "global_step": 312075, "epoch": 1857} {"train_loss": -11.360288619995117, "global_step": 312076, "epoch": 1857} {"train_loss": -11.724048614501953, "global_step": 312077, "epoch": 1857} {"train_loss": -11.653629302978516, "global_step": 312078, "epoch": 1857} {"train_loss": -11.34823989868164, "global_step": 312079, "epoch": 1857} {"train_loss": -11.878777503967285, "global_step": 312080, "epoch": 1857} {"train_loss": -11.52250862121582, "global_step": 312081, "epoch": 1857} {"train_loss": -11.685419082641602, "global_step": 312082, "epoch": 1857} {"train_loss": -11.948190689086914, "global_step": 312083, "epoch": 1857} {"train_loss": -11.570834159851074, "global_step": 312084, "epoch": 1857} {"train_loss": -12.052928924560547, "global_step": 312085, "epoch": 1857} {"train_loss": -11.940279960632324, "global_step": 312086, "epoch": 1857} {"train_loss": -11.88515853881836, "global_step": 312087, "epoch": 1857} {"train_loss": -11.91472339630127, "global_step": 312088, "epoch": 1857} {"train_loss": -11.833063125610352, "global_step": 312089, "epoch": 1857} {"train_loss": -11.782797813415527, "global_step": 312090, "epoch": 1857} {"train_loss": -12.068093299865723, "global_step": 312091, "epoch": 1857} {"train_loss": -12.026334762573242, "global_step": 312092, "epoch": 1857} {"train_loss": -12.053805351257324, "global_step": 312093, "epoch": 1857} {"train_loss": -12.070028305053711, "global_step": 312094, "epoch": 1857} {"train_loss": -11.980365753173828, "global_step": 312095, "epoch": 1857} {"train_loss": -12.128995895385742, "global_step": 312096, "epoch": 1857} {"train_loss": -12.185049057006836, "global_step": 312097, "epoch": 1857} {"train_loss": -12.039571762084961, "global_step": 312098, "epoch": 1857} {"train_loss": -12.209602355957031, "global_step": 312099, "epoch": 1857} {"train_loss": -12.113245010375977, "global_step": 312100, "epoch": 1857} {"train_loss": -12.31924819946289, "global_step": 312101, "epoch": 1857} {"train_loss": -12.336196899414062, "global_step": 312102, "epoch": 1857} {"train_loss": -12.11478042602539, "global_step": 312103, "epoch": 1857} {"train_loss": -12.329381942749023, "global_step": 312104, "epoch": 1857} {"train_loss": -12.140804290771484, "global_step": 312105, "epoch": 1857} {"train_loss": -12.355467796325684, "global_step": 312106, "epoch": 1857} {"train_loss": -11.913647651672363, "global_step": 312107, "epoch": 1857} {"train_loss": -12.332548141479492, "global_step": 312108, "epoch": 1857} {"train_loss": -12.062479019165039, "global_step": 312109, "epoch": 1857} {"train_loss": -12.332606315612793, "global_step": 312110, "epoch": 1857} {"train_loss": -12.077719688415527, "global_step": 312111, "epoch": 1857} {"train_loss": -12.264692306518555, "global_step": 312112, "epoch": 1857} {"train_loss": -12.025341987609863, "global_step": 312113, "epoch": 1857} {"train_loss": -11.977579116821289, "global_step": 312114, "epoch": 1857} {"train_loss": -12.204875946044922, "global_step": 312115, "epoch": 1857} {"train_loss": -12.176712036132812, "global_step": 312116, "epoch": 1857} {"train_loss": -12.064214706420898, "global_step": 312117, "epoch": 1857} {"train_loss": -12.232402801513672, "global_step": 312118, "epoch": 1857} {"train_loss": -12.082426071166992, "global_step": 312119, "epoch": 1857} {"train_loss": -12.222759246826172, "global_step": 312120, "epoch": 1857} {"train_loss": -12.081368446350098, "global_step": 312121, "epoch": 1857} {"train_loss": -12.177104949951172, "global_step": 312122, "epoch": 1857} {"train_loss": -12.36867618560791, "global_step": 312123, "epoch": 1857} {"train_loss": -12.168397903442383, "global_step": 312124, "epoch": 1857} {"train_loss": -12.377238273620605, "global_step": 312125, "epoch": 1857} {"train_loss": -12.287454605102539, "global_step": 312126, "epoch": 1857} {"train_loss": -12.51236629486084, "global_step": 312127, "epoch": 1857} {"train_loss": -12.24797248840332, "global_step": 312128, "epoch": 1857} {"train_loss": -12.133613586425781, "global_step": 312129, "epoch": 1857} {"train_loss": -12.327016830444336, "global_step": 312130, "epoch": 1857} {"train_loss": -12.103445053100586, "global_step": 312131, "epoch": 1857} {"train_loss": -12.458220481872559, "global_step": 312132, "epoch": 1857} {"train_loss": -12.07513427734375, "global_step": 312133, "epoch": 1857} {"train_loss": -12.372398376464844, "global_step": 312134, "epoch": 1857} {"train_loss": -12.385021209716797, "global_step": 312135, "epoch": 1857} {"train_loss": -11.945520401000977, "global_step": 312136, "epoch": 1857} {"train_loss": -12.44863510131836, "global_step": 312137, "epoch": 1857} {"train_loss": -12.058469772338867, "global_step": 312138, "epoch": 1857} {"train_loss": -12.219881057739258, "global_step": 312139, "epoch": 1857} {"train_loss": -12.272374153137207, "global_step": 312140, "epoch": 1857} {"train_loss": -12.038679122924805, "global_step": 312141, "epoch": 1857} {"train_loss": -12.17398452758789, "global_step": 312142, "epoch": 1857} {"train_loss": -11.666918493452526, "global_step": 312143, "epoch": 1857, "val_loss": 281769.28125} {"train_loss": -12.104864120483398, "global_step": 312144, "epoch": 1858} {"train_loss": -12.016469955444336, "global_step": 312145, "epoch": 1858} {"train_loss": -12.27328872680664, "global_step": 312146, "epoch": 1858} {"train_loss": -12.239216804504395, "global_step": 312147, "epoch": 1858} {"train_loss": -12.121408462524414, "global_step": 312148, "epoch": 1858} {"train_loss": -12.241913795471191, "global_step": 312149, "epoch": 1858} {"train_loss": -12.434234619140625, "global_step": 312150, "epoch": 1858} {"train_loss": -12.318696975708008, "global_step": 312151, "epoch": 1858} {"train_loss": -11.96487808227539, "global_step": 312152, "epoch": 1858} {"train_loss": -12.421547889709473, "global_step": 312153, "epoch": 1858} {"train_loss": -12.568477630615234, "global_step": 312154, "epoch": 1858} {"train_loss": -12.071259498596191, "global_step": 312155, "epoch": 1858} {"train_loss": -11.592081069946289, "global_step": 312156, "epoch": 1858} {"train_loss": -11.531679153442383, "global_step": 312157, "epoch": 1858} {"train_loss": -12.040919303894043, "global_step": 312158, "epoch": 1858} {"train_loss": -12.237581253051758, "global_step": 312159, "epoch": 1858} {"train_loss": -11.653753280639648, "global_step": 312160, "epoch": 1858} {"train_loss": -12.159370422363281, "global_step": 312161, "epoch": 1858} {"train_loss": -12.250439643859863, "global_step": 312162, "epoch": 1858} {"train_loss": -12.087824821472168, "global_step": 312163, "epoch": 1858} {"train_loss": -11.224992752075195, "global_step": 312164, "epoch": 1858} {"train_loss": -11.939159393310547, "global_step": 312165, "epoch": 1858} {"train_loss": -12.303306579589844, "global_step": 312166, "epoch": 1858} {"train_loss": -11.29987907409668, "global_step": 312167, "epoch": 1858} {"train_loss": -11.659139633178711, "global_step": 312168, "epoch": 1858} {"train_loss": -11.882362365722656, "global_step": 312169, "epoch": 1858} {"train_loss": -11.542509078979492, "global_step": 312170, "epoch": 1858} {"train_loss": -11.855894088745117, "global_step": 312171, "epoch": 1858} {"train_loss": -11.177009582519531, "global_step": 312172, "epoch": 1858} {"train_loss": -10.063151359558105, "global_step": 312173, "epoch": 1858} {"train_loss": -8.014113426208496, "global_step": 312174, "epoch": 1858} {"train_loss": -8.762889862060547, "global_step": 312175, "epoch": 1858} {"train_loss": -9.26456069946289, "global_step": 312176, "epoch": 1858} {"train_loss": -9.167753219604492, "global_step": 312177, "epoch": 1858} {"train_loss": -8.903522491455078, "global_step": 312178, "epoch": 1858} {"train_loss": -9.181039810180664, "global_step": 312179, "epoch": 1858} {"train_loss": -9.5465669631958, "global_step": 312180, "epoch": 1858} {"train_loss": -9.584531784057617, "global_step": 312181, "epoch": 1858} {"train_loss": -9.71665096282959, "global_step": 312182, "epoch": 1858} {"train_loss": -9.65408706665039, "global_step": 312183, "epoch": 1858} {"train_loss": -9.69006633758545, "global_step": 312184, "epoch": 1858} {"train_loss": -9.744731903076172, "global_step": 312185, "epoch": 1858} {"train_loss": -8.40075397491455, "global_step": 312186, "epoch": 1858} {"train_loss": -10.602803230285645, "global_step": 312187, "epoch": 1858} {"train_loss": -9.338075637817383, "global_step": 312188, "epoch": 1858} {"train_loss": -9.951680183410645, "global_step": 312189, "epoch": 1858} {"train_loss": -7.799065113067627, "global_step": 312190, "epoch": 1858} {"train_loss": -9.00281047821045, "global_step": 312191, "epoch": 1858} {"train_loss": -9.184093475341797, "global_step": 312192, "epoch": 1858} {"train_loss": -9.546930313110352, "global_step": 312193, "epoch": 1858} {"train_loss": -10.092700958251953, "global_step": 312194, "epoch": 1858} {"train_loss": -10.79925537109375, "global_step": 312195, "epoch": 1858} {"train_loss": -9.369343757629395, "global_step": 312196, "epoch": 1858} {"train_loss": -11.09423542022705, "global_step": 312197, "epoch": 1858} {"train_loss": -10.077725410461426, "global_step": 312198, "epoch": 1858} {"train_loss": -10.507144927978516, "global_step": 312199, "epoch": 1858} {"train_loss": -9.90676498413086, "global_step": 312200, "epoch": 1858} {"train_loss": -10.745966911315918, "global_step": 312201, "epoch": 1858} {"train_loss": -10.247058868408203, "global_step": 312202, "epoch": 1858} {"train_loss": -10.942195892333984, "global_step": 312203, "epoch": 1858} {"train_loss": -10.890945434570312, "global_step": 312204, "epoch": 1858} {"train_loss": -11.001748085021973, "global_step": 312205, "epoch": 1858} {"train_loss": -11.3710298538208, "global_step": 312206, "epoch": 1858} {"train_loss": -11.483037948608398, "global_step": 312207, "epoch": 1858} {"train_loss": -10.776643753051758, "global_step": 312208, "epoch": 1858} {"train_loss": -11.661325454711914, "global_step": 312209, "epoch": 1858} {"train_loss": -11.19642448425293, "global_step": 312210, "epoch": 1858} {"train_loss": -11.65438175201416, "global_step": 312211, "epoch": 1858} {"train_loss": -11.49289608001709, "global_step": 312212, "epoch": 1858} {"train_loss": -11.490854263305664, "global_step": 312213, "epoch": 1858} {"train_loss": -11.651627540588379, "global_step": 312214, "epoch": 1858} {"train_loss": -11.441393852233887, "global_step": 312215, "epoch": 1858} {"train_loss": -11.743936538696289, "global_step": 312216, "epoch": 1858} {"train_loss": -11.525437355041504, "global_step": 312217, "epoch": 1858} {"train_loss": -11.271001815795898, "global_step": 312218, "epoch": 1858} {"train_loss": -11.258060455322266, "global_step": 312219, "epoch": 1858} {"train_loss": -11.655949592590332, "global_step": 312220, "epoch": 1858} {"train_loss": -11.33088493347168, "global_step": 312221, "epoch": 1858} {"train_loss": -11.756709098815918, "global_step": 312222, "epoch": 1858} {"train_loss": -11.430941581726074, "global_step": 312223, "epoch": 1858} {"train_loss": -11.358210563659668, "global_step": 312224, "epoch": 1858} {"train_loss": -11.896646499633789, "global_step": 312225, "epoch": 1858} {"train_loss": -11.51715087890625, "global_step": 312226, "epoch": 1858} {"train_loss": -11.094894409179688, "global_step": 312227, "epoch": 1858} {"train_loss": -11.938602447509766, "global_step": 312228, "epoch": 1858} {"train_loss": -11.716609001159668, "global_step": 312229, "epoch": 1858} {"train_loss": -11.650772094726562, "global_step": 312230, "epoch": 1858} {"train_loss": -11.719221115112305, "global_step": 312231, "epoch": 1858} {"train_loss": -11.83652400970459, "global_step": 312232, "epoch": 1858} {"train_loss": -11.926620483398438, "global_step": 312233, "epoch": 1858} {"train_loss": -12.109990119934082, "global_step": 312234, "epoch": 1858} {"train_loss": -11.928047180175781, "global_step": 312235, "epoch": 1858} {"train_loss": -11.919279098510742, "global_step": 312236, "epoch": 1858} {"train_loss": -11.880645751953125, "global_step": 312237, "epoch": 1858} {"train_loss": -11.867600440979004, "global_step": 312238, "epoch": 1858} {"train_loss": -12.049615859985352, "global_step": 312239, "epoch": 1858} {"train_loss": -11.942939758300781, "global_step": 312240, "epoch": 1858} {"train_loss": -12.117527961730957, "global_step": 312241, "epoch": 1858} {"train_loss": -12.089879989624023, "global_step": 312242, "epoch": 1858} {"train_loss": -11.934741020202637, "global_step": 312243, "epoch": 1858} {"train_loss": -12.119100570678711, "global_step": 312244, "epoch": 1858} {"train_loss": -12.06233024597168, "global_step": 312245, "epoch": 1858} {"train_loss": -12.170172691345215, "global_step": 312246, "epoch": 1858} {"train_loss": -12.236222267150879, "global_step": 312247, "epoch": 1858} {"train_loss": -12.052204132080078, "global_step": 312248, "epoch": 1858} {"train_loss": -12.171062469482422, "global_step": 312249, "epoch": 1858} {"train_loss": -12.034421920776367, "global_step": 312250, "epoch": 1858} {"train_loss": -11.972677230834961, "global_step": 312251, "epoch": 1858} {"train_loss": -12.204479217529297, "global_step": 312252, "epoch": 1858} {"train_loss": -12.18420696258545, "global_step": 312253, "epoch": 1858} {"train_loss": -12.342812538146973, "global_step": 312254, "epoch": 1858} {"train_loss": -12.272479057312012, "global_step": 312255, "epoch": 1858} {"train_loss": -12.127641677856445, "global_step": 312256, "epoch": 1858} {"train_loss": -12.092090606689453, "global_step": 312257, "epoch": 1858} {"train_loss": -12.142143249511719, "global_step": 312258, "epoch": 1858} {"train_loss": -12.199143409729004, "global_step": 312259, "epoch": 1858} {"train_loss": -12.354389190673828, "global_step": 312260, "epoch": 1858} {"train_loss": -12.297569274902344, "global_step": 312261, "epoch": 1858} {"train_loss": -12.396164894104004, "global_step": 312262, "epoch": 1858} {"train_loss": -12.12771224975586, "global_step": 312263, "epoch": 1858} {"train_loss": -12.102073669433594, "global_step": 312264, "epoch": 1858} {"train_loss": -12.140706062316895, "global_step": 312265, "epoch": 1858} {"train_loss": -12.44945240020752, "global_step": 312266, "epoch": 1858} {"train_loss": -12.10743236541748, "global_step": 312267, "epoch": 1858} {"train_loss": -12.474241256713867, "global_step": 312268, "epoch": 1858} {"train_loss": -12.461645126342773, "global_step": 312269, "epoch": 1858} {"train_loss": -12.43533992767334, "global_step": 312270, "epoch": 1858} {"train_loss": -12.183704376220703, "global_step": 312271, "epoch": 1858} {"train_loss": -12.245731353759766, "global_step": 312272, "epoch": 1858} {"train_loss": -12.25875186920166, "global_step": 312273, "epoch": 1858} {"train_loss": -12.158125877380371, "global_step": 312274, "epoch": 1858} {"train_loss": -11.981413841247559, "global_step": 312275, "epoch": 1858} {"train_loss": -12.296769142150879, "global_step": 312276, "epoch": 1858} {"train_loss": -12.280914306640625, "global_step": 312277, "epoch": 1858} {"train_loss": -12.169071197509766, "global_step": 312278, "epoch": 1858} {"train_loss": -12.335168838500977, "global_step": 312279, "epoch": 1858} {"train_loss": -12.438552856445312, "global_step": 312280, "epoch": 1858} {"train_loss": -12.293359756469727, "global_step": 312281, "epoch": 1858} {"train_loss": -12.007266998291016, "global_step": 312282, "epoch": 1858} {"train_loss": -12.200676918029785, "global_step": 312283, "epoch": 1858} {"train_loss": -12.15805435180664, "global_step": 312284, "epoch": 1858} {"train_loss": -12.478212356567383, "global_step": 312285, "epoch": 1858} {"train_loss": -12.172935485839844, "global_step": 312286, "epoch": 1858} {"train_loss": -12.434699058532715, "global_step": 312287, "epoch": 1858} {"train_loss": -12.480653762817383, "global_step": 312288, "epoch": 1858} {"train_loss": -12.482583045959473, "global_step": 312289, "epoch": 1858} {"train_loss": -12.253669738769531, "global_step": 312290, "epoch": 1858} {"train_loss": -12.32484245300293, "global_step": 312291, "epoch": 1858} {"train_loss": -12.204672813415527, "global_step": 312292, "epoch": 1858} {"train_loss": -12.393865585327148, "global_step": 312293, "epoch": 1858} {"train_loss": -12.16588306427002, "global_step": 312294, "epoch": 1858} {"train_loss": -12.448814392089844, "global_step": 312295, "epoch": 1858} {"train_loss": -12.221330642700195, "global_step": 312296, "epoch": 1858} {"train_loss": -12.224054336547852, "global_step": 312297, "epoch": 1858} {"train_loss": -12.322757720947266, "global_step": 312298, "epoch": 1858} {"train_loss": -12.141153335571289, "global_step": 312299, "epoch": 1858} {"train_loss": -12.378898620605469, "global_step": 312300, "epoch": 1858} {"train_loss": -12.61301326751709, "global_step": 312301, "epoch": 1858} {"train_loss": -12.306479454040527, "global_step": 312302, "epoch": 1858} {"train_loss": -12.44974136352539, "global_step": 312303, "epoch": 1858} {"train_loss": -12.548848152160645, "global_step": 312304, "epoch": 1858} {"train_loss": -12.478038787841797, "global_step": 312305, "epoch": 1858} {"train_loss": -12.559142112731934, "global_step": 312306, "epoch": 1858} {"train_loss": -12.507633209228516, "global_step": 312307, "epoch": 1858} {"train_loss": -12.453786849975586, "global_step": 312308, "epoch": 1858} {"train_loss": -12.533449172973633, "global_step": 312309, "epoch": 1858} {"train_loss": -12.166566848754883, "global_step": 312310, "epoch": 1858} {"train_loss": -11.577048980054402, "global_step": 312311, "epoch": 1858, "val_loss": 285329.34375} {"train_loss": -12.025274276733398, "global_step": 312312, "epoch": 1859} {"train_loss": -11.968938827514648, "global_step": 312313, "epoch": 1859} {"train_loss": -12.043451309204102, "global_step": 312314, "epoch": 1859} {"train_loss": -11.726509094238281, "global_step": 312315, "epoch": 1859} {"train_loss": -11.909246444702148, "global_step": 312316, "epoch": 1859} {"train_loss": -10.911039352416992, "global_step": 312317, "epoch": 1859} {"train_loss": -11.53668212890625, "global_step": 312318, "epoch": 1859} {"train_loss": -10.277095794677734, "global_step": 312319, "epoch": 1859} {"train_loss": -11.346758842468262, "global_step": 312320, "epoch": 1859} {"train_loss": -10.563100814819336, "global_step": 312321, "epoch": 1859} {"train_loss": -10.783184051513672, "global_step": 312322, "epoch": 1859} {"train_loss": -10.863652229309082, "global_step": 312323, "epoch": 1859} {"train_loss": -10.548038482666016, "global_step": 312324, "epoch": 1859} {"train_loss": -11.687673568725586, "global_step": 312325, "epoch": 1859} {"train_loss": -9.953154563903809, "global_step": 312326, "epoch": 1859} {"train_loss": -11.892821311950684, "global_step": 312327, "epoch": 1859} {"train_loss": -11.025649070739746, "global_step": 312328, "epoch": 1859} {"train_loss": -9.235984802246094, "global_step": 312329, "epoch": 1859} {"train_loss": -10.31177043914795, "global_step": 312330, "epoch": 1859} {"train_loss": -8.677570343017578, "global_step": 312331, "epoch": 1859} {"train_loss": -10.489643096923828, "global_step": 312332, "epoch": 1859} {"train_loss": -8.496853828430176, "global_step": 312333, "epoch": 1859} {"train_loss": -9.781291961669922, "global_step": 312334, "epoch": 1859} {"train_loss": -8.796300888061523, "global_step": 312335, "epoch": 1859} {"train_loss": -10.664900779724121, "global_step": 312336, "epoch": 1859} {"train_loss": -9.079959869384766, "global_step": 312337, "epoch": 1859} {"train_loss": -8.720519065856934, "global_step": 312338, "epoch": 1859} {"train_loss": -10.301108360290527, "global_step": 312339, "epoch": 1859} {"train_loss": -9.687980651855469, "global_step": 312340, "epoch": 1859} {"train_loss": -10.808731079101562, "global_step": 312341, "epoch": 1859} {"train_loss": -9.065797805786133, "global_step": 312342, "epoch": 1859} {"train_loss": -10.910585403442383, "global_step": 312343, "epoch": 1859} {"train_loss": -8.737419128417969, "global_step": 312344, "epoch": 1859} {"train_loss": -9.46807861328125, "global_step": 312345, "epoch": 1859} {"train_loss": -9.065771102905273, "global_step": 312346, "epoch": 1859} {"train_loss": -10.085159301757812, "global_step": 312347, "epoch": 1859} {"train_loss": -9.436105728149414, "global_step": 312348, "epoch": 1859} {"train_loss": -9.301076889038086, "global_step": 312349, "epoch": 1859} {"train_loss": -10.39190673828125, "global_step": 312350, "epoch": 1859} {"train_loss": -9.664833068847656, "global_step": 312351, "epoch": 1859} {"train_loss": -10.67808723449707, "global_step": 312352, "epoch": 1859} {"train_loss": -9.789867401123047, "global_step": 312353, "epoch": 1859} {"train_loss": -10.586153030395508, "global_step": 312354, "epoch": 1859} {"train_loss": -10.742009162902832, "global_step": 312355, "epoch": 1859} {"train_loss": -11.45524787902832, "global_step": 312356, "epoch": 1859} {"train_loss": -11.201239585876465, "global_step": 312357, "epoch": 1859} {"train_loss": -11.618379592895508, "global_step": 312358, "epoch": 1859} {"train_loss": -11.040642738342285, "global_step": 312359, "epoch": 1859} {"train_loss": -10.976171493530273, "global_step": 312360, "epoch": 1859} {"train_loss": -11.181111335754395, "global_step": 312361, "epoch": 1859} {"train_loss": -10.985103607177734, "global_step": 312362, "epoch": 1859} {"train_loss": -11.300110816955566, "global_step": 312363, "epoch": 1859} {"train_loss": -11.296884536743164, "global_step": 312364, "epoch": 1859} {"train_loss": -11.136320114135742, "global_step": 312365, "epoch": 1859} {"train_loss": -11.235119819641113, "global_step": 312366, "epoch": 1859} {"train_loss": -11.246418952941895, "global_step": 312367, "epoch": 1859} {"train_loss": -11.592775344848633, "global_step": 312368, "epoch": 1859} {"train_loss": -10.785112380981445, "global_step": 312369, "epoch": 1859} {"train_loss": -11.676889419555664, "global_step": 312370, "epoch": 1859} {"train_loss": -11.094656944274902, "global_step": 312371, "epoch": 1859} {"train_loss": -11.407331466674805, "global_step": 312372, "epoch": 1859} {"train_loss": -11.358957290649414, "global_step": 312373, "epoch": 1859} {"train_loss": -11.468177795410156, "global_step": 312374, "epoch": 1859} {"train_loss": -11.490410804748535, "global_step": 312375, "epoch": 1859} {"train_loss": -11.551283836364746, "global_step": 312376, "epoch": 1859} {"train_loss": -11.575155258178711, "global_step": 312377, "epoch": 1859} {"train_loss": -11.445892333984375, "global_step": 312378, "epoch": 1859} {"train_loss": -11.870878219604492, "global_step": 312379, "epoch": 1859} {"train_loss": -11.64767074584961, "global_step": 312380, "epoch": 1859} {"train_loss": -11.501753807067871, "global_step": 312381, "epoch": 1859} {"train_loss": -11.671972274780273, "global_step": 312382, "epoch": 1859} {"train_loss": -11.512174606323242, "global_step": 312383, "epoch": 1859} {"train_loss": -11.536031723022461, "global_step": 312384, "epoch": 1859} {"train_loss": -11.397720336914062, "global_step": 312385, "epoch": 1859} {"train_loss": -11.812599182128906, "global_step": 312386, "epoch": 1859} {"train_loss": -11.158356666564941, "global_step": 312387, "epoch": 1859} {"train_loss": -11.921332359313965, "global_step": 312388, "epoch": 1859} {"train_loss": -11.797869682312012, "global_step": 312389, "epoch": 1859} {"train_loss": -11.826852798461914, "global_step": 312390, "epoch": 1859} {"train_loss": -11.74928092956543, "global_step": 312391, "epoch": 1859} {"train_loss": -11.951857566833496, "global_step": 312392, "epoch": 1859} {"train_loss": -11.78142261505127, "global_step": 312393, "epoch": 1859} {"train_loss": -11.883620262145996, "global_step": 312394, "epoch": 1859} {"train_loss": -11.666389465332031, "global_step": 312395, "epoch": 1859} {"train_loss": -12.015893936157227, "global_step": 312396, "epoch": 1859} {"train_loss": -12.112935066223145, "global_step": 312397, "epoch": 1859} {"train_loss": -12.07088851928711, "global_step": 312398, "epoch": 1859} {"train_loss": -11.946820259094238, "global_step": 312399, "epoch": 1859} {"train_loss": -11.898022651672363, "global_step": 312400, "epoch": 1859} {"train_loss": -12.02315902709961, "global_step": 312401, "epoch": 1859} {"train_loss": -12.010432243347168, "global_step": 312402, "epoch": 1859} {"train_loss": -12.049905776977539, "global_step": 312403, "epoch": 1859} {"train_loss": -12.057506561279297, "global_step": 312404, "epoch": 1859} {"train_loss": -12.112845420837402, "global_step": 312405, "epoch": 1859} {"train_loss": -11.88386344909668, "global_step": 312406, "epoch": 1859} {"train_loss": -12.233898162841797, "global_step": 312407, "epoch": 1859} {"train_loss": -12.044184684753418, "global_step": 312408, "epoch": 1859} {"train_loss": -12.224143028259277, "global_step": 312409, "epoch": 1859} {"train_loss": -12.185412406921387, "global_step": 312410, "epoch": 1859} {"train_loss": -12.242494583129883, "global_step": 312411, "epoch": 1859} {"train_loss": -12.336121559143066, "global_step": 312412, "epoch": 1859} {"train_loss": -12.271026611328125, "global_step": 312413, "epoch": 1859} {"train_loss": -12.285523414611816, "global_step": 312414, "epoch": 1859} {"train_loss": -12.354703903198242, "global_step": 312415, "epoch": 1859} {"train_loss": -12.292915344238281, "global_step": 312416, "epoch": 1859} {"train_loss": -12.376359939575195, "global_step": 312417, "epoch": 1859} {"train_loss": -12.295717239379883, "global_step": 312418, "epoch": 1859} {"train_loss": -12.286152839660645, "global_step": 312419, "epoch": 1859} {"train_loss": -12.307258605957031, "global_step": 312420, "epoch": 1859} {"train_loss": -12.259592056274414, "global_step": 312421, "epoch": 1859} {"train_loss": -12.361454010009766, "global_step": 312422, "epoch": 1859} {"train_loss": -12.365821838378906, "global_step": 312423, "epoch": 1859} {"train_loss": -12.244277954101562, "global_step": 312424, "epoch": 1859} {"train_loss": -12.408241271972656, "global_step": 312425, "epoch": 1859} {"train_loss": -12.301133155822754, "global_step": 312426, "epoch": 1859} {"train_loss": -12.414546966552734, "global_step": 312427, "epoch": 1859} {"train_loss": -12.35124397277832, "global_step": 312428, "epoch": 1859} {"train_loss": -12.311236381530762, "global_step": 312429, "epoch": 1859} {"train_loss": -12.483878135681152, "global_step": 312430, "epoch": 1859} {"train_loss": -12.373006820678711, "global_step": 312431, "epoch": 1859} {"train_loss": -12.364113807678223, "global_step": 312432, "epoch": 1859} {"train_loss": -12.493499755859375, "global_step": 312433, "epoch": 1859} {"train_loss": -12.44337272644043, "global_step": 312434, "epoch": 1859} {"train_loss": -12.539420127868652, "global_step": 312435, "epoch": 1859} {"train_loss": -12.361411094665527, "global_step": 312436, "epoch": 1859} {"train_loss": -12.51868724822998, "global_step": 312437, "epoch": 1859} {"train_loss": -12.539212226867676, "global_step": 312438, "epoch": 1859} {"train_loss": -12.41519546508789, "global_step": 312439, "epoch": 1859} {"train_loss": -12.371149063110352, "global_step": 312440, "epoch": 1859} {"train_loss": -12.456265449523926, "global_step": 312441, "epoch": 1859} {"train_loss": -12.409599304199219, "global_step": 312442, "epoch": 1859} {"train_loss": -12.665681838989258, "global_step": 312443, "epoch": 1859} {"train_loss": -12.590441703796387, "global_step": 312444, "epoch": 1859} {"train_loss": -12.507638931274414, "global_step": 312445, "epoch": 1859} {"train_loss": -12.448848724365234, "global_step": 312446, "epoch": 1859} {"train_loss": -12.483755111694336, "global_step": 312447, "epoch": 1859} {"train_loss": -12.497356414794922, "global_step": 312448, "epoch": 1859} {"train_loss": -12.527061462402344, "global_step": 312449, "epoch": 1859} {"train_loss": -12.5386323928833, "global_step": 312450, "epoch": 1859} {"train_loss": -12.558353424072266, "global_step": 312451, "epoch": 1859} {"train_loss": -12.567098617553711, "global_step": 312452, "epoch": 1859} {"train_loss": -12.698575973510742, "global_step": 312453, "epoch": 1859} {"train_loss": -12.462114334106445, "global_step": 312454, "epoch": 1859} {"train_loss": -12.4046630859375, "global_step": 312455, "epoch": 1859} {"train_loss": -12.573138236999512, "global_step": 312456, "epoch": 1859} {"train_loss": -12.016680717468262, "global_step": 312457, "epoch": 1859} {"train_loss": -12.483034133911133, "global_step": 312458, "epoch": 1859} {"train_loss": -12.446273803710938, "global_step": 312459, "epoch": 1859} {"train_loss": -12.183420181274414, "global_step": 312460, "epoch": 1859} {"train_loss": -11.904804229736328, "global_step": 312461, "epoch": 1859} {"train_loss": -12.4204740524292, "global_step": 312462, "epoch": 1859} {"train_loss": -12.583221435546875, "global_step": 312463, "epoch": 1859} {"train_loss": -12.352377891540527, "global_step": 312464, "epoch": 1859} {"train_loss": -12.685190200805664, "global_step": 312465, "epoch": 1859} {"train_loss": -12.203117370605469, "global_step": 312466, "epoch": 1859} {"train_loss": -12.556516647338867, "global_step": 312467, "epoch": 1859} {"train_loss": -12.00334358215332, "global_step": 312468, "epoch": 1859} {"train_loss": -12.123075485229492, "global_step": 312469, "epoch": 1859} {"train_loss": -12.201812744140625, "global_step": 312470, "epoch": 1859} {"train_loss": -12.221904754638672, "global_step": 312471, "epoch": 1859} {"train_loss": -12.66438102722168, "global_step": 312472, "epoch": 1859} {"train_loss": -12.222607612609863, "global_step": 312473, "epoch": 1859} {"train_loss": -11.71297836303711, "global_step": 312474, "epoch": 1859} {"train_loss": -12.13725471496582, "global_step": 312475, "epoch": 1859} {"train_loss": -11.279825210571289, "global_step": 312476, "epoch": 1859} {"train_loss": -11.837868690490723, "global_step": 312477, "epoch": 1859} {"train_loss": -12.076030731201172, "global_step": 312478, "epoch": 1859} {"train_loss": -11.57955515384674, "global_step": 312479, "epoch": 1859, "val_loss": 281029.25} {"train_loss": -11.734827041625977, "global_step": 312480, "epoch": 1860} {"train_loss": -11.052677154541016, "global_step": 312481, "epoch": 1860} {"train_loss": -11.470664978027344, "global_step": 312482, "epoch": 1860} {"train_loss": -10.954668998718262, "global_step": 312483, "epoch": 1860} {"train_loss": -12.254955291748047, "global_step": 312484, "epoch": 1860} {"train_loss": -10.864925384521484, "global_step": 312485, "epoch": 1860} {"train_loss": -12.338134765625, "global_step": 312486, "epoch": 1860} {"train_loss": -10.834149360656738, "global_step": 312487, "epoch": 1860} {"train_loss": -11.580333709716797, "global_step": 312488, "epoch": 1860} {"train_loss": -11.065229415893555, "global_step": 312489, "epoch": 1860} {"train_loss": -12.24757194519043, "global_step": 312490, "epoch": 1860} {"train_loss": -11.152419090270996, "global_step": 312491, "epoch": 1860} {"train_loss": -12.030517578125, "global_step": 312492, "epoch": 1860} {"train_loss": -11.658164978027344, "global_step": 312493, "epoch": 1860} {"train_loss": -11.771915435791016, "global_step": 312494, "epoch": 1860} {"train_loss": -11.599864959716797, "global_step": 312495, "epoch": 1860} {"train_loss": -12.195751190185547, "global_step": 312496, "epoch": 1860} {"train_loss": -11.469890594482422, "global_step": 312497, "epoch": 1860} {"train_loss": -12.033449172973633, "global_step": 312498, "epoch": 1860} {"train_loss": -12.090526580810547, "global_step": 312499, "epoch": 1860} {"train_loss": -11.989421844482422, "global_step": 312500, "epoch": 1860} {"train_loss": -12.250188827514648, "global_step": 312501, "epoch": 1860} {"train_loss": -12.13731575012207, "global_step": 312502, "epoch": 1860} {"train_loss": -12.026729583740234, "global_step": 312503, "epoch": 1860} {"train_loss": -11.594861030578613, "global_step": 312504, "epoch": 1860} {"train_loss": -11.772737503051758, "global_step": 312505, "epoch": 1860} {"train_loss": -12.00782299041748, "global_step": 312506, "epoch": 1860} {"train_loss": -11.542503356933594, "global_step": 312507, "epoch": 1860} {"train_loss": -11.611849784851074, "global_step": 312508, "epoch": 1860} {"train_loss": -11.905875205993652, "global_step": 312509, "epoch": 1860} {"train_loss": -10.841707229614258, "global_step": 312510, "epoch": 1860} {"train_loss": -11.315666198730469, "global_step": 312511, "epoch": 1860} {"train_loss": -11.651857376098633, "global_step": 312512, "epoch": 1860} {"train_loss": -11.901063919067383, "global_step": 312513, "epoch": 1860} {"train_loss": -11.979827880859375, "global_step": 312514, "epoch": 1860} {"train_loss": -11.57962417602539, "global_step": 312515, "epoch": 1860} {"train_loss": -10.872116088867188, "global_step": 312516, "epoch": 1860} {"train_loss": -12.01466178894043, "global_step": 312517, "epoch": 1860} {"train_loss": -9.815479278564453, "global_step": 312518, "epoch": 1860} {"train_loss": -10.990409851074219, "global_step": 312519, "epoch": 1860} {"train_loss": -8.800970077514648, "global_step": 312520, "epoch": 1860} {"train_loss": -11.02776050567627, "global_step": 312521, "epoch": 1860} {"train_loss": -11.36658000946045, "global_step": 312522, "epoch": 1860} {"train_loss": -11.047257423400879, "global_step": 312523, "epoch": 1860} {"train_loss": -11.591976165771484, "global_step": 312524, "epoch": 1860} {"train_loss": -10.088594436645508, "global_step": 312525, "epoch": 1860} {"train_loss": -10.323467254638672, "global_step": 312526, "epoch": 1860} {"train_loss": -11.676152229309082, "global_step": 312527, "epoch": 1860} {"train_loss": -11.518617630004883, "global_step": 312528, "epoch": 1860} {"train_loss": -10.96536636352539, "global_step": 312529, "epoch": 1860} {"train_loss": -12.1031494140625, "global_step": 312530, "epoch": 1860} {"train_loss": -11.239166259765625, "global_step": 312531, "epoch": 1860} {"train_loss": -11.226247787475586, "global_step": 312532, "epoch": 1860} {"train_loss": -11.956801414489746, "global_step": 312533, "epoch": 1860} {"train_loss": -11.029210090637207, "global_step": 312534, "epoch": 1860} {"train_loss": -12.009450912475586, "global_step": 312535, "epoch": 1860} {"train_loss": -11.32327651977539, "global_step": 312536, "epoch": 1860} {"train_loss": -11.492094039916992, "global_step": 312537, "epoch": 1860} {"train_loss": -11.6514310836792, "global_step": 312538, "epoch": 1860} {"train_loss": -11.254877090454102, "global_step": 312539, "epoch": 1860} {"train_loss": -11.862709999084473, "global_step": 312540, "epoch": 1860} {"train_loss": -10.920631408691406, "global_step": 312541, "epoch": 1860} {"train_loss": -11.134662628173828, "global_step": 312542, "epoch": 1860} {"train_loss": -11.721206665039062, "global_step": 312543, "epoch": 1860} {"train_loss": -11.445951461791992, "global_step": 312544, "epoch": 1860} {"train_loss": -11.14608383178711, "global_step": 312545, "epoch": 1860} {"train_loss": -11.98639965057373, "global_step": 312546, "epoch": 1860} {"train_loss": -11.310418128967285, "global_step": 312547, "epoch": 1860} {"train_loss": -11.859628677368164, "global_step": 312548, "epoch": 1860} {"train_loss": -11.002930641174316, "global_step": 312549, "epoch": 1860} {"train_loss": -11.39391040802002, "global_step": 312550, "epoch": 1860} {"train_loss": -11.452747344970703, "global_step": 312551, "epoch": 1860} {"train_loss": -11.460074424743652, "global_step": 312552, "epoch": 1860} {"train_loss": -11.28419303894043, "global_step": 312553, "epoch": 1860} {"train_loss": -10.773619651794434, "global_step": 312554, "epoch": 1860} {"train_loss": -11.24222469329834, "global_step": 312555, "epoch": 1860} {"train_loss": -10.638923645019531, "global_step": 312556, "epoch": 1860} {"train_loss": -11.65853214263916, "global_step": 312557, "epoch": 1860} {"train_loss": -9.689798355102539, "global_step": 312558, "epoch": 1860} {"train_loss": -10.275062561035156, "global_step": 312559, "epoch": 1860} {"train_loss": -11.016111373901367, "global_step": 312560, "epoch": 1860} {"train_loss": -10.500362396240234, "global_step": 312561, "epoch": 1860} {"train_loss": -11.406315803527832, "global_step": 312562, "epoch": 1860} {"train_loss": -10.819375038146973, "global_step": 312563, "epoch": 1860} {"train_loss": -10.72083854675293, "global_step": 312564, "epoch": 1860} {"train_loss": -10.943400382995605, "global_step": 312565, "epoch": 1860} {"train_loss": -11.24783992767334, "global_step": 312566, "epoch": 1860} {"train_loss": -11.001836776733398, "global_step": 312567, "epoch": 1860} {"train_loss": -11.899246215820312, "global_step": 312568, "epoch": 1860} {"train_loss": -10.960514068603516, "global_step": 312569, "epoch": 1860} {"train_loss": -11.367544174194336, "global_step": 312570, "epoch": 1860} {"train_loss": -11.348793983459473, "global_step": 312571, "epoch": 1860} {"train_loss": -11.56381607055664, "global_step": 312572, "epoch": 1860} {"train_loss": -11.40791130065918, "global_step": 312573, "epoch": 1860} {"train_loss": -11.907537460327148, "global_step": 312574, "epoch": 1860} {"train_loss": -11.88122272491455, "global_step": 312575, "epoch": 1860} {"train_loss": -11.764923095703125, "global_step": 312576, "epoch": 1860} {"train_loss": -12.074609756469727, "global_step": 312577, "epoch": 1860} {"train_loss": -11.76303482055664, "global_step": 312578, "epoch": 1860} {"train_loss": -12.206483840942383, "global_step": 312579, "epoch": 1860} {"train_loss": -11.90665054321289, "global_step": 312580, "epoch": 1860} {"train_loss": -12.028709411621094, "global_step": 312581, "epoch": 1860} {"train_loss": -11.847355842590332, "global_step": 312582, "epoch": 1860} {"train_loss": -11.882564544677734, "global_step": 312583, "epoch": 1860} {"train_loss": -12.045668601989746, "global_step": 312584, "epoch": 1860} {"train_loss": -12.150721549987793, "global_step": 312585, "epoch": 1860} {"train_loss": -12.310623168945312, "global_step": 312586, "epoch": 1860} {"train_loss": -11.813642501831055, "global_step": 312587, "epoch": 1860} {"train_loss": -11.881832122802734, "global_step": 312588, "epoch": 1860} {"train_loss": -12.083585739135742, "global_step": 312589, "epoch": 1860} {"train_loss": -12.056563377380371, "global_step": 312590, "epoch": 1860} {"train_loss": -12.251401901245117, "global_step": 312591, "epoch": 1860} {"train_loss": -12.316431045532227, "global_step": 312592, "epoch": 1860} {"train_loss": -11.993069648742676, "global_step": 312593, "epoch": 1860} {"train_loss": -12.050618171691895, "global_step": 312594, "epoch": 1860} {"train_loss": -12.283882141113281, "global_step": 312595, "epoch": 1860} {"train_loss": -12.115825653076172, "global_step": 312596, "epoch": 1860} {"train_loss": -12.162691116333008, "global_step": 312597, "epoch": 1860} {"train_loss": -12.161426544189453, "global_step": 312598, "epoch": 1860} {"train_loss": -12.079744338989258, "global_step": 312599, "epoch": 1860} {"train_loss": -12.261499404907227, "global_step": 312600, "epoch": 1860} {"train_loss": -12.148885726928711, "global_step": 312601, "epoch": 1860} {"train_loss": -12.199995040893555, "global_step": 312602, "epoch": 1860} {"train_loss": -12.113183975219727, "global_step": 312603, "epoch": 1860} {"train_loss": -12.09076976776123, "global_step": 312604, "epoch": 1860} {"train_loss": -12.10445785522461, "global_step": 312605, "epoch": 1860} {"train_loss": -12.017078399658203, "global_step": 312606, "epoch": 1860} {"train_loss": -12.384472846984863, "global_step": 312607, "epoch": 1860} {"train_loss": -12.136213302612305, "global_step": 312608, "epoch": 1860} {"train_loss": -12.316511154174805, "global_step": 312609, "epoch": 1860} {"train_loss": -12.451904296875, "global_step": 312610, "epoch": 1860} {"train_loss": -12.21556568145752, "global_step": 312611, "epoch": 1860} {"train_loss": -12.07121753692627, "global_step": 312612, "epoch": 1860} {"train_loss": -12.308467864990234, "global_step": 312613, "epoch": 1860} {"train_loss": -12.230034828186035, "global_step": 312614, "epoch": 1860} {"train_loss": -12.391969680786133, "global_step": 312615, "epoch": 1860} {"train_loss": -12.226579666137695, "global_step": 312616, "epoch": 1860} {"train_loss": -12.409770011901855, "global_step": 312617, "epoch": 1860} {"train_loss": -12.320718765258789, "global_step": 312618, "epoch": 1860} {"train_loss": -11.992524147033691, "global_step": 312619, "epoch": 1860} {"train_loss": -11.965608596801758, "global_step": 312620, "epoch": 1860} {"train_loss": -12.56451416015625, "global_step": 312621, "epoch": 1860} {"train_loss": -12.069557189941406, "global_step": 312622, "epoch": 1860} {"train_loss": -12.39185619354248, "global_step": 312623, "epoch": 1860} {"train_loss": -12.430492401123047, "global_step": 312624, "epoch": 1860} {"train_loss": -12.571697235107422, "global_step": 312625, "epoch": 1860} {"train_loss": -12.449570655822754, "global_step": 312626, "epoch": 1860} {"train_loss": -12.40144157409668, "global_step": 312627, "epoch": 1860} {"train_loss": -12.414082527160645, "global_step": 312628, "epoch": 1860} {"train_loss": -12.528158187866211, "global_step": 312629, "epoch": 1860} {"train_loss": -12.284265518188477, "global_step": 312630, "epoch": 1860} {"train_loss": -12.216804504394531, "global_step": 312631, "epoch": 1860} {"train_loss": -12.338801383972168, "global_step": 312632, "epoch": 1860} {"train_loss": -12.070329666137695, "global_step": 312633, "epoch": 1860} {"train_loss": -12.341228485107422, "global_step": 312634, "epoch": 1860} {"train_loss": -12.25455093383789, "global_step": 312635, "epoch": 1860} {"train_loss": -11.387096405029297, "global_step": 312636, "epoch": 1860} {"train_loss": -11.392717361450195, "global_step": 312637, "epoch": 1860} {"train_loss": -11.686936378479004, "global_step": 312638, "epoch": 1860} {"train_loss": -11.99030876159668, "global_step": 312639, "epoch": 1860} {"train_loss": -10.684335708618164, "global_step": 312640, "epoch": 1860} {"train_loss": -10.312616348266602, "global_step": 312641, "epoch": 1860} {"train_loss": -10.360811233520508, "global_step": 312642, "epoch": 1860} {"train_loss": -10.812649726867676, "global_step": 312643, "epoch": 1860} {"train_loss": -10.496225357055664, "global_step": 312644, "epoch": 1860} {"train_loss": -11.583559036254883, "global_step": 312645, "epoch": 1860} {"train_loss": -9.01558780670166, "global_step": 312646, "epoch": 1860} {"train_loss": -11.632220949445452, "global_step": 312647, "epoch": 1860, "val_loss": 281916.75, "train_action_mse_error": 1.825981855392456} {"train_loss": -7.256026268005371, "global_step": 312648, "epoch": 1861} {"train_loss": -7.804691314697266, "global_step": 312649, "epoch": 1861} {"train_loss": -7.13618278503418, "global_step": 312650, "epoch": 1861} {"train_loss": -7.14716911315918, "global_step": 312651, "epoch": 1861} {"train_loss": -9.022923469543457, "global_step": 312652, "epoch": 1861} {"train_loss": -9.681623458862305, "global_step": 312653, "epoch": 1861} {"train_loss": -8.747323989868164, "global_step": 312654, "epoch": 1861} {"train_loss": -10.890528678894043, "global_step": 312655, "epoch": 1861} {"train_loss": -10.460468292236328, "global_step": 312656, "epoch": 1861} {"train_loss": -10.98420524597168, "global_step": 312657, "epoch": 1861} {"train_loss": -11.061869621276855, "global_step": 312658, "epoch": 1861} {"train_loss": -10.763362884521484, "global_step": 312659, "epoch": 1861} {"train_loss": -10.254440307617188, "global_step": 312660, "epoch": 1861} {"train_loss": -10.520641326904297, "global_step": 312661, "epoch": 1861} {"train_loss": -10.327499389648438, "global_step": 312662, "epoch": 1861} {"train_loss": -10.459210395812988, "global_step": 312663, "epoch": 1861} {"train_loss": -11.036396026611328, "global_step": 312664, "epoch": 1861} {"train_loss": -11.071041107177734, "global_step": 312665, "epoch": 1861} {"train_loss": -11.435529708862305, "global_step": 312666, "epoch": 1861} {"train_loss": -10.570568084716797, "global_step": 312667, "epoch": 1861} {"train_loss": -11.64790153503418, "global_step": 312668, "epoch": 1861} {"train_loss": -11.438057899475098, "global_step": 312669, "epoch": 1861} {"train_loss": -11.313377380371094, "global_step": 312670, "epoch": 1861} {"train_loss": -11.79615306854248, "global_step": 312671, "epoch": 1861} {"train_loss": -11.363754272460938, "global_step": 312672, "epoch": 1861} {"train_loss": -12.014026641845703, "global_step": 312673, "epoch": 1861} {"train_loss": -11.852019309997559, "global_step": 312674, "epoch": 1861} {"train_loss": -11.743022918701172, "global_step": 312675, "epoch": 1861} {"train_loss": -11.90334701538086, "global_step": 312676, "epoch": 1861} {"train_loss": -11.9157133102417, "global_step": 312677, "epoch": 1861} {"train_loss": -11.939835548400879, "global_step": 312678, "epoch": 1861} {"train_loss": -11.827266693115234, "global_step": 312679, "epoch": 1861} {"train_loss": -11.872806549072266, "global_step": 312680, "epoch": 1861} {"train_loss": -11.924507141113281, "global_step": 312681, "epoch": 1861} {"train_loss": -11.94247817993164, "global_step": 312682, "epoch": 1861} {"train_loss": -12.01239013671875, "global_step": 312683, "epoch": 1861} {"train_loss": -12.057506561279297, "global_step": 312684, "epoch": 1861} {"train_loss": -12.032838821411133, "global_step": 312685, "epoch": 1861} {"train_loss": -12.155559539794922, "global_step": 312686, "epoch": 1861} {"train_loss": -11.71532154083252, "global_step": 312687, "epoch": 1861} {"train_loss": -11.829063415527344, "global_step": 312688, "epoch": 1861} {"train_loss": -11.66808795928955, "global_step": 312689, "epoch": 1861} {"train_loss": -12.065011978149414, "global_step": 312690, "epoch": 1861} {"train_loss": -12.147449493408203, "global_step": 312691, "epoch": 1861} {"train_loss": -11.903059959411621, "global_step": 312692, "epoch": 1861} {"train_loss": -12.09054946899414, "global_step": 312693, "epoch": 1861} {"train_loss": -11.952560424804688, "global_step": 312694, "epoch": 1861} {"train_loss": -12.135795593261719, "global_step": 312695, "epoch": 1861} {"train_loss": -12.142454147338867, "global_step": 312696, "epoch": 1861} {"train_loss": -12.262638092041016, "global_step": 312697, "epoch": 1861} {"train_loss": -12.109884262084961, "global_step": 312698, "epoch": 1861} {"train_loss": -12.1500825881958, "global_step": 312699, "epoch": 1861} {"train_loss": -12.249715805053711, "global_step": 312700, "epoch": 1861} {"train_loss": -12.265663146972656, "global_step": 312701, "epoch": 1861} {"train_loss": -11.975177764892578, "global_step": 312702, "epoch": 1861} {"train_loss": -12.198646545410156, "global_step": 312703, "epoch": 1861} {"train_loss": -12.125996589660645, "global_step": 312704, "epoch": 1861} {"train_loss": -12.189245223999023, "global_step": 312705, "epoch": 1861} {"train_loss": -12.038802146911621, "global_step": 312706, "epoch": 1861} {"train_loss": -12.023406982421875, "global_step": 312707, "epoch": 1861} {"train_loss": -11.939342498779297, "global_step": 312708, "epoch": 1861} {"train_loss": -12.178398132324219, "global_step": 312709, "epoch": 1861} {"train_loss": -11.978595733642578, "global_step": 312710, "epoch": 1861} {"train_loss": -12.31291675567627, "global_step": 312711, "epoch": 1861} {"train_loss": -11.990872383117676, "global_step": 312712, "epoch": 1861} {"train_loss": -12.331253051757812, "global_step": 312713, "epoch": 1861} {"train_loss": -12.11632251739502, "global_step": 312714, "epoch": 1861} {"train_loss": -12.136112213134766, "global_step": 312715, "epoch": 1861} {"train_loss": -11.979687690734863, "global_step": 312716, "epoch": 1861} {"train_loss": -12.294198036193848, "global_step": 312717, "epoch": 1861} {"train_loss": -11.9856595993042, "global_step": 312718, "epoch": 1861} {"train_loss": -11.942916870117188, "global_step": 312719, "epoch": 1861} {"train_loss": -12.375823020935059, "global_step": 312720, "epoch": 1861} {"train_loss": -12.080703735351562, "global_step": 312721, "epoch": 1861} {"train_loss": -12.235600471496582, "global_step": 312722, "epoch": 1861} {"train_loss": -12.31507396697998, "global_step": 312723, "epoch": 1861} {"train_loss": -12.17163372039795, "global_step": 312724, "epoch": 1861} {"train_loss": -12.469472885131836, "global_step": 312725, "epoch": 1861} {"train_loss": -12.12283992767334, "global_step": 312726, "epoch": 1861} {"train_loss": -12.060847282409668, "global_step": 312727, "epoch": 1861} {"train_loss": -12.112950325012207, "global_step": 312728, "epoch": 1861} {"train_loss": -12.21351432800293, "global_step": 312729, "epoch": 1861} {"train_loss": -11.815442085266113, "global_step": 312730, "epoch": 1861} {"train_loss": -12.053346633911133, "global_step": 312731, "epoch": 1861} {"train_loss": -12.34075927734375, "global_step": 312732, "epoch": 1861} {"train_loss": -12.05697250366211, "global_step": 312733, "epoch": 1861} {"train_loss": -12.398235321044922, "global_step": 312734, "epoch": 1861} {"train_loss": -12.050390243530273, "global_step": 312735, "epoch": 1861} {"train_loss": -12.018964767456055, "global_step": 312736, "epoch": 1861} {"train_loss": -12.341452598571777, "global_step": 312737, "epoch": 1861} {"train_loss": -12.042281150817871, "global_step": 312738, "epoch": 1861} {"train_loss": -12.323380470275879, "global_step": 312739, "epoch": 1861} {"train_loss": -12.480237007141113, "global_step": 312740, "epoch": 1861} {"train_loss": -12.15118408203125, "global_step": 312741, "epoch": 1861} {"train_loss": -12.434244155883789, "global_step": 312742, "epoch": 1861} {"train_loss": -12.284154891967773, "global_step": 312743, "epoch": 1861} {"train_loss": -12.025205612182617, "global_step": 312744, "epoch": 1861} {"train_loss": -12.358675956726074, "global_step": 312745, "epoch": 1861} {"train_loss": -12.037580490112305, "global_step": 312746, "epoch": 1861} {"train_loss": -11.833108901977539, "global_step": 312747, "epoch": 1861} {"train_loss": -12.235465049743652, "global_step": 312748, "epoch": 1861} {"train_loss": -12.575319290161133, "global_step": 312749, "epoch": 1861} {"train_loss": -12.160173416137695, "global_step": 312750, "epoch": 1861} {"train_loss": -12.234546661376953, "global_step": 312751, "epoch": 1861} {"train_loss": -12.3920259475708, "global_step": 312752, "epoch": 1861} {"train_loss": -12.10623550415039, "global_step": 312753, "epoch": 1861} {"train_loss": -12.276865005493164, "global_step": 312754, "epoch": 1861} {"train_loss": -12.54389762878418, "global_step": 312755, "epoch": 1861} {"train_loss": -12.199712753295898, "global_step": 312756, "epoch": 1861} {"train_loss": -12.18259048461914, "global_step": 312757, "epoch": 1861} {"train_loss": -12.239202499389648, "global_step": 312758, "epoch": 1861} {"train_loss": -12.271554946899414, "global_step": 312759, "epoch": 1861} {"train_loss": -11.970438003540039, "global_step": 312760, "epoch": 1861} {"train_loss": -12.20376968383789, "global_step": 312761, "epoch": 1861} {"train_loss": -12.15597152709961, "global_step": 312762, "epoch": 1861} {"train_loss": -12.016746520996094, "global_step": 312763, "epoch": 1861} {"train_loss": -12.303339004516602, "global_step": 312764, "epoch": 1861} {"train_loss": -12.153746604919434, "global_step": 312765, "epoch": 1861} {"train_loss": -12.185057640075684, "global_step": 312766, "epoch": 1861} {"train_loss": -12.383803367614746, "global_step": 312767, "epoch": 1861} {"train_loss": -12.108909606933594, "global_step": 312768, "epoch": 1861} {"train_loss": -12.4263277053833, "global_step": 312769, "epoch": 1861} {"train_loss": -12.48925495147705, "global_step": 312770, "epoch": 1861} {"train_loss": -12.239006996154785, "global_step": 312771, "epoch": 1861} {"train_loss": -12.390281677246094, "global_step": 312772, "epoch": 1861} {"train_loss": -12.240633010864258, "global_step": 312773, "epoch": 1861} {"train_loss": -12.368473052978516, "global_step": 312774, "epoch": 1861} {"train_loss": -12.363588333129883, "global_step": 312775, "epoch": 1861} {"train_loss": -12.32994556427002, "global_step": 312776, "epoch": 1861} {"train_loss": -12.45467758178711, "global_step": 312777, "epoch": 1861} {"train_loss": -12.172113418579102, "global_step": 312778, "epoch": 1861} {"train_loss": -12.330388069152832, "global_step": 312779, "epoch": 1861} {"train_loss": -12.391178131103516, "global_step": 312780, "epoch": 1861} {"train_loss": -12.587108612060547, "global_step": 312781, "epoch": 1861} {"train_loss": -12.417156219482422, "global_step": 312782, "epoch": 1861} {"train_loss": -12.026599884033203, "global_step": 312783, "epoch": 1861} {"train_loss": -11.453948020935059, "global_step": 312784, "epoch": 1861} {"train_loss": -11.741308212280273, "global_step": 312785, "epoch": 1861} {"train_loss": -11.513704299926758, "global_step": 312786, "epoch": 1861} {"train_loss": -12.539155960083008, "global_step": 312787, "epoch": 1861} {"train_loss": -11.625272750854492, "global_step": 312788, "epoch": 1861} {"train_loss": -10.963533401489258, "global_step": 312789, "epoch": 1861} {"train_loss": -10.833198547363281, "global_step": 312790, "epoch": 1861} {"train_loss": -11.711990356445312, "global_step": 312791, "epoch": 1861} {"train_loss": -12.20891284942627, "global_step": 312792, "epoch": 1861} {"train_loss": -11.756759643554688, "global_step": 312793, "epoch": 1861} {"train_loss": -10.743231773376465, "global_step": 312794, "epoch": 1861} {"train_loss": -11.893855094909668, "global_step": 312795, "epoch": 1861} {"train_loss": -12.070919036865234, "global_step": 312796, "epoch": 1861} {"train_loss": -10.901334762573242, "global_step": 312797, "epoch": 1861} {"train_loss": -11.668115615844727, "global_step": 312798, "epoch": 1861} {"train_loss": -11.769339561462402, "global_step": 312799, "epoch": 1861} {"train_loss": -12.025409698486328, "global_step": 312800, "epoch": 1861} {"train_loss": -11.600652694702148, "global_step": 312801, "epoch": 1861} {"train_loss": -11.041268348693848, "global_step": 312802, "epoch": 1861} {"train_loss": -10.720012664794922, "global_step": 312803, "epoch": 1861} {"train_loss": -10.789981842041016, "global_step": 312804, "epoch": 1861} {"train_loss": -9.32492446899414, "global_step": 312805, "epoch": 1861} {"train_loss": -11.96590805053711, "global_step": 312806, "epoch": 1861} {"train_loss": -9.763456344604492, "global_step": 312807, "epoch": 1861} {"train_loss": -9.04942798614502, "global_step": 312808, "epoch": 1861} {"train_loss": -10.083074569702148, "global_step": 312809, "epoch": 1861} {"train_loss": -10.171152114868164, "global_step": 312810, "epoch": 1861} {"train_loss": -10.856833457946777, "global_step": 312811, "epoch": 1861} {"train_loss": -10.411107063293457, "global_step": 312812, "epoch": 1861} {"train_loss": -9.741065979003906, "global_step": 312813, "epoch": 1861} {"train_loss": -11.017387390136719, "global_step": 312814, "epoch": 1861} {"train_loss": -11.645492672920227, "global_step": 312815, "epoch": 1861, "val_loss": 279330.03125} {"train_loss": -9.618247985839844, "global_step": 312816, "epoch": 1862} {"train_loss": -9.437956809997559, "global_step": 312817, "epoch": 1862} {"train_loss": -10.90680980682373, "global_step": 312818, "epoch": 1862} {"train_loss": -9.446745872497559, "global_step": 312819, "epoch": 1862} {"train_loss": -11.235441207885742, "global_step": 312820, "epoch": 1862} {"train_loss": -9.618993759155273, "global_step": 312821, "epoch": 1862} {"train_loss": -9.18990707397461, "global_step": 312822, "epoch": 1862} {"train_loss": -8.857898712158203, "global_step": 312823, "epoch": 1862} {"train_loss": -9.560233116149902, "global_step": 312824, "epoch": 1862} {"train_loss": -9.291099548339844, "global_step": 312825, "epoch": 1862} {"train_loss": -11.203041076660156, "global_step": 312826, "epoch": 1862} {"train_loss": -11.066903114318848, "global_step": 312827, "epoch": 1862} {"train_loss": -10.827041625976562, "global_step": 312828, "epoch": 1862} {"train_loss": -11.316228866577148, "global_step": 312829, "epoch": 1862} {"train_loss": -11.207511901855469, "global_step": 312830, "epoch": 1862} {"train_loss": -10.321710586547852, "global_step": 312831, "epoch": 1862} {"train_loss": -11.11166000366211, "global_step": 312832, "epoch": 1862} {"train_loss": -10.914411544799805, "global_step": 312833, "epoch": 1862} {"train_loss": -10.67725944519043, "global_step": 312834, "epoch": 1862} {"train_loss": -10.835790634155273, "global_step": 312835, "epoch": 1862} {"train_loss": -11.44823169708252, "global_step": 312836, "epoch": 1862} {"train_loss": -10.901296615600586, "global_step": 312837, "epoch": 1862} {"train_loss": -11.757935523986816, "global_step": 312838, "epoch": 1862} {"train_loss": -11.164682388305664, "global_step": 312839, "epoch": 1862} {"train_loss": -11.775589942932129, "global_step": 312840, "epoch": 1862} {"train_loss": -11.313899040222168, "global_step": 312841, "epoch": 1862} {"train_loss": -11.686563491821289, "global_step": 312842, "epoch": 1862} {"train_loss": -11.421711921691895, "global_step": 312843, "epoch": 1862} {"train_loss": -11.62598705291748, "global_step": 312844, "epoch": 1862} {"train_loss": -11.861307144165039, "global_step": 312845, "epoch": 1862} {"train_loss": -11.742940902709961, "global_step": 312846, "epoch": 1862} {"train_loss": -11.793901443481445, "global_step": 312847, "epoch": 1862} {"train_loss": -11.78831672668457, "global_step": 312848, "epoch": 1862} {"train_loss": -11.537919998168945, "global_step": 312849, "epoch": 1862} {"train_loss": -11.722752571105957, "global_step": 312850, "epoch": 1862} {"train_loss": -11.934603691101074, "global_step": 312851, "epoch": 1862} {"train_loss": -11.356338500976562, "global_step": 312852, "epoch": 1862} {"train_loss": -12.092494010925293, "global_step": 312853, "epoch": 1862} {"train_loss": -11.70030689239502, "global_step": 312854, "epoch": 1862} {"train_loss": -12.010292053222656, "global_step": 312855, "epoch": 1862} {"train_loss": -11.943492889404297, "global_step": 312856, "epoch": 1862} {"train_loss": -11.984258651733398, "global_step": 312857, "epoch": 1862} {"train_loss": -11.949413299560547, "global_step": 312858, "epoch": 1862} {"train_loss": -12.040067672729492, "global_step": 312859, "epoch": 1862} {"train_loss": -12.060420036315918, "global_step": 312860, "epoch": 1862} {"train_loss": -12.100580215454102, "global_step": 312861, "epoch": 1862} {"train_loss": -11.95656681060791, "global_step": 312862, "epoch": 1862} {"train_loss": -12.066080093383789, "global_step": 312863, "epoch": 1862} {"train_loss": -12.135176658630371, "global_step": 312864, "epoch": 1862} {"train_loss": -11.989416122436523, "global_step": 312865, "epoch": 1862} {"train_loss": -12.056787490844727, "global_step": 312866, "epoch": 1862} {"train_loss": -11.97258186340332, "global_step": 312867, "epoch": 1862} {"train_loss": -12.067992210388184, "global_step": 312868, "epoch": 1862} {"train_loss": -12.129341125488281, "global_step": 312869, "epoch": 1862} {"train_loss": -11.89881706237793, "global_step": 312870, "epoch": 1862} {"train_loss": -12.410350799560547, "global_step": 312871, "epoch": 1862} {"train_loss": -12.279518127441406, "global_step": 312872, "epoch": 1862} {"train_loss": -12.110291481018066, "global_step": 312873, "epoch": 1862} {"train_loss": -12.093011856079102, "global_step": 312874, "epoch": 1862} {"train_loss": -12.122137069702148, "global_step": 312875, "epoch": 1862} {"train_loss": -12.188375473022461, "global_step": 312876, "epoch": 1862} {"train_loss": -12.130033493041992, "global_step": 312877, "epoch": 1862} {"train_loss": -12.26626968383789, "global_step": 312878, "epoch": 1862} {"train_loss": -12.196974754333496, "global_step": 312879, "epoch": 1862} {"train_loss": -12.32999324798584, "global_step": 312880, "epoch": 1862} {"train_loss": -12.198803901672363, "global_step": 312881, "epoch": 1862} {"train_loss": -12.346651077270508, "global_step": 312882, "epoch": 1862} {"train_loss": -12.187528610229492, "global_step": 312883, "epoch": 1862} {"train_loss": -12.190957069396973, "global_step": 312884, "epoch": 1862} {"train_loss": -12.262178421020508, "global_step": 312885, "epoch": 1862} {"train_loss": -12.309038162231445, "global_step": 312886, "epoch": 1862} {"train_loss": -12.394264221191406, "global_step": 312887, "epoch": 1862} {"train_loss": -12.525636672973633, "global_step": 312888, "epoch": 1862} {"train_loss": -12.110655784606934, "global_step": 312889, "epoch": 1862} {"train_loss": -12.140915870666504, "global_step": 312890, "epoch": 1862} {"train_loss": -12.434833526611328, "global_step": 312891, "epoch": 1862} {"train_loss": -12.488956451416016, "global_step": 312892, "epoch": 1862} {"train_loss": -12.546982765197754, "global_step": 312893, "epoch": 1862} {"train_loss": -12.100915908813477, "global_step": 312894, "epoch": 1862} {"train_loss": -12.358978271484375, "global_step": 312895, "epoch": 1862} {"train_loss": -12.474462509155273, "global_step": 312896, "epoch": 1862} {"train_loss": -11.955148696899414, "global_step": 312897, "epoch": 1862} {"train_loss": -12.403575897216797, "global_step": 312898, "epoch": 1862} {"train_loss": -12.297561645507812, "global_step": 312899, "epoch": 1862} {"train_loss": -12.444358825683594, "global_step": 312900, "epoch": 1862} {"train_loss": -12.39975357055664, "global_step": 312901, "epoch": 1862} {"train_loss": -12.288944244384766, "global_step": 312902, "epoch": 1862} {"train_loss": -12.171573638916016, "global_step": 312903, "epoch": 1862} {"train_loss": -12.446282386779785, "global_step": 312904, "epoch": 1862} {"train_loss": -12.420191764831543, "global_step": 312905, "epoch": 1862} {"train_loss": -12.398685455322266, "global_step": 312906, "epoch": 1862} {"train_loss": -12.490544319152832, "global_step": 312907, "epoch": 1862} {"train_loss": -12.086641311645508, "global_step": 312908, "epoch": 1862} {"train_loss": -12.402772903442383, "global_step": 312909, "epoch": 1862} {"train_loss": -12.369601249694824, "global_step": 312910, "epoch": 1862} {"train_loss": -12.37717056274414, "global_step": 312911, "epoch": 1862} {"train_loss": -12.475419998168945, "global_step": 312912, "epoch": 1862} {"train_loss": -12.02574634552002, "global_step": 312913, "epoch": 1862} {"train_loss": -12.397933959960938, "global_step": 312914, "epoch": 1862} {"train_loss": -12.498834609985352, "global_step": 312915, "epoch": 1862} {"train_loss": -11.86345100402832, "global_step": 312916, "epoch": 1862} {"train_loss": -11.69143009185791, "global_step": 312917, "epoch": 1862} {"train_loss": -12.353384017944336, "global_step": 312918, "epoch": 1862} {"train_loss": -12.143308639526367, "global_step": 312919, "epoch": 1862} {"train_loss": -12.392943382263184, "global_step": 312920, "epoch": 1862} {"train_loss": -12.609217643737793, "global_step": 312921, "epoch": 1862} {"train_loss": -12.632649421691895, "global_step": 312922, "epoch": 1862} {"train_loss": -12.099472045898438, "global_step": 312923, "epoch": 1862} {"train_loss": -11.950475692749023, "global_step": 312924, "epoch": 1862} {"train_loss": -12.390281677246094, "global_step": 312925, "epoch": 1862} {"train_loss": -12.131200790405273, "global_step": 312926, "epoch": 1862} {"train_loss": -11.770696640014648, "global_step": 312927, "epoch": 1862} {"train_loss": -11.693178176879883, "global_step": 312928, "epoch": 1862} {"train_loss": -12.466352462768555, "global_step": 312929, "epoch": 1862} {"train_loss": -12.155616760253906, "global_step": 312930, "epoch": 1862} {"train_loss": -11.825416564941406, "global_step": 312931, "epoch": 1862} {"train_loss": -12.185992240905762, "global_step": 312932, "epoch": 1862} {"train_loss": -12.430627822875977, "global_step": 312933, "epoch": 1862} {"train_loss": -12.056105613708496, "global_step": 312934, "epoch": 1862} {"train_loss": -12.388751983642578, "global_step": 312935, "epoch": 1862} {"train_loss": -12.539541244506836, "global_step": 312936, "epoch": 1862} {"train_loss": -12.322458267211914, "global_step": 312937, "epoch": 1862} {"train_loss": -12.055869102478027, "global_step": 312938, "epoch": 1862} {"train_loss": -12.299510955810547, "global_step": 312939, "epoch": 1862} {"train_loss": -12.413675308227539, "global_step": 312940, "epoch": 1862} {"train_loss": -12.223556518554688, "global_step": 312941, "epoch": 1862} {"train_loss": -12.195181846618652, "global_step": 312942, "epoch": 1862} {"train_loss": -12.17542839050293, "global_step": 312943, "epoch": 1862} {"train_loss": -12.165056228637695, "global_step": 312944, "epoch": 1862} {"train_loss": -11.96725845336914, "global_step": 312945, "epoch": 1862} {"train_loss": -12.505534172058105, "global_step": 312946, "epoch": 1862} {"train_loss": -11.790359497070312, "global_step": 312947, "epoch": 1862} {"train_loss": -11.426596641540527, "global_step": 312948, "epoch": 1862} {"train_loss": -12.384603500366211, "global_step": 312949, "epoch": 1862} {"train_loss": -12.062567710876465, "global_step": 312950, "epoch": 1862} {"train_loss": -11.120758056640625, "global_step": 312951, "epoch": 1862} {"train_loss": -11.57570743560791, "global_step": 312952, "epoch": 1862} {"train_loss": -11.475202560424805, "global_step": 312953, "epoch": 1862} {"train_loss": -11.809408187866211, "global_step": 312954, "epoch": 1862} {"train_loss": -11.745899200439453, "global_step": 312955, "epoch": 1862} {"train_loss": -11.863855361938477, "global_step": 312956, "epoch": 1862} {"train_loss": -8.828110694885254, "global_step": 312957, "epoch": 1862} {"train_loss": -12.186860084533691, "global_step": 312958, "epoch": 1862} {"train_loss": -9.47874641418457, "global_step": 312959, "epoch": 1862} {"train_loss": -9.878861427307129, "global_step": 312960, "epoch": 1862} {"train_loss": -10.47187614440918, "global_step": 312961, "epoch": 1862} {"train_loss": -9.470046043395996, "global_step": 312962, "epoch": 1862} {"train_loss": -10.668656349182129, "global_step": 312963, "epoch": 1862} {"train_loss": -8.488889694213867, "global_step": 312964, "epoch": 1862} {"train_loss": -8.786023139953613, "global_step": 312965, "epoch": 1862} {"train_loss": -9.453977584838867, "global_step": 312966, "epoch": 1862} {"train_loss": -9.847625732421875, "global_step": 312967, "epoch": 1862} {"train_loss": -9.81857681274414, "global_step": 312968, "epoch": 1862} {"train_loss": -9.164791107177734, "global_step": 312969, "epoch": 1862} {"train_loss": -9.249792098999023, "global_step": 312970, "epoch": 1862} {"train_loss": -9.503719329833984, "global_step": 312971, "epoch": 1862} {"train_loss": -9.27302360534668, "global_step": 312972, "epoch": 1862} {"train_loss": -9.871564865112305, "global_step": 312973, "epoch": 1862} {"train_loss": -10.900790214538574, "global_step": 312974, "epoch": 1862} {"train_loss": -10.747489929199219, "global_step": 312975, "epoch": 1862} {"train_loss": -10.72420883178711, "global_step": 312976, "epoch": 1862} {"train_loss": -10.650012969970703, "global_step": 312977, "epoch": 1862} {"train_loss": -10.772832870483398, "global_step": 312978, "epoch": 1862} {"train_loss": -11.29095458984375, "global_step": 312979, "epoch": 1862} {"train_loss": -10.5250244140625, "global_step": 312980, "epoch": 1862} {"train_loss": -10.951892852783203, "global_step": 312981, "epoch": 1862} {"train_loss": -10.842686653137207, "global_step": 312982, "epoch": 1862} {"train_loss": -11.55716556026822, "global_step": 312983, "epoch": 1862, "val_loss": 278676.71875} {"train_loss": -11.372894287109375, "global_step": 312984, "epoch": 1863} {"train_loss": -11.267457962036133, "global_step": 312985, "epoch": 1863} {"train_loss": -11.588196754455566, "global_step": 312986, "epoch": 1863} {"train_loss": -11.420480728149414, "global_step": 312987, "epoch": 1863} {"train_loss": -11.786921501159668, "global_step": 312988, "epoch": 1863} {"train_loss": -11.816221237182617, "global_step": 312989, "epoch": 1863} {"train_loss": -11.504152297973633, "global_step": 312990, "epoch": 1863} {"train_loss": -11.39753532409668, "global_step": 312991, "epoch": 1863} {"train_loss": -11.653640747070312, "global_step": 312992, "epoch": 1863} {"train_loss": -11.787809371948242, "global_step": 312993, "epoch": 1863} {"train_loss": -11.786130905151367, "global_step": 312994, "epoch": 1863} {"train_loss": -11.758857727050781, "global_step": 312995, "epoch": 1863} {"train_loss": -11.667852401733398, "global_step": 312996, "epoch": 1863} {"train_loss": -11.736806869506836, "global_step": 312997, "epoch": 1863} {"train_loss": -11.825249671936035, "global_step": 312998, "epoch": 1863} {"train_loss": -11.939391136169434, "global_step": 312999, "epoch": 1863} {"train_loss": -11.811084747314453, "global_step": 313000, "epoch": 1863} {"train_loss": -11.73774528503418, "global_step": 313001, "epoch": 1863} {"train_loss": -11.961116790771484, "global_step": 313002, "epoch": 1863} {"train_loss": -12.0210599899292, "global_step": 313003, "epoch": 1863} {"train_loss": -11.87138557434082, "global_step": 313004, "epoch": 1863} {"train_loss": -12.04981803894043, "global_step": 313005, "epoch": 1863} {"train_loss": -11.677638053894043, "global_step": 313006, "epoch": 1863} {"train_loss": -12.146841049194336, "global_step": 313007, "epoch": 1863} {"train_loss": -11.927835464477539, "global_step": 313008, "epoch": 1863} {"train_loss": -11.948004722595215, "global_step": 313009, "epoch": 1863} {"train_loss": -12.144126892089844, "global_step": 313010, "epoch": 1863} {"train_loss": -11.927986145019531, "global_step": 313011, "epoch": 1863} {"train_loss": -11.912071228027344, "global_step": 313012, "epoch": 1863} {"train_loss": -12.072773933410645, "global_step": 313013, "epoch": 1863} {"train_loss": -11.983222961425781, "global_step": 313014, "epoch": 1863} {"train_loss": -12.101511001586914, "global_step": 313015, "epoch": 1863} {"train_loss": -11.86890697479248, "global_step": 313016, "epoch": 1863} {"train_loss": -11.994976043701172, "global_step": 313017, "epoch": 1863} {"train_loss": -11.666655540466309, "global_step": 313018, "epoch": 1863} {"train_loss": -12.109052658081055, "global_step": 313019, "epoch": 1863} {"train_loss": -11.73302936553955, "global_step": 313020, "epoch": 1863} {"train_loss": -12.003517150878906, "global_step": 313021, "epoch": 1863} {"train_loss": -11.952341079711914, "global_step": 313022, "epoch": 1863} {"train_loss": -11.907466888427734, "global_step": 313023, "epoch": 1863} {"train_loss": -11.79587173461914, "global_step": 313024, "epoch": 1863} {"train_loss": -11.939048767089844, "global_step": 313025, "epoch": 1863} {"train_loss": -12.09267807006836, "global_step": 313026, "epoch": 1863} {"train_loss": -11.97282600402832, "global_step": 313027, "epoch": 1863} {"train_loss": -12.081058502197266, "global_step": 313028, "epoch": 1863} {"train_loss": -12.063674926757812, "global_step": 313029, "epoch": 1863} {"train_loss": -11.978212356567383, "global_step": 313030, "epoch": 1863} {"train_loss": -12.233625411987305, "global_step": 313031, "epoch": 1863} {"train_loss": -11.992680549621582, "global_step": 313032, "epoch": 1863} {"train_loss": -11.930730819702148, "global_step": 313033, "epoch": 1863} {"train_loss": -12.265745162963867, "global_step": 313034, "epoch": 1863} {"train_loss": -12.058040618896484, "global_step": 313035, "epoch": 1863} {"train_loss": -12.143688201904297, "global_step": 313036, "epoch": 1863} {"train_loss": -12.140091896057129, "global_step": 313037, "epoch": 1863} {"train_loss": -11.866692543029785, "global_step": 313038, "epoch": 1863} {"train_loss": -12.2841215133667, "global_step": 313039, "epoch": 1863} {"train_loss": -12.032466888427734, "global_step": 313040, "epoch": 1863} {"train_loss": -12.365012168884277, "global_step": 313041, "epoch": 1863} {"train_loss": -11.951461791992188, "global_step": 313042, "epoch": 1863} {"train_loss": -12.136037826538086, "global_step": 313043, "epoch": 1863} {"train_loss": -11.818126678466797, "global_step": 313044, "epoch": 1863} {"train_loss": -12.166461944580078, "global_step": 313045, "epoch": 1863} {"train_loss": -12.117465019226074, "global_step": 313046, "epoch": 1863} {"train_loss": -12.225013732910156, "global_step": 313047, "epoch": 1863} {"train_loss": -12.378623962402344, "global_step": 313048, "epoch": 1863} {"train_loss": -11.946943283081055, "global_step": 313049, "epoch": 1863} {"train_loss": -11.971860885620117, "global_step": 313050, "epoch": 1863} {"train_loss": -12.112945556640625, "global_step": 313051, "epoch": 1863} {"train_loss": -12.500449180603027, "global_step": 313052, "epoch": 1863} {"train_loss": -12.37850570678711, "global_step": 313053, "epoch": 1863} {"train_loss": -12.186188697814941, "global_step": 313054, "epoch": 1863} {"train_loss": -12.321599006652832, "global_step": 313055, "epoch": 1863} {"train_loss": -12.338530540466309, "global_step": 313056, "epoch": 1863} {"train_loss": -12.029569625854492, "global_step": 313057, "epoch": 1863} {"train_loss": -12.15954875946045, "global_step": 313058, "epoch": 1863} {"train_loss": -12.180139541625977, "global_step": 313059, "epoch": 1863} {"train_loss": -12.180240631103516, "global_step": 313060, "epoch": 1863} {"train_loss": -12.446449279785156, "global_step": 313061, "epoch": 1863} {"train_loss": -12.137961387634277, "global_step": 313062, "epoch": 1863} {"train_loss": -11.969442367553711, "global_step": 313063, "epoch": 1863} {"train_loss": -12.113500595092773, "global_step": 313064, "epoch": 1863} {"train_loss": -11.961994171142578, "global_step": 313065, "epoch": 1863} {"train_loss": -11.535072326660156, "global_step": 313066, "epoch": 1863} {"train_loss": -11.892557144165039, "global_step": 313067, "epoch": 1863} {"train_loss": -12.455636978149414, "global_step": 313068, "epoch": 1863} {"train_loss": -12.295819282531738, "global_step": 313069, "epoch": 1863} {"train_loss": -12.05305290222168, "global_step": 313070, "epoch": 1863} {"train_loss": -12.07077407836914, "global_step": 313071, "epoch": 1863} {"train_loss": -12.226593017578125, "global_step": 313072, "epoch": 1863} {"train_loss": -12.166679382324219, "global_step": 313073, "epoch": 1863} {"train_loss": -12.345638275146484, "global_step": 313074, "epoch": 1863} {"train_loss": -12.294612884521484, "global_step": 313075, "epoch": 1863} {"train_loss": -12.32634162902832, "global_step": 313076, "epoch": 1863} {"train_loss": -12.322258949279785, "global_step": 313077, "epoch": 1863} {"train_loss": -11.68086051940918, "global_step": 313078, "epoch": 1863} {"train_loss": -12.321125030517578, "global_step": 313079, "epoch": 1863} {"train_loss": -12.05737018585205, "global_step": 313080, "epoch": 1863} {"train_loss": -12.383461952209473, "global_step": 313081, "epoch": 1863} {"train_loss": -11.79648208618164, "global_step": 313082, "epoch": 1863} {"train_loss": -11.670475959777832, "global_step": 313083, "epoch": 1863} {"train_loss": -11.97961139678955, "global_step": 313084, "epoch": 1863} {"train_loss": -11.447595596313477, "global_step": 313085, "epoch": 1863} {"train_loss": -12.551050186157227, "global_step": 313086, "epoch": 1863} {"train_loss": -11.500832557678223, "global_step": 313087, "epoch": 1863} {"train_loss": -12.094331741333008, "global_step": 313088, "epoch": 1863} {"train_loss": -11.583271026611328, "global_step": 313089, "epoch": 1863} {"train_loss": -12.078948974609375, "global_step": 313090, "epoch": 1863} {"train_loss": -11.795072555541992, "global_step": 313091, "epoch": 1863} {"train_loss": -12.22347640991211, "global_step": 313092, "epoch": 1863} {"train_loss": -12.160238265991211, "global_step": 313093, "epoch": 1863} {"train_loss": -12.177196502685547, "global_step": 313094, "epoch": 1863} {"train_loss": -12.235636711120605, "global_step": 313095, "epoch": 1863} {"train_loss": -11.332826614379883, "global_step": 313096, "epoch": 1863} {"train_loss": -11.659128189086914, "global_step": 313097, "epoch": 1863} {"train_loss": -12.106157302856445, "global_step": 313098, "epoch": 1863} {"train_loss": -10.861665725708008, "global_step": 313099, "epoch": 1863} {"train_loss": -10.939529418945312, "global_step": 313100, "epoch": 1863} {"train_loss": -11.815483093261719, "global_step": 313101, "epoch": 1863} {"train_loss": -11.04145622253418, "global_step": 313102, "epoch": 1863} {"train_loss": -10.378393173217773, "global_step": 313103, "epoch": 1863} {"train_loss": -9.966769218444824, "global_step": 313104, "epoch": 1863} {"train_loss": -11.629497528076172, "global_step": 313105, "epoch": 1863} {"train_loss": -10.412074089050293, "global_step": 313106, "epoch": 1863} {"train_loss": -12.360308647155762, "global_step": 313107, "epoch": 1863} {"train_loss": -11.209123611450195, "global_step": 313108, "epoch": 1863} {"train_loss": -12.276177406311035, "global_step": 313109, "epoch": 1863} {"train_loss": -10.790124893188477, "global_step": 313110, "epoch": 1863} {"train_loss": -11.48301887512207, "global_step": 313111, "epoch": 1863} {"train_loss": -11.214325904846191, "global_step": 313112, "epoch": 1863} {"train_loss": -11.535449981689453, "global_step": 313113, "epoch": 1863} {"train_loss": -10.950691223144531, "global_step": 313114, "epoch": 1863} {"train_loss": -11.71916389465332, "global_step": 313115, "epoch": 1863} {"train_loss": -11.540770530700684, "global_step": 313116, "epoch": 1863} {"train_loss": -11.442778587341309, "global_step": 313117, "epoch": 1863} {"train_loss": -11.958525657653809, "global_step": 313118, "epoch": 1863} {"train_loss": -11.22061824798584, "global_step": 313119, "epoch": 1863} {"train_loss": -11.613262176513672, "global_step": 313120, "epoch": 1863} {"train_loss": -11.55356216430664, "global_step": 313121, "epoch": 1863} {"train_loss": -11.869566917419434, "global_step": 313122, "epoch": 1863} {"train_loss": -11.837495803833008, "global_step": 313123, "epoch": 1863} {"train_loss": -12.020156860351562, "global_step": 313124, "epoch": 1863} {"train_loss": -11.8731689453125, "global_step": 313125, "epoch": 1863} {"train_loss": -11.670198440551758, "global_step": 313126, "epoch": 1863} {"train_loss": -12.104000091552734, "global_step": 313127, "epoch": 1863} {"train_loss": -11.113458633422852, "global_step": 313128, "epoch": 1863} {"train_loss": -12.252250671386719, "global_step": 313129, "epoch": 1863} {"train_loss": -11.440177917480469, "global_step": 313130, "epoch": 1863} {"train_loss": -11.714345932006836, "global_step": 313131, "epoch": 1863} {"train_loss": -12.026100158691406, "global_step": 313132, "epoch": 1863} {"train_loss": -11.741189002990723, "global_step": 313133, "epoch": 1863} {"train_loss": -12.289741516113281, "global_step": 313134, "epoch": 1863} {"train_loss": -11.685428619384766, "global_step": 313135, "epoch": 1863} {"train_loss": -11.13879680633545, "global_step": 313136, "epoch": 1863} {"train_loss": -12.005821228027344, "global_step": 313137, "epoch": 1863} {"train_loss": -10.988662719726562, "global_step": 313138, "epoch": 1863} {"train_loss": -11.755306243896484, "global_step": 313139, "epoch": 1863} {"train_loss": -11.322553634643555, "global_step": 313140, "epoch": 1863} {"train_loss": -11.246920585632324, "global_step": 313141, "epoch": 1863} {"train_loss": -11.509370803833008, "global_step": 313142, "epoch": 1863} {"train_loss": -11.090065002441406, "global_step": 313143, "epoch": 1863} {"train_loss": -11.106584548950195, "global_step": 313144, "epoch": 1863} {"train_loss": -11.907177925109863, "global_step": 313145, "epoch": 1863} {"train_loss": -10.95926570892334, "global_step": 313146, "epoch": 1863} {"train_loss": -12.071573257446289, "global_step": 313147, "epoch": 1863} {"train_loss": -11.60445785522461, "global_step": 313148, "epoch": 1863} {"train_loss": -11.994697570800781, "global_step": 313149, "epoch": 1863} {"train_loss": -12.059823989868164, "global_step": 313150, "epoch": 1863} {"train_loss": -11.838118933496022, "global_step": 313151, "epoch": 1863, "val_loss": 283218.46875} {"train_loss": -12.092142105102539, "global_step": 313152, "epoch": 1864} {"train_loss": -11.775806427001953, "global_step": 313153, "epoch": 1864} {"train_loss": -11.941476821899414, "global_step": 313154, "epoch": 1864} {"train_loss": -11.57922077178955, "global_step": 313155, "epoch": 1864} {"train_loss": -11.555237770080566, "global_step": 313156, "epoch": 1864} {"train_loss": -11.916633605957031, "global_step": 313157, "epoch": 1864} {"train_loss": -11.621295928955078, "global_step": 313158, "epoch": 1864} {"train_loss": -11.97885513305664, "global_step": 313159, "epoch": 1864} {"train_loss": -11.52423095703125, "global_step": 313160, "epoch": 1864} {"train_loss": -11.947839736938477, "global_step": 313161, "epoch": 1864} {"train_loss": -11.637781143188477, "global_step": 313162, "epoch": 1864} {"train_loss": -11.72335147857666, "global_step": 313163, "epoch": 1864} {"train_loss": -11.959760665893555, "global_step": 313164, "epoch": 1864} {"train_loss": -11.936384201049805, "global_step": 313165, "epoch": 1864} {"train_loss": -11.83693790435791, "global_step": 313166, "epoch": 1864} {"train_loss": -11.635337829589844, "global_step": 313167, "epoch": 1864} {"train_loss": -11.460358619689941, "global_step": 313168, "epoch": 1864} {"train_loss": -12.244979858398438, "global_step": 313169, "epoch": 1864} {"train_loss": -11.38095474243164, "global_step": 313170, "epoch": 1864} {"train_loss": -12.103338241577148, "global_step": 313171, "epoch": 1864} {"train_loss": -11.113025665283203, "global_step": 313172, "epoch": 1864} {"train_loss": -12.255451202392578, "global_step": 313173, "epoch": 1864} {"train_loss": -11.584542274475098, "global_step": 313174, "epoch": 1864} {"train_loss": -11.796616554260254, "global_step": 313175, "epoch": 1864} {"train_loss": -11.475240707397461, "global_step": 313176, "epoch": 1864} {"train_loss": -11.804012298583984, "global_step": 313177, "epoch": 1864} {"train_loss": -11.87147045135498, "global_step": 313178, "epoch": 1864} {"train_loss": -11.54755973815918, "global_step": 313179, "epoch": 1864} {"train_loss": -11.975698471069336, "global_step": 313180, "epoch": 1864} {"train_loss": -11.660086631774902, "global_step": 313181, "epoch": 1864} {"train_loss": -12.009727478027344, "global_step": 313182, "epoch": 1864} {"train_loss": -11.648550033569336, "global_step": 313183, "epoch": 1864} {"train_loss": -11.74106502532959, "global_step": 313184, "epoch": 1864} {"train_loss": -11.460512161254883, "global_step": 313185, "epoch": 1864} {"train_loss": -11.900074005126953, "global_step": 313186, "epoch": 1864} {"train_loss": -11.495655059814453, "global_step": 313187, "epoch": 1864} {"train_loss": -12.191768646240234, "global_step": 313188, "epoch": 1864} {"train_loss": -11.921789169311523, "global_step": 313189, "epoch": 1864} {"train_loss": -11.553056716918945, "global_step": 313190, "epoch": 1864} {"train_loss": -12.208778381347656, "global_step": 313191, "epoch": 1864} {"train_loss": -11.71019172668457, "global_step": 313192, "epoch": 1864} {"train_loss": -11.955282211303711, "global_step": 313193, "epoch": 1864} {"train_loss": -12.08745002746582, "global_step": 313194, "epoch": 1864} {"train_loss": -12.092792510986328, "global_step": 313195, "epoch": 1864} {"train_loss": -11.866105079650879, "global_step": 313196, "epoch": 1864} {"train_loss": -11.971267700195312, "global_step": 313197, "epoch": 1864} {"train_loss": -12.254791259765625, "global_step": 313198, "epoch": 1864} {"train_loss": -12.316336631774902, "global_step": 313199, "epoch": 1864} {"train_loss": -12.306647300720215, "global_step": 313200, "epoch": 1864} {"train_loss": -12.05114459991455, "global_step": 313201, "epoch": 1864} {"train_loss": -12.181193351745605, "global_step": 313202, "epoch": 1864} {"train_loss": -11.839034080505371, "global_step": 313203, "epoch": 1864} {"train_loss": -11.90732192993164, "global_step": 313204, "epoch": 1864} {"train_loss": -12.081933975219727, "global_step": 313205, "epoch": 1864} {"train_loss": -12.30427074432373, "global_step": 313206, "epoch": 1864} {"train_loss": -12.004081726074219, "global_step": 313207, "epoch": 1864} {"train_loss": -12.12630844116211, "global_step": 313208, "epoch": 1864} {"train_loss": -11.953099250793457, "global_step": 313209, "epoch": 1864} {"train_loss": -12.114057540893555, "global_step": 313210, "epoch": 1864} {"train_loss": -12.365646362304688, "global_step": 313211, "epoch": 1864} {"train_loss": -12.033231735229492, "global_step": 313212, "epoch": 1864} {"train_loss": -12.129150390625, "global_step": 313213, "epoch": 1864} {"train_loss": -12.09699821472168, "global_step": 313214, "epoch": 1864} {"train_loss": -11.712129592895508, "global_step": 313215, "epoch": 1864} {"train_loss": -12.117809295654297, "global_step": 313216, "epoch": 1864} {"train_loss": -11.309581756591797, "global_step": 313217, "epoch": 1864} {"train_loss": -12.091754913330078, "global_step": 313218, "epoch": 1864} {"train_loss": -10.988685607910156, "global_step": 313219, "epoch": 1864} {"train_loss": -11.647602081298828, "global_step": 313220, "epoch": 1864} {"train_loss": -11.42375373840332, "global_step": 313221, "epoch": 1864} {"train_loss": -11.40201187133789, "global_step": 313222, "epoch": 1864} {"train_loss": -11.292160034179688, "global_step": 313223, "epoch": 1864} {"train_loss": -10.988458633422852, "global_step": 313224, "epoch": 1864} {"train_loss": -11.037503242492676, "global_step": 313225, "epoch": 1864} {"train_loss": -10.471602439880371, "global_step": 313226, "epoch": 1864} {"train_loss": -11.696699142456055, "global_step": 313227, "epoch": 1864} {"train_loss": -11.257650375366211, "global_step": 313228, "epoch": 1864} {"train_loss": -10.00540542602539, "global_step": 313229, "epoch": 1864} {"train_loss": -12.236842155456543, "global_step": 313230, "epoch": 1864} {"train_loss": -10.412178039550781, "global_step": 313231, "epoch": 1864} {"train_loss": -11.905290603637695, "global_step": 313232, "epoch": 1864} {"train_loss": -10.979293823242188, "global_step": 313233, "epoch": 1864} {"train_loss": -11.238531112670898, "global_step": 313234, "epoch": 1864} {"train_loss": -11.023478507995605, "global_step": 313235, "epoch": 1864} {"train_loss": -11.270861625671387, "global_step": 313236, "epoch": 1864} {"train_loss": -11.916159629821777, "global_step": 313237, "epoch": 1864} {"train_loss": -11.593490600585938, "global_step": 313238, "epoch": 1864} {"train_loss": -11.423115730285645, "global_step": 313239, "epoch": 1864} {"train_loss": -11.832027435302734, "global_step": 313240, "epoch": 1864} {"train_loss": -11.456960678100586, "global_step": 313241, "epoch": 1864} {"train_loss": -12.24256420135498, "global_step": 313242, "epoch": 1864} {"train_loss": -11.900198936462402, "global_step": 313243, "epoch": 1864} {"train_loss": -11.801525115966797, "global_step": 313244, "epoch": 1864} {"train_loss": -11.930000305175781, "global_step": 313245, "epoch": 1864} {"train_loss": -11.887358665466309, "global_step": 313246, "epoch": 1864} {"train_loss": -12.201475143432617, "global_step": 313247, "epoch": 1864} {"train_loss": -12.01022720336914, "global_step": 313248, "epoch": 1864} {"train_loss": -12.006603240966797, "global_step": 313249, "epoch": 1864} {"train_loss": -12.133206367492676, "global_step": 313250, "epoch": 1864} {"train_loss": -12.225269317626953, "global_step": 313251, "epoch": 1864} {"train_loss": -11.945396423339844, "global_step": 313252, "epoch": 1864} {"train_loss": -12.155826568603516, "global_step": 313253, "epoch": 1864} {"train_loss": -11.954202651977539, "global_step": 313254, "epoch": 1864} {"train_loss": -12.10694694519043, "global_step": 313255, "epoch": 1864} {"train_loss": -12.250680923461914, "global_step": 313256, "epoch": 1864} {"train_loss": -12.233957290649414, "global_step": 313257, "epoch": 1864} {"train_loss": -12.236091613769531, "global_step": 313258, "epoch": 1864} {"train_loss": -12.451820373535156, "global_step": 313259, "epoch": 1864} {"train_loss": -12.063302040100098, "global_step": 313260, "epoch": 1864} {"train_loss": -12.411691665649414, "global_step": 313261, "epoch": 1864} {"train_loss": -12.308820724487305, "global_step": 313262, "epoch": 1864} {"train_loss": -12.228156089782715, "global_step": 313263, "epoch": 1864} {"train_loss": -12.428184509277344, "global_step": 313264, "epoch": 1864} {"train_loss": -12.350700378417969, "global_step": 313265, "epoch": 1864} {"train_loss": -12.287365913391113, "global_step": 313266, "epoch": 1864} {"train_loss": -12.344419479370117, "global_step": 313267, "epoch": 1864} {"train_loss": -12.025996208190918, "global_step": 313268, "epoch": 1864} {"train_loss": -12.338357925415039, "global_step": 313269, "epoch": 1864} {"train_loss": -11.94986343383789, "global_step": 313270, "epoch": 1864} {"train_loss": -12.310141563415527, "global_step": 313271, "epoch": 1864} {"train_loss": -12.126761436462402, "global_step": 313272, "epoch": 1864} {"train_loss": -12.381977081298828, "global_step": 313273, "epoch": 1864} {"train_loss": -12.380104064941406, "global_step": 313274, "epoch": 1864} {"train_loss": -12.366010665893555, "global_step": 313275, "epoch": 1864} {"train_loss": -12.351455688476562, "global_step": 313276, "epoch": 1864} {"train_loss": -12.365543365478516, "global_step": 313277, "epoch": 1864} {"train_loss": -12.519338607788086, "global_step": 313278, "epoch": 1864} {"train_loss": -12.10822868347168, "global_step": 313279, "epoch": 1864} {"train_loss": -12.300750732421875, "global_step": 313280, "epoch": 1864} {"train_loss": -12.323749542236328, "global_step": 313281, "epoch": 1864} {"train_loss": -12.480887413024902, "global_step": 313282, "epoch": 1864} {"train_loss": -12.343606948852539, "global_step": 313283, "epoch": 1864} {"train_loss": -12.104509353637695, "global_step": 313284, "epoch": 1864} {"train_loss": -12.332910537719727, "global_step": 313285, "epoch": 1864} {"train_loss": -12.341178894042969, "global_step": 313286, "epoch": 1864} {"train_loss": -11.900777816772461, "global_step": 313287, "epoch": 1864} {"train_loss": -11.313638687133789, "global_step": 313288, "epoch": 1864} {"train_loss": -11.828500747680664, "global_step": 313289, "epoch": 1864} {"train_loss": -12.216716766357422, "global_step": 313290, "epoch": 1864} {"train_loss": -11.87147045135498, "global_step": 313291, "epoch": 1864} {"train_loss": -11.645413398742676, "global_step": 313292, "epoch": 1864} {"train_loss": -12.351371765136719, "global_step": 313293, "epoch": 1864} {"train_loss": -11.272721290588379, "global_step": 313294, "epoch": 1864} {"train_loss": -11.025161743164062, "global_step": 313295, "epoch": 1864} {"train_loss": -11.519281387329102, "global_step": 313296, "epoch": 1864} {"train_loss": -12.016687393188477, "global_step": 313297, "epoch": 1864} {"train_loss": -9.534186363220215, "global_step": 313298, "epoch": 1864} {"train_loss": -10.855169296264648, "global_step": 313299, "epoch": 1864} {"train_loss": -10.025050163269043, "global_step": 313300, "epoch": 1864} {"train_loss": -9.08887767791748, "global_step": 313301, "epoch": 1864} {"train_loss": -8.474604606628418, "global_step": 313302, "epoch": 1864} {"train_loss": -9.841056823730469, "global_step": 313303, "epoch": 1864} {"train_loss": -9.590174674987793, "global_step": 313304, "epoch": 1864} {"train_loss": -9.020275115966797, "global_step": 313305, "epoch": 1864} {"train_loss": -9.113308906555176, "global_step": 313306, "epoch": 1864} {"train_loss": -8.417348861694336, "global_step": 313307, "epoch": 1864} {"train_loss": -10.052363395690918, "global_step": 313308, "epoch": 1864} {"train_loss": -10.447633743286133, "global_step": 313309, "epoch": 1864} {"train_loss": -9.970090866088867, "global_step": 313310, "epoch": 1864} {"train_loss": -8.650315284729004, "global_step": 313311, "epoch": 1864} {"train_loss": -9.255082130432129, "global_step": 313312, "epoch": 1864} {"train_loss": -10.582362174987793, "global_step": 313313, "epoch": 1864} {"train_loss": -10.97461223602295, "global_step": 313314, "epoch": 1864} {"train_loss": -9.767662048339844, "global_step": 313315, "epoch": 1864} {"train_loss": -10.665739059448242, "global_step": 313316, "epoch": 1864} {"train_loss": -10.815683364868164, "global_step": 313317, "epoch": 1864} {"train_loss": -10.340707778930664, "global_step": 313318, "epoch": 1864} {"train_loss": -11.605754176775614, "global_step": 313319, "epoch": 1864, "val_loss": 284070.375} {"train_loss": -10.672703742980957, "global_step": 313320, "epoch": 1865} {"train_loss": -9.564733505249023, "global_step": 313321, "epoch": 1865} {"train_loss": -9.971525192260742, "global_step": 313322, "epoch": 1865} {"train_loss": -11.21951675415039, "global_step": 313323, "epoch": 1865} {"train_loss": -9.597394943237305, "global_step": 313324, "epoch": 1865} {"train_loss": -10.020856857299805, "global_step": 313325, "epoch": 1865} {"train_loss": -11.573982238769531, "global_step": 313326, "epoch": 1865} {"train_loss": -10.606548309326172, "global_step": 313327, "epoch": 1865} {"train_loss": -10.963662147521973, "global_step": 313328, "epoch": 1865} {"train_loss": -11.195079803466797, "global_step": 313329, "epoch": 1865} {"train_loss": -10.474576950073242, "global_step": 313330, "epoch": 1865} {"train_loss": -11.227794647216797, "global_step": 313331, "epoch": 1865} {"train_loss": -11.459455490112305, "global_step": 313332, "epoch": 1865} {"train_loss": -10.682782173156738, "global_step": 313333, "epoch": 1865} {"train_loss": -11.45467758178711, "global_step": 313334, "epoch": 1865} {"train_loss": -11.491531372070312, "global_step": 313335, "epoch": 1865} {"train_loss": -10.808971405029297, "global_step": 313336, "epoch": 1865} {"train_loss": -11.524483680725098, "global_step": 313337, "epoch": 1865} {"train_loss": -11.610788345336914, "global_step": 313338, "epoch": 1865} {"train_loss": -11.161792755126953, "global_step": 313339, "epoch": 1865} {"train_loss": -11.52495002746582, "global_step": 313340, "epoch": 1865} {"train_loss": -11.690801620483398, "global_step": 313341, "epoch": 1865} {"train_loss": -11.192939758300781, "global_step": 313342, "epoch": 1865} {"train_loss": -11.828786849975586, "global_step": 313343, "epoch": 1865} {"train_loss": -11.831164360046387, "global_step": 313344, "epoch": 1865} {"train_loss": -11.823799133300781, "global_step": 313345, "epoch": 1865} {"train_loss": -11.668529510498047, "global_step": 313346, "epoch": 1865} {"train_loss": -11.471396446228027, "global_step": 313347, "epoch": 1865} {"train_loss": -11.647083282470703, "global_step": 313348, "epoch": 1865} {"train_loss": -11.769347190856934, "global_step": 313349, "epoch": 1865} {"train_loss": -11.82850456237793, "global_step": 313350, "epoch": 1865} {"train_loss": -11.823812484741211, "global_step": 313351, "epoch": 1865} {"train_loss": -11.817955017089844, "global_step": 313352, "epoch": 1865} {"train_loss": -11.871990203857422, "global_step": 313353, "epoch": 1865} {"train_loss": -11.874292373657227, "global_step": 313354, "epoch": 1865} {"train_loss": -11.976278305053711, "global_step": 313355, "epoch": 1865} {"train_loss": -12.075836181640625, "global_step": 313356, "epoch": 1865} {"train_loss": -11.793131828308105, "global_step": 313357, "epoch": 1865} {"train_loss": -11.756172180175781, "global_step": 313358, "epoch": 1865} {"train_loss": -11.872188568115234, "global_step": 313359, "epoch": 1865} {"train_loss": -12.109795570373535, "global_step": 313360, "epoch": 1865} {"train_loss": -12.110881805419922, "global_step": 313361, "epoch": 1865} {"train_loss": -11.95417594909668, "global_step": 313362, "epoch": 1865} {"train_loss": -11.967061996459961, "global_step": 313363, "epoch": 1865} {"train_loss": -11.882001876831055, "global_step": 313364, "epoch": 1865} {"train_loss": -12.007147789001465, "global_step": 313365, "epoch": 1865} {"train_loss": -12.114750862121582, "global_step": 313366, "epoch": 1865} {"train_loss": -12.157953262329102, "global_step": 313367, "epoch": 1865} {"train_loss": -12.127725601196289, "global_step": 313368, "epoch": 1865} {"train_loss": -12.230721473693848, "global_step": 313369, "epoch": 1865} {"train_loss": -12.184368133544922, "global_step": 313370, "epoch": 1865} {"train_loss": -12.301586151123047, "global_step": 313371, "epoch": 1865} {"train_loss": -12.07127571105957, "global_step": 313372, "epoch": 1865} {"train_loss": -12.032327651977539, "global_step": 313373, "epoch": 1865} {"train_loss": -12.373823165893555, "global_step": 313374, "epoch": 1865} {"train_loss": -12.273580551147461, "global_step": 313375, "epoch": 1865} {"train_loss": -12.178573608398438, "global_step": 313376, "epoch": 1865} {"train_loss": -12.145390510559082, "global_step": 313377, "epoch": 1865} {"train_loss": -12.308725357055664, "global_step": 313378, "epoch": 1865} {"train_loss": -12.415922164916992, "global_step": 313379, "epoch": 1865} {"train_loss": -12.210447311401367, "global_step": 313380, "epoch": 1865} {"train_loss": -12.47842025756836, "global_step": 313381, "epoch": 1865} {"train_loss": -12.237323760986328, "global_step": 313382, "epoch": 1865} {"train_loss": -12.279748916625977, "global_step": 313383, "epoch": 1865} {"train_loss": -12.403913497924805, "global_step": 313384, "epoch": 1865} {"train_loss": -12.231941223144531, "global_step": 313385, "epoch": 1865} {"train_loss": -12.453903198242188, "global_step": 313386, "epoch": 1865} {"train_loss": -12.151603698730469, "global_step": 313387, "epoch": 1865} {"train_loss": -12.411405563354492, "global_step": 313388, "epoch": 1865} {"train_loss": -12.359187126159668, "global_step": 313389, "epoch": 1865} {"train_loss": -12.499421119689941, "global_step": 313390, "epoch": 1865} {"train_loss": -12.577692985534668, "global_step": 313391, "epoch": 1865} {"train_loss": -12.34609603881836, "global_step": 313392, "epoch": 1865} {"train_loss": -12.526984214782715, "global_step": 313393, "epoch": 1865} {"train_loss": -12.169475555419922, "global_step": 313394, "epoch": 1865} {"train_loss": -12.33189582824707, "global_step": 313395, "epoch": 1865} {"train_loss": -12.54025650024414, "global_step": 313396, "epoch": 1865} {"train_loss": -12.36608600616455, "global_step": 313397, "epoch": 1865} {"train_loss": -12.355440139770508, "global_step": 313398, "epoch": 1865} {"train_loss": -12.423421859741211, "global_step": 313399, "epoch": 1865} {"train_loss": -12.530386924743652, "global_step": 313400, "epoch": 1865} {"train_loss": -12.457672119140625, "global_step": 313401, "epoch": 1865} {"train_loss": -12.280771255493164, "global_step": 313402, "epoch": 1865} {"train_loss": -12.244426727294922, "global_step": 313403, "epoch": 1865} {"train_loss": -12.174448013305664, "global_step": 313404, "epoch": 1865} {"train_loss": -12.509525299072266, "global_step": 313405, "epoch": 1865} {"train_loss": -12.466330528259277, "global_step": 313406, "epoch": 1865} {"train_loss": -12.489845275878906, "global_step": 313407, "epoch": 1865} {"train_loss": -12.348413467407227, "global_step": 313408, "epoch": 1865} {"train_loss": -12.58788013458252, "global_step": 313409, "epoch": 1865} {"train_loss": -12.649826049804688, "global_step": 313410, "epoch": 1865} {"train_loss": -12.506631851196289, "global_step": 313411, "epoch": 1865} {"train_loss": -12.671625137329102, "global_step": 313412, "epoch": 1865} {"train_loss": -12.337757110595703, "global_step": 313413, "epoch": 1865} {"train_loss": -12.656499862670898, "global_step": 313414, "epoch": 1865} {"train_loss": -12.319509506225586, "global_step": 313415, "epoch": 1865} {"train_loss": -12.369047164916992, "global_step": 313416, "epoch": 1865} {"train_loss": -12.603938102722168, "global_step": 313417, "epoch": 1865} {"train_loss": -12.324874877929688, "global_step": 313418, "epoch": 1865} {"train_loss": -12.557449340820312, "global_step": 313419, "epoch": 1865} {"train_loss": -12.356168746948242, "global_step": 313420, "epoch": 1865} {"train_loss": -12.050921440124512, "global_step": 313421, "epoch": 1865} {"train_loss": -11.863978385925293, "global_step": 313422, "epoch": 1865} {"train_loss": -12.62391185760498, "global_step": 313423, "epoch": 1865} {"train_loss": -12.508041381835938, "global_step": 313424, "epoch": 1865} {"train_loss": -12.320204734802246, "global_step": 313425, "epoch": 1865} {"train_loss": -12.435916900634766, "global_step": 313426, "epoch": 1865} {"train_loss": -12.679338455200195, "global_step": 313427, "epoch": 1865} {"train_loss": -12.611756324768066, "global_step": 313428, "epoch": 1865} {"train_loss": -12.541571617126465, "global_step": 313429, "epoch": 1865} {"train_loss": -12.655560493469238, "global_step": 313430, "epoch": 1865} {"train_loss": -12.554105758666992, "global_step": 313431, "epoch": 1865} {"train_loss": -12.543224334716797, "global_step": 313432, "epoch": 1865} {"train_loss": -12.592155456542969, "global_step": 313433, "epoch": 1865} {"train_loss": -12.638683319091797, "global_step": 313434, "epoch": 1865} {"train_loss": -12.672988891601562, "global_step": 313435, "epoch": 1865} {"train_loss": -12.802244186401367, "global_step": 313436, "epoch": 1865} {"train_loss": -12.770781517028809, "global_step": 313437, "epoch": 1865} {"train_loss": -12.648375511169434, "global_step": 313438, "epoch": 1865} {"train_loss": -12.68701171875, "global_step": 313439, "epoch": 1865} {"train_loss": -12.600090980529785, "global_step": 313440, "epoch": 1865} {"train_loss": -12.62349796295166, "global_step": 313441, "epoch": 1865} {"train_loss": -12.010889053344727, "global_step": 313442, "epoch": 1865} {"train_loss": -12.228590965270996, "global_step": 313443, "epoch": 1865} {"train_loss": -12.326536178588867, "global_step": 313444, "epoch": 1865} {"train_loss": -12.5313138961792, "global_step": 313445, "epoch": 1865} {"train_loss": -11.552391052246094, "global_step": 313446, "epoch": 1865} {"train_loss": -11.255056381225586, "global_step": 313447, "epoch": 1865} {"train_loss": -11.735067367553711, "global_step": 313448, "epoch": 1865} {"train_loss": -12.274311065673828, "global_step": 313449, "epoch": 1865} {"train_loss": -12.162036895751953, "global_step": 313450, "epoch": 1865} {"train_loss": -12.532625198364258, "global_step": 313451, "epoch": 1865} {"train_loss": -11.650157928466797, "global_step": 313452, "epoch": 1865} {"train_loss": -12.176692962646484, "global_step": 313453, "epoch": 1865} {"train_loss": -11.860597610473633, "global_step": 313454, "epoch": 1865} {"train_loss": -11.551424980163574, "global_step": 313455, "epoch": 1865} {"train_loss": -11.563304901123047, "global_step": 313456, "epoch": 1865} {"train_loss": -12.478260040283203, "global_step": 313457, "epoch": 1865} {"train_loss": -11.837998390197754, "global_step": 313458, "epoch": 1865} {"train_loss": -11.022159576416016, "global_step": 313459, "epoch": 1865} {"train_loss": -11.564458847045898, "global_step": 313460, "epoch": 1865} {"train_loss": -9.973592758178711, "global_step": 313461, "epoch": 1865} {"train_loss": -11.221771240234375, "global_step": 313462, "epoch": 1865} {"train_loss": -9.590848922729492, "global_step": 313463, "epoch": 1865} {"train_loss": -11.412029266357422, "global_step": 313464, "epoch": 1865} {"train_loss": -10.238837242126465, "global_step": 313465, "epoch": 1865} {"train_loss": -9.596169471740723, "global_step": 313466, "epoch": 1865} {"train_loss": -9.583829879760742, "global_step": 313467, "epoch": 1865} {"train_loss": -11.0256986618042, "global_step": 313468, "epoch": 1865} {"train_loss": -9.641365051269531, "global_step": 313469, "epoch": 1865} {"train_loss": -10.7212553024292, "global_step": 313470, "epoch": 1865} {"train_loss": -11.058521270751953, "global_step": 313471, "epoch": 1865} {"train_loss": -9.728021621704102, "global_step": 313472, "epoch": 1865} {"train_loss": -11.772314071655273, "global_step": 313473, "epoch": 1865} {"train_loss": -10.956905364990234, "global_step": 313474, "epoch": 1865} {"train_loss": -11.311562538146973, "global_step": 313475, "epoch": 1865} {"train_loss": -11.849620819091797, "global_step": 313476, "epoch": 1865} {"train_loss": -11.431550979614258, "global_step": 313477, "epoch": 1865} {"train_loss": -10.811214447021484, "global_step": 313478, "epoch": 1865} {"train_loss": -11.127811431884766, "global_step": 313479, "epoch": 1865} {"train_loss": -11.881967544555664, "global_step": 313480, "epoch": 1865} {"train_loss": -11.209517478942871, "global_step": 313481, "epoch": 1865} {"train_loss": -11.104103088378906, "global_step": 313482, "epoch": 1865} {"train_loss": -11.3805513381958, "global_step": 313483, "epoch": 1865} {"train_loss": -10.817727088928223, "global_step": 313484, "epoch": 1865} {"train_loss": -11.014690399169922, "global_step": 313485, "epoch": 1865} {"train_loss": -10.702396392822266, "global_step": 313486, "epoch": 1865} {"train_loss": -11.82423644406455, "global_step": 313487, "epoch": 1865, "val_loss": 281591.46875, "train_action_mse_error": 0.8710291981697083} {"train_loss": -10.991487503051758, "global_step": 313488, "epoch": 1866} {"train_loss": -11.770974159240723, "global_step": 313489, "epoch": 1866} {"train_loss": -10.707233428955078, "global_step": 313490, "epoch": 1866} {"train_loss": -10.553068161010742, "global_step": 313491, "epoch": 1866} {"train_loss": -11.368696212768555, "global_step": 313492, "epoch": 1866} {"train_loss": -10.687101364135742, "global_step": 313493, "epoch": 1866} {"train_loss": -10.918462753295898, "global_step": 313494, "epoch": 1866} {"train_loss": -9.513805389404297, "global_step": 313495, "epoch": 1866} {"train_loss": -10.565492630004883, "global_step": 313496, "epoch": 1866} {"train_loss": -10.411844253540039, "global_step": 313497, "epoch": 1866} {"train_loss": -10.952680587768555, "global_step": 313498, "epoch": 1866} {"train_loss": -9.108973503112793, "global_step": 313499, "epoch": 1866} {"train_loss": -10.94924545288086, "global_step": 313500, "epoch": 1866} {"train_loss": -9.787111282348633, "global_step": 313501, "epoch": 1866} {"train_loss": -10.268909454345703, "global_step": 313502, "epoch": 1866} {"train_loss": -9.937644004821777, "global_step": 313503, "epoch": 1866} {"train_loss": -10.346445083618164, "global_step": 313504, "epoch": 1866} {"train_loss": -10.912130355834961, "global_step": 313505, "epoch": 1866} {"train_loss": -9.30302619934082, "global_step": 313506, "epoch": 1866} {"train_loss": -11.767050743103027, "global_step": 313507, "epoch": 1866} {"train_loss": -9.777539253234863, "global_step": 313508, "epoch": 1866} {"train_loss": -11.816873550415039, "global_step": 313509, "epoch": 1866} {"train_loss": -10.291594505310059, "global_step": 313510, "epoch": 1866} {"train_loss": -11.472663879394531, "global_step": 313511, "epoch": 1866} {"train_loss": -10.7457857131958, "global_step": 313512, "epoch": 1866} {"train_loss": -11.335195541381836, "global_step": 313513, "epoch": 1866} {"train_loss": -11.138450622558594, "global_step": 313514, "epoch": 1866} {"train_loss": -11.216348648071289, "global_step": 313515, "epoch": 1866} {"train_loss": -11.684150695800781, "global_step": 313516, "epoch": 1866} {"train_loss": -11.321547508239746, "global_step": 313517, "epoch": 1866} {"train_loss": -11.658780097961426, "global_step": 313518, "epoch": 1866} {"train_loss": -11.483959197998047, "global_step": 313519, "epoch": 1866} {"train_loss": -11.765556335449219, "global_step": 313520, "epoch": 1866} {"train_loss": -11.475225448608398, "global_step": 313521, "epoch": 1866} {"train_loss": -11.6673583984375, "global_step": 313522, "epoch": 1866} {"train_loss": -11.498727798461914, "global_step": 313523, "epoch": 1866} {"train_loss": -11.564628601074219, "global_step": 313524, "epoch": 1866} {"train_loss": -11.694731712341309, "global_step": 313525, "epoch": 1866} {"train_loss": -11.657146453857422, "global_step": 313526, "epoch": 1866} {"train_loss": -11.898504257202148, "global_step": 313527, "epoch": 1866} {"train_loss": -11.624113082885742, "global_step": 313528, "epoch": 1866} {"train_loss": -11.853050231933594, "global_step": 313529, "epoch": 1866} {"train_loss": -11.618291854858398, "global_step": 313530, "epoch": 1866} {"train_loss": -12.051253318786621, "global_step": 313531, "epoch": 1866} {"train_loss": -11.879460334777832, "global_step": 313532, "epoch": 1866} {"train_loss": -11.990833282470703, "global_step": 313533, "epoch": 1866} {"train_loss": -11.921356201171875, "global_step": 313534, "epoch": 1866} {"train_loss": -11.729429244995117, "global_step": 313535, "epoch": 1866} {"train_loss": -12.02083969116211, "global_step": 313536, "epoch": 1866} {"train_loss": -11.939067840576172, "global_step": 313537, "epoch": 1866} {"train_loss": -12.098969459533691, "global_step": 313538, "epoch": 1866} {"train_loss": -12.102550506591797, "global_step": 313539, "epoch": 1866} {"train_loss": -11.77737808227539, "global_step": 313540, "epoch": 1866} {"train_loss": -11.936460494995117, "global_step": 313541, "epoch": 1866} {"train_loss": -12.075974464416504, "global_step": 313542, "epoch": 1866} {"train_loss": -12.26617431640625, "global_step": 313543, "epoch": 1866} {"train_loss": -11.729095458984375, "global_step": 313544, "epoch": 1866} {"train_loss": -12.14599895477295, "global_step": 313545, "epoch": 1866} {"train_loss": -12.250123977661133, "global_step": 313546, "epoch": 1866} {"train_loss": -12.212226867675781, "global_step": 313547, "epoch": 1866} {"train_loss": -12.105801582336426, "global_step": 313548, "epoch": 1866} {"train_loss": -12.187451362609863, "global_step": 313549, "epoch": 1866} {"train_loss": -12.133224487304688, "global_step": 313550, "epoch": 1866} {"train_loss": -12.201641082763672, "global_step": 313551, "epoch": 1866} {"train_loss": -12.253679275512695, "global_step": 313552, "epoch": 1866} {"train_loss": -12.063995361328125, "global_step": 313553, "epoch": 1866} {"train_loss": -12.421582221984863, "global_step": 313554, "epoch": 1866} {"train_loss": -12.040285110473633, "global_step": 313555, "epoch": 1866} {"train_loss": -12.168785095214844, "global_step": 313556, "epoch": 1866} {"train_loss": -12.0618314743042, "global_step": 313557, "epoch": 1866} {"train_loss": -12.271753311157227, "global_step": 313558, "epoch": 1866} {"train_loss": -12.063518524169922, "global_step": 313559, "epoch": 1866} {"train_loss": -12.028037071228027, "global_step": 313560, "epoch": 1866} {"train_loss": -12.098270416259766, "global_step": 313561, "epoch": 1866} {"train_loss": -12.174530982971191, "global_step": 313562, "epoch": 1866} {"train_loss": -12.22001838684082, "global_step": 313563, "epoch": 1866} {"train_loss": -12.008584976196289, "global_step": 313564, "epoch": 1866} {"train_loss": -12.341943740844727, "global_step": 313565, "epoch": 1866} {"train_loss": -11.985218048095703, "global_step": 313566, "epoch": 1866} {"train_loss": -12.314753532409668, "global_step": 313567, "epoch": 1866} {"train_loss": -11.93846321105957, "global_step": 313568, "epoch": 1866} {"train_loss": -12.307014465332031, "global_step": 313569, "epoch": 1866} {"train_loss": -12.098188400268555, "global_step": 313570, "epoch": 1866} {"train_loss": -12.244344711303711, "global_step": 313571, "epoch": 1866} {"train_loss": -12.313497543334961, "global_step": 313572, "epoch": 1866} {"train_loss": -12.133066177368164, "global_step": 313573, "epoch": 1866} {"train_loss": -12.0836181640625, "global_step": 313574, "epoch": 1866} {"train_loss": -12.382408142089844, "global_step": 313575, "epoch": 1866} {"train_loss": -11.745308876037598, "global_step": 313576, "epoch": 1866} {"train_loss": -12.092511177062988, "global_step": 313577, "epoch": 1866} {"train_loss": -12.369760513305664, "global_step": 313578, "epoch": 1866} {"train_loss": -12.46021556854248, "global_step": 313579, "epoch": 1866} {"train_loss": -12.083311080932617, "global_step": 313580, "epoch": 1866} {"train_loss": -12.17165756225586, "global_step": 313581, "epoch": 1866} {"train_loss": -12.247037887573242, "global_step": 313582, "epoch": 1866} {"train_loss": -12.098769187927246, "global_step": 313583, "epoch": 1866} {"train_loss": -12.453968048095703, "global_step": 313584, "epoch": 1866} {"train_loss": -12.467887878417969, "global_step": 313585, "epoch": 1866} {"train_loss": -12.326993942260742, "global_step": 313586, "epoch": 1866} {"train_loss": -12.317326545715332, "global_step": 313587, "epoch": 1866} {"train_loss": -12.489240646362305, "global_step": 313588, "epoch": 1866} {"train_loss": -12.393441200256348, "global_step": 313589, "epoch": 1866} {"train_loss": -12.520017623901367, "global_step": 313590, "epoch": 1866} {"train_loss": -12.221700668334961, "global_step": 313591, "epoch": 1866} {"train_loss": -12.150078773498535, "global_step": 313592, "epoch": 1866} {"train_loss": -12.047357559204102, "global_step": 313593, "epoch": 1866} {"train_loss": -12.358983993530273, "global_step": 313594, "epoch": 1866} {"train_loss": -12.15864372253418, "global_step": 313595, "epoch": 1866} {"train_loss": -12.094293594360352, "global_step": 313596, "epoch": 1866} {"train_loss": -12.202716827392578, "global_step": 313597, "epoch": 1866} {"train_loss": -12.024701118469238, "global_step": 313598, "epoch": 1866} {"train_loss": -11.907504081726074, "global_step": 313599, "epoch": 1866} {"train_loss": -11.80951976776123, "global_step": 313600, "epoch": 1866} {"train_loss": -11.396581649780273, "global_step": 313601, "epoch": 1866} {"train_loss": -10.275422096252441, "global_step": 313602, "epoch": 1866} {"train_loss": -12.205942153930664, "global_step": 313603, "epoch": 1866} {"train_loss": -10.296377182006836, "global_step": 313604, "epoch": 1866} {"train_loss": -12.37297534942627, "global_step": 313605, "epoch": 1866} {"train_loss": -11.732154846191406, "global_step": 313606, "epoch": 1866} {"train_loss": -12.182684898376465, "global_step": 313607, "epoch": 1866} {"train_loss": -12.176051139831543, "global_step": 313608, "epoch": 1866} {"train_loss": -12.250608444213867, "global_step": 313609, "epoch": 1866} {"train_loss": -11.912395477294922, "global_step": 313610, "epoch": 1866} {"train_loss": -12.088547706604004, "global_step": 313611, "epoch": 1866} {"train_loss": -11.960725784301758, "global_step": 313612, "epoch": 1866} {"train_loss": -11.757339477539062, "global_step": 313613, "epoch": 1866} {"train_loss": -11.98046588897705, "global_step": 313614, "epoch": 1866} {"train_loss": -11.562858581542969, "global_step": 313615, "epoch": 1866} {"train_loss": -11.556350708007812, "global_step": 313616, "epoch": 1866} {"train_loss": -11.7517728805542, "global_step": 313617, "epoch": 1866} {"train_loss": -11.067729949951172, "global_step": 313618, "epoch": 1866} {"train_loss": -11.437660217285156, "global_step": 313619, "epoch": 1866} {"train_loss": -12.029999732971191, "global_step": 313620, "epoch": 1866} {"train_loss": -11.09404182434082, "global_step": 313621, "epoch": 1866} {"train_loss": -11.926976203918457, "global_step": 313622, "epoch": 1866} {"train_loss": -11.96772575378418, "global_step": 313623, "epoch": 1866} {"train_loss": -12.19454574584961, "global_step": 313624, "epoch": 1866} {"train_loss": -12.08686637878418, "global_step": 313625, "epoch": 1866} {"train_loss": -11.801694869995117, "global_step": 313626, "epoch": 1866} {"train_loss": -11.93966293334961, "global_step": 313627, "epoch": 1866} {"train_loss": -12.382728576660156, "global_step": 313628, "epoch": 1866} {"train_loss": -11.980664253234863, "global_step": 313629, "epoch": 1866} {"train_loss": -12.326805114746094, "global_step": 313630, "epoch": 1866} {"train_loss": -12.070094108581543, "global_step": 313631, "epoch": 1866} {"train_loss": -12.265551567077637, "global_step": 313632, "epoch": 1866} {"train_loss": -11.843216896057129, "global_step": 313633, "epoch": 1866} {"train_loss": -12.018014907836914, "global_step": 313634, "epoch": 1866} {"train_loss": -12.033356666564941, "global_step": 313635, "epoch": 1866} {"train_loss": -12.415884017944336, "global_step": 313636, "epoch": 1866} {"train_loss": -12.030908584594727, "global_step": 313637, "epoch": 1866} {"train_loss": -12.242596626281738, "global_step": 313638, "epoch": 1866} {"train_loss": -12.003167152404785, "global_step": 313639, "epoch": 1866} {"train_loss": -12.268404006958008, "global_step": 313640, "epoch": 1866} {"train_loss": -12.146598815917969, "global_step": 313641, "epoch": 1866} {"train_loss": -12.253732681274414, "global_step": 313642, "epoch": 1866} {"train_loss": -12.465202331542969, "global_step": 313643, "epoch": 1866} {"train_loss": -12.508247375488281, "global_step": 313644, "epoch": 1866} {"train_loss": -12.224153518676758, "global_step": 313645, "epoch": 1866} {"train_loss": -12.555273056030273, "global_step": 313646, "epoch": 1866} {"train_loss": -12.06336784362793, "global_step": 313647, "epoch": 1866} {"train_loss": -12.42636489868164, "global_step": 313648, "epoch": 1866} {"train_loss": -12.54254150390625, "global_step": 313649, "epoch": 1866} {"train_loss": -12.454748153686523, "global_step": 313650, "epoch": 1866} {"train_loss": -12.398893356323242, "global_step": 313651, "epoch": 1866} {"train_loss": -12.211841583251953, "global_step": 313652, "epoch": 1866} {"train_loss": -12.437275886535645, "global_step": 313653, "epoch": 1866} {"train_loss": -12.40810775756836, "global_step": 313654, "epoch": 1866} {"train_loss": -11.806350929396492, "global_step": 313655, "epoch": 1866, "val_loss": 283060.59375} {"train_loss": -12.396516799926758, "global_step": 313656, "epoch": 1867} {"train_loss": -12.400123596191406, "global_step": 313657, "epoch": 1867} {"train_loss": -12.570537567138672, "global_step": 313658, "epoch": 1867} {"train_loss": -12.4052152633667, "global_step": 313659, "epoch": 1867} {"train_loss": -12.500999450683594, "global_step": 313660, "epoch": 1867} {"train_loss": -12.293128967285156, "global_step": 313661, "epoch": 1867} {"train_loss": -12.416570663452148, "global_step": 313662, "epoch": 1867} {"train_loss": -12.605090141296387, "global_step": 313663, "epoch": 1867} {"train_loss": -12.444194793701172, "global_step": 313664, "epoch": 1867} {"train_loss": -12.537145614624023, "global_step": 313665, "epoch": 1867} {"train_loss": -12.202949523925781, "global_step": 313666, "epoch": 1867} {"train_loss": -12.043510437011719, "global_step": 313667, "epoch": 1867} {"train_loss": -11.850677490234375, "global_step": 313668, "epoch": 1867} {"train_loss": -11.851165771484375, "global_step": 313669, "epoch": 1867} {"train_loss": -11.637128829956055, "global_step": 313670, "epoch": 1867} {"train_loss": -11.100550651550293, "global_step": 313671, "epoch": 1867} {"train_loss": -11.926702499389648, "global_step": 313672, "epoch": 1867} {"train_loss": -12.166783332824707, "global_step": 313673, "epoch": 1867} {"train_loss": -11.768299102783203, "global_step": 313674, "epoch": 1867} {"train_loss": -10.872186660766602, "global_step": 313675, "epoch": 1867} {"train_loss": -11.817594528198242, "global_step": 313676, "epoch": 1867} {"train_loss": -11.993066787719727, "global_step": 313677, "epoch": 1867} {"train_loss": -11.09499740600586, "global_step": 313678, "epoch": 1867} {"train_loss": -11.417146682739258, "global_step": 313679, "epoch": 1867} {"train_loss": -11.603109359741211, "global_step": 313680, "epoch": 1867} {"train_loss": -11.527667999267578, "global_step": 313681, "epoch": 1867} {"train_loss": -11.693122863769531, "global_step": 313682, "epoch": 1867} {"train_loss": -12.145894050598145, "global_step": 313683, "epoch": 1867} {"train_loss": -11.775381088256836, "global_step": 313684, "epoch": 1867} {"train_loss": -11.990656852722168, "global_step": 313685, "epoch": 1867} {"train_loss": -12.021636962890625, "global_step": 313686, "epoch": 1867} {"train_loss": -11.965917587280273, "global_step": 313687, "epoch": 1867} {"train_loss": -12.218908309936523, "global_step": 313688, "epoch": 1867} {"train_loss": -12.125958442687988, "global_step": 313689, "epoch": 1867} {"train_loss": -12.331338882446289, "global_step": 313690, "epoch": 1867} {"train_loss": -12.332622528076172, "global_step": 313691, "epoch": 1867} {"train_loss": -12.318920135498047, "global_step": 313692, "epoch": 1867} {"train_loss": -11.586759567260742, "global_step": 313693, "epoch": 1867} {"train_loss": -11.878539085388184, "global_step": 313694, "epoch": 1867} {"train_loss": -11.94189739227295, "global_step": 313695, "epoch": 1867} {"train_loss": -11.897951126098633, "global_step": 313696, "epoch": 1867} {"train_loss": -10.981858253479004, "global_step": 313697, "epoch": 1867} {"train_loss": -12.168865203857422, "global_step": 313698, "epoch": 1867} {"train_loss": -12.096076011657715, "global_step": 313699, "epoch": 1867} {"train_loss": -11.189815521240234, "global_step": 313700, "epoch": 1867} {"train_loss": -11.882868766784668, "global_step": 313701, "epoch": 1867} {"train_loss": -11.368945121765137, "global_step": 313702, "epoch": 1867} {"train_loss": -11.044187545776367, "global_step": 313703, "epoch": 1867} {"train_loss": -11.395983695983887, "global_step": 313704, "epoch": 1867} {"train_loss": -10.652091026306152, "global_step": 313705, "epoch": 1867} {"train_loss": -10.283018112182617, "global_step": 313706, "epoch": 1867} {"train_loss": -10.76752758026123, "global_step": 313707, "epoch": 1867} {"train_loss": -9.997920036315918, "global_step": 313708, "epoch": 1867} {"train_loss": -10.311893463134766, "global_step": 313709, "epoch": 1867} {"train_loss": -10.158824920654297, "global_step": 313710, "epoch": 1867} {"train_loss": -10.317179679870605, "global_step": 313711, "epoch": 1867} {"train_loss": -9.901359558105469, "global_step": 313712, "epoch": 1867} {"train_loss": -11.592203140258789, "global_step": 313713, "epoch": 1867} {"train_loss": -9.98624038696289, "global_step": 313714, "epoch": 1867} {"train_loss": -11.050451278686523, "global_step": 313715, "epoch": 1867} {"train_loss": -11.207229614257812, "global_step": 313716, "epoch": 1867} {"train_loss": -10.428022384643555, "global_step": 313717, "epoch": 1867} {"train_loss": -11.735451698303223, "global_step": 313718, "epoch": 1867} {"train_loss": -10.21579360961914, "global_step": 313719, "epoch": 1867} {"train_loss": -11.690943717956543, "global_step": 313720, "epoch": 1867} {"train_loss": -11.12687873840332, "global_step": 313721, "epoch": 1867} {"train_loss": -11.54811954498291, "global_step": 313722, "epoch": 1867} {"train_loss": -11.413634300231934, "global_step": 313723, "epoch": 1867} {"train_loss": -11.25885009765625, "global_step": 313724, "epoch": 1867} {"train_loss": -11.489511489868164, "global_step": 313725, "epoch": 1867} {"train_loss": -11.418329238891602, "global_step": 313726, "epoch": 1867} {"train_loss": -11.843411445617676, "global_step": 313727, "epoch": 1867} {"train_loss": -11.827561378479004, "global_step": 313728, "epoch": 1867} {"train_loss": -11.916231155395508, "global_step": 313729, "epoch": 1867} {"train_loss": -12.047075271606445, "global_step": 313730, "epoch": 1867} {"train_loss": -11.674631118774414, "global_step": 313731, "epoch": 1867} {"train_loss": -12.100977897644043, "global_step": 313732, "epoch": 1867} {"train_loss": -12.020695686340332, "global_step": 313733, "epoch": 1867} {"train_loss": -12.026609420776367, "global_step": 313734, "epoch": 1867} {"train_loss": -11.681706428527832, "global_step": 313735, "epoch": 1867} {"train_loss": -12.171773910522461, "global_step": 313736, "epoch": 1867} {"train_loss": -12.164640426635742, "global_step": 313737, "epoch": 1867} {"train_loss": -12.164583206176758, "global_step": 313738, "epoch": 1867} {"train_loss": -12.04658031463623, "global_step": 313739, "epoch": 1867} {"train_loss": -12.196783065795898, "global_step": 313740, "epoch": 1867} {"train_loss": -12.241427421569824, "global_step": 313741, "epoch": 1867} {"train_loss": -12.153205871582031, "global_step": 313742, "epoch": 1867} {"train_loss": -12.129992485046387, "global_step": 313743, "epoch": 1867} {"train_loss": -12.132055282592773, "global_step": 313744, "epoch": 1867} {"train_loss": -12.122446060180664, "global_step": 313745, "epoch": 1867} {"train_loss": -11.89454460144043, "global_step": 313746, "epoch": 1867} {"train_loss": -12.116292953491211, "global_step": 313747, "epoch": 1867} {"train_loss": -12.026458740234375, "global_step": 313748, "epoch": 1867} {"train_loss": -12.135234832763672, "global_step": 313749, "epoch": 1867} {"train_loss": -12.216745376586914, "global_step": 313750, "epoch": 1867} {"train_loss": -11.805496215820312, "global_step": 313751, "epoch": 1867} {"train_loss": -12.372186660766602, "global_step": 313752, "epoch": 1867} {"train_loss": -11.592975616455078, "global_step": 313753, "epoch": 1867} {"train_loss": -11.737349510192871, "global_step": 313754, "epoch": 1867} {"train_loss": -11.889244079589844, "global_step": 313755, "epoch": 1867} {"train_loss": -11.316823959350586, "global_step": 313756, "epoch": 1867} {"train_loss": -11.38714599609375, "global_step": 313757, "epoch": 1867} {"train_loss": -12.171136856079102, "global_step": 313758, "epoch": 1867} {"train_loss": -11.59939193725586, "global_step": 313759, "epoch": 1867} {"train_loss": -12.049449920654297, "global_step": 313760, "epoch": 1867} {"train_loss": -11.266305923461914, "global_step": 313761, "epoch": 1867} {"train_loss": -11.396320343017578, "global_step": 313762, "epoch": 1867} {"train_loss": -12.458578109741211, "global_step": 313763, "epoch": 1867} {"train_loss": -11.26184368133545, "global_step": 313764, "epoch": 1867} {"train_loss": -12.186554908752441, "global_step": 313765, "epoch": 1867} {"train_loss": -11.704307556152344, "global_step": 313766, "epoch": 1867} {"train_loss": -11.866552352905273, "global_step": 313767, "epoch": 1867} {"train_loss": -11.973514556884766, "global_step": 313768, "epoch": 1867} {"train_loss": -11.747078895568848, "global_step": 313769, "epoch": 1867} {"train_loss": -11.918940544128418, "global_step": 313770, "epoch": 1867} {"train_loss": -11.88271713256836, "global_step": 313771, "epoch": 1867} {"train_loss": -11.96394157409668, "global_step": 313772, "epoch": 1867} {"train_loss": -12.225873947143555, "global_step": 313773, "epoch": 1867} {"train_loss": -12.022321701049805, "global_step": 313774, "epoch": 1867} {"train_loss": -12.114717483520508, "global_step": 313775, "epoch": 1867} {"train_loss": -11.997464179992676, "global_step": 313776, "epoch": 1867} {"train_loss": -12.056622505187988, "global_step": 313777, "epoch": 1867} {"train_loss": -12.267837524414062, "global_step": 313778, "epoch": 1867} {"train_loss": -11.951353073120117, "global_step": 313779, "epoch": 1867} {"train_loss": -12.168645858764648, "global_step": 313780, "epoch": 1867} {"train_loss": -12.030302047729492, "global_step": 313781, "epoch": 1867} {"train_loss": -11.672867774963379, "global_step": 313782, "epoch": 1867} {"train_loss": -12.287782669067383, "global_step": 313783, "epoch": 1867} {"train_loss": -11.7815580368042, "global_step": 313784, "epoch": 1867} {"train_loss": -12.069608688354492, "global_step": 313785, "epoch": 1867} {"train_loss": -12.337708473205566, "global_step": 313786, "epoch": 1867} {"train_loss": -12.153406143188477, "global_step": 313787, "epoch": 1867} {"train_loss": -11.918571472167969, "global_step": 313788, "epoch": 1867} {"train_loss": -11.907447814941406, "global_step": 313789, "epoch": 1867} {"train_loss": -11.92552375793457, "global_step": 313790, "epoch": 1867} {"train_loss": -12.393989562988281, "global_step": 313791, "epoch": 1867} {"train_loss": -11.855043411254883, "global_step": 313792, "epoch": 1867} {"train_loss": -12.170400619506836, "global_step": 313793, "epoch": 1867} {"train_loss": -12.447559356689453, "global_step": 313794, "epoch": 1867} {"train_loss": -12.423232078552246, "global_step": 313795, "epoch": 1867} {"train_loss": -12.296655654907227, "global_step": 313796, "epoch": 1867} {"train_loss": -12.359407424926758, "global_step": 313797, "epoch": 1867} {"train_loss": -12.436971664428711, "global_step": 313798, "epoch": 1867} {"train_loss": -12.605463027954102, "global_step": 313799, "epoch": 1867} {"train_loss": -12.494277000427246, "global_step": 313800, "epoch": 1867} {"train_loss": -12.497916221618652, "global_step": 313801, "epoch": 1867} {"train_loss": -12.381847381591797, "global_step": 313802, "epoch": 1867} {"train_loss": -12.376115798950195, "global_step": 313803, "epoch": 1867} {"train_loss": -12.182632446289062, "global_step": 313804, "epoch": 1867} {"train_loss": -12.368584632873535, "global_step": 313805, "epoch": 1867} {"train_loss": -12.489131927490234, "global_step": 313806, "epoch": 1867} {"train_loss": -12.341840744018555, "global_step": 313807, "epoch": 1867} {"train_loss": -12.355629920959473, "global_step": 313808, "epoch": 1867} {"train_loss": -12.489500045776367, "global_step": 313809, "epoch": 1867} {"train_loss": -12.531146049499512, "global_step": 313810, "epoch": 1867} {"train_loss": -12.444038391113281, "global_step": 313811, "epoch": 1867} {"train_loss": -12.541748046875, "global_step": 313812, "epoch": 1867} {"train_loss": -12.240951538085938, "global_step": 313813, "epoch": 1867} {"train_loss": -11.920269966125488, "global_step": 313814, "epoch": 1867} {"train_loss": -12.139137268066406, "global_step": 313815, "epoch": 1867} {"train_loss": -12.520368576049805, "global_step": 313816, "epoch": 1867} {"train_loss": -12.229294776916504, "global_step": 313817, "epoch": 1867} {"train_loss": -12.375595092773438, "global_step": 313818, "epoch": 1867} {"train_loss": -12.407742500305176, "global_step": 313819, "epoch": 1867} {"train_loss": -12.401193618774414, "global_step": 313820, "epoch": 1867} {"train_loss": -12.427852630615234, "global_step": 313821, "epoch": 1867} {"train_loss": -12.436564445495605, "global_step": 313822, "epoch": 1867} {"train_loss": -11.879259518214635, "global_step": 313823, "epoch": 1867, "val_loss": 285006.375} {"train_loss": -12.437408447265625, "global_step": 313824, "epoch": 1868} {"train_loss": -12.28986930847168, "global_step": 313825, "epoch": 1868} {"train_loss": -12.324687957763672, "global_step": 313826, "epoch": 1868} {"train_loss": -12.533443450927734, "global_step": 313827, "epoch": 1868} {"train_loss": -12.3067626953125, "global_step": 313828, "epoch": 1868} {"train_loss": -12.153312683105469, "global_step": 313829, "epoch": 1868} {"train_loss": -12.160444259643555, "global_step": 313830, "epoch": 1868} {"train_loss": -12.128745079040527, "global_step": 313831, "epoch": 1868} {"train_loss": -12.117873191833496, "global_step": 313832, "epoch": 1868} {"train_loss": -12.018537521362305, "global_step": 313833, "epoch": 1868} {"train_loss": -12.203241348266602, "global_step": 313834, "epoch": 1868} {"train_loss": -12.136069297790527, "global_step": 313835, "epoch": 1868} {"train_loss": -12.272408485412598, "global_step": 313836, "epoch": 1868} {"train_loss": -11.664608001708984, "global_step": 313837, "epoch": 1868} {"train_loss": -11.37773323059082, "global_step": 313838, "epoch": 1868} {"train_loss": -11.068702697753906, "global_step": 313839, "epoch": 1868} {"train_loss": -11.974405288696289, "global_step": 313840, "epoch": 1868} {"train_loss": -9.617023468017578, "global_step": 313841, "epoch": 1868} {"train_loss": -10.743022918701172, "global_step": 313842, "epoch": 1868} {"train_loss": -9.670022010803223, "global_step": 313843, "epoch": 1868} {"train_loss": -11.273283004760742, "global_step": 313844, "epoch": 1868} {"train_loss": -10.266566276550293, "global_step": 313845, "epoch": 1868} {"train_loss": -9.468781471252441, "global_step": 313846, "epoch": 1868} {"train_loss": -9.882676124572754, "global_step": 313847, "epoch": 1868} {"train_loss": -11.49765396118164, "global_step": 313848, "epoch": 1868} {"train_loss": -9.667850494384766, "global_step": 313849, "epoch": 1868} {"train_loss": -10.126676559448242, "global_step": 313850, "epoch": 1868} {"train_loss": -10.35973834991455, "global_step": 313851, "epoch": 1868} {"train_loss": -10.476836204528809, "global_step": 313852, "epoch": 1868} {"train_loss": -9.607477188110352, "global_step": 313853, "epoch": 1868} {"train_loss": -8.449914932250977, "global_step": 313854, "epoch": 1868} {"train_loss": -10.269587516784668, "global_step": 313855, "epoch": 1868} {"train_loss": -10.608936309814453, "global_step": 313856, "epoch": 1868} {"train_loss": -9.649442672729492, "global_step": 313857, "epoch": 1868} {"train_loss": -10.955395698547363, "global_step": 313858, "epoch": 1868} {"train_loss": -10.026712417602539, "global_step": 313859, "epoch": 1868} {"train_loss": -10.508139610290527, "global_step": 313860, "epoch": 1868} {"train_loss": -10.928186416625977, "global_step": 313861, "epoch": 1868} {"train_loss": -8.686371803283691, "global_step": 313862, "epoch": 1868} {"train_loss": -10.784160614013672, "global_step": 313863, "epoch": 1868} {"train_loss": -10.699728965759277, "global_step": 313864, "epoch": 1868} {"train_loss": -9.64531421661377, "global_step": 313865, "epoch": 1868} {"train_loss": -10.069047927856445, "global_step": 313866, "epoch": 1868} {"train_loss": -11.083972930908203, "global_step": 313867, "epoch": 1868} {"train_loss": -9.944165229797363, "global_step": 313868, "epoch": 1868} {"train_loss": -10.479279518127441, "global_step": 313869, "epoch": 1868} {"train_loss": -10.794431686401367, "global_step": 313870, "epoch": 1868} {"train_loss": -9.845344543457031, "global_step": 313871, "epoch": 1868} {"train_loss": -10.778651237487793, "global_step": 313872, "epoch": 1868} {"train_loss": -9.668272018432617, "global_step": 313873, "epoch": 1868} {"train_loss": -10.945693016052246, "global_step": 313874, "epoch": 1868} {"train_loss": -9.93304443359375, "global_step": 313875, "epoch": 1868} {"train_loss": -10.75905990600586, "global_step": 313876, "epoch": 1868} {"train_loss": -10.269875526428223, "global_step": 313877, "epoch": 1868} {"train_loss": -10.391752243041992, "global_step": 313878, "epoch": 1868} {"train_loss": -10.761199951171875, "global_step": 313879, "epoch": 1868} {"train_loss": -11.459375381469727, "global_step": 313880, "epoch": 1868} {"train_loss": -10.865560531616211, "global_step": 313881, "epoch": 1868} {"train_loss": -11.438396453857422, "global_step": 313882, "epoch": 1868} {"train_loss": -11.663244247436523, "global_step": 313883, "epoch": 1868} {"train_loss": -11.439680099487305, "global_step": 313884, "epoch": 1868} {"train_loss": -11.124208450317383, "global_step": 313885, "epoch": 1868} {"train_loss": -11.74892807006836, "global_step": 313886, "epoch": 1868} {"train_loss": -11.418169021606445, "global_step": 313887, "epoch": 1868} {"train_loss": -11.728776931762695, "global_step": 313888, "epoch": 1868} {"train_loss": -11.947443008422852, "global_step": 313889, "epoch": 1868} {"train_loss": -12.01687240600586, "global_step": 313890, "epoch": 1868} {"train_loss": -11.67085075378418, "global_step": 313891, "epoch": 1868} {"train_loss": -11.637965202331543, "global_step": 313892, "epoch": 1868} {"train_loss": -12.0692138671875, "global_step": 313893, "epoch": 1868} {"train_loss": -11.992483139038086, "global_step": 313894, "epoch": 1868} {"train_loss": -12.206428527832031, "global_step": 313895, "epoch": 1868} {"train_loss": -11.895792007446289, "global_step": 313896, "epoch": 1868} {"train_loss": -11.619139671325684, "global_step": 313897, "epoch": 1868} {"train_loss": -11.859760284423828, "global_step": 313898, "epoch": 1868} {"train_loss": -12.017572402954102, "global_step": 313899, "epoch": 1868} {"train_loss": -11.795741081237793, "global_step": 313900, "epoch": 1868} {"train_loss": -12.094386100769043, "global_step": 313901, "epoch": 1868} {"train_loss": -11.957819938659668, "global_step": 313902, "epoch": 1868} {"train_loss": -12.017382621765137, "global_step": 313903, "epoch": 1868} {"train_loss": -12.006304740905762, "global_step": 313904, "epoch": 1868} {"train_loss": -12.007461547851562, "global_step": 313905, "epoch": 1868} {"train_loss": -12.124833106994629, "global_step": 313906, "epoch": 1868} {"train_loss": -12.183077812194824, "global_step": 313907, "epoch": 1868} {"train_loss": -11.994821548461914, "global_step": 313908, "epoch": 1868} {"train_loss": -12.239974975585938, "global_step": 313909, "epoch": 1868} {"train_loss": -12.032829284667969, "global_step": 313910, "epoch": 1868} {"train_loss": -12.249988555908203, "global_step": 313911, "epoch": 1868} {"train_loss": -12.103321075439453, "global_step": 313912, "epoch": 1868} {"train_loss": -12.21921157836914, "global_step": 313913, "epoch": 1868} {"train_loss": -12.265987396240234, "global_step": 313914, "epoch": 1868} {"train_loss": -12.100486755371094, "global_step": 313915, "epoch": 1868} {"train_loss": -12.14948844909668, "global_step": 313916, "epoch": 1868} {"train_loss": -12.053262710571289, "global_step": 313917, "epoch": 1868} {"train_loss": -12.244196891784668, "global_step": 313918, "epoch": 1868} {"train_loss": -12.203367233276367, "global_step": 313919, "epoch": 1868} {"train_loss": -12.248139381408691, "global_step": 313920, "epoch": 1868} {"train_loss": -12.279293060302734, "global_step": 313921, "epoch": 1868} {"train_loss": -12.31834602355957, "global_step": 313922, "epoch": 1868} {"train_loss": -12.215499877929688, "global_step": 313923, "epoch": 1868} {"train_loss": -12.344602584838867, "global_step": 313924, "epoch": 1868} {"train_loss": -12.406805038452148, "global_step": 313925, "epoch": 1868} {"train_loss": -12.332769393920898, "global_step": 313926, "epoch": 1868} {"train_loss": -12.328245162963867, "global_step": 313927, "epoch": 1868} {"train_loss": -12.418231964111328, "global_step": 313928, "epoch": 1868} {"train_loss": -12.560453414916992, "global_step": 313929, "epoch": 1868} {"train_loss": -12.239646911621094, "global_step": 313930, "epoch": 1868} {"train_loss": -12.499537467956543, "global_step": 313931, "epoch": 1868} {"train_loss": -12.30527400970459, "global_step": 313932, "epoch": 1868} {"train_loss": -12.362274169921875, "global_step": 313933, "epoch": 1868} {"train_loss": -12.307357788085938, "global_step": 313934, "epoch": 1868} {"train_loss": -12.2275390625, "global_step": 313935, "epoch": 1868} {"train_loss": -12.504966735839844, "global_step": 313936, "epoch": 1868} {"train_loss": -12.435745239257812, "global_step": 313937, "epoch": 1868} {"train_loss": -12.461994171142578, "global_step": 313938, "epoch": 1868} {"train_loss": -12.51984977722168, "global_step": 313939, "epoch": 1868} {"train_loss": -12.514331817626953, "global_step": 313940, "epoch": 1868} {"train_loss": -12.448253631591797, "global_step": 313941, "epoch": 1868} {"train_loss": -12.594487190246582, "global_step": 313942, "epoch": 1868} {"train_loss": -12.51841926574707, "global_step": 313943, "epoch": 1868} {"train_loss": -12.450511932373047, "global_step": 313944, "epoch": 1868} {"train_loss": -12.4795503616333, "global_step": 313945, "epoch": 1868} {"train_loss": -12.519954681396484, "global_step": 313946, "epoch": 1868} {"train_loss": -12.42166519165039, "global_step": 313947, "epoch": 1868} {"train_loss": -12.336799621582031, "global_step": 313948, "epoch": 1868} {"train_loss": -12.417750358581543, "global_step": 313949, "epoch": 1868} {"train_loss": -11.998799324035645, "global_step": 313950, "epoch": 1868} {"train_loss": -11.885530471801758, "global_step": 313951, "epoch": 1868} {"train_loss": -12.137069702148438, "global_step": 313952, "epoch": 1868} {"train_loss": -12.614090919494629, "global_step": 313953, "epoch": 1868} {"train_loss": -12.021712303161621, "global_step": 313954, "epoch": 1868} {"train_loss": -11.060840606689453, "global_step": 313955, "epoch": 1868} {"train_loss": -11.610451698303223, "global_step": 313956, "epoch": 1868} {"train_loss": -12.07924747467041, "global_step": 313957, "epoch": 1868} {"train_loss": -12.38930892944336, "global_step": 313958, "epoch": 1868} {"train_loss": -11.54256820678711, "global_step": 313959, "epoch": 1868} {"train_loss": -11.482664108276367, "global_step": 313960, "epoch": 1868} {"train_loss": -11.496660232543945, "global_step": 313961, "epoch": 1868} {"train_loss": -12.463479995727539, "global_step": 313962, "epoch": 1868} {"train_loss": -11.929302215576172, "global_step": 313963, "epoch": 1868} {"train_loss": -12.210307121276855, "global_step": 313964, "epoch": 1868} {"train_loss": -11.84988784790039, "global_step": 313965, "epoch": 1868} {"train_loss": -12.182880401611328, "global_step": 313966, "epoch": 1868} {"train_loss": -12.043628692626953, "global_step": 313967, "epoch": 1868} {"train_loss": -11.254465103149414, "global_step": 313968, "epoch": 1868} {"train_loss": -12.034103393554688, "global_step": 313969, "epoch": 1868} {"train_loss": -12.254415512084961, "global_step": 313970, "epoch": 1868} {"train_loss": -11.915742874145508, "global_step": 313971, "epoch": 1868} {"train_loss": -11.650501251220703, "global_step": 313972, "epoch": 1868} {"train_loss": -11.570404052734375, "global_step": 313973, "epoch": 1868} {"train_loss": -11.60600757598877, "global_step": 313974, "epoch": 1868} {"train_loss": -11.691652297973633, "global_step": 313975, "epoch": 1868} {"train_loss": -11.530915260314941, "global_step": 313976, "epoch": 1868} {"train_loss": -11.916681289672852, "global_step": 313977, "epoch": 1868} {"train_loss": -11.138452529907227, "global_step": 313978, "epoch": 1868} {"train_loss": -11.577038764953613, "global_step": 313979, "epoch": 1868} {"train_loss": -11.95504093170166, "global_step": 313980, "epoch": 1868} {"train_loss": -11.727420806884766, "global_step": 313981, "epoch": 1868} {"train_loss": -10.902233123779297, "global_step": 313982, "epoch": 1868} {"train_loss": -12.064230918884277, "global_step": 313983, "epoch": 1868} {"train_loss": -11.648162841796875, "global_step": 313984, "epoch": 1868} {"train_loss": -11.282098770141602, "global_step": 313985, "epoch": 1868} {"train_loss": -12.097668647766113, "global_step": 313986, "epoch": 1868} {"train_loss": -12.076107025146484, "global_step": 313987, "epoch": 1868} {"train_loss": -12.129136085510254, "global_step": 313988, "epoch": 1868} {"train_loss": -11.913726806640625, "global_step": 313989, "epoch": 1868} {"train_loss": -11.976086616516113, "global_step": 313990, "epoch": 1868} {"train_loss": -11.603656558763413, "global_step": 313991, "epoch": 1868, "val_loss": 283137.46875} {"train_loss": -11.797245025634766, "global_step": 313992, "epoch": 1869} {"train_loss": -12.427986145019531, "global_step": 313993, "epoch": 1869} {"train_loss": -12.259166717529297, "global_step": 313994, "epoch": 1869} {"train_loss": -12.069281578063965, "global_step": 313995, "epoch": 1869} {"train_loss": -12.005230903625488, "global_step": 313996, "epoch": 1869} {"train_loss": -11.999591827392578, "global_step": 313997, "epoch": 1869} {"train_loss": -11.749738693237305, "global_step": 313998, "epoch": 1869} {"train_loss": -11.949939727783203, "global_step": 313999, "epoch": 1869} {"train_loss": -12.229164123535156, "global_step": 314000, "epoch": 1869} {"train_loss": -11.221476554870605, "global_step": 314001, "epoch": 1869} {"train_loss": -10.86551284790039, "global_step": 314002, "epoch": 1869} {"train_loss": -12.449886322021484, "global_step": 314003, "epoch": 1869} {"train_loss": -10.821137428283691, "global_step": 314004, "epoch": 1869} {"train_loss": -11.195969581604004, "global_step": 314005, "epoch": 1869} {"train_loss": -12.328672409057617, "global_step": 314006, "epoch": 1869} {"train_loss": -10.397345542907715, "global_step": 314007, "epoch": 1869} {"train_loss": -11.525362968444824, "global_step": 314008, "epoch": 1869} {"train_loss": -11.79738712310791, "global_step": 314009, "epoch": 1869} {"train_loss": -10.558855056762695, "global_step": 314010, "epoch": 1869} {"train_loss": -11.396014213562012, "global_step": 314011, "epoch": 1869} {"train_loss": -11.638052940368652, "global_step": 314012, "epoch": 1869} {"train_loss": -11.102275848388672, "global_step": 314013, "epoch": 1869} {"train_loss": -11.351583480834961, "global_step": 314014, "epoch": 1869} {"train_loss": -11.419204711914062, "global_step": 314015, "epoch": 1869} {"train_loss": -10.836126327514648, "global_step": 314016, "epoch": 1869} {"train_loss": -11.835424423217773, "global_step": 314017, "epoch": 1869} {"train_loss": -11.420223236083984, "global_step": 314018, "epoch": 1869} {"train_loss": -11.38308048248291, "global_step": 314019, "epoch": 1869} {"train_loss": -11.897636413574219, "global_step": 314020, "epoch": 1869} {"train_loss": -11.849919319152832, "global_step": 314021, "epoch": 1869} {"train_loss": -11.868935585021973, "global_step": 314022, "epoch": 1869} {"train_loss": -11.73779582977295, "global_step": 314023, "epoch": 1869} {"train_loss": -11.776330947875977, "global_step": 314024, "epoch": 1869} {"train_loss": -11.345392227172852, "global_step": 314025, "epoch": 1869} {"train_loss": -12.05648422241211, "global_step": 314026, "epoch": 1869} {"train_loss": -11.677054405212402, "global_step": 314027, "epoch": 1869} {"train_loss": -11.50275707244873, "global_step": 314028, "epoch": 1869} {"train_loss": -11.724918365478516, "global_step": 314029, "epoch": 1869} {"train_loss": -11.296789169311523, "global_step": 314030, "epoch": 1869} {"train_loss": -11.348390579223633, "global_step": 314031, "epoch": 1869} {"train_loss": -10.817903518676758, "global_step": 314032, "epoch": 1869} {"train_loss": -11.824410438537598, "global_step": 314033, "epoch": 1869} {"train_loss": -10.980405807495117, "global_step": 314034, "epoch": 1869} {"train_loss": -11.69743824005127, "global_step": 314035, "epoch": 1869} {"train_loss": -11.495853424072266, "global_step": 314036, "epoch": 1869} {"train_loss": -11.222808837890625, "global_step": 314037, "epoch": 1869} {"train_loss": -11.655384063720703, "global_step": 314038, "epoch": 1869} {"train_loss": -11.409984588623047, "global_step": 314039, "epoch": 1869} {"train_loss": -11.648104667663574, "global_step": 314040, "epoch": 1869} {"train_loss": -11.386099815368652, "global_step": 314041, "epoch": 1869} {"train_loss": -11.88214111328125, "global_step": 314042, "epoch": 1869} {"train_loss": -11.686041831970215, "global_step": 314043, "epoch": 1869} {"train_loss": -11.719878196716309, "global_step": 314044, "epoch": 1869} {"train_loss": -11.799100875854492, "global_step": 314045, "epoch": 1869} {"train_loss": -11.841634750366211, "global_step": 314046, "epoch": 1869} {"train_loss": -12.06824016571045, "global_step": 314047, "epoch": 1869} {"train_loss": -12.195563316345215, "global_step": 314048, "epoch": 1869} {"train_loss": -12.130453109741211, "global_step": 314049, "epoch": 1869} {"train_loss": -12.299428939819336, "global_step": 314050, "epoch": 1869} {"train_loss": -12.16740608215332, "global_step": 314051, "epoch": 1869} {"train_loss": -11.903867721557617, "global_step": 314052, "epoch": 1869} {"train_loss": -11.804364204406738, "global_step": 314053, "epoch": 1869} {"train_loss": -11.774250030517578, "global_step": 314054, "epoch": 1869} {"train_loss": -12.322017669677734, "global_step": 314055, "epoch": 1869} {"train_loss": -11.986047744750977, "global_step": 314056, "epoch": 1869} {"train_loss": -12.230379104614258, "global_step": 314057, "epoch": 1869} {"train_loss": -12.002544403076172, "global_step": 314058, "epoch": 1869} {"train_loss": -11.902154922485352, "global_step": 314059, "epoch": 1869} {"train_loss": -12.073116302490234, "global_step": 314060, "epoch": 1869} {"train_loss": -11.889432907104492, "global_step": 314061, "epoch": 1869} {"train_loss": -12.01095199584961, "global_step": 314062, "epoch": 1869} {"train_loss": -12.18081283569336, "global_step": 314063, "epoch": 1869} {"train_loss": -11.996953964233398, "global_step": 314064, "epoch": 1869} {"train_loss": -12.454116821289062, "global_step": 314065, "epoch": 1869} {"train_loss": -12.098848342895508, "global_step": 314066, "epoch": 1869} {"train_loss": -12.40286636352539, "global_step": 314067, "epoch": 1869} {"train_loss": -12.233356475830078, "global_step": 314068, "epoch": 1869} {"train_loss": -12.192524909973145, "global_step": 314069, "epoch": 1869} {"train_loss": -12.38123607635498, "global_step": 314070, "epoch": 1869} {"train_loss": -12.302059173583984, "global_step": 314071, "epoch": 1869} {"train_loss": -12.321720123291016, "global_step": 314072, "epoch": 1869} {"train_loss": -12.304985046386719, "global_step": 314073, "epoch": 1869} {"train_loss": -12.286397933959961, "global_step": 314074, "epoch": 1869} {"train_loss": -12.211453437805176, "global_step": 314075, "epoch": 1869} {"train_loss": -12.083837509155273, "global_step": 314076, "epoch": 1869} {"train_loss": -12.166813850402832, "global_step": 314077, "epoch": 1869} {"train_loss": -11.921835899353027, "global_step": 314078, "epoch": 1869} {"train_loss": -12.327842712402344, "global_step": 314079, "epoch": 1869} {"train_loss": -11.442401885986328, "global_step": 314080, "epoch": 1869} {"train_loss": -11.552953720092773, "global_step": 314081, "epoch": 1869} {"train_loss": -12.101842880249023, "global_step": 314082, "epoch": 1869} {"train_loss": -11.18275260925293, "global_step": 314083, "epoch": 1869} {"train_loss": -12.534309387207031, "global_step": 314084, "epoch": 1869} {"train_loss": -11.604381561279297, "global_step": 314085, "epoch": 1869} {"train_loss": -11.76699161529541, "global_step": 314086, "epoch": 1869} {"train_loss": -11.789375305175781, "global_step": 314087, "epoch": 1869} {"train_loss": -11.308368682861328, "global_step": 314088, "epoch": 1869} {"train_loss": -11.521739959716797, "global_step": 314089, "epoch": 1869} {"train_loss": -11.976722717285156, "global_step": 314090, "epoch": 1869} {"train_loss": -11.64059829711914, "global_step": 314091, "epoch": 1869} {"train_loss": -12.075521469116211, "global_step": 314092, "epoch": 1869} {"train_loss": -11.913496971130371, "global_step": 314093, "epoch": 1869} {"train_loss": -11.820798873901367, "global_step": 314094, "epoch": 1869} {"train_loss": -11.877058029174805, "global_step": 314095, "epoch": 1869} {"train_loss": -11.754646301269531, "global_step": 314096, "epoch": 1869} {"train_loss": -11.954362869262695, "global_step": 314097, "epoch": 1869} {"train_loss": -11.21676254272461, "global_step": 314098, "epoch": 1869} {"train_loss": -11.876452445983887, "global_step": 314099, "epoch": 1869} {"train_loss": -11.920324325561523, "global_step": 314100, "epoch": 1869} {"train_loss": -11.809167861938477, "global_step": 314101, "epoch": 1869} {"train_loss": -12.063474655151367, "global_step": 314102, "epoch": 1869} {"train_loss": -11.62963581085205, "global_step": 314103, "epoch": 1869} {"train_loss": -12.036111831665039, "global_step": 314104, "epoch": 1869} {"train_loss": -11.76173210144043, "global_step": 314105, "epoch": 1869} {"train_loss": -11.95237922668457, "global_step": 314106, "epoch": 1869} {"train_loss": -12.398650169372559, "global_step": 314107, "epoch": 1869} {"train_loss": -12.185636520385742, "global_step": 314108, "epoch": 1869} {"train_loss": -12.371095657348633, "global_step": 314109, "epoch": 1869} {"train_loss": -12.256027221679688, "global_step": 314110, "epoch": 1869} {"train_loss": -12.32100772857666, "global_step": 314111, "epoch": 1869} {"train_loss": -12.211509704589844, "global_step": 314112, "epoch": 1869} {"train_loss": -12.016870498657227, "global_step": 314113, "epoch": 1869} {"train_loss": -12.439250946044922, "global_step": 314114, "epoch": 1869} {"train_loss": -12.065079689025879, "global_step": 314115, "epoch": 1869} {"train_loss": -12.18401050567627, "global_step": 314116, "epoch": 1869} {"train_loss": -12.40436840057373, "global_step": 314117, "epoch": 1869} {"train_loss": -12.23905086517334, "global_step": 314118, "epoch": 1869} {"train_loss": -12.237726211547852, "global_step": 314119, "epoch": 1869} {"train_loss": -12.126344680786133, "global_step": 314120, "epoch": 1869} {"train_loss": -12.383275985717773, "global_step": 314121, "epoch": 1869} {"train_loss": -12.008447647094727, "global_step": 314122, "epoch": 1869} {"train_loss": -12.054651260375977, "global_step": 314123, "epoch": 1869} {"train_loss": -12.137923240661621, "global_step": 314124, "epoch": 1869} {"train_loss": -12.220745086669922, "global_step": 314125, "epoch": 1869} {"train_loss": -12.515396118164062, "global_step": 314126, "epoch": 1869} {"train_loss": -12.121736526489258, "global_step": 314127, "epoch": 1869} {"train_loss": -12.245758056640625, "global_step": 314128, "epoch": 1869} {"train_loss": -11.859846115112305, "global_step": 314129, "epoch": 1869} {"train_loss": -12.446181297302246, "global_step": 314130, "epoch": 1869} {"train_loss": -12.137401580810547, "global_step": 314131, "epoch": 1869} {"train_loss": -12.225547790527344, "global_step": 314132, "epoch": 1869} {"train_loss": -12.254708290100098, "global_step": 314133, "epoch": 1869} {"train_loss": -12.174787521362305, "global_step": 314134, "epoch": 1869} {"train_loss": -12.021743774414062, "global_step": 314135, "epoch": 1869} {"train_loss": -12.563701629638672, "global_step": 314136, "epoch": 1869} {"train_loss": -12.248973846435547, "global_step": 314137, "epoch": 1869} {"train_loss": -12.305328369140625, "global_step": 314138, "epoch": 1869} {"train_loss": -12.612592697143555, "global_step": 314139, "epoch": 1869} {"train_loss": -12.429304122924805, "global_step": 314140, "epoch": 1869} {"train_loss": -12.301870346069336, "global_step": 314141, "epoch": 1869} {"train_loss": -12.02090072631836, "global_step": 314142, "epoch": 1869} {"train_loss": -12.525829315185547, "global_step": 314143, "epoch": 1869} {"train_loss": -11.773736953735352, "global_step": 314144, "epoch": 1869} {"train_loss": -12.45710563659668, "global_step": 314145, "epoch": 1869} {"train_loss": -12.175230026245117, "global_step": 314146, "epoch": 1869} {"train_loss": -12.498834609985352, "global_step": 314147, "epoch": 1869} {"train_loss": -12.061190605163574, "global_step": 314148, "epoch": 1869} {"train_loss": -12.277063369750977, "global_step": 314149, "epoch": 1869} {"train_loss": -11.763883590698242, "global_step": 314150, "epoch": 1869} {"train_loss": -12.132335662841797, "global_step": 314151, "epoch": 1869} {"train_loss": -12.051315307617188, "global_step": 314152, "epoch": 1869} {"train_loss": -12.183124542236328, "global_step": 314153, "epoch": 1869} {"train_loss": -11.857863426208496, "global_step": 314154, "epoch": 1869} {"train_loss": -11.61140251159668, "global_step": 314155, "epoch": 1869} {"train_loss": -12.206685066223145, "global_step": 314156, "epoch": 1869} {"train_loss": -11.754497528076172, "global_step": 314157, "epoch": 1869} {"train_loss": -11.614892959594727, "global_step": 314158, "epoch": 1869} {"train_loss": -11.915267314229693, "global_step": 314159, "epoch": 1869, "val_loss": 279641.96875} {"train_loss": -11.988212585449219, "global_step": 314160, "epoch": 1870} {"train_loss": -12.152250289916992, "global_step": 314161, "epoch": 1870} {"train_loss": -11.628877639770508, "global_step": 314162, "epoch": 1870} {"train_loss": -12.180253982543945, "global_step": 314163, "epoch": 1870} {"train_loss": -11.716789245605469, "global_step": 314164, "epoch": 1870} {"train_loss": -11.639081954956055, "global_step": 314165, "epoch": 1870} {"train_loss": -11.319074630737305, "global_step": 314166, "epoch": 1870} {"train_loss": -11.320474624633789, "global_step": 314167, "epoch": 1870} {"train_loss": -11.317638397216797, "global_step": 314168, "epoch": 1870} {"train_loss": -11.243610382080078, "global_step": 314169, "epoch": 1870} {"train_loss": -10.805123329162598, "global_step": 314170, "epoch": 1870} {"train_loss": -11.78464126586914, "global_step": 314171, "epoch": 1870} {"train_loss": -11.53283977508545, "global_step": 314172, "epoch": 1870} {"train_loss": -10.952839851379395, "global_step": 314173, "epoch": 1870} {"train_loss": -12.194334983825684, "global_step": 314174, "epoch": 1870} {"train_loss": -11.136373519897461, "global_step": 314175, "epoch": 1870} {"train_loss": -11.746828079223633, "global_step": 314176, "epoch": 1870} {"train_loss": -11.618560791015625, "global_step": 314177, "epoch": 1870} {"train_loss": -12.171156883239746, "global_step": 314178, "epoch": 1870} {"train_loss": -11.94650650024414, "global_step": 314179, "epoch": 1870} {"train_loss": -11.747657775878906, "global_step": 314180, "epoch": 1870} {"train_loss": -12.08924674987793, "global_step": 314181, "epoch": 1870} {"train_loss": -11.794719696044922, "global_step": 314182, "epoch": 1870} {"train_loss": -12.06806755065918, "global_step": 314183, "epoch": 1870} {"train_loss": -12.233165740966797, "global_step": 314184, "epoch": 1870} {"train_loss": -11.712730407714844, "global_step": 314185, "epoch": 1870} {"train_loss": -11.603622436523438, "global_step": 314186, "epoch": 1870} {"train_loss": -12.061279296875, "global_step": 314187, "epoch": 1870} {"train_loss": -11.898118019104004, "global_step": 314188, "epoch": 1870} {"train_loss": -12.065263748168945, "global_step": 314189, "epoch": 1870} {"train_loss": -12.05215835571289, "global_step": 314190, "epoch": 1870} {"train_loss": -11.817136764526367, "global_step": 314191, "epoch": 1870} {"train_loss": -12.21052360534668, "global_step": 314192, "epoch": 1870} {"train_loss": -11.915510177612305, "global_step": 314193, "epoch": 1870} {"train_loss": -11.798882484436035, "global_step": 314194, "epoch": 1870} {"train_loss": -11.588423728942871, "global_step": 314195, "epoch": 1870} {"train_loss": -11.431017875671387, "global_step": 314196, "epoch": 1870} {"train_loss": -12.032258987426758, "global_step": 314197, "epoch": 1870} {"train_loss": -11.87550163269043, "global_step": 314198, "epoch": 1870} {"train_loss": -11.581522941589355, "global_step": 314199, "epoch": 1870} {"train_loss": -12.167706489562988, "global_step": 314200, "epoch": 1870} {"train_loss": -11.833195686340332, "global_step": 314201, "epoch": 1870} {"train_loss": -12.080215454101562, "global_step": 314202, "epoch": 1870} {"train_loss": -11.715425491333008, "global_step": 314203, "epoch": 1870} {"train_loss": -11.814370155334473, "global_step": 314204, "epoch": 1870} {"train_loss": -11.490472793579102, "global_step": 314205, "epoch": 1870} {"train_loss": -12.111806869506836, "global_step": 314206, "epoch": 1870} {"train_loss": -11.860668182373047, "global_step": 314207, "epoch": 1870} {"train_loss": -11.415468215942383, "global_step": 314208, "epoch": 1870} {"train_loss": -11.793779373168945, "global_step": 314209, "epoch": 1870} {"train_loss": -11.329561233520508, "global_step": 314210, "epoch": 1870} {"train_loss": -10.721052169799805, "global_step": 314211, "epoch": 1870} {"train_loss": -11.21126651763916, "global_step": 314212, "epoch": 1870} {"train_loss": -10.332599639892578, "global_step": 314213, "epoch": 1870} {"train_loss": -11.60427188873291, "global_step": 314214, "epoch": 1870} {"train_loss": -11.083630561828613, "global_step": 314215, "epoch": 1870} {"train_loss": -10.907838821411133, "global_step": 314216, "epoch": 1870} {"train_loss": -11.036354064941406, "global_step": 314217, "epoch": 1870} {"train_loss": -10.70231819152832, "global_step": 314218, "epoch": 1870} {"train_loss": -10.434350967407227, "global_step": 314219, "epoch": 1870} {"train_loss": -11.046890258789062, "global_step": 314220, "epoch": 1870} {"train_loss": -10.337475776672363, "global_step": 314221, "epoch": 1870} {"train_loss": -11.938619613647461, "global_step": 314222, "epoch": 1870} {"train_loss": -11.269643783569336, "global_step": 314223, "epoch": 1870} {"train_loss": -10.923749923706055, "global_step": 314224, "epoch": 1870} {"train_loss": -11.44531536102295, "global_step": 314225, "epoch": 1870} {"train_loss": -10.987543106079102, "global_step": 314226, "epoch": 1870} {"train_loss": -11.779199600219727, "global_step": 314227, "epoch": 1870} {"train_loss": -10.987607955932617, "global_step": 314228, "epoch": 1870} {"train_loss": -10.668704986572266, "global_step": 314229, "epoch": 1870} {"train_loss": -10.934492111206055, "global_step": 314230, "epoch": 1870} {"train_loss": -11.096656799316406, "global_step": 314231, "epoch": 1870} {"train_loss": -10.719179153442383, "global_step": 314232, "epoch": 1870} {"train_loss": -11.217336654663086, "global_step": 314233, "epoch": 1870} {"train_loss": -11.699562072753906, "global_step": 314234, "epoch": 1870} {"train_loss": -11.715736389160156, "global_step": 314235, "epoch": 1870} {"train_loss": -11.602700233459473, "global_step": 314236, "epoch": 1870} {"train_loss": -11.752342224121094, "global_step": 314237, "epoch": 1870} {"train_loss": -11.720010757446289, "global_step": 314238, "epoch": 1870} {"train_loss": -11.634187698364258, "global_step": 314239, "epoch": 1870} {"train_loss": -11.599092483520508, "global_step": 314240, "epoch": 1870} {"train_loss": -11.808025360107422, "global_step": 314241, "epoch": 1870} {"train_loss": -12.006441116333008, "global_step": 314242, "epoch": 1870} {"train_loss": -11.826700210571289, "global_step": 314243, "epoch": 1870} {"train_loss": -11.836977005004883, "global_step": 314244, "epoch": 1870} {"train_loss": -12.129878997802734, "global_step": 314245, "epoch": 1870} {"train_loss": -12.16952896118164, "global_step": 314246, "epoch": 1870} {"train_loss": -12.057586669921875, "global_step": 314247, "epoch": 1870} {"train_loss": -11.839316368103027, "global_step": 314248, "epoch": 1870} {"train_loss": -11.787420272827148, "global_step": 314249, "epoch": 1870} {"train_loss": -12.137635231018066, "global_step": 314250, "epoch": 1870} {"train_loss": -12.021024703979492, "global_step": 314251, "epoch": 1870} {"train_loss": -12.269023895263672, "global_step": 314252, "epoch": 1870} {"train_loss": -12.102887153625488, "global_step": 314253, "epoch": 1870} {"train_loss": -11.95580005645752, "global_step": 314254, "epoch": 1870} {"train_loss": -12.160866737365723, "global_step": 314255, "epoch": 1870} {"train_loss": -12.092540740966797, "global_step": 314256, "epoch": 1870} {"train_loss": -12.249914169311523, "global_step": 314257, "epoch": 1870} {"train_loss": -12.121713638305664, "global_step": 314258, "epoch": 1870} {"train_loss": -11.923491477966309, "global_step": 314259, "epoch": 1870} {"train_loss": -12.158056259155273, "global_step": 314260, "epoch": 1870} {"train_loss": -12.331487655639648, "global_step": 314261, "epoch": 1870} {"train_loss": -12.023895263671875, "global_step": 314262, "epoch": 1870} {"train_loss": -12.355751037597656, "global_step": 314263, "epoch": 1870} {"train_loss": -12.4567289352417, "global_step": 314264, "epoch": 1870} {"train_loss": -12.363597869873047, "global_step": 314265, "epoch": 1870} {"train_loss": -12.29069709777832, "global_step": 314266, "epoch": 1870} {"train_loss": -12.340675354003906, "global_step": 314267, "epoch": 1870} {"train_loss": -12.241849899291992, "global_step": 314268, "epoch": 1870} {"train_loss": -12.383922576904297, "global_step": 314269, "epoch": 1870} {"train_loss": -12.552286148071289, "global_step": 314270, "epoch": 1870} {"train_loss": -12.371308326721191, "global_step": 314271, "epoch": 1870} {"train_loss": -12.552519798278809, "global_step": 314272, "epoch": 1870} {"train_loss": -12.481014251708984, "global_step": 314273, "epoch": 1870} {"train_loss": -12.247591018676758, "global_step": 314274, "epoch": 1870} {"train_loss": -12.18467903137207, "global_step": 314275, "epoch": 1870} {"train_loss": -12.309953689575195, "global_step": 314276, "epoch": 1870} {"train_loss": -12.344758987426758, "global_step": 314277, "epoch": 1870} {"train_loss": -12.25838851928711, "global_step": 314278, "epoch": 1870} {"train_loss": -12.375997543334961, "global_step": 314279, "epoch": 1870} {"train_loss": -12.268901824951172, "global_step": 314280, "epoch": 1870} {"train_loss": -12.445232391357422, "global_step": 314281, "epoch": 1870} {"train_loss": -12.339621543884277, "global_step": 314282, "epoch": 1870} {"train_loss": -12.47717571258545, "global_step": 314283, "epoch": 1870} {"train_loss": -12.35234260559082, "global_step": 314284, "epoch": 1870} {"train_loss": -12.421730041503906, "global_step": 314285, "epoch": 1870} {"train_loss": -12.447603225708008, "global_step": 314286, "epoch": 1870} {"train_loss": -12.262791633605957, "global_step": 314287, "epoch": 1870} {"train_loss": -12.230781555175781, "global_step": 314288, "epoch": 1870} {"train_loss": -12.235833168029785, "global_step": 314289, "epoch": 1870} {"train_loss": -12.502889633178711, "global_step": 314290, "epoch": 1870} {"train_loss": -12.224977493286133, "global_step": 314291, "epoch": 1870} {"train_loss": -12.476251602172852, "global_step": 314292, "epoch": 1870} {"train_loss": -12.575237274169922, "global_step": 314293, "epoch": 1870} {"train_loss": -12.59778881072998, "global_step": 314294, "epoch": 1870} {"train_loss": -12.39923095703125, "global_step": 314295, "epoch": 1870} {"train_loss": -12.699056625366211, "global_step": 314296, "epoch": 1870} {"train_loss": -12.61600112915039, "global_step": 314297, "epoch": 1870} {"train_loss": -12.431877136230469, "global_step": 314298, "epoch": 1870} {"train_loss": -12.509551048278809, "global_step": 314299, "epoch": 1870} {"train_loss": -12.779397964477539, "global_step": 314300, "epoch": 1870} {"train_loss": -12.520904541015625, "global_step": 314301, "epoch": 1870} {"train_loss": -12.464401245117188, "global_step": 314302, "epoch": 1870} {"train_loss": -12.253223419189453, "global_step": 314303, "epoch": 1870} {"train_loss": -12.555547714233398, "global_step": 314304, "epoch": 1870} {"train_loss": -12.152149200439453, "global_step": 314305, "epoch": 1870} {"train_loss": -10.49751091003418, "global_step": 314306, "epoch": 1870} {"train_loss": -12.030618667602539, "global_step": 314307, "epoch": 1870} {"train_loss": -11.30181884765625, "global_step": 314308, "epoch": 1870} {"train_loss": -9.732038497924805, "global_step": 314309, "epoch": 1870} {"train_loss": -10.298728942871094, "global_step": 314310, "epoch": 1870} {"train_loss": -12.061009407043457, "global_step": 314311, "epoch": 1870} {"train_loss": -9.895910263061523, "global_step": 314312, "epoch": 1870} {"train_loss": -12.128277778625488, "global_step": 314313, "epoch": 1870} {"train_loss": -10.13250732421875, "global_step": 314314, "epoch": 1870} {"train_loss": -12.083642959594727, "global_step": 314315, "epoch": 1870} {"train_loss": -10.373077392578125, "global_step": 314316, "epoch": 1870} {"train_loss": -11.141677856445312, "global_step": 314317, "epoch": 1870} {"train_loss": -10.909884452819824, "global_step": 314318, "epoch": 1870} {"train_loss": -11.807889938354492, "global_step": 314319, "epoch": 1870} {"train_loss": -10.994729995727539, "global_step": 314320, "epoch": 1870} {"train_loss": -11.621156692504883, "global_step": 314321, "epoch": 1870} {"train_loss": -11.470697402954102, "global_step": 314322, "epoch": 1870} {"train_loss": -11.018402099609375, "global_step": 314323, "epoch": 1870} {"train_loss": -11.832854270935059, "global_step": 314324, "epoch": 1870} {"train_loss": -11.48981761932373, "global_step": 314325, "epoch": 1870} {"train_loss": -11.172525405883789, "global_step": 314326, "epoch": 1870} {"train_loss": -11.777080683481126, "global_step": 314327, "epoch": 1870, "val_loss": 287875.34375, "train_action_mse_error": 1.4368464946746826} {"train_loss": -10.665863037109375, "global_step": 314328, "epoch": 1871} {"train_loss": -10.92165756225586, "global_step": 314329, "epoch": 1871} {"train_loss": -11.089694023132324, "global_step": 314330, "epoch": 1871} {"train_loss": -10.416236877441406, "global_step": 314331, "epoch": 1871} {"train_loss": -11.533283233642578, "global_step": 314332, "epoch": 1871} {"train_loss": -10.317399024963379, "global_step": 314333, "epoch": 1871} {"train_loss": -11.648984909057617, "global_step": 314334, "epoch": 1871} {"train_loss": -11.020951271057129, "global_step": 314335, "epoch": 1871} {"train_loss": -11.447856903076172, "global_step": 314336, "epoch": 1871} {"train_loss": -11.709138870239258, "global_step": 314337, "epoch": 1871} {"train_loss": -10.965738296508789, "global_step": 314338, "epoch": 1871} {"train_loss": -11.567110061645508, "global_step": 314339, "epoch": 1871} {"train_loss": -11.268697738647461, "global_step": 314340, "epoch": 1871} {"train_loss": -11.74519157409668, "global_step": 314341, "epoch": 1871} {"train_loss": -11.342154502868652, "global_step": 314342, "epoch": 1871} {"train_loss": -11.463464736938477, "global_step": 314343, "epoch": 1871} {"train_loss": -11.911958694458008, "global_step": 314344, "epoch": 1871} {"train_loss": -11.437257766723633, "global_step": 314345, "epoch": 1871} {"train_loss": -11.746667861938477, "global_step": 314346, "epoch": 1871} {"train_loss": -11.51530647277832, "global_step": 314347, "epoch": 1871} {"train_loss": -11.73613166809082, "global_step": 314348, "epoch": 1871} {"train_loss": -11.834725379943848, "global_step": 314349, "epoch": 1871} {"train_loss": -11.770963668823242, "global_step": 314350, "epoch": 1871} {"train_loss": -11.893487930297852, "global_step": 314351, "epoch": 1871} {"train_loss": -12.051109313964844, "global_step": 314352, "epoch": 1871} {"train_loss": -11.861898422241211, "global_step": 314353, "epoch": 1871} {"train_loss": -12.171546936035156, "global_step": 314354, "epoch": 1871} {"train_loss": -12.284801483154297, "global_step": 314355, "epoch": 1871} {"train_loss": -12.080217361450195, "global_step": 314356, "epoch": 1871} {"train_loss": -11.986400604248047, "global_step": 314357, "epoch": 1871} {"train_loss": -12.12441635131836, "global_step": 314358, "epoch": 1871} {"train_loss": -12.284708023071289, "global_step": 314359, "epoch": 1871} {"train_loss": -12.249034881591797, "global_step": 314360, "epoch": 1871} {"train_loss": -12.420388221740723, "global_step": 314361, "epoch": 1871} {"train_loss": -12.270914077758789, "global_step": 314362, "epoch": 1871} {"train_loss": -12.31857967376709, "global_step": 314363, "epoch": 1871} {"train_loss": -12.265932083129883, "global_step": 314364, "epoch": 1871} {"train_loss": -12.340994834899902, "global_step": 314365, "epoch": 1871} {"train_loss": -12.601849555969238, "global_step": 314366, "epoch": 1871} {"train_loss": -12.081230163574219, "global_step": 314367, "epoch": 1871} {"train_loss": -12.318985939025879, "global_step": 314368, "epoch": 1871} {"train_loss": -12.315664291381836, "global_step": 314369, "epoch": 1871} {"train_loss": -12.528480529785156, "global_step": 314370, "epoch": 1871} {"train_loss": -12.393045425415039, "global_step": 314371, "epoch": 1871} {"train_loss": -12.056695938110352, "global_step": 314372, "epoch": 1871} {"train_loss": -12.245004653930664, "global_step": 314373, "epoch": 1871} {"train_loss": -12.281135559082031, "global_step": 314374, "epoch": 1871} {"train_loss": -12.249902725219727, "global_step": 314375, "epoch": 1871} {"train_loss": -12.267284393310547, "global_step": 314376, "epoch": 1871} {"train_loss": -12.463567733764648, "global_step": 314377, "epoch": 1871} {"train_loss": -12.12497329711914, "global_step": 314378, "epoch": 1871} {"train_loss": -12.455862045288086, "global_step": 314379, "epoch": 1871} {"train_loss": -12.011362075805664, "global_step": 314380, "epoch": 1871} {"train_loss": -12.151684761047363, "global_step": 314381, "epoch": 1871} {"train_loss": -12.32362174987793, "global_step": 314382, "epoch": 1871} {"train_loss": -11.971322059631348, "global_step": 314383, "epoch": 1871} {"train_loss": -12.42829704284668, "global_step": 314384, "epoch": 1871} {"train_loss": -12.380541801452637, "global_step": 314385, "epoch": 1871} {"train_loss": -12.14798641204834, "global_step": 314386, "epoch": 1871} {"train_loss": -12.203163146972656, "global_step": 314387, "epoch": 1871} {"train_loss": -12.557150840759277, "global_step": 314388, "epoch": 1871} {"train_loss": -11.792688369750977, "global_step": 314389, "epoch": 1871} {"train_loss": -11.333762168884277, "global_step": 314390, "epoch": 1871} {"train_loss": -11.840156555175781, "global_step": 314391, "epoch": 1871} {"train_loss": -12.42941665649414, "global_step": 314392, "epoch": 1871} {"train_loss": -12.02728271484375, "global_step": 314393, "epoch": 1871} {"train_loss": -11.750944137573242, "global_step": 314394, "epoch": 1871} {"train_loss": -12.269628524780273, "global_step": 314395, "epoch": 1871} {"train_loss": -12.158926010131836, "global_step": 314396, "epoch": 1871} {"train_loss": -12.210927963256836, "global_step": 314397, "epoch": 1871} {"train_loss": -12.59646987915039, "global_step": 314398, "epoch": 1871} {"train_loss": -12.131023406982422, "global_step": 314399, "epoch": 1871} {"train_loss": -12.322244644165039, "global_step": 314400, "epoch": 1871} {"train_loss": -12.238439559936523, "global_step": 314401, "epoch": 1871} {"train_loss": -12.174217224121094, "global_step": 314402, "epoch": 1871} {"train_loss": -12.08208179473877, "global_step": 314403, "epoch": 1871} {"train_loss": -12.282073974609375, "global_step": 314404, "epoch": 1871} {"train_loss": -11.838918685913086, "global_step": 314405, "epoch": 1871} {"train_loss": -12.39212703704834, "global_step": 314406, "epoch": 1871} {"train_loss": -12.210784912109375, "global_step": 314407, "epoch": 1871} {"train_loss": -12.178828239440918, "global_step": 314408, "epoch": 1871} {"train_loss": -12.204023361206055, "global_step": 314409, "epoch": 1871} {"train_loss": -12.559160232543945, "global_step": 314410, "epoch": 1871} {"train_loss": -12.149477005004883, "global_step": 314411, "epoch": 1871} {"train_loss": -11.902484893798828, "global_step": 314412, "epoch": 1871} {"train_loss": -12.462220191955566, "global_step": 314413, "epoch": 1871} {"train_loss": -12.29350757598877, "global_step": 314414, "epoch": 1871} {"train_loss": -12.354930877685547, "global_step": 314415, "epoch": 1871} {"train_loss": -12.46383285522461, "global_step": 314416, "epoch": 1871} {"train_loss": -12.477190017700195, "global_step": 314417, "epoch": 1871} {"train_loss": -12.28701114654541, "global_step": 314418, "epoch": 1871} {"train_loss": -12.517905235290527, "global_step": 314419, "epoch": 1871} {"train_loss": -12.282327651977539, "global_step": 314420, "epoch": 1871} {"train_loss": -11.813735961914062, "global_step": 314421, "epoch": 1871} {"train_loss": -11.981171607971191, "global_step": 314422, "epoch": 1871} {"train_loss": -12.352764129638672, "global_step": 314423, "epoch": 1871} {"train_loss": -11.839000701904297, "global_step": 314424, "epoch": 1871} {"train_loss": -11.422088623046875, "global_step": 314425, "epoch": 1871} {"train_loss": -12.360794067382812, "global_step": 314426, "epoch": 1871} {"train_loss": -12.257746696472168, "global_step": 314427, "epoch": 1871} {"train_loss": -11.212139129638672, "global_step": 314428, "epoch": 1871} {"train_loss": -11.74510383605957, "global_step": 314429, "epoch": 1871} {"train_loss": -12.370439529418945, "global_step": 314430, "epoch": 1871} {"train_loss": -11.504459381103516, "global_step": 314431, "epoch": 1871} {"train_loss": -11.487226486206055, "global_step": 314432, "epoch": 1871} {"train_loss": -11.523287773132324, "global_step": 314433, "epoch": 1871} {"train_loss": -11.410285949707031, "global_step": 314434, "epoch": 1871} {"train_loss": -10.372882843017578, "global_step": 314435, "epoch": 1871} {"train_loss": -10.844925880432129, "global_step": 314436, "epoch": 1871} {"train_loss": -9.776239395141602, "global_step": 314437, "epoch": 1871} {"train_loss": -11.177377700805664, "global_step": 314438, "epoch": 1871} {"train_loss": -11.08576774597168, "global_step": 314439, "epoch": 1871} {"train_loss": -10.494245529174805, "global_step": 314440, "epoch": 1871} {"train_loss": -11.595661163330078, "global_step": 314441, "epoch": 1871} {"train_loss": -10.588689804077148, "global_step": 314442, "epoch": 1871} {"train_loss": -12.044515609741211, "global_step": 314443, "epoch": 1871} {"train_loss": -10.765518188476562, "global_step": 314444, "epoch": 1871} {"train_loss": -11.872736930847168, "global_step": 314445, "epoch": 1871} {"train_loss": -11.301055908203125, "global_step": 314446, "epoch": 1871} {"train_loss": -10.887929916381836, "global_step": 314447, "epoch": 1871} {"train_loss": -12.10862922668457, "global_step": 314448, "epoch": 1871} {"train_loss": -11.395951271057129, "global_step": 314449, "epoch": 1871} {"train_loss": -10.889233589172363, "global_step": 314450, "epoch": 1871} {"train_loss": -11.521350860595703, "global_step": 314451, "epoch": 1871} {"train_loss": -10.453777313232422, "global_step": 314452, "epoch": 1871} {"train_loss": -11.315668106079102, "global_step": 314453, "epoch": 1871} {"train_loss": -10.479223251342773, "global_step": 314454, "epoch": 1871} {"train_loss": -11.23991584777832, "global_step": 314455, "epoch": 1871} {"train_loss": -11.204845428466797, "global_step": 314456, "epoch": 1871} {"train_loss": -11.35464859008789, "global_step": 314457, "epoch": 1871} {"train_loss": -11.626572608947754, "global_step": 314458, "epoch": 1871} {"train_loss": -11.190998077392578, "global_step": 314459, "epoch": 1871} {"train_loss": -11.933441162109375, "global_step": 314460, "epoch": 1871} {"train_loss": -11.002286911010742, "global_step": 314461, "epoch": 1871} {"train_loss": -11.956300735473633, "global_step": 314462, "epoch": 1871} {"train_loss": -11.628373146057129, "global_step": 314463, "epoch": 1871} {"train_loss": -11.415472030639648, "global_step": 314464, "epoch": 1871} {"train_loss": -11.964029312133789, "global_step": 314465, "epoch": 1871} {"train_loss": -11.716575622558594, "global_step": 314466, "epoch": 1871} {"train_loss": -11.926143646240234, "global_step": 314467, "epoch": 1871} {"train_loss": -11.591306686401367, "global_step": 314468, "epoch": 1871} {"train_loss": -11.648280143737793, "global_step": 314469, "epoch": 1871} {"train_loss": -12.033498764038086, "global_step": 314470, "epoch": 1871} {"train_loss": -11.475261688232422, "global_step": 314471, "epoch": 1871} {"train_loss": -11.664521217346191, "global_step": 314472, "epoch": 1871} {"train_loss": -11.68055248260498, "global_step": 314473, "epoch": 1871} {"train_loss": -11.318303108215332, "global_step": 314474, "epoch": 1871} {"train_loss": -12.108071327209473, "global_step": 314475, "epoch": 1871} {"train_loss": -11.477434158325195, "global_step": 314476, "epoch": 1871} {"train_loss": -11.822538375854492, "global_step": 314477, "epoch": 1871} {"train_loss": -11.974395751953125, "global_step": 314478, "epoch": 1871} {"train_loss": -11.877382278442383, "global_step": 314479, "epoch": 1871} {"train_loss": -12.003196716308594, "global_step": 314480, "epoch": 1871} {"train_loss": -11.541997909545898, "global_step": 314481, "epoch": 1871} {"train_loss": -11.65277099609375, "global_step": 314482, "epoch": 1871} {"train_loss": -11.826616287231445, "global_step": 314483, "epoch": 1871} {"train_loss": -11.517277717590332, "global_step": 314484, "epoch": 1871} {"train_loss": -11.50284481048584, "global_step": 314485, "epoch": 1871} {"train_loss": -10.326140403747559, "global_step": 314486, "epoch": 1871} {"train_loss": -12.249940872192383, "global_step": 314487, "epoch": 1871} {"train_loss": -11.483123779296875, "global_step": 314488, "epoch": 1871} {"train_loss": -11.061700820922852, "global_step": 314489, "epoch": 1871} {"train_loss": -11.397671699523926, "global_step": 314490, "epoch": 1871} {"train_loss": -11.195633888244629, "global_step": 314491, "epoch": 1871} {"train_loss": -11.604887962341309, "global_step": 314492, "epoch": 1871} {"train_loss": -11.599945068359375, "global_step": 314493, "epoch": 1871} {"train_loss": -11.246464729309082, "global_step": 314494, "epoch": 1871} {"train_loss": -11.769495220411391, "global_step": 314495, "epoch": 1871, "val_loss": 286829.40625} {"train_loss": -11.996166229248047, "global_step": 314496, "epoch": 1872} {"train_loss": -11.737428665161133, "global_step": 314497, "epoch": 1872} {"train_loss": -11.859859466552734, "global_step": 314498, "epoch": 1872} {"train_loss": -11.701014518737793, "global_step": 314499, "epoch": 1872} {"train_loss": -11.635025024414062, "global_step": 314500, "epoch": 1872} {"train_loss": -11.079146385192871, "global_step": 314501, "epoch": 1872} {"train_loss": -12.061365127563477, "global_step": 314502, "epoch": 1872} {"train_loss": -10.995254516601562, "global_step": 314503, "epoch": 1872} {"train_loss": -11.728358268737793, "global_step": 314504, "epoch": 1872} {"train_loss": -10.97974967956543, "global_step": 314505, "epoch": 1872} {"train_loss": -11.416128158569336, "global_step": 314506, "epoch": 1872} {"train_loss": -11.530266761779785, "global_step": 314507, "epoch": 1872} {"train_loss": -11.135374069213867, "global_step": 314508, "epoch": 1872} {"train_loss": -11.317760467529297, "global_step": 314509, "epoch": 1872} {"train_loss": -11.797015190124512, "global_step": 314510, "epoch": 1872} {"train_loss": -11.488238334655762, "global_step": 314511, "epoch": 1872} {"train_loss": -11.693846702575684, "global_step": 314512, "epoch": 1872} {"train_loss": -11.172182083129883, "global_step": 314513, "epoch": 1872} {"train_loss": -11.766295433044434, "global_step": 314514, "epoch": 1872} {"train_loss": -11.325648307800293, "global_step": 314515, "epoch": 1872} {"train_loss": -11.420971870422363, "global_step": 314516, "epoch": 1872} {"train_loss": -11.757190704345703, "global_step": 314517, "epoch": 1872} {"train_loss": -11.544194221496582, "global_step": 314518, "epoch": 1872} {"train_loss": -12.048990249633789, "global_step": 314519, "epoch": 1872} {"train_loss": -11.586783409118652, "global_step": 314520, "epoch": 1872} {"train_loss": -12.197057723999023, "global_step": 314521, "epoch": 1872} {"train_loss": -11.919475555419922, "global_step": 314522, "epoch": 1872} {"train_loss": -12.048421859741211, "global_step": 314523, "epoch": 1872} {"train_loss": -11.931286811828613, "global_step": 314524, "epoch": 1872} {"train_loss": -12.162023544311523, "global_step": 314525, "epoch": 1872} {"train_loss": -11.451644897460938, "global_step": 314526, "epoch": 1872} {"train_loss": -12.36089038848877, "global_step": 314527, "epoch": 1872} {"train_loss": -11.675581932067871, "global_step": 314528, "epoch": 1872} {"train_loss": -12.236007690429688, "global_step": 314529, "epoch": 1872} {"train_loss": -11.856517791748047, "global_step": 314530, "epoch": 1872} {"train_loss": -12.194074630737305, "global_step": 314531, "epoch": 1872} {"train_loss": -12.281455039978027, "global_step": 314532, "epoch": 1872} {"train_loss": -12.104161262512207, "global_step": 314533, "epoch": 1872} {"train_loss": -12.102466583251953, "global_step": 314534, "epoch": 1872} {"train_loss": -11.957157135009766, "global_step": 314535, "epoch": 1872} {"train_loss": -12.092798233032227, "global_step": 314536, "epoch": 1872} {"train_loss": -11.781820297241211, "global_step": 314537, "epoch": 1872} {"train_loss": -12.244850158691406, "global_step": 314538, "epoch": 1872} {"train_loss": -11.75330924987793, "global_step": 314539, "epoch": 1872} {"train_loss": -12.22689437866211, "global_step": 314540, "epoch": 1872} {"train_loss": -12.064249038696289, "global_step": 314541, "epoch": 1872} {"train_loss": -11.97458267211914, "global_step": 314542, "epoch": 1872} {"train_loss": -11.931846618652344, "global_step": 314543, "epoch": 1872} {"train_loss": -12.12180233001709, "global_step": 314544, "epoch": 1872} {"train_loss": -12.166780471801758, "global_step": 314545, "epoch": 1872} {"train_loss": -12.388072967529297, "global_step": 314546, "epoch": 1872} {"train_loss": -12.334195137023926, "global_step": 314547, "epoch": 1872} {"train_loss": -12.284682273864746, "global_step": 314548, "epoch": 1872} {"train_loss": -12.400413513183594, "global_step": 314549, "epoch": 1872} {"train_loss": -12.339102745056152, "global_step": 314550, "epoch": 1872} {"train_loss": -12.438224792480469, "global_step": 314551, "epoch": 1872} {"train_loss": -12.35391616821289, "global_step": 314552, "epoch": 1872} {"train_loss": -12.298965454101562, "global_step": 314553, "epoch": 1872} {"train_loss": -12.144449234008789, "global_step": 314554, "epoch": 1872} {"train_loss": -12.290757179260254, "global_step": 314555, "epoch": 1872} {"train_loss": -12.28341293334961, "global_step": 314556, "epoch": 1872} {"train_loss": -11.997486114501953, "global_step": 314557, "epoch": 1872} {"train_loss": -12.030684471130371, "global_step": 314558, "epoch": 1872} {"train_loss": -11.916535377502441, "global_step": 314559, "epoch": 1872} {"train_loss": -12.24942684173584, "global_step": 314560, "epoch": 1872} {"train_loss": -12.270147323608398, "global_step": 314561, "epoch": 1872} {"train_loss": -12.330060005187988, "global_step": 314562, "epoch": 1872} {"train_loss": -11.892810821533203, "global_step": 314563, "epoch": 1872} {"train_loss": -12.003841400146484, "global_step": 314564, "epoch": 1872} {"train_loss": -12.273687362670898, "global_step": 314565, "epoch": 1872} {"train_loss": -11.937320709228516, "global_step": 314566, "epoch": 1872} {"train_loss": -11.964116096496582, "global_step": 314567, "epoch": 1872} {"train_loss": -11.457252502441406, "global_step": 314568, "epoch": 1872} {"train_loss": -11.993807792663574, "global_step": 314569, "epoch": 1872} {"train_loss": -12.11121654510498, "global_step": 314570, "epoch": 1872} {"train_loss": -11.896675109863281, "global_step": 314571, "epoch": 1872} {"train_loss": -12.33469295501709, "global_step": 314572, "epoch": 1872} {"train_loss": -11.90098762512207, "global_step": 314573, "epoch": 1872} {"train_loss": -12.483671188354492, "global_step": 314574, "epoch": 1872} {"train_loss": -12.094024658203125, "global_step": 314575, "epoch": 1872} {"train_loss": -12.146621704101562, "global_step": 314576, "epoch": 1872} {"train_loss": -11.760894775390625, "global_step": 314577, "epoch": 1872} {"train_loss": -12.298985481262207, "global_step": 314578, "epoch": 1872} {"train_loss": -12.394214630126953, "global_step": 314579, "epoch": 1872} {"train_loss": -12.043414115905762, "global_step": 314580, "epoch": 1872} {"train_loss": -12.430967330932617, "global_step": 314581, "epoch": 1872} {"train_loss": -12.306774139404297, "global_step": 314582, "epoch": 1872} {"train_loss": -11.925714492797852, "global_step": 314583, "epoch": 1872} {"train_loss": -12.134081840515137, "global_step": 314584, "epoch": 1872} {"train_loss": -11.942584991455078, "global_step": 314585, "epoch": 1872} {"train_loss": -12.588445663452148, "global_step": 314586, "epoch": 1872} {"train_loss": -11.733458518981934, "global_step": 314587, "epoch": 1872} {"train_loss": -12.39799690246582, "global_step": 314588, "epoch": 1872} {"train_loss": -12.180216789245605, "global_step": 314589, "epoch": 1872} {"train_loss": -12.300821304321289, "global_step": 314590, "epoch": 1872} {"train_loss": -12.190359115600586, "global_step": 314591, "epoch": 1872} {"train_loss": -12.320984840393066, "global_step": 314592, "epoch": 1872} {"train_loss": -12.126789093017578, "global_step": 314593, "epoch": 1872} {"train_loss": -12.467531204223633, "global_step": 314594, "epoch": 1872} {"train_loss": -12.188335418701172, "global_step": 314595, "epoch": 1872} {"train_loss": -12.139352798461914, "global_step": 314596, "epoch": 1872} {"train_loss": -12.389041900634766, "global_step": 314597, "epoch": 1872} {"train_loss": -12.609957695007324, "global_step": 314598, "epoch": 1872} {"train_loss": -12.131200790405273, "global_step": 314599, "epoch": 1872} {"train_loss": -12.453567504882812, "global_step": 314600, "epoch": 1872} {"train_loss": -12.319082260131836, "global_step": 314601, "epoch": 1872} {"train_loss": -12.057014465332031, "global_step": 314602, "epoch": 1872} {"train_loss": -11.742201805114746, "global_step": 314603, "epoch": 1872} {"train_loss": -11.888412475585938, "global_step": 314604, "epoch": 1872} {"train_loss": -12.15192699432373, "global_step": 314605, "epoch": 1872} {"train_loss": -11.62509536743164, "global_step": 314606, "epoch": 1872} {"train_loss": -12.025227546691895, "global_step": 314607, "epoch": 1872} {"train_loss": -12.240381240844727, "global_step": 314608, "epoch": 1872} {"train_loss": -11.362234115600586, "global_step": 314609, "epoch": 1872} {"train_loss": -11.392507553100586, "global_step": 314610, "epoch": 1872} {"train_loss": -11.978225708007812, "global_step": 314611, "epoch": 1872} {"train_loss": -12.121437072753906, "global_step": 314612, "epoch": 1872} {"train_loss": -12.136251449584961, "global_step": 314613, "epoch": 1872} {"train_loss": -12.177285194396973, "global_step": 314614, "epoch": 1872} {"train_loss": -11.937915802001953, "global_step": 314615, "epoch": 1872} {"train_loss": -12.059971809387207, "global_step": 314616, "epoch": 1872} {"train_loss": -12.033805847167969, "global_step": 314617, "epoch": 1872} {"train_loss": -11.733358383178711, "global_step": 314618, "epoch": 1872} {"train_loss": -11.554283142089844, "global_step": 314619, "epoch": 1872} {"train_loss": -10.976896286010742, "global_step": 314620, "epoch": 1872} {"train_loss": -10.78584098815918, "global_step": 314621, "epoch": 1872} {"train_loss": -12.04903793334961, "global_step": 314622, "epoch": 1872} {"train_loss": -10.749037742614746, "global_step": 314623, "epoch": 1872} {"train_loss": -11.500345230102539, "global_step": 314624, "epoch": 1872} {"train_loss": -11.724071502685547, "global_step": 314625, "epoch": 1872} {"train_loss": -11.30301284790039, "global_step": 314626, "epoch": 1872} {"train_loss": -12.005751609802246, "global_step": 314627, "epoch": 1872} {"train_loss": -11.482272148132324, "global_step": 314628, "epoch": 1872} {"train_loss": -11.72858715057373, "global_step": 314629, "epoch": 1872} {"train_loss": -11.380044937133789, "global_step": 314630, "epoch": 1872} {"train_loss": -12.035942077636719, "global_step": 314631, "epoch": 1872} {"train_loss": -11.669898986816406, "global_step": 314632, "epoch": 1872} {"train_loss": -11.539430618286133, "global_step": 314633, "epoch": 1872} {"train_loss": -11.64258098602295, "global_step": 314634, "epoch": 1872} {"train_loss": -11.25456428527832, "global_step": 314635, "epoch": 1872} {"train_loss": -11.623720169067383, "global_step": 314636, "epoch": 1872} {"train_loss": -11.634748458862305, "global_step": 314637, "epoch": 1872} {"train_loss": -11.023334503173828, "global_step": 314638, "epoch": 1872} {"train_loss": -11.569440841674805, "global_step": 314639, "epoch": 1872} {"train_loss": -11.137459754943848, "global_step": 314640, "epoch": 1872} {"train_loss": -11.550827026367188, "global_step": 314641, "epoch": 1872} {"train_loss": -11.78370475769043, "global_step": 314642, "epoch": 1872} {"train_loss": -11.802358627319336, "global_step": 314643, "epoch": 1872} {"train_loss": -11.741788864135742, "global_step": 314644, "epoch": 1872} {"train_loss": -11.82153034210205, "global_step": 314645, "epoch": 1872} {"train_loss": -11.876368522644043, "global_step": 314646, "epoch": 1872} {"train_loss": -11.509683609008789, "global_step": 314647, "epoch": 1872} {"train_loss": -11.904956817626953, "global_step": 314648, "epoch": 1872} {"train_loss": -11.638374328613281, "global_step": 314649, "epoch": 1872} {"train_loss": -10.478473663330078, "global_step": 314650, "epoch": 1872} {"train_loss": -10.716970443725586, "global_step": 314651, "epoch": 1872} {"train_loss": -11.193098068237305, "global_step": 314652, "epoch": 1872} {"train_loss": -10.977104187011719, "global_step": 314653, "epoch": 1872} {"train_loss": -10.859018325805664, "global_step": 314654, "epoch": 1872} {"train_loss": -11.109521865844727, "global_step": 314655, "epoch": 1872} {"train_loss": -11.397432327270508, "global_step": 314656, "epoch": 1872} {"train_loss": -11.620784759521484, "global_step": 314657, "epoch": 1872} {"train_loss": -11.159950256347656, "global_step": 314658, "epoch": 1872} {"train_loss": -11.061933517456055, "global_step": 314659, "epoch": 1872} {"train_loss": -11.78759765625, "global_step": 314660, "epoch": 1872} {"train_loss": -11.122441291809082, "global_step": 314661, "epoch": 1872} {"train_loss": -11.785294532775879, "global_step": 314662, "epoch": 1872} {"train_loss": -11.842936396598816, "global_step": 314663, "epoch": 1872, "val_loss": 284656.875} {"train_loss": -10.462878227233887, "global_step": 314664, "epoch": 1873} {"train_loss": -11.852879524230957, "global_step": 314665, "epoch": 1873} {"train_loss": -10.744881629943848, "global_step": 314666, "epoch": 1873} {"train_loss": -11.80601978302002, "global_step": 314667, "epoch": 1873} {"train_loss": -11.011409759521484, "global_step": 314668, "epoch": 1873} {"train_loss": -11.780569076538086, "global_step": 314669, "epoch": 1873} {"train_loss": -11.850189208984375, "global_step": 314670, "epoch": 1873} {"train_loss": -11.71910572052002, "global_step": 314671, "epoch": 1873} {"train_loss": -11.931259155273438, "global_step": 314672, "epoch": 1873} {"train_loss": -11.975133895874023, "global_step": 314673, "epoch": 1873} {"train_loss": -11.710243225097656, "global_step": 314674, "epoch": 1873} {"train_loss": -12.27383804321289, "global_step": 314675, "epoch": 1873} {"train_loss": -12.01282024383545, "global_step": 314676, "epoch": 1873} {"train_loss": -11.869781494140625, "global_step": 314677, "epoch": 1873} {"train_loss": -12.193811416625977, "global_step": 314678, "epoch": 1873} {"train_loss": -11.969902992248535, "global_step": 314679, "epoch": 1873} {"train_loss": -11.964874267578125, "global_step": 314680, "epoch": 1873} {"train_loss": -12.02940845489502, "global_step": 314681, "epoch": 1873} {"train_loss": -11.497081756591797, "global_step": 314682, "epoch": 1873} {"train_loss": -12.163673400878906, "global_step": 314683, "epoch": 1873} {"train_loss": -11.629680633544922, "global_step": 314684, "epoch": 1873} {"train_loss": -12.188024520874023, "global_step": 314685, "epoch": 1873} {"train_loss": -11.96596622467041, "global_step": 314686, "epoch": 1873} {"train_loss": -11.599122047424316, "global_step": 314687, "epoch": 1873} {"train_loss": -12.25727367401123, "global_step": 314688, "epoch": 1873} {"train_loss": -11.633871078491211, "global_step": 314689, "epoch": 1873} {"train_loss": -11.892601013183594, "global_step": 314690, "epoch": 1873} {"train_loss": -11.856094360351562, "global_step": 314691, "epoch": 1873} {"train_loss": -11.391382217407227, "global_step": 314692, "epoch": 1873} {"train_loss": -12.095836639404297, "global_step": 314693, "epoch": 1873} {"train_loss": -11.336441993713379, "global_step": 314694, "epoch": 1873} {"train_loss": -11.95338249206543, "global_step": 314695, "epoch": 1873} {"train_loss": -12.112032890319824, "global_step": 314696, "epoch": 1873} {"train_loss": -11.441819190979004, "global_step": 314697, "epoch": 1873} {"train_loss": -12.11731243133545, "global_step": 314698, "epoch": 1873} {"train_loss": -11.749963760375977, "global_step": 314699, "epoch": 1873} {"train_loss": -11.970870018005371, "global_step": 314700, "epoch": 1873} {"train_loss": -12.348505020141602, "global_step": 314701, "epoch": 1873} {"train_loss": -11.914521217346191, "global_step": 314702, "epoch": 1873} {"train_loss": -12.210901260375977, "global_step": 314703, "epoch": 1873} {"train_loss": -11.933609008789062, "global_step": 314704, "epoch": 1873} {"train_loss": -12.146929740905762, "global_step": 314705, "epoch": 1873} {"train_loss": -12.202281951904297, "global_step": 314706, "epoch": 1873} {"train_loss": -11.79568862915039, "global_step": 314707, "epoch": 1873} {"train_loss": -12.037832260131836, "global_step": 314708, "epoch": 1873} {"train_loss": -12.24665355682373, "global_step": 314709, "epoch": 1873} {"train_loss": -11.969284057617188, "global_step": 314710, "epoch": 1873} {"train_loss": -12.23488998413086, "global_step": 314711, "epoch": 1873} {"train_loss": -12.0340576171875, "global_step": 314712, "epoch": 1873} {"train_loss": -11.971893310546875, "global_step": 314713, "epoch": 1873} {"train_loss": -12.171335220336914, "global_step": 314714, "epoch": 1873} {"train_loss": -12.02101993560791, "global_step": 314715, "epoch": 1873} {"train_loss": -12.059089660644531, "global_step": 314716, "epoch": 1873} {"train_loss": -11.678573608398438, "global_step": 314717, "epoch": 1873} {"train_loss": -11.748897552490234, "global_step": 314718, "epoch": 1873} {"train_loss": -11.869702339172363, "global_step": 314719, "epoch": 1873} {"train_loss": -11.578409194946289, "global_step": 314720, "epoch": 1873} {"train_loss": -12.394044876098633, "global_step": 314721, "epoch": 1873} {"train_loss": -11.89407730102539, "global_step": 314722, "epoch": 1873} {"train_loss": -11.828110694885254, "global_step": 314723, "epoch": 1873} {"train_loss": -12.113018035888672, "global_step": 314724, "epoch": 1873} {"train_loss": -11.722585678100586, "global_step": 314725, "epoch": 1873} {"train_loss": -11.99081802368164, "global_step": 314726, "epoch": 1873} {"train_loss": -11.699413299560547, "global_step": 314727, "epoch": 1873} {"train_loss": -11.572040557861328, "global_step": 314728, "epoch": 1873} {"train_loss": -11.882027626037598, "global_step": 314729, "epoch": 1873} {"train_loss": -11.126814842224121, "global_step": 314730, "epoch": 1873} {"train_loss": -11.358946800231934, "global_step": 314731, "epoch": 1873} {"train_loss": -11.869738578796387, "global_step": 314732, "epoch": 1873} {"train_loss": -11.690092086791992, "global_step": 314733, "epoch": 1873} {"train_loss": -12.125219345092773, "global_step": 314734, "epoch": 1873} {"train_loss": -11.596972465515137, "global_step": 314735, "epoch": 1873} {"train_loss": -12.046696662902832, "global_step": 314736, "epoch": 1873} {"train_loss": -11.749241828918457, "global_step": 314737, "epoch": 1873} {"train_loss": -12.041094779968262, "global_step": 314738, "epoch": 1873} {"train_loss": -11.87978744506836, "global_step": 314739, "epoch": 1873} {"train_loss": -12.260753631591797, "global_step": 314740, "epoch": 1873} {"train_loss": -11.747431755065918, "global_step": 314741, "epoch": 1873} {"train_loss": -12.195237159729004, "global_step": 314742, "epoch": 1873} {"train_loss": -11.90550422668457, "global_step": 314743, "epoch": 1873} {"train_loss": -12.08316421508789, "global_step": 314744, "epoch": 1873} {"train_loss": -12.12083625793457, "global_step": 314745, "epoch": 1873} {"train_loss": -11.804425239562988, "global_step": 314746, "epoch": 1873} {"train_loss": -12.226829528808594, "global_step": 314747, "epoch": 1873} {"train_loss": -12.298254013061523, "global_step": 314748, "epoch": 1873} {"train_loss": -12.168386459350586, "global_step": 314749, "epoch": 1873} {"train_loss": -12.229888916015625, "global_step": 314750, "epoch": 1873} {"train_loss": -12.257460594177246, "global_step": 314751, "epoch": 1873} {"train_loss": -12.010053634643555, "global_step": 314752, "epoch": 1873} {"train_loss": -12.015485763549805, "global_step": 314753, "epoch": 1873} {"train_loss": -12.332708358764648, "global_step": 314754, "epoch": 1873} {"train_loss": -12.14087963104248, "global_step": 314755, "epoch": 1873} {"train_loss": -12.046919822692871, "global_step": 314756, "epoch": 1873} {"train_loss": -12.179086685180664, "global_step": 314757, "epoch": 1873} {"train_loss": -12.08057975769043, "global_step": 314758, "epoch": 1873} {"train_loss": -12.094661712646484, "global_step": 314759, "epoch": 1873} {"train_loss": -12.263357162475586, "global_step": 314760, "epoch": 1873} {"train_loss": -12.25126838684082, "global_step": 314761, "epoch": 1873} {"train_loss": -12.3399658203125, "global_step": 314762, "epoch": 1873} {"train_loss": -12.465548515319824, "global_step": 314763, "epoch": 1873} {"train_loss": -12.543581008911133, "global_step": 314764, "epoch": 1873} {"train_loss": -12.482086181640625, "global_step": 314765, "epoch": 1873} {"train_loss": -12.476842880249023, "global_step": 314766, "epoch": 1873} {"train_loss": -12.44752311706543, "global_step": 314767, "epoch": 1873} {"train_loss": -12.561217308044434, "global_step": 314768, "epoch": 1873} {"train_loss": -12.347055435180664, "global_step": 314769, "epoch": 1873} {"train_loss": -12.51340389251709, "global_step": 314770, "epoch": 1873} {"train_loss": -12.539375305175781, "global_step": 314771, "epoch": 1873} {"train_loss": -12.284173965454102, "global_step": 314772, "epoch": 1873} {"train_loss": -12.455648422241211, "global_step": 314773, "epoch": 1873} {"train_loss": -12.409269332885742, "global_step": 314774, "epoch": 1873} {"train_loss": -12.300847053527832, "global_step": 314775, "epoch": 1873} {"train_loss": -12.139727592468262, "global_step": 314776, "epoch": 1873} {"train_loss": -12.33060073852539, "global_step": 314777, "epoch": 1873} {"train_loss": -11.736856460571289, "global_step": 314778, "epoch": 1873} {"train_loss": -12.033045768737793, "global_step": 314779, "epoch": 1873} {"train_loss": -12.08012580871582, "global_step": 314780, "epoch": 1873} {"train_loss": -11.857617378234863, "global_step": 314781, "epoch": 1873} {"train_loss": -12.229101181030273, "global_step": 314782, "epoch": 1873} {"train_loss": -12.140151977539062, "global_step": 314783, "epoch": 1873} {"train_loss": -11.391578674316406, "global_step": 314784, "epoch": 1873} {"train_loss": -11.61684513092041, "global_step": 314785, "epoch": 1873} {"train_loss": -12.061341285705566, "global_step": 314786, "epoch": 1873} {"train_loss": -11.422991752624512, "global_step": 314787, "epoch": 1873} {"train_loss": -10.909378051757812, "global_step": 314788, "epoch": 1873} {"train_loss": -11.682722091674805, "global_step": 314789, "epoch": 1873} {"train_loss": -11.496468544006348, "global_step": 314790, "epoch": 1873} {"train_loss": -10.997420310974121, "global_step": 314791, "epoch": 1873} {"train_loss": -10.848426818847656, "global_step": 314792, "epoch": 1873} {"train_loss": -11.197708129882812, "global_step": 314793, "epoch": 1873} {"train_loss": -8.328083992004395, "global_step": 314794, "epoch": 1873} {"train_loss": -8.397544860839844, "global_step": 314795, "epoch": 1873} {"train_loss": -8.440059661865234, "global_step": 314796, "epoch": 1873} {"train_loss": -10.017194747924805, "global_step": 314797, "epoch": 1873} {"train_loss": -10.140510559082031, "global_step": 314798, "epoch": 1873} {"train_loss": -8.732404708862305, "global_step": 314799, "epoch": 1873} {"train_loss": -9.313764572143555, "global_step": 314800, "epoch": 1873} {"train_loss": -9.907353401184082, "global_step": 314801, "epoch": 1873} {"train_loss": -10.645883560180664, "global_step": 314802, "epoch": 1873} {"train_loss": -10.399005889892578, "global_step": 314803, "epoch": 1873} {"train_loss": -10.446954727172852, "global_step": 314804, "epoch": 1873} {"train_loss": -11.00401496887207, "global_step": 314805, "epoch": 1873} {"train_loss": -9.987070083618164, "global_step": 314806, "epoch": 1873} {"train_loss": -10.601510047912598, "global_step": 314807, "epoch": 1873} {"train_loss": -10.616915702819824, "global_step": 314808, "epoch": 1873} {"train_loss": -10.413419723510742, "global_step": 314809, "epoch": 1873} {"train_loss": -10.565118789672852, "global_step": 314810, "epoch": 1873} {"train_loss": -11.450299263000488, "global_step": 314811, "epoch": 1873} {"train_loss": -10.733613967895508, "global_step": 314812, "epoch": 1873} {"train_loss": -11.677901268005371, "global_step": 314813, "epoch": 1873} {"train_loss": -10.548562049865723, "global_step": 314814, "epoch": 1873} {"train_loss": -11.358314514160156, "global_step": 314815, "epoch": 1873} {"train_loss": -11.243011474609375, "global_step": 314816, "epoch": 1873} {"train_loss": -10.95956039428711, "global_step": 314817, "epoch": 1873} {"train_loss": -11.199037551879883, "global_step": 314818, "epoch": 1873} {"train_loss": -10.710582733154297, "global_step": 314819, "epoch": 1873} {"train_loss": -10.398797035217285, "global_step": 314820, "epoch": 1873} {"train_loss": -10.144856452941895, "global_step": 314821, "epoch": 1873} {"train_loss": -10.39901065826416, "global_step": 314822, "epoch": 1873} {"train_loss": -10.486480712890625, "global_step": 314823, "epoch": 1873} {"train_loss": -10.291601181030273, "global_step": 314824, "epoch": 1873} {"train_loss": -10.92177963256836, "global_step": 314825, "epoch": 1873} {"train_loss": -10.396750450134277, "global_step": 314826, "epoch": 1873} {"train_loss": -11.118194580078125, "global_step": 314827, "epoch": 1873} {"train_loss": -9.907491683959961, "global_step": 314828, "epoch": 1873} {"train_loss": -11.435640335083008, "global_step": 314829, "epoch": 1873} {"train_loss": -9.711503982543945, "global_step": 314830, "epoch": 1873} {"train_loss": -11.584780483018784, "global_step": 314831, "epoch": 1873, "val_loss": 284131.3125} {"train_loss": -10.37904167175293, "global_step": 314832, "epoch": 1874} {"train_loss": -10.268526077270508, "global_step": 314833, "epoch": 1874} {"train_loss": -10.927377700805664, "global_step": 314834, "epoch": 1874} {"train_loss": -10.634745597839355, "global_step": 314835, "epoch": 1874} {"train_loss": -11.345888137817383, "global_step": 314836, "epoch": 1874} {"train_loss": -10.780904769897461, "global_step": 314837, "epoch": 1874} {"train_loss": -11.289894104003906, "global_step": 314838, "epoch": 1874} {"train_loss": -10.715652465820312, "global_step": 314839, "epoch": 1874} {"train_loss": -11.516233444213867, "global_step": 314840, "epoch": 1874} {"train_loss": -10.86452865600586, "global_step": 314841, "epoch": 1874} {"train_loss": -11.151321411132812, "global_step": 314842, "epoch": 1874} {"train_loss": -11.781490325927734, "global_step": 314843, "epoch": 1874} {"train_loss": -10.916802406311035, "global_step": 314844, "epoch": 1874} {"train_loss": -11.66263198852539, "global_step": 314845, "epoch": 1874} {"train_loss": -11.25286865234375, "global_step": 314846, "epoch": 1874} {"train_loss": -11.62918472290039, "global_step": 314847, "epoch": 1874} {"train_loss": -11.559881210327148, "global_step": 314848, "epoch": 1874} {"train_loss": -11.260725975036621, "global_step": 314849, "epoch": 1874} {"train_loss": -11.586294174194336, "global_step": 314850, "epoch": 1874} {"train_loss": -11.408575057983398, "global_step": 314851, "epoch": 1874} {"train_loss": -11.715853691101074, "global_step": 314852, "epoch": 1874} {"train_loss": -11.34839916229248, "global_step": 314853, "epoch": 1874} {"train_loss": -11.922086715698242, "global_step": 314854, "epoch": 1874} {"train_loss": -11.705975532531738, "global_step": 314855, "epoch": 1874} {"train_loss": -11.590444564819336, "global_step": 314856, "epoch": 1874} {"train_loss": -11.780256271362305, "global_step": 314857, "epoch": 1874} {"train_loss": -11.944860458374023, "global_step": 314858, "epoch": 1874} {"train_loss": -11.768659591674805, "global_step": 314859, "epoch": 1874} {"train_loss": -12.124982833862305, "global_step": 314860, "epoch": 1874} {"train_loss": -11.954978942871094, "global_step": 314861, "epoch": 1874} {"train_loss": -11.837892532348633, "global_step": 314862, "epoch": 1874} {"train_loss": -11.859440803527832, "global_step": 314863, "epoch": 1874} {"train_loss": -11.750007629394531, "global_step": 314864, "epoch": 1874} {"train_loss": -11.815083503723145, "global_step": 314865, "epoch": 1874} {"train_loss": -12.031712532043457, "global_step": 314866, "epoch": 1874} {"train_loss": -12.116986274719238, "global_step": 314867, "epoch": 1874} {"train_loss": -12.11292839050293, "global_step": 314868, "epoch": 1874} {"train_loss": -12.035804748535156, "global_step": 314869, "epoch": 1874} {"train_loss": -11.981705665588379, "global_step": 314870, "epoch": 1874} {"train_loss": -12.253460884094238, "global_step": 314871, "epoch": 1874} {"train_loss": -12.29813003540039, "global_step": 314872, "epoch": 1874} {"train_loss": -12.226949691772461, "global_step": 314873, "epoch": 1874} {"train_loss": -12.151297569274902, "global_step": 314874, "epoch": 1874} {"train_loss": -12.059327125549316, "global_step": 314875, "epoch": 1874} {"train_loss": -11.9962158203125, "global_step": 314876, "epoch": 1874} {"train_loss": -12.061136245727539, "global_step": 314877, "epoch": 1874} {"train_loss": -12.317124366760254, "global_step": 314878, "epoch": 1874} {"train_loss": -12.196480751037598, "global_step": 314879, "epoch": 1874} {"train_loss": -12.286425590515137, "global_step": 314880, "epoch": 1874} {"train_loss": -12.08012580871582, "global_step": 314881, "epoch": 1874} {"train_loss": -12.365588188171387, "global_step": 314882, "epoch": 1874} {"train_loss": -12.140597343444824, "global_step": 314883, "epoch": 1874} {"train_loss": -12.318035125732422, "global_step": 314884, "epoch": 1874} {"train_loss": -12.371613502502441, "global_step": 314885, "epoch": 1874} {"train_loss": -12.295013427734375, "global_step": 314886, "epoch": 1874} {"train_loss": -12.211210250854492, "global_step": 314887, "epoch": 1874} {"train_loss": -12.298075675964355, "global_step": 314888, "epoch": 1874} {"train_loss": -12.40457534790039, "global_step": 314889, "epoch": 1874} {"train_loss": -12.430047988891602, "global_step": 314890, "epoch": 1874} {"train_loss": -12.347304344177246, "global_step": 314891, "epoch": 1874} {"train_loss": -12.266212463378906, "global_step": 314892, "epoch": 1874} {"train_loss": -12.470932960510254, "global_step": 314893, "epoch": 1874} {"train_loss": -12.527007102966309, "global_step": 314894, "epoch": 1874} {"train_loss": -12.340795516967773, "global_step": 314895, "epoch": 1874} {"train_loss": -12.44991683959961, "global_step": 314896, "epoch": 1874} {"train_loss": -12.44355583190918, "global_step": 314897, "epoch": 1874} {"train_loss": -12.510852813720703, "global_step": 314898, "epoch": 1874} {"train_loss": -12.381094932556152, "global_step": 314899, "epoch": 1874} {"train_loss": -12.299304962158203, "global_step": 314900, "epoch": 1874} {"train_loss": -12.55165958404541, "global_step": 314901, "epoch": 1874} {"train_loss": -12.417284965515137, "global_step": 314902, "epoch": 1874} {"train_loss": -12.394026756286621, "global_step": 314903, "epoch": 1874} {"train_loss": -12.288700103759766, "global_step": 314904, "epoch": 1874} {"train_loss": -12.423276901245117, "global_step": 314905, "epoch": 1874} {"train_loss": -12.325765609741211, "global_step": 314906, "epoch": 1874} {"train_loss": -12.353546142578125, "global_step": 314907, "epoch": 1874} {"train_loss": -12.389715194702148, "global_step": 314908, "epoch": 1874} {"train_loss": -12.523308753967285, "global_step": 314909, "epoch": 1874} {"train_loss": -12.376785278320312, "global_step": 314910, "epoch": 1874} {"train_loss": -12.43774127960205, "global_step": 314911, "epoch": 1874} {"train_loss": -12.5252685546875, "global_step": 314912, "epoch": 1874} {"train_loss": -11.970335006713867, "global_step": 314913, "epoch": 1874} {"train_loss": -12.50703239440918, "global_step": 314914, "epoch": 1874} {"train_loss": -12.519059181213379, "global_step": 314915, "epoch": 1874} {"train_loss": -12.305276870727539, "global_step": 314916, "epoch": 1874} {"train_loss": -12.398014068603516, "global_step": 314917, "epoch": 1874} {"train_loss": -12.38115119934082, "global_step": 314918, "epoch": 1874} {"train_loss": -12.42856502532959, "global_step": 314919, "epoch": 1874} {"train_loss": -12.484471321105957, "global_step": 314920, "epoch": 1874} {"train_loss": -12.297679901123047, "global_step": 314921, "epoch": 1874} {"train_loss": -12.586181640625, "global_step": 314922, "epoch": 1874} {"train_loss": -12.290513038635254, "global_step": 314923, "epoch": 1874} {"train_loss": -12.436380386352539, "global_step": 314924, "epoch": 1874} {"train_loss": -12.403192520141602, "global_step": 314925, "epoch": 1874} {"train_loss": -12.409666061401367, "global_step": 314926, "epoch": 1874} {"train_loss": -12.397797584533691, "global_step": 314927, "epoch": 1874} {"train_loss": -12.586893081665039, "global_step": 314928, "epoch": 1874} {"train_loss": -12.467084884643555, "global_step": 314929, "epoch": 1874} {"train_loss": -12.600793838500977, "global_step": 314930, "epoch": 1874} {"train_loss": -11.990211486816406, "global_step": 314931, "epoch": 1874} {"train_loss": -12.44090461730957, "global_step": 314932, "epoch": 1874} {"train_loss": -12.484724044799805, "global_step": 314933, "epoch": 1874} {"train_loss": -12.529064178466797, "global_step": 314934, "epoch": 1874} {"train_loss": -11.784698486328125, "global_step": 314935, "epoch": 1874} {"train_loss": -11.796566009521484, "global_step": 314936, "epoch": 1874} {"train_loss": -12.114954948425293, "global_step": 314937, "epoch": 1874} {"train_loss": -12.226381301879883, "global_step": 314938, "epoch": 1874} {"train_loss": -12.107990264892578, "global_step": 314939, "epoch": 1874} {"train_loss": -11.707477569580078, "global_step": 314940, "epoch": 1874} {"train_loss": -12.039764404296875, "global_step": 314941, "epoch": 1874} {"train_loss": -12.492240905761719, "global_step": 314942, "epoch": 1874} {"train_loss": -11.92164421081543, "global_step": 314943, "epoch": 1874} {"train_loss": -12.288061141967773, "global_step": 314944, "epoch": 1874} {"train_loss": -11.273605346679688, "global_step": 314945, "epoch": 1874} {"train_loss": -11.99531364440918, "global_step": 314946, "epoch": 1874} {"train_loss": -12.274055480957031, "global_step": 314947, "epoch": 1874} {"train_loss": -12.272367477416992, "global_step": 314948, "epoch": 1874} {"train_loss": -11.823308944702148, "global_step": 314949, "epoch": 1874} {"train_loss": -10.963894844055176, "global_step": 314950, "epoch": 1874} {"train_loss": -11.997941970825195, "global_step": 314951, "epoch": 1874} {"train_loss": -11.361473083496094, "global_step": 314952, "epoch": 1874} {"train_loss": -11.437800407409668, "global_step": 314953, "epoch": 1874} {"train_loss": -10.422747611999512, "global_step": 314954, "epoch": 1874} {"train_loss": -10.097991943359375, "global_step": 314955, "epoch": 1874} {"train_loss": -11.088300704956055, "global_step": 314956, "epoch": 1874} {"train_loss": -9.078901290893555, "global_step": 314957, "epoch": 1874} {"train_loss": -10.006204605102539, "global_step": 314958, "epoch": 1874} {"train_loss": -8.762613296508789, "global_step": 314959, "epoch": 1874} {"train_loss": -10.502128601074219, "global_step": 314960, "epoch": 1874} {"train_loss": -10.024744987487793, "global_step": 314961, "epoch": 1874} {"train_loss": -9.745237350463867, "global_step": 314962, "epoch": 1874} {"train_loss": -8.736067771911621, "global_step": 314963, "epoch": 1874} {"train_loss": -10.683164596557617, "global_step": 314964, "epoch": 1874} {"train_loss": -10.875019073486328, "global_step": 314965, "epoch": 1874} {"train_loss": -9.657012939453125, "global_step": 314966, "epoch": 1874} {"train_loss": -10.668176651000977, "global_step": 314967, "epoch": 1874} {"train_loss": -10.710102081298828, "global_step": 314968, "epoch": 1874} {"train_loss": -9.559499740600586, "global_step": 314969, "epoch": 1874} {"train_loss": -10.898480415344238, "global_step": 314970, "epoch": 1874} {"train_loss": -9.751317024230957, "global_step": 314971, "epoch": 1874} {"train_loss": -10.746123313903809, "global_step": 314972, "epoch": 1874} {"train_loss": -10.216876983642578, "global_step": 314973, "epoch": 1874} {"train_loss": -10.954282760620117, "global_step": 314974, "epoch": 1874} {"train_loss": -10.462944984436035, "global_step": 314975, "epoch": 1874} {"train_loss": -11.287851333618164, "global_step": 314976, "epoch": 1874} {"train_loss": -11.108020782470703, "global_step": 314977, "epoch": 1874} {"train_loss": -10.605436325073242, "global_step": 314978, "epoch": 1874} {"train_loss": -11.08507251739502, "global_step": 314979, "epoch": 1874} {"train_loss": -11.31190299987793, "global_step": 314980, "epoch": 1874} {"train_loss": -10.713106155395508, "global_step": 314981, "epoch": 1874} {"train_loss": -11.273397445678711, "global_step": 314982, "epoch": 1874} {"train_loss": -11.545129776000977, "global_step": 314983, "epoch": 1874} {"train_loss": -11.432647705078125, "global_step": 314984, "epoch": 1874} {"train_loss": -11.214296340942383, "global_step": 314985, "epoch": 1874} {"train_loss": -11.379150390625, "global_step": 314986, "epoch": 1874} {"train_loss": -11.401739120483398, "global_step": 314987, "epoch": 1874} {"train_loss": -11.673267364501953, "global_step": 314988, "epoch": 1874} {"train_loss": -11.678173065185547, "global_step": 314989, "epoch": 1874} {"train_loss": -11.558045387268066, "global_step": 314990, "epoch": 1874} {"train_loss": -11.8129301071167, "global_step": 314991, "epoch": 1874} {"train_loss": -11.874613761901855, "global_step": 314992, "epoch": 1874} {"train_loss": -11.472334861755371, "global_step": 314993, "epoch": 1874} {"train_loss": -11.852686882019043, "global_step": 314994, "epoch": 1874} {"train_loss": -11.716524124145508, "global_step": 314995, "epoch": 1874} {"train_loss": -11.78913688659668, "global_step": 314996, "epoch": 1874} {"train_loss": -11.689724922180176, "global_step": 314997, "epoch": 1874} {"train_loss": -12.049997329711914, "global_step": 314998, "epoch": 1874} {"train_loss": -11.690621285211472, "global_step": 314999, "epoch": 1874, "val_loss": 272729.28125} {"train_loss": -12.067072868347168, "global_step": 315000, "epoch": 1875} {"train_loss": -11.541757583618164, "global_step": 315001, "epoch": 1875} {"train_loss": -12.04698657989502, "global_step": 315002, "epoch": 1875} {"train_loss": -11.92867374420166, "global_step": 315003, "epoch": 1875} {"train_loss": -11.967714309692383, "global_step": 315004, "epoch": 1875} {"train_loss": -12.10228157043457, "global_step": 315005, "epoch": 1875} {"train_loss": -11.77134895324707, "global_step": 315006, "epoch": 1875} {"train_loss": -12.264652252197266, "global_step": 315007, "epoch": 1875} {"train_loss": -12.062382698059082, "global_step": 315008, "epoch": 1875} {"train_loss": -11.825393676757812, "global_step": 315009, "epoch": 1875} {"train_loss": -12.084546089172363, "global_step": 315010, "epoch": 1875} {"train_loss": -11.798334121704102, "global_step": 315011, "epoch": 1875} {"train_loss": -11.951387405395508, "global_step": 315012, "epoch": 1875} {"train_loss": -12.113130569458008, "global_step": 315013, "epoch": 1875} {"train_loss": -11.707275390625, "global_step": 315014, "epoch": 1875} {"train_loss": -12.29444408416748, "global_step": 315015, "epoch": 1875} {"train_loss": -12.0964994430542, "global_step": 315016, "epoch": 1875} {"train_loss": -12.322269439697266, "global_step": 315017, "epoch": 1875} {"train_loss": -12.089889526367188, "global_step": 315018, "epoch": 1875} {"train_loss": -12.116737365722656, "global_step": 315019, "epoch": 1875} {"train_loss": -11.776121139526367, "global_step": 315020, "epoch": 1875} {"train_loss": -12.279345512390137, "global_step": 315021, "epoch": 1875} {"train_loss": -11.93862533569336, "global_step": 315022, "epoch": 1875} {"train_loss": -12.450920104980469, "global_step": 315023, "epoch": 1875} {"train_loss": -11.82070541381836, "global_step": 315024, "epoch": 1875} {"train_loss": -12.075281143188477, "global_step": 315025, "epoch": 1875} {"train_loss": -11.88228988647461, "global_step": 315026, "epoch": 1875} {"train_loss": -12.373403549194336, "global_step": 315027, "epoch": 1875} {"train_loss": -11.667157173156738, "global_step": 315028, "epoch": 1875} {"train_loss": -12.093684196472168, "global_step": 315029, "epoch": 1875} {"train_loss": -11.956888198852539, "global_step": 315030, "epoch": 1875} {"train_loss": -11.8621187210083, "global_step": 315031, "epoch": 1875} {"train_loss": -12.028428077697754, "global_step": 315032, "epoch": 1875} {"train_loss": -11.97197437286377, "global_step": 315033, "epoch": 1875} {"train_loss": -12.114301681518555, "global_step": 315034, "epoch": 1875} {"train_loss": -12.029989242553711, "global_step": 315035, "epoch": 1875} {"train_loss": -11.962278366088867, "global_step": 315036, "epoch": 1875} {"train_loss": -11.615189552307129, "global_step": 315037, "epoch": 1875} {"train_loss": -12.354930877685547, "global_step": 315038, "epoch": 1875} {"train_loss": -12.024971961975098, "global_step": 315039, "epoch": 1875} {"train_loss": -11.963672637939453, "global_step": 315040, "epoch": 1875} {"train_loss": -12.067794799804688, "global_step": 315041, "epoch": 1875} {"train_loss": -12.093104362487793, "global_step": 315042, "epoch": 1875} {"train_loss": -11.898663520812988, "global_step": 315043, "epoch": 1875} {"train_loss": -12.201875686645508, "global_step": 315044, "epoch": 1875} {"train_loss": -11.944435119628906, "global_step": 315045, "epoch": 1875} {"train_loss": -12.009735107421875, "global_step": 315046, "epoch": 1875} {"train_loss": -12.222002983093262, "global_step": 315047, "epoch": 1875} {"train_loss": -12.392698287963867, "global_step": 315048, "epoch": 1875} {"train_loss": -12.43120002746582, "global_step": 315049, "epoch": 1875} {"train_loss": -12.44943618774414, "global_step": 315050, "epoch": 1875} {"train_loss": -12.121374130249023, "global_step": 315051, "epoch": 1875} {"train_loss": -12.139907836914062, "global_step": 315052, "epoch": 1875} {"train_loss": -12.380937576293945, "global_step": 315053, "epoch": 1875} {"train_loss": -12.284561157226562, "global_step": 315054, "epoch": 1875} {"train_loss": -12.144552230834961, "global_step": 315055, "epoch": 1875} {"train_loss": -12.092636108398438, "global_step": 315056, "epoch": 1875} {"train_loss": -12.281852722167969, "global_step": 315057, "epoch": 1875} {"train_loss": -12.250147819519043, "global_step": 315058, "epoch": 1875} {"train_loss": -12.394441604614258, "global_step": 315059, "epoch": 1875} {"train_loss": -12.349569320678711, "global_step": 315060, "epoch": 1875} {"train_loss": -12.210142135620117, "global_step": 315061, "epoch": 1875} {"train_loss": -12.362716674804688, "global_step": 315062, "epoch": 1875} {"train_loss": -12.348932266235352, "global_step": 315063, "epoch": 1875} {"train_loss": -12.055999755859375, "global_step": 315064, "epoch": 1875} {"train_loss": -12.23324203491211, "global_step": 315065, "epoch": 1875} {"train_loss": -12.018022537231445, "global_step": 315066, "epoch": 1875} {"train_loss": -12.026472091674805, "global_step": 315067, "epoch": 1875} {"train_loss": -12.403498649597168, "global_step": 315068, "epoch": 1875} {"train_loss": -12.175934791564941, "global_step": 315069, "epoch": 1875} {"train_loss": -12.262187957763672, "global_step": 315070, "epoch": 1875} {"train_loss": -12.20677375793457, "global_step": 315071, "epoch": 1875} {"train_loss": -12.618912696838379, "global_step": 315072, "epoch": 1875} {"train_loss": -12.29006576538086, "global_step": 315073, "epoch": 1875} {"train_loss": -12.031647682189941, "global_step": 315074, "epoch": 1875} {"train_loss": -11.959997177124023, "global_step": 315075, "epoch": 1875} {"train_loss": -12.483417510986328, "global_step": 315076, "epoch": 1875} {"train_loss": -12.190445899963379, "global_step": 315077, "epoch": 1875} {"train_loss": -12.419021606445312, "global_step": 315078, "epoch": 1875} {"train_loss": -11.920723915100098, "global_step": 315079, "epoch": 1875} {"train_loss": -11.999626159667969, "global_step": 315080, "epoch": 1875} {"train_loss": -11.947717666625977, "global_step": 315081, "epoch": 1875} {"train_loss": -12.029722213745117, "global_step": 315082, "epoch": 1875} {"train_loss": -12.177651405334473, "global_step": 315083, "epoch": 1875} {"train_loss": -11.903732299804688, "global_step": 315084, "epoch": 1875} {"train_loss": -11.762033462524414, "global_step": 315085, "epoch": 1875} {"train_loss": -11.412771224975586, "global_step": 315086, "epoch": 1875} {"train_loss": -11.892473220825195, "global_step": 315087, "epoch": 1875} {"train_loss": -11.119025230407715, "global_step": 315088, "epoch": 1875} {"train_loss": -11.958382606506348, "global_step": 315089, "epoch": 1875} {"train_loss": -11.74075698852539, "global_step": 315090, "epoch": 1875} {"train_loss": -11.409149169921875, "global_step": 315091, "epoch": 1875} {"train_loss": -11.00617790222168, "global_step": 315092, "epoch": 1875} {"train_loss": -11.803435325622559, "global_step": 315093, "epoch": 1875} {"train_loss": -11.995166778564453, "global_step": 315094, "epoch": 1875} {"train_loss": -10.836421012878418, "global_step": 315095, "epoch": 1875} {"train_loss": -10.829504013061523, "global_step": 315096, "epoch": 1875} {"train_loss": -11.018728256225586, "global_step": 315097, "epoch": 1875} {"train_loss": -11.94494915008545, "global_step": 315098, "epoch": 1875} {"train_loss": -11.547407150268555, "global_step": 315099, "epoch": 1875} {"train_loss": -11.678836822509766, "global_step": 315100, "epoch": 1875} {"train_loss": -12.09992790222168, "global_step": 315101, "epoch": 1875} {"train_loss": -11.408400535583496, "global_step": 315102, "epoch": 1875} {"train_loss": -11.520059585571289, "global_step": 315103, "epoch": 1875} {"train_loss": -11.321951866149902, "global_step": 315104, "epoch": 1875} {"train_loss": -11.853975296020508, "global_step": 315105, "epoch": 1875} {"train_loss": -11.574289321899414, "global_step": 315106, "epoch": 1875} {"train_loss": -12.1787748336792, "global_step": 315107, "epoch": 1875} {"train_loss": -11.043452262878418, "global_step": 315108, "epoch": 1875} {"train_loss": -12.158632278442383, "global_step": 315109, "epoch": 1875} {"train_loss": -11.334178924560547, "global_step": 315110, "epoch": 1875} {"train_loss": -12.206268310546875, "global_step": 315111, "epoch": 1875} {"train_loss": -12.218242645263672, "global_step": 315112, "epoch": 1875} {"train_loss": -11.686214447021484, "global_step": 315113, "epoch": 1875} {"train_loss": -12.052446365356445, "global_step": 315114, "epoch": 1875} {"train_loss": -12.012672424316406, "global_step": 315115, "epoch": 1875} {"train_loss": -11.908597946166992, "global_step": 315116, "epoch": 1875} {"train_loss": -11.763225555419922, "global_step": 315117, "epoch": 1875} {"train_loss": -11.91097640991211, "global_step": 315118, "epoch": 1875} {"train_loss": -12.334182739257812, "global_step": 315119, "epoch": 1875} {"train_loss": -12.299135208129883, "global_step": 315120, "epoch": 1875} {"train_loss": -12.227880477905273, "global_step": 315121, "epoch": 1875} {"train_loss": -12.100183486938477, "global_step": 315122, "epoch": 1875} {"train_loss": -12.273175239562988, "global_step": 315123, "epoch": 1875} {"train_loss": -11.531679153442383, "global_step": 315124, "epoch": 1875} {"train_loss": -12.022696495056152, "global_step": 315125, "epoch": 1875} {"train_loss": -11.69875717163086, "global_step": 315126, "epoch": 1875} {"train_loss": -11.956295013427734, "global_step": 315127, "epoch": 1875} {"train_loss": -11.978307723999023, "global_step": 315128, "epoch": 1875} {"train_loss": -11.902654647827148, "global_step": 315129, "epoch": 1875} {"train_loss": -12.093755722045898, "global_step": 315130, "epoch": 1875} {"train_loss": -12.151317596435547, "global_step": 315131, "epoch": 1875} {"train_loss": -11.94198989868164, "global_step": 315132, "epoch": 1875} {"train_loss": -11.934950828552246, "global_step": 315133, "epoch": 1875} {"train_loss": -11.899572372436523, "global_step": 315134, "epoch": 1875} {"train_loss": -11.731435775756836, "global_step": 315135, "epoch": 1875} {"train_loss": -12.013765335083008, "global_step": 315136, "epoch": 1875} {"train_loss": -12.064648628234863, "global_step": 315137, "epoch": 1875} {"train_loss": -11.581502914428711, "global_step": 315138, "epoch": 1875} {"train_loss": -11.91307258605957, "global_step": 315139, "epoch": 1875} {"train_loss": -12.230443000793457, "global_step": 315140, "epoch": 1875} {"train_loss": -11.652469635009766, "global_step": 315141, "epoch": 1875} {"train_loss": -12.06208610534668, "global_step": 315142, "epoch": 1875} {"train_loss": -12.113367080688477, "global_step": 315143, "epoch": 1875} {"train_loss": -11.695699691772461, "global_step": 315144, "epoch": 1875} {"train_loss": -11.921309471130371, "global_step": 315145, "epoch": 1875} {"train_loss": -11.834672927856445, "global_step": 315146, "epoch": 1875} {"train_loss": -12.237974166870117, "global_step": 315147, "epoch": 1875} {"train_loss": -11.984498977661133, "global_step": 315148, "epoch": 1875} {"train_loss": -11.696224212646484, "global_step": 315149, "epoch": 1875} {"train_loss": -12.370125770568848, "global_step": 315150, "epoch": 1875} {"train_loss": -11.538142204284668, "global_step": 315151, "epoch": 1875} {"train_loss": -11.698087692260742, "global_step": 315152, "epoch": 1875} {"train_loss": -11.762489318847656, "global_step": 315153, "epoch": 1875} {"train_loss": -10.464807510375977, "global_step": 315154, "epoch": 1875} {"train_loss": -12.039127349853516, "global_step": 315155, "epoch": 1875} {"train_loss": -10.900361061096191, "global_step": 315156, "epoch": 1875} {"train_loss": -11.923288345336914, "global_step": 315157, "epoch": 1875} {"train_loss": -10.592681884765625, "global_step": 315158, "epoch": 1875} {"train_loss": -12.156135559082031, "global_step": 315159, "epoch": 1875} {"train_loss": -11.355766296386719, "global_step": 315160, "epoch": 1875} {"train_loss": -11.7620267868042, "global_step": 315161, "epoch": 1875} {"train_loss": -11.366600036621094, "global_step": 315162, "epoch": 1875} {"train_loss": -11.474874496459961, "global_step": 315163, "epoch": 1875} {"train_loss": -11.953920364379883, "global_step": 315164, "epoch": 1875} {"train_loss": -10.952367782592773, "global_step": 315165, "epoch": 1875} {"train_loss": -11.697717666625977, "global_step": 315166, "epoch": 1875} {"train_loss": -11.920704359099979, "global_step": 315167, "epoch": 1875, "val_loss": 277498.75, "train_action_mse_error": 0.7162135243415833} {"train_loss": -11.01968002319336, "global_step": 315168, "epoch": 1876} {"train_loss": -11.462785720825195, "global_step": 315169, "epoch": 1876} {"train_loss": -11.493096351623535, "global_step": 315170, "epoch": 1876} {"train_loss": -11.66836166381836, "global_step": 315171, "epoch": 1876} {"train_loss": -11.580650329589844, "global_step": 315172, "epoch": 1876} {"train_loss": -11.66543197631836, "global_step": 315173, "epoch": 1876} {"train_loss": -11.523481369018555, "global_step": 315174, "epoch": 1876} {"train_loss": -11.65945053100586, "global_step": 315175, "epoch": 1876} {"train_loss": -11.413856506347656, "global_step": 315176, "epoch": 1876} {"train_loss": -11.553377151489258, "global_step": 315177, "epoch": 1876} {"train_loss": -11.745113372802734, "global_step": 315178, "epoch": 1876} {"train_loss": -11.466349601745605, "global_step": 315179, "epoch": 1876} {"train_loss": -11.747106552124023, "global_step": 315180, "epoch": 1876} {"train_loss": -11.783697128295898, "global_step": 315181, "epoch": 1876} {"train_loss": -11.931703567504883, "global_step": 315182, "epoch": 1876} {"train_loss": -11.575035095214844, "global_step": 315183, "epoch": 1876} {"train_loss": -11.858427047729492, "global_step": 315184, "epoch": 1876} {"train_loss": -11.313901901245117, "global_step": 315185, "epoch": 1876} {"train_loss": -11.615983963012695, "global_step": 315186, "epoch": 1876} {"train_loss": -11.38624382019043, "global_step": 315187, "epoch": 1876} {"train_loss": -10.986921310424805, "global_step": 315188, "epoch": 1876} {"train_loss": -11.656238555908203, "global_step": 315189, "epoch": 1876} {"train_loss": -10.725658416748047, "global_step": 315190, "epoch": 1876} {"train_loss": -11.646065711975098, "global_step": 315191, "epoch": 1876} {"train_loss": -10.559440612792969, "global_step": 315192, "epoch": 1876} {"train_loss": -11.750407218933105, "global_step": 315193, "epoch": 1876} {"train_loss": -10.368940353393555, "global_step": 315194, "epoch": 1876} {"train_loss": -11.60505199432373, "global_step": 315195, "epoch": 1876} {"train_loss": -10.569868087768555, "global_step": 315196, "epoch": 1876} {"train_loss": -12.053093910217285, "global_step": 315197, "epoch": 1876} {"train_loss": -10.952643394470215, "global_step": 315198, "epoch": 1876} {"train_loss": -11.9446439743042, "global_step": 315199, "epoch": 1876} {"train_loss": -11.370458602905273, "global_step": 315200, "epoch": 1876} {"train_loss": -11.857521057128906, "global_step": 315201, "epoch": 1876} {"train_loss": -10.921026229858398, "global_step": 315202, "epoch": 1876} {"train_loss": -12.125984191894531, "global_step": 315203, "epoch": 1876} {"train_loss": -10.81541633605957, "global_step": 315204, "epoch": 1876} {"train_loss": -11.967178344726562, "global_step": 315205, "epoch": 1876} {"train_loss": -11.524049758911133, "global_step": 315206, "epoch": 1876} {"train_loss": -11.237457275390625, "global_step": 315207, "epoch": 1876} {"train_loss": -11.809518814086914, "global_step": 315208, "epoch": 1876} {"train_loss": -11.395115852355957, "global_step": 315209, "epoch": 1876} {"train_loss": -11.638532638549805, "global_step": 315210, "epoch": 1876} {"train_loss": -11.749765396118164, "global_step": 315211, "epoch": 1876} {"train_loss": -11.307731628417969, "global_step": 315212, "epoch": 1876} {"train_loss": -11.952710151672363, "global_step": 315213, "epoch": 1876} {"train_loss": -11.699009895324707, "global_step": 315214, "epoch": 1876} {"train_loss": -11.717281341552734, "global_step": 315215, "epoch": 1876} {"train_loss": -12.1112060546875, "global_step": 315216, "epoch": 1876} {"train_loss": -11.993778228759766, "global_step": 315217, "epoch": 1876} {"train_loss": -12.140240669250488, "global_step": 315218, "epoch": 1876} {"train_loss": -12.228375434875488, "global_step": 315219, "epoch": 1876} {"train_loss": -12.175543785095215, "global_step": 315220, "epoch": 1876} {"train_loss": -12.093090057373047, "global_step": 315221, "epoch": 1876} {"train_loss": -12.372726440429688, "global_step": 315222, "epoch": 1876} {"train_loss": -12.027112007141113, "global_step": 315223, "epoch": 1876} {"train_loss": -12.114028930664062, "global_step": 315224, "epoch": 1876} {"train_loss": -12.179685592651367, "global_step": 315225, "epoch": 1876} {"train_loss": -12.045455932617188, "global_step": 315226, "epoch": 1876} {"train_loss": -12.406109809875488, "global_step": 315227, "epoch": 1876} {"train_loss": -12.22941780090332, "global_step": 315228, "epoch": 1876} {"train_loss": -12.086834907531738, "global_step": 315229, "epoch": 1876} {"train_loss": -11.977811813354492, "global_step": 315230, "epoch": 1876} {"train_loss": -12.21636962890625, "global_step": 315231, "epoch": 1876} {"train_loss": -12.185932159423828, "global_step": 315232, "epoch": 1876} {"train_loss": -12.13139820098877, "global_step": 315233, "epoch": 1876} {"train_loss": -12.236188888549805, "global_step": 315234, "epoch": 1876} {"train_loss": -12.04655933380127, "global_step": 315235, "epoch": 1876} {"train_loss": -12.192211151123047, "global_step": 315236, "epoch": 1876} {"train_loss": -12.109966278076172, "global_step": 315237, "epoch": 1876} {"train_loss": -12.216599464416504, "global_step": 315238, "epoch": 1876} {"train_loss": -11.924384117126465, "global_step": 315239, "epoch": 1876} {"train_loss": -11.856821060180664, "global_step": 315240, "epoch": 1876} {"train_loss": -12.253738403320312, "global_step": 315241, "epoch": 1876} {"train_loss": -12.129049301147461, "global_step": 315242, "epoch": 1876} {"train_loss": -11.687463760375977, "global_step": 315243, "epoch": 1876} {"train_loss": -12.167665481567383, "global_step": 315244, "epoch": 1876} {"train_loss": -11.973871231079102, "global_step": 315245, "epoch": 1876} {"train_loss": -10.641172409057617, "global_step": 315246, "epoch": 1876} {"train_loss": -12.13939094543457, "global_step": 315247, "epoch": 1876} {"train_loss": -10.906513214111328, "global_step": 315248, "epoch": 1876} {"train_loss": -11.521017074584961, "global_step": 315249, "epoch": 1876} {"train_loss": -11.826563835144043, "global_step": 315250, "epoch": 1876} {"train_loss": -11.371959686279297, "global_step": 315251, "epoch": 1876} {"train_loss": -11.080770492553711, "global_step": 315252, "epoch": 1876} {"train_loss": -12.240730285644531, "global_step": 315253, "epoch": 1876} {"train_loss": -11.795310974121094, "global_step": 315254, "epoch": 1876} {"train_loss": -12.059663772583008, "global_step": 315255, "epoch": 1876} {"train_loss": -12.116363525390625, "global_step": 315256, "epoch": 1876} {"train_loss": -12.2884521484375, "global_step": 315257, "epoch": 1876} {"train_loss": -12.236772537231445, "global_step": 315258, "epoch": 1876} {"train_loss": -11.875482559204102, "global_step": 315259, "epoch": 1876} {"train_loss": -12.050415992736816, "global_step": 315260, "epoch": 1876} {"train_loss": -12.230878829956055, "global_step": 315261, "epoch": 1876} {"train_loss": -11.762994766235352, "global_step": 315262, "epoch": 1876} {"train_loss": -12.129968643188477, "global_step": 315263, "epoch": 1876} {"train_loss": -11.946303367614746, "global_step": 315264, "epoch": 1876} {"train_loss": -12.192522048950195, "global_step": 315265, "epoch": 1876} {"train_loss": -12.135966300964355, "global_step": 315266, "epoch": 1876} {"train_loss": -12.403096199035645, "global_step": 315267, "epoch": 1876} {"train_loss": -11.891794204711914, "global_step": 315268, "epoch": 1876} {"train_loss": -12.16738510131836, "global_step": 315269, "epoch": 1876} {"train_loss": -12.158364295959473, "global_step": 315270, "epoch": 1876} {"train_loss": -12.135900497436523, "global_step": 315271, "epoch": 1876} {"train_loss": -12.191926002502441, "global_step": 315272, "epoch": 1876} {"train_loss": -12.31114387512207, "global_step": 315273, "epoch": 1876} {"train_loss": -12.283327102661133, "global_step": 315274, "epoch": 1876} {"train_loss": -12.192059516906738, "global_step": 315275, "epoch": 1876} {"train_loss": -12.18728256225586, "global_step": 315276, "epoch": 1876} {"train_loss": -12.314342498779297, "global_step": 315277, "epoch": 1876} {"train_loss": -12.161664962768555, "global_step": 315278, "epoch": 1876} {"train_loss": -12.318544387817383, "global_step": 315279, "epoch": 1876} {"train_loss": -11.80975341796875, "global_step": 315280, "epoch": 1876} {"train_loss": -12.425210952758789, "global_step": 315281, "epoch": 1876} {"train_loss": -11.831412315368652, "global_step": 315282, "epoch": 1876} {"train_loss": -11.268206596374512, "global_step": 315283, "epoch": 1876} {"train_loss": -12.040218353271484, "global_step": 315284, "epoch": 1876} {"train_loss": -12.306066513061523, "global_step": 315285, "epoch": 1876} {"train_loss": -11.455666542053223, "global_step": 315286, "epoch": 1876} {"train_loss": -12.143491744995117, "global_step": 315287, "epoch": 1876} {"train_loss": -12.307840347290039, "global_step": 315288, "epoch": 1876} {"train_loss": -11.370306015014648, "global_step": 315289, "epoch": 1876} {"train_loss": -12.181408882141113, "global_step": 315290, "epoch": 1876} {"train_loss": -11.807222366333008, "global_step": 315291, "epoch": 1876} {"train_loss": -12.13694953918457, "global_step": 315292, "epoch": 1876} {"train_loss": -11.594649314880371, "global_step": 315293, "epoch": 1876} {"train_loss": -11.962312698364258, "global_step": 315294, "epoch": 1876} {"train_loss": -11.95803451538086, "global_step": 315295, "epoch": 1876} {"train_loss": -11.88511848449707, "global_step": 315296, "epoch": 1876} {"train_loss": -11.829951286315918, "global_step": 315297, "epoch": 1876} {"train_loss": -12.031064987182617, "global_step": 315298, "epoch": 1876} {"train_loss": -11.769521713256836, "global_step": 315299, "epoch": 1876} {"train_loss": -11.603959083557129, "global_step": 315300, "epoch": 1876} {"train_loss": -11.719711303710938, "global_step": 315301, "epoch": 1876} {"train_loss": -11.710132598876953, "global_step": 315302, "epoch": 1876} {"train_loss": -12.179964065551758, "global_step": 315303, "epoch": 1876} {"train_loss": -11.976602554321289, "global_step": 315304, "epoch": 1876} {"train_loss": -11.448471069335938, "global_step": 315305, "epoch": 1876} {"train_loss": -12.088577270507812, "global_step": 315306, "epoch": 1876} {"train_loss": -11.963326454162598, "global_step": 315307, "epoch": 1876} {"train_loss": -12.115152359008789, "global_step": 315308, "epoch": 1876} {"train_loss": -11.982096672058105, "global_step": 315309, "epoch": 1876} {"train_loss": -11.401573181152344, "global_step": 315310, "epoch": 1876} {"train_loss": -11.988458633422852, "global_step": 315311, "epoch": 1876} {"train_loss": -11.805112838745117, "global_step": 315312, "epoch": 1876} {"train_loss": -11.450929641723633, "global_step": 315313, "epoch": 1876} {"train_loss": -11.852581024169922, "global_step": 315314, "epoch": 1876} {"train_loss": -11.515531539916992, "global_step": 315315, "epoch": 1876} {"train_loss": -11.31523323059082, "global_step": 315316, "epoch": 1876} {"train_loss": -11.821235656738281, "global_step": 315317, "epoch": 1876} {"train_loss": -11.739421844482422, "global_step": 315318, "epoch": 1876} {"train_loss": -11.169130325317383, "global_step": 315319, "epoch": 1876} {"train_loss": -12.191055297851562, "global_step": 315320, "epoch": 1876} {"train_loss": -10.705482482910156, "global_step": 315321, "epoch": 1876} {"train_loss": -12.081339836120605, "global_step": 315322, "epoch": 1876} {"train_loss": -11.562856674194336, "global_step": 315323, "epoch": 1876} {"train_loss": -11.938688278198242, "global_step": 315324, "epoch": 1876} {"train_loss": -11.829288482666016, "global_step": 315325, "epoch": 1876} {"train_loss": -11.532662391662598, "global_step": 315326, "epoch": 1876} {"train_loss": -12.238167762756348, "global_step": 315327, "epoch": 1876} {"train_loss": -11.712297439575195, "global_step": 315328, "epoch": 1876} {"train_loss": -12.035568237304688, "global_step": 315329, "epoch": 1876} {"train_loss": -11.567472457885742, "global_step": 315330, "epoch": 1876} {"train_loss": -12.052136421203613, "global_step": 315331, "epoch": 1876} {"train_loss": -11.813992500305176, "global_step": 315332, "epoch": 1876} {"train_loss": -11.898908615112305, "global_step": 315333, "epoch": 1876} {"train_loss": -11.67222785949707, "global_step": 315334, "epoch": 1876} {"train_loss": -11.808388868967691, "global_step": 315335, "epoch": 1876, "val_loss": 279229.5} {"train_loss": -11.565739631652832, "global_step": 315336, "epoch": 1877} {"train_loss": -12.023921966552734, "global_step": 315337, "epoch": 1877} {"train_loss": -11.833126068115234, "global_step": 315338, "epoch": 1877} {"train_loss": -12.013847351074219, "global_step": 315339, "epoch": 1877} {"train_loss": -11.660996437072754, "global_step": 315340, "epoch": 1877} {"train_loss": -12.027496337890625, "global_step": 315341, "epoch": 1877} {"train_loss": -12.053256034851074, "global_step": 315342, "epoch": 1877} {"train_loss": -11.782625198364258, "global_step": 315343, "epoch": 1877} {"train_loss": -12.007553100585938, "global_step": 315344, "epoch": 1877} {"train_loss": -11.474059104919434, "global_step": 315345, "epoch": 1877} {"train_loss": -12.288883209228516, "global_step": 315346, "epoch": 1877} {"train_loss": -11.989980697631836, "global_step": 315347, "epoch": 1877} {"train_loss": -12.278274536132812, "global_step": 315348, "epoch": 1877} {"train_loss": -12.333547592163086, "global_step": 315349, "epoch": 1877} {"train_loss": -11.899415016174316, "global_step": 315350, "epoch": 1877} {"train_loss": -12.342168807983398, "global_step": 315351, "epoch": 1877} {"train_loss": -11.949081420898438, "global_step": 315352, "epoch": 1877} {"train_loss": -12.25903034210205, "global_step": 315353, "epoch": 1877} {"train_loss": -12.169363021850586, "global_step": 315354, "epoch": 1877} {"train_loss": -11.915840148925781, "global_step": 315355, "epoch": 1877} {"train_loss": -12.051246643066406, "global_step": 315356, "epoch": 1877} {"train_loss": -12.156322479248047, "global_step": 315357, "epoch": 1877} {"train_loss": -12.298578262329102, "global_step": 315358, "epoch": 1877} {"train_loss": -12.081523895263672, "global_step": 315359, "epoch": 1877} {"train_loss": -12.205198287963867, "global_step": 315360, "epoch": 1877} {"train_loss": -12.256503105163574, "global_step": 315361, "epoch": 1877} {"train_loss": -12.297365188598633, "global_step": 315362, "epoch": 1877} {"train_loss": -12.312233924865723, "global_step": 315363, "epoch": 1877} {"train_loss": -12.104056358337402, "global_step": 315364, "epoch": 1877} {"train_loss": -12.4329195022583, "global_step": 315365, "epoch": 1877} {"train_loss": -12.209033966064453, "global_step": 315366, "epoch": 1877} {"train_loss": -12.353822708129883, "global_step": 315367, "epoch": 1877} {"train_loss": -12.041156768798828, "global_step": 315368, "epoch": 1877} {"train_loss": -12.328319549560547, "global_step": 315369, "epoch": 1877} {"train_loss": -12.369226455688477, "global_step": 315370, "epoch": 1877} {"train_loss": -12.337331771850586, "global_step": 315371, "epoch": 1877} {"train_loss": -12.181267738342285, "global_step": 315372, "epoch": 1877} {"train_loss": -12.19269847869873, "global_step": 315373, "epoch": 1877} {"train_loss": -12.39918327331543, "global_step": 315374, "epoch": 1877} {"train_loss": -12.116108894348145, "global_step": 315375, "epoch": 1877} {"train_loss": -12.433610916137695, "global_step": 315376, "epoch": 1877} {"train_loss": -12.232295989990234, "global_step": 315377, "epoch": 1877} {"train_loss": -12.243095397949219, "global_step": 315378, "epoch": 1877} {"train_loss": -12.080536842346191, "global_step": 315379, "epoch": 1877} {"train_loss": -12.34240436553955, "global_step": 315380, "epoch": 1877} {"train_loss": -12.125120162963867, "global_step": 315381, "epoch": 1877} {"train_loss": -12.551519393920898, "global_step": 315382, "epoch": 1877} {"train_loss": -12.249076843261719, "global_step": 315383, "epoch": 1877} {"train_loss": -12.386200904846191, "global_step": 315384, "epoch": 1877} {"train_loss": -12.528182983398438, "global_step": 315385, "epoch": 1877} {"train_loss": -12.457611083984375, "global_step": 315386, "epoch": 1877} {"train_loss": -12.44219970703125, "global_step": 315387, "epoch": 1877} {"train_loss": -12.538774490356445, "global_step": 315388, "epoch": 1877} {"train_loss": -12.556833267211914, "global_step": 315389, "epoch": 1877} {"train_loss": -12.4873046875, "global_step": 315390, "epoch": 1877} {"train_loss": -12.413185119628906, "global_step": 315391, "epoch": 1877} {"train_loss": -12.616683006286621, "global_step": 315392, "epoch": 1877} {"train_loss": -12.374370574951172, "global_step": 315393, "epoch": 1877} {"train_loss": -12.3052339553833, "global_step": 315394, "epoch": 1877} {"train_loss": -12.401941299438477, "global_step": 315395, "epoch": 1877} {"train_loss": -12.346384048461914, "global_step": 315396, "epoch": 1877} {"train_loss": -12.32160472869873, "global_step": 315397, "epoch": 1877} {"train_loss": -12.28343391418457, "global_step": 315398, "epoch": 1877} {"train_loss": -12.504851341247559, "global_step": 315399, "epoch": 1877} {"train_loss": -12.334207534790039, "global_step": 315400, "epoch": 1877} {"train_loss": -12.43163776397705, "global_step": 315401, "epoch": 1877} {"train_loss": -12.424878120422363, "global_step": 315402, "epoch": 1877} {"train_loss": -12.620940208435059, "global_step": 315403, "epoch": 1877} {"train_loss": -12.093413352966309, "global_step": 315404, "epoch": 1877} {"train_loss": -12.543985366821289, "global_step": 315405, "epoch": 1877} {"train_loss": -12.500266075134277, "global_step": 315406, "epoch": 1877} {"train_loss": -12.608614921569824, "global_step": 315407, "epoch": 1877} {"train_loss": -11.906005859375, "global_step": 315408, "epoch": 1877} {"train_loss": -11.872164726257324, "global_step": 315409, "epoch": 1877} {"train_loss": -11.584086418151855, "global_step": 315410, "epoch": 1877} {"train_loss": -12.137151718139648, "global_step": 315411, "epoch": 1877} {"train_loss": -11.893735885620117, "global_step": 315412, "epoch": 1877} {"train_loss": -12.131792068481445, "global_step": 315413, "epoch": 1877} {"train_loss": -11.816219329833984, "global_step": 315414, "epoch": 1877} {"train_loss": -11.763073921203613, "global_step": 315415, "epoch": 1877} {"train_loss": -11.46286392211914, "global_step": 315416, "epoch": 1877} {"train_loss": -10.569952964782715, "global_step": 315417, "epoch": 1877} {"train_loss": -9.651025772094727, "global_step": 315418, "epoch": 1877} {"train_loss": -11.665059089660645, "global_step": 315419, "epoch": 1877} {"train_loss": -11.277983665466309, "global_step": 315420, "epoch": 1877} {"train_loss": -10.910149574279785, "global_step": 315421, "epoch": 1877} {"train_loss": -11.791969299316406, "global_step": 315422, "epoch": 1877} {"train_loss": -11.384069442749023, "global_step": 315423, "epoch": 1877} {"train_loss": -10.194390296936035, "global_step": 315424, "epoch": 1877} {"train_loss": -11.701842308044434, "global_step": 315425, "epoch": 1877} {"train_loss": -11.277409553527832, "global_step": 315426, "epoch": 1877} {"train_loss": -11.845701217651367, "global_step": 315427, "epoch": 1877} {"train_loss": -11.404825210571289, "global_step": 315428, "epoch": 1877} {"train_loss": -11.574982643127441, "global_step": 315429, "epoch": 1877} {"train_loss": -11.777286529541016, "global_step": 315430, "epoch": 1877} {"train_loss": -11.87218189239502, "global_step": 315431, "epoch": 1877} {"train_loss": -11.860944747924805, "global_step": 315432, "epoch": 1877} {"train_loss": -11.785675048828125, "global_step": 315433, "epoch": 1877} {"train_loss": -11.93659782409668, "global_step": 315434, "epoch": 1877} {"train_loss": -12.05833911895752, "global_step": 315435, "epoch": 1877} {"train_loss": -11.938977241516113, "global_step": 315436, "epoch": 1877} {"train_loss": -12.212483406066895, "global_step": 315437, "epoch": 1877} {"train_loss": -11.906126976013184, "global_step": 315438, "epoch": 1877} {"train_loss": -11.326473236083984, "global_step": 315439, "epoch": 1877} {"train_loss": -11.584972381591797, "global_step": 315440, "epoch": 1877} {"train_loss": -12.044856071472168, "global_step": 315441, "epoch": 1877} {"train_loss": -11.754919052124023, "global_step": 315442, "epoch": 1877} {"train_loss": -11.451390266418457, "global_step": 315443, "epoch": 1877} {"train_loss": -11.872806549072266, "global_step": 315444, "epoch": 1877} {"train_loss": -11.856502532958984, "global_step": 315445, "epoch": 1877} {"train_loss": -10.900932312011719, "global_step": 315446, "epoch": 1877} {"train_loss": -11.947092056274414, "global_step": 315447, "epoch": 1877} {"train_loss": -11.473331451416016, "global_step": 315448, "epoch": 1877} {"train_loss": -10.88711929321289, "global_step": 315449, "epoch": 1877} {"train_loss": -11.989812850952148, "global_step": 315450, "epoch": 1877} {"train_loss": -11.305418014526367, "global_step": 315451, "epoch": 1877} {"train_loss": -11.194543838500977, "global_step": 315452, "epoch": 1877} {"train_loss": -11.121769905090332, "global_step": 315453, "epoch": 1877} {"train_loss": -10.016921997070312, "global_step": 315454, "epoch": 1877} {"train_loss": -9.787267684936523, "global_step": 315455, "epoch": 1877} {"train_loss": -9.615583419799805, "global_step": 315456, "epoch": 1877} {"train_loss": -8.414246559143066, "global_step": 315457, "epoch": 1877} {"train_loss": -7.252894401550293, "global_step": 315458, "epoch": 1877} {"train_loss": -7.485185623168945, "global_step": 315459, "epoch": 1877} {"train_loss": -6.535155773162842, "global_step": 315460, "epoch": 1877} {"train_loss": -7.446351051330566, "global_step": 315461, "epoch": 1877} {"train_loss": -7.574450969696045, "global_step": 315462, "epoch": 1877} {"train_loss": -8.394294738769531, "global_step": 315463, "epoch": 1877} {"train_loss": -9.620351791381836, "global_step": 315464, "epoch": 1877} {"train_loss": -9.618501663208008, "global_step": 315465, "epoch": 1877} {"train_loss": -8.643951416015625, "global_step": 315466, "epoch": 1877} {"train_loss": -8.450799942016602, "global_step": 315467, "epoch": 1877} {"train_loss": -9.07307243347168, "global_step": 315468, "epoch": 1877} {"train_loss": -10.447824478149414, "global_step": 315469, "epoch": 1877} {"train_loss": -10.041196823120117, "global_step": 315470, "epoch": 1877} {"train_loss": -10.392393112182617, "global_step": 315471, "epoch": 1877} {"train_loss": -10.185614585876465, "global_step": 315472, "epoch": 1877} {"train_loss": -10.595233917236328, "global_step": 315473, "epoch": 1877} {"train_loss": -10.71948528289795, "global_step": 315474, "epoch": 1877} {"train_loss": -10.626662254333496, "global_step": 315475, "epoch": 1877} {"train_loss": -10.82811450958252, "global_step": 315476, "epoch": 1877} {"train_loss": -10.76194953918457, "global_step": 315477, "epoch": 1877} {"train_loss": -11.248950958251953, "global_step": 315478, "epoch": 1877} {"train_loss": -11.224897384643555, "global_step": 315479, "epoch": 1877} {"train_loss": -11.458024024963379, "global_step": 315480, "epoch": 1877} {"train_loss": -11.587913513183594, "global_step": 315481, "epoch": 1877} {"train_loss": -11.400136947631836, "global_step": 315482, "epoch": 1877} {"train_loss": -11.579856872558594, "global_step": 315483, "epoch": 1877} {"train_loss": -11.40038776397705, "global_step": 315484, "epoch": 1877} {"train_loss": -11.252013206481934, "global_step": 315485, "epoch": 1877} {"train_loss": -11.733118057250977, "global_step": 315486, "epoch": 1877} {"train_loss": -11.596242904663086, "global_step": 315487, "epoch": 1877} {"train_loss": -11.509201049804688, "global_step": 315488, "epoch": 1877} {"train_loss": -11.711026191711426, "global_step": 315489, "epoch": 1877} {"train_loss": -11.792749404907227, "global_step": 315490, "epoch": 1877} {"train_loss": -11.766324996948242, "global_step": 315491, "epoch": 1877} {"train_loss": -11.904927253723145, "global_step": 315492, "epoch": 1877} {"train_loss": -11.260692596435547, "global_step": 315493, "epoch": 1877} {"train_loss": -11.358224868774414, "global_step": 315494, "epoch": 1877} {"train_loss": -11.86911678314209, "global_step": 315495, "epoch": 1877} {"train_loss": -11.310734748840332, "global_step": 315496, "epoch": 1877} {"train_loss": -11.652410507202148, "global_step": 315497, "epoch": 1877} {"train_loss": -12.044349670410156, "global_step": 315498, "epoch": 1877} {"train_loss": -11.651644706726074, "global_step": 315499, "epoch": 1877} {"train_loss": -11.744370460510254, "global_step": 315500, "epoch": 1877} {"train_loss": -11.723182678222656, "global_step": 315501, "epoch": 1877} {"train_loss": -11.802891731262207, "global_step": 315502, "epoch": 1877} {"train_loss": -11.531360717046828, "global_step": 315503, "epoch": 1877, "val_loss": 280209.90625} {"train_loss": -11.978791236877441, "global_step": 315504, "epoch": 1878} {"train_loss": -11.909955978393555, "global_step": 315505, "epoch": 1878} {"train_loss": -11.928735733032227, "global_step": 315506, "epoch": 1878} {"train_loss": -11.959785461425781, "global_step": 315507, "epoch": 1878} {"train_loss": -11.975383758544922, "global_step": 315508, "epoch": 1878} {"train_loss": -12.020910263061523, "global_step": 315509, "epoch": 1878} {"train_loss": -11.963509559631348, "global_step": 315510, "epoch": 1878} {"train_loss": -11.622356414794922, "global_step": 315511, "epoch": 1878} {"train_loss": -12.115045547485352, "global_step": 315512, "epoch": 1878} {"train_loss": -11.975265502929688, "global_step": 315513, "epoch": 1878} {"train_loss": -11.88097858428955, "global_step": 315514, "epoch": 1878} {"train_loss": -12.054132461547852, "global_step": 315515, "epoch": 1878} {"train_loss": -11.999342918395996, "global_step": 315516, "epoch": 1878} {"train_loss": -12.143183708190918, "global_step": 315517, "epoch": 1878} {"train_loss": -12.023911476135254, "global_step": 315518, "epoch": 1878} {"train_loss": -11.987518310546875, "global_step": 315519, "epoch": 1878} {"train_loss": -12.154546737670898, "global_step": 315520, "epoch": 1878} {"train_loss": -11.642572402954102, "global_step": 315521, "epoch": 1878} {"train_loss": -12.180545806884766, "global_step": 315522, "epoch": 1878} {"train_loss": -11.84662914276123, "global_step": 315523, "epoch": 1878} {"train_loss": -12.164237976074219, "global_step": 315524, "epoch": 1878} {"train_loss": -12.065906524658203, "global_step": 315525, "epoch": 1878} {"train_loss": -11.925161361694336, "global_step": 315526, "epoch": 1878} {"train_loss": -12.378984451293945, "global_step": 315527, "epoch": 1878} {"train_loss": -12.037681579589844, "global_step": 315528, "epoch": 1878} {"train_loss": -11.991293907165527, "global_step": 315529, "epoch": 1878} {"train_loss": -12.1240234375, "global_step": 315530, "epoch": 1878} {"train_loss": -12.309839248657227, "global_step": 315531, "epoch": 1878} {"train_loss": -12.06008243560791, "global_step": 315532, "epoch": 1878} {"train_loss": -12.318557739257812, "global_step": 315533, "epoch": 1878} {"train_loss": -12.170883178710938, "global_step": 315534, "epoch": 1878} {"train_loss": -12.156009674072266, "global_step": 315535, "epoch": 1878} {"train_loss": -12.197759628295898, "global_step": 315536, "epoch": 1878} {"train_loss": -12.06142520904541, "global_step": 315537, "epoch": 1878} {"train_loss": -12.222049713134766, "global_step": 315538, "epoch": 1878} {"train_loss": -12.049361228942871, "global_step": 315539, "epoch": 1878} {"train_loss": -12.243173599243164, "global_step": 315540, "epoch": 1878} {"train_loss": -11.891109466552734, "global_step": 315541, "epoch": 1878} {"train_loss": -12.089665412902832, "global_step": 315542, "epoch": 1878} {"train_loss": -12.201967239379883, "global_step": 315543, "epoch": 1878} {"train_loss": -11.811847686767578, "global_step": 315544, "epoch": 1878} {"train_loss": -12.381929397583008, "global_step": 315545, "epoch": 1878} {"train_loss": -12.125991821289062, "global_step": 315546, "epoch": 1878} {"train_loss": -12.13082504272461, "global_step": 315547, "epoch": 1878} {"train_loss": -12.441168785095215, "global_step": 315548, "epoch": 1878} {"train_loss": -12.050021171569824, "global_step": 315549, "epoch": 1878} {"train_loss": -12.483894348144531, "global_step": 315550, "epoch": 1878} {"train_loss": -12.292366027832031, "global_step": 315551, "epoch": 1878} {"train_loss": -12.27595043182373, "global_step": 315552, "epoch": 1878} {"train_loss": -12.225578308105469, "global_step": 315553, "epoch": 1878} {"train_loss": -12.110928535461426, "global_step": 315554, "epoch": 1878} {"train_loss": -12.134419441223145, "global_step": 315555, "epoch": 1878} {"train_loss": -12.335973739624023, "global_step": 315556, "epoch": 1878} {"train_loss": -12.170287132263184, "global_step": 315557, "epoch": 1878} {"train_loss": -12.358587265014648, "global_step": 315558, "epoch": 1878} {"train_loss": -12.113723754882812, "global_step": 315559, "epoch": 1878} {"train_loss": -12.030867576599121, "global_step": 315560, "epoch": 1878} {"train_loss": -12.526910781860352, "global_step": 315561, "epoch": 1878} {"train_loss": -11.991046905517578, "global_step": 315562, "epoch": 1878} {"train_loss": -12.096879959106445, "global_step": 315563, "epoch": 1878} {"train_loss": -12.458529472351074, "global_step": 315564, "epoch": 1878} {"train_loss": -12.01063060760498, "global_step": 315565, "epoch": 1878} {"train_loss": -12.431510925292969, "global_step": 315566, "epoch": 1878} {"train_loss": -12.459527969360352, "global_step": 315567, "epoch": 1878} {"train_loss": -12.315420150756836, "global_step": 315568, "epoch": 1878} {"train_loss": -12.250846862792969, "global_step": 315569, "epoch": 1878} {"train_loss": -12.615341186523438, "global_step": 315570, "epoch": 1878} {"train_loss": -12.379936218261719, "global_step": 315571, "epoch": 1878} {"train_loss": -12.435861587524414, "global_step": 315572, "epoch": 1878} {"train_loss": -12.460774421691895, "global_step": 315573, "epoch": 1878} {"train_loss": -12.35765552520752, "global_step": 315574, "epoch": 1878} {"train_loss": -12.186656951904297, "global_step": 315575, "epoch": 1878} {"train_loss": -12.363622665405273, "global_step": 315576, "epoch": 1878} {"train_loss": -12.422794342041016, "global_step": 315577, "epoch": 1878} {"train_loss": -12.428924560546875, "global_step": 315578, "epoch": 1878} {"train_loss": -12.333198547363281, "global_step": 315579, "epoch": 1878} {"train_loss": -12.579571723937988, "global_step": 315580, "epoch": 1878} {"train_loss": -12.581619262695312, "global_step": 315581, "epoch": 1878} {"train_loss": -12.521279335021973, "global_step": 315582, "epoch": 1878} {"train_loss": -12.285263061523438, "global_step": 315583, "epoch": 1878} {"train_loss": -12.184986114501953, "global_step": 315584, "epoch": 1878} {"train_loss": -12.607268333435059, "global_step": 315585, "epoch": 1878} {"train_loss": -12.321603775024414, "global_step": 315586, "epoch": 1878} {"train_loss": -11.500553131103516, "global_step": 315587, "epoch": 1878} {"train_loss": -12.289294242858887, "global_step": 315588, "epoch": 1878} {"train_loss": -11.83221435546875, "global_step": 315589, "epoch": 1878} {"train_loss": -11.124518394470215, "global_step": 315590, "epoch": 1878} {"train_loss": -11.862716674804688, "global_step": 315591, "epoch": 1878} {"train_loss": -12.249975204467773, "global_step": 315592, "epoch": 1878} {"train_loss": -12.278484344482422, "global_step": 315593, "epoch": 1878} {"train_loss": -11.214828491210938, "global_step": 315594, "epoch": 1878} {"train_loss": -11.527338027954102, "global_step": 315595, "epoch": 1878} {"train_loss": -11.565906524658203, "global_step": 315596, "epoch": 1878} {"train_loss": -12.360979080200195, "global_step": 315597, "epoch": 1878} {"train_loss": -12.181324005126953, "global_step": 315598, "epoch": 1878} {"train_loss": -11.481884956359863, "global_step": 315599, "epoch": 1878} {"train_loss": -12.088068008422852, "global_step": 315600, "epoch": 1878} {"train_loss": -12.143077850341797, "global_step": 315601, "epoch": 1878} {"train_loss": -11.974016189575195, "global_step": 315602, "epoch": 1878} {"train_loss": -11.798179626464844, "global_step": 315603, "epoch": 1878} {"train_loss": -12.179415702819824, "global_step": 315604, "epoch": 1878} {"train_loss": -12.265233039855957, "global_step": 315605, "epoch": 1878} {"train_loss": -11.683257102966309, "global_step": 315606, "epoch": 1878} {"train_loss": -11.456804275512695, "global_step": 315607, "epoch": 1878} {"train_loss": -12.372295379638672, "global_step": 315608, "epoch": 1878} {"train_loss": -11.917749404907227, "global_step": 315609, "epoch": 1878} {"train_loss": -11.575149536132812, "global_step": 315610, "epoch": 1878} {"train_loss": -12.245889663696289, "global_step": 315611, "epoch": 1878} {"train_loss": -11.144462585449219, "global_step": 315612, "epoch": 1878} {"train_loss": -11.112895965576172, "global_step": 315613, "epoch": 1878} {"train_loss": -12.126809120178223, "global_step": 315614, "epoch": 1878} {"train_loss": -10.41535758972168, "global_step": 315615, "epoch": 1878} {"train_loss": -11.97538948059082, "global_step": 315616, "epoch": 1878} {"train_loss": -11.402615547180176, "global_step": 315617, "epoch": 1878} {"train_loss": -11.21914005279541, "global_step": 315618, "epoch": 1878} {"train_loss": -12.09819507598877, "global_step": 315619, "epoch": 1878} {"train_loss": -10.895804405212402, "global_step": 315620, "epoch": 1878} {"train_loss": -11.950522422790527, "global_step": 315621, "epoch": 1878} {"train_loss": -10.085468292236328, "global_step": 315622, "epoch": 1878} {"train_loss": -11.296163558959961, "global_step": 315623, "epoch": 1878} {"train_loss": -11.93227767944336, "global_step": 315624, "epoch": 1878} {"train_loss": -10.679059982299805, "global_step": 315625, "epoch": 1878} {"train_loss": -11.571355819702148, "global_step": 315626, "epoch": 1878} {"train_loss": -11.369630813598633, "global_step": 315627, "epoch": 1878} {"train_loss": -12.037343978881836, "global_step": 315628, "epoch": 1878} {"train_loss": -11.7349214553833, "global_step": 315629, "epoch": 1878} {"train_loss": -10.763561248779297, "global_step": 315630, "epoch": 1878} {"train_loss": -11.387895584106445, "global_step": 315631, "epoch": 1878} {"train_loss": -10.492515563964844, "global_step": 315632, "epoch": 1878} {"train_loss": -10.692155838012695, "global_step": 315633, "epoch": 1878} {"train_loss": -10.73017406463623, "global_step": 315634, "epoch": 1878} {"train_loss": -11.245647430419922, "global_step": 315635, "epoch": 1878} {"train_loss": -10.649274826049805, "global_step": 315636, "epoch": 1878} {"train_loss": -10.904362678527832, "global_step": 315637, "epoch": 1878} {"train_loss": -11.486740112304688, "global_step": 315638, "epoch": 1878} {"train_loss": -10.239444732666016, "global_step": 315639, "epoch": 1878} {"train_loss": -11.761015892028809, "global_step": 315640, "epoch": 1878} {"train_loss": -10.476799011230469, "global_step": 315641, "epoch": 1878} {"train_loss": -11.830964088439941, "global_step": 315642, "epoch": 1878} {"train_loss": -11.38614273071289, "global_step": 315643, "epoch": 1878} {"train_loss": -11.37382984161377, "global_step": 315644, "epoch": 1878} {"train_loss": -11.685157775878906, "global_step": 315645, "epoch": 1878} {"train_loss": -11.71557903289795, "global_step": 315646, "epoch": 1878} {"train_loss": -11.889427185058594, "global_step": 315647, "epoch": 1878} {"train_loss": -11.348855972290039, "global_step": 315648, "epoch": 1878} {"train_loss": -11.737543106079102, "global_step": 315649, "epoch": 1878} {"train_loss": -11.141153335571289, "global_step": 315650, "epoch": 1878} {"train_loss": -11.704501152038574, "global_step": 315651, "epoch": 1878} {"train_loss": -11.767650604248047, "global_step": 315652, "epoch": 1878} {"train_loss": -11.055473327636719, "global_step": 315653, "epoch": 1878} {"train_loss": -10.914474487304688, "global_step": 315654, "epoch": 1878} {"train_loss": -10.729220390319824, "global_step": 315655, "epoch": 1878} {"train_loss": -11.843859672546387, "global_step": 315656, "epoch": 1878} {"train_loss": -10.678561210632324, "global_step": 315657, "epoch": 1878} {"train_loss": -11.3924560546875, "global_step": 315658, "epoch": 1878} {"train_loss": -11.140704154968262, "global_step": 315659, "epoch": 1878} {"train_loss": -11.038188934326172, "global_step": 315660, "epoch": 1878} {"train_loss": -11.441628456115723, "global_step": 315661, "epoch": 1878} {"train_loss": -10.959985733032227, "global_step": 315662, "epoch": 1878} {"train_loss": -11.24755859375, "global_step": 315663, "epoch": 1878} {"train_loss": -11.285820007324219, "global_step": 315664, "epoch": 1878} {"train_loss": -11.482645034790039, "global_step": 315665, "epoch": 1878} {"train_loss": -11.661645889282227, "global_step": 315666, "epoch": 1878} {"train_loss": -11.814922332763672, "global_step": 315667, "epoch": 1878} {"train_loss": -11.836376190185547, "global_step": 315668, "epoch": 1878} {"train_loss": -11.42718505859375, "global_step": 315669, "epoch": 1878} {"train_loss": -11.943882942199707, "global_step": 315670, "epoch": 1878} {"train_loss": -11.830032149950663, "global_step": 315671, "epoch": 1878, "val_loss": 284851.03125} {"train_loss": -11.716352462768555, "global_step": 315672, "epoch": 1879} {"train_loss": -12.035430908203125, "global_step": 315673, "epoch": 1879} {"train_loss": -11.678470611572266, "global_step": 315674, "epoch": 1879} {"train_loss": -11.854246139526367, "global_step": 315675, "epoch": 1879} {"train_loss": -11.776625633239746, "global_step": 315676, "epoch": 1879} {"train_loss": -11.903733253479004, "global_step": 315677, "epoch": 1879} {"train_loss": -11.874059677124023, "global_step": 315678, "epoch": 1879} {"train_loss": -12.107762336730957, "global_step": 315679, "epoch": 1879} {"train_loss": -11.965649604797363, "global_step": 315680, "epoch": 1879} {"train_loss": -11.883478164672852, "global_step": 315681, "epoch": 1879} {"train_loss": -12.003894805908203, "global_step": 315682, "epoch": 1879} {"train_loss": -12.269432067871094, "global_step": 315683, "epoch": 1879} {"train_loss": -12.065382957458496, "global_step": 315684, "epoch": 1879} {"train_loss": -12.002083778381348, "global_step": 315685, "epoch": 1879} {"train_loss": -12.191085815429688, "global_step": 315686, "epoch": 1879} {"train_loss": -11.841705322265625, "global_step": 315687, "epoch": 1879} {"train_loss": -11.959768295288086, "global_step": 315688, "epoch": 1879} {"train_loss": -12.071410179138184, "global_step": 315689, "epoch": 1879} {"train_loss": -11.698833465576172, "global_step": 315690, "epoch": 1879} {"train_loss": -12.127588272094727, "global_step": 315691, "epoch": 1879} {"train_loss": -11.828872680664062, "global_step": 315692, "epoch": 1879} {"train_loss": -12.129600524902344, "global_step": 315693, "epoch": 1879} {"train_loss": -11.985652923583984, "global_step": 315694, "epoch": 1879} {"train_loss": -12.062358856201172, "global_step": 315695, "epoch": 1879} {"train_loss": -12.12366008758545, "global_step": 315696, "epoch": 1879} {"train_loss": -11.965108871459961, "global_step": 315697, "epoch": 1879} {"train_loss": -12.17680835723877, "global_step": 315698, "epoch": 1879} {"train_loss": -12.127494812011719, "global_step": 315699, "epoch": 1879} {"train_loss": -11.806673049926758, "global_step": 315700, "epoch": 1879} {"train_loss": -12.082527160644531, "global_step": 315701, "epoch": 1879} {"train_loss": -11.71013069152832, "global_step": 315702, "epoch": 1879} {"train_loss": -11.813474655151367, "global_step": 315703, "epoch": 1879} {"train_loss": -12.21537971496582, "global_step": 315704, "epoch": 1879} {"train_loss": -11.710257530212402, "global_step": 315705, "epoch": 1879} {"train_loss": -12.227508544921875, "global_step": 315706, "epoch": 1879} {"train_loss": -12.006749153137207, "global_step": 315707, "epoch": 1879} {"train_loss": -12.407220840454102, "global_step": 315708, "epoch": 1879} {"train_loss": -12.035473823547363, "global_step": 315709, "epoch": 1879} {"train_loss": -11.967074394226074, "global_step": 315710, "epoch": 1879} {"train_loss": -12.104777336120605, "global_step": 315711, "epoch": 1879} {"train_loss": -11.65681266784668, "global_step": 315712, "epoch": 1879} {"train_loss": -12.061983108520508, "global_step": 315713, "epoch": 1879} {"train_loss": -12.192564010620117, "global_step": 315714, "epoch": 1879} {"train_loss": -12.212677001953125, "global_step": 315715, "epoch": 1879} {"train_loss": -11.698535919189453, "global_step": 315716, "epoch": 1879} {"train_loss": -11.808313369750977, "global_step": 315717, "epoch": 1879} {"train_loss": -11.622089385986328, "global_step": 315718, "epoch": 1879} {"train_loss": -11.857945442199707, "global_step": 315719, "epoch": 1879} {"train_loss": -11.821353912353516, "global_step": 315720, "epoch": 1879} {"train_loss": -11.646556854248047, "global_step": 315721, "epoch": 1879} {"train_loss": -12.186517715454102, "global_step": 315722, "epoch": 1879} {"train_loss": -11.768414497375488, "global_step": 315723, "epoch": 1879} {"train_loss": -11.961130142211914, "global_step": 315724, "epoch": 1879} {"train_loss": -11.773303985595703, "global_step": 315725, "epoch": 1879} {"train_loss": -11.711080551147461, "global_step": 315726, "epoch": 1879} {"train_loss": -11.371331214904785, "global_step": 315727, "epoch": 1879} {"train_loss": -11.486368179321289, "global_step": 315728, "epoch": 1879} {"train_loss": -10.589076042175293, "global_step": 315729, "epoch": 1879} {"train_loss": -11.655685424804688, "global_step": 315730, "epoch": 1879} {"train_loss": -11.042041778564453, "global_step": 315731, "epoch": 1879} {"train_loss": -11.24317741394043, "global_step": 315732, "epoch": 1879} {"train_loss": -11.205643653869629, "global_step": 315733, "epoch": 1879} {"train_loss": -10.994843482971191, "global_step": 315734, "epoch": 1879} {"train_loss": -12.069236755371094, "global_step": 315735, "epoch": 1879} {"train_loss": -11.10113525390625, "global_step": 315736, "epoch": 1879} {"train_loss": -12.007610321044922, "global_step": 315737, "epoch": 1879} {"train_loss": -11.300150871276855, "global_step": 315738, "epoch": 1879} {"train_loss": -11.915719032287598, "global_step": 315739, "epoch": 1879} {"train_loss": -11.701369285583496, "global_step": 315740, "epoch": 1879} {"train_loss": -11.517383575439453, "global_step": 315741, "epoch": 1879} {"train_loss": -11.502548217773438, "global_step": 315742, "epoch": 1879} {"train_loss": -12.063041687011719, "global_step": 315743, "epoch": 1879} {"train_loss": -11.823572158813477, "global_step": 315744, "epoch": 1879} {"train_loss": -12.047447204589844, "global_step": 315745, "epoch": 1879} {"train_loss": -11.808187484741211, "global_step": 315746, "epoch": 1879} {"train_loss": -11.812063217163086, "global_step": 315747, "epoch": 1879} {"train_loss": -11.625110626220703, "global_step": 315748, "epoch": 1879} {"train_loss": -12.004769325256348, "global_step": 315749, "epoch": 1879} {"train_loss": -11.720749855041504, "global_step": 315750, "epoch": 1879} {"train_loss": -12.104475021362305, "global_step": 315751, "epoch": 1879} {"train_loss": -11.792689323425293, "global_step": 315752, "epoch": 1879} {"train_loss": -12.135377883911133, "global_step": 315753, "epoch": 1879} {"train_loss": -12.146238327026367, "global_step": 315754, "epoch": 1879} {"train_loss": -11.692996978759766, "global_step": 315755, "epoch": 1879} {"train_loss": -12.217723846435547, "global_step": 315756, "epoch": 1879} {"train_loss": -12.099089622497559, "global_step": 315757, "epoch": 1879} {"train_loss": -12.226938247680664, "global_step": 315758, "epoch": 1879} {"train_loss": -11.971555709838867, "global_step": 315759, "epoch": 1879} {"train_loss": -11.868302345275879, "global_step": 315760, "epoch": 1879} {"train_loss": -12.135589599609375, "global_step": 315761, "epoch": 1879} {"train_loss": -12.217896461486816, "global_step": 315762, "epoch": 1879} {"train_loss": -12.157559394836426, "global_step": 315763, "epoch": 1879} {"train_loss": -12.094480514526367, "global_step": 315764, "epoch": 1879} {"train_loss": -12.162367820739746, "global_step": 315765, "epoch": 1879} {"train_loss": -11.97865104675293, "global_step": 315766, "epoch": 1879} {"train_loss": -12.218335151672363, "global_step": 315767, "epoch": 1879} {"train_loss": -11.963719367980957, "global_step": 315768, "epoch": 1879} {"train_loss": -11.991165161132812, "global_step": 315769, "epoch": 1879} {"train_loss": -12.38136100769043, "global_step": 315770, "epoch": 1879} {"train_loss": -12.159255981445312, "global_step": 315771, "epoch": 1879} {"train_loss": -12.181029319763184, "global_step": 315772, "epoch": 1879} {"train_loss": -12.167285919189453, "global_step": 315773, "epoch": 1879} {"train_loss": -12.214520454406738, "global_step": 315774, "epoch": 1879} {"train_loss": -11.992959022521973, "global_step": 315775, "epoch": 1879} {"train_loss": -12.393367767333984, "global_step": 315776, "epoch": 1879} {"train_loss": -12.267685890197754, "global_step": 315777, "epoch": 1879} {"train_loss": -12.485496520996094, "global_step": 315778, "epoch": 1879} {"train_loss": -12.364139556884766, "global_step": 315779, "epoch": 1879} {"train_loss": -12.411088943481445, "global_step": 315780, "epoch": 1879} {"train_loss": -12.304994583129883, "global_step": 315781, "epoch": 1879} {"train_loss": -12.359781265258789, "global_step": 315782, "epoch": 1879} {"train_loss": -12.264103889465332, "global_step": 315783, "epoch": 1879} {"train_loss": -12.511146545410156, "global_step": 315784, "epoch": 1879} {"train_loss": -12.44271183013916, "global_step": 315785, "epoch": 1879} {"train_loss": -12.414480209350586, "global_step": 315786, "epoch": 1879} {"train_loss": -12.620033264160156, "global_step": 315787, "epoch": 1879} {"train_loss": -12.61008071899414, "global_step": 315788, "epoch": 1879} {"train_loss": -12.527559280395508, "global_step": 315789, "epoch": 1879} {"train_loss": -12.516592025756836, "global_step": 315790, "epoch": 1879} {"train_loss": -12.600553512573242, "global_step": 315791, "epoch": 1879} {"train_loss": -12.625511169433594, "global_step": 315792, "epoch": 1879} {"train_loss": -12.67117691040039, "global_step": 315793, "epoch": 1879} {"train_loss": -12.537336349487305, "global_step": 315794, "epoch": 1879} {"train_loss": -12.69114875793457, "global_step": 315795, "epoch": 1879} {"train_loss": -12.588741302490234, "global_step": 315796, "epoch": 1879} {"train_loss": -12.438810348510742, "global_step": 315797, "epoch": 1879} {"train_loss": -12.532623291015625, "global_step": 315798, "epoch": 1879} {"train_loss": -12.335423469543457, "global_step": 315799, "epoch": 1879} {"train_loss": -12.31106948852539, "global_step": 315800, "epoch": 1879} {"train_loss": -12.58287239074707, "global_step": 315801, "epoch": 1879} {"train_loss": -12.428129196166992, "global_step": 315802, "epoch": 1879} {"train_loss": -12.535970687866211, "global_step": 315803, "epoch": 1879} {"train_loss": -12.543195724487305, "global_step": 315804, "epoch": 1879} {"train_loss": -12.605939865112305, "global_step": 315805, "epoch": 1879} {"train_loss": -12.473451614379883, "global_step": 315806, "epoch": 1879} {"train_loss": -12.54081916809082, "global_step": 315807, "epoch": 1879} {"train_loss": -12.41501235961914, "global_step": 315808, "epoch": 1879} {"train_loss": -12.376602172851562, "global_step": 315809, "epoch": 1879} {"train_loss": -11.336423873901367, "global_step": 315810, "epoch": 1879} {"train_loss": -10.246685028076172, "global_step": 315811, "epoch": 1879} {"train_loss": -12.46533203125, "global_step": 315812, "epoch": 1879} {"train_loss": -12.233224868774414, "global_step": 315813, "epoch": 1879} {"train_loss": -12.001001358032227, "global_step": 315814, "epoch": 1879} {"train_loss": -11.57919979095459, "global_step": 315815, "epoch": 1879} {"train_loss": -12.54783821105957, "global_step": 315816, "epoch": 1879} {"train_loss": -12.094511985778809, "global_step": 315817, "epoch": 1879} {"train_loss": -11.965002059936523, "global_step": 315818, "epoch": 1879} {"train_loss": -11.932939529418945, "global_step": 315819, "epoch": 1879} {"train_loss": -12.277901649475098, "global_step": 315820, "epoch": 1879} {"train_loss": -12.362203598022461, "global_step": 315821, "epoch": 1879} {"train_loss": -11.972813606262207, "global_step": 315822, "epoch": 1879} {"train_loss": -11.992711067199707, "global_step": 315823, "epoch": 1879} {"train_loss": -11.453934669494629, "global_step": 315824, "epoch": 1879} {"train_loss": -12.30040454864502, "global_step": 315825, "epoch": 1879} {"train_loss": -11.79052734375, "global_step": 315826, "epoch": 1879} {"train_loss": -12.458839416503906, "global_step": 315827, "epoch": 1879} {"train_loss": -11.434733390808105, "global_step": 315828, "epoch": 1879} {"train_loss": -11.599294662475586, "global_step": 315829, "epoch": 1879} {"train_loss": -12.416585922241211, "global_step": 315830, "epoch": 1879} {"train_loss": -12.177513122558594, "global_step": 315831, "epoch": 1879} {"train_loss": -11.702129364013672, "global_step": 315832, "epoch": 1879} {"train_loss": -11.853300094604492, "global_step": 315833, "epoch": 1879} {"train_loss": -12.373468399047852, "global_step": 315834, "epoch": 1879} {"train_loss": -11.714888572692871, "global_step": 315835, "epoch": 1879} {"train_loss": -11.725337028503418, "global_step": 315836, "epoch": 1879} {"train_loss": -12.311239242553711, "global_step": 315837, "epoch": 1879} {"train_loss": -12.150409698486328, "global_step": 315838, "epoch": 1879} {"train_loss": -12.026047263826642, "global_step": 315839, "epoch": 1879, "val_loss": 280155.875} {"train_loss": -12.292332649230957, "global_step": 315840, "epoch": 1880} {"train_loss": -12.156137466430664, "global_step": 315841, "epoch": 1880} {"train_loss": -11.958356857299805, "global_step": 315842, "epoch": 1880} {"train_loss": -12.41847038269043, "global_step": 315843, "epoch": 1880} {"train_loss": -11.57227897644043, "global_step": 315844, "epoch": 1880} {"train_loss": -10.738903045654297, "global_step": 315845, "epoch": 1880} {"train_loss": -11.118428230285645, "global_step": 315846, "epoch": 1880} {"train_loss": -12.281789779663086, "global_step": 315847, "epoch": 1880} {"train_loss": -10.892873764038086, "global_step": 315848, "epoch": 1880} {"train_loss": -10.194417953491211, "global_step": 315849, "epoch": 1880} {"train_loss": -12.05146598815918, "global_step": 315850, "epoch": 1880} {"train_loss": -10.967413902282715, "global_step": 315851, "epoch": 1880} {"train_loss": -11.155441284179688, "global_step": 315852, "epoch": 1880} {"train_loss": -11.019781112670898, "global_step": 315853, "epoch": 1880} {"train_loss": -11.008101463317871, "global_step": 315854, "epoch": 1880} {"train_loss": -8.910038948059082, "global_step": 315855, "epoch": 1880} {"train_loss": -9.32506275177002, "global_step": 315856, "epoch": 1880} {"train_loss": -9.198710441589355, "global_step": 315857, "epoch": 1880} {"train_loss": -11.753867149353027, "global_step": 315858, "epoch": 1880} {"train_loss": -8.997522354125977, "global_step": 315859, "epoch": 1880} {"train_loss": -12.124435424804688, "global_step": 315860, "epoch": 1880} {"train_loss": -9.994418144226074, "global_step": 315861, "epoch": 1880} {"train_loss": -11.561168670654297, "global_step": 315862, "epoch": 1880} {"train_loss": -9.674758911132812, "global_step": 315863, "epoch": 1880} {"train_loss": -10.295135498046875, "global_step": 315864, "epoch": 1880} {"train_loss": -10.720855712890625, "global_step": 315865, "epoch": 1880} {"train_loss": -9.424673080444336, "global_step": 315866, "epoch": 1880} {"train_loss": -10.821578979492188, "global_step": 315867, "epoch": 1880} {"train_loss": -8.358163833618164, "global_step": 315868, "epoch": 1880} {"train_loss": -7.321145057678223, "global_step": 315869, "epoch": 1880} {"train_loss": -8.565474510192871, "global_step": 315870, "epoch": 1880} {"train_loss": -7.899289131164551, "global_step": 315871, "epoch": 1880} {"train_loss": -8.230968475341797, "global_step": 315872, "epoch": 1880} {"train_loss": -9.958820343017578, "global_step": 315873, "epoch": 1880} {"train_loss": -10.269155502319336, "global_step": 315874, "epoch": 1880} {"train_loss": -9.225044250488281, "global_step": 315875, "epoch": 1880} {"train_loss": -9.305598258972168, "global_step": 315876, "epoch": 1880} {"train_loss": -9.428321838378906, "global_step": 315877, "epoch": 1880} {"train_loss": -10.330379486083984, "global_step": 315878, "epoch": 1880} {"train_loss": -9.771028518676758, "global_step": 315879, "epoch": 1880} {"train_loss": -10.34479808807373, "global_step": 315880, "epoch": 1880} {"train_loss": -10.58268928527832, "global_step": 315881, "epoch": 1880} {"train_loss": -10.597953796386719, "global_step": 315882, "epoch": 1880} {"train_loss": -10.5478515625, "global_step": 315883, "epoch": 1880} {"train_loss": -10.755128860473633, "global_step": 315884, "epoch": 1880} {"train_loss": -10.53096866607666, "global_step": 315885, "epoch": 1880} {"train_loss": -10.419038772583008, "global_step": 315886, "epoch": 1880} {"train_loss": -11.149717330932617, "global_step": 315887, "epoch": 1880} {"train_loss": -11.454058647155762, "global_step": 315888, "epoch": 1880} {"train_loss": -11.376867294311523, "global_step": 315889, "epoch": 1880} {"train_loss": -11.381280899047852, "global_step": 315890, "epoch": 1880} {"train_loss": -11.356735229492188, "global_step": 315891, "epoch": 1880} {"train_loss": -11.345128059387207, "global_step": 315892, "epoch": 1880} {"train_loss": -11.559643745422363, "global_step": 315893, "epoch": 1880} {"train_loss": -11.341985702514648, "global_step": 315894, "epoch": 1880} {"train_loss": -11.30277156829834, "global_step": 315895, "epoch": 1880} {"train_loss": -11.521438598632812, "global_step": 315896, "epoch": 1880} {"train_loss": -11.601285934448242, "global_step": 315897, "epoch": 1880} {"train_loss": -11.695035934448242, "global_step": 315898, "epoch": 1880} {"train_loss": -11.880717277526855, "global_step": 315899, "epoch": 1880} {"train_loss": -11.807560920715332, "global_step": 315900, "epoch": 1880} {"train_loss": -11.713607788085938, "global_step": 315901, "epoch": 1880} {"train_loss": -11.579145431518555, "global_step": 315902, "epoch": 1880} {"train_loss": -11.948801040649414, "global_step": 315903, "epoch": 1880} {"train_loss": -11.663249015808105, "global_step": 315904, "epoch": 1880} {"train_loss": -11.708395004272461, "global_step": 315905, "epoch": 1880} {"train_loss": -11.814803123474121, "global_step": 315906, "epoch": 1880} {"train_loss": -11.759014129638672, "global_step": 315907, "epoch": 1880} {"train_loss": -11.95604133605957, "global_step": 315908, "epoch": 1880} {"train_loss": -11.644732475280762, "global_step": 315909, "epoch": 1880} {"train_loss": -11.90512752532959, "global_step": 315910, "epoch": 1880} {"train_loss": -11.972522735595703, "global_step": 315911, "epoch": 1880} {"train_loss": -12.145919799804688, "global_step": 315912, "epoch": 1880} {"train_loss": -11.849535942077637, "global_step": 315913, "epoch": 1880} {"train_loss": -11.786785125732422, "global_step": 315914, "epoch": 1880} {"train_loss": -11.717591285705566, "global_step": 315915, "epoch": 1880} {"train_loss": -11.907829284667969, "global_step": 315916, "epoch": 1880} {"train_loss": -11.938715934753418, "global_step": 315917, "epoch": 1880} {"train_loss": -12.10396957397461, "global_step": 315918, "epoch": 1880} {"train_loss": -11.907218933105469, "global_step": 315919, "epoch": 1880} {"train_loss": -12.10816478729248, "global_step": 315920, "epoch": 1880} {"train_loss": -12.155275344848633, "global_step": 315921, "epoch": 1880} {"train_loss": -12.064794540405273, "global_step": 315922, "epoch": 1880} {"train_loss": -12.08652114868164, "global_step": 315923, "epoch": 1880} {"train_loss": -11.954511642456055, "global_step": 315924, "epoch": 1880} {"train_loss": -12.259115219116211, "global_step": 315925, "epoch": 1880} {"train_loss": -12.033720016479492, "global_step": 315926, "epoch": 1880} {"train_loss": -12.040996551513672, "global_step": 315927, "epoch": 1880} {"train_loss": -12.221120834350586, "global_step": 315928, "epoch": 1880} {"train_loss": -12.263277053833008, "global_step": 315929, "epoch": 1880} {"train_loss": -12.16189193725586, "global_step": 315930, "epoch": 1880} {"train_loss": -12.214011192321777, "global_step": 315931, "epoch": 1880} {"train_loss": -12.285860061645508, "global_step": 315932, "epoch": 1880} {"train_loss": -12.213066101074219, "global_step": 315933, "epoch": 1880} {"train_loss": -12.317586898803711, "global_step": 315934, "epoch": 1880} {"train_loss": -12.198122024536133, "global_step": 315935, "epoch": 1880} {"train_loss": -12.240828514099121, "global_step": 315936, "epoch": 1880} {"train_loss": -12.21865463256836, "global_step": 315937, "epoch": 1880} {"train_loss": -12.080238342285156, "global_step": 315938, "epoch": 1880} {"train_loss": -12.281416893005371, "global_step": 315939, "epoch": 1880} {"train_loss": -12.20218276977539, "global_step": 315940, "epoch": 1880} {"train_loss": -11.950329780578613, "global_step": 315941, "epoch": 1880} {"train_loss": -12.51910400390625, "global_step": 315942, "epoch": 1880} {"train_loss": -12.292123794555664, "global_step": 315943, "epoch": 1880} {"train_loss": -12.296445846557617, "global_step": 315944, "epoch": 1880} {"train_loss": -12.379449844360352, "global_step": 315945, "epoch": 1880} {"train_loss": -12.01106071472168, "global_step": 315946, "epoch": 1880} {"train_loss": -12.400494575500488, "global_step": 315947, "epoch": 1880} {"train_loss": -11.92652702331543, "global_step": 315948, "epoch": 1880} {"train_loss": -12.372919082641602, "global_step": 315949, "epoch": 1880} {"train_loss": -12.206855773925781, "global_step": 315950, "epoch": 1880} {"train_loss": -12.325037956237793, "global_step": 315951, "epoch": 1880} {"train_loss": -12.233819961547852, "global_step": 315952, "epoch": 1880} {"train_loss": -12.422627449035645, "global_step": 315953, "epoch": 1880} {"train_loss": -12.454710006713867, "global_step": 315954, "epoch": 1880} {"train_loss": -12.245161056518555, "global_step": 315955, "epoch": 1880} {"train_loss": -12.44908332824707, "global_step": 315956, "epoch": 1880} {"train_loss": -12.23800277709961, "global_step": 315957, "epoch": 1880} {"train_loss": -12.498346328735352, "global_step": 315958, "epoch": 1880} {"train_loss": -12.419698715209961, "global_step": 315959, "epoch": 1880} {"train_loss": -12.339534759521484, "global_step": 315960, "epoch": 1880} {"train_loss": -12.361004829406738, "global_step": 315961, "epoch": 1880} {"train_loss": -12.396949768066406, "global_step": 315962, "epoch": 1880} {"train_loss": -12.610398292541504, "global_step": 315963, "epoch": 1880} {"train_loss": -12.187267303466797, "global_step": 315964, "epoch": 1880} {"train_loss": -12.433247566223145, "global_step": 315965, "epoch": 1880} {"train_loss": -12.419522285461426, "global_step": 315966, "epoch": 1880} {"train_loss": -12.512992858886719, "global_step": 315967, "epoch": 1880} {"train_loss": -12.399345397949219, "global_step": 315968, "epoch": 1880} {"train_loss": -12.524985313415527, "global_step": 315969, "epoch": 1880} {"train_loss": -12.636147499084473, "global_step": 315970, "epoch": 1880} {"train_loss": -12.548111915588379, "global_step": 315971, "epoch": 1880} {"train_loss": -12.591804504394531, "global_step": 315972, "epoch": 1880} {"train_loss": -12.398576736450195, "global_step": 315973, "epoch": 1880} {"train_loss": -12.575366020202637, "global_step": 315974, "epoch": 1880} {"train_loss": -12.669363021850586, "global_step": 315975, "epoch": 1880} {"train_loss": -12.363202095031738, "global_step": 315976, "epoch": 1880} {"train_loss": -12.583035469055176, "global_step": 315977, "epoch": 1880} {"train_loss": -12.463516235351562, "global_step": 315978, "epoch": 1880} {"train_loss": -12.48836612701416, "global_step": 315979, "epoch": 1880} {"train_loss": -12.608721733093262, "global_step": 315980, "epoch": 1880} {"train_loss": -12.396976470947266, "global_step": 315981, "epoch": 1880} {"train_loss": -12.674306869506836, "global_step": 315982, "epoch": 1880} {"train_loss": -12.459869384765625, "global_step": 315983, "epoch": 1880} {"train_loss": -12.522146224975586, "global_step": 315984, "epoch": 1880} {"train_loss": -12.197582244873047, "global_step": 315985, "epoch": 1880} {"train_loss": -12.045991897583008, "global_step": 315986, "epoch": 1880} {"train_loss": -12.369915008544922, "global_step": 315987, "epoch": 1880} {"train_loss": -12.17570686340332, "global_step": 315988, "epoch": 1880} {"train_loss": -11.755422592163086, "global_step": 315989, "epoch": 1880} {"train_loss": -12.663318634033203, "global_step": 315990, "epoch": 1880} {"train_loss": -11.314027786254883, "global_step": 315991, "epoch": 1880} {"train_loss": -10.510860443115234, "global_step": 315992, "epoch": 1880} {"train_loss": -11.29764461517334, "global_step": 315993, "epoch": 1880} {"train_loss": -11.10979175567627, "global_step": 315994, "epoch": 1880} {"train_loss": -9.213370323181152, "global_step": 315995, "epoch": 1880} {"train_loss": -10.47372055053711, "global_step": 315996, "epoch": 1880} {"train_loss": -7.556090831756592, "global_step": 315997, "epoch": 1880} {"train_loss": -8.130046844482422, "global_step": 315998, "epoch": 1880} {"train_loss": -7.246561050415039, "global_step": 315999, "epoch": 1880} {"train_loss": -7.084501266479492, "global_step": 316000, "epoch": 1880} {"train_loss": -7.846312522888184, "global_step": 316001, "epoch": 1880} {"train_loss": -8.379472732543945, "global_step": 316002, "epoch": 1880} {"train_loss": -9.556316375732422, "global_step": 316003, "epoch": 1880} {"train_loss": -9.532644271850586, "global_step": 316004, "epoch": 1880} {"train_loss": -9.112765312194824, "global_step": 316005, "epoch": 1880} {"train_loss": -9.801628112792969, "global_step": 316006, "epoch": 1880} {"train_loss": -11.349159754457927, "global_step": 316007, "epoch": 1880, "val_loss": 280935.84375, "train_action_mse_error": 3.1379780769348145} {"train_loss": -9.209228515625, "global_step": 316008, "epoch": 1881} {"train_loss": -10.533854484558105, "global_step": 316009, "epoch": 1881} {"train_loss": -10.683757781982422, "global_step": 316010, "epoch": 1881} {"train_loss": -10.403898239135742, "global_step": 316011, "epoch": 1881} {"train_loss": -9.814899444580078, "global_step": 316012, "epoch": 1881} {"train_loss": -11.003875732421875, "global_step": 316013, "epoch": 1881} {"train_loss": -10.807607650756836, "global_step": 316014, "epoch": 1881} {"train_loss": -10.36921501159668, "global_step": 316015, "epoch": 1881} {"train_loss": -10.839435577392578, "global_step": 316016, "epoch": 1881} {"train_loss": -10.09408950805664, "global_step": 316017, "epoch": 1881} {"train_loss": -10.367942810058594, "global_step": 316018, "epoch": 1881} {"train_loss": -10.42544174194336, "global_step": 316019, "epoch": 1881} {"train_loss": -9.971935272216797, "global_step": 316020, "epoch": 1881} {"train_loss": -11.55817985534668, "global_step": 316021, "epoch": 1881} {"train_loss": -10.48042106628418, "global_step": 316022, "epoch": 1881} {"train_loss": -11.231172561645508, "global_step": 316023, "epoch": 1881} {"train_loss": -11.177175521850586, "global_step": 316024, "epoch": 1881} {"train_loss": -11.220535278320312, "global_step": 316025, "epoch": 1881} {"train_loss": -10.699945449829102, "global_step": 316026, "epoch": 1881} {"train_loss": -11.71796989440918, "global_step": 316027, "epoch": 1881} {"train_loss": -11.16433334350586, "global_step": 316028, "epoch": 1881} {"train_loss": -11.927526473999023, "global_step": 316029, "epoch": 1881} {"train_loss": -11.599533081054688, "global_step": 316030, "epoch": 1881} {"train_loss": -11.451919555664062, "global_step": 316031, "epoch": 1881} {"train_loss": -11.433051109313965, "global_step": 316032, "epoch": 1881} {"train_loss": -11.618749618530273, "global_step": 316033, "epoch": 1881} {"train_loss": -11.458808898925781, "global_step": 316034, "epoch": 1881} {"train_loss": -11.759321212768555, "global_step": 316035, "epoch": 1881} {"train_loss": -11.674222946166992, "global_step": 316036, "epoch": 1881} {"train_loss": -11.562875747680664, "global_step": 316037, "epoch": 1881} {"train_loss": -11.736642837524414, "global_step": 316038, "epoch": 1881} {"train_loss": -11.479875564575195, "global_step": 316039, "epoch": 1881} {"train_loss": -11.8865327835083, "global_step": 316040, "epoch": 1881} {"train_loss": -11.748401641845703, "global_step": 316041, "epoch": 1881} {"train_loss": -12.101374626159668, "global_step": 316042, "epoch": 1881} {"train_loss": -12.127676963806152, "global_step": 316043, "epoch": 1881} {"train_loss": -11.96080493927002, "global_step": 316044, "epoch": 1881} {"train_loss": -11.964958190917969, "global_step": 316045, "epoch": 1881} {"train_loss": -11.929695129394531, "global_step": 316046, "epoch": 1881} {"train_loss": -12.040657043457031, "global_step": 316047, "epoch": 1881} {"train_loss": -11.930402755737305, "global_step": 316048, "epoch": 1881} {"train_loss": -11.973150253295898, "global_step": 316049, "epoch": 1881} {"train_loss": -12.074234962463379, "global_step": 316050, "epoch": 1881} {"train_loss": -12.056641578674316, "global_step": 316051, "epoch": 1881} {"train_loss": -12.092750549316406, "global_step": 316052, "epoch": 1881} {"train_loss": -12.015432357788086, "global_step": 316053, "epoch": 1881} {"train_loss": -12.08825969696045, "global_step": 316054, "epoch": 1881} {"train_loss": -12.07915210723877, "global_step": 316055, "epoch": 1881} {"train_loss": -12.093664169311523, "global_step": 316056, "epoch": 1881} {"train_loss": -12.315938949584961, "global_step": 316057, "epoch": 1881} {"train_loss": -12.153695106506348, "global_step": 316058, "epoch": 1881} {"train_loss": -12.183455467224121, "global_step": 316059, "epoch": 1881} {"train_loss": -12.230491638183594, "global_step": 316060, "epoch": 1881} {"train_loss": -12.175918579101562, "global_step": 316061, "epoch": 1881} {"train_loss": -12.153942108154297, "global_step": 316062, "epoch": 1881} {"train_loss": -12.162018775939941, "global_step": 316063, "epoch": 1881} {"train_loss": -12.239235877990723, "global_step": 316064, "epoch": 1881} {"train_loss": -12.022624015808105, "global_step": 316065, "epoch": 1881} {"train_loss": -12.242053985595703, "global_step": 316066, "epoch": 1881} {"train_loss": -12.102155685424805, "global_step": 316067, "epoch": 1881} {"train_loss": -12.257420539855957, "global_step": 316068, "epoch": 1881} {"train_loss": -11.974288940429688, "global_step": 316069, "epoch": 1881} {"train_loss": -12.107478141784668, "global_step": 316070, "epoch": 1881} {"train_loss": -12.376497268676758, "global_step": 316071, "epoch": 1881} {"train_loss": -12.324180603027344, "global_step": 316072, "epoch": 1881} {"train_loss": -12.213597297668457, "global_step": 316073, "epoch": 1881} {"train_loss": -12.098880767822266, "global_step": 316074, "epoch": 1881} {"train_loss": -12.209699630737305, "global_step": 316075, "epoch": 1881} {"train_loss": -12.135647773742676, "global_step": 316076, "epoch": 1881} {"train_loss": -12.123394012451172, "global_step": 316077, "epoch": 1881} {"train_loss": -11.930354118347168, "global_step": 316078, "epoch": 1881} {"train_loss": -12.297466278076172, "global_step": 316079, "epoch": 1881} {"train_loss": -12.127325057983398, "global_step": 316080, "epoch": 1881} {"train_loss": -12.30183219909668, "global_step": 316081, "epoch": 1881} {"train_loss": -12.160308837890625, "global_step": 316082, "epoch": 1881} {"train_loss": -12.3640775680542, "global_step": 316083, "epoch": 1881} {"train_loss": -12.21921157836914, "global_step": 316084, "epoch": 1881} {"train_loss": -12.46217155456543, "global_step": 316085, "epoch": 1881} {"train_loss": -12.336843490600586, "global_step": 316086, "epoch": 1881} {"train_loss": -12.467535972595215, "global_step": 316087, "epoch": 1881} {"train_loss": -12.324972152709961, "global_step": 316088, "epoch": 1881} {"train_loss": -12.420618057250977, "global_step": 316089, "epoch": 1881} {"train_loss": -12.161250114440918, "global_step": 316090, "epoch": 1881} {"train_loss": -12.38949203491211, "global_step": 316091, "epoch": 1881} {"train_loss": -12.434030532836914, "global_step": 316092, "epoch": 1881} {"train_loss": -12.386993408203125, "global_step": 316093, "epoch": 1881} {"train_loss": -12.275396347045898, "global_step": 316094, "epoch": 1881} {"train_loss": -12.370426177978516, "global_step": 316095, "epoch": 1881} {"train_loss": -12.498580932617188, "global_step": 316096, "epoch": 1881} {"train_loss": -12.468860626220703, "global_step": 316097, "epoch": 1881} {"train_loss": -12.432973861694336, "global_step": 316098, "epoch": 1881} {"train_loss": -12.425787925720215, "global_step": 316099, "epoch": 1881} {"train_loss": -12.389493942260742, "global_step": 316100, "epoch": 1881} {"train_loss": -12.486330032348633, "global_step": 316101, "epoch": 1881} {"train_loss": -12.410881042480469, "global_step": 316102, "epoch": 1881} {"train_loss": -12.20001220703125, "global_step": 316103, "epoch": 1881} {"train_loss": -12.648368835449219, "global_step": 316104, "epoch": 1881} {"train_loss": -12.402302742004395, "global_step": 316105, "epoch": 1881} {"train_loss": -12.010514259338379, "global_step": 316106, "epoch": 1881} {"train_loss": -12.570576667785645, "global_step": 316107, "epoch": 1881} {"train_loss": -12.355911254882812, "global_step": 316108, "epoch": 1881} {"train_loss": -12.300296783447266, "global_step": 316109, "epoch": 1881} {"train_loss": -12.250137329101562, "global_step": 316110, "epoch": 1881} {"train_loss": -12.227874755859375, "global_step": 316111, "epoch": 1881} {"train_loss": -12.213122367858887, "global_step": 316112, "epoch": 1881} {"train_loss": -12.35197639465332, "global_step": 316113, "epoch": 1881} {"train_loss": -12.121639251708984, "global_step": 316114, "epoch": 1881} {"train_loss": -11.822526931762695, "global_step": 316115, "epoch": 1881} {"train_loss": -11.795873641967773, "global_step": 316116, "epoch": 1881} {"train_loss": -11.769113540649414, "global_step": 316117, "epoch": 1881} {"train_loss": -10.975610733032227, "global_step": 316118, "epoch": 1881} {"train_loss": -11.500652313232422, "global_step": 316119, "epoch": 1881} {"train_loss": -10.889839172363281, "global_step": 316120, "epoch": 1881} {"train_loss": -11.381991386413574, "global_step": 316121, "epoch": 1881} {"train_loss": -10.98088550567627, "global_step": 316122, "epoch": 1881} {"train_loss": -11.826592445373535, "global_step": 316123, "epoch": 1881} {"train_loss": -10.032268524169922, "global_step": 316124, "epoch": 1881} {"train_loss": -10.209172248840332, "global_step": 316125, "epoch": 1881} {"train_loss": -11.265342712402344, "global_step": 316126, "epoch": 1881} {"train_loss": -11.730656623840332, "global_step": 316127, "epoch": 1881} {"train_loss": -10.603267669677734, "global_step": 316128, "epoch": 1881} {"train_loss": -11.076908111572266, "global_step": 316129, "epoch": 1881} {"train_loss": -11.671343803405762, "global_step": 316130, "epoch": 1881} {"train_loss": -10.311031341552734, "global_step": 316131, "epoch": 1881} {"train_loss": -11.709884643554688, "global_step": 316132, "epoch": 1881} {"train_loss": -9.348857879638672, "global_step": 316133, "epoch": 1881} {"train_loss": -11.9501953125, "global_step": 316134, "epoch": 1881} {"train_loss": -10.574045181274414, "global_step": 316135, "epoch": 1881} {"train_loss": -10.586666107177734, "global_step": 316136, "epoch": 1881} {"train_loss": -11.714201927185059, "global_step": 316137, "epoch": 1881} {"train_loss": -10.329471588134766, "global_step": 316138, "epoch": 1881} {"train_loss": -11.919239044189453, "global_step": 316139, "epoch": 1881} {"train_loss": -11.051719665527344, "global_step": 316140, "epoch": 1881} {"train_loss": -11.69844913482666, "global_step": 316141, "epoch": 1881} {"train_loss": -11.628114700317383, "global_step": 316142, "epoch": 1881} {"train_loss": -11.058025360107422, "global_step": 316143, "epoch": 1881} {"train_loss": -12.04723834991455, "global_step": 316144, "epoch": 1881} {"train_loss": -11.262044906616211, "global_step": 316145, "epoch": 1881} {"train_loss": -12.132645606994629, "global_step": 316146, "epoch": 1881} {"train_loss": -11.699529647827148, "global_step": 316147, "epoch": 1881} {"train_loss": -11.87052059173584, "global_step": 316148, "epoch": 1881} {"train_loss": -11.455785751342773, "global_step": 316149, "epoch": 1881} {"train_loss": -11.767210006713867, "global_step": 316150, "epoch": 1881} {"train_loss": -11.929319381713867, "global_step": 316151, "epoch": 1881} {"train_loss": -11.51255989074707, "global_step": 316152, "epoch": 1881} {"train_loss": -12.003608703613281, "global_step": 316153, "epoch": 1881} {"train_loss": -11.380708694458008, "global_step": 316154, "epoch": 1881} {"train_loss": -11.832550048828125, "global_step": 316155, "epoch": 1881} {"train_loss": -11.353227615356445, "global_step": 316156, "epoch": 1881} {"train_loss": -11.396398544311523, "global_step": 316157, "epoch": 1881} {"train_loss": -11.897668838500977, "global_step": 316158, "epoch": 1881} {"train_loss": -11.788835525512695, "global_step": 316159, "epoch": 1881} {"train_loss": -11.836097717285156, "global_step": 316160, "epoch": 1881} {"train_loss": -11.944609642028809, "global_step": 316161, "epoch": 1881} {"train_loss": -12.21284294128418, "global_step": 316162, "epoch": 1881} {"train_loss": -11.869793891906738, "global_step": 316163, "epoch": 1881} {"train_loss": -12.126176834106445, "global_step": 316164, "epoch": 1881} {"train_loss": -11.770743370056152, "global_step": 316165, "epoch": 1881} {"train_loss": -12.268623352050781, "global_step": 316166, "epoch": 1881} {"train_loss": -11.70706558227539, "global_step": 316167, "epoch": 1881} {"train_loss": -11.721900939941406, "global_step": 316168, "epoch": 1881} {"train_loss": -12.051236152648926, "global_step": 316169, "epoch": 1881} {"train_loss": -11.920282363891602, "global_step": 316170, "epoch": 1881} {"train_loss": -12.132265090942383, "global_step": 316171, "epoch": 1881} {"train_loss": -11.884342193603516, "global_step": 316172, "epoch": 1881} {"train_loss": -12.253753662109375, "global_step": 316173, "epoch": 1881} {"train_loss": -11.89301872253418, "global_step": 316174, "epoch": 1881} {"train_loss": -11.726669805390495, "global_step": 316175, "epoch": 1881, "val_loss": 287002.34375} {"train_loss": -12.137880325317383, "global_step": 316176, "epoch": 1882} {"train_loss": -12.119632720947266, "global_step": 316177, "epoch": 1882} {"train_loss": -11.966099739074707, "global_step": 316178, "epoch": 1882} {"train_loss": -12.319818496704102, "global_step": 316179, "epoch": 1882} {"train_loss": -11.96312141418457, "global_step": 316180, "epoch": 1882} {"train_loss": -12.323183059692383, "global_step": 316181, "epoch": 1882} {"train_loss": -12.06231689453125, "global_step": 316182, "epoch": 1882} {"train_loss": -12.310888290405273, "global_step": 316183, "epoch": 1882} {"train_loss": -12.185504913330078, "global_step": 316184, "epoch": 1882} {"train_loss": -12.413843154907227, "global_step": 316185, "epoch": 1882} {"train_loss": -12.284712791442871, "global_step": 316186, "epoch": 1882} {"train_loss": -12.465888977050781, "global_step": 316187, "epoch": 1882} {"train_loss": -12.30210018157959, "global_step": 316188, "epoch": 1882} {"train_loss": -12.289580345153809, "global_step": 316189, "epoch": 1882} {"train_loss": -12.337114334106445, "global_step": 316190, "epoch": 1882} {"train_loss": -12.399177551269531, "global_step": 316191, "epoch": 1882} {"train_loss": -12.225614547729492, "global_step": 316192, "epoch": 1882} {"train_loss": -12.074377059936523, "global_step": 316193, "epoch": 1882} {"train_loss": -12.170635223388672, "global_step": 316194, "epoch": 1882} {"train_loss": -12.31910514831543, "global_step": 316195, "epoch": 1882} {"train_loss": -12.12313175201416, "global_step": 316196, "epoch": 1882} {"train_loss": -12.419078826904297, "global_step": 316197, "epoch": 1882} {"train_loss": -12.161413192749023, "global_step": 316198, "epoch": 1882} {"train_loss": -12.18062973022461, "global_step": 316199, "epoch": 1882} {"train_loss": -12.134252548217773, "global_step": 316200, "epoch": 1882} {"train_loss": -11.97933578491211, "global_step": 316201, "epoch": 1882} {"train_loss": -12.104957580566406, "global_step": 316202, "epoch": 1882} {"train_loss": -12.06954574584961, "global_step": 316203, "epoch": 1882} {"train_loss": -12.27251148223877, "global_step": 316204, "epoch": 1882} {"train_loss": -11.944601058959961, "global_step": 316205, "epoch": 1882} {"train_loss": -11.904806137084961, "global_step": 316206, "epoch": 1882} {"train_loss": -11.920408248901367, "global_step": 316207, "epoch": 1882} {"train_loss": -12.128084182739258, "global_step": 316208, "epoch": 1882} {"train_loss": -11.707925796508789, "global_step": 316209, "epoch": 1882} {"train_loss": -11.986993789672852, "global_step": 316210, "epoch": 1882} {"train_loss": -10.78431224822998, "global_step": 316211, "epoch": 1882} {"train_loss": -12.018280982971191, "global_step": 316212, "epoch": 1882} {"train_loss": -11.775022506713867, "global_step": 316213, "epoch": 1882} {"train_loss": -11.401039123535156, "global_step": 316214, "epoch": 1882} {"train_loss": -11.58242130279541, "global_step": 316215, "epoch": 1882} {"train_loss": -11.919743537902832, "global_step": 316216, "epoch": 1882} {"train_loss": -11.285781860351562, "global_step": 316217, "epoch": 1882} {"train_loss": -11.72210693359375, "global_step": 316218, "epoch": 1882} {"train_loss": -11.940651893615723, "global_step": 316219, "epoch": 1882} {"train_loss": -11.03006362915039, "global_step": 316220, "epoch": 1882} {"train_loss": -12.269932746887207, "global_step": 316221, "epoch": 1882} {"train_loss": -10.735403060913086, "global_step": 316222, "epoch": 1882} {"train_loss": -11.419561386108398, "global_step": 316223, "epoch": 1882} {"train_loss": -11.94091796875, "global_step": 316224, "epoch": 1882} {"train_loss": -11.132078170776367, "global_step": 316225, "epoch": 1882} {"train_loss": -11.983179092407227, "global_step": 316226, "epoch": 1882} {"train_loss": -11.266170501708984, "global_step": 316227, "epoch": 1882} {"train_loss": -11.723342895507812, "global_step": 316228, "epoch": 1882} {"train_loss": -11.95401382446289, "global_step": 316229, "epoch": 1882} {"train_loss": -11.007438659667969, "global_step": 316230, "epoch": 1882} {"train_loss": -12.094329833984375, "global_step": 316231, "epoch": 1882} {"train_loss": -11.255874633789062, "global_step": 316232, "epoch": 1882} {"train_loss": -12.022867202758789, "global_step": 316233, "epoch": 1882} {"train_loss": -11.689266204833984, "global_step": 316234, "epoch": 1882} {"train_loss": -10.6519136428833, "global_step": 316235, "epoch": 1882} {"train_loss": -11.874527931213379, "global_step": 316236, "epoch": 1882} {"train_loss": -11.451286315917969, "global_step": 316237, "epoch": 1882} {"train_loss": -11.797950744628906, "global_step": 316238, "epoch": 1882} {"train_loss": -11.704635620117188, "global_step": 316239, "epoch": 1882} {"train_loss": -11.589765548706055, "global_step": 316240, "epoch": 1882} {"train_loss": -11.21377944946289, "global_step": 316241, "epoch": 1882} {"train_loss": -11.86472225189209, "global_step": 316242, "epoch": 1882} {"train_loss": -11.235638618469238, "global_step": 316243, "epoch": 1882} {"train_loss": -11.031083106994629, "global_step": 316244, "epoch": 1882} {"train_loss": -10.695024490356445, "global_step": 316245, "epoch": 1882} {"train_loss": -10.539517402648926, "global_step": 316246, "epoch": 1882} {"train_loss": -10.734405517578125, "global_step": 316247, "epoch": 1882} {"train_loss": -10.763758659362793, "global_step": 316248, "epoch": 1882} {"train_loss": -10.802705764770508, "global_step": 316249, "epoch": 1882} {"train_loss": -10.674477577209473, "global_step": 316250, "epoch": 1882} {"train_loss": -9.95769214630127, "global_step": 316251, "epoch": 1882} {"train_loss": -10.923986434936523, "global_step": 316252, "epoch": 1882} {"train_loss": -9.285186767578125, "global_step": 316253, "epoch": 1882} {"train_loss": -10.50455093383789, "global_step": 316254, "epoch": 1882} {"train_loss": -10.057348251342773, "global_step": 316255, "epoch": 1882} {"train_loss": -9.739339828491211, "global_step": 316256, "epoch": 1882} {"train_loss": -9.898393630981445, "global_step": 316257, "epoch": 1882} {"train_loss": -9.927148818969727, "global_step": 316258, "epoch": 1882} {"train_loss": -8.764055252075195, "global_step": 316259, "epoch": 1882} {"train_loss": -8.10955810546875, "global_step": 316260, "epoch": 1882} {"train_loss": -10.20505142211914, "global_step": 316261, "epoch": 1882} {"train_loss": -11.288936614990234, "global_step": 316262, "epoch": 1882} {"train_loss": -9.746866226196289, "global_step": 316263, "epoch": 1882} {"train_loss": -9.566261291503906, "global_step": 316264, "epoch": 1882} {"train_loss": -11.128029823303223, "global_step": 316265, "epoch": 1882} {"train_loss": -10.088363647460938, "global_step": 316266, "epoch": 1882} {"train_loss": -10.036444664001465, "global_step": 316267, "epoch": 1882} {"train_loss": -10.460640907287598, "global_step": 316268, "epoch": 1882} {"train_loss": -10.276224136352539, "global_step": 316269, "epoch": 1882} {"train_loss": -11.079338073730469, "global_step": 316270, "epoch": 1882} {"train_loss": -10.816993713378906, "global_step": 316271, "epoch": 1882} {"train_loss": -10.900227546691895, "global_step": 316272, "epoch": 1882} {"train_loss": -10.751997947692871, "global_step": 316273, "epoch": 1882} {"train_loss": -11.385688781738281, "global_step": 316274, "epoch": 1882} {"train_loss": -10.97291374206543, "global_step": 316275, "epoch": 1882} {"train_loss": -11.452495574951172, "global_step": 316276, "epoch": 1882} {"train_loss": -10.991886138916016, "global_step": 316277, "epoch": 1882} {"train_loss": -11.3551607131958, "global_step": 316278, "epoch": 1882} {"train_loss": -11.42866039276123, "global_step": 316279, "epoch": 1882} {"train_loss": -11.01943588256836, "global_step": 316280, "epoch": 1882} {"train_loss": -11.104923248291016, "global_step": 316281, "epoch": 1882} {"train_loss": -11.612961769104004, "global_step": 316282, "epoch": 1882} {"train_loss": -10.971773147583008, "global_step": 316283, "epoch": 1882} {"train_loss": -11.331403732299805, "global_step": 316284, "epoch": 1882} {"train_loss": -11.683006286621094, "global_step": 316285, "epoch": 1882} {"train_loss": -10.844120025634766, "global_step": 316286, "epoch": 1882} {"train_loss": -11.68174934387207, "global_step": 316287, "epoch": 1882} {"train_loss": -11.262622833251953, "global_step": 316288, "epoch": 1882} {"train_loss": -10.841846466064453, "global_step": 316289, "epoch": 1882} {"train_loss": -11.546440124511719, "global_step": 316290, "epoch": 1882} {"train_loss": -11.797523498535156, "global_step": 316291, "epoch": 1882} {"train_loss": -11.489872932434082, "global_step": 316292, "epoch": 1882} {"train_loss": -11.940112113952637, "global_step": 316293, "epoch": 1882} {"train_loss": -11.750927925109863, "global_step": 316294, "epoch": 1882} {"train_loss": -11.657730102539062, "global_step": 316295, "epoch": 1882} {"train_loss": -11.800336837768555, "global_step": 316296, "epoch": 1882} {"train_loss": -11.83969497680664, "global_step": 316297, "epoch": 1882} {"train_loss": -11.866508483886719, "global_step": 316298, "epoch": 1882} {"train_loss": -11.920624732971191, "global_step": 316299, "epoch": 1882} {"train_loss": -11.612985610961914, "global_step": 316300, "epoch": 1882} {"train_loss": -11.13865852355957, "global_step": 316301, "epoch": 1882} {"train_loss": -12.027589797973633, "global_step": 316302, "epoch": 1882} {"train_loss": -11.827274322509766, "global_step": 316303, "epoch": 1882} {"train_loss": -11.827507972717285, "global_step": 316304, "epoch": 1882} {"train_loss": -12.098249435424805, "global_step": 316305, "epoch": 1882} {"train_loss": -12.005386352539062, "global_step": 316306, "epoch": 1882} {"train_loss": -12.021767616271973, "global_step": 316307, "epoch": 1882} {"train_loss": -12.115257263183594, "global_step": 316308, "epoch": 1882} {"train_loss": -11.857765197753906, "global_step": 316309, "epoch": 1882} {"train_loss": -12.175226211547852, "global_step": 316310, "epoch": 1882} {"train_loss": -11.986801147460938, "global_step": 316311, "epoch": 1882} {"train_loss": -12.07049560546875, "global_step": 316312, "epoch": 1882} {"train_loss": -12.246650695800781, "global_step": 316313, "epoch": 1882} {"train_loss": -12.10940170288086, "global_step": 316314, "epoch": 1882} {"train_loss": -12.120264053344727, "global_step": 316315, "epoch": 1882} {"train_loss": -12.070745468139648, "global_step": 316316, "epoch": 1882} {"train_loss": -12.25706958770752, "global_step": 316317, "epoch": 1882} {"train_loss": -11.98017692565918, "global_step": 316318, "epoch": 1882} {"train_loss": -12.237354278564453, "global_step": 316319, "epoch": 1882} {"train_loss": -12.047233581542969, "global_step": 316320, "epoch": 1882} {"train_loss": -12.18449592590332, "global_step": 316321, "epoch": 1882} {"train_loss": -12.242137908935547, "global_step": 316322, "epoch": 1882} {"train_loss": -12.264660835266113, "global_step": 316323, "epoch": 1882} {"train_loss": -12.148185729980469, "global_step": 316324, "epoch": 1882} {"train_loss": -12.220436096191406, "global_step": 316325, "epoch": 1882} {"train_loss": -12.19165325164795, "global_step": 316326, "epoch": 1882} {"train_loss": -12.298040390014648, "global_step": 316327, "epoch": 1882} {"train_loss": -11.971455574035645, "global_step": 316328, "epoch": 1882} {"train_loss": -12.140871047973633, "global_step": 316329, "epoch": 1882} {"train_loss": -12.208353042602539, "global_step": 316330, "epoch": 1882} {"train_loss": -12.32499885559082, "global_step": 316331, "epoch": 1882} {"train_loss": -12.224992752075195, "global_step": 316332, "epoch": 1882} {"train_loss": -12.281436920166016, "global_step": 316333, "epoch": 1882} {"train_loss": -12.224602699279785, "global_step": 316334, "epoch": 1882} {"train_loss": -12.398584365844727, "global_step": 316335, "epoch": 1882} {"train_loss": -12.379639625549316, "global_step": 316336, "epoch": 1882} {"train_loss": -12.32110595703125, "global_step": 316337, "epoch": 1882} {"train_loss": -12.409521102905273, "global_step": 316338, "epoch": 1882} {"train_loss": -12.339905738830566, "global_step": 316339, "epoch": 1882} {"train_loss": -12.251663208007812, "global_step": 316340, "epoch": 1882} {"train_loss": -12.50417709350586, "global_step": 316341, "epoch": 1882} {"train_loss": -12.465482711791992, "global_step": 316342, "epoch": 1882} {"train_loss": -11.593165874481201, "global_step": 316343, "epoch": 1882, "val_loss": 283116.78125} {"train_loss": -12.455010414123535, "global_step": 316344, "epoch": 1883} {"train_loss": -12.400392532348633, "global_step": 316345, "epoch": 1883} {"train_loss": -12.489594459533691, "global_step": 316346, "epoch": 1883} {"train_loss": -12.554546356201172, "global_step": 316347, "epoch": 1883} {"train_loss": -12.614686965942383, "global_step": 316348, "epoch": 1883} {"train_loss": -12.452251434326172, "global_step": 316349, "epoch": 1883} {"train_loss": -12.543766021728516, "global_step": 316350, "epoch": 1883} {"train_loss": -12.446483612060547, "global_step": 316351, "epoch": 1883} {"train_loss": -12.656702041625977, "global_step": 316352, "epoch": 1883} {"train_loss": -12.118439674377441, "global_step": 316353, "epoch": 1883} {"train_loss": -12.449403762817383, "global_step": 316354, "epoch": 1883} {"train_loss": -12.099297523498535, "global_step": 316355, "epoch": 1883} {"train_loss": -12.53062629699707, "global_step": 316356, "epoch": 1883} {"train_loss": -12.439926147460938, "global_step": 316357, "epoch": 1883} {"train_loss": -12.145638465881348, "global_step": 316358, "epoch": 1883} {"train_loss": -12.550755500793457, "global_step": 316359, "epoch": 1883} {"train_loss": -12.47848129272461, "global_step": 316360, "epoch": 1883} {"train_loss": -12.177207946777344, "global_step": 316361, "epoch": 1883} {"train_loss": -12.145299911499023, "global_step": 316362, "epoch": 1883} {"train_loss": -12.509821891784668, "global_step": 316363, "epoch": 1883} {"train_loss": -12.447305679321289, "global_step": 316364, "epoch": 1883} {"train_loss": -12.49925422668457, "global_step": 316365, "epoch": 1883} {"train_loss": -12.413101196289062, "global_step": 316366, "epoch": 1883} {"train_loss": -12.227832794189453, "global_step": 316367, "epoch": 1883} {"train_loss": -12.382412910461426, "global_step": 316368, "epoch": 1883} {"train_loss": -12.694765090942383, "global_step": 316369, "epoch": 1883} {"train_loss": -12.372049331665039, "global_step": 316370, "epoch": 1883} {"train_loss": -12.484637260437012, "global_step": 316371, "epoch": 1883} {"train_loss": -12.552730560302734, "global_step": 316372, "epoch": 1883} {"train_loss": -12.400044441223145, "global_step": 316373, "epoch": 1883} {"train_loss": -12.34400463104248, "global_step": 316374, "epoch": 1883} {"train_loss": -12.644586563110352, "global_step": 316375, "epoch": 1883} {"train_loss": -12.38882827758789, "global_step": 316376, "epoch": 1883} {"train_loss": -12.671716690063477, "global_step": 316377, "epoch": 1883} {"train_loss": -12.39498519897461, "global_step": 316378, "epoch": 1883} {"train_loss": -12.377248764038086, "global_step": 316379, "epoch": 1883} {"train_loss": -12.27047348022461, "global_step": 316380, "epoch": 1883} {"train_loss": -12.356514930725098, "global_step": 316381, "epoch": 1883} {"train_loss": -12.180074691772461, "global_step": 316382, "epoch": 1883} {"train_loss": -12.414522171020508, "global_step": 316383, "epoch": 1883} {"train_loss": -12.046850204467773, "global_step": 316384, "epoch": 1883} {"train_loss": -11.234136581420898, "global_step": 316385, "epoch": 1883} {"train_loss": -11.971460342407227, "global_step": 316386, "epoch": 1883} {"train_loss": -12.080853462219238, "global_step": 316387, "epoch": 1883} {"train_loss": -11.661310195922852, "global_step": 316388, "epoch": 1883} {"train_loss": -11.628177642822266, "global_step": 316389, "epoch": 1883} {"train_loss": -11.517478942871094, "global_step": 316390, "epoch": 1883} {"train_loss": -12.50791072845459, "global_step": 316391, "epoch": 1883} {"train_loss": -11.937795639038086, "global_step": 316392, "epoch": 1883} {"train_loss": -11.105155944824219, "global_step": 316393, "epoch": 1883} {"train_loss": -12.102009773254395, "global_step": 316394, "epoch": 1883} {"train_loss": -11.756589889526367, "global_step": 316395, "epoch": 1883} {"train_loss": -10.464897155761719, "global_step": 316396, "epoch": 1883} {"train_loss": -12.060342788696289, "global_step": 316397, "epoch": 1883} {"train_loss": -11.712141990661621, "global_step": 316398, "epoch": 1883} {"train_loss": -10.907991409301758, "global_step": 316399, "epoch": 1883} {"train_loss": -11.312193870544434, "global_step": 316400, "epoch": 1883} {"train_loss": -11.05067253112793, "global_step": 316401, "epoch": 1883} {"train_loss": -10.607160568237305, "global_step": 316402, "epoch": 1883} {"train_loss": -10.75655746459961, "global_step": 316403, "epoch": 1883} {"train_loss": -11.810270309448242, "global_step": 316404, "epoch": 1883} {"train_loss": -10.622584342956543, "global_step": 316405, "epoch": 1883} {"train_loss": -11.885278701782227, "global_step": 316406, "epoch": 1883} {"train_loss": -11.204689025878906, "global_step": 316407, "epoch": 1883} {"train_loss": -12.146851539611816, "global_step": 316408, "epoch": 1883} {"train_loss": -11.567341804504395, "global_step": 316409, "epoch": 1883} {"train_loss": -11.547840118408203, "global_step": 316410, "epoch": 1883} {"train_loss": -11.501537322998047, "global_step": 316411, "epoch": 1883} {"train_loss": -11.648527145385742, "global_step": 316412, "epoch": 1883} {"train_loss": -11.648884773254395, "global_step": 316413, "epoch": 1883} {"train_loss": -12.13490104675293, "global_step": 316414, "epoch": 1883} {"train_loss": -11.198511123657227, "global_step": 316415, "epoch": 1883} {"train_loss": -11.795162200927734, "global_step": 316416, "epoch": 1883} {"train_loss": -11.363975524902344, "global_step": 316417, "epoch": 1883} {"train_loss": -11.38089370727539, "global_step": 316418, "epoch": 1883} {"train_loss": -11.604904174804688, "global_step": 316419, "epoch": 1883} {"train_loss": -10.017118453979492, "global_step": 316420, "epoch": 1883} {"train_loss": -11.793655395507812, "global_step": 316421, "epoch": 1883} {"train_loss": -9.729747772216797, "global_step": 316422, "epoch": 1883} {"train_loss": -11.845900535583496, "global_step": 316423, "epoch": 1883} {"train_loss": -9.980833053588867, "global_step": 316424, "epoch": 1883} {"train_loss": -11.352283477783203, "global_step": 316425, "epoch": 1883} {"train_loss": -11.11014175415039, "global_step": 316426, "epoch": 1883} {"train_loss": -10.774822235107422, "global_step": 316427, "epoch": 1883} {"train_loss": -11.282381057739258, "global_step": 316428, "epoch": 1883} {"train_loss": -11.431683540344238, "global_step": 316429, "epoch": 1883} {"train_loss": -11.711200714111328, "global_step": 316430, "epoch": 1883} {"train_loss": -11.18923282623291, "global_step": 316431, "epoch": 1883} {"train_loss": -11.390665054321289, "global_step": 316432, "epoch": 1883} {"train_loss": -11.89346694946289, "global_step": 316433, "epoch": 1883} {"train_loss": -10.937705993652344, "global_step": 316434, "epoch": 1883} {"train_loss": -12.185153007507324, "global_step": 316435, "epoch": 1883} {"train_loss": -10.469629287719727, "global_step": 316436, "epoch": 1883} {"train_loss": -11.684520721435547, "global_step": 316437, "epoch": 1883} {"train_loss": -11.111556053161621, "global_step": 316438, "epoch": 1883} {"train_loss": -10.798823356628418, "global_step": 316439, "epoch": 1883} {"train_loss": -11.931005477905273, "global_step": 316440, "epoch": 1883} {"train_loss": -10.42432975769043, "global_step": 316441, "epoch": 1883} {"train_loss": -11.529077529907227, "global_step": 316442, "epoch": 1883} {"train_loss": -11.229454040527344, "global_step": 316443, "epoch": 1883} {"train_loss": -10.649194717407227, "global_step": 316444, "epoch": 1883} {"train_loss": -11.3961181640625, "global_step": 316445, "epoch": 1883} {"train_loss": -10.84984016418457, "global_step": 316446, "epoch": 1883} {"train_loss": -11.269573211669922, "global_step": 316447, "epoch": 1883} {"train_loss": -11.16312026977539, "global_step": 316448, "epoch": 1883} {"train_loss": -9.73028564453125, "global_step": 316449, "epoch": 1883} {"train_loss": -10.645682334899902, "global_step": 316450, "epoch": 1883} {"train_loss": -11.046440124511719, "global_step": 316451, "epoch": 1883} {"train_loss": -10.868934631347656, "global_step": 316452, "epoch": 1883} {"train_loss": -11.068552017211914, "global_step": 316453, "epoch": 1883} {"train_loss": -11.558826446533203, "global_step": 316454, "epoch": 1883} {"train_loss": -10.399258613586426, "global_step": 316455, "epoch": 1883} {"train_loss": -11.602531433105469, "global_step": 316456, "epoch": 1883} {"train_loss": -11.354025840759277, "global_step": 316457, "epoch": 1883} {"train_loss": -11.271888732910156, "global_step": 316458, "epoch": 1883} {"train_loss": -11.932952880859375, "global_step": 316459, "epoch": 1883} {"train_loss": -11.316317558288574, "global_step": 316460, "epoch": 1883} {"train_loss": -11.785762786865234, "global_step": 316461, "epoch": 1883} {"train_loss": -11.862667083740234, "global_step": 316462, "epoch": 1883} {"train_loss": -11.496740341186523, "global_step": 316463, "epoch": 1883} {"train_loss": -11.857595443725586, "global_step": 316464, "epoch": 1883} {"train_loss": -11.796318054199219, "global_step": 316465, "epoch": 1883} {"train_loss": -11.600503921508789, "global_step": 316466, "epoch": 1883} {"train_loss": -11.995877265930176, "global_step": 316467, "epoch": 1883} {"train_loss": -11.63172721862793, "global_step": 316468, "epoch": 1883} {"train_loss": -11.77071762084961, "global_step": 316469, "epoch": 1883} {"train_loss": -11.536232948303223, "global_step": 316470, "epoch": 1883} {"train_loss": -11.524908065795898, "global_step": 316471, "epoch": 1883} {"train_loss": -11.951640129089355, "global_step": 316472, "epoch": 1883} {"train_loss": -11.621315956115723, "global_step": 316473, "epoch": 1883} {"train_loss": -11.977216720581055, "global_step": 316474, "epoch": 1883} {"train_loss": -11.648157119750977, "global_step": 316475, "epoch": 1883} {"train_loss": -11.84158992767334, "global_step": 316476, "epoch": 1883} {"train_loss": -11.554497718811035, "global_step": 316477, "epoch": 1883} {"train_loss": -11.790907859802246, "global_step": 316478, "epoch": 1883} {"train_loss": -11.905399322509766, "global_step": 316479, "epoch": 1883} {"train_loss": -11.984014511108398, "global_step": 316480, "epoch": 1883} {"train_loss": -11.93729019165039, "global_step": 316481, "epoch": 1883} {"train_loss": -12.03888988494873, "global_step": 316482, "epoch": 1883} {"train_loss": -12.003414154052734, "global_step": 316483, "epoch": 1883} {"train_loss": -11.807759284973145, "global_step": 316484, "epoch": 1883} {"train_loss": -12.017301559448242, "global_step": 316485, "epoch": 1883} {"train_loss": -12.02664566040039, "global_step": 316486, "epoch": 1883} {"train_loss": -12.03603458404541, "global_step": 316487, "epoch": 1883} {"train_loss": -11.870813369750977, "global_step": 316488, "epoch": 1883} {"train_loss": -12.128355026245117, "global_step": 316489, "epoch": 1883} {"train_loss": -11.889381408691406, "global_step": 316490, "epoch": 1883} {"train_loss": -12.221726417541504, "global_step": 316491, "epoch": 1883} {"train_loss": -11.842073440551758, "global_step": 316492, "epoch": 1883} {"train_loss": -12.013359069824219, "global_step": 316493, "epoch": 1883} {"train_loss": -12.14560317993164, "global_step": 316494, "epoch": 1883} {"train_loss": -12.102884292602539, "global_step": 316495, "epoch": 1883} {"train_loss": -12.272245407104492, "global_step": 316496, "epoch": 1883} {"train_loss": -12.003273963928223, "global_step": 316497, "epoch": 1883} {"train_loss": -12.366140365600586, "global_step": 316498, "epoch": 1883} {"train_loss": -12.067508697509766, "global_step": 316499, "epoch": 1883} {"train_loss": -12.033242225646973, "global_step": 316500, "epoch": 1883} {"train_loss": -12.461420059204102, "global_step": 316501, "epoch": 1883} {"train_loss": -12.402997970581055, "global_step": 316502, "epoch": 1883} {"train_loss": -12.285143852233887, "global_step": 316503, "epoch": 1883} {"train_loss": -12.326061248779297, "global_step": 316504, "epoch": 1883} {"train_loss": -12.240355491638184, "global_step": 316505, "epoch": 1883} {"train_loss": -12.316648483276367, "global_step": 316506, "epoch": 1883} {"train_loss": -12.280214309692383, "global_step": 316507, "epoch": 1883} {"train_loss": -12.160171508789062, "global_step": 316508, "epoch": 1883} {"train_loss": -12.12801456451416, "global_step": 316509, "epoch": 1883} {"train_loss": -12.117985725402832, "global_step": 316510, "epoch": 1883} {"train_loss": -11.779211912836347, "global_step": 316511, "epoch": 1883, "val_loss": 286553.5625} {"train_loss": -12.50434684753418, "global_step": 316512, "epoch": 1884} {"train_loss": -12.262962341308594, "global_step": 316513, "epoch": 1884} {"train_loss": -12.573369026184082, "global_step": 316514, "epoch": 1884} {"train_loss": -12.386407852172852, "global_step": 316515, "epoch": 1884} {"train_loss": -11.871467590332031, "global_step": 316516, "epoch": 1884} {"train_loss": -12.420265197753906, "global_step": 316517, "epoch": 1884} {"train_loss": -12.221653938293457, "global_step": 316518, "epoch": 1884} {"train_loss": -12.245887756347656, "global_step": 316519, "epoch": 1884} {"train_loss": -12.316478729248047, "global_step": 316520, "epoch": 1884} {"train_loss": -12.148666381835938, "global_step": 316521, "epoch": 1884} {"train_loss": -12.250040054321289, "global_step": 316522, "epoch": 1884} {"train_loss": -11.889440536499023, "global_step": 316523, "epoch": 1884} {"train_loss": -12.201375961303711, "global_step": 316524, "epoch": 1884} {"train_loss": -12.238390922546387, "global_step": 316525, "epoch": 1884} {"train_loss": -11.452800750732422, "global_step": 316526, "epoch": 1884} {"train_loss": -11.24447250366211, "global_step": 316527, "epoch": 1884} {"train_loss": -11.861743927001953, "global_step": 316528, "epoch": 1884} {"train_loss": -11.711923599243164, "global_step": 316529, "epoch": 1884} {"train_loss": -11.214905738830566, "global_step": 316530, "epoch": 1884} {"train_loss": -11.780391693115234, "global_step": 316531, "epoch": 1884} {"train_loss": -11.78931999206543, "global_step": 316532, "epoch": 1884} {"train_loss": -9.702812194824219, "global_step": 316533, "epoch": 1884} {"train_loss": -11.428010940551758, "global_step": 316534, "epoch": 1884} {"train_loss": -10.241886138916016, "global_step": 316535, "epoch": 1884} {"train_loss": -10.162296295166016, "global_step": 316536, "epoch": 1884} {"train_loss": -10.791648864746094, "global_step": 316537, "epoch": 1884} {"train_loss": -9.237560272216797, "global_step": 316538, "epoch": 1884} {"train_loss": -9.333531379699707, "global_step": 316539, "epoch": 1884} {"train_loss": -8.502711296081543, "global_step": 316540, "epoch": 1884} {"train_loss": -8.56903076171875, "global_step": 316541, "epoch": 1884} {"train_loss": -11.47153091430664, "global_step": 316542, "epoch": 1884} {"train_loss": -8.632867813110352, "global_step": 316543, "epoch": 1884} {"train_loss": -10.177199363708496, "global_step": 316544, "epoch": 1884} {"train_loss": -10.547393798828125, "global_step": 316545, "epoch": 1884} {"train_loss": -10.490152359008789, "global_step": 316546, "epoch": 1884} {"train_loss": -10.76706314086914, "global_step": 316547, "epoch": 1884} {"train_loss": -11.44564437866211, "global_step": 316548, "epoch": 1884} {"train_loss": -10.949505805969238, "global_step": 316549, "epoch": 1884} {"train_loss": -11.190850257873535, "global_step": 316550, "epoch": 1884} {"train_loss": -11.50932502746582, "global_step": 316551, "epoch": 1884} {"train_loss": -11.19281005859375, "global_step": 316552, "epoch": 1884} {"train_loss": -11.700643539428711, "global_step": 316553, "epoch": 1884} {"train_loss": -11.745621681213379, "global_step": 316554, "epoch": 1884} {"train_loss": -11.39730167388916, "global_step": 316555, "epoch": 1884} {"train_loss": -11.437188148498535, "global_step": 316556, "epoch": 1884} {"train_loss": -11.849424362182617, "global_step": 316557, "epoch": 1884} {"train_loss": -11.661739349365234, "global_step": 316558, "epoch": 1884} {"train_loss": -11.523971557617188, "global_step": 316559, "epoch": 1884} {"train_loss": -11.93116569519043, "global_step": 316560, "epoch": 1884} {"train_loss": -11.838484764099121, "global_step": 316561, "epoch": 1884} {"train_loss": -11.929361343383789, "global_step": 316562, "epoch": 1884} {"train_loss": -11.750682830810547, "global_step": 316563, "epoch": 1884} {"train_loss": -11.836441993713379, "global_step": 316564, "epoch": 1884} {"train_loss": -11.691983222961426, "global_step": 316565, "epoch": 1884} {"train_loss": -12.126995086669922, "global_step": 316566, "epoch": 1884} {"train_loss": -11.818883895874023, "global_step": 316567, "epoch": 1884} {"train_loss": -12.218923568725586, "global_step": 316568, "epoch": 1884} {"train_loss": -11.635398864746094, "global_step": 316569, "epoch": 1884} {"train_loss": -12.27911376953125, "global_step": 316570, "epoch": 1884} {"train_loss": -11.85285758972168, "global_step": 316571, "epoch": 1884} {"train_loss": -12.230563163757324, "global_step": 316572, "epoch": 1884} {"train_loss": -12.049659729003906, "global_step": 316573, "epoch": 1884} {"train_loss": -12.179054260253906, "global_step": 316574, "epoch": 1884} {"train_loss": -12.13818645477295, "global_step": 316575, "epoch": 1884} {"train_loss": -12.18664264678955, "global_step": 316576, "epoch": 1884} {"train_loss": -12.28365707397461, "global_step": 316577, "epoch": 1884} {"train_loss": -12.234781265258789, "global_step": 316578, "epoch": 1884} {"train_loss": -12.170181274414062, "global_step": 316579, "epoch": 1884} {"train_loss": -12.293131828308105, "global_step": 316580, "epoch": 1884} {"train_loss": -12.16832160949707, "global_step": 316581, "epoch": 1884} {"train_loss": -12.4336519241333, "global_step": 316582, "epoch": 1884} {"train_loss": -12.19360637664795, "global_step": 316583, "epoch": 1884} {"train_loss": -12.192777633666992, "global_step": 316584, "epoch": 1884} {"train_loss": -12.247615814208984, "global_step": 316585, "epoch": 1884} {"train_loss": -12.245322227478027, "global_step": 316586, "epoch": 1884} {"train_loss": -12.312240600585938, "global_step": 316587, "epoch": 1884} {"train_loss": -12.248088836669922, "global_step": 316588, "epoch": 1884} {"train_loss": -12.144752502441406, "global_step": 316589, "epoch": 1884} {"train_loss": -12.385075569152832, "global_step": 316590, "epoch": 1884} {"train_loss": -12.244522094726562, "global_step": 316591, "epoch": 1884} {"train_loss": -12.312837600708008, "global_step": 316592, "epoch": 1884} {"train_loss": -12.283576965332031, "global_step": 316593, "epoch": 1884} {"train_loss": -12.377253532409668, "global_step": 316594, "epoch": 1884} {"train_loss": -12.194765090942383, "global_step": 316595, "epoch": 1884} {"train_loss": -11.935396194458008, "global_step": 316596, "epoch": 1884} {"train_loss": -12.155189514160156, "global_step": 316597, "epoch": 1884} {"train_loss": -12.01010513305664, "global_step": 316598, "epoch": 1884} {"train_loss": -12.086706161499023, "global_step": 316599, "epoch": 1884} {"train_loss": -12.182711601257324, "global_step": 316600, "epoch": 1884} {"train_loss": -12.153902053833008, "global_step": 316601, "epoch": 1884} {"train_loss": -12.108302116394043, "global_step": 316602, "epoch": 1884} {"train_loss": -11.778292655944824, "global_step": 316603, "epoch": 1884} {"train_loss": -11.69042682647705, "global_step": 316604, "epoch": 1884} {"train_loss": -11.34616470336914, "global_step": 316605, "epoch": 1884} {"train_loss": -12.098840713500977, "global_step": 316606, "epoch": 1884} {"train_loss": -12.323328018188477, "global_step": 316607, "epoch": 1884} {"train_loss": -11.727643013000488, "global_step": 316608, "epoch": 1884} {"train_loss": -11.969688415527344, "global_step": 316609, "epoch": 1884} {"train_loss": -12.24052619934082, "global_step": 316610, "epoch": 1884} {"train_loss": -11.963608741760254, "global_step": 316611, "epoch": 1884} {"train_loss": -12.155177116394043, "global_step": 316612, "epoch": 1884} {"train_loss": -11.910107612609863, "global_step": 316613, "epoch": 1884} {"train_loss": -12.177894592285156, "global_step": 316614, "epoch": 1884} {"train_loss": -11.941253662109375, "global_step": 316615, "epoch": 1884} {"train_loss": -11.998649597167969, "global_step": 316616, "epoch": 1884} {"train_loss": -12.380287170410156, "global_step": 316617, "epoch": 1884} {"train_loss": -12.159614562988281, "global_step": 316618, "epoch": 1884} {"train_loss": -12.49336051940918, "global_step": 316619, "epoch": 1884} {"train_loss": -12.223211288452148, "global_step": 316620, "epoch": 1884} {"train_loss": -11.747360229492188, "global_step": 316621, "epoch": 1884} {"train_loss": -12.134281158447266, "global_step": 316622, "epoch": 1884} {"train_loss": -11.82430648803711, "global_step": 316623, "epoch": 1884} {"train_loss": -12.340339660644531, "global_step": 316624, "epoch": 1884} {"train_loss": -11.953241348266602, "global_step": 316625, "epoch": 1884} {"train_loss": -11.807159423828125, "global_step": 316626, "epoch": 1884} {"train_loss": -12.272422790527344, "global_step": 316627, "epoch": 1884} {"train_loss": -11.856817245483398, "global_step": 316628, "epoch": 1884} {"train_loss": -11.74071979522705, "global_step": 316629, "epoch": 1884} {"train_loss": -11.870452880859375, "global_step": 316630, "epoch": 1884} {"train_loss": -11.594891548156738, "global_step": 316631, "epoch": 1884} {"train_loss": -12.098944664001465, "global_step": 316632, "epoch": 1884} {"train_loss": -11.078653335571289, "global_step": 316633, "epoch": 1884} {"train_loss": -11.593252182006836, "global_step": 316634, "epoch": 1884} {"train_loss": -12.366464614868164, "global_step": 316635, "epoch": 1884} {"train_loss": -11.371938705444336, "global_step": 316636, "epoch": 1884} {"train_loss": -12.078502655029297, "global_step": 316637, "epoch": 1884} {"train_loss": -12.048347473144531, "global_step": 316638, "epoch": 1884} {"train_loss": -11.843342781066895, "global_step": 316639, "epoch": 1884} {"train_loss": -12.314460754394531, "global_step": 316640, "epoch": 1884} {"train_loss": -11.78312873840332, "global_step": 316641, "epoch": 1884} {"train_loss": -11.70762825012207, "global_step": 316642, "epoch": 1884} {"train_loss": -11.933650970458984, "global_step": 316643, "epoch": 1884} {"train_loss": -11.722379684448242, "global_step": 316644, "epoch": 1884} {"train_loss": -12.436467170715332, "global_step": 316645, "epoch": 1884} {"train_loss": -11.847347259521484, "global_step": 316646, "epoch": 1884} {"train_loss": -12.088653564453125, "global_step": 316647, "epoch": 1884} {"train_loss": -11.847951889038086, "global_step": 316648, "epoch": 1884} {"train_loss": -11.97736644744873, "global_step": 316649, "epoch": 1884} {"train_loss": -12.529111862182617, "global_step": 316650, "epoch": 1884} {"train_loss": -11.993195533752441, "global_step": 316651, "epoch": 1884} {"train_loss": -12.428987503051758, "global_step": 316652, "epoch": 1884} {"train_loss": -11.85822868347168, "global_step": 316653, "epoch": 1884} {"train_loss": -12.19783878326416, "global_step": 316654, "epoch": 1884} {"train_loss": -11.793865203857422, "global_step": 316655, "epoch": 1884} {"train_loss": -12.17818546295166, "global_step": 316656, "epoch": 1884} {"train_loss": -12.094602584838867, "global_step": 316657, "epoch": 1884} {"train_loss": -12.349974632263184, "global_step": 316658, "epoch": 1884} {"train_loss": -11.98613452911377, "global_step": 316659, "epoch": 1884} {"train_loss": -12.136801719665527, "global_step": 316660, "epoch": 1884} {"train_loss": -12.188108444213867, "global_step": 316661, "epoch": 1884} {"train_loss": -12.173973083496094, "global_step": 316662, "epoch": 1884} {"train_loss": -12.156338691711426, "global_step": 316663, "epoch": 1884} {"train_loss": -11.659110069274902, "global_step": 316664, "epoch": 1884} {"train_loss": -12.265673637390137, "global_step": 316665, "epoch": 1884} {"train_loss": -11.888477325439453, "global_step": 316666, "epoch": 1884} {"train_loss": -12.027668952941895, "global_step": 316667, "epoch": 1884} {"train_loss": -12.272311210632324, "global_step": 316668, "epoch": 1884} {"train_loss": -11.683736801147461, "global_step": 316669, "epoch": 1884} {"train_loss": -12.237541198730469, "global_step": 316670, "epoch": 1884} {"train_loss": -11.604169845581055, "global_step": 316671, "epoch": 1884} {"train_loss": -11.729918479919434, "global_step": 316672, "epoch": 1884} {"train_loss": -12.290647506713867, "global_step": 316673, "epoch": 1884} {"train_loss": -11.65113353729248, "global_step": 316674, "epoch": 1884} {"train_loss": -12.266892433166504, "global_step": 316675, "epoch": 1884} {"train_loss": -11.961164474487305, "global_step": 316676, "epoch": 1884} {"train_loss": -12.007312774658203, "global_step": 316677, "epoch": 1884} {"train_loss": -11.882364273071289, "global_step": 316678, "epoch": 1884} {"train_loss": -11.816805039133344, "global_step": 316679, "epoch": 1884, "val_loss": 287311.1875} {"train_loss": -11.389076232910156, "global_step": 316680, "epoch": 1885} {"train_loss": -12.141206741333008, "global_step": 316681, "epoch": 1885} {"train_loss": -11.359098434448242, "global_step": 316682, "epoch": 1885} {"train_loss": -11.679045677185059, "global_step": 316683, "epoch": 1885} {"train_loss": -12.214011192321777, "global_step": 316684, "epoch": 1885} {"train_loss": -11.466474533081055, "global_step": 316685, "epoch": 1885} {"train_loss": -12.186593055725098, "global_step": 316686, "epoch": 1885} {"train_loss": -11.379022598266602, "global_step": 316687, "epoch": 1885} {"train_loss": -12.28204345703125, "global_step": 316688, "epoch": 1885} {"train_loss": -11.405988693237305, "global_step": 316689, "epoch": 1885} {"train_loss": -11.959653854370117, "global_step": 316690, "epoch": 1885} {"train_loss": -11.763290405273438, "global_step": 316691, "epoch": 1885} {"train_loss": -12.363889694213867, "global_step": 316692, "epoch": 1885} {"train_loss": -11.983782768249512, "global_step": 316693, "epoch": 1885} {"train_loss": -12.500859260559082, "global_step": 316694, "epoch": 1885} {"train_loss": -11.665548324584961, "global_step": 316695, "epoch": 1885} {"train_loss": -12.041277885437012, "global_step": 316696, "epoch": 1885} {"train_loss": -11.865058898925781, "global_step": 316697, "epoch": 1885} {"train_loss": -12.11783218383789, "global_step": 316698, "epoch": 1885} {"train_loss": -11.76439094543457, "global_step": 316699, "epoch": 1885} {"train_loss": -12.164236068725586, "global_step": 316700, "epoch": 1885} {"train_loss": -11.721064567565918, "global_step": 316701, "epoch": 1885} {"train_loss": -11.957347869873047, "global_step": 316702, "epoch": 1885} {"train_loss": -11.975839614868164, "global_step": 316703, "epoch": 1885} {"train_loss": -12.061969757080078, "global_step": 316704, "epoch": 1885} {"train_loss": -12.460529327392578, "global_step": 316705, "epoch": 1885} {"train_loss": -12.346839904785156, "global_step": 316706, "epoch": 1885} {"train_loss": -12.177680969238281, "global_step": 316707, "epoch": 1885} {"train_loss": -12.247407913208008, "global_step": 316708, "epoch": 1885} {"train_loss": -12.075023651123047, "global_step": 316709, "epoch": 1885} {"train_loss": -12.38392448425293, "global_step": 316710, "epoch": 1885} {"train_loss": -12.262750625610352, "global_step": 316711, "epoch": 1885} {"train_loss": -12.438194274902344, "global_step": 316712, "epoch": 1885} {"train_loss": -12.359086990356445, "global_step": 316713, "epoch": 1885} {"train_loss": -12.339935302734375, "global_step": 316714, "epoch": 1885} {"train_loss": -12.16295337677002, "global_step": 316715, "epoch": 1885} {"train_loss": -12.14541244506836, "global_step": 316716, "epoch": 1885} {"train_loss": -12.364372253417969, "global_step": 316717, "epoch": 1885} {"train_loss": -12.34134292602539, "global_step": 316718, "epoch": 1885} {"train_loss": -12.300975799560547, "global_step": 316719, "epoch": 1885} {"train_loss": -12.471668243408203, "global_step": 316720, "epoch": 1885} {"train_loss": -12.447403907775879, "global_step": 316721, "epoch": 1885} {"train_loss": -12.35250186920166, "global_step": 316722, "epoch": 1885} {"train_loss": -12.547767639160156, "global_step": 316723, "epoch": 1885} {"train_loss": -12.338873863220215, "global_step": 316724, "epoch": 1885} {"train_loss": -12.00644302368164, "global_step": 316725, "epoch": 1885} {"train_loss": -11.989816665649414, "global_step": 316726, "epoch": 1885} {"train_loss": -12.178380012512207, "global_step": 316727, "epoch": 1885} {"train_loss": -11.662330627441406, "global_step": 316728, "epoch": 1885} {"train_loss": -10.433574676513672, "global_step": 316729, "epoch": 1885} {"train_loss": -11.217562675476074, "global_step": 316730, "epoch": 1885} {"train_loss": -12.112833023071289, "global_step": 316731, "epoch": 1885} {"train_loss": -11.676301002502441, "global_step": 316732, "epoch": 1885} {"train_loss": -12.14532470703125, "global_step": 316733, "epoch": 1885} {"train_loss": -11.110252380371094, "global_step": 316734, "epoch": 1885} {"train_loss": -11.931878089904785, "global_step": 316735, "epoch": 1885} {"train_loss": -11.808364868164062, "global_step": 316736, "epoch": 1885} {"train_loss": -10.867910385131836, "global_step": 316737, "epoch": 1885} {"train_loss": -12.040026664733887, "global_step": 316738, "epoch": 1885} {"train_loss": -11.266075134277344, "global_step": 316739, "epoch": 1885} {"train_loss": -11.853229522705078, "global_step": 316740, "epoch": 1885} {"train_loss": -11.573094367980957, "global_step": 316741, "epoch": 1885} {"train_loss": -11.130195617675781, "global_step": 316742, "epoch": 1885} {"train_loss": -11.200080871582031, "global_step": 316743, "epoch": 1885} {"train_loss": -11.35367202758789, "global_step": 316744, "epoch": 1885} {"train_loss": -10.995321273803711, "global_step": 316745, "epoch": 1885} {"train_loss": -11.10798454284668, "global_step": 316746, "epoch": 1885} {"train_loss": -11.800678253173828, "global_step": 316747, "epoch": 1885} {"train_loss": -11.885332107543945, "global_step": 316748, "epoch": 1885} {"train_loss": -11.955039978027344, "global_step": 316749, "epoch": 1885} {"train_loss": -12.235122680664062, "global_step": 316750, "epoch": 1885} {"train_loss": -11.934038162231445, "global_step": 316751, "epoch": 1885} {"train_loss": -11.825881004333496, "global_step": 316752, "epoch": 1885} {"train_loss": -12.142036437988281, "global_step": 316753, "epoch": 1885} {"train_loss": -12.007589340209961, "global_step": 316754, "epoch": 1885} {"train_loss": -11.956551551818848, "global_step": 316755, "epoch": 1885} {"train_loss": -12.234880447387695, "global_step": 316756, "epoch": 1885} {"train_loss": -11.945783615112305, "global_step": 316757, "epoch": 1885} {"train_loss": -11.545309066772461, "global_step": 316758, "epoch": 1885} {"train_loss": -11.961442947387695, "global_step": 316759, "epoch": 1885} {"train_loss": -11.969705581665039, "global_step": 316760, "epoch": 1885} {"train_loss": -11.887893676757812, "global_step": 316761, "epoch": 1885} {"train_loss": -12.158164978027344, "global_step": 316762, "epoch": 1885} {"train_loss": -11.930376052856445, "global_step": 316763, "epoch": 1885} {"train_loss": -11.586854934692383, "global_step": 316764, "epoch": 1885} {"train_loss": -12.245176315307617, "global_step": 316765, "epoch": 1885} {"train_loss": -11.792670249938965, "global_step": 316766, "epoch": 1885} {"train_loss": -11.855657577514648, "global_step": 316767, "epoch": 1885} {"train_loss": -12.261194229125977, "global_step": 316768, "epoch": 1885} {"train_loss": -12.177739143371582, "global_step": 316769, "epoch": 1885} {"train_loss": -12.03973388671875, "global_step": 316770, "epoch": 1885} {"train_loss": -11.766866683959961, "global_step": 316771, "epoch": 1885} {"train_loss": -11.497896194458008, "global_step": 316772, "epoch": 1885} {"train_loss": -11.628955841064453, "global_step": 316773, "epoch": 1885} {"train_loss": -12.000994682312012, "global_step": 316774, "epoch": 1885} {"train_loss": -11.544313430786133, "global_step": 316775, "epoch": 1885} {"train_loss": -11.82361125946045, "global_step": 316776, "epoch": 1885} {"train_loss": -11.735820770263672, "global_step": 316777, "epoch": 1885} {"train_loss": -12.187527656555176, "global_step": 316778, "epoch": 1885} {"train_loss": -11.472479820251465, "global_step": 316779, "epoch": 1885} {"train_loss": -11.670047760009766, "global_step": 316780, "epoch": 1885} {"train_loss": -12.103300094604492, "global_step": 316781, "epoch": 1885} {"train_loss": -12.438276290893555, "global_step": 316782, "epoch": 1885} {"train_loss": -11.463083267211914, "global_step": 316783, "epoch": 1885} {"train_loss": -11.862249374389648, "global_step": 316784, "epoch": 1885} {"train_loss": -10.379464149475098, "global_step": 316785, "epoch": 1885} {"train_loss": -12.036521911621094, "global_step": 316786, "epoch": 1885} {"train_loss": -10.963333129882812, "global_step": 316787, "epoch": 1885} {"train_loss": -10.163662910461426, "global_step": 316788, "epoch": 1885} {"train_loss": -11.28342056274414, "global_step": 316789, "epoch": 1885} {"train_loss": -8.399871826171875, "global_step": 316790, "epoch": 1885} {"train_loss": -8.69415283203125, "global_step": 316791, "epoch": 1885} {"train_loss": -7.955180644989014, "global_step": 316792, "epoch": 1885} {"train_loss": -9.861153602600098, "global_step": 316793, "epoch": 1885} {"train_loss": -8.728391647338867, "global_step": 316794, "epoch": 1885} {"train_loss": -7.892171859741211, "global_step": 316795, "epoch": 1885} {"train_loss": -6.987593650817871, "global_step": 316796, "epoch": 1885} {"train_loss": -7.105422019958496, "global_step": 316797, "epoch": 1885} {"train_loss": -8.566377639770508, "global_step": 316798, "epoch": 1885} {"train_loss": -8.192755699157715, "global_step": 316799, "epoch": 1885} {"train_loss": -9.051728248596191, "global_step": 316800, "epoch": 1885} {"train_loss": -8.644025802612305, "global_step": 316801, "epoch": 1885} {"train_loss": -8.88082218170166, "global_step": 316802, "epoch": 1885} {"train_loss": -9.092031478881836, "global_step": 316803, "epoch": 1885} {"train_loss": -8.175424575805664, "global_step": 316804, "epoch": 1885} {"train_loss": -9.412155151367188, "global_step": 316805, "epoch": 1885} {"train_loss": -9.43974781036377, "global_step": 316806, "epoch": 1885} {"train_loss": -9.253641128540039, "global_step": 316807, "epoch": 1885} {"train_loss": -9.883492469787598, "global_step": 316808, "epoch": 1885} {"train_loss": -10.298271179199219, "global_step": 316809, "epoch": 1885} {"train_loss": -9.804412841796875, "global_step": 316810, "epoch": 1885} {"train_loss": -10.418399810791016, "global_step": 316811, "epoch": 1885} {"train_loss": -10.89449691772461, "global_step": 316812, "epoch": 1885} {"train_loss": -10.651448249816895, "global_step": 316813, "epoch": 1885} {"train_loss": -10.329530715942383, "global_step": 316814, "epoch": 1885} {"train_loss": -11.32583236694336, "global_step": 316815, "epoch": 1885} {"train_loss": -10.88219165802002, "global_step": 316816, "epoch": 1885} {"train_loss": -11.072635650634766, "global_step": 316817, "epoch": 1885} {"train_loss": -11.3452787399292, "global_step": 316818, "epoch": 1885} {"train_loss": -11.193708419799805, "global_step": 316819, "epoch": 1885} {"train_loss": -11.142266273498535, "global_step": 316820, "epoch": 1885} {"train_loss": -11.230925559997559, "global_step": 316821, "epoch": 1885} {"train_loss": -11.175400733947754, "global_step": 316822, "epoch": 1885} {"train_loss": -11.246030807495117, "global_step": 316823, "epoch": 1885} {"train_loss": -11.615819931030273, "global_step": 316824, "epoch": 1885} {"train_loss": -11.280009269714355, "global_step": 316825, "epoch": 1885} {"train_loss": -11.52942943572998, "global_step": 316826, "epoch": 1885} {"train_loss": -11.439554214477539, "global_step": 316827, "epoch": 1885} {"train_loss": -11.609100341796875, "global_step": 316828, "epoch": 1885} {"train_loss": -11.815600395202637, "global_step": 316829, "epoch": 1885} {"train_loss": -11.947065353393555, "global_step": 316830, "epoch": 1885} {"train_loss": -11.573204040527344, "global_step": 316831, "epoch": 1885} {"train_loss": -11.698440551757812, "global_step": 316832, "epoch": 1885} {"train_loss": -11.616386413574219, "global_step": 316833, "epoch": 1885} {"train_loss": -11.624055862426758, "global_step": 316834, "epoch": 1885} {"train_loss": -12.08133602142334, "global_step": 316835, "epoch": 1885} {"train_loss": -11.805973052978516, "global_step": 316836, "epoch": 1885} {"train_loss": -11.592384338378906, "global_step": 316837, "epoch": 1885} {"train_loss": -12.055420875549316, "global_step": 316838, "epoch": 1885} {"train_loss": -11.98033618927002, "global_step": 316839, "epoch": 1885} {"train_loss": -12.057088851928711, "global_step": 316840, "epoch": 1885} {"train_loss": -11.957191467285156, "global_step": 316841, "epoch": 1885} {"train_loss": -12.052408218383789, "global_step": 316842, "epoch": 1885} {"train_loss": -11.813209533691406, "global_step": 316843, "epoch": 1885} {"train_loss": -12.099251747131348, "global_step": 316844, "epoch": 1885} {"train_loss": -12.046603202819824, "global_step": 316845, "epoch": 1885} {"train_loss": -12.127809524536133, "global_step": 316846, "epoch": 1885} {"train_loss": -11.403017756484804, "global_step": 316847, "epoch": 1885, "val_loss": 273515.75, "train_action_mse_error": 5.125661849975586} {"train_loss": -12.16769027709961, "global_step": 316848, "epoch": 1886} {"train_loss": -11.987882614135742, "global_step": 316849, "epoch": 1886} {"train_loss": -12.087099075317383, "global_step": 316850, "epoch": 1886} {"train_loss": -12.009358406066895, "global_step": 316851, "epoch": 1886} {"train_loss": -12.05781078338623, "global_step": 316852, "epoch": 1886} {"train_loss": -12.203954696655273, "global_step": 316853, "epoch": 1886} {"train_loss": -12.133713722229004, "global_step": 316854, "epoch": 1886} {"train_loss": -12.042516708374023, "global_step": 316855, "epoch": 1886} {"train_loss": -11.97607707977295, "global_step": 316856, "epoch": 1886} {"train_loss": -12.395824432373047, "global_step": 316857, "epoch": 1886} {"train_loss": -12.135480880737305, "global_step": 316858, "epoch": 1886} {"train_loss": -12.336128234863281, "global_step": 316859, "epoch": 1886} {"train_loss": -12.081966400146484, "global_step": 316860, "epoch": 1886} {"train_loss": -12.21663761138916, "global_step": 316861, "epoch": 1886} {"train_loss": -12.26341438293457, "global_step": 316862, "epoch": 1886} {"train_loss": -12.168952941894531, "global_step": 316863, "epoch": 1886} {"train_loss": -12.242313385009766, "global_step": 316864, "epoch": 1886} {"train_loss": -12.33100414276123, "global_step": 316865, "epoch": 1886} {"train_loss": -12.265951156616211, "global_step": 316866, "epoch": 1886} {"train_loss": -12.045158386230469, "global_step": 316867, "epoch": 1886} {"train_loss": -12.246957778930664, "global_step": 316868, "epoch": 1886} {"train_loss": -12.432952880859375, "global_step": 316869, "epoch": 1886} {"train_loss": -12.029668807983398, "global_step": 316870, "epoch": 1886} {"train_loss": -12.144645690917969, "global_step": 316871, "epoch": 1886} {"train_loss": -11.899797439575195, "global_step": 316872, "epoch": 1886} {"train_loss": -11.710051536560059, "global_step": 316873, "epoch": 1886} {"train_loss": -12.371710777282715, "global_step": 316874, "epoch": 1886} {"train_loss": -11.954861640930176, "global_step": 316875, "epoch": 1886} {"train_loss": -11.277870178222656, "global_step": 316876, "epoch": 1886} {"train_loss": -11.997407913208008, "global_step": 316877, "epoch": 1886} {"train_loss": -11.347993850708008, "global_step": 316878, "epoch": 1886} {"train_loss": -11.504348754882812, "global_step": 316879, "epoch": 1886} {"train_loss": -11.688522338867188, "global_step": 316880, "epoch": 1886} {"train_loss": -10.757580757141113, "global_step": 316881, "epoch": 1886} {"train_loss": -11.903491973876953, "global_step": 316882, "epoch": 1886} {"train_loss": -11.756427764892578, "global_step": 316883, "epoch": 1886} {"train_loss": -11.214667320251465, "global_step": 316884, "epoch": 1886} {"train_loss": -12.115446090698242, "global_step": 316885, "epoch": 1886} {"train_loss": -10.492135047912598, "global_step": 316886, "epoch": 1886} {"train_loss": -11.728716850280762, "global_step": 316887, "epoch": 1886} {"train_loss": -11.437803268432617, "global_step": 316888, "epoch": 1886} {"train_loss": -11.38599681854248, "global_step": 316889, "epoch": 1886} {"train_loss": -11.9219388961792, "global_step": 316890, "epoch": 1886} {"train_loss": -11.598709106445312, "global_step": 316891, "epoch": 1886} {"train_loss": -11.941231727600098, "global_step": 316892, "epoch": 1886} {"train_loss": -10.73764419555664, "global_step": 316893, "epoch": 1886} {"train_loss": -11.908360481262207, "global_step": 316894, "epoch": 1886} {"train_loss": -11.214127540588379, "global_step": 316895, "epoch": 1886} {"train_loss": -11.37138557434082, "global_step": 316896, "epoch": 1886} {"train_loss": -11.60369873046875, "global_step": 316897, "epoch": 1886} {"train_loss": -11.025129318237305, "global_step": 316898, "epoch": 1886} {"train_loss": -11.480600357055664, "global_step": 316899, "epoch": 1886} {"train_loss": -10.165712356567383, "global_step": 316900, "epoch": 1886} {"train_loss": -11.844290733337402, "global_step": 316901, "epoch": 1886} {"train_loss": -10.543448448181152, "global_step": 316902, "epoch": 1886} {"train_loss": -12.394209861755371, "global_step": 316903, "epoch": 1886} {"train_loss": -10.520377159118652, "global_step": 316904, "epoch": 1886} {"train_loss": -11.999195098876953, "global_step": 316905, "epoch": 1886} {"train_loss": -10.941368103027344, "global_step": 316906, "epoch": 1886} {"train_loss": -11.549467086791992, "global_step": 316907, "epoch": 1886} {"train_loss": -11.511894226074219, "global_step": 316908, "epoch": 1886} {"train_loss": -11.499905586242676, "global_step": 316909, "epoch": 1886} {"train_loss": -11.893959045410156, "global_step": 316910, "epoch": 1886} {"train_loss": -12.059598922729492, "global_step": 316911, "epoch": 1886} {"train_loss": -11.815912246704102, "global_step": 316912, "epoch": 1886} {"train_loss": -12.14205551147461, "global_step": 316913, "epoch": 1886} {"train_loss": -11.660022735595703, "global_step": 316914, "epoch": 1886} {"train_loss": -12.075681686401367, "global_step": 316915, "epoch": 1886} {"train_loss": -11.848854064941406, "global_step": 316916, "epoch": 1886} {"train_loss": -11.926237106323242, "global_step": 316917, "epoch": 1886} {"train_loss": -11.747177124023438, "global_step": 316918, "epoch": 1886} {"train_loss": -11.93063735961914, "global_step": 316919, "epoch": 1886} {"train_loss": -11.816147804260254, "global_step": 316920, "epoch": 1886} {"train_loss": -11.864936828613281, "global_step": 316921, "epoch": 1886} {"train_loss": -12.210248947143555, "global_step": 316922, "epoch": 1886} {"train_loss": -11.946117401123047, "global_step": 316923, "epoch": 1886} {"train_loss": -12.05059814453125, "global_step": 316924, "epoch": 1886} {"train_loss": -12.229520797729492, "global_step": 316925, "epoch": 1886} {"train_loss": -11.441324234008789, "global_step": 316926, "epoch": 1886} {"train_loss": -12.164605140686035, "global_step": 316927, "epoch": 1886} {"train_loss": -11.93852710723877, "global_step": 316928, "epoch": 1886} {"train_loss": -12.075933456420898, "global_step": 316929, "epoch": 1886} {"train_loss": -12.129166603088379, "global_step": 316930, "epoch": 1886} {"train_loss": -12.322407722473145, "global_step": 316931, "epoch": 1886} {"train_loss": -12.267576217651367, "global_step": 316932, "epoch": 1886} {"train_loss": -12.094799041748047, "global_step": 316933, "epoch": 1886} {"train_loss": -12.24267864227295, "global_step": 316934, "epoch": 1886} {"train_loss": -12.25040054321289, "global_step": 316935, "epoch": 1886} {"train_loss": -11.851594924926758, "global_step": 316936, "epoch": 1886} {"train_loss": -11.96382999420166, "global_step": 316937, "epoch": 1886} {"train_loss": -12.139562606811523, "global_step": 316938, "epoch": 1886} {"train_loss": -12.019699096679688, "global_step": 316939, "epoch": 1886} {"train_loss": -12.18324089050293, "global_step": 316940, "epoch": 1886} {"train_loss": -11.931133270263672, "global_step": 316941, "epoch": 1886} {"train_loss": -12.002537727355957, "global_step": 316942, "epoch": 1886} {"train_loss": -11.915596961975098, "global_step": 316943, "epoch": 1886} {"train_loss": -12.277027130126953, "global_step": 316944, "epoch": 1886} {"train_loss": -11.733510971069336, "global_step": 316945, "epoch": 1886} {"train_loss": -12.056573867797852, "global_step": 316946, "epoch": 1886} {"train_loss": -11.58051872253418, "global_step": 316947, "epoch": 1886} {"train_loss": -12.014582633972168, "global_step": 316948, "epoch": 1886} {"train_loss": -11.706300735473633, "global_step": 316949, "epoch": 1886} {"train_loss": -11.479097366333008, "global_step": 316950, "epoch": 1886} {"train_loss": -11.93690013885498, "global_step": 316951, "epoch": 1886} {"train_loss": -11.93933391571045, "global_step": 316952, "epoch": 1886} {"train_loss": -12.055561065673828, "global_step": 316953, "epoch": 1886} {"train_loss": -11.659688949584961, "global_step": 316954, "epoch": 1886} {"train_loss": -12.04065990447998, "global_step": 316955, "epoch": 1886} {"train_loss": -11.464509963989258, "global_step": 316956, "epoch": 1886} {"train_loss": -11.947900772094727, "global_step": 316957, "epoch": 1886} {"train_loss": -12.304769515991211, "global_step": 316958, "epoch": 1886} {"train_loss": -11.968765258789062, "global_step": 316959, "epoch": 1886} {"train_loss": -12.128496170043945, "global_step": 316960, "epoch": 1886} {"train_loss": -12.14511489868164, "global_step": 316961, "epoch": 1886} {"train_loss": -12.319631576538086, "global_step": 316962, "epoch": 1886} {"train_loss": -12.003447532653809, "global_step": 316963, "epoch": 1886} {"train_loss": -12.317276954650879, "global_step": 316964, "epoch": 1886} {"train_loss": -11.731593132019043, "global_step": 316965, "epoch": 1886} {"train_loss": -12.031864166259766, "global_step": 316966, "epoch": 1886} {"train_loss": -11.440793991088867, "global_step": 316967, "epoch": 1886} {"train_loss": -11.976909637451172, "global_step": 316968, "epoch": 1886} {"train_loss": -11.196248054504395, "global_step": 316969, "epoch": 1886} {"train_loss": -11.587336540222168, "global_step": 316970, "epoch": 1886} {"train_loss": -11.75953483581543, "global_step": 316971, "epoch": 1886} {"train_loss": -11.993449211120605, "global_step": 316972, "epoch": 1886} {"train_loss": -11.754850387573242, "global_step": 316973, "epoch": 1886} {"train_loss": -11.871792793273926, "global_step": 316974, "epoch": 1886} {"train_loss": -11.772666931152344, "global_step": 316975, "epoch": 1886} {"train_loss": -11.73469066619873, "global_step": 316976, "epoch": 1886} {"train_loss": -11.828299522399902, "global_step": 316977, "epoch": 1886} {"train_loss": -11.804574966430664, "global_step": 316978, "epoch": 1886} {"train_loss": -11.788251876831055, "global_step": 316979, "epoch": 1886} {"train_loss": -11.966032981872559, "global_step": 316980, "epoch": 1886} {"train_loss": -11.71453857421875, "global_step": 316981, "epoch": 1886} {"train_loss": -11.511533737182617, "global_step": 316982, "epoch": 1886} {"train_loss": -12.190774917602539, "global_step": 316983, "epoch": 1886} {"train_loss": -11.217742919921875, "global_step": 316984, "epoch": 1886} {"train_loss": -12.092338562011719, "global_step": 316985, "epoch": 1886} {"train_loss": -11.466554641723633, "global_step": 316986, "epoch": 1886} {"train_loss": -10.845738410949707, "global_step": 316987, "epoch": 1886} {"train_loss": -11.603153228759766, "global_step": 316988, "epoch": 1886} {"train_loss": -11.289766311645508, "global_step": 316989, "epoch": 1886} {"train_loss": -11.676825523376465, "global_step": 316990, "epoch": 1886} {"train_loss": -12.01140022277832, "global_step": 316991, "epoch": 1886} {"train_loss": -11.624746322631836, "global_step": 316992, "epoch": 1886} {"train_loss": -11.750816345214844, "global_step": 316993, "epoch": 1886} {"train_loss": -11.857345581054688, "global_step": 316994, "epoch": 1886} {"train_loss": -11.864574432373047, "global_step": 316995, "epoch": 1886} {"train_loss": -12.002923011779785, "global_step": 316996, "epoch": 1886} {"train_loss": -12.024748802185059, "global_step": 316997, "epoch": 1886} {"train_loss": -11.732290267944336, "global_step": 316998, "epoch": 1886} {"train_loss": -12.183572769165039, "global_step": 316999, "epoch": 1886} {"train_loss": -12.070433616638184, "global_step": 317000, "epoch": 1886} {"train_loss": -12.036725044250488, "global_step": 317001, "epoch": 1886} {"train_loss": -11.92162799835205, "global_step": 317002, "epoch": 1886} {"train_loss": -12.016389846801758, "global_step": 317003, "epoch": 1886} {"train_loss": -12.191361427307129, "global_step": 317004, "epoch": 1886} {"train_loss": -12.343611717224121, "global_step": 317005, "epoch": 1886} {"train_loss": -12.043725967407227, "global_step": 317006, "epoch": 1886} {"train_loss": -12.284407615661621, "global_step": 317007, "epoch": 1886} {"train_loss": -11.960653305053711, "global_step": 317008, "epoch": 1886} {"train_loss": -12.221531867980957, "global_step": 317009, "epoch": 1886} {"train_loss": -12.142501831054688, "global_step": 317010, "epoch": 1886} {"train_loss": -11.47597599029541, "global_step": 317011, "epoch": 1886} {"train_loss": -12.280919075012207, "global_step": 317012, "epoch": 1886} {"train_loss": -11.934139251708984, "global_step": 317013, "epoch": 1886} {"train_loss": -11.943477630615234, "global_step": 317014, "epoch": 1886} {"train_loss": -11.852611184120178, "global_step": 317015, "epoch": 1886, "val_loss": 276404.65625} {"train_loss": -11.81583023071289, "global_step": 317016, "epoch": 1887} {"train_loss": -11.874994277954102, "global_step": 317017, "epoch": 1887} {"train_loss": -11.672057151794434, "global_step": 317018, "epoch": 1887} {"train_loss": -11.458475112915039, "global_step": 317019, "epoch": 1887} {"train_loss": -11.81311321258545, "global_step": 317020, "epoch": 1887} {"train_loss": -11.844097137451172, "global_step": 317021, "epoch": 1887} {"train_loss": -12.034326553344727, "global_step": 317022, "epoch": 1887} {"train_loss": -12.159334182739258, "global_step": 317023, "epoch": 1887} {"train_loss": -11.895769119262695, "global_step": 317024, "epoch": 1887} {"train_loss": -12.08939266204834, "global_step": 317025, "epoch": 1887} {"train_loss": -12.001731872558594, "global_step": 317026, "epoch": 1887} {"train_loss": -11.991592407226562, "global_step": 317027, "epoch": 1887} {"train_loss": -12.228271484375, "global_step": 317028, "epoch": 1887} {"train_loss": -11.978994369506836, "global_step": 317029, "epoch": 1887} {"train_loss": -12.320149421691895, "global_step": 317030, "epoch": 1887} {"train_loss": -12.141533851623535, "global_step": 317031, "epoch": 1887} {"train_loss": -12.471343994140625, "global_step": 317032, "epoch": 1887} {"train_loss": -12.260955810546875, "global_step": 317033, "epoch": 1887} {"train_loss": -12.281532287597656, "global_step": 317034, "epoch": 1887} {"train_loss": -12.243340492248535, "global_step": 317035, "epoch": 1887} {"train_loss": -12.443989753723145, "global_step": 317036, "epoch": 1887} {"train_loss": -12.450571060180664, "global_step": 317037, "epoch": 1887} {"train_loss": -12.48343276977539, "global_step": 317038, "epoch": 1887} {"train_loss": -12.447259902954102, "global_step": 317039, "epoch": 1887} {"train_loss": -12.360177993774414, "global_step": 317040, "epoch": 1887} {"train_loss": -12.385961532592773, "global_step": 317041, "epoch": 1887} {"train_loss": -12.412033081054688, "global_step": 317042, "epoch": 1887} {"train_loss": -12.66450309753418, "global_step": 317043, "epoch": 1887} {"train_loss": -12.20872688293457, "global_step": 317044, "epoch": 1887} {"train_loss": -12.607589721679688, "global_step": 317045, "epoch": 1887} {"train_loss": -12.288165092468262, "global_step": 317046, "epoch": 1887} {"train_loss": -12.460051536560059, "global_step": 317047, "epoch": 1887} {"train_loss": -12.562923431396484, "global_step": 317048, "epoch": 1887} {"train_loss": -12.38833999633789, "global_step": 317049, "epoch": 1887} {"train_loss": -12.45707893371582, "global_step": 317050, "epoch": 1887} {"train_loss": -12.374032974243164, "global_step": 317051, "epoch": 1887} {"train_loss": -12.229337692260742, "global_step": 317052, "epoch": 1887} {"train_loss": -12.546775817871094, "global_step": 317053, "epoch": 1887} {"train_loss": -12.416265487670898, "global_step": 317054, "epoch": 1887} {"train_loss": -12.589653015136719, "global_step": 317055, "epoch": 1887} {"train_loss": -12.385008811950684, "global_step": 317056, "epoch": 1887} {"train_loss": -12.55583667755127, "global_step": 317057, "epoch": 1887} {"train_loss": -12.395787239074707, "global_step": 317058, "epoch": 1887} {"train_loss": -12.592517852783203, "global_step": 317059, "epoch": 1887} {"train_loss": -12.38555908203125, "global_step": 317060, "epoch": 1887} {"train_loss": -11.834256172180176, "global_step": 317061, "epoch": 1887} {"train_loss": -12.022268295288086, "global_step": 317062, "epoch": 1887} {"train_loss": -11.705174446105957, "global_step": 317063, "epoch": 1887} {"train_loss": -11.442994117736816, "global_step": 317064, "epoch": 1887} {"train_loss": -10.895729064941406, "global_step": 317065, "epoch": 1887} {"train_loss": -11.634798049926758, "global_step": 317066, "epoch": 1887} {"train_loss": -11.207331657409668, "global_step": 317067, "epoch": 1887} {"train_loss": -10.570076942443848, "global_step": 317068, "epoch": 1887} {"train_loss": -11.68294906616211, "global_step": 317069, "epoch": 1887} {"train_loss": -12.070520401000977, "global_step": 317070, "epoch": 1887} {"train_loss": -10.93571662902832, "global_step": 317071, "epoch": 1887} {"train_loss": -11.032121658325195, "global_step": 317072, "epoch": 1887} {"train_loss": -11.723833084106445, "global_step": 317073, "epoch": 1887} {"train_loss": -11.296009063720703, "global_step": 317074, "epoch": 1887} {"train_loss": -10.914519309997559, "global_step": 317075, "epoch": 1887} {"train_loss": -11.16110610961914, "global_step": 317076, "epoch": 1887} {"train_loss": -9.048636436462402, "global_step": 317077, "epoch": 1887} {"train_loss": -7.8249945640563965, "global_step": 317078, "epoch": 1887} {"train_loss": -9.065086364746094, "global_step": 317079, "epoch": 1887} {"train_loss": -11.06736946105957, "global_step": 317080, "epoch": 1887} {"train_loss": -10.475765228271484, "global_step": 317081, "epoch": 1887} {"train_loss": -10.188405990600586, "global_step": 317082, "epoch": 1887} {"train_loss": -10.049010276794434, "global_step": 317083, "epoch": 1887} {"train_loss": -10.883310317993164, "global_step": 317084, "epoch": 1887} {"train_loss": -10.823427200317383, "global_step": 317085, "epoch": 1887} {"train_loss": -11.872203826904297, "global_step": 317086, "epoch": 1887} {"train_loss": -11.158285140991211, "global_step": 317087, "epoch": 1887} {"train_loss": -10.84666633605957, "global_step": 317088, "epoch": 1887} {"train_loss": -11.066201210021973, "global_step": 317089, "epoch": 1887} {"train_loss": -11.014644622802734, "global_step": 317090, "epoch": 1887} {"train_loss": -11.314002990722656, "global_step": 317091, "epoch": 1887} {"train_loss": -11.329511642456055, "global_step": 317092, "epoch": 1887} {"train_loss": -10.840381622314453, "global_step": 317093, "epoch": 1887} {"train_loss": -10.42819881439209, "global_step": 317094, "epoch": 1887} {"train_loss": -10.956095695495605, "global_step": 317095, "epoch": 1887} {"train_loss": -11.15167236328125, "global_step": 317096, "epoch": 1887} {"train_loss": -10.142745971679688, "global_step": 317097, "epoch": 1887} {"train_loss": -10.790618896484375, "global_step": 317098, "epoch": 1887} {"train_loss": -11.176860809326172, "global_step": 317099, "epoch": 1887} {"train_loss": -10.814095497131348, "global_step": 317100, "epoch": 1887} {"train_loss": -11.478851318359375, "global_step": 317101, "epoch": 1887} {"train_loss": -11.264459609985352, "global_step": 317102, "epoch": 1887} {"train_loss": -11.447697639465332, "global_step": 317103, "epoch": 1887} {"train_loss": -11.072111129760742, "global_step": 317104, "epoch": 1887} {"train_loss": -11.647506713867188, "global_step": 317105, "epoch": 1887} {"train_loss": -11.234745025634766, "global_step": 317106, "epoch": 1887} {"train_loss": -11.317822456359863, "global_step": 317107, "epoch": 1887} {"train_loss": -11.6806058883667, "global_step": 317108, "epoch": 1887} {"train_loss": -11.601926803588867, "global_step": 317109, "epoch": 1887} {"train_loss": -11.568181991577148, "global_step": 317110, "epoch": 1887} {"train_loss": -11.41026496887207, "global_step": 317111, "epoch": 1887} {"train_loss": -11.320859909057617, "global_step": 317112, "epoch": 1887} {"train_loss": -11.81617546081543, "global_step": 317113, "epoch": 1887} {"train_loss": -11.309917449951172, "global_step": 317114, "epoch": 1887} {"train_loss": -11.575100898742676, "global_step": 317115, "epoch": 1887} {"train_loss": -11.693899154663086, "global_step": 317116, "epoch": 1887} {"train_loss": -11.205921173095703, "global_step": 317117, "epoch": 1887} {"train_loss": -11.994169235229492, "global_step": 317118, "epoch": 1887} {"train_loss": -11.594520568847656, "global_step": 317119, "epoch": 1887} {"train_loss": -11.760997772216797, "global_step": 317120, "epoch": 1887} {"train_loss": -11.585748672485352, "global_step": 317121, "epoch": 1887} {"train_loss": -11.603994369506836, "global_step": 317122, "epoch": 1887} {"train_loss": -11.884590148925781, "global_step": 317123, "epoch": 1887} {"train_loss": -11.686840057373047, "global_step": 317124, "epoch": 1887} {"train_loss": -11.733577728271484, "global_step": 317125, "epoch": 1887} {"train_loss": -11.672430038452148, "global_step": 317126, "epoch": 1887} {"train_loss": -11.45434284210205, "global_step": 317127, "epoch": 1887} {"train_loss": -11.880475997924805, "global_step": 317128, "epoch": 1887} {"train_loss": -10.945948600769043, "global_step": 317129, "epoch": 1887} {"train_loss": -11.855292320251465, "global_step": 317130, "epoch": 1887} {"train_loss": -11.52420425415039, "global_step": 317131, "epoch": 1887} {"train_loss": -11.26274299621582, "global_step": 317132, "epoch": 1887} {"train_loss": -11.956582069396973, "global_step": 317133, "epoch": 1887} {"train_loss": -11.402410507202148, "global_step": 317134, "epoch": 1887} {"train_loss": -11.56256103515625, "global_step": 317135, "epoch": 1887} {"train_loss": -12.17186164855957, "global_step": 317136, "epoch": 1887} {"train_loss": -11.55554485321045, "global_step": 317137, "epoch": 1887} {"train_loss": -11.852696418762207, "global_step": 317138, "epoch": 1887} {"train_loss": -12.049330711364746, "global_step": 317139, "epoch": 1887} {"train_loss": -11.173128128051758, "global_step": 317140, "epoch": 1887} {"train_loss": -12.157535552978516, "global_step": 317141, "epoch": 1887} {"train_loss": -11.500812530517578, "global_step": 317142, "epoch": 1887} {"train_loss": -11.806768417358398, "global_step": 317143, "epoch": 1887} {"train_loss": -12.135000228881836, "global_step": 317144, "epoch": 1887} {"train_loss": -12.0087890625, "global_step": 317145, "epoch": 1887} {"train_loss": -12.038694381713867, "global_step": 317146, "epoch": 1887} {"train_loss": -12.255550384521484, "global_step": 317147, "epoch": 1887} {"train_loss": -12.086759567260742, "global_step": 317148, "epoch": 1887} {"train_loss": -12.064797401428223, "global_step": 317149, "epoch": 1887} {"train_loss": -12.156816482543945, "global_step": 317150, "epoch": 1887} {"train_loss": -12.323101043701172, "global_step": 317151, "epoch": 1887} {"train_loss": -12.29450798034668, "global_step": 317152, "epoch": 1887} {"train_loss": -12.147153854370117, "global_step": 317153, "epoch": 1887} {"train_loss": -12.456883430480957, "global_step": 317154, "epoch": 1887} {"train_loss": -12.297220230102539, "global_step": 317155, "epoch": 1887} {"train_loss": -12.135295867919922, "global_step": 317156, "epoch": 1887} {"train_loss": -12.164237976074219, "global_step": 317157, "epoch": 1887} {"train_loss": -12.207115173339844, "global_step": 317158, "epoch": 1887} {"train_loss": -12.346907615661621, "global_step": 317159, "epoch": 1887} {"train_loss": -12.421364784240723, "global_step": 317160, "epoch": 1887} {"train_loss": -12.197352409362793, "global_step": 317161, "epoch": 1887} {"train_loss": -12.349712371826172, "global_step": 317162, "epoch": 1887} {"train_loss": -12.339022636413574, "global_step": 317163, "epoch": 1887} {"train_loss": -12.313697814941406, "global_step": 317164, "epoch": 1887} {"train_loss": -12.230615615844727, "global_step": 317165, "epoch": 1887} {"train_loss": -12.296086311340332, "global_step": 317166, "epoch": 1887} {"train_loss": -12.33742904663086, "global_step": 317167, "epoch": 1887} {"train_loss": -12.092967987060547, "global_step": 317168, "epoch": 1887} {"train_loss": -12.18459415435791, "global_step": 317169, "epoch": 1887} {"train_loss": -12.309330940246582, "global_step": 317170, "epoch": 1887} {"train_loss": -12.287904739379883, "global_step": 317171, "epoch": 1887} {"train_loss": -12.301700592041016, "global_step": 317172, "epoch": 1887} {"train_loss": -12.169599533081055, "global_step": 317173, "epoch": 1887} {"train_loss": -12.387147903442383, "global_step": 317174, "epoch": 1887} {"train_loss": -12.301437377929688, "global_step": 317175, "epoch": 1887} {"train_loss": -12.472091674804688, "global_step": 317176, "epoch": 1887} {"train_loss": -12.36734390258789, "global_step": 317177, "epoch": 1887} {"train_loss": -12.408332824707031, "global_step": 317178, "epoch": 1887} {"train_loss": -12.410714149475098, "global_step": 317179, "epoch": 1887} {"train_loss": -12.305625915527344, "global_step": 317180, "epoch": 1887} {"train_loss": -12.52481746673584, "global_step": 317181, "epoch": 1887} {"train_loss": -12.299488067626953, "global_step": 317182, "epoch": 1887} {"train_loss": -11.768170297145844, "global_step": 317183, "epoch": 1887, "val_loss": 276412.9375} {"train_loss": -12.594649314880371, "global_step": 317184, "epoch": 1888} {"train_loss": -12.34339427947998, "global_step": 317185, "epoch": 1888} {"train_loss": -12.602481842041016, "global_step": 317186, "epoch": 1888} {"train_loss": -12.514511108398438, "global_step": 317187, "epoch": 1888} {"train_loss": -12.647875785827637, "global_step": 317188, "epoch": 1888} {"train_loss": -12.600746154785156, "global_step": 317189, "epoch": 1888} {"train_loss": -12.411014556884766, "global_step": 317190, "epoch": 1888} {"train_loss": -12.54738998413086, "global_step": 317191, "epoch": 1888} {"train_loss": -12.461837768554688, "global_step": 317192, "epoch": 1888} {"train_loss": -12.700418472290039, "global_step": 317193, "epoch": 1888} {"train_loss": -12.264135360717773, "global_step": 317194, "epoch": 1888} {"train_loss": -12.194887161254883, "global_step": 317195, "epoch": 1888} {"train_loss": -12.455437660217285, "global_step": 317196, "epoch": 1888} {"train_loss": -12.280576705932617, "global_step": 317197, "epoch": 1888} {"train_loss": -12.56148910522461, "global_step": 317198, "epoch": 1888} {"train_loss": -12.693880081176758, "global_step": 317199, "epoch": 1888} {"train_loss": -12.651466369628906, "global_step": 317200, "epoch": 1888} {"train_loss": -12.455514907836914, "global_step": 317201, "epoch": 1888} {"train_loss": -12.070116996765137, "global_step": 317202, "epoch": 1888} {"train_loss": -12.590675354003906, "global_step": 317203, "epoch": 1888} {"train_loss": -12.42379379272461, "global_step": 317204, "epoch": 1888} {"train_loss": -12.182168960571289, "global_step": 317205, "epoch": 1888} {"train_loss": -12.041009902954102, "global_step": 317206, "epoch": 1888} {"train_loss": -11.864725112915039, "global_step": 317207, "epoch": 1888} {"train_loss": -12.01542854309082, "global_step": 317208, "epoch": 1888} {"train_loss": -12.241747856140137, "global_step": 317209, "epoch": 1888} {"train_loss": -12.240232467651367, "global_step": 317210, "epoch": 1888} {"train_loss": -12.265881538391113, "global_step": 317211, "epoch": 1888} {"train_loss": -11.913530349731445, "global_step": 317212, "epoch": 1888} {"train_loss": -12.090005874633789, "global_step": 317213, "epoch": 1888} {"train_loss": -12.140868186950684, "global_step": 317214, "epoch": 1888} {"train_loss": -12.52545166015625, "global_step": 317215, "epoch": 1888} {"train_loss": -12.191383361816406, "global_step": 317216, "epoch": 1888} {"train_loss": -11.349681854248047, "global_step": 317217, "epoch": 1888} {"train_loss": -11.058347702026367, "global_step": 317218, "epoch": 1888} {"train_loss": -11.756875991821289, "global_step": 317219, "epoch": 1888} {"train_loss": -11.377824783325195, "global_step": 317220, "epoch": 1888} {"train_loss": -8.928023338317871, "global_step": 317221, "epoch": 1888} {"train_loss": -10.638179779052734, "global_step": 317222, "epoch": 1888} {"train_loss": -10.230245590209961, "global_step": 317223, "epoch": 1888} {"train_loss": -11.394210815429688, "global_step": 317224, "epoch": 1888} {"train_loss": -10.58120059967041, "global_step": 317225, "epoch": 1888} {"train_loss": -10.162857055664062, "global_step": 317226, "epoch": 1888} {"train_loss": -11.253410339355469, "global_step": 317227, "epoch": 1888} {"train_loss": -9.613420486450195, "global_step": 317228, "epoch": 1888} {"train_loss": -11.258445739746094, "global_step": 317229, "epoch": 1888} {"train_loss": -11.292823791503906, "global_step": 317230, "epoch": 1888} {"train_loss": -10.841718673706055, "global_step": 317231, "epoch": 1888} {"train_loss": -11.113183975219727, "global_step": 317232, "epoch": 1888} {"train_loss": -11.358602523803711, "global_step": 317233, "epoch": 1888} {"train_loss": -11.490880012512207, "global_step": 317234, "epoch": 1888} {"train_loss": -11.098198890686035, "global_step": 317235, "epoch": 1888} {"train_loss": -11.738396644592285, "global_step": 317236, "epoch": 1888} {"train_loss": -11.678007125854492, "global_step": 317237, "epoch": 1888} {"train_loss": -11.814018249511719, "global_step": 317238, "epoch": 1888} {"train_loss": -12.008499145507812, "global_step": 317239, "epoch": 1888} {"train_loss": -11.569684028625488, "global_step": 317240, "epoch": 1888} {"train_loss": -11.788737297058105, "global_step": 317241, "epoch": 1888} {"train_loss": -12.07280158996582, "global_step": 317242, "epoch": 1888} {"train_loss": -11.872013092041016, "global_step": 317243, "epoch": 1888} {"train_loss": -11.401089668273926, "global_step": 317244, "epoch": 1888} {"train_loss": -12.369349479675293, "global_step": 317245, "epoch": 1888} {"train_loss": -11.505523681640625, "global_step": 317246, "epoch": 1888} {"train_loss": -12.021976470947266, "global_step": 317247, "epoch": 1888} {"train_loss": -11.290056228637695, "global_step": 317248, "epoch": 1888} {"train_loss": -11.463205337524414, "global_step": 317249, "epoch": 1888} {"train_loss": -11.249570846557617, "global_step": 317250, "epoch": 1888} {"train_loss": -11.908880233764648, "global_step": 317251, "epoch": 1888} {"train_loss": -11.470069885253906, "global_step": 317252, "epoch": 1888} {"train_loss": -11.835185050964355, "global_step": 317253, "epoch": 1888} {"train_loss": -11.75838851928711, "global_step": 317254, "epoch": 1888} {"train_loss": -12.100875854492188, "global_step": 317255, "epoch": 1888} {"train_loss": -11.880746841430664, "global_step": 317256, "epoch": 1888} {"train_loss": -12.004295349121094, "global_step": 317257, "epoch": 1888} {"train_loss": -11.593392372131348, "global_step": 317258, "epoch": 1888} {"train_loss": -12.278944969177246, "global_step": 317259, "epoch": 1888} {"train_loss": -11.483236312866211, "global_step": 317260, "epoch": 1888} {"train_loss": -12.047676086425781, "global_step": 317261, "epoch": 1888} {"train_loss": -11.348928451538086, "global_step": 317262, "epoch": 1888} {"train_loss": -12.139931678771973, "global_step": 317263, "epoch": 1888} {"train_loss": -11.259708404541016, "global_step": 317264, "epoch": 1888} {"train_loss": -11.66684341430664, "global_step": 317265, "epoch": 1888} {"train_loss": -11.760440826416016, "global_step": 317266, "epoch": 1888} {"train_loss": -11.586095809936523, "global_step": 317267, "epoch": 1888} {"train_loss": -12.003704071044922, "global_step": 317268, "epoch": 1888} {"train_loss": -11.675287246704102, "global_step": 317269, "epoch": 1888} {"train_loss": -12.149022102355957, "global_step": 317270, "epoch": 1888} {"train_loss": -11.830925941467285, "global_step": 317271, "epoch": 1888} {"train_loss": -12.12937068939209, "global_step": 317272, "epoch": 1888} {"train_loss": -12.112528800964355, "global_step": 317273, "epoch": 1888} {"train_loss": -11.920300483703613, "global_step": 317274, "epoch": 1888} {"train_loss": -11.766101837158203, "global_step": 317275, "epoch": 1888} {"train_loss": -11.317996978759766, "global_step": 317276, "epoch": 1888} {"train_loss": -11.48851490020752, "global_step": 317277, "epoch": 1888} {"train_loss": -11.946014404296875, "global_step": 317278, "epoch": 1888} {"train_loss": -11.528590202331543, "global_step": 317279, "epoch": 1888} {"train_loss": -11.723321914672852, "global_step": 317280, "epoch": 1888} {"train_loss": -11.634515762329102, "global_step": 317281, "epoch": 1888} {"train_loss": -11.907489776611328, "global_step": 317282, "epoch": 1888} {"train_loss": -12.212501525878906, "global_step": 317283, "epoch": 1888} {"train_loss": -11.979057312011719, "global_step": 317284, "epoch": 1888} {"train_loss": -12.227027893066406, "global_step": 317285, "epoch": 1888} {"train_loss": -11.747637748718262, "global_step": 317286, "epoch": 1888} {"train_loss": -12.30430793762207, "global_step": 317287, "epoch": 1888} {"train_loss": -12.007574081420898, "global_step": 317288, "epoch": 1888} {"train_loss": -12.056358337402344, "global_step": 317289, "epoch": 1888} {"train_loss": -12.262044906616211, "global_step": 317290, "epoch": 1888} {"train_loss": -12.185131072998047, "global_step": 317291, "epoch": 1888} {"train_loss": -12.273591995239258, "global_step": 317292, "epoch": 1888} {"train_loss": -12.164278030395508, "global_step": 317293, "epoch": 1888} {"train_loss": -12.381916046142578, "global_step": 317294, "epoch": 1888} {"train_loss": -12.297711372375488, "global_step": 317295, "epoch": 1888} {"train_loss": -12.443628311157227, "global_step": 317296, "epoch": 1888} {"train_loss": -12.085345268249512, "global_step": 317297, "epoch": 1888} {"train_loss": -12.406978607177734, "global_step": 317298, "epoch": 1888} {"train_loss": -12.342491149902344, "global_step": 317299, "epoch": 1888} {"train_loss": -12.396635055541992, "global_step": 317300, "epoch": 1888} {"train_loss": -12.416633605957031, "global_step": 317301, "epoch": 1888} {"train_loss": -12.574193954467773, "global_step": 317302, "epoch": 1888} {"train_loss": -12.334061622619629, "global_step": 317303, "epoch": 1888} {"train_loss": -12.489054679870605, "global_step": 317304, "epoch": 1888} {"train_loss": -12.51643180847168, "global_step": 317305, "epoch": 1888} {"train_loss": -12.332512855529785, "global_step": 317306, "epoch": 1888} {"train_loss": -12.533757209777832, "global_step": 317307, "epoch": 1888} {"train_loss": -12.288701057434082, "global_step": 317308, "epoch": 1888} {"train_loss": -12.448548316955566, "global_step": 317309, "epoch": 1888} {"train_loss": -12.433036804199219, "global_step": 317310, "epoch": 1888} {"train_loss": -12.384038925170898, "global_step": 317311, "epoch": 1888} {"train_loss": -12.546422958374023, "global_step": 317312, "epoch": 1888} {"train_loss": -12.415328979492188, "global_step": 317313, "epoch": 1888} {"train_loss": -12.47018814086914, "global_step": 317314, "epoch": 1888} {"train_loss": -12.509004592895508, "global_step": 317315, "epoch": 1888} {"train_loss": -12.611991882324219, "global_step": 317316, "epoch": 1888} {"train_loss": -12.496191024780273, "global_step": 317317, "epoch": 1888} {"train_loss": -12.476242065429688, "global_step": 317318, "epoch": 1888} {"train_loss": -12.612960815429688, "global_step": 317319, "epoch": 1888} {"train_loss": -12.531229972839355, "global_step": 317320, "epoch": 1888} {"train_loss": -12.568595886230469, "global_step": 317321, "epoch": 1888} {"train_loss": -12.410329818725586, "global_step": 317322, "epoch": 1888} {"train_loss": -12.654450416564941, "global_step": 317323, "epoch": 1888} {"train_loss": -12.422697067260742, "global_step": 317324, "epoch": 1888} {"train_loss": -12.068855285644531, "global_step": 317325, "epoch": 1888} {"train_loss": -12.162932395935059, "global_step": 317326, "epoch": 1888} {"train_loss": -12.274593353271484, "global_step": 317327, "epoch": 1888} {"train_loss": -12.052722930908203, "global_step": 317328, "epoch": 1888} {"train_loss": -12.33355712890625, "global_step": 317329, "epoch": 1888} {"train_loss": -12.27376937866211, "global_step": 317330, "epoch": 1888} {"train_loss": -12.248342514038086, "global_step": 317331, "epoch": 1888} {"train_loss": -12.421931266784668, "global_step": 317332, "epoch": 1888} {"train_loss": -12.064009666442871, "global_step": 317333, "epoch": 1888} {"train_loss": -10.644002914428711, "global_step": 317334, "epoch": 1888} {"train_loss": -9.309566497802734, "global_step": 317335, "epoch": 1888} {"train_loss": -11.68004322052002, "global_step": 317336, "epoch": 1888} {"train_loss": -9.435379028320312, "global_step": 317337, "epoch": 1888} {"train_loss": -10.924330711364746, "global_step": 317338, "epoch": 1888} {"train_loss": -11.346352577209473, "global_step": 317339, "epoch": 1888} {"train_loss": -10.158210754394531, "global_step": 317340, "epoch": 1888} {"train_loss": -11.801108360290527, "global_step": 317341, "epoch": 1888} {"train_loss": -10.325206756591797, "global_step": 317342, "epoch": 1888} {"train_loss": -11.3190336227417, "global_step": 317343, "epoch": 1888} {"train_loss": -11.238213539123535, "global_step": 317344, "epoch": 1888} {"train_loss": -11.177726745605469, "global_step": 317345, "epoch": 1888} {"train_loss": -10.825343132019043, "global_step": 317346, "epoch": 1888} {"train_loss": -11.775259971618652, "global_step": 317347, "epoch": 1888} {"train_loss": -11.34299373626709, "global_step": 317348, "epoch": 1888} {"train_loss": -11.539329528808594, "global_step": 317349, "epoch": 1888} {"train_loss": -11.250300407409668, "global_step": 317350, "epoch": 1888} {"train_loss": -11.871857092494057, "global_step": 317351, "epoch": 1888, "val_loss": 279815.34375} {"train_loss": -10.890130996704102, "global_step": 317352, "epoch": 1889} {"train_loss": -11.893695831298828, "global_step": 317353, "epoch": 1889} {"train_loss": -11.44611930847168, "global_step": 317354, "epoch": 1889} {"train_loss": -11.01762580871582, "global_step": 317355, "epoch": 1889} {"train_loss": -11.264291763305664, "global_step": 317356, "epoch": 1889} {"train_loss": -11.087390899658203, "global_step": 317357, "epoch": 1889} {"train_loss": -10.215007781982422, "global_step": 317358, "epoch": 1889} {"train_loss": -11.174675941467285, "global_step": 317359, "epoch": 1889} {"train_loss": -10.271308898925781, "global_step": 317360, "epoch": 1889} {"train_loss": -11.000221252441406, "global_step": 317361, "epoch": 1889} {"train_loss": -9.894545555114746, "global_step": 317362, "epoch": 1889} {"train_loss": -11.092625617980957, "global_step": 317363, "epoch": 1889} {"train_loss": -10.097192764282227, "global_step": 317364, "epoch": 1889} {"train_loss": -11.939506530761719, "global_step": 317365, "epoch": 1889} {"train_loss": -10.656879425048828, "global_step": 317366, "epoch": 1889} {"train_loss": -11.170208930969238, "global_step": 317367, "epoch": 1889} {"train_loss": -11.676191329956055, "global_step": 317368, "epoch": 1889} {"train_loss": -11.108427047729492, "global_step": 317369, "epoch": 1889} {"train_loss": -11.727152824401855, "global_step": 317370, "epoch": 1889} {"train_loss": -10.817704200744629, "global_step": 317371, "epoch": 1889} {"train_loss": -11.2725830078125, "global_step": 317372, "epoch": 1889} {"train_loss": -11.286678314208984, "global_step": 317373, "epoch": 1889} {"train_loss": -10.556403160095215, "global_step": 317374, "epoch": 1889} {"train_loss": -11.66301155090332, "global_step": 317375, "epoch": 1889} {"train_loss": -11.222270011901855, "global_step": 317376, "epoch": 1889} {"train_loss": -10.883707046508789, "global_step": 317377, "epoch": 1889} {"train_loss": -11.653528213500977, "global_step": 317378, "epoch": 1889} {"train_loss": -11.210430145263672, "global_step": 317379, "epoch": 1889} {"train_loss": -11.312065124511719, "global_step": 317380, "epoch": 1889} {"train_loss": -11.806129455566406, "global_step": 317381, "epoch": 1889} {"train_loss": -10.814231872558594, "global_step": 317382, "epoch": 1889} {"train_loss": -11.875734329223633, "global_step": 317383, "epoch": 1889} {"train_loss": -11.145352363586426, "global_step": 317384, "epoch": 1889} {"train_loss": -11.231779098510742, "global_step": 317385, "epoch": 1889} {"train_loss": -11.248065948486328, "global_step": 317386, "epoch": 1889} {"train_loss": -11.08761978149414, "global_step": 317387, "epoch": 1889} {"train_loss": -11.898987770080566, "global_step": 317388, "epoch": 1889} {"train_loss": -11.460501670837402, "global_step": 317389, "epoch": 1889} {"train_loss": -11.384881019592285, "global_step": 317390, "epoch": 1889} {"train_loss": -11.897482872009277, "global_step": 317391, "epoch": 1889} {"train_loss": -11.914979934692383, "global_step": 317392, "epoch": 1889} {"train_loss": -11.646501541137695, "global_step": 317393, "epoch": 1889} {"train_loss": -12.099639892578125, "global_step": 317394, "epoch": 1889} {"train_loss": -11.966069221496582, "global_step": 317395, "epoch": 1889} {"train_loss": -11.790626525878906, "global_step": 317396, "epoch": 1889} {"train_loss": -11.883894920349121, "global_step": 317397, "epoch": 1889} {"train_loss": -11.953432083129883, "global_step": 317398, "epoch": 1889} {"train_loss": -11.945045471191406, "global_step": 317399, "epoch": 1889} {"train_loss": -11.839252471923828, "global_step": 317400, "epoch": 1889} {"train_loss": -11.939374923706055, "global_step": 317401, "epoch": 1889} {"train_loss": -12.197286605834961, "global_step": 317402, "epoch": 1889} {"train_loss": -12.00013542175293, "global_step": 317403, "epoch": 1889} {"train_loss": -12.062858581542969, "global_step": 317404, "epoch": 1889} {"train_loss": -12.186487197875977, "global_step": 317405, "epoch": 1889} {"train_loss": -12.27469253540039, "global_step": 317406, "epoch": 1889} {"train_loss": -12.005475997924805, "global_step": 317407, "epoch": 1889} {"train_loss": -12.185646057128906, "global_step": 317408, "epoch": 1889} {"train_loss": -12.291091918945312, "global_step": 317409, "epoch": 1889} {"train_loss": -12.160941123962402, "global_step": 317410, "epoch": 1889} {"train_loss": -12.348276138305664, "global_step": 317411, "epoch": 1889} {"train_loss": -12.085590362548828, "global_step": 317412, "epoch": 1889} {"train_loss": -12.35861587524414, "global_step": 317413, "epoch": 1889} {"train_loss": -12.057731628417969, "global_step": 317414, "epoch": 1889} {"train_loss": -12.204120635986328, "global_step": 317415, "epoch": 1889} {"train_loss": -12.238061904907227, "global_step": 317416, "epoch": 1889} {"train_loss": -12.180915832519531, "global_step": 317417, "epoch": 1889} {"train_loss": -12.05672836303711, "global_step": 317418, "epoch": 1889} {"train_loss": -12.328607559204102, "global_step": 317419, "epoch": 1889} {"train_loss": -12.316671371459961, "global_step": 317420, "epoch": 1889} {"train_loss": -12.242483139038086, "global_step": 317421, "epoch": 1889} {"train_loss": -12.234947204589844, "global_step": 317422, "epoch": 1889} {"train_loss": -12.186345100402832, "global_step": 317423, "epoch": 1889} {"train_loss": -12.282776832580566, "global_step": 317424, "epoch": 1889} {"train_loss": -12.49062728881836, "global_step": 317425, "epoch": 1889} {"train_loss": -12.205581665039062, "global_step": 317426, "epoch": 1889} {"train_loss": -12.277820587158203, "global_step": 317427, "epoch": 1889} {"train_loss": -12.475523948669434, "global_step": 317428, "epoch": 1889} {"train_loss": -12.350709915161133, "global_step": 317429, "epoch": 1889} {"train_loss": -12.338438034057617, "global_step": 317430, "epoch": 1889} {"train_loss": -12.189318656921387, "global_step": 317431, "epoch": 1889} {"train_loss": -12.575048446655273, "global_step": 317432, "epoch": 1889} {"train_loss": -12.210777282714844, "global_step": 317433, "epoch": 1889} {"train_loss": -12.551839828491211, "global_step": 317434, "epoch": 1889} {"train_loss": -12.121448516845703, "global_step": 317435, "epoch": 1889} {"train_loss": -12.258783340454102, "global_step": 317436, "epoch": 1889} {"train_loss": -12.172285079956055, "global_step": 317437, "epoch": 1889} {"train_loss": -12.019196510314941, "global_step": 317438, "epoch": 1889} {"train_loss": -12.470541000366211, "global_step": 317439, "epoch": 1889} {"train_loss": -12.249044418334961, "global_step": 317440, "epoch": 1889} {"train_loss": -12.171674728393555, "global_step": 317441, "epoch": 1889} {"train_loss": -11.90417766571045, "global_step": 317442, "epoch": 1889} {"train_loss": -11.943302154541016, "global_step": 317443, "epoch": 1889} {"train_loss": -12.230499267578125, "global_step": 317444, "epoch": 1889} {"train_loss": -12.004667282104492, "global_step": 317445, "epoch": 1889} {"train_loss": -12.240467071533203, "global_step": 317446, "epoch": 1889} {"train_loss": -12.348140716552734, "global_step": 317447, "epoch": 1889} {"train_loss": -12.04156494140625, "global_step": 317448, "epoch": 1889} {"train_loss": -12.212509155273438, "global_step": 317449, "epoch": 1889} {"train_loss": -11.831901550292969, "global_step": 317450, "epoch": 1889} {"train_loss": -12.398496627807617, "global_step": 317451, "epoch": 1889} {"train_loss": -12.264554977416992, "global_step": 317452, "epoch": 1889} {"train_loss": -12.037917137145996, "global_step": 317453, "epoch": 1889} {"train_loss": -12.244667053222656, "global_step": 317454, "epoch": 1889} {"train_loss": -12.34579849243164, "global_step": 317455, "epoch": 1889} {"train_loss": -12.105461120605469, "global_step": 317456, "epoch": 1889} {"train_loss": -12.119847297668457, "global_step": 317457, "epoch": 1889} {"train_loss": -12.124366760253906, "global_step": 317458, "epoch": 1889} {"train_loss": -12.26998519897461, "global_step": 317459, "epoch": 1889} {"train_loss": -12.342140197753906, "global_step": 317460, "epoch": 1889} {"train_loss": -12.028768539428711, "global_step": 317461, "epoch": 1889} {"train_loss": -12.154748916625977, "global_step": 317462, "epoch": 1889} {"train_loss": -12.13141918182373, "global_step": 317463, "epoch": 1889} {"train_loss": -11.82023811340332, "global_step": 317464, "epoch": 1889} {"train_loss": -12.070686340332031, "global_step": 317465, "epoch": 1889} {"train_loss": -11.8651123046875, "global_step": 317466, "epoch": 1889} {"train_loss": -11.797109603881836, "global_step": 317467, "epoch": 1889} {"train_loss": -12.278829574584961, "global_step": 317468, "epoch": 1889} {"train_loss": -11.572690963745117, "global_step": 317469, "epoch": 1889} {"train_loss": -12.19282054901123, "global_step": 317470, "epoch": 1889} {"train_loss": -11.995035171508789, "global_step": 317471, "epoch": 1889} {"train_loss": -11.868889808654785, "global_step": 317472, "epoch": 1889} {"train_loss": -10.843161582946777, "global_step": 317473, "epoch": 1889} {"train_loss": -11.280386924743652, "global_step": 317474, "epoch": 1889} {"train_loss": -10.981208801269531, "global_step": 317475, "epoch": 1889} {"train_loss": -11.961986541748047, "global_step": 317476, "epoch": 1889} {"train_loss": -10.442889213562012, "global_step": 317477, "epoch": 1889} {"train_loss": -11.895576477050781, "global_step": 317478, "epoch": 1889} {"train_loss": -11.508792877197266, "global_step": 317479, "epoch": 1889} {"train_loss": -11.633186340332031, "global_step": 317480, "epoch": 1889} {"train_loss": -11.881172180175781, "global_step": 317481, "epoch": 1889} {"train_loss": -11.340679168701172, "global_step": 317482, "epoch": 1889} {"train_loss": -11.32034969329834, "global_step": 317483, "epoch": 1889} {"train_loss": -10.927221298217773, "global_step": 317484, "epoch": 1889} {"train_loss": -11.464600563049316, "global_step": 317485, "epoch": 1889} {"train_loss": -11.167509078979492, "global_step": 317486, "epoch": 1889} {"train_loss": -11.77751350402832, "global_step": 317487, "epoch": 1889} {"train_loss": -11.636051177978516, "global_step": 317488, "epoch": 1889} {"train_loss": -11.905007362365723, "global_step": 317489, "epoch": 1889} {"train_loss": -12.02275276184082, "global_step": 317490, "epoch": 1889} {"train_loss": -11.715330123901367, "global_step": 317491, "epoch": 1889} {"train_loss": -11.831809997558594, "global_step": 317492, "epoch": 1889} {"train_loss": -11.90388298034668, "global_step": 317493, "epoch": 1889} {"train_loss": -11.686914443969727, "global_step": 317494, "epoch": 1889} {"train_loss": -11.70481014251709, "global_step": 317495, "epoch": 1889} {"train_loss": -11.557487487792969, "global_step": 317496, "epoch": 1889} {"train_loss": -10.697676658630371, "global_step": 317497, "epoch": 1889} {"train_loss": -11.686331748962402, "global_step": 317498, "epoch": 1889} {"train_loss": -11.378093719482422, "global_step": 317499, "epoch": 1889} {"train_loss": -11.779643058776855, "global_step": 317500, "epoch": 1889} {"train_loss": -10.987364768981934, "global_step": 317501, "epoch": 1889} {"train_loss": -11.54911994934082, "global_step": 317502, "epoch": 1889} {"train_loss": -11.679181098937988, "global_step": 317503, "epoch": 1889} {"train_loss": -11.674140930175781, "global_step": 317504, "epoch": 1889} {"train_loss": -11.38587760925293, "global_step": 317505, "epoch": 1889} {"train_loss": -11.825872421264648, "global_step": 317506, "epoch": 1889} {"train_loss": -11.858097076416016, "global_step": 317507, "epoch": 1889} {"train_loss": -11.729681015014648, "global_step": 317508, "epoch": 1889} {"train_loss": -11.25121021270752, "global_step": 317509, "epoch": 1889} {"train_loss": -11.815958023071289, "global_step": 317510, "epoch": 1889} {"train_loss": -11.164335250854492, "global_step": 317511, "epoch": 1889} {"train_loss": -11.931110382080078, "global_step": 317512, "epoch": 1889} {"train_loss": -11.598276138305664, "global_step": 317513, "epoch": 1889} {"train_loss": -11.751263618469238, "global_step": 317514, "epoch": 1889} {"train_loss": -11.967573165893555, "global_step": 317515, "epoch": 1889} {"train_loss": -10.845520973205566, "global_step": 317516, "epoch": 1889} {"train_loss": -12.386618614196777, "global_step": 317517, "epoch": 1889} {"train_loss": -11.553657531738281, "global_step": 317518, "epoch": 1889} {"train_loss": -11.74793891679673, "global_step": 317519, "epoch": 1889, "val_loss": 280341.625} {"train_loss": -12.214115142822266, "global_step": 317520, "epoch": 1890} {"train_loss": -11.90719985961914, "global_step": 317521, "epoch": 1890} {"train_loss": -12.16359806060791, "global_step": 317522, "epoch": 1890} {"train_loss": -11.682955741882324, "global_step": 317523, "epoch": 1890} {"train_loss": -12.143113136291504, "global_step": 317524, "epoch": 1890} {"train_loss": -12.02549934387207, "global_step": 317525, "epoch": 1890} {"train_loss": -12.280278205871582, "global_step": 317526, "epoch": 1890} {"train_loss": -12.17239761352539, "global_step": 317527, "epoch": 1890} {"train_loss": -11.833127975463867, "global_step": 317528, "epoch": 1890} {"train_loss": -12.356983184814453, "global_step": 317529, "epoch": 1890} {"train_loss": -12.06313705444336, "global_step": 317530, "epoch": 1890} {"train_loss": -12.347967147827148, "global_step": 317531, "epoch": 1890} {"train_loss": -12.19007682800293, "global_step": 317532, "epoch": 1890} {"train_loss": -12.119317054748535, "global_step": 317533, "epoch": 1890} {"train_loss": -12.159835815429688, "global_step": 317534, "epoch": 1890} {"train_loss": -12.001286506652832, "global_step": 317535, "epoch": 1890} {"train_loss": -12.406837463378906, "global_step": 317536, "epoch": 1890} {"train_loss": -12.341816902160645, "global_step": 317537, "epoch": 1890} {"train_loss": -12.45295524597168, "global_step": 317538, "epoch": 1890} {"train_loss": -12.347915649414062, "global_step": 317539, "epoch": 1890} {"train_loss": -12.334492683410645, "global_step": 317540, "epoch": 1890} {"train_loss": -12.277017593383789, "global_step": 317541, "epoch": 1890} {"train_loss": -12.234701156616211, "global_step": 317542, "epoch": 1890} {"train_loss": -12.354394912719727, "global_step": 317543, "epoch": 1890} {"train_loss": -12.373353958129883, "global_step": 317544, "epoch": 1890} {"train_loss": -12.31176471710205, "global_step": 317545, "epoch": 1890} {"train_loss": -12.448786735534668, "global_step": 317546, "epoch": 1890} {"train_loss": -12.50977897644043, "global_step": 317547, "epoch": 1890} {"train_loss": -12.386908531188965, "global_step": 317548, "epoch": 1890} {"train_loss": -12.365964889526367, "global_step": 317549, "epoch": 1890} {"train_loss": -12.617557525634766, "global_step": 317550, "epoch": 1890} {"train_loss": -12.431113243103027, "global_step": 317551, "epoch": 1890} {"train_loss": -12.153665542602539, "global_step": 317552, "epoch": 1890} {"train_loss": -12.22659969329834, "global_step": 317553, "epoch": 1890} {"train_loss": -12.4077787399292, "global_step": 317554, "epoch": 1890} {"train_loss": -12.382529258728027, "global_step": 317555, "epoch": 1890} {"train_loss": -12.481365203857422, "global_step": 317556, "epoch": 1890} {"train_loss": -12.704938888549805, "global_step": 317557, "epoch": 1890} {"train_loss": -12.157418251037598, "global_step": 317558, "epoch": 1890} {"train_loss": -12.46232795715332, "global_step": 317559, "epoch": 1890} {"train_loss": -12.42345905303955, "global_step": 317560, "epoch": 1890} {"train_loss": -12.701051712036133, "global_step": 317561, "epoch": 1890} {"train_loss": -12.403040885925293, "global_step": 317562, "epoch": 1890} {"train_loss": -12.592835426330566, "global_step": 317563, "epoch": 1890} {"train_loss": -12.334285736083984, "global_step": 317564, "epoch": 1890} {"train_loss": -12.613763809204102, "global_step": 317565, "epoch": 1890} {"train_loss": -12.090685844421387, "global_step": 317566, "epoch": 1890} {"train_loss": -12.062591552734375, "global_step": 317567, "epoch": 1890} {"train_loss": -12.250933647155762, "global_step": 317568, "epoch": 1890} {"train_loss": -12.25118637084961, "global_step": 317569, "epoch": 1890} {"train_loss": -12.686697006225586, "global_step": 317570, "epoch": 1890} {"train_loss": -11.930999755859375, "global_step": 317571, "epoch": 1890} {"train_loss": -12.534873008728027, "global_step": 317572, "epoch": 1890} {"train_loss": -11.972168922424316, "global_step": 317573, "epoch": 1890} {"train_loss": -12.54283332824707, "global_step": 317574, "epoch": 1890} {"train_loss": -12.2103271484375, "global_step": 317575, "epoch": 1890} {"train_loss": -12.333642959594727, "global_step": 317576, "epoch": 1890} {"train_loss": -12.394708633422852, "global_step": 317577, "epoch": 1890} {"train_loss": -12.17751693725586, "global_step": 317578, "epoch": 1890} {"train_loss": -12.408937454223633, "global_step": 317579, "epoch": 1890} {"train_loss": -12.3323335647583, "global_step": 317580, "epoch": 1890} {"train_loss": -12.54463005065918, "global_step": 317581, "epoch": 1890} {"train_loss": -12.340343475341797, "global_step": 317582, "epoch": 1890} {"train_loss": -12.382607460021973, "global_step": 317583, "epoch": 1890} {"train_loss": -11.607019424438477, "global_step": 317584, "epoch": 1890} {"train_loss": -11.799062728881836, "global_step": 317585, "epoch": 1890} {"train_loss": -12.421031951904297, "global_step": 317586, "epoch": 1890} {"train_loss": -11.442998886108398, "global_step": 317587, "epoch": 1890} {"train_loss": -10.647390365600586, "global_step": 317588, "epoch": 1890} {"train_loss": -11.538728713989258, "global_step": 317589, "epoch": 1890} {"train_loss": -12.413095474243164, "global_step": 317590, "epoch": 1890} {"train_loss": -11.005395889282227, "global_step": 317591, "epoch": 1890} {"train_loss": -11.60774040222168, "global_step": 317592, "epoch": 1890} {"train_loss": -11.210795402526855, "global_step": 317593, "epoch": 1890} {"train_loss": -12.246628761291504, "global_step": 317594, "epoch": 1890} {"train_loss": -11.214046478271484, "global_step": 317595, "epoch": 1890} {"train_loss": -10.167606353759766, "global_step": 317596, "epoch": 1890} {"train_loss": -11.342273712158203, "global_step": 317597, "epoch": 1890} {"train_loss": -11.801921844482422, "global_step": 317598, "epoch": 1890} {"train_loss": -9.067880630493164, "global_step": 317599, "epoch": 1890} {"train_loss": -10.596919059753418, "global_step": 317600, "epoch": 1890} {"train_loss": -10.55522346496582, "global_step": 317601, "epoch": 1890} {"train_loss": -9.982156753540039, "global_step": 317602, "epoch": 1890} {"train_loss": -10.284324645996094, "global_step": 317603, "epoch": 1890} {"train_loss": -11.520217895507812, "global_step": 317604, "epoch": 1890} {"train_loss": -10.976784706115723, "global_step": 317605, "epoch": 1890} {"train_loss": -10.965215682983398, "global_step": 317606, "epoch": 1890} {"train_loss": -10.934605598449707, "global_step": 317607, "epoch": 1890} {"train_loss": -11.056353569030762, "global_step": 317608, "epoch": 1890} {"train_loss": -11.020524978637695, "global_step": 317609, "epoch": 1890} {"train_loss": -10.698025703430176, "global_step": 317610, "epoch": 1890} {"train_loss": -11.400627136230469, "global_step": 317611, "epoch": 1890} {"train_loss": -10.654069900512695, "global_step": 317612, "epoch": 1890} {"train_loss": -11.724987030029297, "global_step": 317613, "epoch": 1890} {"train_loss": -11.37553596496582, "global_step": 317614, "epoch": 1890} {"train_loss": -11.601232528686523, "global_step": 317615, "epoch": 1890} {"train_loss": -11.981110572814941, "global_step": 317616, "epoch": 1890} {"train_loss": -11.627307891845703, "global_step": 317617, "epoch": 1890} {"train_loss": -11.879449844360352, "global_step": 317618, "epoch": 1890} {"train_loss": -11.950223922729492, "global_step": 317619, "epoch": 1890} {"train_loss": -12.001043319702148, "global_step": 317620, "epoch": 1890} {"train_loss": -11.454158782958984, "global_step": 317621, "epoch": 1890} {"train_loss": -11.700706481933594, "global_step": 317622, "epoch": 1890} {"train_loss": -11.970556259155273, "global_step": 317623, "epoch": 1890} {"train_loss": -11.556236267089844, "global_step": 317624, "epoch": 1890} {"train_loss": -12.099383354187012, "global_step": 317625, "epoch": 1890} {"train_loss": -11.885464668273926, "global_step": 317626, "epoch": 1890} {"train_loss": -11.927328109741211, "global_step": 317627, "epoch": 1890} {"train_loss": -11.762338638305664, "global_step": 317628, "epoch": 1890} {"train_loss": -11.414932250976562, "global_step": 317629, "epoch": 1890} {"train_loss": -11.713350296020508, "global_step": 317630, "epoch": 1890} {"train_loss": -11.107733726501465, "global_step": 317631, "epoch": 1890} {"train_loss": -11.313947677612305, "global_step": 317632, "epoch": 1890} {"train_loss": -10.748640060424805, "global_step": 317633, "epoch": 1890} {"train_loss": -11.635268211364746, "global_step": 317634, "epoch": 1890} {"train_loss": -11.458368301391602, "global_step": 317635, "epoch": 1890} {"train_loss": -12.049654006958008, "global_step": 317636, "epoch": 1890} {"train_loss": -11.357978820800781, "global_step": 317637, "epoch": 1890} {"train_loss": -11.660055160522461, "global_step": 317638, "epoch": 1890} {"train_loss": -11.256942749023438, "global_step": 317639, "epoch": 1890} {"train_loss": -12.229214668273926, "global_step": 317640, "epoch": 1890} {"train_loss": -11.411809921264648, "global_step": 317641, "epoch": 1890} {"train_loss": -11.931468963623047, "global_step": 317642, "epoch": 1890} {"train_loss": -11.927270889282227, "global_step": 317643, "epoch": 1890} {"train_loss": -11.878204345703125, "global_step": 317644, "epoch": 1890} {"train_loss": -11.847162246704102, "global_step": 317645, "epoch": 1890} {"train_loss": -12.084640502929688, "global_step": 317646, "epoch": 1890} {"train_loss": -11.94849681854248, "global_step": 317647, "epoch": 1890} {"train_loss": -12.056461334228516, "global_step": 317648, "epoch": 1890} {"train_loss": -11.888684272766113, "global_step": 317649, "epoch": 1890} {"train_loss": -12.092254638671875, "global_step": 317650, "epoch": 1890} {"train_loss": -12.003812789916992, "global_step": 317651, "epoch": 1890} {"train_loss": -11.89286994934082, "global_step": 317652, "epoch": 1890} {"train_loss": -12.192636489868164, "global_step": 317653, "epoch": 1890} {"train_loss": -11.837812423706055, "global_step": 317654, "epoch": 1890} {"train_loss": -11.838869094848633, "global_step": 317655, "epoch": 1890} {"train_loss": -12.154468536376953, "global_step": 317656, "epoch": 1890} {"train_loss": -11.698548316955566, "global_step": 317657, "epoch": 1890} {"train_loss": -12.16293716430664, "global_step": 317658, "epoch": 1890} {"train_loss": -11.858059883117676, "global_step": 317659, "epoch": 1890} {"train_loss": -11.987829208374023, "global_step": 317660, "epoch": 1890} {"train_loss": -12.086030960083008, "global_step": 317661, "epoch": 1890} {"train_loss": -11.835638046264648, "global_step": 317662, "epoch": 1890} {"train_loss": -11.95138168334961, "global_step": 317663, "epoch": 1890} {"train_loss": -11.732086181640625, "global_step": 317664, "epoch": 1890} {"train_loss": -12.083776473999023, "global_step": 317665, "epoch": 1890} {"train_loss": -11.767032623291016, "global_step": 317666, "epoch": 1890} {"train_loss": -11.956470489501953, "global_step": 317667, "epoch": 1890} {"train_loss": -11.983400344848633, "global_step": 317668, "epoch": 1890} {"train_loss": -12.001296997070312, "global_step": 317669, "epoch": 1890} {"train_loss": -11.848556518554688, "global_step": 317670, "epoch": 1890} {"train_loss": -11.939395904541016, "global_step": 317671, "epoch": 1890} {"train_loss": -11.522835731506348, "global_step": 317672, "epoch": 1890} {"train_loss": -12.1142578125, "global_step": 317673, "epoch": 1890} {"train_loss": -11.141077041625977, "global_step": 317674, "epoch": 1890} {"train_loss": -11.867046356201172, "global_step": 317675, "epoch": 1890} {"train_loss": -12.195880889892578, "global_step": 317676, "epoch": 1890} {"train_loss": -11.847381591796875, "global_step": 317677, "epoch": 1890} {"train_loss": -11.977925300598145, "global_step": 317678, "epoch": 1890} {"train_loss": -11.612703323364258, "global_step": 317679, "epoch": 1890} {"train_loss": -11.616608619689941, "global_step": 317680, "epoch": 1890} {"train_loss": -11.746085166931152, "global_step": 317681, "epoch": 1890} {"train_loss": -11.654369354248047, "global_step": 317682, "epoch": 1890} {"train_loss": -11.295816421508789, "global_step": 317683, "epoch": 1890} {"train_loss": -12.204191207885742, "global_step": 317684, "epoch": 1890} {"train_loss": -11.303886413574219, "global_step": 317685, "epoch": 1890} {"train_loss": -11.554675102233887, "global_step": 317686, "epoch": 1890} {"train_loss": -11.863537725948152, "global_step": 317687, "epoch": 1890, "val_loss": 283912.5625, "train_action_mse_error": 1.2176318168640137} {"train_loss": -11.673166275024414, "global_step": 317688, "epoch": 1891} {"train_loss": -12.210912704467773, "global_step": 317689, "epoch": 1891} {"train_loss": -11.637757301330566, "global_step": 317690, "epoch": 1891} {"train_loss": -11.649063110351562, "global_step": 317691, "epoch": 1891} {"train_loss": -11.684499740600586, "global_step": 317692, "epoch": 1891} {"train_loss": -11.827690124511719, "global_step": 317693, "epoch": 1891} {"train_loss": -12.072054862976074, "global_step": 317694, "epoch": 1891} {"train_loss": -11.66396427154541, "global_step": 317695, "epoch": 1891} {"train_loss": -12.23077392578125, "global_step": 317696, "epoch": 1891} {"train_loss": -11.514313697814941, "global_step": 317697, "epoch": 1891} {"train_loss": -11.804800033569336, "global_step": 317698, "epoch": 1891} {"train_loss": -11.147659301757812, "global_step": 317699, "epoch": 1891} {"train_loss": -11.90726089477539, "global_step": 317700, "epoch": 1891} {"train_loss": -10.772850036621094, "global_step": 317701, "epoch": 1891} {"train_loss": -11.67805290222168, "global_step": 317702, "epoch": 1891} {"train_loss": -10.295211791992188, "global_step": 317703, "epoch": 1891} {"train_loss": -11.676647186279297, "global_step": 317704, "epoch": 1891} {"train_loss": -10.513249397277832, "global_step": 317705, "epoch": 1891} {"train_loss": -11.923067092895508, "global_step": 317706, "epoch": 1891} {"train_loss": -10.895769119262695, "global_step": 317707, "epoch": 1891} {"train_loss": -11.389921188354492, "global_step": 317708, "epoch": 1891} {"train_loss": -11.297319412231445, "global_step": 317709, "epoch": 1891} {"train_loss": -11.95987606048584, "global_step": 317710, "epoch": 1891} {"train_loss": -11.114575386047363, "global_step": 317711, "epoch": 1891} {"train_loss": -11.843667030334473, "global_step": 317712, "epoch": 1891} {"train_loss": -11.790922164916992, "global_step": 317713, "epoch": 1891} {"train_loss": -12.037616729736328, "global_step": 317714, "epoch": 1891} {"train_loss": -11.614731788635254, "global_step": 317715, "epoch": 1891} {"train_loss": -11.658652305603027, "global_step": 317716, "epoch": 1891} {"train_loss": -11.740396499633789, "global_step": 317717, "epoch": 1891} {"train_loss": -11.712095260620117, "global_step": 317718, "epoch": 1891} {"train_loss": -11.53057861328125, "global_step": 317719, "epoch": 1891} {"train_loss": -12.100038528442383, "global_step": 317720, "epoch": 1891} {"train_loss": -10.76895523071289, "global_step": 317721, "epoch": 1891} {"train_loss": -12.085198402404785, "global_step": 317722, "epoch": 1891} {"train_loss": -11.254371643066406, "global_step": 317723, "epoch": 1891} {"train_loss": -11.37635612487793, "global_step": 317724, "epoch": 1891} {"train_loss": -12.081581115722656, "global_step": 317725, "epoch": 1891} {"train_loss": -11.485562324523926, "global_step": 317726, "epoch": 1891} {"train_loss": -12.004213333129883, "global_step": 317727, "epoch": 1891} {"train_loss": -11.954017639160156, "global_step": 317728, "epoch": 1891} {"train_loss": -11.745427131652832, "global_step": 317729, "epoch": 1891} {"train_loss": -12.280811309814453, "global_step": 317730, "epoch": 1891} {"train_loss": -11.858341217041016, "global_step": 317731, "epoch": 1891} {"train_loss": -12.179378509521484, "global_step": 317732, "epoch": 1891} {"train_loss": -11.963323593139648, "global_step": 317733, "epoch": 1891} {"train_loss": -12.002656936645508, "global_step": 317734, "epoch": 1891} {"train_loss": -12.064888000488281, "global_step": 317735, "epoch": 1891} {"train_loss": -11.800520896911621, "global_step": 317736, "epoch": 1891} {"train_loss": -11.763051986694336, "global_step": 317737, "epoch": 1891} {"train_loss": -11.449212074279785, "global_step": 317738, "epoch": 1891} {"train_loss": -12.22773551940918, "global_step": 317739, "epoch": 1891} {"train_loss": -11.94068717956543, "global_step": 317740, "epoch": 1891} {"train_loss": -11.89012336730957, "global_step": 317741, "epoch": 1891} {"train_loss": -12.095847129821777, "global_step": 317742, "epoch": 1891} {"train_loss": -12.064260482788086, "global_step": 317743, "epoch": 1891} {"train_loss": -11.889669418334961, "global_step": 317744, "epoch": 1891} {"train_loss": -12.11042594909668, "global_step": 317745, "epoch": 1891} {"train_loss": -11.77164077758789, "global_step": 317746, "epoch": 1891} {"train_loss": -12.062501907348633, "global_step": 317747, "epoch": 1891} {"train_loss": -12.336658477783203, "global_step": 317748, "epoch": 1891} {"train_loss": -12.16858196258545, "global_step": 317749, "epoch": 1891} {"train_loss": -12.03564453125, "global_step": 317750, "epoch": 1891} {"train_loss": -12.140345573425293, "global_step": 317751, "epoch": 1891} {"train_loss": -12.044898986816406, "global_step": 317752, "epoch": 1891} {"train_loss": -12.131817817687988, "global_step": 317753, "epoch": 1891} {"train_loss": -12.079025268554688, "global_step": 317754, "epoch": 1891} {"train_loss": -12.360238075256348, "global_step": 317755, "epoch": 1891} {"train_loss": -11.708067893981934, "global_step": 317756, "epoch": 1891} {"train_loss": -12.27724838256836, "global_step": 317757, "epoch": 1891} {"train_loss": -11.766288757324219, "global_step": 317758, "epoch": 1891} {"train_loss": -12.316764831542969, "global_step": 317759, "epoch": 1891} {"train_loss": -11.769401550292969, "global_step": 317760, "epoch": 1891} {"train_loss": -11.992595672607422, "global_step": 317761, "epoch": 1891} {"train_loss": -12.107343673706055, "global_step": 317762, "epoch": 1891} {"train_loss": -12.025688171386719, "global_step": 317763, "epoch": 1891} {"train_loss": -12.330735206604004, "global_step": 317764, "epoch": 1891} {"train_loss": -12.10130500793457, "global_step": 317765, "epoch": 1891} {"train_loss": -12.079240798950195, "global_step": 317766, "epoch": 1891} {"train_loss": -11.831670761108398, "global_step": 317767, "epoch": 1891} {"train_loss": -12.171157836914062, "global_step": 317768, "epoch": 1891} {"train_loss": -12.321832656860352, "global_step": 317769, "epoch": 1891} {"train_loss": -11.864702224731445, "global_step": 317770, "epoch": 1891} {"train_loss": -12.275283813476562, "global_step": 317771, "epoch": 1891} {"train_loss": -12.226411819458008, "global_step": 317772, "epoch": 1891} {"train_loss": -12.18333625793457, "global_step": 317773, "epoch": 1891} {"train_loss": -12.274778366088867, "global_step": 317774, "epoch": 1891} {"train_loss": -12.409319877624512, "global_step": 317775, "epoch": 1891} {"train_loss": -12.247913360595703, "global_step": 317776, "epoch": 1891} {"train_loss": -12.345664978027344, "global_step": 317777, "epoch": 1891} {"train_loss": -12.092073440551758, "global_step": 317778, "epoch": 1891} {"train_loss": -12.351605415344238, "global_step": 317779, "epoch": 1891} {"train_loss": -12.331514358520508, "global_step": 317780, "epoch": 1891} {"train_loss": -12.439855575561523, "global_step": 317781, "epoch": 1891} {"train_loss": -12.404147148132324, "global_step": 317782, "epoch": 1891} {"train_loss": -12.240484237670898, "global_step": 317783, "epoch": 1891} {"train_loss": -12.084037780761719, "global_step": 317784, "epoch": 1891} {"train_loss": -12.311914443969727, "global_step": 317785, "epoch": 1891} {"train_loss": -12.357421875, "global_step": 317786, "epoch": 1891} {"train_loss": -12.200353622436523, "global_step": 317787, "epoch": 1891} {"train_loss": -12.3541259765625, "global_step": 317788, "epoch": 1891} {"train_loss": -12.319242477416992, "global_step": 317789, "epoch": 1891} {"train_loss": -12.348562240600586, "global_step": 317790, "epoch": 1891} {"train_loss": -12.2125883102417, "global_step": 317791, "epoch": 1891} {"train_loss": -12.478710174560547, "global_step": 317792, "epoch": 1891} {"train_loss": -12.173027992248535, "global_step": 317793, "epoch": 1891} {"train_loss": -12.384293556213379, "global_step": 317794, "epoch": 1891} {"train_loss": -12.16157341003418, "global_step": 317795, "epoch": 1891} {"train_loss": -12.463808059692383, "global_step": 317796, "epoch": 1891} {"train_loss": -12.144710540771484, "global_step": 317797, "epoch": 1891} {"train_loss": -12.20010757446289, "global_step": 317798, "epoch": 1891} {"train_loss": -11.527772903442383, "global_step": 317799, "epoch": 1891} {"train_loss": -12.321735382080078, "global_step": 317800, "epoch": 1891} {"train_loss": -12.10858154296875, "global_step": 317801, "epoch": 1891} {"train_loss": -11.83736801147461, "global_step": 317802, "epoch": 1891} {"train_loss": -12.207683563232422, "global_step": 317803, "epoch": 1891} {"train_loss": -12.425588607788086, "global_step": 317804, "epoch": 1891} {"train_loss": -12.229734420776367, "global_step": 317805, "epoch": 1891} {"train_loss": -11.991350173950195, "global_step": 317806, "epoch": 1891} {"train_loss": -11.007222175598145, "global_step": 317807, "epoch": 1891} {"train_loss": -10.289068222045898, "global_step": 317808, "epoch": 1891} {"train_loss": -12.009679794311523, "global_step": 317809, "epoch": 1891} {"train_loss": -11.859153747558594, "global_step": 317810, "epoch": 1891} {"train_loss": -11.812032699584961, "global_step": 317811, "epoch": 1891} {"train_loss": -11.510383605957031, "global_step": 317812, "epoch": 1891} {"train_loss": -12.106830596923828, "global_step": 317813, "epoch": 1891} {"train_loss": -11.667652130126953, "global_step": 317814, "epoch": 1891} {"train_loss": -12.20904541015625, "global_step": 317815, "epoch": 1891} {"train_loss": -11.770496368408203, "global_step": 317816, "epoch": 1891} {"train_loss": -11.906559944152832, "global_step": 317817, "epoch": 1891} {"train_loss": -11.33385944366455, "global_step": 317818, "epoch": 1891} {"train_loss": -11.718183517456055, "global_step": 317819, "epoch": 1891} {"train_loss": -11.747576713562012, "global_step": 317820, "epoch": 1891} {"train_loss": -12.131784439086914, "global_step": 317821, "epoch": 1891} {"train_loss": -11.252108573913574, "global_step": 317822, "epoch": 1891} {"train_loss": -11.005484580993652, "global_step": 317823, "epoch": 1891} {"train_loss": -11.712231636047363, "global_step": 317824, "epoch": 1891} {"train_loss": -11.179695129394531, "global_step": 317825, "epoch": 1891} {"train_loss": -11.774110794067383, "global_step": 317826, "epoch": 1891} {"train_loss": -11.349865913391113, "global_step": 317827, "epoch": 1891} {"train_loss": -11.562765121459961, "global_step": 317828, "epoch": 1891} {"train_loss": -10.752931594848633, "global_step": 317829, "epoch": 1891} {"train_loss": -9.757816314697266, "global_step": 317830, "epoch": 1891} {"train_loss": -11.278846740722656, "global_step": 317831, "epoch": 1891} {"train_loss": -9.642792701721191, "global_step": 317832, "epoch": 1891} {"train_loss": -11.821784973144531, "global_step": 317833, "epoch": 1891} {"train_loss": -10.29091739654541, "global_step": 317834, "epoch": 1891} {"train_loss": -10.615396499633789, "global_step": 317835, "epoch": 1891} {"train_loss": -10.990166664123535, "global_step": 317836, "epoch": 1891} {"train_loss": -10.40857982635498, "global_step": 317837, "epoch": 1891} {"train_loss": -11.13351821899414, "global_step": 317838, "epoch": 1891} {"train_loss": -10.938604354858398, "global_step": 317839, "epoch": 1891} {"train_loss": -11.76477336883545, "global_step": 317840, "epoch": 1891} {"train_loss": -10.494386672973633, "global_step": 317841, "epoch": 1891} {"train_loss": -11.399288177490234, "global_step": 317842, "epoch": 1891} {"train_loss": -10.244138717651367, "global_step": 317843, "epoch": 1891} {"train_loss": -11.087089538574219, "global_step": 317844, "epoch": 1891} {"train_loss": -10.277565002441406, "global_step": 317845, "epoch": 1891} {"train_loss": -10.985426902770996, "global_step": 317846, "epoch": 1891} {"train_loss": -10.612993240356445, "global_step": 317847, "epoch": 1891} {"train_loss": -10.236342430114746, "global_step": 317848, "epoch": 1891} {"train_loss": -11.295808792114258, "global_step": 317849, "epoch": 1891} {"train_loss": -11.04176139831543, "global_step": 317850, "epoch": 1891} {"train_loss": -11.957545280456543, "global_step": 317851, "epoch": 1891} {"train_loss": -11.267738342285156, "global_step": 317852, "epoch": 1891} {"train_loss": -11.918731689453125, "global_step": 317853, "epoch": 1891} {"train_loss": -11.530182838439941, "global_step": 317854, "epoch": 1891} {"train_loss": -11.737572125026158, "global_step": 317855, "epoch": 1891, "val_loss": 282630.84375} {"train_loss": -11.972831726074219, "global_step": 317856, "epoch": 1892} {"train_loss": -11.98919677734375, "global_step": 317857, "epoch": 1892} {"train_loss": -10.729814529418945, "global_step": 317858, "epoch": 1892} {"train_loss": -11.839970588684082, "global_step": 317859, "epoch": 1892} {"train_loss": -11.958680152893066, "global_step": 317860, "epoch": 1892} {"train_loss": -11.706045150756836, "global_step": 317861, "epoch": 1892} {"train_loss": -12.109061241149902, "global_step": 317862, "epoch": 1892} {"train_loss": -11.610040664672852, "global_step": 317863, "epoch": 1892} {"train_loss": -11.698081016540527, "global_step": 317864, "epoch": 1892} {"train_loss": -12.048006057739258, "global_step": 317865, "epoch": 1892} {"train_loss": -11.951153755187988, "global_step": 317866, "epoch": 1892} {"train_loss": -11.780548095703125, "global_step": 317867, "epoch": 1892} {"train_loss": -11.736703872680664, "global_step": 317868, "epoch": 1892} {"train_loss": -11.58283805847168, "global_step": 317869, "epoch": 1892} {"train_loss": -11.905075073242188, "global_step": 317870, "epoch": 1892} {"train_loss": -11.969335556030273, "global_step": 317871, "epoch": 1892} {"train_loss": -12.05805778503418, "global_step": 317872, "epoch": 1892} {"train_loss": -12.19716739654541, "global_step": 317873, "epoch": 1892} {"train_loss": -11.875490188598633, "global_step": 317874, "epoch": 1892} {"train_loss": -11.924196243286133, "global_step": 317875, "epoch": 1892} {"train_loss": -11.855206489562988, "global_step": 317876, "epoch": 1892} {"train_loss": -11.942461013793945, "global_step": 317877, "epoch": 1892} {"train_loss": -12.207358360290527, "global_step": 317878, "epoch": 1892} {"train_loss": -12.054956436157227, "global_step": 317879, "epoch": 1892} {"train_loss": -11.8916654586792, "global_step": 317880, "epoch": 1892} {"train_loss": -11.9754638671875, "global_step": 317881, "epoch": 1892} {"train_loss": -12.214874267578125, "global_step": 317882, "epoch": 1892} {"train_loss": -11.815906524658203, "global_step": 317883, "epoch": 1892} {"train_loss": -12.065855026245117, "global_step": 317884, "epoch": 1892} {"train_loss": -12.151105880737305, "global_step": 317885, "epoch": 1892} {"train_loss": -11.898862838745117, "global_step": 317886, "epoch": 1892} {"train_loss": -12.480779647827148, "global_step": 317887, "epoch": 1892} {"train_loss": -12.185089111328125, "global_step": 317888, "epoch": 1892} {"train_loss": -12.29205322265625, "global_step": 317889, "epoch": 1892} {"train_loss": -12.1328763961792, "global_step": 317890, "epoch": 1892} {"train_loss": -12.212837219238281, "global_step": 317891, "epoch": 1892} {"train_loss": -12.471391677856445, "global_step": 317892, "epoch": 1892} {"train_loss": -12.277417182922363, "global_step": 317893, "epoch": 1892} {"train_loss": -12.320343017578125, "global_step": 317894, "epoch": 1892} {"train_loss": -12.259864807128906, "global_step": 317895, "epoch": 1892} {"train_loss": -12.327051162719727, "global_step": 317896, "epoch": 1892} {"train_loss": -12.317756652832031, "global_step": 317897, "epoch": 1892} {"train_loss": -12.405964851379395, "global_step": 317898, "epoch": 1892} {"train_loss": -12.289670944213867, "global_step": 317899, "epoch": 1892} {"train_loss": -12.19729232788086, "global_step": 317900, "epoch": 1892} {"train_loss": -12.340188980102539, "global_step": 317901, "epoch": 1892} {"train_loss": -12.33785629272461, "global_step": 317902, "epoch": 1892} {"train_loss": -12.360897064208984, "global_step": 317903, "epoch": 1892} {"train_loss": -12.393438339233398, "global_step": 317904, "epoch": 1892} {"train_loss": -12.271735191345215, "global_step": 317905, "epoch": 1892} {"train_loss": -12.526033401489258, "global_step": 317906, "epoch": 1892} {"train_loss": -12.39108943939209, "global_step": 317907, "epoch": 1892} {"train_loss": -12.495216369628906, "global_step": 317908, "epoch": 1892} {"train_loss": -12.42452335357666, "global_step": 317909, "epoch": 1892} {"train_loss": -12.443414688110352, "global_step": 317910, "epoch": 1892} {"train_loss": -12.545965194702148, "global_step": 317911, "epoch": 1892} {"train_loss": -12.2849760055542, "global_step": 317912, "epoch": 1892} {"train_loss": -12.225752830505371, "global_step": 317913, "epoch": 1892} {"train_loss": -12.454399108886719, "global_step": 317914, "epoch": 1892} {"train_loss": -12.327077865600586, "global_step": 317915, "epoch": 1892} {"train_loss": -12.468441009521484, "global_step": 317916, "epoch": 1892} {"train_loss": -12.321817398071289, "global_step": 317917, "epoch": 1892} {"train_loss": -12.29318618774414, "global_step": 317918, "epoch": 1892} {"train_loss": -12.503885269165039, "global_step": 317919, "epoch": 1892} {"train_loss": -12.603013038635254, "global_step": 317920, "epoch": 1892} {"train_loss": -12.362031936645508, "global_step": 317921, "epoch": 1892} {"train_loss": -12.41122055053711, "global_step": 317922, "epoch": 1892} {"train_loss": -12.121542930603027, "global_step": 317923, "epoch": 1892} {"train_loss": -12.280535697937012, "global_step": 317924, "epoch": 1892} {"train_loss": -12.25738525390625, "global_step": 317925, "epoch": 1892} {"train_loss": -12.242463111877441, "global_step": 317926, "epoch": 1892} {"train_loss": -12.201644897460938, "global_step": 317927, "epoch": 1892} {"train_loss": -12.732492446899414, "global_step": 317928, "epoch": 1892} {"train_loss": -11.935342788696289, "global_step": 317929, "epoch": 1892} {"train_loss": -12.184297561645508, "global_step": 317930, "epoch": 1892} {"train_loss": -12.332404136657715, "global_step": 317931, "epoch": 1892} {"train_loss": -12.1688871383667, "global_step": 317932, "epoch": 1892} {"train_loss": -12.078031539916992, "global_step": 317933, "epoch": 1892} {"train_loss": -12.229130744934082, "global_step": 317934, "epoch": 1892} {"train_loss": -12.1280517578125, "global_step": 317935, "epoch": 1892} {"train_loss": -12.013968467712402, "global_step": 317936, "epoch": 1892} {"train_loss": -11.428228378295898, "global_step": 317937, "epoch": 1892} {"train_loss": -11.553937911987305, "global_step": 317938, "epoch": 1892} {"train_loss": -12.037680625915527, "global_step": 317939, "epoch": 1892} {"train_loss": -10.903219223022461, "global_step": 317940, "epoch": 1892} {"train_loss": -10.744892120361328, "global_step": 317941, "epoch": 1892} {"train_loss": -10.951410293579102, "global_step": 317942, "epoch": 1892} {"train_loss": -9.134238243103027, "global_step": 317943, "epoch": 1892} {"train_loss": -9.2704496383667, "global_step": 317944, "epoch": 1892} {"train_loss": -10.048213958740234, "global_step": 317945, "epoch": 1892} {"train_loss": -8.079345703125, "global_step": 317946, "epoch": 1892} {"train_loss": -10.857648849487305, "global_step": 317947, "epoch": 1892} {"train_loss": -9.375298500061035, "global_step": 317948, "epoch": 1892} {"train_loss": -10.173479080200195, "global_step": 317949, "epoch": 1892} {"train_loss": -11.60157585144043, "global_step": 317950, "epoch": 1892} {"train_loss": -9.46141242980957, "global_step": 317951, "epoch": 1892} {"train_loss": -11.688989639282227, "global_step": 317952, "epoch": 1892} {"train_loss": -9.977490425109863, "global_step": 317953, "epoch": 1892} {"train_loss": -10.162155151367188, "global_step": 317954, "epoch": 1892} {"train_loss": -10.122258186340332, "global_step": 317955, "epoch": 1892} {"train_loss": -10.289528846740723, "global_step": 317956, "epoch": 1892} {"train_loss": -10.393753051757812, "global_step": 317957, "epoch": 1892} {"train_loss": -11.374923706054688, "global_step": 317958, "epoch": 1892} {"train_loss": -10.309548377990723, "global_step": 317959, "epoch": 1892} {"train_loss": -10.213038444519043, "global_step": 317960, "epoch": 1892} {"train_loss": -11.748075485229492, "global_step": 317961, "epoch": 1892} {"train_loss": -10.113572120666504, "global_step": 317962, "epoch": 1892} {"train_loss": -11.582121849060059, "global_step": 317963, "epoch": 1892} {"train_loss": -10.44662857055664, "global_step": 317964, "epoch": 1892} {"train_loss": -11.396970748901367, "global_step": 317965, "epoch": 1892} {"train_loss": -11.34427547454834, "global_step": 317966, "epoch": 1892} {"train_loss": -11.305367469787598, "global_step": 317967, "epoch": 1892} {"train_loss": -11.525879859924316, "global_step": 317968, "epoch": 1892} {"train_loss": -11.049137115478516, "global_step": 317969, "epoch": 1892} {"train_loss": -11.353958129882812, "global_step": 317970, "epoch": 1892} {"train_loss": -11.543230056762695, "global_step": 317971, "epoch": 1892} {"train_loss": -11.571403503417969, "global_step": 317972, "epoch": 1892} {"train_loss": -11.904662132263184, "global_step": 317973, "epoch": 1892} {"train_loss": -11.605134963989258, "global_step": 317974, "epoch": 1892} {"train_loss": -11.545778274536133, "global_step": 317975, "epoch": 1892} {"train_loss": -11.795119285583496, "global_step": 317976, "epoch": 1892} {"train_loss": -11.36683177947998, "global_step": 317977, "epoch": 1892} {"train_loss": -12.095436096191406, "global_step": 317978, "epoch": 1892} {"train_loss": -11.505447387695312, "global_step": 317979, "epoch": 1892} {"train_loss": -11.956866264343262, "global_step": 317980, "epoch": 1892} {"train_loss": -11.437023162841797, "global_step": 317981, "epoch": 1892} {"train_loss": -11.83517837524414, "global_step": 317982, "epoch": 1892} {"train_loss": -11.524419784545898, "global_step": 317983, "epoch": 1892} {"train_loss": -11.777631759643555, "global_step": 317984, "epoch": 1892} {"train_loss": -11.873278617858887, "global_step": 317985, "epoch": 1892} {"train_loss": -11.903106689453125, "global_step": 317986, "epoch": 1892} {"train_loss": -11.616922378540039, "global_step": 317987, "epoch": 1892} {"train_loss": -11.886112213134766, "global_step": 317988, "epoch": 1892} {"train_loss": -11.684835433959961, "global_step": 317989, "epoch": 1892} {"train_loss": -11.861207962036133, "global_step": 317990, "epoch": 1892} {"train_loss": -11.72016716003418, "global_step": 317991, "epoch": 1892} {"train_loss": -11.964462280273438, "global_step": 317992, "epoch": 1892} {"train_loss": -11.925304412841797, "global_step": 317993, "epoch": 1892} {"train_loss": -11.743196487426758, "global_step": 317994, "epoch": 1892} {"train_loss": -12.137322425842285, "global_step": 317995, "epoch": 1892} {"train_loss": -12.146942138671875, "global_step": 317996, "epoch": 1892} {"train_loss": -11.882569313049316, "global_step": 317997, "epoch": 1892} {"train_loss": -12.041400909423828, "global_step": 317998, "epoch": 1892} {"train_loss": -12.11125373840332, "global_step": 317999, "epoch": 1892} {"train_loss": -12.129623413085938, "global_step": 318000, "epoch": 1892} {"train_loss": -12.20543384552002, "global_step": 318001, "epoch": 1892} {"train_loss": -12.159199714660645, "global_step": 318002, "epoch": 1892} {"train_loss": -12.2522611618042, "global_step": 318003, "epoch": 1892} {"train_loss": -12.252634048461914, "global_step": 318004, "epoch": 1892} {"train_loss": -12.348396301269531, "global_step": 318005, "epoch": 1892} {"train_loss": -12.241584777832031, "global_step": 318006, "epoch": 1892} {"train_loss": -12.306570053100586, "global_step": 318007, "epoch": 1892} {"train_loss": -12.349635124206543, "global_step": 318008, "epoch": 1892} {"train_loss": -12.041831970214844, "global_step": 318009, "epoch": 1892} {"train_loss": -12.268857955932617, "global_step": 318010, "epoch": 1892} {"train_loss": -12.39552116394043, "global_step": 318011, "epoch": 1892} {"train_loss": -12.274162292480469, "global_step": 318012, "epoch": 1892} {"train_loss": -12.349126815795898, "global_step": 318013, "epoch": 1892} {"train_loss": -12.291435241699219, "global_step": 318014, "epoch": 1892} {"train_loss": -12.306740760803223, "global_step": 318015, "epoch": 1892} {"train_loss": -12.370079040527344, "global_step": 318016, "epoch": 1892} {"train_loss": -12.536890029907227, "global_step": 318017, "epoch": 1892} {"train_loss": -12.462482452392578, "global_step": 318018, "epoch": 1892} {"train_loss": -12.417251586914062, "global_step": 318019, "epoch": 1892} {"train_loss": -12.183789253234863, "global_step": 318020, "epoch": 1892} {"train_loss": -12.402042388916016, "global_step": 318021, "epoch": 1892} {"train_loss": -12.411211013793945, "global_step": 318022, "epoch": 1892} {"train_loss": -11.809492230415344, "global_step": 318023, "epoch": 1892, "val_loss": 284557.40625} {"train_loss": -12.351716995239258, "global_step": 318024, "epoch": 1893} {"train_loss": -12.456592559814453, "global_step": 318025, "epoch": 1893} {"train_loss": -12.277774810791016, "global_step": 318026, "epoch": 1893} {"train_loss": -12.1334867477417, "global_step": 318027, "epoch": 1893} {"train_loss": -12.290238380432129, "global_step": 318028, "epoch": 1893} {"train_loss": -12.367979049682617, "global_step": 318029, "epoch": 1893} {"train_loss": -12.311576843261719, "global_step": 318030, "epoch": 1893} {"train_loss": -12.23322868347168, "global_step": 318031, "epoch": 1893} {"train_loss": -12.448480606079102, "global_step": 318032, "epoch": 1893} {"train_loss": -12.396284103393555, "global_step": 318033, "epoch": 1893} {"train_loss": -12.515822410583496, "global_step": 318034, "epoch": 1893} {"train_loss": -12.325554847717285, "global_step": 318035, "epoch": 1893} {"train_loss": -12.339856147766113, "global_step": 318036, "epoch": 1893} {"train_loss": -12.436144828796387, "global_step": 318037, "epoch": 1893} {"train_loss": -12.438091278076172, "global_step": 318038, "epoch": 1893} {"train_loss": -12.38758659362793, "global_step": 318039, "epoch": 1893} {"train_loss": -12.684281349182129, "global_step": 318040, "epoch": 1893} {"train_loss": -12.567638397216797, "global_step": 318041, "epoch": 1893} {"train_loss": -12.634203910827637, "global_step": 318042, "epoch": 1893} {"train_loss": -12.449602127075195, "global_step": 318043, "epoch": 1893} {"train_loss": -12.329490661621094, "global_step": 318044, "epoch": 1893} {"train_loss": -12.503786087036133, "global_step": 318045, "epoch": 1893} {"train_loss": -12.338984489440918, "global_step": 318046, "epoch": 1893} {"train_loss": -12.559266090393066, "global_step": 318047, "epoch": 1893} {"train_loss": -12.630393981933594, "global_step": 318048, "epoch": 1893} {"train_loss": -12.682910919189453, "global_step": 318049, "epoch": 1893} {"train_loss": -12.549699783325195, "global_step": 318050, "epoch": 1893} {"train_loss": -12.574377059936523, "global_step": 318051, "epoch": 1893} {"train_loss": -12.682668685913086, "global_step": 318052, "epoch": 1893} {"train_loss": -12.503164291381836, "global_step": 318053, "epoch": 1893} {"train_loss": -12.633994102478027, "global_step": 318054, "epoch": 1893} {"train_loss": -12.454288482666016, "global_step": 318055, "epoch": 1893} {"train_loss": -12.60665225982666, "global_step": 318056, "epoch": 1893} {"train_loss": -12.45755386352539, "global_step": 318057, "epoch": 1893} {"train_loss": -12.286383628845215, "global_step": 318058, "epoch": 1893} {"train_loss": -12.478418350219727, "global_step": 318059, "epoch": 1893} {"train_loss": -12.364274978637695, "global_step": 318060, "epoch": 1893} {"train_loss": -11.913244247436523, "global_step": 318061, "epoch": 1893} {"train_loss": -11.736315727233887, "global_step": 318062, "epoch": 1893} {"train_loss": -11.949312210083008, "global_step": 318063, "epoch": 1893} {"train_loss": -12.387325286865234, "global_step": 318064, "epoch": 1893} {"train_loss": -11.763766288757324, "global_step": 318065, "epoch": 1893} {"train_loss": -10.827887535095215, "global_step": 318066, "epoch": 1893} {"train_loss": -11.161846160888672, "global_step": 318067, "epoch": 1893} {"train_loss": -12.256080627441406, "global_step": 318068, "epoch": 1893} {"train_loss": -11.535521507263184, "global_step": 318069, "epoch": 1893} {"train_loss": -11.034758567810059, "global_step": 318070, "epoch": 1893} {"train_loss": -12.274642944335938, "global_step": 318071, "epoch": 1893} {"train_loss": -9.74135684967041, "global_step": 318072, "epoch": 1893} {"train_loss": -10.293142318725586, "global_step": 318073, "epoch": 1893} {"train_loss": -12.09354305267334, "global_step": 318074, "epoch": 1893} {"train_loss": -10.588608741760254, "global_step": 318075, "epoch": 1893} {"train_loss": -11.275310516357422, "global_step": 318076, "epoch": 1893} {"train_loss": -12.061369895935059, "global_step": 318077, "epoch": 1893} {"train_loss": -9.811407089233398, "global_step": 318078, "epoch": 1893} {"train_loss": -11.243478775024414, "global_step": 318079, "epoch": 1893} {"train_loss": -11.82246208190918, "global_step": 318080, "epoch": 1893} {"train_loss": -10.928672790527344, "global_step": 318081, "epoch": 1893} {"train_loss": -11.576684951782227, "global_step": 318082, "epoch": 1893} {"train_loss": -11.988547325134277, "global_step": 318083, "epoch": 1893} {"train_loss": -11.875272750854492, "global_step": 318084, "epoch": 1893} {"train_loss": -11.871950149536133, "global_step": 318085, "epoch": 1893} {"train_loss": -11.888046264648438, "global_step": 318086, "epoch": 1893} {"train_loss": -11.867619514465332, "global_step": 318087, "epoch": 1893} {"train_loss": -11.734525680541992, "global_step": 318088, "epoch": 1893} {"train_loss": -11.997922897338867, "global_step": 318089, "epoch": 1893} {"train_loss": -11.80489730834961, "global_step": 318090, "epoch": 1893} {"train_loss": -12.100885391235352, "global_step": 318091, "epoch": 1893} {"train_loss": -11.974309921264648, "global_step": 318092, "epoch": 1893} {"train_loss": -11.535350799560547, "global_step": 318093, "epoch": 1893} {"train_loss": -11.951372146606445, "global_step": 318094, "epoch": 1893} {"train_loss": -11.281022071838379, "global_step": 318095, "epoch": 1893} {"train_loss": -11.229769706726074, "global_step": 318096, "epoch": 1893} {"train_loss": -11.508467674255371, "global_step": 318097, "epoch": 1893} {"train_loss": -12.196792602539062, "global_step": 318098, "epoch": 1893} {"train_loss": -11.525190353393555, "global_step": 318099, "epoch": 1893} {"train_loss": -11.713700294494629, "global_step": 318100, "epoch": 1893} {"train_loss": -12.090824127197266, "global_step": 318101, "epoch": 1893} {"train_loss": -11.874361038208008, "global_step": 318102, "epoch": 1893} {"train_loss": -12.153454780578613, "global_step": 318103, "epoch": 1893} {"train_loss": -11.505537033081055, "global_step": 318104, "epoch": 1893} {"train_loss": -11.433830261230469, "global_step": 318105, "epoch": 1893} {"train_loss": -11.776540756225586, "global_step": 318106, "epoch": 1893} {"train_loss": -12.050487518310547, "global_step": 318107, "epoch": 1893} {"train_loss": -11.656715393066406, "global_step": 318108, "epoch": 1893} {"train_loss": -12.214544296264648, "global_step": 318109, "epoch": 1893} {"train_loss": -11.438003540039062, "global_step": 318110, "epoch": 1893} {"train_loss": -12.098275184631348, "global_step": 318111, "epoch": 1893} {"train_loss": -11.878438949584961, "global_step": 318112, "epoch": 1893} {"train_loss": -11.592403411865234, "global_step": 318113, "epoch": 1893} {"train_loss": -11.944400787353516, "global_step": 318114, "epoch": 1893} {"train_loss": -11.494853973388672, "global_step": 318115, "epoch": 1893} {"train_loss": -12.045760154724121, "global_step": 318116, "epoch": 1893} {"train_loss": -11.9207124710083, "global_step": 318117, "epoch": 1893} {"train_loss": -12.03665542602539, "global_step": 318118, "epoch": 1893} {"train_loss": -11.733147621154785, "global_step": 318119, "epoch": 1893} {"train_loss": -11.947296142578125, "global_step": 318120, "epoch": 1893} {"train_loss": -11.826143264770508, "global_step": 318121, "epoch": 1893} {"train_loss": -11.363149642944336, "global_step": 318122, "epoch": 1893} {"train_loss": -11.95638656616211, "global_step": 318123, "epoch": 1893} {"train_loss": -11.223966598510742, "global_step": 318124, "epoch": 1893} {"train_loss": -11.800273895263672, "global_step": 318125, "epoch": 1893} {"train_loss": -10.812345504760742, "global_step": 318126, "epoch": 1893} {"train_loss": -11.883941650390625, "global_step": 318127, "epoch": 1893} {"train_loss": -11.420056343078613, "global_step": 318128, "epoch": 1893} {"train_loss": -11.231733322143555, "global_step": 318129, "epoch": 1893} {"train_loss": -11.611732482910156, "global_step": 318130, "epoch": 1893} {"train_loss": -10.746442794799805, "global_step": 318131, "epoch": 1893} {"train_loss": -11.585296630859375, "global_step": 318132, "epoch": 1893} {"train_loss": -11.481093406677246, "global_step": 318133, "epoch": 1893} {"train_loss": -12.156524658203125, "global_step": 318134, "epoch": 1893} {"train_loss": -11.988945960998535, "global_step": 318135, "epoch": 1893} {"train_loss": -11.99543285369873, "global_step": 318136, "epoch": 1893} {"train_loss": -11.669795989990234, "global_step": 318137, "epoch": 1893} {"train_loss": -12.012460708618164, "global_step": 318138, "epoch": 1893} {"train_loss": -12.144613265991211, "global_step": 318139, "epoch": 1893} {"train_loss": -12.287454605102539, "global_step": 318140, "epoch": 1893} {"train_loss": -11.957067489624023, "global_step": 318141, "epoch": 1893} {"train_loss": -12.187126159667969, "global_step": 318142, "epoch": 1893} {"train_loss": -12.2322359085083, "global_step": 318143, "epoch": 1893} {"train_loss": -12.08043384552002, "global_step": 318144, "epoch": 1893} {"train_loss": -12.095925331115723, "global_step": 318145, "epoch": 1893} {"train_loss": -12.147224426269531, "global_step": 318146, "epoch": 1893} {"train_loss": -12.302605628967285, "global_step": 318147, "epoch": 1893} {"train_loss": -12.075379371643066, "global_step": 318148, "epoch": 1893} {"train_loss": -12.39823055267334, "global_step": 318149, "epoch": 1893} {"train_loss": -12.340313911437988, "global_step": 318150, "epoch": 1893} {"train_loss": -12.422893524169922, "global_step": 318151, "epoch": 1893} {"train_loss": -12.192144393920898, "global_step": 318152, "epoch": 1893} {"train_loss": -12.368063926696777, "global_step": 318153, "epoch": 1893} {"train_loss": -12.43515396118164, "global_step": 318154, "epoch": 1893} {"train_loss": -12.094757080078125, "global_step": 318155, "epoch": 1893} {"train_loss": -12.436630249023438, "global_step": 318156, "epoch": 1893} {"train_loss": -12.305085182189941, "global_step": 318157, "epoch": 1893} {"train_loss": -12.550675392150879, "global_step": 318158, "epoch": 1893} {"train_loss": -12.240734100341797, "global_step": 318159, "epoch": 1893} {"train_loss": -12.322649002075195, "global_step": 318160, "epoch": 1893} {"train_loss": -12.350855827331543, "global_step": 318161, "epoch": 1893} {"train_loss": -12.26863956451416, "global_step": 318162, "epoch": 1893} {"train_loss": -12.392389297485352, "global_step": 318163, "epoch": 1893} {"train_loss": -12.343879699707031, "global_step": 318164, "epoch": 1893} {"train_loss": -12.394721031188965, "global_step": 318165, "epoch": 1893} {"train_loss": -12.268194198608398, "global_step": 318166, "epoch": 1893} {"train_loss": -12.484156608581543, "global_step": 318167, "epoch": 1893} {"train_loss": -12.408428192138672, "global_step": 318168, "epoch": 1893} {"train_loss": -12.538331031799316, "global_step": 318169, "epoch": 1893} {"train_loss": -12.19278335571289, "global_step": 318170, "epoch": 1893} {"train_loss": -12.28994369506836, "global_step": 318171, "epoch": 1893} {"train_loss": -12.24925708770752, "global_step": 318172, "epoch": 1893} {"train_loss": -12.182601928710938, "global_step": 318173, "epoch": 1893} {"train_loss": -12.198955535888672, "global_step": 318174, "epoch": 1893} {"train_loss": -11.675987243652344, "global_step": 318175, "epoch": 1893} {"train_loss": -11.637353897094727, "global_step": 318176, "epoch": 1893} {"train_loss": -11.560895919799805, "global_step": 318177, "epoch": 1893} {"train_loss": -11.611161231994629, "global_step": 318178, "epoch": 1893} {"train_loss": -11.728549003601074, "global_step": 318179, "epoch": 1893} {"train_loss": -11.589211463928223, "global_step": 318180, "epoch": 1893} {"train_loss": -11.705240249633789, "global_step": 318181, "epoch": 1893} {"train_loss": -11.87211799621582, "global_step": 318182, "epoch": 1893} {"train_loss": -11.896345138549805, "global_step": 318183, "epoch": 1893} {"train_loss": -11.791585922241211, "global_step": 318184, "epoch": 1893} {"train_loss": -11.544939041137695, "global_step": 318185, "epoch": 1893} {"train_loss": -11.26695728302002, "global_step": 318186, "epoch": 1893} {"train_loss": -11.628636360168457, "global_step": 318187, "epoch": 1893} {"train_loss": -11.364380836486816, "global_step": 318188, "epoch": 1893} {"train_loss": -11.906966209411621, "global_step": 318189, "epoch": 1893} {"train_loss": -10.806459426879883, "global_step": 318190, "epoch": 1893} {"train_loss": -11.950558565911793, "global_step": 318191, "epoch": 1893, "val_loss": 283786.0625} {"train_loss": -11.173444747924805, "global_step": 318192, "epoch": 1894} {"train_loss": -11.287562370300293, "global_step": 318193, "epoch": 1894} {"train_loss": -11.48216438293457, "global_step": 318194, "epoch": 1894} {"train_loss": -11.219043731689453, "global_step": 318195, "epoch": 1894} {"train_loss": -11.47736644744873, "global_step": 318196, "epoch": 1894} {"train_loss": -11.069731712341309, "global_step": 318197, "epoch": 1894} {"train_loss": -11.064830780029297, "global_step": 318198, "epoch": 1894} {"train_loss": -11.34390926361084, "global_step": 318199, "epoch": 1894} {"train_loss": -10.809392929077148, "global_step": 318200, "epoch": 1894} {"train_loss": -10.834259986877441, "global_step": 318201, "epoch": 1894} {"train_loss": -11.535432815551758, "global_step": 318202, "epoch": 1894} {"train_loss": -10.889152526855469, "global_step": 318203, "epoch": 1894} {"train_loss": -11.593045234680176, "global_step": 318204, "epoch": 1894} {"train_loss": -11.137499809265137, "global_step": 318205, "epoch": 1894} {"train_loss": -11.638378143310547, "global_step": 318206, "epoch": 1894} {"train_loss": -10.732034683227539, "global_step": 318207, "epoch": 1894} {"train_loss": -11.745899200439453, "global_step": 318208, "epoch": 1894} {"train_loss": -11.606990814208984, "global_step": 318209, "epoch": 1894} {"train_loss": -11.665678024291992, "global_step": 318210, "epoch": 1894} {"train_loss": -11.569708824157715, "global_step": 318211, "epoch": 1894} {"train_loss": -11.44063949584961, "global_step": 318212, "epoch": 1894} {"train_loss": -11.852262496948242, "global_step": 318213, "epoch": 1894} {"train_loss": -11.742277145385742, "global_step": 318214, "epoch": 1894} {"train_loss": -11.741802215576172, "global_step": 318215, "epoch": 1894} {"train_loss": -11.608429908752441, "global_step": 318216, "epoch": 1894} {"train_loss": -11.848407745361328, "global_step": 318217, "epoch": 1894} {"train_loss": -11.472955703735352, "global_step": 318218, "epoch": 1894} {"train_loss": -12.228477478027344, "global_step": 318219, "epoch": 1894} {"train_loss": -11.623967170715332, "global_step": 318220, "epoch": 1894} {"train_loss": -12.011857986450195, "global_step": 318221, "epoch": 1894} {"train_loss": -12.000846862792969, "global_step": 318222, "epoch": 1894} {"train_loss": -11.848859786987305, "global_step": 318223, "epoch": 1894} {"train_loss": -12.26999282836914, "global_step": 318224, "epoch": 1894} {"train_loss": -11.67156982421875, "global_step": 318225, "epoch": 1894} {"train_loss": -11.867402076721191, "global_step": 318226, "epoch": 1894} {"train_loss": -11.803642272949219, "global_step": 318227, "epoch": 1894} {"train_loss": -11.807846069335938, "global_step": 318228, "epoch": 1894} {"train_loss": -12.011529922485352, "global_step": 318229, "epoch": 1894} {"train_loss": -11.762223243713379, "global_step": 318230, "epoch": 1894} {"train_loss": -12.221625328063965, "global_step": 318231, "epoch": 1894} {"train_loss": -11.620421409606934, "global_step": 318232, "epoch": 1894} {"train_loss": -12.22686767578125, "global_step": 318233, "epoch": 1894} {"train_loss": -11.997947692871094, "global_step": 318234, "epoch": 1894} {"train_loss": -11.720453262329102, "global_step": 318235, "epoch": 1894} {"train_loss": -12.206443786621094, "global_step": 318236, "epoch": 1894} {"train_loss": -11.761030197143555, "global_step": 318237, "epoch": 1894} {"train_loss": -12.127777099609375, "global_step": 318238, "epoch": 1894} {"train_loss": -12.099669456481934, "global_step": 318239, "epoch": 1894} {"train_loss": -12.041166305541992, "global_step": 318240, "epoch": 1894} {"train_loss": -12.376794815063477, "global_step": 318241, "epoch": 1894} {"train_loss": -12.172294616699219, "global_step": 318242, "epoch": 1894} {"train_loss": -12.200461387634277, "global_step": 318243, "epoch": 1894} {"train_loss": -11.812845230102539, "global_step": 318244, "epoch": 1894} {"train_loss": -12.058979034423828, "global_step": 318245, "epoch": 1894} {"train_loss": -12.137609481811523, "global_step": 318246, "epoch": 1894} {"train_loss": -12.03841781616211, "global_step": 318247, "epoch": 1894} {"train_loss": -12.117347717285156, "global_step": 318248, "epoch": 1894} {"train_loss": -11.99775505065918, "global_step": 318249, "epoch": 1894} {"train_loss": -12.023802757263184, "global_step": 318250, "epoch": 1894} {"train_loss": -11.980218887329102, "global_step": 318251, "epoch": 1894} {"train_loss": -11.736200332641602, "global_step": 318252, "epoch": 1894} {"train_loss": -12.138421058654785, "global_step": 318253, "epoch": 1894} {"train_loss": -12.099130630493164, "global_step": 318254, "epoch": 1894} {"train_loss": -11.640110969543457, "global_step": 318255, "epoch": 1894} {"train_loss": -12.338916778564453, "global_step": 318256, "epoch": 1894} {"train_loss": -11.41604995727539, "global_step": 318257, "epoch": 1894} {"train_loss": -12.131004333496094, "global_step": 318258, "epoch": 1894} {"train_loss": -11.74676513671875, "global_step": 318259, "epoch": 1894} {"train_loss": -11.440101623535156, "global_step": 318260, "epoch": 1894} {"train_loss": -12.392887115478516, "global_step": 318261, "epoch": 1894} {"train_loss": -11.912853240966797, "global_step": 318262, "epoch": 1894} {"train_loss": -12.111190795898438, "global_step": 318263, "epoch": 1894} {"train_loss": -12.101753234863281, "global_step": 318264, "epoch": 1894} {"train_loss": -12.103128433227539, "global_step": 318265, "epoch": 1894} {"train_loss": -12.00711727142334, "global_step": 318266, "epoch": 1894} {"train_loss": -12.28231143951416, "global_step": 318267, "epoch": 1894} {"train_loss": -12.180769920349121, "global_step": 318268, "epoch": 1894} {"train_loss": -12.218232154846191, "global_step": 318269, "epoch": 1894} {"train_loss": -12.265456199645996, "global_step": 318270, "epoch": 1894} {"train_loss": -12.18452262878418, "global_step": 318271, "epoch": 1894} {"train_loss": -12.498661041259766, "global_step": 318272, "epoch": 1894} {"train_loss": -11.935680389404297, "global_step": 318273, "epoch": 1894} {"train_loss": -12.322237014770508, "global_step": 318274, "epoch": 1894} {"train_loss": -12.021974563598633, "global_step": 318275, "epoch": 1894} {"train_loss": -12.287220001220703, "global_step": 318276, "epoch": 1894} {"train_loss": -12.474189758300781, "global_step": 318277, "epoch": 1894} {"train_loss": -12.403339385986328, "global_step": 318278, "epoch": 1894} {"train_loss": -12.38076114654541, "global_step": 318279, "epoch": 1894} {"train_loss": -12.42772388458252, "global_step": 318280, "epoch": 1894} {"train_loss": -12.525918960571289, "global_step": 318281, "epoch": 1894} {"train_loss": -12.46810531616211, "global_step": 318282, "epoch": 1894} {"train_loss": -12.51800537109375, "global_step": 318283, "epoch": 1894} {"train_loss": -12.249551773071289, "global_step": 318284, "epoch": 1894} {"train_loss": -12.45875358581543, "global_step": 318285, "epoch": 1894} {"train_loss": -12.335962295532227, "global_step": 318286, "epoch": 1894} {"train_loss": -12.232993125915527, "global_step": 318287, "epoch": 1894} {"train_loss": -12.275505065917969, "global_step": 318288, "epoch": 1894} {"train_loss": -12.328865051269531, "global_step": 318289, "epoch": 1894} {"train_loss": -12.19516372680664, "global_step": 318290, "epoch": 1894} {"train_loss": -12.547073364257812, "global_step": 318291, "epoch": 1894} {"train_loss": -11.781808853149414, "global_step": 318292, "epoch": 1894} {"train_loss": -12.2531156539917, "global_step": 318293, "epoch": 1894} {"train_loss": -12.224189758300781, "global_step": 318294, "epoch": 1894} {"train_loss": -12.363714218139648, "global_step": 318295, "epoch": 1894} {"train_loss": -12.151986122131348, "global_step": 318296, "epoch": 1894} {"train_loss": -11.996694564819336, "global_step": 318297, "epoch": 1894} {"train_loss": -12.0526123046875, "global_step": 318298, "epoch": 1894} {"train_loss": -12.218250274658203, "global_step": 318299, "epoch": 1894} {"train_loss": -11.592901229858398, "global_step": 318300, "epoch": 1894} {"train_loss": -11.67248249053955, "global_step": 318301, "epoch": 1894} {"train_loss": -12.431482315063477, "global_step": 318302, "epoch": 1894} {"train_loss": -12.291873931884766, "global_step": 318303, "epoch": 1894} {"train_loss": -11.74481201171875, "global_step": 318304, "epoch": 1894} {"train_loss": -12.153038024902344, "global_step": 318305, "epoch": 1894} {"train_loss": -11.28689956665039, "global_step": 318306, "epoch": 1894} {"train_loss": -11.87270736694336, "global_step": 318307, "epoch": 1894} {"train_loss": -11.627594947814941, "global_step": 318308, "epoch": 1894} {"train_loss": -12.029112815856934, "global_step": 318309, "epoch": 1894} {"train_loss": -11.449450492858887, "global_step": 318310, "epoch": 1894} {"train_loss": -12.428864479064941, "global_step": 318311, "epoch": 1894} {"train_loss": -11.279693603515625, "global_step": 318312, "epoch": 1894} {"train_loss": -11.930964469909668, "global_step": 318313, "epoch": 1894} {"train_loss": -11.759757041931152, "global_step": 318314, "epoch": 1894} {"train_loss": -12.219278335571289, "global_step": 318315, "epoch": 1894} {"train_loss": -11.470159530639648, "global_step": 318316, "epoch": 1894} {"train_loss": -12.059652328491211, "global_step": 318317, "epoch": 1894} {"train_loss": -11.362519264221191, "global_step": 318318, "epoch": 1894} {"train_loss": -12.171451568603516, "global_step": 318319, "epoch": 1894} {"train_loss": -11.17481803894043, "global_step": 318320, "epoch": 1894} {"train_loss": -12.166473388671875, "global_step": 318321, "epoch": 1894} {"train_loss": -10.500448226928711, "global_step": 318322, "epoch": 1894} {"train_loss": -11.026092529296875, "global_step": 318323, "epoch": 1894} {"train_loss": -11.499959945678711, "global_step": 318324, "epoch": 1894} {"train_loss": -9.183156967163086, "global_step": 318325, "epoch": 1894} {"train_loss": -11.806564331054688, "global_step": 318326, "epoch": 1894} {"train_loss": -9.19009780883789, "global_step": 318327, "epoch": 1894} {"train_loss": -9.94045352935791, "global_step": 318328, "epoch": 1894} {"train_loss": -9.33818244934082, "global_step": 318329, "epoch": 1894} {"train_loss": -11.439854621887207, "global_step": 318330, "epoch": 1894} {"train_loss": -8.356252670288086, "global_step": 318331, "epoch": 1894} {"train_loss": -7.900023937225342, "global_step": 318332, "epoch": 1894} {"train_loss": -10.547950744628906, "global_step": 318333, "epoch": 1894} {"train_loss": -10.331421852111816, "global_step": 318334, "epoch": 1894} {"train_loss": -8.956741333007812, "global_step": 318335, "epoch": 1894} {"train_loss": -11.3931245803833, "global_step": 318336, "epoch": 1894} {"train_loss": -10.481120109558105, "global_step": 318337, "epoch": 1894} {"train_loss": -10.429788589477539, "global_step": 318338, "epoch": 1894} {"train_loss": -11.372879028320312, "global_step": 318339, "epoch": 1894} {"train_loss": -9.489266395568848, "global_step": 318340, "epoch": 1894} {"train_loss": -10.378328323364258, "global_step": 318341, "epoch": 1894} {"train_loss": -11.49334716796875, "global_step": 318342, "epoch": 1894} {"train_loss": -10.752799987792969, "global_step": 318343, "epoch": 1894} {"train_loss": -11.515421867370605, "global_step": 318344, "epoch": 1894} {"train_loss": -10.832635879516602, "global_step": 318345, "epoch": 1894} {"train_loss": -10.954561233520508, "global_step": 318346, "epoch": 1894} {"train_loss": -10.133341789245605, "global_step": 318347, "epoch": 1894} {"train_loss": -10.827974319458008, "global_step": 318348, "epoch": 1894} {"train_loss": -9.410028457641602, "global_step": 318349, "epoch": 1894} {"train_loss": -11.934586524963379, "global_step": 318350, "epoch": 1894} {"train_loss": -9.375749588012695, "global_step": 318351, "epoch": 1894} {"train_loss": -11.148941993713379, "global_step": 318352, "epoch": 1894} {"train_loss": -11.069986343383789, "global_step": 318353, "epoch": 1894} {"train_loss": -10.201370239257812, "global_step": 318354, "epoch": 1894} {"train_loss": -11.223197937011719, "global_step": 318355, "epoch": 1894} {"train_loss": -10.774667739868164, "global_step": 318356, "epoch": 1894} {"train_loss": -11.034257888793945, "global_step": 318357, "epoch": 1894} {"train_loss": -10.144808769226074, "global_step": 318358, "epoch": 1894} {"train_loss": -11.58420884893054, "global_step": 318359, "epoch": 1894, "val_loss": 273815.3125} {"train_loss": -10.327045440673828, "global_step": 318360, "epoch": 1895} {"train_loss": -11.69201946258545, "global_step": 318361, "epoch": 1895} {"train_loss": -11.202299118041992, "global_step": 318362, "epoch": 1895} {"train_loss": -10.958748817443848, "global_step": 318363, "epoch": 1895} {"train_loss": -11.243114471435547, "global_step": 318364, "epoch": 1895} {"train_loss": -11.251590728759766, "global_step": 318365, "epoch": 1895} {"train_loss": -11.515663146972656, "global_step": 318366, "epoch": 1895} {"train_loss": -11.200323104858398, "global_step": 318367, "epoch": 1895} {"train_loss": -11.779630661010742, "global_step": 318368, "epoch": 1895} {"train_loss": -11.416465759277344, "global_step": 318369, "epoch": 1895} {"train_loss": -11.32099437713623, "global_step": 318370, "epoch": 1895} {"train_loss": -11.736408233642578, "global_step": 318371, "epoch": 1895} {"train_loss": -11.461069107055664, "global_step": 318372, "epoch": 1895} {"train_loss": -11.686052322387695, "global_step": 318373, "epoch": 1895} {"train_loss": -11.773231506347656, "global_step": 318374, "epoch": 1895} {"train_loss": -11.194293022155762, "global_step": 318375, "epoch": 1895} {"train_loss": -11.739540100097656, "global_step": 318376, "epoch": 1895} {"train_loss": -10.967750549316406, "global_step": 318377, "epoch": 1895} {"train_loss": -12.003437042236328, "global_step": 318378, "epoch": 1895} {"train_loss": -11.034282684326172, "global_step": 318379, "epoch": 1895} {"train_loss": -11.626937866210938, "global_step": 318380, "epoch": 1895} {"train_loss": -11.381318092346191, "global_step": 318381, "epoch": 1895} {"train_loss": -11.315954208374023, "global_step": 318382, "epoch": 1895} {"train_loss": -11.94395637512207, "global_step": 318383, "epoch": 1895} {"train_loss": -11.664321899414062, "global_step": 318384, "epoch": 1895} {"train_loss": -11.943841934204102, "global_step": 318385, "epoch": 1895} {"train_loss": -11.657508850097656, "global_step": 318386, "epoch": 1895} {"train_loss": -11.639404296875, "global_step": 318387, "epoch": 1895} {"train_loss": -11.759325981140137, "global_step": 318388, "epoch": 1895} {"train_loss": -11.697826385498047, "global_step": 318389, "epoch": 1895} {"train_loss": -11.993152618408203, "global_step": 318390, "epoch": 1895} {"train_loss": -11.741317749023438, "global_step": 318391, "epoch": 1895} {"train_loss": -12.064334869384766, "global_step": 318392, "epoch": 1895} {"train_loss": -11.841533660888672, "global_step": 318393, "epoch": 1895} {"train_loss": -11.438583374023438, "global_step": 318394, "epoch": 1895} {"train_loss": -11.83525562286377, "global_step": 318395, "epoch": 1895} {"train_loss": -11.691661834716797, "global_step": 318396, "epoch": 1895} {"train_loss": -11.981505393981934, "global_step": 318397, "epoch": 1895} {"train_loss": -11.830012321472168, "global_step": 318398, "epoch": 1895} {"train_loss": -12.003809928894043, "global_step": 318399, "epoch": 1895} {"train_loss": -11.77443790435791, "global_step": 318400, "epoch": 1895} {"train_loss": -12.041162490844727, "global_step": 318401, "epoch": 1895} {"train_loss": -11.772369384765625, "global_step": 318402, "epoch": 1895} {"train_loss": -11.43812370300293, "global_step": 318403, "epoch": 1895} {"train_loss": -12.236330032348633, "global_step": 318404, "epoch": 1895} {"train_loss": -11.594779968261719, "global_step": 318405, "epoch": 1895} {"train_loss": -11.951836585998535, "global_step": 318406, "epoch": 1895} {"train_loss": -11.897005081176758, "global_step": 318407, "epoch": 1895} {"train_loss": -11.955774307250977, "global_step": 318408, "epoch": 1895} {"train_loss": -12.020605087280273, "global_step": 318409, "epoch": 1895} {"train_loss": -11.876795768737793, "global_step": 318410, "epoch": 1895} {"train_loss": -11.96865463256836, "global_step": 318411, "epoch": 1895} {"train_loss": -9.808443069458008, "global_step": 318412, "epoch": 1895} {"train_loss": -11.455362319946289, "global_step": 318413, "epoch": 1895} {"train_loss": -11.232568740844727, "global_step": 318414, "epoch": 1895} {"train_loss": -10.11632251739502, "global_step": 318415, "epoch": 1895} {"train_loss": -9.882925033569336, "global_step": 318416, "epoch": 1895} {"train_loss": -11.123414039611816, "global_step": 318417, "epoch": 1895} {"train_loss": -11.695737838745117, "global_step": 318418, "epoch": 1895} {"train_loss": -11.314801216125488, "global_step": 318419, "epoch": 1895} {"train_loss": -10.663431167602539, "global_step": 318420, "epoch": 1895} {"train_loss": -11.202363967895508, "global_step": 318421, "epoch": 1895} {"train_loss": -11.238458633422852, "global_step": 318422, "epoch": 1895} {"train_loss": -10.905523300170898, "global_step": 318423, "epoch": 1895} {"train_loss": -11.416662216186523, "global_step": 318424, "epoch": 1895} {"train_loss": -11.407432556152344, "global_step": 318425, "epoch": 1895} {"train_loss": -10.829231262207031, "global_step": 318426, "epoch": 1895} {"train_loss": -11.281824111938477, "global_step": 318427, "epoch": 1895} {"train_loss": -11.36241340637207, "global_step": 318428, "epoch": 1895} {"train_loss": -11.390728950500488, "global_step": 318429, "epoch": 1895} {"train_loss": -11.689229965209961, "global_step": 318430, "epoch": 1895} {"train_loss": -11.588808059692383, "global_step": 318431, "epoch": 1895} {"train_loss": -11.50963020324707, "global_step": 318432, "epoch": 1895} {"train_loss": -11.611324310302734, "global_step": 318433, "epoch": 1895} {"train_loss": -11.783600807189941, "global_step": 318434, "epoch": 1895} {"train_loss": -11.769986152648926, "global_step": 318435, "epoch": 1895} {"train_loss": -11.559308052062988, "global_step": 318436, "epoch": 1895} {"train_loss": -11.7918119430542, "global_step": 318437, "epoch": 1895} {"train_loss": -11.621192932128906, "global_step": 318438, "epoch": 1895} {"train_loss": -11.340472221374512, "global_step": 318439, "epoch": 1895} {"train_loss": -11.762918472290039, "global_step": 318440, "epoch": 1895} {"train_loss": -12.173145294189453, "global_step": 318441, "epoch": 1895} {"train_loss": -11.55013370513916, "global_step": 318442, "epoch": 1895} {"train_loss": -11.957433700561523, "global_step": 318443, "epoch": 1895} {"train_loss": -11.676332473754883, "global_step": 318444, "epoch": 1895} {"train_loss": -11.675247192382812, "global_step": 318445, "epoch": 1895} {"train_loss": -11.488739013671875, "global_step": 318446, "epoch": 1895} {"train_loss": -11.772418022155762, "global_step": 318447, "epoch": 1895} {"train_loss": -11.691360473632812, "global_step": 318448, "epoch": 1895} {"train_loss": -11.835067749023438, "global_step": 318449, "epoch": 1895} {"train_loss": -11.62580680847168, "global_step": 318450, "epoch": 1895} {"train_loss": -11.595232009887695, "global_step": 318451, "epoch": 1895} {"train_loss": -12.101593017578125, "global_step": 318452, "epoch": 1895} {"train_loss": -11.936891555786133, "global_step": 318453, "epoch": 1895} {"train_loss": -11.808566093444824, "global_step": 318454, "epoch": 1895} {"train_loss": -11.320253372192383, "global_step": 318455, "epoch": 1895} {"train_loss": -12.028509140014648, "global_step": 318456, "epoch": 1895} {"train_loss": -11.833106994628906, "global_step": 318457, "epoch": 1895} {"train_loss": -12.08518123626709, "global_step": 318458, "epoch": 1895} {"train_loss": -11.852601051330566, "global_step": 318459, "epoch": 1895} {"train_loss": -12.186025619506836, "global_step": 318460, "epoch": 1895} {"train_loss": -11.840065002441406, "global_step": 318461, "epoch": 1895} {"train_loss": -12.164478302001953, "global_step": 318462, "epoch": 1895} {"train_loss": -11.973844528198242, "global_step": 318463, "epoch": 1895} {"train_loss": -11.739533424377441, "global_step": 318464, "epoch": 1895} {"train_loss": -12.158193588256836, "global_step": 318465, "epoch": 1895} {"train_loss": -12.194451332092285, "global_step": 318466, "epoch": 1895} {"train_loss": -12.15340518951416, "global_step": 318467, "epoch": 1895} {"train_loss": -12.01361083984375, "global_step": 318468, "epoch": 1895} {"train_loss": -12.091226577758789, "global_step": 318469, "epoch": 1895} {"train_loss": -12.063546180725098, "global_step": 318470, "epoch": 1895} {"train_loss": -12.11980152130127, "global_step": 318471, "epoch": 1895} {"train_loss": -12.012690544128418, "global_step": 318472, "epoch": 1895} {"train_loss": -12.19143295288086, "global_step": 318473, "epoch": 1895} {"train_loss": -12.1309814453125, "global_step": 318474, "epoch": 1895} {"train_loss": -12.441625595092773, "global_step": 318475, "epoch": 1895} {"train_loss": -12.152351379394531, "global_step": 318476, "epoch": 1895} {"train_loss": -12.03205680847168, "global_step": 318477, "epoch": 1895} {"train_loss": -11.998002052307129, "global_step": 318478, "epoch": 1895} {"train_loss": -12.268621444702148, "global_step": 318479, "epoch": 1895} {"train_loss": -12.211549758911133, "global_step": 318480, "epoch": 1895} {"train_loss": -12.047883033752441, "global_step": 318481, "epoch": 1895} {"train_loss": -12.16461181640625, "global_step": 318482, "epoch": 1895} {"train_loss": -12.050606727600098, "global_step": 318483, "epoch": 1895} {"train_loss": -12.077596664428711, "global_step": 318484, "epoch": 1895} {"train_loss": -12.226696014404297, "global_step": 318485, "epoch": 1895} {"train_loss": -12.240290641784668, "global_step": 318486, "epoch": 1895} {"train_loss": -12.392682075500488, "global_step": 318487, "epoch": 1895} {"train_loss": -11.822503089904785, "global_step": 318488, "epoch": 1895} {"train_loss": -12.135231971740723, "global_step": 318489, "epoch": 1895} {"train_loss": -12.080525398254395, "global_step": 318490, "epoch": 1895} {"train_loss": -12.079902648925781, "global_step": 318491, "epoch": 1895} {"train_loss": -12.182908058166504, "global_step": 318492, "epoch": 1895} {"train_loss": -12.28786849975586, "global_step": 318493, "epoch": 1895} {"train_loss": -12.227945327758789, "global_step": 318494, "epoch": 1895} {"train_loss": -12.114818572998047, "global_step": 318495, "epoch": 1895} {"train_loss": -11.653548240661621, "global_step": 318496, "epoch": 1895} {"train_loss": -12.00725269317627, "global_step": 318497, "epoch": 1895} {"train_loss": -12.08962345123291, "global_step": 318498, "epoch": 1895} {"train_loss": -11.834033966064453, "global_step": 318499, "epoch": 1895} {"train_loss": -11.803497314453125, "global_step": 318500, "epoch": 1895} {"train_loss": -11.600957870483398, "global_step": 318501, "epoch": 1895} {"train_loss": -11.065814971923828, "global_step": 318502, "epoch": 1895} {"train_loss": -11.935182571411133, "global_step": 318503, "epoch": 1895} {"train_loss": -10.92384147644043, "global_step": 318504, "epoch": 1895} {"train_loss": -11.359935760498047, "global_step": 318505, "epoch": 1895} {"train_loss": -11.18271541595459, "global_step": 318506, "epoch": 1895} {"train_loss": -11.255985260009766, "global_step": 318507, "epoch": 1895} {"train_loss": -9.415578842163086, "global_step": 318508, "epoch": 1895} {"train_loss": -10.366758346557617, "global_step": 318509, "epoch": 1895} {"train_loss": -8.295254707336426, "global_step": 318510, "epoch": 1895} {"train_loss": -8.815298080444336, "global_step": 318511, "epoch": 1895} {"train_loss": -8.667777061462402, "global_step": 318512, "epoch": 1895} {"train_loss": -9.175621032714844, "global_step": 318513, "epoch": 1895} {"train_loss": -8.9240083694458, "global_step": 318514, "epoch": 1895} {"train_loss": -9.886602401733398, "global_step": 318515, "epoch": 1895} {"train_loss": -10.294363021850586, "global_step": 318516, "epoch": 1895} {"train_loss": -10.326776504516602, "global_step": 318517, "epoch": 1895} {"train_loss": -9.030467987060547, "global_step": 318518, "epoch": 1895} {"train_loss": -8.372722625732422, "global_step": 318519, "epoch": 1895} {"train_loss": -9.247960090637207, "global_step": 318520, "epoch": 1895} {"train_loss": -10.858931541442871, "global_step": 318521, "epoch": 1895} {"train_loss": -9.953134536743164, "global_step": 318522, "epoch": 1895} {"train_loss": -10.12900447845459, "global_step": 318523, "epoch": 1895} {"train_loss": -10.520380020141602, "global_step": 318524, "epoch": 1895} {"train_loss": -10.968957901000977, "global_step": 318525, "epoch": 1895} {"train_loss": -10.124822616577148, "global_step": 318526, "epoch": 1895} {"train_loss": -11.458228105590457, "global_step": 318527, "epoch": 1895, "val_loss": 284234.6875, "train_action_mse_error": 0.9074089527130127} {"train_loss": -10.994351387023926, "global_step": 318528, "epoch": 1896} {"train_loss": -10.294158935546875, "global_step": 318529, "epoch": 1896} {"train_loss": -11.532670021057129, "global_step": 318530, "epoch": 1896} {"train_loss": -10.160869598388672, "global_step": 318531, "epoch": 1896} {"train_loss": -10.960052490234375, "global_step": 318532, "epoch": 1896} {"train_loss": -11.65140151977539, "global_step": 318533, "epoch": 1896} {"train_loss": -11.315668106079102, "global_step": 318534, "epoch": 1896} {"train_loss": -11.08198356628418, "global_step": 318535, "epoch": 1896} {"train_loss": -11.756772994995117, "global_step": 318536, "epoch": 1896} {"train_loss": -10.985925674438477, "global_step": 318537, "epoch": 1896} {"train_loss": -11.904342651367188, "global_step": 318538, "epoch": 1896} {"train_loss": -11.639579772949219, "global_step": 318539, "epoch": 1896} {"train_loss": -11.814355850219727, "global_step": 318540, "epoch": 1896} {"train_loss": -11.982627868652344, "global_step": 318541, "epoch": 1896} {"train_loss": -11.962749481201172, "global_step": 318542, "epoch": 1896} {"train_loss": -11.980212211608887, "global_step": 318543, "epoch": 1896} {"train_loss": -12.016746520996094, "global_step": 318544, "epoch": 1896} {"train_loss": -11.95884895324707, "global_step": 318545, "epoch": 1896} {"train_loss": -11.83806324005127, "global_step": 318546, "epoch": 1896} {"train_loss": -12.024280548095703, "global_step": 318547, "epoch": 1896} {"train_loss": -11.897000312805176, "global_step": 318548, "epoch": 1896} {"train_loss": -12.173693656921387, "global_step": 318549, "epoch": 1896} {"train_loss": -11.862886428833008, "global_step": 318550, "epoch": 1896} {"train_loss": -11.977425575256348, "global_step": 318551, "epoch": 1896} {"train_loss": -11.708139419555664, "global_step": 318552, "epoch": 1896} {"train_loss": -12.211101531982422, "global_step": 318553, "epoch": 1896} {"train_loss": -11.660923957824707, "global_step": 318554, "epoch": 1896} {"train_loss": -11.898517608642578, "global_step": 318555, "epoch": 1896} {"train_loss": -11.891965866088867, "global_step": 318556, "epoch": 1896} {"train_loss": -11.972944259643555, "global_step": 318557, "epoch": 1896} {"train_loss": -11.91947078704834, "global_step": 318558, "epoch": 1896} {"train_loss": -11.919943809509277, "global_step": 318559, "epoch": 1896} {"train_loss": -11.418693542480469, "global_step": 318560, "epoch": 1896} {"train_loss": -11.85224723815918, "global_step": 318561, "epoch": 1896} {"train_loss": -11.595788955688477, "global_step": 318562, "epoch": 1896} {"train_loss": -12.197896957397461, "global_step": 318563, "epoch": 1896} {"train_loss": -11.655984878540039, "global_step": 318564, "epoch": 1896} {"train_loss": -11.96023941040039, "global_step": 318565, "epoch": 1896} {"train_loss": -11.89178466796875, "global_step": 318566, "epoch": 1896} {"train_loss": -12.097200393676758, "global_step": 318567, "epoch": 1896} {"train_loss": -12.046599388122559, "global_step": 318568, "epoch": 1896} {"train_loss": -11.906107902526855, "global_step": 318569, "epoch": 1896} {"train_loss": -12.303705215454102, "global_step": 318570, "epoch": 1896} {"train_loss": -11.922334671020508, "global_step": 318571, "epoch": 1896} {"train_loss": -12.204543113708496, "global_step": 318572, "epoch": 1896} {"train_loss": -12.127655029296875, "global_step": 318573, "epoch": 1896} {"train_loss": -11.971806526184082, "global_step": 318574, "epoch": 1896} {"train_loss": -12.120245933532715, "global_step": 318575, "epoch": 1896} {"train_loss": -12.160501480102539, "global_step": 318576, "epoch": 1896} {"train_loss": -12.235450744628906, "global_step": 318577, "epoch": 1896} {"train_loss": -12.160024642944336, "global_step": 318578, "epoch": 1896} {"train_loss": -12.421653747558594, "global_step": 318579, "epoch": 1896} {"train_loss": -12.140533447265625, "global_step": 318580, "epoch": 1896} {"train_loss": -12.172170639038086, "global_step": 318581, "epoch": 1896} {"train_loss": -12.44906997680664, "global_step": 318582, "epoch": 1896} {"train_loss": -12.247564315795898, "global_step": 318583, "epoch": 1896} {"train_loss": -12.411937713623047, "global_step": 318584, "epoch": 1896} {"train_loss": -12.190776824951172, "global_step": 318585, "epoch": 1896} {"train_loss": -12.446754455566406, "global_step": 318586, "epoch": 1896} {"train_loss": -12.249116897583008, "global_step": 318587, "epoch": 1896} {"train_loss": -12.122649192810059, "global_step": 318588, "epoch": 1896} {"train_loss": -12.365655899047852, "global_step": 318589, "epoch": 1896} {"train_loss": -12.318544387817383, "global_step": 318590, "epoch": 1896} {"train_loss": -12.234109878540039, "global_step": 318591, "epoch": 1896} {"train_loss": -12.35644817352295, "global_step": 318592, "epoch": 1896} {"train_loss": -12.480928421020508, "global_step": 318593, "epoch": 1896} {"train_loss": -11.976472854614258, "global_step": 318594, "epoch": 1896} {"train_loss": -12.492865562438965, "global_step": 318595, "epoch": 1896} {"train_loss": -12.298434257507324, "global_step": 318596, "epoch": 1896} {"train_loss": -12.320518493652344, "global_step": 318597, "epoch": 1896} {"train_loss": -12.35605239868164, "global_step": 318598, "epoch": 1896} {"train_loss": -12.224241256713867, "global_step": 318599, "epoch": 1896} {"train_loss": -12.346784591674805, "global_step": 318600, "epoch": 1896} {"train_loss": -12.331523895263672, "global_step": 318601, "epoch": 1896} {"train_loss": -12.549517631530762, "global_step": 318602, "epoch": 1896} {"train_loss": -12.246421813964844, "global_step": 318603, "epoch": 1896} {"train_loss": -12.195751190185547, "global_step": 318604, "epoch": 1896} {"train_loss": -12.458440780639648, "global_step": 318605, "epoch": 1896} {"train_loss": -12.231088638305664, "global_step": 318606, "epoch": 1896} {"train_loss": -12.647928237915039, "global_step": 318607, "epoch": 1896} {"train_loss": -12.012121200561523, "global_step": 318608, "epoch": 1896} {"train_loss": -12.420060157775879, "global_step": 318609, "epoch": 1896} {"train_loss": -12.450702667236328, "global_step": 318610, "epoch": 1896} {"train_loss": -12.379472732543945, "global_step": 318611, "epoch": 1896} {"train_loss": -12.333057403564453, "global_step": 318612, "epoch": 1896} {"train_loss": -11.799676895141602, "global_step": 318613, "epoch": 1896} {"train_loss": -12.325462341308594, "global_step": 318614, "epoch": 1896} {"train_loss": -12.03203010559082, "global_step": 318615, "epoch": 1896} {"train_loss": -11.814300537109375, "global_step": 318616, "epoch": 1896} {"train_loss": -12.37750244140625, "global_step": 318617, "epoch": 1896} {"train_loss": -11.949671745300293, "global_step": 318618, "epoch": 1896} {"train_loss": -11.475476264953613, "global_step": 318619, "epoch": 1896} {"train_loss": -11.943159103393555, "global_step": 318620, "epoch": 1896} {"train_loss": -12.375554084777832, "global_step": 318621, "epoch": 1896} {"train_loss": -11.90989875793457, "global_step": 318622, "epoch": 1896} {"train_loss": -12.072554588317871, "global_step": 318623, "epoch": 1896} {"train_loss": -11.719356536865234, "global_step": 318624, "epoch": 1896} {"train_loss": -10.489900588989258, "global_step": 318625, "epoch": 1896} {"train_loss": -12.257434844970703, "global_step": 318626, "epoch": 1896} {"train_loss": -11.101540565490723, "global_step": 318627, "epoch": 1896} {"train_loss": -11.43479061126709, "global_step": 318628, "epoch": 1896} {"train_loss": -10.877971649169922, "global_step": 318629, "epoch": 1896} {"train_loss": -11.997833251953125, "global_step": 318630, "epoch": 1896} {"train_loss": -10.770453453063965, "global_step": 318631, "epoch": 1896} {"train_loss": -11.395730018615723, "global_step": 318632, "epoch": 1896} {"train_loss": -12.125419616699219, "global_step": 318633, "epoch": 1896} {"train_loss": -12.111690521240234, "global_step": 318634, "epoch": 1896} {"train_loss": -11.852062225341797, "global_step": 318635, "epoch": 1896} {"train_loss": -12.171207427978516, "global_step": 318636, "epoch": 1896} {"train_loss": -11.91727066040039, "global_step": 318637, "epoch": 1896} {"train_loss": -12.140625, "global_step": 318638, "epoch": 1896} {"train_loss": -11.856117248535156, "global_step": 318639, "epoch": 1896} {"train_loss": -11.97824478149414, "global_step": 318640, "epoch": 1896} {"train_loss": -12.002069473266602, "global_step": 318641, "epoch": 1896} {"train_loss": -12.101888656616211, "global_step": 318642, "epoch": 1896} {"train_loss": -11.620437622070312, "global_step": 318643, "epoch": 1896} {"train_loss": -11.617301940917969, "global_step": 318644, "epoch": 1896} {"train_loss": -12.11181926727295, "global_step": 318645, "epoch": 1896} {"train_loss": -11.6153564453125, "global_step": 318646, "epoch": 1896} {"train_loss": -11.909887313842773, "global_step": 318647, "epoch": 1896} {"train_loss": -12.304023742675781, "global_step": 318648, "epoch": 1896} {"train_loss": -11.889071464538574, "global_step": 318649, "epoch": 1896} {"train_loss": -12.102285385131836, "global_step": 318650, "epoch": 1896} {"train_loss": -12.42595386505127, "global_step": 318651, "epoch": 1896} {"train_loss": -11.790787696838379, "global_step": 318652, "epoch": 1896} {"train_loss": -12.512160301208496, "global_step": 318653, "epoch": 1896} {"train_loss": -11.78055191040039, "global_step": 318654, "epoch": 1896} {"train_loss": -11.675596237182617, "global_step": 318655, "epoch": 1896} {"train_loss": -12.360437393188477, "global_step": 318656, "epoch": 1896} {"train_loss": -12.19366455078125, "global_step": 318657, "epoch": 1896} {"train_loss": -12.291704177856445, "global_step": 318658, "epoch": 1896} {"train_loss": -11.986127853393555, "global_step": 318659, "epoch": 1896} {"train_loss": -12.154074668884277, "global_step": 318660, "epoch": 1896} {"train_loss": -11.85299301147461, "global_step": 318661, "epoch": 1896} {"train_loss": -12.045392990112305, "global_step": 318662, "epoch": 1896} {"train_loss": -11.72731876373291, "global_step": 318663, "epoch": 1896} {"train_loss": -11.54589557647705, "global_step": 318664, "epoch": 1896} {"train_loss": -12.288789749145508, "global_step": 318665, "epoch": 1896} {"train_loss": -11.891386032104492, "global_step": 318666, "epoch": 1896} {"train_loss": -12.072752952575684, "global_step": 318667, "epoch": 1896} {"train_loss": -11.257290840148926, "global_step": 318668, "epoch": 1896} {"train_loss": -11.539374351501465, "global_step": 318669, "epoch": 1896} {"train_loss": -11.578636169433594, "global_step": 318670, "epoch": 1896} {"train_loss": -12.020591735839844, "global_step": 318671, "epoch": 1896} {"train_loss": -11.865386962890625, "global_step": 318672, "epoch": 1896} {"train_loss": -12.081302642822266, "global_step": 318673, "epoch": 1896} {"train_loss": -11.73214340209961, "global_step": 318674, "epoch": 1896} {"train_loss": -11.640241622924805, "global_step": 318675, "epoch": 1896} {"train_loss": -11.827709197998047, "global_step": 318676, "epoch": 1896} {"train_loss": -12.165678024291992, "global_step": 318677, "epoch": 1896} {"train_loss": -12.104070663452148, "global_step": 318678, "epoch": 1896} {"train_loss": -11.415363311767578, "global_step": 318679, "epoch": 1896} {"train_loss": -12.383993148803711, "global_step": 318680, "epoch": 1896} {"train_loss": -11.608816146850586, "global_step": 318681, "epoch": 1896} {"train_loss": -11.383907318115234, "global_step": 318682, "epoch": 1896} {"train_loss": -11.247041702270508, "global_step": 318683, "epoch": 1896} {"train_loss": -11.800342559814453, "global_step": 318684, "epoch": 1896} {"train_loss": -11.702659606933594, "global_step": 318685, "epoch": 1896} {"train_loss": -11.729555130004883, "global_step": 318686, "epoch": 1896} {"train_loss": -11.854066848754883, "global_step": 318687, "epoch": 1896} {"train_loss": -11.534107208251953, "global_step": 318688, "epoch": 1896} {"train_loss": -12.145923614501953, "global_step": 318689, "epoch": 1896} {"train_loss": -11.838964462280273, "global_step": 318690, "epoch": 1896} {"train_loss": -12.224976539611816, "global_step": 318691, "epoch": 1896} {"train_loss": -11.756580352783203, "global_step": 318692, "epoch": 1896} {"train_loss": -12.315279006958008, "global_step": 318693, "epoch": 1896} {"train_loss": -11.595128059387207, "global_step": 318694, "epoch": 1896} {"train_loss": -11.93009610970815, "global_step": 318695, "epoch": 1896, "val_loss": 285840.75} {"train_loss": -11.489426612854004, "global_step": 318696, "epoch": 1897} {"train_loss": -12.066744804382324, "global_step": 318697, "epoch": 1897} {"train_loss": -11.73967170715332, "global_step": 318698, "epoch": 1897} {"train_loss": -11.768390655517578, "global_step": 318699, "epoch": 1897} {"train_loss": -11.553890228271484, "global_step": 318700, "epoch": 1897} {"train_loss": -11.809076309204102, "global_step": 318701, "epoch": 1897} {"train_loss": -11.759058952331543, "global_step": 318702, "epoch": 1897} {"train_loss": -11.338508605957031, "global_step": 318703, "epoch": 1897} {"train_loss": -11.819141387939453, "global_step": 318704, "epoch": 1897} {"train_loss": -11.914407730102539, "global_step": 318705, "epoch": 1897} {"train_loss": -11.817462921142578, "global_step": 318706, "epoch": 1897} {"train_loss": -12.112526893615723, "global_step": 318707, "epoch": 1897} {"train_loss": -11.886348724365234, "global_step": 318708, "epoch": 1897} {"train_loss": -11.94662857055664, "global_step": 318709, "epoch": 1897} {"train_loss": -11.819865226745605, "global_step": 318710, "epoch": 1897} {"train_loss": -11.995699882507324, "global_step": 318711, "epoch": 1897} {"train_loss": -11.86733627319336, "global_step": 318712, "epoch": 1897} {"train_loss": -11.803295135498047, "global_step": 318713, "epoch": 1897} {"train_loss": -11.682088851928711, "global_step": 318714, "epoch": 1897} {"train_loss": -11.449773788452148, "global_step": 318715, "epoch": 1897} {"train_loss": -11.523565292358398, "global_step": 318716, "epoch": 1897} {"train_loss": -11.429312705993652, "global_step": 318717, "epoch": 1897} {"train_loss": -12.17902660369873, "global_step": 318718, "epoch": 1897} {"train_loss": -11.099991798400879, "global_step": 318719, "epoch": 1897} {"train_loss": -12.298046112060547, "global_step": 318720, "epoch": 1897} {"train_loss": -11.608642578125, "global_step": 318721, "epoch": 1897} {"train_loss": -12.156116485595703, "global_step": 318722, "epoch": 1897} {"train_loss": -11.774921417236328, "global_step": 318723, "epoch": 1897} {"train_loss": -11.993900299072266, "global_step": 318724, "epoch": 1897} {"train_loss": -11.727110862731934, "global_step": 318725, "epoch": 1897} {"train_loss": -12.021333694458008, "global_step": 318726, "epoch": 1897} {"train_loss": -11.330735206604004, "global_step": 318727, "epoch": 1897} {"train_loss": -12.211338996887207, "global_step": 318728, "epoch": 1897} {"train_loss": -11.578890800476074, "global_step": 318729, "epoch": 1897} {"train_loss": -11.575268745422363, "global_step": 318730, "epoch": 1897} {"train_loss": -11.802013397216797, "global_step": 318731, "epoch": 1897} {"train_loss": -11.733502388000488, "global_step": 318732, "epoch": 1897} {"train_loss": -11.549457550048828, "global_step": 318733, "epoch": 1897} {"train_loss": -12.20819091796875, "global_step": 318734, "epoch": 1897} {"train_loss": -11.84710693359375, "global_step": 318735, "epoch": 1897} {"train_loss": -11.744104385375977, "global_step": 318736, "epoch": 1897} {"train_loss": -12.062492370605469, "global_step": 318737, "epoch": 1897} {"train_loss": -11.100341796875, "global_step": 318738, "epoch": 1897} {"train_loss": -12.150289535522461, "global_step": 318739, "epoch": 1897} {"train_loss": -11.11560344696045, "global_step": 318740, "epoch": 1897} {"train_loss": -11.812606811523438, "global_step": 318741, "epoch": 1897} {"train_loss": -11.826032638549805, "global_step": 318742, "epoch": 1897} {"train_loss": -11.345958709716797, "global_step": 318743, "epoch": 1897} {"train_loss": -12.192325592041016, "global_step": 318744, "epoch": 1897} {"train_loss": -11.131063461303711, "global_step": 318745, "epoch": 1897} {"train_loss": -11.888760566711426, "global_step": 318746, "epoch": 1897} {"train_loss": -11.593477249145508, "global_step": 318747, "epoch": 1897} {"train_loss": -12.046483993530273, "global_step": 318748, "epoch": 1897} {"train_loss": -11.582856178283691, "global_step": 318749, "epoch": 1897} {"train_loss": -12.092283248901367, "global_step": 318750, "epoch": 1897} {"train_loss": -11.509563446044922, "global_step": 318751, "epoch": 1897} {"train_loss": -11.804969787597656, "global_step": 318752, "epoch": 1897} {"train_loss": -11.880416870117188, "global_step": 318753, "epoch": 1897} {"train_loss": -12.042128562927246, "global_step": 318754, "epoch": 1897} {"train_loss": -12.176055908203125, "global_step": 318755, "epoch": 1897} {"train_loss": -12.12055778503418, "global_step": 318756, "epoch": 1897} {"train_loss": -11.992839813232422, "global_step": 318757, "epoch": 1897} {"train_loss": -12.180562019348145, "global_step": 318758, "epoch": 1897} {"train_loss": -12.087888717651367, "global_step": 318759, "epoch": 1897} {"train_loss": -12.26637077331543, "global_step": 318760, "epoch": 1897} {"train_loss": -11.81120491027832, "global_step": 318761, "epoch": 1897} {"train_loss": -12.34465503692627, "global_step": 318762, "epoch": 1897} {"train_loss": -12.150952339172363, "global_step": 318763, "epoch": 1897} {"train_loss": -12.32301139831543, "global_step": 318764, "epoch": 1897} {"train_loss": -12.227176666259766, "global_step": 318765, "epoch": 1897} {"train_loss": -12.134536743164062, "global_step": 318766, "epoch": 1897} {"train_loss": -12.279285430908203, "global_step": 318767, "epoch": 1897} {"train_loss": -11.845653533935547, "global_step": 318768, "epoch": 1897} {"train_loss": -12.040234565734863, "global_step": 318769, "epoch": 1897} {"train_loss": -11.689350128173828, "global_step": 318770, "epoch": 1897} {"train_loss": -11.919631958007812, "global_step": 318771, "epoch": 1897} {"train_loss": -11.37434196472168, "global_step": 318772, "epoch": 1897} {"train_loss": -11.016368865966797, "global_step": 318773, "epoch": 1897} {"train_loss": -11.039671897888184, "global_step": 318774, "epoch": 1897} {"train_loss": -10.74907112121582, "global_step": 318775, "epoch": 1897} {"train_loss": -10.775821685791016, "global_step": 318776, "epoch": 1897} {"train_loss": -10.149767875671387, "global_step": 318777, "epoch": 1897} {"train_loss": -10.83739948272705, "global_step": 318778, "epoch": 1897} {"train_loss": -10.927960395812988, "global_step": 318779, "epoch": 1897} {"train_loss": -11.689538955688477, "global_step": 318780, "epoch": 1897} {"train_loss": -10.659395217895508, "global_step": 318781, "epoch": 1897} {"train_loss": -11.031940460205078, "global_step": 318782, "epoch": 1897} {"train_loss": -10.471471786499023, "global_step": 318783, "epoch": 1897} {"train_loss": -10.233649253845215, "global_step": 318784, "epoch": 1897} {"train_loss": -11.113542556762695, "global_step": 318785, "epoch": 1897} {"train_loss": -8.77993392944336, "global_step": 318786, "epoch": 1897} {"train_loss": -10.182859420776367, "global_step": 318787, "epoch": 1897} {"train_loss": -8.852256774902344, "global_step": 318788, "epoch": 1897} {"train_loss": -9.943729400634766, "global_step": 318789, "epoch": 1897} {"train_loss": -9.131683349609375, "global_step": 318790, "epoch": 1897} {"train_loss": -9.947952270507812, "global_step": 318791, "epoch": 1897} {"train_loss": -10.334877014160156, "global_step": 318792, "epoch": 1897} {"train_loss": -10.033226013183594, "global_step": 318793, "epoch": 1897} {"train_loss": -11.360395431518555, "global_step": 318794, "epoch": 1897} {"train_loss": -10.128572463989258, "global_step": 318795, "epoch": 1897} {"train_loss": -11.610528945922852, "global_step": 318796, "epoch": 1897} {"train_loss": -10.783452987670898, "global_step": 318797, "epoch": 1897} {"train_loss": -10.9020357131958, "global_step": 318798, "epoch": 1897} {"train_loss": -10.87989616394043, "global_step": 318799, "epoch": 1897} {"train_loss": -11.525053977966309, "global_step": 318800, "epoch": 1897} {"train_loss": -11.377010345458984, "global_step": 318801, "epoch": 1897} {"train_loss": -11.477846145629883, "global_step": 318802, "epoch": 1897} {"train_loss": -11.632649421691895, "global_step": 318803, "epoch": 1897} {"train_loss": -11.11998176574707, "global_step": 318804, "epoch": 1897} {"train_loss": -11.659625053405762, "global_step": 318805, "epoch": 1897} {"train_loss": -11.532350540161133, "global_step": 318806, "epoch": 1897} {"train_loss": -11.186917304992676, "global_step": 318807, "epoch": 1897} {"train_loss": -11.984185218811035, "global_step": 318808, "epoch": 1897} {"train_loss": -11.305418014526367, "global_step": 318809, "epoch": 1897} {"train_loss": -11.833989143371582, "global_step": 318810, "epoch": 1897} {"train_loss": -11.645600318908691, "global_step": 318811, "epoch": 1897} {"train_loss": -11.76431655883789, "global_step": 318812, "epoch": 1897} {"train_loss": -11.82729721069336, "global_step": 318813, "epoch": 1897} {"train_loss": -11.830190658569336, "global_step": 318814, "epoch": 1897} {"train_loss": -11.83680534362793, "global_step": 318815, "epoch": 1897} {"train_loss": -11.851491928100586, "global_step": 318816, "epoch": 1897} {"train_loss": -11.93468189239502, "global_step": 318817, "epoch": 1897} {"train_loss": -11.932748794555664, "global_step": 318818, "epoch": 1897} {"train_loss": -11.720982551574707, "global_step": 318819, "epoch": 1897} {"train_loss": -12.00964641571045, "global_step": 318820, "epoch": 1897} {"train_loss": -11.929932594299316, "global_step": 318821, "epoch": 1897} {"train_loss": -12.008359909057617, "global_step": 318822, "epoch": 1897} {"train_loss": -12.051162719726562, "global_step": 318823, "epoch": 1897} {"train_loss": -11.699553489685059, "global_step": 318824, "epoch": 1897} {"train_loss": -11.960796356201172, "global_step": 318825, "epoch": 1897} {"train_loss": -11.896341323852539, "global_step": 318826, "epoch": 1897} {"train_loss": -12.053661346435547, "global_step": 318827, "epoch": 1897} {"train_loss": -11.880428314208984, "global_step": 318828, "epoch": 1897} {"train_loss": -12.156834602355957, "global_step": 318829, "epoch": 1897} {"train_loss": -11.990129470825195, "global_step": 318830, "epoch": 1897} {"train_loss": -12.062183380126953, "global_step": 318831, "epoch": 1897} {"train_loss": -12.019184112548828, "global_step": 318832, "epoch": 1897} {"train_loss": -12.030496597290039, "global_step": 318833, "epoch": 1897} {"train_loss": -12.144050598144531, "global_step": 318834, "epoch": 1897} {"train_loss": -12.13206672668457, "global_step": 318835, "epoch": 1897} {"train_loss": -12.090144157409668, "global_step": 318836, "epoch": 1897} {"train_loss": -12.208395957946777, "global_step": 318837, "epoch": 1897} {"train_loss": -12.201654434204102, "global_step": 318838, "epoch": 1897} {"train_loss": -12.176204681396484, "global_step": 318839, "epoch": 1897} {"train_loss": -12.067401885986328, "global_step": 318840, "epoch": 1897} {"train_loss": -12.300655364990234, "global_step": 318841, "epoch": 1897} {"train_loss": -12.370786666870117, "global_step": 318842, "epoch": 1897} {"train_loss": -12.143823623657227, "global_step": 318843, "epoch": 1897} {"train_loss": -12.208157539367676, "global_step": 318844, "epoch": 1897} {"train_loss": -12.166598320007324, "global_step": 318845, "epoch": 1897} {"train_loss": -12.210307121276855, "global_step": 318846, "epoch": 1897} {"train_loss": -12.328133583068848, "global_step": 318847, "epoch": 1897} {"train_loss": -12.23209285736084, "global_step": 318848, "epoch": 1897} {"train_loss": -12.337010383605957, "global_step": 318849, "epoch": 1897} {"train_loss": -12.244608879089355, "global_step": 318850, "epoch": 1897} {"train_loss": -12.33281421661377, "global_step": 318851, "epoch": 1897} {"train_loss": -12.27900505065918, "global_step": 318852, "epoch": 1897} {"train_loss": -12.401252746582031, "global_step": 318853, "epoch": 1897} {"train_loss": -12.448989868164062, "global_step": 318854, "epoch": 1897} {"train_loss": -12.31968879699707, "global_step": 318855, "epoch": 1897} {"train_loss": -12.473158836364746, "global_step": 318856, "epoch": 1897} {"train_loss": -12.115516662597656, "global_step": 318857, "epoch": 1897} {"train_loss": -12.519787788391113, "global_step": 318858, "epoch": 1897} {"train_loss": -12.424304008483887, "global_step": 318859, "epoch": 1897} {"train_loss": -12.444971084594727, "global_step": 318860, "epoch": 1897} {"train_loss": -12.561644554138184, "global_step": 318861, "epoch": 1897} {"train_loss": -12.37099552154541, "global_step": 318862, "epoch": 1897} {"train_loss": -11.68977986063276, "global_step": 318863, "epoch": 1897, "val_loss": 284923.75} {"train_loss": -12.429941177368164, "global_step": 318864, "epoch": 1898} {"train_loss": -12.476480484008789, "global_step": 318865, "epoch": 1898} {"train_loss": -12.370538711547852, "global_step": 318866, "epoch": 1898} {"train_loss": -12.269535064697266, "global_step": 318867, "epoch": 1898} {"train_loss": -12.071691513061523, "global_step": 318868, "epoch": 1898} {"train_loss": -12.187498092651367, "global_step": 318869, "epoch": 1898} {"train_loss": -11.2780122756958, "global_step": 318870, "epoch": 1898} {"train_loss": -11.412915229797363, "global_step": 318871, "epoch": 1898} {"train_loss": -12.166093826293945, "global_step": 318872, "epoch": 1898} {"train_loss": -11.786615371704102, "global_step": 318873, "epoch": 1898} {"train_loss": -11.595373153686523, "global_step": 318874, "epoch": 1898} {"train_loss": -12.129919052124023, "global_step": 318875, "epoch": 1898} {"train_loss": -12.135285377502441, "global_step": 318876, "epoch": 1898} {"train_loss": -11.975985527038574, "global_step": 318877, "epoch": 1898} {"train_loss": -11.992286682128906, "global_step": 318878, "epoch": 1898} {"train_loss": -12.360601425170898, "global_step": 318879, "epoch": 1898} {"train_loss": -12.249521255493164, "global_step": 318880, "epoch": 1898} {"train_loss": -12.004440307617188, "global_step": 318881, "epoch": 1898} {"train_loss": -11.948225021362305, "global_step": 318882, "epoch": 1898} {"train_loss": -11.610713958740234, "global_step": 318883, "epoch": 1898} {"train_loss": -12.162276268005371, "global_step": 318884, "epoch": 1898} {"train_loss": -11.908849716186523, "global_step": 318885, "epoch": 1898} {"train_loss": -12.32003402709961, "global_step": 318886, "epoch": 1898} {"train_loss": -12.191264152526855, "global_step": 318887, "epoch": 1898} {"train_loss": -12.139586448669434, "global_step": 318888, "epoch": 1898} {"train_loss": -12.209070205688477, "global_step": 318889, "epoch": 1898} {"train_loss": -12.152811050415039, "global_step": 318890, "epoch": 1898} {"train_loss": -12.110527038574219, "global_step": 318891, "epoch": 1898} {"train_loss": -12.095355987548828, "global_step": 318892, "epoch": 1898} {"train_loss": -12.033867835998535, "global_step": 318893, "epoch": 1898} {"train_loss": -11.678703308105469, "global_step": 318894, "epoch": 1898} {"train_loss": -11.870611190795898, "global_step": 318895, "epoch": 1898} {"train_loss": -11.286735534667969, "global_step": 318896, "epoch": 1898} {"train_loss": -11.682193756103516, "global_step": 318897, "epoch": 1898} {"train_loss": -11.483089447021484, "global_step": 318898, "epoch": 1898} {"train_loss": -11.58047103881836, "global_step": 318899, "epoch": 1898} {"train_loss": -10.959528923034668, "global_step": 318900, "epoch": 1898} {"train_loss": -12.029817581176758, "global_step": 318901, "epoch": 1898} {"train_loss": -11.305561065673828, "global_step": 318902, "epoch": 1898} {"train_loss": -11.77531623840332, "global_step": 318903, "epoch": 1898} {"train_loss": -11.771955490112305, "global_step": 318904, "epoch": 1898} {"train_loss": -11.86390495300293, "global_step": 318905, "epoch": 1898} {"train_loss": -11.961557388305664, "global_step": 318906, "epoch": 1898} {"train_loss": -12.323588371276855, "global_step": 318907, "epoch": 1898} {"train_loss": -12.16305160522461, "global_step": 318908, "epoch": 1898} {"train_loss": -11.987871170043945, "global_step": 318909, "epoch": 1898} {"train_loss": -12.366935729980469, "global_step": 318910, "epoch": 1898} {"train_loss": -11.502113342285156, "global_step": 318911, "epoch": 1898} {"train_loss": -11.882617950439453, "global_step": 318912, "epoch": 1898} {"train_loss": -12.212135314941406, "global_step": 318913, "epoch": 1898} {"train_loss": -11.749590873718262, "global_step": 318914, "epoch": 1898} {"train_loss": -11.2933349609375, "global_step": 318915, "epoch": 1898} {"train_loss": -12.138471603393555, "global_step": 318916, "epoch": 1898} {"train_loss": -11.385087966918945, "global_step": 318917, "epoch": 1898} {"train_loss": -10.471484184265137, "global_step": 318918, "epoch": 1898} {"train_loss": -12.297430038452148, "global_step": 318919, "epoch": 1898} {"train_loss": -10.897350311279297, "global_step": 318920, "epoch": 1898} {"train_loss": -11.380374908447266, "global_step": 318921, "epoch": 1898} {"train_loss": -12.085884094238281, "global_step": 318922, "epoch": 1898} {"train_loss": -11.361679077148438, "global_step": 318923, "epoch": 1898} {"train_loss": -11.35882568359375, "global_step": 318924, "epoch": 1898} {"train_loss": -11.75688362121582, "global_step": 318925, "epoch": 1898} {"train_loss": -11.881962776184082, "global_step": 318926, "epoch": 1898} {"train_loss": -12.129256248474121, "global_step": 318927, "epoch": 1898} {"train_loss": -11.787056922912598, "global_step": 318928, "epoch": 1898} {"train_loss": -12.166990280151367, "global_step": 318929, "epoch": 1898} {"train_loss": -11.468934059143066, "global_step": 318930, "epoch": 1898} {"train_loss": -11.148101806640625, "global_step": 318931, "epoch": 1898} {"train_loss": -11.710000991821289, "global_step": 318932, "epoch": 1898} {"train_loss": -11.994735717773438, "global_step": 318933, "epoch": 1898} {"train_loss": -12.077903747558594, "global_step": 318934, "epoch": 1898} {"train_loss": -12.090097427368164, "global_step": 318935, "epoch": 1898} {"train_loss": -12.073698043823242, "global_step": 318936, "epoch": 1898} {"train_loss": -12.30282974243164, "global_step": 318937, "epoch": 1898} {"train_loss": -11.843544006347656, "global_step": 318938, "epoch": 1898} {"train_loss": -12.177184104919434, "global_step": 318939, "epoch": 1898} {"train_loss": -11.997123718261719, "global_step": 318940, "epoch": 1898} {"train_loss": -12.291802406311035, "global_step": 318941, "epoch": 1898} {"train_loss": -11.658873558044434, "global_step": 318942, "epoch": 1898} {"train_loss": -11.871076583862305, "global_step": 318943, "epoch": 1898} {"train_loss": -11.907280921936035, "global_step": 318944, "epoch": 1898} {"train_loss": -11.811210632324219, "global_step": 318945, "epoch": 1898} {"train_loss": -11.759407043457031, "global_step": 318946, "epoch": 1898} {"train_loss": -12.269723892211914, "global_step": 318947, "epoch": 1898} {"train_loss": -12.103277206420898, "global_step": 318948, "epoch": 1898} {"train_loss": -12.21810531616211, "global_step": 318949, "epoch": 1898} {"train_loss": -12.577423095703125, "global_step": 318950, "epoch": 1898} {"train_loss": -12.322077751159668, "global_step": 318951, "epoch": 1898} {"train_loss": -12.101863861083984, "global_step": 318952, "epoch": 1898} {"train_loss": -12.416790008544922, "global_step": 318953, "epoch": 1898} {"train_loss": -12.227359771728516, "global_step": 318954, "epoch": 1898} {"train_loss": -12.473470687866211, "global_step": 318955, "epoch": 1898} {"train_loss": -12.556793212890625, "global_step": 318956, "epoch": 1898} {"train_loss": -12.30411434173584, "global_step": 318957, "epoch": 1898} {"train_loss": -12.443696975708008, "global_step": 318958, "epoch": 1898} {"train_loss": -12.580526351928711, "global_step": 318959, "epoch": 1898} {"train_loss": -12.261163711547852, "global_step": 318960, "epoch": 1898} {"train_loss": -12.52340316772461, "global_step": 318961, "epoch": 1898} {"train_loss": -12.313780784606934, "global_step": 318962, "epoch": 1898} {"train_loss": -12.483349800109863, "global_step": 318963, "epoch": 1898} {"train_loss": -12.564384460449219, "global_step": 318964, "epoch": 1898} {"train_loss": -12.363882064819336, "global_step": 318965, "epoch": 1898} {"train_loss": -12.307909965515137, "global_step": 318966, "epoch": 1898} {"train_loss": -12.578533172607422, "global_step": 318967, "epoch": 1898} {"train_loss": -12.536928176879883, "global_step": 318968, "epoch": 1898} {"train_loss": -12.257558822631836, "global_step": 318969, "epoch": 1898} {"train_loss": -11.940698623657227, "global_step": 318970, "epoch": 1898} {"train_loss": -12.369074821472168, "global_step": 318971, "epoch": 1898} {"train_loss": -12.382266998291016, "global_step": 318972, "epoch": 1898} {"train_loss": -12.220857620239258, "global_step": 318973, "epoch": 1898} {"train_loss": -12.037790298461914, "global_step": 318974, "epoch": 1898} {"train_loss": -12.655585289001465, "global_step": 318975, "epoch": 1898} {"train_loss": -12.381032943725586, "global_step": 318976, "epoch": 1898} {"train_loss": -12.250359535217285, "global_step": 318977, "epoch": 1898} {"train_loss": -12.271211624145508, "global_step": 318978, "epoch": 1898} {"train_loss": -12.143577575683594, "global_step": 318979, "epoch": 1898} {"train_loss": -11.666444778442383, "global_step": 318980, "epoch": 1898} {"train_loss": -11.572433471679688, "global_step": 318981, "epoch": 1898} {"train_loss": -11.465450286865234, "global_step": 318982, "epoch": 1898} {"train_loss": -12.470415115356445, "global_step": 318983, "epoch": 1898} {"train_loss": -12.38026237487793, "global_step": 318984, "epoch": 1898} {"train_loss": -12.307153701782227, "global_step": 318985, "epoch": 1898} {"train_loss": -12.376059532165527, "global_step": 318986, "epoch": 1898} {"train_loss": -12.30003547668457, "global_step": 318987, "epoch": 1898} {"train_loss": -12.478199005126953, "global_step": 318988, "epoch": 1898} {"train_loss": -12.460771560668945, "global_step": 318989, "epoch": 1898} {"train_loss": -12.409309387207031, "global_step": 318990, "epoch": 1898} {"train_loss": -12.34508228302002, "global_step": 318991, "epoch": 1898} {"train_loss": -12.599597930908203, "global_step": 318992, "epoch": 1898} {"train_loss": -12.635982513427734, "global_step": 318993, "epoch": 1898} {"train_loss": -12.566976547241211, "global_step": 318994, "epoch": 1898} {"train_loss": -12.608362197875977, "global_step": 318995, "epoch": 1898} {"train_loss": -12.666173934936523, "global_step": 318996, "epoch": 1898} {"train_loss": -12.665066719055176, "global_step": 318997, "epoch": 1898} {"train_loss": -12.530145645141602, "global_step": 318998, "epoch": 1898} {"train_loss": -12.853767395019531, "global_step": 318999, "epoch": 1898} {"train_loss": -12.533982276916504, "global_step": 319000, "epoch": 1898} {"train_loss": -12.303043365478516, "global_step": 319001, "epoch": 1898} {"train_loss": -12.181121826171875, "global_step": 319002, "epoch": 1898} {"train_loss": -12.429720878601074, "global_step": 319003, "epoch": 1898} {"train_loss": -12.61248779296875, "global_step": 319004, "epoch": 1898} {"train_loss": -12.258554458618164, "global_step": 319005, "epoch": 1898} {"train_loss": -11.427521705627441, "global_step": 319006, "epoch": 1898} {"train_loss": -10.627686500549316, "global_step": 319007, "epoch": 1898} {"train_loss": -11.57437801361084, "global_step": 319008, "epoch": 1898} {"train_loss": -11.49846076965332, "global_step": 319009, "epoch": 1898} {"train_loss": -10.71192455291748, "global_step": 319010, "epoch": 1898} {"train_loss": -11.586868286132812, "global_step": 319011, "epoch": 1898} {"train_loss": -11.205537796020508, "global_step": 319012, "epoch": 1898} {"train_loss": -10.060379028320312, "global_step": 319013, "epoch": 1898} {"train_loss": -10.50395679473877, "global_step": 319014, "epoch": 1898} {"train_loss": -9.516523361206055, "global_step": 319015, "epoch": 1898} {"train_loss": -8.715560913085938, "global_step": 319016, "epoch": 1898} {"train_loss": -7.312845230102539, "global_step": 319017, "epoch": 1898} {"train_loss": -10.033708572387695, "global_step": 319018, "epoch": 1898} {"train_loss": -6.634075164794922, "global_step": 319019, "epoch": 1898} {"train_loss": -8.5911865234375, "global_step": 319020, "epoch": 1898} {"train_loss": -6.307705879211426, "global_step": 319021, "epoch": 1898} {"train_loss": -5.605816841125488, "global_step": 319022, "epoch": 1898} {"train_loss": -5.8260931968688965, "global_step": 319023, "epoch": 1898} {"train_loss": -5.692517280578613, "global_step": 319024, "epoch": 1898} {"train_loss": -6.464394569396973, "global_step": 319025, "epoch": 1898} {"train_loss": -6.990656852722168, "global_step": 319026, "epoch": 1898} {"train_loss": -6.633404731750488, "global_step": 319027, "epoch": 1898} {"train_loss": -6.187898635864258, "global_step": 319028, "epoch": 1898} {"train_loss": -6.8087005615234375, "global_step": 319029, "epoch": 1898} {"train_loss": -6.857557773590088, "global_step": 319030, "epoch": 1898} {"train_loss": -11.522516057604836, "global_step": 319031, "epoch": 1898, "val_loss": 283354.625} {"train_loss": -7.419940948486328, "global_step": 319032, "epoch": 1899} {"train_loss": -7.006819725036621, "global_step": 319033, "epoch": 1899} {"train_loss": -7.492960453033447, "global_step": 319034, "epoch": 1899} {"train_loss": -7.37858772277832, "global_step": 319035, "epoch": 1899} {"train_loss": -8.19761848449707, "global_step": 319036, "epoch": 1899} {"train_loss": -8.29802131652832, "global_step": 319037, "epoch": 1899} {"train_loss": -8.283967971801758, "global_step": 319038, "epoch": 1899} {"train_loss": -8.946521759033203, "global_step": 319039, "epoch": 1899} {"train_loss": -8.224454879760742, "global_step": 319040, "epoch": 1899} {"train_loss": -8.02227783203125, "global_step": 319041, "epoch": 1899} {"train_loss": -8.401025772094727, "global_step": 319042, "epoch": 1899} {"train_loss": -9.56574821472168, "global_step": 319043, "epoch": 1899} {"train_loss": -8.708974838256836, "global_step": 319044, "epoch": 1899} {"train_loss": -8.450675010681152, "global_step": 319045, "epoch": 1899} {"train_loss": -9.066370010375977, "global_step": 319046, "epoch": 1899} {"train_loss": -9.415451049804688, "global_step": 319047, "epoch": 1899} {"train_loss": -9.29012680053711, "global_step": 319048, "epoch": 1899} {"train_loss": -9.367609024047852, "global_step": 319049, "epoch": 1899} {"train_loss": -10.227829933166504, "global_step": 319050, "epoch": 1899} {"train_loss": -10.320853233337402, "global_step": 319051, "epoch": 1899} {"train_loss": -9.841852188110352, "global_step": 319052, "epoch": 1899} {"train_loss": -10.406509399414062, "global_step": 319053, "epoch": 1899} {"train_loss": -10.612586975097656, "global_step": 319054, "epoch": 1899} {"train_loss": -10.057016372680664, "global_step": 319055, "epoch": 1899} {"train_loss": -10.538516998291016, "global_step": 319056, "epoch": 1899} {"train_loss": -11.022242546081543, "global_step": 319057, "epoch": 1899} {"train_loss": -10.585065841674805, "global_step": 319058, "epoch": 1899} {"train_loss": -10.503193855285645, "global_step": 319059, "epoch": 1899} {"train_loss": -11.440176010131836, "global_step": 319060, "epoch": 1899} {"train_loss": -10.57716178894043, "global_step": 319061, "epoch": 1899} {"train_loss": -10.518415451049805, "global_step": 319062, "epoch": 1899} {"train_loss": -11.236421585083008, "global_step": 319063, "epoch": 1899} {"train_loss": -11.431272506713867, "global_step": 319064, "epoch": 1899} {"train_loss": -11.114452362060547, "global_step": 319065, "epoch": 1899} {"train_loss": -11.57833480834961, "global_step": 319066, "epoch": 1899} {"train_loss": -11.693361282348633, "global_step": 319067, "epoch": 1899} {"train_loss": -11.474958419799805, "global_step": 319068, "epoch": 1899} {"train_loss": -11.75480842590332, "global_step": 319069, "epoch": 1899} {"train_loss": -11.66693115234375, "global_step": 319070, "epoch": 1899} {"train_loss": -11.674583435058594, "global_step": 319071, "epoch": 1899} {"train_loss": -11.745925903320312, "global_step": 319072, "epoch": 1899} {"train_loss": -11.717425346374512, "global_step": 319073, "epoch": 1899} {"train_loss": -11.811258316040039, "global_step": 319074, "epoch": 1899} {"train_loss": -11.803913116455078, "global_step": 319075, "epoch": 1899} {"train_loss": -11.729987144470215, "global_step": 319076, "epoch": 1899} {"train_loss": -11.474163055419922, "global_step": 319077, "epoch": 1899} {"train_loss": -11.649435043334961, "global_step": 319078, "epoch": 1899} {"train_loss": -11.45305061340332, "global_step": 319079, "epoch": 1899} {"train_loss": -11.749604225158691, "global_step": 319080, "epoch": 1899} {"train_loss": -11.834107398986816, "global_step": 319081, "epoch": 1899} {"train_loss": -11.461034774780273, "global_step": 319082, "epoch": 1899} {"train_loss": -12.01982307434082, "global_step": 319083, "epoch": 1899} {"train_loss": -11.585247039794922, "global_step": 319084, "epoch": 1899} {"train_loss": -11.966026306152344, "global_step": 319085, "epoch": 1899} {"train_loss": -11.813350677490234, "global_step": 319086, "epoch": 1899} {"train_loss": -11.825775146484375, "global_step": 319087, "epoch": 1899} {"train_loss": -12.068083763122559, "global_step": 319088, "epoch": 1899} {"train_loss": -11.946890830993652, "global_step": 319089, "epoch": 1899} {"train_loss": -12.081043243408203, "global_step": 319090, "epoch": 1899} {"train_loss": -11.789861679077148, "global_step": 319091, "epoch": 1899} {"train_loss": -11.91898250579834, "global_step": 319092, "epoch": 1899} {"train_loss": -12.092850685119629, "global_step": 319093, "epoch": 1899} {"train_loss": -11.748167037963867, "global_step": 319094, "epoch": 1899} {"train_loss": -11.98931884765625, "global_step": 319095, "epoch": 1899} {"train_loss": -12.068693161010742, "global_step": 319096, "epoch": 1899} {"train_loss": -12.020180702209473, "global_step": 319097, "epoch": 1899} {"train_loss": -11.927746772766113, "global_step": 319098, "epoch": 1899} {"train_loss": -11.89448070526123, "global_step": 319099, "epoch": 1899} {"train_loss": -11.996415138244629, "global_step": 319100, "epoch": 1899} {"train_loss": -11.862826347351074, "global_step": 319101, "epoch": 1899} {"train_loss": -12.225822448730469, "global_step": 319102, "epoch": 1899} {"train_loss": -11.598138809204102, "global_step": 319103, "epoch": 1899} {"train_loss": -12.19940185546875, "global_step": 319104, "epoch": 1899} {"train_loss": -11.910408020019531, "global_step": 319105, "epoch": 1899} {"train_loss": -11.880638122558594, "global_step": 319106, "epoch": 1899} {"train_loss": -12.031290054321289, "global_step": 319107, "epoch": 1899} {"train_loss": -11.956531524658203, "global_step": 319108, "epoch": 1899} {"train_loss": -11.784438133239746, "global_step": 319109, "epoch": 1899} {"train_loss": -12.130758285522461, "global_step": 319110, "epoch": 1899} {"train_loss": -12.201333045959473, "global_step": 319111, "epoch": 1899} {"train_loss": -11.88107681274414, "global_step": 319112, "epoch": 1899} {"train_loss": -12.306861877441406, "global_step": 319113, "epoch": 1899} {"train_loss": -11.826722145080566, "global_step": 319114, "epoch": 1899} {"train_loss": -12.174938201904297, "global_step": 319115, "epoch": 1899} {"train_loss": -11.643355369567871, "global_step": 319116, "epoch": 1899} {"train_loss": -12.270624160766602, "global_step": 319117, "epoch": 1899} {"train_loss": -11.78488540649414, "global_step": 319118, "epoch": 1899} {"train_loss": -12.142587661743164, "global_step": 319119, "epoch": 1899} {"train_loss": -12.027334213256836, "global_step": 319120, "epoch": 1899} {"train_loss": -12.259730339050293, "global_step": 319121, "epoch": 1899} {"train_loss": -11.758478164672852, "global_step": 319122, "epoch": 1899} {"train_loss": -12.040547370910645, "global_step": 319123, "epoch": 1899} {"train_loss": -12.165262222290039, "global_step": 319124, "epoch": 1899} {"train_loss": -11.768777847290039, "global_step": 319125, "epoch": 1899} {"train_loss": -12.158590316772461, "global_step": 319126, "epoch": 1899} {"train_loss": -12.183370590209961, "global_step": 319127, "epoch": 1899} {"train_loss": -11.915384292602539, "global_step": 319128, "epoch": 1899} {"train_loss": -12.13404655456543, "global_step": 319129, "epoch": 1899} {"train_loss": -12.28687858581543, "global_step": 319130, "epoch": 1899} {"train_loss": -12.033576011657715, "global_step": 319131, "epoch": 1899} {"train_loss": -12.169434547424316, "global_step": 319132, "epoch": 1899} {"train_loss": -12.178075790405273, "global_step": 319133, "epoch": 1899} {"train_loss": -12.2748441696167, "global_step": 319134, "epoch": 1899} {"train_loss": -12.286937713623047, "global_step": 319135, "epoch": 1899} {"train_loss": -12.083065032958984, "global_step": 319136, "epoch": 1899} {"train_loss": -12.30685043334961, "global_step": 319137, "epoch": 1899} {"train_loss": -12.15517520904541, "global_step": 319138, "epoch": 1899} {"train_loss": -12.129858016967773, "global_step": 319139, "epoch": 1899} {"train_loss": -12.085254669189453, "global_step": 319140, "epoch": 1899} {"train_loss": -11.721109390258789, "global_step": 319141, "epoch": 1899} {"train_loss": -11.922455787658691, "global_step": 319142, "epoch": 1899} {"train_loss": -12.041412353515625, "global_step": 319143, "epoch": 1899} {"train_loss": -11.64030933380127, "global_step": 319144, "epoch": 1899} {"train_loss": -12.250301361083984, "global_step": 319145, "epoch": 1899} {"train_loss": -12.029120445251465, "global_step": 319146, "epoch": 1899} {"train_loss": -11.738903045654297, "global_step": 319147, "epoch": 1899} {"train_loss": -12.00319766998291, "global_step": 319148, "epoch": 1899} {"train_loss": -11.982622146606445, "global_step": 319149, "epoch": 1899} {"train_loss": -12.222784042358398, "global_step": 319150, "epoch": 1899} {"train_loss": -12.189558029174805, "global_step": 319151, "epoch": 1899} {"train_loss": -11.592097282409668, "global_step": 319152, "epoch": 1899} {"train_loss": -12.037872314453125, "global_step": 319153, "epoch": 1899} {"train_loss": -12.276420593261719, "global_step": 319154, "epoch": 1899} {"train_loss": -11.89989948272705, "global_step": 319155, "epoch": 1899} {"train_loss": -11.863452911376953, "global_step": 319156, "epoch": 1899} {"train_loss": -12.267487525939941, "global_step": 319157, "epoch": 1899} {"train_loss": -12.160717010498047, "global_step": 319158, "epoch": 1899} {"train_loss": -11.955629348754883, "global_step": 319159, "epoch": 1899} {"train_loss": -12.137425422668457, "global_step": 319160, "epoch": 1899} {"train_loss": -12.392946243286133, "global_step": 319161, "epoch": 1899} {"train_loss": -12.481698989868164, "global_step": 319162, "epoch": 1899} {"train_loss": -12.384430885314941, "global_step": 319163, "epoch": 1899} {"train_loss": -12.363344192504883, "global_step": 319164, "epoch": 1899} {"train_loss": -12.080615997314453, "global_step": 319165, "epoch": 1899} {"train_loss": -12.325827598571777, "global_step": 319166, "epoch": 1899} {"train_loss": -12.257096290588379, "global_step": 319167, "epoch": 1899} {"train_loss": -11.916943550109863, "global_step": 319168, "epoch": 1899} {"train_loss": -12.030088424682617, "global_step": 319169, "epoch": 1899} {"train_loss": -12.09283447265625, "global_step": 319170, "epoch": 1899} {"train_loss": -11.342256546020508, "global_step": 319171, "epoch": 1899} {"train_loss": -10.985536575317383, "global_step": 319172, "epoch": 1899} {"train_loss": -11.227903366088867, "global_step": 319173, "epoch": 1899} {"train_loss": -10.849369049072266, "global_step": 319174, "epoch": 1899} {"train_loss": -9.12339973449707, "global_step": 319175, "epoch": 1899} {"train_loss": -10.95279312133789, "global_step": 319176, "epoch": 1899} {"train_loss": -9.30102252960205, "global_step": 319177, "epoch": 1899} {"train_loss": -7.667784690856934, "global_step": 319178, "epoch": 1899} {"train_loss": -7.481445789337158, "global_step": 319179, "epoch": 1899} {"train_loss": -7.555880546569824, "global_step": 319180, "epoch": 1899} {"train_loss": -8.303600311279297, "global_step": 319181, "epoch": 1899} {"train_loss": -8.093929290771484, "global_step": 319182, "epoch": 1899} {"train_loss": -8.840459823608398, "global_step": 319183, "epoch": 1899} {"train_loss": -9.059505462646484, "global_step": 319184, "epoch": 1899} {"train_loss": -9.50202751159668, "global_step": 319185, "epoch": 1899} {"train_loss": -9.702754974365234, "global_step": 319186, "epoch": 1899} {"train_loss": -8.711074829101562, "global_step": 319187, "epoch": 1899} {"train_loss": -9.98208236694336, "global_step": 319188, "epoch": 1899} {"train_loss": -10.571849822998047, "global_step": 319189, "epoch": 1899} {"train_loss": -10.25117015838623, "global_step": 319190, "epoch": 1899} {"train_loss": -11.261260986328125, "global_step": 319191, "epoch": 1899} {"train_loss": -10.062021255493164, "global_step": 319192, "epoch": 1899} {"train_loss": -9.899665832519531, "global_step": 319193, "epoch": 1899} {"train_loss": -8.610267639160156, "global_step": 319194, "epoch": 1899} {"train_loss": -10.295284271240234, "global_step": 319195, "epoch": 1899} {"train_loss": -9.113054275512695, "global_step": 319196, "epoch": 1899} {"train_loss": -8.687206268310547, "global_step": 319197, "epoch": 1899} {"train_loss": -10.754297256469727, "global_step": 319198, "epoch": 1899} {"train_loss": -11.048272376968747, "global_step": 319199, "epoch": 1899, "val_loss": 282832.75} {"train_loss": -7.228104591369629, "global_step": 319200, "epoch": 1900} {"train_loss": -8.786291122436523, "global_step": 319201, "epoch": 1900} {"train_loss": -8.374139785766602, "global_step": 319202, "epoch": 1900} {"train_loss": -8.887938499450684, "global_step": 319203, "epoch": 1900} {"train_loss": -9.774471282958984, "global_step": 319204, "epoch": 1900} {"train_loss": -8.141626358032227, "global_step": 319205, "epoch": 1900} {"train_loss": -8.635177612304688, "global_step": 319206, "epoch": 1900} {"train_loss": -9.490324020385742, "global_step": 319207, "epoch": 1900} {"train_loss": -10.11979866027832, "global_step": 319208, "epoch": 1900} {"train_loss": -9.397777557373047, "global_step": 319209, "epoch": 1900} {"train_loss": -9.132230758666992, "global_step": 319210, "epoch": 1900} {"train_loss": -9.88552188873291, "global_step": 319211, "epoch": 1900} {"train_loss": -10.017195701599121, "global_step": 319212, "epoch": 1900} {"train_loss": -10.86001205444336, "global_step": 319213, "epoch": 1900} {"train_loss": -9.105634689331055, "global_step": 319214, "epoch": 1900} {"train_loss": -9.68805980682373, "global_step": 319215, "epoch": 1900} {"train_loss": -10.292567253112793, "global_step": 319216, "epoch": 1900} {"train_loss": -10.93061637878418, "global_step": 319217, "epoch": 1900} {"train_loss": -10.90632438659668, "global_step": 319218, "epoch": 1900} {"train_loss": -10.583405494689941, "global_step": 319219, "epoch": 1900} {"train_loss": -11.144584655761719, "global_step": 319220, "epoch": 1900} {"train_loss": -11.273012161254883, "global_step": 319221, "epoch": 1900} {"train_loss": -10.982736587524414, "global_step": 319222, "epoch": 1900} {"train_loss": -11.606142044067383, "global_step": 319223, "epoch": 1900} {"train_loss": -11.538114547729492, "global_step": 319224, "epoch": 1900} {"train_loss": -10.96066665649414, "global_step": 319225, "epoch": 1900} {"train_loss": -11.252443313598633, "global_step": 319226, "epoch": 1900} {"train_loss": -11.350560188293457, "global_step": 319227, "epoch": 1900} {"train_loss": -11.112060546875, "global_step": 319228, "epoch": 1900} {"train_loss": -11.60185432434082, "global_step": 319229, "epoch": 1900} {"train_loss": -11.24726390838623, "global_step": 319230, "epoch": 1900} {"train_loss": -11.436382293701172, "global_step": 319231, "epoch": 1900} {"train_loss": -11.445404052734375, "global_step": 319232, "epoch": 1900} {"train_loss": -11.443382263183594, "global_step": 319233, "epoch": 1900} {"train_loss": -10.964790344238281, "global_step": 319234, "epoch": 1900} {"train_loss": -11.42561149597168, "global_step": 319235, "epoch": 1900} {"train_loss": -11.430862426757812, "global_step": 319236, "epoch": 1900} {"train_loss": -11.248485565185547, "global_step": 319237, "epoch": 1900} {"train_loss": -11.678959846496582, "global_step": 319238, "epoch": 1900} {"train_loss": -11.498298645019531, "global_step": 319239, "epoch": 1900} {"train_loss": -11.263158798217773, "global_step": 319240, "epoch": 1900} {"train_loss": -11.594158172607422, "global_step": 319241, "epoch": 1900} {"train_loss": -11.648896217346191, "global_step": 319242, "epoch": 1900} {"train_loss": -11.662097930908203, "global_step": 319243, "epoch": 1900} {"train_loss": -11.789697647094727, "global_step": 319244, "epoch": 1900} {"train_loss": -11.893165588378906, "global_step": 319245, "epoch": 1900} {"train_loss": -11.763256072998047, "global_step": 319246, "epoch": 1900} {"train_loss": -11.788697242736816, "global_step": 319247, "epoch": 1900} {"train_loss": -11.923148155212402, "global_step": 319248, "epoch": 1900} {"train_loss": -11.822254180908203, "global_step": 319249, "epoch": 1900} {"train_loss": -12.065411567687988, "global_step": 319250, "epoch": 1900} {"train_loss": -11.955653190612793, "global_step": 319251, "epoch": 1900} {"train_loss": -11.933738708496094, "global_step": 319252, "epoch": 1900} {"train_loss": -12.033769607543945, "global_step": 319253, "epoch": 1900} {"train_loss": -12.025238037109375, "global_step": 319254, "epoch": 1900} {"train_loss": -12.004341125488281, "global_step": 319255, "epoch": 1900} {"train_loss": -12.071002960205078, "global_step": 319256, "epoch": 1900} {"train_loss": -12.145665168762207, "global_step": 319257, "epoch": 1900} {"train_loss": -12.083459854125977, "global_step": 319258, "epoch": 1900} {"train_loss": -11.962719917297363, "global_step": 319259, "epoch": 1900} {"train_loss": -12.256644248962402, "global_step": 319260, "epoch": 1900} {"train_loss": -12.243928909301758, "global_step": 319261, "epoch": 1900} {"train_loss": -12.251227378845215, "global_step": 319262, "epoch": 1900} {"train_loss": -12.235455513000488, "global_step": 319263, "epoch": 1900} {"train_loss": -12.102989196777344, "global_step": 319264, "epoch": 1900} {"train_loss": -12.204517364501953, "global_step": 319265, "epoch": 1900} {"train_loss": -12.081932067871094, "global_step": 319266, "epoch": 1900} {"train_loss": -12.182888984680176, "global_step": 319267, "epoch": 1900} {"train_loss": -12.257582664489746, "global_step": 319268, "epoch": 1900} {"train_loss": -12.252629280090332, "global_step": 319269, "epoch": 1900} {"train_loss": -12.246840476989746, "global_step": 319270, "epoch": 1900} {"train_loss": -12.118427276611328, "global_step": 319271, "epoch": 1900} {"train_loss": -12.241632461547852, "global_step": 319272, "epoch": 1900} {"train_loss": -12.3206787109375, "global_step": 319273, "epoch": 1900} {"train_loss": -12.418838500976562, "global_step": 319274, "epoch": 1900} {"train_loss": -12.253791809082031, "global_step": 319275, "epoch": 1900} {"train_loss": -12.269876480102539, "global_step": 319276, "epoch": 1900} {"train_loss": -12.222055435180664, "global_step": 319277, "epoch": 1900} {"train_loss": -12.286011695861816, "global_step": 319278, "epoch": 1900} {"train_loss": -12.304900169372559, "global_step": 319279, "epoch": 1900} {"train_loss": -12.331441879272461, "global_step": 319280, "epoch": 1900} {"train_loss": -12.316341400146484, "global_step": 319281, "epoch": 1900} {"train_loss": -12.402109146118164, "global_step": 319282, "epoch": 1900} {"train_loss": -12.370052337646484, "global_step": 319283, "epoch": 1900} {"train_loss": -12.322399139404297, "global_step": 319284, "epoch": 1900} {"train_loss": -12.20988655090332, "global_step": 319285, "epoch": 1900} {"train_loss": -12.307783126831055, "global_step": 319286, "epoch": 1900} {"train_loss": -12.482681274414062, "global_step": 319287, "epoch": 1900} {"train_loss": -12.427783966064453, "global_step": 319288, "epoch": 1900} {"train_loss": -12.28516960144043, "global_step": 319289, "epoch": 1900} {"train_loss": -12.395584106445312, "global_step": 319290, "epoch": 1900} {"train_loss": -12.40112590789795, "global_step": 319291, "epoch": 1900} {"train_loss": -12.627979278564453, "global_step": 319292, "epoch": 1900} {"train_loss": -12.315256118774414, "global_step": 319293, "epoch": 1900} {"train_loss": -12.274345397949219, "global_step": 319294, "epoch": 1900} {"train_loss": -12.161623001098633, "global_step": 319295, "epoch": 1900} {"train_loss": -12.072473526000977, "global_step": 319296, "epoch": 1900} {"train_loss": -12.229467391967773, "global_step": 319297, "epoch": 1900} {"train_loss": -12.401049613952637, "global_step": 319298, "epoch": 1900} {"train_loss": -12.1235933303833, "global_step": 319299, "epoch": 1900} {"train_loss": -12.615798950195312, "global_step": 319300, "epoch": 1900} {"train_loss": -11.999302864074707, "global_step": 319301, "epoch": 1900} {"train_loss": -12.281181335449219, "global_step": 319302, "epoch": 1900} {"train_loss": -12.137794494628906, "global_step": 319303, "epoch": 1900} {"train_loss": -12.20977783203125, "global_step": 319304, "epoch": 1900} {"train_loss": -12.134092330932617, "global_step": 319305, "epoch": 1900} {"train_loss": -12.557785034179688, "global_step": 319306, "epoch": 1900} {"train_loss": -12.435123443603516, "global_step": 319307, "epoch": 1900} {"train_loss": -12.284214973449707, "global_step": 319308, "epoch": 1900} {"train_loss": -12.389274597167969, "global_step": 319309, "epoch": 1900} {"train_loss": -12.171101570129395, "global_step": 319310, "epoch": 1900} {"train_loss": -12.093820571899414, "global_step": 319311, "epoch": 1900} {"train_loss": -12.19328784942627, "global_step": 319312, "epoch": 1900} {"train_loss": -12.117218017578125, "global_step": 319313, "epoch": 1900} {"train_loss": -11.473038673400879, "global_step": 319314, "epoch": 1900} {"train_loss": -11.946538925170898, "global_step": 319315, "epoch": 1900} {"train_loss": -12.365035057067871, "global_step": 319316, "epoch": 1900} {"train_loss": -12.233624458312988, "global_step": 319317, "epoch": 1900} {"train_loss": -11.994534492492676, "global_step": 319318, "epoch": 1900} {"train_loss": -12.410690307617188, "global_step": 319319, "epoch": 1900} {"train_loss": -11.988715171813965, "global_step": 319320, "epoch": 1900} {"train_loss": -11.936976432800293, "global_step": 319321, "epoch": 1900} {"train_loss": -12.388080596923828, "global_step": 319322, "epoch": 1900} {"train_loss": -11.56419563293457, "global_step": 319323, "epoch": 1900} {"train_loss": -11.31568431854248, "global_step": 319324, "epoch": 1900} {"train_loss": -10.892362594604492, "global_step": 319325, "epoch": 1900} {"train_loss": -11.872715950012207, "global_step": 319326, "epoch": 1900} {"train_loss": -12.115793228149414, "global_step": 319327, "epoch": 1900} {"train_loss": -11.931622505187988, "global_step": 319328, "epoch": 1900} {"train_loss": -11.898089408874512, "global_step": 319329, "epoch": 1900} {"train_loss": -12.221975326538086, "global_step": 319330, "epoch": 1900} {"train_loss": -12.21937370300293, "global_step": 319331, "epoch": 1900} {"train_loss": -12.170318603515625, "global_step": 319332, "epoch": 1900} {"train_loss": -11.884243965148926, "global_step": 319333, "epoch": 1900} {"train_loss": -11.780963897705078, "global_step": 319334, "epoch": 1900} {"train_loss": -12.177383422851562, "global_step": 319335, "epoch": 1900} {"train_loss": -11.560425758361816, "global_step": 319336, "epoch": 1900} {"train_loss": -10.625480651855469, "global_step": 319337, "epoch": 1900} {"train_loss": -11.629878997802734, "global_step": 319338, "epoch": 1900} {"train_loss": -11.111709594726562, "global_step": 319339, "epoch": 1900} {"train_loss": -12.247779846191406, "global_step": 319340, "epoch": 1900} {"train_loss": -11.365144729614258, "global_step": 319341, "epoch": 1900} {"train_loss": -11.293787002563477, "global_step": 319342, "epoch": 1900} {"train_loss": -11.576423645019531, "global_step": 319343, "epoch": 1900} {"train_loss": -11.658974647521973, "global_step": 319344, "epoch": 1900} {"train_loss": -10.641134262084961, "global_step": 319345, "epoch": 1900} {"train_loss": -10.815545082092285, "global_step": 319346, "epoch": 1900} {"train_loss": -10.800432205200195, "global_step": 319347, "epoch": 1900} {"train_loss": -11.044672966003418, "global_step": 319348, "epoch": 1900} {"train_loss": -10.365975379943848, "global_step": 319349, "epoch": 1900} {"train_loss": -11.355127334594727, "global_step": 319350, "epoch": 1900} {"train_loss": -11.57614517211914, "global_step": 319351, "epoch": 1900} {"train_loss": -11.739044189453125, "global_step": 319352, "epoch": 1900} {"train_loss": -11.556549072265625, "global_step": 319353, "epoch": 1900} {"train_loss": -11.782644271850586, "global_step": 319354, "epoch": 1900} {"train_loss": -11.41016960144043, "global_step": 319355, "epoch": 1900} {"train_loss": -11.537847518920898, "global_step": 319356, "epoch": 1900} {"train_loss": -11.220598220825195, "global_step": 319357, "epoch": 1900} {"train_loss": -12.01445198059082, "global_step": 319358, "epoch": 1900} {"train_loss": -11.59925651550293, "global_step": 319359, "epoch": 1900} {"train_loss": -12.072047233581543, "global_step": 319360, "epoch": 1900} {"train_loss": -11.544058799743652, "global_step": 319361, "epoch": 1900} {"train_loss": -11.997411727905273, "global_step": 319362, "epoch": 1900} {"train_loss": -11.685888290405273, "global_step": 319363, "epoch": 1900} {"train_loss": -12.114614486694336, "global_step": 319364, "epoch": 1900} {"train_loss": -11.611412048339844, "global_step": 319365, "epoch": 1900} {"train_loss": -11.625362396240234, "global_step": 319366, "epoch": 1900} {"train_loss": -11.589666054362343, "global_step": 319367, "epoch": 1900, "train/sim_max_reward_0": 0.6065813361042237, "train/sim_max_reward_1": 0.9070078451177844, "train/sim_max_reward_2": 0.021865501306097337, "train/sim_max_reward_3": 0.4679106597202788, "train/sim_max_reward_4": 0.9847587263632083, "train/sim_max_reward_5": 0.1931792625906985, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.39624491509556875, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.4924928280134281, "test/sim_max_reward_4400004": 0.5259305367653898, "test/sim_max_reward_4400005": 0.9620343285239227, "test/sim_max_reward_4400006": 0.3379542261319795, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 0.5773586650054333, "test/sim_max_reward_4400009": 0.03231879776770341, "test/sim_max_reward_4400010": 0.6918307111780185, "test/sim_max_reward_4400011": 0.9796269800386951, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 0.184585472671095, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.9774273680775991, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.9588549708262283, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6086344182390482, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.16754609235015097, "test/sim_max_reward_4400028": 0.9886694022405019, "test/sim_max_reward_4400029": 0.41603827434770685, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.70712337184939, "test/sim_max_reward_4400033": 0.9999497476247049, "test/sim_max_reward_4400034": 0.9963272703092926, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.3663920647729463, "test/sim_max_reward_4400037": 0.9999917113807667, "test/sim_max_reward_4400038": 0.3305086597687459, "test/sim_max_reward_4400039": 0.41307188651708066, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.4091135797856821, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.3547773606067312, "test/sim_max_reward_4400044": 0.9912005119943272, "test/sim_max_reward_4400045": 0.056241493877991405, "test/sim_max_reward_4400046": 0.9984069159457948, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.5302172218670486, "test/mean_score": 0.5860699043701184, "val_loss": 285110.625, "train_action_mse_error": 0.41180288791656494} {"train_loss": -10.862327575683594, "global_step": 319368, "epoch": 1901} {"train_loss": -11.816828727722168, "global_step": 319369, "epoch": 1901} {"train_loss": -11.137981414794922, "global_step": 319370, "epoch": 1901} {"train_loss": -10.99524974822998, "global_step": 319371, "epoch": 1901} {"train_loss": -10.752728462219238, "global_step": 319372, "epoch": 1901} {"train_loss": -10.575085639953613, "global_step": 319373, "epoch": 1901} {"train_loss": -10.821187973022461, "global_step": 319374, "epoch": 1901} {"train_loss": -10.489768981933594, "global_step": 319375, "epoch": 1901} {"train_loss": -9.654754638671875, "global_step": 319376, "epoch": 1901} {"train_loss": -9.723233222961426, "global_step": 319377, "epoch": 1901} {"train_loss": -10.808176040649414, "global_step": 319378, "epoch": 1901} {"train_loss": -11.141937255859375, "global_step": 319379, "epoch": 1901} {"train_loss": -11.06900691986084, "global_step": 319380, "epoch": 1901} {"train_loss": -10.772351264953613, "global_step": 319381, "epoch": 1901} {"train_loss": -11.89127254486084, "global_step": 319382, "epoch": 1901} {"train_loss": -11.122453689575195, "global_step": 319383, "epoch": 1901} {"train_loss": -11.402530670166016, "global_step": 319384, "epoch": 1901} {"train_loss": -11.285672187805176, "global_step": 319385, "epoch": 1901} {"train_loss": -11.359954833984375, "global_step": 319386, "epoch": 1901} {"train_loss": -11.613556861877441, "global_step": 319387, "epoch": 1901} {"train_loss": -11.253899574279785, "global_step": 319388, "epoch": 1901} {"train_loss": -11.655821800231934, "global_step": 319389, "epoch": 1901} {"train_loss": -11.416836738586426, "global_step": 319390, "epoch": 1901} {"train_loss": -11.779241561889648, "global_step": 319391, "epoch": 1901} {"train_loss": -11.68991470336914, "global_step": 319392, "epoch": 1901} {"train_loss": -11.657878875732422, "global_step": 319393, "epoch": 1901} {"train_loss": -11.454084396362305, "global_step": 319394, "epoch": 1901} {"train_loss": -11.693427085876465, "global_step": 319395, "epoch": 1901} {"train_loss": -11.717217445373535, "global_step": 319396, "epoch": 1901} {"train_loss": -11.849018096923828, "global_step": 319397, "epoch": 1901} {"train_loss": -11.125121116638184, "global_step": 319398, "epoch": 1901} {"train_loss": -11.858295440673828, "global_step": 319399, "epoch": 1901} {"train_loss": -11.6934232711792, "global_step": 319400, "epoch": 1901} {"train_loss": -12.130285263061523, "global_step": 319401, "epoch": 1901} {"train_loss": -11.776103973388672, "global_step": 319402, "epoch": 1901} {"train_loss": -12.10811710357666, "global_step": 319403, "epoch": 1901} {"train_loss": -11.91889476776123, "global_step": 319404, "epoch": 1901} {"train_loss": -12.34788703918457, "global_step": 319405, "epoch": 1901} {"train_loss": -11.856010437011719, "global_step": 319406, "epoch": 1901} {"train_loss": -12.161970138549805, "global_step": 319407, "epoch": 1901} {"train_loss": -12.23780632019043, "global_step": 319408, "epoch": 1901} {"train_loss": -12.21845817565918, "global_step": 319409, "epoch": 1901} {"train_loss": -12.137240409851074, "global_step": 319410, "epoch": 1901} {"train_loss": -12.037675857543945, "global_step": 319411, "epoch": 1901} {"train_loss": -12.073690414428711, "global_step": 319412, "epoch": 1901} {"train_loss": -12.288298606872559, "global_step": 319413, "epoch": 1901} {"train_loss": -11.993375778198242, "global_step": 319414, "epoch": 1901} {"train_loss": -12.373841285705566, "global_step": 319415, "epoch": 1901} {"train_loss": -12.077710151672363, "global_step": 319416, "epoch": 1901} {"train_loss": -12.26827621459961, "global_step": 319417, "epoch": 1901} {"train_loss": -12.368551254272461, "global_step": 319418, "epoch": 1901} {"train_loss": -12.156149864196777, "global_step": 319419, "epoch": 1901} {"train_loss": -12.24646282196045, "global_step": 319420, "epoch": 1901} {"train_loss": -12.281991958618164, "global_step": 319421, "epoch": 1901} {"train_loss": -12.432369232177734, "global_step": 319422, "epoch": 1901} {"train_loss": -12.06523323059082, "global_step": 319423, "epoch": 1901} {"train_loss": -12.389047622680664, "global_step": 319424, "epoch": 1901} {"train_loss": -12.172414779663086, "global_step": 319425, "epoch": 1901} {"train_loss": -12.2857027053833, "global_step": 319426, "epoch": 1901} {"train_loss": -12.12673568725586, "global_step": 319427, "epoch": 1901} {"train_loss": -12.329994201660156, "global_step": 319428, "epoch": 1901} {"train_loss": -12.065577507019043, "global_step": 319429, "epoch": 1901} {"train_loss": -12.374651908874512, "global_step": 319430, "epoch": 1901} {"train_loss": -12.309396743774414, "global_step": 319431, "epoch": 1901} {"train_loss": -12.260501861572266, "global_step": 319432, "epoch": 1901} {"train_loss": -12.233251571655273, "global_step": 319433, "epoch": 1901} {"train_loss": -12.306632995605469, "global_step": 319434, "epoch": 1901} {"train_loss": -12.44593334197998, "global_step": 319435, "epoch": 1901} {"train_loss": -12.498108863830566, "global_step": 319436, "epoch": 1901} {"train_loss": -12.315908432006836, "global_step": 319437, "epoch": 1901} {"train_loss": -12.536664962768555, "global_step": 319438, "epoch": 1901} {"train_loss": -12.444040298461914, "global_step": 319439, "epoch": 1901} {"train_loss": -12.574816703796387, "global_step": 319440, "epoch": 1901} {"train_loss": -12.425613403320312, "global_step": 319441, "epoch": 1901} {"train_loss": -12.336414337158203, "global_step": 319442, "epoch": 1901} {"train_loss": -12.088987350463867, "global_step": 319443, "epoch": 1901} {"train_loss": -12.35787582397461, "global_step": 319444, "epoch": 1901} {"train_loss": -12.485267639160156, "global_step": 319445, "epoch": 1901} {"train_loss": -12.411510467529297, "global_step": 319446, "epoch": 1901} {"train_loss": -12.375726699829102, "global_step": 319447, "epoch": 1901} {"train_loss": -12.455840110778809, "global_step": 319448, "epoch": 1901} {"train_loss": -12.337098121643066, "global_step": 319449, "epoch": 1901} {"train_loss": -12.383819580078125, "global_step": 319450, "epoch": 1901} {"train_loss": -12.380861282348633, "global_step": 319451, "epoch": 1901} {"train_loss": -12.141542434692383, "global_step": 319452, "epoch": 1901} {"train_loss": -12.35588264465332, "global_step": 319453, "epoch": 1901} {"train_loss": -12.102970123291016, "global_step": 319454, "epoch": 1901} {"train_loss": -12.400165557861328, "global_step": 319455, "epoch": 1901} {"train_loss": -12.102141380310059, "global_step": 319456, "epoch": 1901} {"train_loss": -12.001516342163086, "global_step": 319457, "epoch": 1901} {"train_loss": -12.500419616699219, "global_step": 319458, "epoch": 1901} {"train_loss": -12.270832061767578, "global_step": 319459, "epoch": 1901} {"train_loss": -11.541133880615234, "global_step": 319460, "epoch": 1901} {"train_loss": -11.861109733581543, "global_step": 319461, "epoch": 1901} {"train_loss": -12.12175178527832, "global_step": 319462, "epoch": 1901} {"train_loss": -12.059955596923828, "global_step": 319463, "epoch": 1901} {"train_loss": -12.208139419555664, "global_step": 319464, "epoch": 1901} {"train_loss": -12.109880447387695, "global_step": 319465, "epoch": 1901} {"train_loss": -11.789289474487305, "global_step": 319466, "epoch": 1901} {"train_loss": -12.299570083618164, "global_step": 319467, "epoch": 1901} {"train_loss": -12.18617057800293, "global_step": 319468, "epoch": 1901} {"train_loss": -11.348360061645508, "global_step": 319469, "epoch": 1901} {"train_loss": -11.980131149291992, "global_step": 319470, "epoch": 1901} {"train_loss": -12.20280647277832, "global_step": 319471, "epoch": 1901} {"train_loss": -11.308370590209961, "global_step": 319472, "epoch": 1901} {"train_loss": -11.500053405761719, "global_step": 319473, "epoch": 1901} {"train_loss": -12.060795783996582, "global_step": 319474, "epoch": 1901} {"train_loss": -11.312467575073242, "global_step": 319475, "epoch": 1901} {"train_loss": -12.094072341918945, "global_step": 319476, "epoch": 1901} {"train_loss": -11.743476867675781, "global_step": 319477, "epoch": 1901} {"train_loss": -10.868555068969727, "global_step": 319478, "epoch": 1901} {"train_loss": -11.87974739074707, "global_step": 319479, "epoch": 1901} {"train_loss": -11.691082000732422, "global_step": 319480, "epoch": 1901} {"train_loss": -11.350625991821289, "global_step": 319481, "epoch": 1901} {"train_loss": -10.314456939697266, "global_step": 319482, "epoch": 1901} {"train_loss": -11.194219589233398, "global_step": 319483, "epoch": 1901} {"train_loss": -11.815431594848633, "global_step": 319484, "epoch": 1901} {"train_loss": -10.261523246765137, "global_step": 319485, "epoch": 1901} {"train_loss": -10.483665466308594, "global_step": 319486, "epoch": 1901} {"train_loss": -11.642849922180176, "global_step": 319487, "epoch": 1901} {"train_loss": -10.259969711303711, "global_step": 319488, "epoch": 1901} {"train_loss": -9.639638900756836, "global_step": 319489, "epoch": 1901} {"train_loss": -10.818989753723145, "global_step": 319490, "epoch": 1901} {"train_loss": -9.195538520812988, "global_step": 319491, "epoch": 1901} {"train_loss": -8.967191696166992, "global_step": 319492, "epoch": 1901} {"train_loss": -10.154752731323242, "global_step": 319493, "epoch": 1901} {"train_loss": -8.725238800048828, "global_step": 319494, "epoch": 1901} {"train_loss": -7.756148338317871, "global_step": 319495, "epoch": 1901} {"train_loss": -8.220118522644043, "global_step": 319496, "epoch": 1901} {"train_loss": -8.897052764892578, "global_step": 319497, "epoch": 1901} {"train_loss": -7.954019546508789, "global_step": 319498, "epoch": 1901} {"train_loss": -8.217334747314453, "global_step": 319499, "epoch": 1901} {"train_loss": -8.468718528747559, "global_step": 319500, "epoch": 1901} {"train_loss": -9.100942611694336, "global_step": 319501, "epoch": 1901} {"train_loss": -8.909557342529297, "global_step": 319502, "epoch": 1901} {"train_loss": -9.07890796661377, "global_step": 319503, "epoch": 1901} {"train_loss": -8.635652542114258, "global_step": 319504, "epoch": 1901} {"train_loss": -8.998823165893555, "global_step": 319505, "epoch": 1901} {"train_loss": -9.215353012084961, "global_step": 319506, "epoch": 1901} {"train_loss": -8.957130432128906, "global_step": 319507, "epoch": 1901} {"train_loss": -9.508197784423828, "global_step": 319508, "epoch": 1901} {"train_loss": -9.318880081176758, "global_step": 319509, "epoch": 1901} {"train_loss": -9.754426002502441, "global_step": 319510, "epoch": 1901} {"train_loss": -9.554634094238281, "global_step": 319511, "epoch": 1901} {"train_loss": -9.002788543701172, "global_step": 319512, "epoch": 1901} {"train_loss": -10.022092819213867, "global_step": 319513, "epoch": 1901} {"train_loss": -10.004984855651855, "global_step": 319514, "epoch": 1901} {"train_loss": -9.399628639221191, "global_step": 319515, "epoch": 1901} {"train_loss": -10.137126922607422, "global_step": 319516, "epoch": 1901} {"train_loss": -9.604205131530762, "global_step": 319517, "epoch": 1901} {"train_loss": -9.597980499267578, "global_step": 319518, "epoch": 1901} {"train_loss": -10.500432014465332, "global_step": 319519, "epoch": 1901} {"train_loss": -10.412694931030273, "global_step": 319520, "epoch": 1901} {"train_loss": -10.921106338500977, "global_step": 319521, "epoch": 1901} {"train_loss": -10.315197944641113, "global_step": 319522, "epoch": 1901} {"train_loss": -10.808969497680664, "global_step": 319523, "epoch": 1901} {"train_loss": -11.027103424072266, "global_step": 319524, "epoch": 1901} {"train_loss": -10.788679122924805, "global_step": 319525, "epoch": 1901} {"train_loss": -11.360800743103027, "global_step": 319526, "epoch": 1901} {"train_loss": -11.103372573852539, "global_step": 319527, "epoch": 1901} {"train_loss": -10.819779396057129, "global_step": 319528, "epoch": 1901} {"train_loss": -11.151178359985352, "global_step": 319529, "epoch": 1901} {"train_loss": -11.11746597290039, "global_step": 319530, "epoch": 1901} {"train_loss": -11.44968032836914, "global_step": 319531, "epoch": 1901} {"train_loss": -11.00007438659668, "global_step": 319532, "epoch": 1901} {"train_loss": -11.24980354309082, "global_step": 319533, "epoch": 1901} {"train_loss": -11.07780647277832, "global_step": 319534, "epoch": 1901} {"train_loss": -11.256285587946573, "global_step": 319535, "epoch": 1901, "val_loss": 284211.78125} {"train_loss": -11.464591026306152, "global_step": 319536, "epoch": 1902} {"train_loss": -11.119064331054688, "global_step": 319537, "epoch": 1902} {"train_loss": -11.901551246643066, "global_step": 319538, "epoch": 1902} {"train_loss": -11.050764083862305, "global_step": 319539, "epoch": 1902} {"train_loss": -11.878141403198242, "global_step": 319540, "epoch": 1902} {"train_loss": -11.069901466369629, "global_step": 319541, "epoch": 1902} {"train_loss": -11.877321243286133, "global_step": 319542, "epoch": 1902} {"train_loss": -11.162467002868652, "global_step": 319543, "epoch": 1902} {"train_loss": -10.976858139038086, "global_step": 319544, "epoch": 1902} {"train_loss": -11.310667037963867, "global_step": 319545, "epoch": 1902} {"train_loss": -10.704723358154297, "global_step": 319546, "epoch": 1902} {"train_loss": -11.705341339111328, "global_step": 319547, "epoch": 1902} {"train_loss": -11.015876770019531, "global_step": 319548, "epoch": 1902} {"train_loss": -11.66971206665039, "global_step": 319549, "epoch": 1902} {"train_loss": -11.434646606445312, "global_step": 319550, "epoch": 1902} {"train_loss": -11.446757316589355, "global_step": 319551, "epoch": 1902} {"train_loss": -11.68759536743164, "global_step": 319552, "epoch": 1902} {"train_loss": -11.337581634521484, "global_step": 319553, "epoch": 1902} {"train_loss": -11.799646377563477, "global_step": 319554, "epoch": 1902} {"train_loss": -11.774829864501953, "global_step": 319555, "epoch": 1902} {"train_loss": -11.648234367370605, "global_step": 319556, "epoch": 1902} {"train_loss": -11.83477783203125, "global_step": 319557, "epoch": 1902} {"train_loss": -11.97370719909668, "global_step": 319558, "epoch": 1902} {"train_loss": -11.879049301147461, "global_step": 319559, "epoch": 1902} {"train_loss": -11.658771514892578, "global_step": 319560, "epoch": 1902} {"train_loss": -11.913843154907227, "global_step": 319561, "epoch": 1902} {"train_loss": -11.81500244140625, "global_step": 319562, "epoch": 1902} {"train_loss": -11.915035247802734, "global_step": 319563, "epoch": 1902} {"train_loss": -12.146421432495117, "global_step": 319564, "epoch": 1902} {"train_loss": -12.169093132019043, "global_step": 319565, "epoch": 1902} {"train_loss": -12.047711372375488, "global_step": 319566, "epoch": 1902} {"train_loss": -12.21768569946289, "global_step": 319567, "epoch": 1902} {"train_loss": -11.973251342773438, "global_step": 319568, "epoch": 1902} {"train_loss": -12.046065330505371, "global_step": 319569, "epoch": 1902} {"train_loss": -12.186141014099121, "global_step": 319570, "epoch": 1902} {"train_loss": -11.985771179199219, "global_step": 319571, "epoch": 1902} {"train_loss": -12.02092170715332, "global_step": 319572, "epoch": 1902} {"train_loss": -11.942011833190918, "global_step": 319573, "epoch": 1902} {"train_loss": -12.090714454650879, "global_step": 319574, "epoch": 1902} {"train_loss": -11.920707702636719, "global_step": 319575, "epoch": 1902} {"train_loss": -12.135732650756836, "global_step": 319576, "epoch": 1902} {"train_loss": -12.16642951965332, "global_step": 319577, "epoch": 1902} {"train_loss": -12.086755752563477, "global_step": 319578, "epoch": 1902} {"train_loss": -12.33778190612793, "global_step": 319579, "epoch": 1902} {"train_loss": -12.156523704528809, "global_step": 319580, "epoch": 1902} {"train_loss": -12.168365478515625, "global_step": 319581, "epoch": 1902} {"train_loss": -12.16944408416748, "global_step": 319582, "epoch": 1902} {"train_loss": -12.119622230529785, "global_step": 319583, "epoch": 1902} {"train_loss": -12.144268035888672, "global_step": 319584, "epoch": 1902} {"train_loss": -12.271839141845703, "global_step": 319585, "epoch": 1902} {"train_loss": -12.110941886901855, "global_step": 319586, "epoch": 1902} {"train_loss": -12.35342025756836, "global_step": 319587, "epoch": 1902} {"train_loss": -12.226470947265625, "global_step": 319588, "epoch": 1902} {"train_loss": -12.35148811340332, "global_step": 319589, "epoch": 1902} {"train_loss": -12.24616813659668, "global_step": 319590, "epoch": 1902} {"train_loss": -11.967754364013672, "global_step": 319591, "epoch": 1902} {"train_loss": -12.201284408569336, "global_step": 319592, "epoch": 1902} {"train_loss": -12.260764122009277, "global_step": 319593, "epoch": 1902} {"train_loss": -12.227171897888184, "global_step": 319594, "epoch": 1902} {"train_loss": -12.33888053894043, "global_step": 319595, "epoch": 1902} {"train_loss": -12.376168251037598, "global_step": 319596, "epoch": 1902} {"train_loss": -12.309024810791016, "global_step": 319597, "epoch": 1902} {"train_loss": -12.430368423461914, "global_step": 319598, "epoch": 1902} {"train_loss": -12.293933868408203, "global_step": 319599, "epoch": 1902} {"train_loss": -12.380078315734863, "global_step": 319600, "epoch": 1902} {"train_loss": -12.567395210266113, "global_step": 319601, "epoch": 1902} {"train_loss": -12.48099136352539, "global_step": 319602, "epoch": 1902} {"train_loss": -12.411405563354492, "global_step": 319603, "epoch": 1902} {"train_loss": -12.517818450927734, "global_step": 319604, "epoch": 1902} {"train_loss": -12.364377975463867, "global_step": 319605, "epoch": 1902} {"train_loss": -12.580045700073242, "global_step": 319606, "epoch": 1902} {"train_loss": -12.376762390136719, "global_step": 319607, "epoch": 1902} {"train_loss": -12.482528686523438, "global_step": 319608, "epoch": 1902} {"train_loss": -12.585049629211426, "global_step": 319609, "epoch": 1902} {"train_loss": -12.449954986572266, "global_step": 319610, "epoch": 1902} {"train_loss": -12.557598114013672, "global_step": 319611, "epoch": 1902} {"train_loss": -12.605252265930176, "global_step": 319612, "epoch": 1902} {"train_loss": -12.367680549621582, "global_step": 319613, "epoch": 1902} {"train_loss": -12.521254539489746, "global_step": 319614, "epoch": 1902} {"train_loss": -12.493504524230957, "global_step": 319615, "epoch": 1902} {"train_loss": -12.446695327758789, "global_step": 319616, "epoch": 1902} {"train_loss": -12.402274131774902, "global_step": 319617, "epoch": 1902} {"train_loss": -12.330934524536133, "global_step": 319618, "epoch": 1902} {"train_loss": -11.534417152404785, "global_step": 319619, "epoch": 1902} {"train_loss": -11.258453369140625, "global_step": 319620, "epoch": 1902} {"train_loss": -11.388632774353027, "global_step": 319621, "epoch": 1902} {"train_loss": -12.250772476196289, "global_step": 319622, "epoch": 1902} {"train_loss": -10.245511054992676, "global_step": 319623, "epoch": 1902} {"train_loss": -11.510622024536133, "global_step": 319624, "epoch": 1902} {"train_loss": -12.03419303894043, "global_step": 319625, "epoch": 1902} {"train_loss": -10.488983154296875, "global_step": 319626, "epoch": 1902} {"train_loss": -12.298752784729004, "global_step": 319627, "epoch": 1902} {"train_loss": -11.075284957885742, "global_step": 319628, "epoch": 1902} {"train_loss": -11.397706031799316, "global_step": 319629, "epoch": 1902} {"train_loss": -10.725051879882812, "global_step": 319630, "epoch": 1902} {"train_loss": -12.101692199707031, "global_step": 319631, "epoch": 1902} {"train_loss": -11.425361633300781, "global_step": 319632, "epoch": 1902} {"train_loss": -11.08981704711914, "global_step": 319633, "epoch": 1902} {"train_loss": -10.006213188171387, "global_step": 319634, "epoch": 1902} {"train_loss": -12.03342056274414, "global_step": 319635, "epoch": 1902} {"train_loss": -11.171285629272461, "global_step": 319636, "epoch": 1902} {"train_loss": -11.333081245422363, "global_step": 319637, "epoch": 1902} {"train_loss": -9.304765701293945, "global_step": 319638, "epoch": 1902} {"train_loss": -9.277141571044922, "global_step": 319639, "epoch": 1902} {"train_loss": -10.023674011230469, "global_step": 319640, "epoch": 1902} {"train_loss": -11.31074047088623, "global_step": 319641, "epoch": 1902} {"train_loss": -8.37582015991211, "global_step": 319642, "epoch": 1902} {"train_loss": -7.880022048950195, "global_step": 319643, "epoch": 1902} {"train_loss": -8.528375625610352, "global_step": 319644, "epoch": 1902} {"train_loss": -8.612433433532715, "global_step": 319645, "epoch": 1902} {"train_loss": -8.744425773620605, "global_step": 319646, "epoch": 1902} {"train_loss": -9.519814491271973, "global_step": 319647, "epoch": 1902} {"train_loss": -8.300177574157715, "global_step": 319648, "epoch": 1902} {"train_loss": -8.707527160644531, "global_step": 319649, "epoch": 1902} {"train_loss": -9.773107528686523, "global_step": 319650, "epoch": 1902} {"train_loss": -9.605688095092773, "global_step": 319651, "epoch": 1902} {"train_loss": -10.069458961486816, "global_step": 319652, "epoch": 1902} {"train_loss": -11.028402328491211, "global_step": 319653, "epoch": 1902} {"train_loss": -10.960857391357422, "global_step": 319654, "epoch": 1902} {"train_loss": -11.87647819519043, "global_step": 319655, "epoch": 1902} {"train_loss": -11.244020462036133, "global_step": 319656, "epoch": 1902} {"train_loss": -9.941961288452148, "global_step": 319657, "epoch": 1902} {"train_loss": -11.105838775634766, "global_step": 319658, "epoch": 1902} {"train_loss": -10.841506958007812, "global_step": 319659, "epoch": 1902} {"train_loss": -10.278316497802734, "global_step": 319660, "epoch": 1902} {"train_loss": -11.351676940917969, "global_step": 319661, "epoch": 1902} {"train_loss": -9.756821632385254, "global_step": 319662, "epoch": 1902} {"train_loss": -9.846354484558105, "global_step": 319663, "epoch": 1902} {"train_loss": -10.808333396911621, "global_step": 319664, "epoch": 1902} {"train_loss": -10.834299087524414, "global_step": 319665, "epoch": 1902} {"train_loss": -9.543014526367188, "global_step": 319666, "epoch": 1902} {"train_loss": -10.527271270751953, "global_step": 319667, "epoch": 1902} {"train_loss": -11.34971809387207, "global_step": 319668, "epoch": 1902} {"train_loss": -10.061042785644531, "global_step": 319669, "epoch": 1902} {"train_loss": -11.013021469116211, "global_step": 319670, "epoch": 1902} {"train_loss": -11.326614379882812, "global_step": 319671, "epoch": 1902} {"train_loss": -10.988654136657715, "global_step": 319672, "epoch": 1902} {"train_loss": -10.883157730102539, "global_step": 319673, "epoch": 1902} {"train_loss": -11.74171257019043, "global_step": 319674, "epoch": 1902} {"train_loss": -10.868990898132324, "global_step": 319675, "epoch": 1902} {"train_loss": -11.50855827331543, "global_step": 319676, "epoch": 1902} {"train_loss": -11.719589233398438, "global_step": 319677, "epoch": 1902} {"train_loss": -11.683357238769531, "global_step": 319678, "epoch": 1902} {"train_loss": -11.37881851196289, "global_step": 319679, "epoch": 1902} {"train_loss": -11.661632537841797, "global_step": 319680, "epoch": 1902} {"train_loss": -11.733882904052734, "global_step": 319681, "epoch": 1902} {"train_loss": -11.490815162658691, "global_step": 319682, "epoch": 1902} {"train_loss": -11.993810653686523, "global_step": 319683, "epoch": 1902} {"train_loss": -11.774731636047363, "global_step": 319684, "epoch": 1902} {"train_loss": -11.847644805908203, "global_step": 319685, "epoch": 1902} {"train_loss": -11.890472412109375, "global_step": 319686, "epoch": 1902} {"train_loss": -11.634454727172852, "global_step": 319687, "epoch": 1902} {"train_loss": -11.882909774780273, "global_step": 319688, "epoch": 1902} {"train_loss": -11.791403770446777, "global_step": 319689, "epoch": 1902} {"train_loss": -11.892107009887695, "global_step": 319690, "epoch": 1902} {"train_loss": -11.977596282958984, "global_step": 319691, "epoch": 1902} {"train_loss": -12.101839065551758, "global_step": 319692, "epoch": 1902} {"train_loss": -12.126665115356445, "global_step": 319693, "epoch": 1902} {"train_loss": -11.89474868774414, "global_step": 319694, "epoch": 1902} {"train_loss": -11.972643852233887, "global_step": 319695, "epoch": 1902} {"train_loss": -12.149848937988281, "global_step": 319696, "epoch": 1902} {"train_loss": -12.189762115478516, "global_step": 319697, "epoch": 1902} {"train_loss": -11.797203063964844, "global_step": 319698, "epoch": 1902} {"train_loss": -11.85542106628418, "global_step": 319699, "epoch": 1902} {"train_loss": -11.942931175231934, "global_step": 319700, "epoch": 1902} {"train_loss": -12.16438102722168, "global_step": 319701, "epoch": 1902} {"train_loss": -12.153691291809082, "global_step": 319702, "epoch": 1902} {"train_loss": -11.499321137155805, "global_step": 319703, "epoch": 1902, "val_loss": 283120.53125} {"train_loss": -11.986523628234863, "global_step": 319704, "epoch": 1903} {"train_loss": -12.011283874511719, "global_step": 319705, "epoch": 1903} {"train_loss": -12.199851036071777, "global_step": 319706, "epoch": 1903} {"train_loss": -12.059160232543945, "global_step": 319707, "epoch": 1903} {"train_loss": -11.920828819274902, "global_step": 319708, "epoch": 1903} {"train_loss": -12.178037643432617, "global_step": 319709, "epoch": 1903} {"train_loss": -12.151792526245117, "global_step": 319710, "epoch": 1903} {"train_loss": -12.122509956359863, "global_step": 319711, "epoch": 1903} {"train_loss": -12.195930480957031, "global_step": 319712, "epoch": 1903} {"train_loss": -12.040544509887695, "global_step": 319713, "epoch": 1903} {"train_loss": -12.072892189025879, "global_step": 319714, "epoch": 1903} {"train_loss": -12.245155334472656, "global_step": 319715, "epoch": 1903} {"train_loss": -12.131731986999512, "global_step": 319716, "epoch": 1903} {"train_loss": -12.307891845703125, "global_step": 319717, "epoch": 1903} {"train_loss": -12.266120910644531, "global_step": 319718, "epoch": 1903} {"train_loss": -12.248722076416016, "global_step": 319719, "epoch": 1903} {"train_loss": -12.265386581420898, "global_step": 319720, "epoch": 1903} {"train_loss": -12.103875160217285, "global_step": 319721, "epoch": 1903} {"train_loss": -12.3729248046875, "global_step": 319722, "epoch": 1903} {"train_loss": -12.346933364868164, "global_step": 319723, "epoch": 1903} {"train_loss": -12.198345184326172, "global_step": 319724, "epoch": 1903} {"train_loss": -12.43195915222168, "global_step": 319725, "epoch": 1903} {"train_loss": -12.15501594543457, "global_step": 319726, "epoch": 1903} {"train_loss": -12.515380859375, "global_step": 319727, "epoch": 1903} {"train_loss": -12.215666770935059, "global_step": 319728, "epoch": 1903} {"train_loss": -12.402473449707031, "global_step": 319729, "epoch": 1903} {"train_loss": -12.334815979003906, "global_step": 319730, "epoch": 1903} {"train_loss": -12.22038459777832, "global_step": 319731, "epoch": 1903} {"train_loss": -12.440160751342773, "global_step": 319732, "epoch": 1903} {"train_loss": -12.162216186523438, "global_step": 319733, "epoch": 1903} {"train_loss": -12.183189392089844, "global_step": 319734, "epoch": 1903} {"train_loss": -12.441022872924805, "global_step": 319735, "epoch": 1903} {"train_loss": -12.262462615966797, "global_step": 319736, "epoch": 1903} {"train_loss": -12.564444541931152, "global_step": 319737, "epoch": 1903} {"train_loss": -12.560616493225098, "global_step": 319738, "epoch": 1903} {"train_loss": -12.445945739746094, "global_step": 319739, "epoch": 1903} {"train_loss": -12.551676750183105, "global_step": 319740, "epoch": 1903} {"train_loss": -12.342988967895508, "global_step": 319741, "epoch": 1903} {"train_loss": -12.412744522094727, "global_step": 319742, "epoch": 1903} {"train_loss": -12.401056289672852, "global_step": 319743, "epoch": 1903} {"train_loss": -12.46847152709961, "global_step": 319744, "epoch": 1903} {"train_loss": -12.209419250488281, "global_step": 319745, "epoch": 1903} {"train_loss": -12.359185218811035, "global_step": 319746, "epoch": 1903} {"train_loss": -12.342559814453125, "global_step": 319747, "epoch": 1903} {"train_loss": -12.334413528442383, "global_step": 319748, "epoch": 1903} {"train_loss": -12.068743705749512, "global_step": 319749, "epoch": 1903} {"train_loss": -11.91740608215332, "global_step": 319750, "epoch": 1903} {"train_loss": -11.650394439697266, "global_step": 319751, "epoch": 1903} {"train_loss": -12.198607444763184, "global_step": 319752, "epoch": 1903} {"train_loss": -12.174602508544922, "global_step": 319753, "epoch": 1903} {"train_loss": -11.310396194458008, "global_step": 319754, "epoch": 1903} {"train_loss": -11.468942642211914, "global_step": 319755, "epoch": 1903} {"train_loss": -11.437443733215332, "global_step": 319756, "epoch": 1903} {"train_loss": -11.277698516845703, "global_step": 319757, "epoch": 1903} {"train_loss": -11.921731948852539, "global_step": 319758, "epoch": 1903} {"train_loss": -12.007179260253906, "global_step": 319759, "epoch": 1903} {"train_loss": -12.191068649291992, "global_step": 319760, "epoch": 1903} {"train_loss": -12.248764038085938, "global_step": 319761, "epoch": 1903} {"train_loss": -12.324984550476074, "global_step": 319762, "epoch": 1903} {"train_loss": -12.366539001464844, "global_step": 319763, "epoch": 1903} {"train_loss": -12.122322082519531, "global_step": 319764, "epoch": 1903} {"train_loss": -12.209830284118652, "global_step": 319765, "epoch": 1903} {"train_loss": -11.878843307495117, "global_step": 319766, "epoch": 1903} {"train_loss": -12.323589324951172, "global_step": 319767, "epoch": 1903} {"train_loss": -11.710149765014648, "global_step": 319768, "epoch": 1903} {"train_loss": -12.184377670288086, "global_step": 319769, "epoch": 1903} {"train_loss": -11.897706985473633, "global_step": 319770, "epoch": 1903} {"train_loss": -11.831231117248535, "global_step": 319771, "epoch": 1903} {"train_loss": -10.860895156860352, "global_step": 319772, "epoch": 1903} {"train_loss": -11.585756301879883, "global_step": 319773, "epoch": 1903} {"train_loss": -12.362174034118652, "global_step": 319774, "epoch": 1903} {"train_loss": -11.802274703979492, "global_step": 319775, "epoch": 1903} {"train_loss": -11.674846649169922, "global_step": 319776, "epoch": 1903} {"train_loss": -11.680408477783203, "global_step": 319777, "epoch": 1903} {"train_loss": -12.087809562683105, "global_step": 319778, "epoch": 1903} {"train_loss": -12.212949752807617, "global_step": 319779, "epoch": 1903} {"train_loss": -11.791730880737305, "global_step": 319780, "epoch": 1903} {"train_loss": -12.111373901367188, "global_step": 319781, "epoch": 1903} {"train_loss": -12.09160041809082, "global_step": 319782, "epoch": 1903} {"train_loss": -11.837879180908203, "global_step": 319783, "epoch": 1903} {"train_loss": -11.501343727111816, "global_step": 319784, "epoch": 1903} {"train_loss": -11.652365684509277, "global_step": 319785, "epoch": 1903} {"train_loss": -10.930971145629883, "global_step": 319786, "epoch": 1903} {"train_loss": -11.61505126953125, "global_step": 319787, "epoch": 1903} {"train_loss": -10.838471412658691, "global_step": 319788, "epoch": 1903} {"train_loss": -11.744044303894043, "global_step": 319789, "epoch": 1903} {"train_loss": -11.778768539428711, "global_step": 319790, "epoch": 1903} {"train_loss": -11.378414154052734, "global_step": 319791, "epoch": 1903} {"train_loss": -11.806495666503906, "global_step": 319792, "epoch": 1903} {"train_loss": -10.817590713500977, "global_step": 319793, "epoch": 1903} {"train_loss": -11.772125244140625, "global_step": 319794, "epoch": 1903} {"train_loss": -12.112252235412598, "global_step": 319795, "epoch": 1903} {"train_loss": -11.891318321228027, "global_step": 319796, "epoch": 1903} {"train_loss": -11.770248413085938, "global_step": 319797, "epoch": 1903} {"train_loss": -11.548370361328125, "global_step": 319798, "epoch": 1903} {"train_loss": -11.668701171875, "global_step": 319799, "epoch": 1903} {"train_loss": -11.620721817016602, "global_step": 319800, "epoch": 1903} {"train_loss": -11.924427032470703, "global_step": 319801, "epoch": 1903} {"train_loss": -11.798637390136719, "global_step": 319802, "epoch": 1903} {"train_loss": -12.226194381713867, "global_step": 319803, "epoch": 1903} {"train_loss": -11.881509780883789, "global_step": 319804, "epoch": 1903} {"train_loss": -12.259523391723633, "global_step": 319805, "epoch": 1903} {"train_loss": -12.021343231201172, "global_step": 319806, "epoch": 1903} {"train_loss": -11.875411033630371, "global_step": 319807, "epoch": 1903} {"train_loss": -11.734806060791016, "global_step": 319808, "epoch": 1903} {"train_loss": -12.15317440032959, "global_step": 319809, "epoch": 1903} {"train_loss": -11.609498977661133, "global_step": 319810, "epoch": 1903} {"train_loss": -11.488759994506836, "global_step": 319811, "epoch": 1903} {"train_loss": -11.287814140319824, "global_step": 319812, "epoch": 1903} {"train_loss": -11.400625228881836, "global_step": 319813, "epoch": 1903} {"train_loss": -12.251853942871094, "global_step": 319814, "epoch": 1903} {"train_loss": -11.742645263671875, "global_step": 319815, "epoch": 1903} {"train_loss": -11.87278938293457, "global_step": 319816, "epoch": 1903} {"train_loss": -11.90351676940918, "global_step": 319817, "epoch": 1903} {"train_loss": -11.777992248535156, "global_step": 319818, "epoch": 1903} {"train_loss": -11.756766319274902, "global_step": 319819, "epoch": 1903} {"train_loss": -11.764002799987793, "global_step": 319820, "epoch": 1903} {"train_loss": -11.666507720947266, "global_step": 319821, "epoch": 1903} {"train_loss": -11.669233322143555, "global_step": 319822, "epoch": 1903} {"train_loss": -11.112825393676758, "global_step": 319823, "epoch": 1903} {"train_loss": -11.647778511047363, "global_step": 319824, "epoch": 1903} {"train_loss": -11.464818000793457, "global_step": 319825, "epoch": 1903} {"train_loss": -11.464365005493164, "global_step": 319826, "epoch": 1903} {"train_loss": -12.037429809570312, "global_step": 319827, "epoch": 1903} {"train_loss": -11.130515098571777, "global_step": 319828, "epoch": 1903} {"train_loss": -11.290212631225586, "global_step": 319829, "epoch": 1903} {"train_loss": -12.008708000183105, "global_step": 319830, "epoch": 1903} {"train_loss": -10.719637870788574, "global_step": 319831, "epoch": 1903} {"train_loss": -10.905921936035156, "global_step": 319832, "epoch": 1903} {"train_loss": -10.897424697875977, "global_step": 319833, "epoch": 1903} {"train_loss": -11.156661987304688, "global_step": 319834, "epoch": 1903} {"train_loss": -11.71936321258545, "global_step": 319835, "epoch": 1903} {"train_loss": -11.73270320892334, "global_step": 319836, "epoch": 1903} {"train_loss": -11.58960247039795, "global_step": 319837, "epoch": 1903} {"train_loss": -11.954607009887695, "global_step": 319838, "epoch": 1903} {"train_loss": -11.168275833129883, "global_step": 319839, "epoch": 1903} {"train_loss": -11.907429695129395, "global_step": 319840, "epoch": 1903} {"train_loss": -11.347261428833008, "global_step": 319841, "epoch": 1903} {"train_loss": -11.657706260681152, "global_step": 319842, "epoch": 1903} {"train_loss": -11.843841552734375, "global_step": 319843, "epoch": 1903} {"train_loss": -11.642829895019531, "global_step": 319844, "epoch": 1903} {"train_loss": -12.082094192504883, "global_step": 319845, "epoch": 1903} {"train_loss": -11.465779304504395, "global_step": 319846, "epoch": 1903} {"train_loss": -11.544469833374023, "global_step": 319847, "epoch": 1903} {"train_loss": -11.896810531616211, "global_step": 319848, "epoch": 1903} {"train_loss": -11.618653297424316, "global_step": 319849, "epoch": 1903} {"train_loss": -12.177663803100586, "global_step": 319850, "epoch": 1903} {"train_loss": -11.743413925170898, "global_step": 319851, "epoch": 1903} {"train_loss": -12.158212661743164, "global_step": 319852, "epoch": 1903} {"train_loss": -12.18480396270752, "global_step": 319853, "epoch": 1903} {"train_loss": -11.749446868896484, "global_step": 319854, "epoch": 1903} {"train_loss": -12.322864532470703, "global_step": 319855, "epoch": 1903} {"train_loss": -11.699968338012695, "global_step": 319856, "epoch": 1903} {"train_loss": -12.220008850097656, "global_step": 319857, "epoch": 1903} {"train_loss": -12.101828575134277, "global_step": 319858, "epoch": 1903} {"train_loss": -12.056546211242676, "global_step": 319859, "epoch": 1903} {"train_loss": -12.201449394226074, "global_step": 319860, "epoch": 1903} {"train_loss": -11.684242248535156, "global_step": 319861, "epoch": 1903} {"train_loss": -11.895881652832031, "global_step": 319862, "epoch": 1903} {"train_loss": -11.947858810424805, "global_step": 319863, "epoch": 1903} {"train_loss": -11.253358840942383, "global_step": 319864, "epoch": 1903} {"train_loss": -12.168310165405273, "global_step": 319865, "epoch": 1903} {"train_loss": -12.135287284851074, "global_step": 319866, "epoch": 1903} {"train_loss": -11.555438041687012, "global_step": 319867, "epoch": 1903} {"train_loss": -11.437482833862305, "global_step": 319868, "epoch": 1903} {"train_loss": -11.466894149780273, "global_step": 319869, "epoch": 1903} {"train_loss": -11.846956253051758, "global_step": 319870, "epoch": 1903} {"train_loss": -11.88965205919175, "global_step": 319871, "epoch": 1903, "val_loss": 283535.875} {"train_loss": -11.79961109161377, "global_step": 319872, "epoch": 1904} {"train_loss": -9.843748092651367, "global_step": 319873, "epoch": 1904} {"train_loss": -11.893518447875977, "global_step": 319874, "epoch": 1904} {"train_loss": -10.619138717651367, "global_step": 319875, "epoch": 1904} {"train_loss": -11.383859634399414, "global_step": 319876, "epoch": 1904} {"train_loss": -11.968981742858887, "global_step": 319877, "epoch": 1904} {"train_loss": -11.679415702819824, "global_step": 319878, "epoch": 1904} {"train_loss": -11.684221267700195, "global_step": 319879, "epoch": 1904} {"train_loss": -11.488121032714844, "global_step": 319880, "epoch": 1904} {"train_loss": -11.675943374633789, "global_step": 319881, "epoch": 1904} {"train_loss": -11.8047513961792, "global_step": 319882, "epoch": 1904} {"train_loss": -11.598722457885742, "global_step": 319883, "epoch": 1904} {"train_loss": -11.454206466674805, "global_step": 319884, "epoch": 1904} {"train_loss": -12.099283218383789, "global_step": 319885, "epoch": 1904} {"train_loss": -11.819705963134766, "global_step": 319886, "epoch": 1904} {"train_loss": -11.957358360290527, "global_step": 319887, "epoch": 1904} {"train_loss": -12.076333999633789, "global_step": 319888, "epoch": 1904} {"train_loss": -12.13638973236084, "global_step": 319889, "epoch": 1904} {"train_loss": -11.909860610961914, "global_step": 319890, "epoch": 1904} {"train_loss": -11.91588020324707, "global_step": 319891, "epoch": 1904} {"train_loss": -11.772003173828125, "global_step": 319892, "epoch": 1904} {"train_loss": -10.810079574584961, "global_step": 319893, "epoch": 1904} {"train_loss": -12.0665864944458, "global_step": 319894, "epoch": 1904} {"train_loss": -12.046234130859375, "global_step": 319895, "epoch": 1904} {"train_loss": -12.00489616394043, "global_step": 319896, "epoch": 1904} {"train_loss": -12.161698341369629, "global_step": 319897, "epoch": 1904} {"train_loss": -11.853837966918945, "global_step": 319898, "epoch": 1904} {"train_loss": -12.164977073669434, "global_step": 319899, "epoch": 1904} {"train_loss": -11.844837188720703, "global_step": 319900, "epoch": 1904} {"train_loss": -12.381488800048828, "global_step": 319901, "epoch": 1904} {"train_loss": -11.496315002441406, "global_step": 319902, "epoch": 1904} {"train_loss": -11.973708152770996, "global_step": 319903, "epoch": 1904} {"train_loss": -11.660896301269531, "global_step": 319904, "epoch": 1904} {"train_loss": -12.0557861328125, "global_step": 319905, "epoch": 1904} {"train_loss": -11.72198486328125, "global_step": 319906, "epoch": 1904} {"train_loss": -11.90011215209961, "global_step": 319907, "epoch": 1904} {"train_loss": -12.073432922363281, "global_step": 319908, "epoch": 1904} {"train_loss": -11.952276229858398, "global_step": 319909, "epoch": 1904} {"train_loss": -12.10566520690918, "global_step": 319910, "epoch": 1904} {"train_loss": -12.139774322509766, "global_step": 319911, "epoch": 1904} {"train_loss": -12.325531005859375, "global_step": 319912, "epoch": 1904} {"train_loss": -11.830162048339844, "global_step": 319913, "epoch": 1904} {"train_loss": -12.13180923461914, "global_step": 319914, "epoch": 1904} {"train_loss": -12.24036979675293, "global_step": 319915, "epoch": 1904} {"train_loss": -12.345706939697266, "global_step": 319916, "epoch": 1904} {"train_loss": -12.438544273376465, "global_step": 319917, "epoch": 1904} {"train_loss": -12.263250350952148, "global_step": 319918, "epoch": 1904} {"train_loss": -12.568716049194336, "global_step": 319919, "epoch": 1904} {"train_loss": -12.340360641479492, "global_step": 319920, "epoch": 1904} {"train_loss": -12.297457695007324, "global_step": 319921, "epoch": 1904} {"train_loss": -12.33419132232666, "global_step": 319922, "epoch": 1904} {"train_loss": -12.284643173217773, "global_step": 319923, "epoch": 1904} {"train_loss": -12.531389236450195, "global_step": 319924, "epoch": 1904} {"train_loss": -12.431529998779297, "global_step": 319925, "epoch": 1904} {"train_loss": -12.4690523147583, "global_step": 319926, "epoch": 1904} {"train_loss": -12.470486640930176, "global_step": 319927, "epoch": 1904} {"train_loss": -12.360040664672852, "global_step": 319928, "epoch": 1904} {"train_loss": -12.359504699707031, "global_step": 319929, "epoch": 1904} {"train_loss": -12.559602737426758, "global_step": 319930, "epoch": 1904} {"train_loss": -12.057245254516602, "global_step": 319931, "epoch": 1904} {"train_loss": -12.414701461791992, "global_step": 319932, "epoch": 1904} {"train_loss": -12.40730094909668, "global_step": 319933, "epoch": 1904} {"train_loss": -12.557456970214844, "global_step": 319934, "epoch": 1904} {"train_loss": -11.89321517944336, "global_step": 319935, "epoch": 1904} {"train_loss": -12.360634803771973, "global_step": 319936, "epoch": 1904} {"train_loss": -12.393816947937012, "global_step": 319937, "epoch": 1904} {"train_loss": -12.542570114135742, "global_step": 319938, "epoch": 1904} {"train_loss": -12.513946533203125, "global_step": 319939, "epoch": 1904} {"train_loss": -12.475255966186523, "global_step": 319940, "epoch": 1904} {"train_loss": -12.523306846618652, "global_step": 319941, "epoch": 1904} {"train_loss": -12.329231262207031, "global_step": 319942, "epoch": 1904} {"train_loss": -11.951719284057617, "global_step": 319943, "epoch": 1904} {"train_loss": -11.659969329833984, "global_step": 319944, "epoch": 1904} {"train_loss": -11.827691078186035, "global_step": 319945, "epoch": 1904} {"train_loss": -11.968912124633789, "global_step": 319946, "epoch": 1904} {"train_loss": -11.560982704162598, "global_step": 319947, "epoch": 1904} {"train_loss": -12.331323623657227, "global_step": 319948, "epoch": 1904} {"train_loss": -11.590120315551758, "global_step": 319949, "epoch": 1904} {"train_loss": -11.373794555664062, "global_step": 319950, "epoch": 1904} {"train_loss": -10.271860122680664, "global_step": 319951, "epoch": 1904} {"train_loss": -11.910185813903809, "global_step": 319952, "epoch": 1904} {"train_loss": -11.626213073730469, "global_step": 319953, "epoch": 1904} {"train_loss": -11.681666374206543, "global_step": 319954, "epoch": 1904} {"train_loss": -11.788067817687988, "global_step": 319955, "epoch": 1904} {"train_loss": -11.89054012298584, "global_step": 319956, "epoch": 1904} {"train_loss": -11.357061386108398, "global_step": 319957, "epoch": 1904} {"train_loss": -11.920099258422852, "global_step": 319958, "epoch": 1904} {"train_loss": -11.958001136779785, "global_step": 319959, "epoch": 1904} {"train_loss": -11.691003799438477, "global_step": 319960, "epoch": 1904} {"train_loss": -12.159530639648438, "global_step": 319961, "epoch": 1904} {"train_loss": -11.727762222290039, "global_step": 319962, "epoch": 1904} {"train_loss": -11.574893951416016, "global_step": 319963, "epoch": 1904} {"train_loss": -12.101419448852539, "global_step": 319964, "epoch": 1904} {"train_loss": -12.015654563903809, "global_step": 319965, "epoch": 1904} {"train_loss": -12.026459693908691, "global_step": 319966, "epoch": 1904} {"train_loss": -12.096456527709961, "global_step": 319967, "epoch": 1904} {"train_loss": -11.279781341552734, "global_step": 319968, "epoch": 1904} {"train_loss": -11.016197204589844, "global_step": 319969, "epoch": 1904} {"train_loss": -10.343311309814453, "global_step": 319970, "epoch": 1904} {"train_loss": -11.59127426147461, "global_step": 319971, "epoch": 1904} {"train_loss": -10.462777137756348, "global_step": 319972, "epoch": 1904} {"train_loss": -10.724910736083984, "global_step": 319973, "epoch": 1904} {"train_loss": -10.5133056640625, "global_step": 319974, "epoch": 1904} {"train_loss": -10.327098846435547, "global_step": 319975, "epoch": 1904} {"train_loss": -11.131345748901367, "global_step": 319976, "epoch": 1904} {"train_loss": -9.240955352783203, "global_step": 319977, "epoch": 1904} {"train_loss": -11.279680252075195, "global_step": 319978, "epoch": 1904} {"train_loss": -11.157510757446289, "global_step": 319979, "epoch": 1904} {"train_loss": -10.150657653808594, "global_step": 319980, "epoch": 1904} {"train_loss": -12.024079322814941, "global_step": 319981, "epoch": 1904} {"train_loss": -10.228010177612305, "global_step": 319982, "epoch": 1904} {"train_loss": -10.926986694335938, "global_step": 319983, "epoch": 1904} {"train_loss": -10.928208351135254, "global_step": 319984, "epoch": 1904} {"train_loss": -10.133722305297852, "global_step": 319985, "epoch": 1904} {"train_loss": -11.377567291259766, "global_step": 319986, "epoch": 1904} {"train_loss": -8.99780559539795, "global_step": 319987, "epoch": 1904} {"train_loss": -11.421713829040527, "global_step": 319988, "epoch": 1904} {"train_loss": -9.723867416381836, "global_step": 319989, "epoch": 1904} {"train_loss": -10.824615478515625, "global_step": 319990, "epoch": 1904} {"train_loss": -9.708551406860352, "global_step": 319991, "epoch": 1904} {"train_loss": -11.156892776489258, "global_step": 319992, "epoch": 1904} {"train_loss": -8.980128288269043, "global_step": 319993, "epoch": 1904} {"train_loss": -10.331963539123535, "global_step": 319994, "epoch": 1904} {"train_loss": -9.891298294067383, "global_step": 319995, "epoch": 1904} {"train_loss": -10.969903945922852, "global_step": 319996, "epoch": 1904} {"train_loss": -9.81422233581543, "global_step": 319997, "epoch": 1904} {"train_loss": -10.176774978637695, "global_step": 319998, "epoch": 1904} {"train_loss": -11.139480590820312, "global_step": 319999, "epoch": 1904} {"train_loss": -10.268424987792969, "global_step": 320000, "epoch": 1904} {"train_loss": -11.617491722106934, "global_step": 320001, "epoch": 1904} {"train_loss": -10.909394264221191, "global_step": 320002, "epoch": 1904} {"train_loss": -10.943079948425293, "global_step": 320003, "epoch": 1904} {"train_loss": -10.994718551635742, "global_step": 320004, "epoch": 1904} {"train_loss": -11.338111877441406, "global_step": 320005, "epoch": 1904} {"train_loss": -11.038379669189453, "global_step": 320006, "epoch": 1904} {"train_loss": -11.713727951049805, "global_step": 320007, "epoch": 1904} {"train_loss": -10.870713233947754, "global_step": 320008, "epoch": 1904} {"train_loss": -11.393678665161133, "global_step": 320009, "epoch": 1904} {"train_loss": -11.459888458251953, "global_step": 320010, "epoch": 1904} {"train_loss": -11.600662231445312, "global_step": 320011, "epoch": 1904} {"train_loss": -10.785640716552734, "global_step": 320012, "epoch": 1904} {"train_loss": -11.601966857910156, "global_step": 320013, "epoch": 1904} {"train_loss": -11.268097877502441, "global_step": 320014, "epoch": 1904} {"train_loss": -11.440711975097656, "global_step": 320015, "epoch": 1904} {"train_loss": -11.620250701904297, "global_step": 320016, "epoch": 1904} {"train_loss": -11.738968849182129, "global_step": 320017, "epoch": 1904} {"train_loss": -11.46932315826416, "global_step": 320018, "epoch": 1904} {"train_loss": -12.010412216186523, "global_step": 320019, "epoch": 1904} {"train_loss": -11.694782257080078, "global_step": 320020, "epoch": 1904} {"train_loss": -11.579853057861328, "global_step": 320021, "epoch": 1904} {"train_loss": -12.014632225036621, "global_step": 320022, "epoch": 1904} {"train_loss": -11.421487808227539, "global_step": 320023, "epoch": 1904} {"train_loss": -11.98393440246582, "global_step": 320024, "epoch": 1904} {"train_loss": -11.822248458862305, "global_step": 320025, "epoch": 1904} {"train_loss": -12.049764633178711, "global_step": 320026, "epoch": 1904} {"train_loss": -11.823681831359863, "global_step": 320027, "epoch": 1904} {"train_loss": -11.99437141418457, "global_step": 320028, "epoch": 1904} {"train_loss": -12.128445625305176, "global_step": 320029, "epoch": 1904} {"train_loss": -11.712596893310547, "global_step": 320030, "epoch": 1904} {"train_loss": -12.023839950561523, "global_step": 320031, "epoch": 1904} {"train_loss": -12.020744323730469, "global_step": 320032, "epoch": 1904} {"train_loss": -11.817408561706543, "global_step": 320033, "epoch": 1904} {"train_loss": -11.957117080688477, "global_step": 320034, "epoch": 1904} {"train_loss": -12.058284759521484, "global_step": 320035, "epoch": 1904} {"train_loss": -11.986021041870117, "global_step": 320036, "epoch": 1904} {"train_loss": -12.035648345947266, "global_step": 320037, "epoch": 1904} {"train_loss": -11.942980766296387, "global_step": 320038, "epoch": 1904} {"train_loss": -11.60827376161303, "global_step": 320039, "epoch": 1904, "val_loss": 287532.46875} {"train_loss": -12.24157428741455, "global_step": 320040, "epoch": 1905} {"train_loss": -12.252395629882812, "global_step": 320041, "epoch": 1905} {"train_loss": -11.99415111541748, "global_step": 320042, "epoch": 1905} {"train_loss": -12.06607437133789, "global_step": 320043, "epoch": 1905} {"train_loss": -12.160442352294922, "global_step": 320044, "epoch": 1905} {"train_loss": -12.182281494140625, "global_step": 320045, "epoch": 1905} {"train_loss": -12.101273536682129, "global_step": 320046, "epoch": 1905} {"train_loss": -12.126792907714844, "global_step": 320047, "epoch": 1905} {"train_loss": -12.191300392150879, "global_step": 320048, "epoch": 1905} {"train_loss": -12.282174110412598, "global_step": 320049, "epoch": 1905} {"train_loss": -12.290291786193848, "global_step": 320050, "epoch": 1905} {"train_loss": -12.28720474243164, "global_step": 320051, "epoch": 1905} {"train_loss": -12.329963684082031, "global_step": 320052, "epoch": 1905} {"train_loss": -12.407262802124023, "global_step": 320053, "epoch": 1905} {"train_loss": -12.284320831298828, "global_step": 320054, "epoch": 1905} {"train_loss": -12.416149139404297, "global_step": 320055, "epoch": 1905} {"train_loss": -12.310402870178223, "global_step": 320056, "epoch": 1905} {"train_loss": -12.340588569641113, "global_step": 320057, "epoch": 1905} {"train_loss": -12.245403289794922, "global_step": 320058, "epoch": 1905} {"train_loss": -12.161233901977539, "global_step": 320059, "epoch": 1905} {"train_loss": -12.321365356445312, "global_step": 320060, "epoch": 1905} {"train_loss": -12.496551513671875, "global_step": 320061, "epoch": 1905} {"train_loss": -12.150181770324707, "global_step": 320062, "epoch": 1905} {"train_loss": -12.27465534210205, "global_step": 320063, "epoch": 1905} {"train_loss": -12.351987838745117, "global_step": 320064, "epoch": 1905} {"train_loss": -12.148890495300293, "global_step": 320065, "epoch": 1905} {"train_loss": -12.101607322692871, "global_step": 320066, "epoch": 1905} {"train_loss": -12.330930709838867, "global_step": 320067, "epoch": 1905} {"train_loss": -12.29362964630127, "global_step": 320068, "epoch": 1905} {"train_loss": -12.391880989074707, "global_step": 320069, "epoch": 1905} {"train_loss": -12.440196990966797, "global_step": 320070, "epoch": 1905} {"train_loss": -12.599676132202148, "global_step": 320071, "epoch": 1905} {"train_loss": -12.317399024963379, "global_step": 320072, "epoch": 1905} {"train_loss": -12.48227310180664, "global_step": 320073, "epoch": 1905} {"train_loss": -12.496026992797852, "global_step": 320074, "epoch": 1905} {"train_loss": -12.543495178222656, "global_step": 320075, "epoch": 1905} {"train_loss": -12.307170867919922, "global_step": 320076, "epoch": 1905} {"train_loss": -12.501940727233887, "global_step": 320077, "epoch": 1905} {"train_loss": -12.364418029785156, "global_step": 320078, "epoch": 1905} {"train_loss": -11.900176048278809, "global_step": 320079, "epoch": 1905} {"train_loss": -12.099855422973633, "global_step": 320080, "epoch": 1905} {"train_loss": -12.510679244995117, "global_step": 320081, "epoch": 1905} {"train_loss": -12.051176071166992, "global_step": 320082, "epoch": 1905} {"train_loss": -11.32931900024414, "global_step": 320083, "epoch": 1905} {"train_loss": -12.096878051757812, "global_step": 320084, "epoch": 1905} {"train_loss": -12.272539138793945, "global_step": 320085, "epoch": 1905} {"train_loss": -11.797367095947266, "global_step": 320086, "epoch": 1905} {"train_loss": -11.109333038330078, "global_step": 320087, "epoch": 1905} {"train_loss": -10.818628311157227, "global_step": 320088, "epoch": 1905} {"train_loss": -12.137344360351562, "global_step": 320089, "epoch": 1905} {"train_loss": -11.779495239257812, "global_step": 320090, "epoch": 1905} {"train_loss": -12.391727447509766, "global_step": 320091, "epoch": 1905} {"train_loss": -11.902322769165039, "global_step": 320092, "epoch": 1905} {"train_loss": -12.13985538482666, "global_step": 320093, "epoch": 1905} {"train_loss": -12.07998275756836, "global_step": 320094, "epoch": 1905} {"train_loss": -11.96329116821289, "global_step": 320095, "epoch": 1905} {"train_loss": -12.28436279296875, "global_step": 320096, "epoch": 1905} {"train_loss": -12.013257026672363, "global_step": 320097, "epoch": 1905} {"train_loss": -12.210464477539062, "global_step": 320098, "epoch": 1905} {"train_loss": -11.588140487670898, "global_step": 320099, "epoch": 1905} {"train_loss": -12.022518157958984, "global_step": 320100, "epoch": 1905} {"train_loss": -11.907844543457031, "global_step": 320101, "epoch": 1905} {"train_loss": -11.494821548461914, "global_step": 320102, "epoch": 1905} {"train_loss": -11.008298873901367, "global_step": 320103, "epoch": 1905} {"train_loss": -11.518752098083496, "global_step": 320104, "epoch": 1905} {"train_loss": -10.971477508544922, "global_step": 320105, "epoch": 1905} {"train_loss": -11.845595359802246, "global_step": 320106, "epoch": 1905} {"train_loss": -11.961767196655273, "global_step": 320107, "epoch": 1905} {"train_loss": -11.558304786682129, "global_step": 320108, "epoch": 1905} {"train_loss": -11.18401050567627, "global_step": 320109, "epoch": 1905} {"train_loss": -11.328771591186523, "global_step": 320110, "epoch": 1905} {"train_loss": -11.36669921875, "global_step": 320111, "epoch": 1905} {"train_loss": -10.086109161376953, "global_step": 320112, "epoch": 1905} {"train_loss": -10.442290306091309, "global_step": 320113, "epoch": 1905} {"train_loss": -8.678850173950195, "global_step": 320114, "epoch": 1905} {"train_loss": -8.712240219116211, "global_step": 320115, "epoch": 1905} {"train_loss": -9.665462493896484, "global_step": 320116, "epoch": 1905} {"train_loss": -10.980684280395508, "global_step": 320117, "epoch": 1905} {"train_loss": -9.607664108276367, "global_step": 320118, "epoch": 1905} {"train_loss": -8.745770454406738, "global_step": 320119, "epoch": 1905} {"train_loss": -9.62031364440918, "global_step": 320120, "epoch": 1905} {"train_loss": -10.27992057800293, "global_step": 320121, "epoch": 1905} {"train_loss": -10.763751983642578, "global_step": 320122, "epoch": 1905} {"train_loss": -10.127957344055176, "global_step": 320123, "epoch": 1905} {"train_loss": -11.222731590270996, "global_step": 320124, "epoch": 1905} {"train_loss": -10.934782028198242, "global_step": 320125, "epoch": 1905} {"train_loss": -10.204988479614258, "global_step": 320126, "epoch": 1905} {"train_loss": -10.311270713806152, "global_step": 320127, "epoch": 1905} {"train_loss": -9.330078125, "global_step": 320128, "epoch": 1905} {"train_loss": -9.646289825439453, "global_step": 320129, "epoch": 1905} {"train_loss": -10.25585651397705, "global_step": 320130, "epoch": 1905} {"train_loss": -10.044462203979492, "global_step": 320131, "epoch": 1905} {"train_loss": -9.878776550292969, "global_step": 320132, "epoch": 1905} {"train_loss": -10.974319458007812, "global_step": 320133, "epoch": 1905} {"train_loss": -9.381593704223633, "global_step": 320134, "epoch": 1905} {"train_loss": -10.795191764831543, "global_step": 320135, "epoch": 1905} {"train_loss": -10.709667205810547, "global_step": 320136, "epoch": 1905} {"train_loss": -10.52946662902832, "global_step": 320137, "epoch": 1905} {"train_loss": -10.852243423461914, "global_step": 320138, "epoch": 1905} {"train_loss": -11.508660316467285, "global_step": 320139, "epoch": 1905} {"train_loss": -11.15346622467041, "global_step": 320140, "epoch": 1905} {"train_loss": -11.336803436279297, "global_step": 320141, "epoch": 1905} {"train_loss": -11.200404167175293, "global_step": 320142, "epoch": 1905} {"train_loss": -11.421342849731445, "global_step": 320143, "epoch": 1905} {"train_loss": -11.330574989318848, "global_step": 320144, "epoch": 1905} {"train_loss": -11.292547225952148, "global_step": 320145, "epoch": 1905} {"train_loss": -11.376880645751953, "global_step": 320146, "epoch": 1905} {"train_loss": -11.153997421264648, "global_step": 320147, "epoch": 1905} {"train_loss": -11.333179473876953, "global_step": 320148, "epoch": 1905} {"train_loss": -11.414587020874023, "global_step": 320149, "epoch": 1905} {"train_loss": -11.815208435058594, "global_step": 320150, "epoch": 1905} {"train_loss": -11.272080421447754, "global_step": 320151, "epoch": 1905} {"train_loss": -11.56907844543457, "global_step": 320152, "epoch": 1905} {"train_loss": -11.527053833007812, "global_step": 320153, "epoch": 1905} {"train_loss": -11.776735305786133, "global_step": 320154, "epoch": 1905} {"train_loss": -11.75973129272461, "global_step": 320155, "epoch": 1905} {"train_loss": -11.65311050415039, "global_step": 320156, "epoch": 1905} {"train_loss": -11.857007026672363, "global_step": 320157, "epoch": 1905} {"train_loss": -11.61396598815918, "global_step": 320158, "epoch": 1905} {"train_loss": -11.704448699951172, "global_step": 320159, "epoch": 1905} {"train_loss": -11.883285522460938, "global_step": 320160, "epoch": 1905} {"train_loss": -11.825069427490234, "global_step": 320161, "epoch": 1905} {"train_loss": -11.848114013671875, "global_step": 320162, "epoch": 1905} {"train_loss": -12.025175094604492, "global_step": 320163, "epoch": 1905} {"train_loss": -11.742844581604004, "global_step": 320164, "epoch": 1905} {"train_loss": -12.0549955368042, "global_step": 320165, "epoch": 1905} {"train_loss": -11.87905502319336, "global_step": 320166, "epoch": 1905} {"train_loss": -11.709939956665039, "global_step": 320167, "epoch": 1905} {"train_loss": -12.098076820373535, "global_step": 320168, "epoch": 1905} {"train_loss": -11.677312850952148, "global_step": 320169, "epoch": 1905} {"train_loss": -12.002443313598633, "global_step": 320170, "epoch": 1905} {"train_loss": -12.023107528686523, "global_step": 320171, "epoch": 1905} {"train_loss": -12.050224304199219, "global_step": 320172, "epoch": 1905} {"train_loss": -11.892704963684082, "global_step": 320173, "epoch": 1905} {"train_loss": -12.108979225158691, "global_step": 320174, "epoch": 1905} {"train_loss": -11.856406211853027, "global_step": 320175, "epoch": 1905} {"train_loss": -12.081497192382812, "global_step": 320176, "epoch": 1905} {"train_loss": -12.12826156616211, "global_step": 320177, "epoch": 1905} {"train_loss": -12.205893516540527, "global_step": 320178, "epoch": 1905} {"train_loss": -11.700400352478027, "global_step": 320179, "epoch": 1905} {"train_loss": -12.159964561462402, "global_step": 320180, "epoch": 1905} {"train_loss": -11.950614929199219, "global_step": 320181, "epoch": 1905} {"train_loss": -11.960640907287598, "global_step": 320182, "epoch": 1905} {"train_loss": -12.207817077636719, "global_step": 320183, "epoch": 1905} {"train_loss": -12.171747207641602, "global_step": 320184, "epoch": 1905} {"train_loss": -11.844776153564453, "global_step": 320185, "epoch": 1905} {"train_loss": -12.056558609008789, "global_step": 320186, "epoch": 1905} {"train_loss": -11.799016952514648, "global_step": 320187, "epoch": 1905} {"train_loss": -12.222053527832031, "global_step": 320188, "epoch": 1905} {"train_loss": -11.803382873535156, "global_step": 320189, "epoch": 1905} {"train_loss": -12.050302505493164, "global_step": 320190, "epoch": 1905} {"train_loss": -12.128124237060547, "global_step": 320191, "epoch": 1905} {"train_loss": -11.922189712524414, "global_step": 320192, "epoch": 1905} {"train_loss": -12.218896865844727, "global_step": 320193, "epoch": 1905} {"train_loss": -11.868898391723633, "global_step": 320194, "epoch": 1905} {"train_loss": -12.021605491638184, "global_step": 320195, "epoch": 1905} {"train_loss": -11.879372596740723, "global_step": 320196, "epoch": 1905} {"train_loss": -12.274093627929688, "global_step": 320197, "epoch": 1905} {"train_loss": -12.12559700012207, "global_step": 320198, "epoch": 1905} {"train_loss": -12.202581405639648, "global_step": 320199, "epoch": 1905} {"train_loss": -12.31074333190918, "global_step": 320200, "epoch": 1905} {"train_loss": -12.192377090454102, "global_step": 320201, "epoch": 1905} {"train_loss": -12.328754425048828, "global_step": 320202, "epoch": 1905} {"train_loss": -11.95000171661377, "global_step": 320203, "epoch": 1905} {"train_loss": -12.107479095458984, "global_step": 320204, "epoch": 1905} {"train_loss": -12.337759017944336, "global_step": 320205, "epoch": 1905} {"train_loss": -12.302240371704102, "global_step": 320206, "epoch": 1905} {"train_loss": -11.662970247722807, "global_step": 320207, "epoch": 1905, "val_loss": 280982.96875, "train_action_mse_error": 1.0230540037155151} {"train_loss": -12.482330322265625, "global_step": 320208, "epoch": 1906} {"train_loss": -12.169303894042969, "global_step": 320209, "epoch": 1906} {"train_loss": -12.372878074645996, "global_step": 320210, "epoch": 1906} {"train_loss": -12.329665184020996, "global_step": 320211, "epoch": 1906} {"train_loss": -12.2713623046875, "global_step": 320212, "epoch": 1906} {"train_loss": -12.349800109863281, "global_step": 320213, "epoch": 1906} {"train_loss": -12.224930763244629, "global_step": 320214, "epoch": 1906} {"train_loss": -12.469549179077148, "global_step": 320215, "epoch": 1906} {"train_loss": -12.194737434387207, "global_step": 320216, "epoch": 1906} {"train_loss": -12.239288330078125, "global_step": 320217, "epoch": 1906} {"train_loss": -12.259895324707031, "global_step": 320218, "epoch": 1906} {"train_loss": -12.163704872131348, "global_step": 320219, "epoch": 1906} {"train_loss": -12.571382522583008, "global_step": 320220, "epoch": 1906} {"train_loss": -12.25293254852295, "global_step": 320221, "epoch": 1906} {"train_loss": -12.327014923095703, "global_step": 320222, "epoch": 1906} {"train_loss": -12.165523529052734, "global_step": 320223, "epoch": 1906} {"train_loss": -12.187134742736816, "global_step": 320224, "epoch": 1906} {"train_loss": -12.678617477416992, "global_step": 320225, "epoch": 1906} {"train_loss": -12.31678295135498, "global_step": 320226, "epoch": 1906} {"train_loss": -12.330657958984375, "global_step": 320227, "epoch": 1906} {"train_loss": -12.440366744995117, "global_step": 320228, "epoch": 1906} {"train_loss": -12.14903450012207, "global_step": 320229, "epoch": 1906} {"train_loss": -12.28138542175293, "global_step": 320230, "epoch": 1906} {"train_loss": -12.530313491821289, "global_step": 320231, "epoch": 1906} {"train_loss": -12.140475273132324, "global_step": 320232, "epoch": 1906} {"train_loss": -12.429931640625, "global_step": 320233, "epoch": 1906} {"train_loss": -12.34062385559082, "global_step": 320234, "epoch": 1906} {"train_loss": -12.62142562866211, "global_step": 320235, "epoch": 1906} {"train_loss": -12.427543640136719, "global_step": 320236, "epoch": 1906} {"train_loss": -12.071462631225586, "global_step": 320237, "epoch": 1906} {"train_loss": -12.621623039245605, "global_step": 320238, "epoch": 1906} {"train_loss": -12.331430435180664, "global_step": 320239, "epoch": 1906} {"train_loss": -12.133745193481445, "global_step": 320240, "epoch": 1906} {"train_loss": -12.174461364746094, "global_step": 320241, "epoch": 1906} {"train_loss": -12.575614929199219, "global_step": 320242, "epoch": 1906} {"train_loss": -11.910245895385742, "global_step": 320243, "epoch": 1906} {"train_loss": -12.05124282836914, "global_step": 320244, "epoch": 1906} {"train_loss": -11.89314079284668, "global_step": 320245, "epoch": 1906} {"train_loss": -11.891172409057617, "global_step": 320246, "epoch": 1906} {"train_loss": -11.818461418151855, "global_step": 320247, "epoch": 1906} {"train_loss": -11.57213020324707, "global_step": 320248, "epoch": 1906} {"train_loss": -12.18596076965332, "global_step": 320249, "epoch": 1906} {"train_loss": -10.950738906860352, "global_step": 320250, "epoch": 1906} {"train_loss": -10.495382308959961, "global_step": 320251, "epoch": 1906} {"train_loss": -12.036251068115234, "global_step": 320252, "epoch": 1906} {"train_loss": -11.877164840698242, "global_step": 320253, "epoch": 1906} {"train_loss": -10.974750518798828, "global_step": 320254, "epoch": 1906} {"train_loss": -12.24212646484375, "global_step": 320255, "epoch": 1906} {"train_loss": -10.822311401367188, "global_step": 320256, "epoch": 1906} {"train_loss": -11.028047561645508, "global_step": 320257, "epoch": 1906} {"train_loss": -12.248390197753906, "global_step": 320258, "epoch": 1906} {"train_loss": -12.07905101776123, "global_step": 320259, "epoch": 1906} {"train_loss": -12.112607955932617, "global_step": 320260, "epoch": 1906} {"train_loss": -11.839412689208984, "global_step": 320261, "epoch": 1906} {"train_loss": -11.892799377441406, "global_step": 320262, "epoch": 1906} {"train_loss": -11.932491302490234, "global_step": 320263, "epoch": 1906} {"train_loss": -11.90324878692627, "global_step": 320264, "epoch": 1906} {"train_loss": -12.132601737976074, "global_step": 320265, "epoch": 1906} {"train_loss": -11.293031692504883, "global_step": 320266, "epoch": 1906} {"train_loss": -12.183913230895996, "global_step": 320267, "epoch": 1906} {"train_loss": -11.394916534423828, "global_step": 320268, "epoch": 1906} {"train_loss": -12.019096374511719, "global_step": 320269, "epoch": 1906} {"train_loss": -11.553254127502441, "global_step": 320270, "epoch": 1906} {"train_loss": -12.017457962036133, "global_step": 320271, "epoch": 1906} {"train_loss": -11.049795150756836, "global_step": 320272, "epoch": 1906} {"train_loss": -12.158404350280762, "global_step": 320273, "epoch": 1906} {"train_loss": -11.72744369506836, "global_step": 320274, "epoch": 1906} {"train_loss": -11.527095794677734, "global_step": 320275, "epoch": 1906} {"train_loss": -10.091398239135742, "global_step": 320276, "epoch": 1906} {"train_loss": -10.087589263916016, "global_step": 320277, "epoch": 1906} {"train_loss": -10.57933235168457, "global_step": 320278, "epoch": 1906} {"train_loss": -10.138517379760742, "global_step": 320279, "epoch": 1906} {"train_loss": -9.236696243286133, "global_step": 320280, "epoch": 1906} {"train_loss": -9.489123344421387, "global_step": 320281, "epoch": 1906} {"train_loss": -10.760974884033203, "global_step": 320282, "epoch": 1906} {"train_loss": -9.593846321105957, "global_step": 320283, "epoch": 1906} {"train_loss": -9.79731559753418, "global_step": 320284, "epoch": 1906} {"train_loss": -10.058462142944336, "global_step": 320285, "epoch": 1906} {"train_loss": -11.25739860534668, "global_step": 320286, "epoch": 1906} {"train_loss": -9.298851013183594, "global_step": 320287, "epoch": 1906} {"train_loss": -11.568256378173828, "global_step": 320288, "epoch": 1906} {"train_loss": -9.955869674682617, "global_step": 320289, "epoch": 1906} {"train_loss": -11.517578125, "global_step": 320290, "epoch": 1906} {"train_loss": -10.597829818725586, "global_step": 320291, "epoch": 1906} {"train_loss": -11.501174926757812, "global_step": 320292, "epoch": 1906} {"train_loss": -10.421976089477539, "global_step": 320293, "epoch": 1906} {"train_loss": -11.812225341796875, "global_step": 320294, "epoch": 1906} {"train_loss": -10.96021842956543, "global_step": 320295, "epoch": 1906} {"train_loss": -11.382792472839355, "global_step": 320296, "epoch": 1906} {"train_loss": -10.974446296691895, "global_step": 320297, "epoch": 1906} {"train_loss": -11.38794231414795, "global_step": 320298, "epoch": 1906} {"train_loss": -11.371381759643555, "global_step": 320299, "epoch": 1906} {"train_loss": -11.81451416015625, "global_step": 320300, "epoch": 1906} {"train_loss": -11.4650297164917, "global_step": 320301, "epoch": 1906} {"train_loss": -11.966987609863281, "global_step": 320302, "epoch": 1906} {"train_loss": -11.727336883544922, "global_step": 320303, "epoch": 1906} {"train_loss": -11.8612642288208, "global_step": 320304, "epoch": 1906} {"train_loss": -11.286402702331543, "global_step": 320305, "epoch": 1906} {"train_loss": -11.545112609863281, "global_step": 320306, "epoch": 1906} {"train_loss": -11.407567977905273, "global_step": 320307, "epoch": 1906} {"train_loss": -12.054088592529297, "global_step": 320308, "epoch": 1906} {"train_loss": -11.460224151611328, "global_step": 320309, "epoch": 1906} {"train_loss": -12.122154235839844, "global_step": 320310, "epoch": 1906} {"train_loss": -11.487590789794922, "global_step": 320311, "epoch": 1906} {"train_loss": -11.788073539733887, "global_step": 320312, "epoch": 1906} {"train_loss": -11.852370262145996, "global_step": 320313, "epoch": 1906} {"train_loss": -11.509872436523438, "global_step": 320314, "epoch": 1906} {"train_loss": -11.692131042480469, "global_step": 320315, "epoch": 1906} {"train_loss": -11.8836088180542, "global_step": 320316, "epoch": 1906} {"train_loss": -11.734399795532227, "global_step": 320317, "epoch": 1906} {"train_loss": -12.090065002441406, "global_step": 320318, "epoch": 1906} {"train_loss": -11.73586654663086, "global_step": 320319, "epoch": 1906} {"train_loss": -11.97517204284668, "global_step": 320320, "epoch": 1906} {"train_loss": -11.903388977050781, "global_step": 320321, "epoch": 1906} {"train_loss": -12.083320617675781, "global_step": 320322, "epoch": 1906} {"train_loss": -12.046733856201172, "global_step": 320323, "epoch": 1906} {"train_loss": -12.060510635375977, "global_step": 320324, "epoch": 1906} {"train_loss": -11.879007339477539, "global_step": 320325, "epoch": 1906} {"train_loss": -12.286372184753418, "global_step": 320326, "epoch": 1906} {"train_loss": -11.775928497314453, "global_step": 320327, "epoch": 1906} {"train_loss": -11.952608108520508, "global_step": 320328, "epoch": 1906} {"train_loss": -12.198688507080078, "global_step": 320329, "epoch": 1906} {"train_loss": -11.64348030090332, "global_step": 320330, "epoch": 1906} {"train_loss": -12.096160888671875, "global_step": 320331, "epoch": 1906} {"train_loss": -11.952582359313965, "global_step": 320332, "epoch": 1906} {"train_loss": -12.099800109863281, "global_step": 320333, "epoch": 1906} {"train_loss": -12.08234977722168, "global_step": 320334, "epoch": 1906} {"train_loss": -12.09732437133789, "global_step": 320335, "epoch": 1906} {"train_loss": -12.153448104858398, "global_step": 320336, "epoch": 1906} {"train_loss": -12.076620101928711, "global_step": 320337, "epoch": 1906} {"train_loss": -12.019939422607422, "global_step": 320338, "epoch": 1906} {"train_loss": -11.885711669921875, "global_step": 320339, "epoch": 1906} {"train_loss": -11.964179992675781, "global_step": 320340, "epoch": 1906} {"train_loss": -12.069477081298828, "global_step": 320341, "epoch": 1906} {"train_loss": -12.255279541015625, "global_step": 320342, "epoch": 1906} {"train_loss": -12.396448135375977, "global_step": 320343, "epoch": 1906} {"train_loss": -12.288681030273438, "global_step": 320344, "epoch": 1906} {"train_loss": -12.33216667175293, "global_step": 320345, "epoch": 1906} {"train_loss": -12.099851608276367, "global_step": 320346, "epoch": 1906} {"train_loss": -12.257450103759766, "global_step": 320347, "epoch": 1906} {"train_loss": -12.135262489318848, "global_step": 320348, "epoch": 1906} {"train_loss": -12.232210159301758, "global_step": 320349, "epoch": 1906} {"train_loss": -12.154654502868652, "global_step": 320350, "epoch": 1906} {"train_loss": -12.268800735473633, "global_step": 320351, "epoch": 1906} {"train_loss": -12.334211349487305, "global_step": 320352, "epoch": 1906} {"train_loss": -12.200273513793945, "global_step": 320353, "epoch": 1906} {"train_loss": -11.893078804016113, "global_step": 320354, "epoch": 1906} {"train_loss": -12.06009292602539, "global_step": 320355, "epoch": 1906} {"train_loss": -11.851447105407715, "global_step": 320356, "epoch": 1906} {"train_loss": -12.296625137329102, "global_step": 320357, "epoch": 1906} {"train_loss": -12.303365707397461, "global_step": 320358, "epoch": 1906} {"train_loss": -12.199795722961426, "global_step": 320359, "epoch": 1906} {"train_loss": -11.806207656860352, "global_step": 320360, "epoch": 1906} {"train_loss": -11.872802734375, "global_step": 320361, "epoch": 1906} {"train_loss": -12.180293083190918, "global_step": 320362, "epoch": 1906} {"train_loss": -11.924591064453125, "global_step": 320363, "epoch": 1906} {"train_loss": -11.739776611328125, "global_step": 320364, "epoch": 1906} {"train_loss": -12.386885643005371, "global_step": 320365, "epoch": 1906} {"train_loss": -12.137929916381836, "global_step": 320366, "epoch": 1906} {"train_loss": -11.794952392578125, "global_step": 320367, "epoch": 1906} {"train_loss": -11.925324440002441, "global_step": 320368, "epoch": 1906} {"train_loss": -11.959734916687012, "global_step": 320369, "epoch": 1906} {"train_loss": -11.822053909301758, "global_step": 320370, "epoch": 1906} {"train_loss": -11.832608222961426, "global_step": 320371, "epoch": 1906} {"train_loss": -11.799592971801758, "global_step": 320372, "epoch": 1906} {"train_loss": -11.293805122375488, "global_step": 320373, "epoch": 1906} {"train_loss": -12.362371444702148, "global_step": 320374, "epoch": 1906} {"train_loss": -11.792661439804803, "global_step": 320375, "epoch": 1906, "val_loss": 282336.25} {"train_loss": -11.79061508178711, "global_step": 320376, "epoch": 1907} {"train_loss": -12.192604064941406, "global_step": 320377, "epoch": 1907} {"train_loss": -11.938362121582031, "global_step": 320378, "epoch": 1907} {"train_loss": -12.058887481689453, "global_step": 320379, "epoch": 1907} {"train_loss": -11.847472190856934, "global_step": 320380, "epoch": 1907} {"train_loss": -12.212947845458984, "global_step": 320381, "epoch": 1907} {"train_loss": -12.20195198059082, "global_step": 320382, "epoch": 1907} {"train_loss": -12.285106658935547, "global_step": 320383, "epoch": 1907} {"train_loss": -12.111376762390137, "global_step": 320384, "epoch": 1907} {"train_loss": -11.840309143066406, "global_step": 320385, "epoch": 1907} {"train_loss": -12.265369415283203, "global_step": 320386, "epoch": 1907} {"train_loss": -12.249092102050781, "global_step": 320387, "epoch": 1907} {"train_loss": -12.198960304260254, "global_step": 320388, "epoch": 1907} {"train_loss": -12.132369995117188, "global_step": 320389, "epoch": 1907} {"train_loss": -11.714552879333496, "global_step": 320390, "epoch": 1907} {"train_loss": -12.069029808044434, "global_step": 320391, "epoch": 1907} {"train_loss": -11.977684020996094, "global_step": 320392, "epoch": 1907} {"train_loss": -12.467796325683594, "global_step": 320393, "epoch": 1907} {"train_loss": -11.784327507019043, "global_step": 320394, "epoch": 1907} {"train_loss": -12.325822830200195, "global_step": 320395, "epoch": 1907} {"train_loss": -12.413161277770996, "global_step": 320396, "epoch": 1907} {"train_loss": -11.949735641479492, "global_step": 320397, "epoch": 1907} {"train_loss": -11.971939086914062, "global_step": 320398, "epoch": 1907} {"train_loss": -12.284805297851562, "global_step": 320399, "epoch": 1907} {"train_loss": -11.283292770385742, "global_step": 320400, "epoch": 1907} {"train_loss": -11.650678634643555, "global_step": 320401, "epoch": 1907} {"train_loss": -12.177728652954102, "global_step": 320402, "epoch": 1907} {"train_loss": -11.466455459594727, "global_step": 320403, "epoch": 1907} {"train_loss": -11.130218505859375, "global_step": 320404, "epoch": 1907} {"train_loss": -11.252443313598633, "global_step": 320405, "epoch": 1907} {"train_loss": -11.832563400268555, "global_step": 320406, "epoch": 1907} {"train_loss": -11.043259620666504, "global_step": 320407, "epoch": 1907} {"train_loss": -11.406003952026367, "global_step": 320408, "epoch": 1907} {"train_loss": -12.024755477905273, "global_step": 320409, "epoch": 1907} {"train_loss": -11.093337059020996, "global_step": 320410, "epoch": 1907} {"train_loss": -11.04476547241211, "global_step": 320411, "epoch": 1907} {"train_loss": -11.652154922485352, "global_step": 320412, "epoch": 1907} {"train_loss": -10.677885055541992, "global_step": 320413, "epoch": 1907} {"train_loss": -10.504619598388672, "global_step": 320414, "epoch": 1907} {"train_loss": -11.412884712219238, "global_step": 320415, "epoch": 1907} {"train_loss": -9.892803192138672, "global_step": 320416, "epoch": 1907} {"train_loss": -10.243728637695312, "global_step": 320417, "epoch": 1907} {"train_loss": -11.038490295410156, "global_step": 320418, "epoch": 1907} {"train_loss": -9.932332038879395, "global_step": 320419, "epoch": 1907} {"train_loss": -11.209774017333984, "global_step": 320420, "epoch": 1907} {"train_loss": -10.972633361816406, "global_step": 320421, "epoch": 1907} {"train_loss": -10.102370262145996, "global_step": 320422, "epoch": 1907} {"train_loss": -11.441757202148438, "global_step": 320423, "epoch": 1907} {"train_loss": -10.012781143188477, "global_step": 320424, "epoch": 1907} {"train_loss": -11.22792911529541, "global_step": 320425, "epoch": 1907} {"train_loss": -11.02629280090332, "global_step": 320426, "epoch": 1907} {"train_loss": -11.39926815032959, "global_step": 320427, "epoch": 1907} {"train_loss": -11.396503448486328, "global_step": 320428, "epoch": 1907} {"train_loss": -11.09164810180664, "global_step": 320429, "epoch": 1907} {"train_loss": -11.443563461303711, "global_step": 320430, "epoch": 1907} {"train_loss": -11.350345611572266, "global_step": 320431, "epoch": 1907} {"train_loss": -11.506170272827148, "global_step": 320432, "epoch": 1907} {"train_loss": -11.678550720214844, "global_step": 320433, "epoch": 1907} {"train_loss": -11.19927978515625, "global_step": 320434, "epoch": 1907} {"train_loss": -11.667529106140137, "global_step": 320435, "epoch": 1907} {"train_loss": -11.712724685668945, "global_step": 320436, "epoch": 1907} {"train_loss": -11.807437896728516, "global_step": 320437, "epoch": 1907} {"train_loss": -11.860435485839844, "global_step": 320438, "epoch": 1907} {"train_loss": -11.960599899291992, "global_step": 320439, "epoch": 1907} {"train_loss": -11.94357681274414, "global_step": 320440, "epoch": 1907} {"train_loss": -11.91592788696289, "global_step": 320441, "epoch": 1907} {"train_loss": -11.923280715942383, "global_step": 320442, "epoch": 1907} {"train_loss": -11.891746520996094, "global_step": 320443, "epoch": 1907} {"train_loss": -11.932666778564453, "global_step": 320444, "epoch": 1907} {"train_loss": -11.87204360961914, "global_step": 320445, "epoch": 1907} {"train_loss": -12.178524017333984, "global_step": 320446, "epoch": 1907} {"train_loss": -11.951164245605469, "global_step": 320447, "epoch": 1907} {"train_loss": -11.981101989746094, "global_step": 320448, "epoch": 1907} {"train_loss": -11.862174034118652, "global_step": 320449, "epoch": 1907} {"train_loss": -12.073076248168945, "global_step": 320450, "epoch": 1907} {"train_loss": -12.00602912902832, "global_step": 320451, "epoch": 1907} {"train_loss": -12.197277069091797, "global_step": 320452, "epoch": 1907} {"train_loss": -12.053977966308594, "global_step": 320453, "epoch": 1907} {"train_loss": -11.708145141601562, "global_step": 320454, "epoch": 1907} {"train_loss": -12.332330703735352, "global_step": 320455, "epoch": 1907} {"train_loss": -12.233753204345703, "global_step": 320456, "epoch": 1907} {"train_loss": -12.477561950683594, "global_step": 320457, "epoch": 1907} {"train_loss": -12.321052551269531, "global_step": 320458, "epoch": 1907} {"train_loss": -12.09667682647705, "global_step": 320459, "epoch": 1907} {"train_loss": -12.220161437988281, "global_step": 320460, "epoch": 1907} {"train_loss": -12.33731460571289, "global_step": 320461, "epoch": 1907} {"train_loss": -12.381241798400879, "global_step": 320462, "epoch": 1907} {"train_loss": -12.307071685791016, "global_step": 320463, "epoch": 1907} {"train_loss": -12.186123847961426, "global_step": 320464, "epoch": 1907} {"train_loss": -12.196520805358887, "global_step": 320465, "epoch": 1907} {"train_loss": -12.231206893920898, "global_step": 320466, "epoch": 1907} {"train_loss": -12.42448616027832, "global_step": 320467, "epoch": 1907} {"train_loss": -12.21247673034668, "global_step": 320468, "epoch": 1907} {"train_loss": -12.393777847290039, "global_step": 320469, "epoch": 1907} {"train_loss": -12.199831008911133, "global_step": 320470, "epoch": 1907} {"train_loss": -11.960210800170898, "global_step": 320471, "epoch": 1907} {"train_loss": -12.366979598999023, "global_step": 320472, "epoch": 1907} {"train_loss": -12.402107238769531, "global_step": 320473, "epoch": 1907} {"train_loss": -12.419915199279785, "global_step": 320474, "epoch": 1907} {"train_loss": -12.29201889038086, "global_step": 320475, "epoch": 1907} {"train_loss": -12.400337219238281, "global_step": 320476, "epoch": 1907} {"train_loss": -12.492745399475098, "global_step": 320477, "epoch": 1907} {"train_loss": -12.481378555297852, "global_step": 320478, "epoch": 1907} {"train_loss": -12.295154571533203, "global_step": 320479, "epoch": 1907} {"train_loss": -12.551509857177734, "global_step": 320480, "epoch": 1907} {"train_loss": -12.49421501159668, "global_step": 320481, "epoch": 1907} {"train_loss": -12.564376831054688, "global_step": 320482, "epoch": 1907} {"train_loss": -12.261054992675781, "global_step": 320483, "epoch": 1907} {"train_loss": -12.51045036315918, "global_step": 320484, "epoch": 1907} {"train_loss": -12.314146041870117, "global_step": 320485, "epoch": 1907} {"train_loss": -12.43460464477539, "global_step": 320486, "epoch": 1907} {"train_loss": -12.37039852142334, "global_step": 320487, "epoch": 1907} {"train_loss": -12.201775550842285, "global_step": 320488, "epoch": 1907} {"train_loss": -12.454890251159668, "global_step": 320489, "epoch": 1907} {"train_loss": -12.40469741821289, "global_step": 320490, "epoch": 1907} {"train_loss": -12.483515739440918, "global_step": 320491, "epoch": 1907} {"train_loss": -12.31123161315918, "global_step": 320492, "epoch": 1907} {"train_loss": -12.598143577575684, "global_step": 320493, "epoch": 1907} {"train_loss": -12.235504150390625, "global_step": 320494, "epoch": 1907} {"train_loss": -12.489100456237793, "global_step": 320495, "epoch": 1907} {"train_loss": -12.683672904968262, "global_step": 320496, "epoch": 1907} {"train_loss": -12.44680118560791, "global_step": 320497, "epoch": 1907} {"train_loss": -12.627191543579102, "global_step": 320498, "epoch": 1907} {"train_loss": -12.367185592651367, "global_step": 320499, "epoch": 1907} {"train_loss": -12.272844314575195, "global_step": 320500, "epoch": 1907} {"train_loss": -11.981712341308594, "global_step": 320501, "epoch": 1907} {"train_loss": -12.157403945922852, "global_step": 320502, "epoch": 1907} {"train_loss": -12.296720504760742, "global_step": 320503, "epoch": 1907} {"train_loss": -12.299123764038086, "global_step": 320504, "epoch": 1907} {"train_loss": -12.293139457702637, "global_step": 320505, "epoch": 1907} {"train_loss": -12.026138305664062, "global_step": 320506, "epoch": 1907} {"train_loss": -12.433658599853516, "global_step": 320507, "epoch": 1907} {"train_loss": -11.995765686035156, "global_step": 320508, "epoch": 1907} {"train_loss": -12.52886962890625, "global_step": 320509, "epoch": 1907} {"train_loss": -12.249950408935547, "global_step": 320510, "epoch": 1907} {"train_loss": -12.520133018493652, "global_step": 320511, "epoch": 1907} {"train_loss": -11.92587947845459, "global_step": 320512, "epoch": 1907} {"train_loss": -11.856293678283691, "global_step": 320513, "epoch": 1907} {"train_loss": -11.700916290283203, "global_step": 320514, "epoch": 1907} {"train_loss": -12.25752067565918, "global_step": 320515, "epoch": 1907} {"train_loss": -12.485116958618164, "global_step": 320516, "epoch": 1907} {"train_loss": -11.58542251586914, "global_step": 320517, "epoch": 1907} {"train_loss": -11.931188583374023, "global_step": 320518, "epoch": 1907} {"train_loss": -12.139159202575684, "global_step": 320519, "epoch": 1907} {"train_loss": -12.05160903930664, "global_step": 320520, "epoch": 1907} {"train_loss": -12.186644554138184, "global_step": 320521, "epoch": 1907} {"train_loss": -11.021312713623047, "global_step": 320522, "epoch": 1907} {"train_loss": -12.027793884277344, "global_step": 320523, "epoch": 1907} {"train_loss": -12.033260345458984, "global_step": 320524, "epoch": 1907} {"train_loss": -12.039552688598633, "global_step": 320525, "epoch": 1907} {"train_loss": -11.821088790893555, "global_step": 320526, "epoch": 1907} {"train_loss": -11.514962196350098, "global_step": 320527, "epoch": 1907} {"train_loss": -11.556310653686523, "global_step": 320528, "epoch": 1907} {"train_loss": -11.893736839294434, "global_step": 320529, "epoch": 1907} {"train_loss": -12.091935157775879, "global_step": 320530, "epoch": 1907} {"train_loss": -11.347301483154297, "global_step": 320531, "epoch": 1907} {"train_loss": -11.715803146362305, "global_step": 320532, "epoch": 1907} {"train_loss": -11.558164596557617, "global_step": 320533, "epoch": 1907} {"train_loss": -12.161301612854004, "global_step": 320534, "epoch": 1907} {"train_loss": -12.119976043701172, "global_step": 320535, "epoch": 1907} {"train_loss": -12.183944702148438, "global_step": 320536, "epoch": 1907} {"train_loss": -12.054075241088867, "global_step": 320537, "epoch": 1907} {"train_loss": -12.131246566772461, "global_step": 320538, "epoch": 1907} {"train_loss": -11.889415740966797, "global_step": 320539, "epoch": 1907} {"train_loss": -11.561799049377441, "global_step": 320540, "epoch": 1907} {"train_loss": -11.681135177612305, "global_step": 320541, "epoch": 1907} {"train_loss": -11.610584259033203, "global_step": 320542, "epoch": 1907} {"train_loss": -11.910030069805327, "global_step": 320543, "epoch": 1907, "val_loss": 284495.625} {"train_loss": -11.384988784790039, "global_step": 320544, "epoch": 1908} {"train_loss": -10.694780349731445, "global_step": 320545, "epoch": 1908} {"train_loss": -11.143853187561035, "global_step": 320546, "epoch": 1908} {"train_loss": -10.317522048950195, "global_step": 320547, "epoch": 1908} {"train_loss": -10.293118476867676, "global_step": 320548, "epoch": 1908} {"train_loss": -9.370668411254883, "global_step": 320549, "epoch": 1908} {"train_loss": -10.40997314453125, "global_step": 320550, "epoch": 1908} {"train_loss": -9.482419967651367, "global_step": 320551, "epoch": 1908} {"train_loss": -8.192176818847656, "global_step": 320552, "epoch": 1908} {"train_loss": -8.439240455627441, "global_step": 320553, "epoch": 1908} {"train_loss": -8.088397979736328, "global_step": 320554, "epoch": 1908} {"train_loss": -7.130539894104004, "global_step": 320555, "epoch": 1908} {"train_loss": -8.116628646850586, "global_step": 320556, "epoch": 1908} {"train_loss": -8.366048812866211, "global_step": 320557, "epoch": 1908} {"train_loss": -8.786547660827637, "global_step": 320558, "epoch": 1908} {"train_loss": -9.444114685058594, "global_step": 320559, "epoch": 1908} {"train_loss": -8.804376602172852, "global_step": 320560, "epoch": 1908} {"train_loss": -9.310723304748535, "global_step": 320561, "epoch": 1908} {"train_loss": -9.679420471191406, "global_step": 320562, "epoch": 1908} {"train_loss": -10.884078025817871, "global_step": 320563, "epoch": 1908} {"train_loss": -10.143956184387207, "global_step": 320564, "epoch": 1908} {"train_loss": -10.907052993774414, "global_step": 320565, "epoch": 1908} {"train_loss": -10.306917190551758, "global_step": 320566, "epoch": 1908} {"train_loss": -11.41379165649414, "global_step": 320567, "epoch": 1908} {"train_loss": -10.972806930541992, "global_step": 320568, "epoch": 1908} {"train_loss": -10.911136627197266, "global_step": 320569, "epoch": 1908} {"train_loss": -10.989206314086914, "global_step": 320570, "epoch": 1908} {"train_loss": -10.744156837463379, "global_step": 320571, "epoch": 1908} {"train_loss": -11.359436988830566, "global_step": 320572, "epoch": 1908} {"train_loss": -11.585945129394531, "global_step": 320573, "epoch": 1908} {"train_loss": -11.390974044799805, "global_step": 320574, "epoch": 1908} {"train_loss": -11.350383758544922, "global_step": 320575, "epoch": 1908} {"train_loss": -11.407779693603516, "global_step": 320576, "epoch": 1908} {"train_loss": -11.317730903625488, "global_step": 320577, "epoch": 1908} {"train_loss": -11.666650772094727, "global_step": 320578, "epoch": 1908} {"train_loss": -11.433030128479004, "global_step": 320579, "epoch": 1908} {"train_loss": -11.875618934631348, "global_step": 320580, "epoch": 1908} {"train_loss": -11.712987899780273, "global_step": 320581, "epoch": 1908} {"train_loss": -11.63514518737793, "global_step": 320582, "epoch": 1908} {"train_loss": -12.046041488647461, "global_step": 320583, "epoch": 1908} {"train_loss": -11.716819763183594, "global_step": 320584, "epoch": 1908} {"train_loss": -11.494189262390137, "global_step": 320585, "epoch": 1908} {"train_loss": -11.796113014221191, "global_step": 320586, "epoch": 1908} {"train_loss": -11.546554565429688, "global_step": 320587, "epoch": 1908} {"train_loss": -11.949284553527832, "global_step": 320588, "epoch": 1908} {"train_loss": -12.056539535522461, "global_step": 320589, "epoch": 1908} {"train_loss": -11.59968376159668, "global_step": 320590, "epoch": 1908} {"train_loss": -11.530048370361328, "global_step": 320591, "epoch": 1908} {"train_loss": -11.789411544799805, "global_step": 320592, "epoch": 1908} {"train_loss": -11.681439399719238, "global_step": 320593, "epoch": 1908} {"train_loss": -11.603706359863281, "global_step": 320594, "epoch": 1908} {"train_loss": -12.097000122070312, "global_step": 320595, "epoch": 1908} {"train_loss": -11.578322410583496, "global_step": 320596, "epoch": 1908} {"train_loss": -11.970766067504883, "global_step": 320597, "epoch": 1908} {"train_loss": -11.905416488647461, "global_step": 320598, "epoch": 1908} {"train_loss": -11.730687141418457, "global_step": 320599, "epoch": 1908} {"train_loss": -11.999114990234375, "global_step": 320600, "epoch": 1908} {"train_loss": -11.674934387207031, "global_step": 320601, "epoch": 1908} {"train_loss": -12.128824234008789, "global_step": 320602, "epoch": 1908} {"train_loss": -11.836442947387695, "global_step": 320603, "epoch": 1908} {"train_loss": -11.996018409729004, "global_step": 320604, "epoch": 1908} {"train_loss": -12.042457580566406, "global_step": 320605, "epoch": 1908} {"train_loss": -12.052152633666992, "global_step": 320606, "epoch": 1908} {"train_loss": -11.984118461608887, "global_step": 320607, "epoch": 1908} {"train_loss": -12.348638534545898, "global_step": 320608, "epoch": 1908} {"train_loss": -11.925752639770508, "global_step": 320609, "epoch": 1908} {"train_loss": -12.219018936157227, "global_step": 320610, "epoch": 1908} {"train_loss": -12.074613571166992, "global_step": 320611, "epoch": 1908} {"train_loss": -12.125324249267578, "global_step": 320612, "epoch": 1908} {"train_loss": -12.318428993225098, "global_step": 320613, "epoch": 1908} {"train_loss": -12.235393524169922, "global_step": 320614, "epoch": 1908} {"train_loss": -12.305320739746094, "global_step": 320615, "epoch": 1908} {"train_loss": -12.094491958618164, "global_step": 320616, "epoch": 1908} {"train_loss": -12.150217056274414, "global_step": 320617, "epoch": 1908} {"train_loss": -12.03668212890625, "global_step": 320618, "epoch": 1908} {"train_loss": -12.3676118850708, "global_step": 320619, "epoch": 1908} {"train_loss": -12.28985595703125, "global_step": 320620, "epoch": 1908} {"train_loss": -12.29063606262207, "global_step": 320621, "epoch": 1908} {"train_loss": -12.134952545166016, "global_step": 320622, "epoch": 1908} {"train_loss": -12.031982421875, "global_step": 320623, "epoch": 1908} {"train_loss": -12.338350296020508, "global_step": 320624, "epoch": 1908} {"train_loss": -12.244756698608398, "global_step": 320625, "epoch": 1908} {"train_loss": -12.286436080932617, "global_step": 320626, "epoch": 1908} {"train_loss": -12.337346076965332, "global_step": 320627, "epoch": 1908} {"train_loss": -11.58698558807373, "global_step": 320628, "epoch": 1908} {"train_loss": -12.268847465515137, "global_step": 320629, "epoch": 1908} {"train_loss": -11.99262809753418, "global_step": 320630, "epoch": 1908} {"train_loss": -11.946680068969727, "global_step": 320631, "epoch": 1908} {"train_loss": -12.218585968017578, "global_step": 320632, "epoch": 1908} {"train_loss": -11.751781463623047, "global_step": 320633, "epoch": 1908} {"train_loss": -11.454704284667969, "global_step": 320634, "epoch": 1908} {"train_loss": -12.205354690551758, "global_step": 320635, "epoch": 1908} {"train_loss": -11.359054565429688, "global_step": 320636, "epoch": 1908} {"train_loss": -12.047581672668457, "global_step": 320637, "epoch": 1908} {"train_loss": -11.985541343688965, "global_step": 320638, "epoch": 1908} {"train_loss": -11.390743255615234, "global_step": 320639, "epoch": 1908} {"train_loss": -12.322591781616211, "global_step": 320640, "epoch": 1908} {"train_loss": -11.505890846252441, "global_step": 320641, "epoch": 1908} {"train_loss": -12.179100036621094, "global_step": 320642, "epoch": 1908} {"train_loss": -12.019241333007812, "global_step": 320643, "epoch": 1908} {"train_loss": -11.789501190185547, "global_step": 320644, "epoch": 1908} {"train_loss": -12.107138633728027, "global_step": 320645, "epoch": 1908} {"train_loss": -11.903118133544922, "global_step": 320646, "epoch": 1908} {"train_loss": -11.58884048461914, "global_step": 320647, "epoch": 1908} {"train_loss": -12.113128662109375, "global_step": 320648, "epoch": 1908} {"train_loss": -11.844879150390625, "global_step": 320649, "epoch": 1908} {"train_loss": -11.942304611206055, "global_step": 320650, "epoch": 1908} {"train_loss": -12.379596710205078, "global_step": 320651, "epoch": 1908} {"train_loss": -11.987305641174316, "global_step": 320652, "epoch": 1908} {"train_loss": -12.440614700317383, "global_step": 320653, "epoch": 1908} {"train_loss": -12.423646926879883, "global_step": 320654, "epoch": 1908} {"train_loss": -12.164347648620605, "global_step": 320655, "epoch": 1908} {"train_loss": -12.332923889160156, "global_step": 320656, "epoch": 1908} {"train_loss": -12.54643440246582, "global_step": 320657, "epoch": 1908} {"train_loss": -12.490934371948242, "global_step": 320658, "epoch": 1908} {"train_loss": -12.135527610778809, "global_step": 320659, "epoch": 1908} {"train_loss": -12.136544227600098, "global_step": 320660, "epoch": 1908} {"train_loss": -12.200149536132812, "global_step": 320661, "epoch": 1908} {"train_loss": -12.449261665344238, "global_step": 320662, "epoch": 1908} {"train_loss": -12.108049392700195, "global_step": 320663, "epoch": 1908} {"train_loss": -12.277971267700195, "global_step": 320664, "epoch": 1908} {"train_loss": -12.141298294067383, "global_step": 320665, "epoch": 1908} {"train_loss": -12.47100830078125, "global_step": 320666, "epoch": 1908} {"train_loss": -12.183332443237305, "global_step": 320667, "epoch": 1908} {"train_loss": -12.030890464782715, "global_step": 320668, "epoch": 1908} {"train_loss": -12.24074935913086, "global_step": 320669, "epoch": 1908} {"train_loss": -11.918392181396484, "global_step": 320670, "epoch": 1908} {"train_loss": -12.292027473449707, "global_step": 320671, "epoch": 1908} {"train_loss": -12.569075584411621, "global_step": 320672, "epoch": 1908} {"train_loss": -11.62339973449707, "global_step": 320673, "epoch": 1908} {"train_loss": -12.124652862548828, "global_step": 320674, "epoch": 1908} {"train_loss": -11.999594688415527, "global_step": 320675, "epoch": 1908} {"train_loss": -12.198572158813477, "global_step": 320676, "epoch": 1908} {"train_loss": -12.319476127624512, "global_step": 320677, "epoch": 1908} {"train_loss": -12.244110107421875, "global_step": 320678, "epoch": 1908} {"train_loss": -11.80244255065918, "global_step": 320679, "epoch": 1908} {"train_loss": -11.726264953613281, "global_step": 320680, "epoch": 1908} {"train_loss": -12.069674491882324, "global_step": 320681, "epoch": 1908} {"train_loss": -10.701499938964844, "global_step": 320682, "epoch": 1908} {"train_loss": -11.50473403930664, "global_step": 320683, "epoch": 1908} {"train_loss": -9.85440731048584, "global_step": 320684, "epoch": 1908} {"train_loss": -10.82099437713623, "global_step": 320685, "epoch": 1908} {"train_loss": -11.066558837890625, "global_step": 320686, "epoch": 1908} {"train_loss": -10.297014236450195, "global_step": 320687, "epoch": 1908} {"train_loss": -11.956762313842773, "global_step": 320688, "epoch": 1908} {"train_loss": -9.987417221069336, "global_step": 320689, "epoch": 1908} {"train_loss": -11.884208679199219, "global_step": 320690, "epoch": 1908} {"train_loss": -11.334550857543945, "global_step": 320691, "epoch": 1908} {"train_loss": -10.908306121826172, "global_step": 320692, "epoch": 1908} {"train_loss": -11.922011375427246, "global_step": 320693, "epoch": 1908} {"train_loss": -10.497102737426758, "global_step": 320694, "epoch": 1908} {"train_loss": -11.47719955444336, "global_step": 320695, "epoch": 1908} {"train_loss": -11.013914108276367, "global_step": 320696, "epoch": 1908} {"train_loss": -10.879936218261719, "global_step": 320697, "epoch": 1908} {"train_loss": -11.130131721496582, "global_step": 320698, "epoch": 1908} {"train_loss": -9.568021774291992, "global_step": 320699, "epoch": 1908} {"train_loss": -12.086448669433594, "global_step": 320700, "epoch": 1908} {"train_loss": -10.760805130004883, "global_step": 320701, "epoch": 1908} {"train_loss": -11.800426483154297, "global_step": 320702, "epoch": 1908} {"train_loss": -10.756379127502441, "global_step": 320703, "epoch": 1908} {"train_loss": -11.253061294555664, "global_step": 320704, "epoch": 1908} {"train_loss": -11.383721351623535, "global_step": 320705, "epoch": 1908} {"train_loss": -11.236205101013184, "global_step": 320706, "epoch": 1908} {"train_loss": -12.036112785339355, "global_step": 320707, "epoch": 1908} {"train_loss": -11.466331481933594, "global_step": 320708, "epoch": 1908} {"train_loss": -11.361791610717773, "global_step": 320709, "epoch": 1908} {"train_loss": -11.845539093017578, "global_step": 320710, "epoch": 1908} {"train_loss": -11.471411409832182, "global_step": 320711, "epoch": 1908, "val_loss": 286287.09375} {"train_loss": -11.797904014587402, "global_step": 320712, "epoch": 1909} {"train_loss": -11.507184982299805, "global_step": 320713, "epoch": 1909} {"train_loss": -11.487336158752441, "global_step": 320714, "epoch": 1909} {"train_loss": -11.226577758789062, "global_step": 320715, "epoch": 1909} {"train_loss": -11.184978485107422, "global_step": 320716, "epoch": 1909} {"train_loss": -11.584081649780273, "global_step": 320717, "epoch": 1909} {"train_loss": -10.982394218444824, "global_step": 320718, "epoch": 1909} {"train_loss": -11.570525169372559, "global_step": 320719, "epoch": 1909} {"train_loss": -11.22967529296875, "global_step": 320720, "epoch": 1909} {"train_loss": -11.766457557678223, "global_step": 320721, "epoch": 1909} {"train_loss": -11.127374649047852, "global_step": 320722, "epoch": 1909} {"train_loss": -11.690094947814941, "global_step": 320723, "epoch": 1909} {"train_loss": -11.562225341796875, "global_step": 320724, "epoch": 1909} {"train_loss": -10.994217872619629, "global_step": 320725, "epoch": 1909} {"train_loss": -11.692789077758789, "global_step": 320726, "epoch": 1909} {"train_loss": -11.002767562866211, "global_step": 320727, "epoch": 1909} {"train_loss": -11.916783332824707, "global_step": 320728, "epoch": 1909} {"train_loss": -11.063450813293457, "global_step": 320729, "epoch": 1909} {"train_loss": -11.7941312789917, "global_step": 320730, "epoch": 1909} {"train_loss": -11.099813461303711, "global_step": 320731, "epoch": 1909} {"train_loss": -11.759265899658203, "global_step": 320732, "epoch": 1909} {"train_loss": -11.256591796875, "global_step": 320733, "epoch": 1909} {"train_loss": -12.144378662109375, "global_step": 320734, "epoch": 1909} {"train_loss": -11.396675109863281, "global_step": 320735, "epoch": 1909} {"train_loss": -12.153037071228027, "global_step": 320736, "epoch": 1909} {"train_loss": -10.799002647399902, "global_step": 320737, "epoch": 1909} {"train_loss": -11.957117080688477, "global_step": 320738, "epoch": 1909} {"train_loss": -11.343223571777344, "global_step": 320739, "epoch": 1909} {"train_loss": -11.946584701538086, "global_step": 320740, "epoch": 1909} {"train_loss": -11.520238876342773, "global_step": 320741, "epoch": 1909} {"train_loss": -12.240035057067871, "global_step": 320742, "epoch": 1909} {"train_loss": -11.457113265991211, "global_step": 320743, "epoch": 1909} {"train_loss": -12.205480575561523, "global_step": 320744, "epoch": 1909} {"train_loss": -11.820396423339844, "global_step": 320745, "epoch": 1909} {"train_loss": -12.057300567626953, "global_step": 320746, "epoch": 1909} {"train_loss": -11.995969772338867, "global_step": 320747, "epoch": 1909} {"train_loss": -11.938630104064941, "global_step": 320748, "epoch": 1909} {"train_loss": -11.776363372802734, "global_step": 320749, "epoch": 1909} {"train_loss": -12.052505493164062, "global_step": 320750, "epoch": 1909} {"train_loss": -11.936616897583008, "global_step": 320751, "epoch": 1909} {"train_loss": -12.14548110961914, "global_step": 320752, "epoch": 1909} {"train_loss": -12.17299747467041, "global_step": 320753, "epoch": 1909} {"train_loss": -12.184518814086914, "global_step": 320754, "epoch": 1909} {"train_loss": -12.169380187988281, "global_step": 320755, "epoch": 1909} {"train_loss": -12.075284004211426, "global_step": 320756, "epoch": 1909} {"train_loss": -12.48744010925293, "global_step": 320757, "epoch": 1909} {"train_loss": -12.168977737426758, "global_step": 320758, "epoch": 1909} {"train_loss": -12.235968589782715, "global_step": 320759, "epoch": 1909} {"train_loss": -12.310314178466797, "global_step": 320760, "epoch": 1909} {"train_loss": -12.26092529296875, "global_step": 320761, "epoch": 1909} {"train_loss": -12.314102172851562, "global_step": 320762, "epoch": 1909} {"train_loss": -12.390266418457031, "global_step": 320763, "epoch": 1909} {"train_loss": -12.344182968139648, "global_step": 320764, "epoch": 1909} {"train_loss": -11.878515243530273, "global_step": 320765, "epoch": 1909} {"train_loss": -12.403958320617676, "global_step": 320766, "epoch": 1909} {"train_loss": -12.35802936553955, "global_step": 320767, "epoch": 1909} {"train_loss": -12.336519241333008, "global_step": 320768, "epoch": 1909} {"train_loss": -12.444306373596191, "global_step": 320769, "epoch": 1909} {"train_loss": -12.271820068359375, "global_step": 320770, "epoch": 1909} {"train_loss": -12.302621841430664, "global_step": 320771, "epoch": 1909} {"train_loss": -12.180808067321777, "global_step": 320772, "epoch": 1909} {"train_loss": -12.049665451049805, "global_step": 320773, "epoch": 1909} {"train_loss": -12.246971130371094, "global_step": 320774, "epoch": 1909} {"train_loss": -12.395156860351562, "global_step": 320775, "epoch": 1909} {"train_loss": -12.522216796875, "global_step": 320776, "epoch": 1909} {"train_loss": -12.422670364379883, "global_step": 320777, "epoch": 1909} {"train_loss": -12.345357894897461, "global_step": 320778, "epoch": 1909} {"train_loss": -12.426229476928711, "global_step": 320779, "epoch": 1909} {"train_loss": -12.418907165527344, "global_step": 320780, "epoch": 1909} {"train_loss": -12.510961532592773, "global_step": 320781, "epoch": 1909} {"train_loss": -12.26216983795166, "global_step": 320782, "epoch": 1909} {"train_loss": -12.514410018920898, "global_step": 320783, "epoch": 1909} {"train_loss": -12.249717712402344, "global_step": 320784, "epoch": 1909} {"train_loss": -12.641444206237793, "global_step": 320785, "epoch": 1909} {"train_loss": -12.432453155517578, "global_step": 320786, "epoch": 1909} {"train_loss": -11.937312126159668, "global_step": 320787, "epoch": 1909} {"train_loss": -12.359245300292969, "global_step": 320788, "epoch": 1909} {"train_loss": -12.437097549438477, "global_step": 320789, "epoch": 1909} {"train_loss": -12.479393005371094, "global_step": 320790, "epoch": 1909} {"train_loss": -12.343830108642578, "global_step": 320791, "epoch": 1909} {"train_loss": -12.564001083374023, "global_step": 320792, "epoch": 1909} {"train_loss": -12.250919342041016, "global_step": 320793, "epoch": 1909} {"train_loss": -11.948888778686523, "global_step": 320794, "epoch": 1909} {"train_loss": -11.065431594848633, "global_step": 320795, "epoch": 1909} {"train_loss": -10.697246551513672, "global_step": 320796, "epoch": 1909} {"train_loss": -12.383271217346191, "global_step": 320797, "epoch": 1909} {"train_loss": -12.094954490661621, "global_step": 320798, "epoch": 1909} {"train_loss": -11.061043739318848, "global_step": 320799, "epoch": 1909} {"train_loss": -11.611721992492676, "global_step": 320800, "epoch": 1909} {"train_loss": -12.046436309814453, "global_step": 320801, "epoch": 1909} {"train_loss": -11.991155624389648, "global_step": 320802, "epoch": 1909} {"train_loss": -11.63674545288086, "global_step": 320803, "epoch": 1909} {"train_loss": -12.029806137084961, "global_step": 320804, "epoch": 1909} {"train_loss": -12.04711627960205, "global_step": 320805, "epoch": 1909} {"train_loss": -12.155698776245117, "global_step": 320806, "epoch": 1909} {"train_loss": -11.636124610900879, "global_step": 320807, "epoch": 1909} {"train_loss": -12.40993881225586, "global_step": 320808, "epoch": 1909} {"train_loss": -11.881278991699219, "global_step": 320809, "epoch": 1909} {"train_loss": -12.392544746398926, "global_step": 320810, "epoch": 1909} {"train_loss": -12.350563049316406, "global_step": 320811, "epoch": 1909} {"train_loss": -12.372087478637695, "global_step": 320812, "epoch": 1909} {"train_loss": -12.203922271728516, "global_step": 320813, "epoch": 1909} {"train_loss": -12.19914436340332, "global_step": 320814, "epoch": 1909} {"train_loss": -12.448104858398438, "global_step": 320815, "epoch": 1909} {"train_loss": -12.008523941040039, "global_step": 320816, "epoch": 1909} {"train_loss": -12.26471996307373, "global_step": 320817, "epoch": 1909} {"train_loss": -12.37183666229248, "global_step": 320818, "epoch": 1909} {"train_loss": -12.37126350402832, "global_step": 320819, "epoch": 1909} {"train_loss": -12.541918754577637, "global_step": 320820, "epoch": 1909} {"train_loss": -12.398880004882812, "global_step": 320821, "epoch": 1909} {"train_loss": -12.208375930786133, "global_step": 320822, "epoch": 1909} {"train_loss": -12.312164306640625, "global_step": 320823, "epoch": 1909} {"train_loss": -12.236263275146484, "global_step": 320824, "epoch": 1909} {"train_loss": -12.499083518981934, "global_step": 320825, "epoch": 1909} {"train_loss": -12.365214347839355, "global_step": 320826, "epoch": 1909} {"train_loss": -12.409845352172852, "global_step": 320827, "epoch": 1909} {"train_loss": -12.490327835083008, "global_step": 320828, "epoch": 1909} {"train_loss": -12.057889938354492, "global_step": 320829, "epoch": 1909} {"train_loss": -12.219539642333984, "global_step": 320830, "epoch": 1909} {"train_loss": -12.214776992797852, "global_step": 320831, "epoch": 1909} {"train_loss": -11.923133850097656, "global_step": 320832, "epoch": 1909} {"train_loss": -12.466445922851562, "global_step": 320833, "epoch": 1909} {"train_loss": -12.1375150680542, "global_step": 320834, "epoch": 1909} {"train_loss": -12.405515670776367, "global_step": 320835, "epoch": 1909} {"train_loss": -12.323378562927246, "global_step": 320836, "epoch": 1909} {"train_loss": -12.336499214172363, "global_step": 320837, "epoch": 1909} {"train_loss": -12.236976623535156, "global_step": 320838, "epoch": 1909} {"train_loss": -12.446739196777344, "global_step": 320839, "epoch": 1909} {"train_loss": -12.163641929626465, "global_step": 320840, "epoch": 1909} {"train_loss": -12.381243705749512, "global_step": 320841, "epoch": 1909} {"train_loss": -12.329999923706055, "global_step": 320842, "epoch": 1909} {"train_loss": -12.281715393066406, "global_step": 320843, "epoch": 1909} {"train_loss": -12.359024047851562, "global_step": 320844, "epoch": 1909} {"train_loss": -12.035307884216309, "global_step": 320845, "epoch": 1909} {"train_loss": -12.375635147094727, "global_step": 320846, "epoch": 1909} {"train_loss": -12.001866340637207, "global_step": 320847, "epoch": 1909} {"train_loss": -12.060707092285156, "global_step": 320848, "epoch": 1909} {"train_loss": -12.521591186523438, "global_step": 320849, "epoch": 1909} {"train_loss": -11.774293899536133, "global_step": 320850, "epoch": 1909} {"train_loss": -11.417022705078125, "global_step": 320851, "epoch": 1909} {"train_loss": -12.144075393676758, "global_step": 320852, "epoch": 1909} {"train_loss": -11.912668228149414, "global_step": 320853, "epoch": 1909} {"train_loss": -11.747986793518066, "global_step": 320854, "epoch": 1909} {"train_loss": -11.555978775024414, "global_step": 320855, "epoch": 1909} {"train_loss": -11.717117309570312, "global_step": 320856, "epoch": 1909} {"train_loss": -11.492836952209473, "global_step": 320857, "epoch": 1909} {"train_loss": -9.863260269165039, "global_step": 320858, "epoch": 1909} {"train_loss": -10.703916549682617, "global_step": 320859, "epoch": 1909} {"train_loss": -10.552506446838379, "global_step": 320860, "epoch": 1909} {"train_loss": -9.799753189086914, "global_step": 320861, "epoch": 1909} {"train_loss": -9.302083969116211, "global_step": 320862, "epoch": 1909} {"train_loss": -10.373212814331055, "global_step": 320863, "epoch": 1909} {"train_loss": -9.74416732788086, "global_step": 320864, "epoch": 1909} {"train_loss": -10.632776260375977, "global_step": 320865, "epoch": 1909} {"train_loss": -10.907835006713867, "global_step": 320866, "epoch": 1909} {"train_loss": -10.550033569335938, "global_step": 320867, "epoch": 1909} {"train_loss": -11.559242248535156, "global_step": 320868, "epoch": 1909} {"train_loss": -10.064672470092773, "global_step": 320869, "epoch": 1909} {"train_loss": -11.307218551635742, "global_step": 320870, "epoch": 1909} {"train_loss": -10.13670539855957, "global_step": 320871, "epoch": 1909} {"train_loss": -10.526945114135742, "global_step": 320872, "epoch": 1909} {"train_loss": -11.008563995361328, "global_step": 320873, "epoch": 1909} {"train_loss": -10.657657623291016, "global_step": 320874, "epoch": 1909} {"train_loss": -11.042651176452637, "global_step": 320875, "epoch": 1909} {"train_loss": -11.230203628540039, "global_step": 320876, "epoch": 1909} {"train_loss": -10.817885398864746, "global_step": 320877, "epoch": 1909} {"train_loss": -10.91807746887207, "global_step": 320878, "epoch": 1909} {"train_loss": -11.82540376413436, "global_step": 320879, "epoch": 1909, "val_loss": 280141.34375} {"train_loss": -10.998523712158203, "global_step": 320880, "epoch": 1910} {"train_loss": -9.261209487915039, "global_step": 320881, "epoch": 1910} {"train_loss": -11.2200927734375, "global_step": 320882, "epoch": 1910} {"train_loss": -9.591741561889648, "global_step": 320883, "epoch": 1910} {"train_loss": -9.311626434326172, "global_step": 320884, "epoch": 1910} {"train_loss": -10.58082389831543, "global_step": 320885, "epoch": 1910} {"train_loss": -9.353475570678711, "global_step": 320886, "epoch": 1910} {"train_loss": -8.955123901367188, "global_step": 320887, "epoch": 1910} {"train_loss": -10.319487571716309, "global_step": 320888, "epoch": 1910} {"train_loss": -10.489436149597168, "global_step": 320889, "epoch": 1910} {"train_loss": -10.164695739746094, "global_step": 320890, "epoch": 1910} {"train_loss": -10.906572341918945, "global_step": 320891, "epoch": 1910} {"train_loss": -10.19561767578125, "global_step": 320892, "epoch": 1910} {"train_loss": -10.350923538208008, "global_step": 320893, "epoch": 1910} {"train_loss": -10.780198097229004, "global_step": 320894, "epoch": 1910} {"train_loss": -9.49166488647461, "global_step": 320895, "epoch": 1910} {"train_loss": -11.388811111450195, "global_step": 320896, "epoch": 1910} {"train_loss": -10.561639785766602, "global_step": 320897, "epoch": 1910} {"train_loss": -10.725777626037598, "global_step": 320898, "epoch": 1910} {"train_loss": -11.017618179321289, "global_step": 320899, "epoch": 1910} {"train_loss": -10.758045196533203, "global_step": 320900, "epoch": 1910} {"train_loss": -10.894393920898438, "global_step": 320901, "epoch": 1910} {"train_loss": -10.883309364318848, "global_step": 320902, "epoch": 1910} {"train_loss": -10.726993560791016, "global_step": 320903, "epoch": 1910} {"train_loss": -10.766952514648438, "global_step": 320904, "epoch": 1910} {"train_loss": -10.695688247680664, "global_step": 320905, "epoch": 1910} {"train_loss": -10.11920166015625, "global_step": 320906, "epoch": 1910} {"train_loss": -10.994902610778809, "global_step": 320907, "epoch": 1910} {"train_loss": -11.063398361206055, "global_step": 320908, "epoch": 1910} {"train_loss": -10.469120025634766, "global_step": 320909, "epoch": 1910} {"train_loss": -11.696622848510742, "global_step": 320910, "epoch": 1910} {"train_loss": -10.636455535888672, "global_step": 320911, "epoch": 1910} {"train_loss": -11.265522003173828, "global_step": 320912, "epoch": 1910} {"train_loss": -11.01659107208252, "global_step": 320913, "epoch": 1910} {"train_loss": -11.536495208740234, "global_step": 320914, "epoch": 1910} {"train_loss": -11.077756881713867, "global_step": 320915, "epoch": 1910} {"train_loss": -11.260059356689453, "global_step": 320916, "epoch": 1910} {"train_loss": -11.464142799377441, "global_step": 320917, "epoch": 1910} {"train_loss": -11.267778396606445, "global_step": 320918, "epoch": 1910} {"train_loss": -11.722845077514648, "global_step": 320919, "epoch": 1910} {"train_loss": -11.281712532043457, "global_step": 320920, "epoch": 1910} {"train_loss": -11.377815246582031, "global_step": 320921, "epoch": 1910} {"train_loss": -11.699256896972656, "global_step": 320922, "epoch": 1910} {"train_loss": -11.472970962524414, "global_step": 320923, "epoch": 1910} {"train_loss": -11.814074516296387, "global_step": 320924, "epoch": 1910} {"train_loss": -11.586067199707031, "global_step": 320925, "epoch": 1910} {"train_loss": -11.527984619140625, "global_step": 320926, "epoch": 1910} {"train_loss": -11.734905242919922, "global_step": 320927, "epoch": 1910} {"train_loss": -11.772815704345703, "global_step": 320928, "epoch": 1910} {"train_loss": -11.873727798461914, "global_step": 320929, "epoch": 1910} {"train_loss": -11.828020095825195, "global_step": 320930, "epoch": 1910} {"train_loss": -11.596874237060547, "global_step": 320931, "epoch": 1910} {"train_loss": -11.52646255493164, "global_step": 320932, "epoch": 1910} {"train_loss": -11.833528518676758, "global_step": 320933, "epoch": 1910} {"train_loss": -12.012481689453125, "global_step": 320934, "epoch": 1910} {"train_loss": -11.841453552246094, "global_step": 320935, "epoch": 1910} {"train_loss": -12.078973770141602, "global_step": 320936, "epoch": 1910} {"train_loss": -11.793046951293945, "global_step": 320937, "epoch": 1910} {"train_loss": -11.819541931152344, "global_step": 320938, "epoch": 1910} {"train_loss": -11.99931812286377, "global_step": 320939, "epoch": 1910} {"train_loss": -12.129461288452148, "global_step": 320940, "epoch": 1910} {"train_loss": -12.10260009765625, "global_step": 320941, "epoch": 1910} {"train_loss": -12.032968521118164, "global_step": 320942, "epoch": 1910} {"train_loss": -12.137568473815918, "global_step": 320943, "epoch": 1910} {"train_loss": -12.198885917663574, "global_step": 320944, "epoch": 1910} {"train_loss": -12.163912773132324, "global_step": 320945, "epoch": 1910} {"train_loss": -12.015251159667969, "global_step": 320946, "epoch": 1910} {"train_loss": -12.073136329650879, "global_step": 320947, "epoch": 1910} {"train_loss": -12.32244873046875, "global_step": 320948, "epoch": 1910} {"train_loss": -12.109865188598633, "global_step": 320949, "epoch": 1910} {"train_loss": -12.194631576538086, "global_step": 320950, "epoch": 1910} {"train_loss": -12.134880065917969, "global_step": 320951, "epoch": 1910} {"train_loss": -12.172883987426758, "global_step": 320952, "epoch": 1910} {"train_loss": -12.060869216918945, "global_step": 320953, "epoch": 1910} {"train_loss": -12.172904968261719, "global_step": 320954, "epoch": 1910} {"train_loss": -12.394795417785645, "global_step": 320955, "epoch": 1910} {"train_loss": -12.310281753540039, "global_step": 320956, "epoch": 1910} {"train_loss": -11.902780532836914, "global_step": 320957, "epoch": 1910} {"train_loss": -12.346035957336426, "global_step": 320958, "epoch": 1910} {"train_loss": -12.10026741027832, "global_step": 320959, "epoch": 1910} {"train_loss": -12.448923110961914, "global_step": 320960, "epoch": 1910} {"train_loss": -11.986871719360352, "global_step": 320961, "epoch": 1910} {"train_loss": -12.245351791381836, "global_step": 320962, "epoch": 1910} {"train_loss": -12.29169750213623, "global_step": 320963, "epoch": 1910} {"train_loss": -12.30767822265625, "global_step": 320964, "epoch": 1910} {"train_loss": -12.394355773925781, "global_step": 320965, "epoch": 1910} {"train_loss": -12.436368942260742, "global_step": 320966, "epoch": 1910} {"train_loss": -12.515645980834961, "global_step": 320967, "epoch": 1910} {"train_loss": -12.494325637817383, "global_step": 320968, "epoch": 1910} {"train_loss": -12.347387313842773, "global_step": 320969, "epoch": 1910} {"train_loss": -12.498025894165039, "global_step": 320970, "epoch": 1910} {"train_loss": -12.34563159942627, "global_step": 320971, "epoch": 1910} {"train_loss": -12.41091251373291, "global_step": 320972, "epoch": 1910} {"train_loss": -12.452792167663574, "global_step": 320973, "epoch": 1910} {"train_loss": -12.416942596435547, "global_step": 320974, "epoch": 1910} {"train_loss": -12.468564987182617, "global_step": 320975, "epoch": 1910} {"train_loss": -12.386170387268066, "global_step": 320976, "epoch": 1910} {"train_loss": -12.383583068847656, "global_step": 320977, "epoch": 1910} {"train_loss": -12.497154235839844, "global_step": 320978, "epoch": 1910} {"train_loss": -12.22541618347168, "global_step": 320979, "epoch": 1910} {"train_loss": -12.509729385375977, "global_step": 320980, "epoch": 1910} {"train_loss": -12.336759567260742, "global_step": 320981, "epoch": 1910} {"train_loss": -12.362726211547852, "global_step": 320982, "epoch": 1910} {"train_loss": -12.487300872802734, "global_step": 320983, "epoch": 1910} {"train_loss": -12.620403289794922, "global_step": 320984, "epoch": 1910} {"train_loss": -12.366096496582031, "global_step": 320985, "epoch": 1910} {"train_loss": -12.357525825500488, "global_step": 320986, "epoch": 1910} {"train_loss": -12.273500442504883, "global_step": 320987, "epoch": 1910} {"train_loss": -12.59811782836914, "global_step": 320988, "epoch": 1910} {"train_loss": -12.645763397216797, "global_step": 320989, "epoch": 1910} {"train_loss": -12.389076232910156, "global_step": 320990, "epoch": 1910} {"train_loss": -12.504383087158203, "global_step": 320991, "epoch": 1910} {"train_loss": -12.568916320800781, "global_step": 320992, "epoch": 1910} {"train_loss": -12.547431945800781, "global_step": 320993, "epoch": 1910} {"train_loss": -12.593101501464844, "global_step": 320994, "epoch": 1910} {"train_loss": -12.371903419494629, "global_step": 320995, "epoch": 1910} {"train_loss": -12.46764087677002, "global_step": 320996, "epoch": 1910} {"train_loss": -12.534618377685547, "global_step": 320997, "epoch": 1910} {"train_loss": -12.645549774169922, "global_step": 320998, "epoch": 1910} {"train_loss": -12.306535720825195, "global_step": 320999, "epoch": 1910} {"train_loss": -12.591903686523438, "global_step": 321000, "epoch": 1910} {"train_loss": -12.295393943786621, "global_step": 321001, "epoch": 1910} {"train_loss": -12.643213272094727, "global_step": 321002, "epoch": 1910} {"train_loss": -12.72287368774414, "global_step": 321003, "epoch": 1910} {"train_loss": -12.711485862731934, "global_step": 321004, "epoch": 1910} {"train_loss": -12.515142440795898, "global_step": 321005, "epoch": 1910} {"train_loss": -12.638537406921387, "global_step": 321006, "epoch": 1910} {"train_loss": -12.68460464477539, "global_step": 321007, "epoch": 1910} {"train_loss": -12.390694618225098, "global_step": 321008, "epoch": 1910} {"train_loss": -12.135543823242188, "global_step": 321009, "epoch": 1910} {"train_loss": -12.179740905761719, "global_step": 321010, "epoch": 1910} {"train_loss": -12.33032512664795, "global_step": 321011, "epoch": 1910} {"train_loss": -12.566441535949707, "global_step": 321012, "epoch": 1910} {"train_loss": -12.745737075805664, "global_step": 321013, "epoch": 1910} {"train_loss": -12.614410400390625, "global_step": 321014, "epoch": 1910} {"train_loss": -12.52844524383545, "global_step": 321015, "epoch": 1910} {"train_loss": -12.527612686157227, "global_step": 321016, "epoch": 1910} {"train_loss": -12.516166687011719, "global_step": 321017, "epoch": 1910} {"train_loss": -11.844404220581055, "global_step": 321018, "epoch": 1910} {"train_loss": -10.458127975463867, "global_step": 321019, "epoch": 1910} {"train_loss": -11.794105529785156, "global_step": 321020, "epoch": 1910} {"train_loss": -11.873943328857422, "global_step": 321021, "epoch": 1910} {"train_loss": -12.497811317443848, "global_step": 321022, "epoch": 1910} {"train_loss": -10.82779312133789, "global_step": 321023, "epoch": 1910} {"train_loss": -9.236763000488281, "global_step": 321024, "epoch": 1910} {"train_loss": -11.470840454101562, "global_step": 321025, "epoch": 1910} {"train_loss": -8.810736656188965, "global_step": 321026, "epoch": 1910} {"train_loss": -11.471214294433594, "global_step": 321027, "epoch": 1910} {"train_loss": -9.803502082824707, "global_step": 321028, "epoch": 1910} {"train_loss": -10.397920608520508, "global_step": 321029, "epoch": 1910} {"train_loss": -9.133512496948242, "global_step": 321030, "epoch": 1910} {"train_loss": -10.616817474365234, "global_step": 321031, "epoch": 1910} {"train_loss": -8.629701614379883, "global_step": 321032, "epoch": 1910} {"train_loss": -9.787660598754883, "global_step": 321033, "epoch": 1910} {"train_loss": -7.634840965270996, "global_step": 321034, "epoch": 1910} {"train_loss": -8.836868286132812, "global_step": 321035, "epoch": 1910} {"train_loss": -8.623842239379883, "global_step": 321036, "epoch": 1910} {"train_loss": -9.094796180725098, "global_step": 321037, "epoch": 1910} {"train_loss": -9.940608978271484, "global_step": 321038, "epoch": 1910} {"train_loss": -9.31955623626709, "global_step": 321039, "epoch": 1910} {"train_loss": -9.698391914367676, "global_step": 321040, "epoch": 1910} {"train_loss": -9.867713928222656, "global_step": 321041, "epoch": 1910} {"train_loss": -9.418292999267578, "global_step": 321042, "epoch": 1910} {"train_loss": -10.33592700958252, "global_step": 321043, "epoch": 1910} {"train_loss": -9.914227485656738, "global_step": 321044, "epoch": 1910} {"train_loss": -10.004613876342773, "global_step": 321045, "epoch": 1910} {"train_loss": -10.706886291503906, "global_step": 321046, "epoch": 1910} {"train_loss": -11.48060473373958, "global_step": 321047, "epoch": 1910, "val_loss": 279787.96875, "train_action_mse_error": 4.278959274291992} {"train_loss": -11.007587432861328, "global_step": 321048, "epoch": 1911} {"train_loss": -10.809021949768066, "global_step": 321049, "epoch": 1911} {"train_loss": -10.6715087890625, "global_step": 321050, "epoch": 1911} {"train_loss": -11.094175338745117, "global_step": 321051, "epoch": 1911} {"train_loss": -10.689126968383789, "global_step": 321052, "epoch": 1911} {"train_loss": -11.158269882202148, "global_step": 321053, "epoch": 1911} {"train_loss": -10.756536483764648, "global_step": 321054, "epoch": 1911} {"train_loss": -11.289799690246582, "global_step": 321055, "epoch": 1911} {"train_loss": -11.426117897033691, "global_step": 321056, "epoch": 1911} {"train_loss": -11.616969108581543, "global_step": 321057, "epoch": 1911} {"train_loss": -11.976635932922363, "global_step": 321058, "epoch": 1911} {"train_loss": -11.577138900756836, "global_step": 321059, "epoch": 1911} {"train_loss": -11.52450180053711, "global_step": 321060, "epoch": 1911} {"train_loss": -11.726356506347656, "global_step": 321061, "epoch": 1911} {"train_loss": -11.006282806396484, "global_step": 321062, "epoch": 1911} {"train_loss": -11.958623886108398, "global_step": 321063, "epoch": 1911} {"train_loss": -11.459280014038086, "global_step": 321064, "epoch": 1911} {"train_loss": -12.077142715454102, "global_step": 321065, "epoch": 1911} {"train_loss": -11.797557830810547, "global_step": 321066, "epoch": 1911} {"train_loss": -11.63809585571289, "global_step": 321067, "epoch": 1911} {"train_loss": -11.92497444152832, "global_step": 321068, "epoch": 1911} {"train_loss": -11.88516616821289, "global_step": 321069, "epoch": 1911} {"train_loss": -11.739062309265137, "global_step": 321070, "epoch": 1911} {"train_loss": -12.166460037231445, "global_step": 321071, "epoch": 1911} {"train_loss": -12.015225410461426, "global_step": 321072, "epoch": 1911} {"train_loss": -12.122835159301758, "global_step": 321073, "epoch": 1911} {"train_loss": -12.091168403625488, "global_step": 321074, "epoch": 1911} {"train_loss": -11.827569961547852, "global_step": 321075, "epoch": 1911} {"train_loss": -12.027215957641602, "global_step": 321076, "epoch": 1911} {"train_loss": -12.133035659790039, "global_step": 321077, "epoch": 1911} {"train_loss": -11.975736618041992, "global_step": 321078, "epoch": 1911} {"train_loss": -12.379433631896973, "global_step": 321079, "epoch": 1911} {"train_loss": -12.048185348510742, "global_step": 321080, "epoch": 1911} {"train_loss": -12.040140151977539, "global_step": 321081, "epoch": 1911} {"train_loss": -12.217058181762695, "global_step": 321082, "epoch": 1911} {"train_loss": -12.226805686950684, "global_step": 321083, "epoch": 1911} {"train_loss": -12.106204986572266, "global_step": 321084, "epoch": 1911} {"train_loss": -12.331724166870117, "global_step": 321085, "epoch": 1911} {"train_loss": -11.969691276550293, "global_step": 321086, "epoch": 1911} {"train_loss": -12.253395080566406, "global_step": 321087, "epoch": 1911} {"train_loss": -11.861268997192383, "global_step": 321088, "epoch": 1911} {"train_loss": -12.241323471069336, "global_step": 321089, "epoch": 1911} {"train_loss": -11.867624282836914, "global_step": 321090, "epoch": 1911} {"train_loss": -12.209051132202148, "global_step": 321091, "epoch": 1911} {"train_loss": -11.847799301147461, "global_step": 321092, "epoch": 1911} {"train_loss": -12.282707214355469, "global_step": 321093, "epoch": 1911} {"train_loss": -12.0684814453125, "global_step": 321094, "epoch": 1911} {"train_loss": -12.144084930419922, "global_step": 321095, "epoch": 1911} {"train_loss": -11.937633514404297, "global_step": 321096, "epoch": 1911} {"train_loss": -11.784209251403809, "global_step": 321097, "epoch": 1911} {"train_loss": -12.255127906799316, "global_step": 321098, "epoch": 1911} {"train_loss": -12.1666841506958, "global_step": 321099, "epoch": 1911} {"train_loss": -12.324365615844727, "global_step": 321100, "epoch": 1911} {"train_loss": -12.07041072845459, "global_step": 321101, "epoch": 1911} {"train_loss": -12.146446228027344, "global_step": 321102, "epoch": 1911} {"train_loss": -12.097758293151855, "global_step": 321103, "epoch": 1911} {"train_loss": -12.119750022888184, "global_step": 321104, "epoch": 1911} {"train_loss": -12.226875305175781, "global_step": 321105, "epoch": 1911} {"train_loss": -12.366889953613281, "global_step": 321106, "epoch": 1911} {"train_loss": -12.30389404296875, "global_step": 321107, "epoch": 1911} {"train_loss": -12.19874382019043, "global_step": 321108, "epoch": 1911} {"train_loss": -12.453201293945312, "global_step": 321109, "epoch": 1911} {"train_loss": -12.396596908569336, "global_step": 321110, "epoch": 1911} {"train_loss": -12.50684928894043, "global_step": 321111, "epoch": 1911} {"train_loss": -12.317461013793945, "global_step": 321112, "epoch": 1911} {"train_loss": -12.329293251037598, "global_step": 321113, "epoch": 1911} {"train_loss": -12.183114051818848, "global_step": 321114, "epoch": 1911} {"train_loss": -12.274758338928223, "global_step": 321115, "epoch": 1911} {"train_loss": -12.203804969787598, "global_step": 321116, "epoch": 1911} {"train_loss": -11.77569580078125, "global_step": 321117, "epoch": 1911} {"train_loss": -11.706809997558594, "global_step": 321118, "epoch": 1911} {"train_loss": -11.78271198272705, "global_step": 321119, "epoch": 1911} {"train_loss": -10.841360092163086, "global_step": 321120, "epoch": 1911} {"train_loss": -11.7009916305542, "global_step": 321121, "epoch": 1911} {"train_loss": -12.059795379638672, "global_step": 321122, "epoch": 1911} {"train_loss": -12.056126594543457, "global_step": 321123, "epoch": 1911} {"train_loss": -12.077252388000488, "global_step": 321124, "epoch": 1911} {"train_loss": -12.27535343170166, "global_step": 321125, "epoch": 1911} {"train_loss": -11.67367172241211, "global_step": 321126, "epoch": 1911} {"train_loss": -12.491548538208008, "global_step": 321127, "epoch": 1911} {"train_loss": -11.911346435546875, "global_step": 321128, "epoch": 1911} {"train_loss": -12.201164245605469, "global_step": 321129, "epoch": 1911} {"train_loss": -11.717824935913086, "global_step": 321130, "epoch": 1911} {"train_loss": -12.268633842468262, "global_step": 321131, "epoch": 1911} {"train_loss": -11.907293319702148, "global_step": 321132, "epoch": 1911} {"train_loss": -12.058951377868652, "global_step": 321133, "epoch": 1911} {"train_loss": -11.693408012390137, "global_step": 321134, "epoch": 1911} {"train_loss": -11.926910400390625, "global_step": 321135, "epoch": 1911} {"train_loss": -12.0540189743042, "global_step": 321136, "epoch": 1911} {"train_loss": -11.430649757385254, "global_step": 321137, "epoch": 1911} {"train_loss": -11.92785358428955, "global_step": 321138, "epoch": 1911} {"train_loss": -11.440993309020996, "global_step": 321139, "epoch": 1911} {"train_loss": -12.448589324951172, "global_step": 321140, "epoch": 1911} {"train_loss": -11.918947219848633, "global_step": 321141, "epoch": 1911} {"train_loss": -12.028114318847656, "global_step": 321142, "epoch": 1911} {"train_loss": -12.07337760925293, "global_step": 321143, "epoch": 1911} {"train_loss": -12.034703254699707, "global_step": 321144, "epoch": 1911} {"train_loss": -11.49464225769043, "global_step": 321145, "epoch": 1911} {"train_loss": -12.237611770629883, "global_step": 321146, "epoch": 1911} {"train_loss": -11.666135787963867, "global_step": 321147, "epoch": 1911} {"train_loss": -12.466419219970703, "global_step": 321148, "epoch": 1911} {"train_loss": -11.87891960144043, "global_step": 321149, "epoch": 1911} {"train_loss": -12.168930053710938, "global_step": 321150, "epoch": 1911} {"train_loss": -12.35238265991211, "global_step": 321151, "epoch": 1911} {"train_loss": -12.097343444824219, "global_step": 321152, "epoch": 1911} {"train_loss": -12.325398445129395, "global_step": 321153, "epoch": 1911} {"train_loss": -12.265414237976074, "global_step": 321154, "epoch": 1911} {"train_loss": -12.206079483032227, "global_step": 321155, "epoch": 1911} {"train_loss": -12.160987854003906, "global_step": 321156, "epoch": 1911} {"train_loss": -12.235077857971191, "global_step": 321157, "epoch": 1911} {"train_loss": -12.283313751220703, "global_step": 321158, "epoch": 1911} {"train_loss": -12.401397705078125, "global_step": 321159, "epoch": 1911} {"train_loss": -12.292204856872559, "global_step": 321160, "epoch": 1911} {"train_loss": -12.390417098999023, "global_step": 321161, "epoch": 1911} {"train_loss": -12.34982681274414, "global_step": 321162, "epoch": 1911} {"train_loss": -12.40945053100586, "global_step": 321163, "epoch": 1911} {"train_loss": -12.41018295288086, "global_step": 321164, "epoch": 1911} {"train_loss": -12.472399711608887, "global_step": 321165, "epoch": 1911} {"train_loss": -12.33907413482666, "global_step": 321166, "epoch": 1911} {"train_loss": -12.63018798828125, "global_step": 321167, "epoch": 1911} {"train_loss": -12.324833869934082, "global_step": 321168, "epoch": 1911} {"train_loss": -11.853901863098145, "global_step": 321169, "epoch": 1911} {"train_loss": -12.314529418945312, "global_step": 321170, "epoch": 1911} {"train_loss": -12.020904541015625, "global_step": 321171, "epoch": 1911} {"train_loss": -12.611551284790039, "global_step": 321172, "epoch": 1911} {"train_loss": -12.242863655090332, "global_step": 321173, "epoch": 1911} {"train_loss": -12.550432205200195, "global_step": 321174, "epoch": 1911} {"train_loss": -12.189807891845703, "global_step": 321175, "epoch": 1911} {"train_loss": -12.335268020629883, "global_step": 321176, "epoch": 1911} {"train_loss": -12.470029830932617, "global_step": 321177, "epoch": 1911} {"train_loss": -12.078121185302734, "global_step": 321178, "epoch": 1911} {"train_loss": -12.233528137207031, "global_step": 321179, "epoch": 1911} {"train_loss": -12.327913284301758, "global_step": 321180, "epoch": 1911} {"train_loss": -12.205416679382324, "global_step": 321181, "epoch": 1911} {"train_loss": -12.323139190673828, "global_step": 321182, "epoch": 1911} {"train_loss": -12.247636795043945, "global_step": 321183, "epoch": 1911} {"train_loss": -12.205831527709961, "global_step": 321184, "epoch": 1911} {"train_loss": -11.583755493164062, "global_step": 321185, "epoch": 1911} {"train_loss": -12.293739318847656, "global_step": 321186, "epoch": 1911} {"train_loss": -11.773229598999023, "global_step": 321187, "epoch": 1911} {"train_loss": -12.19845962524414, "global_step": 321188, "epoch": 1911} {"train_loss": -12.041770935058594, "global_step": 321189, "epoch": 1911} {"train_loss": -12.158624649047852, "global_step": 321190, "epoch": 1911} {"train_loss": -11.837119102478027, "global_step": 321191, "epoch": 1911} {"train_loss": -11.765966415405273, "global_step": 321192, "epoch": 1911} {"train_loss": -12.065016746520996, "global_step": 321193, "epoch": 1911} {"train_loss": -11.78317642211914, "global_step": 321194, "epoch": 1911} {"train_loss": -11.712902069091797, "global_step": 321195, "epoch": 1911} {"train_loss": -10.828054428100586, "global_step": 321196, "epoch": 1911} {"train_loss": -11.801239013671875, "global_step": 321197, "epoch": 1911} {"train_loss": -10.741716384887695, "global_step": 321198, "epoch": 1911} {"train_loss": -12.066354751586914, "global_step": 321199, "epoch": 1911} {"train_loss": -11.734180450439453, "global_step": 321200, "epoch": 1911} {"train_loss": -11.95197582244873, "global_step": 321201, "epoch": 1911} {"train_loss": -11.029098510742188, "global_step": 321202, "epoch": 1911} {"train_loss": -12.158437728881836, "global_step": 321203, "epoch": 1911} {"train_loss": -11.469452857971191, "global_step": 321204, "epoch": 1911} {"train_loss": -11.534067153930664, "global_step": 321205, "epoch": 1911} {"train_loss": -11.557283401489258, "global_step": 321206, "epoch": 1911} {"train_loss": -11.858114242553711, "global_step": 321207, "epoch": 1911} {"train_loss": -11.835957527160645, "global_step": 321208, "epoch": 1911} {"train_loss": -11.258476257324219, "global_step": 321209, "epoch": 1911} {"train_loss": -10.670806884765625, "global_step": 321210, "epoch": 1911} {"train_loss": -11.224447250366211, "global_step": 321211, "epoch": 1911} {"train_loss": -10.193622589111328, "global_step": 321212, "epoch": 1911} {"train_loss": -10.751773834228516, "global_step": 321213, "epoch": 1911} {"train_loss": -10.878877639770508, "global_step": 321214, "epoch": 1911} {"train_loss": -11.925760008039928, "global_step": 321215, "epoch": 1911, "val_loss": 287926.625} {"train_loss": -10.740077018737793, "global_step": 321216, "epoch": 1912} {"train_loss": -10.712825775146484, "global_step": 321217, "epoch": 1912} {"train_loss": -10.751825332641602, "global_step": 321218, "epoch": 1912} {"train_loss": -10.565139770507812, "global_step": 321219, "epoch": 1912} {"train_loss": -11.505692481994629, "global_step": 321220, "epoch": 1912} {"train_loss": -11.058024406433105, "global_step": 321221, "epoch": 1912} {"train_loss": -12.017921447753906, "global_step": 321222, "epoch": 1912} {"train_loss": -11.199625968933105, "global_step": 321223, "epoch": 1912} {"train_loss": -11.31130599975586, "global_step": 321224, "epoch": 1912} {"train_loss": -10.876749038696289, "global_step": 321225, "epoch": 1912} {"train_loss": -11.510320663452148, "global_step": 321226, "epoch": 1912} {"train_loss": -10.791624069213867, "global_step": 321227, "epoch": 1912} {"train_loss": -11.152549743652344, "global_step": 321228, "epoch": 1912} {"train_loss": -11.617328643798828, "global_step": 321229, "epoch": 1912} {"train_loss": -11.09515380859375, "global_step": 321230, "epoch": 1912} {"train_loss": -10.7163724899292, "global_step": 321231, "epoch": 1912} {"train_loss": -11.066198348999023, "global_step": 321232, "epoch": 1912} {"train_loss": -10.42803955078125, "global_step": 321233, "epoch": 1912} {"train_loss": -10.896799087524414, "global_step": 321234, "epoch": 1912} {"train_loss": -11.012443542480469, "global_step": 321235, "epoch": 1912} {"train_loss": -11.026373863220215, "global_step": 321236, "epoch": 1912} {"train_loss": -10.855329513549805, "global_step": 321237, "epoch": 1912} {"train_loss": -11.196220397949219, "global_step": 321238, "epoch": 1912} {"train_loss": -10.693342208862305, "global_step": 321239, "epoch": 1912} {"train_loss": -10.757641792297363, "global_step": 321240, "epoch": 1912} {"train_loss": -11.294853210449219, "global_step": 321241, "epoch": 1912} {"train_loss": -10.734107971191406, "global_step": 321242, "epoch": 1912} {"train_loss": -11.775444030761719, "global_step": 321243, "epoch": 1912} {"train_loss": -11.395132064819336, "global_step": 321244, "epoch": 1912} {"train_loss": -11.442341804504395, "global_step": 321245, "epoch": 1912} {"train_loss": -11.52639389038086, "global_step": 321246, "epoch": 1912} {"train_loss": -11.503908157348633, "global_step": 321247, "epoch": 1912} {"train_loss": -11.664146423339844, "global_step": 321248, "epoch": 1912} {"train_loss": -11.70285415649414, "global_step": 321249, "epoch": 1912} {"train_loss": -11.362360000610352, "global_step": 321250, "epoch": 1912} {"train_loss": -11.851080894470215, "global_step": 321251, "epoch": 1912} {"train_loss": -11.95814323425293, "global_step": 321252, "epoch": 1912} {"train_loss": -11.967496871948242, "global_step": 321253, "epoch": 1912} {"train_loss": -12.055974960327148, "global_step": 321254, "epoch": 1912} {"train_loss": -11.539084434509277, "global_step": 321255, "epoch": 1912} {"train_loss": -12.138309478759766, "global_step": 321256, "epoch": 1912} {"train_loss": -11.77519702911377, "global_step": 321257, "epoch": 1912} {"train_loss": -11.925536155700684, "global_step": 321258, "epoch": 1912} {"train_loss": -12.017420768737793, "global_step": 321259, "epoch": 1912} {"train_loss": -11.78911304473877, "global_step": 321260, "epoch": 1912} {"train_loss": -12.168426513671875, "global_step": 321261, "epoch": 1912} {"train_loss": -11.927800178527832, "global_step": 321262, "epoch": 1912} {"train_loss": -12.292295455932617, "global_step": 321263, "epoch": 1912} {"train_loss": -12.226983070373535, "global_step": 321264, "epoch": 1912} {"train_loss": -12.127737998962402, "global_step": 321265, "epoch": 1912} {"train_loss": -11.95594596862793, "global_step": 321266, "epoch": 1912} {"train_loss": -11.961080551147461, "global_step": 321267, "epoch": 1912} {"train_loss": -12.183055877685547, "global_step": 321268, "epoch": 1912} {"train_loss": -11.929118156433105, "global_step": 321269, "epoch": 1912} {"train_loss": -12.176480293273926, "global_step": 321270, "epoch": 1912} {"train_loss": -12.078472137451172, "global_step": 321271, "epoch": 1912} {"train_loss": -12.035880088806152, "global_step": 321272, "epoch": 1912} {"train_loss": -12.31279468536377, "global_step": 321273, "epoch": 1912} {"train_loss": -11.8691987991333, "global_step": 321274, "epoch": 1912} {"train_loss": -11.963452339172363, "global_step": 321275, "epoch": 1912} {"train_loss": -12.087823867797852, "global_step": 321276, "epoch": 1912} {"train_loss": -12.056770324707031, "global_step": 321277, "epoch": 1912} {"train_loss": -11.836372375488281, "global_step": 321278, "epoch": 1912} {"train_loss": -12.238557815551758, "global_step": 321279, "epoch": 1912} {"train_loss": -11.94986343383789, "global_step": 321280, "epoch": 1912} {"train_loss": -12.100729942321777, "global_step": 321281, "epoch": 1912} {"train_loss": -11.977314949035645, "global_step": 321282, "epoch": 1912} {"train_loss": -12.08954906463623, "global_step": 321283, "epoch": 1912} {"train_loss": -12.374593734741211, "global_step": 321284, "epoch": 1912} {"train_loss": -12.089622497558594, "global_step": 321285, "epoch": 1912} {"train_loss": -12.381803512573242, "global_step": 321286, "epoch": 1912} {"train_loss": -11.979944229125977, "global_step": 321287, "epoch": 1912} {"train_loss": -12.122907638549805, "global_step": 321288, "epoch": 1912} {"train_loss": -12.15311050415039, "global_step": 321289, "epoch": 1912} {"train_loss": -11.959938049316406, "global_step": 321290, "epoch": 1912} {"train_loss": -12.087308883666992, "global_step": 321291, "epoch": 1912} {"train_loss": -11.737716674804688, "global_step": 321292, "epoch": 1912} {"train_loss": -12.32093620300293, "global_step": 321293, "epoch": 1912} {"train_loss": -11.92563247680664, "global_step": 321294, "epoch": 1912} {"train_loss": -11.986948013305664, "global_step": 321295, "epoch": 1912} {"train_loss": -12.263794898986816, "global_step": 321296, "epoch": 1912} {"train_loss": -12.07962703704834, "global_step": 321297, "epoch": 1912} {"train_loss": -12.40473461151123, "global_step": 321298, "epoch": 1912} {"train_loss": -12.206357955932617, "global_step": 321299, "epoch": 1912} {"train_loss": -12.424756050109863, "global_step": 321300, "epoch": 1912} {"train_loss": -12.094987869262695, "global_step": 321301, "epoch": 1912} {"train_loss": -12.456629753112793, "global_step": 321302, "epoch": 1912} {"train_loss": -12.119546890258789, "global_step": 321303, "epoch": 1912} {"train_loss": -12.208782196044922, "global_step": 321304, "epoch": 1912} {"train_loss": -12.09420394897461, "global_step": 321305, "epoch": 1912} {"train_loss": -12.251775741577148, "global_step": 321306, "epoch": 1912} {"train_loss": -12.338539123535156, "global_step": 321307, "epoch": 1912} {"train_loss": -12.21250057220459, "global_step": 321308, "epoch": 1912} {"train_loss": -12.327383995056152, "global_step": 321309, "epoch": 1912} {"train_loss": -11.954669952392578, "global_step": 321310, "epoch": 1912} {"train_loss": -12.409394264221191, "global_step": 321311, "epoch": 1912} {"train_loss": -12.156673431396484, "global_step": 321312, "epoch": 1912} {"train_loss": -12.271505355834961, "global_step": 321313, "epoch": 1912} {"train_loss": -12.39421272277832, "global_step": 321314, "epoch": 1912} {"train_loss": -11.873201370239258, "global_step": 321315, "epoch": 1912} {"train_loss": -12.3815336227417, "global_step": 321316, "epoch": 1912} {"train_loss": -11.74229621887207, "global_step": 321317, "epoch": 1912} {"train_loss": -12.306392669677734, "global_step": 321318, "epoch": 1912} {"train_loss": -12.159238815307617, "global_step": 321319, "epoch": 1912} {"train_loss": -12.046812057495117, "global_step": 321320, "epoch": 1912} {"train_loss": -12.297657012939453, "global_step": 321321, "epoch": 1912} {"train_loss": -11.867769241333008, "global_step": 321322, "epoch": 1912} {"train_loss": -12.506146430969238, "global_step": 321323, "epoch": 1912} {"train_loss": -12.11448860168457, "global_step": 321324, "epoch": 1912} {"train_loss": -12.266669273376465, "global_step": 321325, "epoch": 1912} {"train_loss": -11.906085968017578, "global_step": 321326, "epoch": 1912} {"train_loss": -12.318519592285156, "global_step": 321327, "epoch": 1912} {"train_loss": -12.416223526000977, "global_step": 321328, "epoch": 1912} {"train_loss": -12.077878952026367, "global_step": 321329, "epoch": 1912} {"train_loss": -12.179309844970703, "global_step": 321330, "epoch": 1912} {"train_loss": -12.217787742614746, "global_step": 321331, "epoch": 1912} {"train_loss": -12.471269607543945, "global_step": 321332, "epoch": 1912} {"train_loss": -12.024198532104492, "global_step": 321333, "epoch": 1912} {"train_loss": -11.958154678344727, "global_step": 321334, "epoch": 1912} {"train_loss": -12.468103408813477, "global_step": 321335, "epoch": 1912} {"train_loss": -12.048852920532227, "global_step": 321336, "epoch": 1912} {"train_loss": -11.570185661315918, "global_step": 321337, "epoch": 1912} {"train_loss": -11.024384498596191, "global_step": 321338, "epoch": 1912} {"train_loss": -10.750326156616211, "global_step": 321339, "epoch": 1912} {"train_loss": -11.451751708984375, "global_step": 321340, "epoch": 1912} {"train_loss": -12.208934783935547, "global_step": 321341, "epoch": 1912} {"train_loss": -10.657503128051758, "global_step": 321342, "epoch": 1912} {"train_loss": -10.356884956359863, "global_step": 321343, "epoch": 1912} {"train_loss": -11.609950065612793, "global_step": 321344, "epoch": 1912} {"train_loss": -9.678356170654297, "global_step": 321345, "epoch": 1912} {"train_loss": -10.288890838623047, "global_step": 321346, "epoch": 1912} {"train_loss": -11.427959442138672, "global_step": 321347, "epoch": 1912} {"train_loss": -9.95416259765625, "global_step": 321348, "epoch": 1912} {"train_loss": -11.092308044433594, "global_step": 321349, "epoch": 1912} {"train_loss": -11.838129043579102, "global_step": 321350, "epoch": 1912} {"train_loss": -11.448556900024414, "global_step": 321351, "epoch": 1912} {"train_loss": -11.563695907592773, "global_step": 321352, "epoch": 1912} {"train_loss": -12.111875534057617, "global_step": 321353, "epoch": 1912} {"train_loss": -11.66514778137207, "global_step": 321354, "epoch": 1912} {"train_loss": -11.967734336853027, "global_step": 321355, "epoch": 1912} {"train_loss": -11.61902904510498, "global_step": 321356, "epoch": 1912} {"train_loss": -11.936171531677246, "global_step": 321357, "epoch": 1912} {"train_loss": -12.031316757202148, "global_step": 321358, "epoch": 1912} {"train_loss": -12.439682960510254, "global_step": 321359, "epoch": 1912} {"train_loss": -11.819767951965332, "global_step": 321360, "epoch": 1912} {"train_loss": -12.199544906616211, "global_step": 321361, "epoch": 1912} {"train_loss": -12.039762496948242, "global_step": 321362, "epoch": 1912} {"train_loss": -11.894455909729004, "global_step": 321363, "epoch": 1912} {"train_loss": -12.21805191040039, "global_step": 321364, "epoch": 1912} {"train_loss": -11.926549911499023, "global_step": 321365, "epoch": 1912} {"train_loss": -12.1807279586792, "global_step": 321366, "epoch": 1912} {"train_loss": -12.12324047088623, "global_step": 321367, "epoch": 1912} {"train_loss": -12.165329933166504, "global_step": 321368, "epoch": 1912} {"train_loss": -12.332197189331055, "global_step": 321369, "epoch": 1912} {"train_loss": -12.116908073425293, "global_step": 321370, "epoch": 1912} {"train_loss": -12.21823501586914, "global_step": 321371, "epoch": 1912} {"train_loss": -12.03643798828125, "global_step": 321372, "epoch": 1912} {"train_loss": -12.342673301696777, "global_step": 321373, "epoch": 1912} {"train_loss": -12.215679168701172, "global_step": 321374, "epoch": 1912} {"train_loss": -12.205242156982422, "global_step": 321375, "epoch": 1912} {"train_loss": -12.07087516784668, "global_step": 321376, "epoch": 1912} {"train_loss": -12.284720420837402, "global_step": 321377, "epoch": 1912} {"train_loss": -11.913808822631836, "global_step": 321378, "epoch": 1912} {"train_loss": -12.335256576538086, "global_step": 321379, "epoch": 1912} {"train_loss": -12.209905624389648, "global_step": 321380, "epoch": 1912} {"train_loss": -12.005823135375977, "global_step": 321381, "epoch": 1912} {"train_loss": -12.089927673339844, "global_step": 321382, "epoch": 1912} {"train_loss": -11.808653899601527, "global_step": 321383, "epoch": 1912, "val_loss": 286789.25} {"train_loss": -11.937171936035156, "global_step": 321384, "epoch": 1913} {"train_loss": -12.111980438232422, "global_step": 321385, "epoch": 1913} {"train_loss": -11.961896896362305, "global_step": 321386, "epoch": 1913} {"train_loss": -11.696727752685547, "global_step": 321387, "epoch": 1913} {"train_loss": -11.826091766357422, "global_step": 321388, "epoch": 1913} {"train_loss": -11.830533027648926, "global_step": 321389, "epoch": 1913} {"train_loss": -11.804709434509277, "global_step": 321390, "epoch": 1913} {"train_loss": -12.097977638244629, "global_step": 321391, "epoch": 1913} {"train_loss": -11.828760147094727, "global_step": 321392, "epoch": 1913} {"train_loss": -11.623719215393066, "global_step": 321393, "epoch": 1913} {"train_loss": -12.068441390991211, "global_step": 321394, "epoch": 1913} {"train_loss": -12.182632446289062, "global_step": 321395, "epoch": 1913} {"train_loss": -11.822403907775879, "global_step": 321396, "epoch": 1913} {"train_loss": -12.02911376953125, "global_step": 321397, "epoch": 1913} {"train_loss": -12.210967063903809, "global_step": 321398, "epoch": 1913} {"train_loss": -11.863933563232422, "global_step": 321399, "epoch": 1913} {"train_loss": -11.793930053710938, "global_step": 321400, "epoch": 1913} {"train_loss": -11.848393440246582, "global_step": 321401, "epoch": 1913} {"train_loss": -12.177656173706055, "global_step": 321402, "epoch": 1913} {"train_loss": -11.782381057739258, "global_step": 321403, "epoch": 1913} {"train_loss": -11.819450378417969, "global_step": 321404, "epoch": 1913} {"train_loss": -12.456869125366211, "global_step": 321405, "epoch": 1913} {"train_loss": -11.536543846130371, "global_step": 321406, "epoch": 1913} {"train_loss": -12.2019624710083, "global_step": 321407, "epoch": 1913} {"train_loss": -11.989343643188477, "global_step": 321408, "epoch": 1913} {"train_loss": -12.306273460388184, "global_step": 321409, "epoch": 1913} {"train_loss": -12.167501449584961, "global_step": 321410, "epoch": 1913} {"train_loss": -12.10898208618164, "global_step": 321411, "epoch": 1913} {"train_loss": -11.677955627441406, "global_step": 321412, "epoch": 1913} {"train_loss": -11.822388648986816, "global_step": 321413, "epoch": 1913} {"train_loss": -12.308175086975098, "global_step": 321414, "epoch": 1913} {"train_loss": -12.184138298034668, "global_step": 321415, "epoch": 1913} {"train_loss": -11.97248649597168, "global_step": 321416, "epoch": 1913} {"train_loss": -12.199392318725586, "global_step": 321417, "epoch": 1913} {"train_loss": -12.01369857788086, "global_step": 321418, "epoch": 1913} {"train_loss": -11.875117301940918, "global_step": 321419, "epoch": 1913} {"train_loss": -11.93368911743164, "global_step": 321420, "epoch": 1913} {"train_loss": -11.193544387817383, "global_step": 321421, "epoch": 1913} {"train_loss": -11.712946891784668, "global_step": 321422, "epoch": 1913} {"train_loss": -11.845817565917969, "global_step": 321423, "epoch": 1913} {"train_loss": -11.370141983032227, "global_step": 321424, "epoch": 1913} {"train_loss": -11.583318710327148, "global_step": 321425, "epoch": 1913} {"train_loss": -11.780752182006836, "global_step": 321426, "epoch": 1913} {"train_loss": -11.875385284423828, "global_step": 321427, "epoch": 1913} {"train_loss": -11.991067886352539, "global_step": 321428, "epoch": 1913} {"train_loss": -11.463174819946289, "global_step": 321429, "epoch": 1913} {"train_loss": -11.663375854492188, "global_step": 321430, "epoch": 1913} {"train_loss": -11.153104782104492, "global_step": 321431, "epoch": 1913} {"train_loss": -11.61149787902832, "global_step": 321432, "epoch": 1913} {"train_loss": -11.671902656555176, "global_step": 321433, "epoch": 1913} {"train_loss": -11.61091136932373, "global_step": 321434, "epoch": 1913} {"train_loss": -11.59326171875, "global_step": 321435, "epoch": 1913} {"train_loss": -11.529708862304688, "global_step": 321436, "epoch": 1913} {"train_loss": -11.322380065917969, "global_step": 321437, "epoch": 1913} {"train_loss": -11.753690719604492, "global_step": 321438, "epoch": 1913} {"train_loss": -12.090155601501465, "global_step": 321439, "epoch": 1913} {"train_loss": -11.730911254882812, "global_step": 321440, "epoch": 1913} {"train_loss": -11.77843189239502, "global_step": 321441, "epoch": 1913} {"train_loss": -11.810140609741211, "global_step": 321442, "epoch": 1913} {"train_loss": -11.646710395812988, "global_step": 321443, "epoch": 1913} {"train_loss": -12.133888244628906, "global_step": 321444, "epoch": 1913} {"train_loss": -11.662164688110352, "global_step": 321445, "epoch": 1913} {"train_loss": -11.785486221313477, "global_step": 321446, "epoch": 1913} {"train_loss": -12.19110107421875, "global_step": 321447, "epoch": 1913} {"train_loss": -11.604129791259766, "global_step": 321448, "epoch": 1913} {"train_loss": -11.930130004882812, "global_step": 321449, "epoch": 1913} {"train_loss": -11.993331909179688, "global_step": 321450, "epoch": 1913} {"train_loss": -11.462851524353027, "global_step": 321451, "epoch": 1913} {"train_loss": -11.570836067199707, "global_step": 321452, "epoch": 1913} {"train_loss": -11.755624771118164, "global_step": 321453, "epoch": 1913} {"train_loss": -11.176520347595215, "global_step": 321454, "epoch": 1913} {"train_loss": -11.478517532348633, "global_step": 321455, "epoch": 1913} {"train_loss": -11.194796562194824, "global_step": 321456, "epoch": 1913} {"train_loss": -11.591439247131348, "global_step": 321457, "epoch": 1913} {"train_loss": -11.119483947753906, "global_step": 321458, "epoch": 1913} {"train_loss": -11.177123069763184, "global_step": 321459, "epoch": 1913} {"train_loss": -11.565945625305176, "global_step": 321460, "epoch": 1913} {"train_loss": -11.27706241607666, "global_step": 321461, "epoch": 1913} {"train_loss": -11.91292953491211, "global_step": 321462, "epoch": 1913} {"train_loss": -11.917637825012207, "global_step": 321463, "epoch": 1913} {"train_loss": -11.891315460205078, "global_step": 321464, "epoch": 1913} {"train_loss": -11.801885604858398, "global_step": 321465, "epoch": 1913} {"train_loss": -11.959907531738281, "global_step": 321466, "epoch": 1913} {"train_loss": -12.079578399658203, "global_step": 321467, "epoch": 1913} {"train_loss": -11.854167938232422, "global_step": 321468, "epoch": 1913} {"train_loss": -12.061485290527344, "global_step": 321469, "epoch": 1913} {"train_loss": -11.900336265563965, "global_step": 321470, "epoch": 1913} {"train_loss": -12.113882064819336, "global_step": 321471, "epoch": 1913} {"train_loss": -11.837251663208008, "global_step": 321472, "epoch": 1913} {"train_loss": -12.13901424407959, "global_step": 321473, "epoch": 1913} {"train_loss": -11.711719512939453, "global_step": 321474, "epoch": 1913} {"train_loss": -12.132515907287598, "global_step": 321475, "epoch": 1913} {"train_loss": -11.672669410705566, "global_step": 321476, "epoch": 1913} {"train_loss": -11.769508361816406, "global_step": 321477, "epoch": 1913} {"train_loss": -11.569317817687988, "global_step": 321478, "epoch": 1913} {"train_loss": -11.394975662231445, "global_step": 321479, "epoch": 1913} {"train_loss": -11.905150413513184, "global_step": 321480, "epoch": 1913} {"train_loss": -11.870931625366211, "global_step": 321481, "epoch": 1913} {"train_loss": -11.995877265930176, "global_step": 321482, "epoch": 1913} {"train_loss": -11.930122375488281, "global_step": 321483, "epoch": 1913} {"train_loss": -11.515104293823242, "global_step": 321484, "epoch": 1913} {"train_loss": -12.2422513961792, "global_step": 321485, "epoch": 1913} {"train_loss": -11.830483436584473, "global_step": 321486, "epoch": 1913} {"train_loss": -11.992589950561523, "global_step": 321487, "epoch": 1913} {"train_loss": -11.791742324829102, "global_step": 321488, "epoch": 1913} {"train_loss": -11.856474876403809, "global_step": 321489, "epoch": 1913} {"train_loss": -11.830489158630371, "global_step": 321490, "epoch": 1913} {"train_loss": -11.806397438049316, "global_step": 321491, "epoch": 1913} {"train_loss": -12.266803741455078, "global_step": 321492, "epoch": 1913} {"train_loss": -11.281502723693848, "global_step": 321493, "epoch": 1913} {"train_loss": -12.008712768554688, "global_step": 321494, "epoch": 1913} {"train_loss": -11.878954887390137, "global_step": 321495, "epoch": 1913} {"train_loss": -12.297845840454102, "global_step": 321496, "epoch": 1913} {"train_loss": -11.996539115905762, "global_step": 321497, "epoch": 1913} {"train_loss": -12.002036094665527, "global_step": 321498, "epoch": 1913} {"train_loss": -12.235198974609375, "global_step": 321499, "epoch": 1913} {"train_loss": -11.818891525268555, "global_step": 321500, "epoch": 1913} {"train_loss": -11.990501403808594, "global_step": 321501, "epoch": 1913} {"train_loss": -12.094721794128418, "global_step": 321502, "epoch": 1913} {"train_loss": -11.77612018585205, "global_step": 321503, "epoch": 1913} {"train_loss": -12.06013298034668, "global_step": 321504, "epoch": 1913} {"train_loss": -11.87696647644043, "global_step": 321505, "epoch": 1913} {"train_loss": -11.342886924743652, "global_step": 321506, "epoch": 1913} {"train_loss": -12.213425636291504, "global_step": 321507, "epoch": 1913} {"train_loss": -11.394490242004395, "global_step": 321508, "epoch": 1913} {"train_loss": -12.169782638549805, "global_step": 321509, "epoch": 1913} {"train_loss": -12.076242446899414, "global_step": 321510, "epoch": 1913} {"train_loss": -11.870738983154297, "global_step": 321511, "epoch": 1913} {"train_loss": -11.75108814239502, "global_step": 321512, "epoch": 1913} {"train_loss": -11.767885208129883, "global_step": 321513, "epoch": 1913} {"train_loss": -11.781312942504883, "global_step": 321514, "epoch": 1913} {"train_loss": -11.997392654418945, "global_step": 321515, "epoch": 1913} {"train_loss": -11.663965225219727, "global_step": 321516, "epoch": 1913} {"train_loss": -11.95327091217041, "global_step": 321517, "epoch": 1913} {"train_loss": -12.215141296386719, "global_step": 321518, "epoch": 1913} {"train_loss": -11.991634368896484, "global_step": 321519, "epoch": 1913} {"train_loss": -12.61977481842041, "global_step": 321520, "epoch": 1913} {"train_loss": -11.991683006286621, "global_step": 321521, "epoch": 1913} {"train_loss": -12.26401138305664, "global_step": 321522, "epoch": 1913} {"train_loss": -12.060721397399902, "global_step": 321523, "epoch": 1913} {"train_loss": -12.234834671020508, "global_step": 321524, "epoch": 1913} {"train_loss": -12.309249877929688, "global_step": 321525, "epoch": 1913} {"train_loss": -12.229069709777832, "global_step": 321526, "epoch": 1913} {"train_loss": -12.395389556884766, "global_step": 321527, "epoch": 1913} {"train_loss": -12.31967544555664, "global_step": 321528, "epoch": 1913} {"train_loss": -12.371278762817383, "global_step": 321529, "epoch": 1913} {"train_loss": -12.565424919128418, "global_step": 321530, "epoch": 1913} {"train_loss": -12.360275268554688, "global_step": 321531, "epoch": 1913} {"train_loss": -12.3885498046875, "global_step": 321532, "epoch": 1913} {"train_loss": -12.370378494262695, "global_step": 321533, "epoch": 1913} {"train_loss": -12.196062088012695, "global_step": 321534, "epoch": 1913} {"train_loss": -12.392038345336914, "global_step": 321535, "epoch": 1913} {"train_loss": -12.409465789794922, "global_step": 321536, "epoch": 1913} {"train_loss": -12.206831932067871, "global_step": 321537, "epoch": 1913} {"train_loss": -12.490279197692871, "global_step": 321538, "epoch": 1913} {"train_loss": -12.408449172973633, "global_step": 321539, "epoch": 1913} {"train_loss": -12.0458345413208, "global_step": 321540, "epoch": 1913} {"train_loss": -12.187284469604492, "global_step": 321541, "epoch": 1913} {"train_loss": -12.168537139892578, "global_step": 321542, "epoch": 1913} {"train_loss": -12.425057411193848, "global_step": 321543, "epoch": 1913} {"train_loss": -12.430843353271484, "global_step": 321544, "epoch": 1913} {"train_loss": -12.354456901550293, "global_step": 321545, "epoch": 1913} {"train_loss": -12.26999282836914, "global_step": 321546, "epoch": 1913} {"train_loss": -12.519949913024902, "global_step": 321547, "epoch": 1913} {"train_loss": -12.006478309631348, "global_step": 321548, "epoch": 1913} {"train_loss": -12.333856582641602, "global_step": 321549, "epoch": 1913} {"train_loss": -12.465826988220215, "global_step": 321550, "epoch": 1913} {"train_loss": -11.92588092031933, "global_step": 321551, "epoch": 1913, "val_loss": 286219.21875} {"train_loss": -11.97568130493164, "global_step": 321552, "epoch": 1914} {"train_loss": -12.545448303222656, "global_step": 321553, "epoch": 1914} {"train_loss": -12.231508255004883, "global_step": 321554, "epoch": 1914} {"train_loss": -11.952288627624512, "global_step": 321555, "epoch": 1914} {"train_loss": -12.512134552001953, "global_step": 321556, "epoch": 1914} {"train_loss": -11.833720207214355, "global_step": 321557, "epoch": 1914} {"train_loss": -11.969489097595215, "global_step": 321558, "epoch": 1914} {"train_loss": -12.029485702514648, "global_step": 321559, "epoch": 1914} {"train_loss": -12.450601577758789, "global_step": 321560, "epoch": 1914} {"train_loss": -12.316873550415039, "global_step": 321561, "epoch": 1914} {"train_loss": -12.388822555541992, "global_step": 321562, "epoch": 1914} {"train_loss": -12.350028038024902, "global_step": 321563, "epoch": 1914} {"train_loss": -12.499662399291992, "global_step": 321564, "epoch": 1914} {"train_loss": -12.23029613494873, "global_step": 321565, "epoch": 1914} {"train_loss": -12.064306259155273, "global_step": 321566, "epoch": 1914} {"train_loss": -12.533697128295898, "global_step": 321567, "epoch": 1914} {"train_loss": -12.326055526733398, "global_step": 321568, "epoch": 1914} {"train_loss": -12.372754096984863, "global_step": 321569, "epoch": 1914} {"train_loss": -11.851160049438477, "global_step": 321570, "epoch": 1914} {"train_loss": -12.260345458984375, "global_step": 321571, "epoch": 1914} {"train_loss": -12.342843055725098, "global_step": 321572, "epoch": 1914} {"train_loss": -12.110845565795898, "global_step": 321573, "epoch": 1914} {"train_loss": -12.079607009887695, "global_step": 321574, "epoch": 1914} {"train_loss": -12.048408508300781, "global_step": 321575, "epoch": 1914} {"train_loss": -12.304258346557617, "global_step": 321576, "epoch": 1914} {"train_loss": -11.704130172729492, "global_step": 321577, "epoch": 1914} {"train_loss": -12.189811706542969, "global_step": 321578, "epoch": 1914} {"train_loss": -11.932746887207031, "global_step": 321579, "epoch": 1914} {"train_loss": -11.98648452758789, "global_step": 321580, "epoch": 1914} {"train_loss": -10.296869277954102, "global_step": 321581, "epoch": 1914} {"train_loss": -11.819928169250488, "global_step": 321582, "epoch": 1914} {"train_loss": -10.883044242858887, "global_step": 321583, "epoch": 1914} {"train_loss": -11.077960014343262, "global_step": 321584, "epoch": 1914} {"train_loss": -12.483556747436523, "global_step": 321585, "epoch": 1914} {"train_loss": -11.39525032043457, "global_step": 321586, "epoch": 1914} {"train_loss": -11.7153902053833, "global_step": 321587, "epoch": 1914} {"train_loss": -11.957473754882812, "global_step": 321588, "epoch": 1914} {"train_loss": -9.84868049621582, "global_step": 321589, "epoch": 1914} {"train_loss": -11.727243423461914, "global_step": 321590, "epoch": 1914} {"train_loss": -12.020013809204102, "global_step": 321591, "epoch": 1914} {"train_loss": -10.693159103393555, "global_step": 321592, "epoch": 1914} {"train_loss": -11.840738296508789, "global_step": 321593, "epoch": 1914} {"train_loss": -11.641939163208008, "global_step": 321594, "epoch": 1914} {"train_loss": -9.521859169006348, "global_step": 321595, "epoch": 1914} {"train_loss": -12.175701141357422, "global_step": 321596, "epoch": 1914} {"train_loss": -10.961936950683594, "global_step": 321597, "epoch": 1914} {"train_loss": -11.162490844726562, "global_step": 321598, "epoch": 1914} {"train_loss": -11.229267120361328, "global_step": 321599, "epoch": 1914} {"train_loss": -9.672306060791016, "global_step": 321600, "epoch": 1914} {"train_loss": -11.659910202026367, "global_step": 321601, "epoch": 1914} {"train_loss": -9.381851196289062, "global_step": 321602, "epoch": 1914} {"train_loss": -8.815067291259766, "global_step": 321603, "epoch": 1914} {"train_loss": -9.185261726379395, "global_step": 321604, "epoch": 1914} {"train_loss": -8.778753280639648, "global_step": 321605, "epoch": 1914} {"train_loss": -11.151920318603516, "global_step": 321606, "epoch": 1914} {"train_loss": -9.350908279418945, "global_step": 321607, "epoch": 1914} {"train_loss": -11.086475372314453, "global_step": 321608, "epoch": 1914} {"train_loss": -10.565696716308594, "global_step": 321609, "epoch": 1914} {"train_loss": -10.72175407409668, "global_step": 321610, "epoch": 1914} {"train_loss": -11.133331298828125, "global_step": 321611, "epoch": 1914} {"train_loss": -11.419184684753418, "global_step": 321612, "epoch": 1914} {"train_loss": -10.98454475402832, "global_step": 321613, "epoch": 1914} {"train_loss": -11.129049301147461, "global_step": 321614, "epoch": 1914} {"train_loss": -10.577762603759766, "global_step": 321615, "epoch": 1914} {"train_loss": -11.342758178710938, "global_step": 321616, "epoch": 1914} {"train_loss": -10.76357650756836, "global_step": 321617, "epoch": 1914} {"train_loss": -11.525542259216309, "global_step": 321618, "epoch": 1914} {"train_loss": -11.767261505126953, "global_step": 321619, "epoch": 1914} {"train_loss": -11.165872573852539, "global_step": 321620, "epoch": 1914} {"train_loss": -11.759237289428711, "global_step": 321621, "epoch": 1914} {"train_loss": -11.818796157836914, "global_step": 321622, "epoch": 1914} {"train_loss": -10.97805404663086, "global_step": 321623, "epoch": 1914} {"train_loss": -11.518014907836914, "global_step": 321624, "epoch": 1914} {"train_loss": -11.56387996673584, "global_step": 321625, "epoch": 1914} {"train_loss": -11.386381149291992, "global_step": 321626, "epoch": 1914} {"train_loss": -11.972307205200195, "global_step": 321627, "epoch": 1914} {"train_loss": -11.194199562072754, "global_step": 321628, "epoch": 1914} {"train_loss": -11.909354209899902, "global_step": 321629, "epoch": 1914} {"train_loss": -11.471817016601562, "global_step": 321630, "epoch": 1914} {"train_loss": -11.088623046875, "global_step": 321631, "epoch": 1914} {"train_loss": -11.238359451293945, "global_step": 321632, "epoch": 1914} {"train_loss": -11.447076797485352, "global_step": 321633, "epoch": 1914} {"train_loss": -11.138516426086426, "global_step": 321634, "epoch": 1914} {"train_loss": -11.445450782775879, "global_step": 321635, "epoch": 1914} {"train_loss": -11.262144088745117, "global_step": 321636, "epoch": 1914} {"train_loss": -11.646462440490723, "global_step": 321637, "epoch": 1914} {"train_loss": -11.542052268981934, "global_step": 321638, "epoch": 1914} {"train_loss": -11.479957580566406, "global_step": 321639, "epoch": 1914} {"train_loss": -11.609580039978027, "global_step": 321640, "epoch": 1914} {"train_loss": -11.439847946166992, "global_step": 321641, "epoch": 1914} {"train_loss": -12.030399322509766, "global_step": 321642, "epoch": 1914} {"train_loss": -11.63872241973877, "global_step": 321643, "epoch": 1914} {"train_loss": -11.863725662231445, "global_step": 321644, "epoch": 1914} {"train_loss": -11.77159595489502, "global_step": 321645, "epoch": 1914} {"train_loss": -11.829435348510742, "global_step": 321646, "epoch": 1914} {"train_loss": -11.365375518798828, "global_step": 321647, "epoch": 1914} {"train_loss": -11.909624099731445, "global_step": 321648, "epoch": 1914} {"train_loss": -11.522537231445312, "global_step": 321649, "epoch": 1914} {"train_loss": -12.187180519104004, "global_step": 321650, "epoch": 1914} {"train_loss": -11.899271011352539, "global_step": 321651, "epoch": 1914} {"train_loss": -11.735982894897461, "global_step": 321652, "epoch": 1914} {"train_loss": -12.17873764038086, "global_step": 321653, "epoch": 1914} {"train_loss": -11.951889991760254, "global_step": 321654, "epoch": 1914} {"train_loss": -11.932130813598633, "global_step": 321655, "epoch": 1914} {"train_loss": -12.220771789550781, "global_step": 321656, "epoch": 1914} {"train_loss": -11.977005004882812, "global_step": 321657, "epoch": 1914} {"train_loss": -11.95297622680664, "global_step": 321658, "epoch": 1914} {"train_loss": -12.111305236816406, "global_step": 321659, "epoch": 1914} {"train_loss": -11.699833869934082, "global_step": 321660, "epoch": 1914} {"train_loss": -12.195337295532227, "global_step": 321661, "epoch": 1914} {"train_loss": -12.28543472290039, "global_step": 321662, "epoch": 1914} {"train_loss": -11.930922508239746, "global_step": 321663, "epoch": 1914} {"train_loss": -12.207630157470703, "global_step": 321664, "epoch": 1914} {"train_loss": -12.021005630493164, "global_step": 321665, "epoch": 1914} {"train_loss": -12.298766136169434, "global_step": 321666, "epoch": 1914} {"train_loss": -12.2755126953125, "global_step": 321667, "epoch": 1914} {"train_loss": -12.136773109436035, "global_step": 321668, "epoch": 1914} {"train_loss": -12.246406555175781, "global_step": 321669, "epoch": 1914} {"train_loss": -12.099431991577148, "global_step": 321670, "epoch": 1914} {"train_loss": -12.157766342163086, "global_step": 321671, "epoch": 1914} {"train_loss": -12.411405563354492, "global_step": 321672, "epoch": 1914} {"train_loss": -12.291971206665039, "global_step": 321673, "epoch": 1914} {"train_loss": -12.09012508392334, "global_step": 321674, "epoch": 1914} {"train_loss": -12.186502456665039, "global_step": 321675, "epoch": 1914} {"train_loss": -12.154979705810547, "global_step": 321676, "epoch": 1914} {"train_loss": -12.250280380249023, "global_step": 321677, "epoch": 1914} {"train_loss": -12.332823753356934, "global_step": 321678, "epoch": 1914} {"train_loss": -12.254744529724121, "global_step": 321679, "epoch": 1914} {"train_loss": -12.287946701049805, "global_step": 321680, "epoch": 1914} {"train_loss": -12.168477058410645, "global_step": 321681, "epoch": 1914} {"train_loss": -12.438542366027832, "global_step": 321682, "epoch": 1914} {"train_loss": -12.439661979675293, "global_step": 321683, "epoch": 1914} {"train_loss": -12.462346076965332, "global_step": 321684, "epoch": 1914} {"train_loss": -12.251014709472656, "global_step": 321685, "epoch": 1914} {"train_loss": -12.569252014160156, "global_step": 321686, "epoch": 1914} {"train_loss": -12.458789825439453, "global_step": 321687, "epoch": 1914} {"train_loss": -12.59286880493164, "global_step": 321688, "epoch": 1914} {"train_loss": -12.35783863067627, "global_step": 321689, "epoch": 1914} {"train_loss": -12.510787963867188, "global_step": 321690, "epoch": 1914} {"train_loss": -12.485877990722656, "global_step": 321691, "epoch": 1914} {"train_loss": -12.405763626098633, "global_step": 321692, "epoch": 1914} {"train_loss": -12.459358215332031, "global_step": 321693, "epoch": 1914} {"train_loss": -12.35296630859375, "global_step": 321694, "epoch": 1914} {"train_loss": -12.415814399719238, "global_step": 321695, "epoch": 1914} {"train_loss": -12.487628936767578, "global_step": 321696, "epoch": 1914} {"train_loss": -12.577764511108398, "global_step": 321697, "epoch": 1914} {"train_loss": -12.216431617736816, "global_step": 321698, "epoch": 1914} {"train_loss": -12.127689361572266, "global_step": 321699, "epoch": 1914} {"train_loss": -12.507387161254883, "global_step": 321700, "epoch": 1914} {"train_loss": -12.147977828979492, "global_step": 321701, "epoch": 1914} {"train_loss": -12.15571403503418, "global_step": 321702, "epoch": 1914} {"train_loss": -11.959283828735352, "global_step": 321703, "epoch": 1914} {"train_loss": -11.900397300720215, "global_step": 321704, "epoch": 1914} {"train_loss": -12.195822715759277, "global_step": 321705, "epoch": 1914} {"train_loss": -11.322752952575684, "global_step": 321706, "epoch": 1914} {"train_loss": -11.184527397155762, "global_step": 321707, "epoch": 1914} {"train_loss": -11.366547584533691, "global_step": 321708, "epoch": 1914} {"train_loss": -12.08700180053711, "global_step": 321709, "epoch": 1914} {"train_loss": -11.46745491027832, "global_step": 321710, "epoch": 1914} {"train_loss": -11.643627166748047, "global_step": 321711, "epoch": 1914} {"train_loss": -11.282865524291992, "global_step": 321712, "epoch": 1914} {"train_loss": -10.763461112976074, "global_step": 321713, "epoch": 1914} {"train_loss": -12.01756477355957, "global_step": 321714, "epoch": 1914} {"train_loss": -11.797456741333008, "global_step": 321715, "epoch": 1914} {"train_loss": -10.910550117492676, "global_step": 321716, "epoch": 1914} {"train_loss": -11.434863090515137, "global_step": 321717, "epoch": 1914} {"train_loss": -11.655573844909668, "global_step": 321718, "epoch": 1914} {"train_loss": -11.724652806917826, "global_step": 321719, "epoch": 1914, "val_loss": 282178.3125} {"train_loss": -9.864107131958008, "global_step": 321720, "epoch": 1915} {"train_loss": -11.926094055175781, "global_step": 321721, "epoch": 1915} {"train_loss": -10.929244995117188, "global_step": 321722, "epoch": 1915} {"train_loss": -12.03152084350586, "global_step": 321723, "epoch": 1915} {"train_loss": -11.80688762664795, "global_step": 321724, "epoch": 1915} {"train_loss": -11.269298553466797, "global_step": 321725, "epoch": 1915} {"train_loss": -11.56564712524414, "global_step": 321726, "epoch": 1915} {"train_loss": -12.047950744628906, "global_step": 321727, "epoch": 1915} {"train_loss": -11.67477798461914, "global_step": 321728, "epoch": 1915} {"train_loss": -11.370363235473633, "global_step": 321729, "epoch": 1915} {"train_loss": -12.073955535888672, "global_step": 321730, "epoch": 1915} {"train_loss": -11.46961784362793, "global_step": 321731, "epoch": 1915} {"train_loss": -11.773951530456543, "global_step": 321732, "epoch": 1915} {"train_loss": -11.973238945007324, "global_step": 321733, "epoch": 1915} {"train_loss": -11.468009948730469, "global_step": 321734, "epoch": 1915} {"train_loss": -11.504030227661133, "global_step": 321735, "epoch": 1915} {"train_loss": -11.622906684875488, "global_step": 321736, "epoch": 1915} {"train_loss": -12.057624816894531, "global_step": 321737, "epoch": 1915} {"train_loss": -11.68523120880127, "global_step": 321738, "epoch": 1915} {"train_loss": -11.925575256347656, "global_step": 321739, "epoch": 1915} {"train_loss": -12.008739471435547, "global_step": 321740, "epoch": 1915} {"train_loss": -11.752838134765625, "global_step": 321741, "epoch": 1915} {"train_loss": -12.128752708435059, "global_step": 321742, "epoch": 1915} {"train_loss": -11.469560623168945, "global_step": 321743, "epoch": 1915} {"train_loss": -12.200225830078125, "global_step": 321744, "epoch": 1915} {"train_loss": -11.644399642944336, "global_step": 321745, "epoch": 1915} {"train_loss": -11.920753479003906, "global_step": 321746, "epoch": 1915} {"train_loss": -12.342281341552734, "global_step": 321747, "epoch": 1915} {"train_loss": -11.832306861877441, "global_step": 321748, "epoch": 1915} {"train_loss": -11.897062301635742, "global_step": 321749, "epoch": 1915} {"train_loss": -11.734801292419434, "global_step": 321750, "epoch": 1915} {"train_loss": -11.981796264648438, "global_step": 321751, "epoch": 1915} {"train_loss": -11.892326354980469, "global_step": 321752, "epoch": 1915} {"train_loss": -12.189164161682129, "global_step": 321753, "epoch": 1915} {"train_loss": -11.817949295043945, "global_step": 321754, "epoch": 1915} {"train_loss": -11.63055419921875, "global_step": 321755, "epoch": 1915} {"train_loss": -11.709842681884766, "global_step": 321756, "epoch": 1915} {"train_loss": -11.71904182434082, "global_step": 321757, "epoch": 1915} {"train_loss": -11.416611671447754, "global_step": 321758, "epoch": 1915} {"train_loss": -11.671770095825195, "global_step": 321759, "epoch": 1915} {"train_loss": -10.694721221923828, "global_step": 321760, "epoch": 1915} {"train_loss": -11.072347640991211, "global_step": 321761, "epoch": 1915} {"train_loss": -11.242252349853516, "global_step": 321762, "epoch": 1915} {"train_loss": -11.414655685424805, "global_step": 321763, "epoch": 1915} {"train_loss": -11.457109451293945, "global_step": 321764, "epoch": 1915} {"train_loss": -11.26651382446289, "global_step": 321765, "epoch": 1915} {"train_loss": -11.460607528686523, "global_step": 321766, "epoch": 1915} {"train_loss": -11.44015121459961, "global_step": 321767, "epoch": 1915} {"train_loss": -11.084371566772461, "global_step": 321768, "epoch": 1915} {"train_loss": -11.498540878295898, "global_step": 321769, "epoch": 1915} {"train_loss": -10.558884620666504, "global_step": 321770, "epoch": 1915} {"train_loss": -12.115530014038086, "global_step": 321771, "epoch": 1915} {"train_loss": -11.372044563293457, "global_step": 321772, "epoch": 1915} {"train_loss": -11.812432289123535, "global_step": 321773, "epoch": 1915} {"train_loss": -11.914765357971191, "global_step": 321774, "epoch": 1915} {"train_loss": -11.966535568237305, "global_step": 321775, "epoch": 1915} {"train_loss": -12.071735382080078, "global_step": 321776, "epoch": 1915} {"train_loss": -11.900016784667969, "global_step": 321777, "epoch": 1915} {"train_loss": -11.986461639404297, "global_step": 321778, "epoch": 1915} {"train_loss": -12.12531852722168, "global_step": 321779, "epoch": 1915} {"train_loss": -11.997725486755371, "global_step": 321780, "epoch": 1915} {"train_loss": -11.96004581451416, "global_step": 321781, "epoch": 1915} {"train_loss": -11.360925674438477, "global_step": 321782, "epoch": 1915} {"train_loss": -12.132383346557617, "global_step": 321783, "epoch": 1915} {"train_loss": -11.451347351074219, "global_step": 321784, "epoch": 1915} {"train_loss": -11.53543472290039, "global_step": 321785, "epoch": 1915} {"train_loss": -11.576251983642578, "global_step": 321786, "epoch": 1915} {"train_loss": -10.818998336791992, "global_step": 321787, "epoch": 1915} {"train_loss": -11.780670166015625, "global_step": 321788, "epoch": 1915} {"train_loss": -11.219820976257324, "global_step": 321789, "epoch": 1915} {"train_loss": -10.926643371582031, "global_step": 321790, "epoch": 1915} {"train_loss": -11.450132369995117, "global_step": 321791, "epoch": 1915} {"train_loss": -11.223808288574219, "global_step": 321792, "epoch": 1915} {"train_loss": -11.307666778564453, "global_step": 321793, "epoch": 1915} {"train_loss": -10.48866081237793, "global_step": 321794, "epoch": 1915} {"train_loss": -11.140727043151855, "global_step": 321795, "epoch": 1915} {"train_loss": -10.880865097045898, "global_step": 321796, "epoch": 1915} {"train_loss": -11.787839889526367, "global_step": 321797, "epoch": 1915} {"train_loss": -11.399761199951172, "global_step": 321798, "epoch": 1915} {"train_loss": -12.008102416992188, "global_step": 321799, "epoch": 1915} {"train_loss": -11.704851150512695, "global_step": 321800, "epoch": 1915} {"train_loss": -11.952367782592773, "global_step": 321801, "epoch": 1915} {"train_loss": -12.001812934875488, "global_step": 321802, "epoch": 1915} {"train_loss": -11.290634155273438, "global_step": 321803, "epoch": 1915} {"train_loss": -11.93092155456543, "global_step": 321804, "epoch": 1915} {"train_loss": -11.559504508972168, "global_step": 321805, "epoch": 1915} {"train_loss": -11.490994453430176, "global_step": 321806, "epoch": 1915} {"train_loss": -11.686357498168945, "global_step": 321807, "epoch": 1915} {"train_loss": -11.54830551147461, "global_step": 321808, "epoch": 1915} {"train_loss": -11.741348266601562, "global_step": 321809, "epoch": 1915} {"train_loss": -12.066518783569336, "global_step": 321810, "epoch": 1915} {"train_loss": -11.805487632751465, "global_step": 321811, "epoch": 1915} {"train_loss": -12.053348541259766, "global_step": 321812, "epoch": 1915} {"train_loss": -11.98098373413086, "global_step": 321813, "epoch": 1915} {"train_loss": -11.997638702392578, "global_step": 321814, "epoch": 1915} {"train_loss": -12.228772163391113, "global_step": 321815, "epoch": 1915} {"train_loss": -12.206809997558594, "global_step": 321816, "epoch": 1915} {"train_loss": -11.734079360961914, "global_step": 321817, "epoch": 1915} {"train_loss": -12.070926666259766, "global_step": 321818, "epoch": 1915} {"train_loss": -12.124650955200195, "global_step": 321819, "epoch": 1915} {"train_loss": -11.92495346069336, "global_step": 321820, "epoch": 1915} {"train_loss": -12.125741004943848, "global_step": 321821, "epoch": 1915} {"train_loss": -12.057942390441895, "global_step": 321822, "epoch": 1915} {"train_loss": -11.573253631591797, "global_step": 321823, "epoch": 1915} {"train_loss": -12.097670555114746, "global_step": 321824, "epoch": 1915} {"train_loss": -12.005136489868164, "global_step": 321825, "epoch": 1915} {"train_loss": -12.044361114501953, "global_step": 321826, "epoch": 1915} {"train_loss": -12.113183975219727, "global_step": 321827, "epoch": 1915} {"train_loss": -12.269952774047852, "global_step": 321828, "epoch": 1915} {"train_loss": -12.247041702270508, "global_step": 321829, "epoch": 1915} {"train_loss": -12.006000518798828, "global_step": 321830, "epoch": 1915} {"train_loss": -12.321243286132812, "global_step": 321831, "epoch": 1915} {"train_loss": -12.218167304992676, "global_step": 321832, "epoch": 1915} {"train_loss": -12.230241775512695, "global_step": 321833, "epoch": 1915} {"train_loss": -12.477296829223633, "global_step": 321834, "epoch": 1915} {"train_loss": -12.148237228393555, "global_step": 321835, "epoch": 1915} {"train_loss": -12.389567375183105, "global_step": 321836, "epoch": 1915} {"train_loss": -12.2857666015625, "global_step": 321837, "epoch": 1915} {"train_loss": -12.317171096801758, "global_step": 321838, "epoch": 1915} {"train_loss": -12.453533172607422, "global_step": 321839, "epoch": 1915} {"train_loss": -12.417411804199219, "global_step": 321840, "epoch": 1915} {"train_loss": -12.342608451843262, "global_step": 321841, "epoch": 1915} {"train_loss": -12.476335525512695, "global_step": 321842, "epoch": 1915} {"train_loss": -12.276918411254883, "global_step": 321843, "epoch": 1915} {"train_loss": -12.281022071838379, "global_step": 321844, "epoch": 1915} {"train_loss": -12.476234436035156, "global_step": 321845, "epoch": 1915} {"train_loss": -12.370936393737793, "global_step": 321846, "epoch": 1915} {"train_loss": -12.62812614440918, "global_step": 321847, "epoch": 1915} {"train_loss": -12.385198593139648, "global_step": 321848, "epoch": 1915} {"train_loss": -12.316085815429688, "global_step": 321849, "epoch": 1915} {"train_loss": -12.340787887573242, "global_step": 321850, "epoch": 1915} {"train_loss": -12.505943298339844, "global_step": 321851, "epoch": 1915} {"train_loss": -11.960930824279785, "global_step": 321852, "epoch": 1915} {"train_loss": -12.416351318359375, "global_step": 321853, "epoch": 1915} {"train_loss": -12.107187271118164, "global_step": 321854, "epoch": 1915} {"train_loss": -12.080757141113281, "global_step": 321855, "epoch": 1915} {"train_loss": -12.584014892578125, "global_step": 321856, "epoch": 1915} {"train_loss": -11.742667198181152, "global_step": 321857, "epoch": 1915} {"train_loss": -12.387205123901367, "global_step": 321858, "epoch": 1915} {"train_loss": -12.436673164367676, "global_step": 321859, "epoch": 1915} {"train_loss": -12.331465721130371, "global_step": 321860, "epoch": 1915} {"train_loss": -12.484418869018555, "global_step": 321861, "epoch": 1915} {"train_loss": -12.505083084106445, "global_step": 321862, "epoch": 1915} {"train_loss": -11.850526809692383, "global_step": 321863, "epoch": 1915} {"train_loss": -12.173917770385742, "global_step": 321864, "epoch": 1915} {"train_loss": -12.360801696777344, "global_step": 321865, "epoch": 1915} {"train_loss": -12.493722915649414, "global_step": 321866, "epoch": 1915} {"train_loss": -12.124868392944336, "global_step": 321867, "epoch": 1915} {"train_loss": -12.509550094604492, "global_step": 321868, "epoch": 1915} {"train_loss": -12.462095260620117, "global_step": 321869, "epoch": 1915} {"train_loss": -12.370440483093262, "global_step": 321870, "epoch": 1915} {"train_loss": -12.277063369750977, "global_step": 321871, "epoch": 1915} {"train_loss": -12.148921966552734, "global_step": 321872, "epoch": 1915} {"train_loss": -12.501888275146484, "global_step": 321873, "epoch": 1915} {"train_loss": -12.423051834106445, "global_step": 321874, "epoch": 1915} {"train_loss": -12.031478881835938, "global_step": 321875, "epoch": 1915} {"train_loss": -12.288589477539062, "global_step": 321876, "epoch": 1915} {"train_loss": -12.459239959716797, "global_step": 321877, "epoch": 1915} {"train_loss": -12.320374488830566, "global_step": 321878, "epoch": 1915} {"train_loss": -12.018513679504395, "global_step": 321879, "epoch": 1915} {"train_loss": -12.14123249053955, "global_step": 321880, "epoch": 1915} {"train_loss": -12.518129348754883, "global_step": 321881, "epoch": 1915} {"train_loss": -12.061103820800781, "global_step": 321882, "epoch": 1915} {"train_loss": -12.321952819824219, "global_step": 321883, "epoch": 1915} {"train_loss": -12.021581649780273, "global_step": 321884, "epoch": 1915} {"train_loss": -12.61275863647461, "global_step": 321885, "epoch": 1915} {"train_loss": -12.407940864562988, "global_step": 321886, "epoch": 1915} {"train_loss": -11.900845993132819, "global_step": 321887, "epoch": 1915, "val_loss": 283377.125, "train_action_mse_error": 4.832493782043457} {"train_loss": -12.306167602539062, "global_step": 321888, "epoch": 1916} {"train_loss": -12.075339317321777, "global_step": 321889, "epoch": 1916} {"train_loss": -11.907413482666016, "global_step": 321890, "epoch": 1916} {"train_loss": -11.073419570922852, "global_step": 321891, "epoch": 1916} {"train_loss": -11.220276832580566, "global_step": 321892, "epoch": 1916} {"train_loss": -11.230524063110352, "global_step": 321893, "epoch": 1916} {"train_loss": -8.889787673950195, "global_step": 321894, "epoch": 1916} {"train_loss": -10.221319198608398, "global_step": 321895, "epoch": 1916} {"train_loss": -7.465672492980957, "global_step": 321896, "epoch": 1916} {"train_loss": -10.973044395446777, "global_step": 321897, "epoch": 1916} {"train_loss": -9.825491905212402, "global_step": 321898, "epoch": 1916} {"train_loss": -10.844924926757812, "global_step": 321899, "epoch": 1916} {"train_loss": -11.066255569458008, "global_step": 321900, "epoch": 1916} {"train_loss": -11.217606544494629, "global_step": 321901, "epoch": 1916} {"train_loss": -10.233625411987305, "global_step": 321902, "epoch": 1916} {"train_loss": -10.629103660583496, "global_step": 321903, "epoch": 1916} {"train_loss": -9.005598068237305, "global_step": 321904, "epoch": 1916} {"train_loss": -9.679153442382812, "global_step": 321905, "epoch": 1916} {"train_loss": -8.725896835327148, "global_step": 321906, "epoch": 1916} {"train_loss": -9.379179000854492, "global_step": 321907, "epoch": 1916} {"train_loss": -9.752411842346191, "global_step": 321908, "epoch": 1916} {"train_loss": -10.887779235839844, "global_step": 321909, "epoch": 1916} {"train_loss": -9.371582984924316, "global_step": 321910, "epoch": 1916} {"train_loss": -11.396970748901367, "global_step": 321911, "epoch": 1916} {"train_loss": -10.768383026123047, "global_step": 321912, "epoch": 1916} {"train_loss": -10.94699478149414, "global_step": 321913, "epoch": 1916} {"train_loss": -11.15878677368164, "global_step": 321914, "epoch": 1916} {"train_loss": -11.402116775512695, "global_step": 321915, "epoch": 1916} {"train_loss": -10.846443176269531, "global_step": 321916, "epoch": 1916} {"train_loss": -11.485250473022461, "global_step": 321917, "epoch": 1916} {"train_loss": -11.09095573425293, "global_step": 321918, "epoch": 1916} {"train_loss": -11.45184326171875, "global_step": 321919, "epoch": 1916} {"train_loss": -11.408466339111328, "global_step": 321920, "epoch": 1916} {"train_loss": -11.234855651855469, "global_step": 321921, "epoch": 1916} {"train_loss": -11.72696304321289, "global_step": 321922, "epoch": 1916} {"train_loss": -11.282621383666992, "global_step": 321923, "epoch": 1916} {"train_loss": -11.472589492797852, "global_step": 321924, "epoch": 1916} {"train_loss": -11.95764446258545, "global_step": 321925, "epoch": 1916} {"train_loss": -11.45914077758789, "global_step": 321926, "epoch": 1916} {"train_loss": -12.020145416259766, "global_step": 321927, "epoch": 1916} {"train_loss": -11.976981163024902, "global_step": 321928, "epoch": 1916} {"train_loss": -12.08947467803955, "global_step": 321929, "epoch": 1916} {"train_loss": -12.06491756439209, "global_step": 321930, "epoch": 1916} {"train_loss": -11.898045539855957, "global_step": 321931, "epoch": 1916} {"train_loss": -12.081180572509766, "global_step": 321932, "epoch": 1916} {"train_loss": -12.049308776855469, "global_step": 321933, "epoch": 1916} {"train_loss": -12.031469345092773, "global_step": 321934, "epoch": 1916} {"train_loss": -12.097099304199219, "global_step": 321935, "epoch": 1916} {"train_loss": -12.021329879760742, "global_step": 321936, "epoch": 1916} {"train_loss": -11.831649780273438, "global_step": 321937, "epoch": 1916} {"train_loss": -11.791229248046875, "global_step": 321938, "epoch": 1916} {"train_loss": -11.78088092803955, "global_step": 321939, "epoch": 1916} {"train_loss": -11.932546615600586, "global_step": 321940, "epoch": 1916} {"train_loss": -11.94343376159668, "global_step": 321941, "epoch": 1916} {"train_loss": -12.055989265441895, "global_step": 321942, "epoch": 1916} {"train_loss": -11.931283950805664, "global_step": 321943, "epoch": 1916} {"train_loss": -11.985785484313965, "global_step": 321944, "epoch": 1916} {"train_loss": -11.955850601196289, "global_step": 321945, "epoch": 1916} {"train_loss": -11.684925079345703, "global_step": 321946, "epoch": 1916} {"train_loss": -11.728836059570312, "global_step": 321947, "epoch": 1916} {"train_loss": -11.996760368347168, "global_step": 321948, "epoch": 1916} {"train_loss": -11.960432052612305, "global_step": 321949, "epoch": 1916} {"train_loss": -11.683769226074219, "global_step": 321950, "epoch": 1916} {"train_loss": -11.977458000183105, "global_step": 321951, "epoch": 1916} {"train_loss": -12.190383911132812, "global_step": 321952, "epoch": 1916} {"train_loss": -12.133466720581055, "global_step": 321953, "epoch": 1916} {"train_loss": -12.13162612915039, "global_step": 321954, "epoch": 1916} {"train_loss": -12.30894660949707, "global_step": 321955, "epoch": 1916} {"train_loss": -12.27999496459961, "global_step": 321956, "epoch": 1916} {"train_loss": -12.414942741394043, "global_step": 321957, "epoch": 1916} {"train_loss": -12.12389087677002, "global_step": 321958, "epoch": 1916} {"train_loss": -12.137693405151367, "global_step": 321959, "epoch": 1916} {"train_loss": -12.330863952636719, "global_step": 321960, "epoch": 1916} {"train_loss": -12.168834686279297, "global_step": 321961, "epoch": 1916} {"train_loss": -12.49493408203125, "global_step": 321962, "epoch": 1916} {"train_loss": -12.13741397857666, "global_step": 321963, "epoch": 1916} {"train_loss": -12.38359260559082, "global_step": 321964, "epoch": 1916} {"train_loss": -12.28713321685791, "global_step": 321965, "epoch": 1916} {"train_loss": -12.295722961425781, "global_step": 321966, "epoch": 1916} {"train_loss": -12.458740234375, "global_step": 321967, "epoch": 1916} {"train_loss": -12.173299789428711, "global_step": 321968, "epoch": 1916} {"train_loss": -12.511531829833984, "global_step": 321969, "epoch": 1916} {"train_loss": -12.233682632446289, "global_step": 321970, "epoch": 1916} {"train_loss": -12.647418022155762, "global_step": 321971, "epoch": 1916} {"train_loss": -12.097023963928223, "global_step": 321972, "epoch": 1916} {"train_loss": -12.099152565002441, "global_step": 321973, "epoch": 1916} {"train_loss": -12.463844299316406, "global_step": 321974, "epoch": 1916} {"train_loss": -12.426230430603027, "global_step": 321975, "epoch": 1916} {"train_loss": -12.232918739318848, "global_step": 321976, "epoch": 1916} {"train_loss": -12.217138290405273, "global_step": 321977, "epoch": 1916} {"train_loss": -12.263336181640625, "global_step": 321978, "epoch": 1916} {"train_loss": -12.528055191040039, "global_step": 321979, "epoch": 1916} {"train_loss": -12.434621810913086, "global_step": 321980, "epoch": 1916} {"train_loss": -12.026418685913086, "global_step": 321981, "epoch": 1916} {"train_loss": -12.444637298583984, "global_step": 321982, "epoch": 1916} {"train_loss": -12.361814498901367, "global_step": 321983, "epoch": 1916} {"train_loss": -12.226825714111328, "global_step": 321984, "epoch": 1916} {"train_loss": -11.70670223236084, "global_step": 321985, "epoch": 1916} {"train_loss": -12.255302429199219, "global_step": 321986, "epoch": 1916} {"train_loss": -12.317118644714355, "global_step": 321987, "epoch": 1916} {"train_loss": -12.43867015838623, "global_step": 321988, "epoch": 1916} {"train_loss": -12.27902889251709, "global_step": 321989, "epoch": 1916} {"train_loss": -12.24677848815918, "global_step": 321990, "epoch": 1916} {"train_loss": -12.178165435791016, "global_step": 321991, "epoch": 1916} {"train_loss": -11.773396492004395, "global_step": 321992, "epoch": 1916} {"train_loss": -12.526033401489258, "global_step": 321993, "epoch": 1916} {"train_loss": -11.943603515625, "global_step": 321994, "epoch": 1916} {"train_loss": -12.158934593200684, "global_step": 321995, "epoch": 1916} {"train_loss": -12.360804557800293, "global_step": 321996, "epoch": 1916} {"train_loss": -12.285674095153809, "global_step": 321997, "epoch": 1916} {"train_loss": -11.822877883911133, "global_step": 321998, "epoch": 1916} {"train_loss": -12.356868743896484, "global_step": 321999, "epoch": 1916} {"train_loss": -12.129648208618164, "global_step": 322000, "epoch": 1916} {"train_loss": -12.320096015930176, "global_step": 322001, "epoch": 1916} {"train_loss": -12.221809387207031, "global_step": 322002, "epoch": 1916} {"train_loss": -12.083477973937988, "global_step": 322003, "epoch": 1916} {"train_loss": -12.27889633178711, "global_step": 322004, "epoch": 1916} {"train_loss": -12.342585563659668, "global_step": 322005, "epoch": 1916} {"train_loss": -12.33183479309082, "global_step": 322006, "epoch": 1916} {"train_loss": -12.485302925109863, "global_step": 322007, "epoch": 1916} {"train_loss": -12.452873229980469, "global_step": 322008, "epoch": 1916} {"train_loss": -12.337440490722656, "global_step": 322009, "epoch": 1916} {"train_loss": -12.551580429077148, "global_step": 322010, "epoch": 1916} {"train_loss": -12.423675537109375, "global_step": 322011, "epoch": 1916} {"train_loss": -12.198598861694336, "global_step": 322012, "epoch": 1916} {"train_loss": -12.064626693725586, "global_step": 322013, "epoch": 1916} {"train_loss": -11.818172454833984, "global_step": 322014, "epoch": 1916} {"train_loss": -12.248226165771484, "global_step": 322015, "epoch": 1916} {"train_loss": -12.492220878601074, "global_step": 322016, "epoch": 1916} {"train_loss": -12.2718505859375, "global_step": 322017, "epoch": 1916} {"train_loss": -12.107986450195312, "global_step": 322018, "epoch": 1916} {"train_loss": -12.050050735473633, "global_step": 322019, "epoch": 1916} {"train_loss": -12.25358772277832, "global_step": 322020, "epoch": 1916} {"train_loss": -11.895490646362305, "global_step": 322021, "epoch": 1916} {"train_loss": -12.067756652832031, "global_step": 322022, "epoch": 1916} {"train_loss": -11.456758499145508, "global_step": 322023, "epoch": 1916} {"train_loss": -12.323885917663574, "global_step": 322024, "epoch": 1916} {"train_loss": -11.302155494689941, "global_step": 322025, "epoch": 1916} {"train_loss": -12.446107864379883, "global_step": 322026, "epoch": 1916} {"train_loss": -10.838866233825684, "global_step": 322027, "epoch": 1916} {"train_loss": -11.72829818725586, "global_step": 322028, "epoch": 1916} {"train_loss": -11.938743591308594, "global_step": 322029, "epoch": 1916} {"train_loss": -11.939399719238281, "global_step": 322030, "epoch": 1916} {"train_loss": -12.04023265838623, "global_step": 322031, "epoch": 1916} {"train_loss": -12.224684715270996, "global_step": 322032, "epoch": 1916} {"train_loss": -12.183113098144531, "global_step": 322033, "epoch": 1916} {"train_loss": -11.971138954162598, "global_step": 322034, "epoch": 1916} {"train_loss": -11.671637535095215, "global_step": 322035, "epoch": 1916} {"train_loss": -12.367176055908203, "global_step": 322036, "epoch": 1916} {"train_loss": -12.43745231628418, "global_step": 322037, "epoch": 1916} {"train_loss": -12.152385711669922, "global_step": 322038, "epoch": 1916} {"train_loss": -11.717361450195312, "global_step": 322039, "epoch": 1916} {"train_loss": -11.311635971069336, "global_step": 322040, "epoch": 1916} {"train_loss": -12.190114974975586, "global_step": 322041, "epoch": 1916} {"train_loss": -11.718955993652344, "global_step": 322042, "epoch": 1916} {"train_loss": -10.662812232971191, "global_step": 322043, "epoch": 1916} {"train_loss": -11.84130859375, "global_step": 322044, "epoch": 1916} {"train_loss": -11.165115356445312, "global_step": 322045, "epoch": 1916} {"train_loss": -10.476630210876465, "global_step": 322046, "epoch": 1916} {"train_loss": -11.94647216796875, "global_step": 322047, "epoch": 1916} {"train_loss": -11.473075866699219, "global_step": 322048, "epoch": 1916} {"train_loss": -10.883502960205078, "global_step": 322049, "epoch": 1916} {"train_loss": -11.508001327514648, "global_step": 322050, "epoch": 1916} {"train_loss": -11.818188667297363, "global_step": 322051, "epoch": 1916} {"train_loss": -11.313774108886719, "global_step": 322052, "epoch": 1916} {"train_loss": -11.674283027648926, "global_step": 322053, "epoch": 1916} {"train_loss": -11.258279800415039, "global_step": 322054, "epoch": 1916} {"train_loss": -11.745777555874415, "global_step": 322055, "epoch": 1916, "val_loss": 287632.90625} {"train_loss": -11.494800567626953, "global_step": 322056, "epoch": 1917} {"train_loss": -11.041913032531738, "global_step": 322057, "epoch": 1917} {"train_loss": -11.571907043457031, "global_step": 322058, "epoch": 1917} {"train_loss": -11.684165954589844, "global_step": 322059, "epoch": 1917} {"train_loss": -11.535263061523438, "global_step": 322060, "epoch": 1917} {"train_loss": -12.110635757446289, "global_step": 322061, "epoch": 1917} {"train_loss": -11.316082954406738, "global_step": 322062, "epoch": 1917} {"train_loss": -11.67563247680664, "global_step": 322063, "epoch": 1917} {"train_loss": -10.852386474609375, "global_step": 322064, "epoch": 1917} {"train_loss": -11.299554824829102, "global_step": 322065, "epoch": 1917} {"train_loss": -11.814284324645996, "global_step": 322066, "epoch": 1917} {"train_loss": -11.489177703857422, "global_step": 322067, "epoch": 1917} {"train_loss": -11.94765567779541, "global_step": 322068, "epoch": 1917} {"train_loss": -11.458549499511719, "global_step": 322069, "epoch": 1917} {"train_loss": -12.056646347045898, "global_step": 322070, "epoch": 1917} {"train_loss": -11.547628402709961, "global_step": 322071, "epoch": 1917} {"train_loss": -11.971040725708008, "global_step": 322072, "epoch": 1917} {"train_loss": -12.194411277770996, "global_step": 322073, "epoch": 1917} {"train_loss": -11.891525268554688, "global_step": 322074, "epoch": 1917} {"train_loss": -12.127906799316406, "global_step": 322075, "epoch": 1917} {"train_loss": -12.061744689941406, "global_step": 322076, "epoch": 1917} {"train_loss": -11.888157844543457, "global_step": 322077, "epoch": 1917} {"train_loss": -12.141788482666016, "global_step": 322078, "epoch": 1917} {"train_loss": -11.992863655090332, "global_step": 322079, "epoch": 1917} {"train_loss": -12.033374786376953, "global_step": 322080, "epoch": 1917} {"train_loss": -12.048175811767578, "global_step": 322081, "epoch": 1917} {"train_loss": -11.086654663085938, "global_step": 322082, "epoch": 1917} {"train_loss": -11.430261611938477, "global_step": 322083, "epoch": 1917} {"train_loss": -11.789270401000977, "global_step": 322084, "epoch": 1917} {"train_loss": -11.502226829528809, "global_step": 322085, "epoch": 1917} {"train_loss": -11.926811218261719, "global_step": 322086, "epoch": 1917} {"train_loss": -11.75924301147461, "global_step": 322087, "epoch": 1917} {"train_loss": -11.941362380981445, "global_step": 322088, "epoch": 1917} {"train_loss": -12.114423751831055, "global_step": 322089, "epoch": 1917} {"train_loss": -11.988454818725586, "global_step": 322090, "epoch": 1917} {"train_loss": -11.875107765197754, "global_step": 322091, "epoch": 1917} {"train_loss": -12.227784156799316, "global_step": 322092, "epoch": 1917} {"train_loss": -11.86319351196289, "global_step": 322093, "epoch": 1917} {"train_loss": -12.12139892578125, "global_step": 322094, "epoch": 1917} {"train_loss": -12.015634536743164, "global_step": 322095, "epoch": 1917} {"train_loss": -12.160806655883789, "global_step": 322096, "epoch": 1917} {"train_loss": -11.930959701538086, "global_step": 322097, "epoch": 1917} {"train_loss": -12.086803436279297, "global_step": 322098, "epoch": 1917} {"train_loss": -12.246367454528809, "global_step": 322099, "epoch": 1917} {"train_loss": -12.338228225708008, "global_step": 322100, "epoch": 1917} {"train_loss": -12.010581970214844, "global_step": 322101, "epoch": 1917} {"train_loss": -12.468320846557617, "global_step": 322102, "epoch": 1917} {"train_loss": -12.079421997070312, "global_step": 322103, "epoch": 1917} {"train_loss": -12.246379852294922, "global_step": 322104, "epoch": 1917} {"train_loss": -11.961812973022461, "global_step": 322105, "epoch": 1917} {"train_loss": -12.160750389099121, "global_step": 322106, "epoch": 1917} {"train_loss": -12.08344554901123, "global_step": 322107, "epoch": 1917} {"train_loss": -12.033075332641602, "global_step": 322108, "epoch": 1917} {"train_loss": -12.196889877319336, "global_step": 322109, "epoch": 1917} {"train_loss": -12.165587425231934, "global_step": 322110, "epoch": 1917} {"train_loss": -12.086034774780273, "global_step": 322111, "epoch": 1917} {"train_loss": -12.017721176147461, "global_step": 322112, "epoch": 1917} {"train_loss": -12.389270782470703, "global_step": 322113, "epoch": 1917} {"train_loss": -12.299899101257324, "global_step": 322114, "epoch": 1917} {"train_loss": -12.27273941040039, "global_step": 322115, "epoch": 1917} {"train_loss": -12.126325607299805, "global_step": 322116, "epoch": 1917} {"train_loss": -12.26792049407959, "global_step": 322117, "epoch": 1917} {"train_loss": -12.262842178344727, "global_step": 322118, "epoch": 1917} {"train_loss": -12.144815444946289, "global_step": 322119, "epoch": 1917} {"train_loss": -11.916696548461914, "global_step": 322120, "epoch": 1917} {"train_loss": -11.905862808227539, "global_step": 322121, "epoch": 1917} {"train_loss": -11.7198486328125, "global_step": 322122, "epoch": 1917} {"train_loss": -12.181205749511719, "global_step": 322123, "epoch": 1917} {"train_loss": -11.92861270904541, "global_step": 322124, "epoch": 1917} {"train_loss": -12.089333534240723, "global_step": 322125, "epoch": 1917} {"train_loss": -12.34912395477295, "global_step": 322126, "epoch": 1917} {"train_loss": -12.118715286254883, "global_step": 322127, "epoch": 1917} {"train_loss": -11.85509967803955, "global_step": 322128, "epoch": 1917} {"train_loss": -12.181842803955078, "global_step": 322129, "epoch": 1917} {"train_loss": -12.010660171508789, "global_step": 322130, "epoch": 1917} {"train_loss": -11.760404586791992, "global_step": 322131, "epoch": 1917} {"train_loss": -12.284647941589355, "global_step": 322132, "epoch": 1917} {"train_loss": -12.233141899108887, "global_step": 322133, "epoch": 1917} {"train_loss": -12.234109878540039, "global_step": 322134, "epoch": 1917} {"train_loss": -11.941466331481934, "global_step": 322135, "epoch": 1917} {"train_loss": -12.448589324951172, "global_step": 322136, "epoch": 1917} {"train_loss": -11.804625511169434, "global_step": 322137, "epoch": 1917} {"train_loss": -11.608118057250977, "global_step": 322138, "epoch": 1917} {"train_loss": -12.179017066955566, "global_step": 322139, "epoch": 1917} {"train_loss": -12.050289154052734, "global_step": 322140, "epoch": 1917} {"train_loss": -12.208585739135742, "global_step": 322141, "epoch": 1917} {"train_loss": -12.044920921325684, "global_step": 322142, "epoch": 1917} {"train_loss": -11.831334114074707, "global_step": 322143, "epoch": 1917} {"train_loss": -12.212240219116211, "global_step": 322144, "epoch": 1917} {"train_loss": -12.249008178710938, "global_step": 322145, "epoch": 1917} {"train_loss": -12.35384750366211, "global_step": 322146, "epoch": 1917} {"train_loss": -12.420711517333984, "global_step": 322147, "epoch": 1917} {"train_loss": -12.462632179260254, "global_step": 322148, "epoch": 1917} {"train_loss": -12.09727668762207, "global_step": 322149, "epoch": 1917} {"train_loss": -12.235963821411133, "global_step": 322150, "epoch": 1917} {"train_loss": -12.545644760131836, "global_step": 322151, "epoch": 1917} {"train_loss": -12.189528465270996, "global_step": 322152, "epoch": 1917} {"train_loss": -12.259424209594727, "global_step": 322153, "epoch": 1917} {"train_loss": -12.300935745239258, "global_step": 322154, "epoch": 1917} {"train_loss": -12.07263469696045, "global_step": 322155, "epoch": 1917} {"train_loss": -11.821223258972168, "global_step": 322156, "epoch": 1917} {"train_loss": -12.343826293945312, "global_step": 322157, "epoch": 1917} {"train_loss": -11.662310600280762, "global_step": 322158, "epoch": 1917} {"train_loss": -11.528606414794922, "global_step": 322159, "epoch": 1917} {"train_loss": -12.211494445800781, "global_step": 322160, "epoch": 1917} {"train_loss": -12.464611053466797, "global_step": 322161, "epoch": 1917} {"train_loss": -12.533700942993164, "global_step": 322162, "epoch": 1917} {"train_loss": -12.348100662231445, "global_step": 322163, "epoch": 1917} {"train_loss": -12.307760238647461, "global_step": 322164, "epoch": 1917} {"train_loss": -12.017608642578125, "global_step": 322165, "epoch": 1917} {"train_loss": -12.496394157409668, "global_step": 322166, "epoch": 1917} {"train_loss": -11.518054008483887, "global_step": 322167, "epoch": 1917} {"train_loss": -11.937806129455566, "global_step": 322168, "epoch": 1917} {"train_loss": -11.410015106201172, "global_step": 322169, "epoch": 1917} {"train_loss": -12.088440895080566, "global_step": 322170, "epoch": 1917} {"train_loss": -11.656755447387695, "global_step": 322171, "epoch": 1917} {"train_loss": -12.080284118652344, "global_step": 322172, "epoch": 1917} {"train_loss": -12.06179428100586, "global_step": 322173, "epoch": 1917} {"train_loss": -11.979660034179688, "global_step": 322174, "epoch": 1917} {"train_loss": -12.053709983825684, "global_step": 322175, "epoch": 1917} {"train_loss": -12.084660530090332, "global_step": 322176, "epoch": 1917} {"train_loss": -12.06346607208252, "global_step": 322177, "epoch": 1917} {"train_loss": -12.297555923461914, "global_step": 322178, "epoch": 1917} {"train_loss": -11.856788635253906, "global_step": 322179, "epoch": 1917} {"train_loss": -11.854690551757812, "global_step": 322180, "epoch": 1917} {"train_loss": -11.371814727783203, "global_step": 322181, "epoch": 1917} {"train_loss": -11.754867553710938, "global_step": 322182, "epoch": 1917} {"train_loss": -11.484025955200195, "global_step": 322183, "epoch": 1917} {"train_loss": -10.400413513183594, "global_step": 322184, "epoch": 1917} {"train_loss": -12.009103775024414, "global_step": 322185, "epoch": 1917} {"train_loss": -11.18834114074707, "global_step": 322186, "epoch": 1917} {"train_loss": -11.376086235046387, "global_step": 322187, "epoch": 1917} {"train_loss": -11.764659881591797, "global_step": 322188, "epoch": 1917} {"train_loss": -10.987737655639648, "global_step": 322189, "epoch": 1917} {"train_loss": -11.119274139404297, "global_step": 322190, "epoch": 1917} {"train_loss": -11.750028610229492, "global_step": 322191, "epoch": 1917} {"train_loss": -11.199178695678711, "global_step": 322192, "epoch": 1917} {"train_loss": -11.197253227233887, "global_step": 322193, "epoch": 1917} {"train_loss": -11.560876846313477, "global_step": 322194, "epoch": 1917} {"train_loss": -10.41576099395752, "global_step": 322195, "epoch": 1917} {"train_loss": -10.751314163208008, "global_step": 322196, "epoch": 1917} {"train_loss": -11.17801570892334, "global_step": 322197, "epoch": 1917} {"train_loss": -10.916328430175781, "global_step": 322198, "epoch": 1917} {"train_loss": -11.740850448608398, "global_step": 322199, "epoch": 1917} {"train_loss": -10.89012336730957, "global_step": 322200, "epoch": 1917} {"train_loss": -11.716304779052734, "global_step": 322201, "epoch": 1917} {"train_loss": -9.82529354095459, "global_step": 322202, "epoch": 1917} {"train_loss": -11.063663482666016, "global_step": 322203, "epoch": 1917} {"train_loss": -11.057258605957031, "global_step": 322204, "epoch": 1917} {"train_loss": -11.031965255737305, "global_step": 322205, "epoch": 1917} {"train_loss": -10.561819076538086, "global_step": 322206, "epoch": 1917} {"train_loss": -10.67092514038086, "global_step": 322207, "epoch": 1917} {"train_loss": -10.541528701782227, "global_step": 322208, "epoch": 1917} {"train_loss": -10.255721092224121, "global_step": 322209, "epoch": 1917} {"train_loss": -10.124921798706055, "global_step": 322210, "epoch": 1917} {"train_loss": -11.812931060791016, "global_step": 322211, "epoch": 1917} {"train_loss": -10.015924453735352, "global_step": 322212, "epoch": 1917} {"train_loss": -11.527827262878418, "global_step": 322213, "epoch": 1917} {"train_loss": -10.452836990356445, "global_step": 322214, "epoch": 1917} {"train_loss": -10.257257461547852, "global_step": 322215, "epoch": 1917} {"train_loss": -10.503351211547852, "global_step": 322216, "epoch": 1917} {"train_loss": -10.732078552246094, "global_step": 322217, "epoch": 1917} {"train_loss": -9.716264724731445, "global_step": 322218, "epoch": 1917} {"train_loss": -11.771113395690918, "global_step": 322219, "epoch": 1917} {"train_loss": -10.822195053100586, "global_step": 322220, "epoch": 1917} {"train_loss": -11.617547988891602, "global_step": 322221, "epoch": 1917} {"train_loss": -10.88898754119873, "global_step": 322222, "epoch": 1917} {"train_loss": -11.746107277416048, "global_step": 322223, "epoch": 1917, "val_loss": 288419.1875} {"train_loss": -10.369546890258789, "global_step": 322224, "epoch": 1918} {"train_loss": -11.26746940612793, "global_step": 322225, "epoch": 1918} {"train_loss": -10.702919006347656, "global_step": 322226, "epoch": 1918} {"train_loss": -10.837884902954102, "global_step": 322227, "epoch": 1918} {"train_loss": -11.080018997192383, "global_step": 322228, "epoch": 1918} {"train_loss": -10.082529067993164, "global_step": 322229, "epoch": 1918} {"train_loss": -11.250905990600586, "global_step": 322230, "epoch": 1918} {"train_loss": -9.556660652160645, "global_step": 322231, "epoch": 1918} {"train_loss": -10.978696823120117, "global_step": 322232, "epoch": 1918} {"train_loss": -10.8377685546875, "global_step": 322233, "epoch": 1918} {"train_loss": -11.00804615020752, "global_step": 322234, "epoch": 1918} {"train_loss": -10.053747177124023, "global_step": 322235, "epoch": 1918} {"train_loss": -10.441447257995605, "global_step": 322236, "epoch": 1918} {"train_loss": -11.961544036865234, "global_step": 322237, "epoch": 1918} {"train_loss": -10.450311660766602, "global_step": 322238, "epoch": 1918} {"train_loss": -11.559958457946777, "global_step": 322239, "epoch": 1918} {"train_loss": -11.26082992553711, "global_step": 322240, "epoch": 1918} {"train_loss": -11.126808166503906, "global_step": 322241, "epoch": 1918} {"train_loss": -11.903003692626953, "global_step": 322242, "epoch": 1918} {"train_loss": -11.430368423461914, "global_step": 322243, "epoch": 1918} {"train_loss": -11.642610549926758, "global_step": 322244, "epoch": 1918} {"train_loss": -11.795478820800781, "global_step": 322245, "epoch": 1918} {"train_loss": -11.942529678344727, "global_step": 322246, "epoch": 1918} {"train_loss": -11.78075885772705, "global_step": 322247, "epoch": 1918} {"train_loss": -11.851452827453613, "global_step": 322248, "epoch": 1918} {"train_loss": -11.755765914916992, "global_step": 322249, "epoch": 1918} {"train_loss": -11.608907699584961, "global_step": 322250, "epoch": 1918} {"train_loss": -11.997560501098633, "global_step": 322251, "epoch": 1918} {"train_loss": -11.838309288024902, "global_step": 322252, "epoch": 1918} {"train_loss": -11.914094924926758, "global_step": 322253, "epoch": 1918} {"train_loss": -12.200112342834473, "global_step": 322254, "epoch": 1918} {"train_loss": -12.02486801147461, "global_step": 322255, "epoch": 1918} {"train_loss": -11.810399055480957, "global_step": 322256, "epoch": 1918} {"train_loss": -11.956764221191406, "global_step": 322257, "epoch": 1918} {"train_loss": -12.005594253540039, "global_step": 322258, "epoch": 1918} {"train_loss": -12.170174598693848, "global_step": 322259, "epoch": 1918} {"train_loss": -11.96285629272461, "global_step": 322260, "epoch": 1918} {"train_loss": -12.11297607421875, "global_step": 322261, "epoch": 1918} {"train_loss": -11.843764305114746, "global_step": 322262, "epoch": 1918} {"train_loss": -12.143835067749023, "global_step": 322263, "epoch": 1918} {"train_loss": -12.184968948364258, "global_step": 322264, "epoch": 1918} {"train_loss": -11.997842788696289, "global_step": 322265, "epoch": 1918} {"train_loss": -12.185993194580078, "global_step": 322266, "epoch": 1918} {"train_loss": -12.110544204711914, "global_step": 322267, "epoch": 1918} {"train_loss": -12.116388320922852, "global_step": 322268, "epoch": 1918} {"train_loss": -12.016599655151367, "global_step": 322269, "epoch": 1918} {"train_loss": -12.255430221557617, "global_step": 322270, "epoch": 1918} {"train_loss": -11.96986198425293, "global_step": 322271, "epoch": 1918} {"train_loss": -12.28984260559082, "global_step": 322272, "epoch": 1918} {"train_loss": -12.39570426940918, "global_step": 322273, "epoch": 1918} {"train_loss": -12.129741668701172, "global_step": 322274, "epoch": 1918} {"train_loss": -12.396557807922363, "global_step": 322275, "epoch": 1918} {"train_loss": -12.189451217651367, "global_step": 322276, "epoch": 1918} {"train_loss": -12.256135940551758, "global_step": 322277, "epoch": 1918} {"train_loss": -12.498376846313477, "global_step": 322278, "epoch": 1918} {"train_loss": -12.284597396850586, "global_step": 322279, "epoch": 1918} {"train_loss": -12.194058418273926, "global_step": 322280, "epoch": 1918} {"train_loss": -12.303292274475098, "global_step": 322281, "epoch": 1918} {"train_loss": -12.158658981323242, "global_step": 322282, "epoch": 1918} {"train_loss": -12.319714546203613, "global_step": 322283, "epoch": 1918} {"train_loss": -12.302398681640625, "global_step": 322284, "epoch": 1918} {"train_loss": -12.292332649230957, "global_step": 322285, "epoch": 1918} {"train_loss": -12.156792640686035, "global_step": 322286, "epoch": 1918} {"train_loss": -12.437189102172852, "global_step": 322287, "epoch": 1918} {"train_loss": -12.172126770019531, "global_step": 322288, "epoch": 1918} {"train_loss": -12.060534477233887, "global_step": 322289, "epoch": 1918} {"train_loss": -12.290975570678711, "global_step": 322290, "epoch": 1918} {"train_loss": -12.04897689819336, "global_step": 322291, "epoch": 1918} {"train_loss": -12.257701873779297, "global_step": 322292, "epoch": 1918} {"train_loss": -12.384753227233887, "global_step": 322293, "epoch": 1918} {"train_loss": -12.342031478881836, "global_step": 322294, "epoch": 1918} {"train_loss": -12.356447219848633, "global_step": 322295, "epoch": 1918} {"train_loss": -12.351409912109375, "global_step": 322296, "epoch": 1918} {"train_loss": -12.288092613220215, "global_step": 322297, "epoch": 1918} {"train_loss": -12.100854873657227, "global_step": 322298, "epoch": 1918} {"train_loss": -12.343973159790039, "global_step": 322299, "epoch": 1918} {"train_loss": -12.345382690429688, "global_step": 322300, "epoch": 1918} {"train_loss": -12.4147367477417, "global_step": 322301, "epoch": 1918} {"train_loss": -12.271796226501465, "global_step": 322302, "epoch": 1918} {"train_loss": -12.406134605407715, "global_step": 322303, "epoch": 1918} {"train_loss": -12.33259391784668, "global_step": 322304, "epoch": 1918} {"train_loss": -12.062887191772461, "global_step": 322305, "epoch": 1918} {"train_loss": -12.169538497924805, "global_step": 322306, "epoch": 1918} {"train_loss": -12.193821907043457, "global_step": 322307, "epoch": 1918} {"train_loss": -12.192151069641113, "global_step": 322308, "epoch": 1918} {"train_loss": -12.440106391906738, "global_step": 322309, "epoch": 1918} {"train_loss": -12.019509315490723, "global_step": 322310, "epoch": 1918} {"train_loss": -12.289674758911133, "global_step": 322311, "epoch": 1918} {"train_loss": -12.507575988769531, "global_step": 322312, "epoch": 1918} {"train_loss": -12.350284576416016, "global_step": 322313, "epoch": 1918} {"train_loss": -12.346549987792969, "global_step": 322314, "epoch": 1918} {"train_loss": -12.335101127624512, "global_step": 322315, "epoch": 1918} {"train_loss": -12.280040740966797, "global_step": 322316, "epoch": 1918} {"train_loss": -12.433099746704102, "global_step": 322317, "epoch": 1918} {"train_loss": -12.37049674987793, "global_step": 322318, "epoch": 1918} {"train_loss": -12.311450004577637, "global_step": 322319, "epoch": 1918} {"train_loss": -12.055915832519531, "global_step": 322320, "epoch": 1918} {"train_loss": -12.409590721130371, "global_step": 322321, "epoch": 1918} {"train_loss": -12.227612495422363, "global_step": 322322, "epoch": 1918} {"train_loss": -12.233906745910645, "global_step": 322323, "epoch": 1918} {"train_loss": -12.307720184326172, "global_step": 322324, "epoch": 1918} {"train_loss": -12.090248107910156, "global_step": 322325, "epoch": 1918} {"train_loss": -12.36976146697998, "global_step": 322326, "epoch": 1918} {"train_loss": -12.224678039550781, "global_step": 322327, "epoch": 1918} {"train_loss": -12.41823673248291, "global_step": 322328, "epoch": 1918} {"train_loss": -12.202579498291016, "global_step": 322329, "epoch": 1918} {"train_loss": -12.389145851135254, "global_step": 322330, "epoch": 1918} {"train_loss": -12.172776222229004, "global_step": 322331, "epoch": 1918} {"train_loss": -11.987349510192871, "global_step": 322332, "epoch": 1918} {"train_loss": -12.122139930725098, "global_step": 322333, "epoch": 1918} {"train_loss": -12.507858276367188, "global_step": 322334, "epoch": 1918} {"train_loss": -12.248380661010742, "global_step": 322335, "epoch": 1918} {"train_loss": -11.428495407104492, "global_step": 322336, "epoch": 1918} {"train_loss": -11.885847091674805, "global_step": 322337, "epoch": 1918} {"train_loss": -11.747734069824219, "global_step": 322338, "epoch": 1918} {"train_loss": -12.323826789855957, "global_step": 322339, "epoch": 1918} {"train_loss": -11.17364501953125, "global_step": 322340, "epoch": 1918} {"train_loss": -10.873083114624023, "global_step": 322341, "epoch": 1918} {"train_loss": -11.438457489013672, "global_step": 322342, "epoch": 1918} {"train_loss": -11.550307273864746, "global_step": 322343, "epoch": 1918} {"train_loss": -8.947065353393555, "global_step": 322344, "epoch": 1918} {"train_loss": -11.510957717895508, "global_step": 322345, "epoch": 1918} {"train_loss": -9.287899017333984, "global_step": 322346, "epoch": 1918} {"train_loss": -8.200723648071289, "global_step": 322347, "epoch": 1918} {"train_loss": -8.0484037399292, "global_step": 322348, "epoch": 1918} {"train_loss": -8.704812049865723, "global_step": 322349, "epoch": 1918} {"train_loss": -10.698073387145996, "global_step": 322350, "epoch": 1918} {"train_loss": -9.634668350219727, "global_step": 322351, "epoch": 1918} {"train_loss": -8.110918045043945, "global_step": 322352, "epoch": 1918} {"train_loss": -9.923565864562988, "global_step": 322353, "epoch": 1918} {"train_loss": -7.316537857055664, "global_step": 322354, "epoch": 1918} {"train_loss": -8.966300964355469, "global_step": 322355, "epoch": 1918} {"train_loss": -10.300149917602539, "global_step": 322356, "epoch": 1918} {"train_loss": -9.455384254455566, "global_step": 322357, "epoch": 1918} {"train_loss": -10.291160583496094, "global_step": 322358, "epoch": 1918} {"train_loss": -8.408265113830566, "global_step": 322359, "epoch": 1918} {"train_loss": -10.155899047851562, "global_step": 322360, "epoch": 1918} {"train_loss": -9.869279861450195, "global_step": 322361, "epoch": 1918} {"train_loss": -10.189809799194336, "global_step": 322362, "epoch": 1918} {"train_loss": -10.336755752563477, "global_step": 322363, "epoch": 1918} {"train_loss": -11.714635848999023, "global_step": 322364, "epoch": 1918} {"train_loss": -10.117525100708008, "global_step": 322365, "epoch": 1918} {"train_loss": -11.425256729125977, "global_step": 322366, "epoch": 1918} {"train_loss": -10.455860137939453, "global_step": 322367, "epoch": 1918} {"train_loss": -10.771575927734375, "global_step": 322368, "epoch": 1918} {"train_loss": -11.54731559753418, "global_step": 322369, "epoch": 1918} {"train_loss": -10.728370666503906, "global_step": 322370, "epoch": 1918} {"train_loss": -11.156794548034668, "global_step": 322371, "epoch": 1918} {"train_loss": -11.20933723449707, "global_step": 322372, "epoch": 1918} {"train_loss": -11.687967300415039, "global_step": 322373, "epoch": 1918} {"train_loss": -11.23629093170166, "global_step": 322374, "epoch": 1918} {"train_loss": -11.776372909545898, "global_step": 322375, "epoch": 1918} {"train_loss": -11.452802658081055, "global_step": 322376, "epoch": 1918} {"train_loss": -11.803668975830078, "global_step": 322377, "epoch": 1918} {"train_loss": -11.627573013305664, "global_step": 322378, "epoch": 1918} {"train_loss": -11.554605484008789, "global_step": 322379, "epoch": 1918} {"train_loss": -11.330583572387695, "global_step": 322380, "epoch": 1918} {"train_loss": -11.777483940124512, "global_step": 322381, "epoch": 1918} {"train_loss": -11.529546737670898, "global_step": 322382, "epoch": 1918} {"train_loss": -11.22683334350586, "global_step": 322383, "epoch": 1918} {"train_loss": -11.910367965698242, "global_step": 322384, "epoch": 1918} {"train_loss": -11.789922714233398, "global_step": 322385, "epoch": 1918} {"train_loss": -11.781554222106934, "global_step": 322386, "epoch": 1918} {"train_loss": -11.81536865234375, "global_step": 322387, "epoch": 1918} {"train_loss": -11.713594436645508, "global_step": 322388, "epoch": 1918} {"train_loss": -11.848798751831055, "global_step": 322389, "epoch": 1918} {"train_loss": -11.40308952331543, "global_step": 322390, "epoch": 1918} {"train_loss": -11.547976851463318, "global_step": 322391, "epoch": 1918, "val_loss": 273949.125} {"train_loss": -11.425756454467773, "global_step": 322392, "epoch": 1919} {"train_loss": -11.935242652893066, "global_step": 322393, "epoch": 1919} {"train_loss": -11.911571502685547, "global_step": 322394, "epoch": 1919} {"train_loss": -11.891788482666016, "global_step": 322395, "epoch": 1919} {"train_loss": -11.985976219177246, "global_step": 322396, "epoch": 1919} {"train_loss": -11.835661888122559, "global_step": 322397, "epoch": 1919} {"train_loss": -12.03377914428711, "global_step": 322398, "epoch": 1919} {"train_loss": -12.015466690063477, "global_step": 322399, "epoch": 1919} {"train_loss": -12.046116828918457, "global_step": 322400, "epoch": 1919} {"train_loss": -12.060260772705078, "global_step": 322401, "epoch": 1919} {"train_loss": -12.056642532348633, "global_step": 322402, "epoch": 1919} {"train_loss": -12.009941101074219, "global_step": 322403, "epoch": 1919} {"train_loss": -12.185211181640625, "global_step": 322404, "epoch": 1919} {"train_loss": -11.683515548706055, "global_step": 322405, "epoch": 1919} {"train_loss": -11.877534866333008, "global_step": 322406, "epoch": 1919} {"train_loss": -12.03089714050293, "global_step": 322407, "epoch": 1919} {"train_loss": -12.071893692016602, "global_step": 322408, "epoch": 1919} {"train_loss": -11.960986137390137, "global_step": 322409, "epoch": 1919} {"train_loss": -11.865983963012695, "global_step": 322410, "epoch": 1919} {"train_loss": -11.856256484985352, "global_step": 322411, "epoch": 1919} {"train_loss": -12.0794677734375, "global_step": 322412, "epoch": 1919} {"train_loss": -12.06931209564209, "global_step": 322413, "epoch": 1919} {"train_loss": -12.044685363769531, "global_step": 322414, "epoch": 1919} {"train_loss": -12.124190330505371, "global_step": 322415, "epoch": 1919} {"train_loss": -12.29800033569336, "global_step": 322416, "epoch": 1919} {"train_loss": -12.133832931518555, "global_step": 322417, "epoch": 1919} {"train_loss": -12.197197914123535, "global_step": 322418, "epoch": 1919} {"train_loss": -12.402399063110352, "global_step": 322419, "epoch": 1919} {"train_loss": -12.14122200012207, "global_step": 322420, "epoch": 1919} {"train_loss": -12.31356430053711, "global_step": 322421, "epoch": 1919} {"train_loss": -12.48164176940918, "global_step": 322422, "epoch": 1919} {"train_loss": -12.071199417114258, "global_step": 322423, "epoch": 1919} {"train_loss": -12.344526290893555, "global_step": 322424, "epoch": 1919} {"train_loss": -12.202537536621094, "global_step": 322425, "epoch": 1919} {"train_loss": -12.313544273376465, "global_step": 322426, "epoch": 1919} {"train_loss": -12.204957008361816, "global_step": 322427, "epoch": 1919} {"train_loss": -12.346476554870605, "global_step": 322428, "epoch": 1919} {"train_loss": -12.270133018493652, "global_step": 322429, "epoch": 1919} {"train_loss": -12.293472290039062, "global_step": 322430, "epoch": 1919} {"train_loss": -12.377870559692383, "global_step": 322431, "epoch": 1919} {"train_loss": -12.410696029663086, "global_step": 322432, "epoch": 1919} {"train_loss": -12.340072631835938, "global_step": 322433, "epoch": 1919} {"train_loss": -12.195633888244629, "global_step": 322434, "epoch": 1919} {"train_loss": -12.367757797241211, "global_step": 322435, "epoch": 1919} {"train_loss": -12.48525333404541, "global_step": 322436, "epoch": 1919} {"train_loss": -12.267053604125977, "global_step": 322437, "epoch": 1919} {"train_loss": -12.456554412841797, "global_step": 322438, "epoch": 1919} {"train_loss": -12.169515609741211, "global_step": 322439, "epoch": 1919} {"train_loss": -12.168718338012695, "global_step": 322440, "epoch": 1919} {"train_loss": -12.500690460205078, "global_step": 322441, "epoch": 1919} {"train_loss": -12.360282897949219, "global_step": 322442, "epoch": 1919} {"train_loss": -12.291775703430176, "global_step": 322443, "epoch": 1919} {"train_loss": -12.281871795654297, "global_step": 322444, "epoch": 1919} {"train_loss": -12.332557678222656, "global_step": 322445, "epoch": 1919} {"train_loss": -12.42660140991211, "global_step": 322446, "epoch": 1919} {"train_loss": -12.400272369384766, "global_step": 322447, "epoch": 1919} {"train_loss": -12.416723251342773, "global_step": 322448, "epoch": 1919} {"train_loss": -12.38414478302002, "global_step": 322449, "epoch": 1919} {"train_loss": -12.323838233947754, "global_step": 322450, "epoch": 1919} {"train_loss": -12.638457298278809, "global_step": 322451, "epoch": 1919} {"train_loss": -12.567717552185059, "global_step": 322452, "epoch": 1919} {"train_loss": -12.313425064086914, "global_step": 322453, "epoch": 1919} {"train_loss": -12.013566017150879, "global_step": 322454, "epoch": 1919} {"train_loss": -12.574577331542969, "global_step": 322455, "epoch": 1919} {"train_loss": -12.389453887939453, "global_step": 322456, "epoch": 1919} {"train_loss": -12.524320602416992, "global_step": 322457, "epoch": 1919} {"train_loss": -12.41567611694336, "global_step": 322458, "epoch": 1919} {"train_loss": -12.616024017333984, "global_step": 322459, "epoch": 1919} {"train_loss": -12.404708862304688, "global_step": 322460, "epoch": 1919} {"train_loss": -12.596745491027832, "global_step": 322461, "epoch": 1919} {"train_loss": -12.705395698547363, "global_step": 322462, "epoch": 1919} {"train_loss": -12.55982494354248, "global_step": 322463, "epoch": 1919} {"train_loss": -12.6685209274292, "global_step": 322464, "epoch": 1919} {"train_loss": -12.383170127868652, "global_step": 322465, "epoch": 1919} {"train_loss": -12.68470573425293, "global_step": 322466, "epoch": 1919} {"train_loss": -12.34523868560791, "global_step": 322467, "epoch": 1919} {"train_loss": -12.515745162963867, "global_step": 322468, "epoch": 1919} {"train_loss": -12.238348960876465, "global_step": 322469, "epoch": 1919} {"train_loss": -12.495423316955566, "global_step": 322470, "epoch": 1919} {"train_loss": -12.564988136291504, "global_step": 322471, "epoch": 1919} {"train_loss": -12.719295501708984, "global_step": 322472, "epoch": 1919} {"train_loss": -12.408712387084961, "global_step": 322473, "epoch": 1919} {"train_loss": -12.459343910217285, "global_step": 322474, "epoch": 1919} {"train_loss": -12.317071914672852, "global_step": 322475, "epoch": 1919} {"train_loss": -12.359991073608398, "global_step": 322476, "epoch": 1919} {"train_loss": -12.409464836120605, "global_step": 322477, "epoch": 1919} {"train_loss": -12.153865814208984, "global_step": 322478, "epoch": 1919} {"train_loss": -12.313840866088867, "global_step": 322479, "epoch": 1919} {"train_loss": -12.194091796875, "global_step": 322480, "epoch": 1919} {"train_loss": -12.495626449584961, "global_step": 322481, "epoch": 1919} {"train_loss": -11.77508544921875, "global_step": 322482, "epoch": 1919} {"train_loss": -12.31173324584961, "global_step": 322483, "epoch": 1919} {"train_loss": -12.227160453796387, "global_step": 322484, "epoch": 1919} {"train_loss": -12.542464256286621, "global_step": 322485, "epoch": 1919} {"train_loss": -12.223581314086914, "global_step": 322486, "epoch": 1919} {"train_loss": -12.629583358764648, "global_step": 322487, "epoch": 1919} {"train_loss": -12.024879455566406, "global_step": 322488, "epoch": 1919} {"train_loss": -12.432802200317383, "global_step": 322489, "epoch": 1919} {"train_loss": -12.284640312194824, "global_step": 322490, "epoch": 1919} {"train_loss": -12.112344741821289, "global_step": 322491, "epoch": 1919} {"train_loss": -12.436759948730469, "global_step": 322492, "epoch": 1919} {"train_loss": -12.030847549438477, "global_step": 322493, "epoch": 1919} {"train_loss": -12.034445762634277, "global_step": 322494, "epoch": 1919} {"train_loss": -11.34414291381836, "global_step": 322495, "epoch": 1919} {"train_loss": -10.83637523651123, "global_step": 322496, "epoch": 1919} {"train_loss": -11.171817779541016, "global_step": 322497, "epoch": 1919} {"train_loss": -11.122675895690918, "global_step": 322498, "epoch": 1919} {"train_loss": -10.868206024169922, "global_step": 322499, "epoch": 1919} {"train_loss": -11.068130493164062, "global_step": 322500, "epoch": 1919} {"train_loss": -8.819938659667969, "global_step": 322501, "epoch": 1919} {"train_loss": -10.4020414352417, "global_step": 322502, "epoch": 1919} {"train_loss": -8.799187660217285, "global_step": 322503, "epoch": 1919} {"train_loss": -9.143745422363281, "global_step": 322504, "epoch": 1919} {"train_loss": -7.875984191894531, "global_step": 322505, "epoch": 1919} {"train_loss": -10.74825668334961, "global_step": 322506, "epoch": 1919} {"train_loss": -10.701801300048828, "global_step": 322507, "epoch": 1919} {"train_loss": -9.364269256591797, "global_step": 322508, "epoch": 1919} {"train_loss": -9.955011367797852, "global_step": 322509, "epoch": 1919} {"train_loss": -9.243522644042969, "global_step": 322510, "epoch": 1919} {"train_loss": -9.85490608215332, "global_step": 322511, "epoch": 1919} {"train_loss": -10.503619194030762, "global_step": 322512, "epoch": 1919} {"train_loss": -10.993669509887695, "global_step": 322513, "epoch": 1919} {"train_loss": -9.835653305053711, "global_step": 322514, "epoch": 1919} {"train_loss": -10.573158264160156, "global_step": 322515, "epoch": 1919} {"train_loss": -10.018146514892578, "global_step": 322516, "epoch": 1919} {"train_loss": -11.275676727294922, "global_step": 322517, "epoch": 1919} {"train_loss": -10.983330726623535, "global_step": 322518, "epoch": 1919} {"train_loss": -10.733731269836426, "global_step": 322519, "epoch": 1919} {"train_loss": -10.858587265014648, "global_step": 322520, "epoch": 1919} {"train_loss": -11.605462074279785, "global_step": 322521, "epoch": 1919} {"train_loss": -11.633867263793945, "global_step": 322522, "epoch": 1919} {"train_loss": -11.265649795532227, "global_step": 322523, "epoch": 1919} {"train_loss": -11.574254989624023, "global_step": 322524, "epoch": 1919} {"train_loss": -11.267261505126953, "global_step": 322525, "epoch": 1919} {"train_loss": -11.202533721923828, "global_step": 322526, "epoch": 1919} {"train_loss": -11.556327819824219, "global_step": 322527, "epoch": 1919} {"train_loss": -10.985584259033203, "global_step": 322528, "epoch": 1919} {"train_loss": -11.923084259033203, "global_step": 322529, "epoch": 1919} {"train_loss": -10.83137321472168, "global_step": 322530, "epoch": 1919} {"train_loss": -11.160554885864258, "global_step": 322531, "epoch": 1919} {"train_loss": -10.627045631408691, "global_step": 322532, "epoch": 1919} {"train_loss": -10.894793510437012, "global_step": 322533, "epoch": 1919} {"train_loss": -11.596334457397461, "global_step": 322534, "epoch": 1919} {"train_loss": -11.140790939331055, "global_step": 322535, "epoch": 1919} {"train_loss": -11.254343032836914, "global_step": 322536, "epoch": 1919} {"train_loss": -11.45921516418457, "global_step": 322537, "epoch": 1919} {"train_loss": -11.130581855773926, "global_step": 322538, "epoch": 1919} {"train_loss": -11.447742462158203, "global_step": 322539, "epoch": 1919} {"train_loss": -11.26324462890625, "global_step": 322540, "epoch": 1919} {"train_loss": -11.281683921813965, "global_step": 322541, "epoch": 1919} {"train_loss": -11.332003593444824, "global_step": 322542, "epoch": 1919} {"train_loss": -11.529139518737793, "global_step": 322543, "epoch": 1919} {"train_loss": -11.38955307006836, "global_step": 322544, "epoch": 1919} {"train_loss": -11.96963882446289, "global_step": 322545, "epoch": 1919} {"train_loss": -11.407459259033203, "global_step": 322546, "epoch": 1919} {"train_loss": -11.756278991699219, "global_step": 322547, "epoch": 1919} {"train_loss": -11.731666564941406, "global_step": 322548, "epoch": 1919} {"train_loss": -11.781306266784668, "global_step": 322549, "epoch": 1919} {"train_loss": -11.63268756866455, "global_step": 322550, "epoch": 1919} {"train_loss": -11.864070892333984, "global_step": 322551, "epoch": 1919} {"train_loss": -11.779434204101562, "global_step": 322552, "epoch": 1919} {"train_loss": -11.970033645629883, "global_step": 322553, "epoch": 1919} {"train_loss": -11.941905975341797, "global_step": 322554, "epoch": 1919} {"train_loss": -11.996175765991211, "global_step": 322555, "epoch": 1919} {"train_loss": -11.821701049804688, "global_step": 322556, "epoch": 1919} {"train_loss": -12.094727516174316, "global_step": 322557, "epoch": 1919} {"train_loss": -11.780438423156738, "global_step": 322558, "epoch": 1919} {"train_loss": -11.78005990527925, "global_step": 322559, "epoch": 1919, "val_loss": 285384.25} {"train_loss": -12.185622215270996, "global_step": 322560, "epoch": 1920} {"train_loss": -11.816593170166016, "global_step": 322561, "epoch": 1920} {"train_loss": -11.944053649902344, "global_step": 322562, "epoch": 1920} {"train_loss": -11.939313888549805, "global_step": 322563, "epoch": 1920} {"train_loss": -12.179227828979492, "global_step": 322564, "epoch": 1920} {"train_loss": -12.077702522277832, "global_step": 322565, "epoch": 1920} {"train_loss": -12.241695404052734, "global_step": 322566, "epoch": 1920} {"train_loss": -12.24412727355957, "global_step": 322567, "epoch": 1920} {"train_loss": -12.238966941833496, "global_step": 322568, "epoch": 1920} {"train_loss": -12.144683837890625, "global_step": 322569, "epoch": 1920} {"train_loss": -12.299089431762695, "global_step": 322570, "epoch": 1920} {"train_loss": -12.168601989746094, "global_step": 322571, "epoch": 1920} {"train_loss": -12.165225982666016, "global_step": 322572, "epoch": 1920} {"train_loss": -12.15272331237793, "global_step": 322573, "epoch": 1920} {"train_loss": -12.188007354736328, "global_step": 322574, "epoch": 1920} {"train_loss": -12.113102912902832, "global_step": 322575, "epoch": 1920} {"train_loss": -12.267916679382324, "global_step": 322576, "epoch": 1920} {"train_loss": -12.202539443969727, "global_step": 322577, "epoch": 1920} {"train_loss": -12.266298294067383, "global_step": 322578, "epoch": 1920} {"train_loss": -12.350225448608398, "global_step": 322579, "epoch": 1920} {"train_loss": -12.302265167236328, "global_step": 322580, "epoch": 1920} {"train_loss": -12.304572105407715, "global_step": 322581, "epoch": 1920} {"train_loss": -12.34195327758789, "global_step": 322582, "epoch": 1920} {"train_loss": -12.406169891357422, "global_step": 322583, "epoch": 1920} {"train_loss": -12.232553482055664, "global_step": 322584, "epoch": 1920} {"train_loss": -12.383275985717773, "global_step": 322585, "epoch": 1920} {"train_loss": -12.212553024291992, "global_step": 322586, "epoch": 1920} {"train_loss": -12.340215682983398, "global_step": 322587, "epoch": 1920} {"train_loss": -12.356376647949219, "global_step": 322588, "epoch": 1920} {"train_loss": -12.384628295898438, "global_step": 322589, "epoch": 1920} {"train_loss": -12.63692855834961, "global_step": 322590, "epoch": 1920} {"train_loss": -12.356206893920898, "global_step": 322591, "epoch": 1920} {"train_loss": -12.303726196289062, "global_step": 322592, "epoch": 1920} {"train_loss": -12.584251403808594, "global_step": 322593, "epoch": 1920} {"train_loss": -12.356945037841797, "global_step": 322594, "epoch": 1920} {"train_loss": -12.36732292175293, "global_step": 322595, "epoch": 1920} {"train_loss": -12.456801414489746, "global_step": 322596, "epoch": 1920} {"train_loss": -12.61182975769043, "global_step": 322597, "epoch": 1920} {"train_loss": -12.570326805114746, "global_step": 322598, "epoch": 1920} {"train_loss": -12.316659927368164, "global_step": 322599, "epoch": 1920} {"train_loss": -12.54829216003418, "global_step": 322600, "epoch": 1920} {"train_loss": -12.432641983032227, "global_step": 322601, "epoch": 1920} {"train_loss": -12.472238540649414, "global_step": 322602, "epoch": 1920} {"train_loss": -12.489670753479004, "global_step": 322603, "epoch": 1920} {"train_loss": -12.283723831176758, "global_step": 322604, "epoch": 1920} {"train_loss": -12.534444808959961, "global_step": 322605, "epoch": 1920} {"train_loss": -12.440811157226562, "global_step": 322606, "epoch": 1920} {"train_loss": -12.420618057250977, "global_step": 322607, "epoch": 1920} {"train_loss": -12.419361114501953, "global_step": 322608, "epoch": 1920} {"train_loss": -12.307055473327637, "global_step": 322609, "epoch": 1920} {"train_loss": -12.359003067016602, "global_step": 322610, "epoch": 1920} {"train_loss": -12.582767486572266, "global_step": 322611, "epoch": 1920} {"train_loss": -12.477014541625977, "global_step": 322612, "epoch": 1920} {"train_loss": -12.438363075256348, "global_step": 322613, "epoch": 1920} {"train_loss": -12.571073532104492, "global_step": 322614, "epoch": 1920} {"train_loss": -12.676841735839844, "global_step": 322615, "epoch": 1920} {"train_loss": -12.657400131225586, "global_step": 322616, "epoch": 1920} {"train_loss": -12.543659210205078, "global_step": 322617, "epoch": 1920} {"train_loss": -12.681670188903809, "global_step": 322618, "epoch": 1920} {"train_loss": -12.487919807434082, "global_step": 322619, "epoch": 1920} {"train_loss": -12.446741104125977, "global_step": 322620, "epoch": 1920} {"train_loss": -12.383910179138184, "global_step": 322621, "epoch": 1920} {"train_loss": -12.624811172485352, "global_step": 322622, "epoch": 1920} {"train_loss": -12.754755973815918, "global_step": 322623, "epoch": 1920} {"train_loss": -12.764904975891113, "global_step": 322624, "epoch": 1920} {"train_loss": -12.64195442199707, "global_step": 322625, "epoch": 1920} {"train_loss": -12.688508033752441, "global_step": 322626, "epoch": 1920} {"train_loss": -12.447931289672852, "global_step": 322627, "epoch": 1920} {"train_loss": -12.791911125183105, "global_step": 322628, "epoch": 1920} {"train_loss": -12.314411163330078, "global_step": 322629, "epoch": 1920} {"train_loss": -12.78133773803711, "global_step": 322630, "epoch": 1920} {"train_loss": -12.265678405761719, "global_step": 322631, "epoch": 1920} {"train_loss": -12.406310081481934, "global_step": 322632, "epoch": 1920} {"train_loss": -12.853067398071289, "global_step": 322633, "epoch": 1920} {"train_loss": -12.534075736999512, "global_step": 322634, "epoch": 1920} {"train_loss": -11.870655059814453, "global_step": 322635, "epoch": 1920} {"train_loss": -10.300529479980469, "global_step": 322636, "epoch": 1920} {"train_loss": -10.74848461151123, "global_step": 322637, "epoch": 1920} {"train_loss": -11.289419174194336, "global_step": 322638, "epoch": 1920} {"train_loss": -11.527341842651367, "global_step": 322639, "epoch": 1920} {"train_loss": -11.581886291503906, "global_step": 322640, "epoch": 1920} {"train_loss": -11.052445411682129, "global_step": 322641, "epoch": 1920} {"train_loss": -11.680215835571289, "global_step": 322642, "epoch": 1920} {"train_loss": -11.949196815490723, "global_step": 322643, "epoch": 1920} {"train_loss": -11.716804504394531, "global_step": 322644, "epoch": 1920} {"train_loss": -11.655452728271484, "global_step": 322645, "epoch": 1920} {"train_loss": -11.113567352294922, "global_step": 322646, "epoch": 1920} {"train_loss": -10.348548889160156, "global_step": 322647, "epoch": 1920} {"train_loss": -10.858732223510742, "global_step": 322648, "epoch": 1920} {"train_loss": -12.042366027832031, "global_step": 322649, "epoch": 1920} {"train_loss": -10.496788024902344, "global_step": 322650, "epoch": 1920} {"train_loss": -11.793441772460938, "global_step": 322651, "epoch": 1920} {"train_loss": -10.53533935546875, "global_step": 322652, "epoch": 1920} {"train_loss": -9.929666519165039, "global_step": 322653, "epoch": 1920} {"train_loss": -10.487499237060547, "global_step": 322654, "epoch": 1920} {"train_loss": -10.452088356018066, "global_step": 322655, "epoch": 1920} {"train_loss": -11.358367919921875, "global_step": 322656, "epoch": 1920} {"train_loss": -9.244169235229492, "global_step": 322657, "epoch": 1920} {"train_loss": -11.849830627441406, "global_step": 322658, "epoch": 1920} {"train_loss": -9.869731903076172, "global_step": 322659, "epoch": 1920} {"train_loss": -10.57872200012207, "global_step": 322660, "epoch": 1920} {"train_loss": -11.604928970336914, "global_step": 322661, "epoch": 1920} {"train_loss": -10.121322631835938, "global_step": 322662, "epoch": 1920} {"train_loss": -11.411128044128418, "global_step": 322663, "epoch": 1920} {"train_loss": -10.543703079223633, "global_step": 322664, "epoch": 1920} {"train_loss": -11.210525512695312, "global_step": 322665, "epoch": 1920} {"train_loss": -11.093574523925781, "global_step": 322666, "epoch": 1920} {"train_loss": -10.665787696838379, "global_step": 322667, "epoch": 1920} {"train_loss": -11.41334056854248, "global_step": 322668, "epoch": 1920} {"train_loss": -10.608367919921875, "global_step": 322669, "epoch": 1920} {"train_loss": -11.223430633544922, "global_step": 322670, "epoch": 1920} {"train_loss": -10.468975067138672, "global_step": 322671, "epoch": 1920} {"train_loss": -10.687457084655762, "global_step": 322672, "epoch": 1920} {"train_loss": -11.515560150146484, "global_step": 322673, "epoch": 1920} {"train_loss": -10.560585021972656, "global_step": 322674, "epoch": 1920} {"train_loss": -10.588811874389648, "global_step": 322675, "epoch": 1920} {"train_loss": -11.502885818481445, "global_step": 322676, "epoch": 1920} {"train_loss": -10.324728012084961, "global_step": 322677, "epoch": 1920} {"train_loss": -11.23294734954834, "global_step": 322678, "epoch": 1920} {"train_loss": -10.584352493286133, "global_step": 322679, "epoch": 1920} {"train_loss": -11.000905990600586, "global_step": 322680, "epoch": 1920} {"train_loss": -11.342018127441406, "global_step": 322681, "epoch": 1920} {"train_loss": -10.49574089050293, "global_step": 322682, "epoch": 1920} {"train_loss": -11.444297790527344, "global_step": 322683, "epoch": 1920} {"train_loss": -10.62379264831543, "global_step": 322684, "epoch": 1920} {"train_loss": -11.742094039916992, "global_step": 322685, "epoch": 1920} {"train_loss": -11.157569885253906, "global_step": 322686, "epoch": 1920} {"train_loss": -10.779714584350586, "global_step": 322687, "epoch": 1920} {"train_loss": -11.492568969726562, "global_step": 322688, "epoch": 1920} {"train_loss": -10.677162170410156, "global_step": 322689, "epoch": 1920} {"train_loss": -11.775640487670898, "global_step": 322690, "epoch": 1920} {"train_loss": -11.092884063720703, "global_step": 322691, "epoch": 1920} {"train_loss": -11.279231071472168, "global_step": 322692, "epoch": 1920} {"train_loss": -11.483148574829102, "global_step": 322693, "epoch": 1920} {"train_loss": -11.41621208190918, "global_step": 322694, "epoch": 1920} {"train_loss": -11.64108657836914, "global_step": 322695, "epoch": 1920} {"train_loss": -11.18557357788086, "global_step": 322696, "epoch": 1920} {"train_loss": -11.358182907104492, "global_step": 322697, "epoch": 1920} {"train_loss": -11.667580604553223, "global_step": 322698, "epoch": 1920} {"train_loss": -11.39913558959961, "global_step": 322699, "epoch": 1920} {"train_loss": -11.923666000366211, "global_step": 322700, "epoch": 1920} {"train_loss": -11.62112045288086, "global_step": 322701, "epoch": 1920} {"train_loss": -11.418437957763672, "global_step": 322702, "epoch": 1920} {"train_loss": -11.492201805114746, "global_step": 322703, "epoch": 1920} {"train_loss": -11.88125991821289, "global_step": 322704, "epoch": 1920} {"train_loss": -11.49530029296875, "global_step": 322705, "epoch": 1920} {"train_loss": -11.911870002746582, "global_step": 322706, "epoch": 1920} {"train_loss": -11.89860725402832, "global_step": 322707, "epoch": 1920} {"train_loss": -11.871458053588867, "global_step": 322708, "epoch": 1920} {"train_loss": -11.983564376831055, "global_step": 322709, "epoch": 1920} {"train_loss": -12.256807327270508, "global_step": 322710, "epoch": 1920} {"train_loss": -11.78602409362793, "global_step": 322711, "epoch": 1920} {"train_loss": -11.684638977050781, "global_step": 322712, "epoch": 1920} {"train_loss": -12.04305362701416, "global_step": 322713, "epoch": 1920} {"train_loss": -11.991169929504395, "global_step": 322714, "epoch": 1920} {"train_loss": -12.145991325378418, "global_step": 322715, "epoch": 1920} {"train_loss": -11.899527549743652, "global_step": 322716, "epoch": 1920} {"train_loss": -12.044567108154297, "global_step": 322717, "epoch": 1920} {"train_loss": -11.975875854492188, "global_step": 322718, "epoch": 1920} {"train_loss": -12.221567153930664, "global_step": 322719, "epoch": 1920} {"train_loss": -12.210139274597168, "global_step": 322720, "epoch": 1920} {"train_loss": -11.923896789550781, "global_step": 322721, "epoch": 1920} {"train_loss": -12.193304061889648, "global_step": 322722, "epoch": 1920} {"train_loss": -12.229418754577637, "global_step": 322723, "epoch": 1920} {"train_loss": -12.25072193145752, "global_step": 322724, "epoch": 1920} {"train_loss": -12.14301872253418, "global_step": 322725, "epoch": 1920} {"train_loss": -12.419819831848145, "global_step": 322726, "epoch": 1920} {"train_loss": -11.805826164427257, "global_step": 322727, "epoch": 1920, "val_loss": 288251.21875, "train_action_mse_error": 0.9520184993743896} {"train_loss": -12.20057487487793, "global_step": 322728, "epoch": 1921} {"train_loss": -12.130699157714844, "global_step": 322729, "epoch": 1921} {"train_loss": -12.181999206542969, "global_step": 322730, "epoch": 1921} {"train_loss": -12.24260425567627, "global_step": 322731, "epoch": 1921} {"train_loss": -12.352985382080078, "global_step": 322732, "epoch": 1921} {"train_loss": -12.248774528503418, "global_step": 322733, "epoch": 1921} {"train_loss": -12.11784553527832, "global_step": 322734, "epoch": 1921} {"train_loss": -12.542677879333496, "global_step": 322735, "epoch": 1921} {"train_loss": -12.258745193481445, "global_step": 322736, "epoch": 1921} {"train_loss": -12.490379333496094, "global_step": 322737, "epoch": 1921} {"train_loss": -12.388517379760742, "global_step": 322738, "epoch": 1921} {"train_loss": -12.412841796875, "global_step": 322739, "epoch": 1921} {"train_loss": -12.26333999633789, "global_step": 322740, "epoch": 1921} {"train_loss": -12.384306907653809, "global_step": 322741, "epoch": 1921} {"train_loss": -12.260812759399414, "global_step": 322742, "epoch": 1921} {"train_loss": -12.361509323120117, "global_step": 322743, "epoch": 1921} {"train_loss": -12.304817199707031, "global_step": 322744, "epoch": 1921} {"train_loss": -12.430333137512207, "global_step": 322745, "epoch": 1921} {"train_loss": -12.552045822143555, "global_step": 322746, "epoch": 1921} {"train_loss": -12.240686416625977, "global_step": 322747, "epoch": 1921} {"train_loss": -12.391672134399414, "global_step": 322748, "epoch": 1921} {"train_loss": -12.358148574829102, "global_step": 322749, "epoch": 1921} {"train_loss": -12.49979019165039, "global_step": 322750, "epoch": 1921} {"train_loss": -12.462385177612305, "global_step": 322751, "epoch": 1921} {"train_loss": -12.519878387451172, "global_step": 322752, "epoch": 1921} {"train_loss": -12.25143051147461, "global_step": 322753, "epoch": 1921} {"train_loss": -12.395795822143555, "global_step": 322754, "epoch": 1921} {"train_loss": -12.477962493896484, "global_step": 322755, "epoch": 1921} {"train_loss": -12.336819648742676, "global_step": 322756, "epoch": 1921} {"train_loss": -12.376764297485352, "global_step": 322757, "epoch": 1921} {"train_loss": -12.514881134033203, "global_step": 322758, "epoch": 1921} {"train_loss": -12.47432804107666, "global_step": 322759, "epoch": 1921} {"train_loss": -12.560806274414062, "global_step": 322760, "epoch": 1921} {"train_loss": -12.245071411132812, "global_step": 322761, "epoch": 1921} {"train_loss": -12.536866188049316, "global_step": 322762, "epoch": 1921} {"train_loss": -12.447977066040039, "global_step": 322763, "epoch": 1921} {"train_loss": -12.690120697021484, "global_step": 322764, "epoch": 1921} {"train_loss": -12.514138221740723, "global_step": 322765, "epoch": 1921} {"train_loss": -12.467090606689453, "global_step": 322766, "epoch": 1921} {"train_loss": -12.27022933959961, "global_step": 322767, "epoch": 1921} {"train_loss": -12.234949111938477, "global_step": 322768, "epoch": 1921} {"train_loss": -12.362525939941406, "global_step": 322769, "epoch": 1921} {"train_loss": -12.278215408325195, "global_step": 322770, "epoch": 1921} {"train_loss": -12.475858688354492, "global_step": 322771, "epoch": 1921} {"train_loss": -12.57012939453125, "global_step": 322772, "epoch": 1921} {"train_loss": -12.641777038574219, "global_step": 322773, "epoch": 1921} {"train_loss": -12.3021240234375, "global_step": 322774, "epoch": 1921} {"train_loss": -12.184393882751465, "global_step": 322775, "epoch": 1921} {"train_loss": -12.312191009521484, "global_step": 322776, "epoch": 1921} {"train_loss": -12.471380233764648, "global_step": 322777, "epoch": 1921} {"train_loss": -12.314393043518066, "global_step": 322778, "epoch": 1921} {"train_loss": -12.205621719360352, "global_step": 322779, "epoch": 1921} {"train_loss": -12.333097457885742, "global_step": 322780, "epoch": 1921} {"train_loss": -12.205145835876465, "global_step": 322781, "epoch": 1921} {"train_loss": -12.002408981323242, "global_step": 322782, "epoch": 1921} {"train_loss": -12.642423629760742, "global_step": 322783, "epoch": 1921} {"train_loss": -12.070762634277344, "global_step": 322784, "epoch": 1921} {"train_loss": -12.361822128295898, "global_step": 322785, "epoch": 1921} {"train_loss": -11.937653541564941, "global_step": 322786, "epoch": 1921} {"train_loss": -11.620946884155273, "global_step": 322787, "epoch": 1921} {"train_loss": -11.456695556640625, "global_step": 322788, "epoch": 1921} {"train_loss": -12.119659423828125, "global_step": 322789, "epoch": 1921} {"train_loss": -11.938725471496582, "global_step": 322790, "epoch": 1921} {"train_loss": -12.118645668029785, "global_step": 322791, "epoch": 1921} {"train_loss": -11.408126831054688, "global_step": 322792, "epoch": 1921} {"train_loss": -10.346882820129395, "global_step": 322793, "epoch": 1921} {"train_loss": -11.421372413635254, "global_step": 322794, "epoch": 1921} {"train_loss": -12.597766876220703, "global_step": 322795, "epoch": 1921} {"train_loss": -12.093482971191406, "global_step": 322796, "epoch": 1921} {"train_loss": -11.16221809387207, "global_step": 322797, "epoch": 1921} {"train_loss": -11.926998138427734, "global_step": 322798, "epoch": 1921} {"train_loss": -12.322283744812012, "global_step": 322799, "epoch": 1921} {"train_loss": -12.455770492553711, "global_step": 322800, "epoch": 1921} {"train_loss": -12.289803504943848, "global_step": 322801, "epoch": 1921} {"train_loss": -12.601581573486328, "global_step": 322802, "epoch": 1921} {"train_loss": -12.301300048828125, "global_step": 322803, "epoch": 1921} {"train_loss": -12.190217971801758, "global_step": 322804, "epoch": 1921} {"train_loss": -12.072859764099121, "global_step": 322805, "epoch": 1921} {"train_loss": -12.226705551147461, "global_step": 322806, "epoch": 1921} {"train_loss": -12.270633697509766, "global_step": 322807, "epoch": 1921} {"train_loss": -12.543793678283691, "global_step": 322808, "epoch": 1921} {"train_loss": -11.328289031982422, "global_step": 322809, "epoch": 1921} {"train_loss": -12.025798797607422, "global_step": 322810, "epoch": 1921} {"train_loss": -11.50826644897461, "global_step": 322811, "epoch": 1921} {"train_loss": -10.299736022949219, "global_step": 322812, "epoch": 1921} {"train_loss": -10.627653121948242, "global_step": 322813, "epoch": 1921} {"train_loss": -10.829183578491211, "global_step": 322814, "epoch": 1921} {"train_loss": -11.166142463684082, "global_step": 322815, "epoch": 1921} {"train_loss": -10.787487030029297, "global_step": 322816, "epoch": 1921} {"train_loss": -11.206942558288574, "global_step": 322817, "epoch": 1921} {"train_loss": -11.74854850769043, "global_step": 322818, "epoch": 1921} {"train_loss": -11.071868896484375, "global_step": 322819, "epoch": 1921} {"train_loss": -11.791927337646484, "global_step": 322820, "epoch": 1921} {"train_loss": -10.895431518554688, "global_step": 322821, "epoch": 1921} {"train_loss": -10.501254081726074, "global_step": 322822, "epoch": 1921} {"train_loss": -11.072868347167969, "global_step": 322823, "epoch": 1921} {"train_loss": -10.492080688476562, "global_step": 322824, "epoch": 1921} {"train_loss": -11.101722717285156, "global_step": 322825, "epoch": 1921} {"train_loss": -10.154666900634766, "global_step": 322826, "epoch": 1921} {"train_loss": -10.339902877807617, "global_step": 322827, "epoch": 1921} {"train_loss": -10.302498817443848, "global_step": 322828, "epoch": 1921} {"train_loss": -10.781177520751953, "global_step": 322829, "epoch": 1921} {"train_loss": -9.850769996643066, "global_step": 322830, "epoch": 1921} {"train_loss": -8.130400657653809, "global_step": 322831, "epoch": 1921} {"train_loss": -8.09771728515625, "global_step": 322832, "epoch": 1921} {"train_loss": -9.58120059967041, "global_step": 322833, "epoch": 1921} {"train_loss": -10.522562026977539, "global_step": 322834, "epoch": 1921} {"train_loss": -9.757733345031738, "global_step": 322835, "epoch": 1921} {"train_loss": -9.051490783691406, "global_step": 322836, "epoch": 1921} {"train_loss": -9.254436492919922, "global_step": 322837, "epoch": 1921} {"train_loss": -10.356048583984375, "global_step": 322838, "epoch": 1921} {"train_loss": -9.575443267822266, "global_step": 322839, "epoch": 1921} {"train_loss": -10.506765365600586, "global_step": 322840, "epoch": 1921} {"train_loss": -10.614999771118164, "global_step": 322841, "epoch": 1921} {"train_loss": -11.246399879455566, "global_step": 322842, "epoch": 1921} {"train_loss": -11.439544677734375, "global_step": 322843, "epoch": 1921} {"train_loss": -10.93090534210205, "global_step": 322844, "epoch": 1921} {"train_loss": -11.446609497070312, "global_step": 322845, "epoch": 1921} {"train_loss": -11.330259323120117, "global_step": 322846, "epoch": 1921} {"train_loss": -10.512041091918945, "global_step": 322847, "epoch": 1921} {"train_loss": -10.79563045501709, "global_step": 322848, "epoch": 1921} {"train_loss": -11.132185935974121, "global_step": 322849, "epoch": 1921} {"train_loss": -11.354304313659668, "global_step": 322850, "epoch": 1921} {"train_loss": -11.487627029418945, "global_step": 322851, "epoch": 1921} {"train_loss": -10.870221138000488, "global_step": 322852, "epoch": 1921} {"train_loss": -11.199616432189941, "global_step": 322853, "epoch": 1921} {"train_loss": -11.317804336547852, "global_step": 322854, "epoch": 1921} {"train_loss": -11.07785415649414, "global_step": 322855, "epoch": 1921} {"train_loss": -11.414398193359375, "global_step": 322856, "epoch": 1921} {"train_loss": -11.302111625671387, "global_step": 322857, "epoch": 1921} {"train_loss": -11.39303207397461, "global_step": 322858, "epoch": 1921} {"train_loss": -11.720836639404297, "global_step": 322859, "epoch": 1921} {"train_loss": -11.187908172607422, "global_step": 322860, "epoch": 1921} {"train_loss": -11.332822799682617, "global_step": 322861, "epoch": 1921} {"train_loss": -11.394027709960938, "global_step": 322862, "epoch": 1921} {"train_loss": -11.663978576660156, "global_step": 322863, "epoch": 1921} {"train_loss": -11.23652458190918, "global_step": 322864, "epoch": 1921} {"train_loss": -11.679853439331055, "global_step": 322865, "epoch": 1921} {"train_loss": -11.062374114990234, "global_step": 322866, "epoch": 1921} {"train_loss": -11.902314186096191, "global_step": 322867, "epoch": 1921} {"train_loss": -11.532593727111816, "global_step": 322868, "epoch": 1921} {"train_loss": -11.683916091918945, "global_step": 322869, "epoch": 1921} {"train_loss": -11.790691375732422, "global_step": 322870, "epoch": 1921} {"train_loss": -11.71643352508545, "global_step": 322871, "epoch": 1921} {"train_loss": -11.526880264282227, "global_step": 322872, "epoch": 1921} {"train_loss": -11.976236343383789, "global_step": 322873, "epoch": 1921} {"train_loss": -11.58919906616211, "global_step": 322874, "epoch": 1921} {"train_loss": -11.653203964233398, "global_step": 322875, "epoch": 1921} {"train_loss": -11.879520416259766, "global_step": 322876, "epoch": 1921} {"train_loss": -11.369195938110352, "global_step": 322877, "epoch": 1921} {"train_loss": -11.695971488952637, "global_step": 322878, "epoch": 1921} {"train_loss": -11.791130065917969, "global_step": 322879, "epoch": 1921} {"train_loss": -11.629390716552734, "global_step": 322880, "epoch": 1921} {"train_loss": -12.125518798828125, "global_step": 322881, "epoch": 1921} {"train_loss": -11.943645477294922, "global_step": 322882, "epoch": 1921} {"train_loss": -12.096916198730469, "global_step": 322883, "epoch": 1921} {"train_loss": -11.834040641784668, "global_step": 322884, "epoch": 1921} {"train_loss": -12.013267517089844, "global_step": 322885, "epoch": 1921} {"train_loss": -11.856298446655273, "global_step": 322886, "epoch": 1921} {"train_loss": -11.985089302062988, "global_step": 322887, "epoch": 1921} {"train_loss": -12.050287246704102, "global_step": 322888, "epoch": 1921} {"train_loss": -12.145706176757812, "global_step": 322889, "epoch": 1921} {"train_loss": -12.08837890625, "global_step": 322890, "epoch": 1921} {"train_loss": -12.140755653381348, "global_step": 322891, "epoch": 1921} {"train_loss": -12.163604736328125, "global_step": 322892, "epoch": 1921} {"train_loss": -12.270566940307617, "global_step": 322893, "epoch": 1921} {"train_loss": -12.046884536743164, "global_step": 322894, "epoch": 1921} {"train_loss": -11.690877840632485, "global_step": 322895, "epoch": 1921, "val_loss": 287351.40625} {"train_loss": -12.151748657226562, "global_step": 322896, "epoch": 1922} {"train_loss": -12.30221939086914, "global_step": 322897, "epoch": 1922} {"train_loss": -12.051852226257324, "global_step": 322898, "epoch": 1922} {"train_loss": -12.28351879119873, "global_step": 322899, "epoch": 1922} {"train_loss": -12.362921714782715, "global_step": 322900, "epoch": 1922} {"train_loss": -12.220172882080078, "global_step": 322901, "epoch": 1922} {"train_loss": -12.503447532653809, "global_step": 322902, "epoch": 1922} {"train_loss": -12.053462982177734, "global_step": 322903, "epoch": 1922} {"train_loss": -12.180343627929688, "global_step": 322904, "epoch": 1922} {"train_loss": -12.169944763183594, "global_step": 322905, "epoch": 1922} {"train_loss": -12.259773254394531, "global_step": 322906, "epoch": 1922} {"train_loss": -12.209630966186523, "global_step": 322907, "epoch": 1922} {"train_loss": -11.918436050415039, "global_step": 322908, "epoch": 1922} {"train_loss": -11.837716102600098, "global_step": 322909, "epoch": 1922} {"train_loss": -11.958710670471191, "global_step": 322910, "epoch": 1922} {"train_loss": -10.864694595336914, "global_step": 322911, "epoch": 1922} {"train_loss": -11.992779731750488, "global_step": 322912, "epoch": 1922} {"train_loss": -12.118307113647461, "global_step": 322913, "epoch": 1922} {"train_loss": -12.165915489196777, "global_step": 322914, "epoch": 1922} {"train_loss": -11.861059188842773, "global_step": 322915, "epoch": 1922} {"train_loss": -12.138873100280762, "global_step": 322916, "epoch": 1922} {"train_loss": -12.002842903137207, "global_step": 322917, "epoch": 1922} {"train_loss": -12.17758560180664, "global_step": 322918, "epoch": 1922} {"train_loss": -12.2875337600708, "global_step": 322919, "epoch": 1922} {"train_loss": -12.476924896240234, "global_step": 322920, "epoch": 1922} {"train_loss": -12.125720977783203, "global_step": 322921, "epoch": 1922} {"train_loss": -12.00238037109375, "global_step": 322922, "epoch": 1922} {"train_loss": -12.30882453918457, "global_step": 322923, "epoch": 1922} {"train_loss": -12.042612075805664, "global_step": 322924, "epoch": 1922} {"train_loss": -12.439659118652344, "global_step": 322925, "epoch": 1922} {"train_loss": -12.217652320861816, "global_step": 322926, "epoch": 1922} {"train_loss": -12.157413482666016, "global_step": 322927, "epoch": 1922} {"train_loss": -12.275280952453613, "global_step": 322928, "epoch": 1922} {"train_loss": -12.536152839660645, "global_step": 322929, "epoch": 1922} {"train_loss": -12.354476928710938, "global_step": 322930, "epoch": 1922} {"train_loss": -12.242300033569336, "global_step": 322931, "epoch": 1922} {"train_loss": -12.2227201461792, "global_step": 322932, "epoch": 1922} {"train_loss": -12.405984878540039, "global_step": 322933, "epoch": 1922} {"train_loss": -12.517210006713867, "global_step": 322934, "epoch": 1922} {"train_loss": -12.453105926513672, "global_step": 322935, "epoch": 1922} {"train_loss": -12.349543571472168, "global_step": 322936, "epoch": 1922} {"train_loss": -12.403570175170898, "global_step": 322937, "epoch": 1922} {"train_loss": -12.25221061706543, "global_step": 322938, "epoch": 1922} {"train_loss": -12.209965705871582, "global_step": 322939, "epoch": 1922} {"train_loss": -12.170289039611816, "global_step": 322940, "epoch": 1922} {"train_loss": -12.234367370605469, "global_step": 322941, "epoch": 1922} {"train_loss": -12.044758796691895, "global_step": 322942, "epoch": 1922} {"train_loss": -12.508190155029297, "global_step": 322943, "epoch": 1922} {"train_loss": -11.925899505615234, "global_step": 322944, "epoch": 1922} {"train_loss": -12.080304145812988, "global_step": 322945, "epoch": 1922} {"train_loss": -12.33638858795166, "global_step": 322946, "epoch": 1922} {"train_loss": -12.383903503417969, "global_step": 322947, "epoch": 1922} {"train_loss": -12.448800086975098, "global_step": 322948, "epoch": 1922} {"train_loss": -12.55043888092041, "global_step": 322949, "epoch": 1922} {"train_loss": -12.53870964050293, "global_step": 322950, "epoch": 1922} {"train_loss": -12.405941009521484, "global_step": 322951, "epoch": 1922} {"train_loss": -12.605034828186035, "global_step": 322952, "epoch": 1922} {"train_loss": -12.35206413269043, "global_step": 322953, "epoch": 1922} {"train_loss": -12.679372787475586, "global_step": 322954, "epoch": 1922} {"train_loss": -12.429461479187012, "global_step": 322955, "epoch": 1922} {"train_loss": -12.630054473876953, "global_step": 322956, "epoch": 1922} {"train_loss": -12.454309463500977, "global_step": 322957, "epoch": 1922} {"train_loss": -12.428532600402832, "global_step": 322958, "epoch": 1922} {"train_loss": -12.372045516967773, "global_step": 322959, "epoch": 1922} {"train_loss": -12.478120803833008, "global_step": 322960, "epoch": 1922} {"train_loss": -11.68777847290039, "global_step": 322961, "epoch": 1922} {"train_loss": -12.73532772064209, "global_step": 322962, "epoch": 1922} {"train_loss": -12.079946517944336, "global_step": 322963, "epoch": 1922} {"train_loss": -11.481298446655273, "global_step": 322964, "epoch": 1922} {"train_loss": -12.110662460327148, "global_step": 322965, "epoch": 1922} {"train_loss": -11.540157318115234, "global_step": 322966, "epoch": 1922} {"train_loss": -11.09822940826416, "global_step": 322967, "epoch": 1922} {"train_loss": -11.25117015838623, "global_step": 322968, "epoch": 1922} {"train_loss": -11.666287422180176, "global_step": 322969, "epoch": 1922} {"train_loss": -11.040268898010254, "global_step": 322970, "epoch": 1922} {"train_loss": -12.102746963500977, "global_step": 322971, "epoch": 1922} {"train_loss": -11.22260570526123, "global_step": 322972, "epoch": 1922} {"train_loss": -11.446432113647461, "global_step": 322973, "epoch": 1922} {"train_loss": -11.23398208618164, "global_step": 322974, "epoch": 1922} {"train_loss": -11.560376167297363, "global_step": 322975, "epoch": 1922} {"train_loss": -10.656363487243652, "global_step": 322976, "epoch": 1922} {"train_loss": -10.008455276489258, "global_step": 322977, "epoch": 1922} {"train_loss": -11.782691955566406, "global_step": 322978, "epoch": 1922} {"train_loss": -10.943275451660156, "global_step": 322979, "epoch": 1922} {"train_loss": -11.211135864257812, "global_step": 322980, "epoch": 1922} {"train_loss": -11.94007682800293, "global_step": 322981, "epoch": 1922} {"train_loss": -10.9602632522583, "global_step": 322982, "epoch": 1922} {"train_loss": -11.023334503173828, "global_step": 322983, "epoch": 1922} {"train_loss": -11.820174217224121, "global_step": 322984, "epoch": 1922} {"train_loss": -11.382802963256836, "global_step": 322985, "epoch": 1922} {"train_loss": -11.286452293395996, "global_step": 322986, "epoch": 1922} {"train_loss": -11.391888618469238, "global_step": 322987, "epoch": 1922} {"train_loss": -11.183008193969727, "global_step": 322988, "epoch": 1922} {"train_loss": -11.17370891571045, "global_step": 322989, "epoch": 1922} {"train_loss": -10.775568008422852, "global_step": 322990, "epoch": 1922} {"train_loss": -8.946695327758789, "global_step": 322991, "epoch": 1922} {"train_loss": -9.381937026977539, "global_step": 322992, "epoch": 1922} {"train_loss": -11.374837875366211, "global_step": 322993, "epoch": 1922} {"train_loss": -10.195138931274414, "global_step": 322994, "epoch": 1922} {"train_loss": -10.909061431884766, "global_step": 322995, "epoch": 1922} {"train_loss": -11.076238632202148, "global_step": 322996, "epoch": 1922} {"train_loss": -10.782777786254883, "global_step": 322997, "epoch": 1922} {"train_loss": -11.14840316772461, "global_step": 322998, "epoch": 1922} {"train_loss": -11.300771713256836, "global_step": 322999, "epoch": 1922} {"train_loss": -11.47275161743164, "global_step": 323000, "epoch": 1922} {"train_loss": -11.685153007507324, "global_step": 323001, "epoch": 1922} {"train_loss": -10.908821105957031, "global_step": 323002, "epoch": 1922} {"train_loss": -11.634160995483398, "global_step": 323003, "epoch": 1922} {"train_loss": -10.698158264160156, "global_step": 323004, "epoch": 1922} {"train_loss": -11.656916618347168, "global_step": 323005, "epoch": 1922} {"train_loss": -10.637158393859863, "global_step": 323006, "epoch": 1922} {"train_loss": -11.305397033691406, "global_step": 323007, "epoch": 1922} {"train_loss": -10.759822845458984, "global_step": 323008, "epoch": 1922} {"train_loss": -11.04574203491211, "global_step": 323009, "epoch": 1922} {"train_loss": -10.901250839233398, "global_step": 323010, "epoch": 1922} {"train_loss": -11.679169654846191, "global_step": 323011, "epoch": 1922} {"train_loss": -11.17275333404541, "global_step": 323012, "epoch": 1922} {"train_loss": -11.678180694580078, "global_step": 323013, "epoch": 1922} {"train_loss": -11.195877075195312, "global_step": 323014, "epoch": 1922} {"train_loss": -11.495994567871094, "global_step": 323015, "epoch": 1922} {"train_loss": -11.65900993347168, "global_step": 323016, "epoch": 1922} {"train_loss": -11.812788009643555, "global_step": 323017, "epoch": 1922} {"train_loss": -11.694449424743652, "global_step": 323018, "epoch": 1922} {"train_loss": -11.436185836791992, "global_step": 323019, "epoch": 1922} {"train_loss": -11.550973892211914, "global_step": 323020, "epoch": 1922} {"train_loss": -11.16792106628418, "global_step": 323021, "epoch": 1922} {"train_loss": -11.794269561767578, "global_step": 323022, "epoch": 1922} {"train_loss": -11.081438064575195, "global_step": 323023, "epoch": 1922} {"train_loss": -11.686904907226562, "global_step": 323024, "epoch": 1922} {"train_loss": -11.471297264099121, "global_step": 323025, "epoch": 1922} {"train_loss": -11.558945655822754, "global_step": 323026, "epoch": 1922} {"train_loss": -11.586625099182129, "global_step": 323027, "epoch": 1922} {"train_loss": -11.769819259643555, "global_step": 323028, "epoch": 1922} {"train_loss": -11.447402954101562, "global_step": 323029, "epoch": 1922} {"train_loss": -11.696220397949219, "global_step": 323030, "epoch": 1922} {"train_loss": -11.673017501831055, "global_step": 323031, "epoch": 1922} {"train_loss": -11.047330856323242, "global_step": 323032, "epoch": 1922} {"train_loss": -12.003114700317383, "global_step": 323033, "epoch": 1922} {"train_loss": -11.6610107421875, "global_step": 323034, "epoch": 1922} {"train_loss": -11.811206817626953, "global_step": 323035, "epoch": 1922} {"train_loss": -11.564674377441406, "global_step": 323036, "epoch": 1922} {"train_loss": -12.086633682250977, "global_step": 323037, "epoch": 1922} {"train_loss": -11.736715316772461, "global_step": 323038, "epoch": 1922} {"train_loss": -12.182584762573242, "global_step": 323039, "epoch": 1922} {"train_loss": -11.873540878295898, "global_step": 323040, "epoch": 1922} {"train_loss": -12.129974365234375, "global_step": 323041, "epoch": 1922} {"train_loss": -11.941535949707031, "global_step": 323042, "epoch": 1922} {"train_loss": -12.043558120727539, "global_step": 323043, "epoch": 1922} {"train_loss": -12.094433784484863, "global_step": 323044, "epoch": 1922} {"train_loss": -12.037044525146484, "global_step": 323045, "epoch": 1922} {"train_loss": -12.32252025604248, "global_step": 323046, "epoch": 1922} {"train_loss": -12.074697494506836, "global_step": 323047, "epoch": 1922} {"train_loss": -12.029037475585938, "global_step": 323048, "epoch": 1922} {"train_loss": -11.571418762207031, "global_step": 323049, "epoch": 1922} {"train_loss": -12.072513580322266, "global_step": 323050, "epoch": 1922} {"train_loss": -11.558303833007812, "global_step": 323051, "epoch": 1922} {"train_loss": -12.261573791503906, "global_step": 323052, "epoch": 1922} {"train_loss": -11.882450103759766, "global_step": 323053, "epoch": 1922} {"train_loss": -12.241209030151367, "global_step": 323054, "epoch": 1922} {"train_loss": -11.818642616271973, "global_step": 323055, "epoch": 1922} {"train_loss": -12.314981460571289, "global_step": 323056, "epoch": 1922} {"train_loss": -11.851572036743164, "global_step": 323057, "epoch": 1922} {"train_loss": -12.293549537658691, "global_step": 323058, "epoch": 1922} {"train_loss": -11.910911560058594, "global_step": 323059, "epoch": 1922} {"train_loss": -12.285573959350586, "global_step": 323060, "epoch": 1922} {"train_loss": -11.95484733581543, "global_step": 323061, "epoch": 1922} {"train_loss": -12.190337181091309, "global_step": 323062, "epoch": 1922} {"train_loss": -11.791796706971668, "global_step": 323063, "epoch": 1922, "val_loss": 284259.53125} {"train_loss": -12.075724601745605, "global_step": 323064, "epoch": 1923} {"train_loss": -12.047136306762695, "global_step": 323065, "epoch": 1923} {"train_loss": -12.280683517456055, "global_step": 323066, "epoch": 1923} {"train_loss": -12.07614517211914, "global_step": 323067, "epoch": 1923} {"train_loss": -12.090505599975586, "global_step": 323068, "epoch": 1923} {"train_loss": -11.848925590515137, "global_step": 323069, "epoch": 1923} {"train_loss": -12.300989151000977, "global_step": 323070, "epoch": 1923} {"train_loss": -11.844263076782227, "global_step": 323071, "epoch": 1923} {"train_loss": -12.340473175048828, "global_step": 323072, "epoch": 1923} {"train_loss": -11.909992218017578, "global_step": 323073, "epoch": 1923} {"train_loss": -12.122933387756348, "global_step": 323074, "epoch": 1923} {"train_loss": -11.84814453125, "global_step": 323075, "epoch": 1923} {"train_loss": -12.280655860900879, "global_step": 323076, "epoch": 1923} {"train_loss": -11.999980926513672, "global_step": 323077, "epoch": 1923} {"train_loss": -12.41681957244873, "global_step": 323078, "epoch": 1923} {"train_loss": -12.085733413696289, "global_step": 323079, "epoch": 1923} {"train_loss": -12.221237182617188, "global_step": 323080, "epoch": 1923} {"train_loss": -12.032537460327148, "global_step": 323081, "epoch": 1923} {"train_loss": -12.27617073059082, "global_step": 323082, "epoch": 1923} {"train_loss": -12.202740669250488, "global_step": 323083, "epoch": 1923} {"train_loss": -12.412592887878418, "global_step": 323084, "epoch": 1923} {"train_loss": -12.09646224975586, "global_step": 323085, "epoch": 1923} {"train_loss": -12.223936080932617, "global_step": 323086, "epoch": 1923} {"train_loss": -12.40945816040039, "global_step": 323087, "epoch": 1923} {"train_loss": -12.30961799621582, "global_step": 323088, "epoch": 1923} {"train_loss": -12.357776641845703, "global_step": 323089, "epoch": 1923} {"train_loss": -12.350091934204102, "global_step": 323090, "epoch": 1923} {"train_loss": -12.409433364868164, "global_step": 323091, "epoch": 1923} {"train_loss": -12.472082138061523, "global_step": 323092, "epoch": 1923} {"train_loss": -12.490983009338379, "global_step": 323093, "epoch": 1923} {"train_loss": -12.430938720703125, "global_step": 323094, "epoch": 1923} {"train_loss": -12.399796485900879, "global_step": 323095, "epoch": 1923} {"train_loss": -12.548504829406738, "global_step": 323096, "epoch": 1923} {"train_loss": -12.337869644165039, "global_step": 323097, "epoch": 1923} {"train_loss": -12.481569290161133, "global_step": 323098, "epoch": 1923} {"train_loss": -12.562705993652344, "global_step": 323099, "epoch": 1923} {"train_loss": -12.477859497070312, "global_step": 323100, "epoch": 1923} {"train_loss": -12.519083023071289, "global_step": 323101, "epoch": 1923} {"train_loss": -12.206127166748047, "global_step": 323102, "epoch": 1923} {"train_loss": -12.623517990112305, "global_step": 323103, "epoch": 1923} {"train_loss": -12.5050630569458, "global_step": 323104, "epoch": 1923} {"train_loss": -12.44957160949707, "global_step": 323105, "epoch": 1923} {"train_loss": -12.504908561706543, "global_step": 323106, "epoch": 1923} {"train_loss": -12.424539566040039, "global_step": 323107, "epoch": 1923} {"train_loss": -12.544870376586914, "global_step": 323108, "epoch": 1923} {"train_loss": -12.538002014160156, "global_step": 323109, "epoch": 1923} {"train_loss": -12.46315860748291, "global_step": 323110, "epoch": 1923} {"train_loss": -12.456024169921875, "global_step": 323111, "epoch": 1923} {"train_loss": -12.605806350708008, "global_step": 323112, "epoch": 1923} {"train_loss": -12.354324340820312, "global_step": 323113, "epoch": 1923} {"train_loss": -12.411598205566406, "global_step": 323114, "epoch": 1923} {"train_loss": -12.26840591430664, "global_step": 323115, "epoch": 1923} {"train_loss": -12.539185523986816, "global_step": 323116, "epoch": 1923} {"train_loss": -12.360459327697754, "global_step": 323117, "epoch": 1923} {"train_loss": -12.165359497070312, "global_step": 323118, "epoch": 1923} {"train_loss": -12.108261108398438, "global_step": 323119, "epoch": 1923} {"train_loss": -11.71147346496582, "global_step": 323120, "epoch": 1923} {"train_loss": -10.932920455932617, "global_step": 323121, "epoch": 1923} {"train_loss": -12.096242904663086, "global_step": 323122, "epoch": 1923} {"train_loss": -11.758039474487305, "global_step": 323123, "epoch": 1923} {"train_loss": -11.597476959228516, "global_step": 323124, "epoch": 1923} {"train_loss": -10.683913230895996, "global_step": 323125, "epoch": 1923} {"train_loss": -10.949888229370117, "global_step": 323126, "epoch": 1923} {"train_loss": -11.918340682983398, "global_step": 323127, "epoch": 1923} {"train_loss": -11.765874862670898, "global_step": 323128, "epoch": 1923} {"train_loss": -11.163741111755371, "global_step": 323129, "epoch": 1923} {"train_loss": -10.934337615966797, "global_step": 323130, "epoch": 1923} {"train_loss": -10.439218521118164, "global_step": 323131, "epoch": 1923} {"train_loss": -11.123661994934082, "global_step": 323132, "epoch": 1923} {"train_loss": -12.207271575927734, "global_step": 323133, "epoch": 1923} {"train_loss": -11.266593933105469, "global_step": 323134, "epoch": 1923} {"train_loss": -11.693634033203125, "global_step": 323135, "epoch": 1923} {"train_loss": -11.147090911865234, "global_step": 323136, "epoch": 1923} {"train_loss": -11.926671981811523, "global_step": 323137, "epoch": 1923} {"train_loss": -11.870695114135742, "global_step": 323138, "epoch": 1923} {"train_loss": -11.912735939025879, "global_step": 323139, "epoch": 1923} {"train_loss": -11.185068130493164, "global_step": 323140, "epoch": 1923} {"train_loss": -11.936328887939453, "global_step": 323141, "epoch": 1923} {"train_loss": -11.366656303405762, "global_step": 323142, "epoch": 1923} {"train_loss": -11.874897956848145, "global_step": 323143, "epoch": 1923} {"train_loss": -11.76164436340332, "global_step": 323144, "epoch": 1923} {"train_loss": -11.679608345031738, "global_step": 323145, "epoch": 1923} {"train_loss": -12.101400375366211, "global_step": 323146, "epoch": 1923} {"train_loss": -11.890054702758789, "global_step": 323147, "epoch": 1923} {"train_loss": -12.16823959350586, "global_step": 323148, "epoch": 1923} {"train_loss": -12.089055061340332, "global_step": 323149, "epoch": 1923} {"train_loss": -11.727365493774414, "global_step": 323150, "epoch": 1923} {"train_loss": -11.796260833740234, "global_step": 323151, "epoch": 1923} {"train_loss": -11.847816467285156, "global_step": 323152, "epoch": 1923} {"train_loss": -11.83905029296875, "global_step": 323153, "epoch": 1923} {"train_loss": -11.369285583496094, "global_step": 323154, "epoch": 1923} {"train_loss": -12.176827430725098, "global_step": 323155, "epoch": 1923} {"train_loss": -11.443492889404297, "global_step": 323156, "epoch": 1923} {"train_loss": -11.694931030273438, "global_step": 323157, "epoch": 1923} {"train_loss": -11.26749324798584, "global_step": 323158, "epoch": 1923} {"train_loss": -12.112455368041992, "global_step": 323159, "epoch": 1923} {"train_loss": -11.826273918151855, "global_step": 323160, "epoch": 1923} {"train_loss": -11.85236930847168, "global_step": 323161, "epoch": 1923} {"train_loss": -11.118066787719727, "global_step": 323162, "epoch": 1923} {"train_loss": -11.442124366760254, "global_step": 323163, "epoch": 1923} {"train_loss": -11.961641311645508, "global_step": 323164, "epoch": 1923} {"train_loss": -11.447422981262207, "global_step": 323165, "epoch": 1923} {"train_loss": -11.489187240600586, "global_step": 323166, "epoch": 1923} {"train_loss": -11.515617370605469, "global_step": 323167, "epoch": 1923} {"train_loss": -11.2413330078125, "global_step": 323168, "epoch": 1923} {"train_loss": -12.068811416625977, "global_step": 323169, "epoch": 1923} {"train_loss": -11.227807998657227, "global_step": 323170, "epoch": 1923} {"train_loss": -11.21780776977539, "global_step": 323171, "epoch": 1923} {"train_loss": -12.05681037902832, "global_step": 323172, "epoch": 1923} {"train_loss": -11.348626136779785, "global_step": 323173, "epoch": 1923} {"train_loss": -11.985984802246094, "global_step": 323174, "epoch": 1923} {"train_loss": -11.56702995300293, "global_step": 323175, "epoch": 1923} {"train_loss": -11.66906452178955, "global_step": 323176, "epoch": 1923} {"train_loss": -11.835760116577148, "global_step": 323177, "epoch": 1923} {"train_loss": -11.96868896484375, "global_step": 323178, "epoch": 1923} {"train_loss": -11.866641998291016, "global_step": 323179, "epoch": 1923} {"train_loss": -11.744633674621582, "global_step": 323180, "epoch": 1923} {"train_loss": -11.942316055297852, "global_step": 323181, "epoch": 1923} {"train_loss": -11.544456481933594, "global_step": 323182, "epoch": 1923} {"train_loss": -11.473346710205078, "global_step": 323183, "epoch": 1923} {"train_loss": -11.756481170654297, "global_step": 323184, "epoch": 1923} {"train_loss": -11.329532623291016, "global_step": 323185, "epoch": 1923} {"train_loss": -11.920217514038086, "global_step": 323186, "epoch": 1923} {"train_loss": -12.160688400268555, "global_step": 323187, "epoch": 1923} {"train_loss": -11.626617431640625, "global_step": 323188, "epoch": 1923} {"train_loss": -12.167737007141113, "global_step": 323189, "epoch": 1923} {"train_loss": -11.983720779418945, "global_step": 323190, "epoch": 1923} {"train_loss": -12.298568725585938, "global_step": 323191, "epoch": 1923} {"train_loss": -12.040148735046387, "global_step": 323192, "epoch": 1923} {"train_loss": -12.382682800292969, "global_step": 323193, "epoch": 1923} {"train_loss": -12.07481861114502, "global_step": 323194, "epoch": 1923} {"train_loss": -12.180286407470703, "global_step": 323195, "epoch": 1923} {"train_loss": -12.002849578857422, "global_step": 323196, "epoch": 1923} {"train_loss": -11.976685523986816, "global_step": 323197, "epoch": 1923} {"train_loss": -12.126810073852539, "global_step": 323198, "epoch": 1923} {"train_loss": -12.125923156738281, "global_step": 323199, "epoch": 1923} {"train_loss": -11.977167129516602, "global_step": 323200, "epoch": 1923} {"train_loss": -12.088136672973633, "global_step": 323201, "epoch": 1923} {"train_loss": -12.145284652709961, "global_step": 323202, "epoch": 1923} {"train_loss": -12.451763153076172, "global_step": 323203, "epoch": 1923} {"train_loss": -11.841446876525879, "global_step": 323204, "epoch": 1923} {"train_loss": -12.329569816589355, "global_step": 323205, "epoch": 1923} {"train_loss": -11.949291229248047, "global_step": 323206, "epoch": 1923} {"train_loss": -12.337221145629883, "global_step": 323207, "epoch": 1923} {"train_loss": -12.20815658569336, "global_step": 323208, "epoch": 1923} {"train_loss": -12.153886795043945, "global_step": 323209, "epoch": 1923} {"train_loss": -12.421224594116211, "global_step": 323210, "epoch": 1923} {"train_loss": -12.344289779663086, "global_step": 323211, "epoch": 1923} {"train_loss": -12.289985656738281, "global_step": 323212, "epoch": 1923} {"train_loss": -12.460860252380371, "global_step": 323213, "epoch": 1923} {"train_loss": -12.650045394897461, "global_step": 323214, "epoch": 1923} {"train_loss": -12.148061752319336, "global_step": 323215, "epoch": 1923} {"train_loss": -12.45208740234375, "global_step": 323216, "epoch": 1923} {"train_loss": -11.93239974975586, "global_step": 323217, "epoch": 1923} {"train_loss": -12.556278228759766, "global_step": 323218, "epoch": 1923} {"train_loss": -11.756332397460938, "global_step": 323219, "epoch": 1923} {"train_loss": -12.483251571655273, "global_step": 323220, "epoch": 1923} {"train_loss": -12.174947738647461, "global_step": 323221, "epoch": 1923} {"train_loss": -12.201918601989746, "global_step": 323222, "epoch": 1923} {"train_loss": -11.687814712524414, "global_step": 323223, "epoch": 1923} {"train_loss": -12.60944938659668, "global_step": 323224, "epoch": 1923} {"train_loss": -11.82608699798584, "global_step": 323225, "epoch": 1923} {"train_loss": -12.150472640991211, "global_step": 323226, "epoch": 1923} {"train_loss": -12.633087158203125, "global_step": 323227, "epoch": 1923} {"train_loss": -12.366266250610352, "global_step": 323228, "epoch": 1923} {"train_loss": -12.046834945678711, "global_step": 323229, "epoch": 1923} {"train_loss": -12.227090835571289, "global_step": 323230, "epoch": 1923} {"train_loss": -12.002970281101408, "global_step": 323231, "epoch": 1923, "val_loss": 285363.3125} {"train_loss": -12.437479019165039, "global_step": 323232, "epoch": 1924} {"train_loss": -12.538957595825195, "global_step": 323233, "epoch": 1924} {"train_loss": -12.51695442199707, "global_step": 323234, "epoch": 1924} {"train_loss": -12.403952598571777, "global_step": 323235, "epoch": 1924} {"train_loss": -12.559310913085938, "global_step": 323236, "epoch": 1924} {"train_loss": -12.406750679016113, "global_step": 323237, "epoch": 1924} {"train_loss": -12.500492095947266, "global_step": 323238, "epoch": 1924} {"train_loss": -12.132740020751953, "global_step": 323239, "epoch": 1924} {"train_loss": -12.42293930053711, "global_step": 323240, "epoch": 1924} {"train_loss": -12.406108856201172, "global_step": 323241, "epoch": 1924} {"train_loss": -12.43606948852539, "global_step": 323242, "epoch": 1924} {"train_loss": -12.526725769042969, "global_step": 323243, "epoch": 1924} {"train_loss": -12.377334594726562, "global_step": 323244, "epoch": 1924} {"train_loss": -12.35551643371582, "global_step": 323245, "epoch": 1924} {"train_loss": -12.4972562789917, "global_step": 323246, "epoch": 1924} {"train_loss": -12.085572242736816, "global_step": 323247, "epoch": 1924} {"train_loss": -12.154584884643555, "global_step": 323248, "epoch": 1924} {"train_loss": -12.488513946533203, "global_step": 323249, "epoch": 1924} {"train_loss": -12.549540519714355, "global_step": 323250, "epoch": 1924} {"train_loss": -12.197102546691895, "global_step": 323251, "epoch": 1924} {"train_loss": -12.302824974060059, "global_step": 323252, "epoch": 1924} {"train_loss": -12.262863159179688, "global_step": 323253, "epoch": 1924} {"train_loss": -12.320353507995605, "global_step": 323254, "epoch": 1924} {"train_loss": -12.049497604370117, "global_step": 323255, "epoch": 1924} {"train_loss": -11.729328155517578, "global_step": 323256, "epoch": 1924} {"train_loss": -12.515310287475586, "global_step": 323257, "epoch": 1924} {"train_loss": -11.833431243896484, "global_step": 323258, "epoch": 1924} {"train_loss": -11.769880294799805, "global_step": 323259, "epoch": 1924} {"train_loss": -11.634716987609863, "global_step": 323260, "epoch": 1924} {"train_loss": -11.98134994506836, "global_step": 323261, "epoch": 1924} {"train_loss": -12.0213623046875, "global_step": 323262, "epoch": 1924} {"train_loss": -12.029563903808594, "global_step": 323263, "epoch": 1924} {"train_loss": -11.757946968078613, "global_step": 323264, "epoch": 1924} {"train_loss": -11.92885971069336, "global_step": 323265, "epoch": 1924} {"train_loss": -12.378905296325684, "global_step": 323266, "epoch": 1924} {"train_loss": -11.890058517456055, "global_step": 323267, "epoch": 1924} {"train_loss": -11.92959213256836, "global_step": 323268, "epoch": 1924} {"train_loss": -11.911691665649414, "global_step": 323269, "epoch": 1924} {"train_loss": -12.588693618774414, "global_step": 323270, "epoch": 1924} {"train_loss": -11.64163589477539, "global_step": 323271, "epoch": 1924} {"train_loss": -11.706573486328125, "global_step": 323272, "epoch": 1924} {"train_loss": -12.234807968139648, "global_step": 323273, "epoch": 1924} {"train_loss": -11.764518737792969, "global_step": 323274, "epoch": 1924} {"train_loss": -10.636505126953125, "global_step": 323275, "epoch": 1924} {"train_loss": -11.754096031188965, "global_step": 323276, "epoch": 1924} {"train_loss": -11.766244888305664, "global_step": 323277, "epoch": 1924} {"train_loss": -11.26657485961914, "global_step": 323278, "epoch": 1924} {"train_loss": -10.998298645019531, "global_step": 323279, "epoch": 1924} {"train_loss": -11.973883628845215, "global_step": 323280, "epoch": 1924} {"train_loss": -10.7503662109375, "global_step": 323281, "epoch": 1924} {"train_loss": -12.189922332763672, "global_step": 323282, "epoch": 1924} {"train_loss": -11.19746208190918, "global_step": 323283, "epoch": 1924} {"train_loss": -11.661057472229004, "global_step": 323284, "epoch": 1924} {"train_loss": -12.075057983398438, "global_step": 323285, "epoch": 1924} {"train_loss": -12.120588302612305, "global_step": 323286, "epoch": 1924} {"train_loss": -11.975406646728516, "global_step": 323287, "epoch": 1924} {"train_loss": -11.729971885681152, "global_step": 323288, "epoch": 1924} {"train_loss": -11.960126876831055, "global_step": 323289, "epoch": 1924} {"train_loss": -11.64155387878418, "global_step": 323290, "epoch": 1924} {"train_loss": -12.116623878479004, "global_step": 323291, "epoch": 1924} {"train_loss": -11.857243537902832, "global_step": 323292, "epoch": 1924} {"train_loss": -11.837905883789062, "global_step": 323293, "epoch": 1924} {"train_loss": -12.034892082214355, "global_step": 323294, "epoch": 1924} {"train_loss": -11.895559310913086, "global_step": 323295, "epoch": 1924} {"train_loss": -12.362200736999512, "global_step": 323296, "epoch": 1924} {"train_loss": -12.382795333862305, "global_step": 323297, "epoch": 1924} {"train_loss": -12.033395767211914, "global_step": 323298, "epoch": 1924} {"train_loss": -12.167332649230957, "global_step": 323299, "epoch": 1924} {"train_loss": -12.132291793823242, "global_step": 323300, "epoch": 1924} {"train_loss": -12.160754203796387, "global_step": 323301, "epoch": 1924} {"train_loss": -12.064223289489746, "global_step": 323302, "epoch": 1924} {"train_loss": -12.254425048828125, "global_step": 323303, "epoch": 1924} {"train_loss": -11.76524829864502, "global_step": 323304, "epoch": 1924} {"train_loss": -12.092068672180176, "global_step": 323305, "epoch": 1924} {"train_loss": -12.012042045593262, "global_step": 323306, "epoch": 1924} {"train_loss": -11.979738235473633, "global_step": 323307, "epoch": 1924} {"train_loss": -12.128238677978516, "global_step": 323308, "epoch": 1924} {"train_loss": -11.820520401000977, "global_step": 323309, "epoch": 1924} {"train_loss": -11.73556900024414, "global_step": 323310, "epoch": 1924} {"train_loss": -11.96548843383789, "global_step": 323311, "epoch": 1924} {"train_loss": -12.456491470336914, "global_step": 323312, "epoch": 1924} {"train_loss": -12.11052131652832, "global_step": 323313, "epoch": 1924} {"train_loss": -12.118562698364258, "global_step": 323314, "epoch": 1924} {"train_loss": -12.22057819366455, "global_step": 323315, "epoch": 1924} {"train_loss": -11.830738067626953, "global_step": 323316, "epoch": 1924} {"train_loss": -12.32636833190918, "global_step": 323317, "epoch": 1924} {"train_loss": -12.24693489074707, "global_step": 323318, "epoch": 1924} {"train_loss": -12.072141647338867, "global_step": 323319, "epoch": 1924} {"train_loss": -12.264978408813477, "global_step": 323320, "epoch": 1924} {"train_loss": -11.874967575073242, "global_step": 323321, "epoch": 1924} {"train_loss": -12.09388542175293, "global_step": 323322, "epoch": 1924} {"train_loss": -11.907849311828613, "global_step": 323323, "epoch": 1924} {"train_loss": -12.161459922790527, "global_step": 323324, "epoch": 1924} {"train_loss": -11.416970252990723, "global_step": 323325, "epoch": 1924} {"train_loss": -11.981461524963379, "global_step": 323326, "epoch": 1924} {"train_loss": -11.499805450439453, "global_step": 323327, "epoch": 1924} {"train_loss": -10.766637802124023, "global_step": 323328, "epoch": 1924} {"train_loss": -11.653739929199219, "global_step": 323329, "epoch": 1924} {"train_loss": -11.682271003723145, "global_step": 323330, "epoch": 1924} {"train_loss": -11.159344673156738, "global_step": 323331, "epoch": 1924} {"train_loss": -10.765555381774902, "global_step": 323332, "epoch": 1924} {"train_loss": -12.268150329589844, "global_step": 323333, "epoch": 1924} {"train_loss": -10.983129501342773, "global_step": 323334, "epoch": 1924} {"train_loss": -12.035873413085938, "global_step": 323335, "epoch": 1924} {"train_loss": -11.660497665405273, "global_step": 323336, "epoch": 1924} {"train_loss": -11.661910057067871, "global_step": 323337, "epoch": 1924} {"train_loss": -11.680317878723145, "global_step": 323338, "epoch": 1924} {"train_loss": -11.699748992919922, "global_step": 323339, "epoch": 1924} {"train_loss": -11.788363456726074, "global_step": 323340, "epoch": 1924} {"train_loss": -11.977982521057129, "global_step": 323341, "epoch": 1924} {"train_loss": -11.90401840209961, "global_step": 323342, "epoch": 1924} {"train_loss": -11.850122451782227, "global_step": 323343, "epoch": 1924} {"train_loss": -12.184273719787598, "global_step": 323344, "epoch": 1924} {"train_loss": -12.142179489135742, "global_step": 323345, "epoch": 1924} {"train_loss": -11.819666862487793, "global_step": 323346, "epoch": 1924} {"train_loss": -11.886503219604492, "global_step": 323347, "epoch": 1924} {"train_loss": -11.99567985534668, "global_step": 323348, "epoch": 1924} {"train_loss": -12.064104080200195, "global_step": 323349, "epoch": 1924} {"train_loss": -11.995122909545898, "global_step": 323350, "epoch": 1924} {"train_loss": -11.520416259765625, "global_step": 323351, "epoch": 1924} {"train_loss": -12.149128913879395, "global_step": 323352, "epoch": 1924} {"train_loss": -12.128704071044922, "global_step": 323353, "epoch": 1924} {"train_loss": -12.174881935119629, "global_step": 323354, "epoch": 1924} {"train_loss": -11.558359146118164, "global_step": 323355, "epoch": 1924} {"train_loss": -11.747267723083496, "global_step": 323356, "epoch": 1924} {"train_loss": -12.182580947875977, "global_step": 323357, "epoch": 1924} {"train_loss": -11.424457550048828, "global_step": 323358, "epoch": 1924} {"train_loss": -12.308631896972656, "global_step": 323359, "epoch": 1924} {"train_loss": -11.522459983825684, "global_step": 323360, "epoch": 1924} {"train_loss": -12.122482299804688, "global_step": 323361, "epoch": 1924} {"train_loss": -11.508979797363281, "global_step": 323362, "epoch": 1924} {"train_loss": -11.959064483642578, "global_step": 323363, "epoch": 1924} {"train_loss": -11.550305366516113, "global_step": 323364, "epoch": 1924} {"train_loss": -12.257041931152344, "global_step": 323365, "epoch": 1924} {"train_loss": -11.765798568725586, "global_step": 323366, "epoch": 1924} {"train_loss": -11.960691452026367, "global_step": 323367, "epoch": 1924} {"train_loss": -11.938146591186523, "global_step": 323368, "epoch": 1924} {"train_loss": -12.106671333312988, "global_step": 323369, "epoch": 1924} {"train_loss": -11.962825775146484, "global_step": 323370, "epoch": 1924} {"train_loss": -12.205073356628418, "global_step": 323371, "epoch": 1924} {"train_loss": -12.054308891296387, "global_step": 323372, "epoch": 1924} {"train_loss": -12.294309616088867, "global_step": 323373, "epoch": 1924} {"train_loss": -12.36728286743164, "global_step": 323374, "epoch": 1924} {"train_loss": -11.983649253845215, "global_step": 323375, "epoch": 1924} {"train_loss": -12.105905532836914, "global_step": 323376, "epoch": 1924} {"train_loss": -11.970298767089844, "global_step": 323377, "epoch": 1924} {"train_loss": -12.135503768920898, "global_step": 323378, "epoch": 1924} {"train_loss": -12.251493453979492, "global_step": 323379, "epoch": 1924} {"train_loss": -12.174249649047852, "global_step": 323380, "epoch": 1924} {"train_loss": -12.086427688598633, "global_step": 323381, "epoch": 1924} {"train_loss": -12.406462669372559, "global_step": 323382, "epoch": 1924} {"train_loss": -11.927632331848145, "global_step": 323383, "epoch": 1924} {"train_loss": -12.435922622680664, "global_step": 323384, "epoch": 1924} {"train_loss": -11.976343154907227, "global_step": 323385, "epoch": 1924} {"train_loss": -12.18436050415039, "global_step": 323386, "epoch": 1924} {"train_loss": -12.114883422851562, "global_step": 323387, "epoch": 1924} {"train_loss": -12.387447357177734, "global_step": 323388, "epoch": 1924} {"train_loss": -12.09354019165039, "global_step": 323389, "epoch": 1924} {"train_loss": -12.162739753723145, "global_step": 323390, "epoch": 1924} {"train_loss": -12.266807556152344, "global_step": 323391, "epoch": 1924} {"train_loss": -11.996376991271973, "global_step": 323392, "epoch": 1924} {"train_loss": -11.94940185546875, "global_step": 323393, "epoch": 1924} {"train_loss": -12.371766090393066, "global_step": 323394, "epoch": 1924} {"train_loss": -12.057106971740723, "global_step": 323395, "epoch": 1924} {"train_loss": -12.363361358642578, "global_step": 323396, "epoch": 1924} {"train_loss": -12.265755653381348, "global_step": 323397, "epoch": 1924} {"train_loss": -12.416352272033691, "global_step": 323398, "epoch": 1924} {"train_loss": -12.000252536364965, "global_step": 323399, "epoch": 1924, "val_loss": 287127.4375} {"train_loss": -12.359955787658691, "global_step": 323400, "epoch": 1925} {"train_loss": -12.516828536987305, "global_step": 323401, "epoch": 1925} {"train_loss": -12.272849082946777, "global_step": 323402, "epoch": 1925} {"train_loss": -12.327722549438477, "global_step": 323403, "epoch": 1925} {"train_loss": -12.517410278320312, "global_step": 323404, "epoch": 1925} {"train_loss": -12.502012252807617, "global_step": 323405, "epoch": 1925} {"train_loss": -12.483083724975586, "global_step": 323406, "epoch": 1925} {"train_loss": -12.329769134521484, "global_step": 323407, "epoch": 1925} {"train_loss": -12.251522064208984, "global_step": 323408, "epoch": 1925} {"train_loss": -12.410232543945312, "global_step": 323409, "epoch": 1925} {"train_loss": -12.566137313842773, "global_step": 323410, "epoch": 1925} {"train_loss": -12.566786766052246, "global_step": 323411, "epoch": 1925} {"train_loss": -12.450401306152344, "global_step": 323412, "epoch": 1925} {"train_loss": -12.527576446533203, "global_step": 323413, "epoch": 1925} {"train_loss": -12.203134536743164, "global_step": 323414, "epoch": 1925} {"train_loss": -12.182828903198242, "global_step": 323415, "epoch": 1925} {"train_loss": -12.25010871887207, "global_step": 323416, "epoch": 1925} {"train_loss": -12.445261001586914, "global_step": 323417, "epoch": 1925} {"train_loss": -11.733624458312988, "global_step": 323418, "epoch": 1925} {"train_loss": -11.64767074584961, "global_step": 323419, "epoch": 1925} {"train_loss": -12.375603675842285, "global_step": 323420, "epoch": 1925} {"train_loss": -12.333072662353516, "global_step": 323421, "epoch": 1925} {"train_loss": -12.152952194213867, "global_step": 323422, "epoch": 1925} {"train_loss": -12.416604042053223, "global_step": 323423, "epoch": 1925} {"train_loss": -12.586311340332031, "global_step": 323424, "epoch": 1925} {"train_loss": -10.98744010925293, "global_step": 323425, "epoch": 1925} {"train_loss": -11.29222297668457, "global_step": 323426, "epoch": 1925} {"train_loss": -12.769405364990234, "global_step": 323427, "epoch": 1925} {"train_loss": -11.722372055053711, "global_step": 323428, "epoch": 1925} {"train_loss": -10.949029922485352, "global_step": 323429, "epoch": 1925} {"train_loss": -12.124664306640625, "global_step": 323430, "epoch": 1925} {"train_loss": -11.339487075805664, "global_step": 323431, "epoch": 1925} {"train_loss": -11.008109092712402, "global_step": 323432, "epoch": 1925} {"train_loss": -11.590307235717773, "global_step": 323433, "epoch": 1925} {"train_loss": -12.288908958435059, "global_step": 323434, "epoch": 1925} {"train_loss": -11.247154235839844, "global_step": 323435, "epoch": 1925} {"train_loss": -12.084331512451172, "global_step": 323436, "epoch": 1925} {"train_loss": -11.602607727050781, "global_step": 323437, "epoch": 1925} {"train_loss": -11.065900802612305, "global_step": 323438, "epoch": 1925} {"train_loss": -10.64712905883789, "global_step": 323439, "epoch": 1925} {"train_loss": -10.846866607666016, "global_step": 323440, "epoch": 1925} {"train_loss": -10.173225402832031, "global_step": 323441, "epoch": 1925} {"train_loss": -10.958191871643066, "global_step": 323442, "epoch": 1925} {"train_loss": -12.04098892211914, "global_step": 323443, "epoch": 1925} {"train_loss": -10.027164459228516, "global_step": 323444, "epoch": 1925} {"train_loss": -11.849411010742188, "global_step": 323445, "epoch": 1925} {"train_loss": -11.759653091430664, "global_step": 323446, "epoch": 1925} {"train_loss": -11.29296875, "global_step": 323447, "epoch": 1925} {"train_loss": -12.071004867553711, "global_step": 323448, "epoch": 1925} {"train_loss": -12.161191940307617, "global_step": 323449, "epoch": 1925} {"train_loss": -11.84283447265625, "global_step": 323450, "epoch": 1925} {"train_loss": -12.03451156616211, "global_step": 323451, "epoch": 1925} {"train_loss": -11.676801681518555, "global_step": 323452, "epoch": 1925} {"train_loss": -11.548748016357422, "global_step": 323453, "epoch": 1925} {"train_loss": -11.678131103515625, "global_step": 323454, "epoch": 1925} {"train_loss": -11.830669403076172, "global_step": 323455, "epoch": 1925} {"train_loss": -11.875959396362305, "global_step": 323456, "epoch": 1925} {"train_loss": -11.820996284484863, "global_step": 323457, "epoch": 1925} {"train_loss": -11.815884590148926, "global_step": 323458, "epoch": 1925} {"train_loss": -11.789005279541016, "global_step": 323459, "epoch": 1925} {"train_loss": -11.788673400878906, "global_step": 323460, "epoch": 1925} {"train_loss": -11.52755355834961, "global_step": 323461, "epoch": 1925} {"train_loss": -11.922176361083984, "global_step": 323462, "epoch": 1925} {"train_loss": -11.795141220092773, "global_step": 323463, "epoch": 1925} {"train_loss": -11.677094459533691, "global_step": 323464, "epoch": 1925} {"train_loss": -11.78974723815918, "global_step": 323465, "epoch": 1925} {"train_loss": -11.168624877929688, "global_step": 323466, "epoch": 1925} {"train_loss": -12.087472915649414, "global_step": 323467, "epoch": 1925} {"train_loss": -11.731202125549316, "global_step": 323468, "epoch": 1925} {"train_loss": -12.048055648803711, "global_step": 323469, "epoch": 1925} {"train_loss": -12.196678161621094, "global_step": 323470, "epoch": 1925} {"train_loss": -11.761096954345703, "global_step": 323471, "epoch": 1925} {"train_loss": -12.176267623901367, "global_step": 323472, "epoch": 1925} {"train_loss": -11.58344841003418, "global_step": 323473, "epoch": 1925} {"train_loss": -11.713111877441406, "global_step": 323474, "epoch": 1925} {"train_loss": -11.929253578186035, "global_step": 323475, "epoch": 1925} {"train_loss": -11.304579734802246, "global_step": 323476, "epoch": 1925} {"train_loss": -11.805866241455078, "global_step": 323477, "epoch": 1925} {"train_loss": -11.930874824523926, "global_step": 323478, "epoch": 1925} {"train_loss": -11.710906982421875, "global_step": 323479, "epoch": 1925} {"train_loss": -11.98750114440918, "global_step": 323480, "epoch": 1925} {"train_loss": -11.641382217407227, "global_step": 323481, "epoch": 1925} {"train_loss": -11.43380355834961, "global_step": 323482, "epoch": 1925} {"train_loss": -11.77389144897461, "global_step": 323483, "epoch": 1925} {"train_loss": -11.770307540893555, "global_step": 323484, "epoch": 1925} {"train_loss": -11.786211013793945, "global_step": 323485, "epoch": 1925} {"train_loss": -12.00541877746582, "global_step": 323486, "epoch": 1925} {"train_loss": -11.901214599609375, "global_step": 323487, "epoch": 1925} {"train_loss": -11.551223754882812, "global_step": 323488, "epoch": 1925} {"train_loss": -12.097051620483398, "global_step": 323489, "epoch": 1925} {"train_loss": -11.721948623657227, "global_step": 323490, "epoch": 1925} {"train_loss": -11.812042236328125, "global_step": 323491, "epoch": 1925} {"train_loss": -12.173696517944336, "global_step": 323492, "epoch": 1925} {"train_loss": -11.396614074707031, "global_step": 323493, "epoch": 1925} {"train_loss": -11.864571571350098, "global_step": 323494, "epoch": 1925} {"train_loss": -12.266357421875, "global_step": 323495, "epoch": 1925} {"train_loss": -11.848817825317383, "global_step": 323496, "epoch": 1925} {"train_loss": -12.208100318908691, "global_step": 323497, "epoch": 1925} {"train_loss": -11.65922737121582, "global_step": 323498, "epoch": 1925} {"train_loss": -11.677739143371582, "global_step": 323499, "epoch": 1925} {"train_loss": -12.232183456420898, "global_step": 323500, "epoch": 1925} {"train_loss": -11.324719429016113, "global_step": 323501, "epoch": 1925} {"train_loss": -12.284628868103027, "global_step": 323502, "epoch": 1925} {"train_loss": -12.052303314208984, "global_step": 323503, "epoch": 1925} {"train_loss": -11.931953430175781, "global_step": 323504, "epoch": 1925} {"train_loss": -12.191221237182617, "global_step": 323505, "epoch": 1925} {"train_loss": -12.121604919433594, "global_step": 323506, "epoch": 1925} {"train_loss": -12.230241775512695, "global_step": 323507, "epoch": 1925} {"train_loss": -12.387613296508789, "global_step": 323508, "epoch": 1925} {"train_loss": -11.736801147460938, "global_step": 323509, "epoch": 1925} {"train_loss": -12.21596908569336, "global_step": 323510, "epoch": 1925} {"train_loss": -11.833047866821289, "global_step": 323511, "epoch": 1925} {"train_loss": -12.23648452758789, "global_step": 323512, "epoch": 1925} {"train_loss": -11.93706226348877, "global_step": 323513, "epoch": 1925} {"train_loss": -11.934065818786621, "global_step": 323514, "epoch": 1925} {"train_loss": -11.456275939941406, "global_step": 323515, "epoch": 1925} {"train_loss": -10.364133834838867, "global_step": 323516, "epoch": 1925} {"train_loss": -11.690017700195312, "global_step": 323517, "epoch": 1925} {"train_loss": -9.977657318115234, "global_step": 323518, "epoch": 1925} {"train_loss": -11.187700271606445, "global_step": 323519, "epoch": 1925} {"train_loss": -10.756921768188477, "global_step": 323520, "epoch": 1925} {"train_loss": -10.36474609375, "global_step": 323521, "epoch": 1925} {"train_loss": -11.434836387634277, "global_step": 323522, "epoch": 1925} {"train_loss": -10.345542907714844, "global_step": 323523, "epoch": 1925} {"train_loss": -10.382177352905273, "global_step": 323524, "epoch": 1925} {"train_loss": -11.789371490478516, "global_step": 323525, "epoch": 1925} {"train_loss": -10.702705383300781, "global_step": 323526, "epoch": 1925} {"train_loss": -11.611553192138672, "global_step": 323527, "epoch": 1925} {"train_loss": -11.195920944213867, "global_step": 323528, "epoch": 1925} {"train_loss": -11.752010345458984, "global_step": 323529, "epoch": 1925} {"train_loss": -12.139358520507812, "global_step": 323530, "epoch": 1925} {"train_loss": -10.530317306518555, "global_step": 323531, "epoch": 1925} {"train_loss": -11.595584869384766, "global_step": 323532, "epoch": 1925} {"train_loss": -11.601298332214355, "global_step": 323533, "epoch": 1925} {"train_loss": -10.754609107971191, "global_step": 323534, "epoch": 1925} {"train_loss": -11.912172317504883, "global_step": 323535, "epoch": 1925} {"train_loss": -11.082621574401855, "global_step": 323536, "epoch": 1925} {"train_loss": -10.496673583984375, "global_step": 323537, "epoch": 1925} {"train_loss": -10.394599914550781, "global_step": 323538, "epoch": 1925} {"train_loss": -9.820845603942871, "global_step": 323539, "epoch": 1925} {"train_loss": -10.833351135253906, "global_step": 323540, "epoch": 1925} {"train_loss": -10.756372451782227, "global_step": 323541, "epoch": 1925} {"train_loss": -10.320154190063477, "global_step": 323542, "epoch": 1925} {"train_loss": -10.813983917236328, "global_step": 323543, "epoch": 1925} {"train_loss": -10.925450325012207, "global_step": 323544, "epoch": 1925} {"train_loss": -9.866294860839844, "global_step": 323545, "epoch": 1925} {"train_loss": -10.841166496276855, "global_step": 323546, "epoch": 1925} {"train_loss": -9.850757598876953, "global_step": 323547, "epoch": 1925} {"train_loss": -9.220088958740234, "global_step": 323548, "epoch": 1925} {"train_loss": -10.669645309448242, "global_step": 323549, "epoch": 1925} {"train_loss": -9.300464630126953, "global_step": 323550, "epoch": 1925} {"train_loss": -10.61041259765625, "global_step": 323551, "epoch": 1925} {"train_loss": -10.646275520324707, "global_step": 323552, "epoch": 1925} {"train_loss": -11.592988014221191, "global_step": 323553, "epoch": 1925} {"train_loss": -11.349255561828613, "global_step": 323554, "epoch": 1925} {"train_loss": -12.226741790771484, "global_step": 323555, "epoch": 1925} {"train_loss": -11.007444381713867, "global_step": 323556, "epoch": 1925} {"train_loss": -12.03575325012207, "global_step": 323557, "epoch": 1925} {"train_loss": -11.395242691040039, "global_step": 323558, "epoch": 1925} {"train_loss": -11.906085014343262, "global_step": 323559, "epoch": 1925} {"train_loss": -11.491177558898926, "global_step": 323560, "epoch": 1925} {"train_loss": -11.637393951416016, "global_step": 323561, "epoch": 1925} {"train_loss": -11.812339782714844, "global_step": 323562, "epoch": 1925} {"train_loss": -12.021326065063477, "global_step": 323563, "epoch": 1925} {"train_loss": -11.949346542358398, "global_step": 323564, "epoch": 1925} {"train_loss": -11.971953392028809, "global_step": 323565, "epoch": 1925} {"train_loss": -11.949875831604004, "global_step": 323566, "epoch": 1925} {"train_loss": -11.615624944368998, "global_step": 323567, "epoch": 1925, "val_loss": 285190.8125, "train_action_mse_error": 0.46995809674263} {"train_loss": -11.617488861083984, "global_step": 323568, "epoch": 1926} {"train_loss": -11.890717506408691, "global_step": 323569, "epoch": 1926} {"train_loss": -11.921640396118164, "global_step": 323570, "epoch": 1926} {"train_loss": -12.035870552062988, "global_step": 323571, "epoch": 1926} {"train_loss": -12.13868522644043, "global_step": 323572, "epoch": 1926} {"train_loss": -11.952683448791504, "global_step": 323573, "epoch": 1926} {"train_loss": -12.042365074157715, "global_step": 323574, "epoch": 1926} {"train_loss": -11.97420883178711, "global_step": 323575, "epoch": 1926} {"train_loss": -11.958520889282227, "global_step": 323576, "epoch": 1926} {"train_loss": -12.201239585876465, "global_step": 323577, "epoch": 1926} {"train_loss": -12.279216766357422, "global_step": 323578, "epoch": 1926} {"train_loss": -12.19343376159668, "global_step": 323579, "epoch": 1926} {"train_loss": -12.08083724975586, "global_step": 323580, "epoch": 1926} {"train_loss": -12.430242538452148, "global_step": 323581, "epoch": 1926} {"train_loss": -12.218196868896484, "global_step": 323582, "epoch": 1926} {"train_loss": -12.295337677001953, "global_step": 323583, "epoch": 1926} {"train_loss": -12.186769485473633, "global_step": 323584, "epoch": 1926} {"train_loss": -12.285666465759277, "global_step": 323585, "epoch": 1926} {"train_loss": -12.218088150024414, "global_step": 323586, "epoch": 1926} {"train_loss": -12.172513961791992, "global_step": 323587, "epoch": 1926} {"train_loss": -12.124885559082031, "global_step": 323588, "epoch": 1926} {"train_loss": -12.228277206420898, "global_step": 323589, "epoch": 1926} {"train_loss": -12.112401962280273, "global_step": 323590, "epoch": 1926} {"train_loss": -12.275215148925781, "global_step": 323591, "epoch": 1926} {"train_loss": -12.334198951721191, "global_step": 323592, "epoch": 1926} {"train_loss": -12.283271789550781, "global_step": 323593, "epoch": 1926} {"train_loss": -12.459906578063965, "global_step": 323594, "epoch": 1926} {"train_loss": -12.306333541870117, "global_step": 323595, "epoch": 1926} {"train_loss": -12.217997550964355, "global_step": 323596, "epoch": 1926} {"train_loss": -12.345100402832031, "global_step": 323597, "epoch": 1926} {"train_loss": -12.406230926513672, "global_step": 323598, "epoch": 1926} {"train_loss": -12.285921096801758, "global_step": 323599, "epoch": 1926} {"train_loss": -12.474435806274414, "global_step": 323600, "epoch": 1926} {"train_loss": -12.237527847290039, "global_step": 323601, "epoch": 1926} {"train_loss": -12.458314895629883, "global_step": 323602, "epoch": 1926} {"train_loss": -12.21129035949707, "global_step": 323603, "epoch": 1926} {"train_loss": -12.333457946777344, "global_step": 323604, "epoch": 1926} {"train_loss": -12.429131507873535, "global_step": 323605, "epoch": 1926} {"train_loss": -12.164962768554688, "global_step": 323606, "epoch": 1926} {"train_loss": -12.549240112304688, "global_step": 323607, "epoch": 1926} {"train_loss": -12.521503448486328, "global_step": 323608, "epoch": 1926} {"train_loss": -12.614564895629883, "global_step": 323609, "epoch": 1926} {"train_loss": -12.671772003173828, "global_step": 323610, "epoch": 1926} {"train_loss": -12.488714218139648, "global_step": 323611, "epoch": 1926} {"train_loss": -12.36859130859375, "global_step": 323612, "epoch": 1926} {"train_loss": -12.667818069458008, "global_step": 323613, "epoch": 1926} {"train_loss": -12.616813659667969, "global_step": 323614, "epoch": 1926} {"train_loss": -12.427468299865723, "global_step": 323615, "epoch": 1926} {"train_loss": -12.349950790405273, "global_step": 323616, "epoch": 1926} {"train_loss": -12.44883918762207, "global_step": 323617, "epoch": 1926} {"train_loss": -12.421684265136719, "global_step": 323618, "epoch": 1926} {"train_loss": -12.441417694091797, "global_step": 323619, "epoch": 1926} {"train_loss": -12.530826568603516, "global_step": 323620, "epoch": 1926} {"train_loss": -12.254302978515625, "global_step": 323621, "epoch": 1926} {"train_loss": -12.294845581054688, "global_step": 323622, "epoch": 1926} {"train_loss": -12.182880401611328, "global_step": 323623, "epoch": 1926} {"train_loss": -12.712516784667969, "global_step": 323624, "epoch": 1926} {"train_loss": -12.519535064697266, "global_step": 323625, "epoch": 1926} {"train_loss": -12.401052474975586, "global_step": 323626, "epoch": 1926} {"train_loss": -12.524852752685547, "global_step": 323627, "epoch": 1926} {"train_loss": -12.452987670898438, "global_step": 323628, "epoch": 1926} {"train_loss": -12.194939613342285, "global_step": 323629, "epoch": 1926} {"train_loss": -12.002798080444336, "global_step": 323630, "epoch": 1926} {"train_loss": -12.457832336425781, "global_step": 323631, "epoch": 1926} {"train_loss": -12.268716812133789, "global_step": 323632, "epoch": 1926} {"train_loss": -11.83272933959961, "global_step": 323633, "epoch": 1926} {"train_loss": -12.492780685424805, "global_step": 323634, "epoch": 1926} {"train_loss": -12.183923721313477, "global_step": 323635, "epoch": 1926} {"train_loss": -12.349031448364258, "global_step": 323636, "epoch": 1926} {"train_loss": -12.173330307006836, "global_step": 323637, "epoch": 1926} {"train_loss": -12.647292137145996, "global_step": 323638, "epoch": 1926} {"train_loss": -11.882625579833984, "global_step": 323639, "epoch": 1926} {"train_loss": -12.34775447845459, "global_step": 323640, "epoch": 1926} {"train_loss": -12.022464752197266, "global_step": 323641, "epoch": 1926} {"train_loss": -12.392051696777344, "global_step": 323642, "epoch": 1926} {"train_loss": -12.13155746459961, "global_step": 323643, "epoch": 1926} {"train_loss": -11.727010726928711, "global_step": 323644, "epoch": 1926} {"train_loss": -12.003881454467773, "global_step": 323645, "epoch": 1926} {"train_loss": -12.037571907043457, "global_step": 323646, "epoch": 1926} {"train_loss": -11.800165176391602, "global_step": 323647, "epoch": 1926} {"train_loss": -11.546005249023438, "global_step": 323648, "epoch": 1926} {"train_loss": -11.136316299438477, "global_step": 323649, "epoch": 1926} {"train_loss": -10.602206230163574, "global_step": 323650, "epoch": 1926} {"train_loss": -11.134225845336914, "global_step": 323651, "epoch": 1926} {"train_loss": -11.296384811401367, "global_step": 323652, "epoch": 1926} {"train_loss": -11.20383358001709, "global_step": 323653, "epoch": 1926} {"train_loss": -11.416543006896973, "global_step": 323654, "epoch": 1926} {"train_loss": -10.767839431762695, "global_step": 323655, "epoch": 1926} {"train_loss": -12.103304862976074, "global_step": 323656, "epoch": 1926} {"train_loss": -11.234169006347656, "global_step": 323657, "epoch": 1926} {"train_loss": -10.421937942504883, "global_step": 323658, "epoch": 1926} {"train_loss": -9.210994720458984, "global_step": 323659, "epoch": 1926} {"train_loss": -8.643388748168945, "global_step": 323660, "epoch": 1926} {"train_loss": -9.755577087402344, "global_step": 323661, "epoch": 1926} {"train_loss": -9.140070915222168, "global_step": 323662, "epoch": 1926} {"train_loss": -7.352293968200684, "global_step": 323663, "epoch": 1926} {"train_loss": -8.484090805053711, "global_step": 323664, "epoch": 1926} {"train_loss": -9.196039199829102, "global_step": 323665, "epoch": 1926} {"train_loss": -10.405895233154297, "global_step": 323666, "epoch": 1926} {"train_loss": -8.615062713623047, "global_step": 323667, "epoch": 1926} {"train_loss": -8.558021545410156, "global_step": 323668, "epoch": 1926} {"train_loss": -9.35498332977295, "global_step": 323669, "epoch": 1926} {"train_loss": -10.36561393737793, "global_step": 323670, "epoch": 1926} {"train_loss": -9.590295791625977, "global_step": 323671, "epoch": 1926} {"train_loss": -10.304336547851562, "global_step": 323672, "epoch": 1926} {"train_loss": -8.32413387298584, "global_step": 323673, "epoch": 1926} {"train_loss": -9.775687217712402, "global_step": 323674, "epoch": 1926} {"train_loss": -8.958131790161133, "global_step": 323675, "epoch": 1926} {"train_loss": -8.346302032470703, "global_step": 323676, "epoch": 1926} {"train_loss": -8.885519027709961, "global_step": 323677, "epoch": 1926} {"train_loss": -8.508695602416992, "global_step": 323678, "epoch": 1926} {"train_loss": -9.4280366897583, "global_step": 323679, "epoch": 1926} {"train_loss": -8.8336181640625, "global_step": 323680, "epoch": 1926} {"train_loss": -9.816690444946289, "global_step": 323681, "epoch": 1926} {"train_loss": -9.20627212524414, "global_step": 323682, "epoch": 1926} {"train_loss": -9.906715393066406, "global_step": 323683, "epoch": 1926} {"train_loss": -9.806679725646973, "global_step": 323684, "epoch": 1926} {"train_loss": -9.056079864501953, "global_step": 323685, "epoch": 1926} {"train_loss": -10.441965103149414, "global_step": 323686, "epoch": 1926} {"train_loss": -10.1627197265625, "global_step": 323687, "epoch": 1926} {"train_loss": -9.292613983154297, "global_step": 323688, "epoch": 1926} {"train_loss": -11.554241180419922, "global_step": 323689, "epoch": 1926} {"train_loss": -9.976736068725586, "global_step": 323690, "epoch": 1926} {"train_loss": -11.031123161315918, "global_step": 323691, "epoch": 1926} {"train_loss": -11.269150733947754, "global_step": 323692, "epoch": 1926} {"train_loss": -10.28510570526123, "global_step": 323693, "epoch": 1926} {"train_loss": -11.208261489868164, "global_step": 323694, "epoch": 1926} {"train_loss": -11.178610801696777, "global_step": 323695, "epoch": 1926} {"train_loss": -10.732465744018555, "global_step": 323696, "epoch": 1926} {"train_loss": -11.48757553100586, "global_step": 323697, "epoch": 1926} {"train_loss": -11.227802276611328, "global_step": 323698, "epoch": 1926} {"train_loss": -11.264747619628906, "global_step": 323699, "epoch": 1926} {"train_loss": -11.69144344329834, "global_step": 323700, "epoch": 1926} {"train_loss": -11.385519027709961, "global_step": 323701, "epoch": 1926} {"train_loss": -11.408187866210938, "global_step": 323702, "epoch": 1926} {"train_loss": -11.50967788696289, "global_step": 323703, "epoch": 1926} {"train_loss": -11.148571014404297, "global_step": 323704, "epoch": 1926} {"train_loss": -11.23225212097168, "global_step": 323705, "epoch": 1926} {"train_loss": -11.74269962310791, "global_step": 323706, "epoch": 1926} {"train_loss": -11.409944534301758, "global_step": 323707, "epoch": 1926} {"train_loss": -11.835334777832031, "global_step": 323708, "epoch": 1926} {"train_loss": -11.905900955200195, "global_step": 323709, "epoch": 1926} {"train_loss": -11.65729808807373, "global_step": 323710, "epoch": 1926} {"train_loss": -11.756529808044434, "global_step": 323711, "epoch": 1926} {"train_loss": -11.662031173706055, "global_step": 323712, "epoch": 1926} {"train_loss": -11.763734817504883, "global_step": 323713, "epoch": 1926} {"train_loss": -11.961252212524414, "global_step": 323714, "epoch": 1926} {"train_loss": -11.698708534240723, "global_step": 323715, "epoch": 1926} {"train_loss": -11.877166748046875, "global_step": 323716, "epoch": 1926} {"train_loss": -11.803804397583008, "global_step": 323717, "epoch": 1926} {"train_loss": -11.636850357055664, "global_step": 323718, "epoch": 1926} {"train_loss": -11.952396392822266, "global_step": 323719, "epoch": 1926} {"train_loss": -11.815568923950195, "global_step": 323720, "epoch": 1926} {"train_loss": -11.89676284790039, "global_step": 323721, "epoch": 1926} {"train_loss": -11.782188415527344, "global_step": 323722, "epoch": 1926} {"train_loss": -11.941489219665527, "global_step": 323723, "epoch": 1926} {"train_loss": -11.847709655761719, "global_step": 323724, "epoch": 1926} {"train_loss": -11.761680603027344, "global_step": 323725, "epoch": 1926} {"train_loss": -11.873453140258789, "global_step": 323726, "epoch": 1926} {"train_loss": -11.89647388458252, "global_step": 323727, "epoch": 1926} {"train_loss": -11.828454971313477, "global_step": 323728, "epoch": 1926} {"train_loss": -12.07310676574707, "global_step": 323729, "epoch": 1926} {"train_loss": -12.037237167358398, "global_step": 323730, "epoch": 1926} {"train_loss": -11.991580963134766, "global_step": 323731, "epoch": 1926} {"train_loss": -12.080278396606445, "global_step": 323732, "epoch": 1926} {"train_loss": -11.878114700317383, "global_step": 323733, "epoch": 1926} {"train_loss": -11.995101928710938, "global_step": 323734, "epoch": 1926} {"train_loss": -11.46877372264862, "global_step": 323735, "epoch": 1926, "val_loss": 278387.6875} {"train_loss": -12.053227424621582, "global_step": 323736, "epoch": 1927} {"train_loss": -12.006965637207031, "global_step": 323737, "epoch": 1927} {"train_loss": -11.864208221435547, "global_step": 323738, "epoch": 1927} {"train_loss": -12.136585235595703, "global_step": 323739, "epoch": 1927} {"train_loss": -12.139591217041016, "global_step": 323740, "epoch": 1927} {"train_loss": -12.034811019897461, "global_step": 323741, "epoch": 1927} {"train_loss": -12.215755462646484, "global_step": 323742, "epoch": 1927} {"train_loss": -12.273880004882812, "global_step": 323743, "epoch": 1927} {"train_loss": -12.161243438720703, "global_step": 323744, "epoch": 1927} {"train_loss": -12.290452003479004, "global_step": 323745, "epoch": 1927} {"train_loss": -12.271463394165039, "global_step": 323746, "epoch": 1927} {"train_loss": -12.352821350097656, "global_step": 323747, "epoch": 1927} {"train_loss": -12.29407024383545, "global_step": 323748, "epoch": 1927} {"train_loss": -12.256686210632324, "global_step": 323749, "epoch": 1927} {"train_loss": -12.162988662719727, "global_step": 323750, "epoch": 1927} {"train_loss": -12.306279182434082, "global_step": 323751, "epoch": 1927} {"train_loss": -12.276427268981934, "global_step": 323752, "epoch": 1927} {"train_loss": -12.333633422851562, "global_step": 323753, "epoch": 1927} {"train_loss": -12.327268600463867, "global_step": 323754, "epoch": 1927} {"train_loss": -12.312812805175781, "global_step": 323755, "epoch": 1927} {"train_loss": -12.356796264648438, "global_step": 323756, "epoch": 1927} {"train_loss": -12.468013763427734, "global_step": 323757, "epoch": 1927} {"train_loss": -12.247138977050781, "global_step": 323758, "epoch": 1927} {"train_loss": -12.412734985351562, "global_step": 323759, "epoch": 1927} {"train_loss": -12.432113647460938, "global_step": 323760, "epoch": 1927} {"train_loss": -12.390751838684082, "global_step": 323761, "epoch": 1927} {"train_loss": -12.468311309814453, "global_step": 323762, "epoch": 1927} {"train_loss": -12.32414722442627, "global_step": 323763, "epoch": 1927} {"train_loss": -12.399439811706543, "global_step": 323764, "epoch": 1927} {"train_loss": -12.286239624023438, "global_step": 323765, "epoch": 1927} {"train_loss": -12.309240341186523, "global_step": 323766, "epoch": 1927} {"train_loss": -12.593427658081055, "global_step": 323767, "epoch": 1927} {"train_loss": -12.536510467529297, "global_step": 323768, "epoch": 1927} {"train_loss": -12.33802604675293, "global_step": 323769, "epoch": 1927} {"train_loss": -12.350688934326172, "global_step": 323770, "epoch": 1927} {"train_loss": -12.388927459716797, "global_step": 323771, "epoch": 1927} {"train_loss": -12.314857482910156, "global_step": 323772, "epoch": 1927} {"train_loss": -12.557411193847656, "global_step": 323773, "epoch": 1927} {"train_loss": -12.459123611450195, "global_step": 323774, "epoch": 1927} {"train_loss": -12.469024658203125, "global_step": 323775, "epoch": 1927} {"train_loss": -12.40852165222168, "global_step": 323776, "epoch": 1927} {"train_loss": -12.42326545715332, "global_step": 323777, "epoch": 1927} {"train_loss": -12.537429809570312, "global_step": 323778, "epoch": 1927} {"train_loss": -12.408323287963867, "global_step": 323779, "epoch": 1927} {"train_loss": -12.443876266479492, "global_step": 323780, "epoch": 1927} {"train_loss": -12.584028244018555, "global_step": 323781, "epoch": 1927} {"train_loss": -12.650049209594727, "global_step": 323782, "epoch": 1927} {"train_loss": -12.433764457702637, "global_step": 323783, "epoch": 1927} {"train_loss": -12.776805877685547, "global_step": 323784, "epoch": 1927} {"train_loss": -12.243474960327148, "global_step": 323785, "epoch": 1927} {"train_loss": -12.634735107421875, "global_step": 323786, "epoch": 1927} {"train_loss": -12.518121719360352, "global_step": 323787, "epoch": 1927} {"train_loss": -12.435508728027344, "global_step": 323788, "epoch": 1927} {"train_loss": -12.195220947265625, "global_step": 323789, "epoch": 1927} {"train_loss": -12.30597972869873, "global_step": 323790, "epoch": 1927} {"train_loss": -12.666450500488281, "global_step": 323791, "epoch": 1927} {"train_loss": -12.53422737121582, "global_step": 323792, "epoch": 1927} {"train_loss": -12.5499906539917, "global_step": 323793, "epoch": 1927} {"train_loss": -12.285503387451172, "global_step": 323794, "epoch": 1927} {"train_loss": -12.503667831420898, "global_step": 323795, "epoch": 1927} {"train_loss": -12.585714340209961, "global_step": 323796, "epoch": 1927} {"train_loss": -12.70730209350586, "global_step": 323797, "epoch": 1927} {"train_loss": -12.417195320129395, "global_step": 323798, "epoch": 1927} {"train_loss": -12.460306167602539, "global_step": 323799, "epoch": 1927} {"train_loss": -12.472972869873047, "global_step": 323800, "epoch": 1927} {"train_loss": -12.36445426940918, "global_step": 323801, "epoch": 1927} {"train_loss": -12.662912368774414, "global_step": 323802, "epoch": 1927} {"train_loss": -12.205423355102539, "global_step": 323803, "epoch": 1927} {"train_loss": -12.268821716308594, "global_step": 323804, "epoch": 1927} {"train_loss": -12.284244537353516, "global_step": 323805, "epoch": 1927} {"train_loss": -12.185508728027344, "global_step": 323806, "epoch": 1927} {"train_loss": -12.065221786499023, "global_step": 323807, "epoch": 1927} {"train_loss": -12.157968521118164, "global_step": 323808, "epoch": 1927} {"train_loss": -11.976760864257812, "global_step": 323809, "epoch": 1927} {"train_loss": -12.271492958068848, "global_step": 323810, "epoch": 1927} {"train_loss": -12.433927536010742, "global_step": 323811, "epoch": 1927} {"train_loss": -11.816827774047852, "global_step": 323812, "epoch": 1927} {"train_loss": -12.311594009399414, "global_step": 323813, "epoch": 1927} {"train_loss": -11.914796829223633, "global_step": 323814, "epoch": 1927} {"train_loss": -12.215746879577637, "global_step": 323815, "epoch": 1927} {"train_loss": -11.840242385864258, "global_step": 323816, "epoch": 1927} {"train_loss": -12.609040260314941, "global_step": 323817, "epoch": 1927} {"train_loss": -11.614166259765625, "global_step": 323818, "epoch": 1927} {"train_loss": -12.145605087280273, "global_step": 323819, "epoch": 1927} {"train_loss": -12.017629623413086, "global_step": 323820, "epoch": 1927} {"train_loss": -12.15077018737793, "global_step": 323821, "epoch": 1927} {"train_loss": -11.830293655395508, "global_step": 323822, "epoch": 1927} {"train_loss": -11.694320678710938, "global_step": 323823, "epoch": 1927} {"train_loss": -11.941771507263184, "global_step": 323824, "epoch": 1927} {"train_loss": -11.025190353393555, "global_step": 323825, "epoch": 1927} {"train_loss": -11.518081665039062, "global_step": 323826, "epoch": 1927} {"train_loss": -10.199607849121094, "global_step": 323827, "epoch": 1927} {"train_loss": -12.060219764709473, "global_step": 323828, "epoch": 1927} {"train_loss": -9.87663745880127, "global_step": 323829, "epoch": 1927} {"train_loss": -11.558464050292969, "global_step": 323830, "epoch": 1927} {"train_loss": -10.515493392944336, "global_step": 323831, "epoch": 1927} {"train_loss": -10.974482536315918, "global_step": 323832, "epoch": 1927} {"train_loss": -10.215387344360352, "global_step": 323833, "epoch": 1927} {"train_loss": -11.413665771484375, "global_step": 323834, "epoch": 1927} {"train_loss": -9.985858917236328, "global_step": 323835, "epoch": 1927} {"train_loss": -11.267251968383789, "global_step": 323836, "epoch": 1927} {"train_loss": -9.817684173583984, "global_step": 323837, "epoch": 1927} {"train_loss": -11.15836238861084, "global_step": 323838, "epoch": 1927} {"train_loss": -10.119384765625, "global_step": 323839, "epoch": 1927} {"train_loss": -9.602998733520508, "global_step": 323840, "epoch": 1927} {"train_loss": -9.200323104858398, "global_step": 323841, "epoch": 1927} {"train_loss": -8.564552307128906, "global_step": 323842, "epoch": 1927} {"train_loss": -10.471292495727539, "global_step": 323843, "epoch": 1927} {"train_loss": -9.325836181640625, "global_step": 323844, "epoch": 1927} {"train_loss": -10.70997428894043, "global_step": 323845, "epoch": 1927} {"train_loss": -9.040252685546875, "global_step": 323846, "epoch": 1927} {"train_loss": -9.746808052062988, "global_step": 323847, "epoch": 1927} {"train_loss": -9.164213180541992, "global_step": 323848, "epoch": 1927} {"train_loss": -10.35877799987793, "global_step": 323849, "epoch": 1927} {"train_loss": -9.97839069366455, "global_step": 323850, "epoch": 1927} {"train_loss": -10.809378623962402, "global_step": 323851, "epoch": 1927} {"train_loss": -10.670523643493652, "global_step": 323852, "epoch": 1927} {"train_loss": -10.38664436340332, "global_step": 323853, "epoch": 1927} {"train_loss": -10.714010238647461, "global_step": 323854, "epoch": 1927} {"train_loss": -10.152667999267578, "global_step": 323855, "epoch": 1927} {"train_loss": -11.068105697631836, "global_step": 323856, "epoch": 1927} {"train_loss": -10.786773681640625, "global_step": 323857, "epoch": 1927} {"train_loss": -10.850335121154785, "global_step": 323858, "epoch": 1927} {"train_loss": -10.4957275390625, "global_step": 323859, "epoch": 1927} {"train_loss": -10.91472053527832, "global_step": 323860, "epoch": 1927} {"train_loss": -9.774435997009277, "global_step": 323861, "epoch": 1927} {"train_loss": -11.113919258117676, "global_step": 323862, "epoch": 1927} {"train_loss": -10.198009490966797, "global_step": 323863, "epoch": 1927} {"train_loss": -11.027322769165039, "global_step": 323864, "epoch": 1927} {"train_loss": -10.759176254272461, "global_step": 323865, "epoch": 1927} {"train_loss": -10.864014625549316, "global_step": 323866, "epoch": 1927} {"train_loss": -11.200799942016602, "global_step": 323867, "epoch": 1927} {"train_loss": -10.436290740966797, "global_step": 323868, "epoch": 1927} {"train_loss": -10.804439544677734, "global_step": 323869, "epoch": 1927} {"train_loss": -11.419482231140137, "global_step": 323870, "epoch": 1927} {"train_loss": -10.818647384643555, "global_step": 323871, "epoch": 1927} {"train_loss": -11.319035530090332, "global_step": 323872, "epoch": 1927} {"train_loss": -11.381031036376953, "global_step": 323873, "epoch": 1927} {"train_loss": -11.183082580566406, "global_step": 323874, "epoch": 1927} {"train_loss": -11.506912231445312, "global_step": 323875, "epoch": 1927} {"train_loss": -11.29382610321045, "global_step": 323876, "epoch": 1927} {"train_loss": -11.588981628417969, "global_step": 323877, "epoch": 1927} {"train_loss": -11.565903663635254, "global_step": 323878, "epoch": 1927} {"train_loss": -11.623056411743164, "global_step": 323879, "epoch": 1927} {"train_loss": -11.617137908935547, "global_step": 323880, "epoch": 1927} {"train_loss": -11.848470687866211, "global_step": 323881, "epoch": 1927} {"train_loss": -11.553126335144043, "global_step": 323882, "epoch": 1927} {"train_loss": -11.75820541381836, "global_step": 323883, "epoch": 1927} {"train_loss": -11.668388366699219, "global_step": 323884, "epoch": 1927} {"train_loss": -11.730813980102539, "global_step": 323885, "epoch": 1927} {"train_loss": -11.716004371643066, "global_step": 323886, "epoch": 1927} {"train_loss": -11.743184089660645, "global_step": 323887, "epoch": 1927} {"train_loss": -11.996063232421875, "global_step": 323888, "epoch": 1927} {"train_loss": -11.951518058776855, "global_step": 323889, "epoch": 1927} {"train_loss": -11.757186889648438, "global_step": 323890, "epoch": 1927} {"train_loss": -11.687772750854492, "global_step": 323891, "epoch": 1927} {"train_loss": -11.853411674499512, "global_step": 323892, "epoch": 1927} {"train_loss": -11.974366188049316, "global_step": 323893, "epoch": 1927} {"train_loss": -11.733246803283691, "global_step": 323894, "epoch": 1927} {"train_loss": -11.756641387939453, "global_step": 323895, "epoch": 1927} {"train_loss": -12.090498924255371, "global_step": 323896, "epoch": 1927} {"train_loss": -11.939205169677734, "global_step": 323897, "epoch": 1927} {"train_loss": -11.975971221923828, "global_step": 323898, "epoch": 1927} {"train_loss": -11.976820945739746, "global_step": 323899, "epoch": 1927} {"train_loss": -11.940738677978516, "global_step": 323900, "epoch": 1927} {"train_loss": -11.95793628692627, "global_step": 323901, "epoch": 1927} {"train_loss": -11.811848640441895, "global_step": 323902, "epoch": 1927} {"train_loss": -11.690773975281488, "global_step": 323903, "epoch": 1927, "val_loss": 281812.0} {"train_loss": -12.165182113647461, "global_step": 323904, "epoch": 1928} {"train_loss": -12.094825744628906, "global_step": 323905, "epoch": 1928} {"train_loss": -11.899312973022461, "global_step": 323906, "epoch": 1928} {"train_loss": -12.343708038330078, "global_step": 323907, "epoch": 1928} {"train_loss": -11.995443344116211, "global_step": 323908, "epoch": 1928} {"train_loss": -12.039416313171387, "global_step": 323909, "epoch": 1928} {"train_loss": -12.013466835021973, "global_step": 323910, "epoch": 1928} {"train_loss": -12.242064476013184, "global_step": 323911, "epoch": 1928} {"train_loss": -11.995440483093262, "global_step": 323912, "epoch": 1928} {"train_loss": -12.291999816894531, "global_step": 323913, "epoch": 1928} {"train_loss": -12.059281349182129, "global_step": 323914, "epoch": 1928} {"train_loss": -12.41644287109375, "global_step": 323915, "epoch": 1928} {"train_loss": -12.181110382080078, "global_step": 323916, "epoch": 1928} {"train_loss": -11.936466217041016, "global_step": 323917, "epoch": 1928} {"train_loss": -12.110980987548828, "global_step": 323918, "epoch": 1928} {"train_loss": -12.126018524169922, "global_step": 323919, "epoch": 1928} {"train_loss": -12.210853576660156, "global_step": 323920, "epoch": 1928} {"train_loss": -12.209293365478516, "global_step": 323921, "epoch": 1928} {"train_loss": -12.387407302856445, "global_step": 323922, "epoch": 1928} {"train_loss": -12.10500717163086, "global_step": 323923, "epoch": 1928} {"train_loss": -12.219459533691406, "global_step": 323924, "epoch": 1928} {"train_loss": -12.223928451538086, "global_step": 323925, "epoch": 1928} {"train_loss": -12.360807418823242, "global_step": 323926, "epoch": 1928} {"train_loss": -12.077998161315918, "global_step": 323927, "epoch": 1928} {"train_loss": -12.388286590576172, "global_step": 323928, "epoch": 1928} {"train_loss": -12.261787414550781, "global_step": 323929, "epoch": 1928} {"train_loss": -12.460795402526855, "global_step": 323930, "epoch": 1928} {"train_loss": -12.206911087036133, "global_step": 323931, "epoch": 1928} {"train_loss": -12.275272369384766, "global_step": 323932, "epoch": 1928} {"train_loss": -12.332218170166016, "global_step": 323933, "epoch": 1928} {"train_loss": -12.280824661254883, "global_step": 323934, "epoch": 1928} {"train_loss": -12.53140926361084, "global_step": 323935, "epoch": 1928} {"train_loss": -12.205484390258789, "global_step": 323936, "epoch": 1928} {"train_loss": -12.569690704345703, "global_step": 323937, "epoch": 1928} {"train_loss": -12.20349407196045, "global_step": 323938, "epoch": 1928} {"train_loss": -12.251168251037598, "global_step": 323939, "epoch": 1928} {"train_loss": -12.296875, "global_step": 323940, "epoch": 1928} {"train_loss": -12.193161010742188, "global_step": 323941, "epoch": 1928} {"train_loss": -12.452762603759766, "global_step": 323942, "epoch": 1928} {"train_loss": -11.952760696411133, "global_step": 323943, "epoch": 1928} {"train_loss": -12.396987915039062, "global_step": 323944, "epoch": 1928} {"train_loss": -12.412120819091797, "global_step": 323945, "epoch": 1928} {"train_loss": -12.314172744750977, "global_step": 323946, "epoch": 1928} {"train_loss": -12.493093490600586, "global_step": 323947, "epoch": 1928} {"train_loss": -12.206256866455078, "global_step": 323948, "epoch": 1928} {"train_loss": -12.386554718017578, "global_step": 323949, "epoch": 1928} {"train_loss": -12.488295555114746, "global_step": 323950, "epoch": 1928} {"train_loss": -12.3694429397583, "global_step": 323951, "epoch": 1928} {"train_loss": -12.513492584228516, "global_step": 323952, "epoch": 1928} {"train_loss": -12.530950546264648, "global_step": 323953, "epoch": 1928} {"train_loss": -12.552618026733398, "global_step": 323954, "epoch": 1928} {"train_loss": -12.5773286819458, "global_step": 323955, "epoch": 1928} {"train_loss": -12.266097068786621, "global_step": 323956, "epoch": 1928} {"train_loss": -12.451066970825195, "global_step": 323957, "epoch": 1928} {"train_loss": -12.46047306060791, "global_step": 323958, "epoch": 1928} {"train_loss": -12.167413711547852, "global_step": 323959, "epoch": 1928} {"train_loss": -12.153684616088867, "global_step": 323960, "epoch": 1928} {"train_loss": -12.335148811340332, "global_step": 323961, "epoch": 1928} {"train_loss": -12.160035133361816, "global_step": 323962, "epoch": 1928} {"train_loss": -11.943658828735352, "global_step": 323963, "epoch": 1928} {"train_loss": -12.149612426757812, "global_step": 323964, "epoch": 1928} {"train_loss": -12.201156616210938, "global_step": 323965, "epoch": 1928} {"train_loss": -11.92514419555664, "global_step": 323966, "epoch": 1928} {"train_loss": -12.22413444519043, "global_step": 323967, "epoch": 1928} {"train_loss": -12.339900970458984, "global_step": 323968, "epoch": 1928} {"train_loss": -11.832338333129883, "global_step": 323969, "epoch": 1928} {"train_loss": -11.918561935424805, "global_step": 323970, "epoch": 1928} {"train_loss": -12.371503829956055, "global_step": 323971, "epoch": 1928} {"train_loss": -12.099649429321289, "global_step": 323972, "epoch": 1928} {"train_loss": -11.970410346984863, "global_step": 323973, "epoch": 1928} {"train_loss": -12.199840545654297, "global_step": 323974, "epoch": 1928} {"train_loss": -12.224231719970703, "global_step": 323975, "epoch": 1928} {"train_loss": -12.191588401794434, "global_step": 323976, "epoch": 1928} {"train_loss": -11.976969718933105, "global_step": 323977, "epoch": 1928} {"train_loss": -12.210357666015625, "global_step": 323978, "epoch": 1928} {"train_loss": -11.94384765625, "global_step": 323979, "epoch": 1928} {"train_loss": -11.885059356689453, "global_step": 323980, "epoch": 1928} {"train_loss": -12.30765151977539, "global_step": 323981, "epoch": 1928} {"train_loss": -12.466869354248047, "global_step": 323982, "epoch": 1928} {"train_loss": -12.109318733215332, "global_step": 323983, "epoch": 1928} {"train_loss": -11.7615327835083, "global_step": 323984, "epoch": 1928} {"train_loss": -11.578962326049805, "global_step": 323985, "epoch": 1928} {"train_loss": -11.923920631408691, "global_step": 323986, "epoch": 1928} {"train_loss": -12.048707008361816, "global_step": 323987, "epoch": 1928} {"train_loss": -12.171991348266602, "global_step": 323988, "epoch": 1928} {"train_loss": -12.114280700683594, "global_step": 323989, "epoch": 1928} {"train_loss": -12.267170906066895, "global_step": 323990, "epoch": 1928} {"train_loss": -12.099685668945312, "global_step": 323991, "epoch": 1928} {"train_loss": -12.000276565551758, "global_step": 323992, "epoch": 1928} {"train_loss": -12.309610366821289, "global_step": 323993, "epoch": 1928} {"train_loss": -12.49687385559082, "global_step": 323994, "epoch": 1928} {"train_loss": -11.748371124267578, "global_step": 323995, "epoch": 1928} {"train_loss": -12.059309959411621, "global_step": 323996, "epoch": 1928} {"train_loss": -11.934120178222656, "global_step": 323997, "epoch": 1928} {"train_loss": -12.659295082092285, "global_step": 323998, "epoch": 1928} {"train_loss": -11.948009490966797, "global_step": 323999, "epoch": 1928} {"train_loss": -12.007097244262695, "global_step": 324000, "epoch": 1928} {"train_loss": -12.155513763427734, "global_step": 324001, "epoch": 1928} {"train_loss": -11.976128578186035, "global_step": 324002, "epoch": 1928} {"train_loss": -12.222200393676758, "global_step": 324003, "epoch": 1928} {"train_loss": -12.234269142150879, "global_step": 324004, "epoch": 1928} {"train_loss": -12.11941146850586, "global_step": 324005, "epoch": 1928} {"train_loss": -12.45608901977539, "global_step": 324006, "epoch": 1928} {"train_loss": -11.907242774963379, "global_step": 324007, "epoch": 1928} {"train_loss": -11.436351776123047, "global_step": 324008, "epoch": 1928} {"train_loss": -11.910188674926758, "global_step": 324009, "epoch": 1928} {"train_loss": -11.732807159423828, "global_step": 324010, "epoch": 1928} {"train_loss": -10.903260231018066, "global_step": 324011, "epoch": 1928} {"train_loss": -11.057266235351562, "global_step": 324012, "epoch": 1928} {"train_loss": -10.29196834564209, "global_step": 324013, "epoch": 1928} {"train_loss": -11.459235191345215, "global_step": 324014, "epoch": 1928} {"train_loss": -9.817386627197266, "global_step": 324015, "epoch": 1928} {"train_loss": -12.053211212158203, "global_step": 324016, "epoch": 1928} {"train_loss": -11.0762357711792, "global_step": 324017, "epoch": 1928} {"train_loss": -10.658863067626953, "global_step": 324018, "epoch": 1928} {"train_loss": -10.67090129852295, "global_step": 324019, "epoch": 1928} {"train_loss": -10.997648239135742, "global_step": 324020, "epoch": 1928} {"train_loss": -11.226494789123535, "global_step": 324021, "epoch": 1928} {"train_loss": -10.562973022460938, "global_step": 324022, "epoch": 1928} {"train_loss": -11.346444129943848, "global_step": 324023, "epoch": 1928} {"train_loss": -10.672922134399414, "global_step": 324024, "epoch": 1928} {"train_loss": -10.925469398498535, "global_step": 324025, "epoch": 1928} {"train_loss": -10.409571647644043, "global_step": 324026, "epoch": 1928} {"train_loss": -11.08038330078125, "global_step": 324027, "epoch": 1928} {"train_loss": -11.148324966430664, "global_step": 324028, "epoch": 1928} {"train_loss": -11.279769897460938, "global_step": 324029, "epoch": 1928} {"train_loss": -11.222574234008789, "global_step": 324030, "epoch": 1928} {"train_loss": -11.270187377929688, "global_step": 324031, "epoch": 1928} {"train_loss": -11.686761856079102, "global_step": 324032, "epoch": 1928} {"train_loss": -11.378385543823242, "global_step": 324033, "epoch": 1928} {"train_loss": -11.394233703613281, "global_step": 324034, "epoch": 1928} {"train_loss": -11.787839889526367, "global_step": 324035, "epoch": 1928} {"train_loss": -11.574612617492676, "global_step": 324036, "epoch": 1928} {"train_loss": -11.749874114990234, "global_step": 324037, "epoch": 1928} {"train_loss": -11.432563781738281, "global_step": 324038, "epoch": 1928} {"train_loss": -11.693733215332031, "global_step": 324039, "epoch": 1928} {"train_loss": -11.581720352172852, "global_step": 324040, "epoch": 1928} {"train_loss": -11.540797233581543, "global_step": 324041, "epoch": 1928} {"train_loss": -11.730290412902832, "global_step": 324042, "epoch": 1928} {"train_loss": -11.715228080749512, "global_step": 324043, "epoch": 1928} {"train_loss": -11.340585708618164, "global_step": 324044, "epoch": 1928} {"train_loss": -11.709781646728516, "global_step": 324045, "epoch": 1928} {"train_loss": -11.810855865478516, "global_step": 324046, "epoch": 1928} {"train_loss": -12.051654815673828, "global_step": 324047, "epoch": 1928} {"train_loss": -12.184432029724121, "global_step": 324048, "epoch": 1928} {"train_loss": -11.707521438598633, "global_step": 324049, "epoch": 1928} {"train_loss": -12.142492294311523, "global_step": 324050, "epoch": 1928} {"train_loss": -11.90938663482666, "global_step": 324051, "epoch": 1928} {"train_loss": -11.90709114074707, "global_step": 324052, "epoch": 1928} {"train_loss": -11.661653518676758, "global_step": 324053, "epoch": 1928} {"train_loss": -11.767045974731445, "global_step": 324054, "epoch": 1928} {"train_loss": -11.760228157043457, "global_step": 324055, "epoch": 1928} {"train_loss": -11.786861419677734, "global_step": 324056, "epoch": 1928} {"train_loss": -11.468138694763184, "global_step": 324057, "epoch": 1928} {"train_loss": -11.602960586547852, "global_step": 324058, "epoch": 1928} {"train_loss": -11.984498023986816, "global_step": 324059, "epoch": 1928} {"train_loss": -11.387639999389648, "global_step": 324060, "epoch": 1928} {"train_loss": -12.01919937133789, "global_step": 324061, "epoch": 1928} {"train_loss": -11.657365798950195, "global_step": 324062, "epoch": 1928} {"train_loss": -12.070405006408691, "global_step": 324063, "epoch": 1928} {"train_loss": -11.577133178710938, "global_step": 324064, "epoch": 1928} {"train_loss": -11.929512023925781, "global_step": 324065, "epoch": 1928} {"train_loss": -11.958537101745605, "global_step": 324066, "epoch": 1928} {"train_loss": -11.644506454467773, "global_step": 324067, "epoch": 1928} {"train_loss": -12.148932456970215, "global_step": 324068, "epoch": 1928} {"train_loss": -11.590639114379883, "global_step": 324069, "epoch": 1928} {"train_loss": -12.104084014892578, "global_step": 324070, "epoch": 1928} {"train_loss": -11.926419411386762, "global_step": 324071, "epoch": 1928, "val_loss": 287796.4375} {"train_loss": -11.889792442321777, "global_step": 324072, "epoch": 1929} {"train_loss": -12.095647811889648, "global_step": 324073, "epoch": 1929} {"train_loss": -12.037355422973633, "global_step": 324074, "epoch": 1929} {"train_loss": -11.964494705200195, "global_step": 324075, "epoch": 1929} {"train_loss": -12.044683456420898, "global_step": 324076, "epoch": 1929} {"train_loss": -12.09074592590332, "global_step": 324077, "epoch": 1929} {"train_loss": -11.927084922790527, "global_step": 324078, "epoch": 1929} {"train_loss": -12.259888648986816, "global_step": 324079, "epoch": 1929} {"train_loss": -12.13837718963623, "global_step": 324080, "epoch": 1929} {"train_loss": -12.248266220092773, "global_step": 324081, "epoch": 1929} {"train_loss": -12.177947998046875, "global_step": 324082, "epoch": 1929} {"train_loss": -12.275283813476562, "global_step": 324083, "epoch": 1929} {"train_loss": -11.93962574005127, "global_step": 324084, "epoch": 1929} {"train_loss": -12.268192291259766, "global_step": 324085, "epoch": 1929} {"train_loss": -11.99540901184082, "global_step": 324086, "epoch": 1929} {"train_loss": -12.101828575134277, "global_step": 324087, "epoch": 1929} {"train_loss": -12.06019401550293, "global_step": 324088, "epoch": 1929} {"train_loss": -12.399015426635742, "global_step": 324089, "epoch": 1929} {"train_loss": -12.363030433654785, "global_step": 324090, "epoch": 1929} {"train_loss": -12.296985626220703, "global_step": 324091, "epoch": 1929} {"train_loss": -12.148778915405273, "global_step": 324092, "epoch": 1929} {"train_loss": -12.308645248413086, "global_step": 324093, "epoch": 1929} {"train_loss": -12.174278259277344, "global_step": 324094, "epoch": 1929} {"train_loss": -12.370329856872559, "global_step": 324095, "epoch": 1929} {"train_loss": -12.209839820861816, "global_step": 324096, "epoch": 1929} {"train_loss": -12.206090927124023, "global_step": 324097, "epoch": 1929} {"train_loss": -12.535394668579102, "global_step": 324098, "epoch": 1929} {"train_loss": -12.225213050842285, "global_step": 324099, "epoch": 1929} {"train_loss": -12.291616439819336, "global_step": 324100, "epoch": 1929} {"train_loss": -12.40715217590332, "global_step": 324101, "epoch": 1929} {"train_loss": -12.49055004119873, "global_step": 324102, "epoch": 1929} {"train_loss": -12.249027252197266, "global_step": 324103, "epoch": 1929} {"train_loss": -12.478095054626465, "global_step": 324104, "epoch": 1929} {"train_loss": -12.348639488220215, "global_step": 324105, "epoch": 1929} {"train_loss": -12.269613265991211, "global_step": 324106, "epoch": 1929} {"train_loss": -12.137287139892578, "global_step": 324107, "epoch": 1929} {"train_loss": -12.307689666748047, "global_step": 324108, "epoch": 1929} {"train_loss": -12.41339111328125, "global_step": 324109, "epoch": 1929} {"train_loss": -12.439695358276367, "global_step": 324110, "epoch": 1929} {"train_loss": -12.342957496643066, "global_step": 324111, "epoch": 1929} {"train_loss": -12.647806167602539, "global_step": 324112, "epoch": 1929} {"train_loss": -12.309063911437988, "global_step": 324113, "epoch": 1929} {"train_loss": -12.475790023803711, "global_step": 324114, "epoch": 1929} {"train_loss": -12.523662567138672, "global_step": 324115, "epoch": 1929} {"train_loss": -12.438468933105469, "global_step": 324116, "epoch": 1929} {"train_loss": -12.390426635742188, "global_step": 324117, "epoch": 1929} {"train_loss": -12.581727981567383, "global_step": 324118, "epoch": 1929} {"train_loss": -12.310810089111328, "global_step": 324119, "epoch": 1929} {"train_loss": -12.421195030212402, "global_step": 324120, "epoch": 1929} {"train_loss": -12.55484390258789, "global_step": 324121, "epoch": 1929} {"train_loss": -12.257643699645996, "global_step": 324122, "epoch": 1929} {"train_loss": -12.206180572509766, "global_step": 324123, "epoch": 1929} {"train_loss": -12.450247764587402, "global_step": 324124, "epoch": 1929} {"train_loss": -12.432459831237793, "global_step": 324125, "epoch": 1929} {"train_loss": -11.897408485412598, "global_step": 324126, "epoch": 1929} {"train_loss": -11.539944648742676, "global_step": 324127, "epoch": 1929} {"train_loss": -12.280990600585938, "global_step": 324128, "epoch": 1929} {"train_loss": -12.153952598571777, "global_step": 324129, "epoch": 1929} {"train_loss": -11.647321701049805, "global_step": 324130, "epoch": 1929} {"train_loss": -12.331730842590332, "global_step": 324131, "epoch": 1929} {"train_loss": -12.390054702758789, "global_step": 324132, "epoch": 1929} {"train_loss": -12.406170845031738, "global_step": 324133, "epoch": 1929} {"train_loss": -12.059496879577637, "global_step": 324134, "epoch": 1929} {"train_loss": -12.368061065673828, "global_step": 324135, "epoch": 1929} {"train_loss": -12.497303009033203, "global_step": 324136, "epoch": 1929} {"train_loss": -12.443534851074219, "global_step": 324137, "epoch": 1929} {"train_loss": -12.55412483215332, "global_step": 324138, "epoch": 1929} {"train_loss": -12.501943588256836, "global_step": 324139, "epoch": 1929} {"train_loss": -12.6975736618042, "global_step": 324140, "epoch": 1929} {"train_loss": -12.307037353515625, "global_step": 324141, "epoch": 1929} {"train_loss": -12.260967254638672, "global_step": 324142, "epoch": 1929} {"train_loss": -11.96141242980957, "global_step": 324143, "epoch": 1929} {"train_loss": -12.650956153869629, "global_step": 324144, "epoch": 1929} {"train_loss": -11.391140937805176, "global_step": 324145, "epoch": 1929} {"train_loss": -10.360237121582031, "global_step": 324146, "epoch": 1929} {"train_loss": -10.28631591796875, "global_step": 324147, "epoch": 1929} {"train_loss": -11.585808753967285, "global_step": 324148, "epoch": 1929} {"train_loss": -10.512341499328613, "global_step": 324149, "epoch": 1929} {"train_loss": -11.114645957946777, "global_step": 324150, "epoch": 1929} {"train_loss": -10.969722747802734, "global_step": 324151, "epoch": 1929} {"train_loss": -11.245057106018066, "global_step": 324152, "epoch": 1929} {"train_loss": -11.365720748901367, "global_step": 324153, "epoch": 1929} {"train_loss": -11.855579376220703, "global_step": 324154, "epoch": 1929} {"train_loss": -11.975308418273926, "global_step": 324155, "epoch": 1929} {"train_loss": -12.100746154785156, "global_step": 324156, "epoch": 1929} {"train_loss": -11.476175308227539, "global_step": 324157, "epoch": 1929} {"train_loss": -10.930929183959961, "global_step": 324158, "epoch": 1929} {"train_loss": -10.915318489074707, "global_step": 324159, "epoch": 1929} {"train_loss": -12.013190269470215, "global_step": 324160, "epoch": 1929} {"train_loss": -11.259302139282227, "global_step": 324161, "epoch": 1929} {"train_loss": -11.090253829956055, "global_step": 324162, "epoch": 1929} {"train_loss": -10.745645523071289, "global_step": 324163, "epoch": 1929} {"train_loss": -10.922396659851074, "global_step": 324164, "epoch": 1929} {"train_loss": -10.736806869506836, "global_step": 324165, "epoch": 1929} {"train_loss": -9.63962459564209, "global_step": 324166, "epoch": 1929} {"train_loss": -10.582597732543945, "global_step": 324167, "epoch": 1929} {"train_loss": -9.422873497009277, "global_step": 324168, "epoch": 1929} {"train_loss": -10.879870414733887, "global_step": 324169, "epoch": 1929} {"train_loss": -9.531713485717773, "global_step": 324170, "epoch": 1929} {"train_loss": -10.852843284606934, "global_step": 324171, "epoch": 1929} {"train_loss": -10.134806632995605, "global_step": 324172, "epoch": 1929} {"train_loss": -9.659294128417969, "global_step": 324173, "epoch": 1929} {"train_loss": -9.54553508758545, "global_step": 324174, "epoch": 1929} {"train_loss": -9.297797203063965, "global_step": 324175, "epoch": 1929} {"train_loss": -10.17538070678711, "global_step": 324176, "epoch": 1929} {"train_loss": -10.330652236938477, "global_step": 324177, "epoch": 1929} {"train_loss": -9.280801773071289, "global_step": 324178, "epoch": 1929} {"train_loss": -10.805684089660645, "global_step": 324179, "epoch": 1929} {"train_loss": -9.68477725982666, "global_step": 324180, "epoch": 1929} {"train_loss": -10.007490158081055, "global_step": 324181, "epoch": 1929} {"train_loss": -10.104443550109863, "global_step": 324182, "epoch": 1929} {"train_loss": -11.264215469360352, "global_step": 324183, "epoch": 1929} {"train_loss": -10.053044319152832, "global_step": 324184, "epoch": 1929} {"train_loss": -11.297737121582031, "global_step": 324185, "epoch": 1929} {"train_loss": -10.565771102905273, "global_step": 324186, "epoch": 1929} {"train_loss": -10.699600219726562, "global_step": 324187, "epoch": 1929} {"train_loss": -11.231481552124023, "global_step": 324188, "epoch": 1929} {"train_loss": -10.97593879699707, "global_step": 324189, "epoch": 1929} {"train_loss": -11.024785995483398, "global_step": 324190, "epoch": 1929} {"train_loss": -11.200393676757812, "global_step": 324191, "epoch": 1929} {"train_loss": -11.443855285644531, "global_step": 324192, "epoch": 1929} {"train_loss": -11.304956436157227, "global_step": 324193, "epoch": 1929} {"train_loss": -11.750043869018555, "global_step": 324194, "epoch": 1929} {"train_loss": -11.405508041381836, "global_step": 324195, "epoch": 1929} {"train_loss": -11.732361793518066, "global_step": 324196, "epoch": 1929} {"train_loss": -11.446672439575195, "global_step": 324197, "epoch": 1929} {"train_loss": -11.927949905395508, "global_step": 324198, "epoch": 1929} {"train_loss": -10.770723342895508, "global_step": 324199, "epoch": 1929} {"train_loss": -11.823256492614746, "global_step": 324200, "epoch": 1929} {"train_loss": -11.308135032653809, "global_step": 324201, "epoch": 1929} {"train_loss": -11.636955261230469, "global_step": 324202, "epoch": 1929} {"train_loss": -11.860698699951172, "global_step": 324203, "epoch": 1929} {"train_loss": -11.889936447143555, "global_step": 324204, "epoch": 1929} {"train_loss": -11.726662635803223, "global_step": 324205, "epoch": 1929} {"train_loss": -12.067696571350098, "global_step": 324206, "epoch": 1929} {"train_loss": -11.583346366882324, "global_step": 324207, "epoch": 1929} {"train_loss": -11.75648307800293, "global_step": 324208, "epoch": 1929} {"train_loss": -11.808940887451172, "global_step": 324209, "epoch": 1929} {"train_loss": -11.659624099731445, "global_step": 324210, "epoch": 1929} {"train_loss": -11.691352844238281, "global_step": 324211, "epoch": 1929} {"train_loss": -11.82347297668457, "global_step": 324212, "epoch": 1929} {"train_loss": -11.792213439941406, "global_step": 324213, "epoch": 1929} {"train_loss": -12.119256019592285, "global_step": 324214, "epoch": 1929} {"train_loss": -11.662826538085938, "global_step": 324215, "epoch": 1929} {"train_loss": -11.991795539855957, "global_step": 324216, "epoch": 1929} {"train_loss": -11.80245304107666, "global_step": 324217, "epoch": 1929} {"train_loss": -11.96369743347168, "global_step": 324218, "epoch": 1929} {"train_loss": -11.752113342285156, "global_step": 324219, "epoch": 1929} {"train_loss": -12.029786109924316, "global_step": 324220, "epoch": 1929} {"train_loss": -11.912378311157227, "global_step": 324221, "epoch": 1929} {"train_loss": -12.02861213684082, "global_step": 324222, "epoch": 1929} {"train_loss": -11.953374862670898, "global_step": 324223, "epoch": 1929} {"train_loss": -12.078662872314453, "global_step": 324224, "epoch": 1929} {"train_loss": -12.031381607055664, "global_step": 324225, "epoch": 1929} {"train_loss": -12.020914077758789, "global_step": 324226, "epoch": 1929} {"train_loss": -11.862764358520508, "global_step": 324227, "epoch": 1929} {"train_loss": -12.186280250549316, "global_step": 324228, "epoch": 1929} {"train_loss": -11.507579803466797, "global_step": 324229, "epoch": 1929} {"train_loss": -12.169122695922852, "global_step": 324230, "epoch": 1929} {"train_loss": -11.874612808227539, "global_step": 324231, "epoch": 1929} {"train_loss": -12.118647575378418, "global_step": 324232, "epoch": 1929} {"train_loss": -11.80807876586914, "global_step": 324233, "epoch": 1929} {"train_loss": -12.155840873718262, "global_step": 324234, "epoch": 1929} {"train_loss": -11.883199691772461, "global_step": 324235, "epoch": 1929} {"train_loss": -12.168030738830566, "global_step": 324236, "epoch": 1929} {"train_loss": -12.137916564941406, "global_step": 324237, "epoch": 1929} {"train_loss": -11.988801002502441, "global_step": 324238, "epoch": 1929} {"train_loss": -11.705825090408325, "global_step": 324239, "epoch": 1929, "val_loss": 287080.90625} {"train_loss": -12.125776290893555, "global_step": 324240, "epoch": 1930} {"train_loss": -12.124041557312012, "global_step": 324241, "epoch": 1930} {"train_loss": -12.132619857788086, "global_step": 324242, "epoch": 1930} {"train_loss": -12.25313949584961, "global_step": 324243, "epoch": 1930} {"train_loss": -12.263313293457031, "global_step": 324244, "epoch": 1930} {"train_loss": -12.383231163024902, "global_step": 324245, "epoch": 1930} {"train_loss": -12.17892074584961, "global_step": 324246, "epoch": 1930} {"train_loss": -12.545478820800781, "global_step": 324247, "epoch": 1930} {"train_loss": -12.32227897644043, "global_step": 324248, "epoch": 1930} {"train_loss": -12.155410766601562, "global_step": 324249, "epoch": 1930} {"train_loss": -12.223590850830078, "global_step": 324250, "epoch": 1930} {"train_loss": -12.412101745605469, "global_step": 324251, "epoch": 1930} {"train_loss": -12.33501148223877, "global_step": 324252, "epoch": 1930} {"train_loss": -12.263542175292969, "global_step": 324253, "epoch": 1930} {"train_loss": -12.585036277770996, "global_step": 324254, "epoch": 1930} {"train_loss": -12.410332679748535, "global_step": 324255, "epoch": 1930} {"train_loss": -12.487483978271484, "global_step": 324256, "epoch": 1930} {"train_loss": -12.42741584777832, "global_step": 324257, "epoch": 1930} {"train_loss": -12.113292694091797, "global_step": 324258, "epoch": 1930} {"train_loss": -12.438085556030273, "global_step": 324259, "epoch": 1930} {"train_loss": -12.346903800964355, "global_step": 324260, "epoch": 1930} {"train_loss": -12.388784408569336, "global_step": 324261, "epoch": 1930} {"train_loss": -12.482980728149414, "global_step": 324262, "epoch": 1930} {"train_loss": -12.426114082336426, "global_step": 324263, "epoch": 1930} {"train_loss": -12.46725845336914, "global_step": 324264, "epoch": 1930} {"train_loss": -12.483397483825684, "global_step": 324265, "epoch": 1930} {"train_loss": -12.387653350830078, "global_step": 324266, "epoch": 1930} {"train_loss": -12.257305145263672, "global_step": 324267, "epoch": 1930} {"train_loss": -12.072477340698242, "global_step": 324268, "epoch": 1930} {"train_loss": -12.114590644836426, "global_step": 324269, "epoch": 1930} {"train_loss": -12.019745826721191, "global_step": 324270, "epoch": 1930} {"train_loss": -12.078115463256836, "global_step": 324271, "epoch": 1930} {"train_loss": -12.274551391601562, "global_step": 324272, "epoch": 1930} {"train_loss": -11.761520385742188, "global_step": 324273, "epoch": 1930} {"train_loss": -12.375234603881836, "global_step": 324274, "epoch": 1930} {"train_loss": -11.74770736694336, "global_step": 324275, "epoch": 1930} {"train_loss": -12.120257377624512, "global_step": 324276, "epoch": 1930} {"train_loss": -12.15106201171875, "global_step": 324277, "epoch": 1930} {"train_loss": -11.718951225280762, "global_step": 324278, "epoch": 1930} {"train_loss": -11.751306533813477, "global_step": 324279, "epoch": 1930} {"train_loss": -12.289148330688477, "global_step": 324280, "epoch": 1930} {"train_loss": -11.696556091308594, "global_step": 324281, "epoch": 1930} {"train_loss": -12.272406578063965, "global_step": 324282, "epoch": 1930} {"train_loss": -12.123841285705566, "global_step": 324283, "epoch": 1930} {"train_loss": -11.67032241821289, "global_step": 324284, "epoch": 1930} {"train_loss": -11.6054105758667, "global_step": 324285, "epoch": 1930} {"train_loss": -11.9166259765625, "global_step": 324286, "epoch": 1930} {"train_loss": -11.446969985961914, "global_step": 324287, "epoch": 1930} {"train_loss": -11.820328712463379, "global_step": 324288, "epoch": 1930} {"train_loss": -11.473769187927246, "global_step": 324289, "epoch": 1930} {"train_loss": -10.258169174194336, "global_step": 324290, "epoch": 1930} {"train_loss": -12.097731590270996, "global_step": 324291, "epoch": 1930} {"train_loss": -11.540693283081055, "global_step": 324292, "epoch": 1930} {"train_loss": -10.846122741699219, "global_step": 324293, "epoch": 1930} {"train_loss": -11.53689193725586, "global_step": 324294, "epoch": 1930} {"train_loss": -11.652259826660156, "global_step": 324295, "epoch": 1930} {"train_loss": -11.875791549682617, "global_step": 324296, "epoch": 1930} {"train_loss": -12.09231948852539, "global_step": 324297, "epoch": 1930} {"train_loss": -11.68417739868164, "global_step": 324298, "epoch": 1930} {"train_loss": -11.654102325439453, "global_step": 324299, "epoch": 1930} {"train_loss": -11.88925838470459, "global_step": 324300, "epoch": 1930} {"train_loss": -12.0635986328125, "global_step": 324301, "epoch": 1930} {"train_loss": -12.044391632080078, "global_step": 324302, "epoch": 1930} {"train_loss": -12.049354553222656, "global_step": 324303, "epoch": 1930} {"train_loss": -11.75765323638916, "global_step": 324304, "epoch": 1930} {"train_loss": -11.895275115966797, "global_step": 324305, "epoch": 1930} {"train_loss": -11.921625137329102, "global_step": 324306, "epoch": 1930} {"train_loss": -12.295181274414062, "global_step": 324307, "epoch": 1930} {"train_loss": -11.760705947875977, "global_step": 324308, "epoch": 1930} {"train_loss": -12.066661834716797, "global_step": 324309, "epoch": 1930} {"train_loss": -12.128488540649414, "global_step": 324310, "epoch": 1930} {"train_loss": -11.844189643859863, "global_step": 324311, "epoch": 1930} {"train_loss": -11.721948623657227, "global_step": 324312, "epoch": 1930} {"train_loss": -11.990060806274414, "global_step": 324313, "epoch": 1930} {"train_loss": -12.123534202575684, "global_step": 324314, "epoch": 1930} {"train_loss": -11.689373016357422, "global_step": 324315, "epoch": 1930} {"train_loss": -12.096830368041992, "global_step": 324316, "epoch": 1930} {"train_loss": -11.97789478302002, "global_step": 324317, "epoch": 1930} {"train_loss": -12.038758277893066, "global_step": 324318, "epoch": 1930} {"train_loss": -11.639974594116211, "global_step": 324319, "epoch": 1930} {"train_loss": -12.10400104522705, "global_step": 324320, "epoch": 1930} {"train_loss": -11.86954116821289, "global_step": 324321, "epoch": 1930} {"train_loss": -11.093154907226562, "global_step": 324322, "epoch": 1930} {"train_loss": -11.920650482177734, "global_step": 324323, "epoch": 1930} {"train_loss": -12.379668235778809, "global_step": 324324, "epoch": 1930} {"train_loss": -12.191020965576172, "global_step": 324325, "epoch": 1930} {"train_loss": -12.142599105834961, "global_step": 324326, "epoch": 1930} {"train_loss": -12.036049842834473, "global_step": 324327, "epoch": 1930} {"train_loss": -11.924657821655273, "global_step": 324328, "epoch": 1930} {"train_loss": -12.348796844482422, "global_step": 324329, "epoch": 1930} {"train_loss": -12.354063034057617, "global_step": 324330, "epoch": 1930} {"train_loss": -12.220149040222168, "global_step": 324331, "epoch": 1930} {"train_loss": -12.232376098632812, "global_step": 324332, "epoch": 1930} {"train_loss": -12.388556480407715, "global_step": 324333, "epoch": 1930} {"train_loss": -11.890111923217773, "global_step": 324334, "epoch": 1930} {"train_loss": -12.301878929138184, "global_step": 324335, "epoch": 1930} {"train_loss": -12.118711471557617, "global_step": 324336, "epoch": 1930} {"train_loss": -12.257495880126953, "global_step": 324337, "epoch": 1930} {"train_loss": -12.154264450073242, "global_step": 324338, "epoch": 1930} {"train_loss": -12.412376403808594, "global_step": 324339, "epoch": 1930} {"train_loss": -11.795137405395508, "global_step": 324340, "epoch": 1930} {"train_loss": -11.93249797821045, "global_step": 324341, "epoch": 1930} {"train_loss": -12.157124519348145, "global_step": 324342, "epoch": 1930} {"train_loss": -11.79749584197998, "global_step": 324343, "epoch": 1930} {"train_loss": -12.147334098815918, "global_step": 324344, "epoch": 1930} {"train_loss": -12.429849624633789, "global_step": 324345, "epoch": 1930} {"train_loss": -12.060418128967285, "global_step": 324346, "epoch": 1930} {"train_loss": -12.350114822387695, "global_step": 324347, "epoch": 1930} {"train_loss": -11.986028671264648, "global_step": 324348, "epoch": 1930} {"train_loss": -12.13764762878418, "global_step": 324349, "epoch": 1930} {"train_loss": -12.169373512268066, "global_step": 324350, "epoch": 1930} {"train_loss": -11.863012313842773, "global_step": 324351, "epoch": 1930} {"train_loss": -11.939165115356445, "global_step": 324352, "epoch": 1930} {"train_loss": -12.163642883300781, "global_step": 324353, "epoch": 1930} {"train_loss": -11.881855010986328, "global_step": 324354, "epoch": 1930} {"train_loss": -11.620887756347656, "global_step": 324355, "epoch": 1930} {"train_loss": -11.990193367004395, "global_step": 324356, "epoch": 1930} {"train_loss": -11.111538887023926, "global_step": 324357, "epoch": 1930} {"train_loss": -11.742403984069824, "global_step": 324358, "epoch": 1930} {"train_loss": -11.32265567779541, "global_step": 324359, "epoch": 1930} {"train_loss": -10.391733169555664, "global_step": 324360, "epoch": 1930} {"train_loss": -11.45645523071289, "global_step": 324361, "epoch": 1930} {"train_loss": -12.116344451904297, "global_step": 324362, "epoch": 1930} {"train_loss": -10.438051223754883, "global_step": 324363, "epoch": 1930} {"train_loss": -11.571069717407227, "global_step": 324364, "epoch": 1930} {"train_loss": -11.677728652954102, "global_step": 324365, "epoch": 1930} {"train_loss": -10.895872116088867, "global_step": 324366, "epoch": 1930} {"train_loss": -12.030967712402344, "global_step": 324367, "epoch": 1930} {"train_loss": -11.780396461486816, "global_step": 324368, "epoch": 1930} {"train_loss": -10.771102905273438, "global_step": 324369, "epoch": 1930} {"train_loss": -11.918179512023926, "global_step": 324370, "epoch": 1930} {"train_loss": -11.785505294799805, "global_step": 324371, "epoch": 1930} {"train_loss": -11.818045616149902, "global_step": 324372, "epoch": 1930} {"train_loss": -11.370708465576172, "global_step": 324373, "epoch": 1930} {"train_loss": -11.6787691116333, "global_step": 324374, "epoch": 1930} {"train_loss": -11.153804779052734, "global_step": 324375, "epoch": 1930} {"train_loss": -11.508672714233398, "global_step": 324376, "epoch": 1930} {"train_loss": -11.799293518066406, "global_step": 324377, "epoch": 1930} {"train_loss": -11.641257286071777, "global_step": 324378, "epoch": 1930} {"train_loss": -11.944400787353516, "global_step": 324379, "epoch": 1930} {"train_loss": -11.457540512084961, "global_step": 324380, "epoch": 1930} {"train_loss": -11.313741683959961, "global_step": 324381, "epoch": 1930} {"train_loss": -11.277185440063477, "global_step": 324382, "epoch": 1930} {"train_loss": -11.452205657958984, "global_step": 324383, "epoch": 1930} {"train_loss": -11.799479484558105, "global_step": 324384, "epoch": 1930} {"train_loss": -11.787178039550781, "global_step": 324385, "epoch": 1930} {"train_loss": -11.865509033203125, "global_step": 324386, "epoch": 1930} {"train_loss": -11.677106857299805, "global_step": 324387, "epoch": 1930} {"train_loss": -11.844780921936035, "global_step": 324388, "epoch": 1930} {"train_loss": -11.69753646850586, "global_step": 324389, "epoch": 1930} {"train_loss": -12.114961624145508, "global_step": 324390, "epoch": 1930} {"train_loss": -11.744606018066406, "global_step": 324391, "epoch": 1930} {"train_loss": -11.609468460083008, "global_step": 324392, "epoch": 1930} {"train_loss": -11.708499908447266, "global_step": 324393, "epoch": 1930} {"train_loss": -11.505949020385742, "global_step": 324394, "epoch": 1930} {"train_loss": -11.933414459228516, "global_step": 324395, "epoch": 1930} {"train_loss": -11.822417259216309, "global_step": 324396, "epoch": 1930} {"train_loss": -12.07607364654541, "global_step": 324397, "epoch": 1930} {"train_loss": -12.191028594970703, "global_step": 324398, "epoch": 1930} {"train_loss": -11.870930671691895, "global_step": 324399, "epoch": 1930} {"train_loss": -11.853902816772461, "global_step": 324400, "epoch": 1930} {"train_loss": -12.0693359375, "global_step": 324401, "epoch": 1930} {"train_loss": -11.957921981811523, "global_step": 324402, "epoch": 1930} {"train_loss": -12.044081687927246, "global_step": 324403, "epoch": 1930} {"train_loss": -11.972810745239258, "global_step": 324404, "epoch": 1930} {"train_loss": -11.763014793395996, "global_step": 324405, "epoch": 1930} {"train_loss": -11.959604263305664, "global_step": 324406, "epoch": 1930} {"train_loss": -11.92225182056427, "global_step": 324407, "epoch": 1930, "val_loss": 285108.09375, "train_action_mse_error": 0.6984849572181702} {"train_loss": -11.52168083190918, "global_step": 324408, "epoch": 1931} {"train_loss": -11.8749418258667, "global_step": 324409, "epoch": 1931} {"train_loss": -11.915223121643066, "global_step": 324410, "epoch": 1931} {"train_loss": -12.359912872314453, "global_step": 324411, "epoch": 1931} {"train_loss": -11.404932022094727, "global_step": 324412, "epoch": 1931} {"train_loss": -11.759899139404297, "global_step": 324413, "epoch": 1931} {"train_loss": -11.601106643676758, "global_step": 324414, "epoch": 1931} {"train_loss": -11.787784576416016, "global_step": 324415, "epoch": 1931} {"train_loss": -11.199812889099121, "global_step": 324416, "epoch": 1931} {"train_loss": -11.583703994750977, "global_step": 324417, "epoch": 1931} {"train_loss": -11.704994201660156, "global_step": 324418, "epoch": 1931} {"train_loss": -12.190635681152344, "global_step": 324419, "epoch": 1931} {"train_loss": -12.038921356201172, "global_step": 324420, "epoch": 1931} {"train_loss": -11.550362586975098, "global_step": 324421, "epoch": 1931} {"train_loss": -12.389738082885742, "global_step": 324422, "epoch": 1931} {"train_loss": -11.904891014099121, "global_step": 324423, "epoch": 1931} {"train_loss": -12.100696563720703, "global_step": 324424, "epoch": 1931} {"train_loss": -12.122940063476562, "global_step": 324425, "epoch": 1931} {"train_loss": -12.374194145202637, "global_step": 324426, "epoch": 1931} {"train_loss": -11.65281867980957, "global_step": 324427, "epoch": 1931} {"train_loss": -12.311622619628906, "global_step": 324428, "epoch": 1931} {"train_loss": -12.478721618652344, "global_step": 324429, "epoch": 1931} {"train_loss": -12.421112060546875, "global_step": 324430, "epoch": 1931} {"train_loss": -12.347685813903809, "global_step": 324431, "epoch": 1931} {"train_loss": -12.44182014465332, "global_step": 324432, "epoch": 1931} {"train_loss": -12.349143981933594, "global_step": 324433, "epoch": 1931} {"train_loss": -12.423338890075684, "global_step": 324434, "epoch": 1931} {"train_loss": -12.296236038208008, "global_step": 324435, "epoch": 1931} {"train_loss": -12.385009765625, "global_step": 324436, "epoch": 1931} {"train_loss": -12.05815601348877, "global_step": 324437, "epoch": 1931} {"train_loss": -12.264284133911133, "global_step": 324438, "epoch": 1931} {"train_loss": -12.283208847045898, "global_step": 324439, "epoch": 1931} {"train_loss": -12.129609107971191, "global_step": 324440, "epoch": 1931} {"train_loss": -12.361978530883789, "global_step": 324441, "epoch": 1931} {"train_loss": -11.371253967285156, "global_step": 324442, "epoch": 1931} {"train_loss": -12.448163032531738, "global_step": 324443, "epoch": 1931} {"train_loss": -12.473125457763672, "global_step": 324444, "epoch": 1931} {"train_loss": -12.426154136657715, "global_step": 324445, "epoch": 1931} {"train_loss": -12.381637573242188, "global_step": 324446, "epoch": 1931} {"train_loss": -12.230016708374023, "global_step": 324447, "epoch": 1931} {"train_loss": -12.236665725708008, "global_step": 324448, "epoch": 1931} {"train_loss": -12.409518241882324, "global_step": 324449, "epoch": 1931} {"train_loss": -12.157596588134766, "global_step": 324450, "epoch": 1931} {"train_loss": -12.484978675842285, "global_step": 324451, "epoch": 1931} {"train_loss": -12.374494552612305, "global_step": 324452, "epoch": 1931} {"train_loss": -12.643474578857422, "global_step": 324453, "epoch": 1931} {"train_loss": -12.414347648620605, "global_step": 324454, "epoch": 1931} {"train_loss": -12.11231803894043, "global_step": 324455, "epoch": 1931} {"train_loss": -12.332107543945312, "global_step": 324456, "epoch": 1931} {"train_loss": -12.343154907226562, "global_step": 324457, "epoch": 1931} {"train_loss": -12.178387641906738, "global_step": 324458, "epoch": 1931} {"train_loss": -12.503828048706055, "global_step": 324459, "epoch": 1931} {"train_loss": -12.408012390136719, "global_step": 324460, "epoch": 1931} {"train_loss": -12.179826736450195, "global_step": 324461, "epoch": 1931} {"train_loss": -12.154470443725586, "global_step": 324462, "epoch": 1931} {"train_loss": -12.121307373046875, "global_step": 324463, "epoch": 1931} {"train_loss": -11.104342460632324, "global_step": 324464, "epoch": 1931} {"train_loss": -10.763103485107422, "global_step": 324465, "epoch": 1931} {"train_loss": -12.237018585205078, "global_step": 324466, "epoch": 1931} {"train_loss": -12.082986831665039, "global_step": 324467, "epoch": 1931} {"train_loss": -11.451171875, "global_step": 324468, "epoch": 1931} {"train_loss": -11.242347717285156, "global_step": 324469, "epoch": 1931} {"train_loss": -11.47464370727539, "global_step": 324470, "epoch": 1931} {"train_loss": -10.087514877319336, "global_step": 324471, "epoch": 1931} {"train_loss": -10.596517562866211, "global_step": 324472, "epoch": 1931} {"train_loss": -11.005810737609863, "global_step": 324473, "epoch": 1931} {"train_loss": -9.649782180786133, "global_step": 324474, "epoch": 1931} {"train_loss": -9.641557693481445, "global_step": 324475, "epoch": 1931} {"train_loss": -9.983865737915039, "global_step": 324476, "epoch": 1931} {"train_loss": -11.073440551757812, "global_step": 324477, "epoch": 1931} {"train_loss": -10.199209213256836, "global_step": 324478, "epoch": 1931} {"train_loss": -10.941980361938477, "global_step": 324479, "epoch": 1931} {"train_loss": -10.132318496704102, "global_step": 324480, "epoch": 1931} {"train_loss": -10.574127197265625, "global_step": 324481, "epoch": 1931} {"train_loss": -10.788941383361816, "global_step": 324482, "epoch": 1931} {"train_loss": -11.652702331542969, "global_step": 324483, "epoch": 1931} {"train_loss": -11.956851959228516, "global_step": 324484, "epoch": 1931} {"train_loss": -11.36207103729248, "global_step": 324485, "epoch": 1931} {"train_loss": -11.99374771118164, "global_step": 324486, "epoch": 1931} {"train_loss": -11.681574821472168, "global_step": 324487, "epoch": 1931} {"train_loss": -11.886924743652344, "global_step": 324488, "epoch": 1931} {"train_loss": -11.793787002563477, "global_step": 324489, "epoch": 1931} {"train_loss": -11.640308380126953, "global_step": 324490, "epoch": 1931} {"train_loss": -11.942028045654297, "global_step": 324491, "epoch": 1931} {"train_loss": -11.752130508422852, "global_step": 324492, "epoch": 1931} {"train_loss": -11.933603286743164, "global_step": 324493, "epoch": 1931} {"train_loss": -11.628368377685547, "global_step": 324494, "epoch": 1931} {"train_loss": -11.24299430847168, "global_step": 324495, "epoch": 1931} {"train_loss": -12.08476448059082, "global_step": 324496, "epoch": 1931} {"train_loss": -10.836965560913086, "global_step": 324497, "epoch": 1931} {"train_loss": -11.91505241394043, "global_step": 324498, "epoch": 1931} {"train_loss": -11.297843933105469, "global_step": 324499, "epoch": 1931} {"train_loss": -11.081352233886719, "global_step": 324500, "epoch": 1931} {"train_loss": -11.593717575073242, "global_step": 324501, "epoch": 1931} {"train_loss": -10.351383209228516, "global_step": 324502, "epoch": 1931} {"train_loss": -11.209101676940918, "global_step": 324503, "epoch": 1931} {"train_loss": -11.050329208374023, "global_step": 324504, "epoch": 1931} {"train_loss": -10.943841934204102, "global_step": 324505, "epoch": 1931} {"train_loss": -11.90286636352539, "global_step": 324506, "epoch": 1931} {"train_loss": -11.022309303283691, "global_step": 324507, "epoch": 1931} {"train_loss": -11.540914535522461, "global_step": 324508, "epoch": 1931} {"train_loss": -10.920503616333008, "global_step": 324509, "epoch": 1931} {"train_loss": -11.820260047912598, "global_step": 324510, "epoch": 1931} {"train_loss": -11.440882682800293, "global_step": 324511, "epoch": 1931} {"train_loss": -12.004791259765625, "global_step": 324512, "epoch": 1931} {"train_loss": -11.729818344116211, "global_step": 324513, "epoch": 1931} {"train_loss": -11.784734725952148, "global_step": 324514, "epoch": 1931} {"train_loss": -11.598186492919922, "global_step": 324515, "epoch": 1931} {"train_loss": -11.931113243103027, "global_step": 324516, "epoch": 1931} {"train_loss": -11.553277969360352, "global_step": 324517, "epoch": 1931} {"train_loss": -11.781340599060059, "global_step": 324518, "epoch": 1931} {"train_loss": -11.956531524658203, "global_step": 324519, "epoch": 1931} {"train_loss": -11.672386169433594, "global_step": 324520, "epoch": 1931} {"train_loss": -11.77822494506836, "global_step": 324521, "epoch": 1931} {"train_loss": -11.77869987487793, "global_step": 324522, "epoch": 1931} {"train_loss": -12.005285263061523, "global_step": 324523, "epoch": 1931} {"train_loss": -11.577754974365234, "global_step": 324524, "epoch": 1931} {"train_loss": -12.177553176879883, "global_step": 324525, "epoch": 1931} {"train_loss": -11.887880325317383, "global_step": 324526, "epoch": 1931} {"train_loss": -11.993858337402344, "global_step": 324527, "epoch": 1931} {"train_loss": -11.980027198791504, "global_step": 324528, "epoch": 1931} {"train_loss": -12.02627944946289, "global_step": 324529, "epoch": 1931} {"train_loss": -12.115547180175781, "global_step": 324530, "epoch": 1931} {"train_loss": -12.114322662353516, "global_step": 324531, "epoch": 1931} {"train_loss": -11.961684226989746, "global_step": 324532, "epoch": 1931} {"train_loss": -11.85779094696045, "global_step": 324533, "epoch": 1931} {"train_loss": -11.710688591003418, "global_step": 324534, "epoch": 1931} {"train_loss": -11.49190902709961, "global_step": 324535, "epoch": 1931} {"train_loss": -12.002220153808594, "global_step": 324536, "epoch": 1931} {"train_loss": -11.70274543762207, "global_step": 324537, "epoch": 1931} {"train_loss": -12.162039756774902, "global_step": 324538, "epoch": 1931} {"train_loss": -11.467482566833496, "global_step": 324539, "epoch": 1931} {"train_loss": -12.299360275268555, "global_step": 324540, "epoch": 1931} {"train_loss": -11.94413948059082, "global_step": 324541, "epoch": 1931} {"train_loss": -12.073736190795898, "global_step": 324542, "epoch": 1931} {"train_loss": -11.567368507385254, "global_step": 324543, "epoch": 1931} {"train_loss": -11.827232360839844, "global_step": 324544, "epoch": 1931} {"train_loss": -11.791155815124512, "global_step": 324545, "epoch": 1931} {"train_loss": -11.671072006225586, "global_step": 324546, "epoch": 1931} {"train_loss": -12.16561508178711, "global_step": 324547, "epoch": 1931} {"train_loss": -11.273681640625, "global_step": 324548, "epoch": 1931} {"train_loss": -12.184886932373047, "global_step": 324549, "epoch": 1931} {"train_loss": -11.310863494873047, "global_step": 324550, "epoch": 1931} {"train_loss": -11.751086235046387, "global_step": 324551, "epoch": 1931} {"train_loss": -11.838373184204102, "global_step": 324552, "epoch": 1931} {"train_loss": -11.57189655303955, "global_step": 324553, "epoch": 1931} {"train_loss": -11.60073471069336, "global_step": 324554, "epoch": 1931} {"train_loss": -11.65481948852539, "global_step": 324555, "epoch": 1931} {"train_loss": -12.10335922241211, "global_step": 324556, "epoch": 1931} {"train_loss": -11.7404146194458, "global_step": 324557, "epoch": 1931} {"train_loss": -11.896159172058105, "global_step": 324558, "epoch": 1931} {"train_loss": -12.116378784179688, "global_step": 324559, "epoch": 1931} {"train_loss": -11.876121520996094, "global_step": 324560, "epoch": 1931} {"train_loss": -11.842845916748047, "global_step": 324561, "epoch": 1931} {"train_loss": -12.209636688232422, "global_step": 324562, "epoch": 1931} {"train_loss": -11.9089937210083, "global_step": 324563, "epoch": 1931} {"train_loss": -12.048038482666016, "global_step": 324564, "epoch": 1931} {"train_loss": -11.781383514404297, "global_step": 324565, "epoch": 1931} {"train_loss": -12.040380477905273, "global_step": 324566, "epoch": 1931} {"train_loss": -12.243656158447266, "global_step": 324567, "epoch": 1931} {"train_loss": -12.215580940246582, "global_step": 324568, "epoch": 1931} {"train_loss": -12.176996231079102, "global_step": 324569, "epoch": 1931} {"train_loss": -12.161011695861816, "global_step": 324570, "epoch": 1931} {"train_loss": -12.086544036865234, "global_step": 324571, "epoch": 1931} {"train_loss": -11.818305969238281, "global_step": 324572, "epoch": 1931} {"train_loss": -12.237371444702148, "global_step": 324573, "epoch": 1931} {"train_loss": -11.989579200744629, "global_step": 324574, "epoch": 1931} {"train_loss": -11.780991821061997, "global_step": 324575, "epoch": 1931, "val_loss": 289947.53125} {"train_loss": -12.071016311645508, "global_step": 324576, "epoch": 1932} {"train_loss": -11.733284950256348, "global_step": 324577, "epoch": 1932} {"train_loss": -12.348102569580078, "global_step": 324578, "epoch": 1932} {"train_loss": -11.927692413330078, "global_step": 324579, "epoch": 1932} {"train_loss": -11.815413475036621, "global_step": 324580, "epoch": 1932} {"train_loss": -11.931121826171875, "global_step": 324581, "epoch": 1932} {"train_loss": -12.280597686767578, "global_step": 324582, "epoch": 1932} {"train_loss": -11.612205505371094, "global_step": 324583, "epoch": 1932} {"train_loss": -12.102344512939453, "global_step": 324584, "epoch": 1932} {"train_loss": -12.098459243774414, "global_step": 324585, "epoch": 1932} {"train_loss": -12.191920280456543, "global_step": 324586, "epoch": 1932} {"train_loss": -11.79032039642334, "global_step": 324587, "epoch": 1932} {"train_loss": -11.935175895690918, "global_step": 324588, "epoch": 1932} {"train_loss": -11.851139068603516, "global_step": 324589, "epoch": 1932} {"train_loss": -11.957483291625977, "global_step": 324590, "epoch": 1932} {"train_loss": -12.488890647888184, "global_step": 324591, "epoch": 1932} {"train_loss": -11.961260795593262, "global_step": 324592, "epoch": 1932} {"train_loss": -12.426728248596191, "global_step": 324593, "epoch": 1932} {"train_loss": -11.994295120239258, "global_step": 324594, "epoch": 1932} {"train_loss": -11.98617172241211, "global_step": 324595, "epoch": 1932} {"train_loss": -11.644811630249023, "global_step": 324596, "epoch": 1932} {"train_loss": -11.544332504272461, "global_step": 324597, "epoch": 1932} {"train_loss": -12.023446083068848, "global_step": 324598, "epoch": 1932} {"train_loss": -11.391345977783203, "global_step": 324599, "epoch": 1932} {"train_loss": -12.123453140258789, "global_step": 324600, "epoch": 1932} {"train_loss": -11.046049118041992, "global_step": 324601, "epoch": 1932} {"train_loss": -12.054977416992188, "global_step": 324602, "epoch": 1932} {"train_loss": -11.488606452941895, "global_step": 324603, "epoch": 1932} {"train_loss": -11.80375862121582, "global_step": 324604, "epoch": 1932} {"train_loss": -11.875301361083984, "global_step": 324605, "epoch": 1932} {"train_loss": -11.546539306640625, "global_step": 324606, "epoch": 1932} {"train_loss": -12.170117378234863, "global_step": 324607, "epoch": 1932} {"train_loss": -11.782256126403809, "global_step": 324608, "epoch": 1932} {"train_loss": -11.946002960205078, "global_step": 324609, "epoch": 1932} {"train_loss": -11.981840133666992, "global_step": 324610, "epoch": 1932} {"train_loss": -11.892641067504883, "global_step": 324611, "epoch": 1932} {"train_loss": -11.512913703918457, "global_step": 324612, "epoch": 1932} {"train_loss": -11.744318962097168, "global_step": 324613, "epoch": 1932} {"train_loss": -11.850455284118652, "global_step": 324614, "epoch": 1932} {"train_loss": -11.245732307434082, "global_step": 324615, "epoch": 1932} {"train_loss": -12.332895278930664, "global_step": 324616, "epoch": 1932} {"train_loss": -11.709291458129883, "global_step": 324617, "epoch": 1932} {"train_loss": -12.130714416503906, "global_step": 324618, "epoch": 1932} {"train_loss": -11.744779586791992, "global_step": 324619, "epoch": 1932} {"train_loss": -11.289815902709961, "global_step": 324620, "epoch": 1932} {"train_loss": -12.150728225708008, "global_step": 324621, "epoch": 1932} {"train_loss": -11.086748123168945, "global_step": 324622, "epoch": 1932} {"train_loss": -11.864811897277832, "global_step": 324623, "epoch": 1932} {"train_loss": -11.067471504211426, "global_step": 324624, "epoch": 1932} {"train_loss": -11.671390533447266, "global_step": 324625, "epoch": 1932} {"train_loss": -11.823221206665039, "global_step": 324626, "epoch": 1932} {"train_loss": -11.727502822875977, "global_step": 324627, "epoch": 1932} {"train_loss": -11.570213317871094, "global_step": 324628, "epoch": 1932} {"train_loss": -11.783072471618652, "global_step": 324629, "epoch": 1932} {"train_loss": -10.695613861083984, "global_step": 324630, "epoch": 1932} {"train_loss": -11.251991271972656, "global_step": 324631, "epoch": 1932} {"train_loss": -10.845041275024414, "global_step": 324632, "epoch": 1932} {"train_loss": -11.293302536010742, "global_step": 324633, "epoch": 1932} {"train_loss": -11.511421203613281, "global_step": 324634, "epoch": 1932} {"train_loss": -10.881695747375488, "global_step": 324635, "epoch": 1932} {"train_loss": -11.927288055419922, "global_step": 324636, "epoch": 1932} {"train_loss": -11.394207000732422, "global_step": 324637, "epoch": 1932} {"train_loss": -12.003044128417969, "global_step": 324638, "epoch": 1932} {"train_loss": -11.61422348022461, "global_step": 324639, "epoch": 1932} {"train_loss": -11.681398391723633, "global_step": 324640, "epoch": 1932} {"train_loss": -12.142820358276367, "global_step": 324641, "epoch": 1932} {"train_loss": -11.563405990600586, "global_step": 324642, "epoch": 1932} {"train_loss": -12.072708129882812, "global_step": 324643, "epoch": 1932} {"train_loss": -11.61701774597168, "global_step": 324644, "epoch": 1932} {"train_loss": -12.040093421936035, "global_step": 324645, "epoch": 1932} {"train_loss": -12.102659225463867, "global_step": 324646, "epoch": 1932} {"train_loss": -11.746805191040039, "global_step": 324647, "epoch": 1932} {"train_loss": -12.175918579101562, "global_step": 324648, "epoch": 1932} {"train_loss": -11.8775634765625, "global_step": 324649, "epoch": 1932} {"train_loss": -11.802865982055664, "global_step": 324650, "epoch": 1932} {"train_loss": -12.412748336791992, "global_step": 324651, "epoch": 1932} {"train_loss": -11.62171745300293, "global_step": 324652, "epoch": 1932} {"train_loss": -11.816750526428223, "global_step": 324653, "epoch": 1932} {"train_loss": -12.011258125305176, "global_step": 324654, "epoch": 1932} {"train_loss": -11.450034141540527, "global_step": 324655, "epoch": 1932} {"train_loss": -12.363338470458984, "global_step": 324656, "epoch": 1932} {"train_loss": -11.641321182250977, "global_step": 324657, "epoch": 1932} {"train_loss": -12.115978240966797, "global_step": 324658, "epoch": 1932} {"train_loss": -11.733528137207031, "global_step": 324659, "epoch": 1932} {"train_loss": -11.858287811279297, "global_step": 324660, "epoch": 1932} {"train_loss": -11.231764793395996, "global_step": 324661, "epoch": 1932} {"train_loss": -12.217584609985352, "global_step": 324662, "epoch": 1932} {"train_loss": -11.807769775390625, "global_step": 324663, "epoch": 1932} {"train_loss": -11.797370910644531, "global_step": 324664, "epoch": 1932} {"train_loss": -12.140140533447266, "global_step": 324665, "epoch": 1932} {"train_loss": -12.248766899108887, "global_step": 324666, "epoch": 1932} {"train_loss": -12.17018985748291, "global_step": 324667, "epoch": 1932} {"train_loss": -12.071050643920898, "global_step": 324668, "epoch": 1932} {"train_loss": -12.340787887573242, "global_step": 324669, "epoch": 1932} {"train_loss": -12.08640193939209, "global_step": 324670, "epoch": 1932} {"train_loss": -12.212871551513672, "global_step": 324671, "epoch": 1932} {"train_loss": -12.185632705688477, "global_step": 324672, "epoch": 1932} {"train_loss": -12.318964958190918, "global_step": 324673, "epoch": 1932} {"train_loss": -11.965705871582031, "global_step": 324674, "epoch": 1932} {"train_loss": -12.337628364562988, "global_step": 324675, "epoch": 1932} {"train_loss": -12.093735694885254, "global_step": 324676, "epoch": 1932} {"train_loss": -12.305187225341797, "global_step": 324677, "epoch": 1932} {"train_loss": -11.86194133758545, "global_step": 324678, "epoch": 1932} {"train_loss": -12.171783447265625, "global_step": 324679, "epoch": 1932} {"train_loss": -11.757648468017578, "global_step": 324680, "epoch": 1932} {"train_loss": -11.372003555297852, "global_step": 324681, "epoch": 1932} {"train_loss": -11.975651741027832, "global_step": 324682, "epoch": 1932} {"train_loss": -12.119503021240234, "global_step": 324683, "epoch": 1932} {"train_loss": -11.76693344116211, "global_step": 324684, "epoch": 1932} {"train_loss": -11.140975952148438, "global_step": 324685, "epoch": 1932} {"train_loss": -11.483650207519531, "global_step": 324686, "epoch": 1932} {"train_loss": -11.911733627319336, "global_step": 324687, "epoch": 1932} {"train_loss": -11.085620880126953, "global_step": 324688, "epoch": 1932} {"train_loss": -11.708930015563965, "global_step": 324689, "epoch": 1932} {"train_loss": -10.946083068847656, "global_step": 324690, "epoch": 1932} {"train_loss": -11.188167572021484, "global_step": 324691, "epoch": 1932} {"train_loss": -11.828644752502441, "global_step": 324692, "epoch": 1932} {"train_loss": -11.864173889160156, "global_step": 324693, "epoch": 1932} {"train_loss": -11.894813537597656, "global_step": 324694, "epoch": 1932} {"train_loss": -12.12529468536377, "global_step": 324695, "epoch": 1932} {"train_loss": -12.23520278930664, "global_step": 324696, "epoch": 1932} {"train_loss": -11.884936332702637, "global_step": 324697, "epoch": 1932} {"train_loss": -11.869333267211914, "global_step": 324698, "epoch": 1932} {"train_loss": -12.352901458740234, "global_step": 324699, "epoch": 1932} {"train_loss": -11.748811721801758, "global_step": 324700, "epoch": 1932} {"train_loss": -12.008116722106934, "global_step": 324701, "epoch": 1932} {"train_loss": -11.765789031982422, "global_step": 324702, "epoch": 1932} {"train_loss": -12.074982643127441, "global_step": 324703, "epoch": 1932} {"train_loss": -10.971769332885742, "global_step": 324704, "epoch": 1932} {"train_loss": -11.823512077331543, "global_step": 324705, "epoch": 1932} {"train_loss": -11.23214340209961, "global_step": 324706, "epoch": 1932} {"train_loss": -11.22840690612793, "global_step": 324707, "epoch": 1932} {"train_loss": -10.998300552368164, "global_step": 324708, "epoch": 1932} {"train_loss": -9.926935195922852, "global_step": 324709, "epoch": 1932} {"train_loss": -10.999942779541016, "global_step": 324710, "epoch": 1932} {"train_loss": -11.053565979003906, "global_step": 324711, "epoch": 1932} {"train_loss": -11.663858413696289, "global_step": 324712, "epoch": 1932} {"train_loss": -11.633868217468262, "global_step": 324713, "epoch": 1932} {"train_loss": -11.198143005371094, "global_step": 324714, "epoch": 1932} {"train_loss": -11.226423263549805, "global_step": 324715, "epoch": 1932} {"train_loss": -11.950912475585938, "global_step": 324716, "epoch": 1932} {"train_loss": -11.360563278198242, "global_step": 324717, "epoch": 1932} {"train_loss": -12.37097454071045, "global_step": 324718, "epoch": 1932} {"train_loss": -11.703635215759277, "global_step": 324719, "epoch": 1932} {"train_loss": -11.902811050415039, "global_step": 324720, "epoch": 1932} {"train_loss": -11.95627498626709, "global_step": 324721, "epoch": 1932} {"train_loss": -11.987037658691406, "global_step": 324722, "epoch": 1932} {"train_loss": -12.101991653442383, "global_step": 324723, "epoch": 1932} {"train_loss": -12.165557861328125, "global_step": 324724, "epoch": 1932} {"train_loss": -12.256423950195312, "global_step": 324725, "epoch": 1932} {"train_loss": -12.112374305725098, "global_step": 324726, "epoch": 1932} {"train_loss": -12.230947494506836, "global_step": 324727, "epoch": 1932} {"train_loss": -12.061365127563477, "global_step": 324728, "epoch": 1932} {"train_loss": -12.208311080932617, "global_step": 324729, "epoch": 1932} {"train_loss": -12.177420616149902, "global_step": 324730, "epoch": 1932} {"train_loss": -12.085563659667969, "global_step": 324731, "epoch": 1932} {"train_loss": -11.830869674682617, "global_step": 324732, "epoch": 1932} {"train_loss": -11.904024124145508, "global_step": 324733, "epoch": 1932} {"train_loss": -11.280893325805664, "global_step": 324734, "epoch": 1932} {"train_loss": -11.926246643066406, "global_step": 324735, "epoch": 1932} {"train_loss": -11.750106811523438, "global_step": 324736, "epoch": 1932} {"train_loss": -11.546268463134766, "global_step": 324737, "epoch": 1932} {"train_loss": -12.12313461303711, "global_step": 324738, "epoch": 1932} {"train_loss": -11.649898529052734, "global_step": 324739, "epoch": 1932} {"train_loss": -11.918036460876465, "global_step": 324740, "epoch": 1932} {"train_loss": -12.287307739257812, "global_step": 324741, "epoch": 1932} {"train_loss": -12.030826568603516, "global_step": 324742, "epoch": 1932} {"train_loss": -11.804773790495735, "global_step": 324743, "epoch": 1932, "val_loss": 288321.65625} {"train_loss": -12.060121536254883, "global_step": 324744, "epoch": 1933} {"train_loss": -12.198341369628906, "global_step": 324745, "epoch": 1933} {"train_loss": -11.493144989013672, "global_step": 324746, "epoch": 1933} {"train_loss": -12.102008819580078, "global_step": 324747, "epoch": 1933} {"train_loss": -11.996308326721191, "global_step": 324748, "epoch": 1933} {"train_loss": -11.684046745300293, "global_step": 324749, "epoch": 1933} {"train_loss": -12.098180770874023, "global_step": 324750, "epoch": 1933} {"train_loss": -12.085762023925781, "global_step": 324751, "epoch": 1933} {"train_loss": -11.949963569641113, "global_step": 324752, "epoch": 1933} {"train_loss": -12.30936336517334, "global_step": 324753, "epoch": 1933} {"train_loss": -11.986990928649902, "global_step": 324754, "epoch": 1933} {"train_loss": -12.230883598327637, "global_step": 324755, "epoch": 1933} {"train_loss": -11.920387268066406, "global_step": 324756, "epoch": 1933} {"train_loss": -12.295557022094727, "global_step": 324757, "epoch": 1933} {"train_loss": -12.023200988769531, "global_step": 324758, "epoch": 1933} {"train_loss": -12.196159362792969, "global_step": 324759, "epoch": 1933} {"train_loss": -12.332984924316406, "global_step": 324760, "epoch": 1933} {"train_loss": -11.806173324584961, "global_step": 324761, "epoch": 1933} {"train_loss": -12.188407897949219, "global_step": 324762, "epoch": 1933} {"train_loss": -12.042611122131348, "global_step": 324763, "epoch": 1933} {"train_loss": -12.111783981323242, "global_step": 324764, "epoch": 1933} {"train_loss": -12.099943161010742, "global_step": 324765, "epoch": 1933} {"train_loss": -11.699451446533203, "global_step": 324766, "epoch": 1933} {"train_loss": -12.367022514343262, "global_step": 324767, "epoch": 1933} {"train_loss": -12.246121406555176, "global_step": 324768, "epoch": 1933} {"train_loss": -12.17568588256836, "global_step": 324769, "epoch": 1933} {"train_loss": -11.994226455688477, "global_step": 324770, "epoch": 1933} {"train_loss": -12.156538009643555, "global_step": 324771, "epoch": 1933} {"train_loss": -12.020973205566406, "global_step": 324772, "epoch": 1933} {"train_loss": -12.199382781982422, "global_step": 324773, "epoch": 1933} {"train_loss": -12.009397506713867, "global_step": 324774, "epoch": 1933} {"train_loss": -11.215764999389648, "global_step": 324775, "epoch": 1933} {"train_loss": -12.094413757324219, "global_step": 324776, "epoch": 1933} {"train_loss": -12.003076553344727, "global_step": 324777, "epoch": 1933} {"train_loss": -12.27100658416748, "global_step": 324778, "epoch": 1933} {"train_loss": -12.198526382446289, "global_step": 324779, "epoch": 1933} {"train_loss": -11.99484634399414, "global_step": 324780, "epoch": 1933} {"train_loss": -12.416451454162598, "global_step": 324781, "epoch": 1933} {"train_loss": -12.252811431884766, "global_step": 324782, "epoch": 1933} {"train_loss": -12.33747386932373, "global_step": 324783, "epoch": 1933} {"train_loss": -12.008073806762695, "global_step": 324784, "epoch": 1933} {"train_loss": -12.344422340393066, "global_step": 324785, "epoch": 1933} {"train_loss": -12.009519577026367, "global_step": 324786, "epoch": 1933} {"train_loss": -11.849470138549805, "global_step": 324787, "epoch": 1933} {"train_loss": -12.027345657348633, "global_step": 324788, "epoch": 1933} {"train_loss": -12.41122817993164, "global_step": 324789, "epoch": 1933} {"train_loss": -12.082723617553711, "global_step": 324790, "epoch": 1933} {"train_loss": -11.903189659118652, "global_step": 324791, "epoch": 1933} {"train_loss": -12.217252731323242, "global_step": 324792, "epoch": 1933} {"train_loss": -12.10639762878418, "global_step": 324793, "epoch": 1933} {"train_loss": -12.077667236328125, "global_step": 324794, "epoch": 1933} {"train_loss": -12.499566078186035, "global_step": 324795, "epoch": 1933} {"train_loss": -12.223134994506836, "global_step": 324796, "epoch": 1933} {"train_loss": -12.26891040802002, "global_step": 324797, "epoch": 1933} {"train_loss": -12.091643333435059, "global_step": 324798, "epoch": 1933} {"train_loss": -12.109624862670898, "global_step": 324799, "epoch": 1933} {"train_loss": -12.324440002441406, "global_step": 324800, "epoch": 1933} {"train_loss": -12.051765441894531, "global_step": 324801, "epoch": 1933} {"train_loss": -12.282807350158691, "global_step": 324802, "epoch": 1933} {"train_loss": -11.616531372070312, "global_step": 324803, "epoch": 1933} {"train_loss": -12.075590133666992, "global_step": 324804, "epoch": 1933} {"train_loss": -12.000720977783203, "global_step": 324805, "epoch": 1933} {"train_loss": -11.678102493286133, "global_step": 324806, "epoch": 1933} {"train_loss": -11.867033004760742, "global_step": 324807, "epoch": 1933} {"train_loss": -12.182920455932617, "global_step": 324808, "epoch": 1933} {"train_loss": -12.063812255859375, "global_step": 324809, "epoch": 1933} {"train_loss": -11.985523223876953, "global_step": 324810, "epoch": 1933} {"train_loss": -12.412919998168945, "global_step": 324811, "epoch": 1933} {"train_loss": -12.149069786071777, "global_step": 324812, "epoch": 1933} {"train_loss": -12.058070182800293, "global_step": 324813, "epoch": 1933} {"train_loss": -11.976341247558594, "global_step": 324814, "epoch": 1933} {"train_loss": -12.278059959411621, "global_step": 324815, "epoch": 1933} {"train_loss": -11.815361022949219, "global_step": 324816, "epoch": 1933} {"train_loss": -12.357633590698242, "global_step": 324817, "epoch": 1933} {"train_loss": -12.335866928100586, "global_step": 324818, "epoch": 1933} {"train_loss": -12.265340805053711, "global_step": 324819, "epoch": 1933} {"train_loss": -11.58993148803711, "global_step": 324820, "epoch": 1933} {"train_loss": -12.326845169067383, "global_step": 324821, "epoch": 1933} {"train_loss": -11.679049491882324, "global_step": 324822, "epoch": 1933} {"train_loss": -11.800254821777344, "global_step": 324823, "epoch": 1933} {"train_loss": -11.76998233795166, "global_step": 324824, "epoch": 1933} {"train_loss": -12.121343612670898, "global_step": 324825, "epoch": 1933} {"train_loss": -11.847537994384766, "global_step": 324826, "epoch": 1933} {"train_loss": -11.371188163757324, "global_step": 324827, "epoch": 1933} {"train_loss": -12.300518035888672, "global_step": 324828, "epoch": 1933} {"train_loss": -11.980578422546387, "global_step": 324829, "epoch": 1933} {"train_loss": -12.24761962890625, "global_step": 324830, "epoch": 1933} {"train_loss": -11.629678726196289, "global_step": 324831, "epoch": 1933} {"train_loss": -11.912422180175781, "global_step": 324832, "epoch": 1933} {"train_loss": -12.18425464630127, "global_step": 324833, "epoch": 1933} {"train_loss": -12.148515701293945, "global_step": 324834, "epoch": 1933} {"train_loss": -12.134330749511719, "global_step": 324835, "epoch": 1933} {"train_loss": -12.232019424438477, "global_step": 324836, "epoch": 1933} {"train_loss": -12.273294448852539, "global_step": 324837, "epoch": 1933} {"train_loss": -12.174629211425781, "global_step": 324838, "epoch": 1933} {"train_loss": -12.306951522827148, "global_step": 324839, "epoch": 1933} {"train_loss": -12.362457275390625, "global_step": 324840, "epoch": 1933} {"train_loss": -12.389567375183105, "global_step": 324841, "epoch": 1933} {"train_loss": -12.166613578796387, "global_step": 324842, "epoch": 1933} {"train_loss": -12.511287689208984, "global_step": 324843, "epoch": 1933} {"train_loss": -11.970836639404297, "global_step": 324844, "epoch": 1933} {"train_loss": -12.440423965454102, "global_step": 324845, "epoch": 1933} {"train_loss": -12.080266952514648, "global_step": 324846, "epoch": 1933} {"train_loss": -12.4912109375, "global_step": 324847, "epoch": 1933} {"train_loss": -12.152090072631836, "global_step": 324848, "epoch": 1933} {"train_loss": -12.309892654418945, "global_step": 324849, "epoch": 1933} {"train_loss": -12.04963493347168, "global_step": 324850, "epoch": 1933} {"train_loss": -12.432453155517578, "global_step": 324851, "epoch": 1933} {"train_loss": -12.411608695983887, "global_step": 324852, "epoch": 1933} {"train_loss": -12.007058143615723, "global_step": 324853, "epoch": 1933} {"train_loss": -12.245719909667969, "global_step": 324854, "epoch": 1933} {"train_loss": -12.456442832946777, "global_step": 324855, "epoch": 1933} {"train_loss": -12.476293563842773, "global_step": 324856, "epoch": 1933} {"train_loss": -12.297283172607422, "global_step": 324857, "epoch": 1933} {"train_loss": -12.436185836791992, "global_step": 324858, "epoch": 1933} {"train_loss": -12.47068977355957, "global_step": 324859, "epoch": 1933} {"train_loss": -12.523809432983398, "global_step": 324860, "epoch": 1933} {"train_loss": -12.471332550048828, "global_step": 324861, "epoch": 1933} {"train_loss": -12.5557861328125, "global_step": 324862, "epoch": 1933} {"train_loss": -12.052497863769531, "global_step": 324863, "epoch": 1933} {"train_loss": -12.728231430053711, "global_step": 324864, "epoch": 1933} {"train_loss": -12.082222938537598, "global_step": 324865, "epoch": 1933} {"train_loss": -12.474225044250488, "global_step": 324866, "epoch": 1933} {"train_loss": -12.254801750183105, "global_step": 324867, "epoch": 1933} {"train_loss": -12.489988327026367, "global_step": 324868, "epoch": 1933} {"train_loss": -11.599858283996582, "global_step": 324869, "epoch": 1933} {"train_loss": -12.217304229736328, "global_step": 324870, "epoch": 1933} {"train_loss": -11.707809448242188, "global_step": 324871, "epoch": 1933} {"train_loss": -12.20489501953125, "global_step": 324872, "epoch": 1933} {"train_loss": -11.425691604614258, "global_step": 324873, "epoch": 1933} {"train_loss": -11.891650199890137, "global_step": 324874, "epoch": 1933} {"train_loss": -11.985956192016602, "global_step": 324875, "epoch": 1933} {"train_loss": -10.856535911560059, "global_step": 324876, "epoch": 1933} {"train_loss": -11.283243179321289, "global_step": 324877, "epoch": 1933} {"train_loss": -11.964925765991211, "global_step": 324878, "epoch": 1933} {"train_loss": -8.151212692260742, "global_step": 324879, "epoch": 1933} {"train_loss": -8.854988098144531, "global_step": 324880, "epoch": 1933} {"train_loss": -9.200176239013672, "global_step": 324881, "epoch": 1933} {"train_loss": -11.034734725952148, "global_step": 324882, "epoch": 1933} {"train_loss": -9.846177101135254, "global_step": 324883, "epoch": 1933} {"train_loss": -8.054037094116211, "global_step": 324884, "epoch": 1933} {"train_loss": -7.8387932777404785, "global_step": 324885, "epoch": 1933} {"train_loss": -7.531972885131836, "global_step": 324886, "epoch": 1933} {"train_loss": -8.520922660827637, "global_step": 324887, "epoch": 1933} {"train_loss": -9.070650100708008, "global_step": 324888, "epoch": 1933} {"train_loss": -10.050884246826172, "global_step": 324889, "epoch": 1933} {"train_loss": -9.833688735961914, "global_step": 324890, "epoch": 1933} {"train_loss": -11.116101264953613, "global_step": 324891, "epoch": 1933} {"train_loss": -10.587727546691895, "global_step": 324892, "epoch": 1933} {"train_loss": -11.092548370361328, "global_step": 324893, "epoch": 1933} {"train_loss": -10.515995979309082, "global_step": 324894, "epoch": 1933} {"train_loss": -10.89552116394043, "global_step": 324895, "epoch": 1933} {"train_loss": -10.48924446105957, "global_step": 324896, "epoch": 1933} {"train_loss": -10.53738784790039, "global_step": 324897, "epoch": 1933} {"train_loss": -10.93139362335205, "global_step": 324898, "epoch": 1933} {"train_loss": -10.592982292175293, "global_step": 324899, "epoch": 1933} {"train_loss": -11.260778427124023, "global_step": 324900, "epoch": 1933} {"train_loss": -10.827815055847168, "global_step": 324901, "epoch": 1933} {"train_loss": -11.440570831298828, "global_step": 324902, "epoch": 1933} {"train_loss": -11.523193359375, "global_step": 324903, "epoch": 1933} {"train_loss": -11.539798736572266, "global_step": 324904, "epoch": 1933} {"train_loss": -11.720611572265625, "global_step": 324905, "epoch": 1933} {"train_loss": -11.603226661682129, "global_step": 324906, "epoch": 1933} {"train_loss": -11.462789535522461, "global_step": 324907, "epoch": 1933} {"train_loss": -11.451562881469727, "global_step": 324908, "epoch": 1933} {"train_loss": -10.815028190612793, "global_step": 324909, "epoch": 1933} {"train_loss": -11.896178245544434, "global_step": 324910, "epoch": 1933} {"train_loss": -11.75944508541198, "global_step": 324911, "epoch": 1933, "val_loss": 275980.5625} {"train_loss": -11.627893447875977, "global_step": 324912, "epoch": 1934} {"train_loss": -11.734538078308105, "global_step": 324913, "epoch": 1934} {"train_loss": -11.571101188659668, "global_step": 324914, "epoch": 1934} {"train_loss": -11.646678924560547, "global_step": 324915, "epoch": 1934} {"train_loss": -11.99979019165039, "global_step": 324916, "epoch": 1934} {"train_loss": -11.924480438232422, "global_step": 324917, "epoch": 1934} {"train_loss": -11.598482131958008, "global_step": 324918, "epoch": 1934} {"train_loss": -12.077463150024414, "global_step": 324919, "epoch": 1934} {"train_loss": -12.167747497558594, "global_step": 324920, "epoch": 1934} {"train_loss": -11.990686416625977, "global_step": 324921, "epoch": 1934} {"train_loss": -11.94559097290039, "global_step": 324922, "epoch": 1934} {"train_loss": -12.058510780334473, "global_step": 324923, "epoch": 1934} {"train_loss": -11.858237266540527, "global_step": 324924, "epoch": 1934} {"train_loss": -11.933574676513672, "global_step": 324925, "epoch": 1934} {"train_loss": -11.848688125610352, "global_step": 324926, "epoch": 1934} {"train_loss": -11.89763069152832, "global_step": 324927, "epoch": 1934} {"train_loss": -12.251304626464844, "global_step": 324928, "epoch": 1934} {"train_loss": -11.781566619873047, "global_step": 324929, "epoch": 1934} {"train_loss": -12.205546379089355, "global_step": 324930, "epoch": 1934} {"train_loss": -12.068275451660156, "global_step": 324931, "epoch": 1934} {"train_loss": -11.729057312011719, "global_step": 324932, "epoch": 1934} {"train_loss": -12.357284545898438, "global_step": 324933, "epoch": 1934} {"train_loss": -11.996591567993164, "global_step": 324934, "epoch": 1934} {"train_loss": -12.026354789733887, "global_step": 324935, "epoch": 1934} {"train_loss": -12.251803398132324, "global_step": 324936, "epoch": 1934} {"train_loss": -11.94158935546875, "global_step": 324937, "epoch": 1934} {"train_loss": -12.243000984191895, "global_step": 324938, "epoch": 1934} {"train_loss": -12.203556060791016, "global_step": 324939, "epoch": 1934} {"train_loss": -12.104047775268555, "global_step": 324940, "epoch": 1934} {"train_loss": -12.308328628540039, "global_step": 324941, "epoch": 1934} {"train_loss": -11.596346855163574, "global_step": 324942, "epoch": 1934} {"train_loss": -12.32948112487793, "global_step": 324943, "epoch": 1934} {"train_loss": -12.056851387023926, "global_step": 324944, "epoch": 1934} {"train_loss": -12.026115417480469, "global_step": 324945, "epoch": 1934} {"train_loss": -12.059016227722168, "global_step": 324946, "epoch": 1934} {"train_loss": -11.722264289855957, "global_step": 324947, "epoch": 1934} {"train_loss": -12.210619926452637, "global_step": 324948, "epoch": 1934} {"train_loss": -11.840560913085938, "global_step": 324949, "epoch": 1934} {"train_loss": -11.868494033813477, "global_step": 324950, "epoch": 1934} {"train_loss": -12.059435844421387, "global_step": 324951, "epoch": 1934} {"train_loss": -11.872905731201172, "global_step": 324952, "epoch": 1934} {"train_loss": -11.935189247131348, "global_step": 324953, "epoch": 1934} {"train_loss": -11.99630355834961, "global_step": 324954, "epoch": 1934} {"train_loss": -11.912925720214844, "global_step": 324955, "epoch": 1934} {"train_loss": -12.10984992980957, "global_step": 324956, "epoch": 1934} {"train_loss": -11.668415069580078, "global_step": 324957, "epoch": 1934} {"train_loss": -11.919358253479004, "global_step": 324958, "epoch": 1934} {"train_loss": -11.85412883758545, "global_step": 324959, "epoch": 1934} {"train_loss": -11.531810760498047, "global_step": 324960, "epoch": 1934} {"train_loss": -12.224699020385742, "global_step": 324961, "epoch": 1934} {"train_loss": -11.174177169799805, "global_step": 324962, "epoch": 1934} {"train_loss": -12.086468696594238, "global_step": 324963, "epoch": 1934} {"train_loss": -11.622322082519531, "global_step": 324964, "epoch": 1934} {"train_loss": -12.05006217956543, "global_step": 324965, "epoch": 1934} {"train_loss": -11.599109649658203, "global_step": 324966, "epoch": 1934} {"train_loss": -11.648759841918945, "global_step": 324967, "epoch": 1934} {"train_loss": -11.524738311767578, "global_step": 324968, "epoch": 1934} {"train_loss": -11.973589897155762, "global_step": 324969, "epoch": 1934} {"train_loss": -11.62070083618164, "global_step": 324970, "epoch": 1934} {"train_loss": -12.241786003112793, "global_step": 324971, "epoch": 1934} {"train_loss": -11.895927429199219, "global_step": 324972, "epoch": 1934} {"train_loss": -11.852055549621582, "global_step": 324973, "epoch": 1934} {"train_loss": -11.959949493408203, "global_step": 324974, "epoch": 1934} {"train_loss": -11.317544937133789, "global_step": 324975, "epoch": 1934} {"train_loss": -11.086223602294922, "global_step": 324976, "epoch": 1934} {"train_loss": -11.000935554504395, "global_step": 324977, "epoch": 1934} {"train_loss": -11.182531356811523, "global_step": 324978, "epoch": 1934} {"train_loss": -11.198646545410156, "global_step": 324979, "epoch": 1934} {"train_loss": -11.720678329467773, "global_step": 324980, "epoch": 1934} {"train_loss": -11.906634330749512, "global_step": 324981, "epoch": 1934} {"train_loss": -11.136595726013184, "global_step": 324982, "epoch": 1934} {"train_loss": -11.98495101928711, "global_step": 324983, "epoch": 1934} {"train_loss": -11.475714683532715, "global_step": 324984, "epoch": 1934} {"train_loss": -12.174644470214844, "global_step": 324985, "epoch": 1934} {"train_loss": -11.532598495483398, "global_step": 324986, "epoch": 1934} {"train_loss": -12.129862785339355, "global_step": 324987, "epoch": 1934} {"train_loss": -11.208267211914062, "global_step": 324988, "epoch": 1934} {"train_loss": -11.74563217163086, "global_step": 324989, "epoch": 1934} {"train_loss": -11.448290824890137, "global_step": 324990, "epoch": 1934} {"train_loss": -11.668952941894531, "global_step": 324991, "epoch": 1934} {"train_loss": -11.68412971496582, "global_step": 324992, "epoch": 1934} {"train_loss": -11.299968719482422, "global_step": 324993, "epoch": 1934} {"train_loss": -12.195184707641602, "global_step": 324994, "epoch": 1934} {"train_loss": -11.591194152832031, "global_step": 324995, "epoch": 1934} {"train_loss": -11.752665519714355, "global_step": 324996, "epoch": 1934} {"train_loss": -11.441154479980469, "global_step": 324997, "epoch": 1934} {"train_loss": -11.73595905303955, "global_step": 324998, "epoch": 1934} {"train_loss": -11.62348747253418, "global_step": 324999, "epoch": 1934} {"train_loss": -11.551774024963379, "global_step": 325000, "epoch": 1934} {"train_loss": -12.191211700439453, "global_step": 325001, "epoch": 1934} {"train_loss": -11.311012268066406, "global_step": 325002, "epoch": 1934} {"train_loss": -12.072616577148438, "global_step": 325003, "epoch": 1934} {"train_loss": -11.564053535461426, "global_step": 325004, "epoch": 1934} {"train_loss": -11.81116771697998, "global_step": 325005, "epoch": 1934} {"train_loss": -11.172367095947266, "global_step": 325006, "epoch": 1934} {"train_loss": -11.214313507080078, "global_step": 325007, "epoch": 1934} {"train_loss": -12.321782112121582, "global_step": 325008, "epoch": 1934} {"train_loss": -11.620834350585938, "global_step": 325009, "epoch": 1934} {"train_loss": -12.225656509399414, "global_step": 325010, "epoch": 1934} {"train_loss": -11.77476692199707, "global_step": 325011, "epoch": 1934} {"train_loss": -11.379959106445312, "global_step": 325012, "epoch": 1934} {"train_loss": -12.196224212646484, "global_step": 325013, "epoch": 1934} {"train_loss": -11.767679214477539, "global_step": 325014, "epoch": 1934} {"train_loss": -12.293885231018066, "global_step": 325015, "epoch": 1934} {"train_loss": -11.683822631835938, "global_step": 325016, "epoch": 1934} {"train_loss": -11.756620407104492, "global_step": 325017, "epoch": 1934} {"train_loss": -12.21984577178955, "global_step": 325018, "epoch": 1934} {"train_loss": -12.061418533325195, "global_step": 325019, "epoch": 1934} {"train_loss": -11.734814643859863, "global_step": 325020, "epoch": 1934} {"train_loss": -12.078296661376953, "global_step": 325021, "epoch": 1934} {"train_loss": -11.711788177490234, "global_step": 325022, "epoch": 1934} {"train_loss": -12.032394409179688, "global_step": 325023, "epoch": 1934} {"train_loss": -11.857162475585938, "global_step": 325024, "epoch": 1934} {"train_loss": -11.419260025024414, "global_step": 325025, "epoch": 1934} {"train_loss": -12.248941421508789, "global_step": 325026, "epoch": 1934} {"train_loss": -11.855417251586914, "global_step": 325027, "epoch": 1934} {"train_loss": -12.06576156616211, "global_step": 325028, "epoch": 1934} {"train_loss": -11.997801780700684, "global_step": 325029, "epoch": 1934} {"train_loss": -12.043848037719727, "global_step": 325030, "epoch": 1934} {"train_loss": -12.084245681762695, "global_step": 325031, "epoch": 1934} {"train_loss": -11.840370178222656, "global_step": 325032, "epoch": 1934} {"train_loss": -11.736176490783691, "global_step": 325033, "epoch": 1934} {"train_loss": -12.058897972106934, "global_step": 325034, "epoch": 1934} {"train_loss": -12.124666213989258, "global_step": 325035, "epoch": 1934} {"train_loss": -11.898731231689453, "global_step": 325036, "epoch": 1934} {"train_loss": -12.326584815979004, "global_step": 325037, "epoch": 1934} {"train_loss": -11.958340644836426, "global_step": 325038, "epoch": 1934} {"train_loss": -12.401745796203613, "global_step": 325039, "epoch": 1934} {"train_loss": -11.811624526977539, "global_step": 325040, "epoch": 1934} {"train_loss": -12.428178787231445, "global_step": 325041, "epoch": 1934} {"train_loss": -12.09581184387207, "global_step": 325042, "epoch": 1934} {"train_loss": -12.143814086914062, "global_step": 325043, "epoch": 1934} {"train_loss": -12.362548828125, "global_step": 325044, "epoch": 1934} {"train_loss": -12.040605545043945, "global_step": 325045, "epoch": 1934} {"train_loss": -12.25905704498291, "global_step": 325046, "epoch": 1934} {"train_loss": -11.823795318603516, "global_step": 325047, "epoch": 1934} {"train_loss": -11.94668960571289, "global_step": 325048, "epoch": 1934} {"train_loss": -12.113235473632812, "global_step": 325049, "epoch": 1934} {"train_loss": -11.753852844238281, "global_step": 325050, "epoch": 1934} {"train_loss": -11.868732452392578, "global_step": 325051, "epoch": 1934} {"train_loss": -11.83237075805664, "global_step": 325052, "epoch": 1934} {"train_loss": -12.30959415435791, "global_step": 325053, "epoch": 1934} {"train_loss": -11.832645416259766, "global_step": 325054, "epoch": 1934} {"train_loss": -12.225231170654297, "global_step": 325055, "epoch": 1934} {"train_loss": -12.266871452331543, "global_step": 325056, "epoch": 1934} {"train_loss": -11.252105712890625, "global_step": 325057, "epoch": 1934} {"train_loss": -12.234325408935547, "global_step": 325058, "epoch": 1934} {"train_loss": -11.171989440917969, "global_step": 325059, "epoch": 1934} {"train_loss": -11.788856506347656, "global_step": 325060, "epoch": 1934} {"train_loss": -11.877813339233398, "global_step": 325061, "epoch": 1934} {"train_loss": -10.262779235839844, "global_step": 325062, "epoch": 1934} {"train_loss": -12.066295623779297, "global_step": 325063, "epoch": 1934} {"train_loss": -10.572284698486328, "global_step": 325064, "epoch": 1934} {"train_loss": -11.925378799438477, "global_step": 325065, "epoch": 1934} {"train_loss": -10.419122695922852, "global_step": 325066, "epoch": 1934} {"train_loss": -11.163107872009277, "global_step": 325067, "epoch": 1934} {"train_loss": -11.664928436279297, "global_step": 325068, "epoch": 1934} {"train_loss": -11.054051399230957, "global_step": 325069, "epoch": 1934} {"train_loss": -11.884845733642578, "global_step": 325070, "epoch": 1934} {"train_loss": -11.42729377746582, "global_step": 325071, "epoch": 1934} {"train_loss": -11.42867374420166, "global_step": 325072, "epoch": 1934} {"train_loss": -11.261711120605469, "global_step": 325073, "epoch": 1934} {"train_loss": -11.061185836791992, "global_step": 325074, "epoch": 1934} {"train_loss": -11.644352912902832, "global_step": 325075, "epoch": 1934} {"train_loss": -11.41695785522461, "global_step": 325076, "epoch": 1934} {"train_loss": -11.60448169708252, "global_step": 325077, "epoch": 1934} {"train_loss": -11.558257102966309, "global_step": 325078, "epoch": 1934} {"train_loss": -11.807524726504372, "global_step": 325079, "epoch": 1934, "val_loss": 284912.40625} {"train_loss": -11.566452026367188, "global_step": 325080, "epoch": 1935} {"train_loss": -11.605037689208984, "global_step": 325081, "epoch": 1935} {"train_loss": -11.665842056274414, "global_step": 325082, "epoch": 1935} {"train_loss": -11.72152042388916, "global_step": 325083, "epoch": 1935} {"train_loss": -11.58395767211914, "global_step": 325084, "epoch": 1935} {"train_loss": -11.75039291381836, "global_step": 325085, "epoch": 1935} {"train_loss": -11.740861892700195, "global_step": 325086, "epoch": 1935} {"train_loss": -11.229816436767578, "global_step": 325087, "epoch": 1935} {"train_loss": -11.71617317199707, "global_step": 325088, "epoch": 1935} {"train_loss": -11.527924537658691, "global_step": 325089, "epoch": 1935} {"train_loss": -12.00603199005127, "global_step": 325090, "epoch": 1935} {"train_loss": -11.668234825134277, "global_step": 325091, "epoch": 1935} {"train_loss": -11.603052139282227, "global_step": 325092, "epoch": 1935} {"train_loss": -11.774799346923828, "global_step": 325093, "epoch": 1935} {"train_loss": -11.830622673034668, "global_step": 325094, "epoch": 1935} {"train_loss": -12.1255464553833, "global_step": 325095, "epoch": 1935} {"train_loss": -11.833717346191406, "global_step": 325096, "epoch": 1935} {"train_loss": -11.69283390045166, "global_step": 325097, "epoch": 1935} {"train_loss": -11.52128791809082, "global_step": 325098, "epoch": 1935} {"train_loss": -11.971753120422363, "global_step": 325099, "epoch": 1935} {"train_loss": -11.445534706115723, "global_step": 325100, "epoch": 1935} {"train_loss": -11.980424880981445, "global_step": 325101, "epoch": 1935} {"train_loss": -11.302886962890625, "global_step": 325102, "epoch": 1935} {"train_loss": -11.846288681030273, "global_step": 325103, "epoch": 1935} {"train_loss": -11.873296737670898, "global_step": 325104, "epoch": 1935} {"train_loss": -10.906230926513672, "global_step": 325105, "epoch": 1935} {"train_loss": -11.982036590576172, "global_step": 325106, "epoch": 1935} {"train_loss": -11.684747695922852, "global_step": 325107, "epoch": 1935} {"train_loss": -12.133906364440918, "global_step": 325108, "epoch": 1935} {"train_loss": -11.9083890914917, "global_step": 325109, "epoch": 1935} {"train_loss": -11.58609676361084, "global_step": 325110, "epoch": 1935} {"train_loss": -12.149203300476074, "global_step": 325111, "epoch": 1935} {"train_loss": -11.568426132202148, "global_step": 325112, "epoch": 1935} {"train_loss": -12.16598892211914, "global_step": 325113, "epoch": 1935} {"train_loss": -11.373126983642578, "global_step": 325114, "epoch": 1935} {"train_loss": -12.161727905273438, "global_step": 325115, "epoch": 1935} {"train_loss": -12.096348762512207, "global_step": 325116, "epoch": 1935} {"train_loss": -11.880577087402344, "global_step": 325117, "epoch": 1935} {"train_loss": -12.1473388671875, "global_step": 325118, "epoch": 1935} {"train_loss": -11.91732406616211, "global_step": 325119, "epoch": 1935} {"train_loss": -12.117759704589844, "global_step": 325120, "epoch": 1935} {"train_loss": -11.891685485839844, "global_step": 325121, "epoch": 1935} {"train_loss": -12.211355209350586, "global_step": 325122, "epoch": 1935} {"train_loss": -12.200531005859375, "global_step": 325123, "epoch": 1935} {"train_loss": -12.165971755981445, "global_step": 325124, "epoch": 1935} {"train_loss": -11.826966285705566, "global_step": 325125, "epoch": 1935} {"train_loss": -12.343716621398926, "global_step": 325126, "epoch": 1935} {"train_loss": -12.065469741821289, "global_step": 325127, "epoch": 1935} {"train_loss": -11.995131492614746, "global_step": 325128, "epoch": 1935} {"train_loss": -12.42910385131836, "global_step": 325129, "epoch": 1935} {"train_loss": -12.023882865905762, "global_step": 325130, "epoch": 1935} {"train_loss": -11.980291366577148, "global_step": 325131, "epoch": 1935} {"train_loss": -11.65316390991211, "global_step": 325132, "epoch": 1935} {"train_loss": -12.210845947265625, "global_step": 325133, "epoch": 1935} {"train_loss": -11.962312698364258, "global_step": 325134, "epoch": 1935} {"train_loss": -11.773181915283203, "global_step": 325135, "epoch": 1935} {"train_loss": -12.29271411895752, "global_step": 325136, "epoch": 1935} {"train_loss": -12.077585220336914, "global_step": 325137, "epoch": 1935} {"train_loss": -12.328288078308105, "global_step": 325138, "epoch": 1935} {"train_loss": -12.191028594970703, "global_step": 325139, "epoch": 1935} {"train_loss": -12.274710655212402, "global_step": 325140, "epoch": 1935} {"train_loss": -12.135229110717773, "global_step": 325141, "epoch": 1935} {"train_loss": -12.265643119812012, "global_step": 325142, "epoch": 1935} {"train_loss": -12.450708389282227, "global_step": 325143, "epoch": 1935} {"train_loss": -12.215410232543945, "global_step": 325144, "epoch": 1935} {"train_loss": -12.336278915405273, "global_step": 325145, "epoch": 1935} {"train_loss": -12.427501678466797, "global_step": 325146, "epoch": 1935} {"train_loss": -12.517256736755371, "global_step": 325147, "epoch": 1935} {"train_loss": -12.155555725097656, "global_step": 325148, "epoch": 1935} {"train_loss": -12.43471908569336, "global_step": 325149, "epoch": 1935} {"train_loss": -12.15807819366455, "global_step": 325150, "epoch": 1935} {"train_loss": -12.40300178527832, "global_step": 325151, "epoch": 1935} {"train_loss": -12.248645782470703, "global_step": 325152, "epoch": 1935} {"train_loss": -12.408113479614258, "global_step": 325153, "epoch": 1935} {"train_loss": -12.558614730834961, "global_step": 325154, "epoch": 1935} {"train_loss": -12.20496940612793, "global_step": 325155, "epoch": 1935} {"train_loss": -12.546951293945312, "global_step": 325156, "epoch": 1935} {"train_loss": -12.445756912231445, "global_step": 325157, "epoch": 1935} {"train_loss": -12.326254844665527, "global_step": 325158, "epoch": 1935} {"train_loss": -12.412199020385742, "global_step": 325159, "epoch": 1935} {"train_loss": -12.433774948120117, "global_step": 325160, "epoch": 1935} {"train_loss": -12.555757522583008, "global_step": 325161, "epoch": 1935} {"train_loss": -12.559968948364258, "global_step": 325162, "epoch": 1935} {"train_loss": -12.131292343139648, "global_step": 325163, "epoch": 1935} {"train_loss": -12.545940399169922, "global_step": 325164, "epoch": 1935} {"train_loss": -12.136177062988281, "global_step": 325165, "epoch": 1935} {"train_loss": -12.368959426879883, "global_step": 325166, "epoch": 1935} {"train_loss": -12.637643814086914, "global_step": 325167, "epoch": 1935} {"train_loss": -12.516990661621094, "global_step": 325168, "epoch": 1935} {"train_loss": -12.477279663085938, "global_step": 325169, "epoch": 1935} {"train_loss": -12.485306739807129, "global_step": 325170, "epoch": 1935} {"train_loss": -12.539786338806152, "global_step": 325171, "epoch": 1935} {"train_loss": -12.408065795898438, "global_step": 325172, "epoch": 1935} {"train_loss": -12.41230583190918, "global_step": 325173, "epoch": 1935} {"train_loss": -12.336397171020508, "global_step": 325174, "epoch": 1935} {"train_loss": -12.740464210510254, "global_step": 325175, "epoch": 1935} {"train_loss": -12.578791618347168, "global_step": 325176, "epoch": 1935} {"train_loss": -12.738460540771484, "global_step": 325177, "epoch": 1935} {"train_loss": -12.737421035766602, "global_step": 325178, "epoch": 1935} {"train_loss": -12.573923110961914, "global_step": 325179, "epoch": 1935} {"train_loss": -12.750604629516602, "global_step": 325180, "epoch": 1935} {"train_loss": -12.647163391113281, "global_step": 325181, "epoch": 1935} {"train_loss": -12.501718521118164, "global_step": 325182, "epoch": 1935} {"train_loss": -12.566826820373535, "global_step": 325183, "epoch": 1935} {"train_loss": -12.733884811401367, "global_step": 325184, "epoch": 1935} {"train_loss": -12.537933349609375, "global_step": 325185, "epoch": 1935} {"train_loss": -12.674524307250977, "global_step": 325186, "epoch": 1935} {"train_loss": -12.762771606445312, "global_step": 325187, "epoch": 1935} {"train_loss": -12.740297317504883, "global_step": 325188, "epoch": 1935} {"train_loss": -12.522682189941406, "global_step": 325189, "epoch": 1935} {"train_loss": -12.311441421508789, "global_step": 325190, "epoch": 1935} {"train_loss": -12.440288543701172, "global_step": 325191, "epoch": 1935} {"train_loss": -12.454158782958984, "global_step": 325192, "epoch": 1935} {"train_loss": -12.575803756713867, "global_step": 325193, "epoch": 1935} {"train_loss": -12.28653335571289, "global_step": 325194, "epoch": 1935} {"train_loss": -11.880998611450195, "global_step": 325195, "epoch": 1935} {"train_loss": -11.758506774902344, "global_step": 325196, "epoch": 1935} {"train_loss": -11.408086776733398, "global_step": 325197, "epoch": 1935} {"train_loss": -11.209644317626953, "global_step": 325198, "epoch": 1935} {"train_loss": -11.235466957092285, "global_step": 325199, "epoch": 1935} {"train_loss": -11.794249534606934, "global_step": 325200, "epoch": 1935} {"train_loss": -11.78672981262207, "global_step": 325201, "epoch": 1935} {"train_loss": -10.149486541748047, "global_step": 325202, "epoch": 1935} {"train_loss": -8.357848167419434, "global_step": 325203, "epoch": 1935} {"train_loss": -8.52863597869873, "global_step": 325204, "epoch": 1935} {"train_loss": -8.40781021118164, "global_step": 325205, "epoch": 1935} {"train_loss": -9.818689346313477, "global_step": 325206, "epoch": 1935} {"train_loss": -10.044034004211426, "global_step": 325207, "epoch": 1935} {"train_loss": -9.111175537109375, "global_step": 325208, "epoch": 1935} {"train_loss": -9.329423904418945, "global_step": 325209, "epoch": 1935} {"train_loss": -10.771219253540039, "global_step": 325210, "epoch": 1935} {"train_loss": -9.704684257507324, "global_step": 325211, "epoch": 1935} {"train_loss": -9.99490737915039, "global_step": 325212, "epoch": 1935} {"train_loss": -11.771617889404297, "global_step": 325213, "epoch": 1935} {"train_loss": -10.499340057373047, "global_step": 325214, "epoch": 1935} {"train_loss": -10.430736541748047, "global_step": 325215, "epoch": 1935} {"train_loss": -10.829511642456055, "global_step": 325216, "epoch": 1935} {"train_loss": -11.405941009521484, "global_step": 325217, "epoch": 1935} {"train_loss": -11.29307746887207, "global_step": 325218, "epoch": 1935} {"train_loss": -11.692729949951172, "global_step": 325219, "epoch": 1935} {"train_loss": -11.061717987060547, "global_step": 325220, "epoch": 1935} {"train_loss": -10.985050201416016, "global_step": 325221, "epoch": 1935} {"train_loss": -11.751023292541504, "global_step": 325222, "epoch": 1935} {"train_loss": -11.842729568481445, "global_step": 325223, "epoch": 1935} {"train_loss": -11.049270629882812, "global_step": 325224, "epoch": 1935} {"train_loss": -11.390022277832031, "global_step": 325225, "epoch": 1935} {"train_loss": -11.709346771240234, "global_step": 325226, "epoch": 1935} {"train_loss": -11.46729564666748, "global_step": 325227, "epoch": 1935} {"train_loss": -11.476747512817383, "global_step": 325228, "epoch": 1935} {"train_loss": -11.777366638183594, "global_step": 325229, "epoch": 1935} {"train_loss": -11.559286117553711, "global_step": 325230, "epoch": 1935} {"train_loss": -12.31916618347168, "global_step": 325231, "epoch": 1935} {"train_loss": -11.452790260314941, "global_step": 325232, "epoch": 1935} {"train_loss": -12.097709655761719, "global_step": 325233, "epoch": 1935} {"train_loss": -11.538426399230957, "global_step": 325234, "epoch": 1935} {"train_loss": -11.567669868469238, "global_step": 325235, "epoch": 1935} {"train_loss": -11.996112823486328, "global_step": 325236, "epoch": 1935} {"train_loss": -11.530021667480469, "global_step": 325237, "epoch": 1935} {"train_loss": -11.409171104431152, "global_step": 325238, "epoch": 1935} {"train_loss": -12.12684440612793, "global_step": 325239, "epoch": 1935} {"train_loss": -11.741905212402344, "global_step": 325240, "epoch": 1935} {"train_loss": -11.950421333312988, "global_step": 325241, "epoch": 1935} {"train_loss": -11.855634689331055, "global_step": 325242, "epoch": 1935} {"train_loss": -11.840597152709961, "global_step": 325243, "epoch": 1935} {"train_loss": -11.72429370880127, "global_step": 325244, "epoch": 1935} {"train_loss": -11.768472671508789, "global_step": 325245, "epoch": 1935} {"train_loss": -12.029020309448242, "global_step": 325246, "epoch": 1935} {"train_loss": -11.828949150584993, "global_step": 325247, "epoch": 1935, "val_loss": 284455.4375, "train_action_mse_error": 4.858470916748047} {"train_loss": -11.9315767288208, "global_step": 325248, "epoch": 1936} {"train_loss": -11.686532974243164, "global_step": 325249, "epoch": 1936} {"train_loss": -11.889850616455078, "global_step": 325250, "epoch": 1936} {"train_loss": -11.697021484375, "global_step": 325251, "epoch": 1936} {"train_loss": -11.875961303710938, "global_step": 325252, "epoch": 1936} {"train_loss": -12.083049774169922, "global_step": 325253, "epoch": 1936} {"train_loss": -11.89454174041748, "global_step": 325254, "epoch": 1936} {"train_loss": -11.799819946289062, "global_step": 325255, "epoch": 1936} {"train_loss": -11.494609832763672, "global_step": 325256, "epoch": 1936} {"train_loss": -11.970266342163086, "global_step": 325257, "epoch": 1936} {"train_loss": -11.984148025512695, "global_step": 325258, "epoch": 1936} {"train_loss": -11.81814193725586, "global_step": 325259, "epoch": 1936} {"train_loss": -11.56152057647705, "global_step": 325260, "epoch": 1936} {"train_loss": -11.537165641784668, "global_step": 325261, "epoch": 1936} {"train_loss": -11.346391677856445, "global_step": 325262, "epoch": 1936} {"train_loss": -11.130977630615234, "global_step": 325263, "epoch": 1936} {"train_loss": -11.61330795288086, "global_step": 325264, "epoch": 1936} {"train_loss": -12.039299011230469, "global_step": 325265, "epoch": 1936} {"train_loss": -11.90515422821045, "global_step": 325266, "epoch": 1936} {"train_loss": -11.886028289794922, "global_step": 325267, "epoch": 1936} {"train_loss": -11.764248847961426, "global_step": 325268, "epoch": 1936} {"train_loss": -11.96302604675293, "global_step": 325269, "epoch": 1936} {"train_loss": -12.174650192260742, "global_step": 325270, "epoch": 1936} {"train_loss": -11.57717227935791, "global_step": 325271, "epoch": 1936} {"train_loss": -12.126956939697266, "global_step": 325272, "epoch": 1936} {"train_loss": -11.96004867553711, "global_step": 325273, "epoch": 1936} {"train_loss": -11.964859962463379, "global_step": 325274, "epoch": 1936} {"train_loss": -12.317919731140137, "global_step": 325275, "epoch": 1936} {"train_loss": -11.918084144592285, "global_step": 325276, "epoch": 1936} {"train_loss": -12.006721496582031, "global_step": 325277, "epoch": 1936} {"train_loss": -12.057440757751465, "global_step": 325278, "epoch": 1936} {"train_loss": -11.985345840454102, "global_step": 325279, "epoch": 1936} {"train_loss": -12.171133041381836, "global_step": 325280, "epoch": 1936} {"train_loss": -11.791351318359375, "global_step": 325281, "epoch": 1936} {"train_loss": -11.453557968139648, "global_step": 325282, "epoch": 1936} {"train_loss": -11.973219871520996, "global_step": 325283, "epoch": 1936} {"train_loss": -11.34539794921875, "global_step": 325284, "epoch": 1936} {"train_loss": -11.691764831542969, "global_step": 325285, "epoch": 1936} {"train_loss": -11.63020133972168, "global_step": 325286, "epoch": 1936} {"train_loss": -11.776586532592773, "global_step": 325287, "epoch": 1936} {"train_loss": -11.759628295898438, "global_step": 325288, "epoch": 1936} {"train_loss": -11.635976791381836, "global_step": 325289, "epoch": 1936} {"train_loss": -12.163110733032227, "global_step": 325290, "epoch": 1936} {"train_loss": -11.312643051147461, "global_step": 325291, "epoch": 1936} {"train_loss": -11.73017692565918, "global_step": 325292, "epoch": 1936} {"train_loss": -11.409797668457031, "global_step": 325293, "epoch": 1936} {"train_loss": -12.054586410522461, "global_step": 325294, "epoch": 1936} {"train_loss": -11.419239044189453, "global_step": 325295, "epoch": 1936} {"train_loss": -11.96412181854248, "global_step": 325296, "epoch": 1936} {"train_loss": -11.135221481323242, "global_step": 325297, "epoch": 1936} {"train_loss": -12.278947830200195, "global_step": 325298, "epoch": 1936} {"train_loss": -11.892670631408691, "global_step": 325299, "epoch": 1936} {"train_loss": -12.04977798461914, "global_step": 325300, "epoch": 1936} {"train_loss": -11.977721214294434, "global_step": 325301, "epoch": 1936} {"train_loss": -11.775996208190918, "global_step": 325302, "epoch": 1936} {"train_loss": -12.088287353515625, "global_step": 325303, "epoch": 1936} {"train_loss": -11.704763412475586, "global_step": 325304, "epoch": 1936} {"train_loss": -11.746028900146484, "global_step": 325305, "epoch": 1936} {"train_loss": -11.84097671508789, "global_step": 325306, "epoch": 1936} {"train_loss": -12.10059642791748, "global_step": 325307, "epoch": 1936} {"train_loss": -12.142765998840332, "global_step": 325308, "epoch": 1936} {"train_loss": -12.020675659179688, "global_step": 325309, "epoch": 1936} {"train_loss": -12.057045936584473, "global_step": 325310, "epoch": 1936} {"train_loss": -12.11246109008789, "global_step": 325311, "epoch": 1936} {"train_loss": -11.881386756896973, "global_step": 325312, "epoch": 1936} {"train_loss": -12.261336326599121, "global_step": 325313, "epoch": 1936} {"train_loss": -11.468664169311523, "global_step": 325314, "epoch": 1936} {"train_loss": -11.931692123413086, "global_step": 325315, "epoch": 1936} {"train_loss": -12.140859603881836, "global_step": 325316, "epoch": 1936} {"train_loss": -11.888211250305176, "global_step": 325317, "epoch": 1936} {"train_loss": -11.996070861816406, "global_step": 325318, "epoch": 1936} {"train_loss": -12.094034194946289, "global_step": 325319, "epoch": 1936} {"train_loss": -11.990687370300293, "global_step": 325320, "epoch": 1936} {"train_loss": -11.767398834228516, "global_step": 325321, "epoch": 1936} {"train_loss": -12.329365730285645, "global_step": 325322, "epoch": 1936} {"train_loss": -11.958117485046387, "global_step": 325323, "epoch": 1936} {"train_loss": -12.127291679382324, "global_step": 325324, "epoch": 1936} {"train_loss": -12.24487590789795, "global_step": 325325, "epoch": 1936} {"train_loss": -12.26612377166748, "global_step": 325326, "epoch": 1936} {"train_loss": -12.147832870483398, "global_step": 325327, "epoch": 1936} {"train_loss": -12.170581817626953, "global_step": 325328, "epoch": 1936} {"train_loss": -11.879627227783203, "global_step": 325329, "epoch": 1936} {"train_loss": -12.065460205078125, "global_step": 325330, "epoch": 1936} {"train_loss": -12.175454139709473, "global_step": 325331, "epoch": 1936} {"train_loss": -11.507854461669922, "global_step": 325332, "epoch": 1936} {"train_loss": -11.567184448242188, "global_step": 325333, "epoch": 1936} {"train_loss": -12.497264862060547, "global_step": 325334, "epoch": 1936} {"train_loss": -11.94064712524414, "global_step": 325335, "epoch": 1936} {"train_loss": -11.794537544250488, "global_step": 325336, "epoch": 1936} {"train_loss": -12.357627868652344, "global_step": 325337, "epoch": 1936} {"train_loss": -11.672233581542969, "global_step": 325338, "epoch": 1936} {"train_loss": -12.263355255126953, "global_step": 325339, "epoch": 1936} {"train_loss": -11.722951889038086, "global_step": 325340, "epoch": 1936} {"train_loss": -12.272333145141602, "global_step": 325341, "epoch": 1936} {"train_loss": -12.089717864990234, "global_step": 325342, "epoch": 1936} {"train_loss": -12.16204833984375, "global_step": 325343, "epoch": 1936} {"train_loss": -12.009559631347656, "global_step": 325344, "epoch": 1936} {"train_loss": -12.49103832244873, "global_step": 325345, "epoch": 1936} {"train_loss": -12.236169815063477, "global_step": 325346, "epoch": 1936} {"train_loss": -12.047407150268555, "global_step": 325347, "epoch": 1936} {"train_loss": -12.458061218261719, "global_step": 325348, "epoch": 1936} {"train_loss": -12.13336181640625, "global_step": 325349, "epoch": 1936} {"train_loss": -12.439984321594238, "global_step": 325350, "epoch": 1936} {"train_loss": -12.281633377075195, "global_step": 325351, "epoch": 1936} {"train_loss": -12.399724960327148, "global_step": 325352, "epoch": 1936} {"train_loss": -12.088781356811523, "global_step": 325353, "epoch": 1936} {"train_loss": -12.30842399597168, "global_step": 325354, "epoch": 1936} {"train_loss": -12.305830001831055, "global_step": 325355, "epoch": 1936} {"train_loss": -12.016279220581055, "global_step": 325356, "epoch": 1936} {"train_loss": -12.029869079589844, "global_step": 325357, "epoch": 1936} {"train_loss": -12.488387107849121, "global_step": 325358, "epoch": 1936} {"train_loss": -11.997373580932617, "global_step": 325359, "epoch": 1936} {"train_loss": -12.23284912109375, "global_step": 325360, "epoch": 1936} {"train_loss": -12.041894912719727, "global_step": 325361, "epoch": 1936} {"train_loss": -11.756868362426758, "global_step": 325362, "epoch": 1936} {"train_loss": -10.94594955444336, "global_step": 325363, "epoch": 1936} {"train_loss": -11.226797103881836, "global_step": 325364, "epoch": 1936} {"train_loss": -10.97681713104248, "global_step": 325365, "epoch": 1936} {"train_loss": -11.671960830688477, "global_step": 325366, "epoch": 1936} {"train_loss": -11.559377670288086, "global_step": 325367, "epoch": 1936} {"train_loss": -10.93149471282959, "global_step": 325368, "epoch": 1936} {"train_loss": -11.129035949707031, "global_step": 325369, "epoch": 1936} {"train_loss": -8.443428993225098, "global_step": 325370, "epoch": 1936} {"train_loss": -8.55612564086914, "global_step": 325371, "epoch": 1936} {"train_loss": -9.37147331237793, "global_step": 325372, "epoch": 1936} {"train_loss": -10.861939430236816, "global_step": 325373, "epoch": 1936} {"train_loss": -9.992353439331055, "global_step": 325374, "epoch": 1936} {"train_loss": -10.507837295532227, "global_step": 325375, "epoch": 1936} {"train_loss": -10.615819931030273, "global_step": 325376, "epoch": 1936} {"train_loss": -10.038825035095215, "global_step": 325377, "epoch": 1936} {"train_loss": -11.369815826416016, "global_step": 325378, "epoch": 1936} {"train_loss": -10.618170738220215, "global_step": 325379, "epoch": 1936} {"train_loss": -11.726335525512695, "global_step": 325380, "epoch": 1936} {"train_loss": -10.79296588897705, "global_step": 325381, "epoch": 1936} {"train_loss": -11.699195861816406, "global_step": 325382, "epoch": 1936} {"train_loss": -10.514320373535156, "global_step": 325383, "epoch": 1936} {"train_loss": -10.717409133911133, "global_step": 325384, "epoch": 1936} {"train_loss": -10.893383026123047, "global_step": 325385, "epoch": 1936} {"train_loss": -11.13204574584961, "global_step": 325386, "epoch": 1936} {"train_loss": -10.422258377075195, "global_step": 325387, "epoch": 1936} {"train_loss": -12.030391693115234, "global_step": 325388, "epoch": 1936} {"train_loss": -10.4375581741333, "global_step": 325389, "epoch": 1936} {"train_loss": -11.987542152404785, "global_step": 325390, "epoch": 1936} {"train_loss": -10.290563583374023, "global_step": 325391, "epoch": 1936} {"train_loss": -11.508493423461914, "global_step": 325392, "epoch": 1936} {"train_loss": -10.545393943786621, "global_step": 325393, "epoch": 1936} {"train_loss": -11.296981811523438, "global_step": 325394, "epoch": 1936} {"train_loss": -10.767925262451172, "global_step": 325395, "epoch": 1936} {"train_loss": -10.82211685180664, "global_step": 325396, "epoch": 1936} {"train_loss": -10.592723846435547, "global_step": 325397, "epoch": 1936} {"train_loss": -11.057462692260742, "global_step": 325398, "epoch": 1936} {"train_loss": -11.118968963623047, "global_step": 325399, "epoch": 1936} {"train_loss": -10.524394035339355, "global_step": 325400, "epoch": 1936} {"train_loss": -11.783437728881836, "global_step": 325401, "epoch": 1936} {"train_loss": -11.186836242675781, "global_step": 325402, "epoch": 1936} {"train_loss": -11.922809600830078, "global_step": 325403, "epoch": 1936} {"train_loss": -11.708027839660645, "global_step": 325404, "epoch": 1936} {"train_loss": -11.827768325805664, "global_step": 325405, "epoch": 1936} {"train_loss": -11.336589813232422, "global_step": 325406, "epoch": 1936} {"train_loss": -11.797649383544922, "global_step": 325407, "epoch": 1936} {"train_loss": -11.485210418701172, "global_step": 325408, "epoch": 1936} {"train_loss": -11.982802391052246, "global_step": 325409, "epoch": 1936} {"train_loss": -11.752093315124512, "global_step": 325410, "epoch": 1936} {"train_loss": -11.929972648620605, "global_step": 325411, "epoch": 1936} {"train_loss": -11.856063842773438, "global_step": 325412, "epoch": 1936} {"train_loss": -11.62612533569336, "global_step": 325413, "epoch": 1936} {"train_loss": -11.663151741027832, "global_step": 325414, "epoch": 1936} {"train_loss": -11.66115557012104, "global_step": 325415, "epoch": 1936, "val_loss": 289386.0625} {"train_loss": -12.021463394165039, "global_step": 325416, "epoch": 1937} {"train_loss": -11.843944549560547, "global_step": 325417, "epoch": 1937} {"train_loss": -11.967561721801758, "global_step": 325418, "epoch": 1937} {"train_loss": -11.962295532226562, "global_step": 325419, "epoch": 1937} {"train_loss": -12.076406478881836, "global_step": 325420, "epoch": 1937} {"train_loss": -11.945640563964844, "global_step": 325421, "epoch": 1937} {"train_loss": -12.010516166687012, "global_step": 325422, "epoch": 1937} {"train_loss": -11.960988998413086, "global_step": 325423, "epoch": 1937} {"train_loss": -11.99761962890625, "global_step": 325424, "epoch": 1937} {"train_loss": -12.003472328186035, "global_step": 325425, "epoch": 1937} {"train_loss": -11.904029846191406, "global_step": 325426, "epoch": 1937} {"train_loss": -12.27340316772461, "global_step": 325427, "epoch": 1937} {"train_loss": -11.918389320373535, "global_step": 325428, "epoch": 1937} {"train_loss": -12.077256202697754, "global_step": 325429, "epoch": 1937} {"train_loss": -12.275290489196777, "global_step": 325430, "epoch": 1937} {"train_loss": -11.622819900512695, "global_step": 325431, "epoch": 1937} {"train_loss": -11.440853118896484, "global_step": 325432, "epoch": 1937} {"train_loss": -11.7462739944458, "global_step": 325433, "epoch": 1937} {"train_loss": -11.977607727050781, "global_step": 325434, "epoch": 1937} {"train_loss": -12.118368148803711, "global_step": 325435, "epoch": 1937} {"train_loss": -11.941481590270996, "global_step": 325436, "epoch": 1937} {"train_loss": -12.149463653564453, "global_step": 325437, "epoch": 1937} {"train_loss": -11.588441848754883, "global_step": 325438, "epoch": 1937} {"train_loss": -12.035942077636719, "global_step": 325439, "epoch": 1937} {"train_loss": -12.133353233337402, "global_step": 325440, "epoch": 1937} {"train_loss": -12.127326965332031, "global_step": 325441, "epoch": 1937} {"train_loss": -11.712727546691895, "global_step": 325442, "epoch": 1937} {"train_loss": -12.203028678894043, "global_step": 325443, "epoch": 1937} {"train_loss": -11.928167343139648, "global_step": 325444, "epoch": 1937} {"train_loss": -12.043891906738281, "global_step": 325445, "epoch": 1937} {"train_loss": -12.188569068908691, "global_step": 325446, "epoch": 1937} {"train_loss": -12.017043113708496, "global_step": 325447, "epoch": 1937} {"train_loss": -12.281627655029297, "global_step": 325448, "epoch": 1937} {"train_loss": -11.82647705078125, "global_step": 325449, "epoch": 1937} {"train_loss": -12.266369819641113, "global_step": 325450, "epoch": 1937} {"train_loss": -12.343806266784668, "global_step": 325451, "epoch": 1937} {"train_loss": -12.15742015838623, "global_step": 325452, "epoch": 1937} {"train_loss": -12.214425086975098, "global_step": 325453, "epoch": 1937} {"train_loss": -11.97287368774414, "global_step": 325454, "epoch": 1937} {"train_loss": -12.035614013671875, "global_step": 325455, "epoch": 1937} {"train_loss": -12.282264709472656, "global_step": 325456, "epoch": 1937} {"train_loss": -12.228239059448242, "global_step": 325457, "epoch": 1937} {"train_loss": -12.304216384887695, "global_step": 325458, "epoch": 1937} {"train_loss": -12.202311515808105, "global_step": 325459, "epoch": 1937} {"train_loss": -12.363021850585938, "global_step": 325460, "epoch": 1937} {"train_loss": -12.40713882446289, "global_step": 325461, "epoch": 1937} {"train_loss": -12.46210765838623, "global_step": 325462, "epoch": 1937} {"train_loss": -12.25326919555664, "global_step": 325463, "epoch": 1937} {"train_loss": -12.445236206054688, "global_step": 325464, "epoch": 1937} {"train_loss": -12.42277717590332, "global_step": 325465, "epoch": 1937} {"train_loss": -12.348747253417969, "global_step": 325466, "epoch": 1937} {"train_loss": -12.328279495239258, "global_step": 325467, "epoch": 1937} {"train_loss": -12.266387939453125, "global_step": 325468, "epoch": 1937} {"train_loss": -12.539652824401855, "global_step": 325469, "epoch": 1937} {"train_loss": -12.438350677490234, "global_step": 325470, "epoch": 1937} {"train_loss": -12.689912796020508, "global_step": 325471, "epoch": 1937} {"train_loss": -12.32156753540039, "global_step": 325472, "epoch": 1937} {"train_loss": -12.411935806274414, "global_step": 325473, "epoch": 1937} {"train_loss": -12.464963912963867, "global_step": 325474, "epoch": 1937} {"train_loss": -11.972886085510254, "global_step": 325475, "epoch": 1937} {"train_loss": -12.168840408325195, "global_step": 325476, "epoch": 1937} {"train_loss": -12.36144733428955, "global_step": 325477, "epoch": 1937} {"train_loss": -12.073090553283691, "global_step": 325478, "epoch": 1937} {"train_loss": -11.421058654785156, "global_step": 325479, "epoch": 1937} {"train_loss": -12.187490463256836, "global_step": 325480, "epoch": 1937} {"train_loss": -12.163873672485352, "global_step": 325481, "epoch": 1937} {"train_loss": -11.843597412109375, "global_step": 325482, "epoch": 1937} {"train_loss": -12.133825302124023, "global_step": 325483, "epoch": 1937} {"train_loss": -12.250585556030273, "global_step": 325484, "epoch": 1937} {"train_loss": -11.513643264770508, "global_step": 325485, "epoch": 1937} {"train_loss": -12.181831359863281, "global_step": 325486, "epoch": 1937} {"train_loss": -12.589709281921387, "global_step": 325487, "epoch": 1937} {"train_loss": -12.233476638793945, "global_step": 325488, "epoch": 1937} {"train_loss": -11.895895004272461, "global_step": 325489, "epoch": 1937} {"train_loss": -12.246989250183105, "global_step": 325490, "epoch": 1937} {"train_loss": -12.242330551147461, "global_step": 325491, "epoch": 1937} {"train_loss": -11.713948249816895, "global_step": 325492, "epoch": 1937} {"train_loss": -11.747060775756836, "global_step": 325493, "epoch": 1937} {"train_loss": -12.286059379577637, "global_step": 325494, "epoch": 1937} {"train_loss": -12.085256576538086, "global_step": 325495, "epoch": 1937} {"train_loss": -11.455936431884766, "global_step": 325496, "epoch": 1937} {"train_loss": -12.357230186462402, "global_step": 325497, "epoch": 1937} {"train_loss": -11.975137710571289, "global_step": 325498, "epoch": 1937} {"train_loss": -11.674704551696777, "global_step": 325499, "epoch": 1937} {"train_loss": -11.1555814743042, "global_step": 325500, "epoch": 1937} {"train_loss": -12.332944869995117, "global_step": 325501, "epoch": 1937} {"train_loss": -11.230833053588867, "global_step": 325502, "epoch": 1937} {"train_loss": -11.3629150390625, "global_step": 325503, "epoch": 1937} {"train_loss": -12.208633422851562, "global_step": 325504, "epoch": 1937} {"train_loss": -12.083112716674805, "global_step": 325505, "epoch": 1937} {"train_loss": -11.794792175292969, "global_step": 325506, "epoch": 1937} {"train_loss": -12.045246124267578, "global_step": 325507, "epoch": 1937} {"train_loss": -11.025858879089355, "global_step": 325508, "epoch": 1937} {"train_loss": -10.632673263549805, "global_step": 325509, "epoch": 1937} {"train_loss": -11.657337188720703, "global_step": 325510, "epoch": 1937} {"train_loss": -11.746760368347168, "global_step": 325511, "epoch": 1937} {"train_loss": -10.920271873474121, "global_step": 325512, "epoch": 1937} {"train_loss": -11.937671661376953, "global_step": 325513, "epoch": 1937} {"train_loss": -11.298133850097656, "global_step": 325514, "epoch": 1937} {"train_loss": -11.458026885986328, "global_step": 325515, "epoch": 1937} {"train_loss": -11.92968463897705, "global_step": 325516, "epoch": 1937} {"train_loss": -11.402682304382324, "global_step": 325517, "epoch": 1937} {"train_loss": -11.475172996520996, "global_step": 325518, "epoch": 1937} {"train_loss": -11.94388198852539, "global_step": 325519, "epoch": 1937} {"train_loss": -11.254417419433594, "global_step": 325520, "epoch": 1937} {"train_loss": -11.776622772216797, "global_step": 325521, "epoch": 1937} {"train_loss": -12.10899543762207, "global_step": 325522, "epoch": 1937} {"train_loss": -11.385581970214844, "global_step": 325523, "epoch": 1937} {"train_loss": -12.101378440856934, "global_step": 325524, "epoch": 1937} {"train_loss": -11.770097732543945, "global_step": 325525, "epoch": 1937} {"train_loss": -11.891487121582031, "global_step": 325526, "epoch": 1937} {"train_loss": -12.344731330871582, "global_step": 325527, "epoch": 1937} {"train_loss": -11.913203239440918, "global_step": 325528, "epoch": 1937} {"train_loss": -12.451704025268555, "global_step": 325529, "epoch": 1937} {"train_loss": -11.401996612548828, "global_step": 325530, "epoch": 1937} {"train_loss": -12.117140769958496, "global_step": 325531, "epoch": 1937} {"train_loss": -12.050643920898438, "global_step": 325532, "epoch": 1937} {"train_loss": -11.807437896728516, "global_step": 325533, "epoch": 1937} {"train_loss": -12.1532564163208, "global_step": 325534, "epoch": 1937} {"train_loss": -12.3677978515625, "global_step": 325535, "epoch": 1937} {"train_loss": -12.340765953063965, "global_step": 325536, "epoch": 1937} {"train_loss": -12.291461944580078, "global_step": 325537, "epoch": 1937} {"train_loss": -12.372307777404785, "global_step": 325538, "epoch": 1937} {"train_loss": -12.392004013061523, "global_step": 325539, "epoch": 1937} {"train_loss": -12.298301696777344, "global_step": 325540, "epoch": 1937} {"train_loss": -12.06783676147461, "global_step": 325541, "epoch": 1937} {"train_loss": -12.318246841430664, "global_step": 325542, "epoch": 1937} {"train_loss": -12.311875343322754, "global_step": 325543, "epoch": 1937} {"train_loss": -12.196311950683594, "global_step": 325544, "epoch": 1937} {"train_loss": -12.276695251464844, "global_step": 325545, "epoch": 1937} {"train_loss": -12.13461971282959, "global_step": 325546, "epoch": 1937} {"train_loss": -12.1514892578125, "global_step": 325547, "epoch": 1937} {"train_loss": -12.412395477294922, "global_step": 325548, "epoch": 1937} {"train_loss": -12.281213760375977, "global_step": 325549, "epoch": 1937} {"train_loss": -12.07305908203125, "global_step": 325550, "epoch": 1937} {"train_loss": -12.216961860656738, "global_step": 325551, "epoch": 1937} {"train_loss": -12.187148094177246, "global_step": 325552, "epoch": 1937} {"train_loss": -12.391797065734863, "global_step": 325553, "epoch": 1937} {"train_loss": -12.547281265258789, "global_step": 325554, "epoch": 1937} {"train_loss": -12.239733695983887, "global_step": 325555, "epoch": 1937} {"train_loss": -12.410174369812012, "global_step": 325556, "epoch": 1937} {"train_loss": -12.318655967712402, "global_step": 325557, "epoch": 1937} {"train_loss": -12.107709884643555, "global_step": 325558, "epoch": 1937} {"train_loss": -12.293001174926758, "global_step": 325559, "epoch": 1937} {"train_loss": -12.154731750488281, "global_step": 325560, "epoch": 1937} {"train_loss": -12.179743766784668, "global_step": 325561, "epoch": 1937} {"train_loss": -12.575458526611328, "global_step": 325562, "epoch": 1937} {"train_loss": -12.362592697143555, "global_step": 325563, "epoch": 1937} {"train_loss": -12.511433601379395, "global_step": 325564, "epoch": 1937} {"train_loss": -12.480156898498535, "global_step": 325565, "epoch": 1937} {"train_loss": -12.236443519592285, "global_step": 325566, "epoch": 1937} {"train_loss": -12.350357055664062, "global_step": 325567, "epoch": 1937} {"train_loss": -12.33112907409668, "global_step": 325568, "epoch": 1937} {"train_loss": -12.389602661132812, "global_step": 325569, "epoch": 1937} {"train_loss": -12.27730941772461, "global_step": 325570, "epoch": 1937} {"train_loss": -12.443204879760742, "global_step": 325571, "epoch": 1937} {"train_loss": -12.259963035583496, "global_step": 325572, "epoch": 1937} {"train_loss": -12.458198547363281, "global_step": 325573, "epoch": 1937} {"train_loss": -12.130111694335938, "global_step": 325574, "epoch": 1937} {"train_loss": -12.548319816589355, "global_step": 325575, "epoch": 1937} {"train_loss": -12.28140640258789, "global_step": 325576, "epoch": 1937} {"train_loss": -12.286199569702148, "global_step": 325577, "epoch": 1937} {"train_loss": -12.094951629638672, "global_step": 325578, "epoch": 1937} {"train_loss": -12.434176445007324, "global_step": 325579, "epoch": 1937} {"train_loss": -12.288200378417969, "global_step": 325580, "epoch": 1937} {"train_loss": -12.399706840515137, "global_step": 325581, "epoch": 1937} {"train_loss": -12.645721435546875, "global_step": 325582, "epoch": 1937} {"train_loss": -12.082878277415322, "global_step": 325583, "epoch": 1937, "val_loss": 286985.78125} {"train_loss": -12.26953125, "global_step": 325584, "epoch": 1938} {"train_loss": -12.425118446350098, "global_step": 325585, "epoch": 1938} {"train_loss": -12.662980079650879, "global_step": 325586, "epoch": 1938} {"train_loss": -12.372953414916992, "global_step": 325587, "epoch": 1938} {"train_loss": -12.34366226196289, "global_step": 325588, "epoch": 1938} {"train_loss": -12.573783874511719, "global_step": 325589, "epoch": 1938} {"train_loss": -12.341268539428711, "global_step": 325590, "epoch": 1938} {"train_loss": -12.525344848632812, "global_step": 325591, "epoch": 1938} {"train_loss": -11.791586875915527, "global_step": 325592, "epoch": 1938} {"train_loss": -11.884682655334473, "global_step": 325593, "epoch": 1938} {"train_loss": -11.910720825195312, "global_step": 325594, "epoch": 1938} {"train_loss": -12.369400978088379, "global_step": 325595, "epoch": 1938} {"train_loss": -12.274492263793945, "global_step": 325596, "epoch": 1938} {"train_loss": -12.386394500732422, "global_step": 325597, "epoch": 1938} {"train_loss": -12.408132553100586, "global_step": 325598, "epoch": 1938} {"train_loss": -12.290801048278809, "global_step": 325599, "epoch": 1938} {"train_loss": -12.272095680236816, "global_step": 325600, "epoch": 1938} {"train_loss": -12.318312644958496, "global_step": 325601, "epoch": 1938} {"train_loss": -12.323515892028809, "global_step": 325602, "epoch": 1938} {"train_loss": -12.08076000213623, "global_step": 325603, "epoch": 1938} {"train_loss": -12.407987594604492, "global_step": 325604, "epoch": 1938} {"train_loss": -12.216402053833008, "global_step": 325605, "epoch": 1938} {"train_loss": -12.239469528198242, "global_step": 325606, "epoch": 1938} {"train_loss": -11.219650268554688, "global_step": 325607, "epoch": 1938} {"train_loss": -10.954452514648438, "global_step": 325608, "epoch": 1938} {"train_loss": -10.696130752563477, "global_step": 325609, "epoch": 1938} {"train_loss": -11.65786361694336, "global_step": 325610, "epoch": 1938} {"train_loss": -12.15224838256836, "global_step": 325611, "epoch": 1938} {"train_loss": -11.279396057128906, "global_step": 325612, "epoch": 1938} {"train_loss": -10.931946754455566, "global_step": 325613, "epoch": 1938} {"train_loss": -11.390741348266602, "global_step": 325614, "epoch": 1938} {"train_loss": -11.915233612060547, "global_step": 325615, "epoch": 1938} {"train_loss": -11.83800983428955, "global_step": 325616, "epoch": 1938} {"train_loss": -12.329870223999023, "global_step": 325617, "epoch": 1938} {"train_loss": -11.649866104125977, "global_step": 325618, "epoch": 1938} {"train_loss": -11.825066566467285, "global_step": 325619, "epoch": 1938} {"train_loss": -12.373886108398438, "global_step": 325620, "epoch": 1938} {"train_loss": -11.225591659545898, "global_step": 325621, "epoch": 1938} {"train_loss": -12.044393539428711, "global_step": 325622, "epoch": 1938} {"train_loss": -11.778173446655273, "global_step": 325623, "epoch": 1938} {"train_loss": -11.85000228881836, "global_step": 325624, "epoch": 1938} {"train_loss": -10.952022552490234, "global_step": 325625, "epoch": 1938} {"train_loss": -12.10212230682373, "global_step": 325626, "epoch": 1938} {"train_loss": -11.543817520141602, "global_step": 325627, "epoch": 1938} {"train_loss": -11.213949203491211, "global_step": 325628, "epoch": 1938} {"train_loss": -11.307881355285645, "global_step": 325629, "epoch": 1938} {"train_loss": -12.365608215332031, "global_step": 325630, "epoch": 1938} {"train_loss": -10.91049861907959, "global_step": 325631, "epoch": 1938} {"train_loss": -11.688648223876953, "global_step": 325632, "epoch": 1938} {"train_loss": -11.882076263427734, "global_step": 325633, "epoch": 1938} {"train_loss": -11.69775390625, "global_step": 325634, "epoch": 1938} {"train_loss": -11.997403144836426, "global_step": 325635, "epoch": 1938} {"train_loss": -11.899862289428711, "global_step": 325636, "epoch": 1938} {"train_loss": -12.187969207763672, "global_step": 325637, "epoch": 1938} {"train_loss": -11.603710174560547, "global_step": 325638, "epoch": 1938} {"train_loss": -11.851367950439453, "global_step": 325639, "epoch": 1938} {"train_loss": -12.10378360748291, "global_step": 325640, "epoch": 1938} {"train_loss": -12.319770812988281, "global_step": 325641, "epoch": 1938} {"train_loss": -11.999478340148926, "global_step": 325642, "epoch": 1938} {"train_loss": -11.960311889648438, "global_step": 325643, "epoch": 1938} {"train_loss": -12.38407039642334, "global_step": 325644, "epoch": 1938} {"train_loss": -12.112641334533691, "global_step": 325645, "epoch": 1938} {"train_loss": -12.33334732055664, "global_step": 325646, "epoch": 1938} {"train_loss": -12.089216232299805, "global_step": 325647, "epoch": 1938} {"train_loss": -12.277654647827148, "global_step": 325648, "epoch": 1938} {"train_loss": -11.77877426147461, "global_step": 325649, "epoch": 1938} {"train_loss": -12.216569900512695, "global_step": 325650, "epoch": 1938} {"train_loss": -12.117904663085938, "global_step": 325651, "epoch": 1938} {"train_loss": -12.257232666015625, "global_step": 325652, "epoch": 1938} {"train_loss": -12.315452575683594, "global_step": 325653, "epoch": 1938} {"train_loss": -12.245038032531738, "global_step": 325654, "epoch": 1938} {"train_loss": -12.12945556640625, "global_step": 325655, "epoch": 1938} {"train_loss": -12.417695045471191, "global_step": 325656, "epoch": 1938} {"train_loss": -12.175897598266602, "global_step": 325657, "epoch": 1938} {"train_loss": -12.055635452270508, "global_step": 325658, "epoch": 1938} {"train_loss": -12.256511688232422, "global_step": 325659, "epoch": 1938} {"train_loss": -12.425400733947754, "global_step": 325660, "epoch": 1938} {"train_loss": -12.415132522583008, "global_step": 325661, "epoch": 1938} {"train_loss": -12.32486343383789, "global_step": 325662, "epoch": 1938} {"train_loss": -12.140338897705078, "global_step": 325663, "epoch": 1938} {"train_loss": -11.970657348632812, "global_step": 325664, "epoch": 1938} {"train_loss": -12.453981399536133, "global_step": 325665, "epoch": 1938} {"train_loss": -12.39218521118164, "global_step": 325666, "epoch": 1938} {"train_loss": -12.056154251098633, "global_step": 325667, "epoch": 1938} {"train_loss": -12.32868480682373, "global_step": 325668, "epoch": 1938} {"train_loss": -12.375946998596191, "global_step": 325669, "epoch": 1938} {"train_loss": -12.291855812072754, "global_step": 325670, "epoch": 1938} {"train_loss": -12.395933151245117, "global_step": 325671, "epoch": 1938} {"train_loss": -12.268810272216797, "global_step": 325672, "epoch": 1938} {"train_loss": -12.440347671508789, "global_step": 325673, "epoch": 1938} {"train_loss": -11.566910743713379, "global_step": 325674, "epoch": 1938} {"train_loss": -12.321918487548828, "global_step": 325675, "epoch": 1938} {"train_loss": -12.089932441711426, "global_step": 325676, "epoch": 1938} {"train_loss": -12.359110832214355, "global_step": 325677, "epoch": 1938} {"train_loss": -11.726720809936523, "global_step": 325678, "epoch": 1938} {"train_loss": -12.067355155944824, "global_step": 325679, "epoch": 1938} {"train_loss": -11.284818649291992, "global_step": 325680, "epoch": 1938} {"train_loss": -11.69061279296875, "global_step": 325681, "epoch": 1938} {"train_loss": -10.206991195678711, "global_step": 325682, "epoch": 1938} {"train_loss": -10.495464324951172, "global_step": 325683, "epoch": 1938} {"train_loss": -11.343238830566406, "global_step": 325684, "epoch": 1938} {"train_loss": -9.726703643798828, "global_step": 325685, "epoch": 1938} {"train_loss": -10.507640838623047, "global_step": 325686, "epoch": 1938} {"train_loss": -10.850815773010254, "global_step": 325687, "epoch": 1938} {"train_loss": -11.15605354309082, "global_step": 325688, "epoch": 1938} {"train_loss": -10.172388076782227, "global_step": 325689, "epoch": 1938} {"train_loss": -12.211080551147461, "global_step": 325690, "epoch": 1938} {"train_loss": -9.784956932067871, "global_step": 325691, "epoch": 1938} {"train_loss": -11.412277221679688, "global_step": 325692, "epoch": 1938} {"train_loss": -11.718587875366211, "global_step": 325693, "epoch": 1938} {"train_loss": -10.517434120178223, "global_step": 325694, "epoch": 1938} {"train_loss": -11.986346244812012, "global_step": 325695, "epoch": 1938} {"train_loss": -10.71898078918457, "global_step": 325696, "epoch": 1938} {"train_loss": -12.085490226745605, "global_step": 325697, "epoch": 1938} {"train_loss": -10.487988471984863, "global_step": 325698, "epoch": 1938} {"train_loss": -11.97146987915039, "global_step": 325699, "epoch": 1938} {"train_loss": -11.170490264892578, "global_step": 325700, "epoch": 1938} {"train_loss": -11.562408447265625, "global_step": 325701, "epoch": 1938} {"train_loss": -11.104875564575195, "global_step": 325702, "epoch": 1938} {"train_loss": -11.242759704589844, "global_step": 325703, "epoch": 1938} {"train_loss": -10.897558212280273, "global_step": 325704, "epoch": 1938} {"train_loss": -10.764875411987305, "global_step": 325705, "epoch": 1938} {"train_loss": -11.377972602844238, "global_step": 325706, "epoch": 1938} {"train_loss": -9.688079833984375, "global_step": 325707, "epoch": 1938} {"train_loss": -10.84593677520752, "global_step": 325708, "epoch": 1938} {"train_loss": -9.757818222045898, "global_step": 325709, "epoch": 1938} {"train_loss": -9.717634201049805, "global_step": 325710, "epoch": 1938} {"train_loss": -10.107563018798828, "global_step": 325711, "epoch": 1938} {"train_loss": -9.604736328125, "global_step": 325712, "epoch": 1938} {"train_loss": -9.293750762939453, "global_step": 325713, "epoch": 1938} {"train_loss": -8.937509536743164, "global_step": 325714, "epoch": 1938} {"train_loss": -9.593098640441895, "global_step": 325715, "epoch": 1938} {"train_loss": -11.23403549194336, "global_step": 325716, "epoch": 1938} {"train_loss": -9.863336563110352, "global_step": 325717, "epoch": 1938} {"train_loss": -10.608499526977539, "global_step": 325718, "epoch": 1938} {"train_loss": -11.275127410888672, "global_step": 325719, "epoch": 1938} {"train_loss": -10.800239562988281, "global_step": 325720, "epoch": 1938} {"train_loss": -11.305891036987305, "global_step": 325721, "epoch": 1938} {"train_loss": -11.225455284118652, "global_step": 325722, "epoch": 1938} {"train_loss": -10.99571704864502, "global_step": 325723, "epoch": 1938} {"train_loss": -11.796899795532227, "global_step": 325724, "epoch": 1938} {"train_loss": -11.372529983520508, "global_step": 325725, "epoch": 1938} {"train_loss": -11.782632827758789, "global_step": 325726, "epoch": 1938} {"train_loss": -11.53969955444336, "global_step": 325727, "epoch": 1938} {"train_loss": -11.087813377380371, "global_step": 325728, "epoch": 1938} {"train_loss": -11.72661018371582, "global_step": 325729, "epoch": 1938} {"train_loss": -11.275069236755371, "global_step": 325730, "epoch": 1938} {"train_loss": -11.593594551086426, "global_step": 325731, "epoch": 1938} {"train_loss": -11.745955467224121, "global_step": 325732, "epoch": 1938} {"train_loss": -11.651294708251953, "global_step": 325733, "epoch": 1938} {"train_loss": -11.51636028289795, "global_step": 325734, "epoch": 1938} {"train_loss": -11.91732406616211, "global_step": 325735, "epoch": 1938} {"train_loss": -12.002447128295898, "global_step": 325736, "epoch": 1938} {"train_loss": -11.969907760620117, "global_step": 325737, "epoch": 1938} {"train_loss": -11.883001327514648, "global_step": 325738, "epoch": 1938} {"train_loss": -11.916259765625, "global_step": 325739, "epoch": 1938} {"train_loss": -11.706501960754395, "global_step": 325740, "epoch": 1938} {"train_loss": -12.013654708862305, "global_step": 325741, "epoch": 1938} {"train_loss": -12.00973129272461, "global_step": 325742, "epoch": 1938} {"train_loss": -11.62513542175293, "global_step": 325743, "epoch": 1938} {"train_loss": -11.998434066772461, "global_step": 325744, "epoch": 1938} {"train_loss": -11.918102264404297, "global_step": 325745, "epoch": 1938} {"train_loss": -11.709230422973633, "global_step": 325746, "epoch": 1938} {"train_loss": -12.248026847839355, "global_step": 325747, "epoch": 1938} {"train_loss": -11.812688827514648, "global_step": 325748, "epoch": 1938} {"train_loss": -11.874773025512695, "global_step": 325749, "epoch": 1938} {"train_loss": -12.090636253356934, "global_step": 325750, "epoch": 1938} {"train_loss": -11.655025544620695, "global_step": 325751, "epoch": 1938, "val_loss": 281511.875} {"train_loss": -12.009021759033203, "global_step": 325752, "epoch": 1939} {"train_loss": -12.348283767700195, "global_step": 325753, "epoch": 1939} {"train_loss": -12.161712646484375, "global_step": 325754, "epoch": 1939} {"train_loss": -12.151456832885742, "global_step": 325755, "epoch": 1939} {"train_loss": -12.253555297851562, "global_step": 325756, "epoch": 1939} {"train_loss": -12.161433219909668, "global_step": 325757, "epoch": 1939} {"train_loss": -12.150615692138672, "global_step": 325758, "epoch": 1939} {"train_loss": -12.153339385986328, "global_step": 325759, "epoch": 1939} {"train_loss": -12.16084098815918, "global_step": 325760, "epoch": 1939} {"train_loss": -12.238850593566895, "global_step": 325761, "epoch": 1939} {"train_loss": -12.003170013427734, "global_step": 325762, "epoch": 1939} {"train_loss": -12.161552429199219, "global_step": 325763, "epoch": 1939} {"train_loss": -12.190194129943848, "global_step": 325764, "epoch": 1939} {"train_loss": -12.39987564086914, "global_step": 325765, "epoch": 1939} {"train_loss": -12.066019058227539, "global_step": 325766, "epoch": 1939} {"train_loss": -12.403841972351074, "global_step": 325767, "epoch": 1939} {"train_loss": -12.237536430358887, "global_step": 325768, "epoch": 1939} {"train_loss": -12.097633361816406, "global_step": 325769, "epoch": 1939} {"train_loss": -12.301376342773438, "global_step": 325770, "epoch": 1939} {"train_loss": -12.22523021697998, "global_step": 325771, "epoch": 1939} {"train_loss": -12.36314868927002, "global_step": 325772, "epoch": 1939} {"train_loss": -12.398775100708008, "global_step": 325773, "epoch": 1939} {"train_loss": -12.33001708984375, "global_step": 325774, "epoch": 1939} {"train_loss": -12.453604698181152, "global_step": 325775, "epoch": 1939} {"train_loss": -12.41394329071045, "global_step": 325776, "epoch": 1939} {"train_loss": -12.367149353027344, "global_step": 325777, "epoch": 1939} {"train_loss": -12.287069320678711, "global_step": 325778, "epoch": 1939} {"train_loss": -12.271736145019531, "global_step": 325779, "epoch": 1939} {"train_loss": -12.373939514160156, "global_step": 325780, "epoch": 1939} {"train_loss": -12.377559661865234, "global_step": 325781, "epoch": 1939} {"train_loss": -12.200328826904297, "global_step": 325782, "epoch": 1939} {"train_loss": -12.591394424438477, "global_step": 325783, "epoch": 1939} {"train_loss": -12.155108451843262, "global_step": 325784, "epoch": 1939} {"train_loss": -12.378729820251465, "global_step": 325785, "epoch": 1939} {"train_loss": -12.317380905151367, "global_step": 325786, "epoch": 1939} {"train_loss": -12.404935836791992, "global_step": 325787, "epoch": 1939} {"train_loss": -12.2064208984375, "global_step": 325788, "epoch": 1939} {"train_loss": -12.39624309539795, "global_step": 325789, "epoch": 1939} {"train_loss": -12.338738441467285, "global_step": 325790, "epoch": 1939} {"train_loss": -12.107192039489746, "global_step": 325791, "epoch": 1939} {"train_loss": -12.383277893066406, "global_step": 325792, "epoch": 1939} {"train_loss": -12.241495132446289, "global_step": 325793, "epoch": 1939} {"train_loss": -12.152351379394531, "global_step": 325794, "epoch": 1939} {"train_loss": -12.421777725219727, "global_step": 325795, "epoch": 1939} {"train_loss": -12.42076587677002, "global_step": 325796, "epoch": 1939} {"train_loss": -12.198419570922852, "global_step": 325797, "epoch": 1939} {"train_loss": -12.20732307434082, "global_step": 325798, "epoch": 1939} {"train_loss": -12.247007369995117, "global_step": 325799, "epoch": 1939} {"train_loss": -12.079211235046387, "global_step": 325800, "epoch": 1939} {"train_loss": -11.820514678955078, "global_step": 325801, "epoch": 1939} {"train_loss": -12.315486907958984, "global_step": 325802, "epoch": 1939} {"train_loss": -12.20601749420166, "global_step": 325803, "epoch": 1939} {"train_loss": -11.857425689697266, "global_step": 325804, "epoch": 1939} {"train_loss": -12.569143295288086, "global_step": 325805, "epoch": 1939} {"train_loss": -12.021147727966309, "global_step": 325806, "epoch": 1939} {"train_loss": -11.86823844909668, "global_step": 325807, "epoch": 1939} {"train_loss": -12.047001838684082, "global_step": 325808, "epoch": 1939} {"train_loss": -12.313445091247559, "global_step": 325809, "epoch": 1939} {"train_loss": -12.191879272460938, "global_step": 325810, "epoch": 1939} {"train_loss": -12.431680679321289, "global_step": 325811, "epoch": 1939} {"train_loss": -12.293522834777832, "global_step": 325812, "epoch": 1939} {"train_loss": -11.946847915649414, "global_step": 325813, "epoch": 1939} {"train_loss": -11.119315147399902, "global_step": 325814, "epoch": 1939} {"train_loss": -12.448558807373047, "global_step": 325815, "epoch": 1939} {"train_loss": -12.417146682739258, "global_step": 325816, "epoch": 1939} {"train_loss": -12.288240432739258, "global_step": 325817, "epoch": 1939} {"train_loss": -11.942248344421387, "global_step": 325818, "epoch": 1939} {"train_loss": -12.415385246276855, "global_step": 325819, "epoch": 1939} {"train_loss": -12.232946395874023, "global_step": 325820, "epoch": 1939} {"train_loss": -11.967018127441406, "global_step": 325821, "epoch": 1939} {"train_loss": -12.457744598388672, "global_step": 325822, "epoch": 1939} {"train_loss": -12.113719940185547, "global_step": 325823, "epoch": 1939} {"train_loss": -11.583646774291992, "global_step": 325824, "epoch": 1939} {"train_loss": -12.388376235961914, "global_step": 325825, "epoch": 1939} {"train_loss": -12.124374389648438, "global_step": 325826, "epoch": 1939} {"train_loss": -11.57945728302002, "global_step": 325827, "epoch": 1939} {"train_loss": -11.414264678955078, "global_step": 325828, "epoch": 1939} {"train_loss": -12.287450790405273, "global_step": 325829, "epoch": 1939} {"train_loss": -11.728368759155273, "global_step": 325830, "epoch": 1939} {"train_loss": -11.47217845916748, "global_step": 325831, "epoch": 1939} {"train_loss": -12.066610336303711, "global_step": 325832, "epoch": 1939} {"train_loss": -11.841882705688477, "global_step": 325833, "epoch": 1939} {"train_loss": -11.12973403930664, "global_step": 325834, "epoch": 1939} {"train_loss": -12.372631072998047, "global_step": 325835, "epoch": 1939} {"train_loss": -11.784914016723633, "global_step": 325836, "epoch": 1939} {"train_loss": -11.175586700439453, "global_step": 325837, "epoch": 1939} {"train_loss": -12.437747955322266, "global_step": 325838, "epoch": 1939} {"train_loss": -11.442549705505371, "global_step": 325839, "epoch": 1939} {"train_loss": -11.44720458984375, "global_step": 325840, "epoch": 1939} {"train_loss": -12.1185302734375, "global_step": 325841, "epoch": 1939} {"train_loss": -11.75227165222168, "global_step": 325842, "epoch": 1939} {"train_loss": -12.25851821899414, "global_step": 325843, "epoch": 1939} {"train_loss": -12.092033386230469, "global_step": 325844, "epoch": 1939} {"train_loss": -12.106183052062988, "global_step": 325845, "epoch": 1939} {"train_loss": -11.798589706420898, "global_step": 325846, "epoch": 1939} {"train_loss": -12.180171966552734, "global_step": 325847, "epoch": 1939} {"train_loss": -12.486352920532227, "global_step": 325848, "epoch": 1939} {"train_loss": -11.977746963500977, "global_step": 325849, "epoch": 1939} {"train_loss": -11.763056755065918, "global_step": 325850, "epoch": 1939} {"train_loss": -12.232938766479492, "global_step": 325851, "epoch": 1939} {"train_loss": -12.066234588623047, "global_step": 325852, "epoch": 1939} {"train_loss": -11.812545776367188, "global_step": 325853, "epoch": 1939} {"train_loss": -12.137018203735352, "global_step": 325854, "epoch": 1939} {"train_loss": -11.82533073425293, "global_step": 325855, "epoch": 1939} {"train_loss": -11.633071899414062, "global_step": 325856, "epoch": 1939} {"train_loss": -12.105522155761719, "global_step": 325857, "epoch": 1939} {"train_loss": -11.197490692138672, "global_step": 325858, "epoch": 1939} {"train_loss": -10.933572769165039, "global_step": 325859, "epoch": 1939} {"train_loss": -12.056324005126953, "global_step": 325860, "epoch": 1939} {"train_loss": -11.717710494995117, "global_step": 325861, "epoch": 1939} {"train_loss": -10.58095932006836, "global_step": 325862, "epoch": 1939} {"train_loss": -11.644981384277344, "global_step": 325863, "epoch": 1939} {"train_loss": -10.32778263092041, "global_step": 325864, "epoch": 1939} {"train_loss": -11.379432678222656, "global_step": 325865, "epoch": 1939} {"train_loss": -11.004463195800781, "global_step": 325866, "epoch": 1939} {"train_loss": -10.797980308532715, "global_step": 325867, "epoch": 1939} {"train_loss": -12.004225730895996, "global_step": 325868, "epoch": 1939} {"train_loss": -10.519128799438477, "global_step": 325869, "epoch": 1939} {"train_loss": -10.658562660217285, "global_step": 325870, "epoch": 1939} {"train_loss": -11.768579483032227, "global_step": 325871, "epoch": 1939} {"train_loss": -11.111111640930176, "global_step": 325872, "epoch": 1939} {"train_loss": -11.29926872253418, "global_step": 325873, "epoch": 1939} {"train_loss": -11.820855140686035, "global_step": 325874, "epoch": 1939} {"train_loss": -11.133522033691406, "global_step": 325875, "epoch": 1939} {"train_loss": -12.252663612365723, "global_step": 325876, "epoch": 1939} {"train_loss": -11.257967948913574, "global_step": 325877, "epoch": 1939} {"train_loss": -11.687575340270996, "global_step": 325878, "epoch": 1939} {"train_loss": -11.629980087280273, "global_step": 325879, "epoch": 1939} {"train_loss": -11.763524055480957, "global_step": 325880, "epoch": 1939} {"train_loss": -11.95728588104248, "global_step": 325881, "epoch": 1939} {"train_loss": -11.668478012084961, "global_step": 325882, "epoch": 1939} {"train_loss": -12.052273750305176, "global_step": 325883, "epoch": 1939} {"train_loss": -11.730183601379395, "global_step": 325884, "epoch": 1939} {"train_loss": -12.161613464355469, "global_step": 325885, "epoch": 1939} {"train_loss": -11.632155418395996, "global_step": 325886, "epoch": 1939} {"train_loss": -11.71528434753418, "global_step": 325887, "epoch": 1939} {"train_loss": -11.980335235595703, "global_step": 325888, "epoch": 1939} {"train_loss": -11.195423126220703, "global_step": 325889, "epoch": 1939} {"train_loss": -12.12948989868164, "global_step": 325890, "epoch": 1939} {"train_loss": -11.225435256958008, "global_step": 325891, "epoch": 1939} {"train_loss": -11.780278205871582, "global_step": 325892, "epoch": 1939} {"train_loss": -12.091403007507324, "global_step": 325893, "epoch": 1939} {"train_loss": -11.816720962524414, "global_step": 325894, "epoch": 1939} {"train_loss": -12.01258659362793, "global_step": 325895, "epoch": 1939} {"train_loss": -11.938546180725098, "global_step": 325896, "epoch": 1939} {"train_loss": -12.067290306091309, "global_step": 325897, "epoch": 1939} {"train_loss": -11.989121437072754, "global_step": 325898, "epoch": 1939} {"train_loss": -12.039697647094727, "global_step": 325899, "epoch": 1939} {"train_loss": -12.290531158447266, "global_step": 325900, "epoch": 1939} {"train_loss": -12.264513969421387, "global_step": 325901, "epoch": 1939} {"train_loss": -11.944087982177734, "global_step": 325902, "epoch": 1939} {"train_loss": -12.363516807556152, "global_step": 325903, "epoch": 1939} {"train_loss": -11.92043399810791, "global_step": 325904, "epoch": 1939} {"train_loss": -12.04844856262207, "global_step": 325905, "epoch": 1939} {"train_loss": -11.926563262939453, "global_step": 325906, "epoch": 1939} {"train_loss": -12.165558815002441, "global_step": 325907, "epoch": 1939} {"train_loss": -11.95954704284668, "global_step": 325908, "epoch": 1939} {"train_loss": -12.154826164245605, "global_step": 325909, "epoch": 1939} {"train_loss": -12.045446395874023, "global_step": 325910, "epoch": 1939} {"train_loss": -12.341726303100586, "global_step": 325911, "epoch": 1939} {"train_loss": -12.143426895141602, "global_step": 325912, "epoch": 1939} {"train_loss": -12.119681358337402, "global_step": 325913, "epoch": 1939} {"train_loss": -12.210302352905273, "global_step": 325914, "epoch": 1939} {"train_loss": -12.399768829345703, "global_step": 325915, "epoch": 1939} {"train_loss": -12.204543113708496, "global_step": 325916, "epoch": 1939} {"train_loss": -12.341167449951172, "global_step": 325917, "epoch": 1939} {"train_loss": -12.425168991088867, "global_step": 325918, "epoch": 1939} {"train_loss": -11.989560700598217, "global_step": 325919, "epoch": 1939, "val_loss": 285088.1875} {"train_loss": -12.426186561584473, "global_step": 325920, "epoch": 1940} {"train_loss": -12.064008712768555, "global_step": 325921, "epoch": 1940} {"train_loss": -12.564970016479492, "global_step": 325922, "epoch": 1940} {"train_loss": -12.455204010009766, "global_step": 325923, "epoch": 1940} {"train_loss": -12.379396438598633, "global_step": 325924, "epoch": 1940} {"train_loss": -12.556089401245117, "global_step": 325925, "epoch": 1940} {"train_loss": -12.128111839294434, "global_step": 325926, "epoch": 1940} {"train_loss": -12.330673217773438, "global_step": 325927, "epoch": 1940} {"train_loss": -12.42702865600586, "global_step": 325928, "epoch": 1940} {"train_loss": -12.073860168457031, "global_step": 325929, "epoch": 1940} {"train_loss": -12.297799110412598, "global_step": 325930, "epoch": 1940} {"train_loss": -12.16236400604248, "global_step": 325931, "epoch": 1940} {"train_loss": -12.228296279907227, "global_step": 325932, "epoch": 1940} {"train_loss": -12.354642868041992, "global_step": 325933, "epoch": 1940} {"train_loss": -12.054256439208984, "global_step": 325934, "epoch": 1940} {"train_loss": -12.44413948059082, "global_step": 325935, "epoch": 1940} {"train_loss": -12.161057472229004, "global_step": 325936, "epoch": 1940} {"train_loss": -12.128793716430664, "global_step": 325937, "epoch": 1940} {"train_loss": -12.26849365234375, "global_step": 325938, "epoch": 1940} {"train_loss": -12.458832740783691, "global_step": 325939, "epoch": 1940} {"train_loss": -12.177793502807617, "global_step": 325940, "epoch": 1940} {"train_loss": -12.238887786865234, "global_step": 325941, "epoch": 1940} {"train_loss": -12.38451862335205, "global_step": 325942, "epoch": 1940} {"train_loss": -11.11792278289795, "global_step": 325943, "epoch": 1940} {"train_loss": -11.434788703918457, "global_step": 325944, "epoch": 1940} {"train_loss": -12.159059524536133, "global_step": 325945, "epoch": 1940} {"train_loss": -12.281648635864258, "global_step": 325946, "epoch": 1940} {"train_loss": -10.952922821044922, "global_step": 325947, "epoch": 1940} {"train_loss": -11.904231071472168, "global_step": 325948, "epoch": 1940} {"train_loss": -12.256987571716309, "global_step": 325949, "epoch": 1940} {"train_loss": -11.465660095214844, "global_step": 325950, "epoch": 1940} {"train_loss": -12.219513893127441, "global_step": 325951, "epoch": 1940} {"train_loss": -12.00438404083252, "global_step": 325952, "epoch": 1940} {"train_loss": -11.498048782348633, "global_step": 325953, "epoch": 1940} {"train_loss": -12.362003326416016, "global_step": 325954, "epoch": 1940} {"train_loss": -11.857864379882812, "global_step": 325955, "epoch": 1940} {"train_loss": -12.03451919555664, "global_step": 325956, "epoch": 1940} {"train_loss": -12.371925354003906, "global_step": 325957, "epoch": 1940} {"train_loss": -11.79538631439209, "global_step": 325958, "epoch": 1940} {"train_loss": -11.998920440673828, "global_step": 325959, "epoch": 1940} {"train_loss": -12.098461151123047, "global_step": 325960, "epoch": 1940} {"train_loss": -12.056297302246094, "global_step": 325961, "epoch": 1940} {"train_loss": -12.247905731201172, "global_step": 325962, "epoch": 1940} {"train_loss": -12.124715805053711, "global_step": 325963, "epoch": 1940} {"train_loss": -11.598795890808105, "global_step": 325964, "epoch": 1940} {"train_loss": -12.287660598754883, "global_step": 325965, "epoch": 1940} {"train_loss": -12.033041954040527, "global_step": 325966, "epoch": 1940} {"train_loss": -11.939811706542969, "global_step": 325967, "epoch": 1940} {"train_loss": -12.09695053100586, "global_step": 325968, "epoch": 1940} {"train_loss": -11.77322769165039, "global_step": 325969, "epoch": 1940} {"train_loss": -12.13299560546875, "global_step": 325970, "epoch": 1940} {"train_loss": -12.159608840942383, "global_step": 325971, "epoch": 1940} {"train_loss": -12.278532028198242, "global_step": 325972, "epoch": 1940} {"train_loss": -12.072242736816406, "global_step": 325973, "epoch": 1940} {"train_loss": -12.167925834655762, "global_step": 325974, "epoch": 1940} {"train_loss": -12.3704833984375, "global_step": 325975, "epoch": 1940} {"train_loss": -12.056744575500488, "global_step": 325976, "epoch": 1940} {"train_loss": -12.023059844970703, "global_step": 325977, "epoch": 1940} {"train_loss": -12.362434387207031, "global_step": 325978, "epoch": 1940} {"train_loss": -12.182662963867188, "global_step": 325979, "epoch": 1940} {"train_loss": -12.387954711914062, "global_step": 325980, "epoch": 1940} {"train_loss": -12.458980560302734, "global_step": 325981, "epoch": 1940} {"train_loss": -11.982093811035156, "global_step": 325982, "epoch": 1940} {"train_loss": -12.162858009338379, "global_step": 325983, "epoch": 1940} {"train_loss": -12.37455940246582, "global_step": 325984, "epoch": 1940} {"train_loss": -11.772541046142578, "global_step": 325985, "epoch": 1940} {"train_loss": -12.360450744628906, "global_step": 325986, "epoch": 1940} {"train_loss": -11.251752853393555, "global_step": 325987, "epoch": 1940} {"train_loss": -12.274213790893555, "global_step": 325988, "epoch": 1940} {"train_loss": -12.21713638305664, "global_step": 325989, "epoch": 1940} {"train_loss": -11.431199073791504, "global_step": 325990, "epoch": 1940} {"train_loss": -12.029027938842773, "global_step": 325991, "epoch": 1940} {"train_loss": -11.5841646194458, "global_step": 325992, "epoch": 1940} {"train_loss": -11.627256393432617, "global_step": 325993, "epoch": 1940} {"train_loss": -12.049642562866211, "global_step": 325994, "epoch": 1940} {"train_loss": -12.012796401977539, "global_step": 325995, "epoch": 1940} {"train_loss": -11.77542495727539, "global_step": 325996, "epoch": 1940} {"train_loss": -11.664287567138672, "global_step": 325997, "epoch": 1940} {"train_loss": -12.386085510253906, "global_step": 325998, "epoch": 1940} {"train_loss": -11.628326416015625, "global_step": 325999, "epoch": 1940} {"train_loss": -12.11432933807373, "global_step": 326000, "epoch": 1940} {"train_loss": -11.861867904663086, "global_step": 326001, "epoch": 1940} {"train_loss": -12.456546783447266, "global_step": 326002, "epoch": 1940} {"train_loss": -11.996988296508789, "global_step": 326003, "epoch": 1940} {"train_loss": -12.452919960021973, "global_step": 326004, "epoch": 1940} {"train_loss": -11.861525535583496, "global_step": 326005, "epoch": 1940} {"train_loss": -12.261249542236328, "global_step": 326006, "epoch": 1940} {"train_loss": -12.013236999511719, "global_step": 326007, "epoch": 1940} {"train_loss": -12.081155776977539, "global_step": 326008, "epoch": 1940} {"train_loss": -12.140592575073242, "global_step": 326009, "epoch": 1940} {"train_loss": -12.203859329223633, "global_step": 326010, "epoch": 1940} {"train_loss": -11.772504806518555, "global_step": 326011, "epoch": 1940} {"train_loss": -12.338733673095703, "global_step": 326012, "epoch": 1940} {"train_loss": -12.030701637268066, "global_step": 326013, "epoch": 1940} {"train_loss": -11.929361343383789, "global_step": 326014, "epoch": 1940} {"train_loss": -11.538290023803711, "global_step": 326015, "epoch": 1940} {"train_loss": -12.482117652893066, "global_step": 326016, "epoch": 1940} {"train_loss": -11.124771118164062, "global_step": 326017, "epoch": 1940} {"train_loss": -11.997803688049316, "global_step": 326018, "epoch": 1940} {"train_loss": -11.571636199951172, "global_step": 326019, "epoch": 1940} {"train_loss": -12.224874496459961, "global_step": 326020, "epoch": 1940} {"train_loss": -12.110689163208008, "global_step": 326021, "epoch": 1940} {"train_loss": -12.05050277709961, "global_step": 326022, "epoch": 1940} {"train_loss": -12.088933944702148, "global_step": 326023, "epoch": 1940} {"train_loss": -11.894990921020508, "global_step": 326024, "epoch": 1940} {"train_loss": -12.248891830444336, "global_step": 326025, "epoch": 1940} {"train_loss": -11.733068466186523, "global_step": 326026, "epoch": 1940} {"train_loss": -11.767735481262207, "global_step": 326027, "epoch": 1940} {"train_loss": -12.096700668334961, "global_step": 326028, "epoch": 1940} {"train_loss": -11.744312286376953, "global_step": 326029, "epoch": 1940} {"train_loss": -11.958100318908691, "global_step": 326030, "epoch": 1940} {"train_loss": -12.16413688659668, "global_step": 326031, "epoch": 1940} {"train_loss": -11.700971603393555, "global_step": 326032, "epoch": 1940} {"train_loss": -11.9915771484375, "global_step": 326033, "epoch": 1940} {"train_loss": -11.977254867553711, "global_step": 326034, "epoch": 1940} {"train_loss": -11.77090835571289, "global_step": 326035, "epoch": 1940} {"train_loss": -12.365068435668945, "global_step": 326036, "epoch": 1940} {"train_loss": -12.006771087646484, "global_step": 326037, "epoch": 1940} {"train_loss": -12.346603393554688, "global_step": 326038, "epoch": 1940} {"train_loss": -11.79109001159668, "global_step": 326039, "epoch": 1940} {"train_loss": -12.220805168151855, "global_step": 326040, "epoch": 1940} {"train_loss": -11.906816482543945, "global_step": 326041, "epoch": 1940} {"train_loss": -12.327237129211426, "global_step": 326042, "epoch": 1940} {"train_loss": -11.978872299194336, "global_step": 326043, "epoch": 1940} {"train_loss": -12.53734302520752, "global_step": 326044, "epoch": 1940} {"train_loss": -12.424564361572266, "global_step": 326045, "epoch": 1940} {"train_loss": -12.386831283569336, "global_step": 326046, "epoch": 1940} {"train_loss": -11.928597450256348, "global_step": 326047, "epoch": 1940} {"train_loss": -12.493263244628906, "global_step": 326048, "epoch": 1940} {"train_loss": -12.231070518493652, "global_step": 326049, "epoch": 1940} {"train_loss": -12.154553413391113, "global_step": 326050, "epoch": 1940} {"train_loss": -11.895694732666016, "global_step": 326051, "epoch": 1940} {"train_loss": -12.10485553741455, "global_step": 326052, "epoch": 1940} {"train_loss": -12.110428810119629, "global_step": 326053, "epoch": 1940} {"train_loss": -12.265384674072266, "global_step": 326054, "epoch": 1940} {"train_loss": -11.361955642700195, "global_step": 326055, "epoch": 1940} {"train_loss": -11.608325958251953, "global_step": 326056, "epoch": 1940} {"train_loss": -10.98687744140625, "global_step": 326057, "epoch": 1940} {"train_loss": -11.621700286865234, "global_step": 326058, "epoch": 1940} {"train_loss": -11.590600967407227, "global_step": 326059, "epoch": 1940} {"train_loss": -11.555803298950195, "global_step": 326060, "epoch": 1940} {"train_loss": -11.635781288146973, "global_step": 326061, "epoch": 1940} {"train_loss": -11.999489784240723, "global_step": 326062, "epoch": 1940} {"train_loss": -11.069190979003906, "global_step": 326063, "epoch": 1940} {"train_loss": -11.500308990478516, "global_step": 326064, "epoch": 1940} {"train_loss": -12.131475448608398, "global_step": 326065, "epoch": 1940} {"train_loss": -11.195028305053711, "global_step": 326066, "epoch": 1940} {"train_loss": -12.131173133850098, "global_step": 326067, "epoch": 1940} {"train_loss": -11.771504402160645, "global_step": 326068, "epoch": 1940} {"train_loss": -11.53143310546875, "global_step": 326069, "epoch": 1940} {"train_loss": -11.459836959838867, "global_step": 326070, "epoch": 1940} {"train_loss": -11.891756057739258, "global_step": 326071, "epoch": 1940} {"train_loss": -11.157805442810059, "global_step": 326072, "epoch": 1940} {"train_loss": -10.850566864013672, "global_step": 326073, "epoch": 1940} {"train_loss": -11.018767356872559, "global_step": 326074, "epoch": 1940} {"train_loss": -11.384883880615234, "global_step": 326075, "epoch": 1940} {"train_loss": -10.760523796081543, "global_step": 326076, "epoch": 1940} {"train_loss": -10.477558135986328, "global_step": 326077, "epoch": 1940} {"train_loss": -9.918055534362793, "global_step": 326078, "epoch": 1940} {"train_loss": -11.579978942871094, "global_step": 326079, "epoch": 1940} {"train_loss": -9.562868118286133, "global_step": 326080, "epoch": 1940} {"train_loss": -11.073076248168945, "global_step": 326081, "epoch": 1940} {"train_loss": -10.7128324508667, "global_step": 326082, "epoch": 1940} {"train_loss": -10.235860824584961, "global_step": 326083, "epoch": 1940} {"train_loss": -10.1159029006958, "global_step": 326084, "epoch": 1940} {"train_loss": -10.504544258117676, "global_step": 326085, "epoch": 1940} {"train_loss": -10.3217134475708, "global_step": 326086, "epoch": 1940} {"train_loss": -11.88230378287179, "global_step": 326087, "epoch": 1940, "val_loss": 283449.03125, "train_action_mse_error": 3.0119237899780273} {"train_loss": -10.92313289642334, "global_step": 326088, "epoch": 1941} {"train_loss": -9.196653366088867, "global_step": 326089, "epoch": 1941} {"train_loss": -10.487164497375488, "global_step": 326090, "epoch": 1941} {"train_loss": -9.120941162109375, "global_step": 326091, "epoch": 1941} {"train_loss": -10.546035766601562, "global_step": 326092, "epoch": 1941} {"train_loss": -9.588512420654297, "global_step": 326093, "epoch": 1941} {"train_loss": -11.100972175598145, "global_step": 326094, "epoch": 1941} {"train_loss": -9.440704345703125, "global_step": 326095, "epoch": 1941} {"train_loss": -11.671102523803711, "global_step": 326096, "epoch": 1941} {"train_loss": -10.051478385925293, "global_step": 326097, "epoch": 1941} {"train_loss": -10.851205825805664, "global_step": 326098, "epoch": 1941} {"train_loss": -10.88525104522705, "global_step": 326099, "epoch": 1941} {"train_loss": -11.109392166137695, "global_step": 326100, "epoch": 1941} {"train_loss": -10.853755950927734, "global_step": 326101, "epoch": 1941} {"train_loss": -11.541010856628418, "global_step": 326102, "epoch": 1941} {"train_loss": -10.544018745422363, "global_step": 326103, "epoch": 1941} {"train_loss": -11.436713218688965, "global_step": 326104, "epoch": 1941} {"train_loss": -10.816308975219727, "global_step": 326105, "epoch": 1941} {"train_loss": -11.41751766204834, "global_step": 326106, "epoch": 1941} {"train_loss": -10.547754287719727, "global_step": 326107, "epoch": 1941} {"train_loss": -11.065927505493164, "global_step": 326108, "epoch": 1941} {"train_loss": -11.563159942626953, "global_step": 326109, "epoch": 1941} {"train_loss": -11.721647262573242, "global_step": 326110, "epoch": 1941} {"train_loss": -11.297733306884766, "global_step": 326111, "epoch": 1941} {"train_loss": -11.702970504760742, "global_step": 326112, "epoch": 1941} {"train_loss": -11.413433074951172, "global_step": 326113, "epoch": 1941} {"train_loss": -11.369885444641113, "global_step": 326114, "epoch": 1941} {"train_loss": -11.531783103942871, "global_step": 326115, "epoch": 1941} {"train_loss": -11.183459281921387, "global_step": 326116, "epoch": 1941} {"train_loss": -11.649242401123047, "global_step": 326117, "epoch": 1941} {"train_loss": -11.370187759399414, "global_step": 326118, "epoch": 1941} {"train_loss": -11.42277717590332, "global_step": 326119, "epoch": 1941} {"train_loss": -11.819597244262695, "global_step": 326120, "epoch": 1941} {"train_loss": -11.657087326049805, "global_step": 326121, "epoch": 1941} {"train_loss": -11.525544166564941, "global_step": 326122, "epoch": 1941} {"train_loss": -11.970637321472168, "global_step": 326123, "epoch": 1941} {"train_loss": -11.9716157913208, "global_step": 326124, "epoch": 1941} {"train_loss": -11.987503051757812, "global_step": 326125, "epoch": 1941} {"train_loss": -11.757628440856934, "global_step": 326126, "epoch": 1941} {"train_loss": -11.881664276123047, "global_step": 326127, "epoch": 1941} {"train_loss": -11.724141120910645, "global_step": 326128, "epoch": 1941} {"train_loss": -11.850991249084473, "global_step": 326129, "epoch": 1941} {"train_loss": -11.93205451965332, "global_step": 326130, "epoch": 1941} {"train_loss": -11.591943740844727, "global_step": 326131, "epoch": 1941} {"train_loss": -11.947885513305664, "global_step": 326132, "epoch": 1941} {"train_loss": -11.751571655273438, "global_step": 326133, "epoch": 1941} {"train_loss": -11.781776428222656, "global_step": 326134, "epoch": 1941} {"train_loss": -12.151376724243164, "global_step": 326135, "epoch": 1941} {"train_loss": -11.80290412902832, "global_step": 326136, "epoch": 1941} {"train_loss": -11.97139835357666, "global_step": 326137, "epoch": 1941} {"train_loss": -12.023772239685059, "global_step": 326138, "epoch": 1941} {"train_loss": -12.022432327270508, "global_step": 326139, "epoch": 1941} {"train_loss": -12.066761016845703, "global_step": 326140, "epoch": 1941} {"train_loss": -11.916353225708008, "global_step": 326141, "epoch": 1941} {"train_loss": -11.912925720214844, "global_step": 326142, "epoch": 1941} {"train_loss": -12.114629745483398, "global_step": 326143, "epoch": 1941} {"train_loss": -12.044417381286621, "global_step": 326144, "epoch": 1941} {"train_loss": -12.091196060180664, "global_step": 326145, "epoch": 1941} {"train_loss": -12.099218368530273, "global_step": 326146, "epoch": 1941} {"train_loss": -12.217769622802734, "global_step": 326147, "epoch": 1941} {"train_loss": -12.276029586791992, "global_step": 326148, "epoch": 1941} {"train_loss": -12.24769401550293, "global_step": 326149, "epoch": 1941} {"train_loss": -12.258099555969238, "global_step": 326150, "epoch": 1941} {"train_loss": -12.175581932067871, "global_step": 326151, "epoch": 1941} {"train_loss": -12.201370239257812, "global_step": 326152, "epoch": 1941} {"train_loss": -12.448953628540039, "global_step": 326153, "epoch": 1941} {"train_loss": -11.874345779418945, "global_step": 326154, "epoch": 1941} {"train_loss": -12.379666328430176, "global_step": 326155, "epoch": 1941} {"train_loss": -12.281135559082031, "global_step": 326156, "epoch": 1941} {"train_loss": -12.37810230255127, "global_step": 326157, "epoch": 1941} {"train_loss": -12.143903732299805, "global_step": 326158, "epoch": 1941} {"train_loss": -12.378071784973145, "global_step": 326159, "epoch": 1941} {"train_loss": -12.19668960571289, "global_step": 326160, "epoch": 1941} {"train_loss": -12.336104393005371, "global_step": 326161, "epoch": 1941} {"train_loss": -12.315620422363281, "global_step": 326162, "epoch": 1941} {"train_loss": -12.301725387573242, "global_step": 326163, "epoch": 1941} {"train_loss": -12.315851211547852, "global_step": 326164, "epoch": 1941} {"train_loss": -12.435333251953125, "global_step": 326165, "epoch": 1941} {"train_loss": -12.335786819458008, "global_step": 326166, "epoch": 1941} {"train_loss": -12.284747123718262, "global_step": 326167, "epoch": 1941} {"train_loss": -12.146186828613281, "global_step": 326168, "epoch": 1941} {"train_loss": -12.51402473449707, "global_step": 326169, "epoch": 1941} {"train_loss": -12.211398124694824, "global_step": 326170, "epoch": 1941} {"train_loss": -12.290555953979492, "global_step": 326171, "epoch": 1941} {"train_loss": -12.175849914550781, "global_step": 326172, "epoch": 1941} {"train_loss": -12.41970443725586, "global_step": 326173, "epoch": 1941} {"train_loss": -12.331690788269043, "global_step": 326174, "epoch": 1941} {"train_loss": -12.545170783996582, "global_step": 326175, "epoch": 1941} {"train_loss": -12.321142196655273, "global_step": 326176, "epoch": 1941} {"train_loss": -12.15788459777832, "global_step": 326177, "epoch": 1941} {"train_loss": -12.269453048706055, "global_step": 326178, "epoch": 1941} {"train_loss": -12.29053020477295, "global_step": 326179, "epoch": 1941} {"train_loss": -12.400293350219727, "global_step": 326180, "epoch": 1941} {"train_loss": -12.316596984863281, "global_step": 326181, "epoch": 1941} {"train_loss": -12.243993759155273, "global_step": 326182, "epoch": 1941} {"train_loss": -12.399248123168945, "global_step": 326183, "epoch": 1941} {"train_loss": -12.513643264770508, "global_step": 326184, "epoch": 1941} {"train_loss": -12.160085678100586, "global_step": 326185, "epoch": 1941} {"train_loss": -12.189929008483887, "global_step": 326186, "epoch": 1941} {"train_loss": -12.240846633911133, "global_step": 326187, "epoch": 1941} {"train_loss": -11.72978687286377, "global_step": 326188, "epoch": 1941} {"train_loss": -12.704041481018066, "global_step": 326189, "epoch": 1941} {"train_loss": -12.00960636138916, "global_step": 326190, "epoch": 1941} {"train_loss": -12.614811897277832, "global_step": 326191, "epoch": 1941} {"train_loss": -12.192390441894531, "global_step": 326192, "epoch": 1941} {"train_loss": -12.379094123840332, "global_step": 326193, "epoch": 1941} {"train_loss": -12.498968124389648, "global_step": 326194, "epoch": 1941} {"train_loss": -12.458765029907227, "global_step": 326195, "epoch": 1941} {"train_loss": -12.491610527038574, "global_step": 326196, "epoch": 1941} {"train_loss": -12.417993545532227, "global_step": 326197, "epoch": 1941} {"train_loss": -12.72419548034668, "global_step": 326198, "epoch": 1941} {"train_loss": -12.46666145324707, "global_step": 326199, "epoch": 1941} {"train_loss": -12.450336456298828, "global_step": 326200, "epoch": 1941} {"train_loss": -12.65256118774414, "global_step": 326201, "epoch": 1941} {"train_loss": -12.18307876586914, "global_step": 326202, "epoch": 1941} {"train_loss": -12.408720016479492, "global_step": 326203, "epoch": 1941} {"train_loss": -12.559188842773438, "global_step": 326204, "epoch": 1941} {"train_loss": -12.303037643432617, "global_step": 326205, "epoch": 1941} {"train_loss": -12.395130157470703, "global_step": 326206, "epoch": 1941} {"train_loss": -12.502031326293945, "global_step": 326207, "epoch": 1941} {"train_loss": -11.832576751708984, "global_step": 326208, "epoch": 1941} {"train_loss": -12.077695846557617, "global_step": 326209, "epoch": 1941} {"train_loss": -12.320478439331055, "global_step": 326210, "epoch": 1941} {"train_loss": -12.090163230895996, "global_step": 326211, "epoch": 1941} {"train_loss": -11.701080322265625, "global_step": 326212, "epoch": 1941} {"train_loss": -11.681068420410156, "global_step": 326213, "epoch": 1941} {"train_loss": -12.57354736328125, "global_step": 326214, "epoch": 1941} {"train_loss": -12.172280311584473, "global_step": 326215, "epoch": 1941} {"train_loss": -12.037946701049805, "global_step": 326216, "epoch": 1941} {"train_loss": -11.3336181640625, "global_step": 326217, "epoch": 1941} {"train_loss": -12.002632141113281, "global_step": 326218, "epoch": 1941} {"train_loss": -9.954081535339355, "global_step": 326219, "epoch": 1941} {"train_loss": -12.046064376831055, "global_step": 326220, "epoch": 1941} {"train_loss": -11.256937026977539, "global_step": 326221, "epoch": 1941} {"train_loss": -10.401382446289062, "global_step": 326222, "epoch": 1941} {"train_loss": -11.451292037963867, "global_step": 326223, "epoch": 1941} {"train_loss": -10.181059837341309, "global_step": 326224, "epoch": 1941} {"train_loss": -9.703289985656738, "global_step": 326225, "epoch": 1941} {"train_loss": -12.188652038574219, "global_step": 326226, "epoch": 1941} {"train_loss": -10.3714017868042, "global_step": 326227, "epoch": 1941} {"train_loss": -10.779388427734375, "global_step": 326228, "epoch": 1941} {"train_loss": -12.16776180267334, "global_step": 326229, "epoch": 1941} {"train_loss": -11.383302688598633, "global_step": 326230, "epoch": 1941} {"train_loss": -11.85128116607666, "global_step": 326231, "epoch": 1941} {"train_loss": -11.64571762084961, "global_step": 326232, "epoch": 1941} {"train_loss": -11.07351303100586, "global_step": 326233, "epoch": 1941} {"train_loss": -11.830266952514648, "global_step": 326234, "epoch": 1941} {"train_loss": -11.444429397583008, "global_step": 326235, "epoch": 1941} {"train_loss": -11.340526580810547, "global_step": 326236, "epoch": 1941} {"train_loss": -11.59639835357666, "global_step": 326237, "epoch": 1941} {"train_loss": -11.115743637084961, "global_step": 326238, "epoch": 1941} {"train_loss": -12.182317733764648, "global_step": 326239, "epoch": 1941} {"train_loss": -11.004545211791992, "global_step": 326240, "epoch": 1941} {"train_loss": -11.993910789489746, "global_step": 326241, "epoch": 1941} {"train_loss": -11.233909606933594, "global_step": 326242, "epoch": 1941} {"train_loss": -12.019660949707031, "global_step": 326243, "epoch": 1941} {"train_loss": -11.358322143554688, "global_step": 326244, "epoch": 1941} {"train_loss": -11.934505462646484, "global_step": 326245, "epoch": 1941} {"train_loss": -11.685523986816406, "global_step": 326246, "epoch": 1941} {"train_loss": -11.539022445678711, "global_step": 326247, "epoch": 1941} {"train_loss": -12.0410737991333, "global_step": 326248, "epoch": 1941} {"train_loss": -11.185070037841797, "global_step": 326249, "epoch": 1941} {"train_loss": -11.729618072509766, "global_step": 326250, "epoch": 1941} {"train_loss": -11.562960624694824, "global_step": 326251, "epoch": 1941} {"train_loss": -11.33836841583252, "global_step": 326252, "epoch": 1941} {"train_loss": -11.971203804016113, "global_step": 326253, "epoch": 1941} {"train_loss": -11.62828254699707, "global_step": 326254, "epoch": 1941} {"train_loss": -11.765390912691752, "global_step": 326255, "epoch": 1941, "val_loss": 288258.25} {"train_loss": -11.488225936889648, "global_step": 326256, "epoch": 1942} {"train_loss": -10.91792106628418, "global_step": 326257, "epoch": 1942} {"train_loss": -11.73440170288086, "global_step": 326258, "epoch": 1942} {"train_loss": -11.596071243286133, "global_step": 326259, "epoch": 1942} {"train_loss": -12.031770706176758, "global_step": 326260, "epoch": 1942} {"train_loss": -11.964568138122559, "global_step": 326261, "epoch": 1942} {"train_loss": -12.09451961517334, "global_step": 326262, "epoch": 1942} {"train_loss": -11.982540130615234, "global_step": 326263, "epoch": 1942} {"train_loss": -11.847134590148926, "global_step": 326264, "epoch": 1942} {"train_loss": -12.147970199584961, "global_step": 326265, "epoch": 1942} {"train_loss": -12.099760055541992, "global_step": 326266, "epoch": 1942} {"train_loss": -12.126838684082031, "global_step": 326267, "epoch": 1942} {"train_loss": -12.320295333862305, "global_step": 326268, "epoch": 1942} {"train_loss": -12.019786834716797, "global_step": 326269, "epoch": 1942} {"train_loss": -12.216882705688477, "global_step": 326270, "epoch": 1942} {"train_loss": -12.14993667602539, "global_step": 326271, "epoch": 1942} {"train_loss": -12.30160140991211, "global_step": 326272, "epoch": 1942} {"train_loss": -12.246088981628418, "global_step": 326273, "epoch": 1942} {"train_loss": -12.243678092956543, "global_step": 326274, "epoch": 1942} {"train_loss": -12.304039001464844, "global_step": 326275, "epoch": 1942} {"train_loss": -12.427742958068848, "global_step": 326276, "epoch": 1942} {"train_loss": -12.384817123413086, "global_step": 326277, "epoch": 1942} {"train_loss": -12.019726753234863, "global_step": 326278, "epoch": 1942} {"train_loss": -12.268133163452148, "global_step": 326279, "epoch": 1942} {"train_loss": -11.856542587280273, "global_step": 326280, "epoch": 1942} {"train_loss": -12.276671409606934, "global_step": 326281, "epoch": 1942} {"train_loss": -12.141763687133789, "global_step": 326282, "epoch": 1942} {"train_loss": -12.252175331115723, "global_step": 326283, "epoch": 1942} {"train_loss": -12.405732154846191, "global_step": 326284, "epoch": 1942} {"train_loss": -12.175034523010254, "global_step": 326285, "epoch": 1942} {"train_loss": -12.398224830627441, "global_step": 326286, "epoch": 1942} {"train_loss": -12.05540657043457, "global_step": 326287, "epoch": 1942} {"train_loss": -12.391033172607422, "global_step": 326288, "epoch": 1942} {"train_loss": -12.298861503601074, "global_step": 326289, "epoch": 1942} {"train_loss": -12.328771591186523, "global_step": 326290, "epoch": 1942} {"train_loss": -12.420858383178711, "global_step": 326291, "epoch": 1942} {"train_loss": -12.371363639831543, "global_step": 326292, "epoch": 1942} {"train_loss": -12.258719444274902, "global_step": 326293, "epoch": 1942} {"train_loss": -12.27108097076416, "global_step": 326294, "epoch": 1942} {"train_loss": -12.157464981079102, "global_step": 326295, "epoch": 1942} {"train_loss": -12.41420841217041, "global_step": 326296, "epoch": 1942} {"train_loss": -12.26230239868164, "global_step": 326297, "epoch": 1942} {"train_loss": -12.194149017333984, "global_step": 326298, "epoch": 1942} {"train_loss": -12.312212944030762, "global_step": 326299, "epoch": 1942} {"train_loss": -12.178445816040039, "global_step": 326300, "epoch": 1942} {"train_loss": -12.127689361572266, "global_step": 326301, "epoch": 1942} {"train_loss": -12.386869430541992, "global_step": 326302, "epoch": 1942} {"train_loss": -12.171846389770508, "global_step": 326303, "epoch": 1942} {"train_loss": -11.936220169067383, "global_step": 326304, "epoch": 1942} {"train_loss": -12.25200080871582, "global_step": 326305, "epoch": 1942} {"train_loss": -11.992785453796387, "global_step": 326306, "epoch": 1942} {"train_loss": -12.409770011901855, "global_step": 326307, "epoch": 1942} {"train_loss": -11.737485885620117, "global_step": 326308, "epoch": 1942} {"train_loss": -11.916032791137695, "global_step": 326309, "epoch": 1942} {"train_loss": -11.973841667175293, "global_step": 326310, "epoch": 1942} {"train_loss": -11.09265422821045, "global_step": 326311, "epoch": 1942} {"train_loss": -12.045010566711426, "global_step": 326312, "epoch": 1942} {"train_loss": -11.686127662658691, "global_step": 326313, "epoch": 1942} {"train_loss": -12.057205200195312, "global_step": 326314, "epoch": 1942} {"train_loss": -12.246267318725586, "global_step": 326315, "epoch": 1942} {"train_loss": -11.943744659423828, "global_step": 326316, "epoch": 1942} {"train_loss": -12.405332565307617, "global_step": 326317, "epoch": 1942} {"train_loss": -11.375786781311035, "global_step": 326318, "epoch": 1942} {"train_loss": -12.349656105041504, "global_step": 326319, "epoch": 1942} {"train_loss": -11.310176849365234, "global_step": 326320, "epoch": 1942} {"train_loss": -11.32992935180664, "global_step": 326321, "epoch": 1942} {"train_loss": -12.021159172058105, "global_step": 326322, "epoch": 1942} {"train_loss": -11.791248321533203, "global_step": 326323, "epoch": 1942} {"train_loss": -12.124715805053711, "global_step": 326324, "epoch": 1942} {"train_loss": -11.745668411254883, "global_step": 326325, "epoch": 1942} {"train_loss": -12.093466758728027, "global_step": 326326, "epoch": 1942} {"train_loss": -11.803791046142578, "global_step": 326327, "epoch": 1942} {"train_loss": -12.101616859436035, "global_step": 326328, "epoch": 1942} {"train_loss": -11.843263626098633, "global_step": 326329, "epoch": 1942} {"train_loss": -11.063425064086914, "global_step": 326330, "epoch": 1942} {"train_loss": -12.435967445373535, "global_step": 326331, "epoch": 1942} {"train_loss": -11.220279693603516, "global_step": 326332, "epoch": 1942} {"train_loss": -11.909592628479004, "global_step": 326333, "epoch": 1942} {"train_loss": -11.0780029296875, "global_step": 326334, "epoch": 1942} {"train_loss": -11.53321647644043, "global_step": 326335, "epoch": 1942} {"train_loss": -12.080175399780273, "global_step": 326336, "epoch": 1942} {"train_loss": -11.074132919311523, "global_step": 326337, "epoch": 1942} {"train_loss": -12.379303932189941, "global_step": 326338, "epoch": 1942} {"train_loss": -11.830122947692871, "global_step": 326339, "epoch": 1942} {"train_loss": -11.879168510437012, "global_step": 326340, "epoch": 1942} {"train_loss": -12.022354125976562, "global_step": 326341, "epoch": 1942} {"train_loss": -12.199204444885254, "global_step": 326342, "epoch": 1942} {"train_loss": -12.104087829589844, "global_step": 326343, "epoch": 1942} {"train_loss": -11.967572212219238, "global_step": 326344, "epoch": 1942} {"train_loss": -12.183969497680664, "global_step": 326345, "epoch": 1942} {"train_loss": -11.810937881469727, "global_step": 326346, "epoch": 1942} {"train_loss": -12.367331504821777, "global_step": 326347, "epoch": 1942} {"train_loss": -12.243188858032227, "global_step": 326348, "epoch": 1942} {"train_loss": -12.173576354980469, "global_step": 326349, "epoch": 1942} {"train_loss": -12.304914474487305, "global_step": 326350, "epoch": 1942} {"train_loss": -12.172735214233398, "global_step": 326351, "epoch": 1942} {"train_loss": -12.425743103027344, "global_step": 326352, "epoch": 1942} {"train_loss": -12.164731979370117, "global_step": 326353, "epoch": 1942} {"train_loss": -11.714893341064453, "global_step": 326354, "epoch": 1942} {"train_loss": -12.35993766784668, "global_step": 326355, "epoch": 1942} {"train_loss": -12.131155967712402, "global_step": 326356, "epoch": 1942} {"train_loss": -12.081014633178711, "global_step": 326357, "epoch": 1942} {"train_loss": -12.409809112548828, "global_step": 326358, "epoch": 1942} {"train_loss": -12.177302360534668, "global_step": 326359, "epoch": 1942} {"train_loss": -12.246930122375488, "global_step": 326360, "epoch": 1942} {"train_loss": -12.380702018737793, "global_step": 326361, "epoch": 1942} {"train_loss": -12.34832763671875, "global_step": 326362, "epoch": 1942} {"train_loss": -12.36572265625, "global_step": 326363, "epoch": 1942} {"train_loss": -12.336065292358398, "global_step": 326364, "epoch": 1942} {"train_loss": -12.297552108764648, "global_step": 326365, "epoch": 1942} {"train_loss": -12.383005142211914, "global_step": 326366, "epoch": 1942} {"train_loss": -12.371099472045898, "global_step": 326367, "epoch": 1942} {"train_loss": -12.24756908416748, "global_step": 326368, "epoch": 1942} {"train_loss": -12.326295852661133, "global_step": 326369, "epoch": 1942} {"train_loss": -12.100570678710938, "global_step": 326370, "epoch": 1942} {"train_loss": -12.017801284790039, "global_step": 326371, "epoch": 1942} {"train_loss": -12.396018981933594, "global_step": 326372, "epoch": 1942} {"train_loss": -11.814252853393555, "global_step": 326373, "epoch": 1942} {"train_loss": -11.637237548828125, "global_step": 326374, "epoch": 1942} {"train_loss": -12.153386116027832, "global_step": 326375, "epoch": 1942} {"train_loss": -11.448935508728027, "global_step": 326376, "epoch": 1942} {"train_loss": -11.374627113342285, "global_step": 326377, "epoch": 1942} {"train_loss": -12.255797386169434, "global_step": 326378, "epoch": 1942} {"train_loss": -12.024482727050781, "global_step": 326379, "epoch": 1942} {"train_loss": -11.206533432006836, "global_step": 326380, "epoch": 1942} {"train_loss": -11.726511001586914, "global_step": 326381, "epoch": 1942} {"train_loss": -11.116710662841797, "global_step": 326382, "epoch": 1942} {"train_loss": -10.529394149780273, "global_step": 326383, "epoch": 1942} {"train_loss": -10.105859756469727, "global_step": 326384, "epoch": 1942} {"train_loss": -11.49738883972168, "global_step": 326385, "epoch": 1942} {"train_loss": -9.558381080627441, "global_step": 326386, "epoch": 1942} {"train_loss": -11.690567016601562, "global_step": 326387, "epoch": 1942} {"train_loss": -10.95341682434082, "global_step": 326388, "epoch": 1942} {"train_loss": -10.078531265258789, "global_step": 326389, "epoch": 1942} {"train_loss": -11.787212371826172, "global_step": 326390, "epoch": 1942} {"train_loss": -11.39091682434082, "global_step": 326391, "epoch": 1942} {"train_loss": -10.454389572143555, "global_step": 326392, "epoch": 1942} {"train_loss": -12.272724151611328, "global_step": 326393, "epoch": 1942} {"train_loss": -11.11260986328125, "global_step": 326394, "epoch": 1942} {"train_loss": -11.939130783081055, "global_step": 326395, "epoch": 1942} {"train_loss": -11.53113842010498, "global_step": 326396, "epoch": 1942} {"train_loss": -10.33243179321289, "global_step": 326397, "epoch": 1942} {"train_loss": -10.052385330200195, "global_step": 326398, "epoch": 1942} {"train_loss": -10.338935852050781, "global_step": 326399, "epoch": 1942} {"train_loss": -10.612066268920898, "global_step": 326400, "epoch": 1942} {"train_loss": -10.252057075500488, "global_step": 326401, "epoch": 1942} {"train_loss": -10.908243179321289, "global_step": 326402, "epoch": 1942} {"train_loss": -10.832454681396484, "global_step": 326403, "epoch": 1942} {"train_loss": -11.127775192260742, "global_step": 326404, "epoch": 1942} {"train_loss": -11.225103378295898, "global_step": 326405, "epoch": 1942} {"train_loss": -11.039874076843262, "global_step": 326406, "epoch": 1942} {"train_loss": -10.485156059265137, "global_step": 326407, "epoch": 1942} {"train_loss": -11.471611976623535, "global_step": 326408, "epoch": 1942} {"train_loss": -11.34072494506836, "global_step": 326409, "epoch": 1942} {"train_loss": -11.307158470153809, "global_step": 326410, "epoch": 1942} {"train_loss": -11.684610366821289, "global_step": 326411, "epoch": 1942} {"train_loss": -11.374116897583008, "global_step": 326412, "epoch": 1942} {"train_loss": -11.25661849975586, "global_step": 326413, "epoch": 1942} {"train_loss": -11.4152250289917, "global_step": 326414, "epoch": 1942} {"train_loss": -11.542808532714844, "global_step": 326415, "epoch": 1942} {"train_loss": -11.40064811706543, "global_step": 326416, "epoch": 1942} {"train_loss": -11.663827896118164, "global_step": 326417, "epoch": 1942} {"train_loss": -11.378058433532715, "global_step": 326418, "epoch": 1942} {"train_loss": -11.716202735900879, "global_step": 326419, "epoch": 1942} {"train_loss": -11.75782585144043, "global_step": 326420, "epoch": 1942} {"train_loss": -11.658327102661133, "global_step": 326421, "epoch": 1942} {"train_loss": -12.170430183410645, "global_step": 326422, "epoch": 1942} {"train_loss": -11.818107173556374, "global_step": 326423, "epoch": 1942, "val_loss": 281992.3125} {"train_loss": -12.043853759765625, "global_step": 326424, "epoch": 1943} {"train_loss": -11.77743911743164, "global_step": 326425, "epoch": 1943} {"train_loss": -11.62125015258789, "global_step": 326426, "epoch": 1943} {"train_loss": -12.09096908569336, "global_step": 326427, "epoch": 1943} {"train_loss": -11.976507186889648, "global_step": 326428, "epoch": 1943} {"train_loss": -11.98930549621582, "global_step": 326429, "epoch": 1943} {"train_loss": -11.960269927978516, "global_step": 326430, "epoch": 1943} {"train_loss": -12.185728073120117, "global_step": 326431, "epoch": 1943} {"train_loss": -12.244340896606445, "global_step": 326432, "epoch": 1943} {"train_loss": -12.260778427124023, "global_step": 326433, "epoch": 1943} {"train_loss": -12.411994934082031, "global_step": 326434, "epoch": 1943} {"train_loss": -12.121725082397461, "global_step": 326435, "epoch": 1943} {"train_loss": -12.177486419677734, "global_step": 326436, "epoch": 1943} {"train_loss": -12.092256546020508, "global_step": 326437, "epoch": 1943} {"train_loss": -12.132527351379395, "global_step": 326438, "epoch": 1943} {"train_loss": -12.179450988769531, "global_step": 326439, "epoch": 1943} {"train_loss": -12.175027847290039, "global_step": 326440, "epoch": 1943} {"train_loss": -12.207595825195312, "global_step": 326441, "epoch": 1943} {"train_loss": -11.914621353149414, "global_step": 326442, "epoch": 1943} {"train_loss": -12.151476860046387, "global_step": 326443, "epoch": 1943} {"train_loss": -12.458379745483398, "global_step": 326444, "epoch": 1943} {"train_loss": -12.270652770996094, "global_step": 326445, "epoch": 1943} {"train_loss": -12.259177207946777, "global_step": 326446, "epoch": 1943} {"train_loss": -12.232008934020996, "global_step": 326447, "epoch": 1943} {"train_loss": -12.234136581420898, "global_step": 326448, "epoch": 1943} {"train_loss": -12.390539169311523, "global_step": 326449, "epoch": 1943} {"train_loss": -12.288825988769531, "global_step": 326450, "epoch": 1943} {"train_loss": -12.535625457763672, "global_step": 326451, "epoch": 1943} {"train_loss": -12.141332626342773, "global_step": 326452, "epoch": 1943} {"train_loss": -12.289250373840332, "global_step": 326453, "epoch": 1943} {"train_loss": -12.404745101928711, "global_step": 326454, "epoch": 1943} {"train_loss": -12.462048530578613, "global_step": 326455, "epoch": 1943} {"train_loss": -12.5098876953125, "global_step": 326456, "epoch": 1943} {"train_loss": -12.588432312011719, "global_step": 326457, "epoch": 1943} {"train_loss": -12.512237548828125, "global_step": 326458, "epoch": 1943} {"train_loss": -12.592409133911133, "global_step": 326459, "epoch": 1943} {"train_loss": -12.547697067260742, "global_step": 326460, "epoch": 1943} {"train_loss": -12.501713752746582, "global_step": 326461, "epoch": 1943} {"train_loss": -12.426892280578613, "global_step": 326462, "epoch": 1943} {"train_loss": -12.379873275756836, "global_step": 326463, "epoch": 1943} {"train_loss": -12.512447357177734, "global_step": 326464, "epoch": 1943} {"train_loss": -12.563270568847656, "global_step": 326465, "epoch": 1943} {"train_loss": -12.246379852294922, "global_step": 326466, "epoch": 1943} {"train_loss": -12.20051383972168, "global_step": 326467, "epoch": 1943} {"train_loss": -12.531004905700684, "global_step": 326468, "epoch": 1943} {"train_loss": -12.309587478637695, "global_step": 326469, "epoch": 1943} {"train_loss": -12.362849235534668, "global_step": 326470, "epoch": 1943} {"train_loss": -12.724763870239258, "global_step": 326471, "epoch": 1943} {"train_loss": -12.250205993652344, "global_step": 326472, "epoch": 1943} {"train_loss": -11.690552711486816, "global_step": 326473, "epoch": 1943} {"train_loss": -11.992819786071777, "global_step": 326474, "epoch": 1943} {"train_loss": -12.43105697631836, "global_step": 326475, "epoch": 1943} {"train_loss": -12.495275497436523, "global_step": 326476, "epoch": 1943} {"train_loss": -12.31580924987793, "global_step": 326477, "epoch": 1943} {"train_loss": -12.45348834991455, "global_step": 326478, "epoch": 1943} {"train_loss": -12.376676559448242, "global_step": 326479, "epoch": 1943} {"train_loss": -12.107990264892578, "global_step": 326480, "epoch": 1943} {"train_loss": -12.299582481384277, "global_step": 326481, "epoch": 1943} {"train_loss": -12.452744483947754, "global_step": 326482, "epoch": 1943} {"train_loss": -12.147770881652832, "global_step": 326483, "epoch": 1943} {"train_loss": -12.012697219848633, "global_step": 326484, "epoch": 1943} {"train_loss": -12.083223342895508, "global_step": 326485, "epoch": 1943} {"train_loss": -12.228681564331055, "global_step": 326486, "epoch": 1943} {"train_loss": -12.554075241088867, "global_step": 326487, "epoch": 1943} {"train_loss": -12.177790641784668, "global_step": 326488, "epoch": 1943} {"train_loss": -12.520421981811523, "global_step": 326489, "epoch": 1943} {"train_loss": -12.344122886657715, "global_step": 326490, "epoch": 1943} {"train_loss": -12.41229248046875, "global_step": 326491, "epoch": 1943} {"train_loss": -12.45554256439209, "global_step": 326492, "epoch": 1943} {"train_loss": -11.953489303588867, "global_step": 326493, "epoch": 1943} {"train_loss": -12.080301284790039, "global_step": 326494, "epoch": 1943} {"train_loss": -12.436067581176758, "global_step": 326495, "epoch": 1943} {"train_loss": -11.784948348999023, "global_step": 326496, "epoch": 1943} {"train_loss": -12.156725883483887, "global_step": 326497, "epoch": 1943} {"train_loss": -12.577916145324707, "global_step": 326498, "epoch": 1943} {"train_loss": -12.405054092407227, "global_step": 326499, "epoch": 1943} {"train_loss": -12.319565773010254, "global_step": 326500, "epoch": 1943} {"train_loss": -12.010251998901367, "global_step": 326501, "epoch": 1943} {"train_loss": -12.047338485717773, "global_step": 326502, "epoch": 1943} {"train_loss": -12.210111618041992, "global_step": 326503, "epoch": 1943} {"train_loss": -12.521326065063477, "global_step": 326504, "epoch": 1943} {"train_loss": -12.423633575439453, "global_step": 326505, "epoch": 1943} {"train_loss": -12.391312599182129, "global_step": 326506, "epoch": 1943} {"train_loss": -12.40854549407959, "global_step": 326507, "epoch": 1943} {"train_loss": -12.365852355957031, "global_step": 326508, "epoch": 1943} {"train_loss": -12.405210494995117, "global_step": 326509, "epoch": 1943} {"train_loss": -12.27766227722168, "global_step": 326510, "epoch": 1943} {"train_loss": -12.171331405639648, "global_step": 326511, "epoch": 1943} {"train_loss": -12.452524185180664, "global_step": 326512, "epoch": 1943} {"train_loss": -12.523157119750977, "global_step": 326513, "epoch": 1943} {"train_loss": -12.253915786743164, "global_step": 326514, "epoch": 1943} {"train_loss": -12.024640083312988, "global_step": 326515, "epoch": 1943} {"train_loss": -12.592230796813965, "global_step": 326516, "epoch": 1943} {"train_loss": -11.871042251586914, "global_step": 326517, "epoch": 1943} {"train_loss": -11.92311954498291, "global_step": 326518, "epoch": 1943} {"train_loss": -12.550107955932617, "global_step": 326519, "epoch": 1943} {"train_loss": -12.371910095214844, "global_step": 326520, "epoch": 1943} {"train_loss": -11.977261543273926, "global_step": 326521, "epoch": 1943} {"train_loss": -12.153379440307617, "global_step": 326522, "epoch": 1943} {"train_loss": -12.388628005981445, "global_step": 326523, "epoch": 1943} {"train_loss": -12.153940200805664, "global_step": 326524, "epoch": 1943} {"train_loss": -12.346808433532715, "global_step": 326525, "epoch": 1943} {"train_loss": -12.268898010253906, "global_step": 326526, "epoch": 1943} {"train_loss": -11.93989372253418, "global_step": 326527, "epoch": 1943} {"train_loss": -12.034116744995117, "global_step": 326528, "epoch": 1943} {"train_loss": -11.861607551574707, "global_step": 326529, "epoch": 1943} {"train_loss": -11.681842803955078, "global_step": 326530, "epoch": 1943} {"train_loss": -12.265714645385742, "global_step": 326531, "epoch": 1943} {"train_loss": -12.03390121459961, "global_step": 326532, "epoch": 1943} {"train_loss": -11.783069610595703, "global_step": 326533, "epoch": 1943} {"train_loss": -11.94299602508545, "global_step": 326534, "epoch": 1943} {"train_loss": -11.991138458251953, "global_step": 326535, "epoch": 1943} {"train_loss": -10.560075759887695, "global_step": 326536, "epoch": 1943} {"train_loss": -12.004575729370117, "global_step": 326537, "epoch": 1943} {"train_loss": -11.604402542114258, "global_step": 326538, "epoch": 1943} {"train_loss": -11.534371376037598, "global_step": 326539, "epoch": 1943} {"train_loss": -11.902265548706055, "global_step": 326540, "epoch": 1943} {"train_loss": -12.142696380615234, "global_step": 326541, "epoch": 1943} {"train_loss": -10.958359718322754, "global_step": 326542, "epoch": 1943} {"train_loss": -11.106284141540527, "global_step": 326543, "epoch": 1943} {"train_loss": -11.958915710449219, "global_step": 326544, "epoch": 1943} {"train_loss": -11.101875305175781, "global_step": 326545, "epoch": 1943} {"train_loss": -10.803215026855469, "global_step": 326546, "epoch": 1943} {"train_loss": -11.287899017333984, "global_step": 326547, "epoch": 1943} {"train_loss": -11.969135284423828, "global_step": 326548, "epoch": 1943} {"train_loss": -11.399889945983887, "global_step": 326549, "epoch": 1943} {"train_loss": -11.968764305114746, "global_step": 326550, "epoch": 1943} {"train_loss": -10.98617935180664, "global_step": 326551, "epoch": 1943} {"train_loss": -10.941959381103516, "global_step": 326552, "epoch": 1943} {"train_loss": -10.833001136779785, "global_step": 326553, "epoch": 1943} {"train_loss": -11.716842651367188, "global_step": 326554, "epoch": 1943} {"train_loss": -10.667383193969727, "global_step": 326555, "epoch": 1943} {"train_loss": -11.592371940612793, "global_step": 326556, "epoch": 1943} {"train_loss": -10.38801383972168, "global_step": 326557, "epoch": 1943} {"train_loss": -10.121535301208496, "global_step": 326558, "epoch": 1943} {"train_loss": -11.326770782470703, "global_step": 326559, "epoch": 1943} {"train_loss": -9.988418579101562, "global_step": 326560, "epoch": 1943} {"train_loss": -9.463247299194336, "global_step": 326561, "epoch": 1943} {"train_loss": -11.33597183227539, "global_step": 326562, "epoch": 1943} {"train_loss": -10.274325370788574, "global_step": 326563, "epoch": 1943} {"train_loss": -10.438551902770996, "global_step": 326564, "epoch": 1943} {"train_loss": -11.655742645263672, "global_step": 326565, "epoch": 1943} {"train_loss": -11.053935050964355, "global_step": 326566, "epoch": 1943} {"train_loss": -11.485982894897461, "global_step": 326567, "epoch": 1943} {"train_loss": -11.492403030395508, "global_step": 326568, "epoch": 1943} {"train_loss": -11.400466918945312, "global_step": 326569, "epoch": 1943} {"train_loss": -11.623004913330078, "global_step": 326570, "epoch": 1943} {"train_loss": -10.768213272094727, "global_step": 326571, "epoch": 1943} {"train_loss": -11.798992156982422, "global_step": 326572, "epoch": 1943} {"train_loss": -10.643848419189453, "global_step": 326573, "epoch": 1943} {"train_loss": -11.711160659790039, "global_step": 326574, "epoch": 1943} {"train_loss": -10.515151023864746, "global_step": 326575, "epoch": 1943} {"train_loss": -11.278654098510742, "global_step": 326576, "epoch": 1943} {"train_loss": -11.759520530700684, "global_step": 326577, "epoch": 1943} {"train_loss": -11.497964859008789, "global_step": 326578, "epoch": 1943} {"train_loss": -12.041603088378906, "global_step": 326579, "epoch": 1943} {"train_loss": -11.940908432006836, "global_step": 326580, "epoch": 1943} {"train_loss": -11.663658142089844, "global_step": 326581, "epoch": 1943} {"train_loss": -12.015277862548828, "global_step": 326582, "epoch": 1943} {"train_loss": -11.512428283691406, "global_step": 326583, "epoch": 1943} {"train_loss": -11.973278045654297, "global_step": 326584, "epoch": 1943} {"train_loss": -11.70802116394043, "global_step": 326585, "epoch": 1943} {"train_loss": -11.558406829833984, "global_step": 326586, "epoch": 1943} {"train_loss": -11.83680534362793, "global_step": 326587, "epoch": 1943} {"train_loss": -11.923227310180664, "global_step": 326588, "epoch": 1943} {"train_loss": -12.006441116333008, "global_step": 326589, "epoch": 1943} {"train_loss": -11.628314018249512, "global_step": 326590, "epoch": 1943} {"train_loss": -11.938695918946038, "global_step": 326591, "epoch": 1943, "val_loss": 282213.625} {"train_loss": -11.704743385314941, "global_step": 326592, "epoch": 1944} {"train_loss": -11.536505699157715, "global_step": 326593, "epoch": 1944} {"train_loss": -11.599370956420898, "global_step": 326594, "epoch": 1944} {"train_loss": -11.80002212524414, "global_step": 326595, "epoch": 1944} {"train_loss": -11.711387634277344, "global_step": 326596, "epoch": 1944} {"train_loss": -11.599526405334473, "global_step": 326597, "epoch": 1944} {"train_loss": -11.326947212219238, "global_step": 326598, "epoch": 1944} {"train_loss": -11.728796005249023, "global_step": 326599, "epoch": 1944} {"train_loss": -11.549010276794434, "global_step": 326600, "epoch": 1944} {"train_loss": -11.778688430786133, "global_step": 326601, "epoch": 1944} {"train_loss": -11.60434341430664, "global_step": 326602, "epoch": 1944} {"train_loss": -11.600139617919922, "global_step": 326603, "epoch": 1944} {"train_loss": -11.423040390014648, "global_step": 326604, "epoch": 1944} {"train_loss": -11.66827392578125, "global_step": 326605, "epoch": 1944} {"train_loss": -11.09225082397461, "global_step": 326606, "epoch": 1944} {"train_loss": -11.76225757598877, "global_step": 326607, "epoch": 1944} {"train_loss": -11.780261993408203, "global_step": 326608, "epoch": 1944} {"train_loss": -11.440366744995117, "global_step": 326609, "epoch": 1944} {"train_loss": -12.09969425201416, "global_step": 326610, "epoch": 1944} {"train_loss": -11.264266967773438, "global_step": 326611, "epoch": 1944} {"train_loss": -12.095705032348633, "global_step": 326612, "epoch": 1944} {"train_loss": -11.565387725830078, "global_step": 326613, "epoch": 1944} {"train_loss": -11.557409286499023, "global_step": 326614, "epoch": 1944} {"train_loss": -12.00259017944336, "global_step": 326615, "epoch": 1944} {"train_loss": -11.306848526000977, "global_step": 326616, "epoch": 1944} {"train_loss": -12.085884094238281, "global_step": 326617, "epoch": 1944} {"train_loss": -11.782859802246094, "global_step": 326618, "epoch": 1944} {"train_loss": -11.749032020568848, "global_step": 326619, "epoch": 1944} {"train_loss": -12.11859130859375, "global_step": 326620, "epoch": 1944} {"train_loss": -11.550386428833008, "global_step": 326621, "epoch": 1944} {"train_loss": -12.110395431518555, "global_step": 326622, "epoch": 1944} {"train_loss": -11.824092864990234, "global_step": 326623, "epoch": 1944} {"train_loss": -11.892576217651367, "global_step": 326624, "epoch": 1944} {"train_loss": -12.107501983642578, "global_step": 326625, "epoch": 1944} {"train_loss": -12.021764755249023, "global_step": 326626, "epoch": 1944} {"train_loss": -12.18021011352539, "global_step": 326627, "epoch": 1944} {"train_loss": -12.126394271850586, "global_step": 326628, "epoch": 1944} {"train_loss": -11.942214012145996, "global_step": 326629, "epoch": 1944} {"train_loss": -11.942283630371094, "global_step": 326630, "epoch": 1944} {"train_loss": -12.109386444091797, "global_step": 326631, "epoch": 1944} {"train_loss": -12.08587646484375, "global_step": 326632, "epoch": 1944} {"train_loss": -12.226396560668945, "global_step": 326633, "epoch": 1944} {"train_loss": -12.440522193908691, "global_step": 326634, "epoch": 1944} {"train_loss": -12.169450759887695, "global_step": 326635, "epoch": 1944} {"train_loss": -12.38772201538086, "global_step": 326636, "epoch": 1944} {"train_loss": -12.147994995117188, "global_step": 326637, "epoch": 1944} {"train_loss": -12.48167610168457, "global_step": 326638, "epoch": 1944} {"train_loss": -12.168752670288086, "global_step": 326639, "epoch": 1944} {"train_loss": -12.373676300048828, "global_step": 326640, "epoch": 1944} {"train_loss": -12.39089584350586, "global_step": 326641, "epoch": 1944} {"train_loss": -12.201168060302734, "global_step": 326642, "epoch": 1944} {"train_loss": -12.296512603759766, "global_step": 326643, "epoch": 1944} {"train_loss": -11.971429824829102, "global_step": 326644, "epoch": 1944} {"train_loss": -12.219720840454102, "global_step": 326645, "epoch": 1944} {"train_loss": -12.233627319335938, "global_step": 326646, "epoch": 1944} {"train_loss": -11.949308395385742, "global_step": 326647, "epoch": 1944} {"train_loss": -12.285881042480469, "global_step": 326648, "epoch": 1944} {"train_loss": -12.373139381408691, "global_step": 326649, "epoch": 1944} {"train_loss": -12.497753143310547, "global_step": 326650, "epoch": 1944} {"train_loss": -12.162113189697266, "global_step": 326651, "epoch": 1944} {"train_loss": -12.364630699157715, "global_step": 326652, "epoch": 1944} {"train_loss": -12.529949188232422, "global_step": 326653, "epoch": 1944} {"train_loss": -12.463257789611816, "global_step": 326654, "epoch": 1944} {"train_loss": -12.554058074951172, "global_step": 326655, "epoch": 1944} {"train_loss": -12.416175842285156, "global_step": 326656, "epoch": 1944} {"train_loss": -12.354597091674805, "global_step": 326657, "epoch": 1944} {"train_loss": -12.290227890014648, "global_step": 326658, "epoch": 1944} {"train_loss": -12.425321578979492, "global_step": 326659, "epoch": 1944} {"train_loss": -12.381402015686035, "global_step": 326660, "epoch": 1944} {"train_loss": -12.499086380004883, "global_step": 326661, "epoch": 1944} {"train_loss": -12.523422241210938, "global_step": 326662, "epoch": 1944} {"train_loss": -12.52558422088623, "global_step": 326663, "epoch": 1944} {"train_loss": -12.660285949707031, "global_step": 326664, "epoch": 1944} {"train_loss": -12.55909538269043, "global_step": 326665, "epoch": 1944} {"train_loss": -12.405732154846191, "global_step": 326666, "epoch": 1944} {"train_loss": -12.51017951965332, "global_step": 326667, "epoch": 1944} {"train_loss": -12.523406982421875, "global_step": 326668, "epoch": 1944} {"train_loss": -12.684643745422363, "global_step": 326669, "epoch": 1944} {"train_loss": -12.532272338867188, "global_step": 326670, "epoch": 1944} {"train_loss": -12.483386993408203, "global_step": 326671, "epoch": 1944} {"train_loss": -12.702392578125, "global_step": 326672, "epoch": 1944} {"train_loss": -12.588784217834473, "global_step": 326673, "epoch": 1944} {"train_loss": -12.310941696166992, "global_step": 326674, "epoch": 1944} {"train_loss": -12.34237289428711, "global_step": 326675, "epoch": 1944} {"train_loss": -12.45687198638916, "global_step": 326676, "epoch": 1944} {"train_loss": -12.438674926757812, "global_step": 326677, "epoch": 1944} {"train_loss": -12.434367179870605, "global_step": 326678, "epoch": 1944} {"train_loss": -12.706353187561035, "global_step": 326679, "epoch": 1944} {"train_loss": -12.567020416259766, "global_step": 326680, "epoch": 1944} {"train_loss": -12.523670196533203, "global_step": 326681, "epoch": 1944} {"train_loss": -12.6674165725708, "global_step": 326682, "epoch": 1944} {"train_loss": -12.270109176635742, "global_step": 326683, "epoch": 1944} {"train_loss": -12.492058753967285, "global_step": 326684, "epoch": 1944} {"train_loss": -12.305070877075195, "global_step": 326685, "epoch": 1944} {"train_loss": -12.47918701171875, "global_step": 326686, "epoch": 1944} {"train_loss": -12.341315269470215, "global_step": 326687, "epoch": 1944} {"train_loss": -12.198295593261719, "global_step": 326688, "epoch": 1944} {"train_loss": -12.458858489990234, "global_step": 326689, "epoch": 1944} {"train_loss": -12.402713775634766, "global_step": 326690, "epoch": 1944} {"train_loss": -12.584573745727539, "global_step": 326691, "epoch": 1944} {"train_loss": -12.408676147460938, "global_step": 326692, "epoch": 1944} {"train_loss": -12.487616539001465, "global_step": 326693, "epoch": 1944} {"train_loss": -12.204261779785156, "global_step": 326694, "epoch": 1944} {"train_loss": -12.291871070861816, "global_step": 326695, "epoch": 1944} {"train_loss": -12.589698791503906, "global_step": 326696, "epoch": 1944} {"train_loss": -12.209297180175781, "global_step": 326697, "epoch": 1944} {"train_loss": -11.882416725158691, "global_step": 326698, "epoch": 1944} {"train_loss": -11.436912536621094, "global_step": 326699, "epoch": 1944} {"train_loss": -12.419143676757812, "global_step": 326700, "epoch": 1944} {"train_loss": -11.757816314697266, "global_step": 326701, "epoch": 1944} {"train_loss": -11.746192932128906, "global_step": 326702, "epoch": 1944} {"train_loss": -12.262126922607422, "global_step": 326703, "epoch": 1944} {"train_loss": -12.272859573364258, "global_step": 326704, "epoch": 1944} {"train_loss": -12.5027437210083, "global_step": 326705, "epoch": 1944} {"train_loss": -12.339911460876465, "global_step": 326706, "epoch": 1944} {"train_loss": -12.1273193359375, "global_step": 326707, "epoch": 1944} {"train_loss": -11.583242416381836, "global_step": 326708, "epoch": 1944} {"train_loss": -12.501688003540039, "global_step": 326709, "epoch": 1944} {"train_loss": -12.013620376586914, "global_step": 326710, "epoch": 1944} {"train_loss": -11.968826293945312, "global_step": 326711, "epoch": 1944} {"train_loss": -12.006902694702148, "global_step": 326712, "epoch": 1944} {"train_loss": -12.07808780670166, "global_step": 326713, "epoch": 1944} {"train_loss": -12.427206039428711, "global_step": 326714, "epoch": 1944} {"train_loss": -11.99172306060791, "global_step": 326715, "epoch": 1944} {"train_loss": -12.356107711791992, "global_step": 326716, "epoch": 1944} {"train_loss": -12.340803146362305, "global_step": 326717, "epoch": 1944} {"train_loss": -11.669221878051758, "global_step": 326718, "epoch": 1944} {"train_loss": -10.791549682617188, "global_step": 326719, "epoch": 1944} {"train_loss": -11.786730766296387, "global_step": 326720, "epoch": 1944} {"train_loss": -11.846537590026855, "global_step": 326721, "epoch": 1944} {"train_loss": -10.172712326049805, "global_step": 326722, "epoch": 1944} {"train_loss": -10.258735656738281, "global_step": 326723, "epoch": 1944} {"train_loss": -11.894998550415039, "global_step": 326724, "epoch": 1944} {"train_loss": -11.982805252075195, "global_step": 326725, "epoch": 1944} {"train_loss": -11.838294982910156, "global_step": 326726, "epoch": 1944} {"train_loss": -11.759982109069824, "global_step": 326727, "epoch": 1944} {"train_loss": -11.4284029006958, "global_step": 326728, "epoch": 1944} {"train_loss": -12.035253524780273, "global_step": 326729, "epoch": 1944} {"train_loss": -12.29330825805664, "global_step": 326730, "epoch": 1944} {"train_loss": -11.380491256713867, "global_step": 326731, "epoch": 1944} {"train_loss": -10.779593467712402, "global_step": 326732, "epoch": 1944} {"train_loss": -11.312878608703613, "global_step": 326733, "epoch": 1944} {"train_loss": -12.506599426269531, "global_step": 326734, "epoch": 1944} {"train_loss": -11.227153778076172, "global_step": 326735, "epoch": 1944} {"train_loss": -10.83858871459961, "global_step": 326736, "epoch": 1944} {"train_loss": -11.921202659606934, "global_step": 326737, "epoch": 1944} {"train_loss": -11.399206161499023, "global_step": 326738, "epoch": 1944} {"train_loss": -10.944314956665039, "global_step": 326739, "epoch": 1944} {"train_loss": -11.868955612182617, "global_step": 326740, "epoch": 1944} {"train_loss": -11.26073932647705, "global_step": 326741, "epoch": 1944} {"train_loss": -9.883102416992188, "global_step": 326742, "epoch": 1944} {"train_loss": -11.129684448242188, "global_step": 326743, "epoch": 1944} {"train_loss": -9.500085830688477, "global_step": 326744, "epoch": 1944} {"train_loss": -10.774557113647461, "global_step": 326745, "epoch": 1944} {"train_loss": -10.12180233001709, "global_step": 326746, "epoch": 1944} {"train_loss": -9.5404052734375, "global_step": 326747, "epoch": 1944} {"train_loss": -9.855852127075195, "global_step": 326748, "epoch": 1944} {"train_loss": -10.894023895263672, "global_step": 326749, "epoch": 1944} {"train_loss": -10.708070755004883, "global_step": 326750, "epoch": 1944} {"train_loss": -10.663368225097656, "global_step": 326751, "epoch": 1944} {"train_loss": -11.483850479125977, "global_step": 326752, "epoch": 1944} {"train_loss": -11.266406059265137, "global_step": 326753, "epoch": 1944} {"train_loss": -11.558311462402344, "global_step": 326754, "epoch": 1944} {"train_loss": -11.882259368896484, "global_step": 326755, "epoch": 1944} {"train_loss": -10.69553279876709, "global_step": 326756, "epoch": 1944} {"train_loss": -11.873391151428223, "global_step": 326757, "epoch": 1944} {"train_loss": -10.806970596313477, "global_step": 326758, "epoch": 1944} {"train_loss": -11.90647884777614, "global_step": 326759, "epoch": 1944, "val_loss": 281251.84375} {"train_loss": -10.80986499786377, "global_step": 326760, "epoch": 1945} {"train_loss": -11.229560852050781, "global_step": 326761, "epoch": 1945} {"train_loss": -11.487638473510742, "global_step": 326762, "epoch": 1945} {"train_loss": -11.315836906433105, "global_step": 326763, "epoch": 1945} {"train_loss": -11.162673950195312, "global_step": 326764, "epoch": 1945} {"train_loss": -11.937332153320312, "global_step": 326765, "epoch": 1945} {"train_loss": -11.149457931518555, "global_step": 326766, "epoch": 1945} {"train_loss": -11.839080810546875, "global_step": 326767, "epoch": 1945} {"train_loss": -11.823062896728516, "global_step": 326768, "epoch": 1945} {"train_loss": -12.01545524597168, "global_step": 326769, "epoch": 1945} {"train_loss": -11.18681526184082, "global_step": 326770, "epoch": 1945} {"train_loss": -11.825526237487793, "global_step": 326771, "epoch": 1945} {"train_loss": -11.55217170715332, "global_step": 326772, "epoch": 1945} {"train_loss": -11.683629989624023, "global_step": 326773, "epoch": 1945} {"train_loss": -11.52065658569336, "global_step": 326774, "epoch": 1945} {"train_loss": -11.070570945739746, "global_step": 326775, "epoch": 1945} {"train_loss": -11.597209930419922, "global_step": 326776, "epoch": 1945} {"train_loss": -11.690810203552246, "global_step": 326777, "epoch": 1945} {"train_loss": -11.330398559570312, "global_step": 326778, "epoch": 1945} {"train_loss": -11.733805656433105, "global_step": 326779, "epoch": 1945} {"train_loss": -11.90054702758789, "global_step": 326780, "epoch": 1945} {"train_loss": -11.31126594543457, "global_step": 326781, "epoch": 1945} {"train_loss": -11.88218879699707, "global_step": 326782, "epoch": 1945} {"train_loss": -11.600967407226562, "global_step": 326783, "epoch": 1945} {"train_loss": -11.784643173217773, "global_step": 326784, "epoch": 1945} {"train_loss": -11.807225227355957, "global_step": 326785, "epoch": 1945} {"train_loss": -11.674917221069336, "global_step": 326786, "epoch": 1945} {"train_loss": -12.063641548156738, "global_step": 326787, "epoch": 1945} {"train_loss": -11.908918380737305, "global_step": 326788, "epoch": 1945} {"train_loss": -11.9790620803833, "global_step": 326789, "epoch": 1945} {"train_loss": -12.089876174926758, "global_step": 326790, "epoch": 1945} {"train_loss": -11.853569030761719, "global_step": 326791, "epoch": 1945} {"train_loss": -12.262311935424805, "global_step": 326792, "epoch": 1945} {"train_loss": -12.057563781738281, "global_step": 326793, "epoch": 1945} {"train_loss": -11.917688369750977, "global_step": 326794, "epoch": 1945} {"train_loss": -12.002278327941895, "global_step": 326795, "epoch": 1945} {"train_loss": -11.926117897033691, "global_step": 326796, "epoch": 1945} {"train_loss": -12.254215240478516, "global_step": 326797, "epoch": 1945} {"train_loss": -11.757230758666992, "global_step": 326798, "epoch": 1945} {"train_loss": -12.196349143981934, "global_step": 326799, "epoch": 1945} {"train_loss": -12.366766929626465, "global_step": 326800, "epoch": 1945} {"train_loss": -12.299699783325195, "global_step": 326801, "epoch": 1945} {"train_loss": -11.975996971130371, "global_step": 326802, "epoch": 1945} {"train_loss": -12.415521621704102, "global_step": 326803, "epoch": 1945} {"train_loss": -12.128896713256836, "global_step": 326804, "epoch": 1945} {"train_loss": -12.267988204956055, "global_step": 326805, "epoch": 1945} {"train_loss": -12.164534568786621, "global_step": 326806, "epoch": 1945} {"train_loss": -12.34375, "global_step": 326807, "epoch": 1945} {"train_loss": -12.280319213867188, "global_step": 326808, "epoch": 1945} {"train_loss": -12.492469787597656, "global_step": 326809, "epoch": 1945} {"train_loss": -12.258584022521973, "global_step": 326810, "epoch": 1945} {"train_loss": -12.306756019592285, "global_step": 326811, "epoch": 1945} {"train_loss": -12.089920043945312, "global_step": 326812, "epoch": 1945} {"train_loss": -12.526249885559082, "global_step": 326813, "epoch": 1945} {"train_loss": -12.36540412902832, "global_step": 326814, "epoch": 1945} {"train_loss": -12.430608749389648, "global_step": 326815, "epoch": 1945} {"train_loss": -12.348395347595215, "global_step": 326816, "epoch": 1945} {"train_loss": -12.578272819519043, "global_step": 326817, "epoch": 1945} {"train_loss": -12.375679016113281, "global_step": 326818, "epoch": 1945} {"train_loss": -12.333708763122559, "global_step": 326819, "epoch": 1945} {"train_loss": -12.339934349060059, "global_step": 326820, "epoch": 1945} {"train_loss": -12.447576522827148, "global_step": 326821, "epoch": 1945} {"train_loss": -12.432575225830078, "global_step": 326822, "epoch": 1945} {"train_loss": -12.611594200134277, "global_step": 326823, "epoch": 1945} {"train_loss": -12.480430603027344, "global_step": 326824, "epoch": 1945} {"train_loss": -12.278108596801758, "global_step": 326825, "epoch": 1945} {"train_loss": -12.577272415161133, "global_step": 326826, "epoch": 1945} {"train_loss": -12.607133865356445, "global_step": 326827, "epoch": 1945} {"train_loss": -12.418184280395508, "global_step": 326828, "epoch": 1945} {"train_loss": -12.544315338134766, "global_step": 326829, "epoch": 1945} {"train_loss": -12.571258544921875, "global_step": 326830, "epoch": 1945} {"train_loss": -12.397289276123047, "global_step": 326831, "epoch": 1945} {"train_loss": -12.543952941894531, "global_step": 326832, "epoch": 1945} {"train_loss": -12.43642807006836, "global_step": 326833, "epoch": 1945} {"train_loss": -12.64649486541748, "global_step": 326834, "epoch": 1945} {"train_loss": -12.665700912475586, "global_step": 326835, "epoch": 1945} {"train_loss": -12.695735931396484, "global_step": 326836, "epoch": 1945} {"train_loss": -12.691489219665527, "global_step": 326837, "epoch": 1945} {"train_loss": -12.611857414245605, "global_step": 326838, "epoch": 1945} {"train_loss": -12.66480827331543, "global_step": 326839, "epoch": 1945} {"train_loss": -12.67349624633789, "global_step": 326840, "epoch": 1945} {"train_loss": -12.665241241455078, "global_step": 326841, "epoch": 1945} {"train_loss": -12.747386932373047, "global_step": 326842, "epoch": 1945} {"train_loss": -12.60628890991211, "global_step": 326843, "epoch": 1945} {"train_loss": -12.646862030029297, "global_step": 326844, "epoch": 1945} {"train_loss": -12.6817045211792, "global_step": 326845, "epoch": 1945} {"train_loss": -12.540535926818848, "global_step": 326846, "epoch": 1945} {"train_loss": -12.706188201904297, "global_step": 326847, "epoch": 1945} {"train_loss": -12.358530044555664, "global_step": 326848, "epoch": 1945} {"train_loss": -12.804380416870117, "global_step": 326849, "epoch": 1945} {"train_loss": -12.693416595458984, "global_step": 326850, "epoch": 1945} {"train_loss": -12.260587692260742, "global_step": 326851, "epoch": 1945} {"train_loss": -11.962600708007812, "global_step": 326852, "epoch": 1945} {"train_loss": -12.16754150390625, "global_step": 326853, "epoch": 1945} {"train_loss": -12.523313522338867, "global_step": 326854, "epoch": 1945} {"train_loss": -12.739473342895508, "global_step": 326855, "epoch": 1945} {"train_loss": -12.448413848876953, "global_step": 326856, "epoch": 1945} {"train_loss": -12.63522720336914, "global_step": 326857, "epoch": 1945} {"train_loss": -12.646981239318848, "global_step": 326858, "epoch": 1945} {"train_loss": -12.396805763244629, "global_step": 326859, "epoch": 1945} {"train_loss": -11.984302520751953, "global_step": 326860, "epoch": 1945} {"train_loss": -10.798768043518066, "global_step": 326861, "epoch": 1945} {"train_loss": -10.067405700683594, "global_step": 326862, "epoch": 1945} {"train_loss": -10.761445045471191, "global_step": 326863, "epoch": 1945} {"train_loss": -11.713340759277344, "global_step": 326864, "epoch": 1945} {"train_loss": -9.360416412353516, "global_step": 326865, "epoch": 1945} {"train_loss": -9.702840805053711, "global_step": 326866, "epoch": 1945} {"train_loss": -11.524887084960938, "global_step": 326867, "epoch": 1945} {"train_loss": -10.744126319885254, "global_step": 326868, "epoch": 1945} {"train_loss": -12.248313903808594, "global_step": 326869, "epoch": 1945} {"train_loss": -10.953125953674316, "global_step": 326870, "epoch": 1945} {"train_loss": -12.08281135559082, "global_step": 326871, "epoch": 1945} {"train_loss": -11.512812614440918, "global_step": 326872, "epoch": 1945} {"train_loss": -10.28730583190918, "global_step": 326873, "epoch": 1945} {"train_loss": -11.90316390991211, "global_step": 326874, "epoch": 1945} {"train_loss": -10.622943878173828, "global_step": 326875, "epoch": 1945} {"train_loss": -12.15770149230957, "global_step": 326876, "epoch": 1945} {"train_loss": -10.8939208984375, "global_step": 326877, "epoch": 1945} {"train_loss": -11.442272186279297, "global_step": 326878, "epoch": 1945} {"train_loss": -11.645187377929688, "global_step": 326879, "epoch": 1945} {"train_loss": -10.797216415405273, "global_step": 326880, "epoch": 1945} {"train_loss": -11.593234062194824, "global_step": 326881, "epoch": 1945} {"train_loss": -11.82188606262207, "global_step": 326882, "epoch": 1945} {"train_loss": -11.192136764526367, "global_step": 326883, "epoch": 1945} {"train_loss": -11.157684326171875, "global_step": 326884, "epoch": 1945} {"train_loss": -12.112603187561035, "global_step": 326885, "epoch": 1945} {"train_loss": -11.576911926269531, "global_step": 326886, "epoch": 1945} {"train_loss": -11.711957931518555, "global_step": 326887, "epoch": 1945} {"train_loss": -11.995674133300781, "global_step": 326888, "epoch": 1945} {"train_loss": -12.215465545654297, "global_step": 326889, "epoch": 1945} {"train_loss": -11.345874786376953, "global_step": 326890, "epoch": 1945} {"train_loss": -11.477071762084961, "global_step": 326891, "epoch": 1945} {"train_loss": -11.896738052368164, "global_step": 326892, "epoch": 1945} {"train_loss": -11.836262702941895, "global_step": 326893, "epoch": 1945} {"train_loss": -12.09615707397461, "global_step": 326894, "epoch": 1945} {"train_loss": -12.131141662597656, "global_step": 326895, "epoch": 1945} {"train_loss": -11.693387031555176, "global_step": 326896, "epoch": 1945} {"train_loss": -12.337055206298828, "global_step": 326897, "epoch": 1945} {"train_loss": -11.550211906433105, "global_step": 326898, "epoch": 1945} {"train_loss": -12.05526351928711, "global_step": 326899, "epoch": 1945} {"train_loss": -11.73947525024414, "global_step": 326900, "epoch": 1945} {"train_loss": -11.72018814086914, "global_step": 326901, "epoch": 1945} {"train_loss": -11.698756217956543, "global_step": 326902, "epoch": 1945} {"train_loss": -11.551158905029297, "global_step": 326903, "epoch": 1945} {"train_loss": -11.41301441192627, "global_step": 326904, "epoch": 1945} {"train_loss": -10.842902183532715, "global_step": 326905, "epoch": 1945} {"train_loss": -11.09174919128418, "global_step": 326906, "epoch": 1945} {"train_loss": -11.657739639282227, "global_step": 326907, "epoch": 1945} {"train_loss": -10.986191749572754, "global_step": 326908, "epoch": 1945} {"train_loss": -11.600278854370117, "global_step": 326909, "epoch": 1945} {"train_loss": -11.088943481445312, "global_step": 326910, "epoch": 1945} {"train_loss": -11.725715637207031, "global_step": 326911, "epoch": 1945} {"train_loss": -11.088689804077148, "global_step": 326912, "epoch": 1945} {"train_loss": -11.677059173583984, "global_step": 326913, "epoch": 1945} {"train_loss": -11.39372444152832, "global_step": 326914, "epoch": 1945} {"train_loss": -11.850409507751465, "global_step": 326915, "epoch": 1945} {"train_loss": -11.826865196228027, "global_step": 326916, "epoch": 1945} {"train_loss": -11.78856086730957, "global_step": 326917, "epoch": 1945} {"train_loss": -11.45645523071289, "global_step": 326918, "epoch": 1945} {"train_loss": -11.729263305664062, "global_step": 326919, "epoch": 1945} {"train_loss": -11.729372024536133, "global_step": 326920, "epoch": 1945} {"train_loss": -11.839756965637207, "global_step": 326921, "epoch": 1945} {"train_loss": -11.868647575378418, "global_step": 326922, "epoch": 1945} {"train_loss": -11.871503829956055, "global_step": 326923, "epoch": 1945} {"train_loss": -11.858989715576172, "global_step": 326924, "epoch": 1945} {"train_loss": -11.940544128417969, "global_step": 326925, "epoch": 1945} {"train_loss": -11.869491577148438, "global_step": 326926, "epoch": 1945} {"train_loss": -11.89171270529429, "global_step": 326927, "epoch": 1945, "val_loss": 284081.78125, "train_action_mse_error": 3.1305601596832275} {"train_loss": -11.993009567260742, "global_step": 326928, "epoch": 1946} {"train_loss": -11.939332962036133, "global_step": 326929, "epoch": 1946} {"train_loss": -11.751699447631836, "global_step": 326930, "epoch": 1946} {"train_loss": -11.493080139160156, "global_step": 326931, "epoch": 1946} {"train_loss": -11.494933128356934, "global_step": 326932, "epoch": 1946} {"train_loss": -11.398918151855469, "global_step": 326933, "epoch": 1946} {"train_loss": -11.329907417297363, "global_step": 326934, "epoch": 1946} {"train_loss": -11.309017181396484, "global_step": 326935, "epoch": 1946} {"train_loss": -10.267145156860352, "global_step": 326936, "epoch": 1946} {"train_loss": -11.07388687133789, "global_step": 326937, "epoch": 1946} {"train_loss": -10.806768417358398, "global_step": 326938, "epoch": 1946} {"train_loss": -11.313292503356934, "global_step": 326939, "epoch": 1946} {"train_loss": -11.485454559326172, "global_step": 326940, "epoch": 1946} {"train_loss": -11.526039123535156, "global_step": 326941, "epoch": 1946} {"train_loss": -10.937055587768555, "global_step": 326942, "epoch": 1946} {"train_loss": -10.916738510131836, "global_step": 326943, "epoch": 1946} {"train_loss": -11.792144775390625, "global_step": 326944, "epoch": 1946} {"train_loss": -11.442293167114258, "global_step": 326945, "epoch": 1946} {"train_loss": -11.92731761932373, "global_step": 326946, "epoch": 1946} {"train_loss": -11.769222259521484, "global_step": 326947, "epoch": 1946} {"train_loss": -12.18134880065918, "global_step": 326948, "epoch": 1946} {"train_loss": -11.933286666870117, "global_step": 326949, "epoch": 1946} {"train_loss": -11.670355796813965, "global_step": 326950, "epoch": 1946} {"train_loss": -12.068231582641602, "global_step": 326951, "epoch": 1946} {"train_loss": -11.822307586669922, "global_step": 326952, "epoch": 1946} {"train_loss": -11.806577682495117, "global_step": 326953, "epoch": 1946} {"train_loss": -12.07335090637207, "global_step": 326954, "epoch": 1946} {"train_loss": -11.93381118774414, "global_step": 326955, "epoch": 1946} {"train_loss": -11.908023834228516, "global_step": 326956, "epoch": 1946} {"train_loss": -12.209754943847656, "global_step": 326957, "epoch": 1946} {"train_loss": -11.770343780517578, "global_step": 326958, "epoch": 1946} {"train_loss": -12.30567455291748, "global_step": 326959, "epoch": 1946} {"train_loss": -11.817634582519531, "global_step": 326960, "epoch": 1946} {"train_loss": -11.692028999328613, "global_step": 326961, "epoch": 1946} {"train_loss": -11.90432357788086, "global_step": 326962, "epoch": 1946} {"train_loss": -11.880958557128906, "global_step": 326963, "epoch": 1946} {"train_loss": -12.061649322509766, "global_step": 326964, "epoch": 1946} {"train_loss": -11.974813461303711, "global_step": 326965, "epoch": 1946} {"train_loss": -12.085302352905273, "global_step": 326966, "epoch": 1946} {"train_loss": -11.952444076538086, "global_step": 326967, "epoch": 1946} {"train_loss": -12.09842300415039, "global_step": 326968, "epoch": 1946} {"train_loss": -12.060226440429688, "global_step": 326969, "epoch": 1946} {"train_loss": -12.304566383361816, "global_step": 326970, "epoch": 1946} {"train_loss": -12.01572036743164, "global_step": 326971, "epoch": 1946} {"train_loss": -12.338560104370117, "global_step": 326972, "epoch": 1946} {"train_loss": -12.057035446166992, "global_step": 326973, "epoch": 1946} {"train_loss": -12.159574508666992, "global_step": 326974, "epoch": 1946} {"train_loss": -12.18927001953125, "global_step": 326975, "epoch": 1946} {"train_loss": -11.641204833984375, "global_step": 326976, "epoch": 1946} {"train_loss": -12.09566593170166, "global_step": 326977, "epoch": 1946} {"train_loss": -12.046797752380371, "global_step": 326978, "epoch": 1946} {"train_loss": -12.130257606506348, "global_step": 326979, "epoch": 1946} {"train_loss": -11.7987060546875, "global_step": 326980, "epoch": 1946} {"train_loss": -12.182329177856445, "global_step": 326981, "epoch": 1946} {"train_loss": -11.588481903076172, "global_step": 326982, "epoch": 1946} {"train_loss": -12.179631233215332, "global_step": 326983, "epoch": 1946} {"train_loss": -11.938871383666992, "global_step": 326984, "epoch": 1946} {"train_loss": -11.993849754333496, "global_step": 326985, "epoch": 1946} {"train_loss": -11.955317497253418, "global_step": 326986, "epoch": 1946} {"train_loss": -10.878543853759766, "global_step": 326987, "epoch": 1946} {"train_loss": -12.047750473022461, "global_step": 326988, "epoch": 1946} {"train_loss": -11.001033782958984, "global_step": 326989, "epoch": 1946} {"train_loss": -11.931771278381348, "global_step": 326990, "epoch": 1946} {"train_loss": -11.415889739990234, "global_step": 326991, "epoch": 1946} {"train_loss": -11.160518646240234, "global_step": 326992, "epoch": 1946} {"train_loss": -12.09299087524414, "global_step": 326993, "epoch": 1946} {"train_loss": -11.453271865844727, "global_step": 326994, "epoch": 1946} {"train_loss": -12.022703170776367, "global_step": 326995, "epoch": 1946} {"train_loss": -11.838693618774414, "global_step": 326996, "epoch": 1946} {"train_loss": -11.872774124145508, "global_step": 326997, "epoch": 1946} {"train_loss": -12.28818130493164, "global_step": 326998, "epoch": 1946} {"train_loss": -11.624945640563965, "global_step": 326999, "epoch": 1946} {"train_loss": -11.956360816955566, "global_step": 327000, "epoch": 1946} {"train_loss": -11.921781539916992, "global_step": 327001, "epoch": 1946} {"train_loss": -12.269967079162598, "global_step": 327002, "epoch": 1946} {"train_loss": -12.120370864868164, "global_step": 327003, "epoch": 1946} {"train_loss": -12.379716873168945, "global_step": 327004, "epoch": 1946} {"train_loss": -12.324256896972656, "global_step": 327005, "epoch": 1946} {"train_loss": -12.162579536437988, "global_step": 327006, "epoch": 1946} {"train_loss": -12.27635669708252, "global_step": 327007, "epoch": 1946} {"train_loss": -12.41717529296875, "global_step": 327008, "epoch": 1946} {"train_loss": -12.244644165039062, "global_step": 327009, "epoch": 1946} {"train_loss": -12.470827102661133, "global_step": 327010, "epoch": 1946} {"train_loss": -12.337101936340332, "global_step": 327011, "epoch": 1946} {"train_loss": -12.128059387207031, "global_step": 327012, "epoch": 1946} {"train_loss": -12.510488510131836, "global_step": 327013, "epoch": 1946} {"train_loss": -12.276715278625488, "global_step": 327014, "epoch": 1946} {"train_loss": -12.37881851196289, "global_step": 327015, "epoch": 1946} {"train_loss": -12.304082870483398, "global_step": 327016, "epoch": 1946} {"train_loss": -12.412206649780273, "global_step": 327017, "epoch": 1946} {"train_loss": -12.501035690307617, "global_step": 327018, "epoch": 1946} {"train_loss": -12.39319133758545, "global_step": 327019, "epoch": 1946} {"train_loss": -12.332601547241211, "global_step": 327020, "epoch": 1946} {"train_loss": -12.356710433959961, "global_step": 327021, "epoch": 1946} {"train_loss": -12.484779357910156, "global_step": 327022, "epoch": 1946} {"train_loss": -12.463069915771484, "global_step": 327023, "epoch": 1946} {"train_loss": -12.501180648803711, "global_step": 327024, "epoch": 1946} {"train_loss": -12.681400299072266, "global_step": 327025, "epoch": 1946} {"train_loss": -12.316056251525879, "global_step": 327026, "epoch": 1946} {"train_loss": -12.531750679016113, "global_step": 327027, "epoch": 1946} {"train_loss": -12.520329475402832, "global_step": 327028, "epoch": 1946} {"train_loss": -12.511173248291016, "global_step": 327029, "epoch": 1946} {"train_loss": -12.540481567382812, "global_step": 327030, "epoch": 1946} {"train_loss": -12.446483612060547, "global_step": 327031, "epoch": 1946} {"train_loss": -12.314132690429688, "global_step": 327032, "epoch": 1946} {"train_loss": -12.543601036071777, "global_step": 327033, "epoch": 1946} {"train_loss": -12.28684139251709, "global_step": 327034, "epoch": 1946} {"train_loss": -12.36402702331543, "global_step": 327035, "epoch": 1946} {"train_loss": -12.081546783447266, "global_step": 327036, "epoch": 1946} {"train_loss": -11.76487922668457, "global_step": 327037, "epoch": 1946} {"train_loss": -12.096811294555664, "global_step": 327038, "epoch": 1946} {"train_loss": -12.345073699951172, "global_step": 327039, "epoch": 1946} {"train_loss": -11.543760299682617, "global_step": 327040, "epoch": 1946} {"train_loss": -11.89834976196289, "global_step": 327041, "epoch": 1946} {"train_loss": -11.920320510864258, "global_step": 327042, "epoch": 1946} {"train_loss": -12.23486328125, "global_step": 327043, "epoch": 1946} {"train_loss": -11.744128227233887, "global_step": 327044, "epoch": 1946} {"train_loss": -12.313826560974121, "global_step": 327045, "epoch": 1946} {"train_loss": -11.664113998413086, "global_step": 327046, "epoch": 1946} {"train_loss": -11.86964225769043, "global_step": 327047, "epoch": 1946} {"train_loss": -11.713783264160156, "global_step": 327048, "epoch": 1946} {"train_loss": -12.545553207397461, "global_step": 327049, "epoch": 1946} {"train_loss": -11.91030502319336, "global_step": 327050, "epoch": 1946} {"train_loss": -12.371191024780273, "global_step": 327051, "epoch": 1946} {"train_loss": -12.138046264648438, "global_step": 327052, "epoch": 1946} {"train_loss": -12.292346954345703, "global_step": 327053, "epoch": 1946} {"train_loss": -12.249032974243164, "global_step": 327054, "epoch": 1946} {"train_loss": -11.91279411315918, "global_step": 327055, "epoch": 1946} {"train_loss": -12.282905578613281, "global_step": 327056, "epoch": 1946} {"train_loss": -12.244029998779297, "global_step": 327057, "epoch": 1946} {"train_loss": -12.462682723999023, "global_step": 327058, "epoch": 1946} {"train_loss": -11.733162879943848, "global_step": 327059, "epoch": 1946} {"train_loss": -12.344545364379883, "global_step": 327060, "epoch": 1946} {"train_loss": -11.85588264465332, "global_step": 327061, "epoch": 1946} {"train_loss": -11.397560119628906, "global_step": 327062, "epoch": 1946} {"train_loss": -12.405458450317383, "global_step": 327063, "epoch": 1946} {"train_loss": -11.604860305786133, "global_step": 327064, "epoch": 1946} {"train_loss": -11.22310733795166, "global_step": 327065, "epoch": 1946} {"train_loss": -11.7418794631958, "global_step": 327066, "epoch": 1946} {"train_loss": -11.650481224060059, "global_step": 327067, "epoch": 1946} {"train_loss": -9.556604385375977, "global_step": 327068, "epoch": 1946} {"train_loss": -10.697158813476562, "global_step": 327069, "epoch": 1946} {"train_loss": -11.180278778076172, "global_step": 327070, "epoch": 1946} {"train_loss": -8.607210159301758, "global_step": 327071, "epoch": 1946} {"train_loss": -9.47258186340332, "global_step": 327072, "epoch": 1946} {"train_loss": -10.859428405761719, "global_step": 327073, "epoch": 1946} {"train_loss": -10.033679962158203, "global_step": 327074, "epoch": 1946} {"train_loss": -9.786351203918457, "global_step": 327075, "epoch": 1946} {"train_loss": -11.583518028259277, "global_step": 327076, "epoch": 1946} {"train_loss": -9.85368824005127, "global_step": 327077, "epoch": 1946} {"train_loss": -11.87339973449707, "global_step": 327078, "epoch": 1946} {"train_loss": -10.768531799316406, "global_step": 327079, "epoch": 1946} {"train_loss": -10.964695930480957, "global_step": 327080, "epoch": 1946} {"train_loss": -11.169412612915039, "global_step": 327081, "epoch": 1946} {"train_loss": -10.93387222290039, "global_step": 327082, "epoch": 1946} {"train_loss": -11.949972152709961, "global_step": 327083, "epoch": 1946} {"train_loss": -11.133077621459961, "global_step": 327084, "epoch": 1946} {"train_loss": -11.570385932922363, "global_step": 327085, "epoch": 1946} {"train_loss": -11.067349433898926, "global_step": 327086, "epoch": 1946} {"train_loss": -11.75057315826416, "global_step": 327087, "epoch": 1946} {"train_loss": -11.59304141998291, "global_step": 327088, "epoch": 1946} {"train_loss": -11.277341842651367, "global_step": 327089, "epoch": 1946} {"train_loss": -11.949996948242188, "global_step": 327090, "epoch": 1946} {"train_loss": -11.576725006103516, "global_step": 327091, "epoch": 1946} {"train_loss": -12.022175788879395, "global_step": 327092, "epoch": 1946} {"train_loss": -11.828694343566895, "global_step": 327093, "epoch": 1946} {"train_loss": -11.906169891357422, "global_step": 327094, "epoch": 1946} {"train_loss": -11.81537511802855, "global_step": 327095, "epoch": 1946, "val_loss": 280793.15625} {"train_loss": -12.09053897857666, "global_step": 327096, "epoch": 1947} {"train_loss": -12.123403549194336, "global_step": 327097, "epoch": 1947} {"train_loss": -12.202473640441895, "global_step": 327098, "epoch": 1947} {"train_loss": -11.971626281738281, "global_step": 327099, "epoch": 1947} {"train_loss": -12.070295333862305, "global_step": 327100, "epoch": 1947} {"train_loss": -11.918706893920898, "global_step": 327101, "epoch": 1947} {"train_loss": -11.910515785217285, "global_step": 327102, "epoch": 1947} {"train_loss": -12.03169059753418, "global_step": 327103, "epoch": 1947} {"train_loss": -11.615516662597656, "global_step": 327104, "epoch": 1947} {"train_loss": -12.095954895019531, "global_step": 327105, "epoch": 1947} {"train_loss": -11.603836059570312, "global_step": 327106, "epoch": 1947} {"train_loss": -11.75874137878418, "global_step": 327107, "epoch": 1947} {"train_loss": -12.383033752441406, "global_step": 327108, "epoch": 1947} {"train_loss": -12.06272029876709, "global_step": 327109, "epoch": 1947} {"train_loss": -12.106938362121582, "global_step": 327110, "epoch": 1947} {"train_loss": -11.820425033569336, "global_step": 327111, "epoch": 1947} {"train_loss": -12.18475341796875, "global_step": 327112, "epoch": 1947} {"train_loss": -11.964133262634277, "global_step": 327113, "epoch": 1947} {"train_loss": -12.2307710647583, "global_step": 327114, "epoch": 1947} {"train_loss": -12.083908081054688, "global_step": 327115, "epoch": 1947} {"train_loss": -11.889490127563477, "global_step": 327116, "epoch": 1947} {"train_loss": -12.34536361694336, "global_step": 327117, "epoch": 1947} {"train_loss": -11.78006362915039, "global_step": 327118, "epoch": 1947} {"train_loss": -11.826986312866211, "global_step": 327119, "epoch": 1947} {"train_loss": -12.059341430664062, "global_step": 327120, "epoch": 1947} {"train_loss": -12.149740219116211, "global_step": 327121, "epoch": 1947} {"train_loss": -12.09776782989502, "global_step": 327122, "epoch": 1947} {"train_loss": -12.292173385620117, "global_step": 327123, "epoch": 1947} {"train_loss": -12.238465309143066, "global_step": 327124, "epoch": 1947} {"train_loss": -12.175989151000977, "global_step": 327125, "epoch": 1947} {"train_loss": -12.327997207641602, "global_step": 327126, "epoch": 1947} {"train_loss": -12.28680419921875, "global_step": 327127, "epoch": 1947} {"train_loss": -12.382118225097656, "global_step": 327128, "epoch": 1947} {"train_loss": -12.237709045410156, "global_step": 327129, "epoch": 1947} {"train_loss": -12.291043281555176, "global_step": 327130, "epoch": 1947} {"train_loss": -12.513848304748535, "global_step": 327131, "epoch": 1947} {"train_loss": -12.245941162109375, "global_step": 327132, "epoch": 1947} {"train_loss": -12.534923553466797, "global_step": 327133, "epoch": 1947} {"train_loss": -11.46031379699707, "global_step": 327134, "epoch": 1947} {"train_loss": -12.489860534667969, "global_step": 327135, "epoch": 1947} {"train_loss": -12.393841743469238, "global_step": 327136, "epoch": 1947} {"train_loss": -12.722834587097168, "global_step": 327137, "epoch": 1947} {"train_loss": -12.435140609741211, "global_step": 327138, "epoch": 1947} {"train_loss": -12.198562622070312, "global_step": 327139, "epoch": 1947} {"train_loss": -12.403199195861816, "global_step": 327140, "epoch": 1947} {"train_loss": -12.381553649902344, "global_step": 327141, "epoch": 1947} {"train_loss": -12.193117141723633, "global_step": 327142, "epoch": 1947} {"train_loss": -12.278024673461914, "global_step": 327143, "epoch": 1947} {"train_loss": -12.515429496765137, "global_step": 327144, "epoch": 1947} {"train_loss": -12.439550399780273, "global_step": 327145, "epoch": 1947} {"train_loss": -12.489116668701172, "global_step": 327146, "epoch": 1947} {"train_loss": -12.25722885131836, "global_step": 327147, "epoch": 1947} {"train_loss": -12.422037124633789, "global_step": 327148, "epoch": 1947} {"train_loss": -12.443896293640137, "global_step": 327149, "epoch": 1947} {"train_loss": -12.474124908447266, "global_step": 327150, "epoch": 1947} {"train_loss": -11.89185619354248, "global_step": 327151, "epoch": 1947} {"train_loss": -12.409952163696289, "global_step": 327152, "epoch": 1947} {"train_loss": -12.568626403808594, "global_step": 327153, "epoch": 1947} {"train_loss": -12.183509826660156, "global_step": 327154, "epoch": 1947} {"train_loss": -12.317852973937988, "global_step": 327155, "epoch": 1947} {"train_loss": -12.290660858154297, "global_step": 327156, "epoch": 1947} {"train_loss": -12.395818710327148, "global_step": 327157, "epoch": 1947} {"train_loss": -12.134462356567383, "global_step": 327158, "epoch": 1947} {"train_loss": -12.362051010131836, "global_step": 327159, "epoch": 1947} {"train_loss": -11.81113052368164, "global_step": 327160, "epoch": 1947} {"train_loss": -11.748388290405273, "global_step": 327161, "epoch": 1947} {"train_loss": -12.102705955505371, "global_step": 327162, "epoch": 1947} {"train_loss": -11.250309944152832, "global_step": 327163, "epoch": 1947} {"train_loss": -11.472790718078613, "global_step": 327164, "epoch": 1947} {"train_loss": -11.51136302947998, "global_step": 327165, "epoch": 1947} {"train_loss": -11.133872985839844, "global_step": 327166, "epoch": 1947} {"train_loss": -10.793954849243164, "global_step": 327167, "epoch": 1947} {"train_loss": -10.928915023803711, "global_step": 327168, "epoch": 1947} {"train_loss": -11.793885231018066, "global_step": 327169, "epoch": 1947} {"train_loss": -12.08050537109375, "global_step": 327170, "epoch": 1947} {"train_loss": -11.190807342529297, "global_step": 327171, "epoch": 1947} {"train_loss": -12.266586303710938, "global_step": 327172, "epoch": 1947} {"train_loss": -11.949361801147461, "global_step": 327173, "epoch": 1947} {"train_loss": -12.502397537231445, "global_step": 327174, "epoch": 1947} {"train_loss": -12.275649070739746, "global_step": 327175, "epoch": 1947} {"train_loss": -12.167553901672363, "global_step": 327176, "epoch": 1947} {"train_loss": -12.064661979675293, "global_step": 327177, "epoch": 1947} {"train_loss": -12.194401741027832, "global_step": 327178, "epoch": 1947} {"train_loss": -12.094325065612793, "global_step": 327179, "epoch": 1947} {"train_loss": -11.896080017089844, "global_step": 327180, "epoch": 1947} {"train_loss": -12.199442863464355, "global_step": 327181, "epoch": 1947} {"train_loss": -12.354642868041992, "global_step": 327182, "epoch": 1947} {"train_loss": -12.021686553955078, "global_step": 327183, "epoch": 1947} {"train_loss": -11.969717025756836, "global_step": 327184, "epoch": 1947} {"train_loss": -12.287765502929688, "global_step": 327185, "epoch": 1947} {"train_loss": -12.19721794128418, "global_step": 327186, "epoch": 1947} {"train_loss": -12.172562599182129, "global_step": 327187, "epoch": 1947} {"train_loss": -12.30145263671875, "global_step": 327188, "epoch": 1947} {"train_loss": -12.302604675292969, "global_step": 327189, "epoch": 1947} {"train_loss": -12.356916427612305, "global_step": 327190, "epoch": 1947} {"train_loss": -11.796873092651367, "global_step": 327191, "epoch": 1947} {"train_loss": -12.102883338928223, "global_step": 327192, "epoch": 1947} {"train_loss": -12.387895584106445, "global_step": 327193, "epoch": 1947} {"train_loss": -12.273920059204102, "global_step": 327194, "epoch": 1947} {"train_loss": -12.373481750488281, "global_step": 327195, "epoch": 1947} {"train_loss": -12.173097610473633, "global_step": 327196, "epoch": 1947} {"train_loss": -12.304277420043945, "global_step": 327197, "epoch": 1947} {"train_loss": -12.135608673095703, "global_step": 327198, "epoch": 1947} {"train_loss": -11.872478485107422, "global_step": 327199, "epoch": 1947} {"train_loss": -11.942863464355469, "global_step": 327200, "epoch": 1947} {"train_loss": -12.382644653320312, "global_step": 327201, "epoch": 1947} {"train_loss": -12.225706100463867, "global_step": 327202, "epoch": 1947} {"train_loss": -12.318671226501465, "global_step": 327203, "epoch": 1947} {"train_loss": -12.168328285217285, "global_step": 327204, "epoch": 1947} {"train_loss": -12.218338012695312, "global_step": 327205, "epoch": 1947} {"train_loss": -12.142677307128906, "global_step": 327206, "epoch": 1947} {"train_loss": -12.246819496154785, "global_step": 327207, "epoch": 1947} {"train_loss": -12.071882247924805, "global_step": 327208, "epoch": 1947} {"train_loss": -11.813210487365723, "global_step": 327209, "epoch": 1947} {"train_loss": -12.058079719543457, "global_step": 327210, "epoch": 1947} {"train_loss": -12.223803520202637, "global_step": 327211, "epoch": 1947} {"train_loss": -11.407238006591797, "global_step": 327212, "epoch": 1947} {"train_loss": -12.033437728881836, "global_step": 327213, "epoch": 1947} {"train_loss": -12.379007339477539, "global_step": 327214, "epoch": 1947} {"train_loss": -11.558608055114746, "global_step": 327215, "epoch": 1947} {"train_loss": -12.088263511657715, "global_step": 327216, "epoch": 1947} {"train_loss": -12.410723686218262, "global_step": 327217, "epoch": 1947} {"train_loss": -12.206425666809082, "global_step": 327218, "epoch": 1947} {"train_loss": -12.445269584655762, "global_step": 327219, "epoch": 1947} {"train_loss": -12.210626602172852, "global_step": 327220, "epoch": 1947} {"train_loss": -12.128868103027344, "global_step": 327221, "epoch": 1947} {"train_loss": -12.19688606262207, "global_step": 327222, "epoch": 1947} {"train_loss": -12.216983795166016, "global_step": 327223, "epoch": 1947} {"train_loss": -12.302923202514648, "global_step": 327224, "epoch": 1947} {"train_loss": -12.362330436706543, "global_step": 327225, "epoch": 1947} {"train_loss": -12.08434009552002, "global_step": 327226, "epoch": 1947} {"train_loss": -12.451318740844727, "global_step": 327227, "epoch": 1947} {"train_loss": -12.210092544555664, "global_step": 327228, "epoch": 1947} {"train_loss": -12.341270446777344, "global_step": 327229, "epoch": 1947} {"train_loss": -12.034092903137207, "global_step": 327230, "epoch": 1947} {"train_loss": -12.091121673583984, "global_step": 327231, "epoch": 1947} {"train_loss": -11.714603424072266, "global_step": 327232, "epoch": 1947} {"train_loss": -11.42768669128418, "global_step": 327233, "epoch": 1947} {"train_loss": -11.264473915100098, "global_step": 327234, "epoch": 1947} {"train_loss": -11.830986022949219, "global_step": 327235, "epoch": 1947} {"train_loss": -11.857037544250488, "global_step": 327236, "epoch": 1947} {"train_loss": -12.227156639099121, "global_step": 327237, "epoch": 1947} {"train_loss": -12.410395622253418, "global_step": 327238, "epoch": 1947} {"train_loss": -11.446650505065918, "global_step": 327239, "epoch": 1947} {"train_loss": -11.972522735595703, "global_step": 327240, "epoch": 1947} {"train_loss": -12.033527374267578, "global_step": 327241, "epoch": 1947} {"train_loss": -11.506324768066406, "global_step": 327242, "epoch": 1947} {"train_loss": -11.68789005279541, "global_step": 327243, "epoch": 1947} {"train_loss": -11.156811714172363, "global_step": 327244, "epoch": 1947} {"train_loss": -10.386279106140137, "global_step": 327245, "epoch": 1947} {"train_loss": -11.75576400756836, "global_step": 327246, "epoch": 1947} {"train_loss": -11.357887268066406, "global_step": 327247, "epoch": 1947} {"train_loss": -10.924140930175781, "global_step": 327248, "epoch": 1947} {"train_loss": -11.641977310180664, "global_step": 327249, "epoch": 1947} {"train_loss": -10.780181884765625, "global_step": 327250, "epoch": 1947} {"train_loss": -11.784637451171875, "global_step": 327251, "epoch": 1947} {"train_loss": -11.470148086547852, "global_step": 327252, "epoch": 1947} {"train_loss": -12.199320793151855, "global_step": 327253, "epoch": 1947} {"train_loss": -11.626523971557617, "global_step": 327254, "epoch": 1947} {"train_loss": -12.019859313964844, "global_step": 327255, "epoch": 1947} {"train_loss": -11.836840629577637, "global_step": 327256, "epoch": 1947} {"train_loss": -11.756203651428223, "global_step": 327257, "epoch": 1947} {"train_loss": -12.009547233581543, "global_step": 327258, "epoch": 1947} {"train_loss": -11.493392944335938, "global_step": 327259, "epoch": 1947} {"train_loss": -11.558324813842773, "global_step": 327260, "epoch": 1947} {"train_loss": -12.05231761932373, "global_step": 327261, "epoch": 1947} {"train_loss": -11.932819366455078, "global_step": 327262, "epoch": 1947} {"train_loss": -12.029901947293963, "global_step": 327263, "epoch": 1947, "val_loss": 284054.78125} {"train_loss": -12.077530860900879, "global_step": 327264, "epoch": 1948} {"train_loss": -10.972346305847168, "global_step": 327265, "epoch": 1948} {"train_loss": -11.38404369354248, "global_step": 327266, "epoch": 1948} {"train_loss": -11.387434005737305, "global_step": 327267, "epoch": 1948} {"train_loss": -10.875219345092773, "global_step": 327268, "epoch": 1948} {"train_loss": -11.267448425292969, "global_step": 327269, "epoch": 1948} {"train_loss": -11.181631088256836, "global_step": 327270, "epoch": 1948} {"train_loss": -11.873594284057617, "global_step": 327271, "epoch": 1948} {"train_loss": -11.513782501220703, "global_step": 327272, "epoch": 1948} {"train_loss": -11.781757354736328, "global_step": 327273, "epoch": 1948} {"train_loss": -11.910026550292969, "global_step": 327274, "epoch": 1948} {"train_loss": -10.977437973022461, "global_step": 327275, "epoch": 1948} {"train_loss": -11.396478652954102, "global_step": 327276, "epoch": 1948} {"train_loss": -11.691904067993164, "global_step": 327277, "epoch": 1948} {"train_loss": -10.400392532348633, "global_step": 327278, "epoch": 1948} {"train_loss": -12.167304039001465, "global_step": 327279, "epoch": 1948} {"train_loss": -10.894293785095215, "global_step": 327280, "epoch": 1948} {"train_loss": -10.849327087402344, "global_step": 327281, "epoch": 1948} {"train_loss": -12.128229141235352, "global_step": 327282, "epoch": 1948} {"train_loss": -10.913211822509766, "global_step": 327283, "epoch": 1948} {"train_loss": -11.980040550231934, "global_step": 327284, "epoch": 1948} {"train_loss": -11.310483932495117, "global_step": 327285, "epoch": 1948} {"train_loss": -12.020559310913086, "global_step": 327286, "epoch": 1948} {"train_loss": -11.910300254821777, "global_step": 327287, "epoch": 1948} {"train_loss": -11.865680694580078, "global_step": 327288, "epoch": 1948} {"train_loss": -11.693378448486328, "global_step": 327289, "epoch": 1948} {"train_loss": -12.042158126831055, "global_step": 327290, "epoch": 1948} {"train_loss": -12.269959449768066, "global_step": 327291, "epoch": 1948} {"train_loss": -12.24571418762207, "global_step": 327292, "epoch": 1948} {"train_loss": -12.188422203063965, "global_step": 327293, "epoch": 1948} {"train_loss": -12.061332702636719, "global_step": 327294, "epoch": 1948} {"train_loss": -12.18807315826416, "global_step": 327295, "epoch": 1948} {"train_loss": -12.23735237121582, "global_step": 327296, "epoch": 1948} {"train_loss": -12.050585746765137, "global_step": 327297, "epoch": 1948} {"train_loss": -12.145881652832031, "global_step": 327298, "epoch": 1948} {"train_loss": -12.054141998291016, "global_step": 327299, "epoch": 1948} {"train_loss": -12.014781951904297, "global_step": 327300, "epoch": 1948} {"train_loss": -12.47359848022461, "global_step": 327301, "epoch": 1948} {"train_loss": -12.09417724609375, "global_step": 327302, "epoch": 1948} {"train_loss": -12.246513366699219, "global_step": 327303, "epoch": 1948} {"train_loss": -12.111766815185547, "global_step": 327304, "epoch": 1948} {"train_loss": -12.100852012634277, "global_step": 327305, "epoch": 1948} {"train_loss": -12.185190200805664, "global_step": 327306, "epoch": 1948} {"train_loss": -12.20755386352539, "global_step": 327307, "epoch": 1948} {"train_loss": -12.340566635131836, "global_step": 327308, "epoch": 1948} {"train_loss": -12.103035926818848, "global_step": 327309, "epoch": 1948} {"train_loss": -12.128021240234375, "global_step": 327310, "epoch": 1948} {"train_loss": -12.469490051269531, "global_step": 327311, "epoch": 1948} {"train_loss": -12.477632522583008, "global_step": 327312, "epoch": 1948} {"train_loss": -12.229775428771973, "global_step": 327313, "epoch": 1948} {"train_loss": -12.486446380615234, "global_step": 327314, "epoch": 1948} {"train_loss": -12.310266494750977, "global_step": 327315, "epoch": 1948} {"train_loss": -12.345846176147461, "global_step": 327316, "epoch": 1948} {"train_loss": -12.316919326782227, "global_step": 327317, "epoch": 1948} {"train_loss": -12.341724395751953, "global_step": 327318, "epoch": 1948} {"train_loss": -12.162391662597656, "global_step": 327319, "epoch": 1948} {"train_loss": -12.468679428100586, "global_step": 327320, "epoch": 1948} {"train_loss": -12.010124206542969, "global_step": 327321, "epoch": 1948} {"train_loss": -12.334357261657715, "global_step": 327322, "epoch": 1948} {"train_loss": -12.354963302612305, "global_step": 327323, "epoch": 1948} {"train_loss": -12.19575309753418, "global_step": 327324, "epoch": 1948} {"train_loss": -12.452702522277832, "global_step": 327325, "epoch": 1948} {"train_loss": -12.051286697387695, "global_step": 327326, "epoch": 1948} {"train_loss": -12.069927215576172, "global_step": 327327, "epoch": 1948} {"train_loss": -12.337471008300781, "global_step": 327328, "epoch": 1948} {"train_loss": -12.048935890197754, "global_step": 327329, "epoch": 1948} {"train_loss": -11.938544273376465, "global_step": 327330, "epoch": 1948} {"train_loss": -12.327899932861328, "global_step": 327331, "epoch": 1948} {"train_loss": -12.036998748779297, "global_step": 327332, "epoch": 1948} {"train_loss": -12.424259185791016, "global_step": 327333, "epoch": 1948} {"train_loss": -12.273466110229492, "global_step": 327334, "epoch": 1948} {"train_loss": -11.629919052124023, "global_step": 327335, "epoch": 1948} {"train_loss": -12.323270797729492, "global_step": 327336, "epoch": 1948} {"train_loss": -12.101469039916992, "global_step": 327337, "epoch": 1948} {"train_loss": -11.155782699584961, "global_step": 327338, "epoch": 1948} {"train_loss": -11.505376815795898, "global_step": 327339, "epoch": 1948} {"train_loss": -11.779784202575684, "global_step": 327340, "epoch": 1948} {"train_loss": -11.903261184692383, "global_step": 327341, "epoch": 1948} {"train_loss": -11.488027572631836, "global_step": 327342, "epoch": 1948} {"train_loss": -11.09323501586914, "global_step": 327343, "epoch": 1948} {"train_loss": -12.151330947875977, "global_step": 327344, "epoch": 1948} {"train_loss": -11.607870101928711, "global_step": 327345, "epoch": 1948} {"train_loss": -11.479230880737305, "global_step": 327346, "epoch": 1948} {"train_loss": -11.779306411743164, "global_step": 327347, "epoch": 1948} {"train_loss": -11.137136459350586, "global_step": 327348, "epoch": 1948} {"train_loss": -9.53834342956543, "global_step": 327349, "epoch": 1948} {"train_loss": -11.589767456054688, "global_step": 327350, "epoch": 1948} {"train_loss": -9.869014739990234, "global_step": 327351, "epoch": 1948} {"train_loss": -8.587125778198242, "global_step": 327352, "epoch": 1948} {"train_loss": -8.762737274169922, "global_step": 327353, "epoch": 1948} {"train_loss": -6.9692535400390625, "global_step": 327354, "epoch": 1948} {"train_loss": -7.730578422546387, "global_step": 327355, "epoch": 1948} {"train_loss": -9.475189208984375, "global_step": 327356, "epoch": 1948} {"train_loss": -9.899947166442871, "global_step": 327357, "epoch": 1948} {"train_loss": -6.9672651290893555, "global_step": 327358, "epoch": 1948} {"train_loss": -8.389043807983398, "global_step": 327359, "epoch": 1948} {"train_loss": -8.046762466430664, "global_step": 327360, "epoch": 1948} {"train_loss": -8.924192428588867, "global_step": 327361, "epoch": 1948} {"train_loss": -9.276473999023438, "global_step": 327362, "epoch": 1948} {"train_loss": -8.749139785766602, "global_step": 327363, "epoch": 1948} {"train_loss": -10.29249095916748, "global_step": 327364, "epoch": 1948} {"train_loss": -9.418967247009277, "global_step": 327365, "epoch": 1948} {"train_loss": -10.281621932983398, "global_step": 327366, "epoch": 1948} {"train_loss": -9.582801818847656, "global_step": 327367, "epoch": 1948} {"train_loss": -11.281518936157227, "global_step": 327368, "epoch": 1948} {"train_loss": -8.323469161987305, "global_step": 327369, "epoch": 1948} {"train_loss": -9.650970458984375, "global_step": 327370, "epoch": 1948} {"train_loss": -10.366121292114258, "global_step": 327371, "epoch": 1948} {"train_loss": -9.129475593566895, "global_step": 327372, "epoch": 1948} {"train_loss": -10.796491622924805, "global_step": 327373, "epoch": 1948} {"train_loss": -10.015045166015625, "global_step": 327374, "epoch": 1948} {"train_loss": -11.083434104919434, "global_step": 327375, "epoch": 1948} {"train_loss": -10.686315536499023, "global_step": 327376, "epoch": 1948} {"train_loss": -10.33901596069336, "global_step": 327377, "epoch": 1948} {"train_loss": -11.236421585083008, "global_step": 327378, "epoch": 1948} {"train_loss": -10.746123313903809, "global_step": 327379, "epoch": 1948} {"train_loss": -11.034433364868164, "global_step": 327380, "epoch": 1948} {"train_loss": -11.526116371154785, "global_step": 327381, "epoch": 1948} {"train_loss": -10.863516807556152, "global_step": 327382, "epoch": 1948} {"train_loss": -11.453865051269531, "global_step": 327383, "epoch": 1948} {"train_loss": -11.180047035217285, "global_step": 327384, "epoch": 1948} {"train_loss": -11.463082313537598, "global_step": 327385, "epoch": 1948} {"train_loss": -11.090744018554688, "global_step": 327386, "epoch": 1948} {"train_loss": -11.561751365661621, "global_step": 327387, "epoch": 1948} {"train_loss": -11.074170112609863, "global_step": 327388, "epoch": 1948} {"train_loss": -11.324105262756348, "global_step": 327389, "epoch": 1948} {"train_loss": -11.737926483154297, "global_step": 327390, "epoch": 1948} {"train_loss": -11.315505981445312, "global_step": 327391, "epoch": 1948} {"train_loss": -11.551949501037598, "global_step": 327392, "epoch": 1948} {"train_loss": -11.57198429107666, "global_step": 327393, "epoch": 1948} {"train_loss": -11.420124053955078, "global_step": 327394, "epoch": 1948} {"train_loss": -11.314906120300293, "global_step": 327395, "epoch": 1948} {"train_loss": -11.775177001953125, "global_step": 327396, "epoch": 1948} {"train_loss": -11.82123851776123, "global_step": 327397, "epoch": 1948} {"train_loss": -11.236289024353027, "global_step": 327398, "epoch": 1948} {"train_loss": -12.04952335357666, "global_step": 327399, "epoch": 1948} {"train_loss": -11.227274894714355, "global_step": 327400, "epoch": 1948} {"train_loss": -11.769478797912598, "global_step": 327401, "epoch": 1948} {"train_loss": -11.657476425170898, "global_step": 327402, "epoch": 1948} {"train_loss": -11.650172233581543, "global_step": 327403, "epoch": 1948} {"train_loss": -11.496986389160156, "global_step": 327404, "epoch": 1948} {"train_loss": -11.65693473815918, "global_step": 327405, "epoch": 1948} {"train_loss": -11.625421524047852, "global_step": 327406, "epoch": 1948} {"train_loss": -11.705257415771484, "global_step": 327407, "epoch": 1948} {"train_loss": -11.940898895263672, "global_step": 327408, "epoch": 1948} {"train_loss": -11.600602149963379, "global_step": 327409, "epoch": 1948} {"train_loss": -11.829198837280273, "global_step": 327410, "epoch": 1948} {"train_loss": -11.889866828918457, "global_step": 327411, "epoch": 1948} {"train_loss": -11.744483947753906, "global_step": 327412, "epoch": 1948} {"train_loss": -12.070368766784668, "global_step": 327413, "epoch": 1948} {"train_loss": -11.803093910217285, "global_step": 327414, "epoch": 1948} {"train_loss": -12.061254501342773, "global_step": 327415, "epoch": 1948} {"train_loss": -11.829675674438477, "global_step": 327416, "epoch": 1948} {"train_loss": -12.154014587402344, "global_step": 327417, "epoch": 1948} {"train_loss": -12.026510238647461, "global_step": 327418, "epoch": 1948} {"train_loss": -12.045402526855469, "global_step": 327419, "epoch": 1948} {"train_loss": -12.078519821166992, "global_step": 327420, "epoch": 1948} {"train_loss": -12.06893539428711, "global_step": 327421, "epoch": 1948} {"train_loss": -12.167298316955566, "global_step": 327422, "epoch": 1948} {"train_loss": -12.194070816040039, "global_step": 327423, "epoch": 1948} {"train_loss": -12.09735107421875, "global_step": 327424, "epoch": 1948} {"train_loss": -12.299111366271973, "global_step": 327425, "epoch": 1948} {"train_loss": -11.954344749450684, "global_step": 327426, "epoch": 1948} {"train_loss": -12.119441986083984, "global_step": 327427, "epoch": 1948} {"train_loss": -12.38429069519043, "global_step": 327428, "epoch": 1948} {"train_loss": -12.190656661987305, "global_step": 327429, "epoch": 1948} {"train_loss": -12.23577880859375, "global_step": 327430, "epoch": 1948} {"train_loss": -11.41333784375872, "global_step": 327431, "epoch": 1948, "val_loss": 286955.75} {"train_loss": -12.175479888916016, "global_step": 327432, "epoch": 1949} {"train_loss": -12.269878387451172, "global_step": 327433, "epoch": 1949} {"train_loss": -12.150541305541992, "global_step": 327434, "epoch": 1949} {"train_loss": -12.247560501098633, "global_step": 327435, "epoch": 1949} {"train_loss": -11.865297317504883, "global_step": 327436, "epoch": 1949} {"train_loss": -12.420494079589844, "global_step": 327437, "epoch": 1949} {"train_loss": -12.018113136291504, "global_step": 327438, "epoch": 1949} {"train_loss": -12.26176929473877, "global_step": 327439, "epoch": 1949} {"train_loss": -12.257881164550781, "global_step": 327440, "epoch": 1949} {"train_loss": -12.326333045959473, "global_step": 327441, "epoch": 1949} {"train_loss": -12.329041481018066, "global_step": 327442, "epoch": 1949} {"train_loss": -12.24410629272461, "global_step": 327443, "epoch": 1949} {"train_loss": -12.398615837097168, "global_step": 327444, "epoch": 1949} {"train_loss": -12.246970176696777, "global_step": 327445, "epoch": 1949} {"train_loss": -12.155123710632324, "global_step": 327446, "epoch": 1949} {"train_loss": -12.235628128051758, "global_step": 327447, "epoch": 1949} {"train_loss": -12.34348201751709, "global_step": 327448, "epoch": 1949} {"train_loss": -12.363574981689453, "global_step": 327449, "epoch": 1949} {"train_loss": -12.467855453491211, "global_step": 327450, "epoch": 1949} {"train_loss": -12.329927444458008, "global_step": 327451, "epoch": 1949} {"train_loss": -12.414497375488281, "global_step": 327452, "epoch": 1949} {"train_loss": -12.363319396972656, "global_step": 327453, "epoch": 1949} {"train_loss": -12.350748062133789, "global_step": 327454, "epoch": 1949} {"train_loss": -12.346476554870605, "global_step": 327455, "epoch": 1949} {"train_loss": -12.498981475830078, "global_step": 327456, "epoch": 1949} {"train_loss": -12.40684700012207, "global_step": 327457, "epoch": 1949} {"train_loss": -12.574199676513672, "global_step": 327458, "epoch": 1949} {"train_loss": -12.299932479858398, "global_step": 327459, "epoch": 1949} {"train_loss": -12.301546096801758, "global_step": 327460, "epoch": 1949} {"train_loss": -12.649641036987305, "global_step": 327461, "epoch": 1949} {"train_loss": -12.405956268310547, "global_step": 327462, "epoch": 1949} {"train_loss": -12.676950454711914, "global_step": 327463, "epoch": 1949} {"train_loss": -12.208478927612305, "global_step": 327464, "epoch": 1949} {"train_loss": -12.514260292053223, "global_step": 327465, "epoch": 1949} {"train_loss": -12.401585578918457, "global_step": 327466, "epoch": 1949} {"train_loss": -12.532302856445312, "global_step": 327467, "epoch": 1949} {"train_loss": -12.43223762512207, "global_step": 327468, "epoch": 1949} {"train_loss": -12.354601860046387, "global_step": 327469, "epoch": 1949} {"train_loss": -12.37977409362793, "global_step": 327470, "epoch": 1949} {"train_loss": -12.587224960327148, "global_step": 327471, "epoch": 1949} {"train_loss": -12.385187149047852, "global_step": 327472, "epoch": 1949} {"train_loss": -12.51928424835205, "global_step": 327473, "epoch": 1949} {"train_loss": -12.534486770629883, "global_step": 327474, "epoch": 1949} {"train_loss": -12.648529052734375, "global_step": 327475, "epoch": 1949} {"train_loss": -12.591207504272461, "global_step": 327476, "epoch": 1949} {"train_loss": -12.691730499267578, "global_step": 327477, "epoch": 1949} {"train_loss": -12.546875953674316, "global_step": 327478, "epoch": 1949} {"train_loss": -12.60843563079834, "global_step": 327479, "epoch": 1949} {"train_loss": -12.739971160888672, "global_step": 327480, "epoch": 1949} {"train_loss": -12.547718048095703, "global_step": 327481, "epoch": 1949} {"train_loss": -12.805465698242188, "global_step": 327482, "epoch": 1949} {"train_loss": -12.548027992248535, "global_step": 327483, "epoch": 1949} {"train_loss": -12.643548965454102, "global_step": 327484, "epoch": 1949} {"train_loss": -12.663496971130371, "global_step": 327485, "epoch": 1949} {"train_loss": -12.576725006103516, "global_step": 327486, "epoch": 1949} {"train_loss": -12.574542999267578, "global_step": 327487, "epoch": 1949} {"train_loss": -12.625585556030273, "global_step": 327488, "epoch": 1949} {"train_loss": -12.52284049987793, "global_step": 327489, "epoch": 1949} {"train_loss": -12.439888000488281, "global_step": 327490, "epoch": 1949} {"train_loss": -12.342909812927246, "global_step": 327491, "epoch": 1949} {"train_loss": -12.726188659667969, "global_step": 327492, "epoch": 1949} {"train_loss": -11.982004165649414, "global_step": 327493, "epoch": 1949} {"train_loss": -12.38387680053711, "global_step": 327494, "epoch": 1949} {"train_loss": -12.158147811889648, "global_step": 327495, "epoch": 1949} {"train_loss": -11.907829284667969, "global_step": 327496, "epoch": 1949} {"train_loss": -12.520903587341309, "global_step": 327497, "epoch": 1949} {"train_loss": -12.205480575561523, "global_step": 327498, "epoch": 1949} {"train_loss": -12.389790534973145, "global_step": 327499, "epoch": 1949} {"train_loss": -12.47584056854248, "global_step": 327500, "epoch": 1949} {"train_loss": -12.132673263549805, "global_step": 327501, "epoch": 1949} {"train_loss": -11.960677146911621, "global_step": 327502, "epoch": 1949} {"train_loss": -10.70587158203125, "global_step": 327503, "epoch": 1949} {"train_loss": -10.751310348510742, "global_step": 327504, "epoch": 1949} {"train_loss": -12.07356071472168, "global_step": 327505, "epoch": 1949} {"train_loss": -11.664793014526367, "global_step": 327506, "epoch": 1949} {"train_loss": -11.628639221191406, "global_step": 327507, "epoch": 1949} {"train_loss": -11.149337768554688, "global_step": 327508, "epoch": 1949} {"train_loss": -12.126384735107422, "global_step": 327509, "epoch": 1949} {"train_loss": -11.778031349182129, "global_step": 327510, "epoch": 1949} {"train_loss": -10.733797073364258, "global_step": 327511, "epoch": 1949} {"train_loss": -11.109855651855469, "global_step": 327512, "epoch": 1949} {"train_loss": -12.148258209228516, "global_step": 327513, "epoch": 1949} {"train_loss": -11.928899765014648, "global_step": 327514, "epoch": 1949} {"train_loss": -11.758916854858398, "global_step": 327515, "epoch": 1949} {"train_loss": -11.465058326721191, "global_step": 327516, "epoch": 1949} {"train_loss": -12.040472030639648, "global_step": 327517, "epoch": 1949} {"train_loss": -11.900684356689453, "global_step": 327518, "epoch": 1949} {"train_loss": -11.915897369384766, "global_step": 327519, "epoch": 1949} {"train_loss": -12.215816497802734, "global_step": 327520, "epoch": 1949} {"train_loss": -11.590188026428223, "global_step": 327521, "epoch": 1949} {"train_loss": -11.752333641052246, "global_step": 327522, "epoch": 1949} {"train_loss": -11.953917503356934, "global_step": 327523, "epoch": 1949} {"train_loss": -10.91696548461914, "global_step": 327524, "epoch": 1949} {"train_loss": -12.01974868774414, "global_step": 327525, "epoch": 1949} {"train_loss": -12.05312728881836, "global_step": 327526, "epoch": 1949} {"train_loss": -11.02486801147461, "global_step": 327527, "epoch": 1949} {"train_loss": -12.115562438964844, "global_step": 327528, "epoch": 1949} {"train_loss": -11.122435569763184, "global_step": 327529, "epoch": 1949} {"train_loss": -11.872769355773926, "global_step": 327530, "epoch": 1949} {"train_loss": -11.824633598327637, "global_step": 327531, "epoch": 1949} {"train_loss": -11.810012817382812, "global_step": 327532, "epoch": 1949} {"train_loss": -11.627275466918945, "global_step": 327533, "epoch": 1949} {"train_loss": -12.29623031616211, "global_step": 327534, "epoch": 1949} {"train_loss": -11.145564079284668, "global_step": 327535, "epoch": 1949} {"train_loss": -12.032116889953613, "global_step": 327536, "epoch": 1949} {"train_loss": -11.615620613098145, "global_step": 327537, "epoch": 1949} {"train_loss": -11.924697875976562, "global_step": 327538, "epoch": 1949} {"train_loss": -11.860919952392578, "global_step": 327539, "epoch": 1949} {"train_loss": -12.071642875671387, "global_step": 327540, "epoch": 1949} {"train_loss": -12.185219764709473, "global_step": 327541, "epoch": 1949} {"train_loss": -11.998653411865234, "global_step": 327542, "epoch": 1949} {"train_loss": -12.050628662109375, "global_step": 327543, "epoch": 1949} {"train_loss": -12.338357925415039, "global_step": 327544, "epoch": 1949} {"train_loss": -11.784651756286621, "global_step": 327545, "epoch": 1949} {"train_loss": -12.22223949432373, "global_step": 327546, "epoch": 1949} {"train_loss": -11.988773345947266, "global_step": 327547, "epoch": 1949} {"train_loss": -12.303836822509766, "global_step": 327548, "epoch": 1949} {"train_loss": -11.815535545349121, "global_step": 327549, "epoch": 1949} {"train_loss": -12.330448150634766, "global_step": 327550, "epoch": 1949} {"train_loss": -11.896074295043945, "global_step": 327551, "epoch": 1949} {"train_loss": -12.522674560546875, "global_step": 327552, "epoch": 1949} {"train_loss": -12.254106521606445, "global_step": 327553, "epoch": 1949} {"train_loss": -11.920036315917969, "global_step": 327554, "epoch": 1949} {"train_loss": -12.183236122131348, "global_step": 327555, "epoch": 1949} {"train_loss": -12.063627243041992, "global_step": 327556, "epoch": 1949} {"train_loss": -12.330792427062988, "global_step": 327557, "epoch": 1949} {"train_loss": -12.290899276733398, "global_step": 327558, "epoch": 1949} {"train_loss": -12.208207130432129, "global_step": 327559, "epoch": 1949} {"train_loss": -12.30116081237793, "global_step": 327560, "epoch": 1949} {"train_loss": -12.299565315246582, "global_step": 327561, "epoch": 1949} {"train_loss": -12.31844711303711, "global_step": 327562, "epoch": 1949} {"train_loss": -12.522736549377441, "global_step": 327563, "epoch": 1949} {"train_loss": -12.227140426635742, "global_step": 327564, "epoch": 1949} {"train_loss": -12.527039527893066, "global_step": 327565, "epoch": 1949} {"train_loss": -12.409988403320312, "global_step": 327566, "epoch": 1949} {"train_loss": -11.76772689819336, "global_step": 327567, "epoch": 1949} {"train_loss": -12.554632186889648, "global_step": 327568, "epoch": 1949} {"train_loss": -12.39093017578125, "global_step": 327569, "epoch": 1949} {"train_loss": -12.501845359802246, "global_step": 327570, "epoch": 1949} {"train_loss": -12.150602340698242, "global_step": 327571, "epoch": 1949} {"train_loss": -12.373441696166992, "global_step": 327572, "epoch": 1949} {"train_loss": -12.476936340332031, "global_step": 327573, "epoch": 1949} {"train_loss": -12.529693603515625, "global_step": 327574, "epoch": 1949} {"train_loss": -12.137084007263184, "global_step": 327575, "epoch": 1949} {"train_loss": -12.410661697387695, "global_step": 327576, "epoch": 1949} {"train_loss": -12.519440650939941, "global_step": 327577, "epoch": 1949} {"train_loss": -12.199857711791992, "global_step": 327578, "epoch": 1949} {"train_loss": -12.437031745910645, "global_step": 327579, "epoch": 1949} {"train_loss": -12.274735450744629, "global_step": 327580, "epoch": 1949} {"train_loss": -12.064983367919922, "global_step": 327581, "epoch": 1949} {"train_loss": -12.34487533569336, "global_step": 327582, "epoch": 1949} {"train_loss": -12.486148834228516, "global_step": 327583, "epoch": 1949} {"train_loss": -12.486160278320312, "global_step": 327584, "epoch": 1949} {"train_loss": -12.302066802978516, "global_step": 327585, "epoch": 1949} {"train_loss": -12.667442321777344, "global_step": 327586, "epoch": 1949} {"train_loss": -12.504524230957031, "global_step": 327587, "epoch": 1949} {"train_loss": -11.778535842895508, "global_step": 327588, "epoch": 1949} {"train_loss": -11.81106185913086, "global_step": 327589, "epoch": 1949} {"train_loss": -12.289480209350586, "global_step": 327590, "epoch": 1949} {"train_loss": -10.694456100463867, "global_step": 327591, "epoch": 1949} {"train_loss": -11.708720207214355, "global_step": 327592, "epoch": 1949} {"train_loss": -12.43661880493164, "global_step": 327593, "epoch": 1949} {"train_loss": -11.123270988464355, "global_step": 327594, "epoch": 1949} {"train_loss": -10.765329360961914, "global_step": 327595, "epoch": 1949} {"train_loss": -12.13827896118164, "global_step": 327596, "epoch": 1949} {"train_loss": -11.905866622924805, "global_step": 327597, "epoch": 1949} {"train_loss": -11.626062393188477, "global_step": 327598, "epoch": 1949} {"train_loss": -12.149166629427956, "global_step": 327599, "epoch": 1949, "val_loss": 287109.0} {"train_loss": -11.424936294555664, "global_step": 327600, "epoch": 1950} {"train_loss": -11.396027565002441, "global_step": 327601, "epoch": 1950} {"train_loss": -11.957329750061035, "global_step": 327602, "epoch": 1950} {"train_loss": -10.753470420837402, "global_step": 327603, "epoch": 1950} {"train_loss": -11.605672836303711, "global_step": 327604, "epoch": 1950} {"train_loss": -12.102811813354492, "global_step": 327605, "epoch": 1950} {"train_loss": -10.950292587280273, "global_step": 327606, "epoch": 1950} {"train_loss": -11.919530868530273, "global_step": 327607, "epoch": 1950} {"train_loss": -11.4921875, "global_step": 327608, "epoch": 1950} {"train_loss": -12.06041145324707, "global_step": 327609, "epoch": 1950} {"train_loss": -12.271665573120117, "global_step": 327610, "epoch": 1950} {"train_loss": -11.3453369140625, "global_step": 327611, "epoch": 1950} {"train_loss": -12.182141304016113, "global_step": 327612, "epoch": 1950} {"train_loss": -11.44440746307373, "global_step": 327613, "epoch": 1950} {"train_loss": -11.915294647216797, "global_step": 327614, "epoch": 1950} {"train_loss": -12.232412338256836, "global_step": 327615, "epoch": 1950} {"train_loss": -12.101377487182617, "global_step": 327616, "epoch": 1950} {"train_loss": -11.944222450256348, "global_step": 327617, "epoch": 1950} {"train_loss": -11.89887809753418, "global_step": 327618, "epoch": 1950} {"train_loss": -12.468769073486328, "global_step": 327619, "epoch": 1950} {"train_loss": -11.836397171020508, "global_step": 327620, "epoch": 1950} {"train_loss": -11.97298526763916, "global_step": 327621, "epoch": 1950} {"train_loss": -12.162757873535156, "global_step": 327622, "epoch": 1950} {"train_loss": -11.990257263183594, "global_step": 327623, "epoch": 1950} {"train_loss": -12.058635711669922, "global_step": 327624, "epoch": 1950} {"train_loss": -12.130411148071289, "global_step": 327625, "epoch": 1950} {"train_loss": -12.445869445800781, "global_step": 327626, "epoch": 1950} {"train_loss": -11.905376434326172, "global_step": 327627, "epoch": 1950} {"train_loss": -12.302009582519531, "global_step": 327628, "epoch": 1950} {"train_loss": -12.400917053222656, "global_step": 327629, "epoch": 1950} {"train_loss": -12.305476188659668, "global_step": 327630, "epoch": 1950} {"train_loss": -12.115646362304688, "global_step": 327631, "epoch": 1950} {"train_loss": -12.463743209838867, "global_step": 327632, "epoch": 1950} {"train_loss": -12.564680099487305, "global_step": 327633, "epoch": 1950} {"train_loss": -12.194475173950195, "global_step": 327634, "epoch": 1950} {"train_loss": -12.36188793182373, "global_step": 327635, "epoch": 1950} {"train_loss": -12.474316596984863, "global_step": 327636, "epoch": 1950} {"train_loss": -12.334324836730957, "global_step": 327637, "epoch": 1950} {"train_loss": -12.278114318847656, "global_step": 327638, "epoch": 1950} {"train_loss": -12.700372695922852, "global_step": 327639, "epoch": 1950} {"train_loss": -12.0775146484375, "global_step": 327640, "epoch": 1950} {"train_loss": -11.597556114196777, "global_step": 327641, "epoch": 1950} {"train_loss": -12.341694831848145, "global_step": 327642, "epoch": 1950} {"train_loss": -12.088272094726562, "global_step": 327643, "epoch": 1950} {"train_loss": -11.920167922973633, "global_step": 327644, "epoch": 1950} {"train_loss": -12.00312328338623, "global_step": 327645, "epoch": 1950} {"train_loss": -12.171344757080078, "global_step": 327646, "epoch": 1950} {"train_loss": -11.673519134521484, "global_step": 327647, "epoch": 1950} {"train_loss": -12.356269836425781, "global_step": 327648, "epoch": 1950} {"train_loss": -12.080087661743164, "global_step": 327649, "epoch": 1950} {"train_loss": -12.20724868774414, "global_step": 327650, "epoch": 1950} {"train_loss": -11.829191207885742, "global_step": 327651, "epoch": 1950} {"train_loss": -11.58930778503418, "global_step": 327652, "epoch": 1950} {"train_loss": -12.137923240661621, "global_step": 327653, "epoch": 1950} {"train_loss": -12.103286743164062, "global_step": 327654, "epoch": 1950} {"train_loss": -12.29987621307373, "global_step": 327655, "epoch": 1950} {"train_loss": -12.290360450744629, "global_step": 327656, "epoch": 1950} {"train_loss": -12.179726600646973, "global_step": 327657, "epoch": 1950} {"train_loss": -12.359563827514648, "global_step": 327658, "epoch": 1950} {"train_loss": -12.160468101501465, "global_step": 327659, "epoch": 1950} {"train_loss": -12.047647476196289, "global_step": 327660, "epoch": 1950} {"train_loss": -11.838676452636719, "global_step": 327661, "epoch": 1950} {"train_loss": -11.936012268066406, "global_step": 327662, "epoch": 1950} {"train_loss": -11.548592567443848, "global_step": 327663, "epoch": 1950} {"train_loss": -11.693572044372559, "global_step": 327664, "epoch": 1950} {"train_loss": -11.841362953186035, "global_step": 327665, "epoch": 1950} {"train_loss": -10.359931945800781, "global_step": 327666, "epoch": 1950} {"train_loss": -11.95139217376709, "global_step": 327667, "epoch": 1950} {"train_loss": -11.099918365478516, "global_step": 327668, "epoch": 1950} {"train_loss": -11.619826316833496, "global_step": 327669, "epoch": 1950} {"train_loss": -10.30978012084961, "global_step": 327670, "epoch": 1950} {"train_loss": -11.91589641571045, "global_step": 327671, "epoch": 1950} {"train_loss": -10.842391967773438, "global_step": 327672, "epoch": 1950} {"train_loss": -10.837631225585938, "global_step": 327673, "epoch": 1950} {"train_loss": -11.470512390136719, "global_step": 327674, "epoch": 1950} {"train_loss": -11.560454368591309, "global_step": 327675, "epoch": 1950} {"train_loss": -10.187034606933594, "global_step": 327676, "epoch": 1950} {"train_loss": -11.611780166625977, "global_step": 327677, "epoch": 1950} {"train_loss": -10.419483184814453, "global_step": 327678, "epoch": 1950} {"train_loss": -10.78895092010498, "global_step": 327679, "epoch": 1950} {"train_loss": -11.358077049255371, "global_step": 327680, "epoch": 1950} {"train_loss": -11.2452974319458, "global_step": 327681, "epoch": 1950} {"train_loss": -10.629264831542969, "global_step": 327682, "epoch": 1950} {"train_loss": -11.520038604736328, "global_step": 327683, "epoch": 1950} {"train_loss": -11.4829683303833, "global_step": 327684, "epoch": 1950} {"train_loss": -11.359654426574707, "global_step": 327685, "epoch": 1950} {"train_loss": -11.469718933105469, "global_step": 327686, "epoch": 1950} {"train_loss": -11.361177444458008, "global_step": 327687, "epoch": 1950} {"train_loss": -11.881962776184082, "global_step": 327688, "epoch": 1950} {"train_loss": -11.436148643493652, "global_step": 327689, "epoch": 1950} {"train_loss": -11.339517593383789, "global_step": 327690, "epoch": 1950} {"train_loss": -11.747976303100586, "global_step": 327691, "epoch": 1950} {"train_loss": -11.086858749389648, "global_step": 327692, "epoch": 1950} {"train_loss": -11.614538192749023, "global_step": 327693, "epoch": 1950} {"train_loss": -10.851366996765137, "global_step": 327694, "epoch": 1950} {"train_loss": -11.665376663208008, "global_step": 327695, "epoch": 1950} {"train_loss": -11.704968452453613, "global_step": 327696, "epoch": 1950} {"train_loss": -11.715678215026855, "global_step": 327697, "epoch": 1950} {"train_loss": -12.119312286376953, "global_step": 327698, "epoch": 1950} {"train_loss": -11.487260818481445, "global_step": 327699, "epoch": 1950} {"train_loss": -12.056190490722656, "global_step": 327700, "epoch": 1950} {"train_loss": -11.493903160095215, "global_step": 327701, "epoch": 1950} {"train_loss": -11.932756423950195, "global_step": 327702, "epoch": 1950} {"train_loss": -12.169678688049316, "global_step": 327703, "epoch": 1950} {"train_loss": -11.603126525878906, "global_step": 327704, "epoch": 1950} {"train_loss": -12.297611236572266, "global_step": 327705, "epoch": 1950} {"train_loss": -11.809618949890137, "global_step": 327706, "epoch": 1950} {"train_loss": -12.019685745239258, "global_step": 327707, "epoch": 1950} {"train_loss": -12.370283126831055, "global_step": 327708, "epoch": 1950} {"train_loss": -11.734628677368164, "global_step": 327709, "epoch": 1950} {"train_loss": -11.973026275634766, "global_step": 327710, "epoch": 1950} {"train_loss": -12.153009414672852, "global_step": 327711, "epoch": 1950} {"train_loss": -11.810188293457031, "global_step": 327712, "epoch": 1950} {"train_loss": -12.346986770629883, "global_step": 327713, "epoch": 1950} {"train_loss": -12.048783302307129, "global_step": 327714, "epoch": 1950} {"train_loss": -12.00827407836914, "global_step": 327715, "epoch": 1950} {"train_loss": -12.364850997924805, "global_step": 327716, "epoch": 1950} {"train_loss": -11.956428527832031, "global_step": 327717, "epoch": 1950} {"train_loss": -12.434734344482422, "global_step": 327718, "epoch": 1950} {"train_loss": -12.037483215332031, "global_step": 327719, "epoch": 1950} {"train_loss": -12.41162109375, "global_step": 327720, "epoch": 1950} {"train_loss": -12.171788215637207, "global_step": 327721, "epoch": 1950} {"train_loss": -12.25709342956543, "global_step": 327722, "epoch": 1950} {"train_loss": -12.420042037963867, "global_step": 327723, "epoch": 1950} {"train_loss": -12.087270736694336, "global_step": 327724, "epoch": 1950} {"train_loss": -12.304929733276367, "global_step": 327725, "epoch": 1950} {"train_loss": -12.28957748413086, "global_step": 327726, "epoch": 1950} {"train_loss": -12.246784210205078, "global_step": 327727, "epoch": 1950} {"train_loss": -12.440725326538086, "global_step": 327728, "epoch": 1950} {"train_loss": -12.442092895507812, "global_step": 327729, "epoch": 1950} {"train_loss": -12.501358985900879, "global_step": 327730, "epoch": 1950} {"train_loss": -12.243904113769531, "global_step": 327731, "epoch": 1950} {"train_loss": -12.402532577514648, "global_step": 327732, "epoch": 1950} {"train_loss": -12.340581893920898, "global_step": 327733, "epoch": 1950} {"train_loss": -12.19206428527832, "global_step": 327734, "epoch": 1950} {"train_loss": -12.594768524169922, "global_step": 327735, "epoch": 1950} {"train_loss": -12.28734016418457, "global_step": 327736, "epoch": 1950} {"train_loss": -12.260232925415039, "global_step": 327737, "epoch": 1950} {"train_loss": -12.066064834594727, "global_step": 327738, "epoch": 1950} {"train_loss": -12.422218322753906, "global_step": 327739, "epoch": 1950} {"train_loss": -12.331974029541016, "global_step": 327740, "epoch": 1950} {"train_loss": -12.330708503723145, "global_step": 327741, "epoch": 1950} {"train_loss": -12.380441665649414, "global_step": 327742, "epoch": 1950} {"train_loss": -12.599346160888672, "global_step": 327743, "epoch": 1950} {"train_loss": -12.401676177978516, "global_step": 327744, "epoch": 1950} {"train_loss": -12.502913475036621, "global_step": 327745, "epoch": 1950} {"train_loss": -12.497220993041992, "global_step": 327746, "epoch": 1950} {"train_loss": -12.516854286193848, "global_step": 327747, "epoch": 1950} {"train_loss": -12.554368019104004, "global_step": 327748, "epoch": 1950} {"train_loss": -12.42470645904541, "global_step": 327749, "epoch": 1950} {"train_loss": -12.52842903137207, "global_step": 327750, "epoch": 1950} {"train_loss": -12.396148681640625, "global_step": 327751, "epoch": 1950} {"train_loss": -12.466259002685547, "global_step": 327752, "epoch": 1950} {"train_loss": -12.62244701385498, "global_step": 327753, "epoch": 1950} {"train_loss": -12.177886009216309, "global_step": 327754, "epoch": 1950} {"train_loss": -12.429121971130371, "global_step": 327755, "epoch": 1950} {"train_loss": -12.269172668457031, "global_step": 327756, "epoch": 1950} {"train_loss": -12.331600189208984, "global_step": 327757, "epoch": 1950} {"train_loss": -12.428119659423828, "global_step": 327758, "epoch": 1950} {"train_loss": -12.401077270507812, "global_step": 327759, "epoch": 1950} {"train_loss": -12.33306884765625, "global_step": 327760, "epoch": 1950} {"train_loss": -12.305644989013672, "global_step": 327761, "epoch": 1950} {"train_loss": -12.412982940673828, "global_step": 327762, "epoch": 1950} {"train_loss": -12.41207504272461, "global_step": 327763, "epoch": 1950} {"train_loss": -12.231319427490234, "global_step": 327764, "epoch": 1950} {"train_loss": -12.226066589355469, "global_step": 327765, "epoch": 1950} {"train_loss": -11.9937744140625, "global_step": 327766, "epoch": 1950} {"train_loss": -11.968264574096317, "global_step": 327767, "epoch": 1950, "train/sim_max_reward_0": 0.5432642953736946, "train/sim_max_reward_1": 0.98819023356651, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.4777618405275561, "train/sim_max_reward_4": 0.9591415388374126, "train/sim_max_reward_5": 0.5908922381093508, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.3718626924717968, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.9293104491978254, "test/sim_max_reward_4400004": 0.410377042570065, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.45241565902493164, "test/sim_max_reward_4400008": 0.5220915343594948, "test/sim_max_reward_4400009": 0.4153367141939946, "test/sim_max_reward_4400010": 0.9808225335348596, "test/sim_max_reward_4400011": 0.9761659852260308, "test/sim_max_reward_4400012": 0.9978896774088192, "test/sim_max_reward_4400013": 0.9667241823867863, "test/sim_max_reward_4400014": 0.3348730307853941, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9874027994344944, "test/sim_max_reward_4400019": 0.7186555170693147, "test/sim_max_reward_4400020": 0.614934323844812, "test/sim_max_reward_4400021": 0.6051324160173975, "test/sim_max_reward_4400022": 0.9814665393995062, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.3651178683049682, "test/sim_max_reward_4400025": 0.5413525340115211, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.5087079206419342, "test/sim_max_reward_4400028": 0.017100746913841898, "test/sim_max_reward_4400029": 1.0, "test/sim_max_reward_4400030": 0.3851210596400913, "test/sim_max_reward_4400031": 0.9730830819981354, "test/sim_max_reward_4400032": 0.10226862381363383, "test/sim_max_reward_4400033": 0.6352989991580278, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.36236030063599434, "test/sim_max_reward_4400037": 0.9944773328413914, "test/sim_max_reward_4400038": 0.29894921771488736, "test/sim_max_reward_4400039": 0.4120055698654263, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9623238979803755, "test/sim_max_reward_4400042": 0.007957278371513303, "test/sim_max_reward_4400043": 0.9117861492820553, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.9827084888277744, "test/sim_max_reward_4400046": 0.3002453035105801, "test/sim_max_reward_4400047": 0.9947671570437358, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.3090302550822929, "train/mean_score": 0.593208357735754, "test/mean_score": 0.5922889693387146, "val_loss": 284557.84375, "train_action_mse_error": 3.4509215354919434} {"train_loss": -11.68014144897461, "global_step": 327768, "epoch": 1951} {"train_loss": -11.344684600830078, "global_step": 327769, "epoch": 1951} {"train_loss": -12.2031831741333, "global_step": 327770, "epoch": 1951} {"train_loss": -11.5191650390625, "global_step": 327771, "epoch": 1951} {"train_loss": -10.889081954956055, "global_step": 327772, "epoch": 1951} {"train_loss": -12.331323623657227, "global_step": 327773, "epoch": 1951} {"train_loss": -10.988835334777832, "global_step": 327774, "epoch": 1951} {"train_loss": -11.818516731262207, "global_step": 327775, "epoch": 1951} {"train_loss": -11.88843059539795, "global_step": 327776, "epoch": 1951} {"train_loss": -11.471460342407227, "global_step": 327777, "epoch": 1951} {"train_loss": -10.97264575958252, "global_step": 327778, "epoch": 1951} {"train_loss": -12.066912651062012, "global_step": 327779, "epoch": 1951} {"train_loss": -11.684930801391602, "global_step": 327780, "epoch": 1951} {"train_loss": -12.072371482849121, "global_step": 327781, "epoch": 1951} {"train_loss": -11.748306274414062, "global_step": 327782, "epoch": 1951} {"train_loss": -12.260276794433594, "global_step": 327783, "epoch": 1951} {"train_loss": -11.94451904296875, "global_step": 327784, "epoch": 1951} {"train_loss": -12.149307250976562, "global_step": 327785, "epoch": 1951} {"train_loss": -11.901336669921875, "global_step": 327786, "epoch": 1951} {"train_loss": -12.142044067382812, "global_step": 327787, "epoch": 1951} {"train_loss": -11.968271255493164, "global_step": 327788, "epoch": 1951} {"train_loss": -11.718404769897461, "global_step": 327789, "epoch": 1951} {"train_loss": -12.216750144958496, "global_step": 327790, "epoch": 1951} {"train_loss": -11.773409843444824, "global_step": 327791, "epoch": 1951} {"train_loss": -11.952285766601562, "global_step": 327792, "epoch": 1951} {"train_loss": -12.22866439819336, "global_step": 327793, "epoch": 1951} {"train_loss": -11.730247497558594, "global_step": 327794, "epoch": 1951} {"train_loss": -12.127462387084961, "global_step": 327795, "epoch": 1951} {"train_loss": -11.481637001037598, "global_step": 327796, "epoch": 1951} {"train_loss": -12.219804763793945, "global_step": 327797, "epoch": 1951} {"train_loss": -12.130186080932617, "global_step": 327798, "epoch": 1951} {"train_loss": -11.61311149597168, "global_step": 327799, "epoch": 1951} {"train_loss": -11.854228019714355, "global_step": 327800, "epoch": 1951} {"train_loss": -12.224733352661133, "global_step": 327801, "epoch": 1951} {"train_loss": -11.75037670135498, "global_step": 327802, "epoch": 1951} {"train_loss": -11.82558822631836, "global_step": 327803, "epoch": 1951} {"train_loss": -12.131000518798828, "global_step": 327804, "epoch": 1951} {"train_loss": -11.739547729492188, "global_step": 327805, "epoch": 1951} {"train_loss": -11.92951774597168, "global_step": 327806, "epoch": 1951} {"train_loss": -12.037363052368164, "global_step": 327807, "epoch": 1951} {"train_loss": -11.83793830871582, "global_step": 327808, "epoch": 1951} {"train_loss": -12.201374053955078, "global_step": 327809, "epoch": 1951} {"train_loss": -11.985008239746094, "global_step": 327810, "epoch": 1951} {"train_loss": -12.010855674743652, "global_step": 327811, "epoch": 1951} {"train_loss": -11.853631973266602, "global_step": 327812, "epoch": 1951} {"train_loss": -12.159181594848633, "global_step": 327813, "epoch": 1951} {"train_loss": -11.921031951904297, "global_step": 327814, "epoch": 1951} {"train_loss": -12.235454559326172, "global_step": 327815, "epoch": 1951} {"train_loss": -11.807958602905273, "global_step": 327816, "epoch": 1951} {"train_loss": -11.942696571350098, "global_step": 327817, "epoch": 1951} {"train_loss": -12.363924026489258, "global_step": 327818, "epoch": 1951} {"train_loss": -11.92395305633545, "global_step": 327819, "epoch": 1951} {"train_loss": -11.870453834533691, "global_step": 327820, "epoch": 1951} {"train_loss": -12.057903289794922, "global_step": 327821, "epoch": 1951} {"train_loss": -11.818493843078613, "global_step": 327822, "epoch": 1951} {"train_loss": -11.85536003112793, "global_step": 327823, "epoch": 1951} {"train_loss": -12.04712200164795, "global_step": 327824, "epoch": 1951} {"train_loss": -11.918479919433594, "global_step": 327825, "epoch": 1951} {"train_loss": -12.271653175354004, "global_step": 327826, "epoch": 1951} {"train_loss": -11.478089332580566, "global_step": 327827, "epoch": 1951} {"train_loss": -11.86335277557373, "global_step": 327828, "epoch": 1951} {"train_loss": -11.656473159790039, "global_step": 327829, "epoch": 1951} {"train_loss": -10.382535934448242, "global_step": 327830, "epoch": 1951} {"train_loss": -11.156055450439453, "global_step": 327831, "epoch": 1951} {"train_loss": -11.009586334228516, "global_step": 327832, "epoch": 1951} {"train_loss": -11.240196228027344, "global_step": 327833, "epoch": 1951} {"train_loss": -10.825017929077148, "global_step": 327834, "epoch": 1951} {"train_loss": -9.239460945129395, "global_step": 327835, "epoch": 1951} {"train_loss": -7.790102005004883, "global_step": 327836, "epoch": 1951} {"train_loss": -8.886456489562988, "global_step": 327837, "epoch": 1951} {"train_loss": -10.143472671508789, "global_step": 327838, "epoch": 1951} {"train_loss": -10.384383201599121, "global_step": 327839, "epoch": 1951} {"train_loss": -8.510653495788574, "global_step": 327840, "epoch": 1951} {"train_loss": -8.243115425109863, "global_step": 327841, "epoch": 1951} {"train_loss": -7.722614288330078, "global_step": 327842, "epoch": 1951} {"train_loss": -8.294189453125, "global_step": 327843, "epoch": 1951} {"train_loss": -9.024287223815918, "global_step": 327844, "epoch": 1951} {"train_loss": -9.616436004638672, "global_step": 327845, "epoch": 1951} {"train_loss": -9.89148235321045, "global_step": 327846, "epoch": 1951} {"train_loss": -9.67536449432373, "global_step": 327847, "epoch": 1951} {"train_loss": -10.900413513183594, "global_step": 327848, "epoch": 1951} {"train_loss": -10.680482864379883, "global_step": 327849, "epoch": 1951} {"train_loss": -11.375320434570312, "global_step": 327850, "epoch": 1951} {"train_loss": -11.392660140991211, "global_step": 327851, "epoch": 1951} {"train_loss": -11.085482597351074, "global_step": 327852, "epoch": 1951} {"train_loss": -11.475685119628906, "global_step": 327853, "epoch": 1951} {"train_loss": -11.728160858154297, "global_step": 327854, "epoch": 1951} {"train_loss": -11.516717910766602, "global_step": 327855, "epoch": 1951} {"train_loss": -11.757165908813477, "global_step": 327856, "epoch": 1951} {"train_loss": -11.849283218383789, "global_step": 327857, "epoch": 1951} {"train_loss": -11.608966827392578, "global_step": 327858, "epoch": 1951} {"train_loss": -11.85932445526123, "global_step": 327859, "epoch": 1951} {"train_loss": -11.81684684753418, "global_step": 327860, "epoch": 1951} {"train_loss": -12.058219909667969, "global_step": 327861, "epoch": 1951} {"train_loss": -11.90910530090332, "global_step": 327862, "epoch": 1951} {"train_loss": -11.924760818481445, "global_step": 327863, "epoch": 1951} {"train_loss": -11.980857849121094, "global_step": 327864, "epoch": 1951} {"train_loss": -12.04928970336914, "global_step": 327865, "epoch": 1951} {"train_loss": -11.995728492736816, "global_step": 327866, "epoch": 1951} {"train_loss": -11.632369995117188, "global_step": 327867, "epoch": 1951} {"train_loss": -11.96365737915039, "global_step": 327868, "epoch": 1951} {"train_loss": -12.06140422821045, "global_step": 327869, "epoch": 1951} {"train_loss": -12.224784851074219, "global_step": 327870, "epoch": 1951} {"train_loss": -12.168497085571289, "global_step": 327871, "epoch": 1951} {"train_loss": -12.021411895751953, "global_step": 327872, "epoch": 1951} {"train_loss": -12.335214614868164, "global_step": 327873, "epoch": 1951} {"train_loss": -12.044055938720703, "global_step": 327874, "epoch": 1951} {"train_loss": -12.276230812072754, "global_step": 327875, "epoch": 1951} {"train_loss": -12.265262603759766, "global_step": 327876, "epoch": 1951} {"train_loss": -12.21145248413086, "global_step": 327877, "epoch": 1951} {"train_loss": -12.166749954223633, "global_step": 327878, "epoch": 1951} {"train_loss": -12.401056289672852, "global_step": 327879, "epoch": 1951} {"train_loss": -12.131739616394043, "global_step": 327880, "epoch": 1951} {"train_loss": -12.2783784866333, "global_step": 327881, "epoch": 1951} {"train_loss": -12.17090892791748, "global_step": 327882, "epoch": 1951} {"train_loss": -12.204012870788574, "global_step": 327883, "epoch": 1951} {"train_loss": -12.133716583251953, "global_step": 327884, "epoch": 1951} {"train_loss": -12.297236442565918, "global_step": 327885, "epoch": 1951} {"train_loss": -12.441696166992188, "global_step": 327886, "epoch": 1951} {"train_loss": -12.378321647644043, "global_step": 327887, "epoch": 1951} {"train_loss": -12.45897102355957, "global_step": 327888, "epoch": 1951} {"train_loss": -12.469990730285645, "global_step": 327889, "epoch": 1951} {"train_loss": -12.291191101074219, "global_step": 327890, "epoch": 1951} {"train_loss": -12.177006721496582, "global_step": 327891, "epoch": 1951} {"train_loss": -12.376385688781738, "global_step": 327892, "epoch": 1951} {"train_loss": -12.44262981414795, "global_step": 327893, "epoch": 1951} {"train_loss": -12.460220336914062, "global_step": 327894, "epoch": 1951} {"train_loss": -12.32536506652832, "global_step": 327895, "epoch": 1951} {"train_loss": -12.324748992919922, "global_step": 327896, "epoch": 1951} {"train_loss": -12.377963066101074, "global_step": 327897, "epoch": 1951} {"train_loss": -12.368623733520508, "global_step": 327898, "epoch": 1951} {"train_loss": -12.270172119140625, "global_step": 327899, "epoch": 1951} {"train_loss": -12.330784797668457, "global_step": 327900, "epoch": 1951} {"train_loss": -12.228963851928711, "global_step": 327901, "epoch": 1951} {"train_loss": -12.146331787109375, "global_step": 327902, "epoch": 1951} {"train_loss": -12.229530334472656, "global_step": 327903, "epoch": 1951} {"train_loss": -12.54440689086914, "global_step": 327904, "epoch": 1951} {"train_loss": -12.189352035522461, "global_step": 327905, "epoch": 1951} {"train_loss": -12.001014709472656, "global_step": 327906, "epoch": 1951} {"train_loss": -12.412925720214844, "global_step": 327907, "epoch": 1951} {"train_loss": -12.623188018798828, "global_step": 327908, "epoch": 1951} {"train_loss": -12.091668128967285, "global_step": 327909, "epoch": 1951} {"train_loss": -11.999720573425293, "global_step": 327910, "epoch": 1951} {"train_loss": -12.495868682861328, "global_step": 327911, "epoch": 1951} {"train_loss": -12.2849760055542, "global_step": 327912, "epoch": 1951} {"train_loss": -12.525480270385742, "global_step": 327913, "epoch": 1951} {"train_loss": -12.258600234985352, "global_step": 327914, "epoch": 1951} {"train_loss": -12.468408584594727, "global_step": 327915, "epoch": 1951} {"train_loss": -12.353531837463379, "global_step": 327916, "epoch": 1951} {"train_loss": -12.31509780883789, "global_step": 327917, "epoch": 1951} {"train_loss": -12.132010459899902, "global_step": 327918, "epoch": 1951} {"train_loss": -12.3038911819458, "global_step": 327919, "epoch": 1951} {"train_loss": -12.39584732055664, "global_step": 327920, "epoch": 1951} {"train_loss": -12.557092666625977, "global_step": 327921, "epoch": 1951} {"train_loss": -12.51854419708252, "global_step": 327922, "epoch": 1951} {"train_loss": -12.646381378173828, "global_step": 327923, "epoch": 1951} {"train_loss": -12.661409378051758, "global_step": 327924, "epoch": 1951} {"train_loss": -12.493995666503906, "global_step": 327925, "epoch": 1951} {"train_loss": -12.440189361572266, "global_step": 327926, "epoch": 1951} {"train_loss": -12.485424041748047, "global_step": 327927, "epoch": 1951} {"train_loss": -12.673646926879883, "global_step": 327928, "epoch": 1951} {"train_loss": -12.395517349243164, "global_step": 327929, "epoch": 1951} {"train_loss": -12.53732967376709, "global_step": 327930, "epoch": 1951} {"train_loss": -12.49524974822998, "global_step": 327931, "epoch": 1951} {"train_loss": -12.316186904907227, "global_step": 327932, "epoch": 1951} {"train_loss": -12.726968765258789, "global_step": 327933, "epoch": 1951} {"train_loss": -12.26999568939209, "global_step": 327934, "epoch": 1951} {"train_loss": -11.786428332328796, "global_step": 327935, "epoch": 1951, "val_loss": 283232.6875} {"train_loss": -12.313959121704102, "global_step": 327936, "epoch": 1952} {"train_loss": -12.359832763671875, "global_step": 327937, "epoch": 1952} {"train_loss": -12.49821949005127, "global_step": 327938, "epoch": 1952} {"train_loss": -12.472600936889648, "global_step": 327939, "epoch": 1952} {"train_loss": -12.25524616241455, "global_step": 327940, "epoch": 1952} {"train_loss": -12.398310661315918, "global_step": 327941, "epoch": 1952} {"train_loss": -12.470376968383789, "global_step": 327942, "epoch": 1952} {"train_loss": -12.634981155395508, "global_step": 327943, "epoch": 1952} {"train_loss": -12.626461029052734, "global_step": 327944, "epoch": 1952} {"train_loss": -12.618232727050781, "global_step": 327945, "epoch": 1952} {"train_loss": -12.6790771484375, "global_step": 327946, "epoch": 1952} {"train_loss": -12.116716384887695, "global_step": 327947, "epoch": 1952} {"train_loss": -12.844273567199707, "global_step": 327948, "epoch": 1952} {"train_loss": -12.458855628967285, "global_step": 327949, "epoch": 1952} {"train_loss": -12.576937675476074, "global_step": 327950, "epoch": 1952} {"train_loss": -12.533867835998535, "global_step": 327951, "epoch": 1952} {"train_loss": -12.104837417602539, "global_step": 327952, "epoch": 1952} {"train_loss": -11.856590270996094, "global_step": 327953, "epoch": 1952} {"train_loss": -11.575183868408203, "global_step": 327954, "epoch": 1952} {"train_loss": -11.670525550842285, "global_step": 327955, "epoch": 1952} {"train_loss": -11.387147903442383, "global_step": 327956, "epoch": 1952} {"train_loss": -11.624090194702148, "global_step": 327957, "epoch": 1952} {"train_loss": -12.036842346191406, "global_step": 327958, "epoch": 1952} {"train_loss": -10.247628211975098, "global_step": 327959, "epoch": 1952} {"train_loss": -9.86943244934082, "global_step": 327960, "epoch": 1952} {"train_loss": -9.948655128479004, "global_step": 327961, "epoch": 1952} {"train_loss": -12.103511810302734, "global_step": 327962, "epoch": 1952} {"train_loss": -10.675697326660156, "global_step": 327963, "epoch": 1952} {"train_loss": -11.536757469177246, "global_step": 327964, "epoch": 1952} {"train_loss": -9.900923728942871, "global_step": 327965, "epoch": 1952} {"train_loss": -11.70359992980957, "global_step": 327966, "epoch": 1952} {"train_loss": -9.804388999938965, "global_step": 327967, "epoch": 1952} {"train_loss": -11.247198104858398, "global_step": 327968, "epoch": 1952} {"train_loss": -9.962602615356445, "global_step": 327969, "epoch": 1952} {"train_loss": -10.966175079345703, "global_step": 327970, "epoch": 1952} {"train_loss": -10.609275817871094, "global_step": 327971, "epoch": 1952} {"train_loss": -9.512626647949219, "global_step": 327972, "epoch": 1952} {"train_loss": -11.92025375366211, "global_step": 327973, "epoch": 1952} {"train_loss": -9.602563858032227, "global_step": 327974, "epoch": 1952} {"train_loss": -9.573497772216797, "global_step": 327975, "epoch": 1952} {"train_loss": -10.826040267944336, "global_step": 327976, "epoch": 1952} {"train_loss": -10.182096481323242, "global_step": 327977, "epoch": 1952} {"train_loss": -10.546915054321289, "global_step": 327978, "epoch": 1952} {"train_loss": -10.354854583740234, "global_step": 327979, "epoch": 1952} {"train_loss": -11.113382339477539, "global_step": 327980, "epoch": 1952} {"train_loss": -11.221158981323242, "global_step": 327981, "epoch": 1952} {"train_loss": -9.702472686767578, "global_step": 327982, "epoch": 1952} {"train_loss": -11.57351016998291, "global_step": 327983, "epoch": 1952} {"train_loss": -10.662986755371094, "global_step": 327984, "epoch": 1952} {"train_loss": -11.24069881439209, "global_step": 327985, "epoch": 1952} {"train_loss": -11.227999687194824, "global_step": 327986, "epoch": 1952} {"train_loss": -11.320893287658691, "global_step": 327987, "epoch": 1952} {"train_loss": -11.804256439208984, "global_step": 327988, "epoch": 1952} {"train_loss": -11.25930404663086, "global_step": 327989, "epoch": 1952} {"train_loss": -11.162824630737305, "global_step": 327990, "epoch": 1952} {"train_loss": -11.58122730255127, "global_step": 327991, "epoch": 1952} {"train_loss": -11.293180465698242, "global_step": 327992, "epoch": 1952} {"train_loss": -11.530590057373047, "global_step": 327993, "epoch": 1952} {"train_loss": -11.754451751708984, "global_step": 327994, "epoch": 1952} {"train_loss": -11.05051040649414, "global_step": 327995, "epoch": 1952} {"train_loss": -11.719188690185547, "global_step": 327996, "epoch": 1952} {"train_loss": -11.265507698059082, "global_step": 327997, "epoch": 1952} {"train_loss": -11.69504165649414, "global_step": 327998, "epoch": 1952} {"train_loss": -11.021533012390137, "global_step": 327999, "epoch": 1952} {"train_loss": -11.17670726776123, "global_step": 328000, "epoch": 1952} {"train_loss": -11.787647247314453, "global_step": 328001, "epoch": 1952} {"train_loss": -10.828629493713379, "global_step": 328002, "epoch": 1952} {"train_loss": -12.185547828674316, "global_step": 328003, "epoch": 1952} {"train_loss": -10.707269668579102, "global_step": 328004, "epoch": 1952} {"train_loss": -12.008852005004883, "global_step": 328005, "epoch": 1952} {"train_loss": -11.078107833862305, "global_step": 328006, "epoch": 1952} {"train_loss": -12.179712295532227, "global_step": 328007, "epoch": 1952} {"train_loss": -11.670185089111328, "global_step": 328008, "epoch": 1952} {"train_loss": -11.755327224731445, "global_step": 328009, "epoch": 1952} {"train_loss": -11.52869701385498, "global_step": 328010, "epoch": 1952} {"train_loss": -12.072423934936523, "global_step": 328011, "epoch": 1952} {"train_loss": -11.81468391418457, "global_step": 328012, "epoch": 1952} {"train_loss": -12.106054306030273, "global_step": 328013, "epoch": 1952} {"train_loss": -11.97160530090332, "global_step": 328014, "epoch": 1952} {"train_loss": -12.151551246643066, "global_step": 328015, "epoch": 1952} {"train_loss": -12.065842628479004, "global_step": 328016, "epoch": 1952} {"train_loss": -12.013040542602539, "global_step": 328017, "epoch": 1952} {"train_loss": -12.180000305175781, "global_step": 328018, "epoch": 1952} {"train_loss": -12.188624382019043, "global_step": 328019, "epoch": 1952} {"train_loss": -11.995248794555664, "global_step": 328020, "epoch": 1952} {"train_loss": -12.236952781677246, "global_step": 328021, "epoch": 1952} {"train_loss": -11.715038299560547, "global_step": 328022, "epoch": 1952} {"train_loss": -12.14287281036377, "global_step": 328023, "epoch": 1952} {"train_loss": -11.734977722167969, "global_step": 328024, "epoch": 1952} {"train_loss": -12.25004768371582, "global_step": 328025, "epoch": 1952} {"train_loss": -12.091155052185059, "global_step": 328026, "epoch": 1952} {"train_loss": -11.804271697998047, "global_step": 328027, "epoch": 1952} {"train_loss": -12.160477638244629, "global_step": 328028, "epoch": 1952} {"train_loss": -12.089776039123535, "global_step": 328029, "epoch": 1952} {"train_loss": -12.230741500854492, "global_step": 328030, "epoch": 1952} {"train_loss": -12.170531272888184, "global_step": 328031, "epoch": 1952} {"train_loss": -12.132431030273438, "global_step": 328032, "epoch": 1952} {"train_loss": -12.058425903320312, "global_step": 328033, "epoch": 1952} {"train_loss": -12.34719181060791, "global_step": 328034, "epoch": 1952} {"train_loss": -12.009933471679688, "global_step": 328035, "epoch": 1952} {"train_loss": -12.458176612854004, "global_step": 328036, "epoch": 1952} {"train_loss": -12.283660888671875, "global_step": 328037, "epoch": 1952} {"train_loss": -12.378265380859375, "global_step": 328038, "epoch": 1952} {"train_loss": -12.22313117980957, "global_step": 328039, "epoch": 1952} {"train_loss": -12.385222434997559, "global_step": 328040, "epoch": 1952} {"train_loss": -12.307836532592773, "global_step": 328041, "epoch": 1952} {"train_loss": -12.226595878601074, "global_step": 328042, "epoch": 1952} {"train_loss": -12.526374816894531, "global_step": 328043, "epoch": 1952} {"train_loss": -12.155951499938965, "global_step": 328044, "epoch": 1952} {"train_loss": -12.47199821472168, "global_step": 328045, "epoch": 1952} {"train_loss": -12.238386154174805, "global_step": 328046, "epoch": 1952} {"train_loss": -12.12835693359375, "global_step": 328047, "epoch": 1952} {"train_loss": -12.495784759521484, "global_step": 328048, "epoch": 1952} {"train_loss": -12.251458168029785, "global_step": 328049, "epoch": 1952} {"train_loss": -12.233646392822266, "global_step": 328050, "epoch": 1952} {"train_loss": -12.377527236938477, "global_step": 328051, "epoch": 1952} {"train_loss": -12.585606575012207, "global_step": 328052, "epoch": 1952} {"train_loss": -12.269037246704102, "global_step": 328053, "epoch": 1952} {"train_loss": -12.099278450012207, "global_step": 328054, "epoch": 1952} {"train_loss": -12.710739135742188, "global_step": 328055, "epoch": 1952} {"train_loss": -12.245019912719727, "global_step": 328056, "epoch": 1952} {"train_loss": -12.414008140563965, "global_step": 328057, "epoch": 1952} {"train_loss": -12.426458358764648, "global_step": 328058, "epoch": 1952} {"train_loss": -12.554994583129883, "global_step": 328059, "epoch": 1952} {"train_loss": -12.459321022033691, "global_step": 328060, "epoch": 1952} {"train_loss": -12.398547172546387, "global_step": 328061, "epoch": 1952} {"train_loss": -11.916341781616211, "global_step": 328062, "epoch": 1952} {"train_loss": -12.202693939208984, "global_step": 328063, "epoch": 1952} {"train_loss": -12.253719329833984, "global_step": 328064, "epoch": 1952} {"train_loss": -12.265422821044922, "global_step": 328065, "epoch": 1952} {"train_loss": -12.486747741699219, "global_step": 328066, "epoch": 1952} {"train_loss": -12.309986114501953, "global_step": 328067, "epoch": 1952} {"train_loss": -12.412353515625, "global_step": 328068, "epoch": 1952} {"train_loss": -12.198095321655273, "global_step": 328069, "epoch": 1952} {"train_loss": -11.997076034545898, "global_step": 328070, "epoch": 1952} {"train_loss": -12.636679649353027, "global_step": 328071, "epoch": 1952} {"train_loss": -12.242061614990234, "global_step": 328072, "epoch": 1952} {"train_loss": -12.405202865600586, "global_step": 328073, "epoch": 1952} {"train_loss": -12.377439498901367, "global_step": 328074, "epoch": 1952} {"train_loss": -11.997547149658203, "global_step": 328075, "epoch": 1952} {"train_loss": -12.059979438781738, "global_step": 328076, "epoch": 1952} {"train_loss": -12.525994300842285, "global_step": 328077, "epoch": 1952} {"train_loss": -12.07119083404541, "global_step": 328078, "epoch": 1952} {"train_loss": -12.111637115478516, "global_step": 328079, "epoch": 1952} {"train_loss": -12.122743606567383, "global_step": 328080, "epoch": 1952} {"train_loss": -12.501266479492188, "global_step": 328081, "epoch": 1952} {"train_loss": -11.923730850219727, "global_step": 328082, "epoch": 1952} {"train_loss": -12.681763648986816, "global_step": 328083, "epoch": 1952} {"train_loss": -12.111108779907227, "global_step": 328084, "epoch": 1952} {"train_loss": -12.553474426269531, "global_step": 328085, "epoch": 1952} {"train_loss": -11.936092376708984, "global_step": 328086, "epoch": 1952} {"train_loss": -12.711801528930664, "global_step": 328087, "epoch": 1952} {"train_loss": -12.185195922851562, "global_step": 328088, "epoch": 1952} {"train_loss": -12.436769485473633, "global_step": 328089, "epoch": 1952} {"train_loss": -12.291363716125488, "global_step": 328090, "epoch": 1952} {"train_loss": -12.567110061645508, "global_step": 328091, "epoch": 1952} {"train_loss": -12.357595443725586, "global_step": 328092, "epoch": 1952} {"train_loss": -12.349709510803223, "global_step": 328093, "epoch": 1952} {"train_loss": -12.315669059753418, "global_step": 328094, "epoch": 1952} {"train_loss": -12.238524436950684, "global_step": 328095, "epoch": 1952} {"train_loss": -11.535720825195312, "global_step": 328096, "epoch": 1952} {"train_loss": -12.461623191833496, "global_step": 328097, "epoch": 1952} {"train_loss": -12.615474700927734, "global_step": 328098, "epoch": 1952} {"train_loss": -12.1842041015625, "global_step": 328099, "epoch": 1952} {"train_loss": -12.493634223937988, "global_step": 328100, "epoch": 1952} {"train_loss": -12.285892486572266, "global_step": 328101, "epoch": 1952} {"train_loss": -12.223170280456543, "global_step": 328102, "epoch": 1952} {"train_loss": -11.865737699327015, "global_step": 328103, "epoch": 1952, "val_loss": 285075.4375} {"train_loss": -11.584077835083008, "global_step": 328104, "epoch": 1953} {"train_loss": -12.048187255859375, "global_step": 328105, "epoch": 1953} {"train_loss": -10.278953552246094, "global_step": 328106, "epoch": 1953} {"train_loss": -11.249387741088867, "global_step": 328107, "epoch": 1953} {"train_loss": -11.51064395904541, "global_step": 328108, "epoch": 1953} {"train_loss": -10.87146282196045, "global_step": 328109, "epoch": 1953} {"train_loss": -11.357515335083008, "global_step": 328110, "epoch": 1953} {"train_loss": -10.548306465148926, "global_step": 328111, "epoch": 1953} {"train_loss": -10.798072814941406, "global_step": 328112, "epoch": 1953} {"train_loss": -10.100038528442383, "global_step": 328113, "epoch": 1953} {"train_loss": -10.437176704406738, "global_step": 328114, "epoch": 1953} {"train_loss": -9.43548583984375, "global_step": 328115, "epoch": 1953} {"train_loss": -11.213207244873047, "global_step": 328116, "epoch": 1953} {"train_loss": -9.158260345458984, "global_step": 328117, "epoch": 1953} {"train_loss": -10.97652816772461, "global_step": 328118, "epoch": 1953} {"train_loss": -10.567225456237793, "global_step": 328119, "epoch": 1953} {"train_loss": -11.415128707885742, "global_step": 328120, "epoch": 1953} {"train_loss": -11.443134307861328, "global_step": 328121, "epoch": 1953} {"train_loss": -11.40163516998291, "global_step": 328122, "epoch": 1953} {"train_loss": -11.460787773132324, "global_step": 328123, "epoch": 1953} {"train_loss": -11.274250984191895, "global_step": 328124, "epoch": 1953} {"train_loss": -11.798686981201172, "global_step": 328125, "epoch": 1953} {"train_loss": -10.970968246459961, "global_step": 328126, "epoch": 1953} {"train_loss": -11.686982154846191, "global_step": 328127, "epoch": 1953} {"train_loss": -11.40536880493164, "global_step": 328128, "epoch": 1953} {"train_loss": -11.174019813537598, "global_step": 328129, "epoch": 1953} {"train_loss": -11.374988555908203, "global_step": 328130, "epoch": 1953} {"train_loss": -11.362003326416016, "global_step": 328131, "epoch": 1953} {"train_loss": -11.519502639770508, "global_step": 328132, "epoch": 1953} {"train_loss": -11.928522109985352, "global_step": 328133, "epoch": 1953} {"train_loss": -11.248395919799805, "global_step": 328134, "epoch": 1953} {"train_loss": -11.570262908935547, "global_step": 328135, "epoch": 1953} {"train_loss": -11.420233726501465, "global_step": 328136, "epoch": 1953} {"train_loss": -10.16030502319336, "global_step": 328137, "epoch": 1953} {"train_loss": -11.206900596618652, "global_step": 328138, "epoch": 1953} {"train_loss": -10.763826370239258, "global_step": 328139, "epoch": 1953} {"train_loss": -9.970592498779297, "global_step": 328140, "epoch": 1953} {"train_loss": -11.786638259887695, "global_step": 328141, "epoch": 1953} {"train_loss": -10.814363479614258, "global_step": 328142, "epoch": 1953} {"train_loss": -11.226661682128906, "global_step": 328143, "epoch": 1953} {"train_loss": -11.294305801391602, "global_step": 328144, "epoch": 1953} {"train_loss": -11.296274185180664, "global_step": 328145, "epoch": 1953} {"train_loss": -11.729707717895508, "global_step": 328146, "epoch": 1953} {"train_loss": -11.0616455078125, "global_step": 328147, "epoch": 1953} {"train_loss": -11.8561429977417, "global_step": 328148, "epoch": 1953} {"train_loss": -11.334453582763672, "global_step": 328149, "epoch": 1953} {"train_loss": -11.970466613769531, "global_step": 328150, "epoch": 1953} {"train_loss": -10.454078674316406, "global_step": 328151, "epoch": 1953} {"train_loss": -11.235872268676758, "global_step": 328152, "epoch": 1953} {"train_loss": -10.843722343444824, "global_step": 328153, "epoch": 1953} {"train_loss": -11.024435043334961, "global_step": 328154, "epoch": 1953} {"train_loss": -10.980124473571777, "global_step": 328155, "epoch": 1953} {"train_loss": -11.654994010925293, "global_step": 328156, "epoch": 1953} {"train_loss": -11.37290096282959, "global_step": 328157, "epoch": 1953} {"train_loss": -11.486343383789062, "global_step": 328158, "epoch": 1953} {"train_loss": -11.747965812683105, "global_step": 328159, "epoch": 1953} {"train_loss": -11.029228210449219, "global_step": 328160, "epoch": 1953} {"train_loss": -11.890674591064453, "global_step": 328161, "epoch": 1953} {"train_loss": -11.408027648925781, "global_step": 328162, "epoch": 1953} {"train_loss": -12.052120208740234, "global_step": 328163, "epoch": 1953} {"train_loss": -11.268630981445312, "global_step": 328164, "epoch": 1953} {"train_loss": -12.107559204101562, "global_step": 328165, "epoch": 1953} {"train_loss": -11.270214080810547, "global_step": 328166, "epoch": 1953} {"train_loss": -11.734073638916016, "global_step": 328167, "epoch": 1953} {"train_loss": -11.369874954223633, "global_step": 328168, "epoch": 1953} {"train_loss": -11.964582443237305, "global_step": 328169, "epoch": 1953} {"train_loss": -11.644905090332031, "global_step": 328170, "epoch": 1953} {"train_loss": -11.598278999328613, "global_step": 328171, "epoch": 1953} {"train_loss": -11.712791442871094, "global_step": 328172, "epoch": 1953} {"train_loss": -12.032768249511719, "global_step": 328173, "epoch": 1953} {"train_loss": -12.139779090881348, "global_step": 328174, "epoch": 1953} {"train_loss": -12.169337272644043, "global_step": 328175, "epoch": 1953} {"train_loss": -12.053389549255371, "global_step": 328176, "epoch": 1953} {"train_loss": -11.97816276550293, "global_step": 328177, "epoch": 1953} {"train_loss": -12.069023132324219, "global_step": 328178, "epoch": 1953} {"train_loss": -12.156187057495117, "global_step": 328179, "epoch": 1953} {"train_loss": -11.943258285522461, "global_step": 328180, "epoch": 1953} {"train_loss": -11.986120223999023, "global_step": 328181, "epoch": 1953} {"train_loss": -12.247848510742188, "global_step": 328182, "epoch": 1953} {"train_loss": -11.880712509155273, "global_step": 328183, "epoch": 1953} {"train_loss": -11.320206642150879, "global_step": 328184, "epoch": 1953} {"train_loss": -12.167284965515137, "global_step": 328185, "epoch": 1953} {"train_loss": -12.280966758728027, "global_step": 328186, "epoch": 1953} {"train_loss": -11.777412414550781, "global_step": 328187, "epoch": 1953} {"train_loss": -12.272172927856445, "global_step": 328188, "epoch": 1953} {"train_loss": -12.06606674194336, "global_step": 328189, "epoch": 1953} {"train_loss": -12.153993606567383, "global_step": 328190, "epoch": 1953} {"train_loss": -12.007640838623047, "global_step": 328191, "epoch": 1953} {"train_loss": -12.111661911010742, "global_step": 328192, "epoch": 1953} {"train_loss": -11.523831367492676, "global_step": 328193, "epoch": 1953} {"train_loss": -12.217214584350586, "global_step": 328194, "epoch": 1953} {"train_loss": -12.158098220825195, "global_step": 328195, "epoch": 1953} {"train_loss": -12.275753021240234, "global_step": 328196, "epoch": 1953} {"train_loss": -12.387473106384277, "global_step": 328197, "epoch": 1953} {"train_loss": -12.498798370361328, "global_step": 328198, "epoch": 1953} {"train_loss": -12.405579566955566, "global_step": 328199, "epoch": 1953} {"train_loss": -12.267437934875488, "global_step": 328200, "epoch": 1953} {"train_loss": -12.319847106933594, "global_step": 328201, "epoch": 1953} {"train_loss": -12.514057159423828, "global_step": 328202, "epoch": 1953} {"train_loss": -12.255109786987305, "global_step": 328203, "epoch": 1953} {"train_loss": -12.316905975341797, "global_step": 328204, "epoch": 1953} {"train_loss": -12.359087944030762, "global_step": 328205, "epoch": 1953} {"train_loss": -12.426496505737305, "global_step": 328206, "epoch": 1953} {"train_loss": -12.158855438232422, "global_step": 328207, "epoch": 1953} {"train_loss": -12.414813995361328, "global_step": 328208, "epoch": 1953} {"train_loss": -12.462688446044922, "global_step": 328209, "epoch": 1953} {"train_loss": -12.46595573425293, "global_step": 328210, "epoch": 1953} {"train_loss": -12.48000717163086, "global_step": 328211, "epoch": 1953} {"train_loss": -12.47182846069336, "global_step": 328212, "epoch": 1953} {"train_loss": -12.301424026489258, "global_step": 328213, "epoch": 1953} {"train_loss": -12.399600982666016, "global_step": 328214, "epoch": 1953} {"train_loss": -12.360149383544922, "global_step": 328215, "epoch": 1953} {"train_loss": -12.384258270263672, "global_step": 328216, "epoch": 1953} {"train_loss": -12.357257843017578, "global_step": 328217, "epoch": 1953} {"train_loss": -12.366598129272461, "global_step": 328218, "epoch": 1953} {"train_loss": -12.39995002746582, "global_step": 328219, "epoch": 1953} {"train_loss": -12.445406913757324, "global_step": 328220, "epoch": 1953} {"train_loss": -12.540759086608887, "global_step": 328221, "epoch": 1953} {"train_loss": -12.397029876708984, "global_step": 328222, "epoch": 1953} {"train_loss": -12.338345527648926, "global_step": 328223, "epoch": 1953} {"train_loss": -12.31639289855957, "global_step": 328224, "epoch": 1953} {"train_loss": -12.424185752868652, "global_step": 328225, "epoch": 1953} {"train_loss": -12.446098327636719, "global_step": 328226, "epoch": 1953} {"train_loss": -12.663982391357422, "global_step": 328227, "epoch": 1953} {"train_loss": -12.548151016235352, "global_step": 328228, "epoch": 1953} {"train_loss": -12.507152557373047, "global_step": 328229, "epoch": 1953} {"train_loss": -12.627620697021484, "global_step": 328230, "epoch": 1953} {"train_loss": -12.481369018554688, "global_step": 328231, "epoch": 1953} {"train_loss": -12.440736770629883, "global_step": 328232, "epoch": 1953} {"train_loss": -12.533036231994629, "global_step": 328233, "epoch": 1953} {"train_loss": -12.49886703491211, "global_step": 328234, "epoch": 1953} {"train_loss": -12.642802238464355, "global_step": 328235, "epoch": 1953} {"train_loss": -12.506591796875, "global_step": 328236, "epoch": 1953} {"train_loss": -12.442948341369629, "global_step": 328237, "epoch": 1953} {"train_loss": -12.571479797363281, "global_step": 328238, "epoch": 1953} {"train_loss": -11.852657318115234, "global_step": 328239, "epoch": 1953} {"train_loss": -11.861248016357422, "global_step": 328240, "epoch": 1953} {"train_loss": -12.525985717773438, "global_step": 328241, "epoch": 1953} {"train_loss": -11.672433853149414, "global_step": 328242, "epoch": 1953} {"train_loss": -11.693931579589844, "global_step": 328243, "epoch": 1953} {"train_loss": -12.373899459838867, "global_step": 328244, "epoch": 1953} {"train_loss": -12.581525802612305, "global_step": 328245, "epoch": 1953} {"train_loss": -11.892607688903809, "global_step": 328246, "epoch": 1953} {"train_loss": -12.626391410827637, "global_step": 328247, "epoch": 1953} {"train_loss": -12.342533111572266, "global_step": 328248, "epoch": 1953} {"train_loss": -12.691850662231445, "global_step": 328249, "epoch": 1953} {"train_loss": -12.41277027130127, "global_step": 328250, "epoch": 1953} {"train_loss": -12.382946014404297, "global_step": 328251, "epoch": 1953} {"train_loss": -12.384868621826172, "global_step": 328252, "epoch": 1953} {"train_loss": -12.530879974365234, "global_step": 328253, "epoch": 1953} {"train_loss": -12.442094802856445, "global_step": 328254, "epoch": 1953} {"train_loss": -12.389505386352539, "global_step": 328255, "epoch": 1953} {"train_loss": -12.362268447875977, "global_step": 328256, "epoch": 1953} {"train_loss": -12.306800842285156, "global_step": 328257, "epoch": 1953} {"train_loss": -12.545830726623535, "global_step": 328258, "epoch": 1953} {"train_loss": -12.616739273071289, "global_step": 328259, "epoch": 1953} {"train_loss": -12.383499145507812, "global_step": 328260, "epoch": 1953} {"train_loss": -12.723897933959961, "global_step": 328261, "epoch": 1953} {"train_loss": -12.398197174072266, "global_step": 328262, "epoch": 1953} {"train_loss": -12.64521312713623, "global_step": 328263, "epoch": 1953} {"train_loss": -12.756266593933105, "global_step": 328264, "epoch": 1953} {"train_loss": -12.41606330871582, "global_step": 328265, "epoch": 1953} {"train_loss": -12.374510765075684, "global_step": 328266, "epoch": 1953} {"train_loss": -12.469561576843262, "global_step": 328267, "epoch": 1953} {"train_loss": -12.201391220092773, "global_step": 328268, "epoch": 1953} {"train_loss": -12.378669738769531, "global_step": 328269, "epoch": 1953} {"train_loss": -12.334866523742676, "global_step": 328270, "epoch": 1953} {"train_loss": -11.86683838140397, "global_step": 328271, "epoch": 1953, "val_loss": 284106.1875} {"train_loss": -12.541862487792969, "global_step": 328272, "epoch": 1954} {"train_loss": -11.901224136352539, "global_step": 328273, "epoch": 1954} {"train_loss": -12.136390686035156, "global_step": 328274, "epoch": 1954} {"train_loss": -10.187273025512695, "global_step": 328275, "epoch": 1954} {"train_loss": -9.803659439086914, "global_step": 328276, "epoch": 1954} {"train_loss": -9.395410537719727, "global_step": 328277, "epoch": 1954} {"train_loss": -9.378267288208008, "global_step": 328278, "epoch": 1954} {"train_loss": -10.08236312866211, "global_step": 328279, "epoch": 1954} {"train_loss": -8.298760414123535, "global_step": 328280, "epoch": 1954} {"train_loss": -9.315861701965332, "global_step": 328281, "epoch": 1954} {"train_loss": -9.05671215057373, "global_step": 328282, "epoch": 1954} {"train_loss": -10.069103240966797, "global_step": 328283, "epoch": 1954} {"train_loss": -10.462118148803711, "global_step": 328284, "epoch": 1954} {"train_loss": -10.193897247314453, "global_step": 328285, "epoch": 1954} {"train_loss": -10.271275520324707, "global_step": 328286, "epoch": 1954} {"train_loss": -11.166614532470703, "global_step": 328287, "epoch": 1954} {"train_loss": -11.160677909851074, "global_step": 328288, "epoch": 1954} {"train_loss": -11.017683029174805, "global_step": 328289, "epoch": 1954} {"train_loss": -10.567449569702148, "global_step": 328290, "epoch": 1954} {"train_loss": -11.098286628723145, "global_step": 328291, "epoch": 1954} {"train_loss": -10.727863311767578, "global_step": 328292, "epoch": 1954} {"train_loss": -11.728238105773926, "global_step": 328293, "epoch": 1954} {"train_loss": -11.077518463134766, "global_step": 328294, "epoch": 1954} {"train_loss": -11.82577133178711, "global_step": 328295, "epoch": 1954} {"train_loss": -10.801645278930664, "global_step": 328296, "epoch": 1954} {"train_loss": -11.284736633300781, "global_step": 328297, "epoch": 1954} {"train_loss": -10.833415031433105, "global_step": 328298, "epoch": 1954} {"train_loss": -11.18478012084961, "global_step": 328299, "epoch": 1954} {"train_loss": -11.883405685424805, "global_step": 328300, "epoch": 1954} {"train_loss": -11.323890686035156, "global_step": 328301, "epoch": 1954} {"train_loss": -11.375727653503418, "global_step": 328302, "epoch": 1954} {"train_loss": -11.677542686462402, "global_step": 328303, "epoch": 1954} {"train_loss": -11.760575294494629, "global_step": 328304, "epoch": 1954} {"train_loss": -11.158007621765137, "global_step": 328305, "epoch": 1954} {"train_loss": -11.989474296569824, "global_step": 328306, "epoch": 1954} {"train_loss": -11.532785415649414, "global_step": 328307, "epoch": 1954} {"train_loss": -11.874174118041992, "global_step": 328308, "epoch": 1954} {"train_loss": -11.668558120727539, "global_step": 328309, "epoch": 1954} {"train_loss": -11.620903015136719, "global_step": 328310, "epoch": 1954} {"train_loss": -11.907608032226562, "global_step": 328311, "epoch": 1954} {"train_loss": -11.851524353027344, "global_step": 328312, "epoch": 1954} {"train_loss": -11.981012344360352, "global_step": 328313, "epoch": 1954} {"train_loss": -11.995646476745605, "global_step": 328314, "epoch": 1954} {"train_loss": -11.979703903198242, "global_step": 328315, "epoch": 1954} {"train_loss": -11.72779369354248, "global_step": 328316, "epoch": 1954} {"train_loss": -12.0224609375, "global_step": 328317, "epoch": 1954} {"train_loss": -11.799558639526367, "global_step": 328318, "epoch": 1954} {"train_loss": -12.01348876953125, "global_step": 328319, "epoch": 1954} {"train_loss": -12.14151668548584, "global_step": 328320, "epoch": 1954} {"train_loss": -12.19589614868164, "global_step": 328321, "epoch": 1954} {"train_loss": -11.986530303955078, "global_step": 328322, "epoch": 1954} {"train_loss": -12.174945831298828, "global_step": 328323, "epoch": 1954} {"train_loss": -12.268392562866211, "global_step": 328324, "epoch": 1954} {"train_loss": -11.883152961730957, "global_step": 328325, "epoch": 1954} {"train_loss": -12.281926155090332, "global_step": 328326, "epoch": 1954} {"train_loss": -12.185482025146484, "global_step": 328327, "epoch": 1954} {"train_loss": -12.23015022277832, "global_step": 328328, "epoch": 1954} {"train_loss": -12.090195655822754, "global_step": 328329, "epoch": 1954} {"train_loss": -12.113080978393555, "global_step": 328330, "epoch": 1954} {"train_loss": -12.309526443481445, "global_step": 328331, "epoch": 1954} {"train_loss": -12.433500289916992, "global_step": 328332, "epoch": 1954} {"train_loss": -12.435961723327637, "global_step": 328333, "epoch": 1954} {"train_loss": -12.530521392822266, "global_step": 328334, "epoch": 1954} {"train_loss": -12.345965385437012, "global_step": 328335, "epoch": 1954} {"train_loss": -12.579416275024414, "global_step": 328336, "epoch": 1954} {"train_loss": -12.365654945373535, "global_step": 328337, "epoch": 1954} {"train_loss": -12.514925956726074, "global_step": 328338, "epoch": 1954} {"train_loss": -12.591833114624023, "global_step": 328339, "epoch": 1954} {"train_loss": -12.508983612060547, "global_step": 328340, "epoch": 1954} {"train_loss": -12.323442459106445, "global_step": 328341, "epoch": 1954} {"train_loss": -12.458908081054688, "global_step": 328342, "epoch": 1954} {"train_loss": -12.307032585144043, "global_step": 328343, "epoch": 1954} {"train_loss": -12.240981101989746, "global_step": 328344, "epoch": 1954} {"train_loss": -12.391854286193848, "global_step": 328345, "epoch": 1954} {"train_loss": -12.17062759399414, "global_step": 328346, "epoch": 1954} {"train_loss": -12.455581665039062, "global_step": 328347, "epoch": 1954} {"train_loss": -12.455938339233398, "global_step": 328348, "epoch": 1954} {"train_loss": -12.393633842468262, "global_step": 328349, "epoch": 1954} {"train_loss": -12.04495620727539, "global_step": 328350, "epoch": 1954} {"train_loss": -12.20637035369873, "global_step": 328351, "epoch": 1954} {"train_loss": -12.181564331054688, "global_step": 328352, "epoch": 1954} {"train_loss": -11.976993560791016, "global_step": 328353, "epoch": 1954} {"train_loss": -12.31326675415039, "global_step": 328354, "epoch": 1954} {"train_loss": -11.276065826416016, "global_step": 328355, "epoch": 1954} {"train_loss": -10.244943618774414, "global_step": 328356, "epoch": 1954} {"train_loss": -12.174534797668457, "global_step": 328357, "epoch": 1954} {"train_loss": -11.277437210083008, "global_step": 328358, "epoch": 1954} {"train_loss": -10.705227851867676, "global_step": 328359, "epoch": 1954} {"train_loss": -11.512795448303223, "global_step": 328360, "epoch": 1954} {"train_loss": -11.736940383911133, "global_step": 328361, "epoch": 1954} {"train_loss": -11.460817337036133, "global_step": 328362, "epoch": 1954} {"train_loss": -11.49409008026123, "global_step": 328363, "epoch": 1954} {"train_loss": -12.08505630493164, "global_step": 328364, "epoch": 1954} {"train_loss": -10.747692108154297, "global_step": 328365, "epoch": 1954} {"train_loss": -11.553145408630371, "global_step": 328366, "epoch": 1954} {"train_loss": -10.128814697265625, "global_step": 328367, "epoch": 1954} {"train_loss": -10.16573715209961, "global_step": 328368, "epoch": 1954} {"train_loss": -11.547087669372559, "global_step": 328369, "epoch": 1954} {"train_loss": -10.028058052062988, "global_step": 328370, "epoch": 1954} {"train_loss": -11.925936698913574, "global_step": 328371, "epoch": 1954} {"train_loss": -11.212697982788086, "global_step": 328372, "epoch": 1954} {"train_loss": -11.376362800598145, "global_step": 328373, "epoch": 1954} {"train_loss": -11.974822998046875, "global_step": 328374, "epoch": 1954} {"train_loss": -11.133913040161133, "global_step": 328375, "epoch": 1954} {"train_loss": -11.9517822265625, "global_step": 328376, "epoch": 1954} {"train_loss": -11.556991577148438, "global_step": 328377, "epoch": 1954} {"train_loss": -12.11620044708252, "global_step": 328378, "epoch": 1954} {"train_loss": -11.34666919708252, "global_step": 328379, "epoch": 1954} {"train_loss": -11.437732696533203, "global_step": 328380, "epoch": 1954} {"train_loss": -11.596342086791992, "global_step": 328381, "epoch": 1954} {"train_loss": -11.33383560180664, "global_step": 328382, "epoch": 1954} {"train_loss": -12.107248306274414, "global_step": 328383, "epoch": 1954} {"train_loss": -11.64716911315918, "global_step": 328384, "epoch": 1954} {"train_loss": -11.925524711608887, "global_step": 328385, "epoch": 1954} {"train_loss": -11.922111511230469, "global_step": 328386, "epoch": 1954} {"train_loss": -11.552995681762695, "global_step": 328387, "epoch": 1954} {"train_loss": -11.990930557250977, "global_step": 328388, "epoch": 1954} {"train_loss": -11.426477432250977, "global_step": 328389, "epoch": 1954} {"train_loss": -12.008466720581055, "global_step": 328390, "epoch": 1954} {"train_loss": -11.922494888305664, "global_step": 328391, "epoch": 1954} {"train_loss": -11.869325637817383, "global_step": 328392, "epoch": 1954} {"train_loss": -12.01894760131836, "global_step": 328393, "epoch": 1954} {"train_loss": -11.542539596557617, "global_step": 328394, "epoch": 1954} {"train_loss": -12.044473648071289, "global_step": 328395, "epoch": 1954} {"train_loss": -11.549473762512207, "global_step": 328396, "epoch": 1954} {"train_loss": -11.608598709106445, "global_step": 328397, "epoch": 1954} {"train_loss": -12.248435020446777, "global_step": 328398, "epoch": 1954} {"train_loss": -11.854599952697754, "global_step": 328399, "epoch": 1954} {"train_loss": -12.114255905151367, "global_step": 328400, "epoch": 1954} {"train_loss": -11.963955879211426, "global_step": 328401, "epoch": 1954} {"train_loss": -12.059152603149414, "global_step": 328402, "epoch": 1954} {"train_loss": -12.16593074798584, "global_step": 328403, "epoch": 1954} {"train_loss": -12.14668083190918, "global_step": 328404, "epoch": 1954} {"train_loss": -11.881965637207031, "global_step": 328405, "epoch": 1954} {"train_loss": -12.050138473510742, "global_step": 328406, "epoch": 1954} {"train_loss": -12.371353149414062, "global_step": 328407, "epoch": 1954} {"train_loss": -12.339599609375, "global_step": 328408, "epoch": 1954} {"train_loss": -12.306480407714844, "global_step": 328409, "epoch": 1954} {"train_loss": -12.247156143188477, "global_step": 328410, "epoch": 1954} {"train_loss": -12.253559112548828, "global_step": 328411, "epoch": 1954} {"train_loss": -12.263463973999023, "global_step": 328412, "epoch": 1954} {"train_loss": -11.95326042175293, "global_step": 328413, "epoch": 1954} {"train_loss": -12.514801025390625, "global_step": 328414, "epoch": 1954} {"train_loss": -11.880688667297363, "global_step": 328415, "epoch": 1954} {"train_loss": -12.393418312072754, "global_step": 328416, "epoch": 1954} {"train_loss": -12.320842742919922, "global_step": 328417, "epoch": 1954} {"train_loss": -11.80936050415039, "global_step": 328418, "epoch": 1954} {"train_loss": -12.378721237182617, "global_step": 328419, "epoch": 1954} {"train_loss": -11.923318862915039, "global_step": 328420, "epoch": 1954} {"train_loss": -12.392391204833984, "global_step": 328421, "epoch": 1954} {"train_loss": -11.93863582611084, "global_step": 328422, "epoch": 1954} {"train_loss": -12.247915267944336, "global_step": 328423, "epoch": 1954} {"train_loss": -12.023386001586914, "global_step": 328424, "epoch": 1954} {"train_loss": -12.34315013885498, "global_step": 328425, "epoch": 1954} {"train_loss": -12.326613426208496, "global_step": 328426, "epoch": 1954} {"train_loss": -11.930814743041992, "global_step": 328427, "epoch": 1954} {"train_loss": -12.379902839660645, "global_step": 328428, "epoch": 1954} {"train_loss": -12.376338958740234, "global_step": 328429, "epoch": 1954} {"train_loss": -12.389022827148438, "global_step": 328430, "epoch": 1954} {"train_loss": -12.548412322998047, "global_step": 328431, "epoch": 1954} {"train_loss": -12.346033096313477, "global_step": 328432, "epoch": 1954} {"train_loss": -12.28083610534668, "global_step": 328433, "epoch": 1954} {"train_loss": -12.235452651977539, "global_step": 328434, "epoch": 1954} {"train_loss": -12.508756637573242, "global_step": 328435, "epoch": 1954} {"train_loss": -12.584342956542969, "global_step": 328436, "epoch": 1954} {"train_loss": -12.311901092529297, "global_step": 328437, "epoch": 1954} {"train_loss": -12.37985897064209, "global_step": 328438, "epoch": 1954} {"train_loss": -11.72678363890875, "global_step": 328439, "epoch": 1954, "val_loss": 287449.21875} {"train_loss": -12.096254348754883, "global_step": 328440, "epoch": 1955} {"train_loss": -11.889745712280273, "global_step": 328441, "epoch": 1955} {"train_loss": -11.764566421508789, "global_step": 328442, "epoch": 1955} {"train_loss": -12.363536834716797, "global_step": 328443, "epoch": 1955} {"train_loss": -12.060068130493164, "global_step": 328444, "epoch": 1955} {"train_loss": -12.190696716308594, "global_step": 328445, "epoch": 1955} {"train_loss": -12.00390625, "global_step": 328446, "epoch": 1955} {"train_loss": -12.165302276611328, "global_step": 328447, "epoch": 1955} {"train_loss": -11.829819679260254, "global_step": 328448, "epoch": 1955} {"train_loss": -11.886457443237305, "global_step": 328449, "epoch": 1955} {"train_loss": -11.171566009521484, "global_step": 328450, "epoch": 1955} {"train_loss": -11.542510986328125, "global_step": 328451, "epoch": 1955} {"train_loss": -11.614673614501953, "global_step": 328452, "epoch": 1955} {"train_loss": -11.951526641845703, "global_step": 328453, "epoch": 1955} {"train_loss": -11.276570320129395, "global_step": 328454, "epoch": 1955} {"train_loss": -11.997214317321777, "global_step": 328455, "epoch": 1955} {"train_loss": -11.94723129272461, "global_step": 328456, "epoch": 1955} {"train_loss": -11.608827590942383, "global_step": 328457, "epoch": 1955} {"train_loss": -12.409425735473633, "global_step": 328458, "epoch": 1955} {"train_loss": -12.026723861694336, "global_step": 328459, "epoch": 1955} {"train_loss": -11.598121643066406, "global_step": 328460, "epoch": 1955} {"train_loss": -12.091952323913574, "global_step": 328461, "epoch": 1955} {"train_loss": -11.893171310424805, "global_step": 328462, "epoch": 1955} {"train_loss": -11.711590766906738, "global_step": 328463, "epoch": 1955} {"train_loss": -11.88206672668457, "global_step": 328464, "epoch": 1955} {"train_loss": -12.016355514526367, "global_step": 328465, "epoch": 1955} {"train_loss": -11.552343368530273, "global_step": 328466, "epoch": 1955} {"train_loss": -12.10474967956543, "global_step": 328467, "epoch": 1955} {"train_loss": -12.124237060546875, "global_step": 328468, "epoch": 1955} {"train_loss": -12.131149291992188, "global_step": 328469, "epoch": 1955} {"train_loss": -12.291687965393066, "global_step": 328470, "epoch": 1955} {"train_loss": -12.1643705368042, "global_step": 328471, "epoch": 1955} {"train_loss": -11.923417091369629, "global_step": 328472, "epoch": 1955} {"train_loss": -12.158147811889648, "global_step": 328473, "epoch": 1955} {"train_loss": -11.98034381866455, "global_step": 328474, "epoch": 1955} {"train_loss": -11.57888412475586, "global_step": 328475, "epoch": 1955} {"train_loss": -12.160027503967285, "global_step": 328476, "epoch": 1955} {"train_loss": -11.769020080566406, "global_step": 328477, "epoch": 1955} {"train_loss": -11.56386947631836, "global_step": 328478, "epoch": 1955} {"train_loss": -12.04025650024414, "global_step": 328479, "epoch": 1955} {"train_loss": -11.55016040802002, "global_step": 328480, "epoch": 1955} {"train_loss": -11.516863822937012, "global_step": 328481, "epoch": 1955} {"train_loss": -12.304794311523438, "global_step": 328482, "epoch": 1955} {"train_loss": -11.262960433959961, "global_step": 328483, "epoch": 1955} {"train_loss": -11.605039596557617, "global_step": 328484, "epoch": 1955} {"train_loss": -12.247093200683594, "global_step": 328485, "epoch": 1955} {"train_loss": -12.175467491149902, "global_step": 328486, "epoch": 1955} {"train_loss": -11.21990966796875, "global_step": 328487, "epoch": 1955} {"train_loss": -12.430163383483887, "global_step": 328488, "epoch": 1955} {"train_loss": -11.457351684570312, "global_step": 328489, "epoch": 1955} {"train_loss": -12.205804824829102, "global_step": 328490, "epoch": 1955} {"train_loss": -11.676801681518555, "global_step": 328491, "epoch": 1955} {"train_loss": -11.872953414916992, "global_step": 328492, "epoch": 1955} {"train_loss": -11.810916900634766, "global_step": 328493, "epoch": 1955} {"train_loss": -11.704622268676758, "global_step": 328494, "epoch": 1955} {"train_loss": -11.367900848388672, "global_step": 328495, "epoch": 1955} {"train_loss": -12.190681457519531, "global_step": 328496, "epoch": 1955} {"train_loss": -11.709163665771484, "global_step": 328497, "epoch": 1955} {"train_loss": -12.106035232543945, "global_step": 328498, "epoch": 1955} {"train_loss": -11.918878555297852, "global_step": 328499, "epoch": 1955} {"train_loss": -12.035637855529785, "global_step": 328500, "epoch": 1955} {"train_loss": -11.731229782104492, "global_step": 328501, "epoch": 1955} {"train_loss": -12.080815315246582, "global_step": 328502, "epoch": 1955} {"train_loss": -12.2010498046875, "global_step": 328503, "epoch": 1955} {"train_loss": -11.957963943481445, "global_step": 328504, "epoch": 1955} {"train_loss": -12.265586853027344, "global_step": 328505, "epoch": 1955} {"train_loss": -12.314155578613281, "global_step": 328506, "epoch": 1955} {"train_loss": -12.373427391052246, "global_step": 328507, "epoch": 1955} {"train_loss": -12.202716827392578, "global_step": 328508, "epoch": 1955} {"train_loss": -12.297083854675293, "global_step": 328509, "epoch": 1955} {"train_loss": -12.489279747009277, "global_step": 328510, "epoch": 1955} {"train_loss": -12.48534107208252, "global_step": 328511, "epoch": 1955} {"train_loss": -12.530485153198242, "global_step": 328512, "epoch": 1955} {"train_loss": -12.209756851196289, "global_step": 328513, "epoch": 1955} {"train_loss": -12.29836654663086, "global_step": 328514, "epoch": 1955} {"train_loss": -12.297266006469727, "global_step": 328515, "epoch": 1955} {"train_loss": -12.126319885253906, "global_step": 328516, "epoch": 1955} {"train_loss": -12.193400382995605, "global_step": 328517, "epoch": 1955} {"train_loss": -12.380393981933594, "global_step": 328518, "epoch": 1955} {"train_loss": -11.98004150390625, "global_step": 328519, "epoch": 1955} {"train_loss": -12.449942588806152, "global_step": 328520, "epoch": 1955} {"train_loss": -12.391862869262695, "global_step": 328521, "epoch": 1955} {"train_loss": -12.371112823486328, "global_step": 328522, "epoch": 1955} {"train_loss": -12.244872093200684, "global_step": 328523, "epoch": 1955} {"train_loss": -12.270708084106445, "global_step": 328524, "epoch": 1955} {"train_loss": -12.110154151916504, "global_step": 328525, "epoch": 1955} {"train_loss": -12.105070114135742, "global_step": 328526, "epoch": 1955} {"train_loss": -12.207978248596191, "global_step": 328527, "epoch": 1955} {"train_loss": -12.238632202148438, "global_step": 328528, "epoch": 1955} {"train_loss": -12.33462905883789, "global_step": 328529, "epoch": 1955} {"train_loss": -11.120208740234375, "global_step": 328530, "epoch": 1955} {"train_loss": -12.30650520324707, "global_step": 328531, "epoch": 1955} {"train_loss": -12.212855339050293, "global_step": 328532, "epoch": 1955} {"train_loss": -12.039188385009766, "global_step": 328533, "epoch": 1955} {"train_loss": -12.24905776977539, "global_step": 328534, "epoch": 1955} {"train_loss": -12.413961410522461, "global_step": 328535, "epoch": 1955} {"train_loss": -12.228904724121094, "global_step": 328536, "epoch": 1955} {"train_loss": -12.251794815063477, "global_step": 328537, "epoch": 1955} {"train_loss": -12.21101188659668, "global_step": 328538, "epoch": 1955} {"train_loss": -12.06689453125, "global_step": 328539, "epoch": 1955} {"train_loss": -12.433237075805664, "global_step": 328540, "epoch": 1955} {"train_loss": -11.670812606811523, "global_step": 328541, "epoch": 1955} {"train_loss": -11.70041561126709, "global_step": 328542, "epoch": 1955} {"train_loss": -12.113235473632812, "global_step": 328543, "epoch": 1955} {"train_loss": -12.24135684967041, "global_step": 328544, "epoch": 1955} {"train_loss": -11.523496627807617, "global_step": 328545, "epoch": 1955} {"train_loss": -11.636770248413086, "global_step": 328546, "epoch": 1955} {"train_loss": -12.120441436767578, "global_step": 328547, "epoch": 1955} {"train_loss": -12.227712631225586, "global_step": 328548, "epoch": 1955} {"train_loss": -12.143896102905273, "global_step": 328549, "epoch": 1955} {"train_loss": -12.003610610961914, "global_step": 328550, "epoch": 1955} {"train_loss": -12.380340576171875, "global_step": 328551, "epoch": 1955} {"train_loss": -11.977300643920898, "global_step": 328552, "epoch": 1955} {"train_loss": -11.947450637817383, "global_step": 328553, "epoch": 1955} {"train_loss": -12.154973983764648, "global_step": 328554, "epoch": 1955} {"train_loss": -12.032963752746582, "global_step": 328555, "epoch": 1955} {"train_loss": -11.828304290771484, "global_step": 328556, "epoch": 1955} {"train_loss": -12.097930908203125, "global_step": 328557, "epoch": 1955} {"train_loss": -12.31944465637207, "global_step": 328558, "epoch": 1955} {"train_loss": -12.402884483337402, "global_step": 328559, "epoch": 1955} {"train_loss": -12.261364936828613, "global_step": 328560, "epoch": 1955} {"train_loss": -12.459060668945312, "global_step": 328561, "epoch": 1955} {"train_loss": -12.465312004089355, "global_step": 328562, "epoch": 1955} {"train_loss": -12.56302261352539, "global_step": 328563, "epoch": 1955} {"train_loss": -12.44959545135498, "global_step": 328564, "epoch": 1955} {"train_loss": -12.442174911499023, "global_step": 328565, "epoch": 1955} {"train_loss": -12.24817180633545, "global_step": 328566, "epoch": 1955} {"train_loss": -12.731374740600586, "global_step": 328567, "epoch": 1955} {"train_loss": -12.524767875671387, "global_step": 328568, "epoch": 1955} {"train_loss": -12.59377670288086, "global_step": 328569, "epoch": 1955} {"train_loss": -12.568341255187988, "global_step": 328570, "epoch": 1955} {"train_loss": -12.672103881835938, "global_step": 328571, "epoch": 1955} {"train_loss": -12.40292739868164, "global_step": 328572, "epoch": 1955} {"train_loss": -12.639176368713379, "global_step": 328573, "epoch": 1955} {"train_loss": -12.426834106445312, "global_step": 328574, "epoch": 1955} {"train_loss": -12.609173774719238, "global_step": 328575, "epoch": 1955} {"train_loss": -12.390549659729004, "global_step": 328576, "epoch": 1955} {"train_loss": -12.521684646606445, "global_step": 328577, "epoch": 1955} {"train_loss": -12.343476295471191, "global_step": 328578, "epoch": 1955} {"train_loss": -12.552453994750977, "global_step": 328579, "epoch": 1955} {"train_loss": -12.654533386230469, "global_step": 328580, "epoch": 1955} {"train_loss": -12.399810791015625, "global_step": 328581, "epoch": 1955} {"train_loss": -11.921791076660156, "global_step": 328582, "epoch": 1955} {"train_loss": -11.882174491882324, "global_step": 328583, "epoch": 1955} {"train_loss": -11.557519912719727, "global_step": 328584, "epoch": 1955} {"train_loss": -12.560789108276367, "global_step": 328585, "epoch": 1955} {"train_loss": -12.367838859558105, "global_step": 328586, "epoch": 1955} {"train_loss": -11.835140228271484, "global_step": 328587, "epoch": 1955} {"train_loss": -12.00920295715332, "global_step": 328588, "epoch": 1955} {"train_loss": -12.191276550292969, "global_step": 328589, "epoch": 1955} {"train_loss": -12.48676872253418, "global_step": 328590, "epoch": 1955} {"train_loss": -12.44333267211914, "global_step": 328591, "epoch": 1955} {"train_loss": -12.451017379760742, "global_step": 328592, "epoch": 1955} {"train_loss": -12.030941009521484, "global_step": 328593, "epoch": 1955} {"train_loss": -11.831494331359863, "global_step": 328594, "epoch": 1955} {"train_loss": -11.621241569519043, "global_step": 328595, "epoch": 1955} {"train_loss": -11.170549392700195, "global_step": 328596, "epoch": 1955} {"train_loss": -10.270153045654297, "global_step": 328597, "epoch": 1955} {"train_loss": -8.906524658203125, "global_step": 328598, "epoch": 1955} {"train_loss": -11.035860061645508, "global_step": 328599, "epoch": 1955} {"train_loss": -9.58539867401123, "global_step": 328600, "epoch": 1955} {"train_loss": -8.299901962280273, "global_step": 328601, "epoch": 1955} {"train_loss": -8.718420028686523, "global_step": 328602, "epoch": 1955} {"train_loss": -9.494620323181152, "global_step": 328603, "epoch": 1955} {"train_loss": -9.957219123840332, "global_step": 328604, "epoch": 1955} {"train_loss": -8.390920639038086, "global_step": 328605, "epoch": 1955} {"train_loss": -9.17909049987793, "global_step": 328606, "epoch": 1955} {"train_loss": -11.913080005418687, "global_step": 328607, "epoch": 1955, "val_loss": 284313.5625, "train_action_mse_error": 1.6494108438491821} {"train_loss": -9.122995376586914, "global_step": 328608, "epoch": 1956} {"train_loss": -8.388056755065918, "global_step": 328609, "epoch": 1956} {"train_loss": -9.239104270935059, "global_step": 328610, "epoch": 1956} {"train_loss": -10.470979690551758, "global_step": 328611, "epoch": 1956} {"train_loss": -8.822921752929688, "global_step": 328612, "epoch": 1956} {"train_loss": -8.292669296264648, "global_step": 328613, "epoch": 1956} {"train_loss": -8.246371269226074, "global_step": 328614, "epoch": 1956} {"train_loss": -8.627185821533203, "global_step": 328615, "epoch": 1956} {"train_loss": -9.150426864624023, "global_step": 328616, "epoch": 1956} {"train_loss": -9.891071319580078, "global_step": 328617, "epoch": 1956} {"train_loss": -9.773406982421875, "global_step": 328618, "epoch": 1956} {"train_loss": -9.005895614624023, "global_step": 328619, "epoch": 1956} {"train_loss": -9.336505889892578, "global_step": 328620, "epoch": 1956} {"train_loss": -10.32540512084961, "global_step": 328621, "epoch": 1956} {"train_loss": -9.443168640136719, "global_step": 328622, "epoch": 1956} {"train_loss": -10.134808540344238, "global_step": 328623, "epoch": 1956} {"train_loss": -8.946155548095703, "global_step": 328624, "epoch": 1956} {"train_loss": -10.436004638671875, "global_step": 328625, "epoch": 1956} {"train_loss": -10.363147735595703, "global_step": 328626, "epoch": 1956} {"train_loss": -10.423069953918457, "global_step": 328627, "epoch": 1956} {"train_loss": -10.973506927490234, "global_step": 328628, "epoch": 1956} {"train_loss": -11.195960998535156, "global_step": 328629, "epoch": 1956} {"train_loss": -10.933916091918945, "global_step": 328630, "epoch": 1956} {"train_loss": -10.75095272064209, "global_step": 328631, "epoch": 1956} {"train_loss": -11.319856643676758, "global_step": 328632, "epoch": 1956} {"train_loss": -11.075471878051758, "global_step": 328633, "epoch": 1956} {"train_loss": -10.471673965454102, "global_step": 328634, "epoch": 1956} {"train_loss": -11.732967376708984, "global_step": 328635, "epoch": 1956} {"train_loss": -11.158218383789062, "global_step": 328636, "epoch": 1956} {"train_loss": -11.885143280029297, "global_step": 328637, "epoch": 1956} {"train_loss": -11.386940002441406, "global_step": 328638, "epoch": 1956} {"train_loss": -11.742721557617188, "global_step": 328639, "epoch": 1956} {"train_loss": -11.578116416931152, "global_step": 328640, "epoch": 1956} {"train_loss": -11.600460052490234, "global_step": 328641, "epoch": 1956} {"train_loss": -11.813175201416016, "global_step": 328642, "epoch": 1956} {"train_loss": -11.87789535522461, "global_step": 328643, "epoch": 1956} {"train_loss": -11.613767623901367, "global_step": 328644, "epoch": 1956} {"train_loss": -12.103435516357422, "global_step": 328645, "epoch": 1956} {"train_loss": -11.912393569946289, "global_step": 328646, "epoch": 1956} {"train_loss": -11.997800827026367, "global_step": 328647, "epoch": 1956} {"train_loss": -11.773189544677734, "global_step": 328648, "epoch": 1956} {"train_loss": -11.949728012084961, "global_step": 328649, "epoch": 1956} {"train_loss": -11.96895694732666, "global_step": 328650, "epoch": 1956} {"train_loss": -11.624380111694336, "global_step": 328651, "epoch": 1956} {"train_loss": -12.11207103729248, "global_step": 328652, "epoch": 1956} {"train_loss": -11.684157371520996, "global_step": 328653, "epoch": 1956} {"train_loss": -12.047496795654297, "global_step": 328654, "epoch": 1956} {"train_loss": -11.778719902038574, "global_step": 328655, "epoch": 1956} {"train_loss": -12.008477210998535, "global_step": 328656, "epoch": 1956} {"train_loss": -12.00822639465332, "global_step": 328657, "epoch": 1956} {"train_loss": -12.003691673278809, "global_step": 328658, "epoch": 1956} {"train_loss": -11.900402069091797, "global_step": 328659, "epoch": 1956} {"train_loss": -11.879181861877441, "global_step": 328660, "epoch": 1956} {"train_loss": -11.923622131347656, "global_step": 328661, "epoch": 1956} {"train_loss": -11.795747756958008, "global_step": 328662, "epoch": 1956} {"train_loss": -12.06629753112793, "global_step": 328663, "epoch": 1956} {"train_loss": -11.939952850341797, "global_step": 328664, "epoch": 1956} {"train_loss": -12.14187240600586, "global_step": 328665, "epoch": 1956} {"train_loss": -12.130186080932617, "global_step": 328666, "epoch": 1956} {"train_loss": -12.277496337890625, "global_step": 328667, "epoch": 1956} {"train_loss": -11.909294128417969, "global_step": 328668, "epoch": 1956} {"train_loss": -12.146968841552734, "global_step": 328669, "epoch": 1956} {"train_loss": -11.948001861572266, "global_step": 328670, "epoch": 1956} {"train_loss": -11.934289932250977, "global_step": 328671, "epoch": 1956} {"train_loss": -12.060615539550781, "global_step": 328672, "epoch": 1956} {"train_loss": -12.239057540893555, "global_step": 328673, "epoch": 1956} {"train_loss": -12.121152877807617, "global_step": 328674, "epoch": 1956} {"train_loss": -12.170690536499023, "global_step": 328675, "epoch": 1956} {"train_loss": -12.115029335021973, "global_step": 328676, "epoch": 1956} {"train_loss": -12.28037166595459, "global_step": 328677, "epoch": 1956} {"train_loss": -11.800832748413086, "global_step": 328678, "epoch": 1956} {"train_loss": -12.202566146850586, "global_step": 328679, "epoch": 1956} {"train_loss": -11.957189559936523, "global_step": 328680, "epoch": 1956} {"train_loss": -11.672551155090332, "global_step": 328681, "epoch": 1956} {"train_loss": -11.822815895080566, "global_step": 328682, "epoch": 1956} {"train_loss": -11.466423034667969, "global_step": 328683, "epoch": 1956} {"train_loss": -10.691510200500488, "global_step": 328684, "epoch": 1956} {"train_loss": -10.180656433105469, "global_step": 328685, "epoch": 1956} {"train_loss": -11.21939754486084, "global_step": 328686, "epoch": 1956} {"train_loss": -10.616439819335938, "global_step": 328687, "epoch": 1956} {"train_loss": -10.766572952270508, "global_step": 328688, "epoch": 1956} {"train_loss": -11.117877960205078, "global_step": 328689, "epoch": 1956} {"train_loss": -10.620953559875488, "global_step": 328690, "epoch": 1956} {"train_loss": -11.818796157836914, "global_step": 328691, "epoch": 1956} {"train_loss": -11.143397331237793, "global_step": 328692, "epoch": 1956} {"train_loss": -11.804999351501465, "global_step": 328693, "epoch": 1956} {"train_loss": -11.869619369506836, "global_step": 328694, "epoch": 1956} {"train_loss": -11.465734481811523, "global_step": 328695, "epoch": 1956} {"train_loss": -11.978459358215332, "global_step": 328696, "epoch": 1956} {"train_loss": -11.299081802368164, "global_step": 328697, "epoch": 1956} {"train_loss": -12.020376205444336, "global_step": 328698, "epoch": 1956} {"train_loss": -11.327162742614746, "global_step": 328699, "epoch": 1956} {"train_loss": -11.71389389038086, "global_step": 328700, "epoch": 1956} {"train_loss": -11.909170150756836, "global_step": 328701, "epoch": 1956} {"train_loss": -11.176586151123047, "global_step": 328702, "epoch": 1956} {"train_loss": -11.924485206604004, "global_step": 328703, "epoch": 1956} {"train_loss": -10.921674728393555, "global_step": 328704, "epoch": 1956} {"train_loss": -12.051071166992188, "global_step": 328705, "epoch": 1956} {"train_loss": -12.004127502441406, "global_step": 328706, "epoch": 1956} {"train_loss": -11.345516204833984, "global_step": 328707, "epoch": 1956} {"train_loss": -11.889975547790527, "global_step": 328708, "epoch": 1956} {"train_loss": -11.461114883422852, "global_step": 328709, "epoch": 1956} {"train_loss": -11.648672103881836, "global_step": 328710, "epoch": 1956} {"train_loss": -11.52692985534668, "global_step": 328711, "epoch": 1956} {"train_loss": -11.676591873168945, "global_step": 328712, "epoch": 1956} {"train_loss": -11.821636199951172, "global_step": 328713, "epoch": 1956} {"train_loss": -11.673162460327148, "global_step": 328714, "epoch": 1956} {"train_loss": -12.261553764343262, "global_step": 328715, "epoch": 1956} {"train_loss": -11.801664352416992, "global_step": 328716, "epoch": 1956} {"train_loss": -12.318696975708008, "global_step": 328717, "epoch": 1956} {"train_loss": -11.987616539001465, "global_step": 328718, "epoch": 1956} {"train_loss": -12.019109725952148, "global_step": 328719, "epoch": 1956} {"train_loss": -12.379988670349121, "global_step": 328720, "epoch": 1956} {"train_loss": -12.178862571716309, "global_step": 328721, "epoch": 1956} {"train_loss": -12.20556640625, "global_step": 328722, "epoch": 1956} {"train_loss": -12.324837684631348, "global_step": 328723, "epoch": 1956} {"train_loss": -12.059953689575195, "global_step": 328724, "epoch": 1956} {"train_loss": -12.337327003479004, "global_step": 328725, "epoch": 1956} {"train_loss": -12.110677719116211, "global_step": 328726, "epoch": 1956} {"train_loss": -12.061149597167969, "global_step": 328727, "epoch": 1956} {"train_loss": -12.244363784790039, "global_step": 328728, "epoch": 1956} {"train_loss": -12.210796356201172, "global_step": 328729, "epoch": 1956} {"train_loss": -12.086814880371094, "global_step": 328730, "epoch": 1956} {"train_loss": -12.35260009765625, "global_step": 328731, "epoch": 1956} {"train_loss": -12.130248069763184, "global_step": 328732, "epoch": 1956} {"train_loss": -12.311017036437988, "global_step": 328733, "epoch": 1956} {"train_loss": -12.391593933105469, "global_step": 328734, "epoch": 1956} {"train_loss": -12.224676132202148, "global_step": 328735, "epoch": 1956} {"train_loss": -12.496391296386719, "global_step": 328736, "epoch": 1956} {"train_loss": -12.447553634643555, "global_step": 328737, "epoch": 1956} {"train_loss": -12.468096733093262, "global_step": 328738, "epoch": 1956} {"train_loss": -12.569087982177734, "global_step": 328739, "epoch": 1956} {"train_loss": -12.47251033782959, "global_step": 328740, "epoch": 1956} {"train_loss": -12.454679489135742, "global_step": 328741, "epoch": 1956} {"train_loss": -12.370135307312012, "global_step": 328742, "epoch": 1956} {"train_loss": -12.327486038208008, "global_step": 328743, "epoch": 1956} {"train_loss": -12.497560501098633, "global_step": 328744, "epoch": 1956} {"train_loss": -12.514758110046387, "global_step": 328745, "epoch": 1956} {"train_loss": -12.346454620361328, "global_step": 328746, "epoch": 1956} {"train_loss": -12.644021034240723, "global_step": 328747, "epoch": 1956} {"train_loss": -12.413125991821289, "global_step": 328748, "epoch": 1956} {"train_loss": -12.303800582885742, "global_step": 328749, "epoch": 1956} {"train_loss": -12.555859565734863, "global_step": 328750, "epoch": 1956} {"train_loss": -12.344954490661621, "global_step": 328751, "epoch": 1956} {"train_loss": -12.57539176940918, "global_step": 328752, "epoch": 1956} {"train_loss": -12.685966491699219, "global_step": 328753, "epoch": 1956} {"train_loss": -12.657411575317383, "global_step": 328754, "epoch": 1956} {"train_loss": -12.443174362182617, "global_step": 328755, "epoch": 1956} {"train_loss": -12.552827835083008, "global_step": 328756, "epoch": 1956} {"train_loss": -12.673702239990234, "global_step": 328757, "epoch": 1956} {"train_loss": -12.550607681274414, "global_step": 328758, "epoch": 1956} {"train_loss": -12.580078125, "global_step": 328759, "epoch": 1956} {"train_loss": -12.55016803741455, "global_step": 328760, "epoch": 1956} {"train_loss": -12.666297912597656, "global_step": 328761, "epoch": 1956} {"train_loss": -12.722360610961914, "global_step": 328762, "epoch": 1956} {"train_loss": -12.751412391662598, "global_step": 328763, "epoch": 1956} {"train_loss": -12.709673881530762, "global_step": 328764, "epoch": 1956} {"train_loss": -12.785250663757324, "global_step": 328765, "epoch": 1956} {"train_loss": -12.700636863708496, "global_step": 328766, "epoch": 1956} {"train_loss": -12.771743774414062, "global_step": 328767, "epoch": 1956} {"train_loss": -12.695449829101562, "global_step": 328768, "epoch": 1956} {"train_loss": -12.777384757995605, "global_step": 328769, "epoch": 1956} {"train_loss": -12.42495059967041, "global_step": 328770, "epoch": 1956} {"train_loss": -12.499296188354492, "global_step": 328771, "epoch": 1956} {"train_loss": -12.820804595947266, "global_step": 328772, "epoch": 1956} {"train_loss": -12.66567611694336, "global_step": 328773, "epoch": 1956} {"train_loss": -12.84626579284668, "global_step": 328774, "epoch": 1956} {"train_loss": -11.67860339936756, "global_step": 328775, "epoch": 1956, "val_loss": 288445.34375} {"train_loss": -12.501413345336914, "global_step": 328776, "epoch": 1957} {"train_loss": -12.45173168182373, "global_step": 328777, "epoch": 1957} {"train_loss": -12.487613677978516, "global_step": 328778, "epoch": 1957} {"train_loss": -12.741678237915039, "global_step": 328779, "epoch": 1957} {"train_loss": -12.724093437194824, "global_step": 328780, "epoch": 1957} {"train_loss": -12.376960754394531, "global_step": 328781, "epoch": 1957} {"train_loss": -12.760976791381836, "global_step": 328782, "epoch": 1957} {"train_loss": -12.572650909423828, "global_step": 328783, "epoch": 1957} {"train_loss": -12.678144454956055, "global_step": 328784, "epoch": 1957} {"train_loss": -12.667641639709473, "global_step": 328785, "epoch": 1957} {"train_loss": -12.625693321228027, "global_step": 328786, "epoch": 1957} {"train_loss": -12.58616828918457, "global_step": 328787, "epoch": 1957} {"train_loss": -12.105403900146484, "global_step": 328788, "epoch": 1957} {"train_loss": -12.237966537475586, "global_step": 328789, "epoch": 1957} {"train_loss": -11.786279678344727, "global_step": 328790, "epoch": 1957} {"train_loss": -12.279712677001953, "global_step": 328791, "epoch": 1957} {"train_loss": -11.416504859924316, "global_step": 328792, "epoch": 1957} {"train_loss": -11.176261901855469, "global_step": 328793, "epoch": 1957} {"train_loss": -10.815979957580566, "global_step": 328794, "epoch": 1957} {"train_loss": -11.575431823730469, "global_step": 328795, "epoch": 1957} {"train_loss": -10.013888359069824, "global_step": 328796, "epoch": 1957} {"train_loss": -10.097311019897461, "global_step": 328797, "epoch": 1957} {"train_loss": -12.377822875976562, "global_step": 328798, "epoch": 1957} {"train_loss": -8.848000526428223, "global_step": 328799, "epoch": 1957} {"train_loss": -11.088354110717773, "global_step": 328800, "epoch": 1957} {"train_loss": -10.682941436767578, "global_step": 328801, "epoch": 1957} {"train_loss": -10.513466835021973, "global_step": 328802, "epoch": 1957} {"train_loss": -11.38542652130127, "global_step": 328803, "epoch": 1957} {"train_loss": -11.859565734863281, "global_step": 328804, "epoch": 1957} {"train_loss": -11.263101577758789, "global_step": 328805, "epoch": 1957} {"train_loss": -11.766828536987305, "global_step": 328806, "epoch": 1957} {"train_loss": -11.32023811340332, "global_step": 328807, "epoch": 1957} {"train_loss": -10.60818862915039, "global_step": 328808, "epoch": 1957} {"train_loss": -11.281259536743164, "global_step": 328809, "epoch": 1957} {"train_loss": -11.791780471801758, "global_step": 328810, "epoch": 1957} {"train_loss": -11.241825103759766, "global_step": 328811, "epoch": 1957} {"train_loss": -11.937219619750977, "global_step": 328812, "epoch": 1957} {"train_loss": -12.306818008422852, "global_step": 328813, "epoch": 1957} {"train_loss": -11.035778045654297, "global_step": 328814, "epoch": 1957} {"train_loss": -11.796836853027344, "global_step": 328815, "epoch": 1957} {"train_loss": -10.578598976135254, "global_step": 328816, "epoch": 1957} {"train_loss": -10.655891418457031, "global_step": 328817, "epoch": 1957} {"train_loss": -11.011642456054688, "global_step": 328818, "epoch": 1957} {"train_loss": -11.119452476501465, "global_step": 328819, "epoch": 1957} {"train_loss": -10.1964111328125, "global_step": 328820, "epoch": 1957} {"train_loss": -11.596372604370117, "global_step": 328821, "epoch": 1957} {"train_loss": -10.898393630981445, "global_step": 328822, "epoch": 1957} {"train_loss": -11.623542785644531, "global_step": 328823, "epoch": 1957} {"train_loss": -11.327476501464844, "global_step": 328824, "epoch": 1957} {"train_loss": -11.484210968017578, "global_step": 328825, "epoch": 1957} {"train_loss": -12.16093921661377, "global_step": 328826, "epoch": 1957} {"train_loss": -11.41592788696289, "global_step": 328827, "epoch": 1957} {"train_loss": -12.033794403076172, "global_step": 328828, "epoch": 1957} {"train_loss": -11.386720657348633, "global_step": 328829, "epoch": 1957} {"train_loss": -11.819347381591797, "global_step": 328830, "epoch": 1957} {"train_loss": -11.570425987243652, "global_step": 328831, "epoch": 1957} {"train_loss": -11.905402183532715, "global_step": 328832, "epoch": 1957} {"train_loss": -11.647941589355469, "global_step": 328833, "epoch": 1957} {"train_loss": -11.455690383911133, "global_step": 328834, "epoch": 1957} {"train_loss": -11.612274169921875, "global_step": 328835, "epoch": 1957} {"train_loss": -11.593297958374023, "global_step": 328836, "epoch": 1957} {"train_loss": -11.746783256530762, "global_step": 328837, "epoch": 1957} {"train_loss": -11.035400390625, "global_step": 328838, "epoch": 1957} {"train_loss": -11.056081771850586, "global_step": 328839, "epoch": 1957} {"train_loss": -11.482237815856934, "global_step": 328840, "epoch": 1957} {"train_loss": -11.702125549316406, "global_step": 328841, "epoch": 1957} {"train_loss": -11.867376327514648, "global_step": 328842, "epoch": 1957} {"train_loss": -11.331809043884277, "global_step": 328843, "epoch": 1957} {"train_loss": -11.714215278625488, "global_step": 328844, "epoch": 1957} {"train_loss": -11.649303436279297, "global_step": 328845, "epoch": 1957} {"train_loss": -11.362588882446289, "global_step": 328846, "epoch": 1957} {"train_loss": -12.069015502929688, "global_step": 328847, "epoch": 1957} {"train_loss": -11.706037521362305, "global_step": 328848, "epoch": 1957} {"train_loss": -12.191068649291992, "global_step": 328849, "epoch": 1957} {"train_loss": -11.64356803894043, "global_step": 328850, "epoch": 1957} {"train_loss": -11.863343238830566, "global_step": 328851, "epoch": 1957} {"train_loss": -11.714430809020996, "global_step": 328852, "epoch": 1957} {"train_loss": -11.793715476989746, "global_step": 328853, "epoch": 1957} {"train_loss": -11.63551139831543, "global_step": 328854, "epoch": 1957} {"train_loss": -11.60580825805664, "global_step": 328855, "epoch": 1957} {"train_loss": -11.658299446105957, "global_step": 328856, "epoch": 1957} {"train_loss": -12.070757865905762, "global_step": 328857, "epoch": 1957} {"train_loss": -12.14006519317627, "global_step": 328858, "epoch": 1957} {"train_loss": -11.875710487365723, "global_step": 328859, "epoch": 1957} {"train_loss": -11.631673812866211, "global_step": 328860, "epoch": 1957} {"train_loss": -11.56856918334961, "global_step": 328861, "epoch": 1957} {"train_loss": -12.010917663574219, "global_step": 328862, "epoch": 1957} {"train_loss": -11.861120223999023, "global_step": 328863, "epoch": 1957} {"train_loss": -11.794840812683105, "global_step": 328864, "epoch": 1957} {"train_loss": -11.773796081542969, "global_step": 328865, "epoch": 1957} {"train_loss": -11.891851425170898, "global_step": 328866, "epoch": 1957} {"train_loss": -11.771081924438477, "global_step": 328867, "epoch": 1957} {"train_loss": -11.87271499633789, "global_step": 328868, "epoch": 1957} {"train_loss": -11.263873100280762, "global_step": 328869, "epoch": 1957} {"train_loss": -11.490882873535156, "global_step": 328870, "epoch": 1957} {"train_loss": -10.492817878723145, "global_step": 328871, "epoch": 1957} {"train_loss": -12.26957893371582, "global_step": 328872, "epoch": 1957} {"train_loss": -11.08997917175293, "global_step": 328873, "epoch": 1957} {"train_loss": -11.731407165527344, "global_step": 328874, "epoch": 1957} {"train_loss": -11.77176284790039, "global_step": 328875, "epoch": 1957} {"train_loss": -11.204219818115234, "global_step": 328876, "epoch": 1957} {"train_loss": -12.000040054321289, "global_step": 328877, "epoch": 1957} {"train_loss": -11.56829833984375, "global_step": 328878, "epoch": 1957} {"train_loss": -12.157474517822266, "global_step": 328879, "epoch": 1957} {"train_loss": -11.356685638427734, "global_step": 328880, "epoch": 1957} {"train_loss": -12.161675453186035, "global_step": 328881, "epoch": 1957} {"train_loss": -10.99840259552002, "global_step": 328882, "epoch": 1957} {"train_loss": -11.750288009643555, "global_step": 328883, "epoch": 1957} {"train_loss": -11.778249740600586, "global_step": 328884, "epoch": 1957} {"train_loss": -11.853218078613281, "global_step": 328885, "epoch": 1957} {"train_loss": -12.29123592376709, "global_step": 328886, "epoch": 1957} {"train_loss": -11.951570510864258, "global_step": 328887, "epoch": 1957} {"train_loss": -12.128551483154297, "global_step": 328888, "epoch": 1957} {"train_loss": -12.194879531860352, "global_step": 328889, "epoch": 1957} {"train_loss": -12.287349700927734, "global_step": 328890, "epoch": 1957} {"train_loss": -12.172839164733887, "global_step": 328891, "epoch": 1957} {"train_loss": -12.341302871704102, "global_step": 328892, "epoch": 1957} {"train_loss": -12.242294311523438, "global_step": 328893, "epoch": 1957} {"train_loss": -12.303168296813965, "global_step": 328894, "epoch": 1957} {"train_loss": -12.293266296386719, "global_step": 328895, "epoch": 1957} {"train_loss": -12.229427337646484, "global_step": 328896, "epoch": 1957} {"train_loss": -12.245477676391602, "global_step": 328897, "epoch": 1957} {"train_loss": -11.977523803710938, "global_step": 328898, "epoch": 1957} {"train_loss": -12.25296401977539, "global_step": 328899, "epoch": 1957} {"train_loss": -12.546534538269043, "global_step": 328900, "epoch": 1957} {"train_loss": -12.500255584716797, "global_step": 328901, "epoch": 1957} {"train_loss": -12.248800277709961, "global_step": 328902, "epoch": 1957} {"train_loss": -12.291189193725586, "global_step": 328903, "epoch": 1957} {"train_loss": -12.417732238769531, "global_step": 328904, "epoch": 1957} {"train_loss": -12.4810791015625, "global_step": 328905, "epoch": 1957} {"train_loss": -12.38375473022461, "global_step": 328906, "epoch": 1957} {"train_loss": -12.203496932983398, "global_step": 328907, "epoch": 1957} {"train_loss": -12.509498596191406, "global_step": 328908, "epoch": 1957} {"train_loss": -12.282322883605957, "global_step": 328909, "epoch": 1957} {"train_loss": -12.38039779663086, "global_step": 328910, "epoch": 1957} {"train_loss": -12.304161071777344, "global_step": 328911, "epoch": 1957} {"train_loss": -12.446033477783203, "global_step": 328912, "epoch": 1957} {"train_loss": -12.327749252319336, "global_step": 328913, "epoch": 1957} {"train_loss": -12.30270004272461, "global_step": 328914, "epoch": 1957} {"train_loss": -12.480226516723633, "global_step": 328915, "epoch": 1957} {"train_loss": -12.549846649169922, "global_step": 328916, "epoch": 1957} {"train_loss": -12.441914558410645, "global_step": 328917, "epoch": 1957} {"train_loss": -12.448701858520508, "global_step": 328918, "epoch": 1957} {"train_loss": -12.51070785522461, "global_step": 328919, "epoch": 1957} {"train_loss": -12.502470016479492, "global_step": 328920, "epoch": 1957} {"train_loss": -12.525851249694824, "global_step": 328921, "epoch": 1957} {"train_loss": -12.49388313293457, "global_step": 328922, "epoch": 1957} {"train_loss": -12.467757225036621, "global_step": 328923, "epoch": 1957} {"train_loss": -12.431940078735352, "global_step": 328924, "epoch": 1957} {"train_loss": -12.553239822387695, "global_step": 328925, "epoch": 1957} {"train_loss": -12.550637245178223, "global_step": 328926, "epoch": 1957} {"train_loss": -12.661598205566406, "global_step": 328927, "epoch": 1957} {"train_loss": -12.636150360107422, "global_step": 328928, "epoch": 1957} {"train_loss": -12.7672758102417, "global_step": 328929, "epoch": 1957} {"train_loss": -12.63058090209961, "global_step": 328930, "epoch": 1957} {"train_loss": -12.494356155395508, "global_step": 328931, "epoch": 1957} {"train_loss": -12.740835189819336, "global_step": 328932, "epoch": 1957} {"train_loss": -12.62894344329834, "global_step": 328933, "epoch": 1957} {"train_loss": -12.802642822265625, "global_step": 328934, "epoch": 1957} {"train_loss": -12.676599502563477, "global_step": 328935, "epoch": 1957} {"train_loss": -12.442567825317383, "global_step": 328936, "epoch": 1957} {"train_loss": -12.296268463134766, "global_step": 328937, "epoch": 1957} {"train_loss": -12.206557273864746, "global_step": 328938, "epoch": 1957} {"train_loss": -11.957696914672852, "global_step": 328939, "epoch": 1957} {"train_loss": -12.255462646484375, "global_step": 328940, "epoch": 1957} {"train_loss": -12.374744415283203, "global_step": 328941, "epoch": 1957} {"train_loss": -12.413847923278809, "global_step": 328942, "epoch": 1957} {"train_loss": -11.889643135524931, "global_step": 328943, "epoch": 1957, "val_loss": 287427.65625} {"train_loss": -12.718334197998047, "global_step": 328944, "epoch": 1958} {"train_loss": -12.107715606689453, "global_step": 328945, "epoch": 1958} {"train_loss": -11.019783020019531, "global_step": 328946, "epoch": 1958} {"train_loss": -11.08997917175293, "global_step": 328947, "epoch": 1958} {"train_loss": -11.758917808532715, "global_step": 328948, "epoch": 1958} {"train_loss": -11.703325271606445, "global_step": 328949, "epoch": 1958} {"train_loss": -11.459390640258789, "global_step": 328950, "epoch": 1958} {"train_loss": -11.734851837158203, "global_step": 328951, "epoch": 1958} {"train_loss": -11.033373832702637, "global_step": 328952, "epoch": 1958} {"train_loss": -11.315213203430176, "global_step": 328953, "epoch": 1958} {"train_loss": -11.862883567810059, "global_step": 328954, "epoch": 1958} {"train_loss": -11.541007995605469, "global_step": 328955, "epoch": 1958} {"train_loss": -10.484949111938477, "global_step": 328956, "epoch": 1958} {"train_loss": -11.960794448852539, "global_step": 328957, "epoch": 1958} {"train_loss": -9.798036575317383, "global_step": 328958, "epoch": 1958} {"train_loss": -11.712796211242676, "global_step": 328959, "epoch": 1958} {"train_loss": -8.820722579956055, "global_step": 328960, "epoch": 1958} {"train_loss": -9.0946626663208, "global_step": 328961, "epoch": 1958} {"train_loss": -11.938087463378906, "global_step": 328962, "epoch": 1958} {"train_loss": -9.579986572265625, "global_step": 328963, "epoch": 1958} {"train_loss": -11.470834732055664, "global_step": 328964, "epoch": 1958} {"train_loss": -11.473493576049805, "global_step": 328965, "epoch": 1958} {"train_loss": -10.9334716796875, "global_step": 328966, "epoch": 1958} {"train_loss": -11.39296817779541, "global_step": 328967, "epoch": 1958} {"train_loss": -11.434334754943848, "global_step": 328968, "epoch": 1958} {"train_loss": -11.97774887084961, "global_step": 328969, "epoch": 1958} {"train_loss": -11.787074089050293, "global_step": 328970, "epoch": 1958} {"train_loss": -11.76095199584961, "global_step": 328971, "epoch": 1958} {"train_loss": -11.742677688598633, "global_step": 328972, "epoch": 1958} {"train_loss": -11.508317947387695, "global_step": 328973, "epoch": 1958} {"train_loss": -11.589727401733398, "global_step": 328974, "epoch": 1958} {"train_loss": -11.603301048278809, "global_step": 328975, "epoch": 1958} {"train_loss": -11.694377899169922, "global_step": 328976, "epoch": 1958} {"train_loss": -11.737611770629883, "global_step": 328977, "epoch": 1958} {"train_loss": -11.778840065002441, "global_step": 328978, "epoch": 1958} {"train_loss": -11.686590194702148, "global_step": 328979, "epoch": 1958} {"train_loss": -11.162917137145996, "global_step": 328980, "epoch": 1958} {"train_loss": -12.32895278930664, "global_step": 328981, "epoch": 1958} {"train_loss": -11.19237995147705, "global_step": 328982, "epoch": 1958} {"train_loss": -11.70404052734375, "global_step": 328983, "epoch": 1958} {"train_loss": -11.748373985290527, "global_step": 328984, "epoch": 1958} {"train_loss": -12.042708396911621, "global_step": 328985, "epoch": 1958} {"train_loss": -11.782697677612305, "global_step": 328986, "epoch": 1958} {"train_loss": -11.615400314331055, "global_step": 328987, "epoch": 1958} {"train_loss": -12.159709930419922, "global_step": 328988, "epoch": 1958} {"train_loss": -12.037900924682617, "global_step": 328989, "epoch": 1958} {"train_loss": -11.873584747314453, "global_step": 328990, "epoch": 1958} {"train_loss": -12.257808685302734, "global_step": 328991, "epoch": 1958} {"train_loss": -11.972220420837402, "global_step": 328992, "epoch": 1958} {"train_loss": -12.241172790527344, "global_step": 328993, "epoch": 1958} {"train_loss": -12.321849822998047, "global_step": 328994, "epoch": 1958} {"train_loss": -12.128080368041992, "global_step": 328995, "epoch": 1958} {"train_loss": -12.312559127807617, "global_step": 328996, "epoch": 1958} {"train_loss": -12.24934196472168, "global_step": 328997, "epoch": 1958} {"train_loss": -12.15235710144043, "global_step": 328998, "epoch": 1958} {"train_loss": -12.20219898223877, "global_step": 328999, "epoch": 1958} {"train_loss": -12.450040817260742, "global_step": 329000, "epoch": 1958} {"train_loss": -12.166482925415039, "global_step": 329001, "epoch": 1958} {"train_loss": -12.40915584564209, "global_step": 329002, "epoch": 1958} {"train_loss": -12.062700271606445, "global_step": 329003, "epoch": 1958} {"train_loss": -12.354012489318848, "global_step": 329004, "epoch": 1958} {"train_loss": -12.328380584716797, "global_step": 329005, "epoch": 1958} {"train_loss": -12.373753547668457, "global_step": 329006, "epoch": 1958} {"train_loss": -12.245858192443848, "global_step": 329007, "epoch": 1958} {"train_loss": -12.37299633026123, "global_step": 329008, "epoch": 1958} {"train_loss": -12.156805038452148, "global_step": 329009, "epoch": 1958} {"train_loss": -12.027549743652344, "global_step": 329010, "epoch": 1958} {"train_loss": -12.02995777130127, "global_step": 329011, "epoch": 1958} {"train_loss": -12.215042114257812, "global_step": 329012, "epoch": 1958} {"train_loss": -11.93619155883789, "global_step": 329013, "epoch": 1958} {"train_loss": -12.387939453125, "global_step": 329014, "epoch": 1958} {"train_loss": -12.206908226013184, "global_step": 329015, "epoch": 1958} {"train_loss": -12.057562828063965, "global_step": 329016, "epoch": 1958} {"train_loss": -11.781654357910156, "global_step": 329017, "epoch": 1958} {"train_loss": -11.971633911132812, "global_step": 329018, "epoch": 1958} {"train_loss": -12.132802963256836, "global_step": 329019, "epoch": 1958} {"train_loss": -11.711867332458496, "global_step": 329020, "epoch": 1958} {"train_loss": -12.052325248718262, "global_step": 329021, "epoch": 1958} {"train_loss": -12.305587768554688, "global_step": 329022, "epoch": 1958} {"train_loss": -12.215582847595215, "global_step": 329023, "epoch": 1958} {"train_loss": -12.32232666015625, "global_step": 329024, "epoch": 1958} {"train_loss": -12.237257957458496, "global_step": 329025, "epoch": 1958} {"train_loss": -12.34792709350586, "global_step": 329026, "epoch": 1958} {"train_loss": -11.96051025390625, "global_step": 329027, "epoch": 1958} {"train_loss": -12.637386322021484, "global_step": 329028, "epoch": 1958} {"train_loss": -12.435945510864258, "global_step": 329029, "epoch": 1958} {"train_loss": -12.389081954956055, "global_step": 329030, "epoch": 1958} {"train_loss": -12.395793914794922, "global_step": 329031, "epoch": 1958} {"train_loss": -12.338834762573242, "global_step": 329032, "epoch": 1958} {"train_loss": -12.311580657958984, "global_step": 329033, "epoch": 1958} {"train_loss": -12.069559097290039, "global_step": 329034, "epoch": 1958} {"train_loss": -12.282818794250488, "global_step": 329035, "epoch": 1958} {"train_loss": -12.314353942871094, "global_step": 329036, "epoch": 1958} {"train_loss": -11.928730010986328, "global_step": 329037, "epoch": 1958} {"train_loss": -12.562665939331055, "global_step": 329038, "epoch": 1958} {"train_loss": -11.850641250610352, "global_step": 329039, "epoch": 1958} {"train_loss": -12.206064224243164, "global_step": 329040, "epoch": 1958} {"train_loss": -11.956123352050781, "global_step": 329041, "epoch": 1958} {"train_loss": -12.494794845581055, "global_step": 329042, "epoch": 1958} {"train_loss": -12.013250350952148, "global_step": 329043, "epoch": 1958} {"train_loss": -11.410831451416016, "global_step": 329044, "epoch": 1958} {"train_loss": -11.559015274047852, "global_step": 329045, "epoch": 1958} {"train_loss": -12.428410530090332, "global_step": 329046, "epoch": 1958} {"train_loss": -11.639113426208496, "global_step": 329047, "epoch": 1958} {"train_loss": -12.249218940734863, "global_step": 329048, "epoch": 1958} {"train_loss": -12.11463737487793, "global_step": 329049, "epoch": 1958} {"train_loss": -12.31732177734375, "global_step": 329050, "epoch": 1958} {"train_loss": -12.223711967468262, "global_step": 329051, "epoch": 1958} {"train_loss": -12.12080192565918, "global_step": 329052, "epoch": 1958} {"train_loss": -11.92963981628418, "global_step": 329053, "epoch": 1958} {"train_loss": -11.838333129882812, "global_step": 329054, "epoch": 1958} {"train_loss": -11.598134994506836, "global_step": 329055, "epoch": 1958} {"train_loss": -10.420365333557129, "global_step": 329056, "epoch": 1958} {"train_loss": -11.799447059631348, "global_step": 329057, "epoch": 1958} {"train_loss": -11.403091430664062, "global_step": 329058, "epoch": 1958} {"train_loss": -11.839292526245117, "global_step": 329059, "epoch": 1958} {"train_loss": -11.84695053100586, "global_step": 329060, "epoch": 1958} {"train_loss": -11.967146873474121, "global_step": 329061, "epoch": 1958} {"train_loss": -11.953025817871094, "global_step": 329062, "epoch": 1958} {"train_loss": -11.340270042419434, "global_step": 329063, "epoch": 1958} {"train_loss": -12.422393798828125, "global_step": 329064, "epoch": 1958} {"train_loss": -11.92254638671875, "global_step": 329065, "epoch": 1958} {"train_loss": -12.319269180297852, "global_step": 329066, "epoch": 1958} {"train_loss": -11.758586883544922, "global_step": 329067, "epoch": 1958} {"train_loss": -12.152263641357422, "global_step": 329068, "epoch": 1958} {"train_loss": -11.952339172363281, "global_step": 329069, "epoch": 1958} {"train_loss": -12.515332221984863, "global_step": 329070, "epoch": 1958} {"train_loss": -12.153388977050781, "global_step": 329071, "epoch": 1958} {"train_loss": -12.166065216064453, "global_step": 329072, "epoch": 1958} {"train_loss": -11.984406471252441, "global_step": 329073, "epoch": 1958} {"train_loss": -12.165374755859375, "global_step": 329074, "epoch": 1958} {"train_loss": -11.795872688293457, "global_step": 329075, "epoch": 1958} {"train_loss": -11.925291061401367, "global_step": 329076, "epoch": 1958} {"train_loss": -11.895411491394043, "global_step": 329077, "epoch": 1958} {"train_loss": -12.29861831665039, "global_step": 329078, "epoch": 1958} {"train_loss": -12.112222671508789, "global_step": 329079, "epoch": 1958} {"train_loss": -12.016674041748047, "global_step": 329080, "epoch": 1958} {"train_loss": -11.84370231628418, "global_step": 329081, "epoch": 1958} {"train_loss": -12.142355918884277, "global_step": 329082, "epoch": 1958} {"train_loss": -11.756303787231445, "global_step": 329083, "epoch": 1958} {"train_loss": -11.347939491271973, "global_step": 329084, "epoch": 1958} {"train_loss": -12.275936126708984, "global_step": 329085, "epoch": 1958} {"train_loss": -11.657017707824707, "global_step": 329086, "epoch": 1958} {"train_loss": -11.339071273803711, "global_step": 329087, "epoch": 1958} {"train_loss": -11.769227981567383, "global_step": 329088, "epoch": 1958} {"train_loss": -11.815343856811523, "global_step": 329089, "epoch": 1958} {"train_loss": -11.652761459350586, "global_step": 329090, "epoch": 1958} {"train_loss": -12.136032104492188, "global_step": 329091, "epoch": 1958} {"train_loss": -11.303902626037598, "global_step": 329092, "epoch": 1958} {"train_loss": -12.377781867980957, "global_step": 329093, "epoch": 1958} {"train_loss": -11.17176628112793, "global_step": 329094, "epoch": 1958} {"train_loss": -12.136177062988281, "global_step": 329095, "epoch": 1958} {"train_loss": -12.061424255371094, "global_step": 329096, "epoch": 1958} {"train_loss": -11.717071533203125, "global_step": 329097, "epoch": 1958} {"train_loss": -12.487297058105469, "global_step": 329098, "epoch": 1958} {"train_loss": -11.679058074951172, "global_step": 329099, "epoch": 1958} {"train_loss": -11.940872192382812, "global_step": 329100, "epoch": 1958} {"train_loss": -12.19083309173584, "global_step": 329101, "epoch": 1958} {"train_loss": -11.38485050201416, "global_step": 329102, "epoch": 1958} {"train_loss": -12.436052322387695, "global_step": 329103, "epoch": 1958} {"train_loss": -11.258891105651855, "global_step": 329104, "epoch": 1958} {"train_loss": -11.672204971313477, "global_step": 329105, "epoch": 1958} {"train_loss": -12.179634094238281, "global_step": 329106, "epoch": 1958} {"train_loss": -11.303672790527344, "global_step": 329107, "epoch": 1958} {"train_loss": -12.115665435791016, "global_step": 329108, "epoch": 1958} {"train_loss": -11.372989654541016, "global_step": 329109, "epoch": 1958} {"train_loss": -12.35250473022461, "global_step": 329110, "epoch": 1958} {"train_loss": -11.863565354120164, "global_step": 329111, "epoch": 1958, "val_loss": 286966.78125} {"train_loss": -11.85286808013916, "global_step": 329112, "epoch": 1959} {"train_loss": -11.811060905456543, "global_step": 329113, "epoch": 1959} {"train_loss": -11.810717582702637, "global_step": 329114, "epoch": 1959} {"train_loss": -11.988256454467773, "global_step": 329115, "epoch": 1959} {"train_loss": -12.048439979553223, "global_step": 329116, "epoch": 1959} {"train_loss": -12.205978393554688, "global_step": 329117, "epoch": 1959} {"train_loss": -12.200531959533691, "global_step": 329118, "epoch": 1959} {"train_loss": -12.41391372680664, "global_step": 329119, "epoch": 1959} {"train_loss": -12.221999168395996, "global_step": 329120, "epoch": 1959} {"train_loss": -12.489734649658203, "global_step": 329121, "epoch": 1959} {"train_loss": -12.487163543701172, "global_step": 329122, "epoch": 1959} {"train_loss": -12.21153450012207, "global_step": 329123, "epoch": 1959} {"train_loss": -12.498781204223633, "global_step": 329124, "epoch": 1959} {"train_loss": -12.580550193786621, "global_step": 329125, "epoch": 1959} {"train_loss": -12.36661148071289, "global_step": 329126, "epoch": 1959} {"train_loss": -12.101611137390137, "global_step": 329127, "epoch": 1959} {"train_loss": -12.056968688964844, "global_step": 329128, "epoch": 1959} {"train_loss": -12.474087715148926, "global_step": 329129, "epoch": 1959} {"train_loss": -12.23337173461914, "global_step": 329130, "epoch": 1959} {"train_loss": -12.240900039672852, "global_step": 329131, "epoch": 1959} {"train_loss": -12.272991180419922, "global_step": 329132, "epoch": 1959} {"train_loss": -12.077310562133789, "global_step": 329133, "epoch": 1959} {"train_loss": -12.404644966125488, "global_step": 329134, "epoch": 1959} {"train_loss": -12.02513599395752, "global_step": 329135, "epoch": 1959} {"train_loss": -12.329177856445312, "global_step": 329136, "epoch": 1959} {"train_loss": -12.52874755859375, "global_step": 329137, "epoch": 1959} {"train_loss": -12.252071380615234, "global_step": 329138, "epoch": 1959} {"train_loss": -12.506708145141602, "global_step": 329139, "epoch": 1959} {"train_loss": -12.18847942352295, "global_step": 329140, "epoch": 1959} {"train_loss": -12.458425521850586, "global_step": 329141, "epoch": 1959} {"train_loss": -12.51319694519043, "global_step": 329142, "epoch": 1959} {"train_loss": -12.426797866821289, "global_step": 329143, "epoch": 1959} {"train_loss": -12.309952735900879, "global_step": 329144, "epoch": 1959} {"train_loss": -12.287456512451172, "global_step": 329145, "epoch": 1959} {"train_loss": -12.330717086791992, "global_step": 329146, "epoch": 1959} {"train_loss": -12.38259506225586, "global_step": 329147, "epoch": 1959} {"train_loss": -12.395901679992676, "global_step": 329148, "epoch": 1959} {"train_loss": -12.303583145141602, "global_step": 329149, "epoch": 1959} {"train_loss": -12.413461685180664, "global_step": 329150, "epoch": 1959} {"train_loss": -12.54141616821289, "global_step": 329151, "epoch": 1959} {"train_loss": -12.4912109375, "global_step": 329152, "epoch": 1959} {"train_loss": -12.24193000793457, "global_step": 329153, "epoch": 1959} {"train_loss": -12.47203254699707, "global_step": 329154, "epoch": 1959} {"train_loss": -12.489227294921875, "global_step": 329155, "epoch": 1959} {"train_loss": -12.300224304199219, "global_step": 329156, "epoch": 1959} {"train_loss": -11.923282623291016, "global_step": 329157, "epoch": 1959} {"train_loss": -12.553043365478516, "global_step": 329158, "epoch": 1959} {"train_loss": -12.533699035644531, "global_step": 329159, "epoch": 1959} {"train_loss": -12.04508113861084, "global_step": 329160, "epoch": 1959} {"train_loss": -12.002065658569336, "global_step": 329161, "epoch": 1959} {"train_loss": -11.80709457397461, "global_step": 329162, "epoch": 1959} {"train_loss": -11.786910057067871, "global_step": 329163, "epoch": 1959} {"train_loss": -12.383430480957031, "global_step": 329164, "epoch": 1959} {"train_loss": -12.070396423339844, "global_step": 329165, "epoch": 1959} {"train_loss": -11.773792266845703, "global_step": 329166, "epoch": 1959} {"train_loss": -12.167985916137695, "global_step": 329167, "epoch": 1959} {"train_loss": -12.512739181518555, "global_step": 329168, "epoch": 1959} {"train_loss": -12.04176139831543, "global_step": 329169, "epoch": 1959} {"train_loss": -12.429927825927734, "global_step": 329170, "epoch": 1959} {"train_loss": -12.023958206176758, "global_step": 329171, "epoch": 1959} {"train_loss": -12.423786163330078, "global_step": 329172, "epoch": 1959} {"train_loss": -11.786884307861328, "global_step": 329173, "epoch": 1959} {"train_loss": -12.195731163024902, "global_step": 329174, "epoch": 1959} {"train_loss": -12.190498352050781, "global_step": 329175, "epoch": 1959} {"train_loss": -12.088628768920898, "global_step": 329176, "epoch": 1959} {"train_loss": -12.375297546386719, "global_step": 329177, "epoch": 1959} {"train_loss": -11.591850280761719, "global_step": 329178, "epoch": 1959} {"train_loss": -12.265640258789062, "global_step": 329179, "epoch": 1959} {"train_loss": -12.259291648864746, "global_step": 329180, "epoch": 1959} {"train_loss": -11.797645568847656, "global_step": 329181, "epoch": 1959} {"train_loss": -11.951898574829102, "global_step": 329182, "epoch": 1959} {"train_loss": -12.256526947021484, "global_step": 329183, "epoch": 1959} {"train_loss": -11.959678649902344, "global_step": 329184, "epoch": 1959} {"train_loss": -12.622685432434082, "global_step": 329185, "epoch": 1959} {"train_loss": -12.226743698120117, "global_step": 329186, "epoch": 1959} {"train_loss": -12.056665420532227, "global_step": 329187, "epoch": 1959} {"train_loss": -12.522209167480469, "global_step": 329188, "epoch": 1959} {"train_loss": -12.354742050170898, "global_step": 329189, "epoch": 1959} {"train_loss": -12.223812103271484, "global_step": 329190, "epoch": 1959} {"train_loss": -12.204747200012207, "global_step": 329191, "epoch": 1959} {"train_loss": -12.496360778808594, "global_step": 329192, "epoch": 1959} {"train_loss": -12.348637580871582, "global_step": 329193, "epoch": 1959} {"train_loss": -12.091169357299805, "global_step": 329194, "epoch": 1959} {"train_loss": -12.261714935302734, "global_step": 329195, "epoch": 1959} {"train_loss": -12.34337043762207, "global_step": 329196, "epoch": 1959} {"train_loss": -12.338872909545898, "global_step": 329197, "epoch": 1959} {"train_loss": -11.35226821899414, "global_step": 329198, "epoch": 1959} {"train_loss": -12.251507759094238, "global_step": 329199, "epoch": 1959} {"train_loss": -12.224599838256836, "global_step": 329200, "epoch": 1959} {"train_loss": -12.266044616699219, "global_step": 329201, "epoch": 1959} {"train_loss": -12.111895561218262, "global_step": 329202, "epoch": 1959} {"train_loss": -12.482686996459961, "global_step": 329203, "epoch": 1959} {"train_loss": -12.261869430541992, "global_step": 329204, "epoch": 1959} {"train_loss": -11.790602684020996, "global_step": 329205, "epoch": 1959} {"train_loss": -11.902511596679688, "global_step": 329206, "epoch": 1959} {"train_loss": -11.655731201171875, "global_step": 329207, "epoch": 1959} {"train_loss": -11.710915565490723, "global_step": 329208, "epoch": 1959} {"train_loss": -11.599298477172852, "global_step": 329209, "epoch": 1959} {"train_loss": -10.82918930053711, "global_step": 329210, "epoch": 1959} {"train_loss": -11.080549240112305, "global_step": 329211, "epoch": 1959} {"train_loss": -11.794449806213379, "global_step": 329212, "epoch": 1959} {"train_loss": -9.708800315856934, "global_step": 329213, "epoch": 1959} {"train_loss": -11.862371444702148, "global_step": 329214, "epoch": 1959} {"train_loss": -11.67886734008789, "global_step": 329215, "epoch": 1959} {"train_loss": -10.984081268310547, "global_step": 329216, "epoch": 1959} {"train_loss": -11.718071937561035, "global_step": 329217, "epoch": 1959} {"train_loss": -11.976081848144531, "global_step": 329218, "epoch": 1959} {"train_loss": -10.95248031616211, "global_step": 329219, "epoch": 1959} {"train_loss": -11.790383338928223, "global_step": 329220, "epoch": 1959} {"train_loss": -11.688157081604004, "global_step": 329221, "epoch": 1959} {"train_loss": -12.112115859985352, "global_step": 329222, "epoch": 1959} {"train_loss": -11.684895515441895, "global_step": 329223, "epoch": 1959} {"train_loss": -12.370819091796875, "global_step": 329224, "epoch": 1959} {"train_loss": -11.776094436645508, "global_step": 329225, "epoch": 1959} {"train_loss": -12.142664909362793, "global_step": 329226, "epoch": 1959} {"train_loss": -11.819457054138184, "global_step": 329227, "epoch": 1959} {"train_loss": -11.731403350830078, "global_step": 329228, "epoch": 1959} {"train_loss": -11.823719024658203, "global_step": 329229, "epoch": 1959} {"train_loss": -11.924421310424805, "global_step": 329230, "epoch": 1959} {"train_loss": -12.275728225708008, "global_step": 329231, "epoch": 1959} {"train_loss": -12.297471046447754, "global_step": 329232, "epoch": 1959} {"train_loss": -12.2119779586792, "global_step": 329233, "epoch": 1959} {"train_loss": -11.896781921386719, "global_step": 329234, "epoch": 1959} {"train_loss": -12.41584300994873, "global_step": 329235, "epoch": 1959} {"train_loss": -12.443279266357422, "global_step": 329236, "epoch": 1959} {"train_loss": -12.129764556884766, "global_step": 329237, "epoch": 1959} {"train_loss": -12.198799133300781, "global_step": 329238, "epoch": 1959} {"train_loss": -12.235448837280273, "global_step": 329239, "epoch": 1959} {"train_loss": -12.23210334777832, "global_step": 329240, "epoch": 1959} {"train_loss": -12.591014862060547, "global_step": 329241, "epoch": 1959} {"train_loss": -12.01164436340332, "global_step": 329242, "epoch": 1959} {"train_loss": -12.276103973388672, "global_step": 329243, "epoch": 1959} {"train_loss": -12.008279800415039, "global_step": 329244, "epoch": 1959} {"train_loss": -11.850305557250977, "global_step": 329245, "epoch": 1959} {"train_loss": -12.038639068603516, "global_step": 329246, "epoch": 1959} {"train_loss": -12.185873031616211, "global_step": 329247, "epoch": 1959} {"train_loss": -11.894134521484375, "global_step": 329248, "epoch": 1959} {"train_loss": -12.304859161376953, "global_step": 329249, "epoch": 1959} {"train_loss": -12.285000801086426, "global_step": 329250, "epoch": 1959} {"train_loss": -12.170315742492676, "global_step": 329251, "epoch": 1959} {"train_loss": -12.272483825683594, "global_step": 329252, "epoch": 1959} {"train_loss": -11.93709659576416, "global_step": 329253, "epoch": 1959} {"train_loss": -12.382247924804688, "global_step": 329254, "epoch": 1959} {"train_loss": -11.862576484680176, "global_step": 329255, "epoch": 1959} {"train_loss": -11.675567626953125, "global_step": 329256, "epoch": 1959} {"train_loss": -12.239360809326172, "global_step": 329257, "epoch": 1959} {"train_loss": -11.716691970825195, "global_step": 329258, "epoch": 1959} {"train_loss": -11.702577590942383, "global_step": 329259, "epoch": 1959} {"train_loss": -11.921711921691895, "global_step": 329260, "epoch": 1959} {"train_loss": -12.348194122314453, "global_step": 329261, "epoch": 1959} {"train_loss": -11.785089492797852, "global_step": 329262, "epoch": 1959} {"train_loss": -12.128410339355469, "global_step": 329263, "epoch": 1959} {"train_loss": -11.228517532348633, "global_step": 329264, "epoch": 1959} {"train_loss": -11.752934455871582, "global_step": 329265, "epoch": 1959} {"train_loss": -11.364670753479004, "global_step": 329266, "epoch": 1959} {"train_loss": -11.333950996398926, "global_step": 329267, "epoch": 1959} {"train_loss": -10.967565536499023, "global_step": 329268, "epoch": 1959} {"train_loss": -10.566118240356445, "global_step": 329269, "epoch": 1959} {"train_loss": -11.009801864624023, "global_step": 329270, "epoch": 1959} {"train_loss": -11.096452713012695, "global_step": 329271, "epoch": 1959} {"train_loss": -9.689484596252441, "global_step": 329272, "epoch": 1959} {"train_loss": -10.491813659667969, "global_step": 329273, "epoch": 1959} {"train_loss": -11.520502090454102, "global_step": 329274, "epoch": 1959} {"train_loss": -10.687856674194336, "global_step": 329275, "epoch": 1959} {"train_loss": -10.627166748046875, "global_step": 329276, "epoch": 1959} {"train_loss": -10.709419250488281, "global_step": 329277, "epoch": 1959} {"train_loss": -11.62476921081543, "global_step": 329278, "epoch": 1959} {"train_loss": -11.992777126176017, "global_step": 329279, "epoch": 1959, "val_loss": 283517.28125} {"train_loss": -11.58291244506836, "global_step": 329280, "epoch": 1960} {"train_loss": -11.11591911315918, "global_step": 329281, "epoch": 1960} {"train_loss": -10.78346061706543, "global_step": 329282, "epoch": 1960} {"train_loss": -11.755998611450195, "global_step": 329283, "epoch": 1960} {"train_loss": -11.222427368164062, "global_step": 329284, "epoch": 1960} {"train_loss": -11.70516300201416, "global_step": 329285, "epoch": 1960} {"train_loss": -11.63455581665039, "global_step": 329286, "epoch": 1960} {"train_loss": -11.548049926757812, "global_step": 329287, "epoch": 1960} {"train_loss": -12.07220458984375, "global_step": 329288, "epoch": 1960} {"train_loss": -11.341928482055664, "global_step": 329289, "epoch": 1960} {"train_loss": -11.981096267700195, "global_step": 329290, "epoch": 1960} {"train_loss": -11.551088333129883, "global_step": 329291, "epoch": 1960} {"train_loss": -11.300676345825195, "global_step": 329292, "epoch": 1960} {"train_loss": -11.986167907714844, "global_step": 329293, "epoch": 1960} {"train_loss": -11.85136604309082, "global_step": 329294, "epoch": 1960} {"train_loss": -11.805709838867188, "global_step": 329295, "epoch": 1960} {"train_loss": -11.889792442321777, "global_step": 329296, "epoch": 1960} {"train_loss": -11.653263092041016, "global_step": 329297, "epoch": 1960} {"train_loss": -12.096622467041016, "global_step": 329298, "epoch": 1960} {"train_loss": -11.693222045898438, "global_step": 329299, "epoch": 1960} {"train_loss": -11.874374389648438, "global_step": 329300, "epoch": 1960} {"train_loss": -11.663183212280273, "global_step": 329301, "epoch": 1960} {"train_loss": -11.864280700683594, "global_step": 329302, "epoch": 1960} {"train_loss": -11.93182373046875, "global_step": 329303, "epoch": 1960} {"train_loss": -12.161967277526855, "global_step": 329304, "epoch": 1960} {"train_loss": -11.625528335571289, "global_step": 329305, "epoch": 1960} {"train_loss": -12.06621265411377, "global_step": 329306, "epoch": 1960} {"train_loss": -11.732312202453613, "global_step": 329307, "epoch": 1960} {"train_loss": -12.062286376953125, "global_step": 329308, "epoch": 1960} {"train_loss": -12.227470397949219, "global_step": 329309, "epoch": 1960} {"train_loss": -11.812721252441406, "global_step": 329310, "epoch": 1960} {"train_loss": -11.9880952835083, "global_step": 329311, "epoch": 1960} {"train_loss": -11.687515258789062, "global_step": 329312, "epoch": 1960} {"train_loss": -11.963479995727539, "global_step": 329313, "epoch": 1960} {"train_loss": -12.124267578125, "global_step": 329314, "epoch": 1960} {"train_loss": -12.095882415771484, "global_step": 329315, "epoch": 1960} {"train_loss": -12.250787734985352, "global_step": 329316, "epoch": 1960} {"train_loss": -11.916418075561523, "global_step": 329317, "epoch": 1960} {"train_loss": -11.996763229370117, "global_step": 329318, "epoch": 1960} {"train_loss": -12.398805618286133, "global_step": 329319, "epoch": 1960} {"train_loss": -12.122983932495117, "global_step": 329320, "epoch": 1960} {"train_loss": -12.142199516296387, "global_step": 329321, "epoch": 1960} {"train_loss": -11.968320846557617, "global_step": 329322, "epoch": 1960} {"train_loss": -11.861676216125488, "global_step": 329323, "epoch": 1960} {"train_loss": -11.886041641235352, "global_step": 329324, "epoch": 1960} {"train_loss": -12.213752746582031, "global_step": 329325, "epoch": 1960} {"train_loss": -11.951395034790039, "global_step": 329326, "epoch": 1960} {"train_loss": -12.351645469665527, "global_step": 329327, "epoch": 1960} {"train_loss": -12.19809627532959, "global_step": 329328, "epoch": 1960} {"train_loss": -12.377584457397461, "global_step": 329329, "epoch": 1960} {"train_loss": -12.112238883972168, "global_step": 329330, "epoch": 1960} {"train_loss": -12.278955459594727, "global_step": 329331, "epoch": 1960} {"train_loss": -12.216176986694336, "global_step": 329332, "epoch": 1960} {"train_loss": -12.30346393585205, "global_step": 329333, "epoch": 1960} {"train_loss": -12.461166381835938, "global_step": 329334, "epoch": 1960} {"train_loss": -12.461498260498047, "global_step": 329335, "epoch": 1960} {"train_loss": -12.446048736572266, "global_step": 329336, "epoch": 1960} {"train_loss": -12.206865310668945, "global_step": 329337, "epoch": 1960} {"train_loss": -12.412851333618164, "global_step": 329338, "epoch": 1960} {"train_loss": -12.408723831176758, "global_step": 329339, "epoch": 1960} {"train_loss": -12.560221672058105, "global_step": 329340, "epoch": 1960} {"train_loss": -12.08603286743164, "global_step": 329341, "epoch": 1960} {"train_loss": -12.417455673217773, "global_step": 329342, "epoch": 1960} {"train_loss": -12.422826766967773, "global_step": 329343, "epoch": 1960} {"train_loss": -12.377335548400879, "global_step": 329344, "epoch": 1960} {"train_loss": -12.063558578491211, "global_step": 329345, "epoch": 1960} {"train_loss": -12.299810409545898, "global_step": 329346, "epoch": 1960} {"train_loss": -12.526403427124023, "global_step": 329347, "epoch": 1960} {"train_loss": -12.45029067993164, "global_step": 329348, "epoch": 1960} {"train_loss": -12.556644439697266, "global_step": 329349, "epoch": 1960} {"train_loss": -12.433929443359375, "global_step": 329350, "epoch": 1960} {"train_loss": -12.528305053710938, "global_step": 329351, "epoch": 1960} {"train_loss": -12.434327125549316, "global_step": 329352, "epoch": 1960} {"train_loss": -12.628719329833984, "global_step": 329353, "epoch": 1960} {"train_loss": -12.351865768432617, "global_step": 329354, "epoch": 1960} {"train_loss": -12.454398155212402, "global_step": 329355, "epoch": 1960} {"train_loss": -12.249149322509766, "global_step": 329356, "epoch": 1960} {"train_loss": -12.079500198364258, "global_step": 329357, "epoch": 1960} {"train_loss": -12.615239143371582, "global_step": 329358, "epoch": 1960} {"train_loss": -12.313488006591797, "global_step": 329359, "epoch": 1960} {"train_loss": -11.439926147460938, "global_step": 329360, "epoch": 1960} {"train_loss": -12.32992935180664, "global_step": 329361, "epoch": 1960} {"train_loss": -12.409221649169922, "global_step": 329362, "epoch": 1960} {"train_loss": -11.743236541748047, "global_step": 329363, "epoch": 1960} {"train_loss": -11.727884292602539, "global_step": 329364, "epoch": 1960} {"train_loss": -12.379438400268555, "global_step": 329365, "epoch": 1960} {"train_loss": -11.539827346801758, "global_step": 329366, "epoch": 1960} {"train_loss": -11.702238082885742, "global_step": 329367, "epoch": 1960} {"train_loss": -12.353751182556152, "global_step": 329368, "epoch": 1960} {"train_loss": -11.722349166870117, "global_step": 329369, "epoch": 1960} {"train_loss": -11.644414901733398, "global_step": 329370, "epoch": 1960} {"train_loss": -12.190552711486816, "global_step": 329371, "epoch": 1960} {"train_loss": -11.294454574584961, "global_step": 329372, "epoch": 1960} {"train_loss": -12.31583023071289, "global_step": 329373, "epoch": 1960} {"train_loss": -11.7818603515625, "global_step": 329374, "epoch": 1960} {"train_loss": -11.125726699829102, "global_step": 329375, "epoch": 1960} {"train_loss": -12.066728591918945, "global_step": 329376, "epoch": 1960} {"train_loss": -12.354448318481445, "global_step": 329377, "epoch": 1960} {"train_loss": -12.285223960876465, "global_step": 329378, "epoch": 1960} {"train_loss": -12.083656311035156, "global_step": 329379, "epoch": 1960} {"train_loss": -12.210533142089844, "global_step": 329380, "epoch": 1960} {"train_loss": -12.148001670837402, "global_step": 329381, "epoch": 1960} {"train_loss": -12.619892120361328, "global_step": 329382, "epoch": 1960} {"train_loss": -12.146915435791016, "global_step": 329383, "epoch": 1960} {"train_loss": -12.507064819335938, "global_step": 329384, "epoch": 1960} {"train_loss": -12.206110000610352, "global_step": 329385, "epoch": 1960} {"train_loss": -12.64803695678711, "global_step": 329386, "epoch": 1960} {"train_loss": -12.420267105102539, "global_step": 329387, "epoch": 1960} {"train_loss": -12.377714157104492, "global_step": 329388, "epoch": 1960} {"train_loss": -12.516561508178711, "global_step": 329389, "epoch": 1960} {"train_loss": -12.479681015014648, "global_step": 329390, "epoch": 1960} {"train_loss": -12.168724060058594, "global_step": 329391, "epoch": 1960} {"train_loss": -12.375955581665039, "global_step": 329392, "epoch": 1960} {"train_loss": -12.016944885253906, "global_step": 329393, "epoch": 1960} {"train_loss": -12.160305976867676, "global_step": 329394, "epoch": 1960} {"train_loss": -12.054086685180664, "global_step": 329395, "epoch": 1960} {"train_loss": -11.902595520019531, "global_step": 329396, "epoch": 1960} {"train_loss": -11.438496589660645, "global_step": 329397, "epoch": 1960} {"train_loss": -11.92943000793457, "global_step": 329398, "epoch": 1960} {"train_loss": -11.446247100830078, "global_step": 329399, "epoch": 1960} {"train_loss": -11.967191696166992, "global_step": 329400, "epoch": 1960} {"train_loss": -11.054879188537598, "global_step": 329401, "epoch": 1960} {"train_loss": -11.7825288772583, "global_step": 329402, "epoch": 1960} {"train_loss": -11.391868591308594, "global_step": 329403, "epoch": 1960} {"train_loss": -10.443489074707031, "global_step": 329404, "epoch": 1960} {"train_loss": -11.766645431518555, "global_step": 329405, "epoch": 1960} {"train_loss": -10.966379165649414, "global_step": 329406, "epoch": 1960} {"train_loss": -11.170310974121094, "global_step": 329407, "epoch": 1960} {"train_loss": -11.695718765258789, "global_step": 329408, "epoch": 1960} {"train_loss": -10.257625579833984, "global_step": 329409, "epoch": 1960} {"train_loss": -11.996847152709961, "global_step": 329410, "epoch": 1960} {"train_loss": -11.492679595947266, "global_step": 329411, "epoch": 1960} {"train_loss": -11.974770545959473, "global_step": 329412, "epoch": 1960} {"train_loss": -11.325490951538086, "global_step": 329413, "epoch": 1960} {"train_loss": -11.07308578491211, "global_step": 329414, "epoch": 1960} {"train_loss": -12.093193054199219, "global_step": 329415, "epoch": 1960} {"train_loss": -11.542797088623047, "global_step": 329416, "epoch": 1960} {"train_loss": -12.343605041503906, "global_step": 329417, "epoch": 1960} {"train_loss": -11.33224868774414, "global_step": 329418, "epoch": 1960} {"train_loss": -11.568649291992188, "global_step": 329419, "epoch": 1960} {"train_loss": -11.911552429199219, "global_step": 329420, "epoch": 1960} {"train_loss": -11.407939910888672, "global_step": 329421, "epoch": 1960} {"train_loss": -11.598846435546875, "global_step": 329422, "epoch": 1960} {"train_loss": -11.617391586303711, "global_step": 329423, "epoch": 1960} {"train_loss": -11.366607666015625, "global_step": 329424, "epoch": 1960} {"train_loss": -11.025794982910156, "global_step": 329425, "epoch": 1960} {"train_loss": -11.332820892333984, "global_step": 329426, "epoch": 1960} {"train_loss": -11.109689712524414, "global_step": 329427, "epoch": 1960} {"train_loss": -11.560699462890625, "global_step": 329428, "epoch": 1960} {"train_loss": -10.962026596069336, "global_step": 329429, "epoch": 1960} {"train_loss": -10.998794555664062, "global_step": 329430, "epoch": 1960} {"train_loss": -10.687267303466797, "global_step": 329431, "epoch": 1960} {"train_loss": -10.421598434448242, "global_step": 329432, "epoch": 1960} {"train_loss": -10.65241527557373, "global_step": 329433, "epoch": 1960} {"train_loss": -10.470193862915039, "global_step": 329434, "epoch": 1960} {"train_loss": -11.750165939331055, "global_step": 329435, "epoch": 1960} {"train_loss": -10.450451850891113, "global_step": 329436, "epoch": 1960} {"train_loss": -11.84575080871582, "global_step": 329437, "epoch": 1960} {"train_loss": -11.115683555603027, "global_step": 329438, "epoch": 1960} {"train_loss": -11.42241096496582, "global_step": 329439, "epoch": 1960} {"train_loss": -12.026111602783203, "global_step": 329440, "epoch": 1960} {"train_loss": -11.708576202392578, "global_step": 329441, "epoch": 1960} {"train_loss": -11.979354858398438, "global_step": 329442, "epoch": 1960} {"train_loss": -11.841940879821777, "global_step": 329443, "epoch": 1960} {"train_loss": -11.80060863494873, "global_step": 329444, "epoch": 1960} {"train_loss": -12.053592681884766, "global_step": 329445, "epoch": 1960} {"train_loss": -11.595006942749023, "global_step": 329446, "epoch": 1960} {"train_loss": -11.87035900638217, "global_step": 329447, "epoch": 1960, "val_loss": 287303.59375, "train_action_mse_error": 1.2909971475601196} {"train_loss": -11.6070556640625, "global_step": 329448, "epoch": 1961} {"train_loss": -11.929646492004395, "global_step": 329449, "epoch": 1961} {"train_loss": -11.601395606994629, "global_step": 329450, "epoch": 1961} {"train_loss": -11.945566177368164, "global_step": 329451, "epoch": 1961} {"train_loss": -11.906854629516602, "global_step": 329452, "epoch": 1961} {"train_loss": -11.894569396972656, "global_step": 329453, "epoch": 1961} {"train_loss": -12.226672172546387, "global_step": 329454, "epoch": 1961} {"train_loss": -11.811553955078125, "global_step": 329455, "epoch": 1961} {"train_loss": -12.152536392211914, "global_step": 329456, "epoch": 1961} {"train_loss": -11.815813064575195, "global_step": 329457, "epoch": 1961} {"train_loss": -12.094547271728516, "global_step": 329458, "epoch": 1961} {"train_loss": -12.131475448608398, "global_step": 329459, "epoch": 1961} {"train_loss": -12.282320976257324, "global_step": 329460, "epoch": 1961} {"train_loss": -11.935064315795898, "global_step": 329461, "epoch": 1961} {"train_loss": -11.951153755187988, "global_step": 329462, "epoch": 1961} {"train_loss": -11.98170280456543, "global_step": 329463, "epoch": 1961} {"train_loss": -12.031126022338867, "global_step": 329464, "epoch": 1961} {"train_loss": -12.239540100097656, "global_step": 329465, "epoch": 1961} {"train_loss": -11.723541259765625, "global_step": 329466, "epoch": 1961} {"train_loss": -12.096715927124023, "global_step": 329467, "epoch": 1961} {"train_loss": -11.613781929016113, "global_step": 329468, "epoch": 1961} {"train_loss": -12.143730163574219, "global_step": 329469, "epoch": 1961} {"train_loss": -11.935552597045898, "global_step": 329470, "epoch": 1961} {"train_loss": -12.071911811828613, "global_step": 329471, "epoch": 1961} {"train_loss": -12.113004684448242, "global_step": 329472, "epoch": 1961} {"train_loss": -12.285404205322266, "global_step": 329473, "epoch": 1961} {"train_loss": -12.217731475830078, "global_step": 329474, "epoch": 1961} {"train_loss": -12.303293228149414, "global_step": 329475, "epoch": 1961} {"train_loss": -12.024585723876953, "global_step": 329476, "epoch": 1961} {"train_loss": -12.447197914123535, "global_step": 329477, "epoch": 1961} {"train_loss": -12.36717414855957, "global_step": 329478, "epoch": 1961} {"train_loss": -12.373473167419434, "global_step": 329479, "epoch": 1961} {"train_loss": -12.573392868041992, "global_step": 329480, "epoch": 1961} {"train_loss": -12.306052207946777, "global_step": 329481, "epoch": 1961} {"train_loss": -12.266561508178711, "global_step": 329482, "epoch": 1961} {"train_loss": -12.320938110351562, "global_step": 329483, "epoch": 1961} {"train_loss": -12.563209533691406, "global_step": 329484, "epoch": 1961} {"train_loss": -12.441198348999023, "global_step": 329485, "epoch": 1961} {"train_loss": -12.41879653930664, "global_step": 329486, "epoch": 1961} {"train_loss": -12.33059310913086, "global_step": 329487, "epoch": 1961} {"train_loss": -12.554159164428711, "global_step": 329488, "epoch": 1961} {"train_loss": -12.563233375549316, "global_step": 329489, "epoch": 1961} {"train_loss": -12.421760559082031, "global_step": 329490, "epoch": 1961} {"train_loss": -12.449700355529785, "global_step": 329491, "epoch": 1961} {"train_loss": -12.308606147766113, "global_step": 329492, "epoch": 1961} {"train_loss": -12.60159969329834, "global_step": 329493, "epoch": 1961} {"train_loss": -12.45805835723877, "global_step": 329494, "epoch": 1961} {"train_loss": -12.462419509887695, "global_step": 329495, "epoch": 1961} {"train_loss": -12.613945007324219, "global_step": 329496, "epoch": 1961} {"train_loss": -12.362434387207031, "global_step": 329497, "epoch": 1961} {"train_loss": -12.43588638305664, "global_step": 329498, "epoch": 1961} {"train_loss": -12.309335708618164, "global_step": 329499, "epoch": 1961} {"train_loss": -12.54465103149414, "global_step": 329500, "epoch": 1961} {"train_loss": -12.243476867675781, "global_step": 329501, "epoch": 1961} {"train_loss": -12.65948486328125, "global_step": 329502, "epoch": 1961} {"train_loss": -12.394132614135742, "global_step": 329503, "epoch": 1961} {"train_loss": -12.420839309692383, "global_step": 329504, "epoch": 1961} {"train_loss": -12.599172592163086, "global_step": 329505, "epoch": 1961} {"train_loss": -12.436224937438965, "global_step": 329506, "epoch": 1961} {"train_loss": -12.648689270019531, "global_step": 329507, "epoch": 1961} {"train_loss": -12.367114067077637, "global_step": 329508, "epoch": 1961} {"train_loss": -12.661529541015625, "global_step": 329509, "epoch": 1961} {"train_loss": -12.731454849243164, "global_step": 329510, "epoch": 1961} {"train_loss": -12.461006164550781, "global_step": 329511, "epoch": 1961} {"train_loss": -12.466939926147461, "global_step": 329512, "epoch": 1961} {"train_loss": -12.649175643920898, "global_step": 329513, "epoch": 1961} {"train_loss": -12.733182907104492, "global_step": 329514, "epoch": 1961} {"train_loss": -12.499731063842773, "global_step": 329515, "epoch": 1961} {"train_loss": -12.328146934509277, "global_step": 329516, "epoch": 1961} {"train_loss": -12.763081550598145, "global_step": 329517, "epoch": 1961} {"train_loss": -12.660070419311523, "global_step": 329518, "epoch": 1961} {"train_loss": -12.684450149536133, "global_step": 329519, "epoch": 1961} {"train_loss": -12.637446403503418, "global_step": 329520, "epoch": 1961} {"train_loss": -12.445561408996582, "global_step": 329521, "epoch": 1961} {"train_loss": -12.455288887023926, "global_step": 329522, "epoch": 1961} {"train_loss": -12.164885520935059, "global_step": 329523, "epoch": 1961} {"train_loss": -12.58897590637207, "global_step": 329524, "epoch": 1961} {"train_loss": -12.557962417602539, "global_step": 329525, "epoch": 1961} {"train_loss": -11.970888137817383, "global_step": 329526, "epoch": 1961} {"train_loss": -11.635575294494629, "global_step": 329527, "epoch": 1961} {"train_loss": -11.334268569946289, "global_step": 329528, "epoch": 1961} {"train_loss": -10.215526580810547, "global_step": 329529, "epoch": 1961} {"train_loss": -11.730191230773926, "global_step": 329530, "epoch": 1961} {"train_loss": -11.876665115356445, "global_step": 329531, "epoch": 1961} {"train_loss": -9.033426284790039, "global_step": 329532, "epoch": 1961} {"train_loss": -12.109930038452148, "global_step": 329533, "epoch": 1961} {"train_loss": -11.26126480102539, "global_step": 329534, "epoch": 1961} {"train_loss": -9.51021957397461, "global_step": 329535, "epoch": 1961} {"train_loss": -11.271866798400879, "global_step": 329536, "epoch": 1961} {"train_loss": -12.222599029541016, "global_step": 329537, "epoch": 1961} {"train_loss": -11.100760459899902, "global_step": 329538, "epoch": 1961} {"train_loss": -9.379437446594238, "global_step": 329539, "epoch": 1961} {"train_loss": -11.048351287841797, "global_step": 329540, "epoch": 1961} {"train_loss": -11.657926559448242, "global_step": 329541, "epoch": 1961} {"train_loss": -10.630146026611328, "global_step": 329542, "epoch": 1961} {"train_loss": -12.005027770996094, "global_step": 329543, "epoch": 1961} {"train_loss": -11.612837791442871, "global_step": 329544, "epoch": 1961} {"train_loss": -11.209232330322266, "global_step": 329545, "epoch": 1961} {"train_loss": -11.47411060333252, "global_step": 329546, "epoch": 1961} {"train_loss": -11.352025985717773, "global_step": 329547, "epoch": 1961} {"train_loss": -11.736471176147461, "global_step": 329548, "epoch": 1961} {"train_loss": -12.479022026062012, "global_step": 329549, "epoch": 1961} {"train_loss": -11.549178123474121, "global_step": 329550, "epoch": 1961} {"train_loss": -12.11388874053955, "global_step": 329551, "epoch": 1961} {"train_loss": -11.755577087402344, "global_step": 329552, "epoch": 1961} {"train_loss": -12.096918106079102, "global_step": 329553, "epoch": 1961} {"train_loss": -12.028303146362305, "global_step": 329554, "epoch": 1961} {"train_loss": -11.31700325012207, "global_step": 329555, "epoch": 1961} {"train_loss": -11.833633422851562, "global_step": 329556, "epoch": 1961} {"train_loss": -11.769683837890625, "global_step": 329557, "epoch": 1961} {"train_loss": -11.461122512817383, "global_step": 329558, "epoch": 1961} {"train_loss": -11.695785522460938, "global_step": 329559, "epoch": 1961} {"train_loss": -10.141916275024414, "global_step": 329560, "epoch": 1961} {"train_loss": -11.10533618927002, "global_step": 329561, "epoch": 1961} {"train_loss": -10.8470458984375, "global_step": 329562, "epoch": 1961} {"train_loss": -10.250804901123047, "global_step": 329563, "epoch": 1961} {"train_loss": -10.755940437316895, "global_step": 329564, "epoch": 1961} {"train_loss": -10.008500099182129, "global_step": 329565, "epoch": 1961} {"train_loss": -9.806318283081055, "global_step": 329566, "epoch": 1961} {"train_loss": -10.916227340698242, "global_step": 329567, "epoch": 1961} {"train_loss": -9.92863941192627, "global_step": 329568, "epoch": 1961} {"train_loss": -10.414901733398438, "global_step": 329569, "epoch": 1961} {"train_loss": -11.030994415283203, "global_step": 329570, "epoch": 1961} {"train_loss": -9.78128433227539, "global_step": 329571, "epoch": 1961} {"train_loss": -10.846175193786621, "global_step": 329572, "epoch": 1961} {"train_loss": -11.10892391204834, "global_step": 329573, "epoch": 1961} {"train_loss": -10.66855239868164, "global_step": 329574, "epoch": 1961} {"train_loss": -12.06345272064209, "global_step": 329575, "epoch": 1961} {"train_loss": -11.356575012207031, "global_step": 329576, "epoch": 1961} {"train_loss": -11.078076362609863, "global_step": 329577, "epoch": 1961} {"train_loss": -11.897209167480469, "global_step": 329578, "epoch": 1961} {"train_loss": -11.130636215209961, "global_step": 329579, "epoch": 1961} {"train_loss": -11.235028266906738, "global_step": 329580, "epoch": 1961} {"train_loss": -12.123504638671875, "global_step": 329581, "epoch": 1961} {"train_loss": -10.915079116821289, "global_step": 329582, "epoch": 1961} {"train_loss": -11.780162811279297, "global_step": 329583, "epoch": 1961} {"train_loss": -11.706356048583984, "global_step": 329584, "epoch": 1961} {"train_loss": -11.186870574951172, "global_step": 329585, "epoch": 1961} {"train_loss": -12.01126766204834, "global_step": 329586, "epoch": 1961} {"train_loss": -11.799553871154785, "global_step": 329587, "epoch": 1961} {"train_loss": -11.559598922729492, "global_step": 329588, "epoch": 1961} {"train_loss": -11.598748207092285, "global_step": 329589, "epoch": 1961} {"train_loss": -12.055713653564453, "global_step": 329590, "epoch": 1961} {"train_loss": -11.906744956970215, "global_step": 329591, "epoch": 1961} {"train_loss": -12.223398208618164, "global_step": 329592, "epoch": 1961} {"train_loss": -11.820520401000977, "global_step": 329593, "epoch": 1961} {"train_loss": -11.82937240600586, "global_step": 329594, "epoch": 1961} {"train_loss": -11.976990699768066, "global_step": 329595, "epoch": 1961} {"train_loss": -11.807310104370117, "global_step": 329596, "epoch": 1961} {"train_loss": -12.331302642822266, "global_step": 329597, "epoch": 1961} {"train_loss": -11.898283004760742, "global_step": 329598, "epoch": 1961} {"train_loss": -11.825034141540527, "global_step": 329599, "epoch": 1961} {"train_loss": -12.284549713134766, "global_step": 329600, "epoch": 1961} {"train_loss": -12.194408416748047, "global_step": 329601, "epoch": 1961} {"train_loss": -12.353575706481934, "global_step": 329602, "epoch": 1961} {"train_loss": -12.201948165893555, "global_step": 329603, "epoch": 1961} {"train_loss": -12.301271438598633, "global_step": 329604, "epoch": 1961} {"train_loss": -12.185150146484375, "global_step": 329605, "epoch": 1961} {"train_loss": -12.236284255981445, "global_step": 329606, "epoch": 1961} {"train_loss": -12.020386695861816, "global_step": 329607, "epoch": 1961} {"train_loss": -12.276267051696777, "global_step": 329608, "epoch": 1961} {"train_loss": -12.186258316040039, "global_step": 329609, "epoch": 1961} {"train_loss": -12.216320991516113, "global_step": 329610, "epoch": 1961} {"train_loss": -12.460418701171875, "global_step": 329611, "epoch": 1961} {"train_loss": -12.163042068481445, "global_step": 329612, "epoch": 1961} {"train_loss": -12.218502044677734, "global_step": 329613, "epoch": 1961} {"train_loss": -12.254783630371094, "global_step": 329614, "epoch": 1961} {"train_loss": -11.867710198674883, "global_step": 329615, "epoch": 1961, "val_loss": 288238.15625} {"train_loss": -12.341971397399902, "global_step": 329616, "epoch": 1962} {"train_loss": -12.219437599182129, "global_step": 329617, "epoch": 1962} {"train_loss": -12.439974784851074, "global_step": 329618, "epoch": 1962} {"train_loss": -12.358601570129395, "global_step": 329619, "epoch": 1962} {"train_loss": -12.472925186157227, "global_step": 329620, "epoch": 1962} {"train_loss": -12.414678573608398, "global_step": 329621, "epoch": 1962} {"train_loss": -12.530570983886719, "global_step": 329622, "epoch": 1962} {"train_loss": -12.425193786621094, "global_step": 329623, "epoch": 1962} {"train_loss": -12.554912567138672, "global_step": 329624, "epoch": 1962} {"train_loss": -12.668825149536133, "global_step": 329625, "epoch": 1962} {"train_loss": -12.51505184173584, "global_step": 329626, "epoch": 1962} {"train_loss": -12.666943550109863, "global_step": 329627, "epoch": 1962} {"train_loss": -12.604238510131836, "global_step": 329628, "epoch": 1962} {"train_loss": -12.495645523071289, "global_step": 329629, "epoch": 1962} {"train_loss": -12.578908920288086, "global_step": 329630, "epoch": 1962} {"train_loss": -12.536880493164062, "global_step": 329631, "epoch": 1962} {"train_loss": -12.455224990844727, "global_step": 329632, "epoch": 1962} {"train_loss": -12.40003776550293, "global_step": 329633, "epoch": 1962} {"train_loss": -12.492897033691406, "global_step": 329634, "epoch": 1962} {"train_loss": -12.761478424072266, "global_step": 329635, "epoch": 1962} {"train_loss": -12.752565383911133, "global_step": 329636, "epoch": 1962} {"train_loss": -12.58794116973877, "global_step": 329637, "epoch": 1962} {"train_loss": -12.511159896850586, "global_step": 329638, "epoch": 1962} {"train_loss": -12.54660701751709, "global_step": 329639, "epoch": 1962} {"train_loss": -12.482288360595703, "global_step": 329640, "epoch": 1962} {"train_loss": -12.59358024597168, "global_step": 329641, "epoch": 1962} {"train_loss": -12.291353225708008, "global_step": 329642, "epoch": 1962} {"train_loss": -12.708781242370605, "global_step": 329643, "epoch": 1962} {"train_loss": -12.624996185302734, "global_step": 329644, "epoch": 1962} {"train_loss": -12.522268295288086, "global_step": 329645, "epoch": 1962} {"train_loss": -12.579277992248535, "global_step": 329646, "epoch": 1962} {"train_loss": -12.5910062789917, "global_step": 329647, "epoch": 1962} {"train_loss": -12.684076309204102, "global_step": 329648, "epoch": 1962} {"train_loss": -12.799619674682617, "global_step": 329649, "epoch": 1962} {"train_loss": -12.56070327758789, "global_step": 329650, "epoch": 1962} {"train_loss": -12.643415451049805, "global_step": 329651, "epoch": 1962} {"train_loss": -12.690570831298828, "global_step": 329652, "epoch": 1962} {"train_loss": -12.719036102294922, "global_step": 329653, "epoch": 1962} {"train_loss": -12.536572456359863, "global_step": 329654, "epoch": 1962} {"train_loss": -12.66238021850586, "global_step": 329655, "epoch": 1962} {"train_loss": -12.334274291992188, "global_step": 329656, "epoch": 1962} {"train_loss": -12.643733024597168, "global_step": 329657, "epoch": 1962} {"train_loss": -12.511726379394531, "global_step": 329658, "epoch": 1962} {"train_loss": -12.603236198425293, "global_step": 329659, "epoch": 1962} {"train_loss": -12.421205520629883, "global_step": 329660, "epoch": 1962} {"train_loss": -12.570840835571289, "global_step": 329661, "epoch": 1962} {"train_loss": -12.34431266784668, "global_step": 329662, "epoch": 1962} {"train_loss": -12.282127380371094, "global_step": 329663, "epoch": 1962} {"train_loss": -12.308427810668945, "global_step": 329664, "epoch": 1962} {"train_loss": -11.088741302490234, "global_step": 329665, "epoch": 1962} {"train_loss": -9.430707931518555, "global_step": 329666, "epoch": 1962} {"train_loss": -11.279273986816406, "global_step": 329667, "epoch": 1962} {"train_loss": -9.758447647094727, "global_step": 329668, "epoch": 1962} {"train_loss": -6.145810127258301, "global_step": 329669, "epoch": 1962} {"train_loss": -7.710297584533691, "global_step": 329670, "epoch": 1962} {"train_loss": -6.832732200622559, "global_step": 329671, "epoch": 1962} {"train_loss": -7.173084259033203, "global_step": 329672, "epoch": 1962} {"train_loss": -6.884315490722656, "global_step": 329673, "epoch": 1962} {"train_loss": -6.755062580108643, "global_step": 329674, "epoch": 1962} {"train_loss": -7.075491428375244, "global_step": 329675, "epoch": 1962} {"train_loss": -7.111281871795654, "global_step": 329676, "epoch": 1962} {"train_loss": -6.973577499389648, "global_step": 329677, "epoch": 1962} {"train_loss": -7.456241607666016, "global_step": 329678, "epoch": 1962} {"train_loss": -8.57246208190918, "global_step": 329679, "epoch": 1962} {"train_loss": -9.945507049560547, "global_step": 329680, "epoch": 1962} {"train_loss": -9.178528785705566, "global_step": 329681, "epoch": 1962} {"train_loss": -9.087722778320312, "global_step": 329682, "epoch": 1962} {"train_loss": -9.321151733398438, "global_step": 329683, "epoch": 1962} {"train_loss": -9.454758644104004, "global_step": 329684, "epoch": 1962} {"train_loss": -9.947498321533203, "global_step": 329685, "epoch": 1962} {"train_loss": -9.796436309814453, "global_step": 329686, "epoch": 1962} {"train_loss": -10.814132690429688, "global_step": 329687, "epoch": 1962} {"train_loss": -10.038461685180664, "global_step": 329688, "epoch": 1962} {"train_loss": -10.696477890014648, "global_step": 329689, "epoch": 1962} {"train_loss": -10.717562675476074, "global_step": 329690, "epoch": 1962} {"train_loss": -10.629264831542969, "global_step": 329691, "epoch": 1962} {"train_loss": -11.250181198120117, "global_step": 329692, "epoch": 1962} {"train_loss": -11.153541564941406, "global_step": 329693, "epoch": 1962} {"train_loss": -11.05000114440918, "global_step": 329694, "epoch": 1962} {"train_loss": -11.148082733154297, "global_step": 329695, "epoch": 1962} {"train_loss": -11.31301498413086, "global_step": 329696, "epoch": 1962} {"train_loss": -11.514883041381836, "global_step": 329697, "epoch": 1962} {"train_loss": -11.395580291748047, "global_step": 329698, "epoch": 1962} {"train_loss": -11.322527885437012, "global_step": 329699, "epoch": 1962} {"train_loss": -11.22252082824707, "global_step": 329700, "epoch": 1962} {"train_loss": -11.166101455688477, "global_step": 329701, "epoch": 1962} {"train_loss": -11.559398651123047, "global_step": 329702, "epoch": 1962} {"train_loss": -11.345027923583984, "global_step": 329703, "epoch": 1962} {"train_loss": -11.03640365600586, "global_step": 329704, "epoch": 1962} {"train_loss": -11.3699951171875, "global_step": 329705, "epoch": 1962} {"train_loss": -11.233816146850586, "global_step": 329706, "epoch": 1962} {"train_loss": -11.547142028808594, "global_step": 329707, "epoch": 1962} {"train_loss": -11.170486450195312, "global_step": 329708, "epoch": 1962} {"train_loss": -11.836909294128418, "global_step": 329709, "epoch": 1962} {"train_loss": -11.603632926940918, "global_step": 329710, "epoch": 1962} {"train_loss": -11.937111854553223, "global_step": 329711, "epoch": 1962} {"train_loss": -12.188555717468262, "global_step": 329712, "epoch": 1962} {"train_loss": -11.684181213378906, "global_step": 329713, "epoch": 1962} {"train_loss": -12.095369338989258, "global_step": 329714, "epoch": 1962} {"train_loss": -11.363614082336426, "global_step": 329715, "epoch": 1962} {"train_loss": -11.530933380126953, "global_step": 329716, "epoch": 1962} {"train_loss": -11.77779769897461, "global_step": 329717, "epoch": 1962} {"train_loss": -12.010906219482422, "global_step": 329718, "epoch": 1962} {"train_loss": -12.126774787902832, "global_step": 329719, "epoch": 1962} {"train_loss": -11.813362121582031, "global_step": 329720, "epoch": 1962} {"train_loss": -11.995489120483398, "global_step": 329721, "epoch": 1962} {"train_loss": -11.93166732788086, "global_step": 329722, "epoch": 1962} {"train_loss": -11.705904006958008, "global_step": 329723, "epoch": 1962} {"train_loss": -12.07313346862793, "global_step": 329724, "epoch": 1962} {"train_loss": -11.82573127746582, "global_step": 329725, "epoch": 1962} {"train_loss": -11.647260665893555, "global_step": 329726, "epoch": 1962} {"train_loss": -11.986279487609863, "global_step": 329727, "epoch": 1962} {"train_loss": -11.844425201416016, "global_step": 329728, "epoch": 1962} {"train_loss": -12.153615951538086, "global_step": 329729, "epoch": 1962} {"train_loss": -11.674507141113281, "global_step": 329730, "epoch": 1962} {"train_loss": -12.276336669921875, "global_step": 329731, "epoch": 1962} {"train_loss": -11.951713562011719, "global_step": 329732, "epoch": 1962} {"train_loss": -12.224533081054688, "global_step": 329733, "epoch": 1962} {"train_loss": -12.321405410766602, "global_step": 329734, "epoch": 1962} {"train_loss": -12.235530853271484, "global_step": 329735, "epoch": 1962} {"train_loss": -12.129201889038086, "global_step": 329736, "epoch": 1962} {"train_loss": -12.340869903564453, "global_step": 329737, "epoch": 1962} {"train_loss": -11.931586265563965, "global_step": 329738, "epoch": 1962} {"train_loss": -12.210433959960938, "global_step": 329739, "epoch": 1962} {"train_loss": -12.047883987426758, "global_step": 329740, "epoch": 1962} {"train_loss": -11.674057960510254, "global_step": 329741, "epoch": 1962} {"train_loss": -12.032386779785156, "global_step": 329742, "epoch": 1962} {"train_loss": -12.085862159729004, "global_step": 329743, "epoch": 1962} {"train_loss": -12.24409008026123, "global_step": 329744, "epoch": 1962} {"train_loss": -12.238138198852539, "global_step": 329745, "epoch": 1962} {"train_loss": -12.216297149658203, "global_step": 329746, "epoch": 1962} {"train_loss": -12.441940307617188, "global_step": 329747, "epoch": 1962} {"train_loss": -12.05036449432373, "global_step": 329748, "epoch": 1962} {"train_loss": -12.379796981811523, "global_step": 329749, "epoch": 1962} {"train_loss": -12.009902954101562, "global_step": 329750, "epoch": 1962} {"train_loss": -11.838333129882812, "global_step": 329751, "epoch": 1962} {"train_loss": -12.31148910522461, "global_step": 329752, "epoch": 1962} {"train_loss": -12.395102500915527, "global_step": 329753, "epoch": 1962} {"train_loss": -11.556865692138672, "global_step": 329754, "epoch": 1962} {"train_loss": -12.188386917114258, "global_step": 329755, "epoch": 1962} {"train_loss": -11.831351280212402, "global_step": 329756, "epoch": 1962} {"train_loss": -12.36417007446289, "global_step": 329757, "epoch": 1962} {"train_loss": -11.801310539245605, "global_step": 329758, "epoch": 1962} {"train_loss": -12.133071899414062, "global_step": 329759, "epoch": 1962} {"train_loss": -12.053956031799316, "global_step": 329760, "epoch": 1962} {"train_loss": -12.078508377075195, "global_step": 329761, "epoch": 1962} {"train_loss": -12.220329284667969, "global_step": 329762, "epoch": 1962} {"train_loss": -11.951835632324219, "global_step": 329763, "epoch": 1962} {"train_loss": -12.075103759765625, "global_step": 329764, "epoch": 1962} {"train_loss": -12.045735359191895, "global_step": 329765, "epoch": 1962} {"train_loss": -12.062639236450195, "global_step": 329766, "epoch": 1962} {"train_loss": -12.028575897216797, "global_step": 329767, "epoch": 1962} {"train_loss": -12.179141998291016, "global_step": 329768, "epoch": 1962} {"train_loss": -12.463041305541992, "global_step": 329769, "epoch": 1962} {"train_loss": -12.246337890625, "global_step": 329770, "epoch": 1962} {"train_loss": -12.138408660888672, "global_step": 329771, "epoch": 1962} {"train_loss": -11.943110466003418, "global_step": 329772, "epoch": 1962} {"train_loss": -12.08454418182373, "global_step": 329773, "epoch": 1962} {"train_loss": -11.78916072845459, "global_step": 329774, "epoch": 1962} {"train_loss": -12.239259719848633, "global_step": 329775, "epoch": 1962} {"train_loss": -11.657587051391602, "global_step": 329776, "epoch": 1962} {"train_loss": -11.664527893066406, "global_step": 329777, "epoch": 1962} {"train_loss": -11.5296630859375, "global_step": 329778, "epoch": 1962} {"train_loss": -10.922411918640137, "global_step": 329779, "epoch": 1962} {"train_loss": -11.895271301269531, "global_step": 329780, "epoch": 1962} {"train_loss": -10.920111656188965, "global_step": 329781, "epoch": 1962} {"train_loss": -12.321792602539062, "global_step": 329782, "epoch": 1962} {"train_loss": -11.568889098508018, "global_step": 329783, "epoch": 1962, "val_loss": 290178.125} {"train_loss": -12.122249603271484, "global_step": 329784, "epoch": 1963} {"train_loss": -11.19064712524414, "global_step": 329785, "epoch": 1963} {"train_loss": -11.993995666503906, "global_step": 329786, "epoch": 1963} {"train_loss": -11.555233001708984, "global_step": 329787, "epoch": 1963} {"train_loss": -11.802438735961914, "global_step": 329788, "epoch": 1963} {"train_loss": -11.704272270202637, "global_step": 329789, "epoch": 1963} {"train_loss": -11.94454288482666, "global_step": 329790, "epoch": 1963} {"train_loss": -11.582124710083008, "global_step": 329791, "epoch": 1963} {"train_loss": -11.466337203979492, "global_step": 329792, "epoch": 1963} {"train_loss": -11.942444801330566, "global_step": 329793, "epoch": 1963} {"train_loss": -11.956964492797852, "global_step": 329794, "epoch": 1963} {"train_loss": -11.708490371704102, "global_step": 329795, "epoch": 1963} {"train_loss": -12.185150146484375, "global_step": 329796, "epoch": 1963} {"train_loss": -11.86098861694336, "global_step": 329797, "epoch": 1963} {"train_loss": -12.19636058807373, "global_step": 329798, "epoch": 1963} {"train_loss": -12.244744300842285, "global_step": 329799, "epoch": 1963} {"train_loss": -12.054847717285156, "global_step": 329800, "epoch": 1963} {"train_loss": -12.36233901977539, "global_step": 329801, "epoch": 1963} {"train_loss": -12.168254852294922, "global_step": 329802, "epoch": 1963} {"train_loss": -12.304377555847168, "global_step": 329803, "epoch": 1963} {"train_loss": -12.280790328979492, "global_step": 329804, "epoch": 1963} {"train_loss": -12.199466705322266, "global_step": 329805, "epoch": 1963} {"train_loss": -12.491650581359863, "global_step": 329806, "epoch": 1963} {"train_loss": -12.208858489990234, "global_step": 329807, "epoch": 1963} {"train_loss": -12.472909927368164, "global_step": 329808, "epoch": 1963} {"train_loss": -12.158730506896973, "global_step": 329809, "epoch": 1963} {"train_loss": -12.256599426269531, "global_step": 329810, "epoch": 1963} {"train_loss": -12.298986434936523, "global_step": 329811, "epoch": 1963} {"train_loss": -12.104960441589355, "global_step": 329812, "epoch": 1963} {"train_loss": -12.314545631408691, "global_step": 329813, "epoch": 1963} {"train_loss": -12.196952819824219, "global_step": 329814, "epoch": 1963} {"train_loss": -12.433019638061523, "global_step": 329815, "epoch": 1963} {"train_loss": -12.194459915161133, "global_step": 329816, "epoch": 1963} {"train_loss": -12.321584701538086, "global_step": 329817, "epoch": 1963} {"train_loss": -12.209495544433594, "global_step": 329818, "epoch": 1963} {"train_loss": -12.257039070129395, "global_step": 329819, "epoch": 1963} {"train_loss": -12.113554000854492, "global_step": 329820, "epoch": 1963} {"train_loss": -12.047853469848633, "global_step": 329821, "epoch": 1963} {"train_loss": -12.405763626098633, "global_step": 329822, "epoch": 1963} {"train_loss": -12.260068893432617, "global_step": 329823, "epoch": 1963} {"train_loss": -11.695642471313477, "global_step": 329824, "epoch": 1963} {"train_loss": -11.96253490447998, "global_step": 329825, "epoch": 1963} {"train_loss": -12.193132400512695, "global_step": 329826, "epoch": 1963} {"train_loss": -11.810937881469727, "global_step": 329827, "epoch": 1963} {"train_loss": -11.783050537109375, "global_step": 329828, "epoch": 1963} {"train_loss": -12.176006317138672, "global_step": 329829, "epoch": 1963} {"train_loss": -12.790164947509766, "global_step": 329830, "epoch": 1963} {"train_loss": -11.788578987121582, "global_step": 329831, "epoch": 1963} {"train_loss": -12.296516418457031, "global_step": 329832, "epoch": 1963} {"train_loss": -12.30923080444336, "global_step": 329833, "epoch": 1963} {"train_loss": -10.915258407592773, "global_step": 329834, "epoch": 1963} {"train_loss": -11.569107055664062, "global_step": 329835, "epoch": 1963} {"train_loss": -11.115090370178223, "global_step": 329836, "epoch": 1963} {"train_loss": -10.766729354858398, "global_step": 329837, "epoch": 1963} {"train_loss": -10.958166122436523, "global_step": 329838, "epoch": 1963} {"train_loss": -10.543521881103516, "global_step": 329839, "epoch": 1963} {"train_loss": -11.814516067504883, "global_step": 329840, "epoch": 1963} {"train_loss": -10.353145599365234, "global_step": 329841, "epoch": 1963} {"train_loss": -11.736149787902832, "global_step": 329842, "epoch": 1963} {"train_loss": -9.991695404052734, "global_step": 329843, "epoch": 1963} {"train_loss": -11.075329780578613, "global_step": 329844, "epoch": 1963} {"train_loss": -10.51699447631836, "global_step": 329845, "epoch": 1963} {"train_loss": -9.466290473937988, "global_step": 329846, "epoch": 1963} {"train_loss": -8.828302383422852, "global_step": 329847, "epoch": 1963} {"train_loss": -9.284029006958008, "global_step": 329848, "epoch": 1963} {"train_loss": -9.871212005615234, "global_step": 329849, "epoch": 1963} {"train_loss": -9.982856750488281, "global_step": 329850, "epoch": 1963} {"train_loss": -9.669843673706055, "global_step": 329851, "epoch": 1963} {"train_loss": -10.152362823486328, "global_step": 329852, "epoch": 1963} {"train_loss": -9.659355163574219, "global_step": 329853, "epoch": 1963} {"train_loss": -10.299503326416016, "global_step": 329854, "epoch": 1963} {"train_loss": -10.458999633789062, "global_step": 329855, "epoch": 1963} {"train_loss": -10.872674942016602, "global_step": 329856, "epoch": 1963} {"train_loss": -10.581704139709473, "global_step": 329857, "epoch": 1963} {"train_loss": -11.565773963928223, "global_step": 329858, "epoch": 1963} {"train_loss": -11.125051498413086, "global_step": 329859, "epoch": 1963} {"train_loss": -11.058865547180176, "global_step": 329860, "epoch": 1963} {"train_loss": -11.403948783874512, "global_step": 329861, "epoch": 1963} {"train_loss": -10.99060344696045, "global_step": 329862, "epoch": 1963} {"train_loss": -11.452877044677734, "global_step": 329863, "epoch": 1963} {"train_loss": -11.64566707611084, "global_step": 329864, "epoch": 1963} {"train_loss": -11.413389205932617, "global_step": 329865, "epoch": 1963} {"train_loss": -11.955120086669922, "global_step": 329866, "epoch": 1963} {"train_loss": -11.304935455322266, "global_step": 329867, "epoch": 1963} {"train_loss": -11.977450370788574, "global_step": 329868, "epoch": 1963} {"train_loss": -11.320930480957031, "global_step": 329869, "epoch": 1963} {"train_loss": -11.456998825073242, "global_step": 329870, "epoch": 1963} {"train_loss": -11.798391342163086, "global_step": 329871, "epoch": 1963} {"train_loss": -11.651490211486816, "global_step": 329872, "epoch": 1963} {"train_loss": -11.858573913574219, "global_step": 329873, "epoch": 1963} {"train_loss": -11.845184326171875, "global_step": 329874, "epoch": 1963} {"train_loss": -11.956090927124023, "global_step": 329875, "epoch": 1963} {"train_loss": -11.707460403442383, "global_step": 329876, "epoch": 1963} {"train_loss": -11.978036880493164, "global_step": 329877, "epoch": 1963} {"train_loss": -11.546945571899414, "global_step": 329878, "epoch": 1963} {"train_loss": -12.108003616333008, "global_step": 329879, "epoch": 1963} {"train_loss": -12.047504425048828, "global_step": 329880, "epoch": 1963} {"train_loss": -12.120672225952148, "global_step": 329881, "epoch": 1963} {"train_loss": -11.979286193847656, "global_step": 329882, "epoch": 1963} {"train_loss": -12.207075119018555, "global_step": 329883, "epoch": 1963} {"train_loss": -12.221535682678223, "global_step": 329884, "epoch": 1963} {"train_loss": -12.235204696655273, "global_step": 329885, "epoch": 1963} {"train_loss": -12.37673568725586, "global_step": 329886, "epoch": 1963} {"train_loss": -12.243903160095215, "global_step": 329887, "epoch": 1963} {"train_loss": -12.156886100769043, "global_step": 329888, "epoch": 1963} {"train_loss": -12.296942710876465, "global_step": 329889, "epoch": 1963} {"train_loss": -12.096902847290039, "global_step": 329890, "epoch": 1963} {"train_loss": -12.29672622680664, "global_step": 329891, "epoch": 1963} {"train_loss": -12.094770431518555, "global_step": 329892, "epoch": 1963} {"train_loss": -12.221924781799316, "global_step": 329893, "epoch": 1963} {"train_loss": -12.173330307006836, "global_step": 329894, "epoch": 1963} {"train_loss": -12.389379501342773, "global_step": 329895, "epoch": 1963} {"train_loss": -12.276008605957031, "global_step": 329896, "epoch": 1963} {"train_loss": -12.012056350708008, "global_step": 329897, "epoch": 1963} {"train_loss": -12.322148323059082, "global_step": 329898, "epoch": 1963} {"train_loss": -11.99663257598877, "global_step": 329899, "epoch": 1963} {"train_loss": -12.170036315917969, "global_step": 329900, "epoch": 1963} {"train_loss": -11.901843070983887, "global_step": 329901, "epoch": 1963} {"train_loss": -12.347033500671387, "global_step": 329902, "epoch": 1963} {"train_loss": -12.050487518310547, "global_step": 329903, "epoch": 1963} {"train_loss": -12.446334838867188, "global_step": 329904, "epoch": 1963} {"train_loss": -12.179206848144531, "global_step": 329905, "epoch": 1963} {"train_loss": -12.012741088867188, "global_step": 329906, "epoch": 1963} {"train_loss": -12.217806816101074, "global_step": 329907, "epoch": 1963} {"train_loss": -12.122663497924805, "global_step": 329908, "epoch": 1963} {"train_loss": -12.36499309539795, "global_step": 329909, "epoch": 1963} {"train_loss": -12.081616401672363, "global_step": 329910, "epoch": 1963} {"train_loss": -12.366822242736816, "global_step": 329911, "epoch": 1963} {"train_loss": -12.329151153564453, "global_step": 329912, "epoch": 1963} {"train_loss": -12.364139556884766, "global_step": 329913, "epoch": 1963} {"train_loss": -12.316043853759766, "global_step": 329914, "epoch": 1963} {"train_loss": -12.203446388244629, "global_step": 329915, "epoch": 1963} {"train_loss": -12.219327926635742, "global_step": 329916, "epoch": 1963} {"train_loss": -12.300118446350098, "global_step": 329917, "epoch": 1963} {"train_loss": -12.218040466308594, "global_step": 329918, "epoch": 1963} {"train_loss": -12.296526908874512, "global_step": 329919, "epoch": 1963} {"train_loss": -12.268516540527344, "global_step": 329920, "epoch": 1963} {"train_loss": -12.169242858886719, "global_step": 329921, "epoch": 1963} {"train_loss": -12.169950485229492, "global_step": 329922, "epoch": 1963} {"train_loss": -12.15707778930664, "global_step": 329923, "epoch": 1963} {"train_loss": -12.00529670715332, "global_step": 329924, "epoch": 1963} {"train_loss": -11.588479995727539, "global_step": 329925, "epoch": 1963} {"train_loss": -11.272676467895508, "global_step": 329926, "epoch": 1963} {"train_loss": -10.331489562988281, "global_step": 329927, "epoch": 1963} {"train_loss": -11.636529922485352, "global_step": 329928, "epoch": 1963} {"train_loss": -9.469806671142578, "global_step": 329929, "epoch": 1963} {"train_loss": -11.491944313049316, "global_step": 329930, "epoch": 1963} {"train_loss": -10.878484725952148, "global_step": 329931, "epoch": 1963} {"train_loss": -10.485977172851562, "global_step": 329932, "epoch": 1963} {"train_loss": -11.079774856567383, "global_step": 329933, "epoch": 1963} {"train_loss": -9.634347915649414, "global_step": 329934, "epoch": 1963} {"train_loss": -11.434356689453125, "global_step": 329935, "epoch": 1963} {"train_loss": -10.01762580871582, "global_step": 329936, "epoch": 1963} {"train_loss": -11.041394233703613, "global_step": 329937, "epoch": 1963} {"train_loss": -10.832220077514648, "global_step": 329938, "epoch": 1963} {"train_loss": -11.996259689331055, "global_step": 329939, "epoch": 1963} {"train_loss": -10.679573059082031, "global_step": 329940, "epoch": 1963} {"train_loss": -11.653202056884766, "global_step": 329941, "epoch": 1963} {"train_loss": -11.897509574890137, "global_step": 329942, "epoch": 1963} {"train_loss": -11.695219993591309, "global_step": 329943, "epoch": 1963} {"train_loss": -12.186967849731445, "global_step": 329944, "epoch": 1963} {"train_loss": -11.021773338317871, "global_step": 329945, "epoch": 1963} {"train_loss": -12.104825973510742, "global_step": 329946, "epoch": 1963} {"train_loss": -11.678653717041016, "global_step": 329947, "epoch": 1963} {"train_loss": -11.988783836364746, "global_step": 329948, "epoch": 1963} {"train_loss": -11.787283897399902, "global_step": 329949, "epoch": 1963} {"train_loss": -11.954614639282227, "global_step": 329950, "epoch": 1963} {"train_loss": -11.683726872716631, "global_step": 329951, "epoch": 1963, "val_loss": 285614.25} {"train_loss": -12.26771354675293, "global_step": 329952, "epoch": 1964} {"train_loss": -11.836650848388672, "global_step": 329953, "epoch": 1964} {"train_loss": -12.188013076782227, "global_step": 329954, "epoch": 1964} {"train_loss": -11.914714813232422, "global_step": 329955, "epoch": 1964} {"train_loss": -12.348270416259766, "global_step": 329956, "epoch": 1964} {"train_loss": -11.918256759643555, "global_step": 329957, "epoch": 1964} {"train_loss": -11.894428253173828, "global_step": 329958, "epoch": 1964} {"train_loss": -11.837617874145508, "global_step": 329959, "epoch": 1964} {"train_loss": -12.075881004333496, "global_step": 329960, "epoch": 1964} {"train_loss": -12.137048721313477, "global_step": 329961, "epoch": 1964} {"train_loss": -11.605060577392578, "global_step": 329962, "epoch": 1964} {"train_loss": -12.270817756652832, "global_step": 329963, "epoch": 1964} {"train_loss": -11.23584270477295, "global_step": 329964, "epoch": 1964} {"train_loss": -12.099494934082031, "global_step": 329965, "epoch": 1964} {"train_loss": -11.813047409057617, "global_step": 329966, "epoch": 1964} {"train_loss": -12.091838836669922, "global_step": 329967, "epoch": 1964} {"train_loss": -12.095866203308105, "global_step": 329968, "epoch": 1964} {"train_loss": -12.1063871383667, "global_step": 329969, "epoch": 1964} {"train_loss": -12.223388671875, "global_step": 329970, "epoch": 1964} {"train_loss": -12.009660720825195, "global_step": 329971, "epoch": 1964} {"train_loss": -12.06303596496582, "global_step": 329972, "epoch": 1964} {"train_loss": -12.299158096313477, "global_step": 329973, "epoch": 1964} {"train_loss": -12.172587394714355, "global_step": 329974, "epoch": 1964} {"train_loss": -12.31973934173584, "global_step": 329975, "epoch": 1964} {"train_loss": -12.313663482666016, "global_step": 329976, "epoch": 1964} {"train_loss": -12.275918960571289, "global_step": 329977, "epoch": 1964} {"train_loss": -12.260038375854492, "global_step": 329978, "epoch": 1964} {"train_loss": -12.178743362426758, "global_step": 329979, "epoch": 1964} {"train_loss": -12.366059303283691, "global_step": 329980, "epoch": 1964} {"train_loss": -12.120721817016602, "global_step": 329981, "epoch": 1964} {"train_loss": -12.26848030090332, "global_step": 329982, "epoch": 1964} {"train_loss": -12.113040924072266, "global_step": 329983, "epoch": 1964} {"train_loss": -12.518677711486816, "global_step": 329984, "epoch": 1964} {"train_loss": -12.205606460571289, "global_step": 329985, "epoch": 1964} {"train_loss": -12.317658424377441, "global_step": 329986, "epoch": 1964} {"train_loss": -12.413561820983887, "global_step": 329987, "epoch": 1964} {"train_loss": -12.030957221984863, "global_step": 329988, "epoch": 1964} {"train_loss": -12.50051212310791, "global_step": 329989, "epoch": 1964} {"train_loss": -12.145286560058594, "global_step": 329990, "epoch": 1964} {"train_loss": -12.397150039672852, "global_step": 329991, "epoch": 1964} {"train_loss": -12.443599700927734, "global_step": 329992, "epoch": 1964} {"train_loss": -12.217642784118652, "global_step": 329993, "epoch": 1964} {"train_loss": -12.674741744995117, "global_step": 329994, "epoch": 1964} {"train_loss": -12.360612869262695, "global_step": 329995, "epoch": 1964} {"train_loss": -12.403885841369629, "global_step": 329996, "epoch": 1964} {"train_loss": -12.329405784606934, "global_step": 329997, "epoch": 1964} {"train_loss": -12.282791137695312, "global_step": 329998, "epoch": 1964} {"train_loss": -12.312807083129883, "global_step": 329999, "epoch": 1964} {"train_loss": -12.45174789428711, "global_step": 330000, "epoch": 1964} {"train_loss": -12.51574420928955, "global_step": 330001, "epoch": 1964} {"train_loss": -12.49995231628418, "global_step": 330002, "epoch": 1964} {"train_loss": -12.093165397644043, "global_step": 330003, "epoch": 1964} {"train_loss": -12.322481155395508, "global_step": 330004, "epoch": 1964} {"train_loss": -12.392352104187012, "global_step": 330005, "epoch": 1964} {"train_loss": -12.312231063842773, "global_step": 330006, "epoch": 1964} {"train_loss": -12.507516860961914, "global_step": 330007, "epoch": 1964} {"train_loss": -12.391222953796387, "global_step": 330008, "epoch": 1964} {"train_loss": -11.884612083435059, "global_step": 330009, "epoch": 1964} {"train_loss": -12.512226104736328, "global_step": 330010, "epoch": 1964} {"train_loss": -12.53552532196045, "global_step": 330011, "epoch": 1964} {"train_loss": -12.372785568237305, "global_step": 330012, "epoch": 1964} {"train_loss": -12.382528305053711, "global_step": 330013, "epoch": 1964} {"train_loss": -12.65107536315918, "global_step": 330014, "epoch": 1964} {"train_loss": -12.24432373046875, "global_step": 330015, "epoch": 1964} {"train_loss": -12.39307689666748, "global_step": 330016, "epoch": 1964} {"train_loss": -12.548513412475586, "global_step": 330017, "epoch": 1964} {"train_loss": -12.375253677368164, "global_step": 330018, "epoch": 1964} {"train_loss": -12.575121879577637, "global_step": 330019, "epoch": 1964} {"train_loss": -12.299381256103516, "global_step": 330020, "epoch": 1964} {"train_loss": -12.254484176635742, "global_step": 330021, "epoch": 1964} {"train_loss": -12.327911376953125, "global_step": 330022, "epoch": 1964} {"train_loss": -12.12945556640625, "global_step": 330023, "epoch": 1964} {"train_loss": -12.500144958496094, "global_step": 330024, "epoch": 1964} {"train_loss": -12.228431701660156, "global_step": 330025, "epoch": 1964} {"train_loss": -12.592947006225586, "global_step": 330026, "epoch": 1964} {"train_loss": -11.969310760498047, "global_step": 330027, "epoch": 1964} {"train_loss": -11.102975845336914, "global_step": 330028, "epoch": 1964} {"train_loss": -10.538034439086914, "global_step": 330029, "epoch": 1964} {"train_loss": -9.763049125671387, "global_step": 330030, "epoch": 1964} {"train_loss": -9.484635353088379, "global_step": 330031, "epoch": 1964} {"train_loss": -9.112029075622559, "global_step": 330032, "epoch": 1964} {"train_loss": -10.193504333496094, "global_step": 330033, "epoch": 1964} {"train_loss": -10.253898620605469, "global_step": 330034, "epoch": 1964} {"train_loss": -9.46929931640625, "global_step": 330035, "epoch": 1964} {"train_loss": -11.36784553527832, "global_step": 330036, "epoch": 1964} {"train_loss": -10.917576789855957, "global_step": 330037, "epoch": 1964} {"train_loss": -10.277080535888672, "global_step": 330038, "epoch": 1964} {"train_loss": -11.156730651855469, "global_step": 330039, "epoch": 1964} {"train_loss": -11.04481315612793, "global_step": 330040, "epoch": 1964} {"train_loss": -11.26784896850586, "global_step": 330041, "epoch": 1964} {"train_loss": -11.173431396484375, "global_step": 330042, "epoch": 1964} {"train_loss": -11.155923843383789, "global_step": 330043, "epoch": 1964} {"train_loss": -11.151577949523926, "global_step": 330044, "epoch": 1964} {"train_loss": -10.26738166809082, "global_step": 330045, "epoch": 1964} {"train_loss": -12.024538040161133, "global_step": 330046, "epoch": 1964} {"train_loss": -10.39765739440918, "global_step": 330047, "epoch": 1964} {"train_loss": -10.71601676940918, "global_step": 330048, "epoch": 1964} {"train_loss": -10.707157135009766, "global_step": 330049, "epoch": 1964} {"train_loss": -10.166584014892578, "global_step": 330050, "epoch": 1964} {"train_loss": -10.314172744750977, "global_step": 330051, "epoch": 1964} {"train_loss": -10.582195281982422, "global_step": 330052, "epoch": 1964} {"train_loss": -9.930356979370117, "global_step": 330053, "epoch": 1964} {"train_loss": -10.230955123901367, "global_step": 330054, "epoch": 1964} {"train_loss": -10.969644546508789, "global_step": 330055, "epoch": 1964} {"train_loss": -10.183234214782715, "global_step": 330056, "epoch": 1964} {"train_loss": -11.216907501220703, "global_step": 330057, "epoch": 1964} {"train_loss": -10.578174591064453, "global_step": 330058, "epoch": 1964} {"train_loss": -9.648804664611816, "global_step": 330059, "epoch": 1964} {"train_loss": -11.81126880645752, "global_step": 330060, "epoch": 1964} {"train_loss": -10.609933853149414, "global_step": 330061, "epoch": 1964} {"train_loss": -10.832067489624023, "global_step": 330062, "epoch": 1964} {"train_loss": -10.870582580566406, "global_step": 330063, "epoch": 1964} {"train_loss": -11.67402458190918, "global_step": 330064, "epoch": 1964} {"train_loss": -10.33575439453125, "global_step": 330065, "epoch": 1964} {"train_loss": -11.348133087158203, "global_step": 330066, "epoch": 1964} {"train_loss": -11.292680740356445, "global_step": 330067, "epoch": 1964} {"train_loss": -11.162637710571289, "global_step": 330068, "epoch": 1964} {"train_loss": -11.689220428466797, "global_step": 330069, "epoch": 1964} {"train_loss": -11.733232498168945, "global_step": 330070, "epoch": 1964} {"train_loss": -11.678472518920898, "global_step": 330071, "epoch": 1964} {"train_loss": -11.906553268432617, "global_step": 330072, "epoch": 1964} {"train_loss": -11.926349639892578, "global_step": 330073, "epoch": 1964} {"train_loss": -11.597137451171875, "global_step": 330074, "epoch": 1964} {"train_loss": -11.69615364074707, "global_step": 330075, "epoch": 1964} {"train_loss": -11.808725357055664, "global_step": 330076, "epoch": 1964} {"train_loss": -11.811315536499023, "global_step": 330077, "epoch": 1964} {"train_loss": -11.782572746276855, "global_step": 330078, "epoch": 1964} {"train_loss": -12.076930046081543, "global_step": 330079, "epoch": 1964} {"train_loss": -11.715917587280273, "global_step": 330080, "epoch": 1964} {"train_loss": -11.991463661193848, "global_step": 330081, "epoch": 1964} {"train_loss": -11.647859573364258, "global_step": 330082, "epoch": 1964} {"train_loss": -12.11128044128418, "global_step": 330083, "epoch": 1964} {"train_loss": -12.09814453125, "global_step": 330084, "epoch": 1964} {"train_loss": -11.949678421020508, "global_step": 330085, "epoch": 1964} {"train_loss": -12.381399154663086, "global_step": 330086, "epoch": 1964} {"train_loss": -11.875335693359375, "global_step": 330087, "epoch": 1964} {"train_loss": -12.355655670166016, "global_step": 330088, "epoch": 1964} {"train_loss": -12.073321342468262, "global_step": 330089, "epoch": 1964} {"train_loss": -12.136871337890625, "global_step": 330090, "epoch": 1964} {"train_loss": -11.729009628295898, "global_step": 330091, "epoch": 1964} {"train_loss": -12.132139205932617, "global_step": 330092, "epoch": 1964} {"train_loss": -12.135540008544922, "global_step": 330093, "epoch": 1964} {"train_loss": -11.937870025634766, "global_step": 330094, "epoch": 1964} {"train_loss": -12.022045135498047, "global_step": 330095, "epoch": 1964} {"train_loss": -12.133077621459961, "global_step": 330096, "epoch": 1964} {"train_loss": -12.011061668395996, "global_step": 330097, "epoch": 1964} {"train_loss": -12.129968643188477, "global_step": 330098, "epoch": 1964} {"train_loss": -11.978435516357422, "global_step": 330099, "epoch": 1964} {"train_loss": -11.383995056152344, "global_step": 330100, "epoch": 1964} {"train_loss": -12.006160736083984, "global_step": 330101, "epoch": 1964} {"train_loss": -12.203818321228027, "global_step": 330102, "epoch": 1964} {"train_loss": -11.927851676940918, "global_step": 330103, "epoch": 1964} {"train_loss": -12.122417449951172, "global_step": 330104, "epoch": 1964} {"train_loss": -11.936983108520508, "global_step": 330105, "epoch": 1964} {"train_loss": -12.275527954101562, "global_step": 330106, "epoch": 1964} {"train_loss": -11.820744514465332, "global_step": 330107, "epoch": 1964} {"train_loss": -11.960765838623047, "global_step": 330108, "epoch": 1964} {"train_loss": -12.157054901123047, "global_step": 330109, "epoch": 1964} {"train_loss": -12.0196533203125, "global_step": 330110, "epoch": 1964} {"train_loss": -12.341451644897461, "global_step": 330111, "epoch": 1964} {"train_loss": -12.111284255981445, "global_step": 330112, "epoch": 1964} {"train_loss": -11.968082427978516, "global_step": 330113, "epoch": 1964} {"train_loss": -12.177687644958496, "global_step": 330114, "epoch": 1964} {"train_loss": -11.993663787841797, "global_step": 330115, "epoch": 1964} {"train_loss": -12.317571640014648, "global_step": 330116, "epoch": 1964} {"train_loss": -12.416132926940918, "global_step": 330117, "epoch": 1964} {"train_loss": -11.972381591796875, "global_step": 330118, "epoch": 1964} {"train_loss": -11.783186895506722, "global_step": 330119, "epoch": 1964, "val_loss": 289441.71875} {"train_loss": -12.348922729492188, "global_step": 330120, "epoch": 1965} {"train_loss": -12.173725128173828, "global_step": 330121, "epoch": 1965} {"train_loss": -12.25244140625, "global_step": 330122, "epoch": 1965} {"train_loss": -12.330577850341797, "global_step": 330123, "epoch": 1965} {"train_loss": -12.198673248291016, "global_step": 330124, "epoch": 1965} {"train_loss": -12.334142684936523, "global_step": 330125, "epoch": 1965} {"train_loss": -12.281997680664062, "global_step": 330126, "epoch": 1965} {"train_loss": -12.089229583740234, "global_step": 330127, "epoch": 1965} {"train_loss": -12.16079330444336, "global_step": 330128, "epoch": 1965} {"train_loss": -12.25932502746582, "global_step": 330129, "epoch": 1965} {"train_loss": -12.31928825378418, "global_step": 330130, "epoch": 1965} {"train_loss": -12.400423049926758, "global_step": 330131, "epoch": 1965} {"train_loss": -12.277016639709473, "global_step": 330132, "epoch": 1965} {"train_loss": -12.529172897338867, "global_step": 330133, "epoch": 1965} {"train_loss": -12.6339750289917, "global_step": 330134, "epoch": 1965} {"train_loss": -12.252918243408203, "global_step": 330135, "epoch": 1965} {"train_loss": -11.902036666870117, "global_step": 330136, "epoch": 1965} {"train_loss": -12.286452293395996, "global_step": 330137, "epoch": 1965} {"train_loss": -12.318986892700195, "global_step": 330138, "epoch": 1965} {"train_loss": -12.18238639831543, "global_step": 330139, "epoch": 1965} {"train_loss": -12.337881088256836, "global_step": 330140, "epoch": 1965} {"train_loss": -12.067144393920898, "global_step": 330141, "epoch": 1965} {"train_loss": -12.392292022705078, "global_step": 330142, "epoch": 1965} {"train_loss": -12.361282348632812, "global_step": 330143, "epoch": 1965} {"train_loss": -12.26282024383545, "global_step": 330144, "epoch": 1965} {"train_loss": -12.304071426391602, "global_step": 330145, "epoch": 1965} {"train_loss": -11.853531837463379, "global_step": 330146, "epoch": 1965} {"train_loss": -12.15084171295166, "global_step": 330147, "epoch": 1965} {"train_loss": -11.949033737182617, "global_step": 330148, "epoch": 1965} {"train_loss": -11.908214569091797, "global_step": 330149, "epoch": 1965} {"train_loss": -12.206498146057129, "global_step": 330150, "epoch": 1965} {"train_loss": -12.207084655761719, "global_step": 330151, "epoch": 1965} {"train_loss": -11.88487434387207, "global_step": 330152, "epoch": 1965} {"train_loss": -12.352813720703125, "global_step": 330153, "epoch": 1965} {"train_loss": -12.100396156311035, "global_step": 330154, "epoch": 1965} {"train_loss": -11.541597366333008, "global_step": 330155, "epoch": 1965} {"train_loss": -12.13451862335205, "global_step": 330156, "epoch": 1965} {"train_loss": -12.330413818359375, "global_step": 330157, "epoch": 1965} {"train_loss": -12.342777252197266, "global_step": 330158, "epoch": 1965} {"train_loss": -12.077508926391602, "global_step": 330159, "epoch": 1965} {"train_loss": -12.337931632995605, "global_step": 330160, "epoch": 1965} {"train_loss": -11.865160942077637, "global_step": 330161, "epoch": 1965} {"train_loss": -12.267919540405273, "global_step": 330162, "epoch": 1965} {"train_loss": -12.097460746765137, "global_step": 330163, "epoch": 1965} {"train_loss": -12.333819389343262, "global_step": 330164, "epoch": 1965} {"train_loss": -12.528375625610352, "global_step": 330165, "epoch": 1965} {"train_loss": -12.374309539794922, "global_step": 330166, "epoch": 1965} {"train_loss": -12.507627487182617, "global_step": 330167, "epoch": 1965} {"train_loss": -12.167964935302734, "global_step": 330168, "epoch": 1965} {"train_loss": -12.321575164794922, "global_step": 330169, "epoch": 1965} {"train_loss": -12.392935752868652, "global_step": 330170, "epoch": 1965} {"train_loss": -11.97415542602539, "global_step": 330171, "epoch": 1965} {"train_loss": -11.891263961791992, "global_step": 330172, "epoch": 1965} {"train_loss": -11.967403411865234, "global_step": 330173, "epoch": 1965} {"train_loss": -12.53256607055664, "global_step": 330174, "epoch": 1965} {"train_loss": -11.1132173538208, "global_step": 330175, "epoch": 1965} {"train_loss": -10.563526153564453, "global_step": 330176, "epoch": 1965} {"train_loss": -11.94737434387207, "global_step": 330177, "epoch": 1965} {"train_loss": -11.96076774597168, "global_step": 330178, "epoch": 1965} {"train_loss": -11.03532886505127, "global_step": 330179, "epoch": 1965} {"train_loss": -11.189306259155273, "global_step": 330180, "epoch": 1965} {"train_loss": -12.060457229614258, "global_step": 330181, "epoch": 1965} {"train_loss": -10.011384963989258, "global_step": 330182, "epoch": 1965} {"train_loss": -12.194703102111816, "global_step": 330183, "epoch": 1965} {"train_loss": -10.007061004638672, "global_step": 330184, "epoch": 1965} {"train_loss": -9.975528717041016, "global_step": 330185, "epoch": 1965} {"train_loss": -11.547579765319824, "global_step": 330186, "epoch": 1965} {"train_loss": -10.988615036010742, "global_step": 330187, "epoch": 1965} {"train_loss": -10.105525016784668, "global_step": 330188, "epoch": 1965} {"train_loss": -11.062482833862305, "global_step": 330189, "epoch": 1965} {"train_loss": -10.69742488861084, "global_step": 330190, "epoch": 1965} {"train_loss": -10.481348037719727, "global_step": 330191, "epoch": 1965} {"train_loss": -10.746556282043457, "global_step": 330192, "epoch": 1965} {"train_loss": -10.754980087280273, "global_step": 330193, "epoch": 1965} {"train_loss": -10.494040489196777, "global_step": 330194, "epoch": 1965} {"train_loss": -10.870231628417969, "global_step": 330195, "epoch": 1965} {"train_loss": -10.14531135559082, "global_step": 330196, "epoch": 1965} {"train_loss": -10.664093017578125, "global_step": 330197, "epoch": 1965} {"train_loss": -11.217735290527344, "global_step": 330198, "epoch": 1965} {"train_loss": -10.454120635986328, "global_step": 330199, "epoch": 1965} {"train_loss": -11.441308975219727, "global_step": 330200, "epoch": 1965} {"train_loss": -10.631917953491211, "global_step": 330201, "epoch": 1965} {"train_loss": -10.919303894042969, "global_step": 330202, "epoch": 1965} {"train_loss": -10.998552322387695, "global_step": 330203, "epoch": 1965} {"train_loss": -10.223093032836914, "global_step": 330204, "epoch": 1965} {"train_loss": -11.234294891357422, "global_step": 330205, "epoch": 1965} {"train_loss": -10.951519012451172, "global_step": 330206, "epoch": 1965} {"train_loss": -11.028310775756836, "global_step": 330207, "epoch": 1965} {"train_loss": -10.813579559326172, "global_step": 330208, "epoch": 1965} {"train_loss": -11.39923095703125, "global_step": 330209, "epoch": 1965} {"train_loss": -12.026592254638672, "global_step": 330210, "epoch": 1965} {"train_loss": -11.63784408569336, "global_step": 330211, "epoch": 1965} {"train_loss": -11.71218204498291, "global_step": 330212, "epoch": 1965} {"train_loss": -11.346919059753418, "global_step": 330213, "epoch": 1965} {"train_loss": -11.845319747924805, "global_step": 330214, "epoch": 1965} {"train_loss": -11.782720565795898, "global_step": 330215, "epoch": 1965} {"train_loss": -11.880779266357422, "global_step": 330216, "epoch": 1965} {"train_loss": -11.945779800415039, "global_step": 330217, "epoch": 1965} {"train_loss": -11.846384048461914, "global_step": 330218, "epoch": 1965} {"train_loss": -12.08654499053955, "global_step": 330219, "epoch": 1965} {"train_loss": -11.872230529785156, "global_step": 330220, "epoch": 1965} {"train_loss": -12.097457885742188, "global_step": 330221, "epoch": 1965} {"train_loss": -11.741209983825684, "global_step": 330222, "epoch": 1965} {"train_loss": -12.027576446533203, "global_step": 330223, "epoch": 1965} {"train_loss": -11.818195343017578, "global_step": 330224, "epoch": 1965} {"train_loss": -12.06100845336914, "global_step": 330225, "epoch": 1965} {"train_loss": -12.018082618713379, "global_step": 330226, "epoch": 1965} {"train_loss": -12.120620727539062, "global_step": 330227, "epoch": 1965} {"train_loss": -11.92671012878418, "global_step": 330228, "epoch": 1965} {"train_loss": -12.066122055053711, "global_step": 330229, "epoch": 1965} {"train_loss": -12.092208862304688, "global_step": 330230, "epoch": 1965} {"train_loss": -12.203445434570312, "global_step": 330231, "epoch": 1965} {"train_loss": -12.071256637573242, "global_step": 330232, "epoch": 1965} {"train_loss": -12.113818168640137, "global_step": 330233, "epoch": 1965} {"train_loss": -12.250340461730957, "global_step": 330234, "epoch": 1965} {"train_loss": -12.047259330749512, "global_step": 330235, "epoch": 1965} {"train_loss": -12.1592435836792, "global_step": 330236, "epoch": 1965} {"train_loss": -12.056838989257812, "global_step": 330237, "epoch": 1965} {"train_loss": -12.31026840209961, "global_step": 330238, "epoch": 1965} {"train_loss": -11.968223571777344, "global_step": 330239, "epoch": 1965} {"train_loss": -12.415449142456055, "global_step": 330240, "epoch": 1965} {"train_loss": -12.091898918151855, "global_step": 330241, "epoch": 1965} {"train_loss": -12.167219161987305, "global_step": 330242, "epoch": 1965} {"train_loss": -12.074002265930176, "global_step": 330243, "epoch": 1965} {"train_loss": -12.202041625976562, "global_step": 330244, "epoch": 1965} {"train_loss": -12.421730995178223, "global_step": 330245, "epoch": 1965} {"train_loss": -12.125749588012695, "global_step": 330246, "epoch": 1965} {"train_loss": -12.618145942687988, "global_step": 330247, "epoch": 1965} {"train_loss": -12.349640846252441, "global_step": 330248, "epoch": 1965} {"train_loss": -12.490265846252441, "global_step": 330249, "epoch": 1965} {"train_loss": -12.467840194702148, "global_step": 330250, "epoch": 1965} {"train_loss": -12.283791542053223, "global_step": 330251, "epoch": 1965} {"train_loss": -12.372247695922852, "global_step": 330252, "epoch": 1965} {"train_loss": -12.40249252319336, "global_step": 330253, "epoch": 1965} {"train_loss": -12.352177619934082, "global_step": 330254, "epoch": 1965} {"train_loss": -12.414009094238281, "global_step": 330255, "epoch": 1965} {"train_loss": -12.193801879882812, "global_step": 330256, "epoch": 1965} {"train_loss": -12.336353302001953, "global_step": 330257, "epoch": 1965} {"train_loss": -12.266914367675781, "global_step": 330258, "epoch": 1965} {"train_loss": -11.98434066772461, "global_step": 330259, "epoch": 1965} {"train_loss": -12.003732681274414, "global_step": 330260, "epoch": 1965} {"train_loss": -12.179901123046875, "global_step": 330261, "epoch": 1965} {"train_loss": -12.028419494628906, "global_step": 330262, "epoch": 1965} {"train_loss": -12.17248821258545, "global_step": 330263, "epoch": 1965} {"train_loss": -12.172466278076172, "global_step": 330264, "epoch": 1965} {"train_loss": -12.080154418945312, "global_step": 330265, "epoch": 1965} {"train_loss": -12.105783462524414, "global_step": 330266, "epoch": 1965} {"train_loss": -12.39094066619873, "global_step": 330267, "epoch": 1965} {"train_loss": -12.100980758666992, "global_step": 330268, "epoch": 1965} {"train_loss": -12.215282440185547, "global_step": 330269, "epoch": 1965} {"train_loss": -12.12027645111084, "global_step": 330270, "epoch": 1965} {"train_loss": -12.49278450012207, "global_step": 330271, "epoch": 1965} {"train_loss": -12.222631454467773, "global_step": 330272, "epoch": 1965} {"train_loss": -12.144445419311523, "global_step": 330273, "epoch": 1965} {"train_loss": -12.37397289276123, "global_step": 330274, "epoch": 1965} {"train_loss": -12.616158485412598, "global_step": 330275, "epoch": 1965} {"train_loss": -12.55274772644043, "global_step": 330276, "epoch": 1965} {"train_loss": -12.349081039428711, "global_step": 330277, "epoch": 1965} {"train_loss": -12.373323440551758, "global_step": 330278, "epoch": 1965} {"train_loss": -12.518718719482422, "global_step": 330279, "epoch": 1965} {"train_loss": -12.316753387451172, "global_step": 330280, "epoch": 1965} {"train_loss": -12.432689666748047, "global_step": 330281, "epoch": 1965} {"train_loss": -12.51447868347168, "global_step": 330282, "epoch": 1965} {"train_loss": -12.591339111328125, "global_step": 330283, "epoch": 1965} {"train_loss": -12.185583114624023, "global_step": 330284, "epoch": 1965} {"train_loss": -12.623270988464355, "global_step": 330285, "epoch": 1965} {"train_loss": -12.393712997436523, "global_step": 330286, "epoch": 1965} {"train_loss": -11.922999052774339, "global_step": 330287, "epoch": 1965, "val_loss": 286084.6875, "train_action_mse_error": 1.2778494358062744} {"train_loss": -12.184320449829102, "global_step": 330288, "epoch": 1966} {"train_loss": -12.497455596923828, "global_step": 330289, "epoch": 1966} {"train_loss": -12.45754623413086, "global_step": 330290, "epoch": 1966} {"train_loss": -12.573017120361328, "global_step": 330291, "epoch": 1966} {"train_loss": -12.306861877441406, "global_step": 330292, "epoch": 1966} {"train_loss": -12.601115226745605, "global_step": 330293, "epoch": 1966} {"train_loss": -12.519530296325684, "global_step": 330294, "epoch": 1966} {"train_loss": -12.492080688476562, "global_step": 330295, "epoch": 1966} {"train_loss": -12.406407356262207, "global_step": 330296, "epoch": 1966} {"train_loss": -12.406070709228516, "global_step": 330297, "epoch": 1966} {"train_loss": -12.323013305664062, "global_step": 330298, "epoch": 1966} {"train_loss": -12.488714218139648, "global_step": 330299, "epoch": 1966} {"train_loss": -12.671201705932617, "global_step": 330300, "epoch": 1966} {"train_loss": -12.196996688842773, "global_step": 330301, "epoch": 1966} {"train_loss": -12.24917984008789, "global_step": 330302, "epoch": 1966} {"train_loss": -12.467406272888184, "global_step": 330303, "epoch": 1966} {"train_loss": -12.429697036743164, "global_step": 330304, "epoch": 1966} {"train_loss": -12.116032600402832, "global_step": 330305, "epoch": 1966} {"train_loss": -12.072439193725586, "global_step": 330306, "epoch": 1966} {"train_loss": -12.387609481811523, "global_step": 330307, "epoch": 1966} {"train_loss": -12.367547988891602, "global_step": 330308, "epoch": 1966} {"train_loss": -12.252695083618164, "global_step": 330309, "epoch": 1966} {"train_loss": -12.06249713897705, "global_step": 330310, "epoch": 1966} {"train_loss": -12.174409866333008, "global_step": 330311, "epoch": 1966} {"train_loss": -12.042850494384766, "global_step": 330312, "epoch": 1966} {"train_loss": -10.65645980834961, "global_step": 330313, "epoch": 1966} {"train_loss": -11.312230110168457, "global_step": 330314, "epoch": 1966} {"train_loss": -11.967453002929688, "global_step": 330315, "epoch": 1966} {"train_loss": -12.08181095123291, "global_step": 330316, "epoch": 1966} {"train_loss": -11.19923210144043, "global_step": 330317, "epoch": 1966} {"train_loss": -11.648719787597656, "global_step": 330318, "epoch": 1966} {"train_loss": -12.017131805419922, "global_step": 330319, "epoch": 1966} {"train_loss": -12.030923843383789, "global_step": 330320, "epoch": 1966} {"train_loss": -11.022525787353516, "global_step": 330321, "epoch": 1966} {"train_loss": -11.638501167297363, "global_step": 330322, "epoch": 1966} {"train_loss": -11.677154541015625, "global_step": 330323, "epoch": 1966} {"train_loss": -11.61896800994873, "global_step": 330324, "epoch": 1966} {"train_loss": -12.027435302734375, "global_step": 330325, "epoch": 1966} {"train_loss": -11.269878387451172, "global_step": 330326, "epoch": 1966} {"train_loss": -11.69888973236084, "global_step": 330327, "epoch": 1966} {"train_loss": -11.674076080322266, "global_step": 330328, "epoch": 1966} {"train_loss": -9.974701881408691, "global_step": 330329, "epoch": 1966} {"train_loss": -10.673822402954102, "global_step": 330330, "epoch": 1966} {"train_loss": -10.224905014038086, "global_step": 330331, "epoch": 1966} {"train_loss": -10.317028999328613, "global_step": 330332, "epoch": 1966} {"train_loss": -10.895608901977539, "global_step": 330333, "epoch": 1966} {"train_loss": -10.427911758422852, "global_step": 330334, "epoch": 1966} {"train_loss": -9.654512405395508, "global_step": 330335, "epoch": 1966} {"train_loss": -11.072065353393555, "global_step": 330336, "epoch": 1966} {"train_loss": -11.404695510864258, "global_step": 330337, "epoch": 1966} {"train_loss": -10.627874374389648, "global_step": 330338, "epoch": 1966} {"train_loss": -11.88001823425293, "global_step": 330339, "epoch": 1966} {"train_loss": -11.51430892944336, "global_step": 330340, "epoch": 1966} {"train_loss": -10.62100601196289, "global_step": 330341, "epoch": 1966} {"train_loss": -11.910697937011719, "global_step": 330342, "epoch": 1966} {"train_loss": -10.682228088378906, "global_step": 330343, "epoch": 1966} {"train_loss": -11.592205047607422, "global_step": 330344, "epoch": 1966} {"train_loss": -11.388638496398926, "global_step": 330345, "epoch": 1966} {"train_loss": -10.016826629638672, "global_step": 330346, "epoch": 1966} {"train_loss": -11.073941230773926, "global_step": 330347, "epoch": 1966} {"train_loss": -10.80661392211914, "global_step": 330348, "epoch": 1966} {"train_loss": -11.309306144714355, "global_step": 330349, "epoch": 1966} {"train_loss": -10.689724922180176, "global_step": 330350, "epoch": 1966} {"train_loss": -10.94499397277832, "global_step": 330351, "epoch": 1966} {"train_loss": -11.766111373901367, "global_step": 330352, "epoch": 1966} {"train_loss": -10.92872428894043, "global_step": 330353, "epoch": 1966} {"train_loss": -11.682424545288086, "global_step": 330354, "epoch": 1966} {"train_loss": -11.271960258483887, "global_step": 330355, "epoch": 1966} {"train_loss": -11.654751777648926, "global_step": 330356, "epoch": 1966} {"train_loss": -11.74679183959961, "global_step": 330357, "epoch": 1966} {"train_loss": -11.39711856842041, "global_step": 330358, "epoch": 1966} {"train_loss": -11.550318717956543, "global_step": 330359, "epoch": 1966} {"train_loss": -11.485365867614746, "global_step": 330360, "epoch": 1966} {"train_loss": -11.016440391540527, "global_step": 330361, "epoch": 1966} {"train_loss": -11.821344375610352, "global_step": 330362, "epoch": 1966} {"train_loss": -11.172554016113281, "global_step": 330363, "epoch": 1966} {"train_loss": -12.233282089233398, "global_step": 330364, "epoch": 1966} {"train_loss": -11.200311660766602, "global_step": 330365, "epoch": 1966} {"train_loss": -11.493236541748047, "global_step": 330366, "epoch": 1966} {"train_loss": -11.496480941772461, "global_step": 330367, "epoch": 1966} {"train_loss": -11.565143585205078, "global_step": 330368, "epoch": 1966} {"train_loss": -11.757806777954102, "global_step": 330369, "epoch": 1966} {"train_loss": -11.73432731628418, "global_step": 330370, "epoch": 1966} {"train_loss": -11.564990997314453, "global_step": 330371, "epoch": 1966} {"train_loss": -12.197994232177734, "global_step": 330372, "epoch": 1966} {"train_loss": -11.70569133758545, "global_step": 330373, "epoch": 1966} {"train_loss": -11.890008926391602, "global_step": 330374, "epoch": 1966} {"train_loss": -11.868948936462402, "global_step": 330375, "epoch": 1966} {"train_loss": -11.447754859924316, "global_step": 330376, "epoch": 1966} {"train_loss": -11.911746978759766, "global_step": 330377, "epoch": 1966} {"train_loss": -11.5660982131958, "global_step": 330378, "epoch": 1966} {"train_loss": -11.791258811950684, "global_step": 330379, "epoch": 1966} {"train_loss": -11.765884399414062, "global_step": 330380, "epoch": 1966} {"train_loss": -11.60409927368164, "global_step": 330381, "epoch": 1966} {"train_loss": -11.888354301452637, "global_step": 330382, "epoch": 1966} {"train_loss": -11.631235122680664, "global_step": 330383, "epoch": 1966} {"train_loss": -12.068840026855469, "global_step": 330384, "epoch": 1966} {"train_loss": -11.831298828125, "global_step": 330385, "epoch": 1966} {"train_loss": -11.984095573425293, "global_step": 330386, "epoch": 1966} {"train_loss": -12.090251922607422, "global_step": 330387, "epoch": 1966} {"train_loss": -12.112957000732422, "global_step": 330388, "epoch": 1966} {"train_loss": -12.022054672241211, "global_step": 330389, "epoch": 1966} {"train_loss": -12.376848220825195, "global_step": 330390, "epoch": 1966} {"train_loss": -12.167642593383789, "global_step": 330391, "epoch": 1966} {"train_loss": -11.960698127746582, "global_step": 330392, "epoch": 1966} {"train_loss": -12.170233726501465, "global_step": 330393, "epoch": 1966} {"train_loss": -12.455629348754883, "global_step": 330394, "epoch": 1966} {"train_loss": -12.24411392211914, "global_step": 330395, "epoch": 1966} {"train_loss": -12.349176406860352, "global_step": 330396, "epoch": 1966} {"train_loss": -12.087444305419922, "global_step": 330397, "epoch": 1966} {"train_loss": -12.024943351745605, "global_step": 330398, "epoch": 1966} {"train_loss": -12.283554077148438, "global_step": 330399, "epoch": 1966} {"train_loss": -12.139982223510742, "global_step": 330400, "epoch": 1966} {"train_loss": -12.317522048950195, "global_step": 330401, "epoch": 1966} {"train_loss": -12.24288558959961, "global_step": 330402, "epoch": 1966} {"train_loss": -12.360699653625488, "global_step": 330403, "epoch": 1966} {"train_loss": -12.540338516235352, "global_step": 330404, "epoch": 1966} {"train_loss": -12.463068008422852, "global_step": 330405, "epoch": 1966} {"train_loss": -12.488574028015137, "global_step": 330406, "epoch": 1966} {"train_loss": -12.394234657287598, "global_step": 330407, "epoch": 1966} {"train_loss": -12.528857231140137, "global_step": 330408, "epoch": 1966} {"train_loss": -12.372580528259277, "global_step": 330409, "epoch": 1966} {"train_loss": -12.29775619506836, "global_step": 330410, "epoch": 1966} {"train_loss": -12.357963562011719, "global_step": 330411, "epoch": 1966} {"train_loss": -12.429757118225098, "global_step": 330412, "epoch": 1966} {"train_loss": -12.062882423400879, "global_step": 330413, "epoch": 1966} {"train_loss": -12.502477645874023, "global_step": 330414, "epoch": 1966} {"train_loss": -12.057472229003906, "global_step": 330415, "epoch": 1966} {"train_loss": -12.514043807983398, "global_step": 330416, "epoch": 1966} {"train_loss": -12.266122817993164, "global_step": 330417, "epoch": 1966} {"train_loss": -12.438385963439941, "global_step": 330418, "epoch": 1966} {"train_loss": -12.347204208374023, "global_step": 330419, "epoch": 1966} {"train_loss": -12.301684379577637, "global_step": 330420, "epoch": 1966} {"train_loss": -12.44543170928955, "global_step": 330421, "epoch": 1966} {"train_loss": -12.098337173461914, "global_step": 330422, "epoch": 1966} {"train_loss": -11.68478775024414, "global_step": 330423, "epoch": 1966} {"train_loss": -12.359000205993652, "global_step": 330424, "epoch": 1966} {"train_loss": -12.451608657836914, "global_step": 330425, "epoch": 1966} {"train_loss": -11.651050567626953, "global_step": 330426, "epoch": 1966} {"train_loss": -11.906195640563965, "global_step": 330427, "epoch": 1966} {"train_loss": -12.300714492797852, "global_step": 330428, "epoch": 1966} {"train_loss": -12.480415344238281, "global_step": 330429, "epoch": 1966} {"train_loss": -12.21821403503418, "global_step": 330430, "epoch": 1966} {"train_loss": -12.420259475708008, "global_step": 330431, "epoch": 1966} {"train_loss": -12.18341064453125, "global_step": 330432, "epoch": 1966} {"train_loss": -12.399218559265137, "global_step": 330433, "epoch": 1966} {"train_loss": -11.721813201904297, "global_step": 330434, "epoch": 1966} {"train_loss": -11.994428634643555, "global_step": 330435, "epoch": 1966} {"train_loss": -12.217412948608398, "global_step": 330436, "epoch": 1966} {"train_loss": -12.269888877868652, "global_step": 330437, "epoch": 1966} {"train_loss": -12.420568466186523, "global_step": 330438, "epoch": 1966} {"train_loss": -12.300107955932617, "global_step": 330439, "epoch": 1966} {"train_loss": -12.382097244262695, "global_step": 330440, "epoch": 1966} {"train_loss": -12.433871269226074, "global_step": 330441, "epoch": 1966} {"train_loss": -12.189141273498535, "global_step": 330442, "epoch": 1966} {"train_loss": -12.295806884765625, "global_step": 330443, "epoch": 1966} {"train_loss": -12.178333282470703, "global_step": 330444, "epoch": 1966} {"train_loss": -12.504883766174316, "global_step": 330445, "epoch": 1966} {"train_loss": -12.046445846557617, "global_step": 330446, "epoch": 1966} {"train_loss": -12.375167846679688, "global_step": 330447, "epoch": 1966} {"train_loss": -12.071162223815918, "global_step": 330448, "epoch": 1966} {"train_loss": -12.04445743560791, "global_step": 330449, "epoch": 1966} {"train_loss": -12.18625259399414, "global_step": 330450, "epoch": 1966} {"train_loss": -12.184846878051758, "global_step": 330451, "epoch": 1966} {"train_loss": -12.105781555175781, "global_step": 330452, "epoch": 1966} {"train_loss": -12.178688049316406, "global_step": 330453, "epoch": 1966} {"train_loss": -11.88974380493164, "global_step": 330454, "epoch": 1966} {"train_loss": -11.881266355514526, "global_step": 330455, "epoch": 1966, "val_loss": 286837.28125} {"train_loss": -12.193735122680664, "global_step": 330456, "epoch": 1967} {"train_loss": -12.262104034423828, "global_step": 330457, "epoch": 1967} {"train_loss": -11.803131103515625, "global_step": 330458, "epoch": 1967} {"train_loss": -12.517417907714844, "global_step": 330459, "epoch": 1967} {"train_loss": -11.99628734588623, "global_step": 330460, "epoch": 1967} {"train_loss": -12.477767944335938, "global_step": 330461, "epoch": 1967} {"train_loss": -11.857537269592285, "global_step": 330462, "epoch": 1967} {"train_loss": -12.279472351074219, "global_step": 330463, "epoch": 1967} {"train_loss": -11.552316665649414, "global_step": 330464, "epoch": 1967} {"train_loss": -12.385295867919922, "global_step": 330465, "epoch": 1967} {"train_loss": -12.132835388183594, "global_step": 330466, "epoch": 1967} {"train_loss": -12.285391807556152, "global_step": 330467, "epoch": 1967} {"train_loss": -12.311960220336914, "global_step": 330468, "epoch": 1967} {"train_loss": -12.480069160461426, "global_step": 330469, "epoch": 1967} {"train_loss": -12.173410415649414, "global_step": 330470, "epoch": 1967} {"train_loss": -12.282142639160156, "global_step": 330471, "epoch": 1967} {"train_loss": -12.250587463378906, "global_step": 330472, "epoch": 1967} {"train_loss": -11.893880844116211, "global_step": 330473, "epoch": 1967} {"train_loss": -11.851186752319336, "global_step": 330474, "epoch": 1967} {"train_loss": -11.942501068115234, "global_step": 330475, "epoch": 1967} {"train_loss": -12.345806121826172, "global_step": 330476, "epoch": 1967} {"train_loss": -12.171120643615723, "global_step": 330477, "epoch": 1967} {"train_loss": -11.573209762573242, "global_step": 330478, "epoch": 1967} {"train_loss": -11.178290367126465, "global_step": 330479, "epoch": 1967} {"train_loss": -11.709600448608398, "global_step": 330480, "epoch": 1967} {"train_loss": -12.228656768798828, "global_step": 330481, "epoch": 1967} {"train_loss": -10.999005317687988, "global_step": 330482, "epoch": 1967} {"train_loss": -11.276054382324219, "global_step": 330483, "epoch": 1967} {"train_loss": -11.791743278503418, "global_step": 330484, "epoch": 1967} {"train_loss": -9.939990997314453, "global_step": 330485, "epoch": 1967} {"train_loss": -10.76483154296875, "global_step": 330486, "epoch": 1967} {"train_loss": -11.495840072631836, "global_step": 330487, "epoch": 1967} {"train_loss": -10.040082931518555, "global_step": 330488, "epoch": 1967} {"train_loss": -9.020709991455078, "global_step": 330489, "epoch": 1967} {"train_loss": -9.92671012878418, "global_step": 330490, "epoch": 1967} {"train_loss": -10.796609878540039, "global_step": 330491, "epoch": 1967} {"train_loss": -10.28622055053711, "global_step": 330492, "epoch": 1967} {"train_loss": -9.480167388916016, "global_step": 330493, "epoch": 1967} {"train_loss": -11.159584045410156, "global_step": 330494, "epoch": 1967} {"train_loss": -11.041727066040039, "global_step": 330495, "epoch": 1967} {"train_loss": -11.03989315032959, "global_step": 330496, "epoch": 1967} {"train_loss": -11.160612106323242, "global_step": 330497, "epoch": 1967} {"train_loss": -11.63726806640625, "global_step": 330498, "epoch": 1967} {"train_loss": -10.526300430297852, "global_step": 330499, "epoch": 1967} {"train_loss": -11.299776077270508, "global_step": 330500, "epoch": 1967} {"train_loss": -10.77175521850586, "global_step": 330501, "epoch": 1967} {"train_loss": -11.509698867797852, "global_step": 330502, "epoch": 1967} {"train_loss": -10.773248672485352, "global_step": 330503, "epoch": 1967} {"train_loss": -11.339466094970703, "global_step": 330504, "epoch": 1967} {"train_loss": -11.407201766967773, "global_step": 330505, "epoch": 1967} {"train_loss": -10.889516830444336, "global_step": 330506, "epoch": 1967} {"train_loss": -11.040246963500977, "global_step": 330507, "epoch": 1967} {"train_loss": -10.743759155273438, "global_step": 330508, "epoch": 1967} {"train_loss": -8.6502685546875, "global_step": 330509, "epoch": 1967} {"train_loss": -11.740751266479492, "global_step": 330510, "epoch": 1967} {"train_loss": -9.537946701049805, "global_step": 330511, "epoch": 1967} {"train_loss": -11.47956657409668, "global_step": 330512, "epoch": 1967} {"train_loss": -10.102500915527344, "global_step": 330513, "epoch": 1967} {"train_loss": -11.644264221191406, "global_step": 330514, "epoch": 1967} {"train_loss": -10.27629280090332, "global_step": 330515, "epoch": 1967} {"train_loss": -11.651334762573242, "global_step": 330516, "epoch": 1967} {"train_loss": -10.527509689331055, "global_step": 330517, "epoch": 1967} {"train_loss": -11.288840293884277, "global_step": 330518, "epoch": 1967} {"train_loss": -10.536646842956543, "global_step": 330519, "epoch": 1967} {"train_loss": -11.561409950256348, "global_step": 330520, "epoch": 1967} {"train_loss": -10.383119583129883, "global_step": 330521, "epoch": 1967} {"train_loss": -11.575239181518555, "global_step": 330522, "epoch": 1967} {"train_loss": -11.158084869384766, "global_step": 330523, "epoch": 1967} {"train_loss": -11.531044006347656, "global_step": 330524, "epoch": 1967} {"train_loss": -11.384203910827637, "global_step": 330525, "epoch": 1967} {"train_loss": -11.044268608093262, "global_step": 330526, "epoch": 1967} {"train_loss": -11.334564208984375, "global_step": 330527, "epoch": 1967} {"train_loss": -11.23514175415039, "global_step": 330528, "epoch": 1967} {"train_loss": -11.967109680175781, "global_step": 330529, "epoch": 1967} {"train_loss": -11.037513732910156, "global_step": 330530, "epoch": 1967} {"train_loss": -12.06192684173584, "global_step": 330531, "epoch": 1967} {"train_loss": -11.42031192779541, "global_step": 330532, "epoch": 1967} {"train_loss": -11.709661483764648, "global_step": 330533, "epoch": 1967} {"train_loss": -11.355855941772461, "global_step": 330534, "epoch": 1967} {"train_loss": -11.554468154907227, "global_step": 330535, "epoch": 1967} {"train_loss": -11.846170425415039, "global_step": 330536, "epoch": 1967} {"train_loss": -11.597805976867676, "global_step": 330537, "epoch": 1967} {"train_loss": -11.855396270751953, "global_step": 330538, "epoch": 1967} {"train_loss": -11.482182502746582, "global_step": 330539, "epoch": 1967} {"train_loss": -12.162805557250977, "global_step": 330540, "epoch": 1967} {"train_loss": -11.658687591552734, "global_step": 330541, "epoch": 1967} {"train_loss": -12.026630401611328, "global_step": 330542, "epoch": 1967} {"train_loss": -11.758075714111328, "global_step": 330543, "epoch": 1967} {"train_loss": -12.101070404052734, "global_step": 330544, "epoch": 1967} {"train_loss": -11.8734712600708, "global_step": 330545, "epoch": 1967} {"train_loss": -11.702943801879883, "global_step": 330546, "epoch": 1967} {"train_loss": -12.205901145935059, "global_step": 330547, "epoch": 1967} {"train_loss": -11.496578216552734, "global_step": 330548, "epoch": 1967} {"train_loss": -11.941728591918945, "global_step": 330549, "epoch": 1967} {"train_loss": -11.801263809204102, "global_step": 330550, "epoch": 1967} {"train_loss": -12.060369491577148, "global_step": 330551, "epoch": 1967} {"train_loss": -11.886434555053711, "global_step": 330552, "epoch": 1967} {"train_loss": -11.69758415222168, "global_step": 330553, "epoch": 1967} {"train_loss": -12.061124801635742, "global_step": 330554, "epoch": 1967} {"train_loss": -11.992229461669922, "global_step": 330555, "epoch": 1967} {"train_loss": -12.186861038208008, "global_step": 330556, "epoch": 1967} {"train_loss": -11.982939720153809, "global_step": 330557, "epoch": 1967} {"train_loss": -12.152305603027344, "global_step": 330558, "epoch": 1967} {"train_loss": -12.085282325744629, "global_step": 330559, "epoch": 1967} {"train_loss": -12.17146110534668, "global_step": 330560, "epoch": 1967} {"train_loss": -12.099891662597656, "global_step": 330561, "epoch": 1967} {"train_loss": -12.328615188598633, "global_step": 330562, "epoch": 1967} {"train_loss": -11.993382453918457, "global_step": 330563, "epoch": 1967} {"train_loss": -12.316783905029297, "global_step": 330564, "epoch": 1967} {"train_loss": -12.25167465209961, "global_step": 330565, "epoch": 1967} {"train_loss": -12.19289779663086, "global_step": 330566, "epoch": 1967} {"train_loss": -12.154273986816406, "global_step": 330567, "epoch": 1967} {"train_loss": -12.099193572998047, "global_step": 330568, "epoch": 1967} {"train_loss": -12.28083324432373, "global_step": 330569, "epoch": 1967} {"train_loss": -12.083219528198242, "global_step": 330570, "epoch": 1967} {"train_loss": -12.530655860900879, "global_step": 330571, "epoch": 1967} {"train_loss": -12.147594451904297, "global_step": 330572, "epoch": 1967} {"train_loss": -12.272017478942871, "global_step": 330573, "epoch": 1967} {"train_loss": -12.324600219726562, "global_step": 330574, "epoch": 1967} {"train_loss": -12.072439193725586, "global_step": 330575, "epoch": 1967} {"train_loss": -12.343280792236328, "global_step": 330576, "epoch": 1967} {"train_loss": -12.301393508911133, "global_step": 330577, "epoch": 1967} {"train_loss": -12.260221481323242, "global_step": 330578, "epoch": 1967} {"train_loss": -11.74547004699707, "global_step": 330579, "epoch": 1967} {"train_loss": -12.262519836425781, "global_step": 330580, "epoch": 1967} {"train_loss": -12.372356414794922, "global_step": 330581, "epoch": 1967} {"train_loss": -12.445070266723633, "global_step": 330582, "epoch": 1967} {"train_loss": -12.461376190185547, "global_step": 330583, "epoch": 1967} {"train_loss": -12.380410194396973, "global_step": 330584, "epoch": 1967} {"train_loss": -12.50003433227539, "global_step": 330585, "epoch": 1967} {"train_loss": -12.286043167114258, "global_step": 330586, "epoch": 1967} {"train_loss": -12.554373741149902, "global_step": 330587, "epoch": 1967} {"train_loss": -12.432819366455078, "global_step": 330588, "epoch": 1967} {"train_loss": -12.533852577209473, "global_step": 330589, "epoch": 1967} {"train_loss": -12.589658737182617, "global_step": 330590, "epoch": 1967} {"train_loss": -12.708517074584961, "global_step": 330591, "epoch": 1967} {"train_loss": -12.417715072631836, "global_step": 330592, "epoch": 1967} {"train_loss": -12.645613670349121, "global_step": 330593, "epoch": 1967} {"train_loss": -12.465171813964844, "global_step": 330594, "epoch": 1967} {"train_loss": -12.824182510375977, "global_step": 330595, "epoch": 1967} {"train_loss": -12.428359985351562, "global_step": 330596, "epoch": 1967} {"train_loss": -12.677228927612305, "global_step": 330597, "epoch": 1967} {"train_loss": -12.638622283935547, "global_step": 330598, "epoch": 1967} {"train_loss": -12.601191520690918, "global_step": 330599, "epoch": 1967} {"train_loss": -12.49356460571289, "global_step": 330600, "epoch": 1967} {"train_loss": -12.539113998413086, "global_step": 330601, "epoch": 1967} {"train_loss": -12.47103214263916, "global_step": 330602, "epoch": 1967} {"train_loss": -12.380437850952148, "global_step": 330603, "epoch": 1967} {"train_loss": -12.632820129394531, "global_step": 330604, "epoch": 1967} {"train_loss": -12.711576461791992, "global_step": 330605, "epoch": 1967} {"train_loss": -12.551918029785156, "global_step": 330606, "epoch": 1967} {"train_loss": -12.54807186126709, "global_step": 330607, "epoch": 1967} {"train_loss": -12.539918899536133, "global_step": 330608, "epoch": 1967} {"train_loss": -12.568065643310547, "global_step": 330609, "epoch": 1967} {"train_loss": -12.627458572387695, "global_step": 330610, "epoch": 1967} {"train_loss": -12.11566162109375, "global_step": 330611, "epoch": 1967} {"train_loss": -12.584583282470703, "global_step": 330612, "epoch": 1967} {"train_loss": -12.462767601013184, "global_step": 330613, "epoch": 1967} {"train_loss": -12.278043746948242, "global_step": 330614, "epoch": 1967} {"train_loss": -12.402959823608398, "global_step": 330615, "epoch": 1967} {"train_loss": -12.161706924438477, "global_step": 330616, "epoch": 1967} {"train_loss": -12.548168182373047, "global_step": 330617, "epoch": 1967} {"train_loss": -12.70604133605957, "global_step": 330618, "epoch": 1967} {"train_loss": -12.029640197753906, "global_step": 330619, "epoch": 1967} {"train_loss": -12.427413940429688, "global_step": 330620, "epoch": 1967} {"train_loss": -12.073080062866211, "global_step": 330621, "epoch": 1967} {"train_loss": -12.414113998413086, "global_step": 330622, "epoch": 1967} {"train_loss": -11.810251604943048, "global_step": 330623, "epoch": 1967, "val_loss": 289008.15625} {"train_loss": -11.907377243041992, "global_step": 330624, "epoch": 1968} {"train_loss": -12.426033973693848, "global_step": 330625, "epoch": 1968} {"train_loss": -11.877363204956055, "global_step": 330626, "epoch": 1968} {"train_loss": -11.98090648651123, "global_step": 330627, "epoch": 1968} {"train_loss": -12.04434871673584, "global_step": 330628, "epoch": 1968} {"train_loss": -10.88907527923584, "global_step": 330629, "epoch": 1968} {"train_loss": -10.685811996459961, "global_step": 330630, "epoch": 1968} {"train_loss": -12.001810073852539, "global_step": 330631, "epoch": 1968} {"train_loss": -9.979761123657227, "global_step": 330632, "epoch": 1968} {"train_loss": -11.907201766967773, "global_step": 330633, "epoch": 1968} {"train_loss": -11.276586532592773, "global_step": 330634, "epoch": 1968} {"train_loss": -11.950448989868164, "global_step": 330635, "epoch": 1968} {"train_loss": -11.756450653076172, "global_step": 330636, "epoch": 1968} {"train_loss": -11.545751571655273, "global_step": 330637, "epoch": 1968} {"train_loss": -12.014745712280273, "global_step": 330638, "epoch": 1968} {"train_loss": -11.59726333618164, "global_step": 330639, "epoch": 1968} {"train_loss": -11.911067008972168, "global_step": 330640, "epoch": 1968} {"train_loss": -10.928542137145996, "global_step": 330641, "epoch": 1968} {"train_loss": -12.017426490783691, "global_step": 330642, "epoch": 1968} {"train_loss": -11.10745620727539, "global_step": 330643, "epoch": 1968} {"train_loss": -10.66307258605957, "global_step": 330644, "epoch": 1968} {"train_loss": -10.950310707092285, "global_step": 330645, "epoch": 1968} {"train_loss": -11.122547149658203, "global_step": 330646, "epoch": 1968} {"train_loss": -11.656152725219727, "global_step": 330647, "epoch": 1968} {"train_loss": -9.356246948242188, "global_step": 330648, "epoch": 1968} {"train_loss": -11.56987190246582, "global_step": 330649, "epoch": 1968} {"train_loss": -10.479158401489258, "global_step": 330650, "epoch": 1968} {"train_loss": -9.024877548217773, "global_step": 330651, "epoch": 1968} {"train_loss": -10.176130294799805, "global_step": 330652, "epoch": 1968} {"train_loss": -10.689833641052246, "global_step": 330653, "epoch": 1968} {"train_loss": -10.34293270111084, "global_step": 330654, "epoch": 1968} {"train_loss": -10.542648315429688, "global_step": 330655, "epoch": 1968} {"train_loss": -10.47579574584961, "global_step": 330656, "epoch": 1968} {"train_loss": -9.248451232910156, "global_step": 330657, "epoch": 1968} {"train_loss": -10.793266296386719, "global_step": 330658, "epoch": 1968} {"train_loss": -9.831148147583008, "global_step": 330659, "epoch": 1968} {"train_loss": -10.056861877441406, "global_step": 330660, "epoch": 1968} {"train_loss": -10.02098274230957, "global_step": 330661, "epoch": 1968} {"train_loss": -9.941842079162598, "global_step": 330662, "epoch": 1968} {"train_loss": -11.344825744628906, "global_step": 330663, "epoch": 1968} {"train_loss": -10.12093448638916, "global_step": 330664, "epoch": 1968} {"train_loss": -10.748018264770508, "global_step": 330665, "epoch": 1968} {"train_loss": -11.492283821105957, "global_step": 330666, "epoch": 1968} {"train_loss": -10.796072006225586, "global_step": 330667, "epoch": 1968} {"train_loss": -10.820382118225098, "global_step": 330668, "epoch": 1968} {"train_loss": -11.214773178100586, "global_step": 330669, "epoch": 1968} {"train_loss": -10.296921730041504, "global_step": 330670, "epoch": 1968} {"train_loss": -11.092893600463867, "global_step": 330671, "epoch": 1968} {"train_loss": -10.724180221557617, "global_step": 330672, "epoch": 1968} {"train_loss": -10.230693817138672, "global_step": 330673, "epoch": 1968} {"train_loss": -10.22213363647461, "global_step": 330674, "epoch": 1968} {"train_loss": -11.023305892944336, "global_step": 330675, "epoch": 1968} {"train_loss": -11.075258255004883, "global_step": 330676, "epoch": 1968} {"train_loss": -10.894460678100586, "global_step": 330677, "epoch": 1968} {"train_loss": -11.097429275512695, "global_step": 330678, "epoch": 1968} {"train_loss": -11.139120101928711, "global_step": 330679, "epoch": 1968} {"train_loss": -10.966255187988281, "global_step": 330680, "epoch": 1968} {"train_loss": -11.160604476928711, "global_step": 330681, "epoch": 1968} {"train_loss": -11.604236602783203, "global_step": 330682, "epoch": 1968} {"train_loss": -10.981664657592773, "global_step": 330683, "epoch": 1968} {"train_loss": -10.17807674407959, "global_step": 330684, "epoch": 1968} {"train_loss": -11.830497741699219, "global_step": 330685, "epoch": 1968} {"train_loss": -10.878717422485352, "global_step": 330686, "epoch": 1968} {"train_loss": -11.566559791564941, "global_step": 330687, "epoch": 1968} {"train_loss": -11.425711631774902, "global_step": 330688, "epoch": 1968} {"train_loss": -11.357057571411133, "global_step": 330689, "epoch": 1968} {"train_loss": -11.488725662231445, "global_step": 330690, "epoch": 1968} {"train_loss": -11.839134216308594, "global_step": 330691, "epoch": 1968} {"train_loss": -11.163646697998047, "global_step": 330692, "epoch": 1968} {"train_loss": -11.846280097961426, "global_step": 330693, "epoch": 1968} {"train_loss": -11.78436279296875, "global_step": 330694, "epoch": 1968} {"train_loss": -11.115795135498047, "global_step": 330695, "epoch": 1968} {"train_loss": -11.96157455444336, "global_step": 330696, "epoch": 1968} {"train_loss": -11.10838508605957, "global_step": 330697, "epoch": 1968} {"train_loss": -11.456071853637695, "global_step": 330698, "epoch": 1968} {"train_loss": -11.760330200195312, "global_step": 330699, "epoch": 1968} {"train_loss": -11.195158004760742, "global_step": 330700, "epoch": 1968} {"train_loss": -11.38743782043457, "global_step": 330701, "epoch": 1968} {"train_loss": -11.772765159606934, "global_step": 330702, "epoch": 1968} {"train_loss": -11.401235580444336, "global_step": 330703, "epoch": 1968} {"train_loss": -11.564678192138672, "global_step": 330704, "epoch": 1968} {"train_loss": -12.04090690612793, "global_step": 330705, "epoch": 1968} {"train_loss": -11.268836975097656, "global_step": 330706, "epoch": 1968} {"train_loss": -11.688323974609375, "global_step": 330707, "epoch": 1968} {"train_loss": -11.912300109863281, "global_step": 330708, "epoch": 1968} {"train_loss": -11.719511032104492, "global_step": 330709, "epoch": 1968} {"train_loss": -11.714241027832031, "global_step": 330710, "epoch": 1968} {"train_loss": -11.928449630737305, "global_step": 330711, "epoch": 1968} {"train_loss": -11.580184936523438, "global_step": 330712, "epoch": 1968} {"train_loss": -11.835531234741211, "global_step": 330713, "epoch": 1968} {"train_loss": -11.828957557678223, "global_step": 330714, "epoch": 1968} {"train_loss": -11.908472061157227, "global_step": 330715, "epoch": 1968} {"train_loss": -12.111982345581055, "global_step": 330716, "epoch": 1968} {"train_loss": -11.9923734664917, "global_step": 330717, "epoch": 1968} {"train_loss": -12.143835067749023, "global_step": 330718, "epoch": 1968} {"train_loss": -12.155745506286621, "global_step": 330719, "epoch": 1968} {"train_loss": -12.132506370544434, "global_step": 330720, "epoch": 1968} {"train_loss": -12.007112503051758, "global_step": 330721, "epoch": 1968} {"train_loss": -12.148443222045898, "global_step": 330722, "epoch": 1968} {"train_loss": -11.987771034240723, "global_step": 330723, "epoch": 1968} {"train_loss": -12.270320892333984, "global_step": 330724, "epoch": 1968} {"train_loss": -12.251670837402344, "global_step": 330725, "epoch": 1968} {"train_loss": -12.229442596435547, "global_step": 330726, "epoch": 1968} {"train_loss": -12.209402084350586, "global_step": 330727, "epoch": 1968} {"train_loss": -12.259468078613281, "global_step": 330728, "epoch": 1968} {"train_loss": -12.177712440490723, "global_step": 330729, "epoch": 1968} {"train_loss": -12.247518539428711, "global_step": 330730, "epoch": 1968} {"train_loss": -12.26348876953125, "global_step": 330731, "epoch": 1968} {"train_loss": -12.267000198364258, "global_step": 330732, "epoch": 1968} {"train_loss": -12.143688201904297, "global_step": 330733, "epoch": 1968} {"train_loss": -12.425582885742188, "global_step": 330734, "epoch": 1968} {"train_loss": -12.472843170166016, "global_step": 330735, "epoch": 1968} {"train_loss": -12.43407917022705, "global_step": 330736, "epoch": 1968} {"train_loss": -12.369148254394531, "global_step": 330737, "epoch": 1968} {"train_loss": -12.367395401000977, "global_step": 330738, "epoch": 1968} {"train_loss": -12.145020484924316, "global_step": 330739, "epoch": 1968} {"train_loss": -12.544636726379395, "global_step": 330740, "epoch": 1968} {"train_loss": -12.337545394897461, "global_step": 330741, "epoch": 1968} {"train_loss": -12.27127742767334, "global_step": 330742, "epoch": 1968} {"train_loss": -12.386348724365234, "global_step": 330743, "epoch": 1968} {"train_loss": -12.382084846496582, "global_step": 330744, "epoch": 1968} {"train_loss": -12.436666488647461, "global_step": 330745, "epoch": 1968} {"train_loss": -12.483356475830078, "global_step": 330746, "epoch": 1968} {"train_loss": -12.273029327392578, "global_step": 330747, "epoch": 1968} {"train_loss": -12.54228401184082, "global_step": 330748, "epoch": 1968} {"train_loss": -12.439990997314453, "global_step": 330749, "epoch": 1968} {"train_loss": -12.47352123260498, "global_step": 330750, "epoch": 1968} {"train_loss": -12.536565780639648, "global_step": 330751, "epoch": 1968} {"train_loss": -12.425897598266602, "global_step": 330752, "epoch": 1968} {"train_loss": -12.480947494506836, "global_step": 330753, "epoch": 1968} {"train_loss": -12.595564842224121, "global_step": 330754, "epoch": 1968} {"train_loss": -12.441492080688477, "global_step": 330755, "epoch": 1968} {"train_loss": -12.498369216918945, "global_step": 330756, "epoch": 1968} {"train_loss": -12.418766021728516, "global_step": 330757, "epoch": 1968} {"train_loss": -12.426913261413574, "global_step": 330758, "epoch": 1968} {"train_loss": -12.670787811279297, "global_step": 330759, "epoch": 1968} {"train_loss": -12.550640106201172, "global_step": 330760, "epoch": 1968} {"train_loss": -12.597999572753906, "global_step": 330761, "epoch": 1968} {"train_loss": -12.743764877319336, "global_step": 330762, "epoch": 1968} {"train_loss": -12.541446685791016, "global_step": 330763, "epoch": 1968} {"train_loss": -12.662422180175781, "global_step": 330764, "epoch": 1968} {"train_loss": -12.697701454162598, "global_step": 330765, "epoch": 1968} {"train_loss": -12.420158386230469, "global_step": 330766, "epoch": 1968} {"train_loss": -12.723073959350586, "global_step": 330767, "epoch": 1968} {"train_loss": -12.513875961303711, "global_step": 330768, "epoch": 1968} {"train_loss": -12.58547592163086, "global_step": 330769, "epoch": 1968} {"train_loss": -12.774243354797363, "global_step": 330770, "epoch": 1968} {"train_loss": -12.69100570678711, "global_step": 330771, "epoch": 1968} {"train_loss": -12.503974914550781, "global_step": 330772, "epoch": 1968} {"train_loss": -12.60464859008789, "global_step": 330773, "epoch": 1968} {"train_loss": -12.540264129638672, "global_step": 330774, "epoch": 1968} {"train_loss": -12.678173065185547, "global_step": 330775, "epoch": 1968} {"train_loss": -12.442791938781738, "global_step": 330776, "epoch": 1968} {"train_loss": -12.58636474609375, "global_step": 330777, "epoch": 1968} {"train_loss": -12.551225662231445, "global_step": 330778, "epoch": 1968} {"train_loss": -12.617801666259766, "global_step": 330779, "epoch": 1968} {"train_loss": -12.469817161560059, "global_step": 330780, "epoch": 1968} {"train_loss": -12.673625946044922, "global_step": 330781, "epoch": 1968} {"train_loss": -12.400070190429688, "global_step": 330782, "epoch": 1968} {"train_loss": -12.539066314697266, "global_step": 330783, "epoch": 1968} {"train_loss": -12.668355941772461, "global_step": 330784, "epoch": 1968} {"train_loss": -12.476631164550781, "global_step": 330785, "epoch": 1968} {"train_loss": -12.507827758789062, "global_step": 330786, "epoch": 1968} {"train_loss": -12.715290069580078, "global_step": 330787, "epoch": 1968} {"train_loss": -12.303443908691406, "global_step": 330788, "epoch": 1968} {"train_loss": -12.504444122314453, "global_step": 330789, "epoch": 1968} {"train_loss": -12.649299621582031, "global_step": 330790, "epoch": 1968} {"train_loss": -11.73939641884395, "global_step": 330791, "epoch": 1968, "val_loss": 286844.8125} {"train_loss": -12.439626693725586, "global_step": 330792, "epoch": 1969} {"train_loss": -12.695480346679688, "global_step": 330793, "epoch": 1969} {"train_loss": -12.29809284210205, "global_step": 330794, "epoch": 1969} {"train_loss": -12.443580627441406, "global_step": 330795, "epoch": 1969} {"train_loss": -12.552375793457031, "global_step": 330796, "epoch": 1969} {"train_loss": -12.356242179870605, "global_step": 330797, "epoch": 1969} {"train_loss": -12.134215354919434, "global_step": 330798, "epoch": 1969} {"train_loss": -11.890556335449219, "global_step": 330799, "epoch": 1969} {"train_loss": -12.659387588500977, "global_step": 330800, "epoch": 1969} {"train_loss": -12.531974792480469, "global_step": 330801, "epoch": 1969} {"train_loss": -12.18084716796875, "global_step": 330802, "epoch": 1969} {"train_loss": -12.035408973693848, "global_step": 330803, "epoch": 1969} {"train_loss": -12.540050506591797, "global_step": 330804, "epoch": 1969} {"train_loss": -12.457855224609375, "global_step": 330805, "epoch": 1969} {"train_loss": -12.681422233581543, "global_step": 330806, "epoch": 1969} {"train_loss": -12.023096084594727, "global_step": 330807, "epoch": 1969} {"train_loss": -12.020806312561035, "global_step": 330808, "epoch": 1969} {"train_loss": -11.929888725280762, "global_step": 330809, "epoch": 1969} {"train_loss": -12.072165489196777, "global_step": 330810, "epoch": 1969} {"train_loss": -12.215923309326172, "global_step": 330811, "epoch": 1969} {"train_loss": -12.171981811523438, "global_step": 330812, "epoch": 1969} {"train_loss": -11.641386985778809, "global_step": 330813, "epoch": 1969} {"train_loss": -12.209917068481445, "global_step": 330814, "epoch": 1969} {"train_loss": -12.120054244995117, "global_step": 330815, "epoch": 1969} {"train_loss": -12.310295104980469, "global_step": 330816, "epoch": 1969} {"train_loss": -12.127897262573242, "global_step": 330817, "epoch": 1969} {"train_loss": -12.08148193359375, "global_step": 330818, "epoch": 1969} {"train_loss": -12.207900047302246, "global_step": 330819, "epoch": 1969} {"train_loss": -12.593549728393555, "global_step": 330820, "epoch": 1969} {"train_loss": -12.00156307220459, "global_step": 330821, "epoch": 1969} {"train_loss": -12.381889343261719, "global_step": 330822, "epoch": 1969} {"train_loss": -12.301860809326172, "global_step": 330823, "epoch": 1969} {"train_loss": -11.431593894958496, "global_step": 330824, "epoch": 1969} {"train_loss": -11.039398193359375, "global_step": 330825, "epoch": 1969} {"train_loss": -12.368907928466797, "global_step": 330826, "epoch": 1969} {"train_loss": -11.728630065917969, "global_step": 330827, "epoch": 1969} {"train_loss": -10.999903678894043, "global_step": 330828, "epoch": 1969} {"train_loss": -11.768890380859375, "global_step": 330829, "epoch": 1969} {"train_loss": -11.937803268432617, "global_step": 330830, "epoch": 1969} {"train_loss": -11.404335975646973, "global_step": 330831, "epoch": 1969} {"train_loss": -12.00025749206543, "global_step": 330832, "epoch": 1969} {"train_loss": -11.886955261230469, "global_step": 330833, "epoch": 1969} {"train_loss": -11.507903099060059, "global_step": 330834, "epoch": 1969} {"train_loss": -12.218365669250488, "global_step": 330835, "epoch": 1969} {"train_loss": -10.748970031738281, "global_step": 330836, "epoch": 1969} {"train_loss": -10.646467208862305, "global_step": 330837, "epoch": 1969} {"train_loss": -10.5545654296875, "global_step": 330838, "epoch": 1969} {"train_loss": -12.124246597290039, "global_step": 330839, "epoch": 1969} {"train_loss": -11.1297607421875, "global_step": 330840, "epoch": 1969} {"train_loss": -11.90492057800293, "global_step": 330841, "epoch": 1969} {"train_loss": -10.387133598327637, "global_step": 330842, "epoch": 1969} {"train_loss": -10.75439453125, "global_step": 330843, "epoch": 1969} {"train_loss": -9.835761070251465, "global_step": 330844, "epoch": 1969} {"train_loss": -10.194955825805664, "global_step": 330845, "epoch": 1969} {"train_loss": -10.182573318481445, "global_step": 330846, "epoch": 1969} {"train_loss": -10.199254035949707, "global_step": 330847, "epoch": 1969} {"train_loss": -9.566387176513672, "global_step": 330848, "epoch": 1969} {"train_loss": -10.752286911010742, "global_step": 330849, "epoch": 1969} {"train_loss": -10.202343940734863, "global_step": 330850, "epoch": 1969} {"train_loss": -9.749969482421875, "global_step": 330851, "epoch": 1969} {"train_loss": -9.328516006469727, "global_step": 330852, "epoch": 1969} {"train_loss": -11.730316162109375, "global_step": 330853, "epoch": 1969} {"train_loss": -10.051152229309082, "global_step": 330854, "epoch": 1969} {"train_loss": -11.690433502197266, "global_step": 330855, "epoch": 1969} {"train_loss": -10.133068084716797, "global_step": 330856, "epoch": 1969} {"train_loss": -11.520896911621094, "global_step": 330857, "epoch": 1969} {"train_loss": -8.928539276123047, "global_step": 330858, "epoch": 1969} {"train_loss": -11.465387344360352, "global_step": 330859, "epoch": 1969} {"train_loss": -10.340082168579102, "global_step": 330860, "epoch": 1969} {"train_loss": -11.159967422485352, "global_step": 330861, "epoch": 1969} {"train_loss": -10.675259590148926, "global_step": 330862, "epoch": 1969} {"train_loss": -11.687313079833984, "global_step": 330863, "epoch": 1969} {"train_loss": -10.250397682189941, "global_step": 330864, "epoch": 1969} {"train_loss": -12.019977569580078, "global_step": 330865, "epoch": 1969} {"train_loss": -11.002421379089355, "global_step": 330866, "epoch": 1969} {"train_loss": -11.87118911743164, "global_step": 330867, "epoch": 1969} {"train_loss": -11.628020286560059, "global_step": 330868, "epoch": 1969} {"train_loss": -11.873184204101562, "global_step": 330869, "epoch": 1969} {"train_loss": -11.719602584838867, "global_step": 330870, "epoch": 1969} {"train_loss": -11.809167861938477, "global_step": 330871, "epoch": 1969} {"train_loss": -11.903544425964355, "global_step": 330872, "epoch": 1969} {"train_loss": -11.41690444946289, "global_step": 330873, "epoch": 1969} {"train_loss": -11.660085678100586, "global_step": 330874, "epoch": 1969} {"train_loss": -11.926057815551758, "global_step": 330875, "epoch": 1969} {"train_loss": -11.302186012268066, "global_step": 330876, "epoch": 1969} {"train_loss": -11.930310249328613, "global_step": 330877, "epoch": 1969} {"train_loss": -11.447681427001953, "global_step": 330878, "epoch": 1969} {"train_loss": -12.079689025878906, "global_step": 330879, "epoch": 1969} {"train_loss": -11.892023086547852, "global_step": 330880, "epoch": 1969} {"train_loss": -11.480493545532227, "global_step": 330881, "epoch": 1969} {"train_loss": -11.960562705993652, "global_step": 330882, "epoch": 1969} {"train_loss": -11.70614242553711, "global_step": 330883, "epoch": 1969} {"train_loss": -12.209500312805176, "global_step": 330884, "epoch": 1969} {"train_loss": -12.30431079864502, "global_step": 330885, "epoch": 1969} {"train_loss": -11.847110748291016, "global_step": 330886, "epoch": 1969} {"train_loss": -12.217154502868652, "global_step": 330887, "epoch": 1969} {"train_loss": -11.302818298339844, "global_step": 330888, "epoch": 1969} {"train_loss": -12.148038864135742, "global_step": 330889, "epoch": 1969} {"train_loss": -11.866598129272461, "global_step": 330890, "epoch": 1969} {"train_loss": -11.777565002441406, "global_step": 330891, "epoch": 1969} {"train_loss": -11.399957656860352, "global_step": 330892, "epoch": 1969} {"train_loss": -11.662041664123535, "global_step": 330893, "epoch": 1969} {"train_loss": -12.059285163879395, "global_step": 330894, "epoch": 1969} {"train_loss": -11.484919548034668, "global_step": 330895, "epoch": 1969} {"train_loss": -12.009065628051758, "global_step": 330896, "epoch": 1969} {"train_loss": -11.92817211151123, "global_step": 330897, "epoch": 1969} {"train_loss": -11.924383163452148, "global_step": 330898, "epoch": 1969} {"train_loss": -12.0503511428833, "global_step": 330899, "epoch": 1969} {"train_loss": -12.026911735534668, "global_step": 330900, "epoch": 1969} {"train_loss": -12.269966125488281, "global_step": 330901, "epoch": 1969} {"train_loss": -12.116630554199219, "global_step": 330902, "epoch": 1969} {"train_loss": -12.12106704711914, "global_step": 330903, "epoch": 1969} {"train_loss": -12.141818046569824, "global_step": 330904, "epoch": 1969} {"train_loss": -12.24502182006836, "global_step": 330905, "epoch": 1969} {"train_loss": -12.199932098388672, "global_step": 330906, "epoch": 1969} {"train_loss": -12.112445831298828, "global_step": 330907, "epoch": 1969} {"train_loss": -12.296769142150879, "global_step": 330908, "epoch": 1969} {"train_loss": -12.099920272827148, "global_step": 330909, "epoch": 1969} {"train_loss": -12.283498764038086, "global_step": 330910, "epoch": 1969} {"train_loss": -12.10054874420166, "global_step": 330911, "epoch": 1969} {"train_loss": -12.25228214263916, "global_step": 330912, "epoch": 1969} {"train_loss": -12.143026351928711, "global_step": 330913, "epoch": 1969} {"train_loss": -12.302066802978516, "global_step": 330914, "epoch": 1969} {"train_loss": -12.366065979003906, "global_step": 330915, "epoch": 1969} {"train_loss": -12.111357688903809, "global_step": 330916, "epoch": 1969} {"train_loss": -12.3049955368042, "global_step": 330917, "epoch": 1969} {"train_loss": -12.183022499084473, "global_step": 330918, "epoch": 1969} {"train_loss": -12.374744415283203, "global_step": 330919, "epoch": 1969} {"train_loss": -12.558235168457031, "global_step": 330920, "epoch": 1969} {"train_loss": -12.318475723266602, "global_step": 330921, "epoch": 1969} {"train_loss": -12.638047218322754, "global_step": 330922, "epoch": 1969} {"train_loss": -12.553077697753906, "global_step": 330923, "epoch": 1969} {"train_loss": -12.406980514526367, "global_step": 330924, "epoch": 1969} {"train_loss": -12.404683113098145, "global_step": 330925, "epoch": 1969} {"train_loss": -12.446218490600586, "global_step": 330926, "epoch": 1969} {"train_loss": -12.36745834350586, "global_step": 330927, "epoch": 1969} {"train_loss": -12.508899688720703, "global_step": 330928, "epoch": 1969} {"train_loss": -12.275467872619629, "global_step": 330929, "epoch": 1969} {"train_loss": -12.55146598815918, "global_step": 330930, "epoch": 1969} {"train_loss": -12.284215927124023, "global_step": 330931, "epoch": 1969} {"train_loss": -12.46619987487793, "global_step": 330932, "epoch": 1969} {"train_loss": -12.324529647827148, "global_step": 330933, "epoch": 1969} {"train_loss": -12.601665496826172, "global_step": 330934, "epoch": 1969} {"train_loss": -12.428567886352539, "global_step": 330935, "epoch": 1969} {"train_loss": -12.572311401367188, "global_step": 330936, "epoch": 1969} {"train_loss": -12.43967056274414, "global_step": 330937, "epoch": 1969} {"train_loss": -12.48306655883789, "global_step": 330938, "epoch": 1969} {"train_loss": -12.402769088745117, "global_step": 330939, "epoch": 1969} {"train_loss": -12.303812026977539, "global_step": 330940, "epoch": 1969} {"train_loss": -12.35539436340332, "global_step": 330941, "epoch": 1969} {"train_loss": -12.299572944641113, "global_step": 330942, "epoch": 1969} {"train_loss": -10.463868141174316, "global_step": 330943, "epoch": 1969} {"train_loss": -10.681854248046875, "global_step": 330944, "epoch": 1969} {"train_loss": -11.926481246948242, "global_step": 330945, "epoch": 1969} {"train_loss": -9.664416313171387, "global_step": 330946, "epoch": 1969} {"train_loss": -10.916297912597656, "global_step": 330947, "epoch": 1969} {"train_loss": -12.320590019226074, "global_step": 330948, "epoch": 1969} {"train_loss": -10.631539344787598, "global_step": 330949, "epoch": 1969} {"train_loss": -12.22614574432373, "global_step": 330950, "epoch": 1969} {"train_loss": -10.392423629760742, "global_step": 330951, "epoch": 1969} {"train_loss": -11.703868865966797, "global_step": 330952, "epoch": 1969} {"train_loss": -10.887171745300293, "global_step": 330953, "epoch": 1969} {"train_loss": -9.892251968383789, "global_step": 330954, "epoch": 1969} {"train_loss": -11.381431579589844, "global_step": 330955, "epoch": 1969} {"train_loss": -10.967517852783203, "global_step": 330956, "epoch": 1969} {"train_loss": -10.981739044189453, "global_step": 330957, "epoch": 1969} {"train_loss": -11.097870826721191, "global_step": 330958, "epoch": 1969} {"train_loss": -11.724382252920241, "global_step": 330959, "epoch": 1969, "val_loss": 288885.9375} {"train_loss": -11.56413459777832, "global_step": 330960, "epoch": 1970} {"train_loss": -11.419305801391602, "global_step": 330961, "epoch": 1970} {"train_loss": -11.176494598388672, "global_step": 330962, "epoch": 1970} {"train_loss": -11.86795425415039, "global_step": 330963, "epoch": 1970} {"train_loss": -11.858305931091309, "global_step": 330964, "epoch": 1970} {"train_loss": -11.431995391845703, "global_step": 330965, "epoch": 1970} {"train_loss": -11.450767517089844, "global_step": 330966, "epoch": 1970} {"train_loss": -11.53115463256836, "global_step": 330967, "epoch": 1970} {"train_loss": -11.867069244384766, "global_step": 330968, "epoch": 1970} {"train_loss": -12.096155166625977, "global_step": 330969, "epoch": 1970} {"train_loss": -11.672342300415039, "global_step": 330970, "epoch": 1970} {"train_loss": -11.99735164642334, "global_step": 330971, "epoch": 1970} {"train_loss": -12.000896453857422, "global_step": 330972, "epoch": 1970} {"train_loss": -12.127038955688477, "global_step": 330973, "epoch": 1970} {"train_loss": -12.144989013671875, "global_step": 330974, "epoch": 1970} {"train_loss": -11.910780906677246, "global_step": 330975, "epoch": 1970} {"train_loss": -12.145149230957031, "global_step": 330976, "epoch": 1970} {"train_loss": -12.179460525512695, "global_step": 330977, "epoch": 1970} {"train_loss": -12.107538223266602, "global_step": 330978, "epoch": 1970} {"train_loss": -11.823802947998047, "global_step": 330979, "epoch": 1970} {"train_loss": -12.270379066467285, "global_step": 330980, "epoch": 1970} {"train_loss": -12.203217506408691, "global_step": 330981, "epoch": 1970} {"train_loss": -12.12130355834961, "global_step": 330982, "epoch": 1970} {"train_loss": -12.41645622253418, "global_step": 330983, "epoch": 1970} {"train_loss": -11.956670761108398, "global_step": 330984, "epoch": 1970} {"train_loss": -12.044327735900879, "global_step": 330985, "epoch": 1970} {"train_loss": -12.036161422729492, "global_step": 330986, "epoch": 1970} {"train_loss": -12.38534927368164, "global_step": 330987, "epoch": 1970} {"train_loss": -12.167856216430664, "global_step": 330988, "epoch": 1970} {"train_loss": -12.089195251464844, "global_step": 330989, "epoch": 1970} {"train_loss": -12.033546447753906, "global_step": 330990, "epoch": 1970} {"train_loss": -12.04871940612793, "global_step": 330991, "epoch": 1970} {"train_loss": -12.218047142028809, "global_step": 330992, "epoch": 1970} {"train_loss": -12.073647499084473, "global_step": 330993, "epoch": 1970} {"train_loss": -12.387516021728516, "global_step": 330994, "epoch": 1970} {"train_loss": -11.985389709472656, "global_step": 330995, "epoch": 1970} {"train_loss": -12.425079345703125, "global_step": 330996, "epoch": 1970} {"train_loss": -12.057479858398438, "global_step": 330997, "epoch": 1970} {"train_loss": -12.145666122436523, "global_step": 330998, "epoch": 1970} {"train_loss": -12.157281875610352, "global_step": 330999, "epoch": 1970} {"train_loss": -12.396541595458984, "global_step": 331000, "epoch": 1970} {"train_loss": -12.088592529296875, "global_step": 331001, "epoch": 1970} {"train_loss": -12.198183059692383, "global_step": 331002, "epoch": 1970} {"train_loss": -12.362180709838867, "global_step": 331003, "epoch": 1970} {"train_loss": -12.135334968566895, "global_step": 331004, "epoch": 1970} {"train_loss": -12.449252128601074, "global_step": 331005, "epoch": 1970} {"train_loss": -12.153529167175293, "global_step": 331006, "epoch": 1970} {"train_loss": -12.251516342163086, "global_step": 331007, "epoch": 1970} {"train_loss": -11.997800827026367, "global_step": 331008, "epoch": 1970} {"train_loss": -12.421407699584961, "global_step": 331009, "epoch": 1970} {"train_loss": -12.383527755737305, "global_step": 331010, "epoch": 1970} {"train_loss": -12.423460006713867, "global_step": 331011, "epoch": 1970} {"train_loss": -12.471551895141602, "global_step": 331012, "epoch": 1970} {"train_loss": -12.591669082641602, "global_step": 331013, "epoch": 1970} {"train_loss": -12.258010864257812, "global_step": 331014, "epoch": 1970} {"train_loss": -12.510444641113281, "global_step": 331015, "epoch": 1970} {"train_loss": -12.704089164733887, "global_step": 331016, "epoch": 1970} {"train_loss": -12.582782745361328, "global_step": 331017, "epoch": 1970} {"train_loss": -12.669013977050781, "global_step": 331018, "epoch": 1970} {"train_loss": -12.494710922241211, "global_step": 331019, "epoch": 1970} {"train_loss": -12.511027336120605, "global_step": 331020, "epoch": 1970} {"train_loss": -12.521964073181152, "global_step": 331021, "epoch": 1970} {"train_loss": -12.63623332977295, "global_step": 331022, "epoch": 1970} {"train_loss": -12.488232612609863, "global_step": 331023, "epoch": 1970} {"train_loss": -12.529966354370117, "global_step": 331024, "epoch": 1970} {"train_loss": -12.301549911499023, "global_step": 331025, "epoch": 1970} {"train_loss": -12.5249662399292, "global_step": 331026, "epoch": 1970} {"train_loss": -12.616769790649414, "global_step": 331027, "epoch": 1970} {"train_loss": -12.276532173156738, "global_step": 331028, "epoch": 1970} {"train_loss": -12.284368515014648, "global_step": 331029, "epoch": 1970} {"train_loss": -12.467442512512207, "global_step": 331030, "epoch": 1970} {"train_loss": -12.16462516784668, "global_step": 331031, "epoch": 1970} {"train_loss": -11.717836380004883, "global_step": 331032, "epoch": 1970} {"train_loss": -12.247976303100586, "global_step": 331033, "epoch": 1970} {"train_loss": -12.010910034179688, "global_step": 331034, "epoch": 1970} {"train_loss": -12.497220039367676, "global_step": 331035, "epoch": 1970} {"train_loss": -11.988292694091797, "global_step": 331036, "epoch": 1970} {"train_loss": -12.1270112991333, "global_step": 331037, "epoch": 1970} {"train_loss": -12.348302841186523, "global_step": 331038, "epoch": 1970} {"train_loss": -12.1538667678833, "global_step": 331039, "epoch": 1970} {"train_loss": -12.198945999145508, "global_step": 331040, "epoch": 1970} {"train_loss": -12.297574043273926, "global_step": 331041, "epoch": 1970} {"train_loss": -12.34534740447998, "global_step": 331042, "epoch": 1970} {"train_loss": -12.303736686706543, "global_step": 331043, "epoch": 1970} {"train_loss": -12.43659496307373, "global_step": 331044, "epoch": 1970} {"train_loss": -12.220224380493164, "global_step": 331045, "epoch": 1970} {"train_loss": -12.528952598571777, "global_step": 331046, "epoch": 1970} {"train_loss": -12.172842979431152, "global_step": 331047, "epoch": 1970} {"train_loss": -12.220768928527832, "global_step": 331048, "epoch": 1970} {"train_loss": -12.464691162109375, "global_step": 331049, "epoch": 1970} {"train_loss": -12.653120994567871, "global_step": 331050, "epoch": 1970} {"train_loss": -12.413890838623047, "global_step": 331051, "epoch": 1970} {"train_loss": -12.43016242980957, "global_step": 331052, "epoch": 1970} {"train_loss": -12.615737915039062, "global_step": 331053, "epoch": 1970} {"train_loss": -12.21606159210205, "global_step": 331054, "epoch": 1970} {"train_loss": -11.450271606445312, "global_step": 331055, "epoch": 1970} {"train_loss": -12.128145217895508, "global_step": 331056, "epoch": 1970} {"train_loss": -11.815160751342773, "global_step": 331057, "epoch": 1970} {"train_loss": -11.967121124267578, "global_step": 331058, "epoch": 1970} {"train_loss": -12.229601860046387, "global_step": 331059, "epoch": 1970} {"train_loss": -12.292874336242676, "global_step": 331060, "epoch": 1970} {"train_loss": -12.12785530090332, "global_step": 331061, "epoch": 1970} {"train_loss": -11.783096313476562, "global_step": 331062, "epoch": 1970} {"train_loss": -11.72298812866211, "global_step": 331063, "epoch": 1970} {"train_loss": -11.833762168884277, "global_step": 331064, "epoch": 1970} {"train_loss": -12.202892303466797, "global_step": 331065, "epoch": 1970} {"train_loss": -11.960558891296387, "global_step": 331066, "epoch": 1970} {"train_loss": -11.963203430175781, "global_step": 331067, "epoch": 1970} {"train_loss": -12.101495742797852, "global_step": 331068, "epoch": 1970} {"train_loss": -12.296052932739258, "global_step": 331069, "epoch": 1970} {"train_loss": -12.137541770935059, "global_step": 331070, "epoch": 1970} {"train_loss": -11.58191204071045, "global_step": 331071, "epoch": 1970} {"train_loss": -12.081989288330078, "global_step": 331072, "epoch": 1970} {"train_loss": -12.537532806396484, "global_step": 331073, "epoch": 1970} {"train_loss": -11.515134811401367, "global_step": 331074, "epoch": 1970} {"train_loss": -11.984711647033691, "global_step": 331075, "epoch": 1970} {"train_loss": -11.714117050170898, "global_step": 331076, "epoch": 1970} {"train_loss": -12.50507926940918, "global_step": 331077, "epoch": 1970} {"train_loss": -11.748577117919922, "global_step": 331078, "epoch": 1970} {"train_loss": -11.13467788696289, "global_step": 331079, "epoch": 1970} {"train_loss": -11.87315845489502, "global_step": 331080, "epoch": 1970} {"train_loss": -11.36384391784668, "global_step": 331081, "epoch": 1970} {"train_loss": -11.157468795776367, "global_step": 331082, "epoch": 1970} {"train_loss": -11.828994750976562, "global_step": 331083, "epoch": 1970} {"train_loss": -11.085128784179688, "global_step": 331084, "epoch": 1970} {"train_loss": -10.80875301361084, "global_step": 331085, "epoch": 1970} {"train_loss": -11.652471542358398, "global_step": 331086, "epoch": 1970} {"train_loss": -10.282670974731445, "global_step": 331087, "epoch": 1970} {"train_loss": -10.910248756408691, "global_step": 331088, "epoch": 1970} {"train_loss": -10.929122924804688, "global_step": 331089, "epoch": 1970} {"train_loss": -7.245875358581543, "global_step": 331090, "epoch": 1970} {"train_loss": -8.2965087890625, "global_step": 331091, "epoch": 1970} {"train_loss": -7.720401287078857, "global_step": 331092, "epoch": 1970} {"train_loss": -6.873006820678711, "global_step": 331093, "epoch": 1970} {"train_loss": -8.455583572387695, "global_step": 331094, "epoch": 1970} {"train_loss": -9.004707336425781, "global_step": 331095, "epoch": 1970} {"train_loss": -9.126653671264648, "global_step": 331096, "epoch": 1970} {"train_loss": -9.173306465148926, "global_step": 331097, "epoch": 1970} {"train_loss": -9.057334899902344, "global_step": 331098, "epoch": 1970} {"train_loss": -9.33732795715332, "global_step": 331099, "epoch": 1970} {"train_loss": -9.948503494262695, "global_step": 331100, "epoch": 1970} {"train_loss": -10.374491691589355, "global_step": 331101, "epoch": 1970} {"train_loss": -9.865372657775879, "global_step": 331102, "epoch": 1970} {"train_loss": -10.017023086547852, "global_step": 331103, "epoch": 1970} {"train_loss": -10.258745193481445, "global_step": 331104, "epoch": 1970} {"train_loss": -10.246465682983398, "global_step": 331105, "epoch": 1970} {"train_loss": -10.331243515014648, "global_step": 331106, "epoch": 1970} {"train_loss": -10.38399887084961, "global_step": 331107, "epoch": 1970} {"train_loss": -11.184877395629883, "global_step": 331108, "epoch": 1970} {"train_loss": -10.242504119873047, "global_step": 331109, "epoch": 1970} {"train_loss": -11.214536666870117, "global_step": 331110, "epoch": 1970} {"train_loss": -10.814434051513672, "global_step": 331111, "epoch": 1970} {"train_loss": -10.685983657836914, "global_step": 331112, "epoch": 1970} {"train_loss": -10.953763961791992, "global_step": 331113, "epoch": 1970} {"train_loss": -10.809015274047852, "global_step": 331114, "epoch": 1970} {"train_loss": -10.786345481872559, "global_step": 331115, "epoch": 1970} {"train_loss": -11.514062881469727, "global_step": 331116, "epoch": 1970} {"train_loss": -11.44184684753418, "global_step": 331117, "epoch": 1970} {"train_loss": -11.210234642028809, "global_step": 331118, "epoch": 1970} {"train_loss": -11.690673828125, "global_step": 331119, "epoch": 1970} {"train_loss": -11.427773475646973, "global_step": 331120, "epoch": 1970} {"train_loss": -11.518863677978516, "global_step": 331121, "epoch": 1970} {"train_loss": -12.017810821533203, "global_step": 331122, "epoch": 1970} {"train_loss": -11.42490005493164, "global_step": 331123, "epoch": 1970} {"train_loss": -11.837318420410156, "global_step": 331124, "epoch": 1970} {"train_loss": -11.718171119689941, "global_step": 331125, "epoch": 1970} {"train_loss": -11.816377639770508, "global_step": 331126, "epoch": 1970} {"train_loss": -11.67823037363234, "global_step": 331127, "epoch": 1970, "val_loss": 286495.53125, "train_action_mse_error": 0.4793027341365814} {"train_loss": -11.760229110717773, "global_step": 331128, "epoch": 1971} {"train_loss": -11.884187698364258, "global_step": 331129, "epoch": 1971} {"train_loss": -11.939395904541016, "global_step": 331130, "epoch": 1971} {"train_loss": -11.62491226196289, "global_step": 331131, "epoch": 1971} {"train_loss": -12.013110160827637, "global_step": 331132, "epoch": 1971} {"train_loss": -11.69369888305664, "global_step": 331133, "epoch": 1971} {"train_loss": -11.972990036010742, "global_step": 331134, "epoch": 1971} {"train_loss": -12.179499626159668, "global_step": 331135, "epoch": 1971} {"train_loss": -11.961023330688477, "global_step": 331136, "epoch": 1971} {"train_loss": -12.012136459350586, "global_step": 331137, "epoch": 1971} {"train_loss": -11.96662712097168, "global_step": 331138, "epoch": 1971} {"train_loss": -12.157804489135742, "global_step": 331139, "epoch": 1971} {"train_loss": -12.11214542388916, "global_step": 331140, "epoch": 1971} {"train_loss": -11.976491928100586, "global_step": 331141, "epoch": 1971} {"train_loss": -12.198262214660645, "global_step": 331142, "epoch": 1971} {"train_loss": -12.205060958862305, "global_step": 331143, "epoch": 1971} {"train_loss": -12.305517196655273, "global_step": 331144, "epoch": 1971} {"train_loss": -12.051290512084961, "global_step": 331145, "epoch": 1971} {"train_loss": -12.343279838562012, "global_step": 331146, "epoch": 1971} {"train_loss": -12.147035598754883, "global_step": 331147, "epoch": 1971} {"train_loss": -12.081201553344727, "global_step": 331148, "epoch": 1971} {"train_loss": -12.259740829467773, "global_step": 331149, "epoch": 1971} {"train_loss": -12.191205978393555, "global_step": 331150, "epoch": 1971} {"train_loss": -12.050008773803711, "global_step": 331151, "epoch": 1971} {"train_loss": -12.226728439331055, "global_step": 331152, "epoch": 1971} {"train_loss": -12.216312408447266, "global_step": 331153, "epoch": 1971} {"train_loss": -12.092832565307617, "global_step": 331154, "epoch": 1971} {"train_loss": -12.206622123718262, "global_step": 331155, "epoch": 1971} {"train_loss": -12.397960662841797, "global_step": 331156, "epoch": 1971} {"train_loss": -12.170896530151367, "global_step": 331157, "epoch": 1971} {"train_loss": -12.277740478515625, "global_step": 331158, "epoch": 1971} {"train_loss": -12.4426851272583, "global_step": 331159, "epoch": 1971} {"train_loss": -12.172969818115234, "global_step": 331160, "epoch": 1971} {"train_loss": -12.512653350830078, "global_step": 331161, "epoch": 1971} {"train_loss": -12.278120994567871, "global_step": 331162, "epoch": 1971} {"train_loss": -12.152022361755371, "global_step": 331163, "epoch": 1971} {"train_loss": -12.339595794677734, "global_step": 331164, "epoch": 1971} {"train_loss": -12.457633972167969, "global_step": 331165, "epoch": 1971} {"train_loss": -12.357406616210938, "global_step": 331166, "epoch": 1971} {"train_loss": -12.458035469055176, "global_step": 331167, "epoch": 1971} {"train_loss": -12.466571807861328, "global_step": 331168, "epoch": 1971} {"train_loss": -12.380499839782715, "global_step": 331169, "epoch": 1971} {"train_loss": -12.280014991760254, "global_step": 331170, "epoch": 1971} {"train_loss": -12.45946979522705, "global_step": 331171, "epoch": 1971} {"train_loss": -12.23308277130127, "global_step": 331172, "epoch": 1971} {"train_loss": -12.480491638183594, "global_step": 331173, "epoch": 1971} {"train_loss": -12.412008285522461, "global_step": 331174, "epoch": 1971} {"train_loss": -12.486608505249023, "global_step": 331175, "epoch": 1971} {"train_loss": -12.57274055480957, "global_step": 331176, "epoch": 1971} {"train_loss": -12.336496353149414, "global_step": 331177, "epoch": 1971} {"train_loss": -12.51915168762207, "global_step": 331178, "epoch": 1971} {"train_loss": -12.373199462890625, "global_step": 331179, "epoch": 1971} {"train_loss": -12.65106201171875, "global_step": 331180, "epoch": 1971} {"train_loss": -12.337013244628906, "global_step": 331181, "epoch": 1971} {"train_loss": -12.052970886230469, "global_step": 331182, "epoch": 1971} {"train_loss": -12.336681365966797, "global_step": 331183, "epoch": 1971} {"train_loss": -12.51730728149414, "global_step": 331184, "epoch": 1971} {"train_loss": -12.287575721740723, "global_step": 331185, "epoch": 1971} {"train_loss": -12.459156036376953, "global_step": 331186, "epoch": 1971} {"train_loss": -12.232261657714844, "global_step": 331187, "epoch": 1971} {"train_loss": -12.519681930541992, "global_step": 331188, "epoch": 1971} {"train_loss": -12.337793350219727, "global_step": 331189, "epoch": 1971} {"train_loss": -12.330937385559082, "global_step": 331190, "epoch": 1971} {"train_loss": -12.494359970092773, "global_step": 331191, "epoch": 1971} {"train_loss": -12.409524917602539, "global_step": 331192, "epoch": 1971} {"train_loss": -12.634873390197754, "global_step": 331193, "epoch": 1971} {"train_loss": -12.312165260314941, "global_step": 331194, "epoch": 1971} {"train_loss": -12.453817367553711, "global_step": 331195, "epoch": 1971} {"train_loss": -12.293325424194336, "global_step": 331196, "epoch": 1971} {"train_loss": -12.576820373535156, "global_step": 331197, "epoch": 1971} {"train_loss": -12.111129760742188, "global_step": 331198, "epoch": 1971} {"train_loss": -12.101678848266602, "global_step": 331199, "epoch": 1971} {"train_loss": -12.010688781738281, "global_step": 331200, "epoch": 1971} {"train_loss": -12.471261978149414, "global_step": 331201, "epoch": 1971} {"train_loss": -12.110772132873535, "global_step": 331202, "epoch": 1971} {"train_loss": -11.980045318603516, "global_step": 331203, "epoch": 1971} {"train_loss": -12.249205589294434, "global_step": 331204, "epoch": 1971} {"train_loss": -12.04435920715332, "global_step": 331205, "epoch": 1971} {"train_loss": -11.452964782714844, "global_step": 331206, "epoch": 1971} {"train_loss": -11.854193687438965, "global_step": 331207, "epoch": 1971} {"train_loss": -12.32304573059082, "global_step": 331208, "epoch": 1971} {"train_loss": -11.272613525390625, "global_step": 331209, "epoch": 1971} {"train_loss": -11.99209976196289, "global_step": 331210, "epoch": 1971} {"train_loss": -12.188934326171875, "global_step": 331211, "epoch": 1971} {"train_loss": -11.784017562866211, "global_step": 331212, "epoch": 1971} {"train_loss": -11.89934253692627, "global_step": 331213, "epoch": 1971} {"train_loss": -12.064924240112305, "global_step": 331214, "epoch": 1971} {"train_loss": -11.898774147033691, "global_step": 331215, "epoch": 1971} {"train_loss": -11.951053619384766, "global_step": 331216, "epoch": 1971} {"train_loss": -12.146757125854492, "global_step": 331217, "epoch": 1971} {"train_loss": -11.553388595581055, "global_step": 331218, "epoch": 1971} {"train_loss": -11.885889053344727, "global_step": 331219, "epoch": 1971} {"train_loss": -11.854820251464844, "global_step": 331220, "epoch": 1971} {"train_loss": -11.045727729797363, "global_step": 331221, "epoch": 1971} {"train_loss": -12.01052188873291, "global_step": 331222, "epoch": 1971} {"train_loss": -11.920758247375488, "global_step": 331223, "epoch": 1971} {"train_loss": -12.156339645385742, "global_step": 331224, "epoch": 1971} {"train_loss": -11.99085807800293, "global_step": 331225, "epoch": 1971} {"train_loss": -11.864984512329102, "global_step": 331226, "epoch": 1971} {"train_loss": -11.754594802856445, "global_step": 331227, "epoch": 1971} {"train_loss": -12.110685348510742, "global_step": 331228, "epoch": 1971} {"train_loss": -12.310302734375, "global_step": 331229, "epoch": 1971} {"train_loss": -11.828683853149414, "global_step": 331230, "epoch": 1971} {"train_loss": -12.227684020996094, "global_step": 331231, "epoch": 1971} {"train_loss": -12.09512996673584, "global_step": 331232, "epoch": 1971} {"train_loss": -11.436214447021484, "global_step": 331233, "epoch": 1971} {"train_loss": -12.123804092407227, "global_step": 331234, "epoch": 1971} {"train_loss": -11.071054458618164, "global_step": 331235, "epoch": 1971} {"train_loss": -12.499313354492188, "global_step": 331236, "epoch": 1971} {"train_loss": -11.494110107421875, "global_step": 331237, "epoch": 1971} {"train_loss": -12.368363380432129, "global_step": 331238, "epoch": 1971} {"train_loss": -11.505376815795898, "global_step": 331239, "epoch": 1971} {"train_loss": -12.38122272491455, "global_step": 331240, "epoch": 1971} {"train_loss": -11.553471565246582, "global_step": 331241, "epoch": 1971} {"train_loss": -12.084766387939453, "global_step": 331242, "epoch": 1971} {"train_loss": -11.665236473083496, "global_step": 331243, "epoch": 1971} {"train_loss": -11.914961814880371, "global_step": 331244, "epoch": 1971} {"train_loss": -11.751883506774902, "global_step": 331245, "epoch": 1971} {"train_loss": -11.727133750915527, "global_step": 331246, "epoch": 1971} {"train_loss": -11.716381072998047, "global_step": 331247, "epoch": 1971} {"train_loss": -11.590851783752441, "global_step": 331248, "epoch": 1971} {"train_loss": -11.307485580444336, "global_step": 331249, "epoch": 1971} {"train_loss": -11.766987800598145, "global_step": 331250, "epoch": 1971} {"train_loss": -11.60601806640625, "global_step": 331251, "epoch": 1971} {"train_loss": -11.551517486572266, "global_step": 331252, "epoch": 1971} {"train_loss": -12.025360107421875, "global_step": 331253, "epoch": 1971} {"train_loss": -11.838598251342773, "global_step": 331254, "epoch": 1971} {"train_loss": -11.340632438659668, "global_step": 331255, "epoch": 1971} {"train_loss": -12.195652961730957, "global_step": 331256, "epoch": 1971} {"train_loss": -11.81991958618164, "global_step": 331257, "epoch": 1971} {"train_loss": -12.382678985595703, "global_step": 331258, "epoch": 1971} {"train_loss": -11.964344024658203, "global_step": 331259, "epoch": 1971} {"train_loss": -12.244914054870605, "global_step": 331260, "epoch": 1971} {"train_loss": -12.353394508361816, "global_step": 331261, "epoch": 1971} {"train_loss": -12.125747680664062, "global_step": 331262, "epoch": 1971} {"train_loss": -12.40863037109375, "global_step": 331263, "epoch": 1971} {"train_loss": -12.290094375610352, "global_step": 331264, "epoch": 1971} {"train_loss": -12.451362609863281, "global_step": 331265, "epoch": 1971} {"train_loss": -12.174559593200684, "global_step": 331266, "epoch": 1971} {"train_loss": -12.239916801452637, "global_step": 331267, "epoch": 1971} {"train_loss": -12.276159286499023, "global_step": 331268, "epoch": 1971} {"train_loss": -12.207292556762695, "global_step": 331269, "epoch": 1971} {"train_loss": -12.320056915283203, "global_step": 331270, "epoch": 1971} {"train_loss": -12.112960815429688, "global_step": 331271, "epoch": 1971} {"train_loss": -11.909456253051758, "global_step": 331272, "epoch": 1971} {"train_loss": -11.80244255065918, "global_step": 331273, "epoch": 1971} {"train_loss": -12.396493911743164, "global_step": 331274, "epoch": 1971} {"train_loss": -12.33098030090332, "global_step": 331275, "epoch": 1971} {"train_loss": -12.150652885437012, "global_step": 331276, "epoch": 1971} {"train_loss": -12.129627227783203, "global_step": 331277, "epoch": 1971} {"train_loss": -11.994586944580078, "global_step": 331278, "epoch": 1971} {"train_loss": -12.436963081359863, "global_step": 331279, "epoch": 1971} {"train_loss": -11.985450744628906, "global_step": 331280, "epoch": 1971} {"train_loss": -12.063583374023438, "global_step": 331281, "epoch": 1971} {"train_loss": -12.309799194335938, "global_step": 331282, "epoch": 1971} {"train_loss": -12.02170181274414, "global_step": 331283, "epoch": 1971} {"train_loss": -12.008552551269531, "global_step": 331284, "epoch": 1971} {"train_loss": -12.114299774169922, "global_step": 331285, "epoch": 1971} {"train_loss": -11.777843475341797, "global_step": 331286, "epoch": 1971} {"train_loss": -11.666973114013672, "global_step": 331287, "epoch": 1971} {"train_loss": -11.579168319702148, "global_step": 331288, "epoch": 1971} {"train_loss": -12.036966323852539, "global_step": 331289, "epoch": 1971} {"train_loss": -11.994937896728516, "global_step": 331290, "epoch": 1971} {"train_loss": -12.28394889831543, "global_step": 331291, "epoch": 1971} {"train_loss": -12.157462120056152, "global_step": 331292, "epoch": 1971} {"train_loss": -12.158116340637207, "global_step": 331293, "epoch": 1971} {"train_loss": -11.924707412719727, "global_step": 331294, "epoch": 1971} {"train_loss": -12.093334288824172, "global_step": 331295, "epoch": 1971, "val_loss": 288058.1875} {"train_loss": -12.116846084594727, "global_step": 331296, "epoch": 1972} {"train_loss": -12.008002281188965, "global_step": 331297, "epoch": 1972} {"train_loss": -11.990418434143066, "global_step": 331298, "epoch": 1972} {"train_loss": -12.362384796142578, "global_step": 331299, "epoch": 1972} {"train_loss": -12.112964630126953, "global_step": 331300, "epoch": 1972} {"train_loss": -12.455148696899414, "global_step": 331301, "epoch": 1972} {"train_loss": -11.963021278381348, "global_step": 331302, "epoch": 1972} {"train_loss": -12.437662124633789, "global_step": 331303, "epoch": 1972} {"train_loss": -12.266454696655273, "global_step": 331304, "epoch": 1972} {"train_loss": -12.377553939819336, "global_step": 331305, "epoch": 1972} {"train_loss": -12.410538673400879, "global_step": 331306, "epoch": 1972} {"train_loss": -12.565558433532715, "global_step": 331307, "epoch": 1972} {"train_loss": -12.192778587341309, "global_step": 331308, "epoch": 1972} {"train_loss": -12.300171852111816, "global_step": 331309, "epoch": 1972} {"train_loss": -12.330055236816406, "global_step": 331310, "epoch": 1972} {"train_loss": -12.408589363098145, "global_step": 331311, "epoch": 1972} {"train_loss": -12.712403297424316, "global_step": 331312, "epoch": 1972} {"train_loss": -12.088581085205078, "global_step": 331313, "epoch": 1972} {"train_loss": -12.002721786499023, "global_step": 331314, "epoch": 1972} {"train_loss": -11.596808433532715, "global_step": 331315, "epoch": 1972} {"train_loss": -11.938247680664062, "global_step": 331316, "epoch": 1972} {"train_loss": -11.928349494934082, "global_step": 331317, "epoch": 1972} {"train_loss": -10.831711769104004, "global_step": 331318, "epoch": 1972} {"train_loss": -10.91381549835205, "global_step": 331319, "epoch": 1972} {"train_loss": -10.13432788848877, "global_step": 331320, "epoch": 1972} {"train_loss": -11.806230545043945, "global_step": 331321, "epoch": 1972} {"train_loss": -10.679008483886719, "global_step": 331322, "epoch": 1972} {"train_loss": -10.108236312866211, "global_step": 331323, "epoch": 1972} {"train_loss": -11.043880462646484, "global_step": 331324, "epoch": 1972} {"train_loss": -11.61790943145752, "global_step": 331325, "epoch": 1972} {"train_loss": -10.71619987487793, "global_step": 331326, "epoch": 1972} {"train_loss": -11.408905029296875, "global_step": 331327, "epoch": 1972} {"train_loss": -11.313543319702148, "global_step": 331328, "epoch": 1972} {"train_loss": -11.796268463134766, "global_step": 331329, "epoch": 1972} {"train_loss": -11.170945167541504, "global_step": 331330, "epoch": 1972} {"train_loss": -11.519765853881836, "global_step": 331331, "epoch": 1972} {"train_loss": -11.889677047729492, "global_step": 331332, "epoch": 1972} {"train_loss": -11.769216537475586, "global_step": 331333, "epoch": 1972} {"train_loss": -11.62315559387207, "global_step": 331334, "epoch": 1972} {"train_loss": -12.298307418823242, "global_step": 331335, "epoch": 1972} {"train_loss": -11.784225463867188, "global_step": 331336, "epoch": 1972} {"train_loss": -11.843843460083008, "global_step": 331337, "epoch": 1972} {"train_loss": -12.026192665100098, "global_step": 331338, "epoch": 1972} {"train_loss": -11.844883918762207, "global_step": 331339, "epoch": 1972} {"train_loss": -11.886711120605469, "global_step": 331340, "epoch": 1972} {"train_loss": -12.149826049804688, "global_step": 331341, "epoch": 1972} {"train_loss": -12.166120529174805, "global_step": 331342, "epoch": 1972} {"train_loss": -11.974388122558594, "global_step": 331343, "epoch": 1972} {"train_loss": -12.132745742797852, "global_step": 331344, "epoch": 1972} {"train_loss": -12.185616493225098, "global_step": 331345, "epoch": 1972} {"train_loss": -12.051916122436523, "global_step": 331346, "epoch": 1972} {"train_loss": -12.116519927978516, "global_step": 331347, "epoch": 1972} {"train_loss": -12.282469749450684, "global_step": 331348, "epoch": 1972} {"train_loss": -12.375423431396484, "global_step": 331349, "epoch": 1972} {"train_loss": -12.377378463745117, "global_step": 331350, "epoch": 1972} {"train_loss": -12.149064064025879, "global_step": 331351, "epoch": 1972} {"train_loss": -12.333232879638672, "global_step": 331352, "epoch": 1972} {"train_loss": -12.345320701599121, "global_step": 331353, "epoch": 1972} {"train_loss": -12.424480438232422, "global_step": 331354, "epoch": 1972} {"train_loss": -12.40707778930664, "global_step": 331355, "epoch": 1972} {"train_loss": -12.390340805053711, "global_step": 331356, "epoch": 1972} {"train_loss": -12.318269729614258, "global_step": 331357, "epoch": 1972} {"train_loss": -12.42074203491211, "global_step": 331358, "epoch": 1972} {"train_loss": -12.407794952392578, "global_step": 331359, "epoch": 1972} {"train_loss": -12.094951629638672, "global_step": 331360, "epoch": 1972} {"train_loss": -12.536027908325195, "global_step": 331361, "epoch": 1972} {"train_loss": -12.337414741516113, "global_step": 331362, "epoch": 1972} {"train_loss": -12.118486404418945, "global_step": 331363, "epoch": 1972} {"train_loss": -12.234847068786621, "global_step": 331364, "epoch": 1972} {"train_loss": -12.364370346069336, "global_step": 331365, "epoch": 1972} {"train_loss": -12.278421401977539, "global_step": 331366, "epoch": 1972} {"train_loss": -12.322449684143066, "global_step": 331367, "epoch": 1972} {"train_loss": -12.47816276550293, "global_step": 331368, "epoch": 1972} {"train_loss": -12.3104248046875, "global_step": 331369, "epoch": 1972} {"train_loss": -12.381352424621582, "global_step": 331370, "epoch": 1972} {"train_loss": -12.150152206420898, "global_step": 331371, "epoch": 1972} {"train_loss": -12.410408020019531, "global_step": 331372, "epoch": 1972} {"train_loss": -12.07248306274414, "global_step": 331373, "epoch": 1972} {"train_loss": -12.589618682861328, "global_step": 331374, "epoch": 1972} {"train_loss": -12.178474426269531, "global_step": 331375, "epoch": 1972} {"train_loss": -12.228527069091797, "global_step": 331376, "epoch": 1972} {"train_loss": -12.196518898010254, "global_step": 331377, "epoch": 1972} {"train_loss": -12.302974700927734, "global_step": 331378, "epoch": 1972} {"train_loss": -12.112727165222168, "global_step": 331379, "epoch": 1972} {"train_loss": -12.045058250427246, "global_step": 331380, "epoch": 1972} {"train_loss": -11.848245620727539, "global_step": 331381, "epoch": 1972} {"train_loss": -12.396893501281738, "global_step": 331382, "epoch": 1972} {"train_loss": -11.899113655090332, "global_step": 331383, "epoch": 1972} {"train_loss": -11.325895309448242, "global_step": 331384, "epoch": 1972} {"train_loss": -11.87814712524414, "global_step": 331385, "epoch": 1972} {"train_loss": -12.234772682189941, "global_step": 331386, "epoch": 1972} {"train_loss": -12.440406799316406, "global_step": 331387, "epoch": 1972} {"train_loss": -12.41331672668457, "global_step": 331388, "epoch": 1972} {"train_loss": -12.321372032165527, "global_step": 331389, "epoch": 1972} {"train_loss": -11.839546203613281, "global_step": 331390, "epoch": 1972} {"train_loss": -12.549884796142578, "global_step": 331391, "epoch": 1972} {"train_loss": -12.107433319091797, "global_step": 331392, "epoch": 1972} {"train_loss": -11.889894485473633, "global_step": 331393, "epoch": 1972} {"train_loss": -10.958806991577148, "global_step": 331394, "epoch": 1972} {"train_loss": -12.348918914794922, "global_step": 331395, "epoch": 1972} {"train_loss": -11.845867156982422, "global_step": 331396, "epoch": 1972} {"train_loss": -11.453389167785645, "global_step": 331397, "epoch": 1972} {"train_loss": -11.983902931213379, "global_step": 331398, "epoch": 1972} {"train_loss": -11.844483375549316, "global_step": 331399, "epoch": 1972} {"train_loss": -11.183109283447266, "global_step": 331400, "epoch": 1972} {"train_loss": -11.706162452697754, "global_step": 331401, "epoch": 1972} {"train_loss": -10.749391555786133, "global_step": 331402, "epoch": 1972} {"train_loss": -11.379829406738281, "global_step": 331403, "epoch": 1972} {"train_loss": -12.375079154968262, "global_step": 331404, "epoch": 1972} {"train_loss": -11.637351036071777, "global_step": 331405, "epoch": 1972} {"train_loss": -11.633825302124023, "global_step": 331406, "epoch": 1972} {"train_loss": -12.083595275878906, "global_step": 331407, "epoch": 1972} {"train_loss": -11.880941390991211, "global_step": 331408, "epoch": 1972} {"train_loss": -12.016397476196289, "global_step": 331409, "epoch": 1972} {"train_loss": -11.74676513671875, "global_step": 331410, "epoch": 1972} {"train_loss": -12.240287780761719, "global_step": 331411, "epoch": 1972} {"train_loss": -12.154973030090332, "global_step": 331412, "epoch": 1972} {"train_loss": -11.902247428894043, "global_step": 331413, "epoch": 1972} {"train_loss": -12.330650329589844, "global_step": 331414, "epoch": 1972} {"train_loss": -12.115745544433594, "global_step": 331415, "epoch": 1972} {"train_loss": -12.043697357177734, "global_step": 331416, "epoch": 1972} {"train_loss": -12.38817024230957, "global_step": 331417, "epoch": 1972} {"train_loss": -12.250995635986328, "global_step": 331418, "epoch": 1972} {"train_loss": -12.236030578613281, "global_step": 331419, "epoch": 1972} {"train_loss": -12.09241771697998, "global_step": 331420, "epoch": 1972} {"train_loss": -12.313457489013672, "global_step": 331421, "epoch": 1972} {"train_loss": -11.462640762329102, "global_step": 331422, "epoch": 1972} {"train_loss": -11.826654434204102, "global_step": 331423, "epoch": 1972} {"train_loss": -11.898199081420898, "global_step": 331424, "epoch": 1972} {"train_loss": -11.795431137084961, "global_step": 331425, "epoch": 1972} {"train_loss": -11.712251663208008, "global_step": 331426, "epoch": 1972} {"train_loss": -11.843433380126953, "global_step": 331427, "epoch": 1972} {"train_loss": -11.503143310546875, "global_step": 331428, "epoch": 1972} {"train_loss": -12.28634262084961, "global_step": 331429, "epoch": 1972} {"train_loss": -11.855049133300781, "global_step": 331430, "epoch": 1972} {"train_loss": -12.380084991455078, "global_step": 331431, "epoch": 1972} {"train_loss": -11.856233596801758, "global_step": 331432, "epoch": 1972} {"train_loss": -11.96107292175293, "global_step": 331433, "epoch": 1972} {"train_loss": -12.132741928100586, "global_step": 331434, "epoch": 1972} {"train_loss": -12.105433464050293, "global_step": 331435, "epoch": 1972} {"train_loss": -12.194588661193848, "global_step": 331436, "epoch": 1972} {"train_loss": -12.310016632080078, "global_step": 331437, "epoch": 1972} {"train_loss": -12.344892501831055, "global_step": 331438, "epoch": 1972} {"train_loss": -12.402864456176758, "global_step": 331439, "epoch": 1972} {"train_loss": -12.315332412719727, "global_step": 331440, "epoch": 1972} {"train_loss": -12.375181198120117, "global_step": 331441, "epoch": 1972} {"train_loss": -12.2846097946167, "global_step": 331442, "epoch": 1972} {"train_loss": -12.501394271850586, "global_step": 331443, "epoch": 1972} {"train_loss": -12.42609977722168, "global_step": 331444, "epoch": 1972} {"train_loss": -12.424561500549316, "global_step": 331445, "epoch": 1972} {"train_loss": -12.452302932739258, "global_step": 331446, "epoch": 1972} {"train_loss": -12.338369369506836, "global_step": 331447, "epoch": 1972} {"train_loss": -12.453967094421387, "global_step": 331448, "epoch": 1972} {"train_loss": -12.376459121704102, "global_step": 331449, "epoch": 1972} {"train_loss": -12.489255905151367, "global_step": 331450, "epoch": 1972} {"train_loss": -12.63575553894043, "global_step": 331451, "epoch": 1972} {"train_loss": -12.548601150512695, "global_step": 331452, "epoch": 1972} {"train_loss": -12.654149055480957, "global_step": 331453, "epoch": 1972} {"train_loss": -12.273548126220703, "global_step": 331454, "epoch": 1972} {"train_loss": -12.358589172363281, "global_step": 331455, "epoch": 1972} {"train_loss": -12.651172637939453, "global_step": 331456, "epoch": 1972} {"train_loss": -12.394556045532227, "global_step": 331457, "epoch": 1972} {"train_loss": -12.243751525878906, "global_step": 331458, "epoch": 1972} {"train_loss": -12.25999641418457, "global_step": 331459, "epoch": 1972} {"train_loss": -12.378250122070312, "global_step": 331460, "epoch": 1972} {"train_loss": -12.508268356323242, "global_step": 331461, "epoch": 1972} {"train_loss": -12.497422218322754, "global_step": 331462, "epoch": 1972} {"train_loss": -12.056300089472817, "global_step": 331463, "epoch": 1972, "val_loss": 285980.46875} {"train_loss": -12.520511627197266, "global_step": 331464, "epoch": 1973} {"train_loss": -11.986602783203125, "global_step": 331465, "epoch": 1973} {"train_loss": -12.287629127502441, "global_step": 331466, "epoch": 1973} {"train_loss": -12.319692611694336, "global_step": 331467, "epoch": 1973} {"train_loss": -12.51324462890625, "global_step": 331468, "epoch": 1973} {"train_loss": -11.99509048461914, "global_step": 331469, "epoch": 1973} {"train_loss": -11.794261932373047, "global_step": 331470, "epoch": 1973} {"train_loss": -11.901344299316406, "global_step": 331471, "epoch": 1973} {"train_loss": -11.742737770080566, "global_step": 331472, "epoch": 1973} {"train_loss": -11.775101661682129, "global_step": 331473, "epoch": 1973} {"train_loss": -10.859098434448242, "global_step": 331474, "epoch": 1973} {"train_loss": -11.837016105651855, "global_step": 331475, "epoch": 1973} {"train_loss": -11.700122833251953, "global_step": 331476, "epoch": 1973} {"train_loss": -11.503206253051758, "global_step": 331477, "epoch": 1973} {"train_loss": -12.137439727783203, "global_step": 331478, "epoch": 1973} {"train_loss": -11.825064659118652, "global_step": 331479, "epoch": 1973} {"train_loss": -11.74051284790039, "global_step": 331480, "epoch": 1973} {"train_loss": -11.836614608764648, "global_step": 331481, "epoch": 1973} {"train_loss": -11.741357803344727, "global_step": 331482, "epoch": 1973} {"train_loss": -12.316259384155273, "global_step": 331483, "epoch": 1973} {"train_loss": -11.316908836364746, "global_step": 331484, "epoch": 1973} {"train_loss": -12.310953140258789, "global_step": 331485, "epoch": 1973} {"train_loss": -11.995035171508789, "global_step": 331486, "epoch": 1973} {"train_loss": -10.864599227905273, "global_step": 331487, "epoch": 1973} {"train_loss": -10.60291576385498, "global_step": 331488, "epoch": 1973} {"train_loss": -11.283445358276367, "global_step": 331489, "epoch": 1973} {"train_loss": -11.497926712036133, "global_step": 331490, "epoch": 1973} {"train_loss": -10.426976203918457, "global_step": 331491, "epoch": 1973} {"train_loss": -11.838851928710938, "global_step": 331492, "epoch": 1973} {"train_loss": -11.667787551879883, "global_step": 331493, "epoch": 1973} {"train_loss": -11.052995681762695, "global_step": 331494, "epoch": 1973} {"train_loss": -10.448020935058594, "global_step": 331495, "epoch": 1973} {"train_loss": -11.529272079467773, "global_step": 331496, "epoch": 1973} {"train_loss": -9.956502914428711, "global_step": 331497, "epoch": 1973} {"train_loss": -11.353938102722168, "global_step": 331498, "epoch": 1973} {"train_loss": -9.87635612487793, "global_step": 331499, "epoch": 1973} {"train_loss": -10.005308151245117, "global_step": 331500, "epoch": 1973} {"train_loss": -12.178638458251953, "global_step": 331501, "epoch": 1973} {"train_loss": -10.119451522827148, "global_step": 331502, "epoch": 1973} {"train_loss": -11.418149948120117, "global_step": 331503, "epoch": 1973} {"train_loss": -11.129020690917969, "global_step": 331504, "epoch": 1973} {"train_loss": -10.967916488647461, "global_step": 331505, "epoch": 1973} {"train_loss": -10.968147277832031, "global_step": 331506, "epoch": 1973} {"train_loss": -10.651005744934082, "global_step": 331507, "epoch": 1973} {"train_loss": -11.619345664978027, "global_step": 331508, "epoch": 1973} {"train_loss": -11.40966796875, "global_step": 331509, "epoch": 1973} {"train_loss": -11.464700698852539, "global_step": 331510, "epoch": 1973} {"train_loss": -11.663023948669434, "global_step": 331511, "epoch": 1973} {"train_loss": -11.706103324890137, "global_step": 331512, "epoch": 1973} {"train_loss": -11.844282150268555, "global_step": 331513, "epoch": 1973} {"train_loss": -11.860937118530273, "global_step": 331514, "epoch": 1973} {"train_loss": -11.826946258544922, "global_step": 331515, "epoch": 1973} {"train_loss": -11.927789688110352, "global_step": 331516, "epoch": 1973} {"train_loss": -12.036701202392578, "global_step": 331517, "epoch": 1973} {"train_loss": -12.055851936340332, "global_step": 331518, "epoch": 1973} {"train_loss": -11.847021102905273, "global_step": 331519, "epoch": 1973} {"train_loss": -12.27708911895752, "global_step": 331520, "epoch": 1973} {"train_loss": -11.971296310424805, "global_step": 331521, "epoch": 1973} {"train_loss": -11.985441207885742, "global_step": 331522, "epoch": 1973} {"train_loss": -12.02104377746582, "global_step": 331523, "epoch": 1973} {"train_loss": -12.192328453063965, "global_step": 331524, "epoch": 1973} {"train_loss": -12.34979248046875, "global_step": 331525, "epoch": 1973} {"train_loss": -11.923442840576172, "global_step": 331526, "epoch": 1973} {"train_loss": -12.041339874267578, "global_step": 331527, "epoch": 1973} {"train_loss": -12.068166732788086, "global_step": 331528, "epoch": 1973} {"train_loss": -11.856000900268555, "global_step": 331529, "epoch": 1973} {"train_loss": -12.19670295715332, "global_step": 331530, "epoch": 1973} {"train_loss": -12.166933059692383, "global_step": 331531, "epoch": 1973} {"train_loss": -12.235603332519531, "global_step": 331532, "epoch": 1973} {"train_loss": -11.883277893066406, "global_step": 331533, "epoch": 1973} {"train_loss": -12.132598876953125, "global_step": 331534, "epoch": 1973} {"train_loss": -12.070526123046875, "global_step": 331535, "epoch": 1973} {"train_loss": -12.331683158874512, "global_step": 331536, "epoch": 1973} {"train_loss": -12.00621223449707, "global_step": 331537, "epoch": 1973} {"train_loss": -11.94491958618164, "global_step": 331538, "epoch": 1973} {"train_loss": -11.622435569763184, "global_step": 331539, "epoch": 1973} {"train_loss": -12.009617805480957, "global_step": 331540, "epoch": 1973} {"train_loss": -12.123233795166016, "global_step": 331541, "epoch": 1973} {"train_loss": -12.200098991394043, "global_step": 331542, "epoch": 1973} {"train_loss": -11.957898139953613, "global_step": 331543, "epoch": 1973} {"train_loss": -11.642252922058105, "global_step": 331544, "epoch": 1973} {"train_loss": -12.220793724060059, "global_step": 331545, "epoch": 1973} {"train_loss": -12.034814834594727, "global_step": 331546, "epoch": 1973} {"train_loss": -11.997495651245117, "global_step": 331547, "epoch": 1973} {"train_loss": -11.975618362426758, "global_step": 331548, "epoch": 1973} {"train_loss": -12.457805633544922, "global_step": 331549, "epoch": 1973} {"train_loss": -12.354303359985352, "global_step": 331550, "epoch": 1973} {"train_loss": -12.132073402404785, "global_step": 331551, "epoch": 1973} {"train_loss": -12.500511169433594, "global_step": 331552, "epoch": 1973} {"train_loss": -12.339402198791504, "global_step": 331553, "epoch": 1973} {"train_loss": -12.335043907165527, "global_step": 331554, "epoch": 1973} {"train_loss": -12.318347930908203, "global_step": 331555, "epoch": 1973} {"train_loss": -12.366747856140137, "global_step": 331556, "epoch": 1973} {"train_loss": -12.390647888183594, "global_step": 331557, "epoch": 1973} {"train_loss": -12.33173942565918, "global_step": 331558, "epoch": 1973} {"train_loss": -12.410567283630371, "global_step": 331559, "epoch": 1973} {"train_loss": -12.457395553588867, "global_step": 331560, "epoch": 1973} {"train_loss": -12.629624366760254, "global_step": 331561, "epoch": 1973} {"train_loss": -11.708417892456055, "global_step": 331562, "epoch": 1973} {"train_loss": -12.39089584350586, "global_step": 331563, "epoch": 1973} {"train_loss": -12.237237930297852, "global_step": 331564, "epoch": 1973} {"train_loss": -11.749824523925781, "global_step": 331565, "epoch": 1973} {"train_loss": -12.516138076782227, "global_step": 331566, "epoch": 1973} {"train_loss": -12.27188491821289, "global_step": 331567, "epoch": 1973} {"train_loss": -12.236783981323242, "global_step": 331568, "epoch": 1973} {"train_loss": -12.470001220703125, "global_step": 331569, "epoch": 1973} {"train_loss": -12.290369033813477, "global_step": 331570, "epoch": 1973} {"train_loss": -12.387263298034668, "global_step": 331571, "epoch": 1973} {"train_loss": -12.568901062011719, "global_step": 331572, "epoch": 1973} {"train_loss": -12.524513244628906, "global_step": 331573, "epoch": 1973} {"train_loss": -12.31629753112793, "global_step": 331574, "epoch": 1973} {"train_loss": -12.35548210144043, "global_step": 331575, "epoch": 1973} {"train_loss": -12.173933029174805, "global_step": 331576, "epoch": 1973} {"train_loss": -11.85641860961914, "global_step": 331577, "epoch": 1973} {"train_loss": -12.600446701049805, "global_step": 331578, "epoch": 1973} {"train_loss": -12.208680152893066, "global_step": 331579, "epoch": 1973} {"train_loss": -12.192028999328613, "global_step": 331580, "epoch": 1973} {"train_loss": -11.46515941619873, "global_step": 331581, "epoch": 1973} {"train_loss": -12.019352912902832, "global_step": 331582, "epoch": 1973} {"train_loss": -11.843820571899414, "global_step": 331583, "epoch": 1973} {"train_loss": -12.727508544921875, "global_step": 331584, "epoch": 1973} {"train_loss": -12.052648544311523, "global_step": 331585, "epoch": 1973} {"train_loss": -11.802203178405762, "global_step": 331586, "epoch": 1973} {"train_loss": -11.920062065124512, "global_step": 331587, "epoch": 1973} {"train_loss": -12.31325626373291, "global_step": 331588, "epoch": 1973} {"train_loss": -12.366659164428711, "global_step": 331589, "epoch": 1973} {"train_loss": -12.180913925170898, "global_step": 331590, "epoch": 1973} {"train_loss": -12.16842269897461, "global_step": 331591, "epoch": 1973} {"train_loss": -12.554876327514648, "global_step": 331592, "epoch": 1973} {"train_loss": -12.427013397216797, "global_step": 331593, "epoch": 1973} {"train_loss": -11.677011489868164, "global_step": 331594, "epoch": 1973} {"train_loss": -12.418756484985352, "global_step": 331595, "epoch": 1973} {"train_loss": -12.080267906188965, "global_step": 331596, "epoch": 1973} {"train_loss": -11.94079875946045, "global_step": 331597, "epoch": 1973} {"train_loss": -11.379670143127441, "global_step": 331598, "epoch": 1973} {"train_loss": -11.619902610778809, "global_step": 331599, "epoch": 1973} {"train_loss": -11.973825454711914, "global_step": 331600, "epoch": 1973} {"train_loss": -12.360176086425781, "global_step": 331601, "epoch": 1973} {"train_loss": -12.13702392578125, "global_step": 331602, "epoch": 1973} {"train_loss": -12.009195327758789, "global_step": 331603, "epoch": 1973} {"train_loss": -12.341720581054688, "global_step": 331604, "epoch": 1973} {"train_loss": -12.019774436950684, "global_step": 331605, "epoch": 1973} {"train_loss": -11.497143745422363, "global_step": 331606, "epoch": 1973} {"train_loss": -11.946049690246582, "global_step": 331607, "epoch": 1973} {"train_loss": -11.832134246826172, "global_step": 331608, "epoch": 1973} {"train_loss": -11.563695907592773, "global_step": 331609, "epoch": 1973} {"train_loss": -11.958829879760742, "global_step": 331610, "epoch": 1973} {"train_loss": -12.128425598144531, "global_step": 331611, "epoch": 1973} {"train_loss": -11.686567306518555, "global_step": 331612, "epoch": 1973} {"train_loss": -11.558685302734375, "global_step": 331613, "epoch": 1973} {"train_loss": -12.328097343444824, "global_step": 331614, "epoch": 1973} {"train_loss": -11.396642684936523, "global_step": 331615, "epoch": 1973} {"train_loss": -10.378460884094238, "global_step": 331616, "epoch": 1973} {"train_loss": -11.963102340698242, "global_step": 331617, "epoch": 1973} {"train_loss": -9.576136589050293, "global_step": 331618, "epoch": 1973} {"train_loss": -11.36567497253418, "global_step": 331619, "epoch": 1973} {"train_loss": -9.637675285339355, "global_step": 331620, "epoch": 1973} {"train_loss": -9.227250099182129, "global_step": 331621, "epoch": 1973} {"train_loss": -8.29397964477539, "global_step": 331622, "epoch": 1973} {"train_loss": -10.2022066116333, "global_step": 331623, "epoch": 1973} {"train_loss": -10.07835578918457, "global_step": 331624, "epoch": 1973} {"train_loss": -10.843534469604492, "global_step": 331625, "epoch": 1973} {"train_loss": -8.958759307861328, "global_step": 331626, "epoch": 1973} {"train_loss": -11.541765213012695, "global_step": 331627, "epoch": 1973} {"train_loss": -8.770166397094727, "global_step": 331628, "epoch": 1973} {"train_loss": -10.095935821533203, "global_step": 331629, "epoch": 1973} {"train_loss": -10.256722450256348, "global_step": 331630, "epoch": 1973} {"train_loss": -11.725274460656303, "global_step": 331631, "epoch": 1973, "val_loss": 282788.90625} {"train_loss": -8.99639892578125, "global_step": 331632, "epoch": 1974} {"train_loss": -11.272275924682617, "global_step": 331633, "epoch": 1974} {"train_loss": -8.992949485778809, "global_step": 331634, "epoch": 1974} {"train_loss": -9.696072578430176, "global_step": 331635, "epoch": 1974} {"train_loss": -11.222043991088867, "global_step": 331636, "epoch": 1974} {"train_loss": -11.114840507507324, "global_step": 331637, "epoch": 1974} {"train_loss": -11.0016508102417, "global_step": 331638, "epoch": 1974} {"train_loss": -11.206077575683594, "global_step": 331639, "epoch": 1974} {"train_loss": -11.125540733337402, "global_step": 331640, "epoch": 1974} {"train_loss": -11.335929870605469, "global_step": 331641, "epoch": 1974} {"train_loss": -11.642258644104004, "global_step": 331642, "epoch": 1974} {"train_loss": -11.491020202636719, "global_step": 331643, "epoch": 1974} {"train_loss": -11.624343872070312, "global_step": 331644, "epoch": 1974} {"train_loss": -11.577325820922852, "global_step": 331645, "epoch": 1974} {"train_loss": -11.622982025146484, "global_step": 331646, "epoch": 1974} {"train_loss": -12.004762649536133, "global_step": 331647, "epoch": 1974} {"train_loss": -12.025402069091797, "global_step": 331648, "epoch": 1974} {"train_loss": -12.085868835449219, "global_step": 331649, "epoch": 1974} {"train_loss": -11.679988861083984, "global_step": 331650, "epoch": 1974} {"train_loss": -11.877635955810547, "global_step": 331651, "epoch": 1974} {"train_loss": -11.964957237243652, "global_step": 331652, "epoch": 1974} {"train_loss": -11.815973281860352, "global_step": 331653, "epoch": 1974} {"train_loss": -12.142935752868652, "global_step": 331654, "epoch": 1974} {"train_loss": -11.800081253051758, "global_step": 331655, "epoch": 1974} {"train_loss": -11.873916625976562, "global_step": 331656, "epoch": 1974} {"train_loss": -12.235978126525879, "global_step": 331657, "epoch": 1974} {"train_loss": -11.980270385742188, "global_step": 331658, "epoch": 1974} {"train_loss": -12.00027084350586, "global_step": 331659, "epoch": 1974} {"train_loss": -11.961458206176758, "global_step": 331660, "epoch": 1974} {"train_loss": -12.063760757446289, "global_step": 331661, "epoch": 1974} {"train_loss": -12.406728744506836, "global_step": 331662, "epoch": 1974} {"train_loss": -12.069574356079102, "global_step": 331663, "epoch": 1974} {"train_loss": -12.423057556152344, "global_step": 331664, "epoch": 1974} {"train_loss": -12.118696212768555, "global_step": 331665, "epoch": 1974} {"train_loss": -12.2509765625, "global_step": 331666, "epoch": 1974} {"train_loss": -11.928072929382324, "global_step": 331667, "epoch": 1974} {"train_loss": -12.185148239135742, "global_step": 331668, "epoch": 1974} {"train_loss": -12.198681831359863, "global_step": 331669, "epoch": 1974} {"train_loss": -12.119588851928711, "global_step": 331670, "epoch": 1974} {"train_loss": -12.296690940856934, "global_step": 331671, "epoch": 1974} {"train_loss": -12.125022888183594, "global_step": 331672, "epoch": 1974} {"train_loss": -12.371357917785645, "global_step": 331673, "epoch": 1974} {"train_loss": -12.339071273803711, "global_step": 331674, "epoch": 1974} {"train_loss": -12.389312744140625, "global_step": 331675, "epoch": 1974} {"train_loss": -12.387897491455078, "global_step": 331676, "epoch": 1974} {"train_loss": -12.162879943847656, "global_step": 331677, "epoch": 1974} {"train_loss": -12.33559799194336, "global_step": 331678, "epoch": 1974} {"train_loss": -11.890588760375977, "global_step": 331679, "epoch": 1974} {"train_loss": -12.19709587097168, "global_step": 331680, "epoch": 1974} {"train_loss": -12.213264465332031, "global_step": 331681, "epoch": 1974} {"train_loss": -11.97911548614502, "global_step": 331682, "epoch": 1974} {"train_loss": -12.309743881225586, "global_step": 331683, "epoch": 1974} {"train_loss": -12.383219718933105, "global_step": 331684, "epoch": 1974} {"train_loss": -12.34253215789795, "global_step": 331685, "epoch": 1974} {"train_loss": -12.382572174072266, "global_step": 331686, "epoch": 1974} {"train_loss": -12.446023941040039, "global_step": 331687, "epoch": 1974} {"train_loss": -12.314862251281738, "global_step": 331688, "epoch": 1974} {"train_loss": -12.489590644836426, "global_step": 331689, "epoch": 1974} {"train_loss": -12.275714874267578, "global_step": 331690, "epoch": 1974} {"train_loss": -12.296123504638672, "global_step": 331691, "epoch": 1974} {"train_loss": -12.353386878967285, "global_step": 331692, "epoch": 1974} {"train_loss": -12.615331649780273, "global_step": 331693, "epoch": 1974} {"train_loss": -12.388120651245117, "global_step": 331694, "epoch": 1974} {"train_loss": -12.35963249206543, "global_step": 331695, "epoch": 1974} {"train_loss": -12.417949676513672, "global_step": 331696, "epoch": 1974} {"train_loss": -12.396125793457031, "global_step": 331697, "epoch": 1974} {"train_loss": -12.52537727355957, "global_step": 331698, "epoch": 1974} {"train_loss": -12.482868194580078, "global_step": 331699, "epoch": 1974} {"train_loss": -12.534490585327148, "global_step": 331700, "epoch": 1974} {"train_loss": -12.645544052124023, "global_step": 331701, "epoch": 1974} {"train_loss": -12.741117477416992, "global_step": 331702, "epoch": 1974} {"train_loss": -12.559022903442383, "global_step": 331703, "epoch": 1974} {"train_loss": -12.472667694091797, "global_step": 331704, "epoch": 1974} {"train_loss": -12.464449882507324, "global_step": 331705, "epoch": 1974} {"train_loss": -12.654884338378906, "global_step": 331706, "epoch": 1974} {"train_loss": -12.309464454650879, "global_step": 331707, "epoch": 1974} {"train_loss": -12.423399925231934, "global_step": 331708, "epoch": 1974} {"train_loss": -12.474401473999023, "global_step": 331709, "epoch": 1974} {"train_loss": -12.503928184509277, "global_step": 331710, "epoch": 1974} {"train_loss": -12.432672500610352, "global_step": 331711, "epoch": 1974} {"train_loss": -12.568131446838379, "global_step": 331712, "epoch": 1974} {"train_loss": -12.207846641540527, "global_step": 331713, "epoch": 1974} {"train_loss": -12.45709228515625, "global_step": 331714, "epoch": 1974} {"train_loss": -12.469345092773438, "global_step": 331715, "epoch": 1974} {"train_loss": -12.658272743225098, "global_step": 331716, "epoch": 1974} {"train_loss": -12.584321975708008, "global_step": 331717, "epoch": 1974} {"train_loss": -12.319221496582031, "global_step": 331718, "epoch": 1974} {"train_loss": -12.647404670715332, "global_step": 331719, "epoch": 1974} {"train_loss": -12.181312561035156, "global_step": 331720, "epoch": 1974} {"train_loss": -12.53322982788086, "global_step": 331721, "epoch": 1974} {"train_loss": -12.665000915527344, "global_step": 331722, "epoch": 1974} {"train_loss": -12.544212341308594, "global_step": 331723, "epoch": 1974} {"train_loss": -12.61069107055664, "global_step": 331724, "epoch": 1974} {"train_loss": -12.543659210205078, "global_step": 331725, "epoch": 1974} {"train_loss": -12.453763961791992, "global_step": 331726, "epoch": 1974} {"train_loss": -12.845245361328125, "global_step": 331727, "epoch": 1974} {"train_loss": -12.752750396728516, "global_step": 331728, "epoch": 1974} {"train_loss": -12.547371864318848, "global_step": 331729, "epoch": 1974} {"train_loss": -12.693069458007812, "global_step": 331730, "epoch": 1974} {"train_loss": -12.388001441955566, "global_step": 331731, "epoch": 1974} {"train_loss": -12.518362045288086, "global_step": 331732, "epoch": 1974} {"train_loss": -12.462604522705078, "global_step": 331733, "epoch": 1974} {"train_loss": -12.203564643859863, "global_step": 331734, "epoch": 1974} {"train_loss": -12.457256317138672, "global_step": 331735, "epoch": 1974} {"train_loss": -12.658235549926758, "global_step": 331736, "epoch": 1974} {"train_loss": -12.577573776245117, "global_step": 331737, "epoch": 1974} {"train_loss": -11.835622787475586, "global_step": 331738, "epoch": 1974} {"train_loss": -12.22767448425293, "global_step": 331739, "epoch": 1974} {"train_loss": -11.68704605102539, "global_step": 331740, "epoch": 1974} {"train_loss": -12.368707656860352, "global_step": 331741, "epoch": 1974} {"train_loss": -11.431427001953125, "global_step": 331742, "epoch": 1974} {"train_loss": -12.262382507324219, "global_step": 331743, "epoch": 1974} {"train_loss": -11.052776336669922, "global_step": 331744, "epoch": 1974} {"train_loss": -10.854061126708984, "global_step": 331745, "epoch": 1974} {"train_loss": -11.525497436523438, "global_step": 331746, "epoch": 1974} {"train_loss": -11.49169921875, "global_step": 331747, "epoch": 1974} {"train_loss": -11.208394050598145, "global_step": 331748, "epoch": 1974} {"train_loss": -11.153268814086914, "global_step": 331749, "epoch": 1974} {"train_loss": -11.747713088989258, "global_step": 331750, "epoch": 1974} {"train_loss": -11.065637588500977, "global_step": 331751, "epoch": 1974} {"train_loss": -12.276712417602539, "global_step": 331752, "epoch": 1974} {"train_loss": -10.756143569946289, "global_step": 331753, "epoch": 1974} {"train_loss": -11.470987319946289, "global_step": 331754, "epoch": 1974} {"train_loss": -11.30533218383789, "global_step": 331755, "epoch": 1974} {"train_loss": -11.672102928161621, "global_step": 331756, "epoch": 1974} {"train_loss": -12.098481178283691, "global_step": 331757, "epoch": 1974} {"train_loss": -12.206592559814453, "global_step": 331758, "epoch": 1974} {"train_loss": -11.646690368652344, "global_step": 331759, "epoch": 1974} {"train_loss": -12.062440872192383, "global_step": 331760, "epoch": 1974} {"train_loss": -11.849028587341309, "global_step": 331761, "epoch": 1974} {"train_loss": -10.321855545043945, "global_step": 331762, "epoch": 1974} {"train_loss": -10.026800155639648, "global_step": 331763, "epoch": 1974} {"train_loss": -9.951333999633789, "global_step": 331764, "epoch": 1974} {"train_loss": -8.405595779418945, "global_step": 331765, "epoch": 1974} {"train_loss": -7.144986152648926, "global_step": 331766, "epoch": 1974} {"train_loss": -9.342842102050781, "global_step": 331767, "epoch": 1974} {"train_loss": -9.390990257263184, "global_step": 331768, "epoch": 1974} {"train_loss": -9.258703231811523, "global_step": 331769, "epoch": 1974} {"train_loss": -9.533899307250977, "global_step": 331770, "epoch": 1974} {"train_loss": -7.8648481369018555, "global_step": 331771, "epoch": 1974} {"train_loss": -8.76823616027832, "global_step": 331772, "epoch": 1974} {"train_loss": -10.351773262023926, "global_step": 331773, "epoch": 1974} {"train_loss": -9.297840118408203, "global_step": 331774, "epoch": 1974} {"train_loss": -8.14043140411377, "global_step": 331775, "epoch": 1974} {"train_loss": -10.574935913085938, "global_step": 331776, "epoch": 1974} {"train_loss": -8.734081268310547, "global_step": 331777, "epoch": 1974} {"train_loss": -8.048624038696289, "global_step": 331778, "epoch": 1974} {"train_loss": -10.010941505432129, "global_step": 331779, "epoch": 1974} {"train_loss": -9.742345809936523, "global_step": 331780, "epoch": 1974} {"train_loss": -8.929488182067871, "global_step": 331781, "epoch": 1974} {"train_loss": -9.161598205566406, "global_step": 331782, "epoch": 1974} {"train_loss": -10.769848823547363, "global_step": 331783, "epoch": 1974} {"train_loss": -10.51462459564209, "global_step": 331784, "epoch": 1974} {"train_loss": -9.269749641418457, "global_step": 331785, "epoch": 1974} {"train_loss": -10.334213256835938, "global_step": 331786, "epoch": 1974} {"train_loss": -10.846637725830078, "global_step": 331787, "epoch": 1974} {"train_loss": -10.658191680908203, "global_step": 331788, "epoch": 1974} {"train_loss": -10.481168746948242, "global_step": 331789, "epoch": 1974} {"train_loss": -10.91363525390625, "global_step": 331790, "epoch": 1974} {"train_loss": -10.40157413482666, "global_step": 331791, "epoch": 1974} {"train_loss": -11.034442901611328, "global_step": 331792, "epoch": 1974} {"train_loss": -11.37582015991211, "global_step": 331793, "epoch": 1974} {"train_loss": -10.554405212402344, "global_step": 331794, "epoch": 1974} {"train_loss": -11.64634895324707, "global_step": 331795, "epoch": 1974} {"train_loss": -11.093377113342285, "global_step": 331796, "epoch": 1974} {"train_loss": -11.197633743286133, "global_step": 331797, "epoch": 1974} {"train_loss": -11.107194900512695, "global_step": 331798, "epoch": 1974} {"train_loss": -11.561117921556745, "global_step": 331799, "epoch": 1974, "val_loss": 285158.40625} {"train_loss": -11.774272918701172, "global_step": 331800, "epoch": 1975} {"train_loss": -11.726946830749512, "global_step": 331801, "epoch": 1975} {"train_loss": -11.361662864685059, "global_step": 331802, "epoch": 1975} {"train_loss": -11.600297927856445, "global_step": 331803, "epoch": 1975} {"train_loss": -11.98519515991211, "global_step": 331804, "epoch": 1975} {"train_loss": -11.835999488830566, "global_step": 331805, "epoch": 1975} {"train_loss": -11.679694175720215, "global_step": 331806, "epoch": 1975} {"train_loss": -11.971551895141602, "global_step": 331807, "epoch": 1975} {"train_loss": -11.592424392700195, "global_step": 331808, "epoch": 1975} {"train_loss": -11.779376983642578, "global_step": 331809, "epoch": 1975} {"train_loss": -11.925837516784668, "global_step": 331810, "epoch": 1975} {"train_loss": -11.803243637084961, "global_step": 331811, "epoch": 1975} {"train_loss": -11.9996919631958, "global_step": 331812, "epoch": 1975} {"train_loss": -11.960018157958984, "global_step": 331813, "epoch": 1975} {"train_loss": -11.841521263122559, "global_step": 331814, "epoch": 1975} {"train_loss": -11.80999755859375, "global_step": 331815, "epoch": 1975} {"train_loss": -12.050885200500488, "global_step": 331816, "epoch": 1975} {"train_loss": -12.08245849609375, "global_step": 331817, "epoch": 1975} {"train_loss": -12.102165222167969, "global_step": 331818, "epoch": 1975} {"train_loss": -11.932101249694824, "global_step": 331819, "epoch": 1975} {"train_loss": -12.064666748046875, "global_step": 331820, "epoch": 1975} {"train_loss": -12.09483528137207, "global_step": 331821, "epoch": 1975} {"train_loss": -12.097198486328125, "global_step": 331822, "epoch": 1975} {"train_loss": -11.971481323242188, "global_step": 331823, "epoch": 1975} {"train_loss": -11.955344200134277, "global_step": 331824, "epoch": 1975} {"train_loss": -11.914928436279297, "global_step": 331825, "epoch": 1975} {"train_loss": -12.138834953308105, "global_step": 331826, "epoch": 1975} {"train_loss": -12.255574226379395, "global_step": 331827, "epoch": 1975} {"train_loss": -12.044801712036133, "global_step": 331828, "epoch": 1975} {"train_loss": -12.232804298400879, "global_step": 331829, "epoch": 1975} {"train_loss": -12.283557891845703, "global_step": 331830, "epoch": 1975} {"train_loss": -12.110321998596191, "global_step": 331831, "epoch": 1975} {"train_loss": -12.291157722473145, "global_step": 331832, "epoch": 1975} {"train_loss": -12.025066375732422, "global_step": 331833, "epoch": 1975} {"train_loss": -12.016618728637695, "global_step": 331834, "epoch": 1975} {"train_loss": -12.102806091308594, "global_step": 331835, "epoch": 1975} {"train_loss": -12.18131160736084, "global_step": 331836, "epoch": 1975} {"train_loss": -12.152299880981445, "global_step": 331837, "epoch": 1975} {"train_loss": -12.175840377807617, "global_step": 331838, "epoch": 1975} {"train_loss": -12.228796005249023, "global_step": 331839, "epoch": 1975} {"train_loss": -12.357481002807617, "global_step": 331840, "epoch": 1975} {"train_loss": -12.159378051757812, "global_step": 331841, "epoch": 1975} {"train_loss": -12.350176811218262, "global_step": 331842, "epoch": 1975} {"train_loss": -12.208966255187988, "global_step": 331843, "epoch": 1975} {"train_loss": -12.194161415100098, "global_step": 331844, "epoch": 1975} {"train_loss": -12.360182762145996, "global_step": 331845, "epoch": 1975} {"train_loss": -12.259584426879883, "global_step": 331846, "epoch": 1975} {"train_loss": -12.165283203125, "global_step": 331847, "epoch": 1975} {"train_loss": -12.314807891845703, "global_step": 331848, "epoch": 1975} {"train_loss": -11.98056411743164, "global_step": 331849, "epoch": 1975} {"train_loss": -12.248884201049805, "global_step": 331850, "epoch": 1975} {"train_loss": -12.435954093933105, "global_step": 331851, "epoch": 1975} {"train_loss": -12.46773910522461, "global_step": 331852, "epoch": 1975} {"train_loss": -12.039619445800781, "global_step": 331853, "epoch": 1975} {"train_loss": -12.422801971435547, "global_step": 331854, "epoch": 1975} {"train_loss": -12.315792083740234, "global_step": 331855, "epoch": 1975} {"train_loss": -12.37681770324707, "global_step": 331856, "epoch": 1975} {"train_loss": -12.374977111816406, "global_step": 331857, "epoch": 1975} {"train_loss": -12.382284164428711, "global_step": 331858, "epoch": 1975} {"train_loss": -12.48095417022705, "global_step": 331859, "epoch": 1975} {"train_loss": -12.222325325012207, "global_step": 331860, "epoch": 1975} {"train_loss": -12.542276382446289, "global_step": 331861, "epoch": 1975} {"train_loss": -12.416797637939453, "global_step": 331862, "epoch": 1975} {"train_loss": -12.295553207397461, "global_step": 331863, "epoch": 1975} {"train_loss": -12.399703979492188, "global_step": 331864, "epoch": 1975} {"train_loss": -12.42249870300293, "global_step": 331865, "epoch": 1975} {"train_loss": -12.455148696899414, "global_step": 331866, "epoch": 1975} {"train_loss": -12.458822250366211, "global_step": 331867, "epoch": 1975} {"train_loss": -12.38206672668457, "global_step": 331868, "epoch": 1975} {"train_loss": -12.42483901977539, "global_step": 331869, "epoch": 1975} {"train_loss": -12.449979782104492, "global_step": 331870, "epoch": 1975} {"train_loss": -12.019142150878906, "global_step": 331871, "epoch": 1975} {"train_loss": -12.29561996459961, "global_step": 331872, "epoch": 1975} {"train_loss": -12.339628219604492, "global_step": 331873, "epoch": 1975} {"train_loss": -12.334274291992188, "global_step": 331874, "epoch": 1975} {"train_loss": -12.468366622924805, "global_step": 331875, "epoch": 1975} {"train_loss": -12.518912315368652, "global_step": 331876, "epoch": 1975} {"train_loss": -12.346646308898926, "global_step": 331877, "epoch": 1975} {"train_loss": -12.680727005004883, "global_step": 331878, "epoch": 1975} {"train_loss": -12.372906684875488, "global_step": 331879, "epoch": 1975} {"train_loss": -12.618290901184082, "global_step": 331880, "epoch": 1975} {"train_loss": -12.604371070861816, "global_step": 331881, "epoch": 1975} {"train_loss": -12.664352416992188, "global_step": 331882, "epoch": 1975} {"train_loss": -12.530380249023438, "global_step": 331883, "epoch": 1975} {"train_loss": -12.369300842285156, "global_step": 331884, "epoch": 1975} {"train_loss": -12.601058006286621, "global_step": 331885, "epoch": 1975} {"train_loss": -12.357431411743164, "global_step": 331886, "epoch": 1975} {"train_loss": -12.219026565551758, "global_step": 331887, "epoch": 1975} {"train_loss": -12.378662109375, "global_step": 331888, "epoch": 1975} {"train_loss": -12.25545883178711, "global_step": 331889, "epoch": 1975} {"train_loss": -12.385009765625, "global_step": 331890, "epoch": 1975} {"train_loss": -11.882617950439453, "global_step": 331891, "epoch": 1975} {"train_loss": -12.434652328491211, "global_step": 331892, "epoch": 1975} {"train_loss": -11.750250816345215, "global_step": 331893, "epoch": 1975} {"train_loss": -11.848970413208008, "global_step": 331894, "epoch": 1975} {"train_loss": -11.758848190307617, "global_step": 331895, "epoch": 1975} {"train_loss": -10.869945526123047, "global_step": 331896, "epoch": 1975} {"train_loss": -11.981586456298828, "global_step": 331897, "epoch": 1975} {"train_loss": -12.113689422607422, "global_step": 331898, "epoch": 1975} {"train_loss": -11.840837478637695, "global_step": 331899, "epoch": 1975} {"train_loss": -12.040349960327148, "global_step": 331900, "epoch": 1975} {"train_loss": -12.069633483886719, "global_step": 331901, "epoch": 1975} {"train_loss": -11.678943634033203, "global_step": 331902, "epoch": 1975} {"train_loss": -12.34136962890625, "global_step": 331903, "epoch": 1975} {"train_loss": -12.482281684875488, "global_step": 331904, "epoch": 1975} {"train_loss": -11.794808387756348, "global_step": 331905, "epoch": 1975} {"train_loss": -11.744794845581055, "global_step": 331906, "epoch": 1975} {"train_loss": -11.803077697753906, "global_step": 331907, "epoch": 1975} {"train_loss": -11.748358726501465, "global_step": 331908, "epoch": 1975} {"train_loss": -12.343015670776367, "global_step": 331909, "epoch": 1975} {"train_loss": -11.018437385559082, "global_step": 331910, "epoch": 1975} {"train_loss": -10.887253761291504, "global_step": 331911, "epoch": 1975} {"train_loss": -11.785526275634766, "global_step": 331912, "epoch": 1975} {"train_loss": -10.07055377960205, "global_step": 331913, "epoch": 1975} {"train_loss": -9.893527030944824, "global_step": 331914, "epoch": 1975} {"train_loss": -9.580667495727539, "global_step": 331915, "epoch": 1975} {"train_loss": -11.60651969909668, "global_step": 331916, "epoch": 1975} {"train_loss": -10.495697021484375, "global_step": 331917, "epoch": 1975} {"train_loss": -9.609427452087402, "global_step": 331918, "epoch": 1975} {"train_loss": -9.845629692077637, "global_step": 331919, "epoch": 1975} {"train_loss": -10.11316967010498, "global_step": 331920, "epoch": 1975} {"train_loss": -10.083223342895508, "global_step": 331921, "epoch": 1975} {"train_loss": -10.294132232666016, "global_step": 331922, "epoch": 1975} {"train_loss": -11.319819450378418, "global_step": 331923, "epoch": 1975} {"train_loss": -9.982184410095215, "global_step": 331924, "epoch": 1975} {"train_loss": -10.648995399475098, "global_step": 331925, "epoch": 1975} {"train_loss": -10.968307495117188, "global_step": 331926, "epoch": 1975} {"train_loss": -11.301040649414062, "global_step": 331927, "epoch": 1975} {"train_loss": -10.600947380065918, "global_step": 331928, "epoch": 1975} {"train_loss": -11.136076927185059, "global_step": 331929, "epoch": 1975} {"train_loss": -9.412239074707031, "global_step": 331930, "epoch": 1975} {"train_loss": -10.818441390991211, "global_step": 331931, "epoch": 1975} {"train_loss": -10.537534713745117, "global_step": 331932, "epoch": 1975} {"train_loss": -10.545022010803223, "global_step": 331933, "epoch": 1975} {"train_loss": -10.425813674926758, "global_step": 331934, "epoch": 1975} {"train_loss": -10.983053207397461, "global_step": 331935, "epoch": 1975} {"train_loss": -10.71394157409668, "global_step": 331936, "epoch": 1975} {"train_loss": -11.52457332611084, "global_step": 331937, "epoch": 1975} {"train_loss": -10.774463653564453, "global_step": 331938, "epoch": 1975} {"train_loss": -11.821612358093262, "global_step": 331939, "epoch": 1975} {"train_loss": -11.219035148620605, "global_step": 331940, "epoch": 1975} {"train_loss": -11.244290351867676, "global_step": 331941, "epoch": 1975} {"train_loss": -11.780374526977539, "global_step": 331942, "epoch": 1975} {"train_loss": -11.533841133117676, "global_step": 331943, "epoch": 1975} {"train_loss": -11.3449068069458, "global_step": 331944, "epoch": 1975} {"train_loss": -11.26285171508789, "global_step": 331945, "epoch": 1975} {"train_loss": -10.413398742675781, "global_step": 331946, "epoch": 1975} {"train_loss": -11.916759490966797, "global_step": 331947, "epoch": 1975} {"train_loss": -10.892685890197754, "global_step": 331948, "epoch": 1975} {"train_loss": -10.890300750732422, "global_step": 331949, "epoch": 1975} {"train_loss": -11.425304412841797, "global_step": 331950, "epoch": 1975} {"train_loss": -10.886468887329102, "global_step": 331951, "epoch": 1975} {"train_loss": -10.879980087280273, "global_step": 331952, "epoch": 1975} {"train_loss": -11.50953197479248, "global_step": 331953, "epoch": 1975} {"train_loss": -11.61612319946289, "global_step": 331954, "epoch": 1975} {"train_loss": -10.945306777954102, "global_step": 331955, "epoch": 1975} {"train_loss": -11.599312782287598, "global_step": 331956, "epoch": 1975} {"train_loss": -11.249773979187012, "global_step": 331957, "epoch": 1975} {"train_loss": -11.733392715454102, "global_step": 331958, "epoch": 1975} {"train_loss": -11.729575157165527, "global_step": 331959, "epoch": 1975} {"train_loss": -11.646111488342285, "global_step": 331960, "epoch": 1975} {"train_loss": -11.468107223510742, "global_step": 331961, "epoch": 1975} {"train_loss": -11.58480453491211, "global_step": 331962, "epoch": 1975} {"train_loss": -11.624536514282227, "global_step": 331963, "epoch": 1975} {"train_loss": -11.744688034057617, "global_step": 331964, "epoch": 1975} {"train_loss": -11.717622756958008, "global_step": 331965, "epoch": 1975} {"train_loss": -11.706832885742188, "global_step": 331966, "epoch": 1975} {"train_loss": -11.753975646836418, "global_step": 331967, "epoch": 1975, "val_loss": 285670.4375, "train_action_mse_error": 1.673933982849121} {"train_loss": -11.979373931884766, "global_step": 331968, "epoch": 1976} {"train_loss": -11.629600524902344, "global_step": 331969, "epoch": 1976} {"train_loss": -11.872482299804688, "global_step": 331970, "epoch": 1976} {"train_loss": -11.86080551147461, "global_step": 331971, "epoch": 1976} {"train_loss": -11.737096786499023, "global_step": 331972, "epoch": 1976} {"train_loss": -11.871915817260742, "global_step": 331973, "epoch": 1976} {"train_loss": -11.814184188842773, "global_step": 331974, "epoch": 1976} {"train_loss": -12.042351722717285, "global_step": 331975, "epoch": 1976} {"train_loss": -11.993992805480957, "global_step": 331976, "epoch": 1976} {"train_loss": -12.091012954711914, "global_step": 331977, "epoch": 1976} {"train_loss": -12.046157836914062, "global_step": 331978, "epoch": 1976} {"train_loss": -11.811601638793945, "global_step": 331979, "epoch": 1976} {"train_loss": -12.043752670288086, "global_step": 331980, "epoch": 1976} {"train_loss": -11.998398780822754, "global_step": 331981, "epoch": 1976} {"train_loss": -11.848644256591797, "global_step": 331982, "epoch": 1976} {"train_loss": -12.034177780151367, "global_step": 331983, "epoch": 1976} {"train_loss": -11.61469841003418, "global_step": 331984, "epoch": 1976} {"train_loss": -12.066116333007812, "global_step": 331985, "epoch": 1976} {"train_loss": -11.836882591247559, "global_step": 331986, "epoch": 1976} {"train_loss": -11.929216384887695, "global_step": 331987, "epoch": 1976} {"train_loss": -11.91739273071289, "global_step": 331988, "epoch": 1976} {"train_loss": -12.086141586303711, "global_step": 331989, "epoch": 1976} {"train_loss": -11.661759376525879, "global_step": 331990, "epoch": 1976} {"train_loss": -12.15958023071289, "global_step": 331991, "epoch": 1976} {"train_loss": -11.723344802856445, "global_step": 331992, "epoch": 1976} {"train_loss": -12.183940887451172, "global_step": 331993, "epoch": 1976} {"train_loss": -12.094710350036621, "global_step": 331994, "epoch": 1976} {"train_loss": -11.938097953796387, "global_step": 331995, "epoch": 1976} {"train_loss": -12.176668167114258, "global_step": 331996, "epoch": 1976} {"train_loss": -12.29928207397461, "global_step": 331997, "epoch": 1976} {"train_loss": -12.191719055175781, "global_step": 331998, "epoch": 1976} {"train_loss": -12.253963470458984, "global_step": 331999, "epoch": 1976} {"train_loss": -12.19540786743164, "global_step": 332000, "epoch": 1976} {"train_loss": -12.224090576171875, "global_step": 332001, "epoch": 1976} {"train_loss": -12.2161865234375, "global_step": 332002, "epoch": 1976} {"train_loss": -12.26667594909668, "global_step": 332003, "epoch": 1976} {"train_loss": -12.201437950134277, "global_step": 332004, "epoch": 1976} {"train_loss": -12.361028671264648, "global_step": 332005, "epoch": 1976} {"train_loss": -12.313446044921875, "global_step": 332006, "epoch": 1976} {"train_loss": -12.281866073608398, "global_step": 332007, "epoch": 1976} {"train_loss": -12.051237106323242, "global_step": 332008, "epoch": 1976} {"train_loss": -12.393462181091309, "global_step": 332009, "epoch": 1976} {"train_loss": -12.29729175567627, "global_step": 332010, "epoch": 1976} {"train_loss": -12.24998950958252, "global_step": 332011, "epoch": 1976} {"train_loss": -12.430737495422363, "global_step": 332012, "epoch": 1976} {"train_loss": -12.274740219116211, "global_step": 332013, "epoch": 1976} {"train_loss": -12.190070152282715, "global_step": 332014, "epoch": 1976} {"train_loss": -12.363420486450195, "global_step": 332015, "epoch": 1976} {"train_loss": -12.411059379577637, "global_step": 332016, "epoch": 1976} {"train_loss": -12.073945999145508, "global_step": 332017, "epoch": 1976} {"train_loss": -12.134126663208008, "global_step": 332018, "epoch": 1976} {"train_loss": -12.275848388671875, "global_step": 332019, "epoch": 1976} {"train_loss": -12.204015731811523, "global_step": 332020, "epoch": 1976} {"train_loss": -12.320056915283203, "global_step": 332021, "epoch": 1976} {"train_loss": -12.608602523803711, "global_step": 332022, "epoch": 1976} {"train_loss": -12.474061965942383, "global_step": 332023, "epoch": 1976} {"train_loss": -12.498456954956055, "global_step": 332024, "epoch": 1976} {"train_loss": -12.613052368164062, "global_step": 332025, "epoch": 1976} {"train_loss": -12.378820419311523, "global_step": 332026, "epoch": 1976} {"train_loss": -12.532732963562012, "global_step": 332027, "epoch": 1976} {"train_loss": -12.317739486694336, "global_step": 332028, "epoch": 1976} {"train_loss": -12.421470642089844, "global_step": 332029, "epoch": 1976} {"train_loss": -12.473516464233398, "global_step": 332030, "epoch": 1976} {"train_loss": -12.50969123840332, "global_step": 332031, "epoch": 1976} {"train_loss": -12.540474891662598, "global_step": 332032, "epoch": 1976} {"train_loss": -12.451245307922363, "global_step": 332033, "epoch": 1976} {"train_loss": -12.233959197998047, "global_step": 332034, "epoch": 1976} {"train_loss": -11.733607292175293, "global_step": 332035, "epoch": 1976} {"train_loss": -12.287567138671875, "global_step": 332036, "epoch": 1976} {"train_loss": -12.48483657836914, "global_step": 332037, "epoch": 1976} {"train_loss": -11.938448905944824, "global_step": 332038, "epoch": 1976} {"train_loss": -11.063421249389648, "global_step": 332039, "epoch": 1976} {"train_loss": -11.224997520446777, "global_step": 332040, "epoch": 1976} {"train_loss": -12.14822769165039, "global_step": 332041, "epoch": 1976} {"train_loss": -11.33250904083252, "global_step": 332042, "epoch": 1976} {"train_loss": -11.281728744506836, "global_step": 332043, "epoch": 1976} {"train_loss": -12.434980392456055, "global_step": 332044, "epoch": 1976} {"train_loss": -11.362825393676758, "global_step": 332045, "epoch": 1976} {"train_loss": -10.453224182128906, "global_step": 332046, "epoch": 1976} {"train_loss": -12.07200813293457, "global_step": 332047, "epoch": 1976} {"train_loss": -10.164632797241211, "global_step": 332048, "epoch": 1976} {"train_loss": -11.758440017700195, "global_step": 332049, "epoch": 1976} {"train_loss": -10.955008506774902, "global_step": 332050, "epoch": 1976} {"train_loss": -10.931472778320312, "global_step": 332051, "epoch": 1976} {"train_loss": -11.02631950378418, "global_step": 332052, "epoch": 1976} {"train_loss": -9.917356491088867, "global_step": 332053, "epoch": 1976} {"train_loss": -11.877603530883789, "global_step": 332054, "epoch": 1976} {"train_loss": -10.470514297485352, "global_step": 332055, "epoch": 1976} {"train_loss": -11.241741180419922, "global_step": 332056, "epoch": 1976} {"train_loss": -10.79116153717041, "global_step": 332057, "epoch": 1976} {"train_loss": -11.800883293151855, "global_step": 332058, "epoch": 1976} {"train_loss": -10.923931121826172, "global_step": 332059, "epoch": 1976} {"train_loss": -10.965561866760254, "global_step": 332060, "epoch": 1976} {"train_loss": -11.213123321533203, "global_step": 332061, "epoch": 1976} {"train_loss": -11.419596672058105, "global_step": 332062, "epoch": 1976} {"train_loss": -11.469600677490234, "global_step": 332063, "epoch": 1976} {"train_loss": -11.294496536254883, "global_step": 332064, "epoch": 1976} {"train_loss": -11.496570587158203, "global_step": 332065, "epoch": 1976} {"train_loss": -11.618359565734863, "global_step": 332066, "epoch": 1976} {"train_loss": -12.316324234008789, "global_step": 332067, "epoch": 1976} {"train_loss": -12.275154113769531, "global_step": 332068, "epoch": 1976} {"train_loss": -12.072278022766113, "global_step": 332069, "epoch": 1976} {"train_loss": -12.277202606201172, "global_step": 332070, "epoch": 1976} {"train_loss": -12.064172744750977, "global_step": 332071, "epoch": 1976} {"train_loss": -12.190287590026855, "global_step": 332072, "epoch": 1976} {"train_loss": -12.082634925842285, "global_step": 332073, "epoch": 1976} {"train_loss": -12.337373733520508, "global_step": 332074, "epoch": 1976} {"train_loss": -12.308841705322266, "global_step": 332075, "epoch": 1976} {"train_loss": -12.107149124145508, "global_step": 332076, "epoch": 1976} {"train_loss": -12.31121826171875, "global_step": 332077, "epoch": 1976} {"train_loss": -12.31873893737793, "global_step": 332078, "epoch": 1976} {"train_loss": -12.265581130981445, "global_step": 332079, "epoch": 1976} {"train_loss": -12.0692138671875, "global_step": 332080, "epoch": 1976} {"train_loss": -12.345216751098633, "global_step": 332081, "epoch": 1976} {"train_loss": -12.261497497558594, "global_step": 332082, "epoch": 1976} {"train_loss": -12.372991561889648, "global_step": 332083, "epoch": 1976} {"train_loss": -12.271527290344238, "global_step": 332084, "epoch": 1976} {"train_loss": -12.005868911743164, "global_step": 332085, "epoch": 1976} {"train_loss": -12.187307357788086, "global_step": 332086, "epoch": 1976} {"train_loss": -12.222476959228516, "global_step": 332087, "epoch": 1976} {"train_loss": -12.225271224975586, "global_step": 332088, "epoch": 1976} {"train_loss": -12.017288208007812, "global_step": 332089, "epoch": 1976} {"train_loss": -12.457710266113281, "global_step": 332090, "epoch": 1976} {"train_loss": -12.262632369995117, "global_step": 332091, "epoch": 1976} {"train_loss": -12.463631629943848, "global_step": 332092, "epoch": 1976} {"train_loss": -12.168068885803223, "global_step": 332093, "epoch": 1976} {"train_loss": -12.456287384033203, "global_step": 332094, "epoch": 1976} {"train_loss": -12.467374801635742, "global_step": 332095, "epoch": 1976} {"train_loss": -12.334394454956055, "global_step": 332096, "epoch": 1976} {"train_loss": -12.485081672668457, "global_step": 332097, "epoch": 1976} {"train_loss": -12.22840690612793, "global_step": 332098, "epoch": 1976} {"train_loss": -12.593667984008789, "global_step": 332099, "epoch": 1976} {"train_loss": -12.319267272949219, "global_step": 332100, "epoch": 1976} {"train_loss": -12.66911506652832, "global_step": 332101, "epoch": 1976} {"train_loss": -12.32142162322998, "global_step": 332102, "epoch": 1976} {"train_loss": -12.451953887939453, "global_step": 332103, "epoch": 1976} {"train_loss": -12.372060775756836, "global_step": 332104, "epoch": 1976} {"train_loss": -12.36135482788086, "global_step": 332105, "epoch": 1976} {"train_loss": -12.543985366821289, "global_step": 332106, "epoch": 1976} {"train_loss": -12.33395767211914, "global_step": 332107, "epoch": 1976} {"train_loss": -12.620758056640625, "global_step": 332108, "epoch": 1976} {"train_loss": -12.204692840576172, "global_step": 332109, "epoch": 1976} {"train_loss": -12.507848739624023, "global_step": 332110, "epoch": 1976} {"train_loss": -12.488945007324219, "global_step": 332111, "epoch": 1976} {"train_loss": -12.655071258544922, "global_step": 332112, "epoch": 1976} {"train_loss": -12.649675369262695, "global_step": 332113, "epoch": 1976} {"train_loss": -12.541210174560547, "global_step": 332114, "epoch": 1976} {"train_loss": -12.558401107788086, "global_step": 332115, "epoch": 1976} {"train_loss": -12.44968318939209, "global_step": 332116, "epoch": 1976} {"train_loss": -12.633306503295898, "global_step": 332117, "epoch": 1976} {"train_loss": -12.899009704589844, "global_step": 332118, "epoch": 1976} {"train_loss": -12.362589836120605, "global_step": 332119, "epoch": 1976} {"train_loss": -12.372085571289062, "global_step": 332120, "epoch": 1976} {"train_loss": -12.302637100219727, "global_step": 332121, "epoch": 1976} {"train_loss": -12.031972885131836, "global_step": 332122, "epoch": 1976} {"train_loss": -11.144386291503906, "global_step": 332123, "epoch": 1976} {"train_loss": -11.388326644897461, "global_step": 332124, "epoch": 1976} {"train_loss": -10.82934284210205, "global_step": 332125, "epoch": 1976} {"train_loss": -11.708609580993652, "global_step": 332126, "epoch": 1976} {"train_loss": -11.950094223022461, "global_step": 332127, "epoch": 1976} {"train_loss": -9.882912635803223, "global_step": 332128, "epoch": 1976} {"train_loss": -11.303628921508789, "global_step": 332129, "epoch": 1976} {"train_loss": -8.600138664245605, "global_step": 332130, "epoch": 1976} {"train_loss": -9.847904205322266, "global_step": 332131, "epoch": 1976} {"train_loss": -10.566692352294922, "global_step": 332132, "epoch": 1976} {"train_loss": -9.513681411743164, "global_step": 332133, "epoch": 1976} {"train_loss": -10.868377685546875, "global_step": 332134, "epoch": 1976} {"train_loss": -11.947593456222897, "global_step": 332135, "epoch": 1976, "val_loss": 283889.875} {"train_loss": -9.698810577392578, "global_step": 332136, "epoch": 1977} {"train_loss": -10.98115062713623, "global_step": 332137, "epoch": 1977} {"train_loss": -9.675273895263672, "global_step": 332138, "epoch": 1977} {"train_loss": -9.911240577697754, "global_step": 332139, "epoch": 1977} {"train_loss": -10.838563919067383, "global_step": 332140, "epoch": 1977} {"train_loss": -9.926151275634766, "global_step": 332141, "epoch": 1977} {"train_loss": -10.492969512939453, "global_step": 332142, "epoch": 1977} {"train_loss": -10.993249893188477, "global_step": 332143, "epoch": 1977} {"train_loss": -10.353212356567383, "global_step": 332144, "epoch": 1977} {"train_loss": -10.350478172302246, "global_step": 332145, "epoch": 1977} {"train_loss": -11.022175788879395, "global_step": 332146, "epoch": 1977} {"train_loss": -10.0238618850708, "global_step": 332147, "epoch": 1977} {"train_loss": -11.42681884765625, "global_step": 332148, "epoch": 1977} {"train_loss": -10.687036514282227, "global_step": 332149, "epoch": 1977} {"train_loss": -11.73671817779541, "global_step": 332150, "epoch": 1977} {"train_loss": -11.308504104614258, "global_step": 332151, "epoch": 1977} {"train_loss": -11.34517765045166, "global_step": 332152, "epoch": 1977} {"train_loss": -11.872589111328125, "global_step": 332153, "epoch": 1977} {"train_loss": -11.254720687866211, "global_step": 332154, "epoch": 1977} {"train_loss": -11.874002456665039, "global_step": 332155, "epoch": 1977} {"train_loss": -11.335679054260254, "global_step": 332156, "epoch": 1977} {"train_loss": -11.867246627807617, "global_step": 332157, "epoch": 1977} {"train_loss": -11.432499885559082, "global_step": 332158, "epoch": 1977} {"train_loss": -11.573641777038574, "global_step": 332159, "epoch": 1977} {"train_loss": -11.764860153198242, "global_step": 332160, "epoch": 1977} {"train_loss": -11.576412200927734, "global_step": 332161, "epoch": 1977} {"train_loss": -12.055170059204102, "global_step": 332162, "epoch": 1977} {"train_loss": -11.938520431518555, "global_step": 332163, "epoch": 1977} {"train_loss": -11.847488403320312, "global_step": 332164, "epoch": 1977} {"train_loss": -12.04696273803711, "global_step": 332165, "epoch": 1977} {"train_loss": -11.944365501403809, "global_step": 332166, "epoch": 1977} {"train_loss": -11.81603717803955, "global_step": 332167, "epoch": 1977} {"train_loss": -11.570996284484863, "global_step": 332168, "epoch": 1977} {"train_loss": -11.889734268188477, "global_step": 332169, "epoch": 1977} {"train_loss": -11.609127044677734, "global_step": 332170, "epoch": 1977} {"train_loss": -11.918473243713379, "global_step": 332171, "epoch": 1977} {"train_loss": -12.043192863464355, "global_step": 332172, "epoch": 1977} {"train_loss": -12.10460090637207, "global_step": 332173, "epoch": 1977} {"train_loss": -12.190160751342773, "global_step": 332174, "epoch": 1977} {"train_loss": -11.809187889099121, "global_step": 332175, "epoch": 1977} {"train_loss": -12.248340606689453, "global_step": 332176, "epoch": 1977} {"train_loss": -11.695998191833496, "global_step": 332177, "epoch": 1977} {"train_loss": -11.92642593383789, "global_step": 332178, "epoch": 1977} {"train_loss": -11.892641067504883, "global_step": 332179, "epoch": 1977} {"train_loss": -11.477973937988281, "global_step": 332180, "epoch": 1977} {"train_loss": -11.61910629272461, "global_step": 332181, "epoch": 1977} {"train_loss": -11.476560592651367, "global_step": 332182, "epoch": 1977} {"train_loss": -11.511897087097168, "global_step": 332183, "epoch": 1977} {"train_loss": -11.817495346069336, "global_step": 332184, "epoch": 1977} {"train_loss": -11.438909530639648, "global_step": 332185, "epoch": 1977} {"train_loss": -12.036067962646484, "global_step": 332186, "epoch": 1977} {"train_loss": -12.074991226196289, "global_step": 332187, "epoch": 1977} {"train_loss": -11.967795372009277, "global_step": 332188, "epoch": 1977} {"train_loss": -12.333589553833008, "global_step": 332189, "epoch": 1977} {"train_loss": -12.118711471557617, "global_step": 332190, "epoch": 1977} {"train_loss": -12.247917175292969, "global_step": 332191, "epoch": 1977} {"train_loss": -12.162041664123535, "global_step": 332192, "epoch": 1977} {"train_loss": -12.190561294555664, "global_step": 332193, "epoch": 1977} {"train_loss": -12.19601821899414, "global_step": 332194, "epoch": 1977} {"train_loss": -12.202383041381836, "global_step": 332195, "epoch": 1977} {"train_loss": -12.161815643310547, "global_step": 332196, "epoch": 1977} {"train_loss": -12.247342109680176, "global_step": 332197, "epoch": 1977} {"train_loss": -12.0790376663208, "global_step": 332198, "epoch": 1977} {"train_loss": -12.317806243896484, "global_step": 332199, "epoch": 1977} {"train_loss": -12.311759948730469, "global_step": 332200, "epoch": 1977} {"train_loss": -11.988860130310059, "global_step": 332201, "epoch": 1977} {"train_loss": -12.166770935058594, "global_step": 332202, "epoch": 1977} {"train_loss": -12.332449913024902, "global_step": 332203, "epoch": 1977} {"train_loss": -12.296878814697266, "global_step": 332204, "epoch": 1977} {"train_loss": -12.492494583129883, "global_step": 332205, "epoch": 1977} {"train_loss": -12.420225143432617, "global_step": 332206, "epoch": 1977} {"train_loss": -12.360306739807129, "global_step": 332207, "epoch": 1977} {"train_loss": -12.472026824951172, "global_step": 332208, "epoch": 1977} {"train_loss": -12.357295989990234, "global_step": 332209, "epoch": 1977} {"train_loss": -12.40468692779541, "global_step": 332210, "epoch": 1977} {"train_loss": -12.19604206085205, "global_step": 332211, "epoch": 1977} {"train_loss": -12.266525268554688, "global_step": 332212, "epoch": 1977} {"train_loss": -12.206787109375, "global_step": 332213, "epoch": 1977} {"train_loss": -12.291040420532227, "global_step": 332214, "epoch": 1977} {"train_loss": -12.61864185333252, "global_step": 332215, "epoch": 1977} {"train_loss": -12.385832786560059, "global_step": 332216, "epoch": 1977} {"train_loss": -12.364221572875977, "global_step": 332217, "epoch": 1977} {"train_loss": -12.496055603027344, "global_step": 332218, "epoch": 1977} {"train_loss": -12.346007347106934, "global_step": 332219, "epoch": 1977} {"train_loss": -12.361759185791016, "global_step": 332220, "epoch": 1977} {"train_loss": -12.67823314666748, "global_step": 332221, "epoch": 1977} {"train_loss": -12.082246780395508, "global_step": 332222, "epoch": 1977} {"train_loss": -12.53816032409668, "global_step": 332223, "epoch": 1977} {"train_loss": -12.432449340820312, "global_step": 332224, "epoch": 1977} {"train_loss": -12.535551071166992, "global_step": 332225, "epoch": 1977} {"train_loss": -12.67276382446289, "global_step": 332226, "epoch": 1977} {"train_loss": -12.592732429504395, "global_step": 332227, "epoch": 1977} {"train_loss": -12.407306671142578, "global_step": 332228, "epoch": 1977} {"train_loss": -12.692015647888184, "global_step": 332229, "epoch": 1977} {"train_loss": -12.586862564086914, "global_step": 332230, "epoch": 1977} {"train_loss": -12.654498100280762, "global_step": 332231, "epoch": 1977} {"train_loss": -12.63058853149414, "global_step": 332232, "epoch": 1977} {"train_loss": -12.565214157104492, "global_step": 332233, "epoch": 1977} {"train_loss": -12.535188674926758, "global_step": 332234, "epoch": 1977} {"train_loss": -12.59898853302002, "global_step": 332235, "epoch": 1977} {"train_loss": -12.57928466796875, "global_step": 332236, "epoch": 1977} {"train_loss": -12.639362335205078, "global_step": 332237, "epoch": 1977} {"train_loss": -12.573455810546875, "global_step": 332238, "epoch": 1977} {"train_loss": -12.8028564453125, "global_step": 332239, "epoch": 1977} {"train_loss": -12.50911808013916, "global_step": 332240, "epoch": 1977} {"train_loss": -12.606517791748047, "global_step": 332241, "epoch": 1977} {"train_loss": -12.50600814819336, "global_step": 332242, "epoch": 1977} {"train_loss": -12.561935424804688, "global_step": 332243, "epoch": 1977} {"train_loss": -12.525261878967285, "global_step": 332244, "epoch": 1977} {"train_loss": -12.224457740783691, "global_step": 332245, "epoch": 1977} {"train_loss": -12.35836410522461, "global_step": 332246, "epoch": 1977} {"train_loss": -12.528607368469238, "global_step": 332247, "epoch": 1977} {"train_loss": -11.416608810424805, "global_step": 332248, "epoch": 1977} {"train_loss": -11.193453788757324, "global_step": 332249, "epoch": 1977} {"train_loss": -12.090875625610352, "global_step": 332250, "epoch": 1977} {"train_loss": -11.147404670715332, "global_step": 332251, "epoch": 1977} {"train_loss": -11.293804168701172, "global_step": 332252, "epoch": 1977} {"train_loss": -10.028867721557617, "global_step": 332253, "epoch": 1977} {"train_loss": -10.469348907470703, "global_step": 332254, "epoch": 1977} {"train_loss": -11.490070343017578, "global_step": 332255, "epoch": 1977} {"train_loss": -9.88298511505127, "global_step": 332256, "epoch": 1977} {"train_loss": -11.64181137084961, "global_step": 332257, "epoch": 1977} {"train_loss": -11.518450736999512, "global_step": 332258, "epoch": 1977} {"train_loss": -9.54351806640625, "global_step": 332259, "epoch": 1977} {"train_loss": -11.51588249206543, "global_step": 332260, "epoch": 1977} {"train_loss": -8.867593765258789, "global_step": 332261, "epoch": 1977} {"train_loss": -11.574739456176758, "global_step": 332262, "epoch": 1977} {"train_loss": -10.481485366821289, "global_step": 332263, "epoch": 1977} {"train_loss": -10.402624130249023, "global_step": 332264, "epoch": 1977} {"train_loss": -11.158507347106934, "global_step": 332265, "epoch": 1977} {"train_loss": -7.860411643981934, "global_step": 332266, "epoch": 1977} {"train_loss": -11.796222686767578, "global_step": 332267, "epoch": 1977} {"train_loss": -9.12169361114502, "global_step": 332268, "epoch": 1977} {"train_loss": -10.500448226928711, "global_step": 332269, "epoch": 1977} {"train_loss": -9.309954643249512, "global_step": 332270, "epoch": 1977} {"train_loss": -11.776702880859375, "global_step": 332271, "epoch": 1977} {"train_loss": -10.247869491577148, "global_step": 332272, "epoch": 1977} {"train_loss": -11.197970390319824, "global_step": 332273, "epoch": 1977} {"train_loss": -10.769408226013184, "global_step": 332274, "epoch": 1977} {"train_loss": -9.982633590698242, "global_step": 332275, "epoch": 1977} {"train_loss": -11.750636100769043, "global_step": 332276, "epoch": 1977} {"train_loss": -10.871681213378906, "global_step": 332277, "epoch": 1977} {"train_loss": -11.618670463562012, "global_step": 332278, "epoch": 1977} {"train_loss": -10.799363136291504, "global_step": 332279, "epoch": 1977} {"train_loss": -11.568020820617676, "global_step": 332280, "epoch": 1977} {"train_loss": -11.455493927001953, "global_step": 332281, "epoch": 1977} {"train_loss": -11.34523868560791, "global_step": 332282, "epoch": 1977} {"train_loss": -11.657543182373047, "global_step": 332283, "epoch": 1977} {"train_loss": -11.555994033813477, "global_step": 332284, "epoch": 1977} {"train_loss": -11.477621078491211, "global_step": 332285, "epoch": 1977} {"train_loss": -11.818880081176758, "global_step": 332286, "epoch": 1977} {"train_loss": -11.58740234375, "global_step": 332287, "epoch": 1977} {"train_loss": -11.855607986450195, "global_step": 332288, "epoch": 1977} {"train_loss": -12.090995788574219, "global_step": 332289, "epoch": 1977} {"train_loss": -12.00684642791748, "global_step": 332290, "epoch": 1977} {"train_loss": -12.041313171386719, "global_step": 332291, "epoch": 1977} {"train_loss": -12.027069091796875, "global_step": 332292, "epoch": 1977} {"train_loss": -11.85562515258789, "global_step": 332293, "epoch": 1977} {"train_loss": -11.823148727416992, "global_step": 332294, "epoch": 1977} {"train_loss": -11.967493057250977, "global_step": 332295, "epoch": 1977} {"train_loss": -12.01619815826416, "global_step": 332296, "epoch": 1977} {"train_loss": -12.24991512298584, "global_step": 332297, "epoch": 1977} {"train_loss": -11.96236801147461, "global_step": 332298, "epoch": 1977} {"train_loss": -12.132819175720215, "global_step": 332299, "epoch": 1977} {"train_loss": -12.186422348022461, "global_step": 332300, "epoch": 1977} {"train_loss": -11.877906799316406, "global_step": 332301, "epoch": 1977} {"train_loss": -12.119290351867676, "global_step": 332302, "epoch": 1977} {"train_loss": -11.699023797398521, "global_step": 332303, "epoch": 1977, "val_loss": 289382.59375} {"train_loss": -12.162343978881836, "global_step": 332304, "epoch": 1978} {"train_loss": -12.194839477539062, "global_step": 332305, "epoch": 1978} {"train_loss": -12.077896118164062, "global_step": 332306, "epoch": 1978} {"train_loss": -12.35861873626709, "global_step": 332307, "epoch": 1978} {"train_loss": -12.1547212600708, "global_step": 332308, "epoch": 1978} {"train_loss": -12.17737865447998, "global_step": 332309, "epoch": 1978} {"train_loss": -12.045135498046875, "global_step": 332310, "epoch": 1978} {"train_loss": -12.082412719726562, "global_step": 332311, "epoch": 1978} {"train_loss": -12.22222900390625, "global_step": 332312, "epoch": 1978} {"train_loss": -11.962149620056152, "global_step": 332313, "epoch": 1978} {"train_loss": -12.14566707611084, "global_step": 332314, "epoch": 1978} {"train_loss": -12.300573348999023, "global_step": 332315, "epoch": 1978} {"train_loss": -12.093282699584961, "global_step": 332316, "epoch": 1978} {"train_loss": -12.462299346923828, "global_step": 332317, "epoch": 1978} {"train_loss": -12.185077667236328, "global_step": 332318, "epoch": 1978} {"train_loss": -12.227869033813477, "global_step": 332319, "epoch": 1978} {"train_loss": -12.058738708496094, "global_step": 332320, "epoch": 1978} {"train_loss": -12.139217376708984, "global_step": 332321, "epoch": 1978} {"train_loss": -12.392887115478516, "global_step": 332322, "epoch": 1978} {"train_loss": -12.031792640686035, "global_step": 332323, "epoch": 1978} {"train_loss": -12.458281517028809, "global_step": 332324, "epoch": 1978} {"train_loss": -12.10582160949707, "global_step": 332325, "epoch": 1978} {"train_loss": -12.201460838317871, "global_step": 332326, "epoch": 1978} {"train_loss": -12.262149810791016, "global_step": 332327, "epoch": 1978} {"train_loss": -12.165312767028809, "global_step": 332328, "epoch": 1978} {"train_loss": -12.122230529785156, "global_step": 332329, "epoch": 1978} {"train_loss": -12.621125221252441, "global_step": 332330, "epoch": 1978} {"train_loss": -12.036674499511719, "global_step": 332331, "epoch": 1978} {"train_loss": -12.741643905639648, "global_step": 332332, "epoch": 1978} {"train_loss": -12.231061935424805, "global_step": 332333, "epoch": 1978} {"train_loss": -12.212821006774902, "global_step": 332334, "epoch": 1978} {"train_loss": -12.472921371459961, "global_step": 332335, "epoch": 1978} {"train_loss": -12.430185317993164, "global_step": 332336, "epoch": 1978} {"train_loss": -12.36099624633789, "global_step": 332337, "epoch": 1978} {"train_loss": -12.39195442199707, "global_step": 332338, "epoch": 1978} {"train_loss": -12.234273910522461, "global_step": 332339, "epoch": 1978} {"train_loss": -12.432780265808105, "global_step": 332340, "epoch": 1978} {"train_loss": -12.368837356567383, "global_step": 332341, "epoch": 1978} {"train_loss": -12.550819396972656, "global_step": 332342, "epoch": 1978} {"train_loss": -12.245686531066895, "global_step": 332343, "epoch": 1978} {"train_loss": -12.701784133911133, "global_step": 332344, "epoch": 1978} {"train_loss": -11.945754051208496, "global_step": 332345, "epoch": 1978} {"train_loss": -12.223071098327637, "global_step": 332346, "epoch": 1978} {"train_loss": -11.981361389160156, "global_step": 332347, "epoch": 1978} {"train_loss": -12.530082702636719, "global_step": 332348, "epoch": 1978} {"train_loss": -11.973402976989746, "global_step": 332349, "epoch": 1978} {"train_loss": -12.571895599365234, "global_step": 332350, "epoch": 1978} {"train_loss": -12.501193046569824, "global_step": 332351, "epoch": 1978} {"train_loss": -12.575166702270508, "global_step": 332352, "epoch": 1978} {"train_loss": -12.191014289855957, "global_step": 332353, "epoch": 1978} {"train_loss": -12.367485046386719, "global_step": 332354, "epoch": 1978} {"train_loss": -12.612161636352539, "global_step": 332355, "epoch": 1978} {"train_loss": -12.556840896606445, "global_step": 332356, "epoch": 1978} {"train_loss": -12.278570175170898, "global_step": 332357, "epoch": 1978} {"train_loss": -12.468652725219727, "global_step": 332358, "epoch": 1978} {"train_loss": -12.584173202514648, "global_step": 332359, "epoch": 1978} {"train_loss": -12.482078552246094, "global_step": 332360, "epoch": 1978} {"train_loss": -12.426387786865234, "global_step": 332361, "epoch": 1978} {"train_loss": -12.637985229492188, "global_step": 332362, "epoch": 1978} {"train_loss": -12.440969467163086, "global_step": 332363, "epoch": 1978} {"train_loss": -12.267559051513672, "global_step": 332364, "epoch": 1978} {"train_loss": -12.194228172302246, "global_step": 332365, "epoch": 1978} {"train_loss": -12.427484512329102, "global_step": 332366, "epoch": 1978} {"train_loss": -12.544955253601074, "global_step": 332367, "epoch": 1978} {"train_loss": -11.606203079223633, "global_step": 332368, "epoch": 1978} {"train_loss": -11.367307662963867, "global_step": 332369, "epoch": 1978} {"train_loss": -12.180770874023438, "global_step": 332370, "epoch": 1978} {"train_loss": -12.48434066772461, "global_step": 332371, "epoch": 1978} {"train_loss": -11.977588653564453, "global_step": 332372, "epoch": 1978} {"train_loss": -11.87518310546875, "global_step": 332373, "epoch": 1978} {"train_loss": -12.309904098510742, "global_step": 332374, "epoch": 1978} {"train_loss": -12.32594108581543, "global_step": 332375, "epoch": 1978} {"train_loss": -12.19480037689209, "global_step": 332376, "epoch": 1978} {"train_loss": -12.411964416503906, "global_step": 332377, "epoch": 1978} {"train_loss": -12.144283294677734, "global_step": 332378, "epoch": 1978} {"train_loss": -12.345504760742188, "global_step": 332379, "epoch": 1978} {"train_loss": -12.435697555541992, "global_step": 332380, "epoch": 1978} {"train_loss": -11.440818786621094, "global_step": 332381, "epoch": 1978} {"train_loss": -12.206607818603516, "global_step": 332382, "epoch": 1978} {"train_loss": -12.365578651428223, "global_step": 332383, "epoch": 1978} {"train_loss": -12.136646270751953, "global_step": 332384, "epoch": 1978} {"train_loss": -12.210933685302734, "global_step": 332385, "epoch": 1978} {"train_loss": -12.525946617126465, "global_step": 332386, "epoch": 1978} {"train_loss": -12.073114395141602, "global_step": 332387, "epoch": 1978} {"train_loss": -12.145374298095703, "global_step": 332388, "epoch": 1978} {"train_loss": -12.244271278381348, "global_step": 332389, "epoch": 1978} {"train_loss": -12.578754425048828, "global_step": 332390, "epoch": 1978} {"train_loss": -12.522154808044434, "global_step": 332391, "epoch": 1978} {"train_loss": -12.051572799682617, "global_step": 332392, "epoch": 1978} {"train_loss": -11.000758171081543, "global_step": 332393, "epoch": 1978} {"train_loss": -11.796548843383789, "global_step": 332394, "epoch": 1978} {"train_loss": -12.171998977661133, "global_step": 332395, "epoch": 1978} {"train_loss": -12.274150848388672, "global_step": 332396, "epoch": 1978} {"train_loss": -12.076396942138672, "global_step": 332397, "epoch": 1978} {"train_loss": -12.221037864685059, "global_step": 332398, "epoch": 1978} {"train_loss": -12.12182331085205, "global_step": 332399, "epoch": 1978} {"train_loss": -11.905839920043945, "global_step": 332400, "epoch": 1978} {"train_loss": -12.088874816894531, "global_step": 332401, "epoch": 1978} {"train_loss": -12.091508865356445, "global_step": 332402, "epoch": 1978} {"train_loss": -12.012386322021484, "global_step": 332403, "epoch": 1978} {"train_loss": -12.303990364074707, "global_step": 332404, "epoch": 1978} {"train_loss": -11.319377899169922, "global_step": 332405, "epoch": 1978} {"train_loss": -10.487926483154297, "global_step": 332406, "epoch": 1978} {"train_loss": -11.307661056518555, "global_step": 332407, "epoch": 1978} {"train_loss": -12.051187515258789, "global_step": 332408, "epoch": 1978} {"train_loss": -10.508464813232422, "global_step": 332409, "epoch": 1978} {"train_loss": -12.079246520996094, "global_step": 332410, "epoch": 1978} {"train_loss": -10.971193313598633, "global_step": 332411, "epoch": 1978} {"train_loss": -12.310957908630371, "global_step": 332412, "epoch": 1978} {"train_loss": -11.621809005737305, "global_step": 332413, "epoch": 1978} {"train_loss": -11.66663932800293, "global_step": 332414, "epoch": 1978} {"train_loss": -11.375266075134277, "global_step": 332415, "epoch": 1978} {"train_loss": -11.77305793762207, "global_step": 332416, "epoch": 1978} {"train_loss": -11.836738586425781, "global_step": 332417, "epoch": 1978} {"train_loss": -10.917784690856934, "global_step": 332418, "epoch": 1978} {"train_loss": -11.286245346069336, "global_step": 332419, "epoch": 1978} {"train_loss": -11.41667366027832, "global_step": 332420, "epoch": 1978} {"train_loss": -12.043266296386719, "global_step": 332421, "epoch": 1978} {"train_loss": -11.296852111816406, "global_step": 332422, "epoch": 1978} {"train_loss": -12.101367950439453, "global_step": 332423, "epoch": 1978} {"train_loss": -11.120903015136719, "global_step": 332424, "epoch": 1978} {"train_loss": -11.727374076843262, "global_step": 332425, "epoch": 1978} {"train_loss": -11.982706069946289, "global_step": 332426, "epoch": 1978} {"train_loss": -11.529991149902344, "global_step": 332427, "epoch": 1978} {"train_loss": -12.008989334106445, "global_step": 332428, "epoch": 1978} {"train_loss": -11.663631439208984, "global_step": 332429, "epoch": 1978} {"train_loss": -11.244969367980957, "global_step": 332430, "epoch": 1978} {"train_loss": -11.98678207397461, "global_step": 332431, "epoch": 1978} {"train_loss": -11.453261375427246, "global_step": 332432, "epoch": 1978} {"train_loss": -12.115886688232422, "global_step": 332433, "epoch": 1978} {"train_loss": -11.636302947998047, "global_step": 332434, "epoch": 1978} {"train_loss": -11.133752822875977, "global_step": 332435, "epoch": 1978} {"train_loss": -11.64362621307373, "global_step": 332436, "epoch": 1978} {"train_loss": -10.435968399047852, "global_step": 332437, "epoch": 1978} {"train_loss": -12.282617568969727, "global_step": 332438, "epoch": 1978} {"train_loss": -11.107545852661133, "global_step": 332439, "epoch": 1978} {"train_loss": -11.901488304138184, "global_step": 332440, "epoch": 1978} {"train_loss": -10.771333694458008, "global_step": 332441, "epoch": 1978} {"train_loss": -10.934884071350098, "global_step": 332442, "epoch": 1978} {"train_loss": -10.963213920593262, "global_step": 332443, "epoch": 1978} {"train_loss": -10.89173412322998, "global_step": 332444, "epoch": 1978} {"train_loss": -11.742713928222656, "global_step": 332445, "epoch": 1978} {"train_loss": -10.544168472290039, "global_step": 332446, "epoch": 1978} {"train_loss": -11.307708740234375, "global_step": 332447, "epoch": 1978} {"train_loss": -10.227272033691406, "global_step": 332448, "epoch": 1978} {"train_loss": -10.60085678100586, "global_step": 332449, "epoch": 1978} {"train_loss": -9.400233268737793, "global_step": 332450, "epoch": 1978} {"train_loss": -9.871981620788574, "global_step": 332451, "epoch": 1978} {"train_loss": -10.478658676147461, "global_step": 332452, "epoch": 1978} {"train_loss": -10.934728622436523, "global_step": 332453, "epoch": 1978} {"train_loss": -10.786993026733398, "global_step": 332454, "epoch": 1978} {"train_loss": -11.657942771911621, "global_step": 332455, "epoch": 1978} {"train_loss": -10.697430610656738, "global_step": 332456, "epoch": 1978} {"train_loss": -10.255446434020996, "global_step": 332457, "epoch": 1978} {"train_loss": -11.196905136108398, "global_step": 332458, "epoch": 1978} {"train_loss": -10.464177131652832, "global_step": 332459, "epoch": 1978} {"train_loss": -11.963970184326172, "global_step": 332460, "epoch": 1978} {"train_loss": -10.82986068725586, "global_step": 332461, "epoch": 1978} {"train_loss": -11.156006813049316, "global_step": 332462, "epoch": 1978} {"train_loss": -11.519145965576172, "global_step": 332463, "epoch": 1978} {"train_loss": -11.500919342041016, "global_step": 332464, "epoch": 1978} {"train_loss": -11.709607124328613, "global_step": 332465, "epoch": 1978} {"train_loss": -11.82050895690918, "global_step": 332466, "epoch": 1978} {"train_loss": -11.482006072998047, "global_step": 332467, "epoch": 1978} {"train_loss": -11.758604049682617, "global_step": 332468, "epoch": 1978} {"train_loss": -11.702434539794922, "global_step": 332469, "epoch": 1978} {"train_loss": -12.016961097717285, "global_step": 332470, "epoch": 1978} {"train_loss": -11.87009122258141, "global_step": 332471, "epoch": 1978, "val_loss": 288518.375} {"train_loss": -12.016477584838867, "global_step": 332472, "epoch": 1979} {"train_loss": -11.923384666442871, "global_step": 332473, "epoch": 1979} {"train_loss": -11.77391529083252, "global_step": 332474, "epoch": 1979} {"train_loss": -11.755273818969727, "global_step": 332475, "epoch": 1979} {"train_loss": -11.843334197998047, "global_step": 332476, "epoch": 1979} {"train_loss": -11.718244552612305, "global_step": 332477, "epoch": 1979} {"train_loss": -12.048467636108398, "global_step": 332478, "epoch": 1979} {"train_loss": -11.742932319641113, "global_step": 332479, "epoch": 1979} {"train_loss": -12.049412727355957, "global_step": 332480, "epoch": 1979} {"train_loss": -12.22202205657959, "global_step": 332481, "epoch": 1979} {"train_loss": -12.192428588867188, "global_step": 332482, "epoch": 1979} {"train_loss": -12.055697441101074, "global_step": 332483, "epoch": 1979} {"train_loss": -12.265467643737793, "global_step": 332484, "epoch": 1979} {"train_loss": -12.14688777923584, "global_step": 332485, "epoch": 1979} {"train_loss": -12.252819061279297, "global_step": 332486, "epoch": 1979} {"train_loss": -12.239809036254883, "global_step": 332487, "epoch": 1979} {"train_loss": -12.004561424255371, "global_step": 332488, "epoch": 1979} {"train_loss": -12.343494415283203, "global_step": 332489, "epoch": 1979} {"train_loss": -12.187358856201172, "global_step": 332490, "epoch": 1979} {"train_loss": -12.286019325256348, "global_step": 332491, "epoch": 1979} {"train_loss": -11.977580070495605, "global_step": 332492, "epoch": 1979} {"train_loss": -12.426124572753906, "global_step": 332493, "epoch": 1979} {"train_loss": -12.287851333618164, "global_step": 332494, "epoch": 1979} {"train_loss": -12.325069427490234, "global_step": 332495, "epoch": 1979} {"train_loss": -12.349943161010742, "global_step": 332496, "epoch": 1979} {"train_loss": -12.334657669067383, "global_step": 332497, "epoch": 1979} {"train_loss": -12.300878524780273, "global_step": 332498, "epoch": 1979} {"train_loss": -12.280559539794922, "global_step": 332499, "epoch": 1979} {"train_loss": -12.16380500793457, "global_step": 332500, "epoch": 1979} {"train_loss": -12.332066535949707, "global_step": 332501, "epoch": 1979} {"train_loss": -12.272819519042969, "global_step": 332502, "epoch": 1979} {"train_loss": -12.006475448608398, "global_step": 332503, "epoch": 1979} {"train_loss": -12.282154083251953, "global_step": 332504, "epoch": 1979} {"train_loss": -12.273157119750977, "global_step": 332505, "epoch": 1979} {"train_loss": -12.454292297363281, "global_step": 332506, "epoch": 1979} {"train_loss": -12.205971717834473, "global_step": 332507, "epoch": 1979} {"train_loss": -12.445340156555176, "global_step": 332508, "epoch": 1979} {"train_loss": -12.395939826965332, "global_step": 332509, "epoch": 1979} {"train_loss": -12.34136962890625, "global_step": 332510, "epoch": 1979} {"train_loss": -12.342931747436523, "global_step": 332511, "epoch": 1979} {"train_loss": -12.555668830871582, "global_step": 332512, "epoch": 1979} {"train_loss": -12.48056411743164, "global_step": 332513, "epoch": 1979} {"train_loss": -12.530838012695312, "global_step": 332514, "epoch": 1979} {"train_loss": -12.538778305053711, "global_step": 332515, "epoch": 1979} {"train_loss": -12.362373352050781, "global_step": 332516, "epoch": 1979} {"train_loss": -12.283658981323242, "global_step": 332517, "epoch": 1979} {"train_loss": -12.290194511413574, "global_step": 332518, "epoch": 1979} {"train_loss": -12.41925048828125, "global_step": 332519, "epoch": 1979} {"train_loss": -12.367050170898438, "global_step": 332520, "epoch": 1979} {"train_loss": -12.261445999145508, "global_step": 332521, "epoch": 1979} {"train_loss": -12.402199745178223, "global_step": 332522, "epoch": 1979} {"train_loss": -12.45236587524414, "global_step": 332523, "epoch": 1979} {"train_loss": -12.539716720581055, "global_step": 332524, "epoch": 1979} {"train_loss": -12.680461883544922, "global_step": 332525, "epoch": 1979} {"train_loss": -12.636190414428711, "global_step": 332526, "epoch": 1979} {"train_loss": -12.593545913696289, "global_step": 332527, "epoch": 1979} {"train_loss": -12.576040267944336, "global_step": 332528, "epoch": 1979} {"train_loss": -12.610673904418945, "global_step": 332529, "epoch": 1979} {"train_loss": -12.63332748413086, "global_step": 332530, "epoch": 1979} {"train_loss": -12.460003852844238, "global_step": 332531, "epoch": 1979} {"train_loss": -12.57044506072998, "global_step": 332532, "epoch": 1979} {"train_loss": -12.515443801879883, "global_step": 332533, "epoch": 1979} {"train_loss": -12.504528045654297, "global_step": 332534, "epoch": 1979} {"train_loss": -12.459394454956055, "global_step": 332535, "epoch": 1979} {"train_loss": -12.685911178588867, "global_step": 332536, "epoch": 1979} {"train_loss": -12.474997520446777, "global_step": 332537, "epoch": 1979} {"train_loss": -12.326641082763672, "global_step": 332538, "epoch": 1979} {"train_loss": -12.503835678100586, "global_step": 332539, "epoch": 1979} {"train_loss": -12.618304252624512, "global_step": 332540, "epoch": 1979} {"train_loss": -12.548331260681152, "global_step": 332541, "epoch": 1979} {"train_loss": -12.765974044799805, "global_step": 332542, "epoch": 1979} {"train_loss": -12.481590270996094, "global_step": 332543, "epoch": 1979} {"train_loss": -12.634113311767578, "global_step": 332544, "epoch": 1979} {"train_loss": -12.52876091003418, "global_step": 332545, "epoch": 1979} {"train_loss": -12.45040512084961, "global_step": 332546, "epoch": 1979} {"train_loss": -12.531501770019531, "global_step": 332547, "epoch": 1979} {"train_loss": -12.302569389343262, "global_step": 332548, "epoch": 1979} {"train_loss": -12.049551010131836, "global_step": 332549, "epoch": 1979} {"train_loss": -12.453827857971191, "global_step": 332550, "epoch": 1979} {"train_loss": -12.670869827270508, "global_step": 332551, "epoch": 1979} {"train_loss": -12.273971557617188, "global_step": 332552, "epoch": 1979} {"train_loss": -12.24954891204834, "global_step": 332553, "epoch": 1979} {"train_loss": -11.041528701782227, "global_step": 332554, "epoch": 1979} {"train_loss": -10.370393753051758, "global_step": 332555, "epoch": 1979} {"train_loss": -11.57368278503418, "global_step": 332556, "epoch": 1979} {"train_loss": -11.958316802978516, "global_step": 332557, "epoch": 1979} {"train_loss": -11.024040222167969, "global_step": 332558, "epoch": 1979} {"train_loss": -11.928053855895996, "global_step": 332559, "epoch": 1979} {"train_loss": -9.807207107543945, "global_step": 332560, "epoch": 1979} {"train_loss": -11.717595100402832, "global_step": 332561, "epoch": 1979} {"train_loss": -11.101879119873047, "global_step": 332562, "epoch": 1979} {"train_loss": -11.091626167297363, "global_step": 332563, "epoch": 1979} {"train_loss": -10.67650032043457, "global_step": 332564, "epoch": 1979} {"train_loss": -11.267667770385742, "global_step": 332565, "epoch": 1979} {"train_loss": -11.636598587036133, "global_step": 332566, "epoch": 1979} {"train_loss": -10.22381591796875, "global_step": 332567, "epoch": 1979} {"train_loss": -10.917476654052734, "global_step": 332568, "epoch": 1979} {"train_loss": -10.609405517578125, "global_step": 332569, "epoch": 1979} {"train_loss": -11.555839538574219, "global_step": 332570, "epoch": 1979} {"train_loss": -11.596632957458496, "global_step": 332571, "epoch": 1979} {"train_loss": -11.70015811920166, "global_step": 332572, "epoch": 1979} {"train_loss": -11.44015884399414, "global_step": 332573, "epoch": 1979} {"train_loss": -10.313067436218262, "global_step": 332574, "epoch": 1979} {"train_loss": -10.038528442382812, "global_step": 332575, "epoch": 1979} {"train_loss": -11.174774169921875, "global_step": 332576, "epoch": 1979} {"train_loss": -9.278594970703125, "global_step": 332577, "epoch": 1979} {"train_loss": -9.172386169433594, "global_step": 332578, "epoch": 1979} {"train_loss": -10.092527389526367, "global_step": 332579, "epoch": 1979} {"train_loss": -9.06048583984375, "global_step": 332580, "epoch": 1979} {"train_loss": -10.073920249938965, "global_step": 332581, "epoch": 1979} {"train_loss": -10.046573638916016, "global_step": 332582, "epoch": 1979} {"train_loss": -9.13222885131836, "global_step": 332583, "epoch": 1979} {"train_loss": -8.311334609985352, "global_step": 332584, "epoch": 1979} {"train_loss": -8.81618881225586, "global_step": 332585, "epoch": 1979} {"train_loss": -9.257599830627441, "global_step": 332586, "epoch": 1979} {"train_loss": -9.252391815185547, "global_step": 332587, "epoch": 1979} {"train_loss": -10.047760009765625, "global_step": 332588, "epoch": 1979} {"train_loss": -9.985260009765625, "global_step": 332589, "epoch": 1979} {"train_loss": -9.72097396850586, "global_step": 332590, "epoch": 1979} {"train_loss": -11.249439239501953, "global_step": 332591, "epoch": 1979} {"train_loss": -10.261190414428711, "global_step": 332592, "epoch": 1979} {"train_loss": -11.447707176208496, "global_step": 332593, "epoch": 1979} {"train_loss": -10.92377758026123, "global_step": 332594, "epoch": 1979} {"train_loss": -11.150323867797852, "global_step": 332595, "epoch": 1979} {"train_loss": -10.975236892700195, "global_step": 332596, "epoch": 1979} {"train_loss": -11.413543701171875, "global_step": 332597, "epoch": 1979} {"train_loss": -10.603694915771484, "global_step": 332598, "epoch": 1979} {"train_loss": -11.570348739624023, "global_step": 332599, "epoch": 1979} {"train_loss": -10.5845947265625, "global_step": 332600, "epoch": 1979} {"train_loss": -11.502382278442383, "global_step": 332601, "epoch": 1979} {"train_loss": -11.265581130981445, "global_step": 332602, "epoch": 1979} {"train_loss": -10.588258743286133, "global_step": 332603, "epoch": 1979} {"train_loss": -11.532524108886719, "global_step": 332604, "epoch": 1979} {"train_loss": -10.992106437683105, "global_step": 332605, "epoch": 1979} {"train_loss": -11.339523315429688, "global_step": 332606, "epoch": 1979} {"train_loss": -11.274148941040039, "global_step": 332607, "epoch": 1979} {"train_loss": -11.546338081359863, "global_step": 332608, "epoch": 1979} {"train_loss": -11.149106979370117, "global_step": 332609, "epoch": 1979} {"train_loss": -11.720666885375977, "global_step": 332610, "epoch": 1979} {"train_loss": -11.084458351135254, "global_step": 332611, "epoch": 1979} {"train_loss": -11.603340148925781, "global_step": 332612, "epoch": 1979} {"train_loss": -11.406951904296875, "global_step": 332613, "epoch": 1979} {"train_loss": -11.942340850830078, "global_step": 332614, "epoch": 1979} {"train_loss": -12.034180641174316, "global_step": 332615, "epoch": 1979} {"train_loss": -11.738628387451172, "global_step": 332616, "epoch": 1979} {"train_loss": -11.756829261779785, "global_step": 332617, "epoch": 1979} {"train_loss": -12.004753112792969, "global_step": 332618, "epoch": 1979} {"train_loss": -11.571621894836426, "global_step": 332619, "epoch": 1979} {"train_loss": -12.051061630249023, "global_step": 332620, "epoch": 1979} {"train_loss": -11.822092056274414, "global_step": 332621, "epoch": 1979} {"train_loss": -11.844442367553711, "global_step": 332622, "epoch": 1979} {"train_loss": -11.985727310180664, "global_step": 332623, "epoch": 1979} {"train_loss": -11.84295654296875, "global_step": 332624, "epoch": 1979} {"train_loss": -11.886920928955078, "global_step": 332625, "epoch": 1979} {"train_loss": -12.31167984008789, "global_step": 332626, "epoch": 1979} {"train_loss": -11.884227752685547, "global_step": 332627, "epoch": 1979} {"train_loss": -12.019769668579102, "global_step": 332628, "epoch": 1979} {"train_loss": -11.907144546508789, "global_step": 332629, "epoch": 1979} {"train_loss": -12.155749320983887, "global_step": 332630, "epoch": 1979} {"train_loss": -12.070247650146484, "global_step": 332631, "epoch": 1979} {"train_loss": -12.028837203979492, "global_step": 332632, "epoch": 1979} {"train_loss": -11.954938888549805, "global_step": 332633, "epoch": 1979} {"train_loss": -12.232351303100586, "global_step": 332634, "epoch": 1979} {"train_loss": -12.08552360534668, "global_step": 332635, "epoch": 1979} {"train_loss": -12.158103942871094, "global_step": 332636, "epoch": 1979} {"train_loss": -12.020069122314453, "global_step": 332637, "epoch": 1979} {"train_loss": -12.071683883666992, "global_step": 332638, "epoch": 1979} {"train_loss": -11.707676336878823, "global_step": 332639, "epoch": 1979, "val_loss": 282459.9375} {"train_loss": -12.216205596923828, "global_step": 332640, "epoch": 1980} {"train_loss": -11.868778228759766, "global_step": 332641, "epoch": 1980} {"train_loss": -12.136825561523438, "global_step": 332642, "epoch": 1980} {"train_loss": -11.83295726776123, "global_step": 332643, "epoch": 1980} {"train_loss": -12.307182312011719, "global_step": 332644, "epoch": 1980} {"train_loss": -12.119877815246582, "global_step": 332645, "epoch": 1980} {"train_loss": -12.395548820495605, "global_step": 332646, "epoch": 1980} {"train_loss": -12.126167297363281, "global_step": 332647, "epoch": 1980} {"train_loss": -12.285062789916992, "global_step": 332648, "epoch": 1980} {"train_loss": -12.189785957336426, "global_step": 332649, "epoch": 1980} {"train_loss": -12.320655822753906, "global_step": 332650, "epoch": 1980} {"train_loss": -12.372994422912598, "global_step": 332651, "epoch": 1980} {"train_loss": -12.377838134765625, "global_step": 332652, "epoch": 1980} {"train_loss": -12.51594352722168, "global_step": 332653, "epoch": 1980} {"train_loss": -12.463813781738281, "global_step": 332654, "epoch": 1980} {"train_loss": -12.460315704345703, "global_step": 332655, "epoch": 1980} {"train_loss": -12.305903434753418, "global_step": 332656, "epoch": 1980} {"train_loss": -12.539700508117676, "global_step": 332657, "epoch": 1980} {"train_loss": -12.208968162536621, "global_step": 332658, "epoch": 1980} {"train_loss": -12.292118072509766, "global_step": 332659, "epoch": 1980} {"train_loss": -12.266979217529297, "global_step": 332660, "epoch": 1980} {"train_loss": -12.469278335571289, "global_step": 332661, "epoch": 1980} {"train_loss": -12.197556495666504, "global_step": 332662, "epoch": 1980} {"train_loss": -12.387628555297852, "global_step": 332663, "epoch": 1980} {"train_loss": -12.195843696594238, "global_step": 332664, "epoch": 1980} {"train_loss": -12.268438339233398, "global_step": 332665, "epoch": 1980} {"train_loss": -12.488463401794434, "global_step": 332666, "epoch": 1980} {"train_loss": -12.352754592895508, "global_step": 332667, "epoch": 1980} {"train_loss": -12.502479553222656, "global_step": 332668, "epoch": 1980} {"train_loss": -12.320082664489746, "global_step": 332669, "epoch": 1980} {"train_loss": -12.250589370727539, "global_step": 332670, "epoch": 1980} {"train_loss": -12.379815101623535, "global_step": 332671, "epoch": 1980} {"train_loss": -12.515920639038086, "global_step": 332672, "epoch": 1980} {"train_loss": -12.566521644592285, "global_step": 332673, "epoch": 1980} {"train_loss": -12.477070808410645, "global_step": 332674, "epoch": 1980} {"train_loss": -12.43535041809082, "global_step": 332675, "epoch": 1980} {"train_loss": -12.457139015197754, "global_step": 332676, "epoch": 1980} {"train_loss": -12.561698913574219, "global_step": 332677, "epoch": 1980} {"train_loss": -12.391157150268555, "global_step": 332678, "epoch": 1980} {"train_loss": -12.7428617477417, "global_step": 332679, "epoch": 1980} {"train_loss": -12.558749198913574, "global_step": 332680, "epoch": 1980} {"train_loss": -12.424474716186523, "global_step": 332681, "epoch": 1980} {"train_loss": -12.728963851928711, "global_step": 332682, "epoch": 1980} {"train_loss": -12.446243286132812, "global_step": 332683, "epoch": 1980} {"train_loss": -12.475049018859863, "global_step": 332684, "epoch": 1980} {"train_loss": -12.591625213623047, "global_step": 332685, "epoch": 1980} {"train_loss": -12.639705657958984, "global_step": 332686, "epoch": 1980} {"train_loss": -11.910494804382324, "global_step": 332687, "epoch": 1980} {"train_loss": -12.20893669128418, "global_step": 332688, "epoch": 1980} {"train_loss": -12.590188980102539, "global_step": 332689, "epoch": 1980} {"train_loss": -11.775932312011719, "global_step": 332690, "epoch": 1980} {"train_loss": -11.883381843566895, "global_step": 332691, "epoch": 1980} {"train_loss": -12.369855880737305, "global_step": 332692, "epoch": 1980} {"train_loss": -12.339292526245117, "global_step": 332693, "epoch": 1980} {"train_loss": -12.459463119506836, "global_step": 332694, "epoch": 1980} {"train_loss": -11.917438507080078, "global_step": 332695, "epoch": 1980} {"train_loss": -12.460981369018555, "global_step": 332696, "epoch": 1980} {"train_loss": -12.291046142578125, "global_step": 332697, "epoch": 1980} {"train_loss": -12.331521034240723, "global_step": 332698, "epoch": 1980} {"train_loss": -12.409282684326172, "global_step": 332699, "epoch": 1980} {"train_loss": -12.154376983642578, "global_step": 332700, "epoch": 1980} {"train_loss": -12.497844696044922, "global_step": 332701, "epoch": 1980} {"train_loss": -12.394152641296387, "global_step": 332702, "epoch": 1980} {"train_loss": -12.34531307220459, "global_step": 332703, "epoch": 1980} {"train_loss": -12.359768867492676, "global_step": 332704, "epoch": 1980} {"train_loss": -12.513710975646973, "global_step": 332705, "epoch": 1980} {"train_loss": -12.282325744628906, "global_step": 332706, "epoch": 1980} {"train_loss": -12.301475524902344, "global_step": 332707, "epoch": 1980} {"train_loss": -12.31324577331543, "global_step": 332708, "epoch": 1980} {"train_loss": -12.184739112854004, "global_step": 332709, "epoch": 1980} {"train_loss": -11.805915832519531, "global_step": 332710, "epoch": 1980} {"train_loss": -11.917791366577148, "global_step": 332711, "epoch": 1980} {"train_loss": -11.8998441696167, "global_step": 332712, "epoch": 1980} {"train_loss": -12.103804588317871, "global_step": 332713, "epoch": 1980} {"train_loss": -11.357765197753906, "global_step": 332714, "epoch": 1980} {"train_loss": -12.207548141479492, "global_step": 332715, "epoch": 1980} {"train_loss": -10.387716293334961, "global_step": 332716, "epoch": 1980} {"train_loss": -10.296676635742188, "global_step": 332717, "epoch": 1980} {"train_loss": -10.39951229095459, "global_step": 332718, "epoch": 1980} {"train_loss": -12.023300170898438, "global_step": 332719, "epoch": 1980} {"train_loss": -9.263659477233887, "global_step": 332720, "epoch": 1980} {"train_loss": -10.580483436584473, "global_step": 332721, "epoch": 1980} {"train_loss": -8.450132369995117, "global_step": 332722, "epoch": 1980} {"train_loss": -8.15304946899414, "global_step": 332723, "epoch": 1980} {"train_loss": -8.447517395019531, "global_step": 332724, "epoch": 1980} {"train_loss": -8.284492492675781, "global_step": 332725, "epoch": 1980} {"train_loss": -10.294136047363281, "global_step": 332726, "epoch": 1980} {"train_loss": -9.325246810913086, "global_step": 332727, "epoch": 1980} {"train_loss": -9.293755531311035, "global_step": 332728, "epoch": 1980} {"train_loss": -8.312606811523438, "global_step": 332729, "epoch": 1980} {"train_loss": -8.02639389038086, "global_step": 332730, "epoch": 1980} {"train_loss": -7.984346389770508, "global_step": 332731, "epoch": 1980} {"train_loss": -8.101179122924805, "global_step": 332732, "epoch": 1980} {"train_loss": -8.44803237915039, "global_step": 332733, "epoch": 1980} {"train_loss": -9.03201961517334, "global_step": 332734, "epoch": 1980} {"train_loss": -9.177300453186035, "global_step": 332735, "epoch": 1980} {"train_loss": -9.962242126464844, "global_step": 332736, "epoch": 1980} {"train_loss": -9.81506633758545, "global_step": 332737, "epoch": 1980} {"train_loss": -10.577219009399414, "global_step": 332738, "epoch": 1980} {"train_loss": -10.319608688354492, "global_step": 332739, "epoch": 1980} {"train_loss": -11.032308578491211, "global_step": 332740, "epoch": 1980} {"train_loss": -10.767253875732422, "global_step": 332741, "epoch": 1980} {"train_loss": -10.994929313659668, "global_step": 332742, "epoch": 1980} {"train_loss": -11.204931259155273, "global_step": 332743, "epoch": 1980} {"train_loss": -11.136800765991211, "global_step": 332744, "epoch": 1980} {"train_loss": -11.013387680053711, "global_step": 332745, "epoch": 1980} {"train_loss": -11.281877517700195, "global_step": 332746, "epoch": 1980} {"train_loss": -11.503030776977539, "global_step": 332747, "epoch": 1980} {"train_loss": -11.779786109924316, "global_step": 332748, "epoch": 1980} {"train_loss": -11.773136138916016, "global_step": 332749, "epoch": 1980} {"train_loss": -11.80828857421875, "global_step": 332750, "epoch": 1980} {"train_loss": -11.843221664428711, "global_step": 332751, "epoch": 1980} {"train_loss": -11.96058464050293, "global_step": 332752, "epoch": 1980} {"train_loss": -11.911600112915039, "global_step": 332753, "epoch": 1980} {"train_loss": -12.06362533569336, "global_step": 332754, "epoch": 1980} {"train_loss": -12.04049301147461, "global_step": 332755, "epoch": 1980} {"train_loss": -12.024154663085938, "global_step": 332756, "epoch": 1980} {"train_loss": -11.978270530700684, "global_step": 332757, "epoch": 1980} {"train_loss": -12.129992485046387, "global_step": 332758, "epoch": 1980} {"train_loss": -11.926849365234375, "global_step": 332759, "epoch": 1980} {"train_loss": -11.905773162841797, "global_step": 332760, "epoch": 1980} {"train_loss": -11.803875923156738, "global_step": 332761, "epoch": 1980} {"train_loss": -12.02984619140625, "global_step": 332762, "epoch": 1980} {"train_loss": -12.095359802246094, "global_step": 332763, "epoch": 1980} {"train_loss": -12.341758728027344, "global_step": 332764, "epoch": 1980} {"train_loss": -11.829803466796875, "global_step": 332765, "epoch": 1980} {"train_loss": -12.104755401611328, "global_step": 332766, "epoch": 1980} {"train_loss": -11.969407081604004, "global_step": 332767, "epoch": 1980} {"train_loss": -12.015949249267578, "global_step": 332768, "epoch": 1980} {"train_loss": -12.162172317504883, "global_step": 332769, "epoch": 1980} {"train_loss": -12.20568561553955, "global_step": 332770, "epoch": 1980} {"train_loss": -12.07369613647461, "global_step": 332771, "epoch": 1980} {"train_loss": -12.067245483398438, "global_step": 332772, "epoch": 1980} {"train_loss": -12.169427871704102, "global_step": 332773, "epoch": 1980} {"train_loss": -12.351638793945312, "global_step": 332774, "epoch": 1980} {"train_loss": -12.286888122558594, "global_step": 332775, "epoch": 1980} {"train_loss": -12.180704116821289, "global_step": 332776, "epoch": 1980} {"train_loss": -12.126091003417969, "global_step": 332777, "epoch": 1980} {"train_loss": -12.290397644042969, "global_step": 332778, "epoch": 1980} {"train_loss": -12.405452728271484, "global_step": 332779, "epoch": 1980} {"train_loss": -12.199224472045898, "global_step": 332780, "epoch": 1980} {"train_loss": -12.088578224182129, "global_step": 332781, "epoch": 1980} {"train_loss": -12.274478912353516, "global_step": 332782, "epoch": 1980} {"train_loss": -12.404779434204102, "global_step": 332783, "epoch": 1980} {"train_loss": -12.131291389465332, "global_step": 332784, "epoch": 1980} {"train_loss": -12.279114723205566, "global_step": 332785, "epoch": 1980} {"train_loss": -12.33862018585205, "global_step": 332786, "epoch": 1980} {"train_loss": -12.354900360107422, "global_step": 332787, "epoch": 1980} {"train_loss": -12.090374946594238, "global_step": 332788, "epoch": 1980} {"train_loss": -12.360607147216797, "global_step": 332789, "epoch": 1980} {"train_loss": -12.095715522766113, "global_step": 332790, "epoch": 1980} {"train_loss": -12.429920196533203, "global_step": 332791, "epoch": 1980} {"train_loss": -12.29228401184082, "global_step": 332792, "epoch": 1980} {"train_loss": -12.325572967529297, "global_step": 332793, "epoch": 1980} {"train_loss": -12.384787559509277, "global_step": 332794, "epoch": 1980} {"train_loss": -12.531615257263184, "global_step": 332795, "epoch": 1980} {"train_loss": -12.25950813293457, "global_step": 332796, "epoch": 1980} {"train_loss": -12.324472427368164, "global_step": 332797, "epoch": 1980} {"train_loss": -12.380926132202148, "global_step": 332798, "epoch": 1980} {"train_loss": -12.137887954711914, "global_step": 332799, "epoch": 1980} {"train_loss": -12.199178695678711, "global_step": 332800, "epoch": 1980} {"train_loss": -12.374201774597168, "global_step": 332801, "epoch": 1980} {"train_loss": -11.812582015991211, "global_step": 332802, "epoch": 1980} {"train_loss": -12.069988250732422, "global_step": 332803, "epoch": 1980} {"train_loss": -12.19028377532959, "global_step": 332804, "epoch": 1980} {"train_loss": -11.593388557434082, "global_step": 332805, "epoch": 1980} {"train_loss": -11.34157657623291, "global_step": 332806, "epoch": 1980} {"train_loss": -11.763290518806095, "global_step": 332807, "epoch": 1980, "val_loss": 285549.1875, "train_action_mse_error": 2.1976096630096436} {"train_loss": -12.054448127746582, "global_step": 332808, "epoch": 1981} {"train_loss": -12.099013328552246, "global_step": 332809, "epoch": 1981} {"train_loss": -12.302833557128906, "global_step": 332810, "epoch": 1981} {"train_loss": -12.451557159423828, "global_step": 332811, "epoch": 1981} {"train_loss": -12.086796760559082, "global_step": 332812, "epoch": 1981} {"train_loss": -12.314918518066406, "global_step": 332813, "epoch": 1981} {"train_loss": -12.000907897949219, "global_step": 332814, "epoch": 1981} {"train_loss": -12.008602142333984, "global_step": 332815, "epoch": 1981} {"train_loss": -12.207240104675293, "global_step": 332816, "epoch": 1981} {"train_loss": -11.609021186828613, "global_step": 332817, "epoch": 1981} {"train_loss": -11.852951049804688, "global_step": 332818, "epoch": 1981} {"train_loss": -10.814546585083008, "global_step": 332819, "epoch": 1981} {"train_loss": -10.440130233764648, "global_step": 332820, "epoch": 1981} {"train_loss": -11.69979190826416, "global_step": 332821, "epoch": 1981} {"train_loss": -11.376785278320312, "global_step": 332822, "epoch": 1981} {"train_loss": -11.389095306396484, "global_step": 332823, "epoch": 1981} {"train_loss": -11.91648006439209, "global_step": 332824, "epoch": 1981} {"train_loss": -11.364876747131348, "global_step": 332825, "epoch": 1981} {"train_loss": -12.016151428222656, "global_step": 332826, "epoch": 1981} {"train_loss": -11.073382377624512, "global_step": 332827, "epoch": 1981} {"train_loss": -11.659087181091309, "global_step": 332828, "epoch": 1981} {"train_loss": -11.429193496704102, "global_step": 332829, "epoch": 1981} {"train_loss": -11.59992790222168, "global_step": 332830, "epoch": 1981} {"train_loss": -11.598204612731934, "global_step": 332831, "epoch": 1981} {"train_loss": -11.935365676879883, "global_step": 332832, "epoch": 1981} {"train_loss": -11.830217361450195, "global_step": 332833, "epoch": 1981} {"train_loss": -12.040943145751953, "global_step": 332834, "epoch": 1981} {"train_loss": -11.658832550048828, "global_step": 332835, "epoch": 1981} {"train_loss": -12.085384368896484, "global_step": 332836, "epoch": 1981} {"train_loss": -12.087932586669922, "global_step": 332837, "epoch": 1981} {"train_loss": -11.924966812133789, "global_step": 332838, "epoch": 1981} {"train_loss": -11.534854888916016, "global_step": 332839, "epoch": 1981} {"train_loss": -12.250404357910156, "global_step": 332840, "epoch": 1981} {"train_loss": -11.899065017700195, "global_step": 332841, "epoch": 1981} {"train_loss": -11.929476737976074, "global_step": 332842, "epoch": 1981} {"train_loss": -12.12862777709961, "global_step": 332843, "epoch": 1981} {"train_loss": -11.79224681854248, "global_step": 332844, "epoch": 1981} {"train_loss": -11.989860534667969, "global_step": 332845, "epoch": 1981} {"train_loss": -12.031899452209473, "global_step": 332846, "epoch": 1981} {"train_loss": -11.479296684265137, "global_step": 332847, "epoch": 1981} {"train_loss": -11.705667495727539, "global_step": 332848, "epoch": 1981} {"train_loss": -11.691514015197754, "global_step": 332849, "epoch": 1981} {"train_loss": -11.848214149475098, "global_step": 332850, "epoch": 1981} {"train_loss": -11.186376571655273, "global_step": 332851, "epoch": 1981} {"train_loss": -11.804810523986816, "global_step": 332852, "epoch": 1981} {"train_loss": -11.209830284118652, "global_step": 332853, "epoch": 1981} {"train_loss": -12.06395149230957, "global_step": 332854, "epoch": 1981} {"train_loss": -11.5307035446167, "global_step": 332855, "epoch": 1981} {"train_loss": -12.025619506835938, "global_step": 332856, "epoch": 1981} {"train_loss": -12.03294563293457, "global_step": 332857, "epoch": 1981} {"train_loss": -11.537415504455566, "global_step": 332858, "epoch": 1981} {"train_loss": -12.27256965637207, "global_step": 332859, "epoch": 1981} {"train_loss": -11.743642807006836, "global_step": 332860, "epoch": 1981} {"train_loss": -12.172676086425781, "global_step": 332861, "epoch": 1981} {"train_loss": -11.963859558105469, "global_step": 332862, "epoch": 1981} {"train_loss": -11.986356735229492, "global_step": 332863, "epoch": 1981} {"train_loss": -12.369510650634766, "global_step": 332864, "epoch": 1981} {"train_loss": -12.133840560913086, "global_step": 332865, "epoch": 1981} {"train_loss": -11.864810943603516, "global_step": 332866, "epoch": 1981} {"train_loss": -11.865546226501465, "global_step": 332867, "epoch": 1981} {"train_loss": -11.961944580078125, "global_step": 332868, "epoch": 1981} {"train_loss": -11.730979919433594, "global_step": 332869, "epoch": 1981} {"train_loss": -11.784873962402344, "global_step": 332870, "epoch": 1981} {"train_loss": -11.7186279296875, "global_step": 332871, "epoch": 1981} {"train_loss": -12.175765991210938, "global_step": 332872, "epoch": 1981} {"train_loss": -11.764701843261719, "global_step": 332873, "epoch": 1981} {"train_loss": -11.527692794799805, "global_step": 332874, "epoch": 1981} {"train_loss": -12.175168991088867, "global_step": 332875, "epoch": 1981} {"train_loss": -11.538069725036621, "global_step": 332876, "epoch": 1981} {"train_loss": -11.903257369995117, "global_step": 332877, "epoch": 1981} {"train_loss": -12.173194885253906, "global_step": 332878, "epoch": 1981} {"train_loss": -11.789020538330078, "global_step": 332879, "epoch": 1981} {"train_loss": -12.327916145324707, "global_step": 332880, "epoch": 1981} {"train_loss": -11.798845291137695, "global_step": 332881, "epoch": 1981} {"train_loss": -12.492658615112305, "global_step": 332882, "epoch": 1981} {"train_loss": -12.144208908081055, "global_step": 332883, "epoch": 1981} {"train_loss": -11.814483642578125, "global_step": 332884, "epoch": 1981} {"train_loss": -12.318138122558594, "global_step": 332885, "epoch": 1981} {"train_loss": -11.945245742797852, "global_step": 332886, "epoch": 1981} {"train_loss": -11.829700469970703, "global_step": 332887, "epoch": 1981} {"train_loss": -12.328184127807617, "global_step": 332888, "epoch": 1981} {"train_loss": -11.882993698120117, "global_step": 332889, "epoch": 1981} {"train_loss": -12.305036544799805, "global_step": 332890, "epoch": 1981} {"train_loss": -12.301703453063965, "global_step": 332891, "epoch": 1981} {"train_loss": -12.119085311889648, "global_step": 332892, "epoch": 1981} {"train_loss": -12.262155532836914, "global_step": 332893, "epoch": 1981} {"train_loss": -12.085531234741211, "global_step": 332894, "epoch": 1981} {"train_loss": -12.219047546386719, "global_step": 332895, "epoch": 1981} {"train_loss": -12.243355751037598, "global_step": 332896, "epoch": 1981} {"train_loss": -12.032903671264648, "global_step": 332897, "epoch": 1981} {"train_loss": -12.077455520629883, "global_step": 332898, "epoch": 1981} {"train_loss": -12.071393966674805, "global_step": 332899, "epoch": 1981} {"train_loss": -12.140981674194336, "global_step": 332900, "epoch": 1981} {"train_loss": -11.964396476745605, "global_step": 332901, "epoch": 1981} {"train_loss": -12.367813110351562, "global_step": 332902, "epoch": 1981} {"train_loss": -11.707292556762695, "global_step": 332903, "epoch": 1981} {"train_loss": -12.136775016784668, "global_step": 332904, "epoch": 1981} {"train_loss": -12.039535522460938, "global_step": 332905, "epoch": 1981} {"train_loss": -12.09447956085205, "global_step": 332906, "epoch": 1981} {"train_loss": -11.367509841918945, "global_step": 332907, "epoch": 1981} {"train_loss": -12.246684074401855, "global_step": 332908, "epoch": 1981} {"train_loss": -12.049629211425781, "global_step": 332909, "epoch": 1981} {"train_loss": -11.744783401489258, "global_step": 332910, "epoch": 1981} {"train_loss": -12.200980186462402, "global_step": 332911, "epoch": 1981} {"train_loss": -12.493494987487793, "global_step": 332912, "epoch": 1981} {"train_loss": -12.403802871704102, "global_step": 332913, "epoch": 1981} {"train_loss": -12.108745574951172, "global_step": 332914, "epoch": 1981} {"train_loss": -12.251259803771973, "global_step": 332915, "epoch": 1981} {"train_loss": -12.376489639282227, "global_step": 332916, "epoch": 1981} {"train_loss": -12.283220291137695, "global_step": 332917, "epoch": 1981} {"train_loss": -12.492036819458008, "global_step": 332918, "epoch": 1981} {"train_loss": -11.862682342529297, "global_step": 332919, "epoch": 1981} {"train_loss": -12.372147560119629, "global_step": 332920, "epoch": 1981} {"train_loss": -11.788670539855957, "global_step": 332921, "epoch": 1981} {"train_loss": -11.910590171813965, "global_step": 332922, "epoch": 1981} {"train_loss": -12.199989318847656, "global_step": 332923, "epoch": 1981} {"train_loss": -11.940055847167969, "global_step": 332924, "epoch": 1981} {"train_loss": -10.989757537841797, "global_step": 332925, "epoch": 1981} {"train_loss": -12.03625202178955, "global_step": 332926, "epoch": 1981} {"train_loss": -11.691276550292969, "global_step": 332927, "epoch": 1981} {"train_loss": -11.121891021728516, "global_step": 332928, "epoch": 1981} {"train_loss": -12.219791412353516, "global_step": 332929, "epoch": 1981} {"train_loss": -11.07166862487793, "global_step": 332930, "epoch": 1981} {"train_loss": -12.61843490600586, "global_step": 332931, "epoch": 1981} {"train_loss": -11.136433601379395, "global_step": 332932, "epoch": 1981} {"train_loss": -11.509649276733398, "global_step": 332933, "epoch": 1981} {"train_loss": -11.950227737426758, "global_step": 332934, "epoch": 1981} {"train_loss": -10.514341354370117, "global_step": 332935, "epoch": 1981} {"train_loss": -12.283590316772461, "global_step": 332936, "epoch": 1981} {"train_loss": -9.799375534057617, "global_step": 332937, "epoch": 1981} {"train_loss": -10.434379577636719, "global_step": 332938, "epoch": 1981} {"train_loss": -9.938944816589355, "global_step": 332939, "epoch": 1981} {"train_loss": -10.329306602478027, "global_step": 332940, "epoch": 1981} {"train_loss": -9.267690658569336, "global_step": 332941, "epoch": 1981} {"train_loss": -10.702556610107422, "global_step": 332942, "epoch": 1981} {"train_loss": -10.279851913452148, "global_step": 332943, "epoch": 1981} {"train_loss": -11.221153259277344, "global_step": 332944, "epoch": 1981} {"train_loss": -10.366076469421387, "global_step": 332945, "epoch": 1981} {"train_loss": -11.112055778503418, "global_step": 332946, "epoch": 1981} {"train_loss": -11.705887794494629, "global_step": 332947, "epoch": 1981} {"train_loss": -11.418861389160156, "global_step": 332948, "epoch": 1981} {"train_loss": -11.32415771484375, "global_step": 332949, "epoch": 1981} {"train_loss": -12.03026008605957, "global_step": 332950, "epoch": 1981} {"train_loss": -11.27257251739502, "global_step": 332951, "epoch": 1981} {"train_loss": -11.850671768188477, "global_step": 332952, "epoch": 1981} {"train_loss": -11.679595947265625, "global_step": 332953, "epoch": 1981} {"train_loss": -11.430989265441895, "global_step": 332954, "epoch": 1981} {"train_loss": -11.576125144958496, "global_step": 332955, "epoch": 1981} {"train_loss": -11.123964309692383, "global_step": 332956, "epoch": 1981} {"train_loss": -11.247343063354492, "global_step": 332957, "epoch": 1981} {"train_loss": -11.342989921569824, "global_step": 332958, "epoch": 1981} {"train_loss": -9.908655166625977, "global_step": 332959, "epoch": 1981} {"train_loss": -11.629122734069824, "global_step": 332960, "epoch": 1981} {"train_loss": -9.563084602355957, "global_step": 332961, "epoch": 1981} {"train_loss": -10.331777572631836, "global_step": 332962, "epoch": 1981} {"train_loss": -11.512832641601562, "global_step": 332963, "epoch": 1981} {"train_loss": -10.255329132080078, "global_step": 332964, "epoch": 1981} {"train_loss": -11.06777572631836, "global_step": 332965, "epoch": 1981} {"train_loss": -9.902402877807617, "global_step": 332966, "epoch": 1981} {"train_loss": -11.337417602539062, "global_step": 332967, "epoch": 1981} {"train_loss": -10.728395462036133, "global_step": 332968, "epoch": 1981} {"train_loss": -11.165855407714844, "global_step": 332969, "epoch": 1981} {"train_loss": -10.542013168334961, "global_step": 332970, "epoch": 1981} {"train_loss": -11.163352966308594, "global_step": 332971, "epoch": 1981} {"train_loss": -11.287153244018555, "global_step": 332972, "epoch": 1981} {"train_loss": -10.860222816467285, "global_step": 332973, "epoch": 1981} {"train_loss": -11.460186958312988, "global_step": 332974, "epoch": 1981} {"train_loss": -11.672513223829723, "global_step": 332975, "epoch": 1981, "val_loss": 284241.6875} {"train_loss": -11.00100040435791, "global_step": 332976, "epoch": 1982} {"train_loss": -11.511329650878906, "global_step": 332977, "epoch": 1982} {"train_loss": -11.408283233642578, "global_step": 332978, "epoch": 1982} {"train_loss": -11.554492950439453, "global_step": 332979, "epoch": 1982} {"train_loss": -11.501615524291992, "global_step": 332980, "epoch": 1982} {"train_loss": -11.641508102416992, "global_step": 332981, "epoch": 1982} {"train_loss": -11.468794822692871, "global_step": 332982, "epoch": 1982} {"train_loss": -11.804939270019531, "global_step": 332983, "epoch": 1982} {"train_loss": -11.509963989257812, "global_step": 332984, "epoch": 1982} {"train_loss": -11.534095764160156, "global_step": 332985, "epoch": 1982} {"train_loss": -12.027022361755371, "global_step": 332986, "epoch": 1982} {"train_loss": -11.233083724975586, "global_step": 332987, "epoch": 1982} {"train_loss": -11.894588470458984, "global_step": 332988, "epoch": 1982} {"train_loss": -11.748594284057617, "global_step": 332989, "epoch": 1982} {"train_loss": -11.509594917297363, "global_step": 332990, "epoch": 1982} {"train_loss": -12.075660705566406, "global_step": 332991, "epoch": 1982} {"train_loss": -11.642799377441406, "global_step": 332992, "epoch": 1982} {"train_loss": -11.605728149414062, "global_step": 332993, "epoch": 1982} {"train_loss": -11.768329620361328, "global_step": 332994, "epoch": 1982} {"train_loss": -11.244937896728516, "global_step": 332995, "epoch": 1982} {"train_loss": -11.59515380859375, "global_step": 332996, "epoch": 1982} {"train_loss": -11.638338088989258, "global_step": 332997, "epoch": 1982} {"train_loss": -11.600322723388672, "global_step": 332998, "epoch": 1982} {"train_loss": -12.269058227539062, "global_step": 332999, "epoch": 1982} {"train_loss": -11.776124954223633, "global_step": 333000, "epoch": 1982} {"train_loss": -12.003859519958496, "global_step": 333001, "epoch": 1982} {"train_loss": -12.174412727355957, "global_step": 333002, "epoch": 1982} {"train_loss": -12.082470893859863, "global_step": 333003, "epoch": 1982} {"train_loss": -12.070777893066406, "global_step": 333004, "epoch": 1982} {"train_loss": -11.923430442810059, "global_step": 333005, "epoch": 1982} {"train_loss": -12.058425903320312, "global_step": 333006, "epoch": 1982} {"train_loss": -12.006616592407227, "global_step": 333007, "epoch": 1982} {"train_loss": -12.159391403198242, "global_step": 333008, "epoch": 1982} {"train_loss": -12.208551406860352, "global_step": 333009, "epoch": 1982} {"train_loss": -12.295753479003906, "global_step": 333010, "epoch": 1982} {"train_loss": -12.056480407714844, "global_step": 333011, "epoch": 1982} {"train_loss": -12.080227851867676, "global_step": 333012, "epoch": 1982} {"train_loss": -12.001962661743164, "global_step": 333013, "epoch": 1982} {"train_loss": -12.02015495300293, "global_step": 333014, "epoch": 1982} {"train_loss": -11.986321449279785, "global_step": 333015, "epoch": 1982} {"train_loss": -12.142309188842773, "global_step": 333016, "epoch": 1982} {"train_loss": -11.771183013916016, "global_step": 333017, "epoch": 1982} {"train_loss": -12.318046569824219, "global_step": 333018, "epoch": 1982} {"train_loss": -12.076616287231445, "global_step": 333019, "epoch": 1982} {"train_loss": -11.947360038757324, "global_step": 333020, "epoch": 1982} {"train_loss": -12.483642578125, "global_step": 333021, "epoch": 1982} {"train_loss": -12.165868759155273, "global_step": 333022, "epoch": 1982} {"train_loss": -11.973745346069336, "global_step": 333023, "epoch": 1982} {"train_loss": -12.394797325134277, "global_step": 333024, "epoch": 1982} {"train_loss": -12.024206161499023, "global_step": 333025, "epoch": 1982} {"train_loss": -12.237979888916016, "global_step": 333026, "epoch": 1982} {"train_loss": -12.27888011932373, "global_step": 333027, "epoch": 1982} {"train_loss": -12.30302906036377, "global_step": 333028, "epoch": 1982} {"train_loss": -12.519081115722656, "global_step": 333029, "epoch": 1982} {"train_loss": -12.297223091125488, "global_step": 333030, "epoch": 1982} {"train_loss": -12.419219970703125, "global_step": 333031, "epoch": 1982} {"train_loss": -12.107398986816406, "global_step": 333032, "epoch": 1982} {"train_loss": -12.270444869995117, "global_step": 333033, "epoch": 1982} {"train_loss": -12.391796112060547, "global_step": 333034, "epoch": 1982} {"train_loss": -12.242530822753906, "global_step": 333035, "epoch": 1982} {"train_loss": -12.354814529418945, "global_step": 333036, "epoch": 1982} {"train_loss": -12.269786834716797, "global_step": 333037, "epoch": 1982} {"train_loss": -12.388350486755371, "global_step": 333038, "epoch": 1982} {"train_loss": -12.511256217956543, "global_step": 333039, "epoch": 1982} {"train_loss": -12.07335090637207, "global_step": 333040, "epoch": 1982} {"train_loss": -12.433465003967285, "global_step": 333041, "epoch": 1982} {"train_loss": -12.412559509277344, "global_step": 333042, "epoch": 1982} {"train_loss": -12.508554458618164, "global_step": 333043, "epoch": 1982} {"train_loss": -12.350591659545898, "global_step": 333044, "epoch": 1982} {"train_loss": -12.248780250549316, "global_step": 333045, "epoch": 1982} {"train_loss": -12.600257873535156, "global_step": 333046, "epoch": 1982} {"train_loss": -12.363006591796875, "global_step": 333047, "epoch": 1982} {"train_loss": -12.595743179321289, "global_step": 333048, "epoch": 1982} {"train_loss": -12.514347076416016, "global_step": 333049, "epoch": 1982} {"train_loss": -12.458857536315918, "global_step": 333050, "epoch": 1982} {"train_loss": -12.52666187286377, "global_step": 333051, "epoch": 1982} {"train_loss": -12.722134590148926, "global_step": 333052, "epoch": 1982} {"train_loss": -12.595903396606445, "global_step": 333053, "epoch": 1982} {"train_loss": -12.601325988769531, "global_step": 333054, "epoch": 1982} {"train_loss": -12.436929702758789, "global_step": 333055, "epoch": 1982} {"train_loss": -12.500426292419434, "global_step": 333056, "epoch": 1982} {"train_loss": -12.286712646484375, "global_step": 333057, "epoch": 1982} {"train_loss": -12.63818359375, "global_step": 333058, "epoch": 1982} {"train_loss": -12.489267349243164, "global_step": 333059, "epoch": 1982} {"train_loss": -12.589632034301758, "global_step": 333060, "epoch": 1982} {"train_loss": -12.499600410461426, "global_step": 333061, "epoch": 1982} {"train_loss": -12.5874605178833, "global_step": 333062, "epoch": 1982} {"train_loss": -12.593246459960938, "global_step": 333063, "epoch": 1982} {"train_loss": -12.576607704162598, "global_step": 333064, "epoch": 1982} {"train_loss": -12.431915283203125, "global_step": 333065, "epoch": 1982} {"train_loss": -12.618314743041992, "global_step": 333066, "epoch": 1982} {"train_loss": -12.601244926452637, "global_step": 333067, "epoch": 1982} {"train_loss": -12.4275484085083, "global_step": 333068, "epoch": 1982} {"train_loss": -12.40412425994873, "global_step": 333069, "epoch": 1982} {"train_loss": -12.58963394165039, "global_step": 333070, "epoch": 1982} {"train_loss": -12.249467849731445, "global_step": 333071, "epoch": 1982} {"train_loss": -12.28782844543457, "global_step": 333072, "epoch": 1982} {"train_loss": -12.12785530090332, "global_step": 333073, "epoch": 1982} {"train_loss": -12.182682037353516, "global_step": 333074, "epoch": 1982} {"train_loss": -12.1297025680542, "global_step": 333075, "epoch": 1982} {"train_loss": -12.484161376953125, "global_step": 333076, "epoch": 1982} {"train_loss": -12.308399200439453, "global_step": 333077, "epoch": 1982} {"train_loss": -12.332096099853516, "global_step": 333078, "epoch": 1982} {"train_loss": -12.336795806884766, "global_step": 333079, "epoch": 1982} {"train_loss": -12.535575866699219, "global_step": 333080, "epoch": 1982} {"train_loss": -12.342584609985352, "global_step": 333081, "epoch": 1982} {"train_loss": -12.534528732299805, "global_step": 333082, "epoch": 1982} {"train_loss": -12.349273681640625, "global_step": 333083, "epoch": 1982} {"train_loss": -12.13077449798584, "global_step": 333084, "epoch": 1982} {"train_loss": -12.618924140930176, "global_step": 333085, "epoch": 1982} {"train_loss": -12.123245239257812, "global_step": 333086, "epoch": 1982} {"train_loss": -12.171754837036133, "global_step": 333087, "epoch": 1982} {"train_loss": -12.16235637664795, "global_step": 333088, "epoch": 1982} {"train_loss": -11.90813159942627, "global_step": 333089, "epoch": 1982} {"train_loss": -10.906003952026367, "global_step": 333090, "epoch": 1982} {"train_loss": -11.27543830871582, "global_step": 333091, "epoch": 1982} {"train_loss": -11.79254150390625, "global_step": 333092, "epoch": 1982} {"train_loss": -12.177501678466797, "global_step": 333093, "epoch": 1982} {"train_loss": -11.791341781616211, "global_step": 333094, "epoch": 1982} {"train_loss": -10.812058448791504, "global_step": 333095, "epoch": 1982} {"train_loss": -12.230470657348633, "global_step": 333096, "epoch": 1982} {"train_loss": -10.684635162353516, "global_step": 333097, "epoch": 1982} {"train_loss": -10.266910552978516, "global_step": 333098, "epoch": 1982} {"train_loss": -12.215182304382324, "global_step": 333099, "epoch": 1982} {"train_loss": -11.922172546386719, "global_step": 333100, "epoch": 1982} {"train_loss": -11.742473602294922, "global_step": 333101, "epoch": 1982} {"train_loss": -11.983953475952148, "global_step": 333102, "epoch": 1982} {"train_loss": -12.409187316894531, "global_step": 333103, "epoch": 1982} {"train_loss": -11.923358917236328, "global_step": 333104, "epoch": 1982} {"train_loss": -11.760831832885742, "global_step": 333105, "epoch": 1982} {"train_loss": -12.23664665222168, "global_step": 333106, "epoch": 1982} {"train_loss": -11.944185256958008, "global_step": 333107, "epoch": 1982} {"train_loss": -12.23740005493164, "global_step": 333108, "epoch": 1982} {"train_loss": -11.630620002746582, "global_step": 333109, "epoch": 1982} {"train_loss": -12.335949897766113, "global_step": 333110, "epoch": 1982} {"train_loss": -12.026432037353516, "global_step": 333111, "epoch": 1982} {"train_loss": -12.201238632202148, "global_step": 333112, "epoch": 1982} {"train_loss": -11.786334991455078, "global_step": 333113, "epoch": 1982} {"train_loss": -12.496204376220703, "global_step": 333114, "epoch": 1982} {"train_loss": -12.150732040405273, "global_step": 333115, "epoch": 1982} {"train_loss": -12.345685005187988, "global_step": 333116, "epoch": 1982} {"train_loss": -12.133840560913086, "global_step": 333117, "epoch": 1982} {"train_loss": -12.19747543334961, "global_step": 333118, "epoch": 1982} {"train_loss": -12.22059440612793, "global_step": 333119, "epoch": 1982} {"train_loss": -12.074594497680664, "global_step": 333120, "epoch": 1982} {"train_loss": -12.331317901611328, "global_step": 333121, "epoch": 1982} {"train_loss": -11.820781707763672, "global_step": 333122, "epoch": 1982} {"train_loss": -12.412893295288086, "global_step": 333123, "epoch": 1982} {"train_loss": -12.223479270935059, "global_step": 333124, "epoch": 1982} {"train_loss": -11.997560501098633, "global_step": 333125, "epoch": 1982} {"train_loss": -12.25795841217041, "global_step": 333126, "epoch": 1982} {"train_loss": -12.199943542480469, "global_step": 333127, "epoch": 1982} {"train_loss": -12.223251342773438, "global_step": 333128, "epoch": 1982} {"train_loss": -12.317112922668457, "global_step": 333129, "epoch": 1982} {"train_loss": -12.436965942382812, "global_step": 333130, "epoch": 1982} {"train_loss": -12.178703308105469, "global_step": 333131, "epoch": 1982} {"train_loss": -12.568036079406738, "global_step": 333132, "epoch": 1982} {"train_loss": -12.372385025024414, "global_step": 333133, "epoch": 1982} {"train_loss": -12.488896369934082, "global_step": 333134, "epoch": 1982} {"train_loss": -12.389183044433594, "global_step": 333135, "epoch": 1982} {"train_loss": -12.113807678222656, "global_step": 333136, "epoch": 1982} {"train_loss": -12.10629940032959, "global_step": 333137, "epoch": 1982} {"train_loss": -12.52987289428711, "global_step": 333138, "epoch": 1982} {"train_loss": -11.534103393554688, "global_step": 333139, "epoch": 1982} {"train_loss": -11.122982025146484, "global_step": 333140, "epoch": 1982} {"train_loss": -12.307942390441895, "global_step": 333141, "epoch": 1982} {"train_loss": -11.829224586486816, "global_step": 333142, "epoch": 1982} {"train_loss": -12.103640130587987, "global_step": 333143, "epoch": 1982, "val_loss": 284764.65625} {"train_loss": -12.426469802856445, "global_step": 333144, "epoch": 1983} {"train_loss": -10.892374038696289, "global_step": 333145, "epoch": 1983} {"train_loss": -11.429208755493164, "global_step": 333146, "epoch": 1983} {"train_loss": -11.766193389892578, "global_step": 333147, "epoch": 1983} {"train_loss": -11.551351547241211, "global_step": 333148, "epoch": 1983} {"train_loss": -11.995328903198242, "global_step": 333149, "epoch": 1983} {"train_loss": -11.235118865966797, "global_step": 333150, "epoch": 1983} {"train_loss": -11.719207763671875, "global_step": 333151, "epoch": 1983} {"train_loss": -11.34669303894043, "global_step": 333152, "epoch": 1983} {"train_loss": -11.564064979553223, "global_step": 333153, "epoch": 1983} {"train_loss": -11.484639167785645, "global_step": 333154, "epoch": 1983} {"train_loss": -10.428417205810547, "global_step": 333155, "epoch": 1983} {"train_loss": -10.241724967956543, "global_step": 333156, "epoch": 1983} {"train_loss": -11.77993392944336, "global_step": 333157, "epoch": 1983} {"train_loss": -10.470035552978516, "global_step": 333158, "epoch": 1983} {"train_loss": -10.996593475341797, "global_step": 333159, "epoch": 1983} {"train_loss": -9.735429763793945, "global_step": 333160, "epoch": 1983} {"train_loss": -10.902307510375977, "global_step": 333161, "epoch": 1983} {"train_loss": -11.304255485534668, "global_step": 333162, "epoch": 1983} {"train_loss": -11.467430114746094, "global_step": 333163, "epoch": 1983} {"train_loss": -11.492555618286133, "global_step": 333164, "epoch": 1983} {"train_loss": -11.637187957763672, "global_step": 333165, "epoch": 1983} {"train_loss": -11.312426567077637, "global_step": 333166, "epoch": 1983} {"train_loss": -11.99540901184082, "global_step": 333167, "epoch": 1983} {"train_loss": -11.575948715209961, "global_step": 333168, "epoch": 1983} {"train_loss": -11.30948257446289, "global_step": 333169, "epoch": 1983} {"train_loss": -12.014579772949219, "global_step": 333170, "epoch": 1983} {"train_loss": -11.513387680053711, "global_step": 333171, "epoch": 1983} {"train_loss": -11.98083209991455, "global_step": 333172, "epoch": 1983} {"train_loss": -11.785497665405273, "global_step": 333173, "epoch": 1983} {"train_loss": -11.657365798950195, "global_step": 333174, "epoch": 1983} {"train_loss": -12.031076431274414, "global_step": 333175, "epoch": 1983} {"train_loss": -11.075620651245117, "global_step": 333176, "epoch": 1983} {"train_loss": -11.4541015625, "global_step": 333177, "epoch": 1983} {"train_loss": -11.081489562988281, "global_step": 333178, "epoch": 1983} {"train_loss": -9.839345932006836, "global_step": 333179, "epoch": 1983} {"train_loss": -10.251272201538086, "global_step": 333180, "epoch": 1983} {"train_loss": -11.400178909301758, "global_step": 333181, "epoch": 1983} {"train_loss": -10.550688743591309, "global_step": 333182, "epoch": 1983} {"train_loss": -10.364082336425781, "global_step": 333183, "epoch": 1983} {"train_loss": -11.496650695800781, "global_step": 333184, "epoch": 1983} {"train_loss": -10.593870162963867, "global_step": 333185, "epoch": 1983} {"train_loss": -10.96864128112793, "global_step": 333186, "epoch": 1983} {"train_loss": -10.397100448608398, "global_step": 333187, "epoch": 1983} {"train_loss": -9.114209175109863, "global_step": 333188, "epoch": 1983} {"train_loss": -11.167423248291016, "global_step": 333189, "epoch": 1983} {"train_loss": -9.593655586242676, "global_step": 333190, "epoch": 1983} {"train_loss": -10.83053970336914, "global_step": 333191, "epoch": 1983} {"train_loss": -10.305075645446777, "global_step": 333192, "epoch": 1983} {"train_loss": -10.570989608764648, "global_step": 333193, "epoch": 1983} {"train_loss": -9.57100772857666, "global_step": 333194, "epoch": 1983} {"train_loss": -11.036237716674805, "global_step": 333195, "epoch": 1983} {"train_loss": -10.262369155883789, "global_step": 333196, "epoch": 1983} {"train_loss": -11.85651969909668, "global_step": 333197, "epoch": 1983} {"train_loss": -10.58370590209961, "global_step": 333198, "epoch": 1983} {"train_loss": -11.44566535949707, "global_step": 333199, "epoch": 1983} {"train_loss": -11.567094802856445, "global_step": 333200, "epoch": 1983} {"train_loss": -10.915786743164062, "global_step": 333201, "epoch": 1983} {"train_loss": -10.762566566467285, "global_step": 333202, "epoch": 1983} {"train_loss": -12.056154251098633, "global_step": 333203, "epoch": 1983} {"train_loss": -11.006355285644531, "global_step": 333204, "epoch": 1983} {"train_loss": -11.532405853271484, "global_step": 333205, "epoch": 1983} {"train_loss": -11.70736312866211, "global_step": 333206, "epoch": 1983} {"train_loss": -10.91038990020752, "global_step": 333207, "epoch": 1983} {"train_loss": -11.263981819152832, "global_step": 333208, "epoch": 1983} {"train_loss": -11.624961853027344, "global_step": 333209, "epoch": 1983} {"train_loss": -11.394962310791016, "global_step": 333210, "epoch": 1983} {"train_loss": -11.433063507080078, "global_step": 333211, "epoch": 1983} {"train_loss": -11.574718475341797, "global_step": 333212, "epoch": 1983} {"train_loss": -11.237553596496582, "global_step": 333213, "epoch": 1983} {"train_loss": -11.932380676269531, "global_step": 333214, "epoch": 1983} {"train_loss": -11.68110466003418, "global_step": 333215, "epoch": 1983} {"train_loss": -11.806785583496094, "global_step": 333216, "epoch": 1983} {"train_loss": -11.291980743408203, "global_step": 333217, "epoch": 1983} {"train_loss": -11.967767715454102, "global_step": 333218, "epoch": 1983} {"train_loss": -11.664571762084961, "global_step": 333219, "epoch": 1983} {"train_loss": -11.605727195739746, "global_step": 333220, "epoch": 1983} {"train_loss": -11.889765739440918, "global_step": 333221, "epoch": 1983} {"train_loss": -11.506858825683594, "global_step": 333222, "epoch": 1983} {"train_loss": -11.80109691619873, "global_step": 333223, "epoch": 1983} {"train_loss": -11.989145278930664, "global_step": 333224, "epoch": 1983} {"train_loss": -11.754618644714355, "global_step": 333225, "epoch": 1983} {"train_loss": -11.831439971923828, "global_step": 333226, "epoch": 1983} {"train_loss": -11.885771751403809, "global_step": 333227, "epoch": 1983} {"train_loss": -11.698384284973145, "global_step": 333228, "epoch": 1983} {"train_loss": -11.988604545593262, "global_step": 333229, "epoch": 1983} {"train_loss": -12.21185302734375, "global_step": 333230, "epoch": 1983} {"train_loss": -12.126945495605469, "global_step": 333231, "epoch": 1983} {"train_loss": -12.00296688079834, "global_step": 333232, "epoch": 1983} {"train_loss": -12.136503219604492, "global_step": 333233, "epoch": 1983} {"train_loss": -12.184759140014648, "global_step": 333234, "epoch": 1983} {"train_loss": -12.179682731628418, "global_step": 333235, "epoch": 1983} {"train_loss": -12.107831954956055, "global_step": 333236, "epoch": 1983} {"train_loss": -12.065523147583008, "global_step": 333237, "epoch": 1983} {"train_loss": -12.36566162109375, "global_step": 333238, "epoch": 1983} {"train_loss": -12.32554817199707, "global_step": 333239, "epoch": 1983} {"train_loss": -12.051368713378906, "global_step": 333240, "epoch": 1983} {"train_loss": -12.359947204589844, "global_step": 333241, "epoch": 1983} {"train_loss": -12.08016586303711, "global_step": 333242, "epoch": 1983} {"train_loss": -12.309219360351562, "global_step": 333243, "epoch": 1983} {"train_loss": -12.242998123168945, "global_step": 333244, "epoch": 1983} {"train_loss": -12.398687362670898, "global_step": 333245, "epoch": 1983} {"train_loss": -12.304786682128906, "global_step": 333246, "epoch": 1983} {"train_loss": -12.325296401977539, "global_step": 333247, "epoch": 1983} {"train_loss": -12.292438507080078, "global_step": 333248, "epoch": 1983} {"train_loss": -12.31375503540039, "global_step": 333249, "epoch": 1983} {"train_loss": -12.521068572998047, "global_step": 333250, "epoch": 1983} {"train_loss": -12.444522857666016, "global_step": 333251, "epoch": 1983} {"train_loss": -12.43051815032959, "global_step": 333252, "epoch": 1983} {"train_loss": -12.351219177246094, "global_step": 333253, "epoch": 1983} {"train_loss": -12.264091491699219, "global_step": 333254, "epoch": 1983} {"train_loss": -12.483016014099121, "global_step": 333255, "epoch": 1983} {"train_loss": -12.37691879272461, "global_step": 333256, "epoch": 1983} {"train_loss": -12.37205982208252, "global_step": 333257, "epoch": 1983} {"train_loss": -12.429071426391602, "global_step": 333258, "epoch": 1983} {"train_loss": -12.426843643188477, "global_step": 333259, "epoch": 1983} {"train_loss": -12.501579284667969, "global_step": 333260, "epoch": 1983} {"train_loss": -12.459228515625, "global_step": 333261, "epoch": 1983} {"train_loss": -12.184213638305664, "global_step": 333262, "epoch": 1983} {"train_loss": -12.618148803710938, "global_step": 333263, "epoch": 1983} {"train_loss": -12.56004810333252, "global_step": 333264, "epoch": 1983} {"train_loss": -12.474924087524414, "global_step": 333265, "epoch": 1983} {"train_loss": -12.374272346496582, "global_step": 333266, "epoch": 1983} {"train_loss": -12.425191879272461, "global_step": 333267, "epoch": 1983} {"train_loss": -12.480653762817383, "global_step": 333268, "epoch": 1983} {"train_loss": -12.535808563232422, "global_step": 333269, "epoch": 1983} {"train_loss": -12.613611221313477, "global_step": 333270, "epoch": 1983} {"train_loss": -12.51205062866211, "global_step": 333271, "epoch": 1983} {"train_loss": -12.483071327209473, "global_step": 333272, "epoch": 1983} {"train_loss": -12.61247444152832, "global_step": 333273, "epoch": 1983} {"train_loss": -12.654476165771484, "global_step": 333274, "epoch": 1983} {"train_loss": -12.608354568481445, "global_step": 333275, "epoch": 1983} {"train_loss": -12.56076431274414, "global_step": 333276, "epoch": 1983} {"train_loss": -12.620723724365234, "global_step": 333277, "epoch": 1983} {"train_loss": -12.639494895935059, "global_step": 333278, "epoch": 1983} {"train_loss": -12.695449829101562, "global_step": 333279, "epoch": 1983} {"train_loss": -12.590465545654297, "global_step": 333280, "epoch": 1983} {"train_loss": -12.673286437988281, "global_step": 333281, "epoch": 1983} {"train_loss": -12.42821979522705, "global_step": 333282, "epoch": 1983} {"train_loss": -12.53514575958252, "global_step": 333283, "epoch": 1983} {"train_loss": -12.795459747314453, "global_step": 333284, "epoch": 1983} {"train_loss": -12.516548156738281, "global_step": 333285, "epoch": 1983} {"train_loss": -12.5841064453125, "global_step": 333286, "epoch": 1983} {"train_loss": -12.556543350219727, "global_step": 333287, "epoch": 1983} {"train_loss": -12.657012939453125, "global_step": 333288, "epoch": 1983} {"train_loss": -12.688995361328125, "global_step": 333289, "epoch": 1983} {"train_loss": -12.435302734375, "global_step": 333290, "epoch": 1983} {"train_loss": -12.199132919311523, "global_step": 333291, "epoch": 1983} {"train_loss": -12.432525634765625, "global_step": 333292, "epoch": 1983} {"train_loss": -12.41915512084961, "global_step": 333293, "epoch": 1983} {"train_loss": -12.583467483520508, "global_step": 333294, "epoch": 1983} {"train_loss": -12.551692962646484, "global_step": 333295, "epoch": 1983} {"train_loss": -12.78505802154541, "global_step": 333296, "epoch": 1983} {"train_loss": -12.497713088989258, "global_step": 333297, "epoch": 1983} {"train_loss": -12.63768196105957, "global_step": 333298, "epoch": 1983} {"train_loss": -12.627796173095703, "global_step": 333299, "epoch": 1983} {"train_loss": -12.64954948425293, "global_step": 333300, "epoch": 1983} {"train_loss": -12.64777660369873, "global_step": 333301, "epoch": 1983} {"train_loss": -12.60909366607666, "global_step": 333302, "epoch": 1983} {"train_loss": -12.473579406738281, "global_step": 333303, "epoch": 1983} {"train_loss": -12.425479888916016, "global_step": 333304, "epoch": 1983} {"train_loss": -12.757506370544434, "global_step": 333305, "epoch": 1983} {"train_loss": -12.841211318969727, "global_step": 333306, "epoch": 1983} {"train_loss": -12.277811050415039, "global_step": 333307, "epoch": 1983} {"train_loss": -11.813945770263672, "global_step": 333308, "epoch": 1983} {"train_loss": -12.194952964782715, "global_step": 333309, "epoch": 1983} {"train_loss": -12.447643280029297, "global_step": 333310, "epoch": 1983} {"train_loss": -11.83244746639615, "global_step": 333311, "epoch": 1983, "val_loss": 287552.875} {"train_loss": -11.471776962280273, "global_step": 333312, "epoch": 1984} {"train_loss": -12.16383171081543, "global_step": 333313, "epoch": 1984} {"train_loss": -12.13557243347168, "global_step": 333314, "epoch": 1984} {"train_loss": -12.096112251281738, "global_step": 333315, "epoch": 1984} {"train_loss": -10.839816093444824, "global_step": 333316, "epoch": 1984} {"train_loss": -10.524576187133789, "global_step": 333317, "epoch": 1984} {"train_loss": -10.68636417388916, "global_step": 333318, "epoch": 1984} {"train_loss": -10.129240036010742, "global_step": 333319, "epoch": 1984} {"train_loss": -9.38015365600586, "global_step": 333320, "epoch": 1984} {"train_loss": -9.232150077819824, "global_step": 333321, "epoch": 1984} {"train_loss": -11.036775588989258, "global_step": 333322, "epoch": 1984} {"train_loss": -9.603301048278809, "global_step": 333323, "epoch": 1984} {"train_loss": -9.605660438537598, "global_step": 333324, "epoch": 1984} {"train_loss": -11.452352523803711, "global_step": 333325, "epoch": 1984} {"train_loss": -10.179222106933594, "global_step": 333326, "epoch": 1984} {"train_loss": -11.049856185913086, "global_step": 333327, "epoch": 1984} {"train_loss": -10.734870910644531, "global_step": 333328, "epoch": 1984} {"train_loss": -9.113685607910156, "global_step": 333329, "epoch": 1984} {"train_loss": -11.191450119018555, "global_step": 333330, "epoch": 1984} {"train_loss": -9.61130142211914, "global_step": 333331, "epoch": 1984} {"train_loss": -9.400321006774902, "global_step": 333332, "epoch": 1984} {"train_loss": -9.560042381286621, "global_step": 333333, "epoch": 1984} {"train_loss": -10.815109252929688, "global_step": 333334, "epoch": 1984} {"train_loss": -8.91571044921875, "global_step": 333335, "epoch": 1984} {"train_loss": -10.076595306396484, "global_step": 333336, "epoch": 1984} {"train_loss": -9.975632667541504, "global_step": 333337, "epoch": 1984} {"train_loss": -10.485865592956543, "global_step": 333338, "epoch": 1984} {"train_loss": -10.794527053833008, "global_step": 333339, "epoch": 1984} {"train_loss": -10.287540435791016, "global_step": 333340, "epoch": 1984} {"train_loss": -11.289241790771484, "global_step": 333341, "epoch": 1984} {"train_loss": -11.074640274047852, "global_step": 333342, "epoch": 1984} {"train_loss": -11.712323188781738, "global_step": 333343, "epoch": 1984} {"train_loss": -11.512537002563477, "global_step": 333344, "epoch": 1984} {"train_loss": -11.74603271484375, "global_step": 333345, "epoch": 1984} {"train_loss": -11.315868377685547, "global_step": 333346, "epoch": 1984} {"train_loss": -11.231815338134766, "global_step": 333347, "epoch": 1984} {"train_loss": -11.410703659057617, "global_step": 333348, "epoch": 1984} {"train_loss": -10.843505859375, "global_step": 333349, "epoch": 1984} {"train_loss": -11.670588493347168, "global_step": 333350, "epoch": 1984} {"train_loss": -11.128067970275879, "global_step": 333351, "epoch": 1984} {"train_loss": -11.656205177307129, "global_step": 333352, "epoch": 1984} {"train_loss": -11.465206146240234, "global_step": 333353, "epoch": 1984} {"train_loss": -11.634693145751953, "global_step": 333354, "epoch": 1984} {"train_loss": -11.695328712463379, "global_step": 333355, "epoch": 1984} {"train_loss": -12.01510238647461, "global_step": 333356, "epoch": 1984} {"train_loss": -11.74172592163086, "global_step": 333357, "epoch": 1984} {"train_loss": -12.123017311096191, "global_step": 333358, "epoch": 1984} {"train_loss": -11.742591857910156, "global_step": 333359, "epoch": 1984} {"train_loss": -12.080523490905762, "global_step": 333360, "epoch": 1984} {"train_loss": -11.765487670898438, "global_step": 333361, "epoch": 1984} {"train_loss": -12.158291816711426, "global_step": 333362, "epoch": 1984} {"train_loss": -11.881688117980957, "global_step": 333363, "epoch": 1984} {"train_loss": -12.089578628540039, "global_step": 333364, "epoch": 1984} {"train_loss": -11.979248046875, "global_step": 333365, "epoch": 1984} {"train_loss": -11.834571838378906, "global_step": 333366, "epoch": 1984} {"train_loss": -11.96614933013916, "global_step": 333367, "epoch": 1984} {"train_loss": -11.7951021194458, "global_step": 333368, "epoch": 1984} {"train_loss": -12.120532035827637, "global_step": 333369, "epoch": 1984} {"train_loss": -12.037301063537598, "global_step": 333370, "epoch": 1984} {"train_loss": -12.1995267868042, "global_step": 333371, "epoch": 1984} {"train_loss": -12.279450416564941, "global_step": 333372, "epoch": 1984} {"train_loss": -12.051401138305664, "global_step": 333373, "epoch": 1984} {"train_loss": -12.302288055419922, "global_step": 333374, "epoch": 1984} {"train_loss": -11.925434112548828, "global_step": 333375, "epoch": 1984} {"train_loss": -12.211544036865234, "global_step": 333376, "epoch": 1984} {"train_loss": -12.355890274047852, "global_step": 333377, "epoch": 1984} {"train_loss": -12.362603187561035, "global_step": 333378, "epoch": 1984} {"train_loss": -12.338571548461914, "global_step": 333379, "epoch": 1984} {"train_loss": -12.227262496948242, "global_step": 333380, "epoch": 1984} {"train_loss": -12.389021873474121, "global_step": 333381, "epoch": 1984} {"train_loss": -12.234016418457031, "global_step": 333382, "epoch": 1984} {"train_loss": -12.309314727783203, "global_step": 333383, "epoch": 1984} {"train_loss": -12.213105201721191, "global_step": 333384, "epoch": 1984} {"train_loss": -12.429031372070312, "global_step": 333385, "epoch": 1984} {"train_loss": -12.224809646606445, "global_step": 333386, "epoch": 1984} {"train_loss": -12.354314804077148, "global_step": 333387, "epoch": 1984} {"train_loss": -12.202587127685547, "global_step": 333388, "epoch": 1984} {"train_loss": -12.222332000732422, "global_step": 333389, "epoch": 1984} {"train_loss": -12.204524993896484, "global_step": 333390, "epoch": 1984} {"train_loss": -12.56016731262207, "global_step": 333391, "epoch": 1984} {"train_loss": -12.469720840454102, "global_step": 333392, "epoch": 1984} {"train_loss": -12.478218078613281, "global_step": 333393, "epoch": 1984} {"train_loss": -12.345515251159668, "global_step": 333394, "epoch": 1984} {"train_loss": -12.555347442626953, "global_step": 333395, "epoch": 1984} {"train_loss": -12.313973426818848, "global_step": 333396, "epoch": 1984} {"train_loss": -12.448586463928223, "global_step": 333397, "epoch": 1984} {"train_loss": -12.156572341918945, "global_step": 333398, "epoch": 1984} {"train_loss": -12.439059257507324, "global_step": 333399, "epoch": 1984} {"train_loss": -12.358415603637695, "global_step": 333400, "epoch": 1984} {"train_loss": -12.630536079406738, "global_step": 333401, "epoch": 1984} {"train_loss": -12.353494644165039, "global_step": 333402, "epoch": 1984} {"train_loss": -12.452102661132812, "global_step": 333403, "epoch": 1984} {"train_loss": -12.497010231018066, "global_step": 333404, "epoch": 1984} {"train_loss": -12.44871997833252, "global_step": 333405, "epoch": 1984} {"train_loss": -12.51835823059082, "global_step": 333406, "epoch": 1984} {"train_loss": -12.377161026000977, "global_step": 333407, "epoch": 1984} {"train_loss": -12.664125442504883, "global_step": 333408, "epoch": 1984} {"train_loss": -12.511749267578125, "global_step": 333409, "epoch": 1984} {"train_loss": -12.633012771606445, "global_step": 333410, "epoch": 1984} {"train_loss": -12.345613479614258, "global_step": 333411, "epoch": 1984} {"train_loss": -12.469715118408203, "global_step": 333412, "epoch": 1984} {"train_loss": -12.523273468017578, "global_step": 333413, "epoch": 1984} {"train_loss": -12.334026336669922, "global_step": 333414, "epoch": 1984} {"train_loss": -12.420035362243652, "global_step": 333415, "epoch": 1984} {"train_loss": -12.357321739196777, "global_step": 333416, "epoch": 1984} {"train_loss": -12.351083755493164, "global_step": 333417, "epoch": 1984} {"train_loss": -12.417863845825195, "global_step": 333418, "epoch": 1984} {"train_loss": -12.5621337890625, "global_step": 333419, "epoch": 1984} {"train_loss": -12.343421936035156, "global_step": 333420, "epoch": 1984} {"train_loss": -12.51388931274414, "global_step": 333421, "epoch": 1984} {"train_loss": -12.423250198364258, "global_step": 333422, "epoch": 1984} {"train_loss": -12.193037033081055, "global_step": 333423, "epoch": 1984} {"train_loss": -11.725290298461914, "global_step": 333424, "epoch": 1984} {"train_loss": -12.327136993408203, "global_step": 333425, "epoch": 1984} {"train_loss": -12.33935546875, "global_step": 333426, "epoch": 1984} {"train_loss": -12.447392463684082, "global_step": 333427, "epoch": 1984} {"train_loss": -12.315376281738281, "global_step": 333428, "epoch": 1984} {"train_loss": -12.647048950195312, "global_step": 333429, "epoch": 1984} {"train_loss": -12.256026268005371, "global_step": 333430, "epoch": 1984} {"train_loss": -12.466053009033203, "global_step": 333431, "epoch": 1984} {"train_loss": -12.274325370788574, "global_step": 333432, "epoch": 1984} {"train_loss": -12.230998992919922, "global_step": 333433, "epoch": 1984} {"train_loss": -12.52606201171875, "global_step": 333434, "epoch": 1984} {"train_loss": -12.431327819824219, "global_step": 333435, "epoch": 1984} {"train_loss": -12.428924560546875, "global_step": 333436, "epoch": 1984} {"train_loss": -12.211610794067383, "global_step": 333437, "epoch": 1984} {"train_loss": -12.493045806884766, "global_step": 333438, "epoch": 1984} {"train_loss": -11.681682586669922, "global_step": 333439, "epoch": 1984} {"train_loss": -11.802775382995605, "global_step": 333440, "epoch": 1984} {"train_loss": -11.995478630065918, "global_step": 333441, "epoch": 1984} {"train_loss": -11.260369300842285, "global_step": 333442, "epoch": 1984} {"train_loss": -11.020095825195312, "global_step": 333443, "epoch": 1984} {"train_loss": -11.409784317016602, "global_step": 333444, "epoch": 1984} {"train_loss": -11.14604377746582, "global_step": 333445, "epoch": 1984} {"train_loss": -10.996895790100098, "global_step": 333446, "epoch": 1984} {"train_loss": -11.423442840576172, "global_step": 333447, "epoch": 1984} {"train_loss": -10.261096954345703, "global_step": 333448, "epoch": 1984} {"train_loss": -12.311710357666016, "global_step": 333449, "epoch": 1984} {"train_loss": -11.1859130859375, "global_step": 333450, "epoch": 1984} {"train_loss": -12.180530548095703, "global_step": 333451, "epoch": 1984} {"train_loss": -11.297771453857422, "global_step": 333452, "epoch": 1984} {"train_loss": -11.331209182739258, "global_step": 333453, "epoch": 1984} {"train_loss": -12.012876510620117, "global_step": 333454, "epoch": 1984} {"train_loss": -11.180221557617188, "global_step": 333455, "epoch": 1984} {"train_loss": -11.558218002319336, "global_step": 333456, "epoch": 1984} {"train_loss": -11.489410400390625, "global_step": 333457, "epoch": 1984} {"train_loss": -11.852249145507812, "global_step": 333458, "epoch": 1984} {"train_loss": -10.774435043334961, "global_step": 333459, "epoch": 1984} {"train_loss": -11.406753540039062, "global_step": 333460, "epoch": 1984} {"train_loss": -11.078346252441406, "global_step": 333461, "epoch": 1984} {"train_loss": -11.783697128295898, "global_step": 333462, "epoch": 1984} {"train_loss": -11.5512113571167, "global_step": 333463, "epoch": 1984} {"train_loss": -11.938069343566895, "global_step": 333464, "epoch": 1984} {"train_loss": -11.480520248413086, "global_step": 333465, "epoch": 1984} {"train_loss": -11.291074752807617, "global_step": 333466, "epoch": 1984} {"train_loss": -11.894989013671875, "global_step": 333467, "epoch": 1984} {"train_loss": -12.181843757629395, "global_step": 333468, "epoch": 1984} {"train_loss": -11.905070304870605, "global_step": 333469, "epoch": 1984} {"train_loss": -12.11646556854248, "global_step": 333470, "epoch": 1984} {"train_loss": -11.862432479858398, "global_step": 333471, "epoch": 1984} {"train_loss": -12.146612167358398, "global_step": 333472, "epoch": 1984} {"train_loss": -11.912264823913574, "global_step": 333473, "epoch": 1984} {"train_loss": -12.112614631652832, "global_step": 333474, "epoch": 1984} {"train_loss": -11.577932357788086, "global_step": 333475, "epoch": 1984} {"train_loss": -11.332408905029297, "global_step": 333476, "epoch": 1984} {"train_loss": -11.728532791137695, "global_step": 333477, "epoch": 1984} {"train_loss": -11.590245246887207, "global_step": 333478, "epoch": 1984} {"train_loss": -11.7184545312609, "global_step": 333479, "epoch": 1984, "val_loss": 284178.09375} {"train_loss": -11.174164772033691, "global_step": 333480, "epoch": 1985} {"train_loss": -11.552927017211914, "global_step": 333481, "epoch": 1985} {"train_loss": -11.346476554870605, "global_step": 333482, "epoch": 1985} {"train_loss": -11.594720840454102, "global_step": 333483, "epoch": 1985} {"train_loss": -11.419828414916992, "global_step": 333484, "epoch": 1985} {"train_loss": -12.031938552856445, "global_step": 333485, "epoch": 1985} {"train_loss": -11.22071647644043, "global_step": 333486, "epoch": 1985} {"train_loss": -11.980426788330078, "global_step": 333487, "epoch": 1985} {"train_loss": -11.642314910888672, "global_step": 333488, "epoch": 1985} {"train_loss": -12.173134803771973, "global_step": 333489, "epoch": 1985} {"train_loss": -11.697983741760254, "global_step": 333490, "epoch": 1985} {"train_loss": -11.949075698852539, "global_step": 333491, "epoch": 1985} {"train_loss": -11.761068344116211, "global_step": 333492, "epoch": 1985} {"train_loss": -12.11172103881836, "global_step": 333493, "epoch": 1985} {"train_loss": -11.79074764251709, "global_step": 333494, "epoch": 1985} {"train_loss": -12.315105438232422, "global_step": 333495, "epoch": 1985} {"train_loss": -12.109563827514648, "global_step": 333496, "epoch": 1985} {"train_loss": -12.044975280761719, "global_step": 333497, "epoch": 1985} {"train_loss": -12.450806617736816, "global_step": 333498, "epoch": 1985} {"train_loss": -12.163766860961914, "global_step": 333499, "epoch": 1985} {"train_loss": -12.32011604309082, "global_step": 333500, "epoch": 1985} {"train_loss": -12.083423614501953, "global_step": 333501, "epoch": 1985} {"train_loss": -12.39843463897705, "global_step": 333502, "epoch": 1985} {"train_loss": -12.402349472045898, "global_step": 333503, "epoch": 1985} {"train_loss": -11.858678817749023, "global_step": 333504, "epoch": 1985} {"train_loss": -12.535564422607422, "global_step": 333505, "epoch": 1985} {"train_loss": -12.16946029663086, "global_step": 333506, "epoch": 1985} {"train_loss": -12.204793930053711, "global_step": 333507, "epoch": 1985} {"train_loss": -12.15664291381836, "global_step": 333508, "epoch": 1985} {"train_loss": -12.018644332885742, "global_step": 333509, "epoch": 1985} {"train_loss": -12.286422729492188, "global_step": 333510, "epoch": 1985} {"train_loss": -12.287887573242188, "global_step": 333511, "epoch": 1985} {"train_loss": -12.05663013458252, "global_step": 333512, "epoch": 1985} {"train_loss": -12.292726516723633, "global_step": 333513, "epoch": 1985} {"train_loss": -12.262752532958984, "global_step": 333514, "epoch": 1985} {"train_loss": -12.50710391998291, "global_step": 333515, "epoch": 1985} {"train_loss": -12.1503324508667, "global_step": 333516, "epoch": 1985} {"train_loss": -12.31888484954834, "global_step": 333517, "epoch": 1985} {"train_loss": -12.358659744262695, "global_step": 333518, "epoch": 1985} {"train_loss": -12.260287284851074, "global_step": 333519, "epoch": 1985} {"train_loss": -12.506624221801758, "global_step": 333520, "epoch": 1985} {"train_loss": -12.388776779174805, "global_step": 333521, "epoch": 1985} {"train_loss": -12.426359176635742, "global_step": 333522, "epoch": 1985} {"train_loss": -12.196662902832031, "global_step": 333523, "epoch": 1985} {"train_loss": -12.155752182006836, "global_step": 333524, "epoch": 1985} {"train_loss": -12.275588035583496, "global_step": 333525, "epoch": 1985} {"train_loss": -12.485322952270508, "global_step": 333526, "epoch": 1985} {"train_loss": -12.139513969421387, "global_step": 333527, "epoch": 1985} {"train_loss": -12.160959243774414, "global_step": 333528, "epoch": 1985} {"train_loss": -12.384568214416504, "global_step": 333529, "epoch": 1985} {"train_loss": -12.26783561706543, "global_step": 333530, "epoch": 1985} {"train_loss": -12.243881225585938, "global_step": 333531, "epoch": 1985} {"train_loss": -12.167311668395996, "global_step": 333532, "epoch": 1985} {"train_loss": -12.293867111206055, "global_step": 333533, "epoch": 1985} {"train_loss": -11.728048324584961, "global_step": 333534, "epoch": 1985} {"train_loss": -11.92953872680664, "global_step": 333535, "epoch": 1985} {"train_loss": -12.468032836914062, "global_step": 333536, "epoch": 1985} {"train_loss": -11.989904403686523, "global_step": 333537, "epoch": 1985} {"train_loss": -12.179560661315918, "global_step": 333538, "epoch": 1985} {"train_loss": -11.824775695800781, "global_step": 333539, "epoch": 1985} {"train_loss": -11.376259803771973, "global_step": 333540, "epoch": 1985} {"train_loss": -10.808879852294922, "global_step": 333541, "epoch": 1985} {"train_loss": -11.240734100341797, "global_step": 333542, "epoch": 1985} {"train_loss": -11.762958526611328, "global_step": 333543, "epoch": 1985} {"train_loss": -10.557707786560059, "global_step": 333544, "epoch": 1985} {"train_loss": -11.512084007263184, "global_step": 333545, "epoch": 1985} {"train_loss": -10.681632995605469, "global_step": 333546, "epoch": 1985} {"train_loss": -11.585935592651367, "global_step": 333547, "epoch": 1985} {"train_loss": -10.518651962280273, "global_step": 333548, "epoch": 1985} {"train_loss": -11.496651649475098, "global_step": 333549, "epoch": 1985} {"train_loss": -9.85097885131836, "global_step": 333550, "epoch": 1985} {"train_loss": -12.015499114990234, "global_step": 333551, "epoch": 1985} {"train_loss": -10.085533142089844, "global_step": 333552, "epoch": 1985} {"train_loss": -9.92742919921875, "global_step": 333553, "epoch": 1985} {"train_loss": -11.167724609375, "global_step": 333554, "epoch": 1985} {"train_loss": -9.517145156860352, "global_step": 333555, "epoch": 1985} {"train_loss": -11.556806564331055, "global_step": 333556, "epoch": 1985} {"train_loss": -11.287996292114258, "global_step": 333557, "epoch": 1985} {"train_loss": -10.414173126220703, "global_step": 333558, "epoch": 1985} {"train_loss": -11.433309555053711, "global_step": 333559, "epoch": 1985} {"train_loss": -10.716524124145508, "global_step": 333560, "epoch": 1985} {"train_loss": -10.769329071044922, "global_step": 333561, "epoch": 1985} {"train_loss": -10.094073295593262, "global_step": 333562, "epoch": 1985} {"train_loss": -10.71566390991211, "global_step": 333563, "epoch": 1985} {"train_loss": -10.847704887390137, "global_step": 333564, "epoch": 1985} {"train_loss": -10.145009994506836, "global_step": 333565, "epoch": 1985} {"train_loss": -10.554728507995605, "global_step": 333566, "epoch": 1985} {"train_loss": -10.636032104492188, "global_step": 333567, "epoch": 1985} {"train_loss": -11.324085235595703, "global_step": 333568, "epoch": 1985} {"train_loss": -10.20521354675293, "global_step": 333569, "epoch": 1985} {"train_loss": -11.67213249206543, "global_step": 333570, "epoch": 1985} {"train_loss": -11.375537872314453, "global_step": 333571, "epoch": 1985} {"train_loss": -11.388029098510742, "global_step": 333572, "epoch": 1985} {"train_loss": -12.002829551696777, "global_step": 333573, "epoch": 1985} {"train_loss": -11.5153169631958, "global_step": 333574, "epoch": 1985} {"train_loss": -11.608686447143555, "global_step": 333575, "epoch": 1985} {"train_loss": -11.54732894897461, "global_step": 333576, "epoch": 1985} {"train_loss": -11.17502498626709, "global_step": 333577, "epoch": 1985} {"train_loss": -11.558826446533203, "global_step": 333578, "epoch": 1985} {"train_loss": -12.051305770874023, "global_step": 333579, "epoch": 1985} {"train_loss": -11.597041130065918, "global_step": 333580, "epoch": 1985} {"train_loss": -11.681509017944336, "global_step": 333581, "epoch": 1985} {"train_loss": -11.710655212402344, "global_step": 333582, "epoch": 1985} {"train_loss": -11.554946899414062, "global_step": 333583, "epoch": 1985} {"train_loss": -12.028083801269531, "global_step": 333584, "epoch": 1985} {"train_loss": -11.746514320373535, "global_step": 333585, "epoch": 1985} {"train_loss": -11.908565521240234, "global_step": 333586, "epoch": 1985} {"train_loss": -12.126970291137695, "global_step": 333587, "epoch": 1985} {"train_loss": -11.900838851928711, "global_step": 333588, "epoch": 1985} {"train_loss": -12.23558235168457, "global_step": 333589, "epoch": 1985} {"train_loss": -11.902435302734375, "global_step": 333590, "epoch": 1985} {"train_loss": -12.163336753845215, "global_step": 333591, "epoch": 1985} {"train_loss": -12.008102416992188, "global_step": 333592, "epoch": 1985} {"train_loss": -11.900337219238281, "global_step": 333593, "epoch": 1985} {"train_loss": -12.355262756347656, "global_step": 333594, "epoch": 1985} {"train_loss": -12.125215530395508, "global_step": 333595, "epoch": 1985} {"train_loss": -12.010168075561523, "global_step": 333596, "epoch": 1985} {"train_loss": -12.033714294433594, "global_step": 333597, "epoch": 1985} {"train_loss": -12.083072662353516, "global_step": 333598, "epoch": 1985} {"train_loss": -12.090499877929688, "global_step": 333599, "epoch": 1985} {"train_loss": -12.108489990234375, "global_step": 333600, "epoch": 1985} {"train_loss": -11.95555305480957, "global_step": 333601, "epoch": 1985} {"train_loss": -11.813408851623535, "global_step": 333602, "epoch": 1985} {"train_loss": -11.971649169921875, "global_step": 333603, "epoch": 1985} {"train_loss": -12.01133918762207, "global_step": 333604, "epoch": 1985} {"train_loss": -12.189566612243652, "global_step": 333605, "epoch": 1985} {"train_loss": -12.107355117797852, "global_step": 333606, "epoch": 1985} {"train_loss": -12.135176658630371, "global_step": 333607, "epoch": 1985} {"train_loss": -12.234529495239258, "global_step": 333608, "epoch": 1985} {"train_loss": -12.08880615234375, "global_step": 333609, "epoch": 1985} {"train_loss": -12.141286849975586, "global_step": 333610, "epoch": 1985} {"train_loss": -12.208032608032227, "global_step": 333611, "epoch": 1985} {"train_loss": -12.159530639648438, "global_step": 333612, "epoch": 1985} {"train_loss": -12.03291130065918, "global_step": 333613, "epoch": 1985} {"train_loss": -12.028841018676758, "global_step": 333614, "epoch": 1985} {"train_loss": -11.939775466918945, "global_step": 333615, "epoch": 1985} {"train_loss": -12.12915325164795, "global_step": 333616, "epoch": 1985} {"train_loss": -11.913326263427734, "global_step": 333617, "epoch": 1985} {"train_loss": -11.635396957397461, "global_step": 333618, "epoch": 1985} {"train_loss": -12.377763748168945, "global_step": 333619, "epoch": 1985} {"train_loss": -11.639169692993164, "global_step": 333620, "epoch": 1985} {"train_loss": -11.940299987792969, "global_step": 333621, "epoch": 1985} {"train_loss": -12.400154113769531, "global_step": 333622, "epoch": 1985} {"train_loss": -12.042957305908203, "global_step": 333623, "epoch": 1985} {"train_loss": -12.44314193725586, "global_step": 333624, "epoch": 1985} {"train_loss": -12.287151336669922, "global_step": 333625, "epoch": 1985} {"train_loss": -12.121423721313477, "global_step": 333626, "epoch": 1985} {"train_loss": -12.200154304504395, "global_step": 333627, "epoch": 1985} {"train_loss": -12.23601245880127, "global_step": 333628, "epoch": 1985} {"train_loss": -12.339866638183594, "global_step": 333629, "epoch": 1985} {"train_loss": -12.148366928100586, "global_step": 333630, "epoch": 1985} {"train_loss": -12.375679016113281, "global_step": 333631, "epoch": 1985} {"train_loss": -12.23898983001709, "global_step": 333632, "epoch": 1985} {"train_loss": -12.384998321533203, "global_step": 333633, "epoch": 1985} {"train_loss": -12.133331298828125, "global_step": 333634, "epoch": 1985} {"train_loss": -12.438039779663086, "global_step": 333635, "epoch": 1985} {"train_loss": -12.439509391784668, "global_step": 333636, "epoch": 1985} {"train_loss": -12.341087341308594, "global_step": 333637, "epoch": 1985} {"train_loss": -12.481575012207031, "global_step": 333638, "epoch": 1985} {"train_loss": -12.322477340698242, "global_step": 333639, "epoch": 1985} {"train_loss": -12.525636672973633, "global_step": 333640, "epoch": 1985} {"train_loss": -11.898317337036133, "global_step": 333641, "epoch": 1985} {"train_loss": -12.266557693481445, "global_step": 333642, "epoch": 1985} {"train_loss": -12.305700302124023, "global_step": 333643, "epoch": 1985} {"train_loss": -12.245704650878906, "global_step": 333644, "epoch": 1985} {"train_loss": -12.41823959350586, "global_step": 333645, "epoch": 1985} {"train_loss": -12.189597129821777, "global_step": 333646, "epoch": 1985} {"train_loss": -11.843151904287792, "global_step": 333647, "epoch": 1985, "val_loss": 287087.8125, "train_action_mse_error": 0.7112526893615723} {"train_loss": -12.123659133911133, "global_step": 333648, "epoch": 1986} {"train_loss": -12.337567329406738, "global_step": 333649, "epoch": 1986} {"train_loss": -12.209052085876465, "global_step": 333650, "epoch": 1986} {"train_loss": -12.03584098815918, "global_step": 333651, "epoch": 1986} {"train_loss": -11.56380558013916, "global_step": 333652, "epoch": 1986} {"train_loss": -11.908864974975586, "global_step": 333653, "epoch": 1986} {"train_loss": -12.110895156860352, "global_step": 333654, "epoch": 1986} {"train_loss": -11.797903060913086, "global_step": 333655, "epoch": 1986} {"train_loss": -11.324382781982422, "global_step": 333656, "epoch": 1986} {"train_loss": -12.367158889770508, "global_step": 333657, "epoch": 1986} {"train_loss": -11.449697494506836, "global_step": 333658, "epoch": 1986} {"train_loss": -10.881915092468262, "global_step": 333659, "epoch": 1986} {"train_loss": -11.449007034301758, "global_step": 333660, "epoch": 1986} {"train_loss": -11.315387725830078, "global_step": 333661, "epoch": 1986} {"train_loss": -11.477581024169922, "global_step": 333662, "epoch": 1986} {"train_loss": -11.386215209960938, "global_step": 333663, "epoch": 1986} {"train_loss": -11.72856330871582, "global_step": 333664, "epoch": 1986} {"train_loss": -10.730728149414062, "global_step": 333665, "epoch": 1986} {"train_loss": -11.122615814208984, "global_step": 333666, "epoch": 1986} {"train_loss": -10.942429542541504, "global_step": 333667, "epoch": 1986} {"train_loss": -10.162660598754883, "global_step": 333668, "epoch": 1986} {"train_loss": -12.045005798339844, "global_step": 333669, "epoch": 1986} {"train_loss": -10.637992858886719, "global_step": 333670, "epoch": 1986} {"train_loss": -11.627464294433594, "global_step": 333671, "epoch": 1986} {"train_loss": -11.095514297485352, "global_step": 333672, "epoch": 1986} {"train_loss": -11.257566452026367, "global_step": 333673, "epoch": 1986} {"train_loss": -10.829079627990723, "global_step": 333674, "epoch": 1986} {"train_loss": -10.973154067993164, "global_step": 333675, "epoch": 1986} {"train_loss": -10.823909759521484, "global_step": 333676, "epoch": 1986} {"train_loss": -11.028312683105469, "global_step": 333677, "epoch": 1986} {"train_loss": -11.290067672729492, "global_step": 333678, "epoch": 1986} {"train_loss": -11.877365112304688, "global_step": 333679, "epoch": 1986} {"train_loss": -11.244538307189941, "global_step": 333680, "epoch": 1986} {"train_loss": -11.828778266906738, "global_step": 333681, "epoch": 1986} {"train_loss": -11.749673843383789, "global_step": 333682, "epoch": 1986} {"train_loss": -11.36895751953125, "global_step": 333683, "epoch": 1986} {"train_loss": -11.895071983337402, "global_step": 333684, "epoch": 1986} {"train_loss": -11.432113647460938, "global_step": 333685, "epoch": 1986} {"train_loss": -12.036285400390625, "global_step": 333686, "epoch": 1986} {"train_loss": -12.056098937988281, "global_step": 333687, "epoch": 1986} {"train_loss": -11.716451644897461, "global_step": 333688, "epoch": 1986} {"train_loss": -11.511693000793457, "global_step": 333689, "epoch": 1986} {"train_loss": -11.955300331115723, "global_step": 333690, "epoch": 1986} {"train_loss": -11.664000511169434, "global_step": 333691, "epoch": 1986} {"train_loss": -11.957070350646973, "global_step": 333692, "epoch": 1986} {"train_loss": -11.928668975830078, "global_step": 333693, "epoch": 1986} {"train_loss": -11.888090133666992, "global_step": 333694, "epoch": 1986} {"train_loss": -11.807075500488281, "global_step": 333695, "epoch": 1986} {"train_loss": -11.848886489868164, "global_step": 333696, "epoch": 1986} {"train_loss": -11.794289588928223, "global_step": 333697, "epoch": 1986} {"train_loss": -11.681940078735352, "global_step": 333698, "epoch": 1986} {"train_loss": -12.220162391662598, "global_step": 333699, "epoch": 1986} {"train_loss": -11.598616600036621, "global_step": 333700, "epoch": 1986} {"train_loss": -12.170069694519043, "global_step": 333701, "epoch": 1986} {"train_loss": -12.249309539794922, "global_step": 333702, "epoch": 1986} {"train_loss": -12.173800468444824, "global_step": 333703, "epoch": 1986} {"train_loss": -11.85616683959961, "global_step": 333704, "epoch": 1986} {"train_loss": -11.93641185760498, "global_step": 333705, "epoch": 1986} {"train_loss": -12.10743522644043, "global_step": 333706, "epoch": 1986} {"train_loss": -12.069281578063965, "global_step": 333707, "epoch": 1986} {"train_loss": -12.179723739624023, "global_step": 333708, "epoch": 1986} {"train_loss": -12.177504539489746, "global_step": 333709, "epoch": 1986} {"train_loss": -12.309534072875977, "global_step": 333710, "epoch": 1986} {"train_loss": -12.171993255615234, "global_step": 333711, "epoch": 1986} {"train_loss": -12.18533706665039, "global_step": 333712, "epoch": 1986} {"train_loss": -12.095404624938965, "global_step": 333713, "epoch": 1986} {"train_loss": -12.295475006103516, "global_step": 333714, "epoch": 1986} {"train_loss": -12.050046920776367, "global_step": 333715, "epoch": 1986} {"train_loss": -12.131648063659668, "global_step": 333716, "epoch": 1986} {"train_loss": -12.242855072021484, "global_step": 333717, "epoch": 1986} {"train_loss": -12.50358772277832, "global_step": 333718, "epoch": 1986} {"train_loss": -12.231857299804688, "global_step": 333719, "epoch": 1986} {"train_loss": -12.292577743530273, "global_step": 333720, "epoch": 1986} {"train_loss": -12.419504165649414, "global_step": 333721, "epoch": 1986} {"train_loss": -12.396787643432617, "global_step": 333722, "epoch": 1986} {"train_loss": -12.439952850341797, "global_step": 333723, "epoch": 1986} {"train_loss": -12.489497184753418, "global_step": 333724, "epoch": 1986} {"train_loss": -12.405274391174316, "global_step": 333725, "epoch": 1986} {"train_loss": -12.454680442810059, "global_step": 333726, "epoch": 1986} {"train_loss": -12.45079517364502, "global_step": 333727, "epoch": 1986} {"train_loss": -12.310527801513672, "global_step": 333728, "epoch": 1986} {"train_loss": -12.460498809814453, "global_step": 333729, "epoch": 1986} {"train_loss": -12.524794578552246, "global_step": 333730, "epoch": 1986} {"train_loss": -12.360342025756836, "global_step": 333731, "epoch": 1986} {"train_loss": -12.465904235839844, "global_step": 333732, "epoch": 1986} {"train_loss": -12.420465469360352, "global_step": 333733, "epoch": 1986} {"train_loss": -12.195082664489746, "global_step": 333734, "epoch": 1986} {"train_loss": -12.23460865020752, "global_step": 333735, "epoch": 1986} {"train_loss": -11.902434349060059, "global_step": 333736, "epoch": 1986} {"train_loss": -11.884864807128906, "global_step": 333737, "epoch": 1986} {"train_loss": -11.974515914916992, "global_step": 333738, "epoch": 1986} {"train_loss": -12.31541919708252, "global_step": 333739, "epoch": 1986} {"train_loss": -11.671058654785156, "global_step": 333740, "epoch": 1986} {"train_loss": -12.215819358825684, "global_step": 333741, "epoch": 1986} {"train_loss": -11.89273452758789, "global_step": 333742, "epoch": 1986} {"train_loss": -12.178141593933105, "global_step": 333743, "epoch": 1986} {"train_loss": -12.08694076538086, "global_step": 333744, "epoch": 1986} {"train_loss": -12.26671314239502, "global_step": 333745, "epoch": 1986} {"train_loss": -12.117879867553711, "global_step": 333746, "epoch": 1986} {"train_loss": -12.37569808959961, "global_step": 333747, "epoch": 1986} {"train_loss": -12.468223571777344, "global_step": 333748, "epoch": 1986} {"train_loss": -12.21123218536377, "global_step": 333749, "epoch": 1986} {"train_loss": -12.476593017578125, "global_step": 333750, "epoch": 1986} {"train_loss": -12.567752838134766, "global_step": 333751, "epoch": 1986} {"train_loss": -12.440984725952148, "global_step": 333752, "epoch": 1986} {"train_loss": -12.659374237060547, "global_step": 333753, "epoch": 1986} {"train_loss": -12.646387100219727, "global_step": 333754, "epoch": 1986} {"train_loss": -12.378856658935547, "global_step": 333755, "epoch": 1986} {"train_loss": -12.39816951751709, "global_step": 333756, "epoch": 1986} {"train_loss": -12.084579467773438, "global_step": 333757, "epoch": 1986} {"train_loss": -12.28725814819336, "global_step": 333758, "epoch": 1986} {"train_loss": -12.379531860351562, "global_step": 333759, "epoch": 1986} {"train_loss": -12.101587295532227, "global_step": 333760, "epoch": 1986} {"train_loss": -12.569884300231934, "global_step": 333761, "epoch": 1986} {"train_loss": -12.604106903076172, "global_step": 333762, "epoch": 1986} {"train_loss": -12.461702346801758, "global_step": 333763, "epoch": 1986} {"train_loss": -12.4554443359375, "global_step": 333764, "epoch": 1986} {"train_loss": -12.559791564941406, "global_step": 333765, "epoch": 1986} {"train_loss": -12.150687217712402, "global_step": 333766, "epoch": 1986} {"train_loss": -11.764713287353516, "global_step": 333767, "epoch": 1986} {"train_loss": -12.221805572509766, "global_step": 333768, "epoch": 1986} {"train_loss": -12.290349960327148, "global_step": 333769, "epoch": 1986} {"train_loss": -10.912432670593262, "global_step": 333770, "epoch": 1986} {"train_loss": -10.398219108581543, "global_step": 333771, "epoch": 1986} {"train_loss": -12.569256782531738, "global_step": 333772, "epoch": 1986} {"train_loss": -10.528863906860352, "global_step": 333773, "epoch": 1986} {"train_loss": -12.005634307861328, "global_step": 333774, "epoch": 1986} {"train_loss": -10.621569633483887, "global_step": 333775, "epoch": 1986} {"train_loss": -10.796674728393555, "global_step": 333776, "epoch": 1986} {"train_loss": -11.805259704589844, "global_step": 333777, "epoch": 1986} {"train_loss": -10.667699813842773, "global_step": 333778, "epoch": 1986} {"train_loss": -12.203033447265625, "global_step": 333779, "epoch": 1986} {"train_loss": -10.54831314086914, "global_step": 333780, "epoch": 1986} {"train_loss": -11.810089111328125, "global_step": 333781, "epoch": 1986} {"train_loss": -10.708338737487793, "global_step": 333782, "epoch": 1986} {"train_loss": -10.766120910644531, "global_step": 333783, "epoch": 1986} {"train_loss": -11.52831745147705, "global_step": 333784, "epoch": 1986} {"train_loss": -10.51931095123291, "global_step": 333785, "epoch": 1986} {"train_loss": -12.236876487731934, "global_step": 333786, "epoch": 1986} {"train_loss": -10.594182968139648, "global_step": 333787, "epoch": 1986} {"train_loss": -12.254737854003906, "global_step": 333788, "epoch": 1986} {"train_loss": -11.258647918701172, "global_step": 333789, "epoch": 1986} {"train_loss": -11.715205192565918, "global_step": 333790, "epoch": 1986} {"train_loss": -11.897777557373047, "global_step": 333791, "epoch": 1986} {"train_loss": -11.81768798828125, "global_step": 333792, "epoch": 1986} {"train_loss": -11.707538604736328, "global_step": 333793, "epoch": 1986} {"train_loss": -11.707619667053223, "global_step": 333794, "epoch": 1986} {"train_loss": -12.010814666748047, "global_step": 333795, "epoch": 1986} {"train_loss": -11.701894760131836, "global_step": 333796, "epoch": 1986} {"train_loss": -10.902115821838379, "global_step": 333797, "epoch": 1986} {"train_loss": -11.51343822479248, "global_step": 333798, "epoch": 1986} {"train_loss": -11.4303560256958, "global_step": 333799, "epoch": 1986} {"train_loss": -11.906557083129883, "global_step": 333800, "epoch": 1986} {"train_loss": -12.048576354980469, "global_step": 333801, "epoch": 1986} {"train_loss": -11.922577857971191, "global_step": 333802, "epoch": 1986} {"train_loss": -11.961555480957031, "global_step": 333803, "epoch": 1986} {"train_loss": -11.781614303588867, "global_step": 333804, "epoch": 1986} {"train_loss": -12.054594039916992, "global_step": 333805, "epoch": 1986} {"train_loss": -11.710626602172852, "global_step": 333806, "epoch": 1986} {"train_loss": -12.094562530517578, "global_step": 333807, "epoch": 1986} {"train_loss": -11.854047775268555, "global_step": 333808, "epoch": 1986} {"train_loss": -12.082746505737305, "global_step": 333809, "epoch": 1986} {"train_loss": -12.20817756652832, "global_step": 333810, "epoch": 1986} {"train_loss": -12.092399597167969, "global_step": 333811, "epoch": 1986} {"train_loss": -11.988176345825195, "global_step": 333812, "epoch": 1986} {"train_loss": -12.262914657592773, "global_step": 333813, "epoch": 1986} {"train_loss": -12.145018577575684, "global_step": 333814, "epoch": 1986} {"train_loss": -11.861568456604367, "global_step": 333815, "epoch": 1986, "val_loss": 288145.375} {"train_loss": -11.531898498535156, "global_step": 333816, "epoch": 1987} {"train_loss": -12.199525833129883, "global_step": 333817, "epoch": 1987} {"train_loss": -11.902776718139648, "global_step": 333818, "epoch": 1987} {"train_loss": -11.938577651977539, "global_step": 333819, "epoch": 1987} {"train_loss": -12.195539474487305, "global_step": 333820, "epoch": 1987} {"train_loss": -11.942123413085938, "global_step": 333821, "epoch": 1987} {"train_loss": -12.123826026916504, "global_step": 333822, "epoch": 1987} {"train_loss": -12.081620216369629, "global_step": 333823, "epoch": 1987} {"train_loss": -11.682785987854004, "global_step": 333824, "epoch": 1987} {"train_loss": -11.439990997314453, "global_step": 333825, "epoch": 1987} {"train_loss": -11.593354225158691, "global_step": 333826, "epoch": 1987} {"train_loss": -11.576181411743164, "global_step": 333827, "epoch": 1987} {"train_loss": -11.999096870422363, "global_step": 333828, "epoch": 1987} {"train_loss": -11.827688217163086, "global_step": 333829, "epoch": 1987} {"train_loss": -11.855870246887207, "global_step": 333830, "epoch": 1987} {"train_loss": -11.896445274353027, "global_step": 333831, "epoch": 1987} {"train_loss": -12.10069465637207, "global_step": 333832, "epoch": 1987} {"train_loss": -11.257465362548828, "global_step": 333833, "epoch": 1987} {"train_loss": -12.056584358215332, "global_step": 333834, "epoch": 1987} {"train_loss": -11.211186408996582, "global_step": 333835, "epoch": 1987} {"train_loss": -11.861494064331055, "global_step": 333836, "epoch": 1987} {"train_loss": -11.424018859863281, "global_step": 333837, "epoch": 1987} {"train_loss": -11.919275283813477, "global_step": 333838, "epoch": 1987} {"train_loss": -11.802515983581543, "global_step": 333839, "epoch": 1987} {"train_loss": -11.603002548217773, "global_step": 333840, "epoch": 1987} {"train_loss": -11.74424934387207, "global_step": 333841, "epoch": 1987} {"train_loss": -11.500162124633789, "global_step": 333842, "epoch": 1987} {"train_loss": -11.83140754699707, "global_step": 333843, "epoch": 1987} {"train_loss": -11.297958374023438, "global_step": 333844, "epoch": 1987} {"train_loss": -11.721540451049805, "global_step": 333845, "epoch": 1987} {"train_loss": -11.194589614868164, "global_step": 333846, "epoch": 1987} {"train_loss": -11.141775131225586, "global_step": 333847, "epoch": 1987} {"train_loss": -11.459821701049805, "global_step": 333848, "epoch": 1987} {"train_loss": -10.0635404586792, "global_step": 333849, "epoch": 1987} {"train_loss": -11.782230377197266, "global_step": 333850, "epoch": 1987} {"train_loss": -10.555916786193848, "global_step": 333851, "epoch": 1987} {"train_loss": -11.995504379272461, "global_step": 333852, "epoch": 1987} {"train_loss": -10.810247421264648, "global_step": 333853, "epoch": 1987} {"train_loss": -12.053410530090332, "global_step": 333854, "epoch": 1987} {"train_loss": -10.818046569824219, "global_step": 333855, "epoch": 1987} {"train_loss": -11.949509620666504, "global_step": 333856, "epoch": 1987} {"train_loss": -11.11177921295166, "global_step": 333857, "epoch": 1987} {"train_loss": -12.07228946685791, "global_step": 333858, "epoch": 1987} {"train_loss": -11.431830406188965, "global_step": 333859, "epoch": 1987} {"train_loss": -11.96142578125, "global_step": 333860, "epoch": 1987} {"train_loss": -11.577314376831055, "global_step": 333861, "epoch": 1987} {"train_loss": -11.977270126342773, "global_step": 333862, "epoch": 1987} {"train_loss": -11.869701385498047, "global_step": 333863, "epoch": 1987} {"train_loss": -12.003472328186035, "global_step": 333864, "epoch": 1987} {"train_loss": -11.75454330444336, "global_step": 333865, "epoch": 1987} {"train_loss": -11.957233428955078, "global_step": 333866, "epoch": 1987} {"train_loss": -11.99746036529541, "global_step": 333867, "epoch": 1987} {"train_loss": -12.122678756713867, "global_step": 333868, "epoch": 1987} {"train_loss": -11.881369590759277, "global_step": 333869, "epoch": 1987} {"train_loss": -11.878488540649414, "global_step": 333870, "epoch": 1987} {"train_loss": -11.766145706176758, "global_step": 333871, "epoch": 1987} {"train_loss": -11.704924583435059, "global_step": 333872, "epoch": 1987} {"train_loss": -11.855243682861328, "global_step": 333873, "epoch": 1987} {"train_loss": -11.81929874420166, "global_step": 333874, "epoch": 1987} {"train_loss": -12.028663635253906, "global_step": 333875, "epoch": 1987} {"train_loss": -12.1864595413208, "global_step": 333876, "epoch": 1987} {"train_loss": -12.150253295898438, "global_step": 333877, "epoch": 1987} {"train_loss": -12.299830436706543, "global_step": 333878, "epoch": 1987} {"train_loss": -12.044307708740234, "global_step": 333879, "epoch": 1987} {"train_loss": -12.33476734161377, "global_step": 333880, "epoch": 1987} {"train_loss": -11.923712730407715, "global_step": 333881, "epoch": 1987} {"train_loss": -12.282675743103027, "global_step": 333882, "epoch": 1987} {"train_loss": -12.075474739074707, "global_step": 333883, "epoch": 1987} {"train_loss": -12.326131820678711, "global_step": 333884, "epoch": 1987} {"train_loss": -12.156472206115723, "global_step": 333885, "epoch": 1987} {"train_loss": -12.58102798461914, "global_step": 333886, "epoch": 1987} {"train_loss": -12.115471839904785, "global_step": 333887, "epoch": 1987} {"train_loss": -12.324796676635742, "global_step": 333888, "epoch": 1987} {"train_loss": -12.221941947937012, "global_step": 333889, "epoch": 1987} {"train_loss": -12.364557266235352, "global_step": 333890, "epoch": 1987} {"train_loss": -12.152297973632812, "global_step": 333891, "epoch": 1987} {"train_loss": -12.102666854858398, "global_step": 333892, "epoch": 1987} {"train_loss": -12.2124605178833, "global_step": 333893, "epoch": 1987} {"train_loss": -12.262170791625977, "global_step": 333894, "epoch": 1987} {"train_loss": -12.137977600097656, "global_step": 333895, "epoch": 1987} {"train_loss": -12.517356872558594, "global_step": 333896, "epoch": 1987} {"train_loss": -12.113380432128906, "global_step": 333897, "epoch": 1987} {"train_loss": -12.329252243041992, "global_step": 333898, "epoch": 1987} {"train_loss": -12.373363494873047, "global_step": 333899, "epoch": 1987} {"train_loss": -12.67436408996582, "global_step": 333900, "epoch": 1987} {"train_loss": -12.467823028564453, "global_step": 333901, "epoch": 1987} {"train_loss": -12.445137977600098, "global_step": 333902, "epoch": 1987} {"train_loss": -12.686286926269531, "global_step": 333903, "epoch": 1987} {"train_loss": -12.271907806396484, "global_step": 333904, "epoch": 1987} {"train_loss": -12.50057601928711, "global_step": 333905, "epoch": 1987} {"train_loss": -12.454145431518555, "global_step": 333906, "epoch": 1987} {"train_loss": -12.456379890441895, "global_step": 333907, "epoch": 1987} {"train_loss": -12.48959732055664, "global_step": 333908, "epoch": 1987} {"train_loss": -12.656797409057617, "global_step": 333909, "epoch": 1987} {"train_loss": -12.415814399719238, "global_step": 333910, "epoch": 1987} {"train_loss": -12.574920654296875, "global_step": 333911, "epoch": 1987} {"train_loss": -12.577800750732422, "global_step": 333912, "epoch": 1987} {"train_loss": -12.700965881347656, "global_step": 333913, "epoch": 1987} {"train_loss": -12.557832717895508, "global_step": 333914, "epoch": 1987} {"train_loss": -12.533613204956055, "global_step": 333915, "epoch": 1987} {"train_loss": -12.456474304199219, "global_step": 333916, "epoch": 1987} {"train_loss": -12.740616798400879, "global_step": 333917, "epoch": 1987} {"train_loss": -12.456056594848633, "global_step": 333918, "epoch": 1987} {"train_loss": -12.72614574432373, "global_step": 333919, "epoch": 1987} {"train_loss": -12.410778045654297, "global_step": 333920, "epoch": 1987} {"train_loss": -12.273983001708984, "global_step": 333921, "epoch": 1987} {"train_loss": -12.564311981201172, "global_step": 333922, "epoch": 1987} {"train_loss": -12.621496200561523, "global_step": 333923, "epoch": 1987} {"train_loss": -12.575204849243164, "global_step": 333924, "epoch": 1987} {"train_loss": -12.06466293334961, "global_step": 333925, "epoch": 1987} {"train_loss": -12.449337005615234, "global_step": 333926, "epoch": 1987} {"train_loss": -12.54311752319336, "global_step": 333927, "epoch": 1987} {"train_loss": -12.215757369995117, "global_step": 333928, "epoch": 1987} {"train_loss": -11.755069732666016, "global_step": 333929, "epoch": 1987} {"train_loss": -12.230499267578125, "global_step": 333930, "epoch": 1987} {"train_loss": -11.7880859375, "global_step": 333931, "epoch": 1987} {"train_loss": -12.571737289428711, "global_step": 333932, "epoch": 1987} {"train_loss": -11.57573413848877, "global_step": 333933, "epoch": 1987} {"train_loss": -12.334461212158203, "global_step": 333934, "epoch": 1987} {"train_loss": -12.07264518737793, "global_step": 333935, "epoch": 1987} {"train_loss": -12.436732292175293, "global_step": 333936, "epoch": 1987} {"train_loss": -12.414335250854492, "global_step": 333937, "epoch": 1987} {"train_loss": -12.64525318145752, "global_step": 333938, "epoch": 1987} {"train_loss": -12.285640716552734, "global_step": 333939, "epoch": 1987} {"train_loss": -11.859861373901367, "global_step": 333940, "epoch": 1987} {"train_loss": -12.277761459350586, "global_step": 333941, "epoch": 1987} {"train_loss": -12.014358520507812, "global_step": 333942, "epoch": 1987} {"train_loss": -12.67288589477539, "global_step": 333943, "epoch": 1987} {"train_loss": -12.403820037841797, "global_step": 333944, "epoch": 1987} {"train_loss": -12.693473815917969, "global_step": 333945, "epoch": 1987} {"train_loss": -12.405698776245117, "global_step": 333946, "epoch": 1987} {"train_loss": -12.246133804321289, "global_step": 333947, "epoch": 1987} {"train_loss": -11.649398803710938, "global_step": 333948, "epoch": 1987} {"train_loss": -11.777902603149414, "global_step": 333949, "epoch": 1987} {"train_loss": -11.657272338867188, "global_step": 333950, "epoch": 1987} {"train_loss": -12.477209091186523, "global_step": 333951, "epoch": 1987} {"train_loss": -11.334017753601074, "global_step": 333952, "epoch": 1987} {"train_loss": -11.563472747802734, "global_step": 333953, "epoch": 1987} {"train_loss": -11.586138725280762, "global_step": 333954, "epoch": 1987} {"train_loss": -12.497354507446289, "global_step": 333955, "epoch": 1987} {"train_loss": -12.085981369018555, "global_step": 333956, "epoch": 1987} {"train_loss": -11.880973815917969, "global_step": 333957, "epoch": 1987} {"train_loss": -10.539058685302734, "global_step": 333958, "epoch": 1987} {"train_loss": -12.334988594055176, "global_step": 333959, "epoch": 1987} {"train_loss": -11.782532691955566, "global_step": 333960, "epoch": 1987} {"train_loss": -10.852957725524902, "global_step": 333961, "epoch": 1987} {"train_loss": -11.944530487060547, "global_step": 333962, "epoch": 1987} {"train_loss": -12.23957633972168, "global_step": 333963, "epoch": 1987} {"train_loss": -9.565226554870605, "global_step": 333964, "epoch": 1987} {"train_loss": -11.842275619506836, "global_step": 333965, "epoch": 1987} {"train_loss": -11.201424598693848, "global_step": 333966, "epoch": 1987} {"train_loss": -11.365028381347656, "global_step": 333967, "epoch": 1987} {"train_loss": -12.282808303833008, "global_step": 333968, "epoch": 1987} {"train_loss": -11.424893379211426, "global_step": 333969, "epoch": 1987} {"train_loss": -11.340911865234375, "global_step": 333970, "epoch": 1987} {"train_loss": -12.321374893188477, "global_step": 333971, "epoch": 1987} {"train_loss": -11.45643424987793, "global_step": 333972, "epoch": 1987} {"train_loss": -10.903094291687012, "global_step": 333973, "epoch": 1987} {"train_loss": -12.355842590332031, "global_step": 333974, "epoch": 1987} {"train_loss": -11.61923885345459, "global_step": 333975, "epoch": 1987} {"train_loss": -11.660079956054688, "global_step": 333976, "epoch": 1987} {"train_loss": -11.694601058959961, "global_step": 333977, "epoch": 1987} {"train_loss": -12.337336540222168, "global_step": 333978, "epoch": 1987} {"train_loss": -11.588142395019531, "global_step": 333979, "epoch": 1987} {"train_loss": -11.835912704467773, "global_step": 333980, "epoch": 1987} {"train_loss": -11.778343200683594, "global_step": 333981, "epoch": 1987} {"train_loss": -11.529768943786621, "global_step": 333982, "epoch": 1987} {"train_loss": -11.969359244619097, "global_step": 333983, "epoch": 1987, "val_loss": 288909.5} {"train_loss": -12.394996643066406, "global_step": 333984, "epoch": 1988} {"train_loss": -12.290497779846191, "global_step": 333985, "epoch": 1988} {"train_loss": -12.268697738647461, "global_step": 333986, "epoch": 1988} {"train_loss": -12.233076095581055, "global_step": 333987, "epoch": 1988} {"train_loss": -12.153711318969727, "global_step": 333988, "epoch": 1988} {"train_loss": -12.194474220275879, "global_step": 333989, "epoch": 1988} {"train_loss": -12.255335807800293, "global_step": 333990, "epoch": 1988} {"train_loss": -11.904610633850098, "global_step": 333991, "epoch": 1988} {"train_loss": -12.476414680480957, "global_step": 333992, "epoch": 1988} {"train_loss": -11.913554191589355, "global_step": 333993, "epoch": 1988} {"train_loss": -12.029003143310547, "global_step": 333994, "epoch": 1988} {"train_loss": -12.093162536621094, "global_step": 333995, "epoch": 1988} {"train_loss": -12.110483169555664, "global_step": 333996, "epoch": 1988} {"train_loss": -12.161348342895508, "global_step": 333997, "epoch": 1988} {"train_loss": -11.983410835266113, "global_step": 333998, "epoch": 1988} {"train_loss": -12.137395858764648, "global_step": 333999, "epoch": 1988} {"train_loss": -11.858848571777344, "global_step": 334000, "epoch": 1988} {"train_loss": -11.863380432128906, "global_step": 334001, "epoch": 1988} {"train_loss": -11.780296325683594, "global_step": 334002, "epoch": 1988} {"train_loss": -10.560754776000977, "global_step": 334003, "epoch": 1988} {"train_loss": -11.614764213562012, "global_step": 334004, "epoch": 1988} {"train_loss": -11.987066268920898, "global_step": 334005, "epoch": 1988} {"train_loss": -10.61149787902832, "global_step": 334006, "epoch": 1988} {"train_loss": -11.38426685333252, "global_step": 334007, "epoch": 1988} {"train_loss": -11.22744369506836, "global_step": 334008, "epoch": 1988} {"train_loss": -10.227065086364746, "global_step": 334009, "epoch": 1988} {"train_loss": -11.054187774658203, "global_step": 334010, "epoch": 1988} {"train_loss": -10.076597213745117, "global_step": 334011, "epoch": 1988} {"train_loss": -11.284075736999512, "global_step": 334012, "epoch": 1988} {"train_loss": -9.178037643432617, "global_step": 334013, "epoch": 1988} {"train_loss": -10.951915740966797, "global_step": 334014, "epoch": 1988} {"train_loss": -9.050710678100586, "global_step": 334015, "epoch": 1988} {"train_loss": -11.661188125610352, "global_step": 334016, "epoch": 1988} {"train_loss": -8.449317932128906, "global_step": 334017, "epoch": 1988} {"train_loss": -9.286867141723633, "global_step": 334018, "epoch": 1988} {"train_loss": -10.496650695800781, "global_step": 334019, "epoch": 1988} {"train_loss": -9.802879333496094, "global_step": 334020, "epoch": 1988} {"train_loss": -10.71408748626709, "global_step": 334021, "epoch": 1988} {"train_loss": -8.52704906463623, "global_step": 334022, "epoch": 1988} {"train_loss": -10.627525329589844, "global_step": 334023, "epoch": 1988} {"train_loss": -10.296895027160645, "global_step": 334024, "epoch": 1988} {"train_loss": -10.01009464263916, "global_step": 334025, "epoch": 1988} {"train_loss": -9.731391906738281, "global_step": 334026, "epoch": 1988} {"train_loss": -10.786283493041992, "global_step": 334027, "epoch": 1988} {"train_loss": -10.507612228393555, "global_step": 334028, "epoch": 1988} {"train_loss": -9.359420776367188, "global_step": 334029, "epoch": 1988} {"train_loss": -11.741044044494629, "global_step": 334030, "epoch": 1988} {"train_loss": -9.947576522827148, "global_step": 334031, "epoch": 1988} {"train_loss": -11.150158882141113, "global_step": 334032, "epoch": 1988} {"train_loss": -10.183365821838379, "global_step": 334033, "epoch": 1988} {"train_loss": -10.376373291015625, "global_step": 334034, "epoch": 1988} {"train_loss": -10.781064987182617, "global_step": 334035, "epoch": 1988} {"train_loss": -11.01278305053711, "global_step": 334036, "epoch": 1988} {"train_loss": -11.395912170410156, "global_step": 334037, "epoch": 1988} {"train_loss": -10.48238754272461, "global_step": 334038, "epoch": 1988} {"train_loss": -11.740034103393555, "global_step": 334039, "epoch": 1988} {"train_loss": -10.685845375061035, "global_step": 334040, "epoch": 1988} {"train_loss": -11.0044527053833, "global_step": 334041, "epoch": 1988} {"train_loss": -11.260534286499023, "global_step": 334042, "epoch": 1988} {"train_loss": -10.840522766113281, "global_step": 334043, "epoch": 1988} {"train_loss": -11.429792404174805, "global_step": 334044, "epoch": 1988} {"train_loss": -11.480850219726562, "global_step": 334045, "epoch": 1988} {"train_loss": -11.729212760925293, "global_step": 334046, "epoch": 1988} {"train_loss": -11.451433181762695, "global_step": 334047, "epoch": 1988} {"train_loss": -11.974337577819824, "global_step": 334048, "epoch": 1988} {"train_loss": -11.82752799987793, "global_step": 334049, "epoch": 1988} {"train_loss": -11.639817237854004, "global_step": 334050, "epoch": 1988} {"train_loss": -12.166459083557129, "global_step": 334051, "epoch": 1988} {"train_loss": -11.722002029418945, "global_step": 334052, "epoch": 1988} {"train_loss": -12.109115600585938, "global_step": 334053, "epoch": 1988} {"train_loss": -11.620320320129395, "global_step": 334054, "epoch": 1988} {"train_loss": -11.893972396850586, "global_step": 334055, "epoch": 1988} {"train_loss": -11.706836700439453, "global_step": 334056, "epoch": 1988} {"train_loss": -11.86509895324707, "global_step": 334057, "epoch": 1988} {"train_loss": -11.88282585144043, "global_step": 334058, "epoch": 1988} {"train_loss": -11.848175048828125, "global_step": 334059, "epoch": 1988} {"train_loss": -12.00423526763916, "global_step": 334060, "epoch": 1988} {"train_loss": -11.726070404052734, "global_step": 334061, "epoch": 1988} {"train_loss": -12.011877059936523, "global_step": 334062, "epoch": 1988} {"train_loss": -12.007003784179688, "global_step": 334063, "epoch": 1988} {"train_loss": -12.14683723449707, "global_step": 334064, "epoch": 1988} {"train_loss": -12.224162101745605, "global_step": 334065, "epoch": 1988} {"train_loss": -12.008209228515625, "global_step": 334066, "epoch": 1988} {"train_loss": -12.241884231567383, "global_step": 334067, "epoch": 1988} {"train_loss": -12.196544647216797, "global_step": 334068, "epoch": 1988} {"train_loss": -12.232111930847168, "global_step": 334069, "epoch": 1988} {"train_loss": -12.239802360534668, "global_step": 334070, "epoch": 1988} {"train_loss": -12.122051239013672, "global_step": 334071, "epoch": 1988} {"train_loss": -12.182310104370117, "global_step": 334072, "epoch": 1988} {"train_loss": -12.135210037231445, "global_step": 334073, "epoch": 1988} {"train_loss": -11.878055572509766, "global_step": 334074, "epoch": 1988} {"train_loss": -12.351244926452637, "global_step": 334075, "epoch": 1988} {"train_loss": -12.037342071533203, "global_step": 334076, "epoch": 1988} {"train_loss": -12.171756744384766, "global_step": 334077, "epoch": 1988} {"train_loss": -12.10335922241211, "global_step": 334078, "epoch": 1988} {"train_loss": -12.367219924926758, "global_step": 334079, "epoch": 1988} {"train_loss": -12.241435050964355, "global_step": 334080, "epoch": 1988} {"train_loss": -12.377036094665527, "global_step": 334081, "epoch": 1988} {"train_loss": -12.339812278747559, "global_step": 334082, "epoch": 1988} {"train_loss": -12.376518249511719, "global_step": 334083, "epoch": 1988} {"train_loss": -12.340825080871582, "global_step": 334084, "epoch": 1988} {"train_loss": -12.327556610107422, "global_step": 334085, "epoch": 1988} {"train_loss": -12.340797424316406, "global_step": 334086, "epoch": 1988} {"train_loss": -12.205402374267578, "global_step": 334087, "epoch": 1988} {"train_loss": -12.20783805847168, "global_step": 334088, "epoch": 1988} {"train_loss": -12.407941818237305, "global_step": 334089, "epoch": 1988} {"train_loss": -12.200526237487793, "global_step": 334090, "epoch": 1988} {"train_loss": -12.306905746459961, "global_step": 334091, "epoch": 1988} {"train_loss": -12.28426742553711, "global_step": 334092, "epoch": 1988} {"train_loss": -12.435193061828613, "global_step": 334093, "epoch": 1988} {"train_loss": -12.291160583496094, "global_step": 334094, "epoch": 1988} {"train_loss": -12.059725761413574, "global_step": 334095, "epoch": 1988} {"train_loss": -12.39975357055664, "global_step": 334096, "epoch": 1988} {"train_loss": -12.141441345214844, "global_step": 334097, "epoch": 1988} {"train_loss": -12.40198040008545, "global_step": 334098, "epoch": 1988} {"train_loss": -12.146203994750977, "global_step": 334099, "epoch": 1988} {"train_loss": -12.581082344055176, "global_step": 334100, "epoch": 1988} {"train_loss": -12.254505157470703, "global_step": 334101, "epoch": 1988} {"train_loss": -12.341306686401367, "global_step": 334102, "epoch": 1988} {"train_loss": -12.044842720031738, "global_step": 334103, "epoch": 1988} {"train_loss": -12.363181114196777, "global_step": 334104, "epoch": 1988} {"train_loss": -12.190460205078125, "global_step": 334105, "epoch": 1988} {"train_loss": -12.361621856689453, "global_step": 334106, "epoch": 1988} {"train_loss": -12.06803035736084, "global_step": 334107, "epoch": 1988} {"train_loss": -12.341266632080078, "global_step": 334108, "epoch": 1988} {"train_loss": -12.437732696533203, "global_step": 334109, "epoch": 1988} {"train_loss": -12.275225639343262, "global_step": 334110, "epoch": 1988} {"train_loss": -12.430716514587402, "global_step": 334111, "epoch": 1988} {"train_loss": -12.429729461669922, "global_step": 334112, "epoch": 1988} {"train_loss": -12.4246826171875, "global_step": 334113, "epoch": 1988} {"train_loss": -12.568266868591309, "global_step": 334114, "epoch": 1988} {"train_loss": -12.504453659057617, "global_step": 334115, "epoch": 1988} {"train_loss": -12.50709056854248, "global_step": 334116, "epoch": 1988} {"train_loss": -12.6029634475708, "global_step": 334117, "epoch": 1988} {"train_loss": -12.486970901489258, "global_step": 334118, "epoch": 1988} {"train_loss": -12.397573471069336, "global_step": 334119, "epoch": 1988} {"train_loss": -12.47435188293457, "global_step": 334120, "epoch": 1988} {"train_loss": -12.406829833984375, "global_step": 334121, "epoch": 1988} {"train_loss": -12.503305435180664, "global_step": 334122, "epoch": 1988} {"train_loss": -12.616704940795898, "global_step": 334123, "epoch": 1988} {"train_loss": -12.350933074951172, "global_step": 334124, "epoch": 1988} {"train_loss": -12.422087669372559, "global_step": 334125, "epoch": 1988} {"train_loss": -12.321741104125977, "global_step": 334126, "epoch": 1988} {"train_loss": -12.530074119567871, "global_step": 334127, "epoch": 1988} {"train_loss": -12.667696952819824, "global_step": 334128, "epoch": 1988} {"train_loss": -12.382426261901855, "global_step": 334129, "epoch": 1988} {"train_loss": -12.638507843017578, "global_step": 334130, "epoch": 1988} {"train_loss": -12.500179290771484, "global_step": 334131, "epoch": 1988} {"train_loss": -12.370157241821289, "global_step": 334132, "epoch": 1988} {"train_loss": -12.525190353393555, "global_step": 334133, "epoch": 1988} {"train_loss": -12.637626647949219, "global_step": 334134, "epoch": 1988} {"train_loss": -12.485477447509766, "global_step": 334135, "epoch": 1988} {"train_loss": -12.11500072479248, "global_step": 334136, "epoch": 1988} {"train_loss": -12.41517448425293, "global_step": 334137, "epoch": 1988} {"train_loss": -12.3521728515625, "global_step": 334138, "epoch": 1988} {"train_loss": -12.190788269042969, "global_step": 334139, "epoch": 1988} {"train_loss": -12.616477012634277, "global_step": 334140, "epoch": 1988} {"train_loss": -11.675832748413086, "global_step": 334141, "epoch": 1988} {"train_loss": -9.469728469848633, "global_step": 334142, "epoch": 1988} {"train_loss": -9.250373840332031, "global_step": 334143, "epoch": 1988} {"train_loss": -11.391161918640137, "global_step": 334144, "epoch": 1988} {"train_loss": -11.940618515014648, "global_step": 334145, "epoch": 1988} {"train_loss": -9.235109329223633, "global_step": 334146, "epoch": 1988} {"train_loss": -11.770191192626953, "global_step": 334147, "epoch": 1988} {"train_loss": -11.106030464172363, "global_step": 334148, "epoch": 1988} {"train_loss": -8.069528579711914, "global_step": 334149, "epoch": 1988} {"train_loss": -9.456212997436523, "global_step": 334150, "epoch": 1988} {"train_loss": -11.672421750568208, "global_step": 334151, "epoch": 1988, "val_loss": 282466.1875} {"train_loss": -8.753910064697266, "global_step": 334152, "epoch": 1989} {"train_loss": -8.047356605529785, "global_step": 334153, "epoch": 1989} {"train_loss": -9.398555755615234, "global_step": 334154, "epoch": 1989} {"train_loss": -9.645179748535156, "global_step": 334155, "epoch": 1989} {"train_loss": -9.337099075317383, "global_step": 334156, "epoch": 1989} {"train_loss": -10.052501678466797, "global_step": 334157, "epoch": 1989} {"train_loss": -10.688711166381836, "global_step": 334158, "epoch": 1989} {"train_loss": -10.983351707458496, "global_step": 334159, "epoch": 1989} {"train_loss": -10.494043350219727, "global_step": 334160, "epoch": 1989} {"train_loss": -10.78526782989502, "global_step": 334161, "epoch": 1989} {"train_loss": -10.916340827941895, "global_step": 334162, "epoch": 1989} {"train_loss": -9.31859016418457, "global_step": 334163, "epoch": 1989} {"train_loss": -10.298933982849121, "global_step": 334164, "epoch": 1989} {"train_loss": -10.468733787536621, "global_step": 334165, "epoch": 1989} {"train_loss": -10.378144264221191, "global_step": 334166, "epoch": 1989} {"train_loss": -10.213578224182129, "global_step": 334167, "epoch": 1989} {"train_loss": -10.885322570800781, "global_step": 334168, "epoch": 1989} {"train_loss": -10.828611373901367, "global_step": 334169, "epoch": 1989} {"train_loss": -10.578786849975586, "global_step": 334170, "epoch": 1989} {"train_loss": -11.297585487365723, "global_step": 334171, "epoch": 1989} {"train_loss": -10.201242446899414, "global_step": 334172, "epoch": 1989} {"train_loss": -11.495201110839844, "global_step": 334173, "epoch": 1989} {"train_loss": -10.88086223602295, "global_step": 334174, "epoch": 1989} {"train_loss": -11.453203201293945, "global_step": 334175, "epoch": 1989} {"train_loss": -11.070610046386719, "global_step": 334176, "epoch": 1989} {"train_loss": -11.370311737060547, "global_step": 334177, "epoch": 1989} {"train_loss": -11.304590225219727, "global_step": 334178, "epoch": 1989} {"train_loss": -11.458931922912598, "global_step": 334179, "epoch": 1989} {"train_loss": -11.451313972473145, "global_step": 334180, "epoch": 1989} {"train_loss": -11.691205978393555, "global_step": 334181, "epoch": 1989} {"train_loss": -11.7339506149292, "global_step": 334182, "epoch": 1989} {"train_loss": -11.612281799316406, "global_step": 334183, "epoch": 1989} {"train_loss": -11.855819702148438, "global_step": 334184, "epoch": 1989} {"train_loss": -11.664273262023926, "global_step": 334185, "epoch": 1989} {"train_loss": -11.486324310302734, "global_step": 334186, "epoch": 1989} {"train_loss": -11.710824966430664, "global_step": 334187, "epoch": 1989} {"train_loss": -11.743586540222168, "global_step": 334188, "epoch": 1989} {"train_loss": -11.707606315612793, "global_step": 334189, "epoch": 1989} {"train_loss": -11.723008155822754, "global_step": 334190, "epoch": 1989} {"train_loss": -11.887568473815918, "global_step": 334191, "epoch": 1989} {"train_loss": -11.813264846801758, "global_step": 334192, "epoch": 1989} {"train_loss": -11.895269393920898, "global_step": 334193, "epoch": 1989} {"train_loss": -11.874914169311523, "global_step": 334194, "epoch": 1989} {"train_loss": -12.027566909790039, "global_step": 334195, "epoch": 1989} {"train_loss": -12.137012481689453, "global_step": 334196, "epoch": 1989} {"train_loss": -12.223102569580078, "global_step": 334197, "epoch": 1989} {"train_loss": -12.092437744140625, "global_step": 334198, "epoch": 1989} {"train_loss": -11.775490760803223, "global_step": 334199, "epoch": 1989} {"train_loss": -12.22895622253418, "global_step": 334200, "epoch": 1989} {"train_loss": -11.84776496887207, "global_step": 334201, "epoch": 1989} {"train_loss": -12.112977981567383, "global_step": 334202, "epoch": 1989} {"train_loss": -11.937565803527832, "global_step": 334203, "epoch": 1989} {"train_loss": -12.082035064697266, "global_step": 334204, "epoch": 1989} {"train_loss": -12.177389144897461, "global_step": 334205, "epoch": 1989} {"train_loss": -11.91422176361084, "global_step": 334206, "epoch": 1989} {"train_loss": -12.108969688415527, "global_step": 334207, "epoch": 1989} {"train_loss": -11.940971374511719, "global_step": 334208, "epoch": 1989} {"train_loss": -12.214174270629883, "global_step": 334209, "epoch": 1989} {"train_loss": -11.934104919433594, "global_step": 334210, "epoch": 1989} {"train_loss": -11.954837799072266, "global_step": 334211, "epoch": 1989} {"train_loss": -11.9927978515625, "global_step": 334212, "epoch": 1989} {"train_loss": -12.277315139770508, "global_step": 334213, "epoch": 1989} {"train_loss": -11.773490905761719, "global_step": 334214, "epoch": 1989} {"train_loss": -12.191399574279785, "global_step": 334215, "epoch": 1989} {"train_loss": -12.138846397399902, "global_step": 334216, "epoch": 1989} {"train_loss": -12.156256675720215, "global_step": 334217, "epoch": 1989} {"train_loss": -12.052330017089844, "global_step": 334218, "epoch": 1989} {"train_loss": -11.814697265625, "global_step": 334219, "epoch": 1989} {"train_loss": -12.3041410446167, "global_step": 334220, "epoch": 1989} {"train_loss": -11.99163818359375, "global_step": 334221, "epoch": 1989} {"train_loss": -12.153596878051758, "global_step": 334222, "epoch": 1989} {"train_loss": -12.089349746704102, "global_step": 334223, "epoch": 1989} {"train_loss": -12.267184257507324, "global_step": 334224, "epoch": 1989} {"train_loss": -12.162612915039062, "global_step": 334225, "epoch": 1989} {"train_loss": -12.173797607421875, "global_step": 334226, "epoch": 1989} {"train_loss": -12.150444030761719, "global_step": 334227, "epoch": 1989} {"train_loss": -12.136246681213379, "global_step": 334228, "epoch": 1989} {"train_loss": -11.90567398071289, "global_step": 334229, "epoch": 1989} {"train_loss": -12.24455451965332, "global_step": 334230, "epoch": 1989} {"train_loss": -12.094722747802734, "global_step": 334231, "epoch": 1989} {"train_loss": -12.209230422973633, "global_step": 334232, "epoch": 1989} {"train_loss": -11.8253755569458, "global_step": 334233, "epoch": 1989} {"train_loss": -12.233735084533691, "global_step": 334234, "epoch": 1989} {"train_loss": -12.226781845092773, "global_step": 334235, "epoch": 1989} {"train_loss": -12.22659683227539, "global_step": 334236, "epoch": 1989} {"train_loss": -12.230255126953125, "global_step": 334237, "epoch": 1989} {"train_loss": -11.925098419189453, "global_step": 334238, "epoch": 1989} {"train_loss": -12.26817512512207, "global_step": 334239, "epoch": 1989} {"train_loss": -12.118155479431152, "global_step": 334240, "epoch": 1989} {"train_loss": -12.059958457946777, "global_step": 334241, "epoch": 1989} {"train_loss": -12.313568115234375, "global_step": 334242, "epoch": 1989} {"train_loss": -12.164222717285156, "global_step": 334243, "epoch": 1989} {"train_loss": -12.440886497497559, "global_step": 334244, "epoch": 1989} {"train_loss": -12.485970497131348, "global_step": 334245, "epoch": 1989} {"train_loss": -12.478744506835938, "global_step": 334246, "epoch": 1989} {"train_loss": -12.300832748413086, "global_step": 334247, "epoch": 1989} {"train_loss": -12.351727485656738, "global_step": 334248, "epoch": 1989} {"train_loss": -12.370536804199219, "global_step": 334249, "epoch": 1989} {"train_loss": -12.351024627685547, "global_step": 334250, "epoch": 1989} {"train_loss": -12.291118621826172, "global_step": 334251, "epoch": 1989} {"train_loss": -12.559598922729492, "global_step": 334252, "epoch": 1989} {"train_loss": -12.527543067932129, "global_step": 334253, "epoch": 1989} {"train_loss": -12.630924224853516, "global_step": 334254, "epoch": 1989} {"train_loss": -12.534830093383789, "global_step": 334255, "epoch": 1989} {"train_loss": -12.437856674194336, "global_step": 334256, "epoch": 1989} {"train_loss": -12.661930084228516, "global_step": 334257, "epoch": 1989} {"train_loss": -12.284326553344727, "global_step": 334258, "epoch": 1989} {"train_loss": -12.630464553833008, "global_step": 334259, "epoch": 1989} {"train_loss": -12.595056533813477, "global_step": 334260, "epoch": 1989} {"train_loss": -12.569174766540527, "global_step": 334261, "epoch": 1989} {"train_loss": -12.43880844116211, "global_step": 334262, "epoch": 1989} {"train_loss": -12.486438751220703, "global_step": 334263, "epoch": 1989} {"train_loss": -12.595930099487305, "global_step": 334264, "epoch": 1989} {"train_loss": -12.667099952697754, "global_step": 334265, "epoch": 1989} {"train_loss": -12.576444625854492, "global_step": 334266, "epoch": 1989} {"train_loss": -12.669964790344238, "global_step": 334267, "epoch": 1989} {"train_loss": -12.50905990600586, "global_step": 334268, "epoch": 1989} {"train_loss": -12.364219665527344, "global_step": 334269, "epoch": 1989} {"train_loss": -12.509880065917969, "global_step": 334270, "epoch": 1989} {"train_loss": -12.33290958404541, "global_step": 334271, "epoch": 1989} {"train_loss": -12.497541427612305, "global_step": 334272, "epoch": 1989} {"train_loss": -12.264748573303223, "global_step": 334273, "epoch": 1989} {"train_loss": -12.22901725769043, "global_step": 334274, "epoch": 1989} {"train_loss": -12.402324676513672, "global_step": 334275, "epoch": 1989} {"train_loss": -12.173774719238281, "global_step": 334276, "epoch": 1989} {"train_loss": -12.209912300109863, "global_step": 334277, "epoch": 1989} {"train_loss": -12.511484146118164, "global_step": 334278, "epoch": 1989} {"train_loss": -12.291423797607422, "global_step": 334279, "epoch": 1989} {"train_loss": -12.384675979614258, "global_step": 334280, "epoch": 1989} {"train_loss": -12.279047966003418, "global_step": 334281, "epoch": 1989} {"train_loss": -12.156609535217285, "global_step": 334282, "epoch": 1989} {"train_loss": -12.2591552734375, "global_step": 334283, "epoch": 1989} {"train_loss": -12.135916709899902, "global_step": 334284, "epoch": 1989} {"train_loss": -12.057537078857422, "global_step": 334285, "epoch": 1989} {"train_loss": -12.49350357055664, "global_step": 334286, "epoch": 1989} {"train_loss": -12.382322311401367, "global_step": 334287, "epoch": 1989} {"train_loss": -11.794145584106445, "global_step": 334288, "epoch": 1989} {"train_loss": -12.402931213378906, "global_step": 334289, "epoch": 1989} {"train_loss": -12.067875862121582, "global_step": 334290, "epoch": 1989} {"train_loss": -12.191746711730957, "global_step": 334291, "epoch": 1989} {"train_loss": -12.19269847869873, "global_step": 334292, "epoch": 1989} {"train_loss": -12.247337341308594, "global_step": 334293, "epoch": 1989} {"train_loss": -11.956893920898438, "global_step": 334294, "epoch": 1989} {"train_loss": -12.279666900634766, "global_step": 334295, "epoch": 1989} {"train_loss": -11.383401870727539, "global_step": 334296, "epoch": 1989} {"train_loss": -9.947247505187988, "global_step": 334297, "epoch": 1989} {"train_loss": -10.988471984863281, "global_step": 334298, "epoch": 1989} {"train_loss": -11.745643615722656, "global_step": 334299, "epoch": 1989} {"train_loss": -10.017709732055664, "global_step": 334300, "epoch": 1989} {"train_loss": -10.345827102661133, "global_step": 334301, "epoch": 1989} {"train_loss": -9.344412803649902, "global_step": 334302, "epoch": 1989} {"train_loss": -8.10757827758789, "global_step": 334303, "epoch": 1989} {"train_loss": -7.388720512390137, "global_step": 334304, "epoch": 1989} {"train_loss": -8.153787612915039, "global_step": 334305, "epoch": 1989} {"train_loss": -9.639814376831055, "global_step": 334306, "epoch": 1989} {"train_loss": -8.68034553527832, "global_step": 334307, "epoch": 1989} {"train_loss": -9.633535385131836, "global_step": 334308, "epoch": 1989} {"train_loss": -10.076478958129883, "global_step": 334309, "epoch": 1989} {"train_loss": -10.277619361877441, "global_step": 334310, "epoch": 1989} {"train_loss": -10.05154800415039, "global_step": 334311, "epoch": 1989} {"train_loss": -10.408920288085938, "global_step": 334312, "epoch": 1989} {"train_loss": -10.079667091369629, "global_step": 334313, "epoch": 1989} {"train_loss": -11.262617111206055, "global_step": 334314, "epoch": 1989} {"train_loss": -10.160441398620605, "global_step": 334315, "epoch": 1989} {"train_loss": -11.245925903320312, "global_step": 334316, "epoch": 1989} {"train_loss": -10.504091262817383, "global_step": 334317, "epoch": 1989} {"train_loss": -10.67718505859375, "global_step": 334318, "epoch": 1989} {"train_loss": -11.585228585061573, "global_step": 334319, "epoch": 1989, "val_loss": 280156.78125} {"train_loss": -10.270938873291016, "global_step": 334320, "epoch": 1990} {"train_loss": -10.250560760498047, "global_step": 334321, "epoch": 1990} {"train_loss": -10.102508544921875, "global_step": 334322, "epoch": 1990} {"train_loss": -11.036823272705078, "global_step": 334323, "epoch": 1990} {"train_loss": -10.353605270385742, "global_step": 334324, "epoch": 1990} {"train_loss": -11.85509204864502, "global_step": 334325, "epoch": 1990} {"train_loss": -10.793769836425781, "global_step": 334326, "epoch": 1990} {"train_loss": -11.583985328674316, "global_step": 334327, "epoch": 1990} {"train_loss": -10.891997337341309, "global_step": 334328, "epoch": 1990} {"train_loss": -11.641145706176758, "global_step": 334329, "epoch": 1990} {"train_loss": -11.418664932250977, "global_step": 334330, "epoch": 1990} {"train_loss": -11.846292495727539, "global_step": 334331, "epoch": 1990} {"train_loss": -11.340849876403809, "global_step": 334332, "epoch": 1990} {"train_loss": -11.368610382080078, "global_step": 334333, "epoch": 1990} {"train_loss": -11.52865219116211, "global_step": 334334, "epoch": 1990} {"train_loss": -11.015060424804688, "global_step": 334335, "epoch": 1990} {"train_loss": -11.785313606262207, "global_step": 334336, "epoch": 1990} {"train_loss": -11.050835609436035, "global_step": 334337, "epoch": 1990} {"train_loss": -12.010906219482422, "global_step": 334338, "epoch": 1990} {"train_loss": -11.23615837097168, "global_step": 334339, "epoch": 1990} {"train_loss": -11.859256744384766, "global_step": 334340, "epoch": 1990} {"train_loss": -11.215625762939453, "global_step": 334341, "epoch": 1990} {"train_loss": -11.566887855529785, "global_step": 334342, "epoch": 1990} {"train_loss": -11.943170547485352, "global_step": 334343, "epoch": 1990} {"train_loss": -11.853235244750977, "global_step": 334344, "epoch": 1990} {"train_loss": -11.696483612060547, "global_step": 334345, "epoch": 1990} {"train_loss": -11.928993225097656, "global_step": 334346, "epoch": 1990} {"train_loss": -11.645244598388672, "global_step": 334347, "epoch": 1990} {"train_loss": -11.64362907409668, "global_step": 334348, "epoch": 1990} {"train_loss": -11.997138977050781, "global_step": 334349, "epoch": 1990} {"train_loss": -11.38742446899414, "global_step": 334350, "epoch": 1990} {"train_loss": -11.83683967590332, "global_step": 334351, "epoch": 1990} {"train_loss": -12.075652122497559, "global_step": 334352, "epoch": 1990} {"train_loss": -11.389310836791992, "global_step": 334353, "epoch": 1990} {"train_loss": -11.84085464477539, "global_step": 334354, "epoch": 1990} {"train_loss": -11.191839218139648, "global_step": 334355, "epoch": 1990} {"train_loss": -11.747063636779785, "global_step": 334356, "epoch": 1990} {"train_loss": -11.780556678771973, "global_step": 334357, "epoch": 1990} {"train_loss": -11.861810684204102, "global_step": 334358, "epoch": 1990} {"train_loss": -11.525630950927734, "global_step": 334359, "epoch": 1990} {"train_loss": -12.022134780883789, "global_step": 334360, "epoch": 1990} {"train_loss": -11.366796493530273, "global_step": 334361, "epoch": 1990} {"train_loss": -11.920463562011719, "global_step": 334362, "epoch": 1990} {"train_loss": -11.91362476348877, "global_step": 334363, "epoch": 1990} {"train_loss": -11.87298583984375, "global_step": 334364, "epoch": 1990} {"train_loss": -11.963321685791016, "global_step": 334365, "epoch": 1990} {"train_loss": -11.767702102661133, "global_step": 334366, "epoch": 1990} {"train_loss": -11.906547546386719, "global_step": 334367, "epoch": 1990} {"train_loss": -11.914318084716797, "global_step": 334368, "epoch": 1990} {"train_loss": -12.235218048095703, "global_step": 334369, "epoch": 1990} {"train_loss": -11.989891052246094, "global_step": 334370, "epoch": 1990} {"train_loss": -12.122821807861328, "global_step": 334371, "epoch": 1990} {"train_loss": -12.182292938232422, "global_step": 334372, "epoch": 1990} {"train_loss": -11.893470764160156, "global_step": 334373, "epoch": 1990} {"train_loss": -12.371162414550781, "global_step": 334374, "epoch": 1990} {"train_loss": -12.184553146362305, "global_step": 334375, "epoch": 1990} {"train_loss": -12.181943893432617, "global_step": 334376, "epoch": 1990} {"train_loss": -12.195762634277344, "global_step": 334377, "epoch": 1990} {"train_loss": -12.128835678100586, "global_step": 334378, "epoch": 1990} {"train_loss": -12.18365478515625, "global_step": 334379, "epoch": 1990} {"train_loss": -12.187387466430664, "global_step": 334380, "epoch": 1990} {"train_loss": -12.082286834716797, "global_step": 334381, "epoch": 1990} {"train_loss": -12.075653076171875, "global_step": 334382, "epoch": 1990} {"train_loss": -12.280082702636719, "global_step": 334383, "epoch": 1990} {"train_loss": -12.39422607421875, "global_step": 334384, "epoch": 1990} {"train_loss": -12.1822509765625, "global_step": 334385, "epoch": 1990} {"train_loss": -12.425350189208984, "global_step": 334386, "epoch": 1990} {"train_loss": -12.276408195495605, "global_step": 334387, "epoch": 1990} {"train_loss": -12.428756713867188, "global_step": 334388, "epoch": 1990} {"train_loss": -12.39877700805664, "global_step": 334389, "epoch": 1990} {"train_loss": -12.37679672241211, "global_step": 334390, "epoch": 1990} {"train_loss": -12.147233963012695, "global_step": 334391, "epoch": 1990} {"train_loss": -12.451639175415039, "global_step": 334392, "epoch": 1990} {"train_loss": -12.202404022216797, "global_step": 334393, "epoch": 1990} {"train_loss": -12.42534351348877, "global_step": 334394, "epoch": 1990} {"train_loss": -12.531036376953125, "global_step": 334395, "epoch": 1990} {"train_loss": -12.403902053833008, "global_step": 334396, "epoch": 1990} {"train_loss": -12.046518325805664, "global_step": 334397, "epoch": 1990} {"train_loss": -12.491792678833008, "global_step": 334398, "epoch": 1990} {"train_loss": -12.50554084777832, "global_step": 334399, "epoch": 1990} {"train_loss": -12.261223793029785, "global_step": 334400, "epoch": 1990} {"train_loss": -12.420982360839844, "global_step": 334401, "epoch": 1990} {"train_loss": -12.384564399719238, "global_step": 334402, "epoch": 1990} {"train_loss": -12.447453498840332, "global_step": 334403, "epoch": 1990} {"train_loss": -12.479792594909668, "global_step": 334404, "epoch": 1990} {"train_loss": -12.588106155395508, "global_step": 334405, "epoch": 1990} {"train_loss": -12.548818588256836, "global_step": 334406, "epoch": 1990} {"train_loss": -12.53463363647461, "global_step": 334407, "epoch": 1990} {"train_loss": -12.563902854919434, "global_step": 334408, "epoch": 1990} {"train_loss": -12.461328506469727, "global_step": 334409, "epoch": 1990} {"train_loss": -12.557355880737305, "global_step": 334410, "epoch": 1990} {"train_loss": -12.49392032623291, "global_step": 334411, "epoch": 1990} {"train_loss": -12.464658737182617, "global_step": 334412, "epoch": 1990} {"train_loss": -12.444892883300781, "global_step": 334413, "epoch": 1990} {"train_loss": -12.187503814697266, "global_step": 334414, "epoch": 1990} {"train_loss": -12.40135383605957, "global_step": 334415, "epoch": 1990} {"train_loss": -12.507513999938965, "global_step": 334416, "epoch": 1990} {"train_loss": -12.809350967407227, "global_step": 334417, "epoch": 1990} {"train_loss": -12.538529396057129, "global_step": 334418, "epoch": 1990} {"train_loss": -12.652322769165039, "global_step": 334419, "epoch": 1990} {"train_loss": -12.555864334106445, "global_step": 334420, "epoch": 1990} {"train_loss": -12.455341339111328, "global_step": 334421, "epoch": 1990} {"train_loss": -12.390146255493164, "global_step": 334422, "epoch": 1990} {"train_loss": -12.006275177001953, "global_step": 334423, "epoch": 1990} {"train_loss": -12.556957244873047, "global_step": 334424, "epoch": 1990} {"train_loss": -12.498069763183594, "global_step": 334425, "epoch": 1990} {"train_loss": -11.885932922363281, "global_step": 334426, "epoch": 1990} {"train_loss": -11.605295181274414, "global_step": 334427, "epoch": 1990} {"train_loss": -12.195016860961914, "global_step": 334428, "epoch": 1990} {"train_loss": -12.536770820617676, "global_step": 334429, "epoch": 1990} {"train_loss": -12.634418487548828, "global_step": 334430, "epoch": 1990} {"train_loss": -12.55921459197998, "global_step": 334431, "epoch": 1990} {"train_loss": -12.454643249511719, "global_step": 334432, "epoch": 1990} {"train_loss": -12.067384719848633, "global_step": 334433, "epoch": 1990} {"train_loss": -12.416473388671875, "global_step": 334434, "epoch": 1990} {"train_loss": -12.509140014648438, "global_step": 334435, "epoch": 1990} {"train_loss": -12.30197811126709, "global_step": 334436, "epoch": 1990} {"train_loss": -12.028956413269043, "global_step": 334437, "epoch": 1990} {"train_loss": -12.759055137634277, "global_step": 334438, "epoch": 1990} {"train_loss": -12.210407257080078, "global_step": 334439, "epoch": 1990} {"train_loss": -11.570756912231445, "global_step": 334440, "epoch": 1990} {"train_loss": -12.097352981567383, "global_step": 334441, "epoch": 1990} {"train_loss": -12.2266845703125, "global_step": 334442, "epoch": 1990} {"train_loss": -10.72634220123291, "global_step": 334443, "epoch": 1990} {"train_loss": -11.217025756835938, "global_step": 334444, "epoch": 1990} {"train_loss": -11.616548538208008, "global_step": 334445, "epoch": 1990} {"train_loss": -9.570088386535645, "global_step": 334446, "epoch": 1990} {"train_loss": -8.987215042114258, "global_step": 334447, "epoch": 1990} {"train_loss": -8.139707565307617, "global_step": 334448, "epoch": 1990} {"train_loss": -9.410109519958496, "global_step": 334449, "epoch": 1990} {"train_loss": -10.146328926086426, "global_step": 334450, "epoch": 1990} {"train_loss": -9.135497093200684, "global_step": 334451, "epoch": 1990} {"train_loss": -9.792558670043945, "global_step": 334452, "epoch": 1990} {"train_loss": -8.762091636657715, "global_step": 334453, "epoch": 1990} {"train_loss": -8.36367416381836, "global_step": 334454, "epoch": 1990} {"train_loss": -7.77735710144043, "global_step": 334455, "epoch": 1990} {"train_loss": -9.187033653259277, "global_step": 334456, "epoch": 1990} {"train_loss": -9.526481628417969, "global_step": 334457, "epoch": 1990} {"train_loss": -9.705535888671875, "global_step": 334458, "epoch": 1990} {"train_loss": -9.523721694946289, "global_step": 334459, "epoch": 1990} {"train_loss": -9.173369407653809, "global_step": 334460, "epoch": 1990} {"train_loss": -11.152502059936523, "global_step": 334461, "epoch": 1990} {"train_loss": -10.403524398803711, "global_step": 334462, "epoch": 1990} {"train_loss": -11.192298889160156, "global_step": 334463, "epoch": 1990} {"train_loss": -11.167956352233887, "global_step": 334464, "epoch": 1990} {"train_loss": -11.03032398223877, "global_step": 334465, "epoch": 1990} {"train_loss": -10.710821151733398, "global_step": 334466, "epoch": 1990} {"train_loss": -11.259965896606445, "global_step": 334467, "epoch": 1990} {"train_loss": -11.067606925964355, "global_step": 334468, "epoch": 1990} {"train_loss": -11.561450958251953, "global_step": 334469, "epoch": 1990} {"train_loss": -11.223852157592773, "global_step": 334470, "epoch": 1990} {"train_loss": -11.377157211303711, "global_step": 334471, "epoch": 1990} {"train_loss": -10.715065002441406, "global_step": 334472, "epoch": 1990} {"train_loss": -11.092938423156738, "global_step": 334473, "epoch": 1990} {"train_loss": -10.769824981689453, "global_step": 334474, "epoch": 1990} {"train_loss": -11.581068992614746, "global_step": 334475, "epoch": 1990} {"train_loss": -10.888811111450195, "global_step": 334476, "epoch": 1990} {"train_loss": -11.690577507019043, "global_step": 334477, "epoch": 1990} {"train_loss": -11.333443641662598, "global_step": 334478, "epoch": 1990} {"train_loss": -11.792279243469238, "global_step": 334479, "epoch": 1990} {"train_loss": -11.383027076721191, "global_step": 334480, "epoch": 1990} {"train_loss": -11.562471389770508, "global_step": 334481, "epoch": 1990} {"train_loss": -11.5398588180542, "global_step": 334482, "epoch": 1990} {"train_loss": -11.661746978759766, "global_step": 334483, "epoch": 1990} {"train_loss": -11.661771774291992, "global_step": 334484, "epoch": 1990} {"train_loss": -11.688823699951172, "global_step": 334485, "epoch": 1990} {"train_loss": -11.709310531616211, "global_step": 334486, "epoch": 1990} {"train_loss": -11.617517306691123, "global_step": 334487, "epoch": 1990, "val_loss": 279879.4375, "train_action_mse_error": 1.1485334634780884} {"train_loss": -11.607436180114746, "global_step": 334488, "epoch": 1991} {"train_loss": -11.281930923461914, "global_step": 334489, "epoch": 1991} {"train_loss": -11.575489044189453, "global_step": 334490, "epoch": 1991} {"train_loss": -11.448356628417969, "global_step": 334491, "epoch": 1991} {"train_loss": -11.61526107788086, "global_step": 334492, "epoch": 1991} {"train_loss": -11.439411163330078, "global_step": 334493, "epoch": 1991} {"train_loss": -11.453519821166992, "global_step": 334494, "epoch": 1991} {"train_loss": -11.913307189941406, "global_step": 334495, "epoch": 1991} {"train_loss": -11.77995491027832, "global_step": 334496, "epoch": 1991} {"train_loss": -11.787912368774414, "global_step": 334497, "epoch": 1991} {"train_loss": -11.44503402709961, "global_step": 334498, "epoch": 1991} {"train_loss": -11.884336471557617, "global_step": 334499, "epoch": 1991} {"train_loss": -11.677345275878906, "global_step": 334500, "epoch": 1991} {"train_loss": -12.180130958557129, "global_step": 334501, "epoch": 1991} {"train_loss": -11.777719497680664, "global_step": 334502, "epoch": 1991} {"train_loss": -11.922077178955078, "global_step": 334503, "epoch": 1991} {"train_loss": -11.93563461303711, "global_step": 334504, "epoch": 1991} {"train_loss": -11.938166618347168, "global_step": 334505, "epoch": 1991} {"train_loss": -12.137655258178711, "global_step": 334506, "epoch": 1991} {"train_loss": -12.012088775634766, "global_step": 334507, "epoch": 1991} {"train_loss": -11.98744010925293, "global_step": 334508, "epoch": 1991} {"train_loss": -11.871316909790039, "global_step": 334509, "epoch": 1991} {"train_loss": -12.186308860778809, "global_step": 334510, "epoch": 1991} {"train_loss": -11.924765586853027, "global_step": 334511, "epoch": 1991} {"train_loss": -12.275972366333008, "global_step": 334512, "epoch": 1991} {"train_loss": -11.970757484436035, "global_step": 334513, "epoch": 1991} {"train_loss": -12.229024887084961, "global_step": 334514, "epoch": 1991} {"train_loss": -12.244976997375488, "global_step": 334515, "epoch": 1991} {"train_loss": -11.923361778259277, "global_step": 334516, "epoch": 1991} {"train_loss": -12.255437850952148, "global_step": 334517, "epoch": 1991} {"train_loss": -12.22410774230957, "global_step": 334518, "epoch": 1991} {"train_loss": -12.241594314575195, "global_step": 334519, "epoch": 1991} {"train_loss": -12.304227828979492, "global_step": 334520, "epoch": 1991} {"train_loss": -12.273277282714844, "global_step": 334521, "epoch": 1991} {"train_loss": -12.08425521850586, "global_step": 334522, "epoch": 1991} {"train_loss": -12.425033569335938, "global_step": 334523, "epoch": 1991} {"train_loss": -12.353591918945312, "global_step": 334524, "epoch": 1991} {"train_loss": -12.265721321105957, "global_step": 334525, "epoch": 1991} {"train_loss": -12.45488166809082, "global_step": 334526, "epoch": 1991} {"train_loss": -12.475425720214844, "global_step": 334527, "epoch": 1991} {"train_loss": -12.374711990356445, "global_step": 334528, "epoch": 1991} {"train_loss": -12.53982925415039, "global_step": 334529, "epoch": 1991} {"train_loss": -12.598831176757812, "global_step": 334530, "epoch": 1991} {"train_loss": -12.480377197265625, "global_step": 334531, "epoch": 1991} {"train_loss": -12.557760238647461, "global_step": 334532, "epoch": 1991} {"train_loss": -12.18937873840332, "global_step": 334533, "epoch": 1991} {"train_loss": -12.482455253601074, "global_step": 334534, "epoch": 1991} {"train_loss": -12.322043418884277, "global_step": 334535, "epoch": 1991} {"train_loss": -12.341490745544434, "global_step": 334536, "epoch": 1991} {"train_loss": -12.589977264404297, "global_step": 334537, "epoch": 1991} {"train_loss": -12.459205627441406, "global_step": 334538, "epoch": 1991} {"train_loss": -12.463324546813965, "global_step": 334539, "epoch": 1991} {"train_loss": -12.086023330688477, "global_step": 334540, "epoch": 1991} {"train_loss": -12.41724681854248, "global_step": 334541, "epoch": 1991} {"train_loss": -12.368122100830078, "global_step": 334542, "epoch": 1991} {"train_loss": -12.506584167480469, "global_step": 334543, "epoch": 1991} {"train_loss": -12.51531982421875, "global_step": 334544, "epoch": 1991} {"train_loss": -12.330217361450195, "global_step": 334545, "epoch": 1991} {"train_loss": -12.633428573608398, "global_step": 334546, "epoch": 1991} {"train_loss": -12.443284034729004, "global_step": 334547, "epoch": 1991} {"train_loss": -12.30797004699707, "global_step": 334548, "epoch": 1991} {"train_loss": -12.576391220092773, "global_step": 334549, "epoch": 1991} {"train_loss": -12.292375564575195, "global_step": 334550, "epoch": 1991} {"train_loss": -12.237072944641113, "global_step": 334551, "epoch": 1991} {"train_loss": -12.259142875671387, "global_step": 334552, "epoch": 1991} {"train_loss": -12.38987922668457, "global_step": 334553, "epoch": 1991} {"train_loss": -12.564407348632812, "global_step": 334554, "epoch": 1991} {"train_loss": -12.088120460510254, "global_step": 334555, "epoch": 1991} {"train_loss": -12.567177772521973, "global_step": 334556, "epoch": 1991} {"train_loss": -12.52274227142334, "global_step": 334557, "epoch": 1991} {"train_loss": -12.38366413116455, "global_step": 334558, "epoch": 1991} {"train_loss": -12.43267822265625, "global_step": 334559, "epoch": 1991} {"train_loss": -12.77538776397705, "global_step": 334560, "epoch": 1991} {"train_loss": -12.441402435302734, "global_step": 334561, "epoch": 1991} {"train_loss": -12.55708122253418, "global_step": 334562, "epoch": 1991} {"train_loss": -12.577278137207031, "global_step": 334563, "epoch": 1991} {"train_loss": -12.517637252807617, "global_step": 334564, "epoch": 1991} {"train_loss": -12.571775436401367, "global_step": 334565, "epoch": 1991} {"train_loss": -12.375749588012695, "global_step": 334566, "epoch": 1991} {"train_loss": -12.476678848266602, "global_step": 334567, "epoch": 1991} {"train_loss": -12.563138961791992, "global_step": 334568, "epoch": 1991} {"train_loss": -12.608560562133789, "global_step": 334569, "epoch": 1991} {"train_loss": -12.379348754882812, "global_step": 334570, "epoch": 1991} {"train_loss": -12.371772766113281, "global_step": 334571, "epoch": 1991} {"train_loss": -12.34790325164795, "global_step": 334572, "epoch": 1991} {"train_loss": -12.526058197021484, "global_step": 334573, "epoch": 1991} {"train_loss": -11.699515342712402, "global_step": 334574, "epoch": 1991} {"train_loss": -11.904160499572754, "global_step": 334575, "epoch": 1991} {"train_loss": -11.553024291992188, "global_step": 334576, "epoch": 1991} {"train_loss": -9.614814758300781, "global_step": 334577, "epoch": 1991} {"train_loss": -10.023635864257812, "global_step": 334578, "epoch": 1991} {"train_loss": -11.528942108154297, "global_step": 334579, "epoch": 1991} {"train_loss": -10.16352653503418, "global_step": 334580, "epoch": 1991} {"train_loss": -10.391626358032227, "global_step": 334581, "epoch": 1991} {"train_loss": -11.188119888305664, "global_step": 334582, "epoch": 1991} {"train_loss": -11.569197654724121, "global_step": 334583, "epoch": 1991} {"train_loss": -10.384747505187988, "global_step": 334584, "epoch": 1991} {"train_loss": -10.69317626953125, "global_step": 334585, "epoch": 1991} {"train_loss": -10.370502471923828, "global_step": 334586, "epoch": 1991} {"train_loss": -10.835488319396973, "global_step": 334587, "epoch": 1991} {"train_loss": -11.52016830444336, "global_step": 334588, "epoch": 1991} {"train_loss": -11.037004470825195, "global_step": 334589, "epoch": 1991} {"train_loss": -11.684514045715332, "global_step": 334590, "epoch": 1991} {"train_loss": -10.246036529541016, "global_step": 334591, "epoch": 1991} {"train_loss": -11.786269187927246, "global_step": 334592, "epoch": 1991} {"train_loss": -10.963072776794434, "global_step": 334593, "epoch": 1991} {"train_loss": -10.950836181640625, "global_step": 334594, "epoch": 1991} {"train_loss": -10.679075241088867, "global_step": 334595, "epoch": 1991} {"train_loss": -9.846821784973145, "global_step": 334596, "epoch": 1991} {"train_loss": -10.056055068969727, "global_step": 334597, "epoch": 1991} {"train_loss": -11.540356636047363, "global_step": 334598, "epoch": 1991} {"train_loss": -9.12948989868164, "global_step": 334599, "epoch": 1991} {"train_loss": -12.000381469726562, "global_step": 334600, "epoch": 1991} {"train_loss": -10.301916122436523, "global_step": 334601, "epoch": 1991} {"train_loss": -11.142273902893066, "global_step": 334602, "epoch": 1991} {"train_loss": -10.625226020812988, "global_step": 334603, "epoch": 1991} {"train_loss": -10.143239974975586, "global_step": 334604, "epoch": 1991} {"train_loss": -10.592580795288086, "global_step": 334605, "epoch": 1991} {"train_loss": -11.14796257019043, "global_step": 334606, "epoch": 1991} {"train_loss": -11.000011444091797, "global_step": 334607, "epoch": 1991} {"train_loss": -11.425634384155273, "global_step": 334608, "epoch": 1991} {"train_loss": -11.538389205932617, "global_step": 334609, "epoch": 1991} {"train_loss": -11.440614700317383, "global_step": 334610, "epoch": 1991} {"train_loss": -11.572330474853516, "global_step": 334611, "epoch": 1991} {"train_loss": -12.029133796691895, "global_step": 334612, "epoch": 1991} {"train_loss": -11.441625595092773, "global_step": 334613, "epoch": 1991} {"train_loss": -11.808469772338867, "global_step": 334614, "epoch": 1991} {"train_loss": -11.73164176940918, "global_step": 334615, "epoch": 1991} {"train_loss": -11.657746315002441, "global_step": 334616, "epoch": 1991} {"train_loss": -11.815042495727539, "global_step": 334617, "epoch": 1991} {"train_loss": -11.609434127807617, "global_step": 334618, "epoch": 1991} {"train_loss": -12.027786254882812, "global_step": 334619, "epoch": 1991} {"train_loss": -11.790122032165527, "global_step": 334620, "epoch": 1991} {"train_loss": -11.880730628967285, "global_step": 334621, "epoch": 1991} {"train_loss": -11.922443389892578, "global_step": 334622, "epoch": 1991} {"train_loss": -11.73361587524414, "global_step": 334623, "epoch": 1991} {"train_loss": -12.14468002319336, "global_step": 334624, "epoch": 1991} {"train_loss": -12.045628547668457, "global_step": 334625, "epoch": 1991} {"train_loss": -11.755516052246094, "global_step": 334626, "epoch": 1991} {"train_loss": -12.01582145690918, "global_step": 334627, "epoch": 1991} {"train_loss": -11.680351257324219, "global_step": 334628, "epoch": 1991} {"train_loss": -12.22424030303955, "global_step": 334629, "epoch": 1991} {"train_loss": -11.999980926513672, "global_step": 334630, "epoch": 1991} {"train_loss": -12.193638801574707, "global_step": 334631, "epoch": 1991} {"train_loss": -11.999576568603516, "global_step": 334632, "epoch": 1991} {"train_loss": -12.274053573608398, "global_step": 334633, "epoch": 1991} {"train_loss": -12.276865005493164, "global_step": 334634, "epoch": 1991} {"train_loss": -12.22030258178711, "global_step": 334635, "epoch": 1991} {"train_loss": -12.20321273803711, "global_step": 334636, "epoch": 1991} {"train_loss": -12.114245414733887, "global_step": 334637, "epoch": 1991} {"train_loss": -12.123144149780273, "global_step": 334638, "epoch": 1991} {"train_loss": -12.3524169921875, "global_step": 334639, "epoch": 1991} {"train_loss": -12.244128227233887, "global_step": 334640, "epoch": 1991} {"train_loss": -12.23691177368164, "global_step": 334641, "epoch": 1991} {"train_loss": -12.039376258850098, "global_step": 334642, "epoch": 1991} {"train_loss": -11.989542007446289, "global_step": 334643, "epoch": 1991} {"train_loss": -11.973027229309082, "global_step": 334644, "epoch": 1991} {"train_loss": -12.193330764770508, "global_step": 334645, "epoch": 1991} {"train_loss": -12.239545822143555, "global_step": 334646, "epoch": 1991} {"train_loss": -12.19032096862793, "global_step": 334647, "epoch": 1991} {"train_loss": -12.460102081298828, "global_step": 334648, "epoch": 1991} {"train_loss": -11.919590950012207, "global_step": 334649, "epoch": 1991} {"train_loss": -12.34692096710205, "global_step": 334650, "epoch": 1991} {"train_loss": -12.066352844238281, "global_step": 334651, "epoch": 1991} {"train_loss": -12.411107063293457, "global_step": 334652, "epoch": 1991} {"train_loss": -12.2039213180542, "global_step": 334653, "epoch": 1991} {"train_loss": -12.036092758178711, "global_step": 334654, "epoch": 1991} {"train_loss": -11.877762726375035, "global_step": 334655, "epoch": 1991, "val_loss": 287704.46875} {"train_loss": -12.202880859375, "global_step": 334656, "epoch": 1992} {"train_loss": -12.580205917358398, "global_step": 334657, "epoch": 1992} {"train_loss": -12.319168090820312, "global_step": 334658, "epoch": 1992} {"train_loss": -12.425880432128906, "global_step": 334659, "epoch": 1992} {"train_loss": -12.341678619384766, "global_step": 334660, "epoch": 1992} {"train_loss": -12.189891815185547, "global_step": 334661, "epoch": 1992} {"train_loss": -12.479423522949219, "global_step": 334662, "epoch": 1992} {"train_loss": -12.472436904907227, "global_step": 334663, "epoch": 1992} {"train_loss": -12.59810733795166, "global_step": 334664, "epoch": 1992} {"train_loss": -12.319278717041016, "global_step": 334665, "epoch": 1992} {"train_loss": -12.113224029541016, "global_step": 334666, "epoch": 1992} {"train_loss": -12.145462036132812, "global_step": 334667, "epoch": 1992} {"train_loss": -12.385257720947266, "global_step": 334668, "epoch": 1992} {"train_loss": -11.983100891113281, "global_step": 334669, "epoch": 1992} {"train_loss": -12.234708786010742, "global_step": 334670, "epoch": 1992} {"train_loss": -12.122852325439453, "global_step": 334671, "epoch": 1992} {"train_loss": -12.3603515625, "global_step": 334672, "epoch": 1992} {"train_loss": -12.076072692871094, "global_step": 334673, "epoch": 1992} {"train_loss": -12.062080383300781, "global_step": 334674, "epoch": 1992} {"train_loss": -11.809019088745117, "global_step": 334675, "epoch": 1992} {"train_loss": -12.201730728149414, "global_step": 334676, "epoch": 1992} {"train_loss": -11.843647956848145, "global_step": 334677, "epoch": 1992} {"train_loss": -11.869281768798828, "global_step": 334678, "epoch": 1992} {"train_loss": -11.699531555175781, "global_step": 334679, "epoch": 1992} {"train_loss": -11.529728889465332, "global_step": 334680, "epoch": 1992} {"train_loss": -12.211162567138672, "global_step": 334681, "epoch": 1992} {"train_loss": -12.25814437866211, "global_step": 334682, "epoch": 1992} {"train_loss": -11.735023498535156, "global_step": 334683, "epoch": 1992} {"train_loss": -12.459373474121094, "global_step": 334684, "epoch": 1992} {"train_loss": -12.167043685913086, "global_step": 334685, "epoch": 1992} {"train_loss": -12.367929458618164, "global_step": 334686, "epoch": 1992} {"train_loss": -12.078421592712402, "global_step": 334687, "epoch": 1992} {"train_loss": -12.254621505737305, "global_step": 334688, "epoch": 1992} {"train_loss": -12.028564453125, "global_step": 334689, "epoch": 1992} {"train_loss": -11.6793212890625, "global_step": 334690, "epoch": 1992} {"train_loss": -11.823596954345703, "global_step": 334691, "epoch": 1992} {"train_loss": -11.385696411132812, "global_step": 334692, "epoch": 1992} {"train_loss": -11.385091781616211, "global_step": 334693, "epoch": 1992} {"train_loss": -11.010546684265137, "global_step": 334694, "epoch": 1992} {"train_loss": -10.843520164489746, "global_step": 334695, "epoch": 1992} {"train_loss": -12.237436294555664, "global_step": 334696, "epoch": 1992} {"train_loss": -11.836583137512207, "global_step": 334697, "epoch": 1992} {"train_loss": -11.426936149597168, "global_step": 334698, "epoch": 1992} {"train_loss": -11.432378768920898, "global_step": 334699, "epoch": 1992} {"train_loss": -11.805668830871582, "global_step": 334700, "epoch": 1992} {"train_loss": -12.007705688476562, "global_step": 334701, "epoch": 1992} {"train_loss": -10.715304374694824, "global_step": 334702, "epoch": 1992} {"train_loss": -11.812606811523438, "global_step": 334703, "epoch": 1992} {"train_loss": -11.832969665527344, "global_step": 334704, "epoch": 1992} {"train_loss": -12.282121658325195, "global_step": 334705, "epoch": 1992} {"train_loss": -12.25244140625, "global_step": 334706, "epoch": 1992} {"train_loss": -11.929333686828613, "global_step": 334707, "epoch": 1992} {"train_loss": -11.839829444885254, "global_step": 334708, "epoch": 1992} {"train_loss": -11.725651741027832, "global_step": 334709, "epoch": 1992} {"train_loss": -12.028098106384277, "global_step": 334710, "epoch": 1992} {"train_loss": -11.697110176086426, "global_step": 334711, "epoch": 1992} {"train_loss": -10.596630096435547, "global_step": 334712, "epoch": 1992} {"train_loss": -11.845054626464844, "global_step": 334713, "epoch": 1992} {"train_loss": -11.81604290008545, "global_step": 334714, "epoch": 1992} {"train_loss": -12.132028579711914, "global_step": 334715, "epoch": 1992} {"train_loss": -11.869163513183594, "global_step": 334716, "epoch": 1992} {"train_loss": -11.973490715026855, "global_step": 334717, "epoch": 1992} {"train_loss": -11.987722396850586, "global_step": 334718, "epoch": 1992} {"train_loss": -11.974048614501953, "global_step": 334719, "epoch": 1992} {"train_loss": -12.096365928649902, "global_step": 334720, "epoch": 1992} {"train_loss": -11.850759506225586, "global_step": 334721, "epoch": 1992} {"train_loss": -12.242315292358398, "global_step": 334722, "epoch": 1992} {"train_loss": -12.070951461791992, "global_step": 334723, "epoch": 1992} {"train_loss": -12.182995796203613, "global_step": 334724, "epoch": 1992} {"train_loss": -12.192991256713867, "global_step": 334725, "epoch": 1992} {"train_loss": -12.217451095581055, "global_step": 334726, "epoch": 1992} {"train_loss": -11.875955581665039, "global_step": 334727, "epoch": 1992} {"train_loss": -12.356847763061523, "global_step": 334728, "epoch": 1992} {"train_loss": -12.152321815490723, "global_step": 334729, "epoch": 1992} {"train_loss": -12.23938274383545, "global_step": 334730, "epoch": 1992} {"train_loss": -12.212318420410156, "global_step": 334731, "epoch": 1992} {"train_loss": -12.01517391204834, "global_step": 334732, "epoch": 1992} {"train_loss": -12.37582778930664, "global_step": 334733, "epoch": 1992} {"train_loss": -12.040863037109375, "global_step": 334734, "epoch": 1992} {"train_loss": -12.300236701965332, "global_step": 334735, "epoch": 1992} {"train_loss": -12.18807601928711, "global_step": 334736, "epoch": 1992} {"train_loss": -12.37399673461914, "global_step": 334737, "epoch": 1992} {"train_loss": -12.192455291748047, "global_step": 334738, "epoch": 1992} {"train_loss": -12.17807388305664, "global_step": 334739, "epoch": 1992} {"train_loss": -12.425477981567383, "global_step": 334740, "epoch": 1992} {"train_loss": -12.107421875, "global_step": 334741, "epoch": 1992} {"train_loss": -12.170652389526367, "global_step": 334742, "epoch": 1992} {"train_loss": -12.355364799499512, "global_step": 334743, "epoch": 1992} {"train_loss": -11.930680274963379, "global_step": 334744, "epoch": 1992} {"train_loss": -12.38084602355957, "global_step": 334745, "epoch": 1992} {"train_loss": -12.385269165039062, "global_step": 334746, "epoch": 1992} {"train_loss": -11.657570838928223, "global_step": 334747, "epoch": 1992} {"train_loss": -12.372724533081055, "global_step": 334748, "epoch": 1992} {"train_loss": -11.602916717529297, "global_step": 334749, "epoch": 1992} {"train_loss": -11.766620635986328, "global_step": 334750, "epoch": 1992} {"train_loss": -12.489845275878906, "global_step": 334751, "epoch": 1992} {"train_loss": -12.357006072998047, "global_step": 334752, "epoch": 1992} {"train_loss": -11.961008071899414, "global_step": 334753, "epoch": 1992} {"train_loss": -12.052827835083008, "global_step": 334754, "epoch": 1992} {"train_loss": -11.986175537109375, "global_step": 334755, "epoch": 1992} {"train_loss": -11.17105484008789, "global_step": 334756, "epoch": 1992} {"train_loss": -12.55875301361084, "global_step": 334757, "epoch": 1992} {"train_loss": -11.035494804382324, "global_step": 334758, "epoch": 1992} {"train_loss": -10.537885665893555, "global_step": 334759, "epoch": 1992} {"train_loss": -12.257803916931152, "global_step": 334760, "epoch": 1992} {"train_loss": -11.473199844360352, "global_step": 334761, "epoch": 1992} {"train_loss": -11.79751205444336, "global_step": 334762, "epoch": 1992} {"train_loss": -12.081933975219727, "global_step": 334763, "epoch": 1992} {"train_loss": -11.472845077514648, "global_step": 334764, "epoch": 1992} {"train_loss": -12.183591842651367, "global_step": 334765, "epoch": 1992} {"train_loss": -11.613761901855469, "global_step": 334766, "epoch": 1992} {"train_loss": -12.098008155822754, "global_step": 334767, "epoch": 1992} {"train_loss": -11.897319793701172, "global_step": 334768, "epoch": 1992} {"train_loss": -12.334510803222656, "global_step": 334769, "epoch": 1992} {"train_loss": -12.34361457824707, "global_step": 334770, "epoch": 1992} {"train_loss": -12.137667655944824, "global_step": 334771, "epoch": 1992} {"train_loss": -12.264110565185547, "global_step": 334772, "epoch": 1992} {"train_loss": -12.278636932373047, "global_step": 334773, "epoch": 1992} {"train_loss": -12.177270889282227, "global_step": 334774, "epoch": 1992} {"train_loss": -12.030500411987305, "global_step": 334775, "epoch": 1992} {"train_loss": -12.074355125427246, "global_step": 334776, "epoch": 1992} {"train_loss": -12.080307006835938, "global_step": 334777, "epoch": 1992} {"train_loss": -11.347482681274414, "global_step": 334778, "epoch": 1992} {"train_loss": -12.438928604125977, "global_step": 334779, "epoch": 1992} {"train_loss": -12.096887588500977, "global_step": 334780, "epoch": 1992} {"train_loss": -11.980298042297363, "global_step": 334781, "epoch": 1992} {"train_loss": -12.326071739196777, "global_step": 334782, "epoch": 1992} {"train_loss": -11.14206314086914, "global_step": 334783, "epoch": 1992} {"train_loss": -11.37087345123291, "global_step": 334784, "epoch": 1992} {"train_loss": -12.558855056762695, "global_step": 334785, "epoch": 1992} {"train_loss": -12.022675514221191, "global_step": 334786, "epoch": 1992} {"train_loss": -12.022350311279297, "global_step": 334787, "epoch": 1992} {"train_loss": -12.211309432983398, "global_step": 334788, "epoch": 1992} {"train_loss": -12.329385757446289, "global_step": 334789, "epoch": 1992} {"train_loss": -11.908458709716797, "global_step": 334790, "epoch": 1992} {"train_loss": -12.448707580566406, "global_step": 334791, "epoch": 1992} {"train_loss": -12.360119819641113, "global_step": 334792, "epoch": 1992} {"train_loss": -12.298474311828613, "global_step": 334793, "epoch": 1992} {"train_loss": -12.408185005187988, "global_step": 334794, "epoch": 1992} {"train_loss": -12.208307266235352, "global_step": 334795, "epoch": 1992} {"train_loss": -12.255229949951172, "global_step": 334796, "epoch": 1992} {"train_loss": -12.334264755249023, "global_step": 334797, "epoch": 1992} {"train_loss": -12.37736701965332, "global_step": 334798, "epoch": 1992} {"train_loss": -12.420085906982422, "global_step": 334799, "epoch": 1992} {"train_loss": -12.507810592651367, "global_step": 334800, "epoch": 1992} {"train_loss": -12.630128860473633, "global_step": 334801, "epoch": 1992} {"train_loss": -12.710132598876953, "global_step": 334802, "epoch": 1992} {"train_loss": -12.153072357177734, "global_step": 334803, "epoch": 1992} {"train_loss": -12.458260536193848, "global_step": 334804, "epoch": 1992} {"train_loss": -12.328951835632324, "global_step": 334805, "epoch": 1992} {"train_loss": -12.478631019592285, "global_step": 334806, "epoch": 1992} {"train_loss": -12.381071090698242, "global_step": 334807, "epoch": 1992} {"train_loss": -12.377309799194336, "global_step": 334808, "epoch": 1992} {"train_loss": -12.500345230102539, "global_step": 334809, "epoch": 1992} {"train_loss": -12.240951538085938, "global_step": 334810, "epoch": 1992} {"train_loss": -12.427594184875488, "global_step": 334811, "epoch": 1992} {"train_loss": -12.334959983825684, "global_step": 334812, "epoch": 1992} {"train_loss": -12.292749404907227, "global_step": 334813, "epoch": 1992} {"train_loss": -12.234355926513672, "global_step": 334814, "epoch": 1992} {"train_loss": -12.668764114379883, "global_step": 334815, "epoch": 1992} {"train_loss": -12.281134605407715, "global_step": 334816, "epoch": 1992} {"train_loss": -12.527036666870117, "global_step": 334817, "epoch": 1992} {"train_loss": -12.157272338867188, "global_step": 334818, "epoch": 1992} {"train_loss": -12.525185585021973, "global_step": 334819, "epoch": 1992} {"train_loss": -12.586508750915527, "global_step": 334820, "epoch": 1992} {"train_loss": -12.70444107055664, "global_step": 334821, "epoch": 1992} {"train_loss": -12.427294731140137, "global_step": 334822, "epoch": 1992} {"train_loss": -12.081959151086354, "global_step": 334823, "epoch": 1992, "val_loss": 290600.625} {"train_loss": -12.361581802368164, "global_step": 334824, "epoch": 1993} {"train_loss": -12.17794132232666, "global_step": 334825, "epoch": 1993} {"train_loss": -12.059562683105469, "global_step": 334826, "epoch": 1993} {"train_loss": -12.46323013305664, "global_step": 334827, "epoch": 1993} {"train_loss": -11.731295585632324, "global_step": 334828, "epoch": 1993} {"train_loss": -10.241521835327148, "global_step": 334829, "epoch": 1993} {"train_loss": -12.367949485778809, "global_step": 334830, "epoch": 1993} {"train_loss": -11.914048194885254, "global_step": 334831, "epoch": 1993} {"train_loss": -11.581463813781738, "global_step": 334832, "epoch": 1993} {"train_loss": -12.520100593566895, "global_step": 334833, "epoch": 1993} {"train_loss": -12.375041961669922, "global_step": 334834, "epoch": 1993} {"train_loss": -11.861827850341797, "global_step": 334835, "epoch": 1993} {"train_loss": -12.086283683776855, "global_step": 334836, "epoch": 1993} {"train_loss": -11.851391792297363, "global_step": 334837, "epoch": 1993} {"train_loss": -12.049753189086914, "global_step": 334838, "epoch": 1993} {"train_loss": -11.85781192779541, "global_step": 334839, "epoch": 1993} {"train_loss": -12.34775161743164, "global_step": 334840, "epoch": 1993} {"train_loss": -11.542381286621094, "global_step": 334841, "epoch": 1993} {"train_loss": -11.763969421386719, "global_step": 334842, "epoch": 1993} {"train_loss": -12.231023788452148, "global_step": 334843, "epoch": 1993} {"train_loss": -12.067461013793945, "global_step": 334844, "epoch": 1993} {"train_loss": -11.943511009216309, "global_step": 334845, "epoch": 1993} {"train_loss": -11.841597557067871, "global_step": 334846, "epoch": 1993} {"train_loss": -11.881661415100098, "global_step": 334847, "epoch": 1993} {"train_loss": -11.002248764038086, "global_step": 334848, "epoch": 1993} {"train_loss": -11.78284740447998, "global_step": 334849, "epoch": 1993} {"train_loss": -10.657820701599121, "global_step": 334850, "epoch": 1993} {"train_loss": -11.590166091918945, "global_step": 334851, "epoch": 1993} {"train_loss": -10.651365280151367, "global_step": 334852, "epoch": 1993} {"train_loss": -11.348737716674805, "global_step": 334853, "epoch": 1993} {"train_loss": -10.610336303710938, "global_step": 334854, "epoch": 1993} {"train_loss": -10.265085220336914, "global_step": 334855, "epoch": 1993} {"train_loss": -11.268404006958008, "global_step": 334856, "epoch": 1993} {"train_loss": -10.67172622680664, "global_step": 334857, "epoch": 1993} {"train_loss": -12.30769157409668, "global_step": 334858, "epoch": 1993} {"train_loss": -10.60213851928711, "global_step": 334859, "epoch": 1993} {"train_loss": -11.030704498291016, "global_step": 334860, "epoch": 1993} {"train_loss": -10.971946716308594, "global_step": 334861, "epoch": 1993} {"train_loss": -12.039694786071777, "global_step": 334862, "epoch": 1993} {"train_loss": -11.603858947753906, "global_step": 334863, "epoch": 1993} {"train_loss": -11.428228378295898, "global_step": 334864, "epoch": 1993} {"train_loss": -12.052112579345703, "global_step": 334865, "epoch": 1993} {"train_loss": -11.606056213378906, "global_step": 334866, "epoch": 1993} {"train_loss": -11.50156307220459, "global_step": 334867, "epoch": 1993} {"train_loss": -11.83979606628418, "global_step": 334868, "epoch": 1993} {"train_loss": -11.278564453125, "global_step": 334869, "epoch": 1993} {"train_loss": -11.62397575378418, "global_step": 334870, "epoch": 1993} {"train_loss": -11.595869064331055, "global_step": 334871, "epoch": 1993} {"train_loss": -11.03490161895752, "global_step": 334872, "epoch": 1993} {"train_loss": -11.116046905517578, "global_step": 334873, "epoch": 1993} {"train_loss": -11.66132926940918, "global_step": 334874, "epoch": 1993} {"train_loss": -11.528276443481445, "global_step": 334875, "epoch": 1993} {"train_loss": -11.557461738586426, "global_step": 334876, "epoch": 1993} {"train_loss": -10.863569259643555, "global_step": 334877, "epoch": 1993} {"train_loss": -11.83561897277832, "global_step": 334878, "epoch": 1993} {"train_loss": -11.162052154541016, "global_step": 334879, "epoch": 1993} {"train_loss": -11.391380310058594, "global_step": 334880, "epoch": 1993} {"train_loss": -11.47301197052002, "global_step": 334881, "epoch": 1993} {"train_loss": -11.416269302368164, "global_step": 334882, "epoch": 1993} {"train_loss": -11.774822235107422, "global_step": 334883, "epoch": 1993} {"train_loss": -11.764888763427734, "global_step": 334884, "epoch": 1993} {"train_loss": -12.151065826416016, "global_step": 334885, "epoch": 1993} {"train_loss": -12.22128677368164, "global_step": 334886, "epoch": 1993} {"train_loss": -11.700839042663574, "global_step": 334887, "epoch": 1993} {"train_loss": -12.145157814025879, "global_step": 334888, "epoch": 1993} {"train_loss": -11.946809768676758, "global_step": 334889, "epoch": 1993} {"train_loss": -12.239500045776367, "global_step": 334890, "epoch": 1993} {"train_loss": -11.929322242736816, "global_step": 334891, "epoch": 1993} {"train_loss": -12.293405532836914, "global_step": 334892, "epoch": 1993} {"train_loss": -12.01055908203125, "global_step": 334893, "epoch": 1993} {"train_loss": -11.646329879760742, "global_step": 334894, "epoch": 1993} {"train_loss": -12.12185287475586, "global_step": 334895, "epoch": 1993} {"train_loss": -12.141155242919922, "global_step": 334896, "epoch": 1993} {"train_loss": -12.13487434387207, "global_step": 334897, "epoch": 1993} {"train_loss": -12.378189086914062, "global_step": 334898, "epoch": 1993} {"train_loss": -12.384801864624023, "global_step": 334899, "epoch": 1993} {"train_loss": -12.241277694702148, "global_step": 334900, "epoch": 1993} {"train_loss": -12.115106582641602, "global_step": 334901, "epoch": 1993} {"train_loss": -12.037022590637207, "global_step": 334902, "epoch": 1993} {"train_loss": -12.142050743103027, "global_step": 334903, "epoch": 1993} {"train_loss": -12.29026985168457, "global_step": 334904, "epoch": 1993} {"train_loss": -12.16977310180664, "global_step": 334905, "epoch": 1993} {"train_loss": -12.372152328491211, "global_step": 334906, "epoch": 1993} {"train_loss": -12.325174331665039, "global_step": 334907, "epoch": 1993} {"train_loss": -12.370405197143555, "global_step": 334908, "epoch": 1993} {"train_loss": -12.271875381469727, "global_step": 334909, "epoch": 1993} {"train_loss": -11.887983322143555, "global_step": 334910, "epoch": 1993} {"train_loss": -12.41523551940918, "global_step": 334911, "epoch": 1993} {"train_loss": -12.080318450927734, "global_step": 334912, "epoch": 1993} {"train_loss": -12.11284065246582, "global_step": 334913, "epoch": 1993} {"train_loss": -11.781965255737305, "global_step": 334914, "epoch": 1993} {"train_loss": -12.00893783569336, "global_step": 334915, "epoch": 1993} {"train_loss": -11.983861923217773, "global_step": 334916, "epoch": 1993} {"train_loss": -12.08700180053711, "global_step": 334917, "epoch": 1993} {"train_loss": -12.249759674072266, "global_step": 334918, "epoch": 1993} {"train_loss": -12.4104642868042, "global_step": 334919, "epoch": 1993} {"train_loss": -12.118017196655273, "global_step": 334920, "epoch": 1993} {"train_loss": -11.886293411254883, "global_step": 334921, "epoch": 1993} {"train_loss": -12.226648330688477, "global_step": 334922, "epoch": 1993} {"train_loss": -12.044615745544434, "global_step": 334923, "epoch": 1993} {"train_loss": -12.372282981872559, "global_step": 334924, "epoch": 1993} {"train_loss": -12.218992233276367, "global_step": 334925, "epoch": 1993} {"train_loss": -11.907902717590332, "global_step": 334926, "epoch": 1993} {"train_loss": -12.095121383666992, "global_step": 334927, "epoch": 1993} {"train_loss": -11.453472137451172, "global_step": 334928, "epoch": 1993} {"train_loss": -11.895036697387695, "global_step": 334929, "epoch": 1993} {"train_loss": -11.73863697052002, "global_step": 334930, "epoch": 1993} {"train_loss": -12.331317901611328, "global_step": 334931, "epoch": 1993} {"train_loss": -11.356391906738281, "global_step": 334932, "epoch": 1993} {"train_loss": -12.162679672241211, "global_step": 334933, "epoch": 1993} {"train_loss": -11.686420440673828, "global_step": 334934, "epoch": 1993} {"train_loss": -11.00308609008789, "global_step": 334935, "epoch": 1993} {"train_loss": -11.965253829956055, "global_step": 334936, "epoch": 1993} {"train_loss": -10.740020751953125, "global_step": 334937, "epoch": 1993} {"train_loss": -11.349949836730957, "global_step": 334938, "epoch": 1993} {"train_loss": -11.018831253051758, "global_step": 334939, "epoch": 1993} {"train_loss": -8.990545272827148, "global_step": 334940, "epoch": 1993} {"train_loss": -10.065685272216797, "global_step": 334941, "epoch": 1993} {"train_loss": -10.84805965423584, "global_step": 334942, "epoch": 1993} {"train_loss": -10.779237747192383, "global_step": 334943, "epoch": 1993} {"train_loss": -10.717927932739258, "global_step": 334944, "epoch": 1993} {"train_loss": -11.90475845336914, "global_step": 334945, "epoch": 1993} {"train_loss": -10.852897644042969, "global_step": 334946, "epoch": 1993} {"train_loss": -11.022279739379883, "global_step": 334947, "epoch": 1993} {"train_loss": -11.307965278625488, "global_step": 334948, "epoch": 1993} {"train_loss": -10.165186882019043, "global_step": 334949, "epoch": 1993} {"train_loss": -12.009685516357422, "global_step": 334950, "epoch": 1993} {"train_loss": -10.95480728149414, "global_step": 334951, "epoch": 1993} {"train_loss": -11.574445724487305, "global_step": 334952, "epoch": 1993} {"train_loss": -11.595983505249023, "global_step": 334953, "epoch": 1993} {"train_loss": -10.688305854797363, "global_step": 334954, "epoch": 1993} {"train_loss": -11.985440254211426, "global_step": 334955, "epoch": 1993} {"train_loss": -11.243958473205566, "global_step": 334956, "epoch": 1993} {"train_loss": -11.089557647705078, "global_step": 334957, "epoch": 1993} {"train_loss": -11.961851119995117, "global_step": 334958, "epoch": 1993} {"train_loss": -11.14938735961914, "global_step": 334959, "epoch": 1993} {"train_loss": -12.034354209899902, "global_step": 334960, "epoch": 1993} {"train_loss": -11.864587783813477, "global_step": 334961, "epoch": 1993} {"train_loss": -11.556435585021973, "global_step": 334962, "epoch": 1993} {"train_loss": -11.99407958984375, "global_step": 334963, "epoch": 1993} {"train_loss": -11.820939064025879, "global_step": 334964, "epoch": 1993} {"train_loss": -12.148515701293945, "global_step": 334965, "epoch": 1993} {"train_loss": -11.925262451171875, "global_step": 334966, "epoch": 1993} {"train_loss": -12.144033432006836, "global_step": 334967, "epoch": 1993} {"train_loss": -11.914201736450195, "global_step": 334968, "epoch": 1993} {"train_loss": -12.062406539916992, "global_step": 334969, "epoch": 1993} {"train_loss": -11.83008098602295, "global_step": 334970, "epoch": 1993} {"train_loss": -11.0869140625, "global_step": 334971, "epoch": 1993} {"train_loss": -12.228858947753906, "global_step": 334972, "epoch": 1993} {"train_loss": -11.135562896728516, "global_step": 334973, "epoch": 1993} {"train_loss": -11.743505477905273, "global_step": 334974, "epoch": 1993} {"train_loss": -11.257135391235352, "global_step": 334975, "epoch": 1993} {"train_loss": -11.675209999084473, "global_step": 334976, "epoch": 1993} {"train_loss": -11.855684280395508, "global_step": 334977, "epoch": 1993} {"train_loss": -11.936203002929688, "global_step": 334978, "epoch": 1993} {"train_loss": -11.765134811401367, "global_step": 334979, "epoch": 1993} {"train_loss": -11.542919158935547, "global_step": 334980, "epoch": 1993} {"train_loss": -11.993722915649414, "global_step": 334981, "epoch": 1993} {"train_loss": -11.771538734436035, "global_step": 334982, "epoch": 1993} {"train_loss": -12.074408531188965, "global_step": 334983, "epoch": 1993} {"train_loss": -11.532772064208984, "global_step": 334984, "epoch": 1993} {"train_loss": -12.049505233764648, "global_step": 334985, "epoch": 1993} {"train_loss": -11.465547561645508, "global_step": 334986, "epoch": 1993} {"train_loss": -11.884482383728027, "global_step": 334987, "epoch": 1993} {"train_loss": -11.725522994995117, "global_step": 334988, "epoch": 1993} {"train_loss": -11.865663528442383, "global_step": 334989, "epoch": 1993} {"train_loss": -11.87904167175293, "global_step": 334990, "epoch": 1993} {"train_loss": -11.70060072058723, "global_step": 334991, "epoch": 1993, "val_loss": 287097.46875} {"train_loss": -11.720308303833008, "global_step": 334992, "epoch": 1994} {"train_loss": -11.214298248291016, "global_step": 334993, "epoch": 1994} {"train_loss": -11.990745544433594, "global_step": 334994, "epoch": 1994} {"train_loss": -11.917596817016602, "global_step": 334995, "epoch": 1994} {"train_loss": -12.072610855102539, "global_step": 334996, "epoch": 1994} {"train_loss": -12.138729095458984, "global_step": 334997, "epoch": 1994} {"train_loss": -12.189627647399902, "global_step": 334998, "epoch": 1994} {"train_loss": -12.230972290039062, "global_step": 334999, "epoch": 1994} {"train_loss": -12.098201751708984, "global_step": 335000, "epoch": 1994} {"train_loss": -12.26199722290039, "global_step": 335001, "epoch": 1994} {"train_loss": -12.3890962600708, "global_step": 335002, "epoch": 1994} {"train_loss": -12.219282150268555, "global_step": 335003, "epoch": 1994} {"train_loss": -12.236618041992188, "global_step": 335004, "epoch": 1994} {"train_loss": -12.142171859741211, "global_step": 335005, "epoch": 1994} {"train_loss": -12.287771224975586, "global_step": 335006, "epoch": 1994} {"train_loss": -11.561844825744629, "global_step": 335007, "epoch": 1994} {"train_loss": -12.419281005859375, "global_step": 335008, "epoch": 1994} {"train_loss": -12.18450927734375, "global_step": 335009, "epoch": 1994} {"train_loss": -12.096543312072754, "global_step": 335010, "epoch": 1994} {"train_loss": -12.11312484741211, "global_step": 335011, "epoch": 1994} {"train_loss": -12.319561004638672, "global_step": 335012, "epoch": 1994} {"train_loss": -12.428298950195312, "global_step": 335013, "epoch": 1994} {"train_loss": -12.338748931884766, "global_step": 335014, "epoch": 1994} {"train_loss": -12.342743873596191, "global_step": 335015, "epoch": 1994} {"train_loss": -12.421632766723633, "global_step": 335016, "epoch": 1994} {"train_loss": -12.355928421020508, "global_step": 335017, "epoch": 1994} {"train_loss": -12.298028945922852, "global_step": 335018, "epoch": 1994} {"train_loss": -12.42742919921875, "global_step": 335019, "epoch": 1994} {"train_loss": -12.09907341003418, "global_step": 335020, "epoch": 1994} {"train_loss": -12.186744689941406, "global_step": 335021, "epoch": 1994} {"train_loss": -12.213451385498047, "global_step": 335022, "epoch": 1994} {"train_loss": -12.177690505981445, "global_step": 335023, "epoch": 1994} {"train_loss": -12.285993576049805, "global_step": 335024, "epoch": 1994} {"train_loss": -12.110538482666016, "global_step": 335025, "epoch": 1994} {"train_loss": -11.789470672607422, "global_step": 335026, "epoch": 1994} {"train_loss": -12.14583969116211, "global_step": 335027, "epoch": 1994} {"train_loss": -12.215978622436523, "global_step": 335028, "epoch": 1994} {"train_loss": -11.971674919128418, "global_step": 335029, "epoch": 1994} {"train_loss": -12.262052536010742, "global_step": 335030, "epoch": 1994} {"train_loss": -12.171009063720703, "global_step": 335031, "epoch": 1994} {"train_loss": -12.490280151367188, "global_step": 335032, "epoch": 1994} {"train_loss": -12.21650505065918, "global_step": 335033, "epoch": 1994} {"train_loss": -12.400217056274414, "global_step": 335034, "epoch": 1994} {"train_loss": -12.476663589477539, "global_step": 335035, "epoch": 1994} {"train_loss": -12.325834274291992, "global_step": 335036, "epoch": 1994} {"train_loss": -12.59579086303711, "global_step": 335037, "epoch": 1994} {"train_loss": -12.416147232055664, "global_step": 335038, "epoch": 1994} {"train_loss": -12.183967590332031, "global_step": 335039, "epoch": 1994} {"train_loss": -12.060548782348633, "global_step": 335040, "epoch": 1994} {"train_loss": -12.40101432800293, "global_step": 335041, "epoch": 1994} {"train_loss": -12.088326454162598, "global_step": 335042, "epoch": 1994} {"train_loss": -12.508419036865234, "global_step": 335043, "epoch": 1994} {"train_loss": -12.214385032653809, "global_step": 335044, "epoch": 1994} {"train_loss": -12.618148803710938, "global_step": 335045, "epoch": 1994} {"train_loss": -12.336074829101562, "global_step": 335046, "epoch": 1994} {"train_loss": -12.32547378540039, "global_step": 335047, "epoch": 1994} {"train_loss": -12.283023834228516, "global_step": 335048, "epoch": 1994} {"train_loss": -12.18983268737793, "global_step": 335049, "epoch": 1994} {"train_loss": -12.319694519042969, "global_step": 335050, "epoch": 1994} {"train_loss": -12.780937194824219, "global_step": 335051, "epoch": 1994} {"train_loss": -12.523260116577148, "global_step": 335052, "epoch": 1994} {"train_loss": -12.749269485473633, "global_step": 335053, "epoch": 1994} {"train_loss": -12.58652114868164, "global_step": 335054, "epoch": 1994} {"train_loss": -12.339439392089844, "global_step": 335055, "epoch": 1994} {"train_loss": -12.097311019897461, "global_step": 335056, "epoch": 1994} {"train_loss": -12.508559226989746, "global_step": 335057, "epoch": 1994} {"train_loss": -12.219440460205078, "global_step": 335058, "epoch": 1994} {"train_loss": -12.412240982055664, "global_step": 335059, "epoch": 1994} {"train_loss": -12.236505508422852, "global_step": 335060, "epoch": 1994} {"train_loss": -12.153240203857422, "global_step": 335061, "epoch": 1994} {"train_loss": -12.175188064575195, "global_step": 335062, "epoch": 1994} {"train_loss": -11.948570251464844, "global_step": 335063, "epoch": 1994} {"train_loss": -11.03246021270752, "global_step": 335064, "epoch": 1994} {"train_loss": -12.076963424682617, "global_step": 335065, "epoch": 1994} {"train_loss": -11.01237678527832, "global_step": 335066, "epoch": 1994} {"train_loss": -9.937535285949707, "global_step": 335067, "epoch": 1994} {"train_loss": -12.275127410888672, "global_step": 335068, "epoch": 1994} {"train_loss": -8.019683837890625, "global_step": 335069, "epoch": 1994} {"train_loss": -11.59664535522461, "global_step": 335070, "epoch": 1994} {"train_loss": -8.93991756439209, "global_step": 335071, "epoch": 1994} {"train_loss": -9.572065353393555, "global_step": 335072, "epoch": 1994} {"train_loss": -10.945028305053711, "global_step": 335073, "epoch": 1994} {"train_loss": -10.152568817138672, "global_step": 335074, "epoch": 1994} {"train_loss": -9.44273567199707, "global_step": 335075, "epoch": 1994} {"train_loss": -10.555481910705566, "global_step": 335076, "epoch": 1994} {"train_loss": -10.94372272491455, "global_step": 335077, "epoch": 1994} {"train_loss": -9.973902702331543, "global_step": 335078, "epoch": 1994} {"train_loss": -10.879006385803223, "global_step": 335079, "epoch": 1994} {"train_loss": -11.418926239013672, "global_step": 335080, "epoch": 1994} {"train_loss": -10.760520935058594, "global_step": 335081, "epoch": 1994} {"train_loss": -9.69064712524414, "global_step": 335082, "epoch": 1994} {"train_loss": -11.725808143615723, "global_step": 335083, "epoch": 1994} {"train_loss": -10.058731079101562, "global_step": 335084, "epoch": 1994} {"train_loss": -11.937891960144043, "global_step": 335085, "epoch": 1994} {"train_loss": -10.216608047485352, "global_step": 335086, "epoch": 1994} {"train_loss": -11.41862678527832, "global_step": 335087, "epoch": 1994} {"train_loss": -9.27503776550293, "global_step": 335088, "epoch": 1994} {"train_loss": -11.624542236328125, "global_step": 335089, "epoch": 1994} {"train_loss": -9.4199800491333, "global_step": 335090, "epoch": 1994} {"train_loss": -9.443422317504883, "global_step": 335091, "epoch": 1994} {"train_loss": -10.83731460571289, "global_step": 335092, "epoch": 1994} {"train_loss": -10.603605270385742, "global_step": 335093, "epoch": 1994} {"train_loss": -10.511659622192383, "global_step": 335094, "epoch": 1994} {"train_loss": -10.188496589660645, "global_step": 335095, "epoch": 1994} {"train_loss": -10.912942886352539, "global_step": 335096, "epoch": 1994} {"train_loss": -9.34721565246582, "global_step": 335097, "epoch": 1994} {"train_loss": -11.758307456970215, "global_step": 335098, "epoch": 1994} {"train_loss": -10.48243522644043, "global_step": 335099, "epoch": 1994} {"train_loss": -10.589168548583984, "global_step": 335100, "epoch": 1994} {"train_loss": -11.641658782958984, "global_step": 335101, "epoch": 1994} {"train_loss": -10.847099304199219, "global_step": 335102, "epoch": 1994} {"train_loss": -11.354491233825684, "global_step": 335103, "epoch": 1994} {"train_loss": -11.815568923950195, "global_step": 335104, "epoch": 1994} {"train_loss": -11.208423614501953, "global_step": 335105, "epoch": 1994} {"train_loss": -11.291973114013672, "global_step": 335106, "epoch": 1994} {"train_loss": -11.66537094116211, "global_step": 335107, "epoch": 1994} {"train_loss": -11.253478050231934, "global_step": 335108, "epoch": 1994} {"train_loss": -11.268064498901367, "global_step": 335109, "epoch": 1994} {"train_loss": -11.866313934326172, "global_step": 335110, "epoch": 1994} {"train_loss": -11.290157318115234, "global_step": 335111, "epoch": 1994} {"train_loss": -11.59379768371582, "global_step": 335112, "epoch": 1994} {"train_loss": -11.560148239135742, "global_step": 335113, "epoch": 1994} {"train_loss": -11.678741455078125, "global_step": 335114, "epoch": 1994} {"train_loss": -11.9303617477417, "global_step": 335115, "epoch": 1994} {"train_loss": -11.63309097290039, "global_step": 335116, "epoch": 1994} {"train_loss": -11.881223678588867, "global_step": 335117, "epoch": 1994} {"train_loss": -11.866265296936035, "global_step": 335118, "epoch": 1994} {"train_loss": -11.800551414489746, "global_step": 335119, "epoch": 1994} {"train_loss": -11.988304138183594, "global_step": 335120, "epoch": 1994} {"train_loss": -11.869464874267578, "global_step": 335121, "epoch": 1994} {"train_loss": -12.016792297363281, "global_step": 335122, "epoch": 1994} {"train_loss": -12.066750526428223, "global_step": 335123, "epoch": 1994} {"train_loss": -12.18653678894043, "global_step": 335124, "epoch": 1994} {"train_loss": -11.8842134475708, "global_step": 335125, "epoch": 1994} {"train_loss": -12.089683532714844, "global_step": 335126, "epoch": 1994} {"train_loss": -12.15179443359375, "global_step": 335127, "epoch": 1994} {"train_loss": -12.230180740356445, "global_step": 335128, "epoch": 1994} {"train_loss": -12.147199630737305, "global_step": 335129, "epoch": 1994} {"train_loss": -12.176431655883789, "global_step": 335130, "epoch": 1994} {"train_loss": -12.178349494934082, "global_step": 335131, "epoch": 1994} {"train_loss": -12.073182106018066, "global_step": 335132, "epoch": 1994} {"train_loss": -12.328475952148438, "global_step": 335133, "epoch": 1994} {"train_loss": -12.152199745178223, "global_step": 335134, "epoch": 1994} {"train_loss": -12.313262939453125, "global_step": 335135, "epoch": 1994} {"train_loss": -12.334232330322266, "global_step": 335136, "epoch": 1994} {"train_loss": -12.225805282592773, "global_step": 335137, "epoch": 1994} {"train_loss": -12.372016906738281, "global_step": 335138, "epoch": 1994} {"train_loss": -12.192559242248535, "global_step": 335139, "epoch": 1994} {"train_loss": -12.320112228393555, "global_step": 335140, "epoch": 1994} {"train_loss": -12.23318099975586, "global_step": 335141, "epoch": 1994} {"train_loss": -12.153948783874512, "global_step": 335142, "epoch": 1994} {"train_loss": -12.411664962768555, "global_step": 335143, "epoch": 1994} {"train_loss": -12.327583312988281, "global_step": 335144, "epoch": 1994} {"train_loss": -12.489006996154785, "global_step": 335145, "epoch": 1994} {"train_loss": -12.465982437133789, "global_step": 335146, "epoch": 1994} {"train_loss": -12.545108795166016, "global_step": 335147, "epoch": 1994} {"train_loss": -12.324848175048828, "global_step": 335148, "epoch": 1994} {"train_loss": -12.411794662475586, "global_step": 335149, "epoch": 1994} {"train_loss": -12.391831398010254, "global_step": 335150, "epoch": 1994} {"train_loss": -12.489501953125, "global_step": 335151, "epoch": 1994} {"train_loss": -12.531194686889648, "global_step": 335152, "epoch": 1994} {"train_loss": -12.412559509277344, "global_step": 335153, "epoch": 1994} {"train_loss": -12.519619941711426, "global_step": 335154, "epoch": 1994} {"train_loss": -12.651185989379883, "global_step": 335155, "epoch": 1994} {"train_loss": -12.478753089904785, "global_step": 335156, "epoch": 1994} {"train_loss": -12.480990409851074, "global_step": 335157, "epoch": 1994} {"train_loss": -12.404219627380371, "global_step": 335158, "epoch": 1994} {"train_loss": -11.797089355332512, "global_step": 335159, "epoch": 1994, "val_loss": 288519.0625} {"train_loss": -12.559686660766602, "global_step": 335160, "epoch": 1995} {"train_loss": -12.508071899414062, "global_step": 335161, "epoch": 1995} {"train_loss": -12.715128898620605, "global_step": 335162, "epoch": 1995} {"train_loss": -12.508933067321777, "global_step": 335163, "epoch": 1995} {"train_loss": -12.482873916625977, "global_step": 335164, "epoch": 1995} {"train_loss": -12.445344924926758, "global_step": 335165, "epoch": 1995} {"train_loss": -12.224372863769531, "global_step": 335166, "epoch": 1995} {"train_loss": -12.611175537109375, "global_step": 335167, "epoch": 1995} {"train_loss": -12.521814346313477, "global_step": 335168, "epoch": 1995} {"train_loss": -12.501354217529297, "global_step": 335169, "epoch": 1995} {"train_loss": -12.435579299926758, "global_step": 335170, "epoch": 1995} {"train_loss": -12.657147407531738, "global_step": 335171, "epoch": 1995} {"train_loss": -12.391685485839844, "global_step": 335172, "epoch": 1995} {"train_loss": -12.149862289428711, "global_step": 335173, "epoch": 1995} {"train_loss": -12.192304611206055, "global_step": 335174, "epoch": 1995} {"train_loss": -12.34011459350586, "global_step": 335175, "epoch": 1995} {"train_loss": -12.46139907836914, "global_step": 335176, "epoch": 1995} {"train_loss": -12.603897094726562, "global_step": 335177, "epoch": 1995} {"train_loss": -12.266592025756836, "global_step": 335178, "epoch": 1995} {"train_loss": -12.480525016784668, "global_step": 335179, "epoch": 1995} {"train_loss": -12.476983070373535, "global_step": 335180, "epoch": 1995} {"train_loss": -12.542623519897461, "global_step": 335181, "epoch": 1995} {"train_loss": -12.297853469848633, "global_step": 335182, "epoch": 1995} {"train_loss": -12.05402946472168, "global_step": 335183, "epoch": 1995} {"train_loss": -12.176642417907715, "global_step": 335184, "epoch": 1995} {"train_loss": -12.508996963500977, "global_step": 335185, "epoch": 1995} {"train_loss": -12.071520805358887, "global_step": 335186, "epoch": 1995} {"train_loss": -11.853311538696289, "global_step": 335187, "epoch": 1995} {"train_loss": -12.175962448120117, "global_step": 335188, "epoch": 1995} {"train_loss": -12.588153839111328, "global_step": 335189, "epoch": 1995} {"train_loss": -12.414239883422852, "global_step": 335190, "epoch": 1995} {"train_loss": -11.631487846374512, "global_step": 335191, "epoch": 1995} {"train_loss": -11.854362487792969, "global_step": 335192, "epoch": 1995} {"train_loss": -12.56488037109375, "global_step": 335193, "epoch": 1995} {"train_loss": -12.53499984741211, "global_step": 335194, "epoch": 1995} {"train_loss": -11.572587966918945, "global_step": 335195, "epoch": 1995} {"train_loss": -11.646240234375, "global_step": 335196, "epoch": 1995} {"train_loss": -11.655868530273438, "global_step": 335197, "epoch": 1995} {"train_loss": -12.224494934082031, "global_step": 335198, "epoch": 1995} {"train_loss": -10.340893745422363, "global_step": 335199, "epoch": 1995} {"train_loss": -11.989082336425781, "global_step": 335200, "epoch": 1995} {"train_loss": -9.776350975036621, "global_step": 335201, "epoch": 1995} {"train_loss": -11.231515884399414, "global_step": 335202, "epoch": 1995} {"train_loss": -10.227190017700195, "global_step": 335203, "epoch": 1995} {"train_loss": -11.280142784118652, "global_step": 335204, "epoch": 1995} {"train_loss": -10.840624809265137, "global_step": 335205, "epoch": 1995} {"train_loss": -10.194941520690918, "global_step": 335206, "epoch": 1995} {"train_loss": -11.006794929504395, "global_step": 335207, "epoch": 1995} {"train_loss": -10.603494644165039, "global_step": 335208, "epoch": 1995} {"train_loss": -10.509028434753418, "global_step": 335209, "epoch": 1995} {"train_loss": -11.671401977539062, "global_step": 335210, "epoch": 1995} {"train_loss": -10.026527404785156, "global_step": 335211, "epoch": 1995} {"train_loss": -11.523368835449219, "global_step": 335212, "epoch": 1995} {"train_loss": -10.947433471679688, "global_step": 335213, "epoch": 1995} {"train_loss": -10.826484680175781, "global_step": 335214, "epoch": 1995} {"train_loss": -11.706989288330078, "global_step": 335215, "epoch": 1995} {"train_loss": -10.952155113220215, "global_step": 335216, "epoch": 1995} {"train_loss": -11.542552947998047, "global_step": 335217, "epoch": 1995} {"train_loss": -11.591728210449219, "global_step": 335218, "epoch": 1995} {"train_loss": -11.027566909790039, "global_step": 335219, "epoch": 1995} {"train_loss": -12.044771194458008, "global_step": 335220, "epoch": 1995} {"train_loss": -10.367005348205566, "global_step": 335221, "epoch": 1995} {"train_loss": -11.637947082519531, "global_step": 335222, "epoch": 1995} {"train_loss": -11.188149452209473, "global_step": 335223, "epoch": 1995} {"train_loss": -11.044992446899414, "global_step": 335224, "epoch": 1995} {"train_loss": -11.329996109008789, "global_step": 335225, "epoch": 1995} {"train_loss": -11.175681114196777, "global_step": 335226, "epoch": 1995} {"train_loss": -11.657171249389648, "global_step": 335227, "epoch": 1995} {"train_loss": -11.040096282958984, "global_step": 335228, "epoch": 1995} {"train_loss": -11.513151168823242, "global_step": 335229, "epoch": 1995} {"train_loss": -11.071453094482422, "global_step": 335230, "epoch": 1995} {"train_loss": -11.738466262817383, "global_step": 335231, "epoch": 1995} {"train_loss": -11.2833890914917, "global_step": 335232, "epoch": 1995} {"train_loss": -11.714420318603516, "global_step": 335233, "epoch": 1995} {"train_loss": -11.64267349243164, "global_step": 335234, "epoch": 1995} {"train_loss": -11.669401168823242, "global_step": 335235, "epoch": 1995} {"train_loss": -11.539101600646973, "global_step": 335236, "epoch": 1995} {"train_loss": -11.456306457519531, "global_step": 335237, "epoch": 1995} {"train_loss": -11.961400985717773, "global_step": 335238, "epoch": 1995} {"train_loss": -11.778444290161133, "global_step": 335239, "epoch": 1995} {"train_loss": -12.093559265136719, "global_step": 335240, "epoch": 1995} {"train_loss": -11.696927070617676, "global_step": 335241, "epoch": 1995} {"train_loss": -11.695600509643555, "global_step": 335242, "epoch": 1995} {"train_loss": -11.982463836669922, "global_step": 335243, "epoch": 1995} {"train_loss": -11.462698936462402, "global_step": 335244, "epoch": 1995} {"train_loss": -11.952106475830078, "global_step": 335245, "epoch": 1995} {"train_loss": -11.366620063781738, "global_step": 335246, "epoch": 1995} {"train_loss": -11.785030364990234, "global_step": 335247, "epoch": 1995} {"train_loss": -11.794710159301758, "global_step": 335248, "epoch": 1995} {"train_loss": -12.007709503173828, "global_step": 335249, "epoch": 1995} {"train_loss": -11.775819778442383, "global_step": 335250, "epoch": 1995} {"train_loss": -11.563726425170898, "global_step": 335251, "epoch": 1995} {"train_loss": -11.49055290222168, "global_step": 335252, "epoch": 1995} {"train_loss": -12.154677391052246, "global_step": 335253, "epoch": 1995} {"train_loss": -12.209301948547363, "global_step": 335254, "epoch": 1995} {"train_loss": -12.176812171936035, "global_step": 335255, "epoch": 1995} {"train_loss": -11.953057289123535, "global_step": 335256, "epoch": 1995} {"train_loss": -11.898941040039062, "global_step": 335257, "epoch": 1995} {"train_loss": -11.995866775512695, "global_step": 335258, "epoch": 1995} {"train_loss": -12.211620330810547, "global_step": 335259, "epoch": 1995} {"train_loss": -12.2073335647583, "global_step": 335260, "epoch": 1995} {"train_loss": -12.256339073181152, "global_step": 335261, "epoch": 1995} {"train_loss": -12.004888534545898, "global_step": 335262, "epoch": 1995} {"train_loss": -12.341446876525879, "global_step": 335263, "epoch": 1995} {"train_loss": -11.912728309631348, "global_step": 335264, "epoch": 1995} {"train_loss": -12.282872200012207, "global_step": 335265, "epoch": 1995} {"train_loss": -12.210311889648438, "global_step": 335266, "epoch": 1995} {"train_loss": -12.105985641479492, "global_step": 335267, "epoch": 1995} {"train_loss": -12.25593090057373, "global_step": 335268, "epoch": 1995} {"train_loss": -12.223947525024414, "global_step": 335269, "epoch": 1995} {"train_loss": -12.722625732421875, "global_step": 335270, "epoch": 1995} {"train_loss": -12.239142417907715, "global_step": 335271, "epoch": 1995} {"train_loss": -12.214896202087402, "global_step": 335272, "epoch": 1995} {"train_loss": -12.192869186401367, "global_step": 335273, "epoch": 1995} {"train_loss": -12.317573547363281, "global_step": 335274, "epoch": 1995} {"train_loss": -12.292204856872559, "global_step": 335275, "epoch": 1995} {"train_loss": -12.182068824768066, "global_step": 335276, "epoch": 1995} {"train_loss": -12.274343490600586, "global_step": 335277, "epoch": 1995} {"train_loss": -12.311761856079102, "global_step": 335278, "epoch": 1995} {"train_loss": -12.252143859863281, "global_step": 335279, "epoch": 1995} {"train_loss": -12.264201164245605, "global_step": 335280, "epoch": 1995} {"train_loss": -12.096059799194336, "global_step": 335281, "epoch": 1995} {"train_loss": -12.24112606048584, "global_step": 335282, "epoch": 1995} {"train_loss": -12.055727005004883, "global_step": 335283, "epoch": 1995} {"train_loss": -12.395139694213867, "global_step": 335284, "epoch": 1995} {"train_loss": -12.249405860900879, "global_step": 335285, "epoch": 1995} {"train_loss": -11.776496887207031, "global_step": 335286, "epoch": 1995} {"train_loss": -12.335536003112793, "global_step": 335287, "epoch": 1995} {"train_loss": -12.097058296203613, "global_step": 335288, "epoch": 1995} {"train_loss": -12.406240463256836, "global_step": 335289, "epoch": 1995} {"train_loss": -12.346881866455078, "global_step": 335290, "epoch": 1995} {"train_loss": -12.3836669921875, "global_step": 335291, "epoch": 1995} {"train_loss": -12.47468090057373, "global_step": 335292, "epoch": 1995} {"train_loss": -12.457098960876465, "global_step": 335293, "epoch": 1995} {"train_loss": -12.452415466308594, "global_step": 335294, "epoch": 1995} {"train_loss": -12.466097831726074, "global_step": 335295, "epoch": 1995} {"train_loss": -12.409006118774414, "global_step": 335296, "epoch": 1995} {"train_loss": -12.4911527633667, "global_step": 335297, "epoch": 1995} {"train_loss": -12.619333267211914, "global_step": 335298, "epoch": 1995} {"train_loss": -12.521993637084961, "global_step": 335299, "epoch": 1995} {"train_loss": -12.549625396728516, "global_step": 335300, "epoch": 1995} {"train_loss": -12.562302589416504, "global_step": 335301, "epoch": 1995} {"train_loss": -12.45485782623291, "global_step": 335302, "epoch": 1995} {"train_loss": -12.602828979492188, "global_step": 335303, "epoch": 1995} {"train_loss": -12.346424102783203, "global_step": 335304, "epoch": 1995} {"train_loss": -12.481348037719727, "global_step": 335305, "epoch": 1995} {"train_loss": -12.453588485717773, "global_step": 335306, "epoch": 1995} {"train_loss": -12.485126495361328, "global_step": 335307, "epoch": 1995} {"train_loss": -12.20820426940918, "global_step": 335308, "epoch": 1995} {"train_loss": -12.638664245605469, "global_step": 335309, "epoch": 1995} {"train_loss": -12.46856689453125, "global_step": 335310, "epoch": 1995} {"train_loss": -12.272680282592773, "global_step": 335311, "epoch": 1995} {"train_loss": -12.40961742401123, "global_step": 335312, "epoch": 1995} {"train_loss": -12.592948913574219, "global_step": 335313, "epoch": 1995} {"train_loss": -12.584494590759277, "global_step": 335314, "epoch": 1995} {"train_loss": -12.488807678222656, "global_step": 335315, "epoch": 1995} {"train_loss": -12.532039642333984, "global_step": 335316, "epoch": 1995} {"train_loss": -12.425140380859375, "global_step": 335317, "epoch": 1995} {"train_loss": -12.490081787109375, "global_step": 335318, "epoch": 1995} {"train_loss": -12.424676895141602, "global_step": 335319, "epoch": 1995} {"train_loss": -12.598245620727539, "global_step": 335320, "epoch": 1995} {"train_loss": -12.59213924407959, "global_step": 335321, "epoch": 1995} {"train_loss": -12.544581413269043, "global_step": 335322, "epoch": 1995} {"train_loss": -12.440207481384277, "global_step": 335323, "epoch": 1995} {"train_loss": -12.192432403564453, "global_step": 335324, "epoch": 1995} {"train_loss": -12.619930267333984, "global_step": 335325, "epoch": 1995} {"train_loss": -12.325773239135742, "global_step": 335326, "epoch": 1995} {"train_loss": -12.003391492934455, "global_step": 335327, "epoch": 1995, "val_loss": 288697.84375, "train_action_mse_error": 4.352718830108643} {"train_loss": -12.22408676147461, "global_step": 335328, "epoch": 1996} {"train_loss": -11.974681854248047, "global_step": 335329, "epoch": 1996} {"train_loss": -11.848182678222656, "global_step": 335330, "epoch": 1996} {"train_loss": -12.252038955688477, "global_step": 335331, "epoch": 1996} {"train_loss": -12.171491622924805, "global_step": 335332, "epoch": 1996} {"train_loss": -12.258355140686035, "global_step": 335333, "epoch": 1996} {"train_loss": -10.955190658569336, "global_step": 335334, "epoch": 1996} {"train_loss": -10.829397201538086, "global_step": 335335, "epoch": 1996} {"train_loss": -10.66290283203125, "global_step": 335336, "epoch": 1996} {"train_loss": -12.274234771728516, "global_step": 335337, "epoch": 1996} {"train_loss": -11.556625366210938, "global_step": 335338, "epoch": 1996} {"train_loss": -11.09124755859375, "global_step": 335339, "epoch": 1996} {"train_loss": -11.988237380981445, "global_step": 335340, "epoch": 1996} {"train_loss": -8.44961166381836, "global_step": 335341, "epoch": 1996} {"train_loss": -10.331852912902832, "global_step": 335342, "epoch": 1996} {"train_loss": -9.496835708618164, "global_step": 335343, "epoch": 1996} {"train_loss": -8.591864585876465, "global_step": 335344, "epoch": 1996} {"train_loss": -9.03286361694336, "global_step": 335345, "epoch": 1996} {"train_loss": -10.309137344360352, "global_step": 335346, "epoch": 1996} {"train_loss": -7.015344619750977, "global_step": 335347, "epoch": 1996} {"train_loss": -9.816850662231445, "global_step": 335348, "epoch": 1996} {"train_loss": -8.291644096374512, "global_step": 335349, "epoch": 1996} {"train_loss": -9.11525821685791, "global_step": 335350, "epoch": 1996} {"train_loss": -7.4323859214782715, "global_step": 335351, "epoch": 1996} {"train_loss": -7.3979902267456055, "global_step": 335352, "epoch": 1996} {"train_loss": -6.758174419403076, "global_step": 335353, "epoch": 1996} {"train_loss": -7.927430152893066, "global_step": 335354, "epoch": 1996} {"train_loss": -8.809088706970215, "global_step": 335355, "epoch": 1996} {"train_loss": -8.974178314208984, "global_step": 335356, "epoch": 1996} {"train_loss": -8.04764175415039, "global_step": 335357, "epoch": 1996} {"train_loss": -9.458370208740234, "global_step": 335358, "epoch": 1996} {"train_loss": -9.419681549072266, "global_step": 335359, "epoch": 1996} {"train_loss": -8.9074125289917, "global_step": 335360, "epoch": 1996} {"train_loss": -8.917498588562012, "global_step": 335361, "epoch": 1996} {"train_loss": -11.094836235046387, "global_step": 335362, "epoch": 1996} {"train_loss": -8.976680755615234, "global_step": 335363, "epoch": 1996} {"train_loss": -10.360121726989746, "global_step": 335364, "epoch": 1996} {"train_loss": -10.435880661010742, "global_step": 335365, "epoch": 1996} {"train_loss": -10.659967422485352, "global_step": 335366, "epoch": 1996} {"train_loss": -10.830236434936523, "global_step": 335367, "epoch": 1996} {"train_loss": -10.609321594238281, "global_step": 335368, "epoch": 1996} {"train_loss": -11.223358154296875, "global_step": 335369, "epoch": 1996} {"train_loss": -11.46927547454834, "global_step": 335370, "epoch": 1996} {"train_loss": -11.041194915771484, "global_step": 335371, "epoch": 1996} {"train_loss": -11.51250171661377, "global_step": 335372, "epoch": 1996} {"train_loss": -11.260663032531738, "global_step": 335373, "epoch": 1996} {"train_loss": -11.425115585327148, "global_step": 335374, "epoch": 1996} {"train_loss": -11.361456871032715, "global_step": 335375, "epoch": 1996} {"train_loss": -11.535615921020508, "global_step": 335376, "epoch": 1996} {"train_loss": -11.728231430053711, "global_step": 335377, "epoch": 1996} {"train_loss": -11.616899490356445, "global_step": 335378, "epoch": 1996} {"train_loss": -12.030872344970703, "global_step": 335379, "epoch": 1996} {"train_loss": -11.893514633178711, "global_step": 335380, "epoch": 1996} {"train_loss": -11.792943954467773, "global_step": 335381, "epoch": 1996} {"train_loss": -11.922414779663086, "global_step": 335382, "epoch": 1996} {"train_loss": -11.784404754638672, "global_step": 335383, "epoch": 1996} {"train_loss": -11.657557487487793, "global_step": 335384, "epoch": 1996} {"train_loss": -11.78005599975586, "global_step": 335385, "epoch": 1996} {"train_loss": -11.917693138122559, "global_step": 335386, "epoch": 1996} {"train_loss": -11.745022773742676, "global_step": 335387, "epoch": 1996} {"train_loss": -11.789556503295898, "global_step": 335388, "epoch": 1996} {"train_loss": -12.128433227539062, "global_step": 335389, "epoch": 1996} {"train_loss": -11.741941452026367, "global_step": 335390, "epoch": 1996} {"train_loss": -11.934341430664062, "global_step": 335391, "epoch": 1996} {"train_loss": -12.023050308227539, "global_step": 335392, "epoch": 1996} {"train_loss": -11.859728813171387, "global_step": 335393, "epoch": 1996} {"train_loss": -12.054740905761719, "global_step": 335394, "epoch": 1996} {"train_loss": -12.24892807006836, "global_step": 335395, "epoch": 1996} {"train_loss": -12.022713661193848, "global_step": 335396, "epoch": 1996} {"train_loss": -12.16168212890625, "global_step": 335397, "epoch": 1996} {"train_loss": -11.970398902893066, "global_step": 335398, "epoch": 1996} {"train_loss": -12.208063125610352, "global_step": 335399, "epoch": 1996} {"train_loss": -11.76628303527832, "global_step": 335400, "epoch": 1996} {"train_loss": -11.952252388000488, "global_step": 335401, "epoch": 1996} {"train_loss": -11.96584701538086, "global_step": 335402, "epoch": 1996} {"train_loss": -12.300958633422852, "global_step": 335403, "epoch": 1996} {"train_loss": -12.16458511352539, "global_step": 335404, "epoch": 1996} {"train_loss": -12.285100936889648, "global_step": 335405, "epoch": 1996} {"train_loss": -12.142374038696289, "global_step": 335406, "epoch": 1996} {"train_loss": -12.303800582885742, "global_step": 335407, "epoch": 1996} {"train_loss": -11.99588680267334, "global_step": 335408, "epoch": 1996} {"train_loss": -12.346630096435547, "global_step": 335409, "epoch": 1996} {"train_loss": -12.270956993103027, "global_step": 335410, "epoch": 1996} {"train_loss": -12.154016494750977, "global_step": 335411, "epoch": 1996} {"train_loss": -12.238641738891602, "global_step": 335412, "epoch": 1996} {"train_loss": -12.317429542541504, "global_step": 335413, "epoch": 1996} {"train_loss": -12.13496208190918, "global_step": 335414, "epoch": 1996} {"train_loss": -12.311264038085938, "global_step": 335415, "epoch": 1996} {"train_loss": -12.354637145996094, "global_step": 335416, "epoch": 1996} {"train_loss": -12.040943145751953, "global_step": 335417, "epoch": 1996} {"train_loss": -12.429997444152832, "global_step": 335418, "epoch": 1996} {"train_loss": -12.284463882446289, "global_step": 335419, "epoch": 1996} {"train_loss": -12.42908763885498, "global_step": 335420, "epoch": 1996} {"train_loss": -12.062383651733398, "global_step": 335421, "epoch": 1996} {"train_loss": -12.449902534484863, "global_step": 335422, "epoch": 1996} {"train_loss": -12.381490707397461, "global_step": 335423, "epoch": 1996} {"train_loss": -12.61504077911377, "global_step": 335424, "epoch": 1996} {"train_loss": -12.506875991821289, "global_step": 335425, "epoch": 1996} {"train_loss": -12.507255554199219, "global_step": 335426, "epoch": 1996} {"train_loss": -12.298078536987305, "global_step": 335427, "epoch": 1996} {"train_loss": -12.176735877990723, "global_step": 335428, "epoch": 1996} {"train_loss": -12.174432754516602, "global_step": 335429, "epoch": 1996} {"train_loss": -12.439058303833008, "global_step": 335430, "epoch": 1996} {"train_loss": -12.510982513427734, "global_step": 335431, "epoch": 1996} {"train_loss": -12.29011344909668, "global_step": 335432, "epoch": 1996} {"train_loss": -12.470510482788086, "global_step": 335433, "epoch": 1996} {"train_loss": -12.532495498657227, "global_step": 335434, "epoch": 1996} {"train_loss": -12.268312454223633, "global_step": 335435, "epoch": 1996} {"train_loss": -12.417007446289062, "global_step": 335436, "epoch": 1996} {"train_loss": -12.390769004821777, "global_step": 335437, "epoch": 1996} {"train_loss": -12.682251930236816, "global_step": 335438, "epoch": 1996} {"train_loss": -12.565244674682617, "global_step": 335439, "epoch": 1996} {"train_loss": -12.53062915802002, "global_step": 335440, "epoch": 1996} {"train_loss": -12.671218872070312, "global_step": 335441, "epoch": 1996} {"train_loss": -12.414813995361328, "global_step": 335442, "epoch": 1996} {"train_loss": -12.328742980957031, "global_step": 335443, "epoch": 1996} {"train_loss": -12.652767181396484, "global_step": 335444, "epoch": 1996} {"train_loss": -12.596671104431152, "global_step": 335445, "epoch": 1996} {"train_loss": -12.326597213745117, "global_step": 335446, "epoch": 1996} {"train_loss": -12.608758926391602, "global_step": 335447, "epoch": 1996} {"train_loss": -12.416440963745117, "global_step": 335448, "epoch": 1996} {"train_loss": -12.61262321472168, "global_step": 335449, "epoch": 1996} {"train_loss": -12.488229751586914, "global_step": 335450, "epoch": 1996} {"train_loss": -12.426101684570312, "global_step": 335451, "epoch": 1996} {"train_loss": -12.308370590209961, "global_step": 335452, "epoch": 1996} {"train_loss": -12.489917755126953, "global_step": 335453, "epoch": 1996} {"train_loss": -12.347882270812988, "global_step": 335454, "epoch": 1996} {"train_loss": -12.612356185913086, "global_step": 335455, "epoch": 1996} {"train_loss": -12.624099731445312, "global_step": 335456, "epoch": 1996} {"train_loss": -12.51768684387207, "global_step": 335457, "epoch": 1996} {"train_loss": -12.642349243164062, "global_step": 335458, "epoch": 1996} {"train_loss": -12.548531532287598, "global_step": 335459, "epoch": 1996} {"train_loss": -12.566774368286133, "global_step": 335460, "epoch": 1996} {"train_loss": -12.426175117492676, "global_step": 335461, "epoch": 1996} {"train_loss": -12.21685791015625, "global_step": 335462, "epoch": 1996} {"train_loss": -12.01053237915039, "global_step": 335463, "epoch": 1996} {"train_loss": -12.669946670532227, "global_step": 335464, "epoch": 1996} {"train_loss": -12.528148651123047, "global_step": 335465, "epoch": 1996} {"train_loss": -12.419846534729004, "global_step": 335466, "epoch": 1996} {"train_loss": -11.830061912536621, "global_step": 335467, "epoch": 1996} {"train_loss": -12.067118644714355, "global_step": 335468, "epoch": 1996} {"train_loss": -11.907491683959961, "global_step": 335469, "epoch": 1996} {"train_loss": -12.371410369873047, "global_step": 335470, "epoch": 1996} {"train_loss": -11.273443222045898, "global_step": 335471, "epoch": 1996} {"train_loss": -10.380232810974121, "global_step": 335472, "epoch": 1996} {"train_loss": -10.607349395751953, "global_step": 335473, "epoch": 1996} {"train_loss": -9.817230224609375, "global_step": 335474, "epoch": 1996} {"train_loss": -8.761754035949707, "global_step": 335475, "epoch": 1996} {"train_loss": -9.278592109680176, "global_step": 335476, "epoch": 1996} {"train_loss": -9.944369316101074, "global_step": 335477, "epoch": 1996} {"train_loss": -10.714813232421875, "global_step": 335478, "epoch": 1996} {"train_loss": -9.055912971496582, "global_step": 335479, "epoch": 1996} {"train_loss": -11.974075317382812, "global_step": 335480, "epoch": 1996} {"train_loss": -9.710700035095215, "global_step": 335481, "epoch": 1996} {"train_loss": -10.961365699768066, "global_step": 335482, "epoch": 1996} {"train_loss": -11.362215042114258, "global_step": 335483, "epoch": 1996} {"train_loss": -9.96243667602539, "global_step": 335484, "epoch": 1996} {"train_loss": -11.57101821899414, "global_step": 335485, "epoch": 1996} {"train_loss": -10.660463333129883, "global_step": 335486, "epoch": 1996} {"train_loss": -11.344976425170898, "global_step": 335487, "epoch": 1996} {"train_loss": -11.153352737426758, "global_step": 335488, "epoch": 1996} {"train_loss": -11.05514907836914, "global_step": 335489, "epoch": 1996} {"train_loss": -10.611006736755371, "global_step": 335490, "epoch": 1996} {"train_loss": -11.021829605102539, "global_step": 335491, "epoch": 1996} {"train_loss": -9.084907531738281, "global_step": 335492, "epoch": 1996} {"train_loss": -11.676355361938477, "global_step": 335493, "epoch": 1996} {"train_loss": -10.072433471679688, "global_step": 335494, "epoch": 1996} {"train_loss": -11.379141296659197, "global_step": 335495, "epoch": 1996, "val_loss": 284136.375} {"train_loss": -10.092262268066406, "global_step": 335496, "epoch": 1997} {"train_loss": -8.423192977905273, "global_step": 335497, "epoch": 1997} {"train_loss": -8.905217170715332, "global_step": 335498, "epoch": 1997} {"train_loss": -10.700008392333984, "global_step": 335499, "epoch": 1997} {"train_loss": -10.245882034301758, "global_step": 335500, "epoch": 1997} {"train_loss": -10.960612297058105, "global_step": 335501, "epoch": 1997} {"train_loss": -10.737226486206055, "global_step": 335502, "epoch": 1997} {"train_loss": -11.303004264831543, "global_step": 335503, "epoch": 1997} {"train_loss": -9.950233459472656, "global_step": 335504, "epoch": 1997} {"train_loss": -10.86129093170166, "global_step": 335505, "epoch": 1997} {"train_loss": -11.418144226074219, "global_step": 335506, "epoch": 1997} {"train_loss": -10.18826675415039, "global_step": 335507, "epoch": 1997} {"train_loss": -11.500431060791016, "global_step": 335508, "epoch": 1997} {"train_loss": -10.888162612915039, "global_step": 335509, "epoch": 1997} {"train_loss": -11.088508605957031, "global_step": 335510, "epoch": 1997} {"train_loss": -11.83873176574707, "global_step": 335511, "epoch": 1997} {"train_loss": -11.566737174987793, "global_step": 335512, "epoch": 1997} {"train_loss": -11.053117752075195, "global_step": 335513, "epoch": 1997} {"train_loss": -11.758295059204102, "global_step": 335514, "epoch": 1997} {"train_loss": -11.20242691040039, "global_step": 335515, "epoch": 1997} {"train_loss": -11.485529899597168, "global_step": 335516, "epoch": 1997} {"train_loss": -11.61217212677002, "global_step": 335517, "epoch": 1997} {"train_loss": -11.668146133422852, "global_step": 335518, "epoch": 1997} {"train_loss": -11.567516326904297, "global_step": 335519, "epoch": 1997} {"train_loss": -11.782648086547852, "global_step": 335520, "epoch": 1997} {"train_loss": -11.565300941467285, "global_step": 335521, "epoch": 1997} {"train_loss": -11.653106689453125, "global_step": 335522, "epoch": 1997} {"train_loss": -11.571252822875977, "global_step": 335523, "epoch": 1997} {"train_loss": -11.507017135620117, "global_step": 335524, "epoch": 1997} {"train_loss": -11.925329208374023, "global_step": 335525, "epoch": 1997} {"train_loss": -11.630805969238281, "global_step": 335526, "epoch": 1997} {"train_loss": -11.584052085876465, "global_step": 335527, "epoch": 1997} {"train_loss": -11.653844833374023, "global_step": 335528, "epoch": 1997} {"train_loss": -12.153448104858398, "global_step": 335529, "epoch": 1997} {"train_loss": -11.71246337890625, "global_step": 335530, "epoch": 1997} {"train_loss": -11.259583473205566, "global_step": 335531, "epoch": 1997} {"train_loss": -11.858860969543457, "global_step": 335532, "epoch": 1997} {"train_loss": -11.407647132873535, "global_step": 335533, "epoch": 1997} {"train_loss": -11.597745895385742, "global_step": 335534, "epoch": 1997} {"train_loss": -12.065561294555664, "global_step": 335535, "epoch": 1997} {"train_loss": -11.735390663146973, "global_step": 335536, "epoch": 1997} {"train_loss": -11.651008605957031, "global_step": 335537, "epoch": 1997} {"train_loss": -11.824670791625977, "global_step": 335538, "epoch": 1997} {"train_loss": -11.825511932373047, "global_step": 335539, "epoch": 1997} {"train_loss": -11.805633544921875, "global_step": 335540, "epoch": 1997} {"train_loss": -12.189709663391113, "global_step": 335541, "epoch": 1997} {"train_loss": -11.804671287536621, "global_step": 335542, "epoch": 1997} {"train_loss": -12.15241813659668, "global_step": 335543, "epoch": 1997} {"train_loss": -11.546968460083008, "global_step": 335544, "epoch": 1997} {"train_loss": -12.181037902832031, "global_step": 335545, "epoch": 1997} {"train_loss": -11.522919654846191, "global_step": 335546, "epoch": 1997} {"train_loss": -12.213871002197266, "global_step": 335547, "epoch": 1997} {"train_loss": -11.766310691833496, "global_step": 335548, "epoch": 1997} {"train_loss": -11.88418960571289, "global_step": 335549, "epoch": 1997} {"train_loss": -12.060362815856934, "global_step": 335550, "epoch": 1997} {"train_loss": -12.13858699798584, "global_step": 335551, "epoch": 1997} {"train_loss": -12.02424430847168, "global_step": 335552, "epoch": 1997} {"train_loss": -12.008415222167969, "global_step": 335553, "epoch": 1997} {"train_loss": -11.916123390197754, "global_step": 335554, "epoch": 1997} {"train_loss": -11.848255157470703, "global_step": 335555, "epoch": 1997} {"train_loss": -12.212520599365234, "global_step": 335556, "epoch": 1997} {"train_loss": -12.118488311767578, "global_step": 335557, "epoch": 1997} {"train_loss": -11.95563793182373, "global_step": 335558, "epoch": 1997} {"train_loss": -12.232515335083008, "global_step": 335559, "epoch": 1997} {"train_loss": -12.091056823730469, "global_step": 335560, "epoch": 1997} {"train_loss": -12.184846878051758, "global_step": 335561, "epoch": 1997} {"train_loss": -12.509883880615234, "global_step": 335562, "epoch": 1997} {"train_loss": -11.951677322387695, "global_step": 335563, "epoch": 1997} {"train_loss": -12.461982727050781, "global_step": 335564, "epoch": 1997} {"train_loss": -12.159561157226562, "global_step": 335565, "epoch": 1997} {"train_loss": -12.2000732421875, "global_step": 335566, "epoch": 1997} {"train_loss": -12.32154655456543, "global_step": 335567, "epoch": 1997} {"train_loss": -12.451236724853516, "global_step": 335568, "epoch": 1997} {"train_loss": -12.211348533630371, "global_step": 335569, "epoch": 1997} {"train_loss": -12.464482307434082, "global_step": 335570, "epoch": 1997} {"train_loss": -12.276344299316406, "global_step": 335571, "epoch": 1997} {"train_loss": -12.368770599365234, "global_step": 335572, "epoch": 1997} {"train_loss": -12.442554473876953, "global_step": 335573, "epoch": 1997} {"train_loss": -12.456439971923828, "global_step": 335574, "epoch": 1997} {"train_loss": -12.24836540222168, "global_step": 335575, "epoch": 1997} {"train_loss": -12.453802108764648, "global_step": 335576, "epoch": 1997} {"train_loss": -12.459956169128418, "global_step": 335577, "epoch": 1997} {"train_loss": -12.419877052307129, "global_step": 335578, "epoch": 1997} {"train_loss": -12.540810585021973, "global_step": 335579, "epoch": 1997} {"train_loss": -12.418941497802734, "global_step": 335580, "epoch": 1997} {"train_loss": -12.408626556396484, "global_step": 335581, "epoch": 1997} {"train_loss": -12.411575317382812, "global_step": 335582, "epoch": 1997} {"train_loss": -12.36416244506836, "global_step": 335583, "epoch": 1997} {"train_loss": -12.440537452697754, "global_step": 335584, "epoch": 1997} {"train_loss": -12.483190536499023, "global_step": 335585, "epoch": 1997} {"train_loss": -12.336772918701172, "global_step": 335586, "epoch": 1997} {"train_loss": -12.49773120880127, "global_step": 335587, "epoch": 1997} {"train_loss": -12.507275581359863, "global_step": 335588, "epoch": 1997} {"train_loss": -12.382646560668945, "global_step": 335589, "epoch": 1997} {"train_loss": -12.357100486755371, "global_step": 335590, "epoch": 1997} {"train_loss": -12.402510643005371, "global_step": 335591, "epoch": 1997} {"train_loss": -12.492082595825195, "global_step": 335592, "epoch": 1997} {"train_loss": -12.592907905578613, "global_step": 335593, "epoch": 1997} {"train_loss": -12.625896453857422, "global_step": 335594, "epoch": 1997} {"train_loss": -12.601045608520508, "global_step": 335595, "epoch": 1997} {"train_loss": -12.628726959228516, "global_step": 335596, "epoch": 1997} {"train_loss": -12.590527534484863, "global_step": 335597, "epoch": 1997} {"train_loss": -12.392746925354004, "global_step": 335598, "epoch": 1997} {"train_loss": -12.476662635803223, "global_step": 335599, "epoch": 1997} {"train_loss": -12.702676773071289, "global_step": 335600, "epoch": 1997} {"train_loss": -12.65211296081543, "global_step": 335601, "epoch": 1997} {"train_loss": -12.352970123291016, "global_step": 335602, "epoch": 1997} {"train_loss": -12.361337661743164, "global_step": 335603, "epoch": 1997} {"train_loss": -12.353973388671875, "global_step": 335604, "epoch": 1997} {"train_loss": -12.20452880859375, "global_step": 335605, "epoch": 1997} {"train_loss": -12.380290985107422, "global_step": 335606, "epoch": 1997} {"train_loss": -12.280036926269531, "global_step": 335607, "epoch": 1997} {"train_loss": -11.71374797821045, "global_step": 335608, "epoch": 1997} {"train_loss": -11.723493576049805, "global_step": 335609, "epoch": 1997} {"train_loss": -9.820837020874023, "global_step": 335610, "epoch": 1997} {"train_loss": -12.308427810668945, "global_step": 335611, "epoch": 1997} {"train_loss": -10.131373405456543, "global_step": 335612, "epoch": 1997} {"train_loss": -10.653963088989258, "global_step": 335613, "epoch": 1997} {"train_loss": -10.991731643676758, "global_step": 335614, "epoch": 1997} {"train_loss": -8.918737411499023, "global_step": 335615, "epoch": 1997} {"train_loss": -10.464567184448242, "global_step": 335616, "epoch": 1997} {"train_loss": -7.668794631958008, "global_step": 335617, "epoch": 1997} {"train_loss": -10.171810150146484, "global_step": 335618, "epoch": 1997} {"train_loss": -9.45051383972168, "global_step": 335619, "epoch": 1997} {"train_loss": -9.30041790008545, "global_step": 335620, "epoch": 1997} {"train_loss": -9.354405403137207, "global_step": 335621, "epoch": 1997} {"train_loss": -8.81618881225586, "global_step": 335622, "epoch": 1997} {"train_loss": -8.587384223937988, "global_step": 335623, "epoch": 1997} {"train_loss": -11.172977447509766, "global_step": 335624, "epoch": 1997} {"train_loss": -9.389552116394043, "global_step": 335625, "epoch": 1997} {"train_loss": -9.501991271972656, "global_step": 335626, "epoch": 1997} {"train_loss": -11.389902114868164, "global_step": 335627, "epoch": 1997} {"train_loss": -9.94970989227295, "global_step": 335628, "epoch": 1997} {"train_loss": -10.36329174041748, "global_step": 335629, "epoch": 1997} {"train_loss": -10.487656593322754, "global_step": 335630, "epoch": 1997} {"train_loss": -10.530061721801758, "global_step": 335631, "epoch": 1997} {"train_loss": -11.733535766601562, "global_step": 335632, "epoch": 1997} {"train_loss": -10.005351066589355, "global_step": 335633, "epoch": 1997} {"train_loss": -11.834166526794434, "global_step": 335634, "epoch": 1997} {"train_loss": -10.576505661010742, "global_step": 335635, "epoch": 1997} {"train_loss": -11.11939811706543, "global_step": 335636, "epoch": 1997} {"train_loss": -11.248865127563477, "global_step": 335637, "epoch": 1997} {"train_loss": -11.056854248046875, "global_step": 335638, "epoch": 1997} {"train_loss": -10.684467315673828, "global_step": 335639, "epoch": 1997} {"train_loss": -10.76617431640625, "global_step": 335640, "epoch": 1997} {"train_loss": -10.648210525512695, "global_step": 335641, "epoch": 1997} {"train_loss": -10.879928588867188, "global_step": 335642, "epoch": 1997} {"train_loss": -11.736801147460938, "global_step": 335643, "epoch": 1997} {"train_loss": -10.412938117980957, "global_step": 335644, "epoch": 1997} {"train_loss": -11.671314239501953, "global_step": 335645, "epoch": 1997} {"train_loss": -10.64231014251709, "global_step": 335646, "epoch": 1997} {"train_loss": -11.980179786682129, "global_step": 335647, "epoch": 1997} {"train_loss": -11.211015701293945, "global_step": 335648, "epoch": 1997} {"train_loss": -11.632919311523438, "global_step": 335649, "epoch": 1997} {"train_loss": -11.889814376831055, "global_step": 335650, "epoch": 1997} {"train_loss": -11.673091888427734, "global_step": 335651, "epoch": 1997} {"train_loss": -11.911699295043945, "global_step": 335652, "epoch": 1997} {"train_loss": -11.426328659057617, "global_step": 335653, "epoch": 1997} {"train_loss": -12.02334213256836, "global_step": 335654, "epoch": 1997} {"train_loss": -11.728403091430664, "global_step": 335655, "epoch": 1997} {"train_loss": -11.948209762573242, "global_step": 335656, "epoch": 1997} {"train_loss": -11.88405990600586, "global_step": 335657, "epoch": 1997} {"train_loss": -11.62456226348877, "global_step": 335658, "epoch": 1997} {"train_loss": -11.809200286865234, "global_step": 335659, "epoch": 1997} {"train_loss": -12.02694320678711, "global_step": 335660, "epoch": 1997} {"train_loss": -12.008989334106445, "global_step": 335661, "epoch": 1997} {"train_loss": -11.98917007446289, "global_step": 335662, "epoch": 1997} {"train_loss": -11.53990496340252, "global_step": 335663, "epoch": 1997, "val_loss": 287058.09375} {"train_loss": -12.249238014221191, "global_step": 335664, "epoch": 1998} {"train_loss": -12.172996520996094, "global_step": 335665, "epoch": 1998} {"train_loss": -12.167415618896484, "global_step": 335666, "epoch": 1998} {"train_loss": -12.377913475036621, "global_step": 335667, "epoch": 1998} {"train_loss": -12.228364944458008, "global_step": 335668, "epoch": 1998} {"train_loss": -12.323507308959961, "global_step": 335669, "epoch": 1998} {"train_loss": -12.246847152709961, "global_step": 335670, "epoch": 1998} {"train_loss": -12.131650924682617, "global_step": 335671, "epoch": 1998} {"train_loss": -12.097662925720215, "global_step": 335672, "epoch": 1998} {"train_loss": -12.368770599365234, "global_step": 335673, "epoch": 1998} {"train_loss": -12.143686294555664, "global_step": 335674, "epoch": 1998} {"train_loss": -12.364006996154785, "global_step": 335675, "epoch": 1998} {"train_loss": -12.287961959838867, "global_step": 335676, "epoch": 1998} {"train_loss": -12.178570747375488, "global_step": 335677, "epoch": 1998} {"train_loss": -12.346273422241211, "global_step": 335678, "epoch": 1998} {"train_loss": -12.331604957580566, "global_step": 335679, "epoch": 1998} {"train_loss": -12.395153999328613, "global_step": 335680, "epoch": 1998} {"train_loss": -12.53421401977539, "global_step": 335681, "epoch": 1998} {"train_loss": -12.270641326904297, "global_step": 335682, "epoch": 1998} {"train_loss": -12.279462814331055, "global_step": 335683, "epoch": 1998} {"train_loss": -12.380997657775879, "global_step": 335684, "epoch": 1998} {"train_loss": -12.221002578735352, "global_step": 335685, "epoch": 1998} {"train_loss": -12.165887832641602, "global_step": 335686, "epoch": 1998} {"train_loss": -12.212362289428711, "global_step": 335687, "epoch": 1998} {"train_loss": -12.335904121398926, "global_step": 335688, "epoch": 1998} {"train_loss": -12.397578239440918, "global_step": 335689, "epoch": 1998} {"train_loss": -12.145320892333984, "global_step": 335690, "epoch": 1998} {"train_loss": -12.349586486816406, "global_step": 335691, "epoch": 1998} {"train_loss": -12.429977416992188, "global_step": 335692, "epoch": 1998} {"train_loss": -12.425149917602539, "global_step": 335693, "epoch": 1998} {"train_loss": -12.149686813354492, "global_step": 335694, "epoch": 1998} {"train_loss": -12.226000785827637, "global_step": 335695, "epoch": 1998} {"train_loss": -12.281843185424805, "global_step": 335696, "epoch": 1998} {"train_loss": -12.317808151245117, "global_step": 335697, "epoch": 1998} {"train_loss": -12.193958282470703, "global_step": 335698, "epoch": 1998} {"train_loss": -12.509170532226562, "global_step": 335699, "epoch": 1998} {"train_loss": -12.206480979919434, "global_step": 335700, "epoch": 1998} {"train_loss": -12.532452583312988, "global_step": 335701, "epoch": 1998} {"train_loss": -12.314229011535645, "global_step": 335702, "epoch": 1998} {"train_loss": -12.449682235717773, "global_step": 335703, "epoch": 1998} {"train_loss": -12.266401290893555, "global_step": 335704, "epoch": 1998} {"train_loss": -12.404504776000977, "global_step": 335705, "epoch": 1998} {"train_loss": -12.651607513427734, "global_step": 335706, "epoch": 1998} {"train_loss": -12.407158851623535, "global_step": 335707, "epoch": 1998} {"train_loss": -12.390015602111816, "global_step": 335708, "epoch": 1998} {"train_loss": -12.219538688659668, "global_step": 335709, "epoch": 1998} {"train_loss": -12.48838996887207, "global_step": 335710, "epoch": 1998} {"train_loss": -12.11854362487793, "global_step": 335711, "epoch": 1998} {"train_loss": -12.365154266357422, "global_step": 335712, "epoch": 1998} {"train_loss": -12.56673526763916, "global_step": 335713, "epoch": 1998} {"train_loss": -12.467670440673828, "global_step": 335714, "epoch": 1998} {"train_loss": -12.572532653808594, "global_step": 335715, "epoch": 1998} {"train_loss": -12.205422401428223, "global_step": 335716, "epoch": 1998} {"train_loss": -11.390665054321289, "global_step": 335717, "epoch": 1998} {"train_loss": -12.063960075378418, "global_step": 335718, "epoch": 1998} {"train_loss": -12.450628280639648, "global_step": 335719, "epoch": 1998} {"train_loss": -12.03314208984375, "global_step": 335720, "epoch": 1998} {"train_loss": -12.350931167602539, "global_step": 335721, "epoch": 1998} {"train_loss": -12.183382987976074, "global_step": 335722, "epoch": 1998} {"train_loss": -12.305998802185059, "global_step": 335723, "epoch": 1998} {"train_loss": -12.375295639038086, "global_step": 335724, "epoch": 1998} {"train_loss": -12.245060920715332, "global_step": 335725, "epoch": 1998} {"train_loss": -12.25314712524414, "global_step": 335726, "epoch": 1998} {"train_loss": -11.91673469543457, "global_step": 335727, "epoch": 1998} {"train_loss": -12.253798484802246, "global_step": 335728, "epoch": 1998} {"train_loss": -12.12086296081543, "global_step": 335729, "epoch": 1998} {"train_loss": -12.509282112121582, "global_step": 335730, "epoch": 1998} {"train_loss": -12.518373489379883, "global_step": 335731, "epoch": 1998} {"train_loss": -12.2020263671875, "global_step": 335732, "epoch": 1998} {"train_loss": -12.015911102294922, "global_step": 335733, "epoch": 1998} {"train_loss": -12.014594078063965, "global_step": 335734, "epoch": 1998} {"train_loss": -12.3764066696167, "global_step": 335735, "epoch": 1998} {"train_loss": -11.991127967834473, "global_step": 335736, "epoch": 1998} {"train_loss": -12.126256942749023, "global_step": 335737, "epoch": 1998} {"train_loss": -12.099422454833984, "global_step": 335738, "epoch": 1998} {"train_loss": -12.483770370483398, "global_step": 335739, "epoch": 1998} {"train_loss": -11.594025611877441, "global_step": 335740, "epoch": 1998} {"train_loss": -12.298730850219727, "global_step": 335741, "epoch": 1998} {"train_loss": -12.193788528442383, "global_step": 335742, "epoch": 1998} {"train_loss": -11.922667503356934, "global_step": 335743, "epoch": 1998} {"train_loss": -12.123453140258789, "global_step": 335744, "epoch": 1998} {"train_loss": -12.23753547668457, "global_step": 335745, "epoch": 1998} {"train_loss": -11.641792297363281, "global_step": 335746, "epoch": 1998} {"train_loss": -11.528488159179688, "global_step": 335747, "epoch": 1998} {"train_loss": -11.223344802856445, "global_step": 335748, "epoch": 1998} {"train_loss": -11.771422386169434, "global_step": 335749, "epoch": 1998} {"train_loss": -11.117124557495117, "global_step": 335750, "epoch": 1998} {"train_loss": -11.212666511535645, "global_step": 335751, "epoch": 1998} {"train_loss": -8.302401542663574, "global_step": 335752, "epoch": 1998} {"train_loss": -8.752178192138672, "global_step": 335753, "epoch": 1998} {"train_loss": -10.117525100708008, "global_step": 335754, "epoch": 1998} {"train_loss": -9.985742568969727, "global_step": 335755, "epoch": 1998} {"train_loss": -9.351507186889648, "global_step": 335756, "epoch": 1998} {"train_loss": -9.224479675292969, "global_step": 335757, "epoch": 1998} {"train_loss": -9.971187591552734, "global_step": 335758, "epoch": 1998} {"train_loss": -8.491412162780762, "global_step": 335759, "epoch": 1998} {"train_loss": -9.707572937011719, "global_step": 335760, "epoch": 1998} {"train_loss": -8.875814437866211, "global_step": 335761, "epoch": 1998} {"train_loss": -10.67959976196289, "global_step": 335762, "epoch": 1998} {"train_loss": -8.672388076782227, "global_step": 335763, "epoch": 1998} {"train_loss": -11.175193786621094, "global_step": 335764, "epoch": 1998} {"train_loss": -8.597516059875488, "global_step": 335765, "epoch": 1998} {"train_loss": -8.990133285522461, "global_step": 335766, "epoch": 1998} {"train_loss": -9.408308982849121, "global_step": 335767, "epoch": 1998} {"train_loss": -10.941518783569336, "global_step": 335768, "epoch": 1998} {"train_loss": -9.864139556884766, "global_step": 335769, "epoch": 1998} {"train_loss": -9.623235702514648, "global_step": 335770, "epoch": 1998} {"train_loss": -10.542652130126953, "global_step": 335771, "epoch": 1998} {"train_loss": -10.782112121582031, "global_step": 335772, "epoch": 1998} {"train_loss": -10.790040969848633, "global_step": 335773, "epoch": 1998} {"train_loss": -11.449230194091797, "global_step": 335774, "epoch": 1998} {"train_loss": -10.645990371704102, "global_step": 335775, "epoch": 1998} {"train_loss": -9.65029239654541, "global_step": 335776, "epoch": 1998} {"train_loss": -11.176043510437012, "global_step": 335777, "epoch": 1998} {"train_loss": -10.644559860229492, "global_step": 335778, "epoch": 1998} {"train_loss": -10.671119689941406, "global_step": 335779, "epoch": 1998} {"train_loss": -11.808732032775879, "global_step": 335780, "epoch": 1998} {"train_loss": -10.337759017944336, "global_step": 335781, "epoch": 1998} {"train_loss": -11.161951065063477, "global_step": 335782, "epoch": 1998} {"train_loss": -11.471061706542969, "global_step": 335783, "epoch": 1998} {"train_loss": -10.939889907836914, "global_step": 335784, "epoch": 1998} {"train_loss": -11.583900451660156, "global_step": 335785, "epoch": 1998} {"train_loss": -10.772727012634277, "global_step": 335786, "epoch": 1998} {"train_loss": -11.518035888671875, "global_step": 335787, "epoch": 1998} {"train_loss": -11.492183685302734, "global_step": 335788, "epoch": 1998} {"train_loss": -11.347519874572754, "global_step": 335789, "epoch": 1998} {"train_loss": -11.772232055664062, "global_step": 335790, "epoch": 1998} {"train_loss": -11.426733016967773, "global_step": 335791, "epoch": 1998} {"train_loss": -11.704479217529297, "global_step": 335792, "epoch": 1998} {"train_loss": -11.4923095703125, "global_step": 335793, "epoch": 1998} {"train_loss": -11.582586288452148, "global_step": 335794, "epoch": 1998} {"train_loss": -11.779179573059082, "global_step": 335795, "epoch": 1998} {"train_loss": -11.712289810180664, "global_step": 335796, "epoch": 1998} {"train_loss": -11.883148193359375, "global_step": 335797, "epoch": 1998} {"train_loss": -11.608733177185059, "global_step": 335798, "epoch": 1998} {"train_loss": -11.780305862426758, "global_step": 335799, "epoch": 1998} {"train_loss": -11.835859298706055, "global_step": 335800, "epoch": 1998} {"train_loss": -11.828084945678711, "global_step": 335801, "epoch": 1998} {"train_loss": -11.405017852783203, "global_step": 335802, "epoch": 1998} {"train_loss": -12.033171653747559, "global_step": 335803, "epoch": 1998} {"train_loss": -11.777984619140625, "global_step": 335804, "epoch": 1998} {"train_loss": -11.757237434387207, "global_step": 335805, "epoch": 1998} {"train_loss": -11.776762008666992, "global_step": 335806, "epoch": 1998} {"train_loss": -11.899564743041992, "global_step": 335807, "epoch": 1998} {"train_loss": -11.763885498046875, "global_step": 335808, "epoch": 1998} {"train_loss": -11.973999977111816, "global_step": 335809, "epoch": 1998} {"train_loss": -12.041500091552734, "global_step": 335810, "epoch": 1998} {"train_loss": -11.96647834777832, "global_step": 335811, "epoch": 1998} {"train_loss": -12.023050308227539, "global_step": 335812, "epoch": 1998} {"train_loss": -12.101798057556152, "global_step": 335813, "epoch": 1998} {"train_loss": -11.96828556060791, "global_step": 335814, "epoch": 1998} {"train_loss": -11.992158889770508, "global_step": 335815, "epoch": 1998} {"train_loss": -12.101451873779297, "global_step": 335816, "epoch": 1998} {"train_loss": -12.146164894104004, "global_step": 335817, "epoch": 1998} {"train_loss": -12.149946212768555, "global_step": 335818, "epoch": 1998} {"train_loss": -12.087942123413086, "global_step": 335819, "epoch": 1998} {"train_loss": -12.146465301513672, "global_step": 335820, "epoch": 1998} {"train_loss": -12.141644477844238, "global_step": 335821, "epoch": 1998} {"train_loss": -12.035518646240234, "global_step": 335822, "epoch": 1998} {"train_loss": -12.190994262695312, "global_step": 335823, "epoch": 1998} {"train_loss": -12.161796569824219, "global_step": 335824, "epoch": 1998} {"train_loss": -12.431270599365234, "global_step": 335825, "epoch": 1998} {"train_loss": -11.939014434814453, "global_step": 335826, "epoch": 1998} {"train_loss": -12.109700202941895, "global_step": 335827, "epoch": 1998} {"train_loss": -12.363494873046875, "global_step": 335828, "epoch": 1998} {"train_loss": -12.221033096313477, "global_step": 335829, "epoch": 1998} {"train_loss": -12.366323471069336, "global_step": 335830, "epoch": 1998} {"train_loss": -11.696598444666181, "global_step": 335831, "epoch": 1998, "val_loss": 280842.3125} {"train_loss": -12.202079772949219, "global_step": 335832, "epoch": 1999} {"train_loss": -12.319540977478027, "global_step": 335833, "epoch": 1999} {"train_loss": -12.212736129760742, "global_step": 335834, "epoch": 1999} {"train_loss": -11.904084205627441, "global_step": 335835, "epoch": 1999} {"train_loss": -12.337299346923828, "global_step": 335836, "epoch": 1999} {"train_loss": -11.946163177490234, "global_step": 335837, "epoch": 1999} {"train_loss": -11.954374313354492, "global_step": 335838, "epoch": 1999} {"train_loss": -12.277381896972656, "global_step": 335839, "epoch": 1999} {"train_loss": -12.179973602294922, "global_step": 335840, "epoch": 1999} {"train_loss": -12.094375610351562, "global_step": 335841, "epoch": 1999} {"train_loss": -12.326057434082031, "global_step": 335842, "epoch": 1999} {"train_loss": -11.949335098266602, "global_step": 335843, "epoch": 1999} {"train_loss": -12.066471099853516, "global_step": 335844, "epoch": 1999} {"train_loss": -12.215446472167969, "global_step": 335845, "epoch": 1999} {"train_loss": -11.901408195495605, "global_step": 335846, "epoch": 1999} {"train_loss": -12.100791931152344, "global_step": 335847, "epoch": 1999} {"train_loss": -10.667219161987305, "global_step": 335848, "epoch": 1999} {"train_loss": -12.387657165527344, "global_step": 335849, "epoch": 1999} {"train_loss": -11.388721466064453, "global_step": 335850, "epoch": 1999} {"train_loss": -12.138355255126953, "global_step": 335851, "epoch": 1999} {"train_loss": -11.542835235595703, "global_step": 335852, "epoch": 1999} {"train_loss": -11.76567268371582, "global_step": 335853, "epoch": 1999} {"train_loss": -11.755705833435059, "global_step": 335854, "epoch": 1999} {"train_loss": -11.980732917785645, "global_step": 335855, "epoch": 1999} {"train_loss": -11.899540901184082, "global_step": 335856, "epoch": 1999} {"train_loss": -11.99979019165039, "global_step": 335857, "epoch": 1999} {"train_loss": -12.19504451751709, "global_step": 335858, "epoch": 1999} {"train_loss": -11.783848762512207, "global_step": 335859, "epoch": 1999} {"train_loss": -12.167577743530273, "global_step": 335860, "epoch": 1999} {"train_loss": -12.165555000305176, "global_step": 335861, "epoch": 1999} {"train_loss": -12.136816024780273, "global_step": 335862, "epoch": 1999} {"train_loss": -12.3052978515625, "global_step": 335863, "epoch": 1999} {"train_loss": -12.0361909866333, "global_step": 335864, "epoch": 1999} {"train_loss": -12.157027244567871, "global_step": 335865, "epoch": 1999} {"train_loss": -12.544803619384766, "global_step": 335866, "epoch": 1999} {"train_loss": -12.169670104980469, "global_step": 335867, "epoch": 1999} {"train_loss": -12.411895751953125, "global_step": 335868, "epoch": 1999} {"train_loss": -12.498351097106934, "global_step": 335869, "epoch": 1999} {"train_loss": -12.200389862060547, "global_step": 335870, "epoch": 1999} {"train_loss": -12.322012901306152, "global_step": 335871, "epoch": 1999} {"train_loss": -12.389971733093262, "global_step": 335872, "epoch": 1999} {"train_loss": -11.943960189819336, "global_step": 335873, "epoch": 1999} {"train_loss": -12.281137466430664, "global_step": 335874, "epoch": 1999} {"train_loss": -12.223159790039062, "global_step": 335875, "epoch": 1999} {"train_loss": -12.180227279663086, "global_step": 335876, "epoch": 1999} {"train_loss": -11.933150291442871, "global_step": 335877, "epoch": 1999} {"train_loss": -12.541908264160156, "global_step": 335878, "epoch": 1999} {"train_loss": -12.417440414428711, "global_step": 335879, "epoch": 1999} {"train_loss": -12.288768768310547, "global_step": 335880, "epoch": 1999} {"train_loss": -12.357049942016602, "global_step": 335881, "epoch": 1999} {"train_loss": -12.153363227844238, "global_step": 335882, "epoch": 1999} {"train_loss": -12.529257774353027, "global_step": 335883, "epoch": 1999} {"train_loss": -12.241717338562012, "global_step": 335884, "epoch": 1999} {"train_loss": -12.239241600036621, "global_step": 335885, "epoch": 1999} {"train_loss": -12.39097785949707, "global_step": 335886, "epoch": 1999} {"train_loss": -12.522390365600586, "global_step": 335887, "epoch": 1999} {"train_loss": -12.33804702758789, "global_step": 335888, "epoch": 1999} {"train_loss": -12.387517929077148, "global_step": 335889, "epoch": 1999} {"train_loss": -12.386026382446289, "global_step": 335890, "epoch": 1999} {"train_loss": -12.448850631713867, "global_step": 335891, "epoch": 1999} {"train_loss": -12.341020584106445, "global_step": 335892, "epoch": 1999} {"train_loss": -12.613334655761719, "global_step": 335893, "epoch": 1999} {"train_loss": -12.409173965454102, "global_step": 335894, "epoch": 1999} {"train_loss": -12.454051971435547, "global_step": 335895, "epoch": 1999} {"train_loss": -12.417180061340332, "global_step": 335896, "epoch": 1999} {"train_loss": -12.487710952758789, "global_step": 335897, "epoch": 1999} {"train_loss": -12.553243637084961, "global_step": 335898, "epoch": 1999} {"train_loss": -12.73709487915039, "global_step": 335899, "epoch": 1999} {"train_loss": -12.596471786499023, "global_step": 335900, "epoch": 1999} {"train_loss": -12.484066009521484, "global_step": 335901, "epoch": 1999} {"train_loss": -12.620823860168457, "global_step": 335902, "epoch": 1999} {"train_loss": -12.51794719696045, "global_step": 335903, "epoch": 1999} {"train_loss": -12.305697441101074, "global_step": 335904, "epoch": 1999} {"train_loss": -12.692007064819336, "global_step": 335905, "epoch": 1999} {"train_loss": -12.49931812286377, "global_step": 335906, "epoch": 1999} {"train_loss": -12.64920711517334, "global_step": 335907, "epoch": 1999} {"train_loss": -12.516704559326172, "global_step": 335908, "epoch": 1999} {"train_loss": -12.53314208984375, "global_step": 335909, "epoch": 1999} {"train_loss": -12.368978500366211, "global_step": 335910, "epoch": 1999} {"train_loss": -12.759751319885254, "global_step": 335911, "epoch": 1999} {"train_loss": -12.528605461120605, "global_step": 335912, "epoch": 1999} {"train_loss": -11.990278244018555, "global_step": 335913, "epoch": 1999} {"train_loss": -12.040379524230957, "global_step": 335914, "epoch": 1999} {"train_loss": -12.251954078674316, "global_step": 335915, "epoch": 1999} {"train_loss": -12.740533828735352, "global_step": 335916, "epoch": 1999} {"train_loss": -12.001977920532227, "global_step": 335917, "epoch": 1999} {"train_loss": -11.527374267578125, "global_step": 335918, "epoch": 1999} {"train_loss": -10.51566219329834, "global_step": 335919, "epoch": 1999} {"train_loss": -11.687498092651367, "global_step": 335920, "epoch": 1999} {"train_loss": -10.734752655029297, "global_step": 335921, "epoch": 1999} {"train_loss": -11.120109558105469, "global_step": 335922, "epoch": 1999} {"train_loss": -10.195867538452148, "global_step": 335923, "epoch": 1999} {"train_loss": -11.780426025390625, "global_step": 335924, "epoch": 1999} {"train_loss": -8.375144958496094, "global_step": 335925, "epoch": 1999} {"train_loss": -9.470142364501953, "global_step": 335926, "epoch": 1999} {"train_loss": -8.778173446655273, "global_step": 335927, "epoch": 1999} {"train_loss": -9.115856170654297, "global_step": 335928, "epoch": 1999} {"train_loss": -8.032896995544434, "global_step": 335929, "epoch": 1999} {"train_loss": -7.751081943511963, "global_step": 335930, "epoch": 1999} {"train_loss": -6.510044574737549, "global_step": 335931, "epoch": 1999} {"train_loss": -8.239795684814453, "global_step": 335932, "epoch": 1999} {"train_loss": -7.516845703125, "global_step": 335933, "epoch": 1999} {"train_loss": -7.844632625579834, "global_step": 335934, "epoch": 1999} {"train_loss": -6.964820861816406, "global_step": 335935, "epoch": 1999} {"train_loss": -7.709589958190918, "global_step": 335936, "epoch": 1999} {"train_loss": -7.845633506774902, "global_step": 335937, "epoch": 1999} {"train_loss": -8.28073501586914, "global_step": 335938, "epoch": 1999} {"train_loss": -8.953224182128906, "global_step": 335939, "epoch": 1999} {"train_loss": -8.754127502441406, "global_step": 335940, "epoch": 1999} {"train_loss": -8.830816268920898, "global_step": 335941, "epoch": 1999} {"train_loss": -8.69509506225586, "global_step": 335942, "epoch": 1999} {"train_loss": -8.855545997619629, "global_step": 335943, "epoch": 1999} {"train_loss": -8.67990493774414, "global_step": 335944, "epoch": 1999} {"train_loss": -9.049676895141602, "global_step": 335945, "epoch": 1999} {"train_loss": -10.488247871398926, "global_step": 335946, "epoch": 1999} {"train_loss": -9.857569694519043, "global_step": 335947, "epoch": 1999} {"train_loss": -9.67363452911377, "global_step": 335948, "epoch": 1999} {"train_loss": -9.515721321105957, "global_step": 335949, "epoch": 1999} {"train_loss": -10.252995491027832, "global_step": 335950, "epoch": 1999} {"train_loss": -9.490713119506836, "global_step": 335951, "epoch": 1999} {"train_loss": -9.775239944458008, "global_step": 335952, "epoch": 1999} {"train_loss": -10.413490295410156, "global_step": 335953, "epoch": 1999} {"train_loss": -9.921628952026367, "global_step": 335954, "epoch": 1999} {"train_loss": -11.020082473754883, "global_step": 335955, "epoch": 1999} {"train_loss": -10.375517845153809, "global_step": 335956, "epoch": 1999} {"train_loss": -11.171802520751953, "global_step": 335957, "epoch": 1999} {"train_loss": -10.752305030822754, "global_step": 335958, "epoch": 1999} {"train_loss": -11.121259689331055, "global_step": 335959, "epoch": 1999} {"train_loss": -10.993406295776367, "global_step": 335960, "epoch": 1999} {"train_loss": -11.200855255126953, "global_step": 335961, "epoch": 1999} {"train_loss": -11.386517524719238, "global_step": 335962, "epoch": 1999} {"train_loss": -11.46497917175293, "global_step": 335963, "epoch": 1999} {"train_loss": -11.633790969848633, "global_step": 335964, "epoch": 1999} {"train_loss": -11.282356262207031, "global_step": 335965, "epoch": 1999} {"train_loss": -10.90061092376709, "global_step": 335966, "epoch": 1999} {"train_loss": -11.401213645935059, "global_step": 335967, "epoch": 1999} {"train_loss": -11.023002624511719, "global_step": 335968, "epoch": 1999} {"train_loss": -11.500551223754883, "global_step": 335969, "epoch": 1999} {"train_loss": -11.105180740356445, "global_step": 335970, "epoch": 1999} {"train_loss": -11.976266860961914, "global_step": 335971, "epoch": 1999} {"train_loss": -11.330978393554688, "global_step": 335972, "epoch": 1999} {"train_loss": -11.795327186584473, "global_step": 335973, "epoch": 1999} {"train_loss": -11.150350570678711, "global_step": 335974, "epoch": 1999} {"train_loss": -11.751893997192383, "global_step": 335975, "epoch": 1999} {"train_loss": -11.25058364868164, "global_step": 335976, "epoch": 1999} {"train_loss": -11.666006088256836, "global_step": 335977, "epoch": 1999} {"train_loss": -11.648850440979004, "global_step": 335978, "epoch": 1999} {"train_loss": -11.256295204162598, "global_step": 335979, "epoch": 1999} {"train_loss": -11.442811965942383, "global_step": 335980, "epoch": 1999} {"train_loss": -11.600522994995117, "global_step": 335981, "epoch": 1999} {"train_loss": -11.546675682067871, "global_step": 335982, "epoch": 1999} {"train_loss": -11.83401107788086, "global_step": 335983, "epoch": 1999} {"train_loss": -11.543630599975586, "global_step": 335984, "epoch": 1999} {"train_loss": -11.551891326904297, "global_step": 335985, "epoch": 1999} {"train_loss": -11.277702331542969, "global_step": 335986, "epoch": 1999} {"train_loss": -12.013941764831543, "global_step": 335987, "epoch": 1999} {"train_loss": -11.564652442932129, "global_step": 335988, "epoch": 1999} {"train_loss": -11.873167037963867, "global_step": 335989, "epoch": 1999} {"train_loss": -11.465792655944824, "global_step": 335990, "epoch": 1999} {"train_loss": -11.887311935424805, "global_step": 335991, "epoch": 1999} {"train_loss": -11.608491897583008, "global_step": 335992, "epoch": 1999} {"train_loss": -12.055160522460938, "global_step": 335993, "epoch": 1999} {"train_loss": -11.715524673461914, "global_step": 335994, "epoch": 1999} {"train_loss": -11.657430648803711, "global_step": 335995, "epoch": 1999} {"train_loss": -11.800353050231934, "global_step": 335996, "epoch": 1999} {"train_loss": -12.08094596862793, "global_step": 335997, "epoch": 1999} {"train_loss": -11.828533172607422, "global_step": 335998, "epoch": 1999} {"train_loss": -11.373279988765717, "global_step": 335999, "epoch": 1999, "val_loss": 285467.96875} {"train_loss": -11.966628074645996, "global_step": 336000, "epoch": 2000} {"train_loss": -12.106154441833496, "global_step": 336001, "epoch": 2000} {"train_loss": -12.181070327758789, "global_step": 336002, "epoch": 2000} {"train_loss": -11.869994163513184, "global_step": 336003, "epoch": 2000} {"train_loss": -12.165291786193848, "global_step": 336004, "epoch": 2000} {"train_loss": -12.13895034790039, "global_step": 336005, "epoch": 2000} {"train_loss": -12.24074649810791, "global_step": 336006, "epoch": 2000} {"train_loss": -12.008602142333984, "global_step": 336007, "epoch": 2000} {"train_loss": -11.814760208129883, "global_step": 336008, "epoch": 2000} {"train_loss": -12.087541580200195, "global_step": 336009, "epoch": 2000} {"train_loss": -11.841011047363281, "global_step": 336010, "epoch": 2000} {"train_loss": -12.273761749267578, "global_step": 336011, "epoch": 2000} {"train_loss": -12.121150970458984, "global_step": 336012, "epoch": 2000} {"train_loss": -12.073177337646484, "global_step": 336013, "epoch": 2000} {"train_loss": -11.989704132080078, "global_step": 336014, "epoch": 2000} {"train_loss": -11.935369491577148, "global_step": 336015, "epoch": 2000} {"train_loss": -12.153467178344727, "global_step": 336016, "epoch": 2000} {"train_loss": -12.119772911071777, "global_step": 336017, "epoch": 2000} {"train_loss": -12.096237182617188, "global_step": 336018, "epoch": 2000} {"train_loss": -12.413951873779297, "global_step": 336019, "epoch": 2000} {"train_loss": -12.151439666748047, "global_step": 336020, "epoch": 2000} {"train_loss": -11.852630615234375, "global_step": 336021, "epoch": 2000} {"train_loss": -12.354310035705566, "global_step": 336022, "epoch": 2000} {"train_loss": -12.239095687866211, "global_step": 336023, "epoch": 2000} {"train_loss": -12.079167366027832, "global_step": 336024, "epoch": 2000} {"train_loss": -12.013872146606445, "global_step": 336025, "epoch": 2000} {"train_loss": -12.211942672729492, "global_step": 336026, "epoch": 2000} {"train_loss": -12.38811206817627, "global_step": 336027, "epoch": 2000} {"train_loss": -12.275422096252441, "global_step": 336028, "epoch": 2000} {"train_loss": -11.957870483398438, "global_step": 336029, "epoch": 2000} {"train_loss": -12.32800579071045, "global_step": 336030, "epoch": 2000} {"train_loss": -12.069352149963379, "global_step": 336031, "epoch": 2000} {"train_loss": -12.322820663452148, "global_step": 336032, "epoch": 2000} {"train_loss": -12.348294258117676, "global_step": 336033, "epoch": 2000} {"train_loss": -12.520736694335938, "global_step": 336034, "epoch": 2000} {"train_loss": -12.418821334838867, "global_step": 336035, "epoch": 2000} {"train_loss": -12.244332313537598, "global_step": 336036, "epoch": 2000} {"train_loss": -12.141563415527344, "global_step": 336037, "epoch": 2000} {"train_loss": -12.346208572387695, "global_step": 336038, "epoch": 2000} {"train_loss": -12.2640380859375, "global_step": 336039, "epoch": 2000} {"train_loss": -12.403427124023438, "global_step": 336040, "epoch": 2000} {"train_loss": -12.200313568115234, "global_step": 336041, "epoch": 2000} {"train_loss": -12.204866409301758, "global_step": 336042, "epoch": 2000} {"train_loss": -12.640769004821777, "global_step": 336043, "epoch": 2000} {"train_loss": -12.45498275756836, "global_step": 336044, "epoch": 2000} {"train_loss": -12.482133865356445, "global_step": 336045, "epoch": 2000} {"train_loss": -12.416584014892578, "global_step": 336046, "epoch": 2000} {"train_loss": -12.486098289489746, "global_step": 336047, "epoch": 2000} {"train_loss": -12.256847381591797, "global_step": 336048, "epoch": 2000} {"train_loss": -12.2813081741333, "global_step": 336049, "epoch": 2000} {"train_loss": -12.275287628173828, "global_step": 336050, "epoch": 2000} {"train_loss": -12.46928596496582, "global_step": 336051, "epoch": 2000} {"train_loss": -12.234332084655762, "global_step": 336052, "epoch": 2000} {"train_loss": -12.241043090820312, "global_step": 336053, "epoch": 2000} {"train_loss": -12.689505577087402, "global_step": 336054, "epoch": 2000} {"train_loss": -12.516227722167969, "global_step": 336055, "epoch": 2000} {"train_loss": -12.442012786865234, "global_step": 336056, "epoch": 2000} {"train_loss": -12.615493774414062, "global_step": 336057, "epoch": 2000} {"train_loss": -12.320579528808594, "global_step": 336058, "epoch": 2000} {"train_loss": -12.508210182189941, "global_step": 336059, "epoch": 2000} {"train_loss": -12.145326614379883, "global_step": 336060, "epoch": 2000} {"train_loss": -12.131040573120117, "global_step": 336061, "epoch": 2000} {"train_loss": -12.224297523498535, "global_step": 336062, "epoch": 2000} {"train_loss": -12.327814102172852, "global_step": 336063, "epoch": 2000} {"train_loss": -12.28184700012207, "global_step": 336064, "epoch": 2000} {"train_loss": -12.400899887084961, "global_step": 336065, "epoch": 2000} {"train_loss": -12.431391716003418, "global_step": 336066, "epoch": 2000} {"train_loss": -12.38198471069336, "global_step": 336067, "epoch": 2000} {"train_loss": -11.886397361755371, "global_step": 336068, "epoch": 2000} {"train_loss": -12.190980911254883, "global_step": 336069, "epoch": 2000} {"train_loss": -12.430746078491211, "global_step": 336070, "epoch": 2000} {"train_loss": -12.384753227233887, "global_step": 336071, "epoch": 2000} {"train_loss": -12.070723533630371, "global_step": 336072, "epoch": 2000} {"train_loss": -12.328496932983398, "global_step": 336073, "epoch": 2000} {"train_loss": -12.561399459838867, "global_step": 336074, "epoch": 2000} {"train_loss": -12.350702285766602, "global_step": 336075, "epoch": 2000} {"train_loss": -11.874155044555664, "global_step": 336076, "epoch": 2000} {"train_loss": -12.000507354736328, "global_step": 336077, "epoch": 2000} {"train_loss": -12.496809005737305, "global_step": 336078, "epoch": 2000} {"train_loss": -12.518580436706543, "global_step": 336079, "epoch": 2000} {"train_loss": -12.602718353271484, "global_step": 336080, "epoch": 2000} {"train_loss": -11.939473152160645, "global_step": 336081, "epoch": 2000} {"train_loss": -12.42336368560791, "global_step": 336082, "epoch": 2000} {"train_loss": -12.382299423217773, "global_step": 336083, "epoch": 2000} {"train_loss": -12.462298393249512, "global_step": 336084, "epoch": 2000} {"train_loss": -11.999524116516113, "global_step": 336085, "epoch": 2000} {"train_loss": -11.858259201049805, "global_step": 336086, "epoch": 2000} {"train_loss": -11.912899017333984, "global_step": 336087, "epoch": 2000} {"train_loss": -12.369462013244629, "global_step": 336088, "epoch": 2000} {"train_loss": -11.743998527526855, "global_step": 336089, "epoch": 2000} {"train_loss": -10.6322660446167, "global_step": 336090, "epoch": 2000} {"train_loss": -10.855191230773926, "global_step": 336091, "epoch": 2000} {"train_loss": -10.910089492797852, "global_step": 336092, "epoch": 2000} {"train_loss": -8.997873306274414, "global_step": 336093, "epoch": 2000} {"train_loss": -10.024909973144531, "global_step": 336094, "epoch": 2000} {"train_loss": -9.69239330291748, "global_step": 336095, "epoch": 2000} {"train_loss": -11.514968872070312, "global_step": 336096, "epoch": 2000} {"train_loss": -10.689459800720215, "global_step": 336097, "epoch": 2000} {"train_loss": -10.322002410888672, "global_step": 336098, "epoch": 2000} {"train_loss": -9.743318557739258, "global_step": 336099, "epoch": 2000} {"train_loss": -11.224433898925781, "global_step": 336100, "epoch": 2000} {"train_loss": -10.573776245117188, "global_step": 336101, "epoch": 2000} {"train_loss": -11.236530303955078, "global_step": 336102, "epoch": 2000} {"train_loss": -11.78510856628418, "global_step": 336103, "epoch": 2000} {"train_loss": -9.817303657531738, "global_step": 336104, "epoch": 2000} {"train_loss": -11.559223175048828, "global_step": 336105, "epoch": 2000} {"train_loss": -11.246051788330078, "global_step": 336106, "epoch": 2000} {"train_loss": -9.96841812133789, "global_step": 336107, "epoch": 2000} {"train_loss": -11.666735649108887, "global_step": 336108, "epoch": 2000} {"train_loss": -10.961055755615234, "global_step": 336109, "epoch": 2000} {"train_loss": -11.187806129455566, "global_step": 336110, "epoch": 2000} {"train_loss": -11.739852905273438, "global_step": 336111, "epoch": 2000} {"train_loss": -11.502252578735352, "global_step": 336112, "epoch": 2000} {"train_loss": -11.241514205932617, "global_step": 336113, "epoch": 2000} {"train_loss": -11.510383605957031, "global_step": 336114, "epoch": 2000} {"train_loss": -10.604621887207031, "global_step": 336115, "epoch": 2000} {"train_loss": -10.847492218017578, "global_step": 336116, "epoch": 2000} {"train_loss": -10.981001853942871, "global_step": 336117, "epoch": 2000} {"train_loss": -10.250885963439941, "global_step": 336118, "epoch": 2000} {"train_loss": -11.430511474609375, "global_step": 336119, "epoch": 2000} {"train_loss": -11.108720779418945, "global_step": 336120, "epoch": 2000} {"train_loss": -10.782636642456055, "global_step": 336121, "epoch": 2000} {"train_loss": -11.691696166992188, "global_step": 336122, "epoch": 2000} {"train_loss": -9.873459815979004, "global_step": 336123, "epoch": 2000} {"train_loss": -10.518192291259766, "global_step": 336124, "epoch": 2000} {"train_loss": -10.62709903717041, "global_step": 336125, "epoch": 2000} {"train_loss": -11.105003356933594, "global_step": 336126, "epoch": 2000} {"train_loss": -11.159568786621094, "global_step": 336127, "epoch": 2000} {"train_loss": -10.247781753540039, "global_step": 336128, "epoch": 2000} {"train_loss": -10.428163528442383, "global_step": 336129, "epoch": 2000} {"train_loss": -11.048449516296387, "global_step": 336130, "epoch": 2000} {"train_loss": -10.416840553283691, "global_step": 336131, "epoch": 2000} {"train_loss": -11.654195785522461, "global_step": 336132, "epoch": 2000} {"train_loss": -10.74267864227295, "global_step": 336133, "epoch": 2000} {"train_loss": -11.39991283416748, "global_step": 336134, "epoch": 2000} {"train_loss": -11.120318412780762, "global_step": 336135, "epoch": 2000} {"train_loss": -11.429004669189453, "global_step": 336136, "epoch": 2000} {"train_loss": -11.6549711227417, "global_step": 336137, "epoch": 2000} {"train_loss": -11.305999755859375, "global_step": 336138, "epoch": 2000} {"train_loss": -11.616987228393555, "global_step": 336139, "epoch": 2000} {"train_loss": -11.284529685974121, "global_step": 336140, "epoch": 2000} {"train_loss": -11.412633895874023, "global_step": 336141, "epoch": 2000} {"train_loss": -11.536903381347656, "global_step": 336142, "epoch": 2000} {"train_loss": -12.013721466064453, "global_step": 336143, "epoch": 2000} {"train_loss": -11.807071685791016, "global_step": 336144, "epoch": 2000} {"train_loss": -11.679594993591309, "global_step": 336145, "epoch": 2000} {"train_loss": -11.66374397277832, "global_step": 336146, "epoch": 2000} {"train_loss": -11.677644729614258, "global_step": 336147, "epoch": 2000} {"train_loss": -11.794750213623047, "global_step": 336148, "epoch": 2000} {"train_loss": -11.486489295959473, "global_step": 336149, "epoch": 2000} {"train_loss": -11.81857681274414, "global_step": 336150, "epoch": 2000} {"train_loss": -11.82579517364502, "global_step": 336151, "epoch": 2000} {"train_loss": -11.72927474975586, "global_step": 336152, "epoch": 2000} {"train_loss": -12.043465614318848, "global_step": 336153, "epoch": 2000} {"train_loss": -11.653615951538086, "global_step": 336154, "epoch": 2000} {"train_loss": -11.789459228515625, "global_step": 336155, "epoch": 2000} {"train_loss": -11.63072395324707, "global_step": 336156, "epoch": 2000} {"train_loss": -11.978214263916016, "global_step": 336157, "epoch": 2000} {"train_loss": -11.781551361083984, "global_step": 336158, "epoch": 2000} {"train_loss": -11.950874328613281, "global_step": 336159, "epoch": 2000} {"train_loss": -12.026256561279297, "global_step": 336160, "epoch": 2000} {"train_loss": -12.141143798828125, "global_step": 336161, "epoch": 2000} {"train_loss": -12.4108304977417, "global_step": 336162, "epoch": 2000} {"train_loss": -12.197547912597656, "global_step": 336163, "epoch": 2000} {"train_loss": -12.148065567016602, "global_step": 336164, "epoch": 2000} {"train_loss": -12.158737182617188, "global_step": 336165, "epoch": 2000} {"train_loss": -12.337886810302734, "global_step": 336166, "epoch": 2000} {"train_loss": -11.774470176015582, "global_step": 336167, "epoch": 2000, "train/sim_max_reward_0": 0.6852289056713164, "train/sim_max_reward_1": 0.9216861404517904, "train/sim_max_reward_2": 0.029215113785663258, "train/sim_max_reward_3": 0.37044464692433504, "train/sim_max_reward_4": 0.997173758186454, "train/sim_max_reward_5": 0.6015238779691293, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.3852118204294461, "test/sim_max_reward_4400002": 0.5727817756817757, "test/sim_max_reward_4400003": 0.12479213911775688, "test/sim_max_reward_4400004": 0.42588875608733306, "test/sim_max_reward_4400005": 0.04996492853818785, "test/sim_max_reward_4400006": 0.9476942111950293, "test/sim_max_reward_4400007": 0.4904402382124439, "test/sim_max_reward_4400008": 0.553632248820065, "test/sim_max_reward_4400009": 0.40190513896096225, "test/sim_max_reward_4400010": 0.40747863509627236, "test/sim_max_reward_4400011": 0.9748291408990017, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.6693564702326067, "test/sim_max_reward_4400015": 0.9758680897323199, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.957936121866425, "test/sim_max_reward_4400019": 0.9854332401211182, "test/sim_max_reward_4400020": 0.00012085298095991483, "test/sim_max_reward_4400021": 0.6337306287166823, "test/sim_max_reward_4400022": 0.9707749983555592, "test/sim_max_reward_4400023": 0.1411189280384975, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.5220998287768255, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.3904312474058137, "test/sim_max_reward_4400028": 0.005620068987359156, "test/sim_max_reward_4400029": 0.5564844734811694, "test/sim_max_reward_4400030": 0.9770323419456451, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.6284020409137003, "test/sim_max_reward_4400034": 0.9483025414899632, "test/sim_max_reward_4400035": 0.28804602460025064, "test/sim_max_reward_4400036": 0.9841659563857091, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.29627210302387913, "test/sim_max_reward_4400039": 0.9648253981709737, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.16575744723544195, "test/sim_max_reward_4400042": 0.9872252199122512, "test/sim_max_reward_4400043": 0.9933709058090074, "test/sim_max_reward_4400044": 0.9817998564351873, "test/sim_max_reward_4400045": 0.4635891051528655, "test/sim_max_reward_4400046": 0.32551520858606253, "test/sim_max_reward_4400047": 0.9949373470696191, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.2856562056592552, "train/mean_score": 0.6008787404981147, "test/mean_score": 0.5685698336824684, "val_loss": 288560.46875, "train_action_mse_error": 1.3467789888381958} {"train_loss": -12.141018867492676, "global_step": 336168, "epoch": 2001} {"train_loss": -12.255205154418945, "global_step": 336169, "epoch": 2001} {"train_loss": -12.386392593383789, "global_step": 336170, "epoch": 2001} {"train_loss": -12.366657257080078, "global_step": 336171, "epoch": 2001} {"train_loss": -12.20182991027832, "global_step": 336172, "epoch": 2001} {"train_loss": -12.343982696533203, "global_step": 336173, "epoch": 2001} {"train_loss": -12.310431480407715, "global_step": 336174, "epoch": 2001} {"train_loss": -12.373594284057617, "global_step": 336175, "epoch": 2001} {"train_loss": -12.294036865234375, "global_step": 336176, "epoch": 2001} {"train_loss": -12.159164428710938, "global_step": 336177, "epoch": 2001} {"train_loss": -12.371052742004395, "global_step": 336178, "epoch": 2001} {"train_loss": -12.430952072143555, "global_step": 336179, "epoch": 2001} {"train_loss": -12.163156509399414, "global_step": 336180, "epoch": 2001} {"train_loss": -12.557981491088867, "global_step": 336181, "epoch": 2001} {"train_loss": -12.473217964172363, "global_step": 336182, "epoch": 2001} {"train_loss": -12.424213409423828, "global_step": 336183, "epoch": 2001} {"train_loss": -12.488201141357422, "global_step": 336184, "epoch": 2001} {"train_loss": -12.229153633117676, "global_step": 336185, "epoch": 2001} {"train_loss": -12.259387969970703, "global_step": 336186, "epoch": 2001} {"train_loss": -12.365192413330078, "global_step": 336187, "epoch": 2001} {"train_loss": -12.653701782226562, "global_step": 336188, "epoch": 2001} {"train_loss": -12.522029876708984, "global_step": 336189, "epoch": 2001} {"train_loss": -12.396627426147461, "global_step": 336190, "epoch": 2001} {"train_loss": -12.451149940490723, "global_step": 336191, "epoch": 2001} {"train_loss": -12.644308090209961, "global_step": 336192, "epoch": 2001} {"train_loss": -12.501483917236328, "global_step": 336193, "epoch": 2001} {"train_loss": -12.499323844909668, "global_step": 336194, "epoch": 2001} {"train_loss": -12.331002235412598, "global_step": 336195, "epoch": 2001} {"train_loss": -12.268001556396484, "global_step": 336196, "epoch": 2001} {"train_loss": -12.20269775390625, "global_step": 336197, "epoch": 2001} {"train_loss": -12.384283065795898, "global_step": 336198, "epoch": 2001} {"train_loss": -12.349973678588867, "global_step": 336199, "epoch": 2001} {"train_loss": -11.98536491394043, "global_step": 336200, "epoch": 2001} {"train_loss": -12.124055862426758, "global_step": 336201, "epoch": 2001} {"train_loss": -12.405194282531738, "global_step": 336202, "epoch": 2001} {"train_loss": -11.697999000549316, "global_step": 336203, "epoch": 2001} {"train_loss": -12.33242130279541, "global_step": 336204, "epoch": 2001} {"train_loss": -12.081409454345703, "global_step": 336205, "epoch": 2001} {"train_loss": -12.088669776916504, "global_step": 336206, "epoch": 2001} {"train_loss": -12.227601051330566, "global_step": 336207, "epoch": 2001} {"train_loss": -12.125799179077148, "global_step": 336208, "epoch": 2001} {"train_loss": -11.853506088256836, "global_step": 336209, "epoch": 2001} {"train_loss": -12.29139232635498, "global_step": 336210, "epoch": 2001} {"train_loss": -11.993907928466797, "global_step": 336211, "epoch": 2001} {"train_loss": -12.015993118286133, "global_step": 336212, "epoch": 2001} {"train_loss": -12.341856956481934, "global_step": 336213, "epoch": 2001} {"train_loss": -11.71137809753418, "global_step": 336214, "epoch": 2001} {"train_loss": -12.03993034362793, "global_step": 336215, "epoch": 2001} {"train_loss": -12.230316162109375, "global_step": 336216, "epoch": 2001} {"train_loss": -12.322237014770508, "global_step": 336217, "epoch": 2001} {"train_loss": -12.036231994628906, "global_step": 336218, "epoch": 2001} {"train_loss": -12.423538208007812, "global_step": 336219, "epoch": 2001} {"train_loss": -11.65907096862793, "global_step": 336220, "epoch": 2001} {"train_loss": -12.105537414550781, "global_step": 336221, "epoch": 2001} {"train_loss": -11.830477714538574, "global_step": 336222, "epoch": 2001} {"train_loss": -11.937532424926758, "global_step": 336223, "epoch": 2001} {"train_loss": -12.475258827209473, "global_step": 336224, "epoch": 2001} {"train_loss": -11.625468254089355, "global_step": 336225, "epoch": 2001} {"train_loss": -11.192110061645508, "global_step": 336226, "epoch": 2001} {"train_loss": -11.927302360534668, "global_step": 336227, "epoch": 2001} {"train_loss": -11.018058776855469, "global_step": 336228, "epoch": 2001} {"train_loss": -11.186797142028809, "global_step": 336229, "epoch": 2001} {"train_loss": -12.118825912475586, "global_step": 336230, "epoch": 2001} {"train_loss": -10.745171546936035, "global_step": 336231, "epoch": 2001} {"train_loss": -11.771661758422852, "global_step": 336232, "epoch": 2001} {"train_loss": -11.677593231201172, "global_step": 336233, "epoch": 2001} {"train_loss": -11.783756256103516, "global_step": 336234, "epoch": 2001} {"train_loss": -11.87148666381836, "global_step": 336235, "epoch": 2001} {"train_loss": -11.472524642944336, "global_step": 336236, "epoch": 2001} {"train_loss": -11.177943229675293, "global_step": 336237, "epoch": 2001} {"train_loss": -11.631811141967773, "global_step": 336238, "epoch": 2001} {"train_loss": -11.155538558959961, "global_step": 336239, "epoch": 2001} {"train_loss": -12.04404354095459, "global_step": 336240, "epoch": 2001} {"train_loss": -11.35075855255127, "global_step": 336241, "epoch": 2001} {"train_loss": -11.079919815063477, "global_step": 336242, "epoch": 2001} {"train_loss": -11.574109077453613, "global_step": 336243, "epoch": 2001} {"train_loss": -11.656587600708008, "global_step": 336244, "epoch": 2001} {"train_loss": -11.70716667175293, "global_step": 336245, "epoch": 2001} {"train_loss": -11.621713638305664, "global_step": 336246, "epoch": 2001} {"train_loss": -11.57597541809082, "global_step": 336247, "epoch": 2001} {"train_loss": -10.862548828125, "global_step": 336248, "epoch": 2001} {"train_loss": -10.482300758361816, "global_step": 336249, "epoch": 2001} {"train_loss": -11.906116485595703, "global_step": 336250, "epoch": 2001} {"train_loss": -11.129984855651855, "global_step": 336251, "epoch": 2001} {"train_loss": -11.77109146118164, "global_step": 336252, "epoch": 2001} {"train_loss": -10.885169982910156, "global_step": 336253, "epoch": 2001} {"train_loss": -11.44955825805664, "global_step": 336254, "epoch": 2001} {"train_loss": -10.60731315612793, "global_step": 336255, "epoch": 2001} {"train_loss": -11.953514099121094, "global_step": 336256, "epoch": 2001} {"train_loss": -11.289288520812988, "global_step": 336257, "epoch": 2001} {"train_loss": -12.169862747192383, "global_step": 336258, "epoch": 2001} {"train_loss": -11.542253494262695, "global_step": 336259, "epoch": 2001} {"train_loss": -11.621728897094727, "global_step": 336260, "epoch": 2001} {"train_loss": -11.93320083618164, "global_step": 336261, "epoch": 2001} {"train_loss": -11.242036819458008, "global_step": 336262, "epoch": 2001} {"train_loss": -12.106040000915527, "global_step": 336263, "epoch": 2001} {"train_loss": -11.643170356750488, "global_step": 336264, "epoch": 2001} {"train_loss": -12.095619201660156, "global_step": 336265, "epoch": 2001} {"train_loss": -12.086111068725586, "global_step": 336266, "epoch": 2001} {"train_loss": -12.098564147949219, "global_step": 336267, "epoch": 2001} {"train_loss": -12.125950813293457, "global_step": 336268, "epoch": 2001} {"train_loss": -12.156166076660156, "global_step": 336269, "epoch": 2001} {"train_loss": -12.278942108154297, "global_step": 336270, "epoch": 2001} {"train_loss": -12.260035514831543, "global_step": 336271, "epoch": 2001} {"train_loss": -12.220638275146484, "global_step": 336272, "epoch": 2001} {"train_loss": -12.188310623168945, "global_step": 336273, "epoch": 2001} {"train_loss": -12.315349578857422, "global_step": 336274, "epoch": 2001} {"train_loss": -12.297783851623535, "global_step": 336275, "epoch": 2001} {"train_loss": -12.203697204589844, "global_step": 336276, "epoch": 2001} {"train_loss": -12.395283699035645, "global_step": 336277, "epoch": 2001} {"train_loss": -12.436040878295898, "global_step": 336278, "epoch": 2001} {"train_loss": -11.990583419799805, "global_step": 336279, "epoch": 2001} {"train_loss": -12.386218070983887, "global_step": 336280, "epoch": 2001} {"train_loss": -12.105164527893066, "global_step": 336281, "epoch": 2001} {"train_loss": -11.972085952758789, "global_step": 336282, "epoch": 2001} {"train_loss": -12.140295028686523, "global_step": 336283, "epoch": 2001} {"train_loss": -12.107202529907227, "global_step": 336284, "epoch": 2001} {"train_loss": -11.653335571289062, "global_step": 336285, "epoch": 2001} {"train_loss": -12.130472183227539, "global_step": 336286, "epoch": 2001} {"train_loss": -12.127286911010742, "global_step": 336287, "epoch": 2001} {"train_loss": -12.349040985107422, "global_step": 336288, "epoch": 2001} {"train_loss": -12.175128936767578, "global_step": 336289, "epoch": 2001} {"train_loss": -12.130383491516113, "global_step": 336290, "epoch": 2001} {"train_loss": -11.758504867553711, "global_step": 336291, "epoch": 2001} {"train_loss": -12.274219512939453, "global_step": 336292, "epoch": 2001} {"train_loss": -12.032166481018066, "global_step": 336293, "epoch": 2001} {"train_loss": -12.079748153686523, "global_step": 336294, "epoch": 2001} {"train_loss": -12.16572380065918, "global_step": 336295, "epoch": 2001} {"train_loss": -12.22578239440918, "global_step": 336296, "epoch": 2001} {"train_loss": -11.82522201538086, "global_step": 336297, "epoch": 2001} {"train_loss": -12.26515007019043, "global_step": 336298, "epoch": 2001} {"train_loss": -12.143756866455078, "global_step": 336299, "epoch": 2001} {"train_loss": -12.099050521850586, "global_step": 336300, "epoch": 2001} {"train_loss": -11.914222717285156, "global_step": 336301, "epoch": 2001} {"train_loss": -12.290675163269043, "global_step": 336302, "epoch": 2001} {"train_loss": -12.511083602905273, "global_step": 336303, "epoch": 2001} {"train_loss": -12.29262924194336, "global_step": 336304, "epoch": 2001} {"train_loss": -12.309394836425781, "global_step": 336305, "epoch": 2001} {"train_loss": -12.78935432434082, "global_step": 336306, "epoch": 2001} {"train_loss": -11.957025527954102, "global_step": 336307, "epoch": 2001} {"train_loss": -12.401409149169922, "global_step": 336308, "epoch": 2001} {"train_loss": -12.216897964477539, "global_step": 336309, "epoch": 2001} {"train_loss": -12.417827606201172, "global_step": 336310, "epoch": 2001} {"train_loss": -12.282670021057129, "global_step": 336311, "epoch": 2001} {"train_loss": -12.51507568359375, "global_step": 336312, "epoch": 2001} {"train_loss": -12.17991828918457, "global_step": 336313, "epoch": 2001} {"train_loss": -12.363075256347656, "global_step": 336314, "epoch": 2001} {"train_loss": -12.41707992553711, "global_step": 336315, "epoch": 2001} {"train_loss": -12.584293365478516, "global_step": 336316, "epoch": 2001} {"train_loss": -12.32043170928955, "global_step": 336317, "epoch": 2001} {"train_loss": -12.533430099487305, "global_step": 336318, "epoch": 2001} {"train_loss": -12.398242950439453, "global_step": 336319, "epoch": 2001} {"train_loss": -12.22370719909668, "global_step": 336320, "epoch": 2001} {"train_loss": -12.440505981445312, "global_step": 336321, "epoch": 2001} {"train_loss": -12.468846321105957, "global_step": 336322, "epoch": 2001} {"train_loss": -12.053301811218262, "global_step": 336323, "epoch": 2001} {"train_loss": -12.048550605773926, "global_step": 336324, "epoch": 2001} {"train_loss": -11.214927673339844, "global_step": 336325, "epoch": 2001} {"train_loss": -11.682867050170898, "global_step": 336326, "epoch": 2001} {"train_loss": -12.271114349365234, "global_step": 336327, "epoch": 2001} {"train_loss": -11.438009262084961, "global_step": 336328, "epoch": 2001} {"train_loss": -10.514537811279297, "global_step": 336329, "epoch": 2001} {"train_loss": -11.456405639648438, "global_step": 336330, "epoch": 2001} {"train_loss": -11.504488945007324, "global_step": 336331, "epoch": 2001} {"train_loss": -11.089390754699707, "global_step": 336332, "epoch": 2001} {"train_loss": -11.803411483764648, "global_step": 336333, "epoch": 2001} {"train_loss": -12.115158081054688, "global_step": 336334, "epoch": 2001} {"train_loss": -12.00951411610558, "global_step": 336335, "epoch": 2001, "val_loss": 288032.59375} {"train_loss": -11.436546325683594, "global_step": 336336, "epoch": 2002} {"train_loss": -12.02784538269043, "global_step": 336337, "epoch": 2002} {"train_loss": -11.338813781738281, "global_step": 336338, "epoch": 2002} {"train_loss": -11.003077507019043, "global_step": 336339, "epoch": 2002} {"train_loss": -10.910141944885254, "global_step": 336340, "epoch": 2002} {"train_loss": -11.838085174560547, "global_step": 336341, "epoch": 2002} {"train_loss": -11.42280387878418, "global_step": 336342, "epoch": 2002} {"train_loss": -12.332822799682617, "global_step": 336343, "epoch": 2002} {"train_loss": -11.502388954162598, "global_step": 336344, "epoch": 2002} {"train_loss": -11.75202751159668, "global_step": 336345, "epoch": 2002} {"train_loss": -11.836856842041016, "global_step": 336346, "epoch": 2002} {"train_loss": -11.999393463134766, "global_step": 336347, "epoch": 2002} {"train_loss": -11.746953964233398, "global_step": 336348, "epoch": 2002} {"train_loss": -12.044995307922363, "global_step": 336349, "epoch": 2002} {"train_loss": -12.053985595703125, "global_step": 336350, "epoch": 2002} {"train_loss": -11.815876007080078, "global_step": 336351, "epoch": 2002} {"train_loss": -12.255782127380371, "global_step": 336352, "epoch": 2002} {"train_loss": -12.230313301086426, "global_step": 336353, "epoch": 2002} {"train_loss": -12.106409072875977, "global_step": 336354, "epoch": 2002} {"train_loss": -11.543006896972656, "global_step": 336355, "epoch": 2002} {"train_loss": -12.288578033447266, "global_step": 336356, "epoch": 2002} {"train_loss": -11.822839736938477, "global_step": 336357, "epoch": 2002} {"train_loss": -11.624019622802734, "global_step": 336358, "epoch": 2002} {"train_loss": -12.204429626464844, "global_step": 336359, "epoch": 2002} {"train_loss": -12.053682327270508, "global_step": 336360, "epoch": 2002} {"train_loss": -11.291997909545898, "global_step": 336361, "epoch": 2002} {"train_loss": -12.284306526184082, "global_step": 336362, "epoch": 2002} {"train_loss": -11.62222671508789, "global_step": 336363, "epoch": 2002} {"train_loss": -11.614006042480469, "global_step": 336364, "epoch": 2002} {"train_loss": -11.696207046508789, "global_step": 336365, "epoch": 2002} {"train_loss": -12.168201446533203, "global_step": 336366, "epoch": 2002} {"train_loss": -12.161075592041016, "global_step": 336367, "epoch": 2002} {"train_loss": -12.015338897705078, "global_step": 336368, "epoch": 2002} {"train_loss": -11.415433883666992, "global_step": 336369, "epoch": 2002} {"train_loss": -12.101885795593262, "global_step": 336370, "epoch": 2002} {"train_loss": -12.137645721435547, "global_step": 336371, "epoch": 2002} {"train_loss": -12.235855102539062, "global_step": 336372, "epoch": 2002} {"train_loss": -12.35258960723877, "global_step": 336373, "epoch": 2002} {"train_loss": -12.144979476928711, "global_step": 336374, "epoch": 2002} {"train_loss": -12.265144348144531, "global_step": 336375, "epoch": 2002} {"train_loss": -12.374155044555664, "global_step": 336376, "epoch": 2002} {"train_loss": -11.9375638961792, "global_step": 336377, "epoch": 2002} {"train_loss": -12.295578002929688, "global_step": 336378, "epoch": 2002} {"train_loss": -12.230203628540039, "global_step": 336379, "epoch": 2002} {"train_loss": -12.140746116638184, "global_step": 336380, "epoch": 2002} {"train_loss": -11.475322723388672, "global_step": 336381, "epoch": 2002} {"train_loss": -12.244213104248047, "global_step": 336382, "epoch": 2002} {"train_loss": -11.876334190368652, "global_step": 336383, "epoch": 2002} {"train_loss": -12.051254272460938, "global_step": 336384, "epoch": 2002} {"train_loss": -11.816868782043457, "global_step": 336385, "epoch": 2002} {"train_loss": -11.281402587890625, "global_step": 336386, "epoch": 2002} {"train_loss": -12.22570514678955, "global_step": 336387, "epoch": 2002} {"train_loss": -12.18621826171875, "global_step": 336388, "epoch": 2002} {"train_loss": -11.936716079711914, "global_step": 336389, "epoch": 2002} {"train_loss": -12.126774787902832, "global_step": 336390, "epoch": 2002} {"train_loss": -11.955036163330078, "global_step": 336391, "epoch": 2002} {"train_loss": -11.478705406188965, "global_step": 336392, "epoch": 2002} {"train_loss": -11.866021156311035, "global_step": 336393, "epoch": 2002} {"train_loss": -11.04327392578125, "global_step": 336394, "epoch": 2002} {"train_loss": -12.021574974060059, "global_step": 336395, "epoch": 2002} {"train_loss": -11.611328125, "global_step": 336396, "epoch": 2002} {"train_loss": -11.74182415008545, "global_step": 336397, "epoch": 2002} {"train_loss": -11.370610237121582, "global_step": 336398, "epoch": 2002} {"train_loss": -11.53514289855957, "global_step": 336399, "epoch": 2002} {"train_loss": -12.217314720153809, "global_step": 336400, "epoch": 2002} {"train_loss": -11.114290237426758, "global_step": 336401, "epoch": 2002} {"train_loss": -12.1460542678833, "global_step": 336402, "epoch": 2002} {"train_loss": -11.2593412399292, "global_step": 336403, "epoch": 2002} {"train_loss": -11.591143608093262, "global_step": 336404, "epoch": 2002} {"train_loss": -12.028133392333984, "global_step": 336405, "epoch": 2002} {"train_loss": -11.1104736328125, "global_step": 336406, "epoch": 2002} {"train_loss": -12.267207145690918, "global_step": 336407, "epoch": 2002} {"train_loss": -11.800329208374023, "global_step": 336408, "epoch": 2002} {"train_loss": -11.288994789123535, "global_step": 336409, "epoch": 2002} {"train_loss": -12.088130950927734, "global_step": 336410, "epoch": 2002} {"train_loss": -11.681975364685059, "global_step": 336411, "epoch": 2002} {"train_loss": -11.677765846252441, "global_step": 336412, "epoch": 2002} {"train_loss": -11.976238250732422, "global_step": 336413, "epoch": 2002} {"train_loss": -11.538082122802734, "global_step": 336414, "epoch": 2002} {"train_loss": -12.062568664550781, "global_step": 336415, "epoch": 2002} {"train_loss": -11.828903198242188, "global_step": 336416, "epoch": 2002} {"train_loss": -11.992464065551758, "global_step": 336417, "epoch": 2002} {"train_loss": -12.02397346496582, "global_step": 336418, "epoch": 2002} {"train_loss": -12.110645294189453, "global_step": 336419, "epoch": 2002} {"train_loss": -11.985292434692383, "global_step": 336420, "epoch": 2002} {"train_loss": -11.766837120056152, "global_step": 336421, "epoch": 2002} {"train_loss": -12.404268264770508, "global_step": 336422, "epoch": 2002} {"train_loss": -11.947250366210938, "global_step": 336423, "epoch": 2002} {"train_loss": -12.099678039550781, "global_step": 336424, "epoch": 2002} {"train_loss": -11.846308708190918, "global_step": 336425, "epoch": 2002} {"train_loss": -11.976146697998047, "global_step": 336426, "epoch": 2002} {"train_loss": -11.874195098876953, "global_step": 336427, "epoch": 2002} {"train_loss": -12.206615447998047, "global_step": 336428, "epoch": 2002} {"train_loss": -12.389137268066406, "global_step": 336429, "epoch": 2002} {"train_loss": -12.324352264404297, "global_step": 336430, "epoch": 2002} {"train_loss": -12.188159942626953, "global_step": 336431, "epoch": 2002} {"train_loss": -12.291196823120117, "global_step": 336432, "epoch": 2002} {"train_loss": -12.255760192871094, "global_step": 336433, "epoch": 2002} {"train_loss": -12.449113845825195, "global_step": 336434, "epoch": 2002} {"train_loss": -12.1876220703125, "global_step": 336435, "epoch": 2002} {"train_loss": -12.201719284057617, "global_step": 336436, "epoch": 2002} {"train_loss": -12.248003005981445, "global_step": 336437, "epoch": 2002} {"train_loss": -12.152182579040527, "global_step": 336438, "epoch": 2002} {"train_loss": -12.04583740234375, "global_step": 336439, "epoch": 2002} {"train_loss": -12.092901229858398, "global_step": 336440, "epoch": 2002} {"train_loss": -11.91181755065918, "global_step": 336441, "epoch": 2002} {"train_loss": -11.75891399383545, "global_step": 336442, "epoch": 2002} {"train_loss": -11.624025344848633, "global_step": 336443, "epoch": 2002} {"train_loss": -11.457019805908203, "global_step": 336444, "epoch": 2002} {"train_loss": -11.734869003295898, "global_step": 336445, "epoch": 2002} {"train_loss": -11.897830963134766, "global_step": 336446, "epoch": 2002} {"train_loss": -10.875547409057617, "global_step": 336447, "epoch": 2002} {"train_loss": -10.565284729003906, "global_step": 336448, "epoch": 2002} {"train_loss": -11.173233032226562, "global_step": 336449, "epoch": 2002} {"train_loss": -11.867796897888184, "global_step": 336450, "epoch": 2002} {"train_loss": -11.725120544433594, "global_step": 336451, "epoch": 2002} {"train_loss": -10.521951675415039, "global_step": 336452, "epoch": 2002} {"train_loss": -11.593023300170898, "global_step": 336453, "epoch": 2002} {"train_loss": -11.279850959777832, "global_step": 336454, "epoch": 2002} {"train_loss": -11.322700500488281, "global_step": 336455, "epoch": 2002} {"train_loss": -11.276796340942383, "global_step": 336456, "epoch": 2002} {"train_loss": -11.858007431030273, "global_step": 336457, "epoch": 2002} {"train_loss": -11.74819564819336, "global_step": 336458, "epoch": 2002} {"train_loss": -11.499433517456055, "global_step": 336459, "epoch": 2002} {"train_loss": -12.035494804382324, "global_step": 336460, "epoch": 2002} {"train_loss": -11.775620460510254, "global_step": 336461, "epoch": 2002} {"train_loss": -11.423002243041992, "global_step": 336462, "epoch": 2002} {"train_loss": -11.870346069335938, "global_step": 336463, "epoch": 2002} {"train_loss": -11.773585319519043, "global_step": 336464, "epoch": 2002} {"train_loss": -11.577016830444336, "global_step": 336465, "epoch": 2002} {"train_loss": -11.82957649230957, "global_step": 336466, "epoch": 2002} {"train_loss": -11.600445747375488, "global_step": 336467, "epoch": 2002} {"train_loss": -11.78233814239502, "global_step": 336468, "epoch": 2002} {"train_loss": -11.283000946044922, "global_step": 336469, "epoch": 2002} {"train_loss": -11.916254043579102, "global_step": 336470, "epoch": 2002} {"train_loss": -11.908687591552734, "global_step": 336471, "epoch": 2002} {"train_loss": -11.674522399902344, "global_step": 336472, "epoch": 2002} {"train_loss": -11.85223388671875, "global_step": 336473, "epoch": 2002} {"train_loss": -11.391996383666992, "global_step": 336474, "epoch": 2002} {"train_loss": -11.610525131225586, "global_step": 336475, "epoch": 2002} {"train_loss": -11.575434684753418, "global_step": 336476, "epoch": 2002} {"train_loss": -11.925321578979492, "global_step": 336477, "epoch": 2002} {"train_loss": -11.684974670410156, "global_step": 336478, "epoch": 2002} {"train_loss": -12.017599105834961, "global_step": 336479, "epoch": 2002} {"train_loss": -11.94765853881836, "global_step": 336480, "epoch": 2002} {"train_loss": -11.732030868530273, "global_step": 336481, "epoch": 2002} {"train_loss": -11.90876579284668, "global_step": 336482, "epoch": 2002} {"train_loss": -12.26462459564209, "global_step": 336483, "epoch": 2002} {"train_loss": -11.663579940795898, "global_step": 336484, "epoch": 2002} {"train_loss": -12.09823989868164, "global_step": 336485, "epoch": 2002} {"train_loss": -11.564508438110352, "global_step": 336486, "epoch": 2002} {"train_loss": -12.107393264770508, "global_step": 336487, "epoch": 2002} {"train_loss": -11.937061309814453, "global_step": 336488, "epoch": 2002} {"train_loss": -11.86905288696289, "global_step": 336489, "epoch": 2002} {"train_loss": -12.075920104980469, "global_step": 336490, "epoch": 2002} {"train_loss": -11.934874534606934, "global_step": 336491, "epoch": 2002} {"train_loss": -12.174776077270508, "global_step": 336492, "epoch": 2002} {"train_loss": -11.917776107788086, "global_step": 336493, "epoch": 2002} {"train_loss": -11.65371322631836, "global_step": 336494, "epoch": 2002} {"train_loss": -11.626032829284668, "global_step": 336495, "epoch": 2002} {"train_loss": -11.840188980102539, "global_step": 336496, "epoch": 2002} {"train_loss": -11.43337631225586, "global_step": 336497, "epoch": 2002} {"train_loss": -12.001724243164062, "global_step": 336498, "epoch": 2002} {"train_loss": -11.533208847045898, "global_step": 336499, "epoch": 2002} {"train_loss": -11.556681632995605, "global_step": 336500, "epoch": 2002} {"train_loss": -12.180843353271484, "global_step": 336501, "epoch": 2002} {"train_loss": -11.433899879455566, "global_step": 336502, "epoch": 2002} {"train_loss": -11.82512438864935, "global_step": 336503, "epoch": 2002, "val_loss": 288701.625} {"train_loss": -11.279614448547363, "global_step": 336504, "epoch": 2003} {"train_loss": -12.118595123291016, "global_step": 336505, "epoch": 2003} {"train_loss": -11.883315086364746, "global_step": 336506, "epoch": 2003} {"train_loss": -12.091545104980469, "global_step": 336507, "epoch": 2003} {"train_loss": -11.857137680053711, "global_step": 336508, "epoch": 2003} {"train_loss": -11.938876152038574, "global_step": 336509, "epoch": 2003} {"train_loss": -11.886667251586914, "global_step": 336510, "epoch": 2003} {"train_loss": -12.277048110961914, "global_step": 336511, "epoch": 2003} {"train_loss": -11.893854141235352, "global_step": 336512, "epoch": 2003} {"train_loss": -12.247964859008789, "global_step": 336513, "epoch": 2003} {"train_loss": -11.869277000427246, "global_step": 336514, "epoch": 2003} {"train_loss": -11.901329040527344, "global_step": 336515, "epoch": 2003} {"train_loss": -11.969232559204102, "global_step": 336516, "epoch": 2003} {"train_loss": -11.90668773651123, "global_step": 336517, "epoch": 2003} {"train_loss": -11.671329498291016, "global_step": 336518, "epoch": 2003} {"train_loss": -11.749261856079102, "global_step": 336519, "epoch": 2003} {"train_loss": -11.036270141601562, "global_step": 336520, "epoch": 2003} {"train_loss": -11.73269271850586, "global_step": 336521, "epoch": 2003} {"train_loss": -11.279422760009766, "global_step": 336522, "epoch": 2003} {"train_loss": -10.861379623413086, "global_step": 336523, "epoch": 2003} {"train_loss": -9.369035720825195, "global_step": 336524, "epoch": 2003} {"train_loss": -11.406272888183594, "global_step": 336525, "epoch": 2003} {"train_loss": -10.764581680297852, "global_step": 336526, "epoch": 2003} {"train_loss": -11.153324127197266, "global_step": 336527, "epoch": 2003} {"train_loss": -10.839972496032715, "global_step": 336528, "epoch": 2003} {"train_loss": -11.747390747070312, "global_step": 336529, "epoch": 2003} {"train_loss": -11.563705444335938, "global_step": 336530, "epoch": 2003} {"train_loss": -11.566267967224121, "global_step": 336531, "epoch": 2003} {"train_loss": -11.83207893371582, "global_step": 336532, "epoch": 2003} {"train_loss": -11.530057907104492, "global_step": 336533, "epoch": 2003} {"train_loss": -11.78632926940918, "global_step": 336534, "epoch": 2003} {"train_loss": -11.353971481323242, "global_step": 336535, "epoch": 2003} {"train_loss": -11.386730194091797, "global_step": 336536, "epoch": 2003} {"train_loss": -11.248382568359375, "global_step": 336537, "epoch": 2003} {"train_loss": -11.475545883178711, "global_step": 336538, "epoch": 2003} {"train_loss": -11.506280899047852, "global_step": 336539, "epoch": 2003} {"train_loss": -11.423677444458008, "global_step": 336540, "epoch": 2003} {"train_loss": -11.594063758850098, "global_step": 336541, "epoch": 2003} {"train_loss": -10.859288215637207, "global_step": 336542, "epoch": 2003} {"train_loss": -11.49001407623291, "global_step": 336543, "epoch": 2003} {"train_loss": -10.295178413391113, "global_step": 336544, "epoch": 2003} {"train_loss": -11.710105895996094, "global_step": 336545, "epoch": 2003} {"train_loss": -10.643465042114258, "global_step": 336546, "epoch": 2003} {"train_loss": -11.393953323364258, "global_step": 336547, "epoch": 2003} {"train_loss": -11.235272407531738, "global_step": 336548, "epoch": 2003} {"train_loss": -11.248527526855469, "global_step": 336549, "epoch": 2003} {"train_loss": -10.69411563873291, "global_step": 336550, "epoch": 2003} {"train_loss": -11.51415729522705, "global_step": 336551, "epoch": 2003} {"train_loss": -11.245447158813477, "global_step": 336552, "epoch": 2003} {"train_loss": -11.309389114379883, "global_step": 336553, "epoch": 2003} {"train_loss": -11.843683242797852, "global_step": 336554, "epoch": 2003} {"train_loss": -11.463229179382324, "global_step": 336555, "epoch": 2003} {"train_loss": -11.966072082519531, "global_step": 336556, "epoch": 2003} {"train_loss": -11.592697143554688, "global_step": 336557, "epoch": 2003} {"train_loss": -11.631772994995117, "global_step": 336558, "epoch": 2003} {"train_loss": -12.102502822875977, "global_step": 336559, "epoch": 2003} {"train_loss": -11.637958526611328, "global_step": 336560, "epoch": 2003} {"train_loss": -11.834033966064453, "global_step": 336561, "epoch": 2003} {"train_loss": -11.819822311401367, "global_step": 336562, "epoch": 2003} {"train_loss": -11.933799743652344, "global_step": 336563, "epoch": 2003} {"train_loss": -11.742820739746094, "global_step": 336564, "epoch": 2003} {"train_loss": -11.830012321472168, "global_step": 336565, "epoch": 2003} {"train_loss": -12.148765563964844, "global_step": 336566, "epoch": 2003} {"train_loss": -11.893951416015625, "global_step": 336567, "epoch": 2003} {"train_loss": -12.217428207397461, "global_step": 336568, "epoch": 2003} {"train_loss": -12.013187408447266, "global_step": 336569, "epoch": 2003} {"train_loss": -12.222967147827148, "global_step": 336570, "epoch": 2003} {"train_loss": -12.14330005645752, "global_step": 336571, "epoch": 2003} {"train_loss": -12.334184646606445, "global_step": 336572, "epoch": 2003} {"train_loss": -12.150602340698242, "global_step": 336573, "epoch": 2003} {"train_loss": -12.170368194580078, "global_step": 336574, "epoch": 2003} {"train_loss": -12.20318603515625, "global_step": 336575, "epoch": 2003} {"train_loss": -12.474211692810059, "global_step": 336576, "epoch": 2003} {"train_loss": -12.350790023803711, "global_step": 336577, "epoch": 2003} {"train_loss": -12.311819076538086, "global_step": 336578, "epoch": 2003} {"train_loss": -12.270697593688965, "global_step": 336579, "epoch": 2003} {"train_loss": -12.411870002746582, "global_step": 336580, "epoch": 2003} {"train_loss": -12.534025192260742, "global_step": 336581, "epoch": 2003} {"train_loss": -12.409947395324707, "global_step": 336582, "epoch": 2003} {"train_loss": -12.169685363769531, "global_step": 336583, "epoch": 2003} {"train_loss": -12.453658103942871, "global_step": 336584, "epoch": 2003} {"train_loss": -12.311274528503418, "global_step": 336585, "epoch": 2003} {"train_loss": -12.479398727416992, "global_step": 336586, "epoch": 2003} {"train_loss": -12.248798370361328, "global_step": 336587, "epoch": 2003} {"train_loss": -12.37048625946045, "global_step": 336588, "epoch": 2003} {"train_loss": -12.392431259155273, "global_step": 336589, "epoch": 2003} {"train_loss": -12.289196014404297, "global_step": 336590, "epoch": 2003} {"train_loss": -12.46898078918457, "global_step": 336591, "epoch": 2003} {"train_loss": -12.472713470458984, "global_step": 336592, "epoch": 2003} {"train_loss": -12.197784423828125, "global_step": 336593, "epoch": 2003} {"train_loss": -12.653970718383789, "global_step": 336594, "epoch": 2003} {"train_loss": -12.445924758911133, "global_step": 336595, "epoch": 2003} {"train_loss": -12.493204116821289, "global_step": 336596, "epoch": 2003} {"train_loss": -12.494489669799805, "global_step": 336597, "epoch": 2003} {"train_loss": -12.358865737915039, "global_step": 336598, "epoch": 2003} {"train_loss": -12.626252174377441, "global_step": 336599, "epoch": 2003} {"train_loss": -12.37509536743164, "global_step": 336600, "epoch": 2003} {"train_loss": -12.492185592651367, "global_step": 336601, "epoch": 2003} {"train_loss": -12.55674934387207, "global_step": 336602, "epoch": 2003} {"train_loss": -12.499923706054688, "global_step": 336603, "epoch": 2003} {"train_loss": -12.45655632019043, "global_step": 336604, "epoch": 2003} {"train_loss": -12.474466323852539, "global_step": 336605, "epoch": 2003} {"train_loss": -12.444632530212402, "global_step": 336606, "epoch": 2003} {"train_loss": -12.303370475769043, "global_step": 336607, "epoch": 2003} {"train_loss": -12.328563690185547, "global_step": 336608, "epoch": 2003} {"train_loss": -12.388670921325684, "global_step": 336609, "epoch": 2003} {"train_loss": -12.152647972106934, "global_step": 336610, "epoch": 2003} {"train_loss": -12.372150421142578, "global_step": 336611, "epoch": 2003} {"train_loss": -12.255314826965332, "global_step": 336612, "epoch": 2003} {"train_loss": -12.540623664855957, "global_step": 336613, "epoch": 2003} {"train_loss": -12.455724716186523, "global_step": 336614, "epoch": 2003} {"train_loss": -12.390786170959473, "global_step": 336615, "epoch": 2003} {"train_loss": -12.368943214416504, "global_step": 336616, "epoch": 2003} {"train_loss": -12.294488906860352, "global_step": 336617, "epoch": 2003} {"train_loss": -12.254327774047852, "global_step": 336618, "epoch": 2003} {"train_loss": -12.311365127563477, "global_step": 336619, "epoch": 2003} {"train_loss": -12.288734436035156, "global_step": 336620, "epoch": 2003} {"train_loss": -12.425045013427734, "global_step": 336621, "epoch": 2003} {"train_loss": -12.392730712890625, "global_step": 336622, "epoch": 2003} {"train_loss": -12.454444885253906, "global_step": 336623, "epoch": 2003} {"train_loss": -12.34256362915039, "global_step": 336624, "epoch": 2003} {"train_loss": -12.291122436523438, "global_step": 336625, "epoch": 2003} {"train_loss": -12.43301010131836, "global_step": 336626, "epoch": 2003} {"train_loss": -12.385757446289062, "global_step": 336627, "epoch": 2003} {"train_loss": -11.90037727355957, "global_step": 336628, "epoch": 2003} {"train_loss": -12.537004470825195, "global_step": 336629, "epoch": 2003} {"train_loss": -12.089890480041504, "global_step": 336630, "epoch": 2003} {"train_loss": -12.40318489074707, "global_step": 336631, "epoch": 2003} {"train_loss": -11.937762260437012, "global_step": 336632, "epoch": 2003} {"train_loss": -12.430731773376465, "global_step": 336633, "epoch": 2003} {"train_loss": -12.424010276794434, "global_step": 336634, "epoch": 2003} {"train_loss": -12.664651870727539, "global_step": 336635, "epoch": 2003} {"train_loss": -12.511629104614258, "global_step": 336636, "epoch": 2003} {"train_loss": -12.457386016845703, "global_step": 336637, "epoch": 2003} {"train_loss": -12.0296630859375, "global_step": 336638, "epoch": 2003} {"train_loss": -11.82160758972168, "global_step": 336639, "epoch": 2003} {"train_loss": -12.331594467163086, "global_step": 336640, "epoch": 2003} {"train_loss": -12.25300407409668, "global_step": 336641, "epoch": 2003} {"train_loss": -12.526914596557617, "global_step": 336642, "epoch": 2003} {"train_loss": -11.846336364746094, "global_step": 336643, "epoch": 2003} {"train_loss": -11.48796272277832, "global_step": 336644, "epoch": 2003} {"train_loss": -11.156997680664062, "global_step": 336645, "epoch": 2003} {"train_loss": -11.842584609985352, "global_step": 336646, "epoch": 2003} {"train_loss": -12.010021209716797, "global_step": 336647, "epoch": 2003} {"train_loss": -11.670063972473145, "global_step": 336648, "epoch": 2003} {"train_loss": -9.954635620117188, "global_step": 336649, "epoch": 2003} {"train_loss": -10.927236557006836, "global_step": 336650, "epoch": 2003} {"train_loss": -9.187660217285156, "global_step": 336651, "epoch": 2003} {"train_loss": -7.922601222991943, "global_step": 336652, "epoch": 2003} {"train_loss": -7.885899543762207, "global_step": 336653, "epoch": 2003} {"train_loss": -9.136474609375, "global_step": 336654, "epoch": 2003} {"train_loss": -8.06275749206543, "global_step": 336655, "epoch": 2003} {"train_loss": -7.709016799926758, "global_step": 336656, "epoch": 2003} {"train_loss": -8.133674621582031, "global_step": 336657, "epoch": 2003} {"train_loss": -9.196249008178711, "global_step": 336658, "epoch": 2003} {"train_loss": -9.63250732421875, "global_step": 336659, "epoch": 2003} {"train_loss": -10.357428550720215, "global_step": 336660, "epoch": 2003} {"train_loss": -11.30161190032959, "global_step": 336661, "epoch": 2003} {"train_loss": -11.100940704345703, "global_step": 336662, "epoch": 2003} {"train_loss": -10.942447662353516, "global_step": 336663, "epoch": 2003} {"train_loss": -10.793365478515625, "global_step": 336664, "epoch": 2003} {"train_loss": -10.938200950622559, "global_step": 336665, "epoch": 2003} {"train_loss": -11.351561546325684, "global_step": 336666, "epoch": 2003} {"train_loss": -10.829465866088867, "global_step": 336667, "epoch": 2003} {"train_loss": -11.428009033203125, "global_step": 336668, "epoch": 2003} {"train_loss": -11.267779350280762, "global_step": 336669, "epoch": 2003} {"train_loss": -11.750591278076172, "global_step": 336670, "epoch": 2003} {"train_loss": -11.700384245032357, "global_step": 336671, "epoch": 2003, "val_loss": 275509.34375} {"train_loss": -11.544618606567383, "global_step": 336672, "epoch": 2004} {"train_loss": -11.23081111907959, "global_step": 336673, "epoch": 2004} {"train_loss": -11.519718170166016, "global_step": 336674, "epoch": 2004} {"train_loss": -11.742424011230469, "global_step": 336675, "epoch": 2004} {"train_loss": -11.977293014526367, "global_step": 336676, "epoch": 2004} {"train_loss": -11.521612167358398, "global_step": 336677, "epoch": 2004} {"train_loss": -11.726218223571777, "global_step": 336678, "epoch": 2004} {"train_loss": -11.72286605834961, "global_step": 336679, "epoch": 2004} {"train_loss": -11.501291275024414, "global_step": 336680, "epoch": 2004} {"train_loss": -11.022676467895508, "global_step": 336681, "epoch": 2004} {"train_loss": -11.205185890197754, "global_step": 336682, "epoch": 2004} {"train_loss": -11.656532287597656, "global_step": 336683, "epoch": 2004} {"train_loss": -11.515643119812012, "global_step": 336684, "epoch": 2004} {"train_loss": -11.751609802246094, "global_step": 336685, "epoch": 2004} {"train_loss": -11.758146286010742, "global_step": 336686, "epoch": 2004} {"train_loss": -11.042861938476562, "global_step": 336687, "epoch": 2004} {"train_loss": -11.941232681274414, "global_step": 336688, "epoch": 2004} {"train_loss": -11.544435501098633, "global_step": 336689, "epoch": 2004} {"train_loss": -11.274972915649414, "global_step": 336690, "epoch": 2004} {"train_loss": -11.786739349365234, "global_step": 336691, "epoch": 2004} {"train_loss": -11.805444717407227, "global_step": 336692, "epoch": 2004} {"train_loss": -11.811986923217773, "global_step": 336693, "epoch": 2004} {"train_loss": -11.65695571899414, "global_step": 336694, "epoch": 2004} {"train_loss": -11.626686096191406, "global_step": 336695, "epoch": 2004} {"train_loss": -11.618359565734863, "global_step": 336696, "epoch": 2004} {"train_loss": -11.84565544128418, "global_step": 336697, "epoch": 2004} {"train_loss": -11.851003646850586, "global_step": 336698, "epoch": 2004} {"train_loss": -11.82194709777832, "global_step": 336699, "epoch": 2004} {"train_loss": -12.024457931518555, "global_step": 336700, "epoch": 2004} {"train_loss": -11.651323318481445, "global_step": 336701, "epoch": 2004} {"train_loss": -12.043024063110352, "global_step": 336702, "epoch": 2004} {"train_loss": -12.114274978637695, "global_step": 336703, "epoch": 2004} {"train_loss": -11.620906829833984, "global_step": 336704, "epoch": 2004} {"train_loss": -12.122552871704102, "global_step": 336705, "epoch": 2004} {"train_loss": -11.667728424072266, "global_step": 336706, "epoch": 2004} {"train_loss": -12.119454383850098, "global_step": 336707, "epoch": 2004} {"train_loss": -11.929008483886719, "global_step": 336708, "epoch": 2004} {"train_loss": -12.027331352233887, "global_step": 336709, "epoch": 2004} {"train_loss": -11.86400318145752, "global_step": 336710, "epoch": 2004} {"train_loss": -12.11091423034668, "global_step": 336711, "epoch": 2004} {"train_loss": -11.920360565185547, "global_step": 336712, "epoch": 2004} {"train_loss": -12.16884708404541, "global_step": 336713, "epoch": 2004} {"train_loss": -12.074872970581055, "global_step": 336714, "epoch": 2004} {"train_loss": -12.038248062133789, "global_step": 336715, "epoch": 2004} {"train_loss": -11.928329467773438, "global_step": 336716, "epoch": 2004} {"train_loss": -12.028925895690918, "global_step": 336717, "epoch": 2004} {"train_loss": -11.68946647644043, "global_step": 336718, "epoch": 2004} {"train_loss": -12.490110397338867, "global_step": 336719, "epoch": 2004} {"train_loss": -11.742262840270996, "global_step": 336720, "epoch": 2004} {"train_loss": -12.104446411132812, "global_step": 336721, "epoch": 2004} {"train_loss": -11.982734680175781, "global_step": 336722, "epoch": 2004} {"train_loss": -12.275707244873047, "global_step": 336723, "epoch": 2004} {"train_loss": -12.154519081115723, "global_step": 336724, "epoch": 2004} {"train_loss": -11.99063491821289, "global_step": 336725, "epoch": 2004} {"train_loss": -12.023992538452148, "global_step": 336726, "epoch": 2004} {"train_loss": -11.904743194580078, "global_step": 336727, "epoch": 2004} {"train_loss": -12.295879364013672, "global_step": 336728, "epoch": 2004} {"train_loss": -12.150859832763672, "global_step": 336729, "epoch": 2004} {"train_loss": -12.086881637573242, "global_step": 336730, "epoch": 2004} {"train_loss": -12.07761001586914, "global_step": 336731, "epoch": 2004} {"train_loss": -12.232479095458984, "global_step": 336732, "epoch": 2004} {"train_loss": -12.174820899963379, "global_step": 336733, "epoch": 2004} {"train_loss": -12.175080299377441, "global_step": 336734, "epoch": 2004} {"train_loss": -12.116955757141113, "global_step": 336735, "epoch": 2004} {"train_loss": -12.372882843017578, "global_step": 336736, "epoch": 2004} {"train_loss": -12.280967712402344, "global_step": 336737, "epoch": 2004} {"train_loss": -12.550873756408691, "global_step": 336738, "epoch": 2004} {"train_loss": -12.262324333190918, "global_step": 336739, "epoch": 2004} {"train_loss": -12.45051383972168, "global_step": 336740, "epoch": 2004} {"train_loss": -12.376428604125977, "global_step": 336741, "epoch": 2004} {"train_loss": -12.297407150268555, "global_step": 336742, "epoch": 2004} {"train_loss": -12.429634094238281, "global_step": 336743, "epoch": 2004} {"train_loss": -12.255422592163086, "global_step": 336744, "epoch": 2004} {"train_loss": -12.296899795532227, "global_step": 336745, "epoch": 2004} {"train_loss": -12.382222175598145, "global_step": 336746, "epoch": 2004} {"train_loss": -12.375936508178711, "global_step": 336747, "epoch": 2004} {"train_loss": -12.263915061950684, "global_step": 336748, "epoch": 2004} {"train_loss": -12.414732933044434, "global_step": 336749, "epoch": 2004} {"train_loss": -12.350467681884766, "global_step": 336750, "epoch": 2004} {"train_loss": -12.531481742858887, "global_step": 336751, "epoch": 2004} {"train_loss": -12.061384201049805, "global_step": 336752, "epoch": 2004} {"train_loss": -12.359648704528809, "global_step": 336753, "epoch": 2004} {"train_loss": -12.63349723815918, "global_step": 336754, "epoch": 2004} {"train_loss": -12.38998794555664, "global_step": 336755, "epoch": 2004} {"train_loss": -12.001190185546875, "global_step": 336756, "epoch": 2004} {"train_loss": -12.192953109741211, "global_step": 336757, "epoch": 2004} {"train_loss": -12.409948348999023, "global_step": 336758, "epoch": 2004} {"train_loss": -12.292176246643066, "global_step": 336759, "epoch": 2004} {"train_loss": -12.315128326416016, "global_step": 336760, "epoch": 2004} {"train_loss": -12.323564529418945, "global_step": 336761, "epoch": 2004} {"train_loss": -12.220324516296387, "global_step": 336762, "epoch": 2004} {"train_loss": -12.530740737915039, "global_step": 336763, "epoch": 2004} {"train_loss": -12.25446891784668, "global_step": 336764, "epoch": 2004} {"train_loss": -12.347442626953125, "global_step": 336765, "epoch": 2004} {"train_loss": -12.642938613891602, "global_step": 336766, "epoch": 2004} {"train_loss": -12.442363739013672, "global_step": 336767, "epoch": 2004} {"train_loss": -12.38532829284668, "global_step": 336768, "epoch": 2004} {"train_loss": -12.561158180236816, "global_step": 336769, "epoch": 2004} {"train_loss": -12.510896682739258, "global_step": 336770, "epoch": 2004} {"train_loss": -12.136367797851562, "global_step": 336771, "epoch": 2004} {"train_loss": -11.927963256835938, "global_step": 336772, "epoch": 2004} {"train_loss": -12.371270179748535, "global_step": 336773, "epoch": 2004} {"train_loss": -12.164787292480469, "global_step": 336774, "epoch": 2004} {"train_loss": -11.84490966796875, "global_step": 336775, "epoch": 2004} {"train_loss": -12.30295181274414, "global_step": 336776, "epoch": 2004} {"train_loss": -12.307576179504395, "global_step": 336777, "epoch": 2004} {"train_loss": -12.445987701416016, "global_step": 336778, "epoch": 2004} {"train_loss": -12.515554428100586, "global_step": 336779, "epoch": 2004} {"train_loss": -12.17779541015625, "global_step": 336780, "epoch": 2004} {"train_loss": -12.387192726135254, "global_step": 336781, "epoch": 2004} {"train_loss": -12.151557922363281, "global_step": 336782, "epoch": 2004} {"train_loss": -12.235112190246582, "global_step": 336783, "epoch": 2004} {"train_loss": -11.789671897888184, "global_step": 336784, "epoch": 2004} {"train_loss": -12.112373352050781, "global_step": 336785, "epoch": 2004} {"train_loss": -11.520597457885742, "global_step": 336786, "epoch": 2004} {"train_loss": -11.041692733764648, "global_step": 336787, "epoch": 2004} {"train_loss": -12.268318176269531, "global_step": 336788, "epoch": 2004} {"train_loss": -11.654922485351562, "global_step": 336789, "epoch": 2004} {"train_loss": -11.779536247253418, "global_step": 336790, "epoch": 2004} {"train_loss": -10.441965103149414, "global_step": 336791, "epoch": 2004} {"train_loss": -11.407796859741211, "global_step": 336792, "epoch": 2004} {"train_loss": -11.668621063232422, "global_step": 336793, "epoch": 2004} {"train_loss": -12.094185829162598, "global_step": 336794, "epoch": 2004} {"train_loss": -11.560850143432617, "global_step": 336795, "epoch": 2004} {"train_loss": -12.313652992248535, "global_step": 336796, "epoch": 2004} {"train_loss": -12.151199340820312, "global_step": 336797, "epoch": 2004} {"train_loss": -12.176472663879395, "global_step": 336798, "epoch": 2004} {"train_loss": -11.963188171386719, "global_step": 336799, "epoch": 2004} {"train_loss": -11.864812850952148, "global_step": 336800, "epoch": 2004} {"train_loss": -12.366515159606934, "global_step": 336801, "epoch": 2004} {"train_loss": -11.96694564819336, "global_step": 336802, "epoch": 2004} {"train_loss": -12.115840911865234, "global_step": 336803, "epoch": 2004} {"train_loss": -12.211801528930664, "global_step": 336804, "epoch": 2004} {"train_loss": -12.246870040893555, "global_step": 336805, "epoch": 2004} {"train_loss": -12.16042709350586, "global_step": 336806, "epoch": 2004} {"train_loss": -12.234447479248047, "global_step": 336807, "epoch": 2004} {"train_loss": -12.194164276123047, "global_step": 336808, "epoch": 2004} {"train_loss": -12.087658882141113, "global_step": 336809, "epoch": 2004} {"train_loss": -12.111265182495117, "global_step": 336810, "epoch": 2004} {"train_loss": -12.26842212677002, "global_step": 336811, "epoch": 2004} {"train_loss": -12.601956367492676, "global_step": 336812, "epoch": 2004} {"train_loss": -12.295634269714355, "global_step": 336813, "epoch": 2004} {"train_loss": -12.25944709777832, "global_step": 336814, "epoch": 2004} {"train_loss": -12.389522552490234, "global_step": 336815, "epoch": 2004} {"train_loss": -11.714239120483398, "global_step": 336816, "epoch": 2004} {"train_loss": -10.64194393157959, "global_step": 336817, "epoch": 2004} {"train_loss": -12.07514762878418, "global_step": 336818, "epoch": 2004} {"train_loss": -12.15951919555664, "global_step": 336819, "epoch": 2004} {"train_loss": -12.261282920837402, "global_step": 336820, "epoch": 2004} {"train_loss": -11.669355392456055, "global_step": 336821, "epoch": 2004} {"train_loss": -12.074197769165039, "global_step": 336822, "epoch": 2004} {"train_loss": -12.124273300170898, "global_step": 336823, "epoch": 2004} {"train_loss": -12.5053129196167, "global_step": 336824, "epoch": 2004} {"train_loss": -11.735760688781738, "global_step": 336825, "epoch": 2004} {"train_loss": -11.968505859375, "global_step": 336826, "epoch": 2004} {"train_loss": -12.203365325927734, "global_step": 336827, "epoch": 2004} {"train_loss": -11.90643310546875, "global_step": 336828, "epoch": 2004} {"train_loss": -11.803372383117676, "global_step": 336829, "epoch": 2004} {"train_loss": -11.924016952514648, "global_step": 336830, "epoch": 2004} {"train_loss": -11.7625732421875, "global_step": 336831, "epoch": 2004} {"train_loss": -12.199310302734375, "global_step": 336832, "epoch": 2004} {"train_loss": -11.601600646972656, "global_step": 336833, "epoch": 2004} {"train_loss": -12.126365661621094, "global_step": 336834, "epoch": 2004} {"train_loss": -11.872058868408203, "global_step": 336835, "epoch": 2004} {"train_loss": -12.039813041687012, "global_step": 336836, "epoch": 2004} {"train_loss": -11.369659423828125, "global_step": 336837, "epoch": 2004} {"train_loss": -12.051281929016113, "global_step": 336838, "epoch": 2004} {"train_loss": -12.012496477081662, "global_step": 336839, "epoch": 2004, "val_loss": 292282.5} {"train_loss": -11.126449584960938, "global_step": 336840, "epoch": 2005} {"train_loss": -11.207067489624023, "global_step": 336841, "epoch": 2005} {"train_loss": -12.006385803222656, "global_step": 336842, "epoch": 2005} {"train_loss": -11.098794937133789, "global_step": 336843, "epoch": 2005} {"train_loss": -10.073396682739258, "global_step": 336844, "epoch": 2005} {"train_loss": -11.470319747924805, "global_step": 336845, "epoch": 2005} {"train_loss": -9.98479175567627, "global_step": 336846, "epoch": 2005} {"train_loss": -9.761531829833984, "global_step": 336847, "epoch": 2005} {"train_loss": -10.330289840698242, "global_step": 336848, "epoch": 2005} {"train_loss": -9.72612190246582, "global_step": 336849, "epoch": 2005} {"train_loss": -8.866090774536133, "global_step": 336850, "epoch": 2005} {"train_loss": -10.552831649780273, "global_step": 336851, "epoch": 2005} {"train_loss": -9.233019828796387, "global_step": 336852, "epoch": 2005} {"train_loss": 5.746070861816406, "global_step": 336853, "epoch": 2005} {"train_loss": -9.860101699829102, "global_step": 336854, "epoch": 2005} {"train_loss": -11.027674674987793, "global_step": 336855, "epoch": 2005} {"train_loss": -9.205011367797852, "global_step": 336856, "epoch": 2005} {"train_loss": -10.113579750061035, "global_step": 336857, "epoch": 2005} {"train_loss": -10.71495246887207, "global_step": 336858, "epoch": 2005} {"train_loss": -10.293291091918945, "global_step": 336859, "epoch": 2005} {"train_loss": -10.922412872314453, "global_step": 336860, "epoch": 2005} {"train_loss": -10.962743759155273, "global_step": 336861, "epoch": 2005} {"train_loss": -10.838709831237793, "global_step": 336862, "epoch": 2005} {"train_loss": -6.639245510101318, "global_step": 336863, "epoch": 2005} {"train_loss": -11.195449829101562, "global_step": 336864, "epoch": 2005} {"train_loss": -10.531432151794434, "global_step": 336865, "epoch": 2005} {"train_loss": -10.445844650268555, "global_step": 336866, "epoch": 2005} {"train_loss": -10.804882049560547, "global_step": 336867, "epoch": 2005} {"train_loss": -11.388521194458008, "global_step": 336868, "epoch": 2005} {"train_loss": -10.94554328918457, "global_step": 336869, "epoch": 2005} {"train_loss": -10.171192169189453, "global_step": 336870, "epoch": 2005} {"train_loss": -11.319815635681152, "global_step": 336871, "epoch": 2005} {"train_loss": -11.166191101074219, "global_step": 336872, "epoch": 2005} {"train_loss": -11.564332008361816, "global_step": 336873, "epoch": 2005} {"train_loss": -11.039690971374512, "global_step": 336874, "epoch": 2005} {"train_loss": -11.226180076599121, "global_step": 336875, "epoch": 2005} {"train_loss": -10.392190933227539, "global_step": 336876, "epoch": 2005} {"train_loss": -11.236540794372559, "global_step": 336877, "epoch": 2005} {"train_loss": -10.965310096740723, "global_step": 336878, "epoch": 2005} {"train_loss": -11.530570030212402, "global_step": 336879, "epoch": 2005} {"train_loss": -11.137317657470703, "global_step": 336880, "epoch": 2005} {"train_loss": -11.550382614135742, "global_step": 336881, "epoch": 2005} {"train_loss": -10.978532791137695, "global_step": 336882, "epoch": 2005} {"train_loss": -11.752893447875977, "global_step": 336883, "epoch": 2005} {"train_loss": -11.426136016845703, "global_step": 336884, "epoch": 2005} {"train_loss": -11.192741394042969, "global_step": 336885, "epoch": 2005} {"train_loss": -11.830720901489258, "global_step": 336886, "epoch": 2005} {"train_loss": -11.591047286987305, "global_step": 336887, "epoch": 2005} {"train_loss": -11.734723091125488, "global_step": 336888, "epoch": 2005} {"train_loss": -11.848100662231445, "global_step": 336889, "epoch": 2005} {"train_loss": -11.526646614074707, "global_step": 336890, "epoch": 2005} {"train_loss": -11.66104793548584, "global_step": 336891, "epoch": 2005} {"train_loss": -11.707798957824707, "global_step": 336892, "epoch": 2005} {"train_loss": -11.38551139831543, "global_step": 336893, "epoch": 2005} {"train_loss": -11.849583625793457, "global_step": 336894, "epoch": 2005} {"train_loss": -11.647132873535156, "global_step": 336895, "epoch": 2005} {"train_loss": -11.749855041503906, "global_step": 336896, "epoch": 2005} {"train_loss": -11.61251163482666, "global_step": 336897, "epoch": 2005} {"train_loss": -11.648996353149414, "global_step": 336898, "epoch": 2005} {"train_loss": -11.665210723876953, "global_step": 336899, "epoch": 2005} {"train_loss": -11.945783615112305, "global_step": 336900, "epoch": 2005} {"train_loss": -11.83907699584961, "global_step": 336901, "epoch": 2005} {"train_loss": -11.92068099975586, "global_step": 336902, "epoch": 2005} {"train_loss": -11.841225624084473, "global_step": 336903, "epoch": 2005} {"train_loss": -11.095205307006836, "global_step": 336904, "epoch": 2005} {"train_loss": -11.982195854187012, "global_step": 336905, "epoch": 2005} {"train_loss": -11.926687240600586, "global_step": 336906, "epoch": 2005} {"train_loss": -11.762924194335938, "global_step": 336907, "epoch": 2005} {"train_loss": -12.040067672729492, "global_step": 336908, "epoch": 2005} {"train_loss": -11.260290145874023, "global_step": 336909, "epoch": 2005} {"train_loss": -11.85654067993164, "global_step": 336910, "epoch": 2005} {"train_loss": -11.743300437927246, "global_step": 336911, "epoch": 2005} {"train_loss": -11.985864639282227, "global_step": 336912, "epoch": 2005} {"train_loss": -11.963571548461914, "global_step": 336913, "epoch": 2005} {"train_loss": -11.849209785461426, "global_step": 336914, "epoch": 2005} {"train_loss": -12.149311065673828, "global_step": 336915, "epoch": 2005} {"train_loss": -12.23745346069336, "global_step": 336916, "epoch": 2005} {"train_loss": -11.932498931884766, "global_step": 336917, "epoch": 2005} {"train_loss": -12.390186309814453, "global_step": 336918, "epoch": 2005} {"train_loss": -12.134866714477539, "global_step": 336919, "epoch": 2005} {"train_loss": -12.391593933105469, "global_step": 336920, "epoch": 2005} {"train_loss": -12.208375930786133, "global_step": 336921, "epoch": 2005} {"train_loss": -12.175556182861328, "global_step": 336922, "epoch": 2005} {"train_loss": -11.990707397460938, "global_step": 336923, "epoch": 2005} {"train_loss": -12.136795043945312, "global_step": 336924, "epoch": 2005} {"train_loss": -12.170038223266602, "global_step": 336925, "epoch": 2005} {"train_loss": -12.083413124084473, "global_step": 336926, "epoch": 2005} {"train_loss": -12.004364013671875, "global_step": 336927, "epoch": 2005} {"train_loss": -12.179402351379395, "global_step": 336928, "epoch": 2005} {"train_loss": -11.90397834777832, "global_step": 336929, "epoch": 2005} {"train_loss": -12.26939868927002, "global_step": 336930, "epoch": 2005} {"train_loss": -12.24577808380127, "global_step": 336931, "epoch": 2005} {"train_loss": -12.139327049255371, "global_step": 336932, "epoch": 2005} {"train_loss": -12.163372039794922, "global_step": 336933, "epoch": 2005} {"train_loss": -12.198858261108398, "global_step": 336934, "epoch": 2005} {"train_loss": -12.389163970947266, "global_step": 336935, "epoch": 2005} {"train_loss": -12.255270004272461, "global_step": 336936, "epoch": 2005} {"train_loss": -12.41950798034668, "global_step": 336937, "epoch": 2005} {"train_loss": -12.404512405395508, "global_step": 336938, "epoch": 2005} {"train_loss": -12.444009780883789, "global_step": 336939, "epoch": 2005} {"train_loss": -12.024507522583008, "global_step": 336940, "epoch": 2005} {"train_loss": -12.453393936157227, "global_step": 336941, "epoch": 2005} {"train_loss": -12.19833755493164, "global_step": 336942, "epoch": 2005} {"train_loss": -12.23228645324707, "global_step": 336943, "epoch": 2005} {"train_loss": -12.500170707702637, "global_step": 336944, "epoch": 2005} {"train_loss": -12.308961868286133, "global_step": 336945, "epoch": 2005} {"train_loss": -12.522058486938477, "global_step": 336946, "epoch": 2005} {"train_loss": -11.972152709960938, "global_step": 336947, "epoch": 2005} {"train_loss": -12.341036796569824, "global_step": 336948, "epoch": 2005} {"train_loss": -12.288532257080078, "global_step": 336949, "epoch": 2005} {"train_loss": -12.336008071899414, "global_step": 336950, "epoch": 2005} {"train_loss": -12.152719497680664, "global_step": 336951, "epoch": 2005} {"train_loss": -12.336858749389648, "global_step": 336952, "epoch": 2005} {"train_loss": -12.309452056884766, "global_step": 336953, "epoch": 2005} {"train_loss": -12.261186599731445, "global_step": 336954, "epoch": 2005} {"train_loss": -12.197196960449219, "global_step": 336955, "epoch": 2005} {"train_loss": -12.332962989807129, "global_step": 336956, "epoch": 2005} {"train_loss": -12.259712219238281, "global_step": 336957, "epoch": 2005} {"train_loss": -12.553862571716309, "global_step": 336958, "epoch": 2005} {"train_loss": -12.516963005065918, "global_step": 336959, "epoch": 2005} {"train_loss": -12.068954467773438, "global_step": 336960, "epoch": 2005} {"train_loss": -12.091976165771484, "global_step": 336961, "epoch": 2005} {"train_loss": -12.266573905944824, "global_step": 336962, "epoch": 2005} {"train_loss": -11.92652702331543, "global_step": 336963, "epoch": 2005} {"train_loss": -11.520135879516602, "global_step": 336964, "epoch": 2005} {"train_loss": -12.424827575683594, "global_step": 336965, "epoch": 2005} {"train_loss": -12.274867057800293, "global_step": 336966, "epoch": 2005} {"train_loss": -12.446261405944824, "global_step": 336967, "epoch": 2005} {"train_loss": -12.24798583984375, "global_step": 336968, "epoch": 2005} {"train_loss": -12.240614891052246, "global_step": 336969, "epoch": 2005} {"train_loss": -12.374610900878906, "global_step": 336970, "epoch": 2005} {"train_loss": -12.127645492553711, "global_step": 336971, "epoch": 2005} {"train_loss": -11.920221328735352, "global_step": 336972, "epoch": 2005} {"train_loss": -11.918889045715332, "global_step": 336973, "epoch": 2005} {"train_loss": -12.133710861206055, "global_step": 336974, "epoch": 2005} {"train_loss": -12.439659118652344, "global_step": 336975, "epoch": 2005} {"train_loss": -12.353466987609863, "global_step": 336976, "epoch": 2005} {"train_loss": -12.494503021240234, "global_step": 336977, "epoch": 2005} {"train_loss": -12.35085391998291, "global_step": 336978, "epoch": 2005} {"train_loss": -12.08055305480957, "global_step": 336979, "epoch": 2005} {"train_loss": -12.008605003356934, "global_step": 336980, "epoch": 2005} {"train_loss": -11.99884033203125, "global_step": 336981, "epoch": 2005} {"train_loss": -11.839132308959961, "global_step": 336982, "epoch": 2005} {"train_loss": -10.730626106262207, "global_step": 336983, "epoch": 2005} {"train_loss": -12.272704124450684, "global_step": 336984, "epoch": 2005} {"train_loss": -11.028349876403809, "global_step": 336985, "epoch": 2005} {"train_loss": -11.290374755859375, "global_step": 336986, "epoch": 2005} {"train_loss": -12.058643341064453, "global_step": 336987, "epoch": 2005} {"train_loss": -11.254426002502441, "global_step": 336988, "epoch": 2005} {"train_loss": -10.594013214111328, "global_step": 336989, "epoch": 2005} {"train_loss": -11.979869842529297, "global_step": 336990, "epoch": 2005} {"train_loss": -10.909626007080078, "global_step": 336991, "epoch": 2005} {"train_loss": -11.050348281860352, "global_step": 336992, "epoch": 2005} {"train_loss": -11.961692810058594, "global_step": 336993, "epoch": 2005} {"train_loss": -11.232906341552734, "global_step": 336994, "epoch": 2005} {"train_loss": -10.824481964111328, "global_step": 336995, "epoch": 2005} {"train_loss": -11.78718376159668, "global_step": 336996, "epoch": 2005} {"train_loss": -10.850915908813477, "global_step": 336997, "epoch": 2005} {"train_loss": -11.688091278076172, "global_step": 336998, "epoch": 2005} {"train_loss": -11.906932830810547, "global_step": 336999, "epoch": 2005} {"train_loss": -11.549215316772461, "global_step": 337000, "epoch": 2005} {"train_loss": -11.671767234802246, "global_step": 337001, "epoch": 2005} {"train_loss": -11.884500503540039, "global_step": 337002, "epoch": 2005} {"train_loss": -11.060422897338867, "global_step": 337003, "epoch": 2005} {"train_loss": -12.274269104003906, "global_step": 337004, "epoch": 2005} {"train_loss": -11.771322250366211, "global_step": 337005, "epoch": 2005} {"train_loss": -12.175621032714844, "global_step": 337006, "epoch": 2005} {"train_loss": -11.506086375032153, "global_step": 337007, "epoch": 2005, "val_loss": 292254.28125, "train_action_mse_error": 1.383164405822754} {"train_loss": -12.004411697387695, "global_step": 337008, "epoch": 2006} {"train_loss": -12.141605377197266, "global_step": 337009, "epoch": 2006} {"train_loss": -12.045143127441406, "global_step": 337010, "epoch": 2006} {"train_loss": -12.264331817626953, "global_step": 337011, "epoch": 2006} {"train_loss": -11.807798385620117, "global_step": 337012, "epoch": 2006} {"train_loss": -12.409481048583984, "global_step": 337013, "epoch": 2006} {"train_loss": -12.039199829101562, "global_step": 337014, "epoch": 2006} {"train_loss": -12.304300308227539, "global_step": 337015, "epoch": 2006} {"train_loss": -12.364408493041992, "global_step": 337016, "epoch": 2006} {"train_loss": -12.206867218017578, "global_step": 337017, "epoch": 2006} {"train_loss": -12.230688095092773, "global_step": 337018, "epoch": 2006} {"train_loss": -12.331756591796875, "global_step": 337019, "epoch": 2006} {"train_loss": -12.134519577026367, "global_step": 337020, "epoch": 2006} {"train_loss": -12.226606369018555, "global_step": 337021, "epoch": 2006} {"train_loss": -12.045158386230469, "global_step": 337022, "epoch": 2006} {"train_loss": -12.159638404846191, "global_step": 337023, "epoch": 2006} {"train_loss": -12.118101119995117, "global_step": 337024, "epoch": 2006} {"train_loss": -11.998961448669434, "global_step": 337025, "epoch": 2006} {"train_loss": -11.497529029846191, "global_step": 337026, "epoch": 2006} {"train_loss": -12.139871597290039, "global_step": 337027, "epoch": 2006} {"train_loss": -10.867037773132324, "global_step": 337028, "epoch": 2006} {"train_loss": -12.23736572265625, "global_step": 337029, "epoch": 2006} {"train_loss": -11.500274658203125, "global_step": 337030, "epoch": 2006} {"train_loss": -11.66546630859375, "global_step": 337031, "epoch": 2006} {"train_loss": -11.396595001220703, "global_step": 337032, "epoch": 2006} {"train_loss": -11.2821683883667, "global_step": 337033, "epoch": 2006} {"train_loss": -12.257518768310547, "global_step": 337034, "epoch": 2006} {"train_loss": -11.80510425567627, "global_step": 337035, "epoch": 2006} {"train_loss": -12.191932678222656, "global_step": 337036, "epoch": 2006} {"train_loss": -11.372900009155273, "global_step": 337037, "epoch": 2006} {"train_loss": -11.647797584533691, "global_step": 337038, "epoch": 2006} {"train_loss": -11.886443138122559, "global_step": 337039, "epoch": 2006} {"train_loss": -11.958861351013184, "global_step": 337040, "epoch": 2006} {"train_loss": -11.611066818237305, "global_step": 337041, "epoch": 2006} {"train_loss": -11.80199146270752, "global_step": 337042, "epoch": 2006} {"train_loss": -11.828786849975586, "global_step": 337043, "epoch": 2006} {"train_loss": -10.800788879394531, "global_step": 337044, "epoch": 2006} {"train_loss": -11.932907104492188, "global_step": 337045, "epoch": 2006} {"train_loss": -11.53357982635498, "global_step": 337046, "epoch": 2006} {"train_loss": -11.965743064880371, "global_step": 337047, "epoch": 2006} {"train_loss": -11.89544677734375, "global_step": 337048, "epoch": 2006} {"train_loss": -12.079492568969727, "global_step": 337049, "epoch": 2006} {"train_loss": -11.917448043823242, "global_step": 337050, "epoch": 2006} {"train_loss": -12.256704330444336, "global_step": 337051, "epoch": 2006} {"train_loss": -12.010289192199707, "global_step": 337052, "epoch": 2006} {"train_loss": -12.052678108215332, "global_step": 337053, "epoch": 2006} {"train_loss": -11.860794067382812, "global_step": 337054, "epoch": 2006} {"train_loss": -12.456844329833984, "global_step": 337055, "epoch": 2006} {"train_loss": -11.882574081420898, "global_step": 337056, "epoch": 2006} {"train_loss": -12.510600090026855, "global_step": 337057, "epoch": 2006} {"train_loss": -12.211799621582031, "global_step": 337058, "epoch": 2006} {"train_loss": -12.398423194885254, "global_step": 337059, "epoch": 2006} {"train_loss": -12.227911949157715, "global_step": 337060, "epoch": 2006} {"train_loss": -12.253631591796875, "global_step": 337061, "epoch": 2006} {"train_loss": -12.277883529663086, "global_step": 337062, "epoch": 2006} {"train_loss": -12.273880004882812, "global_step": 337063, "epoch": 2006} {"train_loss": -12.381551742553711, "global_step": 337064, "epoch": 2006} {"train_loss": -12.599081039428711, "global_step": 337065, "epoch": 2006} {"train_loss": -12.446392059326172, "global_step": 337066, "epoch": 2006} {"train_loss": -12.401851654052734, "global_step": 337067, "epoch": 2006} {"train_loss": -12.46593189239502, "global_step": 337068, "epoch": 2006} {"train_loss": -12.544454574584961, "global_step": 337069, "epoch": 2006} {"train_loss": -12.390697479248047, "global_step": 337070, "epoch": 2006} {"train_loss": -12.088205337524414, "global_step": 337071, "epoch": 2006} {"train_loss": -11.990184783935547, "global_step": 337072, "epoch": 2006} {"train_loss": -12.442743301391602, "global_step": 337073, "epoch": 2006} {"train_loss": -11.460654258728027, "global_step": 337074, "epoch": 2006} {"train_loss": -12.0462646484375, "global_step": 337075, "epoch": 2006} {"train_loss": -12.135441780090332, "global_step": 337076, "epoch": 2006} {"train_loss": -11.764110565185547, "global_step": 337077, "epoch": 2006} {"train_loss": -12.1612548828125, "global_step": 337078, "epoch": 2006} {"train_loss": -11.861488342285156, "global_step": 337079, "epoch": 2006} {"train_loss": -11.748297691345215, "global_step": 337080, "epoch": 2006} {"train_loss": -11.87363052368164, "global_step": 337081, "epoch": 2006} {"train_loss": -11.826251983642578, "global_step": 337082, "epoch": 2006} {"train_loss": -11.914522171020508, "global_step": 337083, "epoch": 2006} {"train_loss": -11.905033111572266, "global_step": 337084, "epoch": 2006} {"train_loss": -11.987958908081055, "global_step": 337085, "epoch": 2006} {"train_loss": -11.95738410949707, "global_step": 337086, "epoch": 2006} {"train_loss": -11.985454559326172, "global_step": 337087, "epoch": 2006} {"train_loss": -11.457955360412598, "global_step": 337088, "epoch": 2006} {"train_loss": -11.794865608215332, "global_step": 337089, "epoch": 2006} {"train_loss": -11.993659973144531, "global_step": 337090, "epoch": 2006} {"train_loss": -11.910516738891602, "global_step": 337091, "epoch": 2006} {"train_loss": -12.268882751464844, "global_step": 337092, "epoch": 2006} {"train_loss": -12.405294418334961, "global_step": 337093, "epoch": 2006} {"train_loss": -11.664501190185547, "global_step": 337094, "epoch": 2006} {"train_loss": -12.19886589050293, "global_step": 337095, "epoch": 2006} {"train_loss": -11.655391693115234, "global_step": 337096, "epoch": 2006} {"train_loss": -12.107868194580078, "global_step": 337097, "epoch": 2006} {"train_loss": -11.829842567443848, "global_step": 337098, "epoch": 2006} {"train_loss": -11.885041236877441, "global_step": 337099, "epoch": 2006} {"train_loss": -11.97518539428711, "global_step": 337100, "epoch": 2006} {"train_loss": -12.04281234741211, "global_step": 337101, "epoch": 2006} {"train_loss": -12.136591911315918, "global_step": 337102, "epoch": 2006} {"train_loss": -12.086128234863281, "global_step": 337103, "epoch": 2006} {"train_loss": -12.093265533447266, "global_step": 337104, "epoch": 2006} {"train_loss": -11.989801406860352, "global_step": 337105, "epoch": 2006} {"train_loss": -12.322611808776855, "global_step": 337106, "epoch": 2006} {"train_loss": -11.97597885131836, "global_step": 337107, "epoch": 2006} {"train_loss": -12.200170516967773, "global_step": 337108, "epoch": 2006} {"train_loss": -12.115732192993164, "global_step": 337109, "epoch": 2006} {"train_loss": -12.27389144897461, "global_step": 337110, "epoch": 2006} {"train_loss": -11.803479194641113, "global_step": 337111, "epoch": 2006} {"train_loss": -12.456340789794922, "global_step": 337112, "epoch": 2006} {"train_loss": -11.564244270324707, "global_step": 337113, "epoch": 2006} {"train_loss": -11.989842414855957, "global_step": 337114, "epoch": 2006} {"train_loss": -11.624013900756836, "global_step": 337115, "epoch": 2006} {"train_loss": -11.080913543701172, "global_step": 337116, "epoch": 2006} {"train_loss": -11.069503784179688, "global_step": 337117, "epoch": 2006} {"train_loss": -10.826580047607422, "global_step": 337118, "epoch": 2006} {"train_loss": -10.992870330810547, "global_step": 337119, "epoch": 2006} {"train_loss": -11.54931926727295, "global_step": 337120, "epoch": 2006} {"train_loss": -10.938963890075684, "global_step": 337121, "epoch": 2006} {"train_loss": -11.646209716796875, "global_step": 337122, "epoch": 2006} {"train_loss": -10.401710510253906, "global_step": 337123, "epoch": 2006} {"train_loss": -11.594429969787598, "global_step": 337124, "epoch": 2006} {"train_loss": -10.2554349899292, "global_step": 337125, "epoch": 2006} {"train_loss": -11.901196479797363, "global_step": 337126, "epoch": 2006} {"train_loss": -11.139017105102539, "global_step": 337127, "epoch": 2006} {"train_loss": -10.918066024780273, "global_step": 337128, "epoch": 2006} {"train_loss": -11.2877197265625, "global_step": 337129, "epoch": 2006} {"train_loss": -10.665390014648438, "global_step": 337130, "epoch": 2006} {"train_loss": -11.790410041809082, "global_step": 337131, "epoch": 2006} {"train_loss": -10.65529727935791, "global_step": 337132, "epoch": 2006} {"train_loss": -11.13711166381836, "global_step": 337133, "epoch": 2006} {"train_loss": -11.271657943725586, "global_step": 337134, "epoch": 2006} {"train_loss": -11.012466430664062, "global_step": 337135, "epoch": 2006} {"train_loss": -11.600959777832031, "global_step": 337136, "epoch": 2006} {"train_loss": -11.373312950134277, "global_step": 337137, "epoch": 2006} {"train_loss": -11.24573802947998, "global_step": 337138, "epoch": 2006} {"train_loss": -11.806286811828613, "global_step": 337139, "epoch": 2006} {"train_loss": -11.495600700378418, "global_step": 337140, "epoch": 2006} {"train_loss": -11.421539306640625, "global_step": 337141, "epoch": 2006} {"train_loss": -12.019752502441406, "global_step": 337142, "epoch": 2006} {"train_loss": -11.668844223022461, "global_step": 337143, "epoch": 2006} {"train_loss": -12.002939224243164, "global_step": 337144, "epoch": 2006} {"train_loss": -11.947707176208496, "global_step": 337145, "epoch": 2006} {"train_loss": -11.596386909484863, "global_step": 337146, "epoch": 2006} {"train_loss": -11.502360343933105, "global_step": 337147, "epoch": 2006} {"train_loss": -11.575132369995117, "global_step": 337148, "epoch": 2006} {"train_loss": -11.954107284545898, "global_step": 337149, "epoch": 2006} {"train_loss": -11.43515682220459, "global_step": 337150, "epoch": 2006} {"train_loss": -12.051702499389648, "global_step": 337151, "epoch": 2006} {"train_loss": -11.659465789794922, "global_step": 337152, "epoch": 2006} {"train_loss": -11.593900680541992, "global_step": 337153, "epoch": 2006} {"train_loss": -12.057296752929688, "global_step": 337154, "epoch": 2006} {"train_loss": -11.154455184936523, "global_step": 337155, "epoch": 2006} {"train_loss": -12.049700736999512, "global_step": 337156, "epoch": 2006} {"train_loss": -11.121925354003906, "global_step": 337157, "epoch": 2006} {"train_loss": -11.423219680786133, "global_step": 337158, "epoch": 2006} {"train_loss": -11.424294471740723, "global_step": 337159, "epoch": 2006} {"train_loss": -11.162322998046875, "global_step": 337160, "epoch": 2006} {"train_loss": -11.677633285522461, "global_step": 337161, "epoch": 2006} {"train_loss": -11.871481895446777, "global_step": 337162, "epoch": 2006} {"train_loss": -12.145201683044434, "global_step": 337163, "epoch": 2006} {"train_loss": -11.951759338378906, "global_step": 337164, "epoch": 2006} {"train_loss": -12.135108947753906, "global_step": 337165, "epoch": 2006} {"train_loss": -12.205384254455566, "global_step": 337166, "epoch": 2006} {"train_loss": -12.374476432800293, "global_step": 337167, "epoch": 2006} {"train_loss": -12.44158935546875, "global_step": 337168, "epoch": 2006} {"train_loss": -12.11091136932373, "global_step": 337169, "epoch": 2006} {"train_loss": -12.351155281066895, "global_step": 337170, "epoch": 2006} {"train_loss": -12.208709716796875, "global_step": 337171, "epoch": 2006} {"train_loss": -12.020895004272461, "global_step": 337172, "epoch": 2006} {"train_loss": -11.977668762207031, "global_step": 337173, "epoch": 2006} {"train_loss": -12.294977188110352, "global_step": 337174, "epoch": 2006} {"train_loss": -11.851059414091564, "global_step": 337175, "epoch": 2006, "val_loss": 289800.09375} {"train_loss": -12.300403594970703, "global_step": 337176, "epoch": 2007} {"train_loss": -12.375978469848633, "global_step": 337177, "epoch": 2007} {"train_loss": -12.347805976867676, "global_step": 337178, "epoch": 2007} {"train_loss": -12.319612503051758, "global_step": 337179, "epoch": 2007} {"train_loss": -12.353277206420898, "global_step": 337180, "epoch": 2007} {"train_loss": -12.238113403320312, "global_step": 337181, "epoch": 2007} {"train_loss": -12.422647476196289, "global_step": 337182, "epoch": 2007} {"train_loss": -12.35623836517334, "global_step": 337183, "epoch": 2007} {"train_loss": -12.416236877441406, "global_step": 337184, "epoch": 2007} {"train_loss": -12.20287036895752, "global_step": 337185, "epoch": 2007} {"train_loss": -12.411346435546875, "global_step": 337186, "epoch": 2007} {"train_loss": -12.332878112792969, "global_step": 337187, "epoch": 2007} {"train_loss": -12.473965644836426, "global_step": 337188, "epoch": 2007} {"train_loss": -12.321075439453125, "global_step": 337189, "epoch": 2007} {"train_loss": -12.092365264892578, "global_step": 337190, "epoch": 2007} {"train_loss": -12.383177757263184, "global_step": 337191, "epoch": 2007} {"train_loss": -12.481979370117188, "global_step": 337192, "epoch": 2007} {"train_loss": -12.327386856079102, "global_step": 337193, "epoch": 2007} {"train_loss": -12.408378601074219, "global_step": 337194, "epoch": 2007} {"train_loss": -12.266797065734863, "global_step": 337195, "epoch": 2007} {"train_loss": -12.312102317810059, "global_step": 337196, "epoch": 2007} {"train_loss": -12.296249389648438, "global_step": 337197, "epoch": 2007} {"train_loss": -12.13554573059082, "global_step": 337198, "epoch": 2007} {"train_loss": -12.211071014404297, "global_step": 337199, "epoch": 2007} {"train_loss": -12.492297172546387, "global_step": 337200, "epoch": 2007} {"train_loss": -12.156530380249023, "global_step": 337201, "epoch": 2007} {"train_loss": -12.489200592041016, "global_step": 337202, "epoch": 2007} {"train_loss": -12.433246612548828, "global_step": 337203, "epoch": 2007} {"train_loss": -11.800444602966309, "global_step": 337204, "epoch": 2007} {"train_loss": -12.084372520446777, "global_step": 337205, "epoch": 2007} {"train_loss": -12.304841995239258, "global_step": 337206, "epoch": 2007} {"train_loss": -11.644689559936523, "global_step": 337207, "epoch": 2007} {"train_loss": -11.798219680786133, "global_step": 337208, "epoch": 2007} {"train_loss": -12.3899507522583, "global_step": 337209, "epoch": 2007} {"train_loss": -12.172889709472656, "global_step": 337210, "epoch": 2007} {"train_loss": -12.398056030273438, "global_step": 337211, "epoch": 2007} {"train_loss": -12.497493743896484, "global_step": 337212, "epoch": 2007} {"train_loss": -12.54952335357666, "global_step": 337213, "epoch": 2007} {"train_loss": -12.69775390625, "global_step": 337214, "epoch": 2007} {"train_loss": -12.475177764892578, "global_step": 337215, "epoch": 2007} {"train_loss": -12.450764656066895, "global_step": 337216, "epoch": 2007} {"train_loss": -12.575220108032227, "global_step": 337217, "epoch": 2007} {"train_loss": -12.44259262084961, "global_step": 337218, "epoch": 2007} {"train_loss": -12.583110809326172, "global_step": 337219, "epoch": 2007} {"train_loss": -12.433921813964844, "global_step": 337220, "epoch": 2007} {"train_loss": -12.4723539352417, "global_step": 337221, "epoch": 2007} {"train_loss": -12.721345901489258, "global_step": 337222, "epoch": 2007} {"train_loss": -12.803807258605957, "global_step": 337223, "epoch": 2007} {"train_loss": -12.562665939331055, "global_step": 337224, "epoch": 2007} {"train_loss": -12.570281982421875, "global_step": 337225, "epoch": 2007} {"train_loss": -12.564445495605469, "global_step": 337226, "epoch": 2007} {"train_loss": -12.66615104675293, "global_step": 337227, "epoch": 2007} {"train_loss": -12.616714477539062, "global_step": 337228, "epoch": 2007} {"train_loss": -12.538094520568848, "global_step": 337229, "epoch": 2007} {"train_loss": -12.396583557128906, "global_step": 337230, "epoch": 2007} {"train_loss": -12.394878387451172, "global_step": 337231, "epoch": 2007} {"train_loss": -12.631458282470703, "global_step": 337232, "epoch": 2007} {"train_loss": -12.600761413574219, "global_step": 337233, "epoch": 2007} {"train_loss": -12.426509857177734, "global_step": 337234, "epoch": 2007} {"train_loss": -12.424051284790039, "global_step": 337235, "epoch": 2007} {"train_loss": -12.466120719909668, "global_step": 337236, "epoch": 2007} {"train_loss": -12.419301986694336, "global_step": 337237, "epoch": 2007} {"train_loss": -12.63359260559082, "global_step": 337238, "epoch": 2007} {"train_loss": -12.542902946472168, "global_step": 337239, "epoch": 2007} {"train_loss": -12.798086166381836, "global_step": 337240, "epoch": 2007} {"train_loss": -12.612956047058105, "global_step": 337241, "epoch": 2007} {"train_loss": -12.17375659942627, "global_step": 337242, "epoch": 2007} {"train_loss": -12.03946304321289, "global_step": 337243, "epoch": 2007} {"train_loss": -11.704183578491211, "global_step": 337244, "epoch": 2007} {"train_loss": -12.065130233764648, "global_step": 337245, "epoch": 2007} {"train_loss": -12.268343925476074, "global_step": 337246, "epoch": 2007} {"train_loss": -12.225345611572266, "global_step": 337247, "epoch": 2007} {"train_loss": -11.052541732788086, "global_step": 337248, "epoch": 2007} {"train_loss": -11.015085220336914, "global_step": 337249, "epoch": 2007} {"train_loss": -12.348185539245605, "global_step": 337250, "epoch": 2007} {"train_loss": -12.208564758300781, "global_step": 337251, "epoch": 2007} {"train_loss": -11.888465881347656, "global_step": 337252, "epoch": 2007} {"train_loss": -11.527642250061035, "global_step": 337253, "epoch": 2007} {"train_loss": -11.062238693237305, "global_step": 337254, "epoch": 2007} {"train_loss": -11.101663589477539, "global_step": 337255, "epoch": 2007} {"train_loss": -11.509004592895508, "global_step": 337256, "epoch": 2007} {"train_loss": -12.462862014770508, "global_step": 337257, "epoch": 2007} {"train_loss": -11.506603240966797, "global_step": 337258, "epoch": 2007} {"train_loss": -11.14229965209961, "global_step": 337259, "epoch": 2007} {"train_loss": -9.741219520568848, "global_step": 337260, "epoch": 2007} {"train_loss": -11.023431777954102, "global_step": 337261, "epoch": 2007} {"train_loss": -9.14553451538086, "global_step": 337262, "epoch": 2007} {"train_loss": -10.886116027832031, "global_step": 337263, "epoch": 2007} {"train_loss": -9.31335735321045, "global_step": 337264, "epoch": 2007} {"train_loss": -9.495107650756836, "global_step": 337265, "epoch": 2007} {"train_loss": -10.0465669631958, "global_step": 337266, "epoch": 2007} {"train_loss": -8.74819278717041, "global_step": 337267, "epoch": 2007} {"train_loss": -7.534972190856934, "global_step": 337268, "epoch": 2007} {"train_loss": -7.852480411529541, "global_step": 337269, "epoch": 2007} {"train_loss": -7.718005180358887, "global_step": 337270, "epoch": 2007} {"train_loss": -7.785977363586426, "global_step": 337271, "epoch": 2007} {"train_loss": -8.286516189575195, "global_step": 337272, "epoch": 2007} {"train_loss": -9.189538955688477, "global_step": 337273, "epoch": 2007} {"train_loss": -8.736799240112305, "global_step": 337274, "epoch": 2007} {"train_loss": -8.813857078552246, "global_step": 337275, "epoch": 2007} {"train_loss": -9.572964668273926, "global_step": 337276, "epoch": 2007} {"train_loss": -10.292003631591797, "global_step": 337277, "epoch": 2007} {"train_loss": -9.768715858459473, "global_step": 337278, "epoch": 2007} {"train_loss": -10.892538070678711, "global_step": 337279, "epoch": 2007} {"train_loss": -9.359586715698242, "global_step": 337280, "epoch": 2007} {"train_loss": -10.160480499267578, "global_step": 337281, "epoch": 2007} {"train_loss": -10.36068058013916, "global_step": 337282, "epoch": 2007} {"train_loss": -9.75417423248291, "global_step": 337283, "epoch": 2007} {"train_loss": -10.31277847290039, "global_step": 337284, "epoch": 2007} {"train_loss": -10.082178115844727, "global_step": 337285, "epoch": 2007} {"train_loss": -9.835711479187012, "global_step": 337286, "epoch": 2007} {"train_loss": -9.00295639038086, "global_step": 337287, "epoch": 2007} {"train_loss": -9.949100494384766, "global_step": 337288, "epoch": 2007} {"train_loss": -10.86020278930664, "global_step": 337289, "epoch": 2007} {"train_loss": -9.151697158813477, "global_step": 337290, "epoch": 2007} {"train_loss": -8.968171119689941, "global_step": 337291, "epoch": 2007} {"train_loss": -10.73292350769043, "global_step": 337292, "epoch": 2007} {"train_loss": -10.187158584594727, "global_step": 337293, "epoch": 2007} {"train_loss": -9.225601196289062, "global_step": 337294, "epoch": 2007} {"train_loss": -9.570674896240234, "global_step": 337295, "epoch": 2007} {"train_loss": -9.586433410644531, "global_step": 337296, "epoch": 2007} {"train_loss": -10.163785934448242, "global_step": 337297, "epoch": 2007} {"train_loss": -9.65140151977539, "global_step": 337298, "epoch": 2007} {"train_loss": -10.933849334716797, "global_step": 337299, "epoch": 2007} {"train_loss": -10.777250289916992, "global_step": 337300, "epoch": 2007} {"train_loss": -10.19710636138916, "global_step": 337301, "epoch": 2007} {"train_loss": -11.174945831298828, "global_step": 337302, "epoch": 2007} {"train_loss": -11.438448905944824, "global_step": 337303, "epoch": 2007} {"train_loss": -10.729887962341309, "global_step": 337304, "epoch": 2007} {"train_loss": -11.616474151611328, "global_step": 337305, "epoch": 2007} {"train_loss": -11.787030220031738, "global_step": 337306, "epoch": 2007} {"train_loss": -10.806650161743164, "global_step": 337307, "epoch": 2007} {"train_loss": -11.437908172607422, "global_step": 337308, "epoch": 2007} {"train_loss": -11.70014762878418, "global_step": 337309, "epoch": 2007} {"train_loss": -11.6712646484375, "global_step": 337310, "epoch": 2007} {"train_loss": -11.783454895019531, "global_step": 337311, "epoch": 2007} {"train_loss": -11.587868690490723, "global_step": 337312, "epoch": 2007} {"train_loss": -11.55877685546875, "global_step": 337313, "epoch": 2007} {"train_loss": -11.713394165039062, "global_step": 337314, "epoch": 2007} {"train_loss": -11.556305885314941, "global_step": 337315, "epoch": 2007} {"train_loss": -11.458614349365234, "global_step": 337316, "epoch": 2007} {"train_loss": -11.805330276489258, "global_step": 337317, "epoch": 2007} {"train_loss": -11.58102798461914, "global_step": 337318, "epoch": 2007} {"train_loss": -11.598278999328613, "global_step": 337319, "epoch": 2007} {"train_loss": -11.801067352294922, "global_step": 337320, "epoch": 2007} {"train_loss": -11.713323593139648, "global_step": 337321, "epoch": 2007} {"train_loss": -11.676944732666016, "global_step": 337322, "epoch": 2007} {"train_loss": -11.835391998291016, "global_step": 337323, "epoch": 2007} {"train_loss": -11.78302001953125, "global_step": 337324, "epoch": 2007} {"train_loss": -11.887893676757812, "global_step": 337325, "epoch": 2007} {"train_loss": -11.652597427368164, "global_step": 337326, "epoch": 2007} {"train_loss": -11.30414867401123, "global_step": 337327, "epoch": 2007} {"train_loss": -11.9248046875, "global_step": 337328, "epoch": 2007} {"train_loss": -11.867276191711426, "global_step": 337329, "epoch": 2007} {"train_loss": -11.478126525878906, "global_step": 337330, "epoch": 2007} {"train_loss": -11.791010856628418, "global_step": 337331, "epoch": 2007} {"train_loss": -11.874412536621094, "global_step": 337332, "epoch": 2007} {"train_loss": -11.616925239562988, "global_step": 337333, "epoch": 2007} {"train_loss": -12.105266571044922, "global_step": 337334, "epoch": 2007} {"train_loss": -11.554558753967285, "global_step": 337335, "epoch": 2007} {"train_loss": -12.119945526123047, "global_step": 337336, "epoch": 2007} {"train_loss": -11.830161094665527, "global_step": 337337, "epoch": 2007} {"train_loss": -11.981758117675781, "global_step": 337338, "epoch": 2007} {"train_loss": -11.943618774414062, "global_step": 337339, "epoch": 2007} {"train_loss": -11.988941192626953, "global_step": 337340, "epoch": 2007} {"train_loss": -11.688669204711914, "global_step": 337341, "epoch": 2007} {"train_loss": -12.005581855773926, "global_step": 337342, "epoch": 2007} {"train_loss": -11.44966858625412, "global_step": 337343, "epoch": 2007, "val_loss": 287093.21875} {"train_loss": -12.09467887878418, "global_step": 337344, "epoch": 2008} {"train_loss": -12.019601821899414, "global_step": 337345, "epoch": 2008} {"train_loss": -12.047292709350586, "global_step": 337346, "epoch": 2008} {"train_loss": -11.803762435913086, "global_step": 337347, "epoch": 2008} {"train_loss": -12.027968406677246, "global_step": 337348, "epoch": 2008} {"train_loss": -12.214784622192383, "global_step": 337349, "epoch": 2008} {"train_loss": -12.309885025024414, "global_step": 337350, "epoch": 2008} {"train_loss": -12.176189422607422, "global_step": 337351, "epoch": 2008} {"train_loss": -12.009653091430664, "global_step": 337352, "epoch": 2008} {"train_loss": -12.359149932861328, "global_step": 337353, "epoch": 2008} {"train_loss": -12.169057846069336, "global_step": 337354, "epoch": 2008} {"train_loss": -12.336008071899414, "global_step": 337355, "epoch": 2008} {"train_loss": -11.831892013549805, "global_step": 337356, "epoch": 2008} {"train_loss": -12.149614334106445, "global_step": 337357, "epoch": 2008} {"train_loss": -12.104475021362305, "global_step": 337358, "epoch": 2008} {"train_loss": -12.31602668762207, "global_step": 337359, "epoch": 2008} {"train_loss": -12.154886245727539, "global_step": 337360, "epoch": 2008} {"train_loss": -12.054168701171875, "global_step": 337361, "epoch": 2008} {"train_loss": -12.305925369262695, "global_step": 337362, "epoch": 2008} {"train_loss": -11.984817504882812, "global_step": 337363, "epoch": 2008} {"train_loss": -12.219010353088379, "global_step": 337364, "epoch": 2008} {"train_loss": -12.286014556884766, "global_step": 337365, "epoch": 2008} {"train_loss": -12.359604835510254, "global_step": 337366, "epoch": 2008} {"train_loss": -12.284103393554688, "global_step": 337367, "epoch": 2008} {"train_loss": -12.28759479522705, "global_step": 337368, "epoch": 2008} {"train_loss": -12.257848739624023, "global_step": 337369, "epoch": 2008} {"train_loss": -12.330743789672852, "global_step": 337370, "epoch": 2008} {"train_loss": -12.292754173278809, "global_step": 337371, "epoch": 2008} {"train_loss": -12.21026611328125, "global_step": 337372, "epoch": 2008} {"train_loss": -12.191206932067871, "global_step": 337373, "epoch": 2008} {"train_loss": -12.446067810058594, "global_step": 337374, "epoch": 2008} {"train_loss": -12.131853103637695, "global_step": 337375, "epoch": 2008} {"train_loss": -12.573702812194824, "global_step": 337376, "epoch": 2008} {"train_loss": -12.251941680908203, "global_step": 337377, "epoch": 2008} {"train_loss": -12.099405288696289, "global_step": 337378, "epoch": 2008} {"train_loss": -12.453557968139648, "global_step": 337379, "epoch": 2008} {"train_loss": -12.375776290893555, "global_step": 337380, "epoch": 2008} {"train_loss": -11.93886947631836, "global_step": 337381, "epoch": 2008} {"train_loss": -12.389362335205078, "global_step": 337382, "epoch": 2008} {"train_loss": -12.36925220489502, "global_step": 337383, "epoch": 2008} {"train_loss": -12.3502779006958, "global_step": 337384, "epoch": 2008} {"train_loss": -12.59109878540039, "global_step": 337385, "epoch": 2008} {"train_loss": -12.459188461303711, "global_step": 337386, "epoch": 2008} {"train_loss": -12.540019989013672, "global_step": 337387, "epoch": 2008} {"train_loss": -12.388879776000977, "global_step": 337388, "epoch": 2008} {"train_loss": -12.46011734008789, "global_step": 337389, "epoch": 2008} {"train_loss": -12.50482177734375, "global_step": 337390, "epoch": 2008} {"train_loss": -12.627992630004883, "global_step": 337391, "epoch": 2008} {"train_loss": -12.548849105834961, "global_step": 337392, "epoch": 2008} {"train_loss": -12.616323471069336, "global_step": 337393, "epoch": 2008} {"train_loss": -12.53178596496582, "global_step": 337394, "epoch": 2008} {"train_loss": -12.486784934997559, "global_step": 337395, "epoch": 2008} {"train_loss": -12.758503913879395, "global_step": 337396, "epoch": 2008} {"train_loss": -12.711814880371094, "global_step": 337397, "epoch": 2008} {"train_loss": -12.441032409667969, "global_step": 337398, "epoch": 2008} {"train_loss": -12.453893661499023, "global_step": 337399, "epoch": 2008} {"train_loss": -12.451480865478516, "global_step": 337400, "epoch": 2008} {"train_loss": -12.568704605102539, "global_step": 337401, "epoch": 2008} {"train_loss": -12.476826667785645, "global_step": 337402, "epoch": 2008} {"train_loss": -12.723662376403809, "global_step": 337403, "epoch": 2008} {"train_loss": -12.672053337097168, "global_step": 337404, "epoch": 2008} {"train_loss": -12.51546859741211, "global_step": 337405, "epoch": 2008} {"train_loss": -12.342330932617188, "global_step": 337406, "epoch": 2008} {"train_loss": -12.75811767578125, "global_step": 337407, "epoch": 2008} {"train_loss": -12.66669750213623, "global_step": 337408, "epoch": 2008} {"train_loss": -12.641629219055176, "global_step": 337409, "epoch": 2008} {"train_loss": -12.656696319580078, "global_step": 337410, "epoch": 2008} {"train_loss": -12.304877281188965, "global_step": 337411, "epoch": 2008} {"train_loss": -12.578080177307129, "global_step": 337412, "epoch": 2008} {"train_loss": -12.584676742553711, "global_step": 337413, "epoch": 2008} {"train_loss": -12.610380172729492, "global_step": 337414, "epoch": 2008} {"train_loss": -12.033943176269531, "global_step": 337415, "epoch": 2008} {"train_loss": -12.210081100463867, "global_step": 337416, "epoch": 2008} {"train_loss": -12.139307022094727, "global_step": 337417, "epoch": 2008} {"train_loss": -11.546064376831055, "global_step": 337418, "epoch": 2008} {"train_loss": -10.815167427062988, "global_step": 337419, "epoch": 2008} {"train_loss": -11.019028663635254, "global_step": 337420, "epoch": 2008} {"train_loss": -11.72795581817627, "global_step": 337421, "epoch": 2008} {"train_loss": -12.212729454040527, "global_step": 337422, "epoch": 2008} {"train_loss": -9.895029067993164, "global_step": 337423, "epoch": 2008} {"train_loss": -11.424764633178711, "global_step": 337424, "epoch": 2008} {"train_loss": -11.952170372009277, "global_step": 337425, "epoch": 2008} {"train_loss": -11.208138465881348, "global_step": 337426, "epoch": 2008} {"train_loss": -11.250935554504395, "global_step": 337427, "epoch": 2008} {"train_loss": -12.554569244384766, "global_step": 337428, "epoch": 2008} {"train_loss": -11.88492202758789, "global_step": 337429, "epoch": 2008} {"train_loss": -11.639216423034668, "global_step": 337430, "epoch": 2008} {"train_loss": -12.150705337524414, "global_step": 337431, "epoch": 2008} {"train_loss": -11.890231132507324, "global_step": 337432, "epoch": 2008} {"train_loss": -12.285761833190918, "global_step": 337433, "epoch": 2008} {"train_loss": -12.39902114868164, "global_step": 337434, "epoch": 2008} {"train_loss": -12.0761079788208, "global_step": 337435, "epoch": 2008} {"train_loss": -11.931812286376953, "global_step": 337436, "epoch": 2008} {"train_loss": -11.858160018920898, "global_step": 337437, "epoch": 2008} {"train_loss": -12.423968315124512, "global_step": 337438, "epoch": 2008} {"train_loss": -12.377798080444336, "global_step": 337439, "epoch": 2008} {"train_loss": -12.37771224975586, "global_step": 337440, "epoch": 2008} {"train_loss": -11.8438138961792, "global_step": 337441, "epoch": 2008} {"train_loss": -12.210538864135742, "global_step": 337442, "epoch": 2008} {"train_loss": -12.105831146240234, "global_step": 337443, "epoch": 2008} {"train_loss": -12.558255195617676, "global_step": 337444, "epoch": 2008} {"train_loss": -11.901496887207031, "global_step": 337445, "epoch": 2008} {"train_loss": -11.451343536376953, "global_step": 337446, "epoch": 2008} {"train_loss": -11.890022277832031, "global_step": 337447, "epoch": 2008} {"train_loss": -12.203234672546387, "global_step": 337448, "epoch": 2008} {"train_loss": -11.985377311706543, "global_step": 337449, "epoch": 2008} {"train_loss": -12.241634368896484, "global_step": 337450, "epoch": 2008} {"train_loss": -12.419317245483398, "global_step": 337451, "epoch": 2008} {"train_loss": -12.084936141967773, "global_step": 337452, "epoch": 2008} {"train_loss": -12.089616775512695, "global_step": 337453, "epoch": 2008} {"train_loss": -12.321409225463867, "global_step": 337454, "epoch": 2008} {"train_loss": -12.243463516235352, "global_step": 337455, "epoch": 2008} {"train_loss": -12.186118125915527, "global_step": 337456, "epoch": 2008} {"train_loss": -12.210363388061523, "global_step": 337457, "epoch": 2008} {"train_loss": -12.399224281311035, "global_step": 337458, "epoch": 2008} {"train_loss": -12.285848617553711, "global_step": 337459, "epoch": 2008} {"train_loss": -12.321569442749023, "global_step": 337460, "epoch": 2008} {"train_loss": -11.758270263671875, "global_step": 337461, "epoch": 2008} {"train_loss": -11.513429641723633, "global_step": 337462, "epoch": 2008} {"train_loss": -11.886513710021973, "global_step": 337463, "epoch": 2008} {"train_loss": -12.063557624816895, "global_step": 337464, "epoch": 2008} {"train_loss": -12.07139778137207, "global_step": 337465, "epoch": 2008} {"train_loss": -11.797994613647461, "global_step": 337466, "epoch": 2008} {"train_loss": -12.341167449951172, "global_step": 337467, "epoch": 2008} {"train_loss": -11.702869415283203, "global_step": 337468, "epoch": 2008} {"train_loss": -11.83065414428711, "global_step": 337469, "epoch": 2008} {"train_loss": -11.700054168701172, "global_step": 337470, "epoch": 2008} {"train_loss": -12.541667938232422, "global_step": 337471, "epoch": 2008} {"train_loss": -11.674175262451172, "global_step": 337472, "epoch": 2008} {"train_loss": -12.153470993041992, "global_step": 337473, "epoch": 2008} {"train_loss": -11.15733528137207, "global_step": 337474, "epoch": 2008} {"train_loss": -11.460956573486328, "global_step": 337475, "epoch": 2008} {"train_loss": -11.418750762939453, "global_step": 337476, "epoch": 2008} {"train_loss": -11.239059448242188, "global_step": 337477, "epoch": 2008} {"train_loss": -11.909189224243164, "global_step": 337478, "epoch": 2008} {"train_loss": -10.337854385375977, "global_step": 337479, "epoch": 2008} {"train_loss": -11.436973571777344, "global_step": 337480, "epoch": 2008} {"train_loss": -9.836859703063965, "global_step": 337481, "epoch": 2008} {"train_loss": -10.203514099121094, "global_step": 337482, "epoch": 2008} {"train_loss": -9.938539505004883, "global_step": 337483, "epoch": 2008} {"train_loss": -10.651008605957031, "global_step": 337484, "epoch": 2008} {"train_loss": -11.003238677978516, "global_step": 337485, "epoch": 2008} {"train_loss": -10.608341217041016, "global_step": 337486, "epoch": 2008} {"train_loss": -10.172778129577637, "global_step": 337487, "epoch": 2008} {"train_loss": -11.896677017211914, "global_step": 337488, "epoch": 2008} {"train_loss": -10.931808471679688, "global_step": 337489, "epoch": 2008} {"train_loss": -10.939973831176758, "global_step": 337490, "epoch": 2008} {"train_loss": -11.678815841674805, "global_step": 337491, "epoch": 2008} {"train_loss": -10.688943862915039, "global_step": 337492, "epoch": 2008} {"train_loss": -11.58680248260498, "global_step": 337493, "epoch": 2008} {"train_loss": -10.887836456298828, "global_step": 337494, "epoch": 2008} {"train_loss": -10.462945938110352, "global_step": 337495, "epoch": 2008} {"train_loss": -11.940152168273926, "global_step": 337496, "epoch": 2008} {"train_loss": -11.066953659057617, "global_step": 337497, "epoch": 2008} {"train_loss": -11.008084297180176, "global_step": 337498, "epoch": 2008} {"train_loss": -11.65184211730957, "global_step": 337499, "epoch": 2008} {"train_loss": -11.195491790771484, "global_step": 337500, "epoch": 2008} {"train_loss": -11.909912109375, "global_step": 337501, "epoch": 2008} {"train_loss": -11.24056625366211, "global_step": 337502, "epoch": 2008} {"train_loss": -11.62171745300293, "global_step": 337503, "epoch": 2008} {"train_loss": -11.817461013793945, "global_step": 337504, "epoch": 2008} {"train_loss": -11.464323043823242, "global_step": 337505, "epoch": 2008} {"train_loss": -11.680961608886719, "global_step": 337506, "epoch": 2008} {"train_loss": -11.433223724365234, "global_step": 337507, "epoch": 2008} {"train_loss": -11.86825942993164, "global_step": 337508, "epoch": 2008} {"train_loss": -11.588401794433594, "global_step": 337509, "epoch": 2008} {"train_loss": -11.82738971710205, "global_step": 337510, "epoch": 2008} {"train_loss": -11.953513667696999, "global_step": 337511, "epoch": 2008, "val_loss": 290016.375} {"train_loss": -11.544612884521484, "global_step": 337512, "epoch": 2009} {"train_loss": -11.490884780883789, "global_step": 337513, "epoch": 2009} {"train_loss": -11.427168846130371, "global_step": 337514, "epoch": 2009} {"train_loss": -11.789188385009766, "global_step": 337515, "epoch": 2009} {"train_loss": -11.524133682250977, "global_step": 337516, "epoch": 2009} {"train_loss": -11.68968391418457, "global_step": 337517, "epoch": 2009} {"train_loss": -11.351975440979004, "global_step": 337518, "epoch": 2009} {"train_loss": -11.46562385559082, "global_step": 337519, "epoch": 2009} {"train_loss": -12.029123306274414, "global_step": 337520, "epoch": 2009} {"train_loss": -11.393777847290039, "global_step": 337521, "epoch": 2009} {"train_loss": -12.068548202514648, "global_step": 337522, "epoch": 2009} {"train_loss": -11.528828620910645, "global_step": 337523, "epoch": 2009} {"train_loss": -11.923896789550781, "global_step": 337524, "epoch": 2009} {"train_loss": -11.645293235778809, "global_step": 337525, "epoch": 2009} {"train_loss": -12.0128173828125, "global_step": 337526, "epoch": 2009} {"train_loss": -12.00936222076416, "global_step": 337527, "epoch": 2009} {"train_loss": -11.952249526977539, "global_step": 337528, "epoch": 2009} {"train_loss": -11.93010425567627, "global_step": 337529, "epoch": 2009} {"train_loss": -12.191774368286133, "global_step": 337530, "epoch": 2009} {"train_loss": -12.098857879638672, "global_step": 337531, "epoch": 2009} {"train_loss": -11.885866165161133, "global_step": 337532, "epoch": 2009} {"train_loss": -11.66291618347168, "global_step": 337533, "epoch": 2009} {"train_loss": -12.04958724975586, "global_step": 337534, "epoch": 2009} {"train_loss": -11.976537704467773, "global_step": 337535, "epoch": 2009} {"train_loss": -11.86904525756836, "global_step": 337536, "epoch": 2009} {"train_loss": -12.151185035705566, "global_step": 337537, "epoch": 2009} {"train_loss": -11.833464622497559, "global_step": 337538, "epoch": 2009} {"train_loss": -12.007453918457031, "global_step": 337539, "epoch": 2009} {"train_loss": -11.867023468017578, "global_step": 337540, "epoch": 2009} {"train_loss": -12.164712905883789, "global_step": 337541, "epoch": 2009} {"train_loss": -12.208638191223145, "global_step": 337542, "epoch": 2009} {"train_loss": -12.002464294433594, "global_step": 337543, "epoch": 2009} {"train_loss": -12.343236923217773, "global_step": 337544, "epoch": 2009} {"train_loss": -11.890604972839355, "global_step": 337545, "epoch": 2009} {"train_loss": -12.326713562011719, "global_step": 337546, "epoch": 2009} {"train_loss": -12.102478981018066, "global_step": 337547, "epoch": 2009} {"train_loss": -12.050947189331055, "global_step": 337548, "epoch": 2009} {"train_loss": -11.987137794494629, "global_step": 337549, "epoch": 2009} {"train_loss": -11.979198455810547, "global_step": 337550, "epoch": 2009} {"train_loss": -11.864667892456055, "global_step": 337551, "epoch": 2009} {"train_loss": -11.92983627319336, "global_step": 337552, "epoch": 2009} {"train_loss": -11.903427124023438, "global_step": 337553, "epoch": 2009} {"train_loss": -12.18709945678711, "global_step": 337554, "epoch": 2009} {"train_loss": -12.0802583694458, "global_step": 337555, "epoch": 2009} {"train_loss": -12.166653633117676, "global_step": 337556, "epoch": 2009} {"train_loss": -12.296433448791504, "global_step": 337557, "epoch": 2009} {"train_loss": -12.244271278381348, "global_step": 337558, "epoch": 2009} {"train_loss": -12.158218383789062, "global_step": 337559, "epoch": 2009} {"train_loss": -12.051349639892578, "global_step": 337560, "epoch": 2009} {"train_loss": -12.38032341003418, "global_step": 337561, "epoch": 2009} {"train_loss": -12.159942626953125, "global_step": 337562, "epoch": 2009} {"train_loss": -12.022018432617188, "global_step": 337563, "epoch": 2009} {"train_loss": -12.299755096435547, "global_step": 337564, "epoch": 2009} {"train_loss": -11.932796478271484, "global_step": 337565, "epoch": 2009} {"train_loss": -11.431861877441406, "global_step": 337566, "epoch": 2009} {"train_loss": -12.305279731750488, "global_step": 337567, "epoch": 2009} {"train_loss": -11.965421676635742, "global_step": 337568, "epoch": 2009} {"train_loss": -12.24786376953125, "global_step": 337569, "epoch": 2009} {"train_loss": -12.053068161010742, "global_step": 337570, "epoch": 2009} {"train_loss": -12.167840957641602, "global_step": 337571, "epoch": 2009} {"train_loss": -12.386907577514648, "global_step": 337572, "epoch": 2009} {"train_loss": -12.033193588256836, "global_step": 337573, "epoch": 2009} {"train_loss": -12.428948402404785, "global_step": 337574, "epoch": 2009} {"train_loss": -11.763652801513672, "global_step": 337575, "epoch": 2009} {"train_loss": -12.32913589477539, "global_step": 337576, "epoch": 2009} {"train_loss": -12.15998649597168, "global_step": 337577, "epoch": 2009} {"train_loss": -12.150198936462402, "global_step": 337578, "epoch": 2009} {"train_loss": -12.432418823242188, "global_step": 337579, "epoch": 2009} {"train_loss": -12.489947319030762, "global_step": 337580, "epoch": 2009} {"train_loss": -12.379083633422852, "global_step": 337581, "epoch": 2009} {"train_loss": -12.262259483337402, "global_step": 337582, "epoch": 2009} {"train_loss": -12.400921821594238, "global_step": 337583, "epoch": 2009} {"train_loss": -12.206918716430664, "global_step": 337584, "epoch": 2009} {"train_loss": -12.30383586883545, "global_step": 337585, "epoch": 2009} {"train_loss": -12.408232688903809, "global_step": 337586, "epoch": 2009} {"train_loss": -12.323690414428711, "global_step": 337587, "epoch": 2009} {"train_loss": -12.623388290405273, "global_step": 337588, "epoch": 2009} {"train_loss": -12.203901290893555, "global_step": 337589, "epoch": 2009} {"train_loss": -12.318000793457031, "global_step": 337590, "epoch": 2009} {"train_loss": -12.253549575805664, "global_step": 337591, "epoch": 2009} {"train_loss": -12.435203552246094, "global_step": 337592, "epoch": 2009} {"train_loss": -12.389494895935059, "global_step": 337593, "epoch": 2009} {"train_loss": -12.229753494262695, "global_step": 337594, "epoch": 2009} {"train_loss": -12.412027359008789, "global_step": 337595, "epoch": 2009} {"train_loss": -12.479082107543945, "global_step": 337596, "epoch": 2009} {"train_loss": -12.306806564331055, "global_step": 337597, "epoch": 2009} {"train_loss": -12.680927276611328, "global_step": 337598, "epoch": 2009} {"train_loss": -12.282041549682617, "global_step": 337599, "epoch": 2009} {"train_loss": -12.576587677001953, "global_step": 337600, "epoch": 2009} {"train_loss": -12.556085586547852, "global_step": 337601, "epoch": 2009} {"train_loss": -12.696989059448242, "global_step": 337602, "epoch": 2009} {"train_loss": -12.495738983154297, "global_step": 337603, "epoch": 2009} {"train_loss": -12.665283203125, "global_step": 337604, "epoch": 2009} {"train_loss": -12.797224044799805, "global_step": 337605, "epoch": 2009} {"train_loss": -12.522637367248535, "global_step": 337606, "epoch": 2009} {"train_loss": -12.721956253051758, "global_step": 337607, "epoch": 2009} {"train_loss": -12.610669136047363, "global_step": 337608, "epoch": 2009} {"train_loss": -12.82223892211914, "global_step": 337609, "epoch": 2009} {"train_loss": -12.587766647338867, "global_step": 337610, "epoch": 2009} {"train_loss": -12.725900650024414, "global_step": 337611, "epoch": 2009} {"train_loss": -12.751493453979492, "global_step": 337612, "epoch": 2009} {"train_loss": -12.801254272460938, "global_step": 337613, "epoch": 2009} {"train_loss": -12.413015365600586, "global_step": 337614, "epoch": 2009} {"train_loss": -12.700172424316406, "global_step": 337615, "epoch": 2009} {"train_loss": -12.633723258972168, "global_step": 337616, "epoch": 2009} {"train_loss": -12.750686645507812, "global_step": 337617, "epoch": 2009} {"train_loss": -12.680390357971191, "global_step": 337618, "epoch": 2009} {"train_loss": -12.366628646850586, "global_step": 337619, "epoch": 2009} {"train_loss": -12.477958679199219, "global_step": 337620, "epoch": 2009} {"train_loss": -12.532316207885742, "global_step": 337621, "epoch": 2009} {"train_loss": -12.504803657531738, "global_step": 337622, "epoch": 2009} {"train_loss": -12.454691886901855, "global_step": 337623, "epoch": 2009} {"train_loss": -12.671396255493164, "global_step": 337624, "epoch": 2009} {"train_loss": -12.451545715332031, "global_step": 337625, "epoch": 2009} {"train_loss": -12.399194717407227, "global_step": 337626, "epoch": 2009} {"train_loss": -12.225933074951172, "global_step": 337627, "epoch": 2009} {"train_loss": -12.158639907836914, "global_step": 337628, "epoch": 2009} {"train_loss": -11.802616119384766, "global_step": 337629, "epoch": 2009} {"train_loss": -12.325525283813477, "global_step": 337630, "epoch": 2009} {"train_loss": -12.330892562866211, "global_step": 337631, "epoch": 2009} {"train_loss": -12.000232696533203, "global_step": 337632, "epoch": 2009} {"train_loss": -12.043889999389648, "global_step": 337633, "epoch": 2009} {"train_loss": -12.420297622680664, "global_step": 337634, "epoch": 2009} {"train_loss": -12.169574737548828, "global_step": 337635, "epoch": 2009} {"train_loss": -12.066426277160645, "global_step": 337636, "epoch": 2009} {"train_loss": -11.927453994750977, "global_step": 337637, "epoch": 2009} {"train_loss": -12.509486198425293, "global_step": 337638, "epoch": 2009} {"train_loss": -12.507490158081055, "global_step": 337639, "epoch": 2009} {"train_loss": -12.632895469665527, "global_step": 337640, "epoch": 2009} {"train_loss": -12.32215690612793, "global_step": 337641, "epoch": 2009} {"train_loss": -12.16296100616455, "global_step": 337642, "epoch": 2009} {"train_loss": -12.124504089355469, "global_step": 337643, "epoch": 2009} {"train_loss": -12.311448097229004, "global_step": 337644, "epoch": 2009} {"train_loss": -12.508665084838867, "global_step": 337645, "epoch": 2009} {"train_loss": -12.15157699584961, "global_step": 337646, "epoch": 2009} {"train_loss": -11.713181495666504, "global_step": 337647, "epoch": 2009} {"train_loss": -10.844764709472656, "global_step": 337648, "epoch": 2009} {"train_loss": -11.184635162353516, "global_step": 337649, "epoch": 2009} {"train_loss": -10.364272117614746, "global_step": 337650, "epoch": 2009} {"train_loss": -10.588468551635742, "global_step": 337651, "epoch": 2009} {"train_loss": -11.174948692321777, "global_step": 337652, "epoch": 2009} {"train_loss": -11.442798614501953, "global_step": 337653, "epoch": 2009} {"train_loss": -11.431354522705078, "global_step": 337654, "epoch": 2009} {"train_loss": -11.832313537597656, "global_step": 337655, "epoch": 2009} {"train_loss": -11.797231674194336, "global_step": 337656, "epoch": 2009} {"train_loss": -11.716659545898438, "global_step": 337657, "epoch": 2009} {"train_loss": -11.339301109313965, "global_step": 337658, "epoch": 2009} {"train_loss": -11.508407592773438, "global_step": 337659, "epoch": 2009} {"train_loss": -10.520671844482422, "global_step": 337660, "epoch": 2009} {"train_loss": -11.601844787597656, "global_step": 337661, "epoch": 2009} {"train_loss": -11.119346618652344, "global_step": 337662, "epoch": 2009} {"train_loss": -10.046793937683105, "global_step": 337663, "epoch": 2009} {"train_loss": -11.228281021118164, "global_step": 337664, "epoch": 2009} {"train_loss": -10.504949569702148, "global_step": 337665, "epoch": 2009} {"train_loss": -10.571743965148926, "global_step": 337666, "epoch": 2009} {"train_loss": -11.340060234069824, "global_step": 337667, "epoch": 2009} {"train_loss": -10.27304458618164, "global_step": 337668, "epoch": 2009} {"train_loss": -11.5341796875, "global_step": 337669, "epoch": 2009} {"train_loss": -9.2213716506958, "global_step": 337670, "epoch": 2009} {"train_loss": -12.180461883544922, "global_step": 337671, "epoch": 2009} {"train_loss": -10.2223482131958, "global_step": 337672, "epoch": 2009} {"train_loss": -11.378625869750977, "global_step": 337673, "epoch": 2009} {"train_loss": -11.573027610778809, "global_step": 337674, "epoch": 2009} {"train_loss": -11.125673294067383, "global_step": 337675, "epoch": 2009} {"train_loss": -12.004867553710938, "global_step": 337676, "epoch": 2009} {"train_loss": -11.549066543579102, "global_step": 337677, "epoch": 2009} {"train_loss": -11.57302188873291, "global_step": 337678, "epoch": 2009} {"train_loss": -11.998581488927206, "global_step": 337679, "epoch": 2009, "val_loss": 291700.15625} {"train_loss": -11.887505531311035, "global_step": 337680, "epoch": 2010} {"train_loss": -12.017382621765137, "global_step": 337681, "epoch": 2010} {"train_loss": -11.544731140136719, "global_step": 337682, "epoch": 2010} {"train_loss": -12.009908676147461, "global_step": 337683, "epoch": 2010} {"train_loss": -11.753046989440918, "global_step": 337684, "epoch": 2010} {"train_loss": -12.006837844848633, "global_step": 337685, "epoch": 2010} {"train_loss": -11.903116226196289, "global_step": 337686, "epoch": 2010} {"train_loss": -11.817689895629883, "global_step": 337687, "epoch": 2010} {"train_loss": -12.297538757324219, "global_step": 337688, "epoch": 2010} {"train_loss": -11.843559265136719, "global_step": 337689, "epoch": 2010} {"train_loss": -12.245777130126953, "global_step": 337690, "epoch": 2010} {"train_loss": -12.120057106018066, "global_step": 337691, "epoch": 2010} {"train_loss": -12.179550170898438, "global_step": 337692, "epoch": 2010} {"train_loss": -12.1592435836792, "global_step": 337693, "epoch": 2010} {"train_loss": -11.958972930908203, "global_step": 337694, "epoch": 2010} {"train_loss": -12.211210250854492, "global_step": 337695, "epoch": 2010} {"train_loss": -12.018823623657227, "global_step": 337696, "epoch": 2010} {"train_loss": -11.998987197875977, "global_step": 337697, "epoch": 2010} {"train_loss": -12.192667961120605, "global_step": 337698, "epoch": 2010} {"train_loss": -11.871638298034668, "global_step": 337699, "epoch": 2010} {"train_loss": -12.264842987060547, "global_step": 337700, "epoch": 2010} {"train_loss": -11.414201736450195, "global_step": 337701, "epoch": 2010} {"train_loss": -11.982059478759766, "global_step": 337702, "epoch": 2010} {"train_loss": -11.877371788024902, "global_step": 337703, "epoch": 2010} {"train_loss": -11.913593292236328, "global_step": 337704, "epoch": 2010} {"train_loss": -12.002813339233398, "global_step": 337705, "epoch": 2010} {"train_loss": -11.99694538116455, "global_step": 337706, "epoch": 2010} {"train_loss": -12.260782241821289, "global_step": 337707, "epoch": 2010} {"train_loss": -11.975091934204102, "global_step": 337708, "epoch": 2010} {"train_loss": -12.323732376098633, "global_step": 337709, "epoch": 2010} {"train_loss": -12.303678512573242, "global_step": 337710, "epoch": 2010} {"train_loss": -12.03349494934082, "global_step": 337711, "epoch": 2010} {"train_loss": -12.23994255065918, "global_step": 337712, "epoch": 2010} {"train_loss": -11.852174758911133, "global_step": 337713, "epoch": 2010} {"train_loss": -11.91496753692627, "global_step": 337714, "epoch": 2010} {"train_loss": -12.037235260009766, "global_step": 337715, "epoch": 2010} {"train_loss": -11.646503448486328, "global_step": 337716, "epoch": 2010} {"train_loss": -12.082565307617188, "global_step": 337717, "epoch": 2010} {"train_loss": -11.769669532775879, "global_step": 337718, "epoch": 2010} {"train_loss": -12.226619720458984, "global_step": 337719, "epoch": 2010} {"train_loss": -11.710504531860352, "global_step": 337720, "epoch": 2010} {"train_loss": -12.002023696899414, "global_step": 337721, "epoch": 2010} {"train_loss": -12.021215438842773, "global_step": 337722, "epoch": 2010} {"train_loss": -11.935595512390137, "global_step": 337723, "epoch": 2010} {"train_loss": -12.368896484375, "global_step": 337724, "epoch": 2010} {"train_loss": -12.170659065246582, "global_step": 337725, "epoch": 2010} {"train_loss": -12.131888389587402, "global_step": 337726, "epoch": 2010} {"train_loss": -12.513198852539062, "global_step": 337727, "epoch": 2010} {"train_loss": -11.892916679382324, "global_step": 337728, "epoch": 2010} {"train_loss": -12.567474365234375, "global_step": 337729, "epoch": 2010} {"train_loss": -12.281715393066406, "global_step": 337730, "epoch": 2010} {"train_loss": -12.230682373046875, "global_step": 337731, "epoch": 2010} {"train_loss": -12.357901573181152, "global_step": 337732, "epoch": 2010} {"train_loss": -11.88250732421875, "global_step": 337733, "epoch": 2010} {"train_loss": -12.363306045532227, "global_step": 337734, "epoch": 2010} {"train_loss": -12.099013328552246, "global_step": 337735, "epoch": 2010} {"train_loss": -12.292192459106445, "global_step": 337736, "epoch": 2010} {"train_loss": -11.706052780151367, "global_step": 337737, "epoch": 2010} {"train_loss": -12.270483016967773, "global_step": 337738, "epoch": 2010} {"train_loss": -12.202481269836426, "global_step": 337739, "epoch": 2010} {"train_loss": -12.238828659057617, "global_step": 337740, "epoch": 2010} {"train_loss": -12.085782051086426, "global_step": 337741, "epoch": 2010} {"train_loss": -11.83594799041748, "global_step": 337742, "epoch": 2010} {"train_loss": -12.047746658325195, "global_step": 337743, "epoch": 2010} {"train_loss": -12.349264144897461, "global_step": 337744, "epoch": 2010} {"train_loss": -11.482889175415039, "global_step": 337745, "epoch": 2010} {"train_loss": -11.318588256835938, "global_step": 337746, "epoch": 2010} {"train_loss": -12.120780944824219, "global_step": 337747, "epoch": 2010} {"train_loss": -11.433618545532227, "global_step": 337748, "epoch": 2010} {"train_loss": -11.473104476928711, "global_step": 337749, "epoch": 2010} {"train_loss": -12.202232360839844, "global_step": 337750, "epoch": 2010} {"train_loss": -11.344900131225586, "global_step": 337751, "epoch": 2010} {"train_loss": -11.773065567016602, "global_step": 337752, "epoch": 2010} {"train_loss": -12.105936050415039, "global_step": 337753, "epoch": 2010} {"train_loss": -11.785991668701172, "global_step": 337754, "epoch": 2010} {"train_loss": -12.165153503417969, "global_step": 337755, "epoch": 2010} {"train_loss": -11.49055290222168, "global_step": 337756, "epoch": 2010} {"train_loss": -12.139411926269531, "global_step": 337757, "epoch": 2010} {"train_loss": -12.065475463867188, "global_step": 337758, "epoch": 2010} {"train_loss": -11.662179946899414, "global_step": 337759, "epoch": 2010} {"train_loss": -11.585371017456055, "global_step": 337760, "epoch": 2010} {"train_loss": -11.777914047241211, "global_step": 337761, "epoch": 2010} {"train_loss": -11.216412544250488, "global_step": 337762, "epoch": 2010} {"train_loss": -11.215470314025879, "global_step": 337763, "epoch": 2010} {"train_loss": -11.802088737487793, "global_step": 337764, "epoch": 2010} {"train_loss": -11.865020751953125, "global_step": 337765, "epoch": 2010} {"train_loss": -10.875116348266602, "global_step": 337766, "epoch": 2010} {"train_loss": -12.038508415222168, "global_step": 337767, "epoch": 2010} {"train_loss": -11.23511791229248, "global_step": 337768, "epoch": 2010} {"train_loss": -11.200644493103027, "global_step": 337769, "epoch": 2010} {"train_loss": -11.371373176574707, "global_step": 337770, "epoch": 2010} {"train_loss": -11.349149703979492, "global_step": 337771, "epoch": 2010} {"train_loss": -12.022323608398438, "global_step": 337772, "epoch": 2010} {"train_loss": -11.725717544555664, "global_step": 337773, "epoch": 2010} {"train_loss": -11.925224304199219, "global_step": 337774, "epoch": 2010} {"train_loss": -11.616260528564453, "global_step": 337775, "epoch": 2010} {"train_loss": -11.990591049194336, "global_step": 337776, "epoch": 2010} {"train_loss": -11.81114387512207, "global_step": 337777, "epoch": 2010} {"train_loss": -11.272615432739258, "global_step": 337778, "epoch": 2010} {"train_loss": -12.192952156066895, "global_step": 337779, "epoch": 2010} {"train_loss": -10.795660018920898, "global_step": 337780, "epoch": 2010} {"train_loss": -11.602333068847656, "global_step": 337781, "epoch": 2010} {"train_loss": -10.99863052368164, "global_step": 337782, "epoch": 2010} {"train_loss": -11.261465072631836, "global_step": 337783, "epoch": 2010} {"train_loss": -11.798383712768555, "global_step": 337784, "epoch": 2010} {"train_loss": -11.267630577087402, "global_step": 337785, "epoch": 2010} {"train_loss": -12.045316696166992, "global_step": 337786, "epoch": 2010} {"train_loss": -10.751928329467773, "global_step": 337787, "epoch": 2010} {"train_loss": -11.861124038696289, "global_step": 337788, "epoch": 2010} {"train_loss": -11.243154525756836, "global_step": 337789, "epoch": 2010} {"train_loss": -11.646689414978027, "global_step": 337790, "epoch": 2010} {"train_loss": -10.768759727478027, "global_step": 337791, "epoch": 2010} {"train_loss": -11.49390983581543, "global_step": 337792, "epoch": 2010} {"train_loss": -11.771184921264648, "global_step": 337793, "epoch": 2010} {"train_loss": -11.08391284942627, "global_step": 337794, "epoch": 2010} {"train_loss": -11.970787048339844, "global_step": 337795, "epoch": 2010} {"train_loss": -11.029118537902832, "global_step": 337796, "epoch": 2010} {"train_loss": -11.115135192871094, "global_step": 337797, "epoch": 2010} {"train_loss": -11.727136611938477, "global_step": 337798, "epoch": 2010} {"train_loss": -11.353172302246094, "global_step": 337799, "epoch": 2010} {"train_loss": -12.005521774291992, "global_step": 337800, "epoch": 2010} {"train_loss": -11.573938369750977, "global_step": 337801, "epoch": 2010} {"train_loss": -11.432859420776367, "global_step": 337802, "epoch": 2010} {"train_loss": -11.440338134765625, "global_step": 337803, "epoch": 2010} {"train_loss": -11.527965545654297, "global_step": 337804, "epoch": 2010} {"train_loss": -11.191451072692871, "global_step": 337805, "epoch": 2010} {"train_loss": -11.64522647857666, "global_step": 337806, "epoch": 2010} {"train_loss": -11.36185073852539, "global_step": 337807, "epoch": 2010} {"train_loss": -12.010612487792969, "global_step": 337808, "epoch": 2010} {"train_loss": -11.58914566040039, "global_step": 337809, "epoch": 2010} {"train_loss": -12.13868236541748, "global_step": 337810, "epoch": 2010} {"train_loss": -11.97127914428711, "global_step": 337811, "epoch": 2010} {"train_loss": -12.024648666381836, "global_step": 337812, "epoch": 2010} {"train_loss": -12.126550674438477, "global_step": 337813, "epoch": 2010} {"train_loss": -11.827383995056152, "global_step": 337814, "epoch": 2010} {"train_loss": -12.370925903320312, "global_step": 337815, "epoch": 2010} {"train_loss": -12.009066581726074, "global_step": 337816, "epoch": 2010} {"train_loss": -12.39988899230957, "global_step": 337817, "epoch": 2010} {"train_loss": -12.244760513305664, "global_step": 337818, "epoch": 2010} {"train_loss": -12.516925811767578, "global_step": 337819, "epoch": 2010} {"train_loss": -12.258721351623535, "global_step": 337820, "epoch": 2010} {"train_loss": -12.462017059326172, "global_step": 337821, "epoch": 2010} {"train_loss": -12.357890129089355, "global_step": 337822, "epoch": 2010} {"train_loss": -12.503785133361816, "global_step": 337823, "epoch": 2010} {"train_loss": -12.382074356079102, "global_step": 337824, "epoch": 2010} {"train_loss": -12.200596809387207, "global_step": 337825, "epoch": 2010} {"train_loss": -12.259803771972656, "global_step": 337826, "epoch": 2010} {"train_loss": -12.35586929321289, "global_step": 337827, "epoch": 2010} {"train_loss": -12.243284225463867, "global_step": 337828, "epoch": 2010} {"train_loss": -12.412972450256348, "global_step": 337829, "epoch": 2010} {"train_loss": -12.343031883239746, "global_step": 337830, "epoch": 2010} {"train_loss": -12.546995162963867, "global_step": 337831, "epoch": 2010} {"train_loss": -12.409783363342285, "global_step": 337832, "epoch": 2010} {"train_loss": -12.534107208251953, "global_step": 337833, "epoch": 2010} {"train_loss": -12.364988327026367, "global_step": 337834, "epoch": 2010} {"train_loss": -12.341468811035156, "global_step": 337835, "epoch": 2010} {"train_loss": -12.54456901550293, "global_step": 337836, "epoch": 2010} {"train_loss": -12.480260848999023, "global_step": 337837, "epoch": 2010} {"train_loss": -12.54035758972168, "global_step": 337838, "epoch": 2010} {"train_loss": -12.507307052612305, "global_step": 337839, "epoch": 2010} {"train_loss": -12.523233413696289, "global_step": 337840, "epoch": 2010} {"train_loss": -12.502496719360352, "global_step": 337841, "epoch": 2010} {"train_loss": -12.642190933227539, "global_step": 337842, "epoch": 2010} {"train_loss": -12.469738006591797, "global_step": 337843, "epoch": 2010} {"train_loss": -12.472421646118164, "global_step": 337844, "epoch": 2010} {"train_loss": -12.529741287231445, "global_step": 337845, "epoch": 2010} {"train_loss": -12.679204940795898, "global_step": 337846, "epoch": 2010} {"train_loss": -11.938648973192487, "global_step": 337847, "epoch": 2010, "val_loss": 290193.71875, "train_action_mse_error": 1.2980570793151855} {"train_loss": -12.49254035949707, "global_step": 337848, "epoch": 2011} {"train_loss": -12.693243980407715, "global_step": 337849, "epoch": 2011} {"train_loss": -12.667078018188477, "global_step": 337850, "epoch": 2011} {"train_loss": -12.465697288513184, "global_step": 337851, "epoch": 2011} {"train_loss": -12.771150588989258, "global_step": 337852, "epoch": 2011} {"train_loss": -12.489128112792969, "global_step": 337853, "epoch": 2011} {"train_loss": -12.50015640258789, "global_step": 337854, "epoch": 2011} {"train_loss": -12.566264152526855, "global_step": 337855, "epoch": 2011} {"train_loss": -12.229936599731445, "global_step": 337856, "epoch": 2011} {"train_loss": -12.634383201599121, "global_step": 337857, "epoch": 2011} {"train_loss": -12.19717025756836, "global_step": 337858, "epoch": 2011} {"train_loss": -11.316604614257812, "global_step": 337859, "epoch": 2011} {"train_loss": -11.597620010375977, "global_step": 337860, "epoch": 2011} {"train_loss": -12.220464706420898, "global_step": 337861, "epoch": 2011} {"train_loss": -10.69762134552002, "global_step": 337862, "epoch": 2011} {"train_loss": -11.922452926635742, "global_step": 337863, "epoch": 2011} {"train_loss": -11.686405181884766, "global_step": 337864, "epoch": 2011} {"train_loss": -11.005670547485352, "global_step": 337865, "epoch": 2011} {"train_loss": -11.338134765625, "global_step": 337866, "epoch": 2011} {"train_loss": -10.683873176574707, "global_step": 337867, "epoch": 2011} {"train_loss": -11.354570388793945, "global_step": 337868, "epoch": 2011} {"train_loss": -11.621397018432617, "global_step": 337869, "epoch": 2011} {"train_loss": -11.271078109741211, "global_step": 337870, "epoch": 2011} {"train_loss": -11.25443172454834, "global_step": 337871, "epoch": 2011} {"train_loss": -12.131568908691406, "global_step": 337872, "epoch": 2011} {"train_loss": -11.515210151672363, "global_step": 337873, "epoch": 2011} {"train_loss": -12.403249740600586, "global_step": 337874, "epoch": 2011} {"train_loss": -11.571231842041016, "global_step": 337875, "epoch": 2011} {"train_loss": -12.131085395812988, "global_step": 337876, "epoch": 2011} {"train_loss": -11.630894660949707, "global_step": 337877, "epoch": 2011} {"train_loss": -11.725198745727539, "global_step": 337878, "epoch": 2011} {"train_loss": -11.839478492736816, "global_step": 337879, "epoch": 2011} {"train_loss": -11.585887908935547, "global_step": 337880, "epoch": 2011} {"train_loss": -12.612560272216797, "global_step": 337881, "epoch": 2011} {"train_loss": -11.590307235717773, "global_step": 337882, "epoch": 2011} {"train_loss": -11.924131393432617, "global_step": 337883, "epoch": 2011} {"train_loss": -12.086431503295898, "global_step": 337884, "epoch": 2011} {"train_loss": -11.581850051879883, "global_step": 337885, "epoch": 2011} {"train_loss": -12.38449478149414, "global_step": 337886, "epoch": 2011} {"train_loss": -12.022107124328613, "global_step": 337887, "epoch": 2011} {"train_loss": -11.960915565490723, "global_step": 337888, "epoch": 2011} {"train_loss": -12.137504577636719, "global_step": 337889, "epoch": 2011} {"train_loss": -11.700898170471191, "global_step": 337890, "epoch": 2011} {"train_loss": -12.27165699005127, "global_step": 337891, "epoch": 2011} {"train_loss": -11.889883041381836, "global_step": 337892, "epoch": 2011} {"train_loss": -12.015176773071289, "global_step": 337893, "epoch": 2011} {"train_loss": -12.112167358398438, "global_step": 337894, "epoch": 2011} {"train_loss": -11.660896301269531, "global_step": 337895, "epoch": 2011} {"train_loss": -12.271340370178223, "global_step": 337896, "epoch": 2011} {"train_loss": -11.158112525939941, "global_step": 337897, "epoch": 2011} {"train_loss": -11.993209838867188, "global_step": 337898, "epoch": 2011} {"train_loss": -11.86093521118164, "global_step": 337899, "epoch": 2011} {"train_loss": -11.776805877685547, "global_step": 337900, "epoch": 2011} {"train_loss": -12.448530197143555, "global_step": 337901, "epoch": 2011} {"train_loss": -11.915604591369629, "global_step": 337902, "epoch": 2011} {"train_loss": -12.298799514770508, "global_step": 337903, "epoch": 2011} {"train_loss": -12.313713073730469, "global_step": 337904, "epoch": 2011} {"train_loss": -12.307615280151367, "global_step": 337905, "epoch": 2011} {"train_loss": -12.407600402832031, "global_step": 337906, "epoch": 2011} {"train_loss": -12.113502502441406, "global_step": 337907, "epoch": 2011} {"train_loss": -12.477555274963379, "global_step": 337908, "epoch": 2011} {"train_loss": -11.779783248901367, "global_step": 337909, "epoch": 2011} {"train_loss": -11.928720474243164, "global_step": 337910, "epoch": 2011} {"train_loss": -12.187995910644531, "global_step": 337911, "epoch": 2011} {"train_loss": -12.04826831817627, "global_step": 337912, "epoch": 2011} {"train_loss": -12.048700332641602, "global_step": 337913, "epoch": 2011} {"train_loss": -12.45823860168457, "global_step": 337914, "epoch": 2011} {"train_loss": -12.037843704223633, "global_step": 337915, "epoch": 2011} {"train_loss": -12.318276405334473, "global_step": 337916, "epoch": 2011} {"train_loss": -12.184205055236816, "global_step": 337917, "epoch": 2011} {"train_loss": -12.07471752166748, "global_step": 337918, "epoch": 2011} {"train_loss": -12.07182502746582, "global_step": 337919, "epoch": 2011} {"train_loss": -12.218151092529297, "global_step": 337920, "epoch": 2011} {"train_loss": -12.16370964050293, "global_step": 337921, "epoch": 2011} {"train_loss": -11.346094131469727, "global_step": 337922, "epoch": 2011} {"train_loss": -11.969318389892578, "global_step": 337923, "epoch": 2011} {"train_loss": -12.415016174316406, "global_step": 337924, "epoch": 2011} {"train_loss": -12.081865310668945, "global_step": 337925, "epoch": 2011} {"train_loss": -12.137375831604004, "global_step": 337926, "epoch": 2011} {"train_loss": -11.868948936462402, "global_step": 337927, "epoch": 2011} {"train_loss": -12.123753547668457, "global_step": 337928, "epoch": 2011} {"train_loss": -11.652238845825195, "global_step": 337929, "epoch": 2011} {"train_loss": -12.326741218566895, "global_step": 337930, "epoch": 2011} {"train_loss": -12.200191497802734, "global_step": 337931, "epoch": 2011} {"train_loss": -11.213888168334961, "global_step": 337932, "epoch": 2011} {"train_loss": -11.67531967163086, "global_step": 337933, "epoch": 2011} {"train_loss": -12.094457626342773, "global_step": 337934, "epoch": 2011} {"train_loss": -11.782495498657227, "global_step": 337935, "epoch": 2011} {"train_loss": -11.73315143585205, "global_step": 337936, "epoch": 2011} {"train_loss": -12.195176124572754, "global_step": 337937, "epoch": 2011} {"train_loss": -12.096893310546875, "global_step": 337938, "epoch": 2011} {"train_loss": -11.93034553527832, "global_step": 337939, "epoch": 2011} {"train_loss": -11.719574928283691, "global_step": 337940, "epoch": 2011} {"train_loss": -12.04466724395752, "global_step": 337941, "epoch": 2011} {"train_loss": -10.853032112121582, "global_step": 337942, "epoch": 2011} {"train_loss": -11.793899536132812, "global_step": 337943, "epoch": 2011} {"train_loss": -11.660940170288086, "global_step": 337944, "epoch": 2011} {"train_loss": -11.746712684631348, "global_step": 337945, "epoch": 2011} {"train_loss": -12.173381805419922, "global_step": 337946, "epoch": 2011} {"train_loss": -11.996734619140625, "global_step": 337947, "epoch": 2011} {"train_loss": -11.869491577148438, "global_step": 337948, "epoch": 2011} {"train_loss": -11.807184219360352, "global_step": 337949, "epoch": 2011} {"train_loss": -12.471658706665039, "global_step": 337950, "epoch": 2011} {"train_loss": -11.581408500671387, "global_step": 337951, "epoch": 2011} {"train_loss": -11.944982528686523, "global_step": 337952, "epoch": 2011} {"train_loss": -12.305524826049805, "global_step": 337953, "epoch": 2011} {"train_loss": -11.735139846801758, "global_step": 337954, "epoch": 2011} {"train_loss": -12.276503562927246, "global_step": 337955, "epoch": 2011} {"train_loss": -12.003297805786133, "global_step": 337956, "epoch": 2011} {"train_loss": -11.543161392211914, "global_step": 337957, "epoch": 2011} {"train_loss": -12.19619083404541, "global_step": 337958, "epoch": 2011} {"train_loss": -11.847467422485352, "global_step": 337959, "epoch": 2011} {"train_loss": -12.234343528747559, "global_step": 337960, "epoch": 2011} {"train_loss": -12.264307022094727, "global_step": 337961, "epoch": 2011} {"train_loss": -11.869548797607422, "global_step": 337962, "epoch": 2011} {"train_loss": -12.255345344543457, "global_step": 337963, "epoch": 2011} {"train_loss": -11.36931037902832, "global_step": 337964, "epoch": 2011} {"train_loss": -11.260703086853027, "global_step": 337965, "epoch": 2011} {"train_loss": -11.992256164550781, "global_step": 337966, "epoch": 2011} {"train_loss": -11.95885944366455, "global_step": 337967, "epoch": 2011} {"train_loss": -12.348767280578613, "global_step": 337968, "epoch": 2011} {"train_loss": -12.269355773925781, "global_step": 337969, "epoch": 2011} {"train_loss": -12.162748336791992, "global_step": 337970, "epoch": 2011} {"train_loss": -12.010204315185547, "global_step": 337971, "epoch": 2011} {"train_loss": -12.155906677246094, "global_step": 337972, "epoch": 2011} {"train_loss": -12.119285583496094, "global_step": 337973, "epoch": 2011} {"train_loss": -12.081987380981445, "global_step": 337974, "epoch": 2011} {"train_loss": -12.25506591796875, "global_step": 337975, "epoch": 2011} {"train_loss": -12.238289833068848, "global_step": 337976, "epoch": 2011} {"train_loss": -12.469725608825684, "global_step": 337977, "epoch": 2011} {"train_loss": -11.750240325927734, "global_step": 337978, "epoch": 2011} {"train_loss": -11.438948631286621, "global_step": 337979, "epoch": 2011} {"train_loss": -12.403181076049805, "global_step": 337980, "epoch": 2011} {"train_loss": -11.63769817352295, "global_step": 337981, "epoch": 2011} {"train_loss": -11.95773696899414, "global_step": 337982, "epoch": 2011} {"train_loss": -12.304374694824219, "global_step": 337983, "epoch": 2011} {"train_loss": -12.186141967773438, "global_step": 337984, "epoch": 2011} {"train_loss": -12.25118637084961, "global_step": 337985, "epoch": 2011} {"train_loss": -12.214860916137695, "global_step": 337986, "epoch": 2011} {"train_loss": -12.21483325958252, "global_step": 337987, "epoch": 2011} {"train_loss": -12.371009826660156, "global_step": 337988, "epoch": 2011} {"train_loss": -12.261850357055664, "global_step": 337989, "epoch": 2011} {"train_loss": -12.159936904907227, "global_step": 337990, "epoch": 2011} {"train_loss": -12.413658142089844, "global_step": 337991, "epoch": 2011} {"train_loss": -12.205764770507812, "global_step": 337992, "epoch": 2011} {"train_loss": -12.329007148742676, "global_step": 337993, "epoch": 2011} {"train_loss": -12.19051742553711, "global_step": 337994, "epoch": 2011} {"train_loss": -12.18979549407959, "global_step": 337995, "epoch": 2011} {"train_loss": -12.061507225036621, "global_step": 337996, "epoch": 2011} {"train_loss": -12.363428115844727, "global_step": 337997, "epoch": 2011} {"train_loss": -12.487797737121582, "global_step": 337998, "epoch": 2011} {"train_loss": -11.965543746948242, "global_step": 337999, "epoch": 2011} {"train_loss": -11.774298667907715, "global_step": 338000, "epoch": 2011} {"train_loss": -12.253721237182617, "global_step": 338001, "epoch": 2011} {"train_loss": -11.814388275146484, "global_step": 338002, "epoch": 2011} {"train_loss": -11.926143646240234, "global_step": 338003, "epoch": 2011} {"train_loss": -11.945634841918945, "global_step": 338004, "epoch": 2011} {"train_loss": -12.401379585266113, "global_step": 338005, "epoch": 2011} {"train_loss": -11.63451862335205, "global_step": 338006, "epoch": 2011} {"train_loss": -11.991728782653809, "global_step": 338007, "epoch": 2011} {"train_loss": -12.255026817321777, "global_step": 338008, "epoch": 2011} {"train_loss": -12.034263610839844, "global_step": 338009, "epoch": 2011} {"train_loss": -12.225297927856445, "global_step": 338010, "epoch": 2011} {"train_loss": -12.351676940917969, "global_step": 338011, "epoch": 2011} {"train_loss": -12.242730140686035, "global_step": 338012, "epoch": 2011} {"train_loss": -12.350674629211426, "global_step": 338013, "epoch": 2011} {"train_loss": -12.329927444458008, "global_step": 338014, "epoch": 2011} {"train_loss": -12.01050128823235, "global_step": 338015, "epoch": 2011, "val_loss": 288483.03125} {"train_loss": -12.047106742858887, "global_step": 338016, "epoch": 2012} {"train_loss": -12.353252410888672, "global_step": 338017, "epoch": 2012} {"train_loss": -11.989834785461426, "global_step": 338018, "epoch": 2012} {"train_loss": -11.44442367553711, "global_step": 338019, "epoch": 2012} {"train_loss": -11.48458480834961, "global_step": 338020, "epoch": 2012} {"train_loss": -12.420614242553711, "global_step": 338021, "epoch": 2012} {"train_loss": -11.40668773651123, "global_step": 338022, "epoch": 2012} {"train_loss": -11.929276466369629, "global_step": 338023, "epoch": 2012} {"train_loss": -11.523118019104004, "global_step": 338024, "epoch": 2012} {"train_loss": -11.607332229614258, "global_step": 338025, "epoch": 2012} {"train_loss": -11.455106735229492, "global_step": 338026, "epoch": 2012} {"train_loss": -12.021930694580078, "global_step": 338027, "epoch": 2012} {"train_loss": -11.175944328308105, "global_step": 338028, "epoch": 2012} {"train_loss": -11.65411376953125, "global_step": 338029, "epoch": 2012} {"train_loss": -11.095535278320312, "global_step": 338030, "epoch": 2012} {"train_loss": -12.01015853881836, "global_step": 338031, "epoch": 2012} {"train_loss": -11.045454025268555, "global_step": 338032, "epoch": 2012} {"train_loss": -11.373809814453125, "global_step": 338033, "epoch": 2012} {"train_loss": -12.172415733337402, "global_step": 338034, "epoch": 2012} {"train_loss": -11.468387603759766, "global_step": 338035, "epoch": 2012} {"train_loss": -11.667723655700684, "global_step": 338036, "epoch": 2012} {"train_loss": -12.060623168945312, "global_step": 338037, "epoch": 2012} {"train_loss": -11.888166427612305, "global_step": 338038, "epoch": 2012} {"train_loss": -12.16065788269043, "global_step": 338039, "epoch": 2012} {"train_loss": -11.744277954101562, "global_step": 338040, "epoch": 2012} {"train_loss": -12.113934516906738, "global_step": 338041, "epoch": 2012} {"train_loss": -11.832682609558105, "global_step": 338042, "epoch": 2012} {"train_loss": -12.006942749023438, "global_step": 338043, "epoch": 2012} {"train_loss": -11.920717239379883, "global_step": 338044, "epoch": 2012} {"train_loss": -12.095317840576172, "global_step": 338045, "epoch": 2012} {"train_loss": -11.981231689453125, "global_step": 338046, "epoch": 2012} {"train_loss": -12.361776351928711, "global_step": 338047, "epoch": 2012} {"train_loss": -11.874900817871094, "global_step": 338048, "epoch": 2012} {"train_loss": -12.187572479248047, "global_step": 338049, "epoch": 2012} {"train_loss": -11.340560913085938, "global_step": 338050, "epoch": 2012} {"train_loss": -12.11857795715332, "global_step": 338051, "epoch": 2012} {"train_loss": -11.682218551635742, "global_step": 338052, "epoch": 2012} {"train_loss": -11.516515731811523, "global_step": 338053, "epoch": 2012} {"train_loss": -12.139841079711914, "global_step": 338054, "epoch": 2012} {"train_loss": -11.689424514770508, "global_step": 338055, "epoch": 2012} {"train_loss": -11.777312278747559, "global_step": 338056, "epoch": 2012} {"train_loss": -11.478837966918945, "global_step": 338057, "epoch": 2012} {"train_loss": -12.089559555053711, "global_step": 338058, "epoch": 2012} {"train_loss": -11.754508972167969, "global_step": 338059, "epoch": 2012} {"train_loss": -11.412665367126465, "global_step": 338060, "epoch": 2012} {"train_loss": -11.294716835021973, "global_step": 338061, "epoch": 2012} {"train_loss": -12.060041427612305, "global_step": 338062, "epoch": 2012} {"train_loss": -11.76140308380127, "global_step": 338063, "epoch": 2012} {"train_loss": -11.462789535522461, "global_step": 338064, "epoch": 2012} {"train_loss": -12.307880401611328, "global_step": 338065, "epoch": 2012} {"train_loss": -11.528068542480469, "global_step": 338066, "epoch": 2012} {"train_loss": -12.062267303466797, "global_step": 338067, "epoch": 2012} {"train_loss": -12.140886306762695, "global_step": 338068, "epoch": 2012} {"train_loss": -12.14107608795166, "global_step": 338069, "epoch": 2012} {"train_loss": -12.170734405517578, "global_step": 338070, "epoch": 2012} {"train_loss": -11.913000106811523, "global_step": 338071, "epoch": 2012} {"train_loss": -12.359046936035156, "global_step": 338072, "epoch": 2012} {"train_loss": -12.131855010986328, "global_step": 338073, "epoch": 2012} {"train_loss": -12.314855575561523, "global_step": 338074, "epoch": 2012} {"train_loss": -11.75765609741211, "global_step": 338075, "epoch": 2012} {"train_loss": -12.339521408081055, "global_step": 338076, "epoch": 2012} {"train_loss": -12.08216667175293, "global_step": 338077, "epoch": 2012} {"train_loss": -11.935832023620605, "global_step": 338078, "epoch": 2012} {"train_loss": -12.300738334655762, "global_step": 338079, "epoch": 2012} {"train_loss": -11.679058074951172, "global_step": 338080, "epoch": 2012} {"train_loss": -12.36258316040039, "global_step": 338081, "epoch": 2012} {"train_loss": -11.695535659790039, "global_step": 338082, "epoch": 2012} {"train_loss": -12.299938201904297, "global_step": 338083, "epoch": 2012} {"train_loss": -12.190716743469238, "global_step": 338084, "epoch": 2012} {"train_loss": -12.506359100341797, "global_step": 338085, "epoch": 2012} {"train_loss": -12.214035034179688, "global_step": 338086, "epoch": 2012} {"train_loss": -12.086080551147461, "global_step": 338087, "epoch": 2012} {"train_loss": -12.118058204650879, "global_step": 338088, "epoch": 2012} {"train_loss": -12.318918228149414, "global_step": 338089, "epoch": 2012} {"train_loss": -12.00093936920166, "global_step": 338090, "epoch": 2012} {"train_loss": -12.217643737792969, "global_step": 338091, "epoch": 2012} {"train_loss": -12.325981140136719, "global_step": 338092, "epoch": 2012} {"train_loss": -12.123048782348633, "global_step": 338093, "epoch": 2012} {"train_loss": -12.353425979614258, "global_step": 338094, "epoch": 2012} {"train_loss": -12.40103816986084, "global_step": 338095, "epoch": 2012} {"train_loss": -12.560735702514648, "global_step": 338096, "epoch": 2012} {"train_loss": -12.19102954864502, "global_step": 338097, "epoch": 2012} {"train_loss": -12.211097717285156, "global_step": 338098, "epoch": 2012} {"train_loss": -12.312477111816406, "global_step": 338099, "epoch": 2012} {"train_loss": -12.230571746826172, "global_step": 338100, "epoch": 2012} {"train_loss": -12.50475025177002, "global_step": 338101, "epoch": 2012} {"train_loss": -12.217432022094727, "global_step": 338102, "epoch": 2012} {"train_loss": -12.349363327026367, "global_step": 338103, "epoch": 2012} {"train_loss": -12.229562759399414, "global_step": 338104, "epoch": 2012} {"train_loss": -12.683185577392578, "global_step": 338105, "epoch": 2012} {"train_loss": -12.443117141723633, "global_step": 338106, "epoch": 2012} {"train_loss": -12.239767074584961, "global_step": 338107, "epoch": 2012} {"train_loss": -12.212282180786133, "global_step": 338108, "epoch": 2012} {"train_loss": -12.201698303222656, "global_step": 338109, "epoch": 2012} {"train_loss": -12.143719673156738, "global_step": 338110, "epoch": 2012} {"train_loss": -12.267285346984863, "global_step": 338111, "epoch": 2012} {"train_loss": -12.475982666015625, "global_step": 338112, "epoch": 2012} {"train_loss": -12.361089706420898, "global_step": 338113, "epoch": 2012} {"train_loss": -12.470571517944336, "global_step": 338114, "epoch": 2012} {"train_loss": -12.491430282592773, "global_step": 338115, "epoch": 2012} {"train_loss": -12.263310432434082, "global_step": 338116, "epoch": 2012} {"train_loss": -12.390649795532227, "global_step": 338117, "epoch": 2012} {"train_loss": -11.980570793151855, "global_step": 338118, "epoch": 2012} {"train_loss": -11.497598648071289, "global_step": 338119, "epoch": 2012} {"train_loss": -11.988851547241211, "global_step": 338120, "epoch": 2012} {"train_loss": -11.439658164978027, "global_step": 338121, "epoch": 2012} {"train_loss": -11.708208084106445, "global_step": 338122, "epoch": 2012} {"train_loss": -12.389928817749023, "global_step": 338123, "epoch": 2012} {"train_loss": -11.357680320739746, "global_step": 338124, "epoch": 2012} {"train_loss": -12.216720581054688, "global_step": 338125, "epoch": 2012} {"train_loss": -11.815340042114258, "global_step": 338126, "epoch": 2012} {"train_loss": -12.423166275024414, "global_step": 338127, "epoch": 2012} {"train_loss": -11.93929672241211, "global_step": 338128, "epoch": 2012} {"train_loss": -12.076988220214844, "global_step": 338129, "epoch": 2012} {"train_loss": -11.8688383102417, "global_step": 338130, "epoch": 2012} {"train_loss": -12.620987892150879, "global_step": 338131, "epoch": 2012} {"train_loss": -11.79493522644043, "global_step": 338132, "epoch": 2012} {"train_loss": -12.343080520629883, "global_step": 338133, "epoch": 2012} {"train_loss": -12.284311294555664, "global_step": 338134, "epoch": 2012} {"train_loss": -11.982131958007812, "global_step": 338135, "epoch": 2012} {"train_loss": -12.454774856567383, "global_step": 338136, "epoch": 2012} {"train_loss": -12.348276138305664, "global_step": 338137, "epoch": 2012} {"train_loss": -12.040453910827637, "global_step": 338138, "epoch": 2012} {"train_loss": -12.257789611816406, "global_step": 338139, "epoch": 2012} {"train_loss": -11.617810249328613, "global_step": 338140, "epoch": 2012} {"train_loss": -11.66397476196289, "global_step": 338141, "epoch": 2012} {"train_loss": -11.940500259399414, "global_step": 338142, "epoch": 2012} {"train_loss": -12.073530197143555, "global_step": 338143, "epoch": 2012} {"train_loss": -12.496307373046875, "global_step": 338144, "epoch": 2012} {"train_loss": -12.196887969970703, "global_step": 338145, "epoch": 2012} {"train_loss": -12.204222679138184, "global_step": 338146, "epoch": 2012} {"train_loss": -12.103779792785645, "global_step": 338147, "epoch": 2012} {"train_loss": -11.775463104248047, "global_step": 338148, "epoch": 2012} {"train_loss": -11.90713882446289, "global_step": 338149, "epoch": 2012} {"train_loss": -11.911235809326172, "global_step": 338150, "epoch": 2012} {"train_loss": -12.174591064453125, "global_step": 338151, "epoch": 2012} {"train_loss": -12.03429126739502, "global_step": 338152, "epoch": 2012} {"train_loss": -12.131673812866211, "global_step": 338153, "epoch": 2012} {"train_loss": -12.331952095031738, "global_step": 338154, "epoch": 2012} {"train_loss": -12.30848503112793, "global_step": 338155, "epoch": 2012} {"train_loss": -11.897506713867188, "global_step": 338156, "epoch": 2012} {"train_loss": -12.45334243774414, "global_step": 338157, "epoch": 2012} {"train_loss": -12.454549789428711, "global_step": 338158, "epoch": 2012} {"train_loss": -12.195047378540039, "global_step": 338159, "epoch": 2012} {"train_loss": -12.643787384033203, "global_step": 338160, "epoch": 2012} {"train_loss": -12.336380004882812, "global_step": 338161, "epoch": 2012} {"train_loss": -12.509847640991211, "global_step": 338162, "epoch": 2012} {"train_loss": -12.549038887023926, "global_step": 338163, "epoch": 2012} {"train_loss": -12.523711204528809, "global_step": 338164, "epoch": 2012} {"train_loss": -12.264967918395996, "global_step": 338165, "epoch": 2012} {"train_loss": -12.4974365234375, "global_step": 338166, "epoch": 2012} {"train_loss": -12.331340789794922, "global_step": 338167, "epoch": 2012} {"train_loss": -12.513891220092773, "global_step": 338168, "epoch": 2012} {"train_loss": -12.328571319580078, "global_step": 338169, "epoch": 2012} {"train_loss": -12.484067916870117, "global_step": 338170, "epoch": 2012} {"train_loss": -12.41241455078125, "global_step": 338171, "epoch": 2012} {"train_loss": -12.731792449951172, "global_step": 338172, "epoch": 2012} {"train_loss": -12.488191604614258, "global_step": 338173, "epoch": 2012} {"train_loss": -12.681619644165039, "global_step": 338174, "epoch": 2012} {"train_loss": -12.603704452514648, "global_step": 338175, "epoch": 2012} {"train_loss": -12.50883674621582, "global_step": 338176, "epoch": 2012} {"train_loss": -12.293306350708008, "global_step": 338177, "epoch": 2012} {"train_loss": -12.234487533569336, "global_step": 338178, "epoch": 2012} {"train_loss": -12.399368286132812, "global_step": 338179, "epoch": 2012} {"train_loss": -12.328409194946289, "global_step": 338180, "epoch": 2012} {"train_loss": -11.158732414245605, "global_step": 338181, "epoch": 2012} {"train_loss": -11.879955291748047, "global_step": 338182, "epoch": 2012} {"train_loss": -12.07194869858878, "global_step": 338183, "epoch": 2012, "val_loss": 289660.1875} {"train_loss": -11.1611967086792, "global_step": 338184, "epoch": 2013} {"train_loss": -12.018009185791016, "global_step": 338185, "epoch": 2013} {"train_loss": -11.254000663757324, "global_step": 338186, "epoch": 2013} {"train_loss": -11.185195922851562, "global_step": 338187, "epoch": 2013} {"train_loss": -10.03040885925293, "global_step": 338188, "epoch": 2013} {"train_loss": -12.354297637939453, "global_step": 338189, "epoch": 2013} {"train_loss": -9.92770767211914, "global_step": 338190, "epoch": 2013} {"train_loss": -10.903532028198242, "global_step": 338191, "epoch": 2013} {"train_loss": -10.490411758422852, "global_step": 338192, "epoch": 2013} {"train_loss": -10.425369262695312, "global_step": 338193, "epoch": 2013} {"train_loss": -11.608864784240723, "global_step": 338194, "epoch": 2013} {"train_loss": -9.773056983947754, "global_step": 338195, "epoch": 2013} {"train_loss": -10.30695915222168, "global_step": 338196, "epoch": 2013} {"train_loss": -11.604116439819336, "global_step": 338197, "epoch": 2013} {"train_loss": -10.81119441986084, "global_step": 338198, "epoch": 2013} {"train_loss": -11.548620223999023, "global_step": 338199, "epoch": 2013} {"train_loss": -9.833141326904297, "global_step": 338200, "epoch": 2013} {"train_loss": -9.339386940002441, "global_step": 338201, "epoch": 2013} {"train_loss": -10.826196670532227, "global_step": 338202, "epoch": 2013} {"train_loss": -10.795324325561523, "global_step": 338203, "epoch": 2013} {"train_loss": -8.664779663085938, "global_step": 338204, "epoch": 2013} {"train_loss": -11.670876502990723, "global_step": 338205, "epoch": 2013} {"train_loss": -8.309465408325195, "global_step": 338206, "epoch": 2013} {"train_loss": -9.514991760253906, "global_step": 338207, "epoch": 2013} {"train_loss": -9.449270248413086, "global_step": 338208, "epoch": 2013} {"train_loss": -10.65593147277832, "global_step": 338209, "epoch": 2013} {"train_loss": -9.091078758239746, "global_step": 338210, "epoch": 2013} {"train_loss": -10.341544151306152, "global_step": 338211, "epoch": 2013} {"train_loss": -7.882107734680176, "global_step": 338212, "epoch": 2013} {"train_loss": -9.525408744812012, "global_step": 338213, "epoch": 2013} {"train_loss": -7.786221981048584, "global_step": 338214, "epoch": 2013} {"train_loss": -8.212299346923828, "global_step": 338215, "epoch": 2013} {"train_loss": -10.26753044128418, "global_step": 338216, "epoch": 2013} {"train_loss": -10.426267623901367, "global_step": 338217, "epoch": 2013} {"train_loss": -8.889106750488281, "global_step": 338218, "epoch": 2013} {"train_loss": -9.514467239379883, "global_step": 338219, "epoch": 2013} {"train_loss": -11.116419792175293, "global_step": 338220, "epoch": 2013} {"train_loss": -9.422658920288086, "global_step": 338221, "epoch": 2013} {"train_loss": -9.168521881103516, "global_step": 338222, "epoch": 2013} {"train_loss": -11.187320709228516, "global_step": 338223, "epoch": 2013} {"train_loss": -10.915414810180664, "global_step": 338224, "epoch": 2013} {"train_loss": -9.939266204833984, "global_step": 338225, "epoch": 2013} {"train_loss": -10.029413223266602, "global_step": 338226, "epoch": 2013} {"train_loss": -11.488236427307129, "global_step": 338227, "epoch": 2013} {"train_loss": -10.608206748962402, "global_step": 338228, "epoch": 2013} {"train_loss": -10.28244400024414, "global_step": 338229, "epoch": 2013} {"train_loss": -11.199190139770508, "global_step": 338230, "epoch": 2013} {"train_loss": -10.841100692749023, "global_step": 338231, "epoch": 2013} {"train_loss": -10.58635139465332, "global_step": 338232, "epoch": 2013} {"train_loss": -11.752604484558105, "global_step": 338233, "epoch": 2013} {"train_loss": -10.943458557128906, "global_step": 338234, "epoch": 2013} {"train_loss": -10.937623977661133, "global_step": 338235, "epoch": 2013} {"train_loss": -11.519866943359375, "global_step": 338236, "epoch": 2013} {"train_loss": -11.228797912597656, "global_step": 338237, "epoch": 2013} {"train_loss": -11.490388870239258, "global_step": 338238, "epoch": 2013} {"train_loss": -11.17035961151123, "global_step": 338239, "epoch": 2013} {"train_loss": -11.913094520568848, "global_step": 338240, "epoch": 2013} {"train_loss": -11.016437530517578, "global_step": 338241, "epoch": 2013} {"train_loss": -11.802398681640625, "global_step": 338242, "epoch": 2013} {"train_loss": -11.543720245361328, "global_step": 338243, "epoch": 2013} {"train_loss": -11.297404289245605, "global_step": 338244, "epoch": 2013} {"train_loss": -11.761707305908203, "global_step": 338245, "epoch": 2013} {"train_loss": -11.503856658935547, "global_step": 338246, "epoch": 2013} {"train_loss": -11.902262687683105, "global_step": 338247, "epoch": 2013} {"train_loss": -11.83434009552002, "global_step": 338248, "epoch": 2013} {"train_loss": -11.723666191101074, "global_step": 338249, "epoch": 2013} {"train_loss": -11.812350273132324, "global_step": 338250, "epoch": 2013} {"train_loss": -11.575187683105469, "global_step": 338251, "epoch": 2013} {"train_loss": -11.978014945983887, "global_step": 338252, "epoch": 2013} {"train_loss": -11.847269058227539, "global_step": 338253, "epoch": 2013} {"train_loss": -11.925442695617676, "global_step": 338254, "epoch": 2013} {"train_loss": -11.910856246948242, "global_step": 338255, "epoch": 2013} {"train_loss": -12.136191368103027, "global_step": 338256, "epoch": 2013} {"train_loss": -11.768976211547852, "global_step": 338257, "epoch": 2013} {"train_loss": -12.102975845336914, "global_step": 338258, "epoch": 2013} {"train_loss": -12.128294944763184, "global_step": 338259, "epoch": 2013} {"train_loss": -12.058612823486328, "global_step": 338260, "epoch": 2013} {"train_loss": -12.090336799621582, "global_step": 338261, "epoch": 2013} {"train_loss": -11.954235076904297, "global_step": 338262, "epoch": 2013} {"train_loss": -12.171204566955566, "global_step": 338263, "epoch": 2013} {"train_loss": -12.008598327636719, "global_step": 338264, "epoch": 2013} {"train_loss": -12.06913948059082, "global_step": 338265, "epoch": 2013} {"train_loss": -12.102521896362305, "global_step": 338266, "epoch": 2013} {"train_loss": -12.170431137084961, "global_step": 338267, "epoch": 2013} {"train_loss": -12.181581497192383, "global_step": 338268, "epoch": 2013} {"train_loss": -12.06591796875, "global_step": 338269, "epoch": 2013} {"train_loss": -12.08966064453125, "global_step": 338270, "epoch": 2013} {"train_loss": -12.13078498840332, "global_step": 338271, "epoch": 2013} {"train_loss": -12.139513969421387, "global_step": 338272, "epoch": 2013} {"train_loss": -12.126626968383789, "global_step": 338273, "epoch": 2013} {"train_loss": -12.276613235473633, "global_step": 338274, "epoch": 2013} {"train_loss": -12.201070785522461, "global_step": 338275, "epoch": 2013} {"train_loss": -12.055334091186523, "global_step": 338276, "epoch": 2013} {"train_loss": -12.310718536376953, "global_step": 338277, "epoch": 2013} {"train_loss": -12.380439758300781, "global_step": 338278, "epoch": 2013} {"train_loss": -12.287243843078613, "global_step": 338279, "epoch": 2013} {"train_loss": -12.280033111572266, "global_step": 338280, "epoch": 2013} {"train_loss": -12.43022346496582, "global_step": 338281, "epoch": 2013} {"train_loss": -12.347596168518066, "global_step": 338282, "epoch": 2013} {"train_loss": -12.289243698120117, "global_step": 338283, "epoch": 2013} {"train_loss": -12.366310119628906, "global_step": 338284, "epoch": 2013} {"train_loss": -12.412247657775879, "global_step": 338285, "epoch": 2013} {"train_loss": -12.3802490234375, "global_step": 338286, "epoch": 2013} {"train_loss": -12.453959465026855, "global_step": 338287, "epoch": 2013} {"train_loss": -12.443948745727539, "global_step": 338288, "epoch": 2013} {"train_loss": -12.472989082336426, "global_step": 338289, "epoch": 2013} {"train_loss": -12.44330883026123, "global_step": 338290, "epoch": 2013} {"train_loss": -12.437989234924316, "global_step": 338291, "epoch": 2013} {"train_loss": -12.291797637939453, "global_step": 338292, "epoch": 2013} {"train_loss": -12.467510223388672, "global_step": 338293, "epoch": 2013} {"train_loss": -12.503912925720215, "global_step": 338294, "epoch": 2013} {"train_loss": -12.381148338317871, "global_step": 338295, "epoch": 2013} {"train_loss": -12.336742401123047, "global_step": 338296, "epoch": 2013} {"train_loss": -12.486749649047852, "global_step": 338297, "epoch": 2013} {"train_loss": -12.534219741821289, "global_step": 338298, "epoch": 2013} {"train_loss": -12.446147918701172, "global_step": 338299, "epoch": 2013} {"train_loss": -12.718868255615234, "global_step": 338300, "epoch": 2013} {"train_loss": -12.421684265136719, "global_step": 338301, "epoch": 2013} {"train_loss": -12.6146821975708, "global_step": 338302, "epoch": 2013} {"train_loss": -12.595541954040527, "global_step": 338303, "epoch": 2013} {"train_loss": -12.597293853759766, "global_step": 338304, "epoch": 2013} {"train_loss": -12.396728515625, "global_step": 338305, "epoch": 2013} {"train_loss": -12.61281967163086, "global_step": 338306, "epoch": 2013} {"train_loss": -12.40705394744873, "global_step": 338307, "epoch": 2013} {"train_loss": -12.604887962341309, "global_step": 338308, "epoch": 2013} {"train_loss": -12.41908073425293, "global_step": 338309, "epoch": 2013} {"train_loss": -12.669746398925781, "global_step": 338310, "epoch": 2013} {"train_loss": -12.411616325378418, "global_step": 338311, "epoch": 2013} {"train_loss": -12.650233268737793, "global_step": 338312, "epoch": 2013} {"train_loss": -12.201783180236816, "global_step": 338313, "epoch": 2013} {"train_loss": -12.734251022338867, "global_step": 338314, "epoch": 2013} {"train_loss": -12.305356979370117, "global_step": 338315, "epoch": 2013} {"train_loss": -12.555557250976562, "global_step": 338316, "epoch": 2013} {"train_loss": -12.593534469604492, "global_step": 338317, "epoch": 2013} {"train_loss": -12.671160697937012, "global_step": 338318, "epoch": 2013} {"train_loss": -12.460234642028809, "global_step": 338319, "epoch": 2013} {"train_loss": -12.646591186523438, "global_step": 338320, "epoch": 2013} {"train_loss": -12.036486625671387, "global_step": 338321, "epoch": 2013} {"train_loss": -12.444086074829102, "global_step": 338322, "epoch": 2013} {"train_loss": -12.585749626159668, "global_step": 338323, "epoch": 2013} {"train_loss": -12.171104431152344, "global_step": 338324, "epoch": 2013} {"train_loss": -11.980438232421875, "global_step": 338325, "epoch": 2013} {"train_loss": -11.32433032989502, "global_step": 338326, "epoch": 2013} {"train_loss": -11.973611831665039, "global_step": 338327, "epoch": 2013} {"train_loss": -10.441707611083984, "global_step": 338328, "epoch": 2013} {"train_loss": -11.46005630493164, "global_step": 338329, "epoch": 2013} {"train_loss": -10.9430513381958, "global_step": 338330, "epoch": 2013} {"train_loss": -12.030387878417969, "global_step": 338331, "epoch": 2013} {"train_loss": -10.966381072998047, "global_step": 338332, "epoch": 2013} {"train_loss": -11.404333114624023, "global_step": 338333, "epoch": 2013} {"train_loss": -12.05839729309082, "global_step": 338334, "epoch": 2013} {"train_loss": -11.05499267578125, "global_step": 338335, "epoch": 2013} {"train_loss": -12.011764526367188, "global_step": 338336, "epoch": 2013} {"train_loss": -11.588298797607422, "global_step": 338337, "epoch": 2013} {"train_loss": -11.51838493347168, "global_step": 338338, "epoch": 2013} {"train_loss": -10.55082893371582, "global_step": 338339, "epoch": 2013} {"train_loss": -12.134369850158691, "global_step": 338340, "epoch": 2013} {"train_loss": -10.839394569396973, "global_step": 338341, "epoch": 2013} {"train_loss": -11.758115768432617, "global_step": 338342, "epoch": 2013} {"train_loss": -11.109052658081055, "global_step": 338343, "epoch": 2013} {"train_loss": -11.274714469909668, "global_step": 338344, "epoch": 2013} {"train_loss": -11.72685432434082, "global_step": 338345, "epoch": 2013} {"train_loss": -11.2786865234375, "global_step": 338346, "epoch": 2013} {"train_loss": -11.834832191467285, "global_step": 338347, "epoch": 2013} {"train_loss": -11.131156921386719, "global_step": 338348, "epoch": 2013} {"train_loss": -11.44102668762207, "global_step": 338349, "epoch": 2013} {"train_loss": -11.763121604919434, "global_step": 338350, "epoch": 2013} {"train_loss": -11.487504280748821, "global_step": 338351, "epoch": 2013, "val_loss": 282612.75} {"train_loss": -11.539578437805176, "global_step": 338352, "epoch": 2014} {"train_loss": -10.750072479248047, "global_step": 338353, "epoch": 2014} {"train_loss": -11.510295867919922, "global_step": 338354, "epoch": 2014} {"train_loss": -11.451568603515625, "global_step": 338355, "epoch": 2014} {"train_loss": -11.351570129394531, "global_step": 338356, "epoch": 2014} {"train_loss": -11.449584007263184, "global_step": 338357, "epoch": 2014} {"train_loss": -11.45346450805664, "global_step": 338358, "epoch": 2014} {"train_loss": -11.18182373046875, "global_step": 338359, "epoch": 2014} {"train_loss": -11.681598663330078, "global_step": 338360, "epoch": 2014} {"train_loss": -11.330259323120117, "global_step": 338361, "epoch": 2014} {"train_loss": -11.324013710021973, "global_step": 338362, "epoch": 2014} {"train_loss": -11.969049453735352, "global_step": 338363, "epoch": 2014} {"train_loss": -10.774806022644043, "global_step": 338364, "epoch": 2014} {"train_loss": -11.903493881225586, "global_step": 338365, "epoch": 2014} {"train_loss": -10.50496768951416, "global_step": 338366, "epoch": 2014} {"train_loss": -11.967073440551758, "global_step": 338367, "epoch": 2014} {"train_loss": -10.992607116699219, "global_step": 338368, "epoch": 2014} {"train_loss": -11.78385066986084, "global_step": 338369, "epoch": 2014} {"train_loss": -11.705154418945312, "global_step": 338370, "epoch": 2014} {"train_loss": -11.846516609191895, "global_step": 338371, "epoch": 2014} {"train_loss": -12.031044006347656, "global_step": 338372, "epoch": 2014} {"train_loss": -11.825325012207031, "global_step": 338373, "epoch": 2014} {"train_loss": -12.165292739868164, "global_step": 338374, "epoch": 2014} {"train_loss": -11.609047889709473, "global_step": 338375, "epoch": 2014} {"train_loss": -12.103498458862305, "global_step": 338376, "epoch": 2014} {"train_loss": -11.680156707763672, "global_step": 338377, "epoch": 2014} {"train_loss": -12.052478790283203, "global_step": 338378, "epoch": 2014} {"train_loss": -11.898931503295898, "global_step": 338379, "epoch": 2014} {"train_loss": -11.85092830657959, "global_step": 338380, "epoch": 2014} {"train_loss": -12.187739372253418, "global_step": 338381, "epoch": 2014} {"train_loss": -11.948493957519531, "global_step": 338382, "epoch": 2014} {"train_loss": -12.033660888671875, "global_step": 338383, "epoch": 2014} {"train_loss": -11.882887840270996, "global_step": 338384, "epoch": 2014} {"train_loss": -11.935604095458984, "global_step": 338385, "epoch": 2014} {"train_loss": -12.483789443969727, "global_step": 338386, "epoch": 2014} {"train_loss": -12.055234909057617, "global_step": 338387, "epoch": 2014} {"train_loss": -11.984126091003418, "global_step": 338388, "epoch": 2014} {"train_loss": -12.255005836486816, "global_step": 338389, "epoch": 2014} {"train_loss": -11.867977142333984, "global_step": 338390, "epoch": 2014} {"train_loss": -12.02505874633789, "global_step": 338391, "epoch": 2014} {"train_loss": -12.048402786254883, "global_step": 338392, "epoch": 2014} {"train_loss": -11.807973861694336, "global_step": 338393, "epoch": 2014} {"train_loss": -12.127989768981934, "global_step": 338394, "epoch": 2014} {"train_loss": -11.846490859985352, "global_step": 338395, "epoch": 2014} {"train_loss": -12.122334480285645, "global_step": 338396, "epoch": 2014} {"train_loss": -12.192277908325195, "global_step": 338397, "epoch": 2014} {"train_loss": -11.710569381713867, "global_step": 338398, "epoch": 2014} {"train_loss": -12.164297103881836, "global_step": 338399, "epoch": 2014} {"train_loss": -11.740570068359375, "global_step": 338400, "epoch": 2014} {"train_loss": -12.206181526184082, "global_step": 338401, "epoch": 2014} {"train_loss": -12.266881942749023, "global_step": 338402, "epoch": 2014} {"train_loss": -12.03421401977539, "global_step": 338403, "epoch": 2014} {"train_loss": -11.937150955200195, "global_step": 338404, "epoch": 2014} {"train_loss": -12.050917625427246, "global_step": 338405, "epoch": 2014} {"train_loss": -12.440738677978516, "global_step": 338406, "epoch": 2014} {"train_loss": -12.272825241088867, "global_step": 338407, "epoch": 2014} {"train_loss": -12.150354385375977, "global_step": 338408, "epoch": 2014} {"train_loss": -12.417726516723633, "global_step": 338409, "epoch": 2014} {"train_loss": -12.09395980834961, "global_step": 338410, "epoch": 2014} {"train_loss": -12.062671661376953, "global_step": 338411, "epoch": 2014} {"train_loss": -12.428403854370117, "global_step": 338412, "epoch": 2014} {"train_loss": -12.313013076782227, "global_step": 338413, "epoch": 2014} {"train_loss": -12.46844482421875, "global_step": 338414, "epoch": 2014} {"train_loss": -12.106542587280273, "global_step": 338415, "epoch": 2014} {"train_loss": -12.463043212890625, "global_step": 338416, "epoch": 2014} {"train_loss": -12.449040412902832, "global_step": 338417, "epoch": 2014} {"train_loss": -12.239310264587402, "global_step": 338418, "epoch": 2014} {"train_loss": -12.500038146972656, "global_step": 338419, "epoch": 2014} {"train_loss": -12.159818649291992, "global_step": 338420, "epoch": 2014} {"train_loss": -12.255596160888672, "global_step": 338421, "epoch": 2014} {"train_loss": -12.31753921508789, "global_step": 338422, "epoch": 2014} {"train_loss": -12.457037925720215, "global_step": 338423, "epoch": 2014} {"train_loss": -12.328093528747559, "global_step": 338424, "epoch": 2014} {"train_loss": -12.148392677307129, "global_step": 338425, "epoch": 2014} {"train_loss": -12.290587425231934, "global_step": 338426, "epoch": 2014} {"train_loss": -12.419670104980469, "global_step": 338427, "epoch": 2014} {"train_loss": -12.160955429077148, "global_step": 338428, "epoch": 2014} {"train_loss": -12.104307174682617, "global_step": 338429, "epoch": 2014} {"train_loss": -12.062828063964844, "global_step": 338430, "epoch": 2014} {"train_loss": -12.036999702453613, "global_step": 338431, "epoch": 2014} {"train_loss": -12.434109687805176, "global_step": 338432, "epoch": 2014} {"train_loss": -12.339248657226562, "global_step": 338433, "epoch": 2014} {"train_loss": -12.49019718170166, "global_step": 338434, "epoch": 2014} {"train_loss": -12.104602813720703, "global_step": 338435, "epoch": 2014} {"train_loss": -11.754785537719727, "global_step": 338436, "epoch": 2014} {"train_loss": -12.096406936645508, "global_step": 338437, "epoch": 2014} {"train_loss": -12.105890274047852, "global_step": 338438, "epoch": 2014} {"train_loss": -11.904472351074219, "global_step": 338439, "epoch": 2014} {"train_loss": -12.352865219116211, "global_step": 338440, "epoch": 2014} {"train_loss": -12.028671264648438, "global_step": 338441, "epoch": 2014} {"train_loss": -12.23725700378418, "global_step": 338442, "epoch": 2014} {"train_loss": -11.39452838897705, "global_step": 338443, "epoch": 2014} {"train_loss": -11.45541763305664, "global_step": 338444, "epoch": 2014} {"train_loss": -11.719511032104492, "global_step": 338445, "epoch": 2014} {"train_loss": -11.88469123840332, "global_step": 338446, "epoch": 2014} {"train_loss": -11.008504867553711, "global_step": 338447, "epoch": 2014} {"train_loss": -10.795727729797363, "global_step": 338448, "epoch": 2014} {"train_loss": -12.175542831420898, "global_step": 338449, "epoch": 2014} {"train_loss": -11.06021785736084, "global_step": 338450, "epoch": 2014} {"train_loss": -12.151636123657227, "global_step": 338451, "epoch": 2014} {"train_loss": -11.365154266357422, "global_step": 338452, "epoch": 2014} {"train_loss": -11.292661666870117, "global_step": 338453, "epoch": 2014} {"train_loss": -11.405282974243164, "global_step": 338454, "epoch": 2014} {"train_loss": -11.530044555664062, "global_step": 338455, "epoch": 2014} {"train_loss": -11.773089408874512, "global_step": 338456, "epoch": 2014} {"train_loss": -12.174742698669434, "global_step": 338457, "epoch": 2014} {"train_loss": -11.183093070983887, "global_step": 338458, "epoch": 2014} {"train_loss": -11.703042984008789, "global_step": 338459, "epoch": 2014} {"train_loss": -10.935041427612305, "global_step": 338460, "epoch": 2014} {"train_loss": -11.263218879699707, "global_step": 338461, "epoch": 2014} {"train_loss": -11.445650100708008, "global_step": 338462, "epoch": 2014} {"train_loss": -11.040679931640625, "global_step": 338463, "epoch": 2014} {"train_loss": -11.062021255493164, "global_step": 338464, "epoch": 2014} {"train_loss": -11.839369773864746, "global_step": 338465, "epoch": 2014} {"train_loss": -10.581661224365234, "global_step": 338466, "epoch": 2014} {"train_loss": -12.209864616394043, "global_step": 338467, "epoch": 2014} {"train_loss": -10.732133865356445, "global_step": 338468, "epoch": 2014} {"train_loss": -11.840618133544922, "global_step": 338469, "epoch": 2014} {"train_loss": -11.003173828125, "global_step": 338470, "epoch": 2014} {"train_loss": -11.110384941101074, "global_step": 338471, "epoch": 2014} {"train_loss": -12.045626640319824, "global_step": 338472, "epoch": 2014} {"train_loss": -10.960468292236328, "global_step": 338473, "epoch": 2014} {"train_loss": -11.02459716796875, "global_step": 338474, "epoch": 2014} {"train_loss": -11.544429779052734, "global_step": 338475, "epoch": 2014} {"train_loss": -10.922460556030273, "global_step": 338476, "epoch": 2014} {"train_loss": -10.789652824401855, "global_step": 338477, "epoch": 2014} {"train_loss": -11.570564270019531, "global_step": 338478, "epoch": 2014} {"train_loss": -10.211711883544922, "global_step": 338479, "epoch": 2014} {"train_loss": -11.36009407043457, "global_step": 338480, "epoch": 2014} {"train_loss": -11.59596061706543, "global_step": 338481, "epoch": 2014} {"train_loss": -9.688681602478027, "global_step": 338482, "epoch": 2014} {"train_loss": -11.91230583190918, "global_step": 338483, "epoch": 2014} {"train_loss": -10.257410049438477, "global_step": 338484, "epoch": 2014} {"train_loss": -11.809455871582031, "global_step": 338485, "epoch": 2014} {"train_loss": -10.570024490356445, "global_step": 338486, "epoch": 2014} {"train_loss": -11.746941566467285, "global_step": 338487, "epoch": 2014} {"train_loss": -11.182121276855469, "global_step": 338488, "epoch": 2014} {"train_loss": -11.696199417114258, "global_step": 338489, "epoch": 2014} {"train_loss": -11.48184585571289, "global_step": 338490, "epoch": 2014} {"train_loss": -11.633675575256348, "global_step": 338491, "epoch": 2014} {"train_loss": -11.735332489013672, "global_step": 338492, "epoch": 2014} {"train_loss": -11.427867889404297, "global_step": 338493, "epoch": 2014} {"train_loss": -11.75086498260498, "global_step": 338494, "epoch": 2014} {"train_loss": -11.794519424438477, "global_step": 338495, "epoch": 2014} {"train_loss": -11.845498085021973, "global_step": 338496, "epoch": 2014} {"train_loss": -11.792900085449219, "global_step": 338497, "epoch": 2014} {"train_loss": -11.184795379638672, "global_step": 338498, "epoch": 2014} {"train_loss": -11.687551498413086, "global_step": 338499, "epoch": 2014} {"train_loss": -11.469947814941406, "global_step": 338500, "epoch": 2014} {"train_loss": -11.497379302978516, "global_step": 338501, "epoch": 2014} {"train_loss": -11.823883056640625, "global_step": 338502, "epoch": 2014} {"train_loss": -11.743980407714844, "global_step": 338503, "epoch": 2014} {"train_loss": -11.732343673706055, "global_step": 338504, "epoch": 2014} {"train_loss": -11.904661178588867, "global_step": 338505, "epoch": 2014} {"train_loss": -11.642338752746582, "global_step": 338506, "epoch": 2014} {"train_loss": -11.441975593566895, "global_step": 338507, "epoch": 2014} {"train_loss": -12.052681922912598, "global_step": 338508, "epoch": 2014} {"train_loss": -12.074989318847656, "global_step": 338509, "epoch": 2014} {"train_loss": -12.03738021850586, "global_step": 338510, "epoch": 2014} {"train_loss": -11.836017608642578, "global_step": 338511, "epoch": 2014} {"train_loss": -12.012487411499023, "global_step": 338512, "epoch": 2014} {"train_loss": -11.759513854980469, "global_step": 338513, "epoch": 2014} {"train_loss": -12.11828327178955, "global_step": 338514, "epoch": 2014} {"train_loss": -11.808355331420898, "global_step": 338515, "epoch": 2014} {"train_loss": -12.165620803833008, "global_step": 338516, "epoch": 2014} {"train_loss": -11.874210357666016, "global_step": 338517, "epoch": 2014} {"train_loss": -12.329748153686523, "global_step": 338518, "epoch": 2014} {"train_loss": -11.7567222345443, "global_step": 338519, "epoch": 2014, "val_loss": 288060.46875} {"train_loss": -12.057256698608398, "global_step": 338520, "epoch": 2015} {"train_loss": -11.967802047729492, "global_step": 338521, "epoch": 2015} {"train_loss": -12.119535446166992, "global_step": 338522, "epoch": 2015} {"train_loss": -11.652242660522461, "global_step": 338523, "epoch": 2015} {"train_loss": -11.980996131896973, "global_step": 338524, "epoch": 2015} {"train_loss": -11.655448913574219, "global_step": 338525, "epoch": 2015} {"train_loss": -12.126670837402344, "global_step": 338526, "epoch": 2015} {"train_loss": -12.056703567504883, "global_step": 338527, "epoch": 2015} {"train_loss": -12.041083335876465, "global_step": 338528, "epoch": 2015} {"train_loss": -12.080005645751953, "global_step": 338529, "epoch": 2015} {"train_loss": -12.178853988647461, "global_step": 338530, "epoch": 2015} {"train_loss": -12.263128280639648, "global_step": 338531, "epoch": 2015} {"train_loss": -11.714530944824219, "global_step": 338532, "epoch": 2015} {"train_loss": -11.992801666259766, "global_step": 338533, "epoch": 2015} {"train_loss": -11.950624465942383, "global_step": 338534, "epoch": 2015} {"train_loss": -12.232563018798828, "global_step": 338535, "epoch": 2015} {"train_loss": -11.932008743286133, "global_step": 338536, "epoch": 2015} {"train_loss": -11.956707000732422, "global_step": 338537, "epoch": 2015} {"train_loss": -12.001544952392578, "global_step": 338538, "epoch": 2015} {"train_loss": -11.879180908203125, "global_step": 338539, "epoch": 2015} {"train_loss": -12.214998245239258, "global_step": 338540, "epoch": 2015} {"train_loss": -11.829154968261719, "global_step": 338541, "epoch": 2015} {"train_loss": -12.419976234436035, "global_step": 338542, "epoch": 2015} {"train_loss": -11.976024627685547, "global_step": 338543, "epoch": 2015} {"train_loss": -12.322259902954102, "global_step": 338544, "epoch": 2015} {"train_loss": -12.322824478149414, "global_step": 338545, "epoch": 2015} {"train_loss": -12.137554168701172, "global_step": 338546, "epoch": 2015} {"train_loss": -12.247875213623047, "global_step": 338547, "epoch": 2015} {"train_loss": -12.183762550354004, "global_step": 338548, "epoch": 2015} {"train_loss": -12.237031936645508, "global_step": 338549, "epoch": 2015} {"train_loss": -12.338542938232422, "global_step": 338550, "epoch": 2015} {"train_loss": -12.27485466003418, "global_step": 338551, "epoch": 2015} {"train_loss": -12.263747215270996, "global_step": 338552, "epoch": 2015} {"train_loss": -12.296889305114746, "global_step": 338553, "epoch": 2015} {"train_loss": -12.567300796508789, "global_step": 338554, "epoch": 2015} {"train_loss": -12.389814376831055, "global_step": 338555, "epoch": 2015} {"train_loss": -12.167969703674316, "global_step": 338556, "epoch": 2015} {"train_loss": -12.350513458251953, "global_step": 338557, "epoch": 2015} {"train_loss": -12.270345687866211, "global_step": 338558, "epoch": 2015} {"train_loss": -12.483747482299805, "global_step": 338559, "epoch": 2015} {"train_loss": -12.168594360351562, "global_step": 338560, "epoch": 2015} {"train_loss": -12.460558891296387, "global_step": 338561, "epoch": 2015} {"train_loss": -12.392223358154297, "global_step": 338562, "epoch": 2015} {"train_loss": -12.487211227416992, "global_step": 338563, "epoch": 2015} {"train_loss": -12.054267883300781, "global_step": 338564, "epoch": 2015} {"train_loss": -12.42672061920166, "global_step": 338565, "epoch": 2015} {"train_loss": -12.065410614013672, "global_step": 338566, "epoch": 2015} {"train_loss": -12.230441093444824, "global_step": 338567, "epoch": 2015} {"train_loss": -12.149096488952637, "global_step": 338568, "epoch": 2015} {"train_loss": -12.207715034484863, "global_step": 338569, "epoch": 2015} {"train_loss": -11.46249008178711, "global_step": 338570, "epoch": 2015} {"train_loss": -12.20077133178711, "global_step": 338571, "epoch": 2015} {"train_loss": -10.937135696411133, "global_step": 338572, "epoch": 2015} {"train_loss": -11.438453674316406, "global_step": 338573, "epoch": 2015} {"train_loss": -11.739709854125977, "global_step": 338574, "epoch": 2015} {"train_loss": -11.500125885009766, "global_step": 338575, "epoch": 2015} {"train_loss": -11.833544731140137, "global_step": 338576, "epoch": 2015} {"train_loss": -11.719785690307617, "global_step": 338577, "epoch": 2015} {"train_loss": -11.246188163757324, "global_step": 338578, "epoch": 2015} {"train_loss": -11.807790756225586, "global_step": 338579, "epoch": 2015} {"train_loss": -11.164925575256348, "global_step": 338580, "epoch": 2015} {"train_loss": -11.568751335144043, "global_step": 338581, "epoch": 2015} {"train_loss": -12.289557456970215, "global_step": 338582, "epoch": 2015} {"train_loss": -11.557899475097656, "global_step": 338583, "epoch": 2015} {"train_loss": -12.06026840209961, "global_step": 338584, "epoch": 2015} {"train_loss": -12.004646301269531, "global_step": 338585, "epoch": 2015} {"train_loss": -11.81200885772705, "global_step": 338586, "epoch": 2015} {"train_loss": -11.628984451293945, "global_step": 338587, "epoch": 2015} {"train_loss": -12.189200401306152, "global_step": 338588, "epoch": 2015} {"train_loss": -12.05838394165039, "global_step": 338589, "epoch": 2015} {"train_loss": -12.289935111999512, "global_step": 338590, "epoch": 2015} {"train_loss": -12.24636459350586, "global_step": 338591, "epoch": 2015} {"train_loss": -12.356206893920898, "global_step": 338592, "epoch": 2015} {"train_loss": -12.264111518859863, "global_step": 338593, "epoch": 2015} {"train_loss": -12.329113960266113, "global_step": 338594, "epoch": 2015} {"train_loss": -12.34295654296875, "global_step": 338595, "epoch": 2015} {"train_loss": -12.155298233032227, "global_step": 338596, "epoch": 2015} {"train_loss": -11.951421737670898, "global_step": 338597, "epoch": 2015} {"train_loss": -12.42116928100586, "global_step": 338598, "epoch": 2015} {"train_loss": -12.127933502197266, "global_step": 338599, "epoch": 2015} {"train_loss": -12.158416748046875, "global_step": 338600, "epoch": 2015} {"train_loss": -12.135112762451172, "global_step": 338601, "epoch": 2015} {"train_loss": -11.836196899414062, "global_step": 338602, "epoch": 2015} {"train_loss": -12.535944938659668, "global_step": 338603, "epoch": 2015} {"train_loss": -11.970380783081055, "global_step": 338604, "epoch": 2015} {"train_loss": -12.31131362915039, "global_step": 338605, "epoch": 2015} {"train_loss": -11.876311302185059, "global_step": 338606, "epoch": 2015} {"train_loss": -12.039970397949219, "global_step": 338607, "epoch": 2015} {"train_loss": -12.0410795211792, "global_step": 338608, "epoch": 2015} {"train_loss": -11.769893646240234, "global_step": 338609, "epoch": 2015} {"train_loss": -12.223577499389648, "global_step": 338610, "epoch": 2015} {"train_loss": -12.41151237487793, "global_step": 338611, "epoch": 2015} {"train_loss": -12.312482833862305, "global_step": 338612, "epoch": 2015} {"train_loss": -12.555521965026855, "global_step": 338613, "epoch": 2015} {"train_loss": -12.449800491333008, "global_step": 338614, "epoch": 2015} {"train_loss": -12.441574096679688, "global_step": 338615, "epoch": 2015} {"train_loss": -12.451091766357422, "global_step": 338616, "epoch": 2015} {"train_loss": -12.573759078979492, "global_step": 338617, "epoch": 2015} {"train_loss": -12.29780387878418, "global_step": 338618, "epoch": 2015} {"train_loss": -12.551855087280273, "global_step": 338619, "epoch": 2015} {"train_loss": -12.346332550048828, "global_step": 338620, "epoch": 2015} {"train_loss": -12.399384498596191, "global_step": 338621, "epoch": 2015} {"train_loss": -12.311924934387207, "global_step": 338622, "epoch": 2015} {"train_loss": -12.48898696899414, "global_step": 338623, "epoch": 2015} {"train_loss": -12.386181831359863, "global_step": 338624, "epoch": 2015} {"train_loss": -12.41628646850586, "global_step": 338625, "epoch": 2015} {"train_loss": -12.310270309448242, "global_step": 338626, "epoch": 2015} {"train_loss": -12.555227279663086, "global_step": 338627, "epoch": 2015} {"train_loss": -12.473119735717773, "global_step": 338628, "epoch": 2015} {"train_loss": -12.431577682495117, "global_step": 338629, "epoch": 2015} {"train_loss": -12.613882064819336, "global_step": 338630, "epoch": 2015} {"train_loss": -12.110706329345703, "global_step": 338631, "epoch": 2015} {"train_loss": -12.098812103271484, "global_step": 338632, "epoch": 2015} {"train_loss": -12.447757720947266, "global_step": 338633, "epoch": 2015} {"train_loss": -12.397480964660645, "global_step": 338634, "epoch": 2015} {"train_loss": -11.993574142456055, "global_step": 338635, "epoch": 2015} {"train_loss": -12.328554153442383, "global_step": 338636, "epoch": 2015} {"train_loss": -12.003641128540039, "global_step": 338637, "epoch": 2015} {"train_loss": -12.345622062683105, "global_step": 338638, "epoch": 2015} {"train_loss": -12.315337181091309, "global_step": 338639, "epoch": 2015} {"train_loss": -12.37025260925293, "global_step": 338640, "epoch": 2015} {"train_loss": -12.428454399108887, "global_step": 338641, "epoch": 2015} {"train_loss": -12.456232070922852, "global_step": 338642, "epoch": 2015} {"train_loss": -12.441011428833008, "global_step": 338643, "epoch": 2015} {"train_loss": -12.536673545837402, "global_step": 338644, "epoch": 2015} {"train_loss": -12.378011703491211, "global_step": 338645, "epoch": 2015} {"train_loss": -12.533411026000977, "global_step": 338646, "epoch": 2015} {"train_loss": -12.276348114013672, "global_step": 338647, "epoch": 2015} {"train_loss": -12.497032165527344, "global_step": 338648, "epoch": 2015} {"train_loss": -11.980859756469727, "global_step": 338649, "epoch": 2015} {"train_loss": -12.513311386108398, "global_step": 338650, "epoch": 2015} {"train_loss": -11.927047729492188, "global_step": 338651, "epoch": 2015} {"train_loss": -12.260198593139648, "global_step": 338652, "epoch": 2015} {"train_loss": -12.30679702758789, "global_step": 338653, "epoch": 2015} {"train_loss": -12.354706764221191, "global_step": 338654, "epoch": 2015} {"train_loss": -12.680513381958008, "global_step": 338655, "epoch": 2015} {"train_loss": -12.669194221496582, "global_step": 338656, "epoch": 2015} {"train_loss": -12.562860488891602, "global_step": 338657, "epoch": 2015} {"train_loss": -12.51891040802002, "global_step": 338658, "epoch": 2015} {"train_loss": -12.601388931274414, "global_step": 338659, "epoch": 2015} {"train_loss": -12.525503158569336, "global_step": 338660, "epoch": 2015} {"train_loss": -11.574590682983398, "global_step": 338661, "epoch": 2015} {"train_loss": -11.089177131652832, "global_step": 338662, "epoch": 2015} {"train_loss": -12.25440788269043, "global_step": 338663, "epoch": 2015} {"train_loss": -12.21749496459961, "global_step": 338664, "epoch": 2015} {"train_loss": -11.45320987701416, "global_step": 338665, "epoch": 2015} {"train_loss": -11.879814147949219, "global_step": 338666, "epoch": 2015} {"train_loss": -12.179471969604492, "global_step": 338667, "epoch": 2015} {"train_loss": -11.620562553405762, "global_step": 338668, "epoch": 2015} {"train_loss": -10.868308067321777, "global_step": 338669, "epoch": 2015} {"train_loss": -11.456872940063477, "global_step": 338670, "epoch": 2015} {"train_loss": -11.674253463745117, "global_step": 338671, "epoch": 2015} {"train_loss": -10.436166763305664, "global_step": 338672, "epoch": 2015} {"train_loss": -11.51831340789795, "global_step": 338673, "epoch": 2015} {"train_loss": -7.755684852600098, "global_step": 338674, "epoch": 2015} {"train_loss": -8.358124732971191, "global_step": 338675, "epoch": 2015} {"train_loss": -8.01629638671875, "global_step": 338676, "epoch": 2015} {"train_loss": -9.870611190795898, "global_step": 338677, "epoch": 2015} {"train_loss": -10.467424392700195, "global_step": 338678, "epoch": 2015} {"train_loss": -9.212748527526855, "global_step": 338679, "epoch": 2015} {"train_loss": -8.615218162536621, "global_step": 338680, "epoch": 2015} {"train_loss": -10.954395294189453, "global_step": 338681, "epoch": 2015} {"train_loss": -8.913564682006836, "global_step": 338682, "epoch": 2015} {"train_loss": -11.08053970336914, "global_step": 338683, "epoch": 2015} {"train_loss": -9.467151641845703, "global_step": 338684, "epoch": 2015} {"train_loss": -10.413865089416504, "global_step": 338685, "epoch": 2015} {"train_loss": -10.479568481445312, "global_step": 338686, "epoch": 2015} {"train_loss": -11.903190578733172, "global_step": 338687, "epoch": 2015, "val_loss": 281946.375, "train_action_mse_error": 1.395134449005127} {"train_loss": -9.73898696899414, "global_step": 338688, "epoch": 2016} {"train_loss": -10.511663436889648, "global_step": 338689, "epoch": 2016} {"train_loss": -10.319450378417969, "global_step": 338690, "epoch": 2016} {"train_loss": -9.316324234008789, "global_step": 338691, "epoch": 2016} {"train_loss": -9.861626625061035, "global_step": 338692, "epoch": 2016} {"train_loss": -10.039981842041016, "global_step": 338693, "epoch": 2016} {"train_loss": -11.154813766479492, "global_step": 338694, "epoch": 2016} {"train_loss": -10.455945014953613, "global_step": 338695, "epoch": 2016} {"train_loss": -11.01028060913086, "global_step": 338696, "epoch": 2016} {"train_loss": -10.797001838684082, "global_step": 338697, "epoch": 2016} {"train_loss": -11.227632522583008, "global_step": 338698, "epoch": 2016} {"train_loss": -11.127296447753906, "global_step": 338699, "epoch": 2016} {"train_loss": -10.302907943725586, "global_step": 338700, "epoch": 2016} {"train_loss": -11.457271575927734, "global_step": 338701, "epoch": 2016} {"train_loss": -11.396587371826172, "global_step": 338702, "epoch": 2016} {"train_loss": -11.411996841430664, "global_step": 338703, "epoch": 2016} {"train_loss": -10.747127532958984, "global_step": 338704, "epoch": 2016} {"train_loss": -11.687183380126953, "global_step": 338705, "epoch": 2016} {"train_loss": -11.092876434326172, "global_step": 338706, "epoch": 2016} {"train_loss": -11.932945251464844, "global_step": 338707, "epoch": 2016} {"train_loss": -11.374711990356445, "global_step": 338708, "epoch": 2016} {"train_loss": -11.483484268188477, "global_step": 338709, "epoch": 2016} {"train_loss": -11.491195678710938, "global_step": 338710, "epoch": 2016} {"train_loss": -11.502359390258789, "global_step": 338711, "epoch": 2016} {"train_loss": -11.5281982421875, "global_step": 338712, "epoch": 2016} {"train_loss": -11.645278930664062, "global_step": 338713, "epoch": 2016} {"train_loss": -11.477958679199219, "global_step": 338714, "epoch": 2016} {"train_loss": -11.6416597366333, "global_step": 338715, "epoch": 2016} {"train_loss": -11.957714080810547, "global_step": 338716, "epoch": 2016} {"train_loss": -11.657487869262695, "global_step": 338717, "epoch": 2016} {"train_loss": -11.887007713317871, "global_step": 338718, "epoch": 2016} {"train_loss": -12.017912864685059, "global_step": 338719, "epoch": 2016} {"train_loss": -11.771015167236328, "global_step": 338720, "epoch": 2016} {"train_loss": -11.99111270904541, "global_step": 338721, "epoch": 2016} {"train_loss": -11.976157188415527, "global_step": 338722, "epoch": 2016} {"train_loss": -11.957921981811523, "global_step": 338723, "epoch": 2016} {"train_loss": -12.022180557250977, "global_step": 338724, "epoch": 2016} {"train_loss": -12.266387939453125, "global_step": 338725, "epoch": 2016} {"train_loss": -12.204225540161133, "global_step": 338726, "epoch": 2016} {"train_loss": -12.266303062438965, "global_step": 338727, "epoch": 2016} {"train_loss": -12.024530410766602, "global_step": 338728, "epoch": 2016} {"train_loss": -12.080085754394531, "global_step": 338729, "epoch": 2016} {"train_loss": -12.10047721862793, "global_step": 338730, "epoch": 2016} {"train_loss": -11.938962936401367, "global_step": 338731, "epoch": 2016} {"train_loss": -12.159950256347656, "global_step": 338732, "epoch": 2016} {"train_loss": -11.971769332885742, "global_step": 338733, "epoch": 2016} {"train_loss": -12.256030082702637, "global_step": 338734, "epoch": 2016} {"train_loss": -12.071334838867188, "global_step": 338735, "epoch": 2016} {"train_loss": -12.133264541625977, "global_step": 338736, "epoch": 2016} {"train_loss": -12.045080184936523, "global_step": 338737, "epoch": 2016} {"train_loss": -12.105228424072266, "global_step": 338738, "epoch": 2016} {"train_loss": -12.079195022583008, "global_step": 338739, "epoch": 2016} {"train_loss": -12.28327751159668, "global_step": 338740, "epoch": 2016} {"train_loss": -12.364484786987305, "global_step": 338741, "epoch": 2016} {"train_loss": -12.066780090332031, "global_step": 338742, "epoch": 2016} {"train_loss": -12.297399520874023, "global_step": 338743, "epoch": 2016} {"train_loss": -12.153629302978516, "global_step": 338744, "epoch": 2016} {"train_loss": -12.016168594360352, "global_step": 338745, "epoch": 2016} {"train_loss": -12.205421447753906, "global_step": 338746, "epoch": 2016} {"train_loss": -12.078645706176758, "global_step": 338747, "epoch": 2016} {"train_loss": -12.133552551269531, "global_step": 338748, "epoch": 2016} {"train_loss": -12.294549942016602, "global_step": 338749, "epoch": 2016} {"train_loss": -12.058431625366211, "global_step": 338750, "epoch": 2016} {"train_loss": -12.201295852661133, "global_step": 338751, "epoch": 2016} {"train_loss": -12.084585189819336, "global_step": 338752, "epoch": 2016} {"train_loss": -12.438814163208008, "global_step": 338753, "epoch": 2016} {"train_loss": -12.244978904724121, "global_step": 338754, "epoch": 2016} {"train_loss": -12.332271575927734, "global_step": 338755, "epoch": 2016} {"train_loss": -12.26506519317627, "global_step": 338756, "epoch": 2016} {"train_loss": -12.338878631591797, "global_step": 338757, "epoch": 2016} {"train_loss": -12.436725616455078, "global_step": 338758, "epoch": 2016} {"train_loss": -12.157608985900879, "global_step": 338759, "epoch": 2016} {"train_loss": -12.571775436401367, "global_step": 338760, "epoch": 2016} {"train_loss": -12.30643081665039, "global_step": 338761, "epoch": 2016} {"train_loss": -12.258960723876953, "global_step": 338762, "epoch": 2016} {"train_loss": -12.117149353027344, "global_step": 338763, "epoch": 2016} {"train_loss": -12.430469512939453, "global_step": 338764, "epoch": 2016} {"train_loss": -12.10793685913086, "global_step": 338765, "epoch": 2016} {"train_loss": -12.158503532409668, "global_step": 338766, "epoch": 2016} {"train_loss": -11.547747611999512, "global_step": 338767, "epoch": 2016} {"train_loss": -12.075063705444336, "global_step": 338768, "epoch": 2016} {"train_loss": -11.729451179504395, "global_step": 338769, "epoch": 2016} {"train_loss": -12.219929695129395, "global_step": 338770, "epoch": 2016} {"train_loss": -12.12918472290039, "global_step": 338771, "epoch": 2016} {"train_loss": -12.137022018432617, "global_step": 338772, "epoch": 2016} {"train_loss": -12.144375801086426, "global_step": 338773, "epoch": 2016} {"train_loss": -12.381958961486816, "global_step": 338774, "epoch": 2016} {"train_loss": -11.744149208068848, "global_step": 338775, "epoch": 2016} {"train_loss": -12.285022735595703, "global_step": 338776, "epoch": 2016} {"train_loss": -12.135110855102539, "global_step": 338777, "epoch": 2016} {"train_loss": -12.35004997253418, "global_step": 338778, "epoch": 2016} {"train_loss": -11.888574600219727, "global_step": 338779, "epoch": 2016} {"train_loss": -12.293303489685059, "global_step": 338780, "epoch": 2016} {"train_loss": -11.790334701538086, "global_step": 338781, "epoch": 2016} {"train_loss": -12.384407997131348, "global_step": 338782, "epoch": 2016} {"train_loss": -11.725486755371094, "global_step": 338783, "epoch": 2016} {"train_loss": -12.4133882522583, "global_step": 338784, "epoch": 2016} {"train_loss": -11.973740577697754, "global_step": 338785, "epoch": 2016} {"train_loss": -12.34331226348877, "global_step": 338786, "epoch": 2016} {"train_loss": -11.988448143005371, "global_step": 338787, "epoch": 2016} {"train_loss": -12.133728981018066, "global_step": 338788, "epoch": 2016} {"train_loss": -12.444352149963379, "global_step": 338789, "epoch": 2016} {"train_loss": -11.802453994750977, "global_step": 338790, "epoch": 2016} {"train_loss": -12.117446899414062, "global_step": 338791, "epoch": 2016} {"train_loss": -12.101846694946289, "global_step": 338792, "epoch": 2016} {"train_loss": -11.98513126373291, "global_step": 338793, "epoch": 2016} {"train_loss": -11.204402923583984, "global_step": 338794, "epoch": 2016} {"train_loss": -11.908260345458984, "global_step": 338795, "epoch": 2016} {"train_loss": -10.930585861206055, "global_step": 338796, "epoch": 2016} {"train_loss": -12.615510940551758, "global_step": 338797, "epoch": 2016} {"train_loss": -11.403861999511719, "global_step": 338798, "epoch": 2016} {"train_loss": -11.931815147399902, "global_step": 338799, "epoch": 2016} {"train_loss": -11.661677360534668, "global_step": 338800, "epoch": 2016} {"train_loss": -11.807744026184082, "global_step": 338801, "epoch": 2016} {"train_loss": -12.315818786621094, "global_step": 338802, "epoch": 2016} {"train_loss": -11.740327835083008, "global_step": 338803, "epoch": 2016} {"train_loss": -12.16598129272461, "global_step": 338804, "epoch": 2016} {"train_loss": -11.443737030029297, "global_step": 338805, "epoch": 2016} {"train_loss": -11.0647611618042, "global_step": 338806, "epoch": 2016} {"train_loss": -11.633753776550293, "global_step": 338807, "epoch": 2016} {"train_loss": -11.046445846557617, "global_step": 338808, "epoch": 2016} {"train_loss": -11.888337135314941, "global_step": 338809, "epoch": 2016} {"train_loss": -11.496414184570312, "global_step": 338810, "epoch": 2016} {"train_loss": -11.91972541809082, "global_step": 338811, "epoch": 2016} {"train_loss": -12.220847129821777, "global_step": 338812, "epoch": 2016} {"train_loss": -11.311036109924316, "global_step": 338813, "epoch": 2016} {"train_loss": -11.588212013244629, "global_step": 338814, "epoch": 2016} {"train_loss": -12.12043571472168, "global_step": 338815, "epoch": 2016} {"train_loss": -11.500167846679688, "global_step": 338816, "epoch": 2016} {"train_loss": -11.8892240524292, "global_step": 338817, "epoch": 2016} {"train_loss": -12.254005432128906, "global_step": 338818, "epoch": 2016} {"train_loss": -11.841660499572754, "global_step": 338819, "epoch": 2016} {"train_loss": -11.251893043518066, "global_step": 338820, "epoch": 2016} {"train_loss": -12.098867416381836, "global_step": 338821, "epoch": 2016} {"train_loss": -11.911865234375, "global_step": 338822, "epoch": 2016} {"train_loss": -11.295055389404297, "global_step": 338823, "epoch": 2016} {"train_loss": -11.861719131469727, "global_step": 338824, "epoch": 2016} {"train_loss": -11.919052124023438, "global_step": 338825, "epoch": 2016} {"train_loss": -11.34980583190918, "global_step": 338826, "epoch": 2016} {"train_loss": -12.161272048950195, "global_step": 338827, "epoch": 2016} {"train_loss": -11.58852481842041, "global_step": 338828, "epoch": 2016} {"train_loss": -11.422767639160156, "global_step": 338829, "epoch": 2016} {"train_loss": -12.203505516052246, "global_step": 338830, "epoch": 2016} {"train_loss": -11.645463943481445, "global_step": 338831, "epoch": 2016} {"train_loss": -12.331136703491211, "global_step": 338832, "epoch": 2016} {"train_loss": -11.706111907958984, "global_step": 338833, "epoch": 2016} {"train_loss": -12.267898559570312, "global_step": 338834, "epoch": 2016} {"train_loss": -11.681219100952148, "global_step": 338835, "epoch": 2016} {"train_loss": -12.234001159667969, "global_step": 338836, "epoch": 2016} {"train_loss": -12.077730178833008, "global_step": 338837, "epoch": 2016} {"train_loss": -11.825315475463867, "global_step": 338838, "epoch": 2016} {"train_loss": -12.002449989318848, "global_step": 338839, "epoch": 2016} {"train_loss": -12.341593742370605, "global_step": 338840, "epoch": 2016} {"train_loss": -12.230914115905762, "global_step": 338841, "epoch": 2016} {"train_loss": -12.300593376159668, "global_step": 338842, "epoch": 2016} {"train_loss": -12.48824691772461, "global_step": 338843, "epoch": 2016} {"train_loss": -12.082868576049805, "global_step": 338844, "epoch": 2016} {"train_loss": -12.299211502075195, "global_step": 338845, "epoch": 2016} {"train_loss": -12.208548545837402, "global_step": 338846, "epoch": 2016} {"train_loss": -12.223892211914062, "global_step": 338847, "epoch": 2016} {"train_loss": -11.905649185180664, "global_step": 338848, "epoch": 2016} {"train_loss": -12.220203399658203, "global_step": 338849, "epoch": 2016} {"train_loss": -11.880539894104004, "global_step": 338850, "epoch": 2016} {"train_loss": -12.388298988342285, "global_step": 338851, "epoch": 2016} {"train_loss": -12.326841354370117, "global_step": 338852, "epoch": 2016} {"train_loss": -12.335063934326172, "global_step": 338853, "epoch": 2016} {"train_loss": -12.356697082519531, "global_step": 338854, "epoch": 2016} {"train_loss": -11.850118478139242, "global_step": 338855, "epoch": 2016, "val_loss": 286319.40625} {"train_loss": -12.314045906066895, "global_step": 338856, "epoch": 2017} {"train_loss": -12.23509693145752, "global_step": 338857, "epoch": 2017} {"train_loss": -12.225481033325195, "global_step": 338858, "epoch": 2017} {"train_loss": -11.839314460754395, "global_step": 338859, "epoch": 2017} {"train_loss": -12.248205184936523, "global_step": 338860, "epoch": 2017} {"train_loss": -12.03388500213623, "global_step": 338861, "epoch": 2017} {"train_loss": -12.089131355285645, "global_step": 338862, "epoch": 2017} {"train_loss": -12.075576782226562, "global_step": 338863, "epoch": 2017} {"train_loss": -12.519142150878906, "global_step": 338864, "epoch": 2017} {"train_loss": -12.200443267822266, "global_step": 338865, "epoch": 2017} {"train_loss": -12.086687088012695, "global_step": 338866, "epoch": 2017} {"train_loss": -12.184404373168945, "global_step": 338867, "epoch": 2017} {"train_loss": -12.41977596282959, "global_step": 338868, "epoch": 2017} {"train_loss": -12.041704177856445, "global_step": 338869, "epoch": 2017} {"train_loss": -12.115205764770508, "global_step": 338870, "epoch": 2017} {"train_loss": -12.100074768066406, "global_step": 338871, "epoch": 2017} {"train_loss": -11.701764106750488, "global_step": 338872, "epoch": 2017} {"train_loss": -12.630932807922363, "global_step": 338873, "epoch": 2017} {"train_loss": -12.10879898071289, "global_step": 338874, "epoch": 2017} {"train_loss": -12.254744529724121, "global_step": 338875, "epoch": 2017} {"train_loss": -12.307352066040039, "global_step": 338876, "epoch": 2017} {"train_loss": -12.267927169799805, "global_step": 338877, "epoch": 2017} {"train_loss": -11.942811965942383, "global_step": 338878, "epoch": 2017} {"train_loss": -12.09164810180664, "global_step": 338879, "epoch": 2017} {"train_loss": -11.42877197265625, "global_step": 338880, "epoch": 2017} {"train_loss": -11.789531707763672, "global_step": 338881, "epoch": 2017} {"train_loss": -11.742280960083008, "global_step": 338882, "epoch": 2017} {"train_loss": -11.337128639221191, "global_step": 338883, "epoch": 2017} {"train_loss": -11.356902122497559, "global_step": 338884, "epoch": 2017} {"train_loss": -11.45555305480957, "global_step": 338885, "epoch": 2017} {"train_loss": -11.430307388305664, "global_step": 338886, "epoch": 2017} {"train_loss": -11.738519668579102, "global_step": 338887, "epoch": 2017} {"train_loss": -10.414631843566895, "global_step": 338888, "epoch": 2017} {"train_loss": -11.729475021362305, "global_step": 338889, "epoch": 2017} {"train_loss": -8.804162979125977, "global_step": 338890, "epoch": 2017} {"train_loss": -11.374035835266113, "global_step": 338891, "epoch": 2017} {"train_loss": -9.316473007202148, "global_step": 338892, "epoch": 2017} {"train_loss": -11.132315635681152, "global_step": 338893, "epoch": 2017} {"train_loss": -11.009054183959961, "global_step": 338894, "epoch": 2017} {"train_loss": -9.391889572143555, "global_step": 338895, "epoch": 2017} {"train_loss": -11.78750991821289, "global_step": 338896, "epoch": 2017} {"train_loss": -9.783950805664062, "global_step": 338897, "epoch": 2017} {"train_loss": -11.768460273742676, "global_step": 338898, "epoch": 2017} {"train_loss": -10.645683288574219, "global_step": 338899, "epoch": 2017} {"train_loss": -11.764101028442383, "global_step": 338900, "epoch": 2017} {"train_loss": -10.66486930847168, "global_step": 338901, "epoch": 2017} {"train_loss": -11.573892593383789, "global_step": 338902, "epoch": 2017} {"train_loss": -11.45664119720459, "global_step": 338903, "epoch": 2017} {"train_loss": -11.348898887634277, "global_step": 338904, "epoch": 2017} {"train_loss": -9.79682731628418, "global_step": 338905, "epoch": 2017} {"train_loss": -11.648711204528809, "global_step": 338906, "epoch": 2017} {"train_loss": -9.363882064819336, "global_step": 338907, "epoch": 2017} {"train_loss": -11.520364761352539, "global_step": 338908, "epoch": 2017} {"train_loss": -11.109700202941895, "global_step": 338909, "epoch": 2017} {"train_loss": -10.74677848815918, "global_step": 338910, "epoch": 2017} {"train_loss": -11.94207763671875, "global_step": 338911, "epoch": 2017} {"train_loss": -11.260958671569824, "global_step": 338912, "epoch": 2017} {"train_loss": -11.099666595458984, "global_step": 338913, "epoch": 2017} {"train_loss": -11.700773239135742, "global_step": 338914, "epoch": 2017} {"train_loss": -11.119438171386719, "global_step": 338915, "epoch": 2017} {"train_loss": -11.910530090332031, "global_step": 338916, "epoch": 2017} {"train_loss": -11.2711181640625, "global_step": 338917, "epoch": 2017} {"train_loss": -11.388838768005371, "global_step": 338918, "epoch": 2017} {"train_loss": -11.40415096282959, "global_step": 338919, "epoch": 2017} {"train_loss": -11.759246826171875, "global_step": 338920, "epoch": 2017} {"train_loss": -11.638383865356445, "global_step": 338921, "epoch": 2017} {"train_loss": -12.14370346069336, "global_step": 338922, "epoch": 2017} {"train_loss": -11.795838356018066, "global_step": 338923, "epoch": 2017} {"train_loss": -12.047216415405273, "global_step": 338924, "epoch": 2017} {"train_loss": -12.098784446716309, "global_step": 338925, "epoch": 2017} {"train_loss": -12.00072193145752, "global_step": 338926, "epoch": 2017} {"train_loss": -11.861814498901367, "global_step": 338927, "epoch": 2017} {"train_loss": -12.04181957244873, "global_step": 338928, "epoch": 2017} {"train_loss": -12.055498123168945, "global_step": 338929, "epoch": 2017} {"train_loss": -12.122537612915039, "global_step": 338930, "epoch": 2017} {"train_loss": -12.02680492401123, "global_step": 338931, "epoch": 2017} {"train_loss": -12.220536231994629, "global_step": 338932, "epoch": 2017} {"train_loss": -12.067636489868164, "global_step": 338933, "epoch": 2017} {"train_loss": -12.237817764282227, "global_step": 338934, "epoch": 2017} {"train_loss": -12.089438438415527, "global_step": 338935, "epoch": 2017} {"train_loss": -12.10242748260498, "global_step": 338936, "epoch": 2017} {"train_loss": -12.100903511047363, "global_step": 338937, "epoch": 2017} {"train_loss": -12.18466567993164, "global_step": 338938, "epoch": 2017} {"train_loss": -12.236371994018555, "global_step": 338939, "epoch": 2017} {"train_loss": -12.346237182617188, "global_step": 338940, "epoch": 2017} {"train_loss": -12.2413330078125, "global_step": 338941, "epoch": 2017} {"train_loss": -12.398053169250488, "global_step": 338942, "epoch": 2017} {"train_loss": -12.137590408325195, "global_step": 338943, "epoch": 2017} {"train_loss": -11.936958312988281, "global_step": 338944, "epoch": 2017} {"train_loss": -12.35291862487793, "global_step": 338945, "epoch": 2017} {"train_loss": -12.177779197692871, "global_step": 338946, "epoch": 2017} {"train_loss": -12.274015426635742, "global_step": 338947, "epoch": 2017} {"train_loss": -12.171791076660156, "global_step": 338948, "epoch": 2017} {"train_loss": -12.377116203308105, "global_step": 338949, "epoch": 2017} {"train_loss": -11.986257553100586, "global_step": 338950, "epoch": 2017} {"train_loss": -12.400596618652344, "global_step": 338951, "epoch": 2017} {"train_loss": -12.401385307312012, "global_step": 338952, "epoch": 2017} {"train_loss": -12.502668380737305, "global_step": 338953, "epoch": 2017} {"train_loss": -12.218428611755371, "global_step": 338954, "epoch": 2017} {"train_loss": -12.34588623046875, "global_step": 338955, "epoch": 2017} {"train_loss": -12.449238777160645, "global_step": 338956, "epoch": 2017} {"train_loss": -12.580510139465332, "global_step": 338957, "epoch": 2017} {"train_loss": -12.456502914428711, "global_step": 338958, "epoch": 2017} {"train_loss": -12.321367263793945, "global_step": 338959, "epoch": 2017} {"train_loss": -12.45458698272705, "global_step": 338960, "epoch": 2017} {"train_loss": -12.505001068115234, "global_step": 338961, "epoch": 2017} {"train_loss": -12.46657943725586, "global_step": 338962, "epoch": 2017} {"train_loss": -12.211690902709961, "global_step": 338963, "epoch": 2017} {"train_loss": -12.545063972473145, "global_step": 338964, "epoch": 2017} {"train_loss": -12.359159469604492, "global_step": 338965, "epoch": 2017} {"train_loss": -12.579020500183105, "global_step": 338966, "epoch": 2017} {"train_loss": -12.532169342041016, "global_step": 338967, "epoch": 2017} {"train_loss": -12.415653228759766, "global_step": 338968, "epoch": 2017} {"train_loss": -12.63838005065918, "global_step": 338969, "epoch": 2017} {"train_loss": -12.662397384643555, "global_step": 338970, "epoch": 2017} {"train_loss": -12.388864517211914, "global_step": 338971, "epoch": 2017} {"train_loss": -12.41090202331543, "global_step": 338972, "epoch": 2017} {"train_loss": -12.288629531860352, "global_step": 338973, "epoch": 2017} {"train_loss": -12.512298583984375, "global_step": 338974, "epoch": 2017} {"train_loss": -12.401912689208984, "global_step": 338975, "epoch": 2017} {"train_loss": -12.368276596069336, "global_step": 338976, "epoch": 2017} {"train_loss": -12.481792449951172, "global_step": 338977, "epoch": 2017} {"train_loss": -12.339330673217773, "global_step": 338978, "epoch": 2017} {"train_loss": -12.181446075439453, "global_step": 338979, "epoch": 2017} {"train_loss": -12.399097442626953, "global_step": 338980, "epoch": 2017} {"train_loss": -12.517166137695312, "global_step": 338981, "epoch": 2017} {"train_loss": -12.506855010986328, "global_step": 338982, "epoch": 2017} {"train_loss": -12.116463661193848, "global_step": 338983, "epoch": 2017} {"train_loss": -12.492767333984375, "global_step": 338984, "epoch": 2017} {"train_loss": -12.361879348754883, "global_step": 338985, "epoch": 2017} {"train_loss": -11.660150527954102, "global_step": 338986, "epoch": 2017} {"train_loss": -12.183015823364258, "global_step": 338987, "epoch": 2017} {"train_loss": -12.365906715393066, "global_step": 338988, "epoch": 2017} {"train_loss": -11.275203704833984, "global_step": 338989, "epoch": 2017} {"train_loss": -11.696928024291992, "global_step": 338990, "epoch": 2017} {"train_loss": -12.360451698303223, "global_step": 338991, "epoch": 2017} {"train_loss": -11.8687105178833, "global_step": 338992, "epoch": 2017} {"train_loss": -11.279126167297363, "global_step": 338993, "epoch": 2017} {"train_loss": -11.856892585754395, "global_step": 338994, "epoch": 2017} {"train_loss": -12.411325454711914, "global_step": 338995, "epoch": 2017} {"train_loss": -11.849939346313477, "global_step": 338996, "epoch": 2017} {"train_loss": -12.515172958374023, "global_step": 338997, "epoch": 2017} {"train_loss": -11.400175094604492, "global_step": 338998, "epoch": 2017} {"train_loss": -11.869613647460938, "global_step": 338999, "epoch": 2017} {"train_loss": -12.349930763244629, "global_step": 339000, "epoch": 2017} {"train_loss": -12.342086791992188, "global_step": 339001, "epoch": 2017} {"train_loss": -12.248764038085938, "global_step": 339002, "epoch": 2017} {"train_loss": -12.481114387512207, "global_step": 339003, "epoch": 2017} {"train_loss": -12.210684776306152, "global_step": 339004, "epoch": 2017} {"train_loss": -12.363161087036133, "global_step": 339005, "epoch": 2017} {"train_loss": -12.412885665893555, "global_step": 339006, "epoch": 2017} {"train_loss": -12.286571502685547, "global_step": 339007, "epoch": 2017} {"train_loss": -11.174570083618164, "global_step": 339008, "epoch": 2017} {"train_loss": -12.177966117858887, "global_step": 339009, "epoch": 2017} {"train_loss": -11.756353378295898, "global_step": 339010, "epoch": 2017} {"train_loss": -11.853191375732422, "global_step": 339011, "epoch": 2017} {"train_loss": -10.916929244995117, "global_step": 339012, "epoch": 2017} {"train_loss": -12.275681495666504, "global_step": 339013, "epoch": 2017} {"train_loss": -11.522783279418945, "global_step": 339014, "epoch": 2017} {"train_loss": -10.770636558532715, "global_step": 339015, "epoch": 2017} {"train_loss": -11.551591873168945, "global_step": 339016, "epoch": 2017} {"train_loss": -11.979619979858398, "global_step": 339017, "epoch": 2017} {"train_loss": -11.24786376953125, "global_step": 339018, "epoch": 2017} {"train_loss": -12.063215255737305, "global_step": 339019, "epoch": 2017} {"train_loss": -11.817436218261719, "global_step": 339020, "epoch": 2017} {"train_loss": -10.813523292541504, "global_step": 339021, "epoch": 2017} {"train_loss": -11.890769004821777, "global_step": 339022, "epoch": 2017} {"train_loss": -11.878905665306817, "global_step": 339023, "epoch": 2017, "val_loss": 286678.25} {"train_loss": -11.37415885925293, "global_step": 339024, "epoch": 2018} {"train_loss": -10.852876663208008, "global_step": 339025, "epoch": 2018} {"train_loss": -11.870566368103027, "global_step": 339026, "epoch": 2018} {"train_loss": -11.600034713745117, "global_step": 339027, "epoch": 2018} {"train_loss": -11.450592041015625, "global_step": 339028, "epoch": 2018} {"train_loss": -11.981401443481445, "global_step": 339029, "epoch": 2018} {"train_loss": -11.764805793762207, "global_step": 339030, "epoch": 2018} {"train_loss": -11.006935119628906, "global_step": 339031, "epoch": 2018} {"train_loss": -12.092702865600586, "global_step": 339032, "epoch": 2018} {"train_loss": -11.095224380493164, "global_step": 339033, "epoch": 2018} {"train_loss": -11.415497779846191, "global_step": 339034, "epoch": 2018} {"train_loss": -12.173606872558594, "global_step": 339035, "epoch": 2018} {"train_loss": -11.273122787475586, "global_step": 339036, "epoch": 2018} {"train_loss": -11.884147644042969, "global_step": 339037, "epoch": 2018} {"train_loss": -11.658464431762695, "global_step": 339038, "epoch": 2018} {"train_loss": -11.200252532958984, "global_step": 339039, "epoch": 2018} {"train_loss": -12.075248718261719, "global_step": 339040, "epoch": 2018} {"train_loss": -11.63644790649414, "global_step": 339041, "epoch": 2018} {"train_loss": -11.618721961975098, "global_step": 339042, "epoch": 2018} {"train_loss": -12.063741683959961, "global_step": 339043, "epoch": 2018} {"train_loss": -12.103073120117188, "global_step": 339044, "epoch": 2018} {"train_loss": -12.365467071533203, "global_step": 339045, "epoch": 2018} {"train_loss": -11.827237129211426, "global_step": 339046, "epoch": 2018} {"train_loss": -12.13061237335205, "global_step": 339047, "epoch": 2018} {"train_loss": -11.968948364257812, "global_step": 339048, "epoch": 2018} {"train_loss": -11.79134750366211, "global_step": 339049, "epoch": 2018} {"train_loss": -11.996335983276367, "global_step": 339050, "epoch": 2018} {"train_loss": -11.849095344543457, "global_step": 339051, "epoch": 2018} {"train_loss": -12.161642074584961, "global_step": 339052, "epoch": 2018} {"train_loss": -11.942191123962402, "global_step": 339053, "epoch": 2018} {"train_loss": -12.090428352355957, "global_step": 339054, "epoch": 2018} {"train_loss": -12.094413757324219, "global_step": 339055, "epoch": 2018} {"train_loss": -11.591300964355469, "global_step": 339056, "epoch": 2018} {"train_loss": -12.269932746887207, "global_step": 339057, "epoch": 2018} {"train_loss": -12.117616653442383, "global_step": 339058, "epoch": 2018} {"train_loss": -12.233441352844238, "global_step": 339059, "epoch": 2018} {"train_loss": -12.157787322998047, "global_step": 339060, "epoch": 2018} {"train_loss": -11.911438941955566, "global_step": 339061, "epoch": 2018} {"train_loss": -12.15414047241211, "global_step": 339062, "epoch": 2018} {"train_loss": -12.094369888305664, "global_step": 339063, "epoch": 2018} {"train_loss": -12.242137908935547, "global_step": 339064, "epoch": 2018} {"train_loss": -12.551294326782227, "global_step": 339065, "epoch": 2018} {"train_loss": -12.055679321289062, "global_step": 339066, "epoch": 2018} {"train_loss": -12.512184143066406, "global_step": 339067, "epoch": 2018} {"train_loss": -12.017023086547852, "global_step": 339068, "epoch": 2018} {"train_loss": -12.531042098999023, "global_step": 339069, "epoch": 2018} {"train_loss": -11.993983268737793, "global_step": 339070, "epoch": 2018} {"train_loss": -12.228121757507324, "global_step": 339071, "epoch": 2018} {"train_loss": -12.040144920349121, "global_step": 339072, "epoch": 2018} {"train_loss": -12.332710266113281, "global_step": 339073, "epoch": 2018} {"train_loss": -11.938467025756836, "global_step": 339074, "epoch": 2018} {"train_loss": -11.826510429382324, "global_step": 339075, "epoch": 2018} {"train_loss": -12.197982788085938, "global_step": 339076, "epoch": 2018} {"train_loss": -11.416888236999512, "global_step": 339077, "epoch": 2018} {"train_loss": -12.001502990722656, "global_step": 339078, "epoch": 2018} {"train_loss": -11.269706726074219, "global_step": 339079, "epoch": 2018} {"train_loss": -12.484733581542969, "global_step": 339080, "epoch": 2018} {"train_loss": -11.372978210449219, "global_step": 339081, "epoch": 2018} {"train_loss": -12.479665756225586, "global_step": 339082, "epoch": 2018} {"train_loss": -11.643312454223633, "global_step": 339083, "epoch": 2018} {"train_loss": -12.217910766601562, "global_step": 339084, "epoch": 2018} {"train_loss": -12.002140045166016, "global_step": 339085, "epoch": 2018} {"train_loss": -12.239315032958984, "global_step": 339086, "epoch": 2018} {"train_loss": -12.080240249633789, "global_step": 339087, "epoch": 2018} {"train_loss": -12.182157516479492, "global_step": 339088, "epoch": 2018} {"train_loss": -11.953807830810547, "global_step": 339089, "epoch": 2018} {"train_loss": -12.21839714050293, "global_step": 339090, "epoch": 2018} {"train_loss": -12.283166885375977, "global_step": 339091, "epoch": 2018} {"train_loss": -12.482871055603027, "global_step": 339092, "epoch": 2018} {"train_loss": -12.1951322555542, "global_step": 339093, "epoch": 2018} {"train_loss": -12.03911018371582, "global_step": 339094, "epoch": 2018} {"train_loss": -12.10849380493164, "global_step": 339095, "epoch": 2018} {"train_loss": -12.192508697509766, "global_step": 339096, "epoch": 2018} {"train_loss": -12.00248908996582, "global_step": 339097, "epoch": 2018} {"train_loss": -11.897052764892578, "global_step": 339098, "epoch": 2018} {"train_loss": -11.993696212768555, "global_step": 339099, "epoch": 2018} {"train_loss": -11.627716064453125, "global_step": 339100, "epoch": 2018} {"train_loss": -12.101272583007812, "global_step": 339101, "epoch": 2018} {"train_loss": -11.947626113891602, "global_step": 339102, "epoch": 2018} {"train_loss": -11.75086784362793, "global_step": 339103, "epoch": 2018} {"train_loss": -11.795073509216309, "global_step": 339104, "epoch": 2018} {"train_loss": -12.105798721313477, "global_step": 339105, "epoch": 2018} {"train_loss": -11.788057327270508, "global_step": 339106, "epoch": 2018} {"train_loss": -12.002514839172363, "global_step": 339107, "epoch": 2018} {"train_loss": -10.312986373901367, "global_step": 339108, "epoch": 2018} {"train_loss": -12.014623641967773, "global_step": 339109, "epoch": 2018} {"train_loss": -10.847009658813477, "global_step": 339110, "epoch": 2018} {"train_loss": -11.867215156555176, "global_step": 339111, "epoch": 2018} {"train_loss": -11.016622543334961, "global_step": 339112, "epoch": 2018} {"train_loss": -10.536877632141113, "global_step": 339113, "epoch": 2018} {"train_loss": -10.620495796203613, "global_step": 339114, "epoch": 2018} {"train_loss": -9.48159408569336, "global_step": 339115, "epoch": 2018} {"train_loss": -10.00882339477539, "global_step": 339116, "epoch": 2018} {"train_loss": -10.977707862854004, "global_step": 339117, "epoch": 2018} {"train_loss": -10.6910400390625, "global_step": 339118, "epoch": 2018} {"train_loss": -10.302392959594727, "global_step": 339119, "epoch": 2018} {"train_loss": -10.700193405151367, "global_step": 339120, "epoch": 2018} {"train_loss": -11.406346321105957, "global_step": 339121, "epoch": 2018} {"train_loss": -10.895395278930664, "global_step": 339122, "epoch": 2018} {"train_loss": -11.645849227905273, "global_step": 339123, "epoch": 2018} {"train_loss": -10.969583511352539, "global_step": 339124, "epoch": 2018} {"train_loss": -11.273666381835938, "global_step": 339125, "epoch": 2018} {"train_loss": -11.82951545715332, "global_step": 339126, "epoch": 2018} {"train_loss": -10.407302856445312, "global_step": 339127, "epoch": 2018} {"train_loss": -11.846756935119629, "global_step": 339128, "epoch": 2018} {"train_loss": -10.800483703613281, "global_step": 339129, "epoch": 2018} {"train_loss": -11.666013717651367, "global_step": 339130, "epoch": 2018} {"train_loss": -11.34687614440918, "global_step": 339131, "epoch": 2018} {"train_loss": -11.729583740234375, "global_step": 339132, "epoch": 2018} {"train_loss": -11.740517616271973, "global_step": 339133, "epoch": 2018} {"train_loss": -11.929510116577148, "global_step": 339134, "epoch": 2018} {"train_loss": -12.027176856994629, "global_step": 339135, "epoch": 2018} {"train_loss": -11.936033248901367, "global_step": 339136, "epoch": 2018} {"train_loss": -11.910202026367188, "global_step": 339137, "epoch": 2018} {"train_loss": -12.010083198547363, "global_step": 339138, "epoch": 2018} {"train_loss": -12.123285293579102, "global_step": 339139, "epoch": 2018} {"train_loss": -11.807291030883789, "global_step": 339140, "epoch": 2018} {"train_loss": -12.005958557128906, "global_step": 339141, "epoch": 2018} {"train_loss": -11.932278633117676, "global_step": 339142, "epoch": 2018} {"train_loss": -12.221272468566895, "global_step": 339143, "epoch": 2018} {"train_loss": -12.146859169006348, "global_step": 339144, "epoch": 2018} {"train_loss": -12.263537406921387, "global_step": 339145, "epoch": 2018} {"train_loss": -11.845596313476562, "global_step": 339146, "epoch": 2018} {"train_loss": -12.212841033935547, "global_step": 339147, "epoch": 2018} {"train_loss": -12.028839111328125, "global_step": 339148, "epoch": 2018} {"train_loss": -12.24984359741211, "global_step": 339149, "epoch": 2018} {"train_loss": -12.243734359741211, "global_step": 339150, "epoch": 2018} {"train_loss": -12.448262214660645, "global_step": 339151, "epoch": 2018} {"train_loss": -12.365671157836914, "global_step": 339152, "epoch": 2018} {"train_loss": -12.32491397857666, "global_step": 339153, "epoch": 2018} {"train_loss": -12.378320693969727, "global_step": 339154, "epoch": 2018} {"train_loss": -12.52220630645752, "global_step": 339155, "epoch": 2018} {"train_loss": -12.248366355895996, "global_step": 339156, "epoch": 2018} {"train_loss": -12.360153198242188, "global_step": 339157, "epoch": 2018} {"train_loss": -12.294493675231934, "global_step": 339158, "epoch": 2018} {"train_loss": -12.233580589294434, "global_step": 339159, "epoch": 2018} {"train_loss": -12.503276824951172, "global_step": 339160, "epoch": 2018} {"train_loss": -12.297142028808594, "global_step": 339161, "epoch": 2018} {"train_loss": -12.508981704711914, "global_step": 339162, "epoch": 2018} {"train_loss": -12.394775390625, "global_step": 339163, "epoch": 2018} {"train_loss": -12.688117980957031, "global_step": 339164, "epoch": 2018} {"train_loss": -12.396121978759766, "global_step": 339165, "epoch": 2018} {"train_loss": -12.329379081726074, "global_step": 339166, "epoch": 2018} {"train_loss": -12.448495864868164, "global_step": 339167, "epoch": 2018} {"train_loss": -12.334333419799805, "global_step": 339168, "epoch": 2018} {"train_loss": -12.682570457458496, "global_step": 339169, "epoch": 2018} {"train_loss": -12.286653518676758, "global_step": 339170, "epoch": 2018} {"train_loss": -12.196683883666992, "global_step": 339171, "epoch": 2018} {"train_loss": -12.502995491027832, "global_step": 339172, "epoch": 2018} {"train_loss": -12.256799697875977, "global_step": 339173, "epoch": 2018} {"train_loss": -12.12938404083252, "global_step": 339174, "epoch": 2018} {"train_loss": -12.12598991394043, "global_step": 339175, "epoch": 2018} {"train_loss": -12.586363792419434, "global_step": 339176, "epoch": 2018} {"train_loss": -11.96299934387207, "global_step": 339177, "epoch": 2018} {"train_loss": -12.450977325439453, "global_step": 339178, "epoch": 2018} {"train_loss": -12.374292373657227, "global_step": 339179, "epoch": 2018} {"train_loss": -12.492050170898438, "global_step": 339180, "epoch": 2018} {"train_loss": -12.537713050842285, "global_step": 339181, "epoch": 2018} {"train_loss": -12.227010726928711, "global_step": 339182, "epoch": 2018} {"train_loss": -12.579561233520508, "global_step": 339183, "epoch": 2018} {"train_loss": -12.188299179077148, "global_step": 339184, "epoch": 2018} {"train_loss": -12.526440620422363, "global_step": 339185, "epoch": 2018} {"train_loss": -11.781599044799805, "global_step": 339186, "epoch": 2018} {"train_loss": -12.203227043151855, "global_step": 339187, "epoch": 2018} {"train_loss": -12.536375999450684, "global_step": 339188, "epoch": 2018} {"train_loss": -12.232341766357422, "global_step": 339189, "epoch": 2018} {"train_loss": -12.33287239074707, "global_step": 339190, "epoch": 2018} {"train_loss": -11.916332744416737, "global_step": 339191, "epoch": 2018, "val_loss": 287298.34375} {"train_loss": -12.233924865722656, "global_step": 339192, "epoch": 2019} {"train_loss": -12.618281364440918, "global_step": 339193, "epoch": 2019} {"train_loss": -12.281756401062012, "global_step": 339194, "epoch": 2019} {"train_loss": -12.338062286376953, "global_step": 339195, "epoch": 2019} {"train_loss": -12.303143501281738, "global_step": 339196, "epoch": 2019} {"train_loss": -12.229475975036621, "global_step": 339197, "epoch": 2019} {"train_loss": -12.05770492553711, "global_step": 339198, "epoch": 2019} {"train_loss": -12.137932777404785, "global_step": 339199, "epoch": 2019} {"train_loss": -12.269820213317871, "global_step": 339200, "epoch": 2019} {"train_loss": -12.148303985595703, "global_step": 339201, "epoch": 2019} {"train_loss": -12.006288528442383, "global_step": 339202, "epoch": 2019} {"train_loss": -11.98568344116211, "global_step": 339203, "epoch": 2019} {"train_loss": -11.49078369140625, "global_step": 339204, "epoch": 2019} {"train_loss": -10.770608901977539, "global_step": 339205, "epoch": 2019} {"train_loss": -12.254712104797363, "global_step": 339206, "epoch": 2019} {"train_loss": -11.204963684082031, "global_step": 339207, "epoch": 2019} {"train_loss": -11.712392807006836, "global_step": 339208, "epoch": 2019} {"train_loss": -12.05573844909668, "global_step": 339209, "epoch": 2019} {"train_loss": -11.520562171936035, "global_step": 339210, "epoch": 2019} {"train_loss": -12.119287490844727, "global_step": 339211, "epoch": 2019} {"train_loss": -11.611732482910156, "global_step": 339212, "epoch": 2019} {"train_loss": -12.466825485229492, "global_step": 339213, "epoch": 2019} {"train_loss": -11.76684284210205, "global_step": 339214, "epoch": 2019} {"train_loss": -12.124577522277832, "global_step": 339215, "epoch": 2019} {"train_loss": -11.980992317199707, "global_step": 339216, "epoch": 2019} {"train_loss": -11.093870162963867, "global_step": 339217, "epoch": 2019} {"train_loss": -12.155778884887695, "global_step": 339218, "epoch": 2019} {"train_loss": -11.699142456054688, "global_step": 339219, "epoch": 2019} {"train_loss": -12.2943696975708, "global_step": 339220, "epoch": 2019} {"train_loss": -12.25121784210205, "global_step": 339221, "epoch": 2019} {"train_loss": -11.820470809936523, "global_step": 339222, "epoch": 2019} {"train_loss": -11.733595848083496, "global_step": 339223, "epoch": 2019} {"train_loss": -11.959491729736328, "global_step": 339224, "epoch": 2019} {"train_loss": -11.28087043762207, "global_step": 339225, "epoch": 2019} {"train_loss": -11.267904281616211, "global_step": 339226, "epoch": 2019} {"train_loss": -12.039060592651367, "global_step": 339227, "epoch": 2019} {"train_loss": -11.697037696838379, "global_step": 339228, "epoch": 2019} {"train_loss": -11.237655639648438, "global_step": 339229, "epoch": 2019} {"train_loss": -11.964661598205566, "global_step": 339230, "epoch": 2019} {"train_loss": -10.955169677734375, "global_step": 339231, "epoch": 2019} {"train_loss": -12.231099128723145, "global_step": 339232, "epoch": 2019} {"train_loss": -11.395576477050781, "global_step": 339233, "epoch": 2019} {"train_loss": -11.682802200317383, "global_step": 339234, "epoch": 2019} {"train_loss": -11.488394737243652, "global_step": 339235, "epoch": 2019} {"train_loss": -11.265095710754395, "global_step": 339236, "epoch": 2019} {"train_loss": -10.67091178894043, "global_step": 339237, "epoch": 2019} {"train_loss": -11.435434341430664, "global_step": 339238, "epoch": 2019} {"train_loss": -11.316048622131348, "global_step": 339239, "epoch": 2019} {"train_loss": -10.06167221069336, "global_step": 339240, "epoch": 2019} {"train_loss": -11.52426815032959, "global_step": 339241, "epoch": 2019} {"train_loss": -11.098858833312988, "global_step": 339242, "epoch": 2019} {"train_loss": -11.851215362548828, "global_step": 339243, "epoch": 2019} {"train_loss": -10.84205436706543, "global_step": 339244, "epoch": 2019} {"train_loss": -10.983658790588379, "global_step": 339245, "epoch": 2019} {"train_loss": -11.334181785583496, "global_step": 339246, "epoch": 2019} {"train_loss": -10.610549926757812, "global_step": 339247, "epoch": 2019} {"train_loss": -11.183427810668945, "global_step": 339248, "epoch": 2019} {"train_loss": -11.77497673034668, "global_step": 339249, "epoch": 2019} {"train_loss": -10.749612808227539, "global_step": 339250, "epoch": 2019} {"train_loss": -12.102938652038574, "global_step": 339251, "epoch": 2019} {"train_loss": -11.263479232788086, "global_step": 339252, "epoch": 2019} {"train_loss": -11.528841018676758, "global_step": 339253, "epoch": 2019} {"train_loss": -11.489655494689941, "global_step": 339254, "epoch": 2019} {"train_loss": -11.738191604614258, "global_step": 339255, "epoch": 2019} {"train_loss": -11.280563354492188, "global_step": 339256, "epoch": 2019} {"train_loss": -11.755203247070312, "global_step": 339257, "epoch": 2019} {"train_loss": -11.410415649414062, "global_step": 339258, "epoch": 2019} {"train_loss": -11.456169128417969, "global_step": 339259, "epoch": 2019} {"train_loss": -11.085296630859375, "global_step": 339260, "epoch": 2019} {"train_loss": -11.341556549072266, "global_step": 339261, "epoch": 2019} {"train_loss": -12.02527141571045, "global_step": 339262, "epoch": 2019} {"train_loss": -9.929803848266602, "global_step": 339263, "epoch": 2019} {"train_loss": -11.72360610961914, "global_step": 339264, "epoch": 2019} {"train_loss": -11.811056137084961, "global_step": 339265, "epoch": 2019} {"train_loss": -11.315776824951172, "global_step": 339266, "epoch": 2019} {"train_loss": -11.476676940917969, "global_step": 339267, "epoch": 2019} {"train_loss": -11.469505310058594, "global_step": 339268, "epoch": 2019} {"train_loss": -11.467927932739258, "global_step": 339269, "epoch": 2019} {"train_loss": -11.790584564208984, "global_step": 339270, "epoch": 2019} {"train_loss": -11.157499313354492, "global_step": 339271, "epoch": 2019} {"train_loss": -11.733268737792969, "global_step": 339272, "epoch": 2019} {"train_loss": -11.535037994384766, "global_step": 339273, "epoch": 2019} {"train_loss": -11.900440216064453, "global_step": 339274, "epoch": 2019} {"train_loss": -11.886100769042969, "global_step": 339275, "epoch": 2019} {"train_loss": -11.39061164855957, "global_step": 339276, "epoch": 2019} {"train_loss": -11.742622375488281, "global_step": 339277, "epoch": 2019} {"train_loss": -11.53587818145752, "global_step": 339278, "epoch": 2019} {"train_loss": -11.782880783081055, "global_step": 339279, "epoch": 2019} {"train_loss": -11.626527786254883, "global_step": 339280, "epoch": 2019} {"train_loss": -11.65981674194336, "global_step": 339281, "epoch": 2019} {"train_loss": -11.759841918945312, "global_step": 339282, "epoch": 2019} {"train_loss": -11.440387725830078, "global_step": 339283, "epoch": 2019} {"train_loss": -11.843467712402344, "global_step": 339284, "epoch": 2019} {"train_loss": -11.752676010131836, "global_step": 339285, "epoch": 2019} {"train_loss": -11.846969604492188, "global_step": 339286, "epoch": 2019} {"train_loss": -12.052093505859375, "global_step": 339287, "epoch": 2019} {"train_loss": -11.86601734161377, "global_step": 339288, "epoch": 2019} {"train_loss": -12.411215782165527, "global_step": 339289, "epoch": 2019} {"train_loss": -12.15243148803711, "global_step": 339290, "epoch": 2019} {"train_loss": -12.033601760864258, "global_step": 339291, "epoch": 2019} {"train_loss": -12.304143905639648, "global_step": 339292, "epoch": 2019} {"train_loss": -12.008516311645508, "global_step": 339293, "epoch": 2019} {"train_loss": -12.052083969116211, "global_step": 339294, "epoch": 2019} {"train_loss": -12.243778228759766, "global_step": 339295, "epoch": 2019} {"train_loss": -12.202070236206055, "global_step": 339296, "epoch": 2019} {"train_loss": -12.168590545654297, "global_step": 339297, "epoch": 2019} {"train_loss": -12.267640113830566, "global_step": 339298, "epoch": 2019} {"train_loss": -12.271260261535645, "global_step": 339299, "epoch": 2019} {"train_loss": -12.172083854675293, "global_step": 339300, "epoch": 2019} {"train_loss": -12.17110824584961, "global_step": 339301, "epoch": 2019} {"train_loss": -11.93874740600586, "global_step": 339302, "epoch": 2019} {"train_loss": -12.446264266967773, "global_step": 339303, "epoch": 2019} {"train_loss": -12.284908294677734, "global_step": 339304, "epoch": 2019} {"train_loss": -12.303268432617188, "global_step": 339305, "epoch": 2019} {"train_loss": -12.307121276855469, "global_step": 339306, "epoch": 2019} {"train_loss": -12.125686645507812, "global_step": 339307, "epoch": 2019} {"train_loss": -12.23111629486084, "global_step": 339308, "epoch": 2019} {"train_loss": -12.433415412902832, "global_step": 339309, "epoch": 2019} {"train_loss": -12.455942153930664, "global_step": 339310, "epoch": 2019} {"train_loss": -12.348036766052246, "global_step": 339311, "epoch": 2019} {"train_loss": -12.460983276367188, "global_step": 339312, "epoch": 2019} {"train_loss": -12.151809692382812, "global_step": 339313, "epoch": 2019} {"train_loss": -12.558265686035156, "global_step": 339314, "epoch": 2019} {"train_loss": -12.325543403625488, "global_step": 339315, "epoch": 2019} {"train_loss": -12.409652709960938, "global_step": 339316, "epoch": 2019} {"train_loss": -12.273054122924805, "global_step": 339317, "epoch": 2019} {"train_loss": -12.333404541015625, "global_step": 339318, "epoch": 2019} {"train_loss": -12.392964363098145, "global_step": 339319, "epoch": 2019} {"train_loss": -12.482658386230469, "global_step": 339320, "epoch": 2019} {"train_loss": -12.489702224731445, "global_step": 339321, "epoch": 2019} {"train_loss": -12.321002960205078, "global_step": 339322, "epoch": 2019} {"train_loss": -12.557876586914062, "global_step": 339323, "epoch": 2019} {"train_loss": -12.494613647460938, "global_step": 339324, "epoch": 2019} {"train_loss": -12.388481140136719, "global_step": 339325, "epoch": 2019} {"train_loss": -12.567757606506348, "global_step": 339326, "epoch": 2019} {"train_loss": -12.273597717285156, "global_step": 339327, "epoch": 2019} {"train_loss": -12.39763069152832, "global_step": 339328, "epoch": 2019} {"train_loss": -12.455057144165039, "global_step": 339329, "epoch": 2019} {"train_loss": -12.590330123901367, "global_step": 339330, "epoch": 2019} {"train_loss": -12.698614120483398, "global_step": 339331, "epoch": 2019} {"train_loss": -12.501541137695312, "global_step": 339332, "epoch": 2019} {"train_loss": -12.410287857055664, "global_step": 339333, "epoch": 2019} {"train_loss": -12.588613510131836, "global_step": 339334, "epoch": 2019} {"train_loss": -12.617032051086426, "global_step": 339335, "epoch": 2019} {"train_loss": -12.717949867248535, "global_step": 339336, "epoch": 2019} {"train_loss": -12.685699462890625, "global_step": 339337, "epoch": 2019} {"train_loss": -12.611995697021484, "global_step": 339338, "epoch": 2019} {"train_loss": -12.66150951385498, "global_step": 339339, "epoch": 2019} {"train_loss": -12.442774772644043, "global_step": 339340, "epoch": 2019} {"train_loss": -12.2652006149292, "global_step": 339341, "epoch": 2019} {"train_loss": -12.177312850952148, "global_step": 339342, "epoch": 2019} {"train_loss": -12.360128402709961, "global_step": 339343, "epoch": 2019} {"train_loss": -12.151533126831055, "global_step": 339344, "epoch": 2019} {"train_loss": -12.20399284362793, "global_step": 339345, "epoch": 2019} {"train_loss": -11.372697830200195, "global_step": 339346, "epoch": 2019} {"train_loss": -11.299567222595215, "global_step": 339347, "epoch": 2019} {"train_loss": -12.551236152648926, "global_step": 339348, "epoch": 2019} {"train_loss": -12.115253448486328, "global_step": 339349, "epoch": 2019} {"train_loss": -12.500276565551758, "global_step": 339350, "epoch": 2019} {"train_loss": -12.490021705627441, "global_step": 339351, "epoch": 2019} {"train_loss": -12.41726303100586, "global_step": 339352, "epoch": 2019} {"train_loss": -12.231266021728516, "global_step": 339353, "epoch": 2019} {"train_loss": -12.393588066101074, "global_step": 339354, "epoch": 2019} {"train_loss": -12.013526916503906, "global_step": 339355, "epoch": 2019} {"train_loss": -12.284333229064941, "global_step": 339356, "epoch": 2019} {"train_loss": -12.15818977355957, "global_step": 339357, "epoch": 2019} {"train_loss": -12.238250732421875, "global_step": 339358, "epoch": 2019} {"train_loss": -11.921451210975647, "global_step": 339359, "epoch": 2019, "val_loss": 290051.9375} {"train_loss": -12.769365310668945, "global_step": 339360, "epoch": 2020} {"train_loss": -12.167678833007812, "global_step": 339361, "epoch": 2020} {"train_loss": -12.562738418579102, "global_step": 339362, "epoch": 2020} {"train_loss": -12.233783721923828, "global_step": 339363, "epoch": 2020} {"train_loss": -12.586362838745117, "global_step": 339364, "epoch": 2020} {"train_loss": -12.04501724243164, "global_step": 339365, "epoch": 2020} {"train_loss": -12.15310287475586, "global_step": 339366, "epoch": 2020} {"train_loss": -12.07544994354248, "global_step": 339367, "epoch": 2020} {"train_loss": -11.581460952758789, "global_step": 339368, "epoch": 2020} {"train_loss": -11.841691970825195, "global_step": 339369, "epoch": 2020} {"train_loss": -12.377567291259766, "global_step": 339370, "epoch": 2020} {"train_loss": -12.304389953613281, "global_step": 339371, "epoch": 2020} {"train_loss": -12.479458808898926, "global_step": 339372, "epoch": 2020} {"train_loss": -11.954487800598145, "global_step": 339373, "epoch": 2020} {"train_loss": -10.77058219909668, "global_step": 339374, "epoch": 2020} {"train_loss": -11.094669342041016, "global_step": 339375, "epoch": 2020} {"train_loss": -12.084580421447754, "global_step": 339376, "epoch": 2020} {"train_loss": -11.743614196777344, "global_step": 339377, "epoch": 2020} {"train_loss": -10.563549041748047, "global_step": 339378, "epoch": 2020} {"train_loss": -11.682255744934082, "global_step": 339379, "epoch": 2020} {"train_loss": -11.416942596435547, "global_step": 339380, "epoch": 2020} {"train_loss": -11.071090698242188, "global_step": 339381, "epoch": 2020} {"train_loss": -11.51699447631836, "global_step": 339382, "epoch": 2020} {"train_loss": -11.151239395141602, "global_step": 339383, "epoch": 2020} {"train_loss": -11.063783645629883, "global_step": 339384, "epoch": 2020} {"train_loss": -11.128992080688477, "global_step": 339385, "epoch": 2020} {"train_loss": -10.731091499328613, "global_step": 339386, "epoch": 2020} {"train_loss": -9.673746109008789, "global_step": 339387, "epoch": 2020} {"train_loss": -12.341838836669922, "global_step": 339388, "epoch": 2020} {"train_loss": -10.069173812866211, "global_step": 339389, "epoch": 2020} {"train_loss": -11.350724220275879, "global_step": 339390, "epoch": 2020} {"train_loss": -8.777423858642578, "global_step": 339391, "epoch": 2020} {"train_loss": -9.991512298583984, "global_step": 339392, "epoch": 2020} {"train_loss": -9.850175857543945, "global_step": 339393, "epoch": 2020} {"train_loss": -10.515117645263672, "global_step": 339394, "epoch": 2020} {"train_loss": -9.004194259643555, "global_step": 339395, "epoch": 2020} {"train_loss": -10.219234466552734, "global_step": 339396, "epoch": 2020} {"train_loss": -10.767110824584961, "global_step": 339397, "epoch": 2020} {"train_loss": -10.358807563781738, "global_step": 339398, "epoch": 2020} {"train_loss": -10.020565032958984, "global_step": 339399, "epoch": 2020} {"train_loss": -10.473026275634766, "global_step": 339400, "epoch": 2020} {"train_loss": -11.326461791992188, "global_step": 339401, "epoch": 2020} {"train_loss": -11.362279891967773, "global_step": 339402, "epoch": 2020} {"train_loss": -11.161381721496582, "global_step": 339403, "epoch": 2020} {"train_loss": -11.71665096282959, "global_step": 339404, "epoch": 2020} {"train_loss": -11.401503562927246, "global_step": 339405, "epoch": 2020} {"train_loss": -11.536764144897461, "global_step": 339406, "epoch": 2020} {"train_loss": -11.42167854309082, "global_step": 339407, "epoch": 2020} {"train_loss": -11.198116302490234, "global_step": 339408, "epoch": 2020} {"train_loss": -11.485030174255371, "global_step": 339409, "epoch": 2020} {"train_loss": -11.801349639892578, "global_step": 339410, "epoch": 2020} {"train_loss": -12.014512062072754, "global_step": 339411, "epoch": 2020} {"train_loss": -11.47318172454834, "global_step": 339412, "epoch": 2020} {"train_loss": -12.170713424682617, "global_step": 339413, "epoch": 2020} {"train_loss": -12.03913402557373, "global_step": 339414, "epoch": 2020} {"train_loss": -11.52199935913086, "global_step": 339415, "epoch": 2020} {"train_loss": -11.877084732055664, "global_step": 339416, "epoch": 2020} {"train_loss": -12.02956771850586, "global_step": 339417, "epoch": 2020} {"train_loss": -11.889883041381836, "global_step": 339418, "epoch": 2020} {"train_loss": -11.987908363342285, "global_step": 339419, "epoch": 2020} {"train_loss": -11.848947525024414, "global_step": 339420, "epoch": 2020} {"train_loss": -11.954814910888672, "global_step": 339421, "epoch": 2020} {"train_loss": -11.933494567871094, "global_step": 339422, "epoch": 2020} {"train_loss": -11.722919464111328, "global_step": 339423, "epoch": 2020} {"train_loss": -12.212188720703125, "global_step": 339424, "epoch": 2020} {"train_loss": -11.860563278198242, "global_step": 339425, "epoch": 2020} {"train_loss": -11.766801834106445, "global_step": 339426, "epoch": 2020} {"train_loss": -11.54561996459961, "global_step": 339427, "epoch": 2020} {"train_loss": -12.2666597366333, "global_step": 339428, "epoch": 2020} {"train_loss": -11.837249755859375, "global_step": 339429, "epoch": 2020} {"train_loss": -12.043208122253418, "global_step": 339430, "epoch": 2020} {"train_loss": -12.076620101928711, "global_step": 339431, "epoch": 2020} {"train_loss": -12.021350860595703, "global_step": 339432, "epoch": 2020} {"train_loss": -12.283108711242676, "global_step": 339433, "epoch": 2020} {"train_loss": -11.832752227783203, "global_step": 339434, "epoch": 2020} {"train_loss": -12.382570266723633, "global_step": 339435, "epoch": 2020} {"train_loss": -12.1918306350708, "global_step": 339436, "epoch": 2020} {"train_loss": -12.209348678588867, "global_step": 339437, "epoch": 2020} {"train_loss": -12.33270263671875, "global_step": 339438, "epoch": 2020} {"train_loss": -12.387392044067383, "global_step": 339439, "epoch": 2020} {"train_loss": -12.247123718261719, "global_step": 339440, "epoch": 2020} {"train_loss": -12.230698585510254, "global_step": 339441, "epoch": 2020} {"train_loss": -12.26003646850586, "global_step": 339442, "epoch": 2020} {"train_loss": -12.342972755432129, "global_step": 339443, "epoch": 2020} {"train_loss": -12.187067031860352, "global_step": 339444, "epoch": 2020} {"train_loss": -12.208658218383789, "global_step": 339445, "epoch": 2020} {"train_loss": -12.177091598510742, "global_step": 339446, "epoch": 2020} {"train_loss": -12.23971176147461, "global_step": 339447, "epoch": 2020} {"train_loss": -12.233686447143555, "global_step": 339448, "epoch": 2020} {"train_loss": -12.457052230834961, "global_step": 339449, "epoch": 2020} {"train_loss": -12.14849853515625, "global_step": 339450, "epoch": 2020} {"train_loss": -12.285862922668457, "global_step": 339451, "epoch": 2020} {"train_loss": -12.142658233642578, "global_step": 339452, "epoch": 2020} {"train_loss": -12.285202026367188, "global_step": 339453, "epoch": 2020} {"train_loss": -12.031779289245605, "global_step": 339454, "epoch": 2020} {"train_loss": -12.356937408447266, "global_step": 339455, "epoch": 2020} {"train_loss": -12.301064491271973, "global_step": 339456, "epoch": 2020} {"train_loss": -12.05556869506836, "global_step": 339457, "epoch": 2020} {"train_loss": -12.486381530761719, "global_step": 339458, "epoch": 2020} {"train_loss": -12.234722137451172, "global_step": 339459, "epoch": 2020} {"train_loss": -12.523597717285156, "global_step": 339460, "epoch": 2020} {"train_loss": -12.220443725585938, "global_step": 339461, "epoch": 2020} {"train_loss": -12.237882614135742, "global_step": 339462, "epoch": 2020} {"train_loss": -12.589347839355469, "global_step": 339463, "epoch": 2020} {"train_loss": -12.574443817138672, "global_step": 339464, "epoch": 2020} {"train_loss": -12.482236862182617, "global_step": 339465, "epoch": 2020} {"train_loss": -12.174116134643555, "global_step": 339466, "epoch": 2020} {"train_loss": -12.200325012207031, "global_step": 339467, "epoch": 2020} {"train_loss": -12.129454612731934, "global_step": 339468, "epoch": 2020} {"train_loss": -12.332878112792969, "global_step": 339469, "epoch": 2020} {"train_loss": -12.246442794799805, "global_step": 339470, "epoch": 2020} {"train_loss": -12.392281532287598, "global_step": 339471, "epoch": 2020} {"train_loss": -12.266217231750488, "global_step": 339472, "epoch": 2020} {"train_loss": -12.410980224609375, "global_step": 339473, "epoch": 2020} {"train_loss": -12.380976676940918, "global_step": 339474, "epoch": 2020} {"train_loss": -12.044524192810059, "global_step": 339475, "epoch": 2020} {"train_loss": -12.297172546386719, "global_step": 339476, "epoch": 2020} {"train_loss": -12.234654426574707, "global_step": 339477, "epoch": 2020} {"train_loss": -12.362159729003906, "global_step": 339478, "epoch": 2020} {"train_loss": -12.37301254272461, "global_step": 339479, "epoch": 2020} {"train_loss": -12.355155944824219, "global_step": 339480, "epoch": 2020} {"train_loss": -12.569421768188477, "global_step": 339481, "epoch": 2020} {"train_loss": -12.582544326782227, "global_step": 339482, "epoch": 2020} {"train_loss": -12.464616775512695, "global_step": 339483, "epoch": 2020} {"train_loss": -12.581605911254883, "global_step": 339484, "epoch": 2020} {"train_loss": -12.24250602722168, "global_step": 339485, "epoch": 2020} {"train_loss": -12.378410339355469, "global_step": 339486, "epoch": 2020} {"train_loss": -12.407675743103027, "global_step": 339487, "epoch": 2020} {"train_loss": -12.234046936035156, "global_step": 339488, "epoch": 2020} {"train_loss": -11.417839050292969, "global_step": 339489, "epoch": 2020} {"train_loss": -12.098838806152344, "global_step": 339490, "epoch": 2020} {"train_loss": -12.20458698272705, "global_step": 339491, "epoch": 2020} {"train_loss": -11.189719200134277, "global_step": 339492, "epoch": 2020} {"train_loss": -9.989295959472656, "global_step": 339493, "epoch": 2020} {"train_loss": -10.020740509033203, "global_step": 339494, "epoch": 2020} {"train_loss": -11.904777526855469, "global_step": 339495, "epoch": 2020} {"train_loss": -10.857388496398926, "global_step": 339496, "epoch": 2020} {"train_loss": -12.238153457641602, "global_step": 339497, "epoch": 2020} {"train_loss": -11.596149444580078, "global_step": 339498, "epoch": 2020} {"train_loss": -11.266716957092285, "global_step": 339499, "epoch": 2020} {"train_loss": -11.709030151367188, "global_step": 339500, "epoch": 2020} {"train_loss": -12.347820281982422, "global_step": 339501, "epoch": 2020} {"train_loss": -12.091814041137695, "global_step": 339502, "epoch": 2020} {"train_loss": -11.639484405517578, "global_step": 339503, "epoch": 2020} {"train_loss": -11.421223640441895, "global_step": 339504, "epoch": 2020} {"train_loss": -12.284242630004883, "global_step": 339505, "epoch": 2020} {"train_loss": -11.660858154296875, "global_step": 339506, "epoch": 2020} {"train_loss": -12.328977584838867, "global_step": 339507, "epoch": 2020} {"train_loss": -11.725168228149414, "global_step": 339508, "epoch": 2020} {"train_loss": -11.930157661437988, "global_step": 339509, "epoch": 2020} {"train_loss": -12.31714916229248, "global_step": 339510, "epoch": 2020} {"train_loss": -11.564051628112793, "global_step": 339511, "epoch": 2020} {"train_loss": -11.618157386779785, "global_step": 339512, "epoch": 2020} {"train_loss": -11.823444366455078, "global_step": 339513, "epoch": 2020} {"train_loss": -10.2700777053833, "global_step": 339514, "epoch": 2020} {"train_loss": -12.191411972045898, "global_step": 339515, "epoch": 2020} {"train_loss": -9.031551361083984, "global_step": 339516, "epoch": 2020} {"train_loss": -10.961091041564941, "global_step": 339517, "epoch": 2020} {"train_loss": -9.93464183807373, "global_step": 339518, "epoch": 2020} {"train_loss": -9.740715026855469, "global_step": 339519, "epoch": 2020} {"train_loss": -7.797359943389893, "global_step": 339520, "epoch": 2020} {"train_loss": -7.896738052368164, "global_step": 339521, "epoch": 2020} {"train_loss": -9.007935523986816, "global_step": 339522, "epoch": 2020} {"train_loss": -10.028818130493164, "global_step": 339523, "epoch": 2020} {"train_loss": -10.320035934448242, "global_step": 339524, "epoch": 2020} {"train_loss": -9.34717845916748, "global_step": 339525, "epoch": 2020} {"train_loss": -9.220212936401367, "global_step": 339526, "epoch": 2020} {"train_loss": -11.614418855735234, "global_step": 339527, "epoch": 2020, "val_loss": 277245.53125, "train_action_mse_error": 1.5543861389160156} {"train_loss": -9.45595645904541, "global_step": 339528, "epoch": 2021} {"train_loss": -9.243531227111816, "global_step": 339529, "epoch": 2021} {"train_loss": -10.340482711791992, "global_step": 339530, "epoch": 2021} {"train_loss": -9.777491569519043, "global_step": 339531, "epoch": 2021} {"train_loss": -10.152193069458008, "global_step": 339532, "epoch": 2021} {"train_loss": -10.832315444946289, "global_step": 339533, "epoch": 2021} {"train_loss": -11.207385063171387, "global_step": 339534, "epoch": 2021} {"train_loss": -10.302104949951172, "global_step": 339535, "epoch": 2021} {"train_loss": -11.291836738586426, "global_step": 339536, "epoch": 2021} {"train_loss": -9.782514572143555, "global_step": 339537, "epoch": 2021} {"train_loss": -10.620104789733887, "global_step": 339538, "epoch": 2021} {"train_loss": -11.336877822875977, "global_step": 339539, "epoch": 2021} {"train_loss": -10.272178649902344, "global_step": 339540, "epoch": 2021} {"train_loss": -11.539091110229492, "global_step": 339541, "epoch": 2021} {"train_loss": -11.094236373901367, "global_step": 339542, "epoch": 2021} {"train_loss": -11.638496398925781, "global_step": 339543, "epoch": 2021} {"train_loss": -11.256196975708008, "global_step": 339544, "epoch": 2021} {"train_loss": -11.286293983459473, "global_step": 339545, "epoch": 2021} {"train_loss": -11.53671646118164, "global_step": 339546, "epoch": 2021} {"train_loss": -11.582969665527344, "global_step": 339547, "epoch": 2021} {"train_loss": -11.652655601501465, "global_step": 339548, "epoch": 2021} {"train_loss": -11.706708908081055, "global_step": 339549, "epoch": 2021} {"train_loss": -11.784195899963379, "global_step": 339550, "epoch": 2021} {"train_loss": -11.85595703125, "global_step": 339551, "epoch": 2021} {"train_loss": -11.925182342529297, "global_step": 339552, "epoch": 2021} {"train_loss": -11.797381401062012, "global_step": 339553, "epoch": 2021} {"train_loss": -11.662043571472168, "global_step": 339554, "epoch": 2021} {"train_loss": -11.923805236816406, "global_step": 339555, "epoch": 2021} {"train_loss": -11.844561576843262, "global_step": 339556, "epoch": 2021} {"train_loss": -11.807374954223633, "global_step": 339557, "epoch": 2021} {"train_loss": -11.833586692810059, "global_step": 339558, "epoch": 2021} {"train_loss": -11.749687194824219, "global_step": 339559, "epoch": 2021} {"train_loss": -12.00927448272705, "global_step": 339560, "epoch": 2021} {"train_loss": -11.850460052490234, "global_step": 339561, "epoch": 2021} {"train_loss": -11.785078048706055, "global_step": 339562, "epoch": 2021} {"train_loss": -11.811336517333984, "global_step": 339563, "epoch": 2021} {"train_loss": -12.122001647949219, "global_step": 339564, "epoch": 2021} {"train_loss": -11.909433364868164, "global_step": 339565, "epoch": 2021} {"train_loss": -11.825811386108398, "global_step": 339566, "epoch": 2021} {"train_loss": -11.770490646362305, "global_step": 339567, "epoch": 2021} {"train_loss": -11.44856071472168, "global_step": 339568, "epoch": 2021} {"train_loss": -11.860130310058594, "global_step": 339569, "epoch": 2021} {"train_loss": -11.95102310180664, "global_step": 339570, "epoch": 2021} {"train_loss": -12.0208158493042, "global_step": 339571, "epoch": 2021} {"train_loss": -12.160323143005371, "global_step": 339572, "epoch": 2021} {"train_loss": -11.992881774902344, "global_step": 339573, "epoch": 2021} {"train_loss": -11.711076736450195, "global_step": 339574, "epoch": 2021} {"train_loss": -12.096790313720703, "global_step": 339575, "epoch": 2021} {"train_loss": -12.02306079864502, "global_step": 339576, "epoch": 2021} {"train_loss": -12.031845092773438, "global_step": 339577, "epoch": 2021} {"train_loss": -12.163311958312988, "global_step": 339578, "epoch": 2021} {"train_loss": -12.111289024353027, "global_step": 339579, "epoch": 2021} {"train_loss": -12.262422561645508, "global_step": 339580, "epoch": 2021} {"train_loss": -12.203386306762695, "global_step": 339581, "epoch": 2021} {"train_loss": -12.364845275878906, "global_step": 339582, "epoch": 2021} {"train_loss": -12.150245666503906, "global_step": 339583, "epoch": 2021} {"train_loss": -12.445140838623047, "global_step": 339584, "epoch": 2021} {"train_loss": -12.064840316772461, "global_step": 339585, "epoch": 2021} {"train_loss": -11.810157775878906, "global_step": 339586, "epoch": 2021} {"train_loss": -12.319683074951172, "global_step": 339587, "epoch": 2021} {"train_loss": -12.169583320617676, "global_step": 339588, "epoch": 2021} {"train_loss": -12.307198524475098, "global_step": 339589, "epoch": 2021} {"train_loss": -12.143645286560059, "global_step": 339590, "epoch": 2021} {"train_loss": -12.31589126586914, "global_step": 339591, "epoch": 2021} {"train_loss": -12.078020095825195, "global_step": 339592, "epoch": 2021} {"train_loss": -12.326814651489258, "global_step": 339593, "epoch": 2021} {"train_loss": -12.184617042541504, "global_step": 339594, "epoch": 2021} {"train_loss": -12.398073196411133, "global_step": 339595, "epoch": 2021} {"train_loss": -12.309062957763672, "global_step": 339596, "epoch": 2021} {"train_loss": -12.519264221191406, "global_step": 339597, "epoch": 2021} {"train_loss": -12.398542404174805, "global_step": 339598, "epoch": 2021} {"train_loss": -12.518177032470703, "global_step": 339599, "epoch": 2021} {"train_loss": -12.334758758544922, "global_step": 339600, "epoch": 2021} {"train_loss": -12.419742584228516, "global_step": 339601, "epoch": 2021} {"train_loss": -12.478212356567383, "global_step": 339602, "epoch": 2021} {"train_loss": -12.27112865447998, "global_step": 339603, "epoch": 2021} {"train_loss": -12.38853645324707, "global_step": 339604, "epoch": 2021} {"train_loss": -12.384714126586914, "global_step": 339605, "epoch": 2021} {"train_loss": -12.256010055541992, "global_step": 339606, "epoch": 2021} {"train_loss": -12.50582218170166, "global_step": 339607, "epoch": 2021} {"train_loss": -12.147558212280273, "global_step": 339608, "epoch": 2021} {"train_loss": -12.297822952270508, "global_step": 339609, "epoch": 2021} {"train_loss": -12.400520324707031, "global_step": 339610, "epoch": 2021} {"train_loss": -11.977853775024414, "global_step": 339611, "epoch": 2021} {"train_loss": -12.564931869506836, "global_step": 339612, "epoch": 2021} {"train_loss": -12.278192520141602, "global_step": 339613, "epoch": 2021} {"train_loss": -12.257226943969727, "global_step": 339614, "epoch": 2021} {"train_loss": -12.21792984008789, "global_step": 339615, "epoch": 2021} {"train_loss": -11.974000930786133, "global_step": 339616, "epoch": 2021} {"train_loss": -12.563508987426758, "global_step": 339617, "epoch": 2021} {"train_loss": -12.056365966796875, "global_step": 339618, "epoch": 2021} {"train_loss": -12.422001838684082, "global_step": 339619, "epoch": 2021} {"train_loss": -12.38555908203125, "global_step": 339620, "epoch": 2021} {"train_loss": -12.501605987548828, "global_step": 339621, "epoch": 2021} {"train_loss": -12.433616638183594, "global_step": 339622, "epoch": 2021} {"train_loss": -12.686004638671875, "global_step": 339623, "epoch": 2021} {"train_loss": -12.61530876159668, "global_step": 339624, "epoch": 2021} {"train_loss": -12.52225112915039, "global_step": 339625, "epoch": 2021} {"train_loss": -12.569341659545898, "global_step": 339626, "epoch": 2021} {"train_loss": -12.394593238830566, "global_step": 339627, "epoch": 2021} {"train_loss": -12.420721054077148, "global_step": 339628, "epoch": 2021} {"train_loss": -12.375925064086914, "global_step": 339629, "epoch": 2021} {"train_loss": -12.592625617980957, "global_step": 339630, "epoch": 2021} {"train_loss": -12.288188934326172, "global_step": 339631, "epoch": 2021} {"train_loss": -12.444360733032227, "global_step": 339632, "epoch": 2021} {"train_loss": -12.257558822631836, "global_step": 339633, "epoch": 2021} {"train_loss": -12.609146118164062, "global_step": 339634, "epoch": 2021} {"train_loss": -12.452254295349121, "global_step": 339635, "epoch": 2021} {"train_loss": -12.52110481262207, "global_step": 339636, "epoch": 2021} {"train_loss": -11.968034744262695, "global_step": 339637, "epoch": 2021} {"train_loss": -12.577733993530273, "global_step": 339638, "epoch": 2021} {"train_loss": -12.375651359558105, "global_step": 339639, "epoch": 2021} {"train_loss": -12.655474662780762, "global_step": 339640, "epoch": 2021} {"train_loss": -12.405647277832031, "global_step": 339641, "epoch": 2021} {"train_loss": -12.411029815673828, "global_step": 339642, "epoch": 2021} {"train_loss": -12.405647277832031, "global_step": 339643, "epoch": 2021} {"train_loss": -12.54131031036377, "global_step": 339644, "epoch": 2021} {"train_loss": -12.283685684204102, "global_step": 339645, "epoch": 2021} {"train_loss": -12.555790901184082, "global_step": 339646, "epoch": 2021} {"train_loss": -12.080146789550781, "global_step": 339647, "epoch": 2021} {"train_loss": -11.662168502807617, "global_step": 339648, "epoch": 2021} {"train_loss": -11.612747192382812, "global_step": 339649, "epoch": 2021} {"train_loss": -12.288468360900879, "global_step": 339650, "epoch": 2021} {"train_loss": -11.840160369873047, "global_step": 339651, "epoch": 2021} {"train_loss": -10.851550102233887, "global_step": 339652, "epoch": 2021} {"train_loss": -10.876242637634277, "global_step": 339653, "epoch": 2021} {"train_loss": -11.483760833740234, "global_step": 339654, "epoch": 2021} {"train_loss": -11.760066032409668, "global_step": 339655, "epoch": 2021} {"train_loss": -10.236705780029297, "global_step": 339656, "epoch": 2021} {"train_loss": -11.58824348449707, "global_step": 339657, "epoch": 2021} {"train_loss": -8.88730239868164, "global_step": 339658, "epoch": 2021} {"train_loss": -7.972613334655762, "global_step": 339659, "epoch": 2021} {"train_loss": -8.755943298339844, "global_step": 339660, "epoch": 2021} {"train_loss": -8.79498291015625, "global_step": 339661, "epoch": 2021} {"train_loss": -10.569901466369629, "global_step": 339662, "epoch": 2021} {"train_loss": -9.083295822143555, "global_step": 339663, "epoch": 2021} {"train_loss": -10.407922744750977, "global_step": 339664, "epoch": 2021} {"train_loss": -10.043274879455566, "global_step": 339665, "epoch": 2021} {"train_loss": -10.976841926574707, "global_step": 339666, "epoch": 2021} {"train_loss": -9.41466999053955, "global_step": 339667, "epoch": 2021} {"train_loss": -11.322229385375977, "global_step": 339668, "epoch": 2021} {"train_loss": -9.176490783691406, "global_step": 339669, "epoch": 2021} {"train_loss": -10.263151168823242, "global_step": 339670, "epoch": 2021} {"train_loss": -9.429106712341309, "global_step": 339671, "epoch": 2021} {"train_loss": -10.058120727539062, "global_step": 339672, "epoch": 2021} {"train_loss": -10.010110855102539, "global_step": 339673, "epoch": 2021} {"train_loss": -10.647510528564453, "global_step": 339674, "epoch": 2021} {"train_loss": -9.980415344238281, "global_step": 339675, "epoch": 2021} {"train_loss": -11.571874618530273, "global_step": 339676, "epoch": 2021} {"train_loss": -11.115585327148438, "global_step": 339677, "epoch": 2021} {"train_loss": -11.80614948272705, "global_step": 339678, "epoch": 2021} {"train_loss": -11.472075462341309, "global_step": 339679, "epoch": 2021} {"train_loss": -11.59835433959961, "global_step": 339680, "epoch": 2021} {"train_loss": -11.42113971710205, "global_step": 339681, "epoch": 2021} {"train_loss": -12.20120906829834, "global_step": 339682, "epoch": 2021} {"train_loss": -11.627761840820312, "global_step": 339683, "epoch": 2021} {"train_loss": -11.783103942871094, "global_step": 339684, "epoch": 2021} {"train_loss": -11.757676124572754, "global_step": 339685, "epoch": 2021} {"train_loss": -12.077373504638672, "global_step": 339686, "epoch": 2021} {"train_loss": -11.589730262756348, "global_step": 339687, "epoch": 2021} {"train_loss": -11.787320137023926, "global_step": 339688, "epoch": 2021} {"train_loss": -11.962623596191406, "global_step": 339689, "epoch": 2021} {"train_loss": -11.913390159606934, "global_step": 339690, "epoch": 2021} {"train_loss": -12.046430587768555, "global_step": 339691, "epoch": 2021} {"train_loss": -12.085381507873535, "global_step": 339692, "epoch": 2021} {"train_loss": -12.017913818359375, "global_step": 339693, "epoch": 2021} {"train_loss": -12.052568435668945, "global_step": 339694, "epoch": 2021} {"train_loss": -11.670164568083626, "global_step": 339695, "epoch": 2021, "val_loss": 284628.0625} {"train_loss": -12.261635780334473, "global_step": 339696, "epoch": 2022} {"train_loss": -12.065774917602539, "global_step": 339697, "epoch": 2022} {"train_loss": -12.15162467956543, "global_step": 339698, "epoch": 2022} {"train_loss": -11.901247024536133, "global_step": 339699, "epoch": 2022} {"train_loss": -12.036144256591797, "global_step": 339700, "epoch": 2022} {"train_loss": -12.284502029418945, "global_step": 339701, "epoch": 2022} {"train_loss": -12.005003929138184, "global_step": 339702, "epoch": 2022} {"train_loss": -11.952279090881348, "global_step": 339703, "epoch": 2022} {"train_loss": -11.908792495727539, "global_step": 339704, "epoch": 2022} {"train_loss": -12.024950981140137, "global_step": 339705, "epoch": 2022} {"train_loss": -12.232259750366211, "global_step": 339706, "epoch": 2022} {"train_loss": -12.011606216430664, "global_step": 339707, "epoch": 2022} {"train_loss": -12.17546272277832, "global_step": 339708, "epoch": 2022} {"train_loss": -12.267498016357422, "global_step": 339709, "epoch": 2022} {"train_loss": -12.196813583374023, "global_step": 339710, "epoch": 2022} {"train_loss": -12.078877449035645, "global_step": 339711, "epoch": 2022} {"train_loss": -12.120370864868164, "global_step": 339712, "epoch": 2022} {"train_loss": -12.240340232849121, "global_step": 339713, "epoch": 2022} {"train_loss": -12.320609092712402, "global_step": 339714, "epoch": 2022} {"train_loss": -12.13119888305664, "global_step": 339715, "epoch": 2022} {"train_loss": -12.178215026855469, "global_step": 339716, "epoch": 2022} {"train_loss": -12.291961669921875, "global_step": 339717, "epoch": 2022} {"train_loss": -12.26005744934082, "global_step": 339718, "epoch": 2022} {"train_loss": -12.411303520202637, "global_step": 339719, "epoch": 2022} {"train_loss": -12.27787971496582, "global_step": 339720, "epoch": 2022} {"train_loss": -12.319242477416992, "global_step": 339721, "epoch": 2022} {"train_loss": -12.457452774047852, "global_step": 339722, "epoch": 2022} {"train_loss": -12.191082000732422, "global_step": 339723, "epoch": 2022} {"train_loss": -12.653292655944824, "global_step": 339724, "epoch": 2022} {"train_loss": -12.418767929077148, "global_step": 339725, "epoch": 2022} {"train_loss": -12.449516296386719, "global_step": 339726, "epoch": 2022} {"train_loss": -12.347152709960938, "global_step": 339727, "epoch": 2022} {"train_loss": -12.092700958251953, "global_step": 339728, "epoch": 2022} {"train_loss": -12.493663787841797, "global_step": 339729, "epoch": 2022} {"train_loss": -12.439275741577148, "global_step": 339730, "epoch": 2022} {"train_loss": -12.302299499511719, "global_step": 339731, "epoch": 2022} {"train_loss": -12.384591102600098, "global_step": 339732, "epoch": 2022} {"train_loss": -12.19401741027832, "global_step": 339733, "epoch": 2022} {"train_loss": -12.62130069732666, "global_step": 339734, "epoch": 2022} {"train_loss": -11.996031761169434, "global_step": 339735, "epoch": 2022} {"train_loss": -11.986360549926758, "global_step": 339736, "epoch": 2022} {"train_loss": -12.350889205932617, "global_step": 339737, "epoch": 2022} {"train_loss": -12.051765441894531, "global_step": 339738, "epoch": 2022} {"train_loss": -10.7940673828125, "global_step": 339739, "epoch": 2022} {"train_loss": -10.448554992675781, "global_step": 339740, "epoch": 2022} {"train_loss": -11.546027183532715, "global_step": 339741, "epoch": 2022} {"train_loss": -10.963834762573242, "global_step": 339742, "epoch": 2022} {"train_loss": -7.870122909545898, "global_step": 339743, "epoch": 2022} {"train_loss": -8.951878547668457, "global_step": 339744, "epoch": 2022} {"train_loss": -10.74209976196289, "global_step": 339745, "epoch": 2022} {"train_loss": -11.491827964782715, "global_step": 339746, "epoch": 2022} {"train_loss": -10.502954483032227, "global_step": 339747, "epoch": 2022} {"train_loss": -12.180570602416992, "global_step": 339748, "epoch": 2022} {"train_loss": -10.426399230957031, "global_step": 339749, "epoch": 2022} {"train_loss": -11.843912124633789, "global_step": 339750, "epoch": 2022} {"train_loss": -10.904800415039062, "global_step": 339751, "epoch": 2022} {"train_loss": -11.15745735168457, "global_step": 339752, "epoch": 2022} {"train_loss": -11.28350830078125, "global_step": 339753, "epoch": 2022} {"train_loss": -10.180386543273926, "global_step": 339754, "epoch": 2022} {"train_loss": -9.601934432983398, "global_step": 339755, "epoch": 2022} {"train_loss": -11.935558319091797, "global_step": 339756, "epoch": 2022} {"train_loss": -9.589508056640625, "global_step": 339757, "epoch": 2022} {"train_loss": -11.90301513671875, "global_step": 339758, "epoch": 2022} {"train_loss": -9.848155975341797, "global_step": 339759, "epoch": 2022} {"train_loss": -11.311567306518555, "global_step": 339760, "epoch": 2022} {"train_loss": -11.346410751342773, "global_step": 339761, "epoch": 2022} {"train_loss": -10.900330543518066, "global_step": 339762, "epoch": 2022} {"train_loss": -11.459351539611816, "global_step": 339763, "epoch": 2022} {"train_loss": -10.599416732788086, "global_step": 339764, "epoch": 2022} {"train_loss": -12.210372924804688, "global_step": 339765, "epoch": 2022} {"train_loss": -11.208719253540039, "global_step": 339766, "epoch": 2022} {"train_loss": -10.826423645019531, "global_step": 339767, "epoch": 2022} {"train_loss": -12.065357208251953, "global_step": 339768, "epoch": 2022} {"train_loss": -11.02778434753418, "global_step": 339769, "epoch": 2022} {"train_loss": -11.70288372039795, "global_step": 339770, "epoch": 2022} {"train_loss": -11.751721382141113, "global_step": 339771, "epoch": 2022} {"train_loss": -11.303973197937012, "global_step": 339772, "epoch": 2022} {"train_loss": -11.735444068908691, "global_step": 339773, "epoch": 2022} {"train_loss": -11.279145240783691, "global_step": 339774, "epoch": 2022} {"train_loss": -11.323240280151367, "global_step": 339775, "epoch": 2022} {"train_loss": -11.881585121154785, "global_step": 339776, "epoch": 2022} {"train_loss": -10.752975463867188, "global_step": 339777, "epoch": 2022} {"train_loss": -11.254962921142578, "global_step": 339778, "epoch": 2022} {"train_loss": -12.217905044555664, "global_step": 339779, "epoch": 2022} {"train_loss": -11.174798965454102, "global_step": 339780, "epoch": 2022} {"train_loss": -11.708914756774902, "global_step": 339781, "epoch": 2022} {"train_loss": -11.583215713500977, "global_step": 339782, "epoch": 2022} {"train_loss": -11.392206192016602, "global_step": 339783, "epoch": 2022} {"train_loss": -11.472145080566406, "global_step": 339784, "epoch": 2022} {"train_loss": -10.900696754455566, "global_step": 339785, "epoch": 2022} {"train_loss": -11.247087478637695, "global_step": 339786, "epoch": 2022} {"train_loss": -11.559371948242188, "global_step": 339787, "epoch": 2022} {"train_loss": -11.997455596923828, "global_step": 339788, "epoch": 2022} {"train_loss": -11.128896713256836, "global_step": 339789, "epoch": 2022} {"train_loss": -12.288984298706055, "global_step": 339790, "epoch": 2022} {"train_loss": -11.508501052856445, "global_step": 339791, "epoch": 2022} {"train_loss": -12.063643455505371, "global_step": 339792, "epoch": 2022} {"train_loss": -11.694070816040039, "global_step": 339793, "epoch": 2022} {"train_loss": -11.95849609375, "global_step": 339794, "epoch": 2022} {"train_loss": -12.005949020385742, "global_step": 339795, "epoch": 2022} {"train_loss": -12.106295585632324, "global_step": 339796, "epoch": 2022} {"train_loss": -11.901507377624512, "global_step": 339797, "epoch": 2022} {"train_loss": -12.327855110168457, "global_step": 339798, "epoch": 2022} {"train_loss": -12.079721450805664, "global_step": 339799, "epoch": 2022} {"train_loss": -11.977261543273926, "global_step": 339800, "epoch": 2022} {"train_loss": -12.385136604309082, "global_step": 339801, "epoch": 2022} {"train_loss": -12.257760047912598, "global_step": 339802, "epoch": 2022} {"train_loss": -12.288403511047363, "global_step": 339803, "epoch": 2022} {"train_loss": -12.230384826660156, "global_step": 339804, "epoch": 2022} {"train_loss": -12.061232566833496, "global_step": 339805, "epoch": 2022} {"train_loss": -12.127985000610352, "global_step": 339806, "epoch": 2022} {"train_loss": -12.312747955322266, "global_step": 339807, "epoch": 2022} {"train_loss": -12.100425720214844, "global_step": 339808, "epoch": 2022} {"train_loss": -12.044124603271484, "global_step": 339809, "epoch": 2022} {"train_loss": -12.320184707641602, "global_step": 339810, "epoch": 2022} {"train_loss": -11.696349143981934, "global_step": 339811, "epoch": 2022} {"train_loss": -12.186717987060547, "global_step": 339812, "epoch": 2022} {"train_loss": -11.651664733886719, "global_step": 339813, "epoch": 2022} {"train_loss": -11.992712020874023, "global_step": 339814, "epoch": 2022} {"train_loss": -11.934181213378906, "global_step": 339815, "epoch": 2022} {"train_loss": -12.03066635131836, "global_step": 339816, "epoch": 2022} {"train_loss": -11.718130111694336, "global_step": 339817, "epoch": 2022} {"train_loss": -12.185380935668945, "global_step": 339818, "epoch": 2022} {"train_loss": -11.791494369506836, "global_step": 339819, "epoch": 2022} {"train_loss": -12.096848487854004, "global_step": 339820, "epoch": 2022} {"train_loss": -11.871400833129883, "global_step": 339821, "epoch": 2022} {"train_loss": -12.348670959472656, "global_step": 339822, "epoch": 2022} {"train_loss": -11.982486724853516, "global_step": 339823, "epoch": 2022} {"train_loss": -12.363401412963867, "global_step": 339824, "epoch": 2022} {"train_loss": -12.020922660827637, "global_step": 339825, "epoch": 2022} {"train_loss": -12.402334213256836, "global_step": 339826, "epoch": 2022} {"train_loss": -12.214496612548828, "global_step": 339827, "epoch": 2022} {"train_loss": -12.338155746459961, "global_step": 339828, "epoch": 2022} {"train_loss": -12.274101257324219, "global_step": 339829, "epoch": 2022} {"train_loss": -12.460412979125977, "global_step": 339830, "epoch": 2022} {"train_loss": -12.304153442382812, "global_step": 339831, "epoch": 2022} {"train_loss": -12.464715957641602, "global_step": 339832, "epoch": 2022} {"train_loss": -12.392494201660156, "global_step": 339833, "epoch": 2022} {"train_loss": -12.281892776489258, "global_step": 339834, "epoch": 2022} {"train_loss": -12.264674186706543, "global_step": 339835, "epoch": 2022} {"train_loss": -12.20136833190918, "global_step": 339836, "epoch": 2022} {"train_loss": -12.20372200012207, "global_step": 339837, "epoch": 2022} {"train_loss": -12.182056427001953, "global_step": 339838, "epoch": 2022} {"train_loss": -12.294855117797852, "global_step": 339839, "epoch": 2022} {"train_loss": -12.43615436553955, "global_step": 339840, "epoch": 2022} {"train_loss": -12.348129272460938, "global_step": 339841, "epoch": 2022} {"train_loss": -12.452899932861328, "global_step": 339842, "epoch": 2022} {"train_loss": -12.244220733642578, "global_step": 339843, "epoch": 2022} {"train_loss": -12.421662330627441, "global_step": 339844, "epoch": 2022} {"train_loss": -12.294782638549805, "global_step": 339845, "epoch": 2022} {"train_loss": -12.451605796813965, "global_step": 339846, "epoch": 2022} {"train_loss": -12.316533088684082, "global_step": 339847, "epoch": 2022} {"train_loss": -12.56521224975586, "global_step": 339848, "epoch": 2022} {"train_loss": -12.618867874145508, "global_step": 339849, "epoch": 2022} {"train_loss": -12.487813949584961, "global_step": 339850, "epoch": 2022} {"train_loss": -12.619428634643555, "global_step": 339851, "epoch": 2022} {"train_loss": -12.396045684814453, "global_step": 339852, "epoch": 2022} {"train_loss": -12.481800079345703, "global_step": 339853, "epoch": 2022} {"train_loss": -12.4600830078125, "global_step": 339854, "epoch": 2022} {"train_loss": -12.217361450195312, "global_step": 339855, "epoch": 2022} {"train_loss": -12.289825439453125, "global_step": 339856, "epoch": 2022} {"train_loss": -12.629960060119629, "global_step": 339857, "epoch": 2022} {"train_loss": -12.541666030883789, "global_step": 339858, "epoch": 2022} {"train_loss": -12.673283576965332, "global_step": 339859, "epoch": 2022} {"train_loss": -12.7228422164917, "global_step": 339860, "epoch": 2022} {"train_loss": -12.668478965759277, "global_step": 339861, "epoch": 2022} {"train_loss": -12.654468536376953, "global_step": 339862, "epoch": 2022} {"train_loss": -11.891520687511989, "global_step": 339863, "epoch": 2022, "val_loss": 280273.625} {"train_loss": -12.516029357910156, "global_step": 339864, "epoch": 2023} {"train_loss": -12.369474411010742, "global_step": 339865, "epoch": 2023} {"train_loss": -12.36509895324707, "global_step": 339866, "epoch": 2023} {"train_loss": -12.713750839233398, "global_step": 339867, "epoch": 2023} {"train_loss": -12.464381217956543, "global_step": 339868, "epoch": 2023} {"train_loss": -12.574175834655762, "global_step": 339869, "epoch": 2023} {"train_loss": -12.588346481323242, "global_step": 339870, "epoch": 2023} {"train_loss": -12.490280151367188, "global_step": 339871, "epoch": 2023} {"train_loss": -11.939530372619629, "global_step": 339872, "epoch": 2023} {"train_loss": -12.41871452331543, "global_step": 339873, "epoch": 2023} {"train_loss": -12.278852462768555, "global_step": 339874, "epoch": 2023} {"train_loss": -12.45004653930664, "global_step": 339875, "epoch": 2023} {"train_loss": -12.449806213378906, "global_step": 339876, "epoch": 2023} {"train_loss": -11.943267822265625, "global_step": 339877, "epoch": 2023} {"train_loss": -12.147052764892578, "global_step": 339878, "epoch": 2023} {"train_loss": -11.959634780883789, "global_step": 339879, "epoch": 2023} {"train_loss": -12.039010047912598, "global_step": 339880, "epoch": 2023} {"train_loss": -12.389083862304688, "global_step": 339881, "epoch": 2023} {"train_loss": -11.898104667663574, "global_step": 339882, "epoch": 2023} {"train_loss": -11.28860855102539, "global_step": 339883, "epoch": 2023} {"train_loss": -11.951187133789062, "global_step": 339884, "epoch": 2023} {"train_loss": -12.469980239868164, "global_step": 339885, "epoch": 2023} {"train_loss": -12.159440040588379, "global_step": 339886, "epoch": 2023} {"train_loss": -11.726778030395508, "global_step": 339887, "epoch": 2023} {"train_loss": -11.786409378051758, "global_step": 339888, "epoch": 2023} {"train_loss": -12.083663940429688, "global_step": 339889, "epoch": 2023} {"train_loss": -12.162001609802246, "global_step": 339890, "epoch": 2023} {"train_loss": -10.906362533569336, "global_step": 339891, "epoch": 2023} {"train_loss": -11.61044692993164, "global_step": 339892, "epoch": 2023} {"train_loss": -10.946297645568848, "global_step": 339893, "epoch": 2023} {"train_loss": -11.695634841918945, "global_step": 339894, "epoch": 2023} {"train_loss": -11.135544776916504, "global_step": 339895, "epoch": 2023} {"train_loss": -11.70823860168457, "global_step": 339896, "epoch": 2023} {"train_loss": -11.313004493713379, "global_step": 339897, "epoch": 2023} {"train_loss": -11.266407012939453, "global_step": 339898, "epoch": 2023} {"train_loss": -8.97120475769043, "global_step": 339899, "epoch": 2023} {"train_loss": -9.705942153930664, "global_step": 339900, "epoch": 2023} {"train_loss": -10.717440605163574, "global_step": 339901, "epoch": 2023} {"train_loss": -9.50065803527832, "global_step": 339902, "epoch": 2023} {"train_loss": -10.02291488647461, "global_step": 339903, "epoch": 2023} {"train_loss": -8.56717300415039, "global_step": 339904, "epoch": 2023} {"train_loss": -6.602015018463135, "global_step": 339905, "epoch": 2023} {"train_loss": -7.480818748474121, "global_step": 339906, "epoch": 2023} {"train_loss": -7.137060642242432, "global_step": 339907, "epoch": 2023} {"train_loss": -7.398189544677734, "global_step": 339908, "epoch": 2023} {"train_loss": -8.923117637634277, "global_step": 339909, "epoch": 2023} {"train_loss": -8.508180618286133, "global_step": 339910, "epoch": 2023} {"train_loss": -8.926401138305664, "global_step": 339911, "epoch": 2023} {"train_loss": -8.243886947631836, "global_step": 339912, "epoch": 2023} {"train_loss": -8.764861106872559, "global_step": 339913, "epoch": 2023} {"train_loss": -9.726212501525879, "global_step": 339914, "epoch": 2023} {"train_loss": -10.236503601074219, "global_step": 339915, "epoch": 2023} {"train_loss": -10.03610897064209, "global_step": 339916, "epoch": 2023} {"train_loss": -10.528066635131836, "global_step": 339917, "epoch": 2023} {"train_loss": -10.12968635559082, "global_step": 339918, "epoch": 2023} {"train_loss": -10.021199226379395, "global_step": 339919, "epoch": 2023} {"train_loss": -10.37972640991211, "global_step": 339920, "epoch": 2023} {"train_loss": -10.573665618896484, "global_step": 339921, "epoch": 2023} {"train_loss": -9.883995056152344, "global_step": 339922, "epoch": 2023} {"train_loss": -9.80508804321289, "global_step": 339923, "epoch": 2023} {"train_loss": -11.044214248657227, "global_step": 339924, "epoch": 2023} {"train_loss": -9.653243064880371, "global_step": 339925, "epoch": 2023} {"train_loss": -9.774720191955566, "global_step": 339926, "epoch": 2023} {"train_loss": -10.704744338989258, "global_step": 339927, "epoch": 2023} {"train_loss": -11.57538890838623, "global_step": 339928, "epoch": 2023} {"train_loss": -10.10517692565918, "global_step": 339929, "epoch": 2023} {"train_loss": -10.791425704956055, "global_step": 339930, "epoch": 2023} {"train_loss": -10.741283416748047, "global_step": 339931, "epoch": 2023} {"train_loss": -10.86461353302002, "global_step": 339932, "epoch": 2023} {"train_loss": -10.991250991821289, "global_step": 339933, "epoch": 2023} {"train_loss": -11.377375602722168, "global_step": 339934, "epoch": 2023} {"train_loss": -10.479997634887695, "global_step": 339935, "epoch": 2023} {"train_loss": -11.893436431884766, "global_step": 339936, "epoch": 2023} {"train_loss": -10.98484992980957, "global_step": 339937, "epoch": 2023} {"train_loss": -11.400522232055664, "global_step": 339938, "epoch": 2023} {"train_loss": -11.683209419250488, "global_step": 339939, "epoch": 2023} {"train_loss": -11.435376167297363, "global_step": 339940, "epoch": 2023} {"train_loss": -11.030208587646484, "global_step": 339941, "epoch": 2023} {"train_loss": -11.8420991897583, "global_step": 339942, "epoch": 2023} {"train_loss": -11.110332489013672, "global_step": 339943, "epoch": 2023} {"train_loss": -11.176361083984375, "global_step": 339944, "epoch": 2023} {"train_loss": -11.83088493347168, "global_step": 339945, "epoch": 2023} {"train_loss": -11.220312118530273, "global_step": 339946, "epoch": 2023} {"train_loss": -11.291667938232422, "global_step": 339947, "epoch": 2023} {"train_loss": -11.779746055603027, "global_step": 339948, "epoch": 2023} {"train_loss": -11.203615188598633, "global_step": 339949, "epoch": 2023} {"train_loss": -11.61181926727295, "global_step": 339950, "epoch": 2023} {"train_loss": -11.583490371704102, "global_step": 339951, "epoch": 2023} {"train_loss": -11.467157363891602, "global_step": 339952, "epoch": 2023} {"train_loss": -11.661659240722656, "global_step": 339953, "epoch": 2023} {"train_loss": -12.211252212524414, "global_step": 339954, "epoch": 2023} {"train_loss": -11.559528350830078, "global_step": 339955, "epoch": 2023} {"train_loss": -12.060863494873047, "global_step": 339956, "epoch": 2023} {"train_loss": -11.806538581848145, "global_step": 339957, "epoch": 2023} {"train_loss": -12.009902954101562, "global_step": 339958, "epoch": 2023} {"train_loss": -11.773283004760742, "global_step": 339959, "epoch": 2023} {"train_loss": -12.103382110595703, "global_step": 339960, "epoch": 2023} {"train_loss": -11.810358047485352, "global_step": 339961, "epoch": 2023} {"train_loss": -11.947710037231445, "global_step": 339962, "epoch": 2023} {"train_loss": -11.862103462219238, "global_step": 339963, "epoch": 2023} {"train_loss": -11.99490737915039, "global_step": 339964, "epoch": 2023} {"train_loss": -12.179380416870117, "global_step": 339965, "epoch": 2023} {"train_loss": -12.128564834594727, "global_step": 339966, "epoch": 2023} {"train_loss": -12.075271606445312, "global_step": 339967, "epoch": 2023} {"train_loss": -12.187593460083008, "global_step": 339968, "epoch": 2023} {"train_loss": -12.12849235534668, "global_step": 339969, "epoch": 2023} {"train_loss": -12.048664093017578, "global_step": 339970, "epoch": 2023} {"train_loss": -12.32235050201416, "global_step": 339971, "epoch": 2023} {"train_loss": -12.07497787475586, "global_step": 339972, "epoch": 2023} {"train_loss": -11.929317474365234, "global_step": 339973, "epoch": 2023} {"train_loss": -12.396925926208496, "global_step": 339974, "epoch": 2023} {"train_loss": -12.191003799438477, "global_step": 339975, "epoch": 2023} {"train_loss": -12.061378479003906, "global_step": 339976, "epoch": 2023} {"train_loss": -12.357807159423828, "global_step": 339977, "epoch": 2023} {"train_loss": -12.359685897827148, "global_step": 339978, "epoch": 2023} {"train_loss": -12.330551147460938, "global_step": 339979, "epoch": 2023} {"train_loss": -12.210578918457031, "global_step": 339980, "epoch": 2023} {"train_loss": -12.414504051208496, "global_step": 339981, "epoch": 2023} {"train_loss": -12.40660572052002, "global_step": 339982, "epoch": 2023} {"train_loss": -12.275350570678711, "global_step": 339983, "epoch": 2023} {"train_loss": -12.385961532592773, "global_step": 339984, "epoch": 2023} {"train_loss": -12.431243896484375, "global_step": 339985, "epoch": 2023} {"train_loss": -12.39166259765625, "global_step": 339986, "epoch": 2023} {"train_loss": -12.375259399414062, "global_step": 339987, "epoch": 2023} {"train_loss": -12.233126640319824, "global_step": 339988, "epoch": 2023} {"train_loss": -12.43285083770752, "global_step": 339989, "epoch": 2023} {"train_loss": -12.37967300415039, "global_step": 339990, "epoch": 2023} {"train_loss": -12.331968307495117, "global_step": 339991, "epoch": 2023} {"train_loss": -12.444303512573242, "global_step": 339992, "epoch": 2023} {"train_loss": -12.120347023010254, "global_step": 339993, "epoch": 2023} {"train_loss": -12.527308464050293, "global_step": 339994, "epoch": 2023} {"train_loss": -12.362222671508789, "global_step": 339995, "epoch": 2023} {"train_loss": -12.536430358886719, "global_step": 339996, "epoch": 2023} {"train_loss": -12.412885665893555, "global_step": 339997, "epoch": 2023} {"train_loss": -12.31900691986084, "global_step": 339998, "epoch": 2023} {"train_loss": -12.382758140563965, "global_step": 339999, "epoch": 2023} {"train_loss": -12.392560958862305, "global_step": 340000, "epoch": 2023} {"train_loss": -12.345682144165039, "global_step": 340001, "epoch": 2023} {"train_loss": -12.201997756958008, "global_step": 340002, "epoch": 2023} {"train_loss": -12.270477294921875, "global_step": 340003, "epoch": 2023} {"train_loss": -12.10218334197998, "global_step": 340004, "epoch": 2023} {"train_loss": -12.21810531616211, "global_step": 340005, "epoch": 2023} {"train_loss": -12.319601058959961, "global_step": 340006, "epoch": 2023} {"train_loss": -12.365898132324219, "global_step": 340007, "epoch": 2023} {"train_loss": -12.384878158569336, "global_step": 340008, "epoch": 2023} {"train_loss": -12.436614990234375, "global_step": 340009, "epoch": 2023} {"train_loss": -12.333057403564453, "global_step": 340010, "epoch": 2023} {"train_loss": -12.668156623840332, "global_step": 340011, "epoch": 2023} {"train_loss": -12.309213638305664, "global_step": 340012, "epoch": 2023} {"train_loss": -12.328773498535156, "global_step": 340013, "epoch": 2023} {"train_loss": -12.404685974121094, "global_step": 340014, "epoch": 2023} {"train_loss": -12.20097541809082, "global_step": 340015, "epoch": 2023} {"train_loss": -12.465814590454102, "global_step": 340016, "epoch": 2023} {"train_loss": -12.264692306518555, "global_step": 340017, "epoch": 2023} {"train_loss": -12.401973724365234, "global_step": 340018, "epoch": 2023} {"train_loss": -12.276498794555664, "global_step": 340019, "epoch": 2023} {"train_loss": -12.388052940368652, "global_step": 340020, "epoch": 2023} {"train_loss": -12.395200729370117, "global_step": 340021, "epoch": 2023} {"train_loss": -12.106550216674805, "global_step": 340022, "epoch": 2023} {"train_loss": -12.567317008972168, "global_step": 340023, "epoch": 2023} {"train_loss": -12.418718338012695, "global_step": 340024, "epoch": 2023} {"train_loss": -12.232540130615234, "global_step": 340025, "epoch": 2023} {"train_loss": -12.478861808776855, "global_step": 340026, "epoch": 2023} {"train_loss": -12.215651512145996, "global_step": 340027, "epoch": 2023} {"train_loss": -12.188210487365723, "global_step": 340028, "epoch": 2023} {"train_loss": -12.143756866455078, "global_step": 340029, "epoch": 2023} {"train_loss": -12.288827896118164, "global_step": 340030, "epoch": 2023} {"train_loss": -11.553952745028905, "global_step": 340031, "epoch": 2023, "val_loss": 280454.96875} {"train_loss": -12.373476028442383, "global_step": 340032, "epoch": 2024} {"train_loss": -12.177145957946777, "global_step": 340033, "epoch": 2024} {"train_loss": -12.034343719482422, "global_step": 340034, "epoch": 2024} {"train_loss": -12.421488761901855, "global_step": 340035, "epoch": 2024} {"train_loss": -12.282524108886719, "global_step": 340036, "epoch": 2024} {"train_loss": -11.987662315368652, "global_step": 340037, "epoch": 2024} {"train_loss": -12.46543025970459, "global_step": 340038, "epoch": 2024} {"train_loss": -12.164569854736328, "global_step": 340039, "epoch": 2024} {"train_loss": -12.322589874267578, "global_step": 340040, "epoch": 2024} {"train_loss": -11.854281425476074, "global_step": 340041, "epoch": 2024} {"train_loss": -12.121931076049805, "global_step": 340042, "epoch": 2024} {"train_loss": -12.272598266601562, "global_step": 340043, "epoch": 2024} {"train_loss": -12.47730541229248, "global_step": 340044, "epoch": 2024} {"train_loss": -12.2089262008667, "global_step": 340045, "epoch": 2024} {"train_loss": -12.166952133178711, "global_step": 340046, "epoch": 2024} {"train_loss": -12.120355606079102, "global_step": 340047, "epoch": 2024} {"train_loss": -11.430317878723145, "global_step": 340048, "epoch": 2024} {"train_loss": -11.131155014038086, "global_step": 340049, "epoch": 2024} {"train_loss": -12.293498992919922, "global_step": 340050, "epoch": 2024} {"train_loss": -12.12936782836914, "global_step": 340051, "epoch": 2024} {"train_loss": -12.29079818725586, "global_step": 340052, "epoch": 2024} {"train_loss": -12.448972702026367, "global_step": 340053, "epoch": 2024} {"train_loss": -12.555663108825684, "global_step": 340054, "epoch": 2024} {"train_loss": -12.385579109191895, "global_step": 340055, "epoch": 2024} {"train_loss": -12.374232292175293, "global_step": 340056, "epoch": 2024} {"train_loss": -12.61246109008789, "global_step": 340057, "epoch": 2024} {"train_loss": -12.444868087768555, "global_step": 340058, "epoch": 2024} {"train_loss": -12.563117980957031, "global_step": 340059, "epoch": 2024} {"train_loss": -12.58687973022461, "global_step": 340060, "epoch": 2024} {"train_loss": -12.536940574645996, "global_step": 340061, "epoch": 2024} {"train_loss": -12.052122116088867, "global_step": 340062, "epoch": 2024} {"train_loss": -12.28522777557373, "global_step": 340063, "epoch": 2024} {"train_loss": -12.511219024658203, "global_step": 340064, "epoch": 2024} {"train_loss": -12.369756698608398, "global_step": 340065, "epoch": 2024} {"train_loss": -11.861429214477539, "global_step": 340066, "epoch": 2024} {"train_loss": -11.978799819946289, "global_step": 340067, "epoch": 2024} {"train_loss": -11.788582801818848, "global_step": 340068, "epoch": 2024} {"train_loss": -12.391119956970215, "global_step": 340069, "epoch": 2024} {"train_loss": -12.356465339660645, "global_step": 340070, "epoch": 2024} {"train_loss": -12.100683212280273, "global_step": 340071, "epoch": 2024} {"train_loss": -11.741886138916016, "global_step": 340072, "epoch": 2024} {"train_loss": -12.370027542114258, "global_step": 340073, "epoch": 2024} {"train_loss": -12.294974327087402, "global_step": 340074, "epoch": 2024} {"train_loss": -12.602348327636719, "global_step": 340075, "epoch": 2024} {"train_loss": -12.265591621398926, "global_step": 340076, "epoch": 2024} {"train_loss": -11.253946304321289, "global_step": 340077, "epoch": 2024} {"train_loss": -11.659717559814453, "global_step": 340078, "epoch": 2024} {"train_loss": -12.697663307189941, "global_step": 340079, "epoch": 2024} {"train_loss": -11.765828132629395, "global_step": 340080, "epoch": 2024} {"train_loss": -11.626320838928223, "global_step": 340081, "epoch": 2024} {"train_loss": -11.736549377441406, "global_step": 340082, "epoch": 2024} {"train_loss": -12.274639129638672, "global_step": 340083, "epoch": 2024} {"train_loss": -11.770191192626953, "global_step": 340084, "epoch": 2024} {"train_loss": -11.469287872314453, "global_step": 340085, "epoch": 2024} {"train_loss": -12.350712776184082, "global_step": 340086, "epoch": 2024} {"train_loss": -12.171287536621094, "global_step": 340087, "epoch": 2024} {"train_loss": -11.574430465698242, "global_step": 340088, "epoch": 2024} {"train_loss": -11.656949996948242, "global_step": 340089, "epoch": 2024} {"train_loss": -12.404287338256836, "global_step": 340090, "epoch": 2024} {"train_loss": -11.156845092773438, "global_step": 340091, "epoch": 2024} {"train_loss": -11.470165252685547, "global_step": 340092, "epoch": 2024} {"train_loss": -12.253960609436035, "global_step": 340093, "epoch": 2024} {"train_loss": -12.148679733276367, "global_step": 340094, "epoch": 2024} {"train_loss": -11.435525894165039, "global_step": 340095, "epoch": 2024} {"train_loss": -11.648040771484375, "global_step": 340096, "epoch": 2024} {"train_loss": -12.128528594970703, "global_step": 340097, "epoch": 2024} {"train_loss": -11.596210479736328, "global_step": 340098, "epoch": 2024} {"train_loss": -11.683538436889648, "global_step": 340099, "epoch": 2024} {"train_loss": -11.694061279296875, "global_step": 340100, "epoch": 2024} {"train_loss": -12.360361099243164, "global_step": 340101, "epoch": 2024} {"train_loss": -11.912095069885254, "global_step": 340102, "epoch": 2024} {"train_loss": -12.209405899047852, "global_step": 340103, "epoch": 2024} {"train_loss": -12.357805252075195, "global_step": 340104, "epoch": 2024} {"train_loss": -12.301839828491211, "global_step": 340105, "epoch": 2024} {"train_loss": -11.830896377563477, "global_step": 340106, "epoch": 2024} {"train_loss": -11.742280960083008, "global_step": 340107, "epoch": 2024} {"train_loss": -11.419394493103027, "global_step": 340108, "epoch": 2024} {"train_loss": -12.215707778930664, "global_step": 340109, "epoch": 2024} {"train_loss": -12.51156997680664, "global_step": 340110, "epoch": 2024} {"train_loss": -12.202520370483398, "global_step": 340111, "epoch": 2024} {"train_loss": -12.072099685668945, "global_step": 340112, "epoch": 2024} {"train_loss": -11.744359970092773, "global_step": 340113, "epoch": 2024} {"train_loss": -12.159754753112793, "global_step": 340114, "epoch": 2024} {"train_loss": -12.282716751098633, "global_step": 340115, "epoch": 2024} {"train_loss": -12.24212646484375, "global_step": 340116, "epoch": 2024} {"train_loss": -11.89634895324707, "global_step": 340117, "epoch": 2024} {"train_loss": -12.327860832214355, "global_step": 340118, "epoch": 2024} {"train_loss": -11.88563060760498, "global_step": 340119, "epoch": 2024} {"train_loss": -11.948725700378418, "global_step": 340120, "epoch": 2024} {"train_loss": -11.508637428283691, "global_step": 340121, "epoch": 2024} {"train_loss": -12.426630020141602, "global_step": 340122, "epoch": 2024} {"train_loss": -11.918959617614746, "global_step": 340123, "epoch": 2024} {"train_loss": -12.398052215576172, "global_step": 340124, "epoch": 2024} {"train_loss": -12.322958946228027, "global_step": 340125, "epoch": 2024} {"train_loss": -12.111246109008789, "global_step": 340126, "epoch": 2024} {"train_loss": -12.41010570526123, "global_step": 340127, "epoch": 2024} {"train_loss": -11.840328216552734, "global_step": 340128, "epoch": 2024} {"train_loss": -11.754276275634766, "global_step": 340129, "epoch": 2024} {"train_loss": -12.169490814208984, "global_step": 340130, "epoch": 2024} {"train_loss": -12.188206672668457, "global_step": 340131, "epoch": 2024} {"train_loss": -11.815771102905273, "global_step": 340132, "epoch": 2024} {"train_loss": -12.241744995117188, "global_step": 340133, "epoch": 2024} {"train_loss": -11.654476165771484, "global_step": 340134, "epoch": 2024} {"train_loss": -11.919267654418945, "global_step": 340135, "epoch": 2024} {"train_loss": -12.332437515258789, "global_step": 340136, "epoch": 2024} {"train_loss": -11.852951049804688, "global_step": 340137, "epoch": 2024} {"train_loss": -12.095754623413086, "global_step": 340138, "epoch": 2024} {"train_loss": -12.347829818725586, "global_step": 340139, "epoch": 2024} {"train_loss": -11.902227401733398, "global_step": 340140, "epoch": 2024} {"train_loss": -12.303378105163574, "global_step": 340141, "epoch": 2024} {"train_loss": -12.098699569702148, "global_step": 340142, "epoch": 2024} {"train_loss": -12.157299995422363, "global_step": 340143, "epoch": 2024} {"train_loss": -12.054483413696289, "global_step": 340144, "epoch": 2024} {"train_loss": -12.158088684082031, "global_step": 340145, "epoch": 2024} {"train_loss": -11.981969833374023, "global_step": 340146, "epoch": 2024} {"train_loss": -12.152348518371582, "global_step": 340147, "epoch": 2024} {"train_loss": -11.766708374023438, "global_step": 340148, "epoch": 2024} {"train_loss": -12.096587181091309, "global_step": 340149, "epoch": 2024} {"train_loss": -11.876846313476562, "global_step": 340150, "epoch": 2024} {"train_loss": -11.476993560791016, "global_step": 340151, "epoch": 2024} {"train_loss": -12.294970512390137, "global_step": 340152, "epoch": 2024} {"train_loss": -11.858763694763184, "global_step": 340153, "epoch": 2024} {"train_loss": -11.564650535583496, "global_step": 340154, "epoch": 2024} {"train_loss": -11.967901229858398, "global_step": 340155, "epoch": 2024} {"train_loss": -11.429976463317871, "global_step": 340156, "epoch": 2024} {"train_loss": -11.98099136352539, "global_step": 340157, "epoch": 2024} {"train_loss": -11.801926612854004, "global_step": 340158, "epoch": 2024} {"train_loss": -12.112142562866211, "global_step": 340159, "epoch": 2024} {"train_loss": -12.244409561157227, "global_step": 340160, "epoch": 2024} {"train_loss": -11.87203311920166, "global_step": 340161, "epoch": 2024} {"train_loss": -12.005459785461426, "global_step": 340162, "epoch": 2024} {"train_loss": -11.959484100341797, "global_step": 340163, "epoch": 2024} {"train_loss": -11.324019432067871, "global_step": 340164, "epoch": 2024} {"train_loss": -12.245004653930664, "global_step": 340165, "epoch": 2024} {"train_loss": -12.023868560791016, "global_step": 340166, "epoch": 2024} {"train_loss": -10.43393325805664, "global_step": 340167, "epoch": 2024} {"train_loss": -11.117667198181152, "global_step": 340168, "epoch": 2024} {"train_loss": -12.449844360351562, "global_step": 340169, "epoch": 2024} {"train_loss": -10.721749305725098, "global_step": 340170, "epoch": 2024} {"train_loss": -11.202512741088867, "global_step": 340171, "epoch": 2024} {"train_loss": -11.672035217285156, "global_step": 340172, "epoch": 2024} {"train_loss": -11.686201095581055, "global_step": 340173, "epoch": 2024} {"train_loss": -12.09897518157959, "global_step": 340174, "epoch": 2024} {"train_loss": -11.781803131103516, "global_step": 340175, "epoch": 2024} {"train_loss": -12.401771545410156, "global_step": 340176, "epoch": 2024} {"train_loss": -11.961894989013672, "global_step": 340177, "epoch": 2024} {"train_loss": -12.268464088439941, "global_step": 340178, "epoch": 2024} {"train_loss": -12.284369468688965, "global_step": 340179, "epoch": 2024} {"train_loss": -11.826435089111328, "global_step": 340180, "epoch": 2024} {"train_loss": -12.41066837310791, "global_step": 340181, "epoch": 2024} {"train_loss": -11.81052017211914, "global_step": 340182, "epoch": 2024} {"train_loss": -12.437287330627441, "global_step": 340183, "epoch": 2024} {"train_loss": -12.088993072509766, "global_step": 340184, "epoch": 2024} {"train_loss": -12.120999336242676, "global_step": 340185, "epoch": 2024} {"train_loss": -12.061454772949219, "global_step": 340186, "epoch": 2024} {"train_loss": -12.007303237915039, "global_step": 340187, "epoch": 2024} {"train_loss": -12.145551681518555, "global_step": 340188, "epoch": 2024} {"train_loss": -12.228304862976074, "global_step": 340189, "epoch": 2024} {"train_loss": -11.928817749023438, "global_step": 340190, "epoch": 2024} {"train_loss": -12.02928352355957, "global_step": 340191, "epoch": 2024} {"train_loss": -11.97360610961914, "global_step": 340192, "epoch": 2024} {"train_loss": -12.182655334472656, "global_step": 340193, "epoch": 2024} {"train_loss": -12.06730842590332, "global_step": 340194, "epoch": 2024} {"train_loss": -12.338563919067383, "global_step": 340195, "epoch": 2024} {"train_loss": -12.176280975341797, "global_step": 340196, "epoch": 2024} {"train_loss": -12.3931884765625, "global_step": 340197, "epoch": 2024} {"train_loss": -12.40011978149414, "global_step": 340198, "epoch": 2024} {"train_loss": -12.036519868033272, "global_step": 340199, "epoch": 2024, "val_loss": 279577.46875} {"train_loss": -12.29502010345459, "global_step": 340200, "epoch": 2025} {"train_loss": -12.252754211425781, "global_step": 340201, "epoch": 2025} {"train_loss": -12.314535140991211, "global_step": 340202, "epoch": 2025} {"train_loss": -12.291618347167969, "global_step": 340203, "epoch": 2025} {"train_loss": -12.416561126708984, "global_step": 340204, "epoch": 2025} {"train_loss": -12.21010971069336, "global_step": 340205, "epoch": 2025} {"train_loss": -11.912555694580078, "global_step": 340206, "epoch": 2025} {"train_loss": -11.673745155334473, "global_step": 340207, "epoch": 2025} {"train_loss": -12.389995574951172, "global_step": 340208, "epoch": 2025} {"train_loss": -12.061878204345703, "global_step": 340209, "epoch": 2025} {"train_loss": -11.537862777709961, "global_step": 340210, "epoch": 2025} {"train_loss": -12.30782699584961, "global_step": 340211, "epoch": 2025} {"train_loss": -10.744632720947266, "global_step": 340212, "epoch": 2025} {"train_loss": -10.510190963745117, "global_step": 340213, "epoch": 2025} {"train_loss": -12.427987098693848, "global_step": 340214, "epoch": 2025} {"train_loss": -10.910585403442383, "global_step": 340215, "epoch": 2025} {"train_loss": -11.432451248168945, "global_step": 340216, "epoch": 2025} {"train_loss": -11.601222038269043, "global_step": 340217, "epoch": 2025} {"train_loss": -11.405425071716309, "global_step": 340218, "epoch": 2025} {"train_loss": -11.35422134399414, "global_step": 340219, "epoch": 2025} {"train_loss": -12.312234878540039, "global_step": 340220, "epoch": 2025} {"train_loss": -11.563982963562012, "global_step": 340221, "epoch": 2025} {"train_loss": -12.018888473510742, "global_step": 340222, "epoch": 2025} {"train_loss": -12.179716110229492, "global_step": 340223, "epoch": 2025} {"train_loss": -11.07211685180664, "global_step": 340224, "epoch": 2025} {"train_loss": -12.24421215057373, "global_step": 340225, "epoch": 2025} {"train_loss": -10.618407249450684, "global_step": 340226, "epoch": 2025} {"train_loss": -11.398505210876465, "global_step": 340227, "epoch": 2025} {"train_loss": -11.713696479797363, "global_step": 340228, "epoch": 2025} {"train_loss": -11.89647102355957, "global_step": 340229, "epoch": 2025} {"train_loss": -11.591684341430664, "global_step": 340230, "epoch": 2025} {"train_loss": -11.449459075927734, "global_step": 340231, "epoch": 2025} {"train_loss": -10.784725189208984, "global_step": 340232, "epoch": 2025} {"train_loss": -11.298046112060547, "global_step": 340233, "epoch": 2025} {"train_loss": -11.242727279663086, "global_step": 340234, "epoch": 2025} {"train_loss": -11.15092945098877, "global_step": 340235, "epoch": 2025} {"train_loss": -11.322803497314453, "global_step": 340236, "epoch": 2025} {"train_loss": -10.508443832397461, "global_step": 340237, "epoch": 2025} {"train_loss": -11.738933563232422, "global_step": 340238, "epoch": 2025} {"train_loss": -9.959023475646973, "global_step": 340239, "epoch": 2025} {"train_loss": -11.657316207885742, "global_step": 340240, "epoch": 2025} {"train_loss": -10.320499420166016, "global_step": 340241, "epoch": 2025} {"train_loss": -11.603921890258789, "global_step": 340242, "epoch": 2025} {"train_loss": -10.867331504821777, "global_step": 340243, "epoch": 2025} {"train_loss": -11.444730758666992, "global_step": 340244, "epoch": 2025} {"train_loss": -11.431694030761719, "global_step": 340245, "epoch": 2025} {"train_loss": -11.194320678710938, "global_step": 340246, "epoch": 2025} {"train_loss": -11.728710174560547, "global_step": 340247, "epoch": 2025} {"train_loss": -10.84830093383789, "global_step": 340248, "epoch": 2025} {"train_loss": -12.14643383026123, "global_step": 340249, "epoch": 2025} {"train_loss": -10.976014137268066, "global_step": 340250, "epoch": 2025} {"train_loss": -11.841485977172852, "global_step": 340251, "epoch": 2025} {"train_loss": -11.93464469909668, "global_step": 340252, "epoch": 2025} {"train_loss": -11.533594131469727, "global_step": 340253, "epoch": 2025} {"train_loss": -11.979446411132812, "global_step": 340254, "epoch": 2025} {"train_loss": -11.489728927612305, "global_step": 340255, "epoch": 2025} {"train_loss": -12.153883934020996, "global_step": 340256, "epoch": 2025} {"train_loss": -12.01115894317627, "global_step": 340257, "epoch": 2025} {"train_loss": -11.451115608215332, "global_step": 340258, "epoch": 2025} {"train_loss": -12.099601745605469, "global_step": 340259, "epoch": 2025} {"train_loss": -11.521061897277832, "global_step": 340260, "epoch": 2025} {"train_loss": -11.737529754638672, "global_step": 340261, "epoch": 2025} {"train_loss": -11.972140312194824, "global_step": 340262, "epoch": 2025} {"train_loss": -11.696704864501953, "global_step": 340263, "epoch": 2025} {"train_loss": -12.334287643432617, "global_step": 340264, "epoch": 2025} {"train_loss": -11.96613883972168, "global_step": 340265, "epoch": 2025} {"train_loss": -11.823360443115234, "global_step": 340266, "epoch": 2025} {"train_loss": -12.210948944091797, "global_step": 340267, "epoch": 2025} {"train_loss": -11.672174453735352, "global_step": 340268, "epoch": 2025} {"train_loss": -12.081609725952148, "global_step": 340269, "epoch": 2025} {"train_loss": -12.18154239654541, "global_step": 340270, "epoch": 2025} {"train_loss": -12.160820007324219, "global_step": 340271, "epoch": 2025} {"train_loss": -12.288949966430664, "global_step": 340272, "epoch": 2025} {"train_loss": -12.157302856445312, "global_step": 340273, "epoch": 2025} {"train_loss": -12.021207809448242, "global_step": 340274, "epoch": 2025} {"train_loss": -12.29488754272461, "global_step": 340275, "epoch": 2025} {"train_loss": -12.224882125854492, "global_step": 340276, "epoch": 2025} {"train_loss": -12.28175163269043, "global_step": 340277, "epoch": 2025} {"train_loss": -12.462606430053711, "global_step": 340278, "epoch": 2025} {"train_loss": -12.080286026000977, "global_step": 340279, "epoch": 2025} {"train_loss": -12.394559860229492, "global_step": 340280, "epoch": 2025} {"train_loss": -12.405258178710938, "global_step": 340281, "epoch": 2025} {"train_loss": -12.251107215881348, "global_step": 340282, "epoch": 2025} {"train_loss": -12.428264617919922, "global_step": 340283, "epoch": 2025} {"train_loss": -12.418157577514648, "global_step": 340284, "epoch": 2025} {"train_loss": -12.251968383789062, "global_step": 340285, "epoch": 2025} {"train_loss": -12.533918380737305, "global_step": 340286, "epoch": 2025} {"train_loss": -12.309354782104492, "global_step": 340287, "epoch": 2025} {"train_loss": -12.366931915283203, "global_step": 340288, "epoch": 2025} {"train_loss": -12.559103012084961, "global_step": 340289, "epoch": 2025} {"train_loss": -12.050907135009766, "global_step": 340290, "epoch": 2025} {"train_loss": -12.397051811218262, "global_step": 340291, "epoch": 2025} {"train_loss": -12.414482116699219, "global_step": 340292, "epoch": 2025} {"train_loss": -12.394230842590332, "global_step": 340293, "epoch": 2025} {"train_loss": -12.45827865600586, "global_step": 340294, "epoch": 2025} {"train_loss": -12.435674667358398, "global_step": 340295, "epoch": 2025} {"train_loss": -12.557198524475098, "global_step": 340296, "epoch": 2025} {"train_loss": -12.24323844909668, "global_step": 340297, "epoch": 2025} {"train_loss": -12.423338890075684, "global_step": 340298, "epoch": 2025} {"train_loss": -12.256694793701172, "global_step": 340299, "epoch": 2025} {"train_loss": -12.39579963684082, "global_step": 340300, "epoch": 2025} {"train_loss": -12.460678100585938, "global_step": 340301, "epoch": 2025} {"train_loss": -12.233771324157715, "global_step": 340302, "epoch": 2025} {"train_loss": -12.406464576721191, "global_step": 340303, "epoch": 2025} {"train_loss": -12.216771125793457, "global_step": 340304, "epoch": 2025} {"train_loss": -12.431475639343262, "global_step": 340305, "epoch": 2025} {"train_loss": -12.292455673217773, "global_step": 340306, "epoch": 2025} {"train_loss": -12.276348114013672, "global_step": 340307, "epoch": 2025} {"train_loss": -12.226360321044922, "global_step": 340308, "epoch": 2025} {"train_loss": -12.396718978881836, "global_step": 340309, "epoch": 2025} {"train_loss": -12.365738868713379, "global_step": 340310, "epoch": 2025} {"train_loss": -12.324532508850098, "global_step": 340311, "epoch": 2025} {"train_loss": -12.306262969970703, "global_step": 340312, "epoch": 2025} {"train_loss": -12.175004959106445, "global_step": 340313, "epoch": 2025} {"train_loss": -12.665027618408203, "global_step": 340314, "epoch": 2025} {"train_loss": -12.408159255981445, "global_step": 340315, "epoch": 2025} {"train_loss": -12.625350952148438, "global_step": 340316, "epoch": 2025} {"train_loss": -12.431865692138672, "global_step": 340317, "epoch": 2025} {"train_loss": -12.64381217956543, "global_step": 340318, "epoch": 2025} {"train_loss": -12.413496971130371, "global_step": 340319, "epoch": 2025} {"train_loss": -12.579912185668945, "global_step": 340320, "epoch": 2025} {"train_loss": -12.774076461791992, "global_step": 340321, "epoch": 2025} {"train_loss": -12.829641342163086, "global_step": 340322, "epoch": 2025} {"train_loss": -12.761070251464844, "global_step": 340323, "epoch": 2025} {"train_loss": -12.511648178100586, "global_step": 340324, "epoch": 2025} {"train_loss": -12.719862937927246, "global_step": 340325, "epoch": 2025} {"train_loss": -12.641412734985352, "global_step": 340326, "epoch": 2025} {"train_loss": -12.699102401733398, "global_step": 340327, "epoch": 2025} {"train_loss": -12.605716705322266, "global_step": 340328, "epoch": 2025} {"train_loss": -12.687965393066406, "global_step": 340329, "epoch": 2025} {"train_loss": -12.607584953308105, "global_step": 340330, "epoch": 2025} {"train_loss": -12.318302154541016, "global_step": 340331, "epoch": 2025} {"train_loss": -12.416476249694824, "global_step": 340332, "epoch": 2025} {"train_loss": -12.449861526489258, "global_step": 340333, "epoch": 2025} {"train_loss": -12.650550842285156, "global_step": 340334, "epoch": 2025} {"train_loss": -12.800973892211914, "global_step": 340335, "epoch": 2025} {"train_loss": -12.355228424072266, "global_step": 340336, "epoch": 2025} {"train_loss": -11.963274002075195, "global_step": 340337, "epoch": 2025} {"train_loss": -11.20556640625, "global_step": 340338, "epoch": 2025} {"train_loss": -12.014305114746094, "global_step": 340339, "epoch": 2025} {"train_loss": -12.102127075195312, "global_step": 340340, "epoch": 2025} {"train_loss": -11.529397964477539, "global_step": 340341, "epoch": 2025} {"train_loss": -10.93799877166748, "global_step": 340342, "epoch": 2025} {"train_loss": -9.83993911743164, "global_step": 340343, "epoch": 2025} {"train_loss": -11.383594512939453, "global_step": 340344, "epoch": 2025} {"train_loss": -8.922239303588867, "global_step": 340345, "epoch": 2025} {"train_loss": -9.224578857421875, "global_step": 340346, "epoch": 2025} {"train_loss": -10.732246398925781, "global_step": 340347, "epoch": 2025} {"train_loss": -10.168486595153809, "global_step": 340348, "epoch": 2025} {"train_loss": -8.274711608886719, "global_step": 340349, "epoch": 2025} {"train_loss": -9.524138450622559, "global_step": 340350, "epoch": 2025} {"train_loss": -10.736906051635742, "global_step": 340351, "epoch": 2025} {"train_loss": -9.231390953063965, "global_step": 340352, "epoch": 2025} {"train_loss": -10.377020835876465, "global_step": 340353, "epoch": 2025} {"train_loss": -10.609853744506836, "global_step": 340354, "epoch": 2025} {"train_loss": -9.123971939086914, "global_step": 340355, "epoch": 2025} {"train_loss": -11.185209274291992, "global_step": 340356, "epoch": 2025} {"train_loss": -11.496152877807617, "global_step": 340357, "epoch": 2025} {"train_loss": -10.749734878540039, "global_step": 340358, "epoch": 2025} {"train_loss": -10.33519172668457, "global_step": 340359, "epoch": 2025} {"train_loss": -9.116836547851562, "global_step": 340360, "epoch": 2025} {"train_loss": -11.390728950500488, "global_step": 340361, "epoch": 2025} {"train_loss": -11.24658203125, "global_step": 340362, "epoch": 2025} {"train_loss": -10.48297119140625, "global_step": 340363, "epoch": 2025} {"train_loss": -10.834844589233398, "global_step": 340364, "epoch": 2025} {"train_loss": -10.228315353393555, "global_step": 340365, "epoch": 2025} {"train_loss": -10.489110946655273, "global_step": 340366, "epoch": 2025} {"train_loss": -11.7268439133962, "global_step": 340367, "epoch": 2025, "val_loss": 279303.6875, "train_action_mse_error": 1.8616490364074707} {"train_loss": -11.446828842163086, "global_step": 340368, "epoch": 2026} {"train_loss": -11.11961555480957, "global_step": 340369, "epoch": 2026} {"train_loss": -11.885424613952637, "global_step": 340370, "epoch": 2026} {"train_loss": -10.22611141204834, "global_step": 340371, "epoch": 2026} {"train_loss": -11.172319412231445, "global_step": 340372, "epoch": 2026} {"train_loss": -11.300912857055664, "global_step": 340373, "epoch": 2026} {"train_loss": -10.26828670501709, "global_step": 340374, "epoch": 2026} {"train_loss": -11.812393188476562, "global_step": 340375, "epoch": 2026} {"train_loss": -11.159965515136719, "global_step": 340376, "epoch": 2026} {"train_loss": -11.562871932983398, "global_step": 340377, "epoch": 2026} {"train_loss": -11.54198169708252, "global_step": 340378, "epoch": 2026} {"train_loss": -11.891555786132812, "global_step": 340379, "epoch": 2026} {"train_loss": -11.404816627502441, "global_step": 340380, "epoch": 2026} {"train_loss": -12.087044715881348, "global_step": 340381, "epoch": 2026} {"train_loss": -11.645956993103027, "global_step": 340382, "epoch": 2026} {"train_loss": -11.736078262329102, "global_step": 340383, "epoch": 2026} {"train_loss": -11.926568031311035, "global_step": 340384, "epoch": 2026} {"train_loss": -11.576200485229492, "global_step": 340385, "epoch": 2026} {"train_loss": -12.018156051635742, "global_step": 340386, "epoch": 2026} {"train_loss": -12.075643539428711, "global_step": 340387, "epoch": 2026} {"train_loss": -11.844034194946289, "global_step": 340388, "epoch": 2026} {"train_loss": -12.15571403503418, "global_step": 340389, "epoch": 2026} {"train_loss": -11.985783576965332, "global_step": 340390, "epoch": 2026} {"train_loss": -11.898990631103516, "global_step": 340391, "epoch": 2026} {"train_loss": -12.237258911132812, "global_step": 340392, "epoch": 2026} {"train_loss": -12.105224609375, "global_step": 340393, "epoch": 2026} {"train_loss": -11.816913604736328, "global_step": 340394, "epoch": 2026} {"train_loss": -12.196538925170898, "global_step": 340395, "epoch": 2026} {"train_loss": -11.984678268432617, "global_step": 340396, "epoch": 2026} {"train_loss": -12.09615707397461, "global_step": 340397, "epoch": 2026} {"train_loss": -12.043912887573242, "global_step": 340398, "epoch": 2026} {"train_loss": -12.08875846862793, "global_step": 340399, "epoch": 2026} {"train_loss": -12.302997589111328, "global_step": 340400, "epoch": 2026} {"train_loss": -12.227209091186523, "global_step": 340401, "epoch": 2026} {"train_loss": -12.1500883102417, "global_step": 340402, "epoch": 2026} {"train_loss": -11.947463989257812, "global_step": 340403, "epoch": 2026} {"train_loss": -12.120604515075684, "global_step": 340404, "epoch": 2026} {"train_loss": -12.363245010375977, "global_step": 340405, "epoch": 2026} {"train_loss": -12.096916198730469, "global_step": 340406, "epoch": 2026} {"train_loss": -12.340950012207031, "global_step": 340407, "epoch": 2026} {"train_loss": -12.426315307617188, "global_step": 340408, "epoch": 2026} {"train_loss": -12.322504043579102, "global_step": 340409, "epoch": 2026} {"train_loss": -12.100085258483887, "global_step": 340410, "epoch": 2026} {"train_loss": -12.431035995483398, "global_step": 340411, "epoch": 2026} {"train_loss": -12.328725814819336, "global_step": 340412, "epoch": 2026} {"train_loss": -12.297130584716797, "global_step": 340413, "epoch": 2026} {"train_loss": -12.34909439086914, "global_step": 340414, "epoch": 2026} {"train_loss": -12.293828010559082, "global_step": 340415, "epoch": 2026} {"train_loss": -12.49343204498291, "global_step": 340416, "epoch": 2026} {"train_loss": -12.173932075500488, "global_step": 340417, "epoch": 2026} {"train_loss": -12.509798049926758, "global_step": 340418, "epoch": 2026} {"train_loss": -12.29819393157959, "global_step": 340419, "epoch": 2026} {"train_loss": -12.430368423461914, "global_step": 340420, "epoch": 2026} {"train_loss": -12.32740592956543, "global_step": 340421, "epoch": 2026} {"train_loss": -12.423582077026367, "global_step": 340422, "epoch": 2026} {"train_loss": -12.422792434692383, "global_step": 340423, "epoch": 2026} {"train_loss": -12.533610343933105, "global_step": 340424, "epoch": 2026} {"train_loss": -12.125832557678223, "global_step": 340425, "epoch": 2026} {"train_loss": -12.039546012878418, "global_step": 340426, "epoch": 2026} {"train_loss": -12.47746753692627, "global_step": 340427, "epoch": 2026} {"train_loss": -12.344722747802734, "global_step": 340428, "epoch": 2026} {"train_loss": -12.202007293701172, "global_step": 340429, "epoch": 2026} {"train_loss": -12.430543899536133, "global_step": 340430, "epoch": 2026} {"train_loss": -12.669841766357422, "global_step": 340431, "epoch": 2026} {"train_loss": -12.545724868774414, "global_step": 340432, "epoch": 2026} {"train_loss": -12.523908615112305, "global_step": 340433, "epoch": 2026} {"train_loss": -12.371955871582031, "global_step": 340434, "epoch": 2026} {"train_loss": -12.21493148803711, "global_step": 340435, "epoch": 2026} {"train_loss": -12.245654106140137, "global_step": 340436, "epoch": 2026} {"train_loss": -12.403491973876953, "global_step": 340437, "epoch": 2026} {"train_loss": -12.565237998962402, "global_step": 340438, "epoch": 2026} {"train_loss": -12.543535232543945, "global_step": 340439, "epoch": 2026} {"train_loss": -12.738276481628418, "global_step": 340440, "epoch": 2026} {"train_loss": -12.538166046142578, "global_step": 340441, "epoch": 2026} {"train_loss": -12.387889862060547, "global_step": 340442, "epoch": 2026} {"train_loss": -12.546183586120605, "global_step": 340443, "epoch": 2026} {"train_loss": -12.499478340148926, "global_step": 340444, "epoch": 2026} {"train_loss": -12.580753326416016, "global_step": 340445, "epoch": 2026} {"train_loss": -12.61574649810791, "global_step": 340446, "epoch": 2026} {"train_loss": -12.07093334197998, "global_step": 340447, "epoch": 2026} {"train_loss": -12.632055282592773, "global_step": 340448, "epoch": 2026} {"train_loss": -12.598945617675781, "global_step": 340449, "epoch": 2026} {"train_loss": -12.631986618041992, "global_step": 340450, "epoch": 2026} {"train_loss": -12.68944263458252, "global_step": 340451, "epoch": 2026} {"train_loss": -12.566606521606445, "global_step": 340452, "epoch": 2026} {"train_loss": -12.623100280761719, "global_step": 340453, "epoch": 2026} {"train_loss": -12.667708396911621, "global_step": 340454, "epoch": 2026} {"train_loss": -12.438396453857422, "global_step": 340455, "epoch": 2026} {"train_loss": -12.64957046508789, "global_step": 340456, "epoch": 2026} {"train_loss": -12.214567184448242, "global_step": 340457, "epoch": 2026} {"train_loss": -12.16855239868164, "global_step": 340458, "epoch": 2026} {"train_loss": -12.575968742370605, "global_step": 340459, "epoch": 2026} {"train_loss": -12.56417465209961, "global_step": 340460, "epoch": 2026} {"train_loss": -12.408809661865234, "global_step": 340461, "epoch": 2026} {"train_loss": -12.306571006774902, "global_step": 340462, "epoch": 2026} {"train_loss": -12.263263702392578, "global_step": 340463, "epoch": 2026} {"train_loss": -12.499731063842773, "global_step": 340464, "epoch": 2026} {"train_loss": -12.593950271606445, "global_step": 340465, "epoch": 2026} {"train_loss": -12.649717330932617, "global_step": 340466, "epoch": 2026} {"train_loss": -12.538326263427734, "global_step": 340467, "epoch": 2026} {"train_loss": -12.214487075805664, "global_step": 340468, "epoch": 2026} {"train_loss": -12.113479614257812, "global_step": 340469, "epoch": 2026} {"train_loss": -12.17727279663086, "global_step": 340470, "epoch": 2026} {"train_loss": -12.477010726928711, "global_step": 340471, "epoch": 2026} {"train_loss": -12.519855499267578, "global_step": 340472, "epoch": 2026} {"train_loss": -12.115470886230469, "global_step": 340473, "epoch": 2026} {"train_loss": -11.740985870361328, "global_step": 340474, "epoch": 2026} {"train_loss": -12.48564624786377, "global_step": 340475, "epoch": 2026} {"train_loss": -12.368768692016602, "global_step": 340476, "epoch": 2026} {"train_loss": -12.400036811828613, "global_step": 340477, "epoch": 2026} {"train_loss": -12.13547134399414, "global_step": 340478, "epoch": 2026} {"train_loss": -11.3652925491333, "global_step": 340479, "epoch": 2026} {"train_loss": -11.17016315460205, "global_step": 340480, "epoch": 2026} {"train_loss": -11.301218032836914, "global_step": 340481, "epoch": 2026} {"train_loss": -11.964505195617676, "global_step": 340482, "epoch": 2026} {"train_loss": -12.018292427062988, "global_step": 340483, "epoch": 2026} {"train_loss": -11.257209777832031, "global_step": 340484, "epoch": 2026} {"train_loss": -10.624876022338867, "global_step": 340485, "epoch": 2026} {"train_loss": -11.058664321899414, "global_step": 340486, "epoch": 2026} {"train_loss": -12.426013946533203, "global_step": 340487, "epoch": 2026} {"train_loss": -5.196083068847656, "global_step": 340488, "epoch": 2026} {"train_loss": -10.987286567687988, "global_step": 340489, "epoch": 2026} {"train_loss": -11.326621055603027, "global_step": 340490, "epoch": 2026} {"train_loss": -10.385985374450684, "global_step": 340491, "epoch": 2026} {"train_loss": -10.055547714233398, "global_step": 340492, "epoch": 2026} {"train_loss": -11.022815704345703, "global_step": 340493, "epoch": 2026} {"train_loss": -9.984451293945312, "global_step": 340494, "epoch": 2026} {"train_loss": -10.928942680358887, "global_step": 340495, "epoch": 2026} {"train_loss": -10.347309112548828, "global_step": 340496, "epoch": 2026} {"train_loss": -11.407791137695312, "global_step": 340497, "epoch": 2026} {"train_loss": -11.420714378356934, "global_step": 340498, "epoch": 2026} {"train_loss": -11.773491859436035, "global_step": 340499, "epoch": 2026} {"train_loss": -11.15908432006836, "global_step": 340500, "epoch": 2026} {"train_loss": -10.920919418334961, "global_step": 340501, "epoch": 2026} {"train_loss": -11.785110473632812, "global_step": 340502, "epoch": 2026} {"train_loss": -11.60313606262207, "global_step": 340503, "epoch": 2026} {"train_loss": -11.470855712890625, "global_step": 340504, "epoch": 2026} {"train_loss": -11.27828598022461, "global_step": 340505, "epoch": 2026} {"train_loss": -11.750687599182129, "global_step": 340506, "epoch": 2026} {"train_loss": -11.299348831176758, "global_step": 340507, "epoch": 2026} {"train_loss": -11.27515983581543, "global_step": 340508, "epoch": 2026} {"train_loss": -12.022209167480469, "global_step": 340509, "epoch": 2026} {"train_loss": -11.450424194335938, "global_step": 340510, "epoch": 2026} {"train_loss": -12.122262954711914, "global_step": 340511, "epoch": 2026} {"train_loss": -11.319314002990723, "global_step": 340512, "epoch": 2026} {"train_loss": -11.216039657592773, "global_step": 340513, "epoch": 2026} {"train_loss": -11.66572093963623, "global_step": 340514, "epoch": 2026} {"train_loss": -11.58947467803955, "global_step": 340515, "epoch": 2026} {"train_loss": -11.695209503173828, "global_step": 340516, "epoch": 2026} {"train_loss": -11.302241325378418, "global_step": 340517, "epoch": 2026} {"train_loss": -11.944961547851562, "global_step": 340518, "epoch": 2026} {"train_loss": -11.492317199707031, "global_step": 340519, "epoch": 2026} {"train_loss": -11.818109512329102, "global_step": 340520, "epoch": 2026} {"train_loss": -11.712146759033203, "global_step": 340521, "epoch": 2026} {"train_loss": -12.009462356567383, "global_step": 340522, "epoch": 2026} {"train_loss": -11.69578742980957, "global_step": 340523, "epoch": 2026} {"train_loss": -11.870025634765625, "global_step": 340524, "epoch": 2026} {"train_loss": -11.914348602294922, "global_step": 340525, "epoch": 2026} {"train_loss": -12.181978225708008, "global_step": 340526, "epoch": 2026} {"train_loss": -11.659505844116211, "global_step": 340527, "epoch": 2026} {"train_loss": -11.95089340209961, "global_step": 340528, "epoch": 2026} {"train_loss": -12.094083786010742, "global_step": 340529, "epoch": 2026} {"train_loss": -11.816343307495117, "global_step": 340530, "epoch": 2026} {"train_loss": -12.305953979492188, "global_step": 340531, "epoch": 2026} {"train_loss": -12.033023834228516, "global_step": 340532, "epoch": 2026} {"train_loss": -11.989875793457031, "global_step": 340533, "epoch": 2026} {"train_loss": -11.565773010253906, "global_step": 340534, "epoch": 2026} {"train_loss": -11.915449290048509, "global_step": 340535, "epoch": 2026, "val_loss": 282483.71875} {"train_loss": -11.443020820617676, "global_step": 340536, "epoch": 2027} {"train_loss": -12.00834846496582, "global_step": 340537, "epoch": 2027} {"train_loss": -11.976823806762695, "global_step": 340538, "epoch": 2027} {"train_loss": -11.850746154785156, "global_step": 340539, "epoch": 2027} {"train_loss": -11.827985763549805, "global_step": 340540, "epoch": 2027} {"train_loss": -11.845022201538086, "global_step": 340541, "epoch": 2027} {"train_loss": -11.847087860107422, "global_step": 340542, "epoch": 2027} {"train_loss": -12.081767082214355, "global_step": 340543, "epoch": 2027} {"train_loss": -12.124282836914062, "global_step": 340544, "epoch": 2027} {"train_loss": -11.651481628417969, "global_step": 340545, "epoch": 2027} {"train_loss": -11.908605575561523, "global_step": 340546, "epoch": 2027} {"train_loss": -12.032642364501953, "global_step": 340547, "epoch": 2027} {"train_loss": -11.997659683227539, "global_step": 340548, "epoch": 2027} {"train_loss": -12.098804473876953, "global_step": 340549, "epoch": 2027} {"train_loss": -12.08696174621582, "global_step": 340550, "epoch": 2027} {"train_loss": -12.210763931274414, "global_step": 340551, "epoch": 2027} {"train_loss": -12.064412117004395, "global_step": 340552, "epoch": 2027} {"train_loss": -12.169918060302734, "global_step": 340553, "epoch": 2027} {"train_loss": -12.100269317626953, "global_step": 340554, "epoch": 2027} {"train_loss": -12.188281059265137, "global_step": 340555, "epoch": 2027} {"train_loss": -12.289217948913574, "global_step": 340556, "epoch": 2027} {"train_loss": -12.21734619140625, "global_step": 340557, "epoch": 2027} {"train_loss": -12.212984085083008, "global_step": 340558, "epoch": 2027} {"train_loss": -11.95589828491211, "global_step": 340559, "epoch": 2027} {"train_loss": -12.053228378295898, "global_step": 340560, "epoch": 2027} {"train_loss": -12.229053497314453, "global_step": 340561, "epoch": 2027} {"train_loss": -11.933149337768555, "global_step": 340562, "epoch": 2027} {"train_loss": -12.047491073608398, "global_step": 340563, "epoch": 2027} {"train_loss": -12.29979133605957, "global_step": 340564, "epoch": 2027} {"train_loss": -11.928669929504395, "global_step": 340565, "epoch": 2027} {"train_loss": -11.953384399414062, "global_step": 340566, "epoch": 2027} {"train_loss": -11.794257164001465, "global_step": 340567, "epoch": 2027} {"train_loss": -12.07051944732666, "global_step": 340568, "epoch": 2027} {"train_loss": -12.107213973999023, "global_step": 340569, "epoch": 2027} {"train_loss": -12.162528991699219, "global_step": 340570, "epoch": 2027} {"train_loss": -12.103826522827148, "global_step": 340571, "epoch": 2027} {"train_loss": -12.267045974731445, "global_step": 340572, "epoch": 2027} {"train_loss": -12.173458099365234, "global_step": 340573, "epoch": 2027} {"train_loss": -12.128551483154297, "global_step": 340574, "epoch": 2027} {"train_loss": -12.030092239379883, "global_step": 340575, "epoch": 2027} {"train_loss": -12.083749771118164, "global_step": 340576, "epoch": 2027} {"train_loss": -11.90407943725586, "global_step": 340577, "epoch": 2027} {"train_loss": -11.601890563964844, "global_step": 340578, "epoch": 2027} {"train_loss": -12.277170181274414, "global_step": 340579, "epoch": 2027} {"train_loss": -11.914873123168945, "global_step": 340580, "epoch": 2027} {"train_loss": -11.428817749023438, "global_step": 340581, "epoch": 2027} {"train_loss": -11.886453628540039, "global_step": 340582, "epoch": 2027} {"train_loss": -11.575681686401367, "global_step": 340583, "epoch": 2027} {"train_loss": -11.391653060913086, "global_step": 340584, "epoch": 2027} {"train_loss": -11.667781829833984, "global_step": 340585, "epoch": 2027} {"train_loss": -11.842992782592773, "global_step": 340586, "epoch": 2027} {"train_loss": -10.8828125, "global_step": 340587, "epoch": 2027} {"train_loss": -11.947563171386719, "global_step": 340588, "epoch": 2027} {"train_loss": -10.900312423706055, "global_step": 340589, "epoch": 2027} {"train_loss": -11.556883811950684, "global_step": 340590, "epoch": 2027} {"train_loss": -11.276548385620117, "global_step": 340591, "epoch": 2027} {"train_loss": -11.756296157836914, "global_step": 340592, "epoch": 2027} {"train_loss": -11.534578323364258, "global_step": 340593, "epoch": 2027} {"train_loss": -12.225568771362305, "global_step": 340594, "epoch": 2027} {"train_loss": -12.072625160217285, "global_step": 340595, "epoch": 2027} {"train_loss": -12.105314254760742, "global_step": 340596, "epoch": 2027} {"train_loss": -12.328962326049805, "global_step": 340597, "epoch": 2027} {"train_loss": -12.157541275024414, "global_step": 340598, "epoch": 2027} {"train_loss": -12.090473175048828, "global_step": 340599, "epoch": 2027} {"train_loss": -12.359564781188965, "global_step": 340600, "epoch": 2027} {"train_loss": -11.912725448608398, "global_step": 340601, "epoch": 2027} {"train_loss": -11.853257179260254, "global_step": 340602, "epoch": 2027} {"train_loss": -12.017281532287598, "global_step": 340603, "epoch": 2027} {"train_loss": -11.881355285644531, "global_step": 340604, "epoch": 2027} {"train_loss": -11.678138732910156, "global_step": 340605, "epoch": 2027} {"train_loss": -12.17080020904541, "global_step": 340606, "epoch": 2027} {"train_loss": -11.340107917785645, "global_step": 340607, "epoch": 2027} {"train_loss": -12.229000091552734, "global_step": 340608, "epoch": 2027} {"train_loss": -12.092119216918945, "global_step": 340609, "epoch": 2027} {"train_loss": -11.863639831542969, "global_step": 340610, "epoch": 2027} {"train_loss": -12.130603790283203, "global_step": 340611, "epoch": 2027} {"train_loss": -11.921998977661133, "global_step": 340612, "epoch": 2027} {"train_loss": -11.947468757629395, "global_step": 340613, "epoch": 2027} {"train_loss": -12.035442352294922, "global_step": 340614, "epoch": 2027} {"train_loss": -11.589727401733398, "global_step": 340615, "epoch": 2027} {"train_loss": -11.542139053344727, "global_step": 340616, "epoch": 2027} {"train_loss": -11.948676109313965, "global_step": 340617, "epoch": 2027} {"train_loss": -10.757387161254883, "global_step": 340618, "epoch": 2027} {"train_loss": -11.415630340576172, "global_step": 340619, "epoch": 2027} {"train_loss": -11.1849365234375, "global_step": 340620, "epoch": 2027} {"train_loss": -10.844734191894531, "global_step": 340621, "epoch": 2027} {"train_loss": -11.268830299377441, "global_step": 340622, "epoch": 2027} {"train_loss": -11.343530654907227, "global_step": 340623, "epoch": 2027} {"train_loss": -11.129083633422852, "global_step": 340624, "epoch": 2027} {"train_loss": -11.009899139404297, "global_step": 340625, "epoch": 2027} {"train_loss": -10.58174991607666, "global_step": 340626, "epoch": 2027} {"train_loss": -11.042922973632812, "global_step": 340627, "epoch": 2027} {"train_loss": -9.164690017700195, "global_step": 340628, "epoch": 2027} {"train_loss": -10.254621505737305, "global_step": 340629, "epoch": 2027} {"train_loss": -10.49622917175293, "global_step": 340630, "epoch": 2027} {"train_loss": -9.772607803344727, "global_step": 340631, "epoch": 2027} {"train_loss": -9.971332550048828, "global_step": 340632, "epoch": 2027} {"train_loss": -10.34299087524414, "global_step": 340633, "epoch": 2027} {"train_loss": -10.190115928649902, "global_step": 340634, "epoch": 2027} {"train_loss": -10.949960708618164, "global_step": 340635, "epoch": 2027} {"train_loss": -10.605939865112305, "global_step": 340636, "epoch": 2027} {"train_loss": -10.914295196533203, "global_step": 340637, "epoch": 2027} {"train_loss": -10.515595436096191, "global_step": 340638, "epoch": 2027} {"train_loss": -10.854470252990723, "global_step": 340639, "epoch": 2027} {"train_loss": -11.463200569152832, "global_step": 340640, "epoch": 2027} {"train_loss": -11.04448127746582, "global_step": 340641, "epoch": 2027} {"train_loss": -10.578596115112305, "global_step": 340642, "epoch": 2027} {"train_loss": -11.690557479858398, "global_step": 340643, "epoch": 2027} {"train_loss": -11.000581741333008, "global_step": 340644, "epoch": 2027} {"train_loss": -10.827925682067871, "global_step": 340645, "epoch": 2027} {"train_loss": -11.592653274536133, "global_step": 340646, "epoch": 2027} {"train_loss": -10.361482620239258, "global_step": 340647, "epoch": 2027} {"train_loss": -10.938026428222656, "global_step": 340648, "epoch": 2027} {"train_loss": -10.81715202331543, "global_step": 340649, "epoch": 2027} {"train_loss": -10.418501853942871, "global_step": 340650, "epoch": 2027} {"train_loss": -11.576444625854492, "global_step": 340651, "epoch": 2027} {"train_loss": -11.880940437316895, "global_step": 340652, "epoch": 2027} {"train_loss": -11.233112335205078, "global_step": 340653, "epoch": 2027} {"train_loss": -11.936138153076172, "global_step": 340654, "epoch": 2027} {"train_loss": -11.83426284790039, "global_step": 340655, "epoch": 2027} {"train_loss": -11.642045974731445, "global_step": 340656, "epoch": 2027} {"train_loss": -12.002413749694824, "global_step": 340657, "epoch": 2027} {"train_loss": -11.84184455871582, "global_step": 340658, "epoch": 2027} {"train_loss": -11.548271179199219, "global_step": 340659, "epoch": 2027} {"train_loss": -12.183462142944336, "global_step": 340660, "epoch": 2027} {"train_loss": -11.390115737915039, "global_step": 340661, "epoch": 2027} {"train_loss": -11.681550979614258, "global_step": 340662, "epoch": 2027} {"train_loss": -12.088629722595215, "global_step": 340663, "epoch": 2027} {"train_loss": -11.682601928710938, "global_step": 340664, "epoch": 2027} {"train_loss": -11.784418106079102, "global_step": 340665, "epoch": 2027} {"train_loss": -12.043010711669922, "global_step": 340666, "epoch": 2027} {"train_loss": -11.788575172424316, "global_step": 340667, "epoch": 2027} {"train_loss": -12.029560089111328, "global_step": 340668, "epoch": 2027} {"train_loss": -12.083930015563965, "global_step": 340669, "epoch": 2027} {"train_loss": -11.982673645019531, "global_step": 340670, "epoch": 2027} {"train_loss": -11.980718612670898, "global_step": 340671, "epoch": 2027} {"train_loss": -11.749882698059082, "global_step": 340672, "epoch": 2027} {"train_loss": -12.107564926147461, "global_step": 340673, "epoch": 2027} {"train_loss": -12.364222526550293, "global_step": 340674, "epoch": 2027} {"train_loss": -11.946046829223633, "global_step": 340675, "epoch": 2027} {"train_loss": -12.152771949768066, "global_step": 340676, "epoch": 2027} {"train_loss": -11.916950225830078, "global_step": 340677, "epoch": 2027} {"train_loss": -12.036361694335938, "global_step": 340678, "epoch": 2027} {"train_loss": -12.2051420211792, "global_step": 340679, "epoch": 2027} {"train_loss": -12.023456573486328, "global_step": 340680, "epoch": 2027} {"train_loss": -12.193800926208496, "global_step": 340681, "epoch": 2027} {"train_loss": -12.326725959777832, "global_step": 340682, "epoch": 2027} {"train_loss": -12.078530311584473, "global_step": 340683, "epoch": 2027} {"train_loss": -12.37294864654541, "global_step": 340684, "epoch": 2027} {"train_loss": -12.109054565429688, "global_step": 340685, "epoch": 2027} {"train_loss": -12.11343765258789, "global_step": 340686, "epoch": 2027} {"train_loss": -12.474595069885254, "global_step": 340687, "epoch": 2027} {"train_loss": -12.393987655639648, "global_step": 340688, "epoch": 2027} {"train_loss": -12.424643516540527, "global_step": 340689, "epoch": 2027} {"train_loss": -12.282853126525879, "global_step": 340690, "epoch": 2027} {"train_loss": -12.265037536621094, "global_step": 340691, "epoch": 2027} {"train_loss": -12.367356300354004, "global_step": 340692, "epoch": 2027} {"train_loss": -12.120193481445312, "global_step": 340693, "epoch": 2027} {"train_loss": -12.460131645202637, "global_step": 340694, "epoch": 2027} {"train_loss": -12.23888874053955, "global_step": 340695, "epoch": 2027} {"train_loss": -12.46391773223877, "global_step": 340696, "epoch": 2027} {"train_loss": -12.084240913391113, "global_step": 340697, "epoch": 2027} {"train_loss": -12.121248245239258, "global_step": 340698, "epoch": 2027} {"train_loss": -12.031246185302734, "global_step": 340699, "epoch": 2027} {"train_loss": -12.57834243774414, "global_step": 340700, "epoch": 2027} {"train_loss": -12.470314979553223, "global_step": 340701, "epoch": 2027} {"train_loss": -12.569025039672852, "global_step": 340702, "epoch": 2027} {"train_loss": -11.747381437392463, "global_step": 340703, "epoch": 2027, "val_loss": 286344.9375} {"train_loss": -12.373215675354004, "global_step": 340704, "epoch": 2028} {"train_loss": -12.479166030883789, "global_step": 340705, "epoch": 2028} {"train_loss": -12.360788345336914, "global_step": 340706, "epoch": 2028} {"train_loss": -12.265402793884277, "global_step": 340707, "epoch": 2028} {"train_loss": -12.412444114685059, "global_step": 340708, "epoch": 2028} {"train_loss": -12.385774612426758, "global_step": 340709, "epoch": 2028} {"train_loss": -12.403697967529297, "global_step": 340710, "epoch": 2028} {"train_loss": -12.374002456665039, "global_step": 340711, "epoch": 2028} {"train_loss": -12.578336715698242, "global_step": 340712, "epoch": 2028} {"train_loss": -12.661643028259277, "global_step": 340713, "epoch": 2028} {"train_loss": -12.145362854003906, "global_step": 340714, "epoch": 2028} {"train_loss": -12.34752082824707, "global_step": 340715, "epoch": 2028} {"train_loss": -12.477090835571289, "global_step": 340716, "epoch": 2028} {"train_loss": -12.492874145507812, "global_step": 340717, "epoch": 2028} {"train_loss": -12.53809928894043, "global_step": 340718, "epoch": 2028} {"train_loss": -12.671609878540039, "global_step": 340719, "epoch": 2028} {"train_loss": -12.614755630493164, "global_step": 340720, "epoch": 2028} {"train_loss": -12.699590682983398, "global_step": 340721, "epoch": 2028} {"train_loss": -12.625879287719727, "global_step": 340722, "epoch": 2028} {"train_loss": -12.436983108520508, "global_step": 340723, "epoch": 2028} {"train_loss": -12.695805549621582, "global_step": 340724, "epoch": 2028} {"train_loss": -12.537941932678223, "global_step": 340725, "epoch": 2028} {"train_loss": -12.532681465148926, "global_step": 340726, "epoch": 2028} {"train_loss": -12.621929168701172, "global_step": 340727, "epoch": 2028} {"train_loss": -12.529533386230469, "global_step": 340728, "epoch": 2028} {"train_loss": -12.657888412475586, "global_step": 340729, "epoch": 2028} {"train_loss": -12.609090805053711, "global_step": 340730, "epoch": 2028} {"train_loss": -12.697076797485352, "global_step": 340731, "epoch": 2028} {"train_loss": -12.376672744750977, "global_step": 340732, "epoch": 2028} {"train_loss": -12.629162788391113, "global_step": 340733, "epoch": 2028} {"train_loss": -12.514455795288086, "global_step": 340734, "epoch": 2028} {"train_loss": -12.691649436950684, "global_step": 340735, "epoch": 2028} {"train_loss": -12.588947296142578, "global_step": 340736, "epoch": 2028} {"train_loss": -12.369556427001953, "global_step": 340737, "epoch": 2028} {"train_loss": -12.802558898925781, "global_step": 340738, "epoch": 2028} {"train_loss": -12.499320030212402, "global_step": 340739, "epoch": 2028} {"train_loss": -11.809316635131836, "global_step": 340740, "epoch": 2028} {"train_loss": -11.897684097290039, "global_step": 340741, "epoch": 2028} {"train_loss": -12.626899719238281, "global_step": 340742, "epoch": 2028} {"train_loss": -12.227910041809082, "global_step": 340743, "epoch": 2028} {"train_loss": -12.354045867919922, "global_step": 340744, "epoch": 2028} {"train_loss": -11.909004211425781, "global_step": 340745, "epoch": 2028} {"train_loss": -11.699454307556152, "global_step": 340746, "epoch": 2028} {"train_loss": -11.629823684692383, "global_step": 340747, "epoch": 2028} {"train_loss": -12.316742897033691, "global_step": 340748, "epoch": 2028} {"train_loss": -12.497945785522461, "global_step": 340749, "epoch": 2028} {"train_loss": -12.428742408752441, "global_step": 340750, "epoch": 2028} {"train_loss": -11.872337341308594, "global_step": 340751, "epoch": 2028} {"train_loss": -11.989727020263672, "global_step": 340752, "epoch": 2028} {"train_loss": -12.014741897583008, "global_step": 340753, "epoch": 2028} {"train_loss": -12.436203956604004, "global_step": 340754, "epoch": 2028} {"train_loss": -12.561105728149414, "global_step": 340755, "epoch": 2028} {"train_loss": -12.429311752319336, "global_step": 340756, "epoch": 2028} {"train_loss": -12.035916328430176, "global_step": 340757, "epoch": 2028} {"train_loss": -10.30828857421875, "global_step": 340758, "epoch": 2028} {"train_loss": -10.744670867919922, "global_step": 340759, "epoch": 2028} {"train_loss": -12.155898094177246, "global_step": 340760, "epoch": 2028} {"train_loss": -11.747347831726074, "global_step": 340761, "epoch": 2028} {"train_loss": -11.89411449432373, "global_step": 340762, "epoch": 2028} {"train_loss": -10.92155647277832, "global_step": 340763, "epoch": 2028} {"train_loss": -11.296002388000488, "global_step": 340764, "epoch": 2028} {"train_loss": -11.363426208496094, "global_step": 340765, "epoch": 2028} {"train_loss": -11.932373046875, "global_step": 340766, "epoch": 2028} {"train_loss": -10.55018138885498, "global_step": 340767, "epoch": 2028} {"train_loss": -11.119668006896973, "global_step": 340768, "epoch": 2028} {"train_loss": -11.857758522033691, "global_step": 340769, "epoch": 2028} {"train_loss": -11.025787353515625, "global_step": 340770, "epoch": 2028} {"train_loss": -11.552396774291992, "global_step": 340771, "epoch": 2028} {"train_loss": -11.297121047973633, "global_step": 340772, "epoch": 2028} {"train_loss": -12.426751136779785, "global_step": 340773, "epoch": 2028} {"train_loss": -11.300261497497559, "global_step": 340774, "epoch": 2028} {"train_loss": -11.910456657409668, "global_step": 340775, "epoch": 2028} {"train_loss": -11.46817398071289, "global_step": 340776, "epoch": 2028} {"train_loss": -10.477819442749023, "global_step": 340777, "epoch": 2028} {"train_loss": -11.765148162841797, "global_step": 340778, "epoch": 2028} {"train_loss": -10.984600067138672, "global_step": 340779, "epoch": 2028} {"train_loss": -9.231582641601562, "global_step": 340780, "epoch": 2028} {"train_loss": -10.17004680633545, "global_step": 340781, "epoch": 2028} {"train_loss": -10.068618774414062, "global_step": 340782, "epoch": 2028} {"train_loss": -11.616052627563477, "global_step": 340783, "epoch": 2028} {"train_loss": -10.883516311645508, "global_step": 340784, "epoch": 2028} {"train_loss": -10.770241737365723, "global_step": 340785, "epoch": 2028} {"train_loss": -10.726463317871094, "global_step": 340786, "epoch": 2028} {"train_loss": -9.526458740234375, "global_step": 340787, "epoch": 2028} {"train_loss": -11.336800575256348, "global_step": 340788, "epoch": 2028} {"train_loss": -9.517656326293945, "global_step": 340789, "epoch": 2028} {"train_loss": -10.686723709106445, "global_step": 340790, "epoch": 2028} {"train_loss": -9.830127716064453, "global_step": 340791, "epoch": 2028} {"train_loss": -11.034552574157715, "global_step": 340792, "epoch": 2028} {"train_loss": -10.283206939697266, "global_step": 340793, "epoch": 2028} {"train_loss": -11.184871673583984, "global_step": 340794, "epoch": 2028} {"train_loss": -10.567170143127441, "global_step": 340795, "epoch": 2028} {"train_loss": -10.922306060791016, "global_step": 340796, "epoch": 2028} {"train_loss": -10.949311256408691, "global_step": 340797, "epoch": 2028} {"train_loss": -11.4569673538208, "global_step": 340798, "epoch": 2028} {"train_loss": -10.961458206176758, "global_step": 340799, "epoch": 2028} {"train_loss": -11.360808372497559, "global_step": 340800, "epoch": 2028} {"train_loss": -11.571557998657227, "global_step": 340801, "epoch": 2028} {"train_loss": -11.28223991394043, "global_step": 340802, "epoch": 2028} {"train_loss": -11.117386817932129, "global_step": 340803, "epoch": 2028} {"train_loss": -11.335691452026367, "global_step": 340804, "epoch": 2028} {"train_loss": -11.677358627319336, "global_step": 340805, "epoch": 2028} {"train_loss": -11.351480484008789, "global_step": 340806, "epoch": 2028} {"train_loss": -11.754495620727539, "global_step": 340807, "epoch": 2028} {"train_loss": -11.33419418334961, "global_step": 340808, "epoch": 2028} {"train_loss": -11.642166137695312, "global_step": 340809, "epoch": 2028} {"train_loss": -11.513323783874512, "global_step": 340810, "epoch": 2028} {"train_loss": -11.459238052368164, "global_step": 340811, "epoch": 2028} {"train_loss": -11.145440101623535, "global_step": 340812, "epoch": 2028} {"train_loss": -11.63792610168457, "global_step": 340813, "epoch": 2028} {"train_loss": -11.38709831237793, "global_step": 340814, "epoch": 2028} {"train_loss": -11.818798065185547, "global_step": 340815, "epoch": 2028} {"train_loss": -11.530064582824707, "global_step": 340816, "epoch": 2028} {"train_loss": -11.806385040283203, "global_step": 340817, "epoch": 2028} {"train_loss": -11.861495971679688, "global_step": 340818, "epoch": 2028} {"train_loss": -11.911092758178711, "global_step": 340819, "epoch": 2028} {"train_loss": -11.829387664794922, "global_step": 340820, "epoch": 2028} {"train_loss": -11.778722763061523, "global_step": 340821, "epoch": 2028} {"train_loss": -11.877466201782227, "global_step": 340822, "epoch": 2028} {"train_loss": -11.718608856201172, "global_step": 340823, "epoch": 2028} {"train_loss": -12.12717342376709, "global_step": 340824, "epoch": 2028} {"train_loss": -11.821290016174316, "global_step": 340825, "epoch": 2028} {"train_loss": -11.918169021606445, "global_step": 340826, "epoch": 2028} {"train_loss": -12.21943473815918, "global_step": 340827, "epoch": 2028} {"train_loss": -12.090570449829102, "global_step": 340828, "epoch": 2028} {"train_loss": -11.856372833251953, "global_step": 340829, "epoch": 2028} {"train_loss": -12.006921768188477, "global_step": 340830, "epoch": 2028} {"train_loss": -11.786942481994629, "global_step": 340831, "epoch": 2028} {"train_loss": -12.122488021850586, "global_step": 340832, "epoch": 2028} {"train_loss": -12.027649879455566, "global_step": 340833, "epoch": 2028} {"train_loss": -12.067020416259766, "global_step": 340834, "epoch": 2028} {"train_loss": -12.109180450439453, "global_step": 340835, "epoch": 2028} {"train_loss": -12.207701683044434, "global_step": 340836, "epoch": 2028} {"train_loss": -12.325922966003418, "global_step": 340837, "epoch": 2028} {"train_loss": -12.133922576904297, "global_step": 340838, "epoch": 2028} {"train_loss": -12.505880355834961, "global_step": 340839, "epoch": 2028} {"train_loss": -12.461894989013672, "global_step": 340840, "epoch": 2028} {"train_loss": -12.310855865478516, "global_step": 340841, "epoch": 2028} {"train_loss": -12.267328262329102, "global_step": 340842, "epoch": 2028} {"train_loss": -12.163372993469238, "global_step": 340843, "epoch": 2028} {"train_loss": -12.44253158569336, "global_step": 340844, "epoch": 2028} {"train_loss": -12.327728271484375, "global_step": 340845, "epoch": 2028} {"train_loss": -11.859777450561523, "global_step": 340846, "epoch": 2028} {"train_loss": -12.328605651855469, "global_step": 340847, "epoch": 2028} {"train_loss": -12.290572166442871, "global_step": 340848, "epoch": 2028} {"train_loss": -12.421286582946777, "global_step": 340849, "epoch": 2028} {"train_loss": -12.565864562988281, "global_step": 340850, "epoch": 2028} {"train_loss": -12.561334609985352, "global_step": 340851, "epoch": 2028} {"train_loss": -12.46164321899414, "global_step": 340852, "epoch": 2028} {"train_loss": -12.35498046875, "global_step": 340853, "epoch": 2028} {"train_loss": -12.551011085510254, "global_step": 340854, "epoch": 2028} {"train_loss": -12.357555389404297, "global_step": 340855, "epoch": 2028} {"train_loss": -12.372894287109375, "global_step": 340856, "epoch": 2028} {"train_loss": -12.488147735595703, "global_step": 340857, "epoch": 2028} {"train_loss": -12.384530067443848, "global_step": 340858, "epoch": 2028} {"train_loss": -12.542288780212402, "global_step": 340859, "epoch": 2028} {"train_loss": -12.224323272705078, "global_step": 340860, "epoch": 2028} {"train_loss": -12.40283489227295, "global_step": 340861, "epoch": 2028} {"train_loss": -12.465368270874023, "global_step": 340862, "epoch": 2028} {"train_loss": -12.366905212402344, "global_step": 340863, "epoch": 2028} {"train_loss": -12.506117820739746, "global_step": 340864, "epoch": 2028} {"train_loss": -12.565834045410156, "global_step": 340865, "epoch": 2028} {"train_loss": -12.395587921142578, "global_step": 340866, "epoch": 2028} {"train_loss": -12.416460037231445, "global_step": 340867, "epoch": 2028} {"train_loss": -12.666942596435547, "global_step": 340868, "epoch": 2028} {"train_loss": -12.179027557373047, "global_step": 340869, "epoch": 2028} {"train_loss": -12.367670059204102, "global_step": 340870, "epoch": 2028} {"train_loss": -11.895156423250834, "global_step": 340871, "epoch": 2028, "val_loss": 286170.96875} {"train_loss": -12.293195724487305, "global_step": 340872, "epoch": 2029} {"train_loss": -12.667083740234375, "global_step": 340873, "epoch": 2029} {"train_loss": -12.743853569030762, "global_step": 340874, "epoch": 2029} {"train_loss": -12.69240951538086, "global_step": 340875, "epoch": 2029} {"train_loss": -12.577203750610352, "global_step": 340876, "epoch": 2029} {"train_loss": -12.608267784118652, "global_step": 340877, "epoch": 2029} {"train_loss": -12.78013801574707, "global_step": 340878, "epoch": 2029} {"train_loss": -12.725879669189453, "global_step": 340879, "epoch": 2029} {"train_loss": -12.58529281616211, "global_step": 340880, "epoch": 2029} {"train_loss": -12.62691879272461, "global_step": 340881, "epoch": 2029} {"train_loss": -12.090568542480469, "global_step": 340882, "epoch": 2029} {"train_loss": -12.512064933776855, "global_step": 340883, "epoch": 2029} {"train_loss": -12.382156372070312, "global_step": 340884, "epoch": 2029} {"train_loss": -12.325469970703125, "global_step": 340885, "epoch": 2029} {"train_loss": -12.456145286560059, "global_step": 340886, "epoch": 2029} {"train_loss": -12.437325477600098, "global_step": 340887, "epoch": 2029} {"train_loss": -12.201240539550781, "global_step": 340888, "epoch": 2029} {"train_loss": -12.567121505737305, "global_step": 340889, "epoch": 2029} {"train_loss": -11.825056076049805, "global_step": 340890, "epoch": 2029} {"train_loss": -11.68447494506836, "global_step": 340891, "epoch": 2029} {"train_loss": -11.206053733825684, "global_step": 340892, "epoch": 2029} {"train_loss": -11.890745162963867, "global_step": 340893, "epoch": 2029} {"train_loss": -11.943683624267578, "global_step": 340894, "epoch": 2029} {"train_loss": -10.851898193359375, "global_step": 340895, "epoch": 2029} {"train_loss": -11.766660690307617, "global_step": 340896, "epoch": 2029} {"train_loss": -11.417810440063477, "global_step": 340897, "epoch": 2029} {"train_loss": -10.10588550567627, "global_step": 340898, "epoch": 2029} {"train_loss": -11.360309600830078, "global_step": 340899, "epoch": 2029} {"train_loss": -10.479083061218262, "global_step": 340900, "epoch": 2029} {"train_loss": -8.425509452819824, "global_step": 340901, "epoch": 2029} {"train_loss": -11.627737045288086, "global_step": 340902, "epoch": 2029} {"train_loss": -9.976274490356445, "global_step": 340903, "epoch": 2029} {"train_loss": -11.0250244140625, "global_step": 340904, "epoch": 2029} {"train_loss": -11.550313949584961, "global_step": 340905, "epoch": 2029} {"train_loss": -10.076208114624023, "global_step": 340906, "epoch": 2029} {"train_loss": -11.808191299438477, "global_step": 340907, "epoch": 2029} {"train_loss": -10.471535682678223, "global_step": 340908, "epoch": 2029} {"train_loss": -9.718914031982422, "global_step": 340909, "epoch": 2029} {"train_loss": -10.668535232543945, "global_step": 340910, "epoch": 2029} {"train_loss": -8.752897262573242, "global_step": 340911, "epoch": 2029} {"train_loss": -11.44051456451416, "global_step": 340912, "epoch": 2029} {"train_loss": -8.682071685791016, "global_step": 340913, "epoch": 2029} {"train_loss": -9.408180236816406, "global_step": 340914, "epoch": 2029} {"train_loss": -9.440423965454102, "global_step": 340915, "epoch": 2029} {"train_loss": -11.240479469299316, "global_step": 340916, "epoch": 2029} {"train_loss": -10.045188903808594, "global_step": 340917, "epoch": 2029} {"train_loss": -10.694539070129395, "global_step": 340918, "epoch": 2029} {"train_loss": -11.731403350830078, "global_step": 340919, "epoch": 2029} {"train_loss": -10.073134422302246, "global_step": 340920, "epoch": 2029} {"train_loss": -11.757583618164062, "global_step": 340921, "epoch": 2029} {"train_loss": -10.90967082977295, "global_step": 340922, "epoch": 2029} {"train_loss": -10.718343734741211, "global_step": 340923, "epoch": 2029} {"train_loss": -11.339778900146484, "global_step": 340924, "epoch": 2029} {"train_loss": -11.279191017150879, "global_step": 340925, "epoch": 2029} {"train_loss": -10.833063125610352, "global_step": 340926, "epoch": 2029} {"train_loss": -11.604208946228027, "global_step": 340927, "epoch": 2029} {"train_loss": -10.96737289428711, "global_step": 340928, "epoch": 2029} {"train_loss": -11.431790351867676, "global_step": 340929, "epoch": 2029} {"train_loss": -11.58932113647461, "global_step": 340930, "epoch": 2029} {"train_loss": -11.403409004211426, "global_step": 340931, "epoch": 2029} {"train_loss": -11.678833961486816, "global_step": 340932, "epoch": 2029} {"train_loss": -11.169132232666016, "global_step": 340933, "epoch": 2029} {"train_loss": -11.600068092346191, "global_step": 340934, "epoch": 2029} {"train_loss": -11.598201751708984, "global_step": 340935, "epoch": 2029} {"train_loss": -10.97952938079834, "global_step": 340936, "epoch": 2029} {"train_loss": -11.696357727050781, "global_step": 340937, "epoch": 2029} {"train_loss": -11.721579551696777, "global_step": 340938, "epoch": 2029} {"train_loss": -11.39548110961914, "global_step": 340939, "epoch": 2029} {"train_loss": -11.338163375854492, "global_step": 340940, "epoch": 2029} {"train_loss": -11.57789134979248, "global_step": 340941, "epoch": 2029} {"train_loss": -10.696919441223145, "global_step": 340942, "epoch": 2029} {"train_loss": -11.661792755126953, "global_step": 340943, "epoch": 2029} {"train_loss": -11.248490333557129, "global_step": 340944, "epoch": 2029} {"train_loss": -12.07571029663086, "global_step": 340945, "epoch": 2029} {"train_loss": -11.295587539672852, "global_step": 340946, "epoch": 2029} {"train_loss": -11.759073257446289, "global_step": 340947, "epoch": 2029} {"train_loss": -11.282855987548828, "global_step": 340948, "epoch": 2029} {"train_loss": -11.625816345214844, "global_step": 340949, "epoch": 2029} {"train_loss": -11.493826866149902, "global_step": 340950, "epoch": 2029} {"train_loss": -11.571696281433105, "global_step": 340951, "epoch": 2029} {"train_loss": -10.900447845458984, "global_step": 340952, "epoch": 2029} {"train_loss": -11.878656387329102, "global_step": 340953, "epoch": 2029} {"train_loss": -11.301132202148438, "global_step": 340954, "epoch": 2029} {"train_loss": -12.048959732055664, "global_step": 340955, "epoch": 2029} {"train_loss": -11.637503623962402, "global_step": 340956, "epoch": 2029} {"train_loss": -11.214632987976074, "global_step": 340957, "epoch": 2029} {"train_loss": -12.045269966125488, "global_step": 340958, "epoch": 2029} {"train_loss": -11.384926795959473, "global_step": 340959, "epoch": 2029} {"train_loss": -11.40793228149414, "global_step": 340960, "epoch": 2029} {"train_loss": -11.972832679748535, "global_step": 340961, "epoch": 2029} {"train_loss": -11.41850471496582, "global_step": 340962, "epoch": 2029} {"train_loss": -12.007272720336914, "global_step": 340963, "epoch": 2029} {"train_loss": -11.93173599243164, "global_step": 340964, "epoch": 2029} {"train_loss": -11.723426818847656, "global_step": 340965, "epoch": 2029} {"train_loss": -11.440052032470703, "global_step": 340966, "epoch": 2029} {"train_loss": -11.401660919189453, "global_step": 340967, "epoch": 2029} {"train_loss": -11.502049446105957, "global_step": 340968, "epoch": 2029} {"train_loss": -11.477736473083496, "global_step": 340969, "epoch": 2029} {"train_loss": -11.250218391418457, "global_step": 340970, "epoch": 2029} {"train_loss": -11.545007705688477, "global_step": 340971, "epoch": 2029} {"train_loss": -11.879094123840332, "global_step": 340972, "epoch": 2029} {"train_loss": -11.227405548095703, "global_step": 340973, "epoch": 2029} {"train_loss": -12.054692268371582, "global_step": 340974, "epoch": 2029} {"train_loss": -11.868768692016602, "global_step": 340975, "epoch": 2029} {"train_loss": -11.901466369628906, "global_step": 340976, "epoch": 2029} {"train_loss": -11.594280242919922, "global_step": 340977, "epoch": 2029} {"train_loss": -11.555366516113281, "global_step": 340978, "epoch": 2029} {"train_loss": -11.798863410949707, "global_step": 340979, "epoch": 2029} {"train_loss": -11.677921295166016, "global_step": 340980, "epoch": 2029} {"train_loss": -11.788562774658203, "global_step": 340981, "epoch": 2029} {"train_loss": -11.672568321228027, "global_step": 340982, "epoch": 2029} {"train_loss": -11.570123672485352, "global_step": 340983, "epoch": 2029} {"train_loss": -11.941034317016602, "global_step": 340984, "epoch": 2029} {"train_loss": -11.77698040008545, "global_step": 340985, "epoch": 2029} {"train_loss": -11.890581130981445, "global_step": 340986, "epoch": 2029} {"train_loss": -12.081842422485352, "global_step": 340987, "epoch": 2029} {"train_loss": -11.856630325317383, "global_step": 340988, "epoch": 2029} {"train_loss": -12.176851272583008, "global_step": 340989, "epoch": 2029} {"train_loss": -12.132414817810059, "global_step": 340990, "epoch": 2029} {"train_loss": -12.15335464477539, "global_step": 340991, "epoch": 2029} {"train_loss": -11.906654357910156, "global_step": 340992, "epoch": 2029} {"train_loss": -11.730232238769531, "global_step": 340993, "epoch": 2029} {"train_loss": -11.945816993713379, "global_step": 340994, "epoch": 2029} {"train_loss": -12.103272438049316, "global_step": 340995, "epoch": 2029} {"train_loss": -12.350210189819336, "global_step": 340996, "epoch": 2029} {"train_loss": -12.100057601928711, "global_step": 340997, "epoch": 2029} {"train_loss": -12.278932571411133, "global_step": 340998, "epoch": 2029} {"train_loss": -12.259765625, "global_step": 340999, "epoch": 2029} {"train_loss": -12.200845718383789, "global_step": 341000, "epoch": 2029} {"train_loss": -12.211448669433594, "global_step": 341001, "epoch": 2029} {"train_loss": -12.07872200012207, "global_step": 341002, "epoch": 2029} {"train_loss": -12.1103515625, "global_step": 341003, "epoch": 2029} {"train_loss": -12.20068645477295, "global_step": 341004, "epoch": 2029} {"train_loss": -12.030060768127441, "global_step": 341005, "epoch": 2029} {"train_loss": -12.445036888122559, "global_step": 341006, "epoch": 2029} {"train_loss": -12.067227363586426, "global_step": 341007, "epoch": 2029} {"train_loss": -12.372909545898438, "global_step": 341008, "epoch": 2029} {"train_loss": -12.25450325012207, "global_step": 341009, "epoch": 2029} {"train_loss": -12.462651252746582, "global_step": 341010, "epoch": 2029} {"train_loss": -12.389730453491211, "global_step": 341011, "epoch": 2029} {"train_loss": -12.165003776550293, "global_step": 341012, "epoch": 2029} {"train_loss": -12.316689491271973, "global_step": 341013, "epoch": 2029} {"train_loss": -12.16792106628418, "global_step": 341014, "epoch": 2029} {"train_loss": -12.40188980102539, "global_step": 341015, "epoch": 2029} {"train_loss": -12.53276252746582, "global_step": 341016, "epoch": 2029} {"train_loss": -12.519538879394531, "global_step": 341017, "epoch": 2029} {"train_loss": -12.444480895996094, "global_step": 341018, "epoch": 2029} {"train_loss": -12.414261817932129, "global_step": 341019, "epoch": 2029} {"train_loss": -12.394451141357422, "global_step": 341020, "epoch": 2029} {"train_loss": -12.492951393127441, "global_step": 341021, "epoch": 2029} {"train_loss": -12.411430358886719, "global_step": 341022, "epoch": 2029} {"train_loss": -12.458526611328125, "global_step": 341023, "epoch": 2029} {"train_loss": -12.480907440185547, "global_step": 341024, "epoch": 2029} {"train_loss": -12.533452987670898, "global_step": 341025, "epoch": 2029} {"train_loss": -12.405685424804688, "global_step": 341026, "epoch": 2029} {"train_loss": -12.335334777832031, "global_step": 341027, "epoch": 2029} {"train_loss": -12.540116310119629, "global_step": 341028, "epoch": 2029} {"train_loss": -12.465317726135254, "global_step": 341029, "epoch": 2029} {"train_loss": -12.539819717407227, "global_step": 341030, "epoch": 2029} {"train_loss": -12.703242301940918, "global_step": 341031, "epoch": 2029} {"train_loss": -12.391780853271484, "global_step": 341032, "epoch": 2029} {"train_loss": -12.494820594787598, "global_step": 341033, "epoch": 2029} {"train_loss": -12.657022476196289, "global_step": 341034, "epoch": 2029} {"train_loss": -12.604076385498047, "global_step": 341035, "epoch": 2029} {"train_loss": -12.821525573730469, "global_step": 341036, "epoch": 2029} {"train_loss": -12.609903335571289, "global_step": 341037, "epoch": 2029} {"train_loss": -12.666814804077148, "global_step": 341038, "epoch": 2029} {"train_loss": -11.732729786918277, "global_step": 341039, "epoch": 2029, "val_loss": 286092.125} {"train_loss": -12.84849739074707, "global_step": 341040, "epoch": 2030} {"train_loss": -12.172554016113281, "global_step": 341041, "epoch": 2030} {"train_loss": -12.798728942871094, "global_step": 341042, "epoch": 2030} {"train_loss": -12.805940628051758, "global_step": 341043, "epoch": 2030} {"train_loss": -12.687566757202148, "global_step": 341044, "epoch": 2030} {"train_loss": -12.375991821289062, "global_step": 341045, "epoch": 2030} {"train_loss": -12.885808944702148, "global_step": 341046, "epoch": 2030} {"train_loss": -12.892728805541992, "global_step": 341047, "epoch": 2030} {"train_loss": -12.56678295135498, "global_step": 341048, "epoch": 2030} {"train_loss": -12.453767776489258, "global_step": 341049, "epoch": 2030} {"train_loss": -12.664426803588867, "global_step": 341050, "epoch": 2030} {"train_loss": -12.05235767364502, "global_step": 341051, "epoch": 2030} {"train_loss": -11.91470718383789, "global_step": 341052, "epoch": 2030} {"train_loss": -12.03713321685791, "global_step": 341053, "epoch": 2030} {"train_loss": -12.384552001953125, "global_step": 341054, "epoch": 2030} {"train_loss": -12.416999816894531, "global_step": 341055, "epoch": 2030} {"train_loss": -12.619319915771484, "global_step": 341056, "epoch": 2030} {"train_loss": -12.137763977050781, "global_step": 341057, "epoch": 2030} {"train_loss": -11.027040481567383, "global_step": 341058, "epoch": 2030} {"train_loss": -11.921525955200195, "global_step": 341059, "epoch": 2030} {"train_loss": -12.422298431396484, "global_step": 341060, "epoch": 2030} {"train_loss": -11.898151397705078, "global_step": 341061, "epoch": 2030} {"train_loss": -11.532398223876953, "global_step": 341062, "epoch": 2030} {"train_loss": -11.041888236999512, "global_step": 341063, "epoch": 2030} {"train_loss": -10.639360427856445, "global_step": 341064, "epoch": 2030} {"train_loss": -11.201936721801758, "global_step": 341065, "epoch": 2030} {"train_loss": -11.21931266784668, "global_step": 341066, "epoch": 2030} {"train_loss": -11.314895629882812, "global_step": 341067, "epoch": 2030} {"train_loss": -9.413068771362305, "global_step": 341068, "epoch": 2030} {"train_loss": -10.428323745727539, "global_step": 341069, "epoch": 2030} {"train_loss": -10.191524505615234, "global_step": 341070, "epoch": 2030} {"train_loss": -9.010091781616211, "global_step": 341071, "epoch": 2030} {"train_loss": -10.821638107299805, "global_step": 341072, "epoch": 2030} {"train_loss": -9.382902145385742, "global_step": 341073, "epoch": 2030} {"train_loss": -11.16794490814209, "global_step": 341074, "epoch": 2030} {"train_loss": -10.747576713562012, "global_step": 341075, "epoch": 2030} {"train_loss": -11.693985939025879, "global_step": 341076, "epoch": 2030} {"train_loss": -10.530468940734863, "global_step": 341077, "epoch": 2030} {"train_loss": -11.691929817199707, "global_step": 341078, "epoch": 2030} {"train_loss": -10.72137451171875, "global_step": 341079, "epoch": 2030} {"train_loss": -11.216827392578125, "global_step": 341080, "epoch": 2030} {"train_loss": -10.771869659423828, "global_step": 341081, "epoch": 2030} {"train_loss": -11.670026779174805, "global_step": 341082, "epoch": 2030} {"train_loss": -11.073593139648438, "global_step": 341083, "epoch": 2030} {"train_loss": -10.690136909484863, "global_step": 341084, "epoch": 2030} {"train_loss": -10.794189453125, "global_step": 341085, "epoch": 2030} {"train_loss": -11.226442337036133, "global_step": 341086, "epoch": 2030} {"train_loss": -11.307011604309082, "global_step": 341087, "epoch": 2030} {"train_loss": -10.260141372680664, "global_step": 341088, "epoch": 2030} {"train_loss": -9.816144943237305, "global_step": 341089, "epoch": 2030} {"train_loss": -11.491231918334961, "global_step": 341090, "epoch": 2030} {"train_loss": -9.991839408874512, "global_step": 341091, "epoch": 2030} {"train_loss": -11.799403190612793, "global_step": 341092, "epoch": 2030} {"train_loss": -10.414144515991211, "global_step": 341093, "epoch": 2030} {"train_loss": -11.524675369262695, "global_step": 341094, "epoch": 2030} {"train_loss": -11.11899471282959, "global_step": 341095, "epoch": 2030} {"train_loss": -11.756369590759277, "global_step": 341096, "epoch": 2030} {"train_loss": -11.033629417419434, "global_step": 341097, "epoch": 2030} {"train_loss": -11.48216438293457, "global_step": 341098, "epoch": 2030} {"train_loss": -11.532731056213379, "global_step": 341099, "epoch": 2030} {"train_loss": -11.643142700195312, "global_step": 341100, "epoch": 2030} {"train_loss": -11.849032402038574, "global_step": 341101, "epoch": 2030} {"train_loss": -11.614516258239746, "global_step": 341102, "epoch": 2030} {"train_loss": -11.819602966308594, "global_step": 341103, "epoch": 2030} {"train_loss": -11.86030387878418, "global_step": 341104, "epoch": 2030} {"train_loss": -11.92088794708252, "global_step": 341105, "epoch": 2030} {"train_loss": -12.164651870727539, "global_step": 341106, "epoch": 2030} {"train_loss": -11.794843673706055, "global_step": 341107, "epoch": 2030} {"train_loss": -12.166736602783203, "global_step": 341108, "epoch": 2030} {"train_loss": -12.206645965576172, "global_step": 341109, "epoch": 2030} {"train_loss": -11.935234069824219, "global_step": 341110, "epoch": 2030} {"train_loss": -12.11193561553955, "global_step": 341111, "epoch": 2030} {"train_loss": -12.199470520019531, "global_step": 341112, "epoch": 2030} {"train_loss": -11.84873104095459, "global_step": 341113, "epoch": 2030} {"train_loss": -12.161293983459473, "global_step": 341114, "epoch": 2030} {"train_loss": -11.851112365722656, "global_step": 341115, "epoch": 2030} {"train_loss": -12.210673332214355, "global_step": 341116, "epoch": 2030} {"train_loss": -12.2337646484375, "global_step": 341117, "epoch": 2030} {"train_loss": -12.191383361816406, "global_step": 341118, "epoch": 2030} {"train_loss": -12.366223335266113, "global_step": 341119, "epoch": 2030} {"train_loss": -12.195913314819336, "global_step": 341120, "epoch": 2030} {"train_loss": -12.380118370056152, "global_step": 341121, "epoch": 2030} {"train_loss": -11.976095199584961, "global_step": 341122, "epoch": 2030} {"train_loss": -12.474508285522461, "global_step": 341123, "epoch": 2030} {"train_loss": -12.124906539916992, "global_step": 341124, "epoch": 2030} {"train_loss": -12.302209854125977, "global_step": 341125, "epoch": 2030} {"train_loss": -12.489631652832031, "global_step": 341126, "epoch": 2030} {"train_loss": -12.337854385375977, "global_step": 341127, "epoch": 2030} {"train_loss": -12.306793212890625, "global_step": 341128, "epoch": 2030} {"train_loss": -12.570685386657715, "global_step": 341129, "epoch": 2030} {"train_loss": -12.088090896606445, "global_step": 341130, "epoch": 2030} {"train_loss": -12.413718223571777, "global_step": 341131, "epoch": 2030} {"train_loss": -12.123766899108887, "global_step": 341132, "epoch": 2030} {"train_loss": -12.204513549804688, "global_step": 341133, "epoch": 2030} {"train_loss": -12.359659194946289, "global_step": 341134, "epoch": 2030} {"train_loss": -12.382403373718262, "global_step": 341135, "epoch": 2030} {"train_loss": -12.35260009765625, "global_step": 341136, "epoch": 2030} {"train_loss": -12.341667175292969, "global_step": 341137, "epoch": 2030} {"train_loss": -12.5360107421875, "global_step": 341138, "epoch": 2030} {"train_loss": -12.313186645507812, "global_step": 341139, "epoch": 2030} {"train_loss": -12.416772842407227, "global_step": 341140, "epoch": 2030} {"train_loss": -12.516816139221191, "global_step": 341141, "epoch": 2030} {"train_loss": -12.455028533935547, "global_step": 341142, "epoch": 2030} {"train_loss": -12.596975326538086, "global_step": 341143, "epoch": 2030} {"train_loss": -12.434711456298828, "global_step": 341144, "epoch": 2030} {"train_loss": -12.546138763427734, "global_step": 341145, "epoch": 2030} {"train_loss": -12.49642562866211, "global_step": 341146, "epoch": 2030} {"train_loss": -12.437139511108398, "global_step": 341147, "epoch": 2030} {"train_loss": -12.425610542297363, "global_step": 341148, "epoch": 2030} {"train_loss": -12.198545455932617, "global_step": 341149, "epoch": 2030} {"train_loss": -12.508841514587402, "global_step": 341150, "epoch": 2030} {"train_loss": -12.388671875, "global_step": 341151, "epoch": 2030} {"train_loss": -11.975571632385254, "global_step": 341152, "epoch": 2030} {"train_loss": -12.115699768066406, "global_step": 341153, "epoch": 2030} {"train_loss": -12.247576713562012, "global_step": 341154, "epoch": 2030} {"train_loss": -12.616291046142578, "global_step": 341155, "epoch": 2030} {"train_loss": -12.455808639526367, "global_step": 341156, "epoch": 2030} {"train_loss": -12.320863723754883, "global_step": 341157, "epoch": 2030} {"train_loss": -12.478629112243652, "global_step": 341158, "epoch": 2030} {"train_loss": -12.41708755493164, "global_step": 341159, "epoch": 2030} {"train_loss": -12.517461776733398, "global_step": 341160, "epoch": 2030} {"train_loss": -12.091731071472168, "global_step": 341161, "epoch": 2030} {"train_loss": -12.21413803100586, "global_step": 341162, "epoch": 2030} {"train_loss": -12.62187385559082, "global_step": 341163, "epoch": 2030} {"train_loss": -12.410804748535156, "global_step": 341164, "epoch": 2030} {"train_loss": -12.390270233154297, "global_step": 341165, "epoch": 2030} {"train_loss": -12.002260208129883, "global_step": 341166, "epoch": 2030} {"train_loss": -12.481178283691406, "global_step": 341167, "epoch": 2030} {"train_loss": -12.445722579956055, "global_step": 341168, "epoch": 2030} {"train_loss": -12.476480484008789, "global_step": 341169, "epoch": 2030} {"train_loss": -12.201805114746094, "global_step": 341170, "epoch": 2030} {"train_loss": -12.66736125946045, "global_step": 341171, "epoch": 2030} {"train_loss": -12.373048782348633, "global_step": 341172, "epoch": 2030} {"train_loss": -12.381816864013672, "global_step": 341173, "epoch": 2030} {"train_loss": -12.696051597595215, "global_step": 341174, "epoch": 2030} {"train_loss": -12.424722671508789, "global_step": 341175, "epoch": 2030} {"train_loss": -12.218974113464355, "global_step": 341176, "epoch": 2030} {"train_loss": -12.227862358093262, "global_step": 341177, "epoch": 2030} {"train_loss": -12.42647647857666, "global_step": 341178, "epoch": 2030} {"train_loss": -12.623175621032715, "global_step": 341179, "epoch": 2030} {"train_loss": -12.060226440429688, "global_step": 341180, "epoch": 2030} {"train_loss": -12.029942512512207, "global_step": 341181, "epoch": 2030} {"train_loss": -12.254960060119629, "global_step": 341182, "epoch": 2030} {"train_loss": -12.217134475708008, "global_step": 341183, "epoch": 2030} {"train_loss": -12.411460876464844, "global_step": 341184, "epoch": 2030} {"train_loss": -12.172172546386719, "global_step": 341185, "epoch": 2030} {"train_loss": -11.627010345458984, "global_step": 341186, "epoch": 2030} {"train_loss": -12.119499206542969, "global_step": 341187, "epoch": 2030} {"train_loss": -11.084282875061035, "global_step": 341188, "epoch": 2030} {"train_loss": -12.260566711425781, "global_step": 341189, "epoch": 2030} {"train_loss": -11.221574783325195, "global_step": 341190, "epoch": 2030} {"train_loss": -11.960027694702148, "global_step": 341191, "epoch": 2030} {"train_loss": -11.039745330810547, "global_step": 341192, "epoch": 2030} {"train_loss": -11.052467346191406, "global_step": 341193, "epoch": 2030} {"train_loss": -10.566422462463379, "global_step": 341194, "epoch": 2030} {"train_loss": -10.37492561340332, "global_step": 341195, "epoch": 2030} {"train_loss": -12.051416397094727, "global_step": 341196, "epoch": 2030} {"train_loss": -11.135135650634766, "global_step": 341197, "epoch": 2030} {"train_loss": -9.930835723876953, "global_step": 341198, "epoch": 2030} {"train_loss": -11.237468719482422, "global_step": 341199, "epoch": 2030} {"train_loss": -9.436634063720703, "global_step": 341200, "epoch": 2030} {"train_loss": -7.62815523147583, "global_step": 341201, "epoch": 2030} {"train_loss": -8.425859451293945, "global_step": 341202, "epoch": 2030} {"train_loss": -10.588523864746094, "global_step": 341203, "epoch": 2030} {"train_loss": -7.33802604675293, "global_step": 341204, "epoch": 2030} {"train_loss": -9.168289184570312, "global_step": 341205, "epoch": 2030} {"train_loss": -9.82533073425293, "global_step": 341206, "epoch": 2030} {"train_loss": -11.739134564286186, "global_step": 341207, "epoch": 2030, "val_loss": 282499.875, "train_action_mse_error": 0.35713711380958557} {"train_loss": -10.95334243774414, "global_step": 341208, "epoch": 2031} {"train_loss": -11.275071144104004, "global_step": 341209, "epoch": 2031} {"train_loss": -11.22601318359375, "global_step": 341210, "epoch": 2031} {"train_loss": -9.984254837036133, "global_step": 341211, "epoch": 2031} {"train_loss": -11.247489929199219, "global_step": 341212, "epoch": 2031} {"train_loss": -11.246918678283691, "global_step": 341213, "epoch": 2031} {"train_loss": -11.246591567993164, "global_step": 341214, "epoch": 2031} {"train_loss": -10.612181663513184, "global_step": 341215, "epoch": 2031} {"train_loss": -10.698347091674805, "global_step": 341216, "epoch": 2031} {"train_loss": -11.029115676879883, "global_step": 341217, "epoch": 2031} {"train_loss": -9.863565444946289, "global_step": 341218, "epoch": 2031} {"train_loss": -11.189778327941895, "global_step": 341219, "epoch": 2031} {"train_loss": -10.351669311523438, "global_step": 341220, "epoch": 2031} {"train_loss": -10.328312873840332, "global_step": 341221, "epoch": 2031} {"train_loss": -10.570024490356445, "global_step": 341222, "epoch": 2031} {"train_loss": -10.153623580932617, "global_step": 341223, "epoch": 2031} {"train_loss": -11.330476760864258, "global_step": 341224, "epoch": 2031} {"train_loss": -10.316566467285156, "global_step": 341225, "epoch": 2031} {"train_loss": -11.493867874145508, "global_step": 341226, "epoch": 2031} {"train_loss": -10.360690116882324, "global_step": 341227, "epoch": 2031} {"train_loss": -11.955793380737305, "global_step": 341228, "epoch": 2031} {"train_loss": -11.011104583740234, "global_step": 341229, "epoch": 2031} {"train_loss": -11.965269088745117, "global_step": 341230, "epoch": 2031} {"train_loss": -11.037396430969238, "global_step": 341231, "epoch": 2031} {"train_loss": -12.05990982055664, "global_step": 341232, "epoch": 2031} {"train_loss": -11.393943786621094, "global_step": 341233, "epoch": 2031} {"train_loss": -11.986574172973633, "global_step": 341234, "epoch": 2031} {"train_loss": -11.450886726379395, "global_step": 341235, "epoch": 2031} {"train_loss": -11.75625228881836, "global_step": 341236, "epoch": 2031} {"train_loss": -11.35123348236084, "global_step": 341237, "epoch": 2031} {"train_loss": -11.75184440612793, "global_step": 341238, "epoch": 2031} {"train_loss": -11.441446304321289, "global_step": 341239, "epoch": 2031} {"train_loss": -11.907278060913086, "global_step": 341240, "epoch": 2031} {"train_loss": -11.462934494018555, "global_step": 341241, "epoch": 2031} {"train_loss": -11.753986358642578, "global_step": 341242, "epoch": 2031} {"train_loss": -11.288553237915039, "global_step": 341243, "epoch": 2031} {"train_loss": -11.661405563354492, "global_step": 341244, "epoch": 2031} {"train_loss": -11.364492416381836, "global_step": 341245, "epoch": 2031} {"train_loss": -11.582735061645508, "global_step": 341246, "epoch": 2031} {"train_loss": -11.374565124511719, "global_step": 341247, "epoch": 2031} {"train_loss": -11.691417694091797, "global_step": 341248, "epoch": 2031} {"train_loss": -11.856861114501953, "global_step": 341249, "epoch": 2031} {"train_loss": -12.007296562194824, "global_step": 341250, "epoch": 2031} {"train_loss": -11.572235107421875, "global_step": 341251, "epoch": 2031} {"train_loss": -11.960979461669922, "global_step": 341252, "epoch": 2031} {"train_loss": -11.93084716796875, "global_step": 341253, "epoch": 2031} {"train_loss": -12.207751274108887, "global_step": 341254, "epoch": 2031} {"train_loss": -11.892972946166992, "global_step": 341255, "epoch": 2031} {"train_loss": -12.008845329284668, "global_step": 341256, "epoch": 2031} {"train_loss": -11.96146011352539, "global_step": 341257, "epoch": 2031} {"train_loss": -11.979477882385254, "global_step": 341258, "epoch": 2031} {"train_loss": -11.614616394042969, "global_step": 341259, "epoch": 2031} {"train_loss": -11.981969833374023, "global_step": 341260, "epoch": 2031} {"train_loss": -11.866104125976562, "global_step": 341261, "epoch": 2031} {"train_loss": -11.955376625061035, "global_step": 341262, "epoch": 2031} {"train_loss": -11.809653282165527, "global_step": 341263, "epoch": 2031} {"train_loss": -11.687108993530273, "global_step": 341264, "epoch": 2031} {"train_loss": -11.81768798828125, "global_step": 341265, "epoch": 2031} {"train_loss": -11.805340766906738, "global_step": 341266, "epoch": 2031} {"train_loss": -11.793804168701172, "global_step": 341267, "epoch": 2031} {"train_loss": -11.956771850585938, "global_step": 341268, "epoch": 2031} {"train_loss": -11.856282234191895, "global_step": 341269, "epoch": 2031} {"train_loss": -12.208940505981445, "global_step": 341270, "epoch": 2031} {"train_loss": -11.910760879516602, "global_step": 341271, "epoch": 2031} {"train_loss": -12.223073959350586, "global_step": 341272, "epoch": 2031} {"train_loss": -12.338922500610352, "global_step": 341273, "epoch": 2031} {"train_loss": -11.957500457763672, "global_step": 341274, "epoch": 2031} {"train_loss": -12.140129089355469, "global_step": 341275, "epoch": 2031} {"train_loss": -11.989707946777344, "global_step": 341276, "epoch": 2031} {"train_loss": -12.269951820373535, "global_step": 341277, "epoch": 2031} {"train_loss": -11.979684829711914, "global_step": 341278, "epoch": 2031} {"train_loss": -12.288436889648438, "global_step": 341279, "epoch": 2031} {"train_loss": -12.373899459838867, "global_step": 341280, "epoch": 2031} {"train_loss": -12.32846736907959, "global_step": 341281, "epoch": 2031} {"train_loss": -12.244272232055664, "global_step": 341282, "epoch": 2031} {"train_loss": -12.28449821472168, "global_step": 341283, "epoch": 2031} {"train_loss": -12.499650955200195, "global_step": 341284, "epoch": 2031} {"train_loss": -12.085424423217773, "global_step": 341285, "epoch": 2031} {"train_loss": -12.35660457611084, "global_step": 341286, "epoch": 2031} {"train_loss": -12.209267616271973, "global_step": 341287, "epoch": 2031} {"train_loss": -12.151453018188477, "global_step": 341288, "epoch": 2031} {"train_loss": -12.257705688476562, "global_step": 341289, "epoch": 2031} {"train_loss": -12.187935829162598, "global_step": 341290, "epoch": 2031} {"train_loss": -12.248350143432617, "global_step": 341291, "epoch": 2031} {"train_loss": -12.10177993774414, "global_step": 341292, "epoch": 2031} {"train_loss": -12.287450790405273, "global_step": 341293, "epoch": 2031} {"train_loss": -12.349056243896484, "global_step": 341294, "epoch": 2031} {"train_loss": -12.265514373779297, "global_step": 341295, "epoch": 2031} {"train_loss": -12.436050415039062, "global_step": 341296, "epoch": 2031} {"train_loss": -12.44588565826416, "global_step": 341297, "epoch": 2031} {"train_loss": -12.321627616882324, "global_step": 341298, "epoch": 2031} {"train_loss": -12.511281967163086, "global_step": 341299, "epoch": 2031} {"train_loss": -12.333625793457031, "global_step": 341300, "epoch": 2031} {"train_loss": -12.309202194213867, "global_step": 341301, "epoch": 2031} {"train_loss": -12.09239673614502, "global_step": 341302, "epoch": 2031} {"train_loss": -12.320810317993164, "global_step": 341303, "epoch": 2031} {"train_loss": -12.535655975341797, "global_step": 341304, "epoch": 2031} {"train_loss": -12.356027603149414, "global_step": 341305, "epoch": 2031} {"train_loss": -12.28828239440918, "global_step": 341306, "epoch": 2031} {"train_loss": -12.447126388549805, "global_step": 341307, "epoch": 2031} {"train_loss": -12.270147323608398, "global_step": 341308, "epoch": 2031} {"train_loss": -12.585615158081055, "global_step": 341309, "epoch": 2031} {"train_loss": -12.511682510375977, "global_step": 341310, "epoch": 2031} {"train_loss": -12.552919387817383, "global_step": 341311, "epoch": 2031} {"train_loss": -12.072586059570312, "global_step": 341312, "epoch": 2031} {"train_loss": -12.326881408691406, "global_step": 341313, "epoch": 2031} {"train_loss": -12.196399688720703, "global_step": 341314, "epoch": 2031} {"train_loss": -11.644984245300293, "global_step": 341315, "epoch": 2031} {"train_loss": -11.869792938232422, "global_step": 341316, "epoch": 2031} {"train_loss": -12.22659969329834, "global_step": 341317, "epoch": 2031} {"train_loss": -11.893684387207031, "global_step": 341318, "epoch": 2031} {"train_loss": -11.92508316040039, "global_step": 341319, "epoch": 2031} {"train_loss": -11.907482147216797, "global_step": 341320, "epoch": 2031} {"train_loss": -11.632373809814453, "global_step": 341321, "epoch": 2031} {"train_loss": -10.4359769821167, "global_step": 341322, "epoch": 2031} {"train_loss": -11.195093154907227, "global_step": 341323, "epoch": 2031} {"train_loss": -11.547163009643555, "global_step": 341324, "epoch": 2031} {"train_loss": -9.119873046875, "global_step": 341325, "epoch": 2031} {"train_loss": -12.134756088256836, "global_step": 341326, "epoch": 2031} {"train_loss": -9.904537200927734, "global_step": 341327, "epoch": 2031} {"train_loss": -9.627416610717773, "global_step": 341328, "epoch": 2031} {"train_loss": -11.878543853759766, "global_step": 341329, "epoch": 2031} {"train_loss": -8.755267143249512, "global_step": 341330, "epoch": 2031} {"train_loss": -9.642512321472168, "global_step": 341331, "epoch": 2031} {"train_loss": -11.593515396118164, "global_step": 341332, "epoch": 2031} {"train_loss": -8.869010925292969, "global_step": 341333, "epoch": 2031} {"train_loss": -10.427504539489746, "global_step": 341334, "epoch": 2031} {"train_loss": -10.515867233276367, "global_step": 341335, "epoch": 2031} {"train_loss": -10.327842712402344, "global_step": 341336, "epoch": 2031} {"train_loss": -11.475228309631348, "global_step": 341337, "epoch": 2031} {"train_loss": -11.164726257324219, "global_step": 341338, "epoch": 2031} {"train_loss": -11.167386054992676, "global_step": 341339, "epoch": 2031} {"train_loss": -11.882328033447266, "global_step": 341340, "epoch": 2031} {"train_loss": -11.345132827758789, "global_step": 341341, "epoch": 2031} {"train_loss": -12.031158447265625, "global_step": 341342, "epoch": 2031} {"train_loss": -11.556100845336914, "global_step": 341343, "epoch": 2031} {"train_loss": -11.97111701965332, "global_step": 341344, "epoch": 2031} {"train_loss": -11.949955940246582, "global_step": 341345, "epoch": 2031} {"train_loss": -11.705533981323242, "global_step": 341346, "epoch": 2031} {"train_loss": -11.959379196166992, "global_step": 341347, "epoch": 2031} {"train_loss": -11.902778625488281, "global_step": 341348, "epoch": 2031} {"train_loss": -11.852564811706543, "global_step": 341349, "epoch": 2031} {"train_loss": -12.292980194091797, "global_step": 341350, "epoch": 2031} {"train_loss": -11.820286750793457, "global_step": 341351, "epoch": 2031} {"train_loss": -12.04713249206543, "global_step": 341352, "epoch": 2031} {"train_loss": -11.78309440612793, "global_step": 341353, "epoch": 2031} {"train_loss": -11.627241134643555, "global_step": 341354, "epoch": 2031} {"train_loss": -11.913105964660645, "global_step": 341355, "epoch": 2031} {"train_loss": -11.335498809814453, "global_step": 341356, "epoch": 2031} {"train_loss": -12.155372619628906, "global_step": 341357, "epoch": 2031} {"train_loss": -11.14473819732666, "global_step": 341358, "epoch": 2031} {"train_loss": -12.044538497924805, "global_step": 341359, "epoch": 2031} {"train_loss": -11.68958854675293, "global_step": 341360, "epoch": 2031} {"train_loss": -11.634453773498535, "global_step": 341361, "epoch": 2031} {"train_loss": -11.495000839233398, "global_step": 341362, "epoch": 2031} {"train_loss": -11.97524642944336, "global_step": 341363, "epoch": 2031} {"train_loss": -11.203523635864258, "global_step": 341364, "epoch": 2031} {"train_loss": -11.892016410827637, "global_step": 341365, "epoch": 2031} {"train_loss": -11.458728790283203, "global_step": 341366, "epoch": 2031} {"train_loss": -11.74403190612793, "global_step": 341367, "epoch": 2031} {"train_loss": -12.198894500732422, "global_step": 341368, "epoch": 2031} {"train_loss": -11.675786972045898, "global_step": 341369, "epoch": 2031} {"train_loss": -11.811925888061523, "global_step": 341370, "epoch": 2031} {"train_loss": -11.866159439086914, "global_step": 341371, "epoch": 2031} {"train_loss": -11.987234115600586, "global_step": 341372, "epoch": 2031} {"train_loss": -12.089973449707031, "global_step": 341373, "epoch": 2031} {"train_loss": -11.950895309448242, "global_step": 341374, "epoch": 2031} {"train_loss": -11.658193128449577, "global_step": 341375, "epoch": 2031, "val_loss": 276990.3125} {"train_loss": -11.799551963806152, "global_step": 341376, "epoch": 2032} {"train_loss": -11.928834915161133, "global_step": 341377, "epoch": 2032} {"train_loss": -10.889348983764648, "global_step": 341378, "epoch": 2032} {"train_loss": -12.044954299926758, "global_step": 341379, "epoch": 2032} {"train_loss": -10.688284873962402, "global_step": 341380, "epoch": 2032} {"train_loss": -10.58763313293457, "global_step": 341381, "epoch": 2032} {"train_loss": -11.463329315185547, "global_step": 341382, "epoch": 2032} {"train_loss": -10.086551666259766, "global_step": 341383, "epoch": 2032} {"train_loss": -10.569143295288086, "global_step": 341384, "epoch": 2032} {"train_loss": -9.7023344039917, "global_step": 341385, "epoch": 2032} {"train_loss": -9.980253219604492, "global_step": 341386, "epoch": 2032} {"train_loss": -9.467453002929688, "global_step": 341387, "epoch": 2032} {"train_loss": -11.994982719421387, "global_step": 341388, "epoch": 2032} {"train_loss": -8.946100234985352, "global_step": 341389, "epoch": 2032} {"train_loss": -11.508577346801758, "global_step": 341390, "epoch": 2032} {"train_loss": -10.330085754394531, "global_step": 341391, "epoch": 2032} {"train_loss": -11.432373046875, "global_step": 341392, "epoch": 2032} {"train_loss": -10.036565780639648, "global_step": 341393, "epoch": 2032} {"train_loss": -11.823989868164062, "global_step": 341394, "epoch": 2032} {"train_loss": -9.995057106018066, "global_step": 341395, "epoch": 2032} {"train_loss": -12.048099517822266, "global_step": 341396, "epoch": 2032} {"train_loss": -10.829687118530273, "global_step": 341397, "epoch": 2032} {"train_loss": -11.893393516540527, "global_step": 341398, "epoch": 2032} {"train_loss": -11.466496467590332, "global_step": 341399, "epoch": 2032} {"train_loss": -11.746465682983398, "global_step": 341400, "epoch": 2032} {"train_loss": -11.692570686340332, "global_step": 341401, "epoch": 2032} {"train_loss": -11.877187728881836, "global_step": 341402, "epoch": 2032} {"train_loss": -11.693927764892578, "global_step": 341403, "epoch": 2032} {"train_loss": -11.540351867675781, "global_step": 341404, "epoch": 2032} {"train_loss": -11.820011138916016, "global_step": 341405, "epoch": 2032} {"train_loss": -11.249744415283203, "global_step": 341406, "epoch": 2032} {"train_loss": -12.111773490905762, "global_step": 341407, "epoch": 2032} {"train_loss": -11.66916275024414, "global_step": 341408, "epoch": 2032} {"train_loss": -11.982891082763672, "global_step": 341409, "epoch": 2032} {"train_loss": -11.79383659362793, "global_step": 341410, "epoch": 2032} {"train_loss": -12.00238037109375, "global_step": 341411, "epoch": 2032} {"train_loss": -11.608280181884766, "global_step": 341412, "epoch": 2032} {"train_loss": -12.091875076293945, "global_step": 341413, "epoch": 2032} {"train_loss": -12.067703247070312, "global_step": 341414, "epoch": 2032} {"train_loss": -12.190564155578613, "global_step": 341415, "epoch": 2032} {"train_loss": -11.941362380981445, "global_step": 341416, "epoch": 2032} {"train_loss": -12.175251007080078, "global_step": 341417, "epoch": 2032} {"train_loss": -12.157179832458496, "global_step": 341418, "epoch": 2032} {"train_loss": -11.895235061645508, "global_step": 341419, "epoch": 2032} {"train_loss": -12.107454299926758, "global_step": 341420, "epoch": 2032} {"train_loss": -12.104488372802734, "global_step": 341421, "epoch": 2032} {"train_loss": -11.940114974975586, "global_step": 341422, "epoch": 2032} {"train_loss": -12.065896034240723, "global_step": 341423, "epoch": 2032} {"train_loss": -12.119609832763672, "global_step": 341424, "epoch": 2032} {"train_loss": -12.317737579345703, "global_step": 341425, "epoch": 2032} {"train_loss": -12.067983627319336, "global_step": 341426, "epoch": 2032} {"train_loss": -12.292976379394531, "global_step": 341427, "epoch": 2032} {"train_loss": -12.428738594055176, "global_step": 341428, "epoch": 2032} {"train_loss": -12.315596580505371, "global_step": 341429, "epoch": 2032} {"train_loss": -12.149225234985352, "global_step": 341430, "epoch": 2032} {"train_loss": -12.483924865722656, "global_step": 341431, "epoch": 2032} {"train_loss": -12.173315048217773, "global_step": 341432, "epoch": 2032} {"train_loss": -12.266130447387695, "global_step": 341433, "epoch": 2032} {"train_loss": -12.099027633666992, "global_step": 341434, "epoch": 2032} {"train_loss": -12.29952621459961, "global_step": 341435, "epoch": 2032} {"train_loss": -12.263042449951172, "global_step": 341436, "epoch": 2032} {"train_loss": -12.299038887023926, "global_step": 341437, "epoch": 2032} {"train_loss": -12.456453323364258, "global_step": 341438, "epoch": 2032} {"train_loss": -12.609590530395508, "global_step": 341439, "epoch": 2032} {"train_loss": -12.369104385375977, "global_step": 341440, "epoch": 2032} {"train_loss": -12.120990753173828, "global_step": 341441, "epoch": 2032} {"train_loss": -12.442235946655273, "global_step": 341442, "epoch": 2032} {"train_loss": -12.422012329101562, "global_step": 341443, "epoch": 2032} {"train_loss": -12.40694522857666, "global_step": 341444, "epoch": 2032} {"train_loss": -12.504327774047852, "global_step": 341445, "epoch": 2032} {"train_loss": -12.629274368286133, "global_step": 341446, "epoch": 2032} {"train_loss": -12.70516586303711, "global_step": 341447, "epoch": 2032} {"train_loss": -12.60956859588623, "global_step": 341448, "epoch": 2032} {"train_loss": -12.589733123779297, "global_step": 341449, "epoch": 2032} {"train_loss": -12.58470630645752, "global_step": 341450, "epoch": 2032} {"train_loss": -12.045955657958984, "global_step": 341451, "epoch": 2032} {"train_loss": -12.72875690460205, "global_step": 341452, "epoch": 2032} {"train_loss": -12.451308250427246, "global_step": 341453, "epoch": 2032} {"train_loss": -12.587404251098633, "global_step": 341454, "epoch": 2032} {"train_loss": -12.568792343139648, "global_step": 341455, "epoch": 2032} {"train_loss": -12.59185791015625, "global_step": 341456, "epoch": 2032} {"train_loss": -12.564519882202148, "global_step": 341457, "epoch": 2032} {"train_loss": -12.591815948486328, "global_step": 341458, "epoch": 2032} {"train_loss": -12.469182014465332, "global_step": 341459, "epoch": 2032} {"train_loss": -12.650501251220703, "global_step": 341460, "epoch": 2032} {"train_loss": -12.49740982055664, "global_step": 341461, "epoch": 2032} {"train_loss": -12.608360290527344, "global_step": 341462, "epoch": 2032} {"train_loss": -12.562981605529785, "global_step": 341463, "epoch": 2032} {"train_loss": -12.866968154907227, "global_step": 341464, "epoch": 2032} {"train_loss": -12.702766418457031, "global_step": 341465, "epoch": 2032} {"train_loss": -12.735881805419922, "global_step": 341466, "epoch": 2032} {"train_loss": -12.527027130126953, "global_step": 341467, "epoch": 2032} {"train_loss": -12.750141143798828, "global_step": 341468, "epoch": 2032} {"train_loss": -12.822044372558594, "global_step": 341469, "epoch": 2032} {"train_loss": -12.841071128845215, "global_step": 341470, "epoch": 2032} {"train_loss": -12.762639045715332, "global_step": 341471, "epoch": 2032} {"train_loss": -12.575898170471191, "global_step": 341472, "epoch": 2032} {"train_loss": -12.482477188110352, "global_step": 341473, "epoch": 2032} {"train_loss": -12.81248950958252, "global_step": 341474, "epoch": 2032} {"train_loss": -12.80383014678955, "global_step": 341475, "epoch": 2032} {"train_loss": -12.766812324523926, "global_step": 341476, "epoch": 2032} {"train_loss": -12.792773246765137, "global_step": 341477, "epoch": 2032} {"train_loss": -12.811051368713379, "global_step": 341478, "epoch": 2032} {"train_loss": -12.844182014465332, "global_step": 341479, "epoch": 2032} {"train_loss": -12.780938148498535, "global_step": 341480, "epoch": 2032} {"train_loss": -12.952890396118164, "global_step": 341481, "epoch": 2032} {"train_loss": -12.70544719696045, "global_step": 341482, "epoch": 2032} {"train_loss": -12.627176284790039, "global_step": 341483, "epoch": 2032} {"train_loss": -12.609472274780273, "global_step": 341484, "epoch": 2032} {"train_loss": -12.660061836242676, "global_step": 341485, "epoch": 2032} {"train_loss": -12.038190841674805, "global_step": 341486, "epoch": 2032} {"train_loss": -12.040327072143555, "global_step": 341487, "epoch": 2032} {"train_loss": -10.497976303100586, "global_step": 341488, "epoch": 2032} {"train_loss": -10.79726505279541, "global_step": 341489, "epoch": 2032} {"train_loss": -12.577162742614746, "global_step": 341490, "epoch": 2032} {"train_loss": -9.758411407470703, "global_step": 341491, "epoch": 2032} {"train_loss": -8.595667839050293, "global_step": 341492, "epoch": 2032} {"train_loss": -11.562044143676758, "global_step": 341493, "epoch": 2032} {"train_loss": -6.205990791320801, "global_step": 341494, "epoch": 2032} {"train_loss": -6.349812030792236, "global_step": 341495, "epoch": 2032} {"train_loss": -6.315467834472656, "global_step": 341496, "epoch": 2032} {"train_loss": -5.8284912109375, "global_step": 341497, "epoch": 2032} {"train_loss": -5.436588287353516, "global_step": 341498, "epoch": 2032} {"train_loss": -5.704957485198975, "global_step": 341499, "epoch": 2032} {"train_loss": -6.409795761108398, "global_step": 341500, "epoch": 2032} {"train_loss": -5.757221221923828, "global_step": 341501, "epoch": 2032} {"train_loss": -5.473606109619141, "global_step": 341502, "epoch": 2032} {"train_loss": -5.930614471435547, "global_step": 341503, "epoch": 2032} {"train_loss": -7.535277366638184, "global_step": 341504, "epoch": 2032} {"train_loss": -6.59160041809082, "global_step": 341505, "epoch": 2032} {"train_loss": -6.842254638671875, "global_step": 341506, "epoch": 2032} {"train_loss": -6.907976150512695, "global_step": 341507, "epoch": 2032} {"train_loss": -7.074053764343262, "global_step": 341508, "epoch": 2032} {"train_loss": -8.696304321289062, "global_step": 341509, "epoch": 2032} {"train_loss": -7.6492719650268555, "global_step": 341510, "epoch": 2032} {"train_loss": -8.133743286132812, "global_step": 341511, "epoch": 2032} {"train_loss": -8.376299858093262, "global_step": 341512, "epoch": 2032} {"train_loss": -9.251888275146484, "global_step": 341513, "epoch": 2032} {"train_loss": -8.73054313659668, "global_step": 341514, "epoch": 2032} {"train_loss": -8.816333770751953, "global_step": 341515, "epoch": 2032} {"train_loss": -8.854416847229004, "global_step": 341516, "epoch": 2032} {"train_loss": -8.9005126953125, "global_step": 341517, "epoch": 2032} {"train_loss": -8.759864807128906, "global_step": 341518, "epoch": 2032} {"train_loss": -9.360264778137207, "global_step": 341519, "epoch": 2032} {"train_loss": -10.23298454284668, "global_step": 341520, "epoch": 2032} {"train_loss": -10.329286575317383, "global_step": 341521, "epoch": 2032} {"train_loss": -10.360483169555664, "global_step": 341522, "epoch": 2032} {"train_loss": -9.286182403564453, "global_step": 341523, "epoch": 2032} {"train_loss": -10.573858261108398, "global_step": 341524, "epoch": 2032} {"train_loss": -9.817540168762207, "global_step": 341525, "epoch": 2032} {"train_loss": -10.715790748596191, "global_step": 341526, "epoch": 2032} {"train_loss": -10.368021011352539, "global_step": 341527, "epoch": 2032} {"train_loss": -11.023444175720215, "global_step": 341528, "epoch": 2032} {"train_loss": -10.714825630187988, "global_step": 341529, "epoch": 2032} {"train_loss": -11.27519416809082, "global_step": 341530, "epoch": 2032} {"train_loss": -11.115148544311523, "global_step": 341531, "epoch": 2032} {"train_loss": -10.915908813476562, "global_step": 341532, "epoch": 2032} {"train_loss": -11.330787658691406, "global_step": 341533, "epoch": 2032} {"train_loss": -11.384353637695312, "global_step": 341534, "epoch": 2032} {"train_loss": -10.863739013671875, "global_step": 341535, "epoch": 2032} {"train_loss": -11.715360641479492, "global_step": 341536, "epoch": 2032} {"train_loss": -11.233983039855957, "global_step": 341537, "epoch": 2032} {"train_loss": -11.259864807128906, "global_step": 341538, "epoch": 2032} {"train_loss": -11.41067886352539, "global_step": 341539, "epoch": 2032} {"train_loss": -10.83871841430664, "global_step": 341540, "epoch": 2032} {"train_loss": -11.459980010986328, "global_step": 341541, "epoch": 2032} {"train_loss": -10.287351608276367, "global_step": 341542, "epoch": 2032} {"train_loss": -11.083725367273603, "global_step": 341543, "epoch": 2032, "val_loss": 282347.4375} {"train_loss": -11.052407264709473, "global_step": 341544, "epoch": 2033} {"train_loss": -11.528486251831055, "global_step": 341545, "epoch": 2033} {"train_loss": -11.14747142791748, "global_step": 341546, "epoch": 2033} {"train_loss": -11.64459228515625, "global_step": 341547, "epoch": 2033} {"train_loss": -10.71944808959961, "global_step": 341548, "epoch": 2033} {"train_loss": -11.73859977722168, "global_step": 341549, "epoch": 2033} {"train_loss": -10.91110610961914, "global_step": 341550, "epoch": 2033} {"train_loss": -11.61215591430664, "global_step": 341551, "epoch": 2033} {"train_loss": -10.934097290039062, "global_step": 341552, "epoch": 2033} {"train_loss": -11.406646728515625, "global_step": 341553, "epoch": 2033} {"train_loss": -11.509237289428711, "global_step": 341554, "epoch": 2033} {"train_loss": -11.486069679260254, "global_step": 341555, "epoch": 2033} {"train_loss": -11.43055534362793, "global_step": 341556, "epoch": 2033} {"train_loss": -11.592676162719727, "global_step": 341557, "epoch": 2033} {"train_loss": -11.80842399597168, "global_step": 341558, "epoch": 2033} {"train_loss": -11.925568580627441, "global_step": 341559, "epoch": 2033} {"train_loss": -11.889091491699219, "global_step": 341560, "epoch": 2033} {"train_loss": -11.446104049682617, "global_step": 341561, "epoch": 2033} {"train_loss": -12.21237564086914, "global_step": 341562, "epoch": 2033} {"train_loss": -11.758764266967773, "global_step": 341563, "epoch": 2033} {"train_loss": -11.440535545349121, "global_step": 341564, "epoch": 2033} {"train_loss": -11.932560920715332, "global_step": 341565, "epoch": 2033} {"train_loss": -11.633708953857422, "global_step": 341566, "epoch": 2033} {"train_loss": -11.89708423614502, "global_step": 341567, "epoch": 2033} {"train_loss": -11.669590950012207, "global_step": 341568, "epoch": 2033} {"train_loss": -11.939958572387695, "global_step": 341569, "epoch": 2033} {"train_loss": -11.767898559570312, "global_step": 341570, "epoch": 2033} {"train_loss": -11.840555191040039, "global_step": 341571, "epoch": 2033} {"train_loss": -12.024551391601562, "global_step": 341572, "epoch": 2033} {"train_loss": -12.091896057128906, "global_step": 341573, "epoch": 2033} {"train_loss": -11.667366027832031, "global_step": 341574, "epoch": 2033} {"train_loss": -12.112309455871582, "global_step": 341575, "epoch": 2033} {"train_loss": -11.618330001831055, "global_step": 341576, "epoch": 2033} {"train_loss": -12.182836532592773, "global_step": 341577, "epoch": 2033} {"train_loss": -11.859843254089355, "global_step": 341578, "epoch": 2033} {"train_loss": -11.874075889587402, "global_step": 341579, "epoch": 2033} {"train_loss": -12.210982322692871, "global_step": 341580, "epoch": 2033} {"train_loss": -11.944478034973145, "global_step": 341581, "epoch": 2033} {"train_loss": -12.186237335205078, "global_step": 341582, "epoch": 2033} {"train_loss": -12.103195190429688, "global_step": 341583, "epoch": 2033} {"train_loss": -11.989261627197266, "global_step": 341584, "epoch": 2033} {"train_loss": -12.24356460571289, "global_step": 341585, "epoch": 2033} {"train_loss": -12.156512260437012, "global_step": 341586, "epoch": 2033} {"train_loss": -11.991668701171875, "global_step": 341587, "epoch": 2033} {"train_loss": -12.244462013244629, "global_step": 341588, "epoch": 2033} {"train_loss": -12.069750785827637, "global_step": 341589, "epoch": 2033} {"train_loss": -12.194852828979492, "global_step": 341590, "epoch": 2033} {"train_loss": -12.342253684997559, "global_step": 341591, "epoch": 2033} {"train_loss": -12.186586380004883, "global_step": 341592, "epoch": 2033} {"train_loss": -11.965375900268555, "global_step": 341593, "epoch": 2033} {"train_loss": -12.310972213745117, "global_step": 341594, "epoch": 2033} {"train_loss": -11.691583633422852, "global_step": 341595, "epoch": 2033} {"train_loss": -11.575180053710938, "global_step": 341596, "epoch": 2033} {"train_loss": -12.027749061584473, "global_step": 341597, "epoch": 2033} {"train_loss": -12.251379013061523, "global_step": 341598, "epoch": 2033} {"train_loss": -11.457808494567871, "global_step": 341599, "epoch": 2033} {"train_loss": -12.338311195373535, "global_step": 341600, "epoch": 2033} {"train_loss": -12.13575553894043, "global_step": 341601, "epoch": 2033} {"train_loss": -12.168634414672852, "global_step": 341602, "epoch": 2033} {"train_loss": -12.511784553527832, "global_step": 341603, "epoch": 2033} {"train_loss": -12.331466674804688, "global_step": 341604, "epoch": 2033} {"train_loss": -12.13076400756836, "global_step": 341605, "epoch": 2033} {"train_loss": -12.281631469726562, "global_step": 341606, "epoch": 2033} {"train_loss": -12.274081230163574, "global_step": 341607, "epoch": 2033} {"train_loss": -11.925055503845215, "global_step": 341608, "epoch": 2033} {"train_loss": -12.501372337341309, "global_step": 341609, "epoch": 2033} {"train_loss": -11.859768867492676, "global_step": 341610, "epoch": 2033} {"train_loss": -11.572223663330078, "global_step": 341611, "epoch": 2033} {"train_loss": -12.020573616027832, "global_step": 341612, "epoch": 2033} {"train_loss": -12.408882141113281, "global_step": 341613, "epoch": 2033} {"train_loss": -11.890518188476562, "global_step": 341614, "epoch": 2033} {"train_loss": -12.077150344848633, "global_step": 341615, "epoch": 2033} {"train_loss": -12.527862548828125, "global_step": 341616, "epoch": 2033} {"train_loss": -12.03520679473877, "global_step": 341617, "epoch": 2033} {"train_loss": -12.046873092651367, "global_step": 341618, "epoch": 2033} {"train_loss": -12.472149848937988, "global_step": 341619, "epoch": 2033} {"train_loss": -12.303863525390625, "global_step": 341620, "epoch": 2033} {"train_loss": -12.093111038208008, "global_step": 341621, "epoch": 2033} {"train_loss": -12.215644836425781, "global_step": 341622, "epoch": 2033} {"train_loss": -12.056610107421875, "global_step": 341623, "epoch": 2033} {"train_loss": -11.644203186035156, "global_step": 341624, "epoch": 2033} {"train_loss": -12.234888076782227, "global_step": 341625, "epoch": 2033} {"train_loss": -12.19774055480957, "global_step": 341626, "epoch": 2033} {"train_loss": -12.07934856414795, "global_step": 341627, "epoch": 2033} {"train_loss": -12.592047691345215, "global_step": 341628, "epoch": 2033} {"train_loss": -12.43798542022705, "global_step": 341629, "epoch": 2033} {"train_loss": -12.169109344482422, "global_step": 341630, "epoch": 2033} {"train_loss": -12.06164836883545, "global_step": 341631, "epoch": 2033} {"train_loss": -12.411155700683594, "global_step": 341632, "epoch": 2033} {"train_loss": -11.9540433883667, "global_step": 341633, "epoch": 2033} {"train_loss": -11.884440422058105, "global_step": 341634, "epoch": 2033} {"train_loss": -12.252708435058594, "global_step": 341635, "epoch": 2033} {"train_loss": -12.287826538085938, "global_step": 341636, "epoch": 2033} {"train_loss": -11.934488296508789, "global_step": 341637, "epoch": 2033} {"train_loss": -12.117053031921387, "global_step": 341638, "epoch": 2033} {"train_loss": -11.992918968200684, "global_step": 341639, "epoch": 2033} {"train_loss": -12.381769180297852, "global_step": 341640, "epoch": 2033} {"train_loss": -11.892804145812988, "global_step": 341641, "epoch": 2033} {"train_loss": -12.196949005126953, "global_step": 341642, "epoch": 2033} {"train_loss": -11.539871215820312, "global_step": 341643, "epoch": 2033} {"train_loss": -11.821529388427734, "global_step": 341644, "epoch": 2033} {"train_loss": -10.636903762817383, "global_step": 341645, "epoch": 2033} {"train_loss": -11.321298599243164, "global_step": 341646, "epoch": 2033} {"train_loss": -11.230541229248047, "global_step": 341647, "epoch": 2033} {"train_loss": -10.54587173461914, "global_step": 341648, "epoch": 2033} {"train_loss": -10.821659088134766, "global_step": 341649, "epoch": 2033} {"train_loss": -11.42573356628418, "global_step": 341650, "epoch": 2033} {"train_loss": -9.071124076843262, "global_step": 341651, "epoch": 2033} {"train_loss": -8.964159965515137, "global_step": 341652, "epoch": 2033} {"train_loss": -10.364575386047363, "global_step": 341653, "epoch": 2033} {"train_loss": -10.02688980102539, "global_step": 341654, "epoch": 2033} {"train_loss": -10.275930404663086, "global_step": 341655, "epoch": 2033} {"train_loss": -10.593612670898438, "global_step": 341656, "epoch": 2033} {"train_loss": -10.489367485046387, "global_step": 341657, "epoch": 2033} {"train_loss": -10.275022506713867, "global_step": 341658, "epoch": 2033} {"train_loss": -11.345010757446289, "global_step": 341659, "epoch": 2033} {"train_loss": -9.641048431396484, "global_step": 341660, "epoch": 2033} {"train_loss": -11.015068054199219, "global_step": 341661, "epoch": 2033} {"train_loss": -9.052214622497559, "global_step": 341662, "epoch": 2033} {"train_loss": -10.940191268920898, "global_step": 341663, "epoch": 2033} {"train_loss": -10.548295974731445, "global_step": 341664, "epoch": 2033} {"train_loss": -10.806295394897461, "global_step": 341665, "epoch": 2033} {"train_loss": -11.539773941040039, "global_step": 341666, "epoch": 2033} {"train_loss": -10.718212127685547, "global_step": 341667, "epoch": 2033} {"train_loss": -11.308990478515625, "global_step": 341668, "epoch": 2033} {"train_loss": -11.091375350952148, "global_step": 341669, "epoch": 2033} {"train_loss": -11.569623947143555, "global_step": 341670, "epoch": 2033} {"train_loss": -10.717142105102539, "global_step": 341671, "epoch": 2033} {"train_loss": -11.884511947631836, "global_step": 341672, "epoch": 2033} {"train_loss": -11.164405822753906, "global_step": 341673, "epoch": 2033} {"train_loss": -11.932353019714355, "global_step": 341674, "epoch": 2033} {"train_loss": -11.416759490966797, "global_step": 341675, "epoch": 2033} {"train_loss": -11.533145904541016, "global_step": 341676, "epoch": 2033} {"train_loss": -12.035077095031738, "global_step": 341677, "epoch": 2033} {"train_loss": -11.797652244567871, "global_step": 341678, "epoch": 2033} {"train_loss": -11.889081954956055, "global_step": 341679, "epoch": 2033} {"train_loss": -11.55911636352539, "global_step": 341680, "epoch": 2033} {"train_loss": -11.982889175415039, "global_step": 341681, "epoch": 2033} {"train_loss": -11.679603576660156, "global_step": 341682, "epoch": 2033} {"train_loss": -11.764122009277344, "global_step": 341683, "epoch": 2033} {"train_loss": -12.041646957397461, "global_step": 341684, "epoch": 2033} {"train_loss": -12.121721267700195, "global_step": 341685, "epoch": 2033} {"train_loss": -11.863077163696289, "global_step": 341686, "epoch": 2033} {"train_loss": -11.872356414794922, "global_step": 341687, "epoch": 2033} {"train_loss": -11.96567153930664, "global_step": 341688, "epoch": 2033} {"train_loss": -12.075698852539062, "global_step": 341689, "epoch": 2033} {"train_loss": -11.702592849731445, "global_step": 341690, "epoch": 2033} {"train_loss": -12.037531852722168, "global_step": 341691, "epoch": 2033} {"train_loss": -12.014326095581055, "global_step": 341692, "epoch": 2033} {"train_loss": -12.121906280517578, "global_step": 341693, "epoch": 2033} {"train_loss": -12.098716735839844, "global_step": 341694, "epoch": 2033} {"train_loss": -11.981935501098633, "global_step": 341695, "epoch": 2033} {"train_loss": -12.336593627929688, "global_step": 341696, "epoch": 2033} {"train_loss": -12.258089065551758, "global_step": 341697, "epoch": 2033} {"train_loss": -12.025142669677734, "global_step": 341698, "epoch": 2033} {"train_loss": -12.205164909362793, "global_step": 341699, "epoch": 2033} {"train_loss": -12.419763565063477, "global_step": 341700, "epoch": 2033} {"train_loss": -12.205392837524414, "global_step": 341701, "epoch": 2033} {"train_loss": -12.15639591217041, "global_step": 341702, "epoch": 2033} {"train_loss": -12.280593872070312, "global_step": 341703, "epoch": 2033} {"train_loss": -12.066389083862305, "global_step": 341704, "epoch": 2033} {"train_loss": -12.186553001403809, "global_step": 341705, "epoch": 2033} {"train_loss": -12.084778785705566, "global_step": 341706, "epoch": 2033} {"train_loss": -12.24741268157959, "global_step": 341707, "epoch": 2033} {"train_loss": -12.266071319580078, "global_step": 341708, "epoch": 2033} {"train_loss": -12.262968063354492, "global_step": 341709, "epoch": 2033} {"train_loss": -12.349224090576172, "global_step": 341710, "epoch": 2033} {"train_loss": -11.745016166142054, "global_step": 341711, "epoch": 2033, "val_loss": 285526.46875} {"train_loss": -12.236303329467773, "global_step": 341712, "epoch": 2034} {"train_loss": -12.378288269042969, "global_step": 341713, "epoch": 2034} {"train_loss": -12.374434471130371, "global_step": 341714, "epoch": 2034} {"train_loss": -12.312660217285156, "global_step": 341715, "epoch": 2034} {"train_loss": -12.498414993286133, "global_step": 341716, "epoch": 2034} {"train_loss": -12.25528335571289, "global_step": 341717, "epoch": 2034} {"train_loss": -12.428211212158203, "global_step": 341718, "epoch": 2034} {"train_loss": -12.298812866210938, "global_step": 341719, "epoch": 2034} {"train_loss": -12.366921424865723, "global_step": 341720, "epoch": 2034} {"train_loss": -12.431447982788086, "global_step": 341721, "epoch": 2034} {"train_loss": -12.210494995117188, "global_step": 341722, "epoch": 2034} {"train_loss": -12.524266242980957, "global_step": 341723, "epoch": 2034} {"train_loss": -12.329228401184082, "global_step": 341724, "epoch": 2034} {"train_loss": -12.411595344543457, "global_step": 341725, "epoch": 2034} {"train_loss": -12.372007369995117, "global_step": 341726, "epoch": 2034} {"train_loss": -12.359573364257812, "global_step": 341727, "epoch": 2034} {"train_loss": -12.409799575805664, "global_step": 341728, "epoch": 2034} {"train_loss": -12.538124084472656, "global_step": 341729, "epoch": 2034} {"train_loss": -12.311439514160156, "global_step": 341730, "epoch": 2034} {"train_loss": -12.328401565551758, "global_step": 341731, "epoch": 2034} {"train_loss": -12.000557899475098, "global_step": 341732, "epoch": 2034} {"train_loss": -12.49622631072998, "global_step": 341733, "epoch": 2034} {"train_loss": -11.972589492797852, "global_step": 341734, "epoch": 2034} {"train_loss": -12.386747360229492, "global_step": 341735, "epoch": 2034} {"train_loss": -12.196311950683594, "global_step": 341736, "epoch": 2034} {"train_loss": -11.937616348266602, "global_step": 341737, "epoch": 2034} {"train_loss": -12.220909118652344, "global_step": 341738, "epoch": 2034} {"train_loss": -11.91474723815918, "global_step": 341739, "epoch": 2034} {"train_loss": -12.267793655395508, "global_step": 341740, "epoch": 2034} {"train_loss": -11.910903930664062, "global_step": 341741, "epoch": 2034} {"train_loss": -12.243795394897461, "global_step": 341742, "epoch": 2034} {"train_loss": -12.102869033813477, "global_step": 341743, "epoch": 2034} {"train_loss": -12.269357681274414, "global_step": 341744, "epoch": 2034} {"train_loss": -12.364836692810059, "global_step": 341745, "epoch": 2034} {"train_loss": -12.174602508544922, "global_step": 341746, "epoch": 2034} {"train_loss": -12.075835227966309, "global_step": 341747, "epoch": 2034} {"train_loss": -12.51319694519043, "global_step": 341748, "epoch": 2034} {"train_loss": -12.445094108581543, "global_step": 341749, "epoch": 2034} {"train_loss": -11.91926383972168, "global_step": 341750, "epoch": 2034} {"train_loss": -11.558237075805664, "global_step": 341751, "epoch": 2034} {"train_loss": -12.32810115814209, "global_step": 341752, "epoch": 2034} {"train_loss": -11.83145523071289, "global_step": 341753, "epoch": 2034} {"train_loss": -11.272754669189453, "global_step": 341754, "epoch": 2034} {"train_loss": -12.186129570007324, "global_step": 341755, "epoch": 2034} {"train_loss": -12.441963195800781, "global_step": 341756, "epoch": 2034} {"train_loss": -11.733804702758789, "global_step": 341757, "epoch": 2034} {"train_loss": -11.956460952758789, "global_step": 341758, "epoch": 2034} {"train_loss": -12.126129150390625, "global_step": 341759, "epoch": 2034} {"train_loss": -12.043655395507812, "global_step": 341760, "epoch": 2034} {"train_loss": -12.249613761901855, "global_step": 341761, "epoch": 2034} {"train_loss": -11.992138862609863, "global_step": 341762, "epoch": 2034} {"train_loss": -12.072843551635742, "global_step": 341763, "epoch": 2034} {"train_loss": -12.230093002319336, "global_step": 341764, "epoch": 2034} {"train_loss": -11.878738403320312, "global_step": 341765, "epoch": 2034} {"train_loss": -12.298266410827637, "global_step": 341766, "epoch": 2034} {"train_loss": -12.342870712280273, "global_step": 341767, "epoch": 2034} {"train_loss": -12.131244659423828, "global_step": 341768, "epoch": 2034} {"train_loss": -12.373628616333008, "global_step": 341769, "epoch": 2034} {"train_loss": -12.323781967163086, "global_step": 341770, "epoch": 2034} {"train_loss": -12.277044296264648, "global_step": 341771, "epoch": 2034} {"train_loss": -12.57011604309082, "global_step": 341772, "epoch": 2034} {"train_loss": -11.65285873413086, "global_step": 341773, "epoch": 2034} {"train_loss": -12.014127731323242, "global_step": 341774, "epoch": 2034} {"train_loss": -11.901151657104492, "global_step": 341775, "epoch": 2034} {"train_loss": -12.600532531738281, "global_step": 341776, "epoch": 2034} {"train_loss": -12.175634384155273, "global_step": 341777, "epoch": 2034} {"train_loss": -12.382166862487793, "global_step": 341778, "epoch": 2034} {"train_loss": -11.789152145385742, "global_step": 341779, "epoch": 2034} {"train_loss": -12.240118026733398, "global_step": 341780, "epoch": 2034} {"train_loss": -12.210067749023438, "global_step": 341781, "epoch": 2034} {"train_loss": -12.146684646606445, "global_step": 341782, "epoch": 2034} {"train_loss": -12.269709587097168, "global_step": 341783, "epoch": 2034} {"train_loss": -11.960783004760742, "global_step": 341784, "epoch": 2034} {"train_loss": -12.183188438415527, "global_step": 341785, "epoch": 2034} {"train_loss": -12.038843154907227, "global_step": 341786, "epoch": 2034} {"train_loss": -12.091437339782715, "global_step": 341787, "epoch": 2034} {"train_loss": -12.375887870788574, "global_step": 341788, "epoch": 2034} {"train_loss": -12.297243118286133, "global_step": 341789, "epoch": 2034} {"train_loss": -12.375001907348633, "global_step": 341790, "epoch": 2034} {"train_loss": -12.089448928833008, "global_step": 341791, "epoch": 2034} {"train_loss": -12.140758514404297, "global_step": 341792, "epoch": 2034} {"train_loss": -12.358712196350098, "global_step": 341793, "epoch": 2034} {"train_loss": -12.02182388305664, "global_step": 341794, "epoch": 2034} {"train_loss": -12.140682220458984, "global_step": 341795, "epoch": 2034} {"train_loss": -12.013495445251465, "global_step": 341796, "epoch": 2034} {"train_loss": -11.09792709350586, "global_step": 341797, "epoch": 2034} {"train_loss": -12.323665618896484, "global_step": 341798, "epoch": 2034} {"train_loss": -11.5588960647583, "global_step": 341799, "epoch": 2034} {"train_loss": -11.39403247833252, "global_step": 341800, "epoch": 2034} {"train_loss": -10.881468772888184, "global_step": 341801, "epoch": 2034} {"train_loss": -11.561548233032227, "global_step": 341802, "epoch": 2034} {"train_loss": -11.355649948120117, "global_step": 341803, "epoch": 2034} {"train_loss": -11.751300811767578, "global_step": 341804, "epoch": 2034} {"train_loss": -12.003660202026367, "global_step": 341805, "epoch": 2034} {"train_loss": -11.769775390625, "global_step": 341806, "epoch": 2034} {"train_loss": -11.825435638427734, "global_step": 341807, "epoch": 2034} {"train_loss": -12.101173400878906, "global_step": 341808, "epoch": 2034} {"train_loss": -11.9190034866333, "global_step": 341809, "epoch": 2034} {"train_loss": -11.824275970458984, "global_step": 341810, "epoch": 2034} {"train_loss": -12.416032791137695, "global_step": 341811, "epoch": 2034} {"train_loss": -11.556772232055664, "global_step": 341812, "epoch": 2034} {"train_loss": -12.181004524230957, "global_step": 341813, "epoch": 2034} {"train_loss": -12.070350646972656, "global_step": 341814, "epoch": 2034} {"train_loss": -11.696916580200195, "global_step": 341815, "epoch": 2034} {"train_loss": -12.331624984741211, "global_step": 341816, "epoch": 2034} {"train_loss": -11.662139892578125, "global_step": 341817, "epoch": 2034} {"train_loss": -12.316072463989258, "global_step": 341818, "epoch": 2034} {"train_loss": -11.768502235412598, "global_step": 341819, "epoch": 2034} {"train_loss": -11.992830276489258, "global_step": 341820, "epoch": 2034} {"train_loss": -12.079145431518555, "global_step": 341821, "epoch": 2034} {"train_loss": -11.654175758361816, "global_step": 341822, "epoch": 2034} {"train_loss": -12.357927322387695, "global_step": 341823, "epoch": 2034} {"train_loss": -11.594353675842285, "global_step": 341824, "epoch": 2034} {"train_loss": -11.320378303527832, "global_step": 341825, "epoch": 2034} {"train_loss": -11.733030319213867, "global_step": 341826, "epoch": 2034} {"train_loss": -12.165708541870117, "global_step": 341827, "epoch": 2034} {"train_loss": -11.623525619506836, "global_step": 341828, "epoch": 2034} {"train_loss": -11.346653938293457, "global_step": 341829, "epoch": 2034} {"train_loss": -11.35110855102539, "global_step": 341830, "epoch": 2034} {"train_loss": -11.135614395141602, "global_step": 341831, "epoch": 2034} {"train_loss": -11.321893692016602, "global_step": 341832, "epoch": 2034} {"train_loss": -11.853676795959473, "global_step": 341833, "epoch": 2034} {"train_loss": -11.275154113769531, "global_step": 341834, "epoch": 2034} {"train_loss": -11.364678382873535, "global_step": 341835, "epoch": 2034} {"train_loss": -11.454866409301758, "global_step": 341836, "epoch": 2034} {"train_loss": -11.921952247619629, "global_step": 341837, "epoch": 2034} {"train_loss": -11.496246337890625, "global_step": 341838, "epoch": 2034} {"train_loss": -11.93048095703125, "global_step": 341839, "epoch": 2034} {"train_loss": -11.645712852478027, "global_step": 341840, "epoch": 2034} {"train_loss": -11.958436965942383, "global_step": 341841, "epoch": 2034} {"train_loss": -11.763495445251465, "global_step": 341842, "epoch": 2034} {"train_loss": -11.817203521728516, "global_step": 341843, "epoch": 2034} {"train_loss": -11.71356201171875, "global_step": 341844, "epoch": 2034} {"train_loss": -11.958436012268066, "global_step": 341845, "epoch": 2034} {"train_loss": -11.708610534667969, "global_step": 341846, "epoch": 2034} {"train_loss": -12.148239135742188, "global_step": 341847, "epoch": 2034} {"train_loss": -11.685656547546387, "global_step": 341848, "epoch": 2034} {"train_loss": -11.68429183959961, "global_step": 341849, "epoch": 2034} {"train_loss": -11.806684494018555, "global_step": 341850, "epoch": 2034} {"train_loss": -11.540117263793945, "global_step": 341851, "epoch": 2034} {"train_loss": -11.923820495605469, "global_step": 341852, "epoch": 2034} {"train_loss": -11.729482650756836, "global_step": 341853, "epoch": 2034} {"train_loss": -11.69324779510498, "global_step": 341854, "epoch": 2034} {"train_loss": -11.516973495483398, "global_step": 341855, "epoch": 2034} {"train_loss": -11.789698600769043, "global_step": 341856, "epoch": 2034} {"train_loss": -11.899820327758789, "global_step": 341857, "epoch": 2034} {"train_loss": -11.948799133300781, "global_step": 341858, "epoch": 2034} {"train_loss": -12.171160697937012, "global_step": 341859, "epoch": 2034} {"train_loss": -12.057859420776367, "global_step": 341860, "epoch": 2034} {"train_loss": -11.970951080322266, "global_step": 341861, "epoch": 2034} {"train_loss": -12.301383972167969, "global_step": 341862, "epoch": 2034} {"train_loss": -11.891719818115234, "global_step": 341863, "epoch": 2034} {"train_loss": -11.826642990112305, "global_step": 341864, "epoch": 2034} {"train_loss": -12.18592643737793, "global_step": 341865, "epoch": 2034} {"train_loss": -12.100101470947266, "global_step": 341866, "epoch": 2034} {"train_loss": -11.978949546813965, "global_step": 341867, "epoch": 2034} {"train_loss": -12.058451652526855, "global_step": 341868, "epoch": 2034} {"train_loss": -12.047904968261719, "global_step": 341869, "epoch": 2034} {"train_loss": -12.000978469848633, "global_step": 341870, "epoch": 2034} {"train_loss": -11.773515701293945, "global_step": 341871, "epoch": 2034} {"train_loss": -12.39117431640625, "global_step": 341872, "epoch": 2034} {"train_loss": -11.983041763305664, "global_step": 341873, "epoch": 2034} {"train_loss": -12.403005599975586, "global_step": 341874, "epoch": 2034} {"train_loss": -12.061921119689941, "global_step": 341875, "epoch": 2034} {"train_loss": -12.402132034301758, "global_step": 341876, "epoch": 2034} {"train_loss": -12.265684127807617, "global_step": 341877, "epoch": 2034} {"train_loss": -12.322399139404297, "global_step": 341878, "epoch": 2034} {"train_loss": -12.018896051815577, "global_step": 341879, "epoch": 2034, "val_loss": 286924.46875} {"train_loss": -12.080684661865234, "global_step": 341880, "epoch": 2035} {"train_loss": -12.230332374572754, "global_step": 341881, "epoch": 2035} {"train_loss": -12.01731014251709, "global_step": 341882, "epoch": 2035} {"train_loss": -12.618815422058105, "global_step": 341883, "epoch": 2035} {"train_loss": -12.359180450439453, "global_step": 341884, "epoch": 2035} {"train_loss": -11.768241882324219, "global_step": 341885, "epoch": 2035} {"train_loss": -12.280529022216797, "global_step": 341886, "epoch": 2035} {"train_loss": -12.10957145690918, "global_step": 341887, "epoch": 2035} {"train_loss": -11.972223281860352, "global_step": 341888, "epoch": 2035} {"train_loss": -12.269136428833008, "global_step": 341889, "epoch": 2035} {"train_loss": -11.92327880859375, "global_step": 341890, "epoch": 2035} {"train_loss": -12.149779319763184, "global_step": 341891, "epoch": 2035} {"train_loss": -12.253704071044922, "global_step": 341892, "epoch": 2035} {"train_loss": -11.710540771484375, "global_step": 341893, "epoch": 2035} {"train_loss": -12.374821662902832, "global_step": 341894, "epoch": 2035} {"train_loss": -11.974250793457031, "global_step": 341895, "epoch": 2035} {"train_loss": -12.250982284545898, "global_step": 341896, "epoch": 2035} {"train_loss": -12.042997360229492, "global_step": 341897, "epoch": 2035} {"train_loss": -12.608747482299805, "global_step": 341898, "epoch": 2035} {"train_loss": -12.246989250183105, "global_step": 341899, "epoch": 2035} {"train_loss": -12.416519165039062, "global_step": 341900, "epoch": 2035} {"train_loss": -12.365177154541016, "global_step": 341901, "epoch": 2035} {"train_loss": -11.945939064025879, "global_step": 341902, "epoch": 2035} {"train_loss": -11.945920944213867, "global_step": 341903, "epoch": 2035} {"train_loss": -12.197826385498047, "global_step": 341904, "epoch": 2035} {"train_loss": -11.728494644165039, "global_step": 341905, "epoch": 2035} {"train_loss": -12.132993698120117, "global_step": 341906, "epoch": 2035} {"train_loss": -11.53607177734375, "global_step": 341907, "epoch": 2035} {"train_loss": -12.376277923583984, "global_step": 341908, "epoch": 2035} {"train_loss": -11.798443794250488, "global_step": 341909, "epoch": 2035} {"train_loss": -12.33582878112793, "global_step": 341910, "epoch": 2035} {"train_loss": -11.653421401977539, "global_step": 341911, "epoch": 2035} {"train_loss": -12.089086532592773, "global_step": 341912, "epoch": 2035} {"train_loss": -11.777372360229492, "global_step": 341913, "epoch": 2035} {"train_loss": -11.581388473510742, "global_step": 341914, "epoch": 2035} {"train_loss": -11.927433013916016, "global_step": 341915, "epoch": 2035} {"train_loss": -11.703042984008789, "global_step": 341916, "epoch": 2035} {"train_loss": -11.823238372802734, "global_step": 341917, "epoch": 2035} {"train_loss": -12.23233413696289, "global_step": 341918, "epoch": 2035} {"train_loss": -11.92369556427002, "global_step": 341919, "epoch": 2035} {"train_loss": -11.320439338684082, "global_step": 341920, "epoch": 2035} {"train_loss": -12.132423400878906, "global_step": 341921, "epoch": 2035} {"train_loss": -12.060226440429688, "global_step": 341922, "epoch": 2035} {"train_loss": -11.993491172790527, "global_step": 341923, "epoch": 2035} {"train_loss": -11.773460388183594, "global_step": 341924, "epoch": 2035} {"train_loss": -12.245104789733887, "global_step": 341925, "epoch": 2035} {"train_loss": -11.800641059875488, "global_step": 341926, "epoch": 2035} {"train_loss": -12.38853645324707, "global_step": 341927, "epoch": 2035} {"train_loss": -12.23581314086914, "global_step": 341928, "epoch": 2035} {"train_loss": -11.94865608215332, "global_step": 341929, "epoch": 2035} {"train_loss": -12.001120567321777, "global_step": 341930, "epoch": 2035} {"train_loss": -11.740240097045898, "global_step": 341931, "epoch": 2035} {"train_loss": -12.485515594482422, "global_step": 341932, "epoch": 2035} {"train_loss": -12.176400184631348, "global_step": 341933, "epoch": 2035} {"train_loss": -12.28125, "global_step": 341934, "epoch": 2035} {"train_loss": -11.83028793334961, "global_step": 341935, "epoch": 2035} {"train_loss": -12.053007125854492, "global_step": 341936, "epoch": 2035} {"train_loss": -11.997892379760742, "global_step": 341937, "epoch": 2035} {"train_loss": -12.265741348266602, "global_step": 341938, "epoch": 2035} {"train_loss": -12.179571151733398, "global_step": 341939, "epoch": 2035} {"train_loss": -12.12380599975586, "global_step": 341940, "epoch": 2035} {"train_loss": -12.165791511535645, "global_step": 341941, "epoch": 2035} {"train_loss": -12.039289474487305, "global_step": 341942, "epoch": 2035} {"train_loss": -12.345538139343262, "global_step": 341943, "epoch": 2035} {"train_loss": -11.79964828491211, "global_step": 341944, "epoch": 2035} {"train_loss": -11.775795936584473, "global_step": 341945, "epoch": 2035} {"train_loss": -11.504417419433594, "global_step": 341946, "epoch": 2035} {"train_loss": -11.912233352661133, "global_step": 341947, "epoch": 2035} {"train_loss": -11.31999397277832, "global_step": 341948, "epoch": 2035} {"train_loss": -12.151410102844238, "global_step": 341949, "epoch": 2035} {"train_loss": -12.030029296875, "global_step": 341950, "epoch": 2035} {"train_loss": -11.81606674194336, "global_step": 341951, "epoch": 2035} {"train_loss": -12.277135848999023, "global_step": 341952, "epoch": 2035} {"train_loss": -11.901284217834473, "global_step": 341953, "epoch": 2035} {"train_loss": -12.171847343444824, "global_step": 341954, "epoch": 2035} {"train_loss": -12.377252578735352, "global_step": 341955, "epoch": 2035} {"train_loss": -11.515483856201172, "global_step": 341956, "epoch": 2035} {"train_loss": -12.070300102233887, "global_step": 341957, "epoch": 2035} {"train_loss": -12.279193878173828, "global_step": 341958, "epoch": 2035} {"train_loss": -12.212057113647461, "global_step": 341959, "epoch": 2035} {"train_loss": -12.496583938598633, "global_step": 341960, "epoch": 2035} {"train_loss": -12.106834411621094, "global_step": 341961, "epoch": 2035} {"train_loss": -12.380669593811035, "global_step": 341962, "epoch": 2035} {"train_loss": -12.464580535888672, "global_step": 341963, "epoch": 2035} {"train_loss": -12.085165023803711, "global_step": 341964, "epoch": 2035} {"train_loss": -12.023832321166992, "global_step": 341965, "epoch": 2035} {"train_loss": -12.183984756469727, "global_step": 341966, "epoch": 2035} {"train_loss": -11.32539176940918, "global_step": 341967, "epoch": 2035} {"train_loss": -12.246955871582031, "global_step": 341968, "epoch": 2035} {"train_loss": -11.446367263793945, "global_step": 341969, "epoch": 2035} {"train_loss": -11.190643310546875, "global_step": 341970, "epoch": 2035} {"train_loss": -11.282051086425781, "global_step": 341971, "epoch": 2035} {"train_loss": -10.936458587646484, "global_step": 341972, "epoch": 2035} {"train_loss": -10.040447235107422, "global_step": 341973, "epoch": 2035} {"train_loss": -11.877197265625, "global_step": 341974, "epoch": 2035} {"train_loss": -11.626747131347656, "global_step": 341975, "epoch": 2035} {"train_loss": -11.60008716583252, "global_step": 341976, "epoch": 2035} {"train_loss": -12.037236213684082, "global_step": 341977, "epoch": 2035} {"train_loss": -12.17099380493164, "global_step": 341978, "epoch": 2035} {"train_loss": -11.827390670776367, "global_step": 341979, "epoch": 2035} {"train_loss": -12.377490997314453, "global_step": 341980, "epoch": 2035} {"train_loss": -12.020145416259766, "global_step": 341981, "epoch": 2035} {"train_loss": -12.073959350585938, "global_step": 341982, "epoch": 2035} {"train_loss": -11.679444313049316, "global_step": 341983, "epoch": 2035} {"train_loss": -12.306007385253906, "global_step": 341984, "epoch": 2035} {"train_loss": -12.007868766784668, "global_step": 341985, "epoch": 2035} {"train_loss": -12.073827743530273, "global_step": 341986, "epoch": 2035} {"train_loss": -12.19554328918457, "global_step": 341987, "epoch": 2035} {"train_loss": -12.093231201171875, "global_step": 341988, "epoch": 2035} {"train_loss": -12.205026626586914, "global_step": 341989, "epoch": 2035} {"train_loss": -12.236684799194336, "global_step": 341990, "epoch": 2035} {"train_loss": -12.392888069152832, "global_step": 341991, "epoch": 2035} {"train_loss": -12.305201530456543, "global_step": 341992, "epoch": 2035} {"train_loss": -12.309210777282715, "global_step": 341993, "epoch": 2035} {"train_loss": -12.283625602722168, "global_step": 341994, "epoch": 2035} {"train_loss": -12.279549598693848, "global_step": 341995, "epoch": 2035} {"train_loss": -12.245200157165527, "global_step": 341996, "epoch": 2035} {"train_loss": -12.457340240478516, "global_step": 341997, "epoch": 2035} {"train_loss": -12.28045654296875, "global_step": 341998, "epoch": 2035} {"train_loss": -12.250593185424805, "global_step": 341999, "epoch": 2035} {"train_loss": -12.340201377868652, "global_step": 342000, "epoch": 2035} {"train_loss": -12.346271514892578, "global_step": 342001, "epoch": 2035} {"train_loss": -12.411989212036133, "global_step": 342002, "epoch": 2035} {"train_loss": -12.411249160766602, "global_step": 342003, "epoch": 2035} {"train_loss": -12.549918174743652, "global_step": 342004, "epoch": 2035} {"train_loss": -12.240213394165039, "global_step": 342005, "epoch": 2035} {"train_loss": -12.15478515625, "global_step": 342006, "epoch": 2035} {"train_loss": -12.492413520812988, "global_step": 342007, "epoch": 2035} {"train_loss": -12.17541217803955, "global_step": 342008, "epoch": 2035} {"train_loss": -12.668561935424805, "global_step": 342009, "epoch": 2035} {"train_loss": -12.55130386352539, "global_step": 342010, "epoch": 2035} {"train_loss": -12.430459022521973, "global_step": 342011, "epoch": 2035} {"train_loss": -12.465282440185547, "global_step": 342012, "epoch": 2035} {"train_loss": -12.584693908691406, "global_step": 342013, "epoch": 2035} {"train_loss": -12.682563781738281, "global_step": 342014, "epoch": 2035} {"train_loss": -12.3319673538208, "global_step": 342015, "epoch": 2035} {"train_loss": -12.375984191894531, "global_step": 342016, "epoch": 2035} {"train_loss": -12.436370849609375, "global_step": 342017, "epoch": 2035} {"train_loss": -12.478438377380371, "global_step": 342018, "epoch": 2035} {"train_loss": -12.353318214416504, "global_step": 342019, "epoch": 2035} {"train_loss": -12.538642883300781, "global_step": 342020, "epoch": 2035} {"train_loss": -12.696065902709961, "global_step": 342021, "epoch": 2035} {"train_loss": -12.331438064575195, "global_step": 342022, "epoch": 2035} {"train_loss": -12.486349105834961, "global_step": 342023, "epoch": 2035} {"train_loss": -12.411141395568848, "global_step": 342024, "epoch": 2035} {"train_loss": -12.526004791259766, "global_step": 342025, "epoch": 2035} {"train_loss": -12.355910301208496, "global_step": 342026, "epoch": 2035} {"train_loss": -12.039129257202148, "global_step": 342027, "epoch": 2035} {"train_loss": -12.540897369384766, "global_step": 342028, "epoch": 2035} {"train_loss": -12.350032806396484, "global_step": 342029, "epoch": 2035} {"train_loss": -12.411991119384766, "global_step": 342030, "epoch": 2035} {"train_loss": -12.47268009185791, "global_step": 342031, "epoch": 2035} {"train_loss": -11.853139877319336, "global_step": 342032, "epoch": 2035} {"train_loss": -10.673545837402344, "global_step": 342033, "epoch": 2035} {"train_loss": -11.752424240112305, "global_step": 342034, "epoch": 2035} {"train_loss": -9.908585548400879, "global_step": 342035, "epoch": 2035} {"train_loss": -10.36225700378418, "global_step": 342036, "epoch": 2035} {"train_loss": -11.441183090209961, "global_step": 342037, "epoch": 2035} {"train_loss": -7.064600944519043, "global_step": 342038, "epoch": 2035} {"train_loss": -6.783141136169434, "global_step": 342039, "epoch": 2035} {"train_loss": -6.090002536773682, "global_step": 342040, "epoch": 2035} {"train_loss": -7.00255823135376, "global_step": 342041, "epoch": 2035} {"train_loss": -7.0418877601623535, "global_step": 342042, "epoch": 2035} {"train_loss": -6.478065490722656, "global_step": 342043, "epoch": 2035} {"train_loss": -7.577107906341553, "global_step": 342044, "epoch": 2035} {"train_loss": -7.861397743225098, "global_step": 342045, "epoch": 2035} {"train_loss": -8.049238204956055, "global_step": 342046, "epoch": 2035} {"train_loss": -11.775243787538438, "global_step": 342047, "epoch": 2035, "val_loss": 285026.84375, "train_action_mse_error": 2.7160098552703857} {"train_loss": -7.783282279968262, "global_step": 342048, "epoch": 2036} {"train_loss": -7.504302501678467, "global_step": 342049, "epoch": 2036} {"train_loss": -7.7742133140563965, "global_step": 342050, "epoch": 2036} {"train_loss": -8.534923553466797, "global_step": 342051, "epoch": 2036} {"train_loss": -8.537775993347168, "global_step": 342052, "epoch": 2036} {"train_loss": -8.690549850463867, "global_step": 342053, "epoch": 2036} {"train_loss": -8.190396308898926, "global_step": 342054, "epoch": 2036} {"train_loss": -8.574994087219238, "global_step": 342055, "epoch": 2036} {"train_loss": -8.436051368713379, "global_step": 342056, "epoch": 2036} {"train_loss": -9.120878219604492, "global_step": 342057, "epoch": 2036} {"train_loss": -8.55296516418457, "global_step": 342058, "epoch": 2036} {"train_loss": -9.078947067260742, "global_step": 342059, "epoch": 2036} {"train_loss": -9.419926643371582, "global_step": 342060, "epoch": 2036} {"train_loss": -9.395263671875, "global_step": 342061, "epoch": 2036} {"train_loss": -9.625608444213867, "global_step": 342062, "epoch": 2036} {"train_loss": -9.993837356567383, "global_step": 342063, "epoch": 2036} {"train_loss": -10.642172813415527, "global_step": 342064, "epoch": 2036} {"train_loss": -10.079866409301758, "global_step": 342065, "epoch": 2036} {"train_loss": -10.57828140258789, "global_step": 342066, "epoch": 2036} {"train_loss": -10.240665435791016, "global_step": 342067, "epoch": 2036} {"train_loss": -10.587799072265625, "global_step": 342068, "epoch": 2036} {"train_loss": -10.539012908935547, "global_step": 342069, "epoch": 2036} {"train_loss": -10.844444274902344, "global_step": 342070, "epoch": 2036} {"train_loss": -10.717504501342773, "global_step": 342071, "epoch": 2036} {"train_loss": -11.527448654174805, "global_step": 342072, "epoch": 2036} {"train_loss": -11.100802421569824, "global_step": 342073, "epoch": 2036} {"train_loss": -11.077702522277832, "global_step": 342074, "epoch": 2036} {"train_loss": -11.561993598937988, "global_step": 342075, "epoch": 2036} {"train_loss": -11.202430725097656, "global_step": 342076, "epoch": 2036} {"train_loss": -11.974327087402344, "global_step": 342077, "epoch": 2036} {"train_loss": -11.586338996887207, "global_step": 342078, "epoch": 2036} {"train_loss": -11.747037887573242, "global_step": 342079, "epoch": 2036} {"train_loss": -11.752696990966797, "global_step": 342080, "epoch": 2036} {"train_loss": -11.770626068115234, "global_step": 342081, "epoch": 2036} {"train_loss": -11.980874061584473, "global_step": 342082, "epoch": 2036} {"train_loss": -11.840496063232422, "global_step": 342083, "epoch": 2036} {"train_loss": -11.933197021484375, "global_step": 342084, "epoch": 2036} {"train_loss": -11.72939682006836, "global_step": 342085, "epoch": 2036} {"train_loss": -11.938436508178711, "global_step": 342086, "epoch": 2036} {"train_loss": -11.922924995422363, "global_step": 342087, "epoch": 2036} {"train_loss": -11.664266586303711, "global_step": 342088, "epoch": 2036} {"train_loss": -12.115303993225098, "global_step": 342089, "epoch": 2036} {"train_loss": -11.903166770935059, "global_step": 342090, "epoch": 2036} {"train_loss": -11.662221908569336, "global_step": 342091, "epoch": 2036} {"train_loss": -11.35483169555664, "global_step": 342092, "epoch": 2036} {"train_loss": -11.959623336791992, "global_step": 342093, "epoch": 2036} {"train_loss": -11.625000953674316, "global_step": 342094, "epoch": 2036} {"train_loss": -10.565500259399414, "global_step": 342095, "epoch": 2036} {"train_loss": -11.784318923950195, "global_step": 342096, "epoch": 2036} {"train_loss": -10.466984748840332, "global_step": 342097, "epoch": 2036} {"train_loss": -11.390340805053711, "global_step": 342098, "epoch": 2036} {"train_loss": -10.824243545532227, "global_step": 342099, "epoch": 2036} {"train_loss": -10.65825080871582, "global_step": 342100, "epoch": 2036} {"train_loss": -11.341299057006836, "global_step": 342101, "epoch": 2036} {"train_loss": -10.797506332397461, "global_step": 342102, "epoch": 2036} {"train_loss": -11.720035552978516, "global_step": 342103, "epoch": 2036} {"train_loss": -10.668659210205078, "global_step": 342104, "epoch": 2036} {"train_loss": -11.037171363830566, "global_step": 342105, "epoch": 2036} {"train_loss": -10.935800552368164, "global_step": 342106, "epoch": 2036} {"train_loss": -11.62775993347168, "global_step": 342107, "epoch": 2036} {"train_loss": -11.079599380493164, "global_step": 342108, "epoch": 2036} {"train_loss": -11.70024299621582, "global_step": 342109, "epoch": 2036} {"train_loss": -11.792142868041992, "global_step": 342110, "epoch": 2036} {"train_loss": -11.319836616516113, "global_step": 342111, "epoch": 2036} {"train_loss": -11.607812881469727, "global_step": 342112, "epoch": 2036} {"train_loss": -11.477603912353516, "global_step": 342113, "epoch": 2036} {"train_loss": -11.067007064819336, "global_step": 342114, "epoch": 2036} {"train_loss": -11.917516708374023, "global_step": 342115, "epoch": 2036} {"train_loss": -11.583595275878906, "global_step": 342116, "epoch": 2036} {"train_loss": -11.861692428588867, "global_step": 342117, "epoch": 2036} {"train_loss": -11.604037284851074, "global_step": 342118, "epoch": 2036} {"train_loss": -12.230158805847168, "global_step": 342119, "epoch": 2036} {"train_loss": -11.242143630981445, "global_step": 342120, "epoch": 2036} {"train_loss": -11.564168930053711, "global_step": 342121, "epoch": 2036} {"train_loss": -11.801153182983398, "global_step": 342122, "epoch": 2036} {"train_loss": -11.270895004272461, "global_step": 342123, "epoch": 2036} {"train_loss": -11.984586715698242, "global_step": 342124, "epoch": 2036} {"train_loss": -11.51173210144043, "global_step": 342125, "epoch": 2036} {"train_loss": -11.796858787536621, "global_step": 342126, "epoch": 2036} {"train_loss": -11.971029281616211, "global_step": 342127, "epoch": 2036} {"train_loss": -11.663050651550293, "global_step": 342128, "epoch": 2036} {"train_loss": -12.099832534790039, "global_step": 342129, "epoch": 2036} {"train_loss": -11.885187149047852, "global_step": 342130, "epoch": 2036} {"train_loss": -12.26291561126709, "global_step": 342131, "epoch": 2036} {"train_loss": -11.688413619995117, "global_step": 342132, "epoch": 2036} {"train_loss": -11.867395401000977, "global_step": 342133, "epoch": 2036} {"train_loss": -11.914731979370117, "global_step": 342134, "epoch": 2036} {"train_loss": -12.04863452911377, "global_step": 342135, "epoch": 2036} {"train_loss": -11.542101860046387, "global_step": 342136, "epoch": 2036} {"train_loss": -11.75492000579834, "global_step": 342137, "epoch": 2036} {"train_loss": -11.911767959594727, "global_step": 342138, "epoch": 2036} {"train_loss": -11.909446716308594, "global_step": 342139, "epoch": 2036} {"train_loss": -11.74211597442627, "global_step": 342140, "epoch": 2036} {"train_loss": -11.985458374023438, "global_step": 342141, "epoch": 2036} {"train_loss": -11.722195625305176, "global_step": 342142, "epoch": 2036} {"train_loss": -12.141609191894531, "global_step": 342143, "epoch": 2036} {"train_loss": -11.922157287597656, "global_step": 342144, "epoch": 2036} {"train_loss": -11.424013137817383, "global_step": 342145, "epoch": 2036} {"train_loss": -11.478236198425293, "global_step": 342146, "epoch": 2036} {"train_loss": -11.143462181091309, "global_step": 342147, "epoch": 2036} {"train_loss": -11.896657943725586, "global_step": 342148, "epoch": 2036} {"train_loss": -11.249505996704102, "global_step": 342149, "epoch": 2036} {"train_loss": -11.626230239868164, "global_step": 342150, "epoch": 2036} {"train_loss": -11.713373184204102, "global_step": 342151, "epoch": 2036} {"train_loss": -10.755836486816406, "global_step": 342152, "epoch": 2036} {"train_loss": -11.27823543548584, "global_step": 342153, "epoch": 2036} {"train_loss": -11.700013160705566, "global_step": 342154, "epoch": 2036} {"train_loss": -11.115656852722168, "global_step": 342155, "epoch": 2036} {"train_loss": -12.263498306274414, "global_step": 342156, "epoch": 2036} {"train_loss": -11.041585922241211, "global_step": 342157, "epoch": 2036} {"train_loss": -11.647631645202637, "global_step": 342158, "epoch": 2036} {"train_loss": -11.716017723083496, "global_step": 342159, "epoch": 2036} {"train_loss": -11.60060977935791, "global_step": 342160, "epoch": 2036} {"train_loss": -12.071268081665039, "global_step": 342161, "epoch": 2036} {"train_loss": -11.531258583068848, "global_step": 342162, "epoch": 2036} {"train_loss": -12.052228927612305, "global_step": 342163, "epoch": 2036} {"train_loss": -11.808197021484375, "global_step": 342164, "epoch": 2036} {"train_loss": -11.700967788696289, "global_step": 342165, "epoch": 2036} {"train_loss": -12.206663131713867, "global_step": 342166, "epoch": 2036} {"train_loss": -11.727947235107422, "global_step": 342167, "epoch": 2036} {"train_loss": -12.163207054138184, "global_step": 342168, "epoch": 2036} {"train_loss": -11.542732238769531, "global_step": 342169, "epoch": 2036} {"train_loss": -11.488129615783691, "global_step": 342170, "epoch": 2036} {"train_loss": -12.140239715576172, "global_step": 342171, "epoch": 2036} {"train_loss": -11.484569549560547, "global_step": 342172, "epoch": 2036} {"train_loss": -11.87789535522461, "global_step": 342173, "epoch": 2036} {"train_loss": -11.703041076660156, "global_step": 342174, "epoch": 2036} {"train_loss": -11.68857479095459, "global_step": 342175, "epoch": 2036} {"train_loss": -11.628907203674316, "global_step": 342176, "epoch": 2036} {"train_loss": -11.500968933105469, "global_step": 342177, "epoch": 2036} {"train_loss": -11.88481616973877, "global_step": 342178, "epoch": 2036} {"train_loss": -11.723180770874023, "global_step": 342179, "epoch": 2036} {"train_loss": -12.333086967468262, "global_step": 342180, "epoch": 2036} {"train_loss": -11.795198440551758, "global_step": 342181, "epoch": 2036} {"train_loss": -12.08944320678711, "global_step": 342182, "epoch": 2036} {"train_loss": -11.728134155273438, "global_step": 342183, "epoch": 2036} {"train_loss": -11.847131729125977, "global_step": 342184, "epoch": 2036} {"train_loss": -12.027166366577148, "global_step": 342185, "epoch": 2036} {"train_loss": -11.856732368469238, "global_step": 342186, "epoch": 2036} {"train_loss": -12.195314407348633, "global_step": 342187, "epoch": 2036} {"train_loss": -12.019116401672363, "global_step": 342188, "epoch": 2036} {"train_loss": -12.062128067016602, "global_step": 342189, "epoch": 2036} {"train_loss": -12.3560791015625, "global_step": 342190, "epoch": 2036} {"train_loss": -12.136884689331055, "global_step": 342191, "epoch": 2036} {"train_loss": -12.436286926269531, "global_step": 342192, "epoch": 2036} {"train_loss": -11.963586807250977, "global_step": 342193, "epoch": 2036} {"train_loss": -12.212549209594727, "global_step": 342194, "epoch": 2036} {"train_loss": -12.162131309509277, "global_step": 342195, "epoch": 2036} {"train_loss": -12.242910385131836, "global_step": 342196, "epoch": 2036} {"train_loss": -12.41872787475586, "global_step": 342197, "epoch": 2036} {"train_loss": -12.203399658203125, "global_step": 342198, "epoch": 2036} {"train_loss": -12.327667236328125, "global_step": 342199, "epoch": 2036} {"train_loss": -12.187149047851562, "global_step": 342200, "epoch": 2036} {"train_loss": -12.426753997802734, "global_step": 342201, "epoch": 2036} {"train_loss": -12.256542205810547, "global_step": 342202, "epoch": 2036} {"train_loss": -12.231021881103516, "global_step": 342203, "epoch": 2036} {"train_loss": -12.396665573120117, "global_step": 342204, "epoch": 2036} {"train_loss": -12.384225845336914, "global_step": 342205, "epoch": 2036} {"train_loss": -12.423982620239258, "global_step": 342206, "epoch": 2036} {"train_loss": -12.255380630493164, "global_step": 342207, "epoch": 2036} {"train_loss": -12.112421035766602, "global_step": 342208, "epoch": 2036} {"train_loss": -12.518728256225586, "global_step": 342209, "epoch": 2036} {"train_loss": -12.232150077819824, "global_step": 342210, "epoch": 2036} {"train_loss": -12.56833553314209, "global_step": 342211, "epoch": 2036} {"train_loss": -12.161666870117188, "global_step": 342212, "epoch": 2036} {"train_loss": -12.035027503967285, "global_step": 342213, "epoch": 2036} {"train_loss": -12.419928550720215, "global_step": 342214, "epoch": 2036} {"train_loss": -11.412220268022446, "global_step": 342215, "epoch": 2036, "val_loss": 287591.40625} {"train_loss": -12.164412498474121, "global_step": 342216, "epoch": 2037} {"train_loss": -12.118048667907715, "global_step": 342217, "epoch": 2037} {"train_loss": -12.330748558044434, "global_step": 342218, "epoch": 2037} {"train_loss": -12.318761825561523, "global_step": 342219, "epoch": 2037} {"train_loss": -12.142833709716797, "global_step": 342220, "epoch": 2037} {"train_loss": -12.236729621887207, "global_step": 342221, "epoch": 2037} {"train_loss": -12.208027839660645, "global_step": 342222, "epoch": 2037} {"train_loss": -11.94040298461914, "global_step": 342223, "epoch": 2037} {"train_loss": -12.071475982666016, "global_step": 342224, "epoch": 2037} {"train_loss": -11.603367805480957, "global_step": 342225, "epoch": 2037} {"train_loss": -11.857935905456543, "global_step": 342226, "epoch": 2037} {"train_loss": -12.147892951965332, "global_step": 342227, "epoch": 2037} {"train_loss": -12.195812225341797, "global_step": 342228, "epoch": 2037} {"train_loss": -11.553581237792969, "global_step": 342229, "epoch": 2037} {"train_loss": -11.21316909790039, "global_step": 342230, "epoch": 2037} {"train_loss": -11.407571792602539, "global_step": 342231, "epoch": 2037} {"train_loss": -11.713083267211914, "global_step": 342232, "epoch": 2037} {"train_loss": -12.370361328125, "global_step": 342233, "epoch": 2037} {"train_loss": -11.549641609191895, "global_step": 342234, "epoch": 2037} {"train_loss": -11.683568000793457, "global_step": 342235, "epoch": 2037} {"train_loss": -12.12271499633789, "global_step": 342236, "epoch": 2037} {"train_loss": -10.959567070007324, "global_step": 342237, "epoch": 2037} {"train_loss": -10.73781967163086, "global_step": 342238, "epoch": 2037} {"train_loss": -11.921062469482422, "global_step": 342239, "epoch": 2037} {"train_loss": -10.844036102294922, "global_step": 342240, "epoch": 2037} {"train_loss": -10.920906066894531, "global_step": 342241, "epoch": 2037} {"train_loss": -12.001133918762207, "global_step": 342242, "epoch": 2037} {"train_loss": -11.036602973937988, "global_step": 342243, "epoch": 2037} {"train_loss": -11.562554359436035, "global_step": 342244, "epoch": 2037} {"train_loss": -11.692771911621094, "global_step": 342245, "epoch": 2037} {"train_loss": -11.576810836791992, "global_step": 342246, "epoch": 2037} {"train_loss": -12.256429672241211, "global_step": 342247, "epoch": 2037} {"train_loss": -11.73968505859375, "global_step": 342248, "epoch": 2037} {"train_loss": -11.79936408996582, "global_step": 342249, "epoch": 2037} {"train_loss": -11.575963973999023, "global_step": 342250, "epoch": 2037} {"train_loss": -11.138360977172852, "global_step": 342251, "epoch": 2037} {"train_loss": -11.627971649169922, "global_step": 342252, "epoch": 2037} {"train_loss": -11.17786979675293, "global_step": 342253, "epoch": 2037} {"train_loss": -10.985086441040039, "global_step": 342254, "epoch": 2037} {"train_loss": -11.298065185546875, "global_step": 342255, "epoch": 2037} {"train_loss": -11.253421783447266, "global_step": 342256, "epoch": 2037} {"train_loss": -11.42245101928711, "global_step": 342257, "epoch": 2037} {"train_loss": -10.966702461242676, "global_step": 342258, "epoch": 2037} {"train_loss": -11.418787002563477, "global_step": 342259, "epoch": 2037} {"train_loss": -11.395957946777344, "global_step": 342260, "epoch": 2037} {"train_loss": -10.541897773742676, "global_step": 342261, "epoch": 2037} {"train_loss": -11.272245407104492, "global_step": 342262, "epoch": 2037} {"train_loss": -10.701164245605469, "global_step": 342263, "epoch": 2037} {"train_loss": -11.496589660644531, "global_step": 342264, "epoch": 2037} {"train_loss": -11.291351318359375, "global_step": 342265, "epoch": 2037} {"train_loss": -11.347091674804688, "global_step": 342266, "epoch": 2037} {"train_loss": -12.042739868164062, "global_step": 342267, "epoch": 2037} {"train_loss": -10.904671669006348, "global_step": 342268, "epoch": 2037} {"train_loss": -11.652189254760742, "global_step": 342269, "epoch": 2037} {"train_loss": -11.568126678466797, "global_step": 342270, "epoch": 2037} {"train_loss": -10.818405151367188, "global_step": 342271, "epoch": 2037} {"train_loss": -11.959081649780273, "global_step": 342272, "epoch": 2037} {"train_loss": -10.723150253295898, "global_step": 342273, "epoch": 2037} {"train_loss": -11.561339378356934, "global_step": 342274, "epoch": 2037} {"train_loss": -10.665961265563965, "global_step": 342275, "epoch": 2037} {"train_loss": -10.829200744628906, "global_step": 342276, "epoch": 2037} {"train_loss": -11.357229232788086, "global_step": 342277, "epoch": 2037} {"train_loss": -11.106168746948242, "global_step": 342278, "epoch": 2037} {"train_loss": -11.819684982299805, "global_step": 342279, "epoch": 2037} {"train_loss": -11.720375061035156, "global_step": 342280, "epoch": 2037} {"train_loss": -11.34523868560791, "global_step": 342281, "epoch": 2037} {"train_loss": -11.827390670776367, "global_step": 342282, "epoch": 2037} {"train_loss": -11.348274230957031, "global_step": 342283, "epoch": 2037} {"train_loss": -11.653827667236328, "global_step": 342284, "epoch": 2037} {"train_loss": -12.040194511413574, "global_step": 342285, "epoch": 2037} {"train_loss": -11.365989685058594, "global_step": 342286, "epoch": 2037} {"train_loss": -11.922725677490234, "global_step": 342287, "epoch": 2037} {"train_loss": -11.784459114074707, "global_step": 342288, "epoch": 2037} {"train_loss": -12.003005981445312, "global_step": 342289, "epoch": 2037} {"train_loss": -11.630197525024414, "global_step": 342290, "epoch": 2037} {"train_loss": -11.628656387329102, "global_step": 342291, "epoch": 2037} {"train_loss": -11.706419944763184, "global_step": 342292, "epoch": 2037} {"train_loss": -11.272547721862793, "global_step": 342293, "epoch": 2037} {"train_loss": -11.887243270874023, "global_step": 342294, "epoch": 2037} {"train_loss": -12.050680160522461, "global_step": 342295, "epoch": 2037} {"train_loss": -11.725467681884766, "global_step": 342296, "epoch": 2037} {"train_loss": -11.918329238891602, "global_step": 342297, "epoch": 2037} {"train_loss": -11.538281440734863, "global_step": 342298, "epoch": 2037} {"train_loss": -11.888908386230469, "global_step": 342299, "epoch": 2037} {"train_loss": -11.89888858795166, "global_step": 342300, "epoch": 2037} {"train_loss": -11.936759948730469, "global_step": 342301, "epoch": 2037} {"train_loss": -11.70934009552002, "global_step": 342302, "epoch": 2037} {"train_loss": -12.15513801574707, "global_step": 342303, "epoch": 2037} {"train_loss": -11.957929611206055, "global_step": 342304, "epoch": 2037} {"train_loss": -12.221802711486816, "global_step": 342305, "epoch": 2037} {"train_loss": -12.281685829162598, "global_step": 342306, "epoch": 2037} {"train_loss": -12.286705017089844, "global_step": 342307, "epoch": 2037} {"train_loss": -12.280082702636719, "global_step": 342308, "epoch": 2037} {"train_loss": -12.343856811523438, "global_step": 342309, "epoch": 2037} {"train_loss": -12.144965171813965, "global_step": 342310, "epoch": 2037} {"train_loss": -12.353290557861328, "global_step": 342311, "epoch": 2037} {"train_loss": -12.256635665893555, "global_step": 342312, "epoch": 2037} {"train_loss": -12.458182334899902, "global_step": 342313, "epoch": 2037} {"train_loss": -12.126897811889648, "global_step": 342314, "epoch": 2037} {"train_loss": -12.325736999511719, "global_step": 342315, "epoch": 2037} {"train_loss": -12.329391479492188, "global_step": 342316, "epoch": 2037} {"train_loss": -12.380433082580566, "global_step": 342317, "epoch": 2037} {"train_loss": -12.234783172607422, "global_step": 342318, "epoch": 2037} {"train_loss": -12.358763694763184, "global_step": 342319, "epoch": 2037} {"train_loss": -12.167667388916016, "global_step": 342320, "epoch": 2037} {"train_loss": -12.141495704650879, "global_step": 342321, "epoch": 2037} {"train_loss": -12.014074325561523, "global_step": 342322, "epoch": 2037} {"train_loss": -11.919172286987305, "global_step": 342323, "epoch": 2037} {"train_loss": -12.581056594848633, "global_step": 342324, "epoch": 2037} {"train_loss": -12.052084922790527, "global_step": 342325, "epoch": 2037} {"train_loss": -12.432262420654297, "global_step": 342326, "epoch": 2037} {"train_loss": -12.329635620117188, "global_step": 342327, "epoch": 2037} {"train_loss": -11.938568115234375, "global_step": 342328, "epoch": 2037} {"train_loss": -12.615821838378906, "global_step": 342329, "epoch": 2037} {"train_loss": -12.323257446289062, "global_step": 342330, "epoch": 2037} {"train_loss": -12.487427711486816, "global_step": 342331, "epoch": 2037} {"train_loss": -12.40278434753418, "global_step": 342332, "epoch": 2037} {"train_loss": -12.237287521362305, "global_step": 342333, "epoch": 2037} {"train_loss": -12.434099197387695, "global_step": 342334, "epoch": 2037} {"train_loss": -12.429752349853516, "global_step": 342335, "epoch": 2037} {"train_loss": -11.94841194152832, "global_step": 342336, "epoch": 2037} {"train_loss": -12.546178817749023, "global_step": 342337, "epoch": 2037} {"train_loss": -12.171274185180664, "global_step": 342338, "epoch": 2037} {"train_loss": -11.907720565795898, "global_step": 342339, "epoch": 2037} {"train_loss": -12.368651390075684, "global_step": 342340, "epoch": 2037} {"train_loss": -12.282079696655273, "global_step": 342341, "epoch": 2037} {"train_loss": -12.265446662902832, "global_step": 342342, "epoch": 2037} {"train_loss": -12.54195499420166, "global_step": 342343, "epoch": 2037} {"train_loss": -12.59582233428955, "global_step": 342344, "epoch": 2037} {"train_loss": -12.415963172912598, "global_step": 342345, "epoch": 2037} {"train_loss": -12.6167631149292, "global_step": 342346, "epoch": 2037} {"train_loss": -12.51727294921875, "global_step": 342347, "epoch": 2037} {"train_loss": -12.295733451843262, "global_step": 342348, "epoch": 2037} {"train_loss": -12.370153427124023, "global_step": 342349, "epoch": 2037} {"train_loss": -12.304327011108398, "global_step": 342350, "epoch": 2037} {"train_loss": -12.49797248840332, "global_step": 342351, "epoch": 2037} {"train_loss": -12.413240432739258, "global_step": 342352, "epoch": 2037} {"train_loss": -12.671039581298828, "global_step": 342353, "epoch": 2037} {"train_loss": -12.371460914611816, "global_step": 342354, "epoch": 2037} {"train_loss": -12.443695068359375, "global_step": 342355, "epoch": 2037} {"train_loss": -12.541790008544922, "global_step": 342356, "epoch": 2037} {"train_loss": -12.685068130493164, "global_step": 342357, "epoch": 2037} {"train_loss": -12.411086082458496, "global_step": 342358, "epoch": 2037} {"train_loss": -12.678930282592773, "global_step": 342359, "epoch": 2037} {"train_loss": -12.44057846069336, "global_step": 342360, "epoch": 2037} {"train_loss": -12.468267440795898, "global_step": 342361, "epoch": 2037} {"train_loss": -12.375140190124512, "global_step": 342362, "epoch": 2037} {"train_loss": -12.581795692443848, "global_step": 342363, "epoch": 2037} {"train_loss": -12.486995697021484, "global_step": 342364, "epoch": 2037} {"train_loss": -12.30078125, "global_step": 342365, "epoch": 2037} {"train_loss": -12.157759666442871, "global_step": 342366, "epoch": 2037} {"train_loss": -11.421841621398926, "global_step": 342367, "epoch": 2037} {"train_loss": -12.088329315185547, "global_step": 342368, "epoch": 2037} {"train_loss": -12.423871994018555, "global_step": 342369, "epoch": 2037} {"train_loss": -12.105073928833008, "global_step": 342370, "epoch": 2037} {"train_loss": -11.549715042114258, "global_step": 342371, "epoch": 2037} {"train_loss": -12.229859352111816, "global_step": 342372, "epoch": 2037} {"train_loss": -12.28237533569336, "global_step": 342373, "epoch": 2037} {"train_loss": -12.063135147094727, "global_step": 342374, "epoch": 2037} {"train_loss": -11.960655212402344, "global_step": 342375, "epoch": 2037} {"train_loss": -12.148561477661133, "global_step": 342376, "epoch": 2037} {"train_loss": -11.831676483154297, "global_step": 342377, "epoch": 2037} {"train_loss": -12.25126838684082, "global_step": 342378, "epoch": 2037} {"train_loss": -11.616317749023438, "global_step": 342379, "epoch": 2037} {"train_loss": -11.289462089538574, "global_step": 342380, "epoch": 2037} {"train_loss": -9.518228530883789, "global_step": 342381, "epoch": 2037} {"train_loss": -10.010882377624512, "global_step": 342382, "epoch": 2037} {"train_loss": -11.871562509309678, "global_step": 342383, "epoch": 2037, "val_loss": 285999.625} {"train_loss": -10.293309211730957, "global_step": 342384, "epoch": 2038} {"train_loss": -7.7815260887146, "global_step": 342385, "epoch": 2038} {"train_loss": -9.376691818237305, "global_step": 342386, "epoch": 2038} {"train_loss": -10.262802124023438, "global_step": 342387, "epoch": 2038} {"train_loss": -8.83542537689209, "global_step": 342388, "epoch": 2038} {"train_loss": -9.312697410583496, "global_step": 342389, "epoch": 2038} {"train_loss": -8.496452331542969, "global_step": 342390, "epoch": 2038} {"train_loss": -9.316194534301758, "global_step": 342391, "epoch": 2038} {"train_loss": -7.808629989624023, "global_step": 342392, "epoch": 2038} {"train_loss": -7.4952850341796875, "global_step": 342393, "epoch": 2038} {"train_loss": -8.908260345458984, "global_step": 342394, "epoch": 2038} {"train_loss": -8.835391998291016, "global_step": 342395, "epoch": 2038} {"train_loss": -8.805375099182129, "global_step": 342396, "epoch": 2038} {"train_loss": -9.457062721252441, "global_step": 342397, "epoch": 2038} {"train_loss": -9.166581153869629, "global_step": 342398, "epoch": 2038} {"train_loss": -9.994952201843262, "global_step": 342399, "epoch": 2038} {"train_loss": -10.16761302947998, "global_step": 342400, "epoch": 2038} {"train_loss": -10.390840530395508, "global_step": 342401, "epoch": 2038} {"train_loss": -10.31408405303955, "global_step": 342402, "epoch": 2038} {"train_loss": -10.662714004516602, "global_step": 342403, "epoch": 2038} {"train_loss": -10.79251480102539, "global_step": 342404, "epoch": 2038} {"train_loss": -10.172721862792969, "global_step": 342405, "epoch": 2038} {"train_loss": -11.167688369750977, "global_step": 342406, "epoch": 2038} {"train_loss": -10.68626594543457, "global_step": 342407, "epoch": 2038} {"train_loss": -11.593281745910645, "global_step": 342408, "epoch": 2038} {"train_loss": -11.17330265045166, "global_step": 342409, "epoch": 2038} {"train_loss": -11.611639976501465, "global_step": 342410, "epoch": 2038} {"train_loss": -11.714184761047363, "global_step": 342411, "epoch": 2038} {"train_loss": -11.342028617858887, "global_step": 342412, "epoch": 2038} {"train_loss": -11.622501373291016, "global_step": 342413, "epoch": 2038} {"train_loss": -11.868042945861816, "global_step": 342414, "epoch": 2038} {"train_loss": -11.546634674072266, "global_step": 342415, "epoch": 2038} {"train_loss": -11.827593803405762, "global_step": 342416, "epoch": 2038} {"train_loss": -11.851767539978027, "global_step": 342417, "epoch": 2038} {"train_loss": -11.90353012084961, "global_step": 342418, "epoch": 2038} {"train_loss": -11.89624309539795, "global_step": 342419, "epoch": 2038} {"train_loss": -11.887250900268555, "global_step": 342420, "epoch": 2038} {"train_loss": -11.895654678344727, "global_step": 342421, "epoch": 2038} {"train_loss": -11.796648025512695, "global_step": 342422, "epoch": 2038} {"train_loss": -11.82404899597168, "global_step": 342423, "epoch": 2038} {"train_loss": -11.784265518188477, "global_step": 342424, "epoch": 2038} {"train_loss": -12.038314819335938, "global_step": 342425, "epoch": 2038} {"train_loss": -12.164299011230469, "global_step": 342426, "epoch": 2038} {"train_loss": -12.1769380569458, "global_step": 342427, "epoch": 2038} {"train_loss": -12.080770492553711, "global_step": 342428, "epoch": 2038} {"train_loss": -11.876226425170898, "global_step": 342429, "epoch": 2038} {"train_loss": -12.154232025146484, "global_step": 342430, "epoch": 2038} {"train_loss": -12.162208557128906, "global_step": 342431, "epoch": 2038} {"train_loss": -12.200303077697754, "global_step": 342432, "epoch": 2038} {"train_loss": -12.18971061706543, "global_step": 342433, "epoch": 2038} {"train_loss": -12.138914108276367, "global_step": 342434, "epoch": 2038} {"train_loss": -12.113245010375977, "global_step": 342435, "epoch": 2038} {"train_loss": -12.040328979492188, "global_step": 342436, "epoch": 2038} {"train_loss": -12.173152923583984, "global_step": 342437, "epoch": 2038} {"train_loss": -12.18008804321289, "global_step": 342438, "epoch": 2038} {"train_loss": -12.349452018737793, "global_step": 342439, "epoch": 2038} {"train_loss": -12.335065841674805, "global_step": 342440, "epoch": 2038} {"train_loss": -12.253256797790527, "global_step": 342441, "epoch": 2038} {"train_loss": -12.262434959411621, "global_step": 342442, "epoch": 2038} {"train_loss": -12.393391609191895, "global_step": 342443, "epoch": 2038} {"train_loss": -12.329126358032227, "global_step": 342444, "epoch": 2038} {"train_loss": -12.131963729858398, "global_step": 342445, "epoch": 2038} {"train_loss": -12.247072219848633, "global_step": 342446, "epoch": 2038} {"train_loss": -12.338396072387695, "global_step": 342447, "epoch": 2038} {"train_loss": -12.396844863891602, "global_step": 342448, "epoch": 2038} {"train_loss": -12.3922758102417, "global_step": 342449, "epoch": 2038} {"train_loss": -12.33111572265625, "global_step": 342450, "epoch": 2038} {"train_loss": -12.4293212890625, "global_step": 342451, "epoch": 2038} {"train_loss": -12.467632293701172, "global_step": 342452, "epoch": 2038} {"train_loss": -12.262983322143555, "global_step": 342453, "epoch": 2038} {"train_loss": -12.495367050170898, "global_step": 342454, "epoch": 2038} {"train_loss": -12.313993453979492, "global_step": 342455, "epoch": 2038} {"train_loss": -12.341459274291992, "global_step": 342456, "epoch": 2038} {"train_loss": -12.373123168945312, "global_step": 342457, "epoch": 2038} {"train_loss": -12.405241966247559, "global_step": 342458, "epoch": 2038} {"train_loss": -12.516889572143555, "global_step": 342459, "epoch": 2038} {"train_loss": -12.406017303466797, "global_step": 342460, "epoch": 2038} {"train_loss": -12.622390747070312, "global_step": 342461, "epoch": 2038} {"train_loss": -12.410688400268555, "global_step": 342462, "epoch": 2038} {"train_loss": -12.629388809204102, "global_step": 342463, "epoch": 2038} {"train_loss": -12.246238708496094, "global_step": 342464, "epoch": 2038} {"train_loss": -12.221729278564453, "global_step": 342465, "epoch": 2038} {"train_loss": -12.467100143432617, "global_step": 342466, "epoch": 2038} {"train_loss": -12.282913208007812, "global_step": 342467, "epoch": 2038} {"train_loss": -12.563596725463867, "global_step": 342468, "epoch": 2038} {"train_loss": -12.278302192687988, "global_step": 342469, "epoch": 2038} {"train_loss": -12.257791519165039, "global_step": 342470, "epoch": 2038} {"train_loss": -12.436843872070312, "global_step": 342471, "epoch": 2038} {"train_loss": -12.235227584838867, "global_step": 342472, "epoch": 2038} {"train_loss": -11.851310729980469, "global_step": 342473, "epoch": 2038} {"train_loss": -12.269886016845703, "global_step": 342474, "epoch": 2038} {"train_loss": -12.297304153442383, "global_step": 342475, "epoch": 2038} {"train_loss": -12.037117004394531, "global_step": 342476, "epoch": 2038} {"train_loss": -12.290184020996094, "global_step": 342477, "epoch": 2038} {"train_loss": -12.414596557617188, "global_step": 342478, "epoch": 2038} {"train_loss": -11.248023986816406, "global_step": 342479, "epoch": 2038} {"train_loss": -11.61276626586914, "global_step": 342480, "epoch": 2038} {"train_loss": -12.110130310058594, "global_step": 342481, "epoch": 2038} {"train_loss": -11.071049690246582, "global_step": 342482, "epoch": 2038} {"train_loss": -12.01137924194336, "global_step": 342483, "epoch": 2038} {"train_loss": -11.605875968933105, "global_step": 342484, "epoch": 2038} {"train_loss": -12.422800064086914, "global_step": 342485, "epoch": 2038} {"train_loss": -11.81044864654541, "global_step": 342486, "epoch": 2038} {"train_loss": -12.01701831817627, "global_step": 342487, "epoch": 2038} {"train_loss": -11.34644889831543, "global_step": 342488, "epoch": 2038} {"train_loss": -12.358673095703125, "global_step": 342489, "epoch": 2038} {"train_loss": -11.001764297485352, "global_step": 342490, "epoch": 2038} {"train_loss": -11.034546852111816, "global_step": 342491, "epoch": 2038} {"train_loss": -11.986625671386719, "global_step": 342492, "epoch": 2038} {"train_loss": -11.72266960144043, "global_step": 342493, "epoch": 2038} {"train_loss": -11.884876251220703, "global_step": 342494, "epoch": 2038} {"train_loss": -11.967874526977539, "global_step": 342495, "epoch": 2038} {"train_loss": -11.708074569702148, "global_step": 342496, "epoch": 2038} {"train_loss": -11.087749481201172, "global_step": 342497, "epoch": 2038} {"train_loss": -11.51260757446289, "global_step": 342498, "epoch": 2038} {"train_loss": -11.303861618041992, "global_step": 342499, "epoch": 2038} {"train_loss": -11.46976089477539, "global_step": 342500, "epoch": 2038} {"train_loss": -11.000864028930664, "global_step": 342501, "epoch": 2038} {"train_loss": -11.034879684448242, "global_step": 342502, "epoch": 2038} {"train_loss": -12.132280349731445, "global_step": 342503, "epoch": 2038} {"train_loss": -11.505488395690918, "global_step": 342504, "epoch": 2038} {"train_loss": -11.924518585205078, "global_step": 342505, "epoch": 2038} {"train_loss": -11.537951469421387, "global_step": 342506, "epoch": 2038} {"train_loss": -11.268499374389648, "global_step": 342507, "epoch": 2038} {"train_loss": -11.018178939819336, "global_step": 342508, "epoch": 2038} {"train_loss": -11.083606719970703, "global_step": 342509, "epoch": 2038} {"train_loss": -11.502561569213867, "global_step": 342510, "epoch": 2038} {"train_loss": -10.764152526855469, "global_step": 342511, "epoch": 2038} {"train_loss": -11.673561096191406, "global_step": 342512, "epoch": 2038} {"train_loss": -11.147987365722656, "global_step": 342513, "epoch": 2038} {"train_loss": -11.079429626464844, "global_step": 342514, "epoch": 2038} {"train_loss": -11.715486526489258, "global_step": 342515, "epoch": 2038} {"train_loss": -11.386468887329102, "global_step": 342516, "epoch": 2038} {"train_loss": -11.449596405029297, "global_step": 342517, "epoch": 2038} {"train_loss": -11.413726806640625, "global_step": 342518, "epoch": 2038} {"train_loss": -11.774044036865234, "global_step": 342519, "epoch": 2038} {"train_loss": -10.784526824951172, "global_step": 342520, "epoch": 2038} {"train_loss": -12.143402099609375, "global_step": 342521, "epoch": 2038} {"train_loss": -11.35035228729248, "global_step": 342522, "epoch": 2038} {"train_loss": -12.05931282043457, "global_step": 342523, "epoch": 2038} {"train_loss": -11.523110389709473, "global_step": 342524, "epoch": 2038} {"train_loss": -11.545884132385254, "global_step": 342525, "epoch": 2038} {"train_loss": -11.538809776306152, "global_step": 342526, "epoch": 2038} {"train_loss": -11.608652114868164, "global_step": 342527, "epoch": 2038} {"train_loss": -11.982220649719238, "global_step": 342528, "epoch": 2038} {"train_loss": -11.584115028381348, "global_step": 342529, "epoch": 2038} {"train_loss": -11.260367393493652, "global_step": 342530, "epoch": 2038} {"train_loss": -11.870841979980469, "global_step": 342531, "epoch": 2038} {"train_loss": -11.74693489074707, "global_step": 342532, "epoch": 2038} {"train_loss": -11.96806526184082, "global_step": 342533, "epoch": 2038} {"train_loss": -11.794021606445312, "global_step": 342534, "epoch": 2038} {"train_loss": -11.849055290222168, "global_step": 342535, "epoch": 2038} {"train_loss": -11.853941917419434, "global_step": 342536, "epoch": 2038} {"train_loss": -12.006162643432617, "global_step": 342537, "epoch": 2038} {"train_loss": -11.719528198242188, "global_step": 342538, "epoch": 2038} {"train_loss": -11.767580032348633, "global_step": 342539, "epoch": 2038} {"train_loss": -12.027652740478516, "global_step": 342540, "epoch": 2038} {"train_loss": -11.643473625183105, "global_step": 342541, "epoch": 2038} {"train_loss": -11.59862995147705, "global_step": 342542, "epoch": 2038} {"train_loss": -11.80638599395752, "global_step": 342543, "epoch": 2038} {"train_loss": -11.208481788635254, "global_step": 342544, "epoch": 2038} {"train_loss": -12.147964477539062, "global_step": 342545, "epoch": 2038} {"train_loss": -11.669650077819824, "global_step": 342546, "epoch": 2038} {"train_loss": -12.050110816955566, "global_step": 342547, "epoch": 2038} {"train_loss": -11.696467399597168, "global_step": 342548, "epoch": 2038} {"train_loss": -12.194337844848633, "global_step": 342549, "epoch": 2038} {"train_loss": -11.827888488769531, "global_step": 342550, "epoch": 2038} {"train_loss": -11.54618656919116, "global_step": 342551, "epoch": 2038, "val_loss": 286981.3125} {"train_loss": -12.224613189697266, "global_step": 342552, "epoch": 2039} {"train_loss": -12.113507270812988, "global_step": 342553, "epoch": 2039} {"train_loss": -12.295870780944824, "global_step": 342554, "epoch": 2039} {"train_loss": -12.111690521240234, "global_step": 342555, "epoch": 2039} {"train_loss": -12.222368240356445, "global_step": 342556, "epoch": 2039} {"train_loss": -12.376437187194824, "global_step": 342557, "epoch": 2039} {"train_loss": -12.326383590698242, "global_step": 342558, "epoch": 2039} {"train_loss": -12.283767700195312, "global_step": 342559, "epoch": 2039} {"train_loss": -12.300366401672363, "global_step": 342560, "epoch": 2039} {"train_loss": -12.253735542297363, "global_step": 342561, "epoch": 2039} {"train_loss": -12.366020202636719, "global_step": 342562, "epoch": 2039} {"train_loss": -12.176546096801758, "global_step": 342563, "epoch": 2039} {"train_loss": -12.236343383789062, "global_step": 342564, "epoch": 2039} {"train_loss": -12.537656784057617, "global_step": 342565, "epoch": 2039} {"train_loss": -12.62115478515625, "global_step": 342566, "epoch": 2039} {"train_loss": -12.395818710327148, "global_step": 342567, "epoch": 2039} {"train_loss": -12.376232147216797, "global_step": 342568, "epoch": 2039} {"train_loss": -12.543800354003906, "global_step": 342569, "epoch": 2039} {"train_loss": -12.397096633911133, "global_step": 342570, "epoch": 2039} {"train_loss": -12.426942825317383, "global_step": 342571, "epoch": 2039} {"train_loss": -12.410589218139648, "global_step": 342572, "epoch": 2039} {"train_loss": -12.388893127441406, "global_step": 342573, "epoch": 2039} {"train_loss": -12.469423294067383, "global_step": 342574, "epoch": 2039} {"train_loss": -12.3031587600708, "global_step": 342575, "epoch": 2039} {"train_loss": -12.482366561889648, "global_step": 342576, "epoch": 2039} {"train_loss": -12.07486343383789, "global_step": 342577, "epoch": 2039} {"train_loss": -12.588770866394043, "global_step": 342578, "epoch": 2039} {"train_loss": -12.348578453063965, "global_step": 342579, "epoch": 2039} {"train_loss": -12.372172355651855, "global_step": 342580, "epoch": 2039} {"train_loss": -11.93758773803711, "global_step": 342581, "epoch": 2039} {"train_loss": -12.495506286621094, "global_step": 342582, "epoch": 2039} {"train_loss": -12.223905563354492, "global_step": 342583, "epoch": 2039} {"train_loss": -12.136371612548828, "global_step": 342584, "epoch": 2039} {"train_loss": -12.376120567321777, "global_step": 342585, "epoch": 2039} {"train_loss": -12.118457794189453, "global_step": 342586, "epoch": 2039} {"train_loss": -11.977167129516602, "global_step": 342587, "epoch": 2039} {"train_loss": -12.055397987365723, "global_step": 342588, "epoch": 2039} {"train_loss": -12.403172492980957, "global_step": 342589, "epoch": 2039} {"train_loss": -11.795682907104492, "global_step": 342590, "epoch": 2039} {"train_loss": -12.094197273254395, "global_step": 342591, "epoch": 2039} {"train_loss": -12.064598083496094, "global_step": 342592, "epoch": 2039} {"train_loss": -12.213560104370117, "global_step": 342593, "epoch": 2039} {"train_loss": -12.39915657043457, "global_step": 342594, "epoch": 2039} {"train_loss": -11.9180269241333, "global_step": 342595, "epoch": 2039} {"train_loss": -11.991799354553223, "global_step": 342596, "epoch": 2039} {"train_loss": -12.127498626708984, "global_step": 342597, "epoch": 2039} {"train_loss": -11.9039306640625, "global_step": 342598, "epoch": 2039} {"train_loss": -12.004261016845703, "global_step": 342599, "epoch": 2039} {"train_loss": -12.092233657836914, "global_step": 342600, "epoch": 2039} {"train_loss": -12.358236312866211, "global_step": 342601, "epoch": 2039} {"train_loss": -12.175333023071289, "global_step": 342602, "epoch": 2039} {"train_loss": -12.383566856384277, "global_step": 342603, "epoch": 2039} {"train_loss": -12.21046257019043, "global_step": 342604, "epoch": 2039} {"train_loss": -12.320378303527832, "global_step": 342605, "epoch": 2039} {"train_loss": -12.474584579467773, "global_step": 342606, "epoch": 2039} {"train_loss": -12.343027114868164, "global_step": 342607, "epoch": 2039} {"train_loss": -12.092973709106445, "global_step": 342608, "epoch": 2039} {"train_loss": -12.187679290771484, "global_step": 342609, "epoch": 2039} {"train_loss": -12.190168380737305, "global_step": 342610, "epoch": 2039} {"train_loss": -11.812261581420898, "global_step": 342611, "epoch": 2039} {"train_loss": -12.273073196411133, "global_step": 342612, "epoch": 2039} {"train_loss": -12.006360054016113, "global_step": 342613, "epoch": 2039} {"train_loss": -12.501590728759766, "global_step": 342614, "epoch": 2039} {"train_loss": -12.473316192626953, "global_step": 342615, "epoch": 2039} {"train_loss": -12.13765811920166, "global_step": 342616, "epoch": 2039} {"train_loss": -12.251468658447266, "global_step": 342617, "epoch": 2039} {"train_loss": -12.305500030517578, "global_step": 342618, "epoch": 2039} {"train_loss": -12.009108543395996, "global_step": 342619, "epoch": 2039} {"train_loss": -12.41379165649414, "global_step": 342620, "epoch": 2039} {"train_loss": -12.609452247619629, "global_step": 342621, "epoch": 2039} {"train_loss": -12.620194435119629, "global_step": 342622, "epoch": 2039} {"train_loss": -12.517704010009766, "global_step": 342623, "epoch": 2039} {"train_loss": -12.645977020263672, "global_step": 342624, "epoch": 2039} {"train_loss": -12.543437957763672, "global_step": 342625, "epoch": 2039} {"train_loss": -12.549667358398438, "global_step": 342626, "epoch": 2039} {"train_loss": -12.423731803894043, "global_step": 342627, "epoch": 2039} {"train_loss": -12.443069458007812, "global_step": 342628, "epoch": 2039} {"train_loss": -12.127433776855469, "global_step": 342629, "epoch": 2039} {"train_loss": -12.380661964416504, "global_step": 342630, "epoch": 2039} {"train_loss": -12.255090713500977, "global_step": 342631, "epoch": 2039} {"train_loss": -12.385794639587402, "global_step": 342632, "epoch": 2039} {"train_loss": -12.435199737548828, "global_step": 342633, "epoch": 2039} {"train_loss": -12.56902027130127, "global_step": 342634, "epoch": 2039} {"train_loss": -12.36489200592041, "global_step": 342635, "epoch": 2039} {"train_loss": -12.58082103729248, "global_step": 342636, "epoch": 2039} {"train_loss": -12.617377281188965, "global_step": 342637, "epoch": 2039} {"train_loss": -12.42968463897705, "global_step": 342638, "epoch": 2039} {"train_loss": -12.484813690185547, "global_step": 342639, "epoch": 2039} {"train_loss": -12.171142578125, "global_step": 342640, "epoch": 2039} {"train_loss": -12.753689765930176, "global_step": 342641, "epoch": 2039} {"train_loss": -12.36361026763916, "global_step": 342642, "epoch": 2039} {"train_loss": -12.350156784057617, "global_step": 342643, "epoch": 2039} {"train_loss": -12.500333786010742, "global_step": 342644, "epoch": 2039} {"train_loss": -12.299795150756836, "global_step": 342645, "epoch": 2039} {"train_loss": -12.430875778198242, "global_step": 342646, "epoch": 2039} {"train_loss": -12.42184829711914, "global_step": 342647, "epoch": 2039} {"train_loss": -12.52126407623291, "global_step": 342648, "epoch": 2039} {"train_loss": -12.092830657958984, "global_step": 342649, "epoch": 2039} {"train_loss": -12.27505874633789, "global_step": 342650, "epoch": 2039} {"train_loss": -12.056903839111328, "global_step": 342651, "epoch": 2039} {"train_loss": -12.56074047088623, "global_step": 342652, "epoch": 2039} {"train_loss": -12.228757858276367, "global_step": 342653, "epoch": 2039} {"train_loss": -12.418048858642578, "global_step": 342654, "epoch": 2039} {"train_loss": -12.022207260131836, "global_step": 342655, "epoch": 2039} {"train_loss": -12.278545379638672, "global_step": 342656, "epoch": 2039} {"train_loss": -12.057535171508789, "global_step": 342657, "epoch": 2039} {"train_loss": -11.945633888244629, "global_step": 342658, "epoch": 2039} {"train_loss": -11.679740905761719, "global_step": 342659, "epoch": 2039} {"train_loss": -11.678492546081543, "global_step": 342660, "epoch": 2039} {"train_loss": -11.655454635620117, "global_step": 342661, "epoch": 2039} {"train_loss": -9.39797592163086, "global_step": 342662, "epoch": 2039} {"train_loss": -10.882196426391602, "global_step": 342663, "epoch": 2039} {"train_loss": -7.919192314147949, "global_step": 342664, "epoch": 2039} {"train_loss": -10.614192962646484, "global_step": 342665, "epoch": 2039} {"train_loss": -11.203093528747559, "global_step": 342666, "epoch": 2039} {"train_loss": -9.283333778381348, "global_step": 342667, "epoch": 2039} {"train_loss": -9.328203201293945, "global_step": 342668, "epoch": 2039} {"train_loss": -9.658191680908203, "global_step": 342669, "epoch": 2039} {"train_loss": -10.659278869628906, "global_step": 342670, "epoch": 2039} {"train_loss": -8.771890640258789, "global_step": 342671, "epoch": 2039} {"train_loss": -9.724956512451172, "global_step": 342672, "epoch": 2039} {"train_loss": -9.828330993652344, "global_step": 342673, "epoch": 2039} {"train_loss": -10.6516695022583, "global_step": 342674, "epoch": 2039} {"train_loss": -10.474583625793457, "global_step": 342675, "epoch": 2039} {"train_loss": -11.178217887878418, "global_step": 342676, "epoch": 2039} {"train_loss": -10.84221363067627, "global_step": 342677, "epoch": 2039} {"train_loss": -9.725955963134766, "global_step": 342678, "epoch": 2039} {"train_loss": -10.953815460205078, "global_step": 342679, "epoch": 2039} {"train_loss": -10.110172271728516, "global_step": 342680, "epoch": 2039} {"train_loss": -11.364133834838867, "global_step": 342681, "epoch": 2039} {"train_loss": -11.182184219360352, "global_step": 342682, "epoch": 2039} {"train_loss": -10.968558311462402, "global_step": 342683, "epoch": 2039} {"train_loss": -11.03561019897461, "global_step": 342684, "epoch": 2039} {"train_loss": -10.630027770996094, "global_step": 342685, "epoch": 2039} {"train_loss": -10.59787368774414, "global_step": 342686, "epoch": 2039} {"train_loss": -10.206008911132812, "global_step": 342687, "epoch": 2039} {"train_loss": -9.960872650146484, "global_step": 342688, "epoch": 2039} {"train_loss": -11.1756010055542, "global_step": 342689, "epoch": 2039} {"train_loss": -10.090590476989746, "global_step": 342690, "epoch": 2039} {"train_loss": -10.229710578918457, "global_step": 342691, "epoch": 2039} {"train_loss": -9.478139877319336, "global_step": 342692, "epoch": 2039} {"train_loss": -9.03549575805664, "global_step": 342693, "epoch": 2039} {"train_loss": -10.33423900604248, "global_step": 342694, "epoch": 2039} {"train_loss": -9.603083610534668, "global_step": 342695, "epoch": 2039} {"train_loss": -10.191143035888672, "global_step": 342696, "epoch": 2039} {"train_loss": -10.124367713928223, "global_step": 342697, "epoch": 2039} {"train_loss": -9.74075984954834, "global_step": 342698, "epoch": 2039} {"train_loss": -11.622478485107422, "global_step": 342699, "epoch": 2039} {"train_loss": -9.329936981201172, "global_step": 342700, "epoch": 2039} {"train_loss": -9.926301956176758, "global_step": 342701, "epoch": 2039} {"train_loss": -9.75796890258789, "global_step": 342702, "epoch": 2039} {"train_loss": -10.911762237548828, "global_step": 342703, "epoch": 2039} {"train_loss": -10.373674392700195, "global_step": 342704, "epoch": 2039} {"train_loss": -9.92262077331543, "global_step": 342705, "epoch": 2039} {"train_loss": -10.446194648742676, "global_step": 342706, "epoch": 2039} {"train_loss": -9.869182586669922, "global_step": 342707, "epoch": 2039} {"train_loss": -10.954036712646484, "global_step": 342708, "epoch": 2039} {"train_loss": -10.703472137451172, "global_step": 342709, "epoch": 2039} {"train_loss": -10.45387077331543, "global_step": 342710, "epoch": 2039} {"train_loss": -11.219572067260742, "global_step": 342711, "epoch": 2039} {"train_loss": -10.925674438476562, "global_step": 342712, "epoch": 2039} {"train_loss": -10.804866790771484, "global_step": 342713, "epoch": 2039} {"train_loss": -11.267131805419922, "global_step": 342714, "epoch": 2039} {"train_loss": -11.52242660522461, "global_step": 342715, "epoch": 2039} {"train_loss": -11.348260879516602, "global_step": 342716, "epoch": 2039} {"train_loss": -11.692773818969727, "global_step": 342717, "epoch": 2039} {"train_loss": -11.275741577148438, "global_step": 342718, "epoch": 2039} {"train_loss": -11.632072062719436, "global_step": 342719, "epoch": 2039, "val_loss": 284482.75} {"train_loss": -11.485578536987305, "global_step": 342720, "epoch": 2040} {"train_loss": -11.843907356262207, "global_step": 342721, "epoch": 2040} {"train_loss": -11.58568000793457, "global_step": 342722, "epoch": 2040} {"train_loss": -12.040260314941406, "global_step": 342723, "epoch": 2040} {"train_loss": -11.851513862609863, "global_step": 342724, "epoch": 2040} {"train_loss": -12.145988464355469, "global_step": 342725, "epoch": 2040} {"train_loss": -11.806439399719238, "global_step": 342726, "epoch": 2040} {"train_loss": -11.878978729248047, "global_step": 342727, "epoch": 2040} {"train_loss": -11.874409675598145, "global_step": 342728, "epoch": 2040} {"train_loss": -11.90237045288086, "global_step": 342729, "epoch": 2040} {"train_loss": -11.92124080657959, "global_step": 342730, "epoch": 2040} {"train_loss": -12.01772403717041, "global_step": 342731, "epoch": 2040} {"train_loss": -11.671581268310547, "global_step": 342732, "epoch": 2040} {"train_loss": -12.160602569580078, "global_step": 342733, "epoch": 2040} {"train_loss": -11.927518844604492, "global_step": 342734, "epoch": 2040} {"train_loss": -12.332725524902344, "global_step": 342735, "epoch": 2040} {"train_loss": -11.936725616455078, "global_step": 342736, "epoch": 2040} {"train_loss": -12.051090240478516, "global_step": 342737, "epoch": 2040} {"train_loss": -12.021411895751953, "global_step": 342738, "epoch": 2040} {"train_loss": -12.068166732788086, "global_step": 342739, "epoch": 2040} {"train_loss": -12.169608116149902, "global_step": 342740, "epoch": 2040} {"train_loss": -11.928426742553711, "global_step": 342741, "epoch": 2040} {"train_loss": -12.263402938842773, "global_step": 342742, "epoch": 2040} {"train_loss": -12.248241424560547, "global_step": 342743, "epoch": 2040} {"train_loss": -12.035236358642578, "global_step": 342744, "epoch": 2040} {"train_loss": -12.001537322998047, "global_step": 342745, "epoch": 2040} {"train_loss": -12.257574081420898, "global_step": 342746, "epoch": 2040} {"train_loss": -12.158971786499023, "global_step": 342747, "epoch": 2040} {"train_loss": -12.297515869140625, "global_step": 342748, "epoch": 2040} {"train_loss": -12.353287696838379, "global_step": 342749, "epoch": 2040} {"train_loss": -12.32939624786377, "global_step": 342750, "epoch": 2040} {"train_loss": -12.242414474487305, "global_step": 342751, "epoch": 2040} {"train_loss": -12.371916770935059, "global_step": 342752, "epoch": 2040} {"train_loss": -12.354230880737305, "global_step": 342753, "epoch": 2040} {"train_loss": -12.326263427734375, "global_step": 342754, "epoch": 2040} {"train_loss": -12.399515151977539, "global_step": 342755, "epoch": 2040} {"train_loss": -12.260696411132812, "global_step": 342756, "epoch": 2040} {"train_loss": -12.168438911437988, "global_step": 342757, "epoch": 2040} {"train_loss": -12.516494750976562, "global_step": 342758, "epoch": 2040} {"train_loss": -12.452394485473633, "global_step": 342759, "epoch": 2040} {"train_loss": -12.503955841064453, "global_step": 342760, "epoch": 2040} {"train_loss": -12.48573112487793, "global_step": 342761, "epoch": 2040} {"train_loss": -12.48594856262207, "global_step": 342762, "epoch": 2040} {"train_loss": -12.370745658874512, "global_step": 342763, "epoch": 2040} {"train_loss": -12.458175659179688, "global_step": 342764, "epoch": 2040} {"train_loss": -12.41897964477539, "global_step": 342765, "epoch": 2040} {"train_loss": -12.411909103393555, "global_step": 342766, "epoch": 2040} {"train_loss": -12.523188591003418, "global_step": 342767, "epoch": 2040} {"train_loss": -12.48814582824707, "global_step": 342768, "epoch": 2040} {"train_loss": -12.422143936157227, "global_step": 342769, "epoch": 2040} {"train_loss": -12.546299934387207, "global_step": 342770, "epoch": 2040} {"train_loss": -12.55665397644043, "global_step": 342771, "epoch": 2040} {"train_loss": -12.613637924194336, "global_step": 342772, "epoch": 2040} {"train_loss": -12.45869255065918, "global_step": 342773, "epoch": 2040} {"train_loss": -12.781173706054688, "global_step": 342774, "epoch": 2040} {"train_loss": -12.277322769165039, "global_step": 342775, "epoch": 2040} {"train_loss": -12.433806419372559, "global_step": 342776, "epoch": 2040} {"train_loss": -12.713996887207031, "global_step": 342777, "epoch": 2040} {"train_loss": -12.596086502075195, "global_step": 342778, "epoch": 2040} {"train_loss": -12.643749237060547, "global_step": 342779, "epoch": 2040} {"train_loss": -12.466567993164062, "global_step": 342780, "epoch": 2040} {"train_loss": -12.59440803527832, "global_step": 342781, "epoch": 2040} {"train_loss": -12.722310066223145, "global_step": 342782, "epoch": 2040} {"train_loss": -12.627141952514648, "global_step": 342783, "epoch": 2040} {"train_loss": -12.497831344604492, "global_step": 342784, "epoch": 2040} {"train_loss": -12.68071460723877, "global_step": 342785, "epoch": 2040} {"train_loss": -12.745229721069336, "global_step": 342786, "epoch": 2040} {"train_loss": -12.671343803405762, "global_step": 342787, "epoch": 2040} {"train_loss": -12.58438491821289, "global_step": 342788, "epoch": 2040} {"train_loss": -12.505937576293945, "global_step": 342789, "epoch": 2040} {"train_loss": -12.646997451782227, "global_step": 342790, "epoch": 2040} {"train_loss": -12.502704620361328, "global_step": 342791, "epoch": 2040} {"train_loss": -12.579056739807129, "global_step": 342792, "epoch": 2040} {"train_loss": -12.583040237426758, "global_step": 342793, "epoch": 2040} {"train_loss": -12.61953353881836, "global_step": 342794, "epoch": 2040} {"train_loss": -12.749892234802246, "global_step": 342795, "epoch": 2040} {"train_loss": -12.72681999206543, "global_step": 342796, "epoch": 2040} {"train_loss": -12.66749382019043, "global_step": 342797, "epoch": 2040} {"train_loss": -12.66208267211914, "global_step": 342798, "epoch": 2040} {"train_loss": -12.734434127807617, "global_step": 342799, "epoch": 2040} {"train_loss": -11.627510070800781, "global_step": 342800, "epoch": 2040} {"train_loss": -12.259237289428711, "global_step": 342801, "epoch": 2040} {"train_loss": -12.201981544494629, "global_step": 342802, "epoch": 2040} {"train_loss": -12.354595184326172, "global_step": 342803, "epoch": 2040} {"train_loss": -12.015268325805664, "global_step": 342804, "epoch": 2040} {"train_loss": -12.171220779418945, "global_step": 342805, "epoch": 2040} {"train_loss": -12.217878341674805, "global_step": 342806, "epoch": 2040} {"train_loss": -11.90877914428711, "global_step": 342807, "epoch": 2040} {"train_loss": -12.053569793701172, "global_step": 342808, "epoch": 2040} {"train_loss": -11.813850402832031, "global_step": 342809, "epoch": 2040} {"train_loss": -10.86475944519043, "global_step": 342810, "epoch": 2040} {"train_loss": -10.239380836486816, "global_step": 342811, "epoch": 2040} {"train_loss": -11.294225692749023, "global_step": 342812, "epoch": 2040} {"train_loss": -12.275402069091797, "global_step": 342813, "epoch": 2040} {"train_loss": -10.857364654541016, "global_step": 342814, "epoch": 2040} {"train_loss": -11.468524932861328, "global_step": 342815, "epoch": 2040} {"train_loss": -11.362850189208984, "global_step": 342816, "epoch": 2040} {"train_loss": -11.628347396850586, "global_step": 342817, "epoch": 2040} {"train_loss": -10.89700698852539, "global_step": 342818, "epoch": 2040} {"train_loss": -12.493328094482422, "global_step": 342819, "epoch": 2040} {"train_loss": -11.26530647277832, "global_step": 342820, "epoch": 2040} {"train_loss": -10.624382972717285, "global_step": 342821, "epoch": 2040} {"train_loss": -11.438207626342773, "global_step": 342822, "epoch": 2040} {"train_loss": -11.310380935668945, "global_step": 342823, "epoch": 2040} {"train_loss": -10.436333656311035, "global_step": 342824, "epoch": 2040} {"train_loss": -10.586596488952637, "global_step": 342825, "epoch": 2040} {"train_loss": -11.488435745239258, "global_step": 342826, "epoch": 2040} {"train_loss": -10.75220775604248, "global_step": 342827, "epoch": 2040} {"train_loss": -11.069104194641113, "global_step": 342828, "epoch": 2040} {"train_loss": -10.039321899414062, "global_step": 342829, "epoch": 2040} {"train_loss": -11.053607940673828, "global_step": 342830, "epoch": 2040} {"train_loss": -10.674699783325195, "global_step": 342831, "epoch": 2040} {"train_loss": -10.300724029541016, "global_step": 342832, "epoch": 2040} {"train_loss": -11.278966903686523, "global_step": 342833, "epoch": 2040} {"train_loss": -9.48361587524414, "global_step": 342834, "epoch": 2040} {"train_loss": -10.108261108398438, "global_step": 342835, "epoch": 2040} {"train_loss": -11.606460571289062, "global_step": 342836, "epoch": 2040} {"train_loss": -10.201679229736328, "global_step": 342837, "epoch": 2040} {"train_loss": -10.133995056152344, "global_step": 342838, "epoch": 2040} {"train_loss": -11.528755187988281, "global_step": 342839, "epoch": 2040} {"train_loss": -10.5589599609375, "global_step": 342840, "epoch": 2040} {"train_loss": -11.551130294799805, "global_step": 342841, "epoch": 2040} {"train_loss": -11.53235912322998, "global_step": 342842, "epoch": 2040} {"train_loss": -11.415163040161133, "global_step": 342843, "epoch": 2040} {"train_loss": -11.382102966308594, "global_step": 342844, "epoch": 2040} {"train_loss": -11.401023864746094, "global_step": 342845, "epoch": 2040} {"train_loss": -11.323409080505371, "global_step": 342846, "epoch": 2040} {"train_loss": -11.558913230895996, "global_step": 342847, "epoch": 2040} {"train_loss": -11.655917167663574, "global_step": 342848, "epoch": 2040} {"train_loss": -11.202898025512695, "global_step": 342849, "epoch": 2040} {"train_loss": -11.350055694580078, "global_step": 342850, "epoch": 2040} {"train_loss": -11.069467544555664, "global_step": 342851, "epoch": 2040} {"train_loss": -11.520905494689941, "global_step": 342852, "epoch": 2040} {"train_loss": -11.27807331085205, "global_step": 342853, "epoch": 2040} {"train_loss": -11.963361740112305, "global_step": 342854, "epoch": 2040} {"train_loss": -11.616523742675781, "global_step": 342855, "epoch": 2040} {"train_loss": -11.742402076721191, "global_step": 342856, "epoch": 2040} {"train_loss": -11.689078330993652, "global_step": 342857, "epoch": 2040} {"train_loss": -11.531511306762695, "global_step": 342858, "epoch": 2040} {"train_loss": -11.53042221069336, "global_step": 342859, "epoch": 2040} {"train_loss": -11.396052360534668, "global_step": 342860, "epoch": 2040} {"train_loss": -11.746969223022461, "global_step": 342861, "epoch": 2040} {"train_loss": -11.282856941223145, "global_step": 342862, "epoch": 2040} {"train_loss": -11.564336776733398, "global_step": 342863, "epoch": 2040} {"train_loss": -11.996533393859863, "global_step": 342864, "epoch": 2040} {"train_loss": -11.406970977783203, "global_step": 342865, "epoch": 2040} {"train_loss": -11.608612060546875, "global_step": 342866, "epoch": 2040} {"train_loss": -10.685176849365234, "global_step": 342867, "epoch": 2040} {"train_loss": -11.57505989074707, "global_step": 342868, "epoch": 2040} {"train_loss": -11.699665069580078, "global_step": 342869, "epoch": 2040} {"train_loss": -11.704761505126953, "global_step": 342870, "epoch": 2040} {"train_loss": -11.618456840515137, "global_step": 342871, "epoch": 2040} {"train_loss": -11.398667335510254, "global_step": 342872, "epoch": 2040} {"train_loss": -11.927074432373047, "global_step": 342873, "epoch": 2040} {"train_loss": -11.396223068237305, "global_step": 342874, "epoch": 2040} {"train_loss": -11.627723693847656, "global_step": 342875, "epoch": 2040} {"train_loss": -11.505200386047363, "global_step": 342876, "epoch": 2040} {"train_loss": -11.64888858795166, "global_step": 342877, "epoch": 2040} {"train_loss": -11.48388957977295, "global_step": 342878, "epoch": 2040} {"train_loss": -11.862199783325195, "global_step": 342879, "epoch": 2040} {"train_loss": -11.651447296142578, "global_step": 342880, "epoch": 2040} {"train_loss": -11.788996696472168, "global_step": 342881, "epoch": 2040} {"train_loss": -11.888568878173828, "global_step": 342882, "epoch": 2040} {"train_loss": -11.223394393920898, "global_step": 342883, "epoch": 2040} {"train_loss": -11.997803688049316, "global_step": 342884, "epoch": 2040} {"train_loss": -12.172528266906738, "global_step": 342885, "epoch": 2040} {"train_loss": -11.766477584838867, "global_step": 342886, "epoch": 2040} {"train_loss": -11.848065245719184, "global_step": 342887, "epoch": 2040, "val_loss": 285324.0625, "train_action_mse_error": 1.2997770309448242} {"train_loss": -12.00082015991211, "global_step": 342888, "epoch": 2041} {"train_loss": -12.023590087890625, "global_step": 342889, "epoch": 2041} {"train_loss": -11.661457061767578, "global_step": 342890, "epoch": 2041} {"train_loss": -12.048867225646973, "global_step": 342891, "epoch": 2041} {"train_loss": -12.098323822021484, "global_step": 342892, "epoch": 2041} {"train_loss": -12.304922103881836, "global_step": 342893, "epoch": 2041} {"train_loss": -12.167133331298828, "global_step": 342894, "epoch": 2041} {"train_loss": -12.12933349609375, "global_step": 342895, "epoch": 2041} {"train_loss": -12.212099075317383, "global_step": 342896, "epoch": 2041} {"train_loss": -12.075566291809082, "global_step": 342897, "epoch": 2041} {"train_loss": -12.420907974243164, "global_step": 342898, "epoch": 2041} {"train_loss": -12.061331748962402, "global_step": 342899, "epoch": 2041} {"train_loss": -12.404645919799805, "global_step": 342900, "epoch": 2041} {"train_loss": -12.220054626464844, "global_step": 342901, "epoch": 2041} {"train_loss": -12.456390380859375, "global_step": 342902, "epoch": 2041} {"train_loss": -12.131895065307617, "global_step": 342903, "epoch": 2041} {"train_loss": -12.463003158569336, "global_step": 342904, "epoch": 2041} {"train_loss": -12.244283676147461, "global_step": 342905, "epoch": 2041} {"train_loss": -12.361701965332031, "global_step": 342906, "epoch": 2041} {"train_loss": -12.131985664367676, "global_step": 342907, "epoch": 2041} {"train_loss": -12.305046081542969, "global_step": 342908, "epoch": 2041} {"train_loss": -12.33663272857666, "global_step": 342909, "epoch": 2041} {"train_loss": -12.278406143188477, "global_step": 342910, "epoch": 2041} {"train_loss": -12.412113189697266, "global_step": 342911, "epoch": 2041} {"train_loss": -12.057487487792969, "global_step": 342912, "epoch": 2041} {"train_loss": -12.370266914367676, "global_step": 342913, "epoch": 2041} {"train_loss": -12.226383209228516, "global_step": 342914, "epoch": 2041} {"train_loss": -12.454668045043945, "global_step": 342915, "epoch": 2041} {"train_loss": -12.446246147155762, "global_step": 342916, "epoch": 2041} {"train_loss": -12.345134735107422, "global_step": 342917, "epoch": 2041} {"train_loss": -12.508687973022461, "global_step": 342918, "epoch": 2041} {"train_loss": -12.277631759643555, "global_step": 342919, "epoch": 2041} {"train_loss": -12.272980690002441, "global_step": 342920, "epoch": 2041} {"train_loss": -12.575494766235352, "global_step": 342921, "epoch": 2041} {"train_loss": -12.373342514038086, "global_step": 342922, "epoch": 2041} {"train_loss": -12.329427719116211, "global_step": 342923, "epoch": 2041} {"train_loss": -12.185670852661133, "global_step": 342924, "epoch": 2041} {"train_loss": -12.487748146057129, "global_step": 342925, "epoch": 2041} {"train_loss": -11.619573593139648, "global_step": 342926, "epoch": 2041} {"train_loss": -11.44436264038086, "global_step": 342927, "epoch": 2041} {"train_loss": -12.00546932220459, "global_step": 342928, "epoch": 2041} {"train_loss": -12.005444526672363, "global_step": 342929, "epoch": 2041} {"train_loss": -11.77401065826416, "global_step": 342930, "epoch": 2041} {"train_loss": -11.44566535949707, "global_step": 342931, "epoch": 2041} {"train_loss": -12.230403900146484, "global_step": 342932, "epoch": 2041} {"train_loss": -12.148703575134277, "global_step": 342933, "epoch": 2041} {"train_loss": -11.577973365783691, "global_step": 342934, "epoch": 2041} {"train_loss": -12.101749420166016, "global_step": 342935, "epoch": 2041} {"train_loss": -12.4478759765625, "global_step": 342936, "epoch": 2041} {"train_loss": -12.209684371948242, "global_step": 342937, "epoch": 2041} {"train_loss": -12.103265762329102, "global_step": 342938, "epoch": 2041} {"train_loss": -12.347116470336914, "global_step": 342939, "epoch": 2041} {"train_loss": -11.813592910766602, "global_step": 342940, "epoch": 2041} {"train_loss": -12.235603332519531, "global_step": 342941, "epoch": 2041} {"train_loss": -11.68878173828125, "global_step": 342942, "epoch": 2041} {"train_loss": -12.247225761413574, "global_step": 342943, "epoch": 2041} {"train_loss": -12.329967498779297, "global_step": 342944, "epoch": 2041} {"train_loss": -12.20484733581543, "global_step": 342945, "epoch": 2041} {"train_loss": -12.329695701599121, "global_step": 342946, "epoch": 2041} {"train_loss": -12.163043975830078, "global_step": 342947, "epoch": 2041} {"train_loss": -12.462298393249512, "global_step": 342948, "epoch": 2041} {"train_loss": -12.589534759521484, "global_step": 342949, "epoch": 2041} {"train_loss": -11.869474411010742, "global_step": 342950, "epoch": 2041} {"train_loss": -12.551673889160156, "global_step": 342951, "epoch": 2041} {"train_loss": -11.93459701538086, "global_step": 342952, "epoch": 2041} {"train_loss": -12.32155704498291, "global_step": 342953, "epoch": 2041} {"train_loss": -12.10545825958252, "global_step": 342954, "epoch": 2041} {"train_loss": -12.424521446228027, "global_step": 342955, "epoch": 2041} {"train_loss": -12.20048713684082, "global_step": 342956, "epoch": 2041} {"train_loss": -11.823068618774414, "global_step": 342957, "epoch": 2041} {"train_loss": -12.606975555419922, "global_step": 342958, "epoch": 2041} {"train_loss": -12.448456764221191, "global_step": 342959, "epoch": 2041} {"train_loss": -12.37394905090332, "global_step": 342960, "epoch": 2041} {"train_loss": -12.367944717407227, "global_step": 342961, "epoch": 2041} {"train_loss": -12.446788787841797, "global_step": 342962, "epoch": 2041} {"train_loss": -12.479229927062988, "global_step": 342963, "epoch": 2041} {"train_loss": -12.339751243591309, "global_step": 342964, "epoch": 2041} {"train_loss": -12.602180480957031, "global_step": 342965, "epoch": 2041} {"train_loss": -12.299453735351562, "global_step": 342966, "epoch": 2041} {"train_loss": -12.182777404785156, "global_step": 342967, "epoch": 2041} {"train_loss": -12.459556579589844, "global_step": 342968, "epoch": 2041} {"train_loss": -12.615800857543945, "global_step": 342969, "epoch": 2041} {"train_loss": -12.42132568359375, "global_step": 342970, "epoch": 2041} {"train_loss": -12.348859786987305, "global_step": 342971, "epoch": 2041} {"train_loss": -12.340957641601562, "global_step": 342972, "epoch": 2041} {"train_loss": -12.449674606323242, "global_step": 342973, "epoch": 2041} {"train_loss": -12.253657341003418, "global_step": 342974, "epoch": 2041} {"train_loss": -12.490028381347656, "global_step": 342975, "epoch": 2041} {"train_loss": -12.31550407409668, "global_step": 342976, "epoch": 2041} {"train_loss": -12.149328231811523, "global_step": 342977, "epoch": 2041} {"train_loss": -12.160736083984375, "global_step": 342978, "epoch": 2041} {"train_loss": -12.45648193359375, "global_step": 342979, "epoch": 2041} {"train_loss": -12.612405776977539, "global_step": 342980, "epoch": 2041} {"train_loss": -12.577245712280273, "global_step": 342981, "epoch": 2041} {"train_loss": -12.424516677856445, "global_step": 342982, "epoch": 2041} {"train_loss": -12.176528930664062, "global_step": 342983, "epoch": 2041} {"train_loss": -12.365205764770508, "global_step": 342984, "epoch": 2041} {"train_loss": -12.120370864868164, "global_step": 342985, "epoch": 2041} {"train_loss": -11.956031799316406, "global_step": 342986, "epoch": 2041} {"train_loss": -11.836883544921875, "global_step": 342987, "epoch": 2041} {"train_loss": -12.090850830078125, "global_step": 342988, "epoch": 2041} {"train_loss": -10.731534957885742, "global_step": 342989, "epoch": 2041} {"train_loss": -11.843168258666992, "global_step": 342990, "epoch": 2041} {"train_loss": -11.780656814575195, "global_step": 342991, "epoch": 2041} {"train_loss": -11.108841896057129, "global_step": 342992, "epoch": 2041} {"train_loss": -11.491010665893555, "global_step": 342993, "epoch": 2041} {"train_loss": -12.166619300842285, "global_step": 342994, "epoch": 2041} {"train_loss": -11.240242004394531, "global_step": 342995, "epoch": 2041} {"train_loss": -11.865177154541016, "global_step": 342996, "epoch": 2041} {"train_loss": -11.295656204223633, "global_step": 342997, "epoch": 2041} {"train_loss": -11.09471321105957, "global_step": 342998, "epoch": 2041} {"train_loss": -11.680638313293457, "global_step": 342999, "epoch": 2041} {"train_loss": -12.110363006591797, "global_step": 343000, "epoch": 2041} {"train_loss": -11.634897232055664, "global_step": 343001, "epoch": 2041} {"train_loss": -10.435287475585938, "global_step": 343002, "epoch": 2041} {"train_loss": -12.279749870300293, "global_step": 343003, "epoch": 2041} {"train_loss": -11.838237762451172, "global_step": 343004, "epoch": 2041} {"train_loss": -11.310032844543457, "global_step": 343005, "epoch": 2041} {"train_loss": -11.254737854003906, "global_step": 343006, "epoch": 2041} {"train_loss": -12.095535278320312, "global_step": 343007, "epoch": 2041} {"train_loss": -11.446188926696777, "global_step": 343008, "epoch": 2041} {"train_loss": -11.89642333984375, "global_step": 343009, "epoch": 2041} {"train_loss": -11.097051620483398, "global_step": 343010, "epoch": 2041} {"train_loss": -11.538334846496582, "global_step": 343011, "epoch": 2041} {"train_loss": -10.728026390075684, "global_step": 343012, "epoch": 2041} {"train_loss": -11.311779022216797, "global_step": 343013, "epoch": 2041} {"train_loss": -10.968936920166016, "global_step": 343014, "epoch": 2041} {"train_loss": -10.130058288574219, "global_step": 343015, "epoch": 2041} {"train_loss": -11.14059829711914, "global_step": 343016, "epoch": 2041} {"train_loss": -10.56387710571289, "global_step": 343017, "epoch": 2041} {"train_loss": -10.866497039794922, "global_step": 343018, "epoch": 2041} {"train_loss": -10.148882865905762, "global_step": 343019, "epoch": 2041} {"train_loss": -9.17760944366455, "global_step": 343020, "epoch": 2041} {"train_loss": -8.495174407958984, "global_step": 343021, "epoch": 2041} {"train_loss": -11.377401351928711, "global_step": 343022, "epoch": 2041} {"train_loss": -7.991787910461426, "global_step": 343023, "epoch": 2041} {"train_loss": -9.56247329711914, "global_step": 343024, "epoch": 2041} {"train_loss": -10.027862548828125, "global_step": 343025, "epoch": 2041} {"train_loss": -10.672409057617188, "global_step": 343026, "epoch": 2041} {"train_loss": -10.140417098999023, "global_step": 343027, "epoch": 2041} {"train_loss": -11.089823722839355, "global_step": 343028, "epoch": 2041} {"train_loss": -9.889118194580078, "global_step": 343029, "epoch": 2041} {"train_loss": -10.99438762664795, "global_step": 343030, "epoch": 2041} {"train_loss": -10.087486267089844, "global_step": 343031, "epoch": 2041} {"train_loss": -10.68105697631836, "global_step": 343032, "epoch": 2041} {"train_loss": -9.714056015014648, "global_step": 343033, "epoch": 2041} {"train_loss": -10.352700233459473, "global_step": 343034, "epoch": 2041} {"train_loss": -10.970820426940918, "global_step": 343035, "epoch": 2041} {"train_loss": -10.7867431640625, "global_step": 343036, "epoch": 2041} {"train_loss": -11.037895202636719, "global_step": 343037, "epoch": 2041} {"train_loss": -10.630249977111816, "global_step": 343038, "epoch": 2041} {"train_loss": -11.190983772277832, "global_step": 343039, "epoch": 2041} {"train_loss": -10.353931427001953, "global_step": 343040, "epoch": 2041} {"train_loss": -11.489681243896484, "global_step": 343041, "epoch": 2041} {"train_loss": -10.902755737304688, "global_step": 343042, "epoch": 2041} {"train_loss": -11.71776008605957, "global_step": 343043, "epoch": 2041} {"train_loss": -11.52703857421875, "global_step": 343044, "epoch": 2041} {"train_loss": -11.876572608947754, "global_step": 343045, "epoch": 2041} {"train_loss": -11.693265914916992, "global_step": 343046, "epoch": 2041} {"train_loss": -11.748180389404297, "global_step": 343047, "epoch": 2041} {"train_loss": -11.814020156860352, "global_step": 343048, "epoch": 2041} {"train_loss": -11.878894805908203, "global_step": 343049, "epoch": 2041} {"train_loss": -11.925470352172852, "global_step": 343050, "epoch": 2041} {"train_loss": -11.876781463623047, "global_step": 343051, "epoch": 2041} {"train_loss": -12.123394012451172, "global_step": 343052, "epoch": 2041} {"train_loss": -11.957630157470703, "global_step": 343053, "epoch": 2041} {"train_loss": -11.862390518188477, "global_step": 343054, "epoch": 2041} {"train_loss": -11.773161116100493, "global_step": 343055, "epoch": 2041, "val_loss": 284069.625} {"train_loss": -11.58043384552002, "global_step": 343056, "epoch": 2042} {"train_loss": -11.923398971557617, "global_step": 343057, "epoch": 2042} {"train_loss": -11.9508638381958, "global_step": 343058, "epoch": 2042} {"train_loss": -12.017160415649414, "global_step": 343059, "epoch": 2042} {"train_loss": -11.888465881347656, "global_step": 343060, "epoch": 2042} {"train_loss": -11.765813827514648, "global_step": 343061, "epoch": 2042} {"train_loss": -11.892950057983398, "global_step": 343062, "epoch": 2042} {"train_loss": -11.79147720336914, "global_step": 343063, "epoch": 2042} {"train_loss": -12.019107818603516, "global_step": 343064, "epoch": 2042} {"train_loss": -11.978726387023926, "global_step": 343065, "epoch": 2042} {"train_loss": -12.122377395629883, "global_step": 343066, "epoch": 2042} {"train_loss": -11.965967178344727, "global_step": 343067, "epoch": 2042} {"train_loss": -11.923440933227539, "global_step": 343068, "epoch": 2042} {"train_loss": -11.950538635253906, "global_step": 343069, "epoch": 2042} {"train_loss": -12.113924980163574, "global_step": 343070, "epoch": 2042} {"train_loss": -12.095779418945312, "global_step": 343071, "epoch": 2042} {"train_loss": -12.198423385620117, "global_step": 343072, "epoch": 2042} {"train_loss": -12.152048110961914, "global_step": 343073, "epoch": 2042} {"train_loss": -12.212961196899414, "global_step": 343074, "epoch": 2042} {"train_loss": -12.35479736328125, "global_step": 343075, "epoch": 2042} {"train_loss": -12.143949508666992, "global_step": 343076, "epoch": 2042} {"train_loss": -12.38497257232666, "global_step": 343077, "epoch": 2042} {"train_loss": -12.262747764587402, "global_step": 343078, "epoch": 2042} {"train_loss": -12.228248596191406, "global_step": 343079, "epoch": 2042} {"train_loss": -12.279518127441406, "global_step": 343080, "epoch": 2042} {"train_loss": -12.215381622314453, "global_step": 343081, "epoch": 2042} {"train_loss": -12.21200942993164, "global_step": 343082, "epoch": 2042} {"train_loss": -12.247465133666992, "global_step": 343083, "epoch": 2042} {"train_loss": -12.502327919006348, "global_step": 343084, "epoch": 2042} {"train_loss": -12.318256378173828, "global_step": 343085, "epoch": 2042} {"train_loss": -12.322546005249023, "global_step": 343086, "epoch": 2042} {"train_loss": -12.384828567504883, "global_step": 343087, "epoch": 2042} {"train_loss": -12.539050102233887, "global_step": 343088, "epoch": 2042} {"train_loss": -12.277316093444824, "global_step": 343089, "epoch": 2042} {"train_loss": -12.480757713317871, "global_step": 343090, "epoch": 2042} {"train_loss": -12.372137069702148, "global_step": 343091, "epoch": 2042} {"train_loss": -12.344860076904297, "global_step": 343092, "epoch": 2042} {"train_loss": -12.500167846679688, "global_step": 343093, "epoch": 2042} {"train_loss": -12.134647369384766, "global_step": 343094, "epoch": 2042} {"train_loss": -12.45338249206543, "global_step": 343095, "epoch": 2042} {"train_loss": -12.246574401855469, "global_step": 343096, "epoch": 2042} {"train_loss": -12.047538757324219, "global_step": 343097, "epoch": 2042} {"train_loss": -12.325342178344727, "global_step": 343098, "epoch": 2042} {"train_loss": -12.230937957763672, "global_step": 343099, "epoch": 2042} {"train_loss": -12.297746658325195, "global_step": 343100, "epoch": 2042} {"train_loss": -12.396024703979492, "global_step": 343101, "epoch": 2042} {"train_loss": -12.349006652832031, "global_step": 343102, "epoch": 2042} {"train_loss": -12.549257278442383, "global_step": 343103, "epoch": 2042} {"train_loss": -12.15556526184082, "global_step": 343104, "epoch": 2042} {"train_loss": -12.669260025024414, "global_step": 343105, "epoch": 2042} {"train_loss": -12.446683883666992, "global_step": 343106, "epoch": 2042} {"train_loss": -12.608407020568848, "global_step": 343107, "epoch": 2042} {"train_loss": -12.359050750732422, "global_step": 343108, "epoch": 2042} {"train_loss": -12.262662887573242, "global_step": 343109, "epoch": 2042} {"train_loss": -12.430896759033203, "global_step": 343110, "epoch": 2042} {"train_loss": -12.557938575744629, "global_step": 343111, "epoch": 2042} {"train_loss": -12.456473350524902, "global_step": 343112, "epoch": 2042} {"train_loss": -12.583662033081055, "global_step": 343113, "epoch": 2042} {"train_loss": -12.480920791625977, "global_step": 343114, "epoch": 2042} {"train_loss": -12.501996994018555, "global_step": 343115, "epoch": 2042} {"train_loss": -12.41712760925293, "global_step": 343116, "epoch": 2042} {"train_loss": -12.596702575683594, "global_step": 343117, "epoch": 2042} {"train_loss": -12.483633995056152, "global_step": 343118, "epoch": 2042} {"train_loss": -12.398759841918945, "global_step": 343119, "epoch": 2042} {"train_loss": -12.409026145935059, "global_step": 343120, "epoch": 2042} {"train_loss": -11.793524742126465, "global_step": 343121, "epoch": 2042} {"train_loss": -11.986080169677734, "global_step": 343122, "epoch": 2042} {"train_loss": -12.549359321594238, "global_step": 343123, "epoch": 2042} {"train_loss": -12.398482322692871, "global_step": 343124, "epoch": 2042} {"train_loss": -12.250472068786621, "global_step": 343125, "epoch": 2042} {"train_loss": -11.939719200134277, "global_step": 343126, "epoch": 2042} {"train_loss": -12.403158187866211, "global_step": 343127, "epoch": 2042} {"train_loss": -12.202945709228516, "global_step": 343128, "epoch": 2042} {"train_loss": -11.220664978027344, "global_step": 343129, "epoch": 2042} {"train_loss": -11.331781387329102, "global_step": 343130, "epoch": 2042} {"train_loss": -12.632136344909668, "global_step": 343131, "epoch": 2042} {"train_loss": -11.210511207580566, "global_step": 343132, "epoch": 2042} {"train_loss": -10.548604011535645, "global_step": 343133, "epoch": 2042} {"train_loss": -11.895768165588379, "global_step": 343134, "epoch": 2042} {"train_loss": -9.406113624572754, "global_step": 343135, "epoch": 2042} {"train_loss": -11.027441024780273, "global_step": 343136, "epoch": 2042} {"train_loss": -11.988883972167969, "global_step": 343137, "epoch": 2042} {"train_loss": -11.311519622802734, "global_step": 343138, "epoch": 2042} {"train_loss": -10.828323364257812, "global_step": 343139, "epoch": 2042} {"train_loss": -11.137184143066406, "global_step": 343140, "epoch": 2042} {"train_loss": -9.714691162109375, "global_step": 343141, "epoch": 2042} {"train_loss": -9.66637897491455, "global_step": 343142, "epoch": 2042} {"train_loss": -10.50311279296875, "global_step": 343143, "epoch": 2042} {"train_loss": -9.892066955566406, "global_step": 343144, "epoch": 2042} {"train_loss": -8.876869201660156, "global_step": 343145, "epoch": 2042} {"train_loss": -10.66691780090332, "global_step": 343146, "epoch": 2042} {"train_loss": -10.127636909484863, "global_step": 343147, "epoch": 2042} {"train_loss": -11.226871490478516, "global_step": 343148, "epoch": 2042} {"train_loss": -9.782516479492188, "global_step": 343149, "epoch": 2042} {"train_loss": -11.154736518859863, "global_step": 343150, "epoch": 2042} {"train_loss": -9.47502326965332, "global_step": 343151, "epoch": 2042} {"train_loss": -10.728824615478516, "global_step": 343152, "epoch": 2042} {"train_loss": -9.99563980102539, "global_step": 343153, "epoch": 2042} {"train_loss": -10.91816520690918, "global_step": 343154, "epoch": 2042} {"train_loss": -10.976739883422852, "global_step": 343155, "epoch": 2042} {"train_loss": -11.11860179901123, "global_step": 343156, "epoch": 2042} {"train_loss": -11.079395294189453, "global_step": 343157, "epoch": 2042} {"train_loss": -11.092449188232422, "global_step": 343158, "epoch": 2042} {"train_loss": -11.41190242767334, "global_step": 343159, "epoch": 2042} {"train_loss": -11.609573364257812, "global_step": 343160, "epoch": 2042} {"train_loss": -11.500947952270508, "global_step": 343161, "epoch": 2042} {"train_loss": -11.809566497802734, "global_step": 343162, "epoch": 2042} {"train_loss": -11.217232704162598, "global_step": 343163, "epoch": 2042} {"train_loss": -11.711517333984375, "global_step": 343164, "epoch": 2042} {"train_loss": -11.648176193237305, "global_step": 343165, "epoch": 2042} {"train_loss": -11.29318618774414, "global_step": 343166, "epoch": 2042} {"train_loss": -11.773963928222656, "global_step": 343167, "epoch": 2042} {"train_loss": -11.27676773071289, "global_step": 343168, "epoch": 2042} {"train_loss": -12.075810432434082, "global_step": 343169, "epoch": 2042} {"train_loss": -11.38325309753418, "global_step": 343170, "epoch": 2042} {"train_loss": -11.452199935913086, "global_step": 343171, "epoch": 2042} {"train_loss": -12.21515941619873, "global_step": 343172, "epoch": 2042} {"train_loss": -11.413810729980469, "global_step": 343173, "epoch": 2042} {"train_loss": -11.970813751220703, "global_step": 343174, "epoch": 2042} {"train_loss": -11.675684928894043, "global_step": 343175, "epoch": 2042} {"train_loss": -11.184721946716309, "global_step": 343176, "epoch": 2042} {"train_loss": -11.855342864990234, "global_step": 343177, "epoch": 2042} {"train_loss": -11.682817459106445, "global_step": 343178, "epoch": 2042} {"train_loss": -11.76025390625, "global_step": 343179, "epoch": 2042} {"train_loss": -11.863344192504883, "global_step": 343180, "epoch": 2042} {"train_loss": -11.814756393432617, "global_step": 343181, "epoch": 2042} {"train_loss": -11.803369522094727, "global_step": 343182, "epoch": 2042} {"train_loss": -12.068650245666504, "global_step": 343183, "epoch": 2042} {"train_loss": -11.903620719909668, "global_step": 343184, "epoch": 2042} {"train_loss": -12.166505813598633, "global_step": 343185, "epoch": 2042} {"train_loss": -11.88261890411377, "global_step": 343186, "epoch": 2042} {"train_loss": -12.025474548339844, "global_step": 343187, "epoch": 2042} {"train_loss": -12.32394027709961, "global_step": 343188, "epoch": 2042} {"train_loss": -11.960521697998047, "global_step": 343189, "epoch": 2042} {"train_loss": -12.132397651672363, "global_step": 343190, "epoch": 2042} {"train_loss": -12.336031913757324, "global_step": 343191, "epoch": 2042} {"train_loss": -12.010048866271973, "global_step": 343192, "epoch": 2042} {"train_loss": -12.233531951904297, "global_step": 343193, "epoch": 2042} {"train_loss": -12.184124946594238, "global_step": 343194, "epoch": 2042} {"train_loss": -11.96835708618164, "global_step": 343195, "epoch": 2042} {"train_loss": -12.311103820800781, "global_step": 343196, "epoch": 2042} {"train_loss": -12.202127456665039, "global_step": 343197, "epoch": 2042} {"train_loss": -12.307733535766602, "global_step": 343198, "epoch": 2042} {"train_loss": -12.223485946655273, "global_step": 343199, "epoch": 2042} {"train_loss": -12.179974555969238, "global_step": 343200, "epoch": 2042} {"train_loss": -12.269309043884277, "global_step": 343201, "epoch": 2042} {"train_loss": -12.207508087158203, "global_step": 343202, "epoch": 2042} {"train_loss": -12.166902542114258, "global_step": 343203, "epoch": 2042} {"train_loss": -11.985441207885742, "global_step": 343204, "epoch": 2042} {"train_loss": -12.389498710632324, "global_step": 343205, "epoch": 2042} {"train_loss": -12.323564529418945, "global_step": 343206, "epoch": 2042} {"train_loss": -12.331724166870117, "global_step": 343207, "epoch": 2042} {"train_loss": -12.445121765136719, "global_step": 343208, "epoch": 2042} {"train_loss": -12.408244132995605, "global_step": 343209, "epoch": 2042} {"train_loss": -12.437580108642578, "global_step": 343210, "epoch": 2042} {"train_loss": -12.129508972167969, "global_step": 343211, "epoch": 2042} {"train_loss": -12.698434829711914, "global_step": 343212, "epoch": 2042} {"train_loss": -12.305009841918945, "global_step": 343213, "epoch": 2042} {"train_loss": -12.571436882019043, "global_step": 343214, "epoch": 2042} {"train_loss": -12.257116317749023, "global_step": 343215, "epoch": 2042} {"train_loss": -12.530938148498535, "global_step": 343216, "epoch": 2042} {"train_loss": -12.380887985229492, "global_step": 343217, "epoch": 2042} {"train_loss": -12.616165161132812, "global_step": 343218, "epoch": 2042} {"train_loss": -12.510954856872559, "global_step": 343219, "epoch": 2042} {"train_loss": -12.473176956176758, "global_step": 343220, "epoch": 2042} {"train_loss": -12.347799301147461, "global_step": 343221, "epoch": 2042} {"train_loss": -12.410144805908203, "global_step": 343222, "epoch": 2042} {"train_loss": -11.895564879689898, "global_step": 343223, "epoch": 2042, "val_loss": 285405.625} {"train_loss": -12.487251281738281, "global_step": 343224, "epoch": 2043} {"train_loss": -12.320419311523438, "global_step": 343225, "epoch": 2043} {"train_loss": -12.538444519042969, "global_step": 343226, "epoch": 2043} {"train_loss": -12.226325988769531, "global_step": 343227, "epoch": 2043} {"train_loss": -12.319368362426758, "global_step": 343228, "epoch": 2043} {"train_loss": -12.206038475036621, "global_step": 343229, "epoch": 2043} {"train_loss": -12.484716415405273, "global_step": 343230, "epoch": 2043} {"train_loss": -12.381319999694824, "global_step": 343231, "epoch": 2043} {"train_loss": -12.346871376037598, "global_step": 343232, "epoch": 2043} {"train_loss": -12.603534698486328, "global_step": 343233, "epoch": 2043} {"train_loss": -12.468035697937012, "global_step": 343234, "epoch": 2043} {"train_loss": -12.5118408203125, "global_step": 343235, "epoch": 2043} {"train_loss": -12.53281021118164, "global_step": 343236, "epoch": 2043} {"train_loss": -12.092934608459473, "global_step": 343237, "epoch": 2043} {"train_loss": -12.510637283325195, "global_step": 343238, "epoch": 2043} {"train_loss": -12.169782638549805, "global_step": 343239, "epoch": 2043} {"train_loss": -12.241777420043945, "global_step": 343240, "epoch": 2043} {"train_loss": -12.355169296264648, "global_step": 343241, "epoch": 2043} {"train_loss": -11.337692260742188, "global_step": 343242, "epoch": 2043} {"train_loss": -12.086385726928711, "global_step": 343243, "epoch": 2043} {"train_loss": -12.232027053833008, "global_step": 343244, "epoch": 2043} {"train_loss": -12.064764022827148, "global_step": 343245, "epoch": 2043} {"train_loss": -12.14336109161377, "global_step": 343246, "epoch": 2043} {"train_loss": -12.061698913574219, "global_step": 343247, "epoch": 2043} {"train_loss": -11.973060607910156, "global_step": 343248, "epoch": 2043} {"train_loss": -11.920475959777832, "global_step": 343249, "epoch": 2043} {"train_loss": -12.342147827148438, "global_step": 343250, "epoch": 2043} {"train_loss": -11.84364128112793, "global_step": 343251, "epoch": 2043} {"train_loss": -12.290603637695312, "global_step": 343252, "epoch": 2043} {"train_loss": -12.063742637634277, "global_step": 343253, "epoch": 2043} {"train_loss": -12.013945579528809, "global_step": 343254, "epoch": 2043} {"train_loss": -12.295360565185547, "global_step": 343255, "epoch": 2043} {"train_loss": -12.227636337280273, "global_step": 343256, "epoch": 2043} {"train_loss": -12.222594261169434, "global_step": 343257, "epoch": 2043} {"train_loss": -11.928325653076172, "global_step": 343258, "epoch": 2043} {"train_loss": -11.825606346130371, "global_step": 343259, "epoch": 2043} {"train_loss": -12.473876953125, "global_step": 343260, "epoch": 2043} {"train_loss": -12.278882026672363, "global_step": 343261, "epoch": 2043} {"train_loss": -12.189661026000977, "global_step": 343262, "epoch": 2043} {"train_loss": -12.334794044494629, "global_step": 343263, "epoch": 2043} {"train_loss": -12.57663345336914, "global_step": 343264, "epoch": 2043} {"train_loss": -12.147270202636719, "global_step": 343265, "epoch": 2043} {"train_loss": -12.422708511352539, "global_step": 343266, "epoch": 2043} {"train_loss": -12.426048278808594, "global_step": 343267, "epoch": 2043} {"train_loss": -12.20591926574707, "global_step": 343268, "epoch": 2043} {"train_loss": -12.318089485168457, "global_step": 343269, "epoch": 2043} {"train_loss": -12.221841812133789, "global_step": 343270, "epoch": 2043} {"train_loss": -11.55296802520752, "global_step": 343271, "epoch": 2043} {"train_loss": -11.928147315979004, "global_step": 343272, "epoch": 2043} {"train_loss": -12.063344955444336, "global_step": 343273, "epoch": 2043} {"train_loss": -12.369999885559082, "global_step": 343274, "epoch": 2043} {"train_loss": -12.320781707763672, "global_step": 343275, "epoch": 2043} {"train_loss": -12.413049697875977, "global_step": 343276, "epoch": 2043} {"train_loss": -12.40234088897705, "global_step": 343277, "epoch": 2043} {"train_loss": -11.717853546142578, "global_step": 343278, "epoch": 2043} {"train_loss": -12.290950775146484, "global_step": 343279, "epoch": 2043} {"train_loss": -12.03433895111084, "global_step": 343280, "epoch": 2043} {"train_loss": -12.010986328125, "global_step": 343281, "epoch": 2043} {"train_loss": -11.643763542175293, "global_step": 343282, "epoch": 2043} {"train_loss": -12.329066276550293, "global_step": 343283, "epoch": 2043} {"train_loss": -12.299328804016113, "global_step": 343284, "epoch": 2043} {"train_loss": -12.005451202392578, "global_step": 343285, "epoch": 2043} {"train_loss": -11.914554595947266, "global_step": 343286, "epoch": 2043} {"train_loss": -12.03835678100586, "global_step": 343287, "epoch": 2043} {"train_loss": -12.145454406738281, "global_step": 343288, "epoch": 2043} {"train_loss": -11.191845893859863, "global_step": 343289, "epoch": 2043} {"train_loss": -12.058953285217285, "global_step": 343290, "epoch": 2043} {"train_loss": -11.722743034362793, "global_step": 343291, "epoch": 2043} {"train_loss": -11.58215045928955, "global_step": 343292, "epoch": 2043} {"train_loss": -12.270734786987305, "global_step": 343293, "epoch": 2043} {"train_loss": -11.604854583740234, "global_step": 343294, "epoch": 2043} {"train_loss": -11.149674415588379, "global_step": 343295, "epoch": 2043} {"train_loss": -11.83234977722168, "global_step": 343296, "epoch": 2043} {"train_loss": -11.280827522277832, "global_step": 343297, "epoch": 2043} {"train_loss": -11.543672561645508, "global_step": 343298, "epoch": 2043} {"train_loss": -11.892349243164062, "global_step": 343299, "epoch": 2043} {"train_loss": -11.264892578125, "global_step": 343300, "epoch": 2043} {"train_loss": -11.835494995117188, "global_step": 343301, "epoch": 2043} {"train_loss": -10.629992485046387, "global_step": 343302, "epoch": 2043} {"train_loss": -11.529457092285156, "global_step": 343303, "epoch": 2043} {"train_loss": -10.68593978881836, "global_step": 343304, "epoch": 2043} {"train_loss": -12.128881454467773, "global_step": 343305, "epoch": 2043} {"train_loss": -11.423812866210938, "global_step": 343306, "epoch": 2043} {"train_loss": -11.473749160766602, "global_step": 343307, "epoch": 2043} {"train_loss": -11.473660469055176, "global_step": 343308, "epoch": 2043} {"train_loss": -11.846160888671875, "global_step": 343309, "epoch": 2043} {"train_loss": -11.628361701965332, "global_step": 343310, "epoch": 2043} {"train_loss": -11.987499237060547, "global_step": 343311, "epoch": 2043} {"train_loss": -11.72685432434082, "global_step": 343312, "epoch": 2043} {"train_loss": -11.901988983154297, "global_step": 343313, "epoch": 2043} {"train_loss": -12.212246894836426, "global_step": 343314, "epoch": 2043} {"train_loss": -11.72311019897461, "global_step": 343315, "epoch": 2043} {"train_loss": -12.385701179504395, "global_step": 343316, "epoch": 2043} {"train_loss": -12.341232299804688, "global_step": 343317, "epoch": 2043} {"train_loss": -12.076766014099121, "global_step": 343318, "epoch": 2043} {"train_loss": -12.24156665802002, "global_step": 343319, "epoch": 2043} {"train_loss": -12.15807819366455, "global_step": 343320, "epoch": 2043} {"train_loss": -12.469432830810547, "global_step": 343321, "epoch": 2043} {"train_loss": -12.002644538879395, "global_step": 343322, "epoch": 2043} {"train_loss": -12.428655624389648, "global_step": 343323, "epoch": 2043} {"train_loss": -12.416740417480469, "global_step": 343324, "epoch": 2043} {"train_loss": -12.368906021118164, "global_step": 343325, "epoch": 2043} {"train_loss": -12.361781120300293, "global_step": 343326, "epoch": 2043} {"train_loss": -12.447181701660156, "global_step": 343327, "epoch": 2043} {"train_loss": -12.54442024230957, "global_step": 343328, "epoch": 2043} {"train_loss": -12.41165542602539, "global_step": 343329, "epoch": 2043} {"train_loss": -12.43893051147461, "global_step": 343330, "epoch": 2043} {"train_loss": -12.455360412597656, "global_step": 343331, "epoch": 2043} {"train_loss": -12.47633171081543, "global_step": 343332, "epoch": 2043} {"train_loss": -12.32816219329834, "global_step": 343333, "epoch": 2043} {"train_loss": -12.201820373535156, "global_step": 343334, "epoch": 2043} {"train_loss": -12.376928329467773, "global_step": 343335, "epoch": 2043} {"train_loss": -12.400371551513672, "global_step": 343336, "epoch": 2043} {"train_loss": -12.436943054199219, "global_step": 343337, "epoch": 2043} {"train_loss": -12.017263412475586, "global_step": 343338, "epoch": 2043} {"train_loss": -12.487430572509766, "global_step": 343339, "epoch": 2043} {"train_loss": -12.053936004638672, "global_step": 343340, "epoch": 2043} {"train_loss": -12.31485366821289, "global_step": 343341, "epoch": 2043} {"train_loss": -12.357015609741211, "global_step": 343342, "epoch": 2043} {"train_loss": -12.168758392333984, "global_step": 343343, "epoch": 2043} {"train_loss": -12.204910278320312, "global_step": 343344, "epoch": 2043} {"train_loss": -12.113536834716797, "global_step": 343345, "epoch": 2043} {"train_loss": -12.454795837402344, "global_step": 343346, "epoch": 2043} {"train_loss": -12.418037414550781, "global_step": 343347, "epoch": 2043} {"train_loss": -12.36325454711914, "global_step": 343348, "epoch": 2043} {"train_loss": -12.508886337280273, "global_step": 343349, "epoch": 2043} {"train_loss": -12.309910774230957, "global_step": 343350, "epoch": 2043} {"train_loss": -12.074772834777832, "global_step": 343351, "epoch": 2043} {"train_loss": -12.46657943725586, "global_step": 343352, "epoch": 2043} {"train_loss": -12.048553466796875, "global_step": 343353, "epoch": 2043} {"train_loss": -12.400703430175781, "global_step": 343354, "epoch": 2043} {"train_loss": -12.083477973937988, "global_step": 343355, "epoch": 2043} {"train_loss": -12.098075866699219, "global_step": 343356, "epoch": 2043} {"train_loss": -12.51419734954834, "global_step": 343357, "epoch": 2043} {"train_loss": -12.363760948181152, "global_step": 343358, "epoch": 2043} {"train_loss": -12.419857025146484, "global_step": 343359, "epoch": 2043} {"train_loss": -12.395360946655273, "global_step": 343360, "epoch": 2043} {"train_loss": -12.413018226623535, "global_step": 343361, "epoch": 2043} {"train_loss": -12.640968322753906, "global_step": 343362, "epoch": 2043} {"train_loss": -12.638103485107422, "global_step": 343363, "epoch": 2043} {"train_loss": -12.424732208251953, "global_step": 343364, "epoch": 2043} {"train_loss": -12.51904296875, "global_step": 343365, "epoch": 2043} {"train_loss": -12.552952766418457, "global_step": 343366, "epoch": 2043} {"train_loss": -12.426538467407227, "global_step": 343367, "epoch": 2043} {"train_loss": -12.517075538635254, "global_step": 343368, "epoch": 2043} {"train_loss": -12.651174545288086, "global_step": 343369, "epoch": 2043} {"train_loss": -12.105518341064453, "global_step": 343370, "epoch": 2043} {"train_loss": -12.780160903930664, "global_step": 343371, "epoch": 2043} {"train_loss": -12.554715156555176, "global_step": 343372, "epoch": 2043} {"train_loss": -12.697122573852539, "global_step": 343373, "epoch": 2043} {"train_loss": -12.549381256103516, "global_step": 343374, "epoch": 2043} {"train_loss": -12.46469497680664, "global_step": 343375, "epoch": 2043} {"train_loss": -12.362451553344727, "global_step": 343376, "epoch": 2043} {"train_loss": -12.103313446044922, "global_step": 343377, "epoch": 2043} {"train_loss": -11.976415634155273, "global_step": 343378, "epoch": 2043} {"train_loss": -11.995725631713867, "global_step": 343379, "epoch": 2043} {"train_loss": -11.70566177368164, "global_step": 343380, "epoch": 2043} {"train_loss": -11.030570983886719, "global_step": 343381, "epoch": 2043} {"train_loss": -10.688488960266113, "global_step": 343382, "epoch": 2043} {"train_loss": -11.986233711242676, "global_step": 343383, "epoch": 2043} {"train_loss": -12.306690216064453, "global_step": 343384, "epoch": 2043} {"train_loss": -11.679573059082031, "global_step": 343385, "epoch": 2043} {"train_loss": -10.818570137023926, "global_step": 343386, "epoch": 2043} {"train_loss": -11.369086265563965, "global_step": 343387, "epoch": 2043} {"train_loss": -12.070608139038086, "global_step": 343388, "epoch": 2043} {"train_loss": -10.140827178955078, "global_step": 343389, "epoch": 2043} {"train_loss": -12.150285720825195, "global_step": 343390, "epoch": 2043} {"train_loss": -12.1039883125396, "global_step": 343391, "epoch": 2043, "val_loss": 289785.1875} {"train_loss": -11.416145324707031, "global_step": 343392, "epoch": 2044} {"train_loss": -10.67532730102539, "global_step": 343393, "epoch": 2044} {"train_loss": -11.092140197753906, "global_step": 343394, "epoch": 2044} {"train_loss": -11.581963539123535, "global_step": 343395, "epoch": 2044} {"train_loss": -11.890615463256836, "global_step": 343396, "epoch": 2044} {"train_loss": -11.347999572753906, "global_step": 343397, "epoch": 2044} {"train_loss": -11.542887687683105, "global_step": 343398, "epoch": 2044} {"train_loss": -11.838420867919922, "global_step": 343399, "epoch": 2044} {"train_loss": -10.729110717773438, "global_step": 343400, "epoch": 2044} {"train_loss": -11.285257339477539, "global_step": 343401, "epoch": 2044} {"train_loss": -11.472017288208008, "global_step": 343402, "epoch": 2044} {"train_loss": -10.36690902709961, "global_step": 343403, "epoch": 2044} {"train_loss": -9.752847671508789, "global_step": 343404, "epoch": 2044} {"train_loss": -11.131908416748047, "global_step": 343405, "epoch": 2044} {"train_loss": -8.159656524658203, "global_step": 343406, "epoch": 2044} {"train_loss": -8.84768009185791, "global_step": 343407, "epoch": 2044} {"train_loss": -9.349117279052734, "global_step": 343408, "epoch": 2044} {"train_loss": -10.501169204711914, "global_step": 343409, "epoch": 2044} {"train_loss": -10.265063285827637, "global_step": 343410, "epoch": 2044} {"train_loss": -9.898170471191406, "global_step": 343411, "epoch": 2044} {"train_loss": -10.068382263183594, "global_step": 343412, "epoch": 2044} {"train_loss": -10.78731918334961, "global_step": 343413, "epoch": 2044} {"train_loss": -10.28183650970459, "global_step": 343414, "epoch": 2044} {"train_loss": -10.465005874633789, "global_step": 343415, "epoch": 2044} {"train_loss": -10.70173454284668, "global_step": 343416, "epoch": 2044} {"train_loss": -10.438272476196289, "global_step": 343417, "epoch": 2044} {"train_loss": -11.064732551574707, "global_step": 343418, "epoch": 2044} {"train_loss": -10.576735496520996, "global_step": 343419, "epoch": 2044} {"train_loss": -11.02006721496582, "global_step": 343420, "epoch": 2044} {"train_loss": -11.203437805175781, "global_step": 343421, "epoch": 2044} {"train_loss": -10.48916244506836, "global_step": 343422, "epoch": 2044} {"train_loss": -11.83150863647461, "global_step": 343423, "epoch": 2044} {"train_loss": -11.248005867004395, "global_step": 343424, "epoch": 2044} {"train_loss": -11.045133590698242, "global_step": 343425, "epoch": 2044} {"train_loss": -11.181964874267578, "global_step": 343426, "epoch": 2044} {"train_loss": -11.257417678833008, "global_step": 343427, "epoch": 2044} {"train_loss": -11.29066276550293, "global_step": 343428, "epoch": 2044} {"train_loss": -10.96232795715332, "global_step": 343429, "epoch": 2044} {"train_loss": -11.29358959197998, "global_step": 343430, "epoch": 2044} {"train_loss": -11.476235389709473, "global_step": 343431, "epoch": 2044} {"train_loss": -11.80976676940918, "global_step": 343432, "epoch": 2044} {"train_loss": -10.885334968566895, "global_step": 343433, "epoch": 2044} {"train_loss": -11.350896835327148, "global_step": 343434, "epoch": 2044} {"train_loss": -11.391772270202637, "global_step": 343435, "epoch": 2044} {"train_loss": -11.59769344329834, "global_step": 343436, "epoch": 2044} {"train_loss": -11.911844253540039, "global_step": 343437, "epoch": 2044} {"train_loss": -11.092113494873047, "global_step": 343438, "epoch": 2044} {"train_loss": -11.693669319152832, "global_step": 343439, "epoch": 2044} {"train_loss": -11.565008163452148, "global_step": 343440, "epoch": 2044} {"train_loss": -11.352701187133789, "global_step": 343441, "epoch": 2044} {"train_loss": -11.585044860839844, "global_step": 343442, "epoch": 2044} {"train_loss": -11.70064926147461, "global_step": 343443, "epoch": 2044} {"train_loss": -11.33631706237793, "global_step": 343444, "epoch": 2044} {"train_loss": -11.877338409423828, "global_step": 343445, "epoch": 2044} {"train_loss": -11.164549827575684, "global_step": 343446, "epoch": 2044} {"train_loss": -11.111478805541992, "global_step": 343447, "epoch": 2044} {"train_loss": -12.035717964172363, "global_step": 343448, "epoch": 2044} {"train_loss": -11.069095611572266, "global_step": 343449, "epoch": 2044} {"train_loss": -11.923260688781738, "global_step": 343450, "epoch": 2044} {"train_loss": -11.589408874511719, "global_step": 343451, "epoch": 2044} {"train_loss": -11.47479248046875, "global_step": 343452, "epoch": 2044} {"train_loss": -11.957802772521973, "global_step": 343453, "epoch": 2044} {"train_loss": -11.558855056762695, "global_step": 343454, "epoch": 2044} {"train_loss": -11.855140686035156, "global_step": 343455, "epoch": 2044} {"train_loss": -11.90627670288086, "global_step": 343456, "epoch": 2044} {"train_loss": -11.790209770202637, "global_step": 343457, "epoch": 2044} {"train_loss": -12.061944961547852, "global_step": 343458, "epoch": 2044} {"train_loss": -11.881967544555664, "global_step": 343459, "epoch": 2044} {"train_loss": -12.135841369628906, "global_step": 343460, "epoch": 2044} {"train_loss": -12.11616325378418, "global_step": 343461, "epoch": 2044} {"train_loss": -11.780682563781738, "global_step": 343462, "epoch": 2044} {"train_loss": -12.116630554199219, "global_step": 343463, "epoch": 2044} {"train_loss": -12.07640552520752, "global_step": 343464, "epoch": 2044} {"train_loss": -12.220407485961914, "global_step": 343465, "epoch": 2044} {"train_loss": -12.195611953735352, "global_step": 343466, "epoch": 2044} {"train_loss": -12.115997314453125, "global_step": 343467, "epoch": 2044} {"train_loss": -12.139649391174316, "global_step": 343468, "epoch": 2044} {"train_loss": -12.02324104309082, "global_step": 343469, "epoch": 2044} {"train_loss": -12.013904571533203, "global_step": 343470, "epoch": 2044} {"train_loss": -12.19958209991455, "global_step": 343471, "epoch": 2044} {"train_loss": -12.18786334991455, "global_step": 343472, "epoch": 2044} {"train_loss": -12.118009567260742, "global_step": 343473, "epoch": 2044} {"train_loss": -12.11429214477539, "global_step": 343474, "epoch": 2044} {"train_loss": -12.388681411743164, "global_step": 343475, "epoch": 2044} {"train_loss": -12.146150588989258, "global_step": 343476, "epoch": 2044} {"train_loss": -12.171263694763184, "global_step": 343477, "epoch": 2044} {"train_loss": -12.194759368896484, "global_step": 343478, "epoch": 2044} {"train_loss": -12.3187255859375, "global_step": 343479, "epoch": 2044} {"train_loss": -12.341737747192383, "global_step": 343480, "epoch": 2044} {"train_loss": -12.34744644165039, "global_step": 343481, "epoch": 2044} {"train_loss": -12.050252914428711, "global_step": 343482, "epoch": 2044} {"train_loss": -11.607461929321289, "global_step": 343483, "epoch": 2044} {"train_loss": -12.238744735717773, "global_step": 343484, "epoch": 2044} {"train_loss": -12.087311744689941, "global_step": 343485, "epoch": 2044} {"train_loss": -12.134088516235352, "global_step": 343486, "epoch": 2044} {"train_loss": -12.225118637084961, "global_step": 343487, "epoch": 2044} {"train_loss": -12.17765998840332, "global_step": 343488, "epoch": 2044} {"train_loss": -12.149345397949219, "global_step": 343489, "epoch": 2044} {"train_loss": -12.303237915039062, "global_step": 343490, "epoch": 2044} {"train_loss": -12.290781021118164, "global_step": 343491, "epoch": 2044} {"train_loss": -12.259521484375, "global_step": 343492, "epoch": 2044} {"train_loss": -12.42330551147461, "global_step": 343493, "epoch": 2044} {"train_loss": -12.314452171325684, "global_step": 343494, "epoch": 2044} {"train_loss": -12.079998970031738, "global_step": 343495, "epoch": 2044} {"train_loss": -12.06683349609375, "global_step": 343496, "epoch": 2044} {"train_loss": -12.1343355178833, "global_step": 343497, "epoch": 2044} {"train_loss": -12.374091148376465, "global_step": 343498, "epoch": 2044} {"train_loss": -12.074745178222656, "global_step": 343499, "epoch": 2044} {"train_loss": -12.201326370239258, "global_step": 343500, "epoch": 2044} {"train_loss": -11.767736434936523, "global_step": 343501, "epoch": 2044} {"train_loss": -12.444134712219238, "global_step": 343502, "epoch": 2044} {"train_loss": -12.007678985595703, "global_step": 343503, "epoch": 2044} {"train_loss": -12.026123046875, "global_step": 343504, "epoch": 2044} {"train_loss": -12.143157005310059, "global_step": 343505, "epoch": 2044} {"train_loss": -11.442859649658203, "global_step": 343506, "epoch": 2044} {"train_loss": -11.753803253173828, "global_step": 343507, "epoch": 2044} {"train_loss": -11.43820571899414, "global_step": 343508, "epoch": 2044} {"train_loss": -10.915630340576172, "global_step": 343509, "epoch": 2044} {"train_loss": -11.881948471069336, "global_step": 343510, "epoch": 2044} {"train_loss": -10.499642372131348, "global_step": 343511, "epoch": 2044} {"train_loss": -11.152505874633789, "global_step": 343512, "epoch": 2044} {"train_loss": -9.91928768157959, "global_step": 343513, "epoch": 2044} {"train_loss": -11.15672492980957, "global_step": 343514, "epoch": 2044} {"train_loss": -10.378288269042969, "global_step": 343515, "epoch": 2044} {"train_loss": -11.913307189941406, "global_step": 343516, "epoch": 2044} {"train_loss": -10.373183250427246, "global_step": 343517, "epoch": 2044} {"train_loss": -12.29918098449707, "global_step": 343518, "epoch": 2044} {"train_loss": -10.887687683105469, "global_step": 343519, "epoch": 2044} {"train_loss": -12.182106971740723, "global_step": 343520, "epoch": 2044} {"train_loss": -11.825754165649414, "global_step": 343521, "epoch": 2044} {"train_loss": -12.184304237365723, "global_step": 343522, "epoch": 2044} {"train_loss": -12.261946678161621, "global_step": 343523, "epoch": 2044} {"train_loss": -11.786898612976074, "global_step": 343524, "epoch": 2044} {"train_loss": -12.350480079650879, "global_step": 343525, "epoch": 2044} {"train_loss": -11.508609771728516, "global_step": 343526, "epoch": 2044} {"train_loss": -12.297601699829102, "global_step": 343527, "epoch": 2044} {"train_loss": -11.861108779907227, "global_step": 343528, "epoch": 2044} {"train_loss": -12.105806350708008, "global_step": 343529, "epoch": 2044} {"train_loss": -12.342321395874023, "global_step": 343530, "epoch": 2044} {"train_loss": -11.798871040344238, "global_step": 343531, "epoch": 2044} {"train_loss": -12.15987777709961, "global_step": 343532, "epoch": 2044} {"train_loss": -11.814281463623047, "global_step": 343533, "epoch": 2044} {"train_loss": -12.318262100219727, "global_step": 343534, "epoch": 2044} {"train_loss": -11.819228172302246, "global_step": 343535, "epoch": 2044} {"train_loss": -12.190065383911133, "global_step": 343536, "epoch": 2044} {"train_loss": -11.75344181060791, "global_step": 343537, "epoch": 2044} {"train_loss": -12.264081954956055, "global_step": 343538, "epoch": 2044} {"train_loss": -11.869821548461914, "global_step": 343539, "epoch": 2044} {"train_loss": -12.196554183959961, "global_step": 343540, "epoch": 2044} {"train_loss": -12.040101051330566, "global_step": 343541, "epoch": 2044} {"train_loss": -12.259325981140137, "global_step": 343542, "epoch": 2044} {"train_loss": -12.035808563232422, "global_step": 343543, "epoch": 2044} {"train_loss": -11.814878463745117, "global_step": 343544, "epoch": 2044} {"train_loss": -12.131111145019531, "global_step": 343545, "epoch": 2044} {"train_loss": -11.723577499389648, "global_step": 343546, "epoch": 2044} {"train_loss": -12.519033432006836, "global_step": 343547, "epoch": 2044} {"train_loss": -12.11379623413086, "global_step": 343548, "epoch": 2044} {"train_loss": -12.20854663848877, "global_step": 343549, "epoch": 2044} {"train_loss": -12.390350341796875, "global_step": 343550, "epoch": 2044} {"train_loss": -11.851879119873047, "global_step": 343551, "epoch": 2044} {"train_loss": -12.270501136779785, "global_step": 343552, "epoch": 2044} {"train_loss": -12.107606887817383, "global_step": 343553, "epoch": 2044} {"train_loss": -12.170013427734375, "global_step": 343554, "epoch": 2044} {"train_loss": -12.085136413574219, "global_step": 343555, "epoch": 2044} {"train_loss": -12.042098045349121, "global_step": 343556, "epoch": 2044} {"train_loss": -12.454151153564453, "global_step": 343557, "epoch": 2044} {"train_loss": -12.395059585571289, "global_step": 343558, "epoch": 2044} {"train_loss": -11.637490800448827, "global_step": 343559, "epoch": 2044, "val_loss": 287552.1875} {"train_loss": -12.436515808105469, "global_step": 343560, "epoch": 2045} {"train_loss": -12.175579071044922, "global_step": 343561, "epoch": 2045} {"train_loss": -12.155592918395996, "global_step": 343562, "epoch": 2045} {"train_loss": -12.28488826751709, "global_step": 343563, "epoch": 2045} {"train_loss": -12.33143424987793, "global_step": 343564, "epoch": 2045} {"train_loss": -12.375849723815918, "global_step": 343565, "epoch": 2045} {"train_loss": -12.457979202270508, "global_step": 343566, "epoch": 2045} {"train_loss": -12.213846206665039, "global_step": 343567, "epoch": 2045} {"train_loss": -12.484749794006348, "global_step": 343568, "epoch": 2045} {"train_loss": -11.952775955200195, "global_step": 343569, "epoch": 2045} {"train_loss": -12.247756958007812, "global_step": 343570, "epoch": 2045} {"train_loss": -12.398774147033691, "global_step": 343571, "epoch": 2045} {"train_loss": -12.38008975982666, "global_step": 343572, "epoch": 2045} {"train_loss": -12.56109619140625, "global_step": 343573, "epoch": 2045} {"train_loss": -11.971711158752441, "global_step": 343574, "epoch": 2045} {"train_loss": -11.703239440917969, "global_step": 343575, "epoch": 2045} {"train_loss": -12.422136306762695, "global_step": 343576, "epoch": 2045} {"train_loss": -11.692300796508789, "global_step": 343577, "epoch": 2045} {"train_loss": -12.048649787902832, "global_step": 343578, "epoch": 2045} {"train_loss": -12.242833137512207, "global_step": 343579, "epoch": 2045} {"train_loss": -12.296438217163086, "global_step": 343580, "epoch": 2045} {"train_loss": -11.808313369750977, "global_step": 343581, "epoch": 2045} {"train_loss": -12.420995712280273, "global_step": 343582, "epoch": 2045} {"train_loss": -11.843284606933594, "global_step": 343583, "epoch": 2045} {"train_loss": -11.66845703125, "global_step": 343584, "epoch": 2045} {"train_loss": -11.228704452514648, "global_step": 343585, "epoch": 2045} {"train_loss": -12.42195987701416, "global_step": 343586, "epoch": 2045} {"train_loss": -11.486856460571289, "global_step": 343587, "epoch": 2045} {"train_loss": -11.182990074157715, "global_step": 343588, "epoch": 2045} {"train_loss": -10.838411331176758, "global_step": 343589, "epoch": 2045} {"train_loss": -12.226053237915039, "global_step": 343590, "epoch": 2045} {"train_loss": -11.101117134094238, "global_step": 343591, "epoch": 2045} {"train_loss": -10.031752586364746, "global_step": 343592, "epoch": 2045} {"train_loss": -12.28050422668457, "global_step": 343593, "epoch": 2045} {"train_loss": -9.858043670654297, "global_step": 343594, "epoch": 2045} {"train_loss": -12.019916534423828, "global_step": 343595, "epoch": 2045} {"train_loss": -11.560014724731445, "global_step": 343596, "epoch": 2045} {"train_loss": -10.909393310546875, "global_step": 343597, "epoch": 2045} {"train_loss": -12.202635765075684, "global_step": 343598, "epoch": 2045} {"train_loss": -10.955974578857422, "global_step": 343599, "epoch": 2045} {"train_loss": -11.466350555419922, "global_step": 343600, "epoch": 2045} {"train_loss": -11.948519706726074, "global_step": 343601, "epoch": 2045} {"train_loss": -10.858272552490234, "global_step": 343602, "epoch": 2045} {"train_loss": -11.925082206726074, "global_step": 343603, "epoch": 2045} {"train_loss": -11.883418083190918, "global_step": 343604, "epoch": 2045} {"train_loss": -11.600563049316406, "global_step": 343605, "epoch": 2045} {"train_loss": -12.124279975891113, "global_step": 343606, "epoch": 2045} {"train_loss": -12.071260452270508, "global_step": 343607, "epoch": 2045} {"train_loss": -11.99374008178711, "global_step": 343608, "epoch": 2045} {"train_loss": -12.206024169921875, "global_step": 343609, "epoch": 2045} {"train_loss": -12.035388946533203, "global_step": 343610, "epoch": 2045} {"train_loss": -12.015918731689453, "global_step": 343611, "epoch": 2045} {"train_loss": -12.09735107421875, "global_step": 343612, "epoch": 2045} {"train_loss": -12.152144432067871, "global_step": 343613, "epoch": 2045} {"train_loss": -12.437372207641602, "global_step": 343614, "epoch": 2045} {"train_loss": -11.804363250732422, "global_step": 343615, "epoch": 2045} {"train_loss": -12.388489723205566, "global_step": 343616, "epoch": 2045} {"train_loss": -12.286060333251953, "global_step": 343617, "epoch": 2045} {"train_loss": -12.299633026123047, "global_step": 343618, "epoch": 2045} {"train_loss": -12.152687072753906, "global_step": 343619, "epoch": 2045} {"train_loss": -12.329666137695312, "global_step": 343620, "epoch": 2045} {"train_loss": -12.330256462097168, "global_step": 343621, "epoch": 2045} {"train_loss": -12.35360336303711, "global_step": 343622, "epoch": 2045} {"train_loss": -12.19321346282959, "global_step": 343623, "epoch": 2045} {"train_loss": -12.343104362487793, "global_step": 343624, "epoch": 2045} {"train_loss": -12.461002349853516, "global_step": 343625, "epoch": 2045} {"train_loss": -12.117477416992188, "global_step": 343626, "epoch": 2045} {"train_loss": -12.13968563079834, "global_step": 343627, "epoch": 2045} {"train_loss": -12.098907470703125, "global_step": 343628, "epoch": 2045} {"train_loss": -12.016475677490234, "global_step": 343629, "epoch": 2045} {"train_loss": -12.13044548034668, "global_step": 343630, "epoch": 2045} {"train_loss": -12.214961051940918, "global_step": 343631, "epoch": 2045} {"train_loss": -12.111227035522461, "global_step": 343632, "epoch": 2045} {"train_loss": -12.190141677856445, "global_step": 343633, "epoch": 2045} {"train_loss": -11.943635940551758, "global_step": 343634, "epoch": 2045} {"train_loss": -11.915470123291016, "global_step": 343635, "epoch": 2045} {"train_loss": -11.737552642822266, "global_step": 343636, "epoch": 2045} {"train_loss": -12.361869812011719, "global_step": 343637, "epoch": 2045} {"train_loss": -11.772875785827637, "global_step": 343638, "epoch": 2045} {"train_loss": -12.313750267028809, "global_step": 343639, "epoch": 2045} {"train_loss": -11.715044975280762, "global_step": 343640, "epoch": 2045} {"train_loss": -11.758809089660645, "global_step": 343641, "epoch": 2045} {"train_loss": -11.876625061035156, "global_step": 343642, "epoch": 2045} {"train_loss": -12.214241027832031, "global_step": 343643, "epoch": 2045} {"train_loss": -12.010321617126465, "global_step": 343644, "epoch": 2045} {"train_loss": -12.24856185913086, "global_step": 343645, "epoch": 2045} {"train_loss": -12.163551330566406, "global_step": 343646, "epoch": 2045} {"train_loss": -12.075701713562012, "global_step": 343647, "epoch": 2045} {"train_loss": -12.339822769165039, "global_step": 343648, "epoch": 2045} {"train_loss": -12.250798225402832, "global_step": 343649, "epoch": 2045} {"train_loss": -12.062625885009766, "global_step": 343650, "epoch": 2045} {"train_loss": -11.777229309082031, "global_step": 343651, "epoch": 2045} {"train_loss": -11.680253982543945, "global_step": 343652, "epoch": 2045} {"train_loss": -11.873327255249023, "global_step": 343653, "epoch": 2045} {"train_loss": -11.142134666442871, "global_step": 343654, "epoch": 2045} {"train_loss": -11.755037307739258, "global_step": 343655, "epoch": 2045} {"train_loss": -11.579798698425293, "global_step": 343656, "epoch": 2045} {"train_loss": -11.013961791992188, "global_step": 343657, "epoch": 2045} {"train_loss": -11.720529556274414, "global_step": 343658, "epoch": 2045} {"train_loss": -9.80838680267334, "global_step": 343659, "epoch": 2045} {"train_loss": -11.264168739318848, "global_step": 343660, "epoch": 2045} {"train_loss": -11.29163646697998, "global_step": 343661, "epoch": 2045} {"train_loss": -10.694747924804688, "global_step": 343662, "epoch": 2045} {"train_loss": -12.083893775939941, "global_step": 343663, "epoch": 2045} {"train_loss": -10.749464988708496, "global_step": 343664, "epoch": 2045} {"train_loss": -11.274711608886719, "global_step": 343665, "epoch": 2045} {"train_loss": -11.228607177734375, "global_step": 343666, "epoch": 2045} {"train_loss": -11.146186828613281, "global_step": 343667, "epoch": 2045} {"train_loss": -11.080121994018555, "global_step": 343668, "epoch": 2045} {"train_loss": -11.734338760375977, "global_step": 343669, "epoch": 2045} {"train_loss": -10.738946914672852, "global_step": 343670, "epoch": 2045} {"train_loss": -12.12272834777832, "global_step": 343671, "epoch": 2045} {"train_loss": -11.340527534484863, "global_step": 343672, "epoch": 2045} {"train_loss": -11.734128952026367, "global_step": 343673, "epoch": 2045} {"train_loss": -11.693300247192383, "global_step": 343674, "epoch": 2045} {"train_loss": -11.250797271728516, "global_step": 343675, "epoch": 2045} {"train_loss": -11.891077041625977, "global_step": 343676, "epoch": 2045} {"train_loss": -11.13270378112793, "global_step": 343677, "epoch": 2045} {"train_loss": -12.249591827392578, "global_step": 343678, "epoch": 2045} {"train_loss": -11.417915344238281, "global_step": 343679, "epoch": 2045} {"train_loss": -12.181135177612305, "global_step": 343680, "epoch": 2045} {"train_loss": -10.863729476928711, "global_step": 343681, "epoch": 2045} {"train_loss": -12.327634811401367, "global_step": 343682, "epoch": 2045} {"train_loss": -11.338312149047852, "global_step": 343683, "epoch": 2045} {"train_loss": -11.997163772583008, "global_step": 343684, "epoch": 2045} {"train_loss": -11.197803497314453, "global_step": 343685, "epoch": 2045} {"train_loss": -11.483981132507324, "global_step": 343686, "epoch": 2045} {"train_loss": -11.772076606750488, "global_step": 343687, "epoch": 2045} {"train_loss": -11.671215057373047, "global_step": 343688, "epoch": 2045} {"train_loss": -11.846956253051758, "global_step": 343689, "epoch": 2045} {"train_loss": -11.327013969421387, "global_step": 343690, "epoch": 2045} {"train_loss": -11.520604133605957, "global_step": 343691, "epoch": 2045} {"train_loss": -11.070119857788086, "global_step": 343692, "epoch": 2045} {"train_loss": -11.088852882385254, "global_step": 343693, "epoch": 2045} {"train_loss": -12.060230255126953, "global_step": 343694, "epoch": 2045} {"train_loss": -11.012975692749023, "global_step": 343695, "epoch": 2045} {"train_loss": -11.761406898498535, "global_step": 343696, "epoch": 2045} {"train_loss": -12.057482719421387, "global_step": 343697, "epoch": 2045} {"train_loss": -10.518228530883789, "global_step": 343698, "epoch": 2045} {"train_loss": -12.022220611572266, "global_step": 343699, "epoch": 2045} {"train_loss": -10.603971481323242, "global_step": 343700, "epoch": 2045} {"train_loss": -11.721975326538086, "global_step": 343701, "epoch": 2045} {"train_loss": -11.711681365966797, "global_step": 343702, "epoch": 2045} {"train_loss": -10.786005973815918, "global_step": 343703, "epoch": 2045} {"train_loss": -11.40464973449707, "global_step": 343704, "epoch": 2045} {"train_loss": -11.923341751098633, "global_step": 343705, "epoch": 2045} {"train_loss": -10.584333419799805, "global_step": 343706, "epoch": 2045} {"train_loss": -11.975868225097656, "global_step": 343707, "epoch": 2045} {"train_loss": -11.390478134155273, "global_step": 343708, "epoch": 2045} {"train_loss": -11.79101848602295, "global_step": 343709, "epoch": 2045} {"train_loss": -11.495159149169922, "global_step": 343710, "epoch": 2045} {"train_loss": -12.146421432495117, "global_step": 343711, "epoch": 2045} {"train_loss": -11.963653564453125, "global_step": 343712, "epoch": 2045} {"train_loss": -11.954593658447266, "global_step": 343713, "epoch": 2045} {"train_loss": -12.119192123413086, "global_step": 343714, "epoch": 2045} {"train_loss": -11.97595500946045, "global_step": 343715, "epoch": 2045} {"train_loss": -12.24437141418457, "global_step": 343716, "epoch": 2045} {"train_loss": -12.335884094238281, "global_step": 343717, "epoch": 2045} {"train_loss": -12.107876777648926, "global_step": 343718, "epoch": 2045} {"train_loss": -12.26655101776123, "global_step": 343719, "epoch": 2045} {"train_loss": -12.13917064666748, "global_step": 343720, "epoch": 2045} {"train_loss": -12.287354469299316, "global_step": 343721, "epoch": 2045} {"train_loss": -12.188183784484863, "global_step": 343722, "epoch": 2045} {"train_loss": -12.297464370727539, "global_step": 343723, "epoch": 2045} {"train_loss": -12.255270957946777, "global_step": 343724, "epoch": 2045} {"train_loss": -12.386130332946777, "global_step": 343725, "epoch": 2045} {"train_loss": -12.407279968261719, "global_step": 343726, "epoch": 2045} {"train_loss": -11.815461368787856, "global_step": 343727, "epoch": 2045, "val_loss": 288770.46875, "train_action_mse_error": 2.2170815467834473} {"train_loss": -12.384571075439453, "global_step": 343728, "epoch": 2046} {"train_loss": -12.347764015197754, "global_step": 343729, "epoch": 2046} {"train_loss": -12.393377304077148, "global_step": 343730, "epoch": 2046} {"train_loss": -12.256946563720703, "global_step": 343731, "epoch": 2046} {"train_loss": -12.480841636657715, "global_step": 343732, "epoch": 2046} {"train_loss": -12.299778938293457, "global_step": 343733, "epoch": 2046} {"train_loss": -12.232068061828613, "global_step": 343734, "epoch": 2046} {"train_loss": -12.272941589355469, "global_step": 343735, "epoch": 2046} {"train_loss": -12.292190551757812, "global_step": 343736, "epoch": 2046} {"train_loss": -12.342429161071777, "global_step": 343737, "epoch": 2046} {"train_loss": -12.521187782287598, "global_step": 343738, "epoch": 2046} {"train_loss": -12.549842834472656, "global_step": 343739, "epoch": 2046} {"train_loss": -12.457002639770508, "global_step": 343740, "epoch": 2046} {"train_loss": -12.26756477355957, "global_step": 343741, "epoch": 2046} {"train_loss": -12.332168579101562, "global_step": 343742, "epoch": 2046} {"train_loss": -12.439539909362793, "global_step": 343743, "epoch": 2046} {"train_loss": -12.559764862060547, "global_step": 343744, "epoch": 2046} {"train_loss": -12.336444854736328, "global_step": 343745, "epoch": 2046} {"train_loss": -12.621896743774414, "global_step": 343746, "epoch": 2046} {"train_loss": -12.490793228149414, "global_step": 343747, "epoch": 2046} {"train_loss": -12.712299346923828, "global_step": 343748, "epoch": 2046} {"train_loss": -12.447843551635742, "global_step": 343749, "epoch": 2046} {"train_loss": -12.48859977722168, "global_step": 343750, "epoch": 2046} {"train_loss": -12.001373291015625, "global_step": 343751, "epoch": 2046} {"train_loss": -12.471423149108887, "global_step": 343752, "epoch": 2046} {"train_loss": -12.131340980529785, "global_step": 343753, "epoch": 2046} {"train_loss": -12.2920503616333, "global_step": 343754, "epoch": 2046} {"train_loss": -12.295523643493652, "global_step": 343755, "epoch": 2046} {"train_loss": -12.156744003295898, "global_step": 343756, "epoch": 2046} {"train_loss": -12.472742080688477, "global_step": 343757, "epoch": 2046} {"train_loss": -12.351094245910645, "global_step": 343758, "epoch": 2046} {"train_loss": -12.13128662109375, "global_step": 343759, "epoch": 2046} {"train_loss": -12.394582748413086, "global_step": 343760, "epoch": 2046} {"train_loss": -12.400456428527832, "global_step": 343761, "epoch": 2046} {"train_loss": -12.385683059692383, "global_step": 343762, "epoch": 2046} {"train_loss": -12.11643123626709, "global_step": 343763, "epoch": 2046} {"train_loss": -12.019915580749512, "global_step": 343764, "epoch": 2046} {"train_loss": -12.545499801635742, "global_step": 343765, "epoch": 2046} {"train_loss": -11.38840389251709, "global_step": 343766, "epoch": 2046} {"train_loss": -12.286226272583008, "global_step": 343767, "epoch": 2046} {"train_loss": -11.941060066223145, "global_step": 343768, "epoch": 2046} {"train_loss": -12.148588180541992, "global_step": 343769, "epoch": 2046} {"train_loss": -12.288058280944824, "global_step": 343770, "epoch": 2046} {"train_loss": -11.81028938293457, "global_step": 343771, "epoch": 2046} {"train_loss": -12.515849113464355, "global_step": 343772, "epoch": 2046} {"train_loss": -12.16235637664795, "global_step": 343773, "epoch": 2046} {"train_loss": -11.982544898986816, "global_step": 343774, "epoch": 2046} {"train_loss": -12.050640106201172, "global_step": 343775, "epoch": 2046} {"train_loss": -11.490948677062988, "global_step": 343776, "epoch": 2046} {"train_loss": -12.381847381591797, "global_step": 343777, "epoch": 2046} {"train_loss": -11.918789863586426, "global_step": 343778, "epoch": 2046} {"train_loss": -11.974509239196777, "global_step": 343779, "epoch": 2046} {"train_loss": -12.394433975219727, "global_step": 343780, "epoch": 2046} {"train_loss": -11.78462028503418, "global_step": 343781, "epoch": 2046} {"train_loss": -11.986148834228516, "global_step": 343782, "epoch": 2046} {"train_loss": -11.67818832397461, "global_step": 343783, "epoch": 2046} {"train_loss": -12.309136390686035, "global_step": 343784, "epoch": 2046} {"train_loss": -11.984431266784668, "global_step": 343785, "epoch": 2046} {"train_loss": -11.92559814453125, "global_step": 343786, "epoch": 2046} {"train_loss": -11.677515029907227, "global_step": 343787, "epoch": 2046} {"train_loss": -11.879047393798828, "global_step": 343788, "epoch": 2046} {"train_loss": -11.723164558410645, "global_step": 343789, "epoch": 2046} {"train_loss": -11.565030097961426, "global_step": 343790, "epoch": 2046} {"train_loss": -10.448759078979492, "global_step": 343791, "epoch": 2046} {"train_loss": -10.578062057495117, "global_step": 343792, "epoch": 2046} {"train_loss": -11.168879508972168, "global_step": 343793, "epoch": 2046} {"train_loss": -11.612932205200195, "global_step": 343794, "epoch": 2046} {"train_loss": -11.036042213439941, "global_step": 343795, "epoch": 2046} {"train_loss": -11.231973648071289, "global_step": 343796, "epoch": 2046} {"train_loss": -11.575728416442871, "global_step": 343797, "epoch": 2046} {"train_loss": -9.995582580566406, "global_step": 343798, "epoch": 2046} {"train_loss": -10.762676239013672, "global_step": 343799, "epoch": 2046} {"train_loss": -10.796497344970703, "global_step": 343800, "epoch": 2046} {"train_loss": -10.652894973754883, "global_step": 343801, "epoch": 2046} {"train_loss": -10.726325988769531, "global_step": 343802, "epoch": 2046} {"train_loss": -10.049834251403809, "global_step": 343803, "epoch": 2046} {"train_loss": -9.447038650512695, "global_step": 343804, "epoch": 2046} {"train_loss": -9.983526229858398, "global_step": 343805, "epoch": 2046} {"train_loss": -10.783318519592285, "global_step": 343806, "epoch": 2046} {"train_loss": -10.734991073608398, "global_step": 343807, "epoch": 2046} {"train_loss": -11.029372215270996, "global_step": 343808, "epoch": 2046} {"train_loss": -10.872831344604492, "global_step": 343809, "epoch": 2046} {"train_loss": -11.73509407043457, "global_step": 343810, "epoch": 2046} {"train_loss": -11.449161529541016, "global_step": 343811, "epoch": 2046} {"train_loss": -11.691996574401855, "global_step": 343812, "epoch": 2046} {"train_loss": -11.847968101501465, "global_step": 343813, "epoch": 2046} {"train_loss": -11.685593605041504, "global_step": 343814, "epoch": 2046} {"train_loss": -11.701127052307129, "global_step": 343815, "epoch": 2046} {"train_loss": -11.394020080566406, "global_step": 343816, "epoch": 2046} {"train_loss": -11.877738952636719, "global_step": 343817, "epoch": 2046} {"train_loss": -11.844500541687012, "global_step": 343818, "epoch": 2046} {"train_loss": -11.649650573730469, "global_step": 343819, "epoch": 2046} {"train_loss": -11.38847827911377, "global_step": 343820, "epoch": 2046} {"train_loss": -11.823915481567383, "global_step": 343821, "epoch": 2046} {"train_loss": -11.81130599975586, "global_step": 343822, "epoch": 2046} {"train_loss": -11.809334754943848, "global_step": 343823, "epoch": 2046} {"train_loss": -12.011032104492188, "global_step": 343824, "epoch": 2046} {"train_loss": -11.180265426635742, "global_step": 343825, "epoch": 2046} {"train_loss": -11.857015609741211, "global_step": 343826, "epoch": 2046} {"train_loss": -11.697922706604004, "global_step": 343827, "epoch": 2046} {"train_loss": -11.679220199584961, "global_step": 343828, "epoch": 2046} {"train_loss": -12.06799030303955, "global_step": 343829, "epoch": 2046} {"train_loss": -11.989545822143555, "global_step": 343830, "epoch": 2046} {"train_loss": -12.076208114624023, "global_step": 343831, "epoch": 2046} {"train_loss": -12.05505084991455, "global_step": 343832, "epoch": 2046} {"train_loss": -12.281102180480957, "global_step": 343833, "epoch": 2046} {"train_loss": -12.097113609313965, "global_step": 343834, "epoch": 2046} {"train_loss": -12.189594268798828, "global_step": 343835, "epoch": 2046} {"train_loss": -12.033100128173828, "global_step": 343836, "epoch": 2046} {"train_loss": -12.089529037475586, "global_step": 343837, "epoch": 2046} {"train_loss": -12.184874534606934, "global_step": 343838, "epoch": 2046} {"train_loss": -12.09459400177002, "global_step": 343839, "epoch": 2046} {"train_loss": -12.10708236694336, "global_step": 343840, "epoch": 2046} {"train_loss": -11.828971862792969, "global_step": 343841, "epoch": 2046} {"train_loss": -12.076375007629395, "global_step": 343842, "epoch": 2046} {"train_loss": -12.375041961669922, "global_step": 343843, "epoch": 2046} {"train_loss": -12.098884582519531, "global_step": 343844, "epoch": 2046} {"train_loss": -12.208431243896484, "global_step": 343845, "epoch": 2046} {"train_loss": -12.072870254516602, "global_step": 343846, "epoch": 2046} {"train_loss": -12.221281051635742, "global_step": 343847, "epoch": 2046} {"train_loss": -12.056915283203125, "global_step": 343848, "epoch": 2046} {"train_loss": -12.063713073730469, "global_step": 343849, "epoch": 2046} {"train_loss": -12.393023490905762, "global_step": 343850, "epoch": 2046} {"train_loss": -12.12501335144043, "global_step": 343851, "epoch": 2046} {"train_loss": -12.012236595153809, "global_step": 343852, "epoch": 2046} {"train_loss": -12.177392959594727, "global_step": 343853, "epoch": 2046} {"train_loss": -12.148795127868652, "global_step": 343854, "epoch": 2046} {"train_loss": -12.380260467529297, "global_step": 343855, "epoch": 2046} {"train_loss": -12.12442684173584, "global_step": 343856, "epoch": 2046} {"train_loss": -12.268516540527344, "global_step": 343857, "epoch": 2046} {"train_loss": -12.09213638305664, "global_step": 343858, "epoch": 2046} {"train_loss": -12.06119155883789, "global_step": 343859, "epoch": 2046} {"train_loss": -12.19350814819336, "global_step": 343860, "epoch": 2046} {"train_loss": -11.879072189331055, "global_step": 343861, "epoch": 2046} {"train_loss": -12.437902450561523, "global_step": 343862, "epoch": 2046} {"train_loss": -12.316676139831543, "global_step": 343863, "epoch": 2046} {"train_loss": -12.35566234588623, "global_step": 343864, "epoch": 2046} {"train_loss": -12.374003410339355, "global_step": 343865, "epoch": 2046} {"train_loss": -12.329704284667969, "global_step": 343866, "epoch": 2046} {"train_loss": -12.465033531188965, "global_step": 343867, "epoch": 2046} {"train_loss": -12.114261627197266, "global_step": 343868, "epoch": 2046} {"train_loss": -12.334800720214844, "global_step": 343869, "epoch": 2046} {"train_loss": -12.569313049316406, "global_step": 343870, "epoch": 2046} {"train_loss": -11.982508659362793, "global_step": 343871, "epoch": 2046} {"train_loss": -12.34935188293457, "global_step": 343872, "epoch": 2046} {"train_loss": -12.178780555725098, "global_step": 343873, "epoch": 2046} {"train_loss": -12.44051456451416, "global_step": 343874, "epoch": 2046} {"train_loss": -11.960123062133789, "global_step": 343875, "epoch": 2046} {"train_loss": -12.098153114318848, "global_step": 343876, "epoch": 2046} {"train_loss": -12.410356521606445, "global_step": 343877, "epoch": 2046} {"train_loss": -11.978265762329102, "global_step": 343878, "epoch": 2046} {"train_loss": -12.291678428649902, "global_step": 343879, "epoch": 2046} {"train_loss": -11.948770523071289, "global_step": 343880, "epoch": 2046} {"train_loss": -11.658441543579102, "global_step": 343881, "epoch": 2046} {"train_loss": -11.934316635131836, "global_step": 343882, "epoch": 2046} {"train_loss": -12.0557279586792, "global_step": 343883, "epoch": 2046} {"train_loss": -11.665515899658203, "global_step": 343884, "epoch": 2046} {"train_loss": -12.570916175842285, "global_step": 343885, "epoch": 2046} {"train_loss": -12.166202545166016, "global_step": 343886, "epoch": 2046} {"train_loss": -12.054969787597656, "global_step": 343887, "epoch": 2046} {"train_loss": -11.550681114196777, "global_step": 343888, "epoch": 2046} {"train_loss": -12.339963912963867, "global_step": 343889, "epoch": 2046} {"train_loss": -11.966564178466797, "global_step": 343890, "epoch": 2046} {"train_loss": -12.203089714050293, "global_step": 343891, "epoch": 2046} {"train_loss": -12.04345703125, "global_step": 343892, "epoch": 2046} {"train_loss": -12.22679328918457, "global_step": 343893, "epoch": 2046} {"train_loss": -12.26822280883789, "global_step": 343894, "epoch": 2046} {"train_loss": -11.953286329905191, "global_step": 343895, "epoch": 2046, "val_loss": 283811.40625} {"train_loss": -11.790853500366211, "global_step": 343896, "epoch": 2047} {"train_loss": -12.215044021606445, "global_step": 343897, "epoch": 2047} {"train_loss": -12.041488647460938, "global_step": 343898, "epoch": 2047} {"train_loss": -12.035646438598633, "global_step": 343899, "epoch": 2047} {"train_loss": -12.28238582611084, "global_step": 343900, "epoch": 2047} {"train_loss": -12.505725860595703, "global_step": 343901, "epoch": 2047} {"train_loss": -12.198680877685547, "global_step": 343902, "epoch": 2047} {"train_loss": -12.312213897705078, "global_step": 343903, "epoch": 2047} {"train_loss": -12.406745910644531, "global_step": 343904, "epoch": 2047} {"train_loss": -12.318851470947266, "global_step": 343905, "epoch": 2047} {"train_loss": -12.26199722290039, "global_step": 343906, "epoch": 2047} {"train_loss": -12.234777450561523, "global_step": 343907, "epoch": 2047} {"train_loss": -12.466228485107422, "global_step": 343908, "epoch": 2047} {"train_loss": -12.303163528442383, "global_step": 343909, "epoch": 2047} {"train_loss": -12.610626220703125, "global_step": 343910, "epoch": 2047} {"train_loss": -12.266209602355957, "global_step": 343911, "epoch": 2047} {"train_loss": -12.370685577392578, "global_step": 343912, "epoch": 2047} {"train_loss": -12.32162094116211, "global_step": 343913, "epoch": 2047} {"train_loss": -12.354669570922852, "global_step": 343914, "epoch": 2047} {"train_loss": -12.220512390136719, "global_step": 343915, "epoch": 2047} {"train_loss": -12.148286819458008, "global_step": 343916, "epoch": 2047} {"train_loss": -12.327325820922852, "global_step": 343917, "epoch": 2047} {"train_loss": -12.358833312988281, "global_step": 343918, "epoch": 2047} {"train_loss": -12.477514266967773, "global_step": 343919, "epoch": 2047} {"train_loss": -11.6962890625, "global_step": 343920, "epoch": 2047} {"train_loss": -12.042601585388184, "global_step": 343921, "epoch": 2047} {"train_loss": -12.229053497314453, "global_step": 343922, "epoch": 2047} {"train_loss": -10.385480880737305, "global_step": 343923, "epoch": 2047} {"train_loss": -11.729290008544922, "global_step": 343924, "epoch": 2047} {"train_loss": -10.930829048156738, "global_step": 343925, "epoch": 2047} {"train_loss": -10.813068389892578, "global_step": 343926, "epoch": 2047} {"train_loss": -10.88653564453125, "global_step": 343927, "epoch": 2047} {"train_loss": -10.995309829711914, "global_step": 343928, "epoch": 2047} {"train_loss": -10.307952880859375, "global_step": 343929, "epoch": 2047} {"train_loss": -12.003737449645996, "global_step": 343930, "epoch": 2047} {"train_loss": -10.02821159362793, "global_step": 343931, "epoch": 2047} {"train_loss": -11.570913314819336, "global_step": 343932, "epoch": 2047} {"train_loss": -10.092241287231445, "global_step": 343933, "epoch": 2047} {"train_loss": -11.038981437683105, "global_step": 343934, "epoch": 2047} {"train_loss": -10.352840423583984, "global_step": 343935, "epoch": 2047} {"train_loss": -11.53369140625, "global_step": 343936, "epoch": 2047} {"train_loss": -11.124212265014648, "global_step": 343937, "epoch": 2047} {"train_loss": -11.852630615234375, "global_step": 343938, "epoch": 2047} {"train_loss": -11.442753791809082, "global_step": 343939, "epoch": 2047} {"train_loss": -11.785139083862305, "global_step": 343940, "epoch": 2047} {"train_loss": -12.048151969909668, "global_step": 343941, "epoch": 2047} {"train_loss": -11.459029197692871, "global_step": 343942, "epoch": 2047} {"train_loss": -11.707386016845703, "global_step": 343943, "epoch": 2047} {"train_loss": -11.305572509765625, "global_step": 343944, "epoch": 2047} {"train_loss": -11.907448768615723, "global_step": 343945, "epoch": 2047} {"train_loss": -11.836141586303711, "global_step": 343946, "epoch": 2047} {"train_loss": -11.54366683959961, "global_step": 343947, "epoch": 2047} {"train_loss": -11.817764282226562, "global_step": 343948, "epoch": 2047} {"train_loss": -11.20103645324707, "global_step": 343949, "epoch": 2047} {"train_loss": -11.916759490966797, "global_step": 343950, "epoch": 2047} {"train_loss": -11.924860000610352, "global_step": 343951, "epoch": 2047} {"train_loss": -11.567193984985352, "global_step": 343952, "epoch": 2047} {"train_loss": -12.27046012878418, "global_step": 343953, "epoch": 2047} {"train_loss": -11.363608360290527, "global_step": 343954, "epoch": 2047} {"train_loss": -12.400299072265625, "global_step": 343955, "epoch": 2047} {"train_loss": -11.830301284790039, "global_step": 343956, "epoch": 2047} {"train_loss": -12.135677337646484, "global_step": 343957, "epoch": 2047} {"train_loss": -12.018838882446289, "global_step": 343958, "epoch": 2047} {"train_loss": -12.149027824401855, "global_step": 343959, "epoch": 2047} {"train_loss": -12.1096773147583, "global_step": 343960, "epoch": 2047} {"train_loss": -12.006553649902344, "global_step": 343961, "epoch": 2047} {"train_loss": -12.042074203491211, "global_step": 343962, "epoch": 2047} {"train_loss": -11.939743041992188, "global_step": 343963, "epoch": 2047} {"train_loss": -12.198234558105469, "global_step": 343964, "epoch": 2047} {"train_loss": -12.36264705657959, "global_step": 343965, "epoch": 2047} {"train_loss": -12.316786766052246, "global_step": 343966, "epoch": 2047} {"train_loss": -12.13961124420166, "global_step": 343967, "epoch": 2047} {"train_loss": -12.289058685302734, "global_step": 343968, "epoch": 2047} {"train_loss": -12.434962272644043, "global_step": 343969, "epoch": 2047} {"train_loss": -12.482950210571289, "global_step": 343970, "epoch": 2047} {"train_loss": -12.183999061584473, "global_step": 343971, "epoch": 2047} {"train_loss": -12.327407836914062, "global_step": 343972, "epoch": 2047} {"train_loss": -12.224035263061523, "global_step": 343973, "epoch": 2047} {"train_loss": -12.396430969238281, "global_step": 343974, "epoch": 2047} {"train_loss": -12.108101844787598, "global_step": 343975, "epoch": 2047} {"train_loss": -12.139938354492188, "global_step": 343976, "epoch": 2047} {"train_loss": -12.369097709655762, "global_step": 343977, "epoch": 2047} {"train_loss": -12.283175468444824, "global_step": 343978, "epoch": 2047} {"train_loss": -12.369160652160645, "global_step": 343979, "epoch": 2047} {"train_loss": -12.538932800292969, "global_step": 343980, "epoch": 2047} {"train_loss": -12.311267852783203, "global_step": 343981, "epoch": 2047} {"train_loss": -12.552122116088867, "global_step": 343982, "epoch": 2047} {"train_loss": -12.373003005981445, "global_step": 343983, "epoch": 2047} {"train_loss": -11.954863548278809, "global_step": 343984, "epoch": 2047} {"train_loss": -12.150367736816406, "global_step": 343985, "epoch": 2047} {"train_loss": -12.628729820251465, "global_step": 343986, "epoch": 2047} {"train_loss": -12.125322341918945, "global_step": 343987, "epoch": 2047} {"train_loss": -12.390812873840332, "global_step": 343988, "epoch": 2047} {"train_loss": -12.062097549438477, "global_step": 343989, "epoch": 2047} {"train_loss": -12.159382820129395, "global_step": 343990, "epoch": 2047} {"train_loss": -11.742583274841309, "global_step": 343991, "epoch": 2047} {"train_loss": -11.911365509033203, "global_step": 343992, "epoch": 2047} {"train_loss": -11.791815757751465, "global_step": 343993, "epoch": 2047} {"train_loss": -11.947809219360352, "global_step": 343994, "epoch": 2047} {"train_loss": -11.67203140258789, "global_step": 343995, "epoch": 2047} {"train_loss": -12.12575626373291, "global_step": 343996, "epoch": 2047} {"train_loss": -11.984557151794434, "global_step": 343997, "epoch": 2047} {"train_loss": -12.266475677490234, "global_step": 343998, "epoch": 2047} {"train_loss": -11.9017333984375, "global_step": 343999, "epoch": 2047} {"train_loss": -12.241284370422363, "global_step": 344000, "epoch": 2047} {"train_loss": -11.951062202453613, "global_step": 344001, "epoch": 2047} {"train_loss": -12.286516189575195, "global_step": 344002, "epoch": 2047} {"train_loss": -11.804766654968262, "global_step": 344003, "epoch": 2047} {"train_loss": -12.22266960144043, "global_step": 344004, "epoch": 2047} {"train_loss": -11.57516860961914, "global_step": 344005, "epoch": 2047} {"train_loss": -11.881370544433594, "global_step": 344006, "epoch": 2047} {"train_loss": -12.062328338623047, "global_step": 344007, "epoch": 2047} {"train_loss": -12.319256782531738, "global_step": 344008, "epoch": 2047} {"train_loss": -11.587285995483398, "global_step": 344009, "epoch": 2047} {"train_loss": -12.20126724243164, "global_step": 344010, "epoch": 2047} {"train_loss": -11.48503303527832, "global_step": 344011, "epoch": 2047} {"train_loss": -11.578540802001953, "global_step": 344012, "epoch": 2047} {"train_loss": -11.194070816040039, "global_step": 344013, "epoch": 2047} {"train_loss": -11.74785041809082, "global_step": 344014, "epoch": 2047} {"train_loss": -11.929304122924805, "global_step": 344015, "epoch": 2047} {"train_loss": -11.638574600219727, "global_step": 344016, "epoch": 2047} {"train_loss": -11.675844192504883, "global_step": 344017, "epoch": 2047} {"train_loss": -11.921688079833984, "global_step": 344018, "epoch": 2047} {"train_loss": -12.079879760742188, "global_step": 344019, "epoch": 2047} {"train_loss": -11.738064765930176, "global_step": 344020, "epoch": 2047} {"train_loss": -11.995017051696777, "global_step": 344021, "epoch": 2047} {"train_loss": -11.804142951965332, "global_step": 344022, "epoch": 2047} {"train_loss": -11.700494766235352, "global_step": 344023, "epoch": 2047} {"train_loss": -12.090258598327637, "global_step": 344024, "epoch": 2047} {"train_loss": -11.853063583374023, "global_step": 344025, "epoch": 2047} {"train_loss": -12.32042407989502, "global_step": 344026, "epoch": 2047} {"train_loss": -11.930693626403809, "global_step": 344027, "epoch": 2047} {"train_loss": -12.19693374633789, "global_step": 344028, "epoch": 2047} {"train_loss": -11.896587371826172, "global_step": 344029, "epoch": 2047} {"train_loss": -12.145346641540527, "global_step": 344030, "epoch": 2047} {"train_loss": -12.144904136657715, "global_step": 344031, "epoch": 2047} {"train_loss": -11.913755416870117, "global_step": 344032, "epoch": 2047} {"train_loss": -12.340476036071777, "global_step": 344033, "epoch": 2047} {"train_loss": -12.07673454284668, "global_step": 344034, "epoch": 2047} {"train_loss": -12.509807586669922, "global_step": 344035, "epoch": 2047} {"train_loss": -12.182574272155762, "global_step": 344036, "epoch": 2047} {"train_loss": -12.012198448181152, "global_step": 344037, "epoch": 2047} {"train_loss": -12.425064086914062, "global_step": 344038, "epoch": 2047} {"train_loss": -12.184364318847656, "global_step": 344039, "epoch": 2047} {"train_loss": -12.423828125, "global_step": 344040, "epoch": 2047} {"train_loss": -12.33253002166748, "global_step": 344041, "epoch": 2047} {"train_loss": -12.116382598876953, "global_step": 344042, "epoch": 2047} {"train_loss": -12.536199569702148, "global_step": 344043, "epoch": 2047} {"train_loss": -12.082368850708008, "global_step": 344044, "epoch": 2047} {"train_loss": -12.252792358398438, "global_step": 344045, "epoch": 2047} {"train_loss": -12.270587921142578, "global_step": 344046, "epoch": 2047} {"train_loss": -12.572415351867676, "global_step": 344047, "epoch": 2047} {"train_loss": -11.777905464172363, "global_step": 344048, "epoch": 2047} {"train_loss": -12.039201736450195, "global_step": 344049, "epoch": 2047} {"train_loss": -12.571063995361328, "global_step": 344050, "epoch": 2047} {"train_loss": -12.14692497253418, "global_step": 344051, "epoch": 2047} {"train_loss": -12.321024894714355, "global_step": 344052, "epoch": 2047} {"train_loss": -12.445625305175781, "global_step": 344053, "epoch": 2047} {"train_loss": -12.576414108276367, "global_step": 344054, "epoch": 2047} {"train_loss": -12.33569049835205, "global_step": 344055, "epoch": 2047} {"train_loss": -12.049901962280273, "global_step": 344056, "epoch": 2047} {"train_loss": -12.096785545349121, "global_step": 344057, "epoch": 2047} {"train_loss": -11.95663833618164, "global_step": 344058, "epoch": 2047} {"train_loss": -11.686623573303223, "global_step": 344059, "epoch": 2047} {"train_loss": -11.907703399658203, "global_step": 344060, "epoch": 2047} {"train_loss": -12.634073257446289, "global_step": 344061, "epoch": 2047} {"train_loss": -11.245943069458008, "global_step": 344062, "epoch": 2047} {"train_loss": -11.979987922168913, "global_step": 344063, "epoch": 2047, "val_loss": 286914.59375} {"train_loss": -11.91666030883789, "global_step": 344064, "epoch": 2048} {"train_loss": -12.285951614379883, "global_step": 344065, "epoch": 2048} {"train_loss": -11.095413208007812, "global_step": 344066, "epoch": 2048} {"train_loss": -12.017114639282227, "global_step": 344067, "epoch": 2048} {"train_loss": -11.663884162902832, "global_step": 344068, "epoch": 2048} {"train_loss": -11.38873291015625, "global_step": 344069, "epoch": 2048} {"train_loss": -11.630661010742188, "global_step": 344070, "epoch": 2048} {"train_loss": -11.806234359741211, "global_step": 344071, "epoch": 2048} {"train_loss": -11.832777976989746, "global_step": 344072, "epoch": 2048} {"train_loss": -12.41705322265625, "global_step": 344073, "epoch": 2048} {"train_loss": -12.03389835357666, "global_step": 344074, "epoch": 2048} {"train_loss": -12.058897018432617, "global_step": 344075, "epoch": 2048} {"train_loss": -12.184541702270508, "global_step": 344076, "epoch": 2048} {"train_loss": -12.233681678771973, "global_step": 344077, "epoch": 2048} {"train_loss": -12.315853118896484, "global_step": 344078, "epoch": 2048} {"train_loss": -12.02733039855957, "global_step": 344079, "epoch": 2048} {"train_loss": -12.152764320373535, "global_step": 344080, "epoch": 2048} {"train_loss": -10.916509628295898, "global_step": 344081, "epoch": 2048} {"train_loss": -11.706034660339355, "global_step": 344082, "epoch": 2048} {"train_loss": -12.173225402832031, "global_step": 344083, "epoch": 2048} {"train_loss": -11.953226089477539, "global_step": 344084, "epoch": 2048} {"train_loss": -11.816890716552734, "global_step": 344085, "epoch": 2048} {"train_loss": -11.7658109664917, "global_step": 344086, "epoch": 2048} {"train_loss": -12.163322448730469, "global_step": 344087, "epoch": 2048} {"train_loss": -12.174408912658691, "global_step": 344088, "epoch": 2048} {"train_loss": -12.43537712097168, "global_step": 344089, "epoch": 2048} {"train_loss": -12.054706573486328, "global_step": 344090, "epoch": 2048} {"train_loss": -12.338689804077148, "global_step": 344091, "epoch": 2048} {"train_loss": -12.307004928588867, "global_step": 344092, "epoch": 2048} {"train_loss": -12.331088066101074, "global_step": 344093, "epoch": 2048} {"train_loss": -12.290678024291992, "global_step": 344094, "epoch": 2048} {"train_loss": -12.463520050048828, "global_step": 344095, "epoch": 2048} {"train_loss": -12.250088691711426, "global_step": 344096, "epoch": 2048} {"train_loss": -12.156314849853516, "global_step": 344097, "epoch": 2048} {"train_loss": -12.260747909545898, "global_step": 344098, "epoch": 2048} {"train_loss": -12.280389785766602, "global_step": 344099, "epoch": 2048} {"train_loss": -11.897419929504395, "global_step": 344100, "epoch": 2048} {"train_loss": -12.448358535766602, "global_step": 344101, "epoch": 2048} {"train_loss": -12.22715950012207, "global_step": 344102, "epoch": 2048} {"train_loss": -12.392967224121094, "global_step": 344103, "epoch": 2048} {"train_loss": -12.066046714782715, "global_step": 344104, "epoch": 2048} {"train_loss": -12.295032501220703, "global_step": 344105, "epoch": 2048} {"train_loss": -12.516777992248535, "global_step": 344106, "epoch": 2048} {"train_loss": -12.279078483581543, "global_step": 344107, "epoch": 2048} {"train_loss": -12.248787879943848, "global_step": 344108, "epoch": 2048} {"train_loss": -12.130681991577148, "global_step": 344109, "epoch": 2048} {"train_loss": -12.160473823547363, "global_step": 344110, "epoch": 2048} {"train_loss": -12.229372024536133, "global_step": 344111, "epoch": 2048} {"train_loss": -12.430395126342773, "global_step": 344112, "epoch": 2048} {"train_loss": -12.32138442993164, "global_step": 344113, "epoch": 2048} {"train_loss": -12.555768966674805, "global_step": 344114, "epoch": 2048} {"train_loss": -11.771123886108398, "global_step": 344115, "epoch": 2048} {"train_loss": -11.921993255615234, "global_step": 344116, "epoch": 2048} {"train_loss": -12.683662414550781, "global_step": 344117, "epoch": 2048} {"train_loss": -12.073773384094238, "global_step": 344118, "epoch": 2048} {"train_loss": -11.924822807312012, "global_step": 344119, "epoch": 2048} {"train_loss": -12.424519538879395, "global_step": 344120, "epoch": 2048} {"train_loss": -12.419286727905273, "global_step": 344121, "epoch": 2048} {"train_loss": -12.56781005859375, "global_step": 344122, "epoch": 2048} {"train_loss": -12.465991973876953, "global_step": 344123, "epoch": 2048} {"train_loss": -12.365274429321289, "global_step": 344124, "epoch": 2048} {"train_loss": -12.14792251586914, "global_step": 344125, "epoch": 2048} {"train_loss": -12.424741744995117, "global_step": 344126, "epoch": 2048} {"train_loss": -12.58143138885498, "global_step": 344127, "epoch": 2048} {"train_loss": -11.99398136138916, "global_step": 344128, "epoch": 2048} {"train_loss": -12.116164207458496, "global_step": 344129, "epoch": 2048} {"train_loss": -12.410650253295898, "global_step": 344130, "epoch": 2048} {"train_loss": -12.229194641113281, "global_step": 344131, "epoch": 2048} {"train_loss": -12.060043334960938, "global_step": 344132, "epoch": 2048} {"train_loss": -11.997943878173828, "global_step": 344133, "epoch": 2048} {"train_loss": -12.419403076171875, "global_step": 344134, "epoch": 2048} {"train_loss": -12.31174373626709, "global_step": 344135, "epoch": 2048} {"train_loss": -12.52670669555664, "global_step": 344136, "epoch": 2048} {"train_loss": -12.522418022155762, "global_step": 344137, "epoch": 2048} {"train_loss": -12.328986167907715, "global_step": 344138, "epoch": 2048} {"train_loss": -12.327571868896484, "global_step": 344139, "epoch": 2048} {"train_loss": -12.280706405639648, "global_step": 344140, "epoch": 2048} {"train_loss": -12.817550659179688, "global_step": 344141, "epoch": 2048} {"train_loss": -12.319993019104004, "global_step": 344142, "epoch": 2048} {"train_loss": -11.954940795898438, "global_step": 344143, "epoch": 2048} {"train_loss": -12.176258087158203, "global_step": 344144, "epoch": 2048} {"train_loss": -12.689908981323242, "global_step": 344145, "epoch": 2048} {"train_loss": -12.477983474731445, "global_step": 344146, "epoch": 2048} {"train_loss": -12.440494537353516, "global_step": 344147, "epoch": 2048} {"train_loss": -12.50331974029541, "global_step": 344148, "epoch": 2048} {"train_loss": -12.536771774291992, "global_step": 344149, "epoch": 2048} {"train_loss": -12.15318489074707, "global_step": 344150, "epoch": 2048} {"train_loss": -12.312370300292969, "global_step": 344151, "epoch": 2048} {"train_loss": -12.419071197509766, "global_step": 344152, "epoch": 2048} {"train_loss": -12.152868270874023, "global_step": 344153, "epoch": 2048} {"train_loss": -12.599828720092773, "global_step": 344154, "epoch": 2048} {"train_loss": -12.458677291870117, "global_step": 344155, "epoch": 2048} {"train_loss": -12.585601806640625, "global_step": 344156, "epoch": 2048} {"train_loss": -12.568025588989258, "global_step": 344157, "epoch": 2048} {"train_loss": -12.788711547851562, "global_step": 344158, "epoch": 2048} {"train_loss": -12.219276428222656, "global_step": 344159, "epoch": 2048} {"train_loss": -11.93971061706543, "global_step": 344160, "epoch": 2048} {"train_loss": -11.836690902709961, "global_step": 344161, "epoch": 2048} {"train_loss": -11.745135307312012, "global_step": 344162, "epoch": 2048} {"train_loss": -12.538166046142578, "global_step": 344163, "epoch": 2048} {"train_loss": -12.035061836242676, "global_step": 344164, "epoch": 2048} {"train_loss": -10.558938980102539, "global_step": 344165, "epoch": 2048} {"train_loss": -11.562515258789062, "global_step": 344166, "epoch": 2048} {"train_loss": -12.370587348937988, "global_step": 344167, "epoch": 2048} {"train_loss": -11.756338119506836, "global_step": 344168, "epoch": 2048} {"train_loss": -11.830842971801758, "global_step": 344169, "epoch": 2048} {"train_loss": -12.473821640014648, "global_step": 344170, "epoch": 2048} {"train_loss": -12.272836685180664, "global_step": 344171, "epoch": 2048} {"train_loss": -11.712444305419922, "global_step": 344172, "epoch": 2048} {"train_loss": -12.23799991607666, "global_step": 344173, "epoch": 2048} {"train_loss": -12.558706283569336, "global_step": 344174, "epoch": 2048} {"train_loss": -11.690984725952148, "global_step": 344175, "epoch": 2048} {"train_loss": -11.783069610595703, "global_step": 344176, "epoch": 2048} {"train_loss": -12.323381423950195, "global_step": 344177, "epoch": 2048} {"train_loss": -12.270452499389648, "global_step": 344178, "epoch": 2048} {"train_loss": -11.591789245605469, "global_step": 344179, "epoch": 2048} {"train_loss": -11.769794464111328, "global_step": 344180, "epoch": 2048} {"train_loss": -11.415498733520508, "global_step": 344181, "epoch": 2048} {"train_loss": -11.334070205688477, "global_step": 344182, "epoch": 2048} {"train_loss": -11.736976623535156, "global_step": 344183, "epoch": 2048} {"train_loss": -11.802042007446289, "global_step": 344184, "epoch": 2048} {"train_loss": -11.458739280700684, "global_step": 344185, "epoch": 2048} {"train_loss": -11.028290748596191, "global_step": 344186, "epoch": 2048} {"train_loss": -11.407539367675781, "global_step": 344187, "epoch": 2048} {"train_loss": -11.630280494689941, "global_step": 344188, "epoch": 2048} {"train_loss": -11.138028144836426, "global_step": 344189, "epoch": 2048} {"train_loss": -11.805360794067383, "global_step": 344190, "epoch": 2048} {"train_loss": -11.999565124511719, "global_step": 344191, "epoch": 2048} {"train_loss": -12.009620666503906, "global_step": 344192, "epoch": 2048} {"train_loss": -11.851085662841797, "global_step": 344193, "epoch": 2048} {"train_loss": -12.16602897644043, "global_step": 344194, "epoch": 2048} {"train_loss": -12.077816009521484, "global_step": 344195, "epoch": 2048} {"train_loss": -12.130569458007812, "global_step": 344196, "epoch": 2048} {"train_loss": -11.809370994567871, "global_step": 344197, "epoch": 2048} {"train_loss": -11.905473709106445, "global_step": 344198, "epoch": 2048} {"train_loss": -12.219684600830078, "global_step": 344199, "epoch": 2048} {"train_loss": -12.155317306518555, "global_step": 344200, "epoch": 2048} {"train_loss": -12.304259300231934, "global_step": 344201, "epoch": 2048} {"train_loss": -12.035831451416016, "global_step": 344202, "epoch": 2048} {"train_loss": -12.624471664428711, "global_step": 344203, "epoch": 2048} {"train_loss": -11.990610122680664, "global_step": 344204, "epoch": 2048} {"train_loss": -12.020304679870605, "global_step": 344205, "epoch": 2048} {"train_loss": -12.482242584228516, "global_step": 344206, "epoch": 2048} {"train_loss": -12.353080749511719, "global_step": 344207, "epoch": 2048} {"train_loss": -12.46397876739502, "global_step": 344208, "epoch": 2048} {"train_loss": -12.27794361114502, "global_step": 344209, "epoch": 2048} {"train_loss": -12.37915325164795, "global_step": 344210, "epoch": 2048} {"train_loss": -11.892326354980469, "global_step": 344211, "epoch": 2048} {"train_loss": -12.074274063110352, "global_step": 344212, "epoch": 2048} {"train_loss": -12.221233367919922, "global_step": 344213, "epoch": 2048} {"train_loss": -11.913244247436523, "global_step": 344214, "epoch": 2048} {"train_loss": -12.060232162475586, "global_step": 344215, "epoch": 2048} {"train_loss": -12.050284385681152, "global_step": 344216, "epoch": 2048} {"train_loss": -12.331733703613281, "global_step": 344217, "epoch": 2048} {"train_loss": -12.207029342651367, "global_step": 344218, "epoch": 2048} {"train_loss": -12.266796112060547, "global_step": 344219, "epoch": 2048} {"train_loss": -11.841726303100586, "global_step": 344220, "epoch": 2048} {"train_loss": -11.91641616821289, "global_step": 344221, "epoch": 2048} {"train_loss": -11.795394897460938, "global_step": 344222, "epoch": 2048} {"train_loss": -11.338187217712402, "global_step": 344223, "epoch": 2048} {"train_loss": -10.825345993041992, "global_step": 344224, "epoch": 2048} {"train_loss": -10.293535232543945, "global_step": 344225, "epoch": 2048} {"train_loss": -10.338409423828125, "global_step": 344226, "epoch": 2048} {"train_loss": -11.926458358764648, "global_step": 344227, "epoch": 2048} {"train_loss": -10.557686805725098, "global_step": 344228, "epoch": 2048} {"train_loss": -10.18834400177002, "global_step": 344229, "epoch": 2048} {"train_loss": -10.146737098693848, "global_step": 344230, "epoch": 2048} {"train_loss": -12.036513538587661, "global_step": 344231, "epoch": 2048, "val_loss": 287401.15625} {"train_loss": -8.918924331665039, "global_step": 344232, "epoch": 2049} {"train_loss": -10.82784652709961, "global_step": 344233, "epoch": 2049} {"train_loss": -10.61145305633545, "global_step": 344234, "epoch": 2049} {"train_loss": -8.479199409484863, "global_step": 344235, "epoch": 2049} {"train_loss": -9.53844928741455, "global_step": 344236, "epoch": 2049} {"train_loss": -9.283838272094727, "global_step": 344237, "epoch": 2049} {"train_loss": -10.380875587463379, "global_step": 344238, "epoch": 2049} {"train_loss": -9.344244003295898, "global_step": 344239, "epoch": 2049} {"train_loss": -10.18730354309082, "global_step": 344240, "epoch": 2049} {"train_loss": -9.633635520935059, "global_step": 344241, "epoch": 2049} {"train_loss": -10.076309204101562, "global_step": 344242, "epoch": 2049} {"train_loss": -9.971437454223633, "global_step": 344243, "epoch": 2049} {"train_loss": -10.740116119384766, "global_step": 344244, "epoch": 2049} {"train_loss": -8.221892356872559, "global_step": 344245, "epoch": 2049} {"train_loss": -10.16775131225586, "global_step": 344246, "epoch": 2049} {"train_loss": -9.085269927978516, "global_step": 344247, "epoch": 2049} {"train_loss": -9.576647758483887, "global_step": 344248, "epoch": 2049} {"train_loss": -10.391429901123047, "global_step": 344249, "epoch": 2049} {"train_loss": -9.48819351196289, "global_step": 344250, "epoch": 2049} {"train_loss": -10.62241268157959, "global_step": 344251, "epoch": 2049} {"train_loss": -10.576638221740723, "global_step": 344252, "epoch": 2049} {"train_loss": -10.709407806396484, "global_step": 344253, "epoch": 2049} {"train_loss": -10.587047576904297, "global_step": 344254, "epoch": 2049} {"train_loss": -10.529485702514648, "global_step": 344255, "epoch": 2049} {"train_loss": -10.705915451049805, "global_step": 344256, "epoch": 2049} {"train_loss": -11.035146713256836, "global_step": 344257, "epoch": 2049} {"train_loss": -10.708993911743164, "global_step": 344258, "epoch": 2049} {"train_loss": -11.162996292114258, "global_step": 344259, "epoch": 2049} {"train_loss": -11.142487525939941, "global_step": 344260, "epoch": 2049} {"train_loss": -11.104329109191895, "global_step": 344261, "epoch": 2049} {"train_loss": -11.539592742919922, "global_step": 344262, "epoch": 2049} {"train_loss": -11.55555534362793, "global_step": 344263, "epoch": 2049} {"train_loss": -11.074481010437012, "global_step": 344264, "epoch": 2049} {"train_loss": -11.6156005859375, "global_step": 344265, "epoch": 2049} {"train_loss": -11.517168045043945, "global_step": 344266, "epoch": 2049} {"train_loss": -11.708551406860352, "global_step": 344267, "epoch": 2049} {"train_loss": -11.737590789794922, "global_step": 344268, "epoch": 2049} {"train_loss": -11.689788818359375, "global_step": 344269, "epoch": 2049} {"train_loss": -11.628350257873535, "global_step": 344270, "epoch": 2049} {"train_loss": -11.83517074584961, "global_step": 344271, "epoch": 2049} {"train_loss": -11.844274520874023, "global_step": 344272, "epoch": 2049} {"train_loss": -11.799739837646484, "global_step": 344273, "epoch": 2049} {"train_loss": -12.147013664245605, "global_step": 344274, "epoch": 2049} {"train_loss": -11.834527969360352, "global_step": 344275, "epoch": 2049} {"train_loss": -11.788602828979492, "global_step": 344276, "epoch": 2049} {"train_loss": -12.006681442260742, "global_step": 344277, "epoch": 2049} {"train_loss": -12.023282051086426, "global_step": 344278, "epoch": 2049} {"train_loss": -11.844080924987793, "global_step": 344279, "epoch": 2049} {"train_loss": -12.005471229553223, "global_step": 344280, "epoch": 2049} {"train_loss": -11.980716705322266, "global_step": 344281, "epoch": 2049} {"train_loss": -12.01016616821289, "global_step": 344282, "epoch": 2049} {"train_loss": -11.798042297363281, "global_step": 344283, "epoch": 2049} {"train_loss": -11.84709644317627, "global_step": 344284, "epoch": 2049} {"train_loss": -12.115352630615234, "global_step": 344285, "epoch": 2049} {"train_loss": -11.905685424804688, "global_step": 344286, "epoch": 2049} {"train_loss": -12.302560806274414, "global_step": 344287, "epoch": 2049} {"train_loss": -11.74155330657959, "global_step": 344288, "epoch": 2049} {"train_loss": -11.877725601196289, "global_step": 344289, "epoch": 2049} {"train_loss": -12.215210914611816, "global_step": 344290, "epoch": 2049} {"train_loss": -11.523009300231934, "global_step": 344291, "epoch": 2049} {"train_loss": -12.020610809326172, "global_step": 344292, "epoch": 2049} {"train_loss": -11.954480171203613, "global_step": 344293, "epoch": 2049} {"train_loss": -12.045524597167969, "global_step": 344294, "epoch": 2049} {"train_loss": -12.111016273498535, "global_step": 344295, "epoch": 2049} {"train_loss": -12.006695747375488, "global_step": 344296, "epoch": 2049} {"train_loss": -12.20920181274414, "global_step": 344297, "epoch": 2049} {"train_loss": -12.024709701538086, "global_step": 344298, "epoch": 2049} {"train_loss": -12.175410270690918, "global_step": 344299, "epoch": 2049} {"train_loss": -12.20730209350586, "global_step": 344300, "epoch": 2049} {"train_loss": -12.184789657592773, "global_step": 344301, "epoch": 2049} {"train_loss": -12.098751068115234, "global_step": 344302, "epoch": 2049} {"train_loss": -12.308381080627441, "global_step": 344303, "epoch": 2049} {"train_loss": -11.98991584777832, "global_step": 344304, "epoch": 2049} {"train_loss": -12.07961654663086, "global_step": 344305, "epoch": 2049} {"train_loss": -12.248470306396484, "global_step": 344306, "epoch": 2049} {"train_loss": -12.175164222717285, "global_step": 344307, "epoch": 2049} {"train_loss": -12.257811546325684, "global_step": 344308, "epoch": 2049} {"train_loss": -12.010896682739258, "global_step": 344309, "epoch": 2049} {"train_loss": -12.217187881469727, "global_step": 344310, "epoch": 2049} {"train_loss": -11.912904739379883, "global_step": 344311, "epoch": 2049} {"train_loss": -12.479323387145996, "global_step": 344312, "epoch": 2049} {"train_loss": -11.806840896606445, "global_step": 344313, "epoch": 2049} {"train_loss": -12.050918579101562, "global_step": 344314, "epoch": 2049} {"train_loss": -12.223767280578613, "global_step": 344315, "epoch": 2049} {"train_loss": -12.207447052001953, "global_step": 344316, "epoch": 2049} {"train_loss": -12.240464210510254, "global_step": 344317, "epoch": 2049} {"train_loss": -12.020879745483398, "global_step": 344318, "epoch": 2049} {"train_loss": -12.237187385559082, "global_step": 344319, "epoch": 2049} {"train_loss": -12.067408561706543, "global_step": 344320, "epoch": 2049} {"train_loss": -12.264450073242188, "global_step": 344321, "epoch": 2049} {"train_loss": -12.385223388671875, "global_step": 344322, "epoch": 2049} {"train_loss": -12.317989349365234, "global_step": 344323, "epoch": 2049} {"train_loss": -12.474035263061523, "global_step": 344324, "epoch": 2049} {"train_loss": -12.287372589111328, "global_step": 344325, "epoch": 2049} {"train_loss": -12.399406433105469, "global_step": 344326, "epoch": 2049} {"train_loss": -12.158195495605469, "global_step": 344327, "epoch": 2049} {"train_loss": -12.362882614135742, "global_step": 344328, "epoch": 2049} {"train_loss": -12.291729927062988, "global_step": 344329, "epoch": 2049} {"train_loss": -12.507259368896484, "global_step": 344330, "epoch": 2049} {"train_loss": -12.351850509643555, "global_step": 344331, "epoch": 2049} {"train_loss": -12.623795509338379, "global_step": 344332, "epoch": 2049} {"train_loss": -12.45118522644043, "global_step": 344333, "epoch": 2049} {"train_loss": -12.568885803222656, "global_step": 344334, "epoch": 2049} {"train_loss": -12.572757720947266, "global_step": 344335, "epoch": 2049} {"train_loss": -12.375116348266602, "global_step": 344336, "epoch": 2049} {"train_loss": -12.61264705657959, "global_step": 344337, "epoch": 2049} {"train_loss": -12.240608215332031, "global_step": 344338, "epoch": 2049} {"train_loss": -12.514892578125, "global_step": 344339, "epoch": 2049} {"train_loss": -12.163640022277832, "global_step": 344340, "epoch": 2049} {"train_loss": -12.612672805786133, "global_step": 344341, "epoch": 2049} {"train_loss": -12.283123016357422, "global_step": 344342, "epoch": 2049} {"train_loss": -12.276153564453125, "global_step": 344343, "epoch": 2049} {"train_loss": -12.446640968322754, "global_step": 344344, "epoch": 2049} {"train_loss": -12.184117317199707, "global_step": 344345, "epoch": 2049} {"train_loss": -12.107030868530273, "global_step": 344346, "epoch": 2049} {"train_loss": -12.349180221557617, "global_step": 344347, "epoch": 2049} {"train_loss": -12.509393692016602, "global_step": 344348, "epoch": 2049} {"train_loss": -12.21541976928711, "global_step": 344349, "epoch": 2049} {"train_loss": -12.49610710144043, "global_step": 344350, "epoch": 2049} {"train_loss": -12.488370895385742, "global_step": 344351, "epoch": 2049} {"train_loss": -12.403553009033203, "global_step": 344352, "epoch": 2049} {"train_loss": -12.439329147338867, "global_step": 344353, "epoch": 2049} {"train_loss": -12.203573226928711, "global_step": 344354, "epoch": 2049} {"train_loss": -12.59616470336914, "global_step": 344355, "epoch": 2049} {"train_loss": -12.182470321655273, "global_step": 344356, "epoch": 2049} {"train_loss": -12.393746376037598, "global_step": 344357, "epoch": 2049} {"train_loss": -12.422990798950195, "global_step": 344358, "epoch": 2049} {"train_loss": -12.663158416748047, "global_step": 344359, "epoch": 2049} {"train_loss": -12.480555534362793, "global_step": 344360, "epoch": 2049} {"train_loss": -12.588627815246582, "global_step": 344361, "epoch": 2049} {"train_loss": -12.378036499023438, "global_step": 344362, "epoch": 2049} {"train_loss": -12.422459602355957, "global_step": 344363, "epoch": 2049} {"train_loss": -12.412820816040039, "global_step": 344364, "epoch": 2049} {"train_loss": -12.66220474243164, "global_step": 344365, "epoch": 2049} {"train_loss": -12.739063262939453, "global_step": 344366, "epoch": 2049} {"train_loss": -12.711542129516602, "global_step": 344367, "epoch": 2049} {"train_loss": -12.451407432556152, "global_step": 344368, "epoch": 2049} {"train_loss": -12.460822105407715, "global_step": 344369, "epoch": 2049} {"train_loss": -12.508347511291504, "global_step": 344370, "epoch": 2049} {"train_loss": -12.549949645996094, "global_step": 344371, "epoch": 2049} {"train_loss": -12.624920845031738, "global_step": 344372, "epoch": 2049} {"train_loss": -12.769343376159668, "global_step": 344373, "epoch": 2049} {"train_loss": -12.699872016906738, "global_step": 344374, "epoch": 2049} {"train_loss": -12.684391975402832, "global_step": 344375, "epoch": 2049} {"train_loss": -12.457433700561523, "global_step": 344376, "epoch": 2049} {"train_loss": -12.67066764831543, "global_step": 344377, "epoch": 2049} {"train_loss": -12.40988540649414, "global_step": 344378, "epoch": 2049} {"train_loss": -12.751492500305176, "global_step": 344379, "epoch": 2049} {"train_loss": -12.572270393371582, "global_step": 344380, "epoch": 2049} {"train_loss": -12.541328430175781, "global_step": 344381, "epoch": 2049} {"train_loss": -12.741764068603516, "global_step": 344382, "epoch": 2049} {"train_loss": -12.582416534423828, "global_step": 344383, "epoch": 2049} {"train_loss": -12.482775688171387, "global_step": 344384, "epoch": 2049} {"train_loss": -12.420145988464355, "global_step": 344385, "epoch": 2049} {"train_loss": -12.44261360168457, "global_step": 344386, "epoch": 2049} {"train_loss": -12.558233261108398, "global_step": 344387, "epoch": 2049} {"train_loss": -12.404645919799805, "global_step": 344388, "epoch": 2049} {"train_loss": -12.374856948852539, "global_step": 344389, "epoch": 2049} {"train_loss": -12.209421157836914, "global_step": 344390, "epoch": 2049} {"train_loss": -11.872743606567383, "global_step": 344391, "epoch": 2049} {"train_loss": -12.048738479614258, "global_step": 344392, "epoch": 2049} {"train_loss": -11.99770736694336, "global_step": 344393, "epoch": 2049} {"train_loss": -11.966778755187988, "global_step": 344394, "epoch": 2049} {"train_loss": -12.299253463745117, "global_step": 344395, "epoch": 2049} {"train_loss": -11.307758331298828, "global_step": 344396, "epoch": 2049} {"train_loss": -10.848600387573242, "global_step": 344397, "epoch": 2049} {"train_loss": -10.517820358276367, "global_step": 344398, "epoch": 2049} {"train_loss": -11.822244059471856, "global_step": 344399, "epoch": 2049, "val_loss": 283006.3125} {"train_loss": -9.883100509643555, "global_step": 344400, "epoch": 2050} {"train_loss": -10.192215919494629, "global_step": 344401, "epoch": 2050} {"train_loss": -10.844341278076172, "global_step": 344402, "epoch": 2050} {"train_loss": -8.4445219039917, "global_step": 344403, "epoch": 2050} {"train_loss": -9.375231742858887, "global_step": 344404, "epoch": 2050} {"train_loss": -8.491239547729492, "global_step": 344405, "epoch": 2050} {"train_loss": -9.98811149597168, "global_step": 344406, "epoch": 2050} {"train_loss": -8.606500625610352, "global_step": 344407, "epoch": 2050} {"train_loss": -9.267049789428711, "global_step": 344408, "epoch": 2050} {"train_loss": -10.856948852539062, "global_step": 344409, "epoch": 2050} {"train_loss": -8.192578315734863, "global_step": 344410, "epoch": 2050} {"train_loss": -7.289630889892578, "global_step": 344411, "epoch": 2050} {"train_loss": -9.241795539855957, "global_step": 344412, "epoch": 2050} {"train_loss": -8.258047103881836, "global_step": 344413, "epoch": 2050} {"train_loss": -8.411815643310547, "global_step": 344414, "epoch": 2050} {"train_loss": -10.44330883026123, "global_step": 344415, "epoch": 2050} {"train_loss": -9.292356491088867, "global_step": 344416, "epoch": 2050} {"train_loss": -10.2174072265625, "global_step": 344417, "epoch": 2050} {"train_loss": -9.854528427124023, "global_step": 344418, "epoch": 2050} {"train_loss": -9.620859146118164, "global_step": 344419, "epoch": 2050} {"train_loss": -9.966283798217773, "global_step": 344420, "epoch": 2050} {"train_loss": -10.941612243652344, "global_step": 344421, "epoch": 2050} {"train_loss": -11.23857307434082, "global_step": 344422, "epoch": 2050} {"train_loss": -10.368034362792969, "global_step": 344423, "epoch": 2050} {"train_loss": -11.302661895751953, "global_step": 344424, "epoch": 2050} {"train_loss": -10.579383850097656, "global_step": 344425, "epoch": 2050} {"train_loss": -11.097394943237305, "global_step": 344426, "epoch": 2050} {"train_loss": -10.987394332885742, "global_step": 344427, "epoch": 2050} {"train_loss": -11.857975006103516, "global_step": 344428, "epoch": 2050} {"train_loss": -11.538652420043945, "global_step": 344429, "epoch": 2050} {"train_loss": -11.177000045776367, "global_step": 344430, "epoch": 2050} {"train_loss": -11.182685852050781, "global_step": 344431, "epoch": 2050} {"train_loss": -11.123044967651367, "global_step": 344432, "epoch": 2050} {"train_loss": -11.665770530700684, "global_step": 344433, "epoch": 2050} {"train_loss": -11.39185619354248, "global_step": 344434, "epoch": 2050} {"train_loss": -11.597734451293945, "global_step": 344435, "epoch": 2050} {"train_loss": -11.31955337524414, "global_step": 344436, "epoch": 2050} {"train_loss": -11.770843505859375, "global_step": 344437, "epoch": 2050} {"train_loss": -11.258444786071777, "global_step": 344438, "epoch": 2050} {"train_loss": -12.005217552185059, "global_step": 344439, "epoch": 2050} {"train_loss": -10.661701202392578, "global_step": 344440, "epoch": 2050} {"train_loss": -11.7755126953125, "global_step": 344441, "epoch": 2050} {"train_loss": -11.754886627197266, "global_step": 344442, "epoch": 2050} {"train_loss": -11.20480728149414, "global_step": 344443, "epoch": 2050} {"train_loss": -11.699152946472168, "global_step": 344444, "epoch": 2050} {"train_loss": -11.817560195922852, "global_step": 344445, "epoch": 2050} {"train_loss": -11.806232452392578, "global_step": 344446, "epoch": 2050} {"train_loss": -11.92136001586914, "global_step": 344447, "epoch": 2050} {"train_loss": -12.12026309967041, "global_step": 344448, "epoch": 2050} {"train_loss": -11.639139175415039, "global_step": 344449, "epoch": 2050} {"train_loss": -11.981836318969727, "global_step": 344450, "epoch": 2050} {"train_loss": -11.772470474243164, "global_step": 344451, "epoch": 2050} {"train_loss": -11.776970863342285, "global_step": 344452, "epoch": 2050} {"train_loss": -11.879157066345215, "global_step": 344453, "epoch": 2050} {"train_loss": -12.049653053283691, "global_step": 344454, "epoch": 2050} {"train_loss": -11.785609245300293, "global_step": 344455, "epoch": 2050} {"train_loss": -12.245153427124023, "global_step": 344456, "epoch": 2050} {"train_loss": -11.999387741088867, "global_step": 344457, "epoch": 2050} {"train_loss": -11.992708206176758, "global_step": 344458, "epoch": 2050} {"train_loss": -11.987314224243164, "global_step": 344459, "epoch": 2050} {"train_loss": -12.093012809753418, "global_step": 344460, "epoch": 2050} {"train_loss": -12.271121978759766, "global_step": 344461, "epoch": 2050} {"train_loss": -12.150934219360352, "global_step": 344462, "epoch": 2050} {"train_loss": -11.87095832824707, "global_step": 344463, "epoch": 2050} {"train_loss": -12.258794784545898, "global_step": 344464, "epoch": 2050} {"train_loss": -12.111533164978027, "global_step": 344465, "epoch": 2050} {"train_loss": -12.196807861328125, "global_step": 344466, "epoch": 2050} {"train_loss": -12.241811752319336, "global_step": 344467, "epoch": 2050} {"train_loss": -12.122928619384766, "global_step": 344468, "epoch": 2050} {"train_loss": -12.23953628540039, "global_step": 344469, "epoch": 2050} {"train_loss": -12.229226112365723, "global_step": 344470, "epoch": 2050} {"train_loss": -12.313913345336914, "global_step": 344471, "epoch": 2050} {"train_loss": -11.895576477050781, "global_step": 344472, "epoch": 2050} {"train_loss": -12.32233715057373, "global_step": 344473, "epoch": 2050} {"train_loss": -12.151567459106445, "global_step": 344474, "epoch": 2050} {"train_loss": -12.276195526123047, "global_step": 344475, "epoch": 2050} {"train_loss": -12.3469820022583, "global_step": 344476, "epoch": 2050} {"train_loss": -12.302711486816406, "global_step": 344477, "epoch": 2050} {"train_loss": -12.43284797668457, "global_step": 344478, "epoch": 2050} {"train_loss": -12.546756744384766, "global_step": 344479, "epoch": 2050} {"train_loss": -12.38567066192627, "global_step": 344480, "epoch": 2050} {"train_loss": -12.4410982131958, "global_step": 344481, "epoch": 2050} {"train_loss": -12.402997970581055, "global_step": 344482, "epoch": 2050} {"train_loss": -12.366994857788086, "global_step": 344483, "epoch": 2050} {"train_loss": -12.463871002197266, "global_step": 344484, "epoch": 2050} {"train_loss": -12.330890655517578, "global_step": 344485, "epoch": 2050} {"train_loss": -12.564465522766113, "global_step": 344486, "epoch": 2050} {"train_loss": -12.430572509765625, "global_step": 344487, "epoch": 2050} {"train_loss": -12.364046096801758, "global_step": 344488, "epoch": 2050} {"train_loss": -12.456741333007812, "global_step": 344489, "epoch": 2050} {"train_loss": -12.325399398803711, "global_step": 344490, "epoch": 2050} {"train_loss": -12.493866920471191, "global_step": 344491, "epoch": 2050} {"train_loss": -12.467096328735352, "global_step": 344492, "epoch": 2050} {"train_loss": -12.519918441772461, "global_step": 344493, "epoch": 2050} {"train_loss": -12.575785636901855, "global_step": 344494, "epoch": 2050} {"train_loss": -12.512813568115234, "global_step": 344495, "epoch": 2050} {"train_loss": -12.390801429748535, "global_step": 344496, "epoch": 2050} {"train_loss": -12.576326370239258, "global_step": 344497, "epoch": 2050} {"train_loss": -12.38292407989502, "global_step": 344498, "epoch": 2050} {"train_loss": -12.400887489318848, "global_step": 344499, "epoch": 2050} {"train_loss": -12.545340538024902, "global_step": 344500, "epoch": 2050} {"train_loss": -12.325592041015625, "global_step": 344501, "epoch": 2050} {"train_loss": -12.702926635742188, "global_step": 344502, "epoch": 2050} {"train_loss": -12.627544403076172, "global_step": 344503, "epoch": 2050} {"train_loss": -12.544099807739258, "global_step": 344504, "epoch": 2050} {"train_loss": -12.32480239868164, "global_step": 344505, "epoch": 2050} {"train_loss": -12.552522659301758, "global_step": 344506, "epoch": 2050} {"train_loss": -11.926786422729492, "global_step": 344507, "epoch": 2050} {"train_loss": -12.272445678710938, "global_step": 344508, "epoch": 2050} {"train_loss": -12.397765159606934, "global_step": 344509, "epoch": 2050} {"train_loss": -12.066585540771484, "global_step": 344510, "epoch": 2050} {"train_loss": -12.185730934143066, "global_step": 344511, "epoch": 2050} {"train_loss": -12.324801445007324, "global_step": 344512, "epoch": 2050} {"train_loss": -11.992853164672852, "global_step": 344513, "epoch": 2050} {"train_loss": -12.375455856323242, "global_step": 344514, "epoch": 2050} {"train_loss": -11.12873649597168, "global_step": 344515, "epoch": 2050} {"train_loss": -11.989908218383789, "global_step": 344516, "epoch": 2050} {"train_loss": -12.252981185913086, "global_step": 344517, "epoch": 2050} {"train_loss": -11.58448600769043, "global_step": 344518, "epoch": 2050} {"train_loss": -12.32888412475586, "global_step": 344519, "epoch": 2050} {"train_loss": -12.053287506103516, "global_step": 344520, "epoch": 2050} {"train_loss": -11.996990203857422, "global_step": 344521, "epoch": 2050} {"train_loss": -12.388486862182617, "global_step": 344522, "epoch": 2050} {"train_loss": -11.845059394836426, "global_step": 344523, "epoch": 2050} {"train_loss": -12.286128997802734, "global_step": 344524, "epoch": 2050} {"train_loss": -12.4302339553833, "global_step": 344525, "epoch": 2050} {"train_loss": -11.764955520629883, "global_step": 344526, "epoch": 2050} {"train_loss": -12.205377578735352, "global_step": 344527, "epoch": 2050} {"train_loss": -12.254096984863281, "global_step": 344528, "epoch": 2050} {"train_loss": -11.671256065368652, "global_step": 344529, "epoch": 2050} {"train_loss": -11.991744995117188, "global_step": 344530, "epoch": 2050} {"train_loss": -11.734906196594238, "global_step": 344531, "epoch": 2050} {"train_loss": -11.26821517944336, "global_step": 344532, "epoch": 2050} {"train_loss": -11.832261085510254, "global_step": 344533, "epoch": 2050} {"train_loss": -10.97073745727539, "global_step": 344534, "epoch": 2050} {"train_loss": -11.657356262207031, "global_step": 344535, "epoch": 2050} {"train_loss": -11.663772583007812, "global_step": 344536, "epoch": 2050} {"train_loss": -11.748872756958008, "global_step": 344537, "epoch": 2050} {"train_loss": -11.32396125793457, "global_step": 344538, "epoch": 2050} {"train_loss": -12.034900665283203, "global_step": 344539, "epoch": 2050} {"train_loss": -11.103748321533203, "global_step": 344540, "epoch": 2050} {"train_loss": -10.813396453857422, "global_step": 344541, "epoch": 2050} {"train_loss": -10.66125774383545, "global_step": 344542, "epoch": 2050} {"train_loss": -11.238534927368164, "global_step": 344543, "epoch": 2050} {"train_loss": -7.967869281768799, "global_step": 344544, "epoch": 2050} {"train_loss": -9.692757606506348, "global_step": 344545, "epoch": 2050} {"train_loss": -9.791167259216309, "global_step": 344546, "epoch": 2050} {"train_loss": -9.792625427246094, "global_step": 344547, "epoch": 2050} {"train_loss": -9.378559112548828, "global_step": 344548, "epoch": 2050} {"train_loss": -9.827168464660645, "global_step": 344549, "epoch": 2050} {"train_loss": -9.664673805236816, "global_step": 344550, "epoch": 2050} {"train_loss": -10.032279014587402, "global_step": 344551, "epoch": 2050} {"train_loss": -10.030041694641113, "global_step": 344552, "epoch": 2050} {"train_loss": -8.57725715637207, "global_step": 344553, "epoch": 2050} {"train_loss": -9.788533210754395, "global_step": 344554, "epoch": 2050} {"train_loss": -8.424152374267578, "global_step": 344555, "epoch": 2050} {"train_loss": -10.422504425048828, "global_step": 344556, "epoch": 2050} {"train_loss": -9.207250595092773, "global_step": 344557, "epoch": 2050} {"train_loss": -9.468750953674316, "global_step": 344558, "epoch": 2050} {"train_loss": -9.473236083984375, "global_step": 344559, "epoch": 2050} {"train_loss": -10.506919860839844, "global_step": 344560, "epoch": 2050} {"train_loss": -10.653392791748047, "global_step": 344561, "epoch": 2050} {"train_loss": -10.755537986755371, "global_step": 344562, "epoch": 2050} {"train_loss": -10.799657821655273, "global_step": 344563, "epoch": 2050} {"train_loss": -10.876173973083496, "global_step": 344564, "epoch": 2050} {"train_loss": -10.534889221191406, "global_step": 344565, "epoch": 2050} {"train_loss": -11.17557144165039, "global_step": 344566, "epoch": 2050} {"train_loss": -11.331690762724195, "global_step": 344567, "epoch": 2050, "train/sim_max_reward_0": 0.600075633952269, "train/sim_max_reward_1": 0.978306945678059, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.440369009012871, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.8270871749938578, "test/sim_max_reward_4400000": 0.9983214083290263, "test/sim_max_reward_4400001": 0.40227399248671275, "test/sim_max_reward_4400002": 0.08928661590744709, "test/sim_max_reward_4400003": 0.08401023173289131, "test/sim_max_reward_4400004": 0.4542278852333557, "test/sim_max_reward_4400005": 0.9547997146175103, "test/sim_max_reward_4400006": 0.2883992745888446, "test/sim_max_reward_4400007": 0.5708520672404747, "test/sim_max_reward_4400008": 0.6047347945869626, "test/sim_max_reward_4400009": 0.47988485712976525, "test/sim_max_reward_4400010": 0.9995744888892913, "test/sim_max_reward_4400011": 0.9646040281348661, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 0.9954019928399007, "test/sim_max_reward_4400014": 0.5189651474546596, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.5980797186593864, "test/sim_max_reward_4400019": 0.39908188140235534, "test/sim_max_reward_4400020": 0.3834697997647253, "test/sim_max_reward_4400021": 0.60949421601971, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 1.0, "test/sim_max_reward_4400024": 0.7968515385514947, "test/sim_max_reward_4400025": 0.1741402484129392, "test/sim_max_reward_4400026": 0.5872257400960489, "test/sim_max_reward_4400027": 0.9751163621760203, "test/sim_max_reward_4400028": 0.9525450709721024, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9910065745270153, "test/sim_max_reward_4400031": 0.9738222712476892, "test/sim_max_reward_4400032": 0.9264361851433095, "test/sim_max_reward_4400033": 0.5321678514116237, "test/sim_max_reward_4400034": 0.4841088021674648, "test/sim_max_reward_4400035": 0.9579862922724581, "test/sim_max_reward_4400036": 0.37412753559934764, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.5120107361775725, "test/sim_max_reward_4400039": 0.4117785158303383, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.42808170072654894, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.0, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.40705192062434137, "test/sim_max_reward_4400046": 0.9995689267794937, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6409731272728428, "test/mean_score": 0.5575897677546738, "val_loss": 286704.0625, "train_action_mse_error": 1.816845178604126} {"train_loss": -11.353830337524414, "global_step": 344568, "epoch": 2051} {"train_loss": -11.012104034423828, "global_step": 344569, "epoch": 2051} {"train_loss": -11.574138641357422, "global_step": 344570, "epoch": 2051} {"train_loss": -10.998120307922363, "global_step": 344571, "epoch": 2051} {"train_loss": -11.659196853637695, "global_step": 344572, "epoch": 2051} {"train_loss": -11.420947074890137, "global_step": 344573, "epoch": 2051} {"train_loss": -11.372044563293457, "global_step": 344574, "epoch": 2051} {"train_loss": -11.612873077392578, "global_step": 344575, "epoch": 2051} {"train_loss": -11.607537269592285, "global_step": 344576, "epoch": 2051} {"train_loss": -11.294527053833008, "global_step": 344577, "epoch": 2051} {"train_loss": -11.605499267578125, "global_step": 344578, "epoch": 2051} {"train_loss": -11.740599632263184, "global_step": 344579, "epoch": 2051} {"train_loss": -11.558682441711426, "global_step": 344580, "epoch": 2051} {"train_loss": -11.506363868713379, "global_step": 344581, "epoch": 2051} {"train_loss": -11.659262657165527, "global_step": 344582, "epoch": 2051} {"train_loss": -11.19921875, "global_step": 344583, "epoch": 2051} {"train_loss": -11.930227279663086, "global_step": 344584, "epoch": 2051} {"train_loss": -11.854557991027832, "global_step": 344585, "epoch": 2051} {"train_loss": -11.8253173828125, "global_step": 344586, "epoch": 2051} {"train_loss": -11.98466682434082, "global_step": 344587, "epoch": 2051} {"train_loss": -11.898361206054688, "global_step": 344588, "epoch": 2051} {"train_loss": -11.878857612609863, "global_step": 344589, "epoch": 2051} {"train_loss": -11.930442810058594, "global_step": 344590, "epoch": 2051} {"train_loss": -12.109245300292969, "global_step": 344591, "epoch": 2051} {"train_loss": -12.097941398620605, "global_step": 344592, "epoch": 2051} {"train_loss": -12.035743713378906, "global_step": 344593, "epoch": 2051} {"train_loss": -11.96981430053711, "global_step": 344594, "epoch": 2051} {"train_loss": -12.089432716369629, "global_step": 344595, "epoch": 2051} {"train_loss": -12.170149803161621, "global_step": 344596, "epoch": 2051} {"train_loss": -12.002321243286133, "global_step": 344597, "epoch": 2051} {"train_loss": -12.014063835144043, "global_step": 344598, "epoch": 2051} {"train_loss": -12.124626159667969, "global_step": 344599, "epoch": 2051} {"train_loss": -12.174541473388672, "global_step": 344600, "epoch": 2051} {"train_loss": -12.129411697387695, "global_step": 344601, "epoch": 2051} {"train_loss": -12.148265838623047, "global_step": 344602, "epoch": 2051} {"train_loss": -12.263368606567383, "global_step": 344603, "epoch": 2051} {"train_loss": -12.257705688476562, "global_step": 344604, "epoch": 2051} {"train_loss": -12.215506553649902, "global_step": 344605, "epoch": 2051} {"train_loss": -12.245294570922852, "global_step": 344606, "epoch": 2051} {"train_loss": -12.176959991455078, "global_step": 344607, "epoch": 2051} {"train_loss": -11.804811477661133, "global_step": 344608, "epoch": 2051} {"train_loss": -12.224098205566406, "global_step": 344609, "epoch": 2051} {"train_loss": -12.120901107788086, "global_step": 344610, "epoch": 2051} {"train_loss": -12.030590057373047, "global_step": 344611, "epoch": 2051} {"train_loss": -12.412702560424805, "global_step": 344612, "epoch": 2051} {"train_loss": -12.363964080810547, "global_step": 344613, "epoch": 2051} {"train_loss": -12.23047924041748, "global_step": 344614, "epoch": 2051} {"train_loss": -12.249500274658203, "global_step": 344615, "epoch": 2051} {"train_loss": -12.262785911560059, "global_step": 344616, "epoch": 2051} {"train_loss": -12.31890869140625, "global_step": 344617, "epoch": 2051} {"train_loss": -12.317220687866211, "global_step": 344618, "epoch": 2051} {"train_loss": -12.354129791259766, "global_step": 344619, "epoch": 2051} {"train_loss": -12.39686393737793, "global_step": 344620, "epoch": 2051} {"train_loss": -12.3568115234375, "global_step": 344621, "epoch": 2051} {"train_loss": -12.239860534667969, "global_step": 344622, "epoch": 2051} {"train_loss": -12.240859985351562, "global_step": 344623, "epoch": 2051} {"train_loss": -12.297721862792969, "global_step": 344624, "epoch": 2051} {"train_loss": -12.286216735839844, "global_step": 344625, "epoch": 2051} {"train_loss": -12.180745124816895, "global_step": 344626, "epoch": 2051} {"train_loss": -12.130868911743164, "global_step": 344627, "epoch": 2051} {"train_loss": -12.567462921142578, "global_step": 344628, "epoch": 2051} {"train_loss": -12.28695297241211, "global_step": 344629, "epoch": 2051} {"train_loss": -12.526237487792969, "global_step": 344630, "epoch": 2051} {"train_loss": -12.308690071105957, "global_step": 344631, "epoch": 2051} {"train_loss": -12.593847274780273, "global_step": 344632, "epoch": 2051} {"train_loss": -12.281336784362793, "global_step": 344633, "epoch": 2051} {"train_loss": -12.468927383422852, "global_step": 344634, "epoch": 2051} {"train_loss": -12.247495651245117, "global_step": 344635, "epoch": 2051} {"train_loss": -12.507408142089844, "global_step": 344636, "epoch": 2051} {"train_loss": -12.456733703613281, "global_step": 344637, "epoch": 2051} {"train_loss": -12.348502159118652, "global_step": 344638, "epoch": 2051} {"train_loss": -12.514103889465332, "global_step": 344639, "epoch": 2051} {"train_loss": -12.368193626403809, "global_step": 344640, "epoch": 2051} {"train_loss": -12.433710098266602, "global_step": 344641, "epoch": 2051} {"train_loss": -12.169126510620117, "global_step": 344642, "epoch": 2051} {"train_loss": -12.600967407226562, "global_step": 344643, "epoch": 2051} {"train_loss": -12.223801612854004, "global_step": 344644, "epoch": 2051} {"train_loss": -12.278881072998047, "global_step": 344645, "epoch": 2051} {"train_loss": -12.272186279296875, "global_step": 344646, "epoch": 2051} {"train_loss": -12.441812515258789, "global_step": 344647, "epoch": 2051} {"train_loss": -12.562749862670898, "global_step": 344648, "epoch": 2051} {"train_loss": -12.421743392944336, "global_step": 344649, "epoch": 2051} {"train_loss": -12.327186584472656, "global_step": 344650, "epoch": 2051} {"train_loss": -12.466567993164062, "global_step": 344651, "epoch": 2051} {"train_loss": -12.427492141723633, "global_step": 344652, "epoch": 2051} {"train_loss": -12.473058700561523, "global_step": 344653, "epoch": 2051} {"train_loss": -12.504328727722168, "global_step": 344654, "epoch": 2051} {"train_loss": -12.522761344909668, "global_step": 344655, "epoch": 2051} {"train_loss": -12.399123191833496, "global_step": 344656, "epoch": 2051} {"train_loss": -12.715088844299316, "global_step": 344657, "epoch": 2051} {"train_loss": -12.394021987915039, "global_step": 344658, "epoch": 2051} {"train_loss": -12.507140159606934, "global_step": 344659, "epoch": 2051} {"train_loss": -12.589499473571777, "global_step": 344660, "epoch": 2051} {"train_loss": -12.597525596618652, "global_step": 344661, "epoch": 2051} {"train_loss": -12.571263313293457, "global_step": 344662, "epoch": 2051} {"train_loss": -12.605350494384766, "global_step": 344663, "epoch": 2051} {"train_loss": -12.520285606384277, "global_step": 344664, "epoch": 2051} {"train_loss": -12.533723831176758, "global_step": 344665, "epoch": 2051} {"train_loss": -12.711779594421387, "global_step": 344666, "epoch": 2051} {"train_loss": -12.606559753417969, "global_step": 344667, "epoch": 2051} {"train_loss": -12.49085521697998, "global_step": 344668, "epoch": 2051} {"train_loss": -12.546772003173828, "global_step": 344669, "epoch": 2051} {"train_loss": -12.512051582336426, "global_step": 344670, "epoch": 2051} {"train_loss": -12.737436294555664, "global_step": 344671, "epoch": 2051} {"train_loss": -12.862835884094238, "global_step": 344672, "epoch": 2051} {"train_loss": -12.720856666564941, "global_step": 344673, "epoch": 2051} {"train_loss": -12.565631866455078, "global_step": 344674, "epoch": 2051} {"train_loss": -12.642237663269043, "global_step": 344675, "epoch": 2051} {"train_loss": -12.754807472229004, "global_step": 344676, "epoch": 2051} {"train_loss": -12.359861373901367, "global_step": 344677, "epoch": 2051} {"train_loss": -12.130764961242676, "global_step": 344678, "epoch": 2051} {"train_loss": -11.661914825439453, "global_step": 344679, "epoch": 2051} {"train_loss": -12.175985336303711, "global_step": 344680, "epoch": 2051} {"train_loss": -12.578784942626953, "global_step": 344681, "epoch": 2051} {"train_loss": -11.995911598205566, "global_step": 344682, "epoch": 2051} {"train_loss": -12.33271598815918, "global_step": 344683, "epoch": 2051} {"train_loss": -12.136899948120117, "global_step": 344684, "epoch": 2051} {"train_loss": -12.128487586975098, "global_step": 344685, "epoch": 2051} {"train_loss": -12.436375617980957, "global_step": 344686, "epoch": 2051} {"train_loss": -12.391134262084961, "global_step": 344687, "epoch": 2051} {"train_loss": -12.112348556518555, "global_step": 344688, "epoch": 2051} {"train_loss": -12.150732040405273, "global_step": 344689, "epoch": 2051} {"train_loss": -12.232978820800781, "global_step": 344690, "epoch": 2051} {"train_loss": -11.889556884765625, "global_step": 344691, "epoch": 2051} {"train_loss": -12.245401382446289, "global_step": 344692, "epoch": 2051} {"train_loss": -11.377634048461914, "global_step": 344693, "epoch": 2051} {"train_loss": -12.105913162231445, "global_step": 344694, "epoch": 2051} {"train_loss": -12.568902015686035, "global_step": 344695, "epoch": 2051} {"train_loss": -12.411789894104004, "global_step": 344696, "epoch": 2051} {"train_loss": -12.050276756286621, "global_step": 344697, "epoch": 2051} {"train_loss": -11.961329460144043, "global_step": 344698, "epoch": 2051} {"train_loss": -12.645913124084473, "global_step": 344699, "epoch": 2051} {"train_loss": -11.026988983154297, "global_step": 344700, "epoch": 2051} {"train_loss": -10.175086975097656, "global_step": 344701, "epoch": 2051} {"train_loss": -12.198603630065918, "global_step": 344702, "epoch": 2051} {"train_loss": -10.606443405151367, "global_step": 344703, "epoch": 2051} {"train_loss": -9.236539840698242, "global_step": 344704, "epoch": 2051} {"train_loss": -12.162996292114258, "global_step": 344705, "epoch": 2051} {"train_loss": -9.592245101928711, "global_step": 344706, "epoch": 2051} {"train_loss": -11.271492958068848, "global_step": 344707, "epoch": 2051} {"train_loss": -11.438562393188477, "global_step": 344708, "epoch": 2051} {"train_loss": -11.14765739440918, "global_step": 344709, "epoch": 2051} {"train_loss": -11.686142921447754, "global_step": 344710, "epoch": 2051} {"train_loss": -10.491344451904297, "global_step": 344711, "epoch": 2051} {"train_loss": -10.861074447631836, "global_step": 344712, "epoch": 2051} {"train_loss": -11.141546249389648, "global_step": 344713, "epoch": 2051} {"train_loss": -11.727240562438965, "global_step": 344714, "epoch": 2051} {"train_loss": -10.760330200195312, "global_step": 344715, "epoch": 2051} {"train_loss": -10.943288803100586, "global_step": 344716, "epoch": 2051} {"train_loss": -10.194565773010254, "global_step": 344717, "epoch": 2051} {"train_loss": -10.777166366577148, "global_step": 344718, "epoch": 2051} {"train_loss": -10.46027946472168, "global_step": 344719, "epoch": 2051} {"train_loss": -11.355030059814453, "global_step": 344720, "epoch": 2051} {"train_loss": -10.53471851348877, "global_step": 344721, "epoch": 2051} {"train_loss": -10.947803497314453, "global_step": 344722, "epoch": 2051} {"train_loss": -11.053563117980957, "global_step": 344723, "epoch": 2051} {"train_loss": -10.28053092956543, "global_step": 344724, "epoch": 2051} {"train_loss": -12.227397918701172, "global_step": 344725, "epoch": 2051} {"train_loss": -10.689126968383789, "global_step": 344726, "epoch": 2051} {"train_loss": -11.676252365112305, "global_step": 344727, "epoch": 2051} {"train_loss": -11.533674240112305, "global_step": 344728, "epoch": 2051} {"train_loss": -11.289291381835938, "global_step": 344729, "epoch": 2051} {"train_loss": -11.478377342224121, "global_step": 344730, "epoch": 2051} {"train_loss": -11.252337455749512, "global_step": 344731, "epoch": 2051} {"train_loss": -11.339509963989258, "global_step": 344732, "epoch": 2051} {"train_loss": -12.03891658782959, "global_step": 344733, "epoch": 2051} {"train_loss": -11.022123336791992, "global_step": 344734, "epoch": 2051} {"train_loss": -11.954258827936082, "global_step": 344735, "epoch": 2051, "val_loss": 285270.03125} {"train_loss": -10.639881134033203, "global_step": 344736, "epoch": 2052} {"train_loss": -11.485745429992676, "global_step": 344737, "epoch": 2052} {"train_loss": -11.591096878051758, "global_step": 344738, "epoch": 2052} {"train_loss": -10.433839797973633, "global_step": 344739, "epoch": 2052} {"train_loss": -11.214584350585938, "global_step": 344740, "epoch": 2052} {"train_loss": -11.036625862121582, "global_step": 344741, "epoch": 2052} {"train_loss": -10.54981517791748, "global_step": 344742, "epoch": 2052} {"train_loss": -11.319676399230957, "global_step": 344743, "epoch": 2052} {"train_loss": -11.056314468383789, "global_step": 344744, "epoch": 2052} {"train_loss": -9.870450019836426, "global_step": 344745, "epoch": 2052} {"train_loss": -11.42666244506836, "global_step": 344746, "epoch": 2052} {"train_loss": -10.894159317016602, "global_step": 344747, "epoch": 2052} {"train_loss": -10.614564895629883, "global_step": 344748, "epoch": 2052} {"train_loss": -11.369481086730957, "global_step": 344749, "epoch": 2052} {"train_loss": -10.749220848083496, "global_step": 344750, "epoch": 2052} {"train_loss": -11.334741592407227, "global_step": 344751, "epoch": 2052} {"train_loss": -10.891548156738281, "global_step": 344752, "epoch": 2052} {"train_loss": -11.14630126953125, "global_step": 344753, "epoch": 2052} {"train_loss": -11.841619491577148, "global_step": 344754, "epoch": 2052} {"train_loss": -11.62948989868164, "global_step": 344755, "epoch": 2052} {"train_loss": -11.520405769348145, "global_step": 344756, "epoch": 2052} {"train_loss": -11.38770866394043, "global_step": 344757, "epoch": 2052} {"train_loss": -11.658936500549316, "global_step": 344758, "epoch": 2052} {"train_loss": -11.055315017700195, "global_step": 344759, "epoch": 2052} {"train_loss": -11.631391525268555, "global_step": 344760, "epoch": 2052} {"train_loss": -11.686674118041992, "global_step": 344761, "epoch": 2052} {"train_loss": -10.987558364868164, "global_step": 344762, "epoch": 2052} {"train_loss": -11.867253303527832, "global_step": 344763, "epoch": 2052} {"train_loss": -10.979469299316406, "global_step": 344764, "epoch": 2052} {"train_loss": -11.521614074707031, "global_step": 344765, "epoch": 2052} {"train_loss": -11.362646102905273, "global_step": 344766, "epoch": 2052} {"train_loss": -11.585294723510742, "global_step": 344767, "epoch": 2052} {"train_loss": -11.520807266235352, "global_step": 344768, "epoch": 2052} {"train_loss": -11.143791198730469, "global_step": 344769, "epoch": 2052} {"train_loss": -11.308006286621094, "global_step": 344770, "epoch": 2052} {"train_loss": -11.123668670654297, "global_step": 344771, "epoch": 2052} {"train_loss": -11.426108360290527, "global_step": 344772, "epoch": 2052} {"train_loss": -11.696756362915039, "global_step": 344773, "epoch": 2052} {"train_loss": -11.531280517578125, "global_step": 344774, "epoch": 2052} {"train_loss": -11.73080825805664, "global_step": 344775, "epoch": 2052} {"train_loss": -11.384319305419922, "global_step": 344776, "epoch": 2052} {"train_loss": -11.995780944824219, "global_step": 344777, "epoch": 2052} {"train_loss": -11.77598762512207, "global_step": 344778, "epoch": 2052} {"train_loss": -11.679862976074219, "global_step": 344779, "epoch": 2052} {"train_loss": -12.104646682739258, "global_step": 344780, "epoch": 2052} {"train_loss": -11.983362197875977, "global_step": 344781, "epoch": 2052} {"train_loss": -12.143108367919922, "global_step": 344782, "epoch": 2052} {"train_loss": -11.824411392211914, "global_step": 344783, "epoch": 2052} {"train_loss": -12.206936836242676, "global_step": 344784, "epoch": 2052} {"train_loss": -11.619491577148438, "global_step": 344785, "epoch": 2052} {"train_loss": -11.997308731079102, "global_step": 344786, "epoch": 2052} {"train_loss": -11.693990707397461, "global_step": 344787, "epoch": 2052} {"train_loss": -11.942890167236328, "global_step": 344788, "epoch": 2052} {"train_loss": -11.809850692749023, "global_step": 344789, "epoch": 2052} {"train_loss": -11.955883979797363, "global_step": 344790, "epoch": 2052} {"train_loss": -11.629598617553711, "global_step": 344791, "epoch": 2052} {"train_loss": -11.925642013549805, "global_step": 344792, "epoch": 2052} {"train_loss": -12.0750732421875, "global_step": 344793, "epoch": 2052} {"train_loss": -11.704992294311523, "global_step": 344794, "epoch": 2052} {"train_loss": -12.221409797668457, "global_step": 344795, "epoch": 2052} {"train_loss": -11.84605598449707, "global_step": 344796, "epoch": 2052} {"train_loss": -12.136677742004395, "global_step": 344797, "epoch": 2052} {"train_loss": -11.821416854858398, "global_step": 344798, "epoch": 2052} {"train_loss": -12.065582275390625, "global_step": 344799, "epoch": 2052} {"train_loss": -12.004613876342773, "global_step": 344800, "epoch": 2052} {"train_loss": -12.284599304199219, "global_step": 344801, "epoch": 2052} {"train_loss": -11.979267120361328, "global_step": 344802, "epoch": 2052} {"train_loss": -12.402396202087402, "global_step": 344803, "epoch": 2052} {"train_loss": -11.958789825439453, "global_step": 344804, "epoch": 2052} {"train_loss": -12.370355606079102, "global_step": 344805, "epoch": 2052} {"train_loss": -11.83863639831543, "global_step": 344806, "epoch": 2052} {"train_loss": -12.099203109741211, "global_step": 344807, "epoch": 2052} {"train_loss": -12.144807815551758, "global_step": 344808, "epoch": 2052} {"train_loss": -12.349666595458984, "global_step": 344809, "epoch": 2052} {"train_loss": -12.261399269104004, "global_step": 344810, "epoch": 2052} {"train_loss": -12.138145446777344, "global_step": 344811, "epoch": 2052} {"train_loss": -12.485518455505371, "global_step": 344812, "epoch": 2052} {"train_loss": -12.300517082214355, "global_step": 344813, "epoch": 2052} {"train_loss": -12.425925254821777, "global_step": 344814, "epoch": 2052} {"train_loss": -12.376294136047363, "global_step": 344815, "epoch": 2052} {"train_loss": -12.453947067260742, "global_step": 344816, "epoch": 2052} {"train_loss": -12.150662422180176, "global_step": 344817, "epoch": 2052} {"train_loss": -12.364791870117188, "global_step": 344818, "epoch": 2052} {"train_loss": -12.393720626831055, "global_step": 344819, "epoch": 2052} {"train_loss": -12.552130699157715, "global_step": 344820, "epoch": 2052} {"train_loss": -12.349306106567383, "global_step": 344821, "epoch": 2052} {"train_loss": -12.443595886230469, "global_step": 344822, "epoch": 2052} {"train_loss": -12.408066749572754, "global_step": 344823, "epoch": 2052} {"train_loss": -12.478599548339844, "global_step": 344824, "epoch": 2052} {"train_loss": -12.48069953918457, "global_step": 344825, "epoch": 2052} {"train_loss": -11.997156143188477, "global_step": 344826, "epoch": 2052} {"train_loss": -12.430543899536133, "global_step": 344827, "epoch": 2052} {"train_loss": -12.41524600982666, "global_step": 344828, "epoch": 2052} {"train_loss": -12.49618148803711, "global_step": 344829, "epoch": 2052} {"train_loss": -12.580397605895996, "global_step": 344830, "epoch": 2052} {"train_loss": -12.408021926879883, "global_step": 344831, "epoch": 2052} {"train_loss": -12.568472862243652, "global_step": 344832, "epoch": 2052} {"train_loss": -12.463046073913574, "global_step": 344833, "epoch": 2052} {"train_loss": -12.203660011291504, "global_step": 344834, "epoch": 2052} {"train_loss": -12.579514503479004, "global_step": 344835, "epoch": 2052} {"train_loss": -12.702970504760742, "global_step": 344836, "epoch": 2052} {"train_loss": -12.737066268920898, "global_step": 344837, "epoch": 2052} {"train_loss": -12.584875106811523, "global_step": 344838, "epoch": 2052} {"train_loss": -12.399301528930664, "global_step": 344839, "epoch": 2052} {"train_loss": -12.609911918640137, "global_step": 344840, "epoch": 2052} {"train_loss": -12.279641151428223, "global_step": 344841, "epoch": 2052} {"train_loss": -12.388984680175781, "global_step": 344842, "epoch": 2052} {"train_loss": -12.410205841064453, "global_step": 344843, "epoch": 2052} {"train_loss": -12.50130844116211, "global_step": 344844, "epoch": 2052} {"train_loss": -12.562662124633789, "global_step": 344845, "epoch": 2052} {"train_loss": -12.285650253295898, "global_step": 344846, "epoch": 2052} {"train_loss": -12.449831008911133, "global_step": 344847, "epoch": 2052} {"train_loss": -12.345898628234863, "global_step": 344848, "epoch": 2052} {"train_loss": -12.673974990844727, "global_step": 344849, "epoch": 2052} {"train_loss": -12.693229675292969, "global_step": 344850, "epoch": 2052} {"train_loss": -12.562885284423828, "global_step": 344851, "epoch": 2052} {"train_loss": -12.575230598449707, "global_step": 344852, "epoch": 2052} {"train_loss": -12.352704048156738, "global_step": 344853, "epoch": 2052} {"train_loss": -12.685873985290527, "global_step": 344854, "epoch": 2052} {"train_loss": -12.608817100524902, "global_step": 344855, "epoch": 2052} {"train_loss": -12.217440605163574, "global_step": 344856, "epoch": 2052} {"train_loss": -12.563410758972168, "global_step": 344857, "epoch": 2052} {"train_loss": -12.698715209960938, "global_step": 344858, "epoch": 2052} {"train_loss": -12.533137321472168, "global_step": 344859, "epoch": 2052} {"train_loss": -12.494315147399902, "global_step": 344860, "epoch": 2052} {"train_loss": -12.573149681091309, "global_step": 344861, "epoch": 2052} {"train_loss": -12.922264099121094, "global_step": 344862, "epoch": 2052} {"train_loss": -12.36846923828125, "global_step": 344863, "epoch": 2052} {"train_loss": -12.762568473815918, "global_step": 344864, "epoch": 2052} {"train_loss": -12.703156471252441, "global_step": 344865, "epoch": 2052} {"train_loss": -12.574237823486328, "global_step": 344866, "epoch": 2052} {"train_loss": -12.48609733581543, "global_step": 344867, "epoch": 2052} {"train_loss": -12.654462814331055, "global_step": 344868, "epoch": 2052} {"train_loss": -12.553081512451172, "global_step": 344869, "epoch": 2052} {"train_loss": -11.487142562866211, "global_step": 344870, "epoch": 2052} {"train_loss": -10.170211791992188, "global_step": 344871, "epoch": 2052} {"train_loss": -12.752042770385742, "global_step": 344872, "epoch": 2052} {"train_loss": -9.35086441040039, "global_step": 344873, "epoch": 2052} {"train_loss": -10.759714126586914, "global_step": 344874, "epoch": 2052} {"train_loss": -12.072912216186523, "global_step": 344875, "epoch": 2052} {"train_loss": -8.457809448242188, "global_step": 344876, "epoch": 2052} {"train_loss": -7.900054931640625, "global_step": 344877, "epoch": 2052} {"train_loss": -6.830174446105957, "global_step": 344878, "epoch": 2052} {"train_loss": -6.75046968460083, "global_step": 344879, "epoch": 2052} {"train_loss": -7.625617027282715, "global_step": 344880, "epoch": 2052} {"train_loss": -6.9746856689453125, "global_step": 344881, "epoch": 2052} {"train_loss": -7.650367736816406, "global_step": 344882, "epoch": 2052} {"train_loss": -8.03533935546875, "global_step": 344883, "epoch": 2052} {"train_loss": -7.813725471496582, "global_step": 344884, "epoch": 2052} {"train_loss": -7.84970235824585, "global_step": 344885, "epoch": 2052} {"train_loss": -8.003555297851562, "global_step": 344886, "epoch": 2052} {"train_loss": -8.543493270874023, "global_step": 344887, "epoch": 2052} {"train_loss": -8.872310638427734, "global_step": 344888, "epoch": 2052} {"train_loss": -8.449860572814941, "global_step": 344889, "epoch": 2052} {"train_loss": -8.75235366821289, "global_step": 344890, "epoch": 2052} {"train_loss": -8.362715721130371, "global_step": 344891, "epoch": 2052} {"train_loss": -8.381797790527344, "global_step": 344892, "epoch": 2052} {"train_loss": -9.266414642333984, "global_step": 344893, "epoch": 2052} {"train_loss": -9.471031188964844, "global_step": 344894, "epoch": 2052} {"train_loss": -9.376409530639648, "global_step": 344895, "epoch": 2052} {"train_loss": -10.001060485839844, "global_step": 344896, "epoch": 2052} {"train_loss": -10.203704833984375, "global_step": 344897, "epoch": 2052} {"train_loss": -10.424239158630371, "global_step": 344898, "epoch": 2052} {"train_loss": -10.047639846801758, "global_step": 344899, "epoch": 2052} {"train_loss": -10.479219436645508, "global_step": 344900, "epoch": 2052} {"train_loss": -10.383502960205078, "global_step": 344901, "epoch": 2052} {"train_loss": -10.428689002990723, "global_step": 344902, "epoch": 2052} {"train_loss": -11.422048563048953, "global_step": 344903, "epoch": 2052, "val_loss": 285281.46875} {"train_loss": -10.692771911621094, "global_step": 344904, "epoch": 2053} {"train_loss": -10.515155792236328, "global_step": 344905, "epoch": 2053} {"train_loss": -9.969173431396484, "global_step": 344906, "epoch": 2053} {"train_loss": -11.372509002685547, "global_step": 344907, "epoch": 2053} {"train_loss": -9.834196090698242, "global_step": 344908, "epoch": 2053} {"train_loss": -10.28363037109375, "global_step": 344909, "epoch": 2053} {"train_loss": -11.138814926147461, "global_step": 344910, "epoch": 2053} {"train_loss": -10.516063690185547, "global_step": 344911, "epoch": 2053} {"train_loss": -11.375062942504883, "global_step": 344912, "epoch": 2053} {"train_loss": -11.107025146484375, "global_step": 344913, "epoch": 2053} {"train_loss": -11.554643630981445, "global_step": 344914, "epoch": 2053} {"train_loss": -11.001809120178223, "global_step": 344915, "epoch": 2053} {"train_loss": -11.070196151733398, "global_step": 344916, "epoch": 2053} {"train_loss": -11.042560577392578, "global_step": 344917, "epoch": 2053} {"train_loss": -11.841181755065918, "global_step": 344918, "epoch": 2053} {"train_loss": -10.991730690002441, "global_step": 344919, "epoch": 2053} {"train_loss": -11.243146896362305, "global_step": 344920, "epoch": 2053} {"train_loss": -11.29350471496582, "global_step": 344921, "epoch": 2053} {"train_loss": -11.304790496826172, "global_step": 344922, "epoch": 2053} {"train_loss": -11.367706298828125, "global_step": 344923, "epoch": 2053} {"train_loss": -11.733329772949219, "global_step": 344924, "epoch": 2053} {"train_loss": -11.539628982543945, "global_step": 344925, "epoch": 2053} {"train_loss": -11.713451385498047, "global_step": 344926, "epoch": 2053} {"train_loss": -11.608451843261719, "global_step": 344927, "epoch": 2053} {"train_loss": -11.381284713745117, "global_step": 344928, "epoch": 2053} {"train_loss": -12.088892936706543, "global_step": 344929, "epoch": 2053} {"train_loss": -11.649202346801758, "global_step": 344930, "epoch": 2053} {"train_loss": -11.752723693847656, "global_step": 344931, "epoch": 2053} {"train_loss": -12.017364501953125, "global_step": 344932, "epoch": 2053} {"train_loss": -11.565299987792969, "global_step": 344933, "epoch": 2053} {"train_loss": -12.100545883178711, "global_step": 344934, "epoch": 2053} {"train_loss": -12.238235473632812, "global_step": 344935, "epoch": 2053} {"train_loss": -11.888425827026367, "global_step": 344936, "epoch": 2053} {"train_loss": -11.633415222167969, "global_step": 344937, "epoch": 2053} {"train_loss": -11.753837585449219, "global_step": 344938, "epoch": 2053} {"train_loss": -11.6409912109375, "global_step": 344939, "epoch": 2053} {"train_loss": -12.089765548706055, "global_step": 344940, "epoch": 2053} {"train_loss": -11.60435676574707, "global_step": 344941, "epoch": 2053} {"train_loss": -11.84968090057373, "global_step": 344942, "epoch": 2053} {"train_loss": -11.805032730102539, "global_step": 344943, "epoch": 2053} {"train_loss": -12.090484619140625, "global_step": 344944, "epoch": 2053} {"train_loss": -11.984833717346191, "global_step": 344945, "epoch": 2053} {"train_loss": -12.417531967163086, "global_step": 344946, "epoch": 2053} {"train_loss": -11.935176849365234, "global_step": 344947, "epoch": 2053} {"train_loss": -12.078522682189941, "global_step": 344948, "epoch": 2053} {"train_loss": -12.009051322937012, "global_step": 344949, "epoch": 2053} {"train_loss": -12.131400108337402, "global_step": 344950, "epoch": 2053} {"train_loss": -12.136211395263672, "global_step": 344951, "epoch": 2053} {"train_loss": -12.153924942016602, "global_step": 344952, "epoch": 2053} {"train_loss": -12.034669876098633, "global_step": 344953, "epoch": 2053} {"train_loss": -12.295907974243164, "global_step": 344954, "epoch": 2053} {"train_loss": -12.247440338134766, "global_step": 344955, "epoch": 2053} {"train_loss": -12.236272811889648, "global_step": 344956, "epoch": 2053} {"train_loss": -12.061169624328613, "global_step": 344957, "epoch": 2053} {"train_loss": -12.099321365356445, "global_step": 344958, "epoch": 2053} {"train_loss": -12.117034912109375, "global_step": 344959, "epoch": 2053} {"train_loss": -12.244545936584473, "global_step": 344960, "epoch": 2053} {"train_loss": -11.71831226348877, "global_step": 344961, "epoch": 2053} {"train_loss": -12.16408920288086, "global_step": 344962, "epoch": 2053} {"train_loss": -12.141666412353516, "global_step": 344963, "epoch": 2053} {"train_loss": -12.165103912353516, "global_step": 344964, "epoch": 2053} {"train_loss": -11.974466323852539, "global_step": 344965, "epoch": 2053} {"train_loss": -12.268646240234375, "global_step": 344966, "epoch": 2053} {"train_loss": -11.939641952514648, "global_step": 344967, "epoch": 2053} {"train_loss": -11.908193588256836, "global_step": 344968, "epoch": 2053} {"train_loss": -11.862264633178711, "global_step": 344969, "epoch": 2053} {"train_loss": -12.320640563964844, "global_step": 344970, "epoch": 2053} {"train_loss": -11.900150299072266, "global_step": 344971, "epoch": 2053} {"train_loss": -12.417891502380371, "global_step": 344972, "epoch": 2053} {"train_loss": -12.076000213623047, "global_step": 344973, "epoch": 2053} {"train_loss": -12.01690673828125, "global_step": 344974, "epoch": 2053} {"train_loss": -12.378207206726074, "global_step": 344975, "epoch": 2053} {"train_loss": -12.34821605682373, "global_step": 344976, "epoch": 2053} {"train_loss": -12.196844100952148, "global_step": 344977, "epoch": 2053} {"train_loss": -12.313421249389648, "global_step": 344978, "epoch": 2053} {"train_loss": -11.999553680419922, "global_step": 344979, "epoch": 2053} {"train_loss": -12.41571044921875, "global_step": 344980, "epoch": 2053} {"train_loss": -12.047833442687988, "global_step": 344981, "epoch": 2053} {"train_loss": -12.02054214477539, "global_step": 344982, "epoch": 2053} {"train_loss": -12.193429946899414, "global_step": 344983, "epoch": 2053} {"train_loss": -12.127235412597656, "global_step": 344984, "epoch": 2053} {"train_loss": -12.39141845703125, "global_step": 344985, "epoch": 2053} {"train_loss": -12.031990051269531, "global_step": 344986, "epoch": 2053} {"train_loss": -12.326258659362793, "global_step": 344987, "epoch": 2053} {"train_loss": -12.310155868530273, "global_step": 344988, "epoch": 2053} {"train_loss": -12.153185844421387, "global_step": 344989, "epoch": 2053} {"train_loss": -12.13957405090332, "global_step": 344990, "epoch": 2053} {"train_loss": -12.521610260009766, "global_step": 344991, "epoch": 2053} {"train_loss": -12.186811447143555, "global_step": 344992, "epoch": 2053} {"train_loss": -12.32750415802002, "global_step": 344993, "epoch": 2053} {"train_loss": -12.05445671081543, "global_step": 344994, "epoch": 2053} {"train_loss": -12.35346794128418, "global_step": 344995, "epoch": 2053} {"train_loss": -12.285651206970215, "global_step": 344996, "epoch": 2053} {"train_loss": -12.631118774414062, "global_step": 344997, "epoch": 2053} {"train_loss": -12.167620658874512, "global_step": 344998, "epoch": 2053} {"train_loss": -12.485542297363281, "global_step": 344999, "epoch": 2053} {"train_loss": -12.620986938476562, "global_step": 345000, "epoch": 2053} {"train_loss": -12.428407669067383, "global_step": 345001, "epoch": 2053} {"train_loss": -12.323486328125, "global_step": 345002, "epoch": 2053} {"train_loss": -12.520246505737305, "global_step": 345003, "epoch": 2053} {"train_loss": -12.471302032470703, "global_step": 345004, "epoch": 2053} {"train_loss": -12.207963943481445, "global_step": 345005, "epoch": 2053} {"train_loss": -12.50210952758789, "global_step": 345006, "epoch": 2053} {"train_loss": -12.246439933776855, "global_step": 345007, "epoch": 2053} {"train_loss": -12.253425598144531, "global_step": 345008, "epoch": 2053} {"train_loss": -12.09209156036377, "global_step": 345009, "epoch": 2053} {"train_loss": -12.073636054992676, "global_step": 345010, "epoch": 2053} {"train_loss": -12.430700302124023, "global_step": 345011, "epoch": 2053} {"train_loss": -12.217973709106445, "global_step": 345012, "epoch": 2053} {"train_loss": -12.77730941772461, "global_step": 345013, "epoch": 2053} {"train_loss": -12.154412269592285, "global_step": 345014, "epoch": 2053} {"train_loss": -12.599811553955078, "global_step": 345015, "epoch": 2053} {"train_loss": -12.417410850524902, "global_step": 345016, "epoch": 2053} {"train_loss": -12.511178016662598, "global_step": 345017, "epoch": 2053} {"train_loss": -11.960411071777344, "global_step": 345018, "epoch": 2053} {"train_loss": -12.161405563354492, "global_step": 345019, "epoch": 2053} {"train_loss": -12.623842239379883, "global_step": 345020, "epoch": 2053} {"train_loss": -12.56458854675293, "global_step": 345021, "epoch": 2053} {"train_loss": -12.0844087600708, "global_step": 345022, "epoch": 2053} {"train_loss": -11.360576629638672, "global_step": 345023, "epoch": 2053} {"train_loss": -12.227714538574219, "global_step": 345024, "epoch": 2053} {"train_loss": -12.320079803466797, "global_step": 345025, "epoch": 2053} {"train_loss": -12.317137718200684, "global_step": 345026, "epoch": 2053} {"train_loss": -11.705399513244629, "global_step": 345027, "epoch": 2053} {"train_loss": -11.823741912841797, "global_step": 345028, "epoch": 2053} {"train_loss": -11.533300399780273, "global_step": 345029, "epoch": 2053} {"train_loss": -11.76338005065918, "global_step": 345030, "epoch": 2053} {"train_loss": -11.920833587646484, "global_step": 345031, "epoch": 2053} {"train_loss": -9.681480407714844, "global_step": 345032, "epoch": 2053} {"train_loss": -10.87983512878418, "global_step": 345033, "epoch": 2053} {"train_loss": -10.4599027633667, "global_step": 345034, "epoch": 2053} {"train_loss": -10.232868194580078, "global_step": 345035, "epoch": 2053} {"train_loss": -10.089741706848145, "global_step": 345036, "epoch": 2053} {"train_loss": -8.692811012268066, "global_step": 345037, "epoch": 2053} {"train_loss": -8.546791076660156, "global_step": 345038, "epoch": 2053} {"train_loss": -8.699249267578125, "global_step": 345039, "epoch": 2053} {"train_loss": -8.463274002075195, "global_step": 345040, "epoch": 2053} {"train_loss": -9.585906982421875, "global_step": 345041, "epoch": 2053} {"train_loss": -10.182072639465332, "global_step": 345042, "epoch": 2053} {"train_loss": -9.669321060180664, "global_step": 345043, "epoch": 2053} {"train_loss": -8.75233268737793, "global_step": 345044, "epoch": 2053} {"train_loss": -10.997275352478027, "global_step": 345045, "epoch": 2053} {"train_loss": -10.458515167236328, "global_step": 345046, "epoch": 2053} {"train_loss": -10.235573768615723, "global_step": 345047, "epoch": 2053} {"train_loss": -11.14303970336914, "global_step": 345048, "epoch": 2053} {"train_loss": -10.408029556274414, "global_step": 345049, "epoch": 2053} {"train_loss": -11.578348159790039, "global_step": 345050, "epoch": 2053} {"train_loss": -10.41043472290039, "global_step": 345051, "epoch": 2053} {"train_loss": -11.292019844055176, "global_step": 345052, "epoch": 2053} {"train_loss": -10.579338073730469, "global_step": 345053, "epoch": 2053} {"train_loss": -10.960140228271484, "global_step": 345054, "epoch": 2053} {"train_loss": -10.641132354736328, "global_step": 345055, "epoch": 2053} {"train_loss": -11.56039810180664, "global_step": 345056, "epoch": 2053} {"train_loss": -10.607219696044922, "global_step": 345057, "epoch": 2053} {"train_loss": -11.254402160644531, "global_step": 345058, "epoch": 2053} {"train_loss": -10.76675033569336, "global_step": 345059, "epoch": 2053} {"train_loss": -11.049381256103516, "global_step": 345060, "epoch": 2053} {"train_loss": -11.226696014404297, "global_step": 345061, "epoch": 2053} {"train_loss": -9.192556381225586, "global_step": 345062, "epoch": 2053} {"train_loss": -10.80610179901123, "global_step": 345063, "epoch": 2053} {"train_loss": -9.341606140136719, "global_step": 345064, "epoch": 2053} {"train_loss": -10.728992462158203, "global_step": 345065, "epoch": 2053} {"train_loss": -10.000625610351562, "global_step": 345066, "epoch": 2053} {"train_loss": -9.49898624420166, "global_step": 345067, "epoch": 2053} {"train_loss": -10.537662506103516, "global_step": 345068, "epoch": 2053} {"train_loss": -10.40239429473877, "global_step": 345069, "epoch": 2053} {"train_loss": -10.111749649047852, "global_step": 345070, "epoch": 2053} {"train_loss": -11.5325345993042, "global_step": 345071, "epoch": 2053, "val_loss": 283394.71875} {"train_loss": -10.63255786895752, "global_step": 345072, "epoch": 2054} {"train_loss": -10.545653343200684, "global_step": 345073, "epoch": 2054} {"train_loss": -11.53536605834961, "global_step": 345074, "epoch": 2054} {"train_loss": -10.754631042480469, "global_step": 345075, "epoch": 2054} {"train_loss": -11.347137451171875, "global_step": 345076, "epoch": 2054} {"train_loss": -10.438478469848633, "global_step": 345077, "epoch": 2054} {"train_loss": -11.773584365844727, "global_step": 345078, "epoch": 2054} {"train_loss": -11.150412559509277, "global_step": 345079, "epoch": 2054} {"train_loss": -11.81734848022461, "global_step": 345080, "epoch": 2054} {"train_loss": -11.655393600463867, "global_step": 345081, "epoch": 2054} {"train_loss": -11.253108978271484, "global_step": 345082, "epoch": 2054} {"train_loss": -12.058664321899414, "global_step": 345083, "epoch": 2054} {"train_loss": -11.426948547363281, "global_step": 345084, "epoch": 2054} {"train_loss": -11.579206466674805, "global_step": 345085, "epoch": 2054} {"train_loss": -11.564610481262207, "global_step": 345086, "epoch": 2054} {"train_loss": -11.521041870117188, "global_step": 345087, "epoch": 2054} {"train_loss": -11.959543228149414, "global_step": 345088, "epoch": 2054} {"train_loss": -11.517887115478516, "global_step": 345089, "epoch": 2054} {"train_loss": -11.927436828613281, "global_step": 345090, "epoch": 2054} {"train_loss": -11.641439437866211, "global_step": 345091, "epoch": 2054} {"train_loss": -11.715301513671875, "global_step": 345092, "epoch": 2054} {"train_loss": -11.812007904052734, "global_step": 345093, "epoch": 2054} {"train_loss": -11.847297668457031, "global_step": 345094, "epoch": 2054} {"train_loss": -11.71628189086914, "global_step": 345095, "epoch": 2054} {"train_loss": -11.940441131591797, "global_step": 345096, "epoch": 2054} {"train_loss": -11.623266220092773, "global_step": 345097, "epoch": 2054} {"train_loss": -12.055788040161133, "global_step": 345098, "epoch": 2054} {"train_loss": -11.94580078125, "global_step": 345099, "epoch": 2054} {"train_loss": -12.001983642578125, "global_step": 345100, "epoch": 2054} {"train_loss": -11.894879341125488, "global_step": 345101, "epoch": 2054} {"train_loss": -12.075530052185059, "global_step": 345102, "epoch": 2054} {"train_loss": -11.884729385375977, "global_step": 345103, "epoch": 2054} {"train_loss": -12.09223747253418, "global_step": 345104, "epoch": 2054} {"train_loss": -11.89255142211914, "global_step": 345105, "epoch": 2054} {"train_loss": -12.17773723602295, "global_step": 345106, "epoch": 2054} {"train_loss": -11.983298301696777, "global_step": 345107, "epoch": 2054} {"train_loss": -12.109450340270996, "global_step": 345108, "epoch": 2054} {"train_loss": -12.049911499023438, "global_step": 345109, "epoch": 2054} {"train_loss": -12.001976013183594, "global_step": 345110, "epoch": 2054} {"train_loss": -12.287829399108887, "global_step": 345111, "epoch": 2054} {"train_loss": -12.005701065063477, "global_step": 345112, "epoch": 2054} {"train_loss": -12.211087226867676, "global_step": 345113, "epoch": 2054} {"train_loss": -12.113689422607422, "global_step": 345114, "epoch": 2054} {"train_loss": -12.105106353759766, "global_step": 345115, "epoch": 2054} {"train_loss": -12.087435722351074, "global_step": 345116, "epoch": 2054} {"train_loss": -11.734850883483887, "global_step": 345117, "epoch": 2054} {"train_loss": -12.263206481933594, "global_step": 345118, "epoch": 2054} {"train_loss": -12.002670288085938, "global_step": 345119, "epoch": 2054} {"train_loss": -12.054197311401367, "global_step": 345120, "epoch": 2054} {"train_loss": -12.134716987609863, "global_step": 345121, "epoch": 2054} {"train_loss": -12.311107635498047, "global_step": 345122, "epoch": 2054} {"train_loss": -12.124871253967285, "global_step": 345123, "epoch": 2054} {"train_loss": -11.961837768554688, "global_step": 345124, "epoch": 2054} {"train_loss": -12.111231803894043, "global_step": 345125, "epoch": 2054} {"train_loss": -12.076772689819336, "global_step": 345126, "epoch": 2054} {"train_loss": -12.149105072021484, "global_step": 345127, "epoch": 2054} {"train_loss": -12.325557708740234, "global_step": 345128, "epoch": 2054} {"train_loss": -12.30386734008789, "global_step": 345129, "epoch": 2054} {"train_loss": -12.365180969238281, "global_step": 345130, "epoch": 2054} {"train_loss": -12.33307933807373, "global_step": 345131, "epoch": 2054} {"train_loss": -12.166783332824707, "global_step": 345132, "epoch": 2054} {"train_loss": -12.406937599182129, "global_step": 345133, "epoch": 2054} {"train_loss": -12.211634635925293, "global_step": 345134, "epoch": 2054} {"train_loss": -12.310978889465332, "global_step": 345135, "epoch": 2054} {"train_loss": -12.298553466796875, "global_step": 345136, "epoch": 2054} {"train_loss": -12.429235458374023, "global_step": 345137, "epoch": 2054} {"train_loss": -12.486770629882812, "global_step": 345138, "epoch": 2054} {"train_loss": -12.322925567626953, "global_step": 345139, "epoch": 2054} {"train_loss": -12.560627937316895, "global_step": 345140, "epoch": 2054} {"train_loss": -12.3946533203125, "global_step": 345141, "epoch": 2054} {"train_loss": -12.411304473876953, "global_step": 345142, "epoch": 2054} {"train_loss": -12.351701736450195, "global_step": 345143, "epoch": 2054} {"train_loss": -12.392171859741211, "global_step": 345144, "epoch": 2054} {"train_loss": -12.442389488220215, "global_step": 345145, "epoch": 2054} {"train_loss": -12.29471206665039, "global_step": 345146, "epoch": 2054} {"train_loss": -12.503714561462402, "global_step": 345147, "epoch": 2054} {"train_loss": -12.236586570739746, "global_step": 345148, "epoch": 2054} {"train_loss": -12.42760944366455, "global_step": 345149, "epoch": 2054} {"train_loss": -12.601234436035156, "global_step": 345150, "epoch": 2054} {"train_loss": -12.494434356689453, "global_step": 345151, "epoch": 2054} {"train_loss": -12.697131156921387, "global_step": 345152, "epoch": 2054} {"train_loss": -12.662586212158203, "global_step": 345153, "epoch": 2054} {"train_loss": -12.601007461547852, "global_step": 345154, "epoch": 2054} {"train_loss": -12.430987358093262, "global_step": 345155, "epoch": 2054} {"train_loss": -12.500524520874023, "global_step": 345156, "epoch": 2054} {"train_loss": -12.6952543258667, "global_step": 345157, "epoch": 2054} {"train_loss": -12.60904598236084, "global_step": 345158, "epoch": 2054} {"train_loss": -12.616926193237305, "global_step": 345159, "epoch": 2054} {"train_loss": -12.742429733276367, "global_step": 345160, "epoch": 2054} {"train_loss": -12.696368217468262, "global_step": 345161, "epoch": 2054} {"train_loss": -12.522253036499023, "global_step": 345162, "epoch": 2054} {"train_loss": -12.445526123046875, "global_step": 345163, "epoch": 2054} {"train_loss": -12.575651168823242, "global_step": 345164, "epoch": 2054} {"train_loss": -12.657428741455078, "global_step": 345165, "epoch": 2054} {"train_loss": -12.641108512878418, "global_step": 345166, "epoch": 2054} {"train_loss": -12.480128288269043, "global_step": 345167, "epoch": 2054} {"train_loss": -12.48397445678711, "global_step": 345168, "epoch": 2054} {"train_loss": -12.666704177856445, "global_step": 345169, "epoch": 2054} {"train_loss": -12.52588176727295, "global_step": 345170, "epoch": 2054} {"train_loss": -12.578224182128906, "global_step": 345171, "epoch": 2054} {"train_loss": -12.799556732177734, "global_step": 345172, "epoch": 2054} {"train_loss": -12.76924991607666, "global_step": 345173, "epoch": 2054} {"train_loss": -12.495122909545898, "global_step": 345174, "epoch": 2054} {"train_loss": -12.593339920043945, "global_step": 345175, "epoch": 2054} {"train_loss": -12.73371696472168, "global_step": 345176, "epoch": 2054} {"train_loss": -12.495595932006836, "global_step": 345177, "epoch": 2054} {"train_loss": -12.453861236572266, "global_step": 345178, "epoch": 2054} {"train_loss": -12.12685775756836, "global_step": 345179, "epoch": 2054} {"train_loss": -11.857423782348633, "global_step": 345180, "epoch": 2054} {"train_loss": -12.23511028289795, "global_step": 345181, "epoch": 2054} {"train_loss": -12.458255767822266, "global_step": 345182, "epoch": 2054} {"train_loss": -12.263814926147461, "global_step": 345183, "epoch": 2054} {"train_loss": -12.164976119995117, "global_step": 345184, "epoch": 2054} {"train_loss": -12.45614242553711, "global_step": 345185, "epoch": 2054} {"train_loss": -12.350255966186523, "global_step": 345186, "epoch": 2054} {"train_loss": -11.308305740356445, "global_step": 345187, "epoch": 2054} {"train_loss": -9.27294921875, "global_step": 345188, "epoch": 2054} {"train_loss": -9.691426277160645, "global_step": 345189, "epoch": 2054} {"train_loss": -11.79585075378418, "global_step": 345190, "epoch": 2054} {"train_loss": -7.58469820022583, "global_step": 345191, "epoch": 2054} {"train_loss": -8.014677047729492, "global_step": 345192, "epoch": 2054} {"train_loss": -8.298365592956543, "global_step": 345193, "epoch": 2054} {"train_loss": -9.804360389709473, "global_step": 345194, "epoch": 2054} {"train_loss": -9.600414276123047, "global_step": 345195, "epoch": 2054} {"train_loss": -8.569511413574219, "global_step": 345196, "epoch": 2054} {"train_loss": -9.531153678894043, "global_step": 345197, "epoch": 2054} {"train_loss": -9.738777160644531, "global_step": 345198, "epoch": 2054} {"train_loss": -8.747262954711914, "global_step": 345199, "epoch": 2054} {"train_loss": -10.029180526733398, "global_step": 345200, "epoch": 2054} {"train_loss": -10.428277969360352, "global_step": 345201, "epoch": 2054} {"train_loss": -9.561059951782227, "global_step": 345202, "epoch": 2054} {"train_loss": -10.652132987976074, "global_step": 345203, "epoch": 2054} {"train_loss": -10.126697540283203, "global_step": 345204, "epoch": 2054} {"train_loss": -10.946606636047363, "global_step": 345205, "epoch": 2054} {"train_loss": -8.255965232849121, "global_step": 345206, "epoch": 2054} {"train_loss": -8.94717788696289, "global_step": 345207, "epoch": 2054} {"train_loss": -9.037361145019531, "global_step": 345208, "epoch": 2054} {"train_loss": -8.615240097045898, "global_step": 345209, "epoch": 2054} {"train_loss": -10.151998519897461, "global_step": 345210, "epoch": 2054} {"train_loss": -8.836753845214844, "global_step": 345211, "epoch": 2054} {"train_loss": -8.627321243286133, "global_step": 345212, "epoch": 2054} {"train_loss": -8.468180656433105, "global_step": 345213, "epoch": 2054} {"train_loss": -8.437397003173828, "global_step": 345214, "epoch": 2054} {"train_loss": -10.31969928741455, "global_step": 345215, "epoch": 2054} {"train_loss": -10.12485122680664, "global_step": 345216, "epoch": 2054} {"train_loss": -9.968027114868164, "global_step": 345217, "epoch": 2054} {"train_loss": -10.13658332824707, "global_step": 345218, "epoch": 2054} {"train_loss": -10.546960830688477, "global_step": 345219, "epoch": 2054} {"train_loss": -10.664131164550781, "global_step": 345220, "epoch": 2054} {"train_loss": -9.395347595214844, "global_step": 345221, "epoch": 2054} {"train_loss": -10.97478199005127, "global_step": 345222, "epoch": 2054} {"train_loss": -10.49280071258545, "global_step": 345223, "epoch": 2054} {"train_loss": -10.721986770629883, "global_step": 345224, "epoch": 2054} {"train_loss": -11.028915405273438, "global_step": 345225, "epoch": 2054} {"train_loss": -10.816452980041504, "global_step": 345226, "epoch": 2054} {"train_loss": -11.19754409790039, "global_step": 345227, "epoch": 2054} {"train_loss": -11.251874923706055, "global_step": 345228, "epoch": 2054} {"train_loss": -11.302742004394531, "global_step": 345229, "epoch": 2054} {"train_loss": -11.376880645751953, "global_step": 345230, "epoch": 2054} {"train_loss": -11.35004997253418, "global_step": 345231, "epoch": 2054} {"train_loss": -10.790468215942383, "global_step": 345232, "epoch": 2054} {"train_loss": -11.707372665405273, "global_step": 345233, "epoch": 2054} {"train_loss": -11.400364875793457, "global_step": 345234, "epoch": 2054} {"train_loss": -11.456628799438477, "global_step": 345235, "epoch": 2054} {"train_loss": -11.480218887329102, "global_step": 345236, "epoch": 2054} {"train_loss": -11.003170013427734, "global_step": 345237, "epoch": 2054} {"train_loss": -11.472049713134766, "global_step": 345238, "epoch": 2054} {"train_loss": -11.496373179413023, "global_step": 345239, "epoch": 2054, "val_loss": 278076.15625} {"train_loss": -11.606132507324219, "global_step": 345240, "epoch": 2055} {"train_loss": -11.302453994750977, "global_step": 345241, "epoch": 2055} {"train_loss": -11.539144515991211, "global_step": 345242, "epoch": 2055} {"train_loss": -11.567729949951172, "global_step": 345243, "epoch": 2055} {"train_loss": -11.36315631866455, "global_step": 345244, "epoch": 2055} {"train_loss": -12.031033515930176, "global_step": 345245, "epoch": 2055} {"train_loss": -11.512939453125, "global_step": 345246, "epoch": 2055} {"train_loss": -11.943343162536621, "global_step": 345247, "epoch": 2055} {"train_loss": -11.542757034301758, "global_step": 345248, "epoch": 2055} {"train_loss": -11.99666690826416, "global_step": 345249, "epoch": 2055} {"train_loss": -11.7098388671875, "global_step": 345250, "epoch": 2055} {"train_loss": -11.82910442352295, "global_step": 345251, "epoch": 2055} {"train_loss": -11.663291931152344, "global_step": 345252, "epoch": 2055} {"train_loss": -11.840629577636719, "global_step": 345253, "epoch": 2055} {"train_loss": -12.028776168823242, "global_step": 345254, "epoch": 2055} {"train_loss": -11.3880615234375, "global_step": 345255, "epoch": 2055} {"train_loss": -11.705877304077148, "global_step": 345256, "epoch": 2055} {"train_loss": -12.02452564239502, "global_step": 345257, "epoch": 2055} {"train_loss": -11.661149024963379, "global_step": 345258, "epoch": 2055} {"train_loss": -12.043529510498047, "global_step": 345259, "epoch": 2055} {"train_loss": -12.098016738891602, "global_step": 345260, "epoch": 2055} {"train_loss": -11.873385429382324, "global_step": 345261, "epoch": 2055} {"train_loss": -12.261754989624023, "global_step": 345262, "epoch": 2055} {"train_loss": -11.734492301940918, "global_step": 345263, "epoch": 2055} {"train_loss": -12.174322128295898, "global_step": 345264, "epoch": 2055} {"train_loss": -11.884665489196777, "global_step": 345265, "epoch": 2055} {"train_loss": -11.92003059387207, "global_step": 345266, "epoch": 2055} {"train_loss": -11.94478702545166, "global_step": 345267, "epoch": 2055} {"train_loss": -12.133111953735352, "global_step": 345268, "epoch": 2055} {"train_loss": -12.098946571350098, "global_step": 345269, "epoch": 2055} {"train_loss": -12.192886352539062, "global_step": 345270, "epoch": 2055} {"train_loss": -12.339258193969727, "global_step": 345271, "epoch": 2055} {"train_loss": -12.051408767700195, "global_step": 345272, "epoch": 2055} {"train_loss": -12.202301025390625, "global_step": 345273, "epoch": 2055} {"train_loss": -12.205923080444336, "global_step": 345274, "epoch": 2055} {"train_loss": -12.292282104492188, "global_step": 345275, "epoch": 2055} {"train_loss": -12.319640159606934, "global_step": 345276, "epoch": 2055} {"train_loss": -12.301915168762207, "global_step": 345277, "epoch": 2055} {"train_loss": -12.29255199432373, "global_step": 345278, "epoch": 2055} {"train_loss": -12.294219970703125, "global_step": 345279, "epoch": 2055} {"train_loss": -12.318355560302734, "global_step": 345280, "epoch": 2055} {"train_loss": -12.184497833251953, "global_step": 345281, "epoch": 2055} {"train_loss": -12.250221252441406, "global_step": 345282, "epoch": 2055} {"train_loss": -12.326183319091797, "global_step": 345283, "epoch": 2055} {"train_loss": -12.36878776550293, "global_step": 345284, "epoch": 2055} {"train_loss": -12.404817581176758, "global_step": 345285, "epoch": 2055} {"train_loss": -12.24654483795166, "global_step": 345286, "epoch": 2055} {"train_loss": -12.365521430969238, "global_step": 345287, "epoch": 2055} {"train_loss": -12.424827575683594, "global_step": 345288, "epoch": 2055} {"train_loss": -12.542572021484375, "global_step": 345289, "epoch": 2055} {"train_loss": -12.364875793457031, "global_step": 345290, "epoch": 2055} {"train_loss": -12.49937915802002, "global_step": 345291, "epoch": 2055} {"train_loss": -12.124234199523926, "global_step": 345292, "epoch": 2055} {"train_loss": -12.581197738647461, "global_step": 345293, "epoch": 2055} {"train_loss": -12.48929214477539, "global_step": 345294, "epoch": 2055} {"train_loss": -12.562256813049316, "global_step": 345295, "epoch": 2055} {"train_loss": -12.521190643310547, "global_step": 345296, "epoch": 2055} {"train_loss": -12.367162704467773, "global_step": 345297, "epoch": 2055} {"train_loss": -12.44353199005127, "global_step": 345298, "epoch": 2055} {"train_loss": -12.305931091308594, "global_step": 345299, "epoch": 2055} {"train_loss": -12.333812713623047, "global_step": 345300, "epoch": 2055} {"train_loss": -12.54026985168457, "global_step": 345301, "epoch": 2055} {"train_loss": -12.716453552246094, "global_step": 345302, "epoch": 2055} {"train_loss": -12.50928020477295, "global_step": 345303, "epoch": 2055} {"train_loss": -12.549137115478516, "global_step": 345304, "epoch": 2055} {"train_loss": -12.662549018859863, "global_step": 345305, "epoch": 2055} {"train_loss": -12.59151554107666, "global_step": 345306, "epoch": 2055} {"train_loss": -12.46372127532959, "global_step": 345307, "epoch": 2055} {"train_loss": -12.610502243041992, "global_step": 345308, "epoch": 2055} {"train_loss": -12.644012451171875, "global_step": 345309, "epoch": 2055} {"train_loss": -12.59432315826416, "global_step": 345310, "epoch": 2055} {"train_loss": -12.671454429626465, "global_step": 345311, "epoch": 2055} {"train_loss": -12.569938659667969, "global_step": 345312, "epoch": 2055} {"train_loss": -12.59597396850586, "global_step": 345313, "epoch": 2055} {"train_loss": -12.415655136108398, "global_step": 345314, "epoch": 2055} {"train_loss": -12.55053997039795, "global_step": 345315, "epoch": 2055} {"train_loss": -12.548661231994629, "global_step": 345316, "epoch": 2055} {"train_loss": -12.735342025756836, "global_step": 345317, "epoch": 2055} {"train_loss": -12.565428733825684, "global_step": 345318, "epoch": 2055} {"train_loss": -12.638752937316895, "global_step": 345319, "epoch": 2055} {"train_loss": -12.459440231323242, "global_step": 345320, "epoch": 2055} {"train_loss": -12.797296524047852, "global_step": 345321, "epoch": 2055} {"train_loss": -12.551054954528809, "global_step": 345322, "epoch": 2055} {"train_loss": -12.609752655029297, "global_step": 345323, "epoch": 2055} {"train_loss": -12.266270637512207, "global_step": 345324, "epoch": 2055} {"train_loss": -12.809158325195312, "global_step": 345325, "epoch": 2055} {"train_loss": -12.67530345916748, "global_step": 345326, "epoch": 2055} {"train_loss": -12.705999374389648, "global_step": 345327, "epoch": 2055} {"train_loss": -12.730926513671875, "global_step": 345328, "epoch": 2055} {"train_loss": -12.707719802856445, "global_step": 345329, "epoch": 2055} {"train_loss": -12.645879745483398, "global_step": 345330, "epoch": 2055} {"train_loss": -12.460013389587402, "global_step": 345331, "epoch": 2055} {"train_loss": -12.202552795410156, "global_step": 345332, "epoch": 2055} {"train_loss": -11.857933044433594, "global_step": 345333, "epoch": 2055} {"train_loss": -12.549666404724121, "global_step": 345334, "epoch": 2055} {"train_loss": -12.055521011352539, "global_step": 345335, "epoch": 2055} {"train_loss": -11.483473777770996, "global_step": 345336, "epoch": 2055} {"train_loss": -11.869669914245605, "global_step": 345337, "epoch": 2055} {"train_loss": -11.30329704284668, "global_step": 345338, "epoch": 2055} {"train_loss": -11.225600242614746, "global_step": 345339, "epoch": 2055} {"train_loss": -11.410211563110352, "global_step": 345340, "epoch": 2055} {"train_loss": -11.808412551879883, "global_step": 345341, "epoch": 2055} {"train_loss": -11.97379207611084, "global_step": 345342, "epoch": 2055} {"train_loss": -11.304352760314941, "global_step": 345343, "epoch": 2055} {"train_loss": -12.101219177246094, "global_step": 345344, "epoch": 2055} {"train_loss": -12.549999237060547, "global_step": 345345, "epoch": 2055} {"train_loss": -12.222023010253906, "global_step": 345346, "epoch": 2055} {"train_loss": -12.179384231567383, "global_step": 345347, "epoch": 2055} {"train_loss": -12.388577461242676, "global_step": 345348, "epoch": 2055} {"train_loss": -12.339574813842773, "global_step": 345349, "epoch": 2055} {"train_loss": -11.838056564331055, "global_step": 345350, "epoch": 2055} {"train_loss": -11.567317962646484, "global_step": 345351, "epoch": 2055} {"train_loss": -12.054679870605469, "global_step": 345352, "epoch": 2055} {"train_loss": -12.22380256652832, "global_step": 345353, "epoch": 2055} {"train_loss": -11.281034469604492, "global_step": 345354, "epoch": 2055} {"train_loss": -11.122873306274414, "global_step": 345355, "epoch": 2055} {"train_loss": -11.620452880859375, "global_step": 345356, "epoch": 2055} {"train_loss": -11.612910270690918, "global_step": 345357, "epoch": 2055} {"train_loss": -12.000617980957031, "global_step": 345358, "epoch": 2055} {"train_loss": -11.734502792358398, "global_step": 345359, "epoch": 2055} {"train_loss": -11.935518264770508, "global_step": 345360, "epoch": 2055} {"train_loss": -11.771553039550781, "global_step": 345361, "epoch": 2055} {"train_loss": -11.376432418823242, "global_step": 345362, "epoch": 2055} {"train_loss": -11.545520782470703, "global_step": 345363, "epoch": 2055} {"train_loss": -11.801410675048828, "global_step": 345364, "epoch": 2055} {"train_loss": -11.210445404052734, "global_step": 345365, "epoch": 2055} {"train_loss": -10.41177749633789, "global_step": 345366, "epoch": 2055} {"train_loss": -11.399532318115234, "global_step": 345367, "epoch": 2055} {"train_loss": -9.709339141845703, "global_step": 345368, "epoch": 2055} {"train_loss": -10.878029823303223, "global_step": 345369, "epoch": 2055} {"train_loss": -10.565997123718262, "global_step": 345370, "epoch": 2055} {"train_loss": -11.02818489074707, "global_step": 345371, "epoch": 2055} {"train_loss": -11.191381454467773, "global_step": 345372, "epoch": 2055} {"train_loss": -10.843436241149902, "global_step": 345373, "epoch": 2055} {"train_loss": -11.886848449707031, "global_step": 345374, "epoch": 2055} {"train_loss": -10.79633903503418, "global_step": 345375, "epoch": 2055} {"train_loss": -12.060184478759766, "global_step": 345376, "epoch": 2055} {"train_loss": -10.401020050048828, "global_step": 345377, "epoch": 2055} {"train_loss": -12.035165786743164, "global_step": 345378, "epoch": 2055} {"train_loss": -11.000032424926758, "global_step": 345379, "epoch": 2055} {"train_loss": -11.869329452514648, "global_step": 345380, "epoch": 2055} {"train_loss": -11.36848258972168, "global_step": 345381, "epoch": 2055} {"train_loss": -11.58877944946289, "global_step": 345382, "epoch": 2055} {"train_loss": -11.661439895629883, "global_step": 345383, "epoch": 2055} {"train_loss": -11.887084007263184, "global_step": 345384, "epoch": 2055} {"train_loss": -10.314369201660156, "global_step": 345385, "epoch": 2055} {"train_loss": -11.939607620239258, "global_step": 345386, "epoch": 2055} {"train_loss": -11.18127155303955, "global_step": 345387, "epoch": 2055} {"train_loss": -11.349899291992188, "global_step": 345388, "epoch": 2055} {"train_loss": -11.52420711517334, "global_step": 345389, "epoch": 2055} {"train_loss": -11.025269508361816, "global_step": 345390, "epoch": 2055} {"train_loss": -11.538212776184082, "global_step": 345391, "epoch": 2055} {"train_loss": -10.358978271484375, "global_step": 345392, "epoch": 2055} {"train_loss": -11.143045425415039, "global_step": 345393, "epoch": 2055} {"train_loss": -11.6038818359375, "global_step": 345394, "epoch": 2055} {"train_loss": -11.191649436950684, "global_step": 345395, "epoch": 2055} {"train_loss": -11.594545364379883, "global_step": 345396, "epoch": 2055} {"train_loss": -11.648218154907227, "global_step": 345397, "epoch": 2055} {"train_loss": -11.466487884521484, "global_step": 345398, "epoch": 2055} {"train_loss": -11.625055313110352, "global_step": 345399, "epoch": 2055} {"train_loss": -11.535018920898438, "global_step": 345400, "epoch": 2055} {"train_loss": -11.963691711425781, "global_step": 345401, "epoch": 2055} {"train_loss": -11.493010520935059, "global_step": 345402, "epoch": 2055} {"train_loss": -11.889730453491211, "global_step": 345403, "epoch": 2055} {"train_loss": -11.516425132751465, "global_step": 345404, "epoch": 2055} {"train_loss": -11.351012229919434, "global_step": 345405, "epoch": 2055} {"train_loss": -12.00092601776123, "global_step": 345406, "epoch": 2055} {"train_loss": -11.933434900783357, "global_step": 345407, "epoch": 2055, "val_loss": 290580.34375, "train_action_mse_error": 1.352954626083374} {"train_loss": -11.460124015808105, "global_step": 345408, "epoch": 2056} {"train_loss": -12.049022674560547, "global_step": 345409, "epoch": 2056} {"train_loss": -11.747512817382812, "global_step": 345410, "epoch": 2056} {"train_loss": -12.203847885131836, "global_step": 345411, "epoch": 2056} {"train_loss": -11.787182807922363, "global_step": 345412, "epoch": 2056} {"train_loss": -11.900379180908203, "global_step": 345413, "epoch": 2056} {"train_loss": -11.931436538696289, "global_step": 345414, "epoch": 2056} {"train_loss": -11.9135103225708, "global_step": 345415, "epoch": 2056} {"train_loss": -12.019712448120117, "global_step": 345416, "epoch": 2056} {"train_loss": -11.61876106262207, "global_step": 345417, "epoch": 2056} {"train_loss": -12.100844383239746, "global_step": 345418, "epoch": 2056} {"train_loss": -11.91113567352295, "global_step": 345419, "epoch": 2056} {"train_loss": -11.556360244750977, "global_step": 345420, "epoch": 2056} {"train_loss": -12.076981544494629, "global_step": 345421, "epoch": 2056} {"train_loss": -11.43387222290039, "global_step": 345422, "epoch": 2056} {"train_loss": -12.207165718078613, "global_step": 345423, "epoch": 2056} {"train_loss": -11.744550704956055, "global_step": 345424, "epoch": 2056} {"train_loss": -11.69715690612793, "global_step": 345425, "epoch": 2056} {"train_loss": -11.644281387329102, "global_step": 345426, "epoch": 2056} {"train_loss": -11.178326606750488, "global_step": 345427, "epoch": 2056} {"train_loss": -12.268997192382812, "global_step": 345428, "epoch": 2056} {"train_loss": -11.030672073364258, "global_step": 345429, "epoch": 2056} {"train_loss": -12.166380882263184, "global_step": 345430, "epoch": 2056} {"train_loss": -11.385777473449707, "global_step": 345431, "epoch": 2056} {"train_loss": -11.757040023803711, "global_step": 345432, "epoch": 2056} {"train_loss": -12.006321907043457, "global_step": 345433, "epoch": 2056} {"train_loss": -11.577472686767578, "global_step": 345434, "epoch": 2056} {"train_loss": -11.848108291625977, "global_step": 345435, "epoch": 2056} {"train_loss": -11.986093521118164, "global_step": 345436, "epoch": 2056} {"train_loss": -12.295782089233398, "global_step": 345437, "epoch": 2056} {"train_loss": -11.753746032714844, "global_step": 345438, "epoch": 2056} {"train_loss": -11.950409889221191, "global_step": 345439, "epoch": 2056} {"train_loss": -12.177715301513672, "global_step": 345440, "epoch": 2056} {"train_loss": -11.834692001342773, "global_step": 345441, "epoch": 2056} {"train_loss": -12.13278579711914, "global_step": 345442, "epoch": 2056} {"train_loss": -11.435998916625977, "global_step": 345443, "epoch": 2056} {"train_loss": -12.179643630981445, "global_step": 345444, "epoch": 2056} {"train_loss": -12.134328842163086, "global_step": 345445, "epoch": 2056} {"train_loss": -11.836080551147461, "global_step": 345446, "epoch": 2056} {"train_loss": -11.973234176635742, "global_step": 345447, "epoch": 2056} {"train_loss": -11.285954475402832, "global_step": 345448, "epoch": 2056} {"train_loss": -12.027994155883789, "global_step": 345449, "epoch": 2056} {"train_loss": -11.633262634277344, "global_step": 345450, "epoch": 2056} {"train_loss": -12.177192687988281, "global_step": 345451, "epoch": 2056} {"train_loss": -11.837700843811035, "global_step": 345452, "epoch": 2056} {"train_loss": -11.747318267822266, "global_step": 345453, "epoch": 2056} {"train_loss": -12.182828903198242, "global_step": 345454, "epoch": 2056} {"train_loss": -11.431999206542969, "global_step": 345455, "epoch": 2056} {"train_loss": -11.921300888061523, "global_step": 345456, "epoch": 2056} {"train_loss": -10.58675765991211, "global_step": 345457, "epoch": 2056} {"train_loss": -11.05320930480957, "global_step": 345458, "epoch": 2056} {"train_loss": -10.601949691772461, "global_step": 345459, "epoch": 2056} {"train_loss": -10.971412658691406, "global_step": 345460, "epoch": 2056} {"train_loss": -11.600689888000488, "global_step": 345461, "epoch": 2056} {"train_loss": -11.163485527038574, "global_step": 345462, "epoch": 2056} {"train_loss": -12.096177101135254, "global_step": 345463, "epoch": 2056} {"train_loss": -11.172493934631348, "global_step": 345464, "epoch": 2056} {"train_loss": -11.871089935302734, "global_step": 345465, "epoch": 2056} {"train_loss": -11.399669647216797, "global_step": 345466, "epoch": 2056} {"train_loss": -11.908621788024902, "global_step": 345467, "epoch": 2056} {"train_loss": -12.08678150177002, "global_step": 345468, "epoch": 2056} {"train_loss": -11.32750415802002, "global_step": 345469, "epoch": 2056} {"train_loss": -12.18582534790039, "global_step": 345470, "epoch": 2056} {"train_loss": -11.553585052490234, "global_step": 345471, "epoch": 2056} {"train_loss": -12.219978332519531, "global_step": 345472, "epoch": 2056} {"train_loss": -11.67531681060791, "global_step": 345473, "epoch": 2056} {"train_loss": -12.231108665466309, "global_step": 345474, "epoch": 2056} {"train_loss": -12.216588973999023, "global_step": 345475, "epoch": 2056} {"train_loss": -12.19509506225586, "global_step": 345476, "epoch": 2056} {"train_loss": -12.391565322875977, "global_step": 345477, "epoch": 2056} {"train_loss": -12.046842575073242, "global_step": 345478, "epoch": 2056} {"train_loss": -12.154322624206543, "global_step": 345479, "epoch": 2056} {"train_loss": -12.052074432373047, "global_step": 345480, "epoch": 2056} {"train_loss": -12.117431640625, "global_step": 345481, "epoch": 2056} {"train_loss": -12.053948402404785, "global_step": 345482, "epoch": 2056} {"train_loss": -11.79834270477295, "global_step": 345483, "epoch": 2056} {"train_loss": -12.373356819152832, "global_step": 345484, "epoch": 2056} {"train_loss": -11.802824974060059, "global_step": 345485, "epoch": 2056} {"train_loss": -12.325029373168945, "global_step": 345486, "epoch": 2056} {"train_loss": -12.041545867919922, "global_step": 345487, "epoch": 2056} {"train_loss": -12.10818099975586, "global_step": 345488, "epoch": 2056} {"train_loss": -12.074626922607422, "global_step": 345489, "epoch": 2056} {"train_loss": -11.969005584716797, "global_step": 345490, "epoch": 2056} {"train_loss": -12.333534240722656, "global_step": 345491, "epoch": 2056} {"train_loss": -11.968708038330078, "global_step": 345492, "epoch": 2056} {"train_loss": -11.92657470703125, "global_step": 345493, "epoch": 2056} {"train_loss": -11.890031814575195, "global_step": 345494, "epoch": 2056} {"train_loss": -11.680124282836914, "global_step": 345495, "epoch": 2056} {"train_loss": -12.227492332458496, "global_step": 345496, "epoch": 2056} {"train_loss": -11.696660041809082, "global_step": 345497, "epoch": 2056} {"train_loss": -12.137655258178711, "global_step": 345498, "epoch": 2056} {"train_loss": -11.830696105957031, "global_step": 345499, "epoch": 2056} {"train_loss": -11.582408905029297, "global_step": 345500, "epoch": 2056} {"train_loss": -11.978196144104004, "global_step": 345501, "epoch": 2056} {"train_loss": -11.943828582763672, "global_step": 345502, "epoch": 2056} {"train_loss": -11.932157516479492, "global_step": 345503, "epoch": 2056} {"train_loss": -12.050551414489746, "global_step": 345504, "epoch": 2056} {"train_loss": -12.092500686645508, "global_step": 345505, "epoch": 2056} {"train_loss": -12.088834762573242, "global_step": 345506, "epoch": 2056} {"train_loss": -11.981613159179688, "global_step": 345507, "epoch": 2056} {"train_loss": -12.325700759887695, "global_step": 345508, "epoch": 2056} {"train_loss": -12.03756332397461, "global_step": 345509, "epoch": 2056} {"train_loss": -12.428617477416992, "global_step": 345510, "epoch": 2056} {"train_loss": -11.860527992248535, "global_step": 345511, "epoch": 2056} {"train_loss": -12.373664855957031, "global_step": 345512, "epoch": 2056} {"train_loss": -12.197591781616211, "global_step": 345513, "epoch": 2056} {"train_loss": -12.044573783874512, "global_step": 345514, "epoch": 2056} {"train_loss": -12.336549758911133, "global_step": 345515, "epoch": 2056} {"train_loss": -12.077905654907227, "global_step": 345516, "epoch": 2056} {"train_loss": -12.43879222869873, "global_step": 345517, "epoch": 2056} {"train_loss": -12.145891189575195, "global_step": 345518, "epoch": 2056} {"train_loss": -12.499284744262695, "global_step": 345519, "epoch": 2056} {"train_loss": -12.117365837097168, "global_step": 345520, "epoch": 2056} {"train_loss": -12.22780990600586, "global_step": 345521, "epoch": 2056} {"train_loss": -12.248531341552734, "global_step": 345522, "epoch": 2056} {"train_loss": -12.325300216674805, "global_step": 345523, "epoch": 2056} {"train_loss": -12.301794052124023, "global_step": 345524, "epoch": 2056} {"train_loss": -12.321125030517578, "global_step": 345525, "epoch": 2056} {"train_loss": -12.296337127685547, "global_step": 345526, "epoch": 2056} {"train_loss": -12.265373229980469, "global_step": 345527, "epoch": 2056} {"train_loss": -12.541749954223633, "global_step": 345528, "epoch": 2056} {"train_loss": -12.188776016235352, "global_step": 345529, "epoch": 2056} {"train_loss": -12.516990661621094, "global_step": 345530, "epoch": 2056} {"train_loss": -12.229230880737305, "global_step": 345531, "epoch": 2056} {"train_loss": -12.416654586791992, "global_step": 345532, "epoch": 2056} {"train_loss": -11.991612434387207, "global_step": 345533, "epoch": 2056} {"train_loss": -12.446605682373047, "global_step": 345534, "epoch": 2056} {"train_loss": -12.31082534790039, "global_step": 345535, "epoch": 2056} {"train_loss": -12.417774200439453, "global_step": 345536, "epoch": 2056} {"train_loss": -11.955488204956055, "global_step": 345537, "epoch": 2056} {"train_loss": -12.098714828491211, "global_step": 345538, "epoch": 2056} {"train_loss": -12.324295043945312, "global_step": 345539, "epoch": 2056} {"train_loss": -12.347038269042969, "global_step": 345540, "epoch": 2056} {"train_loss": -12.24513053894043, "global_step": 345541, "epoch": 2056} {"train_loss": -12.236241340637207, "global_step": 345542, "epoch": 2056} {"train_loss": -12.156436920166016, "global_step": 345543, "epoch": 2056} {"train_loss": -12.488174438476562, "global_step": 345544, "epoch": 2056} {"train_loss": -12.1548433303833, "global_step": 345545, "epoch": 2056} {"train_loss": -11.664108276367188, "global_step": 345546, "epoch": 2056} {"train_loss": -11.63090991973877, "global_step": 345547, "epoch": 2056} {"train_loss": -12.235803604125977, "global_step": 345548, "epoch": 2056} {"train_loss": -11.204488754272461, "global_step": 345549, "epoch": 2056} {"train_loss": -10.636322975158691, "global_step": 345550, "epoch": 2056} {"train_loss": -10.905889511108398, "global_step": 345551, "epoch": 2056} {"train_loss": -10.403541564941406, "global_step": 345552, "epoch": 2056} {"train_loss": -9.0780668258667, "global_step": 345553, "epoch": 2056} {"train_loss": -9.877260208129883, "global_step": 345554, "epoch": 2056} {"train_loss": -9.623334884643555, "global_step": 345555, "epoch": 2056} {"train_loss": -10.640300750732422, "global_step": 345556, "epoch": 2056} {"train_loss": -9.994633674621582, "global_step": 345557, "epoch": 2056} {"train_loss": -9.35610580444336, "global_step": 345558, "epoch": 2056} {"train_loss": -9.526396751403809, "global_step": 345559, "epoch": 2056} {"train_loss": -10.261951446533203, "global_step": 345560, "epoch": 2056} {"train_loss": -10.55965518951416, "global_step": 345561, "epoch": 2056} {"train_loss": -9.89063549041748, "global_step": 345562, "epoch": 2056} {"train_loss": -10.250545501708984, "global_step": 345563, "epoch": 2056} {"train_loss": -10.018182754516602, "global_step": 345564, "epoch": 2056} {"train_loss": -9.19550609588623, "global_step": 345565, "epoch": 2056} {"train_loss": -10.10675048828125, "global_step": 345566, "epoch": 2056} {"train_loss": -8.843400001525879, "global_step": 345567, "epoch": 2056} {"train_loss": -10.037109375, "global_step": 345568, "epoch": 2056} {"train_loss": -9.433934211730957, "global_step": 345569, "epoch": 2056} {"train_loss": -10.0325927734375, "global_step": 345570, "epoch": 2056} {"train_loss": -11.371208190917969, "global_step": 345571, "epoch": 2056} {"train_loss": -11.068623542785645, "global_step": 345572, "epoch": 2056} {"train_loss": -11.33127212524414, "global_step": 345573, "epoch": 2056} {"train_loss": -10.887533187866211, "global_step": 345574, "epoch": 2056} {"train_loss": -11.676531093461174, "global_step": 345575, "epoch": 2056, "val_loss": 284566.6875} {"train_loss": -10.203939437866211, "global_step": 345576, "epoch": 2057} {"train_loss": -11.157449722290039, "global_step": 345577, "epoch": 2057} {"train_loss": -10.949515342712402, "global_step": 345578, "epoch": 2057} {"train_loss": -10.778992652893066, "global_step": 345579, "epoch": 2057} {"train_loss": -11.194416046142578, "global_step": 345580, "epoch": 2057} {"train_loss": -10.82668685913086, "global_step": 345581, "epoch": 2057} {"train_loss": -10.090360641479492, "global_step": 345582, "epoch": 2057} {"train_loss": -11.668160438537598, "global_step": 345583, "epoch": 2057} {"train_loss": -10.536985397338867, "global_step": 345584, "epoch": 2057} {"train_loss": -11.520272254943848, "global_step": 345585, "epoch": 2057} {"train_loss": -11.043584823608398, "global_step": 345586, "epoch": 2057} {"train_loss": -11.397658348083496, "global_step": 345587, "epoch": 2057} {"train_loss": -11.771245956420898, "global_step": 345588, "epoch": 2057} {"train_loss": -11.78073501586914, "global_step": 345589, "epoch": 2057} {"train_loss": -11.374210357666016, "global_step": 345590, "epoch": 2057} {"train_loss": -11.944238662719727, "global_step": 345591, "epoch": 2057} {"train_loss": -11.682827949523926, "global_step": 345592, "epoch": 2057} {"train_loss": -11.761695861816406, "global_step": 345593, "epoch": 2057} {"train_loss": -11.873432159423828, "global_step": 345594, "epoch": 2057} {"train_loss": -11.977766990661621, "global_step": 345595, "epoch": 2057} {"train_loss": -12.035210609436035, "global_step": 345596, "epoch": 2057} {"train_loss": -11.959820747375488, "global_step": 345597, "epoch": 2057} {"train_loss": -11.85586929321289, "global_step": 345598, "epoch": 2057} {"train_loss": -12.095025062561035, "global_step": 345599, "epoch": 2057} {"train_loss": -12.11661434173584, "global_step": 345600, "epoch": 2057} {"train_loss": -11.92918586730957, "global_step": 345601, "epoch": 2057} {"train_loss": -11.847335815429688, "global_step": 345602, "epoch": 2057} {"train_loss": -11.872671127319336, "global_step": 345603, "epoch": 2057} {"train_loss": -11.753623962402344, "global_step": 345604, "epoch": 2057} {"train_loss": -11.835681915283203, "global_step": 345605, "epoch": 2057} {"train_loss": -12.08268928527832, "global_step": 345606, "epoch": 2057} {"train_loss": -11.853055953979492, "global_step": 345607, "epoch": 2057} {"train_loss": -12.160957336425781, "global_step": 345608, "epoch": 2057} {"train_loss": -12.181593894958496, "global_step": 345609, "epoch": 2057} {"train_loss": -12.232242584228516, "global_step": 345610, "epoch": 2057} {"train_loss": -12.059978485107422, "global_step": 345611, "epoch": 2057} {"train_loss": -12.05609130859375, "global_step": 345612, "epoch": 2057} {"train_loss": -12.313886642456055, "global_step": 345613, "epoch": 2057} {"train_loss": -12.150009155273438, "global_step": 345614, "epoch": 2057} {"train_loss": -12.053473472595215, "global_step": 345615, "epoch": 2057} {"train_loss": -12.199211120605469, "global_step": 345616, "epoch": 2057} {"train_loss": -12.12681770324707, "global_step": 345617, "epoch": 2057} {"train_loss": -12.119771003723145, "global_step": 345618, "epoch": 2057} {"train_loss": -12.149152755737305, "global_step": 345619, "epoch": 2057} {"train_loss": -12.026093482971191, "global_step": 345620, "epoch": 2057} {"train_loss": -12.37436294555664, "global_step": 345621, "epoch": 2057} {"train_loss": -12.0723237991333, "global_step": 345622, "epoch": 2057} {"train_loss": -12.21229362487793, "global_step": 345623, "epoch": 2057} {"train_loss": -12.064899444580078, "global_step": 345624, "epoch": 2057} {"train_loss": -12.193721771240234, "global_step": 345625, "epoch": 2057} {"train_loss": -12.191448211669922, "global_step": 345626, "epoch": 2057} {"train_loss": -12.275043487548828, "global_step": 345627, "epoch": 2057} {"train_loss": -12.323020935058594, "global_step": 345628, "epoch": 2057} {"train_loss": -12.37950611114502, "global_step": 345629, "epoch": 2057} {"train_loss": -12.31405258178711, "global_step": 345630, "epoch": 2057} {"train_loss": -12.457318305969238, "global_step": 345631, "epoch": 2057} {"train_loss": -12.274175643920898, "global_step": 345632, "epoch": 2057} {"train_loss": -12.30497932434082, "global_step": 345633, "epoch": 2057} {"train_loss": -12.254715919494629, "global_step": 345634, "epoch": 2057} {"train_loss": -12.036888122558594, "global_step": 345635, "epoch": 2057} {"train_loss": -12.256841659545898, "global_step": 345636, "epoch": 2057} {"train_loss": -12.21531867980957, "global_step": 345637, "epoch": 2057} {"train_loss": -12.519948959350586, "global_step": 345638, "epoch": 2057} {"train_loss": -11.967195510864258, "global_step": 345639, "epoch": 2057} {"train_loss": -12.489787101745605, "global_step": 345640, "epoch": 2057} {"train_loss": -11.882648468017578, "global_step": 345641, "epoch": 2057} {"train_loss": -12.400243759155273, "global_step": 345642, "epoch": 2057} {"train_loss": -12.332733154296875, "global_step": 345643, "epoch": 2057} {"train_loss": -12.160930633544922, "global_step": 345644, "epoch": 2057} {"train_loss": -12.315937995910645, "global_step": 345645, "epoch": 2057} {"train_loss": -12.299394607543945, "global_step": 345646, "epoch": 2057} {"train_loss": -12.504393577575684, "global_step": 345647, "epoch": 2057} {"train_loss": -12.162822723388672, "global_step": 345648, "epoch": 2057} {"train_loss": -11.962003707885742, "global_step": 345649, "epoch": 2057} {"train_loss": -12.312506675720215, "global_step": 345650, "epoch": 2057} {"train_loss": -11.742829322814941, "global_step": 345651, "epoch": 2057} {"train_loss": -11.848264694213867, "global_step": 345652, "epoch": 2057} {"train_loss": -12.38641357421875, "global_step": 345653, "epoch": 2057} {"train_loss": -12.051485061645508, "global_step": 345654, "epoch": 2057} {"train_loss": -11.972570419311523, "global_step": 345655, "epoch": 2057} {"train_loss": -12.414056777954102, "global_step": 345656, "epoch": 2057} {"train_loss": -12.0469388961792, "global_step": 345657, "epoch": 2057} {"train_loss": -12.205053329467773, "global_step": 345658, "epoch": 2057} {"train_loss": -12.275758743286133, "global_step": 345659, "epoch": 2057} {"train_loss": -12.126995086669922, "global_step": 345660, "epoch": 2057} {"train_loss": -12.426521301269531, "global_step": 345661, "epoch": 2057} {"train_loss": -12.477312088012695, "global_step": 345662, "epoch": 2057} {"train_loss": -12.265762329101562, "global_step": 345663, "epoch": 2057} {"train_loss": -12.53170108795166, "global_step": 345664, "epoch": 2057} {"train_loss": -12.421693801879883, "global_step": 345665, "epoch": 2057} {"train_loss": -12.15658950805664, "global_step": 345666, "epoch": 2057} {"train_loss": -12.358183860778809, "global_step": 345667, "epoch": 2057} {"train_loss": -12.329269409179688, "global_step": 345668, "epoch": 2057} {"train_loss": -12.186600685119629, "global_step": 345669, "epoch": 2057} {"train_loss": -12.211491584777832, "global_step": 345670, "epoch": 2057} {"train_loss": -12.361690521240234, "global_step": 345671, "epoch": 2057} {"train_loss": -12.592938423156738, "global_step": 345672, "epoch": 2057} {"train_loss": -12.773456573486328, "global_step": 345673, "epoch": 2057} {"train_loss": -12.478065490722656, "global_step": 345674, "epoch": 2057} {"train_loss": -12.737663269042969, "global_step": 345675, "epoch": 2057} {"train_loss": -12.51497745513916, "global_step": 345676, "epoch": 2057} {"train_loss": -12.388927459716797, "global_step": 345677, "epoch": 2057} {"train_loss": -12.554901123046875, "global_step": 345678, "epoch": 2057} {"train_loss": -12.45584487915039, "global_step": 345679, "epoch": 2057} {"train_loss": -12.403436660766602, "global_step": 345680, "epoch": 2057} {"train_loss": -12.143310546875, "global_step": 345681, "epoch": 2057} {"train_loss": -12.008699417114258, "global_step": 345682, "epoch": 2057} {"train_loss": -11.796855926513672, "global_step": 345683, "epoch": 2057} {"train_loss": -12.009632110595703, "global_step": 345684, "epoch": 2057} {"train_loss": -12.198716163635254, "global_step": 345685, "epoch": 2057} {"train_loss": -11.6494779586792, "global_step": 345686, "epoch": 2057} {"train_loss": -12.32517147064209, "global_step": 345687, "epoch": 2057} {"train_loss": -11.85909652709961, "global_step": 345688, "epoch": 2057} {"train_loss": -11.93606185913086, "global_step": 345689, "epoch": 2057} {"train_loss": -11.659114837646484, "global_step": 345690, "epoch": 2057} {"train_loss": -11.822660446166992, "global_step": 345691, "epoch": 2057} {"train_loss": -10.158233642578125, "global_step": 345692, "epoch": 2057} {"train_loss": -12.25296401977539, "global_step": 345693, "epoch": 2057} {"train_loss": -10.881261825561523, "global_step": 345694, "epoch": 2057} {"train_loss": -9.72398567199707, "global_step": 345695, "epoch": 2057} {"train_loss": -11.811540603637695, "global_step": 345696, "epoch": 2057} {"train_loss": -10.81745719909668, "global_step": 345697, "epoch": 2057} {"train_loss": -10.782958030700684, "global_step": 345698, "epoch": 2057} {"train_loss": -12.190544128417969, "global_step": 345699, "epoch": 2057} {"train_loss": -11.022113800048828, "global_step": 345700, "epoch": 2057} {"train_loss": -12.047178268432617, "global_step": 345701, "epoch": 2057} {"train_loss": -11.374265670776367, "global_step": 345702, "epoch": 2057} {"train_loss": -12.005155563354492, "global_step": 345703, "epoch": 2057} {"train_loss": -11.670289993286133, "global_step": 345704, "epoch": 2057} {"train_loss": -11.391347885131836, "global_step": 345705, "epoch": 2057} {"train_loss": -11.662534713745117, "global_step": 345706, "epoch": 2057} {"train_loss": -11.724563598632812, "global_step": 345707, "epoch": 2057} {"train_loss": -11.165755271911621, "global_step": 345708, "epoch": 2057} {"train_loss": -11.581442832946777, "global_step": 345709, "epoch": 2057} {"train_loss": -11.154420852661133, "global_step": 345710, "epoch": 2057} {"train_loss": -10.341712951660156, "global_step": 345711, "epoch": 2057} {"train_loss": -11.582839012145996, "global_step": 345712, "epoch": 2057} {"train_loss": -10.510825157165527, "global_step": 345713, "epoch": 2057} {"train_loss": -11.496940612792969, "global_step": 345714, "epoch": 2057} {"train_loss": -10.062891006469727, "global_step": 345715, "epoch": 2057} {"train_loss": -11.346753120422363, "global_step": 345716, "epoch": 2057} {"train_loss": -9.991667747497559, "global_step": 345717, "epoch": 2057} {"train_loss": -10.866694450378418, "global_step": 345718, "epoch": 2057} {"train_loss": -10.819150924682617, "global_step": 345719, "epoch": 2057} {"train_loss": -10.02092170715332, "global_step": 345720, "epoch": 2057} {"train_loss": -9.997173309326172, "global_step": 345721, "epoch": 2057} {"train_loss": -10.500022888183594, "global_step": 345722, "epoch": 2057} {"train_loss": -10.705171585083008, "global_step": 345723, "epoch": 2057} {"train_loss": -10.815153121948242, "global_step": 345724, "epoch": 2057} {"train_loss": -10.868412971496582, "global_step": 345725, "epoch": 2057} {"train_loss": -11.35780143737793, "global_step": 345726, "epoch": 2057} {"train_loss": -10.899577140808105, "global_step": 345727, "epoch": 2057} {"train_loss": -11.373716354370117, "global_step": 345728, "epoch": 2057} {"train_loss": -11.306035041809082, "global_step": 345729, "epoch": 2057} {"train_loss": -11.462008476257324, "global_step": 345730, "epoch": 2057} {"train_loss": -10.65278434753418, "global_step": 345731, "epoch": 2057} {"train_loss": -11.652107238769531, "global_step": 345732, "epoch": 2057} {"train_loss": -10.490762710571289, "global_step": 345733, "epoch": 2057} {"train_loss": -11.404413223266602, "global_step": 345734, "epoch": 2057} {"train_loss": -11.185355186462402, "global_step": 345735, "epoch": 2057} {"train_loss": -10.219947814941406, "global_step": 345736, "epoch": 2057} {"train_loss": -11.900781631469727, "global_step": 345737, "epoch": 2057} {"train_loss": -11.011812210083008, "global_step": 345738, "epoch": 2057} {"train_loss": -11.222835540771484, "global_step": 345739, "epoch": 2057} {"train_loss": -11.48126220703125, "global_step": 345740, "epoch": 2057} {"train_loss": -11.029912948608398, "global_step": 345741, "epoch": 2057} {"train_loss": -11.245487213134766, "global_step": 345742, "epoch": 2057} {"train_loss": -11.738379784992762, "global_step": 345743, "epoch": 2057, "val_loss": 290032.59375} {"train_loss": -10.876714706420898, "global_step": 345744, "epoch": 2058} {"train_loss": -11.527477264404297, "global_step": 345745, "epoch": 2058} {"train_loss": -11.841334342956543, "global_step": 345746, "epoch": 2058} {"train_loss": -10.938496589660645, "global_step": 345747, "epoch": 2058} {"train_loss": -11.637666702270508, "global_step": 345748, "epoch": 2058} {"train_loss": -11.69461441040039, "global_step": 345749, "epoch": 2058} {"train_loss": -11.48894214630127, "global_step": 345750, "epoch": 2058} {"train_loss": -11.938817977905273, "global_step": 345751, "epoch": 2058} {"train_loss": -11.623361587524414, "global_step": 345752, "epoch": 2058} {"train_loss": -11.877315521240234, "global_step": 345753, "epoch": 2058} {"train_loss": -11.932151794433594, "global_step": 345754, "epoch": 2058} {"train_loss": -11.668155670166016, "global_step": 345755, "epoch": 2058} {"train_loss": -11.8239107131958, "global_step": 345756, "epoch": 2058} {"train_loss": -12.067575454711914, "global_step": 345757, "epoch": 2058} {"train_loss": -11.631153106689453, "global_step": 345758, "epoch": 2058} {"train_loss": -12.202689170837402, "global_step": 345759, "epoch": 2058} {"train_loss": -11.447598457336426, "global_step": 345760, "epoch": 2058} {"train_loss": -12.095455169677734, "global_step": 345761, "epoch": 2058} {"train_loss": -11.76891803741455, "global_step": 345762, "epoch": 2058} {"train_loss": -11.872197151184082, "global_step": 345763, "epoch": 2058} {"train_loss": -11.793817520141602, "global_step": 345764, "epoch": 2058} {"train_loss": -12.151227951049805, "global_step": 345765, "epoch": 2058} {"train_loss": -11.721684455871582, "global_step": 345766, "epoch": 2058} {"train_loss": -12.127098083496094, "global_step": 345767, "epoch": 2058} {"train_loss": -11.867976188659668, "global_step": 345768, "epoch": 2058} {"train_loss": -12.240299224853516, "global_step": 345769, "epoch": 2058} {"train_loss": -11.80935287475586, "global_step": 345770, "epoch": 2058} {"train_loss": -12.034844398498535, "global_step": 345771, "epoch": 2058} {"train_loss": -11.923776626586914, "global_step": 345772, "epoch": 2058} {"train_loss": -12.261083602905273, "global_step": 345773, "epoch": 2058} {"train_loss": -11.759044647216797, "global_step": 345774, "epoch": 2058} {"train_loss": -12.305144309997559, "global_step": 345775, "epoch": 2058} {"train_loss": -11.94620418548584, "global_step": 345776, "epoch": 2058} {"train_loss": -12.132169723510742, "global_step": 345777, "epoch": 2058} {"train_loss": -12.074295997619629, "global_step": 345778, "epoch": 2058} {"train_loss": -12.165253639221191, "global_step": 345779, "epoch": 2058} {"train_loss": -11.968704223632812, "global_step": 345780, "epoch": 2058} {"train_loss": -12.259040832519531, "global_step": 345781, "epoch": 2058} {"train_loss": -12.178586959838867, "global_step": 345782, "epoch": 2058} {"train_loss": -12.365447044372559, "global_step": 345783, "epoch": 2058} {"train_loss": -12.313111305236816, "global_step": 345784, "epoch": 2058} {"train_loss": -12.190690040588379, "global_step": 345785, "epoch": 2058} {"train_loss": -12.377737045288086, "global_step": 345786, "epoch": 2058} {"train_loss": -12.418231964111328, "global_step": 345787, "epoch": 2058} {"train_loss": -12.269506454467773, "global_step": 345788, "epoch": 2058} {"train_loss": -12.338811874389648, "global_step": 345789, "epoch": 2058} {"train_loss": -12.22314453125, "global_step": 345790, "epoch": 2058} {"train_loss": -12.445666313171387, "global_step": 345791, "epoch": 2058} {"train_loss": -12.46064567565918, "global_step": 345792, "epoch": 2058} {"train_loss": -12.383951187133789, "global_step": 345793, "epoch": 2058} {"train_loss": -12.245054244995117, "global_step": 345794, "epoch": 2058} {"train_loss": -12.208673477172852, "global_step": 345795, "epoch": 2058} {"train_loss": -12.51676082611084, "global_step": 345796, "epoch": 2058} {"train_loss": -12.270216941833496, "global_step": 345797, "epoch": 2058} {"train_loss": -12.28131103515625, "global_step": 345798, "epoch": 2058} {"train_loss": -12.393869400024414, "global_step": 345799, "epoch": 2058} {"train_loss": -12.573524475097656, "global_step": 345800, "epoch": 2058} {"train_loss": -12.488696098327637, "global_step": 345801, "epoch": 2058} {"train_loss": -12.193763732910156, "global_step": 345802, "epoch": 2058} {"train_loss": -12.556526184082031, "global_step": 345803, "epoch": 2058} {"train_loss": -12.080973625183105, "global_step": 345804, "epoch": 2058} {"train_loss": -12.44750690460205, "global_step": 345805, "epoch": 2058} {"train_loss": -12.33433723449707, "global_step": 345806, "epoch": 2058} {"train_loss": -12.413789749145508, "global_step": 345807, "epoch": 2058} {"train_loss": -12.312260627746582, "global_step": 345808, "epoch": 2058} {"train_loss": -12.627464294433594, "global_step": 345809, "epoch": 2058} {"train_loss": -12.441219329833984, "global_step": 345810, "epoch": 2058} {"train_loss": -12.048201560974121, "global_step": 345811, "epoch": 2058} {"train_loss": -12.350484848022461, "global_step": 345812, "epoch": 2058} {"train_loss": -12.480827331542969, "global_step": 345813, "epoch": 2058} {"train_loss": -12.564163208007812, "global_step": 345814, "epoch": 2058} {"train_loss": -12.275188446044922, "global_step": 345815, "epoch": 2058} {"train_loss": -12.366754531860352, "global_step": 345816, "epoch": 2058} {"train_loss": -12.556865692138672, "global_step": 345817, "epoch": 2058} {"train_loss": -12.607254981994629, "global_step": 345818, "epoch": 2058} {"train_loss": -12.609785079956055, "global_step": 345819, "epoch": 2058} {"train_loss": -12.668867111206055, "global_step": 345820, "epoch": 2058} {"train_loss": -12.662705421447754, "global_step": 345821, "epoch": 2058} {"train_loss": -12.365249633789062, "global_step": 345822, "epoch": 2058} {"train_loss": -12.267305374145508, "global_step": 345823, "epoch": 2058} {"train_loss": -12.346874237060547, "global_step": 345824, "epoch": 2058} {"train_loss": -12.648621559143066, "global_step": 345825, "epoch": 2058} {"train_loss": -12.382246971130371, "global_step": 345826, "epoch": 2058} {"train_loss": -12.124494552612305, "global_step": 345827, "epoch": 2058} {"train_loss": -12.366844177246094, "global_step": 345828, "epoch": 2058} {"train_loss": -12.784734725952148, "global_step": 345829, "epoch": 2058} {"train_loss": -12.42072868347168, "global_step": 345830, "epoch": 2058} {"train_loss": -12.476826667785645, "global_step": 345831, "epoch": 2058} {"train_loss": -12.179158210754395, "global_step": 345832, "epoch": 2058} {"train_loss": -12.107465744018555, "global_step": 345833, "epoch": 2058} {"train_loss": -12.182624816894531, "global_step": 345834, "epoch": 2058} {"train_loss": -12.60448169708252, "global_step": 345835, "epoch": 2058} {"train_loss": -12.686070442199707, "global_step": 345836, "epoch": 2058} {"train_loss": -12.115987777709961, "global_step": 345837, "epoch": 2058} {"train_loss": -11.82841968536377, "global_step": 345838, "epoch": 2058} {"train_loss": -12.064762115478516, "global_step": 345839, "epoch": 2058} {"train_loss": -12.440803527832031, "global_step": 345840, "epoch": 2058} {"train_loss": -11.742589950561523, "global_step": 345841, "epoch": 2058} {"train_loss": -11.762331008911133, "global_step": 345842, "epoch": 2058} {"train_loss": -11.77690315246582, "global_step": 345843, "epoch": 2058} {"train_loss": -12.054811477661133, "global_step": 345844, "epoch": 2058} {"train_loss": -10.55059814453125, "global_step": 345845, "epoch": 2058} {"train_loss": -11.390131950378418, "global_step": 345846, "epoch": 2058} {"train_loss": -12.26064682006836, "global_step": 345847, "epoch": 2058} {"train_loss": -11.540258407592773, "global_step": 345848, "epoch": 2058} {"train_loss": -10.96631145477295, "global_step": 345849, "epoch": 2058} {"train_loss": -12.308419227600098, "global_step": 345850, "epoch": 2058} {"train_loss": -10.972559928894043, "global_step": 345851, "epoch": 2058} {"train_loss": -11.873470306396484, "global_step": 345852, "epoch": 2058} {"train_loss": -11.995248794555664, "global_step": 345853, "epoch": 2058} {"train_loss": -11.783312797546387, "global_step": 345854, "epoch": 2058} {"train_loss": -10.700822830200195, "global_step": 345855, "epoch": 2058} {"train_loss": -12.342510223388672, "global_step": 345856, "epoch": 2058} {"train_loss": -11.545079231262207, "global_step": 345857, "epoch": 2058} {"train_loss": -11.195009231567383, "global_step": 345858, "epoch": 2058} {"train_loss": -11.86487865447998, "global_step": 345859, "epoch": 2058} {"train_loss": -10.51780891418457, "global_step": 345860, "epoch": 2058} {"train_loss": -11.848072052001953, "global_step": 345861, "epoch": 2058} {"train_loss": -11.190914154052734, "global_step": 345862, "epoch": 2058} {"train_loss": -10.294336318969727, "global_step": 345863, "epoch": 2058} {"train_loss": -12.335066795349121, "global_step": 345864, "epoch": 2058} {"train_loss": -11.9917573928833, "global_step": 345865, "epoch": 2058} {"train_loss": -11.32101058959961, "global_step": 345866, "epoch": 2058} {"train_loss": -12.069393157958984, "global_step": 345867, "epoch": 2058} {"train_loss": -11.773418426513672, "global_step": 345868, "epoch": 2058} {"train_loss": -11.380435943603516, "global_step": 345869, "epoch": 2058} {"train_loss": -11.351295471191406, "global_step": 345870, "epoch": 2058} {"train_loss": -11.833624839782715, "global_step": 345871, "epoch": 2058} {"train_loss": -11.826658248901367, "global_step": 345872, "epoch": 2058} {"train_loss": -11.937298774719238, "global_step": 345873, "epoch": 2058} {"train_loss": -11.96351432800293, "global_step": 345874, "epoch": 2058} {"train_loss": -12.007746696472168, "global_step": 345875, "epoch": 2058} {"train_loss": -11.705097198486328, "global_step": 345876, "epoch": 2058} {"train_loss": -12.590729713439941, "global_step": 345877, "epoch": 2058} {"train_loss": -11.686609268188477, "global_step": 345878, "epoch": 2058} {"train_loss": -12.12189769744873, "global_step": 345879, "epoch": 2058} {"train_loss": -11.962262153625488, "global_step": 345880, "epoch": 2058} {"train_loss": -11.968570709228516, "global_step": 345881, "epoch": 2058} {"train_loss": -12.073028564453125, "global_step": 345882, "epoch": 2058} {"train_loss": -11.780014038085938, "global_step": 345883, "epoch": 2058} {"train_loss": -12.07815933227539, "global_step": 345884, "epoch": 2058} {"train_loss": -11.715574264526367, "global_step": 345885, "epoch": 2058} {"train_loss": -12.012046813964844, "global_step": 345886, "epoch": 2058} {"train_loss": -12.461280822753906, "global_step": 345887, "epoch": 2058} {"train_loss": -12.0770263671875, "global_step": 345888, "epoch": 2058} {"train_loss": -12.565750122070312, "global_step": 345889, "epoch": 2058} {"train_loss": -12.012619018554688, "global_step": 345890, "epoch": 2058} {"train_loss": -12.05223274230957, "global_step": 345891, "epoch": 2058} {"train_loss": -12.090659141540527, "global_step": 345892, "epoch": 2058} {"train_loss": -12.161839485168457, "global_step": 345893, "epoch": 2058} {"train_loss": -12.096124649047852, "global_step": 345894, "epoch": 2058} {"train_loss": -12.208578109741211, "global_step": 345895, "epoch": 2058} {"train_loss": -12.216564178466797, "global_step": 345896, "epoch": 2058} {"train_loss": -12.197297096252441, "global_step": 345897, "epoch": 2058} {"train_loss": -12.06764030456543, "global_step": 345898, "epoch": 2058} {"train_loss": -12.2530517578125, "global_step": 345899, "epoch": 2058} {"train_loss": -12.220226287841797, "global_step": 345900, "epoch": 2058} {"train_loss": -11.882174491882324, "global_step": 345901, "epoch": 2058} {"train_loss": -12.29306411743164, "global_step": 345902, "epoch": 2058} {"train_loss": -12.14584732055664, "global_step": 345903, "epoch": 2058} {"train_loss": -12.479253768920898, "global_step": 345904, "epoch": 2058} {"train_loss": -12.51195240020752, "global_step": 345905, "epoch": 2058} {"train_loss": -12.335773468017578, "global_step": 345906, "epoch": 2058} {"train_loss": -12.602380752563477, "global_step": 345907, "epoch": 2058} {"train_loss": -12.351896286010742, "global_step": 345908, "epoch": 2058} {"train_loss": -12.611349105834961, "global_step": 345909, "epoch": 2058} {"train_loss": -12.676977157592773, "global_step": 345910, "epoch": 2058} {"train_loss": -12.053579920814151, "global_step": 345911, "epoch": 2058, "val_loss": 289601.21875} {"train_loss": -12.544368743896484, "global_step": 345912, "epoch": 2059} {"train_loss": -12.32333755493164, "global_step": 345913, "epoch": 2059} {"train_loss": -12.729022979736328, "global_step": 345914, "epoch": 2059} {"train_loss": -12.639490127563477, "global_step": 345915, "epoch": 2059} {"train_loss": -12.231856346130371, "global_step": 345916, "epoch": 2059} {"train_loss": -12.254524230957031, "global_step": 345917, "epoch": 2059} {"train_loss": -12.608575820922852, "global_step": 345918, "epoch": 2059} {"train_loss": -12.48324203491211, "global_step": 345919, "epoch": 2059} {"train_loss": -12.473854064941406, "global_step": 345920, "epoch": 2059} {"train_loss": -12.364103317260742, "global_step": 345921, "epoch": 2059} {"train_loss": -12.526683807373047, "global_step": 345922, "epoch": 2059} {"train_loss": -12.33537483215332, "global_step": 345923, "epoch": 2059} {"train_loss": -12.588781356811523, "global_step": 345924, "epoch": 2059} {"train_loss": -12.336711883544922, "global_step": 345925, "epoch": 2059} {"train_loss": -12.573798179626465, "global_step": 345926, "epoch": 2059} {"train_loss": -12.441041946411133, "global_step": 345927, "epoch": 2059} {"train_loss": -12.251771926879883, "global_step": 345928, "epoch": 2059} {"train_loss": -12.54127025604248, "global_step": 345929, "epoch": 2059} {"train_loss": -12.497078895568848, "global_step": 345930, "epoch": 2059} {"train_loss": -12.337186813354492, "global_step": 345931, "epoch": 2059} {"train_loss": -12.16680908203125, "global_step": 345932, "epoch": 2059} {"train_loss": -12.269977569580078, "global_step": 345933, "epoch": 2059} {"train_loss": -12.272621154785156, "global_step": 345934, "epoch": 2059} {"train_loss": -12.145286560058594, "global_step": 345935, "epoch": 2059} {"train_loss": -12.224989891052246, "global_step": 345936, "epoch": 2059} {"train_loss": -12.072450637817383, "global_step": 345937, "epoch": 2059} {"train_loss": -11.723554611206055, "global_step": 345938, "epoch": 2059} {"train_loss": -11.981330871582031, "global_step": 345939, "epoch": 2059} {"train_loss": -12.124649047851562, "global_step": 345940, "epoch": 2059} {"train_loss": -11.985689163208008, "global_step": 345941, "epoch": 2059} {"train_loss": -12.61484146118164, "global_step": 345942, "epoch": 2059} {"train_loss": -11.82036018371582, "global_step": 345943, "epoch": 2059} {"train_loss": -11.777959823608398, "global_step": 345944, "epoch": 2059} {"train_loss": -12.092757225036621, "global_step": 345945, "epoch": 2059} {"train_loss": -12.145402908325195, "global_step": 345946, "epoch": 2059} {"train_loss": -12.06319522857666, "global_step": 345947, "epoch": 2059} {"train_loss": -11.758797645568848, "global_step": 345948, "epoch": 2059} {"train_loss": -12.493337631225586, "global_step": 345949, "epoch": 2059} {"train_loss": -11.524621963500977, "global_step": 345950, "epoch": 2059} {"train_loss": -11.657285690307617, "global_step": 345951, "epoch": 2059} {"train_loss": -11.86990737915039, "global_step": 345952, "epoch": 2059} {"train_loss": -11.208290100097656, "global_step": 345953, "epoch": 2059} {"train_loss": -11.512109756469727, "global_step": 345954, "epoch": 2059} {"train_loss": -11.28785514831543, "global_step": 345955, "epoch": 2059} {"train_loss": -12.044198989868164, "global_step": 345956, "epoch": 2059} {"train_loss": -11.682069778442383, "global_step": 345957, "epoch": 2059} {"train_loss": -11.6511869430542, "global_step": 345958, "epoch": 2059} {"train_loss": -12.20523452758789, "global_step": 345959, "epoch": 2059} {"train_loss": -11.145143508911133, "global_step": 345960, "epoch": 2059} {"train_loss": -10.546607971191406, "global_step": 345961, "epoch": 2059} {"train_loss": -9.495096206665039, "global_step": 345962, "epoch": 2059} {"train_loss": -11.384011268615723, "global_step": 345963, "epoch": 2059} {"train_loss": -9.672143936157227, "global_step": 345964, "epoch": 2059} {"train_loss": -9.378557205200195, "global_step": 345965, "epoch": 2059} {"train_loss": -10.02230167388916, "global_step": 345966, "epoch": 2059} {"train_loss": -10.742347717285156, "global_step": 345967, "epoch": 2059} {"train_loss": -10.710286140441895, "global_step": 345968, "epoch": 2059} {"train_loss": -9.898775100708008, "global_step": 345969, "epoch": 2059} {"train_loss": -11.624807357788086, "global_step": 345970, "epoch": 2059} {"train_loss": -7.557064056396484, "global_step": 345971, "epoch": 2059} {"train_loss": -10.418821334838867, "global_step": 345972, "epoch": 2059} {"train_loss": -7.184483051300049, "global_step": 345973, "epoch": 2059} {"train_loss": -6.946750640869141, "global_step": 345974, "epoch": 2059} {"train_loss": -7.17587947845459, "global_step": 345975, "epoch": 2059} {"train_loss": -8.130183219909668, "global_step": 345976, "epoch": 2059} {"train_loss": -8.151348114013672, "global_step": 345977, "epoch": 2059} {"train_loss": -10.193670272827148, "global_step": 345978, "epoch": 2059} {"train_loss": -8.70965576171875, "global_step": 345979, "epoch": 2059} {"train_loss": -7.99251651763916, "global_step": 345980, "epoch": 2059} {"train_loss": -8.62181568145752, "global_step": 345981, "epoch": 2059} {"train_loss": -8.328165054321289, "global_step": 345982, "epoch": 2059} {"train_loss": -10.051746368408203, "global_step": 345983, "epoch": 2059} {"train_loss": -9.282423973083496, "global_step": 345984, "epoch": 2059} {"train_loss": -10.18377685546875, "global_step": 345985, "epoch": 2059} {"train_loss": -10.889824867248535, "global_step": 345986, "epoch": 2059} {"train_loss": -9.614837646484375, "global_step": 345987, "epoch": 2059} {"train_loss": -9.819719314575195, "global_step": 345988, "epoch": 2059} {"train_loss": -9.954063415527344, "global_step": 345989, "epoch": 2059} {"train_loss": -9.611963272094727, "global_step": 345990, "epoch": 2059} {"train_loss": -10.06541633605957, "global_step": 345991, "epoch": 2059} {"train_loss": -9.964405059814453, "global_step": 345992, "epoch": 2059} {"train_loss": -11.195330619812012, "global_step": 345993, "epoch": 2059} {"train_loss": -10.817136764526367, "global_step": 345994, "epoch": 2059} {"train_loss": -10.860223770141602, "global_step": 345995, "epoch": 2059} {"train_loss": -11.399201393127441, "global_step": 345996, "epoch": 2059} {"train_loss": -10.801353454589844, "global_step": 345997, "epoch": 2059} {"train_loss": -10.576689720153809, "global_step": 345998, "epoch": 2059} {"train_loss": -10.80211067199707, "global_step": 345999, "epoch": 2059} {"train_loss": -10.283417701721191, "global_step": 346000, "epoch": 2059} {"train_loss": -11.178781509399414, "global_step": 346001, "epoch": 2059} {"train_loss": -10.698638916015625, "global_step": 346002, "epoch": 2059} {"train_loss": -10.865325927734375, "global_step": 346003, "epoch": 2059} {"train_loss": -10.85283374786377, "global_step": 346004, "epoch": 2059} {"train_loss": -11.213981628417969, "global_step": 346005, "epoch": 2059} {"train_loss": -10.408817291259766, "global_step": 346006, "epoch": 2059} {"train_loss": -11.3505220413208, "global_step": 346007, "epoch": 2059} {"train_loss": -10.758098602294922, "global_step": 346008, "epoch": 2059} {"train_loss": -10.469049453735352, "global_step": 346009, "epoch": 2059} {"train_loss": -11.123533248901367, "global_step": 346010, "epoch": 2059} {"train_loss": -9.922931671142578, "global_step": 346011, "epoch": 2059} {"train_loss": -11.148900985717773, "global_step": 346012, "epoch": 2059} {"train_loss": -10.646211624145508, "global_step": 346013, "epoch": 2059} {"train_loss": -11.157779693603516, "global_step": 346014, "epoch": 2059} {"train_loss": -11.343559265136719, "global_step": 346015, "epoch": 2059} {"train_loss": -10.664583206176758, "global_step": 346016, "epoch": 2059} {"train_loss": -11.518148422241211, "global_step": 346017, "epoch": 2059} {"train_loss": -11.237525939941406, "global_step": 346018, "epoch": 2059} {"train_loss": -10.955607414245605, "global_step": 346019, "epoch": 2059} {"train_loss": -11.841243743896484, "global_step": 346020, "epoch": 2059} {"train_loss": -11.31907844543457, "global_step": 346021, "epoch": 2059} {"train_loss": -11.587911605834961, "global_step": 346022, "epoch": 2059} {"train_loss": -11.659708976745605, "global_step": 346023, "epoch": 2059} {"train_loss": -11.632230758666992, "global_step": 346024, "epoch": 2059} {"train_loss": -11.49641227722168, "global_step": 346025, "epoch": 2059} {"train_loss": -11.813597679138184, "global_step": 346026, "epoch": 2059} {"train_loss": -11.710850715637207, "global_step": 346027, "epoch": 2059} {"train_loss": -11.374015808105469, "global_step": 346028, "epoch": 2059} {"train_loss": -11.73438835144043, "global_step": 346029, "epoch": 2059} {"train_loss": -11.873790740966797, "global_step": 346030, "epoch": 2059} {"train_loss": -11.365860939025879, "global_step": 346031, "epoch": 2059} {"train_loss": -11.527573585510254, "global_step": 346032, "epoch": 2059} {"train_loss": -11.62594985961914, "global_step": 346033, "epoch": 2059} {"train_loss": -11.860595703125, "global_step": 346034, "epoch": 2059} {"train_loss": -10.97242546081543, "global_step": 346035, "epoch": 2059} {"train_loss": -11.70438003540039, "global_step": 346036, "epoch": 2059} {"train_loss": -11.655288696289062, "global_step": 346037, "epoch": 2059} {"train_loss": -11.20694351196289, "global_step": 346038, "epoch": 2059} {"train_loss": -11.764841079711914, "global_step": 346039, "epoch": 2059} {"train_loss": -11.650101661682129, "global_step": 346040, "epoch": 2059} {"train_loss": -11.639780044555664, "global_step": 346041, "epoch": 2059} {"train_loss": -11.882150650024414, "global_step": 346042, "epoch": 2059} {"train_loss": -11.527935028076172, "global_step": 346043, "epoch": 2059} {"train_loss": -11.657651901245117, "global_step": 346044, "epoch": 2059} {"train_loss": -11.83292007446289, "global_step": 346045, "epoch": 2059} {"train_loss": -11.72236156463623, "global_step": 346046, "epoch": 2059} {"train_loss": -11.984172821044922, "global_step": 346047, "epoch": 2059} {"train_loss": -11.911861419677734, "global_step": 346048, "epoch": 2059} {"train_loss": -12.094564437866211, "global_step": 346049, "epoch": 2059} {"train_loss": -11.892722129821777, "global_step": 346050, "epoch": 2059} {"train_loss": -11.999308586120605, "global_step": 346051, "epoch": 2059} {"train_loss": -12.132996559143066, "global_step": 346052, "epoch": 2059} {"train_loss": -12.073394775390625, "global_step": 346053, "epoch": 2059} {"train_loss": -12.17263412475586, "global_step": 346054, "epoch": 2059} {"train_loss": -12.19588851928711, "global_step": 346055, "epoch": 2059} {"train_loss": -12.005785942077637, "global_step": 346056, "epoch": 2059} {"train_loss": -12.242225646972656, "global_step": 346057, "epoch": 2059} {"train_loss": -12.23437213897705, "global_step": 346058, "epoch": 2059} {"train_loss": -12.106054306030273, "global_step": 346059, "epoch": 2059} {"train_loss": -12.145304679870605, "global_step": 346060, "epoch": 2059} {"train_loss": -12.219264030456543, "global_step": 346061, "epoch": 2059} {"train_loss": -12.239768981933594, "global_step": 346062, "epoch": 2059} {"train_loss": -12.040935516357422, "global_step": 346063, "epoch": 2059} {"train_loss": -12.217239379882812, "global_step": 346064, "epoch": 2059} {"train_loss": -12.17542839050293, "global_step": 346065, "epoch": 2059} {"train_loss": -12.170169830322266, "global_step": 346066, "epoch": 2059} {"train_loss": -12.297445297241211, "global_step": 346067, "epoch": 2059} {"train_loss": -12.128026008605957, "global_step": 346068, "epoch": 2059} {"train_loss": -12.142640113830566, "global_step": 346069, "epoch": 2059} {"train_loss": -12.460922241210938, "global_step": 346070, "epoch": 2059} {"train_loss": -11.990496635437012, "global_step": 346071, "epoch": 2059} {"train_loss": -11.878358840942383, "global_step": 346072, "epoch": 2059} {"train_loss": -12.060359954833984, "global_step": 346073, "epoch": 2059} {"train_loss": -12.312416076660156, "global_step": 346074, "epoch": 2059} {"train_loss": -12.167655944824219, "global_step": 346075, "epoch": 2059} {"train_loss": -12.195157051086426, "global_step": 346076, "epoch": 2059} {"train_loss": -12.488957405090332, "global_step": 346077, "epoch": 2059} {"train_loss": -12.423038482666016, "global_step": 346078, "epoch": 2059} {"train_loss": -11.343527524244218, "global_step": 346079, "epoch": 2059, "val_loss": 288379.0} {"train_loss": -12.308412551879883, "global_step": 346080, "epoch": 2060} {"train_loss": -12.379051208496094, "global_step": 346081, "epoch": 2060} {"train_loss": -12.335457801818848, "global_step": 346082, "epoch": 2060} {"train_loss": -12.119575500488281, "global_step": 346083, "epoch": 2060} {"train_loss": -12.572047233581543, "global_step": 346084, "epoch": 2060} {"train_loss": -12.252730369567871, "global_step": 346085, "epoch": 2060} {"train_loss": -12.296905517578125, "global_step": 346086, "epoch": 2060} {"train_loss": -12.548479080200195, "global_step": 346087, "epoch": 2060} {"train_loss": -12.406091690063477, "global_step": 346088, "epoch": 2060} {"train_loss": -12.483745574951172, "global_step": 346089, "epoch": 2060} {"train_loss": -12.566984176635742, "global_step": 346090, "epoch": 2060} {"train_loss": -12.554954528808594, "global_step": 346091, "epoch": 2060} {"train_loss": -12.557734489440918, "global_step": 346092, "epoch": 2060} {"train_loss": -12.648244857788086, "global_step": 346093, "epoch": 2060} {"train_loss": -12.473848342895508, "global_step": 346094, "epoch": 2060} {"train_loss": -12.617969512939453, "global_step": 346095, "epoch": 2060} {"train_loss": -12.485602378845215, "global_step": 346096, "epoch": 2060} {"train_loss": -12.506524085998535, "global_step": 346097, "epoch": 2060} {"train_loss": -12.48796558380127, "global_step": 346098, "epoch": 2060} {"train_loss": -12.493170738220215, "global_step": 346099, "epoch": 2060} {"train_loss": -12.58666706085205, "global_step": 346100, "epoch": 2060} {"train_loss": -12.425968170166016, "global_step": 346101, "epoch": 2060} {"train_loss": -12.658208847045898, "global_step": 346102, "epoch": 2060} {"train_loss": -12.456342697143555, "global_step": 346103, "epoch": 2060} {"train_loss": -12.689889907836914, "global_step": 346104, "epoch": 2060} {"train_loss": -12.501541137695312, "global_step": 346105, "epoch": 2060} {"train_loss": -12.661964416503906, "global_step": 346106, "epoch": 2060} {"train_loss": -12.359939575195312, "global_step": 346107, "epoch": 2060} {"train_loss": -12.759562492370605, "global_step": 346108, "epoch": 2060} {"train_loss": -12.633159637451172, "global_step": 346109, "epoch": 2060} {"train_loss": -12.503473281860352, "global_step": 346110, "epoch": 2060} {"train_loss": -12.724510192871094, "global_step": 346111, "epoch": 2060} {"train_loss": -12.671485900878906, "global_step": 346112, "epoch": 2060} {"train_loss": -12.730298042297363, "global_step": 346113, "epoch": 2060} {"train_loss": -12.661245346069336, "global_step": 346114, "epoch": 2060} {"train_loss": -12.724119186401367, "global_step": 346115, "epoch": 2060} {"train_loss": -12.741333961486816, "global_step": 346116, "epoch": 2060} {"train_loss": -12.699743270874023, "global_step": 346117, "epoch": 2060} {"train_loss": -12.736546516418457, "global_step": 346118, "epoch": 2060} {"train_loss": -12.685370445251465, "global_step": 346119, "epoch": 2060} {"train_loss": -12.843413352966309, "global_step": 346120, "epoch": 2060} {"train_loss": -12.461691856384277, "global_step": 346121, "epoch": 2060} {"train_loss": -12.399465560913086, "global_step": 346122, "epoch": 2060} {"train_loss": -12.6002836227417, "global_step": 346123, "epoch": 2060} {"train_loss": -12.651510238647461, "global_step": 346124, "epoch": 2060} {"train_loss": -12.738607406616211, "global_step": 346125, "epoch": 2060} {"train_loss": -12.548678398132324, "global_step": 346126, "epoch": 2060} {"train_loss": -12.406453132629395, "global_step": 346127, "epoch": 2060} {"train_loss": -12.46087646484375, "global_step": 346128, "epoch": 2060} {"train_loss": -12.456263542175293, "global_step": 346129, "epoch": 2060} {"train_loss": -12.59908676147461, "global_step": 346130, "epoch": 2060} {"train_loss": -12.621492385864258, "global_step": 346131, "epoch": 2060} {"train_loss": -12.629751205444336, "global_step": 346132, "epoch": 2060} {"train_loss": -12.389328956604004, "global_step": 346133, "epoch": 2060} {"train_loss": -12.358528137207031, "global_step": 346134, "epoch": 2060} {"train_loss": -12.3701753616333, "global_step": 346135, "epoch": 2060} {"train_loss": -11.82441520690918, "global_step": 346136, "epoch": 2060} {"train_loss": -11.33096694946289, "global_step": 346137, "epoch": 2060} {"train_loss": -10.193824768066406, "global_step": 346138, "epoch": 2060} {"train_loss": -11.817578315734863, "global_step": 346139, "epoch": 2060} {"train_loss": -11.016716003417969, "global_step": 346140, "epoch": 2060} {"train_loss": -11.06289005279541, "global_step": 346141, "epoch": 2060} {"train_loss": -12.287246704101562, "global_step": 346142, "epoch": 2060} {"train_loss": -12.195028305053711, "global_step": 346143, "epoch": 2060} {"train_loss": -11.401130676269531, "global_step": 346144, "epoch": 2060} {"train_loss": -11.479385375976562, "global_step": 346145, "epoch": 2060} {"train_loss": -12.025835990905762, "global_step": 346146, "epoch": 2060} {"train_loss": -11.33582878112793, "global_step": 346147, "epoch": 2060} {"train_loss": -12.355457305908203, "global_step": 346148, "epoch": 2060} {"train_loss": -10.694133758544922, "global_step": 346149, "epoch": 2060} {"train_loss": -11.851388931274414, "global_step": 346150, "epoch": 2060} {"train_loss": -11.152294158935547, "global_step": 346151, "epoch": 2060} {"train_loss": -10.24809741973877, "global_step": 346152, "epoch": 2060} {"train_loss": -11.847457885742188, "global_step": 346153, "epoch": 2060} {"train_loss": -10.801811218261719, "global_step": 346154, "epoch": 2060} {"train_loss": -11.55888843536377, "global_step": 346155, "epoch": 2060} {"train_loss": -11.95697021484375, "global_step": 346156, "epoch": 2060} {"train_loss": -11.420522689819336, "global_step": 346157, "epoch": 2060} {"train_loss": -12.13963794708252, "global_step": 346158, "epoch": 2060} {"train_loss": -11.762008666992188, "global_step": 346159, "epoch": 2060} {"train_loss": -11.850870132446289, "global_step": 346160, "epoch": 2060} {"train_loss": -12.087753295898438, "global_step": 346161, "epoch": 2060} {"train_loss": -12.011338233947754, "global_step": 346162, "epoch": 2060} {"train_loss": -11.580953598022461, "global_step": 346163, "epoch": 2060} {"train_loss": -11.45139217376709, "global_step": 346164, "epoch": 2060} {"train_loss": -11.716175079345703, "global_step": 346165, "epoch": 2060} {"train_loss": -11.86263656616211, "global_step": 346166, "epoch": 2060} {"train_loss": -11.556099891662598, "global_step": 346167, "epoch": 2060} {"train_loss": -12.078330993652344, "global_step": 346168, "epoch": 2060} {"train_loss": -12.006536483764648, "global_step": 346169, "epoch": 2060} {"train_loss": -11.854131698608398, "global_step": 346170, "epoch": 2060} {"train_loss": -11.957060813903809, "global_step": 346171, "epoch": 2060} {"train_loss": -11.847678184509277, "global_step": 346172, "epoch": 2060} {"train_loss": -12.09356689453125, "global_step": 346173, "epoch": 2060} {"train_loss": -12.027623176574707, "global_step": 346174, "epoch": 2060} {"train_loss": -12.29543685913086, "global_step": 346175, "epoch": 2060} {"train_loss": -12.069265365600586, "global_step": 346176, "epoch": 2060} {"train_loss": -12.13957691192627, "global_step": 346177, "epoch": 2060} {"train_loss": -12.013648986816406, "global_step": 346178, "epoch": 2060} {"train_loss": -12.293745040893555, "global_step": 346179, "epoch": 2060} {"train_loss": -11.925666809082031, "global_step": 346180, "epoch": 2060} {"train_loss": -11.944334030151367, "global_step": 346181, "epoch": 2060} {"train_loss": -12.151102066040039, "global_step": 346182, "epoch": 2060} {"train_loss": -11.650100708007812, "global_step": 346183, "epoch": 2060} {"train_loss": -11.813169479370117, "global_step": 346184, "epoch": 2060} {"train_loss": -12.041875839233398, "global_step": 346185, "epoch": 2060} {"train_loss": -11.891826629638672, "global_step": 346186, "epoch": 2060} {"train_loss": -11.110340118408203, "global_step": 346187, "epoch": 2060} {"train_loss": -12.142946243286133, "global_step": 346188, "epoch": 2060} {"train_loss": -11.92555046081543, "global_step": 346189, "epoch": 2060} {"train_loss": -11.593477249145508, "global_step": 346190, "epoch": 2060} {"train_loss": -10.882808685302734, "global_step": 346191, "epoch": 2060} {"train_loss": -10.699263572692871, "global_step": 346192, "epoch": 2060} {"train_loss": -11.092668533325195, "global_step": 346193, "epoch": 2060} {"train_loss": -10.596264839172363, "global_step": 346194, "epoch": 2060} {"train_loss": -10.503483772277832, "global_step": 346195, "epoch": 2060} {"train_loss": -8.275321960449219, "global_step": 346196, "epoch": 2060} {"train_loss": -11.551063537597656, "global_step": 346197, "epoch": 2060} {"train_loss": -11.447725296020508, "global_step": 346198, "epoch": 2060} {"train_loss": -8.130767822265625, "global_step": 346199, "epoch": 2060} {"train_loss": -9.845256805419922, "global_step": 346200, "epoch": 2060} {"train_loss": -10.355945587158203, "global_step": 346201, "epoch": 2060} {"train_loss": -10.957852363586426, "global_step": 346202, "epoch": 2060} {"train_loss": -11.186439514160156, "global_step": 346203, "epoch": 2060} {"train_loss": -11.300411224365234, "global_step": 346204, "epoch": 2060} {"train_loss": -11.105485916137695, "global_step": 346205, "epoch": 2060} {"train_loss": -10.877695083618164, "global_step": 346206, "epoch": 2060} {"train_loss": -10.41127872467041, "global_step": 346207, "epoch": 2060} {"train_loss": -11.649344444274902, "global_step": 346208, "epoch": 2060} {"train_loss": -10.092916488647461, "global_step": 346209, "epoch": 2060} {"train_loss": -10.781378746032715, "global_step": 346210, "epoch": 2060} {"train_loss": -11.333040237426758, "global_step": 346211, "epoch": 2060} {"train_loss": -10.256597518920898, "global_step": 346212, "epoch": 2060} {"train_loss": -11.497166633605957, "global_step": 346213, "epoch": 2060} {"train_loss": -10.128859519958496, "global_step": 346214, "epoch": 2060} {"train_loss": -10.560935974121094, "global_step": 346215, "epoch": 2060} {"train_loss": -9.763051986694336, "global_step": 346216, "epoch": 2060} {"train_loss": -10.381263732910156, "global_step": 346217, "epoch": 2060} {"train_loss": -10.93327808380127, "global_step": 346218, "epoch": 2060} {"train_loss": -11.041257858276367, "global_step": 346219, "epoch": 2060} {"train_loss": -10.495323181152344, "global_step": 346220, "epoch": 2060} {"train_loss": -11.620026588439941, "global_step": 346221, "epoch": 2060} {"train_loss": -9.972529411315918, "global_step": 346222, "epoch": 2060} {"train_loss": -11.211258888244629, "global_step": 346223, "epoch": 2060} {"train_loss": -10.665681838989258, "global_step": 346224, "epoch": 2060} {"train_loss": -11.08026123046875, "global_step": 346225, "epoch": 2060} {"train_loss": -11.285209655761719, "global_step": 346226, "epoch": 2060} {"train_loss": -11.144423484802246, "global_step": 346227, "epoch": 2060} {"train_loss": -10.63170051574707, "global_step": 346228, "epoch": 2060} {"train_loss": -11.250917434692383, "global_step": 346229, "epoch": 2060} {"train_loss": -11.325311660766602, "global_step": 346230, "epoch": 2060} {"train_loss": -11.591804504394531, "global_step": 346231, "epoch": 2060} {"train_loss": -11.721953392028809, "global_step": 346232, "epoch": 2060} {"train_loss": -11.323653221130371, "global_step": 346233, "epoch": 2060} {"train_loss": -11.372063636779785, "global_step": 346234, "epoch": 2060} {"train_loss": -11.595338821411133, "global_step": 346235, "epoch": 2060} {"train_loss": -11.783205032348633, "global_step": 346236, "epoch": 2060} {"train_loss": -11.80964183807373, "global_step": 346237, "epoch": 2060} {"train_loss": -11.473372459411621, "global_step": 346238, "epoch": 2060} {"train_loss": -11.72471809387207, "global_step": 346239, "epoch": 2060} {"train_loss": -12.231834411621094, "global_step": 346240, "epoch": 2060} {"train_loss": -12.099494934082031, "global_step": 346241, "epoch": 2060} {"train_loss": -12.0645751953125, "global_step": 346242, "epoch": 2060} {"train_loss": -11.731160163879395, "global_step": 346243, "epoch": 2060} {"train_loss": -12.146636962890625, "global_step": 346244, "epoch": 2060} {"train_loss": -11.95905876159668, "global_step": 346245, "epoch": 2060} {"train_loss": -11.853126525878906, "global_step": 346246, "epoch": 2060} {"train_loss": -11.760737112590245, "global_step": 346247, "epoch": 2060, "val_loss": 290793.5625, "train_action_mse_error": 8.840946197509766} {"train_loss": -12.058320999145508, "global_step": 346248, "epoch": 2061} {"train_loss": -11.935571670532227, "global_step": 346249, "epoch": 2061} {"train_loss": -12.027061462402344, "global_step": 346250, "epoch": 2061} {"train_loss": -11.926764488220215, "global_step": 346251, "epoch": 2061} {"train_loss": -11.962509155273438, "global_step": 346252, "epoch": 2061} {"train_loss": -11.878742218017578, "global_step": 346253, "epoch": 2061} {"train_loss": -12.148956298828125, "global_step": 346254, "epoch": 2061} {"train_loss": -11.923931121826172, "global_step": 346255, "epoch": 2061} {"train_loss": -12.111495971679688, "global_step": 346256, "epoch": 2061} {"train_loss": -11.895031929016113, "global_step": 346257, "epoch": 2061} {"train_loss": -12.028654098510742, "global_step": 346258, "epoch": 2061} {"train_loss": -12.149404525756836, "global_step": 346259, "epoch": 2061} {"train_loss": -12.1889009475708, "global_step": 346260, "epoch": 2061} {"train_loss": -11.875244140625, "global_step": 346261, "epoch": 2061} {"train_loss": -12.136878967285156, "global_step": 346262, "epoch": 2061} {"train_loss": -11.902846336364746, "global_step": 346263, "epoch": 2061} {"train_loss": -11.962545394897461, "global_step": 346264, "epoch": 2061} {"train_loss": -11.997446060180664, "global_step": 346265, "epoch": 2061} {"train_loss": -11.947080612182617, "global_step": 346266, "epoch": 2061} {"train_loss": -12.043231964111328, "global_step": 346267, "epoch": 2061} {"train_loss": -12.347476959228516, "global_step": 346268, "epoch": 2061} {"train_loss": -12.186126708984375, "global_step": 346269, "epoch": 2061} {"train_loss": -11.886213302612305, "global_step": 346270, "epoch": 2061} {"train_loss": -12.208173751831055, "global_step": 346271, "epoch": 2061} {"train_loss": -12.286645889282227, "global_step": 346272, "epoch": 2061} {"train_loss": -12.00896167755127, "global_step": 346273, "epoch": 2061} {"train_loss": -12.065343856811523, "global_step": 346274, "epoch": 2061} {"train_loss": -12.251283645629883, "global_step": 346275, "epoch": 2061} {"train_loss": -12.382783889770508, "global_step": 346276, "epoch": 2061} {"train_loss": -12.32438850402832, "global_step": 346277, "epoch": 2061} {"train_loss": -12.21523666381836, "global_step": 346278, "epoch": 2061} {"train_loss": -12.191226959228516, "global_step": 346279, "epoch": 2061} {"train_loss": -12.073928833007812, "global_step": 346280, "epoch": 2061} {"train_loss": -12.111413955688477, "global_step": 346281, "epoch": 2061} {"train_loss": -12.075523376464844, "global_step": 346282, "epoch": 2061} {"train_loss": -12.17644214630127, "global_step": 346283, "epoch": 2061} {"train_loss": -12.107810020446777, "global_step": 346284, "epoch": 2061} {"train_loss": -12.340433120727539, "global_step": 346285, "epoch": 2061} {"train_loss": -12.287769317626953, "global_step": 346286, "epoch": 2061} {"train_loss": -12.222412109375, "global_step": 346287, "epoch": 2061} {"train_loss": -12.20405387878418, "global_step": 346288, "epoch": 2061} {"train_loss": -12.264947891235352, "global_step": 346289, "epoch": 2061} {"train_loss": -12.249967575073242, "global_step": 346290, "epoch": 2061} {"train_loss": -12.596105575561523, "global_step": 346291, "epoch": 2061} {"train_loss": -12.238329887390137, "global_step": 346292, "epoch": 2061} {"train_loss": -12.550566673278809, "global_step": 346293, "epoch": 2061} {"train_loss": -12.249804496765137, "global_step": 346294, "epoch": 2061} {"train_loss": -12.324853897094727, "global_step": 346295, "epoch": 2061} {"train_loss": -12.358573913574219, "global_step": 346296, "epoch": 2061} {"train_loss": -12.353342056274414, "global_step": 346297, "epoch": 2061} {"train_loss": -12.065704345703125, "global_step": 346298, "epoch": 2061} {"train_loss": -12.261011123657227, "global_step": 346299, "epoch": 2061} {"train_loss": -12.650931358337402, "global_step": 346300, "epoch": 2061} {"train_loss": -12.439103126525879, "global_step": 346301, "epoch": 2061} {"train_loss": -12.383501052856445, "global_step": 346302, "epoch": 2061} {"train_loss": -12.36473274230957, "global_step": 346303, "epoch": 2061} {"train_loss": -12.049250602722168, "global_step": 346304, "epoch": 2061} {"train_loss": -12.199531555175781, "global_step": 346305, "epoch": 2061} {"train_loss": -12.4969482421875, "global_step": 346306, "epoch": 2061} {"train_loss": -12.361316680908203, "global_step": 346307, "epoch": 2061} {"train_loss": -12.475625991821289, "global_step": 346308, "epoch": 2061} {"train_loss": -12.51019287109375, "global_step": 346309, "epoch": 2061} {"train_loss": -12.473968505859375, "global_step": 346310, "epoch": 2061} {"train_loss": -12.346863746643066, "global_step": 346311, "epoch": 2061} {"train_loss": -12.380636215209961, "global_step": 346312, "epoch": 2061} {"train_loss": -12.585944175720215, "global_step": 346313, "epoch": 2061} {"train_loss": -12.441410064697266, "global_step": 346314, "epoch": 2061} {"train_loss": -12.348760604858398, "global_step": 346315, "epoch": 2061} {"train_loss": -12.531961441040039, "global_step": 346316, "epoch": 2061} {"train_loss": -12.261419296264648, "global_step": 346317, "epoch": 2061} {"train_loss": -12.744725227355957, "global_step": 346318, "epoch": 2061} {"train_loss": -12.566366195678711, "global_step": 346319, "epoch": 2061} {"train_loss": -12.34256649017334, "global_step": 346320, "epoch": 2061} {"train_loss": -12.230622291564941, "global_step": 346321, "epoch": 2061} {"train_loss": -12.4893159866333, "global_step": 346322, "epoch": 2061} {"train_loss": -12.633132934570312, "global_step": 346323, "epoch": 2061} {"train_loss": -12.297567367553711, "global_step": 346324, "epoch": 2061} {"train_loss": -11.957382202148438, "global_step": 346325, "epoch": 2061} {"train_loss": -12.24020767211914, "global_step": 346326, "epoch": 2061} {"train_loss": -12.447275161743164, "global_step": 346327, "epoch": 2061} {"train_loss": -12.038783073425293, "global_step": 346328, "epoch": 2061} {"train_loss": -11.932254791259766, "global_step": 346329, "epoch": 2061} {"train_loss": -11.90445613861084, "global_step": 346330, "epoch": 2061} {"train_loss": -11.955018997192383, "global_step": 346331, "epoch": 2061} {"train_loss": -11.500661849975586, "global_step": 346332, "epoch": 2061} {"train_loss": -10.486041069030762, "global_step": 346333, "epoch": 2061} {"train_loss": -11.28055191040039, "global_step": 346334, "epoch": 2061} {"train_loss": -12.435998916625977, "global_step": 346335, "epoch": 2061} {"train_loss": -11.231193542480469, "global_step": 346336, "epoch": 2061} {"train_loss": -11.74207878112793, "global_step": 346337, "epoch": 2061} {"train_loss": -11.69882583618164, "global_step": 346338, "epoch": 2061} {"train_loss": -12.005444526672363, "global_step": 346339, "epoch": 2061} {"train_loss": -11.826290130615234, "global_step": 346340, "epoch": 2061} {"train_loss": -11.911542892456055, "global_step": 346341, "epoch": 2061} {"train_loss": -11.6922607421875, "global_step": 346342, "epoch": 2061} {"train_loss": -11.65846061706543, "global_step": 346343, "epoch": 2061} {"train_loss": -11.629770278930664, "global_step": 346344, "epoch": 2061} {"train_loss": -12.015650749206543, "global_step": 346345, "epoch": 2061} {"train_loss": -11.713516235351562, "global_step": 346346, "epoch": 2061} {"train_loss": -12.377750396728516, "global_step": 346347, "epoch": 2061} {"train_loss": -11.762767791748047, "global_step": 346348, "epoch": 2061} {"train_loss": -11.864453315734863, "global_step": 346349, "epoch": 2061} {"train_loss": -11.338468551635742, "global_step": 346350, "epoch": 2061} {"train_loss": -11.300943374633789, "global_step": 346351, "epoch": 2061} {"train_loss": -10.734392166137695, "global_step": 346352, "epoch": 2061} {"train_loss": -11.999795913696289, "global_step": 346353, "epoch": 2061} {"train_loss": -11.457989692687988, "global_step": 346354, "epoch": 2061} {"train_loss": -10.807326316833496, "global_step": 346355, "epoch": 2061} {"train_loss": -11.328592300415039, "global_step": 346356, "epoch": 2061} {"train_loss": -11.957296371459961, "global_step": 346357, "epoch": 2061} {"train_loss": -11.575018882751465, "global_step": 346358, "epoch": 2061} {"train_loss": -11.844581604003906, "global_step": 346359, "epoch": 2061} {"train_loss": -11.495420455932617, "global_step": 346360, "epoch": 2061} {"train_loss": -11.15849494934082, "global_step": 346361, "epoch": 2061} {"train_loss": -11.427637100219727, "global_step": 346362, "epoch": 2061} {"train_loss": -11.62908935546875, "global_step": 346363, "epoch": 2061} {"train_loss": -11.487794876098633, "global_step": 346364, "epoch": 2061} {"train_loss": -11.1915283203125, "global_step": 346365, "epoch": 2061} {"train_loss": -12.386837005615234, "global_step": 346366, "epoch": 2061} {"train_loss": -11.927194595336914, "global_step": 346367, "epoch": 2061} {"train_loss": -11.518155097961426, "global_step": 346368, "epoch": 2061} {"train_loss": -12.086090087890625, "global_step": 346369, "epoch": 2061} {"train_loss": -11.911431312561035, "global_step": 346370, "epoch": 2061} {"train_loss": -11.151226997375488, "global_step": 346371, "epoch": 2061} {"train_loss": -12.30048942565918, "global_step": 346372, "epoch": 2061} {"train_loss": -11.749044418334961, "global_step": 346373, "epoch": 2061} {"train_loss": -11.511560440063477, "global_step": 346374, "epoch": 2061} {"train_loss": -11.946060180664062, "global_step": 346375, "epoch": 2061} {"train_loss": -12.341800689697266, "global_step": 346376, "epoch": 2061} {"train_loss": -11.67999267578125, "global_step": 346377, "epoch": 2061} {"train_loss": -11.809852600097656, "global_step": 346378, "epoch": 2061} {"train_loss": -9.85931396484375, "global_step": 346379, "epoch": 2061} {"train_loss": -12.16572380065918, "global_step": 346380, "epoch": 2061} {"train_loss": -10.687541961669922, "global_step": 346381, "epoch": 2061} {"train_loss": -11.34518051147461, "global_step": 346382, "epoch": 2061} {"train_loss": -10.455302238464355, "global_step": 346383, "epoch": 2061} {"train_loss": -11.192182540893555, "global_step": 346384, "epoch": 2061} {"train_loss": -11.419775009155273, "global_step": 346385, "epoch": 2061} {"train_loss": -11.144744873046875, "global_step": 346386, "epoch": 2061} {"train_loss": -11.418524742126465, "global_step": 346387, "epoch": 2061} {"train_loss": -10.234678268432617, "global_step": 346388, "epoch": 2061} {"train_loss": -11.163458824157715, "global_step": 346389, "epoch": 2061} {"train_loss": -10.984758377075195, "global_step": 346390, "epoch": 2061} {"train_loss": -10.692180633544922, "global_step": 346391, "epoch": 2061} {"train_loss": -11.38731575012207, "global_step": 346392, "epoch": 2061} {"train_loss": -10.879878997802734, "global_step": 346393, "epoch": 2061} {"train_loss": -10.791399002075195, "global_step": 346394, "epoch": 2061} {"train_loss": -11.366471290588379, "global_step": 346395, "epoch": 2061} {"train_loss": -9.982921600341797, "global_step": 346396, "epoch": 2061} {"train_loss": -11.156633377075195, "global_step": 346397, "epoch": 2061} {"train_loss": -9.828624725341797, "global_step": 346398, "epoch": 2061} {"train_loss": -9.987089157104492, "global_step": 346399, "epoch": 2061} {"train_loss": -10.952418327331543, "global_step": 346400, "epoch": 2061} {"train_loss": -10.064583778381348, "global_step": 346401, "epoch": 2061} {"train_loss": -11.367395401000977, "global_step": 346402, "epoch": 2061} {"train_loss": -10.484997749328613, "global_step": 346403, "epoch": 2061} {"train_loss": -11.224321365356445, "global_step": 346404, "epoch": 2061} {"train_loss": -10.220882415771484, "global_step": 346405, "epoch": 2061} {"train_loss": -11.841516494750977, "global_step": 346406, "epoch": 2061} {"train_loss": -10.459297180175781, "global_step": 346407, "epoch": 2061} {"train_loss": -11.498931884765625, "global_step": 346408, "epoch": 2061} {"train_loss": -10.764853477478027, "global_step": 346409, "epoch": 2061} {"train_loss": -10.939647674560547, "global_step": 346410, "epoch": 2061} {"train_loss": -11.361648559570312, "global_step": 346411, "epoch": 2061} {"train_loss": -11.119734764099121, "global_step": 346412, "epoch": 2061} {"train_loss": -11.283628463745117, "global_step": 346413, "epoch": 2061} {"train_loss": -11.915277481079102, "global_step": 346414, "epoch": 2061} {"train_loss": -11.782334458260308, "global_step": 346415, "epoch": 2061, "val_loss": 291805.96875} {"train_loss": -11.729735374450684, "global_step": 346416, "epoch": 2062} {"train_loss": -11.457747459411621, "global_step": 346417, "epoch": 2062} {"train_loss": -11.403284072875977, "global_step": 346418, "epoch": 2062} {"train_loss": -11.903186798095703, "global_step": 346419, "epoch": 2062} {"train_loss": -11.422420501708984, "global_step": 346420, "epoch": 2062} {"train_loss": -11.970065116882324, "global_step": 346421, "epoch": 2062} {"train_loss": -11.830924987792969, "global_step": 346422, "epoch": 2062} {"train_loss": -11.802056312561035, "global_step": 346423, "epoch": 2062} {"train_loss": -11.698492050170898, "global_step": 346424, "epoch": 2062} {"train_loss": -11.478296279907227, "global_step": 346425, "epoch": 2062} {"train_loss": -12.017560005187988, "global_step": 346426, "epoch": 2062} {"train_loss": -12.083775520324707, "global_step": 346427, "epoch": 2062} {"train_loss": -11.973112106323242, "global_step": 346428, "epoch": 2062} {"train_loss": -12.340433120727539, "global_step": 346429, "epoch": 2062} {"train_loss": -11.941362380981445, "global_step": 346430, "epoch": 2062} {"train_loss": -12.188074111938477, "global_step": 346431, "epoch": 2062} {"train_loss": -11.903532028198242, "global_step": 346432, "epoch": 2062} {"train_loss": -12.137028694152832, "global_step": 346433, "epoch": 2062} {"train_loss": -11.952787399291992, "global_step": 346434, "epoch": 2062} {"train_loss": -12.141254425048828, "global_step": 346435, "epoch": 2062} {"train_loss": -12.165800094604492, "global_step": 346436, "epoch": 2062} {"train_loss": -12.122693061828613, "global_step": 346437, "epoch": 2062} {"train_loss": -12.249122619628906, "global_step": 346438, "epoch": 2062} {"train_loss": -12.143978118896484, "global_step": 346439, "epoch": 2062} {"train_loss": -12.211681365966797, "global_step": 346440, "epoch": 2062} {"train_loss": -12.137563705444336, "global_step": 346441, "epoch": 2062} {"train_loss": -12.052083969116211, "global_step": 346442, "epoch": 2062} {"train_loss": -12.401591300964355, "global_step": 346443, "epoch": 2062} {"train_loss": -12.254617691040039, "global_step": 346444, "epoch": 2062} {"train_loss": -12.361146926879883, "global_step": 346445, "epoch": 2062} {"train_loss": -12.268178939819336, "global_step": 346446, "epoch": 2062} {"train_loss": -12.309432983398438, "global_step": 346447, "epoch": 2062} {"train_loss": -12.299396514892578, "global_step": 346448, "epoch": 2062} {"train_loss": -12.278411865234375, "global_step": 346449, "epoch": 2062} {"train_loss": -12.080734252929688, "global_step": 346450, "epoch": 2062} {"train_loss": -12.22485065460205, "global_step": 346451, "epoch": 2062} {"train_loss": -12.200765609741211, "global_step": 346452, "epoch": 2062} {"train_loss": -12.190373420715332, "global_step": 346453, "epoch": 2062} {"train_loss": -12.387063980102539, "global_step": 346454, "epoch": 2062} {"train_loss": -12.089658737182617, "global_step": 346455, "epoch": 2062} {"train_loss": -12.198662757873535, "global_step": 346456, "epoch": 2062} {"train_loss": -12.149030685424805, "global_step": 346457, "epoch": 2062} {"train_loss": -11.945270538330078, "global_step": 346458, "epoch": 2062} {"train_loss": -12.349721908569336, "global_step": 346459, "epoch": 2062} {"train_loss": -11.88543701171875, "global_step": 346460, "epoch": 2062} {"train_loss": -11.933395385742188, "global_step": 346461, "epoch": 2062} {"train_loss": -12.26968002319336, "global_step": 346462, "epoch": 2062} {"train_loss": -11.96834945678711, "global_step": 346463, "epoch": 2062} {"train_loss": -12.159835815429688, "global_step": 346464, "epoch": 2062} {"train_loss": -12.343652725219727, "global_step": 346465, "epoch": 2062} {"train_loss": -12.24831771850586, "global_step": 346466, "epoch": 2062} {"train_loss": -12.187661170959473, "global_step": 346467, "epoch": 2062} {"train_loss": -12.29340648651123, "global_step": 346468, "epoch": 2062} {"train_loss": -11.995182037353516, "global_step": 346469, "epoch": 2062} {"train_loss": -12.071301460266113, "global_step": 346470, "epoch": 2062} {"train_loss": -12.36052131652832, "global_step": 346471, "epoch": 2062} {"train_loss": -12.241989135742188, "global_step": 346472, "epoch": 2062} {"train_loss": -11.79253101348877, "global_step": 346473, "epoch": 2062} {"train_loss": -12.416318893432617, "global_step": 346474, "epoch": 2062} {"train_loss": -12.129104614257812, "global_step": 346475, "epoch": 2062} {"train_loss": -12.322195053100586, "global_step": 346476, "epoch": 2062} {"train_loss": -11.970298767089844, "global_step": 346477, "epoch": 2062} {"train_loss": -12.420296669006348, "global_step": 346478, "epoch": 2062} {"train_loss": -12.003874778747559, "global_step": 346479, "epoch": 2062} {"train_loss": -12.408234596252441, "global_step": 346480, "epoch": 2062} {"train_loss": -12.169204711914062, "global_step": 346481, "epoch": 2062} {"train_loss": -12.50247573852539, "global_step": 346482, "epoch": 2062} {"train_loss": -11.875106811523438, "global_step": 346483, "epoch": 2062} {"train_loss": -12.04909610748291, "global_step": 346484, "epoch": 2062} {"train_loss": -11.093914031982422, "global_step": 346485, "epoch": 2062} {"train_loss": -10.766850471496582, "global_step": 346486, "epoch": 2062} {"train_loss": -10.865764617919922, "global_step": 346487, "epoch": 2062} {"train_loss": -10.046066284179688, "global_step": 346488, "epoch": 2062} {"train_loss": -10.55621337890625, "global_step": 346489, "epoch": 2062} {"train_loss": -10.321247100830078, "global_step": 346490, "epoch": 2062} {"train_loss": -10.093929290771484, "global_step": 346491, "epoch": 2062} {"train_loss": -10.92543888092041, "global_step": 346492, "epoch": 2062} {"train_loss": -10.614537239074707, "global_step": 346493, "epoch": 2062} {"train_loss": -9.630925178527832, "global_step": 346494, "epoch": 2062} {"train_loss": -11.374746322631836, "global_step": 346495, "epoch": 2062} {"train_loss": -10.518762588500977, "global_step": 346496, "epoch": 2062} {"train_loss": -10.422658920288086, "global_step": 346497, "epoch": 2062} {"train_loss": -10.624353408813477, "global_step": 346498, "epoch": 2062} {"train_loss": -9.97370719909668, "global_step": 346499, "epoch": 2062} {"train_loss": -11.366117477416992, "global_step": 346500, "epoch": 2062} {"train_loss": -10.78493595123291, "global_step": 346501, "epoch": 2062} {"train_loss": -9.250329971313477, "global_step": 346502, "epoch": 2062} {"train_loss": -11.340160369873047, "global_step": 346503, "epoch": 2062} {"train_loss": -9.71045207977295, "global_step": 346504, "epoch": 2062} {"train_loss": -9.725471496582031, "global_step": 346505, "epoch": 2062} {"train_loss": -9.3757905960083, "global_step": 346506, "epoch": 2062} {"train_loss": -9.930641174316406, "global_step": 346507, "epoch": 2062} {"train_loss": -11.107436180114746, "global_step": 346508, "epoch": 2062} {"train_loss": -9.513916969299316, "global_step": 346509, "epoch": 2062} {"train_loss": -9.794961929321289, "global_step": 346510, "epoch": 2062} {"train_loss": -11.165998458862305, "global_step": 346511, "epoch": 2062} {"train_loss": -10.71523666381836, "global_step": 346512, "epoch": 2062} {"train_loss": -10.540313720703125, "global_step": 346513, "epoch": 2062} {"train_loss": -11.025908470153809, "global_step": 346514, "epoch": 2062} {"train_loss": -10.626810073852539, "global_step": 346515, "epoch": 2062} {"train_loss": -11.637886047363281, "global_step": 346516, "epoch": 2062} {"train_loss": -10.957761764526367, "global_step": 346517, "epoch": 2062} {"train_loss": -11.706777572631836, "global_step": 346518, "epoch": 2062} {"train_loss": -11.295120239257812, "global_step": 346519, "epoch": 2062} {"train_loss": -11.659520149230957, "global_step": 346520, "epoch": 2062} {"train_loss": -11.514137268066406, "global_step": 346521, "epoch": 2062} {"train_loss": -11.543231964111328, "global_step": 346522, "epoch": 2062} {"train_loss": -11.378682136535645, "global_step": 346523, "epoch": 2062} {"train_loss": -11.739812850952148, "global_step": 346524, "epoch": 2062} {"train_loss": -11.163915634155273, "global_step": 346525, "epoch": 2062} {"train_loss": -11.98305892944336, "global_step": 346526, "epoch": 2062} {"train_loss": -11.855716705322266, "global_step": 346527, "epoch": 2062} {"train_loss": -11.759103775024414, "global_step": 346528, "epoch": 2062} {"train_loss": -11.791460037231445, "global_step": 346529, "epoch": 2062} {"train_loss": -11.736791610717773, "global_step": 346530, "epoch": 2062} {"train_loss": -11.609807968139648, "global_step": 346531, "epoch": 2062} {"train_loss": -11.865863800048828, "global_step": 346532, "epoch": 2062} {"train_loss": -11.441289901733398, "global_step": 346533, "epoch": 2062} {"train_loss": -12.055821418762207, "global_step": 346534, "epoch": 2062} {"train_loss": -11.805992126464844, "global_step": 346535, "epoch": 2062} {"train_loss": -12.03054428100586, "global_step": 346536, "epoch": 2062} {"train_loss": -11.75466537475586, "global_step": 346537, "epoch": 2062} {"train_loss": -12.06319808959961, "global_step": 346538, "epoch": 2062} {"train_loss": -11.974620819091797, "global_step": 346539, "epoch": 2062} {"train_loss": -12.22265911102295, "global_step": 346540, "epoch": 2062} {"train_loss": -11.981715202331543, "global_step": 346541, "epoch": 2062} {"train_loss": -12.02194881439209, "global_step": 346542, "epoch": 2062} {"train_loss": -12.084759712219238, "global_step": 346543, "epoch": 2062} {"train_loss": -11.753643035888672, "global_step": 346544, "epoch": 2062} {"train_loss": -11.563934326171875, "global_step": 346545, "epoch": 2062} {"train_loss": -11.443655014038086, "global_step": 346546, "epoch": 2062} {"train_loss": -12.242813110351562, "global_step": 346547, "epoch": 2062} {"train_loss": -11.52305793762207, "global_step": 346548, "epoch": 2062} {"train_loss": -12.009819030761719, "global_step": 346549, "epoch": 2062} {"train_loss": -11.881742477416992, "global_step": 346550, "epoch": 2062} {"train_loss": -12.04957389831543, "global_step": 346551, "epoch": 2062} {"train_loss": -12.25169563293457, "global_step": 346552, "epoch": 2062} {"train_loss": -11.954452514648438, "global_step": 346553, "epoch": 2062} {"train_loss": -11.894200325012207, "global_step": 346554, "epoch": 2062} {"train_loss": -11.921624183654785, "global_step": 346555, "epoch": 2062} {"train_loss": -11.879013061523438, "global_step": 346556, "epoch": 2062} {"train_loss": -12.154789924621582, "global_step": 346557, "epoch": 2062} {"train_loss": -11.840425491333008, "global_step": 346558, "epoch": 2062} {"train_loss": -11.895761489868164, "global_step": 346559, "epoch": 2062} {"train_loss": -11.88188362121582, "global_step": 346560, "epoch": 2062} {"train_loss": -11.980925559997559, "global_step": 346561, "epoch": 2062} {"train_loss": -11.841875076293945, "global_step": 346562, "epoch": 2062} {"train_loss": -12.254317283630371, "global_step": 346563, "epoch": 2062} {"train_loss": -12.203371047973633, "global_step": 346564, "epoch": 2062} {"train_loss": -12.009581565856934, "global_step": 346565, "epoch": 2062} {"train_loss": -12.268285751342773, "global_step": 346566, "epoch": 2062} {"train_loss": -12.280077934265137, "global_step": 346567, "epoch": 2062} {"train_loss": -12.334105491638184, "global_step": 346568, "epoch": 2062} {"train_loss": -12.208534240722656, "global_step": 346569, "epoch": 2062} {"train_loss": -12.087299346923828, "global_step": 346570, "epoch": 2062} {"train_loss": -12.275790214538574, "global_step": 346571, "epoch": 2062} {"train_loss": -12.01225757598877, "global_step": 346572, "epoch": 2062} {"train_loss": -12.060001373291016, "global_step": 346573, "epoch": 2062} {"train_loss": -12.022863388061523, "global_step": 346574, "epoch": 2062} {"train_loss": -12.342714309692383, "global_step": 346575, "epoch": 2062} {"train_loss": -12.063608169555664, "global_step": 346576, "epoch": 2062} {"train_loss": -12.244462966918945, "global_step": 346577, "epoch": 2062} {"train_loss": -12.057369232177734, "global_step": 346578, "epoch": 2062} {"train_loss": -12.055713653564453, "global_step": 346579, "epoch": 2062} {"train_loss": -12.303086280822754, "global_step": 346580, "epoch": 2062} {"train_loss": -11.994800567626953, "global_step": 346581, "epoch": 2062} {"train_loss": -12.568042755126953, "global_step": 346582, "epoch": 2062} {"train_loss": -11.718211849530539, "global_step": 346583, "epoch": 2062, "val_loss": 288152.375} {"train_loss": -12.175975799560547, "global_step": 346584, "epoch": 2063} {"train_loss": -12.340322494506836, "global_step": 346585, "epoch": 2063} {"train_loss": -12.34952163696289, "global_step": 346586, "epoch": 2063} {"train_loss": -12.391560554504395, "global_step": 346587, "epoch": 2063} {"train_loss": -12.36945629119873, "global_step": 346588, "epoch": 2063} {"train_loss": -12.303305625915527, "global_step": 346589, "epoch": 2063} {"train_loss": -12.573783874511719, "global_step": 346590, "epoch": 2063} {"train_loss": -12.04725170135498, "global_step": 346591, "epoch": 2063} {"train_loss": -12.346447944641113, "global_step": 346592, "epoch": 2063} {"train_loss": -12.365525245666504, "global_step": 346593, "epoch": 2063} {"train_loss": -12.209696769714355, "global_step": 346594, "epoch": 2063} {"train_loss": -12.432841300964355, "global_step": 346595, "epoch": 2063} {"train_loss": -12.287551879882812, "global_step": 346596, "epoch": 2063} {"train_loss": -12.304966926574707, "global_step": 346597, "epoch": 2063} {"train_loss": -12.345869064331055, "global_step": 346598, "epoch": 2063} {"train_loss": -12.308721542358398, "global_step": 346599, "epoch": 2063} {"train_loss": -12.306370735168457, "global_step": 346600, "epoch": 2063} {"train_loss": -12.576702117919922, "global_step": 346601, "epoch": 2063} {"train_loss": -12.222528457641602, "global_step": 346602, "epoch": 2063} {"train_loss": -12.284685134887695, "global_step": 346603, "epoch": 2063} {"train_loss": -12.574466705322266, "global_step": 346604, "epoch": 2063} {"train_loss": -12.351655960083008, "global_step": 346605, "epoch": 2063} {"train_loss": -12.478952407836914, "global_step": 346606, "epoch": 2063} {"train_loss": -12.317102432250977, "global_step": 346607, "epoch": 2063} {"train_loss": -12.51270580291748, "global_step": 346608, "epoch": 2063} {"train_loss": -12.36838150024414, "global_step": 346609, "epoch": 2063} {"train_loss": -12.420768737792969, "global_step": 346610, "epoch": 2063} {"train_loss": -12.583282470703125, "global_step": 346611, "epoch": 2063} {"train_loss": -12.57004165649414, "global_step": 346612, "epoch": 2063} {"train_loss": -12.580211639404297, "global_step": 346613, "epoch": 2063} {"train_loss": -12.64931869506836, "global_step": 346614, "epoch": 2063} {"train_loss": -12.48133659362793, "global_step": 346615, "epoch": 2063} {"train_loss": -12.460935592651367, "global_step": 346616, "epoch": 2063} {"train_loss": -12.538488388061523, "global_step": 346617, "epoch": 2063} {"train_loss": -12.70629596710205, "global_step": 346618, "epoch": 2063} {"train_loss": -12.572977066040039, "global_step": 346619, "epoch": 2063} {"train_loss": -12.769046783447266, "global_step": 346620, "epoch": 2063} {"train_loss": -12.529094696044922, "global_step": 346621, "epoch": 2063} {"train_loss": -12.585166931152344, "global_step": 346622, "epoch": 2063} {"train_loss": -12.664321899414062, "global_step": 346623, "epoch": 2063} {"train_loss": -12.597911834716797, "global_step": 346624, "epoch": 2063} {"train_loss": -12.462507247924805, "global_step": 346625, "epoch": 2063} {"train_loss": -12.842764854431152, "global_step": 346626, "epoch": 2063} {"train_loss": -12.232111930847168, "global_step": 346627, "epoch": 2063} {"train_loss": -12.228376388549805, "global_step": 346628, "epoch": 2063} {"train_loss": -12.263961791992188, "global_step": 346629, "epoch": 2063} {"train_loss": -12.463783264160156, "global_step": 346630, "epoch": 2063} {"train_loss": -12.38677978515625, "global_step": 346631, "epoch": 2063} {"train_loss": -12.424186706542969, "global_step": 346632, "epoch": 2063} {"train_loss": -11.900581359863281, "global_step": 346633, "epoch": 2063} {"train_loss": -12.670635223388672, "global_step": 346634, "epoch": 2063} {"train_loss": -12.234342575073242, "global_step": 346635, "epoch": 2063} {"train_loss": -12.018206596374512, "global_step": 346636, "epoch": 2063} {"train_loss": -11.89986801147461, "global_step": 346637, "epoch": 2063} {"train_loss": -12.466899871826172, "global_step": 346638, "epoch": 2063} {"train_loss": -12.45718765258789, "global_step": 346639, "epoch": 2063} {"train_loss": -12.432548522949219, "global_step": 346640, "epoch": 2063} {"train_loss": -12.382800102233887, "global_step": 346641, "epoch": 2063} {"train_loss": -10.929994583129883, "global_step": 346642, "epoch": 2063} {"train_loss": -10.61977481842041, "global_step": 346643, "epoch": 2063} {"train_loss": -11.32020378112793, "global_step": 346644, "epoch": 2063} {"train_loss": -11.603431701660156, "global_step": 346645, "epoch": 2063} {"train_loss": -12.100339889526367, "global_step": 346646, "epoch": 2063} {"train_loss": -11.70132827758789, "global_step": 346647, "epoch": 2063} {"train_loss": -10.491033554077148, "global_step": 346648, "epoch": 2063} {"train_loss": -11.903796195983887, "global_step": 346649, "epoch": 2063} {"train_loss": -10.118943214416504, "global_step": 346650, "epoch": 2063} {"train_loss": -10.843469619750977, "global_step": 346651, "epoch": 2063} {"train_loss": -11.629667282104492, "global_step": 346652, "epoch": 2063} {"train_loss": -10.691539764404297, "global_step": 346653, "epoch": 2063} {"train_loss": -11.49551010131836, "global_step": 346654, "epoch": 2063} {"train_loss": -8.944269180297852, "global_step": 346655, "epoch": 2063} {"train_loss": -11.245087623596191, "global_step": 346656, "epoch": 2063} {"train_loss": -10.364738464355469, "global_step": 346657, "epoch": 2063} {"train_loss": -10.59450912475586, "global_step": 346658, "epoch": 2063} {"train_loss": -11.978154182434082, "global_step": 346659, "epoch": 2063} {"train_loss": -9.603007316589355, "global_step": 346660, "epoch": 2063} {"train_loss": -11.531795501708984, "global_step": 346661, "epoch": 2063} {"train_loss": -9.997162818908691, "global_step": 346662, "epoch": 2063} {"train_loss": -9.645509719848633, "global_step": 346663, "epoch": 2063} {"train_loss": -9.8369779586792, "global_step": 346664, "epoch": 2063} {"train_loss": -11.483158111572266, "global_step": 346665, "epoch": 2063} {"train_loss": -9.426149368286133, "global_step": 346666, "epoch": 2063} {"train_loss": -10.455941200256348, "global_step": 346667, "epoch": 2063} {"train_loss": -11.034696578979492, "global_step": 346668, "epoch": 2063} {"train_loss": -10.725055694580078, "global_step": 346669, "epoch": 2063} {"train_loss": -11.62563419342041, "global_step": 346670, "epoch": 2063} {"train_loss": -10.617107391357422, "global_step": 346671, "epoch": 2063} {"train_loss": -11.138885498046875, "global_step": 346672, "epoch": 2063} {"train_loss": -10.918018341064453, "global_step": 346673, "epoch": 2063} {"train_loss": -11.749773025512695, "global_step": 346674, "epoch": 2063} {"train_loss": -11.209675788879395, "global_step": 346675, "epoch": 2063} {"train_loss": -11.839104652404785, "global_step": 346676, "epoch": 2063} {"train_loss": -11.283294677734375, "global_step": 346677, "epoch": 2063} {"train_loss": -11.43497085571289, "global_step": 346678, "epoch": 2063} {"train_loss": -11.746675491333008, "global_step": 346679, "epoch": 2063} {"train_loss": -11.229575157165527, "global_step": 346680, "epoch": 2063} {"train_loss": -11.528564453125, "global_step": 346681, "epoch": 2063} {"train_loss": -11.590154647827148, "global_step": 346682, "epoch": 2063} {"train_loss": -11.540765762329102, "global_step": 346683, "epoch": 2063} {"train_loss": -11.363214492797852, "global_step": 346684, "epoch": 2063} {"train_loss": -11.716010093688965, "global_step": 346685, "epoch": 2063} {"train_loss": -10.900678634643555, "global_step": 346686, "epoch": 2063} {"train_loss": -11.587959289550781, "global_step": 346687, "epoch": 2063} {"train_loss": -11.413223266601562, "global_step": 346688, "epoch": 2063} {"train_loss": -11.461015701293945, "global_step": 346689, "epoch": 2063} {"train_loss": -11.97364616394043, "global_step": 346690, "epoch": 2063} {"train_loss": -10.859223365783691, "global_step": 346691, "epoch": 2063} {"train_loss": -11.928515434265137, "global_step": 346692, "epoch": 2063} {"train_loss": -11.82959270477295, "global_step": 346693, "epoch": 2063} {"train_loss": -11.420090675354004, "global_step": 346694, "epoch": 2063} {"train_loss": -12.122688293457031, "global_step": 346695, "epoch": 2063} {"train_loss": -11.55919361114502, "global_step": 346696, "epoch": 2063} {"train_loss": -11.538134574890137, "global_step": 346697, "epoch": 2063} {"train_loss": -11.744531631469727, "global_step": 346698, "epoch": 2063} {"train_loss": -11.080985069274902, "global_step": 346699, "epoch": 2063} {"train_loss": -12.212623596191406, "global_step": 346700, "epoch": 2063} {"train_loss": -11.69382095336914, "global_step": 346701, "epoch": 2063} {"train_loss": -11.581212997436523, "global_step": 346702, "epoch": 2063} {"train_loss": -12.017660140991211, "global_step": 346703, "epoch": 2063} {"train_loss": -11.993654251098633, "global_step": 346704, "epoch": 2063} {"train_loss": -11.554817199707031, "global_step": 346705, "epoch": 2063} {"train_loss": -12.097325325012207, "global_step": 346706, "epoch": 2063} {"train_loss": -11.936614036560059, "global_step": 346707, "epoch": 2063} {"train_loss": -12.091897964477539, "global_step": 346708, "epoch": 2063} {"train_loss": -12.034111022949219, "global_step": 346709, "epoch": 2063} {"train_loss": -11.814157485961914, "global_step": 346710, "epoch": 2063} {"train_loss": -11.81274700164795, "global_step": 346711, "epoch": 2063} {"train_loss": -12.007654190063477, "global_step": 346712, "epoch": 2063} {"train_loss": -12.005685806274414, "global_step": 346713, "epoch": 2063} {"train_loss": -12.092972755432129, "global_step": 346714, "epoch": 2063} {"train_loss": -11.673444747924805, "global_step": 346715, "epoch": 2063} {"train_loss": -12.340784072875977, "global_step": 346716, "epoch": 2063} {"train_loss": -11.875749588012695, "global_step": 346717, "epoch": 2063} {"train_loss": -11.73627758026123, "global_step": 346718, "epoch": 2063} {"train_loss": -12.302868843078613, "global_step": 346719, "epoch": 2063} {"train_loss": -11.703357696533203, "global_step": 346720, "epoch": 2063} {"train_loss": -11.895036697387695, "global_step": 346721, "epoch": 2063} {"train_loss": -11.335613250732422, "global_step": 346722, "epoch": 2063} {"train_loss": -11.981842041015625, "global_step": 346723, "epoch": 2063} {"train_loss": -11.479703903198242, "global_step": 346724, "epoch": 2063} {"train_loss": -11.553105354309082, "global_step": 346725, "epoch": 2063} {"train_loss": -12.113231658935547, "global_step": 346726, "epoch": 2063} {"train_loss": -11.60670280456543, "global_step": 346727, "epoch": 2063} {"train_loss": -11.862902641296387, "global_step": 346728, "epoch": 2063} {"train_loss": -11.279756546020508, "global_step": 346729, "epoch": 2063} {"train_loss": -11.758849143981934, "global_step": 346730, "epoch": 2063} {"train_loss": -11.922309875488281, "global_step": 346731, "epoch": 2063} {"train_loss": -11.720315933227539, "global_step": 346732, "epoch": 2063} {"train_loss": -12.179781913757324, "global_step": 346733, "epoch": 2063} {"train_loss": -11.705589294433594, "global_step": 346734, "epoch": 2063} {"train_loss": -11.795562744140625, "global_step": 346735, "epoch": 2063} {"train_loss": -11.580575942993164, "global_step": 346736, "epoch": 2063} {"train_loss": -11.580934524536133, "global_step": 346737, "epoch": 2063} {"train_loss": -10.815864562988281, "global_step": 346738, "epoch": 2063} {"train_loss": -11.292503356933594, "global_step": 346739, "epoch": 2063} {"train_loss": -11.094276428222656, "global_step": 346740, "epoch": 2063} {"train_loss": -11.539836883544922, "global_step": 346741, "epoch": 2063} {"train_loss": -11.4118070602417, "global_step": 346742, "epoch": 2063} {"train_loss": -9.841197967529297, "global_step": 346743, "epoch": 2063} {"train_loss": -10.327604293823242, "global_step": 346744, "epoch": 2063} {"train_loss": -10.990730285644531, "global_step": 346745, "epoch": 2063} {"train_loss": -10.498056411743164, "global_step": 346746, "epoch": 2063} {"train_loss": -10.539819717407227, "global_step": 346747, "epoch": 2063} {"train_loss": -11.324331283569336, "global_step": 346748, "epoch": 2063} {"train_loss": -10.056923866271973, "global_step": 346749, "epoch": 2063} {"train_loss": -9.833772659301758, "global_step": 346750, "epoch": 2063} {"train_loss": -11.700941290174212, "global_step": 346751, "epoch": 2063, "val_loss": 288775.46875} {"train_loss": -10.988818168640137, "global_step": 346752, "epoch": 2064} {"train_loss": -9.918376922607422, "global_step": 346753, "epoch": 2064} {"train_loss": -10.525203704833984, "global_step": 346754, "epoch": 2064} {"train_loss": -11.695667266845703, "global_step": 346755, "epoch": 2064} {"train_loss": -10.583369255065918, "global_step": 346756, "epoch": 2064} {"train_loss": -11.082191467285156, "global_step": 346757, "epoch": 2064} {"train_loss": -11.054021835327148, "global_step": 346758, "epoch": 2064} {"train_loss": -10.598005294799805, "global_step": 346759, "epoch": 2064} {"train_loss": -10.824897766113281, "global_step": 346760, "epoch": 2064} {"train_loss": -11.312421798706055, "global_step": 346761, "epoch": 2064} {"train_loss": -10.161258697509766, "global_step": 346762, "epoch": 2064} {"train_loss": -10.485273361206055, "global_step": 346763, "epoch": 2064} {"train_loss": -10.378005027770996, "global_step": 346764, "epoch": 2064} {"train_loss": -10.721835136413574, "global_step": 346765, "epoch": 2064} {"train_loss": -11.166790008544922, "global_step": 346766, "epoch": 2064} {"train_loss": -11.301146507263184, "global_step": 346767, "epoch": 2064} {"train_loss": -11.43264389038086, "global_step": 346768, "epoch": 2064} {"train_loss": -11.290101051330566, "global_step": 346769, "epoch": 2064} {"train_loss": -11.397575378417969, "global_step": 346770, "epoch": 2064} {"train_loss": -11.386720657348633, "global_step": 346771, "epoch": 2064} {"train_loss": -11.330436706542969, "global_step": 346772, "epoch": 2064} {"train_loss": -11.734563827514648, "global_step": 346773, "epoch": 2064} {"train_loss": -11.418667793273926, "global_step": 346774, "epoch": 2064} {"train_loss": -11.4744873046875, "global_step": 346775, "epoch": 2064} {"train_loss": -11.400506973266602, "global_step": 346776, "epoch": 2064} {"train_loss": -11.955265045166016, "global_step": 346777, "epoch": 2064} {"train_loss": -11.764006614685059, "global_step": 346778, "epoch": 2064} {"train_loss": -12.07968521118164, "global_step": 346779, "epoch": 2064} {"train_loss": -11.728212356567383, "global_step": 346780, "epoch": 2064} {"train_loss": -12.07103157043457, "global_step": 346781, "epoch": 2064} {"train_loss": -11.929778099060059, "global_step": 346782, "epoch": 2064} {"train_loss": -11.911491394042969, "global_step": 346783, "epoch": 2064} {"train_loss": -11.686210632324219, "global_step": 346784, "epoch": 2064} {"train_loss": -11.914244651794434, "global_step": 346785, "epoch": 2064} {"train_loss": -11.952322006225586, "global_step": 346786, "epoch": 2064} {"train_loss": -12.088790893554688, "global_step": 346787, "epoch": 2064} {"train_loss": -11.858685493469238, "global_step": 346788, "epoch": 2064} {"train_loss": -11.991899490356445, "global_step": 346789, "epoch": 2064} {"train_loss": -12.044149398803711, "global_step": 346790, "epoch": 2064} {"train_loss": -11.628185272216797, "global_step": 346791, "epoch": 2064} {"train_loss": -12.131486892700195, "global_step": 346792, "epoch": 2064} {"train_loss": -12.050496101379395, "global_step": 346793, "epoch": 2064} {"train_loss": -11.96523666381836, "global_step": 346794, "epoch": 2064} {"train_loss": -11.963911056518555, "global_step": 346795, "epoch": 2064} {"train_loss": -12.404571533203125, "global_step": 346796, "epoch": 2064} {"train_loss": -12.07648754119873, "global_step": 346797, "epoch": 2064} {"train_loss": -12.254127502441406, "global_step": 346798, "epoch": 2064} {"train_loss": -12.103830337524414, "global_step": 346799, "epoch": 2064} {"train_loss": -12.001338005065918, "global_step": 346800, "epoch": 2064} {"train_loss": -11.88905143737793, "global_step": 346801, "epoch": 2064} {"train_loss": -12.342350959777832, "global_step": 346802, "epoch": 2064} {"train_loss": -12.229167938232422, "global_step": 346803, "epoch": 2064} {"train_loss": -12.189587593078613, "global_step": 346804, "epoch": 2064} {"train_loss": -12.288908004760742, "global_step": 346805, "epoch": 2064} {"train_loss": -11.929140090942383, "global_step": 346806, "epoch": 2064} {"train_loss": -11.818620681762695, "global_step": 346807, "epoch": 2064} {"train_loss": -12.270035743713379, "global_step": 346808, "epoch": 2064} {"train_loss": -12.044177055358887, "global_step": 346809, "epoch": 2064} {"train_loss": -12.281914710998535, "global_step": 346810, "epoch": 2064} {"train_loss": -12.157671928405762, "global_step": 346811, "epoch": 2064} {"train_loss": -12.099997520446777, "global_step": 346812, "epoch": 2064} {"train_loss": -12.297358512878418, "global_step": 346813, "epoch": 2064} {"train_loss": -11.970863342285156, "global_step": 346814, "epoch": 2064} {"train_loss": -12.362546920776367, "global_step": 346815, "epoch": 2064} {"train_loss": -12.232919692993164, "global_step": 346816, "epoch": 2064} {"train_loss": -12.128474235534668, "global_step": 346817, "epoch": 2064} {"train_loss": -12.203414916992188, "global_step": 346818, "epoch": 2064} {"train_loss": -12.131540298461914, "global_step": 346819, "epoch": 2064} {"train_loss": -12.627296447753906, "global_step": 346820, "epoch": 2064} {"train_loss": -12.256884574890137, "global_step": 346821, "epoch": 2064} {"train_loss": -12.183014869689941, "global_step": 346822, "epoch": 2064} {"train_loss": -11.952866554260254, "global_step": 346823, "epoch": 2064} {"train_loss": -12.243644714355469, "global_step": 346824, "epoch": 2064} {"train_loss": -12.296119689941406, "global_step": 346825, "epoch": 2064} {"train_loss": -12.361557960510254, "global_step": 346826, "epoch": 2064} {"train_loss": -12.309420585632324, "global_step": 346827, "epoch": 2064} {"train_loss": -12.345006942749023, "global_step": 346828, "epoch": 2064} {"train_loss": -12.60153865814209, "global_step": 346829, "epoch": 2064} {"train_loss": -12.46784782409668, "global_step": 346830, "epoch": 2064} {"train_loss": -12.386441230773926, "global_step": 346831, "epoch": 2064} {"train_loss": -12.345575332641602, "global_step": 346832, "epoch": 2064} {"train_loss": -12.352774620056152, "global_step": 346833, "epoch": 2064} {"train_loss": -12.176254272460938, "global_step": 346834, "epoch": 2064} {"train_loss": -12.240090370178223, "global_step": 346835, "epoch": 2064} {"train_loss": -12.417265892028809, "global_step": 346836, "epoch": 2064} {"train_loss": -12.23892593383789, "global_step": 346837, "epoch": 2064} {"train_loss": -12.230293273925781, "global_step": 346838, "epoch": 2064} {"train_loss": -12.373013496398926, "global_step": 346839, "epoch": 2064} {"train_loss": -12.450977325439453, "global_step": 346840, "epoch": 2064} {"train_loss": -12.299489974975586, "global_step": 346841, "epoch": 2064} {"train_loss": -12.542420387268066, "global_step": 346842, "epoch": 2064} {"train_loss": -12.247044563293457, "global_step": 346843, "epoch": 2064} {"train_loss": -12.699227333068848, "global_step": 346844, "epoch": 2064} {"train_loss": -12.77800178527832, "global_step": 346845, "epoch": 2064} {"train_loss": -12.582038879394531, "global_step": 346846, "epoch": 2064} {"train_loss": -12.68518352508545, "global_step": 346847, "epoch": 2064} {"train_loss": -12.57866096496582, "global_step": 346848, "epoch": 2064} {"train_loss": -12.646551132202148, "global_step": 346849, "epoch": 2064} {"train_loss": -12.389766693115234, "global_step": 346850, "epoch": 2064} {"train_loss": -12.518349647521973, "global_step": 346851, "epoch": 2064} {"train_loss": -12.583263397216797, "global_step": 346852, "epoch": 2064} {"train_loss": -12.513132095336914, "global_step": 346853, "epoch": 2064} {"train_loss": -12.411474227905273, "global_step": 346854, "epoch": 2064} {"train_loss": -12.626911163330078, "global_step": 346855, "epoch": 2064} {"train_loss": -12.633892059326172, "global_step": 346856, "epoch": 2064} {"train_loss": -12.689306259155273, "global_step": 346857, "epoch": 2064} {"train_loss": -12.500164031982422, "global_step": 346858, "epoch": 2064} {"train_loss": -12.575508117675781, "global_step": 346859, "epoch": 2064} {"train_loss": -12.714912414550781, "global_step": 346860, "epoch": 2064} {"train_loss": -12.590852737426758, "global_step": 346861, "epoch": 2064} {"train_loss": -12.453384399414062, "global_step": 346862, "epoch": 2064} {"train_loss": -12.768791198730469, "global_step": 346863, "epoch": 2064} {"train_loss": -12.354655265808105, "global_step": 346864, "epoch": 2064} {"train_loss": -12.527955055236816, "global_step": 346865, "epoch": 2064} {"train_loss": -12.683828353881836, "global_step": 346866, "epoch": 2064} {"train_loss": -12.686744689941406, "global_step": 346867, "epoch": 2064} {"train_loss": -12.618175506591797, "global_step": 346868, "epoch": 2064} {"train_loss": -12.742918968200684, "global_step": 346869, "epoch": 2064} {"train_loss": -12.879024505615234, "global_step": 346870, "epoch": 2064} {"train_loss": -12.547260284423828, "global_step": 346871, "epoch": 2064} {"train_loss": -12.514347076416016, "global_step": 346872, "epoch": 2064} {"train_loss": -11.996822357177734, "global_step": 346873, "epoch": 2064} {"train_loss": -12.380906105041504, "global_step": 346874, "epoch": 2064} {"train_loss": -12.578706741333008, "global_step": 346875, "epoch": 2064} {"train_loss": -12.172858238220215, "global_step": 346876, "epoch": 2064} {"train_loss": -12.456615447998047, "global_step": 346877, "epoch": 2064} {"train_loss": -12.631145477294922, "global_step": 346878, "epoch": 2064} {"train_loss": -11.94774055480957, "global_step": 346879, "epoch": 2064} {"train_loss": -11.447808265686035, "global_step": 346880, "epoch": 2064} {"train_loss": -11.611364364624023, "global_step": 346881, "epoch": 2064} {"train_loss": -12.098627090454102, "global_step": 346882, "epoch": 2064} {"train_loss": -11.404983520507812, "global_step": 346883, "epoch": 2064} {"train_loss": -11.284685134887695, "global_step": 346884, "epoch": 2064} {"train_loss": -12.083298683166504, "global_step": 346885, "epoch": 2064} {"train_loss": -11.151012420654297, "global_step": 346886, "epoch": 2064} {"train_loss": -11.805510520935059, "global_step": 346887, "epoch": 2064} {"train_loss": -11.284550666809082, "global_step": 346888, "epoch": 2064} {"train_loss": -12.477668762207031, "global_step": 346889, "epoch": 2064} {"train_loss": -10.790410041809082, "global_step": 346890, "epoch": 2064} {"train_loss": -11.63437271118164, "global_step": 346891, "epoch": 2064} {"train_loss": -10.933982849121094, "global_step": 346892, "epoch": 2064} {"train_loss": -12.038713455200195, "global_step": 346893, "epoch": 2064} {"train_loss": -11.185306549072266, "global_step": 346894, "epoch": 2064} {"train_loss": -11.845528602600098, "global_step": 346895, "epoch": 2064} {"train_loss": -10.804966926574707, "global_step": 346896, "epoch": 2064} {"train_loss": -9.903536796569824, "global_step": 346897, "epoch": 2064} {"train_loss": -11.113225936889648, "global_step": 346898, "epoch": 2064} {"train_loss": -11.346090316772461, "global_step": 346899, "epoch": 2064} {"train_loss": -11.245359420776367, "global_step": 346900, "epoch": 2064} {"train_loss": -11.523918151855469, "global_step": 346901, "epoch": 2064} {"train_loss": -10.178342819213867, "global_step": 346902, "epoch": 2064} {"train_loss": -11.540693283081055, "global_step": 346903, "epoch": 2064} {"train_loss": -9.994486808776855, "global_step": 346904, "epoch": 2064} {"train_loss": -8.857934951782227, "global_step": 346905, "epoch": 2064} {"train_loss": -10.33390998840332, "global_step": 346906, "epoch": 2064} {"train_loss": -11.144601821899414, "global_step": 346907, "epoch": 2064} {"train_loss": -10.60240364074707, "global_step": 346908, "epoch": 2064} {"train_loss": -11.448659896850586, "global_step": 346909, "epoch": 2064} {"train_loss": -9.210321426391602, "global_step": 346910, "epoch": 2064} {"train_loss": -9.346783638000488, "global_step": 346911, "epoch": 2064} {"train_loss": -10.193415641784668, "global_step": 346912, "epoch": 2064} {"train_loss": -9.59573745727539, "global_step": 346913, "epoch": 2064} {"train_loss": -9.464117050170898, "global_step": 346914, "epoch": 2064} {"train_loss": -8.83559799194336, "global_step": 346915, "epoch": 2064} {"train_loss": -9.67440414428711, "global_step": 346916, "epoch": 2064} {"train_loss": -9.219268798828125, "global_step": 346917, "epoch": 2064} {"train_loss": -9.715652465820312, "global_step": 346918, "epoch": 2064} {"train_loss": -11.742363333702087, "global_step": 346919, "epoch": 2064, "val_loss": 286114.6875} {"train_loss": -9.038089752197266, "global_step": 346920, "epoch": 2065} {"train_loss": -10.545177459716797, "global_step": 346921, "epoch": 2065} {"train_loss": -9.940553665161133, "global_step": 346922, "epoch": 2065} {"train_loss": -10.12118911743164, "global_step": 346923, "epoch": 2065} {"train_loss": -10.541068077087402, "global_step": 346924, "epoch": 2065} {"train_loss": -11.01227855682373, "global_step": 346925, "epoch": 2065} {"train_loss": -10.441543579101562, "global_step": 346926, "epoch": 2065} {"train_loss": -11.099742889404297, "global_step": 346927, "epoch": 2065} {"train_loss": -10.476091384887695, "global_step": 346928, "epoch": 2065} {"train_loss": -10.533398628234863, "global_step": 346929, "epoch": 2065} {"train_loss": -10.95556926727295, "global_step": 346930, "epoch": 2065} {"train_loss": -10.784897804260254, "global_step": 346931, "epoch": 2065} {"train_loss": -11.402978897094727, "global_step": 346932, "epoch": 2065} {"train_loss": -11.23865795135498, "global_step": 346933, "epoch": 2065} {"train_loss": -12.029922485351562, "global_step": 346934, "epoch": 2065} {"train_loss": -11.232983589172363, "global_step": 346935, "epoch": 2065} {"train_loss": -11.620811462402344, "global_step": 346936, "epoch": 2065} {"train_loss": -11.390491485595703, "global_step": 346937, "epoch": 2065} {"train_loss": -11.682259559631348, "global_step": 346938, "epoch": 2065} {"train_loss": -11.014312744140625, "global_step": 346939, "epoch": 2065} {"train_loss": -11.618510246276855, "global_step": 346940, "epoch": 2065} {"train_loss": -10.830345153808594, "global_step": 346941, "epoch": 2065} {"train_loss": -11.47547721862793, "global_step": 346942, "epoch": 2065} {"train_loss": -11.190566062927246, "global_step": 346943, "epoch": 2065} {"train_loss": -11.26490592956543, "global_step": 346944, "epoch": 2065} {"train_loss": -11.282611846923828, "global_step": 346945, "epoch": 2065} {"train_loss": -11.191106796264648, "global_step": 346946, "epoch": 2065} {"train_loss": -11.712550163269043, "global_step": 346947, "epoch": 2065} {"train_loss": -11.46232795715332, "global_step": 346948, "epoch": 2065} {"train_loss": -11.675329208374023, "global_step": 346949, "epoch": 2065} {"train_loss": -11.277297973632812, "global_step": 346950, "epoch": 2065} {"train_loss": -11.8126220703125, "global_step": 346951, "epoch": 2065} {"train_loss": -11.867626190185547, "global_step": 346952, "epoch": 2065} {"train_loss": -11.96684455871582, "global_step": 346953, "epoch": 2065} {"train_loss": -12.049076080322266, "global_step": 346954, "epoch": 2065} {"train_loss": -11.929839134216309, "global_step": 346955, "epoch": 2065} {"train_loss": -12.148298263549805, "global_step": 346956, "epoch": 2065} {"train_loss": -11.903745651245117, "global_step": 346957, "epoch": 2065} {"train_loss": -12.194519996643066, "global_step": 346958, "epoch": 2065} {"train_loss": -11.851221084594727, "global_step": 346959, "epoch": 2065} {"train_loss": -11.835379600524902, "global_step": 346960, "epoch": 2065} {"train_loss": -11.913806915283203, "global_step": 346961, "epoch": 2065} {"train_loss": -12.007347106933594, "global_step": 346962, "epoch": 2065} {"train_loss": -11.840665817260742, "global_step": 346963, "epoch": 2065} {"train_loss": -11.990737915039062, "global_step": 346964, "epoch": 2065} {"train_loss": -11.833163261413574, "global_step": 346965, "epoch": 2065} {"train_loss": -12.295943260192871, "global_step": 346966, "epoch": 2065} {"train_loss": -11.981088638305664, "global_step": 346967, "epoch": 2065} {"train_loss": -12.108724594116211, "global_step": 346968, "epoch": 2065} {"train_loss": -12.21163558959961, "global_step": 346969, "epoch": 2065} {"train_loss": -12.284355163574219, "global_step": 346970, "epoch": 2065} {"train_loss": -12.005370140075684, "global_step": 346971, "epoch": 2065} {"train_loss": -12.16677188873291, "global_step": 346972, "epoch": 2065} {"train_loss": -12.138401985168457, "global_step": 346973, "epoch": 2065} {"train_loss": -12.209173202514648, "global_step": 346974, "epoch": 2065} {"train_loss": -12.28038501739502, "global_step": 346975, "epoch": 2065} {"train_loss": -12.203667640686035, "global_step": 346976, "epoch": 2065} {"train_loss": -12.014092445373535, "global_step": 346977, "epoch": 2065} {"train_loss": -12.196921348571777, "global_step": 346978, "epoch": 2065} {"train_loss": -11.9750337600708, "global_step": 346979, "epoch": 2065} {"train_loss": -12.324697494506836, "global_step": 346980, "epoch": 2065} {"train_loss": -11.701610565185547, "global_step": 346981, "epoch": 2065} {"train_loss": -12.162055969238281, "global_step": 346982, "epoch": 2065} {"train_loss": -11.903932571411133, "global_step": 346983, "epoch": 2065} {"train_loss": -12.405781745910645, "global_step": 346984, "epoch": 2065} {"train_loss": -12.066428184509277, "global_step": 346985, "epoch": 2065} {"train_loss": -12.374213218688965, "global_step": 346986, "epoch": 2065} {"train_loss": -12.176429748535156, "global_step": 346987, "epoch": 2065} {"train_loss": -12.129919052124023, "global_step": 346988, "epoch": 2065} {"train_loss": -12.203332901000977, "global_step": 346989, "epoch": 2065} {"train_loss": -12.206467628479004, "global_step": 346990, "epoch": 2065} {"train_loss": -12.389567375183105, "global_step": 346991, "epoch": 2065} {"train_loss": -11.973005294799805, "global_step": 346992, "epoch": 2065} {"train_loss": -12.445148468017578, "global_step": 346993, "epoch": 2065} {"train_loss": -12.268806457519531, "global_step": 346994, "epoch": 2065} {"train_loss": -12.498550415039062, "global_step": 346995, "epoch": 2065} {"train_loss": -12.270572662353516, "global_step": 346996, "epoch": 2065} {"train_loss": -12.56225872039795, "global_step": 346997, "epoch": 2065} {"train_loss": -12.46212387084961, "global_step": 346998, "epoch": 2065} {"train_loss": -12.642496109008789, "global_step": 346999, "epoch": 2065} {"train_loss": -12.405813217163086, "global_step": 347000, "epoch": 2065} {"train_loss": -12.528167724609375, "global_step": 347001, "epoch": 2065} {"train_loss": -12.509028434753418, "global_step": 347002, "epoch": 2065} {"train_loss": -12.274574279785156, "global_step": 347003, "epoch": 2065} {"train_loss": -12.527854919433594, "global_step": 347004, "epoch": 2065} {"train_loss": -12.231216430664062, "global_step": 347005, "epoch": 2065} {"train_loss": -12.25208568572998, "global_step": 347006, "epoch": 2065} {"train_loss": -12.414093971252441, "global_step": 347007, "epoch": 2065} {"train_loss": -12.597932815551758, "global_step": 347008, "epoch": 2065} {"train_loss": -12.375417709350586, "global_step": 347009, "epoch": 2065} {"train_loss": -12.272563934326172, "global_step": 347010, "epoch": 2065} {"train_loss": -12.394705772399902, "global_step": 347011, "epoch": 2065} {"train_loss": -12.347911834716797, "global_step": 347012, "epoch": 2065} {"train_loss": -12.358100891113281, "global_step": 347013, "epoch": 2065} {"train_loss": -12.402973175048828, "global_step": 347014, "epoch": 2065} {"train_loss": -12.451510429382324, "global_step": 347015, "epoch": 2065} {"train_loss": -12.613814353942871, "global_step": 347016, "epoch": 2065} {"train_loss": -12.348491668701172, "global_step": 347017, "epoch": 2065} {"train_loss": -12.514892578125, "global_step": 347018, "epoch": 2065} {"train_loss": -12.530016899108887, "global_step": 347019, "epoch": 2065} {"train_loss": -12.676569938659668, "global_step": 347020, "epoch": 2065} {"train_loss": -12.414449691772461, "global_step": 347021, "epoch": 2065} {"train_loss": -12.42253303527832, "global_step": 347022, "epoch": 2065} {"train_loss": -12.408609390258789, "global_step": 347023, "epoch": 2065} {"train_loss": -12.25209903717041, "global_step": 347024, "epoch": 2065} {"train_loss": -12.059163093566895, "global_step": 347025, "epoch": 2065} {"train_loss": -12.363882064819336, "global_step": 347026, "epoch": 2065} {"train_loss": -12.42893123626709, "global_step": 347027, "epoch": 2065} {"train_loss": -12.384069442749023, "global_step": 347028, "epoch": 2065} {"train_loss": -12.271984100341797, "global_step": 347029, "epoch": 2065} {"train_loss": -12.458986282348633, "global_step": 347030, "epoch": 2065} {"train_loss": -12.289752960205078, "global_step": 347031, "epoch": 2065} {"train_loss": -12.455954551696777, "global_step": 347032, "epoch": 2065} {"train_loss": -12.402295112609863, "global_step": 347033, "epoch": 2065} {"train_loss": -12.330629348754883, "global_step": 347034, "epoch": 2065} {"train_loss": -12.434678077697754, "global_step": 347035, "epoch": 2065} {"train_loss": -12.74026870727539, "global_step": 347036, "epoch": 2065} {"train_loss": -12.396892547607422, "global_step": 347037, "epoch": 2065} {"train_loss": -12.527141571044922, "global_step": 347038, "epoch": 2065} {"train_loss": -12.601030349731445, "global_step": 347039, "epoch": 2065} {"train_loss": -12.406444549560547, "global_step": 347040, "epoch": 2065} {"train_loss": -12.359966278076172, "global_step": 347041, "epoch": 2065} {"train_loss": -12.712379455566406, "global_step": 347042, "epoch": 2065} {"train_loss": -12.499101638793945, "global_step": 347043, "epoch": 2065} {"train_loss": -12.705484390258789, "global_step": 347044, "epoch": 2065} {"train_loss": -12.541606903076172, "global_step": 347045, "epoch": 2065} {"train_loss": -12.114846229553223, "global_step": 347046, "epoch": 2065} {"train_loss": -11.995401382446289, "global_step": 347047, "epoch": 2065} {"train_loss": -12.47612190246582, "global_step": 347048, "epoch": 2065} {"train_loss": -12.297200202941895, "global_step": 347049, "epoch": 2065} {"train_loss": -11.515957832336426, "global_step": 347050, "epoch": 2065} {"train_loss": -12.011466979980469, "global_step": 347051, "epoch": 2065} {"train_loss": -12.572860717773438, "global_step": 347052, "epoch": 2065} {"train_loss": -11.843440055847168, "global_step": 347053, "epoch": 2065} {"train_loss": -10.933507919311523, "global_step": 347054, "epoch": 2065} {"train_loss": -11.929481506347656, "global_step": 347055, "epoch": 2065} {"train_loss": -12.585905075073242, "global_step": 347056, "epoch": 2065} {"train_loss": -11.164011001586914, "global_step": 347057, "epoch": 2065} {"train_loss": -11.083541870117188, "global_step": 347058, "epoch": 2065} {"train_loss": -12.379304885864258, "global_step": 347059, "epoch": 2065} {"train_loss": -11.215734481811523, "global_step": 347060, "epoch": 2065} {"train_loss": -9.68392562866211, "global_step": 347061, "epoch": 2065} {"train_loss": -12.133291244506836, "global_step": 347062, "epoch": 2065} {"train_loss": -11.091962814331055, "global_step": 347063, "epoch": 2065} {"train_loss": -10.89212703704834, "global_step": 347064, "epoch": 2065} {"train_loss": -10.757049560546875, "global_step": 347065, "epoch": 2065} {"train_loss": -10.019929885864258, "global_step": 347066, "epoch": 2065} {"train_loss": -8.330673217773438, "global_step": 347067, "epoch": 2065} {"train_loss": -8.0433349609375, "global_step": 347068, "epoch": 2065} {"train_loss": -8.553552627563477, "global_step": 347069, "epoch": 2065} {"train_loss": -8.408288955688477, "global_step": 347070, "epoch": 2065} {"train_loss": -9.037181854248047, "global_step": 347071, "epoch": 2065} {"train_loss": -9.059669494628906, "global_step": 347072, "epoch": 2065} {"train_loss": -8.447261810302734, "global_step": 347073, "epoch": 2065} {"train_loss": -8.316598892211914, "global_step": 347074, "epoch": 2065} {"train_loss": -9.033729553222656, "global_step": 347075, "epoch": 2065} {"train_loss": -8.117276191711426, "global_step": 347076, "epoch": 2065} {"train_loss": -8.360957145690918, "global_step": 347077, "epoch": 2065} {"train_loss": -9.18896484375, "global_step": 347078, "epoch": 2065} {"train_loss": -9.254520416259766, "global_step": 347079, "epoch": 2065} {"train_loss": -9.961753845214844, "global_step": 347080, "epoch": 2065} {"train_loss": -9.010104179382324, "global_step": 347081, "epoch": 2065} {"train_loss": -10.577747344970703, "global_step": 347082, "epoch": 2065} {"train_loss": -10.39763069152832, "global_step": 347083, "epoch": 2065} {"train_loss": -9.198833465576172, "global_step": 347084, "epoch": 2065} {"train_loss": -9.922496795654297, "global_step": 347085, "epoch": 2065} {"train_loss": -10.331175804138184, "global_step": 347086, "epoch": 2065} {"train_loss": -11.565769428298587, "global_step": 347087, "epoch": 2065, "val_loss": 286905.03125, "train_action_mse_error": 0.5628947615623474} {"train_loss": -10.950990676879883, "global_step": 347088, "epoch": 2066} {"train_loss": -10.780754089355469, "global_step": 347089, "epoch": 2066} {"train_loss": -10.840885162353516, "global_step": 347090, "epoch": 2066} {"train_loss": -10.682687759399414, "global_step": 347091, "epoch": 2066} {"train_loss": -10.532974243164062, "global_step": 347092, "epoch": 2066} {"train_loss": -11.23086929321289, "global_step": 347093, "epoch": 2066} {"train_loss": -10.306709289550781, "global_step": 347094, "epoch": 2066} {"train_loss": -10.535757064819336, "global_step": 347095, "epoch": 2066} {"train_loss": -11.292776107788086, "global_step": 347096, "epoch": 2066} {"train_loss": -10.876399993896484, "global_step": 347097, "epoch": 2066} {"train_loss": -11.123023986816406, "global_step": 347098, "epoch": 2066} {"train_loss": -10.839693069458008, "global_step": 347099, "epoch": 2066} {"train_loss": -10.972789764404297, "global_step": 347100, "epoch": 2066} {"train_loss": -11.339104652404785, "global_step": 347101, "epoch": 2066} {"train_loss": -11.004945755004883, "global_step": 347102, "epoch": 2066} {"train_loss": -11.274055480957031, "global_step": 347103, "epoch": 2066} {"train_loss": -11.377189636230469, "global_step": 347104, "epoch": 2066} {"train_loss": -11.332927703857422, "global_step": 347105, "epoch": 2066} {"train_loss": -11.023880958557129, "global_step": 347106, "epoch": 2066} {"train_loss": -11.18983268737793, "global_step": 347107, "epoch": 2066} {"train_loss": -11.586483001708984, "global_step": 347108, "epoch": 2066} {"train_loss": -11.030510902404785, "global_step": 347109, "epoch": 2066} {"train_loss": -12.066422462463379, "global_step": 347110, "epoch": 2066} {"train_loss": -11.219269752502441, "global_step": 347111, "epoch": 2066} {"train_loss": -11.807836532592773, "global_step": 347112, "epoch": 2066} {"train_loss": -11.375553131103516, "global_step": 347113, "epoch": 2066} {"train_loss": -11.931367874145508, "global_step": 347114, "epoch": 2066} {"train_loss": -11.724044799804688, "global_step": 347115, "epoch": 2066} {"train_loss": -11.814035415649414, "global_step": 347116, "epoch": 2066} {"train_loss": -11.827743530273438, "global_step": 347117, "epoch": 2066} {"train_loss": -11.635176658630371, "global_step": 347118, "epoch": 2066} {"train_loss": -12.000984191894531, "global_step": 347119, "epoch": 2066} {"train_loss": -11.991144180297852, "global_step": 347120, "epoch": 2066} {"train_loss": -11.690608978271484, "global_step": 347121, "epoch": 2066} {"train_loss": -11.777275085449219, "global_step": 347122, "epoch": 2066} {"train_loss": -11.552775382995605, "global_step": 347123, "epoch": 2066} {"train_loss": -11.713775634765625, "global_step": 347124, "epoch": 2066} {"train_loss": -12.098262786865234, "global_step": 347125, "epoch": 2066} {"train_loss": -11.474407196044922, "global_step": 347126, "epoch": 2066} {"train_loss": -11.87648868560791, "global_step": 347127, "epoch": 2066} {"train_loss": -11.973822593688965, "global_step": 347128, "epoch": 2066} {"train_loss": -11.931982040405273, "global_step": 347129, "epoch": 2066} {"train_loss": -12.0519437789917, "global_step": 347130, "epoch": 2066} {"train_loss": -11.932787895202637, "global_step": 347131, "epoch": 2066} {"train_loss": -12.294708251953125, "global_step": 347132, "epoch": 2066} {"train_loss": -11.87364387512207, "global_step": 347133, "epoch": 2066} {"train_loss": -12.173005104064941, "global_step": 347134, "epoch": 2066} {"train_loss": -12.195685386657715, "global_step": 347135, "epoch": 2066} {"train_loss": -11.866373062133789, "global_step": 347136, "epoch": 2066} {"train_loss": -12.35584831237793, "global_step": 347137, "epoch": 2066} {"train_loss": -12.11781120300293, "global_step": 347138, "epoch": 2066} {"train_loss": -12.009157180786133, "global_step": 347139, "epoch": 2066} {"train_loss": -12.037453651428223, "global_step": 347140, "epoch": 2066} {"train_loss": -12.174943923950195, "global_step": 347141, "epoch": 2066} {"train_loss": -12.095959663391113, "global_step": 347142, "epoch": 2066} {"train_loss": -12.22331428527832, "global_step": 347143, "epoch": 2066} {"train_loss": -11.926790237426758, "global_step": 347144, "epoch": 2066} {"train_loss": -12.091837882995605, "global_step": 347145, "epoch": 2066} {"train_loss": -12.242076873779297, "global_step": 347146, "epoch": 2066} {"train_loss": -11.872909545898438, "global_step": 347147, "epoch": 2066} {"train_loss": -12.184871673583984, "global_step": 347148, "epoch": 2066} {"train_loss": -11.991981506347656, "global_step": 347149, "epoch": 2066} {"train_loss": -12.037644386291504, "global_step": 347150, "epoch": 2066} {"train_loss": -11.816279411315918, "global_step": 347151, "epoch": 2066} {"train_loss": -11.952733039855957, "global_step": 347152, "epoch": 2066} {"train_loss": -12.204133033752441, "global_step": 347153, "epoch": 2066} {"train_loss": -12.241065979003906, "global_step": 347154, "epoch": 2066} {"train_loss": -12.244119644165039, "global_step": 347155, "epoch": 2066} {"train_loss": -12.286190032958984, "global_step": 347156, "epoch": 2066} {"train_loss": -12.149591445922852, "global_step": 347157, "epoch": 2066} {"train_loss": -11.991530418395996, "global_step": 347158, "epoch": 2066} {"train_loss": -12.08400821685791, "global_step": 347159, "epoch": 2066} {"train_loss": -12.211700439453125, "global_step": 347160, "epoch": 2066} {"train_loss": -11.797628402709961, "global_step": 347161, "epoch": 2066} {"train_loss": -12.291987419128418, "global_step": 347162, "epoch": 2066} {"train_loss": -12.137235641479492, "global_step": 347163, "epoch": 2066} {"train_loss": -12.315144538879395, "global_step": 347164, "epoch": 2066} {"train_loss": -12.183294296264648, "global_step": 347165, "epoch": 2066} {"train_loss": -12.25133991241455, "global_step": 347166, "epoch": 2066} {"train_loss": -12.137551307678223, "global_step": 347167, "epoch": 2066} {"train_loss": -12.290215492248535, "global_step": 347168, "epoch": 2066} {"train_loss": -12.070813179016113, "global_step": 347169, "epoch": 2066} {"train_loss": -12.352169036865234, "global_step": 347170, "epoch": 2066} {"train_loss": -12.171003341674805, "global_step": 347171, "epoch": 2066} {"train_loss": -12.376909255981445, "global_step": 347172, "epoch": 2066} {"train_loss": -12.397679328918457, "global_step": 347173, "epoch": 2066} {"train_loss": -12.140239715576172, "global_step": 347174, "epoch": 2066} {"train_loss": -12.34190559387207, "global_step": 347175, "epoch": 2066} {"train_loss": -12.389371871948242, "global_step": 347176, "epoch": 2066} {"train_loss": -12.103014945983887, "global_step": 347177, "epoch": 2066} {"train_loss": -12.514328002929688, "global_step": 347178, "epoch": 2066} {"train_loss": -12.354129791259766, "global_step": 347179, "epoch": 2066} {"train_loss": -12.51174545288086, "global_step": 347180, "epoch": 2066} {"train_loss": -12.292698860168457, "global_step": 347181, "epoch": 2066} {"train_loss": -12.3980073928833, "global_step": 347182, "epoch": 2066} {"train_loss": -12.435792922973633, "global_step": 347183, "epoch": 2066} {"train_loss": -12.393623352050781, "global_step": 347184, "epoch": 2066} {"train_loss": -12.553235054016113, "global_step": 347185, "epoch": 2066} {"train_loss": -12.524284362792969, "global_step": 347186, "epoch": 2066} {"train_loss": -12.499841690063477, "global_step": 347187, "epoch": 2066} {"train_loss": -12.388265609741211, "global_step": 347188, "epoch": 2066} {"train_loss": -12.53051471710205, "global_step": 347189, "epoch": 2066} {"train_loss": -12.259364128112793, "global_step": 347190, "epoch": 2066} {"train_loss": -12.351970672607422, "global_step": 347191, "epoch": 2066} {"train_loss": -12.547616958618164, "global_step": 347192, "epoch": 2066} {"train_loss": -12.521305084228516, "global_step": 347193, "epoch": 2066} {"train_loss": -12.726062774658203, "global_step": 347194, "epoch": 2066} {"train_loss": -12.568024635314941, "global_step": 347195, "epoch": 2066} {"train_loss": -12.76811408996582, "global_step": 347196, "epoch": 2066} {"train_loss": -12.621919631958008, "global_step": 347197, "epoch": 2066} {"train_loss": -12.575470924377441, "global_step": 347198, "epoch": 2066} {"train_loss": -12.433900833129883, "global_step": 347199, "epoch": 2066} {"train_loss": -12.156376838684082, "global_step": 347200, "epoch": 2066} {"train_loss": -12.565062522888184, "global_step": 347201, "epoch": 2066} {"train_loss": -12.21579360961914, "global_step": 347202, "epoch": 2066} {"train_loss": -11.838781356811523, "global_step": 347203, "epoch": 2066} {"train_loss": -12.279996871948242, "global_step": 347204, "epoch": 2066} {"train_loss": -12.35901927947998, "global_step": 347205, "epoch": 2066} {"train_loss": -12.547765731811523, "global_step": 347206, "epoch": 2066} {"train_loss": -11.11289119720459, "global_step": 347207, "epoch": 2066} {"train_loss": -11.382368087768555, "global_step": 347208, "epoch": 2066} {"train_loss": -12.408729553222656, "global_step": 347209, "epoch": 2066} {"train_loss": -11.05171012878418, "global_step": 347210, "epoch": 2066} {"train_loss": -11.910730361938477, "global_step": 347211, "epoch": 2066} {"train_loss": -11.365565299987793, "global_step": 347212, "epoch": 2066} {"train_loss": -10.81920337677002, "global_step": 347213, "epoch": 2066} {"train_loss": -10.49604606628418, "global_step": 347214, "epoch": 2066} {"train_loss": -11.7075834274292, "global_step": 347215, "epoch": 2066} {"train_loss": -9.345477104187012, "global_step": 347216, "epoch": 2066} {"train_loss": -10.56588363647461, "global_step": 347217, "epoch": 2066} {"train_loss": -9.708821296691895, "global_step": 347218, "epoch": 2066} {"train_loss": -9.011614799499512, "global_step": 347219, "epoch": 2066} {"train_loss": -8.660139083862305, "global_step": 347220, "epoch": 2066} {"train_loss": -10.588502883911133, "global_step": 347221, "epoch": 2066} {"train_loss": -9.050712585449219, "global_step": 347222, "epoch": 2066} {"train_loss": -9.784208297729492, "global_step": 347223, "epoch": 2066} {"train_loss": -9.309906959533691, "global_step": 347224, "epoch": 2066} {"train_loss": -9.02131462097168, "global_step": 347225, "epoch": 2066} {"train_loss": -9.076269149780273, "global_step": 347226, "epoch": 2066} {"train_loss": -8.997410774230957, "global_step": 347227, "epoch": 2066} {"train_loss": -10.044599533081055, "global_step": 347228, "epoch": 2066} {"train_loss": -8.739981651306152, "global_step": 347229, "epoch": 2066} {"train_loss": -9.433584213256836, "global_step": 347230, "epoch": 2066} {"train_loss": -9.664052963256836, "global_step": 347231, "epoch": 2066} {"train_loss": -10.015071868896484, "global_step": 347232, "epoch": 2066} {"train_loss": -9.402896881103516, "global_step": 347233, "epoch": 2066} {"train_loss": -9.305828094482422, "global_step": 347234, "epoch": 2066} {"train_loss": -10.211651802062988, "global_step": 347235, "epoch": 2066} {"train_loss": -9.660730361938477, "global_step": 347236, "epoch": 2066} {"train_loss": -8.437932968139648, "global_step": 347237, "epoch": 2066} {"train_loss": -11.092241287231445, "global_step": 347238, "epoch": 2066} {"train_loss": -9.56121826171875, "global_step": 347239, "epoch": 2066} {"train_loss": -10.015783309936523, "global_step": 347240, "epoch": 2066} {"train_loss": -11.115034103393555, "global_step": 347241, "epoch": 2066} {"train_loss": -10.303323745727539, "global_step": 347242, "epoch": 2066} {"train_loss": -10.604713439941406, "global_step": 347243, "epoch": 2066} {"train_loss": -10.82242202758789, "global_step": 347244, "epoch": 2066} {"train_loss": -10.35661506652832, "global_step": 347245, "epoch": 2066} {"train_loss": -10.11264419555664, "global_step": 347246, "epoch": 2066} {"train_loss": -11.25977897644043, "global_step": 347247, "epoch": 2066} {"train_loss": -10.562822341918945, "global_step": 347248, "epoch": 2066} {"train_loss": -10.457393646240234, "global_step": 347249, "epoch": 2066} {"train_loss": -10.582569122314453, "global_step": 347250, "epoch": 2066} {"train_loss": -11.583480834960938, "global_step": 347251, "epoch": 2066} {"train_loss": -10.440832138061523, "global_step": 347252, "epoch": 2066} {"train_loss": -10.625680923461914, "global_step": 347253, "epoch": 2066} {"train_loss": -11.65510368347168, "global_step": 347254, "epoch": 2066} {"train_loss": -11.447595953941345, "global_step": 347255, "epoch": 2066, "val_loss": 285342.03125} {"train_loss": -11.32083511352539, "global_step": 347256, "epoch": 2067} {"train_loss": -11.814388275146484, "global_step": 347257, "epoch": 2067} {"train_loss": -11.481029510498047, "global_step": 347258, "epoch": 2067} {"train_loss": -11.567461013793945, "global_step": 347259, "epoch": 2067} {"train_loss": -11.426572799682617, "global_step": 347260, "epoch": 2067} {"train_loss": -11.839198112487793, "global_step": 347261, "epoch": 2067} {"train_loss": -11.569955825805664, "global_step": 347262, "epoch": 2067} {"train_loss": -11.632794380187988, "global_step": 347263, "epoch": 2067} {"train_loss": -11.40244197845459, "global_step": 347264, "epoch": 2067} {"train_loss": -11.486431121826172, "global_step": 347265, "epoch": 2067} {"train_loss": -12.12739372253418, "global_step": 347266, "epoch": 2067} {"train_loss": -11.529415130615234, "global_step": 347267, "epoch": 2067} {"train_loss": -11.688481330871582, "global_step": 347268, "epoch": 2067} {"train_loss": -11.775964736938477, "global_step": 347269, "epoch": 2067} {"train_loss": -11.647525787353516, "global_step": 347270, "epoch": 2067} {"train_loss": -11.839923858642578, "global_step": 347271, "epoch": 2067} {"train_loss": -11.980035781860352, "global_step": 347272, "epoch": 2067} {"train_loss": -11.753597259521484, "global_step": 347273, "epoch": 2067} {"train_loss": -11.918489456176758, "global_step": 347274, "epoch": 2067} {"train_loss": -11.830364227294922, "global_step": 347275, "epoch": 2067} {"train_loss": -12.003145217895508, "global_step": 347276, "epoch": 2067} {"train_loss": -11.991304397583008, "global_step": 347277, "epoch": 2067} {"train_loss": -12.029082298278809, "global_step": 347278, "epoch": 2067} {"train_loss": -11.889394760131836, "global_step": 347279, "epoch": 2067} {"train_loss": -11.946699142456055, "global_step": 347280, "epoch": 2067} {"train_loss": -12.162080764770508, "global_step": 347281, "epoch": 2067} {"train_loss": -12.14323616027832, "global_step": 347282, "epoch": 2067} {"train_loss": -11.98215103149414, "global_step": 347283, "epoch": 2067} {"train_loss": -12.167129516601562, "global_step": 347284, "epoch": 2067} {"train_loss": -12.17796516418457, "global_step": 347285, "epoch": 2067} {"train_loss": -12.295045852661133, "global_step": 347286, "epoch": 2067} {"train_loss": -11.978610038757324, "global_step": 347287, "epoch": 2067} {"train_loss": -12.071782112121582, "global_step": 347288, "epoch": 2067} {"train_loss": -12.353157043457031, "global_step": 347289, "epoch": 2067} {"train_loss": -12.015524864196777, "global_step": 347290, "epoch": 2067} {"train_loss": -12.312150955200195, "global_step": 347291, "epoch": 2067} {"train_loss": -12.131410598754883, "global_step": 347292, "epoch": 2067} {"train_loss": -12.244192123413086, "global_step": 347293, "epoch": 2067} {"train_loss": -12.177765846252441, "global_step": 347294, "epoch": 2067} {"train_loss": -12.206987380981445, "global_step": 347295, "epoch": 2067} {"train_loss": -12.229111671447754, "global_step": 347296, "epoch": 2067} {"train_loss": -12.26608657836914, "global_step": 347297, "epoch": 2067} {"train_loss": -12.593737602233887, "global_step": 347298, "epoch": 2067} {"train_loss": -12.195747375488281, "global_step": 347299, "epoch": 2067} {"train_loss": -12.44633674621582, "global_step": 347300, "epoch": 2067} {"train_loss": -12.219879150390625, "global_step": 347301, "epoch": 2067} {"train_loss": -12.301010131835938, "global_step": 347302, "epoch": 2067} {"train_loss": -12.291194915771484, "global_step": 347303, "epoch": 2067} {"train_loss": -12.263799667358398, "global_step": 347304, "epoch": 2067} {"train_loss": -12.214336395263672, "global_step": 347305, "epoch": 2067} {"train_loss": -12.355033874511719, "global_step": 347306, "epoch": 2067} {"train_loss": -12.298580169677734, "global_step": 347307, "epoch": 2067} {"train_loss": -12.163412094116211, "global_step": 347308, "epoch": 2067} {"train_loss": -12.391786575317383, "global_step": 347309, "epoch": 2067} {"train_loss": -12.085111618041992, "global_step": 347310, "epoch": 2067} {"train_loss": -12.08503532409668, "global_step": 347311, "epoch": 2067} {"train_loss": -12.33276081085205, "global_step": 347312, "epoch": 2067} {"train_loss": -12.10181999206543, "global_step": 347313, "epoch": 2067} {"train_loss": -12.22880744934082, "global_step": 347314, "epoch": 2067} {"train_loss": -12.237342834472656, "global_step": 347315, "epoch": 2067} {"train_loss": -12.05029296875, "global_step": 347316, "epoch": 2067} {"train_loss": -11.976991653442383, "global_step": 347317, "epoch": 2067} {"train_loss": -12.431188583374023, "global_step": 347318, "epoch": 2067} {"train_loss": -12.220392227172852, "global_step": 347319, "epoch": 2067} {"train_loss": -12.11011791229248, "global_step": 347320, "epoch": 2067} {"train_loss": -12.262263298034668, "global_step": 347321, "epoch": 2067} {"train_loss": -12.359272003173828, "global_step": 347322, "epoch": 2067} {"train_loss": -12.124850273132324, "global_step": 347323, "epoch": 2067} {"train_loss": -12.053434371948242, "global_step": 347324, "epoch": 2067} {"train_loss": -12.018186569213867, "global_step": 347325, "epoch": 2067} {"train_loss": -11.733114242553711, "global_step": 347326, "epoch": 2067} {"train_loss": -12.161001205444336, "global_step": 347327, "epoch": 2067} {"train_loss": -11.527901649475098, "global_step": 347328, "epoch": 2067} {"train_loss": -11.708312034606934, "global_step": 347329, "epoch": 2067} {"train_loss": -11.57264518737793, "global_step": 347330, "epoch": 2067} {"train_loss": -12.395431518554688, "global_step": 347331, "epoch": 2067} {"train_loss": -11.6669282913208, "global_step": 347332, "epoch": 2067} {"train_loss": -11.99040412902832, "global_step": 347333, "epoch": 2067} {"train_loss": -11.423294067382812, "global_step": 347334, "epoch": 2067} {"train_loss": -11.786998748779297, "global_step": 347335, "epoch": 2067} {"train_loss": -10.909258842468262, "global_step": 347336, "epoch": 2067} {"train_loss": -10.617131233215332, "global_step": 347337, "epoch": 2067} {"train_loss": -11.949017524719238, "global_step": 347338, "epoch": 2067} {"train_loss": -11.403669357299805, "global_step": 347339, "epoch": 2067} {"train_loss": -11.582468032836914, "global_step": 347340, "epoch": 2067} {"train_loss": -11.772796630859375, "global_step": 347341, "epoch": 2067} {"train_loss": -11.762272834777832, "global_step": 347342, "epoch": 2067} {"train_loss": -11.68515682220459, "global_step": 347343, "epoch": 2067} {"train_loss": -11.209659576416016, "global_step": 347344, "epoch": 2067} {"train_loss": -12.2166109085083, "global_step": 347345, "epoch": 2067} {"train_loss": -11.745651245117188, "global_step": 347346, "epoch": 2067} {"train_loss": -10.926170349121094, "global_step": 347347, "epoch": 2067} {"train_loss": -11.571611404418945, "global_step": 347348, "epoch": 2067} {"train_loss": -11.705938339233398, "global_step": 347349, "epoch": 2067} {"train_loss": -11.783102989196777, "global_step": 347350, "epoch": 2067} {"train_loss": -11.446920394897461, "global_step": 347351, "epoch": 2067} {"train_loss": -11.72319221496582, "global_step": 347352, "epoch": 2067} {"train_loss": -11.430351257324219, "global_step": 347353, "epoch": 2067} {"train_loss": -11.862174987792969, "global_step": 347354, "epoch": 2067} {"train_loss": -11.184295654296875, "global_step": 347355, "epoch": 2067} {"train_loss": -11.785950660705566, "global_step": 347356, "epoch": 2067} {"train_loss": -11.446002960205078, "global_step": 347357, "epoch": 2067} {"train_loss": -10.973506927490234, "global_step": 347358, "epoch": 2067} {"train_loss": -11.525723457336426, "global_step": 347359, "epoch": 2067} {"train_loss": -11.964012145996094, "global_step": 347360, "epoch": 2067} {"train_loss": -11.714835166931152, "global_step": 347361, "epoch": 2067} {"train_loss": -12.171804428100586, "global_step": 347362, "epoch": 2067} {"train_loss": -12.026510238647461, "global_step": 347363, "epoch": 2067} {"train_loss": -11.974172592163086, "global_step": 347364, "epoch": 2067} {"train_loss": -11.718804359436035, "global_step": 347365, "epoch": 2067} {"train_loss": -11.945821762084961, "global_step": 347366, "epoch": 2067} {"train_loss": -11.889623641967773, "global_step": 347367, "epoch": 2067} {"train_loss": -11.876077651977539, "global_step": 347368, "epoch": 2067} {"train_loss": -12.342527389526367, "global_step": 347369, "epoch": 2067} {"train_loss": -11.757425308227539, "global_step": 347370, "epoch": 2067} {"train_loss": -12.413578033447266, "global_step": 347371, "epoch": 2067} {"train_loss": -11.730342864990234, "global_step": 347372, "epoch": 2067} {"train_loss": -11.95748519897461, "global_step": 347373, "epoch": 2067} {"train_loss": -12.004537582397461, "global_step": 347374, "epoch": 2067} {"train_loss": -11.968090057373047, "global_step": 347375, "epoch": 2067} {"train_loss": -11.88800048828125, "global_step": 347376, "epoch": 2067} {"train_loss": -12.070425033569336, "global_step": 347377, "epoch": 2067} {"train_loss": -11.891600608825684, "global_step": 347378, "epoch": 2067} {"train_loss": -11.973682403564453, "global_step": 347379, "epoch": 2067} {"train_loss": -12.247915267944336, "global_step": 347380, "epoch": 2067} {"train_loss": -12.130725860595703, "global_step": 347381, "epoch": 2067} {"train_loss": -12.29509449005127, "global_step": 347382, "epoch": 2067} {"train_loss": -12.171675682067871, "global_step": 347383, "epoch": 2067} {"train_loss": -12.45097827911377, "global_step": 347384, "epoch": 2067} {"train_loss": -12.064667701721191, "global_step": 347385, "epoch": 2067} {"train_loss": -12.222688674926758, "global_step": 347386, "epoch": 2067} {"train_loss": -12.11530590057373, "global_step": 347387, "epoch": 2067} {"train_loss": -12.038792610168457, "global_step": 347388, "epoch": 2067} {"train_loss": -12.013901710510254, "global_step": 347389, "epoch": 2067} {"train_loss": -12.359460830688477, "global_step": 347390, "epoch": 2067} {"train_loss": -11.994014739990234, "global_step": 347391, "epoch": 2067} {"train_loss": -12.259614944458008, "global_step": 347392, "epoch": 2067} {"train_loss": -12.355429649353027, "global_step": 347393, "epoch": 2067} {"train_loss": -12.100179672241211, "global_step": 347394, "epoch": 2067} {"train_loss": -12.161293029785156, "global_step": 347395, "epoch": 2067} {"train_loss": -12.110492706298828, "global_step": 347396, "epoch": 2067} {"train_loss": -12.295342445373535, "global_step": 347397, "epoch": 2067} {"train_loss": -11.949178695678711, "global_step": 347398, "epoch": 2067} {"train_loss": -12.129122734069824, "global_step": 347399, "epoch": 2067} {"train_loss": -12.405466079711914, "global_step": 347400, "epoch": 2067} {"train_loss": -11.163606643676758, "global_step": 347401, "epoch": 2067} {"train_loss": -12.121827125549316, "global_step": 347402, "epoch": 2067} {"train_loss": -11.748218536376953, "global_step": 347403, "epoch": 2067} {"train_loss": -12.0865478515625, "global_step": 347404, "epoch": 2067} {"train_loss": -11.860698699951172, "global_step": 347405, "epoch": 2067} {"train_loss": -12.293038368225098, "global_step": 347406, "epoch": 2067} {"train_loss": -11.885661125183105, "global_step": 347407, "epoch": 2067} {"train_loss": -12.176502227783203, "global_step": 347408, "epoch": 2067} {"train_loss": -12.347026824951172, "global_step": 347409, "epoch": 2067} {"train_loss": -12.244653701782227, "global_step": 347410, "epoch": 2067} {"train_loss": -12.40685749053955, "global_step": 347411, "epoch": 2067} {"train_loss": -12.26422119140625, "global_step": 347412, "epoch": 2067} {"train_loss": -12.69045639038086, "global_step": 347413, "epoch": 2067} {"train_loss": -12.35012149810791, "global_step": 347414, "epoch": 2067} {"train_loss": -12.600248336791992, "global_step": 347415, "epoch": 2067} {"train_loss": -12.437535285949707, "global_step": 347416, "epoch": 2067} {"train_loss": -12.263429641723633, "global_step": 347417, "epoch": 2067} {"train_loss": -12.547954559326172, "global_step": 347418, "epoch": 2067} {"train_loss": -12.240644454956055, "global_step": 347419, "epoch": 2067} {"train_loss": -11.998296737670898, "global_step": 347420, "epoch": 2067} {"train_loss": -12.563810348510742, "global_step": 347421, "epoch": 2067} {"train_loss": -12.137750625610352, "global_step": 347422, "epoch": 2067} {"train_loss": -11.98110120069413, "global_step": 347423, "epoch": 2067, "val_loss": 286767.46875} {"train_loss": -11.992616653442383, "global_step": 347424, "epoch": 2068} {"train_loss": -12.448294639587402, "global_step": 347425, "epoch": 2068} {"train_loss": -12.24128532409668, "global_step": 347426, "epoch": 2068} {"train_loss": -12.088592529296875, "global_step": 347427, "epoch": 2068} {"train_loss": -12.203851699829102, "global_step": 347428, "epoch": 2068} {"train_loss": -12.389446258544922, "global_step": 347429, "epoch": 2068} {"train_loss": -12.23698616027832, "global_step": 347430, "epoch": 2068} {"train_loss": -12.21647834777832, "global_step": 347431, "epoch": 2068} {"train_loss": -12.34750747680664, "global_step": 347432, "epoch": 2068} {"train_loss": -12.007706642150879, "global_step": 347433, "epoch": 2068} {"train_loss": -12.306032180786133, "global_step": 347434, "epoch": 2068} {"train_loss": -12.197654724121094, "global_step": 347435, "epoch": 2068} {"train_loss": -12.45962905883789, "global_step": 347436, "epoch": 2068} {"train_loss": -12.239555358886719, "global_step": 347437, "epoch": 2068} {"train_loss": -11.863672256469727, "global_step": 347438, "epoch": 2068} {"train_loss": -11.954682350158691, "global_step": 347439, "epoch": 2068} {"train_loss": -12.031980514526367, "global_step": 347440, "epoch": 2068} {"train_loss": -12.311030387878418, "global_step": 347441, "epoch": 2068} {"train_loss": -12.388840675354004, "global_step": 347442, "epoch": 2068} {"train_loss": -12.340827941894531, "global_step": 347443, "epoch": 2068} {"train_loss": -12.614703178405762, "global_step": 347444, "epoch": 2068} {"train_loss": -12.315635681152344, "global_step": 347445, "epoch": 2068} {"train_loss": -12.52931022644043, "global_step": 347446, "epoch": 2068} {"train_loss": -12.265358924865723, "global_step": 347447, "epoch": 2068} {"train_loss": -12.491255760192871, "global_step": 347448, "epoch": 2068} {"train_loss": -12.191991806030273, "global_step": 347449, "epoch": 2068} {"train_loss": -12.077691078186035, "global_step": 347450, "epoch": 2068} {"train_loss": -12.041728019714355, "global_step": 347451, "epoch": 2068} {"train_loss": -12.364999771118164, "global_step": 347452, "epoch": 2068} {"train_loss": -12.526826858520508, "global_step": 347453, "epoch": 2068} {"train_loss": -12.166284561157227, "global_step": 347454, "epoch": 2068} {"train_loss": -12.254472732543945, "global_step": 347455, "epoch": 2068} {"train_loss": -12.141632080078125, "global_step": 347456, "epoch": 2068} {"train_loss": -12.45416259765625, "global_step": 347457, "epoch": 2068} {"train_loss": -12.049418449401855, "global_step": 347458, "epoch": 2068} {"train_loss": -12.144477844238281, "global_step": 347459, "epoch": 2068} {"train_loss": -12.149675369262695, "global_step": 347460, "epoch": 2068} {"train_loss": -11.932373046875, "global_step": 347461, "epoch": 2068} {"train_loss": -12.212077140808105, "global_step": 347462, "epoch": 2068} {"train_loss": -12.426422119140625, "global_step": 347463, "epoch": 2068} {"train_loss": -12.31545352935791, "global_step": 347464, "epoch": 2068} {"train_loss": -12.401910781860352, "global_step": 347465, "epoch": 2068} {"train_loss": -12.140567779541016, "global_step": 347466, "epoch": 2068} {"train_loss": -12.390480041503906, "global_step": 347467, "epoch": 2068} {"train_loss": -12.420116424560547, "global_step": 347468, "epoch": 2068} {"train_loss": -12.162385940551758, "global_step": 347469, "epoch": 2068} {"train_loss": -11.331205368041992, "global_step": 347470, "epoch": 2068} {"train_loss": -12.188716888427734, "global_step": 347471, "epoch": 2068} {"train_loss": -12.119376182556152, "global_step": 347472, "epoch": 2068} {"train_loss": -11.719645500183105, "global_step": 347473, "epoch": 2068} {"train_loss": -11.630077362060547, "global_step": 347474, "epoch": 2068} {"train_loss": -12.148993492126465, "global_step": 347475, "epoch": 2068} {"train_loss": -12.048870086669922, "global_step": 347476, "epoch": 2068} {"train_loss": -11.567310333251953, "global_step": 347477, "epoch": 2068} {"train_loss": -11.333301544189453, "global_step": 347478, "epoch": 2068} {"train_loss": -12.509054183959961, "global_step": 347479, "epoch": 2068} {"train_loss": -11.881645202636719, "global_step": 347480, "epoch": 2068} {"train_loss": -11.099138259887695, "global_step": 347481, "epoch": 2068} {"train_loss": -11.84300422668457, "global_step": 347482, "epoch": 2068} {"train_loss": -12.073165893554688, "global_step": 347483, "epoch": 2068} {"train_loss": -11.901650428771973, "global_step": 347484, "epoch": 2068} {"train_loss": -12.358280181884766, "global_step": 347485, "epoch": 2068} {"train_loss": -11.61131477355957, "global_step": 347486, "epoch": 2068} {"train_loss": -11.447944641113281, "global_step": 347487, "epoch": 2068} {"train_loss": -11.42189884185791, "global_step": 347488, "epoch": 2068} {"train_loss": -12.42879867553711, "global_step": 347489, "epoch": 2068} {"train_loss": -10.9248685836792, "global_step": 347490, "epoch": 2068} {"train_loss": -11.099580764770508, "global_step": 347491, "epoch": 2068} {"train_loss": -11.905683517456055, "global_step": 347492, "epoch": 2068} {"train_loss": -9.5391845703125, "global_step": 347493, "epoch": 2068} {"train_loss": -11.586551666259766, "global_step": 347494, "epoch": 2068} {"train_loss": -9.98227310180664, "global_step": 347495, "epoch": 2068} {"train_loss": -10.968239784240723, "global_step": 347496, "epoch": 2068} {"train_loss": -12.02438735961914, "global_step": 347497, "epoch": 2068} {"train_loss": -11.351871490478516, "global_step": 347498, "epoch": 2068} {"train_loss": -12.223651885986328, "global_step": 347499, "epoch": 2068} {"train_loss": -12.042303085327148, "global_step": 347500, "epoch": 2068} {"train_loss": -11.976274490356445, "global_step": 347501, "epoch": 2068} {"train_loss": -12.178947448730469, "global_step": 347502, "epoch": 2068} {"train_loss": -11.95803451538086, "global_step": 347503, "epoch": 2068} {"train_loss": -12.255781173706055, "global_step": 347504, "epoch": 2068} {"train_loss": -12.291364669799805, "global_step": 347505, "epoch": 2068} {"train_loss": -12.185426712036133, "global_step": 347506, "epoch": 2068} {"train_loss": -12.414862632751465, "global_step": 347507, "epoch": 2068} {"train_loss": -12.127288818359375, "global_step": 347508, "epoch": 2068} {"train_loss": -12.037370681762695, "global_step": 347509, "epoch": 2068} {"train_loss": -12.133720397949219, "global_step": 347510, "epoch": 2068} {"train_loss": -12.087156295776367, "global_step": 347511, "epoch": 2068} {"train_loss": -12.112266540527344, "global_step": 347512, "epoch": 2068} {"train_loss": -11.982044219970703, "global_step": 347513, "epoch": 2068} {"train_loss": -12.26764965057373, "global_step": 347514, "epoch": 2068} {"train_loss": -12.168676376342773, "global_step": 347515, "epoch": 2068} {"train_loss": -11.893339157104492, "global_step": 347516, "epoch": 2068} {"train_loss": -12.320993423461914, "global_step": 347517, "epoch": 2068} {"train_loss": -12.127361297607422, "global_step": 347518, "epoch": 2068} {"train_loss": -12.024246215820312, "global_step": 347519, "epoch": 2068} {"train_loss": -12.140626907348633, "global_step": 347520, "epoch": 2068} {"train_loss": -12.035204887390137, "global_step": 347521, "epoch": 2068} {"train_loss": -12.48169231414795, "global_step": 347522, "epoch": 2068} {"train_loss": -11.645082473754883, "global_step": 347523, "epoch": 2068} {"train_loss": -11.994610786437988, "global_step": 347524, "epoch": 2068} {"train_loss": -11.720033645629883, "global_step": 347525, "epoch": 2068} {"train_loss": -11.153526306152344, "global_step": 347526, "epoch": 2068} {"train_loss": -12.030176162719727, "global_step": 347527, "epoch": 2068} {"train_loss": -10.323816299438477, "global_step": 347528, "epoch": 2068} {"train_loss": -11.931802749633789, "global_step": 347529, "epoch": 2068} {"train_loss": -11.620196342468262, "global_step": 347530, "epoch": 2068} {"train_loss": -12.02498722076416, "global_step": 347531, "epoch": 2068} {"train_loss": -11.908271789550781, "global_step": 347532, "epoch": 2068} {"train_loss": -11.599472999572754, "global_step": 347533, "epoch": 2068} {"train_loss": -12.098419189453125, "global_step": 347534, "epoch": 2068} {"train_loss": -12.110235214233398, "global_step": 347535, "epoch": 2068} {"train_loss": -12.427791595458984, "global_step": 347536, "epoch": 2068} {"train_loss": -12.016170501708984, "global_step": 347537, "epoch": 2068} {"train_loss": -12.184664726257324, "global_step": 347538, "epoch": 2068} {"train_loss": -12.343291282653809, "global_step": 347539, "epoch": 2068} {"train_loss": -12.158172607421875, "global_step": 347540, "epoch": 2068} {"train_loss": -12.171992301940918, "global_step": 347541, "epoch": 2068} {"train_loss": -12.375431060791016, "global_step": 347542, "epoch": 2068} {"train_loss": -12.313602447509766, "global_step": 347543, "epoch": 2068} {"train_loss": -12.34307861328125, "global_step": 347544, "epoch": 2068} {"train_loss": -12.174118995666504, "global_step": 347545, "epoch": 2068} {"train_loss": -12.480554580688477, "global_step": 347546, "epoch": 2068} {"train_loss": -12.212604522705078, "global_step": 347547, "epoch": 2068} {"train_loss": -12.179387092590332, "global_step": 347548, "epoch": 2068} {"train_loss": -12.508657455444336, "global_step": 347549, "epoch": 2068} {"train_loss": -12.308911323547363, "global_step": 347550, "epoch": 2068} {"train_loss": -12.242996215820312, "global_step": 347551, "epoch": 2068} {"train_loss": -12.338375091552734, "global_step": 347552, "epoch": 2068} {"train_loss": -11.963976860046387, "global_step": 347553, "epoch": 2068} {"train_loss": -12.375286102294922, "global_step": 347554, "epoch": 2068} {"train_loss": -11.886856079101562, "global_step": 347555, "epoch": 2068} {"train_loss": -11.437889099121094, "global_step": 347556, "epoch": 2068} {"train_loss": -11.33309555053711, "global_step": 347557, "epoch": 2068} {"train_loss": -11.573226928710938, "global_step": 347558, "epoch": 2068} {"train_loss": -11.941092491149902, "global_step": 347559, "epoch": 2068} {"train_loss": -10.809226989746094, "global_step": 347560, "epoch": 2068} {"train_loss": -9.606578826904297, "global_step": 347561, "epoch": 2068} {"train_loss": -9.845438003540039, "global_step": 347562, "epoch": 2068} {"train_loss": -10.929454803466797, "global_step": 347563, "epoch": 2068} {"train_loss": -10.490440368652344, "global_step": 347564, "epoch": 2068} {"train_loss": -9.678443908691406, "global_step": 347565, "epoch": 2068} {"train_loss": -10.781185150146484, "global_step": 347566, "epoch": 2068} {"train_loss": -10.75555419921875, "global_step": 347567, "epoch": 2068} {"train_loss": -8.889533996582031, "global_step": 347568, "epoch": 2068} {"train_loss": -9.982789993286133, "global_step": 347569, "epoch": 2068} {"train_loss": -9.895124435424805, "global_step": 347570, "epoch": 2068} {"train_loss": -11.073806762695312, "global_step": 347571, "epoch": 2068} {"train_loss": -8.856185913085938, "global_step": 347572, "epoch": 2068} {"train_loss": -10.571428298950195, "global_step": 347573, "epoch": 2068} {"train_loss": -10.720333099365234, "global_step": 347574, "epoch": 2068} {"train_loss": -11.27254867553711, "global_step": 347575, "epoch": 2068} {"train_loss": -10.554258346557617, "global_step": 347576, "epoch": 2068} {"train_loss": -11.547419548034668, "global_step": 347577, "epoch": 2068} {"train_loss": -11.305665969848633, "global_step": 347578, "epoch": 2068} {"train_loss": -10.818379402160645, "global_step": 347579, "epoch": 2068} {"train_loss": -11.629311561584473, "global_step": 347580, "epoch": 2068} {"train_loss": -11.041929244995117, "global_step": 347581, "epoch": 2068} {"train_loss": -11.549808502197266, "global_step": 347582, "epoch": 2068} {"train_loss": -11.37204360961914, "global_step": 347583, "epoch": 2068} {"train_loss": -11.055784225463867, "global_step": 347584, "epoch": 2068} {"train_loss": -11.725049018859863, "global_step": 347585, "epoch": 2068} {"train_loss": -11.563889503479004, "global_step": 347586, "epoch": 2068} {"train_loss": -11.693572044372559, "global_step": 347587, "epoch": 2068} {"train_loss": -11.743634223937988, "global_step": 347588, "epoch": 2068} {"train_loss": -11.110217094421387, "global_step": 347589, "epoch": 2068} {"train_loss": -12.060746192932129, "global_step": 347590, "epoch": 2068} {"train_loss": -11.790382339840843, "global_step": 347591, "epoch": 2068, "val_loss": 284017.46875} {"train_loss": -11.959291458129883, "global_step": 347592, "epoch": 2069} {"train_loss": -11.24836540222168, "global_step": 347593, "epoch": 2069} {"train_loss": -11.886783599853516, "global_step": 347594, "epoch": 2069} {"train_loss": -11.965370178222656, "global_step": 347595, "epoch": 2069} {"train_loss": -11.811336517333984, "global_step": 347596, "epoch": 2069} {"train_loss": -12.201977729797363, "global_step": 347597, "epoch": 2069} {"train_loss": -11.817733764648438, "global_step": 347598, "epoch": 2069} {"train_loss": -11.856277465820312, "global_step": 347599, "epoch": 2069} {"train_loss": -12.075526237487793, "global_step": 347600, "epoch": 2069} {"train_loss": -11.828697204589844, "global_step": 347601, "epoch": 2069} {"train_loss": -12.285840034484863, "global_step": 347602, "epoch": 2069} {"train_loss": -11.990474700927734, "global_step": 347603, "epoch": 2069} {"train_loss": -12.095120429992676, "global_step": 347604, "epoch": 2069} {"train_loss": -12.026468276977539, "global_step": 347605, "epoch": 2069} {"train_loss": -11.97437858581543, "global_step": 347606, "epoch": 2069} {"train_loss": -12.151348114013672, "global_step": 347607, "epoch": 2069} {"train_loss": -12.345671653747559, "global_step": 347608, "epoch": 2069} {"train_loss": -12.052446365356445, "global_step": 347609, "epoch": 2069} {"train_loss": -12.331934928894043, "global_step": 347610, "epoch": 2069} {"train_loss": -12.100040435791016, "global_step": 347611, "epoch": 2069} {"train_loss": -11.980636596679688, "global_step": 347612, "epoch": 2069} {"train_loss": -12.314300537109375, "global_step": 347613, "epoch": 2069} {"train_loss": -11.903084754943848, "global_step": 347614, "epoch": 2069} {"train_loss": -12.45965576171875, "global_step": 347615, "epoch": 2069} {"train_loss": -12.331472396850586, "global_step": 347616, "epoch": 2069} {"train_loss": -11.896406173706055, "global_step": 347617, "epoch": 2069} {"train_loss": -11.998367309570312, "global_step": 347618, "epoch": 2069} {"train_loss": -12.331092834472656, "global_step": 347619, "epoch": 2069} {"train_loss": -12.289051055908203, "global_step": 347620, "epoch": 2069} {"train_loss": -12.383866310119629, "global_step": 347621, "epoch": 2069} {"train_loss": -12.506987571716309, "global_step": 347622, "epoch": 2069} {"train_loss": -12.424816131591797, "global_step": 347623, "epoch": 2069} {"train_loss": -12.420976638793945, "global_step": 347624, "epoch": 2069} {"train_loss": -12.319087982177734, "global_step": 347625, "epoch": 2069} {"train_loss": -12.444616317749023, "global_step": 347626, "epoch": 2069} {"train_loss": -12.400022506713867, "global_step": 347627, "epoch": 2069} {"train_loss": -12.368861198425293, "global_step": 347628, "epoch": 2069} {"train_loss": -12.45559024810791, "global_step": 347629, "epoch": 2069} {"train_loss": -12.569910049438477, "global_step": 347630, "epoch": 2069} {"train_loss": -12.455221176147461, "global_step": 347631, "epoch": 2069} {"train_loss": -12.448119163513184, "global_step": 347632, "epoch": 2069} {"train_loss": -12.201740264892578, "global_step": 347633, "epoch": 2069} {"train_loss": -12.21200942993164, "global_step": 347634, "epoch": 2069} {"train_loss": -12.164984703063965, "global_step": 347635, "epoch": 2069} {"train_loss": -12.56874942779541, "global_step": 347636, "epoch": 2069} {"train_loss": -12.41514778137207, "global_step": 347637, "epoch": 2069} {"train_loss": -12.482032775878906, "global_step": 347638, "epoch": 2069} {"train_loss": -12.33616828918457, "global_step": 347639, "epoch": 2069} {"train_loss": -12.51760482788086, "global_step": 347640, "epoch": 2069} {"train_loss": -12.424775123596191, "global_step": 347641, "epoch": 2069} {"train_loss": -12.557465553283691, "global_step": 347642, "epoch": 2069} {"train_loss": -12.539979934692383, "global_step": 347643, "epoch": 2069} {"train_loss": -12.517120361328125, "global_step": 347644, "epoch": 2069} {"train_loss": -12.523727416992188, "global_step": 347645, "epoch": 2069} {"train_loss": -12.570082664489746, "global_step": 347646, "epoch": 2069} {"train_loss": -12.386797904968262, "global_step": 347647, "epoch": 2069} {"train_loss": -12.51067066192627, "global_step": 347648, "epoch": 2069} {"train_loss": -12.675142288208008, "global_step": 347649, "epoch": 2069} {"train_loss": -12.661224365234375, "global_step": 347650, "epoch": 2069} {"train_loss": -12.455546379089355, "global_step": 347651, "epoch": 2069} {"train_loss": -12.667215347290039, "global_step": 347652, "epoch": 2069} {"train_loss": -12.70836067199707, "global_step": 347653, "epoch": 2069} {"train_loss": -12.444161415100098, "global_step": 347654, "epoch": 2069} {"train_loss": -12.551631927490234, "global_step": 347655, "epoch": 2069} {"train_loss": -12.815887451171875, "global_step": 347656, "epoch": 2069} {"train_loss": -12.538991928100586, "global_step": 347657, "epoch": 2069} {"train_loss": -12.528409004211426, "global_step": 347658, "epoch": 2069} {"train_loss": -12.454292297363281, "global_step": 347659, "epoch": 2069} {"train_loss": -11.745243072509766, "global_step": 347660, "epoch": 2069} {"train_loss": -11.359195709228516, "global_step": 347661, "epoch": 2069} {"train_loss": -11.87724781036377, "global_step": 347662, "epoch": 2069} {"train_loss": -12.52049732208252, "global_step": 347663, "epoch": 2069} {"train_loss": -11.374761581420898, "global_step": 347664, "epoch": 2069} {"train_loss": -11.741473197937012, "global_step": 347665, "epoch": 2069} {"train_loss": -10.907747268676758, "global_step": 347666, "epoch": 2069} {"train_loss": -9.717342376708984, "global_step": 347667, "epoch": 2069} {"train_loss": -10.781902313232422, "global_step": 347668, "epoch": 2069} {"train_loss": -7.808365821838379, "global_step": 347669, "epoch": 2069} {"train_loss": -7.651928424835205, "global_step": 347670, "epoch": 2069} {"train_loss": -7.787015914916992, "global_step": 347671, "epoch": 2069} {"train_loss": -7.211030006408691, "global_step": 347672, "epoch": 2069} {"train_loss": -7.745446681976318, "global_step": 347673, "epoch": 2069} {"train_loss": -8.936883926391602, "global_step": 347674, "epoch": 2069} {"train_loss": -8.447345733642578, "global_step": 347675, "epoch": 2069} {"train_loss": -8.728778839111328, "global_step": 347676, "epoch": 2069} {"train_loss": -8.150415420532227, "global_step": 347677, "epoch": 2069} {"train_loss": -9.319925308227539, "global_step": 347678, "epoch": 2069} {"train_loss": -9.479206085205078, "global_step": 347679, "epoch": 2069} {"train_loss": -10.570196151733398, "global_step": 347680, "epoch": 2069} {"train_loss": -9.876350402832031, "global_step": 347681, "epoch": 2069} {"train_loss": -11.417546272277832, "global_step": 347682, "epoch": 2069} {"train_loss": -10.832433700561523, "global_step": 347683, "epoch": 2069} {"train_loss": -10.726458549499512, "global_step": 347684, "epoch": 2069} {"train_loss": -9.86905574798584, "global_step": 347685, "epoch": 2069} {"train_loss": -10.297061920166016, "global_step": 347686, "epoch": 2069} {"train_loss": -10.490856170654297, "global_step": 347687, "epoch": 2069} {"train_loss": -11.234701156616211, "global_step": 347688, "epoch": 2069} {"train_loss": -11.312767028808594, "global_step": 347689, "epoch": 2069} {"train_loss": -10.634695053100586, "global_step": 347690, "epoch": 2069} {"train_loss": -11.759339332580566, "global_step": 347691, "epoch": 2069} {"train_loss": -10.783615112304688, "global_step": 347692, "epoch": 2069} {"train_loss": -12.150582313537598, "global_step": 347693, "epoch": 2069} {"train_loss": -11.123165130615234, "global_step": 347694, "epoch": 2069} {"train_loss": -12.015228271484375, "global_step": 347695, "epoch": 2069} {"train_loss": -11.691876411437988, "global_step": 347696, "epoch": 2069} {"train_loss": -11.59405517578125, "global_step": 347697, "epoch": 2069} {"train_loss": -11.840974807739258, "global_step": 347698, "epoch": 2069} {"train_loss": -11.602263450622559, "global_step": 347699, "epoch": 2069} {"train_loss": -12.092658996582031, "global_step": 347700, "epoch": 2069} {"train_loss": -11.872802734375, "global_step": 347701, "epoch": 2069} {"train_loss": -12.211701393127441, "global_step": 347702, "epoch": 2069} {"train_loss": -11.813047409057617, "global_step": 347703, "epoch": 2069} {"train_loss": -12.071816444396973, "global_step": 347704, "epoch": 2069} {"train_loss": -11.82652473449707, "global_step": 347705, "epoch": 2069} {"train_loss": -12.037657737731934, "global_step": 347706, "epoch": 2069} {"train_loss": -11.8485746383667, "global_step": 347707, "epoch": 2069} {"train_loss": -12.005086898803711, "global_step": 347708, "epoch": 2069} {"train_loss": -12.123504638671875, "global_step": 347709, "epoch": 2069} {"train_loss": -12.180904388427734, "global_step": 347710, "epoch": 2069} {"train_loss": -12.132247924804688, "global_step": 347711, "epoch": 2069} {"train_loss": -11.975481033325195, "global_step": 347712, "epoch": 2069} {"train_loss": -12.167491912841797, "global_step": 347713, "epoch": 2069} {"train_loss": -12.19971752166748, "global_step": 347714, "epoch": 2069} {"train_loss": -12.028657913208008, "global_step": 347715, "epoch": 2069} {"train_loss": -12.02316951751709, "global_step": 347716, "epoch": 2069} {"train_loss": -12.087804794311523, "global_step": 347717, "epoch": 2069} {"train_loss": -12.188899993896484, "global_step": 347718, "epoch": 2069} {"train_loss": -11.869956970214844, "global_step": 347719, "epoch": 2069} {"train_loss": -12.136444091796875, "global_step": 347720, "epoch": 2069} {"train_loss": -12.006691932678223, "global_step": 347721, "epoch": 2069} {"train_loss": -11.92498779296875, "global_step": 347722, "epoch": 2069} {"train_loss": -12.08133316040039, "global_step": 347723, "epoch": 2069} {"train_loss": -11.372293472290039, "global_step": 347724, "epoch": 2069} {"train_loss": -11.945825576782227, "global_step": 347725, "epoch": 2069} {"train_loss": -12.203516006469727, "global_step": 347726, "epoch": 2069} {"train_loss": -11.010675430297852, "global_step": 347727, "epoch": 2069} {"train_loss": -11.991220474243164, "global_step": 347728, "epoch": 2069} {"train_loss": -11.717899322509766, "global_step": 347729, "epoch": 2069} {"train_loss": -11.930403709411621, "global_step": 347730, "epoch": 2069} {"train_loss": -12.262451171875, "global_step": 347731, "epoch": 2069} {"train_loss": -11.52876091003418, "global_step": 347732, "epoch": 2069} {"train_loss": -12.391998291015625, "global_step": 347733, "epoch": 2069} {"train_loss": -11.656384468078613, "global_step": 347734, "epoch": 2069} {"train_loss": -12.031672477722168, "global_step": 347735, "epoch": 2069} {"train_loss": -12.326129913330078, "global_step": 347736, "epoch": 2069} {"train_loss": -12.075334548950195, "global_step": 347737, "epoch": 2069} {"train_loss": -12.026934623718262, "global_step": 347738, "epoch": 2069} {"train_loss": -12.061363220214844, "global_step": 347739, "epoch": 2069} {"train_loss": -12.208353042602539, "global_step": 347740, "epoch": 2069} {"train_loss": -11.744747161865234, "global_step": 347741, "epoch": 2069} {"train_loss": -12.255971908569336, "global_step": 347742, "epoch": 2069} {"train_loss": -11.815648078918457, "global_step": 347743, "epoch": 2069} {"train_loss": -12.18951416015625, "global_step": 347744, "epoch": 2069} {"train_loss": -12.398646354675293, "global_step": 347745, "epoch": 2069} {"train_loss": -11.817212104797363, "global_step": 347746, "epoch": 2069} {"train_loss": -12.344400405883789, "global_step": 347747, "epoch": 2069} {"train_loss": -12.023194313049316, "global_step": 347748, "epoch": 2069} {"train_loss": -12.501992225646973, "global_step": 347749, "epoch": 2069} {"train_loss": -12.127449035644531, "global_step": 347750, "epoch": 2069} {"train_loss": -12.39346694946289, "global_step": 347751, "epoch": 2069} {"train_loss": -12.27096176147461, "global_step": 347752, "epoch": 2069} {"train_loss": -12.290143966674805, "global_step": 347753, "epoch": 2069} {"train_loss": -12.233123779296875, "global_step": 347754, "epoch": 2069} {"train_loss": -12.398923873901367, "global_step": 347755, "epoch": 2069} {"train_loss": -12.19957160949707, "global_step": 347756, "epoch": 2069} {"train_loss": -12.165255546569824, "global_step": 347757, "epoch": 2069} {"train_loss": -12.058100700378418, "global_step": 347758, "epoch": 2069} {"train_loss": -11.75177614461808, "global_step": 347759, "epoch": 2069, "val_loss": 284296.53125} {"train_loss": -12.464975357055664, "global_step": 347760, "epoch": 2070} {"train_loss": -12.39498519897461, "global_step": 347761, "epoch": 2070} {"train_loss": -12.423219680786133, "global_step": 347762, "epoch": 2070} {"train_loss": -12.213058471679688, "global_step": 347763, "epoch": 2070} {"train_loss": -12.303434371948242, "global_step": 347764, "epoch": 2070} {"train_loss": -11.957094192504883, "global_step": 347765, "epoch": 2070} {"train_loss": -11.933996200561523, "global_step": 347766, "epoch": 2070} {"train_loss": -12.294694900512695, "global_step": 347767, "epoch": 2070} {"train_loss": -12.385019302368164, "global_step": 347768, "epoch": 2070} {"train_loss": -11.94102668762207, "global_step": 347769, "epoch": 2070} {"train_loss": -12.573314666748047, "global_step": 347770, "epoch": 2070} {"train_loss": -11.947124481201172, "global_step": 347771, "epoch": 2070} {"train_loss": -12.397035598754883, "global_step": 347772, "epoch": 2070} {"train_loss": -12.054438591003418, "global_step": 347773, "epoch": 2070} {"train_loss": -12.424169540405273, "global_step": 347774, "epoch": 2070} {"train_loss": -12.228288650512695, "global_step": 347775, "epoch": 2070} {"train_loss": -12.392707824707031, "global_step": 347776, "epoch": 2070} {"train_loss": -12.152029037475586, "global_step": 347777, "epoch": 2070} {"train_loss": -12.500213623046875, "global_step": 347778, "epoch": 2070} {"train_loss": -12.439990997314453, "global_step": 347779, "epoch": 2070} {"train_loss": -12.188497543334961, "global_step": 347780, "epoch": 2070} {"train_loss": -12.164510726928711, "global_step": 347781, "epoch": 2070} {"train_loss": -12.38216495513916, "global_step": 347782, "epoch": 2070} {"train_loss": -12.502857208251953, "global_step": 347783, "epoch": 2070} {"train_loss": -12.50922966003418, "global_step": 347784, "epoch": 2070} {"train_loss": -12.156299591064453, "global_step": 347785, "epoch": 2070} {"train_loss": -12.330741882324219, "global_step": 347786, "epoch": 2070} {"train_loss": -12.4910888671875, "global_step": 347787, "epoch": 2070} {"train_loss": -12.11934757232666, "global_step": 347788, "epoch": 2070} {"train_loss": -12.144042015075684, "global_step": 347789, "epoch": 2070} {"train_loss": -12.616521835327148, "global_step": 347790, "epoch": 2070} {"train_loss": -12.575153350830078, "global_step": 347791, "epoch": 2070} {"train_loss": -12.427312850952148, "global_step": 347792, "epoch": 2070} {"train_loss": -12.677453994750977, "global_step": 347793, "epoch": 2070} {"train_loss": -12.076306343078613, "global_step": 347794, "epoch": 2070} {"train_loss": -12.246797561645508, "global_step": 347795, "epoch": 2070} {"train_loss": -12.444656372070312, "global_step": 347796, "epoch": 2070} {"train_loss": -12.19517707824707, "global_step": 347797, "epoch": 2070} {"train_loss": -12.244930267333984, "global_step": 347798, "epoch": 2070} {"train_loss": -12.29963207244873, "global_step": 347799, "epoch": 2070} {"train_loss": -12.445099830627441, "global_step": 347800, "epoch": 2070} {"train_loss": -12.358792304992676, "global_step": 347801, "epoch": 2070} {"train_loss": -12.352376937866211, "global_step": 347802, "epoch": 2070} {"train_loss": -11.987104415893555, "global_step": 347803, "epoch": 2070} {"train_loss": -12.534533500671387, "global_step": 347804, "epoch": 2070} {"train_loss": -12.513298034667969, "global_step": 347805, "epoch": 2070} {"train_loss": -12.472091674804688, "global_step": 347806, "epoch": 2070} {"train_loss": -12.327367782592773, "global_step": 347807, "epoch": 2070} {"train_loss": -12.223875045776367, "global_step": 347808, "epoch": 2070} {"train_loss": -11.826967239379883, "global_step": 347809, "epoch": 2070} {"train_loss": -12.453801155090332, "global_step": 347810, "epoch": 2070} {"train_loss": -12.07868766784668, "global_step": 347811, "epoch": 2070} {"train_loss": -12.175376892089844, "global_step": 347812, "epoch": 2070} {"train_loss": -12.130796432495117, "global_step": 347813, "epoch": 2070} {"train_loss": -12.189352035522461, "global_step": 347814, "epoch": 2070} {"train_loss": -11.673800468444824, "global_step": 347815, "epoch": 2070} {"train_loss": -12.382566452026367, "global_step": 347816, "epoch": 2070} {"train_loss": -12.231481552124023, "global_step": 347817, "epoch": 2070} {"train_loss": -12.314565658569336, "global_step": 347818, "epoch": 2070} {"train_loss": -11.886846542358398, "global_step": 347819, "epoch": 2070} {"train_loss": -12.211243629455566, "global_step": 347820, "epoch": 2070} {"train_loss": -12.27674674987793, "global_step": 347821, "epoch": 2070} {"train_loss": -11.81906509399414, "global_step": 347822, "epoch": 2070} {"train_loss": -12.382370948791504, "global_step": 347823, "epoch": 2070} {"train_loss": -12.009013175964355, "global_step": 347824, "epoch": 2070} {"train_loss": -11.979263305664062, "global_step": 347825, "epoch": 2070} {"train_loss": -11.525368690490723, "global_step": 347826, "epoch": 2070} {"train_loss": -11.234559059143066, "global_step": 347827, "epoch": 2070} {"train_loss": -12.175317764282227, "global_step": 347828, "epoch": 2070} {"train_loss": -12.267168045043945, "global_step": 347829, "epoch": 2070} {"train_loss": -12.437040328979492, "global_step": 347830, "epoch": 2070} {"train_loss": -11.55125617980957, "global_step": 347831, "epoch": 2070} {"train_loss": -11.81035041809082, "global_step": 347832, "epoch": 2070} {"train_loss": -12.469332695007324, "global_step": 347833, "epoch": 2070} {"train_loss": -12.076909065246582, "global_step": 347834, "epoch": 2070} {"train_loss": -11.846332550048828, "global_step": 347835, "epoch": 2070} {"train_loss": -12.051509857177734, "global_step": 347836, "epoch": 2070} {"train_loss": -12.18602180480957, "global_step": 347837, "epoch": 2070} {"train_loss": -11.860986709594727, "global_step": 347838, "epoch": 2070} {"train_loss": -11.369582176208496, "global_step": 347839, "epoch": 2070} {"train_loss": -11.82470703125, "global_step": 347840, "epoch": 2070} {"train_loss": -11.708850860595703, "global_step": 347841, "epoch": 2070} {"train_loss": -11.805537223815918, "global_step": 347842, "epoch": 2070} {"train_loss": -11.696170806884766, "global_step": 347843, "epoch": 2070} {"train_loss": -12.286949157714844, "global_step": 347844, "epoch": 2070} {"train_loss": -11.9615478515625, "global_step": 347845, "epoch": 2070} {"train_loss": -12.456709861755371, "global_step": 347846, "epoch": 2070} {"train_loss": -12.145306587219238, "global_step": 347847, "epoch": 2070} {"train_loss": -11.821832656860352, "global_step": 347848, "epoch": 2070} {"train_loss": -11.00067138671875, "global_step": 347849, "epoch": 2070} {"train_loss": -12.138779640197754, "global_step": 347850, "epoch": 2070} {"train_loss": -10.672764778137207, "global_step": 347851, "epoch": 2070} {"train_loss": -11.559833526611328, "global_step": 347852, "epoch": 2070} {"train_loss": -11.61390495300293, "global_step": 347853, "epoch": 2070} {"train_loss": -10.516897201538086, "global_step": 347854, "epoch": 2070} {"train_loss": -10.556437492370605, "global_step": 347855, "epoch": 2070} {"train_loss": -12.159197807312012, "global_step": 347856, "epoch": 2070} {"train_loss": -11.22303295135498, "global_step": 347857, "epoch": 2070} {"train_loss": -12.242615699768066, "global_step": 347858, "epoch": 2070} {"train_loss": -11.082937240600586, "global_step": 347859, "epoch": 2070} {"train_loss": -11.501119613647461, "global_step": 347860, "epoch": 2070} {"train_loss": -11.640604019165039, "global_step": 347861, "epoch": 2070} {"train_loss": -11.023515701293945, "global_step": 347862, "epoch": 2070} {"train_loss": -11.928382873535156, "global_step": 347863, "epoch": 2070} {"train_loss": -11.185282707214355, "global_step": 347864, "epoch": 2070} {"train_loss": -11.548576354980469, "global_step": 347865, "epoch": 2070} {"train_loss": -11.743942260742188, "global_step": 347866, "epoch": 2070} {"train_loss": -10.840818405151367, "global_step": 347867, "epoch": 2070} {"train_loss": -12.053536415100098, "global_step": 347868, "epoch": 2070} {"train_loss": -10.758724212646484, "global_step": 347869, "epoch": 2070} {"train_loss": -11.980011940002441, "global_step": 347870, "epoch": 2070} {"train_loss": -11.016218185424805, "global_step": 347871, "epoch": 2070} {"train_loss": -11.83798599243164, "global_step": 347872, "epoch": 2070} {"train_loss": -11.831567764282227, "global_step": 347873, "epoch": 2070} {"train_loss": -11.63228988647461, "global_step": 347874, "epoch": 2070} {"train_loss": -12.233975410461426, "global_step": 347875, "epoch": 2070} {"train_loss": -11.853479385375977, "global_step": 347876, "epoch": 2070} {"train_loss": -12.12826156616211, "global_step": 347877, "epoch": 2070} {"train_loss": -11.76385498046875, "global_step": 347878, "epoch": 2070} {"train_loss": -11.716312408447266, "global_step": 347879, "epoch": 2070} {"train_loss": -12.097383499145508, "global_step": 347880, "epoch": 2070} {"train_loss": -11.77298355102539, "global_step": 347881, "epoch": 2070} {"train_loss": -12.334126472473145, "global_step": 347882, "epoch": 2070} {"train_loss": -11.897397994995117, "global_step": 347883, "epoch": 2070} {"train_loss": -11.726048469543457, "global_step": 347884, "epoch": 2070} {"train_loss": -12.040657043457031, "global_step": 347885, "epoch": 2070} {"train_loss": -11.869002342224121, "global_step": 347886, "epoch": 2070} {"train_loss": -12.077717781066895, "global_step": 347887, "epoch": 2070} {"train_loss": -11.247444152832031, "global_step": 347888, "epoch": 2070} {"train_loss": -11.935760498046875, "global_step": 347889, "epoch": 2070} {"train_loss": -11.282747268676758, "global_step": 347890, "epoch": 2070} {"train_loss": -11.956450462341309, "global_step": 347891, "epoch": 2070} {"train_loss": -11.407562255859375, "global_step": 347892, "epoch": 2070} {"train_loss": -11.608226776123047, "global_step": 347893, "epoch": 2070} {"train_loss": -10.812847137451172, "global_step": 347894, "epoch": 2070} {"train_loss": -11.34650993347168, "global_step": 347895, "epoch": 2070} {"train_loss": -11.276464462280273, "global_step": 347896, "epoch": 2070} {"train_loss": -11.391124725341797, "global_step": 347897, "epoch": 2070} {"train_loss": -11.94481086730957, "global_step": 347898, "epoch": 2070} {"train_loss": -10.83388900756836, "global_step": 347899, "epoch": 2070} {"train_loss": -12.089221000671387, "global_step": 347900, "epoch": 2070} {"train_loss": -11.352174758911133, "global_step": 347901, "epoch": 2070} {"train_loss": -11.536603927612305, "global_step": 347902, "epoch": 2070} {"train_loss": -11.88595962524414, "global_step": 347903, "epoch": 2070} {"train_loss": -11.633275985717773, "global_step": 347904, "epoch": 2070} {"train_loss": -11.971385955810547, "global_step": 347905, "epoch": 2070} {"train_loss": -11.875301361083984, "global_step": 347906, "epoch": 2070} {"train_loss": -11.22142219543457, "global_step": 347907, "epoch": 2070} {"train_loss": -11.91772174835205, "global_step": 347908, "epoch": 2070} {"train_loss": -11.434794425964355, "global_step": 347909, "epoch": 2070} {"train_loss": -12.157554626464844, "global_step": 347910, "epoch": 2070} {"train_loss": -11.34237289428711, "global_step": 347911, "epoch": 2070} {"train_loss": -11.799604415893555, "global_step": 347912, "epoch": 2070} {"train_loss": -11.16853141784668, "global_step": 347913, "epoch": 2070} {"train_loss": -11.88516616821289, "global_step": 347914, "epoch": 2070} {"train_loss": -11.21546459197998, "global_step": 347915, "epoch": 2070} {"train_loss": -12.063128471374512, "global_step": 347916, "epoch": 2070} {"train_loss": -11.607336044311523, "global_step": 347917, "epoch": 2070} {"train_loss": -11.561396598815918, "global_step": 347918, "epoch": 2070} {"train_loss": -11.59403133392334, "global_step": 347919, "epoch": 2070} {"train_loss": -11.89576244354248, "global_step": 347920, "epoch": 2070} {"train_loss": -11.408977508544922, "global_step": 347921, "epoch": 2070} {"train_loss": -11.997169494628906, "global_step": 347922, "epoch": 2070} {"train_loss": -11.174156188964844, "global_step": 347923, "epoch": 2070} {"train_loss": -11.88252067565918, "global_step": 347924, "epoch": 2070} {"train_loss": -11.667057037353516, "global_step": 347925, "epoch": 2070} {"train_loss": -11.8137845993042, "global_step": 347926, "epoch": 2070} {"train_loss": -11.91157108829135, "global_step": 347927, "epoch": 2070, "val_loss": 290499.40625, "train_action_mse_error": 0.5433183312416077} {"train_loss": -11.823351860046387, "global_step": 347928, "epoch": 2071} {"train_loss": -12.340581893920898, "global_step": 347929, "epoch": 2071} {"train_loss": -11.788213729858398, "global_step": 347930, "epoch": 2071} {"train_loss": -11.864299774169922, "global_step": 347931, "epoch": 2071} {"train_loss": -11.96381664276123, "global_step": 347932, "epoch": 2071} {"train_loss": -12.09675407409668, "global_step": 347933, "epoch": 2071} {"train_loss": -11.963866233825684, "global_step": 347934, "epoch": 2071} {"train_loss": -12.228143692016602, "global_step": 347935, "epoch": 2071} {"train_loss": -12.002187728881836, "global_step": 347936, "epoch": 2071} {"train_loss": -12.140501022338867, "global_step": 347937, "epoch": 2071} {"train_loss": -12.140565872192383, "global_step": 347938, "epoch": 2071} {"train_loss": -12.200407981872559, "global_step": 347939, "epoch": 2071} {"train_loss": -12.01913070678711, "global_step": 347940, "epoch": 2071} {"train_loss": -12.253124237060547, "global_step": 347941, "epoch": 2071} {"train_loss": -12.165553092956543, "global_step": 347942, "epoch": 2071} {"train_loss": -12.322318077087402, "global_step": 347943, "epoch": 2071} {"train_loss": -12.069328308105469, "global_step": 347944, "epoch": 2071} {"train_loss": -12.367997169494629, "global_step": 347945, "epoch": 2071} {"train_loss": -12.331693649291992, "global_step": 347946, "epoch": 2071} {"train_loss": -12.276835441589355, "global_step": 347947, "epoch": 2071} {"train_loss": -12.43875503540039, "global_step": 347948, "epoch": 2071} {"train_loss": -12.302172660827637, "global_step": 347949, "epoch": 2071} {"train_loss": -12.28080940246582, "global_step": 347950, "epoch": 2071} {"train_loss": -12.401101112365723, "global_step": 347951, "epoch": 2071} {"train_loss": -12.375998497009277, "global_step": 347952, "epoch": 2071} {"train_loss": -12.27652359008789, "global_step": 347953, "epoch": 2071} {"train_loss": -12.190343856811523, "global_step": 347954, "epoch": 2071} {"train_loss": -12.581464767456055, "global_step": 347955, "epoch": 2071} {"train_loss": -12.115489959716797, "global_step": 347956, "epoch": 2071} {"train_loss": -12.321813583374023, "global_step": 347957, "epoch": 2071} {"train_loss": -12.1384859085083, "global_step": 347958, "epoch": 2071} {"train_loss": -12.094928741455078, "global_step": 347959, "epoch": 2071} {"train_loss": -12.095979690551758, "global_step": 347960, "epoch": 2071} {"train_loss": -12.271648406982422, "global_step": 347961, "epoch": 2071} {"train_loss": -11.57570743560791, "global_step": 347962, "epoch": 2071} {"train_loss": -12.173579216003418, "global_step": 347963, "epoch": 2071} {"train_loss": -11.356799125671387, "global_step": 347964, "epoch": 2071} {"train_loss": -11.745772361755371, "global_step": 347965, "epoch": 2071} {"train_loss": -10.869989395141602, "global_step": 347966, "epoch": 2071} {"train_loss": -12.53911018371582, "global_step": 347967, "epoch": 2071} {"train_loss": -11.325180053710938, "global_step": 347968, "epoch": 2071} {"train_loss": -11.934749603271484, "global_step": 347969, "epoch": 2071} {"train_loss": -11.599651336669922, "global_step": 347970, "epoch": 2071} {"train_loss": -11.903146743774414, "global_step": 347971, "epoch": 2071} {"train_loss": -10.94133186340332, "global_step": 347972, "epoch": 2071} {"train_loss": -12.014410018920898, "global_step": 347973, "epoch": 2071} {"train_loss": -12.011656761169434, "global_step": 347974, "epoch": 2071} {"train_loss": -12.044130325317383, "global_step": 347975, "epoch": 2071} {"train_loss": -11.798072814941406, "global_step": 347976, "epoch": 2071} {"train_loss": -12.21099853515625, "global_step": 347977, "epoch": 2071} {"train_loss": -11.19900894165039, "global_step": 347978, "epoch": 2071} {"train_loss": -12.224773406982422, "global_step": 347979, "epoch": 2071} {"train_loss": -11.565842628479004, "global_step": 347980, "epoch": 2071} {"train_loss": -11.722228050231934, "global_step": 347981, "epoch": 2071} {"train_loss": -11.41869831085205, "global_step": 347982, "epoch": 2071} {"train_loss": -12.07768440246582, "global_step": 347983, "epoch": 2071} {"train_loss": -11.650115966796875, "global_step": 347984, "epoch": 2071} {"train_loss": -12.20980167388916, "global_step": 347985, "epoch": 2071} {"train_loss": -11.995412826538086, "global_step": 347986, "epoch": 2071} {"train_loss": -12.079609870910645, "global_step": 347987, "epoch": 2071} {"train_loss": -12.229164123535156, "global_step": 347988, "epoch": 2071} {"train_loss": -11.056458473205566, "global_step": 347989, "epoch": 2071} {"train_loss": -11.85564136505127, "global_step": 347990, "epoch": 2071} {"train_loss": -11.778491973876953, "global_step": 347991, "epoch": 2071} {"train_loss": -11.566171646118164, "global_step": 347992, "epoch": 2071} {"train_loss": -11.957012176513672, "global_step": 347993, "epoch": 2071} {"train_loss": -12.150667190551758, "global_step": 347994, "epoch": 2071} {"train_loss": -11.696840286254883, "global_step": 347995, "epoch": 2071} {"train_loss": -12.087408065795898, "global_step": 347996, "epoch": 2071} {"train_loss": -11.673417091369629, "global_step": 347997, "epoch": 2071} {"train_loss": -12.014547348022461, "global_step": 347998, "epoch": 2071} {"train_loss": -11.084454536437988, "global_step": 347999, "epoch": 2071} {"train_loss": -12.171232223510742, "global_step": 348000, "epoch": 2071} {"train_loss": -11.666842460632324, "global_step": 348001, "epoch": 2071} {"train_loss": -11.199373245239258, "global_step": 348002, "epoch": 2071} {"train_loss": -12.194578170776367, "global_step": 348003, "epoch": 2071} {"train_loss": -11.036920547485352, "global_step": 348004, "epoch": 2071} {"train_loss": -12.273941040039062, "global_step": 348005, "epoch": 2071} {"train_loss": -11.081947326660156, "global_step": 348006, "epoch": 2071} {"train_loss": -12.187625885009766, "global_step": 348007, "epoch": 2071} {"train_loss": -11.292391777038574, "global_step": 348008, "epoch": 2071} {"train_loss": -11.986671447753906, "global_step": 348009, "epoch": 2071} {"train_loss": -12.086708068847656, "global_step": 348010, "epoch": 2071} {"train_loss": -12.022239685058594, "global_step": 348011, "epoch": 2071} {"train_loss": -12.064229965209961, "global_step": 348012, "epoch": 2071} {"train_loss": -12.20956802368164, "global_step": 348013, "epoch": 2071} {"train_loss": -12.278046607971191, "global_step": 348014, "epoch": 2071} {"train_loss": -12.316180229187012, "global_step": 348015, "epoch": 2071} {"train_loss": -12.1991605758667, "global_step": 348016, "epoch": 2071} {"train_loss": -12.133525848388672, "global_step": 348017, "epoch": 2071} {"train_loss": -12.304366111755371, "global_step": 348018, "epoch": 2071} {"train_loss": -12.480059623718262, "global_step": 348019, "epoch": 2071} {"train_loss": -12.424601554870605, "global_step": 348020, "epoch": 2071} {"train_loss": -12.547735214233398, "global_step": 348021, "epoch": 2071} {"train_loss": -12.36606216430664, "global_step": 348022, "epoch": 2071} {"train_loss": -12.034183502197266, "global_step": 348023, "epoch": 2071} {"train_loss": -12.330631256103516, "global_step": 348024, "epoch": 2071} {"train_loss": -12.023402214050293, "global_step": 348025, "epoch": 2071} {"train_loss": -12.144020080566406, "global_step": 348026, "epoch": 2071} {"train_loss": -11.756290435791016, "global_step": 348027, "epoch": 2071} {"train_loss": -12.361433029174805, "global_step": 348028, "epoch": 2071} {"train_loss": -12.031681060791016, "global_step": 348029, "epoch": 2071} {"train_loss": -12.300416946411133, "global_step": 348030, "epoch": 2071} {"train_loss": -12.059534072875977, "global_step": 348031, "epoch": 2071} {"train_loss": -12.158767700195312, "global_step": 348032, "epoch": 2071} {"train_loss": -12.372669219970703, "global_step": 348033, "epoch": 2071} {"train_loss": -12.427905082702637, "global_step": 348034, "epoch": 2071} {"train_loss": -11.569259643554688, "global_step": 348035, "epoch": 2071} {"train_loss": -12.39974594116211, "global_step": 348036, "epoch": 2071} {"train_loss": -12.019848823547363, "global_step": 348037, "epoch": 2071} {"train_loss": -12.142266273498535, "global_step": 348038, "epoch": 2071} {"train_loss": -11.960601806640625, "global_step": 348039, "epoch": 2071} {"train_loss": -11.91720962524414, "global_step": 348040, "epoch": 2071} {"train_loss": -12.213052749633789, "global_step": 348041, "epoch": 2071} {"train_loss": -12.4201078414917, "global_step": 348042, "epoch": 2071} {"train_loss": -12.069012641906738, "global_step": 348043, "epoch": 2071} {"train_loss": -12.40710735321045, "global_step": 348044, "epoch": 2071} {"train_loss": -12.301799774169922, "global_step": 348045, "epoch": 2071} {"train_loss": -12.156803131103516, "global_step": 348046, "epoch": 2071} {"train_loss": -12.268850326538086, "global_step": 348047, "epoch": 2071} {"train_loss": -12.504289627075195, "global_step": 348048, "epoch": 2071} {"train_loss": -12.318014144897461, "global_step": 348049, "epoch": 2071} {"train_loss": -12.175865173339844, "global_step": 348050, "epoch": 2071} {"train_loss": -12.411355972290039, "global_step": 348051, "epoch": 2071} {"train_loss": -11.85824203491211, "global_step": 348052, "epoch": 2071} {"train_loss": -12.044944763183594, "global_step": 348053, "epoch": 2071} {"train_loss": -12.289337158203125, "global_step": 348054, "epoch": 2071} {"train_loss": -12.577421188354492, "global_step": 348055, "epoch": 2071} {"train_loss": -12.159905433654785, "global_step": 348056, "epoch": 2071} {"train_loss": -12.510354042053223, "global_step": 348057, "epoch": 2071} {"train_loss": -12.065073013305664, "global_step": 348058, "epoch": 2071} {"train_loss": -12.150832176208496, "global_step": 348059, "epoch": 2071} {"train_loss": -12.38990592956543, "global_step": 348060, "epoch": 2071} {"train_loss": -12.673603057861328, "global_step": 348061, "epoch": 2071} {"train_loss": -11.814054489135742, "global_step": 348062, "epoch": 2071} {"train_loss": -12.088171005249023, "global_step": 348063, "epoch": 2071} {"train_loss": -12.459606170654297, "global_step": 348064, "epoch": 2071} {"train_loss": -11.835634231567383, "global_step": 348065, "epoch": 2071} {"train_loss": -11.595307350158691, "global_step": 348066, "epoch": 2071} {"train_loss": -12.309612274169922, "global_step": 348067, "epoch": 2071} {"train_loss": -12.068477630615234, "global_step": 348068, "epoch": 2071} {"train_loss": -12.210609436035156, "global_step": 348069, "epoch": 2071} {"train_loss": -12.053022384643555, "global_step": 348070, "epoch": 2071} {"train_loss": -12.314379692077637, "global_step": 348071, "epoch": 2071} {"train_loss": -12.152111053466797, "global_step": 348072, "epoch": 2071} {"train_loss": -12.478050231933594, "global_step": 348073, "epoch": 2071} {"train_loss": -12.206684112548828, "global_step": 348074, "epoch": 2071} {"train_loss": -12.329399108886719, "global_step": 348075, "epoch": 2071} {"train_loss": -12.484766960144043, "global_step": 348076, "epoch": 2071} {"train_loss": -12.55630111694336, "global_step": 348077, "epoch": 2071} {"train_loss": -12.249457359313965, "global_step": 348078, "epoch": 2071} {"train_loss": -12.11478042602539, "global_step": 348079, "epoch": 2071} {"train_loss": -12.376420974731445, "global_step": 348080, "epoch": 2071} {"train_loss": -12.784234046936035, "global_step": 348081, "epoch": 2071} {"train_loss": -12.288554191589355, "global_step": 348082, "epoch": 2071} {"train_loss": -12.448795318603516, "global_step": 348083, "epoch": 2071} {"train_loss": -12.238856315612793, "global_step": 348084, "epoch": 2071} {"train_loss": -12.403340339660645, "global_step": 348085, "epoch": 2071} {"train_loss": -12.263895034790039, "global_step": 348086, "epoch": 2071} {"train_loss": -12.505481719970703, "global_step": 348087, "epoch": 2071} {"train_loss": -12.609392166137695, "global_step": 348088, "epoch": 2071} {"train_loss": -12.494260787963867, "global_step": 348089, "epoch": 2071} {"train_loss": -12.357588768005371, "global_step": 348090, "epoch": 2071} {"train_loss": -12.559820175170898, "global_step": 348091, "epoch": 2071} {"train_loss": -12.352951049804688, "global_step": 348092, "epoch": 2071} {"train_loss": -12.367622375488281, "global_step": 348093, "epoch": 2071} {"train_loss": -12.455602645874023, "global_step": 348094, "epoch": 2071} {"train_loss": -12.09849891208467, "global_step": 348095, "epoch": 2071, "val_loss": 291140.78125} {"train_loss": -12.39303970336914, "global_step": 348096, "epoch": 2072} {"train_loss": -12.479501724243164, "global_step": 348097, "epoch": 2072} {"train_loss": -12.590704917907715, "global_step": 348098, "epoch": 2072} {"train_loss": -12.590229988098145, "global_step": 348099, "epoch": 2072} {"train_loss": -12.590214729309082, "global_step": 348100, "epoch": 2072} {"train_loss": -12.27919864654541, "global_step": 348101, "epoch": 2072} {"train_loss": -12.569733619689941, "global_step": 348102, "epoch": 2072} {"train_loss": -12.825550079345703, "global_step": 348103, "epoch": 2072} {"train_loss": -12.778159141540527, "global_step": 348104, "epoch": 2072} {"train_loss": -12.197556495666504, "global_step": 348105, "epoch": 2072} {"train_loss": -12.178802490234375, "global_step": 348106, "epoch": 2072} {"train_loss": -12.729926109313965, "global_step": 348107, "epoch": 2072} {"train_loss": -12.549583435058594, "global_step": 348108, "epoch": 2072} {"train_loss": -12.446671485900879, "global_step": 348109, "epoch": 2072} {"train_loss": -12.268150329589844, "global_step": 348110, "epoch": 2072} {"train_loss": -12.643588066101074, "global_step": 348111, "epoch": 2072} {"train_loss": -12.413825035095215, "global_step": 348112, "epoch": 2072} {"train_loss": -11.51719856262207, "global_step": 348113, "epoch": 2072} {"train_loss": -11.908912658691406, "global_step": 348114, "epoch": 2072} {"train_loss": -12.174942016601562, "global_step": 348115, "epoch": 2072} {"train_loss": -12.234238624572754, "global_step": 348116, "epoch": 2072} {"train_loss": -12.611855506896973, "global_step": 348117, "epoch": 2072} {"train_loss": -11.740716934204102, "global_step": 348118, "epoch": 2072} {"train_loss": -10.37386703491211, "global_step": 348119, "epoch": 2072} {"train_loss": -12.36936092376709, "global_step": 348120, "epoch": 2072} {"train_loss": -9.581567764282227, "global_step": 348121, "epoch": 2072} {"train_loss": -10.678253173828125, "global_step": 348122, "epoch": 2072} {"train_loss": -8.421603202819824, "global_step": 348123, "epoch": 2072} {"train_loss": -8.043049812316895, "global_step": 348124, "epoch": 2072} {"train_loss": -8.60534381866455, "global_step": 348125, "epoch": 2072} {"train_loss": -9.996623992919922, "global_step": 348126, "epoch": 2072} {"train_loss": -7.6972856521606445, "global_step": 348127, "epoch": 2072} {"train_loss": -9.000226974487305, "global_step": 348128, "epoch": 2072} {"train_loss": -10.082478523254395, "global_step": 348129, "epoch": 2072} {"train_loss": -7.646742343902588, "global_step": 348130, "epoch": 2072} {"train_loss": -6.719117164611816, "global_step": 348131, "epoch": 2072} {"train_loss": -8.157770156860352, "global_step": 348132, "epoch": 2072} {"train_loss": -8.404772758483887, "global_step": 348133, "epoch": 2072} {"train_loss": -9.187006950378418, "global_step": 348134, "epoch": 2072} {"train_loss": -7.946263313293457, "global_step": 348135, "epoch": 2072} {"train_loss": -8.2147855758667, "global_step": 348136, "epoch": 2072} {"train_loss": -9.251829147338867, "global_step": 348137, "epoch": 2072} {"train_loss": -8.845540046691895, "global_step": 348138, "epoch": 2072} {"train_loss": -10.099752426147461, "global_step": 348139, "epoch": 2072} {"train_loss": -10.19298267364502, "global_step": 348140, "epoch": 2072} {"train_loss": -9.91672134399414, "global_step": 348141, "epoch": 2072} {"train_loss": -9.836424827575684, "global_step": 348142, "epoch": 2072} {"train_loss": -10.806843757629395, "global_step": 348143, "epoch": 2072} {"train_loss": -10.000263214111328, "global_step": 348144, "epoch": 2072} {"train_loss": -10.570235252380371, "global_step": 348145, "epoch": 2072} {"train_loss": -10.424589157104492, "global_step": 348146, "epoch": 2072} {"train_loss": -10.338772773742676, "global_step": 348147, "epoch": 2072} {"train_loss": -10.997883796691895, "global_step": 348148, "epoch": 2072} {"train_loss": -11.281940460205078, "global_step": 348149, "epoch": 2072} {"train_loss": -10.815967559814453, "global_step": 348150, "epoch": 2072} {"train_loss": -11.413518905639648, "global_step": 348151, "epoch": 2072} {"train_loss": -10.911123275756836, "global_step": 348152, "epoch": 2072} {"train_loss": -10.508204460144043, "global_step": 348153, "epoch": 2072} {"train_loss": -11.429977416992188, "global_step": 348154, "epoch": 2072} {"train_loss": -10.741497039794922, "global_step": 348155, "epoch": 2072} {"train_loss": -11.102323532104492, "global_step": 348156, "epoch": 2072} {"train_loss": -11.509407043457031, "global_step": 348157, "epoch": 2072} {"train_loss": -11.341157913208008, "global_step": 348158, "epoch": 2072} {"train_loss": -11.540046691894531, "global_step": 348159, "epoch": 2072} {"train_loss": -11.383766174316406, "global_step": 348160, "epoch": 2072} {"train_loss": -11.303741455078125, "global_step": 348161, "epoch": 2072} {"train_loss": -11.212010383605957, "global_step": 348162, "epoch": 2072} {"train_loss": -11.684438705444336, "global_step": 348163, "epoch": 2072} {"train_loss": -11.463387489318848, "global_step": 348164, "epoch": 2072} {"train_loss": -11.631441116333008, "global_step": 348165, "epoch": 2072} {"train_loss": -11.407266616821289, "global_step": 348166, "epoch": 2072} {"train_loss": -11.94091796875, "global_step": 348167, "epoch": 2072} {"train_loss": -11.809183120727539, "global_step": 348168, "epoch": 2072} {"train_loss": -11.646496772766113, "global_step": 348169, "epoch": 2072} {"train_loss": -11.620250701904297, "global_step": 348170, "epoch": 2072} {"train_loss": -11.8123779296875, "global_step": 348171, "epoch": 2072} {"train_loss": -11.664243698120117, "global_step": 348172, "epoch": 2072} {"train_loss": -11.964692115783691, "global_step": 348173, "epoch": 2072} {"train_loss": -12.123401641845703, "global_step": 348174, "epoch": 2072} {"train_loss": -11.97217845916748, "global_step": 348175, "epoch": 2072} {"train_loss": -12.027726173400879, "global_step": 348176, "epoch": 2072} {"train_loss": -11.952576637268066, "global_step": 348177, "epoch": 2072} {"train_loss": -11.684326171875, "global_step": 348178, "epoch": 2072} {"train_loss": -12.076318740844727, "global_step": 348179, "epoch": 2072} {"train_loss": -12.054827690124512, "global_step": 348180, "epoch": 2072} {"train_loss": -11.868470191955566, "global_step": 348181, "epoch": 2072} {"train_loss": -12.176874160766602, "global_step": 348182, "epoch": 2072} {"train_loss": -12.215357780456543, "global_step": 348183, "epoch": 2072} {"train_loss": -12.334366798400879, "global_step": 348184, "epoch": 2072} {"train_loss": -12.17713737487793, "global_step": 348185, "epoch": 2072} {"train_loss": -12.261808395385742, "global_step": 348186, "epoch": 2072} {"train_loss": -12.199243545532227, "global_step": 348187, "epoch": 2072} {"train_loss": -12.241060256958008, "global_step": 348188, "epoch": 2072} {"train_loss": -12.255935668945312, "global_step": 348189, "epoch": 2072} {"train_loss": -12.305865287780762, "global_step": 348190, "epoch": 2072} {"train_loss": -12.156641006469727, "global_step": 348191, "epoch": 2072} {"train_loss": -12.368341445922852, "global_step": 348192, "epoch": 2072} {"train_loss": -12.17733383178711, "global_step": 348193, "epoch": 2072} {"train_loss": -12.307500839233398, "global_step": 348194, "epoch": 2072} {"train_loss": -12.35354232788086, "global_step": 348195, "epoch": 2072} {"train_loss": -12.613836288452148, "global_step": 348196, "epoch": 2072} {"train_loss": -12.187877655029297, "global_step": 348197, "epoch": 2072} {"train_loss": -12.213024139404297, "global_step": 348198, "epoch": 2072} {"train_loss": -12.328466415405273, "global_step": 348199, "epoch": 2072} {"train_loss": -12.4837646484375, "global_step": 348200, "epoch": 2072} {"train_loss": -12.222925186157227, "global_step": 348201, "epoch": 2072} {"train_loss": -12.255256652832031, "global_step": 348202, "epoch": 2072} {"train_loss": -12.229016304016113, "global_step": 348203, "epoch": 2072} {"train_loss": -12.30319595336914, "global_step": 348204, "epoch": 2072} {"train_loss": -12.276835441589355, "global_step": 348205, "epoch": 2072} {"train_loss": -12.291364669799805, "global_step": 348206, "epoch": 2072} {"train_loss": -12.524606704711914, "global_step": 348207, "epoch": 2072} {"train_loss": -12.415663719177246, "global_step": 348208, "epoch": 2072} {"train_loss": -12.589057922363281, "global_step": 348209, "epoch": 2072} {"train_loss": -12.48000431060791, "global_step": 348210, "epoch": 2072} {"train_loss": -12.592355728149414, "global_step": 348211, "epoch": 2072} {"train_loss": -12.463029861450195, "global_step": 348212, "epoch": 2072} {"train_loss": -12.588432312011719, "global_step": 348213, "epoch": 2072} {"train_loss": -12.383723258972168, "global_step": 348214, "epoch": 2072} {"train_loss": -12.469749450683594, "global_step": 348215, "epoch": 2072} {"train_loss": -12.467292785644531, "global_step": 348216, "epoch": 2072} {"train_loss": -12.637670516967773, "global_step": 348217, "epoch": 2072} {"train_loss": -12.385526657104492, "global_step": 348218, "epoch": 2072} {"train_loss": -12.58297348022461, "global_step": 348219, "epoch": 2072} {"train_loss": -12.591043472290039, "global_step": 348220, "epoch": 2072} {"train_loss": -12.507881164550781, "global_step": 348221, "epoch": 2072} {"train_loss": -12.472963333129883, "global_step": 348222, "epoch": 2072} {"train_loss": -12.392952919006348, "global_step": 348223, "epoch": 2072} {"train_loss": -12.60662841796875, "global_step": 348224, "epoch": 2072} {"train_loss": -12.54452896118164, "global_step": 348225, "epoch": 2072} {"train_loss": -12.729520797729492, "global_step": 348226, "epoch": 2072} {"train_loss": -12.354280471801758, "global_step": 348227, "epoch": 2072} {"train_loss": -12.468912124633789, "global_step": 348228, "epoch": 2072} {"train_loss": -12.794180870056152, "global_step": 348229, "epoch": 2072} {"train_loss": -12.541638374328613, "global_step": 348230, "epoch": 2072} {"train_loss": -12.290664672851562, "global_step": 348231, "epoch": 2072} {"train_loss": -12.327312469482422, "global_step": 348232, "epoch": 2072} {"train_loss": -11.910037994384766, "global_step": 348233, "epoch": 2072} {"train_loss": -12.408401489257812, "global_step": 348234, "epoch": 2072} {"train_loss": -12.03648853302002, "global_step": 348235, "epoch": 2072} {"train_loss": -12.321382522583008, "global_step": 348236, "epoch": 2072} {"train_loss": -12.217552185058594, "global_step": 348237, "epoch": 2072} {"train_loss": -12.239767074584961, "global_step": 348238, "epoch": 2072} {"train_loss": -12.181417465209961, "global_step": 348239, "epoch": 2072} {"train_loss": -12.309904098510742, "global_step": 348240, "epoch": 2072} {"train_loss": -12.275856018066406, "global_step": 348241, "epoch": 2072} {"train_loss": -12.490951538085938, "global_step": 348242, "epoch": 2072} {"train_loss": -12.021129608154297, "global_step": 348243, "epoch": 2072} {"train_loss": -12.527791023254395, "global_step": 348244, "epoch": 2072} {"train_loss": -11.9954833984375, "global_step": 348245, "epoch": 2072} {"train_loss": -12.455994606018066, "global_step": 348246, "epoch": 2072} {"train_loss": -12.242691040039062, "global_step": 348247, "epoch": 2072} {"train_loss": -11.799578666687012, "global_step": 348248, "epoch": 2072} {"train_loss": -11.970050811767578, "global_step": 348249, "epoch": 2072} {"train_loss": -12.239809036254883, "global_step": 348250, "epoch": 2072} {"train_loss": -11.977550506591797, "global_step": 348251, "epoch": 2072} {"train_loss": -11.593021392822266, "global_step": 348252, "epoch": 2072} {"train_loss": -11.943635940551758, "global_step": 348253, "epoch": 2072} {"train_loss": -11.877092361450195, "global_step": 348254, "epoch": 2072} {"train_loss": -11.025266647338867, "global_step": 348255, "epoch": 2072} {"train_loss": -11.405030250549316, "global_step": 348256, "epoch": 2072} {"train_loss": -12.396926879882812, "global_step": 348257, "epoch": 2072} {"train_loss": -11.096366882324219, "global_step": 348258, "epoch": 2072} {"train_loss": -11.54580307006836, "global_step": 348259, "epoch": 2072} {"train_loss": -11.771980285644531, "global_step": 348260, "epoch": 2072} {"train_loss": -11.459494590759277, "global_step": 348261, "epoch": 2072} {"train_loss": -11.668599128723145, "global_step": 348262, "epoch": 2072} {"train_loss": -11.609307990187691, "global_step": 348263, "epoch": 2072, "val_loss": 283772.78125} {"train_loss": -11.385992050170898, "global_step": 348264, "epoch": 2073} {"train_loss": -9.559367179870605, "global_step": 348265, "epoch": 2073} {"train_loss": -11.234966278076172, "global_step": 348266, "epoch": 2073} {"train_loss": -10.665223121643066, "global_step": 348267, "epoch": 2073} {"train_loss": -10.889175415039062, "global_step": 348268, "epoch": 2073} {"train_loss": -11.025240898132324, "global_step": 348269, "epoch": 2073} {"train_loss": -11.105072021484375, "global_step": 348270, "epoch": 2073} {"train_loss": -10.537663459777832, "global_step": 348271, "epoch": 2073} {"train_loss": -10.945155143737793, "global_step": 348272, "epoch": 2073} {"train_loss": -12.431861877441406, "global_step": 348273, "epoch": 2073} {"train_loss": -11.454414367675781, "global_step": 348274, "epoch": 2073} {"train_loss": -11.91382884979248, "global_step": 348275, "epoch": 2073} {"train_loss": -11.81792163848877, "global_step": 348276, "epoch": 2073} {"train_loss": -11.77621841430664, "global_step": 348277, "epoch": 2073} {"train_loss": -11.921268463134766, "global_step": 348278, "epoch": 2073} {"train_loss": -11.647727012634277, "global_step": 348279, "epoch": 2073} {"train_loss": -11.958736419677734, "global_step": 348280, "epoch": 2073} {"train_loss": -12.041998863220215, "global_step": 348281, "epoch": 2073} {"train_loss": -11.654474258422852, "global_step": 348282, "epoch": 2073} {"train_loss": -11.72730541229248, "global_step": 348283, "epoch": 2073} {"train_loss": -11.043085098266602, "global_step": 348284, "epoch": 2073} {"train_loss": -12.216394424438477, "global_step": 348285, "epoch": 2073} {"train_loss": -10.79466438293457, "global_step": 348286, "epoch": 2073} {"train_loss": -11.545989036560059, "global_step": 348287, "epoch": 2073} {"train_loss": -11.279926300048828, "global_step": 348288, "epoch": 2073} {"train_loss": -11.45608901977539, "global_step": 348289, "epoch": 2073} {"train_loss": -11.799103736877441, "global_step": 348290, "epoch": 2073} {"train_loss": -11.370849609375, "global_step": 348291, "epoch": 2073} {"train_loss": -11.703807830810547, "global_step": 348292, "epoch": 2073} {"train_loss": -11.555558204650879, "global_step": 348293, "epoch": 2073} {"train_loss": -11.592767715454102, "global_step": 348294, "epoch": 2073} {"train_loss": -11.234441757202148, "global_step": 348295, "epoch": 2073} {"train_loss": -10.517162322998047, "global_step": 348296, "epoch": 2073} {"train_loss": -9.698407173156738, "global_step": 348297, "epoch": 2073} {"train_loss": -11.306208610534668, "global_step": 348298, "epoch": 2073} {"train_loss": -11.071807861328125, "global_step": 348299, "epoch": 2073} {"train_loss": -11.14036750793457, "global_step": 348300, "epoch": 2073} {"train_loss": -11.841833114624023, "global_step": 348301, "epoch": 2073} {"train_loss": -11.259881973266602, "global_step": 348302, "epoch": 2073} {"train_loss": -12.05086898803711, "global_step": 348303, "epoch": 2073} {"train_loss": -11.320701599121094, "global_step": 348304, "epoch": 2073} {"train_loss": -12.013290405273438, "global_step": 348305, "epoch": 2073} {"train_loss": -11.605978965759277, "global_step": 348306, "epoch": 2073} {"train_loss": -11.55409049987793, "global_step": 348307, "epoch": 2073} {"train_loss": -11.916635513305664, "global_step": 348308, "epoch": 2073} {"train_loss": -11.044198989868164, "global_step": 348309, "epoch": 2073} {"train_loss": -12.00113296508789, "global_step": 348310, "epoch": 2073} {"train_loss": -11.740692138671875, "global_step": 348311, "epoch": 2073} {"train_loss": -12.011849403381348, "global_step": 348312, "epoch": 2073} {"train_loss": -12.046226501464844, "global_step": 348313, "epoch": 2073} {"train_loss": -11.888245582580566, "global_step": 348314, "epoch": 2073} {"train_loss": -12.006914138793945, "global_step": 348315, "epoch": 2073} {"train_loss": -12.173025131225586, "global_step": 348316, "epoch": 2073} {"train_loss": -12.171640396118164, "global_step": 348317, "epoch": 2073} {"train_loss": -12.248244285583496, "global_step": 348318, "epoch": 2073} {"train_loss": -12.040275573730469, "global_step": 348319, "epoch": 2073} {"train_loss": -11.918716430664062, "global_step": 348320, "epoch": 2073} {"train_loss": -12.080629348754883, "global_step": 348321, "epoch": 2073} {"train_loss": -11.88978385925293, "global_step": 348322, "epoch": 2073} {"train_loss": -12.28925895690918, "global_step": 348323, "epoch": 2073} {"train_loss": -11.977919578552246, "global_step": 348324, "epoch": 2073} {"train_loss": -12.25582504272461, "global_step": 348325, "epoch": 2073} {"train_loss": -12.25063705444336, "global_step": 348326, "epoch": 2073} {"train_loss": -12.209114074707031, "global_step": 348327, "epoch": 2073} {"train_loss": -12.21839714050293, "global_step": 348328, "epoch": 2073} {"train_loss": -12.123727798461914, "global_step": 348329, "epoch": 2073} {"train_loss": -12.228337287902832, "global_step": 348330, "epoch": 2073} {"train_loss": -12.090250968933105, "global_step": 348331, "epoch": 2073} {"train_loss": -12.349591255187988, "global_step": 348332, "epoch": 2073} {"train_loss": -12.253496170043945, "global_step": 348333, "epoch": 2073} {"train_loss": -12.209405899047852, "global_step": 348334, "epoch": 2073} {"train_loss": -12.309805870056152, "global_step": 348335, "epoch": 2073} {"train_loss": -12.222511291503906, "global_step": 348336, "epoch": 2073} {"train_loss": -12.18264102935791, "global_step": 348337, "epoch": 2073} {"train_loss": -12.278895378112793, "global_step": 348338, "epoch": 2073} {"train_loss": -12.332808494567871, "global_step": 348339, "epoch": 2073} {"train_loss": -12.208257675170898, "global_step": 348340, "epoch": 2073} {"train_loss": -12.567527770996094, "global_step": 348341, "epoch": 2073} {"train_loss": -12.508661270141602, "global_step": 348342, "epoch": 2073} {"train_loss": -12.497132301330566, "global_step": 348343, "epoch": 2073} {"train_loss": -12.490497589111328, "global_step": 348344, "epoch": 2073} {"train_loss": -12.310237884521484, "global_step": 348345, "epoch": 2073} {"train_loss": -12.356691360473633, "global_step": 348346, "epoch": 2073} {"train_loss": -12.40318489074707, "global_step": 348347, "epoch": 2073} {"train_loss": -12.423519134521484, "global_step": 348348, "epoch": 2073} {"train_loss": -12.457724571228027, "global_step": 348349, "epoch": 2073} {"train_loss": -12.389947891235352, "global_step": 348350, "epoch": 2073} {"train_loss": -12.361087799072266, "global_step": 348351, "epoch": 2073} {"train_loss": -12.513627052307129, "global_step": 348352, "epoch": 2073} {"train_loss": -12.429949760437012, "global_step": 348353, "epoch": 2073} {"train_loss": -12.533052444458008, "global_step": 348354, "epoch": 2073} {"train_loss": -12.176435470581055, "global_step": 348355, "epoch": 2073} {"train_loss": -11.688309669494629, "global_step": 348356, "epoch": 2073} {"train_loss": -11.80714225769043, "global_step": 348357, "epoch": 2073} {"train_loss": -12.162275314331055, "global_step": 348358, "epoch": 2073} {"train_loss": -12.052276611328125, "global_step": 348359, "epoch": 2073} {"train_loss": -11.989469528198242, "global_step": 348360, "epoch": 2073} {"train_loss": -11.673080444335938, "global_step": 348361, "epoch": 2073} {"train_loss": -10.949825286865234, "global_step": 348362, "epoch": 2073} {"train_loss": -11.599433898925781, "global_step": 348363, "epoch": 2073} {"train_loss": -10.981327056884766, "global_step": 348364, "epoch": 2073} {"train_loss": -11.604677200317383, "global_step": 348365, "epoch": 2073} {"train_loss": -11.059239387512207, "global_step": 348366, "epoch": 2073} {"train_loss": -8.958102226257324, "global_step": 348367, "epoch": 2073} {"train_loss": -8.74121379852295, "global_step": 348368, "epoch": 2073} {"train_loss": -11.513101577758789, "global_step": 348369, "epoch": 2073} {"train_loss": -8.929193496704102, "global_step": 348370, "epoch": 2073} {"train_loss": -9.866788864135742, "global_step": 348371, "epoch": 2073} {"train_loss": -8.942153930664062, "global_step": 348372, "epoch": 2073} {"train_loss": -11.183340072631836, "global_step": 348373, "epoch": 2073} {"train_loss": -8.472095489501953, "global_step": 348374, "epoch": 2073} {"train_loss": -8.705102920532227, "global_step": 348375, "epoch": 2073} {"train_loss": -10.838154792785645, "global_step": 348376, "epoch": 2073} {"train_loss": -10.231368064880371, "global_step": 348377, "epoch": 2073} {"train_loss": -9.247552871704102, "global_step": 348378, "epoch": 2073} {"train_loss": -8.910402297973633, "global_step": 348379, "epoch": 2073} {"train_loss": -10.505500793457031, "global_step": 348380, "epoch": 2073} {"train_loss": -11.229430198669434, "global_step": 348381, "epoch": 2073} {"train_loss": -9.433384895324707, "global_step": 348382, "epoch": 2073} {"train_loss": -10.982828140258789, "global_step": 348383, "epoch": 2073} {"train_loss": -11.137624740600586, "global_step": 348384, "epoch": 2073} {"train_loss": -10.185132026672363, "global_step": 348385, "epoch": 2073} {"train_loss": -10.163860321044922, "global_step": 348386, "epoch": 2073} {"train_loss": -11.261341094970703, "global_step": 348387, "epoch": 2073} {"train_loss": -10.466730117797852, "global_step": 348388, "epoch": 2073} {"train_loss": -10.186296463012695, "global_step": 348389, "epoch": 2073} {"train_loss": -10.70846939086914, "global_step": 348390, "epoch": 2073} {"train_loss": -11.35858154296875, "global_step": 348391, "epoch": 2073} {"train_loss": -11.060486793518066, "global_step": 348392, "epoch": 2073} {"train_loss": -10.776118278503418, "global_step": 348393, "epoch": 2073} {"train_loss": -11.40534782409668, "global_step": 348394, "epoch": 2073} {"train_loss": -11.057953834533691, "global_step": 348395, "epoch": 2073} {"train_loss": -11.601400375366211, "global_step": 348396, "epoch": 2073} {"train_loss": -11.689553260803223, "global_step": 348397, "epoch": 2073} {"train_loss": -10.723062515258789, "global_step": 348398, "epoch": 2073} {"train_loss": -11.746854782104492, "global_step": 348399, "epoch": 2073} {"train_loss": -11.606430053710938, "global_step": 348400, "epoch": 2073} {"train_loss": -11.273054122924805, "global_step": 348401, "epoch": 2073} {"train_loss": -11.722312927246094, "global_step": 348402, "epoch": 2073} {"train_loss": -11.508190155029297, "global_step": 348403, "epoch": 2073} {"train_loss": -11.399238586425781, "global_step": 348404, "epoch": 2073} {"train_loss": -11.798967361450195, "global_step": 348405, "epoch": 2073} {"train_loss": -11.74771499633789, "global_step": 348406, "epoch": 2073} {"train_loss": -11.509391784667969, "global_step": 348407, "epoch": 2073} {"train_loss": -11.695541381835938, "global_step": 348408, "epoch": 2073} {"train_loss": -11.770506858825684, "global_step": 348409, "epoch": 2073} {"train_loss": -12.010039329528809, "global_step": 348410, "epoch": 2073} {"train_loss": -11.514168739318848, "global_step": 348411, "epoch": 2073} {"train_loss": -12.102560043334961, "global_step": 348412, "epoch": 2073} {"train_loss": -11.632325172424316, "global_step": 348413, "epoch": 2073} {"train_loss": -11.844619750976562, "global_step": 348414, "epoch": 2073} {"train_loss": -12.069305419921875, "global_step": 348415, "epoch": 2073} {"train_loss": -11.963623046875, "global_step": 348416, "epoch": 2073} {"train_loss": -12.0316162109375, "global_step": 348417, "epoch": 2073} {"train_loss": -12.150704383850098, "global_step": 348418, "epoch": 2073} {"train_loss": -12.157672882080078, "global_step": 348419, "epoch": 2073} {"train_loss": -11.997577667236328, "global_step": 348420, "epoch": 2073} {"train_loss": -12.197074890136719, "global_step": 348421, "epoch": 2073} {"train_loss": -12.283949851989746, "global_step": 348422, "epoch": 2073} {"train_loss": -12.00526237487793, "global_step": 348423, "epoch": 2073} {"train_loss": -12.24344253540039, "global_step": 348424, "epoch": 2073} {"train_loss": -12.058883666992188, "global_step": 348425, "epoch": 2073} {"train_loss": -12.243322372436523, "global_step": 348426, "epoch": 2073} {"train_loss": -12.11367416381836, "global_step": 348427, "epoch": 2073} {"train_loss": -12.360156059265137, "global_step": 348428, "epoch": 2073} {"train_loss": -12.16978645324707, "global_step": 348429, "epoch": 2073} {"train_loss": -12.349266052246094, "global_step": 348430, "epoch": 2073} {"train_loss": -11.534587559245882, "global_step": 348431, "epoch": 2073, "val_loss": 290758.6875} {"train_loss": -12.436787605285645, "global_step": 348432, "epoch": 2074} {"train_loss": -12.546194076538086, "global_step": 348433, "epoch": 2074} {"train_loss": -12.33703327178955, "global_step": 348434, "epoch": 2074} {"train_loss": -12.228816032409668, "global_step": 348435, "epoch": 2074} {"train_loss": -12.443791389465332, "global_step": 348436, "epoch": 2074} {"train_loss": -12.4154052734375, "global_step": 348437, "epoch": 2074} {"train_loss": -12.500810623168945, "global_step": 348438, "epoch": 2074} {"train_loss": -12.293373107910156, "global_step": 348439, "epoch": 2074} {"train_loss": -12.562127113342285, "global_step": 348440, "epoch": 2074} {"train_loss": -12.362040519714355, "global_step": 348441, "epoch": 2074} {"train_loss": -12.461834907531738, "global_step": 348442, "epoch": 2074} {"train_loss": -12.355615615844727, "global_step": 348443, "epoch": 2074} {"train_loss": -12.539215087890625, "global_step": 348444, "epoch": 2074} {"train_loss": -12.459291458129883, "global_step": 348445, "epoch": 2074} {"train_loss": -12.484477043151855, "global_step": 348446, "epoch": 2074} {"train_loss": -12.612550735473633, "global_step": 348447, "epoch": 2074} {"train_loss": -12.550786018371582, "global_step": 348448, "epoch": 2074} {"train_loss": -12.48619270324707, "global_step": 348449, "epoch": 2074} {"train_loss": -12.47195816040039, "global_step": 348450, "epoch": 2074} {"train_loss": -12.470216751098633, "global_step": 348451, "epoch": 2074} {"train_loss": -12.510980606079102, "global_step": 348452, "epoch": 2074} {"train_loss": -12.462133407592773, "global_step": 348453, "epoch": 2074} {"train_loss": -12.514202117919922, "global_step": 348454, "epoch": 2074} {"train_loss": -12.52560806274414, "global_step": 348455, "epoch": 2074} {"train_loss": -12.489540100097656, "global_step": 348456, "epoch": 2074} {"train_loss": -12.335625648498535, "global_step": 348457, "epoch": 2074} {"train_loss": -12.37871265411377, "global_step": 348458, "epoch": 2074} {"train_loss": -12.427167892456055, "global_step": 348459, "epoch": 2074} {"train_loss": -12.582883834838867, "global_step": 348460, "epoch": 2074} {"train_loss": -12.380165100097656, "global_step": 348461, "epoch": 2074} {"train_loss": -12.424304962158203, "global_step": 348462, "epoch": 2074} {"train_loss": -12.442824363708496, "global_step": 348463, "epoch": 2074} {"train_loss": -12.54616928100586, "global_step": 348464, "epoch": 2074} {"train_loss": -12.451862335205078, "global_step": 348465, "epoch": 2074} {"train_loss": -12.551885604858398, "global_step": 348466, "epoch": 2074} {"train_loss": -12.649083137512207, "global_step": 348467, "epoch": 2074} {"train_loss": -12.465984344482422, "global_step": 348468, "epoch": 2074} {"train_loss": -12.434040069580078, "global_step": 348469, "epoch": 2074} {"train_loss": -12.406579971313477, "global_step": 348470, "epoch": 2074} {"train_loss": -12.578764915466309, "global_step": 348471, "epoch": 2074} {"train_loss": -12.557441711425781, "global_step": 348472, "epoch": 2074} {"train_loss": -12.035490036010742, "global_step": 348473, "epoch": 2074} {"train_loss": -11.954063415527344, "global_step": 348474, "epoch": 2074} {"train_loss": -12.547843933105469, "global_step": 348475, "epoch": 2074} {"train_loss": -12.30819034576416, "global_step": 348476, "epoch": 2074} {"train_loss": -11.952672958374023, "global_step": 348477, "epoch": 2074} {"train_loss": -12.277917861938477, "global_step": 348478, "epoch": 2074} {"train_loss": -12.272115707397461, "global_step": 348479, "epoch": 2074} {"train_loss": -12.290746688842773, "global_step": 348480, "epoch": 2074} {"train_loss": -12.047746658325195, "global_step": 348481, "epoch": 2074} {"train_loss": -12.356978416442871, "global_step": 348482, "epoch": 2074} {"train_loss": -11.83691120147705, "global_step": 348483, "epoch": 2074} {"train_loss": -11.661728858947754, "global_step": 348484, "epoch": 2074} {"train_loss": -11.92990493774414, "global_step": 348485, "epoch": 2074} {"train_loss": -12.034574508666992, "global_step": 348486, "epoch": 2074} {"train_loss": -11.475167274475098, "global_step": 348487, "epoch": 2074} {"train_loss": -11.557255744934082, "global_step": 348488, "epoch": 2074} {"train_loss": -11.908775329589844, "global_step": 348489, "epoch": 2074} {"train_loss": -12.100114822387695, "global_step": 348490, "epoch": 2074} {"train_loss": -11.381765365600586, "global_step": 348491, "epoch": 2074} {"train_loss": -11.16025161743164, "global_step": 348492, "epoch": 2074} {"train_loss": -12.567737579345703, "global_step": 348493, "epoch": 2074} {"train_loss": -11.032362937927246, "global_step": 348494, "epoch": 2074} {"train_loss": -11.059561729431152, "global_step": 348495, "epoch": 2074} {"train_loss": -11.888830184936523, "global_step": 348496, "epoch": 2074} {"train_loss": -12.503043174743652, "global_step": 348497, "epoch": 2074} {"train_loss": -10.822407722473145, "global_step": 348498, "epoch": 2074} {"train_loss": -10.705472946166992, "global_step": 348499, "epoch": 2074} {"train_loss": -11.317602157592773, "global_step": 348500, "epoch": 2074} {"train_loss": -12.037065505981445, "global_step": 348501, "epoch": 2074} {"train_loss": -11.562311172485352, "global_step": 348502, "epoch": 2074} {"train_loss": -11.952278137207031, "global_step": 348503, "epoch": 2074} {"train_loss": -12.218294143676758, "global_step": 348504, "epoch": 2074} {"train_loss": -12.308276176452637, "global_step": 348505, "epoch": 2074} {"train_loss": -12.10019588470459, "global_step": 348506, "epoch": 2074} {"train_loss": -12.521634101867676, "global_step": 348507, "epoch": 2074} {"train_loss": -11.916629791259766, "global_step": 348508, "epoch": 2074} {"train_loss": -11.634075164794922, "global_step": 348509, "epoch": 2074} {"train_loss": -12.352293968200684, "global_step": 348510, "epoch": 2074} {"train_loss": -11.419142723083496, "global_step": 348511, "epoch": 2074} {"train_loss": -11.780914306640625, "global_step": 348512, "epoch": 2074} {"train_loss": -12.159220695495605, "global_step": 348513, "epoch": 2074} {"train_loss": -12.356729507446289, "global_step": 348514, "epoch": 2074} {"train_loss": -12.14804458618164, "global_step": 348515, "epoch": 2074} {"train_loss": -12.139579772949219, "global_step": 348516, "epoch": 2074} {"train_loss": -12.05032730102539, "global_step": 348517, "epoch": 2074} {"train_loss": -11.911382675170898, "global_step": 348518, "epoch": 2074} {"train_loss": -11.529376983642578, "global_step": 348519, "epoch": 2074} {"train_loss": -11.950716018676758, "global_step": 348520, "epoch": 2074} {"train_loss": -11.889922142028809, "global_step": 348521, "epoch": 2074} {"train_loss": -11.163434982299805, "global_step": 348522, "epoch": 2074} {"train_loss": -12.076667785644531, "global_step": 348523, "epoch": 2074} {"train_loss": -11.607093811035156, "global_step": 348524, "epoch": 2074} {"train_loss": -10.504470825195312, "global_step": 348525, "epoch": 2074} {"train_loss": -12.07514762878418, "global_step": 348526, "epoch": 2074} {"train_loss": -11.345890045166016, "global_step": 348527, "epoch": 2074} {"train_loss": -11.240432739257812, "global_step": 348528, "epoch": 2074} {"train_loss": -12.036774635314941, "global_step": 348529, "epoch": 2074} {"train_loss": -10.478351593017578, "global_step": 348530, "epoch": 2074} {"train_loss": -11.845524787902832, "global_step": 348531, "epoch": 2074} {"train_loss": -10.885445594787598, "global_step": 348532, "epoch": 2074} {"train_loss": -10.835286140441895, "global_step": 348533, "epoch": 2074} {"train_loss": -12.02348518371582, "global_step": 348534, "epoch": 2074} {"train_loss": -10.494486808776855, "global_step": 348535, "epoch": 2074} {"train_loss": -12.07885456085205, "global_step": 348536, "epoch": 2074} {"train_loss": -11.37918472290039, "global_step": 348537, "epoch": 2074} {"train_loss": -11.417828559875488, "global_step": 348538, "epoch": 2074} {"train_loss": -11.990804672241211, "global_step": 348539, "epoch": 2074} {"train_loss": -11.110502243041992, "global_step": 348540, "epoch": 2074} {"train_loss": -11.242656707763672, "global_step": 348541, "epoch": 2074} {"train_loss": -11.301233291625977, "global_step": 348542, "epoch": 2074} {"train_loss": -11.17313289642334, "global_step": 348543, "epoch": 2074} {"train_loss": -11.763505935668945, "global_step": 348544, "epoch": 2074} {"train_loss": -10.793859481811523, "global_step": 348545, "epoch": 2074} {"train_loss": -11.118175506591797, "global_step": 348546, "epoch": 2074} {"train_loss": -11.715620994567871, "global_step": 348547, "epoch": 2074} {"train_loss": -11.382185935974121, "global_step": 348548, "epoch": 2074} {"train_loss": -11.776826858520508, "global_step": 348549, "epoch": 2074} {"train_loss": -11.242057800292969, "global_step": 348550, "epoch": 2074} {"train_loss": -11.507465362548828, "global_step": 348551, "epoch": 2074} {"train_loss": -11.542451858520508, "global_step": 348552, "epoch": 2074} {"train_loss": -11.697607040405273, "global_step": 348553, "epoch": 2074} {"train_loss": -11.372922897338867, "global_step": 348554, "epoch": 2074} {"train_loss": -11.809473991394043, "global_step": 348555, "epoch": 2074} {"train_loss": -12.036602973937988, "global_step": 348556, "epoch": 2074} {"train_loss": -11.993757247924805, "global_step": 348557, "epoch": 2074} {"train_loss": -12.455571174621582, "global_step": 348558, "epoch": 2074} {"train_loss": -11.910895347595215, "global_step": 348559, "epoch": 2074} {"train_loss": -12.249225616455078, "global_step": 348560, "epoch": 2074} {"train_loss": -12.046318054199219, "global_step": 348561, "epoch": 2074} {"train_loss": -12.096697807312012, "global_step": 348562, "epoch": 2074} {"train_loss": -12.305349349975586, "global_step": 348563, "epoch": 2074} {"train_loss": -12.376413345336914, "global_step": 348564, "epoch": 2074} {"train_loss": -12.399418830871582, "global_step": 348565, "epoch": 2074} {"train_loss": -12.223386764526367, "global_step": 348566, "epoch": 2074} {"train_loss": -12.24665355682373, "global_step": 348567, "epoch": 2074} {"train_loss": -12.306737899780273, "global_step": 348568, "epoch": 2074} {"train_loss": -12.092965126037598, "global_step": 348569, "epoch": 2074} {"train_loss": -11.863512992858887, "global_step": 348570, "epoch": 2074} {"train_loss": -12.201013565063477, "global_step": 348571, "epoch": 2074} {"train_loss": -12.40096664428711, "global_step": 348572, "epoch": 2074} {"train_loss": -11.998233795166016, "global_step": 348573, "epoch": 2074} {"train_loss": -12.206886291503906, "global_step": 348574, "epoch": 2074} {"train_loss": -12.20431900024414, "global_step": 348575, "epoch": 2074} {"train_loss": -12.523882865905762, "global_step": 348576, "epoch": 2074} {"train_loss": -12.059425354003906, "global_step": 348577, "epoch": 2074} {"train_loss": -12.280216217041016, "global_step": 348578, "epoch": 2074} {"train_loss": -11.833864212036133, "global_step": 348579, "epoch": 2074} {"train_loss": -12.227198600769043, "global_step": 348580, "epoch": 2074} {"train_loss": -11.40378189086914, "global_step": 348581, "epoch": 2074} {"train_loss": -11.843050003051758, "global_step": 348582, "epoch": 2074} {"train_loss": -11.725051879882812, "global_step": 348583, "epoch": 2074} {"train_loss": -11.931312561035156, "global_step": 348584, "epoch": 2074} {"train_loss": -11.63867473602295, "global_step": 348585, "epoch": 2074} {"train_loss": -11.035058975219727, "global_step": 348586, "epoch": 2074} {"train_loss": -11.751595497131348, "global_step": 348587, "epoch": 2074} {"train_loss": -11.079755783081055, "global_step": 348588, "epoch": 2074} {"train_loss": -12.112039566040039, "global_step": 348589, "epoch": 2074} {"train_loss": -11.4395751953125, "global_step": 348590, "epoch": 2074} {"train_loss": -12.212652206420898, "global_step": 348591, "epoch": 2074} {"train_loss": -11.57763671875, "global_step": 348592, "epoch": 2074} {"train_loss": -11.748030662536621, "global_step": 348593, "epoch": 2074} {"train_loss": -12.219801902770996, "global_step": 348594, "epoch": 2074} {"train_loss": -11.527585983276367, "global_step": 348595, "epoch": 2074} {"train_loss": -12.397130966186523, "global_step": 348596, "epoch": 2074} {"train_loss": -11.349227905273438, "global_step": 348597, "epoch": 2074} {"train_loss": -11.997063636779785, "global_step": 348598, "epoch": 2074} {"train_loss": -11.960151161466326, "global_step": 348599, "epoch": 2074, "val_loss": 290457.25} {"train_loss": -12.03789234161377, "global_step": 348600, "epoch": 2075} {"train_loss": -11.77938461303711, "global_step": 348601, "epoch": 2075} {"train_loss": -11.866292953491211, "global_step": 348602, "epoch": 2075} {"train_loss": -11.806014060974121, "global_step": 348603, "epoch": 2075} {"train_loss": -12.261350631713867, "global_step": 348604, "epoch": 2075} {"train_loss": -12.02204704284668, "global_step": 348605, "epoch": 2075} {"train_loss": -12.057493209838867, "global_step": 348606, "epoch": 2075} {"train_loss": -12.15843391418457, "global_step": 348607, "epoch": 2075} {"train_loss": -11.857664108276367, "global_step": 348608, "epoch": 2075} {"train_loss": -12.37179183959961, "global_step": 348609, "epoch": 2075} {"train_loss": -12.237741470336914, "global_step": 348610, "epoch": 2075} {"train_loss": -12.043680191040039, "global_step": 348611, "epoch": 2075} {"train_loss": -12.059950828552246, "global_step": 348612, "epoch": 2075} {"train_loss": -11.488946914672852, "global_step": 348613, "epoch": 2075} {"train_loss": -11.759202003479004, "global_step": 348614, "epoch": 2075} {"train_loss": -11.994384765625, "global_step": 348615, "epoch": 2075} {"train_loss": -11.862058639526367, "global_step": 348616, "epoch": 2075} {"train_loss": -11.572185516357422, "global_step": 348617, "epoch": 2075} {"train_loss": -12.140618324279785, "global_step": 348618, "epoch": 2075} {"train_loss": -12.115263938903809, "global_step": 348619, "epoch": 2075} {"train_loss": -11.737447738647461, "global_step": 348620, "epoch": 2075} {"train_loss": -11.908496856689453, "global_step": 348621, "epoch": 2075} {"train_loss": -11.947660446166992, "global_step": 348622, "epoch": 2075} {"train_loss": -11.276137351989746, "global_step": 348623, "epoch": 2075} {"train_loss": -11.966188430786133, "global_step": 348624, "epoch": 2075} {"train_loss": -11.687288284301758, "global_step": 348625, "epoch": 2075} {"train_loss": -12.08549690246582, "global_step": 348626, "epoch": 2075} {"train_loss": -11.362967491149902, "global_step": 348627, "epoch": 2075} {"train_loss": -11.948949813842773, "global_step": 348628, "epoch": 2075} {"train_loss": -12.459346771240234, "global_step": 348629, "epoch": 2075} {"train_loss": -11.631905555725098, "global_step": 348630, "epoch": 2075} {"train_loss": -12.1183443069458, "global_step": 348631, "epoch": 2075} {"train_loss": -11.727088928222656, "global_step": 348632, "epoch": 2075} {"train_loss": -11.779062271118164, "global_step": 348633, "epoch": 2075} {"train_loss": -12.058497428894043, "global_step": 348634, "epoch": 2075} {"train_loss": -12.300268173217773, "global_step": 348635, "epoch": 2075} {"train_loss": -12.104644775390625, "global_step": 348636, "epoch": 2075} {"train_loss": -11.875567436218262, "global_step": 348637, "epoch": 2075} {"train_loss": -12.428213119506836, "global_step": 348638, "epoch": 2075} {"train_loss": -12.054506301879883, "global_step": 348639, "epoch": 2075} {"train_loss": -12.233219146728516, "global_step": 348640, "epoch": 2075} {"train_loss": -12.45726203918457, "global_step": 348641, "epoch": 2075} {"train_loss": -11.679971694946289, "global_step": 348642, "epoch": 2075} {"train_loss": -12.364838600158691, "global_step": 348643, "epoch": 2075} {"train_loss": -12.198493003845215, "global_step": 348644, "epoch": 2075} {"train_loss": -12.016731262207031, "global_step": 348645, "epoch": 2075} {"train_loss": -12.441529273986816, "global_step": 348646, "epoch": 2075} {"train_loss": -11.376943588256836, "global_step": 348647, "epoch": 2075} {"train_loss": -10.937784194946289, "global_step": 348648, "epoch": 2075} {"train_loss": -12.26488971710205, "global_step": 348649, "epoch": 2075} {"train_loss": -11.694291114807129, "global_step": 348650, "epoch": 2075} {"train_loss": -12.256647109985352, "global_step": 348651, "epoch": 2075} {"train_loss": -11.533170700073242, "global_step": 348652, "epoch": 2075} {"train_loss": -11.994325637817383, "global_step": 348653, "epoch": 2075} {"train_loss": -11.845463752746582, "global_step": 348654, "epoch": 2075} {"train_loss": -12.033882141113281, "global_step": 348655, "epoch": 2075} {"train_loss": -11.943326950073242, "global_step": 348656, "epoch": 2075} {"train_loss": -12.105602264404297, "global_step": 348657, "epoch": 2075} {"train_loss": -12.103708267211914, "global_step": 348658, "epoch": 2075} {"train_loss": -11.940704345703125, "global_step": 348659, "epoch": 2075} {"train_loss": -12.141578674316406, "global_step": 348660, "epoch": 2075} {"train_loss": -12.239322662353516, "global_step": 348661, "epoch": 2075} {"train_loss": -12.534605979919434, "global_step": 348662, "epoch": 2075} {"train_loss": -11.939603805541992, "global_step": 348663, "epoch": 2075} {"train_loss": -12.290721893310547, "global_step": 348664, "epoch": 2075} {"train_loss": -12.262286186218262, "global_step": 348665, "epoch": 2075} {"train_loss": -12.379009246826172, "global_step": 348666, "epoch": 2075} {"train_loss": -12.2283353805542, "global_step": 348667, "epoch": 2075} {"train_loss": -12.130851745605469, "global_step": 348668, "epoch": 2075} {"train_loss": -12.131980895996094, "global_step": 348669, "epoch": 2075} {"train_loss": -11.731874465942383, "global_step": 348670, "epoch": 2075} {"train_loss": -12.563705444335938, "global_step": 348671, "epoch": 2075} {"train_loss": -11.870384216308594, "global_step": 348672, "epoch": 2075} {"train_loss": -11.909029006958008, "global_step": 348673, "epoch": 2075} {"train_loss": -11.856754302978516, "global_step": 348674, "epoch": 2075} {"train_loss": -11.767313003540039, "global_step": 348675, "epoch": 2075} {"train_loss": -11.961465835571289, "global_step": 348676, "epoch": 2075} {"train_loss": -12.186971664428711, "global_step": 348677, "epoch": 2075} {"train_loss": -12.00732421875, "global_step": 348678, "epoch": 2075} {"train_loss": -12.348628997802734, "global_step": 348679, "epoch": 2075} {"train_loss": -11.348122596740723, "global_step": 348680, "epoch": 2075} {"train_loss": -11.918607711791992, "global_step": 348681, "epoch": 2075} {"train_loss": -12.045612335205078, "global_step": 348682, "epoch": 2075} {"train_loss": -11.799053192138672, "global_step": 348683, "epoch": 2075} {"train_loss": -11.813361167907715, "global_step": 348684, "epoch": 2075} {"train_loss": -11.873025894165039, "global_step": 348685, "epoch": 2075} {"train_loss": -11.703115463256836, "global_step": 348686, "epoch": 2075} {"train_loss": -12.15363883972168, "global_step": 348687, "epoch": 2075} {"train_loss": -11.743234634399414, "global_step": 348688, "epoch": 2075} {"train_loss": -11.91228199005127, "global_step": 348689, "epoch": 2075} {"train_loss": -12.210660934448242, "global_step": 348690, "epoch": 2075} {"train_loss": -11.870292663574219, "global_step": 348691, "epoch": 2075} {"train_loss": -12.345487594604492, "global_step": 348692, "epoch": 2075} {"train_loss": -12.020956993103027, "global_step": 348693, "epoch": 2075} {"train_loss": -12.393694877624512, "global_step": 348694, "epoch": 2075} {"train_loss": -12.101731300354004, "global_step": 348695, "epoch": 2075} {"train_loss": -11.948490142822266, "global_step": 348696, "epoch": 2075} {"train_loss": -11.730937004089355, "global_step": 348697, "epoch": 2075} {"train_loss": -12.59809684753418, "global_step": 348698, "epoch": 2075} {"train_loss": -11.546367645263672, "global_step": 348699, "epoch": 2075} {"train_loss": -12.04330825805664, "global_step": 348700, "epoch": 2075} {"train_loss": -11.388437271118164, "global_step": 348701, "epoch": 2075} {"train_loss": -11.692755699157715, "global_step": 348702, "epoch": 2075} {"train_loss": -12.167000770568848, "global_step": 348703, "epoch": 2075} {"train_loss": -12.136231422424316, "global_step": 348704, "epoch": 2075} {"train_loss": -11.940813064575195, "global_step": 348705, "epoch": 2075} {"train_loss": -12.037609100341797, "global_step": 348706, "epoch": 2075} {"train_loss": -12.187207221984863, "global_step": 348707, "epoch": 2075} {"train_loss": -12.375618934631348, "global_step": 348708, "epoch": 2075} {"train_loss": -12.225317001342773, "global_step": 348709, "epoch": 2075} {"train_loss": -12.273205757141113, "global_step": 348710, "epoch": 2075} {"train_loss": -12.557306289672852, "global_step": 348711, "epoch": 2075} {"train_loss": -12.378057479858398, "global_step": 348712, "epoch": 2075} {"train_loss": -12.409448623657227, "global_step": 348713, "epoch": 2075} {"train_loss": -12.158790588378906, "global_step": 348714, "epoch": 2075} {"train_loss": -11.805021286010742, "global_step": 348715, "epoch": 2075} {"train_loss": -12.349464416503906, "global_step": 348716, "epoch": 2075} {"train_loss": -11.852165222167969, "global_step": 348717, "epoch": 2075} {"train_loss": -11.851324081420898, "global_step": 348718, "epoch": 2075} {"train_loss": -12.10925006866455, "global_step": 348719, "epoch": 2075} {"train_loss": -11.87214469909668, "global_step": 348720, "epoch": 2075} {"train_loss": -11.703187942504883, "global_step": 348721, "epoch": 2075} {"train_loss": -12.120957374572754, "global_step": 348722, "epoch": 2075} {"train_loss": -10.04629898071289, "global_step": 348723, "epoch": 2075} {"train_loss": -11.859262466430664, "global_step": 348724, "epoch": 2075} {"train_loss": -10.487092971801758, "global_step": 348725, "epoch": 2075} {"train_loss": -10.11796760559082, "global_step": 348726, "epoch": 2075} {"train_loss": -11.04855728149414, "global_step": 348727, "epoch": 2075} {"train_loss": -10.447755813598633, "global_step": 348728, "epoch": 2075} {"train_loss": -11.86391830444336, "global_step": 348729, "epoch": 2075} {"train_loss": -10.013741493225098, "global_step": 348730, "epoch": 2075} {"train_loss": -10.713271141052246, "global_step": 348731, "epoch": 2075} {"train_loss": -11.621331214904785, "global_step": 348732, "epoch": 2075} {"train_loss": -10.68403434753418, "global_step": 348733, "epoch": 2075} {"train_loss": -10.59548568725586, "global_step": 348734, "epoch": 2075} {"train_loss": -10.672721862792969, "global_step": 348735, "epoch": 2075} {"train_loss": -9.705154418945312, "global_step": 348736, "epoch": 2075} {"train_loss": -11.353450775146484, "global_step": 348737, "epoch": 2075} {"train_loss": -10.678218841552734, "global_step": 348738, "epoch": 2075} {"train_loss": -11.414679527282715, "global_step": 348739, "epoch": 2075} {"train_loss": -11.055364608764648, "global_step": 348740, "epoch": 2075} {"train_loss": -11.574773788452148, "global_step": 348741, "epoch": 2075} {"train_loss": -11.367094039916992, "global_step": 348742, "epoch": 2075} {"train_loss": -11.207239151000977, "global_step": 348743, "epoch": 2075} {"train_loss": -11.632930755615234, "global_step": 348744, "epoch": 2075} {"train_loss": -11.540212631225586, "global_step": 348745, "epoch": 2075} {"train_loss": -11.889947891235352, "global_step": 348746, "epoch": 2075} {"train_loss": -11.203021049499512, "global_step": 348747, "epoch": 2075} {"train_loss": -12.06286907196045, "global_step": 348748, "epoch": 2075} {"train_loss": -11.453028678894043, "global_step": 348749, "epoch": 2075} {"train_loss": -11.969438552856445, "global_step": 348750, "epoch": 2075} {"train_loss": -10.913249969482422, "global_step": 348751, "epoch": 2075} {"train_loss": -12.125970840454102, "global_step": 348752, "epoch": 2075} {"train_loss": -11.741588592529297, "global_step": 348753, "epoch": 2075} {"train_loss": -12.105202674865723, "global_step": 348754, "epoch": 2075} {"train_loss": -11.717691421508789, "global_step": 348755, "epoch": 2075} {"train_loss": -11.944839477539062, "global_step": 348756, "epoch": 2075} {"train_loss": -11.83339786529541, "global_step": 348757, "epoch": 2075} {"train_loss": -12.344354629516602, "global_step": 348758, "epoch": 2075} {"train_loss": -11.747686386108398, "global_step": 348759, "epoch": 2075} {"train_loss": -12.343011856079102, "global_step": 348760, "epoch": 2075} {"train_loss": -12.180152893066406, "global_step": 348761, "epoch": 2075} {"train_loss": -11.984090805053711, "global_step": 348762, "epoch": 2075} {"train_loss": -12.009956359863281, "global_step": 348763, "epoch": 2075} {"train_loss": -12.180870056152344, "global_step": 348764, "epoch": 2075} {"train_loss": -11.928581237792969, "global_step": 348765, "epoch": 2075} {"train_loss": -11.858606338500977, "global_step": 348766, "epoch": 2075} {"train_loss": -11.84372779868898, "global_step": 348767, "epoch": 2075, "val_loss": 289010.59375, "train_action_mse_error": 3.930741786956787} {"train_loss": -11.825441360473633, "global_step": 348768, "epoch": 2076} {"train_loss": -12.288267135620117, "global_step": 348769, "epoch": 2076} {"train_loss": -12.245903015136719, "global_step": 348770, "epoch": 2076} {"train_loss": -12.41091537475586, "global_step": 348771, "epoch": 2076} {"train_loss": -12.19002914428711, "global_step": 348772, "epoch": 2076} {"train_loss": -12.434093475341797, "global_step": 348773, "epoch": 2076} {"train_loss": -12.257362365722656, "global_step": 348774, "epoch": 2076} {"train_loss": -12.406329154968262, "global_step": 348775, "epoch": 2076} {"train_loss": -12.171438217163086, "global_step": 348776, "epoch": 2076} {"train_loss": -12.328435897827148, "global_step": 348777, "epoch": 2076} {"train_loss": -12.273992538452148, "global_step": 348778, "epoch": 2076} {"train_loss": -12.449832916259766, "global_step": 348779, "epoch": 2076} {"train_loss": -12.493810653686523, "global_step": 348780, "epoch": 2076} {"train_loss": -12.382416725158691, "global_step": 348781, "epoch": 2076} {"train_loss": -12.156698226928711, "global_step": 348782, "epoch": 2076} {"train_loss": -12.368818283081055, "global_step": 348783, "epoch": 2076} {"train_loss": -12.164596557617188, "global_step": 348784, "epoch": 2076} {"train_loss": -12.112678527832031, "global_step": 348785, "epoch": 2076} {"train_loss": -12.307239532470703, "global_step": 348786, "epoch": 2076} {"train_loss": -12.189519882202148, "global_step": 348787, "epoch": 2076} {"train_loss": -12.349689483642578, "global_step": 348788, "epoch": 2076} {"train_loss": -12.235245704650879, "global_step": 348789, "epoch": 2076} {"train_loss": -12.488040924072266, "global_step": 348790, "epoch": 2076} {"train_loss": -12.34343147277832, "global_step": 348791, "epoch": 2076} {"train_loss": -12.467721939086914, "global_step": 348792, "epoch": 2076} {"train_loss": -12.229857444763184, "global_step": 348793, "epoch": 2076} {"train_loss": -12.234334945678711, "global_step": 348794, "epoch": 2076} {"train_loss": -12.357994079589844, "global_step": 348795, "epoch": 2076} {"train_loss": -12.378332138061523, "global_step": 348796, "epoch": 2076} {"train_loss": -12.581071853637695, "global_step": 348797, "epoch": 2076} {"train_loss": -12.490866661071777, "global_step": 348798, "epoch": 2076} {"train_loss": -12.465511322021484, "global_step": 348799, "epoch": 2076} {"train_loss": -12.519676208496094, "global_step": 348800, "epoch": 2076} {"train_loss": -12.501225471496582, "global_step": 348801, "epoch": 2076} {"train_loss": -12.295406341552734, "global_step": 348802, "epoch": 2076} {"train_loss": -12.716821670532227, "global_step": 348803, "epoch": 2076} {"train_loss": -12.411029815673828, "global_step": 348804, "epoch": 2076} {"train_loss": -12.363859176635742, "global_step": 348805, "epoch": 2076} {"train_loss": -12.652286529541016, "global_step": 348806, "epoch": 2076} {"train_loss": -12.480161666870117, "global_step": 348807, "epoch": 2076} {"train_loss": -12.644224166870117, "global_step": 348808, "epoch": 2076} {"train_loss": -12.614707946777344, "global_step": 348809, "epoch": 2076} {"train_loss": -12.730998992919922, "global_step": 348810, "epoch": 2076} {"train_loss": -12.594493865966797, "global_step": 348811, "epoch": 2076} {"train_loss": -12.632139205932617, "global_step": 348812, "epoch": 2076} {"train_loss": -12.685400009155273, "global_step": 348813, "epoch": 2076} {"train_loss": -12.498899459838867, "global_step": 348814, "epoch": 2076} {"train_loss": -12.612427711486816, "global_step": 348815, "epoch": 2076} {"train_loss": -12.631799697875977, "global_step": 348816, "epoch": 2076} {"train_loss": -12.442265510559082, "global_step": 348817, "epoch": 2076} {"train_loss": -12.775997161865234, "global_step": 348818, "epoch": 2076} {"train_loss": -12.601934432983398, "global_step": 348819, "epoch": 2076} {"train_loss": -12.751803398132324, "global_step": 348820, "epoch": 2076} {"train_loss": -12.668042182922363, "global_step": 348821, "epoch": 2076} {"train_loss": -12.530118942260742, "global_step": 348822, "epoch": 2076} {"train_loss": -12.604251861572266, "global_step": 348823, "epoch": 2076} {"train_loss": -12.515175819396973, "global_step": 348824, "epoch": 2076} {"train_loss": -12.229852676391602, "global_step": 348825, "epoch": 2076} {"train_loss": -12.268287658691406, "global_step": 348826, "epoch": 2076} {"train_loss": -12.420122146606445, "global_step": 348827, "epoch": 2076} {"train_loss": -12.519126892089844, "global_step": 348828, "epoch": 2076} {"train_loss": -12.362836837768555, "global_step": 348829, "epoch": 2076} {"train_loss": -12.617244720458984, "global_step": 348830, "epoch": 2076} {"train_loss": -12.44982624053955, "global_step": 348831, "epoch": 2076} {"train_loss": -12.69719123840332, "global_step": 348832, "epoch": 2076} {"train_loss": -12.090776443481445, "global_step": 348833, "epoch": 2076} {"train_loss": -12.593159675598145, "global_step": 348834, "epoch": 2076} {"train_loss": -12.005701065063477, "global_step": 348835, "epoch": 2076} {"train_loss": -12.475259780883789, "global_step": 348836, "epoch": 2076} {"train_loss": -11.983539581298828, "global_step": 348837, "epoch": 2076} {"train_loss": -11.892729759216309, "global_step": 348838, "epoch": 2076} {"train_loss": -11.231894493103027, "global_step": 348839, "epoch": 2076} {"train_loss": -11.99206256866455, "global_step": 348840, "epoch": 2076} {"train_loss": -11.60844612121582, "global_step": 348841, "epoch": 2076} {"train_loss": -11.667505264282227, "global_step": 348842, "epoch": 2076} {"train_loss": -11.376691818237305, "global_step": 348843, "epoch": 2076} {"train_loss": -11.451493263244629, "global_step": 348844, "epoch": 2076} {"train_loss": -11.724353790283203, "global_step": 348845, "epoch": 2076} {"train_loss": -10.65338134765625, "global_step": 348846, "epoch": 2076} {"train_loss": -11.92451000213623, "global_step": 348847, "epoch": 2076} {"train_loss": -11.660820960998535, "global_step": 348848, "epoch": 2076} {"train_loss": -11.494794845581055, "global_step": 348849, "epoch": 2076} {"train_loss": -10.776765823364258, "global_step": 348850, "epoch": 2076} {"train_loss": -10.720260620117188, "global_step": 348851, "epoch": 2076} {"train_loss": -11.62989616394043, "global_step": 348852, "epoch": 2076} {"train_loss": -11.581717491149902, "global_step": 348853, "epoch": 2076} {"train_loss": -10.458955764770508, "global_step": 348854, "epoch": 2076} {"train_loss": -12.37986946105957, "global_step": 348855, "epoch": 2076} {"train_loss": -11.502328872680664, "global_step": 348856, "epoch": 2076} {"train_loss": -11.154088020324707, "global_step": 348857, "epoch": 2076} {"train_loss": -10.892364501953125, "global_step": 348858, "epoch": 2076} {"train_loss": -11.180074691772461, "global_step": 348859, "epoch": 2076} {"train_loss": -10.988256454467773, "global_step": 348860, "epoch": 2076} {"train_loss": -10.435650825500488, "global_step": 348861, "epoch": 2076} {"train_loss": -9.710954666137695, "global_step": 348862, "epoch": 2076} {"train_loss": -11.693840980529785, "global_step": 348863, "epoch": 2076} {"train_loss": -10.008148193359375, "global_step": 348864, "epoch": 2076} {"train_loss": -10.325647354125977, "global_step": 348865, "epoch": 2076} {"train_loss": -11.073305130004883, "global_step": 348866, "epoch": 2076} {"train_loss": -10.89055347442627, "global_step": 348867, "epoch": 2076} {"train_loss": -10.407110214233398, "global_step": 348868, "epoch": 2076} {"train_loss": -10.450223922729492, "global_step": 348869, "epoch": 2076} {"train_loss": -11.96600341796875, "global_step": 348870, "epoch": 2076} {"train_loss": -11.169328689575195, "global_step": 348871, "epoch": 2076} {"train_loss": -11.778339385986328, "global_step": 348872, "epoch": 2076} {"train_loss": -10.86893367767334, "global_step": 348873, "epoch": 2076} {"train_loss": -12.215412139892578, "global_step": 348874, "epoch": 2076} {"train_loss": -11.389764785766602, "global_step": 348875, "epoch": 2076} {"train_loss": -11.730130195617676, "global_step": 348876, "epoch": 2076} {"train_loss": -11.408482551574707, "global_step": 348877, "epoch": 2076} {"train_loss": -11.526571273803711, "global_step": 348878, "epoch": 2076} {"train_loss": -12.228486061096191, "global_step": 348879, "epoch": 2076} {"train_loss": -11.886829376220703, "global_step": 348880, "epoch": 2076} {"train_loss": -12.019746780395508, "global_step": 348881, "epoch": 2076} {"train_loss": -11.792466163635254, "global_step": 348882, "epoch": 2076} {"train_loss": -11.95529842376709, "global_step": 348883, "epoch": 2076} {"train_loss": -11.43857192993164, "global_step": 348884, "epoch": 2076} {"train_loss": -11.986084938049316, "global_step": 348885, "epoch": 2076} {"train_loss": -11.98959732055664, "global_step": 348886, "epoch": 2076} {"train_loss": -12.005805015563965, "global_step": 348887, "epoch": 2076} {"train_loss": -11.73931884765625, "global_step": 348888, "epoch": 2076} {"train_loss": -11.662793159484863, "global_step": 348889, "epoch": 2076} {"train_loss": -11.855052947998047, "global_step": 348890, "epoch": 2076} {"train_loss": -11.459853172302246, "global_step": 348891, "epoch": 2076} {"train_loss": -11.337183952331543, "global_step": 348892, "epoch": 2076} {"train_loss": -11.298645973205566, "global_step": 348893, "epoch": 2076} {"train_loss": -11.551836013793945, "global_step": 348894, "epoch": 2076} {"train_loss": -11.76741886138916, "global_step": 348895, "epoch": 2076} {"train_loss": -11.756365776062012, "global_step": 348896, "epoch": 2076} {"train_loss": -10.811382293701172, "global_step": 348897, "epoch": 2076} {"train_loss": -11.421285629272461, "global_step": 348898, "epoch": 2076} {"train_loss": -10.759306907653809, "global_step": 348899, "epoch": 2076} {"train_loss": -11.30567741394043, "global_step": 348900, "epoch": 2076} {"train_loss": -11.553520202636719, "global_step": 348901, "epoch": 2076} {"train_loss": -10.795341491699219, "global_step": 348902, "epoch": 2076} {"train_loss": -11.622601509094238, "global_step": 348903, "epoch": 2076} {"train_loss": -11.118170738220215, "global_step": 348904, "epoch": 2076} {"train_loss": -11.842901229858398, "global_step": 348905, "epoch": 2076} {"train_loss": -11.509575843811035, "global_step": 348906, "epoch": 2076} {"train_loss": -11.571911811828613, "global_step": 348907, "epoch": 2076} {"train_loss": -11.923385620117188, "global_step": 348908, "epoch": 2076} {"train_loss": -11.691444396972656, "global_step": 348909, "epoch": 2076} {"train_loss": -11.978168487548828, "global_step": 348910, "epoch": 2076} {"train_loss": -11.650633811950684, "global_step": 348911, "epoch": 2076} {"train_loss": -11.998307228088379, "global_step": 348912, "epoch": 2076} {"train_loss": -11.961544036865234, "global_step": 348913, "epoch": 2076} {"train_loss": -11.883808135986328, "global_step": 348914, "epoch": 2076} {"train_loss": -11.881282806396484, "global_step": 348915, "epoch": 2076} {"train_loss": -12.01192855834961, "global_step": 348916, "epoch": 2076} {"train_loss": -11.978139877319336, "global_step": 348917, "epoch": 2076} {"train_loss": -11.893169403076172, "global_step": 348918, "epoch": 2076} {"train_loss": -12.032663345336914, "global_step": 348919, "epoch": 2076} {"train_loss": -12.04405403137207, "global_step": 348920, "epoch": 2076} {"train_loss": -11.748163223266602, "global_step": 348921, "epoch": 2076} {"train_loss": -11.756248474121094, "global_step": 348922, "epoch": 2076} {"train_loss": -12.05093002319336, "global_step": 348923, "epoch": 2076} {"train_loss": -11.344593048095703, "global_step": 348924, "epoch": 2076} {"train_loss": -11.867655754089355, "global_step": 348925, "epoch": 2076} {"train_loss": -11.464202880859375, "global_step": 348926, "epoch": 2076} {"train_loss": -11.78731918334961, "global_step": 348927, "epoch": 2076} {"train_loss": -9.924270629882812, "global_step": 348928, "epoch": 2076} {"train_loss": -11.743597030639648, "global_step": 348929, "epoch": 2076} {"train_loss": -10.680797576904297, "global_step": 348930, "epoch": 2076} {"train_loss": -11.61017894744873, "global_step": 348931, "epoch": 2076} {"train_loss": -11.274297714233398, "global_step": 348932, "epoch": 2076} {"train_loss": -10.933878898620605, "global_step": 348933, "epoch": 2076} {"train_loss": -12.030359268188477, "global_step": 348934, "epoch": 2076} {"train_loss": -11.863944155829293, "global_step": 348935, "epoch": 2076, "val_loss": 290532.625} {"train_loss": -11.427940368652344, "global_step": 348936, "epoch": 2077} {"train_loss": -12.024179458618164, "global_step": 348937, "epoch": 2077} {"train_loss": -11.408912658691406, "global_step": 348938, "epoch": 2077} {"train_loss": -11.718547821044922, "global_step": 348939, "epoch": 2077} {"train_loss": -11.71060848236084, "global_step": 348940, "epoch": 2077} {"train_loss": -11.849279403686523, "global_step": 348941, "epoch": 2077} {"train_loss": -11.805830001831055, "global_step": 348942, "epoch": 2077} {"train_loss": -12.033502578735352, "global_step": 348943, "epoch": 2077} {"train_loss": -11.25500202178955, "global_step": 348944, "epoch": 2077} {"train_loss": -12.248252868652344, "global_step": 348945, "epoch": 2077} {"train_loss": -11.70145320892334, "global_step": 348946, "epoch": 2077} {"train_loss": -11.7576904296875, "global_step": 348947, "epoch": 2077} {"train_loss": -12.274477005004883, "global_step": 348948, "epoch": 2077} {"train_loss": -11.839479446411133, "global_step": 348949, "epoch": 2077} {"train_loss": -12.052633285522461, "global_step": 348950, "epoch": 2077} {"train_loss": -12.157096862792969, "global_step": 348951, "epoch": 2077} {"train_loss": -11.609739303588867, "global_step": 348952, "epoch": 2077} {"train_loss": -11.790894508361816, "global_step": 348953, "epoch": 2077} {"train_loss": -11.95788860321045, "global_step": 348954, "epoch": 2077} {"train_loss": -11.009279251098633, "global_step": 348955, "epoch": 2077} {"train_loss": -12.094802856445312, "global_step": 348956, "epoch": 2077} {"train_loss": -10.740492820739746, "global_step": 348957, "epoch": 2077} {"train_loss": -11.800915718078613, "global_step": 348958, "epoch": 2077} {"train_loss": -11.800628662109375, "global_step": 348959, "epoch": 2077} {"train_loss": -11.612457275390625, "global_step": 348960, "epoch": 2077} {"train_loss": -11.42393684387207, "global_step": 348961, "epoch": 2077} {"train_loss": -11.7742338180542, "global_step": 348962, "epoch": 2077} {"train_loss": -11.833097457885742, "global_step": 348963, "epoch": 2077} {"train_loss": -11.895243644714355, "global_step": 348964, "epoch": 2077} {"train_loss": -11.702258110046387, "global_step": 348965, "epoch": 2077} {"train_loss": -11.879968643188477, "global_step": 348966, "epoch": 2077} {"train_loss": -11.985679626464844, "global_step": 348967, "epoch": 2077} {"train_loss": -12.111295700073242, "global_step": 348968, "epoch": 2077} {"train_loss": -11.82022762298584, "global_step": 348969, "epoch": 2077} {"train_loss": -12.182908058166504, "global_step": 348970, "epoch": 2077} {"train_loss": -12.061220169067383, "global_step": 348971, "epoch": 2077} {"train_loss": -12.042110443115234, "global_step": 348972, "epoch": 2077} {"train_loss": -12.124229431152344, "global_step": 348973, "epoch": 2077} {"train_loss": -11.973520278930664, "global_step": 348974, "epoch": 2077} {"train_loss": -12.223886489868164, "global_step": 348975, "epoch": 2077} {"train_loss": -12.368934631347656, "global_step": 348976, "epoch": 2077} {"train_loss": -11.97486686706543, "global_step": 348977, "epoch": 2077} {"train_loss": -12.133810043334961, "global_step": 348978, "epoch": 2077} {"train_loss": -12.470008850097656, "global_step": 348979, "epoch": 2077} {"train_loss": -12.101003646850586, "global_step": 348980, "epoch": 2077} {"train_loss": -12.461959838867188, "global_step": 348981, "epoch": 2077} {"train_loss": -12.30687141418457, "global_step": 348982, "epoch": 2077} {"train_loss": -12.520796775817871, "global_step": 348983, "epoch": 2077} {"train_loss": -12.454669952392578, "global_step": 348984, "epoch": 2077} {"train_loss": -12.493013381958008, "global_step": 348985, "epoch": 2077} {"train_loss": -12.404731750488281, "global_step": 348986, "epoch": 2077} {"train_loss": -12.336138725280762, "global_step": 348987, "epoch": 2077} {"train_loss": -12.271560668945312, "global_step": 348988, "epoch": 2077} {"train_loss": -12.261638641357422, "global_step": 348989, "epoch": 2077} {"train_loss": -12.254013061523438, "global_step": 348990, "epoch": 2077} {"train_loss": -12.215723991394043, "global_step": 348991, "epoch": 2077} {"train_loss": -12.035886764526367, "global_step": 348992, "epoch": 2077} {"train_loss": -12.169657707214355, "global_step": 348993, "epoch": 2077} {"train_loss": -12.33111572265625, "global_step": 348994, "epoch": 2077} {"train_loss": -12.475044250488281, "global_step": 348995, "epoch": 2077} {"train_loss": -12.504047393798828, "global_step": 348996, "epoch": 2077} {"train_loss": -12.39042854309082, "global_step": 348997, "epoch": 2077} {"train_loss": -12.57479190826416, "global_step": 348998, "epoch": 2077} {"train_loss": -12.040498733520508, "global_step": 348999, "epoch": 2077} {"train_loss": -12.40317440032959, "global_step": 349000, "epoch": 2077} {"train_loss": -12.443021774291992, "global_step": 349001, "epoch": 2077} {"train_loss": -12.165007591247559, "global_step": 349002, "epoch": 2077} {"train_loss": -12.370965957641602, "global_step": 349003, "epoch": 2077} {"train_loss": -12.346223831176758, "global_step": 349004, "epoch": 2077} {"train_loss": -12.23508071899414, "global_step": 349005, "epoch": 2077} {"train_loss": -12.453598022460938, "global_step": 349006, "epoch": 2077} {"train_loss": -12.443513870239258, "global_step": 349007, "epoch": 2077} {"train_loss": -12.543638229370117, "global_step": 349008, "epoch": 2077} {"train_loss": -12.370887756347656, "global_step": 349009, "epoch": 2077} {"train_loss": -12.190008163452148, "global_step": 349010, "epoch": 2077} {"train_loss": -12.295480728149414, "global_step": 349011, "epoch": 2077} {"train_loss": -12.566940307617188, "global_step": 349012, "epoch": 2077} {"train_loss": -12.383964538574219, "global_step": 349013, "epoch": 2077} {"train_loss": -12.278002738952637, "global_step": 349014, "epoch": 2077} {"train_loss": -12.459159851074219, "global_step": 349015, "epoch": 2077} {"train_loss": -12.651070594787598, "global_step": 349016, "epoch": 2077} {"train_loss": -12.257794380187988, "global_step": 349017, "epoch": 2077} {"train_loss": -12.559005737304688, "global_step": 349018, "epoch": 2077} {"train_loss": -12.139284133911133, "global_step": 349019, "epoch": 2077} {"train_loss": -12.450616836547852, "global_step": 349020, "epoch": 2077} {"train_loss": -12.261005401611328, "global_step": 349021, "epoch": 2077} {"train_loss": -12.104911804199219, "global_step": 349022, "epoch": 2077} {"train_loss": -12.385156631469727, "global_step": 349023, "epoch": 2077} {"train_loss": -11.954483985900879, "global_step": 349024, "epoch": 2077} {"train_loss": -12.3539457321167, "global_step": 349025, "epoch": 2077} {"train_loss": -12.08609390258789, "global_step": 349026, "epoch": 2077} {"train_loss": -12.325116157531738, "global_step": 349027, "epoch": 2077} {"train_loss": -11.943917274475098, "global_step": 349028, "epoch": 2077} {"train_loss": -12.326615333557129, "global_step": 349029, "epoch": 2077} {"train_loss": -12.399173736572266, "global_step": 349030, "epoch": 2077} {"train_loss": -12.123411178588867, "global_step": 349031, "epoch": 2077} {"train_loss": -12.47760009765625, "global_step": 349032, "epoch": 2077} {"train_loss": -11.997844696044922, "global_step": 349033, "epoch": 2077} {"train_loss": -12.431769371032715, "global_step": 349034, "epoch": 2077} {"train_loss": -12.353263854980469, "global_step": 349035, "epoch": 2077} {"train_loss": -12.086788177490234, "global_step": 349036, "epoch": 2077} {"train_loss": -12.400070190429688, "global_step": 349037, "epoch": 2077} {"train_loss": -12.043233871459961, "global_step": 349038, "epoch": 2077} {"train_loss": -12.528481483459473, "global_step": 349039, "epoch": 2077} {"train_loss": -12.231554985046387, "global_step": 349040, "epoch": 2077} {"train_loss": -12.469286918640137, "global_step": 349041, "epoch": 2077} {"train_loss": -12.622518539428711, "global_step": 349042, "epoch": 2077} {"train_loss": -12.329731941223145, "global_step": 349043, "epoch": 2077} {"train_loss": -12.617654800415039, "global_step": 349044, "epoch": 2077} {"train_loss": -12.579665184020996, "global_step": 349045, "epoch": 2077} {"train_loss": -12.650739669799805, "global_step": 349046, "epoch": 2077} {"train_loss": -12.239561080932617, "global_step": 349047, "epoch": 2077} {"train_loss": -11.916584014892578, "global_step": 349048, "epoch": 2077} {"train_loss": -12.251696586608887, "global_step": 349049, "epoch": 2077} {"train_loss": -12.463325500488281, "global_step": 349050, "epoch": 2077} {"train_loss": -11.988658905029297, "global_step": 349051, "epoch": 2077} {"train_loss": -11.855998039245605, "global_step": 349052, "epoch": 2077} {"train_loss": -12.392605781555176, "global_step": 349053, "epoch": 2077} {"train_loss": -12.321135520935059, "global_step": 349054, "epoch": 2077} {"train_loss": -12.15212631225586, "global_step": 349055, "epoch": 2077} {"train_loss": -11.423559188842773, "global_step": 349056, "epoch": 2077} {"train_loss": -11.511651039123535, "global_step": 349057, "epoch": 2077} {"train_loss": -12.276483535766602, "global_step": 349058, "epoch": 2077} {"train_loss": -12.372636795043945, "global_step": 349059, "epoch": 2077} {"train_loss": -11.559914588928223, "global_step": 349060, "epoch": 2077} {"train_loss": -11.466047286987305, "global_step": 349061, "epoch": 2077} {"train_loss": -12.419425964355469, "global_step": 349062, "epoch": 2077} {"train_loss": -12.27092170715332, "global_step": 349063, "epoch": 2077} {"train_loss": -11.303552627563477, "global_step": 349064, "epoch": 2077} {"train_loss": -11.207748413085938, "global_step": 349065, "epoch": 2077} {"train_loss": -11.914854049682617, "global_step": 349066, "epoch": 2077} {"train_loss": -12.03281021118164, "global_step": 349067, "epoch": 2077} {"train_loss": -11.171060562133789, "global_step": 349068, "epoch": 2077} {"train_loss": -11.42952823638916, "global_step": 349069, "epoch": 2077} {"train_loss": -11.447139739990234, "global_step": 349070, "epoch": 2077} {"train_loss": -10.652946472167969, "global_step": 349071, "epoch": 2077} {"train_loss": -11.658188819885254, "global_step": 349072, "epoch": 2077} {"train_loss": -12.000778198242188, "global_step": 349073, "epoch": 2077} {"train_loss": -11.536418914794922, "global_step": 349074, "epoch": 2077} {"train_loss": -12.247739791870117, "global_step": 349075, "epoch": 2077} {"train_loss": -12.299448013305664, "global_step": 349076, "epoch": 2077} {"train_loss": -12.179773330688477, "global_step": 349077, "epoch": 2077} {"train_loss": -12.120845794677734, "global_step": 349078, "epoch": 2077} {"train_loss": -11.420108795166016, "global_step": 349079, "epoch": 2077} {"train_loss": -12.211058616638184, "global_step": 349080, "epoch": 2077} {"train_loss": -12.050077438354492, "global_step": 349081, "epoch": 2077} {"train_loss": -12.121675491333008, "global_step": 349082, "epoch": 2077} {"train_loss": -11.07888412475586, "global_step": 349083, "epoch": 2077} {"train_loss": -11.604011535644531, "global_step": 349084, "epoch": 2077} {"train_loss": -11.382621765136719, "global_step": 349085, "epoch": 2077} {"train_loss": -10.682059288024902, "global_step": 349086, "epoch": 2077} {"train_loss": -10.64331340789795, "global_step": 349087, "epoch": 2077} {"train_loss": -11.409780502319336, "global_step": 349088, "epoch": 2077} {"train_loss": -11.589943885803223, "global_step": 349089, "epoch": 2077} {"train_loss": -11.109987258911133, "global_step": 349090, "epoch": 2077} {"train_loss": -10.922271728515625, "global_step": 349091, "epoch": 2077} {"train_loss": -11.33354377746582, "global_step": 349092, "epoch": 2077} {"train_loss": -11.148571014404297, "global_step": 349093, "epoch": 2077} {"train_loss": -10.129728317260742, "global_step": 349094, "epoch": 2077} {"train_loss": -11.248797416687012, "global_step": 349095, "epoch": 2077} {"train_loss": -10.668556213378906, "global_step": 349096, "epoch": 2077} {"train_loss": -11.374038696289062, "global_step": 349097, "epoch": 2077} {"train_loss": -11.125646591186523, "global_step": 349098, "epoch": 2077} {"train_loss": -11.93681812286377, "global_step": 349099, "epoch": 2077} {"train_loss": -10.940597534179688, "global_step": 349100, "epoch": 2077} {"train_loss": -11.534997940063477, "global_step": 349101, "epoch": 2077} {"train_loss": -11.48736572265625, "global_step": 349102, "epoch": 2077} {"train_loss": -11.971591438565936, "global_step": 349103, "epoch": 2077, "val_loss": 290777.34375} {"train_loss": -11.755199432373047, "global_step": 349104, "epoch": 2078} {"train_loss": -11.003616333007812, "global_step": 349105, "epoch": 2078} {"train_loss": -11.688484191894531, "global_step": 349106, "epoch": 2078} {"train_loss": -11.486369132995605, "global_step": 349107, "epoch": 2078} {"train_loss": -11.907482147216797, "global_step": 349108, "epoch": 2078} {"train_loss": -11.56027889251709, "global_step": 349109, "epoch": 2078} {"train_loss": -12.053985595703125, "global_step": 349110, "epoch": 2078} {"train_loss": -11.643253326416016, "global_step": 349111, "epoch": 2078} {"train_loss": -12.215023040771484, "global_step": 349112, "epoch": 2078} {"train_loss": -11.861913681030273, "global_step": 349113, "epoch": 2078} {"train_loss": -12.281400680541992, "global_step": 349114, "epoch": 2078} {"train_loss": -11.972322463989258, "global_step": 349115, "epoch": 2078} {"train_loss": -12.007784843444824, "global_step": 349116, "epoch": 2078} {"train_loss": -12.059061050415039, "global_step": 349117, "epoch": 2078} {"train_loss": -12.047225952148438, "global_step": 349118, "epoch": 2078} {"train_loss": -12.1258544921875, "global_step": 349119, "epoch": 2078} {"train_loss": -12.27599811553955, "global_step": 349120, "epoch": 2078} {"train_loss": -12.104484558105469, "global_step": 349121, "epoch": 2078} {"train_loss": -12.155442237854004, "global_step": 349122, "epoch": 2078} {"train_loss": -12.144224166870117, "global_step": 349123, "epoch": 2078} {"train_loss": -12.429222106933594, "global_step": 349124, "epoch": 2078} {"train_loss": -11.741815567016602, "global_step": 349125, "epoch": 2078} {"train_loss": -12.125423431396484, "global_step": 349126, "epoch": 2078} {"train_loss": -11.906486511230469, "global_step": 349127, "epoch": 2078} {"train_loss": -11.430356979370117, "global_step": 349128, "epoch": 2078} {"train_loss": -12.153745651245117, "global_step": 349129, "epoch": 2078} {"train_loss": -12.016786575317383, "global_step": 349130, "epoch": 2078} {"train_loss": -11.966180801391602, "global_step": 349131, "epoch": 2078} {"train_loss": -12.301525115966797, "global_step": 349132, "epoch": 2078} {"train_loss": -12.02597427368164, "global_step": 349133, "epoch": 2078} {"train_loss": -12.244647979736328, "global_step": 349134, "epoch": 2078} {"train_loss": -11.775291442871094, "global_step": 349135, "epoch": 2078} {"train_loss": -12.262754440307617, "global_step": 349136, "epoch": 2078} {"train_loss": -12.202215194702148, "global_step": 349137, "epoch": 2078} {"train_loss": -12.218849182128906, "global_step": 349138, "epoch": 2078} {"train_loss": -12.174478530883789, "global_step": 349139, "epoch": 2078} {"train_loss": -12.336780548095703, "global_step": 349140, "epoch": 2078} {"train_loss": -12.229818344116211, "global_step": 349141, "epoch": 2078} {"train_loss": -12.331003189086914, "global_step": 349142, "epoch": 2078} {"train_loss": -12.25272274017334, "global_step": 349143, "epoch": 2078} {"train_loss": -12.025821685791016, "global_step": 349144, "epoch": 2078} {"train_loss": -12.372573852539062, "global_step": 349145, "epoch": 2078} {"train_loss": -12.195476531982422, "global_step": 349146, "epoch": 2078} {"train_loss": -12.48729133605957, "global_step": 349147, "epoch": 2078} {"train_loss": -12.305272102355957, "global_step": 349148, "epoch": 2078} {"train_loss": -12.163520812988281, "global_step": 349149, "epoch": 2078} {"train_loss": -12.514056205749512, "global_step": 349150, "epoch": 2078} {"train_loss": -12.094795227050781, "global_step": 349151, "epoch": 2078} {"train_loss": -12.234273910522461, "global_step": 349152, "epoch": 2078} {"train_loss": -11.7965669631958, "global_step": 349153, "epoch": 2078} {"train_loss": -11.991384506225586, "global_step": 349154, "epoch": 2078} {"train_loss": -12.40301513671875, "global_step": 349155, "epoch": 2078} {"train_loss": -12.272821426391602, "global_step": 349156, "epoch": 2078} {"train_loss": -12.30136489868164, "global_step": 349157, "epoch": 2078} {"train_loss": -12.395164489746094, "global_step": 349158, "epoch": 2078} {"train_loss": -12.317291259765625, "global_step": 349159, "epoch": 2078} {"train_loss": -12.348666191101074, "global_step": 349160, "epoch": 2078} {"train_loss": -12.158096313476562, "global_step": 349161, "epoch": 2078} {"train_loss": -12.481010437011719, "global_step": 349162, "epoch": 2078} {"train_loss": -12.370290756225586, "global_step": 349163, "epoch": 2078} {"train_loss": -12.560443878173828, "global_step": 349164, "epoch": 2078} {"train_loss": -12.319891929626465, "global_step": 349165, "epoch": 2078} {"train_loss": -12.603074073791504, "global_step": 349166, "epoch": 2078} {"train_loss": -12.582696914672852, "global_step": 349167, "epoch": 2078} {"train_loss": -12.47704029083252, "global_step": 349168, "epoch": 2078} {"train_loss": -12.098926544189453, "global_step": 349169, "epoch": 2078} {"train_loss": -12.457822799682617, "global_step": 349170, "epoch": 2078} {"train_loss": -12.35916519165039, "global_step": 349171, "epoch": 2078} {"train_loss": -12.32699203491211, "global_step": 349172, "epoch": 2078} {"train_loss": -12.251029968261719, "global_step": 349173, "epoch": 2078} {"train_loss": -12.3919095993042, "global_step": 349174, "epoch": 2078} {"train_loss": -12.458410263061523, "global_step": 349175, "epoch": 2078} {"train_loss": -12.399356842041016, "global_step": 349176, "epoch": 2078} {"train_loss": -12.517126083374023, "global_step": 349177, "epoch": 2078} {"train_loss": -12.417853355407715, "global_step": 349178, "epoch": 2078} {"train_loss": -12.610990524291992, "global_step": 349179, "epoch": 2078} {"train_loss": -12.36044692993164, "global_step": 349180, "epoch": 2078} {"train_loss": -12.571322441101074, "global_step": 349181, "epoch": 2078} {"train_loss": -12.431535720825195, "global_step": 349182, "epoch": 2078} {"train_loss": -12.531866073608398, "global_step": 349183, "epoch": 2078} {"train_loss": -12.474674224853516, "global_step": 349184, "epoch": 2078} {"train_loss": -11.861377716064453, "global_step": 349185, "epoch": 2078} {"train_loss": -12.414652824401855, "global_step": 349186, "epoch": 2078} {"train_loss": -12.200143814086914, "global_step": 349187, "epoch": 2078} {"train_loss": -12.242119789123535, "global_step": 349188, "epoch": 2078} {"train_loss": -12.198572158813477, "global_step": 349189, "epoch": 2078} {"train_loss": -11.829818725585938, "global_step": 349190, "epoch": 2078} {"train_loss": -11.583812713623047, "global_step": 349191, "epoch": 2078} {"train_loss": -12.546253204345703, "global_step": 349192, "epoch": 2078} {"train_loss": -11.51431655883789, "global_step": 349193, "epoch": 2078} {"train_loss": -12.496560096740723, "global_step": 349194, "epoch": 2078} {"train_loss": -11.441926956176758, "global_step": 349195, "epoch": 2078} {"train_loss": -11.862703323364258, "global_step": 349196, "epoch": 2078} {"train_loss": -12.256120681762695, "global_step": 349197, "epoch": 2078} {"train_loss": -12.478811264038086, "global_step": 349198, "epoch": 2078} {"train_loss": -12.123444557189941, "global_step": 349199, "epoch": 2078} {"train_loss": -12.275819778442383, "global_step": 349200, "epoch": 2078} {"train_loss": -12.509635925292969, "global_step": 349201, "epoch": 2078} {"train_loss": -11.880928039550781, "global_step": 349202, "epoch": 2078} {"train_loss": -12.46595573425293, "global_step": 349203, "epoch": 2078} {"train_loss": -12.144161224365234, "global_step": 349204, "epoch": 2078} {"train_loss": -12.315864562988281, "global_step": 349205, "epoch": 2078} {"train_loss": -12.500001907348633, "global_step": 349206, "epoch": 2078} {"train_loss": -12.058246612548828, "global_step": 349207, "epoch": 2078} {"train_loss": -11.458734512329102, "global_step": 349208, "epoch": 2078} {"train_loss": -11.380486488342285, "global_step": 349209, "epoch": 2078} {"train_loss": -10.9899320602417, "global_step": 349210, "epoch": 2078} {"train_loss": -11.584855079650879, "global_step": 349211, "epoch": 2078} {"train_loss": -11.472573280334473, "global_step": 349212, "epoch": 2078} {"train_loss": -10.478578567504883, "global_step": 349213, "epoch": 2078} {"train_loss": -11.454832077026367, "global_step": 349214, "epoch": 2078} {"train_loss": -10.767467498779297, "global_step": 349215, "epoch": 2078} {"train_loss": -11.51101303100586, "global_step": 349216, "epoch": 2078} {"train_loss": -11.868219375610352, "global_step": 349217, "epoch": 2078} {"train_loss": -11.251838684082031, "global_step": 349218, "epoch": 2078} {"train_loss": -11.641658782958984, "global_step": 349219, "epoch": 2078} {"train_loss": -12.170246124267578, "global_step": 349220, "epoch": 2078} {"train_loss": -10.925782203674316, "global_step": 349221, "epoch": 2078} {"train_loss": -12.263036727905273, "global_step": 349222, "epoch": 2078} {"train_loss": -11.76184368133545, "global_step": 349223, "epoch": 2078} {"train_loss": -11.837695121765137, "global_step": 349224, "epoch": 2078} {"train_loss": -11.464274406433105, "global_step": 349225, "epoch": 2078} {"train_loss": -11.479982376098633, "global_step": 349226, "epoch": 2078} {"train_loss": -11.705881118774414, "global_step": 349227, "epoch": 2078} {"train_loss": -11.52784538269043, "global_step": 349228, "epoch": 2078} {"train_loss": -11.860123634338379, "global_step": 349229, "epoch": 2078} {"train_loss": -11.8067626953125, "global_step": 349230, "epoch": 2078} {"train_loss": -11.07115364074707, "global_step": 349231, "epoch": 2078} {"train_loss": -11.448123931884766, "global_step": 349232, "epoch": 2078} {"train_loss": -9.643117904663086, "global_step": 349233, "epoch": 2078} {"train_loss": -11.531282424926758, "global_step": 349234, "epoch": 2078} {"train_loss": -10.755178451538086, "global_step": 349235, "epoch": 2078} {"train_loss": -10.529461860656738, "global_step": 349236, "epoch": 2078} {"train_loss": -11.679695129394531, "global_step": 349237, "epoch": 2078} {"train_loss": -9.747091293334961, "global_step": 349238, "epoch": 2078} {"train_loss": -11.236428260803223, "global_step": 349239, "epoch": 2078} {"train_loss": -11.605209350585938, "global_step": 349240, "epoch": 2078} {"train_loss": -10.646925926208496, "global_step": 349241, "epoch": 2078} {"train_loss": -11.467523574829102, "global_step": 349242, "epoch": 2078} {"train_loss": -10.754813194274902, "global_step": 349243, "epoch": 2078} {"train_loss": -11.116567611694336, "global_step": 349244, "epoch": 2078} {"train_loss": -10.642091751098633, "global_step": 349245, "epoch": 2078} {"train_loss": -11.075713157653809, "global_step": 349246, "epoch": 2078} {"train_loss": -10.885786056518555, "global_step": 349247, "epoch": 2078} {"train_loss": -11.338193893432617, "global_step": 349248, "epoch": 2078} {"train_loss": -11.073447227478027, "global_step": 349249, "epoch": 2078} {"train_loss": -11.672182083129883, "global_step": 349250, "epoch": 2078} {"train_loss": -11.48744010925293, "global_step": 349251, "epoch": 2078} {"train_loss": -12.09756088256836, "global_step": 349252, "epoch": 2078} {"train_loss": -11.342634201049805, "global_step": 349253, "epoch": 2078} {"train_loss": -11.812390327453613, "global_step": 349254, "epoch": 2078} {"train_loss": -11.286409378051758, "global_step": 349255, "epoch": 2078} {"train_loss": -11.75395393371582, "global_step": 349256, "epoch": 2078} {"train_loss": -11.776932716369629, "global_step": 349257, "epoch": 2078} {"train_loss": -12.213759422302246, "global_step": 349258, "epoch": 2078} {"train_loss": -11.910017013549805, "global_step": 349259, "epoch": 2078} {"train_loss": -12.324679374694824, "global_step": 349260, "epoch": 2078} {"train_loss": -11.80212688446045, "global_step": 349261, "epoch": 2078} {"train_loss": -12.225326538085938, "global_step": 349262, "epoch": 2078} {"train_loss": -11.864063262939453, "global_step": 349263, "epoch": 2078} {"train_loss": -11.988207817077637, "global_step": 349264, "epoch": 2078} {"train_loss": -12.346134185791016, "global_step": 349265, "epoch": 2078} {"train_loss": -12.102537155151367, "global_step": 349266, "epoch": 2078} {"train_loss": -12.212040901184082, "global_step": 349267, "epoch": 2078} {"train_loss": -12.194231986999512, "global_step": 349268, "epoch": 2078} {"train_loss": -12.105201721191406, "global_step": 349269, "epoch": 2078} {"train_loss": -12.307703971862793, "global_step": 349270, "epoch": 2078} {"train_loss": -11.915904737654186, "global_step": 349271, "epoch": 2078, "val_loss": 292109.0} {"train_loss": -12.02944278717041, "global_step": 349272, "epoch": 2079} {"train_loss": -12.306753158569336, "global_step": 349273, "epoch": 2079} {"train_loss": -11.94707202911377, "global_step": 349274, "epoch": 2079} {"train_loss": -11.95386028289795, "global_step": 349275, "epoch": 2079} {"train_loss": -12.04922103881836, "global_step": 349276, "epoch": 2079} {"train_loss": -11.798728942871094, "global_step": 349277, "epoch": 2079} {"train_loss": -12.193910598754883, "global_step": 349278, "epoch": 2079} {"train_loss": -12.24952507019043, "global_step": 349279, "epoch": 2079} {"train_loss": -11.868717193603516, "global_step": 349280, "epoch": 2079} {"train_loss": -12.257800102233887, "global_step": 349281, "epoch": 2079} {"train_loss": -12.010141372680664, "global_step": 349282, "epoch": 2079} {"train_loss": -12.01115608215332, "global_step": 349283, "epoch": 2079} {"train_loss": -12.233631134033203, "global_step": 349284, "epoch": 2079} {"train_loss": -12.081842422485352, "global_step": 349285, "epoch": 2079} {"train_loss": -12.173559188842773, "global_step": 349286, "epoch": 2079} {"train_loss": -12.188064575195312, "global_step": 349287, "epoch": 2079} {"train_loss": -12.277560234069824, "global_step": 349288, "epoch": 2079} {"train_loss": -12.572071075439453, "global_step": 349289, "epoch": 2079} {"train_loss": -11.991715431213379, "global_step": 349290, "epoch": 2079} {"train_loss": -12.388931274414062, "global_step": 349291, "epoch": 2079} {"train_loss": -12.34557056427002, "global_step": 349292, "epoch": 2079} {"train_loss": -12.151988983154297, "global_step": 349293, "epoch": 2079} {"train_loss": -12.298343658447266, "global_step": 349294, "epoch": 2079} {"train_loss": -12.202924728393555, "global_step": 349295, "epoch": 2079} {"train_loss": -12.50571060180664, "global_step": 349296, "epoch": 2079} {"train_loss": -12.366495132446289, "global_step": 349297, "epoch": 2079} {"train_loss": -12.422160148620605, "global_step": 349298, "epoch": 2079} {"train_loss": -12.280834197998047, "global_step": 349299, "epoch": 2079} {"train_loss": -12.460996627807617, "global_step": 349300, "epoch": 2079} {"train_loss": -12.408090591430664, "global_step": 349301, "epoch": 2079} {"train_loss": -12.523406982421875, "global_step": 349302, "epoch": 2079} {"train_loss": -12.433130264282227, "global_step": 349303, "epoch": 2079} {"train_loss": -12.478106498718262, "global_step": 349304, "epoch": 2079} {"train_loss": -12.35490608215332, "global_step": 349305, "epoch": 2079} {"train_loss": -12.531160354614258, "global_step": 349306, "epoch": 2079} {"train_loss": -12.28535270690918, "global_step": 349307, "epoch": 2079} {"train_loss": -12.319881439208984, "global_step": 349308, "epoch": 2079} {"train_loss": -12.307748794555664, "global_step": 349309, "epoch": 2079} {"train_loss": -12.084507942199707, "global_step": 349310, "epoch": 2079} {"train_loss": -11.822042465209961, "global_step": 349311, "epoch": 2079} {"train_loss": -11.52828598022461, "global_step": 349312, "epoch": 2079} {"train_loss": -12.391950607299805, "global_step": 349313, "epoch": 2079} {"train_loss": -10.384082794189453, "global_step": 349314, "epoch": 2079} {"train_loss": -10.504542350769043, "global_step": 349315, "epoch": 2079} {"train_loss": -12.05227279663086, "global_step": 349316, "epoch": 2079} {"train_loss": -11.23198127746582, "global_step": 349317, "epoch": 2079} {"train_loss": -11.214305877685547, "global_step": 349318, "epoch": 2079} {"train_loss": -12.098093032836914, "global_step": 349319, "epoch": 2079} {"train_loss": -10.924612045288086, "global_step": 349320, "epoch": 2079} {"train_loss": -11.689064025878906, "global_step": 349321, "epoch": 2079} {"train_loss": -11.719639778137207, "global_step": 349322, "epoch": 2079} {"train_loss": -11.399097442626953, "global_step": 349323, "epoch": 2079} {"train_loss": -11.948244094848633, "global_step": 349324, "epoch": 2079} {"train_loss": -10.907893180847168, "global_step": 349325, "epoch": 2079} {"train_loss": -11.999825477600098, "global_step": 349326, "epoch": 2079} {"train_loss": -11.05521011352539, "global_step": 349327, "epoch": 2079} {"train_loss": -11.704919815063477, "global_step": 349328, "epoch": 2079} {"train_loss": -12.09205436706543, "global_step": 349329, "epoch": 2079} {"train_loss": -11.211296081542969, "global_step": 349330, "epoch": 2079} {"train_loss": -12.060298919677734, "global_step": 349331, "epoch": 2079} {"train_loss": -11.982988357543945, "global_step": 349332, "epoch": 2079} {"train_loss": -11.450736045837402, "global_step": 349333, "epoch": 2079} {"train_loss": -12.056321144104004, "global_step": 349334, "epoch": 2079} {"train_loss": -11.461444854736328, "global_step": 349335, "epoch": 2079} {"train_loss": -12.187397003173828, "global_step": 349336, "epoch": 2079} {"train_loss": -11.574484825134277, "global_step": 349337, "epoch": 2079} {"train_loss": -12.00827693939209, "global_step": 349338, "epoch": 2079} {"train_loss": -12.055315017700195, "global_step": 349339, "epoch": 2079} {"train_loss": -12.13685417175293, "global_step": 349340, "epoch": 2079} {"train_loss": -11.869791984558105, "global_step": 349341, "epoch": 2079} {"train_loss": -11.99085521697998, "global_step": 349342, "epoch": 2079} {"train_loss": -12.113930702209473, "global_step": 349343, "epoch": 2079} {"train_loss": -12.288454055786133, "global_step": 349344, "epoch": 2079} {"train_loss": -12.12707805633545, "global_step": 349345, "epoch": 2079} {"train_loss": -12.006600379943848, "global_step": 349346, "epoch": 2079} {"train_loss": -12.229881286621094, "global_step": 349347, "epoch": 2079} {"train_loss": -11.937139511108398, "global_step": 349348, "epoch": 2079} {"train_loss": -12.402179718017578, "global_step": 349349, "epoch": 2079} {"train_loss": -12.326072692871094, "global_step": 349350, "epoch": 2079} {"train_loss": -12.327401161193848, "global_step": 349351, "epoch": 2079} {"train_loss": -12.364084243774414, "global_step": 349352, "epoch": 2079} {"train_loss": -12.324993133544922, "global_step": 349353, "epoch": 2079} {"train_loss": -12.482275009155273, "global_step": 349354, "epoch": 2079} {"train_loss": -12.271629333496094, "global_step": 349355, "epoch": 2079} {"train_loss": -12.376775741577148, "global_step": 349356, "epoch": 2079} {"train_loss": -12.428154945373535, "global_step": 349357, "epoch": 2079} {"train_loss": -12.225578308105469, "global_step": 349358, "epoch": 2079} {"train_loss": -12.391762733459473, "global_step": 349359, "epoch": 2079} {"train_loss": -12.302478790283203, "global_step": 349360, "epoch": 2079} {"train_loss": -12.627476692199707, "global_step": 349361, "epoch": 2079} {"train_loss": -12.151824951171875, "global_step": 349362, "epoch": 2079} {"train_loss": -12.229166030883789, "global_step": 349363, "epoch": 2079} {"train_loss": -12.337019920349121, "global_step": 349364, "epoch": 2079} {"train_loss": -12.532845497131348, "global_step": 349365, "epoch": 2079} {"train_loss": -12.456771850585938, "global_step": 349366, "epoch": 2079} {"train_loss": -12.592456817626953, "global_step": 349367, "epoch": 2079} {"train_loss": -12.65038013458252, "global_step": 349368, "epoch": 2079} {"train_loss": -12.518091201782227, "global_step": 349369, "epoch": 2079} {"train_loss": -12.522574424743652, "global_step": 349370, "epoch": 2079} {"train_loss": -12.551105499267578, "global_step": 349371, "epoch": 2079} {"train_loss": -12.611489295959473, "global_step": 349372, "epoch": 2079} {"train_loss": -12.137948036193848, "global_step": 349373, "epoch": 2079} {"train_loss": -12.029199600219727, "global_step": 349374, "epoch": 2079} {"train_loss": -12.095426559448242, "global_step": 349375, "epoch": 2079} {"train_loss": -12.179478645324707, "global_step": 349376, "epoch": 2079} {"train_loss": -12.196374893188477, "global_step": 349377, "epoch": 2079} {"train_loss": -12.494182586669922, "global_step": 349378, "epoch": 2079} {"train_loss": -11.963594436645508, "global_step": 349379, "epoch": 2079} {"train_loss": -10.656006813049316, "global_step": 349380, "epoch": 2079} {"train_loss": -11.982606887817383, "global_step": 349381, "epoch": 2079} {"train_loss": -11.384977340698242, "global_step": 349382, "epoch": 2079} {"train_loss": -9.47949504852295, "global_step": 349383, "epoch": 2079} {"train_loss": -12.351041793823242, "global_step": 349384, "epoch": 2079} {"train_loss": -10.585437774658203, "global_step": 349385, "epoch": 2079} {"train_loss": -10.489157676696777, "global_step": 349386, "epoch": 2079} {"train_loss": -11.524333000183105, "global_step": 349387, "epoch": 2079} {"train_loss": -9.789716720581055, "global_step": 349388, "epoch": 2079} {"train_loss": -9.322669982910156, "global_step": 349389, "epoch": 2079} {"train_loss": -10.96286392211914, "global_step": 349390, "epoch": 2079} {"train_loss": -10.987211227416992, "global_step": 349391, "epoch": 2079} {"train_loss": -9.590578079223633, "global_step": 349392, "epoch": 2079} {"train_loss": -11.414867401123047, "global_step": 349393, "epoch": 2079} {"train_loss": -10.621490478515625, "global_step": 349394, "epoch": 2079} {"train_loss": -9.715733528137207, "global_step": 349395, "epoch": 2079} {"train_loss": -10.438140869140625, "global_step": 349396, "epoch": 2079} {"train_loss": -11.075128555297852, "global_step": 349397, "epoch": 2079} {"train_loss": -9.222790718078613, "global_step": 349398, "epoch": 2079} {"train_loss": -11.002446174621582, "global_step": 349399, "epoch": 2079} {"train_loss": -8.546524047851562, "global_step": 349400, "epoch": 2079} {"train_loss": -10.324050903320312, "global_step": 349401, "epoch": 2079} {"train_loss": -7.602871894836426, "global_step": 349402, "epoch": 2079} {"train_loss": -8.856985092163086, "global_step": 349403, "epoch": 2079} {"train_loss": -9.778971672058105, "global_step": 349404, "epoch": 2079} {"train_loss": -10.365467071533203, "global_step": 349405, "epoch": 2079} {"train_loss": -10.303577423095703, "global_step": 349406, "epoch": 2079} {"train_loss": -10.105310440063477, "global_step": 349407, "epoch": 2079} {"train_loss": -10.613214492797852, "global_step": 349408, "epoch": 2079} {"train_loss": -10.810474395751953, "global_step": 349409, "epoch": 2079} {"train_loss": -10.141365051269531, "global_step": 349410, "epoch": 2079} {"train_loss": -11.454340934753418, "global_step": 349411, "epoch": 2079} {"train_loss": -11.130399703979492, "global_step": 349412, "epoch": 2079} {"train_loss": -11.59393310546875, "global_step": 349413, "epoch": 2079} {"train_loss": -11.370265007019043, "global_step": 349414, "epoch": 2079} {"train_loss": -11.529870986938477, "global_step": 349415, "epoch": 2079} {"train_loss": -10.69452953338623, "global_step": 349416, "epoch": 2079} {"train_loss": -11.744207382202148, "global_step": 349417, "epoch": 2079} {"train_loss": -11.342317581176758, "global_step": 349418, "epoch": 2079} {"train_loss": -11.490817070007324, "global_step": 349419, "epoch": 2079} {"train_loss": -11.572200775146484, "global_step": 349420, "epoch": 2079} {"train_loss": -11.578228950500488, "global_step": 349421, "epoch": 2079} {"train_loss": -10.872611045837402, "global_step": 349422, "epoch": 2079} {"train_loss": -11.71909236907959, "global_step": 349423, "epoch": 2079} {"train_loss": -11.281123161315918, "global_step": 349424, "epoch": 2079} {"train_loss": -11.643985748291016, "global_step": 349425, "epoch": 2079} {"train_loss": -11.70537281036377, "global_step": 349426, "epoch": 2079} {"train_loss": -11.493426322937012, "global_step": 349427, "epoch": 2079} {"train_loss": -11.768373489379883, "global_step": 349428, "epoch": 2079} {"train_loss": -11.980369567871094, "global_step": 349429, "epoch": 2079} {"train_loss": -11.62905502319336, "global_step": 349430, "epoch": 2079} {"train_loss": -11.679061889648438, "global_step": 349431, "epoch": 2079} {"train_loss": -11.736011505126953, "global_step": 349432, "epoch": 2079} {"train_loss": -11.847214698791504, "global_step": 349433, "epoch": 2079} {"train_loss": -11.859895706176758, "global_step": 349434, "epoch": 2079} {"train_loss": -11.946239471435547, "global_step": 349435, "epoch": 2079} {"train_loss": -11.921976089477539, "global_step": 349436, "epoch": 2079} {"train_loss": -11.915786743164062, "global_step": 349437, "epoch": 2079} {"train_loss": -12.037627220153809, "global_step": 349438, "epoch": 2079} {"train_loss": -11.68099842752729, "global_step": 349439, "epoch": 2079, "val_loss": 288346.5625} {"train_loss": -11.886512756347656, "global_step": 349440, "epoch": 2080} {"train_loss": -12.18793773651123, "global_step": 349441, "epoch": 2080} {"train_loss": -12.139434814453125, "global_step": 349442, "epoch": 2080} {"train_loss": -11.884378433227539, "global_step": 349443, "epoch": 2080} {"train_loss": -11.893802642822266, "global_step": 349444, "epoch": 2080} {"train_loss": -12.068798065185547, "global_step": 349445, "epoch": 2080} {"train_loss": -11.571588516235352, "global_step": 349446, "epoch": 2080} {"train_loss": -12.271252632141113, "global_step": 349447, "epoch": 2080} {"train_loss": -12.091885566711426, "global_step": 349448, "epoch": 2080} {"train_loss": -12.219371795654297, "global_step": 349449, "epoch": 2080} {"train_loss": -12.045695304870605, "global_step": 349450, "epoch": 2080} {"train_loss": -12.257966995239258, "global_step": 349451, "epoch": 2080} {"train_loss": -12.103187561035156, "global_step": 349452, "epoch": 2080} {"train_loss": -11.945799827575684, "global_step": 349453, "epoch": 2080} {"train_loss": -12.165122032165527, "global_step": 349454, "epoch": 2080} {"train_loss": -11.962865829467773, "global_step": 349455, "epoch": 2080} {"train_loss": -12.281046867370605, "global_step": 349456, "epoch": 2080} {"train_loss": -11.939979553222656, "global_step": 349457, "epoch": 2080} {"train_loss": -12.24692440032959, "global_step": 349458, "epoch": 2080} {"train_loss": -12.075284957885742, "global_step": 349459, "epoch": 2080} {"train_loss": -12.167863845825195, "global_step": 349460, "epoch": 2080} {"train_loss": -12.193306922912598, "global_step": 349461, "epoch": 2080} {"train_loss": -12.22899055480957, "global_step": 349462, "epoch": 2080} {"train_loss": -12.082487106323242, "global_step": 349463, "epoch": 2080} {"train_loss": -12.138708114624023, "global_step": 349464, "epoch": 2080} {"train_loss": -11.988762855529785, "global_step": 349465, "epoch": 2080} {"train_loss": -12.30344009399414, "global_step": 349466, "epoch": 2080} {"train_loss": -12.149077415466309, "global_step": 349467, "epoch": 2080} {"train_loss": -11.995681762695312, "global_step": 349468, "epoch": 2080} {"train_loss": -12.123955726623535, "global_step": 349469, "epoch": 2080} {"train_loss": -12.273635864257812, "global_step": 349470, "epoch": 2080} {"train_loss": -11.89505386352539, "global_step": 349471, "epoch": 2080} {"train_loss": -12.338750839233398, "global_step": 349472, "epoch": 2080} {"train_loss": -12.227169036865234, "global_step": 349473, "epoch": 2080} {"train_loss": -11.93942642211914, "global_step": 349474, "epoch": 2080} {"train_loss": -11.966089248657227, "global_step": 349475, "epoch": 2080} {"train_loss": -12.088342666625977, "global_step": 349476, "epoch": 2080} {"train_loss": -11.92862606048584, "global_step": 349477, "epoch": 2080} {"train_loss": -11.801350593566895, "global_step": 349478, "epoch": 2080} {"train_loss": -12.051042556762695, "global_step": 349479, "epoch": 2080} {"train_loss": -11.910005569458008, "global_step": 349480, "epoch": 2080} {"train_loss": -12.323341369628906, "global_step": 349481, "epoch": 2080} {"train_loss": -12.056556701660156, "global_step": 349482, "epoch": 2080} {"train_loss": -12.443721771240234, "global_step": 349483, "epoch": 2080} {"train_loss": -12.061470031738281, "global_step": 349484, "epoch": 2080} {"train_loss": -12.445384979248047, "global_step": 349485, "epoch": 2080} {"train_loss": -12.054673194885254, "global_step": 349486, "epoch": 2080} {"train_loss": -12.206355094909668, "global_step": 349487, "epoch": 2080} {"train_loss": -12.220230102539062, "global_step": 349488, "epoch": 2080} {"train_loss": -12.22911262512207, "global_step": 349489, "epoch": 2080} {"train_loss": -12.215472221374512, "global_step": 349490, "epoch": 2080} {"train_loss": -12.529865264892578, "global_step": 349491, "epoch": 2080} {"train_loss": -12.072545051574707, "global_step": 349492, "epoch": 2080} {"train_loss": -12.377921104431152, "global_step": 349493, "epoch": 2080} {"train_loss": -12.371639251708984, "global_step": 349494, "epoch": 2080} {"train_loss": -12.428391456604004, "global_step": 349495, "epoch": 2080} {"train_loss": -12.444134712219238, "global_step": 349496, "epoch": 2080} {"train_loss": -12.247342109680176, "global_step": 349497, "epoch": 2080} {"train_loss": -12.671554565429688, "global_step": 349498, "epoch": 2080} {"train_loss": -12.599421501159668, "global_step": 349499, "epoch": 2080} {"train_loss": -12.513660430908203, "global_step": 349500, "epoch": 2080} {"train_loss": -12.429665565490723, "global_step": 349501, "epoch": 2080} {"train_loss": -12.18968391418457, "global_step": 349502, "epoch": 2080} {"train_loss": -12.500446319580078, "global_step": 349503, "epoch": 2080} {"train_loss": -12.458256721496582, "global_step": 349504, "epoch": 2080} {"train_loss": -12.312118530273438, "global_step": 349505, "epoch": 2080} {"train_loss": -12.406966209411621, "global_step": 349506, "epoch": 2080} {"train_loss": -12.503097534179688, "global_step": 349507, "epoch": 2080} {"train_loss": -12.62663459777832, "global_step": 349508, "epoch": 2080} {"train_loss": -12.564261436462402, "global_step": 349509, "epoch": 2080} {"train_loss": -12.15329360961914, "global_step": 349510, "epoch": 2080} {"train_loss": -12.209904670715332, "global_step": 349511, "epoch": 2080} {"train_loss": -12.068692207336426, "global_step": 349512, "epoch": 2080} {"train_loss": -11.138079643249512, "global_step": 349513, "epoch": 2080} {"train_loss": -12.205366134643555, "global_step": 349514, "epoch": 2080} {"train_loss": -12.307584762573242, "global_step": 349515, "epoch": 2080} {"train_loss": -11.925125122070312, "global_step": 349516, "epoch": 2080} {"train_loss": -11.918756484985352, "global_step": 349517, "epoch": 2080} {"train_loss": -12.47782039642334, "global_step": 349518, "epoch": 2080} {"train_loss": -11.967365264892578, "global_step": 349519, "epoch": 2080} {"train_loss": -12.308082580566406, "global_step": 349520, "epoch": 2080} {"train_loss": -12.212096214294434, "global_step": 349521, "epoch": 2080} {"train_loss": -12.506031036376953, "global_step": 349522, "epoch": 2080} {"train_loss": -12.552423477172852, "global_step": 349523, "epoch": 2080} {"train_loss": -12.338298797607422, "global_step": 349524, "epoch": 2080} {"train_loss": -12.343755722045898, "global_step": 349525, "epoch": 2080} {"train_loss": -12.26153564453125, "global_step": 349526, "epoch": 2080} {"train_loss": -12.082765579223633, "global_step": 349527, "epoch": 2080} {"train_loss": -10.801969528198242, "global_step": 349528, "epoch": 2080} {"train_loss": -12.156352043151855, "global_step": 349529, "epoch": 2080} {"train_loss": -12.239339828491211, "global_step": 349530, "epoch": 2080} {"train_loss": -11.008079528808594, "global_step": 349531, "epoch": 2080} {"train_loss": -12.21866226196289, "global_step": 349532, "epoch": 2080} {"train_loss": -12.092838287353516, "global_step": 349533, "epoch": 2080} {"train_loss": -11.893247604370117, "global_step": 349534, "epoch": 2080} {"train_loss": -11.88046646118164, "global_step": 349535, "epoch": 2080} {"train_loss": -12.092132568359375, "global_step": 349536, "epoch": 2080} {"train_loss": -12.300527572631836, "global_step": 349537, "epoch": 2080} {"train_loss": -12.297529220581055, "global_step": 349538, "epoch": 2080} {"train_loss": -12.144014358520508, "global_step": 349539, "epoch": 2080} {"train_loss": -12.370014190673828, "global_step": 349540, "epoch": 2080} {"train_loss": -12.641916275024414, "global_step": 349541, "epoch": 2080} {"train_loss": -12.341424942016602, "global_step": 349542, "epoch": 2080} {"train_loss": -12.417445182800293, "global_step": 349543, "epoch": 2080} {"train_loss": -12.466154098510742, "global_step": 349544, "epoch": 2080} {"train_loss": -11.773895263671875, "global_step": 349545, "epoch": 2080} {"train_loss": -11.102301597595215, "global_step": 349546, "epoch": 2080} {"train_loss": -12.480810165405273, "global_step": 349547, "epoch": 2080} {"train_loss": -12.108299255371094, "global_step": 349548, "epoch": 2080} {"train_loss": -11.74542236328125, "global_step": 349549, "epoch": 2080} {"train_loss": -11.0834321975708, "global_step": 349550, "epoch": 2080} {"train_loss": -12.094386100769043, "global_step": 349551, "epoch": 2080} {"train_loss": -10.338638305664062, "global_step": 349552, "epoch": 2080} {"train_loss": -11.657954216003418, "global_step": 349553, "epoch": 2080} {"train_loss": -9.930723190307617, "global_step": 349554, "epoch": 2080} {"train_loss": -10.259295463562012, "global_step": 349555, "epoch": 2080} {"train_loss": -11.55099105834961, "global_step": 349556, "epoch": 2080} {"train_loss": -11.066156387329102, "global_step": 349557, "epoch": 2080} {"train_loss": -11.36623764038086, "global_step": 349558, "epoch": 2080} {"train_loss": -11.576190948486328, "global_step": 349559, "epoch": 2080} {"train_loss": -9.757364273071289, "global_step": 349560, "epoch": 2080} {"train_loss": -10.90339469909668, "global_step": 349561, "epoch": 2080} {"train_loss": -11.185446739196777, "global_step": 349562, "epoch": 2080} {"train_loss": -10.159590721130371, "global_step": 349563, "epoch": 2080} {"train_loss": -10.142251968383789, "global_step": 349564, "epoch": 2080} {"train_loss": -11.883760452270508, "global_step": 349565, "epoch": 2080} {"train_loss": -11.085916519165039, "global_step": 349566, "epoch": 2080} {"train_loss": -11.51608657836914, "global_step": 349567, "epoch": 2080} {"train_loss": -10.755472183227539, "global_step": 349568, "epoch": 2080} {"train_loss": -11.050216674804688, "global_step": 349569, "epoch": 2080} {"train_loss": -11.320433616638184, "global_step": 349570, "epoch": 2080} {"train_loss": -10.92905044555664, "global_step": 349571, "epoch": 2080} {"train_loss": -11.13541030883789, "global_step": 349572, "epoch": 2080} {"train_loss": -11.379045486450195, "global_step": 349573, "epoch": 2080} {"train_loss": -11.147233963012695, "global_step": 349574, "epoch": 2080} {"train_loss": -11.169185638427734, "global_step": 349575, "epoch": 2080} {"train_loss": -11.248945236206055, "global_step": 349576, "epoch": 2080} {"train_loss": -11.378656387329102, "global_step": 349577, "epoch": 2080} {"train_loss": -11.687753677368164, "global_step": 349578, "epoch": 2080} {"train_loss": -11.338648796081543, "global_step": 349579, "epoch": 2080} {"train_loss": -11.307635307312012, "global_step": 349580, "epoch": 2080} {"train_loss": -11.530001640319824, "global_step": 349581, "epoch": 2080} {"train_loss": -11.16334342956543, "global_step": 349582, "epoch": 2080} {"train_loss": -11.69250774383545, "global_step": 349583, "epoch": 2080} {"train_loss": -11.276458740234375, "global_step": 349584, "epoch": 2080} {"train_loss": -11.290928840637207, "global_step": 349585, "epoch": 2080} {"train_loss": -11.816926002502441, "global_step": 349586, "epoch": 2080} {"train_loss": -11.471314430236816, "global_step": 349587, "epoch": 2080} {"train_loss": -11.140629768371582, "global_step": 349588, "epoch": 2080} {"train_loss": -12.074499130249023, "global_step": 349589, "epoch": 2080} {"train_loss": -11.609323501586914, "global_step": 349590, "epoch": 2080} {"train_loss": -11.89280891418457, "global_step": 349591, "epoch": 2080} {"train_loss": -12.056022644042969, "global_step": 349592, "epoch": 2080} {"train_loss": -11.994507789611816, "global_step": 349593, "epoch": 2080} {"train_loss": -12.0030517578125, "global_step": 349594, "epoch": 2080} {"train_loss": -12.091691970825195, "global_step": 349595, "epoch": 2080} {"train_loss": -11.673957824707031, "global_step": 349596, "epoch": 2080} {"train_loss": -12.254884719848633, "global_step": 349597, "epoch": 2080} {"train_loss": -12.221449851989746, "global_step": 349598, "epoch": 2080} {"train_loss": -12.305736541748047, "global_step": 349599, "epoch": 2080} {"train_loss": -12.354690551757812, "global_step": 349600, "epoch": 2080} {"train_loss": -12.203965187072754, "global_step": 349601, "epoch": 2080} {"train_loss": -12.459514617919922, "global_step": 349602, "epoch": 2080} {"train_loss": -12.425627708435059, "global_step": 349603, "epoch": 2080} {"train_loss": -11.940869331359863, "global_step": 349604, "epoch": 2080} {"train_loss": -12.308128356933594, "global_step": 349605, "epoch": 2080} {"train_loss": -12.313727378845215, "global_step": 349606, "epoch": 2080} {"train_loss": -11.919230143229166, "global_step": 349607, "epoch": 2080, "val_loss": 287004.84375, "train_action_mse_error": 1.5453864336013794} {"train_loss": -12.325843811035156, "global_step": 349608, "epoch": 2081} {"train_loss": -12.073284149169922, "global_step": 349609, "epoch": 2081} {"train_loss": -12.256134033203125, "global_step": 349610, "epoch": 2081} {"train_loss": -12.372621536254883, "global_step": 349611, "epoch": 2081} {"train_loss": -12.170999526977539, "global_step": 349612, "epoch": 2081} {"train_loss": -12.431367874145508, "global_step": 349613, "epoch": 2081} {"train_loss": -12.282670021057129, "global_step": 349614, "epoch": 2081} {"train_loss": -12.366050720214844, "global_step": 349615, "epoch": 2081} {"train_loss": -12.447668075561523, "global_step": 349616, "epoch": 2081} {"train_loss": -12.263635635375977, "global_step": 349617, "epoch": 2081} {"train_loss": -12.214025497436523, "global_step": 349618, "epoch": 2081} {"train_loss": -12.314759254455566, "global_step": 349619, "epoch": 2081} {"train_loss": -12.556770324707031, "global_step": 349620, "epoch": 2081} {"train_loss": -12.44434928894043, "global_step": 349621, "epoch": 2081} {"train_loss": -12.505934715270996, "global_step": 349622, "epoch": 2081} {"train_loss": -12.139127731323242, "global_step": 349623, "epoch": 2081} {"train_loss": -12.589624404907227, "global_step": 349624, "epoch": 2081} {"train_loss": -12.386358261108398, "global_step": 349625, "epoch": 2081} {"train_loss": -12.575572967529297, "global_step": 349626, "epoch": 2081} {"train_loss": -12.630245208740234, "global_step": 349627, "epoch": 2081} {"train_loss": -12.51994514465332, "global_step": 349628, "epoch": 2081} {"train_loss": -12.388338088989258, "global_step": 349629, "epoch": 2081} {"train_loss": -12.576425552368164, "global_step": 349630, "epoch": 2081} {"train_loss": -12.673952102661133, "global_step": 349631, "epoch": 2081} {"train_loss": -12.430025100708008, "global_step": 349632, "epoch": 2081} {"train_loss": -12.508476257324219, "global_step": 349633, "epoch": 2081} {"train_loss": -12.583536148071289, "global_step": 349634, "epoch": 2081} {"train_loss": -12.679094314575195, "global_step": 349635, "epoch": 2081} {"train_loss": -12.639938354492188, "global_step": 349636, "epoch": 2081} {"train_loss": -12.609407424926758, "global_step": 349637, "epoch": 2081} {"train_loss": -12.383602142333984, "global_step": 349638, "epoch": 2081} {"train_loss": -12.65734577178955, "global_step": 349639, "epoch": 2081} {"train_loss": -12.50693416595459, "global_step": 349640, "epoch": 2081} {"train_loss": -12.415643692016602, "global_step": 349641, "epoch": 2081} {"train_loss": -12.464359283447266, "global_step": 349642, "epoch": 2081} {"train_loss": -12.619781494140625, "global_step": 349643, "epoch": 2081} {"train_loss": -12.486289024353027, "global_step": 349644, "epoch": 2081} {"train_loss": -12.474321365356445, "global_step": 349645, "epoch": 2081} {"train_loss": -12.403575897216797, "global_step": 349646, "epoch": 2081} {"train_loss": -12.662970542907715, "global_step": 349647, "epoch": 2081} {"train_loss": -12.346429824829102, "global_step": 349648, "epoch": 2081} {"train_loss": -12.56300163269043, "global_step": 349649, "epoch": 2081} {"train_loss": -12.352038383483887, "global_step": 349650, "epoch": 2081} {"train_loss": -12.513319969177246, "global_step": 349651, "epoch": 2081} {"train_loss": -12.197449684143066, "global_step": 349652, "epoch": 2081} {"train_loss": -11.840872764587402, "global_step": 349653, "epoch": 2081} {"train_loss": -12.583762168884277, "global_step": 349654, "epoch": 2081} {"train_loss": -12.31556510925293, "global_step": 349655, "epoch": 2081} {"train_loss": -11.905375480651855, "global_step": 349656, "epoch": 2081} {"train_loss": -12.051504135131836, "global_step": 349657, "epoch": 2081} {"train_loss": -12.531129837036133, "global_step": 349658, "epoch": 2081} {"train_loss": -11.974991798400879, "global_step": 349659, "epoch": 2081} {"train_loss": -11.417781829833984, "global_step": 349660, "epoch": 2081} {"train_loss": -12.113349914550781, "global_step": 349661, "epoch": 2081} {"train_loss": -12.441969871520996, "global_step": 349662, "epoch": 2081} {"train_loss": -12.237992286682129, "global_step": 349663, "epoch": 2081} {"train_loss": -12.099040985107422, "global_step": 349664, "epoch": 2081} {"train_loss": -12.319568634033203, "global_step": 349665, "epoch": 2081} {"train_loss": -12.494794845581055, "global_step": 349666, "epoch": 2081} {"train_loss": -12.02774429321289, "global_step": 349667, "epoch": 2081} {"train_loss": -11.99289321899414, "global_step": 349668, "epoch": 2081} {"train_loss": -12.297245979309082, "global_step": 349669, "epoch": 2081} {"train_loss": -11.978100776672363, "global_step": 349670, "epoch": 2081} {"train_loss": -12.349274635314941, "global_step": 349671, "epoch": 2081} {"train_loss": -12.148357391357422, "global_step": 349672, "epoch": 2081} {"train_loss": -12.375944137573242, "global_step": 349673, "epoch": 2081} {"train_loss": -11.905439376831055, "global_step": 349674, "epoch": 2081} {"train_loss": -12.12592887878418, "global_step": 349675, "epoch": 2081} {"train_loss": -11.501254081726074, "global_step": 349676, "epoch": 2081} {"train_loss": -11.983951568603516, "global_step": 349677, "epoch": 2081} {"train_loss": -11.339299201965332, "global_step": 349678, "epoch": 2081} {"train_loss": -12.036626815795898, "global_step": 349679, "epoch": 2081} {"train_loss": -12.437536239624023, "global_step": 349680, "epoch": 2081} {"train_loss": -12.332771301269531, "global_step": 349681, "epoch": 2081} {"train_loss": -12.50117015838623, "global_step": 349682, "epoch": 2081} {"train_loss": -12.394538879394531, "global_step": 349683, "epoch": 2081} {"train_loss": -12.403690338134766, "global_step": 349684, "epoch": 2081} {"train_loss": -12.365921020507812, "global_step": 349685, "epoch": 2081} {"train_loss": -12.327792167663574, "global_step": 349686, "epoch": 2081} {"train_loss": -12.22216510772705, "global_step": 349687, "epoch": 2081} {"train_loss": -12.105132102966309, "global_step": 349688, "epoch": 2081} {"train_loss": -12.574569702148438, "global_step": 349689, "epoch": 2081} {"train_loss": -12.469217300415039, "global_step": 349690, "epoch": 2081} {"train_loss": -12.31109619140625, "global_step": 349691, "epoch": 2081} {"train_loss": -12.022228240966797, "global_step": 349692, "epoch": 2081} {"train_loss": -12.431931495666504, "global_step": 349693, "epoch": 2081} {"train_loss": -12.044279098510742, "global_step": 349694, "epoch": 2081} {"train_loss": -12.351325988769531, "global_step": 349695, "epoch": 2081} {"train_loss": -12.181584358215332, "global_step": 349696, "epoch": 2081} {"train_loss": -12.507938385009766, "global_step": 349697, "epoch": 2081} {"train_loss": -12.2319974899292, "global_step": 349698, "epoch": 2081} {"train_loss": -12.655912399291992, "global_step": 349699, "epoch": 2081} {"train_loss": -12.16206169128418, "global_step": 349700, "epoch": 2081} {"train_loss": -12.19588851928711, "global_step": 349701, "epoch": 2081} {"train_loss": -12.471699714660645, "global_step": 349702, "epoch": 2081} {"train_loss": -12.08433723449707, "global_step": 349703, "epoch": 2081} {"train_loss": -12.42862319946289, "global_step": 349704, "epoch": 2081} {"train_loss": -12.205402374267578, "global_step": 349705, "epoch": 2081} {"train_loss": -12.44387435913086, "global_step": 349706, "epoch": 2081} {"train_loss": -12.297828674316406, "global_step": 349707, "epoch": 2081} {"train_loss": -11.969138145446777, "global_step": 349708, "epoch": 2081} {"train_loss": -11.380046844482422, "global_step": 349709, "epoch": 2081} {"train_loss": -12.099477767944336, "global_step": 349710, "epoch": 2081} {"train_loss": -12.090986251831055, "global_step": 349711, "epoch": 2081} {"train_loss": -10.254201889038086, "global_step": 349712, "epoch": 2081} {"train_loss": -9.733476638793945, "global_step": 349713, "epoch": 2081} {"train_loss": -10.216606140136719, "global_step": 349714, "epoch": 2081} {"train_loss": -10.711033821105957, "global_step": 349715, "epoch": 2081} {"train_loss": -8.961241722106934, "global_step": 349716, "epoch": 2081} {"train_loss": -9.304332733154297, "global_step": 349717, "epoch": 2081} {"train_loss": -8.582293510437012, "global_step": 349718, "epoch": 2081} {"train_loss": -7.291852951049805, "global_step": 349719, "epoch": 2081} {"train_loss": -7.523567199707031, "global_step": 349720, "epoch": 2081} {"train_loss": -7.480489730834961, "global_step": 349721, "epoch": 2081} {"train_loss": -7.5658159255981445, "global_step": 349722, "epoch": 2081} {"train_loss": -8.297243118286133, "global_step": 349723, "epoch": 2081} {"train_loss": -8.05699348449707, "global_step": 349724, "epoch": 2081} {"train_loss": -7.086831569671631, "global_step": 349725, "epoch": 2081} {"train_loss": -8.509042739868164, "global_step": 349726, "epoch": 2081} {"train_loss": -7.802173137664795, "global_step": 349727, "epoch": 2081} {"train_loss": -7.777670860290527, "global_step": 349728, "epoch": 2081} {"train_loss": -8.405889511108398, "global_step": 349729, "epoch": 2081} {"train_loss": -9.281429290771484, "global_step": 349730, "epoch": 2081} {"train_loss": -9.096065521240234, "global_step": 349731, "epoch": 2081} {"train_loss": -9.398138999938965, "global_step": 349732, "epoch": 2081} {"train_loss": -10.638208389282227, "global_step": 349733, "epoch": 2081} {"train_loss": -10.685417175292969, "global_step": 349734, "epoch": 2081} {"train_loss": -9.925483703613281, "global_step": 349735, "epoch": 2081} {"train_loss": -10.688737869262695, "global_step": 349736, "epoch": 2081} {"train_loss": -10.45449447631836, "global_step": 349737, "epoch": 2081} {"train_loss": -10.755786895751953, "global_step": 349738, "epoch": 2081} {"train_loss": -10.579290390014648, "global_step": 349739, "epoch": 2081} {"train_loss": -11.255105018615723, "global_step": 349740, "epoch": 2081} {"train_loss": -10.73147201538086, "global_step": 349741, "epoch": 2081} {"train_loss": -11.604795455932617, "global_step": 349742, "epoch": 2081} {"train_loss": -11.708641052246094, "global_step": 349743, "epoch": 2081} {"train_loss": -11.412894248962402, "global_step": 349744, "epoch": 2081} {"train_loss": -11.50614070892334, "global_step": 349745, "epoch": 2081} {"train_loss": -11.477838516235352, "global_step": 349746, "epoch": 2081} {"train_loss": -11.728438377380371, "global_step": 349747, "epoch": 2081} {"train_loss": -11.857316970825195, "global_step": 349748, "epoch": 2081} {"train_loss": -11.458539009094238, "global_step": 349749, "epoch": 2081} {"train_loss": -11.39794635772705, "global_step": 349750, "epoch": 2081} {"train_loss": -11.511655807495117, "global_step": 349751, "epoch": 2081} {"train_loss": -11.556707382202148, "global_step": 349752, "epoch": 2081} {"train_loss": -11.824316024780273, "global_step": 349753, "epoch": 2081} {"train_loss": -11.688241004943848, "global_step": 349754, "epoch": 2081} {"train_loss": -11.547201156616211, "global_step": 349755, "epoch": 2081} {"train_loss": -11.623783111572266, "global_step": 349756, "epoch": 2081} {"train_loss": -11.678873062133789, "global_step": 349757, "epoch": 2081} {"train_loss": -11.931619644165039, "global_step": 349758, "epoch": 2081} {"train_loss": -11.778400421142578, "global_step": 349759, "epoch": 2081} {"train_loss": -11.918893814086914, "global_step": 349760, "epoch": 2081} {"train_loss": -11.583089828491211, "global_step": 349761, "epoch": 2081} {"train_loss": -12.053128242492676, "global_step": 349762, "epoch": 2081} {"train_loss": -11.688044548034668, "global_step": 349763, "epoch": 2081} {"train_loss": -12.074283599853516, "global_step": 349764, "epoch": 2081} {"train_loss": -11.865772247314453, "global_step": 349765, "epoch": 2081} {"train_loss": -11.997356414794922, "global_step": 349766, "epoch": 2081} {"train_loss": -11.810568809509277, "global_step": 349767, "epoch": 2081} {"train_loss": -12.453493118286133, "global_step": 349768, "epoch": 2081} {"train_loss": -11.875714302062988, "global_step": 349769, "epoch": 2081} {"train_loss": -12.1722993850708, "global_step": 349770, "epoch": 2081} {"train_loss": -11.757503509521484, "global_step": 349771, "epoch": 2081} {"train_loss": -12.231754302978516, "global_step": 349772, "epoch": 2081} {"train_loss": -12.117645263671875, "global_step": 349773, "epoch": 2081} {"train_loss": -12.229597091674805, "global_step": 349774, "epoch": 2081} {"train_loss": -11.650659277325584, "global_step": 349775, "epoch": 2081, "val_loss": 281534.5} {"train_loss": -12.247304916381836, "global_step": 349776, "epoch": 2082} {"train_loss": -12.021722793579102, "global_step": 349777, "epoch": 2082} {"train_loss": -11.986507415771484, "global_step": 349778, "epoch": 2082} {"train_loss": -11.971271514892578, "global_step": 349779, "epoch": 2082} {"train_loss": -11.92599868774414, "global_step": 349780, "epoch": 2082} {"train_loss": -11.990646362304688, "global_step": 349781, "epoch": 2082} {"train_loss": -12.019887924194336, "global_step": 349782, "epoch": 2082} {"train_loss": -12.181636810302734, "global_step": 349783, "epoch": 2082} {"train_loss": -11.990477561950684, "global_step": 349784, "epoch": 2082} {"train_loss": -12.047603607177734, "global_step": 349785, "epoch": 2082} {"train_loss": -12.278398513793945, "global_step": 349786, "epoch": 2082} {"train_loss": -12.110908508300781, "global_step": 349787, "epoch": 2082} {"train_loss": -12.078862190246582, "global_step": 349788, "epoch": 2082} {"train_loss": -12.20566177368164, "global_step": 349789, "epoch": 2082} {"train_loss": -12.376494407653809, "global_step": 349790, "epoch": 2082} {"train_loss": -12.334785461425781, "global_step": 349791, "epoch": 2082} {"train_loss": -12.449295997619629, "global_step": 349792, "epoch": 2082} {"train_loss": -12.162015914916992, "global_step": 349793, "epoch": 2082} {"train_loss": -12.355612754821777, "global_step": 349794, "epoch": 2082} {"train_loss": -12.585079193115234, "global_step": 349795, "epoch": 2082} {"train_loss": -12.455520629882812, "global_step": 349796, "epoch": 2082} {"train_loss": -12.515768051147461, "global_step": 349797, "epoch": 2082} {"train_loss": -12.244187355041504, "global_step": 349798, "epoch": 2082} {"train_loss": -12.323695182800293, "global_step": 349799, "epoch": 2082} {"train_loss": -12.302413940429688, "global_step": 349800, "epoch": 2082} {"train_loss": -12.274518966674805, "global_step": 349801, "epoch": 2082} {"train_loss": -12.194467544555664, "global_step": 349802, "epoch": 2082} {"train_loss": -12.058022499084473, "global_step": 349803, "epoch": 2082} {"train_loss": -12.139551162719727, "global_step": 349804, "epoch": 2082} {"train_loss": -12.236189842224121, "global_step": 349805, "epoch": 2082} {"train_loss": -11.987762451171875, "global_step": 349806, "epoch": 2082} {"train_loss": -12.511265754699707, "global_step": 349807, "epoch": 2082} {"train_loss": -12.396116256713867, "global_step": 349808, "epoch": 2082} {"train_loss": -12.309330940246582, "global_step": 349809, "epoch": 2082} {"train_loss": -12.554129600524902, "global_step": 349810, "epoch": 2082} {"train_loss": -11.977694511413574, "global_step": 349811, "epoch": 2082} {"train_loss": -12.24911880493164, "global_step": 349812, "epoch": 2082} {"train_loss": -11.636366844177246, "global_step": 349813, "epoch": 2082} {"train_loss": -11.899426460266113, "global_step": 349814, "epoch": 2082} {"train_loss": -11.508180618286133, "global_step": 349815, "epoch": 2082} {"train_loss": -12.139578819274902, "global_step": 349816, "epoch": 2082} {"train_loss": -10.375977516174316, "global_step": 349817, "epoch": 2082} {"train_loss": -11.379691123962402, "global_step": 349818, "epoch": 2082} {"train_loss": -12.031461715698242, "global_step": 349819, "epoch": 2082} {"train_loss": -11.423529624938965, "global_step": 349820, "epoch": 2082} {"train_loss": -11.724371910095215, "global_step": 349821, "epoch": 2082} {"train_loss": -10.99161148071289, "global_step": 349822, "epoch": 2082} {"train_loss": -11.93668270111084, "global_step": 349823, "epoch": 2082} {"train_loss": -11.269553184509277, "global_step": 349824, "epoch": 2082} {"train_loss": -11.61994743347168, "global_step": 349825, "epoch": 2082} {"train_loss": -11.613851547241211, "global_step": 349826, "epoch": 2082} {"train_loss": -11.486205101013184, "global_step": 349827, "epoch": 2082} {"train_loss": -11.778413772583008, "global_step": 349828, "epoch": 2082} {"train_loss": -11.424678802490234, "global_step": 349829, "epoch": 2082} {"train_loss": -12.035561561584473, "global_step": 349830, "epoch": 2082} {"train_loss": -11.522161483764648, "global_step": 349831, "epoch": 2082} {"train_loss": -11.62702751159668, "global_step": 349832, "epoch": 2082} {"train_loss": -12.093019485473633, "global_step": 349833, "epoch": 2082} {"train_loss": -11.47348403930664, "global_step": 349834, "epoch": 2082} {"train_loss": -12.260972023010254, "global_step": 349835, "epoch": 2082} {"train_loss": -11.957475662231445, "global_step": 349836, "epoch": 2082} {"train_loss": -11.615699768066406, "global_step": 349837, "epoch": 2082} {"train_loss": -12.410697937011719, "global_step": 349838, "epoch": 2082} {"train_loss": -11.561506271362305, "global_step": 349839, "epoch": 2082} {"train_loss": -11.428357124328613, "global_step": 349840, "epoch": 2082} {"train_loss": -11.541369438171387, "global_step": 349841, "epoch": 2082} {"train_loss": -12.20879077911377, "global_step": 349842, "epoch": 2082} {"train_loss": -12.057720184326172, "global_step": 349843, "epoch": 2082} {"train_loss": -12.156936645507812, "global_step": 349844, "epoch": 2082} {"train_loss": -12.308259963989258, "global_step": 349845, "epoch": 2082} {"train_loss": -11.857056617736816, "global_step": 349846, "epoch": 2082} {"train_loss": -12.281076431274414, "global_step": 349847, "epoch": 2082} {"train_loss": -11.984774589538574, "global_step": 349848, "epoch": 2082} {"train_loss": -12.17685604095459, "global_step": 349849, "epoch": 2082} {"train_loss": -12.357450485229492, "global_step": 349850, "epoch": 2082} {"train_loss": -11.916853904724121, "global_step": 349851, "epoch": 2082} {"train_loss": -12.43083381652832, "global_step": 349852, "epoch": 2082} {"train_loss": -12.180975914001465, "global_step": 349853, "epoch": 2082} {"train_loss": -12.658914566040039, "global_step": 349854, "epoch": 2082} {"train_loss": -12.168949127197266, "global_step": 349855, "epoch": 2082} {"train_loss": -12.378912925720215, "global_step": 349856, "epoch": 2082} {"train_loss": -12.025838851928711, "global_step": 349857, "epoch": 2082} {"train_loss": -12.339254379272461, "global_step": 349858, "epoch": 2082} {"train_loss": -11.89647102355957, "global_step": 349859, "epoch": 2082} {"train_loss": -12.411160469055176, "global_step": 349860, "epoch": 2082} {"train_loss": -12.08837890625, "global_step": 349861, "epoch": 2082} {"train_loss": -11.997478485107422, "global_step": 349862, "epoch": 2082} {"train_loss": -11.932821273803711, "global_step": 349863, "epoch": 2082} {"train_loss": -12.03874397277832, "global_step": 349864, "epoch": 2082} {"train_loss": -11.569025039672852, "global_step": 349865, "epoch": 2082} {"train_loss": -12.296645164489746, "global_step": 349866, "epoch": 2082} {"train_loss": -11.624818801879883, "global_step": 349867, "epoch": 2082} {"train_loss": -12.40594482421875, "global_step": 349868, "epoch": 2082} {"train_loss": -11.948209762573242, "global_step": 349869, "epoch": 2082} {"train_loss": -11.861001968383789, "global_step": 349870, "epoch": 2082} {"train_loss": -11.960084915161133, "global_step": 349871, "epoch": 2082} {"train_loss": -12.49265193939209, "global_step": 349872, "epoch": 2082} {"train_loss": -11.979597091674805, "global_step": 349873, "epoch": 2082} {"train_loss": -12.090812683105469, "global_step": 349874, "epoch": 2082} {"train_loss": -12.255083084106445, "global_step": 349875, "epoch": 2082} {"train_loss": -12.141246795654297, "global_step": 349876, "epoch": 2082} {"train_loss": -12.24991512298584, "global_step": 349877, "epoch": 2082} {"train_loss": -12.13006591796875, "global_step": 349878, "epoch": 2082} {"train_loss": -12.05910873413086, "global_step": 349879, "epoch": 2082} {"train_loss": -12.304908752441406, "global_step": 349880, "epoch": 2082} {"train_loss": -12.232247352600098, "global_step": 349881, "epoch": 2082} {"train_loss": -12.197418212890625, "global_step": 349882, "epoch": 2082} {"train_loss": -12.040081024169922, "global_step": 349883, "epoch": 2082} {"train_loss": -10.910669326782227, "global_step": 349884, "epoch": 2082} {"train_loss": -11.997478485107422, "global_step": 349885, "epoch": 2082} {"train_loss": -11.06977367401123, "global_step": 349886, "epoch": 2082} {"train_loss": -11.762271881103516, "global_step": 349887, "epoch": 2082} {"train_loss": -10.961159706115723, "global_step": 349888, "epoch": 2082} {"train_loss": -10.471050262451172, "global_step": 349889, "epoch": 2082} {"train_loss": -11.531930923461914, "global_step": 349890, "epoch": 2082} {"train_loss": -11.792537689208984, "global_step": 349891, "epoch": 2082} {"train_loss": -11.800742149353027, "global_step": 349892, "epoch": 2082} {"train_loss": -10.996319770812988, "global_step": 349893, "epoch": 2082} {"train_loss": -11.264410018920898, "global_step": 349894, "epoch": 2082} {"train_loss": -11.654449462890625, "global_step": 349895, "epoch": 2082} {"train_loss": -11.184188842773438, "global_step": 349896, "epoch": 2082} {"train_loss": -11.40186882019043, "global_step": 349897, "epoch": 2082} {"train_loss": -11.531037330627441, "global_step": 349898, "epoch": 2082} {"train_loss": -11.537179946899414, "global_step": 349899, "epoch": 2082} {"train_loss": -11.617042541503906, "global_step": 349900, "epoch": 2082} {"train_loss": -11.120054244995117, "global_step": 349901, "epoch": 2082} {"train_loss": -10.993585586547852, "global_step": 349902, "epoch": 2082} {"train_loss": -12.110913276672363, "global_step": 349903, "epoch": 2082} {"train_loss": -11.066542625427246, "global_step": 349904, "epoch": 2082} {"train_loss": -11.87921142578125, "global_step": 349905, "epoch": 2082} {"train_loss": -10.822151184082031, "global_step": 349906, "epoch": 2082} {"train_loss": -11.02767562866211, "global_step": 349907, "epoch": 2082} {"train_loss": -11.63505744934082, "global_step": 349908, "epoch": 2082} {"train_loss": -11.923471450805664, "global_step": 349909, "epoch": 2082} {"train_loss": -11.851126670837402, "global_step": 349910, "epoch": 2082} {"train_loss": -11.034847259521484, "global_step": 349911, "epoch": 2082} {"train_loss": -11.802043914794922, "global_step": 349912, "epoch": 2082} {"train_loss": -11.173181533813477, "global_step": 349913, "epoch": 2082} {"train_loss": -11.76585865020752, "global_step": 349914, "epoch": 2082} {"train_loss": -11.18361759185791, "global_step": 349915, "epoch": 2082} {"train_loss": -11.222939491271973, "global_step": 349916, "epoch": 2082} {"train_loss": -12.112919807434082, "global_step": 349917, "epoch": 2082} {"train_loss": -10.36564826965332, "global_step": 349918, "epoch": 2082} {"train_loss": -12.183279991149902, "global_step": 349919, "epoch": 2082} {"train_loss": -10.783288955688477, "global_step": 349920, "epoch": 2082} {"train_loss": -11.56856632232666, "global_step": 349921, "epoch": 2082} {"train_loss": -11.214845657348633, "global_step": 349922, "epoch": 2082} {"train_loss": -10.933414459228516, "global_step": 349923, "epoch": 2082} {"train_loss": -11.626514434814453, "global_step": 349924, "epoch": 2082} {"train_loss": -10.429677963256836, "global_step": 349925, "epoch": 2082} {"train_loss": -11.937808990478516, "global_step": 349926, "epoch": 2082} {"train_loss": -10.904022216796875, "global_step": 349927, "epoch": 2082} {"train_loss": -11.292623519897461, "global_step": 349928, "epoch": 2082} {"train_loss": -11.003328323364258, "global_step": 349929, "epoch": 2082} {"train_loss": -11.30417251586914, "global_step": 349930, "epoch": 2082} {"train_loss": -11.314325332641602, "global_step": 349931, "epoch": 2082} {"train_loss": -12.138040542602539, "global_step": 349932, "epoch": 2082} {"train_loss": -11.296915054321289, "global_step": 349933, "epoch": 2082} {"train_loss": -12.225180625915527, "global_step": 349934, "epoch": 2082} {"train_loss": -11.623058319091797, "global_step": 349935, "epoch": 2082} {"train_loss": -12.134875297546387, "global_step": 349936, "epoch": 2082} {"train_loss": -11.641963958740234, "global_step": 349937, "epoch": 2082} {"train_loss": -12.05668830871582, "global_step": 349938, "epoch": 2082} {"train_loss": -11.801843643188477, "global_step": 349939, "epoch": 2082} {"train_loss": -12.211816787719727, "global_step": 349940, "epoch": 2082} {"train_loss": -11.768306732177734, "global_step": 349941, "epoch": 2082} {"train_loss": -12.160491943359375, "global_step": 349942, "epoch": 2082} {"train_loss": -11.829429626464844, "global_step": 349943, "epoch": 2082, "val_loss": 290633.84375} {"train_loss": -12.183338165283203, "global_step": 349944, "epoch": 2083} {"train_loss": -11.75212287902832, "global_step": 349945, "epoch": 2083} {"train_loss": -12.181671142578125, "global_step": 349946, "epoch": 2083} {"train_loss": -12.04339599609375, "global_step": 349947, "epoch": 2083} {"train_loss": -12.295759201049805, "global_step": 349948, "epoch": 2083} {"train_loss": -12.263633728027344, "global_step": 349949, "epoch": 2083} {"train_loss": -12.278175354003906, "global_step": 349950, "epoch": 2083} {"train_loss": -12.36098861694336, "global_step": 349951, "epoch": 2083} {"train_loss": -12.243136405944824, "global_step": 349952, "epoch": 2083} {"train_loss": -12.287321090698242, "global_step": 349953, "epoch": 2083} {"train_loss": -12.377509117126465, "global_step": 349954, "epoch": 2083} {"train_loss": -12.25186824798584, "global_step": 349955, "epoch": 2083} {"train_loss": -12.324859619140625, "global_step": 349956, "epoch": 2083} {"train_loss": -12.172983169555664, "global_step": 349957, "epoch": 2083} {"train_loss": -12.111632347106934, "global_step": 349958, "epoch": 2083} {"train_loss": -12.247902870178223, "global_step": 349959, "epoch": 2083} {"train_loss": -12.405166625976562, "global_step": 349960, "epoch": 2083} {"train_loss": -12.267948150634766, "global_step": 349961, "epoch": 2083} {"train_loss": -12.276362419128418, "global_step": 349962, "epoch": 2083} {"train_loss": -12.187037467956543, "global_step": 349963, "epoch": 2083} {"train_loss": -12.276739120483398, "global_step": 349964, "epoch": 2083} {"train_loss": -12.463528633117676, "global_step": 349965, "epoch": 2083} {"train_loss": -12.280606269836426, "global_step": 349966, "epoch": 2083} {"train_loss": -12.396675109863281, "global_step": 349967, "epoch": 2083} {"train_loss": -12.341702461242676, "global_step": 349968, "epoch": 2083} {"train_loss": -12.542448997497559, "global_step": 349969, "epoch": 2083} {"train_loss": -12.455900192260742, "global_step": 349970, "epoch": 2083} {"train_loss": -12.227344512939453, "global_step": 349971, "epoch": 2083} {"train_loss": -12.358851432800293, "global_step": 349972, "epoch": 2083} {"train_loss": -12.357763290405273, "global_step": 349973, "epoch": 2083} {"train_loss": -12.447851181030273, "global_step": 349974, "epoch": 2083} {"train_loss": -12.441162109375, "global_step": 349975, "epoch": 2083} {"train_loss": -12.309553146362305, "global_step": 349976, "epoch": 2083} {"train_loss": -12.262771606445312, "global_step": 349977, "epoch": 2083} {"train_loss": -12.518351554870605, "global_step": 349978, "epoch": 2083} {"train_loss": -12.354260444641113, "global_step": 349979, "epoch": 2083} {"train_loss": -12.174092292785645, "global_step": 349980, "epoch": 2083} {"train_loss": -12.664779663085938, "global_step": 349981, "epoch": 2083} {"train_loss": -12.22910213470459, "global_step": 349982, "epoch": 2083} {"train_loss": -12.618284225463867, "global_step": 349983, "epoch": 2083} {"train_loss": -12.742316246032715, "global_step": 349984, "epoch": 2083} {"train_loss": -12.57409954071045, "global_step": 349985, "epoch": 2083} {"train_loss": -12.35598373413086, "global_step": 349986, "epoch": 2083} {"train_loss": -12.292654037475586, "global_step": 349987, "epoch": 2083} {"train_loss": -12.462493896484375, "global_step": 349988, "epoch": 2083} {"train_loss": -12.568855285644531, "global_step": 349989, "epoch": 2083} {"train_loss": -12.43316650390625, "global_step": 349990, "epoch": 2083} {"train_loss": -12.625329971313477, "global_step": 349991, "epoch": 2083} {"train_loss": -12.328567504882812, "global_step": 349992, "epoch": 2083} {"train_loss": -12.646584510803223, "global_step": 349993, "epoch": 2083} {"train_loss": -12.479005813598633, "global_step": 349994, "epoch": 2083} {"train_loss": -12.679814338684082, "global_step": 349995, "epoch": 2083} {"train_loss": -12.53441333770752, "global_step": 349996, "epoch": 2083} {"train_loss": -12.738801002502441, "global_step": 349997, "epoch": 2083} {"train_loss": -12.586895942687988, "global_step": 349998, "epoch": 2083} {"train_loss": -12.501681327819824, "global_step": 349999, "epoch": 2083} {"train_loss": -12.509841918945312, "global_step": 350000, "epoch": 2083} {"train_loss": -12.61988639831543, "global_step": 350001, "epoch": 2083} {"train_loss": -12.277116775512695, "global_step": 350002, "epoch": 2083} {"train_loss": -12.453034400939941, "global_step": 350003, "epoch": 2083} {"train_loss": -12.60443115234375, "global_step": 350004, "epoch": 2083} {"train_loss": -12.503549575805664, "global_step": 350005, "epoch": 2083} {"train_loss": -12.373342514038086, "global_step": 350006, "epoch": 2083} {"train_loss": -12.522117614746094, "global_step": 350007, "epoch": 2083} {"train_loss": -12.80643081665039, "global_step": 350008, "epoch": 2083} {"train_loss": -12.489856719970703, "global_step": 350009, "epoch": 2083} {"train_loss": -12.29941177368164, "global_step": 350010, "epoch": 2083} {"train_loss": -12.289191246032715, "global_step": 350011, "epoch": 2083} {"train_loss": -11.772987365722656, "global_step": 350012, "epoch": 2083} {"train_loss": -11.929952621459961, "global_step": 350013, "epoch": 2083} {"train_loss": -11.651718139648438, "global_step": 350014, "epoch": 2083} {"train_loss": -12.231359481811523, "global_step": 350015, "epoch": 2083} {"train_loss": -10.48062515258789, "global_step": 350016, "epoch": 2083} {"train_loss": -12.226652145385742, "global_step": 350017, "epoch": 2083} {"train_loss": -11.241531372070312, "global_step": 350018, "epoch": 2083} {"train_loss": -11.268234252929688, "global_step": 350019, "epoch": 2083} {"train_loss": -10.733831405639648, "global_step": 350020, "epoch": 2083} {"train_loss": -12.605133056640625, "global_step": 350021, "epoch": 2083} {"train_loss": -11.18671989440918, "global_step": 350022, "epoch": 2083} {"train_loss": -11.874256134033203, "global_step": 350023, "epoch": 2083} {"train_loss": -11.73379135131836, "global_step": 350024, "epoch": 2083} {"train_loss": -12.008241653442383, "global_step": 350025, "epoch": 2083} {"train_loss": -10.35624885559082, "global_step": 350026, "epoch": 2083} {"train_loss": -11.5350341796875, "global_step": 350027, "epoch": 2083} {"train_loss": -10.965774536132812, "global_step": 350028, "epoch": 2083} {"train_loss": -9.900884628295898, "global_step": 350029, "epoch": 2083} {"train_loss": -12.26761245727539, "global_step": 350030, "epoch": 2083} {"train_loss": -9.065633773803711, "global_step": 350031, "epoch": 2083} {"train_loss": -11.340479850769043, "global_step": 350032, "epoch": 2083} {"train_loss": -10.039692878723145, "global_step": 350033, "epoch": 2083} {"train_loss": -11.759153366088867, "global_step": 350034, "epoch": 2083} {"train_loss": -10.919090270996094, "global_step": 350035, "epoch": 2083} {"train_loss": -10.828265190124512, "global_step": 350036, "epoch": 2083} {"train_loss": -11.271836280822754, "global_step": 350037, "epoch": 2083} {"train_loss": -10.021526336669922, "global_step": 350038, "epoch": 2083} {"train_loss": -11.540122985839844, "global_step": 350039, "epoch": 2083} {"train_loss": -9.919017791748047, "global_step": 350040, "epoch": 2083} {"train_loss": -11.853278160095215, "global_step": 350041, "epoch": 2083} {"train_loss": -11.112316131591797, "global_step": 350042, "epoch": 2083} {"train_loss": -11.814579010009766, "global_step": 350043, "epoch": 2083} {"train_loss": -11.13830280303955, "global_step": 350044, "epoch": 2083} {"train_loss": -11.46899700164795, "global_step": 350045, "epoch": 2083} {"train_loss": -11.853631973266602, "global_step": 350046, "epoch": 2083} {"train_loss": -11.488977432250977, "global_step": 350047, "epoch": 2083} {"train_loss": -11.951238632202148, "global_step": 350048, "epoch": 2083} {"train_loss": -11.779041290283203, "global_step": 350049, "epoch": 2083} {"train_loss": -11.983566284179688, "global_step": 350050, "epoch": 2083} {"train_loss": -12.040815353393555, "global_step": 350051, "epoch": 2083} {"train_loss": -11.29336929321289, "global_step": 350052, "epoch": 2083} {"train_loss": -12.019876480102539, "global_step": 350053, "epoch": 2083} {"train_loss": -11.816357612609863, "global_step": 350054, "epoch": 2083} {"train_loss": -12.054203033447266, "global_step": 350055, "epoch": 2083} {"train_loss": -12.196718215942383, "global_step": 350056, "epoch": 2083} {"train_loss": -11.719100952148438, "global_step": 350057, "epoch": 2083} {"train_loss": -12.114846229553223, "global_step": 350058, "epoch": 2083} {"train_loss": -11.945436477661133, "global_step": 350059, "epoch": 2083} {"train_loss": -12.25135612487793, "global_step": 350060, "epoch": 2083} {"train_loss": -12.15362548828125, "global_step": 350061, "epoch": 2083} {"train_loss": -12.351024627685547, "global_step": 350062, "epoch": 2083} {"train_loss": -12.43814468383789, "global_step": 350063, "epoch": 2083} {"train_loss": -12.201827049255371, "global_step": 350064, "epoch": 2083} {"train_loss": -12.24303150177002, "global_step": 350065, "epoch": 2083} {"train_loss": -12.553531646728516, "global_step": 350066, "epoch": 2083} {"train_loss": -12.469352722167969, "global_step": 350067, "epoch": 2083} {"train_loss": -12.284116744995117, "global_step": 350068, "epoch": 2083} {"train_loss": -12.359591484069824, "global_step": 350069, "epoch": 2083} {"train_loss": -12.206470489501953, "global_step": 350070, "epoch": 2083} {"train_loss": -12.423310279846191, "global_step": 350071, "epoch": 2083} {"train_loss": -12.358251571655273, "global_step": 350072, "epoch": 2083} {"train_loss": -12.152174949645996, "global_step": 350073, "epoch": 2083} {"train_loss": -12.547294616699219, "global_step": 350074, "epoch": 2083} {"train_loss": -12.584663391113281, "global_step": 350075, "epoch": 2083} {"train_loss": -12.294205665588379, "global_step": 350076, "epoch": 2083} {"train_loss": -12.596549034118652, "global_step": 350077, "epoch": 2083} {"train_loss": -12.350852012634277, "global_step": 350078, "epoch": 2083} {"train_loss": -12.476116180419922, "global_step": 350079, "epoch": 2083} {"train_loss": -12.5001220703125, "global_step": 350080, "epoch": 2083} {"train_loss": -12.221464157104492, "global_step": 350081, "epoch": 2083} {"train_loss": -12.537559509277344, "global_step": 350082, "epoch": 2083} {"train_loss": -12.483602523803711, "global_step": 350083, "epoch": 2083} {"train_loss": -12.361004829406738, "global_step": 350084, "epoch": 2083} {"train_loss": -12.33886432647705, "global_step": 350085, "epoch": 2083} {"train_loss": -12.534221649169922, "global_step": 350086, "epoch": 2083} {"train_loss": -12.412233352661133, "global_step": 350087, "epoch": 2083} {"train_loss": -12.355082511901855, "global_step": 350088, "epoch": 2083} {"train_loss": -12.61575698852539, "global_step": 350089, "epoch": 2083} {"train_loss": -12.429433822631836, "global_step": 350090, "epoch": 2083} {"train_loss": -12.45273208618164, "global_step": 350091, "epoch": 2083} {"train_loss": -12.458707809448242, "global_step": 350092, "epoch": 2083} {"train_loss": -12.435345649719238, "global_step": 350093, "epoch": 2083} {"train_loss": -12.228547096252441, "global_step": 350094, "epoch": 2083} {"train_loss": -12.729499816894531, "global_step": 350095, "epoch": 2083} {"train_loss": -12.106241226196289, "global_step": 350096, "epoch": 2083} {"train_loss": -12.322876930236816, "global_step": 350097, "epoch": 2083} {"train_loss": -12.35531234741211, "global_step": 350098, "epoch": 2083} {"train_loss": -12.632080078125, "global_step": 350099, "epoch": 2083} {"train_loss": -12.322011947631836, "global_step": 350100, "epoch": 2083} {"train_loss": -12.338218688964844, "global_step": 350101, "epoch": 2083} {"train_loss": -12.617971420288086, "global_step": 350102, "epoch": 2083} {"train_loss": -12.338278770446777, "global_step": 350103, "epoch": 2083} {"train_loss": -12.14042854309082, "global_step": 350104, "epoch": 2083} {"train_loss": -12.639495849609375, "global_step": 350105, "epoch": 2083} {"train_loss": -12.431373596191406, "global_step": 350106, "epoch": 2083} {"train_loss": -12.383434295654297, "global_step": 350107, "epoch": 2083} {"train_loss": -12.421552658081055, "global_step": 350108, "epoch": 2083} {"train_loss": -12.460235595703125, "global_step": 350109, "epoch": 2083} {"train_loss": -12.260505676269531, "global_step": 350110, "epoch": 2083} {"train_loss": -12.116453085626874, "global_step": 350111, "epoch": 2083, "val_loss": 286944.125} {"train_loss": -12.084615707397461, "global_step": 350112, "epoch": 2084} {"train_loss": -12.620172500610352, "global_step": 350113, "epoch": 2084} {"train_loss": -12.096794128417969, "global_step": 350114, "epoch": 2084} {"train_loss": -11.979935646057129, "global_step": 350115, "epoch": 2084} {"train_loss": -12.397911071777344, "global_step": 350116, "epoch": 2084} {"train_loss": -11.949068069458008, "global_step": 350117, "epoch": 2084} {"train_loss": -12.837451934814453, "global_step": 350118, "epoch": 2084} {"train_loss": -12.126504898071289, "global_step": 350119, "epoch": 2084} {"train_loss": -12.69377326965332, "global_step": 350120, "epoch": 2084} {"train_loss": -12.387214660644531, "global_step": 350121, "epoch": 2084} {"train_loss": -11.664422988891602, "global_step": 350122, "epoch": 2084} {"train_loss": -11.180168151855469, "global_step": 350123, "epoch": 2084} {"train_loss": -10.789490699768066, "global_step": 350124, "epoch": 2084} {"train_loss": -11.964035034179688, "global_step": 350125, "epoch": 2084} {"train_loss": -11.908105850219727, "global_step": 350126, "epoch": 2084} {"train_loss": -9.719598770141602, "global_step": 350127, "epoch": 2084} {"train_loss": -11.987045288085938, "global_step": 350128, "epoch": 2084} {"train_loss": -10.821049690246582, "global_step": 350129, "epoch": 2084} {"train_loss": -9.974466323852539, "global_step": 350130, "epoch": 2084} {"train_loss": -11.735172271728516, "global_step": 350131, "epoch": 2084} {"train_loss": -8.659194946289062, "global_step": 350132, "epoch": 2084} {"train_loss": -11.26376724243164, "global_step": 350133, "epoch": 2084} {"train_loss": -8.66445255279541, "global_step": 350134, "epoch": 2084} {"train_loss": -7.986896514892578, "global_step": 350135, "epoch": 2084} {"train_loss": -7.587881088256836, "global_step": 350136, "epoch": 2084} {"train_loss": -7.995192527770996, "global_step": 350137, "epoch": 2084} {"train_loss": -9.209513664245605, "global_step": 350138, "epoch": 2084} {"train_loss": -8.361130714416504, "global_step": 350139, "epoch": 2084} {"train_loss": -8.516592979431152, "global_step": 350140, "epoch": 2084} {"train_loss": -8.888099670410156, "global_step": 350141, "epoch": 2084} {"train_loss": -10.314963340759277, "global_step": 350142, "epoch": 2084} {"train_loss": -9.861702919006348, "global_step": 350143, "epoch": 2084} {"train_loss": -9.185768127441406, "global_step": 350144, "epoch": 2084} {"train_loss": -10.339916229248047, "global_step": 350145, "epoch": 2084} {"train_loss": -10.898284912109375, "global_step": 350146, "epoch": 2084} {"train_loss": -9.919891357421875, "global_step": 350147, "epoch": 2084} {"train_loss": -10.225425720214844, "global_step": 350148, "epoch": 2084} {"train_loss": -10.928351402282715, "global_step": 350149, "epoch": 2084} {"train_loss": -10.293424606323242, "global_step": 350150, "epoch": 2084} {"train_loss": -11.097049713134766, "global_step": 350151, "epoch": 2084} {"train_loss": -10.93427848815918, "global_step": 350152, "epoch": 2084} {"train_loss": -10.364204406738281, "global_step": 350153, "epoch": 2084} {"train_loss": -10.960285186767578, "global_step": 350154, "epoch": 2084} {"train_loss": -10.50028133392334, "global_step": 350155, "epoch": 2084} {"train_loss": -10.79159927368164, "global_step": 350156, "epoch": 2084} {"train_loss": -10.82808780670166, "global_step": 350157, "epoch": 2084} {"train_loss": -11.69913101196289, "global_step": 350158, "epoch": 2084} {"train_loss": -10.866305351257324, "global_step": 350159, "epoch": 2084} {"train_loss": -11.01482105255127, "global_step": 350160, "epoch": 2084} {"train_loss": -11.402714729309082, "global_step": 350161, "epoch": 2084} {"train_loss": -10.195127487182617, "global_step": 350162, "epoch": 2084} {"train_loss": -11.156730651855469, "global_step": 350163, "epoch": 2084} {"train_loss": -11.376888275146484, "global_step": 350164, "epoch": 2084} {"train_loss": -10.88425064086914, "global_step": 350165, "epoch": 2084} {"train_loss": -10.814470291137695, "global_step": 350166, "epoch": 2084} {"train_loss": -10.566000938415527, "global_step": 350167, "epoch": 2084} {"train_loss": -10.4464111328125, "global_step": 350168, "epoch": 2084} {"train_loss": -10.970632553100586, "global_step": 350169, "epoch": 2084} {"train_loss": -10.5252685546875, "global_step": 350170, "epoch": 2084} {"train_loss": -11.239788055419922, "global_step": 350171, "epoch": 2084} {"train_loss": -11.456799507141113, "global_step": 350172, "epoch": 2084} {"train_loss": -11.420194625854492, "global_step": 350173, "epoch": 2084} {"train_loss": -11.490367889404297, "global_step": 350174, "epoch": 2084} {"train_loss": -11.571592330932617, "global_step": 350175, "epoch": 2084} {"train_loss": -11.268360137939453, "global_step": 350176, "epoch": 2084} {"train_loss": -11.611186981201172, "global_step": 350177, "epoch": 2084} {"train_loss": -11.247031211853027, "global_step": 350178, "epoch": 2084} {"train_loss": -11.661402702331543, "global_step": 350179, "epoch": 2084} {"train_loss": -11.52260971069336, "global_step": 350180, "epoch": 2084} {"train_loss": -11.374454498291016, "global_step": 350181, "epoch": 2084} {"train_loss": -11.825272560119629, "global_step": 350182, "epoch": 2084} {"train_loss": -11.952028274536133, "global_step": 350183, "epoch": 2084} {"train_loss": -11.55428695678711, "global_step": 350184, "epoch": 2084} {"train_loss": -11.751401901245117, "global_step": 350185, "epoch": 2084} {"train_loss": -11.657703399658203, "global_step": 350186, "epoch": 2084} {"train_loss": -12.017363548278809, "global_step": 350187, "epoch": 2084} {"train_loss": -11.809457778930664, "global_step": 350188, "epoch": 2084} {"train_loss": -11.914957046508789, "global_step": 350189, "epoch": 2084} {"train_loss": -12.145530700683594, "global_step": 350190, "epoch": 2084} {"train_loss": -11.71921157836914, "global_step": 350191, "epoch": 2084} {"train_loss": -11.791886329650879, "global_step": 350192, "epoch": 2084} {"train_loss": -11.975236892700195, "global_step": 350193, "epoch": 2084} {"train_loss": -11.929365158081055, "global_step": 350194, "epoch": 2084} {"train_loss": -12.098978042602539, "global_step": 350195, "epoch": 2084} {"train_loss": -11.959372520446777, "global_step": 350196, "epoch": 2084} {"train_loss": -12.00340461730957, "global_step": 350197, "epoch": 2084} {"train_loss": -11.826003074645996, "global_step": 350198, "epoch": 2084} {"train_loss": -12.249290466308594, "global_step": 350199, "epoch": 2084} {"train_loss": -11.90933895111084, "global_step": 350200, "epoch": 2084} {"train_loss": -11.87834644317627, "global_step": 350201, "epoch": 2084} {"train_loss": -11.957242012023926, "global_step": 350202, "epoch": 2084} {"train_loss": -12.28309440612793, "global_step": 350203, "epoch": 2084} {"train_loss": -12.109613418579102, "global_step": 350204, "epoch": 2084} {"train_loss": -12.180697441101074, "global_step": 350205, "epoch": 2084} {"train_loss": -12.05459976196289, "global_step": 350206, "epoch": 2084} {"train_loss": -11.87453556060791, "global_step": 350207, "epoch": 2084} {"train_loss": -12.237983703613281, "global_step": 350208, "epoch": 2084} {"train_loss": -12.140678405761719, "global_step": 350209, "epoch": 2084} {"train_loss": -12.318778991699219, "global_step": 350210, "epoch": 2084} {"train_loss": -12.089884757995605, "global_step": 350211, "epoch": 2084} {"train_loss": -12.200091361999512, "global_step": 350212, "epoch": 2084} {"train_loss": -12.18679428100586, "global_step": 350213, "epoch": 2084} {"train_loss": -12.326704025268555, "global_step": 350214, "epoch": 2084} {"train_loss": -12.214982986450195, "global_step": 350215, "epoch": 2084} {"train_loss": -12.059558868408203, "global_step": 350216, "epoch": 2084} {"train_loss": -12.524473190307617, "global_step": 350217, "epoch": 2084} {"train_loss": -12.226847648620605, "global_step": 350218, "epoch": 2084} {"train_loss": -12.141559600830078, "global_step": 350219, "epoch": 2084} {"train_loss": -12.478455543518066, "global_step": 350220, "epoch": 2084} {"train_loss": -12.367576599121094, "global_step": 350221, "epoch": 2084} {"train_loss": -12.209936141967773, "global_step": 350222, "epoch": 2084} {"train_loss": -12.352568626403809, "global_step": 350223, "epoch": 2084} {"train_loss": -12.258638381958008, "global_step": 350224, "epoch": 2084} {"train_loss": -12.432378768920898, "global_step": 350225, "epoch": 2084} {"train_loss": -12.425834655761719, "global_step": 350226, "epoch": 2084} {"train_loss": -12.278305053710938, "global_step": 350227, "epoch": 2084} {"train_loss": -12.314189910888672, "global_step": 350228, "epoch": 2084} {"train_loss": -12.486766815185547, "global_step": 350229, "epoch": 2084} {"train_loss": -12.296056747436523, "global_step": 350230, "epoch": 2084} {"train_loss": -12.39425277709961, "global_step": 350231, "epoch": 2084} {"train_loss": -12.347702026367188, "global_step": 350232, "epoch": 2084} {"train_loss": -12.237834930419922, "global_step": 350233, "epoch": 2084} {"train_loss": -12.246147155761719, "global_step": 350234, "epoch": 2084} {"train_loss": -12.146492004394531, "global_step": 350235, "epoch": 2084} {"train_loss": -12.234201431274414, "global_step": 350236, "epoch": 2084} {"train_loss": -12.029820442199707, "global_step": 350237, "epoch": 2084} {"train_loss": -12.200931549072266, "global_step": 350238, "epoch": 2084} {"train_loss": -12.340457916259766, "global_step": 350239, "epoch": 2084} {"train_loss": -12.055007934570312, "global_step": 350240, "epoch": 2084} {"train_loss": -11.341941833496094, "global_step": 350241, "epoch": 2084} {"train_loss": -12.413129806518555, "global_step": 350242, "epoch": 2084} {"train_loss": -11.079447746276855, "global_step": 350243, "epoch": 2084} {"train_loss": -10.934022903442383, "global_step": 350244, "epoch": 2084} {"train_loss": -12.034137725830078, "global_step": 350245, "epoch": 2084} {"train_loss": -11.437055587768555, "global_step": 350246, "epoch": 2084} {"train_loss": -11.205792427062988, "global_step": 350247, "epoch": 2084} {"train_loss": -11.601235389709473, "global_step": 350248, "epoch": 2084} {"train_loss": -12.048334121704102, "global_step": 350249, "epoch": 2084} {"train_loss": -11.793183326721191, "global_step": 350250, "epoch": 2084} {"train_loss": -12.236751556396484, "global_step": 350251, "epoch": 2084} {"train_loss": -11.750117301940918, "global_step": 350252, "epoch": 2084} {"train_loss": -12.234321594238281, "global_step": 350253, "epoch": 2084} {"train_loss": -11.70058822631836, "global_step": 350254, "epoch": 2084} {"train_loss": -12.381431579589844, "global_step": 350255, "epoch": 2084} {"train_loss": -12.305803298950195, "global_step": 350256, "epoch": 2084} {"train_loss": -12.491260528564453, "global_step": 350257, "epoch": 2084} {"train_loss": -12.020458221435547, "global_step": 350258, "epoch": 2084} {"train_loss": -12.146574020385742, "global_step": 350259, "epoch": 2084} {"train_loss": -12.357177734375, "global_step": 350260, "epoch": 2084} {"train_loss": -12.336362838745117, "global_step": 350261, "epoch": 2084} {"train_loss": -12.30985164642334, "global_step": 350262, "epoch": 2084} {"train_loss": -12.019323348999023, "global_step": 350263, "epoch": 2084} {"train_loss": -12.343026161193848, "global_step": 350264, "epoch": 2084} {"train_loss": -12.031671524047852, "global_step": 350265, "epoch": 2084} {"train_loss": -12.238080978393555, "global_step": 350266, "epoch": 2084} {"train_loss": -12.265018463134766, "global_step": 350267, "epoch": 2084} {"train_loss": -12.26189136505127, "global_step": 350268, "epoch": 2084} {"train_loss": -12.132452011108398, "global_step": 350269, "epoch": 2084} {"train_loss": -11.975435256958008, "global_step": 350270, "epoch": 2084} {"train_loss": -12.40955924987793, "global_step": 350271, "epoch": 2084} {"train_loss": -12.0675048828125, "global_step": 350272, "epoch": 2084} {"train_loss": -11.48837661743164, "global_step": 350273, "epoch": 2084} {"train_loss": -11.744776725769043, "global_step": 350274, "epoch": 2084} {"train_loss": -12.012686729431152, "global_step": 350275, "epoch": 2084} {"train_loss": -11.843562126159668, "global_step": 350276, "epoch": 2084} {"train_loss": -12.255582809448242, "global_step": 350277, "epoch": 2084} {"train_loss": -11.601637840270996, "global_step": 350278, "epoch": 2084} {"train_loss": -11.543471188772292, "global_step": 350279, "epoch": 2084, "val_loss": 287247.15625} {"train_loss": -11.453996658325195, "global_step": 350280, "epoch": 2085} {"train_loss": -12.432933807373047, "global_step": 350281, "epoch": 2085} {"train_loss": -11.655305862426758, "global_step": 350282, "epoch": 2085} {"train_loss": -12.145565032958984, "global_step": 350283, "epoch": 2085} {"train_loss": -11.931807518005371, "global_step": 350284, "epoch": 2085} {"train_loss": -12.008854866027832, "global_step": 350285, "epoch": 2085} {"train_loss": -12.301279067993164, "global_step": 350286, "epoch": 2085} {"train_loss": -11.885623931884766, "global_step": 350287, "epoch": 2085} {"train_loss": -12.177361488342285, "global_step": 350288, "epoch": 2085} {"train_loss": -12.359493255615234, "global_step": 350289, "epoch": 2085} {"train_loss": -12.360769271850586, "global_step": 350290, "epoch": 2085} {"train_loss": -12.35792064666748, "global_step": 350291, "epoch": 2085} {"train_loss": -12.400726318359375, "global_step": 350292, "epoch": 2085} {"train_loss": -12.308639526367188, "global_step": 350293, "epoch": 2085} {"train_loss": -12.124212265014648, "global_step": 350294, "epoch": 2085} {"train_loss": -12.503419876098633, "global_step": 350295, "epoch": 2085} {"train_loss": -12.369770050048828, "global_step": 350296, "epoch": 2085} {"train_loss": -12.523049354553223, "global_step": 350297, "epoch": 2085} {"train_loss": -12.46608829498291, "global_step": 350298, "epoch": 2085} {"train_loss": -12.332196235656738, "global_step": 350299, "epoch": 2085} {"train_loss": -12.601436614990234, "global_step": 350300, "epoch": 2085} {"train_loss": -12.210865020751953, "global_step": 350301, "epoch": 2085} {"train_loss": -12.117114067077637, "global_step": 350302, "epoch": 2085} {"train_loss": -12.172897338867188, "global_step": 350303, "epoch": 2085} {"train_loss": -12.048465728759766, "global_step": 350304, "epoch": 2085} {"train_loss": -12.240348815917969, "global_step": 350305, "epoch": 2085} {"train_loss": -11.624149322509766, "global_step": 350306, "epoch": 2085} {"train_loss": -11.946829795837402, "global_step": 350307, "epoch": 2085} {"train_loss": -12.257896423339844, "global_step": 350308, "epoch": 2085} {"train_loss": -11.76921272277832, "global_step": 350309, "epoch": 2085} {"train_loss": -11.809674263000488, "global_step": 350310, "epoch": 2085} {"train_loss": -12.24095344543457, "global_step": 350311, "epoch": 2085} {"train_loss": -11.366758346557617, "global_step": 350312, "epoch": 2085} {"train_loss": -12.15970230102539, "global_step": 350313, "epoch": 2085} {"train_loss": -11.419058799743652, "global_step": 350314, "epoch": 2085} {"train_loss": -12.071584701538086, "global_step": 350315, "epoch": 2085} {"train_loss": -11.201851844787598, "global_step": 350316, "epoch": 2085} {"train_loss": -10.595890045166016, "global_step": 350317, "epoch": 2085} {"train_loss": -11.480388641357422, "global_step": 350318, "epoch": 2085} {"train_loss": -11.430337905883789, "global_step": 350319, "epoch": 2085} {"train_loss": -10.735227584838867, "global_step": 350320, "epoch": 2085} {"train_loss": -11.683008193969727, "global_step": 350321, "epoch": 2085} {"train_loss": -11.118587493896484, "global_step": 350322, "epoch": 2085} {"train_loss": -10.496415138244629, "global_step": 350323, "epoch": 2085} {"train_loss": -11.869098663330078, "global_step": 350324, "epoch": 2085} {"train_loss": -10.728240966796875, "global_step": 350325, "epoch": 2085} {"train_loss": -11.394172668457031, "global_step": 350326, "epoch": 2085} {"train_loss": -11.582756042480469, "global_step": 350327, "epoch": 2085} {"train_loss": -11.657177925109863, "global_step": 350328, "epoch": 2085} {"train_loss": -11.576190948486328, "global_step": 350329, "epoch": 2085} {"train_loss": -11.580008506774902, "global_step": 350330, "epoch": 2085} {"train_loss": -11.164714813232422, "global_step": 350331, "epoch": 2085} {"train_loss": -11.675854682922363, "global_step": 350332, "epoch": 2085} {"train_loss": -10.622947692871094, "global_step": 350333, "epoch": 2085} {"train_loss": -11.781437873840332, "global_step": 350334, "epoch": 2085} {"train_loss": -10.831628799438477, "global_step": 350335, "epoch": 2085} {"train_loss": -11.142678260803223, "global_step": 350336, "epoch": 2085} {"train_loss": -11.582825660705566, "global_step": 350337, "epoch": 2085} {"train_loss": -10.452934265136719, "global_step": 350338, "epoch": 2085} {"train_loss": -11.043537139892578, "global_step": 350339, "epoch": 2085} {"train_loss": -9.478805541992188, "global_step": 350340, "epoch": 2085} {"train_loss": -11.189664840698242, "global_step": 350341, "epoch": 2085} {"train_loss": -9.63504409790039, "global_step": 350342, "epoch": 2085} {"train_loss": -11.510497093200684, "global_step": 350343, "epoch": 2085} {"train_loss": -10.50733757019043, "global_step": 350344, "epoch": 2085} {"train_loss": -10.99594497680664, "global_step": 350345, "epoch": 2085} {"train_loss": -11.12091064453125, "global_step": 350346, "epoch": 2085} {"train_loss": -11.250905990600586, "global_step": 350347, "epoch": 2085} {"train_loss": -11.492395401000977, "global_step": 350348, "epoch": 2085} {"train_loss": -11.384384155273438, "global_step": 350349, "epoch": 2085} {"train_loss": -11.565781593322754, "global_step": 350350, "epoch": 2085} {"train_loss": -11.764101028442383, "global_step": 350351, "epoch": 2085} {"train_loss": -11.916940689086914, "global_step": 350352, "epoch": 2085} {"train_loss": -11.964354515075684, "global_step": 350353, "epoch": 2085} {"train_loss": -12.207389831542969, "global_step": 350354, "epoch": 2085} {"train_loss": -12.196752548217773, "global_step": 350355, "epoch": 2085} {"train_loss": -11.985610961914062, "global_step": 350356, "epoch": 2085} {"train_loss": -12.272418022155762, "global_step": 350357, "epoch": 2085} {"train_loss": -11.673020362854004, "global_step": 350358, "epoch": 2085} {"train_loss": -12.081172943115234, "global_step": 350359, "epoch": 2085} {"train_loss": -11.96967887878418, "global_step": 350360, "epoch": 2085} {"train_loss": -11.544355392456055, "global_step": 350361, "epoch": 2085} {"train_loss": -12.106431007385254, "global_step": 350362, "epoch": 2085} {"train_loss": -12.033506393432617, "global_step": 350363, "epoch": 2085} {"train_loss": -12.02511978149414, "global_step": 350364, "epoch": 2085} {"train_loss": -12.158197402954102, "global_step": 350365, "epoch": 2085} {"train_loss": -11.967106819152832, "global_step": 350366, "epoch": 2085} {"train_loss": -12.344099998474121, "global_step": 350367, "epoch": 2085} {"train_loss": -12.203292846679688, "global_step": 350368, "epoch": 2085} {"train_loss": -12.13389778137207, "global_step": 350369, "epoch": 2085} {"train_loss": -12.437858581542969, "global_step": 350370, "epoch": 2085} {"train_loss": -12.182284355163574, "global_step": 350371, "epoch": 2085} {"train_loss": -12.341621398925781, "global_step": 350372, "epoch": 2085} {"train_loss": -12.410989761352539, "global_step": 350373, "epoch": 2085} {"train_loss": -12.56965160369873, "global_step": 350374, "epoch": 2085} {"train_loss": -12.459543228149414, "global_step": 350375, "epoch": 2085} {"train_loss": -12.22480583190918, "global_step": 350376, "epoch": 2085} {"train_loss": -12.60859489440918, "global_step": 350377, "epoch": 2085} {"train_loss": -12.44497299194336, "global_step": 350378, "epoch": 2085} {"train_loss": -12.476882934570312, "global_step": 350379, "epoch": 2085} {"train_loss": -12.634136199951172, "global_step": 350380, "epoch": 2085} {"train_loss": -12.403331756591797, "global_step": 350381, "epoch": 2085} {"train_loss": -12.361778259277344, "global_step": 350382, "epoch": 2085} {"train_loss": -12.538307189941406, "global_step": 350383, "epoch": 2085} {"train_loss": -12.457086563110352, "global_step": 350384, "epoch": 2085} {"train_loss": -12.39236068725586, "global_step": 350385, "epoch": 2085} {"train_loss": -12.547175407409668, "global_step": 350386, "epoch": 2085} {"train_loss": -12.402399063110352, "global_step": 350387, "epoch": 2085} {"train_loss": -12.497621536254883, "global_step": 350388, "epoch": 2085} {"train_loss": -12.591955184936523, "global_step": 350389, "epoch": 2085} {"train_loss": -12.469985008239746, "global_step": 350390, "epoch": 2085} {"train_loss": -12.40449333190918, "global_step": 350391, "epoch": 2085} {"train_loss": -12.403987884521484, "global_step": 350392, "epoch": 2085} {"train_loss": -12.670145988464355, "global_step": 350393, "epoch": 2085} {"train_loss": -12.590045928955078, "global_step": 350394, "epoch": 2085} {"train_loss": -12.61421012878418, "global_step": 350395, "epoch": 2085} {"train_loss": -12.654830932617188, "global_step": 350396, "epoch": 2085} {"train_loss": -12.481149673461914, "global_step": 350397, "epoch": 2085} {"train_loss": -12.660377502441406, "global_step": 350398, "epoch": 2085} {"train_loss": -12.55184555053711, "global_step": 350399, "epoch": 2085} {"train_loss": -12.383489608764648, "global_step": 350400, "epoch": 2085} {"train_loss": -12.333577156066895, "global_step": 350401, "epoch": 2085} {"train_loss": -12.514060974121094, "global_step": 350402, "epoch": 2085} {"train_loss": -12.458611488342285, "global_step": 350403, "epoch": 2085} {"train_loss": -12.559093475341797, "global_step": 350404, "epoch": 2085} {"train_loss": -12.509248733520508, "global_step": 350405, "epoch": 2085} {"train_loss": -12.395669937133789, "global_step": 350406, "epoch": 2085} {"train_loss": -12.173181533813477, "global_step": 350407, "epoch": 2085} {"train_loss": -12.331663131713867, "global_step": 350408, "epoch": 2085} {"train_loss": -11.764266967773438, "global_step": 350409, "epoch": 2085} {"train_loss": -11.4874267578125, "global_step": 350410, "epoch": 2085} {"train_loss": -11.806642532348633, "global_step": 350411, "epoch": 2085} {"train_loss": -11.366655349731445, "global_step": 350412, "epoch": 2085} {"train_loss": -11.198075294494629, "global_step": 350413, "epoch": 2085} {"train_loss": -12.0306396484375, "global_step": 350414, "epoch": 2085} {"train_loss": -10.907333374023438, "global_step": 350415, "epoch": 2085} {"train_loss": -10.90880012512207, "global_step": 350416, "epoch": 2085} {"train_loss": -12.005260467529297, "global_step": 350417, "epoch": 2085} {"train_loss": -11.513333320617676, "global_step": 350418, "epoch": 2085} {"train_loss": -11.462172508239746, "global_step": 350419, "epoch": 2085} {"train_loss": -11.694700241088867, "global_step": 350420, "epoch": 2085} {"train_loss": -11.878538131713867, "global_step": 350421, "epoch": 2085} {"train_loss": -11.34309196472168, "global_step": 350422, "epoch": 2085} {"train_loss": -11.922128677368164, "global_step": 350423, "epoch": 2085} {"train_loss": -11.16916275024414, "global_step": 350424, "epoch": 2085} {"train_loss": -11.95496940612793, "global_step": 350425, "epoch": 2085} {"train_loss": -11.367166519165039, "global_step": 350426, "epoch": 2085} {"train_loss": -11.455219268798828, "global_step": 350427, "epoch": 2085} {"train_loss": -11.666507720947266, "global_step": 350428, "epoch": 2085} {"train_loss": -10.558708190917969, "global_step": 350429, "epoch": 2085} {"train_loss": -11.86482048034668, "global_step": 350430, "epoch": 2085} {"train_loss": -11.10365104675293, "global_step": 350431, "epoch": 2085} {"train_loss": -11.673569679260254, "global_step": 350432, "epoch": 2085} {"train_loss": -11.414464950561523, "global_step": 350433, "epoch": 2085} {"train_loss": -11.706790924072266, "global_step": 350434, "epoch": 2085} {"train_loss": -12.110069274902344, "global_step": 350435, "epoch": 2085} {"train_loss": -11.872098922729492, "global_step": 350436, "epoch": 2085} {"train_loss": -12.155238151550293, "global_step": 350437, "epoch": 2085} {"train_loss": -11.984743118286133, "global_step": 350438, "epoch": 2085} {"train_loss": -12.003061294555664, "global_step": 350439, "epoch": 2085} {"train_loss": -11.636005401611328, "global_step": 350440, "epoch": 2085} {"train_loss": -11.87796401977539, "global_step": 350441, "epoch": 2085} {"train_loss": -11.839156150817871, "global_step": 350442, "epoch": 2085} {"train_loss": -12.00502872467041, "global_step": 350443, "epoch": 2085} {"train_loss": -11.914695739746094, "global_step": 350444, "epoch": 2085} {"train_loss": -11.52105712890625, "global_step": 350445, "epoch": 2085} {"train_loss": -11.35929012298584, "global_step": 350446, "epoch": 2085} {"train_loss": -11.866252626691546, "global_step": 350447, "epoch": 2085, "val_loss": 290883.40625, "train_action_mse_error": 0.4977353811264038} {"train_loss": -12.068611145019531, "global_step": 350448, "epoch": 2086} {"train_loss": -11.927061080932617, "global_step": 350449, "epoch": 2086} {"train_loss": -11.734474182128906, "global_step": 350450, "epoch": 2086} {"train_loss": -11.79365062713623, "global_step": 350451, "epoch": 2086} {"train_loss": -11.969078063964844, "global_step": 350452, "epoch": 2086} {"train_loss": -12.214466094970703, "global_step": 350453, "epoch": 2086} {"train_loss": -11.774761199951172, "global_step": 350454, "epoch": 2086} {"train_loss": -11.196001052856445, "global_step": 350455, "epoch": 2086} {"train_loss": -11.642373085021973, "global_step": 350456, "epoch": 2086} {"train_loss": -12.001136779785156, "global_step": 350457, "epoch": 2086} {"train_loss": -11.50275707244873, "global_step": 350458, "epoch": 2086} {"train_loss": -12.001642227172852, "global_step": 350459, "epoch": 2086} {"train_loss": -12.077098846435547, "global_step": 350460, "epoch": 2086} {"train_loss": -11.913630485534668, "global_step": 350461, "epoch": 2086} {"train_loss": -12.20669937133789, "global_step": 350462, "epoch": 2086} {"train_loss": -11.845483779907227, "global_step": 350463, "epoch": 2086} {"train_loss": -12.117393493652344, "global_step": 350464, "epoch": 2086} {"train_loss": -11.957206726074219, "global_step": 350465, "epoch": 2086} {"train_loss": -11.872920989990234, "global_step": 350466, "epoch": 2086} {"train_loss": -12.151952743530273, "global_step": 350467, "epoch": 2086} {"train_loss": -11.783122062683105, "global_step": 350468, "epoch": 2086} {"train_loss": -12.315780639648438, "global_step": 350469, "epoch": 2086} {"train_loss": -11.784980773925781, "global_step": 350470, "epoch": 2086} {"train_loss": -12.198185920715332, "global_step": 350471, "epoch": 2086} {"train_loss": -11.977775573730469, "global_step": 350472, "epoch": 2086} {"train_loss": -12.027701377868652, "global_step": 350473, "epoch": 2086} {"train_loss": -11.922660827636719, "global_step": 350474, "epoch": 2086} {"train_loss": -12.244730949401855, "global_step": 350475, "epoch": 2086} {"train_loss": -12.252921104431152, "global_step": 350476, "epoch": 2086} {"train_loss": -12.053982734680176, "global_step": 350477, "epoch": 2086} {"train_loss": -12.33839225769043, "global_step": 350478, "epoch": 2086} {"train_loss": -12.109228134155273, "global_step": 350479, "epoch": 2086} {"train_loss": -12.283291816711426, "global_step": 350480, "epoch": 2086} {"train_loss": -12.240835189819336, "global_step": 350481, "epoch": 2086} {"train_loss": -12.028827667236328, "global_step": 350482, "epoch": 2086} {"train_loss": -12.589117050170898, "global_step": 350483, "epoch": 2086} {"train_loss": -12.196393013000488, "global_step": 350484, "epoch": 2086} {"train_loss": -12.451803207397461, "global_step": 350485, "epoch": 2086} {"train_loss": -12.188512802124023, "global_step": 350486, "epoch": 2086} {"train_loss": -12.34782600402832, "global_step": 350487, "epoch": 2086} {"train_loss": -12.048637390136719, "global_step": 350488, "epoch": 2086} {"train_loss": -11.643796920776367, "global_step": 350489, "epoch": 2086} {"train_loss": -12.398159980773926, "global_step": 350490, "epoch": 2086} {"train_loss": -12.244531631469727, "global_step": 350491, "epoch": 2086} {"train_loss": -12.012357711791992, "global_step": 350492, "epoch": 2086} {"train_loss": -12.278848648071289, "global_step": 350493, "epoch": 2086} {"train_loss": -12.134614944458008, "global_step": 350494, "epoch": 2086} {"train_loss": -12.489965438842773, "global_step": 350495, "epoch": 2086} {"train_loss": -12.066088676452637, "global_step": 350496, "epoch": 2086} {"train_loss": -12.031471252441406, "global_step": 350497, "epoch": 2086} {"train_loss": -12.165111541748047, "global_step": 350498, "epoch": 2086} {"train_loss": -12.016061782836914, "global_step": 350499, "epoch": 2086} {"train_loss": -12.396294593811035, "global_step": 350500, "epoch": 2086} {"train_loss": -12.168075561523438, "global_step": 350501, "epoch": 2086} {"train_loss": -12.151505470275879, "global_step": 350502, "epoch": 2086} {"train_loss": -12.052780151367188, "global_step": 350503, "epoch": 2086} {"train_loss": -12.258955955505371, "global_step": 350504, "epoch": 2086} {"train_loss": -12.095175743103027, "global_step": 350505, "epoch": 2086} {"train_loss": -12.280532836914062, "global_step": 350506, "epoch": 2086} {"train_loss": -12.147897720336914, "global_step": 350507, "epoch": 2086} {"train_loss": -11.982623100280762, "global_step": 350508, "epoch": 2086} {"train_loss": -12.330427169799805, "global_step": 350509, "epoch": 2086} {"train_loss": -12.099519729614258, "global_step": 350510, "epoch": 2086} {"train_loss": -12.322751998901367, "global_step": 350511, "epoch": 2086} {"train_loss": -11.599370956420898, "global_step": 350512, "epoch": 2086} {"train_loss": -11.48993968963623, "global_step": 350513, "epoch": 2086} {"train_loss": -11.226310729980469, "global_step": 350514, "epoch": 2086} {"train_loss": -11.690606117248535, "global_step": 350515, "epoch": 2086} {"train_loss": -11.041402816772461, "global_step": 350516, "epoch": 2086} {"train_loss": -11.000993728637695, "global_step": 350517, "epoch": 2086} {"train_loss": -11.897332191467285, "global_step": 350518, "epoch": 2086} {"train_loss": -11.372339248657227, "global_step": 350519, "epoch": 2086} {"train_loss": -11.841041564941406, "global_step": 350520, "epoch": 2086} {"train_loss": -11.532279014587402, "global_step": 350521, "epoch": 2086} {"train_loss": -12.168231964111328, "global_step": 350522, "epoch": 2086} {"train_loss": -11.239418029785156, "global_step": 350523, "epoch": 2086} {"train_loss": -12.144820213317871, "global_step": 350524, "epoch": 2086} {"train_loss": -11.383540153503418, "global_step": 350525, "epoch": 2086} {"train_loss": -10.986028671264648, "global_step": 350526, "epoch": 2086} {"train_loss": -11.935078620910645, "global_step": 350527, "epoch": 2086} {"train_loss": -11.393661499023438, "global_step": 350528, "epoch": 2086} {"train_loss": -11.390264511108398, "global_step": 350529, "epoch": 2086} {"train_loss": -11.982187271118164, "global_step": 350530, "epoch": 2086} {"train_loss": -11.399894714355469, "global_step": 350531, "epoch": 2086} {"train_loss": -11.788718223571777, "global_step": 350532, "epoch": 2086} {"train_loss": -11.578229904174805, "global_step": 350533, "epoch": 2086} {"train_loss": -12.088592529296875, "global_step": 350534, "epoch": 2086} {"train_loss": -11.367528915405273, "global_step": 350535, "epoch": 2086} {"train_loss": -11.79806900024414, "global_step": 350536, "epoch": 2086} {"train_loss": -11.709569931030273, "global_step": 350537, "epoch": 2086} {"train_loss": -11.792946815490723, "global_step": 350538, "epoch": 2086} {"train_loss": -11.657526016235352, "global_step": 350539, "epoch": 2086} {"train_loss": -11.672334671020508, "global_step": 350540, "epoch": 2086} {"train_loss": -12.178815841674805, "global_step": 350541, "epoch": 2086} {"train_loss": -11.857240676879883, "global_step": 350542, "epoch": 2086} {"train_loss": -12.090774536132812, "global_step": 350543, "epoch": 2086} {"train_loss": -12.374217987060547, "global_step": 350544, "epoch": 2086} {"train_loss": -12.027120590209961, "global_step": 350545, "epoch": 2086} {"train_loss": -12.16781234741211, "global_step": 350546, "epoch": 2086} {"train_loss": -11.941085815429688, "global_step": 350547, "epoch": 2086} {"train_loss": -12.398359298706055, "global_step": 350548, "epoch": 2086} {"train_loss": -12.328825950622559, "global_step": 350549, "epoch": 2086} {"train_loss": -12.127153396606445, "global_step": 350550, "epoch": 2086} {"train_loss": -11.983318328857422, "global_step": 350551, "epoch": 2086} {"train_loss": -12.546942710876465, "global_step": 350552, "epoch": 2086} {"train_loss": -12.41102409362793, "global_step": 350553, "epoch": 2086} {"train_loss": -12.045183181762695, "global_step": 350554, "epoch": 2086} {"train_loss": -12.464704513549805, "global_step": 350555, "epoch": 2086} {"train_loss": -12.231273651123047, "global_step": 350556, "epoch": 2086} {"train_loss": -12.230592727661133, "global_step": 350557, "epoch": 2086} {"train_loss": -12.251291275024414, "global_step": 350558, "epoch": 2086} {"train_loss": -11.87208366394043, "global_step": 350559, "epoch": 2086} {"train_loss": -12.019776344299316, "global_step": 350560, "epoch": 2086} {"train_loss": -12.23213005065918, "global_step": 350561, "epoch": 2086} {"train_loss": -12.03172492980957, "global_step": 350562, "epoch": 2086} {"train_loss": -12.07615852355957, "global_step": 350563, "epoch": 2086} {"train_loss": -12.41462516784668, "global_step": 350564, "epoch": 2086} {"train_loss": -11.895013809204102, "global_step": 350565, "epoch": 2086} {"train_loss": -12.082038879394531, "global_step": 350566, "epoch": 2086} {"train_loss": -12.079421997070312, "global_step": 350567, "epoch": 2086} {"train_loss": -11.938814163208008, "global_step": 350568, "epoch": 2086} {"train_loss": -12.073980331420898, "global_step": 350569, "epoch": 2086} {"train_loss": -11.769826889038086, "global_step": 350570, "epoch": 2086} {"train_loss": -12.047684669494629, "global_step": 350571, "epoch": 2086} {"train_loss": -12.214649200439453, "global_step": 350572, "epoch": 2086} {"train_loss": -12.1182279586792, "global_step": 350573, "epoch": 2086} {"train_loss": -12.455814361572266, "global_step": 350574, "epoch": 2086} {"train_loss": -12.193284034729004, "global_step": 350575, "epoch": 2086} {"train_loss": -12.317357063293457, "global_step": 350576, "epoch": 2086} {"train_loss": -11.879308700561523, "global_step": 350577, "epoch": 2086} {"train_loss": -12.022592544555664, "global_step": 350578, "epoch": 2086} {"train_loss": -12.127119064331055, "global_step": 350579, "epoch": 2086} {"train_loss": -12.214561462402344, "global_step": 350580, "epoch": 2086} {"train_loss": -12.29417896270752, "global_step": 350581, "epoch": 2086} {"train_loss": -12.215095520019531, "global_step": 350582, "epoch": 2086} {"train_loss": -12.110843658447266, "global_step": 350583, "epoch": 2086} {"train_loss": -12.490116119384766, "global_step": 350584, "epoch": 2086} {"train_loss": -12.042573928833008, "global_step": 350585, "epoch": 2086} {"train_loss": -12.013211250305176, "global_step": 350586, "epoch": 2086} {"train_loss": -12.192827224731445, "global_step": 350587, "epoch": 2086} {"train_loss": -12.038143157958984, "global_step": 350588, "epoch": 2086} {"train_loss": -12.24640941619873, "global_step": 350589, "epoch": 2086} {"train_loss": -12.25682544708252, "global_step": 350590, "epoch": 2086} {"train_loss": -12.048199653625488, "global_step": 350591, "epoch": 2086} {"train_loss": -12.333341598510742, "global_step": 350592, "epoch": 2086} {"train_loss": -11.979555130004883, "global_step": 350593, "epoch": 2086} {"train_loss": -12.427823066711426, "global_step": 350594, "epoch": 2086} {"train_loss": -12.09177017211914, "global_step": 350595, "epoch": 2086} {"train_loss": -12.29012393951416, "global_step": 350596, "epoch": 2086} {"train_loss": -12.062329292297363, "global_step": 350597, "epoch": 2086} {"train_loss": -12.488012313842773, "global_step": 350598, "epoch": 2086} {"train_loss": -12.511693000793457, "global_step": 350599, "epoch": 2086} {"train_loss": -12.495033264160156, "global_step": 350600, "epoch": 2086} {"train_loss": -12.423297882080078, "global_step": 350601, "epoch": 2086} {"train_loss": -12.519607543945312, "global_step": 350602, "epoch": 2086} {"train_loss": -12.368904113769531, "global_step": 350603, "epoch": 2086} {"train_loss": -12.566944122314453, "global_step": 350604, "epoch": 2086} {"train_loss": -12.210857391357422, "global_step": 350605, "epoch": 2086} {"train_loss": -12.130193710327148, "global_step": 350606, "epoch": 2086} {"train_loss": -12.538595199584961, "global_step": 350607, "epoch": 2086} {"train_loss": -12.386679649353027, "global_step": 350608, "epoch": 2086} {"train_loss": -12.253005981445312, "global_step": 350609, "epoch": 2086} {"train_loss": -12.409568786621094, "global_step": 350610, "epoch": 2086} {"train_loss": -12.509319305419922, "global_step": 350611, "epoch": 2086} {"train_loss": -12.254201889038086, "global_step": 350612, "epoch": 2086} {"train_loss": -12.30094051361084, "global_step": 350613, "epoch": 2086} {"train_loss": -12.45052719116211, "global_step": 350614, "epoch": 2086} {"train_loss": -12.053037382307506, "global_step": 350615, "epoch": 2086, "val_loss": 292149.84375} {"train_loss": -12.125211715698242, "global_step": 350616, "epoch": 2087} {"train_loss": -12.482229232788086, "global_step": 350617, "epoch": 2087} {"train_loss": -12.594683647155762, "global_step": 350618, "epoch": 2087} {"train_loss": -12.281401634216309, "global_step": 350619, "epoch": 2087} {"train_loss": -12.435723304748535, "global_step": 350620, "epoch": 2087} {"train_loss": -12.140189170837402, "global_step": 350621, "epoch": 2087} {"train_loss": -12.401994705200195, "global_step": 350622, "epoch": 2087} {"train_loss": -12.334331512451172, "global_step": 350623, "epoch": 2087} {"train_loss": -11.956315040588379, "global_step": 350624, "epoch": 2087} {"train_loss": -11.882402420043945, "global_step": 350625, "epoch": 2087} {"train_loss": -11.968144416809082, "global_step": 350626, "epoch": 2087} {"train_loss": -12.291932106018066, "global_step": 350627, "epoch": 2087} {"train_loss": -12.098627090454102, "global_step": 350628, "epoch": 2087} {"train_loss": -12.129594802856445, "global_step": 350629, "epoch": 2087} {"train_loss": -11.973832130432129, "global_step": 350630, "epoch": 2087} {"train_loss": -12.273615837097168, "global_step": 350631, "epoch": 2087} {"train_loss": -12.559301376342773, "global_step": 350632, "epoch": 2087} {"train_loss": -11.874427795410156, "global_step": 350633, "epoch": 2087} {"train_loss": -12.055676460266113, "global_step": 350634, "epoch": 2087} {"train_loss": -12.045050621032715, "global_step": 350635, "epoch": 2087} {"train_loss": -12.497392654418945, "global_step": 350636, "epoch": 2087} {"train_loss": -12.45367431640625, "global_step": 350637, "epoch": 2087} {"train_loss": -12.280858993530273, "global_step": 350638, "epoch": 2087} {"train_loss": -12.360109329223633, "global_step": 350639, "epoch": 2087} {"train_loss": -12.036896705627441, "global_step": 350640, "epoch": 2087} {"train_loss": -12.363262176513672, "global_step": 350641, "epoch": 2087} {"train_loss": -12.301183700561523, "global_step": 350642, "epoch": 2087} {"train_loss": -12.218364715576172, "global_step": 350643, "epoch": 2087} {"train_loss": -12.036429405212402, "global_step": 350644, "epoch": 2087} {"train_loss": -11.952583312988281, "global_step": 350645, "epoch": 2087} {"train_loss": -11.739068031311035, "global_step": 350646, "epoch": 2087} {"train_loss": -12.05302619934082, "global_step": 350647, "epoch": 2087} {"train_loss": -11.650432586669922, "global_step": 350648, "epoch": 2087} {"train_loss": -11.426443099975586, "global_step": 350649, "epoch": 2087} {"train_loss": -11.076030731201172, "global_step": 350650, "epoch": 2087} {"train_loss": -12.199190139770508, "global_step": 350651, "epoch": 2087} {"train_loss": -11.759125709533691, "global_step": 350652, "epoch": 2087} {"train_loss": -11.853036880493164, "global_step": 350653, "epoch": 2087} {"train_loss": -10.885200500488281, "global_step": 350654, "epoch": 2087} {"train_loss": -12.008773803710938, "global_step": 350655, "epoch": 2087} {"train_loss": -11.262340545654297, "global_step": 350656, "epoch": 2087} {"train_loss": -12.181550025939941, "global_step": 350657, "epoch": 2087} {"train_loss": -11.622577667236328, "global_step": 350658, "epoch": 2087} {"train_loss": -11.396636962890625, "global_step": 350659, "epoch": 2087} {"train_loss": -11.38775634765625, "global_step": 350660, "epoch": 2087} {"train_loss": -11.938961029052734, "global_step": 350661, "epoch": 2087} {"train_loss": -11.591475486755371, "global_step": 350662, "epoch": 2087} {"train_loss": -12.132695198059082, "global_step": 350663, "epoch": 2087} {"train_loss": -11.276212692260742, "global_step": 350664, "epoch": 2087} {"train_loss": -11.230558395385742, "global_step": 350665, "epoch": 2087} {"train_loss": -11.853522300720215, "global_step": 350666, "epoch": 2087} {"train_loss": -11.744686126708984, "global_step": 350667, "epoch": 2087} {"train_loss": -11.700777053833008, "global_step": 350668, "epoch": 2087} {"train_loss": -11.26982307434082, "global_step": 350669, "epoch": 2087} {"train_loss": -11.943967819213867, "global_step": 350670, "epoch": 2087} {"train_loss": -12.116714477539062, "global_step": 350671, "epoch": 2087} {"train_loss": -11.717453002929688, "global_step": 350672, "epoch": 2087} {"train_loss": -12.197526931762695, "global_step": 350673, "epoch": 2087} {"train_loss": -11.873432159423828, "global_step": 350674, "epoch": 2087} {"train_loss": -11.973114013671875, "global_step": 350675, "epoch": 2087} {"train_loss": -12.227815628051758, "global_step": 350676, "epoch": 2087} {"train_loss": -12.084909439086914, "global_step": 350677, "epoch": 2087} {"train_loss": -11.9779052734375, "global_step": 350678, "epoch": 2087} {"train_loss": -11.97789192199707, "global_step": 350679, "epoch": 2087} {"train_loss": -11.915227890014648, "global_step": 350680, "epoch": 2087} {"train_loss": -11.551445960998535, "global_step": 350681, "epoch": 2087} {"train_loss": -11.971307754516602, "global_step": 350682, "epoch": 2087} {"train_loss": -11.886659622192383, "global_step": 350683, "epoch": 2087} {"train_loss": -12.07260513305664, "global_step": 350684, "epoch": 2087} {"train_loss": -11.996630668640137, "global_step": 350685, "epoch": 2087} {"train_loss": -11.955549240112305, "global_step": 350686, "epoch": 2087} {"train_loss": -12.03924560546875, "global_step": 350687, "epoch": 2087} {"train_loss": -11.906112670898438, "global_step": 350688, "epoch": 2087} {"train_loss": -12.230962753295898, "global_step": 350689, "epoch": 2087} {"train_loss": -12.265862464904785, "global_step": 350690, "epoch": 2087} {"train_loss": -12.380388259887695, "global_step": 350691, "epoch": 2087} {"train_loss": -12.176036834716797, "global_step": 350692, "epoch": 2087} {"train_loss": -12.345966339111328, "global_step": 350693, "epoch": 2087} {"train_loss": -12.467855453491211, "global_step": 350694, "epoch": 2087} {"train_loss": -12.153169631958008, "global_step": 350695, "epoch": 2087} {"train_loss": -12.490407943725586, "global_step": 350696, "epoch": 2087} {"train_loss": -12.366266250610352, "global_step": 350697, "epoch": 2087} {"train_loss": -12.094066619873047, "global_step": 350698, "epoch": 2087} {"train_loss": -12.121509552001953, "global_step": 350699, "epoch": 2087} {"train_loss": -12.50399398803711, "global_step": 350700, "epoch": 2087} {"train_loss": -12.055185317993164, "global_step": 350701, "epoch": 2087} {"train_loss": -12.242012023925781, "global_step": 350702, "epoch": 2087} {"train_loss": -12.051946640014648, "global_step": 350703, "epoch": 2087} {"train_loss": -12.373144149780273, "global_step": 350704, "epoch": 2087} {"train_loss": -12.089792251586914, "global_step": 350705, "epoch": 2087} {"train_loss": -12.373069763183594, "global_step": 350706, "epoch": 2087} {"train_loss": -12.186910629272461, "global_step": 350707, "epoch": 2087} {"train_loss": -12.256917953491211, "global_step": 350708, "epoch": 2087} {"train_loss": -12.213181495666504, "global_step": 350709, "epoch": 2087} {"train_loss": -12.371809005737305, "global_step": 350710, "epoch": 2087} {"train_loss": -12.22366714477539, "global_step": 350711, "epoch": 2087} {"train_loss": -12.384509086608887, "global_step": 350712, "epoch": 2087} {"train_loss": -11.837316513061523, "global_step": 350713, "epoch": 2087} {"train_loss": -12.14973258972168, "global_step": 350714, "epoch": 2087} {"train_loss": -11.939582824707031, "global_step": 350715, "epoch": 2087} {"train_loss": -11.88760757446289, "global_step": 350716, "epoch": 2087} {"train_loss": -11.855331420898438, "global_step": 350717, "epoch": 2087} {"train_loss": -12.365424156188965, "global_step": 350718, "epoch": 2087} {"train_loss": -11.830118179321289, "global_step": 350719, "epoch": 2087} {"train_loss": -12.601962089538574, "global_step": 350720, "epoch": 2087} {"train_loss": -12.168517112731934, "global_step": 350721, "epoch": 2087} {"train_loss": -12.614922523498535, "global_step": 350722, "epoch": 2087} {"train_loss": -12.38766098022461, "global_step": 350723, "epoch": 2087} {"train_loss": -12.298739433288574, "global_step": 350724, "epoch": 2087} {"train_loss": -12.41475772857666, "global_step": 350725, "epoch": 2087} {"train_loss": -12.16637134552002, "global_step": 350726, "epoch": 2087} {"train_loss": -12.314780235290527, "global_step": 350727, "epoch": 2087} {"train_loss": -12.54525375366211, "global_step": 350728, "epoch": 2087} {"train_loss": -12.38461971282959, "global_step": 350729, "epoch": 2087} {"train_loss": -12.112582206726074, "global_step": 350730, "epoch": 2087} {"train_loss": -12.57899284362793, "global_step": 350731, "epoch": 2087} {"train_loss": -12.553997039794922, "global_step": 350732, "epoch": 2087} {"train_loss": -12.537708282470703, "global_step": 350733, "epoch": 2087} {"train_loss": -12.228586196899414, "global_step": 350734, "epoch": 2087} {"train_loss": -12.427909851074219, "global_step": 350735, "epoch": 2087} {"train_loss": -12.649444580078125, "global_step": 350736, "epoch": 2087} {"train_loss": -12.359718322753906, "global_step": 350737, "epoch": 2087} {"train_loss": -12.528331756591797, "global_step": 350738, "epoch": 2087} {"train_loss": -12.387685775756836, "global_step": 350739, "epoch": 2087} {"train_loss": -12.128095626831055, "global_step": 350740, "epoch": 2087} {"train_loss": -12.059600830078125, "global_step": 350741, "epoch": 2087} {"train_loss": -12.6788969039917, "global_step": 350742, "epoch": 2087} {"train_loss": -12.302177429199219, "global_step": 350743, "epoch": 2087} {"train_loss": -12.231332778930664, "global_step": 350744, "epoch": 2087} {"train_loss": -12.61785888671875, "global_step": 350745, "epoch": 2087} {"train_loss": -12.039510726928711, "global_step": 350746, "epoch": 2087} {"train_loss": -11.870786666870117, "global_step": 350747, "epoch": 2087} {"train_loss": -12.751119613647461, "global_step": 350748, "epoch": 2087} {"train_loss": -11.680769920349121, "global_step": 350749, "epoch": 2087} {"train_loss": -10.488543510437012, "global_step": 350750, "epoch": 2087} {"train_loss": -12.686929702758789, "global_step": 350751, "epoch": 2087} {"train_loss": -11.065634727478027, "global_step": 350752, "epoch": 2087} {"train_loss": -11.394845008850098, "global_step": 350753, "epoch": 2087} {"train_loss": -11.366146087646484, "global_step": 350754, "epoch": 2087} {"train_loss": -11.977304458618164, "global_step": 350755, "epoch": 2087} {"train_loss": -11.412872314453125, "global_step": 350756, "epoch": 2087} {"train_loss": -12.026277542114258, "global_step": 350757, "epoch": 2087} {"train_loss": -11.899162292480469, "global_step": 350758, "epoch": 2087} {"train_loss": -11.736587524414062, "global_step": 350759, "epoch": 2087} {"train_loss": -12.221661567687988, "global_step": 350760, "epoch": 2087} {"train_loss": -12.163447380065918, "global_step": 350761, "epoch": 2087} {"train_loss": -12.035502433776855, "global_step": 350762, "epoch": 2087} {"train_loss": -12.259626388549805, "global_step": 350763, "epoch": 2087} {"train_loss": -11.79364013671875, "global_step": 350764, "epoch": 2087} {"train_loss": -12.363759994506836, "global_step": 350765, "epoch": 2087} {"train_loss": -11.944377899169922, "global_step": 350766, "epoch": 2087} {"train_loss": -12.58659839630127, "global_step": 350767, "epoch": 2087} {"train_loss": -12.284180641174316, "global_step": 350768, "epoch": 2087} {"train_loss": -12.272510528564453, "global_step": 350769, "epoch": 2087} {"train_loss": -12.112394332885742, "global_step": 350770, "epoch": 2087} {"train_loss": -11.566211700439453, "global_step": 350771, "epoch": 2087} {"train_loss": -11.519116401672363, "global_step": 350772, "epoch": 2087} {"train_loss": -11.820890426635742, "global_step": 350773, "epoch": 2087} {"train_loss": -11.455516815185547, "global_step": 350774, "epoch": 2087} {"train_loss": -12.352174758911133, "global_step": 350775, "epoch": 2087} {"train_loss": -11.74362564086914, "global_step": 350776, "epoch": 2087} {"train_loss": -11.90914535522461, "global_step": 350777, "epoch": 2087} {"train_loss": -12.076622009277344, "global_step": 350778, "epoch": 2087} {"train_loss": -12.489337921142578, "global_step": 350779, "epoch": 2087} {"train_loss": -12.262871742248535, "global_step": 350780, "epoch": 2087} {"train_loss": -12.389496803283691, "global_step": 350781, "epoch": 2087} {"train_loss": -12.520349502563477, "global_step": 350782, "epoch": 2087} {"train_loss": -12.07550036907196, "global_step": 350783, "epoch": 2087, "val_loss": 292948.21875} {"train_loss": -12.184844017028809, "global_step": 350784, "epoch": 2088} {"train_loss": -12.281777381896973, "global_step": 350785, "epoch": 2088} {"train_loss": -12.229941368103027, "global_step": 350786, "epoch": 2088} {"train_loss": -11.589065551757812, "global_step": 350787, "epoch": 2088} {"train_loss": -12.375351905822754, "global_step": 350788, "epoch": 2088} {"train_loss": -12.020783424377441, "global_step": 350789, "epoch": 2088} {"train_loss": -11.808786392211914, "global_step": 350790, "epoch": 2088} {"train_loss": -12.329839706420898, "global_step": 350791, "epoch": 2088} {"train_loss": -12.415533065795898, "global_step": 350792, "epoch": 2088} {"train_loss": -12.068984985351562, "global_step": 350793, "epoch": 2088} {"train_loss": -12.513870239257812, "global_step": 350794, "epoch": 2088} {"train_loss": -12.041568756103516, "global_step": 350795, "epoch": 2088} {"train_loss": -12.103118896484375, "global_step": 350796, "epoch": 2088} {"train_loss": -12.247602462768555, "global_step": 350797, "epoch": 2088} {"train_loss": -11.349618911743164, "global_step": 350798, "epoch": 2088} {"train_loss": -12.008788108825684, "global_step": 350799, "epoch": 2088} {"train_loss": -11.380624771118164, "global_step": 350800, "epoch": 2088} {"train_loss": -12.289592742919922, "global_step": 350801, "epoch": 2088} {"train_loss": -12.072981834411621, "global_step": 350802, "epoch": 2088} {"train_loss": -10.977899551391602, "global_step": 350803, "epoch": 2088} {"train_loss": -10.97467041015625, "global_step": 350804, "epoch": 2088} {"train_loss": -12.045808792114258, "global_step": 350805, "epoch": 2088} {"train_loss": -11.150135040283203, "global_step": 350806, "epoch": 2088} {"train_loss": -11.19087028503418, "global_step": 350807, "epoch": 2088} {"train_loss": -11.785030364990234, "global_step": 350808, "epoch": 2088} {"train_loss": -10.57182502746582, "global_step": 350809, "epoch": 2088} {"train_loss": -9.616945266723633, "global_step": 350810, "epoch": 2088} {"train_loss": -10.94719123840332, "global_step": 350811, "epoch": 2088} {"train_loss": -8.409685134887695, "global_step": 350812, "epoch": 2088} {"train_loss": -9.84528923034668, "global_step": 350813, "epoch": 2088} {"train_loss": -8.762177467346191, "global_step": 350814, "epoch": 2088} {"train_loss": -10.566079139709473, "global_step": 350815, "epoch": 2088} {"train_loss": -8.467697143554688, "global_step": 350816, "epoch": 2088} {"train_loss": -8.824422836303711, "global_step": 350817, "epoch": 2088} {"train_loss": -8.67593765258789, "global_step": 350818, "epoch": 2088} {"train_loss": -9.989531517028809, "global_step": 350819, "epoch": 2088} {"train_loss": -10.255815505981445, "global_step": 350820, "epoch": 2088} {"train_loss": -9.446235656738281, "global_step": 350821, "epoch": 2088} {"train_loss": -10.544425964355469, "global_step": 350822, "epoch": 2088} {"train_loss": -10.978506088256836, "global_step": 350823, "epoch": 2088} {"train_loss": -10.519449234008789, "global_step": 350824, "epoch": 2088} {"train_loss": -11.146247863769531, "global_step": 350825, "epoch": 2088} {"train_loss": -10.137510299682617, "global_step": 350826, "epoch": 2088} {"train_loss": -10.559481620788574, "global_step": 350827, "epoch": 2088} {"train_loss": -10.269218444824219, "global_step": 350828, "epoch": 2088} {"train_loss": -11.333243370056152, "global_step": 350829, "epoch": 2088} {"train_loss": -10.646051406860352, "global_step": 350830, "epoch": 2088} {"train_loss": -10.981385231018066, "global_step": 350831, "epoch": 2088} {"train_loss": -10.104377746582031, "global_step": 350832, "epoch": 2088} {"train_loss": -11.062472343444824, "global_step": 350833, "epoch": 2088} {"train_loss": -10.374992370605469, "global_step": 350834, "epoch": 2088} {"train_loss": -11.421079635620117, "global_step": 350835, "epoch": 2088} {"train_loss": -11.28115463256836, "global_step": 350836, "epoch": 2088} {"train_loss": -11.474501609802246, "global_step": 350837, "epoch": 2088} {"train_loss": -10.161418914794922, "global_step": 350838, "epoch": 2088} {"train_loss": -11.047075271606445, "global_step": 350839, "epoch": 2088} {"train_loss": -9.966222763061523, "global_step": 350840, "epoch": 2088} {"train_loss": -11.462465286254883, "global_step": 350841, "epoch": 2088} {"train_loss": -10.922280311584473, "global_step": 350842, "epoch": 2088} {"train_loss": -11.254281997680664, "global_step": 350843, "epoch": 2088} {"train_loss": -10.307903289794922, "global_step": 350844, "epoch": 2088} {"train_loss": -11.16392707824707, "global_step": 350845, "epoch": 2088} {"train_loss": -11.343695640563965, "global_step": 350846, "epoch": 2088} {"train_loss": -11.317138671875, "global_step": 350847, "epoch": 2088} {"train_loss": -11.609329223632812, "global_step": 350848, "epoch": 2088} {"train_loss": -11.366218566894531, "global_step": 350849, "epoch": 2088} {"train_loss": -11.94392204284668, "global_step": 350850, "epoch": 2088} {"train_loss": -11.516265869140625, "global_step": 350851, "epoch": 2088} {"train_loss": -11.90004825592041, "global_step": 350852, "epoch": 2088} {"train_loss": -11.427735328674316, "global_step": 350853, "epoch": 2088} {"train_loss": -10.288965225219727, "global_step": 350854, "epoch": 2088} {"train_loss": -11.695657730102539, "global_step": 350855, "epoch": 2088} {"train_loss": -11.520027160644531, "global_step": 350856, "epoch": 2088} {"train_loss": -11.725717544555664, "global_step": 350857, "epoch": 2088} {"train_loss": -11.832294464111328, "global_step": 350858, "epoch": 2088} {"train_loss": -11.608671188354492, "global_step": 350859, "epoch": 2088} {"train_loss": -11.902873992919922, "global_step": 350860, "epoch": 2088} {"train_loss": -11.910564422607422, "global_step": 350861, "epoch": 2088} {"train_loss": -11.774179458618164, "global_step": 350862, "epoch": 2088} {"train_loss": -11.697944641113281, "global_step": 350863, "epoch": 2088} {"train_loss": -11.697443008422852, "global_step": 350864, "epoch": 2088} {"train_loss": -11.86164665222168, "global_step": 350865, "epoch": 2088} {"train_loss": -12.016244888305664, "global_step": 350866, "epoch": 2088} {"train_loss": -11.602179527282715, "global_step": 350867, "epoch": 2088} {"train_loss": -11.756401062011719, "global_step": 350868, "epoch": 2088} {"train_loss": -11.905715942382812, "global_step": 350869, "epoch": 2088} {"train_loss": -11.714126586914062, "global_step": 350870, "epoch": 2088} {"train_loss": -11.693305969238281, "global_step": 350871, "epoch": 2088} {"train_loss": -12.210458755493164, "global_step": 350872, "epoch": 2088} {"train_loss": -11.729496002197266, "global_step": 350873, "epoch": 2088} {"train_loss": -11.950235366821289, "global_step": 350874, "epoch": 2088} {"train_loss": -12.000411987304688, "global_step": 350875, "epoch": 2088} {"train_loss": -11.947099685668945, "global_step": 350876, "epoch": 2088} {"train_loss": -11.604110717773438, "global_step": 350877, "epoch": 2088} {"train_loss": -12.227283477783203, "global_step": 350878, "epoch": 2088} {"train_loss": -11.933791160583496, "global_step": 350879, "epoch": 2088} {"train_loss": -12.288104057312012, "global_step": 350880, "epoch": 2088} {"train_loss": -12.146966934204102, "global_step": 350881, "epoch": 2088} {"train_loss": -12.111468315124512, "global_step": 350882, "epoch": 2088} {"train_loss": -12.351581573486328, "global_step": 350883, "epoch": 2088} {"train_loss": -12.105151176452637, "global_step": 350884, "epoch": 2088} {"train_loss": -12.13119125366211, "global_step": 350885, "epoch": 2088} {"train_loss": -12.308547973632812, "global_step": 350886, "epoch": 2088} {"train_loss": -12.404570579528809, "global_step": 350887, "epoch": 2088} {"train_loss": -12.199069023132324, "global_step": 350888, "epoch": 2088} {"train_loss": -12.12419319152832, "global_step": 350889, "epoch": 2088} {"train_loss": -12.089092254638672, "global_step": 350890, "epoch": 2088} {"train_loss": -12.195245742797852, "global_step": 350891, "epoch": 2088} {"train_loss": -12.407878875732422, "global_step": 350892, "epoch": 2088} {"train_loss": -12.197014808654785, "global_step": 350893, "epoch": 2088} {"train_loss": -11.965457916259766, "global_step": 350894, "epoch": 2088} {"train_loss": -12.091617584228516, "global_step": 350895, "epoch": 2088} {"train_loss": -12.398332595825195, "global_step": 350896, "epoch": 2088} {"train_loss": -12.116925239562988, "global_step": 350897, "epoch": 2088} {"train_loss": -11.781837463378906, "global_step": 350898, "epoch": 2088} {"train_loss": -12.276430130004883, "global_step": 350899, "epoch": 2088} {"train_loss": -12.02876091003418, "global_step": 350900, "epoch": 2088} {"train_loss": -12.249701499938965, "global_step": 350901, "epoch": 2088} {"train_loss": -12.449502944946289, "global_step": 350902, "epoch": 2088} {"train_loss": -12.22038459777832, "global_step": 350903, "epoch": 2088} {"train_loss": -12.272777557373047, "global_step": 350904, "epoch": 2088} {"train_loss": -12.133899688720703, "global_step": 350905, "epoch": 2088} {"train_loss": -11.972442626953125, "global_step": 350906, "epoch": 2088} {"train_loss": -12.354506492614746, "global_step": 350907, "epoch": 2088} {"train_loss": -12.110977172851562, "global_step": 350908, "epoch": 2088} {"train_loss": -12.401464462280273, "global_step": 350909, "epoch": 2088} {"train_loss": -12.434070587158203, "global_step": 350910, "epoch": 2088} {"train_loss": -12.241082191467285, "global_step": 350911, "epoch": 2088} {"train_loss": -12.43535327911377, "global_step": 350912, "epoch": 2088} {"train_loss": -12.210329055786133, "global_step": 350913, "epoch": 2088} {"train_loss": -12.49632740020752, "global_step": 350914, "epoch": 2088} {"train_loss": -12.22546100616455, "global_step": 350915, "epoch": 2088} {"train_loss": -12.127594947814941, "global_step": 350916, "epoch": 2088} {"train_loss": -12.034472465515137, "global_step": 350917, "epoch": 2088} {"train_loss": -12.201346397399902, "global_step": 350918, "epoch": 2088} {"train_loss": -12.382962226867676, "global_step": 350919, "epoch": 2088} {"train_loss": -12.228736877441406, "global_step": 350920, "epoch": 2088} {"train_loss": -12.246530532836914, "global_step": 350921, "epoch": 2088} {"train_loss": -12.357992172241211, "global_step": 350922, "epoch": 2088} {"train_loss": -12.223189353942871, "global_step": 350923, "epoch": 2088} {"train_loss": -12.388859748840332, "global_step": 350924, "epoch": 2088} {"train_loss": -12.027957916259766, "global_step": 350925, "epoch": 2088} {"train_loss": -12.074275970458984, "global_step": 350926, "epoch": 2088} {"train_loss": -12.40765380859375, "global_step": 350927, "epoch": 2088} {"train_loss": -12.46316909790039, "global_step": 350928, "epoch": 2088} {"train_loss": -12.671392440795898, "global_step": 350929, "epoch": 2088} {"train_loss": -12.136049270629883, "global_step": 350930, "epoch": 2088} {"train_loss": -12.46733283996582, "global_step": 350931, "epoch": 2088} {"train_loss": -12.417560577392578, "global_step": 350932, "epoch": 2088} {"train_loss": -12.203310012817383, "global_step": 350933, "epoch": 2088} {"train_loss": -12.347224235534668, "global_step": 350934, "epoch": 2088} {"train_loss": -12.229013442993164, "global_step": 350935, "epoch": 2088} {"train_loss": -11.97081184387207, "global_step": 350936, "epoch": 2088} {"train_loss": -12.729697227478027, "global_step": 350937, "epoch": 2088} {"train_loss": -12.083141326904297, "global_step": 350938, "epoch": 2088} {"train_loss": -11.618427276611328, "global_step": 350939, "epoch": 2088} {"train_loss": -12.393502235412598, "global_step": 350940, "epoch": 2088} {"train_loss": -12.029487609863281, "global_step": 350941, "epoch": 2088} {"train_loss": -11.663976669311523, "global_step": 350942, "epoch": 2088} {"train_loss": -12.301057815551758, "global_step": 350943, "epoch": 2088} {"train_loss": -11.808631896972656, "global_step": 350944, "epoch": 2088} {"train_loss": -12.485987663269043, "global_step": 350945, "epoch": 2088} {"train_loss": -12.118576049804688, "global_step": 350946, "epoch": 2088} {"train_loss": -12.073121070861816, "global_step": 350947, "epoch": 2088} {"train_loss": -12.450279235839844, "global_step": 350948, "epoch": 2088} {"train_loss": -12.278356552124023, "global_step": 350949, "epoch": 2088} {"train_loss": -12.227455139160156, "global_step": 350950, "epoch": 2088} {"train_loss": -11.660238549822854, "global_step": 350951, "epoch": 2088, "val_loss": 293777.34375} {"train_loss": -12.013525009155273, "global_step": 350952, "epoch": 2089} {"train_loss": -12.174442291259766, "global_step": 350953, "epoch": 2089} {"train_loss": -11.526318550109863, "global_step": 350954, "epoch": 2089} {"train_loss": -11.532771110534668, "global_step": 350955, "epoch": 2089} {"train_loss": -11.273029327392578, "global_step": 350956, "epoch": 2089} {"train_loss": -11.824877738952637, "global_step": 350957, "epoch": 2089} {"train_loss": -11.73182487487793, "global_step": 350958, "epoch": 2089} {"train_loss": -9.80804443359375, "global_step": 350959, "epoch": 2089} {"train_loss": -11.529888153076172, "global_step": 350960, "epoch": 2089} {"train_loss": -9.681255340576172, "global_step": 350961, "epoch": 2089} {"train_loss": -10.520158767700195, "global_step": 350962, "epoch": 2089} {"train_loss": -10.68928337097168, "global_step": 350963, "epoch": 2089} {"train_loss": -10.12270736694336, "global_step": 350964, "epoch": 2089} {"train_loss": -10.375027656555176, "global_step": 350965, "epoch": 2089} {"train_loss": -11.68111801147461, "global_step": 350966, "epoch": 2089} {"train_loss": -10.977972030639648, "global_step": 350967, "epoch": 2089} {"train_loss": -11.465475082397461, "global_step": 350968, "epoch": 2089} {"train_loss": -11.699326515197754, "global_step": 350969, "epoch": 2089} {"train_loss": -10.975881576538086, "global_step": 350970, "epoch": 2089} {"train_loss": -11.996469497680664, "global_step": 350971, "epoch": 2089} {"train_loss": -11.023686408996582, "global_step": 350972, "epoch": 2089} {"train_loss": -11.9217529296875, "global_step": 350973, "epoch": 2089} {"train_loss": -11.435487747192383, "global_step": 350974, "epoch": 2089} {"train_loss": -11.63234806060791, "global_step": 350975, "epoch": 2089} {"train_loss": -11.64211368560791, "global_step": 350976, "epoch": 2089} {"train_loss": -11.794024467468262, "global_step": 350977, "epoch": 2089} {"train_loss": -11.984859466552734, "global_step": 350978, "epoch": 2089} {"train_loss": -11.38046646118164, "global_step": 350979, "epoch": 2089} {"train_loss": -11.836477279663086, "global_step": 350980, "epoch": 2089} {"train_loss": -11.500825881958008, "global_step": 350981, "epoch": 2089} {"train_loss": -12.006879806518555, "global_step": 350982, "epoch": 2089} {"train_loss": -11.460923194885254, "global_step": 350983, "epoch": 2089} {"train_loss": -12.053226470947266, "global_step": 350984, "epoch": 2089} {"train_loss": -11.438705444335938, "global_step": 350985, "epoch": 2089} {"train_loss": -12.369184494018555, "global_step": 350986, "epoch": 2089} {"train_loss": -11.690771102905273, "global_step": 350987, "epoch": 2089} {"train_loss": -11.833106994628906, "global_step": 350988, "epoch": 2089} {"train_loss": -11.907007217407227, "global_step": 350989, "epoch": 2089} {"train_loss": -11.945314407348633, "global_step": 350990, "epoch": 2089} {"train_loss": -11.094820976257324, "global_step": 350991, "epoch": 2089} {"train_loss": -11.764219284057617, "global_step": 350992, "epoch": 2089} {"train_loss": -11.638439178466797, "global_step": 350993, "epoch": 2089} {"train_loss": -11.804344177246094, "global_step": 350994, "epoch": 2089} {"train_loss": -12.219192504882812, "global_step": 350995, "epoch": 2089} {"train_loss": -11.767467498779297, "global_step": 350996, "epoch": 2089} {"train_loss": -12.09740161895752, "global_step": 350997, "epoch": 2089} {"train_loss": -11.845795631408691, "global_step": 350998, "epoch": 2089} {"train_loss": -12.064594268798828, "global_step": 350999, "epoch": 2089} {"train_loss": -12.077338218688965, "global_step": 351000, "epoch": 2089} {"train_loss": -11.895153045654297, "global_step": 351001, "epoch": 2089} {"train_loss": -12.421857833862305, "global_step": 351002, "epoch": 2089} {"train_loss": -11.823319435119629, "global_step": 351003, "epoch": 2089} {"train_loss": -11.980040550231934, "global_step": 351004, "epoch": 2089} {"train_loss": -11.846857070922852, "global_step": 351005, "epoch": 2089} {"train_loss": -11.640079498291016, "global_step": 351006, "epoch": 2089} {"train_loss": -12.29133415222168, "global_step": 351007, "epoch": 2089} {"train_loss": -11.581521034240723, "global_step": 351008, "epoch": 2089} {"train_loss": -11.998909950256348, "global_step": 351009, "epoch": 2089} {"train_loss": -11.958641052246094, "global_step": 351010, "epoch": 2089} {"train_loss": -11.646970748901367, "global_step": 351011, "epoch": 2089} {"train_loss": -11.967679977416992, "global_step": 351012, "epoch": 2089} {"train_loss": -11.997476577758789, "global_step": 351013, "epoch": 2089} {"train_loss": -12.101152420043945, "global_step": 351014, "epoch": 2089} {"train_loss": -11.780704498291016, "global_step": 351015, "epoch": 2089} {"train_loss": -12.08788013458252, "global_step": 351016, "epoch": 2089} {"train_loss": -11.745306015014648, "global_step": 351017, "epoch": 2089} {"train_loss": -12.233373641967773, "global_step": 351018, "epoch": 2089} {"train_loss": -11.516426086425781, "global_step": 351019, "epoch": 2089} {"train_loss": -12.509721755981445, "global_step": 351020, "epoch": 2089} {"train_loss": -12.069502830505371, "global_step": 351021, "epoch": 2089} {"train_loss": -12.192801475524902, "global_step": 351022, "epoch": 2089} {"train_loss": -11.777942657470703, "global_step": 351023, "epoch": 2089} {"train_loss": -11.892471313476562, "global_step": 351024, "epoch": 2089} {"train_loss": -12.097114562988281, "global_step": 351025, "epoch": 2089} {"train_loss": -12.333609580993652, "global_step": 351026, "epoch": 2089} {"train_loss": -12.146653175354004, "global_step": 351027, "epoch": 2089} {"train_loss": -12.383459091186523, "global_step": 351028, "epoch": 2089} {"train_loss": -11.780024528503418, "global_step": 351029, "epoch": 2089} {"train_loss": -11.434581756591797, "global_step": 351030, "epoch": 2089} {"train_loss": -12.349088668823242, "global_step": 351031, "epoch": 2089} {"train_loss": -11.64095401763916, "global_step": 351032, "epoch": 2089} {"train_loss": -11.799554824829102, "global_step": 351033, "epoch": 2089} {"train_loss": -12.387813568115234, "global_step": 351034, "epoch": 2089} {"train_loss": -11.560281753540039, "global_step": 351035, "epoch": 2089} {"train_loss": -12.171056747436523, "global_step": 351036, "epoch": 2089} {"train_loss": -11.868698120117188, "global_step": 351037, "epoch": 2089} {"train_loss": -12.157424926757812, "global_step": 351038, "epoch": 2089} {"train_loss": -12.230621337890625, "global_step": 351039, "epoch": 2089} {"train_loss": -12.328657150268555, "global_step": 351040, "epoch": 2089} {"train_loss": -12.174789428710938, "global_step": 351041, "epoch": 2089} {"train_loss": -12.181909561157227, "global_step": 351042, "epoch": 2089} {"train_loss": -12.438324928283691, "global_step": 351043, "epoch": 2089} {"train_loss": -11.957801818847656, "global_step": 351044, "epoch": 2089} {"train_loss": -12.381978988647461, "global_step": 351045, "epoch": 2089} {"train_loss": -12.25442123413086, "global_step": 351046, "epoch": 2089} {"train_loss": -12.263775825500488, "global_step": 351047, "epoch": 2089} {"train_loss": -12.1904296875, "global_step": 351048, "epoch": 2089} {"train_loss": -12.411783218383789, "global_step": 351049, "epoch": 2089} {"train_loss": -12.282401084899902, "global_step": 351050, "epoch": 2089} {"train_loss": -12.400053024291992, "global_step": 351051, "epoch": 2089} {"train_loss": -12.365083694458008, "global_step": 351052, "epoch": 2089} {"train_loss": -12.311930656433105, "global_step": 351053, "epoch": 2089} {"train_loss": -12.317193031311035, "global_step": 351054, "epoch": 2089} {"train_loss": -11.884760856628418, "global_step": 351055, "epoch": 2089} {"train_loss": -12.384918212890625, "global_step": 351056, "epoch": 2089} {"train_loss": -12.183544158935547, "global_step": 351057, "epoch": 2089} {"train_loss": -11.61747932434082, "global_step": 351058, "epoch": 2089} {"train_loss": -12.450090408325195, "global_step": 351059, "epoch": 2089} {"train_loss": -12.268909454345703, "global_step": 351060, "epoch": 2089} {"train_loss": -12.407238006591797, "global_step": 351061, "epoch": 2089} {"train_loss": -12.274679183959961, "global_step": 351062, "epoch": 2089} {"train_loss": -11.959111213684082, "global_step": 351063, "epoch": 2089} {"train_loss": -12.363441467285156, "global_step": 351064, "epoch": 2089} {"train_loss": -12.376379013061523, "global_step": 351065, "epoch": 2089} {"train_loss": -11.753446578979492, "global_step": 351066, "epoch": 2089} {"train_loss": -11.788219451904297, "global_step": 351067, "epoch": 2089} {"train_loss": -12.253057479858398, "global_step": 351068, "epoch": 2089} {"train_loss": -11.152656555175781, "global_step": 351069, "epoch": 2089} {"train_loss": -10.924652099609375, "global_step": 351070, "epoch": 2089} {"train_loss": -10.930135726928711, "global_step": 351071, "epoch": 2089} {"train_loss": -10.621614456176758, "global_step": 351072, "epoch": 2089} {"train_loss": -11.138410568237305, "global_step": 351073, "epoch": 2089} {"train_loss": -10.908952713012695, "global_step": 351074, "epoch": 2089} {"train_loss": -11.13978385925293, "global_step": 351075, "epoch": 2089} {"train_loss": -11.366039276123047, "global_step": 351076, "epoch": 2089} {"train_loss": -10.9268798828125, "global_step": 351077, "epoch": 2089} {"train_loss": -12.111614227294922, "global_step": 351078, "epoch": 2089} {"train_loss": -10.139200210571289, "global_step": 351079, "epoch": 2089} {"train_loss": -11.987508773803711, "global_step": 351080, "epoch": 2089} {"train_loss": -10.235174179077148, "global_step": 351081, "epoch": 2089} {"train_loss": -11.130330085754395, "global_step": 351082, "epoch": 2089} {"train_loss": -11.294933319091797, "global_step": 351083, "epoch": 2089} {"train_loss": -11.307851791381836, "global_step": 351084, "epoch": 2089} {"train_loss": -12.060286521911621, "global_step": 351085, "epoch": 2089} {"train_loss": -11.571050643920898, "global_step": 351086, "epoch": 2089} {"train_loss": -11.518341064453125, "global_step": 351087, "epoch": 2089} {"train_loss": -11.173900604248047, "global_step": 351088, "epoch": 2089} {"train_loss": -11.24455738067627, "global_step": 351089, "epoch": 2089} {"train_loss": -11.569061279296875, "global_step": 351090, "epoch": 2089} {"train_loss": -11.19028091430664, "global_step": 351091, "epoch": 2089} {"train_loss": -11.106327056884766, "global_step": 351092, "epoch": 2089} {"train_loss": -12.008426666259766, "global_step": 351093, "epoch": 2089} {"train_loss": -10.904948234558105, "global_step": 351094, "epoch": 2089} {"train_loss": -12.11723518371582, "global_step": 351095, "epoch": 2089} {"train_loss": -10.78765869140625, "global_step": 351096, "epoch": 2089} {"train_loss": -11.96735954284668, "global_step": 351097, "epoch": 2089} {"train_loss": -11.27461051940918, "global_step": 351098, "epoch": 2089} {"train_loss": -11.706353187561035, "global_step": 351099, "epoch": 2089} {"train_loss": -11.730218887329102, "global_step": 351100, "epoch": 2089} {"train_loss": -11.150508880615234, "global_step": 351101, "epoch": 2089} {"train_loss": -12.002588272094727, "global_step": 351102, "epoch": 2089} {"train_loss": -11.874632835388184, "global_step": 351103, "epoch": 2089} {"train_loss": -11.88484001159668, "global_step": 351104, "epoch": 2089} {"train_loss": -11.47705364227295, "global_step": 351105, "epoch": 2089} {"train_loss": -11.76845932006836, "global_step": 351106, "epoch": 2089} {"train_loss": -11.898167610168457, "global_step": 351107, "epoch": 2089} {"train_loss": -11.73771858215332, "global_step": 351108, "epoch": 2089} {"train_loss": -11.863018989562988, "global_step": 351109, "epoch": 2089} {"train_loss": -11.835002899169922, "global_step": 351110, "epoch": 2089} {"train_loss": -12.114110946655273, "global_step": 351111, "epoch": 2089} {"train_loss": -12.102293014526367, "global_step": 351112, "epoch": 2089} {"train_loss": -12.144803047180176, "global_step": 351113, "epoch": 2089} {"train_loss": -11.939329147338867, "global_step": 351114, "epoch": 2089} {"train_loss": -12.219736099243164, "global_step": 351115, "epoch": 2089} {"train_loss": -12.048761367797852, "global_step": 351116, "epoch": 2089} {"train_loss": -11.876347541809082, "global_step": 351117, "epoch": 2089} {"train_loss": -11.808197021484375, "global_step": 351118, "epoch": 2089} {"train_loss": -11.743960301081339, "global_step": 351119, "epoch": 2089, "val_loss": 289941.40625} {"train_loss": -11.828967094421387, "global_step": 351120, "epoch": 2090} {"train_loss": -11.65626335144043, "global_step": 351121, "epoch": 2090} {"train_loss": -11.20458984375, "global_step": 351122, "epoch": 2090} {"train_loss": -11.942612648010254, "global_step": 351123, "epoch": 2090} {"train_loss": -11.562875747680664, "global_step": 351124, "epoch": 2090} {"train_loss": -12.038949966430664, "global_step": 351125, "epoch": 2090} {"train_loss": -12.183775901794434, "global_step": 351126, "epoch": 2090} {"train_loss": -11.984973907470703, "global_step": 351127, "epoch": 2090} {"train_loss": -12.121524810791016, "global_step": 351128, "epoch": 2090} {"train_loss": -12.091473579406738, "global_step": 351129, "epoch": 2090} {"train_loss": -12.185683250427246, "global_step": 351130, "epoch": 2090} {"train_loss": -12.246105194091797, "global_step": 351131, "epoch": 2090} {"train_loss": -12.24756145477295, "global_step": 351132, "epoch": 2090} {"train_loss": -12.451252937316895, "global_step": 351133, "epoch": 2090} {"train_loss": -12.360252380371094, "global_step": 351134, "epoch": 2090} {"train_loss": -12.122007369995117, "global_step": 351135, "epoch": 2090} {"train_loss": -12.364944458007812, "global_step": 351136, "epoch": 2090} {"train_loss": -12.185230255126953, "global_step": 351137, "epoch": 2090} {"train_loss": -12.375513076782227, "global_step": 351138, "epoch": 2090} {"train_loss": -12.089786529541016, "global_step": 351139, "epoch": 2090} {"train_loss": -12.444510459899902, "global_step": 351140, "epoch": 2090} {"train_loss": -12.326542854309082, "global_step": 351141, "epoch": 2090} {"train_loss": -12.23564338684082, "global_step": 351142, "epoch": 2090} {"train_loss": -11.962970733642578, "global_step": 351143, "epoch": 2090} {"train_loss": -12.155494689941406, "global_step": 351144, "epoch": 2090} {"train_loss": -12.338168144226074, "global_step": 351145, "epoch": 2090} {"train_loss": -11.975032806396484, "global_step": 351146, "epoch": 2090} {"train_loss": -12.32205581665039, "global_step": 351147, "epoch": 2090} {"train_loss": -11.982215881347656, "global_step": 351148, "epoch": 2090} {"train_loss": -12.134488105773926, "global_step": 351149, "epoch": 2090} {"train_loss": -12.232053756713867, "global_step": 351150, "epoch": 2090} {"train_loss": -11.740927696228027, "global_step": 351151, "epoch": 2090} {"train_loss": -12.601923942565918, "global_step": 351152, "epoch": 2090} {"train_loss": -11.98690414428711, "global_step": 351153, "epoch": 2090} {"train_loss": -12.440448760986328, "global_step": 351154, "epoch": 2090} {"train_loss": -11.969474792480469, "global_step": 351155, "epoch": 2090} {"train_loss": -12.261943817138672, "global_step": 351156, "epoch": 2090} {"train_loss": -12.157981872558594, "global_step": 351157, "epoch": 2090} {"train_loss": -11.954118728637695, "global_step": 351158, "epoch": 2090} {"train_loss": -12.564857482910156, "global_step": 351159, "epoch": 2090} {"train_loss": -12.390562057495117, "global_step": 351160, "epoch": 2090} {"train_loss": -12.4494047164917, "global_step": 351161, "epoch": 2090} {"train_loss": -12.403366088867188, "global_step": 351162, "epoch": 2090} {"train_loss": -12.579334259033203, "global_step": 351163, "epoch": 2090} {"train_loss": -12.279928207397461, "global_step": 351164, "epoch": 2090} {"train_loss": -12.331707954406738, "global_step": 351165, "epoch": 2090} {"train_loss": -12.251229286193848, "global_step": 351166, "epoch": 2090} {"train_loss": -12.449600219726562, "global_step": 351167, "epoch": 2090} {"train_loss": -12.479114532470703, "global_step": 351168, "epoch": 2090} {"train_loss": -12.221137046813965, "global_step": 351169, "epoch": 2090} {"train_loss": -12.272300720214844, "global_step": 351170, "epoch": 2090} {"train_loss": -12.315616607666016, "global_step": 351171, "epoch": 2090} {"train_loss": -12.204875946044922, "global_step": 351172, "epoch": 2090} {"train_loss": -12.095373153686523, "global_step": 351173, "epoch": 2090} {"train_loss": -12.098398208618164, "global_step": 351174, "epoch": 2090} {"train_loss": -12.233485221862793, "global_step": 351175, "epoch": 2090} {"train_loss": -12.216594696044922, "global_step": 351176, "epoch": 2090} {"train_loss": -11.815000534057617, "global_step": 351177, "epoch": 2090} {"train_loss": -11.61506462097168, "global_step": 351178, "epoch": 2090} {"train_loss": -11.24296760559082, "global_step": 351179, "epoch": 2090} {"train_loss": -10.288543701171875, "global_step": 351180, "epoch": 2090} {"train_loss": -12.164068222045898, "global_step": 351181, "epoch": 2090} {"train_loss": -10.557636260986328, "global_step": 351182, "epoch": 2090} {"train_loss": -11.180416107177734, "global_step": 351183, "epoch": 2090} {"train_loss": -11.574016571044922, "global_step": 351184, "epoch": 2090} {"train_loss": -9.931251525878906, "global_step": 351185, "epoch": 2090} {"train_loss": -11.856249809265137, "global_step": 351186, "epoch": 2090} {"train_loss": -10.97953987121582, "global_step": 351187, "epoch": 2090} {"train_loss": -11.738996505737305, "global_step": 351188, "epoch": 2090} {"train_loss": -11.984926223754883, "global_step": 351189, "epoch": 2090} {"train_loss": -12.022093772888184, "global_step": 351190, "epoch": 2090} {"train_loss": -11.79626750946045, "global_step": 351191, "epoch": 2090} {"train_loss": -11.932720184326172, "global_step": 351192, "epoch": 2090} {"train_loss": -11.787887573242188, "global_step": 351193, "epoch": 2090} {"train_loss": -12.05905532836914, "global_step": 351194, "epoch": 2090} {"train_loss": -12.339338302612305, "global_step": 351195, "epoch": 2090} {"train_loss": -12.06606674194336, "global_step": 351196, "epoch": 2090} {"train_loss": -11.914649963378906, "global_step": 351197, "epoch": 2090} {"train_loss": -12.048471450805664, "global_step": 351198, "epoch": 2090} {"train_loss": -11.998489379882812, "global_step": 351199, "epoch": 2090} {"train_loss": -12.059333801269531, "global_step": 351200, "epoch": 2090} {"train_loss": -12.241925239562988, "global_step": 351201, "epoch": 2090} {"train_loss": -12.212836265563965, "global_step": 351202, "epoch": 2090} {"train_loss": -11.88359546661377, "global_step": 351203, "epoch": 2090} {"train_loss": -12.234414100646973, "global_step": 351204, "epoch": 2090} {"train_loss": -12.184433937072754, "global_step": 351205, "epoch": 2090} {"train_loss": -12.444482803344727, "global_step": 351206, "epoch": 2090} {"train_loss": -12.308019638061523, "global_step": 351207, "epoch": 2090} {"train_loss": -12.46546459197998, "global_step": 351208, "epoch": 2090} {"train_loss": -12.349283218383789, "global_step": 351209, "epoch": 2090} {"train_loss": -12.244733810424805, "global_step": 351210, "epoch": 2090} {"train_loss": -12.196109771728516, "global_step": 351211, "epoch": 2090} {"train_loss": -12.278938293457031, "global_step": 351212, "epoch": 2090} {"train_loss": -12.429269790649414, "global_step": 351213, "epoch": 2090} {"train_loss": -12.601095199584961, "global_step": 351214, "epoch": 2090} {"train_loss": -12.277176856994629, "global_step": 351215, "epoch": 2090} {"train_loss": -12.270027160644531, "global_step": 351216, "epoch": 2090} {"train_loss": -12.1915922164917, "global_step": 351217, "epoch": 2090} {"train_loss": -12.167665481567383, "global_step": 351218, "epoch": 2090} {"train_loss": -12.44093132019043, "global_step": 351219, "epoch": 2090} {"train_loss": -12.30228042602539, "global_step": 351220, "epoch": 2090} {"train_loss": -12.039052963256836, "global_step": 351221, "epoch": 2090} {"train_loss": -12.196187973022461, "global_step": 351222, "epoch": 2090} {"train_loss": -12.364839553833008, "global_step": 351223, "epoch": 2090} {"train_loss": -12.427757263183594, "global_step": 351224, "epoch": 2090} {"train_loss": -12.092446327209473, "global_step": 351225, "epoch": 2090} {"train_loss": -12.360841751098633, "global_step": 351226, "epoch": 2090} {"train_loss": -12.497529983520508, "global_step": 351227, "epoch": 2090} {"train_loss": -12.088680267333984, "global_step": 351228, "epoch": 2090} {"train_loss": -12.576749801635742, "global_step": 351229, "epoch": 2090} {"train_loss": -12.342348098754883, "global_step": 351230, "epoch": 2090} {"train_loss": -12.620138168334961, "global_step": 351231, "epoch": 2090} {"train_loss": -12.175350189208984, "global_step": 351232, "epoch": 2090} {"train_loss": -12.507543563842773, "global_step": 351233, "epoch": 2090} {"train_loss": -12.346107482910156, "global_step": 351234, "epoch": 2090} {"train_loss": -12.38885498046875, "global_step": 351235, "epoch": 2090} {"train_loss": -12.58950138092041, "global_step": 351236, "epoch": 2090} {"train_loss": -12.380067825317383, "global_step": 351237, "epoch": 2090} {"train_loss": -12.36680793762207, "global_step": 351238, "epoch": 2090} {"train_loss": -12.434328079223633, "global_step": 351239, "epoch": 2090} {"train_loss": -12.618175506591797, "global_step": 351240, "epoch": 2090} {"train_loss": -12.328100204467773, "global_step": 351241, "epoch": 2090} {"train_loss": -12.15319538116455, "global_step": 351242, "epoch": 2090} {"train_loss": -11.8489990234375, "global_step": 351243, "epoch": 2090} {"train_loss": -12.714345932006836, "global_step": 351244, "epoch": 2090} {"train_loss": -12.049585342407227, "global_step": 351245, "epoch": 2090} {"train_loss": -12.05321216583252, "global_step": 351246, "epoch": 2090} {"train_loss": -12.415090560913086, "global_step": 351247, "epoch": 2090} {"train_loss": -12.704780578613281, "global_step": 351248, "epoch": 2090} {"train_loss": -12.167881965637207, "global_step": 351249, "epoch": 2090} {"train_loss": -12.348944664001465, "global_step": 351250, "epoch": 2090} {"train_loss": -12.812355041503906, "global_step": 351251, "epoch": 2090} {"train_loss": -12.555505752563477, "global_step": 351252, "epoch": 2090} {"train_loss": -12.134552001953125, "global_step": 351253, "epoch": 2090} {"train_loss": -12.638520240783691, "global_step": 351254, "epoch": 2090} {"train_loss": -12.586813926696777, "global_step": 351255, "epoch": 2090} {"train_loss": -12.440006256103516, "global_step": 351256, "epoch": 2090} {"train_loss": -12.55858039855957, "global_step": 351257, "epoch": 2090} {"train_loss": -12.413660049438477, "global_step": 351258, "epoch": 2090} {"train_loss": -12.277776718139648, "global_step": 351259, "epoch": 2090} {"train_loss": -12.070601463317871, "global_step": 351260, "epoch": 2090} {"train_loss": -12.322938919067383, "global_step": 351261, "epoch": 2090} {"train_loss": -12.495820999145508, "global_step": 351262, "epoch": 2090} {"train_loss": -12.255247116088867, "global_step": 351263, "epoch": 2090} {"train_loss": -12.543642044067383, "global_step": 351264, "epoch": 2090} {"train_loss": -12.260063171386719, "global_step": 351265, "epoch": 2090} {"train_loss": -12.261524200439453, "global_step": 351266, "epoch": 2090} {"train_loss": -11.946645736694336, "global_step": 351267, "epoch": 2090} {"train_loss": -12.266287803649902, "global_step": 351268, "epoch": 2090} {"train_loss": -11.89089584350586, "global_step": 351269, "epoch": 2090} {"train_loss": -12.023458480834961, "global_step": 351270, "epoch": 2090} {"train_loss": -10.340022087097168, "global_step": 351271, "epoch": 2090} {"train_loss": -11.313149452209473, "global_step": 351272, "epoch": 2090} {"train_loss": -12.0186185836792, "global_step": 351273, "epoch": 2090} {"train_loss": -11.388011932373047, "global_step": 351274, "epoch": 2090} {"train_loss": -11.393644332885742, "global_step": 351275, "epoch": 2090} {"train_loss": -11.28108024597168, "global_step": 351276, "epoch": 2090} {"train_loss": -9.180590629577637, "global_step": 351277, "epoch": 2090} {"train_loss": -9.306294441223145, "global_step": 351278, "epoch": 2090} {"train_loss": -10.6307373046875, "global_step": 351279, "epoch": 2090} {"train_loss": -9.009695053100586, "global_step": 351280, "epoch": 2090} {"train_loss": -9.669071197509766, "global_step": 351281, "epoch": 2090} {"train_loss": -9.88995361328125, "global_step": 351282, "epoch": 2090} {"train_loss": -11.402267456054688, "global_step": 351283, "epoch": 2090} {"train_loss": -9.866085052490234, "global_step": 351284, "epoch": 2090} {"train_loss": -11.02238941192627, "global_step": 351285, "epoch": 2090} {"train_loss": -11.212641716003418, "global_step": 351286, "epoch": 2090} {"train_loss": -11.992134974116372, "global_step": 351287, "epoch": 2090, "val_loss": 284679.25, "train_action_mse_error": 2.076960802078247} {"train_loss": -11.677528381347656, "global_step": 351288, "epoch": 2091} {"train_loss": -10.86859130859375, "global_step": 351289, "epoch": 2091} {"train_loss": -11.767152786254883, "global_step": 351290, "epoch": 2091} {"train_loss": -11.024224281311035, "global_step": 351291, "epoch": 2091} {"train_loss": -10.848939895629883, "global_step": 351292, "epoch": 2091} {"train_loss": -11.674376487731934, "global_step": 351293, "epoch": 2091} {"train_loss": -11.517766952514648, "global_step": 351294, "epoch": 2091} {"train_loss": -11.304152488708496, "global_step": 351295, "epoch": 2091} {"train_loss": -12.078147888183594, "global_step": 351296, "epoch": 2091} {"train_loss": -11.166397094726562, "global_step": 351297, "epoch": 2091} {"train_loss": -11.667854309082031, "global_step": 351298, "epoch": 2091} {"train_loss": -11.901629447937012, "global_step": 351299, "epoch": 2091} {"train_loss": -10.907877922058105, "global_step": 351300, "epoch": 2091} {"train_loss": -11.964113235473633, "global_step": 351301, "epoch": 2091} {"train_loss": -11.63045883178711, "global_step": 351302, "epoch": 2091} {"train_loss": -11.644542694091797, "global_step": 351303, "epoch": 2091} {"train_loss": -11.412763595581055, "global_step": 351304, "epoch": 2091} {"train_loss": -11.633907318115234, "global_step": 351305, "epoch": 2091} {"train_loss": -12.021329879760742, "global_step": 351306, "epoch": 2091} {"train_loss": -11.803260803222656, "global_step": 351307, "epoch": 2091} {"train_loss": -12.183609008789062, "global_step": 351308, "epoch": 2091} {"train_loss": -11.879413604736328, "global_step": 351309, "epoch": 2091} {"train_loss": -11.333730697631836, "global_step": 351310, "epoch": 2091} {"train_loss": -11.764983177185059, "global_step": 351311, "epoch": 2091} {"train_loss": -11.226541519165039, "global_step": 351312, "epoch": 2091} {"train_loss": -11.867313385009766, "global_step": 351313, "epoch": 2091} {"train_loss": -11.737297058105469, "global_step": 351314, "epoch": 2091} {"train_loss": -12.175277709960938, "global_step": 351315, "epoch": 2091} {"train_loss": -11.696099281311035, "global_step": 351316, "epoch": 2091} {"train_loss": -12.198814392089844, "global_step": 351317, "epoch": 2091} {"train_loss": -12.020379066467285, "global_step": 351318, "epoch": 2091} {"train_loss": -11.968853950500488, "global_step": 351319, "epoch": 2091} {"train_loss": -12.379528045654297, "global_step": 351320, "epoch": 2091} {"train_loss": -12.052654266357422, "global_step": 351321, "epoch": 2091} {"train_loss": -12.094392776489258, "global_step": 351322, "epoch": 2091} {"train_loss": -12.124226570129395, "global_step": 351323, "epoch": 2091} {"train_loss": -11.812494277954102, "global_step": 351324, "epoch": 2091} {"train_loss": -12.209999084472656, "global_step": 351325, "epoch": 2091} {"train_loss": -12.054449081420898, "global_step": 351326, "epoch": 2091} {"train_loss": -12.189973831176758, "global_step": 351327, "epoch": 2091} {"train_loss": -12.309181213378906, "global_step": 351328, "epoch": 2091} {"train_loss": -12.023446083068848, "global_step": 351329, "epoch": 2091} {"train_loss": -12.388628005981445, "global_step": 351330, "epoch": 2091} {"train_loss": -12.146992683410645, "global_step": 351331, "epoch": 2091} {"train_loss": -12.25695514678955, "global_step": 351332, "epoch": 2091} {"train_loss": -12.09841537475586, "global_step": 351333, "epoch": 2091} {"train_loss": -12.400114059448242, "global_step": 351334, "epoch": 2091} {"train_loss": -12.397539138793945, "global_step": 351335, "epoch": 2091} {"train_loss": -12.09701156616211, "global_step": 351336, "epoch": 2091} {"train_loss": -12.507534980773926, "global_step": 351337, "epoch": 2091} {"train_loss": -11.913288116455078, "global_step": 351338, "epoch": 2091} {"train_loss": -12.219539642333984, "global_step": 351339, "epoch": 2091} {"train_loss": -12.297279357910156, "global_step": 351340, "epoch": 2091} {"train_loss": -12.186771392822266, "global_step": 351341, "epoch": 2091} {"train_loss": -12.300363540649414, "global_step": 351342, "epoch": 2091} {"train_loss": -12.089673042297363, "global_step": 351343, "epoch": 2091} {"train_loss": -12.415621757507324, "global_step": 351344, "epoch": 2091} {"train_loss": -12.158870697021484, "global_step": 351345, "epoch": 2091} {"train_loss": -12.413509368896484, "global_step": 351346, "epoch": 2091} {"train_loss": -12.615671157836914, "global_step": 351347, "epoch": 2091} {"train_loss": -12.521013259887695, "global_step": 351348, "epoch": 2091} {"train_loss": -12.42238998413086, "global_step": 351349, "epoch": 2091} {"train_loss": -12.55073356628418, "global_step": 351350, "epoch": 2091} {"train_loss": -12.284994125366211, "global_step": 351351, "epoch": 2091} {"train_loss": -12.315616607666016, "global_step": 351352, "epoch": 2091} {"train_loss": -12.377763748168945, "global_step": 351353, "epoch": 2091} {"train_loss": -12.678424835205078, "global_step": 351354, "epoch": 2091} {"train_loss": -12.29684829711914, "global_step": 351355, "epoch": 2091} {"train_loss": -12.524913787841797, "global_step": 351356, "epoch": 2091} {"train_loss": -12.553881645202637, "global_step": 351357, "epoch": 2091} {"train_loss": -12.721758842468262, "global_step": 351358, "epoch": 2091} {"train_loss": -12.433246612548828, "global_step": 351359, "epoch": 2091} {"train_loss": -12.522634506225586, "global_step": 351360, "epoch": 2091} {"train_loss": -12.188066482543945, "global_step": 351361, "epoch": 2091} {"train_loss": -12.414864540100098, "global_step": 351362, "epoch": 2091} {"train_loss": -12.207560539245605, "global_step": 351363, "epoch": 2091} {"train_loss": -11.934747695922852, "global_step": 351364, "epoch": 2091} {"train_loss": -12.177148818969727, "global_step": 351365, "epoch": 2091} {"train_loss": -12.126476287841797, "global_step": 351366, "epoch": 2091} {"train_loss": -12.233297348022461, "global_step": 351367, "epoch": 2091} {"train_loss": -11.967470169067383, "global_step": 351368, "epoch": 2091} {"train_loss": -12.44727897644043, "global_step": 351369, "epoch": 2091} {"train_loss": -11.783029556274414, "global_step": 351370, "epoch": 2091} {"train_loss": -12.220014572143555, "global_step": 351371, "epoch": 2091} {"train_loss": -11.44947624206543, "global_step": 351372, "epoch": 2091} {"train_loss": -11.966130256652832, "global_step": 351373, "epoch": 2091} {"train_loss": -12.309309005737305, "global_step": 351374, "epoch": 2091} {"train_loss": -12.122298240661621, "global_step": 351375, "epoch": 2091} {"train_loss": -11.390045166015625, "global_step": 351376, "epoch": 2091} {"train_loss": -12.159208297729492, "global_step": 351377, "epoch": 2091} {"train_loss": -12.14154052734375, "global_step": 351378, "epoch": 2091} {"train_loss": -11.700521469116211, "global_step": 351379, "epoch": 2091} {"train_loss": -11.776656150817871, "global_step": 351380, "epoch": 2091} {"train_loss": -12.210269927978516, "global_step": 351381, "epoch": 2091} {"train_loss": -12.086559295654297, "global_step": 351382, "epoch": 2091} {"train_loss": -12.254536628723145, "global_step": 351383, "epoch": 2091} {"train_loss": -12.500432968139648, "global_step": 351384, "epoch": 2091} {"train_loss": -12.492502212524414, "global_step": 351385, "epoch": 2091} {"train_loss": -12.396368980407715, "global_step": 351386, "epoch": 2091} {"train_loss": -12.182113647460938, "global_step": 351387, "epoch": 2091} {"train_loss": -12.463396072387695, "global_step": 351388, "epoch": 2091} {"train_loss": -12.08718204498291, "global_step": 351389, "epoch": 2091} {"train_loss": -12.379464149475098, "global_step": 351390, "epoch": 2091} {"train_loss": -12.45152759552002, "global_step": 351391, "epoch": 2091} {"train_loss": -12.480154037475586, "global_step": 351392, "epoch": 2091} {"train_loss": -12.46377182006836, "global_step": 351393, "epoch": 2091} {"train_loss": -12.452221870422363, "global_step": 351394, "epoch": 2091} {"train_loss": -12.4564790725708, "global_step": 351395, "epoch": 2091} {"train_loss": -12.182955741882324, "global_step": 351396, "epoch": 2091} {"train_loss": -12.430362701416016, "global_step": 351397, "epoch": 2091} {"train_loss": -12.44703483581543, "global_step": 351398, "epoch": 2091} {"train_loss": -12.493873596191406, "global_step": 351399, "epoch": 2091} {"train_loss": -12.465677261352539, "global_step": 351400, "epoch": 2091} {"train_loss": -12.210339546203613, "global_step": 351401, "epoch": 2091} {"train_loss": -12.371223449707031, "global_step": 351402, "epoch": 2091} {"train_loss": -12.70097541809082, "global_step": 351403, "epoch": 2091} {"train_loss": -12.146449089050293, "global_step": 351404, "epoch": 2091} {"train_loss": -12.300286293029785, "global_step": 351405, "epoch": 2091} {"train_loss": -12.449317932128906, "global_step": 351406, "epoch": 2091} {"train_loss": -12.348339080810547, "global_step": 351407, "epoch": 2091} {"train_loss": -11.394479751586914, "global_step": 351408, "epoch": 2091} {"train_loss": -12.587480545043945, "global_step": 351409, "epoch": 2091} {"train_loss": -12.22104549407959, "global_step": 351410, "epoch": 2091} {"train_loss": -12.072760581970215, "global_step": 351411, "epoch": 2091} {"train_loss": -12.072647094726562, "global_step": 351412, "epoch": 2091} {"train_loss": -12.35389518737793, "global_step": 351413, "epoch": 2091} {"train_loss": -12.270284652709961, "global_step": 351414, "epoch": 2091} {"train_loss": -12.314897537231445, "global_step": 351415, "epoch": 2091} {"train_loss": -12.30058479309082, "global_step": 351416, "epoch": 2091} {"train_loss": -11.890800476074219, "global_step": 351417, "epoch": 2091} {"train_loss": -12.470123291015625, "global_step": 351418, "epoch": 2091} {"train_loss": -12.17990493774414, "global_step": 351419, "epoch": 2091} {"train_loss": -12.026769638061523, "global_step": 351420, "epoch": 2091} {"train_loss": -12.236724853515625, "global_step": 351421, "epoch": 2091} {"train_loss": -12.054265022277832, "global_step": 351422, "epoch": 2091} {"train_loss": -11.806936264038086, "global_step": 351423, "epoch": 2091} {"train_loss": -11.996678352355957, "global_step": 351424, "epoch": 2091} {"train_loss": -11.511667251586914, "global_step": 351425, "epoch": 2091} {"train_loss": -10.671608924865723, "global_step": 351426, "epoch": 2091} {"train_loss": -11.777328491210938, "global_step": 351427, "epoch": 2091} {"train_loss": -12.090065002441406, "global_step": 351428, "epoch": 2091} {"train_loss": -10.89657974243164, "global_step": 351429, "epoch": 2091} {"train_loss": -10.861478805541992, "global_step": 351430, "epoch": 2091} {"train_loss": -11.568782806396484, "global_step": 351431, "epoch": 2091} {"train_loss": -9.521499633789062, "global_step": 351432, "epoch": 2091} {"train_loss": -10.248376846313477, "global_step": 351433, "epoch": 2091} {"train_loss": -11.065604209899902, "global_step": 351434, "epoch": 2091} {"train_loss": -11.408208847045898, "global_step": 351435, "epoch": 2091} {"train_loss": -11.726354598999023, "global_step": 351436, "epoch": 2091} {"train_loss": -11.142478942871094, "global_step": 351437, "epoch": 2091} {"train_loss": -11.678152084350586, "global_step": 351438, "epoch": 2091} {"train_loss": -11.807408332824707, "global_step": 351439, "epoch": 2091} {"train_loss": -11.857318878173828, "global_step": 351440, "epoch": 2091} {"train_loss": -11.552743911743164, "global_step": 351441, "epoch": 2091} {"train_loss": -11.65146541595459, "global_step": 351442, "epoch": 2091} {"train_loss": -11.323921203613281, "global_step": 351443, "epoch": 2091} {"train_loss": -11.59251594543457, "global_step": 351444, "epoch": 2091} {"train_loss": -12.12915325164795, "global_step": 351445, "epoch": 2091} {"train_loss": -11.408926010131836, "global_step": 351446, "epoch": 2091} {"train_loss": -11.64629077911377, "global_step": 351447, "epoch": 2091} {"train_loss": -11.486330032348633, "global_step": 351448, "epoch": 2091} {"train_loss": -10.726520538330078, "global_step": 351449, "epoch": 2091} {"train_loss": -11.762872695922852, "global_step": 351450, "epoch": 2091} {"train_loss": -11.798898696899414, "global_step": 351451, "epoch": 2091} {"train_loss": -11.344757080078125, "global_step": 351452, "epoch": 2091} {"train_loss": -12.104572296142578, "global_step": 351453, "epoch": 2091} {"train_loss": -11.056160926818848, "global_step": 351454, "epoch": 2091} {"train_loss": -11.96691426209041, "global_step": 351455, "epoch": 2091, "val_loss": 289419.15625} {"train_loss": -11.767599105834961, "global_step": 351456, "epoch": 2092} {"train_loss": -11.005683898925781, "global_step": 351457, "epoch": 2092} {"train_loss": -11.438459396362305, "global_step": 351458, "epoch": 2092} {"train_loss": -11.021352767944336, "global_step": 351459, "epoch": 2092} {"train_loss": -9.951650619506836, "global_step": 351460, "epoch": 2092} {"train_loss": -11.035945892333984, "global_step": 351461, "epoch": 2092} {"train_loss": -10.169919967651367, "global_step": 351462, "epoch": 2092} {"train_loss": -10.73453140258789, "global_step": 351463, "epoch": 2092} {"train_loss": -11.209667205810547, "global_step": 351464, "epoch": 2092} {"train_loss": -9.794098854064941, "global_step": 351465, "epoch": 2092} {"train_loss": -11.00227165222168, "global_step": 351466, "epoch": 2092} {"train_loss": -9.088462829589844, "global_step": 351467, "epoch": 2092} {"train_loss": -10.165901184082031, "global_step": 351468, "epoch": 2092} {"train_loss": -10.274736404418945, "global_step": 351469, "epoch": 2092} {"train_loss": -10.707464218139648, "global_step": 351470, "epoch": 2092} {"train_loss": -9.97713851928711, "global_step": 351471, "epoch": 2092} {"train_loss": -11.280652046203613, "global_step": 351472, "epoch": 2092} {"train_loss": -10.610816955566406, "global_step": 351473, "epoch": 2092} {"train_loss": -10.622594833374023, "global_step": 351474, "epoch": 2092} {"train_loss": -10.591102600097656, "global_step": 351475, "epoch": 2092} {"train_loss": -11.359258651733398, "global_step": 351476, "epoch": 2092} {"train_loss": -10.17530632019043, "global_step": 351477, "epoch": 2092} {"train_loss": -11.56893539428711, "global_step": 351478, "epoch": 2092} {"train_loss": -11.290218353271484, "global_step": 351479, "epoch": 2092} {"train_loss": -11.150144577026367, "global_step": 351480, "epoch": 2092} {"train_loss": -11.960474014282227, "global_step": 351481, "epoch": 2092} {"train_loss": -10.963642120361328, "global_step": 351482, "epoch": 2092} {"train_loss": -11.431085586547852, "global_step": 351483, "epoch": 2092} {"train_loss": -11.39883804321289, "global_step": 351484, "epoch": 2092} {"train_loss": -11.145641326904297, "global_step": 351485, "epoch": 2092} {"train_loss": -11.452674865722656, "global_step": 351486, "epoch": 2092} {"train_loss": -11.554433822631836, "global_step": 351487, "epoch": 2092} {"train_loss": -11.409210205078125, "global_step": 351488, "epoch": 2092} {"train_loss": -11.700828552246094, "global_step": 351489, "epoch": 2092} {"train_loss": -11.88677978515625, "global_step": 351490, "epoch": 2092} {"train_loss": -11.495593070983887, "global_step": 351491, "epoch": 2092} {"train_loss": -11.885276794433594, "global_step": 351492, "epoch": 2092} {"train_loss": -11.452144622802734, "global_step": 351493, "epoch": 2092} {"train_loss": -12.093559265136719, "global_step": 351494, "epoch": 2092} {"train_loss": -11.583104133605957, "global_step": 351495, "epoch": 2092} {"train_loss": -11.390482902526855, "global_step": 351496, "epoch": 2092} {"train_loss": -12.027935028076172, "global_step": 351497, "epoch": 2092} {"train_loss": -11.644830703735352, "global_step": 351498, "epoch": 2092} {"train_loss": -11.692913055419922, "global_step": 351499, "epoch": 2092} {"train_loss": -11.908549308776855, "global_step": 351500, "epoch": 2092} {"train_loss": -11.821934700012207, "global_step": 351501, "epoch": 2092} {"train_loss": -11.98454761505127, "global_step": 351502, "epoch": 2092} {"train_loss": -11.711978912353516, "global_step": 351503, "epoch": 2092} {"train_loss": -11.952288627624512, "global_step": 351504, "epoch": 2092} {"train_loss": -11.874659538269043, "global_step": 351505, "epoch": 2092} {"train_loss": -11.970257759094238, "global_step": 351506, "epoch": 2092} {"train_loss": -12.178762435913086, "global_step": 351507, "epoch": 2092} {"train_loss": -12.023259162902832, "global_step": 351508, "epoch": 2092} {"train_loss": -12.16220474243164, "global_step": 351509, "epoch": 2092} {"train_loss": -12.018240928649902, "global_step": 351510, "epoch": 2092} {"train_loss": -12.139995574951172, "global_step": 351511, "epoch": 2092} {"train_loss": -12.370132446289062, "global_step": 351512, "epoch": 2092} {"train_loss": -12.103385925292969, "global_step": 351513, "epoch": 2092} {"train_loss": -12.292435646057129, "global_step": 351514, "epoch": 2092} {"train_loss": -12.357711791992188, "global_step": 351515, "epoch": 2092} {"train_loss": -12.080846786499023, "global_step": 351516, "epoch": 2092} {"train_loss": -12.422964096069336, "global_step": 351517, "epoch": 2092} {"train_loss": -11.911909103393555, "global_step": 351518, "epoch": 2092} {"train_loss": -12.333768844604492, "global_step": 351519, "epoch": 2092} {"train_loss": -12.46296501159668, "global_step": 351520, "epoch": 2092} {"train_loss": -12.10937213897705, "global_step": 351521, "epoch": 2092} {"train_loss": -12.278504371643066, "global_step": 351522, "epoch": 2092} {"train_loss": -12.069046974182129, "global_step": 351523, "epoch": 2092} {"train_loss": -12.443428039550781, "global_step": 351524, "epoch": 2092} {"train_loss": -12.441648483276367, "global_step": 351525, "epoch": 2092} {"train_loss": -12.15134048461914, "global_step": 351526, "epoch": 2092} {"train_loss": -12.28294849395752, "global_step": 351527, "epoch": 2092} {"train_loss": -12.051423072814941, "global_step": 351528, "epoch": 2092} {"train_loss": -12.392579078674316, "global_step": 351529, "epoch": 2092} {"train_loss": -12.508735656738281, "global_step": 351530, "epoch": 2092} {"train_loss": -12.189021110534668, "global_step": 351531, "epoch": 2092} {"train_loss": -12.28095817565918, "global_step": 351532, "epoch": 2092} {"train_loss": -12.252933502197266, "global_step": 351533, "epoch": 2092} {"train_loss": -12.477191925048828, "global_step": 351534, "epoch": 2092} {"train_loss": -12.337724685668945, "global_step": 351535, "epoch": 2092} {"train_loss": -12.247997283935547, "global_step": 351536, "epoch": 2092} {"train_loss": -12.441643714904785, "global_step": 351537, "epoch": 2092} {"train_loss": -12.281959533691406, "global_step": 351538, "epoch": 2092} {"train_loss": -12.478473663330078, "global_step": 351539, "epoch": 2092} {"train_loss": -12.397174835205078, "global_step": 351540, "epoch": 2092} {"train_loss": -12.421367645263672, "global_step": 351541, "epoch": 2092} {"train_loss": -12.336201667785645, "global_step": 351542, "epoch": 2092} {"train_loss": -11.872421264648438, "global_step": 351543, "epoch": 2092} {"train_loss": -12.301159858703613, "global_step": 351544, "epoch": 2092} {"train_loss": -12.381985664367676, "global_step": 351545, "epoch": 2092} {"train_loss": -12.211797714233398, "global_step": 351546, "epoch": 2092} {"train_loss": -12.413318634033203, "global_step": 351547, "epoch": 2092} {"train_loss": -12.100284576416016, "global_step": 351548, "epoch": 2092} {"train_loss": -12.265081405639648, "global_step": 351549, "epoch": 2092} {"train_loss": -12.289348602294922, "global_step": 351550, "epoch": 2092} {"train_loss": -12.194086074829102, "global_step": 351551, "epoch": 2092} {"train_loss": -12.429422378540039, "global_step": 351552, "epoch": 2092} {"train_loss": -12.452987670898438, "global_step": 351553, "epoch": 2092} {"train_loss": -12.435107231140137, "global_step": 351554, "epoch": 2092} {"train_loss": -12.28834056854248, "global_step": 351555, "epoch": 2092} {"train_loss": -12.146256446838379, "global_step": 351556, "epoch": 2092} {"train_loss": -12.470636367797852, "global_step": 351557, "epoch": 2092} {"train_loss": -12.319944381713867, "global_step": 351558, "epoch": 2092} {"train_loss": -12.686620712280273, "global_step": 351559, "epoch": 2092} {"train_loss": -12.302658081054688, "global_step": 351560, "epoch": 2092} {"train_loss": -12.461780548095703, "global_step": 351561, "epoch": 2092} {"train_loss": -12.273565292358398, "global_step": 351562, "epoch": 2092} {"train_loss": -12.148505210876465, "global_step": 351563, "epoch": 2092} {"train_loss": -12.418048858642578, "global_step": 351564, "epoch": 2092} {"train_loss": -11.885482788085938, "global_step": 351565, "epoch": 2092} {"train_loss": -12.482719421386719, "global_step": 351566, "epoch": 2092} {"train_loss": -11.841195106506348, "global_step": 351567, "epoch": 2092} {"train_loss": -11.865213394165039, "global_step": 351568, "epoch": 2092} {"train_loss": -12.242332458496094, "global_step": 351569, "epoch": 2092} {"train_loss": -10.586736679077148, "global_step": 351570, "epoch": 2092} {"train_loss": -12.202615737915039, "global_step": 351571, "epoch": 2092} {"train_loss": -12.076131820678711, "global_step": 351572, "epoch": 2092} {"train_loss": -11.595311164855957, "global_step": 351573, "epoch": 2092} {"train_loss": -12.522151947021484, "global_step": 351574, "epoch": 2092} {"train_loss": -12.334830284118652, "global_step": 351575, "epoch": 2092} {"train_loss": -11.937887191772461, "global_step": 351576, "epoch": 2092} {"train_loss": -12.45425033569336, "global_step": 351577, "epoch": 2092} {"train_loss": -12.000373840332031, "global_step": 351578, "epoch": 2092} {"train_loss": -12.612090110778809, "global_step": 351579, "epoch": 2092} {"train_loss": -12.079747200012207, "global_step": 351580, "epoch": 2092} {"train_loss": -12.410083770751953, "global_step": 351581, "epoch": 2092} {"train_loss": -12.49760913848877, "global_step": 351582, "epoch": 2092} {"train_loss": -12.161097526550293, "global_step": 351583, "epoch": 2092} {"train_loss": -12.587964057922363, "global_step": 351584, "epoch": 2092} {"train_loss": -12.269147872924805, "global_step": 351585, "epoch": 2092} {"train_loss": -12.232590675354004, "global_step": 351586, "epoch": 2092} {"train_loss": -12.373723030090332, "global_step": 351587, "epoch": 2092} {"train_loss": -12.646656036376953, "global_step": 351588, "epoch": 2092} {"train_loss": -12.645794868469238, "global_step": 351589, "epoch": 2092} {"train_loss": -12.451863288879395, "global_step": 351590, "epoch": 2092} {"train_loss": -12.396493911743164, "global_step": 351591, "epoch": 2092} {"train_loss": -12.11181640625, "global_step": 351592, "epoch": 2092} {"train_loss": -12.578011512756348, "global_step": 351593, "epoch": 2092} {"train_loss": -12.217852592468262, "global_step": 351594, "epoch": 2092} {"train_loss": -12.34946060180664, "global_step": 351595, "epoch": 2092} {"train_loss": -12.510190963745117, "global_step": 351596, "epoch": 2092} {"train_loss": -11.807294845581055, "global_step": 351597, "epoch": 2092} {"train_loss": -11.950347900390625, "global_step": 351598, "epoch": 2092} {"train_loss": -12.359786987304688, "global_step": 351599, "epoch": 2092} {"train_loss": -11.466575622558594, "global_step": 351600, "epoch": 2092} {"train_loss": -11.764163970947266, "global_step": 351601, "epoch": 2092} {"train_loss": -11.951375007629395, "global_step": 351602, "epoch": 2092} {"train_loss": -11.206846237182617, "global_step": 351603, "epoch": 2092} {"train_loss": -12.15019416809082, "global_step": 351604, "epoch": 2092} {"train_loss": -9.97108268737793, "global_step": 351605, "epoch": 2092} {"train_loss": -11.16705322265625, "global_step": 351606, "epoch": 2092} {"train_loss": -11.09666633605957, "global_step": 351607, "epoch": 2092} {"train_loss": -11.41689682006836, "global_step": 351608, "epoch": 2092} {"train_loss": -10.179096221923828, "global_step": 351609, "epoch": 2092} {"train_loss": -12.00954532623291, "global_step": 351610, "epoch": 2092} {"train_loss": -11.163429260253906, "global_step": 351611, "epoch": 2092} {"train_loss": -11.847763061523438, "global_step": 351612, "epoch": 2092} {"train_loss": -11.183236122131348, "global_step": 351613, "epoch": 2092} {"train_loss": -12.081050872802734, "global_step": 351614, "epoch": 2092} {"train_loss": -11.371358871459961, "global_step": 351615, "epoch": 2092} {"train_loss": -11.685476303100586, "global_step": 351616, "epoch": 2092} {"train_loss": -10.564165115356445, "global_step": 351617, "epoch": 2092} {"train_loss": -11.28996753692627, "global_step": 351618, "epoch": 2092} {"train_loss": -11.928739547729492, "global_step": 351619, "epoch": 2092} {"train_loss": -11.04193115234375, "global_step": 351620, "epoch": 2092} {"train_loss": -11.861377716064453, "global_step": 351621, "epoch": 2092} {"train_loss": -11.072635650634766, "global_step": 351622, "epoch": 2092} {"train_loss": -11.8115504412424, "global_step": 351623, "epoch": 2092, "val_loss": 291099.78125} {"train_loss": -11.822019577026367, "global_step": 351624, "epoch": 2093} {"train_loss": -10.726476669311523, "global_step": 351625, "epoch": 2093} {"train_loss": -11.975912094116211, "global_step": 351626, "epoch": 2093} {"train_loss": -10.308717727661133, "global_step": 351627, "epoch": 2093} {"train_loss": -11.016955375671387, "global_step": 351628, "epoch": 2093} {"train_loss": -11.347868919372559, "global_step": 351629, "epoch": 2093} {"train_loss": -10.563457489013672, "global_step": 351630, "epoch": 2093} {"train_loss": -9.741641998291016, "global_step": 351631, "epoch": 2093} {"train_loss": -11.654508590698242, "global_step": 351632, "epoch": 2093} {"train_loss": -10.355243682861328, "global_step": 351633, "epoch": 2093} {"train_loss": -11.559881210327148, "global_step": 351634, "epoch": 2093} {"train_loss": -10.982208251953125, "global_step": 351635, "epoch": 2093} {"train_loss": -10.795745849609375, "global_step": 351636, "epoch": 2093} {"train_loss": -10.829015731811523, "global_step": 351637, "epoch": 2093} {"train_loss": -11.880685806274414, "global_step": 351638, "epoch": 2093} {"train_loss": -11.101099014282227, "global_step": 351639, "epoch": 2093} {"train_loss": -11.654050827026367, "global_step": 351640, "epoch": 2093} {"train_loss": -11.162772178649902, "global_step": 351641, "epoch": 2093} {"train_loss": -11.625608444213867, "global_step": 351642, "epoch": 2093} {"train_loss": -11.80849838256836, "global_step": 351643, "epoch": 2093} {"train_loss": -11.661821365356445, "global_step": 351644, "epoch": 2093} {"train_loss": -11.565644264221191, "global_step": 351645, "epoch": 2093} {"train_loss": -11.865339279174805, "global_step": 351646, "epoch": 2093} {"train_loss": -11.719404220581055, "global_step": 351647, "epoch": 2093} {"train_loss": -12.01866626739502, "global_step": 351648, "epoch": 2093} {"train_loss": -11.605724334716797, "global_step": 351649, "epoch": 2093} {"train_loss": -12.015619277954102, "global_step": 351650, "epoch": 2093} {"train_loss": -11.80005168914795, "global_step": 351651, "epoch": 2093} {"train_loss": -12.397022247314453, "global_step": 351652, "epoch": 2093} {"train_loss": -11.653096199035645, "global_step": 351653, "epoch": 2093} {"train_loss": -12.235271453857422, "global_step": 351654, "epoch": 2093} {"train_loss": -11.708253860473633, "global_step": 351655, "epoch": 2093} {"train_loss": -12.131808280944824, "global_step": 351656, "epoch": 2093} {"train_loss": -11.932915687561035, "global_step": 351657, "epoch": 2093} {"train_loss": -11.643404006958008, "global_step": 351658, "epoch": 2093} {"train_loss": -12.304661750793457, "global_step": 351659, "epoch": 2093} {"train_loss": -11.925779342651367, "global_step": 351660, "epoch": 2093} {"train_loss": -12.130388259887695, "global_step": 351661, "epoch": 2093} {"train_loss": -12.318535804748535, "global_step": 351662, "epoch": 2093} {"train_loss": -11.852404594421387, "global_step": 351663, "epoch": 2093} {"train_loss": -12.228889465332031, "global_step": 351664, "epoch": 2093} {"train_loss": -11.951608657836914, "global_step": 351665, "epoch": 2093} {"train_loss": -12.121391296386719, "global_step": 351666, "epoch": 2093} {"train_loss": -12.385597229003906, "global_step": 351667, "epoch": 2093} {"train_loss": -11.943641662597656, "global_step": 351668, "epoch": 2093} {"train_loss": -12.313077926635742, "global_step": 351669, "epoch": 2093} {"train_loss": -12.300370216369629, "global_step": 351670, "epoch": 2093} {"train_loss": -11.973581314086914, "global_step": 351671, "epoch": 2093} {"train_loss": -12.330310821533203, "global_step": 351672, "epoch": 2093} {"train_loss": -12.271053314208984, "global_step": 351673, "epoch": 2093} {"train_loss": -12.427837371826172, "global_step": 351674, "epoch": 2093} {"train_loss": -12.295180320739746, "global_step": 351675, "epoch": 2093} {"train_loss": -12.542470932006836, "global_step": 351676, "epoch": 2093} {"train_loss": -12.27138900756836, "global_step": 351677, "epoch": 2093} {"train_loss": -12.53805160522461, "global_step": 351678, "epoch": 2093} {"train_loss": -12.34880256652832, "global_step": 351679, "epoch": 2093} {"train_loss": -12.218517303466797, "global_step": 351680, "epoch": 2093} {"train_loss": -12.457117080688477, "global_step": 351681, "epoch": 2093} {"train_loss": -12.482885360717773, "global_step": 351682, "epoch": 2093} {"train_loss": -12.348371505737305, "global_step": 351683, "epoch": 2093} {"train_loss": -12.197000503540039, "global_step": 351684, "epoch": 2093} {"train_loss": -12.383979797363281, "global_step": 351685, "epoch": 2093} {"train_loss": -12.410235404968262, "global_step": 351686, "epoch": 2093} {"train_loss": -12.013065338134766, "global_step": 351687, "epoch": 2093} {"train_loss": -12.453629493713379, "global_step": 351688, "epoch": 2093} {"train_loss": -11.765631675720215, "global_step": 351689, "epoch": 2093} {"train_loss": -11.698816299438477, "global_step": 351690, "epoch": 2093} {"train_loss": -12.433384895324707, "global_step": 351691, "epoch": 2093} {"train_loss": -11.761286735534668, "global_step": 351692, "epoch": 2093} {"train_loss": -11.759296417236328, "global_step": 351693, "epoch": 2093} {"train_loss": -12.30435562133789, "global_step": 351694, "epoch": 2093} {"train_loss": -11.970151901245117, "global_step": 351695, "epoch": 2093} {"train_loss": -12.105648040771484, "global_step": 351696, "epoch": 2093} {"train_loss": -12.13198471069336, "global_step": 351697, "epoch": 2093} {"train_loss": -12.645082473754883, "global_step": 351698, "epoch": 2093} {"train_loss": -12.24923324584961, "global_step": 351699, "epoch": 2093} {"train_loss": -12.397668838500977, "global_step": 351700, "epoch": 2093} {"train_loss": -12.391828536987305, "global_step": 351701, "epoch": 2093} {"train_loss": -12.545280456542969, "global_step": 351702, "epoch": 2093} {"train_loss": -12.391972541809082, "global_step": 351703, "epoch": 2093} {"train_loss": -12.475786209106445, "global_step": 351704, "epoch": 2093} {"train_loss": -12.35588264465332, "global_step": 351705, "epoch": 2093} {"train_loss": -12.370655059814453, "global_step": 351706, "epoch": 2093} {"train_loss": -12.347953796386719, "global_step": 351707, "epoch": 2093} {"train_loss": -12.542774200439453, "global_step": 351708, "epoch": 2093} {"train_loss": -12.390141487121582, "global_step": 351709, "epoch": 2093} {"train_loss": -12.147366523742676, "global_step": 351710, "epoch": 2093} {"train_loss": -12.561957359313965, "global_step": 351711, "epoch": 2093} {"train_loss": -12.345104217529297, "global_step": 351712, "epoch": 2093} {"train_loss": -12.593786239624023, "global_step": 351713, "epoch": 2093} {"train_loss": -12.621228218078613, "global_step": 351714, "epoch": 2093} {"train_loss": -12.442177772521973, "global_step": 351715, "epoch": 2093} {"train_loss": -12.108560562133789, "global_step": 351716, "epoch": 2093} {"train_loss": -12.420280456542969, "global_step": 351717, "epoch": 2093} {"train_loss": -12.517824172973633, "global_step": 351718, "epoch": 2093} {"train_loss": -12.525303840637207, "global_step": 351719, "epoch": 2093} {"train_loss": -12.480281829833984, "global_step": 351720, "epoch": 2093} {"train_loss": -12.41401481628418, "global_step": 351721, "epoch": 2093} {"train_loss": -12.425308227539062, "global_step": 351722, "epoch": 2093} {"train_loss": -12.383785247802734, "global_step": 351723, "epoch": 2093} {"train_loss": -12.441018104553223, "global_step": 351724, "epoch": 2093} {"train_loss": -12.584271430969238, "global_step": 351725, "epoch": 2093} {"train_loss": -12.80061149597168, "global_step": 351726, "epoch": 2093} {"train_loss": -12.591867446899414, "global_step": 351727, "epoch": 2093} {"train_loss": -12.600147247314453, "global_step": 351728, "epoch": 2093} {"train_loss": -12.55927562713623, "global_step": 351729, "epoch": 2093} {"train_loss": -12.667301177978516, "global_step": 351730, "epoch": 2093} {"train_loss": -12.524340629577637, "global_step": 351731, "epoch": 2093} {"train_loss": -12.362726211547852, "global_step": 351732, "epoch": 2093} {"train_loss": -12.251202583312988, "global_step": 351733, "epoch": 2093} {"train_loss": -12.508874893188477, "global_step": 351734, "epoch": 2093} {"train_loss": -12.618831634521484, "global_step": 351735, "epoch": 2093} {"train_loss": -11.827417373657227, "global_step": 351736, "epoch": 2093} {"train_loss": -10.93665885925293, "global_step": 351737, "epoch": 2093} {"train_loss": -12.122722625732422, "global_step": 351738, "epoch": 2093} {"train_loss": -12.119232177734375, "global_step": 351739, "epoch": 2093} {"train_loss": -11.307783126831055, "global_step": 351740, "epoch": 2093} {"train_loss": -10.6848726272583, "global_step": 351741, "epoch": 2093} {"train_loss": -11.641584396362305, "global_step": 351742, "epoch": 2093} {"train_loss": -10.136774063110352, "global_step": 351743, "epoch": 2093} {"train_loss": -8.68954086303711, "global_step": 351744, "epoch": 2093} {"train_loss": -8.046777725219727, "global_step": 351745, "epoch": 2093} {"train_loss": -9.034582138061523, "global_step": 351746, "epoch": 2093} {"train_loss": -9.298155784606934, "global_step": 351747, "epoch": 2093} {"train_loss": -9.914772033691406, "global_step": 351748, "epoch": 2093} {"train_loss": -10.256122589111328, "global_step": 351749, "epoch": 2093} {"train_loss": -9.215978622436523, "global_step": 351750, "epoch": 2093} {"train_loss": -8.149026870727539, "global_step": 351751, "epoch": 2093} {"train_loss": -6.652237415313721, "global_step": 351752, "epoch": 2093} {"train_loss": -8.55218505859375, "global_step": 351753, "epoch": 2093} {"train_loss": -7.579603672027588, "global_step": 351754, "epoch": 2093} {"train_loss": -9.053427696228027, "global_step": 351755, "epoch": 2093} {"train_loss": -9.471419334411621, "global_step": 351756, "epoch": 2093} {"train_loss": -9.68112850189209, "global_step": 351757, "epoch": 2093} {"train_loss": -8.889866828918457, "global_step": 351758, "epoch": 2093} {"train_loss": -9.707725524902344, "global_step": 351759, "epoch": 2093} {"train_loss": -10.483329772949219, "global_step": 351760, "epoch": 2093} {"train_loss": -9.051074981689453, "global_step": 351761, "epoch": 2093} {"train_loss": -10.092498779296875, "global_step": 351762, "epoch": 2093} {"train_loss": -10.07221508026123, "global_step": 351763, "epoch": 2093} {"train_loss": -10.302935600280762, "global_step": 351764, "epoch": 2093} {"train_loss": -9.587446212768555, "global_step": 351765, "epoch": 2093} {"train_loss": -9.506667137145996, "global_step": 351766, "epoch": 2093} {"train_loss": -10.877321243286133, "global_step": 351767, "epoch": 2093} {"train_loss": -9.92367935180664, "global_step": 351768, "epoch": 2093} {"train_loss": -9.416653633117676, "global_step": 351769, "epoch": 2093} {"train_loss": -11.011548042297363, "global_step": 351770, "epoch": 2093} {"train_loss": -10.36201286315918, "global_step": 351771, "epoch": 2093} {"train_loss": -10.476274490356445, "global_step": 351772, "epoch": 2093} {"train_loss": -11.110705375671387, "global_step": 351773, "epoch": 2093} {"train_loss": -11.346687316894531, "global_step": 351774, "epoch": 2093} {"train_loss": -10.413021087646484, "global_step": 351775, "epoch": 2093} {"train_loss": -11.019927978515625, "global_step": 351776, "epoch": 2093} {"train_loss": -11.358833312988281, "global_step": 351777, "epoch": 2093} {"train_loss": -10.744222640991211, "global_step": 351778, "epoch": 2093} {"train_loss": -11.026248931884766, "global_step": 351779, "epoch": 2093} {"train_loss": -11.239428520202637, "global_step": 351780, "epoch": 2093} {"train_loss": -11.282313346862793, "global_step": 351781, "epoch": 2093} {"train_loss": -11.182692527770996, "global_step": 351782, "epoch": 2093} {"train_loss": -11.679936408996582, "global_step": 351783, "epoch": 2093} {"train_loss": -10.859947204589844, "global_step": 351784, "epoch": 2093} {"train_loss": -11.183844566345215, "global_step": 351785, "epoch": 2093} {"train_loss": -11.848958969116211, "global_step": 351786, "epoch": 2093} {"train_loss": -11.561668395996094, "global_step": 351787, "epoch": 2093} {"train_loss": -11.411422729492188, "global_step": 351788, "epoch": 2093} {"train_loss": -12.208663940429688, "global_step": 351789, "epoch": 2093} {"train_loss": -11.415639877319336, "global_step": 351790, "epoch": 2093} {"train_loss": -11.481213541257949, "global_step": 351791, "epoch": 2093, "val_loss": 286262.34375} {"train_loss": -11.646108627319336, "global_step": 351792, "epoch": 2094} {"train_loss": -11.326714515686035, "global_step": 351793, "epoch": 2094} {"train_loss": -11.682618141174316, "global_step": 351794, "epoch": 2094} {"train_loss": -11.905338287353516, "global_step": 351795, "epoch": 2094} {"train_loss": -11.971803665161133, "global_step": 351796, "epoch": 2094} {"train_loss": -11.444231033325195, "global_step": 351797, "epoch": 2094} {"train_loss": -11.861577987670898, "global_step": 351798, "epoch": 2094} {"train_loss": -11.700692176818848, "global_step": 351799, "epoch": 2094} {"train_loss": -12.14961051940918, "global_step": 351800, "epoch": 2094} {"train_loss": -11.940402030944824, "global_step": 351801, "epoch": 2094} {"train_loss": -12.236698150634766, "global_step": 351802, "epoch": 2094} {"train_loss": -12.216743469238281, "global_step": 351803, "epoch": 2094} {"train_loss": -12.094077110290527, "global_step": 351804, "epoch": 2094} {"train_loss": -12.105567932128906, "global_step": 351805, "epoch": 2094} {"train_loss": -12.11328125, "global_step": 351806, "epoch": 2094} {"train_loss": -12.272424697875977, "global_step": 351807, "epoch": 2094} {"train_loss": -12.207225799560547, "global_step": 351808, "epoch": 2094} {"train_loss": -12.0178861618042, "global_step": 351809, "epoch": 2094} {"train_loss": -12.224042892456055, "global_step": 351810, "epoch": 2094} {"train_loss": -12.350173950195312, "global_step": 351811, "epoch": 2094} {"train_loss": -12.156411170959473, "global_step": 351812, "epoch": 2094} {"train_loss": -12.343786239624023, "global_step": 351813, "epoch": 2094} {"train_loss": -12.401280403137207, "global_step": 351814, "epoch": 2094} {"train_loss": -12.236196517944336, "global_step": 351815, "epoch": 2094} {"train_loss": -12.142356872558594, "global_step": 351816, "epoch": 2094} {"train_loss": -12.256053924560547, "global_step": 351817, "epoch": 2094} {"train_loss": -12.306440353393555, "global_step": 351818, "epoch": 2094} {"train_loss": -12.410181045532227, "global_step": 351819, "epoch": 2094} {"train_loss": -12.272912979125977, "global_step": 351820, "epoch": 2094} {"train_loss": -12.321090698242188, "global_step": 351821, "epoch": 2094} {"train_loss": -12.463582992553711, "global_step": 351822, "epoch": 2094} {"train_loss": -12.37186336517334, "global_step": 351823, "epoch": 2094} {"train_loss": -12.408761978149414, "global_step": 351824, "epoch": 2094} {"train_loss": -12.4385986328125, "global_step": 351825, "epoch": 2094} {"train_loss": -12.273658752441406, "global_step": 351826, "epoch": 2094} {"train_loss": -12.404919624328613, "global_step": 351827, "epoch": 2094} {"train_loss": -12.522640228271484, "global_step": 351828, "epoch": 2094} {"train_loss": -12.39145278930664, "global_step": 351829, "epoch": 2094} {"train_loss": -12.559181213378906, "global_step": 351830, "epoch": 2094} {"train_loss": -12.510404586791992, "global_step": 351831, "epoch": 2094} {"train_loss": -12.30672836303711, "global_step": 351832, "epoch": 2094} {"train_loss": -12.31972885131836, "global_step": 351833, "epoch": 2094} {"train_loss": -12.353740692138672, "global_step": 351834, "epoch": 2094} {"train_loss": -12.404245376586914, "global_step": 351835, "epoch": 2094} {"train_loss": -12.251096725463867, "global_step": 351836, "epoch": 2094} {"train_loss": -12.715263366699219, "global_step": 351837, "epoch": 2094} {"train_loss": -12.345451354980469, "global_step": 351838, "epoch": 2094} {"train_loss": -12.494430541992188, "global_step": 351839, "epoch": 2094} {"train_loss": -12.138406753540039, "global_step": 351840, "epoch": 2094} {"train_loss": -12.617498397827148, "global_step": 351841, "epoch": 2094} {"train_loss": -12.488113403320312, "global_step": 351842, "epoch": 2094} {"train_loss": -12.401182174682617, "global_step": 351843, "epoch": 2094} {"train_loss": -12.48685073852539, "global_step": 351844, "epoch": 2094} {"train_loss": -12.653818130493164, "global_step": 351845, "epoch": 2094} {"train_loss": -12.551118850708008, "global_step": 351846, "epoch": 2094} {"train_loss": -12.46060562133789, "global_step": 351847, "epoch": 2094} {"train_loss": -12.381872177124023, "global_step": 351848, "epoch": 2094} {"train_loss": -12.651060104370117, "global_step": 351849, "epoch": 2094} {"train_loss": -12.22557258605957, "global_step": 351850, "epoch": 2094} {"train_loss": -12.380261421203613, "global_step": 351851, "epoch": 2094} {"train_loss": -12.112783432006836, "global_step": 351852, "epoch": 2094} {"train_loss": -12.466888427734375, "global_step": 351853, "epoch": 2094} {"train_loss": -12.495063781738281, "global_step": 351854, "epoch": 2094} {"train_loss": -12.188070297241211, "global_step": 351855, "epoch": 2094} {"train_loss": -12.392112731933594, "global_step": 351856, "epoch": 2094} {"train_loss": -12.376714706420898, "global_step": 351857, "epoch": 2094} {"train_loss": -12.536885261535645, "global_step": 351858, "epoch": 2094} {"train_loss": -12.47104263305664, "global_step": 351859, "epoch": 2094} {"train_loss": -12.250415802001953, "global_step": 351860, "epoch": 2094} {"train_loss": -12.523155212402344, "global_step": 351861, "epoch": 2094} {"train_loss": -12.194007873535156, "global_step": 351862, "epoch": 2094} {"train_loss": -12.628337860107422, "global_step": 351863, "epoch": 2094} {"train_loss": -12.599100112915039, "global_step": 351864, "epoch": 2094} {"train_loss": -12.357231140136719, "global_step": 351865, "epoch": 2094} {"train_loss": -11.787738800048828, "global_step": 351866, "epoch": 2094} {"train_loss": -11.901809692382812, "global_step": 351867, "epoch": 2094} {"train_loss": -10.947001457214355, "global_step": 351868, "epoch": 2094} {"train_loss": -11.450960159301758, "global_step": 351869, "epoch": 2094} {"train_loss": -12.49140739440918, "global_step": 351870, "epoch": 2094} {"train_loss": -11.429340362548828, "global_step": 351871, "epoch": 2094} {"train_loss": -11.604482650756836, "global_step": 351872, "epoch": 2094} {"train_loss": -11.121123313903809, "global_step": 351873, "epoch": 2094} {"train_loss": -12.018304824829102, "global_step": 351874, "epoch": 2094} {"train_loss": -12.395505905151367, "global_step": 351875, "epoch": 2094} {"train_loss": -11.928423881530762, "global_step": 351876, "epoch": 2094} {"train_loss": -12.249632835388184, "global_step": 351877, "epoch": 2094} {"train_loss": -12.437195777893066, "global_step": 351878, "epoch": 2094} {"train_loss": -11.819732666015625, "global_step": 351879, "epoch": 2094} {"train_loss": -11.765447616577148, "global_step": 351880, "epoch": 2094} {"train_loss": -11.52977180480957, "global_step": 351881, "epoch": 2094} {"train_loss": -12.214168548583984, "global_step": 351882, "epoch": 2094} {"train_loss": -11.970616340637207, "global_step": 351883, "epoch": 2094} {"train_loss": -12.403352737426758, "global_step": 351884, "epoch": 2094} {"train_loss": -11.770914077758789, "global_step": 351885, "epoch": 2094} {"train_loss": -12.025613784790039, "global_step": 351886, "epoch": 2094} {"train_loss": -12.275053977966309, "global_step": 351887, "epoch": 2094} {"train_loss": -11.908452987670898, "global_step": 351888, "epoch": 2094} {"train_loss": -10.494438171386719, "global_step": 351889, "epoch": 2094} {"train_loss": -11.591475486755371, "global_step": 351890, "epoch": 2094} {"train_loss": -12.037254333496094, "global_step": 351891, "epoch": 2094} {"train_loss": -11.520668029785156, "global_step": 351892, "epoch": 2094} {"train_loss": -11.515127182006836, "global_step": 351893, "epoch": 2094} {"train_loss": -12.161767959594727, "global_step": 351894, "epoch": 2094} {"train_loss": -10.693598747253418, "global_step": 351895, "epoch": 2094} {"train_loss": -11.722606658935547, "global_step": 351896, "epoch": 2094} {"train_loss": -11.51095962524414, "global_step": 351897, "epoch": 2094} {"train_loss": -9.70758056640625, "global_step": 351898, "epoch": 2094} {"train_loss": -11.527809143066406, "global_step": 351899, "epoch": 2094} {"train_loss": -11.078474044799805, "global_step": 351900, "epoch": 2094} {"train_loss": -11.593634605407715, "global_step": 351901, "epoch": 2094} {"train_loss": -11.052879333496094, "global_step": 351902, "epoch": 2094} {"train_loss": -10.837594032287598, "global_step": 351903, "epoch": 2094} {"train_loss": -11.521889686584473, "global_step": 351904, "epoch": 2094} {"train_loss": -10.344680786132812, "global_step": 351905, "epoch": 2094} {"train_loss": -11.235976219177246, "global_step": 351906, "epoch": 2094} {"train_loss": -11.428275108337402, "global_step": 351907, "epoch": 2094} {"train_loss": -9.579776763916016, "global_step": 351908, "epoch": 2094} {"train_loss": -11.631707191467285, "global_step": 351909, "epoch": 2094} {"train_loss": -10.558938980102539, "global_step": 351910, "epoch": 2094} {"train_loss": -11.833998680114746, "global_step": 351911, "epoch": 2094} {"train_loss": -11.336978912353516, "global_step": 351912, "epoch": 2094} {"train_loss": -11.57593059539795, "global_step": 351913, "epoch": 2094} {"train_loss": -11.279939651489258, "global_step": 351914, "epoch": 2094} {"train_loss": -12.152777671813965, "global_step": 351915, "epoch": 2094} {"train_loss": -10.979019165039062, "global_step": 351916, "epoch": 2094} {"train_loss": -12.132827758789062, "global_step": 351917, "epoch": 2094} {"train_loss": -11.216873168945312, "global_step": 351918, "epoch": 2094} {"train_loss": -12.037882804870605, "global_step": 351919, "epoch": 2094} {"train_loss": -11.58816909790039, "global_step": 351920, "epoch": 2094} {"train_loss": -11.761923789978027, "global_step": 351921, "epoch": 2094} {"train_loss": -11.547601699829102, "global_step": 351922, "epoch": 2094} {"train_loss": -11.97885799407959, "global_step": 351923, "epoch": 2094} {"train_loss": -11.827899932861328, "global_step": 351924, "epoch": 2094} {"train_loss": -12.244141578674316, "global_step": 351925, "epoch": 2094} {"train_loss": -11.597043991088867, "global_step": 351926, "epoch": 2094} {"train_loss": -12.142937660217285, "global_step": 351927, "epoch": 2094} {"train_loss": -12.0177001953125, "global_step": 351928, "epoch": 2094} {"train_loss": -12.02287483215332, "global_step": 351929, "epoch": 2094} {"train_loss": -12.045425415039062, "global_step": 351930, "epoch": 2094} {"train_loss": -12.030618667602539, "global_step": 351931, "epoch": 2094} {"train_loss": -11.711331367492676, "global_step": 351932, "epoch": 2094} {"train_loss": -12.098240852355957, "global_step": 351933, "epoch": 2094} {"train_loss": -11.900891304016113, "global_step": 351934, "epoch": 2094} {"train_loss": -12.177846908569336, "global_step": 351935, "epoch": 2094} {"train_loss": -11.827659606933594, "global_step": 351936, "epoch": 2094} {"train_loss": -12.092180252075195, "global_step": 351937, "epoch": 2094} {"train_loss": -11.622504234313965, "global_step": 351938, "epoch": 2094} {"train_loss": -12.060263633728027, "global_step": 351939, "epoch": 2094} {"train_loss": -11.693458557128906, "global_step": 351940, "epoch": 2094} {"train_loss": -11.762365341186523, "global_step": 351941, "epoch": 2094} {"train_loss": -12.116409301757812, "global_step": 351942, "epoch": 2094} {"train_loss": -11.314334869384766, "global_step": 351943, "epoch": 2094} {"train_loss": -11.955829620361328, "global_step": 351944, "epoch": 2094} {"train_loss": -11.495694160461426, "global_step": 351945, "epoch": 2094} {"train_loss": -12.0552978515625, "global_step": 351946, "epoch": 2094} {"train_loss": -11.821430206298828, "global_step": 351947, "epoch": 2094} {"train_loss": -11.87926959991455, "global_step": 351948, "epoch": 2094} {"train_loss": -11.765661239624023, "global_step": 351949, "epoch": 2094} {"train_loss": -12.149100303649902, "global_step": 351950, "epoch": 2094} {"train_loss": -11.921133041381836, "global_step": 351951, "epoch": 2094} {"train_loss": -11.858380317687988, "global_step": 351952, "epoch": 2094} {"train_loss": -11.906681060791016, "global_step": 351953, "epoch": 2094} {"train_loss": -11.853920936584473, "global_step": 351954, "epoch": 2094} {"train_loss": -11.662389755249023, "global_step": 351955, "epoch": 2094} {"train_loss": -12.019269943237305, "global_step": 351956, "epoch": 2094} {"train_loss": -12.319486618041992, "global_step": 351957, "epoch": 2094} {"train_loss": -12.134645462036133, "global_step": 351958, "epoch": 2094} {"train_loss": -11.955103556315104, "global_step": 351959, "epoch": 2094, "val_loss": 290016.875} {"train_loss": -12.245037078857422, "global_step": 351960, "epoch": 2095} {"train_loss": -12.318648338317871, "global_step": 351961, "epoch": 2095} {"train_loss": -12.359233856201172, "global_step": 351962, "epoch": 2095} {"train_loss": -12.421293258666992, "global_step": 351963, "epoch": 2095} {"train_loss": -12.191865921020508, "global_step": 351964, "epoch": 2095} {"train_loss": -12.480192184448242, "global_step": 351965, "epoch": 2095} {"train_loss": -12.26345443725586, "global_step": 351966, "epoch": 2095} {"train_loss": -12.454367637634277, "global_step": 351967, "epoch": 2095} {"train_loss": -12.343339920043945, "global_step": 351968, "epoch": 2095} {"train_loss": -12.322809219360352, "global_step": 351969, "epoch": 2095} {"train_loss": -12.428759574890137, "global_step": 351970, "epoch": 2095} {"train_loss": -12.465450286865234, "global_step": 351971, "epoch": 2095} {"train_loss": -12.336060523986816, "global_step": 351972, "epoch": 2095} {"train_loss": -12.347758293151855, "global_step": 351973, "epoch": 2095} {"train_loss": -12.453155517578125, "global_step": 351974, "epoch": 2095} {"train_loss": -12.471692085266113, "global_step": 351975, "epoch": 2095} {"train_loss": -12.403549194335938, "global_step": 351976, "epoch": 2095} {"train_loss": -12.622282028198242, "global_step": 351977, "epoch": 2095} {"train_loss": -12.492706298828125, "global_step": 351978, "epoch": 2095} {"train_loss": -12.501272201538086, "global_step": 351979, "epoch": 2095} {"train_loss": -12.607402801513672, "global_step": 351980, "epoch": 2095} {"train_loss": -12.555065155029297, "global_step": 351981, "epoch": 2095} {"train_loss": -12.54498291015625, "global_step": 351982, "epoch": 2095} {"train_loss": -12.464414596557617, "global_step": 351983, "epoch": 2095} {"train_loss": -12.556901931762695, "global_step": 351984, "epoch": 2095} {"train_loss": -12.516128540039062, "global_step": 351985, "epoch": 2095} {"train_loss": -12.641858100891113, "global_step": 351986, "epoch": 2095} {"train_loss": -12.606701850891113, "global_step": 351987, "epoch": 2095} {"train_loss": -12.387283325195312, "global_step": 351988, "epoch": 2095} {"train_loss": -12.618757247924805, "global_step": 351989, "epoch": 2095} {"train_loss": -12.604718208312988, "global_step": 351990, "epoch": 2095} {"train_loss": -12.566560745239258, "global_step": 351991, "epoch": 2095} {"train_loss": -12.519546508789062, "global_step": 351992, "epoch": 2095} {"train_loss": -12.508855819702148, "global_step": 351993, "epoch": 2095} {"train_loss": -12.512045860290527, "global_step": 351994, "epoch": 2095} {"train_loss": -12.741113662719727, "global_step": 351995, "epoch": 2095} {"train_loss": -12.76987075805664, "global_step": 351996, "epoch": 2095} {"train_loss": -12.52342414855957, "global_step": 351997, "epoch": 2095} {"train_loss": -12.508060455322266, "global_step": 351998, "epoch": 2095} {"train_loss": -12.60279655456543, "global_step": 351999, "epoch": 2095} {"train_loss": -12.601156234741211, "global_step": 352000, "epoch": 2095} {"train_loss": -12.49384593963623, "global_step": 352001, "epoch": 2095} {"train_loss": -12.338714599609375, "global_step": 352002, "epoch": 2095} {"train_loss": -12.602338790893555, "global_step": 352003, "epoch": 2095} {"train_loss": -12.305639266967773, "global_step": 352004, "epoch": 2095} {"train_loss": -12.000465393066406, "global_step": 352005, "epoch": 2095} {"train_loss": -12.288213729858398, "global_step": 352006, "epoch": 2095} {"train_loss": -12.592352867126465, "global_step": 352007, "epoch": 2095} {"train_loss": -11.459329605102539, "global_step": 352008, "epoch": 2095} {"train_loss": -10.995906829833984, "global_step": 352009, "epoch": 2095} {"train_loss": -11.958656311035156, "global_step": 352010, "epoch": 2095} {"train_loss": -12.44235610961914, "global_step": 352011, "epoch": 2095} {"train_loss": -12.113468170166016, "global_step": 352012, "epoch": 2095} {"train_loss": -12.125946044921875, "global_step": 352013, "epoch": 2095} {"train_loss": -12.296284675598145, "global_step": 352014, "epoch": 2095} {"train_loss": -12.38226318359375, "global_step": 352015, "epoch": 2095} {"train_loss": -12.019031524658203, "global_step": 352016, "epoch": 2095} {"train_loss": -12.335387229919434, "global_step": 352017, "epoch": 2095} {"train_loss": -12.672013282775879, "global_step": 352018, "epoch": 2095} {"train_loss": -11.774353981018066, "global_step": 352019, "epoch": 2095} {"train_loss": -11.24330997467041, "global_step": 352020, "epoch": 2095} {"train_loss": -12.060043334960938, "global_step": 352021, "epoch": 2095} {"train_loss": -11.694869041442871, "global_step": 352022, "epoch": 2095} {"train_loss": -12.003340721130371, "global_step": 352023, "epoch": 2095} {"train_loss": -11.784882545471191, "global_step": 352024, "epoch": 2095} {"train_loss": -11.526077270507812, "global_step": 352025, "epoch": 2095} {"train_loss": -12.225265502929688, "global_step": 352026, "epoch": 2095} {"train_loss": -12.155447006225586, "global_step": 352027, "epoch": 2095} {"train_loss": -11.961467742919922, "global_step": 352028, "epoch": 2095} {"train_loss": -12.067569732666016, "global_step": 352029, "epoch": 2095} {"train_loss": -12.339116096496582, "global_step": 352030, "epoch": 2095} {"train_loss": -12.324285507202148, "global_step": 352031, "epoch": 2095} {"train_loss": -12.336851119995117, "global_step": 352032, "epoch": 2095} {"train_loss": -11.99929141998291, "global_step": 352033, "epoch": 2095} {"train_loss": -11.666055679321289, "global_step": 352034, "epoch": 2095} {"train_loss": -12.351192474365234, "global_step": 352035, "epoch": 2095} {"train_loss": -11.242445945739746, "global_step": 352036, "epoch": 2095} {"train_loss": -9.98503303527832, "global_step": 352037, "epoch": 2095} {"train_loss": -11.89811897277832, "global_step": 352038, "epoch": 2095} {"train_loss": -11.15971565246582, "global_step": 352039, "epoch": 2095} {"train_loss": -11.31268310546875, "global_step": 352040, "epoch": 2095} {"train_loss": -10.999920845031738, "global_step": 352041, "epoch": 2095} {"train_loss": -11.335001945495605, "global_step": 352042, "epoch": 2095} {"train_loss": -10.450887680053711, "global_step": 352043, "epoch": 2095} {"train_loss": -11.080059051513672, "global_step": 352044, "epoch": 2095} {"train_loss": -10.527575492858887, "global_step": 352045, "epoch": 2095} {"train_loss": -11.353227615356445, "global_step": 352046, "epoch": 2095} {"train_loss": -10.424535751342773, "global_step": 352047, "epoch": 2095} {"train_loss": -9.383007049560547, "global_step": 352048, "epoch": 2095} {"train_loss": -10.830324172973633, "global_step": 352049, "epoch": 2095} {"train_loss": -7.800878524780273, "global_step": 352050, "epoch": 2095} {"train_loss": -7.38437032699585, "global_step": 352051, "epoch": 2095} {"train_loss": -7.148688316345215, "global_step": 352052, "epoch": 2095} {"train_loss": -6.4865217208862305, "global_step": 352053, "epoch": 2095} {"train_loss": -6.957749366760254, "global_step": 352054, "epoch": 2095} {"train_loss": -7.140719413757324, "global_step": 352055, "epoch": 2095} {"train_loss": -7.35676383972168, "global_step": 352056, "epoch": 2095} {"train_loss": -7.736035346984863, "global_step": 352057, "epoch": 2095} {"train_loss": -7.312559127807617, "global_step": 352058, "epoch": 2095} {"train_loss": -7.75393533706665, "global_step": 352059, "epoch": 2095} {"train_loss": -7.9102373123168945, "global_step": 352060, "epoch": 2095} {"train_loss": -8.285995483398438, "global_step": 352061, "epoch": 2095} {"train_loss": -8.406177520751953, "global_step": 352062, "epoch": 2095} {"train_loss": -8.492256164550781, "global_step": 352063, "epoch": 2095} {"train_loss": -8.01915454864502, "global_step": 352064, "epoch": 2095} {"train_loss": -8.127117156982422, "global_step": 352065, "epoch": 2095} {"train_loss": -8.389740943908691, "global_step": 352066, "epoch": 2095} {"train_loss": -9.390246391296387, "global_step": 352067, "epoch": 2095} {"train_loss": -8.781739234924316, "global_step": 352068, "epoch": 2095} {"train_loss": -8.796588897705078, "global_step": 352069, "epoch": 2095} {"train_loss": -9.156394958496094, "global_step": 352070, "epoch": 2095} {"train_loss": -9.851875305175781, "global_step": 352071, "epoch": 2095} {"train_loss": -9.508224487304688, "global_step": 352072, "epoch": 2095} {"train_loss": -9.843860626220703, "global_step": 352073, "epoch": 2095} {"train_loss": -10.032564163208008, "global_step": 352074, "epoch": 2095} {"train_loss": -10.510143280029297, "global_step": 352075, "epoch": 2095} {"train_loss": -10.40130615234375, "global_step": 352076, "epoch": 2095} {"train_loss": -10.03211498260498, "global_step": 352077, "epoch": 2095} {"train_loss": -10.582406044006348, "global_step": 352078, "epoch": 2095} {"train_loss": -10.924076080322266, "global_step": 352079, "epoch": 2095} {"train_loss": -10.519052505493164, "global_step": 352080, "epoch": 2095} {"train_loss": -11.27564525604248, "global_step": 352081, "epoch": 2095} {"train_loss": -10.92695426940918, "global_step": 352082, "epoch": 2095} {"train_loss": -11.202713012695312, "global_step": 352083, "epoch": 2095} {"train_loss": -11.092872619628906, "global_step": 352084, "epoch": 2095} {"train_loss": -11.447400093078613, "global_step": 352085, "epoch": 2095} {"train_loss": -11.457109451293945, "global_step": 352086, "epoch": 2095} {"train_loss": -11.604301452636719, "global_step": 352087, "epoch": 2095} {"train_loss": -11.911925315856934, "global_step": 352088, "epoch": 2095} {"train_loss": -11.318222999572754, "global_step": 352089, "epoch": 2095} {"train_loss": -11.631057739257812, "global_step": 352090, "epoch": 2095} {"train_loss": -11.128938674926758, "global_step": 352091, "epoch": 2095} {"train_loss": -11.662078857421875, "global_step": 352092, "epoch": 2095} {"train_loss": -10.867694854736328, "global_step": 352093, "epoch": 2095} {"train_loss": -11.564690589904785, "global_step": 352094, "epoch": 2095} {"train_loss": -11.042550086975098, "global_step": 352095, "epoch": 2095} {"train_loss": -11.617904663085938, "global_step": 352096, "epoch": 2095} {"train_loss": -11.635330200195312, "global_step": 352097, "epoch": 2095} {"train_loss": -11.434859275817871, "global_step": 352098, "epoch": 2095} {"train_loss": -11.61544418334961, "global_step": 352099, "epoch": 2095} {"train_loss": -11.692832946777344, "global_step": 352100, "epoch": 2095} {"train_loss": -11.705638885498047, "global_step": 352101, "epoch": 2095} {"train_loss": -11.469747543334961, "global_step": 352102, "epoch": 2095} {"train_loss": -11.708597183227539, "global_step": 352103, "epoch": 2095} {"train_loss": -11.594930648803711, "global_step": 352104, "epoch": 2095} {"train_loss": -11.93225383758545, "global_step": 352105, "epoch": 2095} {"train_loss": -11.785581588745117, "global_step": 352106, "epoch": 2095} {"train_loss": -11.849992752075195, "global_step": 352107, "epoch": 2095} {"train_loss": -11.468584060668945, "global_step": 352108, "epoch": 2095} {"train_loss": -12.244683265686035, "global_step": 352109, "epoch": 2095} {"train_loss": -11.892152786254883, "global_step": 352110, "epoch": 2095} {"train_loss": -12.016172409057617, "global_step": 352111, "epoch": 2095} {"train_loss": -11.811840057373047, "global_step": 352112, "epoch": 2095} {"train_loss": -11.799728393554688, "global_step": 352113, "epoch": 2095} {"train_loss": -12.109275817871094, "global_step": 352114, "epoch": 2095} {"train_loss": -12.001262664794922, "global_step": 352115, "epoch": 2095} {"train_loss": -11.568760871887207, "global_step": 352116, "epoch": 2095} {"train_loss": -11.873556137084961, "global_step": 352117, "epoch": 2095} {"train_loss": -11.957629203796387, "global_step": 352118, "epoch": 2095} {"train_loss": -12.015459060668945, "global_step": 352119, "epoch": 2095} {"train_loss": -12.115985870361328, "global_step": 352120, "epoch": 2095} {"train_loss": -12.033056259155273, "global_step": 352121, "epoch": 2095} {"train_loss": -11.63157844543457, "global_step": 352122, "epoch": 2095} {"train_loss": -12.121000289916992, "global_step": 352123, "epoch": 2095} {"train_loss": -11.600268363952637, "global_step": 352124, "epoch": 2095} {"train_loss": -11.953304290771484, "global_step": 352125, "epoch": 2095} {"train_loss": -12.010265350341797, "global_step": 352126, "epoch": 2095} {"train_loss": -11.33553447609856, "global_step": 352127, "epoch": 2095, "val_loss": 290460.96875, "train_action_mse_error": 0.40728384256362915} {"train_loss": -11.959400177001953, "global_step": 352128, "epoch": 2096} {"train_loss": -11.974672317504883, "global_step": 352129, "epoch": 2096} {"train_loss": -12.088052749633789, "global_step": 352130, "epoch": 2096} {"train_loss": -11.889935493469238, "global_step": 352131, "epoch": 2096} {"train_loss": -12.298629760742188, "global_step": 352132, "epoch": 2096} {"train_loss": -12.102816581726074, "global_step": 352133, "epoch": 2096} {"train_loss": -12.234356880187988, "global_step": 352134, "epoch": 2096} {"train_loss": -12.073049545288086, "global_step": 352135, "epoch": 2096} {"train_loss": -12.182965278625488, "global_step": 352136, "epoch": 2096} {"train_loss": -12.221325874328613, "global_step": 352137, "epoch": 2096} {"train_loss": -12.484203338623047, "global_step": 352138, "epoch": 2096} {"train_loss": -12.280579566955566, "global_step": 352139, "epoch": 2096} {"train_loss": -12.28836441040039, "global_step": 352140, "epoch": 2096} {"train_loss": -12.361440658569336, "global_step": 352141, "epoch": 2096} {"train_loss": -12.220820426940918, "global_step": 352142, "epoch": 2096} {"train_loss": -12.153104782104492, "global_step": 352143, "epoch": 2096} {"train_loss": -12.072917938232422, "global_step": 352144, "epoch": 2096} {"train_loss": -12.478785514831543, "global_step": 352145, "epoch": 2096} {"train_loss": -12.465707778930664, "global_step": 352146, "epoch": 2096} {"train_loss": -12.384374618530273, "global_step": 352147, "epoch": 2096} {"train_loss": -12.401487350463867, "global_step": 352148, "epoch": 2096} {"train_loss": -12.519277572631836, "global_step": 352149, "epoch": 2096} {"train_loss": -12.455889701843262, "global_step": 352150, "epoch": 2096} {"train_loss": -12.366416931152344, "global_step": 352151, "epoch": 2096} {"train_loss": -12.456869125366211, "global_step": 352152, "epoch": 2096} {"train_loss": -12.596607208251953, "global_step": 352153, "epoch": 2096} {"train_loss": -12.40278434753418, "global_step": 352154, "epoch": 2096} {"train_loss": -12.535364151000977, "global_step": 352155, "epoch": 2096} {"train_loss": -12.389566421508789, "global_step": 352156, "epoch": 2096} {"train_loss": -12.470268249511719, "global_step": 352157, "epoch": 2096} {"train_loss": -12.498106956481934, "global_step": 352158, "epoch": 2096} {"train_loss": -12.251601219177246, "global_step": 352159, "epoch": 2096} {"train_loss": -12.68106460571289, "global_step": 352160, "epoch": 2096} {"train_loss": -12.503283500671387, "global_step": 352161, "epoch": 2096} {"train_loss": -12.45390510559082, "global_step": 352162, "epoch": 2096} {"train_loss": -12.61387825012207, "global_step": 352163, "epoch": 2096} {"train_loss": -12.449954986572266, "global_step": 352164, "epoch": 2096} {"train_loss": -12.481913566589355, "global_step": 352165, "epoch": 2096} {"train_loss": -12.599235534667969, "global_step": 352166, "epoch": 2096} {"train_loss": -12.36744499206543, "global_step": 352167, "epoch": 2096} {"train_loss": -12.285181045532227, "global_step": 352168, "epoch": 2096} {"train_loss": -12.6693115234375, "global_step": 352169, "epoch": 2096} {"train_loss": -12.346511840820312, "global_step": 352170, "epoch": 2096} {"train_loss": -12.662481307983398, "global_step": 352171, "epoch": 2096} {"train_loss": -12.534913063049316, "global_step": 352172, "epoch": 2096} {"train_loss": -12.691055297851562, "global_step": 352173, "epoch": 2096} {"train_loss": -12.538923263549805, "global_step": 352174, "epoch": 2096} {"train_loss": -12.406444549560547, "global_step": 352175, "epoch": 2096} {"train_loss": -12.535253524780273, "global_step": 352176, "epoch": 2096} {"train_loss": -12.749939918518066, "global_step": 352177, "epoch": 2096} {"train_loss": -12.523061752319336, "global_step": 352178, "epoch": 2096} {"train_loss": -12.594539642333984, "global_step": 352179, "epoch": 2096} {"train_loss": -12.728851318359375, "global_step": 352180, "epoch": 2096} {"train_loss": -12.49559211730957, "global_step": 352181, "epoch": 2096} {"train_loss": -12.412513732910156, "global_step": 352182, "epoch": 2096} {"train_loss": -12.643428802490234, "global_step": 352183, "epoch": 2096} {"train_loss": -12.603355407714844, "global_step": 352184, "epoch": 2096} {"train_loss": -12.766834259033203, "global_step": 352185, "epoch": 2096} {"train_loss": -12.815977096557617, "global_step": 352186, "epoch": 2096} {"train_loss": -12.527233123779297, "global_step": 352187, "epoch": 2096} {"train_loss": -12.57046127319336, "global_step": 352188, "epoch": 2096} {"train_loss": -12.691187858581543, "global_step": 352189, "epoch": 2096} {"train_loss": -12.606760025024414, "global_step": 352190, "epoch": 2096} {"train_loss": -12.195164680480957, "global_step": 352191, "epoch": 2096} {"train_loss": -12.004182815551758, "global_step": 352192, "epoch": 2096} {"train_loss": -12.47900390625, "global_step": 352193, "epoch": 2096} {"train_loss": -12.365458488464355, "global_step": 352194, "epoch": 2096} {"train_loss": -12.168157577514648, "global_step": 352195, "epoch": 2096} {"train_loss": -12.331916809082031, "global_step": 352196, "epoch": 2096} {"train_loss": -12.03821849822998, "global_step": 352197, "epoch": 2096} {"train_loss": -12.68013858795166, "global_step": 352198, "epoch": 2096} {"train_loss": -11.907793998718262, "global_step": 352199, "epoch": 2096} {"train_loss": -11.868083953857422, "global_step": 352200, "epoch": 2096} {"train_loss": -12.329541206359863, "global_step": 352201, "epoch": 2096} {"train_loss": -11.927772521972656, "global_step": 352202, "epoch": 2096} {"train_loss": -12.239458084106445, "global_step": 352203, "epoch": 2096} {"train_loss": -11.882264137268066, "global_step": 352204, "epoch": 2096} {"train_loss": -11.873298645019531, "global_step": 352205, "epoch": 2096} {"train_loss": -10.08980941772461, "global_step": 352206, "epoch": 2096} {"train_loss": -11.47793197631836, "global_step": 352207, "epoch": 2096} {"train_loss": -12.062877655029297, "global_step": 352208, "epoch": 2096} {"train_loss": -12.354629516601562, "global_step": 352209, "epoch": 2096} {"train_loss": -12.179044723510742, "global_step": 352210, "epoch": 2096} {"train_loss": -11.657485008239746, "global_step": 352211, "epoch": 2096} {"train_loss": -11.84186840057373, "global_step": 352212, "epoch": 2096} {"train_loss": -12.347799301147461, "global_step": 352213, "epoch": 2096} {"train_loss": -11.803436279296875, "global_step": 352214, "epoch": 2096} {"train_loss": -10.400725364685059, "global_step": 352215, "epoch": 2096} {"train_loss": -11.89368724822998, "global_step": 352216, "epoch": 2096} {"train_loss": -11.338747024536133, "global_step": 352217, "epoch": 2096} {"train_loss": -11.89801025390625, "global_step": 352218, "epoch": 2096} {"train_loss": -11.641302108764648, "global_step": 352219, "epoch": 2096} {"train_loss": -11.507357597351074, "global_step": 352220, "epoch": 2096} {"train_loss": -10.474440574645996, "global_step": 352221, "epoch": 2096} {"train_loss": -11.322564125061035, "global_step": 352222, "epoch": 2096} {"train_loss": -9.735769271850586, "global_step": 352223, "epoch": 2096} {"train_loss": -11.109856605529785, "global_step": 352224, "epoch": 2096} {"train_loss": -11.470747947692871, "global_step": 352225, "epoch": 2096} {"train_loss": -9.954225540161133, "global_step": 352226, "epoch": 2096} {"train_loss": -11.805288314819336, "global_step": 352227, "epoch": 2096} {"train_loss": -9.974592208862305, "global_step": 352228, "epoch": 2096} {"train_loss": -9.276159286499023, "global_step": 352229, "epoch": 2096} {"train_loss": -9.917441368103027, "global_step": 352230, "epoch": 2096} {"train_loss": -11.161046981811523, "global_step": 352231, "epoch": 2096} {"train_loss": -10.750558853149414, "global_step": 352232, "epoch": 2096} {"train_loss": -10.767277717590332, "global_step": 352233, "epoch": 2096} {"train_loss": -10.283319473266602, "global_step": 352234, "epoch": 2096} {"train_loss": -11.009122848510742, "global_step": 352235, "epoch": 2096} {"train_loss": -11.101922035217285, "global_step": 352236, "epoch": 2096} {"train_loss": -11.179458618164062, "global_step": 352237, "epoch": 2096} {"train_loss": -11.17245864868164, "global_step": 352238, "epoch": 2096} {"train_loss": -11.770925521850586, "global_step": 352239, "epoch": 2096} {"train_loss": -10.522485733032227, "global_step": 352240, "epoch": 2096} {"train_loss": -11.72564697265625, "global_step": 352241, "epoch": 2096} {"train_loss": -11.100603103637695, "global_step": 352242, "epoch": 2096} {"train_loss": -11.261652946472168, "global_step": 352243, "epoch": 2096} {"train_loss": -11.313304901123047, "global_step": 352244, "epoch": 2096} {"train_loss": -11.135993957519531, "global_step": 352245, "epoch": 2096} {"train_loss": -11.302974700927734, "global_step": 352246, "epoch": 2096} {"train_loss": -10.364904403686523, "global_step": 352247, "epoch": 2096} {"train_loss": -11.219121932983398, "global_step": 352248, "epoch": 2096} {"train_loss": -11.119386672973633, "global_step": 352249, "epoch": 2096} {"train_loss": -11.48421859741211, "global_step": 352250, "epoch": 2096} {"train_loss": -11.743331909179688, "global_step": 352251, "epoch": 2096} {"train_loss": -11.310857772827148, "global_step": 352252, "epoch": 2096} {"train_loss": -12.057113647460938, "global_step": 352253, "epoch": 2096} {"train_loss": -11.17490005493164, "global_step": 352254, "epoch": 2096} {"train_loss": -12.165508270263672, "global_step": 352255, "epoch": 2096} {"train_loss": -11.505373001098633, "global_step": 352256, "epoch": 2096} {"train_loss": -11.793899536132812, "global_step": 352257, "epoch": 2096} {"train_loss": -11.658676147460938, "global_step": 352258, "epoch": 2096} {"train_loss": -12.033994674682617, "global_step": 352259, "epoch": 2096} {"train_loss": -11.999814987182617, "global_step": 352260, "epoch": 2096} {"train_loss": -12.233636856079102, "global_step": 352261, "epoch": 2096} {"train_loss": -11.994819641113281, "global_step": 352262, "epoch": 2096} {"train_loss": -12.193309783935547, "global_step": 352263, "epoch": 2096} {"train_loss": -12.067619323730469, "global_step": 352264, "epoch": 2096} {"train_loss": -12.161070823669434, "global_step": 352265, "epoch": 2096} {"train_loss": -12.276975631713867, "global_step": 352266, "epoch": 2096} {"train_loss": -11.749692916870117, "global_step": 352267, "epoch": 2096} {"train_loss": -12.200434684753418, "global_step": 352268, "epoch": 2096} {"train_loss": -11.896923065185547, "global_step": 352269, "epoch": 2096} {"train_loss": -12.127519607543945, "global_step": 352270, "epoch": 2096} {"train_loss": -12.138690948486328, "global_step": 352271, "epoch": 2096} {"train_loss": -12.142099380493164, "global_step": 352272, "epoch": 2096} {"train_loss": -12.046534538269043, "global_step": 352273, "epoch": 2096} {"train_loss": -11.86195182800293, "global_step": 352274, "epoch": 2096} {"train_loss": -11.986898422241211, "global_step": 352275, "epoch": 2096} {"train_loss": -12.020231246948242, "global_step": 352276, "epoch": 2096} {"train_loss": -11.956551551818848, "global_step": 352277, "epoch": 2096} {"train_loss": -12.253890991210938, "global_step": 352278, "epoch": 2096} {"train_loss": -12.174960136413574, "global_step": 352279, "epoch": 2096} {"train_loss": -12.238802909851074, "global_step": 352280, "epoch": 2096} {"train_loss": -11.938253402709961, "global_step": 352281, "epoch": 2096} {"train_loss": -12.000689506530762, "global_step": 352282, "epoch": 2096} {"train_loss": -12.443790435791016, "global_step": 352283, "epoch": 2096} {"train_loss": -11.888556480407715, "global_step": 352284, "epoch": 2096} {"train_loss": -12.316875457763672, "global_step": 352285, "epoch": 2096} {"train_loss": -11.598091125488281, "global_step": 352286, "epoch": 2096} {"train_loss": -11.973663330078125, "global_step": 352287, "epoch": 2096} {"train_loss": -11.872638702392578, "global_step": 352288, "epoch": 2096} {"train_loss": -12.333576202392578, "global_step": 352289, "epoch": 2096} {"train_loss": -11.282245635986328, "global_step": 352290, "epoch": 2096} {"train_loss": -11.835367202758789, "global_step": 352291, "epoch": 2096} {"train_loss": -12.265106201171875, "global_step": 352292, "epoch": 2096} {"train_loss": -11.87606143951416, "global_step": 352293, "epoch": 2096} {"train_loss": -11.986478805541992, "global_step": 352294, "epoch": 2096} {"train_loss": -11.938424292064848, "global_step": 352295, "epoch": 2096, "val_loss": 296504.5625} {"train_loss": -12.117887496948242, "global_step": 352296, "epoch": 2097} {"train_loss": -11.994485855102539, "global_step": 352297, "epoch": 2097} {"train_loss": -12.079642295837402, "global_step": 352298, "epoch": 2097} {"train_loss": -11.941116333007812, "global_step": 352299, "epoch": 2097} {"train_loss": -12.33093547821045, "global_step": 352300, "epoch": 2097} {"train_loss": -12.055068016052246, "global_step": 352301, "epoch": 2097} {"train_loss": -12.37463665008545, "global_step": 352302, "epoch": 2097} {"train_loss": -12.003686904907227, "global_step": 352303, "epoch": 2097} {"train_loss": -12.297645568847656, "global_step": 352304, "epoch": 2097} {"train_loss": -12.160630226135254, "global_step": 352305, "epoch": 2097} {"train_loss": -12.392349243164062, "global_step": 352306, "epoch": 2097} {"train_loss": -11.860968589782715, "global_step": 352307, "epoch": 2097} {"train_loss": -11.476142883300781, "global_step": 352308, "epoch": 2097} {"train_loss": -11.810225486755371, "global_step": 352309, "epoch": 2097} {"train_loss": -12.362852096557617, "global_step": 352310, "epoch": 2097} {"train_loss": -12.3604097366333, "global_step": 352311, "epoch": 2097} {"train_loss": -12.090206146240234, "global_step": 352312, "epoch": 2097} {"train_loss": -11.837323188781738, "global_step": 352313, "epoch": 2097} {"train_loss": -12.042776107788086, "global_step": 352314, "epoch": 2097} {"train_loss": -11.990787506103516, "global_step": 352315, "epoch": 2097} {"train_loss": -12.00343132019043, "global_step": 352316, "epoch": 2097} {"train_loss": -11.575931549072266, "global_step": 352317, "epoch": 2097} {"train_loss": -12.063580513000488, "global_step": 352318, "epoch": 2097} {"train_loss": -11.718650817871094, "global_step": 352319, "epoch": 2097} {"train_loss": -11.587369918823242, "global_step": 352320, "epoch": 2097} {"train_loss": -12.061386108398438, "global_step": 352321, "epoch": 2097} {"train_loss": -12.137728691101074, "global_step": 352322, "epoch": 2097} {"train_loss": -11.600608825683594, "global_step": 352323, "epoch": 2097} {"train_loss": -12.168079376220703, "global_step": 352324, "epoch": 2097} {"train_loss": -11.70071029663086, "global_step": 352325, "epoch": 2097} {"train_loss": -11.500648498535156, "global_step": 352326, "epoch": 2097} {"train_loss": -12.024629592895508, "global_step": 352327, "epoch": 2097} {"train_loss": -12.035863876342773, "global_step": 352328, "epoch": 2097} {"train_loss": -12.320101737976074, "global_step": 352329, "epoch": 2097} {"train_loss": -12.007845878601074, "global_step": 352330, "epoch": 2097} {"train_loss": -12.007054328918457, "global_step": 352331, "epoch": 2097} {"train_loss": -11.660773277282715, "global_step": 352332, "epoch": 2097} {"train_loss": -12.057111740112305, "global_step": 352333, "epoch": 2097} {"train_loss": -11.99795150756836, "global_step": 352334, "epoch": 2097} {"train_loss": -11.936201095581055, "global_step": 352335, "epoch": 2097} {"train_loss": -12.179285049438477, "global_step": 352336, "epoch": 2097} {"train_loss": -11.629314422607422, "global_step": 352337, "epoch": 2097} {"train_loss": -12.090001106262207, "global_step": 352338, "epoch": 2097} {"train_loss": -12.003279685974121, "global_step": 352339, "epoch": 2097} {"train_loss": -11.478341102600098, "global_step": 352340, "epoch": 2097} {"train_loss": -12.418525695800781, "global_step": 352341, "epoch": 2097} {"train_loss": -11.872007369995117, "global_step": 352342, "epoch": 2097} {"train_loss": -12.248000144958496, "global_step": 352343, "epoch": 2097} {"train_loss": -12.113935470581055, "global_step": 352344, "epoch": 2097} {"train_loss": -12.342157363891602, "global_step": 352345, "epoch": 2097} {"train_loss": -11.662461280822754, "global_step": 352346, "epoch": 2097} {"train_loss": -12.275823593139648, "global_step": 352347, "epoch": 2097} {"train_loss": -12.034194946289062, "global_step": 352348, "epoch": 2097} {"train_loss": -11.561286926269531, "global_step": 352349, "epoch": 2097} {"train_loss": -12.081794738769531, "global_step": 352350, "epoch": 2097} {"train_loss": -12.178756713867188, "global_step": 352351, "epoch": 2097} {"train_loss": -12.145305633544922, "global_step": 352352, "epoch": 2097} {"train_loss": -12.540857315063477, "global_step": 352353, "epoch": 2097} {"train_loss": -12.244879722595215, "global_step": 352354, "epoch": 2097} {"train_loss": -11.98419189453125, "global_step": 352355, "epoch": 2097} {"train_loss": -12.247922897338867, "global_step": 352356, "epoch": 2097} {"train_loss": -11.608097076416016, "global_step": 352357, "epoch": 2097} {"train_loss": -10.667699813842773, "global_step": 352358, "epoch": 2097} {"train_loss": -11.693399429321289, "global_step": 352359, "epoch": 2097} {"train_loss": -10.649962425231934, "global_step": 352360, "epoch": 2097} {"train_loss": -10.562583923339844, "global_step": 352361, "epoch": 2097} {"train_loss": -11.981813430786133, "global_step": 352362, "epoch": 2097} {"train_loss": -11.582723617553711, "global_step": 352363, "epoch": 2097} {"train_loss": -10.818368911743164, "global_step": 352364, "epoch": 2097} {"train_loss": -11.562480926513672, "global_step": 352365, "epoch": 2097} {"train_loss": -10.692642211914062, "global_step": 352366, "epoch": 2097} {"train_loss": -11.136615753173828, "global_step": 352367, "epoch": 2097} {"train_loss": -11.298454284667969, "global_step": 352368, "epoch": 2097} {"train_loss": -10.655858993530273, "global_step": 352369, "epoch": 2097} {"train_loss": -11.060286521911621, "global_step": 352370, "epoch": 2097} {"train_loss": -10.704896926879883, "global_step": 352371, "epoch": 2097} {"train_loss": -10.855887413024902, "global_step": 352372, "epoch": 2097} {"train_loss": -10.780008316040039, "global_step": 352373, "epoch": 2097} {"train_loss": -11.515863418579102, "global_step": 352374, "epoch": 2097} {"train_loss": -11.745719909667969, "global_step": 352375, "epoch": 2097} {"train_loss": -11.990877151489258, "global_step": 352376, "epoch": 2097} {"train_loss": -12.01762580871582, "global_step": 352377, "epoch": 2097} {"train_loss": -11.020824432373047, "global_step": 352378, "epoch": 2097} {"train_loss": -12.160329818725586, "global_step": 352379, "epoch": 2097} {"train_loss": -11.133646011352539, "global_step": 352380, "epoch": 2097} {"train_loss": -11.843132019042969, "global_step": 352381, "epoch": 2097} {"train_loss": -11.338184356689453, "global_step": 352382, "epoch": 2097} {"train_loss": -11.995532989501953, "global_step": 352383, "epoch": 2097} {"train_loss": -11.712135314941406, "global_step": 352384, "epoch": 2097} {"train_loss": -11.64881420135498, "global_step": 352385, "epoch": 2097} {"train_loss": -11.830575942993164, "global_step": 352386, "epoch": 2097} {"train_loss": -11.994367599487305, "global_step": 352387, "epoch": 2097} {"train_loss": -11.799596786499023, "global_step": 352388, "epoch": 2097} {"train_loss": -12.421945571899414, "global_step": 352389, "epoch": 2097} {"train_loss": -12.179858207702637, "global_step": 352390, "epoch": 2097} {"train_loss": -12.0718355178833, "global_step": 352391, "epoch": 2097} {"train_loss": -12.226682662963867, "global_step": 352392, "epoch": 2097} {"train_loss": -12.113527297973633, "global_step": 352393, "epoch": 2097} {"train_loss": -12.221780776977539, "global_step": 352394, "epoch": 2097} {"train_loss": -12.22944450378418, "global_step": 352395, "epoch": 2097} {"train_loss": -12.337258338928223, "global_step": 352396, "epoch": 2097} {"train_loss": -12.153757095336914, "global_step": 352397, "epoch": 2097} {"train_loss": -12.364394187927246, "global_step": 352398, "epoch": 2097} {"train_loss": -12.289472579956055, "global_step": 352399, "epoch": 2097} {"train_loss": -12.28283405303955, "global_step": 352400, "epoch": 2097} {"train_loss": -12.232940673828125, "global_step": 352401, "epoch": 2097} {"train_loss": -12.093985557556152, "global_step": 352402, "epoch": 2097} {"train_loss": -12.399486541748047, "global_step": 352403, "epoch": 2097} {"train_loss": -12.003878593444824, "global_step": 352404, "epoch": 2097} {"train_loss": -12.42266845703125, "global_step": 352405, "epoch": 2097} {"train_loss": -12.368239402770996, "global_step": 352406, "epoch": 2097} {"train_loss": -12.463998794555664, "global_step": 352407, "epoch": 2097} {"train_loss": -12.383465766906738, "global_step": 352408, "epoch": 2097} {"train_loss": -12.164196014404297, "global_step": 352409, "epoch": 2097} {"train_loss": -12.275188446044922, "global_step": 352410, "epoch": 2097} {"train_loss": -12.35429859161377, "global_step": 352411, "epoch": 2097} {"train_loss": -12.376615524291992, "global_step": 352412, "epoch": 2097} {"train_loss": -12.444453239440918, "global_step": 352413, "epoch": 2097} {"train_loss": -12.418445587158203, "global_step": 352414, "epoch": 2097} {"train_loss": -12.34591007232666, "global_step": 352415, "epoch": 2097} {"train_loss": -12.344663619995117, "global_step": 352416, "epoch": 2097} {"train_loss": -12.441559791564941, "global_step": 352417, "epoch": 2097} {"train_loss": -12.232004165649414, "global_step": 352418, "epoch": 2097} {"train_loss": -12.21363639831543, "global_step": 352419, "epoch": 2097} {"train_loss": -12.33291244506836, "global_step": 352420, "epoch": 2097} {"train_loss": -12.377328872680664, "global_step": 352421, "epoch": 2097} {"train_loss": -12.146659851074219, "global_step": 352422, "epoch": 2097} {"train_loss": -12.20886516571045, "global_step": 352423, "epoch": 2097} {"train_loss": -12.329659461975098, "global_step": 352424, "epoch": 2097} {"train_loss": -12.20991039276123, "global_step": 352425, "epoch": 2097} {"train_loss": -12.380970001220703, "global_step": 352426, "epoch": 2097} {"train_loss": -12.295845031738281, "global_step": 352427, "epoch": 2097} {"train_loss": -12.324068069458008, "global_step": 352428, "epoch": 2097} {"train_loss": -11.978423118591309, "global_step": 352429, "epoch": 2097} {"train_loss": -12.380399703979492, "global_step": 352430, "epoch": 2097} {"train_loss": -12.141486167907715, "global_step": 352431, "epoch": 2097} {"train_loss": -12.517974853515625, "global_step": 352432, "epoch": 2097} {"train_loss": -12.032546997070312, "global_step": 352433, "epoch": 2097} {"train_loss": -12.391536712646484, "global_step": 352434, "epoch": 2097} {"train_loss": -11.982619285583496, "global_step": 352435, "epoch": 2097} {"train_loss": -12.215147018432617, "global_step": 352436, "epoch": 2097} {"train_loss": -12.459295272827148, "global_step": 352437, "epoch": 2097} {"train_loss": -12.268474578857422, "global_step": 352438, "epoch": 2097} {"train_loss": -12.496610641479492, "global_step": 352439, "epoch": 2097} {"train_loss": -12.368136405944824, "global_step": 352440, "epoch": 2097} {"train_loss": -12.281091690063477, "global_step": 352441, "epoch": 2097} {"train_loss": -12.471431732177734, "global_step": 352442, "epoch": 2097} {"train_loss": -12.566837310791016, "global_step": 352443, "epoch": 2097} {"train_loss": -12.112342834472656, "global_step": 352444, "epoch": 2097} {"train_loss": -12.459612846374512, "global_step": 352445, "epoch": 2097} {"train_loss": -12.33316421508789, "global_step": 352446, "epoch": 2097} {"train_loss": -12.731810569763184, "global_step": 352447, "epoch": 2097} {"train_loss": -12.344863891601562, "global_step": 352448, "epoch": 2097} {"train_loss": -11.421401977539062, "global_step": 352449, "epoch": 2097} {"train_loss": -12.390310287475586, "global_step": 352450, "epoch": 2097} {"train_loss": -12.18391227722168, "global_step": 352451, "epoch": 2097} {"train_loss": -12.410139083862305, "global_step": 352452, "epoch": 2097} {"train_loss": -12.178027153015137, "global_step": 352453, "epoch": 2097} {"train_loss": -12.132707595825195, "global_step": 352454, "epoch": 2097} {"train_loss": -11.589746475219727, "global_step": 352455, "epoch": 2097} {"train_loss": -11.997756958007812, "global_step": 352456, "epoch": 2097} {"train_loss": -11.346711158752441, "global_step": 352457, "epoch": 2097} {"train_loss": -11.96964168548584, "global_step": 352458, "epoch": 2097} {"train_loss": -11.71359634399414, "global_step": 352459, "epoch": 2097} {"train_loss": -12.394590377807617, "global_step": 352460, "epoch": 2097} {"train_loss": -11.596748352050781, "global_step": 352461, "epoch": 2097} {"train_loss": -12.303197860717773, "global_step": 352462, "epoch": 2097} {"train_loss": -11.992697431927635, "global_step": 352463, "epoch": 2097, "val_loss": 291704.75} {"train_loss": -12.38235092163086, "global_step": 352464, "epoch": 2098} {"train_loss": -11.596879959106445, "global_step": 352465, "epoch": 2098} {"train_loss": -11.345314025878906, "global_step": 352466, "epoch": 2098} {"train_loss": -11.542587280273438, "global_step": 352467, "epoch": 2098} {"train_loss": -11.848003387451172, "global_step": 352468, "epoch": 2098} {"train_loss": -12.304792404174805, "global_step": 352469, "epoch": 2098} {"train_loss": -12.051067352294922, "global_step": 352470, "epoch": 2098} {"train_loss": -12.230701446533203, "global_step": 352471, "epoch": 2098} {"train_loss": -12.197614669799805, "global_step": 352472, "epoch": 2098} {"train_loss": -11.95262622833252, "global_step": 352473, "epoch": 2098} {"train_loss": -12.241121292114258, "global_step": 352474, "epoch": 2098} {"train_loss": -12.5329008102417, "global_step": 352475, "epoch": 2098} {"train_loss": -12.322967529296875, "global_step": 352476, "epoch": 2098} {"train_loss": -12.21107292175293, "global_step": 352477, "epoch": 2098} {"train_loss": -12.51650619506836, "global_step": 352478, "epoch": 2098} {"train_loss": -12.242853164672852, "global_step": 352479, "epoch": 2098} {"train_loss": -11.791387557983398, "global_step": 352480, "epoch": 2098} {"train_loss": -11.221284866333008, "global_step": 352481, "epoch": 2098} {"train_loss": -12.192968368530273, "global_step": 352482, "epoch": 2098} {"train_loss": -11.526895523071289, "global_step": 352483, "epoch": 2098} {"train_loss": -10.391469955444336, "global_step": 352484, "epoch": 2098} {"train_loss": -11.278312683105469, "global_step": 352485, "epoch": 2098} {"train_loss": -12.153078079223633, "global_step": 352486, "epoch": 2098} {"train_loss": -11.145703315734863, "global_step": 352487, "epoch": 2098} {"train_loss": -11.843469619750977, "global_step": 352488, "epoch": 2098} {"train_loss": -11.446539878845215, "global_step": 352489, "epoch": 2098} {"train_loss": -10.888065338134766, "global_step": 352490, "epoch": 2098} {"train_loss": -11.765652656555176, "global_step": 352491, "epoch": 2098} {"train_loss": -11.05219841003418, "global_step": 352492, "epoch": 2098} {"train_loss": -10.058822631835938, "global_step": 352493, "epoch": 2098} {"train_loss": -11.3358736038208, "global_step": 352494, "epoch": 2098} {"train_loss": -8.584124565124512, "global_step": 352495, "epoch": 2098} {"train_loss": -8.172480583190918, "global_step": 352496, "epoch": 2098} {"train_loss": -7.973883152008057, "global_step": 352497, "epoch": 2098} {"train_loss": -8.19318962097168, "global_step": 352498, "epoch": 2098} {"train_loss": -9.102860450744629, "global_step": 352499, "epoch": 2098} {"train_loss": -9.58163833618164, "global_step": 352500, "epoch": 2098} {"train_loss": -9.484367370605469, "global_step": 352501, "epoch": 2098} {"train_loss": -8.609764099121094, "global_step": 352502, "epoch": 2098} {"train_loss": -8.60013484954834, "global_step": 352503, "epoch": 2098} {"train_loss": -10.665689468383789, "global_step": 352504, "epoch": 2098} {"train_loss": -9.247077941894531, "global_step": 352505, "epoch": 2098} {"train_loss": -9.683784484863281, "global_step": 352506, "epoch": 2098} {"train_loss": -10.278264999389648, "global_step": 352507, "epoch": 2098} {"train_loss": -10.021637916564941, "global_step": 352508, "epoch": 2098} {"train_loss": -9.828580856323242, "global_step": 352509, "epoch": 2098} {"train_loss": -10.200380325317383, "global_step": 352510, "epoch": 2098} {"train_loss": -10.564882278442383, "global_step": 352511, "epoch": 2098} {"train_loss": -9.494440078735352, "global_step": 352512, "epoch": 2098} {"train_loss": -11.28354549407959, "global_step": 352513, "epoch": 2098} {"train_loss": -10.022895812988281, "global_step": 352514, "epoch": 2098} {"train_loss": -11.46798324584961, "global_step": 352515, "epoch": 2098} {"train_loss": -9.984417915344238, "global_step": 352516, "epoch": 2098} {"train_loss": -11.239795684814453, "global_step": 352517, "epoch": 2098} {"train_loss": -9.790681838989258, "global_step": 352518, "epoch": 2098} {"train_loss": -10.398946762084961, "global_step": 352519, "epoch": 2098} {"train_loss": -9.667814254760742, "global_step": 352520, "epoch": 2098} {"train_loss": -9.950130462646484, "global_step": 352521, "epoch": 2098} {"train_loss": -9.775161743164062, "global_step": 352522, "epoch": 2098} {"train_loss": -8.927753448486328, "global_step": 352523, "epoch": 2098} {"train_loss": -11.003816604614258, "global_step": 352524, "epoch": 2098} {"train_loss": -10.587209701538086, "global_step": 352525, "epoch": 2098} {"train_loss": -10.441282272338867, "global_step": 352526, "epoch": 2098} {"train_loss": -10.467912673950195, "global_step": 352527, "epoch": 2098} {"train_loss": -9.681089401245117, "global_step": 352528, "epoch": 2098} {"train_loss": -11.538196563720703, "global_step": 352529, "epoch": 2098} {"train_loss": -9.794703483581543, "global_step": 352530, "epoch": 2098} {"train_loss": -11.18114185333252, "global_step": 352531, "epoch": 2098} {"train_loss": -10.618255615234375, "global_step": 352532, "epoch": 2098} {"train_loss": -10.986127853393555, "global_step": 352533, "epoch": 2098} {"train_loss": -11.809206008911133, "global_step": 352534, "epoch": 2098} {"train_loss": -10.363615036010742, "global_step": 352535, "epoch": 2098} {"train_loss": -11.407576560974121, "global_step": 352536, "epoch": 2098} {"train_loss": -11.070942878723145, "global_step": 352537, "epoch": 2098} {"train_loss": -10.937906265258789, "global_step": 352538, "epoch": 2098} {"train_loss": -11.402915954589844, "global_step": 352539, "epoch": 2098} {"train_loss": -11.464914321899414, "global_step": 352540, "epoch": 2098} {"train_loss": -11.566986083984375, "global_step": 352541, "epoch": 2098} {"train_loss": -11.716462135314941, "global_step": 352542, "epoch": 2098} {"train_loss": -11.549288749694824, "global_step": 352543, "epoch": 2098} {"train_loss": -11.544025421142578, "global_step": 352544, "epoch": 2098} {"train_loss": -11.596416473388672, "global_step": 352545, "epoch": 2098} {"train_loss": -11.603402137756348, "global_step": 352546, "epoch": 2098} {"train_loss": -11.56159782409668, "global_step": 352547, "epoch": 2098} {"train_loss": -11.950817108154297, "global_step": 352548, "epoch": 2098} {"train_loss": -11.549886703491211, "global_step": 352549, "epoch": 2098} {"train_loss": -11.695018768310547, "global_step": 352550, "epoch": 2098} {"train_loss": -12.118114471435547, "global_step": 352551, "epoch": 2098} {"train_loss": -11.584856986999512, "global_step": 352552, "epoch": 2098} {"train_loss": -11.937247276306152, "global_step": 352553, "epoch": 2098} {"train_loss": -11.818172454833984, "global_step": 352554, "epoch": 2098} {"train_loss": -11.543327331542969, "global_step": 352555, "epoch": 2098} {"train_loss": -11.866920471191406, "global_step": 352556, "epoch": 2098} {"train_loss": -11.570281028747559, "global_step": 352557, "epoch": 2098} {"train_loss": -11.955809593200684, "global_step": 352558, "epoch": 2098} {"train_loss": -11.712715148925781, "global_step": 352559, "epoch": 2098} {"train_loss": -11.730523109436035, "global_step": 352560, "epoch": 2098} {"train_loss": -12.145267486572266, "global_step": 352561, "epoch": 2098} {"train_loss": -11.872760772705078, "global_step": 352562, "epoch": 2098} {"train_loss": -11.901365280151367, "global_step": 352563, "epoch": 2098} {"train_loss": -11.68807601928711, "global_step": 352564, "epoch": 2098} {"train_loss": -11.812884330749512, "global_step": 352565, "epoch": 2098} {"train_loss": -11.795604705810547, "global_step": 352566, "epoch": 2098} {"train_loss": -11.837512016296387, "global_step": 352567, "epoch": 2098} {"train_loss": -11.956734657287598, "global_step": 352568, "epoch": 2098} {"train_loss": -11.864527702331543, "global_step": 352569, "epoch": 2098} {"train_loss": -11.8687105178833, "global_step": 352570, "epoch": 2098} {"train_loss": -11.763548851013184, "global_step": 352571, "epoch": 2098} {"train_loss": -12.2036714553833, "global_step": 352572, "epoch": 2098} {"train_loss": -12.133749008178711, "global_step": 352573, "epoch": 2098} {"train_loss": -12.168153762817383, "global_step": 352574, "epoch": 2098} {"train_loss": -11.930976867675781, "global_step": 352575, "epoch": 2098} {"train_loss": -11.985464096069336, "global_step": 352576, "epoch": 2098} {"train_loss": -12.06224536895752, "global_step": 352577, "epoch": 2098} {"train_loss": -11.98288345336914, "global_step": 352578, "epoch": 2098} {"train_loss": -12.133255004882812, "global_step": 352579, "epoch": 2098} {"train_loss": -12.124505043029785, "global_step": 352580, "epoch": 2098} {"train_loss": -11.906822204589844, "global_step": 352581, "epoch": 2098} {"train_loss": -12.147994995117188, "global_step": 352582, "epoch": 2098} {"train_loss": -11.856677055358887, "global_step": 352583, "epoch": 2098} {"train_loss": -12.296960830688477, "global_step": 352584, "epoch": 2098} {"train_loss": -11.962275505065918, "global_step": 352585, "epoch": 2098} {"train_loss": -12.213254928588867, "global_step": 352586, "epoch": 2098} {"train_loss": -12.102163314819336, "global_step": 352587, "epoch": 2098} {"train_loss": -12.186988830566406, "global_step": 352588, "epoch": 2098} {"train_loss": -12.320817947387695, "global_step": 352589, "epoch": 2098} {"train_loss": -12.223344802856445, "global_step": 352590, "epoch": 2098} {"train_loss": -12.244233131408691, "global_step": 352591, "epoch": 2098} {"train_loss": -12.172356605529785, "global_step": 352592, "epoch": 2098} {"train_loss": -12.182427406311035, "global_step": 352593, "epoch": 2098} {"train_loss": -12.309929847717285, "global_step": 352594, "epoch": 2098} {"train_loss": -12.263172149658203, "global_step": 352595, "epoch": 2098} {"train_loss": -12.29811954498291, "global_step": 352596, "epoch": 2098} {"train_loss": -12.413192749023438, "global_step": 352597, "epoch": 2098} {"train_loss": -12.322022438049316, "global_step": 352598, "epoch": 2098} {"train_loss": -12.119342803955078, "global_step": 352599, "epoch": 2098} {"train_loss": -12.444551467895508, "global_step": 352600, "epoch": 2098} {"train_loss": -12.128632545471191, "global_step": 352601, "epoch": 2098} {"train_loss": -12.249244689941406, "global_step": 352602, "epoch": 2098} {"train_loss": -12.291614532470703, "global_step": 352603, "epoch": 2098} {"train_loss": -12.310750961303711, "global_step": 352604, "epoch": 2098} {"train_loss": -12.333656311035156, "global_step": 352605, "epoch": 2098} {"train_loss": -12.094342231750488, "global_step": 352606, "epoch": 2098} {"train_loss": -11.906421661376953, "global_step": 352607, "epoch": 2098} {"train_loss": -12.20802116394043, "global_step": 352608, "epoch": 2098} {"train_loss": -11.961181640625, "global_step": 352609, "epoch": 2098} {"train_loss": -11.943838119506836, "global_step": 352610, "epoch": 2098} {"train_loss": -12.398080825805664, "global_step": 352611, "epoch": 2098} {"train_loss": -11.831439971923828, "global_step": 352612, "epoch": 2098} {"train_loss": -12.197439193725586, "global_step": 352613, "epoch": 2098} {"train_loss": -12.147462844848633, "global_step": 352614, "epoch": 2098} {"train_loss": -11.967220306396484, "global_step": 352615, "epoch": 2098} {"train_loss": -12.139036178588867, "global_step": 352616, "epoch": 2098} {"train_loss": -12.541950225830078, "global_step": 352617, "epoch": 2098} {"train_loss": -12.26363754272461, "global_step": 352618, "epoch": 2098} {"train_loss": -12.360325813293457, "global_step": 352619, "epoch": 2098} {"train_loss": -12.382087707519531, "global_step": 352620, "epoch": 2098} {"train_loss": -12.223690032958984, "global_step": 352621, "epoch": 2098} {"train_loss": -12.214303970336914, "global_step": 352622, "epoch": 2098} {"train_loss": -12.14797592163086, "global_step": 352623, "epoch": 2098} {"train_loss": -12.558453559875488, "global_step": 352624, "epoch": 2098} {"train_loss": -12.36410140991211, "global_step": 352625, "epoch": 2098} {"train_loss": -12.323480606079102, "global_step": 352626, "epoch": 2098} {"train_loss": -12.03989315032959, "global_step": 352627, "epoch": 2098} {"train_loss": -12.397579193115234, "global_step": 352628, "epoch": 2098} {"train_loss": -12.349809646606445, "global_step": 352629, "epoch": 2098} {"train_loss": -12.317110061645508, "global_step": 352630, "epoch": 2098} {"train_loss": -11.462053262052082, "global_step": 352631, "epoch": 2098, "val_loss": 288683.34375} {"train_loss": -12.378707885742188, "global_step": 352632, "epoch": 2099} {"train_loss": -12.24494743347168, "global_step": 352633, "epoch": 2099} {"train_loss": -12.176111221313477, "global_step": 352634, "epoch": 2099} {"train_loss": -12.529661178588867, "global_step": 352635, "epoch": 2099} {"train_loss": -12.258094787597656, "global_step": 352636, "epoch": 2099} {"train_loss": -12.549656867980957, "global_step": 352637, "epoch": 2099} {"train_loss": -12.021215438842773, "global_step": 352638, "epoch": 2099} {"train_loss": -12.273924827575684, "global_step": 352639, "epoch": 2099} {"train_loss": -12.379134178161621, "global_step": 352640, "epoch": 2099} {"train_loss": -12.77227783203125, "global_step": 352641, "epoch": 2099} {"train_loss": -12.424581527709961, "global_step": 352642, "epoch": 2099} {"train_loss": -12.577942848205566, "global_step": 352643, "epoch": 2099} {"train_loss": -12.720991134643555, "global_step": 352644, "epoch": 2099} {"train_loss": -12.479791641235352, "global_step": 352645, "epoch": 2099} {"train_loss": -12.618345260620117, "global_step": 352646, "epoch": 2099} {"train_loss": -12.166040420532227, "global_step": 352647, "epoch": 2099} {"train_loss": -12.608182907104492, "global_step": 352648, "epoch": 2099} {"train_loss": -12.507574081420898, "global_step": 352649, "epoch": 2099} {"train_loss": -12.439098358154297, "global_step": 352650, "epoch": 2099} {"train_loss": -12.727245330810547, "global_step": 352651, "epoch": 2099} {"train_loss": -12.734528541564941, "global_step": 352652, "epoch": 2099} {"train_loss": -12.663818359375, "global_step": 352653, "epoch": 2099} {"train_loss": -12.634739875793457, "global_step": 352654, "epoch": 2099} {"train_loss": -12.742820739746094, "global_step": 352655, "epoch": 2099} {"train_loss": -12.678716659545898, "global_step": 352656, "epoch": 2099} {"train_loss": -12.424181938171387, "global_step": 352657, "epoch": 2099} {"train_loss": -12.730379104614258, "global_step": 352658, "epoch": 2099} {"train_loss": -12.510062217712402, "global_step": 352659, "epoch": 2099} {"train_loss": -12.530379295349121, "global_step": 352660, "epoch": 2099} {"train_loss": -12.72317123413086, "global_step": 352661, "epoch": 2099} {"train_loss": -12.776870727539062, "global_step": 352662, "epoch": 2099} {"train_loss": -12.945901870727539, "global_step": 352663, "epoch": 2099} {"train_loss": -12.636797904968262, "global_step": 352664, "epoch": 2099} {"train_loss": -12.62470817565918, "global_step": 352665, "epoch": 2099} {"train_loss": -12.869813919067383, "global_step": 352666, "epoch": 2099} {"train_loss": -12.578216552734375, "global_step": 352667, "epoch": 2099} {"train_loss": -12.6810302734375, "global_step": 352668, "epoch": 2099} {"train_loss": -12.631427764892578, "global_step": 352669, "epoch": 2099} {"train_loss": -12.7245512008667, "global_step": 352670, "epoch": 2099} {"train_loss": -12.677838325500488, "global_step": 352671, "epoch": 2099} {"train_loss": -12.612072944641113, "global_step": 352672, "epoch": 2099} {"train_loss": -12.715429306030273, "global_step": 352673, "epoch": 2099} {"train_loss": -12.64563274383545, "global_step": 352674, "epoch": 2099} {"train_loss": -12.424077987670898, "global_step": 352675, "epoch": 2099} {"train_loss": -12.49534797668457, "global_step": 352676, "epoch": 2099} {"train_loss": -12.524347305297852, "global_step": 352677, "epoch": 2099} {"train_loss": -12.574275016784668, "global_step": 352678, "epoch": 2099} {"train_loss": -12.892068862915039, "global_step": 352679, "epoch": 2099} {"train_loss": -12.326045989990234, "global_step": 352680, "epoch": 2099} {"train_loss": -12.078485488891602, "global_step": 352681, "epoch": 2099} {"train_loss": -11.703838348388672, "global_step": 352682, "epoch": 2099} {"train_loss": -11.547226905822754, "global_step": 352683, "epoch": 2099} {"train_loss": -11.062908172607422, "global_step": 352684, "epoch": 2099} {"train_loss": -12.266956329345703, "global_step": 352685, "epoch": 2099} {"train_loss": -11.989612579345703, "global_step": 352686, "epoch": 2099} {"train_loss": -12.037115097045898, "global_step": 352687, "epoch": 2099} {"train_loss": -11.235426902770996, "global_step": 352688, "epoch": 2099} {"train_loss": -11.585222244262695, "global_step": 352689, "epoch": 2099} {"train_loss": -12.067992210388184, "global_step": 352690, "epoch": 2099} {"train_loss": -10.979142189025879, "global_step": 352691, "epoch": 2099} {"train_loss": -11.730178833007812, "global_step": 352692, "epoch": 2099} {"train_loss": -9.412046432495117, "global_step": 352693, "epoch": 2099} {"train_loss": -9.512896537780762, "global_step": 352694, "epoch": 2099} {"train_loss": -9.875322341918945, "global_step": 352695, "epoch": 2099} {"train_loss": -9.784523010253906, "global_step": 352696, "epoch": 2099} {"train_loss": -10.451704025268555, "global_step": 352697, "epoch": 2099} {"train_loss": -8.558287620544434, "global_step": 352698, "epoch": 2099} {"train_loss": -8.956582069396973, "global_step": 352699, "epoch": 2099} {"train_loss": -7.86236047744751, "global_step": 352700, "epoch": 2099} {"train_loss": -8.55612564086914, "global_step": 352701, "epoch": 2099} {"train_loss": -9.842772483825684, "global_step": 352702, "epoch": 2099} {"train_loss": -10.943402290344238, "global_step": 352703, "epoch": 2099} {"train_loss": -9.571261405944824, "global_step": 352704, "epoch": 2099} {"train_loss": -10.539645195007324, "global_step": 352705, "epoch": 2099} {"train_loss": -10.107589721679688, "global_step": 352706, "epoch": 2099} {"train_loss": -10.419782638549805, "global_step": 352707, "epoch": 2099} {"train_loss": -10.643148422241211, "global_step": 352708, "epoch": 2099} {"train_loss": -10.263236999511719, "global_step": 352709, "epoch": 2099} {"train_loss": -10.35934066772461, "global_step": 352710, "epoch": 2099} {"train_loss": -10.700788497924805, "global_step": 352711, "epoch": 2099} {"train_loss": -10.864500999450684, "global_step": 352712, "epoch": 2099} {"train_loss": -10.482889175415039, "global_step": 352713, "epoch": 2099} {"train_loss": -10.465801239013672, "global_step": 352714, "epoch": 2099} {"train_loss": -11.445026397705078, "global_step": 352715, "epoch": 2099} {"train_loss": -10.658092498779297, "global_step": 352716, "epoch": 2099} {"train_loss": -11.996859550476074, "global_step": 352717, "epoch": 2099} {"train_loss": -10.641157150268555, "global_step": 352718, "epoch": 2099} {"train_loss": -12.010370254516602, "global_step": 352719, "epoch": 2099} {"train_loss": -11.670045852661133, "global_step": 352720, "epoch": 2099} {"train_loss": -11.441104888916016, "global_step": 352721, "epoch": 2099} {"train_loss": -11.290711402893066, "global_step": 352722, "epoch": 2099} {"train_loss": -10.975493431091309, "global_step": 352723, "epoch": 2099} {"train_loss": -11.411781311035156, "global_step": 352724, "epoch": 2099} {"train_loss": -10.608062744140625, "global_step": 352725, "epoch": 2099} {"train_loss": -10.511550903320312, "global_step": 352726, "epoch": 2099} {"train_loss": -11.31531810760498, "global_step": 352727, "epoch": 2099} {"train_loss": -10.676115989685059, "global_step": 352728, "epoch": 2099} {"train_loss": -11.314510345458984, "global_step": 352729, "epoch": 2099} {"train_loss": -10.87919807434082, "global_step": 352730, "epoch": 2099} {"train_loss": -11.578079223632812, "global_step": 352731, "epoch": 2099} {"train_loss": -11.271060943603516, "global_step": 352732, "epoch": 2099} {"train_loss": -11.142175674438477, "global_step": 352733, "epoch": 2099} {"train_loss": -11.597827911376953, "global_step": 352734, "epoch": 2099} {"train_loss": -11.265759468078613, "global_step": 352735, "epoch": 2099} {"train_loss": -11.714530944824219, "global_step": 352736, "epoch": 2099} {"train_loss": -11.307714462280273, "global_step": 352737, "epoch": 2099} {"train_loss": -12.121519088745117, "global_step": 352738, "epoch": 2099} {"train_loss": -11.869377136230469, "global_step": 352739, "epoch": 2099} {"train_loss": -11.899900436401367, "global_step": 352740, "epoch": 2099} {"train_loss": -11.715731620788574, "global_step": 352741, "epoch": 2099} {"train_loss": -11.937028884887695, "global_step": 352742, "epoch": 2099} {"train_loss": -12.148226737976074, "global_step": 352743, "epoch": 2099} {"train_loss": -11.603250503540039, "global_step": 352744, "epoch": 2099} {"train_loss": -12.423152923583984, "global_step": 352745, "epoch": 2099} {"train_loss": -11.83485221862793, "global_step": 352746, "epoch": 2099} {"train_loss": -12.037558555603027, "global_step": 352747, "epoch": 2099} {"train_loss": -12.156469345092773, "global_step": 352748, "epoch": 2099} {"train_loss": -12.184432029724121, "global_step": 352749, "epoch": 2099} {"train_loss": -12.119277954101562, "global_step": 352750, "epoch": 2099} {"train_loss": -12.19667911529541, "global_step": 352751, "epoch": 2099} {"train_loss": -12.096966743469238, "global_step": 352752, "epoch": 2099} {"train_loss": -12.283523559570312, "global_step": 352753, "epoch": 2099} {"train_loss": -12.00433349609375, "global_step": 352754, "epoch": 2099} {"train_loss": -12.33915901184082, "global_step": 352755, "epoch": 2099} {"train_loss": -12.240803718566895, "global_step": 352756, "epoch": 2099} {"train_loss": -12.327116012573242, "global_step": 352757, "epoch": 2099} {"train_loss": -12.228593826293945, "global_step": 352758, "epoch": 2099} {"train_loss": -12.33298397064209, "global_step": 352759, "epoch": 2099} {"train_loss": -12.189872741699219, "global_step": 352760, "epoch": 2099} {"train_loss": -12.32638168334961, "global_step": 352761, "epoch": 2099} {"train_loss": -12.292970657348633, "global_step": 352762, "epoch": 2099} {"train_loss": -12.500425338745117, "global_step": 352763, "epoch": 2099} {"train_loss": -12.287015914916992, "global_step": 352764, "epoch": 2099} {"train_loss": -12.30350112915039, "global_step": 352765, "epoch": 2099} {"train_loss": -12.393109321594238, "global_step": 352766, "epoch": 2099} {"train_loss": -12.477777481079102, "global_step": 352767, "epoch": 2099} {"train_loss": -12.336504936218262, "global_step": 352768, "epoch": 2099} {"train_loss": -12.330716133117676, "global_step": 352769, "epoch": 2099} {"train_loss": -12.391656875610352, "global_step": 352770, "epoch": 2099} {"train_loss": -12.488298416137695, "global_step": 352771, "epoch": 2099} {"train_loss": -12.456609725952148, "global_step": 352772, "epoch": 2099} {"train_loss": -12.466241836547852, "global_step": 352773, "epoch": 2099} {"train_loss": -12.367254257202148, "global_step": 352774, "epoch": 2099} {"train_loss": -12.680408477783203, "global_step": 352775, "epoch": 2099} {"train_loss": -12.568719863891602, "global_step": 352776, "epoch": 2099} {"train_loss": -12.532182693481445, "global_step": 352777, "epoch": 2099} {"train_loss": -12.431217193603516, "global_step": 352778, "epoch": 2099} {"train_loss": -12.494840621948242, "global_step": 352779, "epoch": 2099} {"train_loss": -12.58443832397461, "global_step": 352780, "epoch": 2099} {"train_loss": -12.462095260620117, "global_step": 352781, "epoch": 2099} {"train_loss": -12.6676025390625, "global_step": 352782, "epoch": 2099} {"train_loss": -12.192413330078125, "global_step": 352783, "epoch": 2099} {"train_loss": -12.23403549194336, "global_step": 352784, "epoch": 2099} {"train_loss": -12.016119956970215, "global_step": 352785, "epoch": 2099} {"train_loss": -12.263283729553223, "global_step": 352786, "epoch": 2099} {"train_loss": -12.348658561706543, "global_step": 352787, "epoch": 2099} {"train_loss": -12.27651596069336, "global_step": 352788, "epoch": 2099} {"train_loss": -12.582290649414062, "global_step": 352789, "epoch": 2099} {"train_loss": -11.982824325561523, "global_step": 352790, "epoch": 2099} {"train_loss": -12.251181602478027, "global_step": 352791, "epoch": 2099} {"train_loss": -12.173014640808105, "global_step": 352792, "epoch": 2099} {"train_loss": -12.528218269348145, "global_step": 352793, "epoch": 2099} {"train_loss": -11.890068054199219, "global_step": 352794, "epoch": 2099} {"train_loss": -12.245384216308594, "global_step": 352795, "epoch": 2099} {"train_loss": -12.064374923706055, "global_step": 352796, "epoch": 2099} {"train_loss": -12.217765808105469, "global_step": 352797, "epoch": 2099} {"train_loss": -12.005664825439453, "global_step": 352798, "epoch": 2099} {"train_loss": -11.851936382906777, "global_step": 352799, "epoch": 2099, "val_loss": 289116.59375} {"train_loss": -12.202438354492188, "global_step": 352800, "epoch": 2100} {"train_loss": -11.887149810791016, "global_step": 352801, "epoch": 2100} {"train_loss": -12.2461576461792, "global_step": 352802, "epoch": 2100} {"train_loss": -11.766518592834473, "global_step": 352803, "epoch": 2100} {"train_loss": -12.51540756225586, "global_step": 352804, "epoch": 2100} {"train_loss": -12.126241683959961, "global_step": 352805, "epoch": 2100} {"train_loss": -12.139411926269531, "global_step": 352806, "epoch": 2100} {"train_loss": -11.85308837890625, "global_step": 352807, "epoch": 2100} {"train_loss": -11.677473068237305, "global_step": 352808, "epoch": 2100} {"train_loss": -11.301462173461914, "global_step": 352809, "epoch": 2100} {"train_loss": -11.373476028442383, "global_step": 352810, "epoch": 2100} {"train_loss": -9.99715805053711, "global_step": 352811, "epoch": 2100} {"train_loss": -10.402875900268555, "global_step": 352812, "epoch": 2100} {"train_loss": -9.3031644821167, "global_step": 352813, "epoch": 2100} {"train_loss": -10.590843200683594, "global_step": 352814, "epoch": 2100} {"train_loss": -9.728300094604492, "global_step": 352815, "epoch": 2100} {"train_loss": -10.001041412353516, "global_step": 352816, "epoch": 2100} {"train_loss": -8.99376106262207, "global_step": 352817, "epoch": 2100} {"train_loss": -9.761421203613281, "global_step": 352818, "epoch": 2100} {"train_loss": -11.12051773071289, "global_step": 352819, "epoch": 2100} {"train_loss": -11.038333892822266, "global_step": 352820, "epoch": 2100} {"train_loss": -10.623672485351562, "global_step": 352821, "epoch": 2100} {"train_loss": -11.48091983795166, "global_step": 352822, "epoch": 2100} {"train_loss": -11.726490020751953, "global_step": 352823, "epoch": 2100} {"train_loss": -11.601665496826172, "global_step": 352824, "epoch": 2100} {"train_loss": -11.835528373718262, "global_step": 352825, "epoch": 2100} {"train_loss": -10.962505340576172, "global_step": 352826, "epoch": 2100} {"train_loss": -12.106760025024414, "global_step": 352827, "epoch": 2100} {"train_loss": -11.81539535522461, "global_step": 352828, "epoch": 2100} {"train_loss": -11.829992294311523, "global_step": 352829, "epoch": 2100} {"train_loss": -11.341835021972656, "global_step": 352830, "epoch": 2100} {"train_loss": -12.013513565063477, "global_step": 352831, "epoch": 2100} {"train_loss": -11.42900276184082, "global_step": 352832, "epoch": 2100} {"train_loss": -11.838155746459961, "global_step": 352833, "epoch": 2100} {"train_loss": -11.558379173278809, "global_step": 352834, "epoch": 2100} {"train_loss": -11.797563552856445, "global_step": 352835, "epoch": 2100} {"train_loss": -11.9716215133667, "global_step": 352836, "epoch": 2100} {"train_loss": -12.213064193725586, "global_step": 352837, "epoch": 2100} {"train_loss": -12.032095909118652, "global_step": 352838, "epoch": 2100} {"train_loss": -12.213750839233398, "global_step": 352839, "epoch": 2100} {"train_loss": -11.917774200439453, "global_step": 352840, "epoch": 2100} {"train_loss": -11.574535369873047, "global_step": 352841, "epoch": 2100} {"train_loss": -11.933656692504883, "global_step": 352842, "epoch": 2100} {"train_loss": -11.901946067810059, "global_step": 352843, "epoch": 2100} {"train_loss": -11.881272315979004, "global_step": 352844, "epoch": 2100} {"train_loss": -11.700263977050781, "global_step": 352845, "epoch": 2100} {"train_loss": -11.795646667480469, "global_step": 352846, "epoch": 2100} {"train_loss": -12.244999885559082, "global_step": 352847, "epoch": 2100} {"train_loss": -12.131887435913086, "global_step": 352848, "epoch": 2100} {"train_loss": -11.969045639038086, "global_step": 352849, "epoch": 2100} {"train_loss": -12.192331314086914, "global_step": 352850, "epoch": 2100} {"train_loss": -11.942455291748047, "global_step": 352851, "epoch": 2100} {"train_loss": -12.323816299438477, "global_step": 352852, "epoch": 2100} {"train_loss": -11.899144172668457, "global_step": 352853, "epoch": 2100} {"train_loss": -12.136008262634277, "global_step": 352854, "epoch": 2100} {"train_loss": -12.072456359863281, "global_step": 352855, "epoch": 2100} {"train_loss": -12.196493148803711, "global_step": 352856, "epoch": 2100} {"train_loss": -11.700613021850586, "global_step": 352857, "epoch": 2100} {"train_loss": -12.36414909362793, "global_step": 352858, "epoch": 2100} {"train_loss": -11.928037643432617, "global_step": 352859, "epoch": 2100} {"train_loss": -12.401517868041992, "global_step": 352860, "epoch": 2100} {"train_loss": -11.968827247619629, "global_step": 352861, "epoch": 2100} {"train_loss": -12.535895347595215, "global_step": 352862, "epoch": 2100} {"train_loss": -12.085775375366211, "global_step": 352863, "epoch": 2100} {"train_loss": -12.335456848144531, "global_step": 352864, "epoch": 2100} {"train_loss": -12.249093055725098, "global_step": 352865, "epoch": 2100} {"train_loss": -12.099615097045898, "global_step": 352866, "epoch": 2100} {"train_loss": -12.198042869567871, "global_step": 352867, "epoch": 2100} {"train_loss": -12.394872665405273, "global_step": 352868, "epoch": 2100} {"train_loss": -11.809659957885742, "global_step": 352869, "epoch": 2100} {"train_loss": -12.081033706665039, "global_step": 352870, "epoch": 2100} {"train_loss": -11.8322172164917, "global_step": 352871, "epoch": 2100} {"train_loss": -12.098963737487793, "global_step": 352872, "epoch": 2100} {"train_loss": -11.796577453613281, "global_step": 352873, "epoch": 2100} {"train_loss": -11.80528450012207, "global_step": 352874, "epoch": 2100} {"train_loss": -12.275794982910156, "global_step": 352875, "epoch": 2100} {"train_loss": -11.81039047241211, "global_step": 352876, "epoch": 2100} {"train_loss": -11.72580337524414, "global_step": 352877, "epoch": 2100} {"train_loss": -12.071070671081543, "global_step": 352878, "epoch": 2100} {"train_loss": -11.732620239257812, "global_step": 352879, "epoch": 2100} {"train_loss": -11.198809623718262, "global_step": 352880, "epoch": 2100} {"train_loss": -11.154458045959473, "global_step": 352881, "epoch": 2100} {"train_loss": -11.656519889831543, "global_step": 352882, "epoch": 2100} {"train_loss": -9.971553802490234, "global_step": 352883, "epoch": 2100} {"train_loss": -9.965999603271484, "global_step": 352884, "epoch": 2100} {"train_loss": -11.609197616577148, "global_step": 352885, "epoch": 2100} {"train_loss": -10.185585975646973, "global_step": 352886, "epoch": 2100} {"train_loss": -10.447304725646973, "global_step": 352887, "epoch": 2100} {"train_loss": -10.760478973388672, "global_step": 352888, "epoch": 2100} {"train_loss": -8.98300552368164, "global_step": 352889, "epoch": 2100} {"train_loss": -9.075838088989258, "global_step": 352890, "epoch": 2100} {"train_loss": -11.357731819152832, "global_step": 352891, "epoch": 2100} {"train_loss": -9.894510269165039, "global_step": 352892, "epoch": 2100} {"train_loss": -10.619723320007324, "global_step": 352893, "epoch": 2100} {"train_loss": -10.73400592803955, "global_step": 352894, "epoch": 2100} {"train_loss": -10.1865234375, "global_step": 352895, "epoch": 2100} {"train_loss": -9.42395305633545, "global_step": 352896, "epoch": 2100} {"train_loss": -11.146568298339844, "global_step": 352897, "epoch": 2100} {"train_loss": -10.03127670288086, "global_step": 352898, "epoch": 2100} {"train_loss": -9.604494094848633, "global_step": 352899, "epoch": 2100} {"train_loss": -9.65376091003418, "global_step": 352900, "epoch": 2100} {"train_loss": -11.675159454345703, "global_step": 352901, "epoch": 2100} {"train_loss": -10.1322021484375, "global_step": 352902, "epoch": 2100} {"train_loss": -10.200618743896484, "global_step": 352903, "epoch": 2100} {"train_loss": -11.348548889160156, "global_step": 352904, "epoch": 2100} {"train_loss": -11.003281593322754, "global_step": 352905, "epoch": 2100} {"train_loss": -10.464292526245117, "global_step": 352906, "epoch": 2100} {"train_loss": -11.79110050201416, "global_step": 352907, "epoch": 2100} {"train_loss": -10.484915733337402, "global_step": 352908, "epoch": 2100} {"train_loss": -11.283607482910156, "global_step": 352909, "epoch": 2100} {"train_loss": -11.704814910888672, "global_step": 352910, "epoch": 2100} {"train_loss": -11.103546142578125, "global_step": 352911, "epoch": 2100} {"train_loss": -11.615447998046875, "global_step": 352912, "epoch": 2100} {"train_loss": -11.963949203491211, "global_step": 352913, "epoch": 2100} {"train_loss": -11.484962463378906, "global_step": 352914, "epoch": 2100} {"train_loss": -11.869787216186523, "global_step": 352915, "epoch": 2100} {"train_loss": -11.554460525512695, "global_step": 352916, "epoch": 2100} {"train_loss": -11.827352523803711, "global_step": 352917, "epoch": 2100} {"train_loss": -11.856480598449707, "global_step": 352918, "epoch": 2100} {"train_loss": -11.708562850952148, "global_step": 352919, "epoch": 2100} {"train_loss": -12.038622856140137, "global_step": 352920, "epoch": 2100} {"train_loss": -11.646690368652344, "global_step": 352921, "epoch": 2100} {"train_loss": -12.0571928024292, "global_step": 352922, "epoch": 2100} {"train_loss": -11.73257827758789, "global_step": 352923, "epoch": 2100} {"train_loss": -12.066621780395508, "global_step": 352924, "epoch": 2100} {"train_loss": -11.902775764465332, "global_step": 352925, "epoch": 2100} {"train_loss": -12.163213729858398, "global_step": 352926, "epoch": 2100} {"train_loss": -12.117584228515625, "global_step": 352927, "epoch": 2100} {"train_loss": -11.992671966552734, "global_step": 352928, "epoch": 2100} {"train_loss": -11.93252944946289, "global_step": 352929, "epoch": 2100} {"train_loss": -11.916459083557129, "global_step": 352930, "epoch": 2100} {"train_loss": -12.169150352478027, "global_step": 352931, "epoch": 2100} {"train_loss": -11.900044441223145, "global_step": 352932, "epoch": 2100} {"train_loss": -12.246747016906738, "global_step": 352933, "epoch": 2100} {"train_loss": -12.090982437133789, "global_step": 352934, "epoch": 2100} {"train_loss": -12.15656852722168, "global_step": 352935, "epoch": 2100} {"train_loss": -12.310465812683105, "global_step": 352936, "epoch": 2100} {"train_loss": -12.232561111450195, "global_step": 352937, "epoch": 2100} {"train_loss": -12.322858810424805, "global_step": 352938, "epoch": 2100} {"train_loss": -12.259990692138672, "global_step": 352939, "epoch": 2100} {"train_loss": -12.280646324157715, "global_step": 352940, "epoch": 2100} {"train_loss": -12.321332931518555, "global_step": 352941, "epoch": 2100} {"train_loss": -12.169824600219727, "global_step": 352942, "epoch": 2100} {"train_loss": -12.229361534118652, "global_step": 352943, "epoch": 2100} {"train_loss": -12.154266357421875, "global_step": 352944, "epoch": 2100} {"train_loss": -12.236120223999023, "global_step": 352945, "epoch": 2100} {"train_loss": -12.405265808105469, "global_step": 352946, "epoch": 2100} {"train_loss": -12.340364456176758, "global_step": 352947, "epoch": 2100} {"train_loss": -12.31611442565918, "global_step": 352948, "epoch": 2100} {"train_loss": -12.389680862426758, "global_step": 352949, "epoch": 2100} {"train_loss": -12.562972068786621, "global_step": 352950, "epoch": 2100} {"train_loss": -12.4827880859375, "global_step": 352951, "epoch": 2100} {"train_loss": -12.449005126953125, "global_step": 352952, "epoch": 2100} {"train_loss": -12.385393142700195, "global_step": 352953, "epoch": 2100} {"train_loss": -12.467297554016113, "global_step": 352954, "epoch": 2100} {"train_loss": -12.455263137817383, "global_step": 352955, "epoch": 2100} {"train_loss": -12.503984451293945, "global_step": 352956, "epoch": 2100} {"train_loss": -12.465588569641113, "global_step": 352957, "epoch": 2100} {"train_loss": -12.336409568786621, "global_step": 352958, "epoch": 2100} {"train_loss": -12.299297332763672, "global_step": 352959, "epoch": 2100} {"train_loss": -12.539933204650879, "global_step": 352960, "epoch": 2100} {"train_loss": -12.502391815185547, "global_step": 352961, "epoch": 2100} {"train_loss": -12.395398139953613, "global_step": 352962, "epoch": 2100} {"train_loss": -12.60994815826416, "global_step": 352963, "epoch": 2100} {"train_loss": -12.578760147094727, "global_step": 352964, "epoch": 2100} {"train_loss": -12.630413055419922, "global_step": 352965, "epoch": 2100} {"train_loss": -12.42507553100586, "global_step": 352966, "epoch": 2100} {"train_loss": -11.647841879299708, "global_step": 352967, "epoch": 2100, "train/sim_max_reward_0": 0.6941311558788477, "train/sim_max_reward_1": 0.9781113003340756, "train/sim_max_reward_2": 0.0052746159773498676, "train/sim_max_reward_3": 0.6819483981295104, "train/sim_max_reward_4": 0.964803072030041, "train/sim_max_reward_5": 0.5698223661864545, "test/sim_max_reward_4400000": 0.9730575537602587, "test/sim_max_reward_4400001": 0.40452796298806093, "test/sim_max_reward_4400002": 0.9592029956226782, "test/sim_max_reward_4400003": 0.9250403733774268, "test/sim_max_reward_4400004": 0.5366388451481938, "test/sim_max_reward_4400005": 0.9519127606997739, "test/sim_max_reward_4400006": 0.3605946727847028, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 0.5974649707138636, "test/sim_max_reward_4400009": 0.365594987874595, "test/sim_max_reward_4400010": 0.5347109972468931, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 0.7338166187118413, "test/sim_max_reward_4400013": 0.9453667794753523, "test/sim_max_reward_4400014": 0.6370600583402948, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.1273807568422073, "test/sim_max_reward_4400018": 0.9452533182515168, "test/sim_max_reward_4400019": 0.48350315091707985, "test/sim_max_reward_4400020": 0.46511506859555235, "test/sim_max_reward_4400021": 0.685010976269471, "test/sim_max_reward_4400022": 0.9896482224900071, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.9887936762819219, "test/sim_max_reward_4400025": 0.7081733821292624, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.43760479998675156, "test/sim_max_reward_4400028": 0.9893662932303996, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9970884946652974, "test/sim_max_reward_4400031": 0.9745558088654132, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.9567852062371562, "test/sim_max_reward_4400034": 0.4793700082733208, "test/sim_max_reward_4400035": 0.42307599695530096, "test/sim_max_reward_4400036": 0.37339202735851934, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.04497881815618269, "test/sim_max_reward_4400039": 0.9530775548119053, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.16142574768577606, "test/sim_max_reward_4400042": 0.5682065097669267, "test/sim_max_reward_4400043": 0.9772954254491968, "test/sim_max_reward_4400044": 0.9389444832364695, "test/sim_max_reward_4400045": 0.39040641219349187, "test/sim_max_reward_4400046": 0.9390174926361262, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.649015151422713, "test/mean_score": 0.5784491841605838, "val_loss": 287143.75, "train_action_mse_error": 0.6278157234191895} {"train_loss": -12.433723449707031, "global_step": 352968, "epoch": 2101} {"train_loss": -12.559518814086914, "global_step": 352969, "epoch": 2101} {"train_loss": -12.399431228637695, "global_step": 352970, "epoch": 2101} {"train_loss": -12.215530395507812, "global_step": 352971, "epoch": 2101} {"train_loss": -12.318326950073242, "global_step": 352972, "epoch": 2101} {"train_loss": -12.558099746704102, "global_step": 352973, "epoch": 2101} {"train_loss": -12.437053680419922, "global_step": 352974, "epoch": 2101} {"train_loss": -12.505915641784668, "global_step": 352975, "epoch": 2101} {"train_loss": -12.048809051513672, "global_step": 352976, "epoch": 2101} {"train_loss": -12.511878967285156, "global_step": 352977, "epoch": 2101} {"train_loss": -12.53936767578125, "global_step": 352978, "epoch": 2101} {"train_loss": -12.580119132995605, "global_step": 352979, "epoch": 2101} {"train_loss": -12.593334197998047, "global_step": 352980, "epoch": 2101} {"train_loss": -12.5184326171875, "global_step": 352981, "epoch": 2101} {"train_loss": -12.353330612182617, "global_step": 352982, "epoch": 2101} {"train_loss": -12.573458671569824, "global_step": 352983, "epoch": 2101} {"train_loss": -12.527080535888672, "global_step": 352984, "epoch": 2101} {"train_loss": -12.09022331237793, "global_step": 352985, "epoch": 2101} {"train_loss": -12.566201210021973, "global_step": 352986, "epoch": 2101} {"train_loss": -12.503772735595703, "global_step": 352987, "epoch": 2101} {"train_loss": -12.533409118652344, "global_step": 352988, "epoch": 2101} {"train_loss": -12.492440223693848, "global_step": 352989, "epoch": 2101} {"train_loss": -12.617057800292969, "global_step": 352990, "epoch": 2101} {"train_loss": -12.582307815551758, "global_step": 352991, "epoch": 2101} {"train_loss": -12.597908020019531, "global_step": 352992, "epoch": 2101} {"train_loss": -12.685518264770508, "global_step": 352993, "epoch": 2101} {"train_loss": -12.402082443237305, "global_step": 352994, "epoch": 2101} {"train_loss": -12.614524841308594, "global_step": 352995, "epoch": 2101} {"train_loss": -12.566513061523438, "global_step": 352996, "epoch": 2101} {"train_loss": -12.568344116210938, "global_step": 352997, "epoch": 2101} {"train_loss": -12.607095718383789, "global_step": 352998, "epoch": 2101} {"train_loss": -12.603553771972656, "global_step": 352999, "epoch": 2101} {"train_loss": -12.569881439208984, "global_step": 353000, "epoch": 2101} {"train_loss": -12.307088851928711, "global_step": 353001, "epoch": 2101} {"train_loss": -11.923978805541992, "global_step": 353002, "epoch": 2101} {"train_loss": -12.315902709960938, "global_step": 353003, "epoch": 2101} {"train_loss": -12.185013771057129, "global_step": 353004, "epoch": 2101} {"train_loss": -10.953227996826172, "global_step": 353005, "epoch": 2101} {"train_loss": -11.244026184082031, "global_step": 353006, "epoch": 2101} {"train_loss": -12.093488693237305, "global_step": 353007, "epoch": 2101} {"train_loss": -11.993318557739258, "global_step": 353008, "epoch": 2101} {"train_loss": -11.940814971923828, "global_step": 353009, "epoch": 2101} {"train_loss": -11.19151496887207, "global_step": 353010, "epoch": 2101} {"train_loss": -11.610184669494629, "global_step": 353011, "epoch": 2101} {"train_loss": -9.897968292236328, "global_step": 353012, "epoch": 2101} {"train_loss": -12.06656265258789, "global_step": 353013, "epoch": 2101} {"train_loss": -9.561792373657227, "global_step": 353014, "epoch": 2101} {"train_loss": -11.275434494018555, "global_step": 353015, "epoch": 2101} {"train_loss": -11.019271850585938, "global_step": 353016, "epoch": 2101} {"train_loss": -11.346414566040039, "global_step": 353017, "epoch": 2101} {"train_loss": -10.173377990722656, "global_step": 353018, "epoch": 2101} {"train_loss": -12.46216869354248, "global_step": 353019, "epoch": 2101} {"train_loss": -11.239230155944824, "global_step": 353020, "epoch": 2101} {"train_loss": -12.21210765838623, "global_step": 353021, "epoch": 2101} {"train_loss": -11.9487943649292, "global_step": 353022, "epoch": 2101} {"train_loss": -11.696939468383789, "global_step": 353023, "epoch": 2101} {"train_loss": -11.735527992248535, "global_step": 353024, "epoch": 2101} {"train_loss": -12.100845336914062, "global_step": 353025, "epoch": 2101} {"train_loss": -11.482851028442383, "global_step": 353026, "epoch": 2101} {"train_loss": -11.999828338623047, "global_step": 353027, "epoch": 2101} {"train_loss": -10.896600723266602, "global_step": 353028, "epoch": 2101} {"train_loss": -11.60356330871582, "global_step": 353029, "epoch": 2101} {"train_loss": -11.653510093688965, "global_step": 353030, "epoch": 2101} {"train_loss": -11.513310432434082, "global_step": 353031, "epoch": 2101} {"train_loss": -11.552728652954102, "global_step": 353032, "epoch": 2101} {"train_loss": -11.684365272521973, "global_step": 353033, "epoch": 2101} {"train_loss": -11.322441101074219, "global_step": 353034, "epoch": 2101} {"train_loss": -12.09422492980957, "global_step": 353035, "epoch": 2101} {"train_loss": -10.547439575195312, "global_step": 353036, "epoch": 2101} {"train_loss": -12.317572593688965, "global_step": 353037, "epoch": 2101} {"train_loss": -11.464155197143555, "global_step": 353038, "epoch": 2101} {"train_loss": -12.02008056640625, "global_step": 353039, "epoch": 2101} {"train_loss": -11.94324779510498, "global_step": 353040, "epoch": 2101} {"train_loss": -11.932229995727539, "global_step": 353041, "epoch": 2101} {"train_loss": -11.483039855957031, "global_step": 353042, "epoch": 2101} {"train_loss": -12.168279647827148, "global_step": 353043, "epoch": 2101} {"train_loss": -11.814815521240234, "global_step": 353044, "epoch": 2101} {"train_loss": -12.198734283447266, "global_step": 353045, "epoch": 2101} {"train_loss": -12.437142372131348, "global_step": 353046, "epoch": 2101} {"train_loss": -12.120397567749023, "global_step": 353047, "epoch": 2101} {"train_loss": -11.92708969116211, "global_step": 353048, "epoch": 2101} {"train_loss": -11.93779182434082, "global_step": 353049, "epoch": 2101} {"train_loss": -12.455384254455566, "global_step": 353050, "epoch": 2101} {"train_loss": -11.789987564086914, "global_step": 353051, "epoch": 2101} {"train_loss": -12.061534881591797, "global_step": 353052, "epoch": 2101} {"train_loss": -12.03238296508789, "global_step": 353053, "epoch": 2101} {"train_loss": -12.138028144836426, "global_step": 353054, "epoch": 2101} {"train_loss": -12.138130187988281, "global_step": 353055, "epoch": 2101} {"train_loss": -12.151678085327148, "global_step": 353056, "epoch": 2101} {"train_loss": -12.23651123046875, "global_step": 353057, "epoch": 2101} {"train_loss": -12.194408416748047, "global_step": 353058, "epoch": 2101} {"train_loss": -12.30229377746582, "global_step": 353059, "epoch": 2101} {"train_loss": -12.382256507873535, "global_step": 353060, "epoch": 2101} {"train_loss": -12.395377159118652, "global_step": 353061, "epoch": 2101} {"train_loss": -12.336559295654297, "global_step": 353062, "epoch": 2101} {"train_loss": -12.310251235961914, "global_step": 353063, "epoch": 2101} {"train_loss": -12.391626358032227, "global_step": 353064, "epoch": 2101} {"train_loss": -12.408980369567871, "global_step": 353065, "epoch": 2101} {"train_loss": -12.36539363861084, "global_step": 353066, "epoch": 2101} {"train_loss": -12.234864234924316, "global_step": 353067, "epoch": 2101} {"train_loss": -12.012288093566895, "global_step": 353068, "epoch": 2101} {"train_loss": -12.442602157592773, "global_step": 353069, "epoch": 2101} {"train_loss": -12.50840950012207, "global_step": 353070, "epoch": 2101} {"train_loss": -12.435843467712402, "global_step": 353071, "epoch": 2101} {"train_loss": -12.43867301940918, "global_step": 353072, "epoch": 2101} {"train_loss": -12.45783805847168, "global_step": 353073, "epoch": 2101} {"train_loss": -12.376485824584961, "global_step": 353074, "epoch": 2101} {"train_loss": -12.498052597045898, "global_step": 353075, "epoch": 2101} {"train_loss": -12.328956604003906, "global_step": 353076, "epoch": 2101} {"train_loss": -12.27950668334961, "global_step": 353077, "epoch": 2101} {"train_loss": -12.38016414642334, "global_step": 353078, "epoch": 2101} {"train_loss": -12.309342384338379, "global_step": 353079, "epoch": 2101} {"train_loss": -11.517648696899414, "global_step": 353080, "epoch": 2101} {"train_loss": -11.632355690002441, "global_step": 353081, "epoch": 2101} {"train_loss": -12.331830978393555, "global_step": 353082, "epoch": 2101} {"train_loss": -12.607501983642578, "global_step": 353083, "epoch": 2101} {"train_loss": -12.092329025268555, "global_step": 353084, "epoch": 2101} {"train_loss": -12.08625602722168, "global_step": 353085, "epoch": 2101} {"train_loss": -12.405881881713867, "global_step": 353086, "epoch": 2101} {"train_loss": -11.688592910766602, "global_step": 353087, "epoch": 2101} {"train_loss": -12.264117240905762, "global_step": 353088, "epoch": 2101} {"train_loss": -12.173916816711426, "global_step": 353089, "epoch": 2101} {"train_loss": -12.039213180541992, "global_step": 353090, "epoch": 2101} {"train_loss": -12.398747444152832, "global_step": 353091, "epoch": 2101} {"train_loss": -11.89796257019043, "global_step": 353092, "epoch": 2101} {"train_loss": -12.403420448303223, "global_step": 353093, "epoch": 2101} {"train_loss": -12.733192443847656, "global_step": 353094, "epoch": 2101} {"train_loss": -12.014240264892578, "global_step": 353095, "epoch": 2101} {"train_loss": -12.279382705688477, "global_step": 353096, "epoch": 2101} {"train_loss": -12.463008880615234, "global_step": 353097, "epoch": 2101} {"train_loss": -11.845274925231934, "global_step": 353098, "epoch": 2101} {"train_loss": -11.92533016204834, "global_step": 353099, "epoch": 2101} {"train_loss": -12.121231079101562, "global_step": 353100, "epoch": 2101} {"train_loss": -11.671446800231934, "global_step": 353101, "epoch": 2101} {"train_loss": -11.92315673828125, "global_step": 353102, "epoch": 2101} {"train_loss": -12.252561569213867, "global_step": 353103, "epoch": 2101} {"train_loss": -12.294119834899902, "global_step": 353104, "epoch": 2101} {"train_loss": -12.32112979888916, "global_step": 353105, "epoch": 2101} {"train_loss": -12.239755630493164, "global_step": 353106, "epoch": 2101} {"train_loss": -12.037034034729004, "global_step": 353107, "epoch": 2101} {"train_loss": -12.286433219909668, "global_step": 353108, "epoch": 2101} {"train_loss": -12.083003997802734, "global_step": 353109, "epoch": 2101} {"train_loss": -12.378692626953125, "global_step": 353110, "epoch": 2101} {"train_loss": -11.953999519348145, "global_step": 353111, "epoch": 2101} {"train_loss": -12.517847061157227, "global_step": 353112, "epoch": 2101} {"train_loss": -12.413528442382812, "global_step": 353113, "epoch": 2101} {"train_loss": -12.241599082946777, "global_step": 353114, "epoch": 2101} {"train_loss": -11.658187866210938, "global_step": 353115, "epoch": 2101} {"train_loss": -12.163432121276855, "global_step": 353116, "epoch": 2101} {"train_loss": -10.22589111328125, "global_step": 353117, "epoch": 2101} {"train_loss": -12.001306533813477, "global_step": 353118, "epoch": 2101} {"train_loss": -11.023622512817383, "global_step": 353119, "epoch": 2101} {"train_loss": -11.51321792602539, "global_step": 353120, "epoch": 2101} {"train_loss": -10.7975435256958, "global_step": 353121, "epoch": 2101} {"train_loss": -11.557647705078125, "global_step": 353122, "epoch": 2101} {"train_loss": -10.001890182495117, "global_step": 353123, "epoch": 2101} {"train_loss": -8.684307098388672, "global_step": 353124, "epoch": 2101} {"train_loss": -9.913206100463867, "global_step": 353125, "epoch": 2101} {"train_loss": -10.163721084594727, "global_step": 353126, "epoch": 2101} {"train_loss": -10.27021598815918, "global_step": 353127, "epoch": 2101} {"train_loss": -9.112957000732422, "global_step": 353128, "epoch": 2101} {"train_loss": -9.038225173950195, "global_step": 353129, "epoch": 2101} {"train_loss": -9.64263916015625, "global_step": 353130, "epoch": 2101} {"train_loss": -11.169916152954102, "global_step": 353131, "epoch": 2101} {"train_loss": -9.831708908081055, "global_step": 353132, "epoch": 2101} {"train_loss": -11.767741203308105, "global_step": 353133, "epoch": 2101} {"train_loss": -10.32938003540039, "global_step": 353134, "epoch": 2101} {"train_loss": -11.905127712658473, "global_step": 353135, "epoch": 2101, "val_loss": 288554.375} {"train_loss": -10.604425430297852, "global_step": 353136, "epoch": 2102} {"train_loss": -11.060176849365234, "global_step": 353137, "epoch": 2102} {"train_loss": -10.49200439453125, "global_step": 353138, "epoch": 2102} {"train_loss": -11.275951385498047, "global_step": 353139, "epoch": 2102} {"train_loss": -11.838692665100098, "global_step": 353140, "epoch": 2102} {"train_loss": -10.886034965515137, "global_step": 353141, "epoch": 2102} {"train_loss": -11.915199279785156, "global_step": 353142, "epoch": 2102} {"train_loss": -10.943521499633789, "global_step": 353143, "epoch": 2102} {"train_loss": -11.764856338500977, "global_step": 353144, "epoch": 2102} {"train_loss": -11.006505012512207, "global_step": 353145, "epoch": 2102} {"train_loss": -11.75966739654541, "global_step": 353146, "epoch": 2102} {"train_loss": -11.552581787109375, "global_step": 353147, "epoch": 2102} {"train_loss": -11.290166854858398, "global_step": 353148, "epoch": 2102} {"train_loss": -11.438801765441895, "global_step": 353149, "epoch": 2102} {"train_loss": -11.99618148803711, "global_step": 353150, "epoch": 2102} {"train_loss": -11.75912857055664, "global_step": 353151, "epoch": 2102} {"train_loss": -11.788818359375, "global_step": 353152, "epoch": 2102} {"train_loss": -12.18609619140625, "global_step": 353153, "epoch": 2102} {"train_loss": -11.835521697998047, "global_step": 353154, "epoch": 2102} {"train_loss": -11.672765731811523, "global_step": 353155, "epoch": 2102} {"train_loss": -11.962553024291992, "global_step": 353156, "epoch": 2102} {"train_loss": -11.992820739746094, "global_step": 353157, "epoch": 2102} {"train_loss": -11.321462631225586, "global_step": 353158, "epoch": 2102} {"train_loss": -12.201713562011719, "global_step": 353159, "epoch": 2102} {"train_loss": -12.279266357421875, "global_step": 353160, "epoch": 2102} {"train_loss": -12.04372787475586, "global_step": 353161, "epoch": 2102} {"train_loss": -12.262043952941895, "global_step": 353162, "epoch": 2102} {"train_loss": -12.115272521972656, "global_step": 353163, "epoch": 2102} {"train_loss": -12.136979103088379, "global_step": 353164, "epoch": 2102} {"train_loss": -11.967816352844238, "global_step": 353165, "epoch": 2102} {"train_loss": -12.111062049865723, "global_step": 353166, "epoch": 2102} {"train_loss": -11.79198932647705, "global_step": 353167, "epoch": 2102} {"train_loss": -12.152061462402344, "global_step": 353168, "epoch": 2102} {"train_loss": -12.060093879699707, "global_step": 353169, "epoch": 2102} {"train_loss": -12.356035232543945, "global_step": 353170, "epoch": 2102} {"train_loss": -12.029895782470703, "global_step": 353171, "epoch": 2102} {"train_loss": -12.332764625549316, "global_step": 353172, "epoch": 2102} {"train_loss": -12.227874755859375, "global_step": 353173, "epoch": 2102} {"train_loss": -12.17120361328125, "global_step": 353174, "epoch": 2102} {"train_loss": -12.22509765625, "global_step": 353175, "epoch": 2102} {"train_loss": -12.239387512207031, "global_step": 353176, "epoch": 2102} {"train_loss": -12.231624603271484, "global_step": 353177, "epoch": 2102} {"train_loss": -12.11376953125, "global_step": 353178, "epoch": 2102} {"train_loss": -12.57398509979248, "global_step": 353179, "epoch": 2102} {"train_loss": -12.07028579711914, "global_step": 353180, "epoch": 2102} {"train_loss": -12.319217681884766, "global_step": 353181, "epoch": 2102} {"train_loss": -11.967260360717773, "global_step": 353182, "epoch": 2102} {"train_loss": -11.636434555053711, "global_step": 353183, "epoch": 2102} {"train_loss": -12.429557800292969, "global_step": 353184, "epoch": 2102} {"train_loss": -12.083017349243164, "global_step": 353185, "epoch": 2102} {"train_loss": -12.469987869262695, "global_step": 353186, "epoch": 2102} {"train_loss": -12.143697738647461, "global_step": 353187, "epoch": 2102} {"train_loss": -12.06604290008545, "global_step": 353188, "epoch": 2102} {"train_loss": -12.373132705688477, "global_step": 353189, "epoch": 2102} {"train_loss": -11.764745712280273, "global_step": 353190, "epoch": 2102} {"train_loss": -12.299086570739746, "global_step": 353191, "epoch": 2102} {"train_loss": -11.368440628051758, "global_step": 353192, "epoch": 2102} {"train_loss": -11.841689109802246, "global_step": 353193, "epoch": 2102} {"train_loss": -11.9002685546875, "global_step": 353194, "epoch": 2102} {"train_loss": -11.006555557250977, "global_step": 353195, "epoch": 2102} {"train_loss": -12.117399215698242, "global_step": 353196, "epoch": 2102} {"train_loss": -11.059983253479004, "global_step": 353197, "epoch": 2102} {"train_loss": -11.876513481140137, "global_step": 353198, "epoch": 2102} {"train_loss": -10.980592727661133, "global_step": 353199, "epoch": 2102} {"train_loss": -11.561042785644531, "global_step": 353200, "epoch": 2102} {"train_loss": -11.690189361572266, "global_step": 353201, "epoch": 2102} {"train_loss": -11.940132141113281, "global_step": 353202, "epoch": 2102} {"train_loss": -10.822233200073242, "global_step": 353203, "epoch": 2102} {"train_loss": -11.758699417114258, "global_step": 353204, "epoch": 2102} {"train_loss": -11.881333351135254, "global_step": 353205, "epoch": 2102} {"train_loss": -11.635241508483887, "global_step": 353206, "epoch": 2102} {"train_loss": -12.129558563232422, "global_step": 353207, "epoch": 2102} {"train_loss": -11.480897903442383, "global_step": 353208, "epoch": 2102} {"train_loss": -12.123941421508789, "global_step": 353209, "epoch": 2102} {"train_loss": -11.832235336303711, "global_step": 353210, "epoch": 2102} {"train_loss": -12.214008331298828, "global_step": 353211, "epoch": 2102} {"train_loss": -12.031771659851074, "global_step": 353212, "epoch": 2102} {"train_loss": -11.821056365966797, "global_step": 353213, "epoch": 2102} {"train_loss": -12.080394744873047, "global_step": 353214, "epoch": 2102} {"train_loss": -11.759896278381348, "global_step": 353215, "epoch": 2102} {"train_loss": -12.241935729980469, "global_step": 353216, "epoch": 2102} {"train_loss": -11.948415756225586, "global_step": 353217, "epoch": 2102} {"train_loss": -11.86777400970459, "global_step": 353218, "epoch": 2102} {"train_loss": -11.996477127075195, "global_step": 353219, "epoch": 2102} {"train_loss": -11.47275161743164, "global_step": 353220, "epoch": 2102} {"train_loss": -12.074888229370117, "global_step": 353221, "epoch": 2102} {"train_loss": -11.406827926635742, "global_step": 353222, "epoch": 2102} {"train_loss": -12.313521385192871, "global_step": 353223, "epoch": 2102} {"train_loss": -10.8479642868042, "global_step": 353224, "epoch": 2102} {"train_loss": -11.383686065673828, "global_step": 353225, "epoch": 2102} {"train_loss": -11.304960250854492, "global_step": 353226, "epoch": 2102} {"train_loss": -11.69395637512207, "global_step": 353227, "epoch": 2102} {"train_loss": -11.005125999450684, "global_step": 353228, "epoch": 2102} {"train_loss": -11.661690711975098, "global_step": 353229, "epoch": 2102} {"train_loss": -10.991942405700684, "global_step": 353230, "epoch": 2102} {"train_loss": -11.75239086151123, "global_step": 353231, "epoch": 2102} {"train_loss": -11.545988082885742, "global_step": 353232, "epoch": 2102} {"train_loss": -11.432666778564453, "global_step": 353233, "epoch": 2102} {"train_loss": -11.67088508605957, "global_step": 353234, "epoch": 2102} {"train_loss": -11.887624740600586, "global_step": 353235, "epoch": 2102} {"train_loss": -11.615338325500488, "global_step": 353236, "epoch": 2102} {"train_loss": -11.982675552368164, "global_step": 353237, "epoch": 2102} {"train_loss": -11.788105010986328, "global_step": 353238, "epoch": 2102} {"train_loss": -11.777435302734375, "global_step": 353239, "epoch": 2102} {"train_loss": -11.956659317016602, "global_step": 353240, "epoch": 2102} {"train_loss": -11.93483829498291, "global_step": 353241, "epoch": 2102} {"train_loss": -11.888542175292969, "global_step": 353242, "epoch": 2102} {"train_loss": -12.076504707336426, "global_step": 353243, "epoch": 2102} {"train_loss": -12.123510360717773, "global_step": 353244, "epoch": 2102} {"train_loss": -12.170232772827148, "global_step": 353245, "epoch": 2102} {"train_loss": -12.380002975463867, "global_step": 353246, "epoch": 2102} {"train_loss": -12.280680656433105, "global_step": 353247, "epoch": 2102} {"train_loss": -12.211097717285156, "global_step": 353248, "epoch": 2102} {"train_loss": -12.404278755187988, "global_step": 353249, "epoch": 2102} {"train_loss": -12.29742431640625, "global_step": 353250, "epoch": 2102} {"train_loss": -12.448325157165527, "global_step": 353251, "epoch": 2102} {"train_loss": -12.375732421875, "global_step": 353252, "epoch": 2102} {"train_loss": -12.647329330444336, "global_step": 353253, "epoch": 2102} {"train_loss": -12.635618209838867, "global_step": 353254, "epoch": 2102} {"train_loss": -12.548450469970703, "global_step": 353255, "epoch": 2102} {"train_loss": -12.460287094116211, "global_step": 353256, "epoch": 2102} {"train_loss": -12.362438201904297, "global_step": 353257, "epoch": 2102} {"train_loss": -12.629972457885742, "global_step": 353258, "epoch": 2102} {"train_loss": -12.315082550048828, "global_step": 353259, "epoch": 2102} {"train_loss": -12.424694061279297, "global_step": 353260, "epoch": 2102} {"train_loss": -12.439878463745117, "global_step": 353261, "epoch": 2102} {"train_loss": -12.266039848327637, "global_step": 353262, "epoch": 2102} {"train_loss": -12.644281387329102, "global_step": 353263, "epoch": 2102} {"train_loss": -12.330915451049805, "global_step": 353264, "epoch": 2102} {"train_loss": -12.531646728515625, "global_step": 353265, "epoch": 2102} {"train_loss": -12.317415237426758, "global_step": 353266, "epoch": 2102} {"train_loss": -12.82186508178711, "global_step": 353267, "epoch": 2102} {"train_loss": -12.588191986083984, "global_step": 353268, "epoch": 2102} {"train_loss": -12.495265007019043, "global_step": 353269, "epoch": 2102} {"train_loss": -12.572593688964844, "global_step": 353270, "epoch": 2102} {"train_loss": -12.781862258911133, "global_step": 353271, "epoch": 2102} {"train_loss": -12.604714393615723, "global_step": 353272, "epoch": 2102} {"train_loss": -12.513243675231934, "global_step": 353273, "epoch": 2102} {"train_loss": -12.710108757019043, "global_step": 353274, "epoch": 2102} {"train_loss": -12.66015911102295, "global_step": 353275, "epoch": 2102} {"train_loss": -12.609935760498047, "global_step": 353276, "epoch": 2102} {"train_loss": -12.53505802154541, "global_step": 353277, "epoch": 2102} {"train_loss": -12.72049331665039, "global_step": 353278, "epoch": 2102} {"train_loss": -12.524335861206055, "global_step": 353279, "epoch": 2102} {"train_loss": -12.604574203491211, "global_step": 353280, "epoch": 2102} {"train_loss": -12.71463680267334, "global_step": 353281, "epoch": 2102} {"train_loss": -12.304207801818848, "global_step": 353282, "epoch": 2102} {"train_loss": -12.344091415405273, "global_step": 353283, "epoch": 2102} {"train_loss": -12.40884017944336, "global_step": 353284, "epoch": 2102} {"train_loss": -12.318140029907227, "global_step": 353285, "epoch": 2102} {"train_loss": -12.046796798706055, "global_step": 353286, "epoch": 2102} {"train_loss": -12.284303665161133, "global_step": 353287, "epoch": 2102} {"train_loss": -11.54596996307373, "global_step": 353288, "epoch": 2102} {"train_loss": -12.175166130065918, "global_step": 353289, "epoch": 2102} {"train_loss": -11.910038948059082, "global_step": 353290, "epoch": 2102} {"train_loss": -11.463595390319824, "global_step": 353291, "epoch": 2102} {"train_loss": -11.668582916259766, "global_step": 353292, "epoch": 2102} {"train_loss": -12.160636901855469, "global_step": 353293, "epoch": 2102} {"train_loss": -11.569735527038574, "global_step": 353294, "epoch": 2102} {"train_loss": -12.018753051757812, "global_step": 353295, "epoch": 2102} {"train_loss": -12.392072677612305, "global_step": 353296, "epoch": 2102} {"train_loss": -12.082612037658691, "global_step": 353297, "epoch": 2102} {"train_loss": -12.344620704650879, "global_step": 353298, "epoch": 2102} {"train_loss": -12.396448135375977, "global_step": 353299, "epoch": 2102} {"train_loss": -12.391519546508789, "global_step": 353300, "epoch": 2102} {"train_loss": -12.019962310791016, "global_step": 353301, "epoch": 2102} {"train_loss": -11.786027908325195, "global_step": 353302, "epoch": 2102} {"train_loss": -11.989606760797047, "global_step": 353303, "epoch": 2102, "val_loss": 290695.46875} {"train_loss": -12.171273231506348, "global_step": 353304, "epoch": 2103} {"train_loss": -11.345283508300781, "global_step": 353305, "epoch": 2103} {"train_loss": -10.897046089172363, "global_step": 353306, "epoch": 2103} {"train_loss": -11.670914649963379, "global_step": 353307, "epoch": 2103} {"train_loss": -11.588418960571289, "global_step": 353308, "epoch": 2103} {"train_loss": -11.38083267211914, "global_step": 353309, "epoch": 2103} {"train_loss": -9.300674438476562, "global_step": 353310, "epoch": 2103} {"train_loss": -10.092475891113281, "global_step": 353311, "epoch": 2103} {"train_loss": -7.886291980743408, "global_step": 353312, "epoch": 2103} {"train_loss": -10.82010269165039, "global_step": 353313, "epoch": 2103} {"train_loss": -10.351247787475586, "global_step": 353314, "epoch": 2103} {"train_loss": -10.956512451171875, "global_step": 353315, "epoch": 2103} {"train_loss": -11.204355239868164, "global_step": 353316, "epoch": 2103} {"train_loss": -10.47141170501709, "global_step": 353317, "epoch": 2103} {"train_loss": -11.329696655273438, "global_step": 353318, "epoch": 2103} {"train_loss": -10.538355827331543, "global_step": 353319, "epoch": 2103} {"train_loss": -11.2022705078125, "global_step": 353320, "epoch": 2103} {"train_loss": -11.48069953918457, "global_step": 353321, "epoch": 2103} {"train_loss": -11.06122875213623, "global_step": 353322, "epoch": 2103} {"train_loss": -11.388790130615234, "global_step": 353323, "epoch": 2103} {"train_loss": -11.407186508178711, "global_step": 353324, "epoch": 2103} {"train_loss": -11.6685791015625, "global_step": 353325, "epoch": 2103} {"train_loss": -10.816024780273438, "global_step": 353326, "epoch": 2103} {"train_loss": -11.848258972167969, "global_step": 353327, "epoch": 2103} {"train_loss": -10.659689903259277, "global_step": 353328, "epoch": 2103} {"train_loss": -11.824567794799805, "global_step": 353329, "epoch": 2103} {"train_loss": -11.499764442443848, "global_step": 353330, "epoch": 2103} {"train_loss": -11.05585765838623, "global_step": 353331, "epoch": 2103} {"train_loss": -11.587366104125977, "global_step": 353332, "epoch": 2103} {"train_loss": -10.932018280029297, "global_step": 353333, "epoch": 2103} {"train_loss": -11.922033309936523, "global_step": 353334, "epoch": 2103} {"train_loss": -10.977951049804688, "global_step": 353335, "epoch": 2103} {"train_loss": -11.71021842956543, "global_step": 353336, "epoch": 2103} {"train_loss": -11.798888206481934, "global_step": 353337, "epoch": 2103} {"train_loss": -11.663908004760742, "global_step": 353338, "epoch": 2103} {"train_loss": -12.101999282836914, "global_step": 353339, "epoch": 2103} {"train_loss": -11.498137474060059, "global_step": 353340, "epoch": 2103} {"train_loss": -11.935256004333496, "global_step": 353341, "epoch": 2103} {"train_loss": -11.920392036437988, "global_step": 353342, "epoch": 2103} {"train_loss": -11.630183219909668, "global_step": 353343, "epoch": 2103} {"train_loss": -12.382201194763184, "global_step": 353344, "epoch": 2103} {"train_loss": -11.911459922790527, "global_step": 353345, "epoch": 2103} {"train_loss": -12.042266845703125, "global_step": 353346, "epoch": 2103} {"train_loss": -11.823606491088867, "global_step": 353347, "epoch": 2103} {"train_loss": -12.109029769897461, "global_step": 353348, "epoch": 2103} {"train_loss": -12.057920455932617, "global_step": 353349, "epoch": 2103} {"train_loss": -12.176400184631348, "global_step": 353350, "epoch": 2103} {"train_loss": -12.230367660522461, "global_step": 353351, "epoch": 2103} {"train_loss": -12.2634916305542, "global_step": 353352, "epoch": 2103} {"train_loss": -12.048428535461426, "global_step": 353353, "epoch": 2103} {"train_loss": -12.316576957702637, "global_step": 353354, "epoch": 2103} {"train_loss": -12.060295104980469, "global_step": 353355, "epoch": 2103} {"train_loss": -12.265754699707031, "global_step": 353356, "epoch": 2103} {"train_loss": -12.089717864990234, "global_step": 353357, "epoch": 2103} {"train_loss": -12.279340744018555, "global_step": 353358, "epoch": 2103} {"train_loss": -11.938223838806152, "global_step": 353359, "epoch": 2103} {"train_loss": -12.324897766113281, "global_step": 353360, "epoch": 2103} {"train_loss": -12.333390235900879, "global_step": 353361, "epoch": 2103} {"train_loss": -12.286150932312012, "global_step": 353362, "epoch": 2103} {"train_loss": -12.361844062805176, "global_step": 353363, "epoch": 2103} {"train_loss": -12.49984359741211, "global_step": 353364, "epoch": 2103} {"train_loss": -12.494824409484863, "global_step": 353365, "epoch": 2103} {"train_loss": -12.424588203430176, "global_step": 353366, "epoch": 2103} {"train_loss": -12.465603828430176, "global_step": 353367, "epoch": 2103} {"train_loss": -12.297866821289062, "global_step": 353368, "epoch": 2103} {"train_loss": -12.485641479492188, "global_step": 353369, "epoch": 2103} {"train_loss": -12.70565414428711, "global_step": 353370, "epoch": 2103} {"train_loss": -12.616308212280273, "global_step": 353371, "epoch": 2103} {"train_loss": -12.404512405395508, "global_step": 353372, "epoch": 2103} {"train_loss": -12.614850997924805, "global_step": 353373, "epoch": 2103} {"train_loss": -12.664360046386719, "global_step": 353374, "epoch": 2103} {"train_loss": -12.70720100402832, "global_step": 353375, "epoch": 2103} {"train_loss": -12.50402545928955, "global_step": 353376, "epoch": 2103} {"train_loss": -12.659822463989258, "global_step": 353377, "epoch": 2103} {"train_loss": -12.458456039428711, "global_step": 353378, "epoch": 2103} {"train_loss": -12.614839553833008, "global_step": 353379, "epoch": 2103} {"train_loss": -12.567683219909668, "global_step": 353380, "epoch": 2103} {"train_loss": -12.523056030273438, "global_step": 353381, "epoch": 2103} {"train_loss": -12.590914726257324, "global_step": 353382, "epoch": 2103} {"train_loss": -12.604700088500977, "global_step": 353383, "epoch": 2103} {"train_loss": -12.336268424987793, "global_step": 353384, "epoch": 2103} {"train_loss": -12.470653533935547, "global_step": 353385, "epoch": 2103} {"train_loss": -12.530521392822266, "global_step": 353386, "epoch": 2103} {"train_loss": -12.764086723327637, "global_step": 353387, "epoch": 2103} {"train_loss": -12.564708709716797, "global_step": 353388, "epoch": 2103} {"train_loss": -12.750797271728516, "global_step": 353389, "epoch": 2103} {"train_loss": -12.702999114990234, "global_step": 353390, "epoch": 2103} {"train_loss": -12.566703796386719, "global_step": 353391, "epoch": 2103} {"train_loss": -12.719499588012695, "global_step": 353392, "epoch": 2103} {"train_loss": -12.755306243896484, "global_step": 353393, "epoch": 2103} {"train_loss": -12.543848037719727, "global_step": 353394, "epoch": 2103} {"train_loss": -12.565013885498047, "global_step": 353395, "epoch": 2103} {"train_loss": -12.217632293701172, "global_step": 353396, "epoch": 2103} {"train_loss": -12.464410781860352, "global_step": 353397, "epoch": 2103} {"train_loss": -12.570220947265625, "global_step": 353398, "epoch": 2103} {"train_loss": -12.202686309814453, "global_step": 353399, "epoch": 2103} {"train_loss": -12.214479446411133, "global_step": 353400, "epoch": 2103} {"train_loss": -12.706615447998047, "global_step": 353401, "epoch": 2103} {"train_loss": -12.464184761047363, "global_step": 353402, "epoch": 2103} {"train_loss": -12.27691650390625, "global_step": 353403, "epoch": 2103} {"train_loss": -12.554716110229492, "global_step": 353404, "epoch": 2103} {"train_loss": -12.527873992919922, "global_step": 353405, "epoch": 2103} {"train_loss": -12.44697093963623, "global_step": 353406, "epoch": 2103} {"train_loss": -12.24826431274414, "global_step": 353407, "epoch": 2103} {"train_loss": -12.297161102294922, "global_step": 353408, "epoch": 2103} {"train_loss": -12.62282657623291, "global_step": 353409, "epoch": 2103} {"train_loss": -12.534481048583984, "global_step": 353410, "epoch": 2103} {"train_loss": -12.272968292236328, "global_step": 353411, "epoch": 2103} {"train_loss": -12.050376892089844, "global_step": 353412, "epoch": 2103} {"train_loss": -12.58896255493164, "global_step": 353413, "epoch": 2103} {"train_loss": -12.139242172241211, "global_step": 353414, "epoch": 2103} {"train_loss": -11.966487884521484, "global_step": 353415, "epoch": 2103} {"train_loss": -11.582796096801758, "global_step": 353416, "epoch": 2103} {"train_loss": -12.55512809753418, "global_step": 353417, "epoch": 2103} {"train_loss": -12.250865936279297, "global_step": 353418, "epoch": 2103} {"train_loss": -12.18848991394043, "global_step": 353419, "epoch": 2103} {"train_loss": -11.630175590515137, "global_step": 353420, "epoch": 2103} {"train_loss": -11.539705276489258, "global_step": 353421, "epoch": 2103} {"train_loss": -12.477389335632324, "global_step": 353422, "epoch": 2103} {"train_loss": -12.389106750488281, "global_step": 353423, "epoch": 2103} {"train_loss": -12.462495803833008, "global_step": 353424, "epoch": 2103} {"train_loss": -12.37630558013916, "global_step": 353425, "epoch": 2103} {"train_loss": -11.861856460571289, "global_step": 353426, "epoch": 2103} {"train_loss": -11.719366073608398, "global_step": 353427, "epoch": 2103} {"train_loss": -11.807661056518555, "global_step": 353428, "epoch": 2103} {"train_loss": -12.528762817382812, "global_step": 353429, "epoch": 2103} {"train_loss": -12.057246208190918, "global_step": 353430, "epoch": 2103} {"train_loss": -12.040973663330078, "global_step": 353431, "epoch": 2103} {"train_loss": -12.105450630187988, "global_step": 353432, "epoch": 2103} {"train_loss": -12.26686954498291, "global_step": 353433, "epoch": 2103} {"train_loss": -11.536443710327148, "global_step": 353434, "epoch": 2103} {"train_loss": -12.354822158813477, "global_step": 353435, "epoch": 2103} {"train_loss": -11.488893508911133, "global_step": 353436, "epoch": 2103} {"train_loss": -12.243673324584961, "global_step": 353437, "epoch": 2103} {"train_loss": -11.244171142578125, "global_step": 353438, "epoch": 2103} {"train_loss": -11.969632148742676, "global_step": 353439, "epoch": 2103} {"train_loss": -11.096029281616211, "global_step": 353440, "epoch": 2103} {"train_loss": -12.022748947143555, "global_step": 353441, "epoch": 2103} {"train_loss": -11.72402286529541, "global_step": 353442, "epoch": 2103} {"train_loss": -10.056495666503906, "global_step": 353443, "epoch": 2103} {"train_loss": -10.847654342651367, "global_step": 353444, "epoch": 2103} {"train_loss": -9.43270492553711, "global_step": 353445, "epoch": 2103} {"train_loss": -9.972681045532227, "global_step": 353446, "epoch": 2103} {"train_loss": -10.388490676879883, "global_step": 353447, "epoch": 2103} {"train_loss": -8.503326416015625, "global_step": 353448, "epoch": 2103} {"train_loss": -5.8299994468688965, "global_step": 353449, "epoch": 2103} {"train_loss": -7.009732246398926, "global_step": 353450, "epoch": 2103} {"train_loss": -7.281665325164795, "global_step": 353451, "epoch": 2103} {"train_loss": -6.88267183303833, "global_step": 353452, "epoch": 2103} {"train_loss": -7.564873218536377, "global_step": 353453, "epoch": 2103} {"train_loss": -6.799659729003906, "global_step": 353454, "epoch": 2103} {"train_loss": -6.9910101890563965, "global_step": 353455, "epoch": 2103} {"train_loss": -7.725548267364502, "global_step": 353456, "epoch": 2103} {"train_loss": -7.088869094848633, "global_step": 353457, "epoch": 2103} {"train_loss": -8.081329345703125, "global_step": 353458, "epoch": 2103} {"train_loss": -8.446163177490234, "global_step": 353459, "epoch": 2103} {"train_loss": -7.602449893951416, "global_step": 353460, "epoch": 2103} {"train_loss": -7.620171546936035, "global_step": 353461, "epoch": 2103} {"train_loss": -8.5662841796875, "global_step": 353462, "epoch": 2103} {"train_loss": -8.585052490234375, "global_step": 353463, "epoch": 2103} {"train_loss": -8.103109359741211, "global_step": 353464, "epoch": 2103} {"train_loss": -9.178003311157227, "global_step": 353465, "epoch": 2103} {"train_loss": -9.184292793273926, "global_step": 353466, "epoch": 2103} {"train_loss": -9.310201644897461, "global_step": 353467, "epoch": 2103} {"train_loss": -9.825265884399414, "global_step": 353468, "epoch": 2103} {"train_loss": -9.590425491333008, "global_step": 353469, "epoch": 2103} {"train_loss": -9.75953483581543, "global_step": 353470, "epoch": 2103} {"train_loss": -11.370182837758746, "global_step": 353471, "epoch": 2103, "val_loss": 287545.65625} {"train_loss": -10.26566219329834, "global_step": 353472, "epoch": 2104} {"train_loss": -10.726445198059082, "global_step": 353473, "epoch": 2104} {"train_loss": -10.210994720458984, "global_step": 353474, "epoch": 2104} {"train_loss": -10.554159164428711, "global_step": 353475, "epoch": 2104} {"train_loss": -10.962030410766602, "global_step": 353476, "epoch": 2104} {"train_loss": -10.59882640838623, "global_step": 353477, "epoch": 2104} {"train_loss": -11.283472061157227, "global_step": 353478, "epoch": 2104} {"train_loss": -11.316372871398926, "global_step": 353479, "epoch": 2104} {"train_loss": -11.798063278198242, "global_step": 353480, "epoch": 2104} {"train_loss": -11.280757904052734, "global_step": 353481, "epoch": 2104} {"train_loss": -11.874762535095215, "global_step": 353482, "epoch": 2104} {"train_loss": -11.45887565612793, "global_step": 353483, "epoch": 2104} {"train_loss": -11.61315631866455, "global_step": 353484, "epoch": 2104} {"train_loss": -11.513071060180664, "global_step": 353485, "epoch": 2104} {"train_loss": -11.712726593017578, "global_step": 353486, "epoch": 2104} {"train_loss": -11.885095596313477, "global_step": 353487, "epoch": 2104} {"train_loss": -11.95766544342041, "global_step": 353488, "epoch": 2104} {"train_loss": -11.652928352355957, "global_step": 353489, "epoch": 2104} {"train_loss": -11.971969604492188, "global_step": 353490, "epoch": 2104} {"train_loss": -11.73892593383789, "global_step": 353491, "epoch": 2104} {"train_loss": -12.00786018371582, "global_step": 353492, "epoch": 2104} {"train_loss": -12.088751792907715, "global_step": 353493, "epoch": 2104} {"train_loss": -11.612371444702148, "global_step": 353494, "epoch": 2104} {"train_loss": -11.839902877807617, "global_step": 353495, "epoch": 2104} {"train_loss": -11.52386474609375, "global_step": 353496, "epoch": 2104} {"train_loss": -12.11945629119873, "global_step": 353497, "epoch": 2104} {"train_loss": -11.962416648864746, "global_step": 353498, "epoch": 2104} {"train_loss": -12.15555477142334, "global_step": 353499, "epoch": 2104} {"train_loss": -12.051124572753906, "global_step": 353500, "epoch": 2104} {"train_loss": -12.087207794189453, "global_step": 353501, "epoch": 2104} {"train_loss": -12.210668563842773, "global_step": 353502, "epoch": 2104} {"train_loss": -11.754181861877441, "global_step": 353503, "epoch": 2104} {"train_loss": -11.952280044555664, "global_step": 353504, "epoch": 2104} {"train_loss": -11.78591537475586, "global_step": 353505, "epoch": 2104} {"train_loss": -12.157437324523926, "global_step": 353506, "epoch": 2104} {"train_loss": -12.181010246276855, "global_step": 353507, "epoch": 2104} {"train_loss": -11.761991500854492, "global_step": 353508, "epoch": 2104} {"train_loss": -12.47381591796875, "global_step": 353509, "epoch": 2104} {"train_loss": -11.85252571105957, "global_step": 353510, "epoch": 2104} {"train_loss": -12.247018814086914, "global_step": 353511, "epoch": 2104} {"train_loss": -12.195154190063477, "global_step": 353512, "epoch": 2104} {"train_loss": -12.15774917602539, "global_step": 353513, "epoch": 2104} {"train_loss": -12.279397010803223, "global_step": 353514, "epoch": 2104} {"train_loss": -12.02691650390625, "global_step": 353515, "epoch": 2104} {"train_loss": -12.147188186645508, "global_step": 353516, "epoch": 2104} {"train_loss": -12.238500595092773, "global_step": 353517, "epoch": 2104} {"train_loss": -12.10483169555664, "global_step": 353518, "epoch": 2104} {"train_loss": -11.847352981567383, "global_step": 353519, "epoch": 2104} {"train_loss": -11.908206939697266, "global_step": 353520, "epoch": 2104} {"train_loss": -11.820732116699219, "global_step": 353521, "epoch": 2104} {"train_loss": -12.062871932983398, "global_step": 353522, "epoch": 2104} {"train_loss": -11.22317123413086, "global_step": 353523, "epoch": 2104} {"train_loss": -12.41739273071289, "global_step": 353524, "epoch": 2104} {"train_loss": -11.721367835998535, "global_step": 353525, "epoch": 2104} {"train_loss": -12.612751960754395, "global_step": 353526, "epoch": 2104} {"train_loss": -11.975004196166992, "global_step": 353527, "epoch": 2104} {"train_loss": -12.323715209960938, "global_step": 353528, "epoch": 2104} {"train_loss": -12.2025728225708, "global_step": 353529, "epoch": 2104} {"train_loss": -12.260357856750488, "global_step": 353530, "epoch": 2104} {"train_loss": -12.431074142456055, "global_step": 353531, "epoch": 2104} {"train_loss": -12.231727600097656, "global_step": 353532, "epoch": 2104} {"train_loss": -12.320775985717773, "global_step": 353533, "epoch": 2104} {"train_loss": -12.176023483276367, "global_step": 353534, "epoch": 2104} {"train_loss": -12.408265113830566, "global_step": 353535, "epoch": 2104} {"train_loss": -12.199193000793457, "global_step": 353536, "epoch": 2104} {"train_loss": -12.355489730834961, "global_step": 353537, "epoch": 2104} {"train_loss": -12.406932830810547, "global_step": 353538, "epoch": 2104} {"train_loss": -12.308246612548828, "global_step": 353539, "epoch": 2104} {"train_loss": -12.39833927154541, "global_step": 353540, "epoch": 2104} {"train_loss": -12.339433670043945, "global_step": 353541, "epoch": 2104} {"train_loss": -12.462519645690918, "global_step": 353542, "epoch": 2104} {"train_loss": -12.282632827758789, "global_step": 353543, "epoch": 2104} {"train_loss": -12.547759056091309, "global_step": 353544, "epoch": 2104} {"train_loss": -12.526453971862793, "global_step": 353545, "epoch": 2104} {"train_loss": -12.556224822998047, "global_step": 353546, "epoch": 2104} {"train_loss": -12.28759765625, "global_step": 353547, "epoch": 2104} {"train_loss": -12.12869644165039, "global_step": 353548, "epoch": 2104} {"train_loss": -12.499712944030762, "global_step": 353549, "epoch": 2104} {"train_loss": -11.986555099487305, "global_step": 353550, "epoch": 2104} {"train_loss": -12.416461944580078, "global_step": 353551, "epoch": 2104} {"train_loss": -12.429906845092773, "global_step": 353552, "epoch": 2104} {"train_loss": -12.160211563110352, "global_step": 353553, "epoch": 2104} {"train_loss": -12.25554084777832, "global_step": 353554, "epoch": 2104} {"train_loss": -12.429767608642578, "global_step": 353555, "epoch": 2104} {"train_loss": -12.349384307861328, "global_step": 353556, "epoch": 2104} {"train_loss": -12.181164741516113, "global_step": 353557, "epoch": 2104} {"train_loss": -12.220165252685547, "global_step": 353558, "epoch": 2104} {"train_loss": -12.288185119628906, "global_step": 353559, "epoch": 2104} {"train_loss": -12.01164722442627, "global_step": 353560, "epoch": 2104} {"train_loss": -12.012924194335938, "global_step": 353561, "epoch": 2104} {"train_loss": -12.119922637939453, "global_step": 353562, "epoch": 2104} {"train_loss": -12.059569358825684, "global_step": 353563, "epoch": 2104} {"train_loss": -12.383977890014648, "global_step": 353564, "epoch": 2104} {"train_loss": -11.891717910766602, "global_step": 353565, "epoch": 2104} {"train_loss": -12.473403930664062, "global_step": 353566, "epoch": 2104} {"train_loss": -12.00914192199707, "global_step": 353567, "epoch": 2104} {"train_loss": -11.911255836486816, "global_step": 353568, "epoch": 2104} {"train_loss": -11.571290016174316, "global_step": 353569, "epoch": 2104} {"train_loss": -12.069350242614746, "global_step": 353570, "epoch": 2104} {"train_loss": -12.079122543334961, "global_step": 353571, "epoch": 2104} {"train_loss": -11.920391082763672, "global_step": 353572, "epoch": 2104} {"train_loss": -11.072720527648926, "global_step": 353573, "epoch": 2104} {"train_loss": -11.447378158569336, "global_step": 353574, "epoch": 2104} {"train_loss": -11.994129180908203, "global_step": 353575, "epoch": 2104} {"train_loss": -10.790279388427734, "global_step": 353576, "epoch": 2104} {"train_loss": -11.15694808959961, "global_step": 353577, "epoch": 2104} {"train_loss": -11.187901496887207, "global_step": 353578, "epoch": 2104} {"train_loss": -10.415390968322754, "global_step": 353579, "epoch": 2104} {"train_loss": -11.34762191772461, "global_step": 353580, "epoch": 2104} {"train_loss": -10.494952201843262, "global_step": 353581, "epoch": 2104} {"train_loss": -11.548198699951172, "global_step": 353582, "epoch": 2104} {"train_loss": -10.274462699890137, "global_step": 353583, "epoch": 2104} {"train_loss": -10.363738059997559, "global_step": 353584, "epoch": 2104} {"train_loss": -11.606932640075684, "global_step": 353585, "epoch": 2104} {"train_loss": -10.80831527709961, "global_step": 353586, "epoch": 2104} {"train_loss": -11.12594223022461, "global_step": 353587, "epoch": 2104} {"train_loss": -11.443893432617188, "global_step": 353588, "epoch": 2104} {"train_loss": -10.583582878112793, "global_step": 353589, "epoch": 2104} {"train_loss": -11.866697311401367, "global_step": 353590, "epoch": 2104} {"train_loss": -10.300760269165039, "global_step": 353591, "epoch": 2104} {"train_loss": -12.013861656188965, "global_step": 353592, "epoch": 2104} {"train_loss": -10.92072868347168, "global_step": 353593, "epoch": 2104} {"train_loss": -10.919541358947754, "global_step": 353594, "epoch": 2104} {"train_loss": -10.11713695526123, "global_step": 353595, "epoch": 2104} {"train_loss": -10.89218521118164, "global_step": 353596, "epoch": 2104} {"train_loss": -11.329032897949219, "global_step": 353597, "epoch": 2104} {"train_loss": -10.133934020996094, "global_step": 353598, "epoch": 2104} {"train_loss": -11.575400352478027, "global_step": 353599, "epoch": 2104} {"train_loss": -10.33928108215332, "global_step": 353600, "epoch": 2104} {"train_loss": -11.13397216796875, "global_step": 353601, "epoch": 2104} {"train_loss": -11.559484481811523, "global_step": 353602, "epoch": 2104} {"train_loss": -11.125333786010742, "global_step": 353603, "epoch": 2104} {"train_loss": -11.654180526733398, "global_step": 353604, "epoch": 2104} {"train_loss": -11.349946975708008, "global_step": 353605, "epoch": 2104} {"train_loss": -11.40609073638916, "global_step": 353606, "epoch": 2104} {"train_loss": -11.620262145996094, "global_step": 353607, "epoch": 2104} {"train_loss": -11.568462371826172, "global_step": 353608, "epoch": 2104} {"train_loss": -11.921798706054688, "global_step": 353609, "epoch": 2104} {"train_loss": -11.870957374572754, "global_step": 353610, "epoch": 2104} {"train_loss": -11.894046783447266, "global_step": 353611, "epoch": 2104} {"train_loss": -12.111408233642578, "global_step": 353612, "epoch": 2104} {"train_loss": -12.07685375213623, "global_step": 353613, "epoch": 2104} {"train_loss": -11.956308364868164, "global_step": 353614, "epoch": 2104} {"train_loss": -11.89676570892334, "global_step": 353615, "epoch": 2104} {"train_loss": -12.274036407470703, "global_step": 353616, "epoch": 2104} {"train_loss": -12.09398078918457, "global_step": 353617, "epoch": 2104} {"train_loss": -12.394306182861328, "global_step": 353618, "epoch": 2104} {"train_loss": -12.100077629089355, "global_step": 353619, "epoch": 2104} {"train_loss": -12.221120834350586, "global_step": 353620, "epoch": 2104} {"train_loss": -12.18597412109375, "global_step": 353621, "epoch": 2104} {"train_loss": -12.33213996887207, "global_step": 353622, "epoch": 2104} {"train_loss": -12.157148361206055, "global_step": 353623, "epoch": 2104} {"train_loss": -12.129070281982422, "global_step": 353624, "epoch": 2104} {"train_loss": -12.392184257507324, "global_step": 353625, "epoch": 2104} {"train_loss": -12.044411659240723, "global_step": 353626, "epoch": 2104} {"train_loss": -12.28333854675293, "global_step": 353627, "epoch": 2104} {"train_loss": -12.459189414978027, "global_step": 353628, "epoch": 2104} {"train_loss": -12.348780632019043, "global_step": 353629, "epoch": 2104} {"train_loss": -12.32557487487793, "global_step": 353630, "epoch": 2104} {"train_loss": -12.300291061401367, "global_step": 353631, "epoch": 2104} {"train_loss": -12.261703491210938, "global_step": 353632, "epoch": 2104} {"train_loss": -12.407869338989258, "global_step": 353633, "epoch": 2104} {"train_loss": -12.280233383178711, "global_step": 353634, "epoch": 2104} {"train_loss": -12.429865837097168, "global_step": 353635, "epoch": 2104} {"train_loss": -12.223906517028809, "global_step": 353636, "epoch": 2104} {"train_loss": -12.388385772705078, "global_step": 353637, "epoch": 2104} {"train_loss": -12.081748008728027, "global_step": 353638, "epoch": 2104} {"train_loss": -11.831505843571254, "global_step": 353639, "epoch": 2104, "val_loss": 286910.53125} {"train_loss": -12.381409645080566, "global_step": 353640, "epoch": 2105} {"train_loss": -12.12767219543457, "global_step": 353641, "epoch": 2105} {"train_loss": -12.087668418884277, "global_step": 353642, "epoch": 2105} {"train_loss": -11.973461151123047, "global_step": 353643, "epoch": 2105} {"train_loss": -12.03939437866211, "global_step": 353644, "epoch": 2105} {"train_loss": -12.246808052062988, "global_step": 353645, "epoch": 2105} {"train_loss": -11.925244331359863, "global_step": 353646, "epoch": 2105} {"train_loss": -12.083166122436523, "global_step": 353647, "epoch": 2105} {"train_loss": -12.502086639404297, "global_step": 353648, "epoch": 2105} {"train_loss": -11.770591735839844, "global_step": 353649, "epoch": 2105} {"train_loss": -12.31906509399414, "global_step": 353650, "epoch": 2105} {"train_loss": -11.836265563964844, "global_step": 353651, "epoch": 2105} {"train_loss": -11.742128372192383, "global_step": 353652, "epoch": 2105} {"train_loss": -12.169281005859375, "global_step": 353653, "epoch": 2105} {"train_loss": -11.968347549438477, "global_step": 353654, "epoch": 2105} {"train_loss": -12.388221740722656, "global_step": 353655, "epoch": 2105} {"train_loss": -12.310778617858887, "global_step": 353656, "epoch": 2105} {"train_loss": -12.397012710571289, "global_step": 353657, "epoch": 2105} {"train_loss": -12.137422561645508, "global_step": 353658, "epoch": 2105} {"train_loss": -11.954690933227539, "global_step": 353659, "epoch": 2105} {"train_loss": -12.419554710388184, "global_step": 353660, "epoch": 2105} {"train_loss": -11.796320915222168, "global_step": 353661, "epoch": 2105} {"train_loss": -11.80074691772461, "global_step": 353662, "epoch": 2105} {"train_loss": -11.868314743041992, "global_step": 353663, "epoch": 2105} {"train_loss": -12.492939949035645, "global_step": 353664, "epoch": 2105} {"train_loss": -11.611495971679688, "global_step": 353665, "epoch": 2105} {"train_loss": -12.210176467895508, "global_step": 353666, "epoch": 2105} {"train_loss": -11.790246963500977, "global_step": 353667, "epoch": 2105} {"train_loss": -11.371790885925293, "global_step": 353668, "epoch": 2105} {"train_loss": -11.637338638305664, "global_step": 353669, "epoch": 2105} {"train_loss": -12.088238716125488, "global_step": 353670, "epoch": 2105} {"train_loss": -11.4182767868042, "global_step": 353671, "epoch": 2105} {"train_loss": -12.317262649536133, "global_step": 353672, "epoch": 2105} {"train_loss": -11.753847122192383, "global_step": 353673, "epoch": 2105} {"train_loss": -11.450018882751465, "global_step": 353674, "epoch": 2105} {"train_loss": -12.554157257080078, "global_step": 353675, "epoch": 2105} {"train_loss": -11.413674354553223, "global_step": 353676, "epoch": 2105} {"train_loss": -11.857233047485352, "global_step": 353677, "epoch": 2105} {"train_loss": -12.232629776000977, "global_step": 353678, "epoch": 2105} {"train_loss": -11.60233211517334, "global_step": 353679, "epoch": 2105} {"train_loss": -11.182509422302246, "global_step": 353680, "epoch": 2105} {"train_loss": -11.333135604858398, "global_step": 353681, "epoch": 2105} {"train_loss": -10.72268295288086, "global_step": 353682, "epoch": 2105} {"train_loss": -11.407114028930664, "global_step": 353683, "epoch": 2105} {"train_loss": -11.250188827514648, "global_step": 353684, "epoch": 2105} {"train_loss": -11.359609603881836, "global_step": 353685, "epoch": 2105} {"train_loss": -10.42326831817627, "global_step": 353686, "epoch": 2105} {"train_loss": -10.840476989746094, "global_step": 353687, "epoch": 2105} {"train_loss": -9.731919288635254, "global_step": 353688, "epoch": 2105} {"train_loss": -11.706568717956543, "global_step": 353689, "epoch": 2105} {"train_loss": -10.276514053344727, "global_step": 353690, "epoch": 2105} {"train_loss": -10.806472778320312, "global_step": 353691, "epoch": 2105} {"train_loss": -11.398975372314453, "global_step": 353692, "epoch": 2105} {"train_loss": -11.271747589111328, "global_step": 353693, "epoch": 2105} {"train_loss": -10.799261093139648, "global_step": 353694, "epoch": 2105} {"train_loss": -11.082137107849121, "global_step": 353695, "epoch": 2105} {"train_loss": -11.496648788452148, "global_step": 353696, "epoch": 2105} {"train_loss": -10.639535903930664, "global_step": 353697, "epoch": 2105} {"train_loss": -11.92105770111084, "global_step": 353698, "epoch": 2105} {"train_loss": -11.471460342407227, "global_step": 353699, "epoch": 2105} {"train_loss": -11.408133506774902, "global_step": 353700, "epoch": 2105} {"train_loss": -11.867876052856445, "global_step": 353701, "epoch": 2105} {"train_loss": -11.936981201171875, "global_step": 353702, "epoch": 2105} {"train_loss": -11.799966812133789, "global_step": 353703, "epoch": 2105} {"train_loss": -11.272968292236328, "global_step": 353704, "epoch": 2105} {"train_loss": -11.936935424804688, "global_step": 353705, "epoch": 2105} {"train_loss": -11.604540824890137, "global_step": 353706, "epoch": 2105} {"train_loss": -11.834022521972656, "global_step": 353707, "epoch": 2105} {"train_loss": -11.766695976257324, "global_step": 353708, "epoch": 2105} {"train_loss": -12.036765098571777, "global_step": 353709, "epoch": 2105} {"train_loss": -11.62922477722168, "global_step": 353710, "epoch": 2105} {"train_loss": -12.193626403808594, "global_step": 353711, "epoch": 2105} {"train_loss": -11.908982276916504, "global_step": 353712, "epoch": 2105} {"train_loss": -11.909274101257324, "global_step": 353713, "epoch": 2105} {"train_loss": -11.719722747802734, "global_step": 353714, "epoch": 2105} {"train_loss": -11.95262336730957, "global_step": 353715, "epoch": 2105} {"train_loss": -12.381855964660645, "global_step": 353716, "epoch": 2105} {"train_loss": -11.859596252441406, "global_step": 353717, "epoch": 2105} {"train_loss": -12.287139892578125, "global_step": 353718, "epoch": 2105} {"train_loss": -11.815448760986328, "global_step": 353719, "epoch": 2105} {"train_loss": -12.087636947631836, "global_step": 353720, "epoch": 2105} {"train_loss": -11.781081199645996, "global_step": 353721, "epoch": 2105} {"train_loss": -11.790190696716309, "global_step": 353722, "epoch": 2105} {"train_loss": -12.220311164855957, "global_step": 353723, "epoch": 2105} {"train_loss": -11.893932342529297, "global_step": 353724, "epoch": 2105} {"train_loss": -12.101654052734375, "global_step": 353725, "epoch": 2105} {"train_loss": -12.118083953857422, "global_step": 353726, "epoch": 2105} {"train_loss": -12.16014575958252, "global_step": 353727, "epoch": 2105} {"train_loss": -12.16189956665039, "global_step": 353728, "epoch": 2105} {"train_loss": -12.005243301391602, "global_step": 353729, "epoch": 2105} {"train_loss": -12.290136337280273, "global_step": 353730, "epoch": 2105} {"train_loss": -11.996627807617188, "global_step": 353731, "epoch": 2105} {"train_loss": -12.091384887695312, "global_step": 353732, "epoch": 2105} {"train_loss": -12.319278717041016, "global_step": 353733, "epoch": 2105} {"train_loss": -11.999667167663574, "global_step": 353734, "epoch": 2105} {"train_loss": -12.405016899108887, "global_step": 353735, "epoch": 2105} {"train_loss": -12.054993629455566, "global_step": 353736, "epoch": 2105} {"train_loss": -12.260316848754883, "global_step": 353737, "epoch": 2105} {"train_loss": -12.532539367675781, "global_step": 353738, "epoch": 2105} {"train_loss": -12.296783447265625, "global_step": 353739, "epoch": 2105} {"train_loss": -12.152679443359375, "global_step": 353740, "epoch": 2105} {"train_loss": -12.191184043884277, "global_step": 353741, "epoch": 2105} {"train_loss": -12.17612361907959, "global_step": 353742, "epoch": 2105} {"train_loss": -12.328376770019531, "global_step": 353743, "epoch": 2105} {"train_loss": -12.122953414916992, "global_step": 353744, "epoch": 2105} {"train_loss": -12.58725357055664, "global_step": 353745, "epoch": 2105} {"train_loss": -12.453311920166016, "global_step": 353746, "epoch": 2105} {"train_loss": -12.693643569946289, "global_step": 353747, "epoch": 2105} {"train_loss": -12.086282730102539, "global_step": 353748, "epoch": 2105} {"train_loss": -12.514083862304688, "global_step": 353749, "epoch": 2105} {"train_loss": -12.476733207702637, "global_step": 353750, "epoch": 2105} {"train_loss": -12.163368225097656, "global_step": 353751, "epoch": 2105} {"train_loss": -12.453222274780273, "global_step": 353752, "epoch": 2105} {"train_loss": -12.541473388671875, "global_step": 353753, "epoch": 2105} {"train_loss": -12.622978210449219, "global_step": 353754, "epoch": 2105} {"train_loss": -12.64112377166748, "global_step": 353755, "epoch": 2105} {"train_loss": -12.429351806640625, "global_step": 353756, "epoch": 2105} {"train_loss": -12.51622486114502, "global_step": 353757, "epoch": 2105} {"train_loss": -12.365653991699219, "global_step": 353758, "epoch": 2105} {"train_loss": -12.443063735961914, "global_step": 353759, "epoch": 2105} {"train_loss": -12.549060821533203, "global_step": 353760, "epoch": 2105} {"train_loss": -12.485671043395996, "global_step": 353761, "epoch": 2105} {"train_loss": -12.57732105255127, "global_step": 353762, "epoch": 2105} {"train_loss": -12.26085090637207, "global_step": 353763, "epoch": 2105} {"train_loss": -12.423480987548828, "global_step": 353764, "epoch": 2105} {"train_loss": -12.59158706665039, "global_step": 353765, "epoch": 2105} {"train_loss": -12.69691276550293, "global_step": 353766, "epoch": 2105} {"train_loss": -12.49713134765625, "global_step": 353767, "epoch": 2105} {"train_loss": -12.566009521484375, "global_step": 353768, "epoch": 2105} {"train_loss": -12.502819061279297, "global_step": 353769, "epoch": 2105} {"train_loss": -12.404485702514648, "global_step": 353770, "epoch": 2105} {"train_loss": -12.517583847045898, "global_step": 353771, "epoch": 2105} {"train_loss": -12.317798614501953, "global_step": 353772, "epoch": 2105} {"train_loss": -12.322603225708008, "global_step": 353773, "epoch": 2105} {"train_loss": -12.676891326904297, "global_step": 353774, "epoch": 2105} {"train_loss": -12.213643074035645, "global_step": 353775, "epoch": 2105} {"train_loss": -12.381227493286133, "global_step": 353776, "epoch": 2105} {"train_loss": -12.591670989990234, "global_step": 353777, "epoch": 2105} {"train_loss": -12.415182113647461, "global_step": 353778, "epoch": 2105} {"train_loss": -12.146821975708008, "global_step": 353779, "epoch": 2105} {"train_loss": -12.509662628173828, "global_step": 353780, "epoch": 2105} {"train_loss": -12.344559669494629, "global_step": 353781, "epoch": 2105} {"train_loss": -12.312030792236328, "global_step": 353782, "epoch": 2105} {"train_loss": -12.395952224731445, "global_step": 353783, "epoch": 2105} {"train_loss": -12.464117050170898, "global_step": 353784, "epoch": 2105} {"train_loss": -12.042346954345703, "global_step": 353785, "epoch": 2105} {"train_loss": -10.838973999023438, "global_step": 353786, "epoch": 2105} {"train_loss": -11.619887351989746, "global_step": 353787, "epoch": 2105} {"train_loss": -12.46687126159668, "global_step": 353788, "epoch": 2105} {"train_loss": -11.902740478515625, "global_step": 353789, "epoch": 2105} {"train_loss": -11.136022567749023, "global_step": 353790, "epoch": 2105} {"train_loss": -12.168545722961426, "global_step": 353791, "epoch": 2105} {"train_loss": -11.00734806060791, "global_step": 353792, "epoch": 2105} {"train_loss": -9.084184646606445, "global_step": 353793, "epoch": 2105} {"train_loss": -11.784271240234375, "global_step": 353794, "epoch": 2105} {"train_loss": -9.448339462280273, "global_step": 353795, "epoch": 2105} {"train_loss": -11.41445541381836, "global_step": 353796, "epoch": 2105} {"train_loss": -9.476509094238281, "global_step": 353797, "epoch": 2105} {"train_loss": -12.046533584594727, "global_step": 353798, "epoch": 2105} {"train_loss": -10.310761451721191, "global_step": 353799, "epoch": 2105} {"train_loss": -11.614322662353516, "global_step": 353800, "epoch": 2105} {"train_loss": -10.985989570617676, "global_step": 353801, "epoch": 2105} {"train_loss": -9.79161262512207, "global_step": 353802, "epoch": 2105} {"train_loss": -12.005134582519531, "global_step": 353803, "epoch": 2105} {"train_loss": -10.73017692565918, "global_step": 353804, "epoch": 2105} {"train_loss": -11.83966064453125, "global_step": 353805, "epoch": 2105} {"train_loss": -10.567145347595215, "global_step": 353806, "epoch": 2105} {"train_loss": -11.876573835100446, "global_step": 353807, "epoch": 2105, "val_loss": 289791.875, "train_action_mse_error": 0.3623678982257843} {"train_loss": -11.449617385864258, "global_step": 353808, "epoch": 2106} {"train_loss": -10.654898643493652, "global_step": 353809, "epoch": 2106} {"train_loss": -11.710566520690918, "global_step": 353810, "epoch": 2106} {"train_loss": -10.779857635498047, "global_step": 353811, "epoch": 2106} {"train_loss": -12.066377639770508, "global_step": 353812, "epoch": 2106} {"train_loss": -11.528555870056152, "global_step": 353813, "epoch": 2106} {"train_loss": -11.99067497253418, "global_step": 353814, "epoch": 2106} {"train_loss": -11.675481796264648, "global_step": 353815, "epoch": 2106} {"train_loss": -11.972838401794434, "global_step": 353816, "epoch": 2106} {"train_loss": -11.715047836303711, "global_step": 353817, "epoch": 2106} {"train_loss": -12.140913009643555, "global_step": 353818, "epoch": 2106} {"train_loss": -11.702680587768555, "global_step": 353819, "epoch": 2106} {"train_loss": -12.048883438110352, "global_step": 353820, "epoch": 2106} {"train_loss": -11.90107250213623, "global_step": 353821, "epoch": 2106} {"train_loss": -12.149084091186523, "global_step": 353822, "epoch": 2106} {"train_loss": -11.935417175292969, "global_step": 353823, "epoch": 2106} {"train_loss": -11.89698600769043, "global_step": 353824, "epoch": 2106} {"train_loss": -11.834066390991211, "global_step": 353825, "epoch": 2106} {"train_loss": -12.125611305236816, "global_step": 353826, "epoch": 2106} {"train_loss": -12.297735214233398, "global_step": 353827, "epoch": 2106} {"train_loss": -11.868745803833008, "global_step": 353828, "epoch": 2106} {"train_loss": -12.345544815063477, "global_step": 353829, "epoch": 2106} {"train_loss": -11.853106498718262, "global_step": 353830, "epoch": 2106} {"train_loss": -12.200275421142578, "global_step": 353831, "epoch": 2106} {"train_loss": -12.18767261505127, "global_step": 353832, "epoch": 2106} {"train_loss": -12.217222213745117, "global_step": 353833, "epoch": 2106} {"train_loss": -12.208763122558594, "global_step": 353834, "epoch": 2106} {"train_loss": -12.2987642288208, "global_step": 353835, "epoch": 2106} {"train_loss": -12.269920349121094, "global_step": 353836, "epoch": 2106} {"train_loss": -12.408735275268555, "global_step": 353837, "epoch": 2106} {"train_loss": -12.152530670166016, "global_step": 353838, "epoch": 2106} {"train_loss": -12.492820739746094, "global_step": 353839, "epoch": 2106} {"train_loss": -12.384742736816406, "global_step": 353840, "epoch": 2106} {"train_loss": -12.189849853515625, "global_step": 353841, "epoch": 2106} {"train_loss": -12.188888549804688, "global_step": 353842, "epoch": 2106} {"train_loss": -12.244729995727539, "global_step": 353843, "epoch": 2106} {"train_loss": -11.97451400756836, "global_step": 353844, "epoch": 2106} {"train_loss": -12.577282905578613, "global_step": 353845, "epoch": 2106} {"train_loss": -12.154870986938477, "global_step": 353846, "epoch": 2106} {"train_loss": -12.29873275756836, "global_step": 353847, "epoch": 2106} {"train_loss": -12.26375675201416, "global_step": 353848, "epoch": 2106} {"train_loss": -12.300016403198242, "global_step": 353849, "epoch": 2106} {"train_loss": -12.036909103393555, "global_step": 353850, "epoch": 2106} {"train_loss": -12.156547546386719, "global_step": 353851, "epoch": 2106} {"train_loss": -12.140771865844727, "global_step": 353852, "epoch": 2106} {"train_loss": -12.50063705444336, "global_step": 353853, "epoch": 2106} {"train_loss": -12.013174057006836, "global_step": 353854, "epoch": 2106} {"train_loss": -12.425003051757812, "global_step": 353855, "epoch": 2106} {"train_loss": -12.479610443115234, "global_step": 353856, "epoch": 2106} {"train_loss": -12.188529968261719, "global_step": 353857, "epoch": 2106} {"train_loss": -12.185537338256836, "global_step": 353858, "epoch": 2106} {"train_loss": -12.36246109008789, "global_step": 353859, "epoch": 2106} {"train_loss": -12.165864944458008, "global_step": 353860, "epoch": 2106} {"train_loss": -12.349055290222168, "global_step": 353861, "epoch": 2106} {"train_loss": -12.340855598449707, "global_step": 353862, "epoch": 2106} {"train_loss": -12.397405624389648, "global_step": 353863, "epoch": 2106} {"train_loss": -12.155324935913086, "global_step": 353864, "epoch": 2106} {"train_loss": -12.307188034057617, "global_step": 353865, "epoch": 2106} {"train_loss": -12.609302520751953, "global_step": 353866, "epoch": 2106} {"train_loss": -12.335786819458008, "global_step": 353867, "epoch": 2106} {"train_loss": -12.454524040222168, "global_step": 353868, "epoch": 2106} {"train_loss": -12.459712982177734, "global_step": 353869, "epoch": 2106} {"train_loss": -12.231184005737305, "global_step": 353870, "epoch": 2106} {"train_loss": -12.341489791870117, "global_step": 353871, "epoch": 2106} {"train_loss": -12.762354850769043, "global_step": 353872, "epoch": 2106} {"train_loss": -12.524347305297852, "global_step": 353873, "epoch": 2106} {"train_loss": -12.743572235107422, "global_step": 353874, "epoch": 2106} {"train_loss": -12.426553726196289, "global_step": 353875, "epoch": 2106} {"train_loss": -12.687191009521484, "global_step": 353876, "epoch": 2106} {"train_loss": -12.620845794677734, "global_step": 353877, "epoch": 2106} {"train_loss": -12.659866333007812, "global_step": 353878, "epoch": 2106} {"train_loss": -12.333730697631836, "global_step": 353879, "epoch": 2106} {"train_loss": -12.407468795776367, "global_step": 353880, "epoch": 2106} {"train_loss": -12.55217456817627, "global_step": 353881, "epoch": 2106} {"train_loss": -12.585285186767578, "global_step": 353882, "epoch": 2106} {"train_loss": -12.253952026367188, "global_step": 353883, "epoch": 2106} {"train_loss": -11.960918426513672, "global_step": 353884, "epoch": 2106} {"train_loss": -12.355371475219727, "global_step": 353885, "epoch": 2106} {"train_loss": -12.077880859375, "global_step": 353886, "epoch": 2106} {"train_loss": -12.273040771484375, "global_step": 353887, "epoch": 2106} {"train_loss": -12.554159164428711, "global_step": 353888, "epoch": 2106} {"train_loss": -12.357711791992188, "global_step": 353889, "epoch": 2106} {"train_loss": -12.053086280822754, "global_step": 353890, "epoch": 2106} {"train_loss": -12.191186904907227, "global_step": 353891, "epoch": 2106} {"train_loss": -12.396316528320312, "global_step": 353892, "epoch": 2106} {"train_loss": -11.55798625946045, "global_step": 353893, "epoch": 2106} {"train_loss": -11.813281059265137, "global_step": 353894, "epoch": 2106} {"train_loss": -11.459846496582031, "global_step": 353895, "epoch": 2106} {"train_loss": -11.136676788330078, "global_step": 353896, "epoch": 2106} {"train_loss": -8.949441909790039, "global_step": 353897, "epoch": 2106} {"train_loss": -10.495929718017578, "global_step": 353898, "epoch": 2106} {"train_loss": -9.973165512084961, "global_step": 353899, "epoch": 2106} {"train_loss": -9.56959342956543, "global_step": 353900, "epoch": 2106} {"train_loss": -10.82012939453125, "global_step": 353901, "epoch": 2106} {"train_loss": -9.24134349822998, "global_step": 353902, "epoch": 2106} {"train_loss": -9.770854949951172, "global_step": 353903, "epoch": 2106} {"train_loss": -10.935050010681152, "global_step": 353904, "epoch": 2106} {"train_loss": -9.164229393005371, "global_step": 353905, "epoch": 2106} {"train_loss": -9.361326217651367, "global_step": 353906, "epoch": 2106} {"train_loss": -9.442951202392578, "global_step": 353907, "epoch": 2106} {"train_loss": -9.50770092010498, "global_step": 353908, "epoch": 2106} {"train_loss": -9.711894035339355, "global_step": 353909, "epoch": 2106} {"train_loss": -9.95744514465332, "global_step": 353910, "epoch": 2106} {"train_loss": -9.363905906677246, "global_step": 353911, "epoch": 2106} {"train_loss": -9.683540344238281, "global_step": 353912, "epoch": 2106} {"train_loss": -9.953502655029297, "global_step": 353913, "epoch": 2106} {"train_loss": -11.028459548950195, "global_step": 353914, "epoch": 2106} {"train_loss": -11.579059600830078, "global_step": 353915, "epoch": 2106} {"train_loss": -10.801437377929688, "global_step": 353916, "epoch": 2106} {"train_loss": -11.131307601928711, "global_step": 353917, "epoch": 2106} {"train_loss": -10.74589729309082, "global_step": 353918, "epoch": 2106} {"train_loss": -11.364106178283691, "global_step": 353919, "epoch": 2106} {"train_loss": -10.833044052124023, "global_step": 353920, "epoch": 2106} {"train_loss": -11.256512641906738, "global_step": 353921, "epoch": 2106} {"train_loss": -11.503484725952148, "global_step": 353922, "epoch": 2106} {"train_loss": -11.462801933288574, "global_step": 353923, "epoch": 2106} {"train_loss": -12.123032569885254, "global_step": 353924, "epoch": 2106} {"train_loss": -11.685615539550781, "global_step": 353925, "epoch": 2106} {"train_loss": -11.569488525390625, "global_step": 353926, "epoch": 2106} {"train_loss": -11.360614776611328, "global_step": 353927, "epoch": 2106} {"train_loss": -11.443023681640625, "global_step": 353928, "epoch": 2106} {"train_loss": -11.692140579223633, "global_step": 353929, "epoch": 2106} {"train_loss": -11.907052040100098, "global_step": 353930, "epoch": 2106} {"train_loss": -11.77155876159668, "global_step": 353931, "epoch": 2106} {"train_loss": -11.748433113098145, "global_step": 353932, "epoch": 2106} {"train_loss": -11.752212524414062, "global_step": 353933, "epoch": 2106} {"train_loss": -11.753490447998047, "global_step": 353934, "epoch": 2106} {"train_loss": -11.696170806884766, "global_step": 353935, "epoch": 2106} {"train_loss": -11.668233871459961, "global_step": 353936, "epoch": 2106} {"train_loss": -12.072579383850098, "global_step": 353937, "epoch": 2106} {"train_loss": -12.039560317993164, "global_step": 353938, "epoch": 2106} {"train_loss": -12.11611557006836, "global_step": 353939, "epoch": 2106} {"train_loss": -11.447152137756348, "global_step": 353940, "epoch": 2106} {"train_loss": -11.440069198608398, "global_step": 353941, "epoch": 2106} {"train_loss": -11.631275177001953, "global_step": 353942, "epoch": 2106} {"train_loss": -11.148000717163086, "global_step": 353943, "epoch": 2106} {"train_loss": -11.336021423339844, "global_step": 353944, "epoch": 2106} {"train_loss": -11.29572868347168, "global_step": 353945, "epoch": 2106} {"train_loss": -11.72913932800293, "global_step": 353946, "epoch": 2106} {"train_loss": -11.116395950317383, "global_step": 353947, "epoch": 2106} {"train_loss": -10.857669830322266, "global_step": 353948, "epoch": 2106} {"train_loss": -11.448928833007812, "global_step": 353949, "epoch": 2106} {"train_loss": -11.6901273727417, "global_step": 353950, "epoch": 2106} {"train_loss": -10.984013557434082, "global_step": 353951, "epoch": 2106} {"train_loss": -12.083635330200195, "global_step": 353952, "epoch": 2106} {"train_loss": -11.549687385559082, "global_step": 353953, "epoch": 2106} {"train_loss": -11.667980194091797, "global_step": 353954, "epoch": 2106} {"train_loss": -11.709585189819336, "global_step": 353955, "epoch": 2106} {"train_loss": -11.436983108520508, "global_step": 353956, "epoch": 2106} {"train_loss": -11.876106262207031, "global_step": 353957, "epoch": 2106} {"train_loss": -11.705404281616211, "global_step": 353958, "epoch": 2106} {"train_loss": -11.498023986816406, "global_step": 353959, "epoch": 2106} {"train_loss": -11.548648834228516, "global_step": 353960, "epoch": 2106} {"train_loss": -11.654836654663086, "global_step": 353961, "epoch": 2106} {"train_loss": -11.040660858154297, "global_step": 353962, "epoch": 2106} {"train_loss": -10.67011833190918, "global_step": 353963, "epoch": 2106} {"train_loss": -11.063650131225586, "global_step": 353964, "epoch": 2106} {"train_loss": -11.044008255004883, "global_step": 353965, "epoch": 2106} {"train_loss": -11.567755699157715, "global_step": 353966, "epoch": 2106} {"train_loss": -11.735196113586426, "global_step": 353967, "epoch": 2106} {"train_loss": -11.358503341674805, "global_step": 353968, "epoch": 2106} {"train_loss": -10.992095947265625, "global_step": 353969, "epoch": 2106} {"train_loss": -11.568346977233887, "global_step": 353970, "epoch": 2106} {"train_loss": -11.793839454650879, "global_step": 353971, "epoch": 2106} {"train_loss": -11.398458480834961, "global_step": 353972, "epoch": 2106} {"train_loss": -11.44009780883789, "global_step": 353973, "epoch": 2106} {"train_loss": -11.48476505279541, "global_step": 353974, "epoch": 2106} {"train_loss": -11.663007140159607, "global_step": 353975, "epoch": 2106, "val_loss": 287775.75} {"train_loss": -11.747142791748047, "global_step": 353976, "epoch": 2107} {"train_loss": -11.31899356842041, "global_step": 353977, "epoch": 2107} {"train_loss": -11.631309509277344, "global_step": 353978, "epoch": 2107} {"train_loss": -11.627699851989746, "global_step": 353979, "epoch": 2107} {"train_loss": -11.434549331665039, "global_step": 353980, "epoch": 2107} {"train_loss": -11.501699447631836, "global_step": 353981, "epoch": 2107} {"train_loss": -11.856762886047363, "global_step": 353982, "epoch": 2107} {"train_loss": -11.669482231140137, "global_step": 353983, "epoch": 2107} {"train_loss": -12.005876541137695, "global_step": 353984, "epoch": 2107} {"train_loss": -11.641148567199707, "global_step": 353985, "epoch": 2107} {"train_loss": -11.678382873535156, "global_step": 353986, "epoch": 2107} {"train_loss": -12.219429016113281, "global_step": 353987, "epoch": 2107} {"train_loss": -11.929864883422852, "global_step": 353988, "epoch": 2107} {"train_loss": -11.943167686462402, "global_step": 353989, "epoch": 2107} {"train_loss": -11.721452713012695, "global_step": 353990, "epoch": 2107} {"train_loss": -12.089083671569824, "global_step": 353991, "epoch": 2107} {"train_loss": -12.217880249023438, "global_step": 353992, "epoch": 2107} {"train_loss": -12.146676063537598, "global_step": 353993, "epoch": 2107} {"train_loss": -12.062233924865723, "global_step": 353994, "epoch": 2107} {"train_loss": -11.877755165100098, "global_step": 353995, "epoch": 2107} {"train_loss": -12.146549224853516, "global_step": 353996, "epoch": 2107} {"train_loss": -12.216114044189453, "global_step": 353997, "epoch": 2107} {"train_loss": -12.010152816772461, "global_step": 353998, "epoch": 2107} {"train_loss": -12.176132202148438, "global_step": 353999, "epoch": 2107} {"train_loss": -12.327106475830078, "global_step": 354000, "epoch": 2107} {"train_loss": -12.112287521362305, "global_step": 354001, "epoch": 2107} {"train_loss": -12.215743064880371, "global_step": 354002, "epoch": 2107} {"train_loss": -12.29788589477539, "global_step": 354003, "epoch": 2107} {"train_loss": -12.335433959960938, "global_step": 354004, "epoch": 2107} {"train_loss": -12.453571319580078, "global_step": 354005, "epoch": 2107} {"train_loss": -12.435174942016602, "global_step": 354006, "epoch": 2107} {"train_loss": -12.16341781616211, "global_step": 354007, "epoch": 2107} {"train_loss": -12.423221588134766, "global_step": 354008, "epoch": 2107} {"train_loss": -11.927902221679688, "global_step": 354009, "epoch": 2107} {"train_loss": -12.271140098571777, "global_step": 354010, "epoch": 2107} {"train_loss": -11.986964225769043, "global_step": 354011, "epoch": 2107} {"train_loss": -12.387435913085938, "global_step": 354012, "epoch": 2107} {"train_loss": -12.183128356933594, "global_step": 354013, "epoch": 2107} {"train_loss": -12.108636856079102, "global_step": 354014, "epoch": 2107} {"train_loss": -12.445032119750977, "global_step": 354015, "epoch": 2107} {"train_loss": -12.268562316894531, "global_step": 354016, "epoch": 2107} {"train_loss": -12.454788208007812, "global_step": 354017, "epoch": 2107} {"train_loss": -12.152732849121094, "global_step": 354018, "epoch": 2107} {"train_loss": -12.328842163085938, "global_step": 354019, "epoch": 2107} {"train_loss": -12.35385799407959, "global_step": 354020, "epoch": 2107} {"train_loss": -12.67393970489502, "global_step": 354021, "epoch": 2107} {"train_loss": -12.322931289672852, "global_step": 354022, "epoch": 2107} {"train_loss": -12.503982543945312, "global_step": 354023, "epoch": 2107} {"train_loss": -12.574129104614258, "global_step": 354024, "epoch": 2107} {"train_loss": -12.405233383178711, "global_step": 354025, "epoch": 2107} {"train_loss": -12.267547607421875, "global_step": 354026, "epoch": 2107} {"train_loss": -12.195320129394531, "global_step": 354027, "epoch": 2107} {"train_loss": -12.091985702514648, "global_step": 354028, "epoch": 2107} {"train_loss": -11.854524612426758, "global_step": 354029, "epoch": 2107} {"train_loss": -12.23706340789795, "global_step": 354030, "epoch": 2107} {"train_loss": -11.972476959228516, "global_step": 354031, "epoch": 2107} {"train_loss": -12.451663970947266, "global_step": 354032, "epoch": 2107} {"train_loss": -12.51553726196289, "global_step": 354033, "epoch": 2107} {"train_loss": -12.281786918640137, "global_step": 354034, "epoch": 2107} {"train_loss": -12.572488784790039, "global_step": 354035, "epoch": 2107} {"train_loss": -12.67588996887207, "global_step": 354036, "epoch": 2107} {"train_loss": -12.590118408203125, "global_step": 354037, "epoch": 2107} {"train_loss": -12.644376754760742, "global_step": 354038, "epoch": 2107} {"train_loss": -12.670780181884766, "global_step": 354039, "epoch": 2107} {"train_loss": -12.513283729553223, "global_step": 354040, "epoch": 2107} {"train_loss": -12.530923843383789, "global_step": 354041, "epoch": 2107} {"train_loss": -12.677485466003418, "global_step": 354042, "epoch": 2107} {"train_loss": -12.507104873657227, "global_step": 354043, "epoch": 2107} {"train_loss": -12.726814270019531, "global_step": 354044, "epoch": 2107} {"train_loss": -12.498835563659668, "global_step": 354045, "epoch": 2107} {"train_loss": -12.895353317260742, "global_step": 354046, "epoch": 2107} {"train_loss": -12.43712043762207, "global_step": 354047, "epoch": 2107} {"train_loss": -12.32123851776123, "global_step": 354048, "epoch": 2107} {"train_loss": -12.306042671203613, "global_step": 354049, "epoch": 2107} {"train_loss": -12.682559967041016, "global_step": 354050, "epoch": 2107} {"train_loss": -12.320493698120117, "global_step": 354051, "epoch": 2107} {"train_loss": -12.370134353637695, "global_step": 354052, "epoch": 2107} {"train_loss": -12.371129035949707, "global_step": 354053, "epoch": 2107} {"train_loss": -12.011415481567383, "global_step": 354054, "epoch": 2107} {"train_loss": -12.385255813598633, "global_step": 354055, "epoch": 2107} {"train_loss": -12.586069107055664, "global_step": 354056, "epoch": 2107} {"train_loss": -12.215365409851074, "global_step": 354057, "epoch": 2107} {"train_loss": -12.558391571044922, "global_step": 354058, "epoch": 2107} {"train_loss": -12.421735763549805, "global_step": 354059, "epoch": 2107} {"train_loss": -11.797929763793945, "global_step": 354060, "epoch": 2107} {"train_loss": -12.469810485839844, "global_step": 354061, "epoch": 2107} {"train_loss": -12.43241024017334, "global_step": 354062, "epoch": 2107} {"train_loss": -12.313997268676758, "global_step": 354063, "epoch": 2107} {"train_loss": -12.104131698608398, "global_step": 354064, "epoch": 2107} {"train_loss": -12.189958572387695, "global_step": 354065, "epoch": 2107} {"train_loss": -12.284109115600586, "global_step": 354066, "epoch": 2107} {"train_loss": -12.398735046386719, "global_step": 354067, "epoch": 2107} {"train_loss": -12.53416633605957, "global_step": 354068, "epoch": 2107} {"train_loss": -11.983490943908691, "global_step": 354069, "epoch": 2107} {"train_loss": -11.706246376037598, "global_step": 354070, "epoch": 2107} {"train_loss": -12.541772842407227, "global_step": 354071, "epoch": 2107} {"train_loss": -12.174333572387695, "global_step": 354072, "epoch": 2107} {"train_loss": -11.419057846069336, "global_step": 354073, "epoch": 2107} {"train_loss": -11.527462005615234, "global_step": 354074, "epoch": 2107} {"train_loss": -11.93725299835205, "global_step": 354075, "epoch": 2107} {"train_loss": -9.998799324035645, "global_step": 354076, "epoch": 2107} {"train_loss": -11.751747131347656, "global_step": 354077, "epoch": 2107} {"train_loss": -10.82023811340332, "global_step": 354078, "epoch": 2107} {"train_loss": -11.476154327392578, "global_step": 354079, "epoch": 2107} {"train_loss": -11.723653793334961, "global_step": 354080, "epoch": 2107} {"train_loss": -9.625164985656738, "global_step": 354081, "epoch": 2107} {"train_loss": -11.84013557434082, "global_step": 354082, "epoch": 2107} {"train_loss": -11.758075714111328, "global_step": 354083, "epoch": 2107} {"train_loss": -11.336102485656738, "global_step": 354084, "epoch": 2107} {"train_loss": -12.362422943115234, "global_step": 354085, "epoch": 2107} {"train_loss": -11.787270545959473, "global_step": 354086, "epoch": 2107} {"train_loss": -12.205437660217285, "global_step": 354087, "epoch": 2107} {"train_loss": -12.383344650268555, "global_step": 354088, "epoch": 2107} {"train_loss": -12.191286087036133, "global_step": 354089, "epoch": 2107} {"train_loss": -12.124921798706055, "global_step": 354090, "epoch": 2107} {"train_loss": -12.236716270446777, "global_step": 354091, "epoch": 2107} {"train_loss": -11.850281715393066, "global_step": 354092, "epoch": 2107} {"train_loss": -12.145898818969727, "global_step": 354093, "epoch": 2107} {"train_loss": -12.458065032958984, "global_step": 354094, "epoch": 2107} {"train_loss": -11.7318115234375, "global_step": 354095, "epoch": 2107} {"train_loss": -11.791362762451172, "global_step": 354096, "epoch": 2107} {"train_loss": -12.361837387084961, "global_step": 354097, "epoch": 2107} {"train_loss": -11.885805130004883, "global_step": 354098, "epoch": 2107} {"train_loss": -12.295063018798828, "global_step": 354099, "epoch": 2107} {"train_loss": -12.157684326171875, "global_step": 354100, "epoch": 2107} {"train_loss": -12.384450912475586, "global_step": 354101, "epoch": 2107} {"train_loss": -12.082752227783203, "global_step": 354102, "epoch": 2107} {"train_loss": -12.301702499389648, "global_step": 354103, "epoch": 2107} {"train_loss": -12.42436408996582, "global_step": 354104, "epoch": 2107} {"train_loss": -12.197549819946289, "global_step": 354105, "epoch": 2107} {"train_loss": -11.722127914428711, "global_step": 354106, "epoch": 2107} {"train_loss": -12.269447326660156, "global_step": 354107, "epoch": 2107} {"train_loss": -10.884294509887695, "global_step": 354108, "epoch": 2107} {"train_loss": -10.286684036254883, "global_step": 354109, "epoch": 2107} {"train_loss": -11.886247634887695, "global_step": 354110, "epoch": 2107} {"train_loss": -9.754650115966797, "global_step": 354111, "epoch": 2107} {"train_loss": -10.429645538330078, "global_step": 354112, "epoch": 2107} {"train_loss": -10.234910011291504, "global_step": 354113, "epoch": 2107} {"train_loss": -10.145184516906738, "global_step": 354114, "epoch": 2107} {"train_loss": -11.361481666564941, "global_step": 354115, "epoch": 2107} {"train_loss": -10.553787231445312, "global_step": 354116, "epoch": 2107} {"train_loss": -10.903131484985352, "global_step": 354117, "epoch": 2107} {"train_loss": -11.226419448852539, "global_step": 354118, "epoch": 2107} {"train_loss": -10.872027397155762, "global_step": 354119, "epoch": 2107} {"train_loss": -11.02042293548584, "global_step": 354120, "epoch": 2107} {"train_loss": -10.964651107788086, "global_step": 354121, "epoch": 2107} {"train_loss": -11.169410705566406, "global_step": 354122, "epoch": 2107} {"train_loss": -11.733308792114258, "global_step": 354123, "epoch": 2107} {"train_loss": -10.711978912353516, "global_step": 354124, "epoch": 2107} {"train_loss": -11.727210998535156, "global_step": 354125, "epoch": 2107} {"train_loss": -11.682018280029297, "global_step": 354126, "epoch": 2107} {"train_loss": -11.09829330444336, "global_step": 354127, "epoch": 2107} {"train_loss": -11.188322067260742, "global_step": 354128, "epoch": 2107} {"train_loss": -11.352932929992676, "global_step": 354129, "epoch": 2107} {"train_loss": -11.37094497680664, "global_step": 354130, "epoch": 2107} {"train_loss": -11.516413688659668, "global_step": 354131, "epoch": 2107} {"train_loss": -11.780191421508789, "global_step": 354132, "epoch": 2107} {"train_loss": -11.624505996704102, "global_step": 354133, "epoch": 2107} {"train_loss": -11.702065467834473, "global_step": 354134, "epoch": 2107} {"train_loss": -11.440683364868164, "global_step": 354135, "epoch": 2107} {"train_loss": -11.978646278381348, "global_step": 354136, "epoch": 2107} {"train_loss": -11.808781623840332, "global_step": 354137, "epoch": 2107} {"train_loss": -11.727420806884766, "global_step": 354138, "epoch": 2107} {"train_loss": -11.952832221984863, "global_step": 354139, "epoch": 2107} {"train_loss": -12.049434661865234, "global_step": 354140, "epoch": 2107} {"train_loss": -12.265682220458984, "global_step": 354141, "epoch": 2107} {"train_loss": -11.632589340209961, "global_step": 354142, "epoch": 2107} {"train_loss": -11.946486393610636, "global_step": 354143, "epoch": 2107, "val_loss": 290053.375} {"train_loss": -12.251007080078125, "global_step": 354144, "epoch": 2108} {"train_loss": -11.846819877624512, "global_step": 354145, "epoch": 2108} {"train_loss": -12.22686767578125, "global_step": 354146, "epoch": 2108} {"train_loss": -11.974918365478516, "global_step": 354147, "epoch": 2108} {"train_loss": -11.84793472290039, "global_step": 354148, "epoch": 2108} {"train_loss": -12.033039093017578, "global_step": 354149, "epoch": 2108} {"train_loss": -12.048717498779297, "global_step": 354150, "epoch": 2108} {"train_loss": -12.206236839294434, "global_step": 354151, "epoch": 2108} {"train_loss": -12.201248168945312, "global_step": 354152, "epoch": 2108} {"train_loss": -12.414665222167969, "global_step": 354153, "epoch": 2108} {"train_loss": -12.209622383117676, "global_step": 354154, "epoch": 2108} {"train_loss": -12.095251083374023, "global_step": 354155, "epoch": 2108} {"train_loss": -12.059738159179688, "global_step": 354156, "epoch": 2108} {"train_loss": -12.062347412109375, "global_step": 354157, "epoch": 2108} {"train_loss": -12.260347366333008, "global_step": 354158, "epoch": 2108} {"train_loss": -12.225983619689941, "global_step": 354159, "epoch": 2108} {"train_loss": -12.109464645385742, "global_step": 354160, "epoch": 2108} {"train_loss": -12.560237884521484, "global_step": 354161, "epoch": 2108} {"train_loss": -12.1449556350708, "global_step": 354162, "epoch": 2108} {"train_loss": -12.221893310546875, "global_step": 354163, "epoch": 2108} {"train_loss": -12.074522018432617, "global_step": 354164, "epoch": 2108} {"train_loss": -12.369678497314453, "global_step": 354165, "epoch": 2108} {"train_loss": -12.139652252197266, "global_step": 354166, "epoch": 2108} {"train_loss": -12.038969039916992, "global_step": 354167, "epoch": 2108} {"train_loss": -12.219663619995117, "global_step": 354168, "epoch": 2108} {"train_loss": -12.049151420593262, "global_step": 354169, "epoch": 2108} {"train_loss": -12.362622261047363, "global_step": 354170, "epoch": 2108} {"train_loss": -12.109294891357422, "global_step": 354171, "epoch": 2108} {"train_loss": -12.283975601196289, "global_step": 354172, "epoch": 2108} {"train_loss": -12.383870124816895, "global_step": 354173, "epoch": 2108} {"train_loss": -12.193427085876465, "global_step": 354174, "epoch": 2108} {"train_loss": -12.61347770690918, "global_step": 354175, "epoch": 2108} {"train_loss": -12.17574691772461, "global_step": 354176, "epoch": 2108} {"train_loss": -12.393243789672852, "global_step": 354177, "epoch": 2108} {"train_loss": -12.428937911987305, "global_step": 354178, "epoch": 2108} {"train_loss": -12.308530807495117, "global_step": 354179, "epoch": 2108} {"train_loss": -12.285274505615234, "global_step": 354180, "epoch": 2108} {"train_loss": -12.194784164428711, "global_step": 354181, "epoch": 2108} {"train_loss": -12.650551795959473, "global_step": 354182, "epoch": 2108} {"train_loss": -12.173124313354492, "global_step": 354183, "epoch": 2108} {"train_loss": -12.362142562866211, "global_step": 354184, "epoch": 2108} {"train_loss": -12.604618072509766, "global_step": 354185, "epoch": 2108} {"train_loss": -12.371576309204102, "global_step": 354186, "epoch": 2108} {"train_loss": -12.29665756225586, "global_step": 354187, "epoch": 2108} {"train_loss": -12.461031913757324, "global_step": 354188, "epoch": 2108} {"train_loss": -12.29018783569336, "global_step": 354189, "epoch": 2108} {"train_loss": -12.256277084350586, "global_step": 354190, "epoch": 2108} {"train_loss": -12.356973648071289, "global_step": 354191, "epoch": 2108} {"train_loss": -12.370084762573242, "global_step": 354192, "epoch": 2108} {"train_loss": -12.315909385681152, "global_step": 354193, "epoch": 2108} {"train_loss": -12.483802795410156, "global_step": 354194, "epoch": 2108} {"train_loss": -12.378921508789062, "global_step": 354195, "epoch": 2108} {"train_loss": -12.671957969665527, "global_step": 354196, "epoch": 2108} {"train_loss": -12.368555068969727, "global_step": 354197, "epoch": 2108} {"train_loss": -12.686548233032227, "global_step": 354198, "epoch": 2108} {"train_loss": -11.886030197143555, "global_step": 354199, "epoch": 2108} {"train_loss": -12.382013320922852, "global_step": 354200, "epoch": 2108} {"train_loss": -12.239941596984863, "global_step": 354201, "epoch": 2108} {"train_loss": -12.582752227783203, "global_step": 354202, "epoch": 2108} {"train_loss": -12.077497482299805, "global_step": 354203, "epoch": 2108} {"train_loss": -12.16123104095459, "global_step": 354204, "epoch": 2108} {"train_loss": -12.052257537841797, "global_step": 354205, "epoch": 2108} {"train_loss": -12.524053573608398, "global_step": 354206, "epoch": 2108} {"train_loss": -11.75, "global_step": 354207, "epoch": 2108} {"train_loss": -12.598342895507812, "global_step": 354208, "epoch": 2108} {"train_loss": -11.33387565612793, "global_step": 354209, "epoch": 2108} {"train_loss": -12.562145233154297, "global_step": 354210, "epoch": 2108} {"train_loss": -11.480745315551758, "global_step": 354211, "epoch": 2108} {"train_loss": -12.326480865478516, "global_step": 354212, "epoch": 2108} {"train_loss": -11.794805526733398, "global_step": 354213, "epoch": 2108} {"train_loss": -12.584733963012695, "global_step": 354214, "epoch": 2108} {"train_loss": -11.821985244750977, "global_step": 354215, "epoch": 2108} {"train_loss": -12.132563591003418, "global_step": 354216, "epoch": 2108} {"train_loss": -12.229381561279297, "global_step": 354217, "epoch": 2108} {"train_loss": -12.428224563598633, "global_step": 354218, "epoch": 2108} {"train_loss": -12.329788208007812, "global_step": 354219, "epoch": 2108} {"train_loss": -12.16259765625, "global_step": 354220, "epoch": 2108} {"train_loss": -12.596943855285645, "global_step": 354221, "epoch": 2108} {"train_loss": -11.90029525756836, "global_step": 354222, "epoch": 2108} {"train_loss": -12.486894607543945, "global_step": 354223, "epoch": 2108} {"train_loss": -11.877015113830566, "global_step": 354224, "epoch": 2108} {"train_loss": -12.37611198425293, "global_step": 354225, "epoch": 2108} {"train_loss": -12.403016090393066, "global_step": 354226, "epoch": 2108} {"train_loss": -12.343048095703125, "global_step": 354227, "epoch": 2108} {"train_loss": -12.340036392211914, "global_step": 354228, "epoch": 2108} {"train_loss": -12.276897430419922, "global_step": 354229, "epoch": 2108} {"train_loss": -12.64141845703125, "global_step": 354230, "epoch": 2108} {"train_loss": -12.581925392150879, "global_step": 354231, "epoch": 2108} {"train_loss": -12.378517150878906, "global_step": 354232, "epoch": 2108} {"train_loss": -12.460029602050781, "global_step": 354233, "epoch": 2108} {"train_loss": -12.468890190124512, "global_step": 354234, "epoch": 2108} {"train_loss": -12.492948532104492, "global_step": 354235, "epoch": 2108} {"train_loss": -12.355676651000977, "global_step": 354236, "epoch": 2108} {"train_loss": -12.491071701049805, "global_step": 354237, "epoch": 2108} {"train_loss": -12.641027450561523, "global_step": 354238, "epoch": 2108} {"train_loss": -12.501764297485352, "global_step": 354239, "epoch": 2108} {"train_loss": -12.331392288208008, "global_step": 354240, "epoch": 2108} {"train_loss": -11.789599418640137, "global_step": 354241, "epoch": 2108} {"train_loss": -12.596456527709961, "global_step": 354242, "epoch": 2108} {"train_loss": -12.165390014648438, "global_step": 354243, "epoch": 2108} {"train_loss": -11.633398056030273, "global_step": 354244, "epoch": 2108} {"train_loss": -12.233530044555664, "global_step": 354245, "epoch": 2108} {"train_loss": -10.538315773010254, "global_step": 354246, "epoch": 2108} {"train_loss": -11.93387508392334, "global_step": 354247, "epoch": 2108} {"train_loss": -12.024351119995117, "global_step": 354248, "epoch": 2108} {"train_loss": -11.318124771118164, "global_step": 354249, "epoch": 2108} {"train_loss": -12.410640716552734, "global_step": 354250, "epoch": 2108} {"train_loss": -11.668684005737305, "global_step": 354251, "epoch": 2108} {"train_loss": -11.05883502960205, "global_step": 354252, "epoch": 2108} {"train_loss": -12.37663459777832, "global_step": 354253, "epoch": 2108} {"train_loss": -10.020153999328613, "global_step": 354254, "epoch": 2108} {"train_loss": -12.266374588012695, "global_step": 354255, "epoch": 2108} {"train_loss": -10.52627944946289, "global_step": 354256, "epoch": 2108} {"train_loss": -11.89907455444336, "global_step": 354257, "epoch": 2108} {"train_loss": -11.340615272521973, "global_step": 354258, "epoch": 2108} {"train_loss": -11.66919231414795, "global_step": 354259, "epoch": 2108} {"train_loss": -10.739875793457031, "global_step": 354260, "epoch": 2108} {"train_loss": -11.410075187683105, "global_step": 354261, "epoch": 2108} {"train_loss": -11.302434921264648, "global_step": 354262, "epoch": 2108} {"train_loss": -11.324503898620605, "global_step": 354263, "epoch": 2108} {"train_loss": -10.244873046875, "global_step": 354264, "epoch": 2108} {"train_loss": -9.833662033081055, "global_step": 354265, "epoch": 2108} {"train_loss": -10.527872085571289, "global_step": 354266, "epoch": 2108} {"train_loss": -11.347397804260254, "global_step": 354267, "epoch": 2108} {"train_loss": -11.164379119873047, "global_step": 354268, "epoch": 2108} {"train_loss": -10.950247764587402, "global_step": 354269, "epoch": 2108} {"train_loss": -11.503573417663574, "global_step": 354270, "epoch": 2108} {"train_loss": -11.562780380249023, "global_step": 354271, "epoch": 2108} {"train_loss": -11.963367462158203, "global_step": 354272, "epoch": 2108} {"train_loss": -11.500732421875, "global_step": 354273, "epoch": 2108} {"train_loss": -12.164021492004395, "global_step": 354274, "epoch": 2108} {"train_loss": -11.56932258605957, "global_step": 354275, "epoch": 2108} {"train_loss": -11.930426597595215, "global_step": 354276, "epoch": 2108} {"train_loss": -11.860394477844238, "global_step": 354277, "epoch": 2108} {"train_loss": -11.77754020690918, "global_step": 354278, "epoch": 2108} {"train_loss": -12.196696281433105, "global_step": 354279, "epoch": 2108} {"train_loss": -11.880743026733398, "global_step": 354280, "epoch": 2108} {"train_loss": -11.933683395385742, "global_step": 354281, "epoch": 2108} {"train_loss": -11.889557838439941, "global_step": 354282, "epoch": 2108} {"train_loss": -12.026178359985352, "global_step": 354283, "epoch": 2108} {"train_loss": -12.261428833007812, "global_step": 354284, "epoch": 2108} {"train_loss": -12.01409912109375, "global_step": 354285, "epoch": 2108} {"train_loss": -11.925260543823242, "global_step": 354286, "epoch": 2108} {"train_loss": -12.396594047546387, "global_step": 354287, "epoch": 2108} {"train_loss": -12.166765213012695, "global_step": 354288, "epoch": 2108} {"train_loss": -12.310611724853516, "global_step": 354289, "epoch": 2108} {"train_loss": -12.169473648071289, "global_step": 354290, "epoch": 2108} {"train_loss": -12.28797435760498, "global_step": 354291, "epoch": 2108} {"train_loss": -12.044490814208984, "global_step": 354292, "epoch": 2108} {"train_loss": -12.215242385864258, "global_step": 354293, "epoch": 2108} {"train_loss": -11.933992385864258, "global_step": 354294, "epoch": 2108} {"train_loss": -12.434616088867188, "global_step": 354295, "epoch": 2108} {"train_loss": -12.333226203918457, "global_step": 354296, "epoch": 2108} {"train_loss": -12.148279190063477, "global_step": 354297, "epoch": 2108} {"train_loss": -12.35158920288086, "global_step": 354298, "epoch": 2108} {"train_loss": -12.379899024963379, "global_step": 354299, "epoch": 2108} {"train_loss": -12.356752395629883, "global_step": 354300, "epoch": 2108} {"train_loss": -12.282247543334961, "global_step": 354301, "epoch": 2108} {"train_loss": -12.392507553100586, "global_step": 354302, "epoch": 2108} {"train_loss": -12.021492004394531, "global_step": 354303, "epoch": 2108} {"train_loss": -12.171051025390625, "global_step": 354304, "epoch": 2108} {"train_loss": -11.730484008789062, "global_step": 354305, "epoch": 2108} {"train_loss": -12.159635543823242, "global_step": 354306, "epoch": 2108} {"train_loss": -12.139763832092285, "global_step": 354307, "epoch": 2108} {"train_loss": -11.47812271118164, "global_step": 354308, "epoch": 2108} {"train_loss": -12.212058067321777, "global_step": 354309, "epoch": 2108} {"train_loss": -12.160357475280762, "global_step": 354310, "epoch": 2108} {"train_loss": -12.058459838231405, "global_step": 354311, "epoch": 2108, "val_loss": 288901.46875} {"train_loss": -11.37386417388916, "global_step": 354312, "epoch": 2109} {"train_loss": -12.305763244628906, "global_step": 354313, "epoch": 2109} {"train_loss": -11.866246223449707, "global_step": 354314, "epoch": 2109} {"train_loss": -11.56180477142334, "global_step": 354315, "epoch": 2109} {"train_loss": -11.953869819641113, "global_step": 354316, "epoch": 2109} {"train_loss": -12.170385360717773, "global_step": 354317, "epoch": 2109} {"train_loss": -11.764079093933105, "global_step": 354318, "epoch": 2109} {"train_loss": -12.0921630859375, "global_step": 354319, "epoch": 2109} {"train_loss": -11.865906715393066, "global_step": 354320, "epoch": 2109} {"train_loss": -12.020203590393066, "global_step": 354321, "epoch": 2109} {"train_loss": -12.03615951538086, "global_step": 354322, "epoch": 2109} {"train_loss": -12.106472969055176, "global_step": 354323, "epoch": 2109} {"train_loss": -12.304180145263672, "global_step": 354324, "epoch": 2109} {"train_loss": -12.038454055786133, "global_step": 354325, "epoch": 2109} {"train_loss": -12.095172882080078, "global_step": 354326, "epoch": 2109} {"train_loss": -12.4608154296875, "global_step": 354327, "epoch": 2109} {"train_loss": -12.325404167175293, "global_step": 354328, "epoch": 2109} {"train_loss": -12.018558502197266, "global_step": 354329, "epoch": 2109} {"train_loss": -12.458332061767578, "global_step": 354330, "epoch": 2109} {"train_loss": -12.354837417602539, "global_step": 354331, "epoch": 2109} {"train_loss": -12.245180130004883, "global_step": 354332, "epoch": 2109} {"train_loss": -12.463741302490234, "global_step": 354333, "epoch": 2109} {"train_loss": -12.305811882019043, "global_step": 354334, "epoch": 2109} {"train_loss": -12.56908130645752, "global_step": 354335, "epoch": 2109} {"train_loss": -12.375031471252441, "global_step": 354336, "epoch": 2109} {"train_loss": -12.576051712036133, "global_step": 354337, "epoch": 2109} {"train_loss": -11.9942626953125, "global_step": 354338, "epoch": 2109} {"train_loss": -12.50722885131836, "global_step": 354339, "epoch": 2109} {"train_loss": -12.006914138793945, "global_step": 354340, "epoch": 2109} {"train_loss": -12.660873413085938, "global_step": 354341, "epoch": 2109} {"train_loss": -12.22750473022461, "global_step": 354342, "epoch": 2109} {"train_loss": -12.433425903320312, "global_step": 354343, "epoch": 2109} {"train_loss": -12.41645622253418, "global_step": 354344, "epoch": 2109} {"train_loss": -12.320711135864258, "global_step": 354345, "epoch": 2109} {"train_loss": -11.874752044677734, "global_step": 354346, "epoch": 2109} {"train_loss": -12.227579116821289, "global_step": 354347, "epoch": 2109} {"train_loss": -12.335935592651367, "global_step": 354348, "epoch": 2109} {"train_loss": -11.890214920043945, "global_step": 354349, "epoch": 2109} {"train_loss": -11.881105422973633, "global_step": 354350, "epoch": 2109} {"train_loss": -11.187590599060059, "global_step": 354351, "epoch": 2109} {"train_loss": -12.337957382202148, "global_step": 354352, "epoch": 2109} {"train_loss": -10.704204559326172, "global_step": 354353, "epoch": 2109} {"train_loss": -10.038673400878906, "global_step": 354354, "epoch": 2109} {"train_loss": -10.709304809570312, "global_step": 354355, "epoch": 2109} {"train_loss": -10.026432037353516, "global_step": 354356, "epoch": 2109} {"train_loss": -10.737449645996094, "global_step": 354357, "epoch": 2109} {"train_loss": -10.046575546264648, "global_step": 354358, "epoch": 2109} {"train_loss": -10.336974143981934, "global_step": 354359, "epoch": 2109} {"train_loss": -9.976608276367188, "global_step": 354360, "epoch": 2109} {"train_loss": -11.017992973327637, "global_step": 354361, "epoch": 2109} {"train_loss": -10.249074935913086, "global_step": 354362, "epoch": 2109} {"train_loss": -10.528264999389648, "global_step": 354363, "epoch": 2109} {"train_loss": -10.155683517456055, "global_step": 354364, "epoch": 2109} {"train_loss": -10.512960433959961, "global_step": 354365, "epoch": 2109} {"train_loss": -10.169971466064453, "global_step": 354366, "epoch": 2109} {"train_loss": -10.413839340209961, "global_step": 354367, "epoch": 2109} {"train_loss": -10.628315925598145, "global_step": 354368, "epoch": 2109} {"train_loss": -12.04215145111084, "global_step": 354369, "epoch": 2109} {"train_loss": -10.205484390258789, "global_step": 354370, "epoch": 2109} {"train_loss": -11.729743957519531, "global_step": 354371, "epoch": 2109} {"train_loss": -10.782157897949219, "global_step": 354372, "epoch": 2109} {"train_loss": -10.17473030090332, "global_step": 354373, "epoch": 2109} {"train_loss": -11.543390274047852, "global_step": 354374, "epoch": 2109} {"train_loss": -10.756097793579102, "global_step": 354375, "epoch": 2109} {"train_loss": -10.530723571777344, "global_step": 354376, "epoch": 2109} {"train_loss": -11.27016830444336, "global_step": 354377, "epoch": 2109} {"train_loss": -11.423760414123535, "global_step": 354378, "epoch": 2109} {"train_loss": -11.896492004394531, "global_step": 354379, "epoch": 2109} {"train_loss": -11.213910102844238, "global_step": 354380, "epoch": 2109} {"train_loss": -11.507474899291992, "global_step": 354381, "epoch": 2109} {"train_loss": -10.959650993347168, "global_step": 354382, "epoch": 2109} {"train_loss": -11.159984588623047, "global_step": 354383, "epoch": 2109} {"train_loss": -11.622461318969727, "global_step": 354384, "epoch": 2109} {"train_loss": -11.646223068237305, "global_step": 354385, "epoch": 2109} {"train_loss": -11.289881706237793, "global_step": 354386, "epoch": 2109} {"train_loss": -11.46596908569336, "global_step": 354387, "epoch": 2109} {"train_loss": -11.27306842803955, "global_step": 354388, "epoch": 2109} {"train_loss": -11.817376136779785, "global_step": 354389, "epoch": 2109} {"train_loss": -11.254981994628906, "global_step": 354390, "epoch": 2109} {"train_loss": -11.786466598510742, "global_step": 354391, "epoch": 2109} {"train_loss": -11.559370040893555, "global_step": 354392, "epoch": 2109} {"train_loss": -11.998451232910156, "global_step": 354393, "epoch": 2109} {"train_loss": -11.785469055175781, "global_step": 354394, "epoch": 2109} {"train_loss": -11.980897903442383, "global_step": 354395, "epoch": 2109} {"train_loss": -11.767623901367188, "global_step": 354396, "epoch": 2109} {"train_loss": -12.071527481079102, "global_step": 354397, "epoch": 2109} {"train_loss": -11.523228645324707, "global_step": 354398, "epoch": 2109} {"train_loss": -12.159058570861816, "global_step": 354399, "epoch": 2109} {"train_loss": -11.976545333862305, "global_step": 354400, "epoch": 2109} {"train_loss": -11.75828742980957, "global_step": 354401, "epoch": 2109} {"train_loss": -12.383350372314453, "global_step": 354402, "epoch": 2109} {"train_loss": -11.598447799682617, "global_step": 354403, "epoch": 2109} {"train_loss": -11.860511779785156, "global_step": 354404, "epoch": 2109} {"train_loss": -12.060510635375977, "global_step": 354405, "epoch": 2109} {"train_loss": -11.745695114135742, "global_step": 354406, "epoch": 2109} {"train_loss": -12.245019912719727, "global_step": 354407, "epoch": 2109} {"train_loss": -11.965015411376953, "global_step": 354408, "epoch": 2109} {"train_loss": -11.957906723022461, "global_step": 354409, "epoch": 2109} {"train_loss": -12.212716102600098, "global_step": 354410, "epoch": 2109} {"train_loss": -11.631361961364746, "global_step": 354411, "epoch": 2109} {"train_loss": -11.967782020568848, "global_step": 354412, "epoch": 2109} {"train_loss": -11.845914840698242, "global_step": 354413, "epoch": 2109} {"train_loss": -11.798298835754395, "global_step": 354414, "epoch": 2109} {"train_loss": -11.94979476928711, "global_step": 354415, "epoch": 2109} {"train_loss": -11.525863647460938, "global_step": 354416, "epoch": 2109} {"train_loss": -11.69668197631836, "global_step": 354417, "epoch": 2109} {"train_loss": -11.766704559326172, "global_step": 354418, "epoch": 2109} {"train_loss": -11.569367408752441, "global_step": 354419, "epoch": 2109} {"train_loss": -11.481369972229004, "global_step": 354420, "epoch": 2109} {"train_loss": -11.646300315856934, "global_step": 354421, "epoch": 2109} {"train_loss": -11.413625717163086, "global_step": 354422, "epoch": 2109} {"train_loss": -11.741047859191895, "global_step": 354423, "epoch": 2109} {"train_loss": -11.310430526733398, "global_step": 354424, "epoch": 2109} {"train_loss": -11.820023536682129, "global_step": 354425, "epoch": 2109} {"train_loss": -11.635807991027832, "global_step": 354426, "epoch": 2109} {"train_loss": -11.84786605834961, "global_step": 354427, "epoch": 2109} {"train_loss": -11.484418869018555, "global_step": 354428, "epoch": 2109} {"train_loss": -12.138029098510742, "global_step": 354429, "epoch": 2109} {"train_loss": -11.727470397949219, "global_step": 354430, "epoch": 2109} {"train_loss": -12.09366226196289, "global_step": 354431, "epoch": 2109} {"train_loss": -11.992450714111328, "global_step": 354432, "epoch": 2109} {"train_loss": -11.906566619873047, "global_step": 354433, "epoch": 2109} {"train_loss": -11.885414123535156, "global_step": 354434, "epoch": 2109} {"train_loss": -12.017641067504883, "global_step": 354435, "epoch": 2109} {"train_loss": -11.726736068725586, "global_step": 354436, "epoch": 2109} {"train_loss": -12.28683090209961, "global_step": 354437, "epoch": 2109} {"train_loss": -12.027284622192383, "global_step": 354438, "epoch": 2109} {"train_loss": -11.850667953491211, "global_step": 354439, "epoch": 2109} {"train_loss": -12.319432258605957, "global_step": 354440, "epoch": 2109} {"train_loss": -12.098499298095703, "global_step": 354441, "epoch": 2109} {"train_loss": -12.467620849609375, "global_step": 354442, "epoch": 2109} {"train_loss": -12.128643989562988, "global_step": 354443, "epoch": 2109} {"train_loss": -12.202603340148926, "global_step": 354444, "epoch": 2109} {"train_loss": -12.420089721679688, "global_step": 354445, "epoch": 2109} {"train_loss": -12.263752937316895, "global_step": 354446, "epoch": 2109} {"train_loss": -12.357476234436035, "global_step": 354447, "epoch": 2109} {"train_loss": -12.189361572265625, "global_step": 354448, "epoch": 2109} {"train_loss": -12.300414085388184, "global_step": 354449, "epoch": 2109} {"train_loss": -12.13880729675293, "global_step": 354450, "epoch": 2109} {"train_loss": -12.411052703857422, "global_step": 354451, "epoch": 2109} {"train_loss": -12.210447311401367, "global_step": 354452, "epoch": 2109} {"train_loss": -12.350019454956055, "global_step": 354453, "epoch": 2109} {"train_loss": -12.425664901733398, "global_step": 354454, "epoch": 2109} {"train_loss": -12.222210884094238, "global_step": 354455, "epoch": 2109} {"train_loss": -12.4625883102417, "global_step": 354456, "epoch": 2109} {"train_loss": -12.282474517822266, "global_step": 354457, "epoch": 2109} {"train_loss": -12.547679901123047, "global_step": 354458, "epoch": 2109} {"train_loss": -12.42197036743164, "global_step": 354459, "epoch": 2109} {"train_loss": -12.071690559387207, "global_step": 354460, "epoch": 2109} {"train_loss": -12.368976593017578, "global_step": 354461, "epoch": 2109} {"train_loss": -12.42588996887207, "global_step": 354462, "epoch": 2109} {"train_loss": -11.914112091064453, "global_step": 354463, "epoch": 2109} {"train_loss": -12.549181938171387, "global_step": 354464, "epoch": 2109} {"train_loss": -11.699490547180176, "global_step": 354465, "epoch": 2109} {"train_loss": -12.490808486938477, "global_step": 354466, "epoch": 2109} {"train_loss": -12.026802062988281, "global_step": 354467, "epoch": 2109} {"train_loss": -12.245040893554688, "global_step": 354468, "epoch": 2109} {"train_loss": -12.03650951385498, "global_step": 354469, "epoch": 2109} {"train_loss": -11.844022750854492, "global_step": 354470, "epoch": 2109} {"train_loss": -11.661426544189453, "global_step": 354471, "epoch": 2109} {"train_loss": -12.128780364990234, "global_step": 354472, "epoch": 2109} {"train_loss": -11.972000122070312, "global_step": 354473, "epoch": 2109} {"train_loss": -12.110017776489258, "global_step": 354474, "epoch": 2109} {"train_loss": -11.919255256652832, "global_step": 354475, "epoch": 2109} {"train_loss": -11.505332946777344, "global_step": 354476, "epoch": 2109} {"train_loss": -11.76944351196289, "global_step": 354477, "epoch": 2109} {"train_loss": -12.058274269104004, "global_step": 354478, "epoch": 2109} {"train_loss": -11.777756918044318, "global_step": 354479, "epoch": 2109, "val_loss": 292401.03125} {"train_loss": -11.96343994140625, "global_step": 354480, "epoch": 2110} {"train_loss": -12.235435485839844, "global_step": 354481, "epoch": 2110} {"train_loss": -11.96731185913086, "global_step": 354482, "epoch": 2110} {"train_loss": -12.183907508850098, "global_step": 354483, "epoch": 2110} {"train_loss": -12.17083740234375, "global_step": 354484, "epoch": 2110} {"train_loss": -12.032838821411133, "global_step": 354485, "epoch": 2110} {"train_loss": -12.291303634643555, "global_step": 354486, "epoch": 2110} {"train_loss": -11.962055206298828, "global_step": 354487, "epoch": 2110} {"train_loss": -12.26728630065918, "global_step": 354488, "epoch": 2110} {"train_loss": -12.094503402709961, "global_step": 354489, "epoch": 2110} {"train_loss": -11.850910186767578, "global_step": 354490, "epoch": 2110} {"train_loss": -12.333433151245117, "global_step": 354491, "epoch": 2110} {"train_loss": -11.409585952758789, "global_step": 354492, "epoch": 2110} {"train_loss": -11.625753402709961, "global_step": 354493, "epoch": 2110} {"train_loss": -11.092057228088379, "global_step": 354494, "epoch": 2110} {"train_loss": -11.759781837463379, "global_step": 354495, "epoch": 2110} {"train_loss": -11.678279876708984, "global_step": 354496, "epoch": 2110} {"train_loss": -10.924076080322266, "global_step": 354497, "epoch": 2110} {"train_loss": -11.597980499267578, "global_step": 354498, "epoch": 2110} {"train_loss": -10.890772819519043, "global_step": 354499, "epoch": 2110} {"train_loss": -11.936212539672852, "global_step": 354500, "epoch": 2110} {"train_loss": -10.916187286376953, "global_step": 354501, "epoch": 2110} {"train_loss": -11.169717788696289, "global_step": 354502, "epoch": 2110} {"train_loss": -11.246604919433594, "global_step": 354503, "epoch": 2110} {"train_loss": -10.29033088684082, "global_step": 354504, "epoch": 2110} {"train_loss": -11.91631031036377, "global_step": 354505, "epoch": 2110} {"train_loss": -10.548666000366211, "global_step": 354506, "epoch": 2110} {"train_loss": -12.031549453735352, "global_step": 354507, "epoch": 2110} {"train_loss": -11.192109107971191, "global_step": 354508, "epoch": 2110} {"train_loss": -11.918228149414062, "global_step": 354509, "epoch": 2110} {"train_loss": -11.275697708129883, "global_step": 354510, "epoch": 2110} {"train_loss": -11.747739791870117, "global_step": 354511, "epoch": 2110} {"train_loss": -11.562784194946289, "global_step": 354512, "epoch": 2110} {"train_loss": -11.662345886230469, "global_step": 354513, "epoch": 2110} {"train_loss": -11.999741554260254, "global_step": 354514, "epoch": 2110} {"train_loss": -11.535919189453125, "global_step": 354515, "epoch": 2110} {"train_loss": -12.268927574157715, "global_step": 354516, "epoch": 2110} {"train_loss": -12.067136764526367, "global_step": 354517, "epoch": 2110} {"train_loss": -12.220586776733398, "global_step": 354518, "epoch": 2110} {"train_loss": -12.149142265319824, "global_step": 354519, "epoch": 2110} {"train_loss": -11.928803443908691, "global_step": 354520, "epoch": 2110} {"train_loss": -11.997241973876953, "global_step": 354521, "epoch": 2110} {"train_loss": -12.296594619750977, "global_step": 354522, "epoch": 2110} {"train_loss": -12.268020629882812, "global_step": 354523, "epoch": 2110} {"train_loss": -12.172243118286133, "global_step": 354524, "epoch": 2110} {"train_loss": -12.077777862548828, "global_step": 354525, "epoch": 2110} {"train_loss": -12.450032234191895, "global_step": 354526, "epoch": 2110} {"train_loss": -12.231188774108887, "global_step": 354527, "epoch": 2110} {"train_loss": -12.286565780639648, "global_step": 354528, "epoch": 2110} {"train_loss": -12.102099418640137, "global_step": 354529, "epoch": 2110} {"train_loss": -12.32295036315918, "global_step": 354530, "epoch": 2110} {"train_loss": -12.117816925048828, "global_step": 354531, "epoch": 2110} {"train_loss": -12.147745132446289, "global_step": 354532, "epoch": 2110} {"train_loss": -12.127038955688477, "global_step": 354533, "epoch": 2110} {"train_loss": -11.956088066101074, "global_step": 354534, "epoch": 2110} {"train_loss": -12.114641189575195, "global_step": 354535, "epoch": 2110} {"train_loss": -11.834287643432617, "global_step": 354536, "epoch": 2110} {"train_loss": -12.228031158447266, "global_step": 354537, "epoch": 2110} {"train_loss": -11.721199989318848, "global_step": 354538, "epoch": 2110} {"train_loss": -12.136026382446289, "global_step": 354539, "epoch": 2110} {"train_loss": -11.511581420898438, "global_step": 354540, "epoch": 2110} {"train_loss": -11.874074935913086, "global_step": 354541, "epoch": 2110} {"train_loss": -12.002240180969238, "global_step": 354542, "epoch": 2110} {"train_loss": -12.17062759399414, "global_step": 354543, "epoch": 2110} {"train_loss": -12.309296607971191, "global_step": 354544, "epoch": 2110} {"train_loss": -11.959732055664062, "global_step": 354545, "epoch": 2110} {"train_loss": -12.341606140136719, "global_step": 354546, "epoch": 2110} {"train_loss": -11.908855438232422, "global_step": 354547, "epoch": 2110} {"train_loss": -12.416288375854492, "global_step": 354548, "epoch": 2110} {"train_loss": -11.884040832519531, "global_step": 354549, "epoch": 2110} {"train_loss": -12.233154296875, "global_step": 354550, "epoch": 2110} {"train_loss": -12.362409591674805, "global_step": 354551, "epoch": 2110} {"train_loss": -12.254554748535156, "global_step": 354552, "epoch": 2110} {"train_loss": -12.364297866821289, "global_step": 354553, "epoch": 2110} {"train_loss": -12.235207557678223, "global_step": 354554, "epoch": 2110} {"train_loss": -12.561513900756836, "global_step": 354555, "epoch": 2110} {"train_loss": -12.225945472717285, "global_step": 354556, "epoch": 2110} {"train_loss": -12.472941398620605, "global_step": 354557, "epoch": 2110} {"train_loss": -12.231724739074707, "global_step": 354558, "epoch": 2110} {"train_loss": -12.043058395385742, "global_step": 354559, "epoch": 2110} {"train_loss": -12.263031005859375, "global_step": 354560, "epoch": 2110} {"train_loss": -12.135148048400879, "global_step": 354561, "epoch": 2110} {"train_loss": -12.321340560913086, "global_step": 354562, "epoch": 2110} {"train_loss": -11.561321258544922, "global_step": 354563, "epoch": 2110} {"train_loss": -11.337006568908691, "global_step": 354564, "epoch": 2110} {"train_loss": -12.167028427124023, "global_step": 354565, "epoch": 2110} {"train_loss": -11.94955825805664, "global_step": 354566, "epoch": 2110} {"train_loss": -11.64556884765625, "global_step": 354567, "epoch": 2110} {"train_loss": -11.525216102600098, "global_step": 354568, "epoch": 2110} {"train_loss": -12.231147766113281, "global_step": 354569, "epoch": 2110} {"train_loss": -11.895965576171875, "global_step": 354570, "epoch": 2110} {"train_loss": -11.769237518310547, "global_step": 354571, "epoch": 2110} {"train_loss": -12.353673934936523, "global_step": 354572, "epoch": 2110} {"train_loss": -11.446008682250977, "global_step": 354573, "epoch": 2110} {"train_loss": -11.68714714050293, "global_step": 354574, "epoch": 2110} {"train_loss": -11.546440124511719, "global_step": 354575, "epoch": 2110} {"train_loss": -10.518041610717773, "global_step": 354576, "epoch": 2110} {"train_loss": -12.387430191040039, "global_step": 354577, "epoch": 2110} {"train_loss": -11.358114242553711, "global_step": 354578, "epoch": 2110} {"train_loss": -12.018949508666992, "global_step": 354579, "epoch": 2110} {"train_loss": -11.698518753051758, "global_step": 354580, "epoch": 2110} {"train_loss": -10.996516227722168, "global_step": 354581, "epoch": 2110} {"train_loss": -12.331911087036133, "global_step": 354582, "epoch": 2110} {"train_loss": -11.378032684326172, "global_step": 354583, "epoch": 2110} {"train_loss": -11.824612617492676, "global_step": 354584, "epoch": 2110} {"train_loss": -11.311651229858398, "global_step": 354585, "epoch": 2110} {"train_loss": -10.95485782623291, "global_step": 354586, "epoch": 2110} {"train_loss": -11.864969253540039, "global_step": 354587, "epoch": 2110} {"train_loss": -11.346181869506836, "global_step": 354588, "epoch": 2110} {"train_loss": -11.883283615112305, "global_step": 354589, "epoch": 2110} {"train_loss": -11.59025764465332, "global_step": 354590, "epoch": 2110} {"train_loss": -11.224275588989258, "global_step": 354591, "epoch": 2110} {"train_loss": -11.809093475341797, "global_step": 354592, "epoch": 2110} {"train_loss": -11.845283508300781, "global_step": 354593, "epoch": 2110} {"train_loss": -11.46923828125, "global_step": 354594, "epoch": 2110} {"train_loss": -12.067262649536133, "global_step": 354595, "epoch": 2110} {"train_loss": -11.576766014099121, "global_step": 354596, "epoch": 2110} {"train_loss": -12.150556564331055, "global_step": 354597, "epoch": 2110} {"train_loss": -11.933393478393555, "global_step": 354598, "epoch": 2110} {"train_loss": -11.9913330078125, "global_step": 354599, "epoch": 2110} {"train_loss": -12.04155158996582, "global_step": 354600, "epoch": 2110} {"train_loss": -12.154045104980469, "global_step": 354601, "epoch": 2110} {"train_loss": -11.889843940734863, "global_step": 354602, "epoch": 2110} {"train_loss": -12.266725540161133, "global_step": 354603, "epoch": 2110} {"train_loss": -12.02938461303711, "global_step": 354604, "epoch": 2110} {"train_loss": -12.288240432739258, "global_step": 354605, "epoch": 2110} {"train_loss": -12.302103996276855, "global_step": 354606, "epoch": 2110} {"train_loss": -12.105938911437988, "global_step": 354607, "epoch": 2110} {"train_loss": -12.38682746887207, "global_step": 354608, "epoch": 2110} {"train_loss": -12.209680557250977, "global_step": 354609, "epoch": 2110} {"train_loss": -12.264341354370117, "global_step": 354610, "epoch": 2110} {"train_loss": -12.172264099121094, "global_step": 354611, "epoch": 2110} {"train_loss": -12.116165161132812, "global_step": 354612, "epoch": 2110} {"train_loss": -12.175430297851562, "global_step": 354613, "epoch": 2110} {"train_loss": -12.322792053222656, "global_step": 354614, "epoch": 2110} {"train_loss": -12.094476699829102, "global_step": 354615, "epoch": 2110} {"train_loss": -12.505290985107422, "global_step": 354616, "epoch": 2110} {"train_loss": -12.05022144317627, "global_step": 354617, "epoch": 2110} {"train_loss": -12.265401840209961, "global_step": 354618, "epoch": 2110} {"train_loss": -12.48428726196289, "global_step": 354619, "epoch": 2110} {"train_loss": -11.721238136291504, "global_step": 354620, "epoch": 2110} {"train_loss": -12.46036434173584, "global_step": 354621, "epoch": 2110} {"train_loss": -12.098759651184082, "global_step": 354622, "epoch": 2110} {"train_loss": -12.294672966003418, "global_step": 354623, "epoch": 2110} {"train_loss": -12.189679145812988, "global_step": 354624, "epoch": 2110} {"train_loss": -12.235071182250977, "global_step": 354625, "epoch": 2110} {"train_loss": -12.041142463684082, "global_step": 354626, "epoch": 2110} {"train_loss": -12.186870574951172, "global_step": 354627, "epoch": 2110} {"train_loss": -12.219743728637695, "global_step": 354628, "epoch": 2110} {"train_loss": -11.862771987915039, "global_step": 354629, "epoch": 2110} {"train_loss": -12.23354721069336, "global_step": 354630, "epoch": 2110} {"train_loss": -12.349187850952148, "global_step": 354631, "epoch": 2110} {"train_loss": -12.079206466674805, "global_step": 354632, "epoch": 2110} {"train_loss": -12.328889846801758, "global_step": 354633, "epoch": 2110} {"train_loss": -11.708913803100586, "global_step": 354634, "epoch": 2110} {"train_loss": -11.637618064880371, "global_step": 354635, "epoch": 2110} {"train_loss": -11.98833179473877, "global_step": 354636, "epoch": 2110} {"train_loss": -10.969639778137207, "global_step": 354637, "epoch": 2110} {"train_loss": -12.052057266235352, "global_step": 354638, "epoch": 2110} {"train_loss": -12.017484664916992, "global_step": 354639, "epoch": 2110} {"train_loss": -12.249641418457031, "global_step": 354640, "epoch": 2110} {"train_loss": -12.099096298217773, "global_step": 354641, "epoch": 2110} {"train_loss": -11.575525283813477, "global_step": 354642, "epoch": 2110} {"train_loss": -12.394925117492676, "global_step": 354643, "epoch": 2110} {"train_loss": -11.600918769836426, "global_step": 354644, "epoch": 2110} {"train_loss": -12.148218154907227, "global_step": 354645, "epoch": 2110} {"train_loss": -12.032301902770996, "global_step": 354646, "epoch": 2110} {"train_loss": -11.928413992836362, "global_step": 354647, "epoch": 2110, "val_loss": 291380.0625, "train_action_mse_error": 1.5127652883529663} {"train_loss": -12.243307113647461, "global_step": 354648, "epoch": 2111} {"train_loss": -12.259150505065918, "global_step": 354649, "epoch": 2111} {"train_loss": -12.36206340789795, "global_step": 354650, "epoch": 2111} {"train_loss": -12.229284286499023, "global_step": 354651, "epoch": 2111} {"train_loss": -12.093515396118164, "global_step": 354652, "epoch": 2111} {"train_loss": -12.22706127166748, "global_step": 354653, "epoch": 2111} {"train_loss": -12.009809494018555, "global_step": 354654, "epoch": 2111} {"train_loss": -12.402863502502441, "global_step": 354655, "epoch": 2111} {"train_loss": -12.181716918945312, "global_step": 354656, "epoch": 2111} {"train_loss": -12.374940872192383, "global_step": 354657, "epoch": 2111} {"train_loss": -12.258893966674805, "global_step": 354658, "epoch": 2111} {"train_loss": -12.46043586730957, "global_step": 354659, "epoch": 2111} {"train_loss": -12.409361839294434, "global_step": 354660, "epoch": 2111} {"train_loss": -12.49118423461914, "global_step": 354661, "epoch": 2111} {"train_loss": -12.169326782226562, "global_step": 354662, "epoch": 2111} {"train_loss": -12.554758071899414, "global_step": 354663, "epoch": 2111} {"train_loss": -12.33326244354248, "global_step": 354664, "epoch": 2111} {"train_loss": -12.180070877075195, "global_step": 354665, "epoch": 2111} {"train_loss": -12.269567489624023, "global_step": 354666, "epoch": 2111} {"train_loss": -12.054891586303711, "global_step": 354667, "epoch": 2111} {"train_loss": -11.876632690429688, "global_step": 354668, "epoch": 2111} {"train_loss": -12.191723823547363, "global_step": 354669, "epoch": 2111} {"train_loss": -11.75645637512207, "global_step": 354670, "epoch": 2111} {"train_loss": -12.093006134033203, "global_step": 354671, "epoch": 2111} {"train_loss": -11.874165534973145, "global_step": 354672, "epoch": 2111} {"train_loss": -11.93490982055664, "global_step": 354673, "epoch": 2111} {"train_loss": -12.46474838256836, "global_step": 354674, "epoch": 2111} {"train_loss": -12.40985107421875, "global_step": 354675, "epoch": 2111} {"train_loss": -11.845451354980469, "global_step": 354676, "epoch": 2111} {"train_loss": -12.212872505187988, "global_step": 354677, "epoch": 2111} {"train_loss": -12.051789283752441, "global_step": 354678, "epoch": 2111} {"train_loss": -12.306562423706055, "global_step": 354679, "epoch": 2111} {"train_loss": -11.900793075561523, "global_step": 354680, "epoch": 2111} {"train_loss": -12.243680000305176, "global_step": 354681, "epoch": 2111} {"train_loss": -11.87198257446289, "global_step": 354682, "epoch": 2111} {"train_loss": -12.087457656860352, "global_step": 354683, "epoch": 2111} {"train_loss": -11.58265495300293, "global_step": 354684, "epoch": 2111} {"train_loss": -12.579732894897461, "global_step": 354685, "epoch": 2111} {"train_loss": -11.96088981628418, "global_step": 354686, "epoch": 2111} {"train_loss": -11.98226547241211, "global_step": 354687, "epoch": 2111} {"train_loss": -12.069772720336914, "global_step": 354688, "epoch": 2111} {"train_loss": -12.081794738769531, "global_step": 354689, "epoch": 2111} {"train_loss": -11.938594818115234, "global_step": 354690, "epoch": 2111} {"train_loss": -12.28504467010498, "global_step": 354691, "epoch": 2111} {"train_loss": -12.055563926696777, "global_step": 354692, "epoch": 2111} {"train_loss": -12.414438247680664, "global_step": 354693, "epoch": 2111} {"train_loss": -12.317663192749023, "global_step": 354694, "epoch": 2111} {"train_loss": -12.56973934173584, "global_step": 354695, "epoch": 2111} {"train_loss": -12.054744720458984, "global_step": 354696, "epoch": 2111} {"train_loss": -12.445047378540039, "global_step": 354697, "epoch": 2111} {"train_loss": -12.14955997467041, "global_step": 354698, "epoch": 2111} {"train_loss": -12.421566009521484, "global_step": 354699, "epoch": 2111} {"train_loss": -12.201903343200684, "global_step": 354700, "epoch": 2111} {"train_loss": -12.27145004272461, "global_step": 354701, "epoch": 2111} {"train_loss": -12.45666217803955, "global_step": 354702, "epoch": 2111} {"train_loss": -12.415191650390625, "global_step": 354703, "epoch": 2111} {"train_loss": -12.157341003417969, "global_step": 354704, "epoch": 2111} {"train_loss": -12.11697769165039, "global_step": 354705, "epoch": 2111} {"train_loss": -12.285737037658691, "global_step": 354706, "epoch": 2111} {"train_loss": -12.211057662963867, "global_step": 354707, "epoch": 2111} {"train_loss": -11.983247756958008, "global_step": 354708, "epoch": 2111} {"train_loss": -11.797466278076172, "global_step": 354709, "epoch": 2111} {"train_loss": -12.224956512451172, "global_step": 354710, "epoch": 2111} {"train_loss": -12.219974517822266, "global_step": 354711, "epoch": 2111} {"train_loss": -11.927717208862305, "global_step": 354712, "epoch": 2111} {"train_loss": -11.670591354370117, "global_step": 354713, "epoch": 2111} {"train_loss": -12.335826873779297, "global_step": 354714, "epoch": 2111} {"train_loss": -12.28087043762207, "global_step": 354715, "epoch": 2111} {"train_loss": -11.958720207214355, "global_step": 354716, "epoch": 2111} {"train_loss": -12.419120788574219, "global_step": 354717, "epoch": 2111} {"train_loss": -12.17062759399414, "global_step": 354718, "epoch": 2111} {"train_loss": -12.361092567443848, "global_step": 354719, "epoch": 2111} {"train_loss": -12.154359817504883, "global_step": 354720, "epoch": 2111} {"train_loss": -11.77755069732666, "global_step": 354721, "epoch": 2111} {"train_loss": -12.524559020996094, "global_step": 354722, "epoch": 2111} {"train_loss": -12.487411499023438, "global_step": 354723, "epoch": 2111} {"train_loss": -12.092065811157227, "global_step": 354724, "epoch": 2111} {"train_loss": -12.166885375976562, "global_step": 354725, "epoch": 2111} {"train_loss": -12.265342712402344, "global_step": 354726, "epoch": 2111} {"train_loss": -11.639463424682617, "global_step": 354727, "epoch": 2111} {"train_loss": -11.981090545654297, "global_step": 354728, "epoch": 2111} {"train_loss": -11.83964729309082, "global_step": 354729, "epoch": 2111} {"train_loss": -12.193331718444824, "global_step": 354730, "epoch": 2111} {"train_loss": -12.146097183227539, "global_step": 354731, "epoch": 2111} {"train_loss": -12.058501243591309, "global_step": 354732, "epoch": 2111} {"train_loss": -11.952936172485352, "global_step": 354733, "epoch": 2111} {"train_loss": -12.411011695861816, "global_step": 354734, "epoch": 2111} {"train_loss": -11.824459075927734, "global_step": 354735, "epoch": 2111} {"train_loss": -11.878538131713867, "global_step": 354736, "epoch": 2111} {"train_loss": -11.970489501953125, "global_step": 354737, "epoch": 2111} {"train_loss": -11.637090682983398, "global_step": 354738, "epoch": 2111} {"train_loss": -11.434236526489258, "global_step": 354739, "epoch": 2111} {"train_loss": -11.673778533935547, "global_step": 354740, "epoch": 2111} {"train_loss": -12.132020950317383, "global_step": 354741, "epoch": 2111} {"train_loss": -11.582029342651367, "global_step": 354742, "epoch": 2111} {"train_loss": -12.028766632080078, "global_step": 354743, "epoch": 2111} {"train_loss": -12.131311416625977, "global_step": 354744, "epoch": 2111} {"train_loss": -11.70786190032959, "global_step": 354745, "epoch": 2111} {"train_loss": -11.834005355834961, "global_step": 354746, "epoch": 2111} {"train_loss": -12.369340896606445, "global_step": 354747, "epoch": 2111} {"train_loss": -11.497224807739258, "global_step": 354748, "epoch": 2111} {"train_loss": -11.690587043762207, "global_step": 354749, "epoch": 2111} {"train_loss": -11.992284774780273, "global_step": 354750, "epoch": 2111} {"train_loss": -11.031363487243652, "global_step": 354751, "epoch": 2111} {"train_loss": -12.091105461120605, "global_step": 354752, "epoch": 2111} {"train_loss": -10.716835021972656, "global_step": 354753, "epoch": 2111} {"train_loss": -11.337400436401367, "global_step": 354754, "epoch": 2111} {"train_loss": -11.574941635131836, "global_step": 354755, "epoch": 2111} {"train_loss": -10.8726224899292, "global_step": 354756, "epoch": 2111} {"train_loss": -11.675665855407715, "global_step": 354757, "epoch": 2111} {"train_loss": -9.246631622314453, "global_step": 354758, "epoch": 2111} {"train_loss": -11.918115615844727, "global_step": 354759, "epoch": 2111} {"train_loss": -10.293787002563477, "global_step": 354760, "epoch": 2111} {"train_loss": -11.439361572265625, "global_step": 354761, "epoch": 2111} {"train_loss": -11.03635311126709, "global_step": 354762, "epoch": 2111} {"train_loss": -10.503734588623047, "global_step": 354763, "epoch": 2111} {"train_loss": -10.442354202270508, "global_step": 354764, "epoch": 2111} {"train_loss": -10.18327808380127, "global_step": 354765, "epoch": 2111} {"train_loss": -9.318400382995605, "global_step": 354766, "epoch": 2111} {"train_loss": -11.1119384765625, "global_step": 354767, "epoch": 2111} {"train_loss": -10.056680679321289, "global_step": 354768, "epoch": 2111} {"train_loss": -10.662360191345215, "global_step": 354769, "epoch": 2111} {"train_loss": -11.07384967803955, "global_step": 354770, "epoch": 2111} {"train_loss": -10.494089126586914, "global_step": 354771, "epoch": 2111} {"train_loss": -10.410024642944336, "global_step": 354772, "epoch": 2111} {"train_loss": -10.572336196899414, "global_step": 354773, "epoch": 2111} {"train_loss": -10.274568557739258, "global_step": 354774, "epoch": 2111} {"train_loss": -10.893092155456543, "global_step": 354775, "epoch": 2111} {"train_loss": -9.197002410888672, "global_step": 354776, "epoch": 2111} {"train_loss": -10.622690200805664, "global_step": 354777, "epoch": 2111} {"train_loss": -10.957465171813965, "global_step": 354778, "epoch": 2111} {"train_loss": -10.460991859436035, "global_step": 354779, "epoch": 2111} {"train_loss": -11.474133491516113, "global_step": 354780, "epoch": 2111} {"train_loss": -11.108150482177734, "global_step": 354781, "epoch": 2111} {"train_loss": -10.594179153442383, "global_step": 354782, "epoch": 2111} {"train_loss": -11.854447364807129, "global_step": 354783, "epoch": 2111} {"train_loss": -10.415430068969727, "global_step": 354784, "epoch": 2111} {"train_loss": -11.715963363647461, "global_step": 354785, "epoch": 2111} {"train_loss": -10.815927505493164, "global_step": 354786, "epoch": 2111} {"train_loss": -10.955804824829102, "global_step": 354787, "epoch": 2111} {"train_loss": -10.934965133666992, "global_step": 354788, "epoch": 2111} {"train_loss": -10.645406723022461, "global_step": 354789, "epoch": 2111} {"train_loss": -10.826622009277344, "global_step": 354790, "epoch": 2111} {"train_loss": -10.311065673828125, "global_step": 354791, "epoch": 2111} {"train_loss": -11.36288070678711, "global_step": 354792, "epoch": 2111} {"train_loss": -10.891887664794922, "global_step": 354793, "epoch": 2111} {"train_loss": -11.412538528442383, "global_step": 354794, "epoch": 2111} {"train_loss": -11.253806114196777, "global_step": 354795, "epoch": 2111} {"train_loss": -11.45814037322998, "global_step": 354796, "epoch": 2111} {"train_loss": -11.084662437438965, "global_step": 354797, "epoch": 2111} {"train_loss": -11.955805778503418, "global_step": 354798, "epoch": 2111} {"train_loss": -11.345096588134766, "global_step": 354799, "epoch": 2111} {"train_loss": -12.125539779663086, "global_step": 354800, "epoch": 2111} {"train_loss": -12.017524719238281, "global_step": 354801, "epoch": 2111} {"train_loss": -11.772087097167969, "global_step": 354802, "epoch": 2111} {"train_loss": -11.842222213745117, "global_step": 354803, "epoch": 2111} {"train_loss": -11.74219799041748, "global_step": 354804, "epoch": 2111} {"train_loss": -11.820690155029297, "global_step": 354805, "epoch": 2111} {"train_loss": -12.068073272705078, "global_step": 354806, "epoch": 2111} {"train_loss": -12.059993743896484, "global_step": 354807, "epoch": 2111} {"train_loss": -12.235200881958008, "global_step": 354808, "epoch": 2111} {"train_loss": -12.306146621704102, "global_step": 354809, "epoch": 2111} {"train_loss": -12.097415924072266, "global_step": 354810, "epoch": 2111} {"train_loss": -12.211748123168945, "global_step": 354811, "epoch": 2111} {"train_loss": -11.87757682800293, "global_step": 354812, "epoch": 2111} {"train_loss": -12.020137786865234, "global_step": 354813, "epoch": 2111} {"train_loss": -12.28940200805664, "global_step": 354814, "epoch": 2111} {"train_loss": -11.74654647849855, "global_step": 354815, "epoch": 2111, "val_loss": 287918.34375} {"train_loss": -12.272383689880371, "global_step": 354816, "epoch": 2112} {"train_loss": -12.24578857421875, "global_step": 354817, "epoch": 2112} {"train_loss": -12.210927963256836, "global_step": 354818, "epoch": 2112} {"train_loss": -12.254634857177734, "global_step": 354819, "epoch": 2112} {"train_loss": -12.273066520690918, "global_step": 354820, "epoch": 2112} {"train_loss": -12.210542678833008, "global_step": 354821, "epoch": 2112} {"train_loss": -12.117942810058594, "global_step": 354822, "epoch": 2112} {"train_loss": -12.137575149536133, "global_step": 354823, "epoch": 2112} {"train_loss": -12.336729049682617, "global_step": 354824, "epoch": 2112} {"train_loss": -12.272363662719727, "global_step": 354825, "epoch": 2112} {"train_loss": -12.276137351989746, "global_step": 354826, "epoch": 2112} {"train_loss": -12.20498275756836, "global_step": 354827, "epoch": 2112} {"train_loss": -12.448674201965332, "global_step": 354828, "epoch": 2112} {"train_loss": -12.245388984680176, "global_step": 354829, "epoch": 2112} {"train_loss": -12.314279556274414, "global_step": 354830, "epoch": 2112} {"train_loss": -12.390454292297363, "global_step": 354831, "epoch": 2112} {"train_loss": -12.342238426208496, "global_step": 354832, "epoch": 2112} {"train_loss": -12.478897094726562, "global_step": 354833, "epoch": 2112} {"train_loss": -12.38100814819336, "global_step": 354834, "epoch": 2112} {"train_loss": -12.325753211975098, "global_step": 354835, "epoch": 2112} {"train_loss": -12.299640655517578, "global_step": 354836, "epoch": 2112} {"train_loss": -12.52430534362793, "global_step": 354837, "epoch": 2112} {"train_loss": -12.275861740112305, "global_step": 354838, "epoch": 2112} {"train_loss": -12.493870735168457, "global_step": 354839, "epoch": 2112} {"train_loss": -12.576045036315918, "global_step": 354840, "epoch": 2112} {"train_loss": -12.330490112304688, "global_step": 354841, "epoch": 2112} {"train_loss": -12.364033699035645, "global_step": 354842, "epoch": 2112} {"train_loss": -12.523653984069824, "global_step": 354843, "epoch": 2112} {"train_loss": -12.4552001953125, "global_step": 354844, "epoch": 2112} {"train_loss": -12.624161720275879, "global_step": 354845, "epoch": 2112} {"train_loss": -12.501134872436523, "global_step": 354846, "epoch": 2112} {"train_loss": -12.647724151611328, "global_step": 354847, "epoch": 2112} {"train_loss": -12.460346221923828, "global_step": 354848, "epoch": 2112} {"train_loss": -12.439403533935547, "global_step": 354849, "epoch": 2112} {"train_loss": -12.638141632080078, "global_step": 354850, "epoch": 2112} {"train_loss": -12.187211990356445, "global_step": 354851, "epoch": 2112} {"train_loss": -12.38460922241211, "global_step": 354852, "epoch": 2112} {"train_loss": -12.623623847961426, "global_step": 354853, "epoch": 2112} {"train_loss": -12.416122436523438, "global_step": 354854, "epoch": 2112} {"train_loss": -12.511287689208984, "global_step": 354855, "epoch": 2112} {"train_loss": -12.382333755493164, "global_step": 354856, "epoch": 2112} {"train_loss": -12.393709182739258, "global_step": 354857, "epoch": 2112} {"train_loss": -12.57767391204834, "global_step": 354858, "epoch": 2112} {"train_loss": -12.600290298461914, "global_step": 354859, "epoch": 2112} {"train_loss": -12.603649139404297, "global_step": 354860, "epoch": 2112} {"train_loss": -12.536675453186035, "global_step": 354861, "epoch": 2112} {"train_loss": -12.483139038085938, "global_step": 354862, "epoch": 2112} {"train_loss": -12.487972259521484, "global_step": 354863, "epoch": 2112} {"train_loss": -12.320539474487305, "global_step": 354864, "epoch": 2112} {"train_loss": -12.680009841918945, "global_step": 354865, "epoch": 2112} {"train_loss": -12.426514625549316, "global_step": 354866, "epoch": 2112} {"train_loss": -12.443172454833984, "global_step": 354867, "epoch": 2112} {"train_loss": -12.701546669006348, "global_step": 354868, "epoch": 2112} {"train_loss": -12.565057754516602, "global_step": 354869, "epoch": 2112} {"train_loss": -12.86344051361084, "global_step": 354870, "epoch": 2112} {"train_loss": -12.599194526672363, "global_step": 354871, "epoch": 2112} {"train_loss": -12.502273559570312, "global_step": 354872, "epoch": 2112} {"train_loss": -12.71592903137207, "global_step": 354873, "epoch": 2112} {"train_loss": -12.651824951171875, "global_step": 354874, "epoch": 2112} {"train_loss": -12.788771629333496, "global_step": 354875, "epoch": 2112} {"train_loss": -12.457818984985352, "global_step": 354876, "epoch": 2112} {"train_loss": -12.861809730529785, "global_step": 354877, "epoch": 2112} {"train_loss": -12.706640243530273, "global_step": 354878, "epoch": 2112} {"train_loss": -12.553035736083984, "global_step": 354879, "epoch": 2112} {"train_loss": -12.526803016662598, "global_step": 354880, "epoch": 2112} {"train_loss": -12.68004035949707, "global_step": 354881, "epoch": 2112} {"train_loss": -12.647086143493652, "global_step": 354882, "epoch": 2112} {"train_loss": -12.624868392944336, "global_step": 354883, "epoch": 2112} {"train_loss": -12.622393608093262, "global_step": 354884, "epoch": 2112} {"train_loss": -12.483664512634277, "global_step": 354885, "epoch": 2112} {"train_loss": -12.907720565795898, "global_step": 354886, "epoch": 2112} {"train_loss": -12.17053508758545, "global_step": 354887, "epoch": 2112} {"train_loss": -12.388904571533203, "global_step": 354888, "epoch": 2112} {"train_loss": -12.063404083251953, "global_step": 354889, "epoch": 2112} {"train_loss": -11.921805381774902, "global_step": 354890, "epoch": 2112} {"train_loss": -11.92481803894043, "global_step": 354891, "epoch": 2112} {"train_loss": -12.632089614868164, "global_step": 354892, "epoch": 2112} {"train_loss": -12.004252433776855, "global_step": 354893, "epoch": 2112} {"train_loss": -12.09235954284668, "global_step": 354894, "epoch": 2112} {"train_loss": -12.209678649902344, "global_step": 354895, "epoch": 2112} {"train_loss": -12.120244979858398, "global_step": 354896, "epoch": 2112} {"train_loss": -11.651030540466309, "global_step": 354897, "epoch": 2112} {"train_loss": -11.569479942321777, "global_step": 354898, "epoch": 2112} {"train_loss": -12.161925315856934, "global_step": 354899, "epoch": 2112} {"train_loss": -11.424150466918945, "global_step": 354900, "epoch": 2112} {"train_loss": -10.467155456542969, "global_step": 354901, "epoch": 2112} {"train_loss": -11.01949691772461, "global_step": 354902, "epoch": 2112} {"train_loss": -10.279556274414062, "global_step": 354903, "epoch": 2112} {"train_loss": -11.341829299926758, "global_step": 354904, "epoch": 2112} {"train_loss": -11.133926391601562, "global_step": 354905, "epoch": 2112} {"train_loss": -10.741423606872559, "global_step": 354906, "epoch": 2112} {"train_loss": -10.703470230102539, "global_step": 354907, "epoch": 2112} {"train_loss": -10.692447662353516, "global_step": 354908, "epoch": 2112} {"train_loss": -9.711886405944824, "global_step": 354909, "epoch": 2112} {"train_loss": -8.593849182128906, "global_step": 354910, "epoch": 2112} {"train_loss": -9.978190422058105, "global_step": 354911, "epoch": 2112} {"train_loss": -9.917865753173828, "global_step": 354912, "epoch": 2112} {"train_loss": -10.207250595092773, "global_step": 354913, "epoch": 2112} {"train_loss": -11.075089454650879, "global_step": 354914, "epoch": 2112} {"train_loss": -10.580371856689453, "global_step": 354915, "epoch": 2112} {"train_loss": -9.966135025024414, "global_step": 354916, "epoch": 2112} {"train_loss": -11.192712783813477, "global_step": 354917, "epoch": 2112} {"train_loss": -10.853379249572754, "global_step": 354918, "epoch": 2112} {"train_loss": -10.547204971313477, "global_step": 354919, "epoch": 2112} {"train_loss": -11.278519630432129, "global_step": 354920, "epoch": 2112} {"train_loss": -10.716608047485352, "global_step": 354921, "epoch": 2112} {"train_loss": -11.218513488769531, "global_step": 354922, "epoch": 2112} {"train_loss": -11.34339427947998, "global_step": 354923, "epoch": 2112} {"train_loss": -11.391483306884766, "global_step": 354924, "epoch": 2112} {"train_loss": -11.40594482421875, "global_step": 354925, "epoch": 2112} {"train_loss": -11.16441535949707, "global_step": 354926, "epoch": 2112} {"train_loss": -11.750410079956055, "global_step": 354927, "epoch": 2112} {"train_loss": -11.879159927368164, "global_step": 354928, "epoch": 2112} {"train_loss": -11.898353576660156, "global_step": 354929, "epoch": 2112} {"train_loss": -11.664091110229492, "global_step": 354930, "epoch": 2112} {"train_loss": -12.223636627197266, "global_step": 354931, "epoch": 2112} {"train_loss": -11.924752235412598, "global_step": 354932, "epoch": 2112} {"train_loss": -12.020532608032227, "global_step": 354933, "epoch": 2112} {"train_loss": -11.837617874145508, "global_step": 354934, "epoch": 2112} {"train_loss": -12.01302719116211, "global_step": 354935, "epoch": 2112} {"train_loss": -11.84410285949707, "global_step": 354936, "epoch": 2112} {"train_loss": -11.550701141357422, "global_step": 354937, "epoch": 2112} {"train_loss": -12.110377311706543, "global_step": 354938, "epoch": 2112} {"train_loss": -11.829181671142578, "global_step": 354939, "epoch": 2112} {"train_loss": -12.215566635131836, "global_step": 354940, "epoch": 2112} {"train_loss": -11.878311157226562, "global_step": 354941, "epoch": 2112} {"train_loss": -12.33959674835205, "global_step": 354942, "epoch": 2112} {"train_loss": -11.552386283874512, "global_step": 354943, "epoch": 2112} {"train_loss": -12.149273872375488, "global_step": 354944, "epoch": 2112} {"train_loss": -11.644397735595703, "global_step": 354945, "epoch": 2112} {"train_loss": -12.341760635375977, "global_step": 354946, "epoch": 2112} {"train_loss": -11.802936553955078, "global_step": 354947, "epoch": 2112} {"train_loss": -12.30490493774414, "global_step": 354948, "epoch": 2112} {"train_loss": -11.923957824707031, "global_step": 354949, "epoch": 2112} {"train_loss": -12.27029037475586, "global_step": 354950, "epoch": 2112} {"train_loss": -11.89202880859375, "global_step": 354951, "epoch": 2112} {"train_loss": -12.348960876464844, "global_step": 354952, "epoch": 2112} {"train_loss": -12.158063888549805, "global_step": 354953, "epoch": 2112} {"train_loss": -12.381891250610352, "global_step": 354954, "epoch": 2112} {"train_loss": -12.275348663330078, "global_step": 354955, "epoch": 2112} {"train_loss": -12.460968017578125, "global_step": 354956, "epoch": 2112} {"train_loss": -12.316855430603027, "global_step": 354957, "epoch": 2112} {"train_loss": -12.381489753723145, "global_step": 354958, "epoch": 2112} {"train_loss": -12.398841857910156, "global_step": 354959, "epoch": 2112} {"train_loss": -12.264232635498047, "global_step": 354960, "epoch": 2112} {"train_loss": -12.341033935546875, "global_step": 354961, "epoch": 2112} {"train_loss": -12.406691551208496, "global_step": 354962, "epoch": 2112} {"train_loss": -12.49133014678955, "global_step": 354963, "epoch": 2112} {"train_loss": -12.39874267578125, "global_step": 354964, "epoch": 2112} {"train_loss": -12.396688461303711, "global_step": 354965, "epoch": 2112} {"train_loss": -12.54017448425293, "global_step": 354966, "epoch": 2112} {"train_loss": -12.322942733764648, "global_step": 354967, "epoch": 2112} {"train_loss": -12.41476821899414, "global_step": 354968, "epoch": 2112} {"train_loss": -12.580620765686035, "global_step": 354969, "epoch": 2112} {"train_loss": -12.405794143676758, "global_step": 354970, "epoch": 2112} {"train_loss": -12.600622177124023, "global_step": 354971, "epoch": 2112} {"train_loss": -12.427438735961914, "global_step": 354972, "epoch": 2112} {"train_loss": -12.354368209838867, "global_step": 354973, "epoch": 2112} {"train_loss": -12.69959831237793, "global_step": 354974, "epoch": 2112} {"train_loss": -12.104004859924316, "global_step": 354975, "epoch": 2112} {"train_loss": -11.96189022064209, "global_step": 354976, "epoch": 2112} {"train_loss": -12.551666259765625, "global_step": 354977, "epoch": 2112} {"train_loss": -11.835962295532227, "global_step": 354978, "epoch": 2112} {"train_loss": -12.162859916687012, "global_step": 354979, "epoch": 2112} {"train_loss": -12.090425491333008, "global_step": 354980, "epoch": 2112} {"train_loss": -12.29642391204834, "global_step": 354981, "epoch": 2112} {"train_loss": -12.087496757507324, "global_step": 354982, "epoch": 2112} {"train_loss": -12.052038516317095, "global_step": 354983, "epoch": 2112, "val_loss": 290165.0} {"train_loss": -12.169022560119629, "global_step": 354984, "epoch": 2113} {"train_loss": -12.424580574035645, "global_step": 354985, "epoch": 2113} {"train_loss": -12.4453763961792, "global_step": 354986, "epoch": 2113} {"train_loss": -12.473612785339355, "global_step": 354987, "epoch": 2113} {"train_loss": -12.178715705871582, "global_step": 354988, "epoch": 2113} {"train_loss": -12.68231201171875, "global_step": 354989, "epoch": 2113} {"train_loss": -12.303119659423828, "global_step": 354990, "epoch": 2113} {"train_loss": -12.579292297363281, "global_step": 354991, "epoch": 2113} {"train_loss": -12.404186248779297, "global_step": 354992, "epoch": 2113} {"train_loss": -12.459447860717773, "global_step": 354993, "epoch": 2113} {"train_loss": -12.345438957214355, "global_step": 354994, "epoch": 2113} {"train_loss": -12.406253814697266, "global_step": 354995, "epoch": 2113} {"train_loss": -12.331535339355469, "global_step": 354996, "epoch": 2113} {"train_loss": -12.218339920043945, "global_step": 354997, "epoch": 2113} {"train_loss": -12.401298522949219, "global_step": 354998, "epoch": 2113} {"train_loss": -12.113984107971191, "global_step": 354999, "epoch": 2113} {"train_loss": -12.501094818115234, "global_step": 355000, "epoch": 2113} {"train_loss": -12.436050415039062, "global_step": 355001, "epoch": 2113} {"train_loss": -12.488495826721191, "global_step": 355002, "epoch": 2113} {"train_loss": -12.587292671203613, "global_step": 355003, "epoch": 2113} {"train_loss": -12.356447219848633, "global_step": 355004, "epoch": 2113} {"train_loss": -12.456647872924805, "global_step": 355005, "epoch": 2113} {"train_loss": -12.609386444091797, "global_step": 355006, "epoch": 2113} {"train_loss": -12.539405822753906, "global_step": 355007, "epoch": 2113} {"train_loss": -12.529690742492676, "global_step": 355008, "epoch": 2113} {"train_loss": -12.516990661621094, "global_step": 355009, "epoch": 2113} {"train_loss": -12.091851234436035, "global_step": 355010, "epoch": 2113} {"train_loss": -11.34304428100586, "global_step": 355011, "epoch": 2113} {"train_loss": -11.938573837280273, "global_step": 355012, "epoch": 2113} {"train_loss": -11.874698638916016, "global_step": 355013, "epoch": 2113} {"train_loss": -11.614570617675781, "global_step": 355014, "epoch": 2113} {"train_loss": -11.330659866333008, "global_step": 355015, "epoch": 2113} {"train_loss": -12.194162368774414, "global_step": 355016, "epoch": 2113} {"train_loss": -12.12134075164795, "global_step": 355017, "epoch": 2113} {"train_loss": -11.805017471313477, "global_step": 355018, "epoch": 2113} {"train_loss": -9.635933876037598, "global_step": 355019, "epoch": 2113} {"train_loss": -11.184814453125, "global_step": 355020, "epoch": 2113} {"train_loss": -8.324798583984375, "global_step": 355021, "epoch": 2113} {"train_loss": -10.341791152954102, "global_step": 355022, "epoch": 2113} {"train_loss": -10.395428657531738, "global_step": 355023, "epoch": 2113} {"train_loss": -10.388524055480957, "global_step": 355024, "epoch": 2113} {"train_loss": -8.786242485046387, "global_step": 355025, "epoch": 2113} {"train_loss": -9.370858192443848, "global_step": 355026, "epoch": 2113} {"train_loss": -9.712867736816406, "global_step": 355027, "epoch": 2113} {"train_loss": -9.035390853881836, "global_step": 355028, "epoch": 2113} {"train_loss": -9.319381713867188, "global_step": 355029, "epoch": 2113} {"train_loss": -7.832036018371582, "global_step": 355030, "epoch": 2113} {"train_loss": -11.298337936401367, "global_step": 355031, "epoch": 2113} {"train_loss": -8.142614364624023, "global_step": 355032, "epoch": 2113} {"train_loss": -7.899686336517334, "global_step": 355033, "epoch": 2113} {"train_loss": -8.693735122680664, "global_step": 355034, "epoch": 2113} {"train_loss": -10.278507232666016, "global_step": 355035, "epoch": 2113} {"train_loss": -9.200672149658203, "global_step": 355036, "epoch": 2113} {"train_loss": -10.137304306030273, "global_step": 355037, "epoch": 2113} {"train_loss": -10.354530334472656, "global_step": 355038, "epoch": 2113} {"train_loss": -10.566908836364746, "global_step": 355039, "epoch": 2113} {"train_loss": -10.492962837219238, "global_step": 355040, "epoch": 2113} {"train_loss": -10.938724517822266, "global_step": 355041, "epoch": 2113} {"train_loss": -10.817108154296875, "global_step": 355042, "epoch": 2113} {"train_loss": -10.615608215332031, "global_step": 355043, "epoch": 2113} {"train_loss": -11.09201431274414, "global_step": 355044, "epoch": 2113} {"train_loss": -11.084924697875977, "global_step": 355045, "epoch": 2113} {"train_loss": -11.769916534423828, "global_step": 355046, "epoch": 2113} {"train_loss": -11.698012351989746, "global_step": 355047, "epoch": 2113} {"train_loss": -11.452874183654785, "global_step": 355048, "epoch": 2113} {"train_loss": -11.855969429016113, "global_step": 355049, "epoch": 2113} {"train_loss": -11.73205280303955, "global_step": 355050, "epoch": 2113} {"train_loss": -11.644388198852539, "global_step": 355051, "epoch": 2113} {"train_loss": -11.757804870605469, "global_step": 355052, "epoch": 2113} {"train_loss": -11.644207954406738, "global_step": 355053, "epoch": 2113} {"train_loss": -11.62341594696045, "global_step": 355054, "epoch": 2113} {"train_loss": -11.810944557189941, "global_step": 355055, "epoch": 2113} {"train_loss": -12.005417823791504, "global_step": 355056, "epoch": 2113} {"train_loss": -11.887495994567871, "global_step": 355057, "epoch": 2113} {"train_loss": -12.008541107177734, "global_step": 355058, "epoch": 2113} {"train_loss": -11.995990753173828, "global_step": 355059, "epoch": 2113} {"train_loss": -11.990821838378906, "global_step": 355060, "epoch": 2113} {"train_loss": -11.957435607910156, "global_step": 355061, "epoch": 2113} {"train_loss": -11.995774269104004, "global_step": 355062, "epoch": 2113} {"train_loss": -12.087690353393555, "global_step": 355063, "epoch": 2113} {"train_loss": -12.276143074035645, "global_step": 355064, "epoch": 2113} {"train_loss": -11.85126781463623, "global_step": 355065, "epoch": 2113} {"train_loss": -12.182451248168945, "global_step": 355066, "epoch": 2113} {"train_loss": -12.28763198852539, "global_step": 355067, "epoch": 2113} {"train_loss": -11.927473068237305, "global_step": 355068, "epoch": 2113} {"train_loss": -12.131633758544922, "global_step": 355069, "epoch": 2113} {"train_loss": -12.227859497070312, "global_step": 355070, "epoch": 2113} {"train_loss": -12.140271186828613, "global_step": 355071, "epoch": 2113} {"train_loss": -12.119757652282715, "global_step": 355072, "epoch": 2113} {"train_loss": -12.121728897094727, "global_step": 355073, "epoch": 2113} {"train_loss": -12.186408996582031, "global_step": 355074, "epoch": 2113} {"train_loss": -12.144582748413086, "global_step": 355075, "epoch": 2113} {"train_loss": -12.061491012573242, "global_step": 355076, "epoch": 2113} {"train_loss": -12.24156379699707, "global_step": 355077, "epoch": 2113} {"train_loss": -12.137886047363281, "global_step": 355078, "epoch": 2113} {"train_loss": -12.301456451416016, "global_step": 355079, "epoch": 2113} {"train_loss": -12.128753662109375, "global_step": 355080, "epoch": 2113} {"train_loss": -12.179174423217773, "global_step": 355081, "epoch": 2113} {"train_loss": -12.164804458618164, "global_step": 355082, "epoch": 2113} {"train_loss": -12.326570510864258, "global_step": 355083, "epoch": 2113} {"train_loss": -12.195770263671875, "global_step": 355084, "epoch": 2113} {"train_loss": -12.141870498657227, "global_step": 355085, "epoch": 2113} {"train_loss": -12.35118293762207, "global_step": 355086, "epoch": 2113} {"train_loss": -12.27580451965332, "global_step": 355087, "epoch": 2113} {"train_loss": -12.056282997131348, "global_step": 355088, "epoch": 2113} {"train_loss": -12.284143447875977, "global_step": 355089, "epoch": 2113} {"train_loss": -12.28388786315918, "global_step": 355090, "epoch": 2113} {"train_loss": -12.497443199157715, "global_step": 355091, "epoch": 2113} {"train_loss": -12.450299263000488, "global_step": 355092, "epoch": 2113} {"train_loss": -12.386463165283203, "global_step": 355093, "epoch": 2113} {"train_loss": -12.160453796386719, "global_step": 355094, "epoch": 2113} {"train_loss": -12.279821395874023, "global_step": 355095, "epoch": 2113} {"train_loss": -12.257282257080078, "global_step": 355096, "epoch": 2113} {"train_loss": -12.39521312713623, "global_step": 355097, "epoch": 2113} {"train_loss": -12.549236297607422, "global_step": 355098, "epoch": 2113} {"train_loss": -12.410099029541016, "global_step": 355099, "epoch": 2113} {"train_loss": -12.347841262817383, "global_step": 355100, "epoch": 2113} {"train_loss": -12.307093620300293, "global_step": 355101, "epoch": 2113} {"train_loss": -12.201826095581055, "global_step": 355102, "epoch": 2113} {"train_loss": -12.341730117797852, "global_step": 355103, "epoch": 2113} {"train_loss": -12.295692443847656, "global_step": 355104, "epoch": 2113} {"train_loss": -12.285701751708984, "global_step": 355105, "epoch": 2113} {"train_loss": -12.410280227661133, "global_step": 355106, "epoch": 2113} {"train_loss": -12.195402145385742, "global_step": 355107, "epoch": 2113} {"train_loss": -12.59808349609375, "global_step": 355108, "epoch": 2113} {"train_loss": -12.317160606384277, "global_step": 355109, "epoch": 2113} {"train_loss": -12.368232727050781, "global_step": 355110, "epoch": 2113} {"train_loss": -12.52873420715332, "global_step": 355111, "epoch": 2113} {"train_loss": -12.432613372802734, "global_step": 355112, "epoch": 2113} {"train_loss": -12.101399421691895, "global_step": 355113, "epoch": 2113} {"train_loss": -12.610006332397461, "global_step": 355114, "epoch": 2113} {"train_loss": -12.436933517456055, "global_step": 355115, "epoch": 2113} {"train_loss": -12.63650894165039, "global_step": 355116, "epoch": 2113} {"train_loss": -12.4271821975708, "global_step": 355117, "epoch": 2113} {"train_loss": -12.289066314697266, "global_step": 355118, "epoch": 2113} {"train_loss": -12.152312278747559, "global_step": 355119, "epoch": 2113} {"train_loss": -12.500995635986328, "global_step": 355120, "epoch": 2113} {"train_loss": -11.853132247924805, "global_step": 355121, "epoch": 2113} {"train_loss": -12.20051383972168, "global_step": 355122, "epoch": 2113} {"train_loss": -12.541622161865234, "global_step": 355123, "epoch": 2113} {"train_loss": -11.646782875061035, "global_step": 355124, "epoch": 2113} {"train_loss": -12.273061752319336, "global_step": 355125, "epoch": 2113} {"train_loss": -12.097236633300781, "global_step": 355126, "epoch": 2113} {"train_loss": -12.401803970336914, "global_step": 355127, "epoch": 2113} {"train_loss": -12.180232048034668, "global_step": 355128, "epoch": 2113} {"train_loss": -12.273774147033691, "global_step": 355129, "epoch": 2113} {"train_loss": -11.943169593811035, "global_step": 355130, "epoch": 2113} {"train_loss": -12.031929016113281, "global_step": 355131, "epoch": 2113} {"train_loss": -12.157657623291016, "global_step": 355132, "epoch": 2113} {"train_loss": -11.817957878112793, "global_step": 355133, "epoch": 2113} {"train_loss": -12.197734832763672, "global_step": 355134, "epoch": 2113} {"train_loss": -12.442989349365234, "global_step": 355135, "epoch": 2113} {"train_loss": -11.917041778564453, "global_step": 355136, "epoch": 2113} {"train_loss": -11.68655776977539, "global_step": 355137, "epoch": 2113} {"train_loss": -11.694851875305176, "global_step": 355138, "epoch": 2113} {"train_loss": -12.182518005371094, "global_step": 355139, "epoch": 2113} {"train_loss": -12.19080638885498, "global_step": 355140, "epoch": 2113} {"train_loss": -12.048879623413086, "global_step": 355141, "epoch": 2113} {"train_loss": -11.928550720214844, "global_step": 355142, "epoch": 2113} {"train_loss": -12.083575248718262, "global_step": 355143, "epoch": 2113} {"train_loss": -11.543947219848633, "global_step": 355144, "epoch": 2113} {"train_loss": -11.41883659362793, "global_step": 355145, "epoch": 2113} {"train_loss": -11.98520278930664, "global_step": 355146, "epoch": 2113} {"train_loss": -11.909462928771973, "global_step": 355147, "epoch": 2113} {"train_loss": -10.193084716796875, "global_step": 355148, "epoch": 2113} {"train_loss": -11.081682205200195, "global_step": 355149, "epoch": 2113} {"train_loss": -12.327787399291992, "global_step": 355150, "epoch": 2113} {"train_loss": -11.773294082709722, "global_step": 355151, "epoch": 2113, "val_loss": 287772.125} {"train_loss": -11.887054443359375, "global_step": 355152, "epoch": 2114} {"train_loss": -12.608648300170898, "global_step": 355153, "epoch": 2114} {"train_loss": -11.805039405822754, "global_step": 355154, "epoch": 2114} {"train_loss": -11.475469589233398, "global_step": 355155, "epoch": 2114} {"train_loss": -11.786482810974121, "global_step": 355156, "epoch": 2114} {"train_loss": -12.06810188293457, "global_step": 355157, "epoch": 2114} {"train_loss": -11.069061279296875, "global_step": 355158, "epoch": 2114} {"train_loss": -10.823562622070312, "global_step": 355159, "epoch": 2114} {"train_loss": -12.049179077148438, "global_step": 355160, "epoch": 2114} {"train_loss": -11.1675443649292, "global_step": 355161, "epoch": 2114} {"train_loss": -11.904762268066406, "global_step": 355162, "epoch": 2114} {"train_loss": -10.786455154418945, "global_step": 355163, "epoch": 2114} {"train_loss": -11.79582691192627, "global_step": 355164, "epoch": 2114} {"train_loss": -11.38641357421875, "global_step": 355165, "epoch": 2114} {"train_loss": -11.750460624694824, "global_step": 355166, "epoch": 2114} {"train_loss": -11.820938110351562, "global_step": 355167, "epoch": 2114} {"train_loss": -10.87338924407959, "global_step": 355168, "epoch": 2114} {"train_loss": -11.648961067199707, "global_step": 355169, "epoch": 2114} {"train_loss": -11.339370727539062, "global_step": 355170, "epoch": 2114} {"train_loss": -10.869629859924316, "global_step": 355171, "epoch": 2114} {"train_loss": -11.560956954956055, "global_step": 355172, "epoch": 2114} {"train_loss": -10.801024436950684, "global_step": 355173, "epoch": 2114} {"train_loss": -11.45865249633789, "global_step": 355174, "epoch": 2114} {"train_loss": -10.80230712890625, "global_step": 355175, "epoch": 2114} {"train_loss": -11.792755126953125, "global_step": 355176, "epoch": 2114} {"train_loss": -11.769704818725586, "global_step": 355177, "epoch": 2114} {"train_loss": -11.285201072692871, "global_step": 355178, "epoch": 2114} {"train_loss": -12.001970291137695, "global_step": 355179, "epoch": 2114} {"train_loss": -11.672078132629395, "global_step": 355180, "epoch": 2114} {"train_loss": -11.170722961425781, "global_step": 355181, "epoch": 2114} {"train_loss": -12.146947860717773, "global_step": 355182, "epoch": 2114} {"train_loss": -11.19111442565918, "global_step": 355183, "epoch": 2114} {"train_loss": -11.96619701385498, "global_step": 355184, "epoch": 2114} {"train_loss": -11.716943740844727, "global_step": 355185, "epoch": 2114} {"train_loss": -11.873056411743164, "global_step": 355186, "epoch": 2114} {"train_loss": -12.023797035217285, "global_step": 355187, "epoch": 2114} {"train_loss": -11.655694007873535, "global_step": 355188, "epoch": 2114} {"train_loss": -12.010041236877441, "global_step": 355189, "epoch": 2114} {"train_loss": -11.541326522827148, "global_step": 355190, "epoch": 2114} {"train_loss": -12.458799362182617, "global_step": 355191, "epoch": 2114} {"train_loss": -11.832368850708008, "global_step": 355192, "epoch": 2114} {"train_loss": -12.327507019042969, "global_step": 355193, "epoch": 2114} {"train_loss": -12.073439598083496, "global_step": 355194, "epoch": 2114} {"train_loss": -12.181062698364258, "global_step": 355195, "epoch": 2114} {"train_loss": -11.794624328613281, "global_step": 355196, "epoch": 2114} {"train_loss": -12.276557922363281, "global_step": 355197, "epoch": 2114} {"train_loss": -12.352642059326172, "global_step": 355198, "epoch": 2114} {"train_loss": -12.094549179077148, "global_step": 355199, "epoch": 2114} {"train_loss": -12.31100845336914, "global_step": 355200, "epoch": 2114} {"train_loss": -12.330692291259766, "global_step": 355201, "epoch": 2114} {"train_loss": -12.216392517089844, "global_step": 355202, "epoch": 2114} {"train_loss": -12.054710388183594, "global_step": 355203, "epoch": 2114} {"train_loss": -12.50053596496582, "global_step": 355204, "epoch": 2114} {"train_loss": -12.037376403808594, "global_step": 355205, "epoch": 2114} {"train_loss": -12.289922714233398, "global_step": 355206, "epoch": 2114} {"train_loss": -12.477191925048828, "global_step": 355207, "epoch": 2114} {"train_loss": -12.322837829589844, "global_step": 355208, "epoch": 2114} {"train_loss": -12.55059814453125, "global_step": 355209, "epoch": 2114} {"train_loss": -12.13199234008789, "global_step": 355210, "epoch": 2114} {"train_loss": -12.462376594543457, "global_step": 355211, "epoch": 2114} {"train_loss": -12.1976957321167, "global_step": 355212, "epoch": 2114} {"train_loss": -12.374515533447266, "global_step": 355213, "epoch": 2114} {"train_loss": -12.114541053771973, "global_step": 355214, "epoch": 2114} {"train_loss": -12.17595386505127, "global_step": 355215, "epoch": 2114} {"train_loss": -12.566852569580078, "global_step": 355216, "epoch": 2114} {"train_loss": -11.920684814453125, "global_step": 355217, "epoch": 2114} {"train_loss": -12.32728385925293, "global_step": 355218, "epoch": 2114} {"train_loss": -11.9091157913208, "global_step": 355219, "epoch": 2114} {"train_loss": -12.008960723876953, "global_step": 355220, "epoch": 2114} {"train_loss": -12.351821899414062, "global_step": 355221, "epoch": 2114} {"train_loss": -12.247735023498535, "global_step": 355222, "epoch": 2114} {"train_loss": -12.09434986114502, "global_step": 355223, "epoch": 2114} {"train_loss": -11.684038162231445, "global_step": 355224, "epoch": 2114} {"train_loss": -11.93464469909668, "global_step": 355225, "epoch": 2114} {"train_loss": -11.621435165405273, "global_step": 355226, "epoch": 2114} {"train_loss": -12.285210609436035, "global_step": 355227, "epoch": 2114} {"train_loss": -11.643389701843262, "global_step": 355228, "epoch": 2114} {"train_loss": -12.491096496582031, "global_step": 355229, "epoch": 2114} {"train_loss": -11.581036567687988, "global_step": 355230, "epoch": 2114} {"train_loss": -11.927982330322266, "global_step": 355231, "epoch": 2114} {"train_loss": -12.364381790161133, "global_step": 355232, "epoch": 2114} {"train_loss": -11.795286178588867, "global_step": 355233, "epoch": 2114} {"train_loss": -12.212848663330078, "global_step": 355234, "epoch": 2114} {"train_loss": -12.291291236877441, "global_step": 355235, "epoch": 2114} {"train_loss": -12.501924514770508, "global_step": 355236, "epoch": 2114} {"train_loss": -12.156377792358398, "global_step": 355237, "epoch": 2114} {"train_loss": -12.465843200683594, "global_step": 355238, "epoch": 2114} {"train_loss": -12.478260040283203, "global_step": 355239, "epoch": 2114} {"train_loss": -12.415413856506348, "global_step": 355240, "epoch": 2114} {"train_loss": -12.263443946838379, "global_step": 355241, "epoch": 2114} {"train_loss": -12.40412712097168, "global_step": 355242, "epoch": 2114} {"train_loss": -12.399871826171875, "global_step": 355243, "epoch": 2114} {"train_loss": -12.395459175109863, "global_step": 355244, "epoch": 2114} {"train_loss": -12.411752700805664, "global_step": 355245, "epoch": 2114} {"train_loss": -12.394033432006836, "global_step": 355246, "epoch": 2114} {"train_loss": -12.372105598449707, "global_step": 355247, "epoch": 2114} {"train_loss": -12.433263778686523, "global_step": 355248, "epoch": 2114} {"train_loss": -12.43574047088623, "global_step": 355249, "epoch": 2114} {"train_loss": -12.221111297607422, "global_step": 355250, "epoch": 2114} {"train_loss": -12.360504150390625, "global_step": 355251, "epoch": 2114} {"train_loss": -12.431608200073242, "global_step": 355252, "epoch": 2114} {"train_loss": -12.193998336791992, "global_step": 355253, "epoch": 2114} {"train_loss": -12.4375, "global_step": 355254, "epoch": 2114} {"train_loss": -11.52482795715332, "global_step": 355255, "epoch": 2114} {"train_loss": -12.378040313720703, "global_step": 355256, "epoch": 2114} {"train_loss": -12.18832015991211, "global_step": 355257, "epoch": 2114} {"train_loss": -12.170980453491211, "global_step": 355258, "epoch": 2114} {"train_loss": -12.329056739807129, "global_step": 355259, "epoch": 2114} {"train_loss": -12.12140941619873, "global_step": 355260, "epoch": 2114} {"train_loss": -12.04570198059082, "global_step": 355261, "epoch": 2114} {"train_loss": -12.587031364440918, "global_step": 355262, "epoch": 2114} {"train_loss": -12.611968994140625, "global_step": 355263, "epoch": 2114} {"train_loss": -12.423067092895508, "global_step": 355264, "epoch": 2114} {"train_loss": -12.656769752502441, "global_step": 355265, "epoch": 2114} {"train_loss": -12.176166534423828, "global_step": 355266, "epoch": 2114} {"train_loss": -12.546126365661621, "global_step": 355267, "epoch": 2114} {"train_loss": -12.155746459960938, "global_step": 355268, "epoch": 2114} {"train_loss": -11.9016695022583, "global_step": 355269, "epoch": 2114} {"train_loss": -12.203106880187988, "global_step": 355270, "epoch": 2114} {"train_loss": -12.487592697143555, "global_step": 355271, "epoch": 2114} {"train_loss": -12.131587028503418, "global_step": 355272, "epoch": 2114} {"train_loss": -12.031344413757324, "global_step": 355273, "epoch": 2114} {"train_loss": -12.563241004943848, "global_step": 355274, "epoch": 2114} {"train_loss": -12.04482650756836, "global_step": 355275, "epoch": 2114} {"train_loss": -12.271076202392578, "global_step": 355276, "epoch": 2114} {"train_loss": -12.321964263916016, "global_step": 355277, "epoch": 2114} {"train_loss": -12.30496883392334, "global_step": 355278, "epoch": 2114} {"train_loss": -11.726768493652344, "global_step": 355279, "epoch": 2114} {"train_loss": -12.527103424072266, "global_step": 355280, "epoch": 2114} {"train_loss": -12.363471984863281, "global_step": 355281, "epoch": 2114} {"train_loss": -12.346203804016113, "global_step": 355282, "epoch": 2114} {"train_loss": -12.571035385131836, "global_step": 355283, "epoch": 2114} {"train_loss": -12.414432525634766, "global_step": 355284, "epoch": 2114} {"train_loss": -12.429178237915039, "global_step": 355285, "epoch": 2114} {"train_loss": -12.197052955627441, "global_step": 355286, "epoch": 2114} {"train_loss": -12.297600746154785, "global_step": 355287, "epoch": 2114} {"train_loss": -12.370615005493164, "global_step": 355288, "epoch": 2114} {"train_loss": -11.532456398010254, "global_step": 355289, "epoch": 2114} {"train_loss": -12.003297805786133, "global_step": 355290, "epoch": 2114} {"train_loss": -11.495797157287598, "global_step": 355291, "epoch": 2114} {"train_loss": -11.828847885131836, "global_step": 355292, "epoch": 2114} {"train_loss": -12.148136138916016, "global_step": 355293, "epoch": 2114} {"train_loss": -12.6084623336792, "global_step": 355294, "epoch": 2114} {"train_loss": -12.264396667480469, "global_step": 355295, "epoch": 2114} {"train_loss": -11.545475006103516, "global_step": 355296, "epoch": 2114} {"train_loss": -11.69649600982666, "global_step": 355297, "epoch": 2114} {"train_loss": -11.61878776550293, "global_step": 355298, "epoch": 2114} {"train_loss": -11.788695335388184, "global_step": 355299, "epoch": 2114} {"train_loss": -10.386754035949707, "global_step": 355300, "epoch": 2114} {"train_loss": -10.624795913696289, "global_step": 355301, "epoch": 2114} {"train_loss": -10.718158721923828, "global_step": 355302, "epoch": 2114} {"train_loss": -10.206808090209961, "global_step": 355303, "epoch": 2114} {"train_loss": -9.338676452636719, "global_step": 355304, "epoch": 2114} {"train_loss": -11.386218070983887, "global_step": 355305, "epoch": 2114} {"train_loss": -10.725423812866211, "global_step": 355306, "epoch": 2114} {"train_loss": -10.673978805541992, "global_step": 355307, "epoch": 2114} {"train_loss": -9.61872673034668, "global_step": 355308, "epoch": 2114} {"train_loss": -10.409842491149902, "global_step": 355309, "epoch": 2114} {"train_loss": -9.55310344696045, "global_step": 355310, "epoch": 2114} {"train_loss": -9.895893096923828, "global_step": 355311, "epoch": 2114} {"train_loss": -10.27775764465332, "global_step": 355312, "epoch": 2114} {"train_loss": -10.59478759765625, "global_step": 355313, "epoch": 2114} {"train_loss": -9.922904968261719, "global_step": 355314, "epoch": 2114} {"train_loss": -11.263835906982422, "global_step": 355315, "epoch": 2114} {"train_loss": -9.529394149780273, "global_step": 355316, "epoch": 2114} {"train_loss": -10.970030784606934, "global_step": 355317, "epoch": 2114} {"train_loss": -10.061932563781738, "global_step": 355318, "epoch": 2114} {"train_loss": -11.837108186313085, "global_step": 355319, "epoch": 2114, "val_loss": 283220.375} {"train_loss": -10.994041442871094, "global_step": 355320, "epoch": 2115} {"train_loss": -10.708695411682129, "global_step": 355321, "epoch": 2115} {"train_loss": -10.849499702453613, "global_step": 355322, "epoch": 2115} {"train_loss": -9.976987838745117, "global_step": 355323, "epoch": 2115} {"train_loss": -11.279903411865234, "global_step": 355324, "epoch": 2115} {"train_loss": -10.005704879760742, "global_step": 355325, "epoch": 2115} {"train_loss": -11.118666648864746, "global_step": 355326, "epoch": 2115} {"train_loss": -10.805074691772461, "global_step": 355327, "epoch": 2115} {"train_loss": -11.195650100708008, "global_step": 355328, "epoch": 2115} {"train_loss": -10.457494735717773, "global_step": 355329, "epoch": 2115} {"train_loss": -11.233827590942383, "global_step": 355330, "epoch": 2115} {"train_loss": -11.258356094360352, "global_step": 355331, "epoch": 2115} {"train_loss": -11.198933601379395, "global_step": 355332, "epoch": 2115} {"train_loss": -11.482338905334473, "global_step": 355333, "epoch": 2115} {"train_loss": -10.74957275390625, "global_step": 355334, "epoch": 2115} {"train_loss": -12.029708862304688, "global_step": 355335, "epoch": 2115} {"train_loss": -11.022928237915039, "global_step": 355336, "epoch": 2115} {"train_loss": -11.728693008422852, "global_step": 355337, "epoch": 2115} {"train_loss": -11.38055419921875, "global_step": 355338, "epoch": 2115} {"train_loss": -11.124893188476562, "global_step": 355339, "epoch": 2115} {"train_loss": -10.865763664245605, "global_step": 355340, "epoch": 2115} {"train_loss": -11.736956596374512, "global_step": 355341, "epoch": 2115} {"train_loss": -10.660531997680664, "global_step": 355342, "epoch": 2115} {"train_loss": -11.521626472473145, "global_step": 355343, "epoch": 2115} {"train_loss": -11.47266960144043, "global_step": 355344, "epoch": 2115} {"train_loss": -11.2051420211792, "global_step": 355345, "epoch": 2115} {"train_loss": -12.11235237121582, "global_step": 355346, "epoch": 2115} {"train_loss": -11.225987434387207, "global_step": 355347, "epoch": 2115} {"train_loss": -11.785210609436035, "global_step": 355348, "epoch": 2115} {"train_loss": -11.626907348632812, "global_step": 355349, "epoch": 2115} {"train_loss": -11.787263870239258, "global_step": 355350, "epoch": 2115} {"train_loss": -11.754863739013672, "global_step": 355351, "epoch": 2115} {"train_loss": -11.64755630493164, "global_step": 355352, "epoch": 2115} {"train_loss": -11.7540922164917, "global_step": 355353, "epoch": 2115} {"train_loss": -11.968125343322754, "global_step": 355354, "epoch": 2115} {"train_loss": -12.107648849487305, "global_step": 355355, "epoch": 2115} {"train_loss": -11.915328979492188, "global_step": 355356, "epoch": 2115} {"train_loss": -12.326671600341797, "global_step": 355357, "epoch": 2115} {"train_loss": -12.10131549835205, "global_step": 355358, "epoch": 2115} {"train_loss": -12.189826011657715, "global_step": 355359, "epoch": 2115} {"train_loss": -12.217540740966797, "global_step": 355360, "epoch": 2115} {"train_loss": -12.345949172973633, "global_step": 355361, "epoch": 2115} {"train_loss": -12.23241138458252, "global_step": 355362, "epoch": 2115} {"train_loss": -12.293790817260742, "global_step": 355363, "epoch": 2115} {"train_loss": -12.184664726257324, "global_step": 355364, "epoch": 2115} {"train_loss": -12.104048728942871, "global_step": 355365, "epoch": 2115} {"train_loss": -12.181336402893066, "global_step": 355366, "epoch": 2115} {"train_loss": -12.349011421203613, "global_step": 355367, "epoch": 2115} {"train_loss": -12.346833229064941, "global_step": 355368, "epoch": 2115} {"train_loss": -12.365262985229492, "global_step": 355369, "epoch": 2115} {"train_loss": -12.209344863891602, "global_step": 355370, "epoch": 2115} {"train_loss": -12.432646751403809, "global_step": 355371, "epoch": 2115} {"train_loss": -12.233179092407227, "global_step": 355372, "epoch": 2115} {"train_loss": -12.327170372009277, "global_step": 355373, "epoch": 2115} {"train_loss": -12.325342178344727, "global_step": 355374, "epoch": 2115} {"train_loss": -12.38132095336914, "global_step": 355375, "epoch": 2115} {"train_loss": -12.323116302490234, "global_step": 355376, "epoch": 2115} {"train_loss": -12.333316802978516, "global_step": 355377, "epoch": 2115} {"train_loss": -12.327098846435547, "global_step": 355378, "epoch": 2115} {"train_loss": -12.592232704162598, "global_step": 355379, "epoch": 2115} {"train_loss": -12.45436954498291, "global_step": 355380, "epoch": 2115} {"train_loss": -12.399404525756836, "global_step": 355381, "epoch": 2115} {"train_loss": -12.428442001342773, "global_step": 355382, "epoch": 2115} {"train_loss": -12.460389137268066, "global_step": 355383, "epoch": 2115} {"train_loss": -12.348888397216797, "global_step": 355384, "epoch": 2115} {"train_loss": -12.602548599243164, "global_step": 355385, "epoch": 2115} {"train_loss": -12.273210525512695, "global_step": 355386, "epoch": 2115} {"train_loss": -12.60819149017334, "global_step": 355387, "epoch": 2115} {"train_loss": -12.44873046875, "global_step": 355388, "epoch": 2115} {"train_loss": -12.556520462036133, "global_step": 355389, "epoch": 2115} {"train_loss": -12.288366317749023, "global_step": 355390, "epoch": 2115} {"train_loss": -12.779979705810547, "global_step": 355391, "epoch": 2115} {"train_loss": -12.190845489501953, "global_step": 355392, "epoch": 2115} {"train_loss": -12.284806251525879, "global_step": 355393, "epoch": 2115} {"train_loss": -12.41891098022461, "global_step": 355394, "epoch": 2115} {"train_loss": -12.248514175415039, "global_step": 355395, "epoch": 2115} {"train_loss": -12.580867767333984, "global_step": 355396, "epoch": 2115} {"train_loss": -12.379802703857422, "global_step": 355397, "epoch": 2115} {"train_loss": -12.379913330078125, "global_step": 355398, "epoch": 2115} {"train_loss": -12.586761474609375, "global_step": 355399, "epoch": 2115} {"train_loss": -12.43809700012207, "global_step": 355400, "epoch": 2115} {"train_loss": -12.5431489944458, "global_step": 355401, "epoch": 2115} {"train_loss": -12.464118003845215, "global_step": 355402, "epoch": 2115} {"train_loss": -12.123941421508789, "global_step": 355403, "epoch": 2115} {"train_loss": -12.416173934936523, "global_step": 355404, "epoch": 2115} {"train_loss": -12.569042205810547, "global_step": 355405, "epoch": 2115} {"train_loss": -12.378555297851562, "global_step": 355406, "epoch": 2115} {"train_loss": -12.432695388793945, "global_step": 355407, "epoch": 2115} {"train_loss": -12.745450973510742, "global_step": 355408, "epoch": 2115} {"train_loss": -12.438567161560059, "global_step": 355409, "epoch": 2115} {"train_loss": -12.30324935913086, "global_step": 355410, "epoch": 2115} {"train_loss": -12.59653377532959, "global_step": 355411, "epoch": 2115} {"train_loss": -12.429176330566406, "global_step": 355412, "epoch": 2115} {"train_loss": -12.328453063964844, "global_step": 355413, "epoch": 2115} {"train_loss": -12.380071640014648, "global_step": 355414, "epoch": 2115} {"train_loss": -12.381150245666504, "global_step": 355415, "epoch": 2115} {"train_loss": -12.068312644958496, "global_step": 355416, "epoch": 2115} {"train_loss": -12.310422897338867, "global_step": 355417, "epoch": 2115} {"train_loss": -12.052886009216309, "global_step": 355418, "epoch": 2115} {"train_loss": -12.544509887695312, "global_step": 355419, "epoch": 2115} {"train_loss": -11.729883193969727, "global_step": 355420, "epoch": 2115} {"train_loss": -11.45899772644043, "global_step": 355421, "epoch": 2115} {"train_loss": -11.10936450958252, "global_step": 355422, "epoch": 2115} {"train_loss": -12.041558265686035, "global_step": 355423, "epoch": 2115} {"train_loss": -11.926103591918945, "global_step": 355424, "epoch": 2115} {"train_loss": -12.29548168182373, "global_step": 355425, "epoch": 2115} {"train_loss": -12.024514198303223, "global_step": 355426, "epoch": 2115} {"train_loss": -11.739385604858398, "global_step": 355427, "epoch": 2115} {"train_loss": -12.248725891113281, "global_step": 355428, "epoch": 2115} {"train_loss": -11.472467422485352, "global_step": 355429, "epoch": 2115} {"train_loss": -11.790746688842773, "global_step": 355430, "epoch": 2115} {"train_loss": -11.746280670166016, "global_step": 355431, "epoch": 2115} {"train_loss": -10.475164413452148, "global_step": 355432, "epoch": 2115} {"train_loss": -11.98818588256836, "global_step": 355433, "epoch": 2115} {"train_loss": -11.22622299194336, "global_step": 355434, "epoch": 2115} {"train_loss": -11.034889221191406, "global_step": 355435, "epoch": 2115} {"train_loss": -11.931109428405762, "global_step": 355436, "epoch": 2115} {"train_loss": -10.614620208740234, "global_step": 355437, "epoch": 2115} {"train_loss": -11.738966941833496, "global_step": 355438, "epoch": 2115} {"train_loss": -11.630562782287598, "global_step": 355439, "epoch": 2115} {"train_loss": -11.431646347045898, "global_step": 355440, "epoch": 2115} {"train_loss": -11.352981567382812, "global_step": 355441, "epoch": 2115} {"train_loss": -10.808300018310547, "global_step": 355442, "epoch": 2115} {"train_loss": -11.581595420837402, "global_step": 355443, "epoch": 2115} {"train_loss": -11.925167083740234, "global_step": 355444, "epoch": 2115} {"train_loss": -11.03458023071289, "global_step": 355445, "epoch": 2115} {"train_loss": -10.892707824707031, "global_step": 355446, "epoch": 2115} {"train_loss": -11.859397888183594, "global_step": 355447, "epoch": 2115} {"train_loss": -11.655041694641113, "global_step": 355448, "epoch": 2115} {"train_loss": -10.908811569213867, "global_step": 355449, "epoch": 2115} {"train_loss": -11.904561996459961, "global_step": 355450, "epoch": 2115} {"train_loss": -10.729818344116211, "global_step": 355451, "epoch": 2115} {"train_loss": -11.712316513061523, "global_step": 355452, "epoch": 2115} {"train_loss": -11.744211196899414, "global_step": 355453, "epoch": 2115} {"train_loss": -11.637332916259766, "global_step": 355454, "epoch": 2115} {"train_loss": -12.460761070251465, "global_step": 355455, "epoch": 2115} {"train_loss": -11.31832504272461, "global_step": 355456, "epoch": 2115} {"train_loss": -12.220280647277832, "global_step": 355457, "epoch": 2115} {"train_loss": -11.87089729309082, "global_step": 355458, "epoch": 2115} {"train_loss": -12.326396942138672, "global_step": 355459, "epoch": 2115} {"train_loss": -12.064598083496094, "global_step": 355460, "epoch": 2115} {"train_loss": -11.714232444763184, "global_step": 355461, "epoch": 2115} {"train_loss": -12.087112426757812, "global_step": 355462, "epoch": 2115} {"train_loss": -12.040825843811035, "global_step": 355463, "epoch": 2115} {"train_loss": -12.087068557739258, "global_step": 355464, "epoch": 2115} {"train_loss": -12.409126281738281, "global_step": 355465, "epoch": 2115} {"train_loss": -12.101152420043945, "global_step": 355466, "epoch": 2115} {"train_loss": -11.962419509887695, "global_step": 355467, "epoch": 2115} {"train_loss": -11.689008712768555, "global_step": 355468, "epoch": 2115} {"train_loss": -12.229009628295898, "global_step": 355469, "epoch": 2115} {"train_loss": -12.042509078979492, "global_step": 355470, "epoch": 2115} {"train_loss": -12.071290969848633, "global_step": 355471, "epoch": 2115} {"train_loss": -12.445362091064453, "global_step": 355472, "epoch": 2115} {"train_loss": -12.145929336547852, "global_step": 355473, "epoch": 2115} {"train_loss": -12.519381523132324, "global_step": 355474, "epoch": 2115} {"train_loss": -12.140146255493164, "global_step": 355475, "epoch": 2115} {"train_loss": -12.276701927185059, "global_step": 355476, "epoch": 2115} {"train_loss": -12.304117202758789, "global_step": 355477, "epoch": 2115} {"train_loss": -12.38250732421875, "global_step": 355478, "epoch": 2115} {"train_loss": -12.381685256958008, "global_step": 355479, "epoch": 2115} {"train_loss": -12.378466606140137, "global_step": 355480, "epoch": 2115} {"train_loss": -12.223517417907715, "global_step": 355481, "epoch": 2115} {"train_loss": -12.387121200561523, "global_step": 355482, "epoch": 2115} {"train_loss": -12.410846710205078, "global_step": 355483, "epoch": 2115} {"train_loss": -12.24700927734375, "global_step": 355484, "epoch": 2115} {"train_loss": -12.563821792602539, "global_step": 355485, "epoch": 2115} {"train_loss": -12.591119766235352, "global_step": 355486, "epoch": 2115} {"train_loss": -11.92102183046795, "global_step": 355487, "epoch": 2115, "val_loss": 289449.65625, "train_action_mse_error": 1.40376877784729} {"train_loss": -12.077774047851562, "global_step": 355488, "epoch": 2116} {"train_loss": -12.41439437866211, "global_step": 355489, "epoch": 2116} {"train_loss": -11.969249725341797, "global_step": 355490, "epoch": 2116} {"train_loss": -12.008329391479492, "global_step": 355491, "epoch": 2116} {"train_loss": -12.216485023498535, "global_step": 355492, "epoch": 2116} {"train_loss": -12.019220352172852, "global_step": 355493, "epoch": 2116} {"train_loss": -12.359065055847168, "global_step": 355494, "epoch": 2116} {"train_loss": -12.008915901184082, "global_step": 355495, "epoch": 2116} {"train_loss": -12.415192604064941, "global_step": 355496, "epoch": 2116} {"train_loss": -12.042755126953125, "global_step": 355497, "epoch": 2116} {"train_loss": -12.350841522216797, "global_step": 355498, "epoch": 2116} {"train_loss": -12.07247543334961, "global_step": 355499, "epoch": 2116} {"train_loss": -12.475274085998535, "global_step": 355500, "epoch": 2116} {"train_loss": -11.859893798828125, "global_step": 355501, "epoch": 2116} {"train_loss": -12.578071594238281, "global_step": 355502, "epoch": 2116} {"train_loss": -12.33128833770752, "global_step": 355503, "epoch": 2116} {"train_loss": -11.728708267211914, "global_step": 355504, "epoch": 2116} {"train_loss": -12.179609298706055, "global_step": 355505, "epoch": 2116} {"train_loss": -11.81243896484375, "global_step": 355506, "epoch": 2116} {"train_loss": -11.917312622070312, "global_step": 355507, "epoch": 2116} {"train_loss": -12.207789421081543, "global_step": 355508, "epoch": 2116} {"train_loss": -12.342923164367676, "global_step": 355509, "epoch": 2116} {"train_loss": -11.919610977172852, "global_step": 355510, "epoch": 2116} {"train_loss": -11.792309761047363, "global_step": 355511, "epoch": 2116} {"train_loss": -12.235240936279297, "global_step": 355512, "epoch": 2116} {"train_loss": -11.43107795715332, "global_step": 355513, "epoch": 2116} {"train_loss": -11.557807922363281, "global_step": 355514, "epoch": 2116} {"train_loss": -10.788320541381836, "global_step": 355515, "epoch": 2116} {"train_loss": -9.03657341003418, "global_step": 355516, "epoch": 2116} {"train_loss": -10.431110382080078, "global_step": 355517, "epoch": 2116} {"train_loss": -10.999090194702148, "global_step": 355518, "epoch": 2116} {"train_loss": -10.810086250305176, "global_step": 355519, "epoch": 2116} {"train_loss": -10.47628402709961, "global_step": 355520, "epoch": 2116} {"train_loss": -10.967841148376465, "global_step": 355521, "epoch": 2116} {"train_loss": -10.504162788391113, "global_step": 355522, "epoch": 2116} {"train_loss": -11.54014778137207, "global_step": 355523, "epoch": 2116} {"train_loss": -10.101944923400879, "global_step": 355524, "epoch": 2116} {"train_loss": -11.79635238647461, "global_step": 355525, "epoch": 2116} {"train_loss": -11.053241729736328, "global_step": 355526, "epoch": 2116} {"train_loss": -10.895952224731445, "global_step": 355527, "epoch": 2116} {"train_loss": -11.453604698181152, "global_step": 355528, "epoch": 2116} {"train_loss": -11.086596488952637, "global_step": 355529, "epoch": 2116} {"train_loss": -10.78825569152832, "global_step": 355530, "epoch": 2116} {"train_loss": -11.091336250305176, "global_step": 355531, "epoch": 2116} {"train_loss": -10.680648803710938, "global_step": 355532, "epoch": 2116} {"train_loss": -11.084617614746094, "global_step": 355533, "epoch": 2116} {"train_loss": -11.33529281616211, "global_step": 355534, "epoch": 2116} {"train_loss": -10.865119934082031, "global_step": 355535, "epoch": 2116} {"train_loss": -10.832815170288086, "global_step": 355536, "epoch": 2116} {"train_loss": -10.676385879516602, "global_step": 355537, "epoch": 2116} {"train_loss": -9.702488899230957, "global_step": 355538, "epoch": 2116} {"train_loss": -10.10858154296875, "global_step": 355539, "epoch": 2116} {"train_loss": -10.449912071228027, "global_step": 355540, "epoch": 2116} {"train_loss": -9.698079109191895, "global_step": 355541, "epoch": 2116} {"train_loss": -10.756900787353516, "global_step": 355542, "epoch": 2116} {"train_loss": -10.7896146774292, "global_step": 355543, "epoch": 2116} {"train_loss": -11.130884170532227, "global_step": 355544, "epoch": 2116} {"train_loss": -11.534612655639648, "global_step": 355545, "epoch": 2116} {"train_loss": -11.445270538330078, "global_step": 355546, "epoch": 2116} {"train_loss": -11.032426834106445, "global_step": 355547, "epoch": 2116} {"train_loss": -11.852230072021484, "global_step": 355548, "epoch": 2116} {"train_loss": -11.038009643554688, "global_step": 355549, "epoch": 2116} {"train_loss": -11.57191276550293, "global_step": 355550, "epoch": 2116} {"train_loss": -11.756943702697754, "global_step": 355551, "epoch": 2116} {"train_loss": -11.766988754272461, "global_step": 355552, "epoch": 2116} {"train_loss": -11.455041885375977, "global_step": 355553, "epoch": 2116} {"train_loss": -11.890130996704102, "global_step": 355554, "epoch": 2116} {"train_loss": -11.607906341552734, "global_step": 355555, "epoch": 2116} {"train_loss": -11.52779769897461, "global_step": 355556, "epoch": 2116} {"train_loss": -11.718308448791504, "global_step": 355557, "epoch": 2116} {"train_loss": -11.556520462036133, "global_step": 355558, "epoch": 2116} {"train_loss": -11.676798820495605, "global_step": 355559, "epoch": 2116} {"train_loss": -12.11310863494873, "global_step": 355560, "epoch": 2116} {"train_loss": -11.4451904296875, "global_step": 355561, "epoch": 2116} {"train_loss": -11.700957298278809, "global_step": 355562, "epoch": 2116} {"train_loss": -11.677274703979492, "global_step": 355563, "epoch": 2116} {"train_loss": -11.420732498168945, "global_step": 355564, "epoch": 2116} {"train_loss": -12.200410842895508, "global_step": 355565, "epoch": 2116} {"train_loss": -11.76920223236084, "global_step": 355566, "epoch": 2116} {"train_loss": -11.21163558959961, "global_step": 355567, "epoch": 2116} {"train_loss": -12.021112442016602, "global_step": 355568, "epoch": 2116} {"train_loss": -11.551942825317383, "global_step": 355569, "epoch": 2116} {"train_loss": -11.822345733642578, "global_step": 355570, "epoch": 2116} {"train_loss": -12.15771770477295, "global_step": 355571, "epoch": 2116} {"train_loss": -11.50057601928711, "global_step": 355572, "epoch": 2116} {"train_loss": -12.082011222839355, "global_step": 355573, "epoch": 2116} {"train_loss": -12.147635459899902, "global_step": 355574, "epoch": 2116} {"train_loss": -11.540623664855957, "global_step": 355575, "epoch": 2116} {"train_loss": -12.139650344848633, "global_step": 355576, "epoch": 2116} {"train_loss": -11.81462287902832, "global_step": 355577, "epoch": 2116} {"train_loss": -11.93101692199707, "global_step": 355578, "epoch": 2116} {"train_loss": -12.039621353149414, "global_step": 355579, "epoch": 2116} {"train_loss": -11.441909790039062, "global_step": 355580, "epoch": 2116} {"train_loss": -12.104019165039062, "global_step": 355581, "epoch": 2116} {"train_loss": -11.915703773498535, "global_step": 355582, "epoch": 2116} {"train_loss": -11.856512069702148, "global_step": 355583, "epoch": 2116} {"train_loss": -12.422714233398438, "global_step": 355584, "epoch": 2116} {"train_loss": -11.86400032043457, "global_step": 355585, "epoch": 2116} {"train_loss": -12.25088119506836, "global_step": 355586, "epoch": 2116} {"train_loss": -12.167381286621094, "global_step": 355587, "epoch": 2116} {"train_loss": -12.062494277954102, "global_step": 355588, "epoch": 2116} {"train_loss": -12.33677864074707, "global_step": 355589, "epoch": 2116} {"train_loss": -12.243778228759766, "global_step": 355590, "epoch": 2116} {"train_loss": -12.178433418273926, "global_step": 355591, "epoch": 2116} {"train_loss": -12.338171005249023, "global_step": 355592, "epoch": 2116} {"train_loss": -12.169321060180664, "global_step": 355593, "epoch": 2116} {"train_loss": -12.135948181152344, "global_step": 355594, "epoch": 2116} {"train_loss": -12.06169319152832, "global_step": 355595, "epoch": 2116} {"train_loss": -12.290929794311523, "global_step": 355596, "epoch": 2116} {"train_loss": -12.023508071899414, "global_step": 355597, "epoch": 2116} {"train_loss": -12.437824249267578, "global_step": 355598, "epoch": 2116} {"train_loss": -11.994126319885254, "global_step": 355599, "epoch": 2116} {"train_loss": -12.263368606567383, "global_step": 355600, "epoch": 2116} {"train_loss": -12.059981346130371, "global_step": 355601, "epoch": 2116} {"train_loss": -12.208969116210938, "global_step": 355602, "epoch": 2116} {"train_loss": -12.370502471923828, "global_step": 355603, "epoch": 2116} {"train_loss": -12.20398235321045, "global_step": 355604, "epoch": 2116} {"train_loss": -12.402562141418457, "global_step": 355605, "epoch": 2116} {"train_loss": -12.159677505493164, "global_step": 355606, "epoch": 2116} {"train_loss": -12.302108764648438, "global_step": 355607, "epoch": 2116} {"train_loss": -12.189850807189941, "global_step": 355608, "epoch": 2116} {"train_loss": -12.403348922729492, "global_step": 355609, "epoch": 2116} {"train_loss": -12.11621379852295, "global_step": 355610, "epoch": 2116} {"train_loss": -12.397957801818848, "global_step": 355611, "epoch": 2116} {"train_loss": -12.079129219055176, "global_step": 355612, "epoch": 2116} {"train_loss": -12.116972923278809, "global_step": 355613, "epoch": 2116} {"train_loss": -12.218236923217773, "global_step": 355614, "epoch": 2116} {"train_loss": -12.29288101196289, "global_step": 355615, "epoch": 2116} {"train_loss": -12.442453384399414, "global_step": 355616, "epoch": 2116} {"train_loss": -12.564586639404297, "global_step": 355617, "epoch": 2116} {"train_loss": -12.471904754638672, "global_step": 355618, "epoch": 2116} {"train_loss": -12.448676109313965, "global_step": 355619, "epoch": 2116} {"train_loss": -12.481199264526367, "global_step": 355620, "epoch": 2116} {"train_loss": -12.384622573852539, "global_step": 355621, "epoch": 2116} {"train_loss": -12.679145812988281, "global_step": 355622, "epoch": 2116} {"train_loss": -12.502864837646484, "global_step": 355623, "epoch": 2116} {"train_loss": -12.606287002563477, "global_step": 355624, "epoch": 2116} {"train_loss": -12.516139030456543, "global_step": 355625, "epoch": 2116} {"train_loss": -12.524352073669434, "global_step": 355626, "epoch": 2116} {"train_loss": -12.499345779418945, "global_step": 355627, "epoch": 2116} {"train_loss": -12.648275375366211, "global_step": 355628, "epoch": 2116} {"train_loss": -12.51794147491455, "global_step": 355629, "epoch": 2116} {"train_loss": -12.579584121704102, "global_step": 355630, "epoch": 2116} {"train_loss": -12.484556198120117, "global_step": 355631, "epoch": 2116} {"train_loss": -12.57810115814209, "global_step": 355632, "epoch": 2116} {"train_loss": -12.531097412109375, "global_step": 355633, "epoch": 2116} {"train_loss": -12.580814361572266, "global_step": 355634, "epoch": 2116} {"train_loss": -12.560450553894043, "global_step": 355635, "epoch": 2116} {"train_loss": -12.372014045715332, "global_step": 355636, "epoch": 2116} {"train_loss": -12.612211227416992, "global_step": 355637, "epoch": 2116} {"train_loss": -12.60354995727539, "global_step": 355638, "epoch": 2116} {"train_loss": -12.713991165161133, "global_step": 355639, "epoch": 2116} {"train_loss": -12.746302604675293, "global_step": 355640, "epoch": 2116} {"train_loss": -12.737089157104492, "global_step": 355641, "epoch": 2116} {"train_loss": -12.628665924072266, "global_step": 355642, "epoch": 2116} {"train_loss": -12.725646018981934, "global_step": 355643, "epoch": 2116} {"train_loss": -12.781227111816406, "global_step": 355644, "epoch": 2116} {"train_loss": -12.530275344848633, "global_step": 355645, "epoch": 2116} {"train_loss": -12.653188705444336, "global_step": 355646, "epoch": 2116} {"train_loss": -12.495826721191406, "global_step": 355647, "epoch": 2116} {"train_loss": -12.71874713897705, "global_step": 355648, "epoch": 2116} {"train_loss": -12.752202987670898, "global_step": 355649, "epoch": 2116} {"train_loss": -12.683165550231934, "global_step": 355650, "epoch": 2116} {"train_loss": -12.293885231018066, "global_step": 355651, "epoch": 2116} {"train_loss": -12.402525901794434, "global_step": 355652, "epoch": 2116} {"train_loss": -12.784347534179688, "global_step": 355653, "epoch": 2116} {"train_loss": -11.418025970458984, "global_step": 355654, "epoch": 2116} {"train_loss": -11.885979998679389, "global_step": 355655, "epoch": 2116, "val_loss": 289889.09375} {"train_loss": -10.90729808807373, "global_step": 355656, "epoch": 2117} {"train_loss": -12.336174964904785, "global_step": 355657, "epoch": 2117} {"train_loss": -12.118020057678223, "global_step": 355658, "epoch": 2117} {"train_loss": -11.025552749633789, "global_step": 355659, "epoch": 2117} {"train_loss": -11.428961753845215, "global_step": 355660, "epoch": 2117} {"train_loss": -12.218255996704102, "global_step": 355661, "epoch": 2117} {"train_loss": -11.113454818725586, "global_step": 355662, "epoch": 2117} {"train_loss": -10.8795166015625, "global_step": 355663, "epoch": 2117} {"train_loss": -11.992064476013184, "global_step": 355664, "epoch": 2117} {"train_loss": -11.737396240234375, "global_step": 355665, "epoch": 2117} {"train_loss": -11.299708366394043, "global_step": 355666, "epoch": 2117} {"train_loss": -10.8729248046875, "global_step": 355667, "epoch": 2117} {"train_loss": -10.699283599853516, "global_step": 355668, "epoch": 2117} {"train_loss": -11.512039184570312, "global_step": 355669, "epoch": 2117} {"train_loss": -10.926204681396484, "global_step": 355670, "epoch": 2117} {"train_loss": -11.283134460449219, "global_step": 355671, "epoch": 2117} {"train_loss": -11.82571792602539, "global_step": 355672, "epoch": 2117} {"train_loss": -11.710851669311523, "global_step": 355673, "epoch": 2117} {"train_loss": -11.427221298217773, "global_step": 355674, "epoch": 2117} {"train_loss": -11.69633960723877, "global_step": 355675, "epoch": 2117} {"train_loss": -10.643669128417969, "global_step": 355676, "epoch": 2117} {"train_loss": -9.495138168334961, "global_step": 355677, "epoch": 2117} {"train_loss": -11.1063232421875, "global_step": 355678, "epoch": 2117} {"train_loss": -8.856304168701172, "global_step": 355679, "epoch": 2117} {"train_loss": -8.784049987792969, "global_step": 355680, "epoch": 2117} {"train_loss": -9.00224494934082, "global_step": 355681, "epoch": 2117} {"train_loss": -11.249441146850586, "global_step": 355682, "epoch": 2117} {"train_loss": -8.34200382232666, "global_step": 355683, "epoch": 2117} {"train_loss": -11.231914520263672, "global_step": 355684, "epoch": 2117} {"train_loss": -10.08318042755127, "global_step": 355685, "epoch": 2117} {"train_loss": -10.617923736572266, "global_step": 355686, "epoch": 2117} {"train_loss": -10.630325317382812, "global_step": 355687, "epoch": 2117} {"train_loss": -9.170207977294922, "global_step": 355688, "epoch": 2117} {"train_loss": -11.77412223815918, "global_step": 355689, "epoch": 2117} {"train_loss": -10.800040245056152, "global_step": 355690, "epoch": 2117} {"train_loss": -11.550243377685547, "global_step": 355691, "epoch": 2117} {"train_loss": -11.089388847351074, "global_step": 355692, "epoch": 2117} {"train_loss": -11.634775161743164, "global_step": 355693, "epoch": 2117} {"train_loss": -11.469017028808594, "global_step": 355694, "epoch": 2117} {"train_loss": -11.636276245117188, "global_step": 355695, "epoch": 2117} {"train_loss": -11.361055374145508, "global_step": 355696, "epoch": 2117} {"train_loss": -11.302667617797852, "global_step": 355697, "epoch": 2117} {"train_loss": -12.146245956420898, "global_step": 355698, "epoch": 2117} {"train_loss": -11.341531753540039, "global_step": 355699, "epoch": 2117} {"train_loss": -12.06946849822998, "global_step": 355700, "epoch": 2117} {"train_loss": -11.605245590209961, "global_step": 355701, "epoch": 2117} {"train_loss": -11.79185676574707, "global_step": 355702, "epoch": 2117} {"train_loss": -11.834453582763672, "global_step": 355703, "epoch": 2117} {"train_loss": -11.843324661254883, "global_step": 355704, "epoch": 2117} {"train_loss": -11.833959579467773, "global_step": 355705, "epoch": 2117} {"train_loss": -12.217416763305664, "global_step": 355706, "epoch": 2117} {"train_loss": -11.948230743408203, "global_step": 355707, "epoch": 2117} {"train_loss": -11.74549674987793, "global_step": 355708, "epoch": 2117} {"train_loss": -12.052325248718262, "global_step": 355709, "epoch": 2117} {"train_loss": -11.75727653503418, "global_step": 355710, "epoch": 2117} {"train_loss": -11.849788665771484, "global_step": 355711, "epoch": 2117} {"train_loss": -12.010303497314453, "global_step": 355712, "epoch": 2117} {"train_loss": -11.745922088623047, "global_step": 355713, "epoch": 2117} {"train_loss": -12.215888977050781, "global_step": 355714, "epoch": 2117} {"train_loss": -11.921316146850586, "global_step": 355715, "epoch": 2117} {"train_loss": -12.276098251342773, "global_step": 355716, "epoch": 2117} {"train_loss": -12.05156135559082, "global_step": 355717, "epoch": 2117} {"train_loss": -12.04481315612793, "global_step": 355718, "epoch": 2117} {"train_loss": -12.286844253540039, "global_step": 355719, "epoch": 2117} {"train_loss": -11.975224494934082, "global_step": 355720, "epoch": 2117} {"train_loss": -12.135822296142578, "global_step": 355721, "epoch": 2117} {"train_loss": -12.023456573486328, "global_step": 355722, "epoch": 2117} {"train_loss": -12.122507095336914, "global_step": 355723, "epoch": 2117} {"train_loss": -12.209440231323242, "global_step": 355724, "epoch": 2117} {"train_loss": -12.092601776123047, "global_step": 355725, "epoch": 2117} {"train_loss": -12.304275512695312, "global_step": 355726, "epoch": 2117} {"train_loss": -12.385356903076172, "global_step": 355727, "epoch": 2117} {"train_loss": -12.288352966308594, "global_step": 355728, "epoch": 2117} {"train_loss": -12.531991958618164, "global_step": 355729, "epoch": 2117} {"train_loss": -12.492487907409668, "global_step": 355730, "epoch": 2117} {"train_loss": -12.376123428344727, "global_step": 355731, "epoch": 2117} {"train_loss": -12.224355697631836, "global_step": 355732, "epoch": 2117} {"train_loss": -12.412616729736328, "global_step": 355733, "epoch": 2117} {"train_loss": -12.080619812011719, "global_step": 355734, "epoch": 2117} {"train_loss": -12.360686302185059, "global_step": 355735, "epoch": 2117} {"train_loss": -12.323437690734863, "global_step": 355736, "epoch": 2117} {"train_loss": -12.088848114013672, "global_step": 355737, "epoch": 2117} {"train_loss": -12.49490737915039, "global_step": 355738, "epoch": 2117} {"train_loss": -11.97680950164795, "global_step": 355739, "epoch": 2117} {"train_loss": -12.26845932006836, "global_step": 355740, "epoch": 2117} {"train_loss": -12.221298217773438, "global_step": 355741, "epoch": 2117} {"train_loss": -12.476158142089844, "global_step": 355742, "epoch": 2117} {"train_loss": -12.172832489013672, "global_step": 355743, "epoch": 2117} {"train_loss": -12.137765884399414, "global_step": 355744, "epoch": 2117} {"train_loss": -12.44858455657959, "global_step": 355745, "epoch": 2117} {"train_loss": -12.310441017150879, "global_step": 355746, "epoch": 2117} {"train_loss": -12.372611045837402, "global_step": 355747, "epoch": 2117} {"train_loss": -12.253774642944336, "global_step": 355748, "epoch": 2117} {"train_loss": -12.29616928100586, "global_step": 355749, "epoch": 2117} {"train_loss": -12.265373229980469, "global_step": 355750, "epoch": 2117} {"train_loss": -12.263428688049316, "global_step": 355751, "epoch": 2117} {"train_loss": -12.277593612670898, "global_step": 355752, "epoch": 2117} {"train_loss": -12.463690757751465, "global_step": 355753, "epoch": 2117} {"train_loss": -12.389151573181152, "global_step": 355754, "epoch": 2117} {"train_loss": -12.307918548583984, "global_step": 355755, "epoch": 2117} {"train_loss": -12.53416919708252, "global_step": 355756, "epoch": 2117} {"train_loss": -12.439815521240234, "global_step": 355757, "epoch": 2117} {"train_loss": -12.66912841796875, "global_step": 355758, "epoch": 2117} {"train_loss": -12.462529182434082, "global_step": 355759, "epoch": 2117} {"train_loss": -12.365938186645508, "global_step": 355760, "epoch": 2117} {"train_loss": -12.48378849029541, "global_step": 355761, "epoch": 2117} {"train_loss": -12.551756858825684, "global_step": 355762, "epoch": 2117} {"train_loss": -12.34837532043457, "global_step": 355763, "epoch": 2117} {"train_loss": -12.541051864624023, "global_step": 355764, "epoch": 2117} {"train_loss": -12.525574684143066, "global_step": 355765, "epoch": 2117} {"train_loss": -12.336835861206055, "global_step": 355766, "epoch": 2117} {"train_loss": -12.577325820922852, "global_step": 355767, "epoch": 2117} {"train_loss": -11.88276481628418, "global_step": 355768, "epoch": 2117} {"train_loss": -12.375621795654297, "global_step": 355769, "epoch": 2117} {"train_loss": -12.225505828857422, "global_step": 355770, "epoch": 2117} {"train_loss": -11.849047660827637, "global_step": 355771, "epoch": 2117} {"train_loss": -12.402091979980469, "global_step": 355772, "epoch": 2117} {"train_loss": -11.932350158691406, "global_step": 355773, "epoch": 2117} {"train_loss": -11.66291332244873, "global_step": 355774, "epoch": 2117} {"train_loss": -11.98213005065918, "global_step": 355775, "epoch": 2117} {"train_loss": -11.351350784301758, "global_step": 355776, "epoch": 2117} {"train_loss": -11.668543815612793, "global_step": 355777, "epoch": 2117} {"train_loss": -10.299922943115234, "global_step": 355778, "epoch": 2117} {"train_loss": -12.222814559936523, "global_step": 355779, "epoch": 2117} {"train_loss": -10.686019897460938, "global_step": 355780, "epoch": 2117} {"train_loss": -11.842935562133789, "global_step": 355781, "epoch": 2117} {"train_loss": -12.16458511352539, "global_step": 355782, "epoch": 2117} {"train_loss": -11.261984825134277, "global_step": 355783, "epoch": 2117} {"train_loss": -11.911611557006836, "global_step": 355784, "epoch": 2117} {"train_loss": -11.346513748168945, "global_step": 355785, "epoch": 2117} {"train_loss": -11.706327438354492, "global_step": 355786, "epoch": 2117} {"train_loss": -11.483148574829102, "global_step": 355787, "epoch": 2117} {"train_loss": -12.050331115722656, "global_step": 355788, "epoch": 2117} {"train_loss": -11.287457466125488, "global_step": 355789, "epoch": 2117} {"train_loss": -12.214683532714844, "global_step": 355790, "epoch": 2117} {"train_loss": -11.252351760864258, "global_step": 355791, "epoch": 2117} {"train_loss": -11.98086166381836, "global_step": 355792, "epoch": 2117} {"train_loss": -11.882314682006836, "global_step": 355793, "epoch": 2117} {"train_loss": -12.24290657043457, "global_step": 355794, "epoch": 2117} {"train_loss": -11.569238662719727, "global_step": 355795, "epoch": 2117} {"train_loss": -11.796808242797852, "global_step": 355796, "epoch": 2117} {"train_loss": -11.770874977111816, "global_step": 355797, "epoch": 2117} {"train_loss": -12.088340759277344, "global_step": 355798, "epoch": 2117} {"train_loss": -11.918949127197266, "global_step": 355799, "epoch": 2117} {"train_loss": -12.092161178588867, "global_step": 355800, "epoch": 2117} {"train_loss": -11.906200408935547, "global_step": 355801, "epoch": 2117} {"train_loss": -11.836362838745117, "global_step": 355802, "epoch": 2117} {"train_loss": -12.102240562438965, "global_step": 355803, "epoch": 2117} {"train_loss": -12.063255310058594, "global_step": 355804, "epoch": 2117} {"train_loss": -11.900434494018555, "global_step": 355805, "epoch": 2117} {"train_loss": -11.76650619506836, "global_step": 355806, "epoch": 2117} {"train_loss": -11.779082298278809, "global_step": 355807, "epoch": 2117} {"train_loss": -12.415724754333496, "global_step": 355808, "epoch": 2117} {"train_loss": -11.411514282226562, "global_step": 355809, "epoch": 2117} {"train_loss": -11.845952987670898, "global_step": 355810, "epoch": 2117} {"train_loss": -11.65971851348877, "global_step": 355811, "epoch": 2117} {"train_loss": -11.473591804504395, "global_step": 355812, "epoch": 2117} {"train_loss": -11.938983917236328, "global_step": 355813, "epoch": 2117} {"train_loss": -11.203737258911133, "global_step": 355814, "epoch": 2117} {"train_loss": -11.87882137298584, "global_step": 355815, "epoch": 2117} {"train_loss": -11.828646659851074, "global_step": 355816, "epoch": 2117} {"train_loss": -11.443777084350586, "global_step": 355817, "epoch": 2117} {"train_loss": -11.467781066894531, "global_step": 355818, "epoch": 2117} {"train_loss": -11.541399955749512, "global_step": 355819, "epoch": 2117} {"train_loss": -11.517550468444824, "global_step": 355820, "epoch": 2117} {"train_loss": -11.896839141845703, "global_step": 355821, "epoch": 2117} {"train_loss": -11.645040512084961, "global_step": 355822, "epoch": 2117} {"train_loss": -11.746562781788054, "global_step": 355823, "epoch": 2117, "val_loss": 288342.71875} {"train_loss": -11.718636512756348, "global_step": 355824, "epoch": 2118} {"train_loss": -10.857088088989258, "global_step": 355825, "epoch": 2118} {"train_loss": -11.705694198608398, "global_step": 355826, "epoch": 2118} {"train_loss": -11.583672523498535, "global_step": 355827, "epoch": 2118} {"train_loss": -11.708484649658203, "global_step": 355828, "epoch": 2118} {"train_loss": -11.771966934204102, "global_step": 355829, "epoch": 2118} {"train_loss": -11.36621379852295, "global_step": 355830, "epoch": 2118} {"train_loss": -11.911688804626465, "global_step": 355831, "epoch": 2118} {"train_loss": -10.991188049316406, "global_step": 355832, "epoch": 2118} {"train_loss": -11.844253540039062, "global_step": 355833, "epoch": 2118} {"train_loss": -10.780838966369629, "global_step": 355834, "epoch": 2118} {"train_loss": -11.322736740112305, "global_step": 355835, "epoch": 2118} {"train_loss": -11.802045822143555, "global_step": 355836, "epoch": 2118} {"train_loss": -11.034074783325195, "global_step": 355837, "epoch": 2118} {"train_loss": -11.834177017211914, "global_step": 355838, "epoch": 2118} {"train_loss": -11.415159225463867, "global_step": 355839, "epoch": 2118} {"train_loss": -11.394550323486328, "global_step": 355840, "epoch": 2118} {"train_loss": -12.055301666259766, "global_step": 355841, "epoch": 2118} {"train_loss": -10.731568336486816, "global_step": 355842, "epoch": 2118} {"train_loss": -12.132532119750977, "global_step": 355843, "epoch": 2118} {"train_loss": -11.608968734741211, "global_step": 355844, "epoch": 2118} {"train_loss": -11.741358757019043, "global_step": 355845, "epoch": 2118} {"train_loss": -11.748554229736328, "global_step": 355846, "epoch": 2118} {"train_loss": -11.484455108642578, "global_step": 355847, "epoch": 2118} {"train_loss": -12.158805847167969, "global_step": 355848, "epoch": 2118} {"train_loss": -11.832311630249023, "global_step": 355849, "epoch": 2118} {"train_loss": -12.1862154006958, "global_step": 355850, "epoch": 2118} {"train_loss": -11.88730239868164, "global_step": 355851, "epoch": 2118} {"train_loss": -12.173955917358398, "global_step": 355852, "epoch": 2118} {"train_loss": -11.857290267944336, "global_step": 355853, "epoch": 2118} {"train_loss": -12.137531280517578, "global_step": 355854, "epoch": 2118} {"train_loss": -12.18197250366211, "global_step": 355855, "epoch": 2118} {"train_loss": -12.170339584350586, "global_step": 355856, "epoch": 2118} {"train_loss": -12.209836959838867, "global_step": 355857, "epoch": 2118} {"train_loss": -12.20370101928711, "global_step": 355858, "epoch": 2118} {"train_loss": -12.282154083251953, "global_step": 355859, "epoch": 2118} {"train_loss": -12.263286590576172, "global_step": 355860, "epoch": 2118} {"train_loss": -12.208999633789062, "global_step": 355861, "epoch": 2118} {"train_loss": -12.397167205810547, "global_step": 355862, "epoch": 2118} {"train_loss": -11.829188346862793, "global_step": 355863, "epoch": 2118} {"train_loss": -12.360755920410156, "global_step": 355864, "epoch": 2118} {"train_loss": -12.117278099060059, "global_step": 355865, "epoch": 2118} {"train_loss": -12.532205581665039, "global_step": 355866, "epoch": 2118} {"train_loss": -12.410400390625, "global_step": 355867, "epoch": 2118} {"train_loss": -12.332281112670898, "global_step": 355868, "epoch": 2118} {"train_loss": -12.376142501831055, "global_step": 355869, "epoch": 2118} {"train_loss": -12.479904174804688, "global_step": 355870, "epoch": 2118} {"train_loss": -12.140572547912598, "global_step": 355871, "epoch": 2118} {"train_loss": -12.334628105163574, "global_step": 355872, "epoch": 2118} {"train_loss": -12.382072448730469, "global_step": 355873, "epoch": 2118} {"train_loss": -12.261377334594727, "global_step": 355874, "epoch": 2118} {"train_loss": -12.205471992492676, "global_step": 355875, "epoch": 2118} {"train_loss": -12.288475036621094, "global_step": 355876, "epoch": 2118} {"train_loss": -12.365163803100586, "global_step": 355877, "epoch": 2118} {"train_loss": -12.148641586303711, "global_step": 355878, "epoch": 2118} {"train_loss": -12.254761695861816, "global_step": 355879, "epoch": 2118} {"train_loss": -12.288942337036133, "global_step": 355880, "epoch": 2118} {"train_loss": -12.266770362854004, "global_step": 355881, "epoch": 2118} {"train_loss": -12.161614418029785, "global_step": 355882, "epoch": 2118} {"train_loss": -12.217795372009277, "global_step": 355883, "epoch": 2118} {"train_loss": -12.267882347106934, "global_step": 355884, "epoch": 2118} {"train_loss": -12.281122207641602, "global_step": 355885, "epoch": 2118} {"train_loss": -12.39360237121582, "global_step": 355886, "epoch": 2118} {"train_loss": -12.706205368041992, "global_step": 355887, "epoch": 2118} {"train_loss": -12.478407859802246, "global_step": 355888, "epoch": 2118} {"train_loss": -12.550468444824219, "global_step": 355889, "epoch": 2118} {"train_loss": -12.446211814880371, "global_step": 355890, "epoch": 2118} {"train_loss": -12.508536338806152, "global_step": 355891, "epoch": 2118} {"train_loss": -12.529031753540039, "global_step": 355892, "epoch": 2118} {"train_loss": -12.381534576416016, "global_step": 355893, "epoch": 2118} {"train_loss": -12.49744987487793, "global_step": 355894, "epoch": 2118} {"train_loss": -12.544218063354492, "global_step": 355895, "epoch": 2118} {"train_loss": -12.540975570678711, "global_step": 355896, "epoch": 2118} {"train_loss": -12.375061988830566, "global_step": 355897, "epoch": 2118} {"train_loss": -12.053323745727539, "global_step": 355898, "epoch": 2118} {"train_loss": -12.725123405456543, "global_step": 355899, "epoch": 2118} {"train_loss": -12.295684814453125, "global_step": 355900, "epoch": 2118} {"train_loss": -12.171918869018555, "global_step": 355901, "epoch": 2118} {"train_loss": -12.527963638305664, "global_step": 355902, "epoch": 2118} {"train_loss": -12.539588928222656, "global_step": 355903, "epoch": 2118} {"train_loss": -12.212299346923828, "global_step": 355904, "epoch": 2118} {"train_loss": -11.854982376098633, "global_step": 355905, "epoch": 2118} {"train_loss": -12.418570518493652, "global_step": 355906, "epoch": 2118} {"train_loss": -12.443915367126465, "global_step": 355907, "epoch": 2118} {"train_loss": -11.941810607910156, "global_step": 355908, "epoch": 2118} {"train_loss": -12.528435707092285, "global_step": 355909, "epoch": 2118} {"train_loss": -12.184042930603027, "global_step": 355910, "epoch": 2118} {"train_loss": -11.75018310546875, "global_step": 355911, "epoch": 2118} {"train_loss": -12.610881805419922, "global_step": 355912, "epoch": 2118} {"train_loss": -11.705415725708008, "global_step": 355913, "epoch": 2118} {"train_loss": -11.882858276367188, "global_step": 355914, "epoch": 2118} {"train_loss": -12.406267166137695, "global_step": 355915, "epoch": 2118} {"train_loss": -12.450246810913086, "global_step": 355916, "epoch": 2118} {"train_loss": -11.693952560424805, "global_step": 355917, "epoch": 2118} {"train_loss": -10.909478187561035, "global_step": 355918, "epoch": 2118} {"train_loss": -12.213314056396484, "global_step": 355919, "epoch": 2118} {"train_loss": -11.931808471679688, "global_step": 355920, "epoch": 2118} {"train_loss": -10.69022274017334, "global_step": 355921, "epoch": 2118} {"train_loss": -11.56447982788086, "global_step": 355922, "epoch": 2118} {"train_loss": -12.509416580200195, "global_step": 355923, "epoch": 2118} {"train_loss": -11.407036781311035, "global_step": 355924, "epoch": 2118} {"train_loss": -11.51744270324707, "global_step": 355925, "epoch": 2118} {"train_loss": -12.377111434936523, "global_step": 355926, "epoch": 2118} {"train_loss": -11.952025413513184, "global_step": 355927, "epoch": 2118} {"train_loss": -12.419404983520508, "global_step": 355928, "epoch": 2118} {"train_loss": -12.189067840576172, "global_step": 355929, "epoch": 2118} {"train_loss": -12.316749572753906, "global_step": 355930, "epoch": 2118} {"train_loss": -12.276765823364258, "global_step": 355931, "epoch": 2118} {"train_loss": -12.239785194396973, "global_step": 355932, "epoch": 2118} {"train_loss": -12.583237648010254, "global_step": 355933, "epoch": 2118} {"train_loss": -11.629592895507812, "global_step": 355934, "epoch": 2118} {"train_loss": -12.49465274810791, "global_step": 355935, "epoch": 2118} {"train_loss": -12.020258903503418, "global_step": 355936, "epoch": 2118} {"train_loss": -12.294570922851562, "global_step": 355937, "epoch": 2118} {"train_loss": -12.318656921386719, "global_step": 355938, "epoch": 2118} {"train_loss": -12.450874328613281, "global_step": 355939, "epoch": 2118} {"train_loss": -11.821422576904297, "global_step": 355940, "epoch": 2118} {"train_loss": -12.168338775634766, "global_step": 355941, "epoch": 2118} {"train_loss": -11.608741760253906, "global_step": 355942, "epoch": 2118} {"train_loss": -11.196134567260742, "global_step": 355943, "epoch": 2118} {"train_loss": -12.2614164352417, "global_step": 355944, "epoch": 2118} {"train_loss": -11.094549179077148, "global_step": 355945, "epoch": 2118} {"train_loss": -11.172072410583496, "global_step": 355946, "epoch": 2118} {"train_loss": -11.744890213012695, "global_step": 355947, "epoch": 2118} {"train_loss": -11.599584579467773, "global_step": 355948, "epoch": 2118} {"train_loss": -11.772329330444336, "global_step": 355949, "epoch": 2118} {"train_loss": -10.714252471923828, "global_step": 355950, "epoch": 2118} {"train_loss": -12.083963394165039, "global_step": 355951, "epoch": 2118} {"train_loss": -10.10129165649414, "global_step": 355952, "epoch": 2118} {"train_loss": -11.559576034545898, "global_step": 355953, "epoch": 2118} {"train_loss": -9.596479415893555, "global_step": 355954, "epoch": 2118} {"train_loss": -10.07916259765625, "global_step": 355955, "epoch": 2118} {"train_loss": -11.385820388793945, "global_step": 355956, "epoch": 2118} {"train_loss": -7.46113920211792, "global_step": 355957, "epoch": 2118} {"train_loss": -9.127836227416992, "global_step": 355958, "epoch": 2118} {"train_loss": -9.792831420898438, "global_step": 355959, "epoch": 2118} {"train_loss": -9.444066047668457, "global_step": 355960, "epoch": 2118} {"train_loss": -10.665675163269043, "global_step": 355961, "epoch": 2118} {"train_loss": -8.202279090881348, "global_step": 355962, "epoch": 2118} {"train_loss": -8.928940773010254, "global_step": 355963, "epoch": 2118} {"train_loss": -9.424495697021484, "global_step": 355964, "epoch": 2118} {"train_loss": -9.956384658813477, "global_step": 355965, "epoch": 2118} {"train_loss": -10.542263984680176, "global_step": 355966, "epoch": 2118} {"train_loss": -9.36208724975586, "global_step": 355967, "epoch": 2118} {"train_loss": -11.1376314163208, "global_step": 355968, "epoch": 2118} {"train_loss": -10.459840774536133, "global_step": 355969, "epoch": 2118} {"train_loss": -11.040979385375977, "global_step": 355970, "epoch": 2118} {"train_loss": -9.710834503173828, "global_step": 355971, "epoch": 2118} {"train_loss": -11.035738945007324, "global_step": 355972, "epoch": 2118} {"train_loss": -10.605025291442871, "global_step": 355973, "epoch": 2118} {"train_loss": -11.730199813842773, "global_step": 355974, "epoch": 2118} {"train_loss": -10.707858085632324, "global_step": 355975, "epoch": 2118} {"train_loss": -11.495827674865723, "global_step": 355976, "epoch": 2118} {"train_loss": -10.501220703125, "global_step": 355977, "epoch": 2118} {"train_loss": -11.49515151977539, "global_step": 355978, "epoch": 2118} {"train_loss": -10.809270858764648, "global_step": 355979, "epoch": 2118} {"train_loss": -11.320066452026367, "global_step": 355980, "epoch": 2118} {"train_loss": -10.561748504638672, "global_step": 355981, "epoch": 2118} {"train_loss": -10.842976570129395, "global_step": 355982, "epoch": 2118} {"train_loss": -11.133443832397461, "global_step": 355983, "epoch": 2118} {"train_loss": -11.38741683959961, "global_step": 355984, "epoch": 2118} {"train_loss": -11.041616439819336, "global_step": 355985, "epoch": 2118} {"train_loss": -11.455245018005371, "global_step": 355986, "epoch": 2118} {"train_loss": -11.118188858032227, "global_step": 355987, "epoch": 2118} {"train_loss": -11.398834228515625, "global_step": 355988, "epoch": 2118} {"train_loss": -11.7593355178833, "global_step": 355989, "epoch": 2118} {"train_loss": -11.013142585754395, "global_step": 355990, "epoch": 2118} {"train_loss": -11.668470606917428, "global_step": 355991, "epoch": 2118, "val_loss": 286069.3125} {"train_loss": -11.384284019470215, "global_step": 355992, "epoch": 2119} {"train_loss": -11.963396072387695, "global_step": 355993, "epoch": 2119} {"train_loss": -11.717766761779785, "global_step": 355994, "epoch": 2119} {"train_loss": -11.801225662231445, "global_step": 355995, "epoch": 2119} {"train_loss": -11.820075988769531, "global_step": 355996, "epoch": 2119} {"train_loss": -11.629473686218262, "global_step": 355997, "epoch": 2119} {"train_loss": -11.800355911254883, "global_step": 355998, "epoch": 2119} {"train_loss": -11.749584197998047, "global_step": 355999, "epoch": 2119} {"train_loss": -11.852849960327148, "global_step": 356000, "epoch": 2119} {"train_loss": -11.851811408996582, "global_step": 356001, "epoch": 2119} {"train_loss": -12.245172500610352, "global_step": 356002, "epoch": 2119} {"train_loss": -11.999038696289062, "global_step": 356003, "epoch": 2119} {"train_loss": -11.914264678955078, "global_step": 356004, "epoch": 2119} {"train_loss": -12.067301750183105, "global_step": 356005, "epoch": 2119} {"train_loss": -11.876925468444824, "global_step": 356006, "epoch": 2119} {"train_loss": -11.901865005493164, "global_step": 356007, "epoch": 2119} {"train_loss": -12.00680160522461, "global_step": 356008, "epoch": 2119} {"train_loss": -11.572495460510254, "global_step": 356009, "epoch": 2119} {"train_loss": -11.988580703735352, "global_step": 356010, "epoch": 2119} {"train_loss": -12.081293106079102, "global_step": 356011, "epoch": 2119} {"train_loss": -12.145977020263672, "global_step": 356012, "epoch": 2119} {"train_loss": -11.92846393585205, "global_step": 356013, "epoch": 2119} {"train_loss": -11.916496276855469, "global_step": 356014, "epoch": 2119} {"train_loss": -12.106151580810547, "global_step": 356015, "epoch": 2119} {"train_loss": -11.921537399291992, "global_step": 356016, "epoch": 2119} {"train_loss": -11.949361801147461, "global_step": 356017, "epoch": 2119} {"train_loss": -12.109981536865234, "global_step": 356018, "epoch": 2119} {"train_loss": -12.193059921264648, "global_step": 356019, "epoch": 2119} {"train_loss": -12.024354934692383, "global_step": 356020, "epoch": 2119} {"train_loss": -12.243175506591797, "global_step": 356021, "epoch": 2119} {"train_loss": -12.209342002868652, "global_step": 356022, "epoch": 2119} {"train_loss": -12.236213684082031, "global_step": 356023, "epoch": 2119} {"train_loss": -12.20779037475586, "global_step": 356024, "epoch": 2119} {"train_loss": -12.277315139770508, "global_step": 356025, "epoch": 2119} {"train_loss": -12.27063274383545, "global_step": 356026, "epoch": 2119} {"train_loss": -12.297791481018066, "global_step": 356027, "epoch": 2119} {"train_loss": -12.154903411865234, "global_step": 356028, "epoch": 2119} {"train_loss": -12.335489273071289, "global_step": 356029, "epoch": 2119} {"train_loss": -12.038114547729492, "global_step": 356030, "epoch": 2119} {"train_loss": -12.110490798950195, "global_step": 356031, "epoch": 2119} {"train_loss": -12.44835376739502, "global_step": 356032, "epoch": 2119} {"train_loss": -11.939472198486328, "global_step": 356033, "epoch": 2119} {"train_loss": -12.394187927246094, "global_step": 356034, "epoch": 2119} {"train_loss": -12.195110321044922, "global_step": 356035, "epoch": 2119} {"train_loss": -12.230219841003418, "global_step": 356036, "epoch": 2119} {"train_loss": -12.306916236877441, "global_step": 356037, "epoch": 2119} {"train_loss": -12.411855697631836, "global_step": 356038, "epoch": 2119} {"train_loss": -12.385149002075195, "global_step": 356039, "epoch": 2119} {"train_loss": -12.28726863861084, "global_step": 356040, "epoch": 2119} {"train_loss": -12.40328598022461, "global_step": 356041, "epoch": 2119} {"train_loss": -12.339582443237305, "global_step": 356042, "epoch": 2119} {"train_loss": -12.35276985168457, "global_step": 356043, "epoch": 2119} {"train_loss": -12.249167442321777, "global_step": 356044, "epoch": 2119} {"train_loss": -12.466909408569336, "global_step": 356045, "epoch": 2119} {"train_loss": -12.513871192932129, "global_step": 356046, "epoch": 2119} {"train_loss": -12.328315734863281, "global_step": 356047, "epoch": 2119} {"train_loss": -12.20589828491211, "global_step": 356048, "epoch": 2119} {"train_loss": -12.24521255493164, "global_step": 356049, "epoch": 2119} {"train_loss": -12.503290176391602, "global_step": 356050, "epoch": 2119} {"train_loss": -12.545547485351562, "global_step": 356051, "epoch": 2119} {"train_loss": -12.495865821838379, "global_step": 356052, "epoch": 2119} {"train_loss": -12.428129196166992, "global_step": 356053, "epoch": 2119} {"train_loss": -12.33935832977295, "global_step": 356054, "epoch": 2119} {"train_loss": -12.39528751373291, "global_step": 356055, "epoch": 2119} {"train_loss": -12.358112335205078, "global_step": 356056, "epoch": 2119} {"train_loss": -12.488990783691406, "global_step": 356057, "epoch": 2119} {"train_loss": -12.518138885498047, "global_step": 356058, "epoch": 2119} {"train_loss": -12.505776405334473, "global_step": 356059, "epoch": 2119} {"train_loss": -12.36160659790039, "global_step": 356060, "epoch": 2119} {"train_loss": -12.430611610412598, "global_step": 356061, "epoch": 2119} {"train_loss": -12.424758911132812, "global_step": 356062, "epoch": 2119} {"train_loss": -12.303388595581055, "global_step": 356063, "epoch": 2119} {"train_loss": -12.30821704864502, "global_step": 356064, "epoch": 2119} {"train_loss": -12.706932067871094, "global_step": 356065, "epoch": 2119} {"train_loss": -12.50989818572998, "global_step": 356066, "epoch": 2119} {"train_loss": -12.407410621643066, "global_step": 356067, "epoch": 2119} {"train_loss": -12.305790901184082, "global_step": 356068, "epoch": 2119} {"train_loss": -12.400872230529785, "global_step": 356069, "epoch": 2119} {"train_loss": -12.709514617919922, "global_step": 356070, "epoch": 2119} {"train_loss": -12.44090461730957, "global_step": 356071, "epoch": 2119} {"train_loss": -12.593315124511719, "global_step": 356072, "epoch": 2119} {"train_loss": -12.080926895141602, "global_step": 356073, "epoch": 2119} {"train_loss": -12.165264129638672, "global_step": 356074, "epoch": 2119} {"train_loss": -12.026058197021484, "global_step": 356075, "epoch": 2119} {"train_loss": -12.418449401855469, "global_step": 356076, "epoch": 2119} {"train_loss": -11.99975299835205, "global_step": 356077, "epoch": 2119} {"train_loss": -11.96966552734375, "global_step": 356078, "epoch": 2119} {"train_loss": -11.447941780090332, "global_step": 356079, "epoch": 2119} {"train_loss": -12.657522201538086, "global_step": 356080, "epoch": 2119} {"train_loss": -11.573282241821289, "global_step": 356081, "epoch": 2119} {"train_loss": -11.965351104736328, "global_step": 356082, "epoch": 2119} {"train_loss": -11.722766876220703, "global_step": 356083, "epoch": 2119} {"train_loss": -12.066823959350586, "global_step": 356084, "epoch": 2119} {"train_loss": -12.230377197265625, "global_step": 356085, "epoch": 2119} {"train_loss": -12.157779693603516, "global_step": 356086, "epoch": 2119} {"train_loss": -12.277776718139648, "global_step": 356087, "epoch": 2119} {"train_loss": -11.86766242980957, "global_step": 356088, "epoch": 2119} {"train_loss": -11.994699478149414, "global_step": 356089, "epoch": 2119} {"train_loss": -12.255818367004395, "global_step": 356090, "epoch": 2119} {"train_loss": -11.490360260009766, "global_step": 356091, "epoch": 2119} {"train_loss": -11.765239715576172, "global_step": 356092, "epoch": 2119} {"train_loss": -12.413646697998047, "global_step": 356093, "epoch": 2119} {"train_loss": -11.863908767700195, "global_step": 356094, "epoch": 2119} {"train_loss": -12.202978134155273, "global_step": 356095, "epoch": 2119} {"train_loss": -12.181482315063477, "global_step": 356096, "epoch": 2119} {"train_loss": -11.806699752807617, "global_step": 356097, "epoch": 2119} {"train_loss": -11.973673820495605, "global_step": 356098, "epoch": 2119} {"train_loss": -11.794130325317383, "global_step": 356099, "epoch": 2119} {"train_loss": -11.552196502685547, "global_step": 356100, "epoch": 2119} {"train_loss": -12.02865219116211, "global_step": 356101, "epoch": 2119} {"train_loss": -12.294456481933594, "global_step": 356102, "epoch": 2119} {"train_loss": -11.939882278442383, "global_step": 356103, "epoch": 2119} {"train_loss": -12.385217666625977, "global_step": 356104, "epoch": 2119} {"train_loss": -12.2001953125, "global_step": 356105, "epoch": 2119} {"train_loss": -12.40965747833252, "global_step": 356106, "epoch": 2119} {"train_loss": -12.315845489501953, "global_step": 356107, "epoch": 2119} {"train_loss": -11.637731552124023, "global_step": 356108, "epoch": 2119} {"train_loss": -12.10239028930664, "global_step": 356109, "epoch": 2119} {"train_loss": -11.460098266601562, "global_step": 356110, "epoch": 2119} {"train_loss": -11.014589309692383, "global_step": 356111, "epoch": 2119} {"train_loss": -12.393292427062988, "global_step": 356112, "epoch": 2119} {"train_loss": -11.684553146362305, "global_step": 356113, "epoch": 2119} {"train_loss": -11.210384368896484, "global_step": 356114, "epoch": 2119} {"train_loss": -12.031181335449219, "global_step": 356115, "epoch": 2119} {"train_loss": -11.079648971557617, "global_step": 356116, "epoch": 2119} {"train_loss": -10.675191879272461, "global_step": 356117, "epoch": 2119} {"train_loss": -11.966819763183594, "global_step": 356118, "epoch": 2119} {"train_loss": -9.520291328430176, "global_step": 356119, "epoch": 2119} {"train_loss": -11.533802032470703, "global_step": 356120, "epoch": 2119} {"train_loss": -10.40270709991455, "global_step": 356121, "epoch": 2119} {"train_loss": -10.79512882232666, "global_step": 356122, "epoch": 2119} {"train_loss": -11.614938735961914, "global_step": 356123, "epoch": 2119} {"train_loss": -11.219849586486816, "global_step": 356124, "epoch": 2119} {"train_loss": -11.60919189453125, "global_step": 356125, "epoch": 2119} {"train_loss": -10.07674789428711, "global_step": 356126, "epoch": 2119} {"train_loss": -11.086963653564453, "global_step": 356127, "epoch": 2119} {"train_loss": -8.725973129272461, "global_step": 356128, "epoch": 2119} {"train_loss": -11.454500198364258, "global_step": 356129, "epoch": 2119} {"train_loss": -9.849176406860352, "global_step": 356130, "epoch": 2119} {"train_loss": -11.261133193969727, "global_step": 356131, "epoch": 2119} {"train_loss": -11.316736221313477, "global_step": 356132, "epoch": 2119} {"train_loss": -11.686487197875977, "global_step": 356133, "epoch": 2119} {"train_loss": -11.13056755065918, "global_step": 356134, "epoch": 2119} {"train_loss": -11.564752578735352, "global_step": 356135, "epoch": 2119} {"train_loss": -11.40679931640625, "global_step": 356136, "epoch": 2119} {"train_loss": -11.580757141113281, "global_step": 356137, "epoch": 2119} {"train_loss": -11.403486251831055, "global_step": 356138, "epoch": 2119} {"train_loss": -11.80329704284668, "global_step": 356139, "epoch": 2119} {"train_loss": -11.712234497070312, "global_step": 356140, "epoch": 2119} {"train_loss": -11.493415832519531, "global_step": 356141, "epoch": 2119} {"train_loss": -11.729837417602539, "global_step": 356142, "epoch": 2119} {"train_loss": -11.574542045593262, "global_step": 356143, "epoch": 2119} {"train_loss": -11.541162490844727, "global_step": 356144, "epoch": 2119} {"train_loss": -12.030463218688965, "global_step": 356145, "epoch": 2119} {"train_loss": -11.830568313598633, "global_step": 356146, "epoch": 2119} {"train_loss": -11.835639953613281, "global_step": 356147, "epoch": 2119} {"train_loss": -12.183804512023926, "global_step": 356148, "epoch": 2119} {"train_loss": -12.11404800415039, "global_step": 356149, "epoch": 2119} {"train_loss": -12.029340744018555, "global_step": 356150, "epoch": 2119} {"train_loss": -12.11054801940918, "global_step": 356151, "epoch": 2119} {"train_loss": -11.575313568115234, "global_step": 356152, "epoch": 2119} {"train_loss": -12.120859146118164, "global_step": 356153, "epoch": 2119} {"train_loss": -12.104391098022461, "global_step": 356154, "epoch": 2119} {"train_loss": -11.899665832519531, "global_step": 356155, "epoch": 2119} {"train_loss": -11.809091567993164, "global_step": 356156, "epoch": 2119} {"train_loss": -12.109663009643555, "global_step": 356157, "epoch": 2119} {"train_loss": -12.399089813232422, "global_step": 356158, "epoch": 2119} {"train_loss": -11.942771605082921, "global_step": 356159, "epoch": 2119, "val_loss": 293024.3125} {"train_loss": -12.14967155456543, "global_step": 356160, "epoch": 2120} {"train_loss": -12.215536117553711, "global_step": 356161, "epoch": 2120} {"train_loss": -12.187219619750977, "global_step": 356162, "epoch": 2120} {"train_loss": -12.242774963378906, "global_step": 356163, "epoch": 2120} {"train_loss": -12.591836929321289, "global_step": 356164, "epoch": 2120} {"train_loss": -11.969954490661621, "global_step": 356165, "epoch": 2120} {"train_loss": -11.894227027893066, "global_step": 356166, "epoch": 2120} {"train_loss": -12.326367378234863, "global_step": 356167, "epoch": 2120} {"train_loss": -11.829076766967773, "global_step": 356168, "epoch": 2120} {"train_loss": -11.819269180297852, "global_step": 356169, "epoch": 2120} {"train_loss": -12.263982772827148, "global_step": 356170, "epoch": 2120} {"train_loss": -12.0409574508667, "global_step": 356171, "epoch": 2120} {"train_loss": -12.148004531860352, "global_step": 356172, "epoch": 2120} {"train_loss": -12.16871452331543, "global_step": 356173, "epoch": 2120} {"train_loss": -12.189217567443848, "global_step": 356174, "epoch": 2120} {"train_loss": -11.973597526550293, "global_step": 356175, "epoch": 2120} {"train_loss": -12.141742706298828, "global_step": 356176, "epoch": 2120} {"train_loss": -11.955824851989746, "global_step": 356177, "epoch": 2120} {"train_loss": -12.058094024658203, "global_step": 356178, "epoch": 2120} {"train_loss": -11.942158699035645, "global_step": 356179, "epoch": 2120} {"train_loss": -12.228471755981445, "global_step": 356180, "epoch": 2120} {"train_loss": -12.184608459472656, "global_step": 356181, "epoch": 2120} {"train_loss": -12.235212326049805, "global_step": 356182, "epoch": 2120} {"train_loss": -12.519933700561523, "global_step": 356183, "epoch": 2120} {"train_loss": -12.370220184326172, "global_step": 356184, "epoch": 2120} {"train_loss": -12.38328742980957, "global_step": 356185, "epoch": 2120} {"train_loss": -12.302125930786133, "global_step": 356186, "epoch": 2120} {"train_loss": -12.682266235351562, "global_step": 356187, "epoch": 2120} {"train_loss": -12.150713920593262, "global_step": 356188, "epoch": 2120} {"train_loss": -12.568437576293945, "global_step": 356189, "epoch": 2120} {"train_loss": -12.438294410705566, "global_step": 356190, "epoch": 2120} {"train_loss": -12.406198501586914, "global_step": 356191, "epoch": 2120} {"train_loss": -12.447002410888672, "global_step": 356192, "epoch": 2120} {"train_loss": -12.599428176879883, "global_step": 356193, "epoch": 2120} {"train_loss": -12.348824501037598, "global_step": 356194, "epoch": 2120} {"train_loss": -12.34814739227295, "global_step": 356195, "epoch": 2120} {"train_loss": -12.40412712097168, "global_step": 356196, "epoch": 2120} {"train_loss": -12.400070190429688, "global_step": 356197, "epoch": 2120} {"train_loss": -12.569388389587402, "global_step": 356198, "epoch": 2120} {"train_loss": -12.58735466003418, "global_step": 356199, "epoch": 2120} {"train_loss": -12.565908432006836, "global_step": 356200, "epoch": 2120} {"train_loss": -12.641718864440918, "global_step": 356201, "epoch": 2120} {"train_loss": -12.476202011108398, "global_step": 356202, "epoch": 2120} {"train_loss": -12.608654022216797, "global_step": 356203, "epoch": 2120} {"train_loss": -12.360746383666992, "global_step": 356204, "epoch": 2120} {"train_loss": -12.442073822021484, "global_step": 356205, "epoch": 2120} {"train_loss": -12.392688751220703, "global_step": 356206, "epoch": 2120} {"train_loss": -12.342153549194336, "global_step": 356207, "epoch": 2120} {"train_loss": -12.167404174804688, "global_step": 356208, "epoch": 2120} {"train_loss": -12.561633110046387, "global_step": 356209, "epoch": 2120} {"train_loss": -12.590892791748047, "global_step": 356210, "epoch": 2120} {"train_loss": -12.439876556396484, "global_step": 356211, "epoch": 2120} {"train_loss": -12.33434009552002, "global_step": 356212, "epoch": 2120} {"train_loss": -12.257372856140137, "global_step": 356213, "epoch": 2120} {"train_loss": -12.32986831665039, "global_step": 356214, "epoch": 2120} {"train_loss": -12.16148853302002, "global_step": 356215, "epoch": 2120} {"train_loss": -12.423245429992676, "global_step": 356216, "epoch": 2120} {"train_loss": -12.145078659057617, "global_step": 356217, "epoch": 2120} {"train_loss": -11.881990432739258, "global_step": 356218, "epoch": 2120} {"train_loss": -11.967588424682617, "global_step": 356219, "epoch": 2120} {"train_loss": -12.394952774047852, "global_step": 356220, "epoch": 2120} {"train_loss": -12.271151542663574, "global_step": 356221, "epoch": 2120} {"train_loss": -11.366308212280273, "global_step": 356222, "epoch": 2120} {"train_loss": -12.354842185974121, "global_step": 356223, "epoch": 2120} {"train_loss": -12.653560638427734, "global_step": 356224, "epoch": 2120} {"train_loss": -11.93810749053955, "global_step": 356225, "epoch": 2120} {"train_loss": -11.835043907165527, "global_step": 356226, "epoch": 2120} {"train_loss": -12.597705841064453, "global_step": 356227, "epoch": 2120} {"train_loss": -12.36046028137207, "global_step": 356228, "epoch": 2120} {"train_loss": -12.26038932800293, "global_step": 356229, "epoch": 2120} {"train_loss": -12.29658317565918, "global_step": 356230, "epoch": 2120} {"train_loss": -11.971929550170898, "global_step": 356231, "epoch": 2120} {"train_loss": -11.369380950927734, "global_step": 356232, "epoch": 2120} {"train_loss": -12.055569648742676, "global_step": 356233, "epoch": 2120} {"train_loss": -11.262871742248535, "global_step": 356234, "epoch": 2120} {"train_loss": -11.801279067993164, "global_step": 356235, "epoch": 2120} {"train_loss": -11.964876174926758, "global_step": 356236, "epoch": 2120} {"train_loss": -12.100593566894531, "global_step": 356237, "epoch": 2120} {"train_loss": -11.775132179260254, "global_step": 356238, "epoch": 2120} {"train_loss": -11.77601146697998, "global_step": 356239, "epoch": 2120} {"train_loss": -11.895498275756836, "global_step": 356240, "epoch": 2120} {"train_loss": -12.432720184326172, "global_step": 356241, "epoch": 2120} {"train_loss": -11.722082138061523, "global_step": 356242, "epoch": 2120} {"train_loss": -12.277618408203125, "global_step": 356243, "epoch": 2120} {"train_loss": -11.907336235046387, "global_step": 356244, "epoch": 2120} {"train_loss": -11.467279434204102, "global_step": 356245, "epoch": 2120} {"train_loss": -12.058698654174805, "global_step": 356246, "epoch": 2120} {"train_loss": -10.352532386779785, "global_step": 356247, "epoch": 2120} {"train_loss": -11.98996353149414, "global_step": 356248, "epoch": 2120} {"train_loss": -11.567264556884766, "global_step": 356249, "epoch": 2120} {"train_loss": -11.960267066955566, "global_step": 356250, "epoch": 2120} {"train_loss": -11.635685920715332, "global_step": 356251, "epoch": 2120} {"train_loss": -11.76753044128418, "global_step": 356252, "epoch": 2120} {"train_loss": -11.304081916809082, "global_step": 356253, "epoch": 2120} {"train_loss": -11.018537521362305, "global_step": 356254, "epoch": 2120} {"train_loss": -11.815900802612305, "global_step": 356255, "epoch": 2120} {"train_loss": -11.558837890625, "global_step": 356256, "epoch": 2120} {"train_loss": -12.031136512756348, "global_step": 356257, "epoch": 2120} {"train_loss": -11.669937133789062, "global_step": 356258, "epoch": 2120} {"train_loss": -12.042757034301758, "global_step": 356259, "epoch": 2120} {"train_loss": -11.642231941223145, "global_step": 356260, "epoch": 2120} {"train_loss": -12.362373352050781, "global_step": 356261, "epoch": 2120} {"train_loss": -11.916837692260742, "global_step": 356262, "epoch": 2120} {"train_loss": -12.162458419799805, "global_step": 356263, "epoch": 2120} {"train_loss": -12.137014389038086, "global_step": 356264, "epoch": 2120} {"train_loss": -11.6251220703125, "global_step": 356265, "epoch": 2120} {"train_loss": -10.757600784301758, "global_step": 356266, "epoch": 2120} {"train_loss": -11.189391136169434, "global_step": 356267, "epoch": 2120} {"train_loss": -11.814297676086426, "global_step": 356268, "epoch": 2120} {"train_loss": -12.258920669555664, "global_step": 356269, "epoch": 2120} {"train_loss": -11.57631778717041, "global_step": 356270, "epoch": 2120} {"train_loss": -12.211250305175781, "global_step": 356271, "epoch": 2120} {"train_loss": -11.175561904907227, "global_step": 356272, "epoch": 2120} {"train_loss": -11.914199829101562, "global_step": 356273, "epoch": 2120} {"train_loss": -11.111040115356445, "global_step": 356274, "epoch": 2120} {"train_loss": -11.577478408813477, "global_step": 356275, "epoch": 2120} {"train_loss": -11.145700454711914, "global_step": 356276, "epoch": 2120} {"train_loss": -11.592052459716797, "global_step": 356277, "epoch": 2120} {"train_loss": -11.202224731445312, "global_step": 356278, "epoch": 2120} {"train_loss": -11.855423927307129, "global_step": 356279, "epoch": 2120} {"train_loss": -11.193506240844727, "global_step": 356280, "epoch": 2120} {"train_loss": -11.186147689819336, "global_step": 356281, "epoch": 2120} {"train_loss": -11.590779304504395, "global_step": 356282, "epoch": 2120} {"train_loss": -11.670686721801758, "global_step": 356283, "epoch": 2120} {"train_loss": -10.864988327026367, "global_step": 356284, "epoch": 2120} {"train_loss": -12.173349380493164, "global_step": 356285, "epoch": 2120} {"train_loss": -11.251111030578613, "global_step": 356286, "epoch": 2120} {"train_loss": -11.770486831665039, "global_step": 356287, "epoch": 2120} {"train_loss": -12.216513633728027, "global_step": 356288, "epoch": 2120} {"train_loss": -11.686501502990723, "global_step": 356289, "epoch": 2120} {"train_loss": -12.256836891174316, "global_step": 356290, "epoch": 2120} {"train_loss": -11.33237075805664, "global_step": 356291, "epoch": 2120} {"train_loss": -12.327005386352539, "global_step": 356292, "epoch": 2120} {"train_loss": -11.728813171386719, "global_step": 356293, "epoch": 2120} {"train_loss": -12.211050033569336, "global_step": 356294, "epoch": 2120} {"train_loss": -12.126396179199219, "global_step": 356295, "epoch": 2120} {"train_loss": -11.847966194152832, "global_step": 356296, "epoch": 2120} {"train_loss": -12.131379127502441, "global_step": 356297, "epoch": 2120} {"train_loss": -11.971918106079102, "global_step": 356298, "epoch": 2120} {"train_loss": -12.265315055847168, "global_step": 356299, "epoch": 2120} {"train_loss": -12.157011032104492, "global_step": 356300, "epoch": 2120} {"train_loss": -11.910774230957031, "global_step": 356301, "epoch": 2120} {"train_loss": -12.222112655639648, "global_step": 356302, "epoch": 2120} {"train_loss": -12.12869644165039, "global_step": 356303, "epoch": 2120} {"train_loss": -12.312932968139648, "global_step": 356304, "epoch": 2120} {"train_loss": -12.310859680175781, "global_step": 356305, "epoch": 2120} {"train_loss": -12.138980865478516, "global_step": 356306, "epoch": 2120} {"train_loss": -12.249473571777344, "global_step": 356307, "epoch": 2120} {"train_loss": -12.166521072387695, "global_step": 356308, "epoch": 2120} {"train_loss": -12.264261245727539, "global_step": 356309, "epoch": 2120} {"train_loss": -12.503698348999023, "global_step": 356310, "epoch": 2120} {"train_loss": -12.146665573120117, "global_step": 356311, "epoch": 2120} {"train_loss": -12.530997276306152, "global_step": 356312, "epoch": 2120} {"train_loss": -12.099382400512695, "global_step": 356313, "epoch": 2120} {"train_loss": -12.354020118713379, "global_step": 356314, "epoch": 2120} {"train_loss": -12.1273193359375, "global_step": 356315, "epoch": 2120} {"train_loss": -12.351358413696289, "global_step": 356316, "epoch": 2120} {"train_loss": -11.99008846282959, "global_step": 356317, "epoch": 2120} {"train_loss": -12.379032135009766, "global_step": 356318, "epoch": 2120} {"train_loss": -12.214942932128906, "global_step": 356319, "epoch": 2120} {"train_loss": -12.272928237915039, "global_step": 356320, "epoch": 2120} {"train_loss": -12.479721069335938, "global_step": 356321, "epoch": 2120} {"train_loss": -12.531572341918945, "global_step": 356322, "epoch": 2120} {"train_loss": -12.154090881347656, "global_step": 356323, "epoch": 2120} {"train_loss": -12.495555877685547, "global_step": 356324, "epoch": 2120} {"train_loss": -12.408218383789062, "global_step": 356325, "epoch": 2120} {"train_loss": -12.519067764282227, "global_step": 356326, "epoch": 2120} {"train_loss": -12.055363904862176, "global_step": 356327, "epoch": 2120, "val_loss": 292667.3125, "train_action_mse_error": 0.7882117033004761} {"train_loss": -12.40884780883789, "global_step": 356328, "epoch": 2121} {"train_loss": -12.338327407836914, "global_step": 356329, "epoch": 2121} {"train_loss": -12.565671920776367, "global_step": 356330, "epoch": 2121} {"train_loss": -12.059761047363281, "global_step": 356331, "epoch": 2121} {"train_loss": -12.546817779541016, "global_step": 356332, "epoch": 2121} {"train_loss": -12.493303298950195, "global_step": 356333, "epoch": 2121} {"train_loss": -12.637638092041016, "global_step": 356334, "epoch": 2121} {"train_loss": -12.371862411499023, "global_step": 356335, "epoch": 2121} {"train_loss": -12.546802520751953, "global_step": 356336, "epoch": 2121} {"train_loss": -11.531688690185547, "global_step": 356337, "epoch": 2121} {"train_loss": -11.952178955078125, "global_step": 356338, "epoch": 2121} {"train_loss": -12.25605583190918, "global_step": 356339, "epoch": 2121} {"train_loss": -11.853583335876465, "global_step": 356340, "epoch": 2121} {"train_loss": -12.343254089355469, "global_step": 356341, "epoch": 2121} {"train_loss": -12.510725021362305, "global_step": 356342, "epoch": 2121} {"train_loss": -11.965919494628906, "global_step": 356343, "epoch": 2121} {"train_loss": -12.124780654907227, "global_step": 356344, "epoch": 2121} {"train_loss": -12.158899307250977, "global_step": 356345, "epoch": 2121} {"train_loss": -12.121362686157227, "global_step": 356346, "epoch": 2121} {"train_loss": -12.103357315063477, "global_step": 356347, "epoch": 2121} {"train_loss": -12.452811241149902, "global_step": 356348, "epoch": 2121} {"train_loss": -12.16574478149414, "global_step": 356349, "epoch": 2121} {"train_loss": -12.558238983154297, "global_step": 356350, "epoch": 2121} {"train_loss": -12.288506507873535, "global_step": 356351, "epoch": 2121} {"train_loss": -12.419290542602539, "global_step": 356352, "epoch": 2121} {"train_loss": -12.23632526397705, "global_step": 356353, "epoch": 2121} {"train_loss": -12.328970909118652, "global_step": 356354, "epoch": 2121} {"train_loss": -12.251588821411133, "global_step": 356355, "epoch": 2121} {"train_loss": -12.368690490722656, "global_step": 356356, "epoch": 2121} {"train_loss": -12.3966703414917, "global_step": 356357, "epoch": 2121} {"train_loss": -12.181062698364258, "global_step": 356358, "epoch": 2121} {"train_loss": -12.150995254516602, "global_step": 356359, "epoch": 2121} {"train_loss": -12.578466415405273, "global_step": 356360, "epoch": 2121} {"train_loss": -12.01905632019043, "global_step": 356361, "epoch": 2121} {"train_loss": -12.153331756591797, "global_step": 356362, "epoch": 2121} {"train_loss": -10.797586441040039, "global_step": 356363, "epoch": 2121} {"train_loss": -10.202454566955566, "global_step": 356364, "epoch": 2121} {"train_loss": -10.406957626342773, "global_step": 356365, "epoch": 2121} {"train_loss": -11.934930801391602, "global_step": 356366, "epoch": 2121} {"train_loss": -8.687957763671875, "global_step": 356367, "epoch": 2121} {"train_loss": -10.969453811645508, "global_step": 356368, "epoch": 2121} {"train_loss": -7.689467430114746, "global_step": 356369, "epoch": 2121} {"train_loss": -9.036836624145508, "global_step": 356370, "epoch": 2121} {"train_loss": -8.01315975189209, "global_step": 356371, "epoch": 2121} {"train_loss": -8.99272346496582, "global_step": 356372, "epoch": 2121} {"train_loss": -8.908493041992188, "global_step": 356373, "epoch": 2121} {"train_loss": -10.077789306640625, "global_step": 356374, "epoch": 2121} {"train_loss": -9.442983627319336, "global_step": 356375, "epoch": 2121} {"train_loss": -9.3256254196167, "global_step": 356376, "epoch": 2121} {"train_loss": -9.028634071350098, "global_step": 356377, "epoch": 2121} {"train_loss": -8.290771484375, "global_step": 356378, "epoch": 2121} {"train_loss": -9.41208553314209, "global_step": 356379, "epoch": 2121} {"train_loss": -8.398100852966309, "global_step": 356380, "epoch": 2121} {"train_loss": -8.742338180541992, "global_step": 356381, "epoch": 2121} {"train_loss": -9.752176284790039, "global_step": 356382, "epoch": 2121} {"train_loss": -8.44749641418457, "global_step": 356383, "epoch": 2121} {"train_loss": -8.320206642150879, "global_step": 356384, "epoch": 2121} {"train_loss": -8.263858795166016, "global_step": 356385, "epoch": 2121} {"train_loss": -9.790480613708496, "global_step": 356386, "epoch": 2121} {"train_loss": -9.562037467956543, "global_step": 356387, "epoch": 2121} {"train_loss": -8.335582733154297, "global_step": 356388, "epoch": 2121} {"train_loss": -8.882966995239258, "global_step": 356389, "epoch": 2121} {"train_loss": -9.915868759155273, "global_step": 356390, "epoch": 2121} {"train_loss": -10.72844123840332, "global_step": 356391, "epoch": 2121} {"train_loss": -9.466484069824219, "global_step": 356392, "epoch": 2121} {"train_loss": -10.03166675567627, "global_step": 356393, "epoch": 2121} {"train_loss": -10.434036254882812, "global_step": 356394, "epoch": 2121} {"train_loss": -9.2894287109375, "global_step": 356395, "epoch": 2121} {"train_loss": -10.545636177062988, "global_step": 356396, "epoch": 2121} {"train_loss": -10.897102355957031, "global_step": 356397, "epoch": 2121} {"train_loss": -10.725051879882812, "global_step": 356398, "epoch": 2121} {"train_loss": -10.460271835327148, "global_step": 356399, "epoch": 2121} {"train_loss": -11.111848831176758, "global_step": 356400, "epoch": 2121} {"train_loss": -11.067790985107422, "global_step": 356401, "epoch": 2121} {"train_loss": -11.206160545349121, "global_step": 356402, "epoch": 2121} {"train_loss": -9.88408088684082, "global_step": 356403, "epoch": 2121} {"train_loss": -11.523448944091797, "global_step": 356404, "epoch": 2121} {"train_loss": -11.284076690673828, "global_step": 356405, "epoch": 2121} {"train_loss": -10.75291919708252, "global_step": 356406, "epoch": 2121} {"train_loss": -11.315634727478027, "global_step": 356407, "epoch": 2121} {"train_loss": -11.839109420776367, "global_step": 356408, "epoch": 2121} {"train_loss": -11.246711730957031, "global_step": 356409, "epoch": 2121} {"train_loss": -11.164013862609863, "global_step": 356410, "epoch": 2121} {"train_loss": -11.8247709274292, "global_step": 356411, "epoch": 2121} {"train_loss": -11.228875160217285, "global_step": 356412, "epoch": 2121} {"train_loss": -11.057331085205078, "global_step": 356413, "epoch": 2121} {"train_loss": -11.776313781738281, "global_step": 356414, "epoch": 2121} {"train_loss": -11.064115524291992, "global_step": 356415, "epoch": 2121} {"train_loss": -11.411149978637695, "global_step": 356416, "epoch": 2121} {"train_loss": -11.582231521606445, "global_step": 356417, "epoch": 2121} {"train_loss": -11.606096267700195, "global_step": 356418, "epoch": 2121} {"train_loss": -11.481437683105469, "global_step": 356419, "epoch": 2121} {"train_loss": -11.959487915039062, "global_step": 356420, "epoch": 2121} {"train_loss": -11.56991958618164, "global_step": 356421, "epoch": 2121} {"train_loss": -11.65999984741211, "global_step": 356422, "epoch": 2121} {"train_loss": -11.836199760437012, "global_step": 356423, "epoch": 2121} {"train_loss": -11.831110000610352, "global_step": 356424, "epoch": 2121} {"train_loss": -11.824394226074219, "global_step": 356425, "epoch": 2121} {"train_loss": -11.87660026550293, "global_step": 356426, "epoch": 2121} {"train_loss": -11.8629150390625, "global_step": 356427, "epoch": 2121} {"train_loss": -12.033109664916992, "global_step": 356428, "epoch": 2121} {"train_loss": -12.005097389221191, "global_step": 356429, "epoch": 2121} {"train_loss": -12.05803108215332, "global_step": 356430, "epoch": 2121} {"train_loss": -12.104532241821289, "global_step": 356431, "epoch": 2121} {"train_loss": -12.226343154907227, "global_step": 356432, "epoch": 2121} {"train_loss": -11.961162567138672, "global_step": 356433, "epoch": 2121} {"train_loss": -12.068251609802246, "global_step": 356434, "epoch": 2121} {"train_loss": -12.198577880859375, "global_step": 356435, "epoch": 2121} {"train_loss": -12.225926399230957, "global_step": 356436, "epoch": 2121} {"train_loss": -12.13951587677002, "global_step": 356437, "epoch": 2121} {"train_loss": -12.082584381103516, "global_step": 356438, "epoch": 2121} {"train_loss": -11.993093490600586, "global_step": 356439, "epoch": 2121} {"train_loss": -12.1851806640625, "global_step": 356440, "epoch": 2121} {"train_loss": -12.18918514251709, "global_step": 356441, "epoch": 2121} {"train_loss": -12.130271911621094, "global_step": 356442, "epoch": 2121} {"train_loss": -12.167779922485352, "global_step": 356443, "epoch": 2121} {"train_loss": -12.080632209777832, "global_step": 356444, "epoch": 2121} {"train_loss": -12.164499282836914, "global_step": 356445, "epoch": 2121} {"train_loss": -12.273370742797852, "global_step": 356446, "epoch": 2121} {"train_loss": -12.271892547607422, "global_step": 356447, "epoch": 2121} {"train_loss": -12.27565860748291, "global_step": 356448, "epoch": 2121} {"train_loss": -12.156722068786621, "global_step": 356449, "epoch": 2121} {"train_loss": -12.335102081298828, "global_step": 356450, "epoch": 2121} {"train_loss": -12.358989715576172, "global_step": 356451, "epoch": 2121} {"train_loss": -12.391643524169922, "global_step": 356452, "epoch": 2121} {"train_loss": -12.154356956481934, "global_step": 356453, "epoch": 2121} {"train_loss": -12.163955688476562, "global_step": 356454, "epoch": 2121} {"train_loss": -12.252880096435547, "global_step": 356455, "epoch": 2121} {"train_loss": -12.41047477722168, "global_step": 356456, "epoch": 2121} {"train_loss": -12.474782943725586, "global_step": 356457, "epoch": 2121} {"train_loss": -12.289905548095703, "global_step": 356458, "epoch": 2121} {"train_loss": -12.285701751708984, "global_step": 356459, "epoch": 2121} {"train_loss": -12.446192741394043, "global_step": 356460, "epoch": 2121} {"train_loss": -12.365762710571289, "global_step": 356461, "epoch": 2121} {"train_loss": -12.310997009277344, "global_step": 356462, "epoch": 2121} {"train_loss": -12.523099899291992, "global_step": 356463, "epoch": 2121} {"train_loss": -12.321216583251953, "global_step": 356464, "epoch": 2121} {"train_loss": -12.45118236541748, "global_step": 356465, "epoch": 2121} {"train_loss": -12.422821044921875, "global_step": 356466, "epoch": 2121} {"train_loss": -12.41686725616455, "global_step": 356467, "epoch": 2121} {"train_loss": -12.46209716796875, "global_step": 356468, "epoch": 2121} {"train_loss": -12.521631240844727, "global_step": 356469, "epoch": 2121} {"train_loss": -12.4014892578125, "global_step": 356470, "epoch": 2121} {"train_loss": -12.40603256225586, "global_step": 356471, "epoch": 2121} {"train_loss": -12.343025207519531, "global_step": 356472, "epoch": 2121} {"train_loss": -12.614816665649414, "global_step": 356473, "epoch": 2121} {"train_loss": -12.309582710266113, "global_step": 356474, "epoch": 2121} {"train_loss": -12.560543060302734, "global_step": 356475, "epoch": 2121} {"train_loss": -12.475055694580078, "global_step": 356476, "epoch": 2121} {"train_loss": -12.407115936279297, "global_step": 356477, "epoch": 2121} {"train_loss": -12.63235092163086, "global_step": 356478, "epoch": 2121} {"train_loss": -12.553340911865234, "global_step": 356479, "epoch": 2121} {"train_loss": -12.6642484664917, "global_step": 356480, "epoch": 2121} {"train_loss": -12.341318130493164, "global_step": 356481, "epoch": 2121} {"train_loss": -12.611817359924316, "global_step": 356482, "epoch": 2121} {"train_loss": -12.361129760742188, "global_step": 356483, "epoch": 2121} {"train_loss": -12.510663986206055, "global_step": 356484, "epoch": 2121} {"train_loss": -12.325052261352539, "global_step": 356485, "epoch": 2121} {"train_loss": -12.484394073486328, "global_step": 356486, "epoch": 2121} {"train_loss": -12.617280006408691, "global_step": 356487, "epoch": 2121} {"train_loss": -12.500268936157227, "global_step": 356488, "epoch": 2121} {"train_loss": -12.365817070007324, "global_step": 356489, "epoch": 2121} {"train_loss": -12.451260566711426, "global_step": 356490, "epoch": 2121} {"train_loss": -12.57902717590332, "global_step": 356491, "epoch": 2121} {"train_loss": -12.463066101074219, "global_step": 356492, "epoch": 2121} {"train_loss": -12.572083473205566, "global_step": 356493, "epoch": 2121} {"train_loss": -12.679967880249023, "global_step": 356494, "epoch": 2121} {"train_loss": -11.55241120429266, "global_step": 356495, "epoch": 2121, "val_loss": 291661.71875} {"train_loss": -12.469736099243164, "global_step": 356496, "epoch": 2122} {"train_loss": -12.323525428771973, "global_step": 356497, "epoch": 2122} {"train_loss": -12.418354034423828, "global_step": 356498, "epoch": 2122} {"train_loss": -12.795269012451172, "global_step": 356499, "epoch": 2122} {"train_loss": -12.656258583068848, "global_step": 356500, "epoch": 2122} {"train_loss": -12.583324432373047, "global_step": 356501, "epoch": 2122} {"train_loss": -12.509196281433105, "global_step": 356502, "epoch": 2122} {"train_loss": -12.66923713684082, "global_step": 356503, "epoch": 2122} {"train_loss": -12.44123649597168, "global_step": 356504, "epoch": 2122} {"train_loss": -12.152082443237305, "global_step": 356505, "epoch": 2122} {"train_loss": -11.837101936340332, "global_step": 356506, "epoch": 2122} {"train_loss": -12.76124382019043, "global_step": 356507, "epoch": 2122} {"train_loss": -12.451330184936523, "global_step": 356508, "epoch": 2122} {"train_loss": -12.171070098876953, "global_step": 356509, "epoch": 2122} {"train_loss": -12.191903114318848, "global_step": 356510, "epoch": 2122} {"train_loss": -12.680001258850098, "global_step": 356511, "epoch": 2122} {"train_loss": -12.249604225158691, "global_step": 356512, "epoch": 2122} {"train_loss": -11.772966384887695, "global_step": 356513, "epoch": 2122} {"train_loss": -11.951583862304688, "global_step": 356514, "epoch": 2122} {"train_loss": -12.408275604248047, "global_step": 356515, "epoch": 2122} {"train_loss": -12.433555603027344, "global_step": 356516, "epoch": 2122} {"train_loss": -12.50997543334961, "global_step": 356517, "epoch": 2122} {"train_loss": -12.151354789733887, "global_step": 356518, "epoch": 2122} {"train_loss": -12.559898376464844, "global_step": 356519, "epoch": 2122} {"train_loss": -12.397623062133789, "global_step": 356520, "epoch": 2122} {"train_loss": -12.672015190124512, "global_step": 356521, "epoch": 2122} {"train_loss": -12.018549919128418, "global_step": 356522, "epoch": 2122} {"train_loss": -12.049108505249023, "global_step": 356523, "epoch": 2122} {"train_loss": -12.497674942016602, "global_step": 356524, "epoch": 2122} {"train_loss": -12.439165115356445, "global_step": 356525, "epoch": 2122} {"train_loss": -11.560163497924805, "global_step": 356526, "epoch": 2122} {"train_loss": -10.469422340393066, "global_step": 356527, "epoch": 2122} {"train_loss": -12.02872085571289, "global_step": 356528, "epoch": 2122} {"train_loss": -12.379823684692383, "global_step": 356529, "epoch": 2122} {"train_loss": -10.872657775878906, "global_step": 356530, "epoch": 2122} {"train_loss": -11.895079612731934, "global_step": 356531, "epoch": 2122} {"train_loss": -12.1971435546875, "global_step": 356532, "epoch": 2122} {"train_loss": -11.668625831604004, "global_step": 356533, "epoch": 2122} {"train_loss": -12.266122817993164, "global_step": 356534, "epoch": 2122} {"train_loss": -12.628610610961914, "global_step": 356535, "epoch": 2122} {"train_loss": -12.028682708740234, "global_step": 356536, "epoch": 2122} {"train_loss": -12.338825225830078, "global_step": 356537, "epoch": 2122} {"train_loss": -12.516348838806152, "global_step": 356538, "epoch": 2122} {"train_loss": -11.736815452575684, "global_step": 356539, "epoch": 2122} {"train_loss": -11.526926040649414, "global_step": 356540, "epoch": 2122} {"train_loss": -12.479231834411621, "global_step": 356541, "epoch": 2122} {"train_loss": -12.006921768188477, "global_step": 356542, "epoch": 2122} {"train_loss": -11.771835327148438, "global_step": 356543, "epoch": 2122} {"train_loss": -11.919219017028809, "global_step": 356544, "epoch": 2122} {"train_loss": -11.91515827178955, "global_step": 356545, "epoch": 2122} {"train_loss": -11.223895072937012, "global_step": 356546, "epoch": 2122} {"train_loss": -12.184707641601562, "global_step": 356547, "epoch": 2122} {"train_loss": -11.697114944458008, "global_step": 356548, "epoch": 2122} {"train_loss": -10.482088088989258, "global_step": 356549, "epoch": 2122} {"train_loss": -11.7080078125, "global_step": 356550, "epoch": 2122} {"train_loss": -11.421432495117188, "global_step": 356551, "epoch": 2122} {"train_loss": -9.862333297729492, "global_step": 356552, "epoch": 2122} {"train_loss": -10.73193073272705, "global_step": 356553, "epoch": 2122} {"train_loss": -7.842606544494629, "global_step": 356554, "epoch": 2122} {"train_loss": -7.971785545349121, "global_step": 356555, "epoch": 2122} {"train_loss": -8.808603286743164, "global_step": 356556, "epoch": 2122} {"train_loss": -8.244409561157227, "global_step": 356557, "epoch": 2122} {"train_loss": -9.766749382019043, "global_step": 356558, "epoch": 2122} {"train_loss": -10.48472785949707, "global_step": 356559, "epoch": 2122} {"train_loss": -8.974019050598145, "global_step": 356560, "epoch": 2122} {"train_loss": -10.881912231445312, "global_step": 356561, "epoch": 2122} {"train_loss": -9.870626449584961, "global_step": 356562, "epoch": 2122} {"train_loss": -9.331008911132812, "global_step": 356563, "epoch": 2122} {"train_loss": -11.056621551513672, "global_step": 356564, "epoch": 2122} {"train_loss": -11.224132537841797, "global_step": 356565, "epoch": 2122} {"train_loss": -10.90346908569336, "global_step": 356566, "epoch": 2122} {"train_loss": -10.961647033691406, "global_step": 356567, "epoch": 2122} {"train_loss": -11.001178741455078, "global_step": 356568, "epoch": 2122} {"train_loss": -11.271082878112793, "global_step": 356569, "epoch": 2122} {"train_loss": -11.211787223815918, "global_step": 356570, "epoch": 2122} {"train_loss": -11.503242492675781, "global_step": 356571, "epoch": 2122} {"train_loss": -11.284369468688965, "global_step": 356572, "epoch": 2122} {"train_loss": -11.424535751342773, "global_step": 356573, "epoch": 2122} {"train_loss": -10.847162246704102, "global_step": 356574, "epoch": 2122} {"train_loss": -11.093780517578125, "global_step": 356575, "epoch": 2122} {"train_loss": -10.609567642211914, "global_step": 356576, "epoch": 2122} {"train_loss": -11.230562210083008, "global_step": 356577, "epoch": 2122} {"train_loss": -10.598047256469727, "global_step": 356578, "epoch": 2122} {"train_loss": -11.48987102508545, "global_step": 356579, "epoch": 2122} {"train_loss": -11.161523818969727, "global_step": 356580, "epoch": 2122} {"train_loss": -11.911859512329102, "global_step": 356581, "epoch": 2122} {"train_loss": -11.538778305053711, "global_step": 356582, "epoch": 2122} {"train_loss": -11.577526092529297, "global_step": 356583, "epoch": 2122} {"train_loss": -11.520718574523926, "global_step": 356584, "epoch": 2122} {"train_loss": -11.804264068603516, "global_step": 356585, "epoch": 2122} {"train_loss": -11.735610961914062, "global_step": 356586, "epoch": 2122} {"train_loss": -11.995926856994629, "global_step": 356587, "epoch": 2122} {"train_loss": -11.547904968261719, "global_step": 356588, "epoch": 2122} {"train_loss": -11.6364107131958, "global_step": 356589, "epoch": 2122} {"train_loss": -11.85139274597168, "global_step": 356590, "epoch": 2122} {"train_loss": -11.718767166137695, "global_step": 356591, "epoch": 2122} {"train_loss": -11.779796600341797, "global_step": 356592, "epoch": 2122} {"train_loss": -11.729033470153809, "global_step": 356593, "epoch": 2122} {"train_loss": -11.476608276367188, "global_step": 356594, "epoch": 2122} {"train_loss": -11.945690155029297, "global_step": 356595, "epoch": 2122} {"train_loss": -11.57129955291748, "global_step": 356596, "epoch": 2122} {"train_loss": -11.729702949523926, "global_step": 356597, "epoch": 2122} {"train_loss": -11.845697402954102, "global_step": 356598, "epoch": 2122} {"train_loss": -11.54928970336914, "global_step": 356599, "epoch": 2122} {"train_loss": -12.100005149841309, "global_step": 356600, "epoch": 2122} {"train_loss": -11.698001861572266, "global_step": 356601, "epoch": 2122} {"train_loss": -11.93767261505127, "global_step": 356602, "epoch": 2122} {"train_loss": -11.700821876525879, "global_step": 356603, "epoch": 2122} {"train_loss": -11.865947723388672, "global_step": 356604, "epoch": 2122} {"train_loss": -11.824031829833984, "global_step": 356605, "epoch": 2122} {"train_loss": -12.14940357208252, "global_step": 356606, "epoch": 2122} {"train_loss": -11.938413619995117, "global_step": 356607, "epoch": 2122} {"train_loss": -11.86892318725586, "global_step": 356608, "epoch": 2122} {"train_loss": -12.222492218017578, "global_step": 356609, "epoch": 2122} {"train_loss": -12.124605178833008, "global_step": 356610, "epoch": 2122} {"train_loss": -12.206504821777344, "global_step": 356611, "epoch": 2122} {"train_loss": -12.160290718078613, "global_step": 356612, "epoch": 2122} {"train_loss": -12.017965316772461, "global_step": 356613, "epoch": 2122} {"train_loss": -12.125062942504883, "global_step": 356614, "epoch": 2122} {"train_loss": -12.34077262878418, "global_step": 356615, "epoch": 2122} {"train_loss": -12.346920013427734, "global_step": 356616, "epoch": 2122} {"train_loss": -12.290811538696289, "global_step": 356617, "epoch": 2122} {"train_loss": -12.36905574798584, "global_step": 356618, "epoch": 2122} {"train_loss": -12.388423919677734, "global_step": 356619, "epoch": 2122} {"train_loss": -12.462803840637207, "global_step": 356620, "epoch": 2122} {"train_loss": -12.341118812561035, "global_step": 356621, "epoch": 2122} {"train_loss": -12.336604118347168, "global_step": 356622, "epoch": 2122} {"train_loss": -12.153701782226562, "global_step": 356623, "epoch": 2122} {"train_loss": -12.462581634521484, "global_step": 356624, "epoch": 2122} {"train_loss": -12.38674545288086, "global_step": 356625, "epoch": 2122} {"train_loss": -12.065057754516602, "global_step": 356626, "epoch": 2122} {"train_loss": -12.454207420349121, "global_step": 356627, "epoch": 2122} {"train_loss": -12.38193130493164, "global_step": 356628, "epoch": 2122} {"train_loss": -12.38563346862793, "global_step": 356629, "epoch": 2122} {"train_loss": -12.313972473144531, "global_step": 356630, "epoch": 2122} {"train_loss": -12.38033390045166, "global_step": 356631, "epoch": 2122} {"train_loss": -12.20706844329834, "global_step": 356632, "epoch": 2122} {"train_loss": -12.59576416015625, "global_step": 356633, "epoch": 2122} {"train_loss": -12.498952865600586, "global_step": 356634, "epoch": 2122} {"train_loss": -12.288164138793945, "global_step": 356635, "epoch": 2122} {"train_loss": -12.392621040344238, "global_step": 356636, "epoch": 2122} {"train_loss": -12.438316345214844, "global_step": 356637, "epoch": 2122} {"train_loss": -12.603107452392578, "global_step": 356638, "epoch": 2122} {"train_loss": -12.600054740905762, "global_step": 356639, "epoch": 2122} {"train_loss": -12.572664260864258, "global_step": 356640, "epoch": 2122} {"train_loss": -12.497785568237305, "global_step": 356641, "epoch": 2122} {"train_loss": -12.435640335083008, "global_step": 356642, "epoch": 2122} {"train_loss": -12.540773391723633, "global_step": 356643, "epoch": 2122} {"train_loss": -12.558112144470215, "global_step": 356644, "epoch": 2122} {"train_loss": -12.548306465148926, "global_step": 356645, "epoch": 2122} {"train_loss": -12.171073913574219, "global_step": 356646, "epoch": 2122} {"train_loss": -12.541421890258789, "global_step": 356647, "epoch": 2122} {"train_loss": -12.429708480834961, "global_step": 356648, "epoch": 2122} {"train_loss": -12.449273109436035, "global_step": 356649, "epoch": 2122} {"train_loss": -12.476187705993652, "global_step": 356650, "epoch": 2122} {"train_loss": -12.639511108398438, "global_step": 356651, "epoch": 2122} {"train_loss": -12.59367847442627, "global_step": 356652, "epoch": 2122} {"train_loss": -12.611381530761719, "global_step": 356653, "epoch": 2122} {"train_loss": -12.664412498474121, "global_step": 356654, "epoch": 2122} {"train_loss": -12.706865310668945, "global_step": 356655, "epoch": 2122} {"train_loss": -12.664546966552734, "global_step": 356656, "epoch": 2122} {"train_loss": -12.577301025390625, "global_step": 356657, "epoch": 2122} {"train_loss": -12.896392822265625, "global_step": 356658, "epoch": 2122} {"train_loss": -12.574420928955078, "global_step": 356659, "epoch": 2122} {"train_loss": -12.632890701293945, "global_step": 356660, "epoch": 2122} {"train_loss": -12.658368110656738, "global_step": 356661, "epoch": 2122} {"train_loss": -12.346120834350586, "global_step": 356662, "epoch": 2122} {"train_loss": -11.86023573648362, "global_step": 356663, "epoch": 2122, "val_loss": 288538.09375} {"train_loss": -12.695545196533203, "global_step": 356664, "epoch": 2123} {"train_loss": -11.924877166748047, "global_step": 356665, "epoch": 2123} {"train_loss": -11.622061729431152, "global_step": 356666, "epoch": 2123} {"train_loss": -12.216920852661133, "global_step": 356667, "epoch": 2123} {"train_loss": -12.08848762512207, "global_step": 356668, "epoch": 2123} {"train_loss": -11.65325927734375, "global_step": 356669, "epoch": 2123} {"train_loss": -12.002599716186523, "global_step": 356670, "epoch": 2123} {"train_loss": -11.961505889892578, "global_step": 356671, "epoch": 2123} {"train_loss": -12.41749382019043, "global_step": 356672, "epoch": 2123} {"train_loss": -12.313684463500977, "global_step": 356673, "epoch": 2123} {"train_loss": -12.399818420410156, "global_step": 356674, "epoch": 2123} {"train_loss": -12.270529747009277, "global_step": 356675, "epoch": 2123} {"train_loss": -12.171123504638672, "global_step": 356676, "epoch": 2123} {"train_loss": -12.450761795043945, "global_step": 356677, "epoch": 2123} {"train_loss": -12.551153182983398, "global_step": 356678, "epoch": 2123} {"train_loss": -12.503976821899414, "global_step": 356679, "epoch": 2123} {"train_loss": -11.941396713256836, "global_step": 356680, "epoch": 2123} {"train_loss": -12.099692344665527, "global_step": 356681, "epoch": 2123} {"train_loss": -12.115495681762695, "global_step": 356682, "epoch": 2123} {"train_loss": -12.409466743469238, "global_step": 356683, "epoch": 2123} {"train_loss": -11.606467247009277, "global_step": 356684, "epoch": 2123} {"train_loss": -11.887674331665039, "global_step": 356685, "epoch": 2123} {"train_loss": -12.366511344909668, "global_step": 356686, "epoch": 2123} {"train_loss": -11.928220748901367, "global_step": 356687, "epoch": 2123} {"train_loss": -12.068503379821777, "global_step": 356688, "epoch": 2123} {"train_loss": -12.235940933227539, "global_step": 356689, "epoch": 2123} {"train_loss": -12.379532814025879, "global_step": 356690, "epoch": 2123} {"train_loss": -11.856477737426758, "global_step": 356691, "epoch": 2123} {"train_loss": -11.99946403503418, "global_step": 356692, "epoch": 2123} {"train_loss": -12.088922500610352, "global_step": 356693, "epoch": 2123} {"train_loss": -10.61117935180664, "global_step": 356694, "epoch": 2123} {"train_loss": -11.375380516052246, "global_step": 356695, "epoch": 2123} {"train_loss": -11.868673324584961, "global_step": 356696, "epoch": 2123} {"train_loss": -10.57344913482666, "global_step": 356697, "epoch": 2123} {"train_loss": -10.408194541931152, "global_step": 356698, "epoch": 2123} {"train_loss": -10.250179290771484, "global_step": 356699, "epoch": 2123} {"train_loss": -10.180841445922852, "global_step": 356700, "epoch": 2123} {"train_loss": -10.835673332214355, "global_step": 356701, "epoch": 2123} {"train_loss": -11.440180778503418, "global_step": 356702, "epoch": 2123} {"train_loss": -9.510560989379883, "global_step": 356703, "epoch": 2123} {"train_loss": -11.626120567321777, "global_step": 356704, "epoch": 2123} {"train_loss": -9.651281356811523, "global_step": 356705, "epoch": 2123} {"train_loss": -11.440473556518555, "global_step": 356706, "epoch": 2123} {"train_loss": -9.21982192993164, "global_step": 356707, "epoch": 2123} {"train_loss": -8.728093147277832, "global_step": 356708, "epoch": 2123} {"train_loss": -9.752655029296875, "global_step": 356709, "epoch": 2123} {"train_loss": -9.9583740234375, "global_step": 356710, "epoch": 2123} {"train_loss": -10.269319534301758, "global_step": 356711, "epoch": 2123} {"train_loss": -9.243669509887695, "global_step": 356712, "epoch": 2123} {"train_loss": -9.649665832519531, "global_step": 356713, "epoch": 2123} {"train_loss": -9.577817916870117, "global_step": 356714, "epoch": 2123} {"train_loss": -11.234375, "global_step": 356715, "epoch": 2123} {"train_loss": -9.724433898925781, "global_step": 356716, "epoch": 2123} {"train_loss": -11.272753715515137, "global_step": 356717, "epoch": 2123} {"train_loss": -10.497936248779297, "global_step": 356718, "epoch": 2123} {"train_loss": -10.198701858520508, "global_step": 356719, "epoch": 2123} {"train_loss": -11.31592082977295, "global_step": 356720, "epoch": 2123} {"train_loss": -10.821956634521484, "global_step": 356721, "epoch": 2123} {"train_loss": -11.072625160217285, "global_step": 356722, "epoch": 2123} {"train_loss": -11.473198890686035, "global_step": 356723, "epoch": 2123} {"train_loss": -11.735594749450684, "global_step": 356724, "epoch": 2123} {"train_loss": -11.72092342376709, "global_step": 356725, "epoch": 2123} {"train_loss": -11.486299514770508, "global_step": 356726, "epoch": 2123} {"train_loss": -11.842199325561523, "global_step": 356727, "epoch": 2123} {"train_loss": -11.994353294372559, "global_step": 356728, "epoch": 2123} {"train_loss": -11.49128532409668, "global_step": 356729, "epoch": 2123} {"train_loss": -11.99255084991455, "global_step": 356730, "epoch": 2123} {"train_loss": -12.100269317626953, "global_step": 356731, "epoch": 2123} {"train_loss": -11.70029067993164, "global_step": 356732, "epoch": 2123} {"train_loss": -12.048235893249512, "global_step": 356733, "epoch": 2123} {"train_loss": -12.297690391540527, "global_step": 356734, "epoch": 2123} {"train_loss": -11.31867790222168, "global_step": 356735, "epoch": 2123} {"train_loss": -12.026479721069336, "global_step": 356736, "epoch": 2123} {"train_loss": -11.898308753967285, "global_step": 356737, "epoch": 2123} {"train_loss": -12.149015426635742, "global_step": 356738, "epoch": 2123} {"train_loss": -11.928326606750488, "global_step": 356739, "epoch": 2123} {"train_loss": -11.766412734985352, "global_step": 356740, "epoch": 2123} {"train_loss": -12.01511287689209, "global_step": 356741, "epoch": 2123} {"train_loss": -12.141420364379883, "global_step": 356742, "epoch": 2123} {"train_loss": -11.952052116394043, "global_step": 356743, "epoch": 2123} {"train_loss": -12.029727935791016, "global_step": 356744, "epoch": 2123} {"train_loss": -11.99517822265625, "global_step": 356745, "epoch": 2123} {"train_loss": -12.256673812866211, "global_step": 356746, "epoch": 2123} {"train_loss": -11.953165054321289, "global_step": 356747, "epoch": 2123} {"train_loss": -12.039604187011719, "global_step": 356748, "epoch": 2123} {"train_loss": -12.278523445129395, "global_step": 356749, "epoch": 2123} {"train_loss": -11.881363868713379, "global_step": 356750, "epoch": 2123} {"train_loss": -12.310076713562012, "global_step": 356751, "epoch": 2123} {"train_loss": -12.3277587890625, "global_step": 356752, "epoch": 2123} {"train_loss": -12.175552368164062, "global_step": 356753, "epoch": 2123} {"train_loss": -12.095602035522461, "global_step": 356754, "epoch": 2123} {"train_loss": -12.229314804077148, "global_step": 356755, "epoch": 2123} {"train_loss": -12.218679428100586, "global_step": 356756, "epoch": 2123} {"train_loss": -12.022758483886719, "global_step": 356757, "epoch": 2123} {"train_loss": -12.46049976348877, "global_step": 356758, "epoch": 2123} {"train_loss": -12.126852035522461, "global_step": 356759, "epoch": 2123} {"train_loss": -11.937185287475586, "global_step": 356760, "epoch": 2123} {"train_loss": -12.277316093444824, "global_step": 356761, "epoch": 2123} {"train_loss": -12.111183166503906, "global_step": 356762, "epoch": 2123} {"train_loss": -12.091466903686523, "global_step": 356763, "epoch": 2123} {"train_loss": -12.244587898254395, "global_step": 356764, "epoch": 2123} {"train_loss": -12.171628952026367, "global_step": 356765, "epoch": 2123} {"train_loss": -12.365423202514648, "global_step": 356766, "epoch": 2123} {"train_loss": -12.405012130737305, "global_step": 356767, "epoch": 2123} {"train_loss": -12.37687873840332, "global_step": 356768, "epoch": 2123} {"train_loss": -12.123044967651367, "global_step": 356769, "epoch": 2123} {"train_loss": -12.229435920715332, "global_step": 356770, "epoch": 2123} {"train_loss": -12.263887405395508, "global_step": 356771, "epoch": 2123} {"train_loss": -12.259676933288574, "global_step": 356772, "epoch": 2123} {"train_loss": -12.465816497802734, "global_step": 356773, "epoch": 2123} {"train_loss": -12.389825820922852, "global_step": 356774, "epoch": 2123} {"train_loss": -12.364660263061523, "global_step": 356775, "epoch": 2123} {"train_loss": -12.315775871276855, "global_step": 356776, "epoch": 2123} {"train_loss": -12.322347640991211, "global_step": 356777, "epoch": 2123} {"train_loss": -11.73127555847168, "global_step": 356778, "epoch": 2123} {"train_loss": -12.470399856567383, "global_step": 356779, "epoch": 2123} {"train_loss": -12.04732894897461, "global_step": 356780, "epoch": 2123} {"train_loss": -12.291353225708008, "global_step": 356781, "epoch": 2123} {"train_loss": -12.077502250671387, "global_step": 356782, "epoch": 2123} {"train_loss": -12.250861167907715, "global_step": 356783, "epoch": 2123} {"train_loss": -12.224823951721191, "global_step": 356784, "epoch": 2123} {"train_loss": -12.326656341552734, "global_step": 356785, "epoch": 2123} {"train_loss": -11.98984146118164, "global_step": 356786, "epoch": 2123} {"train_loss": -12.436817169189453, "global_step": 356787, "epoch": 2123} {"train_loss": -12.267510414123535, "global_step": 356788, "epoch": 2123} {"train_loss": -12.02292251586914, "global_step": 356789, "epoch": 2123} {"train_loss": -12.113346099853516, "global_step": 356790, "epoch": 2123} {"train_loss": -12.018379211425781, "global_step": 356791, "epoch": 2123} {"train_loss": -12.0186185836792, "global_step": 356792, "epoch": 2123} {"train_loss": -10.394600868225098, "global_step": 356793, "epoch": 2123} {"train_loss": -12.206799507141113, "global_step": 356794, "epoch": 2123} {"train_loss": -12.242300033569336, "global_step": 356795, "epoch": 2123} {"train_loss": -12.293388366699219, "global_step": 356796, "epoch": 2123} {"train_loss": -12.05634880065918, "global_step": 356797, "epoch": 2123} {"train_loss": -11.811790466308594, "global_step": 356798, "epoch": 2123} {"train_loss": -12.193970680236816, "global_step": 356799, "epoch": 2123} {"train_loss": -11.99941635131836, "global_step": 356800, "epoch": 2123} {"train_loss": -11.814697265625, "global_step": 356801, "epoch": 2123} {"train_loss": -12.069419860839844, "global_step": 356802, "epoch": 2123} {"train_loss": -11.424325942993164, "global_step": 356803, "epoch": 2123} {"train_loss": -12.147216796875, "global_step": 356804, "epoch": 2123} {"train_loss": -11.953561782836914, "global_step": 356805, "epoch": 2123} {"train_loss": -11.861703872680664, "global_step": 356806, "epoch": 2123} {"train_loss": -11.946837425231934, "global_step": 356807, "epoch": 2123} {"train_loss": -11.899869918823242, "global_step": 356808, "epoch": 2123} {"train_loss": -12.191012382507324, "global_step": 356809, "epoch": 2123} {"train_loss": -12.288639068603516, "global_step": 356810, "epoch": 2123} {"train_loss": -11.841432571411133, "global_step": 356811, "epoch": 2123} {"train_loss": -10.658994674682617, "global_step": 356812, "epoch": 2123} {"train_loss": -11.483804702758789, "global_step": 356813, "epoch": 2123} {"train_loss": -11.57542610168457, "global_step": 356814, "epoch": 2123} {"train_loss": -11.954878807067871, "global_step": 356815, "epoch": 2123} {"train_loss": -10.884876251220703, "global_step": 356816, "epoch": 2123} {"train_loss": -11.197705268859863, "global_step": 356817, "epoch": 2123} {"train_loss": -11.29052734375, "global_step": 356818, "epoch": 2123} {"train_loss": -11.113462448120117, "global_step": 356819, "epoch": 2123} {"train_loss": -11.281089782714844, "global_step": 356820, "epoch": 2123} {"train_loss": -12.055849075317383, "global_step": 356821, "epoch": 2123} {"train_loss": -11.498102188110352, "global_step": 356822, "epoch": 2123} {"train_loss": -11.292160987854004, "global_step": 356823, "epoch": 2123} {"train_loss": -10.840787887573242, "global_step": 356824, "epoch": 2123} {"train_loss": -11.917981147766113, "global_step": 356825, "epoch": 2123} {"train_loss": -11.673763275146484, "global_step": 356826, "epoch": 2123} {"train_loss": -11.470352172851562, "global_step": 356827, "epoch": 2123} {"train_loss": -10.946439743041992, "global_step": 356828, "epoch": 2123} {"train_loss": -12.062779426574707, "global_step": 356829, "epoch": 2123} {"train_loss": -11.445096015930176, "global_step": 356830, "epoch": 2123} {"train_loss": -11.716004524912153, "global_step": 356831, "epoch": 2123, "val_loss": 294507.90625} {"train_loss": -11.87553596496582, "global_step": 356832, "epoch": 2124} {"train_loss": -11.679559707641602, "global_step": 356833, "epoch": 2124} {"train_loss": -11.882124900817871, "global_step": 356834, "epoch": 2124} {"train_loss": -11.091546058654785, "global_step": 356835, "epoch": 2124} {"train_loss": -11.87626838684082, "global_step": 356836, "epoch": 2124} {"train_loss": -10.612445831298828, "global_step": 356837, "epoch": 2124} {"train_loss": -11.401542663574219, "global_step": 356838, "epoch": 2124} {"train_loss": -11.324348449707031, "global_step": 356839, "epoch": 2124} {"train_loss": -11.605890274047852, "global_step": 356840, "epoch": 2124} {"train_loss": -10.9910888671875, "global_step": 356841, "epoch": 2124} {"train_loss": -11.913230895996094, "global_step": 356842, "epoch": 2124} {"train_loss": -10.249274253845215, "global_step": 356843, "epoch": 2124} {"train_loss": -11.412057876586914, "global_step": 356844, "epoch": 2124} {"train_loss": -11.227023124694824, "global_step": 356845, "epoch": 2124} {"train_loss": -10.920570373535156, "global_step": 356846, "epoch": 2124} {"train_loss": -11.35305118560791, "global_step": 356847, "epoch": 2124} {"train_loss": -10.967247009277344, "global_step": 356848, "epoch": 2124} {"train_loss": -11.436639785766602, "global_step": 356849, "epoch": 2124} {"train_loss": -10.668975830078125, "global_step": 356850, "epoch": 2124} {"train_loss": -11.295724868774414, "global_step": 356851, "epoch": 2124} {"train_loss": -11.089847564697266, "global_step": 356852, "epoch": 2124} {"train_loss": -11.391584396362305, "global_step": 356853, "epoch": 2124} {"train_loss": -11.532362937927246, "global_step": 356854, "epoch": 2124} {"train_loss": -11.395094871520996, "global_step": 356855, "epoch": 2124} {"train_loss": -11.772649765014648, "global_step": 356856, "epoch": 2124} {"train_loss": -11.559347152709961, "global_step": 356857, "epoch": 2124} {"train_loss": -11.368200302124023, "global_step": 356858, "epoch": 2124} {"train_loss": -11.88479995727539, "global_step": 356859, "epoch": 2124} {"train_loss": -11.68773078918457, "global_step": 356860, "epoch": 2124} {"train_loss": -11.891458511352539, "global_step": 356861, "epoch": 2124} {"train_loss": -11.850181579589844, "global_step": 356862, "epoch": 2124} {"train_loss": -11.21731185913086, "global_step": 356863, "epoch": 2124} {"train_loss": -11.605012893676758, "global_step": 356864, "epoch": 2124} {"train_loss": -11.80610466003418, "global_step": 356865, "epoch": 2124} {"train_loss": -12.092290878295898, "global_step": 356866, "epoch": 2124} {"train_loss": -11.95404052734375, "global_step": 356867, "epoch": 2124} {"train_loss": -11.554412841796875, "global_step": 356868, "epoch": 2124} {"train_loss": -11.902982711791992, "global_step": 356869, "epoch": 2124} {"train_loss": -12.209802627563477, "global_step": 356870, "epoch": 2124} {"train_loss": -11.818062782287598, "global_step": 356871, "epoch": 2124} {"train_loss": -12.154959678649902, "global_step": 356872, "epoch": 2124} {"train_loss": -11.715497016906738, "global_step": 356873, "epoch": 2124} {"train_loss": -12.042113304138184, "global_step": 356874, "epoch": 2124} {"train_loss": -12.274908065795898, "global_step": 356875, "epoch": 2124} {"train_loss": -11.774627685546875, "global_step": 356876, "epoch": 2124} {"train_loss": -12.413458824157715, "global_step": 356877, "epoch": 2124} {"train_loss": -12.270223617553711, "global_step": 356878, "epoch": 2124} {"train_loss": -12.194036483764648, "global_step": 356879, "epoch": 2124} {"train_loss": -12.416389465332031, "global_step": 356880, "epoch": 2124} {"train_loss": -12.227099418640137, "global_step": 356881, "epoch": 2124} {"train_loss": -12.374246597290039, "global_step": 356882, "epoch": 2124} {"train_loss": -12.245182991027832, "global_step": 356883, "epoch": 2124} {"train_loss": -12.571907043457031, "global_step": 356884, "epoch": 2124} {"train_loss": -12.310396194458008, "global_step": 356885, "epoch": 2124} {"train_loss": -12.417062759399414, "global_step": 356886, "epoch": 2124} {"train_loss": -12.464895248413086, "global_step": 356887, "epoch": 2124} {"train_loss": -12.354433059692383, "global_step": 356888, "epoch": 2124} {"train_loss": -12.4142484664917, "global_step": 356889, "epoch": 2124} {"train_loss": -12.546045303344727, "global_step": 356890, "epoch": 2124} {"train_loss": -12.31385612487793, "global_step": 356891, "epoch": 2124} {"train_loss": -12.172380447387695, "global_step": 356892, "epoch": 2124} {"train_loss": -12.358675003051758, "global_step": 356893, "epoch": 2124} {"train_loss": -12.215749740600586, "global_step": 356894, "epoch": 2124} {"train_loss": -12.152351379394531, "global_step": 356895, "epoch": 2124} {"train_loss": -12.229641914367676, "global_step": 356896, "epoch": 2124} {"train_loss": -12.226473808288574, "global_step": 356897, "epoch": 2124} {"train_loss": -12.253922462463379, "global_step": 356898, "epoch": 2124} {"train_loss": -12.342874526977539, "global_step": 356899, "epoch": 2124} {"train_loss": -12.109825134277344, "global_step": 356900, "epoch": 2124} {"train_loss": -12.290862083435059, "global_step": 356901, "epoch": 2124} {"train_loss": -12.311833381652832, "global_step": 356902, "epoch": 2124} {"train_loss": -12.48251724243164, "global_step": 356903, "epoch": 2124} {"train_loss": -12.349590301513672, "global_step": 356904, "epoch": 2124} {"train_loss": -12.472525596618652, "global_step": 356905, "epoch": 2124} {"train_loss": -12.407732963562012, "global_step": 356906, "epoch": 2124} {"train_loss": -11.977350234985352, "global_step": 356907, "epoch": 2124} {"train_loss": -12.31851863861084, "global_step": 356908, "epoch": 2124} {"train_loss": -12.653244018554688, "global_step": 356909, "epoch": 2124} {"train_loss": -12.013811111450195, "global_step": 356910, "epoch": 2124} {"train_loss": -12.40549087524414, "global_step": 356911, "epoch": 2124} {"train_loss": -12.154199600219727, "global_step": 356912, "epoch": 2124} {"train_loss": -12.3488130569458, "global_step": 356913, "epoch": 2124} {"train_loss": -12.315067291259766, "global_step": 356914, "epoch": 2124} {"train_loss": -12.365460395812988, "global_step": 356915, "epoch": 2124} {"train_loss": -12.164734840393066, "global_step": 356916, "epoch": 2124} {"train_loss": -12.04570198059082, "global_step": 356917, "epoch": 2124} {"train_loss": -12.242130279541016, "global_step": 356918, "epoch": 2124} {"train_loss": -12.298582077026367, "global_step": 356919, "epoch": 2124} {"train_loss": -12.089599609375, "global_step": 356920, "epoch": 2124} {"train_loss": -12.222759246826172, "global_step": 356921, "epoch": 2124} {"train_loss": -12.15307331085205, "global_step": 356922, "epoch": 2124} {"train_loss": -12.136678695678711, "global_step": 356923, "epoch": 2124} {"train_loss": -11.411026954650879, "global_step": 356924, "epoch": 2124} {"train_loss": -11.931480407714844, "global_step": 356925, "epoch": 2124} {"train_loss": -11.45640754699707, "global_step": 356926, "epoch": 2124} {"train_loss": -12.2728271484375, "global_step": 356927, "epoch": 2124} {"train_loss": -12.308391571044922, "global_step": 356928, "epoch": 2124} {"train_loss": -11.862857818603516, "global_step": 356929, "epoch": 2124} {"train_loss": -12.067850112915039, "global_step": 356930, "epoch": 2124} {"train_loss": -12.100459098815918, "global_step": 356931, "epoch": 2124} {"train_loss": -12.361831665039062, "global_step": 356932, "epoch": 2124} {"train_loss": -11.80093765258789, "global_step": 356933, "epoch": 2124} {"train_loss": -12.11100959777832, "global_step": 356934, "epoch": 2124} {"train_loss": -12.019025802612305, "global_step": 356935, "epoch": 2124} {"train_loss": -12.23425579071045, "global_step": 356936, "epoch": 2124} {"train_loss": -11.833925247192383, "global_step": 356937, "epoch": 2124} {"train_loss": -11.793623924255371, "global_step": 356938, "epoch": 2124} {"train_loss": -11.867786407470703, "global_step": 356939, "epoch": 2124} {"train_loss": -10.282867431640625, "global_step": 356940, "epoch": 2124} {"train_loss": -12.225339889526367, "global_step": 356941, "epoch": 2124} {"train_loss": -11.430524826049805, "global_step": 356942, "epoch": 2124} {"train_loss": -11.467451095581055, "global_step": 356943, "epoch": 2124} {"train_loss": -11.023199081420898, "global_step": 356944, "epoch": 2124} {"train_loss": -11.284963607788086, "global_step": 356945, "epoch": 2124} {"train_loss": -11.220247268676758, "global_step": 356946, "epoch": 2124} {"train_loss": -11.355636596679688, "global_step": 356947, "epoch": 2124} {"train_loss": -11.578840255737305, "global_step": 356948, "epoch": 2124} {"train_loss": -10.860322952270508, "global_step": 356949, "epoch": 2124} {"train_loss": -12.270966529846191, "global_step": 356950, "epoch": 2124} {"train_loss": -12.012088775634766, "global_step": 356951, "epoch": 2124} {"train_loss": -12.397500991821289, "global_step": 356952, "epoch": 2124} {"train_loss": -11.847230911254883, "global_step": 356953, "epoch": 2124} {"train_loss": -12.00754165649414, "global_step": 356954, "epoch": 2124} {"train_loss": -11.991565704345703, "global_step": 356955, "epoch": 2124} {"train_loss": -11.629931449890137, "global_step": 356956, "epoch": 2124} {"train_loss": -12.289348602294922, "global_step": 356957, "epoch": 2124} {"train_loss": -12.008800506591797, "global_step": 356958, "epoch": 2124} {"train_loss": -12.514686584472656, "global_step": 356959, "epoch": 2124} {"train_loss": -11.947898864746094, "global_step": 356960, "epoch": 2124} {"train_loss": -11.899864196777344, "global_step": 356961, "epoch": 2124} {"train_loss": -12.014538764953613, "global_step": 356962, "epoch": 2124} {"train_loss": -12.088879585266113, "global_step": 356963, "epoch": 2124} {"train_loss": -11.971593856811523, "global_step": 356964, "epoch": 2124} {"train_loss": -11.788354873657227, "global_step": 356965, "epoch": 2124} {"train_loss": -12.149959564208984, "global_step": 356966, "epoch": 2124} {"train_loss": -11.757867813110352, "global_step": 356967, "epoch": 2124} {"train_loss": -11.929814338684082, "global_step": 356968, "epoch": 2124} {"train_loss": -11.877431869506836, "global_step": 356969, "epoch": 2124} {"train_loss": -12.355562210083008, "global_step": 356970, "epoch": 2124} {"train_loss": -11.934597969055176, "global_step": 356971, "epoch": 2124} {"train_loss": -12.285213470458984, "global_step": 356972, "epoch": 2124} {"train_loss": -11.840818405151367, "global_step": 356973, "epoch": 2124} {"train_loss": -12.3389892578125, "global_step": 356974, "epoch": 2124} {"train_loss": -12.11861515045166, "global_step": 356975, "epoch": 2124} {"train_loss": -12.378917694091797, "global_step": 356976, "epoch": 2124} {"train_loss": -12.159435272216797, "global_step": 356977, "epoch": 2124} {"train_loss": -11.951142311096191, "global_step": 356978, "epoch": 2124} {"train_loss": -12.197500228881836, "global_step": 356979, "epoch": 2124} {"train_loss": -12.141424179077148, "global_step": 356980, "epoch": 2124} {"train_loss": -12.36975383758545, "global_step": 356981, "epoch": 2124} {"train_loss": -11.874788284301758, "global_step": 356982, "epoch": 2124} {"train_loss": -12.210740089416504, "global_step": 356983, "epoch": 2124} {"train_loss": -12.21364974975586, "global_step": 356984, "epoch": 2124} {"train_loss": -12.260405540466309, "global_step": 356985, "epoch": 2124} {"train_loss": -12.216753959655762, "global_step": 356986, "epoch": 2124} {"train_loss": -12.40971851348877, "global_step": 356987, "epoch": 2124} {"train_loss": -11.93548583984375, "global_step": 356988, "epoch": 2124} {"train_loss": -12.038551330566406, "global_step": 356989, "epoch": 2124} {"train_loss": -12.578925132751465, "global_step": 356990, "epoch": 2124} {"train_loss": -12.229040145874023, "global_step": 356991, "epoch": 2124} {"train_loss": -12.687767028808594, "global_step": 356992, "epoch": 2124} {"train_loss": -12.224271774291992, "global_step": 356993, "epoch": 2124} {"train_loss": -12.056312561035156, "global_step": 356994, "epoch": 2124} {"train_loss": -12.62844181060791, "global_step": 356995, "epoch": 2124} {"train_loss": -12.544498443603516, "global_step": 356996, "epoch": 2124} {"train_loss": -12.258369445800781, "global_step": 356997, "epoch": 2124} {"train_loss": -12.39450454711914, "global_step": 356998, "epoch": 2124} {"train_loss": -11.956371596881322, "global_step": 356999, "epoch": 2124, "val_loss": 294150.875} {"train_loss": -12.378021240234375, "global_step": 357000, "epoch": 2125} {"train_loss": -12.291194915771484, "global_step": 357001, "epoch": 2125} {"train_loss": -12.22490406036377, "global_step": 357002, "epoch": 2125} {"train_loss": -12.37575626373291, "global_step": 357003, "epoch": 2125} {"train_loss": -12.029888153076172, "global_step": 357004, "epoch": 2125} {"train_loss": -11.8883695602417, "global_step": 357005, "epoch": 2125} {"train_loss": -11.667268753051758, "global_step": 357006, "epoch": 2125} {"train_loss": -11.050545692443848, "global_step": 357007, "epoch": 2125} {"train_loss": -11.653013229370117, "global_step": 357008, "epoch": 2125} {"train_loss": -11.530275344848633, "global_step": 357009, "epoch": 2125} {"train_loss": -11.48425006866455, "global_step": 357010, "epoch": 2125} {"train_loss": -11.672993659973145, "global_step": 357011, "epoch": 2125} {"train_loss": -11.83923053741455, "global_step": 357012, "epoch": 2125} {"train_loss": -11.868062973022461, "global_step": 357013, "epoch": 2125} {"train_loss": -11.537260055541992, "global_step": 357014, "epoch": 2125} {"train_loss": -10.786622047424316, "global_step": 357015, "epoch": 2125} {"train_loss": -12.101629257202148, "global_step": 357016, "epoch": 2125} {"train_loss": -11.974864959716797, "global_step": 357017, "epoch": 2125} {"train_loss": -11.060054779052734, "global_step": 357018, "epoch": 2125} {"train_loss": -11.391007423400879, "global_step": 357019, "epoch": 2125} {"train_loss": -11.889524459838867, "global_step": 357020, "epoch": 2125} {"train_loss": -11.920509338378906, "global_step": 357021, "epoch": 2125} {"train_loss": -11.816573143005371, "global_step": 357022, "epoch": 2125} {"train_loss": -12.147187232971191, "global_step": 357023, "epoch": 2125} {"train_loss": -12.031119346618652, "global_step": 357024, "epoch": 2125} {"train_loss": -11.782896041870117, "global_step": 357025, "epoch": 2125} {"train_loss": -12.478740692138672, "global_step": 357026, "epoch": 2125} {"train_loss": -11.490592956542969, "global_step": 357027, "epoch": 2125} {"train_loss": -11.396846771240234, "global_step": 357028, "epoch": 2125} {"train_loss": -11.534523010253906, "global_step": 357029, "epoch": 2125} {"train_loss": -12.181987762451172, "global_step": 357030, "epoch": 2125} {"train_loss": -10.59671401977539, "global_step": 357031, "epoch": 2125} {"train_loss": -12.056051254272461, "global_step": 357032, "epoch": 2125} {"train_loss": -12.28792953491211, "global_step": 357033, "epoch": 2125} {"train_loss": -11.666177749633789, "global_step": 357034, "epoch": 2125} {"train_loss": -12.280890464782715, "global_step": 357035, "epoch": 2125} {"train_loss": -11.589576721191406, "global_step": 357036, "epoch": 2125} {"train_loss": -11.671308517456055, "global_step": 357037, "epoch": 2125} {"train_loss": -11.865992546081543, "global_step": 357038, "epoch": 2125} {"train_loss": -11.176128387451172, "global_step": 357039, "epoch": 2125} {"train_loss": -10.907431602478027, "global_step": 357040, "epoch": 2125} {"train_loss": -9.870302200317383, "global_step": 357041, "epoch": 2125} {"train_loss": -11.670180320739746, "global_step": 357042, "epoch": 2125} {"train_loss": -10.845577239990234, "global_step": 357043, "epoch": 2125} {"train_loss": -11.441000938415527, "global_step": 357044, "epoch": 2125} {"train_loss": -10.928308486938477, "global_step": 357045, "epoch": 2125} {"train_loss": -10.588203430175781, "global_step": 357046, "epoch": 2125} {"train_loss": -11.799232482910156, "global_step": 357047, "epoch": 2125} {"train_loss": -10.46229076385498, "global_step": 357048, "epoch": 2125} {"train_loss": -11.931936264038086, "global_step": 357049, "epoch": 2125} {"train_loss": -11.114838600158691, "global_step": 357050, "epoch": 2125} {"train_loss": -11.347981452941895, "global_step": 357051, "epoch": 2125} {"train_loss": -11.947607040405273, "global_step": 357052, "epoch": 2125} {"train_loss": -10.916375160217285, "global_step": 357053, "epoch": 2125} {"train_loss": -11.941570281982422, "global_step": 357054, "epoch": 2125} {"train_loss": -11.114092826843262, "global_step": 357055, "epoch": 2125} {"train_loss": -11.079889297485352, "global_step": 357056, "epoch": 2125} {"train_loss": -10.991103172302246, "global_step": 357057, "epoch": 2125} {"train_loss": -10.404394149780273, "global_step": 357058, "epoch": 2125} {"train_loss": -11.344564437866211, "global_step": 357059, "epoch": 2125} {"train_loss": -9.905171394348145, "global_step": 357060, "epoch": 2125} {"train_loss": -12.13937759399414, "global_step": 357061, "epoch": 2125} {"train_loss": -10.425252914428711, "global_step": 357062, "epoch": 2125} {"train_loss": -11.117533683776855, "global_step": 357063, "epoch": 2125} {"train_loss": -11.874822616577148, "global_step": 357064, "epoch": 2125} {"train_loss": -10.282876968383789, "global_step": 357065, "epoch": 2125} {"train_loss": -11.176441192626953, "global_step": 357066, "epoch": 2125} {"train_loss": -11.656312942504883, "global_step": 357067, "epoch": 2125} {"train_loss": -10.15542984008789, "global_step": 357068, "epoch": 2125} {"train_loss": -11.3725004196167, "global_step": 357069, "epoch": 2125} {"train_loss": -10.846275329589844, "global_step": 357070, "epoch": 2125} {"train_loss": -10.191328048706055, "global_step": 357071, "epoch": 2125} {"train_loss": -11.131356239318848, "global_step": 357072, "epoch": 2125} {"train_loss": -10.841575622558594, "global_step": 357073, "epoch": 2125} {"train_loss": -11.065489768981934, "global_step": 357074, "epoch": 2125} {"train_loss": -12.162983894348145, "global_step": 357075, "epoch": 2125} {"train_loss": -11.255558013916016, "global_step": 357076, "epoch": 2125} {"train_loss": -11.315179824829102, "global_step": 357077, "epoch": 2125} {"train_loss": -11.53718376159668, "global_step": 357078, "epoch": 2125} {"train_loss": -11.534196853637695, "global_step": 357079, "epoch": 2125} {"train_loss": -11.999285697937012, "global_step": 357080, "epoch": 2125} {"train_loss": -11.63229751586914, "global_step": 357081, "epoch": 2125} {"train_loss": -11.701910018920898, "global_step": 357082, "epoch": 2125} {"train_loss": -11.83227825164795, "global_step": 357083, "epoch": 2125} {"train_loss": -11.995404243469238, "global_step": 357084, "epoch": 2125} {"train_loss": -11.60531234741211, "global_step": 357085, "epoch": 2125} {"train_loss": -11.946300506591797, "global_step": 357086, "epoch": 2125} {"train_loss": -11.945634841918945, "global_step": 357087, "epoch": 2125} {"train_loss": -12.022838592529297, "global_step": 357088, "epoch": 2125} {"train_loss": -11.955873489379883, "global_step": 357089, "epoch": 2125} {"train_loss": -11.838933944702148, "global_step": 357090, "epoch": 2125} {"train_loss": -12.010619163513184, "global_step": 357091, "epoch": 2125} {"train_loss": -12.119296073913574, "global_step": 357092, "epoch": 2125} {"train_loss": -12.011701583862305, "global_step": 357093, "epoch": 2125} {"train_loss": -11.868882179260254, "global_step": 357094, "epoch": 2125} {"train_loss": -12.014724731445312, "global_step": 357095, "epoch": 2125} {"train_loss": -11.904905319213867, "global_step": 357096, "epoch": 2125} {"train_loss": -12.178823471069336, "global_step": 357097, "epoch": 2125} {"train_loss": -12.057441711425781, "global_step": 357098, "epoch": 2125} {"train_loss": -11.903127670288086, "global_step": 357099, "epoch": 2125} {"train_loss": -12.289230346679688, "global_step": 357100, "epoch": 2125} {"train_loss": -11.944095611572266, "global_step": 357101, "epoch": 2125} {"train_loss": -12.26978874206543, "global_step": 357102, "epoch": 2125} {"train_loss": -12.425716400146484, "global_step": 357103, "epoch": 2125} {"train_loss": -12.049539566040039, "global_step": 357104, "epoch": 2125} {"train_loss": -12.348699569702148, "global_step": 357105, "epoch": 2125} {"train_loss": -12.312557220458984, "global_step": 357106, "epoch": 2125} {"train_loss": -12.04308795928955, "global_step": 357107, "epoch": 2125} {"train_loss": -12.323530197143555, "global_step": 357108, "epoch": 2125} {"train_loss": -12.345107078552246, "global_step": 357109, "epoch": 2125} {"train_loss": -12.544839859008789, "global_step": 357110, "epoch": 2125} {"train_loss": -12.271570205688477, "global_step": 357111, "epoch": 2125} {"train_loss": -12.284492492675781, "global_step": 357112, "epoch": 2125} {"train_loss": -11.934832572937012, "global_step": 357113, "epoch": 2125} {"train_loss": -12.282230377197266, "global_step": 357114, "epoch": 2125} {"train_loss": -12.358642578125, "global_step": 357115, "epoch": 2125} {"train_loss": -12.208069801330566, "global_step": 357116, "epoch": 2125} {"train_loss": -12.332752227783203, "global_step": 357117, "epoch": 2125} {"train_loss": -12.137279510498047, "global_step": 357118, "epoch": 2125} {"train_loss": -12.41494083404541, "global_step": 357119, "epoch": 2125} {"train_loss": -12.314807891845703, "global_step": 357120, "epoch": 2125} {"train_loss": -12.402874946594238, "global_step": 357121, "epoch": 2125} {"train_loss": -12.304901123046875, "global_step": 357122, "epoch": 2125} {"train_loss": -12.311275482177734, "global_step": 357123, "epoch": 2125} {"train_loss": -12.087007522583008, "global_step": 357124, "epoch": 2125} {"train_loss": -12.709078788757324, "global_step": 357125, "epoch": 2125} {"train_loss": -12.262557983398438, "global_step": 357126, "epoch": 2125} {"train_loss": -12.254423141479492, "global_step": 357127, "epoch": 2125} {"train_loss": -12.470037460327148, "global_step": 357128, "epoch": 2125} {"train_loss": -12.184971809387207, "global_step": 357129, "epoch": 2125} {"train_loss": -12.698953628540039, "global_step": 357130, "epoch": 2125} {"train_loss": -12.475702285766602, "global_step": 357131, "epoch": 2125} {"train_loss": -12.483956336975098, "global_step": 357132, "epoch": 2125} {"train_loss": -12.74223518371582, "global_step": 357133, "epoch": 2125} {"train_loss": -12.582024574279785, "global_step": 357134, "epoch": 2125} {"train_loss": -12.425397872924805, "global_step": 357135, "epoch": 2125} {"train_loss": -12.56552791595459, "global_step": 357136, "epoch": 2125} {"train_loss": -12.196041107177734, "global_step": 357137, "epoch": 2125} {"train_loss": -12.241168975830078, "global_step": 357138, "epoch": 2125} {"train_loss": -12.554028511047363, "global_step": 357139, "epoch": 2125} {"train_loss": -12.034953117370605, "global_step": 357140, "epoch": 2125} {"train_loss": -12.292128562927246, "global_step": 357141, "epoch": 2125} {"train_loss": -12.239618301391602, "global_step": 357142, "epoch": 2125} {"train_loss": -12.381061553955078, "global_step": 357143, "epoch": 2125} {"train_loss": -12.355363845825195, "global_step": 357144, "epoch": 2125} {"train_loss": -12.13626480102539, "global_step": 357145, "epoch": 2125} {"train_loss": -12.522370338439941, "global_step": 357146, "epoch": 2125} {"train_loss": -12.412288665771484, "global_step": 357147, "epoch": 2125} {"train_loss": -12.087041854858398, "global_step": 357148, "epoch": 2125} {"train_loss": -12.29896354675293, "global_step": 357149, "epoch": 2125} {"train_loss": -11.794177055358887, "global_step": 357150, "epoch": 2125} {"train_loss": -12.205924987792969, "global_step": 357151, "epoch": 2125} {"train_loss": -12.076828002929688, "global_step": 357152, "epoch": 2125} {"train_loss": -12.28919506072998, "global_step": 357153, "epoch": 2125} {"train_loss": -12.281022071838379, "global_step": 357154, "epoch": 2125} {"train_loss": -12.029214859008789, "global_step": 357155, "epoch": 2125} {"train_loss": -12.12027645111084, "global_step": 357156, "epoch": 2125} {"train_loss": -12.46240234375, "global_step": 357157, "epoch": 2125} {"train_loss": -11.582386016845703, "global_step": 357158, "epoch": 2125} {"train_loss": -11.628645896911621, "global_step": 357159, "epoch": 2125} {"train_loss": -12.464807510375977, "global_step": 357160, "epoch": 2125} {"train_loss": -12.389843940734863, "global_step": 357161, "epoch": 2125} {"train_loss": -12.123106002807617, "global_step": 357162, "epoch": 2125} {"train_loss": -12.064546585083008, "global_step": 357163, "epoch": 2125} {"train_loss": -12.048478126525879, "global_step": 357164, "epoch": 2125} {"train_loss": -12.385671615600586, "global_step": 357165, "epoch": 2125} {"train_loss": -12.238863945007324, "global_step": 357166, "epoch": 2125} {"train_loss": -11.83712276958284, "global_step": 357167, "epoch": 2125, "val_loss": 288301.84375, "train_action_mse_error": 1.1011358499526978} {"train_loss": -11.915812492370605, "global_step": 357168, "epoch": 2126} {"train_loss": -12.191825866699219, "global_step": 357169, "epoch": 2126} {"train_loss": -12.152225494384766, "global_step": 357170, "epoch": 2126} {"train_loss": -12.391489028930664, "global_step": 357171, "epoch": 2126} {"train_loss": -12.156407356262207, "global_step": 357172, "epoch": 2126} {"train_loss": -11.774301528930664, "global_step": 357173, "epoch": 2126} {"train_loss": -12.293042182922363, "global_step": 357174, "epoch": 2126} {"train_loss": -11.94424819946289, "global_step": 357175, "epoch": 2126} {"train_loss": -11.278936386108398, "global_step": 357176, "epoch": 2126} {"train_loss": -11.628961563110352, "global_step": 357177, "epoch": 2126} {"train_loss": -11.8972806930542, "global_step": 357178, "epoch": 2126} {"train_loss": -12.257256507873535, "global_step": 357179, "epoch": 2126} {"train_loss": -11.862333297729492, "global_step": 357180, "epoch": 2126} {"train_loss": -12.22578239440918, "global_step": 357181, "epoch": 2126} {"train_loss": -11.845500946044922, "global_step": 357182, "epoch": 2126} {"train_loss": -11.254809379577637, "global_step": 357183, "epoch": 2126} {"train_loss": -12.354339599609375, "global_step": 357184, "epoch": 2126} {"train_loss": -11.218088150024414, "global_step": 357185, "epoch": 2126} {"train_loss": -11.539915084838867, "global_step": 357186, "epoch": 2126} {"train_loss": -11.797616958618164, "global_step": 357187, "epoch": 2126} {"train_loss": -11.778512954711914, "global_step": 357188, "epoch": 2126} {"train_loss": -11.54672622680664, "global_step": 357189, "epoch": 2126} {"train_loss": -11.666851043701172, "global_step": 357190, "epoch": 2126} {"train_loss": -11.50362777709961, "global_step": 357191, "epoch": 2126} {"train_loss": -11.536260604858398, "global_step": 357192, "epoch": 2126} {"train_loss": -10.826478958129883, "global_step": 357193, "epoch": 2126} {"train_loss": -11.693729400634766, "global_step": 357194, "epoch": 2126} {"train_loss": -10.944693565368652, "global_step": 357195, "epoch": 2126} {"train_loss": -11.325335502624512, "global_step": 357196, "epoch": 2126} {"train_loss": -11.742378234863281, "global_step": 357197, "epoch": 2126} {"train_loss": -9.73263931274414, "global_step": 357198, "epoch": 2126} {"train_loss": -12.427884101867676, "global_step": 357199, "epoch": 2126} {"train_loss": -9.853226661682129, "global_step": 357200, "epoch": 2126} {"train_loss": -11.592694282531738, "global_step": 357201, "epoch": 2126} {"train_loss": -10.762187957763672, "global_step": 357202, "epoch": 2126} {"train_loss": -11.525839805603027, "global_step": 357203, "epoch": 2126} {"train_loss": -11.224660873413086, "global_step": 357204, "epoch": 2126} {"train_loss": -10.84383773803711, "global_step": 357205, "epoch": 2126} {"train_loss": -11.90066146850586, "global_step": 357206, "epoch": 2126} {"train_loss": -10.48938274383545, "global_step": 357207, "epoch": 2126} {"train_loss": -11.73604965209961, "global_step": 357208, "epoch": 2126} {"train_loss": -10.439462661743164, "global_step": 357209, "epoch": 2126} {"train_loss": -12.146209716796875, "global_step": 357210, "epoch": 2126} {"train_loss": -11.271512985229492, "global_step": 357211, "epoch": 2126} {"train_loss": -11.070515632629395, "global_step": 357212, "epoch": 2126} {"train_loss": -11.854936599731445, "global_step": 357213, "epoch": 2126} {"train_loss": -11.09337043762207, "global_step": 357214, "epoch": 2126} {"train_loss": -11.911508560180664, "global_step": 357215, "epoch": 2126} {"train_loss": -11.162769317626953, "global_step": 357216, "epoch": 2126} {"train_loss": -11.62778377532959, "global_step": 357217, "epoch": 2126} {"train_loss": -11.549383163452148, "global_step": 357218, "epoch": 2126} {"train_loss": -11.585951805114746, "global_step": 357219, "epoch": 2126} {"train_loss": -12.027962684631348, "global_step": 357220, "epoch": 2126} {"train_loss": -11.678446769714355, "global_step": 357221, "epoch": 2126} {"train_loss": -12.037030220031738, "global_step": 357222, "epoch": 2126} {"train_loss": -11.64816665649414, "global_step": 357223, "epoch": 2126} {"train_loss": -11.967679977416992, "global_step": 357224, "epoch": 2126} {"train_loss": -11.486668586730957, "global_step": 357225, "epoch": 2126} {"train_loss": -11.860054016113281, "global_step": 357226, "epoch": 2126} {"train_loss": -11.847448348999023, "global_step": 357227, "epoch": 2126} {"train_loss": -12.192066192626953, "global_step": 357228, "epoch": 2126} {"train_loss": -11.86227798461914, "global_step": 357229, "epoch": 2126} {"train_loss": -11.866762161254883, "global_step": 357230, "epoch": 2126} {"train_loss": -11.879791259765625, "global_step": 357231, "epoch": 2126} {"train_loss": -11.920711517333984, "global_step": 357232, "epoch": 2126} {"train_loss": -12.234874725341797, "global_step": 357233, "epoch": 2126} {"train_loss": -11.504215240478516, "global_step": 357234, "epoch": 2126} {"train_loss": -12.167543411254883, "global_step": 357235, "epoch": 2126} {"train_loss": -11.798811912536621, "global_step": 357236, "epoch": 2126} {"train_loss": -11.939305305480957, "global_step": 357237, "epoch": 2126} {"train_loss": -11.947643280029297, "global_step": 357238, "epoch": 2126} {"train_loss": -11.816929817199707, "global_step": 357239, "epoch": 2126} {"train_loss": -11.622408866882324, "global_step": 357240, "epoch": 2126} {"train_loss": -11.776477813720703, "global_step": 357241, "epoch": 2126} {"train_loss": -11.669210433959961, "global_step": 357242, "epoch": 2126} {"train_loss": -11.452363967895508, "global_step": 357243, "epoch": 2126} {"train_loss": -11.319568634033203, "global_step": 357244, "epoch": 2126} {"train_loss": -11.952112197875977, "global_step": 357245, "epoch": 2126} {"train_loss": -11.967218399047852, "global_step": 357246, "epoch": 2126} {"train_loss": -11.843475341796875, "global_step": 357247, "epoch": 2126} {"train_loss": -12.11178207397461, "global_step": 357248, "epoch": 2126} {"train_loss": -11.306257247924805, "global_step": 357249, "epoch": 2126} {"train_loss": -12.128623962402344, "global_step": 357250, "epoch": 2126} {"train_loss": -11.807022094726562, "global_step": 357251, "epoch": 2126} {"train_loss": -12.140957832336426, "global_step": 357252, "epoch": 2126} {"train_loss": -12.128679275512695, "global_step": 357253, "epoch": 2126} {"train_loss": -11.746097564697266, "global_step": 357254, "epoch": 2126} {"train_loss": -12.26396369934082, "global_step": 357255, "epoch": 2126} {"train_loss": -11.993059158325195, "global_step": 357256, "epoch": 2126} {"train_loss": -12.196475982666016, "global_step": 357257, "epoch": 2126} {"train_loss": -12.04506778717041, "global_step": 357258, "epoch": 2126} {"train_loss": -12.021387100219727, "global_step": 357259, "epoch": 2126} {"train_loss": -12.307439804077148, "global_step": 357260, "epoch": 2126} {"train_loss": -12.016878128051758, "global_step": 357261, "epoch": 2126} {"train_loss": -12.136889457702637, "global_step": 357262, "epoch": 2126} {"train_loss": -12.06374740600586, "global_step": 357263, "epoch": 2126} {"train_loss": -12.15162467956543, "global_step": 357264, "epoch": 2126} {"train_loss": -12.175373077392578, "global_step": 357265, "epoch": 2126} {"train_loss": -12.034646987915039, "global_step": 357266, "epoch": 2126} {"train_loss": -12.442415237426758, "global_step": 357267, "epoch": 2126} {"train_loss": -12.137535095214844, "global_step": 357268, "epoch": 2126} {"train_loss": -12.497930526733398, "global_step": 357269, "epoch": 2126} {"train_loss": -12.291193962097168, "global_step": 357270, "epoch": 2126} {"train_loss": -12.43931770324707, "global_step": 357271, "epoch": 2126} {"train_loss": -12.422393798828125, "global_step": 357272, "epoch": 2126} {"train_loss": -12.387950897216797, "global_step": 357273, "epoch": 2126} {"train_loss": -12.460604667663574, "global_step": 357274, "epoch": 2126} {"train_loss": -12.254653930664062, "global_step": 357275, "epoch": 2126} {"train_loss": -12.451465606689453, "global_step": 357276, "epoch": 2126} {"train_loss": -12.275749206542969, "global_step": 357277, "epoch": 2126} {"train_loss": -12.492683410644531, "global_step": 357278, "epoch": 2126} {"train_loss": -12.267946243286133, "global_step": 357279, "epoch": 2126} {"train_loss": -11.520057678222656, "global_step": 357280, "epoch": 2126} {"train_loss": -12.122932434082031, "global_step": 357281, "epoch": 2126} {"train_loss": -11.368122100830078, "global_step": 357282, "epoch": 2126} {"train_loss": -12.258186340332031, "global_step": 357283, "epoch": 2126} {"train_loss": -11.85986614227295, "global_step": 357284, "epoch": 2126} {"train_loss": -11.505099296569824, "global_step": 357285, "epoch": 2126} {"train_loss": -12.075654029846191, "global_step": 357286, "epoch": 2126} {"train_loss": -11.494882583618164, "global_step": 357287, "epoch": 2126} {"train_loss": -12.304048538208008, "global_step": 357288, "epoch": 2126} {"train_loss": -11.7830171585083, "global_step": 357289, "epoch": 2126} {"train_loss": -11.299811363220215, "global_step": 357290, "epoch": 2126} {"train_loss": -11.769948959350586, "global_step": 357291, "epoch": 2126} {"train_loss": -10.7256441116333, "global_step": 357292, "epoch": 2126} {"train_loss": -12.478300094604492, "global_step": 357293, "epoch": 2126} {"train_loss": -11.153404235839844, "global_step": 357294, "epoch": 2126} {"train_loss": -11.892419815063477, "global_step": 357295, "epoch": 2126} {"train_loss": -12.058417320251465, "global_step": 357296, "epoch": 2126} {"train_loss": -11.521110534667969, "global_step": 357297, "epoch": 2126} {"train_loss": -12.284257888793945, "global_step": 357298, "epoch": 2126} {"train_loss": -11.661662101745605, "global_step": 357299, "epoch": 2126} {"train_loss": -12.368536949157715, "global_step": 357300, "epoch": 2126} {"train_loss": -11.909951210021973, "global_step": 357301, "epoch": 2126} {"train_loss": -11.968128204345703, "global_step": 357302, "epoch": 2126} {"train_loss": -12.172024726867676, "global_step": 357303, "epoch": 2126} {"train_loss": -12.255643844604492, "global_step": 357304, "epoch": 2126} {"train_loss": -12.445075988769531, "global_step": 357305, "epoch": 2126} {"train_loss": -12.270271301269531, "global_step": 357306, "epoch": 2126} {"train_loss": -12.416318893432617, "global_step": 357307, "epoch": 2126} {"train_loss": -12.081506729125977, "global_step": 357308, "epoch": 2126} {"train_loss": -12.241060256958008, "global_step": 357309, "epoch": 2126} {"train_loss": -12.221877098083496, "global_step": 357310, "epoch": 2126} {"train_loss": -12.300970077514648, "global_step": 357311, "epoch": 2126} {"train_loss": -12.199087142944336, "global_step": 357312, "epoch": 2126} {"train_loss": -12.33798599243164, "global_step": 357313, "epoch": 2126} {"train_loss": -12.297225952148438, "global_step": 357314, "epoch": 2126} {"train_loss": -12.473892211914062, "global_step": 357315, "epoch": 2126} {"train_loss": -12.553085327148438, "global_step": 357316, "epoch": 2126} {"train_loss": -12.343172073364258, "global_step": 357317, "epoch": 2126} {"train_loss": -12.42949104309082, "global_step": 357318, "epoch": 2126} {"train_loss": -12.4262113571167, "global_step": 357319, "epoch": 2126} {"train_loss": -12.493764877319336, "global_step": 357320, "epoch": 2126} {"train_loss": -12.522357940673828, "global_step": 357321, "epoch": 2126} {"train_loss": -12.472490310668945, "global_step": 357322, "epoch": 2126} {"train_loss": -12.45266342163086, "global_step": 357323, "epoch": 2126} {"train_loss": -12.47408676147461, "global_step": 357324, "epoch": 2126} {"train_loss": -12.421995162963867, "global_step": 357325, "epoch": 2126} {"train_loss": -12.593100547790527, "global_step": 357326, "epoch": 2126} {"train_loss": -12.271818161010742, "global_step": 357327, "epoch": 2126} {"train_loss": -12.461953163146973, "global_step": 357328, "epoch": 2126} {"train_loss": -12.634830474853516, "global_step": 357329, "epoch": 2126} {"train_loss": -12.402068138122559, "global_step": 357330, "epoch": 2126} {"train_loss": -12.360982894897461, "global_step": 357331, "epoch": 2126} {"train_loss": -12.670734405517578, "global_step": 357332, "epoch": 2126} {"train_loss": -12.529031753540039, "global_step": 357333, "epoch": 2126} {"train_loss": -12.59773063659668, "global_step": 357334, "epoch": 2126} {"train_loss": -11.915655170168195, "global_step": 357335, "epoch": 2126, "val_loss": 290582.25} {"train_loss": -12.511991500854492, "global_step": 357336, "epoch": 2127} {"train_loss": -12.593317031860352, "global_step": 357337, "epoch": 2127} {"train_loss": -12.474006652832031, "global_step": 357338, "epoch": 2127} {"train_loss": -12.419775009155273, "global_step": 357339, "epoch": 2127} {"train_loss": -12.486963272094727, "global_step": 357340, "epoch": 2127} {"train_loss": -12.459219932556152, "global_step": 357341, "epoch": 2127} {"train_loss": -12.192750930786133, "global_step": 357342, "epoch": 2127} {"train_loss": -12.19214916229248, "global_step": 357343, "epoch": 2127} {"train_loss": -12.347700119018555, "global_step": 357344, "epoch": 2127} {"train_loss": -12.539983749389648, "global_step": 357345, "epoch": 2127} {"train_loss": -12.481008529663086, "global_step": 357346, "epoch": 2127} {"train_loss": -12.674901008605957, "global_step": 357347, "epoch": 2127} {"train_loss": -12.514448165893555, "global_step": 357348, "epoch": 2127} {"train_loss": -12.553679466247559, "global_step": 357349, "epoch": 2127} {"train_loss": -12.495857238769531, "global_step": 357350, "epoch": 2127} {"train_loss": -12.427960395812988, "global_step": 357351, "epoch": 2127} {"train_loss": -12.321788787841797, "global_step": 357352, "epoch": 2127} {"train_loss": -12.537416458129883, "global_step": 357353, "epoch": 2127} {"train_loss": -12.276326179504395, "global_step": 357354, "epoch": 2127} {"train_loss": -12.355833053588867, "global_step": 357355, "epoch": 2127} {"train_loss": -11.475093841552734, "global_step": 357356, "epoch": 2127} {"train_loss": -12.000496864318848, "global_step": 357357, "epoch": 2127} {"train_loss": -11.776269912719727, "global_step": 357358, "epoch": 2127} {"train_loss": -12.570503234863281, "global_step": 357359, "epoch": 2127} {"train_loss": -11.792806625366211, "global_step": 357360, "epoch": 2127} {"train_loss": -12.211488723754883, "global_step": 357361, "epoch": 2127} {"train_loss": -11.852256774902344, "global_step": 357362, "epoch": 2127} {"train_loss": -11.907890319824219, "global_step": 357363, "epoch": 2127} {"train_loss": -11.202103614807129, "global_step": 357364, "epoch": 2127} {"train_loss": -11.409172058105469, "global_step": 357365, "epoch": 2127} {"train_loss": -10.362808227539062, "global_step": 357366, "epoch": 2127} {"train_loss": -11.988422393798828, "global_step": 357367, "epoch": 2127} {"train_loss": -9.40185546875, "global_step": 357368, "epoch": 2127} {"train_loss": -9.63222599029541, "global_step": 357369, "epoch": 2127} {"train_loss": -10.720128059387207, "global_step": 357370, "epoch": 2127} {"train_loss": -9.308772087097168, "global_step": 357371, "epoch": 2127} {"train_loss": -9.218162536621094, "global_step": 357372, "epoch": 2127} {"train_loss": -9.71376895904541, "global_step": 357373, "epoch": 2127} {"train_loss": -9.93862533569336, "global_step": 357374, "epoch": 2127} {"train_loss": -7.333766460418701, "global_step": 357375, "epoch": 2127} {"train_loss": -8.02752685546875, "global_step": 357376, "epoch": 2127} {"train_loss": -8.078302383422852, "global_step": 357377, "epoch": 2127} {"train_loss": -9.522385597229004, "global_step": 357378, "epoch": 2127} {"train_loss": -9.018884658813477, "global_step": 357379, "epoch": 2127} {"train_loss": -9.033319473266602, "global_step": 357380, "epoch": 2127} {"train_loss": -9.29269790649414, "global_step": 357381, "epoch": 2127} {"train_loss": -7.344122886657715, "global_step": 357382, "epoch": 2127} {"train_loss": -7.562429428100586, "global_step": 357383, "epoch": 2127} {"train_loss": -7.849692344665527, "global_step": 357384, "epoch": 2127} {"train_loss": -8.479122161865234, "global_step": 357385, "epoch": 2127} {"train_loss": -9.846357345581055, "global_step": 357386, "epoch": 2127} {"train_loss": -8.770306587219238, "global_step": 357387, "epoch": 2127} {"train_loss": -10.157974243164062, "global_step": 357388, "epoch": 2127} {"train_loss": -9.803415298461914, "global_step": 357389, "epoch": 2127} {"train_loss": -10.848219871520996, "global_step": 357390, "epoch": 2127} {"train_loss": -10.124112129211426, "global_step": 357391, "epoch": 2127} {"train_loss": -11.23607349395752, "global_step": 357392, "epoch": 2127} {"train_loss": -10.434249877929688, "global_step": 357393, "epoch": 2127} {"train_loss": -10.389664649963379, "global_step": 357394, "epoch": 2127} {"train_loss": -10.455698013305664, "global_step": 357395, "epoch": 2127} {"train_loss": -10.164416313171387, "global_step": 357396, "epoch": 2127} {"train_loss": -11.253580093383789, "global_step": 357397, "epoch": 2127} {"train_loss": -10.642767906188965, "global_step": 357398, "epoch": 2127} {"train_loss": -11.28933334350586, "global_step": 357399, "epoch": 2127} {"train_loss": -10.78750228881836, "global_step": 357400, "epoch": 2127} {"train_loss": -11.149109840393066, "global_step": 357401, "epoch": 2127} {"train_loss": -11.078535079956055, "global_step": 357402, "epoch": 2127} {"train_loss": -11.275758743286133, "global_step": 357403, "epoch": 2127} {"train_loss": -11.167447090148926, "global_step": 357404, "epoch": 2127} {"train_loss": -11.658153533935547, "global_step": 357405, "epoch": 2127} {"train_loss": -11.011698722839355, "global_step": 357406, "epoch": 2127} {"train_loss": -11.838874816894531, "global_step": 357407, "epoch": 2127} {"train_loss": -11.191214561462402, "global_step": 357408, "epoch": 2127} {"train_loss": -11.564154624938965, "global_step": 357409, "epoch": 2127} {"train_loss": -11.613677978515625, "global_step": 357410, "epoch": 2127} {"train_loss": -11.701071739196777, "global_step": 357411, "epoch": 2127} {"train_loss": -11.597967147827148, "global_step": 357412, "epoch": 2127} {"train_loss": -12.049747467041016, "global_step": 357413, "epoch": 2127} {"train_loss": -11.786484718322754, "global_step": 357414, "epoch": 2127} {"train_loss": -11.687952041625977, "global_step": 357415, "epoch": 2127} {"train_loss": -12.189981460571289, "global_step": 357416, "epoch": 2127} {"train_loss": -11.760408401489258, "global_step": 357417, "epoch": 2127} {"train_loss": -11.705475807189941, "global_step": 357418, "epoch": 2127} {"train_loss": -12.076146125793457, "global_step": 357419, "epoch": 2127} {"train_loss": -12.044136047363281, "global_step": 357420, "epoch": 2127} {"train_loss": -11.947404861450195, "global_step": 357421, "epoch": 2127} {"train_loss": -12.020923614501953, "global_step": 357422, "epoch": 2127} {"train_loss": -12.01298999786377, "global_step": 357423, "epoch": 2127} {"train_loss": -12.18819808959961, "global_step": 357424, "epoch": 2127} {"train_loss": -12.022518157958984, "global_step": 357425, "epoch": 2127} {"train_loss": -11.859922409057617, "global_step": 357426, "epoch": 2127} {"train_loss": -12.24453353881836, "global_step": 357427, "epoch": 2127} {"train_loss": -12.177223205566406, "global_step": 357428, "epoch": 2127} {"train_loss": -12.088249206542969, "global_step": 357429, "epoch": 2127} {"train_loss": -12.219858169555664, "global_step": 357430, "epoch": 2127} {"train_loss": -12.061555862426758, "global_step": 357431, "epoch": 2127} {"train_loss": -12.12997055053711, "global_step": 357432, "epoch": 2127} {"train_loss": -12.33027172088623, "global_step": 357433, "epoch": 2127} {"train_loss": -12.170568466186523, "global_step": 357434, "epoch": 2127} {"train_loss": -12.132080078125, "global_step": 357435, "epoch": 2127} {"train_loss": -12.329532623291016, "global_step": 357436, "epoch": 2127} {"train_loss": -12.265949249267578, "global_step": 357437, "epoch": 2127} {"train_loss": -12.493193626403809, "global_step": 357438, "epoch": 2127} {"train_loss": -12.027826309204102, "global_step": 357439, "epoch": 2127} {"train_loss": -12.311705589294434, "global_step": 357440, "epoch": 2127} {"train_loss": -12.187959671020508, "global_step": 357441, "epoch": 2127} {"train_loss": -12.136370658874512, "global_step": 357442, "epoch": 2127} {"train_loss": -12.272568702697754, "global_step": 357443, "epoch": 2127} {"train_loss": -12.276165962219238, "global_step": 357444, "epoch": 2127} {"train_loss": -12.044933319091797, "global_step": 357445, "epoch": 2127} {"train_loss": -12.371301651000977, "global_step": 357446, "epoch": 2127} {"train_loss": -12.398165702819824, "global_step": 357447, "epoch": 2127} {"train_loss": -12.479177474975586, "global_step": 357448, "epoch": 2127} {"train_loss": -12.298687934875488, "global_step": 357449, "epoch": 2127} {"train_loss": -12.350226402282715, "global_step": 357450, "epoch": 2127} {"train_loss": -12.212740898132324, "global_step": 357451, "epoch": 2127} {"train_loss": -12.510953903198242, "global_step": 357452, "epoch": 2127} {"train_loss": -12.397899627685547, "global_step": 357453, "epoch": 2127} {"train_loss": -12.408028602600098, "global_step": 357454, "epoch": 2127} {"train_loss": -12.324647903442383, "global_step": 357455, "epoch": 2127} {"train_loss": -12.484895706176758, "global_step": 357456, "epoch": 2127} {"train_loss": -12.423604011535645, "global_step": 357457, "epoch": 2127} {"train_loss": -12.58771800994873, "global_step": 357458, "epoch": 2127} {"train_loss": -12.464228630065918, "global_step": 357459, "epoch": 2127} {"train_loss": -12.455002784729004, "global_step": 357460, "epoch": 2127} {"train_loss": -12.68792724609375, "global_step": 357461, "epoch": 2127} {"train_loss": -12.398658752441406, "global_step": 357462, "epoch": 2127} {"train_loss": -12.360671997070312, "global_step": 357463, "epoch": 2127} {"train_loss": -12.57255744934082, "global_step": 357464, "epoch": 2127} {"train_loss": -12.475358963012695, "global_step": 357465, "epoch": 2127} {"train_loss": -12.30277156829834, "global_step": 357466, "epoch": 2127} {"train_loss": -12.428561210632324, "global_step": 357467, "epoch": 2127} {"train_loss": -12.665889739990234, "global_step": 357468, "epoch": 2127} {"train_loss": -12.121740341186523, "global_step": 357469, "epoch": 2127} {"train_loss": -12.493558883666992, "global_step": 357470, "epoch": 2127} {"train_loss": -12.393932342529297, "global_step": 357471, "epoch": 2127} {"train_loss": -12.485042572021484, "global_step": 357472, "epoch": 2127} {"train_loss": -12.515176773071289, "global_step": 357473, "epoch": 2127} {"train_loss": -12.486528396606445, "global_step": 357474, "epoch": 2127} {"train_loss": -12.605927467346191, "global_step": 357475, "epoch": 2127} {"train_loss": -12.45472240447998, "global_step": 357476, "epoch": 2127} {"train_loss": -12.745590209960938, "global_step": 357477, "epoch": 2127} {"train_loss": -12.458144187927246, "global_step": 357478, "epoch": 2127} {"train_loss": -12.835947036743164, "global_step": 357479, "epoch": 2127} {"train_loss": -12.428192138671875, "global_step": 357480, "epoch": 2127} {"train_loss": -12.75436019897461, "global_step": 357481, "epoch": 2127} {"train_loss": -12.6765718460083, "global_step": 357482, "epoch": 2127} {"train_loss": -12.629162788391113, "global_step": 357483, "epoch": 2127} {"train_loss": -12.60732650756836, "global_step": 357484, "epoch": 2127} {"train_loss": -12.630565643310547, "global_step": 357485, "epoch": 2127} {"train_loss": -12.50859546661377, "global_step": 357486, "epoch": 2127} {"train_loss": -12.556337356567383, "global_step": 357487, "epoch": 2127} {"train_loss": -12.710359573364258, "global_step": 357488, "epoch": 2127} {"train_loss": -12.300332069396973, "global_step": 357489, "epoch": 2127} {"train_loss": -12.840169906616211, "global_step": 357490, "epoch": 2127} {"train_loss": -12.551753997802734, "global_step": 357491, "epoch": 2127} {"train_loss": -12.446170806884766, "global_step": 357492, "epoch": 2127} {"train_loss": -12.21599006652832, "global_step": 357493, "epoch": 2127} {"train_loss": -12.842218399047852, "global_step": 357494, "epoch": 2127} {"train_loss": -12.593719482421875, "global_step": 357495, "epoch": 2127} {"train_loss": -12.586019515991211, "global_step": 357496, "epoch": 2127} {"train_loss": -12.564313888549805, "global_step": 357497, "epoch": 2127} {"train_loss": -12.665216445922852, "global_step": 357498, "epoch": 2127} {"train_loss": -12.700989723205566, "global_step": 357499, "epoch": 2127} {"train_loss": -12.645660400390625, "global_step": 357500, "epoch": 2127} {"train_loss": -12.754472732543945, "global_step": 357501, "epoch": 2127} {"train_loss": -12.723398208618164, "global_step": 357502, "epoch": 2127} {"train_loss": -11.7124995021593, "global_step": 357503, "epoch": 2127, "val_loss": 289928.875} {"train_loss": -12.85080337524414, "global_step": 357504, "epoch": 2128} {"train_loss": -12.435741424560547, "global_step": 357505, "epoch": 2128} {"train_loss": -12.86172103881836, "global_step": 357506, "epoch": 2128} {"train_loss": -12.702098846435547, "global_step": 357507, "epoch": 2128} {"train_loss": -12.95183277130127, "global_step": 357508, "epoch": 2128} {"train_loss": -12.724571228027344, "global_step": 357509, "epoch": 2128} {"train_loss": -12.660157203674316, "global_step": 357510, "epoch": 2128} {"train_loss": -12.354619979858398, "global_step": 357511, "epoch": 2128} {"train_loss": -12.663902282714844, "global_step": 357512, "epoch": 2128} {"train_loss": -12.369165420532227, "global_step": 357513, "epoch": 2128} {"train_loss": -12.156259536743164, "global_step": 357514, "epoch": 2128} {"train_loss": -12.25002384185791, "global_step": 357515, "epoch": 2128} {"train_loss": -12.106685638427734, "global_step": 357516, "epoch": 2128} {"train_loss": -12.373119354248047, "global_step": 357517, "epoch": 2128} {"train_loss": -12.17184066772461, "global_step": 357518, "epoch": 2128} {"train_loss": -12.303679466247559, "global_step": 357519, "epoch": 2128} {"train_loss": -12.08906364440918, "global_step": 357520, "epoch": 2128} {"train_loss": -12.211212158203125, "global_step": 357521, "epoch": 2128} {"train_loss": -10.72812271118164, "global_step": 357522, "epoch": 2128} {"train_loss": -11.915781021118164, "global_step": 357523, "epoch": 2128} {"train_loss": -11.85696792602539, "global_step": 357524, "epoch": 2128} {"train_loss": -11.795973777770996, "global_step": 357525, "epoch": 2128} {"train_loss": -10.87069320678711, "global_step": 357526, "epoch": 2128} {"train_loss": -11.904251098632812, "global_step": 357527, "epoch": 2128} {"train_loss": -12.191947937011719, "global_step": 357528, "epoch": 2128} {"train_loss": -11.500310897827148, "global_step": 357529, "epoch": 2128} {"train_loss": -11.502058029174805, "global_step": 357530, "epoch": 2128} {"train_loss": -11.453266143798828, "global_step": 357531, "epoch": 2128} {"train_loss": -12.28374195098877, "global_step": 357532, "epoch": 2128} {"train_loss": -11.31842041015625, "global_step": 357533, "epoch": 2128} {"train_loss": -11.2949800491333, "global_step": 357534, "epoch": 2128} {"train_loss": -11.305122375488281, "global_step": 357535, "epoch": 2128} {"train_loss": -12.502346992492676, "global_step": 357536, "epoch": 2128} {"train_loss": -11.81914234161377, "global_step": 357537, "epoch": 2128} {"train_loss": -10.194231986999512, "global_step": 357538, "epoch": 2128} {"train_loss": -11.119020462036133, "global_step": 357539, "epoch": 2128} {"train_loss": -12.213308334350586, "global_step": 357540, "epoch": 2128} {"train_loss": -11.405719757080078, "global_step": 357541, "epoch": 2128} {"train_loss": -10.709234237670898, "global_step": 357542, "epoch": 2128} {"train_loss": -11.495704650878906, "global_step": 357543, "epoch": 2128} {"train_loss": -10.841816902160645, "global_step": 357544, "epoch": 2128} {"train_loss": -9.683579444885254, "global_step": 357545, "epoch": 2128} {"train_loss": -11.9767484664917, "global_step": 357546, "epoch": 2128} {"train_loss": -10.42455005645752, "global_step": 357547, "epoch": 2128} {"train_loss": -10.451562881469727, "global_step": 357548, "epoch": 2128} {"train_loss": -11.718070983886719, "global_step": 357549, "epoch": 2128} {"train_loss": -9.868891716003418, "global_step": 357550, "epoch": 2128} {"train_loss": -10.982484817504883, "global_step": 357551, "epoch": 2128} {"train_loss": -11.284826278686523, "global_step": 357552, "epoch": 2128} {"train_loss": -10.252666473388672, "global_step": 357553, "epoch": 2128} {"train_loss": -11.66196060180664, "global_step": 357554, "epoch": 2128} {"train_loss": -10.72446060180664, "global_step": 357555, "epoch": 2128} {"train_loss": -11.691473007202148, "global_step": 357556, "epoch": 2128} {"train_loss": -11.126642227172852, "global_step": 357557, "epoch": 2128} {"train_loss": -11.232767105102539, "global_step": 357558, "epoch": 2128} {"train_loss": -11.607093811035156, "global_step": 357559, "epoch": 2128} {"train_loss": -11.604330062866211, "global_step": 357560, "epoch": 2128} {"train_loss": -11.662246704101562, "global_step": 357561, "epoch": 2128} {"train_loss": -11.689598083496094, "global_step": 357562, "epoch": 2128} {"train_loss": -11.563316345214844, "global_step": 357563, "epoch": 2128} {"train_loss": -11.613375663757324, "global_step": 357564, "epoch": 2128} {"train_loss": -11.98277473449707, "global_step": 357565, "epoch": 2128} {"train_loss": -11.613728523254395, "global_step": 357566, "epoch": 2128} {"train_loss": -11.819802284240723, "global_step": 357567, "epoch": 2128} {"train_loss": -11.041255950927734, "global_step": 357568, "epoch": 2128} {"train_loss": -11.065943717956543, "global_step": 357569, "epoch": 2128} {"train_loss": -11.89892864227295, "global_step": 357570, "epoch": 2128} {"train_loss": -11.329355239868164, "global_step": 357571, "epoch": 2128} {"train_loss": -11.971449851989746, "global_step": 357572, "epoch": 2128} {"train_loss": -11.72872543334961, "global_step": 357573, "epoch": 2128} {"train_loss": -11.705890655517578, "global_step": 357574, "epoch": 2128} {"train_loss": -12.06593132019043, "global_step": 357575, "epoch": 2128} {"train_loss": -11.220763206481934, "global_step": 357576, "epoch": 2128} {"train_loss": -12.165669441223145, "global_step": 357577, "epoch": 2128} {"train_loss": -11.984601020812988, "global_step": 357578, "epoch": 2128} {"train_loss": -12.175729751586914, "global_step": 357579, "epoch": 2128} {"train_loss": -11.958955764770508, "global_step": 357580, "epoch": 2128} {"train_loss": -11.795496940612793, "global_step": 357581, "epoch": 2128} {"train_loss": -12.020395278930664, "global_step": 357582, "epoch": 2128} {"train_loss": -11.97974967956543, "global_step": 357583, "epoch": 2128} {"train_loss": -11.846460342407227, "global_step": 357584, "epoch": 2128} {"train_loss": -11.950664520263672, "global_step": 357585, "epoch": 2128} {"train_loss": -12.030654907226562, "global_step": 357586, "epoch": 2128} {"train_loss": -12.340675354003906, "global_step": 357587, "epoch": 2128} {"train_loss": -11.683576583862305, "global_step": 357588, "epoch": 2128} {"train_loss": -12.368077278137207, "global_step": 357589, "epoch": 2128} {"train_loss": -12.052846908569336, "global_step": 357590, "epoch": 2128} {"train_loss": -12.406576156616211, "global_step": 357591, "epoch": 2128} {"train_loss": -12.169902801513672, "global_step": 357592, "epoch": 2128} {"train_loss": -12.205923080444336, "global_step": 357593, "epoch": 2128} {"train_loss": -12.3602294921875, "global_step": 357594, "epoch": 2128} {"train_loss": -12.143914222717285, "global_step": 357595, "epoch": 2128} {"train_loss": -12.292823791503906, "global_step": 357596, "epoch": 2128} {"train_loss": -12.474722862243652, "global_step": 357597, "epoch": 2128} {"train_loss": -12.364888191223145, "global_step": 357598, "epoch": 2128} {"train_loss": -12.28044319152832, "global_step": 357599, "epoch": 2128} {"train_loss": -12.364368438720703, "global_step": 357600, "epoch": 2128} {"train_loss": -12.361655235290527, "global_step": 357601, "epoch": 2128} {"train_loss": -12.329622268676758, "global_step": 357602, "epoch": 2128} {"train_loss": -12.44866943359375, "global_step": 357603, "epoch": 2128} {"train_loss": -12.221508026123047, "global_step": 357604, "epoch": 2128} {"train_loss": -12.709757804870605, "global_step": 357605, "epoch": 2128} {"train_loss": -12.494932174682617, "global_step": 357606, "epoch": 2128} {"train_loss": -12.528169631958008, "global_step": 357607, "epoch": 2128} {"train_loss": -12.208703994750977, "global_step": 357608, "epoch": 2128} {"train_loss": -12.541574478149414, "global_step": 357609, "epoch": 2128} {"train_loss": -12.238424301147461, "global_step": 357610, "epoch": 2128} {"train_loss": -12.252462387084961, "global_step": 357611, "epoch": 2128} {"train_loss": -12.32771110534668, "global_step": 357612, "epoch": 2128} {"train_loss": -12.436238288879395, "global_step": 357613, "epoch": 2128} {"train_loss": -12.391881942749023, "global_step": 357614, "epoch": 2128} {"train_loss": -12.313636779785156, "global_step": 357615, "epoch": 2128} {"train_loss": -12.437637329101562, "global_step": 357616, "epoch": 2128} {"train_loss": -12.47871208190918, "global_step": 357617, "epoch": 2128} {"train_loss": -12.573339462280273, "global_step": 357618, "epoch": 2128} {"train_loss": -12.281232833862305, "global_step": 357619, "epoch": 2128} {"train_loss": -12.30506706237793, "global_step": 357620, "epoch": 2128} {"train_loss": -12.490385055541992, "global_step": 357621, "epoch": 2128} {"train_loss": -12.55749225616455, "global_step": 357622, "epoch": 2128} {"train_loss": -12.28525161743164, "global_step": 357623, "epoch": 2128} {"train_loss": -12.695965766906738, "global_step": 357624, "epoch": 2128} {"train_loss": -12.481409072875977, "global_step": 357625, "epoch": 2128} {"train_loss": -12.30870246887207, "global_step": 357626, "epoch": 2128} {"train_loss": -12.218204498291016, "global_step": 357627, "epoch": 2128} {"train_loss": -12.231376647949219, "global_step": 357628, "epoch": 2128} {"train_loss": -12.578638076782227, "global_step": 357629, "epoch": 2128} {"train_loss": -12.33667278289795, "global_step": 357630, "epoch": 2128} {"train_loss": -12.36505126953125, "global_step": 357631, "epoch": 2128} {"train_loss": -12.588913917541504, "global_step": 357632, "epoch": 2128} {"train_loss": -12.085533142089844, "global_step": 357633, "epoch": 2128} {"train_loss": -11.994651794433594, "global_step": 357634, "epoch": 2128} {"train_loss": -12.520544052124023, "global_step": 357635, "epoch": 2128} {"train_loss": -11.764538764953613, "global_step": 357636, "epoch": 2128} {"train_loss": -11.698480606079102, "global_step": 357637, "epoch": 2128} {"train_loss": -12.120431900024414, "global_step": 357638, "epoch": 2128} {"train_loss": -12.443145751953125, "global_step": 357639, "epoch": 2128} {"train_loss": -12.516636848449707, "global_step": 357640, "epoch": 2128} {"train_loss": -11.739662170410156, "global_step": 357641, "epoch": 2128} {"train_loss": -12.09642219543457, "global_step": 357642, "epoch": 2128} {"train_loss": -12.547712326049805, "global_step": 357643, "epoch": 2128} {"train_loss": -12.525565147399902, "global_step": 357644, "epoch": 2128} {"train_loss": -12.270873069763184, "global_step": 357645, "epoch": 2128} {"train_loss": -12.158027648925781, "global_step": 357646, "epoch": 2128} {"train_loss": -12.18808364868164, "global_step": 357647, "epoch": 2128} {"train_loss": -12.344461441040039, "global_step": 357648, "epoch": 2128} {"train_loss": -12.719078063964844, "global_step": 357649, "epoch": 2128} {"train_loss": -12.113649368286133, "global_step": 357650, "epoch": 2128} {"train_loss": -12.28388500213623, "global_step": 357651, "epoch": 2128} {"train_loss": -12.633142471313477, "global_step": 357652, "epoch": 2128} {"train_loss": -12.238950729370117, "global_step": 357653, "epoch": 2128} {"train_loss": -11.108968734741211, "global_step": 357654, "epoch": 2128} {"train_loss": -12.072528839111328, "global_step": 357655, "epoch": 2128} {"train_loss": -12.122062683105469, "global_step": 357656, "epoch": 2128} {"train_loss": -11.871175765991211, "global_step": 357657, "epoch": 2128} {"train_loss": -11.858242988586426, "global_step": 357658, "epoch": 2128} {"train_loss": -12.26280403137207, "global_step": 357659, "epoch": 2128} {"train_loss": -11.522726058959961, "global_step": 357660, "epoch": 2128} {"train_loss": -11.726816177368164, "global_step": 357661, "epoch": 2128} {"train_loss": -12.005674362182617, "global_step": 357662, "epoch": 2128} {"train_loss": -12.293844223022461, "global_step": 357663, "epoch": 2128} {"train_loss": -11.984696388244629, "global_step": 357664, "epoch": 2128} {"train_loss": -11.78992748260498, "global_step": 357665, "epoch": 2128} {"train_loss": -11.995219230651855, "global_step": 357666, "epoch": 2128} {"train_loss": -12.166133880615234, "global_step": 357667, "epoch": 2128} {"train_loss": -12.55115795135498, "global_step": 357668, "epoch": 2128} {"train_loss": -11.774686813354492, "global_step": 357669, "epoch": 2128} {"train_loss": -10.923364639282227, "global_step": 357670, "epoch": 2128} {"train_loss": -11.960252523422241, "global_step": 357671, "epoch": 2128, "val_loss": 291173.375} {"train_loss": -11.656003952026367, "global_step": 357672, "epoch": 2129} {"train_loss": -11.822746276855469, "global_step": 357673, "epoch": 2129} {"train_loss": -10.864616394042969, "global_step": 357674, "epoch": 2129} {"train_loss": -11.594047546386719, "global_step": 357675, "epoch": 2129} {"train_loss": -10.650962829589844, "global_step": 357676, "epoch": 2129} {"train_loss": -11.521100997924805, "global_step": 357677, "epoch": 2129} {"train_loss": -11.582677841186523, "global_step": 357678, "epoch": 2129} {"train_loss": -12.17039680480957, "global_step": 357679, "epoch": 2129} {"train_loss": -11.350086212158203, "global_step": 357680, "epoch": 2129} {"train_loss": -12.010200500488281, "global_step": 357681, "epoch": 2129} {"train_loss": -11.69277572631836, "global_step": 357682, "epoch": 2129} {"train_loss": -11.3369722366333, "global_step": 357683, "epoch": 2129} {"train_loss": -11.809036254882812, "global_step": 357684, "epoch": 2129} {"train_loss": -11.885984420776367, "global_step": 357685, "epoch": 2129} {"train_loss": -11.940521240234375, "global_step": 357686, "epoch": 2129} {"train_loss": -11.152573585510254, "global_step": 357687, "epoch": 2129} {"train_loss": -11.38566780090332, "global_step": 357688, "epoch": 2129} {"train_loss": -11.532804489135742, "global_step": 357689, "epoch": 2129} {"train_loss": -11.914933204650879, "global_step": 357690, "epoch": 2129} {"train_loss": -11.933876037597656, "global_step": 357691, "epoch": 2129} {"train_loss": -12.309646606445312, "global_step": 357692, "epoch": 2129} {"train_loss": -11.883906364440918, "global_step": 357693, "epoch": 2129} {"train_loss": -12.342719078063965, "global_step": 357694, "epoch": 2129} {"train_loss": -12.053882598876953, "global_step": 357695, "epoch": 2129} {"train_loss": -11.972857475280762, "global_step": 357696, "epoch": 2129} {"train_loss": -12.479232788085938, "global_step": 357697, "epoch": 2129} {"train_loss": -12.137328147888184, "global_step": 357698, "epoch": 2129} {"train_loss": -12.372296333312988, "global_step": 357699, "epoch": 2129} {"train_loss": -12.05363941192627, "global_step": 357700, "epoch": 2129} {"train_loss": -12.066680908203125, "global_step": 357701, "epoch": 2129} {"train_loss": -12.195714950561523, "global_step": 357702, "epoch": 2129} {"train_loss": -11.161745071411133, "global_step": 357703, "epoch": 2129} {"train_loss": -12.268465042114258, "global_step": 357704, "epoch": 2129} {"train_loss": -11.949638366699219, "global_step": 357705, "epoch": 2129} {"train_loss": -11.880216598510742, "global_step": 357706, "epoch": 2129} {"train_loss": -12.080568313598633, "global_step": 357707, "epoch": 2129} {"train_loss": -12.032964706420898, "global_step": 357708, "epoch": 2129} {"train_loss": -12.087078094482422, "global_step": 357709, "epoch": 2129} {"train_loss": -12.099918365478516, "global_step": 357710, "epoch": 2129} {"train_loss": -12.150749206542969, "global_step": 357711, "epoch": 2129} {"train_loss": -12.43124771118164, "global_step": 357712, "epoch": 2129} {"train_loss": -11.93144416809082, "global_step": 357713, "epoch": 2129} {"train_loss": -12.471833229064941, "global_step": 357714, "epoch": 2129} {"train_loss": -11.611307144165039, "global_step": 357715, "epoch": 2129} {"train_loss": -12.340559959411621, "global_step": 357716, "epoch": 2129} {"train_loss": -11.969669342041016, "global_step": 357717, "epoch": 2129} {"train_loss": -12.243253707885742, "global_step": 357718, "epoch": 2129} {"train_loss": -12.284664154052734, "global_step": 357719, "epoch": 2129} {"train_loss": -11.672538757324219, "global_step": 357720, "epoch": 2129} {"train_loss": -12.251829147338867, "global_step": 357721, "epoch": 2129} {"train_loss": -11.85647201538086, "global_step": 357722, "epoch": 2129} {"train_loss": -12.305293083190918, "global_step": 357723, "epoch": 2129} {"train_loss": -11.948193550109863, "global_step": 357724, "epoch": 2129} {"train_loss": -12.186327934265137, "global_step": 357725, "epoch": 2129} {"train_loss": -11.948118209838867, "global_step": 357726, "epoch": 2129} {"train_loss": -11.932880401611328, "global_step": 357727, "epoch": 2129} {"train_loss": -12.158666610717773, "global_step": 357728, "epoch": 2129} {"train_loss": -12.219568252563477, "global_step": 357729, "epoch": 2129} {"train_loss": -11.992741584777832, "global_step": 357730, "epoch": 2129} {"train_loss": -12.22507381439209, "global_step": 357731, "epoch": 2129} {"train_loss": -12.146677017211914, "global_step": 357732, "epoch": 2129} {"train_loss": -12.139364242553711, "global_step": 357733, "epoch": 2129} {"train_loss": -12.326486587524414, "global_step": 357734, "epoch": 2129} {"train_loss": -12.275680541992188, "global_step": 357735, "epoch": 2129} {"train_loss": -12.157289505004883, "global_step": 357736, "epoch": 2129} {"train_loss": -12.186098098754883, "global_step": 357737, "epoch": 2129} {"train_loss": -12.574596405029297, "global_step": 357738, "epoch": 2129} {"train_loss": -12.071041107177734, "global_step": 357739, "epoch": 2129} {"train_loss": -12.29745864868164, "global_step": 357740, "epoch": 2129} {"train_loss": -11.863603591918945, "global_step": 357741, "epoch": 2129} {"train_loss": -11.973522186279297, "global_step": 357742, "epoch": 2129} {"train_loss": -11.828811645507812, "global_step": 357743, "epoch": 2129} {"train_loss": -11.719501495361328, "global_step": 357744, "epoch": 2129} {"train_loss": -12.213849067687988, "global_step": 357745, "epoch": 2129} {"train_loss": -11.96365737915039, "global_step": 357746, "epoch": 2129} {"train_loss": -11.247862815856934, "global_step": 357747, "epoch": 2129} {"train_loss": -12.262680053710938, "global_step": 357748, "epoch": 2129} {"train_loss": -11.76773738861084, "global_step": 357749, "epoch": 2129} {"train_loss": -11.311967849731445, "global_step": 357750, "epoch": 2129} {"train_loss": -12.154415130615234, "global_step": 357751, "epoch": 2129} {"train_loss": -10.400107383728027, "global_step": 357752, "epoch": 2129} {"train_loss": -11.66258430480957, "global_step": 357753, "epoch": 2129} {"train_loss": -11.52359390258789, "global_step": 357754, "epoch": 2129} {"train_loss": -11.614913940429688, "global_step": 357755, "epoch": 2129} {"train_loss": -11.00460433959961, "global_step": 357756, "epoch": 2129} {"train_loss": -11.67239761352539, "global_step": 357757, "epoch": 2129} {"train_loss": -11.243009567260742, "global_step": 357758, "epoch": 2129} {"train_loss": -10.049062728881836, "global_step": 357759, "epoch": 2129} {"train_loss": -11.873764991760254, "global_step": 357760, "epoch": 2129} {"train_loss": -10.338714599609375, "global_step": 357761, "epoch": 2129} {"train_loss": -11.63177490234375, "global_step": 357762, "epoch": 2129} {"train_loss": -11.43055248260498, "global_step": 357763, "epoch": 2129} {"train_loss": -10.989304542541504, "global_step": 357764, "epoch": 2129} {"train_loss": -11.21788215637207, "global_step": 357765, "epoch": 2129} {"train_loss": -10.510650634765625, "global_step": 357766, "epoch": 2129} {"train_loss": -11.14460277557373, "global_step": 357767, "epoch": 2129} {"train_loss": -11.435598373413086, "global_step": 357768, "epoch": 2129} {"train_loss": -10.283808708190918, "global_step": 357769, "epoch": 2129} {"train_loss": -11.933185577392578, "global_step": 357770, "epoch": 2129} {"train_loss": -10.414172172546387, "global_step": 357771, "epoch": 2129} {"train_loss": -10.75916862487793, "global_step": 357772, "epoch": 2129} {"train_loss": -11.627710342407227, "global_step": 357773, "epoch": 2129} {"train_loss": -10.374433517456055, "global_step": 357774, "epoch": 2129} {"train_loss": -11.846017837524414, "global_step": 357775, "epoch": 2129} {"train_loss": -10.892378807067871, "global_step": 357776, "epoch": 2129} {"train_loss": -11.015347480773926, "global_step": 357777, "epoch": 2129} {"train_loss": -12.1555814743042, "global_step": 357778, "epoch": 2129} {"train_loss": -10.992547035217285, "global_step": 357779, "epoch": 2129} {"train_loss": -11.675559043884277, "global_step": 357780, "epoch": 2129} {"train_loss": -11.692598342895508, "global_step": 357781, "epoch": 2129} {"train_loss": -11.515937805175781, "global_step": 357782, "epoch": 2129} {"train_loss": -11.8158597946167, "global_step": 357783, "epoch": 2129} {"train_loss": -11.066396713256836, "global_step": 357784, "epoch": 2129} {"train_loss": -12.187629699707031, "global_step": 357785, "epoch": 2129} {"train_loss": -11.65789794921875, "global_step": 357786, "epoch": 2129} {"train_loss": -11.695451736450195, "global_step": 357787, "epoch": 2129} {"train_loss": -12.089727401733398, "global_step": 357788, "epoch": 2129} {"train_loss": -11.661940574645996, "global_step": 357789, "epoch": 2129} {"train_loss": -12.143186569213867, "global_step": 357790, "epoch": 2129} {"train_loss": -11.91202449798584, "global_step": 357791, "epoch": 2129} {"train_loss": -11.854538917541504, "global_step": 357792, "epoch": 2129} {"train_loss": -11.875624656677246, "global_step": 357793, "epoch": 2129} {"train_loss": -11.981582641601562, "global_step": 357794, "epoch": 2129} {"train_loss": -11.701860427856445, "global_step": 357795, "epoch": 2129} {"train_loss": -12.066328048706055, "global_step": 357796, "epoch": 2129} {"train_loss": -11.990713119506836, "global_step": 357797, "epoch": 2129} {"train_loss": -11.996321678161621, "global_step": 357798, "epoch": 2129} {"train_loss": -12.187491416931152, "global_step": 357799, "epoch": 2129} {"train_loss": -11.937034606933594, "global_step": 357800, "epoch": 2129} {"train_loss": -12.358333587646484, "global_step": 357801, "epoch": 2129} {"train_loss": -12.081747055053711, "global_step": 357802, "epoch": 2129} {"train_loss": -12.306360244750977, "global_step": 357803, "epoch": 2129} {"train_loss": -11.832319259643555, "global_step": 357804, "epoch": 2129} {"train_loss": -12.240804672241211, "global_step": 357805, "epoch": 2129} {"train_loss": -12.123796463012695, "global_step": 357806, "epoch": 2129} {"train_loss": -12.37507152557373, "global_step": 357807, "epoch": 2129} {"train_loss": -11.919697761535645, "global_step": 357808, "epoch": 2129} {"train_loss": -12.290718078613281, "global_step": 357809, "epoch": 2129} {"train_loss": -12.315613746643066, "global_step": 357810, "epoch": 2129} {"train_loss": -12.030062675476074, "global_step": 357811, "epoch": 2129} {"train_loss": -12.248722076416016, "global_step": 357812, "epoch": 2129} {"train_loss": -12.088075637817383, "global_step": 357813, "epoch": 2129} {"train_loss": -12.343572616577148, "global_step": 357814, "epoch": 2129} {"train_loss": -12.460813522338867, "global_step": 357815, "epoch": 2129} {"train_loss": -12.091955184936523, "global_step": 357816, "epoch": 2129} {"train_loss": -12.351527214050293, "global_step": 357817, "epoch": 2129} {"train_loss": -12.451613426208496, "global_step": 357818, "epoch": 2129} {"train_loss": -12.360641479492188, "global_step": 357819, "epoch": 2129} {"train_loss": -12.425771713256836, "global_step": 357820, "epoch": 2129} {"train_loss": -12.439109802246094, "global_step": 357821, "epoch": 2129} {"train_loss": -12.45977783203125, "global_step": 357822, "epoch": 2129} {"train_loss": -12.62251091003418, "global_step": 357823, "epoch": 2129} {"train_loss": -12.263940811157227, "global_step": 357824, "epoch": 2129} {"train_loss": -12.516090393066406, "global_step": 357825, "epoch": 2129} {"train_loss": -12.480533599853516, "global_step": 357826, "epoch": 2129} {"train_loss": -12.615518569946289, "global_step": 357827, "epoch": 2129} {"train_loss": -12.559746742248535, "global_step": 357828, "epoch": 2129} {"train_loss": -12.49599838256836, "global_step": 357829, "epoch": 2129} {"train_loss": -12.521525382995605, "global_step": 357830, "epoch": 2129} {"train_loss": -12.471259117126465, "global_step": 357831, "epoch": 2129} {"train_loss": -12.507711410522461, "global_step": 357832, "epoch": 2129} {"train_loss": -12.608142852783203, "global_step": 357833, "epoch": 2129} {"train_loss": -12.448546409606934, "global_step": 357834, "epoch": 2129} {"train_loss": -12.628551483154297, "global_step": 357835, "epoch": 2129} {"train_loss": -12.614341735839844, "global_step": 357836, "epoch": 2129} {"train_loss": -12.643131256103516, "global_step": 357837, "epoch": 2129} {"train_loss": -12.661144256591797, "global_step": 357838, "epoch": 2129} {"train_loss": -11.901265388443356, "global_step": 357839, "epoch": 2129, "val_loss": 289795.84375} {"train_loss": -12.585506439208984, "global_step": 357840, "epoch": 2130} {"train_loss": -12.396647453308105, "global_step": 357841, "epoch": 2130} {"train_loss": -12.621667861938477, "global_step": 357842, "epoch": 2130} {"train_loss": -12.348123550415039, "global_step": 357843, "epoch": 2130} {"train_loss": -12.595592498779297, "global_step": 357844, "epoch": 2130} {"train_loss": -12.544763565063477, "global_step": 357845, "epoch": 2130} {"train_loss": -12.404366493225098, "global_step": 357846, "epoch": 2130} {"train_loss": -12.754154205322266, "global_step": 357847, "epoch": 2130} {"train_loss": -12.583510398864746, "global_step": 357848, "epoch": 2130} {"train_loss": -12.761298179626465, "global_step": 357849, "epoch": 2130} {"train_loss": -12.479242324829102, "global_step": 357850, "epoch": 2130} {"train_loss": -12.714827537536621, "global_step": 357851, "epoch": 2130} {"train_loss": -12.774103164672852, "global_step": 357852, "epoch": 2130} {"train_loss": -12.589126586914062, "global_step": 357853, "epoch": 2130} {"train_loss": -12.70107650756836, "global_step": 357854, "epoch": 2130} {"train_loss": -12.859813690185547, "global_step": 357855, "epoch": 2130} {"train_loss": -12.722867965698242, "global_step": 357856, "epoch": 2130} {"train_loss": -12.651524543762207, "global_step": 357857, "epoch": 2130} {"train_loss": -12.63397216796875, "global_step": 357858, "epoch": 2130} {"train_loss": -12.654935836791992, "global_step": 357859, "epoch": 2130} {"train_loss": -12.564294815063477, "global_step": 357860, "epoch": 2130} {"train_loss": -12.473258018493652, "global_step": 357861, "epoch": 2130} {"train_loss": -12.44140625, "global_step": 357862, "epoch": 2130} {"train_loss": -12.432762145996094, "global_step": 357863, "epoch": 2130} {"train_loss": -12.696943283081055, "global_step": 357864, "epoch": 2130} {"train_loss": -12.794318199157715, "global_step": 357865, "epoch": 2130} {"train_loss": -12.328819274902344, "global_step": 357866, "epoch": 2130} {"train_loss": -11.985419273376465, "global_step": 357867, "epoch": 2130} {"train_loss": -12.083141326904297, "global_step": 357868, "epoch": 2130} {"train_loss": -12.798816680908203, "global_step": 357869, "epoch": 2130} {"train_loss": -12.565712928771973, "global_step": 357870, "epoch": 2130} {"train_loss": -12.006206512451172, "global_step": 357871, "epoch": 2130} {"train_loss": -12.085445404052734, "global_step": 357872, "epoch": 2130} {"train_loss": -12.063872337341309, "global_step": 357873, "epoch": 2130} {"train_loss": -12.248578071594238, "global_step": 357874, "epoch": 2130} {"train_loss": -10.8234224319458, "global_step": 357875, "epoch": 2130} {"train_loss": -11.051033020019531, "global_step": 357876, "epoch": 2130} {"train_loss": -11.661876678466797, "global_step": 357877, "epoch": 2130} {"train_loss": -12.07818603515625, "global_step": 357878, "epoch": 2130} {"train_loss": -12.027538299560547, "global_step": 357879, "epoch": 2130} {"train_loss": -10.817883491516113, "global_step": 357880, "epoch": 2130} {"train_loss": -12.06559944152832, "global_step": 357881, "epoch": 2130} {"train_loss": -9.762042999267578, "global_step": 357882, "epoch": 2130} {"train_loss": -9.392895698547363, "global_step": 357883, "epoch": 2130} {"train_loss": -10.178181648254395, "global_step": 357884, "epoch": 2130} {"train_loss": -9.637035369873047, "global_step": 357885, "epoch": 2130} {"train_loss": -9.064644813537598, "global_step": 357886, "epoch": 2130} {"train_loss": -8.154495239257812, "global_step": 357887, "epoch": 2130} {"train_loss": -8.72507095336914, "global_step": 357888, "epoch": 2130} {"train_loss": -9.319278717041016, "global_step": 357889, "epoch": 2130} {"train_loss": -10.128585815429688, "global_step": 357890, "epoch": 2130} {"train_loss": -9.229826927185059, "global_step": 357891, "epoch": 2130} {"train_loss": -8.035646438598633, "global_step": 357892, "epoch": 2130} {"train_loss": -9.118249893188477, "global_step": 357893, "epoch": 2130} {"train_loss": -8.664482116699219, "global_step": 357894, "epoch": 2130} {"train_loss": -9.120750427246094, "global_step": 357895, "epoch": 2130} {"train_loss": -9.447099685668945, "global_step": 357896, "epoch": 2130} {"train_loss": -9.914600372314453, "global_step": 357897, "epoch": 2130} {"train_loss": -9.46262264251709, "global_step": 357898, "epoch": 2130} {"train_loss": -9.994867324829102, "global_step": 357899, "epoch": 2130} {"train_loss": -10.928019523620605, "global_step": 357900, "epoch": 2130} {"train_loss": -9.928519248962402, "global_step": 357901, "epoch": 2130} {"train_loss": -9.762463569641113, "global_step": 357902, "epoch": 2130} {"train_loss": -10.863014221191406, "global_step": 357903, "epoch": 2130} {"train_loss": -9.039239883422852, "global_step": 357904, "epoch": 2130} {"train_loss": -10.315559387207031, "global_step": 357905, "epoch": 2130} {"train_loss": -10.975772857666016, "global_step": 357906, "epoch": 2130} {"train_loss": -9.996050834655762, "global_step": 357907, "epoch": 2130} {"train_loss": -10.475883483886719, "global_step": 357908, "epoch": 2130} {"train_loss": -11.108381271362305, "global_step": 357909, "epoch": 2130} {"train_loss": -10.806039810180664, "global_step": 357910, "epoch": 2130} {"train_loss": -11.196107864379883, "global_step": 357911, "epoch": 2130} {"train_loss": -11.228233337402344, "global_step": 357912, "epoch": 2130} {"train_loss": -11.114797592163086, "global_step": 357913, "epoch": 2130} {"train_loss": -10.955344200134277, "global_step": 357914, "epoch": 2130} {"train_loss": -11.504255294799805, "global_step": 357915, "epoch": 2130} {"train_loss": -11.948827743530273, "global_step": 357916, "epoch": 2130} {"train_loss": -11.741349220275879, "global_step": 357917, "epoch": 2130} {"train_loss": -12.065784454345703, "global_step": 357918, "epoch": 2130} {"train_loss": -11.928577423095703, "global_step": 357919, "epoch": 2130} {"train_loss": -11.613826751708984, "global_step": 357920, "epoch": 2130} {"train_loss": -11.847790718078613, "global_step": 357921, "epoch": 2130} {"train_loss": -11.791618347167969, "global_step": 357922, "epoch": 2130} {"train_loss": -11.869653701782227, "global_step": 357923, "epoch": 2130} {"train_loss": -11.769279479980469, "global_step": 357924, "epoch": 2130} {"train_loss": -11.226760864257812, "global_step": 357925, "epoch": 2130} {"train_loss": -12.019706726074219, "global_step": 357926, "epoch": 2130} {"train_loss": -11.276320457458496, "global_step": 357927, "epoch": 2130} {"train_loss": -11.909260749816895, "global_step": 357928, "epoch": 2130} {"train_loss": -11.671464920043945, "global_step": 357929, "epoch": 2130} {"train_loss": -11.741072654724121, "global_step": 357930, "epoch": 2130} {"train_loss": -12.214824676513672, "global_step": 357931, "epoch": 2130} {"train_loss": -11.71446418762207, "global_step": 357932, "epoch": 2130} {"train_loss": -11.930313110351562, "global_step": 357933, "epoch": 2130} {"train_loss": -12.04690170288086, "global_step": 357934, "epoch": 2130} {"train_loss": -12.005839347839355, "global_step": 357935, "epoch": 2130} {"train_loss": -11.957500457763672, "global_step": 357936, "epoch": 2130} {"train_loss": -12.041380882263184, "global_step": 357937, "epoch": 2130} {"train_loss": -11.970836639404297, "global_step": 357938, "epoch": 2130} {"train_loss": -12.225027084350586, "global_step": 357939, "epoch": 2130} {"train_loss": -11.958776473999023, "global_step": 357940, "epoch": 2130} {"train_loss": -12.222939491271973, "global_step": 357941, "epoch": 2130} {"train_loss": -12.036003112792969, "global_step": 357942, "epoch": 2130} {"train_loss": -12.087462425231934, "global_step": 357943, "epoch": 2130} {"train_loss": -12.172880172729492, "global_step": 357944, "epoch": 2130} {"train_loss": -11.969229698181152, "global_step": 357945, "epoch": 2130} {"train_loss": -12.30770492553711, "global_step": 357946, "epoch": 2130} {"train_loss": -12.19023323059082, "global_step": 357947, "epoch": 2130} {"train_loss": -11.919800758361816, "global_step": 357948, "epoch": 2130} {"train_loss": -12.119070053100586, "global_step": 357949, "epoch": 2130} {"train_loss": -12.08470630645752, "global_step": 357950, "epoch": 2130} {"train_loss": -12.236896514892578, "global_step": 357951, "epoch": 2130} {"train_loss": -12.193469047546387, "global_step": 357952, "epoch": 2130} {"train_loss": -12.361610412597656, "global_step": 357953, "epoch": 2130} {"train_loss": -12.233504295349121, "global_step": 357954, "epoch": 2130} {"train_loss": -12.238770484924316, "global_step": 357955, "epoch": 2130} {"train_loss": -12.146263122558594, "global_step": 357956, "epoch": 2130} {"train_loss": -12.396475791931152, "global_step": 357957, "epoch": 2130} {"train_loss": -12.325993537902832, "global_step": 357958, "epoch": 2130} {"train_loss": -12.37916374206543, "global_step": 357959, "epoch": 2130} {"train_loss": -12.312056541442871, "global_step": 357960, "epoch": 2130} {"train_loss": -12.373619079589844, "global_step": 357961, "epoch": 2130} {"train_loss": -12.222713470458984, "global_step": 357962, "epoch": 2130} {"train_loss": -12.618082046508789, "global_step": 357963, "epoch": 2130} {"train_loss": -12.47383975982666, "global_step": 357964, "epoch": 2130} {"train_loss": -12.156539916992188, "global_step": 357965, "epoch": 2130} {"train_loss": -12.324604034423828, "global_step": 357966, "epoch": 2130} {"train_loss": -12.131048202514648, "global_step": 357967, "epoch": 2130} {"train_loss": -12.574565887451172, "global_step": 357968, "epoch": 2130} {"train_loss": -12.443244934082031, "global_step": 357969, "epoch": 2130} {"train_loss": -12.398902893066406, "global_step": 357970, "epoch": 2130} {"train_loss": -12.37172794342041, "global_step": 357971, "epoch": 2130} {"train_loss": -12.671565055847168, "global_step": 357972, "epoch": 2130} {"train_loss": -12.63439655303955, "global_step": 357973, "epoch": 2130} {"train_loss": -12.269499778747559, "global_step": 357974, "epoch": 2130} {"train_loss": -12.645265579223633, "global_step": 357975, "epoch": 2130} {"train_loss": -12.567316055297852, "global_step": 357976, "epoch": 2130} {"train_loss": -12.420076370239258, "global_step": 357977, "epoch": 2130} {"train_loss": -12.574774742126465, "global_step": 357978, "epoch": 2130} {"train_loss": -12.442262649536133, "global_step": 357979, "epoch": 2130} {"train_loss": -12.491891860961914, "global_step": 357980, "epoch": 2130} {"train_loss": -12.540837287902832, "global_step": 357981, "epoch": 2130} {"train_loss": -12.522789001464844, "global_step": 357982, "epoch": 2130} {"train_loss": -12.583308219909668, "global_step": 357983, "epoch": 2130} {"train_loss": -12.669135093688965, "global_step": 357984, "epoch": 2130} {"train_loss": -12.538522720336914, "global_step": 357985, "epoch": 2130} {"train_loss": -12.687082290649414, "global_step": 357986, "epoch": 2130} {"train_loss": -12.700788497924805, "global_step": 357987, "epoch": 2130} {"train_loss": -12.555692672729492, "global_step": 357988, "epoch": 2130} {"train_loss": -12.782434463500977, "global_step": 357989, "epoch": 2130} {"train_loss": -12.689872741699219, "global_step": 357990, "epoch": 2130} {"train_loss": -12.798139572143555, "global_step": 357991, "epoch": 2130} {"train_loss": -12.705741882324219, "global_step": 357992, "epoch": 2130} {"train_loss": -12.654291152954102, "global_step": 357993, "epoch": 2130} {"train_loss": -12.856674194335938, "global_step": 357994, "epoch": 2130} {"train_loss": -12.739824295043945, "global_step": 357995, "epoch": 2130} {"train_loss": -12.749773025512695, "global_step": 357996, "epoch": 2130} {"train_loss": -12.644160270690918, "global_step": 357997, "epoch": 2130} {"train_loss": -12.693973541259766, "global_step": 357998, "epoch": 2130} {"train_loss": -12.92185115814209, "global_step": 357999, "epoch": 2130} {"train_loss": -12.643645286560059, "global_step": 358000, "epoch": 2130} {"train_loss": -12.787332534790039, "global_step": 358001, "epoch": 2130} {"train_loss": -12.673334121704102, "global_step": 358002, "epoch": 2130} {"train_loss": -12.778305053710938, "global_step": 358003, "epoch": 2130} {"train_loss": -12.688020706176758, "global_step": 358004, "epoch": 2130} {"train_loss": -12.908122062683105, "global_step": 358005, "epoch": 2130} {"train_loss": -12.657791137695312, "global_step": 358006, "epoch": 2130} {"train_loss": -11.834925589107332, "global_step": 358007, "epoch": 2130, "val_loss": 284761.125, "train_action_mse_error": 0.938752293586731} {"train_loss": -12.667436599731445, "global_step": 358008, "epoch": 2131} {"train_loss": -12.983648300170898, "global_step": 358009, "epoch": 2131} {"train_loss": -12.650720596313477, "global_step": 358010, "epoch": 2131} {"train_loss": -12.947385787963867, "global_step": 358011, "epoch": 2131} {"train_loss": -12.727740287780762, "global_step": 358012, "epoch": 2131} {"train_loss": -12.854266166687012, "global_step": 358013, "epoch": 2131} {"train_loss": -12.783899307250977, "global_step": 358014, "epoch": 2131} {"train_loss": -12.94011116027832, "global_step": 358015, "epoch": 2131} {"train_loss": -12.591392517089844, "global_step": 358016, "epoch": 2131} {"train_loss": -12.732915878295898, "global_step": 358017, "epoch": 2131} {"train_loss": -12.530790328979492, "global_step": 358018, "epoch": 2131} {"train_loss": -12.695419311523438, "global_step": 358019, "epoch": 2131} {"train_loss": -12.8820219039917, "global_step": 358020, "epoch": 2131} {"train_loss": -12.656439781188965, "global_step": 358021, "epoch": 2131} {"train_loss": -12.558500289916992, "global_step": 358022, "epoch": 2131} {"train_loss": -12.193117141723633, "global_step": 358023, "epoch": 2131} {"train_loss": -11.912014961242676, "global_step": 358024, "epoch": 2131} {"train_loss": -11.719003677368164, "global_step": 358025, "epoch": 2131} {"train_loss": -11.315835952758789, "global_step": 358026, "epoch": 2131} {"train_loss": -11.245841026306152, "global_step": 358027, "epoch": 2131} {"train_loss": -10.577841758728027, "global_step": 358028, "epoch": 2131} {"train_loss": -12.097004890441895, "global_step": 358029, "epoch": 2131} {"train_loss": -10.34219741821289, "global_step": 358030, "epoch": 2131} {"train_loss": -12.184286117553711, "global_step": 358031, "epoch": 2131} {"train_loss": -10.662755966186523, "global_step": 358032, "epoch": 2131} {"train_loss": -11.927897453308105, "global_step": 358033, "epoch": 2131} {"train_loss": -11.414901733398438, "global_step": 358034, "epoch": 2131} {"train_loss": -11.856721878051758, "global_step": 358035, "epoch": 2131} {"train_loss": -11.311450958251953, "global_step": 358036, "epoch": 2131} {"train_loss": -12.275232315063477, "global_step": 358037, "epoch": 2131} {"train_loss": -11.637468338012695, "global_step": 358038, "epoch": 2131} {"train_loss": -12.209152221679688, "global_step": 358039, "epoch": 2131} {"train_loss": -11.854782104492188, "global_step": 358040, "epoch": 2131} {"train_loss": -12.066408157348633, "global_step": 358041, "epoch": 2131} {"train_loss": -11.86331558227539, "global_step": 358042, "epoch": 2131} {"train_loss": -11.840042114257812, "global_step": 358043, "epoch": 2131} {"train_loss": -11.176162719726562, "global_step": 358044, "epoch": 2131} {"train_loss": -11.991201400756836, "global_step": 358045, "epoch": 2131} {"train_loss": -12.059134483337402, "global_step": 358046, "epoch": 2131} {"train_loss": -11.507192611694336, "global_step": 358047, "epoch": 2131} {"train_loss": -11.309952735900879, "global_step": 358048, "epoch": 2131} {"train_loss": -12.119770050048828, "global_step": 358049, "epoch": 2131} {"train_loss": -12.226444244384766, "global_step": 358050, "epoch": 2131} {"train_loss": -11.916934967041016, "global_step": 358051, "epoch": 2131} {"train_loss": -11.431661605834961, "global_step": 358052, "epoch": 2131} {"train_loss": -10.013931274414062, "global_step": 358053, "epoch": 2131} {"train_loss": -10.858526229858398, "global_step": 358054, "epoch": 2131} {"train_loss": -11.987994194030762, "global_step": 358055, "epoch": 2131} {"train_loss": -12.200311660766602, "global_step": 358056, "epoch": 2131} {"train_loss": -11.68190860748291, "global_step": 358057, "epoch": 2131} {"train_loss": -12.30691146850586, "global_step": 358058, "epoch": 2131} {"train_loss": -12.212890625, "global_step": 358059, "epoch": 2131} {"train_loss": -12.02056884765625, "global_step": 358060, "epoch": 2131} {"train_loss": -12.188833236694336, "global_step": 358061, "epoch": 2131} {"train_loss": -12.116718292236328, "global_step": 358062, "epoch": 2131} {"train_loss": -11.652067184448242, "global_step": 358063, "epoch": 2131} {"train_loss": -11.940946578979492, "global_step": 358064, "epoch": 2131} {"train_loss": -11.725040435791016, "global_step": 358065, "epoch": 2131} {"train_loss": -11.728525161743164, "global_step": 358066, "epoch": 2131} {"train_loss": -11.57567024230957, "global_step": 358067, "epoch": 2131} {"train_loss": -11.513712882995605, "global_step": 358068, "epoch": 2131} {"train_loss": -12.038684844970703, "global_step": 358069, "epoch": 2131} {"train_loss": -11.292546272277832, "global_step": 358070, "epoch": 2131} {"train_loss": -11.880071640014648, "global_step": 358071, "epoch": 2131} {"train_loss": -11.845281600952148, "global_step": 358072, "epoch": 2131} {"train_loss": -11.763765335083008, "global_step": 358073, "epoch": 2131} {"train_loss": -11.769363403320312, "global_step": 358074, "epoch": 2131} {"train_loss": -11.739646911621094, "global_step": 358075, "epoch": 2131} {"train_loss": -11.965594291687012, "global_step": 358076, "epoch": 2131} {"train_loss": -11.444202423095703, "global_step": 358077, "epoch": 2131} {"train_loss": -12.577170372009277, "global_step": 358078, "epoch": 2131} {"train_loss": -11.373003005981445, "global_step": 358079, "epoch": 2131} {"train_loss": -11.8846435546875, "global_step": 358080, "epoch": 2131} {"train_loss": -11.083667755126953, "global_step": 358081, "epoch": 2131} {"train_loss": -11.50197696685791, "global_step": 358082, "epoch": 2131} {"train_loss": -11.549074172973633, "global_step": 358083, "epoch": 2131} {"train_loss": -11.179656982421875, "global_step": 358084, "epoch": 2131} {"train_loss": -12.443765640258789, "global_step": 358085, "epoch": 2131} {"train_loss": -11.660975456237793, "global_step": 358086, "epoch": 2131} {"train_loss": -11.978889465332031, "global_step": 358087, "epoch": 2131} {"train_loss": -11.572819709777832, "global_step": 358088, "epoch": 2131} {"train_loss": -11.906058311462402, "global_step": 358089, "epoch": 2131} {"train_loss": -12.073060989379883, "global_step": 358090, "epoch": 2131} {"train_loss": -11.64982795715332, "global_step": 358091, "epoch": 2131} {"train_loss": -11.84537124633789, "global_step": 358092, "epoch": 2131} {"train_loss": -11.699026107788086, "global_step": 358093, "epoch": 2131} {"train_loss": -11.437722206115723, "global_step": 358094, "epoch": 2131} {"train_loss": -12.081872940063477, "global_step": 358095, "epoch": 2131} {"train_loss": -11.78427505493164, "global_step": 358096, "epoch": 2131} {"train_loss": -11.534488677978516, "global_step": 358097, "epoch": 2131} {"train_loss": -12.265039443969727, "global_step": 358098, "epoch": 2131} {"train_loss": -11.426021575927734, "global_step": 358099, "epoch": 2131} {"train_loss": -12.125004768371582, "global_step": 358100, "epoch": 2131} {"train_loss": -12.01020622253418, "global_step": 358101, "epoch": 2131} {"train_loss": -12.028432846069336, "global_step": 358102, "epoch": 2131} {"train_loss": -12.368309020996094, "global_step": 358103, "epoch": 2131} {"train_loss": -12.095327377319336, "global_step": 358104, "epoch": 2131} {"train_loss": -12.11681842803955, "global_step": 358105, "epoch": 2131} {"train_loss": -12.093364715576172, "global_step": 358106, "epoch": 2131} {"train_loss": -12.215924263000488, "global_step": 358107, "epoch": 2131} {"train_loss": -11.740959167480469, "global_step": 358108, "epoch": 2131} {"train_loss": -12.300190925598145, "global_step": 358109, "epoch": 2131} {"train_loss": -11.910011291503906, "global_step": 358110, "epoch": 2131} {"train_loss": -11.95175838470459, "global_step": 358111, "epoch": 2131} {"train_loss": -12.188886642456055, "global_step": 358112, "epoch": 2131} {"train_loss": -12.087425231933594, "global_step": 358113, "epoch": 2131} {"train_loss": -11.795967102050781, "global_step": 358114, "epoch": 2131} {"train_loss": -11.929866790771484, "global_step": 358115, "epoch": 2131} {"train_loss": -11.34028434753418, "global_step": 358116, "epoch": 2131} {"train_loss": -12.056644439697266, "global_step": 358117, "epoch": 2131} {"train_loss": -11.850399017333984, "global_step": 358118, "epoch": 2131} {"train_loss": -11.166759490966797, "global_step": 358119, "epoch": 2131} {"train_loss": -11.957627296447754, "global_step": 358120, "epoch": 2131} {"train_loss": -11.228001594543457, "global_step": 358121, "epoch": 2131} {"train_loss": -12.23163890838623, "global_step": 358122, "epoch": 2131} {"train_loss": -11.584356307983398, "global_step": 358123, "epoch": 2131} {"train_loss": -12.31356430053711, "global_step": 358124, "epoch": 2131} {"train_loss": -11.647147178649902, "global_step": 358125, "epoch": 2131} {"train_loss": -11.75643539428711, "global_step": 358126, "epoch": 2131} {"train_loss": -12.036230087280273, "global_step": 358127, "epoch": 2131} {"train_loss": -12.112386703491211, "global_step": 358128, "epoch": 2131} {"train_loss": -12.120943069458008, "global_step": 358129, "epoch": 2131} {"train_loss": -12.02075481414795, "global_step": 358130, "epoch": 2131} {"train_loss": -10.657336235046387, "global_step": 358131, "epoch": 2131} {"train_loss": -11.894304275512695, "global_step": 358132, "epoch": 2131} {"train_loss": -10.313713073730469, "global_step": 358133, "epoch": 2131} {"train_loss": -11.676780700683594, "global_step": 358134, "epoch": 2131} {"train_loss": -11.394881248474121, "global_step": 358135, "epoch": 2131} {"train_loss": -10.705821990966797, "global_step": 358136, "epoch": 2131} {"train_loss": -12.09554672241211, "global_step": 358137, "epoch": 2131} {"train_loss": -11.09893798828125, "global_step": 358138, "epoch": 2131} {"train_loss": -12.299102783203125, "global_step": 358139, "epoch": 2131} {"train_loss": -11.104460716247559, "global_step": 358140, "epoch": 2131} {"train_loss": -11.582426071166992, "global_step": 358141, "epoch": 2131} {"train_loss": -12.095340728759766, "global_step": 358142, "epoch": 2131} {"train_loss": -11.79052448272705, "global_step": 358143, "epoch": 2131} {"train_loss": -11.970520973205566, "global_step": 358144, "epoch": 2131} {"train_loss": -12.222614288330078, "global_step": 358145, "epoch": 2131} {"train_loss": -11.998266220092773, "global_step": 358146, "epoch": 2131} {"train_loss": -12.565557479858398, "global_step": 358147, "epoch": 2131} {"train_loss": -11.896388053894043, "global_step": 358148, "epoch": 2131} {"train_loss": -12.061907768249512, "global_step": 358149, "epoch": 2131} {"train_loss": -11.928189277648926, "global_step": 358150, "epoch": 2131} {"train_loss": -12.172041893005371, "global_step": 358151, "epoch": 2131} {"train_loss": -12.144250869750977, "global_step": 358152, "epoch": 2131} {"train_loss": -11.934754371643066, "global_step": 358153, "epoch": 2131} {"train_loss": -12.422286987304688, "global_step": 358154, "epoch": 2131} {"train_loss": -11.965368270874023, "global_step": 358155, "epoch": 2131} {"train_loss": -12.410490989685059, "global_step": 358156, "epoch": 2131} {"train_loss": -12.112447738647461, "global_step": 358157, "epoch": 2131} {"train_loss": -12.330695152282715, "global_step": 358158, "epoch": 2131} {"train_loss": -12.163806915283203, "global_step": 358159, "epoch": 2131} {"train_loss": -11.280557632446289, "global_step": 358160, "epoch": 2131} {"train_loss": -12.41391372680664, "global_step": 358161, "epoch": 2131} {"train_loss": -11.939081192016602, "global_step": 358162, "epoch": 2131} {"train_loss": -12.201675415039062, "global_step": 358163, "epoch": 2131} {"train_loss": -12.010701179504395, "global_step": 358164, "epoch": 2131} {"train_loss": -12.201473236083984, "global_step": 358165, "epoch": 2131} {"train_loss": -11.71885871887207, "global_step": 358166, "epoch": 2131} {"train_loss": -12.21481704711914, "global_step": 358167, "epoch": 2131} {"train_loss": -12.288003921508789, "global_step": 358168, "epoch": 2131} {"train_loss": -12.380073547363281, "global_step": 358169, "epoch": 2131} {"train_loss": -12.512141227722168, "global_step": 358170, "epoch": 2131} {"train_loss": -12.295063018798828, "global_step": 358171, "epoch": 2131} {"train_loss": -12.355449676513672, "global_step": 358172, "epoch": 2131} {"train_loss": -12.136417388916016, "global_step": 358173, "epoch": 2131} {"train_loss": -12.163930892944336, "global_step": 358174, "epoch": 2131} {"train_loss": -11.910320843969073, "global_step": 358175, "epoch": 2131, "val_loss": 289266.6875} {"train_loss": -12.460280418395996, "global_step": 358176, "epoch": 2132} {"train_loss": -12.327842712402344, "global_step": 358177, "epoch": 2132} {"train_loss": -12.44546890258789, "global_step": 358178, "epoch": 2132} {"train_loss": -11.769232749938965, "global_step": 358179, "epoch": 2132} {"train_loss": -12.496967315673828, "global_step": 358180, "epoch": 2132} {"train_loss": -12.210990905761719, "global_step": 358181, "epoch": 2132} {"train_loss": -12.373802185058594, "global_step": 358182, "epoch": 2132} {"train_loss": -12.673243522644043, "global_step": 358183, "epoch": 2132} {"train_loss": -12.468088150024414, "global_step": 358184, "epoch": 2132} {"train_loss": -12.368709564208984, "global_step": 358185, "epoch": 2132} {"train_loss": -12.635579109191895, "global_step": 358186, "epoch": 2132} {"train_loss": -12.507356643676758, "global_step": 358187, "epoch": 2132} {"train_loss": -12.193819046020508, "global_step": 358188, "epoch": 2132} {"train_loss": -12.61203670501709, "global_step": 358189, "epoch": 2132} {"train_loss": -12.579015731811523, "global_step": 358190, "epoch": 2132} {"train_loss": -12.388040542602539, "global_step": 358191, "epoch": 2132} {"train_loss": -12.327184677124023, "global_step": 358192, "epoch": 2132} {"train_loss": -12.464404106140137, "global_step": 358193, "epoch": 2132} {"train_loss": -12.270035743713379, "global_step": 358194, "epoch": 2132} {"train_loss": -12.335962295532227, "global_step": 358195, "epoch": 2132} {"train_loss": -12.276032447814941, "global_step": 358196, "epoch": 2132} {"train_loss": -12.156641006469727, "global_step": 358197, "epoch": 2132} {"train_loss": -12.13896369934082, "global_step": 358198, "epoch": 2132} {"train_loss": -11.206400871276855, "global_step": 358199, "epoch": 2132} {"train_loss": -10.48829174041748, "global_step": 358200, "epoch": 2132} {"train_loss": -12.340397834777832, "global_step": 358201, "epoch": 2132} {"train_loss": -11.127447128295898, "global_step": 358202, "epoch": 2132} {"train_loss": -10.927082061767578, "global_step": 358203, "epoch": 2132} {"train_loss": -11.637200355529785, "global_step": 358204, "epoch": 2132} {"train_loss": -11.543111801147461, "global_step": 358205, "epoch": 2132} {"train_loss": -11.871427536010742, "global_step": 358206, "epoch": 2132} {"train_loss": -11.921476364135742, "global_step": 358207, "epoch": 2132} {"train_loss": -12.008413314819336, "global_step": 358208, "epoch": 2132} {"train_loss": -12.091546058654785, "global_step": 358209, "epoch": 2132} {"train_loss": -12.111565589904785, "global_step": 358210, "epoch": 2132} {"train_loss": -12.281633377075195, "global_step": 358211, "epoch": 2132} {"train_loss": -12.150968551635742, "global_step": 358212, "epoch": 2132} {"train_loss": -12.459421157836914, "global_step": 358213, "epoch": 2132} {"train_loss": -12.142919540405273, "global_step": 358214, "epoch": 2132} {"train_loss": -12.156803131103516, "global_step": 358215, "epoch": 2132} {"train_loss": -12.228597640991211, "global_step": 358216, "epoch": 2132} {"train_loss": -12.24477481842041, "global_step": 358217, "epoch": 2132} {"train_loss": -12.2774658203125, "global_step": 358218, "epoch": 2132} {"train_loss": -12.260934829711914, "global_step": 358219, "epoch": 2132} {"train_loss": -11.646944046020508, "global_step": 358220, "epoch": 2132} {"train_loss": -11.59321117401123, "global_step": 358221, "epoch": 2132} {"train_loss": -11.769340515136719, "global_step": 358222, "epoch": 2132} {"train_loss": -11.303665161132812, "global_step": 358223, "epoch": 2132} {"train_loss": -11.466205596923828, "global_step": 358224, "epoch": 2132} {"train_loss": -11.915550231933594, "global_step": 358225, "epoch": 2132} {"train_loss": -11.66990852355957, "global_step": 358226, "epoch": 2132} {"train_loss": -11.663028717041016, "global_step": 358227, "epoch": 2132} {"train_loss": -12.149116516113281, "global_step": 358228, "epoch": 2132} {"train_loss": -11.201726913452148, "global_step": 358229, "epoch": 2132} {"train_loss": -12.10155200958252, "global_step": 358230, "epoch": 2132} {"train_loss": -11.67326831817627, "global_step": 358231, "epoch": 2132} {"train_loss": -11.695148468017578, "global_step": 358232, "epoch": 2132} {"train_loss": -12.212518692016602, "global_step": 358233, "epoch": 2132} {"train_loss": -11.499574661254883, "global_step": 358234, "epoch": 2132} {"train_loss": -12.132589340209961, "global_step": 358235, "epoch": 2132} {"train_loss": -12.146288871765137, "global_step": 358236, "epoch": 2132} {"train_loss": -11.98236083984375, "global_step": 358237, "epoch": 2132} {"train_loss": -11.962924003601074, "global_step": 358238, "epoch": 2132} {"train_loss": -12.21681022644043, "global_step": 358239, "epoch": 2132} {"train_loss": -11.720935821533203, "global_step": 358240, "epoch": 2132} {"train_loss": -12.460566520690918, "global_step": 358241, "epoch": 2132} {"train_loss": -12.49998950958252, "global_step": 358242, "epoch": 2132} {"train_loss": -12.19582748413086, "global_step": 358243, "epoch": 2132} {"train_loss": -12.34378433227539, "global_step": 358244, "epoch": 2132} {"train_loss": -12.320846557617188, "global_step": 358245, "epoch": 2132} {"train_loss": -11.87366008758545, "global_step": 358246, "epoch": 2132} {"train_loss": -12.497787475585938, "global_step": 358247, "epoch": 2132} {"train_loss": -12.375635147094727, "global_step": 358248, "epoch": 2132} {"train_loss": -12.143045425415039, "global_step": 358249, "epoch": 2132} {"train_loss": -12.362669944763184, "global_step": 358250, "epoch": 2132} {"train_loss": -12.162099838256836, "global_step": 358251, "epoch": 2132} {"train_loss": -12.106571197509766, "global_step": 358252, "epoch": 2132} {"train_loss": -12.523414611816406, "global_step": 358253, "epoch": 2132} {"train_loss": -12.186948776245117, "global_step": 358254, "epoch": 2132} {"train_loss": -12.23250961303711, "global_step": 358255, "epoch": 2132} {"train_loss": -12.205446243286133, "global_step": 358256, "epoch": 2132} {"train_loss": -11.858535766601562, "global_step": 358257, "epoch": 2132} {"train_loss": -11.680585861206055, "global_step": 358258, "epoch": 2132} {"train_loss": -11.568403244018555, "global_step": 358259, "epoch": 2132} {"train_loss": -11.974925994873047, "global_step": 358260, "epoch": 2132} {"train_loss": -10.536510467529297, "global_step": 358261, "epoch": 2132} {"train_loss": -11.821249008178711, "global_step": 358262, "epoch": 2132} {"train_loss": -11.256656646728516, "global_step": 358263, "epoch": 2132} {"train_loss": -11.609139442443848, "global_step": 358264, "epoch": 2132} {"train_loss": -11.882225036621094, "global_step": 358265, "epoch": 2132} {"train_loss": -12.388692855834961, "global_step": 358266, "epoch": 2132} {"train_loss": -12.076537132263184, "global_step": 358267, "epoch": 2132} {"train_loss": -11.846114158630371, "global_step": 358268, "epoch": 2132} {"train_loss": -12.249218940734863, "global_step": 358269, "epoch": 2132} {"train_loss": -11.662458419799805, "global_step": 358270, "epoch": 2132} {"train_loss": -12.066020011901855, "global_step": 358271, "epoch": 2132} {"train_loss": -12.169694900512695, "global_step": 358272, "epoch": 2132} {"train_loss": -12.162841796875, "global_step": 358273, "epoch": 2132} {"train_loss": -11.936273574829102, "global_step": 358274, "epoch": 2132} {"train_loss": -12.274992942810059, "global_step": 358275, "epoch": 2132} {"train_loss": -11.889237403869629, "global_step": 358276, "epoch": 2132} {"train_loss": -12.01034927368164, "global_step": 358277, "epoch": 2132} {"train_loss": -12.538158416748047, "global_step": 358278, "epoch": 2132} {"train_loss": -12.107698440551758, "global_step": 358279, "epoch": 2132} {"train_loss": -12.202689170837402, "global_step": 358280, "epoch": 2132} {"train_loss": -12.152109146118164, "global_step": 358281, "epoch": 2132} {"train_loss": -12.312437057495117, "global_step": 358282, "epoch": 2132} {"train_loss": -12.428256034851074, "global_step": 358283, "epoch": 2132} {"train_loss": -12.337767601013184, "global_step": 358284, "epoch": 2132} {"train_loss": -12.156942367553711, "global_step": 358285, "epoch": 2132} {"train_loss": -12.34601879119873, "global_step": 358286, "epoch": 2132} {"train_loss": -12.26099967956543, "global_step": 358287, "epoch": 2132} {"train_loss": -12.558855056762695, "global_step": 358288, "epoch": 2132} {"train_loss": -12.439496040344238, "global_step": 358289, "epoch": 2132} {"train_loss": -12.44942855834961, "global_step": 358290, "epoch": 2132} {"train_loss": -12.430513381958008, "global_step": 358291, "epoch": 2132} {"train_loss": -12.289966583251953, "global_step": 358292, "epoch": 2132} {"train_loss": -12.405652046203613, "global_step": 358293, "epoch": 2132} {"train_loss": -12.641185760498047, "global_step": 358294, "epoch": 2132} {"train_loss": -12.296430587768555, "global_step": 358295, "epoch": 2132} {"train_loss": -12.372518539428711, "global_step": 358296, "epoch": 2132} {"train_loss": -11.962568283081055, "global_step": 358297, "epoch": 2132} {"train_loss": -12.480533599853516, "global_step": 358298, "epoch": 2132} {"train_loss": -11.953743934631348, "global_step": 358299, "epoch": 2132} {"train_loss": -12.507457733154297, "global_step": 358300, "epoch": 2132} {"train_loss": -12.041908264160156, "global_step": 358301, "epoch": 2132} {"train_loss": -12.211822509765625, "global_step": 358302, "epoch": 2132} {"train_loss": -12.463508605957031, "global_step": 358303, "epoch": 2132} {"train_loss": -12.420427322387695, "global_step": 358304, "epoch": 2132} {"train_loss": -12.428738594055176, "global_step": 358305, "epoch": 2132} {"train_loss": -12.190879821777344, "global_step": 358306, "epoch": 2132} {"train_loss": -12.420904159545898, "global_step": 358307, "epoch": 2132} {"train_loss": -12.616974830627441, "global_step": 358308, "epoch": 2132} {"train_loss": -12.800384521484375, "global_step": 358309, "epoch": 2132} {"train_loss": -12.258359909057617, "global_step": 358310, "epoch": 2132} {"train_loss": -11.76663589477539, "global_step": 358311, "epoch": 2132} {"train_loss": -12.429117202758789, "global_step": 358312, "epoch": 2132} {"train_loss": -12.51321792602539, "global_step": 358313, "epoch": 2132} {"train_loss": -12.257070541381836, "global_step": 358314, "epoch": 2132} {"train_loss": -12.126714706420898, "global_step": 358315, "epoch": 2132} {"train_loss": -12.305597305297852, "global_step": 358316, "epoch": 2132} {"train_loss": -11.346282005310059, "global_step": 358317, "epoch": 2132} {"train_loss": -11.79955005645752, "global_step": 358318, "epoch": 2132} {"train_loss": -12.072225570678711, "global_step": 358319, "epoch": 2132} {"train_loss": -12.136972427368164, "global_step": 358320, "epoch": 2132} {"train_loss": -11.689228057861328, "global_step": 358321, "epoch": 2132} {"train_loss": -11.9014892578125, "global_step": 358322, "epoch": 2132} {"train_loss": -11.961461067199707, "global_step": 358323, "epoch": 2132} {"train_loss": -11.799457550048828, "global_step": 358324, "epoch": 2132} {"train_loss": -11.834497451782227, "global_step": 358325, "epoch": 2132} {"train_loss": -11.873199462890625, "global_step": 358326, "epoch": 2132} {"train_loss": -12.057476997375488, "global_step": 358327, "epoch": 2132} {"train_loss": -11.955001831054688, "global_step": 358328, "epoch": 2132} {"train_loss": -11.215438842773438, "global_step": 358329, "epoch": 2132} {"train_loss": -10.881845474243164, "global_step": 358330, "epoch": 2132} {"train_loss": -12.096237182617188, "global_step": 358331, "epoch": 2132} {"train_loss": -11.41386604309082, "global_step": 358332, "epoch": 2132} {"train_loss": -11.883180618286133, "global_step": 358333, "epoch": 2132} {"train_loss": -12.128650665283203, "global_step": 358334, "epoch": 2132} {"train_loss": -11.082352638244629, "global_step": 358335, "epoch": 2132} {"train_loss": -12.087321281433105, "global_step": 358336, "epoch": 2132} {"train_loss": -11.829280853271484, "global_step": 358337, "epoch": 2132} {"train_loss": -11.608802795410156, "global_step": 358338, "epoch": 2132} {"train_loss": -12.129826545715332, "global_step": 358339, "epoch": 2132} {"train_loss": -11.549713134765625, "global_step": 358340, "epoch": 2132} {"train_loss": -11.028789520263672, "global_step": 358341, "epoch": 2132} {"train_loss": -11.805192947387695, "global_step": 358342, "epoch": 2132} {"train_loss": -12.030932159650893, "global_step": 358343, "epoch": 2132, "val_loss": 289655.4375} {"train_loss": -11.709677696228027, "global_step": 358344, "epoch": 2133} {"train_loss": -9.854635238647461, "global_step": 358345, "epoch": 2133} {"train_loss": -10.390399932861328, "global_step": 358346, "epoch": 2133} {"train_loss": -11.081779479980469, "global_step": 358347, "epoch": 2133} {"train_loss": -10.380773544311523, "global_step": 358348, "epoch": 2133} {"train_loss": -10.652008056640625, "global_step": 358349, "epoch": 2133} {"train_loss": -12.072490692138672, "global_step": 358350, "epoch": 2133} {"train_loss": -10.765533447265625, "global_step": 358351, "epoch": 2133} {"train_loss": -12.084352493286133, "global_step": 358352, "epoch": 2133} {"train_loss": -11.46070384979248, "global_step": 358353, "epoch": 2133} {"train_loss": -11.154385566711426, "global_step": 358354, "epoch": 2133} {"train_loss": -12.099345207214355, "global_step": 358355, "epoch": 2133} {"train_loss": -11.29916763305664, "global_step": 358356, "epoch": 2133} {"train_loss": -11.31740665435791, "global_step": 358357, "epoch": 2133} {"train_loss": -11.985086441040039, "global_step": 358358, "epoch": 2133} {"train_loss": -11.184346199035645, "global_step": 358359, "epoch": 2133} {"train_loss": -12.159891128540039, "global_step": 358360, "epoch": 2133} {"train_loss": -11.165506362915039, "global_step": 358361, "epoch": 2133} {"train_loss": -11.854757308959961, "global_step": 358362, "epoch": 2133} {"train_loss": -12.032535552978516, "global_step": 358363, "epoch": 2133} {"train_loss": -11.897928237915039, "global_step": 358364, "epoch": 2133} {"train_loss": -11.836814880371094, "global_step": 358365, "epoch": 2133} {"train_loss": -11.961165428161621, "global_step": 358366, "epoch": 2133} {"train_loss": -12.143308639526367, "global_step": 358367, "epoch": 2133} {"train_loss": -11.836061477661133, "global_step": 358368, "epoch": 2133} {"train_loss": -11.86563491821289, "global_step": 358369, "epoch": 2133} {"train_loss": -11.709211349487305, "global_step": 358370, "epoch": 2133} {"train_loss": -12.333001136779785, "global_step": 358371, "epoch": 2133} {"train_loss": -11.58496379852295, "global_step": 358372, "epoch": 2133} {"train_loss": -12.175337791442871, "global_step": 358373, "epoch": 2133} {"train_loss": -11.982672691345215, "global_step": 358374, "epoch": 2133} {"train_loss": -12.07104778289795, "global_step": 358375, "epoch": 2133} {"train_loss": -11.804752349853516, "global_step": 358376, "epoch": 2133} {"train_loss": -12.157440185546875, "global_step": 358377, "epoch": 2133} {"train_loss": -12.031021118164062, "global_step": 358378, "epoch": 2133} {"train_loss": -12.290521621704102, "global_step": 358379, "epoch": 2133} {"train_loss": -12.24686050415039, "global_step": 358380, "epoch": 2133} {"train_loss": -12.141952514648438, "global_step": 358381, "epoch": 2133} {"train_loss": -12.094038009643555, "global_step": 358382, "epoch": 2133} {"train_loss": -12.439273834228516, "global_step": 358383, "epoch": 2133} {"train_loss": -12.263567924499512, "global_step": 358384, "epoch": 2133} {"train_loss": -12.494529724121094, "global_step": 358385, "epoch": 2133} {"train_loss": -12.137344360351562, "global_step": 358386, "epoch": 2133} {"train_loss": -12.377189636230469, "global_step": 358387, "epoch": 2133} {"train_loss": -12.039741516113281, "global_step": 358388, "epoch": 2133} {"train_loss": -12.14149284362793, "global_step": 358389, "epoch": 2133} {"train_loss": -12.372249603271484, "global_step": 358390, "epoch": 2133} {"train_loss": -12.11021614074707, "global_step": 358391, "epoch": 2133} {"train_loss": -12.044461250305176, "global_step": 358392, "epoch": 2133} {"train_loss": -12.346761703491211, "global_step": 358393, "epoch": 2133} {"train_loss": -11.833377838134766, "global_step": 358394, "epoch": 2133} {"train_loss": -12.591110229492188, "global_step": 358395, "epoch": 2133} {"train_loss": -12.350508689880371, "global_step": 358396, "epoch": 2133} {"train_loss": -12.155157089233398, "global_step": 358397, "epoch": 2133} {"train_loss": -12.409124374389648, "global_step": 358398, "epoch": 2133} {"train_loss": -12.179136276245117, "global_step": 358399, "epoch": 2133} {"train_loss": -12.298255920410156, "global_step": 358400, "epoch": 2133} {"train_loss": -12.503944396972656, "global_step": 358401, "epoch": 2133} {"train_loss": -12.194408416748047, "global_step": 358402, "epoch": 2133} {"train_loss": -12.231724739074707, "global_step": 358403, "epoch": 2133} {"train_loss": -12.074087142944336, "global_step": 358404, "epoch": 2133} {"train_loss": -11.016059875488281, "global_step": 358405, "epoch": 2133} {"train_loss": -12.18400764465332, "global_step": 358406, "epoch": 2133} {"train_loss": -12.310598373413086, "global_step": 358407, "epoch": 2133} {"train_loss": -11.731409072875977, "global_step": 358408, "epoch": 2133} {"train_loss": -12.216946601867676, "global_step": 358409, "epoch": 2133} {"train_loss": -12.199966430664062, "global_step": 358410, "epoch": 2133} {"train_loss": -12.120054244995117, "global_step": 358411, "epoch": 2133} {"train_loss": -12.176294326782227, "global_step": 358412, "epoch": 2133} {"train_loss": -12.475099563598633, "global_step": 358413, "epoch": 2133} {"train_loss": -12.19924545288086, "global_step": 358414, "epoch": 2133} {"train_loss": -12.598871231079102, "global_step": 358415, "epoch": 2133} {"train_loss": -12.500045776367188, "global_step": 358416, "epoch": 2133} {"train_loss": -12.58879566192627, "global_step": 358417, "epoch": 2133} {"train_loss": -12.70061206817627, "global_step": 358418, "epoch": 2133} {"train_loss": -12.454042434692383, "global_step": 358419, "epoch": 2133} {"train_loss": -12.7634916305542, "global_step": 358420, "epoch": 2133} {"train_loss": -12.233638763427734, "global_step": 358421, "epoch": 2133} {"train_loss": -12.456645965576172, "global_step": 358422, "epoch": 2133} {"train_loss": -12.6334810256958, "global_step": 358423, "epoch": 2133} {"train_loss": -12.651668548583984, "global_step": 358424, "epoch": 2133} {"train_loss": -12.465473175048828, "global_step": 358425, "epoch": 2133} {"train_loss": -12.408970832824707, "global_step": 358426, "epoch": 2133} {"train_loss": -12.604728698730469, "global_step": 358427, "epoch": 2133} {"train_loss": -12.380698204040527, "global_step": 358428, "epoch": 2133} {"train_loss": -12.825752258300781, "global_step": 358429, "epoch": 2133} {"train_loss": -12.306009292602539, "global_step": 358430, "epoch": 2133} {"train_loss": -12.6578369140625, "global_step": 358431, "epoch": 2133} {"train_loss": -12.45028305053711, "global_step": 358432, "epoch": 2133} {"train_loss": -12.519887924194336, "global_step": 358433, "epoch": 2133} {"train_loss": -12.573709487915039, "global_step": 358434, "epoch": 2133} {"train_loss": -12.623279571533203, "global_step": 358435, "epoch": 2133} {"train_loss": -12.553797721862793, "global_step": 358436, "epoch": 2133} {"train_loss": -12.772947311401367, "global_step": 358437, "epoch": 2133} {"train_loss": -12.42806625366211, "global_step": 358438, "epoch": 2133} {"train_loss": -12.775236129760742, "global_step": 358439, "epoch": 2133} {"train_loss": -12.495450973510742, "global_step": 358440, "epoch": 2133} {"train_loss": -12.587553024291992, "global_step": 358441, "epoch": 2133} {"train_loss": -12.506113052368164, "global_step": 358442, "epoch": 2133} {"train_loss": -12.660911560058594, "global_step": 358443, "epoch": 2133} {"train_loss": -12.440988540649414, "global_step": 358444, "epoch": 2133} {"train_loss": -12.652420043945312, "global_step": 358445, "epoch": 2133} {"train_loss": -12.77743911743164, "global_step": 358446, "epoch": 2133} {"train_loss": -12.793161392211914, "global_step": 358447, "epoch": 2133} {"train_loss": -12.685545921325684, "global_step": 358448, "epoch": 2133} {"train_loss": -12.734016418457031, "global_step": 358449, "epoch": 2133} {"train_loss": -12.688045501708984, "global_step": 358450, "epoch": 2133} {"train_loss": -12.706040382385254, "global_step": 358451, "epoch": 2133} {"train_loss": -12.592028617858887, "global_step": 358452, "epoch": 2133} {"train_loss": -12.615142822265625, "global_step": 358453, "epoch": 2133} {"train_loss": -12.539236068725586, "global_step": 358454, "epoch": 2133} {"train_loss": -12.647686958312988, "global_step": 358455, "epoch": 2133} {"train_loss": -12.532035827636719, "global_step": 358456, "epoch": 2133} {"train_loss": -12.424853324890137, "global_step": 358457, "epoch": 2133} {"train_loss": -12.631134033203125, "global_step": 358458, "epoch": 2133} {"train_loss": -12.600143432617188, "global_step": 358459, "epoch": 2133} {"train_loss": -12.72813892364502, "global_step": 358460, "epoch": 2133} {"train_loss": -12.617493629455566, "global_step": 358461, "epoch": 2133} {"train_loss": -12.760558128356934, "global_step": 358462, "epoch": 2133} {"train_loss": -12.514606475830078, "global_step": 358463, "epoch": 2133} {"train_loss": -12.661186218261719, "global_step": 358464, "epoch": 2133} {"train_loss": -12.341500282287598, "global_step": 358465, "epoch": 2133} {"train_loss": -11.875587463378906, "global_step": 358466, "epoch": 2133} {"train_loss": -9.951043128967285, "global_step": 358467, "epoch": 2133} {"train_loss": -12.231672286987305, "global_step": 358468, "epoch": 2133} {"train_loss": -11.58209228515625, "global_step": 358469, "epoch": 2133} {"train_loss": -10.92178726196289, "global_step": 358470, "epoch": 2133} {"train_loss": -12.37173843383789, "global_step": 358471, "epoch": 2133} {"train_loss": -12.226469993591309, "global_step": 358472, "epoch": 2133} {"train_loss": -12.114164352416992, "global_step": 358473, "epoch": 2133} {"train_loss": -11.047220230102539, "global_step": 358474, "epoch": 2133} {"train_loss": -11.851112365722656, "global_step": 358475, "epoch": 2133} {"train_loss": -11.585159301757812, "global_step": 358476, "epoch": 2133} {"train_loss": -11.126882553100586, "global_step": 358477, "epoch": 2133} {"train_loss": -11.952667236328125, "global_step": 358478, "epoch": 2133} {"train_loss": -11.982102394104004, "global_step": 358479, "epoch": 2133} {"train_loss": -11.457986831665039, "global_step": 358480, "epoch": 2133} {"train_loss": -11.56141471862793, "global_step": 358481, "epoch": 2133} {"train_loss": -9.76885986328125, "global_step": 358482, "epoch": 2133} {"train_loss": -10.911693572998047, "global_step": 358483, "epoch": 2133} {"train_loss": -11.481271743774414, "global_step": 358484, "epoch": 2133} {"train_loss": -10.950971603393555, "global_step": 358485, "epoch": 2133} {"train_loss": -9.79800796508789, "global_step": 358486, "epoch": 2133} {"train_loss": -11.504677772521973, "global_step": 358487, "epoch": 2133} {"train_loss": -9.44735050201416, "global_step": 358488, "epoch": 2133} {"train_loss": -9.781179428100586, "global_step": 358489, "epoch": 2133} {"train_loss": -10.53288459777832, "global_step": 358490, "epoch": 2133} {"train_loss": -9.033951759338379, "global_step": 358491, "epoch": 2133} {"train_loss": -9.920126914978027, "global_step": 358492, "epoch": 2133} {"train_loss": -9.913054466247559, "global_step": 358493, "epoch": 2133} {"train_loss": -8.956110000610352, "global_step": 358494, "epoch": 2133} {"train_loss": -8.44772720336914, "global_step": 358495, "epoch": 2133} {"train_loss": -10.607133865356445, "global_step": 358496, "epoch": 2133} {"train_loss": -8.594889640808105, "global_step": 358497, "epoch": 2133} {"train_loss": -9.329421997070312, "global_step": 358498, "epoch": 2133} {"train_loss": -10.857708930969238, "global_step": 358499, "epoch": 2133} {"train_loss": -9.803875923156738, "global_step": 358500, "epoch": 2133} {"train_loss": -11.328882217407227, "global_step": 358501, "epoch": 2133} {"train_loss": -10.533697128295898, "global_step": 358502, "epoch": 2133} {"train_loss": -10.041934967041016, "global_step": 358503, "epoch": 2133} {"train_loss": -11.246112823486328, "global_step": 358504, "epoch": 2133} {"train_loss": -9.709163665771484, "global_step": 358505, "epoch": 2133} {"train_loss": -10.111995697021484, "global_step": 358506, "epoch": 2133} {"train_loss": -8.60837173461914, "global_step": 358507, "epoch": 2133} {"train_loss": -10.16663932800293, "global_step": 358508, "epoch": 2133} {"train_loss": -10.93641471862793, "global_step": 358509, "epoch": 2133} {"train_loss": -10.255549430847168, "global_step": 358510, "epoch": 2133} {"train_loss": -11.763956421897525, "global_step": 358511, "epoch": 2133, "val_loss": 283882.96875} {"train_loss": -11.055349349975586, "global_step": 358512, "epoch": 2134} {"train_loss": -11.341812133789062, "global_step": 358513, "epoch": 2134} {"train_loss": -10.912544250488281, "global_step": 358514, "epoch": 2134} {"train_loss": -10.97336196899414, "global_step": 358515, "epoch": 2134} {"train_loss": -10.969934463500977, "global_step": 358516, "epoch": 2134} {"train_loss": -11.531532287597656, "global_step": 358517, "epoch": 2134} {"train_loss": -11.241901397705078, "global_step": 358518, "epoch": 2134} {"train_loss": -11.73741626739502, "global_step": 358519, "epoch": 2134} {"train_loss": -11.387001037597656, "global_step": 358520, "epoch": 2134} {"train_loss": -11.396256446838379, "global_step": 358521, "epoch": 2134} {"train_loss": -11.477456092834473, "global_step": 358522, "epoch": 2134} {"train_loss": -11.421122550964355, "global_step": 358523, "epoch": 2134} {"train_loss": -11.589492797851562, "global_step": 358524, "epoch": 2134} {"train_loss": -11.795783996582031, "global_step": 358525, "epoch": 2134} {"train_loss": -11.220746994018555, "global_step": 358526, "epoch": 2134} {"train_loss": -11.54263687133789, "global_step": 358527, "epoch": 2134} {"train_loss": -11.898199081420898, "global_step": 358528, "epoch": 2134} {"train_loss": -11.402702331542969, "global_step": 358529, "epoch": 2134} {"train_loss": -11.787900924682617, "global_step": 358530, "epoch": 2134} {"train_loss": -11.670394897460938, "global_step": 358531, "epoch": 2134} {"train_loss": -11.755545616149902, "global_step": 358532, "epoch": 2134} {"train_loss": -11.769596099853516, "global_step": 358533, "epoch": 2134} {"train_loss": -11.867523193359375, "global_step": 358534, "epoch": 2134} {"train_loss": -11.741752624511719, "global_step": 358535, "epoch": 2134} {"train_loss": -12.027917861938477, "global_step": 358536, "epoch": 2134} {"train_loss": -12.248826026916504, "global_step": 358537, "epoch": 2134} {"train_loss": -12.088401794433594, "global_step": 358538, "epoch": 2134} {"train_loss": -12.13929271697998, "global_step": 358539, "epoch": 2134} {"train_loss": -11.845178604125977, "global_step": 358540, "epoch": 2134} {"train_loss": -11.996463775634766, "global_step": 358541, "epoch": 2134} {"train_loss": -11.878731727600098, "global_step": 358542, "epoch": 2134} {"train_loss": -12.178518295288086, "global_step": 358543, "epoch": 2134} {"train_loss": -11.744808197021484, "global_step": 358544, "epoch": 2134} {"train_loss": -11.971817970275879, "global_step": 358545, "epoch": 2134} {"train_loss": -12.200258255004883, "global_step": 358546, "epoch": 2134} {"train_loss": -11.952342987060547, "global_step": 358547, "epoch": 2134} {"train_loss": -12.292037010192871, "global_step": 358548, "epoch": 2134} {"train_loss": -11.916387557983398, "global_step": 358549, "epoch": 2134} {"train_loss": -12.286016464233398, "global_step": 358550, "epoch": 2134} {"train_loss": -12.303197860717773, "global_step": 358551, "epoch": 2134} {"train_loss": -12.255302429199219, "global_step": 358552, "epoch": 2134} {"train_loss": -12.22097110748291, "global_step": 358553, "epoch": 2134} {"train_loss": -12.050415992736816, "global_step": 358554, "epoch": 2134} {"train_loss": -12.49984359741211, "global_step": 358555, "epoch": 2134} {"train_loss": -12.269007682800293, "global_step": 358556, "epoch": 2134} {"train_loss": -12.313607215881348, "global_step": 358557, "epoch": 2134} {"train_loss": -12.18155288696289, "global_step": 358558, "epoch": 2134} {"train_loss": -12.499876022338867, "global_step": 358559, "epoch": 2134} {"train_loss": -12.359561920166016, "global_step": 358560, "epoch": 2134} {"train_loss": -12.393187522888184, "global_step": 358561, "epoch": 2134} {"train_loss": -12.515360832214355, "global_step": 358562, "epoch": 2134} {"train_loss": -12.391233444213867, "global_step": 358563, "epoch": 2134} {"train_loss": -12.222786903381348, "global_step": 358564, "epoch": 2134} {"train_loss": -12.526571273803711, "global_step": 358565, "epoch": 2134} {"train_loss": -12.492249488830566, "global_step": 358566, "epoch": 2134} {"train_loss": -12.460370063781738, "global_step": 358567, "epoch": 2134} {"train_loss": -12.310440063476562, "global_step": 358568, "epoch": 2134} {"train_loss": -12.280142784118652, "global_step": 358569, "epoch": 2134} {"train_loss": -12.386772155761719, "global_step": 358570, "epoch": 2134} {"train_loss": -12.019338607788086, "global_step": 358571, "epoch": 2134} {"train_loss": -12.643081665039062, "global_step": 358572, "epoch": 2134} {"train_loss": -11.856624603271484, "global_step": 358573, "epoch": 2134} {"train_loss": -12.516792297363281, "global_step": 358574, "epoch": 2134} {"train_loss": -12.00520133972168, "global_step": 358575, "epoch": 2134} {"train_loss": -12.31065559387207, "global_step": 358576, "epoch": 2134} {"train_loss": -12.217361450195312, "global_step": 358577, "epoch": 2134} {"train_loss": -12.394084930419922, "global_step": 358578, "epoch": 2134} {"train_loss": -12.218541145324707, "global_step": 358579, "epoch": 2134} {"train_loss": -11.618704795837402, "global_step": 358580, "epoch": 2134} {"train_loss": -12.154454231262207, "global_step": 358581, "epoch": 2134} {"train_loss": -11.962322235107422, "global_step": 358582, "epoch": 2134} {"train_loss": -12.09457015991211, "global_step": 358583, "epoch": 2134} {"train_loss": -12.56826400756836, "global_step": 358584, "epoch": 2134} {"train_loss": -12.207228660583496, "global_step": 358585, "epoch": 2134} {"train_loss": -12.545633316040039, "global_step": 358586, "epoch": 2134} {"train_loss": -12.524839401245117, "global_step": 358587, "epoch": 2134} {"train_loss": -12.403831481933594, "global_step": 358588, "epoch": 2134} {"train_loss": -12.532344818115234, "global_step": 358589, "epoch": 2134} {"train_loss": -12.403812408447266, "global_step": 358590, "epoch": 2134} {"train_loss": -12.536314010620117, "global_step": 358591, "epoch": 2134} {"train_loss": -12.51486587524414, "global_step": 358592, "epoch": 2134} {"train_loss": -12.412537574768066, "global_step": 358593, "epoch": 2134} {"train_loss": -12.549665451049805, "global_step": 358594, "epoch": 2134} {"train_loss": -12.36245346069336, "global_step": 358595, "epoch": 2134} {"train_loss": -12.543989181518555, "global_step": 358596, "epoch": 2134} {"train_loss": -12.18301010131836, "global_step": 358597, "epoch": 2134} {"train_loss": -12.583171844482422, "global_step": 358598, "epoch": 2134} {"train_loss": -12.119961738586426, "global_step": 358599, "epoch": 2134} {"train_loss": -12.164508819580078, "global_step": 358600, "epoch": 2134} {"train_loss": -12.467329978942871, "global_step": 358601, "epoch": 2134} {"train_loss": -12.503935813903809, "global_step": 358602, "epoch": 2134} {"train_loss": -12.4733304977417, "global_step": 358603, "epoch": 2134} {"train_loss": -12.304864883422852, "global_step": 358604, "epoch": 2134} {"train_loss": -12.511109352111816, "global_step": 358605, "epoch": 2134} {"train_loss": -12.606101989746094, "global_step": 358606, "epoch": 2134} {"train_loss": -12.60518741607666, "global_step": 358607, "epoch": 2134} {"train_loss": -12.485981941223145, "global_step": 358608, "epoch": 2134} {"train_loss": -12.591836929321289, "global_step": 358609, "epoch": 2134} {"train_loss": -12.714558601379395, "global_step": 358610, "epoch": 2134} {"train_loss": -12.836651802062988, "global_step": 358611, "epoch": 2134} {"train_loss": -12.670035362243652, "global_step": 358612, "epoch": 2134} {"train_loss": -12.558006286621094, "global_step": 358613, "epoch": 2134} {"train_loss": -12.579326629638672, "global_step": 358614, "epoch": 2134} {"train_loss": -12.422632217407227, "global_step": 358615, "epoch": 2134} {"train_loss": -12.667241096496582, "global_step": 358616, "epoch": 2134} {"train_loss": -12.56959056854248, "global_step": 358617, "epoch": 2134} {"train_loss": -12.396110534667969, "global_step": 358618, "epoch": 2134} {"train_loss": -12.559513092041016, "global_step": 358619, "epoch": 2134} {"train_loss": -12.608774185180664, "global_step": 358620, "epoch": 2134} {"train_loss": -12.674980163574219, "global_step": 358621, "epoch": 2134} {"train_loss": -12.68161392211914, "global_step": 358622, "epoch": 2134} {"train_loss": -12.755853652954102, "global_step": 358623, "epoch": 2134} {"train_loss": -12.813579559326172, "global_step": 358624, "epoch": 2134} {"train_loss": -12.487977981567383, "global_step": 358625, "epoch": 2134} {"train_loss": -12.628414154052734, "global_step": 358626, "epoch": 2134} {"train_loss": -12.749736785888672, "global_step": 358627, "epoch": 2134} {"train_loss": -12.52975082397461, "global_step": 358628, "epoch": 2134} {"train_loss": -12.416778564453125, "global_step": 358629, "epoch": 2134} {"train_loss": -12.718331336975098, "global_step": 358630, "epoch": 2134} {"train_loss": -12.788297653198242, "global_step": 358631, "epoch": 2134} {"train_loss": -12.620586395263672, "global_step": 358632, "epoch": 2134} {"train_loss": -11.733687400817871, "global_step": 358633, "epoch": 2134} {"train_loss": -11.86220932006836, "global_step": 358634, "epoch": 2134} {"train_loss": -12.111237525939941, "global_step": 358635, "epoch": 2134} {"train_loss": -12.518037796020508, "global_step": 358636, "epoch": 2134} {"train_loss": -12.397926330566406, "global_step": 358637, "epoch": 2134} {"train_loss": -11.807392120361328, "global_step": 358638, "epoch": 2134} {"train_loss": -11.046414375305176, "global_step": 358639, "epoch": 2134} {"train_loss": -12.294981956481934, "global_step": 358640, "epoch": 2134} {"train_loss": -12.321677207946777, "global_step": 358641, "epoch": 2134} {"train_loss": -11.852932929992676, "global_step": 358642, "epoch": 2134} {"train_loss": -12.503410339355469, "global_step": 358643, "epoch": 2134} {"train_loss": -12.254517555236816, "global_step": 358644, "epoch": 2134} {"train_loss": -12.631643295288086, "global_step": 358645, "epoch": 2134} {"train_loss": -12.561363220214844, "global_step": 358646, "epoch": 2134} {"train_loss": -12.673833847045898, "global_step": 358647, "epoch": 2134} {"train_loss": -12.321407318115234, "global_step": 358648, "epoch": 2134} {"train_loss": -12.58336067199707, "global_step": 358649, "epoch": 2134} {"train_loss": -12.613311767578125, "global_step": 358650, "epoch": 2134} {"train_loss": -12.044809341430664, "global_step": 358651, "epoch": 2134} {"train_loss": -12.532384872436523, "global_step": 358652, "epoch": 2134} {"train_loss": -12.476898193359375, "global_step": 358653, "epoch": 2134} {"train_loss": -12.054594039916992, "global_step": 358654, "epoch": 2134} {"train_loss": -11.976820945739746, "global_step": 358655, "epoch": 2134} {"train_loss": -12.40363883972168, "global_step": 358656, "epoch": 2134} {"train_loss": -12.283563613891602, "global_step": 358657, "epoch": 2134} {"train_loss": -12.093395233154297, "global_step": 358658, "epoch": 2134} {"train_loss": -12.17959213256836, "global_step": 358659, "epoch": 2134} {"train_loss": -12.115230560302734, "global_step": 358660, "epoch": 2134} {"train_loss": -11.61140251159668, "global_step": 358661, "epoch": 2134} {"train_loss": -11.517045974731445, "global_step": 358662, "epoch": 2134} {"train_loss": -11.358121871948242, "global_step": 358663, "epoch": 2134} {"train_loss": -12.008431434631348, "global_step": 358664, "epoch": 2134} {"train_loss": -11.758532524108887, "global_step": 358665, "epoch": 2134} {"train_loss": -11.008918762207031, "global_step": 358666, "epoch": 2134} {"train_loss": -11.405123710632324, "global_step": 358667, "epoch": 2134} {"train_loss": -12.107956886291504, "global_step": 358668, "epoch": 2134} {"train_loss": -11.61234188079834, "global_step": 358669, "epoch": 2134} {"train_loss": -12.149642944335938, "global_step": 358670, "epoch": 2134} {"train_loss": -12.143367767333984, "global_step": 358671, "epoch": 2134} {"train_loss": -11.496099472045898, "global_step": 358672, "epoch": 2134} {"train_loss": -11.366384506225586, "global_step": 358673, "epoch": 2134} {"train_loss": -10.800931930541992, "global_step": 358674, "epoch": 2134} {"train_loss": -10.299650192260742, "global_step": 358675, "epoch": 2134} {"train_loss": -9.515080451965332, "global_step": 358676, "epoch": 2134} {"train_loss": -11.019756317138672, "global_step": 358677, "epoch": 2134} {"train_loss": -10.017929077148438, "global_step": 358678, "epoch": 2134} {"train_loss": -12.090788353057135, "global_step": 358679, "epoch": 2134, "val_loss": 290349.9375} {"train_loss": -9.724352836608887, "global_step": 358680, "epoch": 2135} {"train_loss": -11.299665451049805, "global_step": 358681, "epoch": 2135} {"train_loss": -11.066574096679688, "global_step": 358682, "epoch": 2135} {"train_loss": -10.524360656738281, "global_step": 358683, "epoch": 2135} {"train_loss": -8.073310852050781, "global_step": 358684, "epoch": 2135} {"train_loss": -8.54160213470459, "global_step": 358685, "epoch": 2135} {"train_loss": -7.260990142822266, "global_step": 358686, "epoch": 2135} {"train_loss": -8.06717586517334, "global_step": 358687, "epoch": 2135} {"train_loss": -8.407241821289062, "global_step": 358688, "epoch": 2135} {"train_loss": -8.284563064575195, "global_step": 358689, "epoch": 2135} {"train_loss": -8.338129043579102, "global_step": 358690, "epoch": 2135} {"train_loss": -8.124935150146484, "global_step": 358691, "epoch": 2135} {"train_loss": -8.199538230895996, "global_step": 358692, "epoch": 2135} {"train_loss": -8.37342357635498, "global_step": 358693, "epoch": 2135} {"train_loss": -8.317086219787598, "global_step": 358694, "epoch": 2135} {"train_loss": -8.662755966186523, "global_step": 358695, "epoch": 2135} {"train_loss": -9.2186918258667, "global_step": 358696, "epoch": 2135} {"train_loss": -10.324714660644531, "global_step": 358697, "epoch": 2135} {"train_loss": -10.66364574432373, "global_step": 358698, "epoch": 2135} {"train_loss": -10.893077850341797, "global_step": 358699, "epoch": 2135} {"train_loss": -10.429773330688477, "global_step": 358700, "epoch": 2135} {"train_loss": -10.504386901855469, "global_step": 358701, "epoch": 2135} {"train_loss": -9.985071182250977, "global_step": 358702, "epoch": 2135} {"train_loss": -9.761775016784668, "global_step": 358703, "epoch": 2135} {"train_loss": -10.481283187866211, "global_step": 358704, "epoch": 2135} {"train_loss": -10.316972732543945, "global_step": 358705, "epoch": 2135} {"train_loss": -11.229740142822266, "global_step": 358706, "epoch": 2135} {"train_loss": -11.494732856750488, "global_step": 358707, "epoch": 2135} {"train_loss": -11.236143112182617, "global_step": 358708, "epoch": 2135} {"train_loss": -11.719240188598633, "global_step": 358709, "epoch": 2135} {"train_loss": -10.618141174316406, "global_step": 358710, "epoch": 2135} {"train_loss": -11.431730270385742, "global_step": 358711, "epoch": 2135} {"train_loss": -11.293085098266602, "global_step": 358712, "epoch": 2135} {"train_loss": -11.276496887207031, "global_step": 358713, "epoch": 2135} {"train_loss": -11.901947021484375, "global_step": 358714, "epoch": 2135} {"train_loss": -10.99804401397705, "global_step": 358715, "epoch": 2135} {"train_loss": -12.002089500427246, "global_step": 358716, "epoch": 2135} {"train_loss": -11.11460018157959, "global_step": 358717, "epoch": 2135} {"train_loss": -11.512906074523926, "global_step": 358718, "epoch": 2135} {"train_loss": -11.55131721496582, "global_step": 358719, "epoch": 2135} {"train_loss": -11.675811767578125, "global_step": 358720, "epoch": 2135} {"train_loss": -11.863333702087402, "global_step": 358721, "epoch": 2135} {"train_loss": -11.600584983825684, "global_step": 358722, "epoch": 2135} {"train_loss": -11.564397811889648, "global_step": 358723, "epoch": 2135} {"train_loss": -11.999252319335938, "global_step": 358724, "epoch": 2135} {"train_loss": -11.773092269897461, "global_step": 358725, "epoch": 2135} {"train_loss": -12.14277458190918, "global_step": 358726, "epoch": 2135} {"train_loss": -11.697301864624023, "global_step": 358727, "epoch": 2135} {"train_loss": -11.948646545410156, "global_step": 358728, "epoch": 2135} {"train_loss": -12.227940559387207, "global_step": 358729, "epoch": 2135} {"train_loss": -11.541820526123047, "global_step": 358730, "epoch": 2135} {"train_loss": -11.982040405273438, "global_step": 358731, "epoch": 2135} {"train_loss": -11.936217308044434, "global_step": 358732, "epoch": 2135} {"train_loss": -12.050436019897461, "global_step": 358733, "epoch": 2135} {"train_loss": -12.186304092407227, "global_step": 358734, "epoch": 2135} {"train_loss": -12.013195037841797, "global_step": 358735, "epoch": 2135} {"train_loss": -12.247384071350098, "global_step": 358736, "epoch": 2135} {"train_loss": -12.170839309692383, "global_step": 358737, "epoch": 2135} {"train_loss": -12.177050590515137, "global_step": 358738, "epoch": 2135} {"train_loss": -12.428391456604004, "global_step": 358739, "epoch": 2135} {"train_loss": -12.147977828979492, "global_step": 358740, "epoch": 2135} {"train_loss": -12.311361312866211, "global_step": 358741, "epoch": 2135} {"train_loss": -12.195610046386719, "global_step": 358742, "epoch": 2135} {"train_loss": -12.014598846435547, "global_step": 358743, "epoch": 2135} {"train_loss": -12.404808044433594, "global_step": 358744, "epoch": 2135} {"train_loss": -12.084224700927734, "global_step": 358745, "epoch": 2135} {"train_loss": -12.191076278686523, "global_step": 358746, "epoch": 2135} {"train_loss": -12.512609481811523, "global_step": 358747, "epoch": 2135} {"train_loss": -12.29391098022461, "global_step": 358748, "epoch": 2135} {"train_loss": -12.477563858032227, "global_step": 358749, "epoch": 2135} {"train_loss": -12.250005722045898, "global_step": 358750, "epoch": 2135} {"train_loss": -12.199146270751953, "global_step": 358751, "epoch": 2135} {"train_loss": -12.523530960083008, "global_step": 358752, "epoch": 2135} {"train_loss": -12.061439514160156, "global_step": 358753, "epoch": 2135} {"train_loss": -12.415790557861328, "global_step": 358754, "epoch": 2135} {"train_loss": -12.223986625671387, "global_step": 358755, "epoch": 2135} {"train_loss": -12.378389358520508, "global_step": 358756, "epoch": 2135} {"train_loss": -12.272430419921875, "global_step": 358757, "epoch": 2135} {"train_loss": -12.366608619689941, "global_step": 358758, "epoch": 2135} {"train_loss": -12.357707023620605, "global_step": 358759, "epoch": 2135} {"train_loss": -12.182266235351562, "global_step": 358760, "epoch": 2135} {"train_loss": -12.167281150817871, "global_step": 358761, "epoch": 2135} {"train_loss": -12.43550968170166, "global_step": 358762, "epoch": 2135} {"train_loss": -12.105703353881836, "global_step": 358763, "epoch": 2135} {"train_loss": -12.273149490356445, "global_step": 358764, "epoch": 2135} {"train_loss": -12.261201858520508, "global_step": 358765, "epoch": 2135} {"train_loss": -12.274909973144531, "global_step": 358766, "epoch": 2135} {"train_loss": -12.637198448181152, "global_step": 358767, "epoch": 2135} {"train_loss": -12.242936134338379, "global_step": 358768, "epoch": 2135} {"train_loss": -12.636839866638184, "global_step": 358769, "epoch": 2135} {"train_loss": -12.422453880310059, "global_step": 358770, "epoch": 2135} {"train_loss": -12.312149047851562, "global_step": 358771, "epoch": 2135} {"train_loss": -12.547513008117676, "global_step": 358772, "epoch": 2135} {"train_loss": -12.447419166564941, "global_step": 358773, "epoch": 2135} {"train_loss": -12.472314834594727, "global_step": 358774, "epoch": 2135} {"train_loss": -12.430147171020508, "global_step": 358775, "epoch": 2135} {"train_loss": -12.486479759216309, "global_step": 358776, "epoch": 2135} {"train_loss": -12.400575637817383, "global_step": 358777, "epoch": 2135} {"train_loss": -12.552098274230957, "global_step": 358778, "epoch": 2135} {"train_loss": -12.440494537353516, "global_step": 358779, "epoch": 2135} {"train_loss": -12.531590461730957, "global_step": 358780, "epoch": 2135} {"train_loss": -12.53092098236084, "global_step": 358781, "epoch": 2135} {"train_loss": -12.37901782989502, "global_step": 358782, "epoch": 2135} {"train_loss": -12.743062019348145, "global_step": 358783, "epoch": 2135} {"train_loss": -12.208742141723633, "global_step": 358784, "epoch": 2135} {"train_loss": -12.493844032287598, "global_step": 358785, "epoch": 2135} {"train_loss": -12.192010879516602, "global_step": 358786, "epoch": 2135} {"train_loss": -12.475597381591797, "global_step": 358787, "epoch": 2135} {"train_loss": -12.073417663574219, "global_step": 358788, "epoch": 2135} {"train_loss": -11.926366806030273, "global_step": 358789, "epoch": 2135} {"train_loss": -11.958473205566406, "global_step": 358790, "epoch": 2135} {"train_loss": -11.938763618469238, "global_step": 358791, "epoch": 2135} {"train_loss": -11.675832748413086, "global_step": 358792, "epoch": 2135} {"train_loss": -11.871010780334473, "global_step": 358793, "epoch": 2135} {"train_loss": -11.694337844848633, "global_step": 358794, "epoch": 2135} {"train_loss": -11.661027908325195, "global_step": 358795, "epoch": 2135} {"train_loss": -12.202664375305176, "global_step": 358796, "epoch": 2135} {"train_loss": -11.626375198364258, "global_step": 358797, "epoch": 2135} {"train_loss": -12.07567024230957, "global_step": 358798, "epoch": 2135} {"train_loss": -12.447874069213867, "global_step": 358799, "epoch": 2135} {"train_loss": -11.679754257202148, "global_step": 358800, "epoch": 2135} {"train_loss": -12.493612289428711, "global_step": 358801, "epoch": 2135} {"train_loss": -12.174509048461914, "global_step": 358802, "epoch": 2135} {"train_loss": -11.594107627868652, "global_step": 358803, "epoch": 2135} {"train_loss": -12.219644546508789, "global_step": 358804, "epoch": 2135} {"train_loss": -12.182868957519531, "global_step": 358805, "epoch": 2135} {"train_loss": -11.202348709106445, "global_step": 358806, "epoch": 2135} {"train_loss": -12.178651809692383, "global_step": 358807, "epoch": 2135} {"train_loss": -11.97557544708252, "global_step": 358808, "epoch": 2135} {"train_loss": -11.758512496948242, "global_step": 358809, "epoch": 2135} {"train_loss": -12.22611141204834, "global_step": 358810, "epoch": 2135} {"train_loss": -12.016515731811523, "global_step": 358811, "epoch": 2135} {"train_loss": -12.298717498779297, "global_step": 358812, "epoch": 2135} {"train_loss": -12.340771675109863, "global_step": 358813, "epoch": 2135} {"train_loss": -11.924419403076172, "global_step": 358814, "epoch": 2135} {"train_loss": -12.165905952453613, "global_step": 358815, "epoch": 2135} {"train_loss": -12.223360061645508, "global_step": 358816, "epoch": 2135} {"train_loss": -12.216825485229492, "global_step": 358817, "epoch": 2135} {"train_loss": -12.309243202209473, "global_step": 358818, "epoch": 2135} {"train_loss": -12.413387298583984, "global_step": 358819, "epoch": 2135} {"train_loss": -12.379520416259766, "global_step": 358820, "epoch": 2135} {"train_loss": -12.707292556762695, "global_step": 358821, "epoch": 2135} {"train_loss": -12.159961700439453, "global_step": 358822, "epoch": 2135} {"train_loss": -12.414376258850098, "global_step": 358823, "epoch": 2135} {"train_loss": -12.554365158081055, "global_step": 358824, "epoch": 2135} {"train_loss": -12.343515396118164, "global_step": 358825, "epoch": 2135} {"train_loss": -12.615438461303711, "global_step": 358826, "epoch": 2135} {"train_loss": -12.16796875, "global_step": 358827, "epoch": 2135} {"train_loss": -12.43060302734375, "global_step": 358828, "epoch": 2135} {"train_loss": -12.099113464355469, "global_step": 358829, "epoch": 2135} {"train_loss": -12.276168823242188, "global_step": 358830, "epoch": 2135} {"train_loss": -12.371294021606445, "global_step": 358831, "epoch": 2135} {"train_loss": -12.521657943725586, "global_step": 358832, "epoch": 2135} {"train_loss": -12.339620590209961, "global_step": 358833, "epoch": 2135} {"train_loss": -12.582098007202148, "global_step": 358834, "epoch": 2135} {"train_loss": -12.097160339355469, "global_step": 358835, "epoch": 2135} {"train_loss": -12.167795181274414, "global_step": 358836, "epoch": 2135} {"train_loss": -12.192749977111816, "global_step": 358837, "epoch": 2135} {"train_loss": -12.084735870361328, "global_step": 358838, "epoch": 2135} {"train_loss": -12.406270980834961, "global_step": 358839, "epoch": 2135} {"train_loss": -11.703085899353027, "global_step": 358840, "epoch": 2135} {"train_loss": -11.338582038879395, "global_step": 358841, "epoch": 2135} {"train_loss": -11.20689582824707, "global_step": 358842, "epoch": 2135} {"train_loss": -12.06397819519043, "global_step": 358843, "epoch": 2135} {"train_loss": -12.04041862487793, "global_step": 358844, "epoch": 2135} {"train_loss": -11.99502182006836, "global_step": 358845, "epoch": 2135} {"train_loss": -11.986701965332031, "global_step": 358846, "epoch": 2135} {"train_loss": -11.672167897224426, "global_step": 358847, "epoch": 2135, "val_loss": 289333.46875, "train_action_mse_error": 3.495948076248169} {"train_loss": -12.25567626953125, "global_step": 358848, "epoch": 2136} {"train_loss": -11.561761856079102, "global_step": 358849, "epoch": 2136} {"train_loss": -11.956488609313965, "global_step": 358850, "epoch": 2136} {"train_loss": -12.125434875488281, "global_step": 358851, "epoch": 2136} {"train_loss": -11.642871856689453, "global_step": 358852, "epoch": 2136} {"train_loss": -11.834539413452148, "global_step": 358853, "epoch": 2136} {"train_loss": -11.614808082580566, "global_step": 358854, "epoch": 2136} {"train_loss": -11.8611478805542, "global_step": 358855, "epoch": 2136} {"train_loss": -10.685956954956055, "global_step": 358856, "epoch": 2136} {"train_loss": -11.849895477294922, "global_step": 358857, "epoch": 2136} {"train_loss": -11.05653190612793, "global_step": 358858, "epoch": 2136} {"train_loss": -12.31738567352295, "global_step": 358859, "epoch": 2136} {"train_loss": -11.322027206420898, "global_step": 358860, "epoch": 2136} {"train_loss": -11.632410049438477, "global_step": 358861, "epoch": 2136} {"train_loss": -11.32672119140625, "global_step": 358862, "epoch": 2136} {"train_loss": -12.386220932006836, "global_step": 358863, "epoch": 2136} {"train_loss": -11.992563247680664, "global_step": 358864, "epoch": 2136} {"train_loss": -12.357402801513672, "global_step": 358865, "epoch": 2136} {"train_loss": -11.911561965942383, "global_step": 358866, "epoch": 2136} {"train_loss": -12.123238563537598, "global_step": 358867, "epoch": 2136} {"train_loss": -10.826473236083984, "global_step": 358868, "epoch": 2136} {"train_loss": -12.148545265197754, "global_step": 358869, "epoch": 2136} {"train_loss": -11.236136436462402, "global_step": 358870, "epoch": 2136} {"train_loss": -11.33173942565918, "global_step": 358871, "epoch": 2136} {"train_loss": -11.010334014892578, "global_step": 358872, "epoch": 2136} {"train_loss": -10.694107055664062, "global_step": 358873, "epoch": 2136} {"train_loss": -11.655726432800293, "global_step": 358874, "epoch": 2136} {"train_loss": -11.160035133361816, "global_step": 358875, "epoch": 2136} {"train_loss": -11.228365898132324, "global_step": 358876, "epoch": 2136} {"train_loss": -10.378057479858398, "global_step": 358877, "epoch": 2136} {"train_loss": -11.306615829467773, "global_step": 358878, "epoch": 2136} {"train_loss": -11.240903854370117, "global_step": 358879, "epoch": 2136} {"train_loss": -10.890460968017578, "global_step": 358880, "epoch": 2136} {"train_loss": -12.028411865234375, "global_step": 358881, "epoch": 2136} {"train_loss": -10.961347579956055, "global_step": 358882, "epoch": 2136} {"train_loss": -12.061172485351562, "global_step": 358883, "epoch": 2136} {"train_loss": -11.616613388061523, "global_step": 358884, "epoch": 2136} {"train_loss": -12.08741569519043, "global_step": 358885, "epoch": 2136} {"train_loss": -11.317488670349121, "global_step": 358886, "epoch": 2136} {"train_loss": -11.90003776550293, "global_step": 358887, "epoch": 2136} {"train_loss": -11.596933364868164, "global_step": 358888, "epoch": 2136} {"train_loss": -12.163372993469238, "global_step": 358889, "epoch": 2136} {"train_loss": -11.647050857543945, "global_step": 358890, "epoch": 2136} {"train_loss": -11.405162811279297, "global_step": 358891, "epoch": 2136} {"train_loss": -12.075736999511719, "global_step": 358892, "epoch": 2136} {"train_loss": -12.10660457611084, "global_step": 358893, "epoch": 2136} {"train_loss": -11.677377700805664, "global_step": 358894, "epoch": 2136} {"train_loss": -12.268506050109863, "global_step": 358895, "epoch": 2136} {"train_loss": -11.805688858032227, "global_step": 358896, "epoch": 2136} {"train_loss": -12.15665054321289, "global_step": 358897, "epoch": 2136} {"train_loss": -12.201000213623047, "global_step": 358898, "epoch": 2136} {"train_loss": -11.675321578979492, "global_step": 358899, "epoch": 2136} {"train_loss": -12.23415756225586, "global_step": 358900, "epoch": 2136} {"train_loss": -11.763860702514648, "global_step": 358901, "epoch": 2136} {"train_loss": -12.256797790527344, "global_step": 358902, "epoch": 2136} {"train_loss": -12.044532775878906, "global_step": 358903, "epoch": 2136} {"train_loss": -12.019411087036133, "global_step": 358904, "epoch": 2136} {"train_loss": -12.214305877685547, "global_step": 358905, "epoch": 2136} {"train_loss": -12.028371810913086, "global_step": 358906, "epoch": 2136} {"train_loss": -12.33714771270752, "global_step": 358907, "epoch": 2136} {"train_loss": -12.107959747314453, "global_step": 358908, "epoch": 2136} {"train_loss": -12.318075180053711, "global_step": 358909, "epoch": 2136} {"train_loss": -12.083576202392578, "global_step": 358910, "epoch": 2136} {"train_loss": -12.263248443603516, "global_step": 358911, "epoch": 2136} {"train_loss": -12.209367752075195, "global_step": 358912, "epoch": 2136} {"train_loss": -12.020376205444336, "global_step": 358913, "epoch": 2136} {"train_loss": -12.131898880004883, "global_step": 358914, "epoch": 2136} {"train_loss": -12.304224014282227, "global_step": 358915, "epoch": 2136} {"train_loss": -12.188952445983887, "global_step": 358916, "epoch": 2136} {"train_loss": -12.253266334533691, "global_step": 358917, "epoch": 2136} {"train_loss": -12.289970397949219, "global_step": 358918, "epoch": 2136} {"train_loss": -12.133523941040039, "global_step": 358919, "epoch": 2136} {"train_loss": -12.54486083984375, "global_step": 358920, "epoch": 2136} {"train_loss": -12.472049713134766, "global_step": 358921, "epoch": 2136} {"train_loss": -12.397333145141602, "global_step": 358922, "epoch": 2136} {"train_loss": -12.32763957977295, "global_step": 358923, "epoch": 2136} {"train_loss": -12.347167015075684, "global_step": 358924, "epoch": 2136} {"train_loss": -12.504762649536133, "global_step": 358925, "epoch": 2136} {"train_loss": -12.255890846252441, "global_step": 358926, "epoch": 2136} {"train_loss": -12.443214416503906, "global_step": 358927, "epoch": 2136} {"train_loss": -11.975324630737305, "global_step": 358928, "epoch": 2136} {"train_loss": -12.446707725524902, "global_step": 358929, "epoch": 2136} {"train_loss": -12.422082901000977, "global_step": 358930, "epoch": 2136} {"train_loss": -12.378303527832031, "global_step": 358931, "epoch": 2136} {"train_loss": -12.20048713684082, "global_step": 358932, "epoch": 2136} {"train_loss": -12.325666427612305, "global_step": 358933, "epoch": 2136} {"train_loss": -12.371236801147461, "global_step": 358934, "epoch": 2136} {"train_loss": -12.285943984985352, "global_step": 358935, "epoch": 2136} {"train_loss": -12.04362678527832, "global_step": 358936, "epoch": 2136} {"train_loss": -12.5267333984375, "global_step": 358937, "epoch": 2136} {"train_loss": -11.968414306640625, "global_step": 358938, "epoch": 2136} {"train_loss": -12.412471771240234, "global_step": 358939, "epoch": 2136} {"train_loss": -12.378490447998047, "global_step": 358940, "epoch": 2136} {"train_loss": -11.9061861038208, "global_step": 358941, "epoch": 2136} {"train_loss": -12.182279586791992, "global_step": 358942, "epoch": 2136} {"train_loss": -12.285024642944336, "global_step": 358943, "epoch": 2136} {"train_loss": -12.284988403320312, "global_step": 358944, "epoch": 2136} {"train_loss": -11.935239791870117, "global_step": 358945, "epoch": 2136} {"train_loss": -12.07944107055664, "global_step": 358946, "epoch": 2136} {"train_loss": -11.854473114013672, "global_step": 358947, "epoch": 2136} {"train_loss": -11.898219108581543, "global_step": 358948, "epoch": 2136} {"train_loss": -12.073806762695312, "global_step": 358949, "epoch": 2136} {"train_loss": -12.268645286560059, "global_step": 358950, "epoch": 2136} {"train_loss": -11.997018814086914, "global_step": 358951, "epoch": 2136} {"train_loss": -12.002998352050781, "global_step": 358952, "epoch": 2136} {"train_loss": -11.382015228271484, "global_step": 358953, "epoch": 2136} {"train_loss": -11.236019134521484, "global_step": 358954, "epoch": 2136} {"train_loss": -11.215166091918945, "global_step": 358955, "epoch": 2136} {"train_loss": -11.372088432312012, "global_step": 358956, "epoch": 2136} {"train_loss": -11.555075645446777, "global_step": 358957, "epoch": 2136} {"train_loss": -11.647287368774414, "global_step": 358958, "epoch": 2136} {"train_loss": -11.758376121520996, "global_step": 358959, "epoch": 2136} {"train_loss": -12.32077407836914, "global_step": 358960, "epoch": 2136} {"train_loss": -12.22542953491211, "global_step": 358961, "epoch": 2136} {"train_loss": -11.95200252532959, "global_step": 358962, "epoch": 2136} {"train_loss": -11.848091125488281, "global_step": 358963, "epoch": 2136} {"train_loss": -11.393365859985352, "global_step": 358964, "epoch": 2136} {"train_loss": -11.746976852416992, "global_step": 358965, "epoch": 2136} {"train_loss": -11.839214324951172, "global_step": 358966, "epoch": 2136} {"train_loss": -12.189933776855469, "global_step": 358967, "epoch": 2136} {"train_loss": -11.726811408996582, "global_step": 358968, "epoch": 2136} {"train_loss": -12.258929252624512, "global_step": 358969, "epoch": 2136} {"train_loss": -11.370185852050781, "global_step": 358970, "epoch": 2136} {"train_loss": -12.27237606048584, "global_step": 358971, "epoch": 2136} {"train_loss": -11.675350189208984, "global_step": 358972, "epoch": 2136} {"train_loss": -12.290928840637207, "global_step": 358973, "epoch": 2136} {"train_loss": -11.765021324157715, "global_step": 358974, "epoch": 2136} {"train_loss": -11.796243667602539, "global_step": 358975, "epoch": 2136} {"train_loss": -10.903778076171875, "global_step": 358976, "epoch": 2136} {"train_loss": -11.344104766845703, "global_step": 358977, "epoch": 2136} {"train_loss": -12.211674690246582, "global_step": 358978, "epoch": 2136} {"train_loss": -11.566766738891602, "global_step": 358979, "epoch": 2136} {"train_loss": -12.067340850830078, "global_step": 358980, "epoch": 2136} {"train_loss": -11.815427780151367, "global_step": 358981, "epoch": 2136} {"train_loss": -12.410014152526855, "global_step": 358982, "epoch": 2136} {"train_loss": -11.950300216674805, "global_step": 358983, "epoch": 2136} {"train_loss": -11.454965591430664, "global_step": 358984, "epoch": 2136} {"train_loss": -11.560771942138672, "global_step": 358985, "epoch": 2136} {"train_loss": -11.80898666381836, "global_step": 358986, "epoch": 2136} {"train_loss": -10.929924011230469, "global_step": 358987, "epoch": 2136} {"train_loss": -11.738876342773438, "global_step": 358988, "epoch": 2136} {"train_loss": -11.694168090820312, "global_step": 358989, "epoch": 2136} {"train_loss": -11.573711395263672, "global_step": 358990, "epoch": 2136} {"train_loss": -12.045913696289062, "global_step": 358991, "epoch": 2136} {"train_loss": -11.56711196899414, "global_step": 358992, "epoch": 2136} {"train_loss": -11.881532669067383, "global_step": 358993, "epoch": 2136} {"train_loss": -11.525390625, "global_step": 358994, "epoch": 2136} {"train_loss": -11.532878875732422, "global_step": 358995, "epoch": 2136} {"train_loss": -11.464899063110352, "global_step": 358996, "epoch": 2136} {"train_loss": -11.236001014709473, "global_step": 358997, "epoch": 2136} {"train_loss": -11.839147567749023, "global_step": 358998, "epoch": 2136} {"train_loss": -11.665693283081055, "global_step": 358999, "epoch": 2136} {"train_loss": -11.449258804321289, "global_step": 359000, "epoch": 2136} {"train_loss": -12.01097583770752, "global_step": 359001, "epoch": 2136} {"train_loss": -10.960458755493164, "global_step": 359002, "epoch": 2136} {"train_loss": -11.405029296875, "global_step": 359003, "epoch": 2136} {"train_loss": -11.157169342041016, "global_step": 359004, "epoch": 2136} {"train_loss": -11.230169296264648, "global_step": 359005, "epoch": 2136} {"train_loss": -10.880985260009766, "global_step": 359006, "epoch": 2136} {"train_loss": -10.484390258789062, "global_step": 359007, "epoch": 2136} {"train_loss": -10.569103240966797, "global_step": 359008, "epoch": 2136} {"train_loss": -10.749027252197266, "global_step": 359009, "epoch": 2136} {"train_loss": -10.927046775817871, "global_step": 359010, "epoch": 2136} {"train_loss": -9.014720916748047, "global_step": 359011, "epoch": 2136} {"train_loss": -11.236315727233887, "global_step": 359012, "epoch": 2136} {"train_loss": -11.135841369628906, "global_step": 359013, "epoch": 2136} {"train_loss": -11.446290969848633, "global_step": 359014, "epoch": 2136} {"train_loss": -11.779995730945043, "global_step": 359015, "epoch": 2136, "val_loss": 296034.25} {"train_loss": -11.25619888305664, "global_step": 359016, "epoch": 2137} {"train_loss": -10.856267929077148, "global_step": 359017, "epoch": 2137} {"train_loss": -11.035932540893555, "global_step": 359018, "epoch": 2137} {"train_loss": -11.319910049438477, "global_step": 359019, "epoch": 2137} {"train_loss": -11.500155448913574, "global_step": 359020, "epoch": 2137} {"train_loss": -10.840469360351562, "global_step": 359021, "epoch": 2137} {"train_loss": -11.576101303100586, "global_step": 359022, "epoch": 2137} {"train_loss": -11.27206802368164, "global_step": 359023, "epoch": 2137} {"train_loss": -11.575464248657227, "global_step": 359024, "epoch": 2137} {"train_loss": -11.465923309326172, "global_step": 359025, "epoch": 2137} {"train_loss": -11.63779067993164, "global_step": 359026, "epoch": 2137} {"train_loss": -11.476325988769531, "global_step": 359027, "epoch": 2137} {"train_loss": -11.542717933654785, "global_step": 359028, "epoch": 2137} {"train_loss": -11.548784255981445, "global_step": 359029, "epoch": 2137} {"train_loss": -11.778817176818848, "global_step": 359030, "epoch": 2137} {"train_loss": -11.341056823730469, "global_step": 359031, "epoch": 2137} {"train_loss": -11.513964653015137, "global_step": 359032, "epoch": 2137} {"train_loss": -11.790443420410156, "global_step": 359033, "epoch": 2137} {"train_loss": -11.722917556762695, "global_step": 359034, "epoch": 2137} {"train_loss": -11.924850463867188, "global_step": 359035, "epoch": 2137} {"train_loss": -11.948719024658203, "global_step": 359036, "epoch": 2137} {"train_loss": -11.582147598266602, "global_step": 359037, "epoch": 2137} {"train_loss": -12.066556930541992, "global_step": 359038, "epoch": 2137} {"train_loss": -11.92815113067627, "global_step": 359039, "epoch": 2137} {"train_loss": -11.822650909423828, "global_step": 359040, "epoch": 2137} {"train_loss": -11.959586143493652, "global_step": 359041, "epoch": 2137} {"train_loss": -12.107721328735352, "global_step": 359042, "epoch": 2137} {"train_loss": -11.948249816894531, "global_step": 359043, "epoch": 2137} {"train_loss": -11.933225631713867, "global_step": 359044, "epoch": 2137} {"train_loss": -12.13818359375, "global_step": 359045, "epoch": 2137} {"train_loss": -11.934992790222168, "global_step": 359046, "epoch": 2137} {"train_loss": -12.180108070373535, "global_step": 359047, "epoch": 2137} {"train_loss": -11.701105117797852, "global_step": 359048, "epoch": 2137} {"train_loss": -12.302665710449219, "global_step": 359049, "epoch": 2137} {"train_loss": -11.988451957702637, "global_step": 359050, "epoch": 2137} {"train_loss": -12.07479476928711, "global_step": 359051, "epoch": 2137} {"train_loss": -11.998651504516602, "global_step": 359052, "epoch": 2137} {"train_loss": -11.938261985778809, "global_step": 359053, "epoch": 2137} {"train_loss": -11.858261108398438, "global_step": 359054, "epoch": 2137} {"train_loss": -12.230297088623047, "global_step": 359055, "epoch": 2137} {"train_loss": -11.658050537109375, "global_step": 359056, "epoch": 2137} {"train_loss": -11.572393417358398, "global_step": 359057, "epoch": 2137} {"train_loss": -11.75225830078125, "global_step": 359058, "epoch": 2137} {"train_loss": -11.871267318725586, "global_step": 359059, "epoch": 2137} {"train_loss": -11.823437690734863, "global_step": 359060, "epoch": 2137} {"train_loss": -12.013788223266602, "global_step": 359061, "epoch": 2137} {"train_loss": -12.065337181091309, "global_step": 359062, "epoch": 2137} {"train_loss": -11.955704689025879, "global_step": 359063, "epoch": 2137} {"train_loss": -12.252704620361328, "global_step": 359064, "epoch": 2137} {"train_loss": -11.926868438720703, "global_step": 359065, "epoch": 2137} {"train_loss": -11.996814727783203, "global_step": 359066, "epoch": 2137} {"train_loss": -11.658100128173828, "global_step": 359067, "epoch": 2137} {"train_loss": -12.272555351257324, "global_step": 359068, "epoch": 2137} {"train_loss": -11.989568710327148, "global_step": 359069, "epoch": 2137} {"train_loss": -12.017541885375977, "global_step": 359070, "epoch": 2137} {"train_loss": -12.250154495239258, "global_step": 359071, "epoch": 2137} {"train_loss": -12.28132438659668, "global_step": 359072, "epoch": 2137} {"train_loss": -12.333575248718262, "global_step": 359073, "epoch": 2137} {"train_loss": -11.805255889892578, "global_step": 359074, "epoch": 2137} {"train_loss": -12.323404312133789, "global_step": 359075, "epoch": 2137} {"train_loss": -12.41033935546875, "global_step": 359076, "epoch": 2137} {"train_loss": -12.38763427734375, "global_step": 359077, "epoch": 2137} {"train_loss": -12.200362205505371, "global_step": 359078, "epoch": 2137} {"train_loss": -12.383718490600586, "global_step": 359079, "epoch": 2137} {"train_loss": -12.146041870117188, "global_step": 359080, "epoch": 2137} {"train_loss": -12.354900360107422, "global_step": 359081, "epoch": 2137} {"train_loss": -12.027725219726562, "global_step": 359082, "epoch": 2137} {"train_loss": -12.308778762817383, "global_step": 359083, "epoch": 2137} {"train_loss": -12.112881660461426, "global_step": 359084, "epoch": 2137} {"train_loss": -12.231893539428711, "global_step": 359085, "epoch": 2137} {"train_loss": -12.487895965576172, "global_step": 359086, "epoch": 2137} {"train_loss": -12.351141929626465, "global_step": 359087, "epoch": 2137} {"train_loss": -12.58812427520752, "global_step": 359088, "epoch": 2137} {"train_loss": -12.253904342651367, "global_step": 359089, "epoch": 2137} {"train_loss": -12.545788764953613, "global_step": 359090, "epoch": 2137} {"train_loss": -11.853355407714844, "global_step": 359091, "epoch": 2137} {"train_loss": -12.482468605041504, "global_step": 359092, "epoch": 2137} {"train_loss": -12.341276168823242, "global_step": 359093, "epoch": 2137} {"train_loss": -12.565489768981934, "global_step": 359094, "epoch": 2137} {"train_loss": -12.012174606323242, "global_step": 359095, "epoch": 2137} {"train_loss": -12.372550964355469, "global_step": 359096, "epoch": 2137} {"train_loss": -11.787272453308105, "global_step": 359097, "epoch": 2137} {"train_loss": -11.977522850036621, "global_step": 359098, "epoch": 2137} {"train_loss": -12.108192443847656, "global_step": 359099, "epoch": 2137} {"train_loss": -12.101615905761719, "global_step": 359100, "epoch": 2137} {"train_loss": -12.541481971740723, "global_step": 359101, "epoch": 2137} {"train_loss": -12.289702415466309, "global_step": 359102, "epoch": 2137} {"train_loss": -12.477729797363281, "global_step": 359103, "epoch": 2137} {"train_loss": -12.33189582824707, "global_step": 359104, "epoch": 2137} {"train_loss": -11.667515754699707, "global_step": 359105, "epoch": 2137} {"train_loss": -12.572198867797852, "global_step": 359106, "epoch": 2137} {"train_loss": -11.77048110961914, "global_step": 359107, "epoch": 2137} {"train_loss": -10.961973190307617, "global_step": 359108, "epoch": 2137} {"train_loss": -12.089089393615723, "global_step": 359109, "epoch": 2137} {"train_loss": -11.914148330688477, "global_step": 359110, "epoch": 2137} {"train_loss": -11.167875289916992, "global_step": 359111, "epoch": 2137} {"train_loss": -12.279735565185547, "global_step": 359112, "epoch": 2137} {"train_loss": -11.83221435546875, "global_step": 359113, "epoch": 2137} {"train_loss": -11.796422004699707, "global_step": 359114, "epoch": 2137} {"train_loss": -11.468005180358887, "global_step": 359115, "epoch": 2137} {"train_loss": -11.507551193237305, "global_step": 359116, "epoch": 2137} {"train_loss": -11.143339157104492, "global_step": 359117, "epoch": 2137} {"train_loss": -12.136306762695312, "global_step": 359118, "epoch": 2137} {"train_loss": -11.023286819458008, "global_step": 359119, "epoch": 2137} {"train_loss": -12.271286010742188, "global_step": 359120, "epoch": 2137} {"train_loss": -11.640213012695312, "global_step": 359121, "epoch": 2137} {"train_loss": -11.222301483154297, "global_step": 359122, "epoch": 2137} {"train_loss": -12.166025161743164, "global_step": 359123, "epoch": 2137} {"train_loss": -10.664105415344238, "global_step": 359124, "epoch": 2137} {"train_loss": -11.984472274780273, "global_step": 359125, "epoch": 2137} {"train_loss": -11.196013450622559, "global_step": 359126, "epoch": 2137} {"train_loss": -11.740877151489258, "global_step": 359127, "epoch": 2137} {"train_loss": -11.662349700927734, "global_step": 359128, "epoch": 2137} {"train_loss": -11.372323989868164, "global_step": 359129, "epoch": 2137} {"train_loss": -10.96268081665039, "global_step": 359130, "epoch": 2137} {"train_loss": -11.163702011108398, "global_step": 359131, "epoch": 2137} {"train_loss": -11.958106994628906, "global_step": 359132, "epoch": 2137} {"train_loss": -11.233955383300781, "global_step": 359133, "epoch": 2137} {"train_loss": -11.814130783081055, "global_step": 359134, "epoch": 2137} {"train_loss": -11.666746139526367, "global_step": 359135, "epoch": 2137} {"train_loss": -11.7816162109375, "global_step": 359136, "epoch": 2137} {"train_loss": -11.769872665405273, "global_step": 359137, "epoch": 2137} {"train_loss": -11.803787231445312, "global_step": 359138, "epoch": 2137} {"train_loss": -11.372720718383789, "global_step": 359139, "epoch": 2137} {"train_loss": -11.940065383911133, "global_step": 359140, "epoch": 2137} {"train_loss": -11.902856826782227, "global_step": 359141, "epoch": 2137} {"train_loss": -11.79499626159668, "global_step": 359142, "epoch": 2137} {"train_loss": -11.854679107666016, "global_step": 359143, "epoch": 2137} {"train_loss": -11.488849639892578, "global_step": 359144, "epoch": 2137} {"train_loss": -12.288080215454102, "global_step": 359145, "epoch": 2137} {"train_loss": -11.802987098693848, "global_step": 359146, "epoch": 2137} {"train_loss": -12.209817886352539, "global_step": 359147, "epoch": 2137} {"train_loss": -12.03194808959961, "global_step": 359148, "epoch": 2137} {"train_loss": -11.771970748901367, "global_step": 359149, "epoch": 2137} {"train_loss": -12.213438034057617, "global_step": 359150, "epoch": 2137} {"train_loss": -12.040011405944824, "global_step": 359151, "epoch": 2137} {"train_loss": -12.38189697265625, "global_step": 359152, "epoch": 2137} {"train_loss": -11.551749229431152, "global_step": 359153, "epoch": 2137} {"train_loss": -12.450384140014648, "global_step": 359154, "epoch": 2137} {"train_loss": -12.145137786865234, "global_step": 359155, "epoch": 2137} {"train_loss": -12.337737083435059, "global_step": 359156, "epoch": 2137} {"train_loss": -12.342010498046875, "global_step": 359157, "epoch": 2137} {"train_loss": -12.0111083984375, "global_step": 359158, "epoch": 2137} {"train_loss": -12.367375373840332, "global_step": 359159, "epoch": 2137} {"train_loss": -11.926431655883789, "global_step": 359160, "epoch": 2137} {"train_loss": -12.48189926147461, "global_step": 359161, "epoch": 2137} {"train_loss": -12.461261749267578, "global_step": 359162, "epoch": 2137} {"train_loss": -12.408126831054688, "global_step": 359163, "epoch": 2137} {"train_loss": -12.15146255493164, "global_step": 359164, "epoch": 2137} {"train_loss": -12.534576416015625, "global_step": 359165, "epoch": 2137} {"train_loss": -12.199586868286133, "global_step": 359166, "epoch": 2137} {"train_loss": -12.439165115356445, "global_step": 359167, "epoch": 2137} {"train_loss": -12.59268569946289, "global_step": 359168, "epoch": 2137} {"train_loss": -12.249526977539062, "global_step": 359169, "epoch": 2137} {"train_loss": -12.50793743133545, "global_step": 359170, "epoch": 2137} {"train_loss": -12.196815490722656, "global_step": 359171, "epoch": 2137} {"train_loss": -12.645511627197266, "global_step": 359172, "epoch": 2137} {"train_loss": -12.493611335754395, "global_step": 359173, "epoch": 2137} {"train_loss": -12.339492797851562, "global_step": 359174, "epoch": 2137} {"train_loss": -12.254951477050781, "global_step": 359175, "epoch": 2137} {"train_loss": -12.469676971435547, "global_step": 359176, "epoch": 2137} {"train_loss": -12.115198135375977, "global_step": 359177, "epoch": 2137} {"train_loss": -12.407440185546875, "global_step": 359178, "epoch": 2137} {"train_loss": -12.135344505310059, "global_step": 359179, "epoch": 2137} {"train_loss": -12.480152130126953, "global_step": 359180, "epoch": 2137} {"train_loss": -12.26535701751709, "global_step": 359181, "epoch": 2137} {"train_loss": -12.356245040893555, "global_step": 359182, "epoch": 2137} {"train_loss": -11.95272597812471, "global_step": 359183, "epoch": 2137, "val_loss": 294647.375} {"train_loss": -12.162508010864258, "global_step": 359184, "epoch": 2138} {"train_loss": -12.217594146728516, "global_step": 359185, "epoch": 2138} {"train_loss": -11.971452713012695, "global_step": 359186, "epoch": 2138} {"train_loss": -12.248529434204102, "global_step": 359187, "epoch": 2138} {"train_loss": -11.962562561035156, "global_step": 359188, "epoch": 2138} {"train_loss": -12.033553123474121, "global_step": 359189, "epoch": 2138} {"train_loss": -12.231281280517578, "global_step": 359190, "epoch": 2138} {"train_loss": -12.553668022155762, "global_step": 359191, "epoch": 2138} {"train_loss": -12.43454360961914, "global_step": 359192, "epoch": 2138} {"train_loss": -12.446998596191406, "global_step": 359193, "epoch": 2138} {"train_loss": -12.492683410644531, "global_step": 359194, "epoch": 2138} {"train_loss": -12.312918663024902, "global_step": 359195, "epoch": 2138} {"train_loss": -12.406164169311523, "global_step": 359196, "epoch": 2138} {"train_loss": -12.053330421447754, "global_step": 359197, "epoch": 2138} {"train_loss": -12.430432319641113, "global_step": 359198, "epoch": 2138} {"train_loss": -12.53622055053711, "global_step": 359199, "epoch": 2138} {"train_loss": -12.325538635253906, "global_step": 359200, "epoch": 2138} {"train_loss": -12.456901550292969, "global_step": 359201, "epoch": 2138} {"train_loss": -12.06098461151123, "global_step": 359202, "epoch": 2138} {"train_loss": -12.187841415405273, "global_step": 359203, "epoch": 2138} {"train_loss": -12.685404777526855, "global_step": 359204, "epoch": 2138} {"train_loss": -12.53339958190918, "global_step": 359205, "epoch": 2138} {"train_loss": -12.202041625976562, "global_step": 359206, "epoch": 2138} {"train_loss": -12.356929779052734, "global_step": 359207, "epoch": 2138} {"train_loss": -12.43798828125, "global_step": 359208, "epoch": 2138} {"train_loss": -11.838860511779785, "global_step": 359209, "epoch": 2138} {"train_loss": -12.06098747253418, "global_step": 359210, "epoch": 2138} {"train_loss": -12.360969543457031, "global_step": 359211, "epoch": 2138} {"train_loss": -12.193947792053223, "global_step": 359212, "epoch": 2138} {"train_loss": -12.288963317871094, "global_step": 359213, "epoch": 2138} {"train_loss": -12.716207504272461, "global_step": 359214, "epoch": 2138} {"train_loss": -11.985937118530273, "global_step": 359215, "epoch": 2138} {"train_loss": -12.239934921264648, "global_step": 359216, "epoch": 2138} {"train_loss": -12.19129467010498, "global_step": 359217, "epoch": 2138} {"train_loss": -12.391282081604004, "global_step": 359218, "epoch": 2138} {"train_loss": -12.01309871673584, "global_step": 359219, "epoch": 2138} {"train_loss": -12.158940315246582, "global_step": 359220, "epoch": 2138} {"train_loss": -12.340572357177734, "global_step": 359221, "epoch": 2138} {"train_loss": -11.013124465942383, "global_step": 359222, "epoch": 2138} {"train_loss": -12.459808349609375, "global_step": 359223, "epoch": 2138} {"train_loss": -11.853635787963867, "global_step": 359224, "epoch": 2138} {"train_loss": -11.763721466064453, "global_step": 359225, "epoch": 2138} {"train_loss": -12.084355354309082, "global_step": 359226, "epoch": 2138} {"train_loss": -12.217766761779785, "global_step": 359227, "epoch": 2138} {"train_loss": -12.412535667419434, "global_step": 359228, "epoch": 2138} {"train_loss": -12.279945373535156, "global_step": 359229, "epoch": 2138} {"train_loss": -12.534276008605957, "global_step": 359230, "epoch": 2138} {"train_loss": -12.182671546936035, "global_step": 359231, "epoch": 2138} {"train_loss": -12.755969047546387, "global_step": 359232, "epoch": 2138} {"train_loss": -12.564153671264648, "global_step": 359233, "epoch": 2138} {"train_loss": -12.199549674987793, "global_step": 359234, "epoch": 2138} {"train_loss": -12.1329345703125, "global_step": 359235, "epoch": 2138} {"train_loss": -12.709744453430176, "global_step": 359236, "epoch": 2138} {"train_loss": -12.200077056884766, "global_step": 359237, "epoch": 2138} {"train_loss": -12.492624282836914, "global_step": 359238, "epoch": 2138} {"train_loss": -12.573979377746582, "global_step": 359239, "epoch": 2138} {"train_loss": -12.530377388000488, "global_step": 359240, "epoch": 2138} {"train_loss": -11.658864974975586, "global_step": 359241, "epoch": 2138} {"train_loss": -12.32335376739502, "global_step": 359242, "epoch": 2138} {"train_loss": -12.271005630493164, "global_step": 359243, "epoch": 2138} {"train_loss": -12.910360336303711, "global_step": 359244, "epoch": 2138} {"train_loss": -12.408114433288574, "global_step": 359245, "epoch": 2138} {"train_loss": -12.376792907714844, "global_step": 359246, "epoch": 2138} {"train_loss": -11.971094131469727, "global_step": 359247, "epoch": 2138} {"train_loss": -12.677461624145508, "global_step": 359248, "epoch": 2138} {"train_loss": -11.641616821289062, "global_step": 359249, "epoch": 2138} {"train_loss": -11.403350830078125, "global_step": 359250, "epoch": 2138} {"train_loss": -11.971670150756836, "global_step": 359251, "epoch": 2138} {"train_loss": -12.516313552856445, "global_step": 359252, "epoch": 2138} {"train_loss": -11.532695770263672, "global_step": 359253, "epoch": 2138} {"train_loss": -11.74728775024414, "global_step": 359254, "epoch": 2138} {"train_loss": -12.242634773254395, "global_step": 359255, "epoch": 2138} {"train_loss": -11.43024730682373, "global_step": 359256, "epoch": 2138} {"train_loss": -12.0869140625, "global_step": 359257, "epoch": 2138} {"train_loss": -12.292875289916992, "global_step": 359258, "epoch": 2138} {"train_loss": -11.850273132324219, "global_step": 359259, "epoch": 2138} {"train_loss": -12.38218879699707, "global_step": 359260, "epoch": 2138} {"train_loss": -11.855390548706055, "global_step": 359261, "epoch": 2138} {"train_loss": -11.42971134185791, "global_step": 359262, "epoch": 2138} {"train_loss": -12.144265174865723, "global_step": 359263, "epoch": 2138} {"train_loss": -9.825161933898926, "global_step": 359264, "epoch": 2138} {"train_loss": -10.341474533081055, "global_step": 359265, "epoch": 2138} {"train_loss": -12.238025665283203, "global_step": 359266, "epoch": 2138} {"train_loss": -11.193365097045898, "global_step": 359267, "epoch": 2138} {"train_loss": -10.751920700073242, "global_step": 359268, "epoch": 2138} {"train_loss": -12.004095077514648, "global_step": 359269, "epoch": 2138} {"train_loss": -10.406229019165039, "global_step": 359270, "epoch": 2138} {"train_loss": -10.295670509338379, "global_step": 359271, "epoch": 2138} {"train_loss": -10.289298057556152, "global_step": 359272, "epoch": 2138} {"train_loss": -11.210718154907227, "global_step": 359273, "epoch": 2138} {"train_loss": -9.696407318115234, "global_step": 359274, "epoch": 2138} {"train_loss": -9.400354385375977, "global_step": 359275, "epoch": 2138} {"train_loss": -11.87922191619873, "global_step": 359276, "epoch": 2138} {"train_loss": -9.025874137878418, "global_step": 359277, "epoch": 2138} {"train_loss": -11.153765678405762, "global_step": 359278, "epoch": 2138} {"train_loss": -9.624645233154297, "global_step": 359279, "epoch": 2138} {"train_loss": -10.224706649780273, "global_step": 359280, "epoch": 2138} {"train_loss": -8.314496040344238, "global_step": 359281, "epoch": 2138} {"train_loss": -10.242759704589844, "global_step": 359282, "epoch": 2138} {"train_loss": -10.012907028198242, "global_step": 359283, "epoch": 2138} {"train_loss": -9.401567459106445, "global_step": 359284, "epoch": 2138} {"train_loss": -10.465951919555664, "global_step": 359285, "epoch": 2138} {"train_loss": -11.062239646911621, "global_step": 359286, "epoch": 2138} {"train_loss": -10.585445404052734, "global_step": 359287, "epoch": 2138} {"train_loss": -11.601917266845703, "global_step": 359288, "epoch": 2138} {"train_loss": -10.831029891967773, "global_step": 359289, "epoch": 2138} {"train_loss": -11.815134048461914, "global_step": 359290, "epoch": 2138} {"train_loss": -10.799703598022461, "global_step": 359291, "epoch": 2138} {"train_loss": -11.547372817993164, "global_step": 359292, "epoch": 2138} {"train_loss": -10.996495246887207, "global_step": 359293, "epoch": 2138} {"train_loss": -11.34153938293457, "global_step": 359294, "epoch": 2138} {"train_loss": -11.717187881469727, "global_step": 359295, "epoch": 2138} {"train_loss": -11.736467361450195, "global_step": 359296, "epoch": 2138} {"train_loss": -11.859770774841309, "global_step": 359297, "epoch": 2138} {"train_loss": -11.599557876586914, "global_step": 359298, "epoch": 2138} {"train_loss": -12.050771713256836, "global_step": 359299, "epoch": 2138} {"train_loss": -11.817383766174316, "global_step": 359300, "epoch": 2138} {"train_loss": -11.811814308166504, "global_step": 359301, "epoch": 2138} {"train_loss": -11.703601837158203, "global_step": 359302, "epoch": 2138} {"train_loss": -11.987226486206055, "global_step": 359303, "epoch": 2138} {"train_loss": -11.894779205322266, "global_step": 359304, "epoch": 2138} {"train_loss": -11.793846130371094, "global_step": 359305, "epoch": 2138} {"train_loss": -12.127456665039062, "global_step": 359306, "epoch": 2138} {"train_loss": -12.2445650100708, "global_step": 359307, "epoch": 2138} {"train_loss": -11.918811798095703, "global_step": 359308, "epoch": 2138} {"train_loss": -12.199666023254395, "global_step": 359309, "epoch": 2138} {"train_loss": -11.894882202148438, "global_step": 359310, "epoch": 2138} {"train_loss": -12.095836639404297, "global_step": 359311, "epoch": 2138} {"train_loss": -12.365971565246582, "global_step": 359312, "epoch": 2138} {"train_loss": -12.061254501342773, "global_step": 359313, "epoch": 2138} {"train_loss": -12.19599437713623, "global_step": 359314, "epoch": 2138} {"train_loss": -11.849470138549805, "global_step": 359315, "epoch": 2138} {"train_loss": -11.8389253616333, "global_step": 359316, "epoch": 2138} {"train_loss": -12.227617263793945, "global_step": 359317, "epoch": 2138} {"train_loss": -12.213976860046387, "global_step": 359318, "epoch": 2138} {"train_loss": -12.223323822021484, "global_step": 359319, "epoch": 2138} {"train_loss": -12.036561012268066, "global_step": 359320, "epoch": 2138} {"train_loss": -12.033400535583496, "global_step": 359321, "epoch": 2138} {"train_loss": -12.239980697631836, "global_step": 359322, "epoch": 2138} {"train_loss": -12.025741577148438, "global_step": 359323, "epoch": 2138} {"train_loss": -12.220685958862305, "global_step": 359324, "epoch": 2138} {"train_loss": -12.362082481384277, "global_step": 359325, "epoch": 2138} {"train_loss": -12.400825500488281, "global_step": 359326, "epoch": 2138} {"train_loss": -12.374343872070312, "global_step": 359327, "epoch": 2138} {"train_loss": -12.209281921386719, "global_step": 359328, "epoch": 2138} {"train_loss": -12.525369644165039, "global_step": 359329, "epoch": 2138} {"train_loss": -12.55397891998291, "global_step": 359330, "epoch": 2138} {"train_loss": -12.459857940673828, "global_step": 359331, "epoch": 2138} {"train_loss": -12.399532318115234, "global_step": 359332, "epoch": 2138} {"train_loss": -12.440021514892578, "global_step": 359333, "epoch": 2138} {"train_loss": -12.39545726776123, "global_step": 359334, "epoch": 2138} {"train_loss": -12.322786331176758, "global_step": 359335, "epoch": 2138} {"train_loss": -12.161431312561035, "global_step": 359336, "epoch": 2138} {"train_loss": -12.403472900390625, "global_step": 359337, "epoch": 2138} {"train_loss": -12.645648002624512, "global_step": 359338, "epoch": 2138} {"train_loss": -12.354811668395996, "global_step": 359339, "epoch": 2138} {"train_loss": -12.552216529846191, "global_step": 359340, "epoch": 2138} {"train_loss": -12.565948486328125, "global_step": 359341, "epoch": 2138} {"train_loss": -12.593757629394531, "global_step": 359342, "epoch": 2138} {"train_loss": -12.125093460083008, "global_step": 359343, "epoch": 2138} {"train_loss": -12.518356323242188, "global_step": 359344, "epoch": 2138} {"train_loss": -12.331066131591797, "global_step": 359345, "epoch": 2138} {"train_loss": -12.638127326965332, "global_step": 359346, "epoch": 2138} {"train_loss": -12.219715118408203, "global_step": 359347, "epoch": 2138} {"train_loss": -12.49532413482666, "global_step": 359348, "epoch": 2138} {"train_loss": -12.526307106018066, "global_step": 359349, "epoch": 2138} {"train_loss": -12.114725112915039, "global_step": 359350, "epoch": 2138} {"train_loss": -11.907143047877721, "global_step": 359351, "epoch": 2138, "val_loss": 290254.6875} {"train_loss": -12.402061462402344, "global_step": 359352, "epoch": 2139} {"train_loss": -11.85493278503418, "global_step": 359353, "epoch": 2139} {"train_loss": -12.423942565917969, "global_step": 359354, "epoch": 2139} {"train_loss": -11.864093780517578, "global_step": 359355, "epoch": 2139} {"train_loss": -12.32376480102539, "global_step": 359356, "epoch": 2139} {"train_loss": -12.01628303527832, "global_step": 359357, "epoch": 2139} {"train_loss": -12.14129638671875, "global_step": 359358, "epoch": 2139} {"train_loss": -12.087150573730469, "global_step": 359359, "epoch": 2139} {"train_loss": -12.33897590637207, "global_step": 359360, "epoch": 2139} {"train_loss": -12.280495643615723, "global_step": 359361, "epoch": 2139} {"train_loss": -11.637653350830078, "global_step": 359362, "epoch": 2139} {"train_loss": -11.798871994018555, "global_step": 359363, "epoch": 2139} {"train_loss": -12.685267448425293, "global_step": 359364, "epoch": 2139} {"train_loss": -11.37987232208252, "global_step": 359365, "epoch": 2139} {"train_loss": -12.370357513427734, "global_step": 359366, "epoch": 2139} {"train_loss": -12.18492317199707, "global_step": 359367, "epoch": 2139} {"train_loss": -11.234901428222656, "global_step": 359368, "epoch": 2139} {"train_loss": -12.052353858947754, "global_step": 359369, "epoch": 2139} {"train_loss": -11.833133697509766, "global_step": 359370, "epoch": 2139} {"train_loss": -11.874554634094238, "global_step": 359371, "epoch": 2139} {"train_loss": -11.52949047088623, "global_step": 359372, "epoch": 2139} {"train_loss": -11.788106918334961, "global_step": 359373, "epoch": 2139} {"train_loss": -12.00564956665039, "global_step": 359374, "epoch": 2139} {"train_loss": -11.754709243774414, "global_step": 359375, "epoch": 2139} {"train_loss": -11.022796630859375, "global_step": 359376, "epoch": 2139} {"train_loss": -11.86857795715332, "global_step": 359377, "epoch": 2139} {"train_loss": -10.996687889099121, "global_step": 359378, "epoch": 2139} {"train_loss": -10.684340476989746, "global_step": 359379, "epoch": 2139} {"train_loss": -12.213327407836914, "global_step": 359380, "epoch": 2139} {"train_loss": -11.300609588623047, "global_step": 359381, "epoch": 2139} {"train_loss": -11.753755569458008, "global_step": 359382, "epoch": 2139} {"train_loss": -11.124898910522461, "global_step": 359383, "epoch": 2139} {"train_loss": -11.679039001464844, "global_step": 359384, "epoch": 2139} {"train_loss": -11.758903503417969, "global_step": 359385, "epoch": 2139} {"train_loss": -11.71672248840332, "global_step": 359386, "epoch": 2139} {"train_loss": -12.070882797241211, "global_step": 359387, "epoch": 2139} {"train_loss": -11.277579307556152, "global_step": 359388, "epoch": 2139} {"train_loss": -12.220137596130371, "global_step": 359389, "epoch": 2139} {"train_loss": -11.718196868896484, "global_step": 359390, "epoch": 2139} {"train_loss": -11.348454475402832, "global_step": 359391, "epoch": 2139} {"train_loss": -11.60805892944336, "global_step": 359392, "epoch": 2139} {"train_loss": -9.80743408203125, "global_step": 359393, "epoch": 2139} {"train_loss": -12.032855987548828, "global_step": 359394, "epoch": 2139} {"train_loss": -10.383344650268555, "global_step": 359395, "epoch": 2139} {"train_loss": -11.475641250610352, "global_step": 359396, "epoch": 2139} {"train_loss": -10.19540023803711, "global_step": 359397, "epoch": 2139} {"train_loss": -11.268081665039062, "global_step": 359398, "epoch": 2139} {"train_loss": -10.431421279907227, "global_step": 359399, "epoch": 2139} {"train_loss": -11.370798110961914, "global_step": 359400, "epoch": 2139} {"train_loss": -11.664661407470703, "global_step": 359401, "epoch": 2139} {"train_loss": -10.949749946594238, "global_step": 359402, "epoch": 2139} {"train_loss": -11.720053672790527, "global_step": 359403, "epoch": 2139} {"train_loss": -11.398406028747559, "global_step": 359404, "epoch": 2139} {"train_loss": -11.289556503295898, "global_step": 359405, "epoch": 2139} {"train_loss": -11.467172622680664, "global_step": 359406, "epoch": 2139} {"train_loss": -11.625165939331055, "global_step": 359407, "epoch": 2139} {"train_loss": -11.867619514465332, "global_step": 359408, "epoch": 2139} {"train_loss": -11.863059997558594, "global_step": 359409, "epoch": 2139} {"train_loss": -11.604999542236328, "global_step": 359410, "epoch": 2139} {"train_loss": -11.67138671875, "global_step": 359411, "epoch": 2139} {"train_loss": -11.862937927246094, "global_step": 359412, "epoch": 2139} {"train_loss": -11.998708724975586, "global_step": 359413, "epoch": 2139} {"train_loss": -12.071741104125977, "global_step": 359414, "epoch": 2139} {"train_loss": -11.77212905883789, "global_step": 359415, "epoch": 2139} {"train_loss": -12.116893768310547, "global_step": 359416, "epoch": 2139} {"train_loss": -11.605097770690918, "global_step": 359417, "epoch": 2139} {"train_loss": -12.003427505493164, "global_step": 359418, "epoch": 2139} {"train_loss": -11.963062286376953, "global_step": 359419, "epoch": 2139} {"train_loss": -11.698297500610352, "global_step": 359420, "epoch": 2139} {"train_loss": -11.779500961303711, "global_step": 359421, "epoch": 2139} {"train_loss": -12.048894882202148, "global_step": 359422, "epoch": 2139} {"train_loss": -11.799398422241211, "global_step": 359423, "epoch": 2139} {"train_loss": -11.860169410705566, "global_step": 359424, "epoch": 2139} {"train_loss": -11.00855827331543, "global_step": 359425, "epoch": 2139} {"train_loss": -11.938840866088867, "global_step": 359426, "epoch": 2139} {"train_loss": -11.485722541809082, "global_step": 359427, "epoch": 2139} {"train_loss": -11.82528305053711, "global_step": 359428, "epoch": 2139} {"train_loss": -11.84920597076416, "global_step": 359429, "epoch": 2139} {"train_loss": -11.915651321411133, "global_step": 359430, "epoch": 2139} {"train_loss": -11.927732467651367, "global_step": 359431, "epoch": 2139} {"train_loss": -11.674888610839844, "global_step": 359432, "epoch": 2139} {"train_loss": -12.263206481933594, "global_step": 359433, "epoch": 2139} {"train_loss": -11.395832061767578, "global_step": 359434, "epoch": 2139} {"train_loss": -12.418478012084961, "global_step": 359435, "epoch": 2139} {"train_loss": -11.427658081054688, "global_step": 359436, "epoch": 2139} {"train_loss": -12.316603660583496, "global_step": 359437, "epoch": 2139} {"train_loss": -11.386286735534668, "global_step": 359438, "epoch": 2139} {"train_loss": -12.38526439666748, "global_step": 359439, "epoch": 2139} {"train_loss": -11.964164733886719, "global_step": 359440, "epoch": 2139} {"train_loss": -12.120691299438477, "global_step": 359441, "epoch": 2139} {"train_loss": -12.234020233154297, "global_step": 359442, "epoch": 2139} {"train_loss": -12.267461776733398, "global_step": 359443, "epoch": 2139} {"train_loss": -12.359564781188965, "global_step": 359444, "epoch": 2139} {"train_loss": -12.309152603149414, "global_step": 359445, "epoch": 2139} {"train_loss": -12.327455520629883, "global_step": 359446, "epoch": 2139} {"train_loss": -12.40108871459961, "global_step": 359447, "epoch": 2139} {"train_loss": -12.063833236694336, "global_step": 359448, "epoch": 2139} {"train_loss": -12.488286972045898, "global_step": 359449, "epoch": 2139} {"train_loss": -12.26705551147461, "global_step": 359450, "epoch": 2139} {"train_loss": -12.45494270324707, "global_step": 359451, "epoch": 2139} {"train_loss": -12.06229019165039, "global_step": 359452, "epoch": 2139} {"train_loss": -12.396550178527832, "global_step": 359453, "epoch": 2139} {"train_loss": -12.413119316101074, "global_step": 359454, "epoch": 2139} {"train_loss": -12.468513488769531, "global_step": 359455, "epoch": 2139} {"train_loss": -12.410283088684082, "global_step": 359456, "epoch": 2139} {"train_loss": -12.525764465332031, "global_step": 359457, "epoch": 2139} {"train_loss": -12.314592361450195, "global_step": 359458, "epoch": 2139} {"train_loss": -12.30456256866455, "global_step": 359459, "epoch": 2139} {"train_loss": -12.588139533996582, "global_step": 359460, "epoch": 2139} {"train_loss": -12.379863739013672, "global_step": 359461, "epoch": 2139} {"train_loss": -12.645830154418945, "global_step": 359462, "epoch": 2139} {"train_loss": -12.213411331176758, "global_step": 359463, "epoch": 2139} {"train_loss": -12.266717910766602, "global_step": 359464, "epoch": 2139} {"train_loss": -12.028997421264648, "global_step": 359465, "epoch": 2139} {"train_loss": -11.795654296875, "global_step": 359466, "epoch": 2139} {"train_loss": -12.371198654174805, "global_step": 359467, "epoch": 2139} {"train_loss": -11.483489990234375, "global_step": 359468, "epoch": 2139} {"train_loss": -12.414048194885254, "global_step": 359469, "epoch": 2139} {"train_loss": -12.19035530090332, "global_step": 359470, "epoch": 2139} {"train_loss": -11.859825134277344, "global_step": 359471, "epoch": 2139} {"train_loss": -12.148024559020996, "global_step": 359472, "epoch": 2139} {"train_loss": -12.597631454467773, "global_step": 359473, "epoch": 2139} {"train_loss": -12.490018844604492, "global_step": 359474, "epoch": 2139} {"train_loss": -12.487203598022461, "global_step": 359475, "epoch": 2139} {"train_loss": -12.252973556518555, "global_step": 359476, "epoch": 2139} {"train_loss": -12.419410705566406, "global_step": 359477, "epoch": 2139} {"train_loss": -12.526281356811523, "global_step": 359478, "epoch": 2139} {"train_loss": -12.477273941040039, "global_step": 359479, "epoch": 2139} {"train_loss": -12.534112930297852, "global_step": 359480, "epoch": 2139} {"train_loss": -12.39236068725586, "global_step": 359481, "epoch": 2139} {"train_loss": -12.487077713012695, "global_step": 359482, "epoch": 2139} {"train_loss": -12.692026138305664, "global_step": 359483, "epoch": 2139} {"train_loss": -12.496370315551758, "global_step": 359484, "epoch": 2139} {"train_loss": -12.358755111694336, "global_step": 359485, "epoch": 2139} {"train_loss": -12.697969436645508, "global_step": 359486, "epoch": 2139} {"train_loss": -12.356643676757812, "global_step": 359487, "epoch": 2139} {"train_loss": -12.43290901184082, "global_step": 359488, "epoch": 2139} {"train_loss": -12.477252006530762, "global_step": 359489, "epoch": 2139} {"train_loss": -12.371614456176758, "global_step": 359490, "epoch": 2139} {"train_loss": -12.56157112121582, "global_step": 359491, "epoch": 2139} {"train_loss": -12.422943115234375, "global_step": 359492, "epoch": 2139} {"train_loss": -12.465131759643555, "global_step": 359493, "epoch": 2139} {"train_loss": -12.189245223999023, "global_step": 359494, "epoch": 2139} {"train_loss": -12.536819458007812, "global_step": 359495, "epoch": 2139} {"train_loss": -12.163434982299805, "global_step": 359496, "epoch": 2139} {"train_loss": -12.299501419067383, "global_step": 359497, "epoch": 2139} {"train_loss": -12.495723724365234, "global_step": 359498, "epoch": 2139} {"train_loss": -12.278678894042969, "global_step": 359499, "epoch": 2139} {"train_loss": -12.451223373413086, "global_step": 359500, "epoch": 2139} {"train_loss": -12.440156936645508, "global_step": 359501, "epoch": 2139} {"train_loss": -12.679014205932617, "global_step": 359502, "epoch": 2139} {"train_loss": -12.528764724731445, "global_step": 359503, "epoch": 2139} {"train_loss": -12.519804000854492, "global_step": 359504, "epoch": 2139} {"train_loss": -12.708194732666016, "global_step": 359505, "epoch": 2139} {"train_loss": -12.49393081665039, "global_step": 359506, "epoch": 2139} {"train_loss": -12.686702728271484, "global_step": 359507, "epoch": 2139} {"train_loss": -12.58848762512207, "global_step": 359508, "epoch": 2139} {"train_loss": -12.55196475982666, "global_step": 359509, "epoch": 2139} {"train_loss": -12.41328239440918, "global_step": 359510, "epoch": 2139} {"train_loss": -12.101152420043945, "global_step": 359511, "epoch": 2139} {"train_loss": -12.668195724487305, "global_step": 359512, "epoch": 2139} {"train_loss": -12.426098823547363, "global_step": 359513, "epoch": 2139} {"train_loss": -12.261465072631836, "global_step": 359514, "epoch": 2139} {"train_loss": -12.646408081054688, "global_step": 359515, "epoch": 2139} {"train_loss": -12.30042839050293, "global_step": 359516, "epoch": 2139} {"train_loss": -12.790704727172852, "global_step": 359517, "epoch": 2139} {"train_loss": -12.469666481018066, "global_step": 359518, "epoch": 2139} {"train_loss": -12.029416566803341, "global_step": 359519, "epoch": 2139, "val_loss": 295432.5625} {"train_loss": -12.59664249420166, "global_step": 359520, "epoch": 2140} {"train_loss": -12.675695419311523, "global_step": 359521, "epoch": 2140} {"train_loss": -12.617526054382324, "global_step": 359522, "epoch": 2140} {"train_loss": -12.460901260375977, "global_step": 359523, "epoch": 2140} {"train_loss": -12.242612838745117, "global_step": 359524, "epoch": 2140} {"train_loss": -12.545611381530762, "global_step": 359525, "epoch": 2140} {"train_loss": -12.578255653381348, "global_step": 359526, "epoch": 2140} {"train_loss": -12.342108726501465, "global_step": 359527, "epoch": 2140} {"train_loss": -12.329943656921387, "global_step": 359528, "epoch": 2140} {"train_loss": -11.60693359375, "global_step": 359529, "epoch": 2140} {"train_loss": -12.190356254577637, "global_step": 359530, "epoch": 2140} {"train_loss": -12.549966812133789, "global_step": 359531, "epoch": 2140} {"train_loss": -12.123201370239258, "global_step": 359532, "epoch": 2140} {"train_loss": -11.808737754821777, "global_step": 359533, "epoch": 2140} {"train_loss": -12.168075561523438, "global_step": 359534, "epoch": 2140} {"train_loss": -12.434272766113281, "global_step": 359535, "epoch": 2140} {"train_loss": -11.511143684387207, "global_step": 359536, "epoch": 2140} {"train_loss": -11.337879180908203, "global_step": 359537, "epoch": 2140} {"train_loss": -11.320917129516602, "global_step": 359538, "epoch": 2140} {"train_loss": -10.811627388000488, "global_step": 359539, "epoch": 2140} {"train_loss": -11.817319869995117, "global_step": 359540, "epoch": 2140} {"train_loss": -11.445651054382324, "global_step": 359541, "epoch": 2140} {"train_loss": -12.08275318145752, "global_step": 359542, "epoch": 2140} {"train_loss": -11.691426277160645, "global_step": 359543, "epoch": 2140} {"train_loss": -10.520683288574219, "global_step": 359544, "epoch": 2140} {"train_loss": -11.057565689086914, "global_step": 359545, "epoch": 2140} {"train_loss": -11.275535583496094, "global_step": 359546, "epoch": 2140} {"train_loss": -10.892489433288574, "global_step": 359547, "epoch": 2140} {"train_loss": -9.886404991149902, "global_step": 359548, "epoch": 2140} {"train_loss": -8.678081512451172, "global_step": 359549, "epoch": 2140} {"train_loss": -8.28664779663086, "global_step": 359550, "epoch": 2140} {"train_loss": -9.10954761505127, "global_step": 359551, "epoch": 2140} {"train_loss": -9.574235916137695, "global_step": 359552, "epoch": 2140} {"train_loss": -10.39121150970459, "global_step": 359553, "epoch": 2140} {"train_loss": -10.059222221374512, "global_step": 359554, "epoch": 2140} {"train_loss": -10.3763427734375, "global_step": 359555, "epoch": 2140} {"train_loss": -10.894956588745117, "global_step": 359556, "epoch": 2140} {"train_loss": -10.09977912902832, "global_step": 359557, "epoch": 2140} {"train_loss": -9.706461906433105, "global_step": 359558, "epoch": 2140} {"train_loss": -11.053543090820312, "global_step": 359559, "epoch": 2140} {"train_loss": -10.320999145507812, "global_step": 359560, "epoch": 2140} {"train_loss": -11.012765884399414, "global_step": 359561, "epoch": 2140} {"train_loss": -10.58482551574707, "global_step": 359562, "epoch": 2140} {"train_loss": -11.50345516204834, "global_step": 359563, "epoch": 2140} {"train_loss": -11.156081199645996, "global_step": 359564, "epoch": 2140} {"train_loss": -10.902141571044922, "global_step": 359565, "epoch": 2140} {"train_loss": -11.406194686889648, "global_step": 359566, "epoch": 2140} {"train_loss": -11.53658676147461, "global_step": 359567, "epoch": 2140} {"train_loss": -11.242713928222656, "global_step": 359568, "epoch": 2140} {"train_loss": -11.58486557006836, "global_step": 359569, "epoch": 2140} {"train_loss": -11.215560913085938, "global_step": 359570, "epoch": 2140} {"train_loss": -11.770120620727539, "global_step": 359571, "epoch": 2140} {"train_loss": -11.484891891479492, "global_step": 359572, "epoch": 2140} {"train_loss": -11.378138542175293, "global_step": 359573, "epoch": 2140} {"train_loss": -12.237350463867188, "global_step": 359574, "epoch": 2140} {"train_loss": -11.517542839050293, "global_step": 359575, "epoch": 2140} {"train_loss": -11.071797370910645, "global_step": 359576, "epoch": 2140} {"train_loss": -11.597940444946289, "global_step": 359577, "epoch": 2140} {"train_loss": -11.057245254516602, "global_step": 359578, "epoch": 2140} {"train_loss": -11.602055549621582, "global_step": 359579, "epoch": 2140} {"train_loss": -11.169748306274414, "global_step": 359580, "epoch": 2140} {"train_loss": -10.944818496704102, "global_step": 359581, "epoch": 2140} {"train_loss": -11.616994857788086, "global_step": 359582, "epoch": 2140} {"train_loss": -11.186220169067383, "global_step": 359583, "epoch": 2140} {"train_loss": -11.913119316101074, "global_step": 359584, "epoch": 2140} {"train_loss": -10.811039924621582, "global_step": 359585, "epoch": 2140} {"train_loss": -12.025365829467773, "global_step": 359586, "epoch": 2140} {"train_loss": -11.556102752685547, "global_step": 359587, "epoch": 2140} {"train_loss": -12.022320747375488, "global_step": 359588, "epoch": 2140} {"train_loss": -12.00306224822998, "global_step": 359589, "epoch": 2140} {"train_loss": -12.183055877685547, "global_step": 359590, "epoch": 2140} {"train_loss": -11.926553726196289, "global_step": 359591, "epoch": 2140} {"train_loss": -11.86533260345459, "global_step": 359592, "epoch": 2140} {"train_loss": -11.562259674072266, "global_step": 359593, "epoch": 2140} {"train_loss": -11.797200202941895, "global_step": 359594, "epoch": 2140} {"train_loss": -12.102689743041992, "global_step": 359595, "epoch": 2140} {"train_loss": -12.000324249267578, "global_step": 359596, "epoch": 2140} {"train_loss": -11.915489196777344, "global_step": 359597, "epoch": 2140} {"train_loss": -11.995729446411133, "global_step": 359598, "epoch": 2140} {"train_loss": -11.894033432006836, "global_step": 359599, "epoch": 2140} {"train_loss": -12.201141357421875, "global_step": 359600, "epoch": 2140} {"train_loss": -11.9755859375, "global_step": 359601, "epoch": 2140} {"train_loss": -12.072649955749512, "global_step": 359602, "epoch": 2140} {"train_loss": -12.106390953063965, "global_step": 359603, "epoch": 2140} {"train_loss": -12.112542152404785, "global_step": 359604, "epoch": 2140} {"train_loss": -12.117870330810547, "global_step": 359605, "epoch": 2140} {"train_loss": -11.829648971557617, "global_step": 359606, "epoch": 2140} {"train_loss": -12.389744758605957, "global_step": 359607, "epoch": 2140} {"train_loss": -11.901042938232422, "global_step": 359608, "epoch": 2140} {"train_loss": -12.249317169189453, "global_step": 359609, "epoch": 2140} {"train_loss": -12.23944091796875, "global_step": 359610, "epoch": 2140} {"train_loss": -12.286725997924805, "global_step": 359611, "epoch": 2140} {"train_loss": -12.400192260742188, "global_step": 359612, "epoch": 2140} {"train_loss": -12.160089492797852, "global_step": 359613, "epoch": 2140} {"train_loss": -12.311915397644043, "global_step": 359614, "epoch": 2140} {"train_loss": -12.001564025878906, "global_step": 359615, "epoch": 2140} {"train_loss": -12.384641647338867, "global_step": 359616, "epoch": 2140} {"train_loss": -12.3025541305542, "global_step": 359617, "epoch": 2140} {"train_loss": -12.163461685180664, "global_step": 359618, "epoch": 2140} {"train_loss": -12.273390769958496, "global_step": 359619, "epoch": 2140} {"train_loss": -12.255173683166504, "global_step": 359620, "epoch": 2140} {"train_loss": -12.487993240356445, "global_step": 359621, "epoch": 2140} {"train_loss": -12.469034194946289, "global_step": 359622, "epoch": 2140} {"train_loss": -12.383739471435547, "global_step": 359623, "epoch": 2140} {"train_loss": -12.233579635620117, "global_step": 359624, "epoch": 2140} {"train_loss": -12.615428924560547, "global_step": 359625, "epoch": 2140} {"train_loss": -12.416644096374512, "global_step": 359626, "epoch": 2140} {"train_loss": -12.392385482788086, "global_step": 359627, "epoch": 2140} {"train_loss": -12.41404914855957, "global_step": 359628, "epoch": 2140} {"train_loss": -12.634331703186035, "global_step": 359629, "epoch": 2140} {"train_loss": -12.585697174072266, "global_step": 359630, "epoch": 2140} {"train_loss": -12.456581115722656, "global_step": 359631, "epoch": 2140} {"train_loss": -12.512866973876953, "global_step": 359632, "epoch": 2140} {"train_loss": -12.704850196838379, "global_step": 359633, "epoch": 2140} {"train_loss": -12.611737251281738, "global_step": 359634, "epoch": 2140} {"train_loss": -12.499225616455078, "global_step": 359635, "epoch": 2140} {"train_loss": -12.647876739501953, "global_step": 359636, "epoch": 2140} {"train_loss": -12.424208641052246, "global_step": 359637, "epoch": 2140} {"train_loss": -12.500864028930664, "global_step": 359638, "epoch": 2140} {"train_loss": -12.430475234985352, "global_step": 359639, "epoch": 2140} {"train_loss": -12.48751449584961, "global_step": 359640, "epoch": 2140} {"train_loss": -12.619752883911133, "global_step": 359641, "epoch": 2140} {"train_loss": -12.540021896362305, "global_step": 359642, "epoch": 2140} {"train_loss": -12.548839569091797, "global_step": 359643, "epoch": 2140} {"train_loss": -12.401545524597168, "global_step": 359644, "epoch": 2140} {"train_loss": -12.397871017456055, "global_step": 359645, "epoch": 2140} {"train_loss": -12.65514850616455, "global_step": 359646, "epoch": 2140} {"train_loss": -12.577661514282227, "global_step": 359647, "epoch": 2140} {"train_loss": -12.616121292114258, "global_step": 359648, "epoch": 2140} {"train_loss": -12.528029441833496, "global_step": 359649, "epoch": 2140} {"train_loss": -12.837150573730469, "global_step": 359650, "epoch": 2140} {"train_loss": -12.59758186340332, "global_step": 359651, "epoch": 2140} {"train_loss": -12.735466003417969, "global_step": 359652, "epoch": 2140} {"train_loss": -12.679518699645996, "global_step": 359653, "epoch": 2140} {"train_loss": -12.683971405029297, "global_step": 359654, "epoch": 2140} {"train_loss": -12.568645477294922, "global_step": 359655, "epoch": 2140} {"train_loss": -12.741148948669434, "global_step": 359656, "epoch": 2140} {"train_loss": -12.689706802368164, "global_step": 359657, "epoch": 2140} {"train_loss": -12.550287246704102, "global_step": 359658, "epoch": 2140} {"train_loss": -12.66789722442627, "global_step": 359659, "epoch": 2140} {"train_loss": -12.319416999816895, "global_step": 359660, "epoch": 2140} {"train_loss": -12.641175270080566, "global_step": 359661, "epoch": 2140} {"train_loss": -12.596630096435547, "global_step": 359662, "epoch": 2140} {"train_loss": -12.442038536071777, "global_step": 359663, "epoch": 2140} {"train_loss": -11.990910530090332, "global_step": 359664, "epoch": 2140} {"train_loss": -12.459646224975586, "global_step": 359665, "epoch": 2140} {"train_loss": -12.571651458740234, "global_step": 359666, "epoch": 2140} {"train_loss": -12.630264282226562, "global_step": 359667, "epoch": 2140} {"train_loss": -12.752439498901367, "global_step": 359668, "epoch": 2140} {"train_loss": -12.610939025878906, "global_step": 359669, "epoch": 2140} {"train_loss": -12.72711181640625, "global_step": 359670, "epoch": 2140} {"train_loss": -12.623477935791016, "global_step": 359671, "epoch": 2140} {"train_loss": -11.935555458068848, "global_step": 359672, "epoch": 2140} {"train_loss": -11.130697250366211, "global_step": 359673, "epoch": 2140} {"train_loss": -12.041950225830078, "global_step": 359674, "epoch": 2140} {"train_loss": -12.549870491027832, "global_step": 359675, "epoch": 2140} {"train_loss": -11.431787490844727, "global_step": 359676, "epoch": 2140} {"train_loss": -11.829795837402344, "global_step": 359677, "epoch": 2140} {"train_loss": -12.427715301513672, "global_step": 359678, "epoch": 2140} {"train_loss": -10.7413330078125, "global_step": 359679, "epoch": 2140} {"train_loss": -10.094915390014648, "global_step": 359680, "epoch": 2140} {"train_loss": -12.361971855163574, "global_step": 359681, "epoch": 2140} {"train_loss": -10.603564262390137, "global_step": 359682, "epoch": 2140} {"train_loss": -10.923847198486328, "global_step": 359683, "epoch": 2140} {"train_loss": -11.63604736328125, "global_step": 359684, "epoch": 2140} {"train_loss": -12.158360481262207, "global_step": 359685, "epoch": 2140} {"train_loss": -11.26517391204834, "global_step": 359686, "epoch": 2140} {"train_loss": -11.858005529358273, "global_step": 359687, "epoch": 2140, "val_loss": 286108.40625, "train_action_mse_error": 1.4585174322128296} {"train_loss": -9.88083267211914, "global_step": 359688, "epoch": 2141} {"train_loss": -11.138720512390137, "global_step": 359689, "epoch": 2141} {"train_loss": -10.367069244384766, "global_step": 359690, "epoch": 2141} {"train_loss": -10.534250259399414, "global_step": 359691, "epoch": 2141} {"train_loss": -10.52132797241211, "global_step": 359692, "epoch": 2141} {"train_loss": -10.306421279907227, "global_step": 359693, "epoch": 2141} {"train_loss": -11.131383895874023, "global_step": 359694, "epoch": 2141} {"train_loss": -9.965267181396484, "global_step": 359695, "epoch": 2141} {"train_loss": -10.858887672424316, "global_step": 359696, "epoch": 2141} {"train_loss": -9.932082176208496, "global_step": 359697, "epoch": 2141} {"train_loss": -11.173246383666992, "global_step": 359698, "epoch": 2141} {"train_loss": -11.80119514465332, "global_step": 359699, "epoch": 2141} {"train_loss": -11.780083656311035, "global_step": 359700, "epoch": 2141} {"train_loss": -11.683632850646973, "global_step": 359701, "epoch": 2141} {"train_loss": -11.203876495361328, "global_step": 359702, "epoch": 2141} {"train_loss": -11.865565299987793, "global_step": 359703, "epoch": 2141} {"train_loss": -11.510979652404785, "global_step": 359704, "epoch": 2141} {"train_loss": -11.120992660522461, "global_step": 359705, "epoch": 2141} {"train_loss": -11.934675216674805, "global_step": 359706, "epoch": 2141} {"train_loss": -11.667000770568848, "global_step": 359707, "epoch": 2141} {"train_loss": -11.443403244018555, "global_step": 359708, "epoch": 2141} {"train_loss": -11.171794891357422, "global_step": 359709, "epoch": 2141} {"train_loss": -11.48678970336914, "global_step": 359710, "epoch": 2141} {"train_loss": -10.526174545288086, "global_step": 359711, "epoch": 2141} {"train_loss": -12.062231063842773, "global_step": 359712, "epoch": 2141} {"train_loss": -11.087308883666992, "global_step": 359713, "epoch": 2141} {"train_loss": -11.831707000732422, "global_step": 359714, "epoch": 2141} {"train_loss": -11.984334945678711, "global_step": 359715, "epoch": 2141} {"train_loss": -11.640756607055664, "global_step": 359716, "epoch": 2141} {"train_loss": -11.994331359863281, "global_step": 359717, "epoch": 2141} {"train_loss": -11.618478775024414, "global_step": 359718, "epoch": 2141} {"train_loss": -11.63943099975586, "global_step": 359719, "epoch": 2141} {"train_loss": -11.777759552001953, "global_step": 359720, "epoch": 2141} {"train_loss": -11.934928894042969, "global_step": 359721, "epoch": 2141} {"train_loss": -11.792865753173828, "global_step": 359722, "epoch": 2141} {"train_loss": -11.824831008911133, "global_step": 359723, "epoch": 2141} {"train_loss": -11.887856483459473, "global_step": 359724, "epoch": 2141} {"train_loss": -11.720170974731445, "global_step": 359725, "epoch": 2141} {"train_loss": -11.693288803100586, "global_step": 359726, "epoch": 2141} {"train_loss": -11.817865371704102, "global_step": 359727, "epoch": 2141} {"train_loss": -11.632464408874512, "global_step": 359728, "epoch": 2141} {"train_loss": -12.075444221496582, "global_step": 359729, "epoch": 2141} {"train_loss": -11.824583053588867, "global_step": 359730, "epoch": 2141} {"train_loss": -11.98259162902832, "global_step": 359731, "epoch": 2141} {"train_loss": -11.505901336669922, "global_step": 359732, "epoch": 2141} {"train_loss": -12.117557525634766, "global_step": 359733, "epoch": 2141} {"train_loss": -11.812427520751953, "global_step": 359734, "epoch": 2141} {"train_loss": -12.134827613830566, "global_step": 359735, "epoch": 2141} {"train_loss": -12.198166847229004, "global_step": 359736, "epoch": 2141} {"train_loss": -12.135835647583008, "global_step": 359737, "epoch": 2141} {"train_loss": -12.241744995117188, "global_step": 359738, "epoch": 2141} {"train_loss": -11.968697547912598, "global_step": 359739, "epoch": 2141} {"train_loss": -12.450706481933594, "global_step": 359740, "epoch": 2141} {"train_loss": -12.195280075073242, "global_step": 359741, "epoch": 2141} {"train_loss": -12.292442321777344, "global_step": 359742, "epoch": 2141} {"train_loss": -12.073173522949219, "global_step": 359743, "epoch": 2141} {"train_loss": -12.353296279907227, "global_step": 359744, "epoch": 2141} {"train_loss": -12.349717140197754, "global_step": 359745, "epoch": 2141} {"train_loss": -12.08162784576416, "global_step": 359746, "epoch": 2141} {"train_loss": -12.20516586303711, "global_step": 359747, "epoch": 2141} {"train_loss": -12.355098724365234, "global_step": 359748, "epoch": 2141} {"train_loss": -12.308698654174805, "global_step": 359749, "epoch": 2141} {"train_loss": -12.342520713806152, "global_step": 359750, "epoch": 2141} {"train_loss": -12.558586120605469, "global_step": 359751, "epoch": 2141} {"train_loss": -12.069795608520508, "global_step": 359752, "epoch": 2141} {"train_loss": -12.557470321655273, "global_step": 359753, "epoch": 2141} {"train_loss": -12.045999526977539, "global_step": 359754, "epoch": 2141} {"train_loss": -12.288848876953125, "global_step": 359755, "epoch": 2141} {"train_loss": -12.355732917785645, "global_step": 359756, "epoch": 2141} {"train_loss": -12.447493553161621, "global_step": 359757, "epoch": 2141} {"train_loss": -12.611139297485352, "global_step": 359758, "epoch": 2141} {"train_loss": -12.522673606872559, "global_step": 359759, "epoch": 2141} {"train_loss": -11.922972679138184, "global_step": 359760, "epoch": 2141} {"train_loss": -12.359020233154297, "global_step": 359761, "epoch": 2141} {"train_loss": -12.287944793701172, "global_step": 359762, "epoch": 2141} {"train_loss": -11.858152389526367, "global_step": 359763, "epoch": 2141} {"train_loss": -12.254312515258789, "global_step": 359764, "epoch": 2141} {"train_loss": -12.538934707641602, "global_step": 359765, "epoch": 2141} {"train_loss": -11.976844787597656, "global_step": 359766, "epoch": 2141} {"train_loss": -12.431724548339844, "global_step": 359767, "epoch": 2141} {"train_loss": -12.112691879272461, "global_step": 359768, "epoch": 2141} {"train_loss": -12.421632766723633, "global_step": 359769, "epoch": 2141} {"train_loss": -12.172416687011719, "global_step": 359770, "epoch": 2141} {"train_loss": -12.137843132019043, "global_step": 359771, "epoch": 2141} {"train_loss": -12.56317138671875, "global_step": 359772, "epoch": 2141} {"train_loss": -12.21879768371582, "global_step": 359773, "epoch": 2141} {"train_loss": -12.292887687683105, "global_step": 359774, "epoch": 2141} {"train_loss": -12.295745849609375, "global_step": 359775, "epoch": 2141} {"train_loss": -12.176543235778809, "global_step": 359776, "epoch": 2141} {"train_loss": -11.407546997070312, "global_step": 359777, "epoch": 2141} {"train_loss": -12.345142364501953, "global_step": 359778, "epoch": 2141} {"train_loss": -11.973150253295898, "global_step": 359779, "epoch": 2141} {"train_loss": -10.021566390991211, "global_step": 359780, "epoch": 2141} {"train_loss": -11.380508422851562, "global_step": 359781, "epoch": 2141} {"train_loss": -11.514442443847656, "global_step": 359782, "epoch": 2141} {"train_loss": -10.836299896240234, "global_step": 359783, "epoch": 2141} {"train_loss": -11.409358978271484, "global_step": 359784, "epoch": 2141} {"train_loss": -10.074126243591309, "global_step": 359785, "epoch": 2141} {"train_loss": -9.944561004638672, "global_step": 359786, "epoch": 2141} {"train_loss": -11.735584259033203, "global_step": 359787, "epoch": 2141} {"train_loss": -11.007734298706055, "global_step": 359788, "epoch": 2141} {"train_loss": -11.365080833435059, "global_step": 359789, "epoch": 2141} {"train_loss": -12.00865650177002, "global_step": 359790, "epoch": 2141} {"train_loss": -11.558186531066895, "global_step": 359791, "epoch": 2141} {"train_loss": -12.158319473266602, "global_step": 359792, "epoch": 2141} {"train_loss": -10.585461616516113, "global_step": 359793, "epoch": 2141} {"train_loss": -11.292396545410156, "global_step": 359794, "epoch": 2141} {"train_loss": -11.687232971191406, "global_step": 359795, "epoch": 2141} {"train_loss": -10.788475036621094, "global_step": 359796, "epoch": 2141} {"train_loss": -12.042213439941406, "global_step": 359797, "epoch": 2141} {"train_loss": -11.26460075378418, "global_step": 359798, "epoch": 2141} {"train_loss": -12.115044593811035, "global_step": 359799, "epoch": 2141} {"train_loss": -11.404352188110352, "global_step": 359800, "epoch": 2141} {"train_loss": -11.950586318969727, "global_step": 359801, "epoch": 2141} {"train_loss": -11.777280807495117, "global_step": 359802, "epoch": 2141} {"train_loss": -11.779085159301758, "global_step": 359803, "epoch": 2141} {"train_loss": -12.176952362060547, "global_step": 359804, "epoch": 2141} {"train_loss": -11.806013107299805, "global_step": 359805, "epoch": 2141} {"train_loss": -12.442375183105469, "global_step": 359806, "epoch": 2141} {"train_loss": -11.957649230957031, "global_step": 359807, "epoch": 2141} {"train_loss": -12.398313522338867, "global_step": 359808, "epoch": 2141} {"train_loss": -11.926780700683594, "global_step": 359809, "epoch": 2141} {"train_loss": -12.115266799926758, "global_step": 359810, "epoch": 2141} {"train_loss": -12.34610652923584, "global_step": 359811, "epoch": 2141} {"train_loss": -12.290980339050293, "global_step": 359812, "epoch": 2141} {"train_loss": -12.562108993530273, "global_step": 359813, "epoch": 2141} {"train_loss": -12.218320846557617, "global_step": 359814, "epoch": 2141} {"train_loss": -12.13673210144043, "global_step": 359815, "epoch": 2141} {"train_loss": -12.551319122314453, "global_step": 359816, "epoch": 2141} {"train_loss": -12.197321891784668, "global_step": 359817, "epoch": 2141} {"train_loss": -12.374675750732422, "global_step": 359818, "epoch": 2141} {"train_loss": -12.440601348876953, "global_step": 359819, "epoch": 2141} {"train_loss": -12.179311752319336, "global_step": 359820, "epoch": 2141} {"train_loss": -12.346002578735352, "global_step": 359821, "epoch": 2141} {"train_loss": -12.389630317687988, "global_step": 359822, "epoch": 2141} {"train_loss": -12.316108703613281, "global_step": 359823, "epoch": 2141} {"train_loss": -12.474203109741211, "global_step": 359824, "epoch": 2141} {"train_loss": -12.258082389831543, "global_step": 359825, "epoch": 2141} {"train_loss": -12.39020824432373, "global_step": 359826, "epoch": 2141} {"train_loss": -12.468347549438477, "global_step": 359827, "epoch": 2141} {"train_loss": -12.67327880859375, "global_step": 359828, "epoch": 2141} {"train_loss": -12.702510833740234, "global_step": 359829, "epoch": 2141} {"train_loss": -12.397638320922852, "global_step": 359830, "epoch": 2141} {"train_loss": -12.596683502197266, "global_step": 359831, "epoch": 2141} {"train_loss": -12.513903617858887, "global_step": 359832, "epoch": 2141} {"train_loss": -12.257806777954102, "global_step": 359833, "epoch": 2141} {"train_loss": -12.647387504577637, "global_step": 359834, "epoch": 2141} {"train_loss": -12.38133430480957, "global_step": 359835, "epoch": 2141} {"train_loss": -12.655338287353516, "global_step": 359836, "epoch": 2141} {"train_loss": -12.593708992004395, "global_step": 359837, "epoch": 2141} {"train_loss": -12.674165725708008, "global_step": 359838, "epoch": 2141} {"train_loss": -12.645429611206055, "global_step": 359839, "epoch": 2141} {"train_loss": -12.48004150390625, "global_step": 359840, "epoch": 2141} {"train_loss": -12.492330551147461, "global_step": 359841, "epoch": 2141} {"train_loss": -12.548770904541016, "global_step": 359842, "epoch": 2141} {"train_loss": -12.760496139526367, "global_step": 359843, "epoch": 2141} {"train_loss": -12.73832893371582, "global_step": 359844, "epoch": 2141} {"train_loss": -12.683009147644043, "global_step": 359845, "epoch": 2141} {"train_loss": -12.699305534362793, "global_step": 359846, "epoch": 2141} {"train_loss": -12.648488998413086, "global_step": 359847, "epoch": 2141} {"train_loss": -12.661365509033203, "global_step": 359848, "epoch": 2141} {"train_loss": -12.597517967224121, "global_step": 359849, "epoch": 2141} {"train_loss": -12.59472942352295, "global_step": 359850, "epoch": 2141} {"train_loss": -12.830643653869629, "global_step": 359851, "epoch": 2141} {"train_loss": -12.868664741516113, "global_step": 359852, "epoch": 2141} {"train_loss": -12.660528182983398, "global_step": 359853, "epoch": 2141} {"train_loss": -12.723612785339355, "global_step": 359854, "epoch": 2141} {"train_loss": -11.946468455450875, "global_step": 359855, "epoch": 2141, "val_loss": 292498.15625} {"train_loss": -12.764892578125, "global_step": 359856, "epoch": 2142} {"train_loss": -12.828622817993164, "global_step": 359857, "epoch": 2142} {"train_loss": -12.774060249328613, "global_step": 359858, "epoch": 2142} {"train_loss": -12.867593765258789, "global_step": 359859, "epoch": 2142} {"train_loss": -12.673004150390625, "global_step": 359860, "epoch": 2142} {"train_loss": -12.726436614990234, "global_step": 359861, "epoch": 2142} {"train_loss": -12.475403785705566, "global_step": 359862, "epoch": 2142} {"train_loss": -12.030101776123047, "global_step": 359863, "epoch": 2142} {"train_loss": -12.224576950073242, "global_step": 359864, "epoch": 2142} {"train_loss": -12.811502456665039, "global_step": 359865, "epoch": 2142} {"train_loss": -12.025812149047852, "global_step": 359866, "epoch": 2142} {"train_loss": -12.183135986328125, "global_step": 359867, "epoch": 2142} {"train_loss": -12.028871536254883, "global_step": 359868, "epoch": 2142} {"train_loss": -11.510696411132812, "global_step": 359869, "epoch": 2142} {"train_loss": -12.131715774536133, "global_step": 359870, "epoch": 2142} {"train_loss": -11.703458786010742, "global_step": 359871, "epoch": 2142} {"train_loss": -11.656869888305664, "global_step": 359872, "epoch": 2142} {"train_loss": -12.414268493652344, "global_step": 359873, "epoch": 2142} {"train_loss": -12.506949424743652, "global_step": 359874, "epoch": 2142} {"train_loss": -12.46870231628418, "global_step": 359875, "epoch": 2142} {"train_loss": -12.097529411315918, "global_step": 359876, "epoch": 2142} {"train_loss": -10.671533584594727, "global_step": 359877, "epoch": 2142} {"train_loss": -10.202723503112793, "global_step": 359878, "epoch": 2142} {"train_loss": -12.018365859985352, "global_step": 359879, "epoch": 2142} {"train_loss": -12.115966796875, "global_step": 359880, "epoch": 2142} {"train_loss": -10.916131019592285, "global_step": 359881, "epoch": 2142} {"train_loss": -11.940936088562012, "global_step": 359882, "epoch": 2142} {"train_loss": -11.064513206481934, "global_step": 359883, "epoch": 2142} {"train_loss": -11.270856857299805, "global_step": 359884, "epoch": 2142} {"train_loss": -11.575122833251953, "global_step": 359885, "epoch": 2142} {"train_loss": -9.847213745117188, "global_step": 359886, "epoch": 2142} {"train_loss": -10.41299057006836, "global_step": 359887, "epoch": 2142} {"train_loss": -9.501602172851562, "global_step": 359888, "epoch": 2142} {"train_loss": -10.733802795410156, "global_step": 359889, "epoch": 2142} {"train_loss": -9.75073528289795, "global_step": 359890, "epoch": 2142} {"train_loss": -7.905890941619873, "global_step": 359891, "epoch": 2142} {"train_loss": -10.609447479248047, "global_step": 359892, "epoch": 2142} {"train_loss": -8.102826118469238, "global_step": 359893, "epoch": 2142} {"train_loss": -8.034154891967773, "global_step": 359894, "epoch": 2142} {"train_loss": -10.37845230102539, "global_step": 359895, "epoch": 2142} {"train_loss": -10.3511962890625, "global_step": 359896, "epoch": 2142} {"train_loss": -9.657218933105469, "global_step": 359897, "epoch": 2142} {"train_loss": -10.369328498840332, "global_step": 359898, "epoch": 2142} {"train_loss": -10.350772857666016, "global_step": 359899, "epoch": 2142} {"train_loss": -11.131057739257812, "global_step": 359900, "epoch": 2142} {"train_loss": -11.100595474243164, "global_step": 359901, "epoch": 2142} {"train_loss": -11.089852333068848, "global_step": 359902, "epoch": 2142} {"train_loss": -11.687429428100586, "global_step": 359903, "epoch": 2142} {"train_loss": -10.822183609008789, "global_step": 359904, "epoch": 2142} {"train_loss": -10.769851684570312, "global_step": 359905, "epoch": 2142} {"train_loss": -11.030656814575195, "global_step": 359906, "epoch": 2142} {"train_loss": -11.330857276916504, "global_step": 359907, "epoch": 2142} {"train_loss": -11.220647811889648, "global_step": 359908, "epoch": 2142} {"train_loss": -11.595945358276367, "global_step": 359909, "epoch": 2142} {"train_loss": -10.63304328918457, "global_step": 359910, "epoch": 2142} {"train_loss": -12.07777214050293, "global_step": 359911, "epoch": 2142} {"train_loss": -10.924470901489258, "global_step": 359912, "epoch": 2142} {"train_loss": -12.134577751159668, "global_step": 359913, "epoch": 2142} {"train_loss": -11.480091094970703, "global_step": 359914, "epoch": 2142} {"train_loss": -11.830730438232422, "global_step": 359915, "epoch": 2142} {"train_loss": -11.702173233032227, "global_step": 359916, "epoch": 2142} {"train_loss": -11.663837432861328, "global_step": 359917, "epoch": 2142} {"train_loss": -11.54688549041748, "global_step": 359918, "epoch": 2142} {"train_loss": -12.194156646728516, "global_step": 359919, "epoch": 2142} {"train_loss": -11.51162338256836, "global_step": 359920, "epoch": 2142} {"train_loss": -11.821613311767578, "global_step": 359921, "epoch": 2142} {"train_loss": -11.641382217407227, "global_step": 359922, "epoch": 2142} {"train_loss": -12.157360076904297, "global_step": 359923, "epoch": 2142} {"train_loss": -11.335960388183594, "global_step": 359924, "epoch": 2142} {"train_loss": -12.236446380615234, "global_step": 359925, "epoch": 2142} {"train_loss": -11.541864395141602, "global_step": 359926, "epoch": 2142} {"train_loss": -12.13566780090332, "global_step": 359927, "epoch": 2142} {"train_loss": -12.00704574584961, "global_step": 359928, "epoch": 2142} {"train_loss": -11.949094772338867, "global_step": 359929, "epoch": 2142} {"train_loss": -12.03581428527832, "global_step": 359930, "epoch": 2142} {"train_loss": -11.97248363494873, "global_step": 359931, "epoch": 2142} {"train_loss": -12.038549423217773, "global_step": 359932, "epoch": 2142} {"train_loss": -12.185962677001953, "global_step": 359933, "epoch": 2142} {"train_loss": -12.205621719360352, "global_step": 359934, "epoch": 2142} {"train_loss": -12.142156600952148, "global_step": 359935, "epoch": 2142} {"train_loss": -12.359363555908203, "global_step": 359936, "epoch": 2142} {"train_loss": -12.322463989257812, "global_step": 359937, "epoch": 2142} {"train_loss": -12.303289413452148, "global_step": 359938, "epoch": 2142} {"train_loss": -12.183462142944336, "global_step": 359939, "epoch": 2142} {"train_loss": -12.354240417480469, "global_step": 359940, "epoch": 2142} {"train_loss": -12.19133472442627, "global_step": 359941, "epoch": 2142} {"train_loss": -12.407072067260742, "global_step": 359942, "epoch": 2142} {"train_loss": -12.211013793945312, "global_step": 359943, "epoch": 2142} {"train_loss": -12.457173347473145, "global_step": 359944, "epoch": 2142} {"train_loss": -12.118815422058105, "global_step": 359945, "epoch": 2142} {"train_loss": -12.207015991210938, "global_step": 359946, "epoch": 2142} {"train_loss": -12.18753719329834, "global_step": 359947, "epoch": 2142} {"train_loss": -11.981549263000488, "global_step": 359948, "epoch": 2142} {"train_loss": -12.293455123901367, "global_step": 359949, "epoch": 2142} {"train_loss": -12.066608428955078, "global_step": 359950, "epoch": 2142} {"train_loss": -12.265655517578125, "global_step": 359951, "epoch": 2142} {"train_loss": -12.144896507263184, "global_step": 359952, "epoch": 2142} {"train_loss": -12.320353507995605, "global_step": 359953, "epoch": 2142} {"train_loss": -11.842321395874023, "global_step": 359954, "epoch": 2142} {"train_loss": -12.417078018188477, "global_step": 359955, "epoch": 2142} {"train_loss": -12.10272216796875, "global_step": 359956, "epoch": 2142} {"train_loss": -12.202564239501953, "global_step": 359957, "epoch": 2142} {"train_loss": -12.108074188232422, "global_step": 359958, "epoch": 2142} {"train_loss": -12.065560340881348, "global_step": 359959, "epoch": 2142} {"train_loss": -12.31786823272705, "global_step": 359960, "epoch": 2142} {"train_loss": -12.24759292602539, "global_step": 359961, "epoch": 2142} {"train_loss": -12.399202346801758, "global_step": 359962, "epoch": 2142} {"train_loss": -12.249836921691895, "global_step": 359963, "epoch": 2142} {"train_loss": -12.072714805603027, "global_step": 359964, "epoch": 2142} {"train_loss": -12.2042875289917, "global_step": 359965, "epoch": 2142} {"train_loss": -12.048721313476562, "global_step": 359966, "epoch": 2142} {"train_loss": -12.284043312072754, "global_step": 359967, "epoch": 2142} {"train_loss": -11.803457260131836, "global_step": 359968, "epoch": 2142} {"train_loss": -12.065777778625488, "global_step": 359969, "epoch": 2142} {"train_loss": -12.092058181762695, "global_step": 359970, "epoch": 2142} {"train_loss": -12.235662460327148, "global_step": 359971, "epoch": 2142} {"train_loss": -12.00244140625, "global_step": 359972, "epoch": 2142} {"train_loss": -12.168570518493652, "global_step": 359973, "epoch": 2142} {"train_loss": -12.242714881896973, "global_step": 359974, "epoch": 2142} {"train_loss": -12.339277267456055, "global_step": 359975, "epoch": 2142} {"train_loss": -12.427080154418945, "global_step": 359976, "epoch": 2142} {"train_loss": -12.268836975097656, "global_step": 359977, "epoch": 2142} {"train_loss": -12.435808181762695, "global_step": 359978, "epoch": 2142} {"train_loss": -11.908185958862305, "global_step": 359979, "epoch": 2142} {"train_loss": -12.011098861694336, "global_step": 359980, "epoch": 2142} {"train_loss": -12.27825927734375, "global_step": 359981, "epoch": 2142} {"train_loss": -11.994606018066406, "global_step": 359982, "epoch": 2142} {"train_loss": -11.990838050842285, "global_step": 359983, "epoch": 2142} {"train_loss": -11.677907943725586, "global_step": 359984, "epoch": 2142} {"train_loss": -12.104284286499023, "global_step": 359985, "epoch": 2142} {"train_loss": -11.665136337280273, "global_step": 359986, "epoch": 2142} {"train_loss": -12.168800354003906, "global_step": 359987, "epoch": 2142} {"train_loss": -12.237940788269043, "global_step": 359988, "epoch": 2142} {"train_loss": -11.885793685913086, "global_step": 359989, "epoch": 2142} {"train_loss": -12.335748672485352, "global_step": 359990, "epoch": 2142} {"train_loss": -11.956068992614746, "global_step": 359991, "epoch": 2142} {"train_loss": -12.115476608276367, "global_step": 359992, "epoch": 2142} {"train_loss": -12.52404499053955, "global_step": 359993, "epoch": 2142} {"train_loss": -12.24592399597168, "global_step": 359994, "epoch": 2142} {"train_loss": -12.560409545898438, "global_step": 359995, "epoch": 2142} {"train_loss": -11.942151069641113, "global_step": 359996, "epoch": 2142} {"train_loss": -12.243551254272461, "global_step": 359997, "epoch": 2142} {"train_loss": -12.462053298950195, "global_step": 359998, "epoch": 2142} {"train_loss": -12.321733474731445, "global_step": 359999, "epoch": 2142} {"train_loss": -12.644455909729004, "global_step": 360000, "epoch": 2142} {"train_loss": -12.497819900512695, "global_step": 360001, "epoch": 2142} {"train_loss": -12.646310806274414, "global_step": 360002, "epoch": 2142} {"train_loss": -12.475082397460938, "global_step": 360003, "epoch": 2142} {"train_loss": -12.717256546020508, "global_step": 360004, "epoch": 2142} {"train_loss": -12.648483276367188, "global_step": 360005, "epoch": 2142} {"train_loss": -12.451306343078613, "global_step": 360006, "epoch": 2142} {"train_loss": -12.455925941467285, "global_step": 360007, "epoch": 2142} {"train_loss": -12.397012710571289, "global_step": 360008, "epoch": 2142} {"train_loss": -12.342729568481445, "global_step": 360009, "epoch": 2142} {"train_loss": -12.431608200073242, "global_step": 360010, "epoch": 2142} {"train_loss": -12.583097457885742, "global_step": 360011, "epoch": 2142} {"train_loss": -12.590873718261719, "global_step": 360012, "epoch": 2142} {"train_loss": -12.558530807495117, "global_step": 360013, "epoch": 2142} {"train_loss": -12.734225273132324, "global_step": 360014, "epoch": 2142} {"train_loss": -12.167200088500977, "global_step": 360015, "epoch": 2142} {"train_loss": -12.671817779541016, "global_step": 360016, "epoch": 2142} {"train_loss": -12.472206115722656, "global_step": 360017, "epoch": 2142} {"train_loss": -12.68826675415039, "global_step": 360018, "epoch": 2142} {"train_loss": -12.388941764831543, "global_step": 360019, "epoch": 2142} {"train_loss": -11.739137649536133, "global_step": 360020, "epoch": 2142} {"train_loss": -11.153735160827637, "global_step": 360021, "epoch": 2142} {"train_loss": -12.240724563598633, "global_step": 360022, "epoch": 2142} {"train_loss": -11.86324360540935, "global_step": 360023, "epoch": 2142, "val_loss": 288913.375} {"train_loss": -11.86121940612793, "global_step": 360024, "epoch": 2143} {"train_loss": -12.17755126953125, "global_step": 360025, "epoch": 2143} {"train_loss": -12.104700088500977, "global_step": 360026, "epoch": 2143} {"train_loss": -12.733235359191895, "global_step": 360027, "epoch": 2143} {"train_loss": -12.184713363647461, "global_step": 360028, "epoch": 2143} {"train_loss": -11.95903491973877, "global_step": 360029, "epoch": 2143} {"train_loss": -11.472112655639648, "global_step": 360030, "epoch": 2143} {"train_loss": -11.972309112548828, "global_step": 360031, "epoch": 2143} {"train_loss": -12.481512069702148, "global_step": 360032, "epoch": 2143} {"train_loss": -11.636030197143555, "global_step": 360033, "epoch": 2143} {"train_loss": -12.598773002624512, "global_step": 360034, "epoch": 2143} {"train_loss": -11.639213562011719, "global_step": 360035, "epoch": 2143} {"train_loss": -11.9411039352417, "global_step": 360036, "epoch": 2143} {"train_loss": -11.95318603515625, "global_step": 360037, "epoch": 2143} {"train_loss": -11.727458000183105, "global_step": 360038, "epoch": 2143} {"train_loss": -11.183046340942383, "global_step": 360039, "epoch": 2143} {"train_loss": -12.110809326171875, "global_step": 360040, "epoch": 2143} {"train_loss": -11.287801742553711, "global_step": 360041, "epoch": 2143} {"train_loss": -12.40038013458252, "global_step": 360042, "epoch": 2143} {"train_loss": -11.45101261138916, "global_step": 360043, "epoch": 2143} {"train_loss": -12.266829490661621, "global_step": 360044, "epoch": 2143} {"train_loss": -11.903142929077148, "global_step": 360045, "epoch": 2143} {"train_loss": -12.05215072631836, "global_step": 360046, "epoch": 2143} {"train_loss": -12.113253593444824, "global_step": 360047, "epoch": 2143} {"train_loss": -12.10862922668457, "global_step": 360048, "epoch": 2143} {"train_loss": -11.733339309692383, "global_step": 360049, "epoch": 2143} {"train_loss": -12.043777465820312, "global_step": 360050, "epoch": 2143} {"train_loss": -12.075552940368652, "global_step": 360051, "epoch": 2143} {"train_loss": -11.869174003601074, "global_step": 360052, "epoch": 2143} {"train_loss": -12.186727523803711, "global_step": 360053, "epoch": 2143} {"train_loss": -11.619279861450195, "global_step": 360054, "epoch": 2143} {"train_loss": -11.317079544067383, "global_step": 360055, "epoch": 2143} {"train_loss": -12.219046592712402, "global_step": 360056, "epoch": 2143} {"train_loss": -10.787801742553711, "global_step": 360057, "epoch": 2143} {"train_loss": -12.23060131072998, "global_step": 360058, "epoch": 2143} {"train_loss": -12.079208374023438, "global_step": 360059, "epoch": 2143} {"train_loss": -12.154891967773438, "global_step": 360060, "epoch": 2143} {"train_loss": -11.935138702392578, "global_step": 360061, "epoch": 2143} {"train_loss": -12.13973617553711, "global_step": 360062, "epoch": 2143} {"train_loss": -11.738997459411621, "global_step": 360063, "epoch": 2143} {"train_loss": -12.069408416748047, "global_step": 360064, "epoch": 2143} {"train_loss": -12.063339233398438, "global_step": 360065, "epoch": 2143} {"train_loss": -12.24378776550293, "global_step": 360066, "epoch": 2143} {"train_loss": -11.727495193481445, "global_step": 360067, "epoch": 2143} {"train_loss": -12.595573425292969, "global_step": 360068, "epoch": 2143} {"train_loss": -12.216917991638184, "global_step": 360069, "epoch": 2143} {"train_loss": -12.412742614746094, "global_step": 360070, "epoch": 2143} {"train_loss": -12.46037769317627, "global_step": 360071, "epoch": 2143} {"train_loss": -12.340736389160156, "global_step": 360072, "epoch": 2143} {"train_loss": -12.40181827545166, "global_step": 360073, "epoch": 2143} {"train_loss": -12.41342830657959, "global_step": 360074, "epoch": 2143} {"train_loss": -12.46995735168457, "global_step": 360075, "epoch": 2143} {"train_loss": -12.208333969116211, "global_step": 360076, "epoch": 2143} {"train_loss": -12.167339324951172, "global_step": 360077, "epoch": 2143} {"train_loss": -11.99837875366211, "global_step": 360078, "epoch": 2143} {"train_loss": -12.514225959777832, "global_step": 360079, "epoch": 2143} {"train_loss": -12.143087387084961, "global_step": 360080, "epoch": 2143} {"train_loss": -12.278402328491211, "global_step": 360081, "epoch": 2143} {"train_loss": -12.536821365356445, "global_step": 360082, "epoch": 2143} {"train_loss": -12.290637969970703, "global_step": 360083, "epoch": 2143} {"train_loss": -12.110363006591797, "global_step": 360084, "epoch": 2143} {"train_loss": -12.559950828552246, "global_step": 360085, "epoch": 2143} {"train_loss": -12.313192367553711, "global_step": 360086, "epoch": 2143} {"train_loss": -12.004867553710938, "global_step": 360087, "epoch": 2143} {"train_loss": -12.153520584106445, "global_step": 360088, "epoch": 2143} {"train_loss": -12.346908569335938, "global_step": 360089, "epoch": 2143} {"train_loss": -12.317837715148926, "global_step": 360090, "epoch": 2143} {"train_loss": -12.587438583374023, "global_step": 360091, "epoch": 2143} {"train_loss": -12.567420959472656, "global_step": 360092, "epoch": 2143} {"train_loss": -12.572608947753906, "global_step": 360093, "epoch": 2143} {"train_loss": -12.498876571655273, "global_step": 360094, "epoch": 2143} {"train_loss": -12.662281036376953, "global_step": 360095, "epoch": 2143} {"train_loss": -12.286500930786133, "global_step": 360096, "epoch": 2143} {"train_loss": -12.382637023925781, "global_step": 360097, "epoch": 2143} {"train_loss": -12.67049789428711, "global_step": 360098, "epoch": 2143} {"train_loss": -12.758679389953613, "global_step": 360099, "epoch": 2143} {"train_loss": -12.632617950439453, "global_step": 360100, "epoch": 2143} {"train_loss": -12.431676864624023, "global_step": 360101, "epoch": 2143} {"train_loss": -12.743908882141113, "global_step": 360102, "epoch": 2143} {"train_loss": -12.250223159790039, "global_step": 360103, "epoch": 2143} {"train_loss": -12.667927742004395, "global_step": 360104, "epoch": 2143} {"train_loss": -12.671170234680176, "global_step": 360105, "epoch": 2143} {"train_loss": -12.497791290283203, "global_step": 360106, "epoch": 2143} {"train_loss": -12.364582061767578, "global_step": 360107, "epoch": 2143} {"train_loss": -12.668872833251953, "global_step": 360108, "epoch": 2143} {"train_loss": -12.397894859313965, "global_step": 360109, "epoch": 2143} {"train_loss": -12.768924713134766, "global_step": 360110, "epoch": 2143} {"train_loss": -12.45292854309082, "global_step": 360111, "epoch": 2143} {"train_loss": -12.82558536529541, "global_step": 360112, "epoch": 2143} {"train_loss": -12.43557071685791, "global_step": 360113, "epoch": 2143} {"train_loss": -12.605997085571289, "global_step": 360114, "epoch": 2143} {"train_loss": -12.331686019897461, "global_step": 360115, "epoch": 2143} {"train_loss": -12.350383758544922, "global_step": 360116, "epoch": 2143} {"train_loss": -12.645572662353516, "global_step": 360117, "epoch": 2143} {"train_loss": -12.751276016235352, "global_step": 360118, "epoch": 2143} {"train_loss": -12.247040748596191, "global_step": 360119, "epoch": 2143} {"train_loss": -12.379777908325195, "global_step": 360120, "epoch": 2143} {"train_loss": -12.328657150268555, "global_step": 360121, "epoch": 2143} {"train_loss": -12.742117881774902, "global_step": 360122, "epoch": 2143} {"train_loss": -12.610686302185059, "global_step": 360123, "epoch": 2143} {"train_loss": -12.5484619140625, "global_step": 360124, "epoch": 2143} {"train_loss": -12.250900268554688, "global_step": 360125, "epoch": 2143} {"train_loss": -12.359798431396484, "global_step": 360126, "epoch": 2143} {"train_loss": -12.187761306762695, "global_step": 360127, "epoch": 2143} {"train_loss": -11.271586418151855, "global_step": 360128, "epoch": 2143} {"train_loss": -11.06403923034668, "global_step": 360129, "epoch": 2143} {"train_loss": -11.195723533630371, "global_step": 360130, "epoch": 2143} {"train_loss": -10.93752670288086, "global_step": 360131, "epoch": 2143} {"train_loss": -10.4548978805542, "global_step": 360132, "epoch": 2143} {"train_loss": -10.068075180053711, "global_step": 360133, "epoch": 2143} {"train_loss": -8.423529624938965, "global_step": 360134, "epoch": 2143} {"train_loss": -7.380108833312988, "global_step": 360135, "epoch": 2143} {"train_loss": -8.054445266723633, "global_step": 360136, "epoch": 2143} {"train_loss": -7.9014739990234375, "global_step": 360137, "epoch": 2143} {"train_loss": -7.683175563812256, "global_step": 360138, "epoch": 2143} {"train_loss": -8.779129028320312, "global_step": 360139, "epoch": 2143} {"train_loss": -8.541803359985352, "global_step": 360140, "epoch": 2143} {"train_loss": -8.625322341918945, "global_step": 360141, "epoch": 2143} {"train_loss": -8.594747543334961, "global_step": 360142, "epoch": 2143} {"train_loss": -9.003080368041992, "global_step": 360143, "epoch": 2143} {"train_loss": -8.359825134277344, "global_step": 360144, "epoch": 2143} {"train_loss": -8.828287124633789, "global_step": 360145, "epoch": 2143} {"train_loss": -9.41542911529541, "global_step": 360146, "epoch": 2143} {"train_loss": -10.438053131103516, "global_step": 360147, "epoch": 2143} {"train_loss": -10.154058456420898, "global_step": 360148, "epoch": 2143} {"train_loss": -11.028680801391602, "global_step": 360149, "epoch": 2143} {"train_loss": -10.180904388427734, "global_step": 360150, "epoch": 2143} {"train_loss": -10.543890953063965, "global_step": 360151, "epoch": 2143} {"train_loss": -9.766862869262695, "global_step": 360152, "epoch": 2143} {"train_loss": -10.326457977294922, "global_step": 360153, "epoch": 2143} {"train_loss": -10.642322540283203, "global_step": 360154, "epoch": 2143} {"train_loss": -10.395235061645508, "global_step": 360155, "epoch": 2143} {"train_loss": -10.023879051208496, "global_step": 360156, "epoch": 2143} {"train_loss": -11.565520286560059, "global_step": 360157, "epoch": 2143} {"train_loss": -10.31762409210205, "global_step": 360158, "epoch": 2143} {"train_loss": -11.178984642028809, "global_step": 360159, "epoch": 2143} {"train_loss": -10.112442016601562, "global_step": 360160, "epoch": 2143} {"train_loss": -11.287461280822754, "global_step": 360161, "epoch": 2143} {"train_loss": -9.108453750610352, "global_step": 360162, "epoch": 2143} {"train_loss": -11.346019744873047, "global_step": 360163, "epoch": 2143} {"train_loss": -10.877606391906738, "global_step": 360164, "epoch": 2143} {"train_loss": -11.425372123718262, "global_step": 360165, "epoch": 2143} {"train_loss": -10.856571197509766, "global_step": 360166, "epoch": 2143} {"train_loss": -11.7193603515625, "global_step": 360167, "epoch": 2143} {"train_loss": -10.86203384399414, "global_step": 360168, "epoch": 2143} {"train_loss": -11.98384952545166, "global_step": 360169, "epoch": 2143} {"train_loss": -11.391129493713379, "global_step": 360170, "epoch": 2143} {"train_loss": -11.38097095489502, "global_step": 360171, "epoch": 2143} {"train_loss": -11.735161781311035, "global_step": 360172, "epoch": 2143} {"train_loss": -11.614038467407227, "global_step": 360173, "epoch": 2143} {"train_loss": -11.770915031433105, "global_step": 360174, "epoch": 2143} {"train_loss": -11.735762596130371, "global_step": 360175, "epoch": 2143} {"train_loss": -12.229153633117676, "global_step": 360176, "epoch": 2143} {"train_loss": -11.892672538757324, "global_step": 360177, "epoch": 2143} {"train_loss": -11.858039855957031, "global_step": 360178, "epoch": 2143} {"train_loss": -11.865726470947266, "global_step": 360179, "epoch": 2143} {"train_loss": -12.0176362991333, "global_step": 360180, "epoch": 2143} {"train_loss": -11.9959077835083, "global_step": 360181, "epoch": 2143} {"train_loss": -12.120986938476562, "global_step": 360182, "epoch": 2143} {"train_loss": -12.318765640258789, "global_step": 360183, "epoch": 2143} {"train_loss": -12.156332015991211, "global_step": 360184, "epoch": 2143} {"train_loss": -12.217691421508789, "global_step": 360185, "epoch": 2143} {"train_loss": -12.2316255569458, "global_step": 360186, "epoch": 2143} {"train_loss": -12.160196304321289, "global_step": 360187, "epoch": 2143} {"train_loss": -12.252647399902344, "global_step": 360188, "epoch": 2143} {"train_loss": -12.480384826660156, "global_step": 360189, "epoch": 2143} {"train_loss": -12.122329711914062, "global_step": 360190, "epoch": 2143} {"train_loss": -11.646401703357697, "global_step": 360191, "epoch": 2143, "val_loss": 291898.59375} {"train_loss": -12.203399658203125, "global_step": 360192, "epoch": 2144} {"train_loss": -12.208345413208008, "global_step": 360193, "epoch": 2144} {"train_loss": -12.351017951965332, "global_step": 360194, "epoch": 2144} {"train_loss": -12.102030754089355, "global_step": 360195, "epoch": 2144} {"train_loss": -12.344620704650879, "global_step": 360196, "epoch": 2144} {"train_loss": -12.367568969726562, "global_step": 360197, "epoch": 2144} {"train_loss": -12.317842483520508, "global_step": 360198, "epoch": 2144} {"train_loss": -12.13757038116455, "global_step": 360199, "epoch": 2144} {"train_loss": -12.213996887207031, "global_step": 360200, "epoch": 2144} {"train_loss": -12.105910301208496, "global_step": 360201, "epoch": 2144} {"train_loss": -12.243432998657227, "global_step": 360202, "epoch": 2144} {"train_loss": -12.312651634216309, "global_step": 360203, "epoch": 2144} {"train_loss": -12.561909675598145, "global_step": 360204, "epoch": 2144} {"train_loss": -12.396895408630371, "global_step": 360205, "epoch": 2144} {"train_loss": -12.550665855407715, "global_step": 360206, "epoch": 2144} {"train_loss": -12.425790786743164, "global_step": 360207, "epoch": 2144} {"train_loss": -12.482748031616211, "global_step": 360208, "epoch": 2144} {"train_loss": -12.26231575012207, "global_step": 360209, "epoch": 2144} {"train_loss": -12.531164169311523, "global_step": 360210, "epoch": 2144} {"train_loss": -12.390069007873535, "global_step": 360211, "epoch": 2144} {"train_loss": -12.4912109375, "global_step": 360212, "epoch": 2144} {"train_loss": -12.516206741333008, "global_step": 360213, "epoch": 2144} {"train_loss": -12.520496368408203, "global_step": 360214, "epoch": 2144} {"train_loss": -12.44039249420166, "global_step": 360215, "epoch": 2144} {"train_loss": -12.592512130737305, "global_step": 360216, "epoch": 2144} {"train_loss": -12.494985580444336, "global_step": 360217, "epoch": 2144} {"train_loss": -12.477852821350098, "global_step": 360218, "epoch": 2144} {"train_loss": -12.52880859375, "global_step": 360219, "epoch": 2144} {"train_loss": -12.61520004272461, "global_step": 360220, "epoch": 2144} {"train_loss": -12.665254592895508, "global_step": 360221, "epoch": 2144} {"train_loss": -12.23705768585205, "global_step": 360222, "epoch": 2144} {"train_loss": -12.482000350952148, "global_step": 360223, "epoch": 2144} {"train_loss": -12.699917793273926, "global_step": 360224, "epoch": 2144} {"train_loss": -12.471484184265137, "global_step": 360225, "epoch": 2144} {"train_loss": -12.491790771484375, "global_step": 360226, "epoch": 2144} {"train_loss": -12.413261413574219, "global_step": 360227, "epoch": 2144} {"train_loss": -12.782307624816895, "global_step": 360228, "epoch": 2144} {"train_loss": -12.479141235351562, "global_step": 360229, "epoch": 2144} {"train_loss": -12.515751838684082, "global_step": 360230, "epoch": 2144} {"train_loss": -12.27314567565918, "global_step": 360231, "epoch": 2144} {"train_loss": -12.670389175415039, "global_step": 360232, "epoch": 2144} {"train_loss": -12.626001358032227, "global_step": 360233, "epoch": 2144} {"train_loss": -12.464935302734375, "global_step": 360234, "epoch": 2144} {"train_loss": -12.564990997314453, "global_step": 360235, "epoch": 2144} {"train_loss": -12.641538619995117, "global_step": 360236, "epoch": 2144} {"train_loss": -12.595195770263672, "global_step": 360237, "epoch": 2144} {"train_loss": -12.774700164794922, "global_step": 360238, "epoch": 2144} {"train_loss": -12.651330947875977, "global_step": 360239, "epoch": 2144} {"train_loss": -12.637336730957031, "global_step": 360240, "epoch": 2144} {"train_loss": -12.73414421081543, "global_step": 360241, "epoch": 2144} {"train_loss": -12.68226432800293, "global_step": 360242, "epoch": 2144} {"train_loss": -12.645709991455078, "global_step": 360243, "epoch": 2144} {"train_loss": -12.659177780151367, "global_step": 360244, "epoch": 2144} {"train_loss": -12.672979354858398, "global_step": 360245, "epoch": 2144} {"train_loss": -12.583940505981445, "global_step": 360246, "epoch": 2144} {"train_loss": -12.541489601135254, "global_step": 360247, "epoch": 2144} {"train_loss": -12.53860855102539, "global_step": 360248, "epoch": 2144} {"train_loss": -12.639307975769043, "global_step": 360249, "epoch": 2144} {"train_loss": -12.29449462890625, "global_step": 360250, "epoch": 2144} {"train_loss": -12.699028015136719, "global_step": 360251, "epoch": 2144} {"train_loss": -12.635217666625977, "global_step": 360252, "epoch": 2144} {"train_loss": -12.52352523803711, "global_step": 360253, "epoch": 2144} {"train_loss": -12.538576126098633, "global_step": 360254, "epoch": 2144} {"train_loss": -12.372480392456055, "global_step": 360255, "epoch": 2144} {"train_loss": -12.880136489868164, "global_step": 360256, "epoch": 2144} {"train_loss": -12.644777297973633, "global_step": 360257, "epoch": 2144} {"train_loss": -12.406949996948242, "global_step": 360258, "epoch": 2144} {"train_loss": -12.673203468322754, "global_step": 360259, "epoch": 2144} {"train_loss": -12.620424270629883, "global_step": 360260, "epoch": 2144} {"train_loss": -12.356223106384277, "global_step": 360261, "epoch": 2144} {"train_loss": -12.464140892028809, "global_step": 360262, "epoch": 2144} {"train_loss": -12.351717948913574, "global_step": 360263, "epoch": 2144} {"train_loss": -11.74826431274414, "global_step": 360264, "epoch": 2144} {"train_loss": -11.053747177124023, "global_step": 360265, "epoch": 2144} {"train_loss": -11.580913543701172, "global_step": 360266, "epoch": 2144} {"train_loss": -11.093754768371582, "global_step": 360267, "epoch": 2144} {"train_loss": -11.255620956420898, "global_step": 360268, "epoch": 2144} {"train_loss": -11.823175430297852, "global_step": 360269, "epoch": 2144} {"train_loss": -11.66797924041748, "global_step": 360270, "epoch": 2144} {"train_loss": -10.917622566223145, "global_step": 360271, "epoch": 2144} {"train_loss": -11.159965515136719, "global_step": 360272, "epoch": 2144} {"train_loss": -11.498727798461914, "global_step": 360273, "epoch": 2144} {"train_loss": -11.875923156738281, "global_step": 360274, "epoch": 2144} {"train_loss": -10.2984619140625, "global_step": 360275, "epoch": 2144} {"train_loss": -10.709966659545898, "global_step": 360276, "epoch": 2144} {"train_loss": -10.955621719360352, "global_step": 360277, "epoch": 2144} {"train_loss": -10.043046951293945, "global_step": 360278, "epoch": 2144} {"train_loss": -11.68269157409668, "global_step": 360279, "epoch": 2144} {"train_loss": -10.122844696044922, "global_step": 360280, "epoch": 2144} {"train_loss": -11.353199005126953, "global_step": 360281, "epoch": 2144} {"train_loss": -9.173437118530273, "global_step": 360282, "epoch": 2144} {"train_loss": -9.000919342041016, "global_step": 360283, "epoch": 2144} {"train_loss": -7.835171699523926, "global_step": 360284, "epoch": 2144} {"train_loss": -9.033035278320312, "global_step": 360285, "epoch": 2144} {"train_loss": -8.685033798217773, "global_step": 360286, "epoch": 2144} {"train_loss": -10.575319290161133, "global_step": 360287, "epoch": 2144} {"train_loss": -9.42637825012207, "global_step": 360288, "epoch": 2144} {"train_loss": -8.992506980895996, "global_step": 360289, "epoch": 2144} {"train_loss": -9.916311264038086, "global_step": 360290, "epoch": 2144} {"train_loss": -10.032571792602539, "global_step": 360291, "epoch": 2144} {"train_loss": -8.915727615356445, "global_step": 360292, "epoch": 2144} {"train_loss": -10.116111755371094, "global_step": 360293, "epoch": 2144} {"train_loss": -10.2330322265625, "global_step": 360294, "epoch": 2144} {"train_loss": -10.368310928344727, "global_step": 360295, "epoch": 2144} {"train_loss": -10.59122085571289, "global_step": 360296, "epoch": 2144} {"train_loss": -10.071216583251953, "global_step": 360297, "epoch": 2144} {"train_loss": -10.05862808227539, "global_step": 360298, "epoch": 2144} {"train_loss": -9.528742790222168, "global_step": 360299, "epoch": 2144} {"train_loss": -10.577007293701172, "global_step": 360300, "epoch": 2144} {"train_loss": -11.112000465393066, "global_step": 360301, "epoch": 2144} {"train_loss": -11.151213645935059, "global_step": 360302, "epoch": 2144} {"train_loss": -10.269792556762695, "global_step": 360303, "epoch": 2144} {"train_loss": -11.129951477050781, "global_step": 360304, "epoch": 2144} {"train_loss": -11.059886932373047, "global_step": 360305, "epoch": 2144} {"train_loss": -11.206903457641602, "global_step": 360306, "epoch": 2144} {"train_loss": -10.856405258178711, "global_step": 360307, "epoch": 2144} {"train_loss": -11.338757514953613, "global_step": 360308, "epoch": 2144} {"train_loss": -11.018503189086914, "global_step": 360309, "epoch": 2144} {"train_loss": -11.358685493469238, "global_step": 360310, "epoch": 2144} {"train_loss": -11.097824096679688, "global_step": 360311, "epoch": 2144} {"train_loss": -11.15953540802002, "global_step": 360312, "epoch": 2144} {"train_loss": -10.555912971496582, "global_step": 360313, "epoch": 2144} {"train_loss": -11.08232307434082, "global_step": 360314, "epoch": 2144} {"train_loss": -10.871917724609375, "global_step": 360315, "epoch": 2144} {"train_loss": -11.265056610107422, "global_step": 360316, "epoch": 2144} {"train_loss": -11.566556930541992, "global_step": 360317, "epoch": 2144} {"train_loss": -11.11021900177002, "global_step": 360318, "epoch": 2144} {"train_loss": -11.132487297058105, "global_step": 360319, "epoch": 2144} {"train_loss": -11.452567100524902, "global_step": 360320, "epoch": 2144} {"train_loss": -11.115913391113281, "global_step": 360321, "epoch": 2144} {"train_loss": -11.674264907836914, "global_step": 360322, "epoch": 2144} {"train_loss": -11.494537353515625, "global_step": 360323, "epoch": 2144} {"train_loss": -11.099664688110352, "global_step": 360324, "epoch": 2144} {"train_loss": -11.548609733581543, "global_step": 360325, "epoch": 2144} {"train_loss": -11.293525695800781, "global_step": 360326, "epoch": 2144} {"train_loss": -12.086013793945312, "global_step": 360327, "epoch": 2144} {"train_loss": -11.796745300292969, "global_step": 360328, "epoch": 2144} {"train_loss": -11.848760604858398, "global_step": 360329, "epoch": 2144} {"train_loss": -11.544214248657227, "global_step": 360330, "epoch": 2144} {"train_loss": -11.356440544128418, "global_step": 360331, "epoch": 2144} {"train_loss": -11.914726257324219, "global_step": 360332, "epoch": 2144} {"train_loss": -11.432299613952637, "global_step": 360333, "epoch": 2144} {"train_loss": -11.609884262084961, "global_step": 360334, "epoch": 2144} {"train_loss": -11.887847900390625, "global_step": 360335, "epoch": 2144} {"train_loss": -11.996373176574707, "global_step": 360336, "epoch": 2144} {"train_loss": -11.615304946899414, "global_step": 360337, "epoch": 2144} {"train_loss": -12.064180374145508, "global_step": 360338, "epoch": 2144} {"train_loss": -11.643369674682617, "global_step": 360339, "epoch": 2144} {"train_loss": -12.117774963378906, "global_step": 360340, "epoch": 2144} {"train_loss": -11.774093627929688, "global_step": 360341, "epoch": 2144} {"train_loss": -11.852842330932617, "global_step": 360342, "epoch": 2144} {"train_loss": -11.832529067993164, "global_step": 360343, "epoch": 2144} {"train_loss": -12.22775650024414, "global_step": 360344, "epoch": 2144} {"train_loss": -12.077122688293457, "global_step": 360345, "epoch": 2144} {"train_loss": -12.233570098876953, "global_step": 360346, "epoch": 2144} {"train_loss": -12.049091339111328, "global_step": 360347, "epoch": 2144} {"train_loss": -12.230920791625977, "global_step": 360348, "epoch": 2144} {"train_loss": -12.206384658813477, "global_step": 360349, "epoch": 2144} {"train_loss": -12.02035140991211, "global_step": 360350, "epoch": 2144} {"train_loss": -12.085311889648438, "global_step": 360351, "epoch": 2144} {"train_loss": -11.994710922241211, "global_step": 360352, "epoch": 2144} {"train_loss": -11.657268524169922, "global_step": 360353, "epoch": 2144} {"train_loss": -12.14894962310791, "global_step": 360354, "epoch": 2144} {"train_loss": -12.00515365600586, "global_step": 360355, "epoch": 2144} {"train_loss": -12.124757766723633, "global_step": 360356, "epoch": 2144} {"train_loss": -12.382682800292969, "global_step": 360357, "epoch": 2144} {"train_loss": -12.121936798095703, "global_step": 360358, "epoch": 2144} {"train_loss": -11.710552828652519, "global_step": 360359, "epoch": 2144, "val_loss": 294555.21875} {"train_loss": -12.356964111328125, "global_step": 360360, "epoch": 2145} {"train_loss": -12.197263717651367, "global_step": 360361, "epoch": 2145} {"train_loss": -12.452386856079102, "global_step": 360362, "epoch": 2145} {"train_loss": -12.201883316040039, "global_step": 360363, "epoch": 2145} {"train_loss": -12.36101245880127, "global_step": 360364, "epoch": 2145} {"train_loss": -12.439874649047852, "global_step": 360365, "epoch": 2145} {"train_loss": -12.227743148803711, "global_step": 360366, "epoch": 2145} {"train_loss": -12.326095581054688, "global_step": 360367, "epoch": 2145} {"train_loss": -12.420689582824707, "global_step": 360368, "epoch": 2145} {"train_loss": -12.1043701171875, "global_step": 360369, "epoch": 2145} {"train_loss": -12.41326904296875, "global_step": 360370, "epoch": 2145} {"train_loss": -12.098913192749023, "global_step": 360371, "epoch": 2145} {"train_loss": -12.378292083740234, "global_step": 360372, "epoch": 2145} {"train_loss": -12.247966766357422, "global_step": 360373, "epoch": 2145} {"train_loss": -12.39318561553955, "global_step": 360374, "epoch": 2145} {"train_loss": -12.447761535644531, "global_step": 360375, "epoch": 2145} {"train_loss": -12.588480949401855, "global_step": 360376, "epoch": 2145} {"train_loss": -12.288091659545898, "global_step": 360377, "epoch": 2145} {"train_loss": -12.15644359588623, "global_step": 360378, "epoch": 2145} {"train_loss": -12.28093433380127, "global_step": 360379, "epoch": 2145} {"train_loss": -12.365108489990234, "global_step": 360380, "epoch": 2145} {"train_loss": -12.325658798217773, "global_step": 360381, "epoch": 2145} {"train_loss": -12.387397766113281, "global_step": 360382, "epoch": 2145} {"train_loss": -12.12283992767334, "global_step": 360383, "epoch": 2145} {"train_loss": -12.248784065246582, "global_step": 360384, "epoch": 2145} {"train_loss": -12.022814750671387, "global_step": 360385, "epoch": 2145} {"train_loss": -12.517194747924805, "global_step": 360386, "epoch": 2145} {"train_loss": -12.036946296691895, "global_step": 360387, "epoch": 2145} {"train_loss": -12.365250587463379, "global_step": 360388, "epoch": 2145} {"train_loss": -11.72342300415039, "global_step": 360389, "epoch": 2145} {"train_loss": -12.220577239990234, "global_step": 360390, "epoch": 2145} {"train_loss": -12.001229286193848, "global_step": 360391, "epoch": 2145} {"train_loss": -12.03358268737793, "global_step": 360392, "epoch": 2145} {"train_loss": -12.46432876586914, "global_step": 360393, "epoch": 2145} {"train_loss": -12.103771209716797, "global_step": 360394, "epoch": 2145} {"train_loss": -12.511445045471191, "global_step": 360395, "epoch": 2145} {"train_loss": -12.333511352539062, "global_step": 360396, "epoch": 2145} {"train_loss": -12.182703018188477, "global_step": 360397, "epoch": 2145} {"train_loss": -11.81978988647461, "global_step": 360398, "epoch": 2145} {"train_loss": -12.310575485229492, "global_step": 360399, "epoch": 2145} {"train_loss": -12.28164291381836, "global_step": 360400, "epoch": 2145} {"train_loss": -12.087185859680176, "global_step": 360401, "epoch": 2145} {"train_loss": -12.336018562316895, "global_step": 360402, "epoch": 2145} {"train_loss": -11.94440746307373, "global_step": 360403, "epoch": 2145} {"train_loss": -12.36384391784668, "global_step": 360404, "epoch": 2145} {"train_loss": -11.57109546661377, "global_step": 360405, "epoch": 2145} {"train_loss": -12.444950103759766, "global_step": 360406, "epoch": 2145} {"train_loss": -11.750142097473145, "global_step": 360407, "epoch": 2145} {"train_loss": -12.632959365844727, "global_step": 360408, "epoch": 2145} {"train_loss": -12.277388572692871, "global_step": 360409, "epoch": 2145} {"train_loss": -12.484018325805664, "global_step": 360410, "epoch": 2145} {"train_loss": -12.13275146484375, "global_step": 360411, "epoch": 2145} {"train_loss": -11.890279769897461, "global_step": 360412, "epoch": 2145} {"train_loss": -12.287043571472168, "global_step": 360413, "epoch": 2145} {"train_loss": -12.446026802062988, "global_step": 360414, "epoch": 2145} {"train_loss": -12.16821575164795, "global_step": 360415, "epoch": 2145} {"train_loss": -11.997693061828613, "global_step": 360416, "epoch": 2145} {"train_loss": -12.38966178894043, "global_step": 360417, "epoch": 2145} {"train_loss": -12.450061798095703, "global_step": 360418, "epoch": 2145} {"train_loss": -12.279306411743164, "global_step": 360419, "epoch": 2145} {"train_loss": -12.117105484008789, "global_step": 360420, "epoch": 2145} {"train_loss": -12.476791381835938, "global_step": 360421, "epoch": 2145} {"train_loss": -11.893333435058594, "global_step": 360422, "epoch": 2145} {"train_loss": -12.296199798583984, "global_step": 360423, "epoch": 2145} {"train_loss": -12.431721687316895, "global_step": 360424, "epoch": 2145} {"train_loss": -11.87733268737793, "global_step": 360425, "epoch": 2145} {"train_loss": -12.351085662841797, "global_step": 360426, "epoch": 2145} {"train_loss": -11.88228702545166, "global_step": 360427, "epoch": 2145} {"train_loss": -12.148932456970215, "global_step": 360428, "epoch": 2145} {"train_loss": -11.748662948608398, "global_step": 360429, "epoch": 2145} {"train_loss": -12.395401954650879, "global_step": 360430, "epoch": 2145} {"train_loss": -11.683664321899414, "global_step": 360431, "epoch": 2145} {"train_loss": -12.203764915466309, "global_step": 360432, "epoch": 2145} {"train_loss": -11.665475845336914, "global_step": 360433, "epoch": 2145} {"train_loss": -12.434165954589844, "global_step": 360434, "epoch": 2145} {"train_loss": -11.961862564086914, "global_step": 360435, "epoch": 2145} {"train_loss": -11.950556755065918, "global_step": 360436, "epoch": 2145} {"train_loss": -12.217689514160156, "global_step": 360437, "epoch": 2145} {"train_loss": -10.941276550292969, "global_step": 360438, "epoch": 2145} {"train_loss": -11.986570358276367, "global_step": 360439, "epoch": 2145} {"train_loss": -11.823431015014648, "global_step": 360440, "epoch": 2145} {"train_loss": -12.188575744628906, "global_step": 360441, "epoch": 2145} {"train_loss": -11.778899192810059, "global_step": 360442, "epoch": 2145} {"train_loss": -12.130637168884277, "global_step": 360443, "epoch": 2145} {"train_loss": -12.005508422851562, "global_step": 360444, "epoch": 2145} {"train_loss": -12.15178108215332, "global_step": 360445, "epoch": 2145} {"train_loss": -12.04012680053711, "global_step": 360446, "epoch": 2145} {"train_loss": -11.8704833984375, "global_step": 360447, "epoch": 2145} {"train_loss": -12.255281448364258, "global_step": 360448, "epoch": 2145} {"train_loss": -11.641361236572266, "global_step": 360449, "epoch": 2145} {"train_loss": -12.010476112365723, "global_step": 360450, "epoch": 2145} {"train_loss": -12.476581573486328, "global_step": 360451, "epoch": 2145} {"train_loss": -12.20260238647461, "global_step": 360452, "epoch": 2145} {"train_loss": -12.172517776489258, "global_step": 360453, "epoch": 2145} {"train_loss": -12.503047943115234, "global_step": 360454, "epoch": 2145} {"train_loss": -12.457704544067383, "global_step": 360455, "epoch": 2145} {"train_loss": -12.346424102783203, "global_step": 360456, "epoch": 2145} {"train_loss": -12.198512077331543, "global_step": 360457, "epoch": 2145} {"train_loss": -12.432472229003906, "global_step": 360458, "epoch": 2145} {"train_loss": -12.33449935913086, "global_step": 360459, "epoch": 2145} {"train_loss": -12.151735305786133, "global_step": 360460, "epoch": 2145} {"train_loss": -12.564218521118164, "global_step": 360461, "epoch": 2145} {"train_loss": -12.053898811340332, "global_step": 360462, "epoch": 2145} {"train_loss": -12.210211753845215, "global_step": 360463, "epoch": 2145} {"train_loss": -11.697212219238281, "global_step": 360464, "epoch": 2145} {"train_loss": -12.596436500549316, "global_step": 360465, "epoch": 2145} {"train_loss": -12.101214408874512, "global_step": 360466, "epoch": 2145} {"train_loss": -12.315773010253906, "global_step": 360467, "epoch": 2145} {"train_loss": -11.975301742553711, "global_step": 360468, "epoch": 2145} {"train_loss": -12.238710403442383, "global_step": 360469, "epoch": 2145} {"train_loss": -11.979379653930664, "global_step": 360470, "epoch": 2145} {"train_loss": -12.019710540771484, "global_step": 360471, "epoch": 2145} {"train_loss": -11.930105209350586, "global_step": 360472, "epoch": 2145} {"train_loss": -12.292981147766113, "global_step": 360473, "epoch": 2145} {"train_loss": -12.0289306640625, "global_step": 360474, "epoch": 2145} {"train_loss": -11.924726486206055, "global_step": 360475, "epoch": 2145} {"train_loss": -11.568506240844727, "global_step": 360476, "epoch": 2145} {"train_loss": -11.771207809448242, "global_step": 360477, "epoch": 2145} {"train_loss": -12.152532577514648, "global_step": 360478, "epoch": 2145} {"train_loss": -11.751121520996094, "global_step": 360479, "epoch": 2145} {"train_loss": -11.948663711547852, "global_step": 360480, "epoch": 2145} {"train_loss": -11.915848731994629, "global_step": 360481, "epoch": 2145} {"train_loss": -11.976064682006836, "global_step": 360482, "epoch": 2145} {"train_loss": -11.84278678894043, "global_step": 360483, "epoch": 2145} {"train_loss": -11.106925964355469, "global_step": 360484, "epoch": 2145} {"train_loss": -10.757311820983887, "global_step": 360485, "epoch": 2145} {"train_loss": -10.022298812866211, "global_step": 360486, "epoch": 2145} {"train_loss": -11.652095794677734, "global_step": 360487, "epoch": 2145} {"train_loss": -8.959125518798828, "global_step": 360488, "epoch": 2145} {"train_loss": -10.76132869720459, "global_step": 360489, "epoch": 2145} {"train_loss": -10.037683486938477, "global_step": 360490, "epoch": 2145} {"train_loss": -10.241076469421387, "global_step": 360491, "epoch": 2145} {"train_loss": -10.633073806762695, "global_step": 360492, "epoch": 2145} {"train_loss": -10.657546997070312, "global_step": 360493, "epoch": 2145} {"train_loss": -10.155080795288086, "global_step": 360494, "epoch": 2145} {"train_loss": -10.12704086303711, "global_step": 360495, "epoch": 2145} {"train_loss": -11.159523010253906, "global_step": 360496, "epoch": 2145} {"train_loss": -10.710063934326172, "global_step": 360497, "epoch": 2145} {"train_loss": -11.193280220031738, "global_step": 360498, "epoch": 2145} {"train_loss": -10.499950408935547, "global_step": 360499, "epoch": 2145} {"train_loss": -11.959901809692383, "global_step": 360500, "epoch": 2145} {"train_loss": -11.064920425415039, "global_step": 360501, "epoch": 2145} {"train_loss": -11.806404113769531, "global_step": 360502, "epoch": 2145} {"train_loss": -10.70674991607666, "global_step": 360503, "epoch": 2145} {"train_loss": -11.504637718200684, "global_step": 360504, "epoch": 2145} {"train_loss": -11.229143142700195, "global_step": 360505, "epoch": 2145} {"train_loss": -11.791277885437012, "global_step": 360506, "epoch": 2145} {"train_loss": -11.525186538696289, "global_step": 360507, "epoch": 2145} {"train_loss": -12.276958465576172, "global_step": 360508, "epoch": 2145} {"train_loss": -11.75500774383545, "global_step": 360509, "epoch": 2145} {"train_loss": -12.271827697753906, "global_step": 360510, "epoch": 2145} {"train_loss": -11.849120140075684, "global_step": 360511, "epoch": 2145} {"train_loss": -12.259214401245117, "global_step": 360512, "epoch": 2145} {"train_loss": -12.111604690551758, "global_step": 360513, "epoch": 2145} {"train_loss": -12.060564041137695, "global_step": 360514, "epoch": 2145} {"train_loss": -12.159646034240723, "global_step": 360515, "epoch": 2145} {"train_loss": -12.282257080078125, "global_step": 360516, "epoch": 2145} {"train_loss": -12.108378410339355, "global_step": 360517, "epoch": 2145} {"train_loss": -12.175923347473145, "global_step": 360518, "epoch": 2145} {"train_loss": -12.254536628723145, "global_step": 360519, "epoch": 2145} {"train_loss": -12.385598182678223, "global_step": 360520, "epoch": 2145} {"train_loss": -12.003324508666992, "global_step": 360521, "epoch": 2145} {"train_loss": -12.371265411376953, "global_step": 360522, "epoch": 2145} {"train_loss": -11.957479476928711, "global_step": 360523, "epoch": 2145} {"train_loss": -12.322975158691406, "global_step": 360524, "epoch": 2145} {"train_loss": -12.222103118896484, "global_step": 360525, "epoch": 2145} {"train_loss": -12.443061828613281, "global_step": 360526, "epoch": 2145} {"train_loss": -11.972090692747207, "global_step": 360527, "epoch": 2145, "val_loss": 292490.625, "train_action_mse_error": 0.9389398097991943} {"train_loss": -12.406347274780273, "global_step": 360528, "epoch": 2146} {"train_loss": -12.369080543518066, "global_step": 360529, "epoch": 2146} {"train_loss": -12.435819625854492, "global_step": 360530, "epoch": 2146} {"train_loss": -12.235544204711914, "global_step": 360531, "epoch": 2146} {"train_loss": -12.210336685180664, "global_step": 360532, "epoch": 2146} {"train_loss": -12.550683975219727, "global_step": 360533, "epoch": 2146} {"train_loss": -12.328367233276367, "global_step": 360534, "epoch": 2146} {"train_loss": -12.274121284484863, "global_step": 360535, "epoch": 2146} {"train_loss": -12.34665584564209, "global_step": 360536, "epoch": 2146} {"train_loss": -12.490392684936523, "global_step": 360537, "epoch": 2146} {"train_loss": -12.180061340332031, "global_step": 360538, "epoch": 2146} {"train_loss": -12.543428421020508, "global_step": 360539, "epoch": 2146} {"train_loss": -12.453794479370117, "global_step": 360540, "epoch": 2146} {"train_loss": -12.493873596191406, "global_step": 360541, "epoch": 2146} {"train_loss": -12.377562522888184, "global_step": 360542, "epoch": 2146} {"train_loss": -12.634115219116211, "global_step": 360543, "epoch": 2146} {"train_loss": -12.335488319396973, "global_step": 360544, "epoch": 2146} {"train_loss": -12.560345649719238, "global_step": 360545, "epoch": 2146} {"train_loss": -12.479040145874023, "global_step": 360546, "epoch": 2146} {"train_loss": -12.502223014831543, "global_step": 360547, "epoch": 2146} {"train_loss": -12.525558471679688, "global_step": 360548, "epoch": 2146} {"train_loss": -12.540008544921875, "global_step": 360549, "epoch": 2146} {"train_loss": -12.536975860595703, "global_step": 360550, "epoch": 2146} {"train_loss": -12.627079010009766, "global_step": 360551, "epoch": 2146} {"train_loss": -12.487818717956543, "global_step": 360552, "epoch": 2146} {"train_loss": -12.762019157409668, "global_step": 360553, "epoch": 2146} {"train_loss": -12.385917663574219, "global_step": 360554, "epoch": 2146} {"train_loss": -12.631102561950684, "global_step": 360555, "epoch": 2146} {"train_loss": -12.641805648803711, "global_step": 360556, "epoch": 2146} {"train_loss": -12.46589469909668, "global_step": 360557, "epoch": 2146} {"train_loss": -12.591760635375977, "global_step": 360558, "epoch": 2146} {"train_loss": -12.601276397705078, "global_step": 360559, "epoch": 2146} {"train_loss": -12.63572883605957, "global_step": 360560, "epoch": 2146} {"train_loss": -12.603662490844727, "global_step": 360561, "epoch": 2146} {"train_loss": -12.316311836242676, "global_step": 360562, "epoch": 2146} {"train_loss": -12.433152198791504, "global_step": 360563, "epoch": 2146} {"train_loss": -12.496370315551758, "global_step": 360564, "epoch": 2146} {"train_loss": -12.59378719329834, "global_step": 360565, "epoch": 2146} {"train_loss": -12.610740661621094, "global_step": 360566, "epoch": 2146} {"train_loss": -12.043651580810547, "global_step": 360567, "epoch": 2146} {"train_loss": -12.370402336120605, "global_step": 360568, "epoch": 2146} {"train_loss": -12.539360046386719, "global_step": 360569, "epoch": 2146} {"train_loss": -12.51002311706543, "global_step": 360570, "epoch": 2146} {"train_loss": -12.540943145751953, "global_step": 360571, "epoch": 2146} {"train_loss": -12.79898738861084, "global_step": 360572, "epoch": 2146} {"train_loss": -12.703716278076172, "global_step": 360573, "epoch": 2146} {"train_loss": -12.58553695678711, "global_step": 360574, "epoch": 2146} {"train_loss": -12.504915237426758, "global_step": 360575, "epoch": 2146} {"train_loss": -12.467416763305664, "global_step": 360576, "epoch": 2146} {"train_loss": -12.56319808959961, "global_step": 360577, "epoch": 2146} {"train_loss": -12.409780502319336, "global_step": 360578, "epoch": 2146} {"train_loss": -11.323055267333984, "global_step": 360579, "epoch": 2146} {"train_loss": -12.05230712890625, "global_step": 360580, "epoch": 2146} {"train_loss": -12.596137046813965, "global_step": 360581, "epoch": 2146} {"train_loss": -11.947847366333008, "global_step": 360582, "epoch": 2146} {"train_loss": -12.029611587524414, "global_step": 360583, "epoch": 2146} {"train_loss": -12.007125854492188, "global_step": 360584, "epoch": 2146} {"train_loss": -12.516048431396484, "global_step": 360585, "epoch": 2146} {"train_loss": -12.12055778503418, "global_step": 360586, "epoch": 2146} {"train_loss": -11.175649642944336, "global_step": 360587, "epoch": 2146} {"train_loss": -12.08016586303711, "global_step": 360588, "epoch": 2146} {"train_loss": -12.626288414001465, "global_step": 360589, "epoch": 2146} {"train_loss": -11.44207763671875, "global_step": 360590, "epoch": 2146} {"train_loss": -10.774662017822266, "global_step": 360591, "epoch": 2146} {"train_loss": -12.450335502624512, "global_step": 360592, "epoch": 2146} {"train_loss": -11.265499114990234, "global_step": 360593, "epoch": 2146} {"train_loss": -10.378887176513672, "global_step": 360594, "epoch": 2146} {"train_loss": -12.337264060974121, "global_step": 360595, "epoch": 2146} {"train_loss": -10.955081939697266, "global_step": 360596, "epoch": 2146} {"train_loss": -12.350918769836426, "global_step": 360597, "epoch": 2146} {"train_loss": -10.833479881286621, "global_step": 360598, "epoch": 2146} {"train_loss": -11.050024032592773, "global_step": 360599, "epoch": 2146} {"train_loss": -11.442458152770996, "global_step": 360600, "epoch": 2146} {"train_loss": -10.332746505737305, "global_step": 360601, "epoch": 2146} {"train_loss": -10.163898468017578, "global_step": 360602, "epoch": 2146} {"train_loss": -10.79410457611084, "global_step": 360603, "epoch": 2146} {"train_loss": -10.412277221679688, "global_step": 360604, "epoch": 2146} {"train_loss": -10.762275695800781, "global_step": 360605, "epoch": 2146} {"train_loss": -10.633115768432617, "global_step": 360606, "epoch": 2146} {"train_loss": -11.290135383605957, "global_step": 360607, "epoch": 2146} {"train_loss": -10.814986228942871, "global_step": 360608, "epoch": 2146} {"train_loss": -10.98507308959961, "global_step": 360609, "epoch": 2146} {"train_loss": -10.636226654052734, "global_step": 360610, "epoch": 2146} {"train_loss": -11.179065704345703, "global_step": 360611, "epoch": 2146} {"train_loss": -10.426033020019531, "global_step": 360612, "epoch": 2146} {"train_loss": -11.30628490447998, "global_step": 360613, "epoch": 2146} {"train_loss": -10.383256912231445, "global_step": 360614, "epoch": 2146} {"train_loss": -11.367708206176758, "global_step": 360615, "epoch": 2146} {"train_loss": -11.791577339172363, "global_step": 360616, "epoch": 2146} {"train_loss": -11.015708923339844, "global_step": 360617, "epoch": 2146} {"train_loss": -12.072831153869629, "global_step": 360618, "epoch": 2146} {"train_loss": -11.684083938598633, "global_step": 360619, "epoch": 2146} {"train_loss": -11.612431526184082, "global_step": 360620, "epoch": 2146} {"train_loss": -11.157632827758789, "global_step": 360621, "epoch": 2146} {"train_loss": -11.569069862365723, "global_step": 360622, "epoch": 2146} {"train_loss": -11.847921371459961, "global_step": 360623, "epoch": 2146} {"train_loss": -11.460609436035156, "global_step": 360624, "epoch": 2146} {"train_loss": -11.48896598815918, "global_step": 360625, "epoch": 2146} {"train_loss": -11.726787567138672, "global_step": 360626, "epoch": 2146} {"train_loss": -11.314308166503906, "global_step": 360627, "epoch": 2146} {"train_loss": -11.88565444946289, "global_step": 360628, "epoch": 2146} {"train_loss": -10.976709365844727, "global_step": 360629, "epoch": 2146} {"train_loss": -11.624200820922852, "global_step": 360630, "epoch": 2146} {"train_loss": -11.456756591796875, "global_step": 360631, "epoch": 2146} {"train_loss": -11.511701583862305, "global_step": 360632, "epoch": 2146} {"train_loss": -11.878971099853516, "global_step": 360633, "epoch": 2146} {"train_loss": -12.01183032989502, "global_step": 360634, "epoch": 2146} {"train_loss": -11.660330772399902, "global_step": 360635, "epoch": 2146} {"train_loss": -11.315366744995117, "global_step": 360636, "epoch": 2146} {"train_loss": -11.843648910522461, "global_step": 360637, "epoch": 2146} {"train_loss": -11.644388198852539, "global_step": 360638, "epoch": 2146} {"train_loss": -11.965353965759277, "global_step": 360639, "epoch": 2146} {"train_loss": -11.51170539855957, "global_step": 360640, "epoch": 2146} {"train_loss": -12.176210403442383, "global_step": 360641, "epoch": 2146} {"train_loss": -12.034004211425781, "global_step": 360642, "epoch": 2146} {"train_loss": -12.1407470703125, "global_step": 360643, "epoch": 2146} {"train_loss": -11.582877159118652, "global_step": 360644, "epoch": 2146} {"train_loss": -12.02871322631836, "global_step": 360645, "epoch": 2146} {"train_loss": -12.02375602722168, "global_step": 360646, "epoch": 2146} {"train_loss": -12.074474334716797, "global_step": 360647, "epoch": 2146} {"train_loss": -12.299102783203125, "global_step": 360648, "epoch": 2146} {"train_loss": -11.739838600158691, "global_step": 360649, "epoch": 2146} {"train_loss": -12.09113883972168, "global_step": 360650, "epoch": 2146} {"train_loss": -11.747968673706055, "global_step": 360651, "epoch": 2146} {"train_loss": -12.344292640686035, "global_step": 360652, "epoch": 2146} {"train_loss": -12.048540115356445, "global_step": 360653, "epoch": 2146} {"train_loss": -12.103962898254395, "global_step": 360654, "epoch": 2146} {"train_loss": -11.974800109863281, "global_step": 360655, "epoch": 2146} {"train_loss": -11.970909118652344, "global_step": 360656, "epoch": 2146} {"train_loss": -12.24365234375, "global_step": 360657, "epoch": 2146} {"train_loss": -12.34689998626709, "global_step": 360658, "epoch": 2146} {"train_loss": -11.687477111816406, "global_step": 360659, "epoch": 2146} {"train_loss": -11.61212158203125, "global_step": 360660, "epoch": 2146} {"train_loss": -11.813232421875, "global_step": 360661, "epoch": 2146} {"train_loss": -11.84847640991211, "global_step": 360662, "epoch": 2146} {"train_loss": -11.378881454467773, "global_step": 360663, "epoch": 2146} {"train_loss": -11.887136459350586, "global_step": 360664, "epoch": 2146} {"train_loss": -11.839489936828613, "global_step": 360665, "epoch": 2146} {"train_loss": -11.345726013183594, "global_step": 360666, "epoch": 2146} {"train_loss": -11.979705810546875, "global_step": 360667, "epoch": 2146} {"train_loss": -11.168954849243164, "global_step": 360668, "epoch": 2146} {"train_loss": -12.044519424438477, "global_step": 360669, "epoch": 2146} {"train_loss": -11.563896179199219, "global_step": 360670, "epoch": 2146} {"train_loss": -11.85074520111084, "global_step": 360671, "epoch": 2146} {"train_loss": -11.988006591796875, "global_step": 360672, "epoch": 2146} {"train_loss": -12.137468338012695, "global_step": 360673, "epoch": 2146} {"train_loss": -11.683833122253418, "global_step": 360674, "epoch": 2146} {"train_loss": -11.868095397949219, "global_step": 360675, "epoch": 2146} {"train_loss": -11.931448936462402, "global_step": 360676, "epoch": 2146} {"train_loss": -12.00621223449707, "global_step": 360677, "epoch": 2146} {"train_loss": -11.943710327148438, "global_step": 360678, "epoch": 2146} {"train_loss": -11.614038467407227, "global_step": 360679, "epoch": 2146} {"train_loss": -12.424747467041016, "global_step": 360680, "epoch": 2146} {"train_loss": -11.866111755371094, "global_step": 360681, "epoch": 2146} {"train_loss": -12.136934280395508, "global_step": 360682, "epoch": 2146} {"train_loss": -11.905784606933594, "global_step": 360683, "epoch": 2146} {"train_loss": -12.252978324890137, "global_step": 360684, "epoch": 2146} {"train_loss": -11.899724960327148, "global_step": 360685, "epoch": 2146} {"train_loss": -11.881305694580078, "global_step": 360686, "epoch": 2146} {"train_loss": -12.124956130981445, "global_step": 360687, "epoch": 2146} {"train_loss": -11.914066314697266, "global_step": 360688, "epoch": 2146} {"train_loss": -12.552616119384766, "global_step": 360689, "epoch": 2146} {"train_loss": -12.294323921203613, "global_step": 360690, "epoch": 2146} {"train_loss": -11.466545104980469, "global_step": 360691, "epoch": 2146} {"train_loss": -12.393152236938477, "global_step": 360692, "epoch": 2146} {"train_loss": -12.18447208404541, "global_step": 360693, "epoch": 2146} {"train_loss": -12.451278686523438, "global_step": 360694, "epoch": 2146} {"train_loss": -11.929586694354104, "global_step": 360695, "epoch": 2146, "val_loss": 294006.28125} {"train_loss": -12.483745574951172, "global_step": 360696, "epoch": 2147} {"train_loss": -12.219465255737305, "global_step": 360697, "epoch": 2147} {"train_loss": -12.584342956542969, "global_step": 360698, "epoch": 2147} {"train_loss": -12.347797393798828, "global_step": 360699, "epoch": 2147} {"train_loss": -12.285368919372559, "global_step": 360700, "epoch": 2147} {"train_loss": -12.295818328857422, "global_step": 360701, "epoch": 2147} {"train_loss": -12.477819442749023, "global_step": 360702, "epoch": 2147} {"train_loss": -12.404308319091797, "global_step": 360703, "epoch": 2147} {"train_loss": -12.297094345092773, "global_step": 360704, "epoch": 2147} {"train_loss": -12.455785751342773, "global_step": 360705, "epoch": 2147} {"train_loss": -11.802312850952148, "global_step": 360706, "epoch": 2147} {"train_loss": -12.19819450378418, "global_step": 360707, "epoch": 2147} {"train_loss": -12.389240264892578, "global_step": 360708, "epoch": 2147} {"train_loss": -12.416244506835938, "global_step": 360709, "epoch": 2147} {"train_loss": -12.366395950317383, "global_step": 360710, "epoch": 2147} {"train_loss": -12.568058013916016, "global_step": 360711, "epoch": 2147} {"train_loss": -12.355222702026367, "global_step": 360712, "epoch": 2147} {"train_loss": -12.68182373046875, "global_step": 360713, "epoch": 2147} {"train_loss": -12.432319641113281, "global_step": 360714, "epoch": 2147} {"train_loss": -12.576004028320312, "global_step": 360715, "epoch": 2147} {"train_loss": -12.371282577514648, "global_step": 360716, "epoch": 2147} {"train_loss": -12.494216918945312, "global_step": 360717, "epoch": 2147} {"train_loss": -12.497285842895508, "global_step": 360718, "epoch": 2147} {"train_loss": -12.52470588684082, "global_step": 360719, "epoch": 2147} {"train_loss": -12.78225326538086, "global_step": 360720, "epoch": 2147} {"train_loss": -12.478546142578125, "global_step": 360721, "epoch": 2147} {"train_loss": -12.379642486572266, "global_step": 360722, "epoch": 2147} {"train_loss": -12.343664169311523, "global_step": 360723, "epoch": 2147} {"train_loss": -12.67294692993164, "global_step": 360724, "epoch": 2147} {"train_loss": -12.682106971740723, "global_step": 360725, "epoch": 2147} {"train_loss": -12.134027481079102, "global_step": 360726, "epoch": 2147} {"train_loss": -12.444473266601562, "global_step": 360727, "epoch": 2147} {"train_loss": -12.09381103515625, "global_step": 360728, "epoch": 2147} {"train_loss": -11.902749061584473, "global_step": 360729, "epoch": 2147} {"train_loss": -12.25735092163086, "global_step": 360730, "epoch": 2147} {"train_loss": -11.824182510375977, "global_step": 360731, "epoch": 2147} {"train_loss": -11.474693298339844, "global_step": 360732, "epoch": 2147} {"train_loss": -12.095528602600098, "global_step": 360733, "epoch": 2147} {"train_loss": -11.50298023223877, "global_step": 360734, "epoch": 2147} {"train_loss": -10.628122329711914, "global_step": 360735, "epoch": 2147} {"train_loss": -11.494978904724121, "global_step": 360736, "epoch": 2147} {"train_loss": -9.8930082321167, "global_step": 360737, "epoch": 2147} {"train_loss": -11.414999008178711, "global_step": 360738, "epoch": 2147} {"train_loss": -10.707267761230469, "global_step": 360739, "epoch": 2147} {"train_loss": -9.675027847290039, "global_step": 360740, "epoch": 2147} {"train_loss": -10.487314224243164, "global_step": 360741, "epoch": 2147} {"train_loss": -11.37856674194336, "global_step": 360742, "epoch": 2147} {"train_loss": -9.659431457519531, "global_step": 360743, "epoch": 2147} {"train_loss": -10.448987007141113, "global_step": 360744, "epoch": 2147} {"train_loss": -9.914649963378906, "global_step": 360745, "epoch": 2147} {"train_loss": -11.175715446472168, "global_step": 360746, "epoch": 2147} {"train_loss": -11.695810317993164, "global_step": 360747, "epoch": 2147} {"train_loss": -10.678741455078125, "global_step": 360748, "epoch": 2147} {"train_loss": -11.969549179077148, "global_step": 360749, "epoch": 2147} {"train_loss": -11.297754287719727, "global_step": 360750, "epoch": 2147} {"train_loss": -11.187281608581543, "global_step": 360751, "epoch": 2147} {"train_loss": -11.746072769165039, "global_step": 360752, "epoch": 2147} {"train_loss": -11.418424606323242, "global_step": 360753, "epoch": 2147} {"train_loss": -11.331528663635254, "global_step": 360754, "epoch": 2147} {"train_loss": -11.97891616821289, "global_step": 360755, "epoch": 2147} {"train_loss": -11.509137153625488, "global_step": 360756, "epoch": 2147} {"train_loss": -11.578380584716797, "global_step": 360757, "epoch": 2147} {"train_loss": -11.379373550415039, "global_step": 360758, "epoch": 2147} {"train_loss": -11.473102569580078, "global_step": 360759, "epoch": 2147} {"train_loss": -11.65994644165039, "global_step": 360760, "epoch": 2147} {"train_loss": -11.80122184753418, "global_step": 360761, "epoch": 2147} {"train_loss": -11.730619430541992, "global_step": 360762, "epoch": 2147} {"train_loss": -11.716442108154297, "global_step": 360763, "epoch": 2147} {"train_loss": -11.67732048034668, "global_step": 360764, "epoch": 2147} {"train_loss": -11.423370361328125, "global_step": 360765, "epoch": 2147} {"train_loss": -11.845630645751953, "global_step": 360766, "epoch": 2147} {"train_loss": -11.765256881713867, "global_step": 360767, "epoch": 2147} {"train_loss": -11.35747241973877, "global_step": 360768, "epoch": 2147} {"train_loss": -11.57088851928711, "global_step": 360769, "epoch": 2147} {"train_loss": -11.573738098144531, "global_step": 360770, "epoch": 2147} {"train_loss": -11.271303176879883, "global_step": 360771, "epoch": 2147} {"train_loss": -11.91114616394043, "global_step": 360772, "epoch": 2147} {"train_loss": -11.547415733337402, "global_step": 360773, "epoch": 2147} {"train_loss": -12.161834716796875, "global_step": 360774, "epoch": 2147} {"train_loss": -12.071023941040039, "global_step": 360775, "epoch": 2147} {"train_loss": -12.057305335998535, "global_step": 360776, "epoch": 2147} {"train_loss": -12.409730911254883, "global_step": 360777, "epoch": 2147} {"train_loss": -11.90110969543457, "global_step": 360778, "epoch": 2147} {"train_loss": -11.991175651550293, "global_step": 360779, "epoch": 2147} {"train_loss": -12.045783996582031, "global_step": 360780, "epoch": 2147} {"train_loss": -12.023771286010742, "global_step": 360781, "epoch": 2147} {"train_loss": -11.854881286621094, "global_step": 360782, "epoch": 2147} {"train_loss": -12.084575653076172, "global_step": 360783, "epoch": 2147} {"train_loss": -12.219442367553711, "global_step": 360784, "epoch": 2147} {"train_loss": -12.00490665435791, "global_step": 360785, "epoch": 2147} {"train_loss": -12.128275871276855, "global_step": 360786, "epoch": 2147} {"train_loss": -12.10179328918457, "global_step": 360787, "epoch": 2147} {"train_loss": -12.228108406066895, "global_step": 360788, "epoch": 2147} {"train_loss": -12.450716972351074, "global_step": 360789, "epoch": 2147} {"train_loss": -11.91012954711914, "global_step": 360790, "epoch": 2147} {"train_loss": -12.217395782470703, "global_step": 360791, "epoch": 2147} {"train_loss": -11.68862533569336, "global_step": 360792, "epoch": 2147} {"train_loss": -11.917167663574219, "global_step": 360793, "epoch": 2147} {"train_loss": -11.95315170288086, "global_step": 360794, "epoch": 2147} {"train_loss": -11.414981842041016, "global_step": 360795, "epoch": 2147} {"train_loss": -11.827760696411133, "global_step": 360796, "epoch": 2147} {"train_loss": -11.624505996704102, "global_step": 360797, "epoch": 2147} {"train_loss": -12.260770797729492, "global_step": 360798, "epoch": 2147} {"train_loss": -12.0986328125, "global_step": 360799, "epoch": 2147} {"train_loss": -12.336787223815918, "global_step": 360800, "epoch": 2147} {"train_loss": -11.897831916809082, "global_step": 360801, "epoch": 2147} {"train_loss": -12.164583206176758, "global_step": 360802, "epoch": 2147} {"train_loss": -12.12112808227539, "global_step": 360803, "epoch": 2147} {"train_loss": -11.80039119720459, "global_step": 360804, "epoch": 2147} {"train_loss": -12.316165924072266, "global_step": 360805, "epoch": 2147} {"train_loss": -11.984380722045898, "global_step": 360806, "epoch": 2147} {"train_loss": -12.336851119995117, "global_step": 360807, "epoch": 2147} {"train_loss": -12.46721363067627, "global_step": 360808, "epoch": 2147} {"train_loss": -12.172639846801758, "global_step": 360809, "epoch": 2147} {"train_loss": -12.483016967773438, "global_step": 360810, "epoch": 2147} {"train_loss": -12.350373268127441, "global_step": 360811, "epoch": 2147} {"train_loss": -12.264710426330566, "global_step": 360812, "epoch": 2147} {"train_loss": -12.681270599365234, "global_step": 360813, "epoch": 2147} {"train_loss": -12.154022216796875, "global_step": 360814, "epoch": 2147} {"train_loss": -12.338994979858398, "global_step": 360815, "epoch": 2147} {"train_loss": -12.367572784423828, "global_step": 360816, "epoch": 2147} {"train_loss": -12.411040306091309, "global_step": 360817, "epoch": 2147} {"train_loss": -12.189430236816406, "global_step": 360818, "epoch": 2147} {"train_loss": -11.858551025390625, "global_step": 360819, "epoch": 2147} {"train_loss": -12.451942443847656, "global_step": 360820, "epoch": 2147} {"train_loss": -12.24888801574707, "global_step": 360821, "epoch": 2147} {"train_loss": -12.077351570129395, "global_step": 360822, "epoch": 2147} {"train_loss": -12.377538681030273, "global_step": 360823, "epoch": 2147} {"train_loss": -12.250465393066406, "global_step": 360824, "epoch": 2147} {"train_loss": -12.359628677368164, "global_step": 360825, "epoch": 2147} {"train_loss": -11.978078842163086, "global_step": 360826, "epoch": 2147} {"train_loss": -12.284835815429688, "global_step": 360827, "epoch": 2147} {"train_loss": -12.323488235473633, "global_step": 360828, "epoch": 2147} {"train_loss": -12.401525497436523, "global_step": 360829, "epoch": 2147} {"train_loss": -12.306148529052734, "global_step": 360830, "epoch": 2147} {"train_loss": -12.07327938079834, "global_step": 360831, "epoch": 2147} {"train_loss": -12.467811584472656, "global_step": 360832, "epoch": 2147} {"train_loss": -12.203176498413086, "global_step": 360833, "epoch": 2147} {"train_loss": -12.29818058013916, "global_step": 360834, "epoch": 2147} {"train_loss": -12.3619966506958, "global_step": 360835, "epoch": 2147} {"train_loss": -12.160521507263184, "global_step": 360836, "epoch": 2147} {"train_loss": -12.005826950073242, "global_step": 360837, "epoch": 2147} {"train_loss": -12.472294807434082, "global_step": 360838, "epoch": 2147} {"train_loss": -12.524354934692383, "global_step": 360839, "epoch": 2147} {"train_loss": -12.462454795837402, "global_step": 360840, "epoch": 2147} {"train_loss": -12.323342323303223, "global_step": 360841, "epoch": 2147} {"train_loss": -12.560678482055664, "global_step": 360842, "epoch": 2147} {"train_loss": -12.350997924804688, "global_step": 360843, "epoch": 2147} {"train_loss": -11.881949424743652, "global_step": 360844, "epoch": 2147} {"train_loss": -12.50352668762207, "global_step": 360845, "epoch": 2147} {"train_loss": -12.510822296142578, "global_step": 360846, "epoch": 2147} {"train_loss": -12.078749656677246, "global_step": 360847, "epoch": 2147} {"train_loss": -12.631710052490234, "global_step": 360848, "epoch": 2147} {"train_loss": -12.132156372070312, "global_step": 360849, "epoch": 2147} {"train_loss": -11.786450386047363, "global_step": 360850, "epoch": 2147} {"train_loss": -12.547849655151367, "global_step": 360851, "epoch": 2147} {"train_loss": -12.329463958740234, "global_step": 360852, "epoch": 2147} {"train_loss": -11.942611694335938, "global_step": 360853, "epoch": 2147} {"train_loss": -12.550834655761719, "global_step": 360854, "epoch": 2147} {"train_loss": -12.323087692260742, "global_step": 360855, "epoch": 2147} {"train_loss": -12.46826457977295, "global_step": 360856, "epoch": 2147} {"train_loss": -12.348306655883789, "global_step": 360857, "epoch": 2147} {"train_loss": -12.470906257629395, "global_step": 360858, "epoch": 2147} {"train_loss": -12.563167572021484, "global_step": 360859, "epoch": 2147} {"train_loss": -12.42582893371582, "global_step": 360860, "epoch": 2147} {"train_loss": -12.26578140258789, "global_step": 360861, "epoch": 2147} {"train_loss": -12.575450897216797, "global_step": 360862, "epoch": 2147} {"train_loss": -12.017431520280384, "global_step": 360863, "epoch": 2147, "val_loss": 285662.90625} {"train_loss": -12.486222267150879, "global_step": 360864, "epoch": 2148} {"train_loss": -12.424705505371094, "global_step": 360865, "epoch": 2148} {"train_loss": -12.333690643310547, "global_step": 360866, "epoch": 2148} {"train_loss": -12.045726776123047, "global_step": 360867, "epoch": 2148} {"train_loss": -12.422794342041016, "global_step": 360868, "epoch": 2148} {"train_loss": -12.231372833251953, "global_step": 360869, "epoch": 2148} {"train_loss": -12.701520919799805, "global_step": 360870, "epoch": 2148} {"train_loss": -12.586034774780273, "global_step": 360871, "epoch": 2148} {"train_loss": -12.267951965332031, "global_step": 360872, "epoch": 2148} {"train_loss": -12.449987411499023, "global_step": 360873, "epoch": 2148} {"train_loss": -12.309901237487793, "global_step": 360874, "epoch": 2148} {"train_loss": -12.568557739257812, "global_step": 360875, "epoch": 2148} {"train_loss": -12.296363830566406, "global_step": 360876, "epoch": 2148} {"train_loss": -12.497552871704102, "global_step": 360877, "epoch": 2148} {"train_loss": -12.428762435913086, "global_step": 360878, "epoch": 2148} {"train_loss": -12.677475929260254, "global_step": 360879, "epoch": 2148} {"train_loss": -12.367524147033691, "global_step": 360880, "epoch": 2148} {"train_loss": -12.117057800292969, "global_step": 360881, "epoch": 2148} {"train_loss": -12.282509803771973, "global_step": 360882, "epoch": 2148} {"train_loss": -12.347238540649414, "global_step": 360883, "epoch": 2148} {"train_loss": -12.323330879211426, "global_step": 360884, "epoch": 2148} {"train_loss": -12.412230491638184, "global_step": 360885, "epoch": 2148} {"train_loss": -12.240030288696289, "global_step": 360886, "epoch": 2148} {"train_loss": -12.449467658996582, "global_step": 360887, "epoch": 2148} {"train_loss": -12.329971313476562, "global_step": 360888, "epoch": 2148} {"train_loss": -12.398337364196777, "global_step": 360889, "epoch": 2148} {"train_loss": -12.332584381103516, "global_step": 360890, "epoch": 2148} {"train_loss": -12.304128646850586, "global_step": 360891, "epoch": 2148} {"train_loss": -12.658668518066406, "global_step": 360892, "epoch": 2148} {"train_loss": -12.348140716552734, "global_step": 360893, "epoch": 2148} {"train_loss": -12.393362045288086, "global_step": 360894, "epoch": 2148} {"train_loss": -12.267786026000977, "global_step": 360895, "epoch": 2148} {"train_loss": -11.919112205505371, "global_step": 360896, "epoch": 2148} {"train_loss": -12.02342700958252, "global_step": 360897, "epoch": 2148} {"train_loss": -11.644257545471191, "global_step": 360898, "epoch": 2148} {"train_loss": -10.953597068786621, "global_step": 360899, "epoch": 2148} {"train_loss": -10.977084159851074, "global_step": 360900, "epoch": 2148} {"train_loss": -12.0287446975708, "global_step": 360901, "epoch": 2148} {"train_loss": -11.104900360107422, "global_step": 360902, "epoch": 2148} {"train_loss": -9.323345184326172, "global_step": 360903, "epoch": 2148} {"train_loss": -11.51567268371582, "global_step": 360904, "epoch": 2148} {"train_loss": -7.736388206481934, "global_step": 360905, "epoch": 2148} {"train_loss": -9.953888893127441, "global_step": 360906, "epoch": 2148} {"train_loss": -7.71298885345459, "global_step": 360907, "epoch": 2148} {"train_loss": -7.046806335449219, "global_step": 360908, "epoch": 2148} {"train_loss": -7.329892158508301, "global_step": 360909, "epoch": 2148} {"train_loss": -7.596109867095947, "global_step": 360910, "epoch": 2148} {"train_loss": -9.691263198852539, "global_step": 360911, "epoch": 2148} {"train_loss": -7.871768951416016, "global_step": 360912, "epoch": 2148} {"train_loss": -8.938740730285645, "global_step": 360913, "epoch": 2148} {"train_loss": -7.8775482177734375, "global_step": 360914, "epoch": 2148} {"train_loss": -7.820739269256592, "global_step": 360915, "epoch": 2148} {"train_loss": -7.461179733276367, "global_step": 360916, "epoch": 2148} {"train_loss": -8.362842559814453, "global_step": 360917, "epoch": 2148} {"train_loss": -8.752071380615234, "global_step": 360918, "epoch": 2148} {"train_loss": -8.346294403076172, "global_step": 360919, "epoch": 2148} {"train_loss": -6.944117069244385, "global_step": 360920, "epoch": 2148} {"train_loss": -7.691174507141113, "global_step": 360921, "epoch": 2148} {"train_loss": -7.78551721572876, "global_step": 360922, "epoch": 2148} {"train_loss": -7.69757080078125, "global_step": 360923, "epoch": 2148} {"train_loss": -8.95703411102295, "global_step": 360924, "epoch": 2148} {"train_loss": -7.526682376861572, "global_step": 360925, "epoch": 2148} {"train_loss": -8.165218353271484, "global_step": 360926, "epoch": 2148} {"train_loss": -8.914200782775879, "global_step": 360927, "epoch": 2148} {"train_loss": -8.513671875, "global_step": 360928, "epoch": 2148} {"train_loss": -10.2575044631958, "global_step": 360929, "epoch": 2148} {"train_loss": -10.207216262817383, "global_step": 360930, "epoch": 2148} {"train_loss": -9.529138565063477, "global_step": 360931, "epoch": 2148} {"train_loss": -11.161576271057129, "global_step": 360932, "epoch": 2148} {"train_loss": -9.98311996459961, "global_step": 360933, "epoch": 2148} {"train_loss": -9.59485912322998, "global_step": 360934, "epoch": 2148} {"train_loss": -9.100687026977539, "global_step": 360935, "epoch": 2148} {"train_loss": -8.981121063232422, "global_step": 360936, "epoch": 2148} {"train_loss": -9.320816040039062, "global_step": 360937, "epoch": 2148} {"train_loss": -10.263787269592285, "global_step": 360938, "epoch": 2148} {"train_loss": -9.883293151855469, "global_step": 360939, "epoch": 2148} {"train_loss": -9.812505722045898, "global_step": 360940, "epoch": 2148} {"train_loss": -9.62148666381836, "global_step": 360941, "epoch": 2148} {"train_loss": -9.617376327514648, "global_step": 360942, "epoch": 2148} {"train_loss": -9.627849578857422, "global_step": 360943, "epoch": 2148} {"train_loss": -10.673833847045898, "global_step": 360944, "epoch": 2148} {"train_loss": -10.97494125366211, "global_step": 360945, "epoch": 2148} {"train_loss": -9.898371696472168, "global_step": 360946, "epoch": 2148} {"train_loss": -10.517492294311523, "global_step": 360947, "epoch": 2148} {"train_loss": -11.290090560913086, "global_step": 360948, "epoch": 2148} {"train_loss": -10.546926498413086, "global_step": 360949, "epoch": 2148} {"train_loss": -10.919462203979492, "global_step": 360950, "epoch": 2148} {"train_loss": -11.128984451293945, "global_step": 360951, "epoch": 2148} {"train_loss": -10.774109840393066, "global_step": 360952, "epoch": 2148} {"train_loss": -11.433422088623047, "global_step": 360953, "epoch": 2148} {"train_loss": -11.537321090698242, "global_step": 360954, "epoch": 2148} {"train_loss": -11.375438690185547, "global_step": 360955, "epoch": 2148} {"train_loss": -11.099576950073242, "global_step": 360956, "epoch": 2148} {"train_loss": -11.187923431396484, "global_step": 360957, "epoch": 2148} {"train_loss": -12.012527465820312, "global_step": 360958, "epoch": 2148} {"train_loss": -11.186701774597168, "global_step": 360959, "epoch": 2148} {"train_loss": -11.20025634765625, "global_step": 360960, "epoch": 2148} {"train_loss": -11.669416427612305, "global_step": 360961, "epoch": 2148} {"train_loss": -11.309944152832031, "global_step": 360962, "epoch": 2148} {"train_loss": -11.651472091674805, "global_step": 360963, "epoch": 2148} {"train_loss": -11.574248313903809, "global_step": 360964, "epoch": 2148} {"train_loss": -11.745988845825195, "global_step": 360965, "epoch": 2148} {"train_loss": -11.309453964233398, "global_step": 360966, "epoch": 2148} {"train_loss": -11.853315353393555, "global_step": 360967, "epoch": 2148} {"train_loss": -11.921516418457031, "global_step": 360968, "epoch": 2148} {"train_loss": -11.811667442321777, "global_step": 360969, "epoch": 2148} {"train_loss": -12.118167877197266, "global_step": 360970, "epoch": 2148} {"train_loss": -11.886209487915039, "global_step": 360971, "epoch": 2148} {"train_loss": -11.908345222473145, "global_step": 360972, "epoch": 2148} {"train_loss": -11.784980773925781, "global_step": 360973, "epoch": 2148} {"train_loss": -12.100407600402832, "global_step": 360974, "epoch": 2148} {"train_loss": -11.903228759765625, "global_step": 360975, "epoch": 2148} {"train_loss": -11.731078147888184, "global_step": 360976, "epoch": 2148} {"train_loss": -11.900615692138672, "global_step": 360977, "epoch": 2148} {"train_loss": -12.024718284606934, "global_step": 360978, "epoch": 2148} {"train_loss": -11.954373359680176, "global_step": 360979, "epoch": 2148} {"train_loss": -11.713666915893555, "global_step": 360980, "epoch": 2148} {"train_loss": -12.000200271606445, "global_step": 360981, "epoch": 2148} {"train_loss": -11.985795021057129, "global_step": 360982, "epoch": 2148} {"train_loss": -12.166768074035645, "global_step": 360983, "epoch": 2148} {"train_loss": -12.148900985717773, "global_step": 360984, "epoch": 2148} {"train_loss": -12.066627502441406, "global_step": 360985, "epoch": 2148} {"train_loss": -12.034355163574219, "global_step": 360986, "epoch": 2148} {"train_loss": -12.172380447387695, "global_step": 360987, "epoch": 2148} {"train_loss": -12.2501220703125, "global_step": 360988, "epoch": 2148} {"train_loss": -12.095073699951172, "global_step": 360989, "epoch": 2148} {"train_loss": -12.238873481750488, "global_step": 360990, "epoch": 2148} {"train_loss": -12.145950317382812, "global_step": 360991, "epoch": 2148} {"train_loss": -12.204133033752441, "global_step": 360992, "epoch": 2148} {"train_loss": -12.28197956085205, "global_step": 360993, "epoch": 2148} {"train_loss": -12.033466339111328, "global_step": 360994, "epoch": 2148} {"train_loss": -12.179523468017578, "global_step": 360995, "epoch": 2148} {"train_loss": -12.308942794799805, "global_step": 360996, "epoch": 2148} {"train_loss": -12.115747451782227, "global_step": 360997, "epoch": 2148} {"train_loss": -11.989341735839844, "global_step": 360998, "epoch": 2148} {"train_loss": -12.353342056274414, "global_step": 360999, "epoch": 2148} {"train_loss": -12.311972618103027, "global_step": 361000, "epoch": 2148} {"train_loss": -12.138980865478516, "global_step": 361001, "epoch": 2148} {"train_loss": -12.14078426361084, "global_step": 361002, "epoch": 2148} {"train_loss": -12.360260009765625, "global_step": 361003, "epoch": 2148} {"train_loss": -12.51576042175293, "global_step": 361004, "epoch": 2148} {"train_loss": -12.09451675415039, "global_step": 361005, "epoch": 2148} {"train_loss": -12.343408584594727, "global_step": 361006, "epoch": 2148} {"train_loss": -12.331823348999023, "global_step": 361007, "epoch": 2148} {"train_loss": -12.431975364685059, "global_step": 361008, "epoch": 2148} {"train_loss": -12.432662010192871, "global_step": 361009, "epoch": 2148} {"train_loss": -12.080482482910156, "global_step": 361010, "epoch": 2148} {"train_loss": -12.164856910705566, "global_step": 361011, "epoch": 2148} {"train_loss": -12.405267715454102, "global_step": 361012, "epoch": 2148} {"train_loss": -12.398619651794434, "global_step": 361013, "epoch": 2148} {"train_loss": -12.439144134521484, "global_step": 361014, "epoch": 2148} {"train_loss": -12.530891418457031, "global_step": 361015, "epoch": 2148} {"train_loss": -12.57715129852295, "global_step": 361016, "epoch": 2148} {"train_loss": -12.033210754394531, "global_step": 361017, "epoch": 2148} {"train_loss": -12.451425552368164, "global_step": 361018, "epoch": 2148} {"train_loss": -12.523140907287598, "global_step": 361019, "epoch": 2148} {"train_loss": -12.504009246826172, "global_step": 361020, "epoch": 2148} {"train_loss": -12.42457389831543, "global_step": 361021, "epoch": 2148} {"train_loss": -12.467897415161133, "global_step": 361022, "epoch": 2148} {"train_loss": -12.161713600158691, "global_step": 361023, "epoch": 2148} {"train_loss": -12.571098327636719, "global_step": 361024, "epoch": 2148} {"train_loss": -12.63062858581543, "global_step": 361025, "epoch": 2148} {"train_loss": -12.614583015441895, "global_step": 361026, "epoch": 2148} {"train_loss": -12.411916732788086, "global_step": 361027, "epoch": 2148} {"train_loss": -12.33957290649414, "global_step": 361028, "epoch": 2148} {"train_loss": -12.515039443969727, "global_step": 361029, "epoch": 2148} {"train_loss": -12.449576377868652, "global_step": 361030, "epoch": 2148} {"train_loss": -11.248898100285302, "global_step": 361031, "epoch": 2148, "val_loss": 294478.78125} {"train_loss": -12.49136734008789, "global_step": 361032, "epoch": 2149} {"train_loss": -12.054931640625, "global_step": 361033, "epoch": 2149} {"train_loss": -12.109369277954102, "global_step": 361034, "epoch": 2149} {"train_loss": -12.318716049194336, "global_step": 361035, "epoch": 2149} {"train_loss": -12.260332107543945, "global_step": 361036, "epoch": 2149} {"train_loss": -12.034721374511719, "global_step": 361037, "epoch": 2149} {"train_loss": -12.257806777954102, "global_step": 361038, "epoch": 2149} {"train_loss": -12.396471977233887, "global_step": 361039, "epoch": 2149} {"train_loss": -11.69864559173584, "global_step": 361040, "epoch": 2149} {"train_loss": -11.653791427612305, "global_step": 361041, "epoch": 2149} {"train_loss": -11.449455261230469, "global_step": 361042, "epoch": 2149} {"train_loss": -12.645842552185059, "global_step": 361043, "epoch": 2149} {"train_loss": -12.471111297607422, "global_step": 361044, "epoch": 2149} {"train_loss": -12.084840774536133, "global_step": 361045, "epoch": 2149} {"train_loss": -12.261198043823242, "global_step": 361046, "epoch": 2149} {"train_loss": -12.238990783691406, "global_step": 361047, "epoch": 2149} {"train_loss": -12.243196487426758, "global_step": 361048, "epoch": 2149} {"train_loss": -12.355063438415527, "global_step": 361049, "epoch": 2149} {"train_loss": -12.394923210144043, "global_step": 361050, "epoch": 2149} {"train_loss": -12.526307106018066, "global_step": 361051, "epoch": 2149} {"train_loss": -12.23072338104248, "global_step": 361052, "epoch": 2149} {"train_loss": -12.439065933227539, "global_step": 361053, "epoch": 2149} {"train_loss": -12.29189682006836, "global_step": 361054, "epoch": 2149} {"train_loss": -12.228410720825195, "global_step": 361055, "epoch": 2149} {"train_loss": -12.263996124267578, "global_step": 361056, "epoch": 2149} {"train_loss": -12.358505249023438, "global_step": 361057, "epoch": 2149} {"train_loss": -11.496313095092773, "global_step": 361058, "epoch": 2149} {"train_loss": -11.488067626953125, "global_step": 361059, "epoch": 2149} {"train_loss": -11.86652660369873, "global_step": 361060, "epoch": 2149} {"train_loss": -12.287256240844727, "global_step": 361061, "epoch": 2149} {"train_loss": -12.03347110748291, "global_step": 361062, "epoch": 2149} {"train_loss": -12.187100410461426, "global_step": 361063, "epoch": 2149} {"train_loss": -12.004725456237793, "global_step": 361064, "epoch": 2149} {"train_loss": -12.230769157409668, "global_step": 361065, "epoch": 2149} {"train_loss": -12.035202026367188, "global_step": 361066, "epoch": 2149} {"train_loss": -11.914012908935547, "global_step": 361067, "epoch": 2149} {"train_loss": -11.888933181762695, "global_step": 361068, "epoch": 2149} {"train_loss": -11.79784107208252, "global_step": 361069, "epoch": 2149} {"train_loss": -11.5908203125, "global_step": 361070, "epoch": 2149} {"train_loss": -11.889204025268555, "global_step": 361071, "epoch": 2149} {"train_loss": -11.817535400390625, "global_step": 361072, "epoch": 2149} {"train_loss": -11.99466323852539, "global_step": 361073, "epoch": 2149} {"train_loss": -12.162115097045898, "global_step": 361074, "epoch": 2149} {"train_loss": -11.444840431213379, "global_step": 361075, "epoch": 2149} {"train_loss": -11.351641654968262, "global_step": 361076, "epoch": 2149} {"train_loss": -12.27556324005127, "global_step": 361077, "epoch": 2149} {"train_loss": -11.167132377624512, "global_step": 361078, "epoch": 2149} {"train_loss": -11.758411407470703, "global_step": 361079, "epoch": 2149} {"train_loss": -11.543741226196289, "global_step": 361080, "epoch": 2149} {"train_loss": -12.134218215942383, "global_step": 361081, "epoch": 2149} {"train_loss": -11.66357421875, "global_step": 361082, "epoch": 2149} {"train_loss": -12.230573654174805, "global_step": 361083, "epoch": 2149} {"train_loss": -11.76817512512207, "global_step": 361084, "epoch": 2149} {"train_loss": -12.09119987487793, "global_step": 361085, "epoch": 2149} {"train_loss": -11.474893569946289, "global_step": 361086, "epoch": 2149} {"train_loss": -12.328781127929688, "global_step": 361087, "epoch": 2149} {"train_loss": -12.348983764648438, "global_step": 361088, "epoch": 2149} {"train_loss": -11.889588356018066, "global_step": 361089, "epoch": 2149} {"train_loss": -12.418710708618164, "global_step": 361090, "epoch": 2149} {"train_loss": -12.41015625, "global_step": 361091, "epoch": 2149} {"train_loss": -12.185986518859863, "global_step": 361092, "epoch": 2149} {"train_loss": -11.997517585754395, "global_step": 361093, "epoch": 2149} {"train_loss": -12.482690811157227, "global_step": 361094, "epoch": 2149} {"train_loss": -12.211481094360352, "global_step": 361095, "epoch": 2149} {"train_loss": -12.446062088012695, "global_step": 361096, "epoch": 2149} {"train_loss": -12.460044860839844, "global_step": 361097, "epoch": 2149} {"train_loss": -11.9287691116333, "global_step": 361098, "epoch": 2149} {"train_loss": -12.4485502243042, "global_step": 361099, "epoch": 2149} {"train_loss": -12.121794700622559, "global_step": 361100, "epoch": 2149} {"train_loss": -11.910935401916504, "global_step": 361101, "epoch": 2149} {"train_loss": -12.448731422424316, "global_step": 361102, "epoch": 2149} {"train_loss": -11.60558032989502, "global_step": 361103, "epoch": 2149} {"train_loss": -12.382798194885254, "global_step": 361104, "epoch": 2149} {"train_loss": -12.29231071472168, "global_step": 361105, "epoch": 2149} {"train_loss": -11.507494926452637, "global_step": 361106, "epoch": 2149} {"train_loss": -11.889932632446289, "global_step": 361107, "epoch": 2149} {"train_loss": -12.325973510742188, "global_step": 361108, "epoch": 2149} {"train_loss": -12.062203407287598, "global_step": 361109, "epoch": 2149} {"train_loss": -12.446616172790527, "global_step": 361110, "epoch": 2149} {"train_loss": -11.900583267211914, "global_step": 361111, "epoch": 2149} {"train_loss": -12.488468170166016, "global_step": 361112, "epoch": 2149} {"train_loss": -12.159280776977539, "global_step": 361113, "epoch": 2149} {"train_loss": -12.088644027709961, "global_step": 361114, "epoch": 2149} {"train_loss": -12.390373229980469, "global_step": 361115, "epoch": 2149} {"train_loss": -12.214436531066895, "global_step": 361116, "epoch": 2149} {"train_loss": -12.401851654052734, "global_step": 361117, "epoch": 2149} {"train_loss": -12.144062995910645, "global_step": 361118, "epoch": 2149} {"train_loss": -11.739288330078125, "global_step": 361119, "epoch": 2149} {"train_loss": -12.181846618652344, "global_step": 361120, "epoch": 2149} {"train_loss": -12.609743118286133, "global_step": 361121, "epoch": 2149} {"train_loss": -12.121688842773438, "global_step": 361122, "epoch": 2149} {"train_loss": -12.17317008972168, "global_step": 361123, "epoch": 2149} {"train_loss": -12.716875076293945, "global_step": 361124, "epoch": 2149} {"train_loss": -11.706256866455078, "global_step": 361125, "epoch": 2149} {"train_loss": -11.645280838012695, "global_step": 361126, "epoch": 2149} {"train_loss": -11.912298202514648, "global_step": 361127, "epoch": 2149} {"train_loss": -12.482193946838379, "global_step": 361128, "epoch": 2149} {"train_loss": -12.023136138916016, "global_step": 361129, "epoch": 2149} {"train_loss": -11.594673156738281, "global_step": 361130, "epoch": 2149} {"train_loss": -12.118117332458496, "global_step": 361131, "epoch": 2149} {"train_loss": -12.17800521850586, "global_step": 361132, "epoch": 2149} {"train_loss": -12.054038047790527, "global_step": 361133, "epoch": 2149} {"train_loss": -12.033987045288086, "global_step": 361134, "epoch": 2149} {"train_loss": -12.119525909423828, "global_step": 361135, "epoch": 2149} {"train_loss": -12.113269805908203, "global_step": 361136, "epoch": 2149} {"train_loss": -12.412925720214844, "global_step": 361137, "epoch": 2149} {"train_loss": -11.965139389038086, "global_step": 361138, "epoch": 2149} {"train_loss": -12.063716888427734, "global_step": 361139, "epoch": 2149} {"train_loss": -12.306995391845703, "global_step": 361140, "epoch": 2149} {"train_loss": -12.224594116210938, "global_step": 361141, "epoch": 2149} {"train_loss": -12.503558158874512, "global_step": 361142, "epoch": 2149} {"train_loss": -12.199508666992188, "global_step": 361143, "epoch": 2149} {"train_loss": -12.36586856842041, "global_step": 361144, "epoch": 2149} {"train_loss": -12.021385192871094, "global_step": 361145, "epoch": 2149} {"train_loss": -12.183906555175781, "global_step": 361146, "epoch": 2149} {"train_loss": -11.828274726867676, "global_step": 361147, "epoch": 2149} {"train_loss": -12.456141471862793, "global_step": 361148, "epoch": 2149} {"train_loss": -12.132635116577148, "global_step": 361149, "epoch": 2149} {"train_loss": -12.190818786621094, "global_step": 361150, "epoch": 2149} {"train_loss": -12.529071807861328, "global_step": 361151, "epoch": 2149} {"train_loss": -12.310988426208496, "global_step": 361152, "epoch": 2149} {"train_loss": -11.872886657714844, "global_step": 361153, "epoch": 2149} {"train_loss": -12.315191268920898, "global_step": 361154, "epoch": 2149} {"train_loss": -11.771120071411133, "global_step": 361155, "epoch": 2149} {"train_loss": -12.08321475982666, "global_step": 361156, "epoch": 2149} {"train_loss": -12.215913772583008, "global_step": 361157, "epoch": 2149} {"train_loss": -11.793037414550781, "global_step": 361158, "epoch": 2149} {"train_loss": -11.645627975463867, "global_step": 361159, "epoch": 2149} {"train_loss": -12.43442153930664, "global_step": 361160, "epoch": 2149} {"train_loss": -12.194454193115234, "global_step": 361161, "epoch": 2149} {"train_loss": -12.255073547363281, "global_step": 361162, "epoch": 2149} {"train_loss": -11.378816604614258, "global_step": 361163, "epoch": 2149} {"train_loss": -11.247784614562988, "global_step": 361164, "epoch": 2149} {"train_loss": -12.363191604614258, "global_step": 361165, "epoch": 2149} {"train_loss": -11.374683380126953, "global_step": 361166, "epoch": 2149} {"train_loss": -10.921509742736816, "global_step": 361167, "epoch": 2149} {"train_loss": -12.023351669311523, "global_step": 361168, "epoch": 2149} {"train_loss": -10.327935218811035, "global_step": 361169, "epoch": 2149} {"train_loss": -11.236038208007812, "global_step": 361170, "epoch": 2149} {"train_loss": -11.110865592956543, "global_step": 361171, "epoch": 2149} {"train_loss": -11.273406982421875, "global_step": 361172, "epoch": 2149} {"train_loss": -11.7496337890625, "global_step": 361173, "epoch": 2149} {"train_loss": -10.926248550415039, "global_step": 361174, "epoch": 2149} {"train_loss": -12.072835922241211, "global_step": 361175, "epoch": 2149} {"train_loss": -11.27519416809082, "global_step": 361176, "epoch": 2149} {"train_loss": -12.450089454650879, "global_step": 361177, "epoch": 2149} {"train_loss": -11.520644187927246, "global_step": 361178, "epoch": 2149} {"train_loss": -12.220465660095215, "global_step": 361179, "epoch": 2149} {"train_loss": -11.061639785766602, "global_step": 361180, "epoch": 2149} {"train_loss": -12.096597671508789, "global_step": 361181, "epoch": 2149} {"train_loss": -11.736323356628418, "global_step": 361182, "epoch": 2149} {"train_loss": -11.630491256713867, "global_step": 361183, "epoch": 2149} {"train_loss": -12.020023345947266, "global_step": 361184, "epoch": 2149} {"train_loss": -11.828579902648926, "global_step": 361185, "epoch": 2149} {"train_loss": -11.98141098022461, "global_step": 361186, "epoch": 2149} {"train_loss": -11.490425109863281, "global_step": 361187, "epoch": 2149} {"train_loss": -11.854642868041992, "global_step": 361188, "epoch": 2149} {"train_loss": -11.531024932861328, "global_step": 361189, "epoch": 2149} {"train_loss": -12.134716987609863, "global_step": 361190, "epoch": 2149} {"train_loss": -11.968832969665527, "global_step": 361191, "epoch": 2149} {"train_loss": -11.65846061706543, "global_step": 361192, "epoch": 2149} {"train_loss": -12.282485008239746, "global_step": 361193, "epoch": 2149} {"train_loss": -11.633390426635742, "global_step": 361194, "epoch": 2149} {"train_loss": -12.300712585449219, "global_step": 361195, "epoch": 2149} {"train_loss": -11.578980445861816, "global_step": 361196, "epoch": 2149} {"train_loss": -11.516864776611328, "global_step": 361197, "epoch": 2149} {"train_loss": -12.261473655700684, "global_step": 361198, "epoch": 2149} {"train_loss": -12.007069292522612, "global_step": 361199, "epoch": 2149, "val_loss": 292154.53125} {"train_loss": -11.789915084838867, "global_step": 361200, "epoch": 2150} {"train_loss": -10.957693099975586, "global_step": 361201, "epoch": 2150} {"train_loss": -11.891813278198242, "global_step": 361202, "epoch": 2150} {"train_loss": -11.533348083496094, "global_step": 361203, "epoch": 2150} {"train_loss": -11.606029510498047, "global_step": 361204, "epoch": 2150} {"train_loss": -11.831156730651855, "global_step": 361205, "epoch": 2150} {"train_loss": -11.787282943725586, "global_step": 361206, "epoch": 2150} {"train_loss": -11.960533142089844, "global_step": 361207, "epoch": 2150} {"train_loss": -11.589742660522461, "global_step": 361208, "epoch": 2150} {"train_loss": -12.348376274108887, "global_step": 361209, "epoch": 2150} {"train_loss": -11.796960830688477, "global_step": 361210, "epoch": 2150} {"train_loss": -12.079209327697754, "global_step": 361211, "epoch": 2150} {"train_loss": -12.169500350952148, "global_step": 361212, "epoch": 2150} {"train_loss": -12.074007987976074, "global_step": 361213, "epoch": 2150} {"train_loss": -12.456169128417969, "global_step": 361214, "epoch": 2150} {"train_loss": -12.113885879516602, "global_step": 361215, "epoch": 2150} {"train_loss": -12.278371810913086, "global_step": 361216, "epoch": 2150} {"train_loss": -12.170544624328613, "global_step": 361217, "epoch": 2150} {"train_loss": -12.22118091583252, "global_step": 361218, "epoch": 2150} {"train_loss": -12.138049125671387, "global_step": 361219, "epoch": 2150} {"train_loss": -12.249059677124023, "global_step": 361220, "epoch": 2150} {"train_loss": -12.039627075195312, "global_step": 361221, "epoch": 2150} {"train_loss": -12.044479370117188, "global_step": 361222, "epoch": 2150} {"train_loss": -12.375988006591797, "global_step": 361223, "epoch": 2150} {"train_loss": -12.309906005859375, "global_step": 361224, "epoch": 2150} {"train_loss": -11.987451553344727, "global_step": 361225, "epoch": 2150} {"train_loss": -12.050278663635254, "global_step": 361226, "epoch": 2150} {"train_loss": -12.221534729003906, "global_step": 361227, "epoch": 2150} {"train_loss": -12.129741668701172, "global_step": 361228, "epoch": 2150} {"train_loss": -12.150772094726562, "global_step": 361229, "epoch": 2150} {"train_loss": -11.999637603759766, "global_step": 361230, "epoch": 2150} {"train_loss": -11.783729553222656, "global_step": 361231, "epoch": 2150} {"train_loss": -12.230722427368164, "global_step": 361232, "epoch": 2150} {"train_loss": -12.108316421508789, "global_step": 361233, "epoch": 2150} {"train_loss": -11.982809066772461, "global_step": 361234, "epoch": 2150} {"train_loss": -11.188300132751465, "global_step": 361235, "epoch": 2150} {"train_loss": -11.941579818725586, "global_step": 361236, "epoch": 2150} {"train_loss": -12.341878890991211, "global_step": 361237, "epoch": 2150} {"train_loss": -12.044846534729004, "global_step": 361238, "epoch": 2150} {"train_loss": -11.803586959838867, "global_step": 361239, "epoch": 2150} {"train_loss": -12.036579132080078, "global_step": 361240, "epoch": 2150} {"train_loss": -12.127214431762695, "global_step": 361241, "epoch": 2150} {"train_loss": -12.196196556091309, "global_step": 361242, "epoch": 2150} {"train_loss": -11.543031692504883, "global_step": 361243, "epoch": 2150} {"train_loss": -12.29794979095459, "global_step": 361244, "epoch": 2150} {"train_loss": -11.948858261108398, "global_step": 361245, "epoch": 2150} {"train_loss": -12.107836723327637, "global_step": 361246, "epoch": 2150} {"train_loss": -12.362049102783203, "global_step": 361247, "epoch": 2150} {"train_loss": -12.228338241577148, "global_step": 361248, "epoch": 2150} {"train_loss": -12.352157592773438, "global_step": 361249, "epoch": 2150} {"train_loss": -12.317676544189453, "global_step": 361250, "epoch": 2150} {"train_loss": -12.194275856018066, "global_step": 361251, "epoch": 2150} {"train_loss": -12.387467384338379, "global_step": 361252, "epoch": 2150} {"train_loss": -12.397603988647461, "global_step": 361253, "epoch": 2150} {"train_loss": -12.014450073242188, "global_step": 361254, "epoch": 2150} {"train_loss": -12.511411666870117, "global_step": 361255, "epoch": 2150} {"train_loss": -12.331298828125, "global_step": 361256, "epoch": 2150} {"train_loss": -12.242765426635742, "global_step": 361257, "epoch": 2150} {"train_loss": -11.942750930786133, "global_step": 361258, "epoch": 2150} {"train_loss": -12.323933601379395, "global_step": 361259, "epoch": 2150} {"train_loss": -12.281120300292969, "global_step": 361260, "epoch": 2150} {"train_loss": -12.041439056396484, "global_step": 361261, "epoch": 2150} {"train_loss": -11.783758163452148, "global_step": 361262, "epoch": 2150} {"train_loss": -12.10218620300293, "global_step": 361263, "epoch": 2150} {"train_loss": -12.507906913757324, "global_step": 361264, "epoch": 2150} {"train_loss": -12.431434631347656, "global_step": 361265, "epoch": 2150} {"train_loss": -12.477670669555664, "global_step": 361266, "epoch": 2150} {"train_loss": -12.352022171020508, "global_step": 361267, "epoch": 2150} {"train_loss": -12.756366729736328, "global_step": 361268, "epoch": 2150} {"train_loss": -12.146533966064453, "global_step": 361269, "epoch": 2150} {"train_loss": -12.246906280517578, "global_step": 361270, "epoch": 2150} {"train_loss": -12.462610244750977, "global_step": 361271, "epoch": 2150} {"train_loss": -12.371729850769043, "global_step": 361272, "epoch": 2150} {"train_loss": -12.189558982849121, "global_step": 361273, "epoch": 2150} {"train_loss": -12.149528503417969, "global_step": 361274, "epoch": 2150} {"train_loss": -12.407757759094238, "global_step": 361275, "epoch": 2150} {"train_loss": -11.919334411621094, "global_step": 361276, "epoch": 2150} {"train_loss": -12.39749813079834, "global_step": 361277, "epoch": 2150} {"train_loss": -12.43235969543457, "global_step": 361278, "epoch": 2150} {"train_loss": -12.028670310974121, "global_step": 361279, "epoch": 2150} {"train_loss": -12.19640064239502, "global_step": 361280, "epoch": 2150} {"train_loss": -12.073454856872559, "global_step": 361281, "epoch": 2150} {"train_loss": -12.369482040405273, "global_step": 361282, "epoch": 2150} {"train_loss": -11.976190567016602, "global_step": 361283, "epoch": 2150} {"train_loss": -12.364212036132812, "global_step": 361284, "epoch": 2150} {"train_loss": -12.222545623779297, "global_step": 361285, "epoch": 2150} {"train_loss": -12.409518241882324, "global_step": 361286, "epoch": 2150} {"train_loss": -12.35699462890625, "global_step": 361287, "epoch": 2150} {"train_loss": -11.927654266357422, "global_step": 361288, "epoch": 2150} {"train_loss": -12.100241661071777, "global_step": 361289, "epoch": 2150} {"train_loss": -12.30804443359375, "global_step": 361290, "epoch": 2150} {"train_loss": -12.375558853149414, "global_step": 361291, "epoch": 2150} {"train_loss": -11.484495162963867, "global_step": 361292, "epoch": 2150} {"train_loss": -11.117243766784668, "global_step": 361293, "epoch": 2150} {"train_loss": -12.344388961791992, "global_step": 361294, "epoch": 2150} {"train_loss": -12.184717178344727, "global_step": 361295, "epoch": 2150} {"train_loss": -10.798402786254883, "global_step": 361296, "epoch": 2150} {"train_loss": -11.525550842285156, "global_step": 361297, "epoch": 2150} {"train_loss": -11.068048477172852, "global_step": 361298, "epoch": 2150} {"train_loss": -9.297959327697754, "global_step": 361299, "epoch": 2150} {"train_loss": -11.09553337097168, "global_step": 361300, "epoch": 2150} {"train_loss": -10.810863494873047, "global_step": 361301, "epoch": 2150} {"train_loss": -8.811058044433594, "global_step": 361302, "epoch": 2150} {"train_loss": -8.47012710571289, "global_step": 361303, "epoch": 2150} {"train_loss": -9.549606323242188, "global_step": 361304, "epoch": 2150} {"train_loss": -11.23867416381836, "global_step": 361305, "epoch": 2150} {"train_loss": -8.984548568725586, "global_step": 361306, "epoch": 2150} {"train_loss": -10.256612777709961, "global_step": 361307, "epoch": 2150} {"train_loss": -10.209394454956055, "global_step": 361308, "epoch": 2150} {"train_loss": -10.189583778381348, "global_step": 361309, "epoch": 2150} {"train_loss": -10.318045616149902, "global_step": 361310, "epoch": 2150} {"train_loss": -9.729321479797363, "global_step": 361311, "epoch": 2150} {"train_loss": -10.625925064086914, "global_step": 361312, "epoch": 2150} {"train_loss": -9.35916805267334, "global_step": 361313, "epoch": 2150} {"train_loss": -9.780997276306152, "global_step": 361314, "epoch": 2150} {"train_loss": -9.067630767822266, "global_step": 361315, "epoch": 2150} {"train_loss": -10.035064697265625, "global_step": 361316, "epoch": 2150} {"train_loss": -10.151897430419922, "global_step": 361317, "epoch": 2150} {"train_loss": -10.724956512451172, "global_step": 361318, "epoch": 2150} {"train_loss": -9.885269165039062, "global_step": 361319, "epoch": 2150} {"train_loss": -9.766828536987305, "global_step": 361320, "epoch": 2150} {"train_loss": -9.973287582397461, "global_step": 361321, "epoch": 2150} {"train_loss": -10.195058822631836, "global_step": 361322, "epoch": 2150} {"train_loss": -11.061582565307617, "global_step": 361323, "epoch": 2150} {"train_loss": -10.334625244140625, "global_step": 361324, "epoch": 2150} {"train_loss": -11.220973014831543, "global_step": 361325, "epoch": 2150} {"train_loss": -10.564248085021973, "global_step": 361326, "epoch": 2150} {"train_loss": -11.497637748718262, "global_step": 361327, "epoch": 2150} {"train_loss": -10.123872756958008, "global_step": 361328, "epoch": 2150} {"train_loss": -11.145204544067383, "global_step": 361329, "epoch": 2150} {"train_loss": -10.557910919189453, "global_step": 361330, "epoch": 2150} {"train_loss": -11.250574111938477, "global_step": 361331, "epoch": 2150} {"train_loss": -11.379199981689453, "global_step": 361332, "epoch": 2150} {"train_loss": -10.093950271606445, "global_step": 361333, "epoch": 2150} {"train_loss": -11.84075927734375, "global_step": 361334, "epoch": 2150} {"train_loss": -10.357654571533203, "global_step": 361335, "epoch": 2150} {"train_loss": -11.364299774169922, "global_step": 361336, "epoch": 2150} {"train_loss": -10.957124710083008, "global_step": 361337, "epoch": 2150} {"train_loss": -11.063249588012695, "global_step": 361338, "epoch": 2150} {"train_loss": -11.626717567443848, "global_step": 361339, "epoch": 2150} {"train_loss": -11.211542129516602, "global_step": 361340, "epoch": 2150} {"train_loss": -11.693977355957031, "global_step": 361341, "epoch": 2150} {"train_loss": -11.51638412475586, "global_step": 361342, "epoch": 2150} {"train_loss": -12.077543258666992, "global_step": 361343, "epoch": 2150} {"train_loss": -11.987262725830078, "global_step": 361344, "epoch": 2150} {"train_loss": -11.964456558227539, "global_step": 361345, "epoch": 2150} {"train_loss": -11.895254135131836, "global_step": 361346, "epoch": 2150} {"train_loss": -12.107518196105957, "global_step": 361347, "epoch": 2150} {"train_loss": -11.986571311950684, "global_step": 361348, "epoch": 2150} {"train_loss": -12.171917915344238, "global_step": 361349, "epoch": 2150} {"train_loss": -11.96735954284668, "global_step": 361350, "epoch": 2150} {"train_loss": -11.996707916259766, "global_step": 361351, "epoch": 2150} {"train_loss": -11.999004364013672, "global_step": 361352, "epoch": 2150} {"train_loss": -12.103208541870117, "global_step": 361353, "epoch": 2150} {"train_loss": -12.075098037719727, "global_step": 361354, "epoch": 2150} {"train_loss": -12.006865501403809, "global_step": 361355, "epoch": 2150} {"train_loss": -12.167448043823242, "global_step": 361356, "epoch": 2150} {"train_loss": -12.30573844909668, "global_step": 361357, "epoch": 2150} {"train_loss": -12.031232833862305, "global_step": 361358, "epoch": 2150} {"train_loss": -12.390901565551758, "global_step": 361359, "epoch": 2150} {"train_loss": -12.204959869384766, "global_step": 361360, "epoch": 2150} {"train_loss": -12.27889633178711, "global_step": 361361, "epoch": 2150} {"train_loss": -12.261248588562012, "global_step": 361362, "epoch": 2150} {"train_loss": -12.34628677368164, "global_step": 361363, "epoch": 2150} {"train_loss": -12.387113571166992, "global_step": 361364, "epoch": 2150} {"train_loss": -12.255453109741211, "global_step": 361365, "epoch": 2150} {"train_loss": -12.318888664245605, "global_step": 361366, "epoch": 2150} {"train_loss": -11.662335111981346, "global_step": 361367, "epoch": 2150, "train/sim_max_reward_0": 0.5480508697890856, "train/sim_max_reward_1": 0.9712942152369406, "train/sim_max_reward_2": 0.0012760145966057756, "train/sim_max_reward_3": 0.45118110918880544, "train/sim_max_reward_4": 0.9711127976415944, "train/sim_max_reward_5": 0.6512491869333162, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.37418418837015427, "test/sim_max_reward_4400002": 0.513239428127133, "test/sim_max_reward_4400003": 0.0014043513950531227, "test/sim_max_reward_4400004": 0.9955413247717338, "test/sim_max_reward_4400005": 0.5114507439592552, "test/sim_max_reward_4400006": 0.128049673675432, "test/sim_max_reward_4400007": 0.4741759517664866, "test/sim_max_reward_4400008": 0.5038828090948494, "test/sim_max_reward_4400009": 0.35512840526743533, "test/sim_max_reward_4400010": 0.9548947801328111, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 0.14110722128947978, "test/sim_max_reward_4400013": 0.9975167959598223, "test/sim_max_reward_4400014": 0.6222908654400324, "test/sim_max_reward_4400015": 0.14776095455329885, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9581173201473722, "test/sim_max_reward_4400019": 0.2161421733357473, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.6389724790241182, "test/sim_max_reward_4400022": 0.9690979487814517, "test/sim_max_reward_4400023": 0.16429967181776028, "test/sim_max_reward_4400024": 0.379528681902144, "test/sim_max_reward_4400025": 0.581835203483363, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.631548760352283, "test/sim_max_reward_4400028": 0.978430791087841, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9750598419151634, "test/sim_max_reward_4400031": 0.9702275603265084, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.7177807367542164, "test/sim_max_reward_4400034": 0.9376797903926506, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.5301288515113486, "test/sim_max_reward_4400037": 0.9899986602652248, "test/sim_max_reward_4400038": 0.298531688394343, "test/sim_max_reward_4400039": 0.4119948843327103, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.1655475459651782, "test/sim_max_reward_4400042": 0.7273685113382036, "test/sim_max_reward_4400043": 0.018661596823014572, "test/sim_max_reward_4400044": 0.5814653523489102, "test/sim_max_reward_4400045": 0.4066884816692215, "test/sim_max_reward_4400046": 0.3183521882408541, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0029501152603825863, "train/mean_score": 0.5990273655643913, "test/mean_score": 0.47151144678502677, "val_loss": 292301.375, "train_action_mse_error": 0.780125617980957} {"train_loss": -12.399297714233398, "global_step": 361368, "epoch": 2151} {"train_loss": -12.179686546325684, "global_step": 361369, "epoch": 2151} {"train_loss": -12.230583190917969, "global_step": 361370, "epoch": 2151} {"train_loss": -12.224628448486328, "global_step": 361371, "epoch": 2151} {"train_loss": -12.432689666748047, "global_step": 361372, "epoch": 2151} {"train_loss": -12.296648025512695, "global_step": 361373, "epoch": 2151} {"train_loss": -12.291814804077148, "global_step": 361374, "epoch": 2151} {"train_loss": -12.37932300567627, "global_step": 361375, "epoch": 2151} {"train_loss": -12.314640998840332, "global_step": 361376, "epoch": 2151} {"train_loss": -12.298929214477539, "global_step": 361377, "epoch": 2151} {"train_loss": -12.472320556640625, "global_step": 361378, "epoch": 2151} {"train_loss": -12.531219482421875, "global_step": 361379, "epoch": 2151} {"train_loss": -12.413932800292969, "global_step": 361380, "epoch": 2151} {"train_loss": -12.372339248657227, "global_step": 361381, "epoch": 2151} {"train_loss": -12.47103214263916, "global_step": 361382, "epoch": 2151} {"train_loss": -12.303149223327637, "global_step": 361383, "epoch": 2151} {"train_loss": -12.511512756347656, "global_step": 361384, "epoch": 2151} {"train_loss": -12.211020469665527, "global_step": 361385, "epoch": 2151} {"train_loss": -12.505426406860352, "global_step": 361386, "epoch": 2151} {"train_loss": -12.47635555267334, "global_step": 361387, "epoch": 2151} {"train_loss": -12.552228927612305, "global_step": 361388, "epoch": 2151} {"train_loss": -12.383244514465332, "global_step": 361389, "epoch": 2151} {"train_loss": -12.506867408752441, "global_step": 361390, "epoch": 2151} {"train_loss": -12.662372589111328, "global_step": 361391, "epoch": 2151} {"train_loss": -12.332849502563477, "global_step": 361392, "epoch": 2151} {"train_loss": -12.668729782104492, "global_step": 361393, "epoch": 2151} {"train_loss": -12.436773300170898, "global_step": 361394, "epoch": 2151} {"train_loss": -12.52437686920166, "global_step": 361395, "epoch": 2151} {"train_loss": -12.620203018188477, "global_step": 361396, "epoch": 2151} {"train_loss": -12.488070487976074, "global_step": 361397, "epoch": 2151} {"train_loss": -12.470357894897461, "global_step": 361398, "epoch": 2151} {"train_loss": -12.47235107421875, "global_step": 361399, "epoch": 2151} {"train_loss": -12.346369743347168, "global_step": 361400, "epoch": 2151} {"train_loss": -12.678539276123047, "global_step": 361401, "epoch": 2151} {"train_loss": -12.589807510375977, "global_step": 361402, "epoch": 2151} {"train_loss": -12.70184326171875, "global_step": 361403, "epoch": 2151} {"train_loss": -12.501981735229492, "global_step": 361404, "epoch": 2151} {"train_loss": -12.56799602508545, "global_step": 361405, "epoch": 2151} {"train_loss": -12.604318618774414, "global_step": 361406, "epoch": 2151} {"train_loss": -12.513215065002441, "global_step": 361407, "epoch": 2151} {"train_loss": -12.538731575012207, "global_step": 361408, "epoch": 2151} {"train_loss": -12.17704963684082, "global_step": 361409, "epoch": 2151} {"train_loss": -12.337909698486328, "global_step": 361410, "epoch": 2151} {"train_loss": -12.361078262329102, "global_step": 361411, "epoch": 2151} {"train_loss": -12.313919067382812, "global_step": 361412, "epoch": 2151} {"train_loss": -12.533493041992188, "global_step": 361413, "epoch": 2151} {"train_loss": -12.201435089111328, "global_step": 361414, "epoch": 2151} {"train_loss": -12.576107025146484, "global_step": 361415, "epoch": 2151} {"train_loss": -12.374387741088867, "global_step": 361416, "epoch": 2151} {"train_loss": -12.11357593536377, "global_step": 361417, "epoch": 2151} {"train_loss": -12.353405952453613, "global_step": 361418, "epoch": 2151} {"train_loss": -12.0363187789917, "global_step": 361419, "epoch": 2151} {"train_loss": -12.317222595214844, "global_step": 361420, "epoch": 2151} {"train_loss": -12.136604309082031, "global_step": 361421, "epoch": 2151} {"train_loss": -12.328241348266602, "global_step": 361422, "epoch": 2151} {"train_loss": -12.182056427001953, "global_step": 361423, "epoch": 2151} {"train_loss": -12.041386604309082, "global_step": 361424, "epoch": 2151} {"train_loss": -12.560218811035156, "global_step": 361425, "epoch": 2151} {"train_loss": -11.91305160522461, "global_step": 361426, "epoch": 2151} {"train_loss": -11.344554901123047, "global_step": 361427, "epoch": 2151} {"train_loss": -11.814802169799805, "global_step": 361428, "epoch": 2151} {"train_loss": -12.116724014282227, "global_step": 361429, "epoch": 2151} {"train_loss": -11.828983306884766, "global_step": 361430, "epoch": 2151} {"train_loss": -10.17734432220459, "global_step": 361431, "epoch": 2151} {"train_loss": -10.06753921508789, "global_step": 361432, "epoch": 2151} {"train_loss": -8.35318660736084, "global_step": 361433, "epoch": 2151} {"train_loss": -8.67770004272461, "global_step": 361434, "epoch": 2151} {"train_loss": -10.176107406616211, "global_step": 361435, "epoch": 2151} {"train_loss": -10.832024574279785, "global_step": 361436, "epoch": 2151} {"train_loss": -9.938579559326172, "global_step": 361437, "epoch": 2151} {"train_loss": -9.661761283874512, "global_step": 361438, "epoch": 2151} {"train_loss": -10.032608032226562, "global_step": 361439, "epoch": 2151} {"train_loss": -10.35324764251709, "global_step": 361440, "epoch": 2151} {"train_loss": -10.182743072509766, "global_step": 361441, "epoch": 2151} {"train_loss": -10.555907249450684, "global_step": 361442, "epoch": 2151} {"train_loss": -11.070761680603027, "global_step": 361443, "epoch": 2151} {"train_loss": -10.29261302947998, "global_step": 361444, "epoch": 2151} {"train_loss": -10.904255867004395, "global_step": 361445, "epoch": 2151} {"train_loss": -10.599337577819824, "global_step": 361446, "epoch": 2151} {"train_loss": -11.47765827178955, "global_step": 361447, "epoch": 2151} {"train_loss": -10.43101978302002, "global_step": 361448, "epoch": 2151} {"train_loss": -10.581064224243164, "global_step": 361449, "epoch": 2151} {"train_loss": -10.491713523864746, "global_step": 361450, "epoch": 2151} {"train_loss": -10.391071319580078, "global_step": 361451, "epoch": 2151} {"train_loss": -10.822837829589844, "global_step": 361452, "epoch": 2151} {"train_loss": -10.968619346618652, "global_step": 361453, "epoch": 2151} {"train_loss": -11.266263008117676, "global_step": 361454, "epoch": 2151} {"train_loss": -10.324647903442383, "global_step": 361455, "epoch": 2151} {"train_loss": -11.123543739318848, "global_step": 361456, "epoch": 2151} {"train_loss": -10.759284973144531, "global_step": 361457, "epoch": 2151} {"train_loss": -11.544565200805664, "global_step": 361458, "epoch": 2151} {"train_loss": -11.457132339477539, "global_step": 361459, "epoch": 2151} {"train_loss": -10.680953979492188, "global_step": 361460, "epoch": 2151} {"train_loss": -11.523757934570312, "global_step": 361461, "epoch": 2151} {"train_loss": -11.248004913330078, "global_step": 361462, "epoch": 2151} {"train_loss": -11.088069915771484, "global_step": 361463, "epoch": 2151} {"train_loss": -11.03522777557373, "global_step": 361464, "epoch": 2151} {"train_loss": -10.76278305053711, "global_step": 361465, "epoch": 2151} {"train_loss": -11.609550476074219, "global_step": 361466, "epoch": 2151} {"train_loss": -11.300785064697266, "global_step": 361467, "epoch": 2151} {"train_loss": -11.643804550170898, "global_step": 361468, "epoch": 2151} {"train_loss": -11.30723762512207, "global_step": 361469, "epoch": 2151} {"train_loss": -11.44265365600586, "global_step": 361470, "epoch": 2151} {"train_loss": -11.577129364013672, "global_step": 361471, "epoch": 2151} {"train_loss": -11.411308288574219, "global_step": 361472, "epoch": 2151} {"train_loss": -11.115715980529785, "global_step": 361473, "epoch": 2151} {"train_loss": -11.586017608642578, "global_step": 361474, "epoch": 2151} {"train_loss": -11.67740535736084, "global_step": 361475, "epoch": 2151} {"train_loss": -11.254268646240234, "global_step": 361476, "epoch": 2151} {"train_loss": -12.081558227539062, "global_step": 361477, "epoch": 2151} {"train_loss": -11.40190315246582, "global_step": 361478, "epoch": 2151} {"train_loss": -11.6239013671875, "global_step": 361479, "epoch": 2151} {"train_loss": -11.770859718322754, "global_step": 361480, "epoch": 2151} {"train_loss": -11.661855697631836, "global_step": 361481, "epoch": 2151} {"train_loss": -11.913180351257324, "global_step": 361482, "epoch": 2151} {"train_loss": -11.89384937286377, "global_step": 361483, "epoch": 2151} {"train_loss": -11.937417984008789, "global_step": 361484, "epoch": 2151} {"train_loss": -11.648605346679688, "global_step": 361485, "epoch": 2151} {"train_loss": -11.70582103729248, "global_step": 361486, "epoch": 2151} {"train_loss": -11.685386657714844, "global_step": 361487, "epoch": 2151} {"train_loss": -11.651742935180664, "global_step": 361488, "epoch": 2151} {"train_loss": -11.963229179382324, "global_step": 361489, "epoch": 2151} {"train_loss": -11.925411224365234, "global_step": 361490, "epoch": 2151} {"train_loss": -12.10019302368164, "global_step": 361491, "epoch": 2151} {"train_loss": -12.132683753967285, "global_step": 361492, "epoch": 2151} {"train_loss": -12.11158561706543, "global_step": 361493, "epoch": 2151} {"train_loss": -12.288778305053711, "global_step": 361494, "epoch": 2151} {"train_loss": -12.174528121948242, "global_step": 361495, "epoch": 2151} {"train_loss": -12.096504211425781, "global_step": 361496, "epoch": 2151} {"train_loss": -11.932523727416992, "global_step": 361497, "epoch": 2151} {"train_loss": -12.33884048461914, "global_step": 361498, "epoch": 2151} {"train_loss": -11.861915588378906, "global_step": 361499, "epoch": 2151} {"train_loss": -12.20284366607666, "global_step": 361500, "epoch": 2151} {"train_loss": -12.187521934509277, "global_step": 361501, "epoch": 2151} {"train_loss": -12.090507507324219, "global_step": 361502, "epoch": 2151} {"train_loss": -12.3058443069458, "global_step": 361503, "epoch": 2151} {"train_loss": -12.299538612365723, "global_step": 361504, "epoch": 2151} {"train_loss": -12.234107971191406, "global_step": 361505, "epoch": 2151} {"train_loss": -12.331756591796875, "global_step": 361506, "epoch": 2151} {"train_loss": -12.327876091003418, "global_step": 361507, "epoch": 2151} {"train_loss": -12.278862953186035, "global_step": 361508, "epoch": 2151} {"train_loss": -12.307343482971191, "global_step": 361509, "epoch": 2151} {"train_loss": -12.405105590820312, "global_step": 361510, "epoch": 2151} {"train_loss": -12.547504425048828, "global_step": 361511, "epoch": 2151} {"train_loss": -12.314217567443848, "global_step": 361512, "epoch": 2151} {"train_loss": -12.446207046508789, "global_step": 361513, "epoch": 2151} {"train_loss": -12.498978614807129, "global_step": 361514, "epoch": 2151} {"train_loss": -12.386796951293945, "global_step": 361515, "epoch": 2151} {"train_loss": -12.491303443908691, "global_step": 361516, "epoch": 2151} {"train_loss": -12.564291000366211, "global_step": 361517, "epoch": 2151} {"train_loss": -12.305624008178711, "global_step": 361518, "epoch": 2151} {"train_loss": -12.526836395263672, "global_step": 361519, "epoch": 2151} {"train_loss": -12.526426315307617, "global_step": 361520, "epoch": 2151} {"train_loss": -12.341264724731445, "global_step": 361521, "epoch": 2151} {"train_loss": -12.38656997680664, "global_step": 361522, "epoch": 2151} {"train_loss": -12.41111946105957, "global_step": 361523, "epoch": 2151} {"train_loss": -12.63245677947998, "global_step": 361524, "epoch": 2151} {"train_loss": -12.5423583984375, "global_step": 361525, "epoch": 2151} {"train_loss": -12.628952026367188, "global_step": 361526, "epoch": 2151} {"train_loss": -12.49459457397461, "global_step": 361527, "epoch": 2151} {"train_loss": -12.464263916015625, "global_step": 361528, "epoch": 2151} {"train_loss": -12.48234748840332, "global_step": 361529, "epoch": 2151} {"train_loss": -12.725166320800781, "global_step": 361530, "epoch": 2151} {"train_loss": -12.757325172424316, "global_step": 361531, "epoch": 2151} {"train_loss": -12.51810359954834, "global_step": 361532, "epoch": 2151} {"train_loss": -12.632135391235352, "global_step": 361533, "epoch": 2151} {"train_loss": -12.350708961486816, "global_step": 361534, "epoch": 2151} {"train_loss": -11.878952162606376, "global_step": 361535, "epoch": 2151, "val_loss": 293062.15625} {"train_loss": -12.616382598876953, "global_step": 361536, "epoch": 2152} {"train_loss": -12.655837059020996, "global_step": 361537, "epoch": 2152} {"train_loss": -12.71695613861084, "global_step": 361538, "epoch": 2152} {"train_loss": -12.601125717163086, "global_step": 361539, "epoch": 2152} {"train_loss": -12.462299346923828, "global_step": 361540, "epoch": 2152} {"train_loss": -11.760805130004883, "global_step": 361541, "epoch": 2152} {"train_loss": -12.697361946105957, "global_step": 361542, "epoch": 2152} {"train_loss": -12.217044830322266, "global_step": 361543, "epoch": 2152} {"train_loss": -11.712186813354492, "global_step": 361544, "epoch": 2152} {"train_loss": -12.218729972839355, "global_step": 361545, "epoch": 2152} {"train_loss": -12.624327659606934, "global_step": 361546, "epoch": 2152} {"train_loss": -12.229565620422363, "global_step": 361547, "epoch": 2152} {"train_loss": -12.403244972229004, "global_step": 361548, "epoch": 2152} {"train_loss": -12.64489459991455, "global_step": 361549, "epoch": 2152} {"train_loss": -11.984479904174805, "global_step": 361550, "epoch": 2152} {"train_loss": -12.743728637695312, "global_step": 361551, "epoch": 2152} {"train_loss": -12.221877098083496, "global_step": 361552, "epoch": 2152} {"train_loss": -12.609075546264648, "global_step": 361553, "epoch": 2152} {"train_loss": -12.518492698669434, "global_step": 361554, "epoch": 2152} {"train_loss": -12.64571762084961, "global_step": 361555, "epoch": 2152} {"train_loss": -12.254478454589844, "global_step": 361556, "epoch": 2152} {"train_loss": -12.797150611877441, "global_step": 361557, "epoch": 2152} {"train_loss": -12.454925537109375, "global_step": 361558, "epoch": 2152} {"train_loss": -12.809196472167969, "global_step": 361559, "epoch": 2152} {"train_loss": -12.402740478515625, "global_step": 361560, "epoch": 2152} {"train_loss": -12.231624603271484, "global_step": 361561, "epoch": 2152} {"train_loss": -12.460134506225586, "global_step": 361562, "epoch": 2152} {"train_loss": -12.48351001739502, "global_step": 361563, "epoch": 2152} {"train_loss": -12.305656433105469, "global_step": 361564, "epoch": 2152} {"train_loss": -11.99937629699707, "global_step": 361565, "epoch": 2152} {"train_loss": -12.455192565917969, "global_step": 361566, "epoch": 2152} {"train_loss": -12.54588508605957, "global_step": 361567, "epoch": 2152} {"train_loss": -12.323253631591797, "global_step": 361568, "epoch": 2152} {"train_loss": -12.345539093017578, "global_step": 361569, "epoch": 2152} {"train_loss": -12.178858757019043, "global_step": 361570, "epoch": 2152} {"train_loss": -12.537660598754883, "global_step": 361571, "epoch": 2152} {"train_loss": -12.345972061157227, "global_step": 361572, "epoch": 2152} {"train_loss": -11.293295860290527, "global_step": 361573, "epoch": 2152} {"train_loss": -10.971059799194336, "global_step": 361574, "epoch": 2152} {"train_loss": -12.618727684020996, "global_step": 361575, "epoch": 2152} {"train_loss": -11.064680099487305, "global_step": 361576, "epoch": 2152} {"train_loss": -11.793071746826172, "global_step": 361577, "epoch": 2152} {"train_loss": -10.763046264648438, "global_step": 361578, "epoch": 2152} {"train_loss": -11.357930183410645, "global_step": 361579, "epoch": 2152} {"train_loss": -11.440530776977539, "global_step": 361580, "epoch": 2152} {"train_loss": -12.025962829589844, "global_step": 361581, "epoch": 2152} {"train_loss": -11.52527904510498, "global_step": 361582, "epoch": 2152} {"train_loss": -11.63542366027832, "global_step": 361583, "epoch": 2152} {"train_loss": -11.29791259765625, "global_step": 361584, "epoch": 2152} {"train_loss": -12.11981201171875, "global_step": 361585, "epoch": 2152} {"train_loss": -12.119860649108887, "global_step": 361586, "epoch": 2152} {"train_loss": -11.746903419494629, "global_step": 361587, "epoch": 2152} {"train_loss": -11.122690200805664, "global_step": 361588, "epoch": 2152} {"train_loss": -10.810250282287598, "global_step": 361589, "epoch": 2152} {"train_loss": -11.250325202941895, "global_step": 361590, "epoch": 2152} {"train_loss": -11.030241012573242, "global_step": 361591, "epoch": 2152} {"train_loss": -11.817066192626953, "global_step": 361592, "epoch": 2152} {"train_loss": -10.564325332641602, "global_step": 361593, "epoch": 2152} {"train_loss": -10.037479400634766, "global_step": 361594, "epoch": 2152} {"train_loss": -9.27946662902832, "global_step": 361595, "epoch": 2152} {"train_loss": -11.129932403564453, "global_step": 361596, "epoch": 2152} {"train_loss": -10.32913589477539, "global_step": 361597, "epoch": 2152} {"train_loss": -10.40329360961914, "global_step": 361598, "epoch": 2152} {"train_loss": -10.294477462768555, "global_step": 361599, "epoch": 2152} {"train_loss": -10.136537551879883, "global_step": 361600, "epoch": 2152} {"train_loss": -10.021408081054688, "global_step": 361601, "epoch": 2152} {"train_loss": -10.490121841430664, "global_step": 361602, "epoch": 2152} {"train_loss": -11.009465217590332, "global_step": 361603, "epoch": 2152} {"train_loss": -10.034214973449707, "global_step": 361604, "epoch": 2152} {"train_loss": -11.683722496032715, "global_step": 361605, "epoch": 2152} {"train_loss": -10.70150089263916, "global_step": 361606, "epoch": 2152} {"train_loss": -11.968707084655762, "global_step": 361607, "epoch": 2152} {"train_loss": -11.458694458007812, "global_step": 361608, "epoch": 2152} {"train_loss": -11.828632354736328, "global_step": 361609, "epoch": 2152} {"train_loss": -11.732398986816406, "global_step": 361610, "epoch": 2152} {"train_loss": -11.578510284423828, "global_step": 361611, "epoch": 2152} {"train_loss": -11.904365539550781, "global_step": 361612, "epoch": 2152} {"train_loss": -11.680314064025879, "global_step": 361613, "epoch": 2152} {"train_loss": -12.215421676635742, "global_step": 361614, "epoch": 2152} {"train_loss": -12.148558616638184, "global_step": 361615, "epoch": 2152} {"train_loss": -11.908096313476562, "global_step": 361616, "epoch": 2152} {"train_loss": -12.162528038024902, "global_step": 361617, "epoch": 2152} {"train_loss": -12.130191802978516, "global_step": 361618, "epoch": 2152} {"train_loss": -12.141823768615723, "global_step": 361619, "epoch": 2152} {"train_loss": -12.163129806518555, "global_step": 361620, "epoch": 2152} {"train_loss": -12.239673614501953, "global_step": 361621, "epoch": 2152} {"train_loss": -12.249181747436523, "global_step": 361622, "epoch": 2152} {"train_loss": -12.236237525939941, "global_step": 361623, "epoch": 2152} {"train_loss": -12.183809280395508, "global_step": 361624, "epoch": 2152} {"train_loss": -12.112161636352539, "global_step": 361625, "epoch": 2152} {"train_loss": -12.170641899108887, "global_step": 361626, "epoch": 2152} {"train_loss": -12.114715576171875, "global_step": 361627, "epoch": 2152} {"train_loss": -12.116951942443848, "global_step": 361628, "epoch": 2152} {"train_loss": -12.066736221313477, "global_step": 361629, "epoch": 2152} {"train_loss": -12.448482513427734, "global_step": 361630, "epoch": 2152} {"train_loss": -12.38491439819336, "global_step": 361631, "epoch": 2152} {"train_loss": -11.951370239257812, "global_step": 361632, "epoch": 2152} {"train_loss": -12.022958755493164, "global_step": 361633, "epoch": 2152} {"train_loss": -11.796272277832031, "global_step": 361634, "epoch": 2152} {"train_loss": -12.213205337524414, "global_step": 361635, "epoch": 2152} {"train_loss": -11.887547492980957, "global_step": 361636, "epoch": 2152} {"train_loss": -12.134946823120117, "global_step": 361637, "epoch": 2152} {"train_loss": -11.848953247070312, "global_step": 361638, "epoch": 2152} {"train_loss": -12.121707916259766, "global_step": 361639, "epoch": 2152} {"train_loss": -12.291289329528809, "global_step": 361640, "epoch": 2152} {"train_loss": -12.238043785095215, "global_step": 361641, "epoch": 2152} {"train_loss": -12.253406524658203, "global_step": 361642, "epoch": 2152} {"train_loss": -12.494481086730957, "global_step": 361643, "epoch": 2152} {"train_loss": -12.479015350341797, "global_step": 361644, "epoch": 2152} {"train_loss": -12.313362121582031, "global_step": 361645, "epoch": 2152} {"train_loss": -12.375249862670898, "global_step": 361646, "epoch": 2152} {"train_loss": -12.479671478271484, "global_step": 361647, "epoch": 2152} {"train_loss": -12.311043739318848, "global_step": 361648, "epoch": 2152} {"train_loss": -12.59235954284668, "global_step": 361649, "epoch": 2152} {"train_loss": -12.360570907592773, "global_step": 361650, "epoch": 2152} {"train_loss": -12.704740524291992, "global_step": 361651, "epoch": 2152} {"train_loss": -12.542410850524902, "global_step": 361652, "epoch": 2152} {"train_loss": -12.47314453125, "global_step": 361653, "epoch": 2152} {"train_loss": -12.578592300415039, "global_step": 361654, "epoch": 2152} {"train_loss": -12.477836608886719, "global_step": 361655, "epoch": 2152} {"train_loss": -12.625771522521973, "global_step": 361656, "epoch": 2152} {"train_loss": -12.47431468963623, "global_step": 361657, "epoch": 2152} {"train_loss": -12.627908706665039, "global_step": 361658, "epoch": 2152} {"train_loss": -12.699638366699219, "global_step": 361659, "epoch": 2152} {"train_loss": -12.647370338439941, "global_step": 361660, "epoch": 2152} {"train_loss": -12.629190444946289, "global_step": 361661, "epoch": 2152} {"train_loss": -12.627525329589844, "global_step": 361662, "epoch": 2152} {"train_loss": -12.427949905395508, "global_step": 361663, "epoch": 2152} {"train_loss": -12.530672073364258, "global_step": 361664, "epoch": 2152} {"train_loss": -12.422266006469727, "global_step": 361665, "epoch": 2152} {"train_loss": -12.499513626098633, "global_step": 361666, "epoch": 2152} {"train_loss": -12.635180473327637, "global_step": 361667, "epoch": 2152} {"train_loss": -12.653030395507812, "global_step": 361668, "epoch": 2152} {"train_loss": -12.754684448242188, "global_step": 361669, "epoch": 2152} {"train_loss": -12.357856750488281, "global_step": 361670, "epoch": 2152} {"train_loss": -12.648310661315918, "global_step": 361671, "epoch": 2152} {"train_loss": -12.490568161010742, "global_step": 361672, "epoch": 2152} {"train_loss": -12.616549491882324, "global_step": 361673, "epoch": 2152} {"train_loss": -12.675858497619629, "global_step": 361674, "epoch": 2152} {"train_loss": -12.70941162109375, "global_step": 361675, "epoch": 2152} {"train_loss": -12.750934600830078, "global_step": 361676, "epoch": 2152} {"train_loss": -12.70671272277832, "global_step": 361677, "epoch": 2152} {"train_loss": -12.453662872314453, "global_step": 361678, "epoch": 2152} {"train_loss": -12.391569137573242, "global_step": 361679, "epoch": 2152} {"train_loss": -12.554033279418945, "global_step": 361680, "epoch": 2152} {"train_loss": -12.470346450805664, "global_step": 361681, "epoch": 2152} {"train_loss": -12.467726707458496, "global_step": 361682, "epoch": 2152} {"train_loss": -12.345914840698242, "global_step": 361683, "epoch": 2152} {"train_loss": -12.439983367919922, "global_step": 361684, "epoch": 2152} {"train_loss": -12.528200149536133, "global_step": 361685, "epoch": 2152} {"train_loss": -12.14113998413086, "global_step": 361686, "epoch": 2152} {"train_loss": -11.44254207611084, "global_step": 361687, "epoch": 2152} {"train_loss": -11.71371841430664, "global_step": 361688, "epoch": 2152} {"train_loss": -11.668249130249023, "global_step": 361689, "epoch": 2152} {"train_loss": -12.206811904907227, "global_step": 361690, "epoch": 2152} {"train_loss": -12.599719047546387, "global_step": 361691, "epoch": 2152} {"train_loss": -12.038914680480957, "global_step": 361692, "epoch": 2152} {"train_loss": -12.40037727355957, "global_step": 361693, "epoch": 2152} {"train_loss": -11.909210205078125, "global_step": 361694, "epoch": 2152} {"train_loss": -12.134257316589355, "global_step": 361695, "epoch": 2152} {"train_loss": -12.028642654418945, "global_step": 361696, "epoch": 2152} {"train_loss": -11.653453826904297, "global_step": 361697, "epoch": 2152} {"train_loss": -11.848424911499023, "global_step": 361698, "epoch": 2152} {"train_loss": -11.513664245605469, "global_step": 361699, "epoch": 2152} {"train_loss": -11.909908294677734, "global_step": 361700, "epoch": 2152} {"train_loss": -12.303509712219238, "global_step": 361701, "epoch": 2152} {"train_loss": -11.949396133422852, "global_step": 361702, "epoch": 2152} {"train_loss": -12.038247818038577, "global_step": 361703, "epoch": 2152, "val_loss": 288830.90625} {"train_loss": -11.657862663269043, "global_step": 361704, "epoch": 2153} {"train_loss": -11.880887031555176, "global_step": 361705, "epoch": 2153} {"train_loss": -10.903396606445312, "global_step": 361706, "epoch": 2153} {"train_loss": -11.38043212890625, "global_step": 361707, "epoch": 2153} {"train_loss": -11.319366455078125, "global_step": 361708, "epoch": 2153} {"train_loss": -11.070894241333008, "global_step": 361709, "epoch": 2153} {"train_loss": -11.71310043334961, "global_step": 361710, "epoch": 2153} {"train_loss": -12.062262535095215, "global_step": 361711, "epoch": 2153} {"train_loss": -11.16118049621582, "global_step": 361712, "epoch": 2153} {"train_loss": -11.24678897857666, "global_step": 361713, "epoch": 2153} {"train_loss": -12.266959190368652, "global_step": 361714, "epoch": 2153} {"train_loss": -11.210622787475586, "global_step": 361715, "epoch": 2153} {"train_loss": -11.211790084838867, "global_step": 361716, "epoch": 2153} {"train_loss": -11.09428596496582, "global_step": 361717, "epoch": 2153} {"train_loss": -11.549805641174316, "global_step": 361718, "epoch": 2153} {"train_loss": -11.39583969116211, "global_step": 361719, "epoch": 2153} {"train_loss": -12.337254524230957, "global_step": 361720, "epoch": 2153} {"train_loss": -11.655557632446289, "global_step": 361721, "epoch": 2153} {"train_loss": -12.177694320678711, "global_step": 361722, "epoch": 2153} {"train_loss": -11.943075180053711, "global_step": 361723, "epoch": 2153} {"train_loss": -12.411832809448242, "global_step": 361724, "epoch": 2153} {"train_loss": -11.95907974243164, "global_step": 361725, "epoch": 2153} {"train_loss": -12.247414588928223, "global_step": 361726, "epoch": 2153} {"train_loss": -11.755668640136719, "global_step": 361727, "epoch": 2153} {"train_loss": -12.259332656860352, "global_step": 361728, "epoch": 2153} {"train_loss": -11.657181739807129, "global_step": 361729, "epoch": 2153} {"train_loss": -11.321069717407227, "global_step": 361730, "epoch": 2153} {"train_loss": -11.35085678100586, "global_step": 361731, "epoch": 2153} {"train_loss": -11.27177619934082, "global_step": 361732, "epoch": 2153} {"train_loss": -11.361801147460938, "global_step": 361733, "epoch": 2153} {"train_loss": -12.199706077575684, "global_step": 361734, "epoch": 2153} {"train_loss": -11.745888710021973, "global_step": 361735, "epoch": 2153} {"train_loss": -12.185102462768555, "global_step": 361736, "epoch": 2153} {"train_loss": -12.275613784790039, "global_step": 361737, "epoch": 2153} {"train_loss": -11.89223575592041, "global_step": 361738, "epoch": 2153} {"train_loss": -12.406736373901367, "global_step": 361739, "epoch": 2153} {"train_loss": -12.094184875488281, "global_step": 361740, "epoch": 2153} {"train_loss": -12.339644432067871, "global_step": 361741, "epoch": 2153} {"train_loss": -12.636890411376953, "global_step": 361742, "epoch": 2153} {"train_loss": -12.248361587524414, "global_step": 361743, "epoch": 2153} {"train_loss": -12.535372734069824, "global_step": 361744, "epoch": 2153} {"train_loss": -12.225702285766602, "global_step": 361745, "epoch": 2153} {"train_loss": -12.357345581054688, "global_step": 361746, "epoch": 2153} {"train_loss": -12.25486946105957, "global_step": 361747, "epoch": 2153} {"train_loss": -12.381032943725586, "global_step": 361748, "epoch": 2153} {"train_loss": -12.219850540161133, "global_step": 361749, "epoch": 2153} {"train_loss": -12.493029594421387, "global_step": 361750, "epoch": 2153} {"train_loss": -12.43470287322998, "global_step": 361751, "epoch": 2153} {"train_loss": -12.381802558898926, "global_step": 361752, "epoch": 2153} {"train_loss": -12.207267761230469, "global_step": 361753, "epoch": 2153} {"train_loss": -12.419130325317383, "global_step": 361754, "epoch": 2153} {"train_loss": -12.325545310974121, "global_step": 361755, "epoch": 2153} {"train_loss": -12.121429443359375, "global_step": 361756, "epoch": 2153} {"train_loss": -12.415130615234375, "global_step": 361757, "epoch": 2153} {"train_loss": -12.39266586303711, "global_step": 361758, "epoch": 2153} {"train_loss": -12.231435775756836, "global_step": 361759, "epoch": 2153} {"train_loss": -11.953741073608398, "global_step": 361760, "epoch": 2153} {"train_loss": -12.294523239135742, "global_step": 361761, "epoch": 2153} {"train_loss": -11.866408348083496, "global_step": 361762, "epoch": 2153} {"train_loss": -12.527486801147461, "global_step": 361763, "epoch": 2153} {"train_loss": -11.725056648254395, "global_step": 361764, "epoch": 2153} {"train_loss": -12.527200698852539, "global_step": 361765, "epoch": 2153} {"train_loss": -12.279090881347656, "global_step": 361766, "epoch": 2153} {"train_loss": -12.634449005126953, "global_step": 361767, "epoch": 2153} {"train_loss": -12.111228942871094, "global_step": 361768, "epoch": 2153} {"train_loss": -12.551867485046387, "global_step": 361769, "epoch": 2153} {"train_loss": -12.173883438110352, "global_step": 361770, "epoch": 2153} {"train_loss": -12.512960433959961, "global_step": 361771, "epoch": 2153} {"train_loss": -12.40544319152832, "global_step": 361772, "epoch": 2153} {"train_loss": -12.496618270874023, "global_step": 361773, "epoch": 2153} {"train_loss": -12.323060989379883, "global_step": 361774, "epoch": 2153} {"train_loss": -12.369234085083008, "global_step": 361775, "epoch": 2153} {"train_loss": -12.208581924438477, "global_step": 361776, "epoch": 2153} {"train_loss": -12.431870460510254, "global_step": 361777, "epoch": 2153} {"train_loss": -12.69235610961914, "global_step": 361778, "epoch": 2153} {"train_loss": -12.377811431884766, "global_step": 361779, "epoch": 2153} {"train_loss": -12.650419235229492, "global_step": 361780, "epoch": 2153} {"train_loss": -12.340274810791016, "global_step": 361781, "epoch": 2153} {"train_loss": -12.386690139770508, "global_step": 361782, "epoch": 2153} {"train_loss": -12.169797897338867, "global_step": 361783, "epoch": 2153} {"train_loss": -12.683846473693848, "global_step": 361784, "epoch": 2153} {"train_loss": -11.99250602722168, "global_step": 361785, "epoch": 2153} {"train_loss": -12.527589797973633, "global_step": 361786, "epoch": 2153} {"train_loss": -12.687664031982422, "global_step": 361787, "epoch": 2153} {"train_loss": -11.980947494506836, "global_step": 361788, "epoch": 2153} {"train_loss": -12.087564468383789, "global_step": 361789, "epoch": 2153} {"train_loss": -12.01336669921875, "global_step": 361790, "epoch": 2153} {"train_loss": -12.106464385986328, "global_step": 361791, "epoch": 2153} {"train_loss": -11.928155899047852, "global_step": 361792, "epoch": 2153} {"train_loss": -12.42036247253418, "global_step": 361793, "epoch": 2153} {"train_loss": -12.076630592346191, "global_step": 361794, "epoch": 2153} {"train_loss": -12.330097198486328, "global_step": 361795, "epoch": 2153} {"train_loss": -11.962690353393555, "global_step": 361796, "epoch": 2153} {"train_loss": -11.98862075805664, "global_step": 361797, "epoch": 2153} {"train_loss": -12.520162582397461, "global_step": 361798, "epoch": 2153} {"train_loss": -12.405147552490234, "global_step": 361799, "epoch": 2153} {"train_loss": -12.382030487060547, "global_step": 361800, "epoch": 2153} {"train_loss": -12.117547035217285, "global_step": 361801, "epoch": 2153} {"train_loss": -12.265283584594727, "global_step": 361802, "epoch": 2153} {"train_loss": -12.191743850708008, "global_step": 361803, "epoch": 2153} {"train_loss": -12.299381256103516, "global_step": 361804, "epoch": 2153} {"train_loss": -12.5845947265625, "global_step": 361805, "epoch": 2153} {"train_loss": -12.162402153015137, "global_step": 361806, "epoch": 2153} {"train_loss": -11.806717872619629, "global_step": 361807, "epoch": 2153} {"train_loss": -12.224369049072266, "global_step": 361808, "epoch": 2153} {"train_loss": -12.572732925415039, "global_step": 361809, "epoch": 2153} {"train_loss": -12.035635948181152, "global_step": 361810, "epoch": 2153} {"train_loss": -12.347463607788086, "global_step": 361811, "epoch": 2153} {"train_loss": -12.20423698425293, "global_step": 361812, "epoch": 2153} {"train_loss": -12.109451293945312, "global_step": 361813, "epoch": 2153} {"train_loss": -12.124626159667969, "global_step": 361814, "epoch": 2153} {"train_loss": -12.4518461227417, "global_step": 361815, "epoch": 2153} {"train_loss": -12.18599796295166, "global_step": 361816, "epoch": 2153} {"train_loss": -11.757497787475586, "global_step": 361817, "epoch": 2153} {"train_loss": -12.286054611206055, "global_step": 361818, "epoch": 2153} {"train_loss": -12.282393455505371, "global_step": 361819, "epoch": 2153} {"train_loss": -12.345864295959473, "global_step": 361820, "epoch": 2153} {"train_loss": -12.640251159667969, "global_step": 361821, "epoch": 2153} {"train_loss": -12.581132888793945, "global_step": 361822, "epoch": 2153} {"train_loss": -12.511236190795898, "global_step": 361823, "epoch": 2153} {"train_loss": -12.612743377685547, "global_step": 361824, "epoch": 2153} {"train_loss": -12.318655014038086, "global_step": 361825, "epoch": 2153} {"train_loss": -12.462684631347656, "global_step": 361826, "epoch": 2153} {"train_loss": -12.478471755981445, "global_step": 361827, "epoch": 2153} {"train_loss": -12.538114547729492, "global_step": 361828, "epoch": 2153} {"train_loss": -12.525842666625977, "global_step": 361829, "epoch": 2153} {"train_loss": -12.355703353881836, "global_step": 361830, "epoch": 2153} {"train_loss": -11.948776245117188, "global_step": 361831, "epoch": 2153} {"train_loss": -12.16305923461914, "global_step": 361832, "epoch": 2153} {"train_loss": -11.745827674865723, "global_step": 361833, "epoch": 2153} {"train_loss": -12.524375915527344, "global_step": 361834, "epoch": 2153} {"train_loss": -12.313268661499023, "global_step": 361835, "epoch": 2153} {"train_loss": -11.878963470458984, "global_step": 361836, "epoch": 2153} {"train_loss": -12.138082504272461, "global_step": 361837, "epoch": 2153} {"train_loss": -11.370412826538086, "global_step": 361838, "epoch": 2153} {"train_loss": -9.644661903381348, "global_step": 361839, "epoch": 2153} {"train_loss": -11.749587059020996, "global_step": 361840, "epoch": 2153} {"train_loss": -11.181600570678711, "global_step": 361841, "epoch": 2153} {"train_loss": -11.16810417175293, "global_step": 361842, "epoch": 2153} {"train_loss": -12.0435791015625, "global_step": 361843, "epoch": 2153} {"train_loss": -10.868074417114258, "global_step": 361844, "epoch": 2153} {"train_loss": -11.535839080810547, "global_step": 361845, "epoch": 2153} {"train_loss": -10.706854820251465, "global_step": 361846, "epoch": 2153} {"train_loss": -12.471673965454102, "global_step": 361847, "epoch": 2153} {"train_loss": -11.207944869995117, "global_step": 361848, "epoch": 2153} {"train_loss": -11.906576156616211, "global_step": 361849, "epoch": 2153} {"train_loss": -11.588356018066406, "global_step": 361850, "epoch": 2153} {"train_loss": -12.379247665405273, "global_step": 361851, "epoch": 2153} {"train_loss": -11.632421493530273, "global_step": 361852, "epoch": 2153} {"train_loss": -12.015621185302734, "global_step": 361853, "epoch": 2153} {"train_loss": -11.602615356445312, "global_step": 361854, "epoch": 2153} {"train_loss": -11.942940711975098, "global_step": 361855, "epoch": 2153} {"train_loss": -11.924867630004883, "global_step": 361856, "epoch": 2153} {"train_loss": -11.940227508544922, "global_step": 361857, "epoch": 2153} {"train_loss": -12.304666519165039, "global_step": 361858, "epoch": 2153} {"train_loss": -12.192063331604004, "global_step": 361859, "epoch": 2153} {"train_loss": -11.948155403137207, "global_step": 361860, "epoch": 2153} {"train_loss": -11.769768714904785, "global_step": 361861, "epoch": 2153} {"train_loss": -11.74334716796875, "global_step": 361862, "epoch": 2153} {"train_loss": -11.965827941894531, "global_step": 361863, "epoch": 2153} {"train_loss": -11.67501449584961, "global_step": 361864, "epoch": 2153} {"train_loss": -11.971221923828125, "global_step": 361865, "epoch": 2153} {"train_loss": -11.855997085571289, "global_step": 361866, "epoch": 2153} {"train_loss": -11.674163818359375, "global_step": 361867, "epoch": 2153} {"train_loss": -11.872659683227539, "global_step": 361868, "epoch": 2153} {"train_loss": -11.55949878692627, "global_step": 361869, "epoch": 2153} {"train_loss": -11.557332992553711, "global_step": 361870, "epoch": 2153} {"train_loss": -12.041937583968753, "global_step": 361871, "epoch": 2153, "val_loss": 291791.375} {"train_loss": -10.339597702026367, "global_step": 361872, "epoch": 2154} {"train_loss": -11.213468551635742, "global_step": 361873, "epoch": 2154} {"train_loss": -10.611709594726562, "global_step": 361874, "epoch": 2154} {"train_loss": -9.616480827331543, "global_step": 361875, "epoch": 2154} {"train_loss": -9.259587287902832, "global_step": 361876, "epoch": 2154} {"train_loss": -10.320849418640137, "global_step": 361877, "epoch": 2154} {"train_loss": -10.877283096313477, "global_step": 361878, "epoch": 2154} {"train_loss": -10.022564888000488, "global_step": 361879, "epoch": 2154} {"train_loss": -10.370401382446289, "global_step": 361880, "epoch": 2154} {"train_loss": -11.739208221435547, "global_step": 361881, "epoch": 2154} {"train_loss": -11.199201583862305, "global_step": 361882, "epoch": 2154} {"train_loss": -11.500247955322266, "global_step": 361883, "epoch": 2154} {"train_loss": -10.907903671264648, "global_step": 361884, "epoch": 2154} {"train_loss": -11.375978469848633, "global_step": 361885, "epoch": 2154} {"train_loss": -11.332481384277344, "global_step": 361886, "epoch": 2154} {"train_loss": -10.601801872253418, "global_step": 361887, "epoch": 2154} {"train_loss": -11.43503189086914, "global_step": 361888, "epoch": 2154} {"train_loss": -11.400181770324707, "global_step": 361889, "epoch": 2154} {"train_loss": -10.535398483276367, "global_step": 361890, "epoch": 2154} {"train_loss": -11.581647872924805, "global_step": 361891, "epoch": 2154} {"train_loss": -11.320428848266602, "global_step": 361892, "epoch": 2154} {"train_loss": -11.246672630310059, "global_step": 361893, "epoch": 2154} {"train_loss": -11.853212356567383, "global_step": 361894, "epoch": 2154} {"train_loss": -10.814672470092773, "global_step": 361895, "epoch": 2154} {"train_loss": -12.152450561523438, "global_step": 361896, "epoch": 2154} {"train_loss": -10.670804977416992, "global_step": 361897, "epoch": 2154} {"train_loss": -11.848959922790527, "global_step": 361898, "epoch": 2154} {"train_loss": -11.008001327514648, "global_step": 361899, "epoch": 2154} {"train_loss": -11.916458129882812, "global_step": 361900, "epoch": 2154} {"train_loss": -11.5414457321167, "global_step": 361901, "epoch": 2154} {"train_loss": -11.771395683288574, "global_step": 361902, "epoch": 2154} {"train_loss": -11.581007957458496, "global_step": 361903, "epoch": 2154} {"train_loss": -11.840372085571289, "global_step": 361904, "epoch": 2154} {"train_loss": -11.752143859863281, "global_step": 361905, "epoch": 2154} {"train_loss": -11.991167068481445, "global_step": 361906, "epoch": 2154} {"train_loss": -11.862337112426758, "global_step": 361907, "epoch": 2154} {"train_loss": -11.919540405273438, "global_step": 361908, "epoch": 2154} {"train_loss": -12.102128028869629, "global_step": 361909, "epoch": 2154} {"train_loss": -11.928644180297852, "global_step": 361910, "epoch": 2154} {"train_loss": -12.153523445129395, "global_step": 361911, "epoch": 2154} {"train_loss": -11.772189140319824, "global_step": 361912, "epoch": 2154} {"train_loss": -12.190287590026855, "global_step": 361913, "epoch": 2154} {"train_loss": -11.69393253326416, "global_step": 361914, "epoch": 2154} {"train_loss": -12.257301330566406, "global_step": 361915, "epoch": 2154} {"train_loss": -11.947638511657715, "global_step": 361916, "epoch": 2154} {"train_loss": -11.963554382324219, "global_step": 361917, "epoch": 2154} {"train_loss": -12.20468521118164, "global_step": 361918, "epoch": 2154} {"train_loss": -11.967374801635742, "global_step": 361919, "epoch": 2154} {"train_loss": -12.163393020629883, "global_step": 361920, "epoch": 2154} {"train_loss": -11.776874542236328, "global_step": 361921, "epoch": 2154} {"train_loss": -12.392627716064453, "global_step": 361922, "epoch": 2154} {"train_loss": -11.63606071472168, "global_step": 361923, "epoch": 2154} {"train_loss": -12.076889038085938, "global_step": 361924, "epoch": 2154} {"train_loss": -12.118913650512695, "global_step": 361925, "epoch": 2154} {"train_loss": -11.691912651062012, "global_step": 361926, "epoch": 2154} {"train_loss": -12.325506210327148, "global_step": 361927, "epoch": 2154} {"train_loss": -11.96939754486084, "global_step": 361928, "epoch": 2154} {"train_loss": -12.366859436035156, "global_step": 361929, "epoch": 2154} {"train_loss": -11.868839263916016, "global_step": 361930, "epoch": 2154} {"train_loss": -12.409669876098633, "global_step": 361931, "epoch": 2154} {"train_loss": -12.244121551513672, "global_step": 361932, "epoch": 2154} {"train_loss": -12.382801055908203, "global_step": 361933, "epoch": 2154} {"train_loss": -12.334104537963867, "global_step": 361934, "epoch": 2154} {"train_loss": -12.318416595458984, "global_step": 361935, "epoch": 2154} {"train_loss": -12.263328552246094, "global_step": 361936, "epoch": 2154} {"train_loss": -12.278761863708496, "global_step": 361937, "epoch": 2154} {"train_loss": -12.395885467529297, "global_step": 361938, "epoch": 2154} {"train_loss": -12.57849407196045, "global_step": 361939, "epoch": 2154} {"train_loss": -12.206327438354492, "global_step": 361940, "epoch": 2154} {"train_loss": -12.323644638061523, "global_step": 361941, "epoch": 2154} {"train_loss": -12.520402908325195, "global_step": 361942, "epoch": 2154} {"train_loss": -12.186147689819336, "global_step": 361943, "epoch": 2154} {"train_loss": -12.230670928955078, "global_step": 361944, "epoch": 2154} {"train_loss": -12.473312377929688, "global_step": 361945, "epoch": 2154} {"train_loss": -12.530231475830078, "global_step": 361946, "epoch": 2154} {"train_loss": -12.45404052734375, "global_step": 361947, "epoch": 2154} {"train_loss": -12.523067474365234, "global_step": 361948, "epoch": 2154} {"train_loss": -12.42832088470459, "global_step": 361949, "epoch": 2154} {"train_loss": -12.580501556396484, "global_step": 361950, "epoch": 2154} {"train_loss": -12.489736557006836, "global_step": 361951, "epoch": 2154} {"train_loss": -12.658658981323242, "global_step": 361952, "epoch": 2154} {"train_loss": -12.250368118286133, "global_step": 361953, "epoch": 2154} {"train_loss": -12.602638244628906, "global_step": 361954, "epoch": 2154} {"train_loss": -12.56866455078125, "global_step": 361955, "epoch": 2154} {"train_loss": -12.479997634887695, "global_step": 361956, "epoch": 2154} {"train_loss": -12.476900100708008, "global_step": 361957, "epoch": 2154} {"train_loss": -12.525564193725586, "global_step": 361958, "epoch": 2154} {"train_loss": -12.650259017944336, "global_step": 361959, "epoch": 2154} {"train_loss": -12.635747909545898, "global_step": 361960, "epoch": 2154} {"train_loss": -12.42973804473877, "global_step": 361961, "epoch": 2154} {"train_loss": -12.631255149841309, "global_step": 361962, "epoch": 2154} {"train_loss": -12.63650131225586, "global_step": 361963, "epoch": 2154} {"train_loss": -12.829899787902832, "global_step": 361964, "epoch": 2154} {"train_loss": -12.73659610748291, "global_step": 361965, "epoch": 2154} {"train_loss": -12.642902374267578, "global_step": 361966, "epoch": 2154} {"train_loss": -12.658966064453125, "global_step": 361967, "epoch": 2154} {"train_loss": -12.754627227783203, "global_step": 361968, "epoch": 2154} {"train_loss": -12.396817207336426, "global_step": 361969, "epoch": 2154} {"train_loss": -12.576199531555176, "global_step": 361970, "epoch": 2154} {"train_loss": -12.611632347106934, "global_step": 361971, "epoch": 2154} {"train_loss": -12.385395050048828, "global_step": 361972, "epoch": 2154} {"train_loss": -12.260217666625977, "global_step": 361973, "epoch": 2154} {"train_loss": -12.651763916015625, "global_step": 361974, "epoch": 2154} {"train_loss": -12.29725456237793, "global_step": 361975, "epoch": 2154} {"train_loss": -12.359086990356445, "global_step": 361976, "epoch": 2154} {"train_loss": -12.365060806274414, "global_step": 361977, "epoch": 2154} {"train_loss": -12.520119667053223, "global_step": 361978, "epoch": 2154} {"train_loss": -12.647542953491211, "global_step": 361979, "epoch": 2154} {"train_loss": -12.740304946899414, "global_step": 361980, "epoch": 2154} {"train_loss": -12.4193696975708, "global_step": 361981, "epoch": 2154} {"train_loss": -12.518745422363281, "global_step": 361982, "epoch": 2154} {"train_loss": -12.659488677978516, "global_step": 361983, "epoch": 2154} {"train_loss": -12.906332015991211, "global_step": 361984, "epoch": 2154} {"train_loss": -12.800477981567383, "global_step": 361985, "epoch": 2154} {"train_loss": -12.250650405883789, "global_step": 361986, "epoch": 2154} {"train_loss": -12.602855682373047, "global_step": 361987, "epoch": 2154} {"train_loss": -12.529654502868652, "global_step": 361988, "epoch": 2154} {"train_loss": -12.583263397216797, "global_step": 361989, "epoch": 2154} {"train_loss": -12.739517211914062, "global_step": 361990, "epoch": 2154} {"train_loss": -11.666946411132812, "global_step": 361991, "epoch": 2154} {"train_loss": -11.787278175354004, "global_step": 361992, "epoch": 2154} {"train_loss": -11.90256118774414, "global_step": 361993, "epoch": 2154} {"train_loss": -12.495086669921875, "global_step": 361994, "epoch": 2154} {"train_loss": -11.73410415649414, "global_step": 361995, "epoch": 2154} {"train_loss": -9.851700782775879, "global_step": 361996, "epoch": 2154} {"train_loss": -10.648360252380371, "global_step": 361997, "epoch": 2154} {"train_loss": -12.284149169921875, "global_step": 361998, "epoch": 2154} {"train_loss": -9.910396575927734, "global_step": 361999, "epoch": 2154} {"train_loss": -10.143989562988281, "global_step": 362000, "epoch": 2154} {"train_loss": -9.026556015014648, "global_step": 362001, "epoch": 2154} {"train_loss": -10.157819747924805, "global_step": 362002, "epoch": 2154} {"train_loss": -6.957483291625977, "global_step": 362003, "epoch": 2154} {"train_loss": -9.565299034118652, "global_step": 362004, "epoch": 2154} {"train_loss": -6.718761444091797, "global_step": 362005, "epoch": 2154} {"train_loss": -5.009703636169434, "global_step": 362006, "epoch": 2154} {"train_loss": -5.039491176605225, "global_step": 362007, "epoch": 2154} {"train_loss": -5.421426773071289, "global_step": 362008, "epoch": 2154} {"train_loss": -5.048095226287842, "global_step": 362009, "epoch": 2154} {"train_loss": -5.315794944763184, "global_step": 362010, "epoch": 2154} {"train_loss": -5.779982566833496, "global_step": 362011, "epoch": 2154} {"train_loss": -5.299867630004883, "global_step": 362012, "epoch": 2154} {"train_loss": -5.24070405960083, "global_step": 362013, "epoch": 2154} {"train_loss": -5.501434326171875, "global_step": 362014, "epoch": 2154} {"train_loss": -5.66051721572876, "global_step": 362015, "epoch": 2154} {"train_loss": -5.346048355102539, "global_step": 362016, "epoch": 2154} {"train_loss": -5.669895172119141, "global_step": 362017, "epoch": 2154} {"train_loss": -5.836880683898926, "global_step": 362018, "epoch": 2154} {"train_loss": -6.338342189788818, "global_step": 362019, "epoch": 2154} {"train_loss": -6.021993637084961, "global_step": 362020, "epoch": 2154} {"train_loss": -6.0921478271484375, "global_step": 362021, "epoch": 2154} {"train_loss": -6.662446022033691, "global_step": 362022, "epoch": 2154} {"train_loss": -6.744983673095703, "global_step": 362023, "epoch": 2154} {"train_loss": -6.486257553100586, "global_step": 362024, "epoch": 2154} {"train_loss": -6.552473545074463, "global_step": 362025, "epoch": 2154} {"train_loss": -6.802164077758789, "global_step": 362026, "epoch": 2154} {"train_loss": -6.809821605682373, "global_step": 362027, "epoch": 2154} {"train_loss": -6.836702346801758, "global_step": 362028, "epoch": 2154} {"train_loss": -7.0965576171875, "global_step": 362029, "epoch": 2154} {"train_loss": -7.264199256896973, "global_step": 362030, "epoch": 2154} {"train_loss": -7.682535171508789, "global_step": 362031, "epoch": 2154} {"train_loss": -7.099313259124756, "global_step": 362032, "epoch": 2154} {"train_loss": -7.552427291870117, "global_step": 362033, "epoch": 2154} {"train_loss": -7.580893516540527, "global_step": 362034, "epoch": 2154} {"train_loss": -7.554862022399902, "global_step": 362035, "epoch": 2154} {"train_loss": -7.880614757537842, "global_step": 362036, "epoch": 2154} {"train_loss": -7.998734474182129, "global_step": 362037, "epoch": 2154} {"train_loss": -8.135943412780762, "global_step": 362038, "epoch": 2154} {"train_loss": -10.729877537205105, "global_step": 362039, "epoch": 2154, "val_loss": 285282.1875} {"train_loss": -8.312700271606445, "global_step": 362040, "epoch": 2155} {"train_loss": -8.523632049560547, "global_step": 362041, "epoch": 2155} {"train_loss": -8.406289100646973, "global_step": 362042, "epoch": 2155} {"train_loss": -8.662160873413086, "global_step": 362043, "epoch": 2155} {"train_loss": -8.826794624328613, "global_step": 362044, "epoch": 2155} {"train_loss": -8.96457290649414, "global_step": 362045, "epoch": 2155} {"train_loss": -9.135469436645508, "global_step": 362046, "epoch": 2155} {"train_loss": -8.986114501953125, "global_step": 362047, "epoch": 2155} {"train_loss": -9.03807258605957, "global_step": 362048, "epoch": 2155} {"train_loss": -9.466819763183594, "global_step": 362049, "epoch": 2155} {"train_loss": -9.11008071899414, "global_step": 362050, "epoch": 2155} {"train_loss": -9.495502471923828, "global_step": 362051, "epoch": 2155} {"train_loss": -9.611699104309082, "global_step": 362052, "epoch": 2155} {"train_loss": -9.57896900177002, "global_step": 362053, "epoch": 2155} {"train_loss": -9.252376556396484, "global_step": 362054, "epoch": 2155} {"train_loss": -9.613386154174805, "global_step": 362055, "epoch": 2155} {"train_loss": -9.894121170043945, "global_step": 362056, "epoch": 2155} {"train_loss": -9.923409461975098, "global_step": 362057, "epoch": 2155} {"train_loss": -9.979820251464844, "global_step": 362058, "epoch": 2155} {"train_loss": -10.454231262207031, "global_step": 362059, "epoch": 2155} {"train_loss": -10.28305435180664, "global_step": 362060, "epoch": 2155} {"train_loss": -10.837081909179688, "global_step": 362061, "epoch": 2155} {"train_loss": -10.464029312133789, "global_step": 362062, "epoch": 2155} {"train_loss": -10.907014846801758, "global_step": 362063, "epoch": 2155} {"train_loss": -10.490915298461914, "global_step": 362064, "epoch": 2155} {"train_loss": -11.021310806274414, "global_step": 362065, "epoch": 2155} {"train_loss": -11.060163497924805, "global_step": 362066, "epoch": 2155} {"train_loss": -10.929695129394531, "global_step": 362067, "epoch": 2155} {"train_loss": -10.854303359985352, "global_step": 362068, "epoch": 2155} {"train_loss": -11.102185249328613, "global_step": 362069, "epoch": 2155} {"train_loss": -10.915956497192383, "global_step": 362070, "epoch": 2155} {"train_loss": -10.607690811157227, "global_step": 362071, "epoch": 2155} {"train_loss": -11.50151538848877, "global_step": 362072, "epoch": 2155} {"train_loss": -10.771648406982422, "global_step": 362073, "epoch": 2155} {"train_loss": -11.358749389648438, "global_step": 362074, "epoch": 2155} {"train_loss": -11.20866870880127, "global_step": 362075, "epoch": 2155} {"train_loss": -11.387178421020508, "global_step": 362076, "epoch": 2155} {"train_loss": -11.271954536437988, "global_step": 362077, "epoch": 2155} {"train_loss": -11.595723152160645, "global_step": 362078, "epoch": 2155} {"train_loss": -11.288838386535645, "global_step": 362079, "epoch": 2155} {"train_loss": -12.012083053588867, "global_step": 362080, "epoch": 2155} {"train_loss": -11.771726608276367, "global_step": 362081, "epoch": 2155} {"train_loss": -11.670044898986816, "global_step": 362082, "epoch": 2155} {"train_loss": -11.570868492126465, "global_step": 362083, "epoch": 2155} {"train_loss": -11.058744430541992, "global_step": 362084, "epoch": 2155} {"train_loss": -11.371264457702637, "global_step": 362085, "epoch": 2155} {"train_loss": -11.737143516540527, "global_step": 362086, "epoch": 2155} {"train_loss": -11.42387866973877, "global_step": 362087, "epoch": 2155} {"train_loss": -11.706836700439453, "global_step": 362088, "epoch": 2155} {"train_loss": -11.63248062133789, "global_step": 362089, "epoch": 2155} {"train_loss": -11.466428756713867, "global_step": 362090, "epoch": 2155} {"train_loss": -11.354180335998535, "global_step": 362091, "epoch": 2155} {"train_loss": -11.544559478759766, "global_step": 362092, "epoch": 2155} {"train_loss": -11.775993347167969, "global_step": 362093, "epoch": 2155} {"train_loss": -11.73427963256836, "global_step": 362094, "epoch": 2155} {"train_loss": -12.04814624786377, "global_step": 362095, "epoch": 2155} {"train_loss": -11.886804580688477, "global_step": 362096, "epoch": 2155} {"train_loss": -11.876960754394531, "global_step": 362097, "epoch": 2155} {"train_loss": -12.267765998840332, "global_step": 362098, "epoch": 2155} {"train_loss": -11.919221878051758, "global_step": 362099, "epoch": 2155} {"train_loss": -11.940731048583984, "global_step": 362100, "epoch": 2155} {"train_loss": -12.313234329223633, "global_step": 362101, "epoch": 2155} {"train_loss": -12.123210906982422, "global_step": 362102, "epoch": 2155} {"train_loss": -11.903438568115234, "global_step": 362103, "epoch": 2155} {"train_loss": -11.904942512512207, "global_step": 362104, "epoch": 2155} {"train_loss": -12.245424270629883, "global_step": 362105, "epoch": 2155} {"train_loss": -12.123662948608398, "global_step": 362106, "epoch": 2155} {"train_loss": -11.983749389648438, "global_step": 362107, "epoch": 2155} {"train_loss": -12.359477996826172, "global_step": 362108, "epoch": 2155} {"train_loss": -12.080108642578125, "global_step": 362109, "epoch": 2155} {"train_loss": -12.19487190246582, "global_step": 362110, "epoch": 2155} {"train_loss": -12.135204315185547, "global_step": 362111, "epoch": 2155} {"train_loss": -11.604605674743652, "global_step": 362112, "epoch": 2155} {"train_loss": -12.097990989685059, "global_step": 362113, "epoch": 2155} {"train_loss": -12.021728515625, "global_step": 362114, "epoch": 2155} {"train_loss": -12.069681167602539, "global_step": 362115, "epoch": 2155} {"train_loss": -12.122368812561035, "global_step": 362116, "epoch": 2155} {"train_loss": -12.020828247070312, "global_step": 362117, "epoch": 2155} {"train_loss": -12.4244384765625, "global_step": 362118, "epoch": 2155} {"train_loss": -12.388763427734375, "global_step": 362119, "epoch": 2155} {"train_loss": -12.315649032592773, "global_step": 362120, "epoch": 2155} {"train_loss": -11.73708724975586, "global_step": 362121, "epoch": 2155} {"train_loss": -12.019050598144531, "global_step": 362122, "epoch": 2155} {"train_loss": -12.337657928466797, "global_step": 362123, "epoch": 2155} {"train_loss": -11.950698852539062, "global_step": 362124, "epoch": 2155} {"train_loss": -11.671173095703125, "global_step": 362125, "epoch": 2155} {"train_loss": -12.11358642578125, "global_step": 362126, "epoch": 2155} {"train_loss": -12.009713172912598, "global_step": 362127, "epoch": 2155} {"train_loss": -12.274394989013672, "global_step": 362128, "epoch": 2155} {"train_loss": -11.834966659545898, "global_step": 362129, "epoch": 2155} {"train_loss": -12.380914688110352, "global_step": 362130, "epoch": 2155} {"train_loss": -11.925596237182617, "global_step": 362131, "epoch": 2155} {"train_loss": -11.557310104370117, "global_step": 362132, "epoch": 2155} {"train_loss": -11.702478408813477, "global_step": 362133, "epoch": 2155} {"train_loss": -12.21847152709961, "global_step": 362134, "epoch": 2155} {"train_loss": -11.388009071350098, "global_step": 362135, "epoch": 2155} {"train_loss": -11.725174903869629, "global_step": 362136, "epoch": 2155} {"train_loss": -12.092477798461914, "global_step": 362137, "epoch": 2155} {"train_loss": -11.967161178588867, "global_step": 362138, "epoch": 2155} {"train_loss": -11.942044258117676, "global_step": 362139, "epoch": 2155} {"train_loss": -11.972583770751953, "global_step": 362140, "epoch": 2155} {"train_loss": -12.088273048400879, "global_step": 362141, "epoch": 2155} {"train_loss": -11.646528244018555, "global_step": 362142, "epoch": 2155} {"train_loss": -11.763297080993652, "global_step": 362143, "epoch": 2155} {"train_loss": -11.876794815063477, "global_step": 362144, "epoch": 2155} {"train_loss": -12.154133796691895, "global_step": 362145, "epoch": 2155} {"train_loss": -11.761947631835938, "global_step": 362146, "epoch": 2155} {"train_loss": -12.414092063903809, "global_step": 362147, "epoch": 2155} {"train_loss": -12.323923110961914, "global_step": 362148, "epoch": 2155} {"train_loss": -11.626471519470215, "global_step": 362149, "epoch": 2155} {"train_loss": -11.449108123779297, "global_step": 362150, "epoch": 2155} {"train_loss": -12.204168319702148, "global_step": 362151, "epoch": 2155} {"train_loss": -12.189802169799805, "global_step": 362152, "epoch": 2155} {"train_loss": -12.402572631835938, "global_step": 362153, "epoch": 2155} {"train_loss": -12.51791000366211, "global_step": 362154, "epoch": 2155} {"train_loss": -12.4747953414917, "global_step": 362155, "epoch": 2155} {"train_loss": -12.24429988861084, "global_step": 362156, "epoch": 2155} {"train_loss": -12.540319442749023, "global_step": 362157, "epoch": 2155} {"train_loss": -12.298969268798828, "global_step": 362158, "epoch": 2155} {"train_loss": -12.630939483642578, "global_step": 362159, "epoch": 2155} {"train_loss": -12.247480392456055, "global_step": 362160, "epoch": 2155} {"train_loss": -12.550233840942383, "global_step": 362161, "epoch": 2155} {"train_loss": -12.356212615966797, "global_step": 362162, "epoch": 2155} {"train_loss": -12.492864608764648, "global_step": 362163, "epoch": 2155} {"train_loss": -12.360345840454102, "global_step": 362164, "epoch": 2155} {"train_loss": -12.24597454071045, "global_step": 362165, "epoch": 2155} {"train_loss": -12.443446159362793, "global_step": 362166, "epoch": 2155} {"train_loss": -11.983675003051758, "global_step": 362167, "epoch": 2155} {"train_loss": -11.795312881469727, "global_step": 362168, "epoch": 2155} {"train_loss": -12.10810375213623, "global_step": 362169, "epoch": 2155} {"train_loss": -11.610777854919434, "global_step": 362170, "epoch": 2155} {"train_loss": -11.951388359069824, "global_step": 362171, "epoch": 2155} {"train_loss": -11.434860229492188, "global_step": 362172, "epoch": 2155} {"train_loss": -12.325828552246094, "global_step": 362173, "epoch": 2155} {"train_loss": -11.673614501953125, "global_step": 362174, "epoch": 2155} {"train_loss": -11.723925590515137, "global_step": 362175, "epoch": 2155} {"train_loss": -10.96955680847168, "global_step": 362176, "epoch": 2155} {"train_loss": -11.29965591430664, "global_step": 362177, "epoch": 2155} {"train_loss": -11.999963760375977, "global_step": 362178, "epoch": 2155} {"train_loss": -11.69449520111084, "global_step": 362179, "epoch": 2155} {"train_loss": -12.050758361816406, "global_step": 362180, "epoch": 2155} {"train_loss": -12.494187355041504, "global_step": 362181, "epoch": 2155} {"train_loss": -11.585962295532227, "global_step": 362182, "epoch": 2155} {"train_loss": -12.433378219604492, "global_step": 362183, "epoch": 2155} {"train_loss": -11.06190013885498, "global_step": 362184, "epoch": 2155} {"train_loss": -12.37154769897461, "global_step": 362185, "epoch": 2155} {"train_loss": -12.032623291015625, "global_step": 362186, "epoch": 2155} {"train_loss": -11.656394958496094, "global_step": 362187, "epoch": 2155} {"train_loss": -12.05870246887207, "global_step": 362188, "epoch": 2155} {"train_loss": -12.06854248046875, "global_step": 362189, "epoch": 2155} {"train_loss": -12.128454208374023, "global_step": 362190, "epoch": 2155} {"train_loss": -12.399389266967773, "global_step": 362191, "epoch": 2155} {"train_loss": -11.71941089630127, "global_step": 362192, "epoch": 2155} {"train_loss": -12.451515197753906, "global_step": 362193, "epoch": 2155} {"train_loss": -12.159724235534668, "global_step": 362194, "epoch": 2155} {"train_loss": -11.678705215454102, "global_step": 362195, "epoch": 2155} {"train_loss": -12.294941902160645, "global_step": 362196, "epoch": 2155} {"train_loss": -11.920981407165527, "global_step": 362197, "epoch": 2155} {"train_loss": -12.158519744873047, "global_step": 362198, "epoch": 2155} {"train_loss": -11.98928451538086, "global_step": 362199, "epoch": 2155} {"train_loss": -12.191963195800781, "global_step": 362200, "epoch": 2155} {"train_loss": -12.279875755310059, "global_step": 362201, "epoch": 2155} {"train_loss": -11.779675483703613, "global_step": 362202, "epoch": 2155} {"train_loss": -12.040587425231934, "global_step": 362203, "epoch": 2155} {"train_loss": -12.135950088500977, "global_step": 362204, "epoch": 2155} {"train_loss": -12.34567928314209, "global_step": 362205, "epoch": 2155} {"train_loss": -12.407051086425781, "global_step": 362206, "epoch": 2155} {"train_loss": -11.547142267227173, "global_step": 362207, "epoch": 2155, "val_loss": 293109.65625, "train_action_mse_error": 1.6928600072860718} {"train_loss": -11.339296340942383, "global_step": 362208, "epoch": 2156} {"train_loss": -11.628301620483398, "global_step": 362209, "epoch": 2156} {"train_loss": -12.488466262817383, "global_step": 362210, "epoch": 2156} {"train_loss": -11.597965240478516, "global_step": 362211, "epoch": 2156} {"train_loss": -11.480600357055664, "global_step": 362212, "epoch": 2156} {"train_loss": -12.264516830444336, "global_step": 362213, "epoch": 2156} {"train_loss": -11.259103775024414, "global_step": 362214, "epoch": 2156} {"train_loss": -11.966323852539062, "global_step": 362215, "epoch": 2156} {"train_loss": -11.975341796875, "global_step": 362216, "epoch": 2156} {"train_loss": -11.944513320922852, "global_step": 362217, "epoch": 2156} {"train_loss": -12.074546813964844, "global_step": 362218, "epoch": 2156} {"train_loss": -12.2701416015625, "global_step": 362219, "epoch": 2156} {"train_loss": -12.172134399414062, "global_step": 362220, "epoch": 2156} {"train_loss": -12.223837852478027, "global_step": 362221, "epoch": 2156} {"train_loss": -12.168622970581055, "global_step": 362222, "epoch": 2156} {"train_loss": -11.8260498046875, "global_step": 362223, "epoch": 2156} {"train_loss": -12.17416000366211, "global_step": 362224, "epoch": 2156} {"train_loss": -11.699843406677246, "global_step": 362225, "epoch": 2156} {"train_loss": -12.035371780395508, "global_step": 362226, "epoch": 2156} {"train_loss": -12.173481941223145, "global_step": 362227, "epoch": 2156} {"train_loss": -11.82568073272705, "global_step": 362228, "epoch": 2156} {"train_loss": -12.514228820800781, "global_step": 362229, "epoch": 2156} {"train_loss": -11.994132995605469, "global_step": 362230, "epoch": 2156} {"train_loss": -11.904983520507812, "global_step": 362231, "epoch": 2156} {"train_loss": -12.618340492248535, "global_step": 362232, "epoch": 2156} {"train_loss": -12.227336883544922, "global_step": 362233, "epoch": 2156} {"train_loss": -11.712296485900879, "global_step": 362234, "epoch": 2156} {"train_loss": -12.486644744873047, "global_step": 362235, "epoch": 2156} {"train_loss": -12.275236129760742, "global_step": 362236, "epoch": 2156} {"train_loss": -12.122220039367676, "global_step": 362237, "epoch": 2156} {"train_loss": -12.47848129272461, "global_step": 362238, "epoch": 2156} {"train_loss": -12.536093711853027, "global_step": 362239, "epoch": 2156} {"train_loss": -12.296211242675781, "global_step": 362240, "epoch": 2156} {"train_loss": -12.039243698120117, "global_step": 362241, "epoch": 2156} {"train_loss": -12.376167297363281, "global_step": 362242, "epoch": 2156} {"train_loss": -12.409229278564453, "global_step": 362243, "epoch": 2156} {"train_loss": -11.977204322814941, "global_step": 362244, "epoch": 2156} {"train_loss": -12.427900314331055, "global_step": 362245, "epoch": 2156} {"train_loss": -12.370190620422363, "global_step": 362246, "epoch": 2156} {"train_loss": -11.885302543640137, "global_step": 362247, "epoch": 2156} {"train_loss": -12.237882614135742, "global_step": 362248, "epoch": 2156} {"train_loss": -12.490750312805176, "global_step": 362249, "epoch": 2156} {"train_loss": -11.785734176635742, "global_step": 362250, "epoch": 2156} {"train_loss": -12.320048332214355, "global_step": 362251, "epoch": 2156} {"train_loss": -12.313094139099121, "global_step": 362252, "epoch": 2156} {"train_loss": -11.905658721923828, "global_step": 362253, "epoch": 2156} {"train_loss": -11.96451473236084, "global_step": 362254, "epoch": 2156} {"train_loss": -12.135967254638672, "global_step": 362255, "epoch": 2156} {"train_loss": -11.990808486938477, "global_step": 362256, "epoch": 2156} {"train_loss": -11.529491424560547, "global_step": 362257, "epoch": 2156} {"train_loss": -11.430785179138184, "global_step": 362258, "epoch": 2156} {"train_loss": -12.15328311920166, "global_step": 362259, "epoch": 2156} {"train_loss": -12.285316467285156, "global_step": 362260, "epoch": 2156} {"train_loss": -11.127058982849121, "global_step": 362261, "epoch": 2156} {"train_loss": -11.874317169189453, "global_step": 362262, "epoch": 2156} {"train_loss": -12.238855361938477, "global_step": 362263, "epoch": 2156} {"train_loss": -11.886604309082031, "global_step": 362264, "epoch": 2156} {"train_loss": -11.947526931762695, "global_step": 362265, "epoch": 2156} {"train_loss": -12.036547660827637, "global_step": 362266, "epoch": 2156} {"train_loss": -10.700993537902832, "global_step": 362267, "epoch": 2156} {"train_loss": -11.63147258758545, "global_step": 362268, "epoch": 2156} {"train_loss": -11.88188362121582, "global_step": 362269, "epoch": 2156} {"train_loss": -12.152851104736328, "global_step": 362270, "epoch": 2156} {"train_loss": -11.862003326416016, "global_step": 362271, "epoch": 2156} {"train_loss": -12.321233749389648, "global_step": 362272, "epoch": 2156} {"train_loss": -12.20875072479248, "global_step": 362273, "epoch": 2156} {"train_loss": -12.24951457977295, "global_step": 362274, "epoch": 2156} {"train_loss": -12.346616744995117, "global_step": 362275, "epoch": 2156} {"train_loss": -11.952478408813477, "global_step": 362276, "epoch": 2156} {"train_loss": -12.431554794311523, "global_step": 362277, "epoch": 2156} {"train_loss": -12.108861923217773, "global_step": 362278, "epoch": 2156} {"train_loss": -12.1627197265625, "global_step": 362279, "epoch": 2156} {"train_loss": -12.282432556152344, "global_step": 362280, "epoch": 2156} {"train_loss": -12.467700004577637, "global_step": 362281, "epoch": 2156} {"train_loss": -12.225703239440918, "global_step": 362282, "epoch": 2156} {"train_loss": -12.341947555541992, "global_step": 362283, "epoch": 2156} {"train_loss": -11.496758460998535, "global_step": 362284, "epoch": 2156} {"train_loss": -12.504838943481445, "global_step": 362285, "epoch": 2156} {"train_loss": -11.607168197631836, "global_step": 362286, "epoch": 2156} {"train_loss": -12.307607650756836, "global_step": 362287, "epoch": 2156} {"train_loss": -11.638401985168457, "global_step": 362288, "epoch": 2156} {"train_loss": -11.984212875366211, "global_step": 362289, "epoch": 2156} {"train_loss": -11.80548095703125, "global_step": 362290, "epoch": 2156} {"train_loss": -11.924614906311035, "global_step": 362291, "epoch": 2156} {"train_loss": -11.362161636352539, "global_step": 362292, "epoch": 2156} {"train_loss": -12.020334243774414, "global_step": 362293, "epoch": 2156} {"train_loss": -12.505779266357422, "global_step": 362294, "epoch": 2156} {"train_loss": -11.676874160766602, "global_step": 362295, "epoch": 2156} {"train_loss": -12.070755958557129, "global_step": 362296, "epoch": 2156} {"train_loss": -12.123565673828125, "global_step": 362297, "epoch": 2156} {"train_loss": -11.63273811340332, "global_step": 362298, "epoch": 2156} {"train_loss": -11.637365341186523, "global_step": 362299, "epoch": 2156} {"train_loss": -11.459625244140625, "global_step": 362300, "epoch": 2156} {"train_loss": -10.584895133972168, "global_step": 362301, "epoch": 2156} {"train_loss": -11.857755661010742, "global_step": 362302, "epoch": 2156} {"train_loss": -9.617045402526855, "global_step": 362303, "epoch": 2156} {"train_loss": -11.337398529052734, "global_step": 362304, "epoch": 2156} {"train_loss": -9.706669807434082, "global_step": 362305, "epoch": 2156} {"train_loss": -10.197933197021484, "global_step": 362306, "epoch": 2156} {"train_loss": -9.958106994628906, "global_step": 362307, "epoch": 2156} {"train_loss": -10.976966857910156, "global_step": 362308, "epoch": 2156} {"train_loss": -10.245349884033203, "global_step": 362309, "epoch": 2156} {"train_loss": -11.845584869384766, "global_step": 362310, "epoch": 2156} {"train_loss": -10.778571128845215, "global_step": 362311, "epoch": 2156} {"train_loss": -10.345998764038086, "global_step": 362312, "epoch": 2156} {"train_loss": -11.130928039550781, "global_step": 362313, "epoch": 2156} {"train_loss": -10.858599662780762, "global_step": 362314, "epoch": 2156} {"train_loss": -10.520429611206055, "global_step": 362315, "epoch": 2156} {"train_loss": -11.604339599609375, "global_step": 362316, "epoch": 2156} {"train_loss": -11.005207061767578, "global_step": 362317, "epoch": 2156} {"train_loss": -11.59078311920166, "global_step": 362318, "epoch": 2156} {"train_loss": -10.966285705566406, "global_step": 362319, "epoch": 2156} {"train_loss": -11.46139907836914, "global_step": 362320, "epoch": 2156} {"train_loss": -11.307073593139648, "global_step": 362321, "epoch": 2156} {"train_loss": -10.829740524291992, "global_step": 362322, "epoch": 2156} {"train_loss": -11.608275413513184, "global_step": 362323, "epoch": 2156} {"train_loss": -11.39521598815918, "global_step": 362324, "epoch": 2156} {"train_loss": -11.448169708251953, "global_step": 362325, "epoch": 2156} {"train_loss": -11.250190734863281, "global_step": 362326, "epoch": 2156} {"train_loss": -11.366089820861816, "global_step": 362327, "epoch": 2156} {"train_loss": -11.705589294433594, "global_step": 362328, "epoch": 2156} {"train_loss": -11.369359970092773, "global_step": 362329, "epoch": 2156} {"train_loss": -11.504121780395508, "global_step": 362330, "epoch": 2156} {"train_loss": -11.820220947265625, "global_step": 362331, "epoch": 2156} {"train_loss": -11.785768508911133, "global_step": 362332, "epoch": 2156} {"train_loss": -11.685302734375, "global_step": 362333, "epoch": 2156} {"train_loss": -11.982207298278809, "global_step": 362334, "epoch": 2156} {"train_loss": -11.577664375305176, "global_step": 362335, "epoch": 2156} {"train_loss": -12.164669036865234, "global_step": 362336, "epoch": 2156} {"train_loss": -11.671586036682129, "global_step": 362337, "epoch": 2156} {"train_loss": -11.816793441772461, "global_step": 362338, "epoch": 2156} {"train_loss": -12.002992630004883, "global_step": 362339, "epoch": 2156} {"train_loss": -11.831920623779297, "global_step": 362340, "epoch": 2156} {"train_loss": -12.003032684326172, "global_step": 362341, "epoch": 2156} {"train_loss": -11.613383293151855, "global_step": 362342, "epoch": 2156} {"train_loss": -12.156707763671875, "global_step": 362343, "epoch": 2156} {"train_loss": -12.027639389038086, "global_step": 362344, "epoch": 2156} {"train_loss": -12.071601867675781, "global_step": 362345, "epoch": 2156} {"train_loss": -12.105167388916016, "global_step": 362346, "epoch": 2156} {"train_loss": -11.93365478515625, "global_step": 362347, "epoch": 2156} {"train_loss": -11.928205490112305, "global_step": 362348, "epoch": 2156} {"train_loss": -12.269922256469727, "global_step": 362349, "epoch": 2156} {"train_loss": -11.802227973937988, "global_step": 362350, "epoch": 2156} {"train_loss": -12.18559455871582, "global_step": 362351, "epoch": 2156} {"train_loss": -11.956846237182617, "global_step": 362352, "epoch": 2156} {"train_loss": -12.5438814163208, "global_step": 362353, "epoch": 2156} {"train_loss": -12.24638843536377, "global_step": 362354, "epoch": 2156} {"train_loss": -12.326403617858887, "global_step": 362355, "epoch": 2156} {"train_loss": -12.356130599975586, "global_step": 362356, "epoch": 2156} {"train_loss": -12.326199531555176, "global_step": 362357, "epoch": 2156} {"train_loss": -12.28184700012207, "global_step": 362358, "epoch": 2156} {"train_loss": -11.774787902832031, "global_step": 362359, "epoch": 2156} {"train_loss": -12.32450008392334, "global_step": 362360, "epoch": 2156} {"train_loss": -11.978675842285156, "global_step": 362361, "epoch": 2156} {"train_loss": -12.259326934814453, "global_step": 362362, "epoch": 2156} {"train_loss": -12.22258186340332, "global_step": 362363, "epoch": 2156} {"train_loss": -12.045591354370117, "global_step": 362364, "epoch": 2156} {"train_loss": -11.837697982788086, "global_step": 362365, "epoch": 2156} {"train_loss": -11.745064735412598, "global_step": 362366, "epoch": 2156} {"train_loss": -11.373767852783203, "global_step": 362367, "epoch": 2156} {"train_loss": -12.343368530273438, "global_step": 362368, "epoch": 2156} {"train_loss": -11.41073226928711, "global_step": 362369, "epoch": 2156} {"train_loss": -11.743843078613281, "global_step": 362370, "epoch": 2156} {"train_loss": -11.596010208129883, "global_step": 362371, "epoch": 2156} {"train_loss": -11.471307754516602, "global_step": 362372, "epoch": 2156} {"train_loss": -11.910606384277344, "global_step": 362373, "epoch": 2156} {"train_loss": -11.385330200195312, "global_step": 362374, "epoch": 2156} {"train_loss": -11.824619440805344, "global_step": 362375, "epoch": 2156, "val_loss": 292241.84375} {"train_loss": -10.909402847290039, "global_step": 362376, "epoch": 2157} {"train_loss": -12.236576080322266, "global_step": 362377, "epoch": 2157} {"train_loss": -11.234548568725586, "global_step": 362378, "epoch": 2157} {"train_loss": -11.454177856445312, "global_step": 362379, "epoch": 2157} {"train_loss": -12.246994018554688, "global_step": 362380, "epoch": 2157} {"train_loss": -11.137809753417969, "global_step": 362381, "epoch": 2157} {"train_loss": -11.47343635559082, "global_step": 362382, "epoch": 2157} {"train_loss": -11.843128204345703, "global_step": 362383, "epoch": 2157} {"train_loss": -10.755781173706055, "global_step": 362384, "epoch": 2157} {"train_loss": -11.488258361816406, "global_step": 362385, "epoch": 2157} {"train_loss": -10.421086311340332, "global_step": 362386, "epoch": 2157} {"train_loss": -10.460250854492188, "global_step": 362387, "epoch": 2157} {"train_loss": -11.260697364807129, "global_step": 362388, "epoch": 2157} {"train_loss": -10.070131301879883, "global_step": 362389, "epoch": 2157} {"train_loss": -9.991345405578613, "global_step": 362390, "epoch": 2157} {"train_loss": -10.995397567749023, "global_step": 362391, "epoch": 2157} {"train_loss": -10.960927963256836, "global_step": 362392, "epoch": 2157} {"train_loss": -10.828192710876465, "global_step": 362393, "epoch": 2157} {"train_loss": -10.830799102783203, "global_step": 362394, "epoch": 2157} {"train_loss": -10.391033172607422, "global_step": 362395, "epoch": 2157} {"train_loss": -10.891849517822266, "global_step": 362396, "epoch": 2157} {"train_loss": -11.066197395324707, "global_step": 362397, "epoch": 2157} {"train_loss": -10.72557258605957, "global_step": 362398, "epoch": 2157} {"train_loss": -11.325342178344727, "global_step": 362399, "epoch": 2157} {"train_loss": -10.952658653259277, "global_step": 362400, "epoch": 2157} {"train_loss": -11.754636764526367, "global_step": 362401, "epoch": 2157} {"train_loss": -9.871660232543945, "global_step": 362402, "epoch": 2157} {"train_loss": -10.710043907165527, "global_step": 362403, "epoch": 2157} {"train_loss": -10.29955768585205, "global_step": 362404, "epoch": 2157} {"train_loss": -9.98378849029541, "global_step": 362405, "epoch": 2157} {"train_loss": -11.317276000976562, "global_step": 362406, "epoch": 2157} {"train_loss": -9.808700561523438, "global_step": 362407, "epoch": 2157} {"train_loss": -11.871030807495117, "global_step": 362408, "epoch": 2157} {"train_loss": -10.622114181518555, "global_step": 362409, "epoch": 2157} {"train_loss": -11.639020919799805, "global_step": 362410, "epoch": 2157} {"train_loss": -10.704606056213379, "global_step": 362411, "epoch": 2157} {"train_loss": -11.534452438354492, "global_step": 362412, "epoch": 2157} {"train_loss": -11.688642501831055, "global_step": 362413, "epoch": 2157} {"train_loss": -11.057962417602539, "global_step": 362414, "epoch": 2157} {"train_loss": -11.817373275756836, "global_step": 362415, "epoch": 2157} {"train_loss": -11.374252319335938, "global_step": 362416, "epoch": 2157} {"train_loss": -12.294000625610352, "global_step": 362417, "epoch": 2157} {"train_loss": -11.553743362426758, "global_step": 362418, "epoch": 2157} {"train_loss": -11.544357299804688, "global_step": 362419, "epoch": 2157} {"train_loss": -11.590743064880371, "global_step": 362420, "epoch": 2157} {"train_loss": -12.005431175231934, "global_step": 362421, "epoch": 2157} {"train_loss": -11.780477523803711, "global_step": 362422, "epoch": 2157} {"train_loss": -12.116759300231934, "global_step": 362423, "epoch": 2157} {"train_loss": -11.854867935180664, "global_step": 362424, "epoch": 2157} {"train_loss": -11.834424018859863, "global_step": 362425, "epoch": 2157} {"train_loss": -12.066734313964844, "global_step": 362426, "epoch": 2157} {"train_loss": -11.667813301086426, "global_step": 362427, "epoch": 2157} {"train_loss": -12.227009773254395, "global_step": 362428, "epoch": 2157} {"train_loss": -11.748641967773438, "global_step": 362429, "epoch": 2157} {"train_loss": -12.01492691040039, "global_step": 362430, "epoch": 2157} {"train_loss": -12.156391143798828, "global_step": 362431, "epoch": 2157} {"train_loss": -11.999149322509766, "global_step": 362432, "epoch": 2157} {"train_loss": -12.417266845703125, "global_step": 362433, "epoch": 2157} {"train_loss": -11.939718246459961, "global_step": 362434, "epoch": 2157} {"train_loss": -12.203897476196289, "global_step": 362435, "epoch": 2157} {"train_loss": -12.44424057006836, "global_step": 362436, "epoch": 2157} {"train_loss": -12.320612907409668, "global_step": 362437, "epoch": 2157} {"train_loss": -12.25473403930664, "global_step": 362438, "epoch": 2157} {"train_loss": -12.263851165771484, "global_step": 362439, "epoch": 2157} {"train_loss": -12.332178115844727, "global_step": 362440, "epoch": 2157} {"train_loss": -12.114389419555664, "global_step": 362441, "epoch": 2157} {"train_loss": -12.17057991027832, "global_step": 362442, "epoch": 2157} {"train_loss": -12.33912467956543, "global_step": 362443, "epoch": 2157} {"train_loss": -12.308404922485352, "global_step": 362444, "epoch": 2157} {"train_loss": -11.994216918945312, "global_step": 362445, "epoch": 2157} {"train_loss": -12.321586608886719, "global_step": 362446, "epoch": 2157} {"train_loss": -12.105428695678711, "global_step": 362447, "epoch": 2157} {"train_loss": -12.478556632995605, "global_step": 362448, "epoch": 2157} {"train_loss": -12.335687637329102, "global_step": 362449, "epoch": 2157} {"train_loss": -12.333613395690918, "global_step": 362450, "epoch": 2157} {"train_loss": -12.459697723388672, "global_step": 362451, "epoch": 2157} {"train_loss": -12.412576675415039, "global_step": 362452, "epoch": 2157} {"train_loss": -12.549047470092773, "global_step": 362453, "epoch": 2157} {"train_loss": -12.420461654663086, "global_step": 362454, "epoch": 2157} {"train_loss": -12.138673782348633, "global_step": 362455, "epoch": 2157} {"train_loss": -12.464576721191406, "global_step": 362456, "epoch": 2157} {"train_loss": -12.434808731079102, "global_step": 362457, "epoch": 2157} {"train_loss": -12.547538757324219, "global_step": 362458, "epoch": 2157} {"train_loss": -12.386545181274414, "global_step": 362459, "epoch": 2157} {"train_loss": -12.294031143188477, "global_step": 362460, "epoch": 2157} {"train_loss": -12.524759292602539, "global_step": 362461, "epoch": 2157} {"train_loss": -12.513259887695312, "global_step": 362462, "epoch": 2157} {"train_loss": -12.498682022094727, "global_step": 362463, "epoch": 2157} {"train_loss": -12.618096351623535, "global_step": 362464, "epoch": 2157} {"train_loss": -12.332963943481445, "global_step": 362465, "epoch": 2157} {"train_loss": -12.54068374633789, "global_step": 362466, "epoch": 2157} {"train_loss": -12.576204299926758, "global_step": 362467, "epoch": 2157} {"train_loss": -12.64934253692627, "global_step": 362468, "epoch": 2157} {"train_loss": -12.648377418518066, "global_step": 362469, "epoch": 2157} {"train_loss": -12.6494140625, "global_step": 362470, "epoch": 2157} {"train_loss": -12.297557830810547, "global_step": 362471, "epoch": 2157} {"train_loss": -12.622758865356445, "global_step": 362472, "epoch": 2157} {"train_loss": -12.632363319396973, "global_step": 362473, "epoch": 2157} {"train_loss": -12.485044479370117, "global_step": 362474, "epoch": 2157} {"train_loss": -12.68577766418457, "global_step": 362475, "epoch": 2157} {"train_loss": -12.60797119140625, "global_step": 362476, "epoch": 2157} {"train_loss": -12.576027870178223, "global_step": 362477, "epoch": 2157} {"train_loss": -12.763174057006836, "global_step": 362478, "epoch": 2157} {"train_loss": -12.361103057861328, "global_step": 362479, "epoch": 2157} {"train_loss": -12.339235305786133, "global_step": 362480, "epoch": 2157} {"train_loss": -12.687095642089844, "global_step": 362481, "epoch": 2157} {"train_loss": -12.760194778442383, "global_step": 362482, "epoch": 2157} {"train_loss": -12.372673034667969, "global_step": 362483, "epoch": 2157} {"train_loss": -12.235269546508789, "global_step": 362484, "epoch": 2157} {"train_loss": -12.723154067993164, "global_step": 362485, "epoch": 2157} {"train_loss": -12.43081283569336, "global_step": 362486, "epoch": 2157} {"train_loss": -12.514832496643066, "global_step": 362487, "epoch": 2157} {"train_loss": -12.325843811035156, "global_step": 362488, "epoch": 2157} {"train_loss": -12.635107040405273, "global_step": 362489, "epoch": 2157} {"train_loss": -12.677018165588379, "global_step": 362490, "epoch": 2157} {"train_loss": -12.731732368469238, "global_step": 362491, "epoch": 2157} {"train_loss": -12.496999740600586, "global_step": 362492, "epoch": 2157} {"train_loss": -12.525362014770508, "global_step": 362493, "epoch": 2157} {"train_loss": -12.613984107971191, "global_step": 362494, "epoch": 2157} {"train_loss": -12.59353256225586, "global_step": 362495, "epoch": 2157} {"train_loss": -12.53060531616211, "global_step": 362496, "epoch": 2157} {"train_loss": -12.800216674804688, "global_step": 362497, "epoch": 2157} {"train_loss": -12.718255996704102, "global_step": 362498, "epoch": 2157} {"train_loss": -12.661041259765625, "global_step": 362499, "epoch": 2157} {"train_loss": -12.664655685424805, "global_step": 362500, "epoch": 2157} {"train_loss": -12.518850326538086, "global_step": 362501, "epoch": 2157} {"train_loss": -12.703357696533203, "global_step": 362502, "epoch": 2157} {"train_loss": -12.612783432006836, "global_step": 362503, "epoch": 2157} {"train_loss": -12.753146171569824, "global_step": 362504, "epoch": 2157} {"train_loss": -12.691450119018555, "global_step": 362505, "epoch": 2157} {"train_loss": -12.566606521606445, "global_step": 362506, "epoch": 2157} {"train_loss": -12.45266056060791, "global_step": 362507, "epoch": 2157} {"train_loss": -12.415563583374023, "global_step": 362508, "epoch": 2157} {"train_loss": -12.39461898803711, "global_step": 362509, "epoch": 2157} {"train_loss": -12.717134475708008, "global_step": 362510, "epoch": 2157} {"train_loss": -12.57934284210205, "global_step": 362511, "epoch": 2157} {"train_loss": -12.01653003692627, "global_step": 362512, "epoch": 2157} {"train_loss": -12.25851058959961, "global_step": 362513, "epoch": 2157} {"train_loss": -11.49123764038086, "global_step": 362514, "epoch": 2157} {"train_loss": -12.140196800231934, "global_step": 362515, "epoch": 2157} {"train_loss": -12.485367774963379, "global_step": 362516, "epoch": 2157} {"train_loss": -12.11075210571289, "global_step": 362517, "epoch": 2157} {"train_loss": -11.8126220703125, "global_step": 362518, "epoch": 2157} {"train_loss": -11.776379585266113, "global_step": 362519, "epoch": 2157} {"train_loss": -12.45214557647705, "global_step": 362520, "epoch": 2157} {"train_loss": -11.743097305297852, "global_step": 362521, "epoch": 2157} {"train_loss": -12.705105781555176, "global_step": 362522, "epoch": 2157} {"train_loss": -12.426193237304688, "global_step": 362523, "epoch": 2157} {"train_loss": -12.178417205810547, "global_step": 362524, "epoch": 2157} {"train_loss": -12.206819534301758, "global_step": 362525, "epoch": 2157} {"train_loss": -12.145390510559082, "global_step": 362526, "epoch": 2157} {"train_loss": -12.118555068969727, "global_step": 362527, "epoch": 2157} {"train_loss": -12.47058391571045, "global_step": 362528, "epoch": 2157} {"train_loss": -11.956836700439453, "global_step": 362529, "epoch": 2157} {"train_loss": -12.13685131072998, "global_step": 362530, "epoch": 2157} {"train_loss": -12.406794548034668, "global_step": 362531, "epoch": 2157} {"train_loss": -11.897562980651855, "global_step": 362532, "epoch": 2157} {"train_loss": -11.658371925354004, "global_step": 362533, "epoch": 2157} {"train_loss": -11.936742782592773, "global_step": 362534, "epoch": 2157} {"train_loss": -11.647662162780762, "global_step": 362535, "epoch": 2157} {"train_loss": -12.214019775390625, "global_step": 362536, "epoch": 2157} {"train_loss": -12.228513717651367, "global_step": 362537, "epoch": 2157} {"train_loss": -12.136478424072266, "global_step": 362538, "epoch": 2157} {"train_loss": -11.697280883789062, "global_step": 362539, "epoch": 2157} {"train_loss": -11.961854934692383, "global_step": 362540, "epoch": 2157} {"train_loss": -11.908523559570312, "global_step": 362541, "epoch": 2157} {"train_loss": -11.79428482055664, "global_step": 362542, "epoch": 2157} {"train_loss": -11.98971012092772, "global_step": 362543, "epoch": 2157, "val_loss": 296879.0} {"train_loss": -11.930257797241211, "global_step": 362544, "epoch": 2158} {"train_loss": -11.935260772705078, "global_step": 362545, "epoch": 2158} {"train_loss": -12.165807723999023, "global_step": 362546, "epoch": 2158} {"train_loss": -11.357418060302734, "global_step": 362547, "epoch": 2158} {"train_loss": -10.29974365234375, "global_step": 362548, "epoch": 2158} {"train_loss": -11.705028533935547, "global_step": 362549, "epoch": 2158} {"train_loss": -8.748906135559082, "global_step": 362550, "epoch": 2158} {"train_loss": -10.324472427368164, "global_step": 362551, "epoch": 2158} {"train_loss": -10.827873229980469, "global_step": 362552, "epoch": 2158} {"train_loss": -10.535873413085938, "global_step": 362553, "epoch": 2158} {"train_loss": -10.243712425231934, "global_step": 362554, "epoch": 2158} {"train_loss": -10.916046142578125, "global_step": 362555, "epoch": 2158} {"train_loss": -11.272497177124023, "global_step": 362556, "epoch": 2158} {"train_loss": -9.62457275390625, "global_step": 362557, "epoch": 2158} {"train_loss": -11.104146003723145, "global_step": 362558, "epoch": 2158} {"train_loss": -8.9086332321167, "global_step": 362559, "epoch": 2158} {"train_loss": -8.894878387451172, "global_step": 362560, "epoch": 2158} {"train_loss": -10.840545654296875, "global_step": 362561, "epoch": 2158} {"train_loss": -8.820490837097168, "global_step": 362562, "epoch": 2158} {"train_loss": -7.990367889404297, "global_step": 362563, "epoch": 2158} {"train_loss": -9.714584350585938, "global_step": 362564, "epoch": 2158} {"train_loss": -10.403539657592773, "global_step": 362565, "epoch": 2158} {"train_loss": -9.99354076385498, "global_step": 362566, "epoch": 2158} {"train_loss": -10.555231094360352, "global_step": 362567, "epoch": 2158} {"train_loss": -9.801920890808105, "global_step": 362568, "epoch": 2158} {"train_loss": -10.133326530456543, "global_step": 362569, "epoch": 2158} {"train_loss": -9.893275260925293, "global_step": 362570, "epoch": 2158} {"train_loss": -11.024075508117676, "global_step": 362571, "epoch": 2158} {"train_loss": -9.244487762451172, "global_step": 362572, "epoch": 2158} {"train_loss": -10.500053405761719, "global_step": 362573, "epoch": 2158} {"train_loss": -10.159049987792969, "global_step": 362574, "epoch": 2158} {"train_loss": -11.062677383422852, "global_step": 362575, "epoch": 2158} {"train_loss": -10.652018547058105, "global_step": 362576, "epoch": 2158} {"train_loss": -11.472237586975098, "global_step": 362577, "epoch": 2158} {"train_loss": -10.757753372192383, "global_step": 362578, "epoch": 2158} {"train_loss": -11.402438163757324, "global_step": 362579, "epoch": 2158} {"train_loss": -10.651304244995117, "global_step": 362580, "epoch": 2158} {"train_loss": -10.87187671661377, "global_step": 362581, "epoch": 2158} {"train_loss": -11.149600982666016, "global_step": 362582, "epoch": 2158} {"train_loss": -10.641107559204102, "global_step": 362583, "epoch": 2158} {"train_loss": -11.27994155883789, "global_step": 362584, "epoch": 2158} {"train_loss": -11.164030075073242, "global_step": 362585, "epoch": 2158} {"train_loss": -10.651491165161133, "global_step": 362586, "epoch": 2158} {"train_loss": -11.801909446716309, "global_step": 362587, "epoch": 2158} {"train_loss": -11.331685066223145, "global_step": 362588, "epoch": 2158} {"train_loss": -11.724222183227539, "global_step": 362589, "epoch": 2158} {"train_loss": -11.339073181152344, "global_step": 362590, "epoch": 2158} {"train_loss": -11.254548072814941, "global_step": 362591, "epoch": 2158} {"train_loss": -11.226607322692871, "global_step": 362592, "epoch": 2158} {"train_loss": -10.390915870666504, "global_step": 362593, "epoch": 2158} {"train_loss": -11.327156066894531, "global_step": 362594, "epoch": 2158} {"train_loss": -11.55350112915039, "global_step": 362595, "epoch": 2158} {"train_loss": -11.329182624816895, "global_step": 362596, "epoch": 2158} {"train_loss": -11.55494499206543, "global_step": 362597, "epoch": 2158} {"train_loss": -11.260370254516602, "global_step": 362598, "epoch": 2158} {"train_loss": -11.31796932220459, "global_step": 362599, "epoch": 2158} {"train_loss": -11.317852020263672, "global_step": 362600, "epoch": 2158} {"train_loss": -11.597574234008789, "global_step": 362601, "epoch": 2158} {"train_loss": -11.410367965698242, "global_step": 362602, "epoch": 2158} {"train_loss": -11.51846981048584, "global_step": 362603, "epoch": 2158} {"train_loss": -11.443106651306152, "global_step": 362604, "epoch": 2158} {"train_loss": -11.499532699584961, "global_step": 362605, "epoch": 2158} {"train_loss": -11.760683059692383, "global_step": 362606, "epoch": 2158} {"train_loss": -10.208553314208984, "global_step": 362607, "epoch": 2158} {"train_loss": -11.410100936889648, "global_step": 362608, "epoch": 2158} {"train_loss": -11.775529861450195, "global_step": 362609, "epoch": 2158} {"train_loss": -11.623458862304688, "global_step": 362610, "epoch": 2158} {"train_loss": -11.682475090026855, "global_step": 362611, "epoch": 2158} {"train_loss": -11.501214027404785, "global_step": 362612, "epoch": 2158} {"train_loss": -11.9317626953125, "global_step": 362613, "epoch": 2158} {"train_loss": -11.688718795776367, "global_step": 362614, "epoch": 2158} {"train_loss": -11.720090866088867, "global_step": 362615, "epoch": 2158} {"train_loss": -11.770196914672852, "global_step": 362616, "epoch": 2158} {"train_loss": -11.92785358428955, "global_step": 362617, "epoch": 2158} {"train_loss": -11.82565975189209, "global_step": 362618, "epoch": 2158} {"train_loss": -12.018594741821289, "global_step": 362619, "epoch": 2158} {"train_loss": -11.915484428405762, "global_step": 362620, "epoch": 2158} {"train_loss": -11.97055721282959, "global_step": 362621, "epoch": 2158} {"train_loss": -12.131569862365723, "global_step": 362622, "epoch": 2158} {"train_loss": -12.066427230834961, "global_step": 362623, "epoch": 2158} {"train_loss": -11.99305534362793, "global_step": 362624, "epoch": 2158} {"train_loss": -12.20387077331543, "global_step": 362625, "epoch": 2158} {"train_loss": -12.058547019958496, "global_step": 362626, "epoch": 2158} {"train_loss": -12.291227340698242, "global_step": 362627, "epoch": 2158} {"train_loss": -12.170782089233398, "global_step": 362628, "epoch": 2158} {"train_loss": -12.283191680908203, "global_step": 362629, "epoch": 2158} {"train_loss": -12.230648040771484, "global_step": 362630, "epoch": 2158} {"train_loss": -12.2767972946167, "global_step": 362631, "epoch": 2158} {"train_loss": -12.079574584960938, "global_step": 362632, "epoch": 2158} {"train_loss": -12.178753852844238, "global_step": 362633, "epoch": 2158} {"train_loss": -11.77161979675293, "global_step": 362634, "epoch": 2158} {"train_loss": -12.305065155029297, "global_step": 362635, "epoch": 2158} {"train_loss": -12.037616729736328, "global_step": 362636, "epoch": 2158} {"train_loss": -11.987451553344727, "global_step": 362637, "epoch": 2158} {"train_loss": -11.98349380493164, "global_step": 362638, "epoch": 2158} {"train_loss": -12.189962387084961, "global_step": 362639, "epoch": 2158} {"train_loss": -11.98327922821045, "global_step": 362640, "epoch": 2158} {"train_loss": -12.30555534362793, "global_step": 362641, "epoch": 2158} {"train_loss": -12.243155479431152, "global_step": 362642, "epoch": 2158} {"train_loss": -12.365402221679688, "global_step": 362643, "epoch": 2158} {"train_loss": -12.070329666137695, "global_step": 362644, "epoch": 2158} {"train_loss": -12.355506896972656, "global_step": 362645, "epoch": 2158} {"train_loss": -12.234306335449219, "global_step": 362646, "epoch": 2158} {"train_loss": -12.444315910339355, "global_step": 362647, "epoch": 2158} {"train_loss": -12.415678024291992, "global_step": 362648, "epoch": 2158} {"train_loss": -12.591239929199219, "global_step": 362649, "epoch": 2158} {"train_loss": -12.280448913574219, "global_step": 362650, "epoch": 2158} {"train_loss": -12.059111595153809, "global_step": 362651, "epoch": 2158} {"train_loss": -12.257640838623047, "global_step": 362652, "epoch": 2158} {"train_loss": -12.302284240722656, "global_step": 362653, "epoch": 2158} {"train_loss": -12.57072925567627, "global_step": 362654, "epoch": 2158} {"train_loss": -12.221109390258789, "global_step": 362655, "epoch": 2158} {"train_loss": -12.369922637939453, "global_step": 362656, "epoch": 2158} {"train_loss": -12.286458969116211, "global_step": 362657, "epoch": 2158} {"train_loss": -12.282773971557617, "global_step": 362658, "epoch": 2158} {"train_loss": -12.350290298461914, "global_step": 362659, "epoch": 2158} {"train_loss": -12.544537544250488, "global_step": 362660, "epoch": 2158} {"train_loss": -12.172547340393066, "global_step": 362661, "epoch": 2158} {"train_loss": -12.382304191589355, "global_step": 362662, "epoch": 2158} {"train_loss": -12.503395080566406, "global_step": 362663, "epoch": 2158} {"train_loss": -12.378663063049316, "global_step": 362664, "epoch": 2158} {"train_loss": -12.23031997680664, "global_step": 362665, "epoch": 2158} {"train_loss": -12.567676544189453, "global_step": 362666, "epoch": 2158} {"train_loss": -12.407478332519531, "global_step": 362667, "epoch": 2158} {"train_loss": -12.392937660217285, "global_step": 362668, "epoch": 2158} {"train_loss": -12.562103271484375, "global_step": 362669, "epoch": 2158} {"train_loss": -12.244707107543945, "global_step": 362670, "epoch": 2158} {"train_loss": -12.32990837097168, "global_step": 362671, "epoch": 2158} {"train_loss": -12.224031448364258, "global_step": 362672, "epoch": 2158} {"train_loss": -12.399665832519531, "global_step": 362673, "epoch": 2158} {"train_loss": -12.625911712646484, "global_step": 362674, "epoch": 2158} {"train_loss": -12.449706077575684, "global_step": 362675, "epoch": 2158} {"train_loss": -12.603690147399902, "global_step": 362676, "epoch": 2158} {"train_loss": -12.49637222290039, "global_step": 362677, "epoch": 2158} {"train_loss": -12.614744186401367, "global_step": 362678, "epoch": 2158} {"train_loss": -12.554070472717285, "global_step": 362679, "epoch": 2158} {"train_loss": -12.679037094116211, "global_step": 362680, "epoch": 2158} {"train_loss": -12.351083755493164, "global_step": 362681, "epoch": 2158} {"train_loss": -12.315563201904297, "global_step": 362682, "epoch": 2158} {"train_loss": -12.510148048400879, "global_step": 362683, "epoch": 2158} {"train_loss": -12.592472076416016, "global_step": 362684, "epoch": 2158} {"train_loss": -12.448880195617676, "global_step": 362685, "epoch": 2158} {"train_loss": -11.663914680480957, "global_step": 362686, "epoch": 2158} {"train_loss": -12.434074401855469, "global_step": 362687, "epoch": 2158} {"train_loss": -12.492915153503418, "global_step": 362688, "epoch": 2158} {"train_loss": -12.61895751953125, "global_step": 362689, "epoch": 2158} {"train_loss": -12.580131530761719, "global_step": 362690, "epoch": 2158} {"train_loss": -12.456757545471191, "global_step": 362691, "epoch": 2158} {"train_loss": -12.46573257446289, "global_step": 362692, "epoch": 2158} {"train_loss": -12.614912986755371, "global_step": 362693, "epoch": 2158} {"train_loss": -12.617502212524414, "global_step": 362694, "epoch": 2158} {"train_loss": -12.574044227600098, "global_step": 362695, "epoch": 2158} {"train_loss": -12.621613502502441, "global_step": 362696, "epoch": 2158} {"train_loss": -12.383589744567871, "global_step": 362697, "epoch": 2158} {"train_loss": -12.744810104370117, "global_step": 362698, "epoch": 2158} {"train_loss": -11.932588577270508, "global_step": 362699, "epoch": 2158} {"train_loss": -12.75555419921875, "global_step": 362700, "epoch": 2158} {"train_loss": -12.591075897216797, "global_step": 362701, "epoch": 2158} {"train_loss": -12.686702728271484, "global_step": 362702, "epoch": 2158} {"train_loss": -12.554935455322266, "global_step": 362703, "epoch": 2158} {"train_loss": -12.142436027526855, "global_step": 362704, "epoch": 2158} {"train_loss": -11.684700012207031, "global_step": 362705, "epoch": 2158} {"train_loss": -12.296477317810059, "global_step": 362706, "epoch": 2158} {"train_loss": -12.163458824157715, "global_step": 362707, "epoch": 2158} {"train_loss": -12.298457145690918, "global_step": 362708, "epoch": 2158} {"train_loss": -12.466747283935547, "global_step": 362709, "epoch": 2158} {"train_loss": -12.329904556274414, "global_step": 362710, "epoch": 2158} {"train_loss": -11.695830277034215, "global_step": 362711, "epoch": 2158, "val_loss": 290062.65625} {"train_loss": -12.513235092163086, "global_step": 362712, "epoch": 2159} {"train_loss": -12.549077033996582, "global_step": 362713, "epoch": 2159} {"train_loss": -11.96485710144043, "global_step": 362714, "epoch": 2159} {"train_loss": -10.407907485961914, "global_step": 362715, "epoch": 2159} {"train_loss": -10.516057968139648, "global_step": 362716, "epoch": 2159} {"train_loss": -11.583131790161133, "global_step": 362717, "epoch": 2159} {"train_loss": -11.131328582763672, "global_step": 362718, "epoch": 2159} {"train_loss": -9.150304794311523, "global_step": 362719, "epoch": 2159} {"train_loss": -8.936483383178711, "global_step": 362720, "epoch": 2159} {"train_loss": -8.70956802368164, "global_step": 362721, "epoch": 2159} {"train_loss": -10.458564758300781, "global_step": 362722, "epoch": 2159} {"train_loss": -10.02018928527832, "global_step": 362723, "epoch": 2159} {"train_loss": -9.222829818725586, "global_step": 362724, "epoch": 2159} {"train_loss": -11.417243957519531, "global_step": 362725, "epoch": 2159} {"train_loss": -9.784128189086914, "global_step": 362726, "epoch": 2159} {"train_loss": -10.23529052734375, "global_step": 362727, "epoch": 2159} {"train_loss": -10.414262771606445, "global_step": 362728, "epoch": 2159} {"train_loss": -10.448089599609375, "global_step": 362729, "epoch": 2159} {"train_loss": -10.084609031677246, "global_step": 362730, "epoch": 2159} {"train_loss": -11.157010078430176, "global_step": 362731, "epoch": 2159} {"train_loss": -9.962393760681152, "global_step": 362732, "epoch": 2159} {"train_loss": -9.633747100830078, "global_step": 362733, "epoch": 2159} {"train_loss": -10.482431411743164, "global_step": 362734, "epoch": 2159} {"train_loss": -8.814252853393555, "global_step": 362735, "epoch": 2159} {"train_loss": -9.259725570678711, "global_step": 362736, "epoch": 2159} {"train_loss": -10.342375755310059, "global_step": 362737, "epoch": 2159} {"train_loss": -9.938535690307617, "global_step": 362738, "epoch": 2159} {"train_loss": -9.563486099243164, "global_step": 362739, "epoch": 2159} {"train_loss": -8.906312942504883, "global_step": 362740, "epoch": 2159} {"train_loss": -9.406225204467773, "global_step": 362741, "epoch": 2159} {"train_loss": -10.360210418701172, "global_step": 362742, "epoch": 2159} {"train_loss": -11.1468505859375, "global_step": 362743, "epoch": 2159} {"train_loss": -10.005889892578125, "global_step": 362744, "epoch": 2159} {"train_loss": -10.982032775878906, "global_step": 362745, "epoch": 2159} {"train_loss": -10.575087547302246, "global_step": 362746, "epoch": 2159} {"train_loss": -10.525671005249023, "global_step": 362747, "epoch": 2159} {"train_loss": -10.87313175201416, "global_step": 362748, "epoch": 2159} {"train_loss": -9.93899917602539, "global_step": 362749, "epoch": 2159} {"train_loss": -10.594459533691406, "global_step": 362750, "epoch": 2159} {"train_loss": -10.962026596069336, "global_step": 362751, "epoch": 2159} {"train_loss": -10.796296119689941, "global_step": 362752, "epoch": 2159} {"train_loss": -11.05605411529541, "global_step": 362753, "epoch": 2159} {"train_loss": -11.211729049682617, "global_step": 362754, "epoch": 2159} {"train_loss": -10.585357666015625, "global_step": 362755, "epoch": 2159} {"train_loss": -11.810455322265625, "global_step": 362756, "epoch": 2159} {"train_loss": -11.0142822265625, "global_step": 362757, "epoch": 2159} {"train_loss": -11.785430908203125, "global_step": 362758, "epoch": 2159} {"train_loss": -11.396843910217285, "global_step": 362759, "epoch": 2159} {"train_loss": -11.70329761505127, "global_step": 362760, "epoch": 2159} {"train_loss": -11.751448631286621, "global_step": 362761, "epoch": 2159} {"train_loss": -11.481695175170898, "global_step": 362762, "epoch": 2159} {"train_loss": -11.92434310913086, "global_step": 362763, "epoch": 2159} {"train_loss": -11.603386878967285, "global_step": 362764, "epoch": 2159} {"train_loss": -11.67558479309082, "global_step": 362765, "epoch": 2159} {"train_loss": -11.691715240478516, "global_step": 362766, "epoch": 2159} {"train_loss": -11.950372695922852, "global_step": 362767, "epoch": 2159} {"train_loss": -12.008320808410645, "global_step": 362768, "epoch": 2159} {"train_loss": -11.978713989257812, "global_step": 362769, "epoch": 2159} {"train_loss": -11.816370010375977, "global_step": 362770, "epoch": 2159} {"train_loss": -11.979930877685547, "global_step": 362771, "epoch": 2159} {"train_loss": -12.056136131286621, "global_step": 362772, "epoch": 2159} {"train_loss": -12.092670440673828, "global_step": 362773, "epoch": 2159} {"train_loss": -12.144054412841797, "global_step": 362774, "epoch": 2159} {"train_loss": -12.045705795288086, "global_step": 362775, "epoch": 2159} {"train_loss": -12.22073745727539, "global_step": 362776, "epoch": 2159} {"train_loss": -12.092900276184082, "global_step": 362777, "epoch": 2159} {"train_loss": -11.687931060791016, "global_step": 362778, "epoch": 2159} {"train_loss": -12.080713272094727, "global_step": 362779, "epoch": 2159} {"train_loss": -12.225594520568848, "global_step": 362780, "epoch": 2159} {"train_loss": -12.108756065368652, "global_step": 362781, "epoch": 2159} {"train_loss": -12.145763397216797, "global_step": 362782, "epoch": 2159} {"train_loss": -12.012907028198242, "global_step": 362783, "epoch": 2159} {"train_loss": -12.040550231933594, "global_step": 362784, "epoch": 2159} {"train_loss": -12.10204792022705, "global_step": 362785, "epoch": 2159} {"train_loss": -12.074413299560547, "global_step": 362786, "epoch": 2159} {"train_loss": -12.16903018951416, "global_step": 362787, "epoch": 2159} {"train_loss": -12.103455543518066, "global_step": 362788, "epoch": 2159} {"train_loss": -12.294934272766113, "global_step": 362789, "epoch": 2159} {"train_loss": -12.24171257019043, "global_step": 362790, "epoch": 2159} {"train_loss": -12.443708419799805, "global_step": 362791, "epoch": 2159} {"train_loss": -12.157709121704102, "global_step": 362792, "epoch": 2159} {"train_loss": -12.047630310058594, "global_step": 362793, "epoch": 2159} {"train_loss": -12.299445152282715, "global_step": 362794, "epoch": 2159} {"train_loss": -12.1806001663208, "global_step": 362795, "epoch": 2159} {"train_loss": -12.295504570007324, "global_step": 362796, "epoch": 2159} {"train_loss": -12.193050384521484, "global_step": 362797, "epoch": 2159} {"train_loss": -12.167169570922852, "global_step": 362798, "epoch": 2159} {"train_loss": -12.275819778442383, "global_step": 362799, "epoch": 2159} {"train_loss": -12.26711368560791, "global_step": 362800, "epoch": 2159} {"train_loss": -12.382915496826172, "global_step": 362801, "epoch": 2159} {"train_loss": -12.295719146728516, "global_step": 362802, "epoch": 2159} {"train_loss": -12.244733810424805, "global_step": 362803, "epoch": 2159} {"train_loss": -12.3916654586792, "global_step": 362804, "epoch": 2159} {"train_loss": -12.362384796142578, "global_step": 362805, "epoch": 2159} {"train_loss": -12.389214515686035, "global_step": 362806, "epoch": 2159} {"train_loss": -12.31129264831543, "global_step": 362807, "epoch": 2159} {"train_loss": -12.636466979980469, "global_step": 362808, "epoch": 2159} {"train_loss": -12.275691986083984, "global_step": 362809, "epoch": 2159} {"train_loss": -12.231191635131836, "global_step": 362810, "epoch": 2159} {"train_loss": -12.298391342163086, "global_step": 362811, "epoch": 2159} {"train_loss": -12.236602783203125, "global_step": 362812, "epoch": 2159} {"train_loss": -12.3768892288208, "global_step": 362813, "epoch": 2159} {"train_loss": -12.20101547241211, "global_step": 362814, "epoch": 2159} {"train_loss": -12.194464683532715, "global_step": 362815, "epoch": 2159} {"train_loss": -11.958305358886719, "global_step": 362816, "epoch": 2159} {"train_loss": -12.250822067260742, "global_step": 362817, "epoch": 2159} {"train_loss": -11.767345428466797, "global_step": 362818, "epoch": 2159} {"train_loss": -12.470216751098633, "global_step": 362819, "epoch": 2159} {"train_loss": -12.03132438659668, "global_step": 362820, "epoch": 2159} {"train_loss": -12.037696838378906, "global_step": 362821, "epoch": 2159} {"train_loss": -12.218335151672363, "global_step": 362822, "epoch": 2159} {"train_loss": -12.172847747802734, "global_step": 362823, "epoch": 2159} {"train_loss": -11.961465835571289, "global_step": 362824, "epoch": 2159} {"train_loss": -12.340719223022461, "global_step": 362825, "epoch": 2159} {"train_loss": -12.369014739990234, "global_step": 362826, "epoch": 2159} {"train_loss": -11.651180267333984, "global_step": 362827, "epoch": 2159} {"train_loss": -12.279069900512695, "global_step": 362828, "epoch": 2159} {"train_loss": -12.150819778442383, "global_step": 362829, "epoch": 2159} {"train_loss": -12.317659378051758, "global_step": 362830, "epoch": 2159} {"train_loss": -12.417095184326172, "global_step": 362831, "epoch": 2159} {"train_loss": -12.440917015075684, "global_step": 362832, "epoch": 2159} {"train_loss": -12.37759017944336, "global_step": 362833, "epoch": 2159} {"train_loss": -12.28256607055664, "global_step": 362834, "epoch": 2159} {"train_loss": -12.246683120727539, "global_step": 362835, "epoch": 2159} {"train_loss": -12.204730987548828, "global_step": 362836, "epoch": 2159} {"train_loss": -12.059244155883789, "global_step": 362837, "epoch": 2159} {"train_loss": -12.276213645935059, "global_step": 362838, "epoch": 2159} {"train_loss": -12.152702331542969, "global_step": 362839, "epoch": 2159} {"train_loss": -11.299888610839844, "global_step": 362840, "epoch": 2159} {"train_loss": -12.334076881408691, "global_step": 362841, "epoch": 2159} {"train_loss": -11.695634841918945, "global_step": 362842, "epoch": 2159} {"train_loss": -11.960775375366211, "global_step": 362843, "epoch": 2159} {"train_loss": -12.201294898986816, "global_step": 362844, "epoch": 2159} {"train_loss": -11.532041549682617, "global_step": 362845, "epoch": 2159} {"train_loss": -12.186479568481445, "global_step": 362846, "epoch": 2159} {"train_loss": -11.740039825439453, "global_step": 362847, "epoch": 2159} {"train_loss": -11.884215354919434, "global_step": 362848, "epoch": 2159} {"train_loss": -11.332959175109863, "global_step": 362849, "epoch": 2159} {"train_loss": -12.133325576782227, "global_step": 362850, "epoch": 2159} {"train_loss": -11.452108383178711, "global_step": 362851, "epoch": 2159} {"train_loss": -12.16253662109375, "global_step": 362852, "epoch": 2159} {"train_loss": -11.899572372436523, "global_step": 362853, "epoch": 2159} {"train_loss": -12.346927642822266, "global_step": 362854, "epoch": 2159} {"train_loss": -11.83489990234375, "global_step": 362855, "epoch": 2159} {"train_loss": -12.303643226623535, "global_step": 362856, "epoch": 2159} {"train_loss": -12.166069030761719, "global_step": 362857, "epoch": 2159} {"train_loss": -12.130815505981445, "global_step": 362858, "epoch": 2159} {"train_loss": -12.369905471801758, "global_step": 362859, "epoch": 2159} {"train_loss": -12.13499641418457, "global_step": 362860, "epoch": 2159} {"train_loss": -12.428661346435547, "global_step": 362861, "epoch": 2159} {"train_loss": -12.23235034942627, "global_step": 362862, "epoch": 2159} {"train_loss": -12.341798782348633, "global_step": 362863, "epoch": 2159} {"train_loss": -12.28266716003418, "global_step": 362864, "epoch": 2159} {"train_loss": -12.084059715270996, "global_step": 362865, "epoch": 2159} {"train_loss": -12.072168350219727, "global_step": 362866, "epoch": 2159} {"train_loss": -12.402769088745117, "global_step": 362867, "epoch": 2159} {"train_loss": -11.474264144897461, "global_step": 362868, "epoch": 2159} {"train_loss": -12.204309463500977, "global_step": 362869, "epoch": 2159} {"train_loss": -12.291464805603027, "global_step": 362870, "epoch": 2159} {"train_loss": -11.897014617919922, "global_step": 362871, "epoch": 2159} {"train_loss": -12.093266487121582, "global_step": 362872, "epoch": 2159} {"train_loss": -11.872503280639648, "global_step": 362873, "epoch": 2159} {"train_loss": -12.14645004272461, "global_step": 362874, "epoch": 2159} {"train_loss": -12.176819801330566, "global_step": 362875, "epoch": 2159} {"train_loss": -12.42366886138916, "global_step": 362876, "epoch": 2159} {"train_loss": -11.895829200744629, "global_step": 362877, "epoch": 2159} {"train_loss": -12.180868148803711, "global_step": 362878, "epoch": 2159} {"train_loss": -11.6393525713966, "global_step": 362879, "epoch": 2159, "val_loss": 287682.3125} {"train_loss": -12.255136489868164, "global_step": 362880, "epoch": 2160} {"train_loss": -11.4586181640625, "global_step": 362881, "epoch": 2160} {"train_loss": -11.610591888427734, "global_step": 362882, "epoch": 2160} {"train_loss": -11.189008712768555, "global_step": 362883, "epoch": 2160} {"train_loss": -11.329397201538086, "global_step": 362884, "epoch": 2160} {"train_loss": -11.568248748779297, "global_step": 362885, "epoch": 2160} {"train_loss": -11.752272605895996, "global_step": 362886, "epoch": 2160} {"train_loss": -11.24061393737793, "global_step": 362887, "epoch": 2160} {"train_loss": -11.239424705505371, "global_step": 362888, "epoch": 2160} {"train_loss": -10.087945938110352, "global_step": 362889, "epoch": 2160} {"train_loss": -10.203025817871094, "global_step": 362890, "epoch": 2160} {"train_loss": -11.161554336547852, "global_step": 362891, "epoch": 2160} {"train_loss": -10.860445022583008, "global_step": 362892, "epoch": 2160} {"train_loss": -11.856060981750488, "global_step": 362893, "epoch": 2160} {"train_loss": -10.792200088500977, "global_step": 362894, "epoch": 2160} {"train_loss": -11.21082592010498, "global_step": 362895, "epoch": 2160} {"train_loss": -11.438326835632324, "global_step": 362896, "epoch": 2160} {"train_loss": -11.164594650268555, "global_step": 362897, "epoch": 2160} {"train_loss": -11.654651641845703, "global_step": 362898, "epoch": 2160} {"train_loss": -10.677289962768555, "global_step": 362899, "epoch": 2160} {"train_loss": -12.245606422424316, "global_step": 362900, "epoch": 2160} {"train_loss": -11.640005111694336, "global_step": 362901, "epoch": 2160} {"train_loss": -11.842119216918945, "global_step": 362902, "epoch": 2160} {"train_loss": -11.255865097045898, "global_step": 362903, "epoch": 2160} {"train_loss": -12.107359886169434, "global_step": 362904, "epoch": 2160} {"train_loss": -10.930960655212402, "global_step": 362905, "epoch": 2160} {"train_loss": -11.670064926147461, "global_step": 362906, "epoch": 2160} {"train_loss": -11.486700057983398, "global_step": 362907, "epoch": 2160} {"train_loss": -12.059332847595215, "global_step": 362908, "epoch": 2160} {"train_loss": -11.542911529541016, "global_step": 362909, "epoch": 2160} {"train_loss": -12.200847625732422, "global_step": 362910, "epoch": 2160} {"train_loss": -11.339239120483398, "global_step": 362911, "epoch": 2160} {"train_loss": -11.735469818115234, "global_step": 362912, "epoch": 2160} {"train_loss": -11.57241153717041, "global_step": 362913, "epoch": 2160} {"train_loss": -11.747167587280273, "global_step": 362914, "epoch": 2160} {"train_loss": -11.683916091918945, "global_step": 362915, "epoch": 2160} {"train_loss": -11.44876766204834, "global_step": 362916, "epoch": 2160} {"train_loss": -11.985774993896484, "global_step": 362917, "epoch": 2160} {"train_loss": -11.30337905883789, "global_step": 362918, "epoch": 2160} {"train_loss": -12.014457702636719, "global_step": 362919, "epoch": 2160} {"train_loss": -11.433465957641602, "global_step": 362920, "epoch": 2160} {"train_loss": -11.75794792175293, "global_step": 362921, "epoch": 2160} {"train_loss": -11.912906646728516, "global_step": 362922, "epoch": 2160} {"train_loss": -11.0235595703125, "global_step": 362923, "epoch": 2160} {"train_loss": -11.413252830505371, "global_step": 362924, "epoch": 2160} {"train_loss": -11.452043533325195, "global_step": 362925, "epoch": 2160} {"train_loss": -11.675506591796875, "global_step": 362926, "epoch": 2160} {"train_loss": -10.876493453979492, "global_step": 362927, "epoch": 2160} {"train_loss": -11.369882583618164, "global_step": 362928, "epoch": 2160} {"train_loss": -10.32127571105957, "global_step": 362929, "epoch": 2160} {"train_loss": -10.91080093383789, "global_step": 362930, "epoch": 2160} {"train_loss": -11.56888198852539, "global_step": 362931, "epoch": 2160} {"train_loss": -9.436273574829102, "global_step": 362932, "epoch": 2160} {"train_loss": -10.441890716552734, "global_step": 362933, "epoch": 2160} {"train_loss": -10.957691192626953, "global_step": 362934, "epoch": 2160} {"train_loss": -10.777644157409668, "global_step": 362935, "epoch": 2160} {"train_loss": -11.009740829467773, "global_step": 362936, "epoch": 2160} {"train_loss": -10.844213485717773, "global_step": 362937, "epoch": 2160} {"train_loss": -11.248943328857422, "global_step": 362938, "epoch": 2160} {"train_loss": -10.948043823242188, "global_step": 362939, "epoch": 2160} {"train_loss": -11.763265609741211, "global_step": 362940, "epoch": 2160} {"train_loss": -11.056537628173828, "global_step": 362941, "epoch": 2160} {"train_loss": -11.670394897460938, "global_step": 362942, "epoch": 2160} {"train_loss": -11.499135971069336, "global_step": 362943, "epoch": 2160} {"train_loss": -11.590262413024902, "global_step": 362944, "epoch": 2160} {"train_loss": -11.882169723510742, "global_step": 362945, "epoch": 2160} {"train_loss": -11.347286224365234, "global_step": 362946, "epoch": 2160} {"train_loss": -11.893007278442383, "global_step": 362947, "epoch": 2160} {"train_loss": -11.878588676452637, "global_step": 362948, "epoch": 2160} {"train_loss": -11.644171714782715, "global_step": 362949, "epoch": 2160} {"train_loss": -11.99747085571289, "global_step": 362950, "epoch": 2160} {"train_loss": -11.339807510375977, "global_step": 362951, "epoch": 2160} {"train_loss": -11.479727745056152, "global_step": 362952, "epoch": 2160} {"train_loss": -11.47264289855957, "global_step": 362953, "epoch": 2160} {"train_loss": -11.043718338012695, "global_step": 362954, "epoch": 2160} {"train_loss": -11.690828323364258, "global_step": 362955, "epoch": 2160} {"train_loss": -11.606470108032227, "global_step": 362956, "epoch": 2160} {"train_loss": -11.811380386352539, "global_step": 362957, "epoch": 2160} {"train_loss": -11.882336616516113, "global_step": 362958, "epoch": 2160} {"train_loss": -11.54574966430664, "global_step": 362959, "epoch": 2160} {"train_loss": -11.615620613098145, "global_step": 362960, "epoch": 2160} {"train_loss": -11.890140533447266, "global_step": 362961, "epoch": 2160} {"train_loss": -12.052428245544434, "global_step": 362962, "epoch": 2160} {"train_loss": -11.788647651672363, "global_step": 362963, "epoch": 2160} {"train_loss": -11.50943374633789, "global_step": 362964, "epoch": 2160} {"train_loss": -11.79709529876709, "global_step": 362965, "epoch": 2160} {"train_loss": -11.929056167602539, "global_step": 362966, "epoch": 2160} {"train_loss": -11.94234848022461, "global_step": 362967, "epoch": 2160} {"train_loss": -12.139835357666016, "global_step": 362968, "epoch": 2160} {"train_loss": -12.2133150100708, "global_step": 362969, "epoch": 2160} {"train_loss": -12.026885032653809, "global_step": 362970, "epoch": 2160} {"train_loss": -12.133764266967773, "global_step": 362971, "epoch": 2160} {"train_loss": -12.083524703979492, "global_step": 362972, "epoch": 2160} {"train_loss": -12.165757179260254, "global_step": 362973, "epoch": 2160} {"train_loss": -12.191200256347656, "global_step": 362974, "epoch": 2160} {"train_loss": -12.298826217651367, "global_step": 362975, "epoch": 2160} {"train_loss": -12.143260955810547, "global_step": 362976, "epoch": 2160} {"train_loss": -12.25583267211914, "global_step": 362977, "epoch": 2160} {"train_loss": -12.310274124145508, "global_step": 362978, "epoch": 2160} {"train_loss": -12.122365951538086, "global_step": 362979, "epoch": 2160} {"train_loss": -12.258346557617188, "global_step": 362980, "epoch": 2160} {"train_loss": -12.180570602416992, "global_step": 362981, "epoch": 2160} {"train_loss": -12.392884254455566, "global_step": 362982, "epoch": 2160} {"train_loss": -11.665940284729004, "global_step": 362983, "epoch": 2160} {"train_loss": -12.116289138793945, "global_step": 362984, "epoch": 2160} {"train_loss": -11.922407150268555, "global_step": 362985, "epoch": 2160} {"train_loss": -12.235294342041016, "global_step": 362986, "epoch": 2160} {"train_loss": -12.174825668334961, "global_step": 362987, "epoch": 2160} {"train_loss": -11.886631965637207, "global_step": 362988, "epoch": 2160} {"train_loss": -12.105391502380371, "global_step": 362989, "epoch": 2160} {"train_loss": -12.039257049560547, "global_step": 362990, "epoch": 2160} {"train_loss": -12.465457916259766, "global_step": 362991, "epoch": 2160} {"train_loss": -12.099990844726562, "global_step": 362992, "epoch": 2160} {"train_loss": -12.405510902404785, "global_step": 362993, "epoch": 2160} {"train_loss": -12.048856735229492, "global_step": 362994, "epoch": 2160} {"train_loss": -11.911097526550293, "global_step": 362995, "epoch": 2160} {"train_loss": -12.225174903869629, "global_step": 362996, "epoch": 2160} {"train_loss": -11.85694694519043, "global_step": 362997, "epoch": 2160} {"train_loss": -12.229211807250977, "global_step": 362998, "epoch": 2160} {"train_loss": -12.173006057739258, "global_step": 362999, "epoch": 2160} {"train_loss": -12.20602035522461, "global_step": 363000, "epoch": 2160} {"train_loss": -12.168655395507812, "global_step": 363001, "epoch": 2160} {"train_loss": -12.175630569458008, "global_step": 363002, "epoch": 2160} {"train_loss": -12.344107627868652, "global_step": 363003, "epoch": 2160} {"train_loss": -12.256561279296875, "global_step": 363004, "epoch": 2160} {"train_loss": -12.50167465209961, "global_step": 363005, "epoch": 2160} {"train_loss": -12.189680099487305, "global_step": 363006, "epoch": 2160} {"train_loss": -12.186887741088867, "global_step": 363007, "epoch": 2160} {"train_loss": -12.191032409667969, "global_step": 363008, "epoch": 2160} {"train_loss": -12.536039352416992, "global_step": 363009, "epoch": 2160} {"train_loss": -12.272377967834473, "global_step": 363010, "epoch": 2160} {"train_loss": -11.794954299926758, "global_step": 363011, "epoch": 2160} {"train_loss": -12.583974838256836, "global_step": 363012, "epoch": 2160} {"train_loss": -11.908712387084961, "global_step": 363013, "epoch": 2160} {"train_loss": -12.319671630859375, "global_step": 363014, "epoch": 2160} {"train_loss": -12.236358642578125, "global_step": 363015, "epoch": 2160} {"train_loss": -11.937309265136719, "global_step": 363016, "epoch": 2160} {"train_loss": -12.443626403808594, "global_step": 363017, "epoch": 2160} {"train_loss": -11.879642486572266, "global_step": 363018, "epoch": 2160} {"train_loss": -12.209105491638184, "global_step": 363019, "epoch": 2160} {"train_loss": -11.920623779296875, "global_step": 363020, "epoch": 2160} {"train_loss": -12.248550415039062, "global_step": 363021, "epoch": 2160} {"train_loss": -12.24227523803711, "global_step": 363022, "epoch": 2160} {"train_loss": -12.153764724731445, "global_step": 363023, "epoch": 2160} {"train_loss": -12.218132972717285, "global_step": 363024, "epoch": 2160} {"train_loss": -12.229276657104492, "global_step": 363025, "epoch": 2160} {"train_loss": -11.991107940673828, "global_step": 363026, "epoch": 2160} {"train_loss": -12.50448226928711, "global_step": 363027, "epoch": 2160} {"train_loss": -12.121657371520996, "global_step": 363028, "epoch": 2160} {"train_loss": -12.321557998657227, "global_step": 363029, "epoch": 2160} {"train_loss": -12.245403289794922, "global_step": 363030, "epoch": 2160} {"train_loss": -12.638378143310547, "global_step": 363031, "epoch": 2160} {"train_loss": -12.032279014587402, "global_step": 363032, "epoch": 2160} {"train_loss": -12.48282241821289, "global_step": 363033, "epoch": 2160} {"train_loss": -12.065181732177734, "global_step": 363034, "epoch": 2160} {"train_loss": -12.181658744812012, "global_step": 363035, "epoch": 2160} {"train_loss": -11.96119213104248, "global_step": 363036, "epoch": 2160} {"train_loss": -12.594522476196289, "global_step": 363037, "epoch": 2160} {"train_loss": -12.181514739990234, "global_step": 363038, "epoch": 2160} {"train_loss": -12.022306442260742, "global_step": 363039, "epoch": 2160} {"train_loss": -12.422967910766602, "global_step": 363040, "epoch": 2160} {"train_loss": -12.436922073364258, "global_step": 363041, "epoch": 2160} {"train_loss": -12.452310562133789, "global_step": 363042, "epoch": 2160} {"train_loss": -12.502547264099121, "global_step": 363043, "epoch": 2160} {"train_loss": -11.877565383911133, "global_step": 363044, "epoch": 2160} {"train_loss": -12.140838623046875, "global_step": 363045, "epoch": 2160} {"train_loss": -12.282855033874512, "global_step": 363046, "epoch": 2160} {"train_loss": -11.796652504376002, "global_step": 363047, "epoch": 2160, "val_loss": 292834.375, "train_action_mse_error": 2.142782211303711} {"train_loss": -11.287802696228027, "global_step": 363048, "epoch": 2161} {"train_loss": -12.299398422241211, "global_step": 363049, "epoch": 2161} {"train_loss": -11.18591022491455, "global_step": 363050, "epoch": 2161} {"train_loss": -11.23538589477539, "global_step": 363051, "epoch": 2161} {"train_loss": -12.087512016296387, "global_step": 363052, "epoch": 2161} {"train_loss": -11.72962760925293, "global_step": 363053, "epoch": 2161} {"train_loss": -11.30203914642334, "global_step": 363054, "epoch": 2161} {"train_loss": -12.263771057128906, "global_step": 363055, "epoch": 2161} {"train_loss": -12.38409423828125, "global_step": 363056, "epoch": 2161} {"train_loss": -11.75847339630127, "global_step": 363057, "epoch": 2161} {"train_loss": -12.556044578552246, "global_step": 363058, "epoch": 2161} {"train_loss": -12.186683654785156, "global_step": 363059, "epoch": 2161} {"train_loss": -12.331758499145508, "global_step": 363060, "epoch": 2161} {"train_loss": -12.39120101928711, "global_step": 363061, "epoch": 2161} {"train_loss": -12.153221130371094, "global_step": 363062, "epoch": 2161} {"train_loss": -12.565399169921875, "global_step": 363063, "epoch": 2161} {"train_loss": -12.372682571411133, "global_step": 363064, "epoch": 2161} {"train_loss": -12.298175811767578, "global_step": 363065, "epoch": 2161} {"train_loss": -12.52824592590332, "global_step": 363066, "epoch": 2161} {"train_loss": -12.302759170532227, "global_step": 363067, "epoch": 2161} {"train_loss": -12.066022872924805, "global_step": 363068, "epoch": 2161} {"train_loss": -12.52824592590332, "global_step": 363069, "epoch": 2161} {"train_loss": -12.326062202453613, "global_step": 363070, "epoch": 2161} {"train_loss": -12.054347038269043, "global_step": 363071, "epoch": 2161} {"train_loss": -12.55311393737793, "global_step": 363072, "epoch": 2161} {"train_loss": -12.296734809875488, "global_step": 363073, "epoch": 2161} {"train_loss": -12.645973205566406, "global_step": 363074, "epoch": 2161} {"train_loss": -12.47157096862793, "global_step": 363075, "epoch": 2161} {"train_loss": -12.608133316040039, "global_step": 363076, "epoch": 2161} {"train_loss": -12.232150077819824, "global_step": 363077, "epoch": 2161} {"train_loss": -12.427400588989258, "global_step": 363078, "epoch": 2161} {"train_loss": -12.129731178283691, "global_step": 363079, "epoch": 2161} {"train_loss": -12.346599578857422, "global_step": 363080, "epoch": 2161} {"train_loss": -12.216145515441895, "global_step": 363081, "epoch": 2161} {"train_loss": -12.416288375854492, "global_step": 363082, "epoch": 2161} {"train_loss": -12.088945388793945, "global_step": 363083, "epoch": 2161} {"train_loss": -12.266864776611328, "global_step": 363084, "epoch": 2161} {"train_loss": -11.92741584777832, "global_step": 363085, "epoch": 2161} {"train_loss": -11.379335403442383, "global_step": 363086, "epoch": 2161} {"train_loss": -12.032432556152344, "global_step": 363087, "epoch": 2161} {"train_loss": -11.922449111938477, "global_step": 363088, "epoch": 2161} {"train_loss": -11.159462928771973, "global_step": 363089, "epoch": 2161} {"train_loss": -12.166455268859863, "global_step": 363090, "epoch": 2161} {"train_loss": -11.494308471679688, "global_step": 363091, "epoch": 2161} {"train_loss": -12.263324737548828, "global_step": 363092, "epoch": 2161} {"train_loss": -11.550275802612305, "global_step": 363093, "epoch": 2161} {"train_loss": -12.66706657409668, "global_step": 363094, "epoch": 2161} {"train_loss": -11.914761543273926, "global_step": 363095, "epoch": 2161} {"train_loss": -12.417596817016602, "global_step": 363096, "epoch": 2161} {"train_loss": -11.875877380371094, "global_step": 363097, "epoch": 2161} {"train_loss": -12.26806640625, "global_step": 363098, "epoch": 2161} {"train_loss": -12.004716873168945, "global_step": 363099, "epoch": 2161} {"train_loss": -11.853530883789062, "global_step": 363100, "epoch": 2161} {"train_loss": -11.645262718200684, "global_step": 363101, "epoch": 2161} {"train_loss": -12.536396026611328, "global_step": 363102, "epoch": 2161} {"train_loss": -12.345004081726074, "global_step": 363103, "epoch": 2161} {"train_loss": -11.529890060424805, "global_step": 363104, "epoch": 2161} {"train_loss": -11.815765380859375, "global_step": 363105, "epoch": 2161} {"train_loss": -11.900214195251465, "global_step": 363106, "epoch": 2161} {"train_loss": -11.265195846557617, "global_step": 363107, "epoch": 2161} {"train_loss": -12.240274429321289, "global_step": 363108, "epoch": 2161} {"train_loss": -11.606468200683594, "global_step": 363109, "epoch": 2161} {"train_loss": -11.368854522705078, "global_step": 363110, "epoch": 2161} {"train_loss": -11.818668365478516, "global_step": 363111, "epoch": 2161} {"train_loss": -12.211589813232422, "global_step": 363112, "epoch": 2161} {"train_loss": -12.300296783447266, "global_step": 363113, "epoch": 2161} {"train_loss": -11.813220977783203, "global_step": 363114, "epoch": 2161} {"train_loss": -12.082620620727539, "global_step": 363115, "epoch": 2161} {"train_loss": -12.091031074523926, "global_step": 363116, "epoch": 2161} {"train_loss": -12.439291000366211, "global_step": 363117, "epoch": 2161} {"train_loss": -11.559661865234375, "global_step": 363118, "epoch": 2161} {"train_loss": -12.567374229431152, "global_step": 363119, "epoch": 2161} {"train_loss": -11.392461776733398, "global_step": 363120, "epoch": 2161} {"train_loss": -12.086594581604004, "global_step": 363121, "epoch": 2161} {"train_loss": -11.852411270141602, "global_step": 363122, "epoch": 2161} {"train_loss": -12.02659797668457, "global_step": 363123, "epoch": 2161} {"train_loss": -11.785490989685059, "global_step": 363124, "epoch": 2161} {"train_loss": -12.341618537902832, "global_step": 363125, "epoch": 2161} {"train_loss": -12.24404525756836, "global_step": 363126, "epoch": 2161} {"train_loss": -11.874837875366211, "global_step": 363127, "epoch": 2161} {"train_loss": -12.079959869384766, "global_step": 363128, "epoch": 2161} {"train_loss": -12.224811553955078, "global_step": 363129, "epoch": 2161} {"train_loss": -11.896356582641602, "global_step": 363130, "epoch": 2161} {"train_loss": -12.06696605682373, "global_step": 363131, "epoch": 2161} {"train_loss": -11.789587020874023, "global_step": 363132, "epoch": 2161} {"train_loss": -11.664290428161621, "global_step": 363133, "epoch": 2161} {"train_loss": -11.671698570251465, "global_step": 363134, "epoch": 2161} {"train_loss": -12.432039260864258, "global_step": 363135, "epoch": 2161} {"train_loss": -11.22348403930664, "global_step": 363136, "epoch": 2161} {"train_loss": -10.905643463134766, "global_step": 363137, "epoch": 2161} {"train_loss": -11.125213623046875, "global_step": 363138, "epoch": 2161} {"train_loss": -11.957540512084961, "global_step": 363139, "epoch": 2161} {"train_loss": -11.507770538330078, "global_step": 363140, "epoch": 2161} {"train_loss": -11.789413452148438, "global_step": 363141, "epoch": 2161} {"train_loss": -12.003925323486328, "global_step": 363142, "epoch": 2161} {"train_loss": -12.174001693725586, "global_step": 363143, "epoch": 2161} {"train_loss": -11.97219467163086, "global_step": 363144, "epoch": 2161} {"train_loss": -11.853511810302734, "global_step": 363145, "epoch": 2161} {"train_loss": -11.752679824829102, "global_step": 363146, "epoch": 2161} {"train_loss": -11.876805305480957, "global_step": 363147, "epoch": 2161} {"train_loss": -11.860597610473633, "global_step": 363148, "epoch": 2161} {"train_loss": -11.621450424194336, "global_step": 363149, "epoch": 2161} {"train_loss": -12.139328002929688, "global_step": 363150, "epoch": 2161} {"train_loss": -11.750702857971191, "global_step": 363151, "epoch": 2161} {"train_loss": -11.945475578308105, "global_step": 363152, "epoch": 2161} {"train_loss": -12.134332656860352, "global_step": 363153, "epoch": 2161} {"train_loss": -11.57416820526123, "global_step": 363154, "epoch": 2161} {"train_loss": -12.300015449523926, "global_step": 363155, "epoch": 2161} {"train_loss": -11.955810546875, "global_step": 363156, "epoch": 2161} {"train_loss": -11.872514724731445, "global_step": 363157, "epoch": 2161} {"train_loss": -12.105634689331055, "global_step": 363158, "epoch": 2161} {"train_loss": -12.271069526672363, "global_step": 363159, "epoch": 2161} {"train_loss": -12.370869636535645, "global_step": 363160, "epoch": 2161} {"train_loss": -12.058160781860352, "global_step": 363161, "epoch": 2161} {"train_loss": -12.389049530029297, "global_step": 363162, "epoch": 2161} {"train_loss": -12.110053062438965, "global_step": 363163, "epoch": 2161} {"train_loss": -12.297416687011719, "global_step": 363164, "epoch": 2161} {"train_loss": -12.307901382446289, "global_step": 363165, "epoch": 2161} {"train_loss": -12.151388168334961, "global_step": 363166, "epoch": 2161} {"train_loss": -12.311111450195312, "global_step": 363167, "epoch": 2161} {"train_loss": -12.296945571899414, "global_step": 363168, "epoch": 2161} {"train_loss": -12.28923225402832, "global_step": 363169, "epoch": 2161} {"train_loss": -12.030510902404785, "global_step": 363170, "epoch": 2161} {"train_loss": -12.25947380065918, "global_step": 363171, "epoch": 2161} {"train_loss": -12.334061622619629, "global_step": 363172, "epoch": 2161} {"train_loss": -12.371330261230469, "global_step": 363173, "epoch": 2161} {"train_loss": -12.204331398010254, "global_step": 363174, "epoch": 2161} {"train_loss": -12.555049896240234, "global_step": 363175, "epoch": 2161} {"train_loss": -12.586012840270996, "global_step": 363176, "epoch": 2161} {"train_loss": -12.371810913085938, "global_step": 363177, "epoch": 2161} {"train_loss": -12.391740798950195, "global_step": 363178, "epoch": 2161} {"train_loss": -12.249617576599121, "global_step": 363179, "epoch": 2161} {"train_loss": -12.21234130859375, "global_step": 363180, "epoch": 2161} {"train_loss": -12.113656044006348, "global_step": 363181, "epoch": 2161} {"train_loss": -12.562965393066406, "global_step": 363182, "epoch": 2161} {"train_loss": -12.259725570678711, "global_step": 363183, "epoch": 2161} {"train_loss": -12.443920135498047, "global_step": 363184, "epoch": 2161} {"train_loss": -12.055784225463867, "global_step": 363185, "epoch": 2161} {"train_loss": -12.119523048400879, "global_step": 363186, "epoch": 2161} {"train_loss": -12.325225830078125, "global_step": 363187, "epoch": 2161} {"train_loss": -11.456008911132812, "global_step": 363188, "epoch": 2161} {"train_loss": -12.405136108398438, "global_step": 363189, "epoch": 2161} {"train_loss": -10.851583480834961, "global_step": 363190, "epoch": 2161} {"train_loss": -11.566394805908203, "global_step": 363191, "epoch": 2161} {"train_loss": -11.6558837890625, "global_step": 363192, "epoch": 2161} {"train_loss": -11.196710586547852, "global_step": 363193, "epoch": 2161} {"train_loss": -11.559484481811523, "global_step": 363194, "epoch": 2161} {"train_loss": -10.757951736450195, "global_step": 363195, "epoch": 2161} {"train_loss": -10.638362884521484, "global_step": 363196, "epoch": 2161} {"train_loss": -10.067121505737305, "global_step": 363197, "epoch": 2161} {"train_loss": -11.575032234191895, "global_step": 363198, "epoch": 2161} {"train_loss": -10.103787422180176, "global_step": 363199, "epoch": 2161} {"train_loss": -11.150252342224121, "global_step": 363200, "epoch": 2161} {"train_loss": -11.472444534301758, "global_step": 363201, "epoch": 2161} {"train_loss": -8.748180389404297, "global_step": 363202, "epoch": 2161} {"train_loss": -9.156569480895996, "global_step": 363203, "epoch": 2161} {"train_loss": -10.422536849975586, "global_step": 363204, "epoch": 2161} {"train_loss": -10.198383331298828, "global_step": 363205, "epoch": 2161} {"train_loss": -9.789536476135254, "global_step": 363206, "epoch": 2161} {"train_loss": -9.093900680541992, "global_step": 363207, "epoch": 2161} {"train_loss": -11.086714744567871, "global_step": 363208, "epoch": 2161} {"train_loss": -9.318801879882812, "global_step": 363209, "epoch": 2161} {"train_loss": -8.986178398132324, "global_step": 363210, "epoch": 2161} {"train_loss": -9.992708206176758, "global_step": 363211, "epoch": 2161} {"train_loss": -10.556314468383789, "global_step": 363212, "epoch": 2161} {"train_loss": -9.904594421386719, "global_step": 363213, "epoch": 2161} {"train_loss": -8.996500015258789, "global_step": 363214, "epoch": 2161} {"train_loss": -11.793472448984781, "global_step": 363215, "epoch": 2161, "val_loss": 289328.03125} {"train_loss": -11.66747760772705, "global_step": 363216, "epoch": 2162} {"train_loss": -10.761975288391113, "global_step": 363217, "epoch": 2162} {"train_loss": -11.061394691467285, "global_step": 363218, "epoch": 2162} {"train_loss": -11.240001678466797, "global_step": 363219, "epoch": 2162} {"train_loss": -11.01041030883789, "global_step": 363220, "epoch": 2162} {"train_loss": -11.05964469909668, "global_step": 363221, "epoch": 2162} {"train_loss": -11.452198028564453, "global_step": 363222, "epoch": 2162} {"train_loss": -10.887683868408203, "global_step": 363223, "epoch": 2162} {"train_loss": -11.667622566223145, "global_step": 363224, "epoch": 2162} {"train_loss": -11.893889427185059, "global_step": 363225, "epoch": 2162} {"train_loss": -11.664700508117676, "global_step": 363226, "epoch": 2162} {"train_loss": -11.791603088378906, "global_step": 363227, "epoch": 2162} {"train_loss": -11.897353172302246, "global_step": 363228, "epoch": 2162} {"train_loss": -11.987112045288086, "global_step": 363229, "epoch": 2162} {"train_loss": -12.11619758605957, "global_step": 363230, "epoch": 2162} {"train_loss": -12.222434997558594, "global_step": 363231, "epoch": 2162} {"train_loss": -11.914361000061035, "global_step": 363232, "epoch": 2162} {"train_loss": -11.989938735961914, "global_step": 363233, "epoch": 2162} {"train_loss": -11.982925415039062, "global_step": 363234, "epoch": 2162} {"train_loss": -12.110007286071777, "global_step": 363235, "epoch": 2162} {"train_loss": -12.106072425842285, "global_step": 363236, "epoch": 2162} {"train_loss": -12.245399475097656, "global_step": 363237, "epoch": 2162} {"train_loss": -12.189889907836914, "global_step": 363238, "epoch": 2162} {"train_loss": -12.180477142333984, "global_step": 363239, "epoch": 2162} {"train_loss": -12.220523834228516, "global_step": 363240, "epoch": 2162} {"train_loss": -12.116954803466797, "global_step": 363241, "epoch": 2162} {"train_loss": -12.33482551574707, "global_step": 363242, "epoch": 2162} {"train_loss": -12.078861236572266, "global_step": 363243, "epoch": 2162} {"train_loss": -12.126521110534668, "global_step": 363244, "epoch": 2162} {"train_loss": -12.106199264526367, "global_step": 363245, "epoch": 2162} {"train_loss": -12.402297973632812, "global_step": 363246, "epoch": 2162} {"train_loss": -12.149441719055176, "global_step": 363247, "epoch": 2162} {"train_loss": -12.478730201721191, "global_step": 363248, "epoch": 2162} {"train_loss": -12.208415031433105, "global_step": 363249, "epoch": 2162} {"train_loss": -12.407660484313965, "global_step": 363250, "epoch": 2162} {"train_loss": -12.407768249511719, "global_step": 363251, "epoch": 2162} {"train_loss": -12.235309600830078, "global_step": 363252, "epoch": 2162} {"train_loss": -12.280176162719727, "global_step": 363253, "epoch": 2162} {"train_loss": -12.155776977539062, "global_step": 363254, "epoch": 2162} {"train_loss": -12.260736465454102, "global_step": 363255, "epoch": 2162} {"train_loss": -12.341512680053711, "global_step": 363256, "epoch": 2162} {"train_loss": -12.39281940460205, "global_step": 363257, "epoch": 2162} {"train_loss": -12.409744262695312, "global_step": 363258, "epoch": 2162} {"train_loss": -12.329623222351074, "global_step": 363259, "epoch": 2162} {"train_loss": -12.445699691772461, "global_step": 363260, "epoch": 2162} {"train_loss": -12.25871467590332, "global_step": 363261, "epoch": 2162} {"train_loss": -12.383787155151367, "global_step": 363262, "epoch": 2162} {"train_loss": -12.417232513427734, "global_step": 363263, "epoch": 2162} {"train_loss": -12.41571044921875, "global_step": 363264, "epoch": 2162} {"train_loss": -12.440886497497559, "global_step": 363265, "epoch": 2162} {"train_loss": -12.281805038452148, "global_step": 363266, "epoch": 2162} {"train_loss": -12.377805709838867, "global_step": 363267, "epoch": 2162} {"train_loss": -12.317935943603516, "global_step": 363268, "epoch": 2162} {"train_loss": -12.267860412597656, "global_step": 363269, "epoch": 2162} {"train_loss": -12.309576034545898, "global_step": 363270, "epoch": 2162} {"train_loss": -12.088035583496094, "global_step": 363271, "epoch": 2162} {"train_loss": -12.469711303710938, "global_step": 363272, "epoch": 2162} {"train_loss": -12.228682518005371, "global_step": 363273, "epoch": 2162} {"train_loss": -12.49980640411377, "global_step": 363274, "epoch": 2162} {"train_loss": -12.323966979980469, "global_step": 363275, "epoch": 2162} {"train_loss": -12.257279396057129, "global_step": 363276, "epoch": 2162} {"train_loss": -12.427999496459961, "global_step": 363277, "epoch": 2162} {"train_loss": -12.468255996704102, "global_step": 363278, "epoch": 2162} {"train_loss": -12.529976844787598, "global_step": 363279, "epoch": 2162} {"train_loss": -12.467219352722168, "global_step": 363280, "epoch": 2162} {"train_loss": -12.51521110534668, "global_step": 363281, "epoch": 2162} {"train_loss": -12.606585502624512, "global_step": 363282, "epoch": 2162} {"train_loss": -12.511930465698242, "global_step": 363283, "epoch": 2162} {"train_loss": -12.749068260192871, "global_step": 363284, "epoch": 2162} {"train_loss": -12.358939170837402, "global_step": 363285, "epoch": 2162} {"train_loss": -12.696481704711914, "global_step": 363286, "epoch": 2162} {"train_loss": -12.384647369384766, "global_step": 363287, "epoch": 2162} {"train_loss": -12.681922912597656, "global_step": 363288, "epoch": 2162} {"train_loss": -12.428937911987305, "global_step": 363289, "epoch": 2162} {"train_loss": -11.985740661621094, "global_step": 363290, "epoch": 2162} {"train_loss": -11.790669441223145, "global_step": 363291, "epoch": 2162} {"train_loss": -12.248327255249023, "global_step": 363292, "epoch": 2162} {"train_loss": -12.442930221557617, "global_step": 363293, "epoch": 2162} {"train_loss": -12.58344841003418, "global_step": 363294, "epoch": 2162} {"train_loss": -12.236005783081055, "global_step": 363295, "epoch": 2162} {"train_loss": -11.974053382873535, "global_step": 363296, "epoch": 2162} {"train_loss": -12.221820831298828, "global_step": 363297, "epoch": 2162} {"train_loss": -12.550148963928223, "global_step": 363298, "epoch": 2162} {"train_loss": -12.193685531616211, "global_step": 363299, "epoch": 2162} {"train_loss": -12.479375839233398, "global_step": 363300, "epoch": 2162} {"train_loss": -12.170652389526367, "global_step": 363301, "epoch": 2162} {"train_loss": -12.579887390136719, "global_step": 363302, "epoch": 2162} {"train_loss": -12.272810935974121, "global_step": 363303, "epoch": 2162} {"train_loss": -11.405228614807129, "global_step": 363304, "epoch": 2162} {"train_loss": -12.35696792602539, "global_step": 363305, "epoch": 2162} {"train_loss": -11.969950675964355, "global_step": 363306, "epoch": 2162} {"train_loss": -12.524975776672363, "global_step": 363307, "epoch": 2162} {"train_loss": -11.227110862731934, "global_step": 363308, "epoch": 2162} {"train_loss": -11.33342170715332, "global_step": 363309, "epoch": 2162} {"train_loss": -12.021927833557129, "global_step": 363310, "epoch": 2162} {"train_loss": -12.389466285705566, "global_step": 363311, "epoch": 2162} {"train_loss": -10.913890838623047, "global_step": 363312, "epoch": 2162} {"train_loss": -11.802740097045898, "global_step": 363313, "epoch": 2162} {"train_loss": -11.902868270874023, "global_step": 363314, "epoch": 2162} {"train_loss": -11.327521324157715, "global_step": 363315, "epoch": 2162} {"train_loss": -12.00486946105957, "global_step": 363316, "epoch": 2162} {"train_loss": -11.72883415222168, "global_step": 363317, "epoch": 2162} {"train_loss": -12.089113235473633, "global_step": 363318, "epoch": 2162} {"train_loss": -11.678346633911133, "global_step": 363319, "epoch": 2162} {"train_loss": -11.57773208618164, "global_step": 363320, "epoch": 2162} {"train_loss": -11.778943061828613, "global_step": 363321, "epoch": 2162} {"train_loss": -11.666147232055664, "global_step": 363322, "epoch": 2162} {"train_loss": -10.904546737670898, "global_step": 363323, "epoch": 2162} {"train_loss": -11.869929313659668, "global_step": 363324, "epoch": 2162} {"train_loss": -9.770975112915039, "global_step": 363325, "epoch": 2162} {"train_loss": -10.931011199951172, "global_step": 363326, "epoch": 2162} {"train_loss": -11.221921920776367, "global_step": 363327, "epoch": 2162} {"train_loss": -9.872038841247559, "global_step": 363328, "epoch": 2162} {"train_loss": -10.275002479553223, "global_step": 363329, "epoch": 2162} {"train_loss": -10.86632251739502, "global_step": 363330, "epoch": 2162} {"train_loss": -10.575395584106445, "global_step": 363331, "epoch": 2162} {"train_loss": -9.573165893554688, "global_step": 363332, "epoch": 2162} {"train_loss": -10.727030754089355, "global_step": 363333, "epoch": 2162} {"train_loss": -9.338455200195312, "global_step": 363334, "epoch": 2162} {"train_loss": -9.138948440551758, "global_step": 363335, "epoch": 2162} {"train_loss": -10.158082008361816, "global_step": 363336, "epoch": 2162} {"train_loss": -10.77845573425293, "global_step": 363337, "epoch": 2162} {"train_loss": -9.548017501831055, "global_step": 363338, "epoch": 2162} {"train_loss": -8.650656700134277, "global_step": 363339, "epoch": 2162} {"train_loss": -9.77586555480957, "global_step": 363340, "epoch": 2162} {"train_loss": -10.848926544189453, "global_step": 363341, "epoch": 2162} {"train_loss": -10.901103973388672, "global_step": 363342, "epoch": 2162} {"train_loss": -10.440406799316406, "global_step": 363343, "epoch": 2162} {"train_loss": -10.622743606567383, "global_step": 363344, "epoch": 2162} {"train_loss": -11.093293190002441, "global_step": 363345, "epoch": 2162} {"train_loss": -10.788423538208008, "global_step": 363346, "epoch": 2162} {"train_loss": -11.13680362701416, "global_step": 363347, "epoch": 2162} {"train_loss": -10.520694732666016, "global_step": 363348, "epoch": 2162} {"train_loss": -11.278764724731445, "global_step": 363349, "epoch": 2162} {"train_loss": -9.864089012145996, "global_step": 363350, "epoch": 2162} {"train_loss": -10.97164535522461, "global_step": 363351, "epoch": 2162} {"train_loss": -10.654359817504883, "global_step": 363352, "epoch": 2162} {"train_loss": -11.618764877319336, "global_step": 363353, "epoch": 2162} {"train_loss": -9.858443260192871, "global_step": 363354, "epoch": 2162} {"train_loss": -12.172015190124512, "global_step": 363355, "epoch": 2162} {"train_loss": -10.920598030090332, "global_step": 363356, "epoch": 2162} {"train_loss": -10.847182273864746, "global_step": 363357, "epoch": 2162} {"train_loss": -11.804492950439453, "global_step": 363358, "epoch": 2162} {"train_loss": -10.913604736328125, "global_step": 363359, "epoch": 2162} {"train_loss": -10.971811294555664, "global_step": 363360, "epoch": 2162} {"train_loss": -11.078063011169434, "global_step": 363361, "epoch": 2162} {"train_loss": -10.545771598815918, "global_step": 363362, "epoch": 2162} {"train_loss": -11.37198543548584, "global_step": 363363, "epoch": 2162} {"train_loss": -11.407587051391602, "global_step": 363364, "epoch": 2162} {"train_loss": -11.381772994995117, "global_step": 363365, "epoch": 2162} {"train_loss": -11.768559455871582, "global_step": 363366, "epoch": 2162} {"train_loss": -11.400649070739746, "global_step": 363367, "epoch": 2162} {"train_loss": -11.16072940826416, "global_step": 363368, "epoch": 2162} {"train_loss": -11.68270206451416, "global_step": 363369, "epoch": 2162} {"train_loss": -11.15641975402832, "global_step": 363370, "epoch": 2162} {"train_loss": -11.322139739990234, "global_step": 363371, "epoch": 2162} {"train_loss": -11.495476722717285, "global_step": 363372, "epoch": 2162} {"train_loss": -11.3503999710083, "global_step": 363373, "epoch": 2162} {"train_loss": -12.009235382080078, "global_step": 363374, "epoch": 2162} {"train_loss": -11.770578384399414, "global_step": 363375, "epoch": 2162} {"train_loss": -11.763595581054688, "global_step": 363376, "epoch": 2162} {"train_loss": -11.459088325500488, "global_step": 363377, "epoch": 2162} {"train_loss": -11.83956241607666, "global_step": 363378, "epoch": 2162} {"train_loss": -11.849302291870117, "global_step": 363379, "epoch": 2162} {"train_loss": -11.975749969482422, "global_step": 363380, "epoch": 2162} {"train_loss": -11.618690490722656, "global_step": 363381, "epoch": 2162} {"train_loss": -12.274139404296875, "global_step": 363382, "epoch": 2162} {"train_loss": -11.682350493612743, "global_step": 363383, "epoch": 2162, "val_loss": 287017.4375} {"train_loss": -11.843591690063477, "global_step": 363384, "epoch": 2163} {"train_loss": -12.083702087402344, "global_step": 363385, "epoch": 2163} {"train_loss": -11.999155044555664, "global_step": 363386, "epoch": 2163} {"train_loss": -12.086533546447754, "global_step": 363387, "epoch": 2163} {"train_loss": -12.059652328491211, "global_step": 363388, "epoch": 2163} {"train_loss": -11.923443794250488, "global_step": 363389, "epoch": 2163} {"train_loss": -12.109710693359375, "global_step": 363390, "epoch": 2163} {"train_loss": -12.075603485107422, "global_step": 363391, "epoch": 2163} {"train_loss": -12.192883491516113, "global_step": 363392, "epoch": 2163} {"train_loss": -11.832204818725586, "global_step": 363393, "epoch": 2163} {"train_loss": -12.210229873657227, "global_step": 363394, "epoch": 2163} {"train_loss": -12.185672760009766, "global_step": 363395, "epoch": 2163} {"train_loss": -12.051899909973145, "global_step": 363396, "epoch": 2163} {"train_loss": -12.181404113769531, "global_step": 363397, "epoch": 2163} {"train_loss": -12.216581344604492, "global_step": 363398, "epoch": 2163} {"train_loss": -12.254393577575684, "global_step": 363399, "epoch": 2163} {"train_loss": -12.12575912475586, "global_step": 363400, "epoch": 2163} {"train_loss": -12.045198440551758, "global_step": 363401, "epoch": 2163} {"train_loss": -12.03349781036377, "global_step": 363402, "epoch": 2163} {"train_loss": -12.25387191772461, "global_step": 363403, "epoch": 2163} {"train_loss": -12.30557632446289, "global_step": 363404, "epoch": 2163} {"train_loss": -12.33005142211914, "global_step": 363405, "epoch": 2163} {"train_loss": -12.228267669677734, "global_step": 363406, "epoch": 2163} {"train_loss": -12.133065223693848, "global_step": 363407, "epoch": 2163} {"train_loss": -12.439400672912598, "global_step": 363408, "epoch": 2163} {"train_loss": -12.057337760925293, "global_step": 363409, "epoch": 2163} {"train_loss": -12.466007232666016, "global_step": 363410, "epoch": 2163} {"train_loss": -12.270742416381836, "global_step": 363411, "epoch": 2163} {"train_loss": -12.379512786865234, "global_step": 363412, "epoch": 2163} {"train_loss": -12.379903793334961, "global_step": 363413, "epoch": 2163} {"train_loss": -12.277032852172852, "global_step": 363414, "epoch": 2163} {"train_loss": -12.459665298461914, "global_step": 363415, "epoch": 2163} {"train_loss": -12.267601013183594, "global_step": 363416, "epoch": 2163} {"train_loss": -12.415712356567383, "global_step": 363417, "epoch": 2163} {"train_loss": -12.327428817749023, "global_step": 363418, "epoch": 2163} {"train_loss": -12.221792221069336, "global_step": 363419, "epoch": 2163} {"train_loss": -12.352434158325195, "global_step": 363420, "epoch": 2163} {"train_loss": -12.28001594543457, "global_step": 363421, "epoch": 2163} {"train_loss": -12.311999320983887, "global_step": 363422, "epoch": 2163} {"train_loss": -12.444110870361328, "global_step": 363423, "epoch": 2163} {"train_loss": -12.2718505859375, "global_step": 363424, "epoch": 2163} {"train_loss": -12.515655517578125, "global_step": 363425, "epoch": 2163} {"train_loss": -12.468109130859375, "global_step": 363426, "epoch": 2163} {"train_loss": -12.455554962158203, "global_step": 363427, "epoch": 2163} {"train_loss": -12.511877059936523, "global_step": 363428, "epoch": 2163} {"train_loss": -12.608475685119629, "global_step": 363429, "epoch": 2163} {"train_loss": -12.579720497131348, "global_step": 363430, "epoch": 2163} {"train_loss": -12.417569160461426, "global_step": 363431, "epoch": 2163} {"train_loss": -12.685773849487305, "global_step": 363432, "epoch": 2163} {"train_loss": -12.60355281829834, "global_step": 363433, "epoch": 2163} {"train_loss": -12.419584274291992, "global_step": 363434, "epoch": 2163} {"train_loss": -12.609762191772461, "global_step": 363435, "epoch": 2163} {"train_loss": -12.479074478149414, "global_step": 363436, "epoch": 2163} {"train_loss": -12.677921295166016, "global_step": 363437, "epoch": 2163} {"train_loss": -12.566180229187012, "global_step": 363438, "epoch": 2163} {"train_loss": -12.611741065979004, "global_step": 363439, "epoch": 2163} {"train_loss": -12.640765190124512, "global_step": 363440, "epoch": 2163} {"train_loss": -12.602067947387695, "global_step": 363441, "epoch": 2163} {"train_loss": -12.576412200927734, "global_step": 363442, "epoch": 2163} {"train_loss": -12.372451782226562, "global_step": 363443, "epoch": 2163} {"train_loss": -12.592344284057617, "global_step": 363444, "epoch": 2163} {"train_loss": -12.616657257080078, "global_step": 363445, "epoch": 2163} {"train_loss": -12.535161972045898, "global_step": 363446, "epoch": 2163} {"train_loss": -12.364002227783203, "global_step": 363447, "epoch": 2163} {"train_loss": -12.835212707519531, "global_step": 363448, "epoch": 2163} {"train_loss": -12.20549201965332, "global_step": 363449, "epoch": 2163} {"train_loss": -12.400115013122559, "global_step": 363450, "epoch": 2163} {"train_loss": -12.685344696044922, "global_step": 363451, "epoch": 2163} {"train_loss": -12.376708030700684, "global_step": 363452, "epoch": 2163} {"train_loss": -12.514436721801758, "global_step": 363453, "epoch": 2163} {"train_loss": -12.326669692993164, "global_step": 363454, "epoch": 2163} {"train_loss": -12.296659469604492, "global_step": 363455, "epoch": 2163} {"train_loss": -12.58645248413086, "global_step": 363456, "epoch": 2163} {"train_loss": -12.316644668579102, "global_step": 363457, "epoch": 2163} {"train_loss": -11.50490951538086, "global_step": 363458, "epoch": 2163} {"train_loss": -11.207448959350586, "global_step": 363459, "epoch": 2163} {"train_loss": -11.757308006286621, "global_step": 363460, "epoch": 2163} {"train_loss": -12.618162155151367, "global_step": 363461, "epoch": 2163} {"train_loss": -11.06608772277832, "global_step": 363462, "epoch": 2163} {"train_loss": -10.583768844604492, "global_step": 363463, "epoch": 2163} {"train_loss": -11.068700790405273, "global_step": 363464, "epoch": 2163} {"train_loss": -11.524227142333984, "global_step": 363465, "epoch": 2163} {"train_loss": -10.732992172241211, "global_step": 363466, "epoch": 2163} {"train_loss": -12.45298957824707, "global_step": 363467, "epoch": 2163} {"train_loss": -10.342899322509766, "global_step": 363468, "epoch": 2163} {"train_loss": -11.532506942749023, "global_step": 363469, "epoch": 2163} {"train_loss": -11.298608779907227, "global_step": 363470, "epoch": 2163} {"train_loss": -8.68896484375, "global_step": 363471, "epoch": 2163} {"train_loss": -10.541912078857422, "global_step": 363472, "epoch": 2163} {"train_loss": -8.494975090026855, "global_step": 363473, "epoch": 2163} {"train_loss": -9.831673622131348, "global_step": 363474, "epoch": 2163} {"train_loss": -8.48450756072998, "global_step": 363475, "epoch": 2163} {"train_loss": -9.997611045837402, "global_step": 363476, "epoch": 2163} {"train_loss": -9.833988189697266, "global_step": 363477, "epoch": 2163} {"train_loss": -10.578592300415039, "global_step": 363478, "epoch": 2163} {"train_loss": -10.196305274963379, "global_step": 363479, "epoch": 2163} {"train_loss": -8.943914413452148, "global_step": 363480, "epoch": 2163} {"train_loss": -9.269876480102539, "global_step": 363481, "epoch": 2163} {"train_loss": -9.96371841430664, "global_step": 363482, "epoch": 2163} {"train_loss": -9.606231689453125, "global_step": 363483, "epoch": 2163} {"train_loss": -9.849557876586914, "global_step": 363484, "epoch": 2163} {"train_loss": -10.764314651489258, "global_step": 363485, "epoch": 2163} {"train_loss": -10.735981941223145, "global_step": 363486, "epoch": 2163} {"train_loss": -9.961753845214844, "global_step": 363487, "epoch": 2163} {"train_loss": -11.208505630493164, "global_step": 363488, "epoch": 2163} {"train_loss": -11.194063186645508, "global_step": 363489, "epoch": 2163} {"train_loss": -11.638643264770508, "global_step": 363490, "epoch": 2163} {"train_loss": -11.863373756408691, "global_step": 363491, "epoch": 2163} {"train_loss": -11.258172988891602, "global_step": 363492, "epoch": 2163} {"train_loss": -11.947898864746094, "global_step": 363493, "epoch": 2163} {"train_loss": -11.721177101135254, "global_step": 363494, "epoch": 2163} {"train_loss": -11.971014976501465, "global_step": 363495, "epoch": 2163} {"train_loss": -11.767461776733398, "global_step": 363496, "epoch": 2163} {"train_loss": -12.284420013427734, "global_step": 363497, "epoch": 2163} {"train_loss": -11.631232261657715, "global_step": 363498, "epoch": 2163} {"train_loss": -11.863170623779297, "global_step": 363499, "epoch": 2163} {"train_loss": -11.832664489746094, "global_step": 363500, "epoch": 2163} {"train_loss": -11.99288558959961, "global_step": 363501, "epoch": 2163} {"train_loss": -11.859313011169434, "global_step": 363502, "epoch": 2163} {"train_loss": -12.158425331115723, "global_step": 363503, "epoch": 2163} {"train_loss": -11.86205005645752, "global_step": 363504, "epoch": 2163} {"train_loss": -12.220027923583984, "global_step": 363505, "epoch": 2163} {"train_loss": -11.988547325134277, "global_step": 363506, "epoch": 2163} {"train_loss": -11.98012924194336, "global_step": 363507, "epoch": 2163} {"train_loss": -12.207798957824707, "global_step": 363508, "epoch": 2163} {"train_loss": -12.037471771240234, "global_step": 363509, "epoch": 2163} {"train_loss": -12.042725563049316, "global_step": 363510, "epoch": 2163} {"train_loss": -12.21127700805664, "global_step": 363511, "epoch": 2163} {"train_loss": -12.21883487701416, "global_step": 363512, "epoch": 2163} {"train_loss": -12.35460090637207, "global_step": 363513, "epoch": 2163} {"train_loss": -12.111164093017578, "global_step": 363514, "epoch": 2163} {"train_loss": -12.309514045715332, "global_step": 363515, "epoch": 2163} {"train_loss": -12.03187370300293, "global_step": 363516, "epoch": 2163} {"train_loss": -12.209671974182129, "global_step": 363517, "epoch": 2163} {"train_loss": -12.567422866821289, "global_step": 363518, "epoch": 2163} {"train_loss": -12.236637115478516, "global_step": 363519, "epoch": 2163} {"train_loss": -12.300155639648438, "global_step": 363520, "epoch": 2163} {"train_loss": -12.305633544921875, "global_step": 363521, "epoch": 2163} {"train_loss": -12.204959869384766, "global_step": 363522, "epoch": 2163} {"train_loss": -12.26812744140625, "global_step": 363523, "epoch": 2163} {"train_loss": -12.365133285522461, "global_step": 363524, "epoch": 2163} {"train_loss": -12.319985389709473, "global_step": 363525, "epoch": 2163} {"train_loss": -12.380327224731445, "global_step": 363526, "epoch": 2163} {"train_loss": -12.44139289855957, "global_step": 363527, "epoch": 2163} {"train_loss": -12.418113708496094, "global_step": 363528, "epoch": 2163} {"train_loss": -12.431928634643555, "global_step": 363529, "epoch": 2163} {"train_loss": -12.58043098449707, "global_step": 363530, "epoch": 2163} {"train_loss": -12.232002258300781, "global_step": 363531, "epoch": 2163} {"train_loss": -12.566190719604492, "global_step": 363532, "epoch": 2163} {"train_loss": -12.67619514465332, "global_step": 363533, "epoch": 2163} {"train_loss": -12.217638969421387, "global_step": 363534, "epoch": 2163} {"train_loss": -12.527616500854492, "global_step": 363535, "epoch": 2163} {"train_loss": -12.527464866638184, "global_step": 363536, "epoch": 2163} {"train_loss": -12.412981986999512, "global_step": 363537, "epoch": 2163} {"train_loss": -12.335306167602539, "global_step": 363538, "epoch": 2163} {"train_loss": -12.357805252075195, "global_step": 363539, "epoch": 2163} {"train_loss": -12.385087966918945, "global_step": 363540, "epoch": 2163} {"train_loss": -12.419567108154297, "global_step": 363541, "epoch": 2163} {"train_loss": -12.530750274658203, "global_step": 363542, "epoch": 2163} {"train_loss": -12.258390426635742, "global_step": 363543, "epoch": 2163} {"train_loss": -12.363503456115723, "global_step": 363544, "epoch": 2163} {"train_loss": -12.539382934570312, "global_step": 363545, "epoch": 2163} {"train_loss": -12.267305374145508, "global_step": 363546, "epoch": 2163} {"train_loss": -12.046930313110352, "global_step": 363547, "epoch": 2163} {"train_loss": -12.647144317626953, "global_step": 363548, "epoch": 2163} {"train_loss": -12.269349098205566, "global_step": 363549, "epoch": 2163} {"train_loss": -12.12298583984375, "global_step": 363550, "epoch": 2163} {"train_loss": -11.938903274990263, "global_step": 363551, "epoch": 2163, "val_loss": 291478.28125} {"train_loss": -12.511868476867676, "global_step": 363552, "epoch": 2164} {"train_loss": -11.76657485961914, "global_step": 363553, "epoch": 2164} {"train_loss": -12.388416290283203, "global_step": 363554, "epoch": 2164} {"train_loss": -12.57248306274414, "global_step": 363555, "epoch": 2164} {"train_loss": -11.844208717346191, "global_step": 363556, "epoch": 2164} {"train_loss": -11.588031768798828, "global_step": 363557, "epoch": 2164} {"train_loss": -12.27334213256836, "global_step": 363558, "epoch": 2164} {"train_loss": -12.438072204589844, "global_step": 363559, "epoch": 2164} {"train_loss": -12.068968772888184, "global_step": 363560, "epoch": 2164} {"train_loss": -11.888467788696289, "global_step": 363561, "epoch": 2164} {"train_loss": -12.391209602355957, "global_step": 363562, "epoch": 2164} {"train_loss": -12.214573860168457, "global_step": 363563, "epoch": 2164} {"train_loss": -11.993587493896484, "global_step": 363564, "epoch": 2164} {"train_loss": -12.336206436157227, "global_step": 363565, "epoch": 2164} {"train_loss": -12.768482208251953, "global_step": 363566, "epoch": 2164} {"train_loss": -12.21638011932373, "global_step": 363567, "epoch": 2164} {"train_loss": -11.70704460144043, "global_step": 363568, "epoch": 2164} {"train_loss": -12.395761489868164, "global_step": 363569, "epoch": 2164} {"train_loss": -12.5617036819458, "global_step": 363570, "epoch": 2164} {"train_loss": -12.088798522949219, "global_step": 363571, "epoch": 2164} {"train_loss": -11.982609748840332, "global_step": 363572, "epoch": 2164} {"train_loss": -12.21811294555664, "global_step": 363573, "epoch": 2164} {"train_loss": -12.26838207244873, "global_step": 363574, "epoch": 2164} {"train_loss": -12.191057205200195, "global_step": 363575, "epoch": 2164} {"train_loss": -12.376240730285645, "global_step": 363576, "epoch": 2164} {"train_loss": -12.132139205932617, "global_step": 363577, "epoch": 2164} {"train_loss": -12.40023422241211, "global_step": 363578, "epoch": 2164} {"train_loss": -12.3709716796875, "global_step": 363579, "epoch": 2164} {"train_loss": -12.467277526855469, "global_step": 363580, "epoch": 2164} {"train_loss": -12.693723678588867, "global_step": 363581, "epoch": 2164} {"train_loss": -12.545770645141602, "global_step": 363582, "epoch": 2164} {"train_loss": -11.984407424926758, "global_step": 363583, "epoch": 2164} {"train_loss": -12.154237747192383, "global_step": 363584, "epoch": 2164} {"train_loss": -12.547826766967773, "global_step": 363585, "epoch": 2164} {"train_loss": -12.504606246948242, "global_step": 363586, "epoch": 2164} {"train_loss": -12.161128044128418, "global_step": 363587, "epoch": 2164} {"train_loss": -12.364564895629883, "global_step": 363588, "epoch": 2164} {"train_loss": -12.387096405029297, "global_step": 363589, "epoch": 2164} {"train_loss": -12.301183700561523, "global_step": 363590, "epoch": 2164} {"train_loss": -12.252796173095703, "global_step": 363591, "epoch": 2164} {"train_loss": -12.627242088317871, "global_step": 363592, "epoch": 2164} {"train_loss": -12.255894660949707, "global_step": 363593, "epoch": 2164} {"train_loss": -12.598630905151367, "global_step": 363594, "epoch": 2164} {"train_loss": -12.030062675476074, "global_step": 363595, "epoch": 2164} {"train_loss": -12.290670394897461, "global_step": 363596, "epoch": 2164} {"train_loss": -12.489974975585938, "global_step": 363597, "epoch": 2164} {"train_loss": -12.155959129333496, "global_step": 363598, "epoch": 2164} {"train_loss": -12.097387313842773, "global_step": 363599, "epoch": 2164} {"train_loss": -12.553892135620117, "global_step": 363600, "epoch": 2164} {"train_loss": -11.982523918151855, "global_step": 363601, "epoch": 2164} {"train_loss": -11.945722579956055, "global_step": 363602, "epoch": 2164} {"train_loss": -12.114167213439941, "global_step": 363603, "epoch": 2164} {"train_loss": -12.780244827270508, "global_step": 363604, "epoch": 2164} {"train_loss": -11.539690017700195, "global_step": 363605, "epoch": 2164} {"train_loss": -11.6197509765625, "global_step": 363606, "epoch": 2164} {"train_loss": -12.572758674621582, "global_step": 363607, "epoch": 2164} {"train_loss": -12.18039321899414, "global_step": 363608, "epoch": 2164} {"train_loss": -11.302020072937012, "global_step": 363609, "epoch": 2164} {"train_loss": -12.2077054977417, "global_step": 363610, "epoch": 2164} {"train_loss": -12.728570938110352, "global_step": 363611, "epoch": 2164} {"train_loss": -12.16991138458252, "global_step": 363612, "epoch": 2164} {"train_loss": -11.757818222045898, "global_step": 363613, "epoch": 2164} {"train_loss": -12.595661163330078, "global_step": 363614, "epoch": 2164} {"train_loss": -12.395208358764648, "global_step": 363615, "epoch": 2164} {"train_loss": -12.001057624816895, "global_step": 363616, "epoch": 2164} {"train_loss": -12.463794708251953, "global_step": 363617, "epoch": 2164} {"train_loss": -12.39862060546875, "global_step": 363618, "epoch": 2164} {"train_loss": -11.946554183959961, "global_step": 363619, "epoch": 2164} {"train_loss": -11.97081184387207, "global_step": 363620, "epoch": 2164} {"train_loss": -12.405399322509766, "global_step": 363621, "epoch": 2164} {"train_loss": -11.271910667419434, "global_step": 363622, "epoch": 2164} {"train_loss": -11.542551040649414, "global_step": 363623, "epoch": 2164} {"train_loss": -12.237957954406738, "global_step": 363624, "epoch": 2164} {"train_loss": -11.705889701843262, "global_step": 363625, "epoch": 2164} {"train_loss": -11.99077033996582, "global_step": 363626, "epoch": 2164} {"train_loss": -11.677536010742188, "global_step": 363627, "epoch": 2164} {"train_loss": -10.664608001708984, "global_step": 363628, "epoch": 2164} {"train_loss": -11.946479797363281, "global_step": 363629, "epoch": 2164} {"train_loss": -12.305989265441895, "global_step": 363630, "epoch": 2164} {"train_loss": -10.947585105895996, "global_step": 363631, "epoch": 2164} {"train_loss": -11.635688781738281, "global_step": 363632, "epoch": 2164} {"train_loss": -11.960493087768555, "global_step": 363633, "epoch": 2164} {"train_loss": -11.868707656860352, "global_step": 363634, "epoch": 2164} {"train_loss": -11.261979103088379, "global_step": 363635, "epoch": 2164} {"train_loss": -11.913780212402344, "global_step": 363636, "epoch": 2164} {"train_loss": -12.116055488586426, "global_step": 363637, "epoch": 2164} {"train_loss": -12.166942596435547, "global_step": 363638, "epoch": 2164} {"train_loss": -11.796436309814453, "global_step": 363639, "epoch": 2164} {"train_loss": -12.431034088134766, "global_step": 363640, "epoch": 2164} {"train_loss": -11.806058883666992, "global_step": 363641, "epoch": 2164} {"train_loss": -12.26758861541748, "global_step": 363642, "epoch": 2164} {"train_loss": -12.20469856262207, "global_step": 363643, "epoch": 2164} {"train_loss": -12.534021377563477, "global_step": 363644, "epoch": 2164} {"train_loss": -11.928369522094727, "global_step": 363645, "epoch": 2164} {"train_loss": -12.388280868530273, "global_step": 363646, "epoch": 2164} {"train_loss": -12.114324569702148, "global_step": 363647, "epoch": 2164} {"train_loss": -12.110727310180664, "global_step": 363648, "epoch": 2164} {"train_loss": -12.17611312866211, "global_step": 363649, "epoch": 2164} {"train_loss": -12.023077011108398, "global_step": 363650, "epoch": 2164} {"train_loss": -12.178176879882812, "global_step": 363651, "epoch": 2164} {"train_loss": -11.764060974121094, "global_step": 363652, "epoch": 2164} {"train_loss": -12.12364387512207, "global_step": 363653, "epoch": 2164} {"train_loss": -12.06279182434082, "global_step": 363654, "epoch": 2164} {"train_loss": -12.452866554260254, "global_step": 363655, "epoch": 2164} {"train_loss": -12.138816833496094, "global_step": 363656, "epoch": 2164} {"train_loss": -12.13917350769043, "global_step": 363657, "epoch": 2164} {"train_loss": -11.702840805053711, "global_step": 363658, "epoch": 2164} {"train_loss": -11.9939603805542, "global_step": 363659, "epoch": 2164} {"train_loss": -11.946317672729492, "global_step": 363660, "epoch": 2164} {"train_loss": -12.102997779846191, "global_step": 363661, "epoch": 2164} {"train_loss": -12.044848442077637, "global_step": 363662, "epoch": 2164} {"train_loss": -12.132455825805664, "global_step": 363663, "epoch": 2164} {"train_loss": -12.274621963500977, "global_step": 363664, "epoch": 2164} {"train_loss": -11.816781997680664, "global_step": 363665, "epoch": 2164} {"train_loss": -12.278633117675781, "global_step": 363666, "epoch": 2164} {"train_loss": -12.01716136932373, "global_step": 363667, "epoch": 2164} {"train_loss": -12.288978576660156, "global_step": 363668, "epoch": 2164} {"train_loss": -11.689849853515625, "global_step": 363669, "epoch": 2164} {"train_loss": -12.05124282836914, "global_step": 363670, "epoch": 2164} {"train_loss": -11.79310417175293, "global_step": 363671, "epoch": 2164} {"train_loss": -12.15496826171875, "global_step": 363672, "epoch": 2164} {"train_loss": -11.499077796936035, "global_step": 363673, "epoch": 2164} {"train_loss": -11.928567886352539, "global_step": 363674, "epoch": 2164} {"train_loss": -11.889761924743652, "global_step": 363675, "epoch": 2164} {"train_loss": -11.799564361572266, "global_step": 363676, "epoch": 2164} {"train_loss": -11.224977493286133, "global_step": 363677, "epoch": 2164} {"train_loss": -11.520450592041016, "global_step": 363678, "epoch": 2164} {"train_loss": -11.879531860351562, "global_step": 363679, "epoch": 2164} {"train_loss": -11.861787796020508, "global_step": 363680, "epoch": 2164} {"train_loss": -11.849796295166016, "global_step": 363681, "epoch": 2164} {"train_loss": -11.903557777404785, "global_step": 363682, "epoch": 2164} {"train_loss": -12.019426345825195, "global_step": 363683, "epoch": 2164} {"train_loss": -12.002082824707031, "global_step": 363684, "epoch": 2164} {"train_loss": -11.82028579711914, "global_step": 363685, "epoch": 2164} {"train_loss": -11.90853500366211, "global_step": 363686, "epoch": 2164} {"train_loss": -11.990121841430664, "global_step": 363687, "epoch": 2164} {"train_loss": -11.474335670471191, "global_step": 363688, "epoch": 2164} {"train_loss": -11.836258888244629, "global_step": 363689, "epoch": 2164} {"train_loss": -11.955509185791016, "global_step": 363690, "epoch": 2164} {"train_loss": -10.870243072509766, "global_step": 363691, "epoch": 2164} {"train_loss": -12.18462085723877, "global_step": 363692, "epoch": 2164} {"train_loss": -11.999361991882324, "global_step": 363693, "epoch": 2164} {"train_loss": -11.278676986694336, "global_step": 363694, "epoch": 2164} {"train_loss": -11.795540809631348, "global_step": 363695, "epoch": 2164} {"train_loss": -11.536243438720703, "global_step": 363696, "epoch": 2164} {"train_loss": -11.331672668457031, "global_step": 363697, "epoch": 2164} {"train_loss": -11.484209060668945, "global_step": 363698, "epoch": 2164} {"train_loss": -11.289414405822754, "global_step": 363699, "epoch": 2164} {"train_loss": -11.935700416564941, "global_step": 363700, "epoch": 2164} {"train_loss": -11.59376049041748, "global_step": 363701, "epoch": 2164} {"train_loss": -11.865039825439453, "global_step": 363702, "epoch": 2164} {"train_loss": -11.926024436950684, "global_step": 363703, "epoch": 2164} {"train_loss": -11.589781761169434, "global_step": 363704, "epoch": 2164} {"train_loss": -12.095663070678711, "global_step": 363705, "epoch": 2164} {"train_loss": -11.104503631591797, "global_step": 363706, "epoch": 2164} {"train_loss": -11.688285827636719, "global_step": 363707, "epoch": 2164} {"train_loss": -11.758686065673828, "global_step": 363708, "epoch": 2164} {"train_loss": -11.1864013671875, "global_step": 363709, "epoch": 2164} {"train_loss": -12.16907787322998, "global_step": 363710, "epoch": 2164} {"train_loss": -11.180785179138184, "global_step": 363711, "epoch": 2164} {"train_loss": -11.356425285339355, "global_step": 363712, "epoch": 2164} {"train_loss": -11.972940444946289, "global_step": 363713, "epoch": 2164} {"train_loss": -11.508342742919922, "global_step": 363714, "epoch": 2164} {"train_loss": -12.08647346496582, "global_step": 363715, "epoch": 2164} {"train_loss": -11.56445026397705, "global_step": 363716, "epoch": 2164} {"train_loss": -11.599994659423828, "global_step": 363717, "epoch": 2164} {"train_loss": -11.566802024841309, "global_step": 363718, "epoch": 2164} {"train_loss": -11.999955881209601, "global_step": 363719, "epoch": 2164, "val_loss": 292435.34375} {"train_loss": -11.736753463745117, "global_step": 363720, "epoch": 2165} {"train_loss": -11.750545501708984, "global_step": 363721, "epoch": 2165} {"train_loss": -12.253250122070312, "global_step": 363722, "epoch": 2165} {"train_loss": -11.765056610107422, "global_step": 363723, "epoch": 2165} {"train_loss": -11.817800521850586, "global_step": 363724, "epoch": 2165} {"train_loss": -11.94797134399414, "global_step": 363725, "epoch": 2165} {"train_loss": -12.104140281677246, "global_step": 363726, "epoch": 2165} {"train_loss": -12.342409133911133, "global_step": 363727, "epoch": 2165} {"train_loss": -11.849488258361816, "global_step": 363728, "epoch": 2165} {"train_loss": -12.27792739868164, "global_step": 363729, "epoch": 2165} {"train_loss": -11.745152473449707, "global_step": 363730, "epoch": 2165} {"train_loss": -11.973119735717773, "global_step": 363731, "epoch": 2165} {"train_loss": -12.065814971923828, "global_step": 363732, "epoch": 2165} {"train_loss": -11.337116241455078, "global_step": 363733, "epoch": 2165} {"train_loss": -12.04401969909668, "global_step": 363734, "epoch": 2165} {"train_loss": -11.948925971984863, "global_step": 363735, "epoch": 2165} {"train_loss": -11.994974136352539, "global_step": 363736, "epoch": 2165} {"train_loss": -12.370914459228516, "global_step": 363737, "epoch": 2165} {"train_loss": -11.957679748535156, "global_step": 363738, "epoch": 2165} {"train_loss": -12.259326934814453, "global_step": 363739, "epoch": 2165} {"train_loss": -12.47767448425293, "global_step": 363740, "epoch": 2165} {"train_loss": -12.134735107421875, "global_step": 363741, "epoch": 2165} {"train_loss": -12.462040901184082, "global_step": 363742, "epoch": 2165} {"train_loss": -12.286178588867188, "global_step": 363743, "epoch": 2165} {"train_loss": -12.397560119628906, "global_step": 363744, "epoch": 2165} {"train_loss": -12.120155334472656, "global_step": 363745, "epoch": 2165} {"train_loss": -12.45846176147461, "global_step": 363746, "epoch": 2165} {"train_loss": -12.490856170654297, "global_step": 363747, "epoch": 2165} {"train_loss": -12.19136905670166, "global_step": 363748, "epoch": 2165} {"train_loss": -12.570306777954102, "global_step": 363749, "epoch": 2165} {"train_loss": -12.342397689819336, "global_step": 363750, "epoch": 2165} {"train_loss": -12.47821044921875, "global_step": 363751, "epoch": 2165} {"train_loss": -12.585044860839844, "global_step": 363752, "epoch": 2165} {"train_loss": -12.441768646240234, "global_step": 363753, "epoch": 2165} {"train_loss": -12.581235885620117, "global_step": 363754, "epoch": 2165} {"train_loss": -12.41459846496582, "global_step": 363755, "epoch": 2165} {"train_loss": -12.594582557678223, "global_step": 363756, "epoch": 2165} {"train_loss": -12.241594314575195, "global_step": 363757, "epoch": 2165} {"train_loss": -12.5068359375, "global_step": 363758, "epoch": 2165} {"train_loss": -12.437427520751953, "global_step": 363759, "epoch": 2165} {"train_loss": -12.584447860717773, "global_step": 363760, "epoch": 2165} {"train_loss": -12.758087158203125, "global_step": 363761, "epoch": 2165} {"train_loss": -12.49293041229248, "global_step": 363762, "epoch": 2165} {"train_loss": -12.587246894836426, "global_step": 363763, "epoch": 2165} {"train_loss": -12.700065612792969, "global_step": 363764, "epoch": 2165} {"train_loss": -12.750691413879395, "global_step": 363765, "epoch": 2165} {"train_loss": -12.702411651611328, "global_step": 363766, "epoch": 2165} {"train_loss": -12.500382423400879, "global_step": 363767, "epoch": 2165} {"train_loss": -12.55841064453125, "global_step": 363768, "epoch": 2165} {"train_loss": -12.684664726257324, "global_step": 363769, "epoch": 2165} {"train_loss": -12.687443733215332, "global_step": 363770, "epoch": 2165} {"train_loss": -12.703783988952637, "global_step": 363771, "epoch": 2165} {"train_loss": -12.488594055175781, "global_step": 363772, "epoch": 2165} {"train_loss": -12.605232238769531, "global_step": 363773, "epoch": 2165} {"train_loss": -12.812442779541016, "global_step": 363774, "epoch": 2165} {"train_loss": -12.56048583984375, "global_step": 363775, "epoch": 2165} {"train_loss": -12.658404350280762, "global_step": 363776, "epoch": 2165} {"train_loss": -12.735172271728516, "global_step": 363777, "epoch": 2165} {"train_loss": -12.534038543701172, "global_step": 363778, "epoch": 2165} {"train_loss": -12.235983848571777, "global_step": 363779, "epoch": 2165} {"train_loss": -12.545732498168945, "global_step": 363780, "epoch": 2165} {"train_loss": -12.099845886230469, "global_step": 363781, "epoch": 2165} {"train_loss": -12.273998260498047, "global_step": 363782, "epoch": 2165} {"train_loss": -12.008377075195312, "global_step": 363783, "epoch": 2165} {"train_loss": -9.653274536132812, "global_step": 363784, "epoch": 2165} {"train_loss": -12.194011688232422, "global_step": 363785, "epoch": 2165} {"train_loss": -11.876970291137695, "global_step": 363786, "epoch": 2165} {"train_loss": -9.395391464233398, "global_step": 363787, "epoch": 2165} {"train_loss": -10.817869186401367, "global_step": 363788, "epoch": 2165} {"train_loss": -9.708763122558594, "global_step": 363789, "epoch": 2165} {"train_loss": -9.36775016784668, "global_step": 363790, "epoch": 2165} {"train_loss": -7.978426456451416, "global_step": 363791, "epoch": 2165} {"train_loss": -9.344808578491211, "global_step": 363792, "epoch": 2165} {"train_loss": -10.728536605834961, "global_step": 363793, "epoch": 2165} {"train_loss": -10.053945541381836, "global_step": 363794, "epoch": 2165} {"train_loss": -10.056480407714844, "global_step": 363795, "epoch": 2165} {"train_loss": -9.206358909606934, "global_step": 363796, "epoch": 2165} {"train_loss": -9.115650177001953, "global_step": 363797, "epoch": 2165} {"train_loss": -8.816469192504883, "global_step": 363798, "epoch": 2165} {"train_loss": -9.641607284545898, "global_step": 363799, "epoch": 2165} {"train_loss": -9.575469970703125, "global_step": 363800, "epoch": 2165} {"train_loss": -8.679159164428711, "global_step": 363801, "epoch": 2165} {"train_loss": -8.873176574707031, "global_step": 363802, "epoch": 2165} {"train_loss": -10.132926940917969, "global_step": 363803, "epoch": 2165} {"train_loss": -10.715583801269531, "global_step": 363804, "epoch": 2165} {"train_loss": -11.059440612792969, "global_step": 363805, "epoch": 2165} {"train_loss": -10.357489585876465, "global_step": 363806, "epoch": 2165} {"train_loss": -11.021282196044922, "global_step": 363807, "epoch": 2165} {"train_loss": -10.550687789916992, "global_step": 363808, "epoch": 2165} {"train_loss": -11.13875961303711, "global_step": 363809, "epoch": 2165} {"train_loss": -10.659163475036621, "global_step": 363810, "epoch": 2165} {"train_loss": -10.9597806930542, "global_step": 363811, "epoch": 2165} {"train_loss": -10.969979286193848, "global_step": 363812, "epoch": 2165} {"train_loss": -10.66070556640625, "global_step": 363813, "epoch": 2165} {"train_loss": -10.861329078674316, "global_step": 363814, "epoch": 2165} {"train_loss": -10.342734336853027, "global_step": 363815, "epoch": 2165} {"train_loss": -11.3134765625, "global_step": 363816, "epoch": 2165} {"train_loss": -10.007458686828613, "global_step": 363817, "epoch": 2165} {"train_loss": -10.898492813110352, "global_step": 363818, "epoch": 2165} {"train_loss": -11.383184432983398, "global_step": 363819, "epoch": 2165} {"train_loss": -10.988402366638184, "global_step": 363820, "epoch": 2165} {"train_loss": -11.220670700073242, "global_step": 363821, "epoch": 2165} {"train_loss": -11.711935997009277, "global_step": 363822, "epoch": 2165} {"train_loss": -10.808679580688477, "global_step": 363823, "epoch": 2165} {"train_loss": -11.86800479888916, "global_step": 363824, "epoch": 2165} {"train_loss": -11.082475662231445, "global_step": 363825, "epoch": 2165} {"train_loss": -10.733634948730469, "global_step": 363826, "epoch": 2165} {"train_loss": -11.144851684570312, "global_step": 363827, "epoch": 2165} {"train_loss": -11.006827354431152, "global_step": 363828, "epoch": 2165} {"train_loss": -10.518369674682617, "global_step": 363829, "epoch": 2165} {"train_loss": -11.058652877807617, "global_step": 363830, "epoch": 2165} {"train_loss": -11.261564254760742, "global_step": 363831, "epoch": 2165} {"train_loss": -10.287288665771484, "global_step": 363832, "epoch": 2165} {"train_loss": -11.703350067138672, "global_step": 363833, "epoch": 2165} {"train_loss": -10.972616195678711, "global_step": 363834, "epoch": 2165} {"train_loss": -11.602697372436523, "global_step": 363835, "epoch": 2165} {"train_loss": -11.343061447143555, "global_step": 363836, "epoch": 2165} {"train_loss": -11.485345840454102, "global_step": 363837, "epoch": 2165} {"train_loss": -11.455011367797852, "global_step": 363838, "epoch": 2165} {"train_loss": -11.757709503173828, "global_step": 363839, "epoch": 2165} {"train_loss": -11.802434921264648, "global_step": 363840, "epoch": 2165} {"train_loss": -11.285440444946289, "global_step": 363841, "epoch": 2165} {"train_loss": -11.680471420288086, "global_step": 363842, "epoch": 2165} {"train_loss": -11.998970031738281, "global_step": 363843, "epoch": 2165} {"train_loss": -11.67509651184082, "global_step": 363844, "epoch": 2165} {"train_loss": -12.327640533447266, "global_step": 363845, "epoch": 2165} {"train_loss": -12.016952514648438, "global_step": 363846, "epoch": 2165} {"train_loss": -11.59914779663086, "global_step": 363847, "epoch": 2165} {"train_loss": -12.113155364990234, "global_step": 363848, "epoch": 2165} {"train_loss": -12.178611755371094, "global_step": 363849, "epoch": 2165} {"train_loss": -12.065420150756836, "global_step": 363850, "epoch": 2165} {"train_loss": -12.16612434387207, "global_step": 363851, "epoch": 2165} {"train_loss": -11.914027214050293, "global_step": 363852, "epoch": 2165} {"train_loss": -11.896974563598633, "global_step": 363853, "epoch": 2165} {"train_loss": -12.003024101257324, "global_step": 363854, "epoch": 2165} {"train_loss": -11.942693710327148, "global_step": 363855, "epoch": 2165} {"train_loss": -12.138126373291016, "global_step": 363856, "epoch": 2165} {"train_loss": -12.167125701904297, "global_step": 363857, "epoch": 2165} {"train_loss": -12.192198753356934, "global_step": 363858, "epoch": 2165} {"train_loss": -12.18299388885498, "global_step": 363859, "epoch": 2165} {"train_loss": -12.312206268310547, "global_step": 363860, "epoch": 2165} {"train_loss": -11.98915958404541, "global_step": 363861, "epoch": 2165} {"train_loss": -12.409463882446289, "global_step": 363862, "epoch": 2165} {"train_loss": -12.104395866394043, "global_step": 363863, "epoch": 2165} {"train_loss": -12.21329402923584, "global_step": 363864, "epoch": 2165} {"train_loss": -12.183096885681152, "global_step": 363865, "epoch": 2165} {"train_loss": -12.268281936645508, "global_step": 363866, "epoch": 2165} {"train_loss": -12.229827880859375, "global_step": 363867, "epoch": 2165} {"train_loss": -12.165306091308594, "global_step": 363868, "epoch": 2165} {"train_loss": -12.322087287902832, "global_step": 363869, "epoch": 2165} {"train_loss": -12.390552520751953, "global_step": 363870, "epoch": 2165} {"train_loss": -12.269250869750977, "global_step": 363871, "epoch": 2165} {"train_loss": -12.271366119384766, "global_step": 363872, "epoch": 2165} {"train_loss": -12.258950233459473, "global_step": 363873, "epoch": 2165} {"train_loss": -12.410871505737305, "global_step": 363874, "epoch": 2165} {"train_loss": -12.328285217285156, "global_step": 363875, "epoch": 2165} {"train_loss": -12.410331726074219, "global_step": 363876, "epoch": 2165} {"train_loss": -12.434514045715332, "global_step": 363877, "epoch": 2165} {"train_loss": -12.414472579956055, "global_step": 363878, "epoch": 2165} {"train_loss": -12.159492492675781, "global_step": 363879, "epoch": 2165} {"train_loss": -12.310166358947754, "global_step": 363880, "epoch": 2165} {"train_loss": -12.387630462646484, "global_step": 363881, "epoch": 2165} {"train_loss": -12.256600379943848, "global_step": 363882, "epoch": 2165} {"train_loss": -12.28223705291748, "global_step": 363883, "epoch": 2165} {"train_loss": -12.42215347290039, "global_step": 363884, "epoch": 2165} {"train_loss": -12.404552459716797, "global_step": 363885, "epoch": 2165} {"train_loss": -12.434317588806152, "global_step": 363886, "epoch": 2165} {"train_loss": -11.697090481008802, "global_step": 363887, "epoch": 2165, "val_loss": 283862.875, "train_action_mse_error": 1.878983974456787} {"train_loss": -12.67338752746582, "global_step": 363888, "epoch": 2166} {"train_loss": -12.356881141662598, "global_step": 363889, "epoch": 2166} {"train_loss": -12.398447036743164, "global_step": 363890, "epoch": 2166} {"train_loss": -12.482654571533203, "global_step": 363891, "epoch": 2166} {"train_loss": -12.622781753540039, "global_step": 363892, "epoch": 2166} {"train_loss": -12.489864349365234, "global_step": 363893, "epoch": 2166} {"train_loss": -12.584625244140625, "global_step": 363894, "epoch": 2166} {"train_loss": -12.34987735748291, "global_step": 363895, "epoch": 2166} {"train_loss": -12.390474319458008, "global_step": 363896, "epoch": 2166} {"train_loss": -12.618255615234375, "global_step": 363897, "epoch": 2166} {"train_loss": -12.445990562438965, "global_step": 363898, "epoch": 2166} {"train_loss": -12.506311416625977, "global_step": 363899, "epoch": 2166} {"train_loss": -12.443190574645996, "global_step": 363900, "epoch": 2166} {"train_loss": -12.713996887207031, "global_step": 363901, "epoch": 2166} {"train_loss": -12.736047744750977, "global_step": 363902, "epoch": 2166} {"train_loss": -12.599788665771484, "global_step": 363903, "epoch": 2166} {"train_loss": -12.634183883666992, "global_step": 363904, "epoch": 2166} {"train_loss": -12.451248168945312, "global_step": 363905, "epoch": 2166} {"train_loss": -12.421401977539062, "global_step": 363906, "epoch": 2166} {"train_loss": -12.698999404907227, "global_step": 363907, "epoch": 2166} {"train_loss": -12.501899719238281, "global_step": 363908, "epoch": 2166} {"train_loss": -12.376816749572754, "global_step": 363909, "epoch": 2166} {"train_loss": -12.374526977539062, "global_step": 363910, "epoch": 2166} {"train_loss": -12.651479721069336, "global_step": 363911, "epoch": 2166} {"train_loss": -12.602874755859375, "global_step": 363912, "epoch": 2166} {"train_loss": -12.350685119628906, "global_step": 363913, "epoch": 2166} {"train_loss": -12.319463729858398, "global_step": 363914, "epoch": 2166} {"train_loss": -11.991445541381836, "global_step": 363915, "epoch": 2166} {"train_loss": -12.138910293579102, "global_step": 363916, "epoch": 2166} {"train_loss": -12.762406349182129, "global_step": 363917, "epoch": 2166} {"train_loss": -12.433356285095215, "global_step": 363918, "epoch": 2166} {"train_loss": -12.659172058105469, "global_step": 363919, "epoch": 2166} {"train_loss": -12.51672077178955, "global_step": 363920, "epoch": 2166} {"train_loss": -12.493829727172852, "global_step": 363921, "epoch": 2166} {"train_loss": -12.032602310180664, "global_step": 363922, "epoch": 2166} {"train_loss": -12.10227108001709, "global_step": 363923, "epoch": 2166} {"train_loss": -12.090164184570312, "global_step": 363924, "epoch": 2166} {"train_loss": -12.293764114379883, "global_step": 363925, "epoch": 2166} {"train_loss": -12.327099800109863, "global_step": 363926, "epoch": 2166} {"train_loss": -12.659931182861328, "global_step": 363927, "epoch": 2166} {"train_loss": -12.583990097045898, "global_step": 363928, "epoch": 2166} {"train_loss": -12.507329940795898, "global_step": 363929, "epoch": 2166} {"train_loss": -12.428430557250977, "global_step": 363930, "epoch": 2166} {"train_loss": -12.53665542602539, "global_step": 363931, "epoch": 2166} {"train_loss": -12.3464937210083, "global_step": 363932, "epoch": 2166} {"train_loss": -12.364888191223145, "global_step": 363933, "epoch": 2166} {"train_loss": -12.425172805786133, "global_step": 363934, "epoch": 2166} {"train_loss": -11.645681381225586, "global_step": 363935, "epoch": 2166} {"train_loss": -11.256814956665039, "global_step": 363936, "epoch": 2166} {"train_loss": -12.192744255065918, "global_step": 363937, "epoch": 2166} {"train_loss": -12.187568664550781, "global_step": 363938, "epoch": 2166} {"train_loss": -11.877352714538574, "global_step": 363939, "epoch": 2166} {"train_loss": -11.106348991394043, "global_step": 363940, "epoch": 2166} {"train_loss": -12.194049835205078, "global_step": 363941, "epoch": 2166} {"train_loss": -11.230802536010742, "global_step": 363942, "epoch": 2166} {"train_loss": -9.356410026550293, "global_step": 363943, "epoch": 2166} {"train_loss": -9.696544647216797, "global_step": 363944, "epoch": 2166} {"train_loss": -11.444414138793945, "global_step": 363945, "epoch": 2166} {"train_loss": -8.8422269821167, "global_step": 363946, "epoch": 2166} {"train_loss": -9.452133178710938, "global_step": 363947, "epoch": 2166} {"train_loss": -9.246706008911133, "global_step": 363948, "epoch": 2166} {"train_loss": -10.641860961914062, "global_step": 363949, "epoch": 2166} {"train_loss": -9.237951278686523, "global_step": 363950, "epoch": 2166} {"train_loss": -7.210906982421875, "global_step": 363951, "epoch": 2166} {"train_loss": -8.463814735412598, "global_step": 363952, "epoch": 2166} {"train_loss": -8.831533432006836, "global_step": 363953, "epoch": 2166} {"train_loss": -9.757406234741211, "global_step": 363954, "epoch": 2166} {"train_loss": -9.320333480834961, "global_step": 363955, "epoch": 2166} {"train_loss": -9.419120788574219, "global_step": 363956, "epoch": 2166} {"train_loss": -8.995969772338867, "global_step": 363957, "epoch": 2166} {"train_loss": -11.167461395263672, "global_step": 363958, "epoch": 2166} {"train_loss": -9.79463005065918, "global_step": 363959, "epoch": 2166} {"train_loss": -10.603144645690918, "global_step": 363960, "epoch": 2166} {"train_loss": -10.177879333496094, "global_step": 363961, "epoch": 2166} {"train_loss": -10.146331787109375, "global_step": 363962, "epoch": 2166} {"train_loss": -10.701464653015137, "global_step": 363963, "epoch": 2166} {"train_loss": -9.775273323059082, "global_step": 363964, "epoch": 2166} {"train_loss": -10.674041748046875, "global_step": 363965, "epoch": 2166} {"train_loss": -10.32759952545166, "global_step": 363966, "epoch": 2166} {"train_loss": -9.601844787597656, "global_step": 363967, "epoch": 2166} {"train_loss": -9.075186729431152, "global_step": 363968, "epoch": 2166} {"train_loss": -10.364250183105469, "global_step": 363969, "epoch": 2166} {"train_loss": -8.63621711730957, "global_step": 363970, "epoch": 2166} {"train_loss": -10.85706901550293, "global_step": 363971, "epoch": 2166} {"train_loss": -9.846634864807129, "global_step": 363972, "epoch": 2166} {"train_loss": -10.359350204467773, "global_step": 363973, "epoch": 2166} {"train_loss": -9.901814460754395, "global_step": 363974, "epoch": 2166} {"train_loss": -10.853816986083984, "global_step": 363975, "epoch": 2166} {"train_loss": -10.711882591247559, "global_step": 363976, "epoch": 2166} {"train_loss": -10.890874862670898, "global_step": 363977, "epoch": 2166} {"train_loss": -11.200927734375, "global_step": 363978, "epoch": 2166} {"train_loss": -10.423447608947754, "global_step": 363979, "epoch": 2166} {"train_loss": -10.497701644897461, "global_step": 363980, "epoch": 2166} {"train_loss": -11.134300231933594, "global_step": 363981, "epoch": 2166} {"train_loss": -11.26900577545166, "global_step": 363982, "epoch": 2166} {"train_loss": -9.874926567077637, "global_step": 363983, "epoch": 2166} {"train_loss": -11.345634460449219, "global_step": 363984, "epoch": 2166} {"train_loss": -10.845197677612305, "global_step": 363985, "epoch": 2166} {"train_loss": -11.12153148651123, "global_step": 363986, "epoch": 2166} {"train_loss": -11.818452835083008, "global_step": 363987, "epoch": 2166} {"train_loss": -11.259666442871094, "global_step": 363988, "epoch": 2166} {"train_loss": -11.486007690429688, "global_step": 363989, "epoch": 2166} {"train_loss": -11.383493423461914, "global_step": 363990, "epoch": 2166} {"train_loss": -11.54847240447998, "global_step": 363991, "epoch": 2166} {"train_loss": -11.802690505981445, "global_step": 363992, "epoch": 2166} {"train_loss": -11.254112243652344, "global_step": 363993, "epoch": 2166} {"train_loss": -11.225541114807129, "global_step": 363994, "epoch": 2166} {"train_loss": -11.768693923950195, "global_step": 363995, "epoch": 2166} {"train_loss": -11.110830307006836, "global_step": 363996, "epoch": 2166} {"train_loss": -11.425764083862305, "global_step": 363997, "epoch": 2166} {"train_loss": -11.847939491271973, "global_step": 363998, "epoch": 2166} {"train_loss": -11.47468376159668, "global_step": 363999, "epoch": 2166} {"train_loss": -11.534405708312988, "global_step": 364000, "epoch": 2166} {"train_loss": -11.869667053222656, "global_step": 364001, "epoch": 2166} {"train_loss": -11.310293197631836, "global_step": 364002, "epoch": 2166} {"train_loss": -11.884495735168457, "global_step": 364003, "epoch": 2166} {"train_loss": -11.754867553710938, "global_step": 364004, "epoch": 2166} {"train_loss": -11.876434326171875, "global_step": 364005, "epoch": 2166} {"train_loss": -11.778375625610352, "global_step": 364006, "epoch": 2166} {"train_loss": -11.774238586425781, "global_step": 364007, "epoch": 2166} {"train_loss": -11.942523002624512, "global_step": 364008, "epoch": 2166} {"train_loss": -11.903923988342285, "global_step": 364009, "epoch": 2166} {"train_loss": -12.159156799316406, "global_step": 364010, "epoch": 2166} {"train_loss": -11.893209457397461, "global_step": 364011, "epoch": 2166} {"train_loss": -12.05882740020752, "global_step": 364012, "epoch": 2166} {"train_loss": -12.124940872192383, "global_step": 364013, "epoch": 2166} {"train_loss": -12.009772300720215, "global_step": 364014, "epoch": 2166} {"train_loss": -12.412515640258789, "global_step": 364015, "epoch": 2166} {"train_loss": -12.154870986938477, "global_step": 364016, "epoch": 2166} {"train_loss": -12.023502349853516, "global_step": 364017, "epoch": 2166} {"train_loss": -12.055543899536133, "global_step": 364018, "epoch": 2166} {"train_loss": -12.217863082885742, "global_step": 364019, "epoch": 2166} {"train_loss": -12.174352645874023, "global_step": 364020, "epoch": 2166} {"train_loss": -12.101917266845703, "global_step": 364021, "epoch": 2166} {"train_loss": -12.320760726928711, "global_step": 364022, "epoch": 2166} {"train_loss": -12.10097885131836, "global_step": 364023, "epoch": 2166} {"train_loss": -12.259780883789062, "global_step": 364024, "epoch": 2166} {"train_loss": -12.067246437072754, "global_step": 364025, "epoch": 2166} {"train_loss": -12.235658645629883, "global_step": 364026, "epoch": 2166} {"train_loss": -12.154207229614258, "global_step": 364027, "epoch": 2166} {"train_loss": -12.379364013671875, "global_step": 364028, "epoch": 2166} {"train_loss": -12.200248718261719, "global_step": 364029, "epoch": 2166} {"train_loss": -12.221569061279297, "global_step": 364030, "epoch": 2166} {"train_loss": -12.156034469604492, "global_step": 364031, "epoch": 2166} {"train_loss": -12.30543041229248, "global_step": 364032, "epoch": 2166} {"train_loss": -12.226463317871094, "global_step": 364033, "epoch": 2166} {"train_loss": -12.151185989379883, "global_step": 364034, "epoch": 2166} {"train_loss": -12.40937614440918, "global_step": 364035, "epoch": 2166} {"train_loss": -12.185933113098145, "global_step": 364036, "epoch": 2166} {"train_loss": -12.373285293579102, "global_step": 364037, "epoch": 2166} {"train_loss": -12.447589874267578, "global_step": 364038, "epoch": 2166} {"train_loss": -12.28586196899414, "global_step": 364039, "epoch": 2166} {"train_loss": -12.41572380065918, "global_step": 364040, "epoch": 2166} {"train_loss": -12.50201416015625, "global_step": 364041, "epoch": 2166} {"train_loss": -12.412240982055664, "global_step": 364042, "epoch": 2166} {"train_loss": -12.275870323181152, "global_step": 364043, "epoch": 2166} {"train_loss": -12.380706787109375, "global_step": 364044, "epoch": 2166} {"train_loss": -12.300357818603516, "global_step": 364045, "epoch": 2166} {"train_loss": -12.362283706665039, "global_step": 364046, "epoch": 2166} {"train_loss": -12.539640426635742, "global_step": 364047, "epoch": 2166} {"train_loss": -12.304543495178223, "global_step": 364048, "epoch": 2166} {"train_loss": -12.558736801147461, "global_step": 364049, "epoch": 2166} {"train_loss": -12.521369934082031, "global_step": 364050, "epoch": 2166} {"train_loss": -12.446231842041016, "global_step": 364051, "epoch": 2166} {"train_loss": -12.498188018798828, "global_step": 364052, "epoch": 2166} {"train_loss": -12.436296463012695, "global_step": 364053, "epoch": 2166} {"train_loss": -12.530746459960938, "global_step": 364054, "epoch": 2166} {"train_loss": -11.625538922491527, "global_step": 364055, "epoch": 2166, "val_loss": 286381.40625} {"train_loss": -12.461492538452148, "global_step": 364056, "epoch": 2167} {"train_loss": -12.355609893798828, "global_step": 364057, "epoch": 2167} {"train_loss": -12.361953735351562, "global_step": 364058, "epoch": 2167} {"train_loss": -12.58979606628418, "global_step": 364059, "epoch": 2167} {"train_loss": -12.372247695922852, "global_step": 364060, "epoch": 2167} {"train_loss": -12.113357543945312, "global_step": 364061, "epoch": 2167} {"train_loss": -12.474944114685059, "global_step": 364062, "epoch": 2167} {"train_loss": -12.171709060668945, "global_step": 364063, "epoch": 2167} {"train_loss": -12.415872573852539, "global_step": 364064, "epoch": 2167} {"train_loss": -12.418031692504883, "global_step": 364065, "epoch": 2167} {"train_loss": -12.503355026245117, "global_step": 364066, "epoch": 2167} {"train_loss": -12.554586410522461, "global_step": 364067, "epoch": 2167} {"train_loss": -12.529385566711426, "global_step": 364068, "epoch": 2167} {"train_loss": -12.477272033691406, "global_step": 364069, "epoch": 2167} {"train_loss": -12.389140129089355, "global_step": 364070, "epoch": 2167} {"train_loss": -12.337712287902832, "global_step": 364071, "epoch": 2167} {"train_loss": -12.483762741088867, "global_step": 364072, "epoch": 2167} {"train_loss": -12.536444664001465, "global_step": 364073, "epoch": 2167} {"train_loss": -12.588212966918945, "global_step": 364074, "epoch": 2167} {"train_loss": -12.652276992797852, "global_step": 364075, "epoch": 2167} {"train_loss": -12.554973602294922, "global_step": 364076, "epoch": 2167} {"train_loss": -12.308332443237305, "global_step": 364077, "epoch": 2167} {"train_loss": -12.560076713562012, "global_step": 364078, "epoch": 2167} {"train_loss": -12.508509635925293, "global_step": 364079, "epoch": 2167} {"train_loss": -12.651811599731445, "global_step": 364080, "epoch": 2167} {"train_loss": -12.687023162841797, "global_step": 364081, "epoch": 2167} {"train_loss": -12.189216613769531, "global_step": 364082, "epoch": 2167} {"train_loss": -12.34524154663086, "global_step": 364083, "epoch": 2167} {"train_loss": -12.387025833129883, "global_step": 364084, "epoch": 2167} {"train_loss": -12.57374095916748, "global_step": 364085, "epoch": 2167} {"train_loss": -11.99329948425293, "global_step": 364086, "epoch": 2167} {"train_loss": -11.829442977905273, "global_step": 364087, "epoch": 2167} {"train_loss": -12.139304161071777, "global_step": 364088, "epoch": 2167} {"train_loss": -12.641283988952637, "global_step": 364089, "epoch": 2167} {"train_loss": -12.12378978729248, "global_step": 364090, "epoch": 2167} {"train_loss": -11.746660232543945, "global_step": 364091, "epoch": 2167} {"train_loss": -11.964985847473145, "global_step": 364092, "epoch": 2167} {"train_loss": -12.245641708374023, "global_step": 364093, "epoch": 2167} {"train_loss": -12.602761268615723, "global_step": 364094, "epoch": 2167} {"train_loss": -12.63850212097168, "global_step": 364095, "epoch": 2167} {"train_loss": -12.139737129211426, "global_step": 364096, "epoch": 2167} {"train_loss": -11.900971412658691, "global_step": 364097, "epoch": 2167} {"train_loss": -12.31113052368164, "global_step": 364098, "epoch": 2167} {"train_loss": -11.948258399963379, "global_step": 364099, "epoch": 2167} {"train_loss": -11.999340057373047, "global_step": 364100, "epoch": 2167} {"train_loss": -10.584875106811523, "global_step": 364101, "epoch": 2167} {"train_loss": -11.23965835571289, "global_step": 364102, "epoch": 2167} {"train_loss": -12.196817398071289, "global_step": 364103, "epoch": 2167} {"train_loss": -11.528152465820312, "global_step": 364104, "epoch": 2167} {"train_loss": -11.663012504577637, "global_step": 364105, "epoch": 2167} {"train_loss": -12.104609489440918, "global_step": 364106, "epoch": 2167} {"train_loss": -11.709165573120117, "global_step": 364107, "epoch": 2167} {"train_loss": -11.68426513671875, "global_step": 364108, "epoch": 2167} {"train_loss": -12.3260498046875, "global_step": 364109, "epoch": 2167} {"train_loss": -11.747699737548828, "global_step": 364110, "epoch": 2167} {"train_loss": -12.138044357299805, "global_step": 364111, "epoch": 2167} {"train_loss": -12.35840892791748, "global_step": 364112, "epoch": 2167} {"train_loss": -12.096384048461914, "global_step": 364113, "epoch": 2167} {"train_loss": -11.718517303466797, "global_step": 364114, "epoch": 2167} {"train_loss": -11.269508361816406, "global_step": 364115, "epoch": 2167} {"train_loss": -12.439414024353027, "global_step": 364116, "epoch": 2167} {"train_loss": -11.550304412841797, "global_step": 364117, "epoch": 2167} {"train_loss": -11.814191818237305, "global_step": 364118, "epoch": 2167} {"train_loss": -12.261281967163086, "global_step": 364119, "epoch": 2167} {"train_loss": -12.02935791015625, "global_step": 364120, "epoch": 2167} {"train_loss": -11.589595794677734, "global_step": 364121, "epoch": 2167} {"train_loss": -11.487854957580566, "global_step": 364122, "epoch": 2167} {"train_loss": -12.12718391418457, "global_step": 364123, "epoch": 2167} {"train_loss": -12.036541938781738, "global_step": 364124, "epoch": 2167} {"train_loss": -11.85646915435791, "global_step": 364125, "epoch": 2167} {"train_loss": -12.125877380371094, "global_step": 364126, "epoch": 2167} {"train_loss": -11.30624008178711, "global_step": 364127, "epoch": 2167} {"train_loss": -12.249210357666016, "global_step": 364128, "epoch": 2167} {"train_loss": -11.493488311767578, "global_step": 364129, "epoch": 2167} {"train_loss": -11.802945137023926, "global_step": 364130, "epoch": 2167} {"train_loss": -11.284997940063477, "global_step": 364131, "epoch": 2167} {"train_loss": -12.203805923461914, "global_step": 364132, "epoch": 2167} {"train_loss": -10.895209312438965, "global_step": 364133, "epoch": 2167} {"train_loss": -12.020543098449707, "global_step": 364134, "epoch": 2167} {"train_loss": -11.435510635375977, "global_step": 364135, "epoch": 2167} {"train_loss": -11.287626266479492, "global_step": 364136, "epoch": 2167} {"train_loss": -11.526521682739258, "global_step": 364137, "epoch": 2167} {"train_loss": -12.057985305786133, "global_step": 364138, "epoch": 2167} {"train_loss": -11.943906784057617, "global_step": 364139, "epoch": 2167} {"train_loss": -11.979947090148926, "global_step": 364140, "epoch": 2167} {"train_loss": -12.12041187286377, "global_step": 364141, "epoch": 2167} {"train_loss": -11.886621475219727, "global_step": 364142, "epoch": 2167} {"train_loss": -11.876153945922852, "global_step": 364143, "epoch": 2167} {"train_loss": -12.277259826660156, "global_step": 364144, "epoch": 2167} {"train_loss": -11.839693069458008, "global_step": 364145, "epoch": 2167} {"train_loss": -11.764723777770996, "global_step": 364146, "epoch": 2167} {"train_loss": -12.326790809631348, "global_step": 364147, "epoch": 2167} {"train_loss": -12.187440872192383, "global_step": 364148, "epoch": 2167} {"train_loss": -12.379192352294922, "global_step": 364149, "epoch": 2167} {"train_loss": -12.359384536743164, "global_step": 364150, "epoch": 2167} {"train_loss": -12.300090789794922, "global_step": 364151, "epoch": 2167} {"train_loss": -12.48429012298584, "global_step": 364152, "epoch": 2167} {"train_loss": -11.799097061157227, "global_step": 364153, "epoch": 2167} {"train_loss": -12.166580200195312, "global_step": 364154, "epoch": 2167} {"train_loss": -11.921693801879883, "global_step": 364155, "epoch": 2167} {"train_loss": -12.538040161132812, "global_step": 364156, "epoch": 2167} {"train_loss": -12.013839721679688, "global_step": 364157, "epoch": 2167} {"train_loss": -12.102884292602539, "global_step": 364158, "epoch": 2167} {"train_loss": -12.497705459594727, "global_step": 364159, "epoch": 2167} {"train_loss": -12.12843132019043, "global_step": 364160, "epoch": 2167} {"train_loss": -12.540056228637695, "global_step": 364161, "epoch": 2167} {"train_loss": -12.30900764465332, "global_step": 364162, "epoch": 2167} {"train_loss": -12.204294204711914, "global_step": 364163, "epoch": 2167} {"train_loss": -12.413219451904297, "global_step": 364164, "epoch": 2167} {"train_loss": -12.108991622924805, "global_step": 364165, "epoch": 2167} {"train_loss": -11.810663223266602, "global_step": 364166, "epoch": 2167} {"train_loss": -12.373963356018066, "global_step": 364167, "epoch": 2167} {"train_loss": -12.084484100341797, "global_step": 364168, "epoch": 2167} {"train_loss": -12.20515251159668, "global_step": 364169, "epoch": 2167} {"train_loss": -12.297542572021484, "global_step": 364170, "epoch": 2167} {"train_loss": -12.372461318969727, "global_step": 364171, "epoch": 2167} {"train_loss": -12.089757919311523, "global_step": 364172, "epoch": 2167} {"train_loss": -12.547829627990723, "global_step": 364173, "epoch": 2167} {"train_loss": -12.226988792419434, "global_step": 364174, "epoch": 2167} {"train_loss": -12.465727806091309, "global_step": 364175, "epoch": 2167} {"train_loss": -11.956082344055176, "global_step": 364176, "epoch": 2167} {"train_loss": -12.387203216552734, "global_step": 364177, "epoch": 2167} {"train_loss": -12.200980186462402, "global_step": 364178, "epoch": 2167} {"train_loss": -12.699419021606445, "global_step": 364179, "epoch": 2167} {"train_loss": -12.479426383972168, "global_step": 364180, "epoch": 2167} {"train_loss": -12.32598876953125, "global_step": 364181, "epoch": 2167} {"train_loss": -12.563100814819336, "global_step": 364182, "epoch": 2167} {"train_loss": -12.454522132873535, "global_step": 364183, "epoch": 2167} {"train_loss": -12.477869033813477, "global_step": 364184, "epoch": 2167} {"train_loss": -12.446534156799316, "global_step": 364185, "epoch": 2167} {"train_loss": -12.44127082824707, "global_step": 364186, "epoch": 2167} {"train_loss": -12.30327320098877, "global_step": 364187, "epoch": 2167} {"train_loss": -12.472827911376953, "global_step": 364188, "epoch": 2167} {"train_loss": -12.398168563842773, "global_step": 364189, "epoch": 2167} {"train_loss": -12.074636459350586, "global_step": 364190, "epoch": 2167} {"train_loss": -12.079733848571777, "global_step": 364191, "epoch": 2167} {"train_loss": -12.296234130859375, "global_step": 364192, "epoch": 2167} {"train_loss": -12.533794403076172, "global_step": 364193, "epoch": 2167} {"train_loss": -12.264110565185547, "global_step": 364194, "epoch": 2167} {"train_loss": -12.408146858215332, "global_step": 364195, "epoch": 2167} {"train_loss": -12.442499160766602, "global_step": 364196, "epoch": 2167} {"train_loss": -12.48443603515625, "global_step": 364197, "epoch": 2167} {"train_loss": -12.39787483215332, "global_step": 364198, "epoch": 2167} {"train_loss": -12.323123931884766, "global_step": 364199, "epoch": 2167} {"train_loss": -12.413946151733398, "global_step": 364200, "epoch": 2167} {"train_loss": -12.291508674621582, "global_step": 364201, "epoch": 2167} {"train_loss": -12.203707695007324, "global_step": 364202, "epoch": 2167} {"train_loss": -12.093402862548828, "global_step": 364203, "epoch": 2167} {"train_loss": -12.37732982635498, "global_step": 364204, "epoch": 2167} {"train_loss": -12.158573150634766, "global_step": 364205, "epoch": 2167} {"train_loss": -12.503534317016602, "global_step": 364206, "epoch": 2167} {"train_loss": -11.825590133666992, "global_step": 364207, "epoch": 2167} {"train_loss": -12.206798553466797, "global_step": 364208, "epoch": 2167} {"train_loss": -12.487839698791504, "global_step": 364209, "epoch": 2167} {"train_loss": -11.999147415161133, "global_step": 364210, "epoch": 2167} {"train_loss": -11.522581100463867, "global_step": 364211, "epoch": 2167} {"train_loss": -12.087712287902832, "global_step": 364212, "epoch": 2167} {"train_loss": -9.413522720336914, "global_step": 364213, "epoch": 2167} {"train_loss": -11.010321617126465, "global_step": 364214, "epoch": 2167} {"train_loss": -12.177757263183594, "global_step": 364215, "epoch": 2167} {"train_loss": -10.974356651306152, "global_step": 364216, "epoch": 2167} {"train_loss": -11.776898384094238, "global_step": 364217, "epoch": 2167} {"train_loss": -12.366636276245117, "global_step": 364218, "epoch": 2167} {"train_loss": -11.957637786865234, "global_step": 364219, "epoch": 2167} {"train_loss": -11.730230331420898, "global_step": 364220, "epoch": 2167} {"train_loss": -12.2259521484375, "global_step": 364221, "epoch": 2167} {"train_loss": -12.399538040161133, "global_step": 364222, "epoch": 2167} {"train_loss": -12.12543367204212, "global_step": 364223, "epoch": 2167, "val_loss": 290986.59375} {"train_loss": -11.440500259399414, "global_step": 364224, "epoch": 2168} {"train_loss": -11.853080749511719, "global_step": 364225, "epoch": 2168} {"train_loss": -12.034353256225586, "global_step": 364226, "epoch": 2168} {"train_loss": -11.566761016845703, "global_step": 364227, "epoch": 2168} {"train_loss": -12.185688018798828, "global_step": 364228, "epoch": 2168} {"train_loss": -12.024089813232422, "global_step": 364229, "epoch": 2168} {"train_loss": -11.074272155761719, "global_step": 364230, "epoch": 2168} {"train_loss": -11.261470794677734, "global_step": 364231, "epoch": 2168} {"train_loss": -10.881376266479492, "global_step": 364232, "epoch": 2168} {"train_loss": -10.141119003295898, "global_step": 364233, "epoch": 2168} {"train_loss": -11.939603805541992, "global_step": 364234, "epoch": 2168} {"train_loss": -10.54422378540039, "global_step": 364235, "epoch": 2168} {"train_loss": -11.02248477935791, "global_step": 364236, "epoch": 2168} {"train_loss": -9.754461288452148, "global_step": 364237, "epoch": 2168} {"train_loss": -9.265151977539062, "global_step": 364238, "epoch": 2168} {"train_loss": -8.399665832519531, "global_step": 364239, "epoch": 2168} {"train_loss": -9.097543716430664, "global_step": 364240, "epoch": 2168} {"train_loss": -9.640984535217285, "global_step": 364241, "epoch": 2168} {"train_loss": -10.122867584228516, "global_step": 364242, "epoch": 2168} {"train_loss": -10.034836769104004, "global_step": 364243, "epoch": 2168} {"train_loss": -8.726083755493164, "global_step": 364244, "epoch": 2168} {"train_loss": -9.29615592956543, "global_step": 364245, "epoch": 2168} {"train_loss": -9.922449111938477, "global_step": 364246, "epoch": 2168} {"train_loss": -10.401100158691406, "global_step": 364247, "epoch": 2168} {"train_loss": -10.048969268798828, "global_step": 364248, "epoch": 2168} {"train_loss": -11.316996574401855, "global_step": 364249, "epoch": 2168} {"train_loss": -10.183393478393555, "global_step": 364250, "epoch": 2168} {"train_loss": -11.580556869506836, "global_step": 364251, "epoch": 2168} {"train_loss": -10.869699478149414, "global_step": 364252, "epoch": 2168} {"train_loss": -11.537147521972656, "global_step": 364253, "epoch": 2168} {"train_loss": -10.637645721435547, "global_step": 364254, "epoch": 2168} {"train_loss": -11.425735473632812, "global_step": 364255, "epoch": 2168} {"train_loss": -11.164955139160156, "global_step": 364256, "epoch": 2168} {"train_loss": -11.199312210083008, "global_step": 364257, "epoch": 2168} {"train_loss": -11.835477828979492, "global_step": 364258, "epoch": 2168} {"train_loss": -11.024003982543945, "global_step": 364259, "epoch": 2168} {"train_loss": -12.0343017578125, "global_step": 364260, "epoch": 2168} {"train_loss": -11.27883529663086, "global_step": 364261, "epoch": 2168} {"train_loss": -11.59174919128418, "global_step": 364262, "epoch": 2168} {"train_loss": -11.925811767578125, "global_step": 364263, "epoch": 2168} {"train_loss": -11.828252792358398, "global_step": 364264, "epoch": 2168} {"train_loss": -11.623634338378906, "global_step": 364265, "epoch": 2168} {"train_loss": -11.83689022064209, "global_step": 364266, "epoch": 2168} {"train_loss": -11.937418937683105, "global_step": 364267, "epoch": 2168} {"train_loss": -11.737611770629883, "global_step": 364268, "epoch": 2168} {"train_loss": -11.989130020141602, "global_step": 364269, "epoch": 2168} {"train_loss": -11.62743091583252, "global_step": 364270, "epoch": 2168} {"train_loss": -12.27382755279541, "global_step": 364271, "epoch": 2168} {"train_loss": -11.705257415771484, "global_step": 364272, "epoch": 2168} {"train_loss": -12.101863861083984, "global_step": 364273, "epoch": 2168} {"train_loss": -12.08952522277832, "global_step": 364274, "epoch": 2168} {"train_loss": -12.110764503479004, "global_step": 364275, "epoch": 2168} {"train_loss": -12.21187686920166, "global_step": 364276, "epoch": 2168} {"train_loss": -12.330723762512207, "global_step": 364277, "epoch": 2168} {"train_loss": -12.251885414123535, "global_step": 364278, "epoch": 2168} {"train_loss": -12.26331901550293, "global_step": 364279, "epoch": 2168} {"train_loss": -12.130989074707031, "global_step": 364280, "epoch": 2168} {"train_loss": -12.381597518920898, "global_step": 364281, "epoch": 2168} {"train_loss": -12.350815773010254, "global_step": 364282, "epoch": 2168} {"train_loss": -12.393407821655273, "global_step": 364283, "epoch": 2168} {"train_loss": -12.242422103881836, "global_step": 364284, "epoch": 2168} {"train_loss": -12.132966041564941, "global_step": 364285, "epoch": 2168} {"train_loss": -12.248069763183594, "global_step": 364286, "epoch": 2168} {"train_loss": -12.161911964416504, "global_step": 364287, "epoch": 2168} {"train_loss": -12.08035659790039, "global_step": 364288, "epoch": 2168} {"train_loss": -12.345756530761719, "global_step": 364289, "epoch": 2168} {"train_loss": -12.103109359741211, "global_step": 364290, "epoch": 2168} {"train_loss": -12.365680694580078, "global_step": 364291, "epoch": 2168} {"train_loss": -12.293777465820312, "global_step": 364292, "epoch": 2168} {"train_loss": -12.462825775146484, "global_step": 364293, "epoch": 2168} {"train_loss": -12.330327987670898, "global_step": 364294, "epoch": 2168} {"train_loss": -12.430961608886719, "global_step": 364295, "epoch": 2168} {"train_loss": -12.46249008178711, "global_step": 364296, "epoch": 2168} {"train_loss": -12.440479278564453, "global_step": 364297, "epoch": 2168} {"train_loss": -12.525473594665527, "global_step": 364298, "epoch": 2168} {"train_loss": -12.470476150512695, "global_step": 364299, "epoch": 2168} {"train_loss": -12.378730773925781, "global_step": 364300, "epoch": 2168} {"train_loss": -12.50505256652832, "global_step": 364301, "epoch": 2168} {"train_loss": -12.271449089050293, "global_step": 364302, "epoch": 2168} {"train_loss": -12.27718734741211, "global_step": 364303, "epoch": 2168} {"train_loss": -12.33177375793457, "global_step": 364304, "epoch": 2168} {"train_loss": -12.228147506713867, "global_step": 364305, "epoch": 2168} {"train_loss": -12.536521911621094, "global_step": 364306, "epoch": 2168} {"train_loss": -12.216917991638184, "global_step": 364307, "epoch": 2168} {"train_loss": -12.657573699951172, "global_step": 364308, "epoch": 2168} {"train_loss": -12.29896354675293, "global_step": 364309, "epoch": 2168} {"train_loss": -12.316841125488281, "global_step": 364310, "epoch": 2168} {"train_loss": -12.413281440734863, "global_step": 364311, "epoch": 2168} {"train_loss": -12.575685501098633, "global_step": 364312, "epoch": 2168} {"train_loss": -12.572443008422852, "global_step": 364313, "epoch": 2168} {"train_loss": -12.434728622436523, "global_step": 364314, "epoch": 2168} {"train_loss": -12.533920288085938, "global_step": 364315, "epoch": 2168} {"train_loss": -12.672043800354004, "global_step": 364316, "epoch": 2168} {"train_loss": -12.283790588378906, "global_step": 364317, "epoch": 2168} {"train_loss": -12.466419219970703, "global_step": 364318, "epoch": 2168} {"train_loss": -12.724530220031738, "global_step": 364319, "epoch": 2168} {"train_loss": -12.499052047729492, "global_step": 364320, "epoch": 2168} {"train_loss": -12.627913475036621, "global_step": 364321, "epoch": 2168} {"train_loss": -12.42645263671875, "global_step": 364322, "epoch": 2168} {"train_loss": -12.502435684204102, "global_step": 364323, "epoch": 2168} {"train_loss": -12.522846221923828, "global_step": 364324, "epoch": 2168} {"train_loss": -12.448820114135742, "global_step": 364325, "epoch": 2168} {"train_loss": -12.613609313964844, "global_step": 364326, "epoch": 2168} {"train_loss": -12.583311080932617, "global_step": 364327, "epoch": 2168} {"train_loss": -12.273934364318848, "global_step": 364328, "epoch": 2168} {"train_loss": -12.490074157714844, "global_step": 364329, "epoch": 2168} {"train_loss": -12.589950561523438, "global_step": 364330, "epoch": 2168} {"train_loss": -12.472158432006836, "global_step": 364331, "epoch": 2168} {"train_loss": -12.619633674621582, "global_step": 364332, "epoch": 2168} {"train_loss": -12.743406295776367, "global_step": 364333, "epoch": 2168} {"train_loss": -12.767711639404297, "global_step": 364334, "epoch": 2168} {"train_loss": -12.576438903808594, "global_step": 364335, "epoch": 2168} {"train_loss": -12.666034698486328, "global_step": 364336, "epoch": 2168} {"train_loss": -12.408916473388672, "global_step": 364337, "epoch": 2168} {"train_loss": -12.545244216918945, "global_step": 364338, "epoch": 2168} {"train_loss": -12.629546165466309, "global_step": 364339, "epoch": 2168} {"train_loss": -12.669581413269043, "global_step": 364340, "epoch": 2168} {"train_loss": -12.125922203063965, "global_step": 364341, "epoch": 2168} {"train_loss": -11.709860801696777, "global_step": 364342, "epoch": 2168} {"train_loss": -12.573195457458496, "global_step": 364343, "epoch": 2168} {"train_loss": -11.776816368103027, "global_step": 364344, "epoch": 2168} {"train_loss": -12.252246856689453, "global_step": 364345, "epoch": 2168} {"train_loss": -11.878289222717285, "global_step": 364346, "epoch": 2168} {"train_loss": -12.291172981262207, "global_step": 364347, "epoch": 2168} {"train_loss": -11.597129821777344, "global_step": 364348, "epoch": 2168} {"train_loss": -12.33108139038086, "global_step": 364349, "epoch": 2168} {"train_loss": -10.184659957885742, "global_step": 364350, "epoch": 2168} {"train_loss": -11.864289283752441, "global_step": 364351, "epoch": 2168} {"train_loss": -10.67734432220459, "global_step": 364352, "epoch": 2168} {"train_loss": -11.520637512207031, "global_step": 364353, "epoch": 2168} {"train_loss": -11.623356819152832, "global_step": 364354, "epoch": 2168} {"train_loss": -12.03618335723877, "global_step": 364355, "epoch": 2168} {"train_loss": -11.0938720703125, "global_step": 364356, "epoch": 2168} {"train_loss": -12.157617568969727, "global_step": 364357, "epoch": 2168} {"train_loss": -11.190999984741211, "global_step": 364358, "epoch": 2168} {"train_loss": -11.353622436523438, "global_step": 364359, "epoch": 2168} {"train_loss": -11.078409194946289, "global_step": 364360, "epoch": 2168} {"train_loss": -12.275900840759277, "global_step": 364361, "epoch": 2168} {"train_loss": -9.852956771850586, "global_step": 364362, "epoch": 2168} {"train_loss": -11.868998527526855, "global_step": 364363, "epoch": 2168} {"train_loss": -10.990557670593262, "global_step": 364364, "epoch": 2168} {"train_loss": -10.558162689208984, "global_step": 364365, "epoch": 2168} {"train_loss": -8.771749496459961, "global_step": 364366, "epoch": 2168} {"train_loss": -10.049951553344727, "global_step": 364367, "epoch": 2168} {"train_loss": -9.70147705078125, "global_step": 364368, "epoch": 2168} {"train_loss": -9.467170715332031, "global_step": 364369, "epoch": 2168} {"train_loss": -9.583009719848633, "global_step": 364370, "epoch": 2168} {"train_loss": -7.9955902099609375, "global_step": 364371, "epoch": 2168} {"train_loss": -9.853933334350586, "global_step": 364372, "epoch": 2168} {"train_loss": -8.65501594543457, "global_step": 364373, "epoch": 2168} {"train_loss": -8.58702564239502, "global_step": 364374, "epoch": 2168} {"train_loss": -10.328832626342773, "global_step": 364375, "epoch": 2168} {"train_loss": -9.150012969970703, "global_step": 364376, "epoch": 2168} {"train_loss": -10.006575584411621, "global_step": 364377, "epoch": 2168} {"train_loss": -10.619629859924316, "global_step": 364378, "epoch": 2168} {"train_loss": -10.044035911560059, "global_step": 364379, "epoch": 2168} {"train_loss": -10.663825035095215, "global_step": 364380, "epoch": 2168} {"train_loss": -10.746879577636719, "global_step": 364381, "epoch": 2168} {"train_loss": -9.815774917602539, "global_step": 364382, "epoch": 2168} {"train_loss": -8.913686752319336, "global_step": 364383, "epoch": 2168} {"train_loss": -10.571306228637695, "global_step": 364384, "epoch": 2168} {"train_loss": -10.090089797973633, "global_step": 364385, "epoch": 2168} {"train_loss": -10.264809608459473, "global_step": 364386, "epoch": 2168} {"train_loss": -10.950080871582031, "global_step": 364387, "epoch": 2168} {"train_loss": -10.761907577514648, "global_step": 364388, "epoch": 2168} {"train_loss": -10.721893310546875, "global_step": 364389, "epoch": 2168} {"train_loss": -11.531639099121094, "global_step": 364390, "epoch": 2168} {"train_loss": -11.494143894740514, "global_step": 364391, "epoch": 2168, "val_loss": 286959.96875} {"train_loss": -11.287651062011719, "global_step": 364392, "epoch": 2169} {"train_loss": -11.30860424041748, "global_step": 364393, "epoch": 2169} {"train_loss": -10.641494750976562, "global_step": 364394, "epoch": 2169} {"train_loss": -11.635513305664062, "global_step": 364395, "epoch": 2169} {"train_loss": -10.849424362182617, "global_step": 364396, "epoch": 2169} {"train_loss": -11.340677261352539, "global_step": 364397, "epoch": 2169} {"train_loss": -10.95627212524414, "global_step": 364398, "epoch": 2169} {"train_loss": -11.181373596191406, "global_step": 364399, "epoch": 2169} {"train_loss": -11.405550003051758, "global_step": 364400, "epoch": 2169} {"train_loss": -11.487039566040039, "global_step": 364401, "epoch": 2169} {"train_loss": -11.735812187194824, "global_step": 364402, "epoch": 2169} {"train_loss": -11.560991287231445, "global_step": 364403, "epoch": 2169} {"train_loss": -11.352001190185547, "global_step": 364404, "epoch": 2169} {"train_loss": -11.58883285522461, "global_step": 364405, "epoch": 2169} {"train_loss": -11.908166885375977, "global_step": 364406, "epoch": 2169} {"train_loss": -11.5960111618042, "global_step": 364407, "epoch": 2169} {"train_loss": -12.024971008300781, "global_step": 364408, "epoch": 2169} {"train_loss": -11.372791290283203, "global_step": 364409, "epoch": 2169} {"train_loss": -11.809768676757812, "global_step": 364410, "epoch": 2169} {"train_loss": -11.106572151184082, "global_step": 364411, "epoch": 2169} {"train_loss": -11.905160903930664, "global_step": 364412, "epoch": 2169} {"train_loss": -11.138605117797852, "global_step": 364413, "epoch": 2169} {"train_loss": -11.860209465026855, "global_step": 364414, "epoch": 2169} {"train_loss": -11.116476058959961, "global_step": 364415, "epoch": 2169} {"train_loss": -11.9476318359375, "global_step": 364416, "epoch": 2169} {"train_loss": -11.46027660369873, "global_step": 364417, "epoch": 2169} {"train_loss": -12.06257438659668, "global_step": 364418, "epoch": 2169} {"train_loss": -11.705585479736328, "global_step": 364419, "epoch": 2169} {"train_loss": -12.230389595031738, "global_step": 364420, "epoch": 2169} {"train_loss": -11.753564834594727, "global_step": 364421, "epoch": 2169} {"train_loss": -11.839256286621094, "global_step": 364422, "epoch": 2169} {"train_loss": -12.016921043395996, "global_step": 364423, "epoch": 2169} {"train_loss": -11.960362434387207, "global_step": 364424, "epoch": 2169} {"train_loss": -11.889328002929688, "global_step": 364425, "epoch": 2169} {"train_loss": -11.983198165893555, "global_step": 364426, "epoch": 2169} {"train_loss": -12.207143783569336, "global_step": 364427, "epoch": 2169} {"train_loss": -11.800274848937988, "global_step": 364428, "epoch": 2169} {"train_loss": -12.075475692749023, "global_step": 364429, "epoch": 2169} {"train_loss": -12.178035736083984, "global_step": 364430, "epoch": 2169} {"train_loss": -12.381490707397461, "global_step": 364431, "epoch": 2169} {"train_loss": -11.94523811340332, "global_step": 364432, "epoch": 2169} {"train_loss": -12.359968185424805, "global_step": 364433, "epoch": 2169} {"train_loss": -12.167303085327148, "global_step": 364434, "epoch": 2169} {"train_loss": -12.263980865478516, "global_step": 364435, "epoch": 2169} {"train_loss": -12.301483154296875, "global_step": 364436, "epoch": 2169} {"train_loss": -12.297210693359375, "global_step": 364437, "epoch": 2169} {"train_loss": -12.180599212646484, "global_step": 364438, "epoch": 2169} {"train_loss": -12.137224197387695, "global_step": 364439, "epoch": 2169} {"train_loss": -12.162015914916992, "global_step": 364440, "epoch": 2169} {"train_loss": -12.432887077331543, "global_step": 364441, "epoch": 2169} {"train_loss": -12.380056381225586, "global_step": 364442, "epoch": 2169} {"train_loss": -12.164396286010742, "global_step": 364443, "epoch": 2169} {"train_loss": -12.29513931274414, "global_step": 364444, "epoch": 2169} {"train_loss": -12.318002700805664, "global_step": 364445, "epoch": 2169} {"train_loss": -12.3441162109375, "global_step": 364446, "epoch": 2169} {"train_loss": -12.215770721435547, "global_step": 364447, "epoch": 2169} {"train_loss": -12.517961502075195, "global_step": 364448, "epoch": 2169} {"train_loss": -12.359861373901367, "global_step": 364449, "epoch": 2169} {"train_loss": -12.52487564086914, "global_step": 364450, "epoch": 2169} {"train_loss": -12.484329223632812, "global_step": 364451, "epoch": 2169} {"train_loss": -12.347453117370605, "global_step": 364452, "epoch": 2169} {"train_loss": -12.575560569763184, "global_step": 364453, "epoch": 2169} {"train_loss": -12.33144474029541, "global_step": 364454, "epoch": 2169} {"train_loss": -12.370382308959961, "global_step": 364455, "epoch": 2169} {"train_loss": -12.626792907714844, "global_step": 364456, "epoch": 2169} {"train_loss": -12.120365142822266, "global_step": 364457, "epoch": 2169} {"train_loss": -12.323160171508789, "global_step": 364458, "epoch": 2169} {"train_loss": -12.527776718139648, "global_step": 364459, "epoch": 2169} {"train_loss": -12.43040943145752, "global_step": 364460, "epoch": 2169} {"train_loss": -12.623186111450195, "global_step": 364461, "epoch": 2169} {"train_loss": -12.16295337677002, "global_step": 364462, "epoch": 2169} {"train_loss": -12.272993087768555, "global_step": 364463, "epoch": 2169} {"train_loss": -12.502197265625, "global_step": 364464, "epoch": 2169} {"train_loss": -12.198040008544922, "global_step": 364465, "epoch": 2169} {"train_loss": -12.401451110839844, "global_step": 364466, "epoch": 2169} {"train_loss": -12.139434814453125, "global_step": 364467, "epoch": 2169} {"train_loss": -12.226807594299316, "global_step": 364468, "epoch": 2169} {"train_loss": -12.41239070892334, "global_step": 364469, "epoch": 2169} {"train_loss": -12.11216926574707, "global_step": 364470, "epoch": 2169} {"train_loss": -12.15589427947998, "global_step": 364471, "epoch": 2169} {"train_loss": -12.443841934204102, "global_step": 364472, "epoch": 2169} {"train_loss": -11.711217880249023, "global_step": 364473, "epoch": 2169} {"train_loss": -12.218303680419922, "global_step": 364474, "epoch": 2169} {"train_loss": -12.636669158935547, "global_step": 364475, "epoch": 2169} {"train_loss": -11.894662857055664, "global_step": 364476, "epoch": 2169} {"train_loss": -12.0615816116333, "global_step": 364477, "epoch": 2169} {"train_loss": -12.214555740356445, "global_step": 364478, "epoch": 2169} {"train_loss": -12.276315689086914, "global_step": 364479, "epoch": 2169} {"train_loss": -12.208549499511719, "global_step": 364480, "epoch": 2169} {"train_loss": -12.36095142364502, "global_step": 364481, "epoch": 2169} {"train_loss": -11.788961410522461, "global_step": 364482, "epoch": 2169} {"train_loss": -11.959221839904785, "global_step": 364483, "epoch": 2169} {"train_loss": -12.249210357666016, "global_step": 364484, "epoch": 2169} {"train_loss": -12.09150505065918, "global_step": 364485, "epoch": 2169} {"train_loss": -12.210670471191406, "global_step": 364486, "epoch": 2169} {"train_loss": -12.23028564453125, "global_step": 364487, "epoch": 2169} {"train_loss": -11.92009162902832, "global_step": 364488, "epoch": 2169} {"train_loss": -12.428421974182129, "global_step": 364489, "epoch": 2169} {"train_loss": -12.024248123168945, "global_step": 364490, "epoch": 2169} {"train_loss": -11.942150115966797, "global_step": 364491, "epoch": 2169} {"train_loss": -12.320226669311523, "global_step": 364492, "epoch": 2169} {"train_loss": -11.415143966674805, "global_step": 364493, "epoch": 2169} {"train_loss": -12.01386833190918, "global_step": 364494, "epoch": 2169} {"train_loss": -12.205221176147461, "global_step": 364495, "epoch": 2169} {"train_loss": -12.043281555175781, "global_step": 364496, "epoch": 2169} {"train_loss": -12.273001670837402, "global_step": 364497, "epoch": 2169} {"train_loss": -12.0992431640625, "global_step": 364498, "epoch": 2169} {"train_loss": -12.067733764648438, "global_step": 364499, "epoch": 2169} {"train_loss": -12.424274444580078, "global_step": 364500, "epoch": 2169} {"train_loss": -11.975883483886719, "global_step": 364501, "epoch": 2169} {"train_loss": -12.455937385559082, "global_step": 364502, "epoch": 2169} {"train_loss": -12.169776916503906, "global_step": 364503, "epoch": 2169} {"train_loss": -11.798410415649414, "global_step": 364504, "epoch": 2169} {"train_loss": -12.496591567993164, "global_step": 364505, "epoch": 2169} {"train_loss": -11.954771041870117, "global_step": 364506, "epoch": 2169} {"train_loss": -12.440784454345703, "global_step": 364507, "epoch": 2169} {"train_loss": -12.244590759277344, "global_step": 364508, "epoch": 2169} {"train_loss": -11.683881759643555, "global_step": 364509, "epoch": 2169} {"train_loss": -11.732172012329102, "global_step": 364510, "epoch": 2169} {"train_loss": -12.253965377807617, "global_step": 364511, "epoch": 2169} {"train_loss": -11.330049514770508, "global_step": 364512, "epoch": 2169} {"train_loss": -12.214229583740234, "global_step": 364513, "epoch": 2169} {"train_loss": -11.799026489257812, "global_step": 364514, "epoch": 2169} {"train_loss": -11.686751365661621, "global_step": 364515, "epoch": 2169} {"train_loss": -12.280489921569824, "global_step": 364516, "epoch": 2169} {"train_loss": -11.780159950256348, "global_step": 364517, "epoch": 2169} {"train_loss": -11.89604377746582, "global_step": 364518, "epoch": 2169} {"train_loss": -11.852304458618164, "global_step": 364519, "epoch": 2169} {"train_loss": -11.331757545471191, "global_step": 364520, "epoch": 2169} {"train_loss": -12.243788719177246, "global_step": 364521, "epoch": 2169} {"train_loss": -11.388887405395508, "global_step": 364522, "epoch": 2169} {"train_loss": -10.831121444702148, "global_step": 364523, "epoch": 2169} {"train_loss": -10.609103202819824, "global_step": 364524, "epoch": 2169} {"train_loss": -9.006874084472656, "global_step": 364525, "epoch": 2169} {"train_loss": -10.378623962402344, "global_step": 364526, "epoch": 2169} {"train_loss": -10.778852462768555, "global_step": 364527, "epoch": 2169} {"train_loss": -10.720053672790527, "global_step": 364528, "epoch": 2169} {"train_loss": -10.842265129089355, "global_step": 364529, "epoch": 2169} {"train_loss": -8.616203308105469, "global_step": 364530, "epoch": 2169} {"train_loss": -7.506001949310303, "global_step": 364531, "epoch": 2169} {"train_loss": -7.75538444519043, "global_step": 364532, "epoch": 2169} {"train_loss": -6.803487777709961, "global_step": 364533, "epoch": 2169} {"train_loss": -7.299576759338379, "global_step": 364534, "epoch": 2169} {"train_loss": -7.731164932250977, "global_step": 364535, "epoch": 2169} {"train_loss": -8.354938507080078, "global_step": 364536, "epoch": 2169} {"train_loss": -8.484375, "global_step": 364537, "epoch": 2169} {"train_loss": -8.791109085083008, "global_step": 364538, "epoch": 2169} {"train_loss": -9.633484840393066, "global_step": 364539, "epoch": 2169} {"train_loss": -9.74502182006836, "global_step": 364540, "epoch": 2169} {"train_loss": -9.289202690124512, "global_step": 364541, "epoch": 2169} {"train_loss": -9.914619445800781, "global_step": 364542, "epoch": 2169} {"train_loss": -10.397958755493164, "global_step": 364543, "epoch": 2169} {"train_loss": -11.070882797241211, "global_step": 364544, "epoch": 2169} {"train_loss": -11.171466827392578, "global_step": 364545, "epoch": 2169} {"train_loss": -11.125223159790039, "global_step": 364546, "epoch": 2169} {"train_loss": -10.86841869354248, "global_step": 364547, "epoch": 2169} {"train_loss": -10.76772689819336, "global_step": 364548, "epoch": 2169} {"train_loss": -11.024181365966797, "global_step": 364549, "epoch": 2169} {"train_loss": -11.028026580810547, "global_step": 364550, "epoch": 2169} {"train_loss": -10.793098449707031, "global_step": 364551, "epoch": 2169} {"train_loss": -11.09695053100586, "global_step": 364552, "epoch": 2169} {"train_loss": -10.576217651367188, "global_step": 364553, "epoch": 2169} {"train_loss": -11.369523048400879, "global_step": 364554, "epoch": 2169} {"train_loss": -10.335887908935547, "global_step": 364555, "epoch": 2169} {"train_loss": -11.554529190063477, "global_step": 364556, "epoch": 2169} {"train_loss": -11.310517311096191, "global_step": 364557, "epoch": 2169} {"train_loss": -11.356157302856445, "global_step": 364558, "epoch": 2169} {"train_loss": -11.567665392444248, "global_step": 364559, "epoch": 2169, "val_loss": 295017.84375} {"train_loss": -11.976469039916992, "global_step": 364560, "epoch": 2170} {"train_loss": -11.399576187133789, "global_step": 364561, "epoch": 2170} {"train_loss": -11.850409507751465, "global_step": 364562, "epoch": 2170} {"train_loss": -11.176572799682617, "global_step": 364563, "epoch": 2170} {"train_loss": -11.74921989440918, "global_step": 364564, "epoch": 2170} {"train_loss": -11.252897262573242, "global_step": 364565, "epoch": 2170} {"train_loss": -11.800130844116211, "global_step": 364566, "epoch": 2170} {"train_loss": -11.602595329284668, "global_step": 364567, "epoch": 2170} {"train_loss": -11.942161560058594, "global_step": 364568, "epoch": 2170} {"train_loss": -12.000553131103516, "global_step": 364569, "epoch": 2170} {"train_loss": -11.64982795715332, "global_step": 364570, "epoch": 2170} {"train_loss": -11.809042930603027, "global_step": 364571, "epoch": 2170} {"train_loss": -11.454042434692383, "global_step": 364572, "epoch": 2170} {"train_loss": -12.23436164855957, "global_step": 364573, "epoch": 2170} {"train_loss": -11.594087600708008, "global_step": 364574, "epoch": 2170} {"train_loss": -11.99058723449707, "global_step": 364575, "epoch": 2170} {"train_loss": -11.86585521697998, "global_step": 364576, "epoch": 2170} {"train_loss": -12.150063514709473, "global_step": 364577, "epoch": 2170} {"train_loss": -11.753236770629883, "global_step": 364578, "epoch": 2170} {"train_loss": -12.203727722167969, "global_step": 364579, "epoch": 2170} {"train_loss": -11.713747024536133, "global_step": 364580, "epoch": 2170} {"train_loss": -12.210077285766602, "global_step": 364581, "epoch": 2170} {"train_loss": -11.998936653137207, "global_step": 364582, "epoch": 2170} {"train_loss": -12.187664985656738, "global_step": 364583, "epoch": 2170} {"train_loss": -12.076251983642578, "global_step": 364584, "epoch": 2170} {"train_loss": -12.149238586425781, "global_step": 364585, "epoch": 2170} {"train_loss": -12.158052444458008, "global_step": 364586, "epoch": 2170} {"train_loss": -12.155744552612305, "global_step": 364587, "epoch": 2170} {"train_loss": -12.0720796585083, "global_step": 364588, "epoch": 2170} {"train_loss": -12.186241149902344, "global_step": 364589, "epoch": 2170} {"train_loss": -12.157254219055176, "global_step": 364590, "epoch": 2170} {"train_loss": -12.222190856933594, "global_step": 364591, "epoch": 2170} {"train_loss": -12.248934745788574, "global_step": 364592, "epoch": 2170} {"train_loss": -12.245338439941406, "global_step": 364593, "epoch": 2170} {"train_loss": -12.069868087768555, "global_step": 364594, "epoch": 2170} {"train_loss": -12.227574348449707, "global_step": 364595, "epoch": 2170} {"train_loss": -11.978007316589355, "global_step": 364596, "epoch": 2170} {"train_loss": -12.07640552520752, "global_step": 364597, "epoch": 2170} {"train_loss": -12.076431274414062, "global_step": 364598, "epoch": 2170} {"train_loss": -12.380033493041992, "global_step": 364599, "epoch": 2170} {"train_loss": -11.960058212280273, "global_step": 364600, "epoch": 2170} {"train_loss": -12.362398147583008, "global_step": 364601, "epoch": 2170} {"train_loss": -11.849968910217285, "global_step": 364602, "epoch": 2170} {"train_loss": -12.300793647766113, "global_step": 364603, "epoch": 2170} {"train_loss": -12.152915954589844, "global_step": 364604, "epoch": 2170} {"train_loss": -12.301801681518555, "global_step": 364605, "epoch": 2170} {"train_loss": -12.102981567382812, "global_step": 364606, "epoch": 2170} {"train_loss": -12.093430519104004, "global_step": 364607, "epoch": 2170} {"train_loss": -12.227596282958984, "global_step": 364608, "epoch": 2170} {"train_loss": -12.230941772460938, "global_step": 364609, "epoch": 2170} {"train_loss": -12.178611755371094, "global_step": 364610, "epoch": 2170} {"train_loss": -11.974752426147461, "global_step": 364611, "epoch": 2170} {"train_loss": -12.197663307189941, "global_step": 364612, "epoch": 2170} {"train_loss": -12.147747039794922, "global_step": 364613, "epoch": 2170} {"train_loss": -12.101486206054688, "global_step": 364614, "epoch": 2170} {"train_loss": -12.130285263061523, "global_step": 364615, "epoch": 2170} {"train_loss": -12.00343132019043, "global_step": 364616, "epoch": 2170} {"train_loss": -12.035588264465332, "global_step": 364617, "epoch": 2170} {"train_loss": -11.882826805114746, "global_step": 364618, "epoch": 2170} {"train_loss": -12.136805534362793, "global_step": 364619, "epoch": 2170} {"train_loss": -12.19229793548584, "global_step": 364620, "epoch": 2170} {"train_loss": -11.946351051330566, "global_step": 364621, "epoch": 2170} {"train_loss": -12.43538761138916, "global_step": 364622, "epoch": 2170} {"train_loss": -12.296210289001465, "global_step": 364623, "epoch": 2170} {"train_loss": -12.406505584716797, "global_step": 364624, "epoch": 2170} {"train_loss": -12.17698860168457, "global_step": 364625, "epoch": 2170} {"train_loss": -11.906414031982422, "global_step": 364626, "epoch": 2170} {"train_loss": -11.729464530944824, "global_step": 364627, "epoch": 2170} {"train_loss": -12.39338493347168, "global_step": 364628, "epoch": 2170} {"train_loss": -11.882412910461426, "global_step": 364629, "epoch": 2170} {"train_loss": -12.12024974822998, "global_step": 364630, "epoch": 2170} {"train_loss": -12.196699142456055, "global_step": 364631, "epoch": 2170} {"train_loss": -12.215536117553711, "global_step": 364632, "epoch": 2170} {"train_loss": -12.194518089294434, "global_step": 364633, "epoch": 2170} {"train_loss": -12.365062713623047, "global_step": 364634, "epoch": 2170} {"train_loss": -11.664145469665527, "global_step": 364635, "epoch": 2170} {"train_loss": -12.244989395141602, "global_step": 364636, "epoch": 2170} {"train_loss": -12.450664520263672, "global_step": 364637, "epoch": 2170} {"train_loss": -12.058618545532227, "global_step": 364638, "epoch": 2170} {"train_loss": -11.720767974853516, "global_step": 364639, "epoch": 2170} {"train_loss": -12.30134391784668, "global_step": 364640, "epoch": 2170} {"train_loss": -11.824837684631348, "global_step": 364641, "epoch": 2170} {"train_loss": -11.849796295166016, "global_step": 364642, "epoch": 2170} {"train_loss": -11.500311851501465, "global_step": 364643, "epoch": 2170} {"train_loss": -11.530569076538086, "global_step": 364644, "epoch": 2170} {"train_loss": -11.806607246398926, "global_step": 364645, "epoch": 2170} {"train_loss": -11.358805656433105, "global_step": 364646, "epoch": 2170} {"train_loss": -11.356106758117676, "global_step": 364647, "epoch": 2170} {"train_loss": -12.323347091674805, "global_step": 364648, "epoch": 2170} {"train_loss": -11.421281814575195, "global_step": 364649, "epoch": 2170} {"train_loss": -12.030847549438477, "global_step": 364650, "epoch": 2170} {"train_loss": -12.093694686889648, "global_step": 364651, "epoch": 2170} {"train_loss": -12.073162078857422, "global_step": 364652, "epoch": 2170} {"train_loss": -11.844908714294434, "global_step": 364653, "epoch": 2170} {"train_loss": -12.211423873901367, "global_step": 364654, "epoch": 2170} {"train_loss": -12.269659042358398, "global_step": 364655, "epoch": 2170} {"train_loss": -12.109763145446777, "global_step": 364656, "epoch": 2170} {"train_loss": -12.000246047973633, "global_step": 364657, "epoch": 2170} {"train_loss": -11.894445419311523, "global_step": 364658, "epoch": 2170} {"train_loss": -11.922414779663086, "global_step": 364659, "epoch": 2170} {"train_loss": -12.138229370117188, "global_step": 364660, "epoch": 2170} {"train_loss": -12.280792236328125, "global_step": 364661, "epoch": 2170} {"train_loss": -11.233257293701172, "global_step": 364662, "epoch": 2170} {"train_loss": -11.328445434570312, "global_step": 364663, "epoch": 2170} {"train_loss": -12.316454887390137, "global_step": 364664, "epoch": 2170} {"train_loss": -11.93476676940918, "global_step": 364665, "epoch": 2170} {"train_loss": -12.204444885253906, "global_step": 364666, "epoch": 2170} {"train_loss": -11.779515266418457, "global_step": 364667, "epoch": 2170} {"train_loss": -12.160555839538574, "global_step": 364668, "epoch": 2170} {"train_loss": -12.062588691711426, "global_step": 364669, "epoch": 2170} {"train_loss": -11.972624778747559, "global_step": 364670, "epoch": 2170} {"train_loss": -12.168126106262207, "global_step": 364671, "epoch": 2170} {"train_loss": -12.187047004699707, "global_step": 364672, "epoch": 2170} {"train_loss": -11.940605163574219, "global_step": 364673, "epoch": 2170} {"train_loss": -12.147130966186523, "global_step": 364674, "epoch": 2170} {"train_loss": -11.768028259277344, "global_step": 364675, "epoch": 2170} {"train_loss": -11.786840438842773, "global_step": 364676, "epoch": 2170} {"train_loss": -11.779661178588867, "global_step": 364677, "epoch": 2170} {"train_loss": -12.117788314819336, "global_step": 364678, "epoch": 2170} {"train_loss": -12.326183319091797, "global_step": 364679, "epoch": 2170} {"train_loss": -12.160829544067383, "global_step": 364680, "epoch": 2170} {"train_loss": -12.344295501708984, "global_step": 364681, "epoch": 2170} {"train_loss": -11.861604690551758, "global_step": 364682, "epoch": 2170} {"train_loss": -12.26992416381836, "global_step": 364683, "epoch": 2170} {"train_loss": -12.138128280639648, "global_step": 364684, "epoch": 2170} {"train_loss": -11.844175338745117, "global_step": 364685, "epoch": 2170} {"train_loss": -12.490747451782227, "global_step": 364686, "epoch": 2170} {"train_loss": -11.994163513183594, "global_step": 364687, "epoch": 2170} {"train_loss": -11.786699295043945, "global_step": 364688, "epoch": 2170} {"train_loss": -12.42484188079834, "global_step": 364689, "epoch": 2170} {"train_loss": -12.02115249633789, "global_step": 364690, "epoch": 2170} {"train_loss": -11.55249309539795, "global_step": 364691, "epoch": 2170} {"train_loss": -12.185912132263184, "global_step": 364692, "epoch": 2170} {"train_loss": -12.235113143920898, "global_step": 364693, "epoch": 2170} {"train_loss": -11.874727249145508, "global_step": 364694, "epoch": 2170} {"train_loss": -11.142318725585938, "global_step": 364695, "epoch": 2170} {"train_loss": -12.476762771606445, "global_step": 364696, "epoch": 2170} {"train_loss": -11.5316162109375, "global_step": 364697, "epoch": 2170} {"train_loss": -12.19754695892334, "global_step": 364698, "epoch": 2170} {"train_loss": -11.287702560424805, "global_step": 364699, "epoch": 2170} {"train_loss": -11.313169479370117, "global_step": 364700, "epoch": 2170} {"train_loss": -11.752386093139648, "global_step": 364701, "epoch": 2170} {"train_loss": -11.946040153503418, "global_step": 364702, "epoch": 2170} {"train_loss": -11.521696090698242, "global_step": 364703, "epoch": 2170} {"train_loss": -12.073044776916504, "global_step": 364704, "epoch": 2170} {"train_loss": -11.810871124267578, "global_step": 364705, "epoch": 2170} {"train_loss": -11.428947448730469, "global_step": 364706, "epoch": 2170} {"train_loss": -12.388503074645996, "global_step": 364707, "epoch": 2170} {"train_loss": -11.789592742919922, "global_step": 364708, "epoch": 2170} {"train_loss": -12.233291625976562, "global_step": 364709, "epoch": 2170} {"train_loss": -12.06629753112793, "global_step": 364710, "epoch": 2170} {"train_loss": -12.196674346923828, "global_step": 364711, "epoch": 2170} {"train_loss": -12.308589935302734, "global_step": 364712, "epoch": 2170} {"train_loss": -12.174989700317383, "global_step": 364713, "epoch": 2170} {"train_loss": -12.26702880859375, "global_step": 364714, "epoch": 2170} {"train_loss": -12.244306564331055, "global_step": 364715, "epoch": 2170} {"train_loss": -12.36005973815918, "global_step": 364716, "epoch": 2170} {"train_loss": -12.359066009521484, "global_step": 364717, "epoch": 2170} {"train_loss": -12.404499053955078, "global_step": 364718, "epoch": 2170} {"train_loss": -11.78734016418457, "global_step": 364719, "epoch": 2170} {"train_loss": -11.980764389038086, "global_step": 364720, "epoch": 2170} {"train_loss": -12.286653518676758, "global_step": 364721, "epoch": 2170} {"train_loss": -12.249587059020996, "global_step": 364722, "epoch": 2170} {"train_loss": -12.001649856567383, "global_step": 364723, "epoch": 2170} {"train_loss": -12.432448387145996, "global_step": 364724, "epoch": 2170} {"train_loss": -12.301880836486816, "global_step": 364725, "epoch": 2170} {"train_loss": -12.331844329833984, "global_step": 364726, "epoch": 2170} {"train_loss": -12.014179184323265, "global_step": 364727, "epoch": 2170, "val_loss": 289170.9375, "train_action_mse_error": 7.318881034851074} {"train_loss": -12.322854995727539, "global_step": 364728, "epoch": 2171} {"train_loss": -12.421335220336914, "global_step": 364729, "epoch": 2171} {"train_loss": -12.285083770751953, "global_step": 364730, "epoch": 2171} {"train_loss": -12.363044738769531, "global_step": 364731, "epoch": 2171} {"train_loss": -11.993399620056152, "global_step": 364732, "epoch": 2171} {"train_loss": -12.453539848327637, "global_step": 364733, "epoch": 2171} {"train_loss": -12.349242210388184, "global_step": 364734, "epoch": 2171} {"train_loss": -11.564931869506836, "global_step": 364735, "epoch": 2171} {"train_loss": -11.655221939086914, "global_step": 364736, "epoch": 2171} {"train_loss": -12.522704124450684, "global_step": 364737, "epoch": 2171} {"train_loss": -11.166482925415039, "global_step": 364738, "epoch": 2171} {"train_loss": -11.660359382629395, "global_step": 364739, "epoch": 2171} {"train_loss": -12.016672134399414, "global_step": 364740, "epoch": 2171} {"train_loss": -11.340557098388672, "global_step": 364741, "epoch": 2171} {"train_loss": -11.269163131713867, "global_step": 364742, "epoch": 2171} {"train_loss": -11.921525955200195, "global_step": 364743, "epoch": 2171} {"train_loss": -12.226598739624023, "global_step": 364744, "epoch": 2171} {"train_loss": -11.784829139709473, "global_step": 364745, "epoch": 2171} {"train_loss": -12.102357864379883, "global_step": 364746, "epoch": 2171} {"train_loss": -12.237269401550293, "global_step": 364747, "epoch": 2171} {"train_loss": -11.868412017822266, "global_step": 364748, "epoch": 2171} {"train_loss": -12.385213851928711, "global_step": 364749, "epoch": 2171} {"train_loss": -11.604097366333008, "global_step": 364750, "epoch": 2171} {"train_loss": -11.812030792236328, "global_step": 364751, "epoch": 2171} {"train_loss": -11.922225952148438, "global_step": 364752, "epoch": 2171} {"train_loss": -11.725674629211426, "global_step": 364753, "epoch": 2171} {"train_loss": -12.212099075317383, "global_step": 364754, "epoch": 2171} {"train_loss": -11.807435989379883, "global_step": 364755, "epoch": 2171} {"train_loss": -12.183013916015625, "global_step": 364756, "epoch": 2171} {"train_loss": -12.276260375976562, "global_step": 364757, "epoch": 2171} {"train_loss": -11.865013122558594, "global_step": 364758, "epoch": 2171} {"train_loss": -11.800271987915039, "global_step": 364759, "epoch": 2171} {"train_loss": -12.301730155944824, "global_step": 364760, "epoch": 2171} {"train_loss": -11.872172355651855, "global_step": 364761, "epoch": 2171} {"train_loss": -12.417282104492188, "global_step": 364762, "epoch": 2171} {"train_loss": -12.03138542175293, "global_step": 364763, "epoch": 2171} {"train_loss": -12.04386043548584, "global_step": 364764, "epoch": 2171} {"train_loss": -11.433511734008789, "global_step": 364765, "epoch": 2171} {"train_loss": -10.868590354919434, "global_step": 364766, "epoch": 2171} {"train_loss": -10.109304428100586, "global_step": 364767, "epoch": 2171} {"train_loss": -9.003045082092285, "global_step": 364768, "epoch": 2171} {"train_loss": -10.461593627929688, "global_step": 364769, "epoch": 2171} {"train_loss": -9.107437133789062, "global_step": 364770, "epoch": 2171} {"train_loss": -9.289012908935547, "global_step": 364771, "epoch": 2171} {"train_loss": -8.664716720581055, "global_step": 364772, "epoch": 2171} {"train_loss": -8.965858459472656, "global_step": 364773, "epoch": 2171} {"train_loss": -9.462224960327148, "global_step": 364774, "epoch": 2171} {"train_loss": -7.422948837280273, "global_step": 364775, "epoch": 2171} {"train_loss": -8.06823444366455, "global_step": 364776, "epoch": 2171} {"train_loss": -10.494068145751953, "global_step": 364777, "epoch": 2171} {"train_loss": -8.018457412719727, "global_step": 364778, "epoch": 2171} {"train_loss": -8.877117156982422, "global_step": 364779, "epoch": 2171} {"train_loss": -8.890368461608887, "global_step": 364780, "epoch": 2171} {"train_loss": -9.493420600891113, "global_step": 364781, "epoch": 2171} {"train_loss": -9.43005084991455, "global_step": 364782, "epoch": 2171} {"train_loss": -9.847402572631836, "global_step": 364783, "epoch": 2171} {"train_loss": -10.553443908691406, "global_step": 364784, "epoch": 2171} {"train_loss": -9.50075912475586, "global_step": 364785, "epoch": 2171} {"train_loss": -10.48740005493164, "global_step": 364786, "epoch": 2171} {"train_loss": -10.660711288452148, "global_step": 364787, "epoch": 2171} {"train_loss": -10.354509353637695, "global_step": 364788, "epoch": 2171} {"train_loss": -11.147015571594238, "global_step": 364789, "epoch": 2171} {"train_loss": -10.45512580871582, "global_step": 364790, "epoch": 2171} {"train_loss": -11.04750919342041, "global_step": 364791, "epoch": 2171} {"train_loss": -10.756000518798828, "global_step": 364792, "epoch": 2171} {"train_loss": -10.86474895477295, "global_step": 364793, "epoch": 2171} {"train_loss": -11.19000244140625, "global_step": 364794, "epoch": 2171} {"train_loss": -11.042856216430664, "global_step": 364795, "epoch": 2171} {"train_loss": -10.355640411376953, "global_step": 364796, "epoch": 2171} {"train_loss": -11.280078887939453, "global_step": 364797, "epoch": 2171} {"train_loss": -11.076593399047852, "global_step": 364798, "epoch": 2171} {"train_loss": -10.97526741027832, "global_step": 364799, "epoch": 2171} {"train_loss": -11.662044525146484, "global_step": 364800, "epoch": 2171} {"train_loss": -10.971572875976562, "global_step": 364801, "epoch": 2171} {"train_loss": -11.445439338684082, "global_step": 364802, "epoch": 2171} {"train_loss": -11.204063415527344, "global_step": 364803, "epoch": 2171} {"train_loss": -11.22608757019043, "global_step": 364804, "epoch": 2171} {"train_loss": -11.138471603393555, "global_step": 364805, "epoch": 2171} {"train_loss": -11.446798324584961, "global_step": 364806, "epoch": 2171} {"train_loss": -11.490549087524414, "global_step": 364807, "epoch": 2171} {"train_loss": -11.31263542175293, "global_step": 364808, "epoch": 2171} {"train_loss": -11.863506317138672, "global_step": 364809, "epoch": 2171} {"train_loss": -11.44084358215332, "global_step": 364810, "epoch": 2171} {"train_loss": -11.732135772705078, "global_step": 364811, "epoch": 2171} {"train_loss": -11.934356689453125, "global_step": 364812, "epoch": 2171} {"train_loss": -11.792840003967285, "global_step": 364813, "epoch": 2171} {"train_loss": -11.80217456817627, "global_step": 364814, "epoch": 2171} {"train_loss": -11.79607105255127, "global_step": 364815, "epoch": 2171} {"train_loss": -12.088970184326172, "global_step": 364816, "epoch": 2171} {"train_loss": -12.003164291381836, "global_step": 364817, "epoch": 2171} {"train_loss": -11.92014217376709, "global_step": 364818, "epoch": 2171} {"train_loss": -11.98574447631836, "global_step": 364819, "epoch": 2171} {"train_loss": -12.008318901062012, "global_step": 364820, "epoch": 2171} {"train_loss": -12.298283576965332, "global_step": 364821, "epoch": 2171} {"train_loss": -12.116695404052734, "global_step": 364822, "epoch": 2171} {"train_loss": -12.184388160705566, "global_step": 364823, "epoch": 2171} {"train_loss": -11.727090835571289, "global_step": 364824, "epoch": 2171} {"train_loss": -12.135791778564453, "global_step": 364825, "epoch": 2171} {"train_loss": -12.3034086227417, "global_step": 364826, "epoch": 2171} {"train_loss": -12.18551254272461, "global_step": 364827, "epoch": 2171} {"train_loss": -12.073166847229004, "global_step": 364828, "epoch": 2171} {"train_loss": -12.223091125488281, "global_step": 364829, "epoch": 2171} {"train_loss": -12.238639831542969, "global_step": 364830, "epoch": 2171} {"train_loss": -12.388114929199219, "global_step": 364831, "epoch": 2171} {"train_loss": -12.212807655334473, "global_step": 364832, "epoch": 2171} {"train_loss": -12.043756484985352, "global_step": 364833, "epoch": 2171} {"train_loss": -12.251304626464844, "global_step": 364834, "epoch": 2171} {"train_loss": -12.38538932800293, "global_step": 364835, "epoch": 2171} {"train_loss": -12.083335876464844, "global_step": 364836, "epoch": 2171} {"train_loss": -12.226542472839355, "global_step": 364837, "epoch": 2171} {"train_loss": -12.134981155395508, "global_step": 364838, "epoch": 2171} {"train_loss": -12.29345417022705, "global_step": 364839, "epoch": 2171} {"train_loss": -12.43214225769043, "global_step": 364840, "epoch": 2171} {"train_loss": -12.585115432739258, "global_step": 364841, "epoch": 2171} {"train_loss": -12.391746520996094, "global_step": 364842, "epoch": 2171} {"train_loss": -12.203731536865234, "global_step": 364843, "epoch": 2171} {"train_loss": -12.317842483520508, "global_step": 364844, "epoch": 2171} {"train_loss": -12.329153060913086, "global_step": 364845, "epoch": 2171} {"train_loss": -12.323101043701172, "global_step": 364846, "epoch": 2171} {"train_loss": -12.146808624267578, "global_step": 364847, "epoch": 2171} {"train_loss": -12.389047622680664, "global_step": 364848, "epoch": 2171} {"train_loss": -12.3646240234375, "global_step": 364849, "epoch": 2171} {"train_loss": -12.305107116699219, "global_step": 364850, "epoch": 2171} {"train_loss": -12.107512474060059, "global_step": 364851, "epoch": 2171} {"train_loss": -12.40053939819336, "global_step": 364852, "epoch": 2171} {"train_loss": -12.534412384033203, "global_step": 364853, "epoch": 2171} {"train_loss": -12.432119369506836, "global_step": 364854, "epoch": 2171} {"train_loss": -12.54643726348877, "global_step": 364855, "epoch": 2171} {"train_loss": -12.376190185546875, "global_step": 364856, "epoch": 2171} {"train_loss": -12.448360443115234, "global_step": 364857, "epoch": 2171} {"train_loss": -12.512619018554688, "global_step": 364858, "epoch": 2171} {"train_loss": -12.335128784179688, "global_step": 364859, "epoch": 2171} {"train_loss": -12.538470268249512, "global_step": 364860, "epoch": 2171} {"train_loss": -12.331369400024414, "global_step": 364861, "epoch": 2171} {"train_loss": -12.410930633544922, "global_step": 364862, "epoch": 2171} {"train_loss": -12.3297119140625, "global_step": 364863, "epoch": 2171} {"train_loss": -12.49606990814209, "global_step": 364864, "epoch": 2171} {"train_loss": -12.25442123413086, "global_step": 364865, "epoch": 2171} {"train_loss": -12.54422664642334, "global_step": 364866, "epoch": 2171} {"train_loss": -12.220796585083008, "global_step": 364867, "epoch": 2171} {"train_loss": -12.446910858154297, "global_step": 364868, "epoch": 2171} {"train_loss": -12.178114891052246, "global_step": 364869, "epoch": 2171} {"train_loss": -12.497376441955566, "global_step": 364870, "epoch": 2171} {"train_loss": -12.305418968200684, "global_step": 364871, "epoch": 2171} {"train_loss": -12.357919692993164, "global_step": 364872, "epoch": 2171} {"train_loss": -12.593328475952148, "global_step": 364873, "epoch": 2171} {"train_loss": -12.44023323059082, "global_step": 364874, "epoch": 2171} {"train_loss": -12.61628532409668, "global_step": 364875, "epoch": 2171} {"train_loss": -12.162576675415039, "global_step": 364876, "epoch": 2171} {"train_loss": -12.53024673461914, "global_step": 364877, "epoch": 2171} {"train_loss": -12.551640510559082, "global_step": 364878, "epoch": 2171} {"train_loss": -12.379894256591797, "global_step": 364879, "epoch": 2171} {"train_loss": -12.435047149658203, "global_step": 364880, "epoch": 2171} {"train_loss": -12.422511100769043, "global_step": 364881, "epoch": 2171} {"train_loss": -12.405557632446289, "global_step": 364882, "epoch": 2171} {"train_loss": -12.515022277832031, "global_step": 364883, "epoch": 2171} {"train_loss": -12.278240203857422, "global_step": 364884, "epoch": 2171} {"train_loss": -12.42281723022461, "global_step": 364885, "epoch": 2171} {"train_loss": -12.45414924621582, "global_step": 364886, "epoch": 2171} {"train_loss": -11.861188888549805, "global_step": 364887, "epoch": 2171} {"train_loss": -12.017533302307129, "global_step": 364888, "epoch": 2171} {"train_loss": -11.6495361328125, "global_step": 364889, "epoch": 2171} {"train_loss": -12.052871704101562, "global_step": 364890, "epoch": 2171} {"train_loss": -12.1648530960083, "global_step": 364891, "epoch": 2171} {"train_loss": -12.645196914672852, "global_step": 364892, "epoch": 2171} {"train_loss": -12.037093162536621, "global_step": 364893, "epoch": 2171} {"train_loss": -12.062599182128906, "global_step": 364894, "epoch": 2171} {"train_loss": -11.669119692984081, "global_step": 364895, "epoch": 2171, "val_loss": 285154.21875} {"train_loss": -12.144828796386719, "global_step": 364896, "epoch": 2172} {"train_loss": -12.144567489624023, "global_step": 364897, "epoch": 2172} {"train_loss": -12.095001220703125, "global_step": 364898, "epoch": 2172} {"train_loss": -12.009839057922363, "global_step": 364899, "epoch": 2172} {"train_loss": -11.76004409790039, "global_step": 364900, "epoch": 2172} {"train_loss": -12.340896606445312, "global_step": 364901, "epoch": 2172} {"train_loss": -12.181235313415527, "global_step": 364902, "epoch": 2172} {"train_loss": -12.529557228088379, "global_step": 364903, "epoch": 2172} {"train_loss": -11.899895668029785, "global_step": 364904, "epoch": 2172} {"train_loss": -11.771987915039062, "global_step": 364905, "epoch": 2172} {"train_loss": -12.322257041931152, "global_step": 364906, "epoch": 2172} {"train_loss": -12.43367862701416, "global_step": 364907, "epoch": 2172} {"train_loss": -12.117240905761719, "global_step": 364908, "epoch": 2172} {"train_loss": -12.108892440795898, "global_step": 364909, "epoch": 2172} {"train_loss": -12.642784118652344, "global_step": 364910, "epoch": 2172} {"train_loss": -12.34135627746582, "global_step": 364911, "epoch": 2172} {"train_loss": -11.715556144714355, "global_step": 364912, "epoch": 2172} {"train_loss": -11.501668930053711, "global_step": 364913, "epoch": 2172} {"train_loss": -12.257733345031738, "global_step": 364914, "epoch": 2172} {"train_loss": -11.130468368530273, "global_step": 364915, "epoch": 2172} {"train_loss": -9.30185604095459, "global_step": 364916, "epoch": 2172} {"train_loss": -11.00071907043457, "global_step": 364917, "epoch": 2172} {"train_loss": -12.21958065032959, "global_step": 364918, "epoch": 2172} {"train_loss": -11.108405113220215, "global_step": 364919, "epoch": 2172} {"train_loss": -11.411853790283203, "global_step": 364920, "epoch": 2172} {"train_loss": -11.943714141845703, "global_step": 364921, "epoch": 2172} {"train_loss": -11.830659866333008, "global_step": 364922, "epoch": 2172} {"train_loss": -11.91215991973877, "global_step": 364923, "epoch": 2172} {"train_loss": -12.226818084716797, "global_step": 364924, "epoch": 2172} {"train_loss": -11.833110809326172, "global_step": 364925, "epoch": 2172} {"train_loss": -11.930007934570312, "global_step": 364926, "epoch": 2172} {"train_loss": -12.155595779418945, "global_step": 364927, "epoch": 2172} {"train_loss": -12.078770637512207, "global_step": 364928, "epoch": 2172} {"train_loss": -12.059110641479492, "global_step": 364929, "epoch": 2172} {"train_loss": -11.464353561401367, "global_step": 364930, "epoch": 2172} {"train_loss": -12.155089378356934, "global_step": 364931, "epoch": 2172} {"train_loss": -11.675426483154297, "global_step": 364932, "epoch": 2172} {"train_loss": -12.156251907348633, "global_step": 364933, "epoch": 2172} {"train_loss": -11.595014572143555, "global_step": 364934, "epoch": 2172} {"train_loss": -12.454670906066895, "global_step": 364935, "epoch": 2172} {"train_loss": -11.851314544677734, "global_step": 364936, "epoch": 2172} {"train_loss": -12.328960418701172, "global_step": 364937, "epoch": 2172} {"train_loss": -11.817193984985352, "global_step": 364938, "epoch": 2172} {"train_loss": -12.198719024658203, "global_step": 364939, "epoch": 2172} {"train_loss": -11.977001190185547, "global_step": 364940, "epoch": 2172} {"train_loss": -12.219616889953613, "global_step": 364941, "epoch": 2172} {"train_loss": -12.016277313232422, "global_step": 364942, "epoch": 2172} {"train_loss": -11.929727554321289, "global_step": 364943, "epoch": 2172} {"train_loss": -11.95848274230957, "global_step": 364944, "epoch": 2172} {"train_loss": -11.691274642944336, "global_step": 364945, "epoch": 2172} {"train_loss": -11.595438003540039, "global_step": 364946, "epoch": 2172} {"train_loss": -12.297860145568848, "global_step": 364947, "epoch": 2172} {"train_loss": -12.10848331451416, "global_step": 364948, "epoch": 2172} {"train_loss": -12.678199768066406, "global_step": 364949, "epoch": 2172} {"train_loss": -11.813796997070312, "global_step": 364950, "epoch": 2172} {"train_loss": -11.81667423248291, "global_step": 364951, "epoch": 2172} {"train_loss": -12.089282035827637, "global_step": 364952, "epoch": 2172} {"train_loss": -12.111085891723633, "global_step": 364953, "epoch": 2172} {"train_loss": -11.790546417236328, "global_step": 364954, "epoch": 2172} {"train_loss": -11.67808723449707, "global_step": 364955, "epoch": 2172} {"train_loss": -11.423467636108398, "global_step": 364956, "epoch": 2172} {"train_loss": -11.924144744873047, "global_step": 364957, "epoch": 2172} {"train_loss": -10.528329849243164, "global_step": 364958, "epoch": 2172} {"train_loss": -12.13745403289795, "global_step": 364959, "epoch": 2172} {"train_loss": -11.054335594177246, "global_step": 364960, "epoch": 2172} {"train_loss": -11.680229187011719, "global_step": 364961, "epoch": 2172} {"train_loss": -11.093374252319336, "global_step": 364962, "epoch": 2172} {"train_loss": -11.345483779907227, "global_step": 364963, "epoch": 2172} {"train_loss": -11.070028305053711, "global_step": 364964, "epoch": 2172} {"train_loss": -11.776029586791992, "global_step": 364965, "epoch": 2172} {"train_loss": -11.362857818603516, "global_step": 364966, "epoch": 2172} {"train_loss": -11.648428916931152, "global_step": 364967, "epoch": 2172} {"train_loss": -11.747894287109375, "global_step": 364968, "epoch": 2172} {"train_loss": -11.442066192626953, "global_step": 364969, "epoch": 2172} {"train_loss": -11.781170845031738, "global_step": 364970, "epoch": 2172} {"train_loss": -11.607389450073242, "global_step": 364971, "epoch": 2172} {"train_loss": -12.102925300598145, "global_step": 364972, "epoch": 2172} {"train_loss": -11.63945198059082, "global_step": 364973, "epoch": 2172} {"train_loss": -12.207540512084961, "global_step": 364974, "epoch": 2172} {"train_loss": -11.504364013671875, "global_step": 364975, "epoch": 2172} {"train_loss": -11.96151065826416, "global_step": 364976, "epoch": 2172} {"train_loss": -11.80019760131836, "global_step": 364977, "epoch": 2172} {"train_loss": -11.133864402770996, "global_step": 364978, "epoch": 2172} {"train_loss": -11.743236541748047, "global_step": 364979, "epoch": 2172} {"train_loss": -11.619647979736328, "global_step": 364980, "epoch": 2172} {"train_loss": -11.72187328338623, "global_step": 364981, "epoch": 2172} {"train_loss": -11.689043045043945, "global_step": 364982, "epoch": 2172} {"train_loss": -11.677530288696289, "global_step": 364983, "epoch": 2172} {"train_loss": -11.760591506958008, "global_step": 364984, "epoch": 2172} {"train_loss": -11.66004467010498, "global_step": 364985, "epoch": 2172} {"train_loss": -11.556806564331055, "global_step": 364986, "epoch": 2172} {"train_loss": -12.017244338989258, "global_step": 364987, "epoch": 2172} {"train_loss": -11.525050163269043, "global_step": 364988, "epoch": 2172} {"train_loss": -11.783506393432617, "global_step": 364989, "epoch": 2172} {"train_loss": -11.401028633117676, "global_step": 364990, "epoch": 2172} {"train_loss": -12.010858535766602, "global_step": 364991, "epoch": 2172} {"train_loss": -12.13466739654541, "global_step": 364992, "epoch": 2172} {"train_loss": -11.695577621459961, "global_step": 364993, "epoch": 2172} {"train_loss": -12.057516098022461, "global_step": 364994, "epoch": 2172} {"train_loss": -12.114753723144531, "global_step": 364995, "epoch": 2172} {"train_loss": -11.9544095993042, "global_step": 364996, "epoch": 2172} {"train_loss": -12.24019718170166, "global_step": 364997, "epoch": 2172} {"train_loss": -12.030037879943848, "global_step": 364998, "epoch": 2172} {"train_loss": -12.045088768005371, "global_step": 364999, "epoch": 2172} {"train_loss": -12.35964584350586, "global_step": 365000, "epoch": 2172} {"train_loss": -12.067806243896484, "global_step": 365001, "epoch": 2172} {"train_loss": -12.195379257202148, "global_step": 365002, "epoch": 2172} {"train_loss": -12.017725944519043, "global_step": 365003, "epoch": 2172} {"train_loss": -12.021886825561523, "global_step": 365004, "epoch": 2172} {"train_loss": -12.349557876586914, "global_step": 365005, "epoch": 2172} {"train_loss": -12.337322235107422, "global_step": 365006, "epoch": 2172} {"train_loss": -12.387868881225586, "global_step": 365007, "epoch": 2172} {"train_loss": -12.303430557250977, "global_step": 365008, "epoch": 2172} {"train_loss": -12.378142356872559, "global_step": 365009, "epoch": 2172} {"train_loss": -12.498255729675293, "global_step": 365010, "epoch": 2172} {"train_loss": -12.35287094116211, "global_step": 365011, "epoch": 2172} {"train_loss": -12.406187057495117, "global_step": 365012, "epoch": 2172} {"train_loss": -12.048291206359863, "global_step": 365013, "epoch": 2172} {"train_loss": -12.478778839111328, "global_step": 365014, "epoch": 2172} {"train_loss": -12.316628456115723, "global_step": 365015, "epoch": 2172} {"train_loss": -12.097339630126953, "global_step": 365016, "epoch": 2172} {"train_loss": -12.37497329711914, "global_step": 365017, "epoch": 2172} {"train_loss": -12.526375770568848, "global_step": 365018, "epoch": 2172} {"train_loss": -12.188130378723145, "global_step": 365019, "epoch": 2172} {"train_loss": -12.47766399383545, "global_step": 365020, "epoch": 2172} {"train_loss": -12.39093017578125, "global_step": 365021, "epoch": 2172} {"train_loss": -12.310593605041504, "global_step": 365022, "epoch": 2172} {"train_loss": -12.174360275268555, "global_step": 365023, "epoch": 2172} {"train_loss": -12.589070320129395, "global_step": 365024, "epoch": 2172} {"train_loss": -12.505928039550781, "global_step": 365025, "epoch": 2172} {"train_loss": -12.313405990600586, "global_step": 365026, "epoch": 2172} {"train_loss": -12.48486328125, "global_step": 365027, "epoch": 2172} {"train_loss": -12.361480712890625, "global_step": 365028, "epoch": 2172} {"train_loss": -12.477851867675781, "global_step": 365029, "epoch": 2172} {"train_loss": -12.066811561584473, "global_step": 365030, "epoch": 2172} {"train_loss": -12.756383895874023, "global_step": 365031, "epoch": 2172} {"train_loss": -12.385334968566895, "global_step": 365032, "epoch": 2172} {"train_loss": -11.890572547912598, "global_step": 365033, "epoch": 2172} {"train_loss": -12.45048713684082, "global_step": 365034, "epoch": 2172} {"train_loss": -12.146549224853516, "global_step": 365035, "epoch": 2172} {"train_loss": -11.885292053222656, "global_step": 365036, "epoch": 2172} {"train_loss": -12.258403778076172, "global_step": 365037, "epoch": 2172} {"train_loss": -12.318531036376953, "global_step": 365038, "epoch": 2172} {"train_loss": -12.190567016601562, "global_step": 365039, "epoch": 2172} {"train_loss": -11.44931411743164, "global_step": 365040, "epoch": 2172} {"train_loss": -11.945117950439453, "global_step": 365041, "epoch": 2172} {"train_loss": -12.444424629211426, "global_step": 365042, "epoch": 2172} {"train_loss": -12.250423431396484, "global_step": 365043, "epoch": 2172} {"train_loss": -11.69328784942627, "global_step": 365044, "epoch": 2172} {"train_loss": -12.383552551269531, "global_step": 365045, "epoch": 2172} {"train_loss": -12.310894012451172, "global_step": 365046, "epoch": 2172} {"train_loss": -12.226457595825195, "global_step": 365047, "epoch": 2172} {"train_loss": -11.611868858337402, "global_step": 365048, "epoch": 2172} {"train_loss": -11.933337211608887, "global_step": 365049, "epoch": 2172} {"train_loss": -11.856680870056152, "global_step": 365050, "epoch": 2172} {"train_loss": -12.100042343139648, "global_step": 365051, "epoch": 2172} {"train_loss": -12.417322158813477, "global_step": 365052, "epoch": 2172} {"train_loss": -11.913579940795898, "global_step": 365053, "epoch": 2172} {"train_loss": -11.798582077026367, "global_step": 365054, "epoch": 2172} {"train_loss": -12.012055397033691, "global_step": 365055, "epoch": 2172} {"train_loss": -12.194549560546875, "global_step": 365056, "epoch": 2172} {"train_loss": -12.16677474975586, "global_step": 365057, "epoch": 2172} {"train_loss": -12.408448219299316, "global_step": 365058, "epoch": 2172} {"train_loss": -11.864891052246094, "global_step": 365059, "epoch": 2172} {"train_loss": -12.473824501037598, "global_step": 365060, "epoch": 2172} {"train_loss": -12.07741928100586, "global_step": 365061, "epoch": 2172} {"train_loss": -11.972780227661133, "global_step": 365062, "epoch": 2172} {"train_loss": -11.974429039728074, "global_step": 365063, "epoch": 2172, "val_loss": 289872.53125} {"train_loss": -12.08841323852539, "global_step": 365064, "epoch": 2173} {"train_loss": -11.994000434875488, "global_step": 365065, "epoch": 2173} {"train_loss": -12.365553855895996, "global_step": 365066, "epoch": 2173} {"train_loss": -11.818285942077637, "global_step": 365067, "epoch": 2173} {"train_loss": -12.352399826049805, "global_step": 365068, "epoch": 2173} {"train_loss": -12.351207733154297, "global_step": 365069, "epoch": 2173} {"train_loss": -12.226689338684082, "global_step": 365070, "epoch": 2173} {"train_loss": -12.14576244354248, "global_step": 365071, "epoch": 2173} {"train_loss": -12.506958961486816, "global_step": 365072, "epoch": 2173} {"train_loss": -12.288177490234375, "global_step": 365073, "epoch": 2173} {"train_loss": -11.921422958374023, "global_step": 365074, "epoch": 2173} {"train_loss": -12.497318267822266, "global_step": 365075, "epoch": 2173} {"train_loss": -12.189131736755371, "global_step": 365076, "epoch": 2173} {"train_loss": -12.003265380859375, "global_step": 365077, "epoch": 2173} {"train_loss": -12.291927337646484, "global_step": 365078, "epoch": 2173} {"train_loss": -12.008956909179688, "global_step": 365079, "epoch": 2173} {"train_loss": -12.022961616516113, "global_step": 365080, "epoch": 2173} {"train_loss": -11.746179580688477, "global_step": 365081, "epoch": 2173} {"train_loss": -12.114082336425781, "global_step": 365082, "epoch": 2173} {"train_loss": -11.87326431274414, "global_step": 365083, "epoch": 2173} {"train_loss": -12.150199890136719, "global_step": 365084, "epoch": 2173} {"train_loss": -12.04327392578125, "global_step": 365085, "epoch": 2173} {"train_loss": -11.766939163208008, "global_step": 365086, "epoch": 2173} {"train_loss": -12.253131866455078, "global_step": 365087, "epoch": 2173} {"train_loss": -12.022205352783203, "global_step": 365088, "epoch": 2173} {"train_loss": -11.223654747009277, "global_step": 365089, "epoch": 2173} {"train_loss": -11.817023277282715, "global_step": 365090, "epoch": 2173} {"train_loss": -10.437511444091797, "global_step": 365091, "epoch": 2173} {"train_loss": -11.54245376586914, "global_step": 365092, "epoch": 2173} {"train_loss": -10.311452865600586, "global_step": 365093, "epoch": 2173} {"train_loss": -12.373610496520996, "global_step": 365094, "epoch": 2173} {"train_loss": -10.970023155212402, "global_step": 365095, "epoch": 2173} {"train_loss": -12.258176803588867, "global_step": 365096, "epoch": 2173} {"train_loss": -11.358663558959961, "global_step": 365097, "epoch": 2173} {"train_loss": -11.58081340789795, "global_step": 365098, "epoch": 2173} {"train_loss": -11.857227325439453, "global_step": 365099, "epoch": 2173} {"train_loss": -11.362858772277832, "global_step": 365100, "epoch": 2173} {"train_loss": -11.636630058288574, "global_step": 365101, "epoch": 2173} {"train_loss": -11.087331771850586, "global_step": 365102, "epoch": 2173} {"train_loss": -11.763138771057129, "global_step": 365103, "epoch": 2173} {"train_loss": -12.212900161743164, "global_step": 365104, "epoch": 2173} {"train_loss": -11.322807312011719, "global_step": 365105, "epoch": 2173} {"train_loss": -12.029109954833984, "global_step": 365106, "epoch": 2173} {"train_loss": -11.905384063720703, "global_step": 365107, "epoch": 2173} {"train_loss": -11.55853271484375, "global_step": 365108, "epoch": 2173} {"train_loss": -12.126212120056152, "global_step": 365109, "epoch": 2173} {"train_loss": -11.26795482635498, "global_step": 365110, "epoch": 2173} {"train_loss": -12.146045684814453, "global_step": 365111, "epoch": 2173} {"train_loss": -11.535261154174805, "global_step": 365112, "epoch": 2173} {"train_loss": -11.001604080200195, "global_step": 365113, "epoch": 2173} {"train_loss": -10.932892799377441, "global_step": 365114, "epoch": 2173} {"train_loss": -10.876230239868164, "global_step": 365115, "epoch": 2173} {"train_loss": -9.686107635498047, "global_step": 365116, "epoch": 2173} {"train_loss": -10.734746932983398, "global_step": 365117, "epoch": 2173} {"train_loss": -9.457348823547363, "global_step": 365118, "epoch": 2173} {"train_loss": -9.734371185302734, "global_step": 365119, "epoch": 2173} {"train_loss": -10.37836742401123, "global_step": 365120, "epoch": 2173} {"train_loss": -10.782119750976562, "global_step": 365121, "epoch": 2173} {"train_loss": -10.334392547607422, "global_step": 365122, "epoch": 2173} {"train_loss": -9.539141654968262, "global_step": 365123, "epoch": 2173} {"train_loss": -9.449971199035645, "global_step": 365124, "epoch": 2173} {"train_loss": -11.307619094848633, "global_step": 365125, "epoch": 2173} {"train_loss": -10.372573852539062, "global_step": 365126, "epoch": 2173} {"train_loss": -11.299354553222656, "global_step": 365127, "epoch": 2173} {"train_loss": -11.31558895111084, "global_step": 365128, "epoch": 2173} {"train_loss": -11.3857421875, "global_step": 365129, "epoch": 2173} {"train_loss": -11.09908676147461, "global_step": 365130, "epoch": 2173} {"train_loss": -11.381916046142578, "global_step": 365131, "epoch": 2173} {"train_loss": -10.74118709564209, "global_step": 365132, "epoch": 2173} {"train_loss": -11.647577285766602, "global_step": 365133, "epoch": 2173} {"train_loss": -11.291828155517578, "global_step": 365134, "epoch": 2173} {"train_loss": -12.088664054870605, "global_step": 365135, "epoch": 2173} {"train_loss": -11.273321151733398, "global_step": 365136, "epoch": 2173} {"train_loss": -11.628135681152344, "global_step": 365137, "epoch": 2173} {"train_loss": -11.756905555725098, "global_step": 365138, "epoch": 2173} {"train_loss": -11.880218505859375, "global_step": 365139, "epoch": 2173} {"train_loss": -11.836079597473145, "global_step": 365140, "epoch": 2173} {"train_loss": -11.9674711227417, "global_step": 365141, "epoch": 2173} {"train_loss": -11.769956588745117, "global_step": 365142, "epoch": 2173} {"train_loss": -11.973930358886719, "global_step": 365143, "epoch": 2173} {"train_loss": -11.736772537231445, "global_step": 365144, "epoch": 2173} {"train_loss": -11.743919372558594, "global_step": 365145, "epoch": 2173} {"train_loss": -11.969270706176758, "global_step": 365146, "epoch": 2173} {"train_loss": -11.827220916748047, "global_step": 365147, "epoch": 2173} {"train_loss": -12.18936824798584, "global_step": 365148, "epoch": 2173} {"train_loss": -12.044410705566406, "global_step": 365149, "epoch": 2173} {"train_loss": -11.954221725463867, "global_step": 365150, "epoch": 2173} {"train_loss": -11.953580856323242, "global_step": 365151, "epoch": 2173} {"train_loss": -12.216987609863281, "global_step": 365152, "epoch": 2173} {"train_loss": -11.902445793151855, "global_step": 365153, "epoch": 2173} {"train_loss": -12.030183792114258, "global_step": 365154, "epoch": 2173} {"train_loss": -12.121484756469727, "global_step": 365155, "epoch": 2173} {"train_loss": -12.072942733764648, "global_step": 365156, "epoch": 2173} {"train_loss": -12.21158218383789, "global_step": 365157, "epoch": 2173} {"train_loss": -12.049558639526367, "global_step": 365158, "epoch": 2173} {"train_loss": -12.221460342407227, "global_step": 365159, "epoch": 2173} {"train_loss": -12.271448135375977, "global_step": 365160, "epoch": 2173} {"train_loss": -12.329329490661621, "global_step": 365161, "epoch": 2173} {"train_loss": -11.951828002929688, "global_step": 365162, "epoch": 2173} {"train_loss": -12.102294921875, "global_step": 365163, "epoch": 2173} {"train_loss": -12.156009674072266, "global_step": 365164, "epoch": 2173} {"train_loss": -12.18043327331543, "global_step": 365165, "epoch": 2173} {"train_loss": -12.375886917114258, "global_step": 365166, "epoch": 2173} {"train_loss": -12.392492294311523, "global_step": 365167, "epoch": 2173} {"train_loss": -12.194378852844238, "global_step": 365168, "epoch": 2173} {"train_loss": -12.330490112304688, "global_step": 365169, "epoch": 2173} {"train_loss": -12.275413513183594, "global_step": 365170, "epoch": 2173} {"train_loss": -12.477249145507812, "global_step": 365171, "epoch": 2173} {"train_loss": -12.392314910888672, "global_step": 365172, "epoch": 2173} {"train_loss": -12.39796257019043, "global_step": 365173, "epoch": 2173} {"train_loss": -12.238832473754883, "global_step": 365174, "epoch": 2173} {"train_loss": -12.467094421386719, "global_step": 365175, "epoch": 2173} {"train_loss": -12.18967342376709, "global_step": 365176, "epoch": 2173} {"train_loss": -12.256725311279297, "global_step": 365177, "epoch": 2173} {"train_loss": -12.2537841796875, "global_step": 365178, "epoch": 2173} {"train_loss": -12.111939430236816, "global_step": 365179, "epoch": 2173} {"train_loss": -12.385255813598633, "global_step": 365180, "epoch": 2173} {"train_loss": -12.248453140258789, "global_step": 365181, "epoch": 2173} {"train_loss": -12.432788848876953, "global_step": 365182, "epoch": 2173} {"train_loss": -12.131333351135254, "global_step": 365183, "epoch": 2173} {"train_loss": -12.337579727172852, "global_step": 365184, "epoch": 2173} {"train_loss": -12.030694961547852, "global_step": 365185, "epoch": 2173} {"train_loss": -12.408547401428223, "global_step": 365186, "epoch": 2173} {"train_loss": -12.217687606811523, "global_step": 365187, "epoch": 2173} {"train_loss": -12.514287948608398, "global_step": 365188, "epoch": 2173} {"train_loss": -12.298139572143555, "global_step": 365189, "epoch": 2173} {"train_loss": -12.427375793457031, "global_step": 365190, "epoch": 2173} {"train_loss": -12.43375015258789, "global_step": 365191, "epoch": 2173} {"train_loss": -12.280649185180664, "global_step": 365192, "epoch": 2173} {"train_loss": -12.325764656066895, "global_step": 365193, "epoch": 2173} {"train_loss": -12.194459915161133, "global_step": 365194, "epoch": 2173} {"train_loss": -12.35110855102539, "global_step": 365195, "epoch": 2173} {"train_loss": -11.51528263092041, "global_step": 365196, "epoch": 2173} {"train_loss": -11.521183013916016, "global_step": 365197, "epoch": 2173} {"train_loss": -12.058828353881836, "global_step": 365198, "epoch": 2173} {"train_loss": -11.869388580322266, "global_step": 365199, "epoch": 2173} {"train_loss": -11.539922714233398, "global_step": 365200, "epoch": 2173} {"train_loss": -12.071982383728027, "global_step": 365201, "epoch": 2173} {"train_loss": -12.132329940795898, "global_step": 365202, "epoch": 2173} {"train_loss": -11.327577590942383, "global_step": 365203, "epoch": 2173} {"train_loss": -11.707000732421875, "global_step": 365204, "epoch": 2173} {"train_loss": -11.77353286743164, "global_step": 365205, "epoch": 2173} {"train_loss": -12.151971817016602, "global_step": 365206, "epoch": 2173} {"train_loss": -11.932077407836914, "global_step": 365207, "epoch": 2173} {"train_loss": -11.660197257995605, "global_step": 365208, "epoch": 2173} {"train_loss": -11.710259437561035, "global_step": 365209, "epoch": 2173} {"train_loss": -11.57225227355957, "global_step": 365210, "epoch": 2173} {"train_loss": -10.103815078735352, "global_step": 365211, "epoch": 2173} {"train_loss": -11.344398498535156, "global_step": 365212, "epoch": 2173} {"train_loss": -9.86715316772461, "global_step": 365213, "epoch": 2173} {"train_loss": -10.75008773803711, "global_step": 365214, "epoch": 2173} {"train_loss": -8.883647918701172, "global_step": 365215, "epoch": 2173} {"train_loss": -11.075638771057129, "global_step": 365216, "epoch": 2173} {"train_loss": -9.741828918457031, "global_step": 365217, "epoch": 2173} {"train_loss": -11.37317180633545, "global_step": 365218, "epoch": 2173} {"train_loss": -9.500419616699219, "global_step": 365219, "epoch": 2173} {"train_loss": -10.02698802947998, "global_step": 365220, "epoch": 2173} {"train_loss": -9.25692367553711, "global_step": 365221, "epoch": 2173} {"train_loss": -10.715399742126465, "global_step": 365222, "epoch": 2173} {"train_loss": -10.09247875213623, "global_step": 365223, "epoch": 2173} {"train_loss": -10.677075386047363, "global_step": 365224, "epoch": 2173} {"train_loss": -9.698573112487793, "global_step": 365225, "epoch": 2173} {"train_loss": -11.412391662597656, "global_step": 365226, "epoch": 2173} {"train_loss": -10.123058319091797, "global_step": 365227, "epoch": 2173} {"train_loss": -11.48159122467041, "global_step": 365228, "epoch": 2173} {"train_loss": -11.009474754333496, "global_step": 365229, "epoch": 2173} {"train_loss": -10.80451488494873, "global_step": 365230, "epoch": 2173} {"train_loss": -11.620747299421401, "global_step": 365231, "epoch": 2173, "val_loss": 286949.40625} {"train_loss": -10.469991683959961, "global_step": 365232, "epoch": 2174} {"train_loss": -11.675117492675781, "global_step": 365233, "epoch": 2174} {"train_loss": -11.085835456848145, "global_step": 365234, "epoch": 2174} {"train_loss": -11.4920654296875, "global_step": 365235, "epoch": 2174} {"train_loss": -11.809484481811523, "global_step": 365236, "epoch": 2174} {"train_loss": -11.35881519317627, "global_step": 365237, "epoch": 2174} {"train_loss": -11.3281888961792, "global_step": 365238, "epoch": 2174} {"train_loss": -11.612375259399414, "global_step": 365239, "epoch": 2174} {"train_loss": -11.14402961730957, "global_step": 365240, "epoch": 2174} {"train_loss": -11.945230484008789, "global_step": 365241, "epoch": 2174} {"train_loss": -11.829744338989258, "global_step": 365242, "epoch": 2174} {"train_loss": -11.914783477783203, "global_step": 365243, "epoch": 2174} {"train_loss": -11.766016006469727, "global_step": 365244, "epoch": 2174} {"train_loss": -11.685437202453613, "global_step": 365245, "epoch": 2174} {"train_loss": -11.801746368408203, "global_step": 365246, "epoch": 2174} {"train_loss": -11.77762222290039, "global_step": 365247, "epoch": 2174} {"train_loss": -11.959033966064453, "global_step": 365248, "epoch": 2174} {"train_loss": -11.91866683959961, "global_step": 365249, "epoch": 2174} {"train_loss": -12.062579154968262, "global_step": 365250, "epoch": 2174} {"train_loss": -11.824845314025879, "global_step": 365251, "epoch": 2174} {"train_loss": -12.079073905944824, "global_step": 365252, "epoch": 2174} {"train_loss": -12.087333679199219, "global_step": 365253, "epoch": 2174} {"train_loss": -12.142114639282227, "global_step": 365254, "epoch": 2174} {"train_loss": -12.206021308898926, "global_step": 365255, "epoch": 2174} {"train_loss": -12.101797103881836, "global_step": 365256, "epoch": 2174} {"train_loss": -12.01213550567627, "global_step": 365257, "epoch": 2174} {"train_loss": -12.259876251220703, "global_step": 365258, "epoch": 2174} {"train_loss": -11.945186614990234, "global_step": 365259, "epoch": 2174} {"train_loss": -12.212084770202637, "global_step": 365260, "epoch": 2174} {"train_loss": -12.184904098510742, "global_step": 365261, "epoch": 2174} {"train_loss": -12.06273078918457, "global_step": 365262, "epoch": 2174} {"train_loss": -12.200674057006836, "global_step": 365263, "epoch": 2174} {"train_loss": -11.811945915222168, "global_step": 365264, "epoch": 2174} {"train_loss": -12.359084129333496, "global_step": 365265, "epoch": 2174} {"train_loss": -12.142097473144531, "global_step": 365266, "epoch": 2174} {"train_loss": -12.269221305847168, "global_step": 365267, "epoch": 2174} {"train_loss": -12.151750564575195, "global_step": 365268, "epoch": 2174} {"train_loss": -12.362651824951172, "global_step": 365269, "epoch": 2174} {"train_loss": -12.166417121887207, "global_step": 365270, "epoch": 2174} {"train_loss": -12.226821899414062, "global_step": 365271, "epoch": 2174} {"train_loss": -12.161426544189453, "global_step": 365272, "epoch": 2174} {"train_loss": -12.022930145263672, "global_step": 365273, "epoch": 2174} {"train_loss": -12.328468322753906, "global_step": 365274, "epoch": 2174} {"train_loss": -12.439715385437012, "global_step": 365275, "epoch": 2174} {"train_loss": -12.179367065429688, "global_step": 365276, "epoch": 2174} {"train_loss": -12.403081893920898, "global_step": 365277, "epoch": 2174} {"train_loss": -12.190126419067383, "global_step": 365278, "epoch": 2174} {"train_loss": -12.578835487365723, "global_step": 365279, "epoch": 2174} {"train_loss": -12.337339401245117, "global_step": 365280, "epoch": 2174} {"train_loss": -12.278581619262695, "global_step": 365281, "epoch": 2174} {"train_loss": -12.100914001464844, "global_step": 365282, "epoch": 2174} {"train_loss": -12.243343353271484, "global_step": 365283, "epoch": 2174} {"train_loss": -12.173940658569336, "global_step": 365284, "epoch": 2174} {"train_loss": -12.14517593383789, "global_step": 365285, "epoch": 2174} {"train_loss": -12.260955810546875, "global_step": 365286, "epoch": 2174} {"train_loss": -12.406064987182617, "global_step": 365287, "epoch": 2174} {"train_loss": -12.296826362609863, "global_step": 365288, "epoch": 2174} {"train_loss": -12.451486587524414, "global_step": 365289, "epoch": 2174} {"train_loss": -12.221747398376465, "global_step": 365290, "epoch": 2174} {"train_loss": -12.657727241516113, "global_step": 365291, "epoch": 2174} {"train_loss": -12.4132661819458, "global_step": 365292, "epoch": 2174} {"train_loss": -12.427085876464844, "global_step": 365293, "epoch": 2174} {"train_loss": -12.455322265625, "global_step": 365294, "epoch": 2174} {"train_loss": -12.441730499267578, "global_step": 365295, "epoch": 2174} {"train_loss": -12.580835342407227, "global_step": 365296, "epoch": 2174} {"train_loss": -12.387626647949219, "global_step": 365297, "epoch": 2174} {"train_loss": -12.468233108520508, "global_step": 365298, "epoch": 2174} {"train_loss": -12.521623611450195, "global_step": 365299, "epoch": 2174} {"train_loss": -12.465995788574219, "global_step": 365300, "epoch": 2174} {"train_loss": -12.51009750366211, "global_step": 365301, "epoch": 2174} {"train_loss": -12.47428035736084, "global_step": 365302, "epoch": 2174} {"train_loss": -12.522074699401855, "global_step": 365303, "epoch": 2174} {"train_loss": -12.626895904541016, "global_step": 365304, "epoch": 2174} {"train_loss": -12.480243682861328, "global_step": 365305, "epoch": 2174} {"train_loss": -12.389852523803711, "global_step": 365306, "epoch": 2174} {"train_loss": -12.457660675048828, "global_step": 365307, "epoch": 2174} {"train_loss": -12.405789375305176, "global_step": 365308, "epoch": 2174} {"train_loss": -12.423192977905273, "global_step": 365309, "epoch": 2174} {"train_loss": -12.557300567626953, "global_step": 365310, "epoch": 2174} {"train_loss": -12.418766975402832, "global_step": 365311, "epoch": 2174} {"train_loss": -12.268199920654297, "global_step": 365312, "epoch": 2174} {"train_loss": -12.656594276428223, "global_step": 365313, "epoch": 2174} {"train_loss": -12.27053165435791, "global_step": 365314, "epoch": 2174} {"train_loss": -12.680869102478027, "global_step": 365315, "epoch": 2174} {"train_loss": -12.669534683227539, "global_step": 365316, "epoch": 2174} {"train_loss": -12.47080135345459, "global_step": 365317, "epoch": 2174} {"train_loss": -12.371939659118652, "global_step": 365318, "epoch": 2174} {"train_loss": -12.636825561523438, "global_step": 365319, "epoch": 2174} {"train_loss": -12.611228942871094, "global_step": 365320, "epoch": 2174} {"train_loss": -12.733139038085938, "global_step": 365321, "epoch": 2174} {"train_loss": -12.701790809631348, "global_step": 365322, "epoch": 2174} {"train_loss": -12.529041290283203, "global_step": 365323, "epoch": 2174} {"train_loss": -12.472602844238281, "global_step": 365324, "epoch": 2174} {"train_loss": -12.676501274108887, "global_step": 365325, "epoch": 2174} {"train_loss": -12.35629940032959, "global_step": 365326, "epoch": 2174} {"train_loss": -12.503838539123535, "global_step": 365327, "epoch": 2174} {"train_loss": -12.665252685546875, "global_step": 365328, "epoch": 2174} {"train_loss": -12.475461959838867, "global_step": 365329, "epoch": 2174} {"train_loss": -12.4774169921875, "global_step": 365330, "epoch": 2174} {"train_loss": -12.58110237121582, "global_step": 365331, "epoch": 2174} {"train_loss": -12.641307830810547, "global_step": 365332, "epoch": 2174} {"train_loss": -12.62004280090332, "global_step": 365333, "epoch": 2174} {"train_loss": -12.303213119506836, "global_step": 365334, "epoch": 2174} {"train_loss": -12.596148490905762, "global_step": 365335, "epoch": 2174} {"train_loss": -12.371384620666504, "global_step": 365336, "epoch": 2174} {"train_loss": -12.31854248046875, "global_step": 365337, "epoch": 2174} {"train_loss": -12.027181625366211, "global_step": 365338, "epoch": 2174} {"train_loss": -12.344449996948242, "global_step": 365339, "epoch": 2174} {"train_loss": -11.808640480041504, "global_step": 365340, "epoch": 2174} {"train_loss": -12.541089057922363, "global_step": 365341, "epoch": 2174} {"train_loss": -12.327522277832031, "global_step": 365342, "epoch": 2174} {"train_loss": -11.2910737991333, "global_step": 365343, "epoch": 2174} {"train_loss": -10.349011421203613, "global_step": 365344, "epoch": 2174} {"train_loss": -10.405145645141602, "global_step": 365345, "epoch": 2174} {"train_loss": -11.329383850097656, "global_step": 365346, "epoch": 2174} {"train_loss": -11.229127883911133, "global_step": 365347, "epoch": 2174} {"train_loss": -12.0740966796875, "global_step": 365348, "epoch": 2174} {"train_loss": -10.954935073852539, "global_step": 365349, "epoch": 2174} {"train_loss": -10.922356605529785, "global_step": 365350, "epoch": 2174} {"train_loss": -11.327154159545898, "global_step": 365351, "epoch": 2174} {"train_loss": -11.728364944458008, "global_step": 365352, "epoch": 2174} {"train_loss": -12.036466598510742, "global_step": 365353, "epoch": 2174} {"train_loss": -12.260615348815918, "global_step": 365354, "epoch": 2174} {"train_loss": -11.9431734085083, "global_step": 365355, "epoch": 2174} {"train_loss": -11.954267501831055, "global_step": 365356, "epoch": 2174} {"train_loss": -12.227288246154785, "global_step": 365357, "epoch": 2174} {"train_loss": -11.99364948272705, "global_step": 365358, "epoch": 2174} {"train_loss": -11.390782356262207, "global_step": 365359, "epoch": 2174} {"train_loss": -12.287948608398438, "global_step": 365360, "epoch": 2174} {"train_loss": -11.85916805267334, "global_step": 365361, "epoch": 2174} {"train_loss": -11.536458015441895, "global_step": 365362, "epoch": 2174} {"train_loss": -11.822053909301758, "global_step": 365363, "epoch": 2174} {"train_loss": -11.60281753540039, "global_step": 365364, "epoch": 2174} {"train_loss": -10.550161361694336, "global_step": 365365, "epoch": 2174} {"train_loss": -11.705695152282715, "global_step": 365366, "epoch": 2174} {"train_loss": -11.971959114074707, "global_step": 365367, "epoch": 2174} {"train_loss": -10.890032768249512, "global_step": 365368, "epoch": 2174} {"train_loss": -11.858536720275879, "global_step": 365369, "epoch": 2174} {"train_loss": -11.76546859741211, "global_step": 365370, "epoch": 2174} {"train_loss": -11.250570297241211, "global_step": 365371, "epoch": 2174} {"train_loss": -12.122196197509766, "global_step": 365372, "epoch": 2174} {"train_loss": -11.94070053100586, "global_step": 365373, "epoch": 2174} {"train_loss": -11.912426948547363, "global_step": 365374, "epoch": 2174} {"train_loss": -12.438151359558105, "global_step": 365375, "epoch": 2174} {"train_loss": -11.9829683303833, "global_step": 365376, "epoch": 2174} {"train_loss": -11.399471282958984, "global_step": 365377, "epoch": 2174} {"train_loss": -12.43997573852539, "global_step": 365378, "epoch": 2174} {"train_loss": -11.318256378173828, "global_step": 365379, "epoch": 2174} {"train_loss": -11.18990707397461, "global_step": 365380, "epoch": 2174} {"train_loss": -11.958846092224121, "global_step": 365381, "epoch": 2174} {"train_loss": -12.167427062988281, "global_step": 365382, "epoch": 2174} {"train_loss": -10.971933364868164, "global_step": 365383, "epoch": 2174} {"train_loss": -11.772481918334961, "global_step": 365384, "epoch": 2174} {"train_loss": -11.92056941986084, "global_step": 365385, "epoch": 2174} {"train_loss": -10.868316650390625, "global_step": 365386, "epoch": 2174} {"train_loss": -11.563947677612305, "global_step": 365387, "epoch": 2174} {"train_loss": -11.205246925354004, "global_step": 365388, "epoch": 2174} {"train_loss": -10.632923126220703, "global_step": 365389, "epoch": 2174} {"train_loss": -12.236717224121094, "global_step": 365390, "epoch": 2174} {"train_loss": -9.861413955688477, "global_step": 365391, "epoch": 2174} {"train_loss": -12.364871978759766, "global_step": 365392, "epoch": 2174} {"train_loss": -10.089478492736816, "global_step": 365393, "epoch": 2174} {"train_loss": -11.020549774169922, "global_step": 365394, "epoch": 2174} {"train_loss": -11.110811233520508, "global_step": 365395, "epoch": 2174} {"train_loss": -11.087236404418945, "global_step": 365396, "epoch": 2174} {"train_loss": -11.519015312194824, "global_step": 365397, "epoch": 2174} {"train_loss": -10.018453598022461, "global_step": 365398, "epoch": 2174} {"train_loss": -11.973665288516454, "global_step": 365399, "epoch": 2174, "val_loss": 290046.53125} {"train_loss": -11.196162223815918, "global_step": 365400, "epoch": 2175} {"train_loss": -11.707822799682617, "global_step": 365401, "epoch": 2175} {"train_loss": -11.076800346374512, "global_step": 365402, "epoch": 2175} {"train_loss": -12.162216186523438, "global_step": 365403, "epoch": 2175} {"train_loss": -11.472837448120117, "global_step": 365404, "epoch": 2175} {"train_loss": -12.237695693969727, "global_step": 365405, "epoch": 2175} {"train_loss": -11.602128982543945, "global_step": 365406, "epoch": 2175} {"train_loss": -11.202841758728027, "global_step": 365407, "epoch": 2175} {"train_loss": -12.046831130981445, "global_step": 365408, "epoch": 2175} {"train_loss": -11.122323989868164, "global_step": 365409, "epoch": 2175} {"train_loss": -12.17724895477295, "global_step": 365410, "epoch": 2175} {"train_loss": -11.505290031433105, "global_step": 365411, "epoch": 2175} {"train_loss": -12.10964584350586, "global_step": 365412, "epoch": 2175} {"train_loss": -11.619317054748535, "global_step": 365413, "epoch": 2175} {"train_loss": -11.85871696472168, "global_step": 365414, "epoch": 2175} {"train_loss": -11.935722351074219, "global_step": 365415, "epoch": 2175} {"train_loss": -11.341409683227539, "global_step": 365416, "epoch": 2175} {"train_loss": -11.766075134277344, "global_step": 365417, "epoch": 2175} {"train_loss": -11.798673629760742, "global_step": 365418, "epoch": 2175} {"train_loss": -12.261468887329102, "global_step": 365419, "epoch": 2175} {"train_loss": -12.159637451171875, "global_step": 365420, "epoch": 2175} {"train_loss": -11.89893913269043, "global_step": 365421, "epoch": 2175} {"train_loss": -12.015913963317871, "global_step": 365422, "epoch": 2175} {"train_loss": -12.26760482788086, "global_step": 365423, "epoch": 2175} {"train_loss": -11.87389850616455, "global_step": 365424, "epoch": 2175} {"train_loss": -11.99865436553955, "global_step": 365425, "epoch": 2175} {"train_loss": -11.779193878173828, "global_step": 365426, "epoch": 2175} {"train_loss": -11.998762130737305, "global_step": 365427, "epoch": 2175} {"train_loss": -11.668449401855469, "global_step": 365428, "epoch": 2175} {"train_loss": -11.98623275756836, "global_step": 365429, "epoch": 2175} {"train_loss": -12.066507339477539, "global_step": 365430, "epoch": 2175} {"train_loss": -12.482049942016602, "global_step": 365431, "epoch": 2175} {"train_loss": -11.87450885772705, "global_step": 365432, "epoch": 2175} {"train_loss": -12.34430980682373, "global_step": 365433, "epoch": 2175} {"train_loss": -11.986587524414062, "global_step": 365434, "epoch": 2175} {"train_loss": -12.175482749938965, "global_step": 365435, "epoch": 2175} {"train_loss": -12.343466758728027, "global_step": 365436, "epoch": 2175} {"train_loss": -11.89024543762207, "global_step": 365437, "epoch": 2175} {"train_loss": -12.278148651123047, "global_step": 365438, "epoch": 2175} {"train_loss": -12.017624855041504, "global_step": 365439, "epoch": 2175} {"train_loss": -12.247968673706055, "global_step": 365440, "epoch": 2175} {"train_loss": -12.057973861694336, "global_step": 365441, "epoch": 2175} {"train_loss": -11.95440673828125, "global_step": 365442, "epoch": 2175} {"train_loss": -12.29633617401123, "global_step": 365443, "epoch": 2175} {"train_loss": -12.203614234924316, "global_step": 365444, "epoch": 2175} {"train_loss": -12.641290664672852, "global_step": 365445, "epoch": 2175} {"train_loss": -12.139673233032227, "global_step": 365446, "epoch": 2175} {"train_loss": -12.589115142822266, "global_step": 365447, "epoch": 2175} {"train_loss": -12.490839004516602, "global_step": 365448, "epoch": 2175} {"train_loss": -12.390949249267578, "global_step": 365449, "epoch": 2175} {"train_loss": -12.072998046875, "global_step": 365450, "epoch": 2175} {"train_loss": -12.157776832580566, "global_step": 365451, "epoch": 2175} {"train_loss": -12.410858154296875, "global_step": 365452, "epoch": 2175} {"train_loss": -12.102758407592773, "global_step": 365453, "epoch": 2175} {"train_loss": -12.369644165039062, "global_step": 365454, "epoch": 2175} {"train_loss": -12.360701560974121, "global_step": 365455, "epoch": 2175} {"train_loss": -12.096713066101074, "global_step": 365456, "epoch": 2175} {"train_loss": -12.546269416809082, "global_step": 365457, "epoch": 2175} {"train_loss": -12.149667739868164, "global_step": 365458, "epoch": 2175} {"train_loss": -12.224063873291016, "global_step": 365459, "epoch": 2175} {"train_loss": -12.24370002746582, "global_step": 365460, "epoch": 2175} {"train_loss": -12.174877166748047, "global_step": 365461, "epoch": 2175} {"train_loss": -11.926552772521973, "global_step": 365462, "epoch": 2175} {"train_loss": -12.255491256713867, "global_step": 365463, "epoch": 2175} {"train_loss": -12.317049026489258, "global_step": 365464, "epoch": 2175} {"train_loss": -12.353782653808594, "global_step": 365465, "epoch": 2175} {"train_loss": -12.220659255981445, "global_step": 365466, "epoch": 2175} {"train_loss": -12.361577987670898, "global_step": 365467, "epoch": 2175} {"train_loss": -12.445120811462402, "global_step": 365468, "epoch": 2175} {"train_loss": -12.44502067565918, "global_step": 365469, "epoch": 2175} {"train_loss": -12.41187858581543, "global_step": 365470, "epoch": 2175} {"train_loss": -12.354830741882324, "global_step": 365471, "epoch": 2175} {"train_loss": -12.533381462097168, "global_step": 365472, "epoch": 2175} {"train_loss": -12.35922908782959, "global_step": 365473, "epoch": 2175} {"train_loss": -12.392273902893066, "global_step": 365474, "epoch": 2175} {"train_loss": -12.270158767700195, "global_step": 365475, "epoch": 2175} {"train_loss": -12.208805084228516, "global_step": 365476, "epoch": 2175} {"train_loss": -12.520668029785156, "global_step": 365477, "epoch": 2175} {"train_loss": -12.427841186523438, "global_step": 365478, "epoch": 2175} {"train_loss": -12.537040710449219, "global_step": 365479, "epoch": 2175} {"train_loss": -12.354301452636719, "global_step": 365480, "epoch": 2175} {"train_loss": -12.453163146972656, "global_step": 365481, "epoch": 2175} {"train_loss": -12.586674690246582, "global_step": 365482, "epoch": 2175} {"train_loss": -12.438484191894531, "global_step": 365483, "epoch": 2175} {"train_loss": -12.569364547729492, "global_step": 365484, "epoch": 2175} {"train_loss": -12.543367385864258, "global_step": 365485, "epoch": 2175} {"train_loss": -12.535456657409668, "global_step": 365486, "epoch": 2175} {"train_loss": -12.4436674118042, "global_step": 365487, "epoch": 2175} {"train_loss": -12.535181045532227, "global_step": 365488, "epoch": 2175} {"train_loss": -12.520059585571289, "global_step": 365489, "epoch": 2175} {"train_loss": -12.587078094482422, "global_step": 365490, "epoch": 2175} {"train_loss": -12.501765251159668, "global_step": 365491, "epoch": 2175} {"train_loss": -12.69354248046875, "global_step": 365492, "epoch": 2175} {"train_loss": -12.616128921508789, "global_step": 365493, "epoch": 2175} {"train_loss": -12.326457977294922, "global_step": 365494, "epoch": 2175} {"train_loss": -12.5490083694458, "global_step": 365495, "epoch": 2175} {"train_loss": -12.469294548034668, "global_step": 365496, "epoch": 2175} {"train_loss": -12.133235931396484, "global_step": 365497, "epoch": 2175} {"train_loss": -12.307001113891602, "global_step": 365498, "epoch": 2175} {"train_loss": -12.51288890838623, "global_step": 365499, "epoch": 2175} {"train_loss": -12.451712608337402, "global_step": 365500, "epoch": 2175} {"train_loss": -12.357690811157227, "global_step": 365501, "epoch": 2175} {"train_loss": -12.0882568359375, "global_step": 365502, "epoch": 2175} {"train_loss": -12.421374320983887, "global_step": 365503, "epoch": 2175} {"train_loss": -11.961216926574707, "global_step": 365504, "epoch": 2175} {"train_loss": -10.681949615478516, "global_step": 365505, "epoch": 2175} {"train_loss": -10.957651138305664, "global_step": 365506, "epoch": 2175} {"train_loss": -12.166621208190918, "global_step": 365507, "epoch": 2175} {"train_loss": -11.273666381835938, "global_step": 365508, "epoch": 2175} {"train_loss": -10.75628662109375, "global_step": 365509, "epoch": 2175} {"train_loss": -11.586356163024902, "global_step": 365510, "epoch": 2175} {"train_loss": -11.48841667175293, "global_step": 365511, "epoch": 2175} {"train_loss": -11.335078239440918, "global_step": 365512, "epoch": 2175} {"train_loss": -11.738980293273926, "global_step": 365513, "epoch": 2175} {"train_loss": -11.80589771270752, "global_step": 365514, "epoch": 2175} {"train_loss": -11.049201011657715, "global_step": 365515, "epoch": 2175} {"train_loss": -11.495450973510742, "global_step": 365516, "epoch": 2175} {"train_loss": -11.405864715576172, "global_step": 365517, "epoch": 2175} {"train_loss": -11.856142044067383, "global_step": 365518, "epoch": 2175} {"train_loss": -10.526275634765625, "global_step": 365519, "epoch": 2175} {"train_loss": -11.408735275268555, "global_step": 365520, "epoch": 2175} {"train_loss": -11.699016571044922, "global_step": 365521, "epoch": 2175} {"train_loss": -11.733802795410156, "global_step": 365522, "epoch": 2175} {"train_loss": -11.485861778259277, "global_step": 365523, "epoch": 2175} {"train_loss": -11.726603507995605, "global_step": 365524, "epoch": 2175} {"train_loss": -12.146160125732422, "global_step": 365525, "epoch": 2175} {"train_loss": -11.385574340820312, "global_step": 365526, "epoch": 2175} {"train_loss": -12.455078125, "global_step": 365527, "epoch": 2175} {"train_loss": -11.874191284179688, "global_step": 365528, "epoch": 2175} {"train_loss": -12.219535827636719, "global_step": 365529, "epoch": 2175} {"train_loss": -11.915424346923828, "global_step": 365530, "epoch": 2175} {"train_loss": -12.433841705322266, "global_step": 365531, "epoch": 2175} {"train_loss": -11.966567993164062, "global_step": 365532, "epoch": 2175} {"train_loss": -12.13592529296875, "global_step": 365533, "epoch": 2175} {"train_loss": -11.981908798217773, "global_step": 365534, "epoch": 2175} {"train_loss": -11.964714050292969, "global_step": 365535, "epoch": 2175} {"train_loss": -12.447309494018555, "global_step": 365536, "epoch": 2175} {"train_loss": -12.14553451538086, "global_step": 365537, "epoch": 2175} {"train_loss": -11.571576118469238, "global_step": 365538, "epoch": 2175} {"train_loss": -12.395304679870605, "global_step": 365539, "epoch": 2175} {"train_loss": -11.957523345947266, "global_step": 365540, "epoch": 2175} {"train_loss": -12.331125259399414, "global_step": 365541, "epoch": 2175} {"train_loss": -12.008710861206055, "global_step": 365542, "epoch": 2175} {"train_loss": -11.37775707244873, "global_step": 365543, "epoch": 2175} {"train_loss": -12.481998443603516, "global_step": 365544, "epoch": 2175} {"train_loss": -11.655502319335938, "global_step": 365545, "epoch": 2175} {"train_loss": -12.253612518310547, "global_step": 365546, "epoch": 2175} {"train_loss": -11.920852661132812, "global_step": 365547, "epoch": 2175} {"train_loss": -12.01943302154541, "global_step": 365548, "epoch": 2175} {"train_loss": -12.407756805419922, "global_step": 365549, "epoch": 2175} {"train_loss": -11.97257137298584, "global_step": 365550, "epoch": 2175} {"train_loss": -12.342069625854492, "global_step": 365551, "epoch": 2175} {"train_loss": -12.34201431274414, "global_step": 365552, "epoch": 2175} {"train_loss": -12.348651885986328, "global_step": 365553, "epoch": 2175} {"train_loss": -12.258240699768066, "global_step": 365554, "epoch": 2175} {"train_loss": -12.089132308959961, "global_step": 365555, "epoch": 2175} {"train_loss": -12.563159942626953, "global_step": 365556, "epoch": 2175} {"train_loss": -12.423856735229492, "global_step": 365557, "epoch": 2175} {"train_loss": -12.406291961669922, "global_step": 365558, "epoch": 2175} {"train_loss": -12.415534019470215, "global_step": 365559, "epoch": 2175} {"train_loss": -12.214608192443848, "global_step": 365560, "epoch": 2175} {"train_loss": -12.12155818939209, "global_step": 365561, "epoch": 2175} {"train_loss": -12.702274322509766, "global_step": 365562, "epoch": 2175} {"train_loss": -12.245256423950195, "global_step": 365563, "epoch": 2175} {"train_loss": -12.521465301513672, "global_step": 365564, "epoch": 2175} {"train_loss": -12.182907104492188, "global_step": 365565, "epoch": 2175} {"train_loss": -12.363410949707031, "global_step": 365566, "epoch": 2175} {"train_loss": -12.083497524261475, "global_step": 365567, "epoch": 2175, "val_loss": 292605.6875, "train_action_mse_error": 1.305778980255127} {"train_loss": -11.895904541015625, "global_step": 365568, "epoch": 2176} {"train_loss": -11.767890930175781, "global_step": 365569, "epoch": 2176} {"train_loss": -12.138639450073242, "global_step": 365570, "epoch": 2176} {"train_loss": -11.933649063110352, "global_step": 365571, "epoch": 2176} {"train_loss": -11.55235481262207, "global_step": 365572, "epoch": 2176} {"train_loss": -12.473031044006348, "global_step": 365573, "epoch": 2176} {"train_loss": -11.601024627685547, "global_step": 365574, "epoch": 2176} {"train_loss": -11.844034194946289, "global_step": 365575, "epoch": 2176} {"train_loss": -12.247068405151367, "global_step": 365576, "epoch": 2176} {"train_loss": -12.243159294128418, "global_step": 365577, "epoch": 2176} {"train_loss": -12.608695983886719, "global_step": 365578, "epoch": 2176} {"train_loss": -11.92926025390625, "global_step": 365579, "epoch": 2176} {"train_loss": -11.912498474121094, "global_step": 365580, "epoch": 2176} {"train_loss": -12.462018013000488, "global_step": 365581, "epoch": 2176} {"train_loss": -12.179557800292969, "global_step": 365582, "epoch": 2176} {"train_loss": -12.32374095916748, "global_step": 365583, "epoch": 2176} {"train_loss": -12.225342750549316, "global_step": 365584, "epoch": 2176} {"train_loss": -12.442341804504395, "global_step": 365585, "epoch": 2176} {"train_loss": -12.037910461425781, "global_step": 365586, "epoch": 2176} {"train_loss": -12.03431510925293, "global_step": 365587, "epoch": 2176} {"train_loss": -11.774112701416016, "global_step": 365588, "epoch": 2176} {"train_loss": -12.110618591308594, "global_step": 365589, "epoch": 2176} {"train_loss": -11.117176055908203, "global_step": 365590, "epoch": 2176} {"train_loss": -12.359543800354004, "global_step": 365591, "epoch": 2176} {"train_loss": -11.241455078125, "global_step": 365592, "epoch": 2176} {"train_loss": -12.138087272644043, "global_step": 365593, "epoch": 2176} {"train_loss": -12.132678985595703, "global_step": 365594, "epoch": 2176} {"train_loss": -11.546159744262695, "global_step": 365595, "epoch": 2176} {"train_loss": -12.291646957397461, "global_step": 365596, "epoch": 2176} {"train_loss": -11.521769523620605, "global_step": 365597, "epoch": 2176} {"train_loss": -12.003599166870117, "global_step": 365598, "epoch": 2176} {"train_loss": -11.88752269744873, "global_step": 365599, "epoch": 2176} {"train_loss": -11.967000961303711, "global_step": 365600, "epoch": 2176} {"train_loss": -11.933968544006348, "global_step": 365601, "epoch": 2176} {"train_loss": -12.107732772827148, "global_step": 365602, "epoch": 2176} {"train_loss": -11.9989013671875, "global_step": 365603, "epoch": 2176} {"train_loss": -12.341560363769531, "global_step": 365604, "epoch": 2176} {"train_loss": -12.028083801269531, "global_step": 365605, "epoch": 2176} {"train_loss": -12.137229919433594, "global_step": 365606, "epoch": 2176} {"train_loss": -12.471450805664062, "global_step": 365607, "epoch": 2176} {"train_loss": -11.8502836227417, "global_step": 365608, "epoch": 2176} {"train_loss": -12.186107635498047, "global_step": 365609, "epoch": 2176} {"train_loss": -11.861469268798828, "global_step": 365610, "epoch": 2176} {"train_loss": -11.864017486572266, "global_step": 365611, "epoch": 2176} {"train_loss": -12.508035659790039, "global_step": 365612, "epoch": 2176} {"train_loss": -12.20889663696289, "global_step": 365613, "epoch": 2176} {"train_loss": -12.403215408325195, "global_step": 365614, "epoch": 2176} {"train_loss": -12.128661155700684, "global_step": 365615, "epoch": 2176} {"train_loss": -12.280745506286621, "global_step": 365616, "epoch": 2176} {"train_loss": -11.706459045410156, "global_step": 365617, "epoch": 2176} {"train_loss": -11.820301055908203, "global_step": 365618, "epoch": 2176} {"train_loss": -12.31458854675293, "global_step": 365619, "epoch": 2176} {"train_loss": -11.450705528259277, "global_step": 365620, "epoch": 2176} {"train_loss": -12.188577651977539, "global_step": 365621, "epoch": 2176} {"train_loss": -12.101031303405762, "global_step": 365622, "epoch": 2176} {"train_loss": -12.164548873901367, "global_step": 365623, "epoch": 2176} {"train_loss": -11.60669994354248, "global_step": 365624, "epoch": 2176} {"train_loss": -11.840420722961426, "global_step": 365625, "epoch": 2176} {"train_loss": -11.734573364257812, "global_step": 365626, "epoch": 2176} {"train_loss": -12.226767539978027, "global_step": 365627, "epoch": 2176} {"train_loss": -11.701786994934082, "global_step": 365628, "epoch": 2176} {"train_loss": -11.692596435546875, "global_step": 365629, "epoch": 2176} {"train_loss": -11.609171867370605, "global_step": 365630, "epoch": 2176} {"train_loss": -12.179794311523438, "global_step": 365631, "epoch": 2176} {"train_loss": -11.526741027832031, "global_step": 365632, "epoch": 2176} {"train_loss": -11.989274978637695, "global_step": 365633, "epoch": 2176} {"train_loss": -11.859289169311523, "global_step": 365634, "epoch": 2176} {"train_loss": -11.893339157104492, "global_step": 365635, "epoch": 2176} {"train_loss": -11.500818252563477, "global_step": 365636, "epoch": 2176} {"train_loss": -12.464402198791504, "global_step": 365637, "epoch": 2176} {"train_loss": -12.083317756652832, "global_step": 365638, "epoch": 2176} {"train_loss": -11.568574905395508, "global_step": 365639, "epoch": 2176} {"train_loss": -12.237263679504395, "global_step": 365640, "epoch": 2176} {"train_loss": -11.953317642211914, "global_step": 365641, "epoch": 2176} {"train_loss": -12.190196990966797, "global_step": 365642, "epoch": 2176} {"train_loss": -12.342473030090332, "global_step": 365643, "epoch": 2176} {"train_loss": -11.90647029876709, "global_step": 365644, "epoch": 2176} {"train_loss": -12.08031940460205, "global_step": 365645, "epoch": 2176} {"train_loss": -12.212135314941406, "global_step": 365646, "epoch": 2176} {"train_loss": -12.25277042388916, "global_step": 365647, "epoch": 2176} {"train_loss": -11.960888862609863, "global_step": 365648, "epoch": 2176} {"train_loss": -12.288949012756348, "global_step": 365649, "epoch": 2176} {"train_loss": -11.671674728393555, "global_step": 365650, "epoch": 2176} {"train_loss": -12.224613189697266, "global_step": 365651, "epoch": 2176} {"train_loss": -11.95335578918457, "global_step": 365652, "epoch": 2176} {"train_loss": -11.533397674560547, "global_step": 365653, "epoch": 2176} {"train_loss": -12.120288848876953, "global_step": 365654, "epoch": 2176} {"train_loss": -12.267560958862305, "global_step": 365655, "epoch": 2176} {"train_loss": -11.928964614868164, "global_step": 365656, "epoch": 2176} {"train_loss": -12.361743927001953, "global_step": 365657, "epoch": 2176} {"train_loss": -12.187273025512695, "global_step": 365658, "epoch": 2176} {"train_loss": -11.687281608581543, "global_step": 365659, "epoch": 2176} {"train_loss": -11.779145240783691, "global_step": 365660, "epoch": 2176} {"train_loss": -12.031049728393555, "global_step": 365661, "epoch": 2176} {"train_loss": -11.447275161743164, "global_step": 365662, "epoch": 2176} {"train_loss": -12.215272903442383, "global_step": 365663, "epoch": 2176} {"train_loss": -11.921806335449219, "global_step": 365664, "epoch": 2176} {"train_loss": -11.6841402053833, "global_step": 365665, "epoch": 2176} {"train_loss": -12.066022872924805, "global_step": 365666, "epoch": 2176} {"train_loss": -12.149112701416016, "global_step": 365667, "epoch": 2176} {"train_loss": -11.545591354370117, "global_step": 365668, "epoch": 2176} {"train_loss": -12.346929550170898, "global_step": 365669, "epoch": 2176} {"train_loss": -11.983675003051758, "global_step": 365670, "epoch": 2176} {"train_loss": -12.19986343383789, "global_step": 365671, "epoch": 2176} {"train_loss": -12.166519165039062, "global_step": 365672, "epoch": 2176} {"train_loss": -12.607717514038086, "global_step": 365673, "epoch": 2176} {"train_loss": -12.37147045135498, "global_step": 365674, "epoch": 2176} {"train_loss": -12.364152908325195, "global_step": 365675, "epoch": 2176} {"train_loss": -12.516212463378906, "global_step": 365676, "epoch": 2176} {"train_loss": -12.62490463256836, "global_step": 365677, "epoch": 2176} {"train_loss": -12.318466186523438, "global_step": 365678, "epoch": 2176} {"train_loss": -12.162724494934082, "global_step": 365679, "epoch": 2176} {"train_loss": -12.391263961791992, "global_step": 365680, "epoch": 2176} {"train_loss": -12.156846046447754, "global_step": 365681, "epoch": 2176} {"train_loss": -12.093433380126953, "global_step": 365682, "epoch": 2176} {"train_loss": -12.519442558288574, "global_step": 365683, "epoch": 2176} {"train_loss": -12.001842498779297, "global_step": 365684, "epoch": 2176} {"train_loss": -12.26602554321289, "global_step": 365685, "epoch": 2176} {"train_loss": -12.323161125183105, "global_step": 365686, "epoch": 2176} {"train_loss": -12.23050308227539, "global_step": 365687, "epoch": 2176} {"train_loss": -12.179317474365234, "global_step": 365688, "epoch": 2176} {"train_loss": -12.375051498413086, "global_step": 365689, "epoch": 2176} {"train_loss": -12.161029815673828, "global_step": 365690, "epoch": 2176} {"train_loss": -12.141311645507812, "global_step": 365691, "epoch": 2176} {"train_loss": -12.45513916015625, "global_step": 365692, "epoch": 2176} {"train_loss": -12.061036109924316, "global_step": 365693, "epoch": 2176} {"train_loss": -12.088546752929688, "global_step": 365694, "epoch": 2176} {"train_loss": -12.580018997192383, "global_step": 365695, "epoch": 2176} {"train_loss": -12.362129211425781, "global_step": 365696, "epoch": 2176} {"train_loss": -12.40089225769043, "global_step": 365697, "epoch": 2176} {"train_loss": -12.484180450439453, "global_step": 365698, "epoch": 2176} {"train_loss": -12.44996452331543, "global_step": 365699, "epoch": 2176} {"train_loss": -11.810842514038086, "global_step": 365700, "epoch": 2176} {"train_loss": -11.795675277709961, "global_step": 365701, "epoch": 2176} {"train_loss": -11.849455833435059, "global_step": 365702, "epoch": 2176} {"train_loss": -11.515447616577148, "global_step": 365703, "epoch": 2176} {"train_loss": -10.885567665100098, "global_step": 365704, "epoch": 2176} {"train_loss": -12.079927444458008, "global_step": 365705, "epoch": 2176} {"train_loss": -10.088111877441406, "global_step": 365706, "epoch": 2176} {"train_loss": -10.81904411315918, "global_step": 365707, "epoch": 2176} {"train_loss": -11.684822082519531, "global_step": 365708, "epoch": 2176} {"train_loss": -10.453908920288086, "global_step": 365709, "epoch": 2176} {"train_loss": -11.032516479492188, "global_step": 365710, "epoch": 2176} {"train_loss": -10.685450553894043, "global_step": 365711, "epoch": 2176} {"train_loss": -9.62443733215332, "global_step": 365712, "epoch": 2176} {"train_loss": -8.06624698638916, "global_step": 365713, "epoch": 2176} {"train_loss": -8.345087051391602, "global_step": 365714, "epoch": 2176} {"train_loss": -9.530682563781738, "global_step": 365715, "epoch": 2176} {"train_loss": -11.081683158874512, "global_step": 365716, "epoch": 2176} {"train_loss": -9.220535278320312, "global_step": 365717, "epoch": 2176} {"train_loss": -9.517864227294922, "global_step": 365718, "epoch": 2176} {"train_loss": -10.443920135498047, "global_step": 365719, "epoch": 2176} {"train_loss": -10.265835762023926, "global_step": 365720, "epoch": 2176} {"train_loss": -10.088781356811523, "global_step": 365721, "epoch": 2176} {"train_loss": -10.405186653137207, "global_step": 365722, "epoch": 2176} {"train_loss": -11.562952041625977, "global_step": 365723, "epoch": 2176} {"train_loss": -11.020291328430176, "global_step": 365724, "epoch": 2176} {"train_loss": -11.655497550964355, "global_step": 365725, "epoch": 2176} {"train_loss": -11.652091979980469, "global_step": 365726, "epoch": 2176} {"train_loss": -11.448009490966797, "global_step": 365727, "epoch": 2176} {"train_loss": -11.376794815063477, "global_step": 365728, "epoch": 2176} {"train_loss": -11.478926658630371, "global_step": 365729, "epoch": 2176} {"train_loss": -11.959742546081543, "global_step": 365730, "epoch": 2176} {"train_loss": -11.53897476196289, "global_step": 365731, "epoch": 2176} {"train_loss": -11.873916625976562, "global_step": 365732, "epoch": 2176} {"train_loss": -11.61091423034668, "global_step": 365733, "epoch": 2176} {"train_loss": -11.43797779083252, "global_step": 365734, "epoch": 2176} {"train_loss": -11.811333554131645, "global_step": 365735, "epoch": 2176, "val_loss": 287813.8125} {"train_loss": -11.027027130126953, "global_step": 365736, "epoch": 2177} {"train_loss": -11.592036247253418, "global_step": 365737, "epoch": 2177} {"train_loss": -11.141973495483398, "global_step": 365738, "epoch": 2177} {"train_loss": -11.975439071655273, "global_step": 365739, "epoch": 2177} {"train_loss": -11.579434394836426, "global_step": 365740, "epoch": 2177} {"train_loss": -12.058507919311523, "global_step": 365741, "epoch": 2177} {"train_loss": -11.57210922241211, "global_step": 365742, "epoch": 2177} {"train_loss": -11.9773530960083, "global_step": 365743, "epoch": 2177} {"train_loss": -10.671333312988281, "global_step": 365744, "epoch": 2177} {"train_loss": -12.078369140625, "global_step": 365745, "epoch": 2177} {"train_loss": -10.818933486938477, "global_step": 365746, "epoch": 2177} {"train_loss": -11.986934661865234, "global_step": 365747, "epoch": 2177} {"train_loss": -11.634902954101562, "global_step": 365748, "epoch": 2177} {"train_loss": -11.57916259765625, "global_step": 365749, "epoch": 2177} {"train_loss": -12.085565567016602, "global_step": 365750, "epoch": 2177} {"train_loss": -11.825675964355469, "global_step": 365751, "epoch": 2177} {"train_loss": -12.107956886291504, "global_step": 365752, "epoch": 2177} {"train_loss": -11.987241744995117, "global_step": 365753, "epoch": 2177} {"train_loss": -12.066729545593262, "global_step": 365754, "epoch": 2177} {"train_loss": -12.147311210632324, "global_step": 365755, "epoch": 2177} {"train_loss": -12.077134132385254, "global_step": 365756, "epoch": 2177} {"train_loss": -11.815187454223633, "global_step": 365757, "epoch": 2177} {"train_loss": -12.228212356567383, "global_step": 365758, "epoch": 2177} {"train_loss": -12.008462905883789, "global_step": 365759, "epoch": 2177} {"train_loss": -12.341867446899414, "global_step": 365760, "epoch": 2177} {"train_loss": -11.896909713745117, "global_step": 365761, "epoch": 2177} {"train_loss": -12.149147033691406, "global_step": 365762, "epoch": 2177} {"train_loss": -12.169897079467773, "global_step": 365763, "epoch": 2177} {"train_loss": -12.105698585510254, "global_step": 365764, "epoch": 2177} {"train_loss": -12.256125450134277, "global_step": 365765, "epoch": 2177} {"train_loss": -12.187058448791504, "global_step": 365766, "epoch": 2177} {"train_loss": -12.338150024414062, "global_step": 365767, "epoch": 2177} {"train_loss": -12.087754249572754, "global_step": 365768, "epoch": 2177} {"train_loss": -12.293191909790039, "global_step": 365769, "epoch": 2177} {"train_loss": -12.07427978515625, "global_step": 365770, "epoch": 2177} {"train_loss": -12.240140914916992, "global_step": 365771, "epoch": 2177} {"train_loss": -12.244009017944336, "global_step": 365772, "epoch": 2177} {"train_loss": -12.324687957763672, "global_step": 365773, "epoch": 2177} {"train_loss": -12.364639282226562, "global_step": 365774, "epoch": 2177} {"train_loss": -12.291753768920898, "global_step": 365775, "epoch": 2177} {"train_loss": -12.356935501098633, "global_step": 365776, "epoch": 2177} {"train_loss": -12.323042869567871, "global_step": 365777, "epoch": 2177} {"train_loss": -12.270585060119629, "global_step": 365778, "epoch": 2177} {"train_loss": -12.44898796081543, "global_step": 365779, "epoch": 2177} {"train_loss": -12.353912353515625, "global_step": 365780, "epoch": 2177} {"train_loss": -12.477746963500977, "global_step": 365781, "epoch": 2177} {"train_loss": -12.23466682434082, "global_step": 365782, "epoch": 2177} {"train_loss": -12.516170501708984, "global_step": 365783, "epoch": 2177} {"train_loss": -12.30978775024414, "global_step": 365784, "epoch": 2177} {"train_loss": -12.442729949951172, "global_step": 365785, "epoch": 2177} {"train_loss": -12.624309539794922, "global_step": 365786, "epoch": 2177} {"train_loss": -12.26938247680664, "global_step": 365787, "epoch": 2177} {"train_loss": -12.404733657836914, "global_step": 365788, "epoch": 2177} {"train_loss": -12.53683853149414, "global_step": 365789, "epoch": 2177} {"train_loss": -12.51347541809082, "global_step": 365790, "epoch": 2177} {"train_loss": -12.296792984008789, "global_step": 365791, "epoch": 2177} {"train_loss": -12.504459381103516, "global_step": 365792, "epoch": 2177} {"train_loss": -12.389188766479492, "global_step": 365793, "epoch": 2177} {"train_loss": -12.54061508178711, "global_step": 365794, "epoch": 2177} {"train_loss": -12.618066787719727, "global_step": 365795, "epoch": 2177} {"train_loss": -12.488887786865234, "global_step": 365796, "epoch": 2177} {"train_loss": -12.482709884643555, "global_step": 365797, "epoch": 2177} {"train_loss": -12.249149322509766, "global_step": 365798, "epoch": 2177} {"train_loss": -12.439898490905762, "global_step": 365799, "epoch": 2177} {"train_loss": -12.076757431030273, "global_step": 365800, "epoch": 2177} {"train_loss": -12.55239486694336, "global_step": 365801, "epoch": 2177} {"train_loss": -12.441246032714844, "global_step": 365802, "epoch": 2177} {"train_loss": -12.066696166992188, "global_step": 365803, "epoch": 2177} {"train_loss": -12.056166648864746, "global_step": 365804, "epoch": 2177} {"train_loss": -12.366033554077148, "global_step": 365805, "epoch": 2177} {"train_loss": -11.976978302001953, "global_step": 365806, "epoch": 2177} {"train_loss": -11.674771308898926, "global_step": 365807, "epoch": 2177} {"train_loss": -12.28899097442627, "global_step": 365808, "epoch": 2177} {"train_loss": -12.108589172363281, "global_step": 365809, "epoch": 2177} {"train_loss": -12.148845672607422, "global_step": 365810, "epoch": 2177} {"train_loss": -12.436182022094727, "global_step": 365811, "epoch": 2177} {"train_loss": -12.409454345703125, "global_step": 365812, "epoch": 2177} {"train_loss": -11.968755722045898, "global_step": 365813, "epoch": 2177} {"train_loss": -12.323188781738281, "global_step": 365814, "epoch": 2177} {"train_loss": -12.188594818115234, "global_step": 365815, "epoch": 2177} {"train_loss": -11.957420349121094, "global_step": 365816, "epoch": 2177} {"train_loss": -11.783146858215332, "global_step": 365817, "epoch": 2177} {"train_loss": -12.697221755981445, "global_step": 365818, "epoch": 2177} {"train_loss": -11.770854949951172, "global_step": 365819, "epoch": 2177} {"train_loss": -11.493293762207031, "global_step": 365820, "epoch": 2177} {"train_loss": -11.828460693359375, "global_step": 365821, "epoch": 2177} {"train_loss": -12.238590240478516, "global_step": 365822, "epoch": 2177} {"train_loss": -12.222294807434082, "global_step": 365823, "epoch": 2177} {"train_loss": -12.42048454284668, "global_step": 365824, "epoch": 2177} {"train_loss": -12.078024864196777, "global_step": 365825, "epoch": 2177} {"train_loss": -12.076099395751953, "global_step": 365826, "epoch": 2177} {"train_loss": -11.621326446533203, "global_step": 365827, "epoch": 2177} {"train_loss": -11.947148323059082, "global_step": 365828, "epoch": 2177} {"train_loss": -12.507457733154297, "global_step": 365829, "epoch": 2177} {"train_loss": -11.91560173034668, "global_step": 365830, "epoch": 2177} {"train_loss": -11.779571533203125, "global_step": 365831, "epoch": 2177} {"train_loss": -12.144859313964844, "global_step": 365832, "epoch": 2177} {"train_loss": -12.082079887390137, "global_step": 365833, "epoch": 2177} {"train_loss": -11.601200103759766, "global_step": 365834, "epoch": 2177} {"train_loss": -12.319900512695312, "global_step": 365835, "epoch": 2177} {"train_loss": -11.350062370300293, "global_step": 365836, "epoch": 2177} {"train_loss": -12.079866409301758, "global_step": 365837, "epoch": 2177} {"train_loss": -11.380406379699707, "global_step": 365838, "epoch": 2177} {"train_loss": -11.111701965332031, "global_step": 365839, "epoch": 2177} {"train_loss": -11.870179176330566, "global_step": 365840, "epoch": 2177} {"train_loss": -11.149127960205078, "global_step": 365841, "epoch": 2177} {"train_loss": -11.648791313171387, "global_step": 365842, "epoch": 2177} {"train_loss": -12.23530387878418, "global_step": 365843, "epoch": 2177} {"train_loss": -11.709514617919922, "global_step": 365844, "epoch": 2177} {"train_loss": -11.576372146606445, "global_step": 365845, "epoch": 2177} {"train_loss": -12.090044021606445, "global_step": 365846, "epoch": 2177} {"train_loss": -11.287099838256836, "global_step": 365847, "epoch": 2177} {"train_loss": -11.713434219360352, "global_step": 365848, "epoch": 2177} {"train_loss": -11.69575309753418, "global_step": 365849, "epoch": 2177} {"train_loss": -12.065492630004883, "global_step": 365850, "epoch": 2177} {"train_loss": -11.944951057434082, "global_step": 365851, "epoch": 2177} {"train_loss": -11.470836639404297, "global_step": 365852, "epoch": 2177} {"train_loss": -11.746048927307129, "global_step": 365853, "epoch": 2177} {"train_loss": -12.286628723144531, "global_step": 365854, "epoch": 2177} {"train_loss": -11.31489372253418, "global_step": 365855, "epoch": 2177} {"train_loss": -11.91729736328125, "global_step": 365856, "epoch": 2177} {"train_loss": -11.586174011230469, "global_step": 365857, "epoch": 2177} {"train_loss": -11.810014724731445, "global_step": 365858, "epoch": 2177} {"train_loss": -11.17547607421875, "global_step": 365859, "epoch": 2177} {"train_loss": -11.989655494689941, "global_step": 365860, "epoch": 2177} {"train_loss": -12.041189193725586, "global_step": 365861, "epoch": 2177} {"train_loss": -11.648523330688477, "global_step": 365862, "epoch": 2177} {"train_loss": -12.277036666870117, "global_step": 365863, "epoch": 2177} {"train_loss": -11.329343795776367, "global_step": 365864, "epoch": 2177} {"train_loss": -11.724611282348633, "global_step": 365865, "epoch": 2177} {"train_loss": -11.488340377807617, "global_step": 365866, "epoch": 2177} {"train_loss": -11.929017066955566, "global_step": 365867, "epoch": 2177} {"train_loss": -10.920125961303711, "global_step": 365868, "epoch": 2177} {"train_loss": -11.120183944702148, "global_step": 365869, "epoch": 2177} {"train_loss": -11.244057655334473, "global_step": 365870, "epoch": 2177} {"train_loss": -10.468070983886719, "global_step": 365871, "epoch": 2177} {"train_loss": -11.872201919555664, "global_step": 365872, "epoch": 2177} {"train_loss": -11.367918014526367, "global_step": 365873, "epoch": 2177} {"train_loss": -11.058431625366211, "global_step": 365874, "epoch": 2177} {"train_loss": -11.79393196105957, "global_step": 365875, "epoch": 2177} {"train_loss": -11.014578819274902, "global_step": 365876, "epoch": 2177} {"train_loss": -11.69153881072998, "global_step": 365877, "epoch": 2177} {"train_loss": -11.709409713745117, "global_step": 365878, "epoch": 2177} {"train_loss": -11.776752471923828, "global_step": 365879, "epoch": 2177} {"train_loss": -11.907242774963379, "global_step": 365880, "epoch": 2177} {"train_loss": -11.019691467285156, "global_step": 365881, "epoch": 2177} {"train_loss": -11.872047424316406, "global_step": 365882, "epoch": 2177} {"train_loss": -10.977099418640137, "global_step": 365883, "epoch": 2177} {"train_loss": -11.174482345581055, "global_step": 365884, "epoch": 2177} {"train_loss": -11.268775939941406, "global_step": 365885, "epoch": 2177} {"train_loss": -11.07118034362793, "global_step": 365886, "epoch": 2177} {"train_loss": -11.924928665161133, "global_step": 365887, "epoch": 2177} {"train_loss": -11.562531471252441, "global_step": 365888, "epoch": 2177} {"train_loss": -11.537250518798828, "global_step": 365889, "epoch": 2177} {"train_loss": -11.527837753295898, "global_step": 365890, "epoch": 2177} {"train_loss": -11.959014892578125, "global_step": 365891, "epoch": 2177} {"train_loss": -11.480192184448242, "global_step": 365892, "epoch": 2177} {"train_loss": -11.667686462402344, "global_step": 365893, "epoch": 2177} {"train_loss": -11.944530487060547, "global_step": 365894, "epoch": 2177} {"train_loss": -11.353971481323242, "global_step": 365895, "epoch": 2177} {"train_loss": -11.989107131958008, "global_step": 365896, "epoch": 2177} {"train_loss": -11.620681762695312, "global_step": 365897, "epoch": 2177} {"train_loss": -11.942499160766602, "global_step": 365898, "epoch": 2177} {"train_loss": -11.292895317077637, "global_step": 365899, "epoch": 2177} {"train_loss": -11.923087120056152, "global_step": 365900, "epoch": 2177} {"train_loss": -11.822212219238281, "global_step": 365901, "epoch": 2177} {"train_loss": -11.938887596130371, "global_step": 365902, "epoch": 2177} {"train_loss": -11.909965923854283, "global_step": 365903, "epoch": 2177, "val_loss": 291404.40625} {"train_loss": -11.535443305969238, "global_step": 365904, "epoch": 2178} {"train_loss": -12.218875885009766, "global_step": 365905, "epoch": 2178} {"train_loss": -12.049991607666016, "global_step": 365906, "epoch": 2178} {"train_loss": -12.291227340698242, "global_step": 365907, "epoch": 2178} {"train_loss": -12.110077857971191, "global_step": 365908, "epoch": 2178} {"train_loss": -12.1701021194458, "global_step": 365909, "epoch": 2178} {"train_loss": -12.317829132080078, "global_step": 365910, "epoch": 2178} {"train_loss": -12.60743522644043, "global_step": 365911, "epoch": 2178} {"train_loss": -12.230782508850098, "global_step": 365912, "epoch": 2178} {"train_loss": -12.676896095275879, "global_step": 365913, "epoch": 2178} {"train_loss": -12.27277660369873, "global_step": 365914, "epoch": 2178} {"train_loss": -12.298759460449219, "global_step": 365915, "epoch": 2178} {"train_loss": -12.452912330627441, "global_step": 365916, "epoch": 2178} {"train_loss": -12.414823532104492, "global_step": 365917, "epoch": 2178} {"train_loss": -12.221395492553711, "global_step": 365918, "epoch": 2178} {"train_loss": -12.255802154541016, "global_step": 365919, "epoch": 2178} {"train_loss": -12.274471282958984, "global_step": 365920, "epoch": 2178} {"train_loss": -12.047754287719727, "global_step": 365921, "epoch": 2178} {"train_loss": -12.145176887512207, "global_step": 365922, "epoch": 2178} {"train_loss": -12.339725494384766, "global_step": 365923, "epoch": 2178} {"train_loss": -12.05529499053955, "global_step": 365924, "epoch": 2178} {"train_loss": -12.310981750488281, "global_step": 365925, "epoch": 2178} {"train_loss": -12.31563949584961, "global_step": 365926, "epoch": 2178} {"train_loss": -12.250543594360352, "global_step": 365927, "epoch": 2178} {"train_loss": -12.26340103149414, "global_step": 365928, "epoch": 2178} {"train_loss": -12.289327621459961, "global_step": 365929, "epoch": 2178} {"train_loss": -12.340919494628906, "global_step": 365930, "epoch": 2178} {"train_loss": -12.484490394592285, "global_step": 365931, "epoch": 2178} {"train_loss": -12.197122573852539, "global_step": 365932, "epoch": 2178} {"train_loss": -12.500919342041016, "global_step": 365933, "epoch": 2178} {"train_loss": -12.40688419342041, "global_step": 365934, "epoch": 2178} {"train_loss": -12.392602920532227, "global_step": 365935, "epoch": 2178} {"train_loss": -12.461980819702148, "global_step": 365936, "epoch": 2178} {"train_loss": -12.364049911499023, "global_step": 365937, "epoch": 2178} {"train_loss": -12.392841339111328, "global_step": 365938, "epoch": 2178} {"train_loss": -12.266839027404785, "global_step": 365939, "epoch": 2178} {"train_loss": -12.65101432800293, "global_step": 365940, "epoch": 2178} {"train_loss": -12.572854042053223, "global_step": 365941, "epoch": 2178} {"train_loss": -12.501903533935547, "global_step": 365942, "epoch": 2178} {"train_loss": -12.54709243774414, "global_step": 365943, "epoch": 2178} {"train_loss": -12.631174087524414, "global_step": 365944, "epoch": 2178} {"train_loss": -12.451515197753906, "global_step": 365945, "epoch": 2178} {"train_loss": -12.559808731079102, "global_step": 365946, "epoch": 2178} {"train_loss": -12.792078018188477, "global_step": 365947, "epoch": 2178} {"train_loss": -12.463132858276367, "global_step": 365948, "epoch": 2178} {"train_loss": -12.626129150390625, "global_step": 365949, "epoch": 2178} {"train_loss": -12.578855514526367, "global_step": 365950, "epoch": 2178} {"train_loss": -12.37867259979248, "global_step": 365951, "epoch": 2178} {"train_loss": -12.682738304138184, "global_step": 365952, "epoch": 2178} {"train_loss": -12.572088241577148, "global_step": 365953, "epoch": 2178} {"train_loss": -12.597614288330078, "global_step": 365954, "epoch": 2178} {"train_loss": -12.654289245605469, "global_step": 365955, "epoch": 2178} {"train_loss": -12.670686721801758, "global_step": 365956, "epoch": 2178} {"train_loss": -12.744369506835938, "global_step": 365957, "epoch": 2178} {"train_loss": -12.804475784301758, "global_step": 365958, "epoch": 2178} {"train_loss": -12.458500862121582, "global_step": 365959, "epoch": 2178} {"train_loss": -12.836068153381348, "global_step": 365960, "epoch": 2178} {"train_loss": -12.734335899353027, "global_step": 365961, "epoch": 2178} {"train_loss": -12.776618957519531, "global_step": 365962, "epoch": 2178} {"train_loss": -12.687911987304688, "global_step": 365963, "epoch": 2178} {"train_loss": -12.833353042602539, "global_step": 365964, "epoch": 2178} {"train_loss": -12.743345260620117, "global_step": 365965, "epoch": 2178} {"train_loss": -12.489458084106445, "global_step": 365966, "epoch": 2178} {"train_loss": -12.474157333374023, "global_step": 365967, "epoch": 2178} {"train_loss": -12.684438705444336, "global_step": 365968, "epoch": 2178} {"train_loss": -12.584918022155762, "global_step": 365969, "epoch": 2178} {"train_loss": -11.929631233215332, "global_step": 365970, "epoch": 2178} {"train_loss": -12.494868278503418, "global_step": 365971, "epoch": 2178} {"train_loss": -12.659111022949219, "global_step": 365972, "epoch": 2178} {"train_loss": -11.979509353637695, "global_step": 365973, "epoch": 2178} {"train_loss": -12.037986755371094, "global_step": 365974, "epoch": 2178} {"train_loss": -12.678189277648926, "global_step": 365975, "epoch": 2178} {"train_loss": -12.791664123535156, "global_step": 365976, "epoch": 2178} {"train_loss": -12.086377143859863, "global_step": 365977, "epoch": 2178} {"train_loss": -11.906980514526367, "global_step": 365978, "epoch": 2178} {"train_loss": -12.273725509643555, "global_step": 365979, "epoch": 2178} {"train_loss": -12.136422157287598, "global_step": 365980, "epoch": 2178} {"train_loss": -10.32746696472168, "global_step": 365981, "epoch": 2178} {"train_loss": -12.326643943786621, "global_step": 365982, "epoch": 2178} {"train_loss": -9.99929428100586, "global_step": 365983, "epoch": 2178} {"train_loss": -12.14250659942627, "global_step": 365984, "epoch": 2178} {"train_loss": -12.053272247314453, "global_step": 365985, "epoch": 2178} {"train_loss": -11.368538856506348, "global_step": 365986, "epoch": 2178} {"train_loss": -12.084432601928711, "global_step": 365987, "epoch": 2178} {"train_loss": -12.324974060058594, "global_step": 365988, "epoch": 2178} {"train_loss": -12.086007118225098, "global_step": 365989, "epoch": 2178} {"train_loss": -11.589651107788086, "global_step": 365990, "epoch": 2178} {"train_loss": -12.313520431518555, "global_step": 365991, "epoch": 2178} {"train_loss": -12.333495140075684, "global_step": 365992, "epoch": 2178} {"train_loss": -12.233846664428711, "global_step": 365993, "epoch": 2178} {"train_loss": -12.213972091674805, "global_step": 365994, "epoch": 2178} {"train_loss": -11.787973403930664, "global_step": 365995, "epoch": 2178} {"train_loss": -12.139910697937012, "global_step": 365996, "epoch": 2178} {"train_loss": -11.61865520477295, "global_step": 365997, "epoch": 2178} {"train_loss": -9.270254135131836, "global_step": 365998, "epoch": 2178} {"train_loss": -9.86976432800293, "global_step": 365999, "epoch": 2178} {"train_loss": -12.01041316986084, "global_step": 366000, "epoch": 2178} {"train_loss": -9.354506492614746, "global_step": 366001, "epoch": 2178} {"train_loss": -9.896442413330078, "global_step": 366002, "epoch": 2178} {"train_loss": -10.47402286529541, "global_step": 366003, "epoch": 2178} {"train_loss": -10.05832290649414, "global_step": 366004, "epoch": 2178} {"train_loss": -11.33377742767334, "global_step": 366005, "epoch": 2178} {"train_loss": -10.607501983642578, "global_step": 366006, "epoch": 2178} {"train_loss": -10.99388313293457, "global_step": 366007, "epoch": 2178} {"train_loss": -12.024486541748047, "global_step": 366008, "epoch": 2178} {"train_loss": -11.008537292480469, "global_step": 366009, "epoch": 2178} {"train_loss": -11.083221435546875, "global_step": 366010, "epoch": 2178} {"train_loss": -11.684215545654297, "global_step": 366011, "epoch": 2178} {"train_loss": -11.373773574829102, "global_step": 366012, "epoch": 2178} {"train_loss": -11.571938514709473, "global_step": 366013, "epoch": 2178} {"train_loss": -11.636536598205566, "global_step": 366014, "epoch": 2178} {"train_loss": -11.901409149169922, "global_step": 366015, "epoch": 2178} {"train_loss": -11.73807144165039, "global_step": 366016, "epoch": 2178} {"train_loss": -11.850860595703125, "global_step": 366017, "epoch": 2178} {"train_loss": -11.091373443603516, "global_step": 366018, "epoch": 2178} {"train_loss": -12.055407524108887, "global_step": 366019, "epoch": 2178} {"train_loss": -11.389644622802734, "global_step": 366020, "epoch": 2178} {"train_loss": -11.474485397338867, "global_step": 366021, "epoch": 2178} {"train_loss": -11.208213806152344, "global_step": 366022, "epoch": 2178} {"train_loss": -11.123025894165039, "global_step": 366023, "epoch": 2178} {"train_loss": -11.336994171142578, "global_step": 366024, "epoch": 2178} {"train_loss": -11.303869247436523, "global_step": 366025, "epoch": 2178} {"train_loss": -11.591997146606445, "global_step": 366026, "epoch": 2178} {"train_loss": -11.511724472045898, "global_step": 366027, "epoch": 2178} {"train_loss": -12.042288780212402, "global_step": 366028, "epoch": 2178} {"train_loss": -11.55904483795166, "global_step": 366029, "epoch": 2178} {"train_loss": -12.175704956054688, "global_step": 366030, "epoch": 2178} {"train_loss": -11.814229965209961, "global_step": 366031, "epoch": 2178} {"train_loss": -11.842482566833496, "global_step": 366032, "epoch": 2178} {"train_loss": -11.876166343688965, "global_step": 366033, "epoch": 2178} {"train_loss": -11.987966537475586, "global_step": 366034, "epoch": 2178} {"train_loss": -11.995929718017578, "global_step": 366035, "epoch": 2178} {"train_loss": -12.017629623413086, "global_step": 366036, "epoch": 2178} {"train_loss": -11.953676223754883, "global_step": 366037, "epoch": 2178} {"train_loss": -11.476693153381348, "global_step": 366038, "epoch": 2178} {"train_loss": -11.769617080688477, "global_step": 366039, "epoch": 2178} {"train_loss": -11.32270622253418, "global_step": 366040, "epoch": 2178} {"train_loss": -12.253422737121582, "global_step": 366041, "epoch": 2178} {"train_loss": -11.328521728515625, "global_step": 366042, "epoch": 2178} {"train_loss": -12.12621784210205, "global_step": 366043, "epoch": 2178} {"train_loss": -12.000633239746094, "global_step": 366044, "epoch": 2178} {"train_loss": -11.898683547973633, "global_step": 366045, "epoch": 2178} {"train_loss": -11.783721923828125, "global_step": 366046, "epoch": 2178} {"train_loss": -11.760382652282715, "global_step": 366047, "epoch": 2178} {"train_loss": -12.239999771118164, "global_step": 366048, "epoch": 2178} {"train_loss": -11.67237663269043, "global_step": 366049, "epoch": 2178} {"train_loss": -12.167724609375, "global_step": 366050, "epoch": 2178} {"train_loss": -11.905696868896484, "global_step": 366051, "epoch": 2178} {"train_loss": -11.570812225341797, "global_step": 366052, "epoch": 2178} {"train_loss": -12.11845588684082, "global_step": 366053, "epoch": 2178} {"train_loss": -11.818533897399902, "global_step": 366054, "epoch": 2178} {"train_loss": -12.408157348632812, "global_step": 366055, "epoch": 2178} {"train_loss": -12.157313346862793, "global_step": 366056, "epoch": 2178} {"train_loss": -12.191488265991211, "global_step": 366057, "epoch": 2178} {"train_loss": -12.50164794921875, "global_step": 366058, "epoch": 2178} {"train_loss": -11.870052337646484, "global_step": 366059, "epoch": 2178} {"train_loss": -12.301372528076172, "global_step": 366060, "epoch": 2178} {"train_loss": -12.170677185058594, "global_step": 366061, "epoch": 2178} {"train_loss": -12.342062950134277, "global_step": 366062, "epoch": 2178} {"train_loss": -12.175765991210938, "global_step": 366063, "epoch": 2178} {"train_loss": -12.134941101074219, "global_step": 366064, "epoch": 2178} {"train_loss": -11.951181411743164, "global_step": 366065, "epoch": 2178} {"train_loss": -12.031147956848145, "global_step": 366066, "epoch": 2178} {"train_loss": -12.21165943145752, "global_step": 366067, "epoch": 2178} {"train_loss": -11.563695907592773, "global_step": 366068, "epoch": 2178} {"train_loss": -12.206501007080078, "global_step": 366069, "epoch": 2178} {"train_loss": -11.32952880859375, "global_step": 366070, "epoch": 2178} {"train_loss": -12.005073734692164, "global_step": 366071, "epoch": 2178, "val_loss": 292751.21875} {"train_loss": -11.996065139770508, "global_step": 366072, "epoch": 2179} {"train_loss": -12.155317306518555, "global_step": 366073, "epoch": 2179} {"train_loss": -12.381793975830078, "global_step": 366074, "epoch": 2179} {"train_loss": -12.121267318725586, "global_step": 366075, "epoch": 2179} {"train_loss": -12.109633445739746, "global_step": 366076, "epoch": 2179} {"train_loss": -12.329601287841797, "global_step": 366077, "epoch": 2179} {"train_loss": -12.139467239379883, "global_step": 366078, "epoch": 2179} {"train_loss": -12.380284309387207, "global_step": 366079, "epoch": 2179} {"train_loss": -12.069058418273926, "global_step": 366080, "epoch": 2179} {"train_loss": -12.345056533813477, "global_step": 366081, "epoch": 2179} {"train_loss": -12.154256820678711, "global_step": 366082, "epoch": 2179} {"train_loss": -12.140064239501953, "global_step": 366083, "epoch": 2179} {"train_loss": -11.98246955871582, "global_step": 366084, "epoch": 2179} {"train_loss": -12.449433326721191, "global_step": 366085, "epoch": 2179} {"train_loss": -12.522747039794922, "global_step": 366086, "epoch": 2179} {"train_loss": -12.453495979309082, "global_step": 366087, "epoch": 2179} {"train_loss": -12.55064582824707, "global_step": 366088, "epoch": 2179} {"train_loss": -12.665680885314941, "global_step": 366089, "epoch": 2179} {"train_loss": -12.495672225952148, "global_step": 366090, "epoch": 2179} {"train_loss": -12.748205184936523, "global_step": 366091, "epoch": 2179} {"train_loss": -12.589478492736816, "global_step": 366092, "epoch": 2179} {"train_loss": -12.390296936035156, "global_step": 366093, "epoch": 2179} {"train_loss": -12.47671890258789, "global_step": 366094, "epoch": 2179} {"train_loss": -12.385822296142578, "global_step": 366095, "epoch": 2179} {"train_loss": -12.511910438537598, "global_step": 366096, "epoch": 2179} {"train_loss": -12.377546310424805, "global_step": 366097, "epoch": 2179} {"train_loss": -12.07054328918457, "global_step": 366098, "epoch": 2179} {"train_loss": -12.39355182647705, "global_step": 366099, "epoch": 2179} {"train_loss": -12.349700927734375, "global_step": 366100, "epoch": 2179} {"train_loss": -11.596126556396484, "global_step": 366101, "epoch": 2179} {"train_loss": -12.449280738830566, "global_step": 366102, "epoch": 2179} {"train_loss": -12.273048400878906, "global_step": 366103, "epoch": 2179} {"train_loss": -11.99364948272705, "global_step": 366104, "epoch": 2179} {"train_loss": -12.266980171203613, "global_step": 366105, "epoch": 2179} {"train_loss": -11.960282325744629, "global_step": 366106, "epoch": 2179} {"train_loss": -12.498758316040039, "global_step": 366107, "epoch": 2179} {"train_loss": -12.28982162475586, "global_step": 366108, "epoch": 2179} {"train_loss": -12.235736846923828, "global_step": 366109, "epoch": 2179} {"train_loss": -12.327693939208984, "global_step": 366110, "epoch": 2179} {"train_loss": -12.468038558959961, "global_step": 366111, "epoch": 2179} {"train_loss": -12.544797897338867, "global_step": 366112, "epoch": 2179} {"train_loss": -12.18795394897461, "global_step": 366113, "epoch": 2179} {"train_loss": -12.412497520446777, "global_step": 366114, "epoch": 2179} {"train_loss": -12.196516036987305, "global_step": 366115, "epoch": 2179} {"train_loss": -12.753059387207031, "global_step": 366116, "epoch": 2179} {"train_loss": -12.223276138305664, "global_step": 366117, "epoch": 2179} {"train_loss": -12.019426345825195, "global_step": 366118, "epoch": 2179} {"train_loss": -12.264835357666016, "global_step": 366119, "epoch": 2179} {"train_loss": -12.602781295776367, "global_step": 366120, "epoch": 2179} {"train_loss": -11.979984283447266, "global_step": 366121, "epoch": 2179} {"train_loss": -12.340946197509766, "global_step": 366122, "epoch": 2179} {"train_loss": -12.223287582397461, "global_step": 366123, "epoch": 2179} {"train_loss": -12.643028259277344, "global_step": 366124, "epoch": 2179} {"train_loss": -12.19570541381836, "global_step": 366125, "epoch": 2179} {"train_loss": -12.576183319091797, "global_step": 366126, "epoch": 2179} {"train_loss": -12.218090057373047, "global_step": 366127, "epoch": 2179} {"train_loss": -12.663801193237305, "global_step": 366128, "epoch": 2179} {"train_loss": -12.351457595825195, "global_step": 366129, "epoch": 2179} {"train_loss": -12.573476791381836, "global_step": 366130, "epoch": 2179} {"train_loss": -12.307796478271484, "global_step": 366131, "epoch": 2179} {"train_loss": -12.346385955810547, "global_step": 366132, "epoch": 2179} {"train_loss": -12.730110168457031, "global_step": 366133, "epoch": 2179} {"train_loss": -12.206764221191406, "global_step": 366134, "epoch": 2179} {"train_loss": -12.40084457397461, "global_step": 366135, "epoch": 2179} {"train_loss": -12.430904388427734, "global_step": 366136, "epoch": 2179} {"train_loss": -12.162212371826172, "global_step": 366137, "epoch": 2179} {"train_loss": -11.900962829589844, "global_step": 366138, "epoch": 2179} {"train_loss": -12.287962913513184, "global_step": 366139, "epoch": 2179} {"train_loss": -12.345391273498535, "global_step": 366140, "epoch": 2179} {"train_loss": -11.538626670837402, "global_step": 366141, "epoch": 2179} {"train_loss": -12.087614059448242, "global_step": 366142, "epoch": 2179} {"train_loss": -12.109550476074219, "global_step": 366143, "epoch": 2179} {"train_loss": -12.47037124633789, "global_step": 366144, "epoch": 2179} {"train_loss": -12.602874755859375, "global_step": 366145, "epoch": 2179} {"train_loss": -12.457359313964844, "global_step": 366146, "epoch": 2179} {"train_loss": -12.53903579711914, "global_step": 366147, "epoch": 2179} {"train_loss": -12.473453521728516, "global_step": 366148, "epoch": 2179} {"train_loss": -12.188152313232422, "global_step": 366149, "epoch": 2179} {"train_loss": -11.707460403442383, "global_step": 366150, "epoch": 2179} {"train_loss": -12.308131217956543, "global_step": 366151, "epoch": 2179} {"train_loss": -12.486087799072266, "global_step": 366152, "epoch": 2179} {"train_loss": -11.811033248901367, "global_step": 366153, "epoch": 2179} {"train_loss": -11.972553253173828, "global_step": 366154, "epoch": 2179} {"train_loss": -12.194620132446289, "global_step": 366155, "epoch": 2179} {"train_loss": -12.617526054382324, "global_step": 366156, "epoch": 2179} {"train_loss": -12.02890396118164, "global_step": 366157, "epoch": 2179} {"train_loss": -12.666988372802734, "global_step": 366158, "epoch": 2179} {"train_loss": -12.29833984375, "global_step": 366159, "epoch": 2179} {"train_loss": -12.206109046936035, "global_step": 366160, "epoch": 2179} {"train_loss": -12.269896507263184, "global_step": 366161, "epoch": 2179} {"train_loss": -12.217443466186523, "global_step": 366162, "epoch": 2179} {"train_loss": -12.319178581237793, "global_step": 366163, "epoch": 2179} {"train_loss": -12.558795928955078, "global_step": 366164, "epoch": 2179} {"train_loss": -12.396275520324707, "global_step": 366165, "epoch": 2179} {"train_loss": -12.527017593383789, "global_step": 366166, "epoch": 2179} {"train_loss": -12.557405471801758, "global_step": 366167, "epoch": 2179} {"train_loss": -12.694517135620117, "global_step": 366168, "epoch": 2179} {"train_loss": -12.155342102050781, "global_step": 366169, "epoch": 2179} {"train_loss": -12.309757232666016, "global_step": 366170, "epoch": 2179} {"train_loss": -12.703659057617188, "global_step": 366171, "epoch": 2179} {"train_loss": -12.291402816772461, "global_step": 366172, "epoch": 2179} {"train_loss": -12.256874084472656, "global_step": 366173, "epoch": 2179} {"train_loss": -12.428417205810547, "global_step": 366174, "epoch": 2179} {"train_loss": -12.385199546813965, "global_step": 366175, "epoch": 2179} {"train_loss": -12.488824844360352, "global_step": 366176, "epoch": 2179} {"train_loss": -12.509058952331543, "global_step": 366177, "epoch": 2179} {"train_loss": -12.122714042663574, "global_step": 366178, "epoch": 2179} {"train_loss": -11.703706741333008, "global_step": 366179, "epoch": 2179} {"train_loss": -11.864757537841797, "global_step": 366180, "epoch": 2179} {"train_loss": -11.999685287475586, "global_step": 366181, "epoch": 2179} {"train_loss": -12.531211853027344, "global_step": 366182, "epoch": 2179} {"train_loss": -11.710859298706055, "global_step": 366183, "epoch": 2179} {"train_loss": -11.019038200378418, "global_step": 366184, "epoch": 2179} {"train_loss": -11.04125690460205, "global_step": 366185, "epoch": 2179} {"train_loss": -11.534433364868164, "global_step": 366186, "epoch": 2179} {"train_loss": -11.840579986572266, "global_step": 366187, "epoch": 2179} {"train_loss": -11.866162300109863, "global_step": 366188, "epoch": 2179} {"train_loss": -11.82297134399414, "global_step": 366189, "epoch": 2179} {"train_loss": -12.214094161987305, "global_step": 366190, "epoch": 2179} {"train_loss": -11.770402908325195, "global_step": 366191, "epoch": 2179} {"train_loss": -12.016006469726562, "global_step": 366192, "epoch": 2179} {"train_loss": -12.110309600830078, "global_step": 366193, "epoch": 2179} {"train_loss": -11.890968322753906, "global_step": 366194, "epoch": 2179} {"train_loss": -11.529321670532227, "global_step": 366195, "epoch": 2179} {"train_loss": -11.816471099853516, "global_step": 366196, "epoch": 2179} {"train_loss": -11.653311729431152, "global_step": 366197, "epoch": 2179} {"train_loss": -11.710758209228516, "global_step": 366198, "epoch": 2179} {"train_loss": -10.202032089233398, "global_step": 366199, "epoch": 2179} {"train_loss": -11.742953300476074, "global_step": 366200, "epoch": 2179} {"train_loss": -10.2490234375, "global_step": 366201, "epoch": 2179} {"train_loss": -10.831781387329102, "global_step": 366202, "epoch": 2179} {"train_loss": -11.272078514099121, "global_step": 366203, "epoch": 2179} {"train_loss": -11.227364540100098, "global_step": 366204, "epoch": 2179} {"train_loss": -11.690350532531738, "global_step": 366205, "epoch": 2179} {"train_loss": -11.321561813354492, "global_step": 366206, "epoch": 2179} {"train_loss": -11.728659629821777, "global_step": 366207, "epoch": 2179} {"train_loss": -11.797712326049805, "global_step": 366208, "epoch": 2179} {"train_loss": -11.546977996826172, "global_step": 366209, "epoch": 2179} {"train_loss": -12.282400131225586, "global_step": 366210, "epoch": 2179} {"train_loss": -11.504182815551758, "global_step": 366211, "epoch": 2179} {"train_loss": -12.108244895935059, "global_step": 366212, "epoch": 2179} {"train_loss": -11.702656745910645, "global_step": 366213, "epoch": 2179} {"train_loss": -12.394207954406738, "global_step": 366214, "epoch": 2179} {"train_loss": -11.59249496459961, "global_step": 366215, "epoch": 2179} {"train_loss": -12.149068832397461, "global_step": 366216, "epoch": 2179} {"train_loss": -11.950235366821289, "global_step": 366217, "epoch": 2179} {"train_loss": -12.21447467803955, "global_step": 366218, "epoch": 2179} {"train_loss": -11.815101623535156, "global_step": 366219, "epoch": 2179} {"train_loss": -12.102863311767578, "global_step": 366220, "epoch": 2179} {"train_loss": -11.984271049499512, "global_step": 366221, "epoch": 2179} {"train_loss": -12.011783599853516, "global_step": 366222, "epoch": 2179} {"train_loss": -11.96784782409668, "global_step": 366223, "epoch": 2179} {"train_loss": -12.119643211364746, "global_step": 366224, "epoch": 2179} {"train_loss": -11.956337928771973, "global_step": 366225, "epoch": 2179} {"train_loss": -12.272187232971191, "global_step": 366226, "epoch": 2179} {"train_loss": -11.617713928222656, "global_step": 366227, "epoch": 2179} {"train_loss": -12.1630859375, "global_step": 366228, "epoch": 2179} {"train_loss": -11.66862678527832, "global_step": 366229, "epoch": 2179} {"train_loss": -12.281978607177734, "global_step": 366230, "epoch": 2179} {"train_loss": -11.997184753417969, "global_step": 366231, "epoch": 2179} {"train_loss": -12.05435562133789, "global_step": 366232, "epoch": 2179} {"train_loss": -11.23531723022461, "global_step": 366233, "epoch": 2179} {"train_loss": -11.590113639831543, "global_step": 366234, "epoch": 2179} {"train_loss": -11.689380645751953, "global_step": 366235, "epoch": 2179} {"train_loss": -11.704534530639648, "global_step": 366236, "epoch": 2179} {"train_loss": -12.187582969665527, "global_step": 366237, "epoch": 2179} {"train_loss": -11.553206443786621, "global_step": 366238, "epoch": 2179} {"train_loss": -12.11643750326974, "global_step": 366239, "epoch": 2179, "val_loss": 292236.65625} {"train_loss": -12.125154495239258, "global_step": 366240, "epoch": 2180} {"train_loss": -12.273334503173828, "global_step": 366241, "epoch": 2180} {"train_loss": -12.152250289916992, "global_step": 366242, "epoch": 2180} {"train_loss": -11.68012523651123, "global_step": 366243, "epoch": 2180} {"train_loss": -12.293638229370117, "global_step": 366244, "epoch": 2180} {"train_loss": -11.504903793334961, "global_step": 366245, "epoch": 2180} {"train_loss": -12.186342239379883, "global_step": 366246, "epoch": 2180} {"train_loss": -11.987013816833496, "global_step": 366247, "epoch": 2180} {"train_loss": -11.897541046142578, "global_step": 366248, "epoch": 2180} {"train_loss": -12.104061126708984, "global_step": 366249, "epoch": 2180} {"train_loss": -11.610898971557617, "global_step": 366250, "epoch": 2180} {"train_loss": -12.098505973815918, "global_step": 366251, "epoch": 2180} {"train_loss": -11.625490188598633, "global_step": 366252, "epoch": 2180} {"train_loss": -12.036941528320312, "global_step": 366253, "epoch": 2180} {"train_loss": -12.021127700805664, "global_step": 366254, "epoch": 2180} {"train_loss": -12.515008926391602, "global_step": 366255, "epoch": 2180} {"train_loss": -12.130799293518066, "global_step": 366256, "epoch": 2180} {"train_loss": -12.145586967468262, "global_step": 366257, "epoch": 2180} {"train_loss": -12.13302230834961, "global_step": 366258, "epoch": 2180} {"train_loss": -12.363533020019531, "global_step": 366259, "epoch": 2180} {"train_loss": -12.04541301727295, "global_step": 366260, "epoch": 2180} {"train_loss": -12.177946090698242, "global_step": 366261, "epoch": 2180} {"train_loss": -12.389129638671875, "global_step": 366262, "epoch": 2180} {"train_loss": -12.295003890991211, "global_step": 366263, "epoch": 2180} {"train_loss": -12.362107276916504, "global_step": 366264, "epoch": 2180} {"train_loss": -12.536877632141113, "global_step": 366265, "epoch": 2180} {"train_loss": -12.560333251953125, "global_step": 366266, "epoch": 2180} {"train_loss": -12.427796363830566, "global_step": 366267, "epoch": 2180} {"train_loss": -12.451748847961426, "global_step": 366268, "epoch": 2180} {"train_loss": -12.230695724487305, "global_step": 366269, "epoch": 2180} {"train_loss": -12.368942260742188, "global_step": 366270, "epoch": 2180} {"train_loss": -12.771442413330078, "global_step": 366271, "epoch": 2180} {"train_loss": -12.42748737335205, "global_step": 366272, "epoch": 2180} {"train_loss": -12.615100860595703, "global_step": 366273, "epoch": 2180} {"train_loss": -12.152532577514648, "global_step": 366274, "epoch": 2180} {"train_loss": -12.465865135192871, "global_step": 366275, "epoch": 2180} {"train_loss": -12.24887752532959, "global_step": 366276, "epoch": 2180} {"train_loss": -11.91877555847168, "global_step": 366277, "epoch": 2180} {"train_loss": -12.22357177734375, "global_step": 366278, "epoch": 2180} {"train_loss": -11.997398376464844, "global_step": 366279, "epoch": 2180} {"train_loss": -12.415074348449707, "global_step": 366280, "epoch": 2180} {"train_loss": -11.335819244384766, "global_step": 366281, "epoch": 2180} {"train_loss": -11.899116516113281, "global_step": 366282, "epoch": 2180} {"train_loss": -12.214653968811035, "global_step": 366283, "epoch": 2180} {"train_loss": -12.208154678344727, "global_step": 366284, "epoch": 2180} {"train_loss": -12.411886215209961, "global_step": 366285, "epoch": 2180} {"train_loss": -11.930545806884766, "global_step": 366286, "epoch": 2180} {"train_loss": -12.012002944946289, "global_step": 366287, "epoch": 2180} {"train_loss": -12.459123611450195, "global_step": 366288, "epoch": 2180} {"train_loss": -11.25249195098877, "global_step": 366289, "epoch": 2180} {"train_loss": -12.024134635925293, "global_step": 366290, "epoch": 2180} {"train_loss": -12.401243209838867, "global_step": 366291, "epoch": 2180} {"train_loss": -12.048982620239258, "global_step": 366292, "epoch": 2180} {"train_loss": -12.179070472717285, "global_step": 366293, "epoch": 2180} {"train_loss": -12.329268455505371, "global_step": 366294, "epoch": 2180} {"train_loss": -12.206303596496582, "global_step": 366295, "epoch": 2180} {"train_loss": -12.270122528076172, "global_step": 366296, "epoch": 2180} {"train_loss": -12.47292709350586, "global_step": 366297, "epoch": 2180} {"train_loss": -11.867494583129883, "global_step": 366298, "epoch": 2180} {"train_loss": -12.151357650756836, "global_step": 366299, "epoch": 2180} {"train_loss": -12.56511116027832, "global_step": 366300, "epoch": 2180} {"train_loss": -11.854630470275879, "global_step": 366301, "epoch": 2180} {"train_loss": -12.50921630859375, "global_step": 366302, "epoch": 2180} {"train_loss": -12.239034652709961, "global_step": 366303, "epoch": 2180} {"train_loss": -12.28592586517334, "global_step": 366304, "epoch": 2180} {"train_loss": -12.451715469360352, "global_step": 366305, "epoch": 2180} {"train_loss": -12.218734741210938, "global_step": 366306, "epoch": 2180} {"train_loss": -12.243194580078125, "global_step": 366307, "epoch": 2180} {"train_loss": -12.34970760345459, "global_step": 366308, "epoch": 2180} {"train_loss": -11.78787612915039, "global_step": 366309, "epoch": 2180} {"train_loss": -11.949825286865234, "global_step": 366310, "epoch": 2180} {"train_loss": -11.350359916687012, "global_step": 366311, "epoch": 2180} {"train_loss": -12.221385955810547, "global_step": 366312, "epoch": 2180} {"train_loss": -11.653463363647461, "global_step": 366313, "epoch": 2180} {"train_loss": -11.682450294494629, "global_step": 366314, "epoch": 2180} {"train_loss": -12.506324768066406, "global_step": 366315, "epoch": 2180} {"train_loss": -11.805809020996094, "global_step": 366316, "epoch": 2180} {"train_loss": -12.131998062133789, "global_step": 366317, "epoch": 2180} {"train_loss": -12.008140563964844, "global_step": 366318, "epoch": 2180} {"train_loss": -12.39999008178711, "global_step": 366319, "epoch": 2180} {"train_loss": -11.501214981079102, "global_step": 366320, "epoch": 2180} {"train_loss": -12.059225082397461, "global_step": 366321, "epoch": 2180} {"train_loss": -12.31587028503418, "global_step": 366322, "epoch": 2180} {"train_loss": -11.632808685302734, "global_step": 366323, "epoch": 2180} {"train_loss": -12.00536823272705, "global_step": 366324, "epoch": 2180} {"train_loss": -12.040325164794922, "global_step": 366325, "epoch": 2180} {"train_loss": -12.195564270019531, "global_step": 366326, "epoch": 2180} {"train_loss": -11.956623077392578, "global_step": 366327, "epoch": 2180} {"train_loss": -12.563582420349121, "global_step": 366328, "epoch": 2180} {"train_loss": -11.912290573120117, "global_step": 366329, "epoch": 2180} {"train_loss": -12.211252212524414, "global_step": 366330, "epoch": 2180} {"train_loss": -12.06206226348877, "global_step": 366331, "epoch": 2180} {"train_loss": -12.227203369140625, "global_step": 366332, "epoch": 2180} {"train_loss": -11.960012435913086, "global_step": 366333, "epoch": 2180} {"train_loss": -12.356391906738281, "global_step": 366334, "epoch": 2180} {"train_loss": -11.68274211883545, "global_step": 366335, "epoch": 2180} {"train_loss": -12.399192810058594, "global_step": 366336, "epoch": 2180} {"train_loss": -11.918365478515625, "global_step": 366337, "epoch": 2180} {"train_loss": -12.009203910827637, "global_step": 366338, "epoch": 2180} {"train_loss": -12.304834365844727, "global_step": 366339, "epoch": 2180} {"train_loss": -12.055230140686035, "global_step": 366340, "epoch": 2180} {"train_loss": -12.626544952392578, "global_step": 366341, "epoch": 2180} {"train_loss": -12.10807991027832, "global_step": 366342, "epoch": 2180} {"train_loss": -12.203319549560547, "global_step": 366343, "epoch": 2180} {"train_loss": -12.40431022644043, "global_step": 366344, "epoch": 2180} {"train_loss": -12.327747344970703, "global_step": 366345, "epoch": 2180} {"train_loss": -12.130051612854004, "global_step": 366346, "epoch": 2180} {"train_loss": -12.30605697631836, "global_step": 366347, "epoch": 2180} {"train_loss": -12.1422700881958, "global_step": 366348, "epoch": 2180} {"train_loss": -11.844852447509766, "global_step": 366349, "epoch": 2180} {"train_loss": -12.132863998413086, "global_step": 366350, "epoch": 2180} {"train_loss": -10.586078643798828, "global_step": 366351, "epoch": 2180} {"train_loss": -11.112525939941406, "global_step": 366352, "epoch": 2180} {"train_loss": -11.91071605682373, "global_step": 366353, "epoch": 2180} {"train_loss": -11.627992630004883, "global_step": 366354, "epoch": 2180} {"train_loss": -10.721017837524414, "global_step": 366355, "epoch": 2180} {"train_loss": -11.358784675598145, "global_step": 366356, "epoch": 2180} {"train_loss": -10.212226867675781, "global_step": 366357, "epoch": 2180} {"train_loss": -11.112822532653809, "global_step": 366358, "epoch": 2180} {"train_loss": -10.910361289978027, "global_step": 366359, "epoch": 2180} {"train_loss": -11.38920783996582, "global_step": 366360, "epoch": 2180} {"train_loss": -11.489044189453125, "global_step": 366361, "epoch": 2180} {"train_loss": -11.831791877746582, "global_step": 366362, "epoch": 2180} {"train_loss": -11.797675132751465, "global_step": 366363, "epoch": 2180} {"train_loss": -11.69642448425293, "global_step": 366364, "epoch": 2180} {"train_loss": -12.23000717163086, "global_step": 366365, "epoch": 2180} {"train_loss": -11.94552230834961, "global_step": 366366, "epoch": 2180} {"train_loss": -11.901342391967773, "global_step": 366367, "epoch": 2180} {"train_loss": -11.902856826782227, "global_step": 366368, "epoch": 2180} {"train_loss": -12.178998947143555, "global_step": 366369, "epoch": 2180} {"train_loss": -11.672969818115234, "global_step": 366370, "epoch": 2180} {"train_loss": -11.249393463134766, "global_step": 366371, "epoch": 2180} {"train_loss": -11.442806243896484, "global_step": 366372, "epoch": 2180} {"train_loss": -11.333276748657227, "global_step": 366373, "epoch": 2180} {"train_loss": -10.84545612335205, "global_step": 366374, "epoch": 2180} {"train_loss": -11.242422103881836, "global_step": 366375, "epoch": 2180} {"train_loss": -9.912067413330078, "global_step": 366376, "epoch": 2180} {"train_loss": -11.15949821472168, "global_step": 366377, "epoch": 2180} {"train_loss": -10.297698020935059, "global_step": 366378, "epoch": 2180} {"train_loss": -9.379721641540527, "global_step": 366379, "epoch": 2180} {"train_loss": -8.060138702392578, "global_step": 366380, "epoch": 2180} {"train_loss": -8.993032455444336, "global_step": 366381, "epoch": 2180} {"train_loss": -9.460603713989258, "global_step": 366382, "epoch": 2180} {"train_loss": -10.96159553527832, "global_step": 366383, "epoch": 2180} {"train_loss": -9.335058212280273, "global_step": 366384, "epoch": 2180} {"train_loss": -9.982904434204102, "global_step": 366385, "epoch": 2180} {"train_loss": -10.957490921020508, "global_step": 366386, "epoch": 2180} {"train_loss": -9.791467666625977, "global_step": 366387, "epoch": 2180} {"train_loss": -10.39599895477295, "global_step": 366388, "epoch": 2180} {"train_loss": -10.847140312194824, "global_step": 366389, "epoch": 2180} {"train_loss": -10.346905708312988, "global_step": 366390, "epoch": 2180} {"train_loss": -9.188065528869629, "global_step": 366391, "epoch": 2180} {"train_loss": -10.757757186889648, "global_step": 366392, "epoch": 2180} {"train_loss": -9.837654113769531, "global_step": 366393, "epoch": 2180} {"train_loss": -9.550058364868164, "global_step": 366394, "epoch": 2180} {"train_loss": -10.540277481079102, "global_step": 366395, "epoch": 2180} {"train_loss": -10.985026359558105, "global_step": 366396, "epoch": 2180} {"train_loss": -9.665204048156738, "global_step": 366397, "epoch": 2180} {"train_loss": -11.045557022094727, "global_step": 366398, "epoch": 2180} {"train_loss": -11.03874397277832, "global_step": 366399, "epoch": 2180} {"train_loss": -10.733787536621094, "global_step": 366400, "epoch": 2180} {"train_loss": -11.741920471191406, "global_step": 366401, "epoch": 2180} {"train_loss": -11.322545051574707, "global_step": 366402, "epoch": 2180} {"train_loss": -11.0120849609375, "global_step": 366403, "epoch": 2180} {"train_loss": -11.649415969848633, "global_step": 366404, "epoch": 2180} {"train_loss": -10.886964797973633, "global_step": 366405, "epoch": 2180} {"train_loss": -11.33802604675293, "global_step": 366406, "epoch": 2180} {"train_loss": -11.702366658619471, "global_step": 366407, "epoch": 2180, "val_loss": 283731.40625, "train_action_mse_error": 5.979158878326416} {"train_loss": -11.002508163452148, "global_step": 366408, "epoch": 2181} {"train_loss": -11.805384635925293, "global_step": 366409, "epoch": 2181} {"train_loss": -11.333577156066895, "global_step": 366410, "epoch": 2181} {"train_loss": -11.678680419921875, "global_step": 366411, "epoch": 2181} {"train_loss": -11.420549392700195, "global_step": 366412, "epoch": 2181} {"train_loss": -11.105249404907227, "global_step": 366413, "epoch": 2181} {"train_loss": -11.622405052185059, "global_step": 366414, "epoch": 2181} {"train_loss": -11.486002922058105, "global_step": 366415, "epoch": 2181} {"train_loss": -11.50503921508789, "global_step": 366416, "epoch": 2181} {"train_loss": -11.805927276611328, "global_step": 366417, "epoch": 2181} {"train_loss": -11.475658416748047, "global_step": 366418, "epoch": 2181} {"train_loss": -11.741451263427734, "global_step": 366419, "epoch": 2181} {"train_loss": -11.852079391479492, "global_step": 366420, "epoch": 2181} {"train_loss": -11.923521041870117, "global_step": 366421, "epoch": 2181} {"train_loss": -11.895341873168945, "global_step": 366422, "epoch": 2181} {"train_loss": -11.791937828063965, "global_step": 366423, "epoch": 2181} {"train_loss": -12.175135612487793, "global_step": 366424, "epoch": 2181} {"train_loss": -11.86569595336914, "global_step": 366425, "epoch": 2181} {"train_loss": -12.121540069580078, "global_step": 366426, "epoch": 2181} {"train_loss": -12.048956871032715, "global_step": 366427, "epoch": 2181} {"train_loss": -12.099294662475586, "global_step": 366428, "epoch": 2181} {"train_loss": -11.817720413208008, "global_step": 366429, "epoch": 2181} {"train_loss": -11.92687702178955, "global_step": 366430, "epoch": 2181} {"train_loss": -11.81078815460205, "global_step": 366431, "epoch": 2181} {"train_loss": -12.313820838928223, "global_step": 366432, "epoch": 2181} {"train_loss": -11.809135437011719, "global_step": 366433, "epoch": 2181} {"train_loss": -12.157159805297852, "global_step": 366434, "epoch": 2181} {"train_loss": -11.897109031677246, "global_step": 366435, "epoch": 2181} {"train_loss": -12.23251724243164, "global_step": 366436, "epoch": 2181} {"train_loss": -11.915964126586914, "global_step": 366437, "epoch": 2181} {"train_loss": -12.114091873168945, "global_step": 366438, "epoch": 2181} {"train_loss": -11.918103218078613, "global_step": 366439, "epoch": 2181} {"train_loss": -12.324275970458984, "global_step": 366440, "epoch": 2181} {"train_loss": -12.079346656799316, "global_step": 366441, "epoch": 2181} {"train_loss": -12.315317153930664, "global_step": 366442, "epoch": 2181} {"train_loss": -12.058767318725586, "global_step": 366443, "epoch": 2181} {"train_loss": -12.301469802856445, "global_step": 366444, "epoch": 2181} {"train_loss": -12.226784706115723, "global_step": 366445, "epoch": 2181} {"train_loss": -12.263543128967285, "global_step": 366446, "epoch": 2181} {"train_loss": -12.176885604858398, "global_step": 366447, "epoch": 2181} {"train_loss": -12.311083793640137, "global_step": 366448, "epoch": 2181} {"train_loss": -12.294422149658203, "global_step": 366449, "epoch": 2181} {"train_loss": -12.25021743774414, "global_step": 366450, "epoch": 2181} {"train_loss": -12.102523803710938, "global_step": 366451, "epoch": 2181} {"train_loss": -12.320069313049316, "global_step": 366452, "epoch": 2181} {"train_loss": -12.419066429138184, "global_step": 366453, "epoch": 2181} {"train_loss": -12.372102737426758, "global_step": 366454, "epoch": 2181} {"train_loss": -12.334662437438965, "global_step": 366455, "epoch": 2181} {"train_loss": -12.044554710388184, "global_step": 366456, "epoch": 2181} {"train_loss": -12.42691421508789, "global_step": 366457, "epoch": 2181} {"train_loss": -12.045207023620605, "global_step": 366458, "epoch": 2181} {"train_loss": -12.345868110656738, "global_step": 366459, "epoch": 2181} {"train_loss": -12.423038482666016, "global_step": 366460, "epoch": 2181} {"train_loss": -12.222387313842773, "global_step": 366461, "epoch": 2181} {"train_loss": -12.318635940551758, "global_step": 366462, "epoch": 2181} {"train_loss": -12.118047714233398, "global_step": 366463, "epoch": 2181} {"train_loss": -12.326730728149414, "global_step": 366464, "epoch": 2181} {"train_loss": -12.204435348510742, "global_step": 366465, "epoch": 2181} {"train_loss": -12.166597366333008, "global_step": 366466, "epoch": 2181} {"train_loss": -12.207578659057617, "global_step": 366467, "epoch": 2181} {"train_loss": -12.267261505126953, "global_step": 366468, "epoch": 2181} {"train_loss": -12.375524520874023, "global_step": 366469, "epoch": 2181} {"train_loss": -12.323974609375, "global_step": 366470, "epoch": 2181} {"train_loss": -12.285836219787598, "global_step": 366471, "epoch": 2181} {"train_loss": -12.384955406188965, "global_step": 366472, "epoch": 2181} {"train_loss": -12.214252471923828, "global_step": 366473, "epoch": 2181} {"train_loss": -12.34998893737793, "global_step": 366474, "epoch": 2181} {"train_loss": -12.290401458740234, "global_step": 366475, "epoch": 2181} {"train_loss": -12.482429504394531, "global_step": 366476, "epoch": 2181} {"train_loss": -12.378132820129395, "global_step": 366477, "epoch": 2181} {"train_loss": -12.421112060546875, "global_step": 366478, "epoch": 2181} {"train_loss": -12.133744239807129, "global_step": 366479, "epoch": 2181} {"train_loss": -12.435901641845703, "global_step": 366480, "epoch": 2181} {"train_loss": -12.558887481689453, "global_step": 366481, "epoch": 2181} {"train_loss": -12.651676177978516, "global_step": 366482, "epoch": 2181} {"train_loss": -12.379888534545898, "global_step": 366483, "epoch": 2181} {"train_loss": -12.600913047790527, "global_step": 366484, "epoch": 2181} {"train_loss": -12.534738540649414, "global_step": 366485, "epoch": 2181} {"train_loss": -12.446803092956543, "global_step": 366486, "epoch": 2181} {"train_loss": -12.584858894348145, "global_step": 366487, "epoch": 2181} {"train_loss": -12.577410697937012, "global_step": 366488, "epoch": 2181} {"train_loss": -12.533960342407227, "global_step": 366489, "epoch": 2181} {"train_loss": -12.333030700683594, "global_step": 366490, "epoch": 2181} {"train_loss": -12.591291427612305, "global_step": 366491, "epoch": 2181} {"train_loss": -12.629459381103516, "global_step": 366492, "epoch": 2181} {"train_loss": -12.791655540466309, "global_step": 366493, "epoch": 2181} {"train_loss": -12.734221458435059, "global_step": 366494, "epoch": 2181} {"train_loss": -12.797574996948242, "global_step": 366495, "epoch": 2181} {"train_loss": -12.732450485229492, "global_step": 366496, "epoch": 2181} {"train_loss": -12.4659423828125, "global_step": 366497, "epoch": 2181} {"train_loss": -12.486631393432617, "global_step": 366498, "epoch": 2181} {"train_loss": -12.796290397644043, "global_step": 366499, "epoch": 2181} {"train_loss": -12.743781089782715, "global_step": 366500, "epoch": 2181} {"train_loss": -12.100500106811523, "global_step": 366501, "epoch": 2181} {"train_loss": -12.561561584472656, "global_step": 366502, "epoch": 2181} {"train_loss": -12.682859420776367, "global_step": 366503, "epoch": 2181} {"train_loss": -12.65113639831543, "global_step": 366504, "epoch": 2181} {"train_loss": -12.534521102905273, "global_step": 366505, "epoch": 2181} {"train_loss": -12.783231735229492, "global_step": 366506, "epoch": 2181} {"train_loss": -12.467768669128418, "global_step": 366507, "epoch": 2181} {"train_loss": -12.739419937133789, "global_step": 366508, "epoch": 2181} {"train_loss": -12.642766952514648, "global_step": 366509, "epoch": 2181} {"train_loss": -12.854147911071777, "global_step": 366510, "epoch": 2181} {"train_loss": -12.770841598510742, "global_step": 366511, "epoch": 2181} {"train_loss": -12.58206558227539, "global_step": 366512, "epoch": 2181} {"train_loss": -12.762382507324219, "global_step": 366513, "epoch": 2181} {"train_loss": -12.479997634887695, "global_step": 366514, "epoch": 2181} {"train_loss": -12.771099090576172, "global_step": 366515, "epoch": 2181} {"train_loss": -12.879439353942871, "global_step": 366516, "epoch": 2181} {"train_loss": -12.87228775024414, "global_step": 366517, "epoch": 2181} {"train_loss": -12.773777961730957, "global_step": 366518, "epoch": 2181} {"train_loss": -12.603303909301758, "global_step": 366519, "epoch": 2181} {"train_loss": -12.575276374816895, "global_step": 366520, "epoch": 2181} {"train_loss": -11.761970520019531, "global_step": 366521, "epoch": 2181} {"train_loss": -12.253377914428711, "global_step": 366522, "epoch": 2181} {"train_loss": -12.396590232849121, "global_step": 366523, "epoch": 2181} {"train_loss": -12.743891716003418, "global_step": 366524, "epoch": 2181} {"train_loss": -12.460139274597168, "global_step": 366525, "epoch": 2181} {"train_loss": -12.303784370422363, "global_step": 366526, "epoch": 2181} {"train_loss": -11.670512199401855, "global_step": 366527, "epoch": 2181} {"train_loss": -11.813838005065918, "global_step": 366528, "epoch": 2181} {"train_loss": -12.3164701461792, "global_step": 366529, "epoch": 2181} {"train_loss": -12.188644409179688, "global_step": 366530, "epoch": 2181} {"train_loss": -11.406442642211914, "global_step": 366531, "epoch": 2181} {"train_loss": -10.311956405639648, "global_step": 366532, "epoch": 2181} {"train_loss": -11.171768188476562, "global_step": 366533, "epoch": 2181} {"train_loss": -10.32268238067627, "global_step": 366534, "epoch": 2181} {"train_loss": -8.348146438598633, "global_step": 366535, "epoch": 2181} {"train_loss": -11.024297714233398, "global_step": 366536, "epoch": 2181} {"train_loss": -7.549470901489258, "global_step": 366537, "epoch": 2181} {"train_loss": -6.796860218048096, "global_step": 366538, "epoch": 2181} {"train_loss": -5.908457279205322, "global_step": 366539, "epoch": 2181} {"train_loss": -6.376381874084473, "global_step": 366540, "epoch": 2181} {"train_loss": -7.169979572296143, "global_step": 366541, "epoch": 2181} {"train_loss": -6.659806251525879, "global_step": 366542, "epoch": 2181} {"train_loss": -6.681073188781738, "global_step": 366543, "epoch": 2181} {"train_loss": -7.127397060394287, "global_step": 366544, "epoch": 2181} {"train_loss": -6.519675254821777, "global_step": 366545, "epoch": 2181} {"train_loss": -7.645359039306641, "global_step": 366546, "epoch": 2181} {"train_loss": -6.87702751159668, "global_step": 366547, "epoch": 2181} {"train_loss": -7.392408847808838, "global_step": 366548, "epoch": 2181} {"train_loss": -7.134659767150879, "global_step": 366549, "epoch": 2181} {"train_loss": -7.681944370269775, "global_step": 366550, "epoch": 2181} {"train_loss": -7.500515937805176, "global_step": 366551, "epoch": 2181} {"train_loss": -8.49007797241211, "global_step": 366552, "epoch": 2181} {"train_loss": -7.423092842102051, "global_step": 366553, "epoch": 2181} {"train_loss": -8.293479919433594, "global_step": 366554, "epoch": 2181} {"train_loss": -8.019411087036133, "global_step": 366555, "epoch": 2181} {"train_loss": -8.441180229187012, "global_step": 366556, "epoch": 2181} {"train_loss": -8.174458503723145, "global_step": 366557, "epoch": 2181} {"train_loss": -8.570276260375977, "global_step": 366558, "epoch": 2181} {"train_loss": -8.748576164245605, "global_step": 366559, "epoch": 2181} {"train_loss": -8.313934326171875, "global_step": 366560, "epoch": 2181} {"train_loss": -9.19713306427002, "global_step": 366561, "epoch": 2181} {"train_loss": -7.842504501342773, "global_step": 366562, "epoch": 2181} {"train_loss": -8.498794555664062, "global_step": 366563, "epoch": 2181} {"train_loss": -9.572809219360352, "global_step": 366564, "epoch": 2181} {"train_loss": -8.716096878051758, "global_step": 366565, "epoch": 2181} {"train_loss": -8.711642265319824, "global_step": 366566, "epoch": 2181} {"train_loss": -8.55589485168457, "global_step": 366567, "epoch": 2181} {"train_loss": -9.011470794677734, "global_step": 366568, "epoch": 2181} {"train_loss": -9.038148880004883, "global_step": 366569, "epoch": 2181} {"train_loss": -9.217912673950195, "global_step": 366570, "epoch": 2181} {"train_loss": -9.176214218139648, "global_step": 366571, "epoch": 2181} {"train_loss": -9.277044296264648, "global_step": 366572, "epoch": 2181} {"train_loss": -9.524612426757812, "global_step": 366573, "epoch": 2181} {"train_loss": -9.085283279418945, "global_step": 366574, "epoch": 2181} {"train_loss": -11.222904528890338, "global_step": 366575, "epoch": 2181, "val_loss": 289048.6875} {"train_loss": -9.531994819641113, "global_step": 366576, "epoch": 2182} {"train_loss": -9.608131408691406, "global_step": 366577, "epoch": 2182} {"train_loss": -9.738603591918945, "global_step": 366578, "epoch": 2182} {"train_loss": -9.922833442687988, "global_step": 366579, "epoch": 2182} {"train_loss": -9.908474922180176, "global_step": 366580, "epoch": 2182} {"train_loss": -10.422089576721191, "global_step": 366581, "epoch": 2182} {"train_loss": -9.844368934631348, "global_step": 366582, "epoch": 2182} {"train_loss": -10.689640045166016, "global_step": 366583, "epoch": 2182} {"train_loss": -10.393569946289062, "global_step": 366584, "epoch": 2182} {"train_loss": -10.190957069396973, "global_step": 366585, "epoch": 2182} {"train_loss": -10.612103462219238, "global_step": 366586, "epoch": 2182} {"train_loss": -10.520431518554688, "global_step": 366587, "epoch": 2182} {"train_loss": -10.567235946655273, "global_step": 366588, "epoch": 2182} {"train_loss": -10.421566009521484, "global_step": 366589, "epoch": 2182} {"train_loss": -9.761981964111328, "global_step": 366590, "epoch": 2182} {"train_loss": -10.699270248413086, "global_step": 366591, "epoch": 2182} {"train_loss": -10.314830780029297, "global_step": 366592, "epoch": 2182} {"train_loss": -9.054193496704102, "global_step": 366593, "epoch": 2182} {"train_loss": -10.087380409240723, "global_step": 366594, "epoch": 2182} {"train_loss": -10.987500190734863, "global_step": 366595, "epoch": 2182} {"train_loss": -10.821479797363281, "global_step": 366596, "epoch": 2182} {"train_loss": -10.320975303649902, "global_step": 366597, "epoch": 2182} {"train_loss": -10.426008224487305, "global_step": 366598, "epoch": 2182} {"train_loss": -11.296953201293945, "global_step": 366599, "epoch": 2182} {"train_loss": -10.693436622619629, "global_step": 366600, "epoch": 2182} {"train_loss": -10.907443046569824, "global_step": 366601, "epoch": 2182} {"train_loss": -11.637316703796387, "global_step": 366602, "epoch": 2182} {"train_loss": -11.0277099609375, "global_step": 366603, "epoch": 2182} {"train_loss": -11.186437606811523, "global_step": 366604, "epoch": 2182} {"train_loss": -11.109322547912598, "global_step": 366605, "epoch": 2182} {"train_loss": -11.627252578735352, "global_step": 366606, "epoch": 2182} {"train_loss": -11.101308822631836, "global_step": 366607, "epoch": 2182} {"train_loss": -11.518857955932617, "global_step": 366608, "epoch": 2182} {"train_loss": -11.525089263916016, "global_step": 366609, "epoch": 2182} {"train_loss": -11.491847038269043, "global_step": 366610, "epoch": 2182} {"train_loss": -11.065702438354492, "global_step": 366611, "epoch": 2182} {"train_loss": -11.86029052734375, "global_step": 366612, "epoch": 2182} {"train_loss": -11.3549165725708, "global_step": 366613, "epoch": 2182} {"train_loss": -11.403846740722656, "global_step": 366614, "epoch": 2182} {"train_loss": -11.796346664428711, "global_step": 366615, "epoch": 2182} {"train_loss": -11.539934158325195, "global_step": 366616, "epoch": 2182} {"train_loss": -11.827081680297852, "global_step": 366617, "epoch": 2182} {"train_loss": -11.888509750366211, "global_step": 366618, "epoch": 2182} {"train_loss": -12.018499374389648, "global_step": 366619, "epoch": 2182} {"train_loss": -11.680604934692383, "global_step": 366620, "epoch": 2182} {"train_loss": -12.085284233093262, "global_step": 366621, "epoch": 2182} {"train_loss": -11.857946395874023, "global_step": 366622, "epoch": 2182} {"train_loss": -12.182161331176758, "global_step": 366623, "epoch": 2182} {"train_loss": -11.981033325195312, "global_step": 366624, "epoch": 2182} {"train_loss": -12.009881973266602, "global_step": 366625, "epoch": 2182} {"train_loss": -12.181718826293945, "global_step": 366626, "epoch": 2182} {"train_loss": -12.054601669311523, "global_step": 366627, "epoch": 2182} {"train_loss": -11.759916305541992, "global_step": 366628, "epoch": 2182} {"train_loss": -11.905889511108398, "global_step": 366629, "epoch": 2182} {"train_loss": -12.052879333496094, "global_step": 366630, "epoch": 2182} {"train_loss": -12.054458618164062, "global_step": 366631, "epoch": 2182} {"train_loss": -11.7863130569458, "global_step": 366632, "epoch": 2182} {"train_loss": -12.380365371704102, "global_step": 366633, "epoch": 2182} {"train_loss": -12.283218383789062, "global_step": 366634, "epoch": 2182} {"train_loss": -12.301063537597656, "global_step": 366635, "epoch": 2182} {"train_loss": -12.212352752685547, "global_step": 366636, "epoch": 2182} {"train_loss": -12.229951858520508, "global_step": 366637, "epoch": 2182} {"train_loss": -12.12946891784668, "global_step": 366638, "epoch": 2182} {"train_loss": -12.069034576416016, "global_step": 366639, "epoch": 2182} {"train_loss": -12.325307846069336, "global_step": 366640, "epoch": 2182} {"train_loss": -12.49149227142334, "global_step": 366641, "epoch": 2182} {"train_loss": -12.332225799560547, "global_step": 366642, "epoch": 2182} {"train_loss": -12.158668518066406, "global_step": 366643, "epoch": 2182} {"train_loss": -12.200480461120605, "global_step": 366644, "epoch": 2182} {"train_loss": -12.46958065032959, "global_step": 366645, "epoch": 2182} {"train_loss": -12.272512435913086, "global_step": 366646, "epoch": 2182} {"train_loss": -12.42179012298584, "global_step": 366647, "epoch": 2182} {"train_loss": -12.20535945892334, "global_step": 366648, "epoch": 2182} {"train_loss": -12.151893615722656, "global_step": 366649, "epoch": 2182} {"train_loss": -12.515987396240234, "global_step": 366650, "epoch": 2182} {"train_loss": -12.428829193115234, "global_step": 366651, "epoch": 2182} {"train_loss": -12.446661949157715, "global_step": 366652, "epoch": 2182} {"train_loss": -12.53103256225586, "global_step": 366653, "epoch": 2182} {"train_loss": -12.293466567993164, "global_step": 366654, "epoch": 2182} {"train_loss": -12.203547477722168, "global_step": 366655, "epoch": 2182} {"train_loss": -12.367980003356934, "global_step": 366656, "epoch": 2182} {"train_loss": -12.375770568847656, "global_step": 366657, "epoch": 2182} {"train_loss": -12.51335334777832, "global_step": 366658, "epoch": 2182} {"train_loss": -12.439069747924805, "global_step": 366659, "epoch": 2182} {"train_loss": -12.27676773071289, "global_step": 366660, "epoch": 2182} {"train_loss": -12.20435905456543, "global_step": 366661, "epoch": 2182} {"train_loss": -12.574658393859863, "global_step": 366662, "epoch": 2182} {"train_loss": -12.276211738586426, "global_step": 366663, "epoch": 2182} {"train_loss": -12.460670471191406, "global_step": 366664, "epoch": 2182} {"train_loss": -12.492025375366211, "global_step": 366665, "epoch": 2182} {"train_loss": -12.013361930847168, "global_step": 366666, "epoch": 2182} {"train_loss": -11.89621639251709, "global_step": 366667, "epoch": 2182} {"train_loss": -12.140931129455566, "global_step": 366668, "epoch": 2182} {"train_loss": -12.611204147338867, "global_step": 366669, "epoch": 2182} {"train_loss": -12.225114822387695, "global_step": 366670, "epoch": 2182} {"train_loss": -12.266483306884766, "global_step": 366671, "epoch": 2182} {"train_loss": -12.149835586547852, "global_step": 366672, "epoch": 2182} {"train_loss": -12.314474105834961, "global_step": 366673, "epoch": 2182} {"train_loss": -12.024103164672852, "global_step": 366674, "epoch": 2182} {"train_loss": -11.768641471862793, "global_step": 366675, "epoch": 2182} {"train_loss": -12.41408634185791, "global_step": 366676, "epoch": 2182} {"train_loss": -12.488243103027344, "global_step": 366677, "epoch": 2182} {"train_loss": -12.334961891174316, "global_step": 366678, "epoch": 2182} {"train_loss": -11.887313842773438, "global_step": 366679, "epoch": 2182} {"train_loss": -12.156734466552734, "global_step": 366680, "epoch": 2182} {"train_loss": -12.22227954864502, "global_step": 366681, "epoch": 2182} {"train_loss": -11.887161254882812, "global_step": 366682, "epoch": 2182} {"train_loss": -12.581294059753418, "global_step": 366683, "epoch": 2182} {"train_loss": -11.356212615966797, "global_step": 366684, "epoch": 2182} {"train_loss": -12.082304000854492, "global_step": 366685, "epoch": 2182} {"train_loss": -12.103015899658203, "global_step": 366686, "epoch": 2182} {"train_loss": -12.11600112915039, "global_step": 366687, "epoch": 2182} {"train_loss": -11.856310844421387, "global_step": 366688, "epoch": 2182} {"train_loss": -11.122014045715332, "global_step": 366689, "epoch": 2182} {"train_loss": -10.860672950744629, "global_step": 366690, "epoch": 2182} {"train_loss": -11.267805099487305, "global_step": 366691, "epoch": 2182} {"train_loss": -11.73233413696289, "global_step": 366692, "epoch": 2182} {"train_loss": -11.121973037719727, "global_step": 366693, "epoch": 2182} {"train_loss": -10.680952072143555, "global_step": 366694, "epoch": 2182} {"train_loss": -11.94035530090332, "global_step": 366695, "epoch": 2182} {"train_loss": -11.020812034606934, "global_step": 366696, "epoch": 2182} {"train_loss": -11.75222396850586, "global_step": 366697, "epoch": 2182} {"train_loss": -11.718098640441895, "global_step": 366698, "epoch": 2182} {"train_loss": -9.860406875610352, "global_step": 366699, "epoch": 2182} {"train_loss": -10.749357223510742, "global_step": 366700, "epoch": 2182} {"train_loss": -11.730679512023926, "global_step": 366701, "epoch": 2182} {"train_loss": -12.184041976928711, "global_step": 366702, "epoch": 2182} {"train_loss": -10.694869995117188, "global_step": 366703, "epoch": 2182} {"train_loss": -11.175427436828613, "global_step": 366704, "epoch": 2182} {"train_loss": -11.385356903076172, "global_step": 366705, "epoch": 2182} {"train_loss": -11.673971176147461, "global_step": 366706, "epoch": 2182} {"train_loss": -11.105823516845703, "global_step": 366707, "epoch": 2182} {"train_loss": -10.30689811706543, "global_step": 366708, "epoch": 2182} {"train_loss": -11.052770614624023, "global_step": 366709, "epoch": 2182} {"train_loss": -11.292974472045898, "global_step": 366710, "epoch": 2182} {"train_loss": -9.360383987426758, "global_step": 366711, "epoch": 2182} {"train_loss": -11.132226943969727, "global_step": 366712, "epoch": 2182} {"train_loss": -9.91726303100586, "global_step": 366713, "epoch": 2182} {"train_loss": -10.05289363861084, "global_step": 366714, "epoch": 2182} {"train_loss": -8.883142471313477, "global_step": 366715, "epoch": 2182} {"train_loss": -10.713166236877441, "global_step": 366716, "epoch": 2182} {"train_loss": -8.73266315460205, "global_step": 366717, "epoch": 2182} {"train_loss": -10.355663299560547, "global_step": 366718, "epoch": 2182} {"train_loss": -10.351617813110352, "global_step": 366719, "epoch": 2182} {"train_loss": -9.908926963806152, "global_step": 366720, "epoch": 2182} {"train_loss": -10.212748527526855, "global_step": 366721, "epoch": 2182} {"train_loss": -10.938093185424805, "global_step": 366722, "epoch": 2182} {"train_loss": -9.564016342163086, "global_step": 366723, "epoch": 2182} {"train_loss": -10.72589111328125, "global_step": 366724, "epoch": 2182} {"train_loss": -9.915436744689941, "global_step": 366725, "epoch": 2182} {"train_loss": -9.553508758544922, "global_step": 366726, "epoch": 2182} {"train_loss": -9.460990905761719, "global_step": 366727, "epoch": 2182} {"train_loss": -10.716176986694336, "global_step": 366728, "epoch": 2182} {"train_loss": -10.165077209472656, "global_step": 366729, "epoch": 2182} {"train_loss": -9.908187866210938, "global_step": 366730, "epoch": 2182} {"train_loss": -9.648466110229492, "global_step": 366731, "epoch": 2182} {"train_loss": -10.307305335998535, "global_step": 366732, "epoch": 2182} {"train_loss": -11.069124221801758, "global_step": 366733, "epoch": 2182} {"train_loss": -10.684661865234375, "global_step": 366734, "epoch": 2182} {"train_loss": -11.501725196838379, "global_step": 366735, "epoch": 2182} {"train_loss": -10.283218383789062, "global_step": 366736, "epoch": 2182} {"train_loss": -11.366134643554688, "global_step": 366737, "epoch": 2182} {"train_loss": -10.785120010375977, "global_step": 366738, "epoch": 2182} {"train_loss": -10.27649211883545, "global_step": 366739, "epoch": 2182} {"train_loss": -10.989117622375488, "global_step": 366740, "epoch": 2182} {"train_loss": -11.203432083129883, "global_step": 366741, "epoch": 2182} {"train_loss": -11.014009475708008, "global_step": 366742, "epoch": 2182} {"train_loss": -11.332391858100891, "global_step": 366743, "epoch": 2182, "val_loss": 294204.875} {"train_loss": -11.75865364074707, "global_step": 366744, "epoch": 2183} {"train_loss": -10.377163887023926, "global_step": 366745, "epoch": 2183} {"train_loss": -11.397621154785156, "global_step": 366746, "epoch": 2183} {"train_loss": -11.404363632202148, "global_step": 366747, "epoch": 2183} {"train_loss": -11.420561790466309, "global_step": 366748, "epoch": 2183} {"train_loss": -11.103822708129883, "global_step": 366749, "epoch": 2183} {"train_loss": -11.12127685546875, "global_step": 366750, "epoch": 2183} {"train_loss": -11.014969825744629, "global_step": 366751, "epoch": 2183} {"train_loss": -11.233562469482422, "global_step": 366752, "epoch": 2183} {"train_loss": -11.142327308654785, "global_step": 366753, "epoch": 2183} {"train_loss": -11.006586074829102, "global_step": 366754, "epoch": 2183} {"train_loss": -11.624435424804688, "global_step": 366755, "epoch": 2183} {"train_loss": -11.554159164428711, "global_step": 366756, "epoch": 2183} {"train_loss": -11.209733963012695, "global_step": 366757, "epoch": 2183} {"train_loss": -11.528400421142578, "global_step": 366758, "epoch": 2183} {"train_loss": -11.364715576171875, "global_step": 366759, "epoch": 2183} {"train_loss": -11.296783447265625, "global_step": 366760, "epoch": 2183} {"train_loss": -11.362964630126953, "global_step": 366761, "epoch": 2183} {"train_loss": -11.422500610351562, "global_step": 366762, "epoch": 2183} {"train_loss": -11.504846572875977, "global_step": 366763, "epoch": 2183} {"train_loss": -11.84556770324707, "global_step": 366764, "epoch": 2183} {"train_loss": -11.651850700378418, "global_step": 366765, "epoch": 2183} {"train_loss": -11.881421089172363, "global_step": 366766, "epoch": 2183} {"train_loss": -11.648662567138672, "global_step": 366767, "epoch": 2183} {"train_loss": -11.400064468383789, "global_step": 366768, "epoch": 2183} {"train_loss": -11.827797889709473, "global_step": 366769, "epoch": 2183} {"train_loss": -11.727885246276855, "global_step": 366770, "epoch": 2183} {"train_loss": -11.831639289855957, "global_step": 366771, "epoch": 2183} {"train_loss": -11.748355865478516, "global_step": 366772, "epoch": 2183} {"train_loss": -11.83481502532959, "global_step": 366773, "epoch": 2183} {"train_loss": -11.860649108886719, "global_step": 366774, "epoch": 2183} {"train_loss": -11.862937927246094, "global_step": 366775, "epoch": 2183} {"train_loss": -12.254524230957031, "global_step": 366776, "epoch": 2183} {"train_loss": -11.853120803833008, "global_step": 366777, "epoch": 2183} {"train_loss": -11.882390975952148, "global_step": 366778, "epoch": 2183} {"train_loss": -11.730300903320312, "global_step": 366779, "epoch": 2183} {"train_loss": -11.879903793334961, "global_step": 366780, "epoch": 2183} {"train_loss": -11.908476829528809, "global_step": 366781, "epoch": 2183} {"train_loss": -11.848152160644531, "global_step": 366782, "epoch": 2183} {"train_loss": -12.085880279541016, "global_step": 366783, "epoch": 2183} {"train_loss": -10.344474792480469, "global_step": 366784, "epoch": 2183} {"train_loss": -12.152470588684082, "global_step": 366785, "epoch": 2183} {"train_loss": -12.073770523071289, "global_step": 366786, "epoch": 2183} {"train_loss": -12.085294723510742, "global_step": 366787, "epoch": 2183} {"train_loss": -12.086725234985352, "global_step": 366788, "epoch": 2183} {"train_loss": -11.907468795776367, "global_step": 366789, "epoch": 2183} {"train_loss": -12.134429931640625, "global_step": 366790, "epoch": 2183} {"train_loss": -11.98478889465332, "global_step": 366791, "epoch": 2183} {"train_loss": -12.10908317565918, "global_step": 366792, "epoch": 2183} {"train_loss": -11.801471710205078, "global_step": 366793, "epoch": 2183} {"train_loss": -11.827898025512695, "global_step": 366794, "epoch": 2183} {"train_loss": -12.353288650512695, "global_step": 366795, "epoch": 2183} {"train_loss": -11.571672439575195, "global_step": 366796, "epoch": 2183} {"train_loss": -12.19411849975586, "global_step": 366797, "epoch": 2183} {"train_loss": -11.712041854858398, "global_step": 366798, "epoch": 2183} {"train_loss": -12.07183837890625, "global_step": 366799, "epoch": 2183} {"train_loss": -12.028533935546875, "global_step": 366800, "epoch": 2183} {"train_loss": -11.897407531738281, "global_step": 366801, "epoch": 2183} {"train_loss": -12.273876190185547, "global_step": 366802, "epoch": 2183} {"train_loss": -11.83186149597168, "global_step": 366803, "epoch": 2183} {"train_loss": -12.164015769958496, "global_step": 366804, "epoch": 2183} {"train_loss": -11.318500518798828, "global_step": 366805, "epoch": 2183} {"train_loss": -11.886314392089844, "global_step": 366806, "epoch": 2183} {"train_loss": -12.23713493347168, "global_step": 366807, "epoch": 2183} {"train_loss": -11.917987823486328, "global_step": 366808, "epoch": 2183} {"train_loss": -12.175619125366211, "global_step": 366809, "epoch": 2183} {"train_loss": -12.007186889648438, "global_step": 366810, "epoch": 2183} {"train_loss": -12.262277603149414, "global_step": 366811, "epoch": 2183} {"train_loss": -12.122577667236328, "global_step": 366812, "epoch": 2183} {"train_loss": -12.027498245239258, "global_step": 366813, "epoch": 2183} {"train_loss": -11.81792163848877, "global_step": 366814, "epoch": 2183} {"train_loss": -12.184741973876953, "global_step": 366815, "epoch": 2183} {"train_loss": -12.19754409790039, "global_step": 366816, "epoch": 2183} {"train_loss": -12.190139770507812, "global_step": 366817, "epoch": 2183} {"train_loss": -12.304652214050293, "global_step": 366818, "epoch": 2183} {"train_loss": -12.31137466430664, "global_step": 366819, "epoch": 2183} {"train_loss": -12.169397354125977, "global_step": 366820, "epoch": 2183} {"train_loss": -12.289310455322266, "global_step": 366821, "epoch": 2183} {"train_loss": -12.275042533874512, "global_step": 366822, "epoch": 2183} {"train_loss": -12.045869827270508, "global_step": 366823, "epoch": 2183} {"train_loss": -12.311203956604004, "global_step": 366824, "epoch": 2183} {"train_loss": -12.401505470275879, "global_step": 366825, "epoch": 2183} {"train_loss": -12.258973121643066, "global_step": 366826, "epoch": 2183} {"train_loss": -12.073665618896484, "global_step": 366827, "epoch": 2183} {"train_loss": -12.260719299316406, "global_step": 366828, "epoch": 2183} {"train_loss": -12.05245590209961, "global_step": 366829, "epoch": 2183} {"train_loss": -12.31534194946289, "global_step": 366830, "epoch": 2183} {"train_loss": -12.092058181762695, "global_step": 366831, "epoch": 2183} {"train_loss": -12.260814666748047, "global_step": 366832, "epoch": 2183} {"train_loss": -12.13658618927002, "global_step": 366833, "epoch": 2183} {"train_loss": -12.446671485900879, "global_step": 366834, "epoch": 2183} {"train_loss": -12.488473892211914, "global_step": 366835, "epoch": 2183} {"train_loss": -12.099679946899414, "global_step": 366836, "epoch": 2183} {"train_loss": -12.279611587524414, "global_step": 366837, "epoch": 2183} {"train_loss": -12.25920295715332, "global_step": 366838, "epoch": 2183} {"train_loss": -12.387105941772461, "global_step": 366839, "epoch": 2183} {"train_loss": -12.584070205688477, "global_step": 366840, "epoch": 2183} {"train_loss": -12.370816230773926, "global_step": 366841, "epoch": 2183} {"train_loss": -12.480388641357422, "global_step": 366842, "epoch": 2183} {"train_loss": -12.521688461303711, "global_step": 366843, "epoch": 2183} {"train_loss": -12.116912841796875, "global_step": 366844, "epoch": 2183} {"train_loss": -11.96683406829834, "global_step": 366845, "epoch": 2183} {"train_loss": -12.235405921936035, "global_step": 366846, "epoch": 2183} {"train_loss": -11.974285125732422, "global_step": 366847, "epoch": 2183} {"train_loss": -12.423606872558594, "global_step": 366848, "epoch": 2183} {"train_loss": -12.286090850830078, "global_step": 366849, "epoch": 2183} {"train_loss": -12.356660842895508, "global_step": 366850, "epoch": 2183} {"train_loss": -12.066974639892578, "global_step": 366851, "epoch": 2183} {"train_loss": -12.36078929901123, "global_step": 366852, "epoch": 2183} {"train_loss": -11.317145347595215, "global_step": 366853, "epoch": 2183} {"train_loss": -11.02468490600586, "global_step": 366854, "epoch": 2183} {"train_loss": -11.784900665283203, "global_step": 366855, "epoch": 2183} {"train_loss": -12.201925277709961, "global_step": 366856, "epoch": 2183} {"train_loss": -10.561250686645508, "global_step": 366857, "epoch": 2183} {"train_loss": -12.037727355957031, "global_step": 366858, "epoch": 2183} {"train_loss": -11.041219711303711, "global_step": 366859, "epoch": 2183} {"train_loss": -9.82770824432373, "global_step": 366860, "epoch": 2183} {"train_loss": -11.795406341552734, "global_step": 366861, "epoch": 2183} {"train_loss": -11.866035461425781, "global_step": 366862, "epoch": 2183} {"train_loss": -10.277885437011719, "global_step": 366863, "epoch": 2183} {"train_loss": -10.576581954956055, "global_step": 366864, "epoch": 2183} {"train_loss": -11.47270393371582, "global_step": 366865, "epoch": 2183} {"train_loss": -11.886265754699707, "global_step": 366866, "epoch": 2183} {"train_loss": -11.121138572692871, "global_step": 366867, "epoch": 2183} {"train_loss": -11.434988975524902, "global_step": 366868, "epoch": 2183} {"train_loss": -12.092131614685059, "global_step": 366869, "epoch": 2183} {"train_loss": -11.43828296661377, "global_step": 366870, "epoch": 2183} {"train_loss": -11.458078384399414, "global_step": 366871, "epoch": 2183} {"train_loss": -10.897008895874023, "global_step": 366872, "epoch": 2183} {"train_loss": -11.263287544250488, "global_step": 366873, "epoch": 2183} {"train_loss": -11.832744598388672, "global_step": 366874, "epoch": 2183} {"train_loss": -11.64185619354248, "global_step": 366875, "epoch": 2183} {"train_loss": -11.85622787475586, "global_step": 366876, "epoch": 2183} {"train_loss": -11.560736656188965, "global_step": 366877, "epoch": 2183} {"train_loss": -11.686018943786621, "global_step": 366878, "epoch": 2183} {"train_loss": -11.515457153320312, "global_step": 366879, "epoch": 2183} {"train_loss": -11.675453186035156, "global_step": 366880, "epoch": 2183} {"train_loss": -11.744752883911133, "global_step": 366881, "epoch": 2183} {"train_loss": -11.855827331542969, "global_step": 366882, "epoch": 2183} {"train_loss": -12.449562072753906, "global_step": 366883, "epoch": 2183} {"train_loss": -11.90134048461914, "global_step": 366884, "epoch": 2183} {"train_loss": -12.355232238769531, "global_step": 366885, "epoch": 2183} {"train_loss": -12.059354782104492, "global_step": 366886, "epoch": 2183} {"train_loss": -11.950092315673828, "global_step": 366887, "epoch": 2183} {"train_loss": -12.055020332336426, "global_step": 366888, "epoch": 2183} {"train_loss": -12.104864120483398, "global_step": 366889, "epoch": 2183} {"train_loss": -12.385370254516602, "global_step": 366890, "epoch": 2183} {"train_loss": -11.640575408935547, "global_step": 366891, "epoch": 2183} {"train_loss": -12.09010124206543, "global_step": 366892, "epoch": 2183} {"train_loss": -12.02481746673584, "global_step": 366893, "epoch": 2183} {"train_loss": -11.849508285522461, "global_step": 366894, "epoch": 2183} {"train_loss": -12.141267776489258, "global_step": 366895, "epoch": 2183} {"train_loss": -12.05774211883545, "global_step": 366896, "epoch": 2183} {"train_loss": -11.505086898803711, "global_step": 366897, "epoch": 2183} {"train_loss": -12.064910888671875, "global_step": 366898, "epoch": 2183} {"train_loss": -12.055562019348145, "global_step": 366899, "epoch": 2183} {"train_loss": -11.296579360961914, "global_step": 366900, "epoch": 2183} {"train_loss": -11.996891021728516, "global_step": 366901, "epoch": 2183} {"train_loss": -12.255477905273438, "global_step": 366902, "epoch": 2183} {"train_loss": -10.94006061553955, "global_step": 366903, "epoch": 2183} {"train_loss": -11.939966201782227, "global_step": 366904, "epoch": 2183} {"train_loss": -11.130982398986816, "global_step": 366905, "epoch": 2183} {"train_loss": -11.416536331176758, "global_step": 366906, "epoch": 2183} {"train_loss": -11.794614791870117, "global_step": 366907, "epoch": 2183} {"train_loss": -10.568564414978027, "global_step": 366908, "epoch": 2183} {"train_loss": -12.068546295166016, "global_step": 366909, "epoch": 2183} {"train_loss": -11.539411544799805, "global_step": 366910, "epoch": 2183} {"train_loss": -11.812474551654997, "global_step": 366911, "epoch": 2183, "val_loss": 292368.09375} {"train_loss": -11.983149528503418, "global_step": 366912, "epoch": 2184} {"train_loss": -11.598806381225586, "global_step": 366913, "epoch": 2184} {"train_loss": -11.960752487182617, "global_step": 366914, "epoch": 2184} {"train_loss": -11.958152770996094, "global_step": 366915, "epoch": 2184} {"train_loss": -12.077766418457031, "global_step": 366916, "epoch": 2184} {"train_loss": -11.966619491577148, "global_step": 366917, "epoch": 2184} {"train_loss": -12.018817901611328, "global_step": 366918, "epoch": 2184} {"train_loss": -12.2682523727417, "global_step": 366919, "epoch": 2184} {"train_loss": -12.22250747680664, "global_step": 366920, "epoch": 2184} {"train_loss": -12.144619941711426, "global_step": 366921, "epoch": 2184} {"train_loss": -11.069292068481445, "global_step": 366922, "epoch": 2184} {"train_loss": -11.63758659362793, "global_step": 366923, "epoch": 2184} {"train_loss": -11.141865730285645, "global_step": 366924, "epoch": 2184} {"train_loss": -11.897523880004883, "global_step": 366925, "epoch": 2184} {"train_loss": -11.362580299377441, "global_step": 366926, "epoch": 2184} {"train_loss": -11.687324523925781, "global_step": 366927, "epoch": 2184} {"train_loss": -11.719439506530762, "global_step": 366928, "epoch": 2184} {"train_loss": -12.236412048339844, "global_step": 366929, "epoch": 2184} {"train_loss": -11.710756301879883, "global_step": 366930, "epoch": 2184} {"train_loss": -12.113824844360352, "global_step": 366931, "epoch": 2184} {"train_loss": -11.633309364318848, "global_step": 366932, "epoch": 2184} {"train_loss": -11.977804183959961, "global_step": 366933, "epoch": 2184} {"train_loss": -11.981935501098633, "global_step": 366934, "epoch": 2184} {"train_loss": -11.50191879272461, "global_step": 366935, "epoch": 2184} {"train_loss": -11.874335289001465, "global_step": 366936, "epoch": 2184} {"train_loss": -12.107897758483887, "global_step": 366937, "epoch": 2184} {"train_loss": -12.074531555175781, "global_step": 366938, "epoch": 2184} {"train_loss": -12.211246490478516, "global_step": 366939, "epoch": 2184} {"train_loss": -12.121986389160156, "global_step": 366940, "epoch": 2184} {"train_loss": -11.93575668334961, "global_step": 366941, "epoch": 2184} {"train_loss": -11.923828125, "global_step": 366942, "epoch": 2184} {"train_loss": -12.323400497436523, "global_step": 366943, "epoch": 2184} {"train_loss": -12.093683242797852, "global_step": 366944, "epoch": 2184} {"train_loss": -12.213591575622559, "global_step": 366945, "epoch": 2184} {"train_loss": -12.004998207092285, "global_step": 366946, "epoch": 2184} {"train_loss": -12.141702651977539, "global_step": 366947, "epoch": 2184} {"train_loss": -12.20399284362793, "global_step": 366948, "epoch": 2184} {"train_loss": -11.840784072875977, "global_step": 366949, "epoch": 2184} {"train_loss": -12.188553810119629, "global_step": 366950, "epoch": 2184} {"train_loss": -12.218586921691895, "global_step": 366951, "epoch": 2184} {"train_loss": -12.151005744934082, "global_step": 366952, "epoch": 2184} {"train_loss": -12.068523406982422, "global_step": 366953, "epoch": 2184} {"train_loss": -12.158588409423828, "global_step": 366954, "epoch": 2184} {"train_loss": -12.43382453918457, "global_step": 366955, "epoch": 2184} {"train_loss": -12.335112571716309, "global_step": 366956, "epoch": 2184} {"train_loss": -12.226042747497559, "global_step": 366957, "epoch": 2184} {"train_loss": -12.248689651489258, "global_step": 366958, "epoch": 2184} {"train_loss": -12.051393508911133, "global_step": 366959, "epoch": 2184} {"train_loss": -11.886798858642578, "global_step": 366960, "epoch": 2184} {"train_loss": -12.121419906616211, "global_step": 366961, "epoch": 2184} {"train_loss": -11.870043754577637, "global_step": 366962, "epoch": 2184} {"train_loss": -11.922609329223633, "global_step": 366963, "epoch": 2184} {"train_loss": -12.133382797241211, "global_step": 366964, "epoch": 2184} {"train_loss": -12.302579879760742, "global_step": 366965, "epoch": 2184} {"train_loss": -12.280253410339355, "global_step": 366966, "epoch": 2184} {"train_loss": -12.244501113891602, "global_step": 366967, "epoch": 2184} {"train_loss": -12.067367553710938, "global_step": 366968, "epoch": 2184} {"train_loss": -12.163461685180664, "global_step": 366969, "epoch": 2184} {"train_loss": -12.057995796203613, "global_step": 366970, "epoch": 2184} {"train_loss": -11.889667510986328, "global_step": 366971, "epoch": 2184} {"train_loss": -11.291257858276367, "global_step": 366972, "epoch": 2184} {"train_loss": -11.506176948547363, "global_step": 366973, "epoch": 2184} {"train_loss": -11.313472747802734, "global_step": 366974, "epoch": 2184} {"train_loss": -11.91009521484375, "global_step": 366975, "epoch": 2184} {"train_loss": -12.075114250183105, "global_step": 366976, "epoch": 2184} {"train_loss": -11.402316093444824, "global_step": 366977, "epoch": 2184} {"train_loss": -12.270106315612793, "global_step": 366978, "epoch": 2184} {"train_loss": -11.75684642791748, "global_step": 366979, "epoch": 2184} {"train_loss": -11.772695541381836, "global_step": 366980, "epoch": 2184} {"train_loss": -12.540277481079102, "global_step": 366981, "epoch": 2184} {"train_loss": -11.78361701965332, "global_step": 366982, "epoch": 2184} {"train_loss": -12.346061706542969, "global_step": 366983, "epoch": 2184} {"train_loss": -11.768800735473633, "global_step": 366984, "epoch": 2184} {"train_loss": -11.678667068481445, "global_step": 366985, "epoch": 2184} {"train_loss": -12.013840675354004, "global_step": 366986, "epoch": 2184} {"train_loss": -11.958211898803711, "global_step": 366987, "epoch": 2184} {"train_loss": -12.109323501586914, "global_step": 366988, "epoch": 2184} {"train_loss": -11.969209671020508, "global_step": 366989, "epoch": 2184} {"train_loss": -11.99162483215332, "global_step": 366990, "epoch": 2184} {"train_loss": -12.03834056854248, "global_step": 366991, "epoch": 2184} {"train_loss": -12.191191673278809, "global_step": 366992, "epoch": 2184} {"train_loss": -11.895362854003906, "global_step": 366993, "epoch": 2184} {"train_loss": -12.521879196166992, "global_step": 366994, "epoch": 2184} {"train_loss": -12.218921661376953, "global_step": 366995, "epoch": 2184} {"train_loss": -11.631546974182129, "global_step": 366996, "epoch": 2184} {"train_loss": -11.60917854309082, "global_step": 366997, "epoch": 2184} {"train_loss": -12.218559265136719, "global_step": 366998, "epoch": 2184} {"train_loss": -10.731386184692383, "global_step": 366999, "epoch": 2184} {"train_loss": -12.313583374023438, "global_step": 367000, "epoch": 2184} {"train_loss": -11.927096366882324, "global_step": 367001, "epoch": 2184} {"train_loss": -11.730888366699219, "global_step": 367002, "epoch": 2184} {"train_loss": -12.5817232131958, "global_step": 367003, "epoch": 2184} {"train_loss": -11.678959846496582, "global_step": 367004, "epoch": 2184} {"train_loss": -11.939065933227539, "global_step": 367005, "epoch": 2184} {"train_loss": -12.407974243164062, "global_step": 367006, "epoch": 2184} {"train_loss": -11.50068187713623, "global_step": 367007, "epoch": 2184} {"train_loss": -12.111715316772461, "global_step": 367008, "epoch": 2184} {"train_loss": -12.134937286376953, "global_step": 367009, "epoch": 2184} {"train_loss": -11.85389518737793, "global_step": 367010, "epoch": 2184} {"train_loss": -12.313652038574219, "global_step": 367011, "epoch": 2184} {"train_loss": -11.739418029785156, "global_step": 367012, "epoch": 2184} {"train_loss": -10.938982009887695, "global_step": 367013, "epoch": 2184} {"train_loss": -12.274185180664062, "global_step": 367014, "epoch": 2184} {"train_loss": -11.527460098266602, "global_step": 367015, "epoch": 2184} {"train_loss": -11.342473983764648, "global_step": 367016, "epoch": 2184} {"train_loss": -11.996573448181152, "global_step": 367017, "epoch": 2184} {"train_loss": -10.866106033325195, "global_step": 367018, "epoch": 2184} {"train_loss": -11.65539264678955, "global_step": 367019, "epoch": 2184} {"train_loss": -10.426987648010254, "global_step": 367020, "epoch": 2184} {"train_loss": -11.241840362548828, "global_step": 367021, "epoch": 2184} {"train_loss": -10.477680206298828, "global_step": 367022, "epoch": 2184} {"train_loss": -10.683504104614258, "global_step": 367023, "epoch": 2184} {"train_loss": -11.18485164642334, "global_step": 367024, "epoch": 2184} {"train_loss": -10.501829147338867, "global_step": 367025, "epoch": 2184} {"train_loss": -11.596105575561523, "global_step": 367026, "epoch": 2184} {"train_loss": -10.903800964355469, "global_step": 367027, "epoch": 2184} {"train_loss": -11.314821243286133, "global_step": 367028, "epoch": 2184} {"train_loss": -10.981030464172363, "global_step": 367029, "epoch": 2184} {"train_loss": -11.151939392089844, "global_step": 367030, "epoch": 2184} {"train_loss": -11.674132347106934, "global_step": 367031, "epoch": 2184} {"train_loss": -11.133710861206055, "global_step": 367032, "epoch": 2184} {"train_loss": -12.191499710083008, "global_step": 367033, "epoch": 2184} {"train_loss": -10.911410331726074, "global_step": 367034, "epoch": 2184} {"train_loss": -12.015425682067871, "global_step": 367035, "epoch": 2184} {"train_loss": -11.528985977172852, "global_step": 367036, "epoch": 2184} {"train_loss": -11.803815841674805, "global_step": 367037, "epoch": 2184} {"train_loss": -11.85147476196289, "global_step": 367038, "epoch": 2184} {"train_loss": -11.71750259399414, "global_step": 367039, "epoch": 2184} {"train_loss": -11.849899291992188, "global_step": 367040, "epoch": 2184} {"train_loss": -11.58302116394043, "global_step": 367041, "epoch": 2184} {"train_loss": -11.96882438659668, "global_step": 367042, "epoch": 2184} {"train_loss": -11.993165969848633, "global_step": 367043, "epoch": 2184} {"train_loss": -11.94442367553711, "global_step": 367044, "epoch": 2184} {"train_loss": -11.930062294006348, "global_step": 367045, "epoch": 2184} {"train_loss": -12.169721603393555, "global_step": 367046, "epoch": 2184} {"train_loss": -11.80466365814209, "global_step": 367047, "epoch": 2184} {"train_loss": -11.775409698486328, "global_step": 367048, "epoch": 2184} {"train_loss": -12.053962707519531, "global_step": 367049, "epoch": 2184} {"train_loss": -11.963141441345215, "global_step": 367050, "epoch": 2184} {"train_loss": -12.132115364074707, "global_step": 367051, "epoch": 2184} {"train_loss": -12.112136840820312, "global_step": 367052, "epoch": 2184} {"train_loss": -12.017461776733398, "global_step": 367053, "epoch": 2184} {"train_loss": -12.36938190460205, "global_step": 367054, "epoch": 2184} {"train_loss": -12.122533798217773, "global_step": 367055, "epoch": 2184} {"train_loss": -12.255905151367188, "global_step": 367056, "epoch": 2184} {"train_loss": -11.710460662841797, "global_step": 367057, "epoch": 2184} {"train_loss": -12.382146835327148, "global_step": 367058, "epoch": 2184} {"train_loss": -12.03266716003418, "global_step": 367059, "epoch": 2184} {"train_loss": -12.27766227722168, "global_step": 367060, "epoch": 2184} {"train_loss": -12.3141450881958, "global_step": 367061, "epoch": 2184} {"train_loss": -12.182881355285645, "global_step": 367062, "epoch": 2184} {"train_loss": -12.27634048461914, "global_step": 367063, "epoch": 2184} {"train_loss": -11.927026748657227, "global_step": 367064, "epoch": 2184} {"train_loss": -12.365324020385742, "global_step": 367065, "epoch": 2184} {"train_loss": -12.33000373840332, "global_step": 367066, "epoch": 2184} {"train_loss": -12.264937400817871, "global_step": 367067, "epoch": 2184} {"train_loss": -12.296646118164062, "global_step": 367068, "epoch": 2184} {"train_loss": -12.090866088867188, "global_step": 367069, "epoch": 2184} {"train_loss": -12.203868865966797, "global_step": 367070, "epoch": 2184} {"train_loss": -12.28347110748291, "global_step": 367071, "epoch": 2184} {"train_loss": -11.492180824279785, "global_step": 367072, "epoch": 2184} {"train_loss": -12.02731990814209, "global_step": 367073, "epoch": 2184} {"train_loss": -11.624335289001465, "global_step": 367074, "epoch": 2184} {"train_loss": -12.479669570922852, "global_step": 367075, "epoch": 2184} {"train_loss": -11.861251831054688, "global_step": 367076, "epoch": 2184} {"train_loss": -11.869283676147461, "global_step": 367077, "epoch": 2184} {"train_loss": -12.269407272338867, "global_step": 367078, "epoch": 2184} {"train_loss": -11.889517562729973, "global_step": 367079, "epoch": 2184, "val_loss": 292948.0} {"train_loss": -12.040958404541016, "global_step": 367080, "epoch": 2185} {"train_loss": -12.34947395324707, "global_step": 367081, "epoch": 2185} {"train_loss": -12.05186653137207, "global_step": 367082, "epoch": 2185} {"train_loss": -12.530982971191406, "global_step": 367083, "epoch": 2185} {"train_loss": -12.323177337646484, "global_step": 367084, "epoch": 2185} {"train_loss": -12.500478744506836, "global_step": 367085, "epoch": 2185} {"train_loss": -12.241678237915039, "global_step": 367086, "epoch": 2185} {"train_loss": -12.282793045043945, "global_step": 367087, "epoch": 2185} {"train_loss": -12.226438522338867, "global_step": 367088, "epoch": 2185} {"train_loss": -12.280599594116211, "global_step": 367089, "epoch": 2185} {"train_loss": -12.683363914489746, "global_step": 367090, "epoch": 2185} {"train_loss": -11.955580711364746, "global_step": 367091, "epoch": 2185} {"train_loss": -12.558324813842773, "global_step": 367092, "epoch": 2185} {"train_loss": -12.372385025024414, "global_step": 367093, "epoch": 2185} {"train_loss": -12.345718383789062, "global_step": 367094, "epoch": 2185} {"train_loss": -12.363544464111328, "global_step": 367095, "epoch": 2185} {"train_loss": -12.513580322265625, "global_step": 367096, "epoch": 2185} {"train_loss": -12.374082565307617, "global_step": 367097, "epoch": 2185} {"train_loss": -12.32851791381836, "global_step": 367098, "epoch": 2185} {"train_loss": -12.483028411865234, "global_step": 367099, "epoch": 2185} {"train_loss": -12.413187026977539, "global_step": 367100, "epoch": 2185} {"train_loss": -12.273126602172852, "global_step": 367101, "epoch": 2185} {"train_loss": -11.844749450683594, "global_step": 367102, "epoch": 2185} {"train_loss": -12.58934211730957, "global_step": 367103, "epoch": 2185} {"train_loss": -11.770317077636719, "global_step": 367104, "epoch": 2185} {"train_loss": -12.188058853149414, "global_step": 367105, "epoch": 2185} {"train_loss": -12.202817916870117, "global_step": 367106, "epoch": 2185} {"train_loss": -12.062454223632812, "global_step": 367107, "epoch": 2185} {"train_loss": -11.957486152648926, "global_step": 367108, "epoch": 2185} {"train_loss": -12.71734619140625, "global_step": 367109, "epoch": 2185} {"train_loss": -11.817546844482422, "global_step": 367110, "epoch": 2185} {"train_loss": -12.54220199584961, "global_step": 367111, "epoch": 2185} {"train_loss": -11.855331420898438, "global_step": 367112, "epoch": 2185} {"train_loss": -12.235860824584961, "global_step": 367113, "epoch": 2185} {"train_loss": -12.271190643310547, "global_step": 367114, "epoch": 2185} {"train_loss": -11.8894681930542, "global_step": 367115, "epoch": 2185} {"train_loss": -12.544960021972656, "global_step": 367116, "epoch": 2185} {"train_loss": -11.940791130065918, "global_step": 367117, "epoch": 2185} {"train_loss": -12.304323196411133, "global_step": 367118, "epoch": 2185} {"train_loss": -12.380505561828613, "global_step": 367119, "epoch": 2185} {"train_loss": -12.261922836303711, "global_step": 367120, "epoch": 2185} {"train_loss": -12.619111061096191, "global_step": 367121, "epoch": 2185} {"train_loss": -11.888195037841797, "global_step": 367122, "epoch": 2185} {"train_loss": -12.560038566589355, "global_step": 367123, "epoch": 2185} {"train_loss": -12.444439888000488, "global_step": 367124, "epoch": 2185} {"train_loss": -12.100141525268555, "global_step": 367125, "epoch": 2185} {"train_loss": -11.571285247802734, "global_step": 367126, "epoch": 2185} {"train_loss": -12.337579727172852, "global_step": 367127, "epoch": 2185} {"train_loss": -11.601579666137695, "global_step": 367128, "epoch": 2185} {"train_loss": -11.85981273651123, "global_step": 367129, "epoch": 2185} {"train_loss": -12.107026100158691, "global_step": 367130, "epoch": 2185} {"train_loss": -11.673460006713867, "global_step": 367131, "epoch": 2185} {"train_loss": -11.785439491271973, "global_step": 367132, "epoch": 2185} {"train_loss": -11.727558135986328, "global_step": 367133, "epoch": 2185} {"train_loss": -11.26804256439209, "global_step": 367134, "epoch": 2185} {"train_loss": -11.833669662475586, "global_step": 367135, "epoch": 2185} {"train_loss": -11.625268936157227, "global_step": 367136, "epoch": 2185} {"train_loss": -11.906232833862305, "global_step": 367137, "epoch": 2185} {"train_loss": -11.107841491699219, "global_step": 367138, "epoch": 2185} {"train_loss": -12.156635284423828, "global_step": 367139, "epoch": 2185} {"train_loss": -11.241109848022461, "global_step": 367140, "epoch": 2185} {"train_loss": -11.619081497192383, "global_step": 367141, "epoch": 2185} {"train_loss": -11.895902633666992, "global_step": 367142, "epoch": 2185} {"train_loss": -12.323026657104492, "global_step": 367143, "epoch": 2185} {"train_loss": -11.313882827758789, "global_step": 367144, "epoch": 2185} {"train_loss": -11.459423065185547, "global_step": 367145, "epoch": 2185} {"train_loss": -11.483606338500977, "global_step": 367146, "epoch": 2185} {"train_loss": -10.7384033203125, "global_step": 367147, "epoch": 2185} {"train_loss": -11.227775573730469, "global_step": 367148, "epoch": 2185} {"train_loss": -11.868707656860352, "global_step": 367149, "epoch": 2185} {"train_loss": -11.326157569885254, "global_step": 367150, "epoch": 2185} {"train_loss": -11.416272163391113, "global_step": 367151, "epoch": 2185} {"train_loss": -11.447751998901367, "global_step": 367152, "epoch": 2185} {"train_loss": -11.852582931518555, "global_step": 367153, "epoch": 2185} {"train_loss": -11.733749389648438, "global_step": 367154, "epoch": 2185} {"train_loss": -11.446396827697754, "global_step": 367155, "epoch": 2185} {"train_loss": -11.844911575317383, "global_step": 367156, "epoch": 2185} {"train_loss": -12.159549713134766, "global_step": 367157, "epoch": 2185} {"train_loss": -11.363682746887207, "global_step": 367158, "epoch": 2185} {"train_loss": -11.568090438842773, "global_step": 367159, "epoch": 2185} {"train_loss": -12.11250114440918, "global_step": 367160, "epoch": 2185} {"train_loss": -11.791391372680664, "global_step": 367161, "epoch": 2185} {"train_loss": -11.802321434020996, "global_step": 367162, "epoch": 2185} {"train_loss": -11.956850051879883, "global_step": 367163, "epoch": 2185} {"train_loss": -11.241662979125977, "global_step": 367164, "epoch": 2185} {"train_loss": -11.009344100952148, "global_step": 367165, "epoch": 2185} {"train_loss": -11.678678512573242, "global_step": 367166, "epoch": 2185} {"train_loss": -11.008171081542969, "global_step": 367167, "epoch": 2185} {"train_loss": -11.38503646850586, "global_step": 367168, "epoch": 2185} {"train_loss": -11.893239974975586, "global_step": 367169, "epoch": 2185} {"train_loss": -10.76443862915039, "global_step": 367170, "epoch": 2185} {"train_loss": -11.183252334594727, "global_step": 367171, "epoch": 2185} {"train_loss": -10.948488235473633, "global_step": 367172, "epoch": 2185} {"train_loss": -10.316476821899414, "global_step": 367173, "epoch": 2185} {"train_loss": -11.532539367675781, "global_step": 367174, "epoch": 2185} {"train_loss": -10.738767623901367, "global_step": 367175, "epoch": 2185} {"train_loss": -11.762325286865234, "global_step": 367176, "epoch": 2185} {"train_loss": -11.379667282104492, "global_step": 367177, "epoch": 2185} {"train_loss": -11.600103378295898, "global_step": 367178, "epoch": 2185} {"train_loss": -11.792794227600098, "global_step": 367179, "epoch": 2185} {"train_loss": -11.501461029052734, "global_step": 367180, "epoch": 2185} {"train_loss": -11.51054859161377, "global_step": 367181, "epoch": 2185} {"train_loss": -11.64124870300293, "global_step": 367182, "epoch": 2185} {"train_loss": -11.277297019958496, "global_step": 367183, "epoch": 2185} {"train_loss": -11.76953125, "global_step": 367184, "epoch": 2185} {"train_loss": -11.694944381713867, "global_step": 367185, "epoch": 2185} {"train_loss": -11.860417366027832, "global_step": 367186, "epoch": 2185} {"train_loss": -11.641143798828125, "global_step": 367187, "epoch": 2185} {"train_loss": -11.765153884887695, "global_step": 367188, "epoch": 2185} {"train_loss": -11.928813934326172, "global_step": 367189, "epoch": 2185} {"train_loss": -12.085403442382812, "global_step": 367190, "epoch": 2185} {"train_loss": -12.191216468811035, "global_step": 367191, "epoch": 2185} {"train_loss": -12.013232231140137, "global_step": 367192, "epoch": 2185} {"train_loss": -11.839588165283203, "global_step": 367193, "epoch": 2185} {"train_loss": -12.078737258911133, "global_step": 367194, "epoch": 2185} {"train_loss": -12.0432767868042, "global_step": 367195, "epoch": 2185} {"train_loss": -12.13984203338623, "global_step": 367196, "epoch": 2185} {"train_loss": -12.184436798095703, "global_step": 367197, "epoch": 2185} {"train_loss": -11.984114646911621, "global_step": 367198, "epoch": 2185} {"train_loss": -12.044387817382812, "global_step": 367199, "epoch": 2185} {"train_loss": -12.058357238769531, "global_step": 367200, "epoch": 2185} {"train_loss": -12.220748901367188, "global_step": 367201, "epoch": 2185} {"train_loss": -12.247274398803711, "global_step": 367202, "epoch": 2185} {"train_loss": -12.218293190002441, "global_step": 367203, "epoch": 2185} {"train_loss": -12.243690490722656, "global_step": 367204, "epoch": 2185} {"train_loss": -12.167501449584961, "global_step": 367205, "epoch": 2185} {"train_loss": -12.204279899597168, "global_step": 367206, "epoch": 2185} {"train_loss": -12.240348815917969, "global_step": 367207, "epoch": 2185} {"train_loss": -12.08514404296875, "global_step": 367208, "epoch": 2185} {"train_loss": -12.0267972946167, "global_step": 367209, "epoch": 2185} {"train_loss": -12.183956146240234, "global_step": 367210, "epoch": 2185} {"train_loss": -12.165885925292969, "global_step": 367211, "epoch": 2185} {"train_loss": -12.343366622924805, "global_step": 367212, "epoch": 2185} {"train_loss": -12.13210678100586, "global_step": 367213, "epoch": 2185} {"train_loss": -12.278103828430176, "global_step": 367214, "epoch": 2185} {"train_loss": -12.458477973937988, "global_step": 367215, "epoch": 2185} {"train_loss": -12.482855796813965, "global_step": 367216, "epoch": 2185} {"train_loss": -12.200078964233398, "global_step": 367217, "epoch": 2185} {"train_loss": -12.56474494934082, "global_step": 367218, "epoch": 2185} {"train_loss": -12.368207931518555, "global_step": 367219, "epoch": 2185} {"train_loss": -12.445070266723633, "global_step": 367220, "epoch": 2185} {"train_loss": -12.284420013427734, "global_step": 367221, "epoch": 2185} {"train_loss": -12.209108352661133, "global_step": 367222, "epoch": 2185} {"train_loss": -12.404544830322266, "global_step": 367223, "epoch": 2185} {"train_loss": -12.027061462402344, "global_step": 367224, "epoch": 2185} {"train_loss": -12.46420669555664, "global_step": 367225, "epoch": 2185} {"train_loss": -12.214029312133789, "global_step": 367226, "epoch": 2185} {"train_loss": -12.500268936157227, "global_step": 367227, "epoch": 2185} {"train_loss": -12.304547309875488, "global_step": 367228, "epoch": 2185} {"train_loss": -12.454652786254883, "global_step": 367229, "epoch": 2185} {"train_loss": -12.485801696777344, "global_step": 367230, "epoch": 2185} {"train_loss": -12.453747749328613, "global_step": 367231, "epoch": 2185} {"train_loss": -12.082460403442383, "global_step": 367232, "epoch": 2185} {"train_loss": -12.071306228637695, "global_step": 367233, "epoch": 2185} {"train_loss": -12.189960479736328, "global_step": 367234, "epoch": 2185} {"train_loss": -11.648653030395508, "global_step": 367235, "epoch": 2185} {"train_loss": -12.27932071685791, "global_step": 367236, "epoch": 2185} {"train_loss": -12.251590728759766, "global_step": 367237, "epoch": 2185} {"train_loss": -12.018198013305664, "global_step": 367238, "epoch": 2185} {"train_loss": -12.385963439941406, "global_step": 367239, "epoch": 2185} {"train_loss": -12.333077430725098, "global_step": 367240, "epoch": 2185} {"train_loss": -12.282172203063965, "global_step": 367241, "epoch": 2185} {"train_loss": -12.585674285888672, "global_step": 367242, "epoch": 2185} {"train_loss": -12.1981782913208, "global_step": 367243, "epoch": 2185} {"train_loss": -12.395929336547852, "global_step": 367244, "epoch": 2185} {"train_loss": -12.27391529083252, "global_step": 367245, "epoch": 2185} {"train_loss": -12.651641845703125, "global_step": 367246, "epoch": 2185} {"train_loss": -11.989294415428525, "global_step": 367247, "epoch": 2185, "val_loss": 295335.40625, "train_action_mse_error": 2.8574938774108887} {"train_loss": -12.219072341918945, "global_step": 367248, "epoch": 2186} {"train_loss": -12.283382415771484, "global_step": 367249, "epoch": 2186} {"train_loss": -12.335373878479004, "global_step": 367250, "epoch": 2186} {"train_loss": -12.200200080871582, "global_step": 367251, "epoch": 2186} {"train_loss": -11.99660873413086, "global_step": 367252, "epoch": 2186} {"train_loss": -11.725686073303223, "global_step": 367253, "epoch": 2186} {"train_loss": -12.447763442993164, "global_step": 367254, "epoch": 2186} {"train_loss": -11.71635627746582, "global_step": 367255, "epoch": 2186} {"train_loss": -12.24725341796875, "global_step": 367256, "epoch": 2186} {"train_loss": -12.004220962524414, "global_step": 367257, "epoch": 2186} {"train_loss": -12.191943168640137, "global_step": 367258, "epoch": 2186} {"train_loss": -12.230088233947754, "global_step": 367259, "epoch": 2186} {"train_loss": -12.507038116455078, "global_step": 367260, "epoch": 2186} {"train_loss": -12.30433464050293, "global_step": 367261, "epoch": 2186} {"train_loss": -12.297908782958984, "global_step": 367262, "epoch": 2186} {"train_loss": -11.836438179016113, "global_step": 367263, "epoch": 2186} {"train_loss": -12.245054244995117, "global_step": 367264, "epoch": 2186} {"train_loss": -12.480295181274414, "global_step": 367265, "epoch": 2186} {"train_loss": -12.025552749633789, "global_step": 367266, "epoch": 2186} {"train_loss": -12.406136512756348, "global_step": 367267, "epoch": 2186} {"train_loss": -12.381498336791992, "global_step": 367268, "epoch": 2186} {"train_loss": -12.399478912353516, "global_step": 367269, "epoch": 2186} {"train_loss": -12.44922161102295, "global_step": 367270, "epoch": 2186} {"train_loss": -12.438106536865234, "global_step": 367271, "epoch": 2186} {"train_loss": -12.099098205566406, "global_step": 367272, "epoch": 2186} {"train_loss": -12.465794563293457, "global_step": 367273, "epoch": 2186} {"train_loss": -12.22166633605957, "global_step": 367274, "epoch": 2186} {"train_loss": -12.300621032714844, "global_step": 367275, "epoch": 2186} {"train_loss": -12.107244491577148, "global_step": 367276, "epoch": 2186} {"train_loss": -12.273736953735352, "global_step": 367277, "epoch": 2186} {"train_loss": -12.139949798583984, "global_step": 367278, "epoch": 2186} {"train_loss": -12.26795482635498, "global_step": 367279, "epoch": 2186} {"train_loss": -12.139334678649902, "global_step": 367280, "epoch": 2186} {"train_loss": -12.052423477172852, "global_step": 367281, "epoch": 2186} {"train_loss": -11.997884750366211, "global_step": 367282, "epoch": 2186} {"train_loss": -12.653633117675781, "global_step": 367283, "epoch": 2186} {"train_loss": -12.198206901550293, "global_step": 367284, "epoch": 2186} {"train_loss": -11.854706764221191, "global_step": 367285, "epoch": 2186} {"train_loss": -11.151350021362305, "global_step": 367286, "epoch": 2186} {"train_loss": -12.616121292114258, "global_step": 367287, "epoch": 2186} {"train_loss": -10.574901580810547, "global_step": 367288, "epoch": 2186} {"train_loss": -11.898332595825195, "global_step": 367289, "epoch": 2186} {"train_loss": -10.90027141571045, "global_step": 367290, "epoch": 2186} {"train_loss": -12.147261619567871, "global_step": 367291, "epoch": 2186} {"train_loss": -10.948148727416992, "global_step": 367292, "epoch": 2186} {"train_loss": -12.27161979675293, "global_step": 367293, "epoch": 2186} {"train_loss": -11.33764934539795, "global_step": 367294, "epoch": 2186} {"train_loss": -11.827113151550293, "global_step": 367295, "epoch": 2186} {"train_loss": -11.842708587646484, "global_step": 367296, "epoch": 2186} {"train_loss": -11.329622268676758, "global_step": 367297, "epoch": 2186} {"train_loss": -11.457934379577637, "global_step": 367298, "epoch": 2186} {"train_loss": -12.056379318237305, "global_step": 367299, "epoch": 2186} {"train_loss": -11.69328784942627, "global_step": 367300, "epoch": 2186} {"train_loss": -12.273720741271973, "global_step": 367301, "epoch": 2186} {"train_loss": -11.674814224243164, "global_step": 367302, "epoch": 2186} {"train_loss": -12.099204063415527, "global_step": 367303, "epoch": 2186} {"train_loss": -11.699434280395508, "global_step": 367304, "epoch": 2186} {"train_loss": -11.781364440917969, "global_step": 367305, "epoch": 2186} {"train_loss": -11.763065338134766, "global_step": 367306, "epoch": 2186} {"train_loss": -12.13377857208252, "global_step": 367307, "epoch": 2186} {"train_loss": -11.777925491333008, "global_step": 367308, "epoch": 2186} {"train_loss": -12.13055419921875, "global_step": 367309, "epoch": 2186} {"train_loss": -11.932374954223633, "global_step": 367310, "epoch": 2186} {"train_loss": -11.860770225524902, "global_step": 367311, "epoch": 2186} {"train_loss": -12.118307113647461, "global_step": 367312, "epoch": 2186} {"train_loss": -11.6177339553833, "global_step": 367313, "epoch": 2186} {"train_loss": -11.533537864685059, "global_step": 367314, "epoch": 2186} {"train_loss": -11.726542472839355, "global_step": 367315, "epoch": 2186} {"train_loss": -11.807355880737305, "global_step": 367316, "epoch": 2186} {"train_loss": -11.886677742004395, "global_step": 367317, "epoch": 2186} {"train_loss": -11.801620483398438, "global_step": 367318, "epoch": 2186} {"train_loss": -11.904027938842773, "global_step": 367319, "epoch": 2186} {"train_loss": -11.485876083374023, "global_step": 367320, "epoch": 2186} {"train_loss": -10.78396987915039, "global_step": 367321, "epoch": 2186} {"train_loss": -12.232261657714844, "global_step": 367322, "epoch": 2186} {"train_loss": -11.6585693359375, "global_step": 367323, "epoch": 2186} {"train_loss": -12.011014938354492, "global_step": 367324, "epoch": 2186} {"train_loss": -12.254654884338379, "global_step": 367325, "epoch": 2186} {"train_loss": -12.058155059814453, "global_step": 367326, "epoch": 2186} {"train_loss": -12.153409957885742, "global_step": 367327, "epoch": 2186} {"train_loss": -11.815826416015625, "global_step": 367328, "epoch": 2186} {"train_loss": -12.202384948730469, "global_step": 367329, "epoch": 2186} {"train_loss": -12.061881065368652, "global_step": 367330, "epoch": 2186} {"train_loss": -11.918798446655273, "global_step": 367331, "epoch": 2186} {"train_loss": -12.41634750366211, "global_step": 367332, "epoch": 2186} {"train_loss": -12.07404899597168, "global_step": 367333, "epoch": 2186} {"train_loss": -12.229532241821289, "global_step": 367334, "epoch": 2186} {"train_loss": -12.504829406738281, "global_step": 367335, "epoch": 2186} {"train_loss": -11.766252517700195, "global_step": 367336, "epoch": 2186} {"train_loss": -12.268335342407227, "global_step": 367337, "epoch": 2186} {"train_loss": -12.053668975830078, "global_step": 367338, "epoch": 2186} {"train_loss": -12.397762298583984, "global_step": 367339, "epoch": 2186} {"train_loss": -12.096325874328613, "global_step": 367340, "epoch": 2186} {"train_loss": -11.734832763671875, "global_step": 367341, "epoch": 2186} {"train_loss": -12.125967979431152, "global_step": 367342, "epoch": 2186} {"train_loss": -12.166473388671875, "global_step": 367343, "epoch": 2186} {"train_loss": -12.232280731201172, "global_step": 367344, "epoch": 2186} {"train_loss": -12.16843318939209, "global_step": 367345, "epoch": 2186} {"train_loss": -11.797075271606445, "global_step": 367346, "epoch": 2186} {"train_loss": -12.069018363952637, "global_step": 367347, "epoch": 2186} {"train_loss": -12.384366989135742, "global_step": 367348, "epoch": 2186} {"train_loss": -12.077768325805664, "global_step": 367349, "epoch": 2186} {"train_loss": -11.959726333618164, "global_step": 367350, "epoch": 2186} {"train_loss": -11.722559928894043, "global_step": 367351, "epoch": 2186} {"train_loss": -12.190925598144531, "global_step": 367352, "epoch": 2186} {"train_loss": -11.550312042236328, "global_step": 367353, "epoch": 2186} {"train_loss": -12.183090209960938, "global_step": 367354, "epoch": 2186} {"train_loss": -12.34745979309082, "global_step": 367355, "epoch": 2186} {"train_loss": -11.897294998168945, "global_step": 367356, "epoch": 2186} {"train_loss": -12.063279151916504, "global_step": 367357, "epoch": 2186} {"train_loss": -12.4399995803833, "global_step": 367358, "epoch": 2186} {"train_loss": -12.347360610961914, "global_step": 367359, "epoch": 2186} {"train_loss": -11.974963188171387, "global_step": 367360, "epoch": 2186} {"train_loss": -12.454507827758789, "global_step": 367361, "epoch": 2186} {"train_loss": -12.130301475524902, "global_step": 367362, "epoch": 2186} {"train_loss": -12.129682540893555, "global_step": 367363, "epoch": 2186} {"train_loss": -12.048425674438477, "global_step": 367364, "epoch": 2186} {"train_loss": -12.443130493164062, "global_step": 367365, "epoch": 2186} {"train_loss": -12.155497550964355, "global_step": 367366, "epoch": 2186} {"train_loss": -12.393667221069336, "global_step": 367367, "epoch": 2186} {"train_loss": -12.294998168945312, "global_step": 367368, "epoch": 2186} {"train_loss": -11.989386558532715, "global_step": 367369, "epoch": 2186} {"train_loss": -11.828319549560547, "global_step": 367370, "epoch": 2186} {"train_loss": -12.621353149414062, "global_step": 367371, "epoch": 2186} {"train_loss": -11.846813201904297, "global_step": 367372, "epoch": 2186} {"train_loss": -11.23167610168457, "global_step": 367373, "epoch": 2186} {"train_loss": -12.006715774536133, "global_step": 367374, "epoch": 2186} {"train_loss": -12.282365798950195, "global_step": 367375, "epoch": 2186} {"train_loss": -11.694238662719727, "global_step": 367376, "epoch": 2186} {"train_loss": -12.468753814697266, "global_step": 367377, "epoch": 2186} {"train_loss": -12.03492546081543, "global_step": 367378, "epoch": 2186} {"train_loss": -11.887035369873047, "global_step": 367379, "epoch": 2186} {"train_loss": -12.24152660369873, "global_step": 367380, "epoch": 2186} {"train_loss": -12.151985168457031, "global_step": 367381, "epoch": 2186} {"train_loss": -11.195276260375977, "global_step": 367382, "epoch": 2186} {"train_loss": -12.460901260375977, "global_step": 367383, "epoch": 2186} {"train_loss": -11.798213958740234, "global_step": 367384, "epoch": 2186} {"train_loss": -11.21718978881836, "global_step": 367385, "epoch": 2186} {"train_loss": -11.860479354858398, "global_step": 367386, "epoch": 2186} {"train_loss": -10.933525085449219, "global_step": 367387, "epoch": 2186} {"train_loss": -11.065937042236328, "global_step": 367388, "epoch": 2186} {"train_loss": -11.126947402954102, "global_step": 367389, "epoch": 2186} {"train_loss": -10.690786361694336, "global_step": 367390, "epoch": 2186} {"train_loss": -10.285808563232422, "global_step": 367391, "epoch": 2186} {"train_loss": -11.082876205444336, "global_step": 367392, "epoch": 2186} {"train_loss": -9.829710960388184, "global_step": 367393, "epoch": 2186} {"train_loss": -11.898829460144043, "global_step": 367394, "epoch": 2186} {"train_loss": -9.397834777832031, "global_step": 367395, "epoch": 2186} {"train_loss": -11.291067123413086, "global_step": 367396, "epoch": 2186} {"train_loss": -10.117987632751465, "global_step": 367397, "epoch": 2186} {"train_loss": -10.913320541381836, "global_step": 367398, "epoch": 2186} {"train_loss": -9.999595642089844, "global_step": 367399, "epoch": 2186} {"train_loss": -10.148887634277344, "global_step": 367400, "epoch": 2186} {"train_loss": -11.358742713928223, "global_step": 367401, "epoch": 2186} {"train_loss": -10.798007011413574, "global_step": 367402, "epoch": 2186} {"train_loss": -10.696172714233398, "global_step": 367403, "epoch": 2186} {"train_loss": -11.030672073364258, "global_step": 367404, "epoch": 2186} {"train_loss": -11.62430191040039, "global_step": 367405, "epoch": 2186} {"train_loss": -11.189947128295898, "global_step": 367406, "epoch": 2186} {"train_loss": -11.430421829223633, "global_step": 367407, "epoch": 2186} {"train_loss": -12.213067054748535, "global_step": 367408, "epoch": 2186} {"train_loss": -11.0379638671875, "global_step": 367409, "epoch": 2186} {"train_loss": -11.740299224853516, "global_step": 367410, "epoch": 2186} {"train_loss": -11.069501876831055, "global_step": 367411, "epoch": 2186} {"train_loss": -11.425107955932617, "global_step": 367412, "epoch": 2186} {"train_loss": -11.250533103942871, "global_step": 367413, "epoch": 2186} {"train_loss": -11.941160202026367, "global_step": 367414, "epoch": 2186} {"train_loss": -11.840070111410958, "global_step": 367415, "epoch": 2186, "val_loss": 291194.28125} {"train_loss": -11.498319625854492, "global_step": 367416, "epoch": 2187} {"train_loss": -12.065467834472656, "global_step": 367417, "epoch": 2187} {"train_loss": -11.541417121887207, "global_step": 367418, "epoch": 2187} {"train_loss": -11.790628433227539, "global_step": 367419, "epoch": 2187} {"train_loss": -11.45598030090332, "global_step": 367420, "epoch": 2187} {"train_loss": -11.84710693359375, "global_step": 367421, "epoch": 2187} {"train_loss": -11.998594284057617, "global_step": 367422, "epoch": 2187} {"train_loss": -11.56390380859375, "global_step": 367423, "epoch": 2187} {"train_loss": -12.149301528930664, "global_step": 367424, "epoch": 2187} {"train_loss": -12.00750732421875, "global_step": 367425, "epoch": 2187} {"train_loss": -12.047548294067383, "global_step": 367426, "epoch": 2187} {"train_loss": -11.76368522644043, "global_step": 367427, "epoch": 2187} {"train_loss": -11.984314918518066, "global_step": 367428, "epoch": 2187} {"train_loss": -11.987237930297852, "global_step": 367429, "epoch": 2187} {"train_loss": -11.78117847442627, "global_step": 367430, "epoch": 2187} {"train_loss": -11.88123893737793, "global_step": 367431, "epoch": 2187} {"train_loss": -12.180295944213867, "global_step": 367432, "epoch": 2187} {"train_loss": -11.687259674072266, "global_step": 367433, "epoch": 2187} {"train_loss": -12.061519622802734, "global_step": 367434, "epoch": 2187} {"train_loss": -11.975980758666992, "global_step": 367435, "epoch": 2187} {"train_loss": -11.852838516235352, "global_step": 367436, "epoch": 2187} {"train_loss": -12.39422607421875, "global_step": 367437, "epoch": 2187} {"train_loss": -11.918479919433594, "global_step": 367438, "epoch": 2187} {"train_loss": -11.949580192565918, "global_step": 367439, "epoch": 2187} {"train_loss": -11.990524291992188, "global_step": 367440, "epoch": 2187} {"train_loss": -11.884794235229492, "global_step": 367441, "epoch": 2187} {"train_loss": -12.30782699584961, "global_step": 367442, "epoch": 2187} {"train_loss": -11.896904945373535, "global_step": 367443, "epoch": 2187} {"train_loss": -12.27001953125, "global_step": 367444, "epoch": 2187} {"train_loss": -11.948841094970703, "global_step": 367445, "epoch": 2187} {"train_loss": -12.195019721984863, "global_step": 367446, "epoch": 2187} {"train_loss": -12.30822467803955, "global_step": 367447, "epoch": 2187} {"train_loss": -12.434017181396484, "global_step": 367448, "epoch": 2187} {"train_loss": -12.399396896362305, "global_step": 367449, "epoch": 2187} {"train_loss": -12.10930061340332, "global_step": 367450, "epoch": 2187} {"train_loss": -12.233182907104492, "global_step": 367451, "epoch": 2187} {"train_loss": -12.417991638183594, "global_step": 367452, "epoch": 2187} {"train_loss": -12.289799690246582, "global_step": 367453, "epoch": 2187} {"train_loss": -12.369670867919922, "global_step": 367454, "epoch": 2187} {"train_loss": -12.626684188842773, "global_step": 367455, "epoch": 2187} {"train_loss": -12.40572738647461, "global_step": 367456, "epoch": 2187} {"train_loss": -12.17747688293457, "global_step": 367457, "epoch": 2187} {"train_loss": -12.46473217010498, "global_step": 367458, "epoch": 2187} {"train_loss": -12.302206039428711, "global_step": 367459, "epoch": 2187} {"train_loss": -12.537152290344238, "global_step": 367460, "epoch": 2187} {"train_loss": -12.338594436645508, "global_step": 367461, "epoch": 2187} {"train_loss": -12.546991348266602, "global_step": 367462, "epoch": 2187} {"train_loss": -12.434444427490234, "global_step": 367463, "epoch": 2187} {"train_loss": -12.23225212097168, "global_step": 367464, "epoch": 2187} {"train_loss": -12.230021476745605, "global_step": 367465, "epoch": 2187} {"train_loss": -12.37519359588623, "global_step": 367466, "epoch": 2187} {"train_loss": -12.520955085754395, "global_step": 367467, "epoch": 2187} {"train_loss": -12.411626815795898, "global_step": 367468, "epoch": 2187} {"train_loss": -12.374101638793945, "global_step": 367469, "epoch": 2187} {"train_loss": -12.273101806640625, "global_step": 367470, "epoch": 2187} {"train_loss": -12.352277755737305, "global_step": 367471, "epoch": 2187} {"train_loss": -12.342124938964844, "global_step": 367472, "epoch": 2187} {"train_loss": -12.335352897644043, "global_step": 367473, "epoch": 2187} {"train_loss": -12.367471694946289, "global_step": 367474, "epoch": 2187} {"train_loss": -12.17306137084961, "global_step": 367475, "epoch": 2187} {"train_loss": -12.559115409851074, "global_step": 367476, "epoch": 2187} {"train_loss": -11.865650177001953, "global_step": 367477, "epoch": 2187} {"train_loss": -12.661211013793945, "global_step": 367478, "epoch": 2187} {"train_loss": -12.241680145263672, "global_step": 367479, "epoch": 2187} {"train_loss": -12.513540267944336, "global_step": 367480, "epoch": 2187} {"train_loss": -12.455432891845703, "global_step": 367481, "epoch": 2187} {"train_loss": -12.463139533996582, "global_step": 367482, "epoch": 2187} {"train_loss": -12.568473815917969, "global_step": 367483, "epoch": 2187} {"train_loss": -12.30984878540039, "global_step": 367484, "epoch": 2187} {"train_loss": -12.438501358032227, "global_step": 367485, "epoch": 2187} {"train_loss": -12.607837677001953, "global_step": 367486, "epoch": 2187} {"train_loss": -12.287412643432617, "global_step": 367487, "epoch": 2187} {"train_loss": -12.315103530883789, "global_step": 367488, "epoch": 2187} {"train_loss": -12.517059326171875, "global_step": 367489, "epoch": 2187} {"train_loss": -12.2620267868042, "global_step": 367490, "epoch": 2187} {"train_loss": -12.424150466918945, "global_step": 367491, "epoch": 2187} {"train_loss": -12.794054985046387, "global_step": 367492, "epoch": 2187} {"train_loss": -12.341928482055664, "global_step": 367493, "epoch": 2187} {"train_loss": -11.996142387390137, "global_step": 367494, "epoch": 2187} {"train_loss": -12.578949928283691, "global_step": 367495, "epoch": 2187} {"train_loss": -12.297920227050781, "global_step": 367496, "epoch": 2187} {"train_loss": -11.981553077697754, "global_step": 367497, "epoch": 2187} {"train_loss": -12.645763397216797, "global_step": 367498, "epoch": 2187} {"train_loss": -11.888693809509277, "global_step": 367499, "epoch": 2187} {"train_loss": -12.37881851196289, "global_step": 367500, "epoch": 2187} {"train_loss": -12.490636825561523, "global_step": 367501, "epoch": 2187} {"train_loss": -12.359990119934082, "global_step": 367502, "epoch": 2187} {"train_loss": -11.68666934967041, "global_step": 367503, "epoch": 2187} {"train_loss": -12.352397918701172, "global_step": 367504, "epoch": 2187} {"train_loss": -11.738361358642578, "global_step": 367505, "epoch": 2187} {"train_loss": -12.41740608215332, "global_step": 367506, "epoch": 2187} {"train_loss": -11.560064315795898, "global_step": 367507, "epoch": 2187} {"train_loss": -12.406793594360352, "global_step": 367508, "epoch": 2187} {"train_loss": -10.589040756225586, "global_step": 367509, "epoch": 2187} {"train_loss": -11.825759887695312, "global_step": 367510, "epoch": 2187} {"train_loss": -11.73047161102295, "global_step": 367511, "epoch": 2187} {"train_loss": -12.044987678527832, "global_step": 367512, "epoch": 2187} {"train_loss": -11.71537971496582, "global_step": 367513, "epoch": 2187} {"train_loss": -11.59620475769043, "global_step": 367514, "epoch": 2187} {"train_loss": -11.073338508605957, "global_step": 367515, "epoch": 2187} {"train_loss": -11.068792343139648, "global_step": 367516, "epoch": 2187} {"train_loss": -10.013542175292969, "global_step": 367517, "epoch": 2187} {"train_loss": -9.162087440490723, "global_step": 367518, "epoch": 2187} {"train_loss": -10.515403747558594, "global_step": 367519, "epoch": 2187} {"train_loss": -11.910791397094727, "global_step": 367520, "epoch": 2187} {"train_loss": -10.126965522766113, "global_step": 367521, "epoch": 2187} {"train_loss": -11.66042423248291, "global_step": 367522, "epoch": 2187} {"train_loss": -11.05922794342041, "global_step": 367523, "epoch": 2187} {"train_loss": -10.441537857055664, "global_step": 367524, "epoch": 2187} {"train_loss": -11.03683090209961, "global_step": 367525, "epoch": 2187} {"train_loss": -11.509309768676758, "global_step": 367526, "epoch": 2187} {"train_loss": -11.293100357055664, "global_step": 367527, "epoch": 2187} {"train_loss": -10.588264465332031, "global_step": 367528, "epoch": 2187} {"train_loss": -9.9848051071167, "global_step": 367529, "epoch": 2187} {"train_loss": -10.768407821655273, "global_step": 367530, "epoch": 2187} {"train_loss": -11.891302108764648, "global_step": 367531, "epoch": 2187} {"train_loss": -10.477468490600586, "global_step": 367532, "epoch": 2187} {"train_loss": -9.616147994995117, "global_step": 367533, "epoch": 2187} {"train_loss": -10.777386665344238, "global_step": 367534, "epoch": 2187} {"train_loss": -9.433406829833984, "global_step": 367535, "epoch": 2187} {"train_loss": -10.180341720581055, "global_step": 367536, "epoch": 2187} {"train_loss": -10.818615913391113, "global_step": 367537, "epoch": 2187} {"train_loss": -10.848010063171387, "global_step": 367538, "epoch": 2187} {"train_loss": -9.744930267333984, "global_step": 367539, "epoch": 2187} {"train_loss": -10.847135543823242, "global_step": 367540, "epoch": 2187} {"train_loss": -10.597671508789062, "global_step": 367541, "epoch": 2187} {"train_loss": -9.960994720458984, "global_step": 367542, "epoch": 2187} {"train_loss": -11.272136688232422, "global_step": 367543, "epoch": 2187} {"train_loss": -10.731904983520508, "global_step": 367544, "epoch": 2187} {"train_loss": -9.33232307434082, "global_step": 367545, "epoch": 2187} {"train_loss": -9.270187377929688, "global_step": 367546, "epoch": 2187} {"train_loss": -11.255716323852539, "global_step": 367547, "epoch": 2187} {"train_loss": -10.399542808532715, "global_step": 367548, "epoch": 2187} {"train_loss": -9.93155288696289, "global_step": 367549, "epoch": 2187} {"train_loss": -10.771675109863281, "global_step": 367550, "epoch": 2187} {"train_loss": -10.212018013000488, "global_step": 367551, "epoch": 2187} {"train_loss": -10.356229782104492, "global_step": 367552, "epoch": 2187} {"train_loss": -11.171605110168457, "global_step": 367553, "epoch": 2187} {"train_loss": -10.988271713256836, "global_step": 367554, "epoch": 2187} {"train_loss": -10.738768577575684, "global_step": 367555, "epoch": 2187} {"train_loss": -11.26518440246582, "global_step": 367556, "epoch": 2187} {"train_loss": -10.796159744262695, "global_step": 367557, "epoch": 2187} {"train_loss": -11.081851959228516, "global_step": 367558, "epoch": 2187} {"train_loss": -11.541897773742676, "global_step": 367559, "epoch": 2187} {"train_loss": -11.514200210571289, "global_step": 367560, "epoch": 2187} {"train_loss": -11.31027603149414, "global_step": 367561, "epoch": 2187} {"train_loss": -11.865157127380371, "global_step": 367562, "epoch": 2187} {"train_loss": -11.818666458129883, "global_step": 367563, "epoch": 2187} {"train_loss": -11.769665718078613, "global_step": 367564, "epoch": 2187} {"train_loss": -11.950615882873535, "global_step": 367565, "epoch": 2187} {"train_loss": -11.996847152709961, "global_step": 367566, "epoch": 2187} {"train_loss": -11.975730895996094, "global_step": 367567, "epoch": 2187} {"train_loss": -12.001091003417969, "global_step": 367568, "epoch": 2187} {"train_loss": -11.99337100982666, "global_step": 367569, "epoch": 2187} {"train_loss": -12.096704483032227, "global_step": 367570, "epoch": 2187} {"train_loss": -11.909627914428711, "global_step": 367571, "epoch": 2187} {"train_loss": -12.162176132202148, "global_step": 367572, "epoch": 2187} {"train_loss": -12.183116912841797, "global_step": 367573, "epoch": 2187} {"train_loss": -12.166975021362305, "global_step": 367574, "epoch": 2187} {"train_loss": -12.026829719543457, "global_step": 367575, "epoch": 2187} {"train_loss": -12.261016845703125, "global_step": 367576, "epoch": 2187} {"train_loss": -12.334280967712402, "global_step": 367577, "epoch": 2187} {"train_loss": -12.125110626220703, "global_step": 367578, "epoch": 2187} {"train_loss": -12.227373123168945, "global_step": 367579, "epoch": 2187} {"train_loss": -12.346435546875, "global_step": 367580, "epoch": 2187} {"train_loss": -12.09000301361084, "global_step": 367581, "epoch": 2187} {"train_loss": -12.15873908996582, "global_step": 367582, "epoch": 2187} {"train_loss": -11.73153471379053, "global_step": 367583, "epoch": 2187, "val_loss": 290359.78125} {"train_loss": -12.326410293579102, "global_step": 367584, "epoch": 2188} {"train_loss": -12.260705947875977, "global_step": 367585, "epoch": 2188} {"train_loss": -12.279706954956055, "global_step": 367586, "epoch": 2188} {"train_loss": -12.31033706665039, "global_step": 367587, "epoch": 2188} {"train_loss": -12.276906967163086, "global_step": 367588, "epoch": 2188} {"train_loss": -12.23164176940918, "global_step": 367589, "epoch": 2188} {"train_loss": -12.305660247802734, "global_step": 367590, "epoch": 2188} {"train_loss": -12.181817054748535, "global_step": 367591, "epoch": 2188} {"train_loss": -12.248659133911133, "global_step": 367592, "epoch": 2188} {"train_loss": -12.436721801757812, "global_step": 367593, "epoch": 2188} {"train_loss": -12.326441764831543, "global_step": 367594, "epoch": 2188} {"train_loss": -12.280566215515137, "global_step": 367595, "epoch": 2188} {"train_loss": -12.188531875610352, "global_step": 367596, "epoch": 2188} {"train_loss": -12.412025451660156, "global_step": 367597, "epoch": 2188} {"train_loss": -12.212471961975098, "global_step": 367598, "epoch": 2188} {"train_loss": -12.26345443725586, "global_step": 367599, "epoch": 2188} {"train_loss": -12.54146957397461, "global_step": 367600, "epoch": 2188} {"train_loss": -12.362907409667969, "global_step": 367601, "epoch": 2188} {"train_loss": -12.332425117492676, "global_step": 367602, "epoch": 2188} {"train_loss": -12.428248405456543, "global_step": 367603, "epoch": 2188} {"train_loss": -12.605659484863281, "global_step": 367604, "epoch": 2188} {"train_loss": -12.524019241333008, "global_step": 367605, "epoch": 2188} {"train_loss": -12.49337387084961, "global_step": 367606, "epoch": 2188} {"train_loss": -12.49814510345459, "global_step": 367607, "epoch": 2188} {"train_loss": -12.569110870361328, "global_step": 367608, "epoch": 2188} {"train_loss": -12.676506996154785, "global_step": 367609, "epoch": 2188} {"train_loss": -12.353032112121582, "global_step": 367610, "epoch": 2188} {"train_loss": -12.478926658630371, "global_step": 367611, "epoch": 2188} {"train_loss": -12.464860916137695, "global_step": 367612, "epoch": 2188} {"train_loss": -12.454565048217773, "global_step": 367613, "epoch": 2188} {"train_loss": -12.451475143432617, "global_step": 367614, "epoch": 2188} {"train_loss": -12.54922103881836, "global_step": 367615, "epoch": 2188} {"train_loss": -12.539594650268555, "global_step": 367616, "epoch": 2188} {"train_loss": -12.550183296203613, "global_step": 367617, "epoch": 2188} {"train_loss": -12.537266731262207, "global_step": 367618, "epoch": 2188} {"train_loss": -12.305383682250977, "global_step": 367619, "epoch": 2188} {"train_loss": -12.601119995117188, "global_step": 367620, "epoch": 2188} {"train_loss": -12.305986404418945, "global_step": 367621, "epoch": 2188} {"train_loss": -12.552078247070312, "global_step": 367622, "epoch": 2188} {"train_loss": -12.319517135620117, "global_step": 367623, "epoch": 2188} {"train_loss": -12.441574096679688, "global_step": 367624, "epoch": 2188} {"train_loss": -12.51530647277832, "global_step": 367625, "epoch": 2188} {"train_loss": -12.517500877380371, "global_step": 367626, "epoch": 2188} {"train_loss": -12.672820091247559, "global_step": 367627, "epoch": 2188} {"train_loss": -12.709443092346191, "global_step": 367628, "epoch": 2188} {"train_loss": -12.506998062133789, "global_step": 367629, "epoch": 2188} {"train_loss": -12.535294532775879, "global_step": 367630, "epoch": 2188} {"train_loss": -12.44880485534668, "global_step": 367631, "epoch": 2188} {"train_loss": -12.694695472717285, "global_step": 367632, "epoch": 2188} {"train_loss": -12.5787353515625, "global_step": 367633, "epoch": 2188} {"train_loss": -12.036510467529297, "global_step": 367634, "epoch": 2188} {"train_loss": -12.035467147827148, "global_step": 367635, "epoch": 2188} {"train_loss": -12.485112190246582, "global_step": 367636, "epoch": 2188} {"train_loss": -12.428853988647461, "global_step": 367637, "epoch": 2188} {"train_loss": -11.90790843963623, "global_step": 367638, "epoch": 2188} {"train_loss": -12.11235237121582, "global_step": 367639, "epoch": 2188} {"train_loss": -12.0007905960083, "global_step": 367640, "epoch": 2188} {"train_loss": -12.259533882141113, "global_step": 367641, "epoch": 2188} {"train_loss": -12.536943435668945, "global_step": 367642, "epoch": 2188} {"train_loss": -12.15067195892334, "global_step": 367643, "epoch": 2188} {"train_loss": -12.163249969482422, "global_step": 367644, "epoch": 2188} {"train_loss": -11.268277168273926, "global_step": 367645, "epoch": 2188} {"train_loss": -12.075236320495605, "global_step": 367646, "epoch": 2188} {"train_loss": -11.79092025756836, "global_step": 367647, "epoch": 2188} {"train_loss": -12.417072296142578, "global_step": 367648, "epoch": 2188} {"train_loss": -11.631563186645508, "global_step": 367649, "epoch": 2188} {"train_loss": -12.318732261657715, "global_step": 367650, "epoch": 2188} {"train_loss": -11.840075492858887, "global_step": 367651, "epoch": 2188} {"train_loss": -12.426563262939453, "global_step": 367652, "epoch": 2188} {"train_loss": -12.241844177246094, "global_step": 367653, "epoch": 2188} {"train_loss": -11.741798400878906, "global_step": 367654, "epoch": 2188} {"train_loss": -12.252960205078125, "global_step": 367655, "epoch": 2188} {"train_loss": -12.32048225402832, "global_step": 367656, "epoch": 2188} {"train_loss": -11.546859741210938, "global_step": 367657, "epoch": 2188} {"train_loss": -11.36590576171875, "global_step": 367658, "epoch": 2188} {"train_loss": -12.324077606201172, "global_step": 367659, "epoch": 2188} {"train_loss": -12.229698181152344, "global_step": 367660, "epoch": 2188} {"train_loss": -11.139585494995117, "global_step": 367661, "epoch": 2188} {"train_loss": -11.768899917602539, "global_step": 367662, "epoch": 2188} {"train_loss": -12.613323211669922, "global_step": 367663, "epoch": 2188} {"train_loss": -11.372068405151367, "global_step": 367664, "epoch": 2188} {"train_loss": -11.383172988891602, "global_step": 367665, "epoch": 2188} {"train_loss": -12.071643829345703, "global_step": 367666, "epoch": 2188} {"train_loss": -12.058282852172852, "global_step": 367667, "epoch": 2188} {"train_loss": -12.41396713256836, "global_step": 367668, "epoch": 2188} {"train_loss": -12.267230033874512, "global_step": 367669, "epoch": 2188} {"train_loss": -12.519265174865723, "global_step": 367670, "epoch": 2188} {"train_loss": -12.768766403198242, "global_step": 367671, "epoch": 2188} {"train_loss": -12.205848693847656, "global_step": 367672, "epoch": 2188} {"train_loss": -12.193007469177246, "global_step": 367673, "epoch": 2188} {"train_loss": -12.489822387695312, "global_step": 367674, "epoch": 2188} {"train_loss": -12.386292457580566, "global_step": 367675, "epoch": 2188} {"train_loss": -12.57853889465332, "global_step": 367676, "epoch": 2188} {"train_loss": -12.615848541259766, "global_step": 367677, "epoch": 2188} {"train_loss": -12.64176082611084, "global_step": 367678, "epoch": 2188} {"train_loss": -12.49470329284668, "global_step": 367679, "epoch": 2188} {"train_loss": -12.564573287963867, "global_step": 367680, "epoch": 2188} {"train_loss": -12.429006576538086, "global_step": 367681, "epoch": 2188} {"train_loss": -12.381404876708984, "global_step": 367682, "epoch": 2188} {"train_loss": -12.310009956359863, "global_step": 367683, "epoch": 2188} {"train_loss": -12.572135925292969, "global_step": 367684, "epoch": 2188} {"train_loss": -12.532407760620117, "global_step": 367685, "epoch": 2188} {"train_loss": -12.358131408691406, "global_step": 367686, "epoch": 2188} {"train_loss": -12.631936073303223, "global_step": 367687, "epoch": 2188} {"train_loss": -12.422308921813965, "global_step": 367688, "epoch": 2188} {"train_loss": -12.216696739196777, "global_step": 367689, "epoch": 2188} {"train_loss": -12.602931022644043, "global_step": 367690, "epoch": 2188} {"train_loss": -12.041476249694824, "global_step": 367691, "epoch": 2188} {"train_loss": -12.109869956970215, "global_step": 367692, "epoch": 2188} {"train_loss": -12.242046356201172, "global_step": 367693, "epoch": 2188} {"train_loss": -11.872102737426758, "global_step": 367694, "epoch": 2188} {"train_loss": -12.080739974975586, "global_step": 367695, "epoch": 2188} {"train_loss": -11.542119979858398, "global_step": 367696, "epoch": 2188} {"train_loss": -11.492269515991211, "global_step": 367697, "epoch": 2188} {"train_loss": -12.421159744262695, "global_step": 367698, "epoch": 2188} {"train_loss": -11.704816818237305, "global_step": 367699, "epoch": 2188} {"train_loss": -11.370030403137207, "global_step": 367700, "epoch": 2188} {"train_loss": -12.191585540771484, "global_step": 367701, "epoch": 2188} {"train_loss": -11.925445556640625, "global_step": 367702, "epoch": 2188} {"train_loss": -11.507194519042969, "global_step": 367703, "epoch": 2188} {"train_loss": -11.895546913146973, "global_step": 367704, "epoch": 2188} {"train_loss": -11.312093734741211, "global_step": 367705, "epoch": 2188} {"train_loss": -11.38111686706543, "global_step": 367706, "epoch": 2188} {"train_loss": -12.36091423034668, "global_step": 367707, "epoch": 2188} {"train_loss": -11.369610786437988, "global_step": 367708, "epoch": 2188} {"train_loss": -12.20968246459961, "global_step": 367709, "epoch": 2188} {"train_loss": -11.745890617370605, "global_step": 367710, "epoch": 2188} {"train_loss": -11.369667053222656, "global_step": 367711, "epoch": 2188} {"train_loss": -11.787252426147461, "global_step": 367712, "epoch": 2188} {"train_loss": -11.202396392822266, "global_step": 367713, "epoch": 2188} {"train_loss": -11.260960578918457, "global_step": 367714, "epoch": 2188} {"train_loss": -9.793315887451172, "global_step": 367715, "epoch": 2188} {"train_loss": -10.124394416809082, "global_step": 367716, "epoch": 2188} {"train_loss": -11.34535026550293, "global_step": 367717, "epoch": 2188} {"train_loss": -11.40523624420166, "global_step": 367718, "epoch": 2188} {"train_loss": -11.007568359375, "global_step": 367719, "epoch": 2188} {"train_loss": -11.281007766723633, "global_step": 367720, "epoch": 2188} {"train_loss": -11.467992782592773, "global_step": 367721, "epoch": 2188} {"train_loss": -11.573863983154297, "global_step": 367722, "epoch": 2188} {"train_loss": -11.688859939575195, "global_step": 367723, "epoch": 2188} {"train_loss": -11.149296760559082, "global_step": 367724, "epoch": 2188} {"train_loss": -11.584221839904785, "global_step": 367725, "epoch": 2188} {"train_loss": -11.651187896728516, "global_step": 367726, "epoch": 2188} {"train_loss": -11.482980728149414, "global_step": 367727, "epoch": 2188} {"train_loss": -12.263667106628418, "global_step": 367728, "epoch": 2188} {"train_loss": -11.691951751708984, "global_step": 367729, "epoch": 2188} {"train_loss": -11.899700164794922, "global_step": 367730, "epoch": 2188} {"train_loss": -11.710220336914062, "global_step": 367731, "epoch": 2188} {"train_loss": -11.966163635253906, "global_step": 367732, "epoch": 2188} {"train_loss": -12.49547290802002, "global_step": 367733, "epoch": 2188} {"train_loss": -11.691761016845703, "global_step": 367734, "epoch": 2188} {"train_loss": -11.86975383758545, "global_step": 367735, "epoch": 2188} {"train_loss": -11.952960968017578, "global_step": 367736, "epoch": 2188} {"train_loss": -11.702856063842773, "global_step": 367737, "epoch": 2188} {"train_loss": -12.142091751098633, "global_step": 367738, "epoch": 2188} {"train_loss": -12.007457733154297, "global_step": 367739, "epoch": 2188} {"train_loss": -12.26226806640625, "global_step": 367740, "epoch": 2188} {"train_loss": -12.272086143493652, "global_step": 367741, "epoch": 2188} {"train_loss": -11.806242942810059, "global_step": 367742, "epoch": 2188} {"train_loss": -12.132296562194824, "global_step": 367743, "epoch": 2188} {"train_loss": -12.334711074829102, "global_step": 367744, "epoch": 2188} {"train_loss": -12.136682510375977, "global_step": 367745, "epoch": 2188} {"train_loss": -12.471189498901367, "global_step": 367746, "epoch": 2188} {"train_loss": -12.233871459960938, "global_step": 367747, "epoch": 2188} {"train_loss": -11.894561767578125, "global_step": 367748, "epoch": 2188} {"train_loss": -12.550816535949707, "global_step": 367749, "epoch": 2188} {"train_loss": -12.36073112487793, "global_step": 367750, "epoch": 2188} {"train_loss": -12.10590142295474, "global_step": 367751, "epoch": 2188, "val_loss": 291840.875} {"train_loss": -12.120647430419922, "global_step": 367752, "epoch": 2189} {"train_loss": -12.244953155517578, "global_step": 367753, "epoch": 2189} {"train_loss": -11.977994918823242, "global_step": 367754, "epoch": 2189} {"train_loss": -12.200151443481445, "global_step": 367755, "epoch": 2189} {"train_loss": -12.535446166992188, "global_step": 367756, "epoch": 2189} {"train_loss": -12.221776962280273, "global_step": 367757, "epoch": 2189} {"train_loss": -12.482194900512695, "global_step": 367758, "epoch": 2189} {"train_loss": -12.607943534851074, "global_step": 367759, "epoch": 2189} {"train_loss": -12.441049575805664, "global_step": 367760, "epoch": 2189} {"train_loss": -12.341856002807617, "global_step": 367761, "epoch": 2189} {"train_loss": -12.361175537109375, "global_step": 367762, "epoch": 2189} {"train_loss": -12.224557876586914, "global_step": 367763, "epoch": 2189} {"train_loss": -12.24229621887207, "global_step": 367764, "epoch": 2189} {"train_loss": -12.4008207321167, "global_step": 367765, "epoch": 2189} {"train_loss": -12.478311538696289, "global_step": 367766, "epoch": 2189} {"train_loss": -12.526166915893555, "global_step": 367767, "epoch": 2189} {"train_loss": -12.618067741394043, "global_step": 367768, "epoch": 2189} {"train_loss": -12.250615119934082, "global_step": 367769, "epoch": 2189} {"train_loss": -12.496240615844727, "global_step": 367770, "epoch": 2189} {"train_loss": -11.934171676635742, "global_step": 367771, "epoch": 2189} {"train_loss": -12.54604434967041, "global_step": 367772, "epoch": 2189} {"train_loss": -12.008281707763672, "global_step": 367773, "epoch": 2189} {"train_loss": -12.449254035949707, "global_step": 367774, "epoch": 2189} {"train_loss": -12.457576751708984, "global_step": 367775, "epoch": 2189} {"train_loss": -12.267712593078613, "global_step": 367776, "epoch": 2189} {"train_loss": -12.513714790344238, "global_step": 367777, "epoch": 2189} {"train_loss": -12.399153709411621, "global_step": 367778, "epoch": 2189} {"train_loss": -12.480196952819824, "global_step": 367779, "epoch": 2189} {"train_loss": -12.092018127441406, "global_step": 367780, "epoch": 2189} {"train_loss": -12.549043655395508, "global_step": 367781, "epoch": 2189} {"train_loss": -12.091851234436035, "global_step": 367782, "epoch": 2189} {"train_loss": -11.88125991821289, "global_step": 367783, "epoch": 2189} {"train_loss": -12.597423553466797, "global_step": 367784, "epoch": 2189} {"train_loss": -12.151609420776367, "global_step": 367785, "epoch": 2189} {"train_loss": -12.344893455505371, "global_step": 367786, "epoch": 2189} {"train_loss": -12.175138473510742, "global_step": 367787, "epoch": 2189} {"train_loss": -12.142024040222168, "global_step": 367788, "epoch": 2189} {"train_loss": -12.479350090026855, "global_step": 367789, "epoch": 2189} {"train_loss": -12.144594192504883, "global_step": 367790, "epoch": 2189} {"train_loss": -11.787208557128906, "global_step": 367791, "epoch": 2189} {"train_loss": -12.344850540161133, "global_step": 367792, "epoch": 2189} {"train_loss": -11.620272636413574, "global_step": 367793, "epoch": 2189} {"train_loss": -12.158981323242188, "global_step": 367794, "epoch": 2189} {"train_loss": -12.143243789672852, "global_step": 367795, "epoch": 2189} {"train_loss": -12.432526588439941, "global_step": 367796, "epoch": 2189} {"train_loss": -12.486265182495117, "global_step": 367797, "epoch": 2189} {"train_loss": -12.302045822143555, "global_step": 367798, "epoch": 2189} {"train_loss": -12.539676666259766, "global_step": 367799, "epoch": 2189} {"train_loss": -12.424004554748535, "global_step": 367800, "epoch": 2189} {"train_loss": -12.341322898864746, "global_step": 367801, "epoch": 2189} {"train_loss": -12.609033584594727, "global_step": 367802, "epoch": 2189} {"train_loss": -12.07455825805664, "global_step": 367803, "epoch": 2189} {"train_loss": -12.237049102783203, "global_step": 367804, "epoch": 2189} {"train_loss": -12.019010543823242, "global_step": 367805, "epoch": 2189} {"train_loss": -12.55703067779541, "global_step": 367806, "epoch": 2189} {"train_loss": -11.972562789916992, "global_step": 367807, "epoch": 2189} {"train_loss": -11.707724571228027, "global_step": 367808, "epoch": 2189} {"train_loss": -11.98829460144043, "global_step": 367809, "epoch": 2189} {"train_loss": -12.512998580932617, "global_step": 367810, "epoch": 2189} {"train_loss": -11.758705139160156, "global_step": 367811, "epoch": 2189} {"train_loss": -11.243095397949219, "global_step": 367812, "epoch": 2189} {"train_loss": -11.813316345214844, "global_step": 367813, "epoch": 2189} {"train_loss": -12.202981948852539, "global_step": 367814, "epoch": 2189} {"train_loss": -11.79042911529541, "global_step": 367815, "epoch": 2189} {"train_loss": -12.578243255615234, "global_step": 367816, "epoch": 2189} {"train_loss": -11.510113716125488, "global_step": 367817, "epoch": 2189} {"train_loss": -11.73983097076416, "global_step": 367818, "epoch": 2189} {"train_loss": -11.763103485107422, "global_step": 367819, "epoch": 2189} {"train_loss": -12.161948204040527, "global_step": 367820, "epoch": 2189} {"train_loss": -12.156721115112305, "global_step": 367821, "epoch": 2189} {"train_loss": -12.580005645751953, "global_step": 367822, "epoch": 2189} {"train_loss": -12.17074966430664, "global_step": 367823, "epoch": 2189} {"train_loss": -12.300174713134766, "global_step": 367824, "epoch": 2189} {"train_loss": -11.919235229492188, "global_step": 367825, "epoch": 2189} {"train_loss": -12.381851196289062, "global_step": 367826, "epoch": 2189} {"train_loss": -12.060319900512695, "global_step": 367827, "epoch": 2189} {"train_loss": -12.274826049804688, "global_step": 367828, "epoch": 2189} {"train_loss": -11.752196311950684, "global_step": 367829, "epoch": 2189} {"train_loss": -12.579573631286621, "global_step": 367830, "epoch": 2189} {"train_loss": -12.2566556930542, "global_step": 367831, "epoch": 2189} {"train_loss": -11.841085433959961, "global_step": 367832, "epoch": 2189} {"train_loss": -12.020947456359863, "global_step": 367833, "epoch": 2189} {"train_loss": -12.153369903564453, "global_step": 367834, "epoch": 2189} {"train_loss": -12.239535331726074, "global_step": 367835, "epoch": 2189} {"train_loss": -12.66523551940918, "global_step": 367836, "epoch": 2189} {"train_loss": -12.32719612121582, "global_step": 367837, "epoch": 2189} {"train_loss": -11.89495849609375, "global_step": 367838, "epoch": 2189} {"train_loss": -12.34105110168457, "global_step": 367839, "epoch": 2189} {"train_loss": -12.089033126831055, "global_step": 367840, "epoch": 2189} {"train_loss": -12.219893455505371, "global_step": 367841, "epoch": 2189} {"train_loss": -12.184564590454102, "global_step": 367842, "epoch": 2189} {"train_loss": -11.640395164489746, "global_step": 367843, "epoch": 2189} {"train_loss": -11.874130249023438, "global_step": 367844, "epoch": 2189} {"train_loss": -12.4202880859375, "global_step": 367845, "epoch": 2189} {"train_loss": -11.60986328125, "global_step": 367846, "epoch": 2189} {"train_loss": -11.586771011352539, "global_step": 367847, "epoch": 2189} {"train_loss": -12.459674835205078, "global_step": 367848, "epoch": 2189} {"train_loss": -11.889459609985352, "global_step": 367849, "epoch": 2189} {"train_loss": -12.310606956481934, "global_step": 367850, "epoch": 2189} {"train_loss": -12.200849533081055, "global_step": 367851, "epoch": 2189} {"train_loss": -12.027680397033691, "global_step": 367852, "epoch": 2189} {"train_loss": -11.97197151184082, "global_step": 367853, "epoch": 2189} {"train_loss": -12.077014923095703, "global_step": 367854, "epoch": 2189} {"train_loss": -12.178160667419434, "global_step": 367855, "epoch": 2189} {"train_loss": -11.676883697509766, "global_step": 367856, "epoch": 2189} {"train_loss": -12.032360076904297, "global_step": 367857, "epoch": 2189} {"train_loss": -11.782705307006836, "global_step": 367858, "epoch": 2189} {"train_loss": -12.100616455078125, "global_step": 367859, "epoch": 2189} {"train_loss": -11.926384925842285, "global_step": 367860, "epoch": 2189} {"train_loss": -12.222829818725586, "global_step": 367861, "epoch": 2189} {"train_loss": -11.678720474243164, "global_step": 367862, "epoch": 2189} {"train_loss": -12.539772033691406, "global_step": 367863, "epoch": 2189} {"train_loss": -11.922584533691406, "global_step": 367864, "epoch": 2189} {"train_loss": -12.044187545776367, "global_step": 367865, "epoch": 2189} {"train_loss": -12.513141632080078, "global_step": 367866, "epoch": 2189} {"train_loss": -11.870681762695312, "global_step": 367867, "epoch": 2189} {"train_loss": -11.641705513000488, "global_step": 367868, "epoch": 2189} {"train_loss": -12.59692096710205, "global_step": 367869, "epoch": 2189} {"train_loss": -12.113500595092773, "global_step": 367870, "epoch": 2189} {"train_loss": -11.770700454711914, "global_step": 367871, "epoch": 2189} {"train_loss": -12.325135231018066, "global_step": 367872, "epoch": 2189} {"train_loss": -12.393372535705566, "global_step": 367873, "epoch": 2189} {"train_loss": -12.359983444213867, "global_step": 367874, "epoch": 2189} {"train_loss": -12.36416244506836, "global_step": 367875, "epoch": 2189} {"train_loss": -12.325847625732422, "global_step": 367876, "epoch": 2189} {"train_loss": -12.609682083129883, "global_step": 367877, "epoch": 2189} {"train_loss": -12.0784912109375, "global_step": 367878, "epoch": 2189} {"train_loss": -12.360885620117188, "global_step": 367879, "epoch": 2189} {"train_loss": -12.18455696105957, "global_step": 367880, "epoch": 2189} {"train_loss": -12.106611251831055, "global_step": 367881, "epoch": 2189} {"train_loss": -12.064312934875488, "global_step": 367882, "epoch": 2189} {"train_loss": -12.288751602172852, "global_step": 367883, "epoch": 2189} {"train_loss": -12.106616973876953, "global_step": 367884, "epoch": 2189} {"train_loss": -12.408988952636719, "global_step": 367885, "epoch": 2189} {"train_loss": -11.989952087402344, "global_step": 367886, "epoch": 2189} {"train_loss": -12.097797393798828, "global_step": 367887, "epoch": 2189} {"train_loss": -11.07177734375, "global_step": 367888, "epoch": 2189} {"train_loss": -11.162248611450195, "global_step": 367889, "epoch": 2189} {"train_loss": -11.201370239257812, "global_step": 367890, "epoch": 2189} {"train_loss": -8.743412017822266, "global_step": 367891, "epoch": 2189} {"train_loss": -10.794791221618652, "global_step": 367892, "epoch": 2189} {"train_loss": -7.944435119628906, "global_step": 367893, "epoch": 2189} {"train_loss": -10.389542579650879, "global_step": 367894, "epoch": 2189} {"train_loss": -8.960115432739258, "global_step": 367895, "epoch": 2189} {"train_loss": -10.916361808776855, "global_step": 367896, "epoch": 2189} {"train_loss": -10.595560073852539, "global_step": 367897, "epoch": 2189} {"train_loss": -10.855926513671875, "global_step": 367898, "epoch": 2189} {"train_loss": -11.564186096191406, "global_step": 367899, "epoch": 2189} {"train_loss": -10.829353332519531, "global_step": 367900, "epoch": 2189} {"train_loss": -11.798284530639648, "global_step": 367901, "epoch": 2189} {"train_loss": -11.231696128845215, "global_step": 367902, "epoch": 2189} {"train_loss": -11.224831581115723, "global_step": 367903, "epoch": 2189} {"train_loss": -11.581808090209961, "global_step": 367904, "epoch": 2189} {"train_loss": -11.406417846679688, "global_step": 367905, "epoch": 2189} {"train_loss": -11.874433517456055, "global_step": 367906, "epoch": 2189} {"train_loss": -11.514852523803711, "global_step": 367907, "epoch": 2189} {"train_loss": -11.765948295593262, "global_step": 367908, "epoch": 2189} {"train_loss": -10.676580429077148, "global_step": 367909, "epoch": 2189} {"train_loss": -11.382745742797852, "global_step": 367910, "epoch": 2189} {"train_loss": -11.31578540802002, "global_step": 367911, "epoch": 2189} {"train_loss": -10.68799877166748, "global_step": 367912, "epoch": 2189} {"train_loss": -12.041261672973633, "global_step": 367913, "epoch": 2189} {"train_loss": -11.141798973083496, "global_step": 367914, "epoch": 2189} {"train_loss": -11.476670265197754, "global_step": 367915, "epoch": 2189} {"train_loss": -11.621264457702637, "global_step": 367916, "epoch": 2189} {"train_loss": -11.180158615112305, "global_step": 367917, "epoch": 2189} {"train_loss": -11.85421371459961, "global_step": 367918, "epoch": 2189} {"train_loss": -11.958283969334193, "global_step": 367919, "epoch": 2189, "val_loss": 286411.15625} {"train_loss": -11.796955108642578, "global_step": 367920, "epoch": 2190} {"train_loss": -12.083688735961914, "global_step": 367921, "epoch": 2190} {"train_loss": -11.539204597473145, "global_step": 367922, "epoch": 2190} {"train_loss": -11.94402027130127, "global_step": 367923, "epoch": 2190} {"train_loss": -12.1720609664917, "global_step": 367924, "epoch": 2190} {"train_loss": -11.8314790725708, "global_step": 367925, "epoch": 2190} {"train_loss": -12.026433944702148, "global_step": 367926, "epoch": 2190} {"train_loss": -11.648384094238281, "global_step": 367927, "epoch": 2190} {"train_loss": -12.257593154907227, "global_step": 367928, "epoch": 2190} {"train_loss": -11.98739242553711, "global_step": 367929, "epoch": 2190} {"train_loss": -11.793327331542969, "global_step": 367930, "epoch": 2190} {"train_loss": -11.895301818847656, "global_step": 367931, "epoch": 2190} {"train_loss": -12.071747779846191, "global_step": 367932, "epoch": 2190} {"train_loss": -12.020669937133789, "global_step": 367933, "epoch": 2190} {"train_loss": -12.204549789428711, "global_step": 367934, "epoch": 2190} {"train_loss": -11.83115005493164, "global_step": 367935, "epoch": 2190} {"train_loss": -12.226821899414062, "global_step": 367936, "epoch": 2190} {"train_loss": -12.089353561401367, "global_step": 367937, "epoch": 2190} {"train_loss": -12.259069442749023, "global_step": 367938, "epoch": 2190} {"train_loss": -12.391056060791016, "global_step": 367939, "epoch": 2190} {"train_loss": -12.264984130859375, "global_step": 367940, "epoch": 2190} {"train_loss": -12.305267333984375, "global_step": 367941, "epoch": 2190} {"train_loss": -12.347332000732422, "global_step": 367942, "epoch": 2190} {"train_loss": -12.340373992919922, "global_step": 367943, "epoch": 2190} {"train_loss": -12.31103515625, "global_step": 367944, "epoch": 2190} {"train_loss": -12.288948059082031, "global_step": 367945, "epoch": 2190} {"train_loss": -12.124723434448242, "global_step": 367946, "epoch": 2190} {"train_loss": -12.317157745361328, "global_step": 367947, "epoch": 2190} {"train_loss": -12.206287384033203, "global_step": 367948, "epoch": 2190} {"train_loss": -12.087453842163086, "global_step": 367949, "epoch": 2190} {"train_loss": -12.177118301391602, "global_step": 367950, "epoch": 2190} {"train_loss": -12.455493927001953, "global_step": 367951, "epoch": 2190} {"train_loss": -12.130411148071289, "global_step": 367952, "epoch": 2190} {"train_loss": -12.4801025390625, "global_step": 367953, "epoch": 2190} {"train_loss": -12.392793655395508, "global_step": 367954, "epoch": 2190} {"train_loss": -12.37989616394043, "global_step": 367955, "epoch": 2190} {"train_loss": -12.215150833129883, "global_step": 367956, "epoch": 2190} {"train_loss": -12.458005905151367, "global_step": 367957, "epoch": 2190} {"train_loss": -12.22596263885498, "global_step": 367958, "epoch": 2190} {"train_loss": -12.19057846069336, "global_step": 367959, "epoch": 2190} {"train_loss": -12.433813095092773, "global_step": 367960, "epoch": 2190} {"train_loss": -11.678520202636719, "global_step": 367961, "epoch": 2190} {"train_loss": -12.16513442993164, "global_step": 367962, "epoch": 2190} {"train_loss": -11.527458190917969, "global_step": 367963, "epoch": 2190} {"train_loss": -12.435919761657715, "global_step": 367964, "epoch": 2190} {"train_loss": -11.929703712463379, "global_step": 367965, "epoch": 2190} {"train_loss": -12.534000396728516, "global_step": 367966, "epoch": 2190} {"train_loss": -11.997003555297852, "global_step": 367967, "epoch": 2190} {"train_loss": -12.026196479797363, "global_step": 367968, "epoch": 2190} {"train_loss": -12.066544532775879, "global_step": 367969, "epoch": 2190} {"train_loss": -11.896018028259277, "global_step": 367970, "epoch": 2190} {"train_loss": -11.601659774780273, "global_step": 367971, "epoch": 2190} {"train_loss": -11.757965087890625, "global_step": 367972, "epoch": 2190} {"train_loss": -11.06007194519043, "global_step": 367973, "epoch": 2190} {"train_loss": -11.336498260498047, "global_step": 367974, "epoch": 2190} {"train_loss": -11.86772632598877, "global_step": 367975, "epoch": 2190} {"train_loss": -10.518267631530762, "global_step": 367976, "epoch": 2190} {"train_loss": -11.914790153503418, "global_step": 367977, "epoch": 2190} {"train_loss": -10.93734359741211, "global_step": 367978, "epoch": 2190} {"train_loss": -12.309427261352539, "global_step": 367979, "epoch": 2190} {"train_loss": -11.117205619812012, "global_step": 367980, "epoch": 2190} {"train_loss": -12.26310920715332, "global_step": 367981, "epoch": 2190} {"train_loss": -11.96092700958252, "global_step": 367982, "epoch": 2190} {"train_loss": -12.23068618774414, "global_step": 367983, "epoch": 2190} {"train_loss": -11.978937149047852, "global_step": 367984, "epoch": 2190} {"train_loss": -12.157841682434082, "global_step": 367985, "epoch": 2190} {"train_loss": -12.051087379455566, "global_step": 367986, "epoch": 2190} {"train_loss": -12.360621452331543, "global_step": 367987, "epoch": 2190} {"train_loss": -12.187423706054688, "global_step": 367988, "epoch": 2190} {"train_loss": -12.089082717895508, "global_step": 367989, "epoch": 2190} {"train_loss": -12.588788986206055, "global_step": 367990, "epoch": 2190} {"train_loss": -12.383880615234375, "global_step": 367991, "epoch": 2190} {"train_loss": -12.211938858032227, "global_step": 367992, "epoch": 2190} {"train_loss": -12.346784591674805, "global_step": 367993, "epoch": 2190} {"train_loss": -12.077007293701172, "global_step": 367994, "epoch": 2190} {"train_loss": -12.074869155883789, "global_step": 367995, "epoch": 2190} {"train_loss": -12.040264129638672, "global_step": 367996, "epoch": 2190} {"train_loss": -12.33833122253418, "global_step": 367997, "epoch": 2190} {"train_loss": -12.137735366821289, "global_step": 367998, "epoch": 2190} {"train_loss": -12.182943344116211, "global_step": 367999, "epoch": 2190} {"train_loss": -12.45517349243164, "global_step": 368000, "epoch": 2190} {"train_loss": -12.064599990844727, "global_step": 368001, "epoch": 2190} {"train_loss": -12.34568977355957, "global_step": 368002, "epoch": 2190} {"train_loss": -12.557971954345703, "global_step": 368003, "epoch": 2190} {"train_loss": -12.33315658569336, "global_step": 368004, "epoch": 2190} {"train_loss": -12.617110252380371, "global_step": 368005, "epoch": 2190} {"train_loss": -12.34085464477539, "global_step": 368006, "epoch": 2190} {"train_loss": -12.350664138793945, "global_step": 368007, "epoch": 2190} {"train_loss": -12.273097038269043, "global_step": 368008, "epoch": 2190} {"train_loss": -12.708551406860352, "global_step": 368009, "epoch": 2190} {"train_loss": -12.437211036682129, "global_step": 368010, "epoch": 2190} {"train_loss": -12.656479835510254, "global_step": 368011, "epoch": 2190} {"train_loss": -12.528739929199219, "global_step": 368012, "epoch": 2190} {"train_loss": -12.666208267211914, "global_step": 368013, "epoch": 2190} {"train_loss": -12.486001968383789, "global_step": 368014, "epoch": 2190} {"train_loss": -12.30396842956543, "global_step": 368015, "epoch": 2190} {"train_loss": -12.320352554321289, "global_step": 368016, "epoch": 2190} {"train_loss": -12.275413513183594, "global_step": 368017, "epoch": 2190} {"train_loss": -12.581405639648438, "global_step": 368018, "epoch": 2190} {"train_loss": -12.606760025024414, "global_step": 368019, "epoch": 2190} {"train_loss": -12.783377647399902, "global_step": 368020, "epoch": 2190} {"train_loss": -12.497825622558594, "global_step": 368021, "epoch": 2190} {"train_loss": -12.4720458984375, "global_step": 368022, "epoch": 2190} {"train_loss": -12.671012878417969, "global_step": 368023, "epoch": 2190} {"train_loss": -12.19394588470459, "global_step": 368024, "epoch": 2190} {"train_loss": -12.470252990722656, "global_step": 368025, "epoch": 2190} {"train_loss": -12.61833381652832, "global_step": 368026, "epoch": 2190} {"train_loss": -12.485174179077148, "global_step": 368027, "epoch": 2190} {"train_loss": -12.77978515625, "global_step": 368028, "epoch": 2190} {"train_loss": -12.584209442138672, "global_step": 368029, "epoch": 2190} {"train_loss": -12.327025413513184, "global_step": 368030, "epoch": 2190} {"train_loss": -12.719432830810547, "global_step": 368031, "epoch": 2190} {"train_loss": -12.674285888671875, "global_step": 368032, "epoch": 2190} {"train_loss": -12.40188980102539, "global_step": 368033, "epoch": 2190} {"train_loss": -12.733381271362305, "global_step": 368034, "epoch": 2190} {"train_loss": -12.340530395507812, "global_step": 368035, "epoch": 2190} {"train_loss": -12.549848556518555, "global_step": 368036, "epoch": 2190} {"train_loss": -12.373071670532227, "global_step": 368037, "epoch": 2190} {"train_loss": -12.493980407714844, "global_step": 368038, "epoch": 2190} {"train_loss": -12.56651782989502, "global_step": 368039, "epoch": 2190} {"train_loss": -12.186683654785156, "global_step": 368040, "epoch": 2190} {"train_loss": -11.968339920043945, "global_step": 368041, "epoch": 2190} {"train_loss": -12.464010238647461, "global_step": 368042, "epoch": 2190} {"train_loss": -12.28498363494873, "global_step": 368043, "epoch": 2190} {"train_loss": -12.326577186584473, "global_step": 368044, "epoch": 2190} {"train_loss": -12.36291217803955, "global_step": 368045, "epoch": 2190} {"train_loss": -12.748926162719727, "global_step": 368046, "epoch": 2190} {"train_loss": -12.657743453979492, "global_step": 368047, "epoch": 2190} {"train_loss": -12.445292472839355, "global_step": 368048, "epoch": 2190} {"train_loss": -12.772823333740234, "global_step": 368049, "epoch": 2190} {"train_loss": -12.644903182983398, "global_step": 368050, "epoch": 2190} {"train_loss": -12.0853271484375, "global_step": 368051, "epoch": 2190} {"train_loss": -12.543092727661133, "global_step": 368052, "epoch": 2190} {"train_loss": -12.516668319702148, "global_step": 368053, "epoch": 2190} {"train_loss": -12.437442779541016, "global_step": 368054, "epoch": 2190} {"train_loss": -12.524496078491211, "global_step": 368055, "epoch": 2190} {"train_loss": -12.30662727355957, "global_step": 368056, "epoch": 2190} {"train_loss": -12.3458833694458, "global_step": 368057, "epoch": 2190} {"train_loss": -12.249818801879883, "global_step": 368058, "epoch": 2190} {"train_loss": -12.11185073852539, "global_step": 368059, "epoch": 2190} {"train_loss": -12.209335327148438, "global_step": 368060, "epoch": 2190} {"train_loss": -11.855218887329102, "global_step": 368061, "epoch": 2190} {"train_loss": -11.686288833618164, "global_step": 368062, "epoch": 2190} {"train_loss": -11.280402183532715, "global_step": 368063, "epoch": 2190} {"train_loss": -11.924120903015137, "global_step": 368064, "epoch": 2190} {"train_loss": -12.482368469238281, "global_step": 368065, "epoch": 2190} {"train_loss": -12.226579666137695, "global_step": 368066, "epoch": 2190} {"train_loss": -11.26248550415039, "global_step": 368067, "epoch": 2190} {"train_loss": -11.329878807067871, "global_step": 368068, "epoch": 2190} {"train_loss": -11.79348373413086, "global_step": 368069, "epoch": 2190} {"train_loss": -12.104558944702148, "global_step": 368070, "epoch": 2190} {"train_loss": -12.376165390014648, "global_step": 368071, "epoch": 2190} {"train_loss": -11.78632926940918, "global_step": 368072, "epoch": 2190} {"train_loss": -11.991506576538086, "global_step": 368073, "epoch": 2190} {"train_loss": -11.838634490966797, "global_step": 368074, "epoch": 2190} {"train_loss": -12.10219955444336, "global_step": 368075, "epoch": 2190} {"train_loss": -11.243735313415527, "global_step": 368076, "epoch": 2190} {"train_loss": -12.164413452148438, "global_step": 368077, "epoch": 2190} {"train_loss": -11.329742431640625, "global_step": 368078, "epoch": 2190} {"train_loss": -12.135279655456543, "global_step": 368079, "epoch": 2190} {"train_loss": -11.499593734741211, "global_step": 368080, "epoch": 2190} {"train_loss": -11.789199829101562, "global_step": 368081, "epoch": 2190} {"train_loss": -11.510649681091309, "global_step": 368082, "epoch": 2190} {"train_loss": -12.232576370239258, "global_step": 368083, "epoch": 2190} {"train_loss": -11.97412109375, "global_step": 368084, "epoch": 2190} {"train_loss": -12.193559646606445, "global_step": 368085, "epoch": 2190} {"train_loss": -12.120285987854004, "global_step": 368086, "epoch": 2190} {"train_loss": -12.168552165939694, "global_step": 368087, "epoch": 2190, "val_loss": 291822.53125, "train_action_mse_error": 0.2861745357513428} {"train_loss": -10.37114143371582, "global_step": 368088, "epoch": 2191} {"train_loss": -10.56100845336914, "global_step": 368089, "epoch": 2191} {"train_loss": -11.337764739990234, "global_step": 368090, "epoch": 2191} {"train_loss": -10.677419662475586, "global_step": 368091, "epoch": 2191} {"train_loss": -10.179347038269043, "global_step": 368092, "epoch": 2191} {"train_loss": -9.612753868103027, "global_step": 368093, "epoch": 2191} {"train_loss": -11.230085372924805, "global_step": 368094, "epoch": 2191} {"train_loss": -10.688529968261719, "global_step": 368095, "epoch": 2191} {"train_loss": -10.890464782714844, "global_step": 368096, "epoch": 2191} {"train_loss": -10.561125755310059, "global_step": 368097, "epoch": 2191} {"train_loss": -10.656435012817383, "global_step": 368098, "epoch": 2191} {"train_loss": -10.311092376708984, "global_step": 368099, "epoch": 2191} {"train_loss": -10.949090957641602, "global_step": 368100, "epoch": 2191} {"train_loss": -10.958735466003418, "global_step": 368101, "epoch": 2191} {"train_loss": -11.766698837280273, "global_step": 368102, "epoch": 2191} {"train_loss": -11.059417724609375, "global_step": 368103, "epoch": 2191} {"train_loss": -10.933791160583496, "global_step": 368104, "epoch": 2191} {"train_loss": -11.143106460571289, "global_step": 368105, "epoch": 2191} {"train_loss": -10.68348503112793, "global_step": 368106, "epoch": 2191} {"train_loss": -9.81159496307373, "global_step": 368107, "epoch": 2191} {"train_loss": -10.73487663269043, "global_step": 368108, "epoch": 2191} {"train_loss": -11.450240135192871, "global_step": 368109, "epoch": 2191} {"train_loss": -9.590332984924316, "global_step": 368110, "epoch": 2191} {"train_loss": -10.371809005737305, "global_step": 368111, "epoch": 2191} {"train_loss": -10.961392402648926, "global_step": 368112, "epoch": 2191} {"train_loss": -9.952656745910645, "global_step": 368113, "epoch": 2191} {"train_loss": -11.249881744384766, "global_step": 368114, "epoch": 2191} {"train_loss": -10.419322967529297, "global_step": 368115, "epoch": 2191} {"train_loss": -10.554614067077637, "global_step": 368116, "epoch": 2191} {"train_loss": -11.432077407836914, "global_step": 368117, "epoch": 2191} {"train_loss": -11.196602821350098, "global_step": 368118, "epoch": 2191} {"train_loss": -10.589008331298828, "global_step": 368119, "epoch": 2191} {"train_loss": -11.501582145690918, "global_step": 368120, "epoch": 2191} {"train_loss": -10.986282348632812, "global_step": 368121, "epoch": 2191} {"train_loss": -12.085041046142578, "global_step": 368122, "epoch": 2191} {"train_loss": -11.501208305358887, "global_step": 368123, "epoch": 2191} {"train_loss": -11.34416389465332, "global_step": 368124, "epoch": 2191} {"train_loss": -11.792160987854004, "global_step": 368125, "epoch": 2191} {"train_loss": -11.029032707214355, "global_step": 368126, "epoch": 2191} {"train_loss": -11.516372680664062, "global_step": 368127, "epoch": 2191} {"train_loss": -11.49996280670166, "global_step": 368128, "epoch": 2191} {"train_loss": -11.32773208618164, "global_step": 368129, "epoch": 2191} {"train_loss": -12.266488075256348, "global_step": 368130, "epoch": 2191} {"train_loss": -11.758528709411621, "global_step": 368131, "epoch": 2191} {"train_loss": -11.38329792022705, "global_step": 368132, "epoch": 2191} {"train_loss": -11.87318229675293, "global_step": 368133, "epoch": 2191} {"train_loss": -11.718755722045898, "global_step": 368134, "epoch": 2191} {"train_loss": -11.78441047668457, "global_step": 368135, "epoch": 2191} {"train_loss": -12.136974334716797, "global_step": 368136, "epoch": 2191} {"train_loss": -11.936681747436523, "global_step": 368137, "epoch": 2191} {"train_loss": -11.993173599243164, "global_step": 368138, "epoch": 2191} {"train_loss": -12.21875, "global_step": 368139, "epoch": 2191} {"train_loss": -11.983221054077148, "global_step": 368140, "epoch": 2191} {"train_loss": -12.119709014892578, "global_step": 368141, "epoch": 2191} {"train_loss": -12.027901649475098, "global_step": 368142, "epoch": 2191} {"train_loss": -11.886632919311523, "global_step": 368143, "epoch": 2191} {"train_loss": -12.17755126953125, "global_step": 368144, "epoch": 2191} {"train_loss": -12.154991149902344, "global_step": 368145, "epoch": 2191} {"train_loss": -12.094125747680664, "global_step": 368146, "epoch": 2191} {"train_loss": -11.965277671813965, "global_step": 368147, "epoch": 2191} {"train_loss": -12.285852432250977, "global_step": 368148, "epoch": 2191} {"train_loss": -11.864194869995117, "global_step": 368149, "epoch": 2191} {"train_loss": -12.110764503479004, "global_step": 368150, "epoch": 2191} {"train_loss": -12.167898178100586, "global_step": 368151, "epoch": 2191} {"train_loss": -11.969295501708984, "global_step": 368152, "epoch": 2191} {"train_loss": -12.10151481628418, "global_step": 368153, "epoch": 2191} {"train_loss": -12.054868698120117, "global_step": 368154, "epoch": 2191} {"train_loss": -12.337691307067871, "global_step": 368155, "epoch": 2191} {"train_loss": -12.42529582977295, "global_step": 368156, "epoch": 2191} {"train_loss": -12.529562950134277, "global_step": 368157, "epoch": 2191} {"train_loss": -12.387535095214844, "global_step": 368158, "epoch": 2191} {"train_loss": -12.45921802520752, "global_step": 368159, "epoch": 2191} {"train_loss": -12.444055557250977, "global_step": 368160, "epoch": 2191} {"train_loss": -12.310592651367188, "global_step": 368161, "epoch": 2191} {"train_loss": -12.33513355255127, "global_step": 368162, "epoch": 2191} {"train_loss": -12.202102661132812, "global_step": 368163, "epoch": 2191} {"train_loss": -12.405309677124023, "global_step": 368164, "epoch": 2191} {"train_loss": -12.214425086975098, "global_step": 368165, "epoch": 2191} {"train_loss": -12.29666805267334, "global_step": 368166, "epoch": 2191} {"train_loss": -12.09011459350586, "global_step": 368167, "epoch": 2191} {"train_loss": -12.354801177978516, "global_step": 368168, "epoch": 2191} {"train_loss": -12.177109718322754, "global_step": 368169, "epoch": 2191} {"train_loss": -12.671655654907227, "global_step": 368170, "epoch": 2191} {"train_loss": -12.180573463439941, "global_step": 368171, "epoch": 2191} {"train_loss": -12.558150291442871, "global_step": 368172, "epoch": 2191} {"train_loss": -12.338030815124512, "global_step": 368173, "epoch": 2191} {"train_loss": -12.337081909179688, "global_step": 368174, "epoch": 2191} {"train_loss": -12.49169921875, "global_step": 368175, "epoch": 2191} {"train_loss": -12.199146270751953, "global_step": 368176, "epoch": 2191} {"train_loss": -12.456080436706543, "global_step": 368177, "epoch": 2191} {"train_loss": -12.2371826171875, "global_step": 368178, "epoch": 2191} {"train_loss": -12.369200706481934, "global_step": 368179, "epoch": 2191} {"train_loss": -12.402894020080566, "global_step": 368180, "epoch": 2191} {"train_loss": -12.334592819213867, "global_step": 368181, "epoch": 2191} {"train_loss": -12.326576232910156, "global_step": 368182, "epoch": 2191} {"train_loss": -12.296940803527832, "global_step": 368183, "epoch": 2191} {"train_loss": -12.535648345947266, "global_step": 368184, "epoch": 2191} {"train_loss": -12.76777172088623, "global_step": 368185, "epoch": 2191} {"train_loss": -12.476299285888672, "global_step": 368186, "epoch": 2191} {"train_loss": -12.758330345153809, "global_step": 368187, "epoch": 2191} {"train_loss": -12.72288703918457, "global_step": 368188, "epoch": 2191} {"train_loss": -12.560500144958496, "global_step": 368189, "epoch": 2191} {"train_loss": -12.606205940246582, "global_step": 368190, "epoch": 2191} {"train_loss": -12.434142112731934, "global_step": 368191, "epoch": 2191} {"train_loss": -12.654800415039062, "global_step": 368192, "epoch": 2191} {"train_loss": -12.62082290649414, "global_step": 368193, "epoch": 2191} {"train_loss": -12.588004112243652, "global_step": 368194, "epoch": 2191} {"train_loss": -12.496295928955078, "global_step": 368195, "epoch": 2191} {"train_loss": -12.767598152160645, "global_step": 368196, "epoch": 2191} {"train_loss": -12.744306564331055, "global_step": 368197, "epoch": 2191} {"train_loss": -12.758779525756836, "global_step": 368198, "epoch": 2191} {"train_loss": -12.512262344360352, "global_step": 368199, "epoch": 2191} {"train_loss": -12.42005729675293, "global_step": 368200, "epoch": 2191} {"train_loss": -12.466974258422852, "global_step": 368201, "epoch": 2191} {"train_loss": -12.548430442810059, "global_step": 368202, "epoch": 2191} {"train_loss": -12.20093059539795, "global_step": 368203, "epoch": 2191} {"train_loss": -11.697893142700195, "global_step": 368204, "epoch": 2191} {"train_loss": -12.518564224243164, "global_step": 368205, "epoch": 2191} {"train_loss": -12.624902725219727, "global_step": 368206, "epoch": 2191} {"train_loss": -11.827634811401367, "global_step": 368207, "epoch": 2191} {"train_loss": -11.618772506713867, "global_step": 368208, "epoch": 2191} {"train_loss": -12.26414966583252, "global_step": 368209, "epoch": 2191} {"train_loss": -11.957548141479492, "global_step": 368210, "epoch": 2191} {"train_loss": -11.210936546325684, "global_step": 368211, "epoch": 2191} {"train_loss": -12.503002166748047, "global_step": 368212, "epoch": 2191} {"train_loss": -12.373456954956055, "global_step": 368213, "epoch": 2191} {"train_loss": -12.200218200683594, "global_step": 368214, "epoch": 2191} {"train_loss": -12.275602340698242, "global_step": 368215, "epoch": 2191} {"train_loss": -12.329357147216797, "global_step": 368216, "epoch": 2191} {"train_loss": -12.700850486755371, "global_step": 368217, "epoch": 2191} {"train_loss": -12.578001022338867, "global_step": 368218, "epoch": 2191} {"train_loss": -12.234859466552734, "global_step": 368219, "epoch": 2191} {"train_loss": -11.93752670288086, "global_step": 368220, "epoch": 2191} {"train_loss": -11.842741966247559, "global_step": 368221, "epoch": 2191} {"train_loss": -11.890813827514648, "global_step": 368222, "epoch": 2191} {"train_loss": -11.483759880065918, "global_step": 368223, "epoch": 2191} {"train_loss": -9.543237686157227, "global_step": 368224, "epoch": 2191} {"train_loss": -12.271924018859863, "global_step": 368225, "epoch": 2191} {"train_loss": -9.51285457611084, "global_step": 368226, "epoch": 2191} {"train_loss": -11.156360626220703, "global_step": 368227, "epoch": 2191} {"train_loss": -11.288983345031738, "global_step": 368228, "epoch": 2191} {"train_loss": -11.01418399810791, "global_step": 368229, "epoch": 2191} {"train_loss": -11.961148262023926, "global_step": 368230, "epoch": 2191} {"train_loss": -10.083993911743164, "global_step": 368231, "epoch": 2191} {"train_loss": -11.796723365783691, "global_step": 368232, "epoch": 2191} {"train_loss": -11.833678245544434, "global_step": 368233, "epoch": 2191} {"train_loss": -11.341981887817383, "global_step": 368234, "epoch": 2191} {"train_loss": -12.208908081054688, "global_step": 368235, "epoch": 2191} {"train_loss": -11.15626335144043, "global_step": 368236, "epoch": 2191} {"train_loss": -12.288156509399414, "global_step": 368237, "epoch": 2191} {"train_loss": -11.326465606689453, "global_step": 368238, "epoch": 2191} {"train_loss": -11.485062599182129, "global_step": 368239, "epoch": 2191} {"train_loss": -11.50058364868164, "global_step": 368240, "epoch": 2191} {"train_loss": -11.697701454162598, "global_step": 368241, "epoch": 2191} {"train_loss": -12.415521621704102, "global_step": 368242, "epoch": 2191} {"train_loss": -11.418960571289062, "global_step": 368243, "epoch": 2191} {"train_loss": -12.66849136352539, "global_step": 368244, "epoch": 2191} {"train_loss": -10.896475791931152, "global_step": 368245, "epoch": 2191} {"train_loss": -12.352706909179688, "global_step": 368246, "epoch": 2191} {"train_loss": -11.258955001831055, "global_step": 368247, "epoch": 2191} {"train_loss": -11.725189208984375, "global_step": 368248, "epoch": 2191} {"train_loss": -11.898155212402344, "global_step": 368249, "epoch": 2191} {"train_loss": -11.481529235839844, "global_step": 368250, "epoch": 2191} {"train_loss": -11.375237464904785, "global_step": 368251, "epoch": 2191} {"train_loss": -11.61384391784668, "global_step": 368252, "epoch": 2191} {"train_loss": -11.567358016967773, "global_step": 368253, "epoch": 2191} {"train_loss": -11.743816375732422, "global_step": 368254, "epoch": 2191} {"train_loss": -11.768191797392708, "global_step": 368255, "epoch": 2191, "val_loss": 290975.0625} {"train_loss": -11.994510650634766, "global_step": 368256, "epoch": 2192} {"train_loss": -11.532249450683594, "global_step": 368257, "epoch": 2192} {"train_loss": -11.952357292175293, "global_step": 368258, "epoch": 2192} {"train_loss": -11.852941513061523, "global_step": 368259, "epoch": 2192} {"train_loss": -12.223060607910156, "global_step": 368260, "epoch": 2192} {"train_loss": -11.9166259765625, "global_step": 368261, "epoch": 2192} {"train_loss": -12.2667875289917, "global_step": 368262, "epoch": 2192} {"train_loss": -12.293682098388672, "global_step": 368263, "epoch": 2192} {"train_loss": -11.842180252075195, "global_step": 368264, "epoch": 2192} {"train_loss": -12.304608345031738, "global_step": 368265, "epoch": 2192} {"train_loss": -11.514062881469727, "global_step": 368266, "epoch": 2192} {"train_loss": -12.079150199890137, "global_step": 368267, "epoch": 2192} {"train_loss": -11.7120943069458, "global_step": 368268, "epoch": 2192} {"train_loss": -12.249279975891113, "global_step": 368269, "epoch": 2192} {"train_loss": -12.148563385009766, "global_step": 368270, "epoch": 2192} {"train_loss": -12.502692222595215, "global_step": 368271, "epoch": 2192} {"train_loss": -12.068452835083008, "global_step": 368272, "epoch": 2192} {"train_loss": -12.17247200012207, "global_step": 368273, "epoch": 2192} {"train_loss": -12.21623706817627, "global_step": 368274, "epoch": 2192} {"train_loss": -12.219751358032227, "global_step": 368275, "epoch": 2192} {"train_loss": -12.183329582214355, "global_step": 368276, "epoch": 2192} {"train_loss": -12.106636047363281, "global_step": 368277, "epoch": 2192} {"train_loss": -12.322936058044434, "global_step": 368278, "epoch": 2192} {"train_loss": -12.195531845092773, "global_step": 368279, "epoch": 2192} {"train_loss": -12.39513874053955, "global_step": 368280, "epoch": 2192} {"train_loss": -12.324722290039062, "global_step": 368281, "epoch": 2192} {"train_loss": -12.448781967163086, "global_step": 368282, "epoch": 2192} {"train_loss": -12.36883544921875, "global_step": 368283, "epoch": 2192} {"train_loss": -12.564138412475586, "global_step": 368284, "epoch": 2192} {"train_loss": -12.194975852966309, "global_step": 368285, "epoch": 2192} {"train_loss": -12.707660675048828, "global_step": 368286, "epoch": 2192} {"train_loss": -12.413074493408203, "global_step": 368287, "epoch": 2192} {"train_loss": -12.65695571899414, "global_step": 368288, "epoch": 2192} {"train_loss": -12.22439956665039, "global_step": 368289, "epoch": 2192} {"train_loss": -12.478374481201172, "global_step": 368290, "epoch": 2192} {"train_loss": -12.381185531616211, "global_step": 368291, "epoch": 2192} {"train_loss": -12.299964904785156, "global_step": 368292, "epoch": 2192} {"train_loss": -12.552595138549805, "global_step": 368293, "epoch": 2192} {"train_loss": -12.322547912597656, "global_step": 368294, "epoch": 2192} {"train_loss": -12.41679573059082, "global_step": 368295, "epoch": 2192} {"train_loss": -12.470834732055664, "global_step": 368296, "epoch": 2192} {"train_loss": -12.65192699432373, "global_step": 368297, "epoch": 2192} {"train_loss": -12.7991943359375, "global_step": 368298, "epoch": 2192} {"train_loss": -12.492402076721191, "global_step": 368299, "epoch": 2192} {"train_loss": -12.456740379333496, "global_step": 368300, "epoch": 2192} {"train_loss": -12.595107078552246, "global_step": 368301, "epoch": 2192} {"train_loss": -12.61557674407959, "global_step": 368302, "epoch": 2192} {"train_loss": -12.567129135131836, "global_step": 368303, "epoch": 2192} {"train_loss": -12.529829978942871, "global_step": 368304, "epoch": 2192} {"train_loss": -12.660087585449219, "global_step": 368305, "epoch": 2192} {"train_loss": -12.6976900100708, "global_step": 368306, "epoch": 2192} {"train_loss": -12.482295036315918, "global_step": 368307, "epoch": 2192} {"train_loss": -12.510690689086914, "global_step": 368308, "epoch": 2192} {"train_loss": -12.527345657348633, "global_step": 368309, "epoch": 2192} {"train_loss": -12.74233627319336, "global_step": 368310, "epoch": 2192} {"train_loss": -12.759855270385742, "global_step": 368311, "epoch": 2192} {"train_loss": -12.838160514831543, "global_step": 368312, "epoch": 2192} {"train_loss": -12.577912330627441, "global_step": 368313, "epoch": 2192} {"train_loss": -12.72274398803711, "global_step": 368314, "epoch": 2192} {"train_loss": -12.83876895904541, "global_step": 368315, "epoch": 2192} {"train_loss": -12.88204288482666, "global_step": 368316, "epoch": 2192} {"train_loss": -12.769088745117188, "global_step": 368317, "epoch": 2192} {"train_loss": -12.552923202514648, "global_step": 368318, "epoch": 2192} {"train_loss": -12.5496244430542, "global_step": 368319, "epoch": 2192} {"train_loss": -12.778995513916016, "global_step": 368320, "epoch": 2192} {"train_loss": -12.813650131225586, "global_step": 368321, "epoch": 2192} {"train_loss": -12.386177062988281, "global_step": 368322, "epoch": 2192} {"train_loss": -12.857633590698242, "global_step": 368323, "epoch": 2192} {"train_loss": -12.621891975402832, "global_step": 368324, "epoch": 2192} {"train_loss": -12.567354202270508, "global_step": 368325, "epoch": 2192} {"train_loss": -12.722517013549805, "global_step": 368326, "epoch": 2192} {"train_loss": -12.535776138305664, "global_step": 368327, "epoch": 2192} {"train_loss": -12.697492599487305, "global_step": 368328, "epoch": 2192} {"train_loss": -12.357537269592285, "global_step": 368329, "epoch": 2192} {"train_loss": -11.583597183227539, "global_step": 368330, "epoch": 2192} {"train_loss": -11.954989433288574, "global_step": 368331, "epoch": 2192} {"train_loss": -12.353662490844727, "global_step": 368332, "epoch": 2192} {"train_loss": -12.567488670349121, "global_step": 368333, "epoch": 2192} {"train_loss": -11.68568229675293, "global_step": 368334, "epoch": 2192} {"train_loss": -10.319568634033203, "global_step": 368335, "epoch": 2192} {"train_loss": -9.37521743774414, "global_step": 368336, "epoch": 2192} {"train_loss": -9.549234390258789, "global_step": 368337, "epoch": 2192} {"train_loss": -11.102840423583984, "global_step": 368338, "epoch": 2192} {"train_loss": -8.357126235961914, "global_step": 368339, "epoch": 2192} {"train_loss": -10.372538566589355, "global_step": 368340, "epoch": 2192} {"train_loss": -6.1968817710876465, "global_step": 368341, "epoch": 2192} {"train_loss": -6.618971824645996, "global_step": 368342, "epoch": 2192} {"train_loss": -6.436018943786621, "global_step": 368343, "epoch": 2192} {"train_loss": -6.75606632232666, "global_step": 368344, "epoch": 2192} {"train_loss": -6.551146030426025, "global_step": 368345, "epoch": 2192} {"train_loss": -6.2455549240112305, "global_step": 368346, "epoch": 2192} {"train_loss": -5.978545188903809, "global_step": 368347, "epoch": 2192} {"train_loss": -6.390915870666504, "global_step": 368348, "epoch": 2192} {"train_loss": -5.966680526733398, "global_step": 368349, "epoch": 2192} {"train_loss": -5.904106140136719, "global_step": 368350, "epoch": 2192} {"train_loss": -6.435843467712402, "global_step": 368351, "epoch": 2192} {"train_loss": -6.621652603149414, "global_step": 368352, "epoch": 2192} {"train_loss": -6.879261493682861, "global_step": 368353, "epoch": 2192} {"train_loss": -6.3129167556762695, "global_step": 368354, "epoch": 2192} {"train_loss": -6.104466915130615, "global_step": 368355, "epoch": 2192} {"train_loss": -6.228609561920166, "global_step": 368356, "epoch": 2192} {"train_loss": -6.8691816329956055, "global_step": 368357, "epoch": 2192} {"train_loss": -6.674395561218262, "global_step": 368358, "epoch": 2192} {"train_loss": -7.0989227294921875, "global_step": 368359, "epoch": 2192} {"train_loss": -6.949390888214111, "global_step": 368360, "epoch": 2192} {"train_loss": -7.238105773925781, "global_step": 368361, "epoch": 2192} {"train_loss": -7.2878804206848145, "global_step": 368362, "epoch": 2192} {"train_loss": -7.346235275268555, "global_step": 368363, "epoch": 2192} {"train_loss": -7.297240257263184, "global_step": 368364, "epoch": 2192} {"train_loss": -7.251924514770508, "global_step": 368365, "epoch": 2192} {"train_loss": -8.00623607635498, "global_step": 368366, "epoch": 2192} {"train_loss": -7.506028175354004, "global_step": 368367, "epoch": 2192} {"train_loss": -7.750451564788818, "global_step": 368368, "epoch": 2192} {"train_loss": -7.905857086181641, "global_step": 368369, "epoch": 2192} {"train_loss": -8.164705276489258, "global_step": 368370, "epoch": 2192} {"train_loss": -8.617898941040039, "global_step": 368371, "epoch": 2192} {"train_loss": -8.366353988647461, "global_step": 368372, "epoch": 2192} {"train_loss": -8.23608684539795, "global_step": 368373, "epoch": 2192} {"train_loss": -8.613298416137695, "global_step": 368374, "epoch": 2192} {"train_loss": -8.514055252075195, "global_step": 368375, "epoch": 2192} {"train_loss": -8.655433654785156, "global_step": 368376, "epoch": 2192} {"train_loss": -9.130728721618652, "global_step": 368377, "epoch": 2192} {"train_loss": -8.966426849365234, "global_step": 368378, "epoch": 2192} {"train_loss": -9.435001373291016, "global_step": 368379, "epoch": 2192} {"train_loss": -9.932403564453125, "global_step": 368380, "epoch": 2192} {"train_loss": -9.910028457641602, "global_step": 368381, "epoch": 2192} {"train_loss": -10.046669960021973, "global_step": 368382, "epoch": 2192} {"train_loss": -10.021793365478516, "global_step": 368383, "epoch": 2192} {"train_loss": -10.383529663085938, "global_step": 368384, "epoch": 2192} {"train_loss": -10.74245548248291, "global_step": 368385, "epoch": 2192} {"train_loss": -10.444276809692383, "global_step": 368386, "epoch": 2192} {"train_loss": -10.984970092773438, "global_step": 368387, "epoch": 2192} {"train_loss": -11.231679916381836, "global_step": 368388, "epoch": 2192} {"train_loss": -11.358748435974121, "global_step": 368389, "epoch": 2192} {"train_loss": -10.945646286010742, "global_step": 368390, "epoch": 2192} {"train_loss": -11.4480562210083, "global_step": 368391, "epoch": 2192} {"train_loss": -11.515348434448242, "global_step": 368392, "epoch": 2192} {"train_loss": -11.682282447814941, "global_step": 368393, "epoch": 2192} {"train_loss": -11.931327819824219, "global_step": 368394, "epoch": 2192} {"train_loss": -11.73666000366211, "global_step": 368395, "epoch": 2192} {"train_loss": -11.65108871459961, "global_step": 368396, "epoch": 2192} {"train_loss": -11.770891189575195, "global_step": 368397, "epoch": 2192} {"train_loss": -11.627050399780273, "global_step": 368398, "epoch": 2192} {"train_loss": -11.531400680541992, "global_step": 368399, "epoch": 2192} {"train_loss": -11.7630033493042, "global_step": 368400, "epoch": 2192} {"train_loss": -11.998340606689453, "global_step": 368401, "epoch": 2192} {"train_loss": -11.681495666503906, "global_step": 368402, "epoch": 2192} {"train_loss": -11.72941780090332, "global_step": 368403, "epoch": 2192} {"train_loss": -11.774011611938477, "global_step": 368404, "epoch": 2192} {"train_loss": -11.910728454589844, "global_step": 368405, "epoch": 2192} {"train_loss": -11.824319839477539, "global_step": 368406, "epoch": 2192} {"train_loss": -12.214471817016602, "global_step": 368407, "epoch": 2192} {"train_loss": -11.894014358520508, "global_step": 368408, "epoch": 2192} {"train_loss": -12.324060440063477, "global_step": 368409, "epoch": 2192} {"train_loss": -11.946395874023438, "global_step": 368410, "epoch": 2192} {"train_loss": -12.011805534362793, "global_step": 368411, "epoch": 2192} {"train_loss": -12.282122611999512, "global_step": 368412, "epoch": 2192} {"train_loss": -11.972572326660156, "global_step": 368413, "epoch": 2192} {"train_loss": -12.237167358398438, "global_step": 368414, "epoch": 2192} {"train_loss": -12.173074722290039, "global_step": 368415, "epoch": 2192} {"train_loss": -11.848466873168945, "global_step": 368416, "epoch": 2192} {"train_loss": -12.238771438598633, "global_step": 368417, "epoch": 2192} {"train_loss": -11.863134384155273, "global_step": 368418, "epoch": 2192} {"train_loss": -11.812387466430664, "global_step": 368419, "epoch": 2192} {"train_loss": -11.917661666870117, "global_step": 368420, "epoch": 2192} {"train_loss": -11.458614349365234, "global_step": 368421, "epoch": 2192} {"train_loss": -12.139995574951172, "global_step": 368422, "epoch": 2192} {"train_loss": -10.883510935874213, "global_step": 368423, "epoch": 2192, "val_loss": 292667.6875} {"train_loss": -11.57363510131836, "global_step": 368424, "epoch": 2193} {"train_loss": -11.012638092041016, "global_step": 368425, "epoch": 2193} {"train_loss": -11.27851390838623, "global_step": 368426, "epoch": 2193} {"train_loss": -11.627279281616211, "global_step": 368427, "epoch": 2193} {"train_loss": -11.020097732543945, "global_step": 368428, "epoch": 2193} {"train_loss": -11.99128246307373, "global_step": 368429, "epoch": 2193} {"train_loss": -10.954954147338867, "global_step": 368430, "epoch": 2193} {"train_loss": -11.399526596069336, "global_step": 368431, "epoch": 2193} {"train_loss": -11.030147552490234, "global_step": 368432, "epoch": 2193} {"train_loss": -11.319134712219238, "global_step": 368433, "epoch": 2193} {"train_loss": -10.810564041137695, "global_step": 368434, "epoch": 2193} {"train_loss": -12.24598217010498, "global_step": 368435, "epoch": 2193} {"train_loss": -10.812615394592285, "global_step": 368436, "epoch": 2193} {"train_loss": -11.971573829650879, "global_step": 368437, "epoch": 2193} {"train_loss": -11.505468368530273, "global_step": 368438, "epoch": 2193} {"train_loss": -11.220941543579102, "global_step": 368439, "epoch": 2193} {"train_loss": -11.887725830078125, "global_step": 368440, "epoch": 2193} {"train_loss": -11.314571380615234, "global_step": 368441, "epoch": 2193} {"train_loss": -11.58702564239502, "global_step": 368442, "epoch": 2193} {"train_loss": -11.479501724243164, "global_step": 368443, "epoch": 2193} {"train_loss": -11.311912536621094, "global_step": 368444, "epoch": 2193} {"train_loss": -11.67837142944336, "global_step": 368445, "epoch": 2193} {"train_loss": -11.415764808654785, "global_step": 368446, "epoch": 2193} {"train_loss": -11.99988079071045, "global_step": 368447, "epoch": 2193} {"train_loss": -11.719234466552734, "global_step": 368448, "epoch": 2193} {"train_loss": -11.083233833312988, "global_step": 368449, "epoch": 2193} {"train_loss": -11.908292770385742, "global_step": 368450, "epoch": 2193} {"train_loss": -11.704059600830078, "global_step": 368451, "epoch": 2193} {"train_loss": -10.547456741333008, "global_step": 368452, "epoch": 2193} {"train_loss": -12.207387924194336, "global_step": 368453, "epoch": 2193} {"train_loss": -10.77558708190918, "global_step": 368454, "epoch": 2193} {"train_loss": -12.114412307739258, "global_step": 368455, "epoch": 2193} {"train_loss": -11.02020263671875, "global_step": 368456, "epoch": 2193} {"train_loss": -11.587303161621094, "global_step": 368457, "epoch": 2193} {"train_loss": -11.834817886352539, "global_step": 368458, "epoch": 2193} {"train_loss": -11.794416427612305, "global_step": 368459, "epoch": 2193} {"train_loss": -11.901004791259766, "global_step": 368460, "epoch": 2193} {"train_loss": -12.184814453125, "global_step": 368461, "epoch": 2193} {"train_loss": -11.501258850097656, "global_step": 368462, "epoch": 2193} {"train_loss": -12.230998992919922, "global_step": 368463, "epoch": 2193} {"train_loss": -11.927023887634277, "global_step": 368464, "epoch": 2193} {"train_loss": -12.082674980163574, "global_step": 368465, "epoch": 2193} {"train_loss": -11.997797012329102, "global_step": 368466, "epoch": 2193} {"train_loss": -11.914579391479492, "global_step": 368467, "epoch": 2193} {"train_loss": -12.276451110839844, "global_step": 368468, "epoch": 2193} {"train_loss": -12.19112777709961, "global_step": 368469, "epoch": 2193} {"train_loss": -12.029057502746582, "global_step": 368470, "epoch": 2193} {"train_loss": -12.077422142028809, "global_step": 368471, "epoch": 2193} {"train_loss": -12.029706001281738, "global_step": 368472, "epoch": 2193} {"train_loss": -12.349775314331055, "global_step": 368473, "epoch": 2193} {"train_loss": -12.120227813720703, "global_step": 368474, "epoch": 2193} {"train_loss": -12.503116607666016, "global_step": 368475, "epoch": 2193} {"train_loss": -12.348600387573242, "global_step": 368476, "epoch": 2193} {"train_loss": -12.034958839416504, "global_step": 368477, "epoch": 2193} {"train_loss": -12.211461067199707, "global_step": 368478, "epoch": 2193} {"train_loss": -11.860177993774414, "global_step": 368479, "epoch": 2193} {"train_loss": -12.307823181152344, "global_step": 368480, "epoch": 2193} {"train_loss": -12.03888988494873, "global_step": 368481, "epoch": 2193} {"train_loss": -12.319231033325195, "global_step": 368482, "epoch": 2193} {"train_loss": -12.137649536132812, "global_step": 368483, "epoch": 2193} {"train_loss": -12.3009033203125, "global_step": 368484, "epoch": 2193} {"train_loss": -11.890809059143066, "global_step": 368485, "epoch": 2193} {"train_loss": -12.497844696044922, "global_step": 368486, "epoch": 2193} {"train_loss": -11.967947006225586, "global_step": 368487, "epoch": 2193} {"train_loss": -11.998828887939453, "global_step": 368488, "epoch": 2193} {"train_loss": -12.03335952758789, "global_step": 368489, "epoch": 2193} {"train_loss": -12.066474914550781, "global_step": 368490, "epoch": 2193} {"train_loss": -11.962907791137695, "global_step": 368491, "epoch": 2193} {"train_loss": -12.349117279052734, "global_step": 368492, "epoch": 2193} {"train_loss": -12.217997550964355, "global_step": 368493, "epoch": 2193} {"train_loss": -12.131063461303711, "global_step": 368494, "epoch": 2193} {"train_loss": -12.204048156738281, "global_step": 368495, "epoch": 2193} {"train_loss": -12.301068305969238, "global_step": 368496, "epoch": 2193} {"train_loss": -12.043302536010742, "global_step": 368497, "epoch": 2193} {"train_loss": -11.932853698730469, "global_step": 368498, "epoch": 2193} {"train_loss": -11.707098007202148, "global_step": 368499, "epoch": 2193} {"train_loss": -11.70649528503418, "global_step": 368500, "epoch": 2193} {"train_loss": -11.994452476501465, "global_step": 368501, "epoch": 2193} {"train_loss": -11.145817756652832, "global_step": 368502, "epoch": 2193} {"train_loss": -11.872519493103027, "global_step": 368503, "epoch": 2193} {"train_loss": -11.56429672241211, "global_step": 368504, "epoch": 2193} {"train_loss": -11.247180938720703, "global_step": 368505, "epoch": 2193} {"train_loss": -11.579803466796875, "global_step": 368506, "epoch": 2193} {"train_loss": -11.318647384643555, "global_step": 368507, "epoch": 2193} {"train_loss": -11.766782760620117, "global_step": 368508, "epoch": 2193} {"train_loss": -11.616865158081055, "global_step": 368509, "epoch": 2193} {"train_loss": -11.883329391479492, "global_step": 368510, "epoch": 2193} {"train_loss": -11.702230453491211, "global_step": 368511, "epoch": 2193} {"train_loss": -11.473054885864258, "global_step": 368512, "epoch": 2193} {"train_loss": -11.462163925170898, "global_step": 368513, "epoch": 2193} {"train_loss": -11.7041654586792, "global_step": 368514, "epoch": 2193} {"train_loss": -12.08664608001709, "global_step": 368515, "epoch": 2193} {"train_loss": -11.95152473449707, "global_step": 368516, "epoch": 2193} {"train_loss": -11.71781063079834, "global_step": 368517, "epoch": 2193} {"train_loss": -11.665538787841797, "global_step": 368518, "epoch": 2193} {"train_loss": -12.116382598876953, "global_step": 368519, "epoch": 2193} {"train_loss": -11.712963104248047, "global_step": 368520, "epoch": 2193} {"train_loss": -11.838130950927734, "global_step": 368521, "epoch": 2193} {"train_loss": -11.910605430603027, "global_step": 368522, "epoch": 2193} {"train_loss": -11.627037048339844, "global_step": 368523, "epoch": 2193} {"train_loss": -11.650001525878906, "global_step": 368524, "epoch": 2193} {"train_loss": -11.676399230957031, "global_step": 368525, "epoch": 2193} {"train_loss": -11.779803276062012, "global_step": 368526, "epoch": 2193} {"train_loss": -12.020756721496582, "global_step": 368527, "epoch": 2193} {"train_loss": -11.993074417114258, "global_step": 368528, "epoch": 2193} {"train_loss": -11.774110794067383, "global_step": 368529, "epoch": 2193} {"train_loss": -11.428956985473633, "global_step": 368530, "epoch": 2193} {"train_loss": -12.236379623413086, "global_step": 368531, "epoch": 2193} {"train_loss": -11.54463005065918, "global_step": 368532, "epoch": 2193} {"train_loss": -12.557334899902344, "global_step": 368533, "epoch": 2193} {"train_loss": -11.632580757141113, "global_step": 368534, "epoch": 2193} {"train_loss": -11.946531295776367, "global_step": 368535, "epoch": 2193} {"train_loss": -12.130010604858398, "global_step": 368536, "epoch": 2193} {"train_loss": -11.515792846679688, "global_step": 368537, "epoch": 2193} {"train_loss": -12.388314247131348, "global_step": 368538, "epoch": 2193} {"train_loss": -11.775233268737793, "global_step": 368539, "epoch": 2193} {"train_loss": -11.89240837097168, "global_step": 368540, "epoch": 2193} {"train_loss": -12.299039840698242, "global_step": 368541, "epoch": 2193} {"train_loss": -11.667766571044922, "global_step": 368542, "epoch": 2193} {"train_loss": -12.332195281982422, "global_step": 368543, "epoch": 2193} {"train_loss": -11.886234283447266, "global_step": 368544, "epoch": 2193} {"train_loss": -12.137287139892578, "global_step": 368545, "epoch": 2193} {"train_loss": -12.017595291137695, "global_step": 368546, "epoch": 2193} {"train_loss": -12.251484870910645, "global_step": 368547, "epoch": 2193} {"train_loss": -12.408320426940918, "global_step": 368548, "epoch": 2193} {"train_loss": -12.224581718444824, "global_step": 368549, "epoch": 2193} {"train_loss": -12.320430755615234, "global_step": 368550, "epoch": 2193} {"train_loss": -11.824714660644531, "global_step": 368551, "epoch": 2193} {"train_loss": -12.34325885772705, "global_step": 368552, "epoch": 2193} {"train_loss": -12.003898620605469, "global_step": 368553, "epoch": 2193} {"train_loss": -12.417795181274414, "global_step": 368554, "epoch": 2193} {"train_loss": -12.179712295532227, "global_step": 368555, "epoch": 2193} {"train_loss": -12.472517967224121, "global_step": 368556, "epoch": 2193} {"train_loss": -12.001619338989258, "global_step": 368557, "epoch": 2193} {"train_loss": -12.345285415649414, "global_step": 368558, "epoch": 2193} {"train_loss": -12.260416984558105, "global_step": 368559, "epoch": 2193} {"train_loss": -12.490013122558594, "global_step": 368560, "epoch": 2193} {"train_loss": -12.295632362365723, "global_step": 368561, "epoch": 2193} {"train_loss": -12.497030258178711, "global_step": 368562, "epoch": 2193} {"train_loss": -12.384162902832031, "global_step": 368563, "epoch": 2193} {"train_loss": -12.44327449798584, "global_step": 368564, "epoch": 2193} {"train_loss": -12.576576232910156, "global_step": 368565, "epoch": 2193} {"train_loss": -12.426596641540527, "global_step": 368566, "epoch": 2193} {"train_loss": -12.643918991088867, "global_step": 368567, "epoch": 2193} {"train_loss": -12.317649841308594, "global_step": 368568, "epoch": 2193} {"train_loss": -12.74047565460205, "global_step": 368569, "epoch": 2193} {"train_loss": -12.181035995483398, "global_step": 368570, "epoch": 2193} {"train_loss": -12.302149772644043, "global_step": 368571, "epoch": 2193} {"train_loss": -12.41014575958252, "global_step": 368572, "epoch": 2193} {"train_loss": -12.082744598388672, "global_step": 368573, "epoch": 2193} {"train_loss": -12.397579193115234, "global_step": 368574, "epoch": 2193} {"train_loss": -12.399927139282227, "global_step": 368575, "epoch": 2193} {"train_loss": -12.130295753479004, "global_step": 368576, "epoch": 2193} {"train_loss": -12.540643692016602, "global_step": 368577, "epoch": 2193} {"train_loss": -12.442740440368652, "global_step": 368578, "epoch": 2193} {"train_loss": -12.523932456970215, "global_step": 368579, "epoch": 2193} {"train_loss": -12.308723449707031, "global_step": 368580, "epoch": 2193} {"train_loss": -12.540729522705078, "global_step": 368581, "epoch": 2193} {"train_loss": -12.6068115234375, "global_step": 368582, "epoch": 2193} {"train_loss": -12.277300834655762, "global_step": 368583, "epoch": 2193} {"train_loss": -12.360883712768555, "global_step": 368584, "epoch": 2193} {"train_loss": -12.603791236877441, "global_step": 368585, "epoch": 2193} {"train_loss": -11.97694206237793, "global_step": 368586, "epoch": 2193} {"train_loss": -12.59262752532959, "global_step": 368587, "epoch": 2193} {"train_loss": -12.275733947753906, "global_step": 368588, "epoch": 2193} {"train_loss": -11.61034870147705, "global_step": 368589, "epoch": 2193} {"train_loss": -12.249099731445312, "global_step": 368590, "epoch": 2193} {"train_loss": -11.941969593365988, "global_step": 368591, "epoch": 2193, "val_loss": 294508.65625} {"train_loss": -11.34606647491455, "global_step": 368592, "epoch": 2194} {"train_loss": -12.555719375610352, "global_step": 368593, "epoch": 2194} {"train_loss": -11.933456420898438, "global_step": 368594, "epoch": 2194} {"train_loss": -12.25526237487793, "global_step": 368595, "epoch": 2194} {"train_loss": -12.534781455993652, "global_step": 368596, "epoch": 2194} {"train_loss": -12.174227714538574, "global_step": 368597, "epoch": 2194} {"train_loss": -12.454866409301758, "global_step": 368598, "epoch": 2194} {"train_loss": -12.397098541259766, "global_step": 368599, "epoch": 2194} {"train_loss": -12.537162780761719, "global_step": 368600, "epoch": 2194} {"train_loss": -12.626953125, "global_step": 368601, "epoch": 2194} {"train_loss": -12.521943092346191, "global_step": 368602, "epoch": 2194} {"train_loss": -12.489008903503418, "global_step": 368603, "epoch": 2194} {"train_loss": -12.504947662353516, "global_step": 368604, "epoch": 2194} {"train_loss": -12.469709396362305, "global_step": 368605, "epoch": 2194} {"train_loss": -12.56619644165039, "global_step": 368606, "epoch": 2194} {"train_loss": -12.433929443359375, "global_step": 368607, "epoch": 2194} {"train_loss": -12.573935508728027, "global_step": 368608, "epoch": 2194} {"train_loss": -12.326407432556152, "global_step": 368609, "epoch": 2194} {"train_loss": -12.422029495239258, "global_step": 368610, "epoch": 2194} {"train_loss": -12.483664512634277, "global_step": 368611, "epoch": 2194} {"train_loss": -12.15519905090332, "global_step": 368612, "epoch": 2194} {"train_loss": -11.825759887695312, "global_step": 368613, "epoch": 2194} {"train_loss": -12.140436172485352, "global_step": 368614, "epoch": 2194} {"train_loss": -12.147506713867188, "global_step": 368615, "epoch": 2194} {"train_loss": -12.000961303710938, "global_step": 368616, "epoch": 2194} {"train_loss": -12.527729034423828, "global_step": 368617, "epoch": 2194} {"train_loss": -12.549222946166992, "global_step": 368618, "epoch": 2194} {"train_loss": -11.874513626098633, "global_step": 368619, "epoch": 2194} {"train_loss": -11.700736999511719, "global_step": 368620, "epoch": 2194} {"train_loss": -12.30356502532959, "global_step": 368621, "epoch": 2194} {"train_loss": -12.339529991149902, "global_step": 368622, "epoch": 2194} {"train_loss": -12.076662063598633, "global_step": 368623, "epoch": 2194} {"train_loss": -12.122700691223145, "global_step": 368624, "epoch": 2194} {"train_loss": -12.58428955078125, "global_step": 368625, "epoch": 2194} {"train_loss": -12.490108489990234, "global_step": 368626, "epoch": 2194} {"train_loss": -12.258512496948242, "global_step": 368627, "epoch": 2194} {"train_loss": -12.430994987487793, "global_step": 368628, "epoch": 2194} {"train_loss": -12.036079406738281, "global_step": 368629, "epoch": 2194} {"train_loss": -11.726825714111328, "global_step": 368630, "epoch": 2194} {"train_loss": -12.333670616149902, "global_step": 368631, "epoch": 2194} {"train_loss": -11.717893600463867, "global_step": 368632, "epoch": 2194} {"train_loss": -12.037708282470703, "global_step": 368633, "epoch": 2194} {"train_loss": -12.023624420166016, "global_step": 368634, "epoch": 2194} {"train_loss": -11.856863021850586, "global_step": 368635, "epoch": 2194} {"train_loss": -11.767803192138672, "global_step": 368636, "epoch": 2194} {"train_loss": -10.56912899017334, "global_step": 368637, "epoch": 2194} {"train_loss": -12.400971412658691, "global_step": 368638, "epoch": 2194} {"train_loss": -10.84764575958252, "global_step": 368639, "epoch": 2194} {"train_loss": -11.71096134185791, "global_step": 368640, "epoch": 2194} {"train_loss": -12.097877502441406, "global_step": 368641, "epoch": 2194} {"train_loss": -11.910186767578125, "global_step": 368642, "epoch": 2194} {"train_loss": -11.74856185913086, "global_step": 368643, "epoch": 2194} {"train_loss": -12.398548126220703, "global_step": 368644, "epoch": 2194} {"train_loss": -11.762472152709961, "global_step": 368645, "epoch": 2194} {"train_loss": -12.092873573303223, "global_step": 368646, "epoch": 2194} {"train_loss": -11.968092918395996, "global_step": 368647, "epoch": 2194} {"train_loss": -11.880974769592285, "global_step": 368648, "epoch": 2194} {"train_loss": -12.029644966125488, "global_step": 368649, "epoch": 2194} {"train_loss": -12.254302978515625, "global_step": 368650, "epoch": 2194} {"train_loss": -11.13123607635498, "global_step": 368651, "epoch": 2194} {"train_loss": -11.909367561340332, "global_step": 368652, "epoch": 2194} {"train_loss": -11.811604499816895, "global_step": 368653, "epoch": 2194} {"train_loss": -11.377140998840332, "global_step": 368654, "epoch": 2194} {"train_loss": -11.787900924682617, "global_step": 368655, "epoch": 2194} {"train_loss": -11.145780563354492, "global_step": 368656, "epoch": 2194} {"train_loss": -10.608043670654297, "global_step": 368657, "epoch": 2194} {"train_loss": -11.281844139099121, "global_step": 368658, "epoch": 2194} {"train_loss": -10.281930923461914, "global_step": 368659, "epoch": 2194} {"train_loss": -10.74795913696289, "global_step": 368660, "epoch": 2194} {"train_loss": -11.179542541503906, "global_step": 368661, "epoch": 2194} {"train_loss": -11.560735702514648, "global_step": 368662, "epoch": 2194} {"train_loss": -10.336711883544922, "global_step": 368663, "epoch": 2194} {"train_loss": -11.384265899658203, "global_step": 368664, "epoch": 2194} {"train_loss": -11.609109878540039, "global_step": 368665, "epoch": 2194} {"train_loss": -10.439834594726562, "global_step": 368666, "epoch": 2194} {"train_loss": -11.553787231445312, "global_step": 368667, "epoch": 2194} {"train_loss": -11.628475189208984, "global_step": 368668, "epoch": 2194} {"train_loss": -10.958124160766602, "global_step": 368669, "epoch": 2194} {"train_loss": -11.803461074829102, "global_step": 368670, "epoch": 2194} {"train_loss": -11.321208000183105, "global_step": 368671, "epoch": 2194} {"train_loss": -11.681879997253418, "global_step": 368672, "epoch": 2194} {"train_loss": -11.416128158569336, "global_step": 368673, "epoch": 2194} {"train_loss": -10.772222518920898, "global_step": 368674, "epoch": 2194} {"train_loss": -11.440038681030273, "global_step": 368675, "epoch": 2194} {"train_loss": -11.528118133544922, "global_step": 368676, "epoch": 2194} {"train_loss": -10.788265228271484, "global_step": 368677, "epoch": 2194} {"train_loss": -11.668012619018555, "global_step": 368678, "epoch": 2194} {"train_loss": -11.172823905944824, "global_step": 368679, "epoch": 2194} {"train_loss": -10.535482406616211, "global_step": 368680, "epoch": 2194} {"train_loss": -9.801553726196289, "global_step": 368681, "epoch": 2194} {"train_loss": -10.37939739227295, "global_step": 368682, "epoch": 2194} {"train_loss": -11.032234191894531, "global_step": 368683, "epoch": 2194} {"train_loss": -10.705133438110352, "global_step": 368684, "epoch": 2194} {"train_loss": -10.801918029785156, "global_step": 368685, "epoch": 2194} {"train_loss": -10.915947914123535, "global_step": 368686, "epoch": 2194} {"train_loss": -11.841154098510742, "global_step": 368687, "epoch": 2194} {"train_loss": -10.28023910522461, "global_step": 368688, "epoch": 2194} {"train_loss": -11.582014083862305, "global_step": 368689, "epoch": 2194} {"train_loss": -11.011338233947754, "global_step": 368690, "epoch": 2194} {"train_loss": -10.936697006225586, "global_step": 368691, "epoch": 2194} {"train_loss": -11.063434600830078, "global_step": 368692, "epoch": 2194} {"train_loss": -9.04960823059082, "global_step": 368693, "epoch": 2194} {"train_loss": -10.793905258178711, "global_step": 368694, "epoch": 2194} {"train_loss": -9.825468063354492, "global_step": 368695, "epoch": 2194} {"train_loss": -10.025040626525879, "global_step": 368696, "epoch": 2194} {"train_loss": -9.93851089477539, "global_step": 368697, "epoch": 2194} {"train_loss": -10.574552536010742, "global_step": 368698, "epoch": 2194} {"train_loss": -10.067626953125, "global_step": 368699, "epoch": 2194} {"train_loss": -9.862431526184082, "global_step": 368700, "epoch": 2194} {"train_loss": -9.15462589263916, "global_step": 368701, "epoch": 2194} {"train_loss": -10.964763641357422, "global_step": 368702, "epoch": 2194} {"train_loss": -10.664997100830078, "global_step": 368703, "epoch": 2194} {"train_loss": -9.757936477661133, "global_step": 368704, "epoch": 2194} {"train_loss": -11.327204704284668, "global_step": 368705, "epoch": 2194} {"train_loss": -11.067931175231934, "global_step": 368706, "epoch": 2194} {"train_loss": -10.91657829284668, "global_step": 368707, "epoch": 2194} {"train_loss": -11.59342098236084, "global_step": 368708, "epoch": 2194} {"train_loss": -11.38479995727539, "global_step": 368709, "epoch": 2194} {"train_loss": -11.096352577209473, "global_step": 368710, "epoch": 2194} {"train_loss": -11.479469299316406, "global_step": 368711, "epoch": 2194} {"train_loss": -11.360138893127441, "global_step": 368712, "epoch": 2194} {"train_loss": -11.865335464477539, "global_step": 368713, "epoch": 2194} {"train_loss": -11.582123756408691, "global_step": 368714, "epoch": 2194} {"train_loss": -11.413298606872559, "global_step": 368715, "epoch": 2194} {"train_loss": -11.542264938354492, "global_step": 368716, "epoch": 2194} {"train_loss": -11.558687210083008, "global_step": 368717, "epoch": 2194} {"train_loss": -11.456574440002441, "global_step": 368718, "epoch": 2194} {"train_loss": -11.857307434082031, "global_step": 368719, "epoch": 2194} {"train_loss": -11.305766105651855, "global_step": 368720, "epoch": 2194} {"train_loss": -11.923421859741211, "global_step": 368721, "epoch": 2194} {"train_loss": -11.595852851867676, "global_step": 368722, "epoch": 2194} {"train_loss": -11.583305358886719, "global_step": 368723, "epoch": 2194} {"train_loss": -11.903677940368652, "global_step": 368724, "epoch": 2194} {"train_loss": -11.513309478759766, "global_step": 368725, "epoch": 2194} {"train_loss": -11.446370124816895, "global_step": 368726, "epoch": 2194} {"train_loss": -11.681070327758789, "global_step": 368727, "epoch": 2194} {"train_loss": -11.145341873168945, "global_step": 368728, "epoch": 2194} {"train_loss": -11.716299057006836, "global_step": 368729, "epoch": 2194} {"train_loss": -11.806838989257812, "global_step": 368730, "epoch": 2194} {"train_loss": -11.8856201171875, "global_step": 368731, "epoch": 2194} {"train_loss": -12.061264991760254, "global_step": 368732, "epoch": 2194} {"train_loss": -11.95001220703125, "global_step": 368733, "epoch": 2194} {"train_loss": -12.251996040344238, "global_step": 368734, "epoch": 2194} {"train_loss": -11.805967330932617, "global_step": 368735, "epoch": 2194} {"train_loss": -12.239341735839844, "global_step": 368736, "epoch": 2194} {"train_loss": -12.208823204040527, "global_step": 368737, "epoch": 2194} {"train_loss": -12.205297470092773, "global_step": 368738, "epoch": 2194} {"train_loss": -12.231504440307617, "global_step": 368739, "epoch": 2194} {"train_loss": -12.173450469970703, "global_step": 368740, "epoch": 2194} {"train_loss": -12.259056091308594, "global_step": 368741, "epoch": 2194} {"train_loss": -12.233620643615723, "global_step": 368742, "epoch": 2194} {"train_loss": -12.267580032348633, "global_step": 368743, "epoch": 2194} {"train_loss": -12.326337814331055, "global_step": 368744, "epoch": 2194} {"train_loss": -12.295726776123047, "global_step": 368745, "epoch": 2194} {"train_loss": -12.285298347473145, "global_step": 368746, "epoch": 2194} {"train_loss": -12.316974639892578, "global_step": 368747, "epoch": 2194} {"train_loss": -12.261890411376953, "global_step": 368748, "epoch": 2194} {"train_loss": -12.449110984802246, "global_step": 368749, "epoch": 2194} {"train_loss": -12.39349365234375, "global_step": 368750, "epoch": 2194} {"train_loss": -12.43990707397461, "global_step": 368751, "epoch": 2194} {"train_loss": -12.476278305053711, "global_step": 368752, "epoch": 2194} {"train_loss": -12.447892189025879, "global_step": 368753, "epoch": 2194} {"train_loss": -12.37919807434082, "global_step": 368754, "epoch": 2194} {"train_loss": -12.492250442504883, "global_step": 368755, "epoch": 2194} {"train_loss": -12.550827026367188, "global_step": 368756, "epoch": 2194} {"train_loss": -12.324814796447754, "global_step": 368757, "epoch": 2194} {"train_loss": -12.475854873657227, "global_step": 368758, "epoch": 2194} {"train_loss": -11.662485378129142, "global_step": 368759, "epoch": 2194, "val_loss": 287448.0625} {"train_loss": -12.507513046264648, "global_step": 368760, "epoch": 2195} {"train_loss": -12.510903358459473, "global_step": 368761, "epoch": 2195} {"train_loss": -12.567049980163574, "global_step": 368762, "epoch": 2195} {"train_loss": -12.321807861328125, "global_step": 368763, "epoch": 2195} {"train_loss": -12.187837600708008, "global_step": 368764, "epoch": 2195} {"train_loss": -12.50048542022705, "global_step": 368765, "epoch": 2195} {"train_loss": -12.448020935058594, "global_step": 368766, "epoch": 2195} {"train_loss": -12.649003028869629, "global_step": 368767, "epoch": 2195} {"train_loss": -12.446441650390625, "global_step": 368768, "epoch": 2195} {"train_loss": -12.422731399536133, "global_step": 368769, "epoch": 2195} {"train_loss": -12.397717475891113, "global_step": 368770, "epoch": 2195} {"train_loss": -12.440131187438965, "global_step": 368771, "epoch": 2195} {"train_loss": -12.447593688964844, "global_step": 368772, "epoch": 2195} {"train_loss": -12.481407165527344, "global_step": 368773, "epoch": 2195} {"train_loss": -12.451810836791992, "global_step": 368774, "epoch": 2195} {"train_loss": -12.455883026123047, "global_step": 368775, "epoch": 2195} {"train_loss": -12.474939346313477, "global_step": 368776, "epoch": 2195} {"train_loss": -12.56727409362793, "global_step": 368777, "epoch": 2195} {"train_loss": -12.50857925415039, "global_step": 368778, "epoch": 2195} {"train_loss": -12.405624389648438, "global_step": 368779, "epoch": 2195} {"train_loss": -12.392265319824219, "global_step": 368780, "epoch": 2195} {"train_loss": -12.581964492797852, "global_step": 368781, "epoch": 2195} {"train_loss": -12.655315399169922, "global_step": 368782, "epoch": 2195} {"train_loss": -12.714582443237305, "global_step": 368783, "epoch": 2195} {"train_loss": -12.525731086730957, "global_step": 368784, "epoch": 2195} {"train_loss": -12.677734375, "global_step": 368785, "epoch": 2195} {"train_loss": -12.612235069274902, "global_step": 368786, "epoch": 2195} {"train_loss": -12.572149276733398, "global_step": 368787, "epoch": 2195} {"train_loss": -12.694896697998047, "global_step": 368788, "epoch": 2195} {"train_loss": -12.437358856201172, "global_step": 368789, "epoch": 2195} {"train_loss": -12.69137954711914, "global_step": 368790, "epoch": 2195} {"train_loss": -12.629854202270508, "global_step": 368791, "epoch": 2195} {"train_loss": -12.771461486816406, "global_step": 368792, "epoch": 2195} {"train_loss": -12.625211715698242, "global_step": 368793, "epoch": 2195} {"train_loss": -12.78502368927002, "global_step": 368794, "epoch": 2195} {"train_loss": -12.577882766723633, "global_step": 368795, "epoch": 2195} {"train_loss": -12.62450122833252, "global_step": 368796, "epoch": 2195} {"train_loss": -12.451347351074219, "global_step": 368797, "epoch": 2195} {"train_loss": -12.44910717010498, "global_step": 368798, "epoch": 2195} {"train_loss": -12.663690567016602, "global_step": 368799, "epoch": 2195} {"train_loss": -12.241456985473633, "global_step": 368800, "epoch": 2195} {"train_loss": -12.47807502746582, "global_step": 368801, "epoch": 2195} {"train_loss": -12.569828987121582, "global_step": 368802, "epoch": 2195} {"train_loss": -12.279500961303711, "global_step": 368803, "epoch": 2195} {"train_loss": -12.255789756774902, "global_step": 368804, "epoch": 2195} {"train_loss": -12.17291259765625, "global_step": 368805, "epoch": 2195} {"train_loss": -12.06179428100586, "global_step": 368806, "epoch": 2195} {"train_loss": -11.853231430053711, "global_step": 368807, "epoch": 2195} {"train_loss": -11.96785831451416, "global_step": 368808, "epoch": 2195} {"train_loss": -12.209446907043457, "global_step": 368809, "epoch": 2195} {"train_loss": -12.257560729980469, "global_step": 368810, "epoch": 2195} {"train_loss": -12.078079223632812, "global_step": 368811, "epoch": 2195} {"train_loss": -12.400873184204102, "global_step": 368812, "epoch": 2195} {"train_loss": -12.358528137207031, "global_step": 368813, "epoch": 2195} {"train_loss": -11.955316543579102, "global_step": 368814, "epoch": 2195} {"train_loss": -12.215412139892578, "global_step": 368815, "epoch": 2195} {"train_loss": -12.361045837402344, "global_step": 368816, "epoch": 2195} {"train_loss": -11.446889877319336, "global_step": 368817, "epoch": 2195} {"train_loss": -11.869604110717773, "global_step": 368818, "epoch": 2195} {"train_loss": -12.328611373901367, "global_step": 368819, "epoch": 2195} {"train_loss": -11.106319427490234, "global_step": 368820, "epoch": 2195} {"train_loss": -11.853429794311523, "global_step": 368821, "epoch": 2195} {"train_loss": -11.967260360717773, "global_step": 368822, "epoch": 2195} {"train_loss": -10.395978927612305, "global_step": 368823, "epoch": 2195} {"train_loss": -11.758209228515625, "global_step": 368824, "epoch": 2195} {"train_loss": -11.175252914428711, "global_step": 368825, "epoch": 2195} {"train_loss": -10.080049514770508, "global_step": 368826, "epoch": 2195} {"train_loss": -12.349766731262207, "global_step": 368827, "epoch": 2195} {"train_loss": -10.807429313659668, "global_step": 368828, "epoch": 2195} {"train_loss": -11.987433433532715, "global_step": 368829, "epoch": 2195} {"train_loss": -10.91780948638916, "global_step": 368830, "epoch": 2195} {"train_loss": -12.146620750427246, "global_step": 368831, "epoch": 2195} {"train_loss": -12.28015422821045, "global_step": 368832, "epoch": 2195} {"train_loss": -11.212879180908203, "global_step": 368833, "epoch": 2195} {"train_loss": -12.102582931518555, "global_step": 368834, "epoch": 2195} {"train_loss": -12.007929801940918, "global_step": 368835, "epoch": 2195} {"train_loss": -11.629650115966797, "global_step": 368836, "epoch": 2195} {"train_loss": -12.328643798828125, "global_step": 368837, "epoch": 2195} {"train_loss": -11.604950904846191, "global_step": 368838, "epoch": 2195} {"train_loss": -11.999814987182617, "global_step": 368839, "epoch": 2195} {"train_loss": -12.232348442077637, "global_step": 368840, "epoch": 2195} {"train_loss": -12.004892349243164, "global_step": 368841, "epoch": 2195} {"train_loss": -12.125247955322266, "global_step": 368842, "epoch": 2195} {"train_loss": -12.109954833984375, "global_step": 368843, "epoch": 2195} {"train_loss": -12.042671203613281, "global_step": 368844, "epoch": 2195} {"train_loss": -12.114739418029785, "global_step": 368845, "epoch": 2195} {"train_loss": -12.086196899414062, "global_step": 368846, "epoch": 2195} {"train_loss": -11.896434783935547, "global_step": 368847, "epoch": 2195} {"train_loss": -12.001540184020996, "global_step": 368848, "epoch": 2195} {"train_loss": -12.314058303833008, "global_step": 368849, "epoch": 2195} {"train_loss": -11.644887924194336, "global_step": 368850, "epoch": 2195} {"train_loss": -11.91046142578125, "global_step": 368851, "epoch": 2195} {"train_loss": -12.37161922454834, "global_step": 368852, "epoch": 2195} {"train_loss": -12.391035079956055, "global_step": 368853, "epoch": 2195} {"train_loss": -12.1967191696167, "global_step": 368854, "epoch": 2195} {"train_loss": -12.528448104858398, "global_step": 368855, "epoch": 2195} {"train_loss": -12.262365341186523, "global_step": 368856, "epoch": 2195} {"train_loss": -12.560969352722168, "global_step": 368857, "epoch": 2195} {"train_loss": -12.398996353149414, "global_step": 368858, "epoch": 2195} {"train_loss": -12.373727798461914, "global_step": 368859, "epoch": 2195} {"train_loss": -12.547266006469727, "global_step": 368860, "epoch": 2195} {"train_loss": -12.073416709899902, "global_step": 368861, "epoch": 2195} {"train_loss": -12.31260871887207, "global_step": 368862, "epoch": 2195} {"train_loss": -11.982603073120117, "global_step": 368863, "epoch": 2195} {"train_loss": -12.54694938659668, "global_step": 368864, "epoch": 2195} {"train_loss": -12.17636775970459, "global_step": 368865, "epoch": 2195} {"train_loss": -12.203100204467773, "global_step": 368866, "epoch": 2195} {"train_loss": -12.005985260009766, "global_step": 368867, "epoch": 2195} {"train_loss": -12.037601470947266, "global_step": 368868, "epoch": 2195} {"train_loss": -12.227531433105469, "global_step": 368869, "epoch": 2195} {"train_loss": -12.195474624633789, "global_step": 368870, "epoch": 2195} {"train_loss": -12.012996673583984, "global_step": 368871, "epoch": 2195} {"train_loss": -12.160420417785645, "global_step": 368872, "epoch": 2195} {"train_loss": -11.936135292053223, "global_step": 368873, "epoch": 2195} {"train_loss": -11.97258186340332, "global_step": 368874, "epoch": 2195} {"train_loss": -11.483638763427734, "global_step": 368875, "epoch": 2195} {"train_loss": -11.525216102600098, "global_step": 368876, "epoch": 2195} {"train_loss": -11.438141822814941, "global_step": 368877, "epoch": 2195} {"train_loss": -12.263603210449219, "global_step": 368878, "epoch": 2195} {"train_loss": -11.117942810058594, "global_step": 368879, "epoch": 2195} {"train_loss": -11.496725082397461, "global_step": 368880, "epoch": 2195} {"train_loss": -11.751310348510742, "global_step": 368881, "epoch": 2195} {"train_loss": -11.913759231567383, "global_step": 368882, "epoch": 2195} {"train_loss": -11.782236099243164, "global_step": 368883, "epoch": 2195} {"train_loss": -11.553361892700195, "global_step": 368884, "epoch": 2195} {"train_loss": -11.58847713470459, "global_step": 368885, "epoch": 2195} {"train_loss": -12.033881187438965, "global_step": 368886, "epoch": 2195} {"train_loss": -12.21379566192627, "global_step": 368887, "epoch": 2195} {"train_loss": -11.969964981079102, "global_step": 368888, "epoch": 2195} {"train_loss": -11.564695358276367, "global_step": 368889, "epoch": 2195} {"train_loss": -12.58077335357666, "global_step": 368890, "epoch": 2195} {"train_loss": -11.504907608032227, "global_step": 368891, "epoch": 2195} {"train_loss": -11.508031845092773, "global_step": 368892, "epoch": 2195} {"train_loss": -12.189640998840332, "global_step": 368893, "epoch": 2195} {"train_loss": -12.556739807128906, "global_step": 368894, "epoch": 2195} {"train_loss": -12.215900421142578, "global_step": 368895, "epoch": 2195} {"train_loss": -12.351068496704102, "global_step": 368896, "epoch": 2195} {"train_loss": -11.740415573120117, "global_step": 368897, "epoch": 2195} {"train_loss": -11.603452682495117, "global_step": 368898, "epoch": 2195} {"train_loss": -12.019510269165039, "global_step": 368899, "epoch": 2195} {"train_loss": -12.383171081542969, "global_step": 368900, "epoch": 2195} {"train_loss": -12.306560516357422, "global_step": 368901, "epoch": 2195} {"train_loss": -12.126128196716309, "global_step": 368902, "epoch": 2195} {"train_loss": -12.386372566223145, "global_step": 368903, "epoch": 2195} {"train_loss": -12.314844131469727, "global_step": 368904, "epoch": 2195} {"train_loss": -12.412832260131836, "global_step": 368905, "epoch": 2195} {"train_loss": -12.43397331237793, "global_step": 368906, "epoch": 2195} {"train_loss": -12.316215515136719, "global_step": 368907, "epoch": 2195} {"train_loss": -12.179136276245117, "global_step": 368908, "epoch": 2195} {"train_loss": -11.981425285339355, "global_step": 368909, "epoch": 2195} {"train_loss": -12.3827486038208, "global_step": 368910, "epoch": 2195} {"train_loss": -12.51639175415039, "global_step": 368911, "epoch": 2195} {"train_loss": -12.331535339355469, "global_step": 368912, "epoch": 2195} {"train_loss": -12.494293212890625, "global_step": 368913, "epoch": 2195} {"train_loss": -12.254386901855469, "global_step": 368914, "epoch": 2195} {"train_loss": -12.470915794372559, "global_step": 368915, "epoch": 2195} {"train_loss": -12.50602912902832, "global_step": 368916, "epoch": 2195} {"train_loss": -12.513391494750977, "global_step": 368917, "epoch": 2195} {"train_loss": -12.607418060302734, "global_step": 368918, "epoch": 2195} {"train_loss": -12.526897430419922, "global_step": 368919, "epoch": 2195} {"train_loss": -12.572967529296875, "global_step": 368920, "epoch": 2195} {"train_loss": -12.532827377319336, "global_step": 368921, "epoch": 2195} {"train_loss": -12.59563159942627, "global_step": 368922, "epoch": 2195} {"train_loss": -12.644432067871094, "global_step": 368923, "epoch": 2195} {"train_loss": -12.435586929321289, "global_step": 368924, "epoch": 2195} {"train_loss": -12.585891723632812, "global_step": 368925, "epoch": 2195} {"train_loss": -12.586618423461914, "global_step": 368926, "epoch": 2195} {"train_loss": -12.180102081525893, "global_step": 368927, "epoch": 2195, "val_loss": 290522.78125, "train_action_mse_error": 1.3926799297332764} {"train_loss": -12.278261184692383, "global_step": 368928, "epoch": 2196} {"train_loss": -12.200550079345703, "global_step": 368929, "epoch": 2196} {"train_loss": -12.768806457519531, "global_step": 368930, "epoch": 2196} {"train_loss": -12.618362426757812, "global_step": 368931, "epoch": 2196} {"train_loss": -12.338041305541992, "global_step": 368932, "epoch": 2196} {"train_loss": -12.620048522949219, "global_step": 368933, "epoch": 2196} {"train_loss": -12.318017959594727, "global_step": 368934, "epoch": 2196} {"train_loss": -12.459407806396484, "global_step": 368935, "epoch": 2196} {"train_loss": -12.647711753845215, "global_step": 368936, "epoch": 2196} {"train_loss": -12.503131866455078, "global_step": 368937, "epoch": 2196} {"train_loss": -11.93839168548584, "global_step": 368938, "epoch": 2196} {"train_loss": -12.49504566192627, "global_step": 368939, "epoch": 2196} {"train_loss": -12.253278732299805, "global_step": 368940, "epoch": 2196} {"train_loss": -11.691341400146484, "global_step": 368941, "epoch": 2196} {"train_loss": -11.728878021240234, "global_step": 368942, "epoch": 2196} {"train_loss": -11.560800552368164, "global_step": 368943, "epoch": 2196} {"train_loss": -12.554736137390137, "global_step": 368944, "epoch": 2196} {"train_loss": -11.40005111694336, "global_step": 368945, "epoch": 2196} {"train_loss": -12.359373092651367, "global_step": 368946, "epoch": 2196} {"train_loss": -10.949190139770508, "global_step": 368947, "epoch": 2196} {"train_loss": -11.859441757202148, "global_step": 368948, "epoch": 2196} {"train_loss": -9.278837203979492, "global_step": 368949, "epoch": 2196} {"train_loss": -12.203609466552734, "global_step": 368950, "epoch": 2196} {"train_loss": -10.689881324768066, "global_step": 368951, "epoch": 2196} {"train_loss": -9.815011978149414, "global_step": 368952, "epoch": 2196} {"train_loss": -10.698711395263672, "global_step": 368953, "epoch": 2196} {"train_loss": -10.498719215393066, "global_step": 368954, "epoch": 2196} {"train_loss": -10.533882141113281, "global_step": 368955, "epoch": 2196} {"train_loss": -10.172651290893555, "global_step": 368956, "epoch": 2196} {"train_loss": -9.443026542663574, "global_step": 368957, "epoch": 2196} {"train_loss": -9.523460388183594, "global_step": 368958, "epoch": 2196} {"train_loss": -8.273295402526855, "global_step": 368959, "epoch": 2196} {"train_loss": -7.668026924133301, "global_step": 368960, "epoch": 2196} {"train_loss": -8.331899642944336, "global_step": 368961, "epoch": 2196} {"train_loss": -10.341510772705078, "global_step": 368962, "epoch": 2196} {"train_loss": -10.106880187988281, "global_step": 368963, "epoch": 2196} {"train_loss": -9.54409122467041, "global_step": 368964, "epoch": 2196} {"train_loss": -9.913870811462402, "global_step": 368965, "epoch": 2196} {"train_loss": -10.27249526977539, "global_step": 368966, "epoch": 2196} {"train_loss": -10.013802528381348, "global_step": 368967, "epoch": 2196} {"train_loss": -9.778104782104492, "global_step": 368968, "epoch": 2196} {"train_loss": -11.325023651123047, "global_step": 368969, "epoch": 2196} {"train_loss": -10.947251319885254, "global_step": 368970, "epoch": 2196} {"train_loss": -11.640052795410156, "global_step": 368971, "epoch": 2196} {"train_loss": -10.920005798339844, "global_step": 368972, "epoch": 2196} {"train_loss": -11.135746002197266, "global_step": 368973, "epoch": 2196} {"train_loss": -11.15499210357666, "global_step": 368974, "epoch": 2196} {"train_loss": -11.473897933959961, "global_step": 368975, "epoch": 2196} {"train_loss": -11.869366645812988, "global_step": 368976, "epoch": 2196} {"train_loss": -11.359095573425293, "global_step": 368977, "epoch": 2196} {"train_loss": -11.692231178283691, "global_step": 368978, "epoch": 2196} {"train_loss": -11.326523780822754, "global_step": 368979, "epoch": 2196} {"train_loss": -11.737701416015625, "global_step": 368980, "epoch": 2196} {"train_loss": -11.388493537902832, "global_step": 368981, "epoch": 2196} {"train_loss": -11.993346214294434, "global_step": 368982, "epoch": 2196} {"train_loss": -11.36952018737793, "global_step": 368983, "epoch": 2196} {"train_loss": -11.96478271484375, "global_step": 368984, "epoch": 2196} {"train_loss": -11.44149398803711, "global_step": 368985, "epoch": 2196} {"train_loss": -12.088497161865234, "global_step": 368986, "epoch": 2196} {"train_loss": -11.454174041748047, "global_step": 368987, "epoch": 2196} {"train_loss": -11.89976692199707, "global_step": 368988, "epoch": 2196} {"train_loss": -11.832182884216309, "global_step": 368989, "epoch": 2196} {"train_loss": -11.967880249023438, "global_step": 368990, "epoch": 2196} {"train_loss": -11.677239418029785, "global_step": 368991, "epoch": 2196} {"train_loss": -11.704245567321777, "global_step": 368992, "epoch": 2196} {"train_loss": -11.91625690460205, "global_step": 368993, "epoch": 2196} {"train_loss": -11.616451263427734, "global_step": 368994, "epoch": 2196} {"train_loss": -11.895095825195312, "global_step": 368995, "epoch": 2196} {"train_loss": -11.84896183013916, "global_step": 368996, "epoch": 2196} {"train_loss": -11.926727294921875, "global_step": 368997, "epoch": 2196} {"train_loss": -11.696329116821289, "global_step": 368998, "epoch": 2196} {"train_loss": -11.909381866455078, "global_step": 368999, "epoch": 2196} {"train_loss": -12.162153244018555, "global_step": 369000, "epoch": 2196} {"train_loss": -11.889616012573242, "global_step": 369001, "epoch": 2196} {"train_loss": -12.254889488220215, "global_step": 369002, "epoch": 2196} {"train_loss": -11.717867851257324, "global_step": 369003, "epoch": 2196} {"train_loss": -12.16158390045166, "global_step": 369004, "epoch": 2196} {"train_loss": -12.028242111206055, "global_step": 369005, "epoch": 2196} {"train_loss": -12.187723159790039, "global_step": 369006, "epoch": 2196} {"train_loss": -12.130395889282227, "global_step": 369007, "epoch": 2196} {"train_loss": -12.055852890014648, "global_step": 369008, "epoch": 2196} {"train_loss": -12.303045272827148, "global_step": 369009, "epoch": 2196} {"train_loss": -11.857418060302734, "global_step": 369010, "epoch": 2196} {"train_loss": -12.132438659667969, "global_step": 369011, "epoch": 2196} {"train_loss": -11.69165325164795, "global_step": 369012, "epoch": 2196} {"train_loss": -11.467049598693848, "global_step": 369013, "epoch": 2196} {"train_loss": -11.314870834350586, "global_step": 369014, "epoch": 2196} {"train_loss": -11.691650390625, "global_step": 369015, "epoch": 2196} {"train_loss": -12.261809349060059, "global_step": 369016, "epoch": 2196} {"train_loss": -11.612211227416992, "global_step": 369017, "epoch": 2196} {"train_loss": -11.639715194702148, "global_step": 369018, "epoch": 2196} {"train_loss": -11.937540054321289, "global_step": 369019, "epoch": 2196} {"train_loss": -11.64795970916748, "global_step": 369020, "epoch": 2196} {"train_loss": -12.097801208496094, "global_step": 369021, "epoch": 2196} {"train_loss": -11.892160415649414, "global_step": 369022, "epoch": 2196} {"train_loss": -11.979244232177734, "global_step": 369023, "epoch": 2196} {"train_loss": -12.165678024291992, "global_step": 369024, "epoch": 2196} {"train_loss": -11.725442886352539, "global_step": 369025, "epoch": 2196} {"train_loss": -12.094453811645508, "global_step": 369026, "epoch": 2196} {"train_loss": -11.981890678405762, "global_step": 369027, "epoch": 2196} {"train_loss": -11.961613655090332, "global_step": 369028, "epoch": 2196} {"train_loss": -12.180191040039062, "global_step": 369029, "epoch": 2196} {"train_loss": -11.645650863647461, "global_step": 369030, "epoch": 2196} {"train_loss": -12.166873931884766, "global_step": 369031, "epoch": 2196} {"train_loss": -11.887593269348145, "global_step": 369032, "epoch": 2196} {"train_loss": -12.470149993896484, "global_step": 369033, "epoch": 2196} {"train_loss": -11.955533981323242, "global_step": 369034, "epoch": 2196} {"train_loss": -12.21764087677002, "global_step": 369035, "epoch": 2196} {"train_loss": -12.039527893066406, "global_step": 369036, "epoch": 2196} {"train_loss": -12.204633712768555, "global_step": 369037, "epoch": 2196} {"train_loss": -12.240318298339844, "global_step": 369038, "epoch": 2196} {"train_loss": -11.958075523376465, "global_step": 369039, "epoch": 2196} {"train_loss": -12.436875343322754, "global_step": 369040, "epoch": 2196} {"train_loss": -12.004199028015137, "global_step": 369041, "epoch": 2196} {"train_loss": -12.447731018066406, "global_step": 369042, "epoch": 2196} {"train_loss": -12.017112731933594, "global_step": 369043, "epoch": 2196} {"train_loss": -12.349052429199219, "global_step": 369044, "epoch": 2196} {"train_loss": -11.904288291931152, "global_step": 369045, "epoch": 2196} {"train_loss": -12.418701171875, "global_step": 369046, "epoch": 2196} {"train_loss": -12.296859741210938, "global_step": 369047, "epoch": 2196} {"train_loss": -12.414535522460938, "global_step": 369048, "epoch": 2196} {"train_loss": -12.38227367401123, "global_step": 369049, "epoch": 2196} {"train_loss": -12.438039779663086, "global_step": 369050, "epoch": 2196} {"train_loss": -12.294031143188477, "global_step": 369051, "epoch": 2196} {"train_loss": -12.49312973022461, "global_step": 369052, "epoch": 2196} {"train_loss": -12.337054252624512, "global_step": 369053, "epoch": 2196} {"train_loss": -12.334068298339844, "global_step": 369054, "epoch": 2196} {"train_loss": -12.610654830932617, "global_step": 369055, "epoch": 2196} {"train_loss": -12.217287063598633, "global_step": 369056, "epoch": 2196} {"train_loss": -12.293127059936523, "global_step": 369057, "epoch": 2196} {"train_loss": -12.65050220489502, "global_step": 369058, "epoch": 2196} {"train_loss": -12.432710647583008, "global_step": 369059, "epoch": 2196} {"train_loss": -12.573455810546875, "global_step": 369060, "epoch": 2196} {"train_loss": -12.16530990600586, "global_step": 369061, "epoch": 2196} {"train_loss": -12.490076065063477, "global_step": 369062, "epoch": 2196} {"train_loss": -12.035825729370117, "global_step": 369063, "epoch": 2196} {"train_loss": -12.484540939331055, "global_step": 369064, "epoch": 2196} {"train_loss": -12.499032020568848, "global_step": 369065, "epoch": 2196} {"train_loss": -12.680449485778809, "global_step": 369066, "epoch": 2196} {"train_loss": -12.46151351928711, "global_step": 369067, "epoch": 2196} {"train_loss": -12.51940631866455, "global_step": 369068, "epoch": 2196} {"train_loss": -12.457551002502441, "global_step": 369069, "epoch": 2196} {"train_loss": -12.570045471191406, "global_step": 369070, "epoch": 2196} {"train_loss": -12.502613067626953, "global_step": 369071, "epoch": 2196} {"train_loss": -12.479509353637695, "global_step": 369072, "epoch": 2196} {"train_loss": -12.362068176269531, "global_step": 369073, "epoch": 2196} {"train_loss": -12.518831253051758, "global_step": 369074, "epoch": 2196} {"train_loss": -12.705761909484863, "global_step": 369075, "epoch": 2196} {"train_loss": -12.506288528442383, "global_step": 369076, "epoch": 2196} {"train_loss": -12.720232009887695, "global_step": 369077, "epoch": 2196} {"train_loss": -11.24081039428711, "global_step": 369078, "epoch": 2196} {"train_loss": -12.474702835083008, "global_step": 369079, "epoch": 2196} {"train_loss": -12.567350387573242, "global_step": 369080, "epoch": 2196} {"train_loss": -12.295331001281738, "global_step": 369081, "epoch": 2196} {"train_loss": -11.731592178344727, "global_step": 369082, "epoch": 2196} {"train_loss": -12.613628387451172, "global_step": 369083, "epoch": 2196} {"train_loss": -12.272139549255371, "global_step": 369084, "epoch": 2196} {"train_loss": -12.54134750366211, "global_step": 369085, "epoch": 2196} {"train_loss": -12.36606502532959, "global_step": 369086, "epoch": 2196} {"train_loss": -12.252389907836914, "global_step": 369087, "epoch": 2196} {"train_loss": -12.447725296020508, "global_step": 369088, "epoch": 2196} {"train_loss": -12.145206451416016, "global_step": 369089, "epoch": 2196} {"train_loss": -12.005956649780273, "global_step": 369090, "epoch": 2196} {"train_loss": -12.735139846801758, "global_step": 369091, "epoch": 2196} {"train_loss": -12.281010627746582, "global_step": 369092, "epoch": 2196} {"train_loss": -11.669322967529297, "global_step": 369093, "epoch": 2196} {"train_loss": -12.253716468811035, "global_step": 369094, "epoch": 2196} {"train_loss": -11.808779069355555, "global_step": 369095, "epoch": 2196, "val_loss": 293658.875} {"train_loss": -12.359916687011719, "global_step": 369096, "epoch": 2197} {"train_loss": -12.508466720581055, "global_step": 369097, "epoch": 2197} {"train_loss": -11.58326530456543, "global_step": 369098, "epoch": 2197} {"train_loss": -12.587135314941406, "global_step": 369099, "epoch": 2197} {"train_loss": -10.644207000732422, "global_step": 369100, "epoch": 2197} {"train_loss": -12.046516418457031, "global_step": 369101, "epoch": 2197} {"train_loss": -11.7637300491333, "global_step": 369102, "epoch": 2197} {"train_loss": -12.227731704711914, "global_step": 369103, "epoch": 2197} {"train_loss": -12.03455638885498, "global_step": 369104, "epoch": 2197} {"train_loss": -11.065790176391602, "global_step": 369105, "epoch": 2197} {"train_loss": -11.67631721496582, "global_step": 369106, "epoch": 2197} {"train_loss": -12.521637916564941, "global_step": 369107, "epoch": 2197} {"train_loss": -11.709643363952637, "global_step": 369108, "epoch": 2197} {"train_loss": -12.05268669128418, "global_step": 369109, "epoch": 2197} {"train_loss": -11.723302841186523, "global_step": 369110, "epoch": 2197} {"train_loss": -11.871392250061035, "global_step": 369111, "epoch": 2197} {"train_loss": -11.508804321289062, "global_step": 369112, "epoch": 2197} {"train_loss": -11.406646728515625, "global_step": 369113, "epoch": 2197} {"train_loss": -12.201009750366211, "global_step": 369114, "epoch": 2197} {"train_loss": -11.79975700378418, "global_step": 369115, "epoch": 2197} {"train_loss": -11.466999053955078, "global_step": 369116, "epoch": 2197} {"train_loss": -11.400343894958496, "global_step": 369117, "epoch": 2197} {"train_loss": -11.640498161315918, "global_step": 369118, "epoch": 2197} {"train_loss": -11.093563079833984, "global_step": 369119, "epoch": 2197} {"train_loss": -11.905424118041992, "global_step": 369120, "epoch": 2197} {"train_loss": -12.100833892822266, "global_step": 369121, "epoch": 2197} {"train_loss": -10.924732208251953, "global_step": 369122, "epoch": 2197} {"train_loss": -11.853178024291992, "global_step": 369123, "epoch": 2197} {"train_loss": -11.837846755981445, "global_step": 369124, "epoch": 2197} {"train_loss": -11.945785522460938, "global_step": 369125, "epoch": 2197} {"train_loss": -12.005399703979492, "global_step": 369126, "epoch": 2197} {"train_loss": -11.994608879089355, "global_step": 369127, "epoch": 2197} {"train_loss": -12.36229419708252, "global_step": 369128, "epoch": 2197} {"train_loss": -11.608946800231934, "global_step": 369129, "epoch": 2197} {"train_loss": -12.064285278320312, "global_step": 369130, "epoch": 2197} {"train_loss": -12.186708450317383, "global_step": 369131, "epoch": 2197} {"train_loss": -12.051359176635742, "global_step": 369132, "epoch": 2197} {"train_loss": -11.67115592956543, "global_step": 369133, "epoch": 2197} {"train_loss": -10.416906356811523, "global_step": 369134, "epoch": 2197} {"train_loss": -12.050880432128906, "global_step": 369135, "epoch": 2197} {"train_loss": -11.219979286193848, "global_step": 369136, "epoch": 2197} {"train_loss": -11.997905731201172, "global_step": 369137, "epoch": 2197} {"train_loss": -11.757604598999023, "global_step": 369138, "epoch": 2197} {"train_loss": -10.665861129760742, "global_step": 369139, "epoch": 2197} {"train_loss": -11.227594375610352, "global_step": 369140, "epoch": 2197} {"train_loss": -11.479304313659668, "global_step": 369141, "epoch": 2197} {"train_loss": -11.03781509399414, "global_step": 369142, "epoch": 2197} {"train_loss": -10.835643768310547, "global_step": 369143, "epoch": 2197} {"train_loss": -9.566638946533203, "global_step": 369144, "epoch": 2197} {"train_loss": -11.217291831970215, "global_step": 369145, "epoch": 2197} {"train_loss": -10.083784103393555, "global_step": 369146, "epoch": 2197} {"train_loss": -10.708929061889648, "global_step": 369147, "epoch": 2197} {"train_loss": -11.528711318969727, "global_step": 369148, "epoch": 2197} {"train_loss": -11.224398612976074, "global_step": 369149, "epoch": 2197} {"train_loss": -10.701547622680664, "global_step": 369150, "epoch": 2197} {"train_loss": -11.56170654296875, "global_step": 369151, "epoch": 2197} {"train_loss": -10.845972061157227, "global_step": 369152, "epoch": 2197} {"train_loss": -11.097858428955078, "global_step": 369153, "epoch": 2197} {"train_loss": -10.619160652160645, "global_step": 369154, "epoch": 2197} {"train_loss": -9.953842163085938, "global_step": 369155, "epoch": 2197} {"train_loss": -10.803444862365723, "global_step": 369156, "epoch": 2197} {"train_loss": -11.534189224243164, "global_step": 369157, "epoch": 2197} {"train_loss": -10.467904090881348, "global_step": 369158, "epoch": 2197} {"train_loss": -11.541349411010742, "global_step": 369159, "epoch": 2197} {"train_loss": -10.71275520324707, "global_step": 369160, "epoch": 2197} {"train_loss": -11.493257522583008, "global_step": 369161, "epoch": 2197} {"train_loss": -11.31220817565918, "global_step": 369162, "epoch": 2197} {"train_loss": -11.168224334716797, "global_step": 369163, "epoch": 2197} {"train_loss": -11.44680118560791, "global_step": 369164, "epoch": 2197} {"train_loss": -11.399726867675781, "global_step": 369165, "epoch": 2197} {"train_loss": -10.650205612182617, "global_step": 369166, "epoch": 2197} {"train_loss": -11.99852180480957, "global_step": 369167, "epoch": 2197} {"train_loss": -11.451684951782227, "global_step": 369168, "epoch": 2197} {"train_loss": -12.011083602905273, "global_step": 369169, "epoch": 2197} {"train_loss": -11.691730499267578, "global_step": 369170, "epoch": 2197} {"train_loss": -11.867554664611816, "global_step": 369171, "epoch": 2197} {"train_loss": -11.721632957458496, "global_step": 369172, "epoch": 2197} {"train_loss": -11.890939712524414, "global_step": 369173, "epoch": 2197} {"train_loss": -11.784971237182617, "global_step": 369174, "epoch": 2197} {"train_loss": -11.73876953125, "global_step": 369175, "epoch": 2197} {"train_loss": -11.709813117980957, "global_step": 369176, "epoch": 2197} {"train_loss": -11.98729133605957, "global_step": 369177, "epoch": 2197} {"train_loss": -11.770280838012695, "global_step": 369178, "epoch": 2197} {"train_loss": -11.798344612121582, "global_step": 369179, "epoch": 2197} {"train_loss": -11.643646240234375, "global_step": 369180, "epoch": 2197} {"train_loss": -11.870781898498535, "global_step": 369181, "epoch": 2197} {"train_loss": -11.942140579223633, "global_step": 369182, "epoch": 2197} {"train_loss": -12.10178279876709, "global_step": 369183, "epoch": 2197} {"train_loss": -12.026007652282715, "global_step": 369184, "epoch": 2197} {"train_loss": -12.027534484863281, "global_step": 369185, "epoch": 2197} {"train_loss": -12.233966827392578, "global_step": 369186, "epoch": 2197} {"train_loss": -12.183155059814453, "global_step": 369187, "epoch": 2197} {"train_loss": -12.085338592529297, "global_step": 369188, "epoch": 2197} {"train_loss": -12.098423957824707, "global_step": 369189, "epoch": 2197} {"train_loss": -11.897262573242188, "global_step": 369190, "epoch": 2197} {"train_loss": -12.13078498840332, "global_step": 369191, "epoch": 2197} {"train_loss": -12.057731628417969, "global_step": 369192, "epoch": 2197} {"train_loss": -12.013616561889648, "global_step": 369193, "epoch": 2197} {"train_loss": -12.196281433105469, "global_step": 369194, "epoch": 2197} {"train_loss": -12.08548355102539, "global_step": 369195, "epoch": 2197} {"train_loss": -12.358987808227539, "global_step": 369196, "epoch": 2197} {"train_loss": -12.302382469177246, "global_step": 369197, "epoch": 2197} {"train_loss": -12.09475326538086, "global_step": 369198, "epoch": 2197} {"train_loss": -12.233378410339355, "global_step": 369199, "epoch": 2197} {"train_loss": -12.05876350402832, "global_step": 369200, "epoch": 2197} {"train_loss": -12.512033462524414, "global_step": 369201, "epoch": 2197} {"train_loss": -11.990991592407227, "global_step": 369202, "epoch": 2197} {"train_loss": -12.079822540283203, "global_step": 369203, "epoch": 2197} {"train_loss": -12.18282699584961, "global_step": 369204, "epoch": 2197} {"train_loss": -12.249921798706055, "global_step": 369205, "epoch": 2197} {"train_loss": -12.373417854309082, "global_step": 369206, "epoch": 2197} {"train_loss": -12.19278335571289, "global_step": 369207, "epoch": 2197} {"train_loss": -12.567646980285645, "global_step": 369208, "epoch": 2197} {"train_loss": -12.317558288574219, "global_step": 369209, "epoch": 2197} {"train_loss": -12.364555358886719, "global_step": 369210, "epoch": 2197} {"train_loss": -12.206912994384766, "global_step": 369211, "epoch": 2197} {"train_loss": -12.39926528930664, "global_step": 369212, "epoch": 2197} {"train_loss": -12.430341720581055, "global_step": 369213, "epoch": 2197} {"train_loss": -12.44782829284668, "global_step": 369214, "epoch": 2197} {"train_loss": -12.558053016662598, "global_step": 369215, "epoch": 2197} {"train_loss": -12.124872207641602, "global_step": 369216, "epoch": 2197} {"train_loss": -12.546279907226562, "global_step": 369217, "epoch": 2197} {"train_loss": -12.358850479125977, "global_step": 369218, "epoch": 2197} {"train_loss": -12.57148551940918, "global_step": 369219, "epoch": 2197} {"train_loss": -12.161582946777344, "global_step": 369220, "epoch": 2197} {"train_loss": -12.459506034851074, "global_step": 369221, "epoch": 2197} {"train_loss": -12.258430480957031, "global_step": 369222, "epoch": 2197} {"train_loss": -12.240711212158203, "global_step": 369223, "epoch": 2197} {"train_loss": -12.34477424621582, "global_step": 369224, "epoch": 2197} {"train_loss": -12.487048149108887, "global_step": 369225, "epoch": 2197} {"train_loss": -12.097432136535645, "global_step": 369226, "epoch": 2197} {"train_loss": -12.367369651794434, "global_step": 369227, "epoch": 2197} {"train_loss": -12.247000694274902, "global_step": 369228, "epoch": 2197} {"train_loss": -12.170036315917969, "global_step": 369229, "epoch": 2197} {"train_loss": -12.726930618286133, "global_step": 369230, "epoch": 2197} {"train_loss": -12.498189926147461, "global_step": 369231, "epoch": 2197} {"train_loss": -12.50629997253418, "global_step": 369232, "epoch": 2197} {"train_loss": -12.694295883178711, "global_step": 369233, "epoch": 2197} {"train_loss": -12.384655952453613, "global_step": 369234, "epoch": 2197} {"train_loss": -12.501642227172852, "global_step": 369235, "epoch": 2197} {"train_loss": -12.56723403930664, "global_step": 369236, "epoch": 2197} {"train_loss": -12.683231353759766, "global_step": 369237, "epoch": 2197} {"train_loss": -12.43549919128418, "global_step": 369238, "epoch": 2197} {"train_loss": -12.623688697814941, "global_step": 369239, "epoch": 2197} {"train_loss": -12.625627517700195, "global_step": 369240, "epoch": 2197} {"train_loss": -12.571575164794922, "global_step": 369241, "epoch": 2197} {"train_loss": -12.809481620788574, "global_step": 369242, "epoch": 2197} {"train_loss": -12.542160034179688, "global_step": 369243, "epoch": 2197} {"train_loss": -12.515890121459961, "global_step": 369244, "epoch": 2197} {"train_loss": -12.467673301696777, "global_step": 369245, "epoch": 2197} {"train_loss": -12.403817176818848, "global_step": 369246, "epoch": 2197} {"train_loss": -12.482669830322266, "global_step": 369247, "epoch": 2197} {"train_loss": -12.380556106567383, "global_step": 369248, "epoch": 2197} {"train_loss": -12.337844848632812, "global_step": 369249, "epoch": 2197} {"train_loss": -12.682695388793945, "global_step": 369250, "epoch": 2197} {"train_loss": -12.259065628051758, "global_step": 369251, "epoch": 2197} {"train_loss": -12.11658000946045, "global_step": 369252, "epoch": 2197} {"train_loss": -12.486368179321289, "global_step": 369253, "epoch": 2197} {"train_loss": -11.884197235107422, "global_step": 369254, "epoch": 2197} {"train_loss": -11.23238754272461, "global_step": 369255, "epoch": 2197} {"train_loss": -12.164857864379883, "global_step": 369256, "epoch": 2197} {"train_loss": -11.805191040039062, "global_step": 369257, "epoch": 2197} {"train_loss": -10.550312995910645, "global_step": 369258, "epoch": 2197} {"train_loss": -11.339179992675781, "global_step": 369259, "epoch": 2197} {"train_loss": -10.996431350708008, "global_step": 369260, "epoch": 2197} {"train_loss": -12.119915008544922, "global_step": 369261, "epoch": 2197} {"train_loss": -11.087822914123535, "global_step": 369262, "epoch": 2197} {"train_loss": -11.866621170725141, "global_step": 369263, "epoch": 2197, "val_loss": 291105.53125} {"train_loss": -11.233145713806152, "global_step": 369264, "epoch": 2198} {"train_loss": -12.042680740356445, "global_step": 369265, "epoch": 2198} {"train_loss": -10.947060585021973, "global_step": 369266, "epoch": 2198} {"train_loss": -11.648632049560547, "global_step": 369267, "epoch": 2198} {"train_loss": -11.559991836547852, "global_step": 369268, "epoch": 2198} {"train_loss": -10.117541313171387, "global_step": 369269, "epoch": 2198} {"train_loss": -10.300819396972656, "global_step": 369270, "epoch": 2198} {"train_loss": -9.58738899230957, "global_step": 369271, "epoch": 2198} {"train_loss": -10.15864372253418, "global_step": 369272, "epoch": 2198} {"train_loss": -9.886697769165039, "global_step": 369273, "epoch": 2198} {"train_loss": -10.352697372436523, "global_step": 369274, "epoch": 2198} {"train_loss": -10.045756340026855, "global_step": 369275, "epoch": 2198} {"train_loss": -10.114063262939453, "global_step": 369276, "epoch": 2198} {"train_loss": -8.392483711242676, "global_step": 369277, "epoch": 2198} {"train_loss": -8.395999908447266, "global_step": 369278, "epoch": 2198} {"train_loss": -9.852080345153809, "global_step": 369279, "epoch": 2198} {"train_loss": -8.87625503540039, "global_step": 369280, "epoch": 2198} {"train_loss": -9.941694259643555, "global_step": 369281, "epoch": 2198} {"train_loss": -9.850963592529297, "global_step": 369282, "epoch": 2198} {"train_loss": -9.089603424072266, "global_step": 369283, "epoch": 2198} {"train_loss": -9.65750789642334, "global_step": 369284, "epoch": 2198} {"train_loss": -10.485742568969727, "global_step": 369285, "epoch": 2198} {"train_loss": -10.82816219329834, "global_step": 369286, "epoch": 2198} {"train_loss": -9.70083999633789, "global_step": 369287, "epoch": 2198} {"train_loss": -9.878267288208008, "global_step": 369288, "epoch": 2198} {"train_loss": -10.902862548828125, "global_step": 369289, "epoch": 2198} {"train_loss": -10.534378051757812, "global_step": 369290, "epoch": 2198} {"train_loss": -10.816105842590332, "global_step": 369291, "epoch": 2198} {"train_loss": -11.274669647216797, "global_step": 369292, "epoch": 2198} {"train_loss": -9.9266996383667, "global_step": 369293, "epoch": 2198} {"train_loss": -11.187577247619629, "global_step": 369294, "epoch": 2198} {"train_loss": -10.616693496704102, "global_step": 369295, "epoch": 2198} {"train_loss": -9.750385284423828, "global_step": 369296, "epoch": 2198} {"train_loss": -11.505523681640625, "global_step": 369297, "epoch": 2198} {"train_loss": -10.671957015991211, "global_step": 369298, "epoch": 2198} {"train_loss": -9.679709434509277, "global_step": 369299, "epoch": 2198} {"train_loss": -11.648216247558594, "global_step": 369300, "epoch": 2198} {"train_loss": -10.487875938415527, "global_step": 369301, "epoch": 2198} {"train_loss": -9.426957130432129, "global_step": 369302, "epoch": 2198} {"train_loss": -11.389375686645508, "global_step": 369303, "epoch": 2198} {"train_loss": -10.728952407836914, "global_step": 369304, "epoch": 2198} {"train_loss": -10.595229148864746, "global_step": 369305, "epoch": 2198} {"train_loss": -11.498002052307129, "global_step": 369306, "epoch": 2198} {"train_loss": -11.631233215332031, "global_step": 369307, "epoch": 2198} {"train_loss": -10.58311939239502, "global_step": 369308, "epoch": 2198} {"train_loss": -11.868257522583008, "global_step": 369309, "epoch": 2198} {"train_loss": -12.021268844604492, "global_step": 369310, "epoch": 2198} {"train_loss": -11.078117370605469, "global_step": 369311, "epoch": 2198} {"train_loss": -11.580389022827148, "global_step": 369312, "epoch": 2198} {"train_loss": -11.692499160766602, "global_step": 369313, "epoch": 2198} {"train_loss": -11.418977737426758, "global_step": 369314, "epoch": 2198} {"train_loss": -11.537880897521973, "global_step": 369315, "epoch": 2198} {"train_loss": -11.836565017700195, "global_step": 369316, "epoch": 2198} {"train_loss": -11.100116729736328, "global_step": 369317, "epoch": 2198} {"train_loss": -11.833906173706055, "global_step": 369318, "epoch": 2198} {"train_loss": -11.951164245605469, "global_step": 369319, "epoch": 2198} {"train_loss": -11.347488403320312, "global_step": 369320, "epoch": 2198} {"train_loss": -11.792295455932617, "global_step": 369321, "epoch": 2198} {"train_loss": -11.240069389343262, "global_step": 369322, "epoch": 2198} {"train_loss": -11.323219299316406, "global_step": 369323, "epoch": 2198} {"train_loss": -11.523422241210938, "global_step": 369324, "epoch": 2198} {"train_loss": -11.730020523071289, "global_step": 369325, "epoch": 2198} {"train_loss": -11.548322677612305, "global_step": 369326, "epoch": 2198} {"train_loss": -11.826465606689453, "global_step": 369327, "epoch": 2198} {"train_loss": -12.161476135253906, "global_step": 369328, "epoch": 2198} {"train_loss": -11.539237022399902, "global_step": 369329, "epoch": 2198} {"train_loss": -11.751450538635254, "global_step": 369330, "epoch": 2198} {"train_loss": -11.873156547546387, "global_step": 369331, "epoch": 2198} {"train_loss": -12.010037422180176, "global_step": 369332, "epoch": 2198} {"train_loss": -11.97381591796875, "global_step": 369333, "epoch": 2198} {"train_loss": -12.007988929748535, "global_step": 369334, "epoch": 2198} {"train_loss": -11.83763599395752, "global_step": 369335, "epoch": 2198} {"train_loss": -12.022015571594238, "global_step": 369336, "epoch": 2198} {"train_loss": -11.784695625305176, "global_step": 369337, "epoch": 2198} {"train_loss": -12.045479774475098, "global_step": 369338, "epoch": 2198} {"train_loss": -12.244495391845703, "global_step": 369339, "epoch": 2198} {"train_loss": -12.128464698791504, "global_step": 369340, "epoch": 2198} {"train_loss": -12.280345916748047, "global_step": 369341, "epoch": 2198} {"train_loss": -12.28633975982666, "global_step": 369342, "epoch": 2198} {"train_loss": -12.326452255249023, "global_step": 369343, "epoch": 2198} {"train_loss": -12.211193084716797, "global_step": 369344, "epoch": 2198} {"train_loss": -12.42232894897461, "global_step": 369345, "epoch": 2198} {"train_loss": -12.009659767150879, "global_step": 369346, "epoch": 2198} {"train_loss": -12.373929023742676, "global_step": 369347, "epoch": 2198} {"train_loss": -12.154436111450195, "global_step": 369348, "epoch": 2198} {"train_loss": -12.618812561035156, "global_step": 369349, "epoch": 2198} {"train_loss": -12.16690444946289, "global_step": 369350, "epoch": 2198} {"train_loss": -12.240823745727539, "global_step": 369351, "epoch": 2198} {"train_loss": -12.19427490234375, "global_step": 369352, "epoch": 2198} {"train_loss": -12.491849899291992, "global_step": 369353, "epoch": 2198} {"train_loss": -12.327932357788086, "global_step": 369354, "epoch": 2198} {"train_loss": -12.390645980834961, "global_step": 369355, "epoch": 2198} {"train_loss": -12.068796157836914, "global_step": 369356, "epoch": 2198} {"train_loss": -12.412773132324219, "global_step": 369357, "epoch": 2198} {"train_loss": -12.401727676391602, "global_step": 369358, "epoch": 2198} {"train_loss": -12.432483673095703, "global_step": 369359, "epoch": 2198} {"train_loss": -12.409067153930664, "global_step": 369360, "epoch": 2198} {"train_loss": -12.502233505249023, "global_step": 369361, "epoch": 2198} {"train_loss": -12.404938697814941, "global_step": 369362, "epoch": 2198} {"train_loss": -12.336833953857422, "global_step": 369363, "epoch": 2198} {"train_loss": -12.313135147094727, "global_step": 369364, "epoch": 2198} {"train_loss": -12.552303314208984, "global_step": 369365, "epoch": 2198} {"train_loss": -11.852031707763672, "global_step": 369366, "epoch": 2198} {"train_loss": -12.490555763244629, "global_step": 369367, "epoch": 2198} {"train_loss": -12.452875137329102, "global_step": 369368, "epoch": 2198} {"train_loss": -12.544010162353516, "global_step": 369369, "epoch": 2198} {"train_loss": -12.446477890014648, "global_step": 369370, "epoch": 2198} {"train_loss": -12.641417503356934, "global_step": 369371, "epoch": 2198} {"train_loss": -12.682132720947266, "global_step": 369372, "epoch": 2198} {"train_loss": -12.656147003173828, "global_step": 369373, "epoch": 2198} {"train_loss": -12.697099685668945, "global_step": 369374, "epoch": 2198} {"train_loss": -12.5575532913208, "global_step": 369375, "epoch": 2198} {"train_loss": -12.577783584594727, "global_step": 369376, "epoch": 2198} {"train_loss": -12.357915878295898, "global_step": 369377, "epoch": 2198} {"train_loss": -12.588171005249023, "global_step": 369378, "epoch": 2198} {"train_loss": -12.622794151306152, "global_step": 369379, "epoch": 2198} {"train_loss": -12.127962112426758, "global_step": 369380, "epoch": 2198} {"train_loss": -12.388960838317871, "global_step": 369381, "epoch": 2198} {"train_loss": -12.001913070678711, "global_step": 369382, "epoch": 2198} {"train_loss": -12.477884292602539, "global_step": 369383, "epoch": 2198} {"train_loss": -11.967308044433594, "global_step": 369384, "epoch": 2198} {"train_loss": -12.317545890808105, "global_step": 369385, "epoch": 2198} {"train_loss": -12.334529876708984, "global_step": 369386, "epoch": 2198} {"train_loss": -12.467997550964355, "global_step": 369387, "epoch": 2198} {"train_loss": -12.452463150024414, "global_step": 369388, "epoch": 2198} {"train_loss": -12.454252243041992, "global_step": 369389, "epoch": 2198} {"train_loss": -11.991549491882324, "global_step": 369390, "epoch": 2198} {"train_loss": -12.035134315490723, "global_step": 369391, "epoch": 2198} {"train_loss": -12.50754165649414, "global_step": 369392, "epoch": 2198} {"train_loss": -12.299259185791016, "global_step": 369393, "epoch": 2198} {"train_loss": -12.048065185546875, "global_step": 369394, "epoch": 2198} {"train_loss": -12.12181282043457, "global_step": 369395, "epoch": 2198} {"train_loss": -12.297008514404297, "global_step": 369396, "epoch": 2198} {"train_loss": -12.654741287231445, "global_step": 369397, "epoch": 2198} {"train_loss": -12.601311683654785, "global_step": 369398, "epoch": 2198} {"train_loss": -12.336028099060059, "global_step": 369399, "epoch": 2198} {"train_loss": -11.64177131652832, "global_step": 369400, "epoch": 2198} {"train_loss": -12.314014434814453, "global_step": 369401, "epoch": 2198} {"train_loss": -12.47648811340332, "global_step": 369402, "epoch": 2198} {"train_loss": -12.501004219055176, "global_step": 369403, "epoch": 2198} {"train_loss": -12.15224838256836, "global_step": 369404, "epoch": 2198} {"train_loss": -12.39589786529541, "global_step": 369405, "epoch": 2198} {"train_loss": -12.581985473632812, "global_step": 369406, "epoch": 2198} {"train_loss": -12.629331588745117, "global_step": 369407, "epoch": 2198} {"train_loss": -12.200227737426758, "global_step": 369408, "epoch": 2198} {"train_loss": -12.466695785522461, "global_step": 369409, "epoch": 2198} {"train_loss": -12.406415939331055, "global_step": 369410, "epoch": 2198} {"train_loss": -12.510871887207031, "global_step": 369411, "epoch": 2198} {"train_loss": -12.245135307312012, "global_step": 369412, "epoch": 2198} {"train_loss": -12.349555969238281, "global_step": 369413, "epoch": 2198} {"train_loss": -12.311944007873535, "global_step": 369414, "epoch": 2198} {"train_loss": -12.479284286499023, "global_step": 369415, "epoch": 2198} {"train_loss": -12.332979202270508, "global_step": 369416, "epoch": 2198} {"train_loss": -12.275264739990234, "global_step": 369417, "epoch": 2198} {"train_loss": -11.483942985534668, "global_step": 369418, "epoch": 2198} {"train_loss": -11.160555839538574, "global_step": 369419, "epoch": 2198} {"train_loss": -10.64523696899414, "global_step": 369420, "epoch": 2198} {"train_loss": -11.710464477539062, "global_step": 369421, "epoch": 2198} {"train_loss": -10.245037078857422, "global_step": 369422, "epoch": 2198} {"train_loss": -8.228239059448242, "global_step": 369423, "epoch": 2198} {"train_loss": -10.130570411682129, "global_step": 369424, "epoch": 2198} {"train_loss": -9.310224533081055, "global_step": 369425, "epoch": 2198} {"train_loss": -11.219688415527344, "global_step": 369426, "epoch": 2198} {"train_loss": -8.604177474975586, "global_step": 369427, "epoch": 2198} {"train_loss": -8.465002059936523, "global_step": 369428, "epoch": 2198} {"train_loss": -7.831455707550049, "global_step": 369429, "epoch": 2198} {"train_loss": -8.896527290344238, "global_step": 369430, "epoch": 2198} {"train_loss": -11.499825327169328, "global_step": 369431, "epoch": 2198, "val_loss": 291873.5625} {"train_loss": -9.68754768371582, "global_step": 369432, "epoch": 2199} {"train_loss": -8.209017753601074, "global_step": 369433, "epoch": 2199} {"train_loss": -9.107956886291504, "global_step": 369434, "epoch": 2199} {"train_loss": -9.9033842086792, "global_step": 369435, "epoch": 2199} {"train_loss": -10.110042572021484, "global_step": 369436, "epoch": 2199} {"train_loss": -9.53225326538086, "global_step": 369437, "epoch": 2199} {"train_loss": -9.491154670715332, "global_step": 369438, "epoch": 2199} {"train_loss": -10.146027565002441, "global_step": 369439, "epoch": 2199} {"train_loss": -11.184146881103516, "global_step": 369440, "epoch": 2199} {"train_loss": -10.924062728881836, "global_step": 369441, "epoch": 2199} {"train_loss": -10.264840126037598, "global_step": 369442, "epoch": 2199} {"train_loss": -11.005300521850586, "global_step": 369443, "epoch": 2199} {"train_loss": -10.511137008666992, "global_step": 369444, "epoch": 2199} {"train_loss": -10.6821928024292, "global_step": 369445, "epoch": 2199} {"train_loss": -10.715188980102539, "global_step": 369446, "epoch": 2199} {"train_loss": -11.263594627380371, "global_step": 369447, "epoch": 2199} {"train_loss": -10.276611328125, "global_step": 369448, "epoch": 2199} {"train_loss": -11.339300155639648, "global_step": 369449, "epoch": 2199} {"train_loss": -10.382116317749023, "global_step": 369450, "epoch": 2199} {"train_loss": -11.701873779296875, "global_step": 369451, "epoch": 2199} {"train_loss": -10.377580642700195, "global_step": 369452, "epoch": 2199} {"train_loss": -11.44002628326416, "global_step": 369453, "epoch": 2199} {"train_loss": -11.180606842041016, "global_step": 369454, "epoch": 2199} {"train_loss": -11.032657623291016, "global_step": 369455, "epoch": 2199} {"train_loss": -11.110642433166504, "global_step": 369456, "epoch": 2199} {"train_loss": -11.908493041992188, "global_step": 369457, "epoch": 2199} {"train_loss": -11.325923919677734, "global_step": 369458, "epoch": 2199} {"train_loss": -11.674057006835938, "global_step": 369459, "epoch": 2199} {"train_loss": -10.916842460632324, "global_step": 369460, "epoch": 2199} {"train_loss": -11.858214378356934, "global_step": 369461, "epoch": 2199} {"train_loss": -11.141447067260742, "global_step": 369462, "epoch": 2199} {"train_loss": -11.958732604980469, "global_step": 369463, "epoch": 2199} {"train_loss": -11.496138572692871, "global_step": 369464, "epoch": 2199} {"train_loss": -11.501920700073242, "global_step": 369465, "epoch": 2199} {"train_loss": -11.557195663452148, "global_step": 369466, "epoch": 2199} {"train_loss": -11.561601638793945, "global_step": 369467, "epoch": 2199} {"train_loss": -11.883584022521973, "global_step": 369468, "epoch": 2199} {"train_loss": -11.582772254943848, "global_step": 369469, "epoch": 2199} {"train_loss": -11.548553466796875, "global_step": 369470, "epoch": 2199} {"train_loss": -12.077590942382812, "global_step": 369471, "epoch": 2199} {"train_loss": -11.890382766723633, "global_step": 369472, "epoch": 2199} {"train_loss": -12.114145278930664, "global_step": 369473, "epoch": 2199} {"train_loss": -11.634099960327148, "global_step": 369474, "epoch": 2199} {"train_loss": -12.003523826599121, "global_step": 369475, "epoch": 2199} {"train_loss": -12.139275550842285, "global_step": 369476, "epoch": 2199} {"train_loss": -11.8277587890625, "global_step": 369477, "epoch": 2199} {"train_loss": -11.92103385925293, "global_step": 369478, "epoch": 2199} {"train_loss": -12.206585884094238, "global_step": 369479, "epoch": 2199} {"train_loss": -11.85551929473877, "global_step": 369480, "epoch": 2199} {"train_loss": -12.060188293457031, "global_step": 369481, "epoch": 2199} {"train_loss": -12.044541358947754, "global_step": 369482, "epoch": 2199} {"train_loss": -11.966485023498535, "global_step": 369483, "epoch": 2199} {"train_loss": -12.143526077270508, "global_step": 369484, "epoch": 2199} {"train_loss": -11.898048400878906, "global_step": 369485, "epoch": 2199} {"train_loss": -11.857000350952148, "global_step": 369486, "epoch": 2199} {"train_loss": -12.279430389404297, "global_step": 369487, "epoch": 2199} {"train_loss": -12.116813659667969, "global_step": 369488, "epoch": 2199} {"train_loss": -12.128538131713867, "global_step": 369489, "epoch": 2199} {"train_loss": -11.862239837646484, "global_step": 369490, "epoch": 2199} {"train_loss": -12.07740592956543, "global_step": 369491, "epoch": 2199} {"train_loss": -12.035537719726562, "global_step": 369492, "epoch": 2199} {"train_loss": -11.511667251586914, "global_step": 369493, "epoch": 2199} {"train_loss": -12.118860244750977, "global_step": 369494, "epoch": 2199} {"train_loss": -11.909896850585938, "global_step": 369495, "epoch": 2199} {"train_loss": -12.102205276489258, "global_step": 369496, "epoch": 2199} {"train_loss": -11.75924015045166, "global_step": 369497, "epoch": 2199} {"train_loss": -12.14601993560791, "global_step": 369498, "epoch": 2199} {"train_loss": -11.966421127319336, "global_step": 369499, "epoch": 2199} {"train_loss": -12.250126838684082, "global_step": 369500, "epoch": 2199} {"train_loss": -12.23309326171875, "global_step": 369501, "epoch": 2199} {"train_loss": -12.262022018432617, "global_step": 369502, "epoch": 2199} {"train_loss": -12.092536926269531, "global_step": 369503, "epoch": 2199} {"train_loss": -12.124238967895508, "global_step": 369504, "epoch": 2199} {"train_loss": -11.417097091674805, "global_step": 369505, "epoch": 2199} {"train_loss": -12.131616592407227, "global_step": 369506, "epoch": 2199} {"train_loss": -12.182600021362305, "global_step": 369507, "epoch": 2199} {"train_loss": -11.938980102539062, "global_step": 369508, "epoch": 2199} {"train_loss": -12.210653305053711, "global_step": 369509, "epoch": 2199} {"train_loss": -11.725156784057617, "global_step": 369510, "epoch": 2199} {"train_loss": -12.34018325805664, "global_step": 369511, "epoch": 2199} {"train_loss": -12.03271484375, "global_step": 369512, "epoch": 2199} {"train_loss": -12.367914199829102, "global_step": 369513, "epoch": 2199} {"train_loss": -11.932214736938477, "global_step": 369514, "epoch": 2199} {"train_loss": -12.323634147644043, "global_step": 369515, "epoch": 2199} {"train_loss": -11.524712562561035, "global_step": 369516, "epoch": 2199} {"train_loss": -11.971596717834473, "global_step": 369517, "epoch": 2199} {"train_loss": -11.751008987426758, "global_step": 369518, "epoch": 2199} {"train_loss": -12.00184154510498, "global_step": 369519, "epoch": 2199} {"train_loss": -12.19310474395752, "global_step": 369520, "epoch": 2199} {"train_loss": -12.094512939453125, "global_step": 369521, "epoch": 2199} {"train_loss": -12.16529369354248, "global_step": 369522, "epoch": 2199} {"train_loss": -12.05113410949707, "global_step": 369523, "epoch": 2199} {"train_loss": -12.252067565917969, "global_step": 369524, "epoch": 2199} {"train_loss": -12.562976837158203, "global_step": 369525, "epoch": 2199} {"train_loss": -11.96087646484375, "global_step": 369526, "epoch": 2199} {"train_loss": -12.407764434814453, "global_step": 369527, "epoch": 2199} {"train_loss": -12.528448104858398, "global_step": 369528, "epoch": 2199} {"train_loss": -12.339967727661133, "global_step": 369529, "epoch": 2199} {"train_loss": -12.456350326538086, "global_step": 369530, "epoch": 2199} {"train_loss": -12.378888130187988, "global_step": 369531, "epoch": 2199} {"train_loss": -12.188282012939453, "global_step": 369532, "epoch": 2199} {"train_loss": -12.360932350158691, "global_step": 369533, "epoch": 2199} {"train_loss": -12.408622741699219, "global_step": 369534, "epoch": 2199} {"train_loss": -12.434549331665039, "global_step": 369535, "epoch": 2199} {"train_loss": -12.563441276550293, "global_step": 369536, "epoch": 2199} {"train_loss": -12.518648147583008, "global_step": 369537, "epoch": 2199} {"train_loss": -12.490337371826172, "global_step": 369538, "epoch": 2199} {"train_loss": -12.534099578857422, "global_step": 369539, "epoch": 2199} {"train_loss": -12.517426490783691, "global_step": 369540, "epoch": 2199} {"train_loss": -12.79002571105957, "global_step": 369541, "epoch": 2199} {"train_loss": -12.319671630859375, "global_step": 369542, "epoch": 2199} {"train_loss": -12.347725868225098, "global_step": 369543, "epoch": 2199} {"train_loss": -12.109175682067871, "global_step": 369544, "epoch": 2199} {"train_loss": -12.642590522766113, "global_step": 369545, "epoch": 2199} {"train_loss": -12.491009712219238, "global_step": 369546, "epoch": 2199} {"train_loss": -12.175052642822266, "global_step": 369547, "epoch": 2199} {"train_loss": -12.48865795135498, "global_step": 369548, "epoch": 2199} {"train_loss": -12.31926155090332, "global_step": 369549, "epoch": 2199} {"train_loss": -12.69399642944336, "global_step": 369550, "epoch": 2199} {"train_loss": -12.531351089477539, "global_step": 369551, "epoch": 2199} {"train_loss": -12.566551208496094, "global_step": 369552, "epoch": 2199} {"train_loss": -12.626961708068848, "global_step": 369553, "epoch": 2199} {"train_loss": -12.499061584472656, "global_step": 369554, "epoch": 2199} {"train_loss": -12.004709243774414, "global_step": 369555, "epoch": 2199} {"train_loss": -12.106258392333984, "global_step": 369556, "epoch": 2199} {"train_loss": -12.385766983032227, "global_step": 369557, "epoch": 2199} {"train_loss": -12.418989181518555, "global_step": 369558, "epoch": 2199} {"train_loss": -12.026700973510742, "global_step": 369559, "epoch": 2199} {"train_loss": -12.515897750854492, "global_step": 369560, "epoch": 2199} {"train_loss": -12.611007690429688, "global_step": 369561, "epoch": 2199} {"train_loss": -12.199371337890625, "global_step": 369562, "epoch": 2199} {"train_loss": -12.505054473876953, "global_step": 369563, "epoch": 2199} {"train_loss": -12.291006088256836, "global_step": 369564, "epoch": 2199} {"train_loss": -12.4045991897583, "global_step": 369565, "epoch": 2199} {"train_loss": -12.586066246032715, "global_step": 369566, "epoch": 2199} {"train_loss": -12.128811836242676, "global_step": 369567, "epoch": 2199} {"train_loss": -11.888309478759766, "global_step": 369568, "epoch": 2199} {"train_loss": -11.816171646118164, "global_step": 369569, "epoch": 2199} {"train_loss": -11.919818878173828, "global_step": 369570, "epoch": 2199} {"train_loss": -12.339599609375, "global_step": 369571, "epoch": 2199} {"train_loss": -11.44028091430664, "global_step": 369572, "epoch": 2199} {"train_loss": -11.487964630126953, "global_step": 369573, "epoch": 2199} {"train_loss": -12.111907958984375, "global_step": 369574, "epoch": 2199} {"train_loss": -8.950660705566406, "global_step": 369575, "epoch": 2199} {"train_loss": -10.526880264282227, "global_step": 369576, "epoch": 2199} {"train_loss": -8.847225189208984, "global_step": 369577, "epoch": 2199} {"train_loss": -8.746109008789062, "global_step": 369578, "epoch": 2199} {"train_loss": -7.747008323669434, "global_step": 369579, "epoch": 2199} {"train_loss": -8.132877349853516, "global_step": 369580, "epoch": 2199} {"train_loss": -8.733285903930664, "global_step": 369581, "epoch": 2199} {"train_loss": -8.824625968933105, "global_step": 369582, "epoch": 2199} {"train_loss": -10.795933723449707, "global_step": 369583, "epoch": 2199} {"train_loss": -10.326190948486328, "global_step": 369584, "epoch": 2199} {"train_loss": -8.735006332397461, "global_step": 369585, "epoch": 2199} {"train_loss": -11.039361953735352, "global_step": 369586, "epoch": 2199} {"train_loss": -9.084634780883789, "global_step": 369587, "epoch": 2199} {"train_loss": -7.998565673828125, "global_step": 369588, "epoch": 2199} {"train_loss": -7.705981731414795, "global_step": 369589, "epoch": 2199} {"train_loss": -8.211763381958008, "global_step": 369590, "epoch": 2199} {"train_loss": -8.558826446533203, "global_step": 369591, "epoch": 2199} {"train_loss": -8.590827941894531, "global_step": 369592, "epoch": 2199} {"train_loss": -8.785067558288574, "global_step": 369593, "epoch": 2199} {"train_loss": -9.499214172363281, "global_step": 369594, "epoch": 2199} {"train_loss": -8.463356018066406, "global_step": 369595, "epoch": 2199} {"train_loss": -8.809062957763672, "global_step": 369596, "epoch": 2199} {"train_loss": -8.51298713684082, "global_step": 369597, "epoch": 2199} {"train_loss": -8.484220504760742, "global_step": 369598, "epoch": 2199} {"train_loss": -11.387732792468299, "global_step": 369599, "epoch": 2199, "val_loss": 293126.46875} {"train_loss": -9.417298316955566, "global_step": 369600, "epoch": 2200} {"train_loss": -9.133013725280762, "global_step": 369601, "epoch": 2200} {"train_loss": -9.282461166381836, "global_step": 369602, "epoch": 2200} {"train_loss": -9.22801399230957, "global_step": 369603, "epoch": 2200} {"train_loss": -9.743206024169922, "global_step": 369604, "epoch": 2200} {"train_loss": -10.647682189941406, "global_step": 369605, "epoch": 2200} {"train_loss": -10.549355506896973, "global_step": 369606, "epoch": 2200} {"train_loss": -10.2039155960083, "global_step": 369607, "epoch": 2200} {"train_loss": -11.194234848022461, "global_step": 369608, "epoch": 2200} {"train_loss": -10.991631507873535, "global_step": 369609, "epoch": 2200} {"train_loss": -11.211698532104492, "global_step": 369610, "epoch": 2200} {"train_loss": -11.044292449951172, "global_step": 369611, "epoch": 2200} {"train_loss": -10.546371459960938, "global_step": 369612, "epoch": 2200} {"train_loss": -11.583649635314941, "global_step": 369613, "epoch": 2200} {"train_loss": -11.028810501098633, "global_step": 369614, "epoch": 2200} {"train_loss": -11.339308738708496, "global_step": 369615, "epoch": 2200} {"train_loss": -11.437383651733398, "global_step": 369616, "epoch": 2200} {"train_loss": -11.725872993469238, "global_step": 369617, "epoch": 2200} {"train_loss": -11.672703742980957, "global_step": 369618, "epoch": 2200} {"train_loss": -11.418710708618164, "global_step": 369619, "epoch": 2200} {"train_loss": -11.650426864624023, "global_step": 369620, "epoch": 2200} {"train_loss": -11.596393585205078, "global_step": 369621, "epoch": 2200} {"train_loss": -11.490324020385742, "global_step": 369622, "epoch": 2200} {"train_loss": -11.881148338317871, "global_step": 369623, "epoch": 2200} {"train_loss": -11.866170883178711, "global_step": 369624, "epoch": 2200} {"train_loss": -12.14706039428711, "global_step": 369625, "epoch": 2200} {"train_loss": -11.918933868408203, "global_step": 369626, "epoch": 2200} {"train_loss": -11.974079132080078, "global_step": 369627, "epoch": 2200} {"train_loss": -11.92003059387207, "global_step": 369628, "epoch": 2200} {"train_loss": -11.671777725219727, "global_step": 369629, "epoch": 2200} {"train_loss": -11.778528213500977, "global_step": 369630, "epoch": 2200} {"train_loss": -11.705373764038086, "global_step": 369631, "epoch": 2200} {"train_loss": -12.209396362304688, "global_step": 369632, "epoch": 2200} {"train_loss": -11.957140922546387, "global_step": 369633, "epoch": 2200} {"train_loss": -12.094861030578613, "global_step": 369634, "epoch": 2200} {"train_loss": -12.101044654846191, "global_step": 369635, "epoch": 2200} {"train_loss": -12.037273406982422, "global_step": 369636, "epoch": 2200} {"train_loss": -12.089762687683105, "global_step": 369637, "epoch": 2200} {"train_loss": -12.31467056274414, "global_step": 369638, "epoch": 2200} {"train_loss": -12.000146865844727, "global_step": 369639, "epoch": 2200} {"train_loss": -12.106180191040039, "global_step": 369640, "epoch": 2200} {"train_loss": -12.205474853515625, "global_step": 369641, "epoch": 2200} {"train_loss": -12.298843383789062, "global_step": 369642, "epoch": 2200} {"train_loss": -12.402734756469727, "global_step": 369643, "epoch": 2200} {"train_loss": -12.237089157104492, "global_step": 369644, "epoch": 2200} {"train_loss": -12.105878829956055, "global_step": 369645, "epoch": 2200} {"train_loss": -12.129262924194336, "global_step": 369646, "epoch": 2200} {"train_loss": -12.370697021484375, "global_step": 369647, "epoch": 2200} {"train_loss": -12.070630073547363, "global_step": 369648, "epoch": 2200} {"train_loss": -12.266901016235352, "global_step": 369649, "epoch": 2200} {"train_loss": -12.191722869873047, "global_step": 369650, "epoch": 2200} {"train_loss": -12.456268310546875, "global_step": 369651, "epoch": 2200} {"train_loss": -12.27845573425293, "global_step": 369652, "epoch": 2200} {"train_loss": -12.381946563720703, "global_step": 369653, "epoch": 2200} {"train_loss": -12.363044738769531, "global_step": 369654, "epoch": 2200} {"train_loss": -12.32117748260498, "global_step": 369655, "epoch": 2200} {"train_loss": -12.55733871459961, "global_step": 369656, "epoch": 2200} {"train_loss": -12.307158470153809, "global_step": 369657, "epoch": 2200} {"train_loss": -12.47420883178711, "global_step": 369658, "epoch": 2200} {"train_loss": -12.518339157104492, "global_step": 369659, "epoch": 2200} {"train_loss": -12.176872253417969, "global_step": 369660, "epoch": 2200} {"train_loss": -12.331443786621094, "global_step": 369661, "epoch": 2200} {"train_loss": -12.466156005859375, "global_step": 369662, "epoch": 2200} {"train_loss": -12.167556762695312, "global_step": 369663, "epoch": 2200} {"train_loss": -12.442530632019043, "global_step": 369664, "epoch": 2200} {"train_loss": -12.426313400268555, "global_step": 369665, "epoch": 2200} {"train_loss": -12.492300033569336, "global_step": 369666, "epoch": 2200} {"train_loss": -12.346208572387695, "global_step": 369667, "epoch": 2200} {"train_loss": -12.519165992736816, "global_step": 369668, "epoch": 2200} {"train_loss": -12.533744812011719, "global_step": 369669, "epoch": 2200} {"train_loss": -12.179637908935547, "global_step": 369670, "epoch": 2200} {"train_loss": -12.564286231994629, "global_step": 369671, "epoch": 2200} {"train_loss": -12.157829284667969, "global_step": 369672, "epoch": 2200} {"train_loss": -12.587655067443848, "global_step": 369673, "epoch": 2200} {"train_loss": -12.059041976928711, "global_step": 369674, "epoch": 2200} {"train_loss": -11.88050651550293, "global_step": 369675, "epoch": 2200} {"train_loss": -12.167376518249512, "global_step": 369676, "epoch": 2200} {"train_loss": -12.398726463317871, "global_step": 369677, "epoch": 2200} {"train_loss": -11.924814224243164, "global_step": 369678, "epoch": 2200} {"train_loss": -12.571893692016602, "global_step": 369679, "epoch": 2200} {"train_loss": -12.11934757232666, "global_step": 369680, "epoch": 2200} {"train_loss": -12.208377838134766, "global_step": 369681, "epoch": 2200} {"train_loss": -12.312515258789062, "global_step": 369682, "epoch": 2200} {"train_loss": -12.429253578186035, "global_step": 369683, "epoch": 2200} {"train_loss": -11.960000991821289, "global_step": 369684, "epoch": 2200} {"train_loss": -12.519073486328125, "global_step": 369685, "epoch": 2200} {"train_loss": -12.295129776000977, "global_step": 369686, "epoch": 2200} {"train_loss": -12.120096206665039, "global_step": 369687, "epoch": 2200} {"train_loss": -11.695999145507812, "global_step": 369688, "epoch": 2200} {"train_loss": -12.3688325881958, "global_step": 369689, "epoch": 2200} {"train_loss": -11.96512222290039, "global_step": 369690, "epoch": 2200} {"train_loss": -11.741863250732422, "global_step": 369691, "epoch": 2200} {"train_loss": -11.90096378326416, "global_step": 369692, "epoch": 2200} {"train_loss": -11.957389831542969, "global_step": 369693, "epoch": 2200} {"train_loss": -11.215513229370117, "global_step": 369694, "epoch": 2200} {"train_loss": -12.442367553710938, "global_step": 369695, "epoch": 2200} {"train_loss": -11.765495300292969, "global_step": 369696, "epoch": 2200} {"train_loss": -11.231029510498047, "global_step": 369697, "epoch": 2200} {"train_loss": -12.548924446105957, "global_step": 369698, "epoch": 2200} {"train_loss": -10.80593204498291, "global_step": 369699, "epoch": 2200} {"train_loss": -11.365716934204102, "global_step": 369700, "epoch": 2200} {"train_loss": -11.97250747680664, "global_step": 369701, "epoch": 2200} {"train_loss": -11.061559677124023, "global_step": 369702, "epoch": 2200} {"train_loss": -12.350776672363281, "global_step": 369703, "epoch": 2200} {"train_loss": -11.952857971191406, "global_step": 369704, "epoch": 2200} {"train_loss": -11.442277908325195, "global_step": 369705, "epoch": 2200} {"train_loss": -12.008447647094727, "global_step": 369706, "epoch": 2200} {"train_loss": -11.314445495605469, "global_step": 369707, "epoch": 2200} {"train_loss": -11.457728385925293, "global_step": 369708, "epoch": 2200} {"train_loss": -11.64682388305664, "global_step": 369709, "epoch": 2200} {"train_loss": -11.219596862792969, "global_step": 369710, "epoch": 2200} {"train_loss": -11.000598907470703, "global_step": 369711, "epoch": 2200} {"train_loss": -12.1612548828125, "global_step": 369712, "epoch": 2200} {"train_loss": -10.944779396057129, "global_step": 369713, "epoch": 2200} {"train_loss": -12.431885719299316, "global_step": 369714, "epoch": 2200} {"train_loss": -11.438848495483398, "global_step": 369715, "epoch": 2200} {"train_loss": -11.51467514038086, "global_step": 369716, "epoch": 2200} {"train_loss": -11.893409729003906, "global_step": 369717, "epoch": 2200} {"train_loss": -11.226297378540039, "global_step": 369718, "epoch": 2200} {"train_loss": -11.310230255126953, "global_step": 369719, "epoch": 2200} {"train_loss": -12.152437210083008, "global_step": 369720, "epoch": 2200} {"train_loss": -11.125808715820312, "global_step": 369721, "epoch": 2200} {"train_loss": -12.432743072509766, "global_step": 369722, "epoch": 2200} {"train_loss": -11.590052604675293, "global_step": 369723, "epoch": 2200} {"train_loss": -12.163616180419922, "global_step": 369724, "epoch": 2200} {"train_loss": -11.786239624023438, "global_step": 369725, "epoch": 2200} {"train_loss": -11.817501068115234, "global_step": 369726, "epoch": 2200} {"train_loss": -12.128211975097656, "global_step": 369727, "epoch": 2200} {"train_loss": -11.874544143676758, "global_step": 369728, "epoch": 2200} {"train_loss": -12.20545768737793, "global_step": 369729, "epoch": 2200} {"train_loss": -12.051913261413574, "global_step": 369730, "epoch": 2200} {"train_loss": -11.948128700256348, "global_step": 369731, "epoch": 2200} {"train_loss": -12.25439739227295, "global_step": 369732, "epoch": 2200} {"train_loss": -12.069798469543457, "global_step": 369733, "epoch": 2200} {"train_loss": -12.177715301513672, "global_step": 369734, "epoch": 2200} {"train_loss": -12.272045135498047, "global_step": 369735, "epoch": 2200} {"train_loss": -12.215591430664062, "global_step": 369736, "epoch": 2200} {"train_loss": -12.116910934448242, "global_step": 369737, "epoch": 2200} {"train_loss": -12.251487731933594, "global_step": 369738, "epoch": 2200} {"train_loss": -12.163666725158691, "global_step": 369739, "epoch": 2200} {"train_loss": -11.973106384277344, "global_step": 369740, "epoch": 2200} {"train_loss": -12.015872955322266, "global_step": 369741, "epoch": 2200} {"train_loss": -12.212270736694336, "global_step": 369742, "epoch": 2200} {"train_loss": -12.018264770507812, "global_step": 369743, "epoch": 2200} {"train_loss": -11.912895202636719, "global_step": 369744, "epoch": 2200} {"train_loss": -11.928114891052246, "global_step": 369745, "epoch": 2200} {"train_loss": -12.28448486328125, "global_step": 369746, "epoch": 2200} {"train_loss": -12.025020599365234, "global_step": 369747, "epoch": 2200} {"train_loss": -12.219013214111328, "global_step": 369748, "epoch": 2200} {"train_loss": -11.995623588562012, "global_step": 369749, "epoch": 2200} {"train_loss": -12.245162963867188, "global_step": 369750, "epoch": 2200} {"train_loss": -11.702946662902832, "global_step": 369751, "epoch": 2200} {"train_loss": -11.637572288513184, "global_step": 369752, "epoch": 2200} {"train_loss": -12.354022979736328, "global_step": 369753, "epoch": 2200} {"train_loss": -10.92005729675293, "global_step": 369754, "epoch": 2200} {"train_loss": -11.226062774658203, "global_step": 369755, "epoch": 2200} {"train_loss": -11.460803985595703, "global_step": 369756, "epoch": 2200} {"train_loss": -11.872051239013672, "global_step": 369757, "epoch": 2200} {"train_loss": -11.411219596862793, "global_step": 369758, "epoch": 2200} {"train_loss": -11.819689750671387, "global_step": 369759, "epoch": 2200} {"train_loss": -11.699210166931152, "global_step": 369760, "epoch": 2200} {"train_loss": -10.890436172485352, "global_step": 369761, "epoch": 2200} {"train_loss": -11.916173934936523, "global_step": 369762, "epoch": 2200} {"train_loss": -11.890340805053711, "global_step": 369763, "epoch": 2200} {"train_loss": -11.55115795135498, "global_step": 369764, "epoch": 2200} {"train_loss": -11.524087905883789, "global_step": 369765, "epoch": 2200} {"train_loss": -11.69984245300293, "global_step": 369766, "epoch": 2200} {"train_loss": -11.82254489830562, "global_step": 369767, "epoch": 2200, "train/sim_max_reward_0": 0.6917727889518377, "train/sim_max_reward_1": 0.8713387354862484, "train/sim_max_reward_2": 0.0025130569160171827, "train/sim_max_reward_3": 0.6362763959458111, "train/sim_max_reward_4": 0.9996928053569851, "train/sim_max_reward_5": 0.5236102420171305, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.3762551336788446, "test/sim_max_reward_4400002": 0.06075520299340144, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.4808675660405545, "test/sim_max_reward_4400005": 0.9905433917718109, "test/sim_max_reward_4400006": 0.25555732880621396, "test/sim_max_reward_4400007": 0.25383666998786436, "test/sim_max_reward_4400008": 0.5474236165082953, "test/sim_max_reward_4400009": 0.3730869023502401, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 0.992265225864828, "test/sim_max_reward_4400012": 0.8816631262695861, "test/sim_max_reward_4400013": 0.9359225290086943, "test/sim_max_reward_4400014": 0.6031753903085288, "test/sim_max_reward_4400015": 0.47329093822323237, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.1620252275358809, "test/sim_max_reward_4400018": 0.9854877891430764, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.8981981890917523, "test/sim_max_reward_4400022": 0.9687263776676222, "test/sim_max_reward_4400023": 0.16092840589158164, "test/sim_max_reward_4400024": 0.8399060797803826, "test/sim_max_reward_4400025": 0.563200927390023, "test/sim_max_reward_4400026": 0.6677374719892553, "test/sim_max_reward_4400027": 0.6822158880706379, "test/sim_max_reward_4400028": 0.6078918652071068, "test/sim_max_reward_4400029": 0.4566347080053005, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.13400765352316943, "test/sim_max_reward_4400033": 0.4676305909546347, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.37300797258190815, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.29907876418351076, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.17485614834712654, "test/sim_max_reward_4400042": 0.6114176992765764, "test/sim_max_reward_4400043": 0.01985166508452029, "test/sim_max_reward_4400044": 0.9660969601534769, "test/sim_max_reward_4400045": 0.10467440200598997, "test/sim_max_reward_4400046": 0.31007824713209975, "test/sim_max_reward_4400047": 0.9943960142777475, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6208673374456716, "test/mean_score": 0.5073754463466311, "val_loss": 292675.28125, "train_action_mse_error": 1.3229053020477295} {"train_loss": -11.687540054321289, "global_step": 369768, "epoch": 2201} {"train_loss": -11.881797790527344, "global_step": 369769, "epoch": 2201} {"train_loss": -12.05918025970459, "global_step": 369770, "epoch": 2201} {"train_loss": -12.093791961669922, "global_step": 369771, "epoch": 2201} {"train_loss": -11.74464225769043, "global_step": 369772, "epoch": 2201} {"train_loss": -11.990821838378906, "global_step": 369773, "epoch": 2201} {"train_loss": -11.412650108337402, "global_step": 369774, "epoch": 2201} {"train_loss": -11.929015159606934, "global_step": 369775, "epoch": 2201} {"train_loss": -11.609983444213867, "global_step": 369776, "epoch": 2201} {"train_loss": -11.552705764770508, "global_step": 369777, "epoch": 2201} {"train_loss": -11.606761932373047, "global_step": 369778, "epoch": 2201} {"train_loss": -11.732257843017578, "global_step": 369779, "epoch": 2201} {"train_loss": -11.64661979675293, "global_step": 369780, "epoch": 2201} {"train_loss": -12.279420852661133, "global_step": 369781, "epoch": 2201} {"train_loss": -11.700974464416504, "global_step": 369782, "epoch": 2201} {"train_loss": -12.363096237182617, "global_step": 369783, "epoch": 2201} {"train_loss": -11.910444259643555, "global_step": 369784, "epoch": 2201} {"train_loss": -12.221689224243164, "global_step": 369785, "epoch": 2201} {"train_loss": -12.088735580444336, "global_step": 369786, "epoch": 2201} {"train_loss": -12.242644309997559, "global_step": 369787, "epoch": 2201} {"train_loss": -12.229281425476074, "global_step": 369788, "epoch": 2201} {"train_loss": -11.385184288024902, "global_step": 369789, "epoch": 2201} {"train_loss": -12.09652328491211, "global_step": 369790, "epoch": 2201} {"train_loss": -11.545612335205078, "global_step": 369791, "epoch": 2201} {"train_loss": -12.052414894104004, "global_step": 369792, "epoch": 2201} {"train_loss": -11.052664756774902, "global_step": 369793, "epoch": 2201} {"train_loss": -12.108762741088867, "global_step": 369794, "epoch": 2201} {"train_loss": -11.241998672485352, "global_step": 369795, "epoch": 2201} {"train_loss": -12.159652709960938, "global_step": 369796, "epoch": 2201} {"train_loss": -11.334060668945312, "global_step": 369797, "epoch": 2201} {"train_loss": -12.04460334777832, "global_step": 369798, "epoch": 2201} {"train_loss": -11.800955772399902, "global_step": 369799, "epoch": 2201} {"train_loss": -11.899601936340332, "global_step": 369800, "epoch": 2201} {"train_loss": -11.748716354370117, "global_step": 369801, "epoch": 2201} {"train_loss": -11.898706436157227, "global_step": 369802, "epoch": 2201} {"train_loss": -11.802719116210938, "global_step": 369803, "epoch": 2201} {"train_loss": -11.732105255126953, "global_step": 369804, "epoch": 2201} {"train_loss": -11.74058723449707, "global_step": 369805, "epoch": 2201} {"train_loss": -11.163179397583008, "global_step": 369806, "epoch": 2201} {"train_loss": -12.044548034667969, "global_step": 369807, "epoch": 2201} {"train_loss": -11.846673965454102, "global_step": 369808, "epoch": 2201} {"train_loss": -12.159085273742676, "global_step": 369809, "epoch": 2201} {"train_loss": -12.050529479980469, "global_step": 369810, "epoch": 2201} {"train_loss": -12.151168823242188, "global_step": 369811, "epoch": 2201} {"train_loss": -12.199113845825195, "global_step": 369812, "epoch": 2201} {"train_loss": -11.980142593383789, "global_step": 369813, "epoch": 2201} {"train_loss": -11.962392807006836, "global_step": 369814, "epoch": 2201} {"train_loss": -12.08004379272461, "global_step": 369815, "epoch": 2201} {"train_loss": -12.039535522460938, "global_step": 369816, "epoch": 2201} {"train_loss": -11.878410339355469, "global_step": 369817, "epoch": 2201} {"train_loss": -12.230770111083984, "global_step": 369818, "epoch": 2201} {"train_loss": -11.521066665649414, "global_step": 369819, "epoch": 2201} {"train_loss": -12.405563354492188, "global_step": 369820, "epoch": 2201} {"train_loss": -11.79344367980957, "global_step": 369821, "epoch": 2201} {"train_loss": -11.830709457397461, "global_step": 369822, "epoch": 2201} {"train_loss": -12.33095645904541, "global_step": 369823, "epoch": 2201} {"train_loss": -12.210306167602539, "global_step": 369824, "epoch": 2201} {"train_loss": -12.364526748657227, "global_step": 369825, "epoch": 2201} {"train_loss": -12.292706489562988, "global_step": 369826, "epoch": 2201} {"train_loss": -12.3638916015625, "global_step": 369827, "epoch": 2201} {"train_loss": -12.274103164672852, "global_step": 369828, "epoch": 2201} {"train_loss": -12.621820449829102, "global_step": 369829, "epoch": 2201} {"train_loss": -12.338810920715332, "global_step": 369830, "epoch": 2201} {"train_loss": -12.494961738586426, "global_step": 369831, "epoch": 2201} {"train_loss": -12.454431533813477, "global_step": 369832, "epoch": 2201} {"train_loss": -12.488069534301758, "global_step": 369833, "epoch": 2201} {"train_loss": -12.228588104248047, "global_step": 369834, "epoch": 2201} {"train_loss": -12.064849853515625, "global_step": 369835, "epoch": 2201} {"train_loss": -12.180907249450684, "global_step": 369836, "epoch": 2201} {"train_loss": -12.319421768188477, "global_step": 369837, "epoch": 2201} {"train_loss": -12.20425033569336, "global_step": 369838, "epoch": 2201} {"train_loss": -12.491971015930176, "global_step": 369839, "epoch": 2201} {"train_loss": -12.599039077758789, "global_step": 369840, "epoch": 2201} {"train_loss": -12.05299186706543, "global_step": 369841, "epoch": 2201} {"train_loss": -12.494731903076172, "global_step": 369842, "epoch": 2201} {"train_loss": -12.290897369384766, "global_step": 369843, "epoch": 2201} {"train_loss": -11.906508445739746, "global_step": 369844, "epoch": 2201} {"train_loss": -12.093097686767578, "global_step": 369845, "epoch": 2201} {"train_loss": -11.715904235839844, "global_step": 369846, "epoch": 2201} {"train_loss": -11.398082733154297, "global_step": 369847, "epoch": 2201} {"train_loss": -11.607057571411133, "global_step": 369848, "epoch": 2201} {"train_loss": -10.386099815368652, "global_step": 369849, "epoch": 2201} {"train_loss": -9.768710136413574, "global_step": 369850, "epoch": 2201} {"train_loss": -11.436081886291504, "global_step": 369851, "epoch": 2201} {"train_loss": -10.42680549621582, "global_step": 369852, "epoch": 2201} {"train_loss": -10.931559562683105, "global_step": 369853, "epoch": 2201} {"train_loss": -11.031197547912598, "global_step": 369854, "epoch": 2201} {"train_loss": -9.551899909973145, "global_step": 369855, "epoch": 2201} {"train_loss": -10.670888900756836, "global_step": 369856, "epoch": 2201} {"train_loss": -10.816041946411133, "global_step": 369857, "epoch": 2201} {"train_loss": -9.554262161254883, "global_step": 369858, "epoch": 2201} {"train_loss": -11.29326057434082, "global_step": 369859, "epoch": 2201} {"train_loss": -10.922539710998535, "global_step": 369860, "epoch": 2201} {"train_loss": -9.611272811889648, "global_step": 369861, "epoch": 2201} {"train_loss": -10.555870056152344, "global_step": 369862, "epoch": 2201} {"train_loss": -10.59599494934082, "global_step": 369863, "epoch": 2201} {"train_loss": -10.2642240524292, "global_step": 369864, "epoch": 2201} {"train_loss": -10.607491493225098, "global_step": 369865, "epoch": 2201} {"train_loss": -10.990677833557129, "global_step": 369866, "epoch": 2201} {"train_loss": -10.54251766204834, "global_step": 369867, "epoch": 2201} {"train_loss": -11.125057220458984, "global_step": 369868, "epoch": 2201} {"train_loss": -10.52468204498291, "global_step": 369869, "epoch": 2201} {"train_loss": -10.515018463134766, "global_step": 369870, "epoch": 2201} {"train_loss": -11.799670219421387, "global_step": 369871, "epoch": 2201} {"train_loss": -10.700828552246094, "global_step": 369872, "epoch": 2201} {"train_loss": -10.92593002319336, "global_step": 369873, "epoch": 2201} {"train_loss": -11.064959526062012, "global_step": 369874, "epoch": 2201} {"train_loss": -10.00694465637207, "global_step": 369875, "epoch": 2201} {"train_loss": -10.903914451599121, "global_step": 369876, "epoch": 2201} {"train_loss": -10.675430297851562, "global_step": 369877, "epoch": 2201} {"train_loss": -10.711721420288086, "global_step": 369878, "epoch": 2201} {"train_loss": -10.839786529541016, "global_step": 369879, "epoch": 2201} {"train_loss": -11.139812469482422, "global_step": 369880, "epoch": 2201} {"train_loss": -10.739145278930664, "global_step": 369881, "epoch": 2201} {"train_loss": -11.591266632080078, "global_step": 369882, "epoch": 2201} {"train_loss": -11.285247802734375, "global_step": 369883, "epoch": 2201} {"train_loss": -11.721281051635742, "global_step": 369884, "epoch": 2201} {"train_loss": -11.605355262756348, "global_step": 369885, "epoch": 2201} {"train_loss": -11.681468963623047, "global_step": 369886, "epoch": 2201} {"train_loss": -11.672775268554688, "global_step": 369887, "epoch": 2201} {"train_loss": -11.840941429138184, "global_step": 369888, "epoch": 2201} {"train_loss": -11.828275680541992, "global_step": 369889, "epoch": 2201} {"train_loss": -11.551607131958008, "global_step": 369890, "epoch": 2201} {"train_loss": -11.851008415222168, "global_step": 369891, "epoch": 2201} {"train_loss": -11.607583999633789, "global_step": 369892, "epoch": 2201} {"train_loss": -11.67353343963623, "global_step": 369893, "epoch": 2201} {"train_loss": -11.964345932006836, "global_step": 369894, "epoch": 2201} {"train_loss": -11.52254581451416, "global_step": 369895, "epoch": 2201} {"train_loss": -11.725553512573242, "global_step": 369896, "epoch": 2201} {"train_loss": -11.507741928100586, "global_step": 369897, "epoch": 2201} {"train_loss": -11.764726638793945, "global_step": 369898, "epoch": 2201} {"train_loss": -11.874649047851562, "global_step": 369899, "epoch": 2201} {"train_loss": -11.802576065063477, "global_step": 369900, "epoch": 2201} {"train_loss": -12.096991539001465, "global_step": 369901, "epoch": 2201} {"train_loss": -11.812453269958496, "global_step": 369902, "epoch": 2201} {"train_loss": -11.949963569641113, "global_step": 369903, "epoch": 2201} {"train_loss": -11.806586265563965, "global_step": 369904, "epoch": 2201} {"train_loss": -11.837400436401367, "global_step": 369905, "epoch": 2201} {"train_loss": -11.797889709472656, "global_step": 369906, "epoch": 2201} {"train_loss": -12.12449836730957, "global_step": 369907, "epoch": 2201} {"train_loss": -11.96458625793457, "global_step": 369908, "epoch": 2201} {"train_loss": -12.267934799194336, "global_step": 369909, "epoch": 2201} {"train_loss": -12.03213119506836, "global_step": 369910, "epoch": 2201} {"train_loss": -11.935935974121094, "global_step": 369911, "epoch": 2201} {"train_loss": -12.077455520629883, "global_step": 369912, "epoch": 2201} {"train_loss": -12.104398727416992, "global_step": 369913, "epoch": 2201} {"train_loss": -11.866296768188477, "global_step": 369914, "epoch": 2201} {"train_loss": -12.37302017211914, "global_step": 369915, "epoch": 2201} {"train_loss": -12.290618896484375, "global_step": 369916, "epoch": 2201} {"train_loss": -12.20590591430664, "global_step": 369917, "epoch": 2201} {"train_loss": -12.36726188659668, "global_step": 369918, "epoch": 2201} {"train_loss": -12.244110107421875, "global_step": 369919, "epoch": 2201} {"train_loss": -12.491985321044922, "global_step": 369920, "epoch": 2201} {"train_loss": -12.130165100097656, "global_step": 369921, "epoch": 2201} {"train_loss": -12.342531204223633, "global_step": 369922, "epoch": 2201} {"train_loss": -12.342628479003906, "global_step": 369923, "epoch": 2201} {"train_loss": -12.036575317382812, "global_step": 369924, "epoch": 2201} {"train_loss": -12.26944351196289, "global_step": 369925, "epoch": 2201} {"train_loss": -12.23534107208252, "global_step": 369926, "epoch": 2201} {"train_loss": -12.494148254394531, "global_step": 369927, "epoch": 2201} {"train_loss": -12.231778144836426, "global_step": 369928, "epoch": 2201} {"train_loss": -12.281623840332031, "global_step": 369929, "epoch": 2201} {"train_loss": -12.463226318359375, "global_step": 369930, "epoch": 2201} {"train_loss": -12.343141555786133, "global_step": 369931, "epoch": 2201} {"train_loss": -12.439990043640137, "global_step": 369932, "epoch": 2201} {"train_loss": -12.494610786437988, "global_step": 369933, "epoch": 2201} {"train_loss": -12.372270584106445, "global_step": 369934, "epoch": 2201} {"train_loss": -11.732713154384069, "global_step": 369935, "epoch": 2201, "val_loss": 294925.21875} {"train_loss": -11.993715286254883, "global_step": 369936, "epoch": 2202} {"train_loss": -11.929778099060059, "global_step": 369937, "epoch": 2202} {"train_loss": -11.99514102935791, "global_step": 369938, "epoch": 2202} {"train_loss": -11.622234344482422, "global_step": 369939, "epoch": 2202} {"train_loss": -11.576953887939453, "global_step": 369940, "epoch": 2202} {"train_loss": -11.20339584350586, "global_step": 369941, "epoch": 2202} {"train_loss": -11.550779342651367, "global_step": 369942, "epoch": 2202} {"train_loss": -10.804832458496094, "global_step": 369943, "epoch": 2202} {"train_loss": -11.496731758117676, "global_step": 369944, "epoch": 2202} {"train_loss": -11.151657104492188, "global_step": 369945, "epoch": 2202} {"train_loss": -11.740842819213867, "global_step": 369946, "epoch": 2202} {"train_loss": -10.895299911499023, "global_step": 369947, "epoch": 2202} {"train_loss": -11.468805313110352, "global_step": 369948, "epoch": 2202} {"train_loss": -11.479771614074707, "global_step": 369949, "epoch": 2202} {"train_loss": -11.825422286987305, "global_step": 369950, "epoch": 2202} {"train_loss": -11.06319522857666, "global_step": 369951, "epoch": 2202} {"train_loss": -12.136948585510254, "global_step": 369952, "epoch": 2202} {"train_loss": -12.092658996582031, "global_step": 369953, "epoch": 2202} {"train_loss": -11.879196166992188, "global_step": 369954, "epoch": 2202} {"train_loss": -12.281471252441406, "global_step": 369955, "epoch": 2202} {"train_loss": -11.215097427368164, "global_step": 369956, "epoch": 2202} {"train_loss": -12.059584617614746, "global_step": 369957, "epoch": 2202} {"train_loss": -11.7052001953125, "global_step": 369958, "epoch": 2202} {"train_loss": -12.119771003723145, "global_step": 369959, "epoch": 2202} {"train_loss": -11.983991622924805, "global_step": 369960, "epoch": 2202} {"train_loss": -11.942071914672852, "global_step": 369961, "epoch": 2202} {"train_loss": -12.41511344909668, "global_step": 369962, "epoch": 2202} {"train_loss": -12.186264991760254, "global_step": 369963, "epoch": 2202} {"train_loss": -12.321172714233398, "global_step": 369964, "epoch": 2202} {"train_loss": -12.290050506591797, "global_step": 369965, "epoch": 2202} {"train_loss": -12.378442764282227, "global_step": 369966, "epoch": 2202} {"train_loss": -12.218278884887695, "global_step": 369967, "epoch": 2202} {"train_loss": -12.443708419799805, "global_step": 369968, "epoch": 2202} {"train_loss": -12.17713737487793, "global_step": 369969, "epoch": 2202} {"train_loss": -12.412599563598633, "global_step": 369970, "epoch": 2202} {"train_loss": -12.431734085083008, "global_step": 369971, "epoch": 2202} {"train_loss": -12.488388061523438, "global_step": 369972, "epoch": 2202} {"train_loss": -12.135841369628906, "global_step": 369973, "epoch": 2202} {"train_loss": -12.435656547546387, "global_step": 369974, "epoch": 2202} {"train_loss": -12.236080169677734, "global_step": 369975, "epoch": 2202} {"train_loss": -12.060981750488281, "global_step": 369976, "epoch": 2202} {"train_loss": -12.445040702819824, "global_step": 369977, "epoch": 2202} {"train_loss": -12.483695983886719, "global_step": 369978, "epoch": 2202} {"train_loss": -12.318275451660156, "global_step": 369979, "epoch": 2202} {"train_loss": -12.402332305908203, "global_step": 369980, "epoch": 2202} {"train_loss": -12.045719146728516, "global_step": 369981, "epoch": 2202} {"train_loss": -12.521265983581543, "global_step": 369982, "epoch": 2202} {"train_loss": -12.157352447509766, "global_step": 369983, "epoch": 2202} {"train_loss": -12.296831130981445, "global_step": 369984, "epoch": 2202} {"train_loss": -12.33244514465332, "global_step": 369985, "epoch": 2202} {"train_loss": -12.130250930786133, "global_step": 369986, "epoch": 2202} {"train_loss": -12.481298446655273, "global_step": 369987, "epoch": 2202} {"train_loss": -12.256429672241211, "global_step": 369988, "epoch": 2202} {"train_loss": -12.114740371704102, "global_step": 369989, "epoch": 2202} {"train_loss": -12.284217834472656, "global_step": 369990, "epoch": 2202} {"train_loss": -12.054990768432617, "global_step": 369991, "epoch": 2202} {"train_loss": -12.363682746887207, "global_step": 369992, "epoch": 2202} {"train_loss": -12.138647079467773, "global_step": 369993, "epoch": 2202} {"train_loss": -12.054483413696289, "global_step": 369994, "epoch": 2202} {"train_loss": -12.386253356933594, "global_step": 369995, "epoch": 2202} {"train_loss": -11.904180526733398, "global_step": 369996, "epoch": 2202} {"train_loss": -12.379204750061035, "global_step": 369997, "epoch": 2202} {"train_loss": -12.407301902770996, "global_step": 369998, "epoch": 2202} {"train_loss": -12.483419418334961, "global_step": 369999, "epoch": 2202} {"train_loss": -12.492295265197754, "global_step": 370000, "epoch": 2202} {"train_loss": -12.413378715515137, "global_step": 370001, "epoch": 2202} {"train_loss": -12.165581703186035, "global_step": 370002, "epoch": 2202} {"train_loss": -12.685495376586914, "global_step": 370003, "epoch": 2202} {"train_loss": -11.948204040527344, "global_step": 370004, "epoch": 2202} {"train_loss": -12.228407859802246, "global_step": 370005, "epoch": 2202} {"train_loss": -12.426316261291504, "global_step": 370006, "epoch": 2202} {"train_loss": -12.451478958129883, "global_step": 370007, "epoch": 2202} {"train_loss": -12.497476577758789, "global_step": 370008, "epoch": 2202} {"train_loss": -12.430843353271484, "global_step": 370009, "epoch": 2202} {"train_loss": -12.25964641571045, "global_step": 370010, "epoch": 2202} {"train_loss": -12.43447208404541, "global_step": 370011, "epoch": 2202} {"train_loss": -12.263375282287598, "global_step": 370012, "epoch": 2202} {"train_loss": -12.407197952270508, "global_step": 370013, "epoch": 2202} {"train_loss": -12.680381774902344, "global_step": 370014, "epoch": 2202} {"train_loss": -12.4226713180542, "global_step": 370015, "epoch": 2202} {"train_loss": -12.314779281616211, "global_step": 370016, "epoch": 2202} {"train_loss": -12.514925956726074, "global_step": 370017, "epoch": 2202} {"train_loss": -12.145076751708984, "global_step": 370018, "epoch": 2202} {"train_loss": -12.498065948486328, "global_step": 370019, "epoch": 2202} {"train_loss": -12.3935546875, "global_step": 370020, "epoch": 2202} {"train_loss": -12.246715545654297, "global_step": 370021, "epoch": 2202} {"train_loss": -11.96570110321045, "global_step": 370022, "epoch": 2202} {"train_loss": -12.648193359375, "global_step": 370023, "epoch": 2202} {"train_loss": -12.12049388885498, "global_step": 370024, "epoch": 2202} {"train_loss": -12.105570793151855, "global_step": 370025, "epoch": 2202} {"train_loss": -12.143167495727539, "global_step": 370026, "epoch": 2202} {"train_loss": -12.47898006439209, "global_step": 370027, "epoch": 2202} {"train_loss": -12.183834075927734, "global_step": 370028, "epoch": 2202} {"train_loss": -12.584092140197754, "global_step": 370029, "epoch": 2202} {"train_loss": -12.507461547851562, "global_step": 370030, "epoch": 2202} {"train_loss": -12.392040252685547, "global_step": 370031, "epoch": 2202} {"train_loss": -12.403804779052734, "global_step": 370032, "epoch": 2202} {"train_loss": -12.628194808959961, "global_step": 370033, "epoch": 2202} {"train_loss": -12.140265464782715, "global_step": 370034, "epoch": 2202} {"train_loss": -11.83222770690918, "global_step": 370035, "epoch": 2202} {"train_loss": -12.189229965209961, "global_step": 370036, "epoch": 2202} {"train_loss": -12.347981452941895, "global_step": 370037, "epoch": 2202} {"train_loss": -12.245485305786133, "global_step": 370038, "epoch": 2202} {"train_loss": -12.487937927246094, "global_step": 370039, "epoch": 2202} {"train_loss": -12.147480010986328, "global_step": 370040, "epoch": 2202} {"train_loss": -12.335777282714844, "global_step": 370041, "epoch": 2202} {"train_loss": -12.409268379211426, "global_step": 370042, "epoch": 2202} {"train_loss": -12.381331443786621, "global_step": 370043, "epoch": 2202} {"train_loss": -12.398700714111328, "global_step": 370044, "epoch": 2202} {"train_loss": -12.243453025817871, "global_step": 370045, "epoch": 2202} {"train_loss": -12.634272575378418, "global_step": 370046, "epoch": 2202} {"train_loss": -12.488483428955078, "global_step": 370047, "epoch": 2202} {"train_loss": -12.623559951782227, "global_step": 370048, "epoch": 2202} {"train_loss": -12.440811157226562, "global_step": 370049, "epoch": 2202} {"train_loss": -12.61593246459961, "global_step": 370050, "epoch": 2202} {"train_loss": -12.406364440917969, "global_step": 370051, "epoch": 2202} {"train_loss": -12.040803909301758, "global_step": 370052, "epoch": 2202} {"train_loss": -11.100728988647461, "global_step": 370053, "epoch": 2202} {"train_loss": -12.236371994018555, "global_step": 370054, "epoch": 2202} {"train_loss": -12.104997634887695, "global_step": 370055, "epoch": 2202} {"train_loss": -12.214365005493164, "global_step": 370056, "epoch": 2202} {"train_loss": -12.069479942321777, "global_step": 370057, "epoch": 2202} {"train_loss": -12.213415145874023, "global_step": 370058, "epoch": 2202} {"train_loss": -12.158771514892578, "global_step": 370059, "epoch": 2202} {"train_loss": -12.16700267791748, "global_step": 370060, "epoch": 2202} {"train_loss": -12.120819091796875, "global_step": 370061, "epoch": 2202} {"train_loss": -12.304847717285156, "global_step": 370062, "epoch": 2202} {"train_loss": -11.266717910766602, "global_step": 370063, "epoch": 2202} {"train_loss": -10.592348098754883, "global_step": 370064, "epoch": 2202} {"train_loss": -11.270627975463867, "global_step": 370065, "epoch": 2202} {"train_loss": -11.967772483825684, "global_step": 370066, "epoch": 2202} {"train_loss": -10.775569915771484, "global_step": 370067, "epoch": 2202} {"train_loss": -8.320484161376953, "global_step": 370068, "epoch": 2202} {"train_loss": -10.335153579711914, "global_step": 370069, "epoch": 2202} {"train_loss": -9.57776927947998, "global_step": 370070, "epoch": 2202} {"train_loss": -10.030282974243164, "global_step": 370071, "epoch": 2202} {"train_loss": -10.00245189666748, "global_step": 370072, "epoch": 2202} {"train_loss": -10.111238479614258, "global_step": 370073, "epoch": 2202} {"train_loss": -10.191707611083984, "global_step": 370074, "epoch": 2202} {"train_loss": -9.94357681274414, "global_step": 370075, "epoch": 2202} {"train_loss": -9.596343994140625, "global_step": 370076, "epoch": 2202} {"train_loss": -11.279359817504883, "global_step": 370077, "epoch": 2202} {"train_loss": -10.130821228027344, "global_step": 370078, "epoch": 2202} {"train_loss": -10.814708709716797, "global_step": 370079, "epoch": 2202} {"train_loss": -10.001228332519531, "global_step": 370080, "epoch": 2202} {"train_loss": -10.540643692016602, "global_step": 370081, "epoch": 2202} {"train_loss": -9.230428695678711, "global_step": 370082, "epoch": 2202} {"train_loss": -11.305140495300293, "global_step": 370083, "epoch": 2202} {"train_loss": -8.98366928100586, "global_step": 370084, "epoch": 2202} {"train_loss": -9.941741943359375, "global_step": 370085, "epoch": 2202} {"train_loss": -9.588497161865234, "global_step": 370086, "epoch": 2202} {"train_loss": -9.596153259277344, "global_step": 370087, "epoch": 2202} {"train_loss": -9.789560317993164, "global_step": 370088, "epoch": 2202} {"train_loss": -11.01363468170166, "global_step": 370089, "epoch": 2202} {"train_loss": -10.218860626220703, "global_step": 370090, "epoch": 2202} {"train_loss": -10.960073471069336, "global_step": 370091, "epoch": 2202} {"train_loss": -11.064462661743164, "global_step": 370092, "epoch": 2202} {"train_loss": -9.716482162475586, "global_step": 370093, "epoch": 2202} {"train_loss": -11.226198196411133, "global_step": 370094, "epoch": 2202} {"train_loss": -10.775731086730957, "global_step": 370095, "epoch": 2202} {"train_loss": -10.671337127685547, "global_step": 370096, "epoch": 2202} {"train_loss": -11.076616287231445, "global_step": 370097, "epoch": 2202} {"train_loss": -10.556745529174805, "global_step": 370098, "epoch": 2202} {"train_loss": -11.115215301513672, "global_step": 370099, "epoch": 2202} {"train_loss": -11.536252975463867, "global_step": 370100, "epoch": 2202} {"train_loss": -10.980203628540039, "global_step": 370101, "epoch": 2202} {"train_loss": -11.033254623413086, "global_step": 370102, "epoch": 2202} {"train_loss": -11.750690874599275, "global_step": 370103, "epoch": 2202, "val_loss": 296436.46875} {"train_loss": -11.37961196899414, "global_step": 370104, "epoch": 2203} {"train_loss": -11.114938735961914, "global_step": 370105, "epoch": 2203} {"train_loss": -11.269807815551758, "global_step": 370106, "epoch": 2203} {"train_loss": -10.603130340576172, "global_step": 370107, "epoch": 2203} {"train_loss": -11.696678161621094, "global_step": 370108, "epoch": 2203} {"train_loss": -11.288039207458496, "global_step": 370109, "epoch": 2203} {"train_loss": -11.460111618041992, "global_step": 370110, "epoch": 2203} {"train_loss": -11.635961532592773, "global_step": 370111, "epoch": 2203} {"train_loss": -11.244155883789062, "global_step": 370112, "epoch": 2203} {"train_loss": -11.532732009887695, "global_step": 370113, "epoch": 2203} {"train_loss": -11.8345308303833, "global_step": 370114, "epoch": 2203} {"train_loss": -11.664201736450195, "global_step": 370115, "epoch": 2203} {"train_loss": -11.571921348571777, "global_step": 370116, "epoch": 2203} {"train_loss": -11.84077262878418, "global_step": 370117, "epoch": 2203} {"train_loss": -11.844447135925293, "global_step": 370118, "epoch": 2203} {"train_loss": -11.749347686767578, "global_step": 370119, "epoch": 2203} {"train_loss": -11.833107948303223, "global_step": 370120, "epoch": 2203} {"train_loss": -11.422225952148438, "global_step": 370121, "epoch": 2203} {"train_loss": -11.618349075317383, "global_step": 370122, "epoch": 2203} {"train_loss": -11.292587280273438, "global_step": 370123, "epoch": 2203} {"train_loss": -11.503507614135742, "global_step": 370124, "epoch": 2203} {"train_loss": -11.206953048706055, "global_step": 370125, "epoch": 2203} {"train_loss": -11.744634628295898, "global_step": 370126, "epoch": 2203} {"train_loss": -11.609968185424805, "global_step": 370127, "epoch": 2203} {"train_loss": -12.029437065124512, "global_step": 370128, "epoch": 2203} {"train_loss": -11.606651306152344, "global_step": 370129, "epoch": 2203} {"train_loss": -12.029634475708008, "global_step": 370130, "epoch": 2203} {"train_loss": -11.81281852722168, "global_step": 370131, "epoch": 2203} {"train_loss": -11.5255708694458, "global_step": 370132, "epoch": 2203} {"train_loss": -12.070721626281738, "global_step": 370133, "epoch": 2203} {"train_loss": -11.781639099121094, "global_step": 370134, "epoch": 2203} {"train_loss": -11.876882553100586, "global_step": 370135, "epoch": 2203} {"train_loss": -11.770671844482422, "global_step": 370136, "epoch": 2203} {"train_loss": -11.720970153808594, "global_step": 370137, "epoch": 2203} {"train_loss": -12.162528991699219, "global_step": 370138, "epoch": 2203} {"train_loss": -11.856861114501953, "global_step": 370139, "epoch": 2203} {"train_loss": -11.728671073913574, "global_step": 370140, "epoch": 2203} {"train_loss": -11.837533950805664, "global_step": 370141, "epoch": 2203} {"train_loss": -11.810264587402344, "global_step": 370142, "epoch": 2203} {"train_loss": -11.832300186157227, "global_step": 370143, "epoch": 2203} {"train_loss": -11.920499801635742, "global_step": 370144, "epoch": 2203} {"train_loss": -12.181876182556152, "global_step": 370145, "epoch": 2203} {"train_loss": -11.83913803100586, "global_step": 370146, "epoch": 2203} {"train_loss": -12.099773406982422, "global_step": 370147, "epoch": 2203} {"train_loss": -11.945211410522461, "global_step": 370148, "epoch": 2203} {"train_loss": -12.297468185424805, "global_step": 370149, "epoch": 2203} {"train_loss": -12.267386436462402, "global_step": 370150, "epoch": 2203} {"train_loss": -12.22229290008545, "global_step": 370151, "epoch": 2203} {"train_loss": -12.355823516845703, "global_step": 370152, "epoch": 2203} {"train_loss": -12.162253379821777, "global_step": 370153, "epoch": 2203} {"train_loss": -12.326337814331055, "global_step": 370154, "epoch": 2203} {"train_loss": -12.299568176269531, "global_step": 370155, "epoch": 2203} {"train_loss": -12.28868293762207, "global_step": 370156, "epoch": 2203} {"train_loss": -12.351783752441406, "global_step": 370157, "epoch": 2203} {"train_loss": -11.91897201538086, "global_step": 370158, "epoch": 2203} {"train_loss": -12.293478012084961, "global_step": 370159, "epoch": 2203} {"train_loss": -12.058405876159668, "global_step": 370160, "epoch": 2203} {"train_loss": -12.071599006652832, "global_step": 370161, "epoch": 2203} {"train_loss": -12.372757911682129, "global_step": 370162, "epoch": 2203} {"train_loss": -12.327810287475586, "global_step": 370163, "epoch": 2203} {"train_loss": -12.429113388061523, "global_step": 370164, "epoch": 2203} {"train_loss": -12.501033782958984, "global_step": 370165, "epoch": 2203} {"train_loss": -12.200950622558594, "global_step": 370166, "epoch": 2203} {"train_loss": -12.174753189086914, "global_step": 370167, "epoch": 2203} {"train_loss": -12.530909538269043, "global_step": 370168, "epoch": 2203} {"train_loss": -12.321822166442871, "global_step": 370169, "epoch": 2203} {"train_loss": -12.327733039855957, "global_step": 370170, "epoch": 2203} {"train_loss": -12.60135269165039, "global_step": 370171, "epoch": 2203} {"train_loss": -11.947282791137695, "global_step": 370172, "epoch": 2203} {"train_loss": -12.346866607666016, "global_step": 370173, "epoch": 2203} {"train_loss": -12.463186264038086, "global_step": 370174, "epoch": 2203} {"train_loss": -12.473587036132812, "global_step": 370175, "epoch": 2203} {"train_loss": -12.448972702026367, "global_step": 370176, "epoch": 2203} {"train_loss": -12.474960327148438, "global_step": 370177, "epoch": 2203} {"train_loss": -12.25111198425293, "global_step": 370178, "epoch": 2203} {"train_loss": -12.273978233337402, "global_step": 370179, "epoch": 2203} {"train_loss": -12.578954696655273, "global_step": 370180, "epoch": 2203} {"train_loss": -12.48032283782959, "global_step": 370181, "epoch": 2203} {"train_loss": -12.46718978881836, "global_step": 370182, "epoch": 2203} {"train_loss": -12.170391082763672, "global_step": 370183, "epoch": 2203} {"train_loss": -12.454818725585938, "global_step": 370184, "epoch": 2203} {"train_loss": -12.480266571044922, "global_step": 370185, "epoch": 2203} {"train_loss": -12.777948379516602, "global_step": 370186, "epoch": 2203} {"train_loss": -12.291683197021484, "global_step": 370187, "epoch": 2203} {"train_loss": -12.47412109375, "global_step": 370188, "epoch": 2203} {"train_loss": -12.412107467651367, "global_step": 370189, "epoch": 2203} {"train_loss": -12.506816864013672, "global_step": 370190, "epoch": 2203} {"train_loss": -12.354469299316406, "global_step": 370191, "epoch": 2203} {"train_loss": -12.597153663635254, "global_step": 370192, "epoch": 2203} {"train_loss": -12.45267105102539, "global_step": 370193, "epoch": 2203} {"train_loss": -12.54031753540039, "global_step": 370194, "epoch": 2203} {"train_loss": -12.6826171875, "global_step": 370195, "epoch": 2203} {"train_loss": -12.792810440063477, "global_step": 370196, "epoch": 2203} {"train_loss": -12.601228713989258, "global_step": 370197, "epoch": 2203} {"train_loss": -12.451492309570312, "global_step": 370198, "epoch": 2203} {"train_loss": -12.415834426879883, "global_step": 370199, "epoch": 2203} {"train_loss": -12.369068145751953, "global_step": 370200, "epoch": 2203} {"train_loss": -11.82805061340332, "global_step": 370201, "epoch": 2203} {"train_loss": -12.383540153503418, "global_step": 370202, "epoch": 2203} {"train_loss": -12.051116943359375, "global_step": 370203, "epoch": 2203} {"train_loss": -10.742109298706055, "global_step": 370204, "epoch": 2203} {"train_loss": -12.272701263427734, "global_step": 370205, "epoch": 2203} {"train_loss": -12.252429962158203, "global_step": 370206, "epoch": 2203} {"train_loss": -11.38891315460205, "global_step": 370207, "epoch": 2203} {"train_loss": -11.771374702453613, "global_step": 370208, "epoch": 2203} {"train_loss": -12.3391752243042, "global_step": 370209, "epoch": 2203} {"train_loss": -12.309700012207031, "global_step": 370210, "epoch": 2203} {"train_loss": -11.813924789428711, "global_step": 370211, "epoch": 2203} {"train_loss": -12.176372528076172, "global_step": 370212, "epoch": 2203} {"train_loss": -12.360994338989258, "global_step": 370213, "epoch": 2203} {"train_loss": -12.517226219177246, "global_step": 370214, "epoch": 2203} {"train_loss": -12.423280715942383, "global_step": 370215, "epoch": 2203} {"train_loss": -12.40817642211914, "global_step": 370216, "epoch": 2203} {"train_loss": -12.310813903808594, "global_step": 370217, "epoch": 2203} {"train_loss": -12.241312026977539, "global_step": 370218, "epoch": 2203} {"train_loss": -12.496084213256836, "global_step": 370219, "epoch": 2203} {"train_loss": -12.48338508605957, "global_step": 370220, "epoch": 2203} {"train_loss": -12.344087600708008, "global_step": 370221, "epoch": 2203} {"train_loss": -12.332754135131836, "global_step": 370222, "epoch": 2203} {"train_loss": -12.556276321411133, "global_step": 370223, "epoch": 2203} {"train_loss": -12.640215873718262, "global_step": 370224, "epoch": 2203} {"train_loss": -12.390058517456055, "global_step": 370225, "epoch": 2203} {"train_loss": -12.021639823913574, "global_step": 370226, "epoch": 2203} {"train_loss": -12.292816162109375, "global_step": 370227, "epoch": 2203} {"train_loss": -12.482603073120117, "global_step": 370228, "epoch": 2203} {"train_loss": -12.04922866821289, "global_step": 370229, "epoch": 2203} {"train_loss": -12.361408233642578, "global_step": 370230, "epoch": 2203} {"train_loss": -12.347354888916016, "global_step": 370231, "epoch": 2203} {"train_loss": -12.196330070495605, "global_step": 370232, "epoch": 2203} {"train_loss": -11.202446937561035, "global_step": 370233, "epoch": 2203} {"train_loss": -11.5213623046875, "global_step": 370234, "epoch": 2203} {"train_loss": -11.78209400177002, "global_step": 370235, "epoch": 2203} {"train_loss": -11.674821853637695, "global_step": 370236, "epoch": 2203} {"train_loss": -11.451765060424805, "global_step": 370237, "epoch": 2203} {"train_loss": -12.034187316894531, "global_step": 370238, "epoch": 2203} {"train_loss": -11.670005798339844, "global_step": 370239, "epoch": 2203} {"train_loss": -10.281797409057617, "global_step": 370240, "epoch": 2203} {"train_loss": -11.716293334960938, "global_step": 370241, "epoch": 2203} {"train_loss": -11.996267318725586, "global_step": 370242, "epoch": 2203} {"train_loss": -11.202159881591797, "global_step": 370243, "epoch": 2203} {"train_loss": -11.912964820861816, "global_step": 370244, "epoch": 2203} {"train_loss": -11.867912292480469, "global_step": 370245, "epoch": 2203} {"train_loss": -11.519275665283203, "global_step": 370246, "epoch": 2203} {"train_loss": -12.194615364074707, "global_step": 370247, "epoch": 2203} {"train_loss": -10.01897144317627, "global_step": 370248, "epoch": 2203} {"train_loss": -10.992536544799805, "global_step": 370249, "epoch": 2203} {"train_loss": -11.639568328857422, "global_step": 370250, "epoch": 2203} {"train_loss": -11.374656677246094, "global_step": 370251, "epoch": 2203} {"train_loss": -10.639248847961426, "global_step": 370252, "epoch": 2203} {"train_loss": -11.201736450195312, "global_step": 370253, "epoch": 2203} {"train_loss": -10.899520874023438, "global_step": 370254, "epoch": 2203} {"train_loss": -11.040776252746582, "global_step": 370255, "epoch": 2203} {"train_loss": -9.59926986694336, "global_step": 370256, "epoch": 2203} {"train_loss": -9.535418510437012, "global_step": 370257, "epoch": 2203} {"train_loss": -10.916971206665039, "global_step": 370258, "epoch": 2203} {"train_loss": -10.748889923095703, "global_step": 370259, "epoch": 2203} {"train_loss": -10.360605239868164, "global_step": 370260, "epoch": 2203} {"train_loss": -11.721044540405273, "global_step": 370261, "epoch": 2203} {"train_loss": -10.205303192138672, "global_step": 370262, "epoch": 2203} {"train_loss": -10.555183410644531, "global_step": 370263, "epoch": 2203} {"train_loss": -11.203532218933105, "global_step": 370264, "epoch": 2203} {"train_loss": -11.205421447753906, "global_step": 370265, "epoch": 2203} {"train_loss": -10.790847778320312, "global_step": 370266, "epoch": 2203} {"train_loss": -11.153603553771973, "global_step": 370267, "epoch": 2203} {"train_loss": -10.380582809448242, "global_step": 370268, "epoch": 2203} {"train_loss": -11.056746482849121, "global_step": 370269, "epoch": 2203} {"train_loss": -11.467001914978027, "global_step": 370270, "epoch": 2203} {"train_loss": -11.868287557647342, "global_step": 370271, "epoch": 2203, "val_loss": 292558.3125} {"train_loss": -11.626928329467773, "global_step": 370272, "epoch": 2204} {"train_loss": -11.742603302001953, "global_step": 370273, "epoch": 2204} {"train_loss": -11.726552963256836, "global_step": 370274, "epoch": 2204} {"train_loss": -11.536922454833984, "global_step": 370275, "epoch": 2204} {"train_loss": -11.299989700317383, "global_step": 370276, "epoch": 2204} {"train_loss": -11.73554515838623, "global_step": 370277, "epoch": 2204} {"train_loss": -11.087934494018555, "global_step": 370278, "epoch": 2204} {"train_loss": -11.774005889892578, "global_step": 370279, "epoch": 2204} {"train_loss": -11.628771781921387, "global_step": 370280, "epoch": 2204} {"train_loss": -11.365947723388672, "global_step": 370281, "epoch": 2204} {"train_loss": -11.27907943725586, "global_step": 370282, "epoch": 2204} {"train_loss": -12.004377365112305, "global_step": 370283, "epoch": 2204} {"train_loss": -10.815683364868164, "global_step": 370284, "epoch": 2204} {"train_loss": -11.90462875366211, "global_step": 370285, "epoch": 2204} {"train_loss": -11.02817153930664, "global_step": 370286, "epoch": 2204} {"train_loss": -11.759387969970703, "global_step": 370287, "epoch": 2204} {"train_loss": -10.95734977722168, "global_step": 370288, "epoch": 2204} {"train_loss": -11.34926986694336, "global_step": 370289, "epoch": 2204} {"train_loss": -11.303607940673828, "global_step": 370290, "epoch": 2204} {"train_loss": -10.559127807617188, "global_step": 370291, "epoch": 2204} {"train_loss": -11.596661567687988, "global_step": 370292, "epoch": 2204} {"train_loss": -10.671971321105957, "global_step": 370293, "epoch": 2204} {"train_loss": -11.449731826782227, "global_step": 370294, "epoch": 2204} {"train_loss": -11.327917098999023, "global_step": 370295, "epoch": 2204} {"train_loss": -11.619256019592285, "global_step": 370296, "epoch": 2204} {"train_loss": -11.028800964355469, "global_step": 370297, "epoch": 2204} {"train_loss": -12.141949653625488, "global_step": 370298, "epoch": 2204} {"train_loss": -11.075937271118164, "global_step": 370299, "epoch": 2204} {"train_loss": -11.507795333862305, "global_step": 370300, "epoch": 2204} {"train_loss": -11.431133270263672, "global_step": 370301, "epoch": 2204} {"train_loss": -11.766815185546875, "global_step": 370302, "epoch": 2204} {"train_loss": -10.81533432006836, "global_step": 370303, "epoch": 2204} {"train_loss": -12.105913162231445, "global_step": 370304, "epoch": 2204} {"train_loss": -10.85423469543457, "global_step": 370305, "epoch": 2204} {"train_loss": -11.812685012817383, "global_step": 370306, "epoch": 2204} {"train_loss": -11.140579223632812, "global_step": 370307, "epoch": 2204} {"train_loss": -11.549894332885742, "global_step": 370308, "epoch": 2204} {"train_loss": -11.708988189697266, "global_step": 370309, "epoch": 2204} {"train_loss": -11.642942428588867, "global_step": 370310, "epoch": 2204} {"train_loss": -11.658304214477539, "global_step": 370311, "epoch": 2204} {"train_loss": -12.116679191589355, "global_step": 370312, "epoch": 2204} {"train_loss": -11.893566131591797, "global_step": 370313, "epoch": 2204} {"train_loss": -11.713553428649902, "global_step": 370314, "epoch": 2204} {"train_loss": -12.264549255371094, "global_step": 370315, "epoch": 2204} {"train_loss": -11.674760818481445, "global_step": 370316, "epoch": 2204} {"train_loss": -12.073408126831055, "global_step": 370317, "epoch": 2204} {"train_loss": -11.753057479858398, "global_step": 370318, "epoch": 2204} {"train_loss": -11.804176330566406, "global_step": 370319, "epoch": 2204} {"train_loss": -11.741844177246094, "global_step": 370320, "epoch": 2204} {"train_loss": -11.698936462402344, "global_step": 370321, "epoch": 2204} {"train_loss": -11.945221900939941, "global_step": 370322, "epoch": 2204} {"train_loss": -11.641233444213867, "global_step": 370323, "epoch": 2204} {"train_loss": -12.38672924041748, "global_step": 370324, "epoch": 2204} {"train_loss": -11.915374755859375, "global_step": 370325, "epoch": 2204} {"train_loss": -12.123750686645508, "global_step": 370326, "epoch": 2204} {"train_loss": -12.00743293762207, "global_step": 370327, "epoch": 2204} {"train_loss": -11.82937240600586, "global_step": 370328, "epoch": 2204} {"train_loss": -12.010671615600586, "global_step": 370329, "epoch": 2204} {"train_loss": -11.572299003601074, "global_step": 370330, "epoch": 2204} {"train_loss": -11.466924667358398, "global_step": 370331, "epoch": 2204} {"train_loss": -11.971145629882812, "global_step": 370332, "epoch": 2204} {"train_loss": -11.552716255187988, "global_step": 370333, "epoch": 2204} {"train_loss": -12.240222930908203, "global_step": 370334, "epoch": 2204} {"train_loss": -11.45133113861084, "global_step": 370335, "epoch": 2204} {"train_loss": -11.777369499206543, "global_step": 370336, "epoch": 2204} {"train_loss": -12.261189460754395, "global_step": 370337, "epoch": 2204} {"train_loss": -11.79086685180664, "global_step": 370338, "epoch": 2204} {"train_loss": -12.093255996704102, "global_step": 370339, "epoch": 2204} {"train_loss": -11.7483549118042, "global_step": 370340, "epoch": 2204} {"train_loss": -11.602725982666016, "global_step": 370341, "epoch": 2204} {"train_loss": -12.293004989624023, "global_step": 370342, "epoch": 2204} {"train_loss": -11.995031356811523, "global_step": 370343, "epoch": 2204} {"train_loss": -12.36408805847168, "global_step": 370344, "epoch": 2204} {"train_loss": -12.559045791625977, "global_step": 370345, "epoch": 2204} {"train_loss": -12.05076789855957, "global_step": 370346, "epoch": 2204} {"train_loss": -12.277848243713379, "global_step": 370347, "epoch": 2204} {"train_loss": -12.309537887573242, "global_step": 370348, "epoch": 2204} {"train_loss": -12.430412292480469, "global_step": 370349, "epoch": 2204} {"train_loss": -12.36030387878418, "global_step": 370350, "epoch": 2204} {"train_loss": -12.239550590515137, "global_step": 370351, "epoch": 2204} {"train_loss": -12.415901184082031, "global_step": 370352, "epoch": 2204} {"train_loss": -12.241080284118652, "global_step": 370353, "epoch": 2204} {"train_loss": -12.405071258544922, "global_step": 370354, "epoch": 2204} {"train_loss": -12.27730941772461, "global_step": 370355, "epoch": 2204} {"train_loss": -12.304130554199219, "global_step": 370356, "epoch": 2204} {"train_loss": -12.571426391601562, "global_step": 370357, "epoch": 2204} {"train_loss": -12.443766593933105, "global_step": 370358, "epoch": 2204} {"train_loss": -12.587657928466797, "global_step": 370359, "epoch": 2204} {"train_loss": -12.253849983215332, "global_step": 370360, "epoch": 2204} {"train_loss": -12.485621452331543, "global_step": 370361, "epoch": 2204} {"train_loss": -12.020771026611328, "global_step": 370362, "epoch": 2204} {"train_loss": -12.38733959197998, "global_step": 370363, "epoch": 2204} {"train_loss": -12.373153686523438, "global_step": 370364, "epoch": 2204} {"train_loss": -12.007524490356445, "global_step": 370365, "epoch": 2204} {"train_loss": -12.701498985290527, "global_step": 370366, "epoch": 2204} {"train_loss": -12.158060073852539, "global_step": 370367, "epoch": 2204} {"train_loss": -12.575199127197266, "global_step": 370368, "epoch": 2204} {"train_loss": -12.414793968200684, "global_step": 370369, "epoch": 2204} {"train_loss": -12.70352554321289, "global_step": 370370, "epoch": 2204} {"train_loss": -12.645769119262695, "global_step": 370371, "epoch": 2204} {"train_loss": -12.453588485717773, "global_step": 370372, "epoch": 2204} {"train_loss": -12.542190551757812, "global_step": 370373, "epoch": 2204} {"train_loss": -12.538787841796875, "global_step": 370374, "epoch": 2204} {"train_loss": -12.36904525756836, "global_step": 370375, "epoch": 2204} {"train_loss": -12.351213455200195, "global_step": 370376, "epoch": 2204} {"train_loss": -12.297578811645508, "global_step": 370377, "epoch": 2204} {"train_loss": -12.42836856842041, "global_step": 370378, "epoch": 2204} {"train_loss": -12.618300437927246, "global_step": 370379, "epoch": 2204} {"train_loss": -12.400504112243652, "global_step": 370380, "epoch": 2204} {"train_loss": -12.123579978942871, "global_step": 370381, "epoch": 2204} {"train_loss": -12.646122932434082, "global_step": 370382, "epoch": 2204} {"train_loss": -12.358734130859375, "global_step": 370383, "epoch": 2204} {"train_loss": -12.586986541748047, "global_step": 370384, "epoch": 2204} {"train_loss": -12.549909591674805, "global_step": 370385, "epoch": 2204} {"train_loss": -12.378432273864746, "global_step": 370386, "epoch": 2204} {"train_loss": -12.600997924804688, "global_step": 370387, "epoch": 2204} {"train_loss": -12.254541397094727, "global_step": 370388, "epoch": 2204} {"train_loss": -12.214277267456055, "global_step": 370389, "epoch": 2204} {"train_loss": -12.654438018798828, "global_step": 370390, "epoch": 2204} {"train_loss": -12.449259757995605, "global_step": 370391, "epoch": 2204} {"train_loss": -12.5746488571167, "global_step": 370392, "epoch": 2204} {"train_loss": -12.6292724609375, "global_step": 370393, "epoch": 2204} {"train_loss": -12.579636573791504, "global_step": 370394, "epoch": 2204} {"train_loss": -12.375229835510254, "global_step": 370395, "epoch": 2204} {"train_loss": -12.468465805053711, "global_step": 370396, "epoch": 2204} {"train_loss": -12.414369583129883, "global_step": 370397, "epoch": 2204} {"train_loss": -12.361417770385742, "global_step": 370398, "epoch": 2204} {"train_loss": -12.537446975708008, "global_step": 370399, "epoch": 2204} {"train_loss": -12.27341079711914, "global_step": 370400, "epoch": 2204} {"train_loss": -12.37474536895752, "global_step": 370401, "epoch": 2204} {"train_loss": -12.38131332397461, "global_step": 370402, "epoch": 2204} {"train_loss": -12.462725639343262, "global_step": 370403, "epoch": 2204} {"train_loss": -12.301986694335938, "global_step": 370404, "epoch": 2204} {"train_loss": -12.193949699401855, "global_step": 370405, "epoch": 2204} {"train_loss": -12.364649772644043, "global_step": 370406, "epoch": 2204} {"train_loss": -11.393482208251953, "global_step": 370407, "epoch": 2204} {"train_loss": -12.053716659545898, "global_step": 370408, "epoch": 2204} {"train_loss": -12.251823425292969, "global_step": 370409, "epoch": 2204} {"train_loss": -12.226288795471191, "global_step": 370410, "epoch": 2204} {"train_loss": -12.243539810180664, "global_step": 370411, "epoch": 2204} {"train_loss": -12.448400497436523, "global_step": 370412, "epoch": 2204} {"train_loss": -12.366137504577637, "global_step": 370413, "epoch": 2204} {"train_loss": -12.63672161102295, "global_step": 370414, "epoch": 2204} {"train_loss": -12.568490028381348, "global_step": 370415, "epoch": 2204} {"train_loss": -12.395259857177734, "global_step": 370416, "epoch": 2204} {"train_loss": -12.308332443237305, "global_step": 370417, "epoch": 2204} {"train_loss": -12.407800674438477, "global_step": 370418, "epoch": 2204} {"train_loss": -12.472114562988281, "global_step": 370419, "epoch": 2204} {"train_loss": -12.482369422912598, "global_step": 370420, "epoch": 2204} {"train_loss": -12.48115348815918, "global_step": 370421, "epoch": 2204} {"train_loss": -12.669958114624023, "global_step": 370422, "epoch": 2204} {"train_loss": -12.125307083129883, "global_step": 370423, "epoch": 2204} {"train_loss": -12.579062461853027, "global_step": 370424, "epoch": 2204} {"train_loss": -12.479777336120605, "global_step": 370425, "epoch": 2204} {"train_loss": -12.050783157348633, "global_step": 370426, "epoch": 2204} {"train_loss": -11.597807884216309, "global_step": 370427, "epoch": 2204} {"train_loss": -12.249994277954102, "global_step": 370428, "epoch": 2204} {"train_loss": -12.082696914672852, "global_step": 370429, "epoch": 2204} {"train_loss": -12.470322608947754, "global_step": 370430, "epoch": 2204} {"train_loss": -11.749770164489746, "global_step": 370431, "epoch": 2204} {"train_loss": -11.357219696044922, "global_step": 370432, "epoch": 2204} {"train_loss": -10.662095069885254, "global_step": 370433, "epoch": 2204} {"train_loss": -10.619335174560547, "global_step": 370434, "epoch": 2204} {"train_loss": -8.509729385375977, "global_step": 370435, "epoch": 2204} {"train_loss": -10.299371719360352, "global_step": 370436, "epoch": 2204} {"train_loss": -9.561067581176758, "global_step": 370437, "epoch": 2204} {"train_loss": -7.7317047119140625, "global_step": 370438, "epoch": 2204} {"train_loss": -11.917698522408804, "global_step": 370439, "epoch": 2204, "val_loss": 291822.03125} {"train_loss": -7.177955150604248, "global_step": 370440, "epoch": 2205} {"train_loss": -7.049936294555664, "global_step": 370441, "epoch": 2205} {"train_loss": -7.352456569671631, "global_step": 370442, "epoch": 2205} {"train_loss": -7.32820463180542, "global_step": 370443, "epoch": 2205} {"train_loss": -7.8851447105407715, "global_step": 370444, "epoch": 2205} {"train_loss": -7.761709213256836, "global_step": 370445, "epoch": 2205} {"train_loss": -8.461334228515625, "global_step": 370446, "epoch": 2205} {"train_loss": -8.41034984588623, "global_step": 370447, "epoch": 2205} {"train_loss": -8.105363845825195, "global_step": 370448, "epoch": 2205} {"train_loss": -7.7019453048706055, "global_step": 370449, "epoch": 2205} {"train_loss": -8.515350341796875, "global_step": 370450, "epoch": 2205} {"train_loss": -8.403494834899902, "global_step": 370451, "epoch": 2205} {"train_loss": -9.007827758789062, "global_step": 370452, "epoch": 2205} {"train_loss": -9.641572952270508, "global_step": 370453, "epoch": 2205} {"train_loss": -9.917526245117188, "global_step": 370454, "epoch": 2205} {"train_loss": -10.03679084777832, "global_step": 370455, "epoch": 2205} {"train_loss": -10.540841102600098, "global_step": 370456, "epoch": 2205} {"train_loss": -11.33781623840332, "global_step": 370457, "epoch": 2205} {"train_loss": -10.80315113067627, "global_step": 370458, "epoch": 2205} {"train_loss": -10.878019332885742, "global_step": 370459, "epoch": 2205} {"train_loss": -10.289417266845703, "global_step": 370460, "epoch": 2205} {"train_loss": -10.696470260620117, "global_step": 370461, "epoch": 2205} {"train_loss": -10.998778343200684, "global_step": 370462, "epoch": 2205} {"train_loss": -11.24416732788086, "global_step": 370463, "epoch": 2205} {"train_loss": -11.124748229980469, "global_step": 370464, "epoch": 2205} {"train_loss": -11.827171325683594, "global_step": 370465, "epoch": 2205} {"train_loss": -11.316539764404297, "global_step": 370466, "epoch": 2205} {"train_loss": -11.595094680786133, "global_step": 370467, "epoch": 2205} {"train_loss": -11.765018463134766, "global_step": 370468, "epoch": 2205} {"train_loss": -11.064804077148438, "global_step": 370469, "epoch": 2205} {"train_loss": -11.288385391235352, "global_step": 370470, "epoch": 2205} {"train_loss": -11.561863899230957, "global_step": 370471, "epoch": 2205} {"train_loss": -11.130083084106445, "global_step": 370472, "epoch": 2205} {"train_loss": -11.078070640563965, "global_step": 370473, "epoch": 2205} {"train_loss": -11.434496879577637, "global_step": 370474, "epoch": 2205} {"train_loss": -11.33706283569336, "global_step": 370475, "epoch": 2205} {"train_loss": -11.39777946472168, "global_step": 370476, "epoch": 2205} {"train_loss": -11.166464805603027, "global_step": 370477, "epoch": 2205} {"train_loss": -11.789083480834961, "global_step": 370478, "epoch": 2205} {"train_loss": -11.614927291870117, "global_step": 370479, "epoch": 2205} {"train_loss": -11.771484375, "global_step": 370480, "epoch": 2205} {"train_loss": -11.963459968566895, "global_step": 370481, "epoch": 2205} {"train_loss": -11.433027267456055, "global_step": 370482, "epoch": 2205} {"train_loss": -12.059489250183105, "global_step": 370483, "epoch": 2205} {"train_loss": -11.643625259399414, "global_step": 370484, "epoch": 2205} {"train_loss": -11.71306324005127, "global_step": 370485, "epoch": 2205} {"train_loss": -12.050861358642578, "global_step": 370486, "epoch": 2205} {"train_loss": -11.670816421508789, "global_step": 370487, "epoch": 2205} {"train_loss": -12.033916473388672, "global_step": 370488, "epoch": 2205} {"train_loss": -11.799869537353516, "global_step": 370489, "epoch": 2205} {"train_loss": -12.111665725708008, "global_step": 370490, "epoch": 2205} {"train_loss": -12.077447891235352, "global_step": 370491, "epoch": 2205} {"train_loss": -12.165365219116211, "global_step": 370492, "epoch": 2205} {"train_loss": -12.12620735168457, "global_step": 370493, "epoch": 2205} {"train_loss": -12.184646606445312, "global_step": 370494, "epoch": 2205} {"train_loss": -11.851312637329102, "global_step": 370495, "epoch": 2205} {"train_loss": -12.115692138671875, "global_step": 370496, "epoch": 2205} {"train_loss": -11.927019119262695, "global_step": 370497, "epoch": 2205} {"train_loss": -11.867422103881836, "global_step": 370498, "epoch": 2205} {"train_loss": -12.26231861114502, "global_step": 370499, "epoch": 2205} {"train_loss": -11.529767990112305, "global_step": 370500, "epoch": 2205} {"train_loss": -12.093311309814453, "global_step": 370501, "epoch": 2205} {"train_loss": -11.923381805419922, "global_step": 370502, "epoch": 2205} {"train_loss": -12.010250091552734, "global_step": 370503, "epoch": 2205} {"train_loss": -12.275630950927734, "global_step": 370504, "epoch": 2205} {"train_loss": -11.69758415222168, "global_step": 370505, "epoch": 2205} {"train_loss": -12.312809944152832, "global_step": 370506, "epoch": 2205} {"train_loss": -11.90283489227295, "global_step": 370507, "epoch": 2205} {"train_loss": -12.179044723510742, "global_step": 370508, "epoch": 2205} {"train_loss": -12.173534393310547, "global_step": 370509, "epoch": 2205} {"train_loss": -12.037775039672852, "global_step": 370510, "epoch": 2205} {"train_loss": -12.11652660369873, "global_step": 370511, "epoch": 2205} {"train_loss": -12.060615539550781, "global_step": 370512, "epoch": 2205} {"train_loss": -12.183735847473145, "global_step": 370513, "epoch": 2205} {"train_loss": -11.951425552368164, "global_step": 370514, "epoch": 2205} {"train_loss": -12.290367126464844, "global_step": 370515, "epoch": 2205} {"train_loss": -12.143024444580078, "global_step": 370516, "epoch": 2205} {"train_loss": -12.040533065795898, "global_step": 370517, "epoch": 2205} {"train_loss": -12.215448379516602, "global_step": 370518, "epoch": 2205} {"train_loss": -12.546506881713867, "global_step": 370519, "epoch": 2205} {"train_loss": -12.039121627807617, "global_step": 370520, "epoch": 2205} {"train_loss": -12.439115524291992, "global_step": 370521, "epoch": 2205} {"train_loss": -12.057350158691406, "global_step": 370522, "epoch": 2205} {"train_loss": -12.083284378051758, "global_step": 370523, "epoch": 2205} {"train_loss": -12.007055282592773, "global_step": 370524, "epoch": 2205} {"train_loss": -12.366568565368652, "global_step": 370525, "epoch": 2205} {"train_loss": -12.113624572753906, "global_step": 370526, "epoch": 2205} {"train_loss": -12.28370475769043, "global_step": 370527, "epoch": 2205} {"train_loss": -12.134358406066895, "global_step": 370528, "epoch": 2205} {"train_loss": -12.43964958190918, "global_step": 370529, "epoch": 2205} {"train_loss": -12.456275939941406, "global_step": 370530, "epoch": 2205} {"train_loss": -12.377586364746094, "global_step": 370531, "epoch": 2205} {"train_loss": -12.472980499267578, "global_step": 370532, "epoch": 2205} {"train_loss": -12.298818588256836, "global_step": 370533, "epoch": 2205} {"train_loss": -12.40114974975586, "global_step": 370534, "epoch": 2205} {"train_loss": -11.954545974731445, "global_step": 370535, "epoch": 2205} {"train_loss": -12.216115951538086, "global_step": 370536, "epoch": 2205} {"train_loss": -12.319194793701172, "global_step": 370537, "epoch": 2205} {"train_loss": -12.374900817871094, "global_step": 370538, "epoch": 2205} {"train_loss": -12.295974731445312, "global_step": 370539, "epoch": 2205} {"train_loss": -11.932183265686035, "global_step": 370540, "epoch": 2205} {"train_loss": -12.768378257751465, "global_step": 370541, "epoch": 2205} {"train_loss": -12.138236999511719, "global_step": 370542, "epoch": 2205} {"train_loss": -12.612289428710938, "global_step": 370543, "epoch": 2205} {"train_loss": -12.406998634338379, "global_step": 370544, "epoch": 2205} {"train_loss": -12.349994659423828, "global_step": 370545, "epoch": 2205} {"train_loss": -12.255108833312988, "global_step": 370546, "epoch": 2205} {"train_loss": -11.836153030395508, "global_step": 370547, "epoch": 2205} {"train_loss": -12.060924530029297, "global_step": 370548, "epoch": 2205} {"train_loss": -10.996408462524414, "global_step": 370549, "epoch": 2205} {"train_loss": -12.185296058654785, "global_step": 370550, "epoch": 2205} {"train_loss": -12.280470848083496, "global_step": 370551, "epoch": 2205} {"train_loss": -12.349291801452637, "global_step": 370552, "epoch": 2205} {"train_loss": -12.277088165283203, "global_step": 370553, "epoch": 2205} {"train_loss": -12.525054931640625, "global_step": 370554, "epoch": 2205} {"train_loss": -12.383112907409668, "global_step": 370555, "epoch": 2205} {"train_loss": -12.28203296661377, "global_step": 370556, "epoch": 2205} {"train_loss": -12.201948165893555, "global_step": 370557, "epoch": 2205} {"train_loss": -12.052839279174805, "global_step": 370558, "epoch": 2205} {"train_loss": -12.435850143432617, "global_step": 370559, "epoch": 2205} {"train_loss": -11.691794395446777, "global_step": 370560, "epoch": 2205} {"train_loss": -11.962297439575195, "global_step": 370561, "epoch": 2205} {"train_loss": -12.162790298461914, "global_step": 370562, "epoch": 2205} {"train_loss": -12.086024284362793, "global_step": 370563, "epoch": 2205} {"train_loss": -11.27629566192627, "global_step": 370564, "epoch": 2205} {"train_loss": -11.917052268981934, "global_step": 370565, "epoch": 2205} {"train_loss": -11.62802791595459, "global_step": 370566, "epoch": 2205} {"train_loss": -12.270910263061523, "global_step": 370567, "epoch": 2205} {"train_loss": -10.968827247619629, "global_step": 370568, "epoch": 2205} {"train_loss": -11.753284454345703, "global_step": 370569, "epoch": 2205} {"train_loss": -9.561781883239746, "global_step": 370570, "epoch": 2205} {"train_loss": -11.781335830688477, "global_step": 370571, "epoch": 2205} {"train_loss": -10.674605369567871, "global_step": 370572, "epoch": 2205} {"train_loss": -11.816577911376953, "global_step": 370573, "epoch": 2205} {"train_loss": -11.53812026977539, "global_step": 370574, "epoch": 2205} {"train_loss": -11.00022029876709, "global_step": 370575, "epoch": 2205} {"train_loss": -11.057474136352539, "global_step": 370576, "epoch": 2205} {"train_loss": -10.607372283935547, "global_step": 370577, "epoch": 2205} {"train_loss": -11.42123794555664, "global_step": 370578, "epoch": 2205} {"train_loss": -11.514741897583008, "global_step": 370579, "epoch": 2205} {"train_loss": -11.100868225097656, "global_step": 370580, "epoch": 2205} {"train_loss": -11.332462310791016, "global_step": 370581, "epoch": 2205} {"train_loss": -10.292790412902832, "global_step": 370582, "epoch": 2205} {"train_loss": -10.76476764678955, "global_step": 370583, "epoch": 2205} {"train_loss": -9.356114387512207, "global_step": 370584, "epoch": 2205} {"train_loss": -10.50584602355957, "global_step": 370585, "epoch": 2205} {"train_loss": -10.054720878601074, "global_step": 370586, "epoch": 2205} {"train_loss": -11.352583885192871, "global_step": 370587, "epoch": 2205} {"train_loss": -9.996356964111328, "global_step": 370588, "epoch": 2205} {"train_loss": -11.576421737670898, "global_step": 370589, "epoch": 2205} {"train_loss": -10.545317649841309, "global_step": 370590, "epoch": 2205} {"train_loss": -10.705974578857422, "global_step": 370591, "epoch": 2205} {"train_loss": -10.410102844238281, "global_step": 370592, "epoch": 2205} {"train_loss": -10.814047813415527, "global_step": 370593, "epoch": 2205} {"train_loss": -11.35830307006836, "global_step": 370594, "epoch": 2205} {"train_loss": -10.880569458007812, "global_step": 370595, "epoch": 2205} {"train_loss": -11.177817344665527, "global_step": 370596, "epoch": 2205} {"train_loss": -10.460237503051758, "global_step": 370597, "epoch": 2205} {"train_loss": -11.518535614013672, "global_step": 370598, "epoch": 2205} {"train_loss": -11.0536527633667, "global_step": 370599, "epoch": 2205} {"train_loss": -11.518758773803711, "global_step": 370600, "epoch": 2205} {"train_loss": -10.845369338989258, "global_step": 370601, "epoch": 2205} {"train_loss": -11.607020378112793, "global_step": 370602, "epoch": 2205} {"train_loss": -11.01909065246582, "global_step": 370603, "epoch": 2205} {"train_loss": -11.895963668823242, "global_step": 370604, "epoch": 2205} {"train_loss": -10.900074005126953, "global_step": 370605, "epoch": 2205} {"train_loss": -11.852934837341309, "global_step": 370606, "epoch": 2205} {"train_loss": -11.351926201865787, "global_step": 370607, "epoch": 2205, "val_loss": 297533.03125, "train_action_mse_error": 1.809211015701294} {"train_loss": -11.994304656982422, "global_step": 370608, "epoch": 2206} {"train_loss": -11.712697982788086, "global_step": 370609, "epoch": 2206} {"train_loss": -12.047008514404297, "global_step": 370610, "epoch": 2206} {"train_loss": -11.61555290222168, "global_step": 370611, "epoch": 2206} {"train_loss": -12.197607040405273, "global_step": 370612, "epoch": 2206} {"train_loss": -11.92553997039795, "global_step": 370613, "epoch": 2206} {"train_loss": -11.895732879638672, "global_step": 370614, "epoch": 2206} {"train_loss": -12.120462417602539, "global_step": 370615, "epoch": 2206} {"train_loss": -11.73287582397461, "global_step": 370616, "epoch": 2206} {"train_loss": -11.745445251464844, "global_step": 370617, "epoch": 2206} {"train_loss": -11.813166618347168, "global_step": 370618, "epoch": 2206} {"train_loss": -12.004119873046875, "global_step": 370619, "epoch": 2206} {"train_loss": -12.361770629882812, "global_step": 370620, "epoch": 2206} {"train_loss": -11.800031661987305, "global_step": 370621, "epoch": 2206} {"train_loss": -11.5591402053833, "global_step": 370622, "epoch": 2206} {"train_loss": -11.904510498046875, "global_step": 370623, "epoch": 2206} {"train_loss": -11.973933219909668, "global_step": 370624, "epoch": 2206} {"train_loss": -11.952980041503906, "global_step": 370625, "epoch": 2206} {"train_loss": -11.826287269592285, "global_step": 370626, "epoch": 2206} {"train_loss": -11.994135856628418, "global_step": 370627, "epoch": 2206} {"train_loss": -11.433280944824219, "global_step": 370628, "epoch": 2206} {"train_loss": -11.695186614990234, "global_step": 370629, "epoch": 2206} {"train_loss": -12.029993057250977, "global_step": 370630, "epoch": 2206} {"train_loss": -12.060705184936523, "global_step": 370631, "epoch": 2206} {"train_loss": -11.891716003417969, "global_step": 370632, "epoch": 2206} {"train_loss": -12.450807571411133, "global_step": 370633, "epoch": 2206} {"train_loss": -11.626150131225586, "global_step": 370634, "epoch": 2206} {"train_loss": -11.948904037475586, "global_step": 370635, "epoch": 2206} {"train_loss": -11.927401542663574, "global_step": 370636, "epoch": 2206} {"train_loss": -12.27313232421875, "global_step": 370637, "epoch": 2206} {"train_loss": -11.893738746643066, "global_step": 370638, "epoch": 2206} {"train_loss": -12.187704086303711, "global_step": 370639, "epoch": 2206} {"train_loss": -12.09365463256836, "global_step": 370640, "epoch": 2206} {"train_loss": -11.849631309509277, "global_step": 370641, "epoch": 2206} {"train_loss": -12.205860137939453, "global_step": 370642, "epoch": 2206} {"train_loss": -11.831449508666992, "global_step": 370643, "epoch": 2206} {"train_loss": -11.6204252243042, "global_step": 370644, "epoch": 2206} {"train_loss": -11.917593002319336, "global_step": 370645, "epoch": 2206} {"train_loss": -12.005372047424316, "global_step": 370646, "epoch": 2206} {"train_loss": -12.241109848022461, "global_step": 370647, "epoch": 2206} {"train_loss": -12.121238708496094, "global_step": 370648, "epoch": 2206} {"train_loss": -12.360431671142578, "global_step": 370649, "epoch": 2206} {"train_loss": -12.11380386352539, "global_step": 370650, "epoch": 2206} {"train_loss": -12.019213676452637, "global_step": 370651, "epoch": 2206} {"train_loss": -12.346142768859863, "global_step": 370652, "epoch": 2206} {"train_loss": -12.233558654785156, "global_step": 370653, "epoch": 2206} {"train_loss": -11.993534088134766, "global_step": 370654, "epoch": 2206} {"train_loss": -12.377487182617188, "global_step": 370655, "epoch": 2206} {"train_loss": -12.34646224975586, "global_step": 370656, "epoch": 2206} {"train_loss": -12.624835014343262, "global_step": 370657, "epoch": 2206} {"train_loss": -12.090593338012695, "global_step": 370658, "epoch": 2206} {"train_loss": -12.125314712524414, "global_step": 370659, "epoch": 2206} {"train_loss": -12.703750610351562, "global_step": 370660, "epoch": 2206} {"train_loss": -12.299123764038086, "global_step": 370661, "epoch": 2206} {"train_loss": -12.166830062866211, "global_step": 370662, "epoch": 2206} {"train_loss": -12.49445629119873, "global_step": 370663, "epoch": 2206} {"train_loss": -12.285295486450195, "global_step": 370664, "epoch": 2206} {"train_loss": -12.515281677246094, "global_step": 370665, "epoch": 2206} {"train_loss": -12.204666137695312, "global_step": 370666, "epoch": 2206} {"train_loss": -12.289422035217285, "global_step": 370667, "epoch": 2206} {"train_loss": -11.868082046508789, "global_step": 370668, "epoch": 2206} {"train_loss": -12.504988670349121, "global_step": 370669, "epoch": 2206} {"train_loss": -12.29500961303711, "global_step": 370670, "epoch": 2206} {"train_loss": -12.36093521118164, "global_step": 370671, "epoch": 2206} {"train_loss": -12.197507858276367, "global_step": 370672, "epoch": 2206} {"train_loss": -12.131375312805176, "global_step": 370673, "epoch": 2206} {"train_loss": -12.208784103393555, "global_step": 370674, "epoch": 2206} {"train_loss": -12.097541809082031, "global_step": 370675, "epoch": 2206} {"train_loss": -12.25576400756836, "global_step": 370676, "epoch": 2206} {"train_loss": -12.323827743530273, "global_step": 370677, "epoch": 2206} {"train_loss": -12.398706436157227, "global_step": 370678, "epoch": 2206} {"train_loss": -12.365518569946289, "global_step": 370679, "epoch": 2206} {"train_loss": -12.348938941955566, "global_step": 370680, "epoch": 2206} {"train_loss": -12.27938175201416, "global_step": 370681, "epoch": 2206} {"train_loss": -12.264290809631348, "global_step": 370682, "epoch": 2206} {"train_loss": -11.904352188110352, "global_step": 370683, "epoch": 2206} {"train_loss": -11.066446304321289, "global_step": 370684, "epoch": 2206} {"train_loss": -12.013595581054688, "global_step": 370685, "epoch": 2206} {"train_loss": -11.530794143676758, "global_step": 370686, "epoch": 2206} {"train_loss": -11.624149322509766, "global_step": 370687, "epoch": 2206} {"train_loss": -12.326924324035645, "global_step": 370688, "epoch": 2206} {"train_loss": -11.934111595153809, "global_step": 370689, "epoch": 2206} {"train_loss": -12.20755672454834, "global_step": 370690, "epoch": 2206} {"train_loss": -11.989335060119629, "global_step": 370691, "epoch": 2206} {"train_loss": -12.265212059020996, "global_step": 370692, "epoch": 2206} {"train_loss": -12.412919998168945, "global_step": 370693, "epoch": 2206} {"train_loss": -11.58359432220459, "global_step": 370694, "epoch": 2206} {"train_loss": -12.16946792602539, "global_step": 370695, "epoch": 2206} {"train_loss": -11.83767032623291, "global_step": 370696, "epoch": 2206} {"train_loss": -11.93873405456543, "global_step": 370697, "epoch": 2206} {"train_loss": -11.86506175994873, "global_step": 370698, "epoch": 2206} {"train_loss": -12.044013977050781, "global_step": 370699, "epoch": 2206} {"train_loss": -12.210162162780762, "global_step": 370700, "epoch": 2206} {"train_loss": -12.259257316589355, "global_step": 370701, "epoch": 2206} {"train_loss": -12.009241104125977, "global_step": 370702, "epoch": 2206} {"train_loss": -12.093664169311523, "global_step": 370703, "epoch": 2206} {"train_loss": -12.167317390441895, "global_step": 370704, "epoch": 2206} {"train_loss": -12.43480110168457, "global_step": 370705, "epoch": 2206} {"train_loss": -12.309693336486816, "global_step": 370706, "epoch": 2206} {"train_loss": -11.750162124633789, "global_step": 370707, "epoch": 2206} {"train_loss": -12.29546070098877, "global_step": 370708, "epoch": 2206} {"train_loss": -12.177070617675781, "global_step": 370709, "epoch": 2206} {"train_loss": -12.18617057800293, "global_step": 370710, "epoch": 2206} {"train_loss": -12.618297576904297, "global_step": 370711, "epoch": 2206} {"train_loss": -12.04636287689209, "global_step": 370712, "epoch": 2206} {"train_loss": -12.331147193908691, "global_step": 370713, "epoch": 2206} {"train_loss": -11.961013793945312, "global_step": 370714, "epoch": 2206} {"train_loss": -11.006779670715332, "global_step": 370715, "epoch": 2206} {"train_loss": -12.036453247070312, "global_step": 370716, "epoch": 2206} {"train_loss": -11.49587345123291, "global_step": 370717, "epoch": 2206} {"train_loss": -11.026493072509766, "global_step": 370718, "epoch": 2206} {"train_loss": -12.282072067260742, "global_step": 370719, "epoch": 2206} {"train_loss": -11.999414443969727, "global_step": 370720, "epoch": 2206} {"train_loss": -11.983552932739258, "global_step": 370721, "epoch": 2206} {"train_loss": -11.79859733581543, "global_step": 370722, "epoch": 2206} {"train_loss": -11.781723976135254, "global_step": 370723, "epoch": 2206} {"train_loss": -12.045162200927734, "global_step": 370724, "epoch": 2206} {"train_loss": -12.314194679260254, "global_step": 370725, "epoch": 2206} {"train_loss": -11.957362174987793, "global_step": 370726, "epoch": 2206} {"train_loss": -12.397712707519531, "global_step": 370727, "epoch": 2206} {"train_loss": -12.01197338104248, "global_step": 370728, "epoch": 2206} {"train_loss": -12.294950485229492, "global_step": 370729, "epoch": 2206} {"train_loss": -12.030228614807129, "global_step": 370730, "epoch": 2206} {"train_loss": -11.887916564941406, "global_step": 370731, "epoch": 2206} {"train_loss": -11.419082641601562, "global_step": 370732, "epoch": 2206} {"train_loss": -12.164691925048828, "global_step": 370733, "epoch": 2206} {"train_loss": -12.019676208496094, "global_step": 370734, "epoch": 2206} {"train_loss": -11.708776473999023, "global_step": 370735, "epoch": 2206} {"train_loss": -11.331360816955566, "global_step": 370736, "epoch": 2206} {"train_loss": -12.081523895263672, "global_step": 370737, "epoch": 2206} {"train_loss": -11.52747631072998, "global_step": 370738, "epoch": 2206} {"train_loss": -12.006906509399414, "global_step": 370739, "epoch": 2206} {"train_loss": -12.439144134521484, "global_step": 370740, "epoch": 2206} {"train_loss": -11.417223930358887, "global_step": 370741, "epoch": 2206} {"train_loss": -11.812302589416504, "global_step": 370742, "epoch": 2206} {"train_loss": -11.953737258911133, "global_step": 370743, "epoch": 2206} {"train_loss": -11.305392265319824, "global_step": 370744, "epoch": 2206} {"train_loss": -10.920848846435547, "global_step": 370745, "epoch": 2206} {"train_loss": -11.53178882598877, "global_step": 370746, "epoch": 2206} {"train_loss": -10.970112800598145, "global_step": 370747, "epoch": 2206} {"train_loss": -10.972039222717285, "global_step": 370748, "epoch": 2206} {"train_loss": -10.981193542480469, "global_step": 370749, "epoch": 2206} {"train_loss": -10.508462905883789, "global_step": 370750, "epoch": 2206} {"train_loss": -11.078420639038086, "global_step": 370751, "epoch": 2206} {"train_loss": -11.199737548828125, "global_step": 370752, "epoch": 2206} {"train_loss": -10.822636604309082, "global_step": 370753, "epoch": 2206} {"train_loss": -11.167537689208984, "global_step": 370754, "epoch": 2206} {"train_loss": -10.491914749145508, "global_step": 370755, "epoch": 2206} {"train_loss": -11.106474876403809, "global_step": 370756, "epoch": 2206} {"train_loss": -10.357291221618652, "global_step": 370757, "epoch": 2206} {"train_loss": -11.775886535644531, "global_step": 370758, "epoch": 2206} {"train_loss": -10.38438606262207, "global_step": 370759, "epoch": 2206} {"train_loss": -11.563421249389648, "global_step": 370760, "epoch": 2206} {"train_loss": -10.770808219909668, "global_step": 370761, "epoch": 2206} {"train_loss": -11.34115982055664, "global_step": 370762, "epoch": 2206} {"train_loss": -11.321046829223633, "global_step": 370763, "epoch": 2206} {"train_loss": -11.405434608459473, "global_step": 370764, "epoch": 2206} {"train_loss": -11.254657745361328, "global_step": 370765, "epoch": 2206} {"train_loss": -11.914609909057617, "global_step": 370766, "epoch": 2206} {"train_loss": -11.303232192993164, "global_step": 370767, "epoch": 2206} {"train_loss": -11.68602180480957, "global_step": 370768, "epoch": 2206} {"train_loss": -11.755009651184082, "global_step": 370769, "epoch": 2206} {"train_loss": -11.931589126586914, "global_step": 370770, "epoch": 2206} {"train_loss": -10.937626838684082, "global_step": 370771, "epoch": 2206} {"train_loss": -11.07505989074707, "global_step": 370772, "epoch": 2206} {"train_loss": -11.282100677490234, "global_step": 370773, "epoch": 2206} {"train_loss": -10.97640609741211, "global_step": 370774, "epoch": 2206} {"train_loss": -11.871625883238655, "global_step": 370775, "epoch": 2206, "val_loss": 293893.40625} {"train_loss": -11.253569602966309, "global_step": 370776, "epoch": 2207} {"train_loss": -11.366279602050781, "global_step": 370777, "epoch": 2207} {"train_loss": -11.771770477294922, "global_step": 370778, "epoch": 2207} {"train_loss": -11.2981595993042, "global_step": 370779, "epoch": 2207} {"train_loss": -11.786020278930664, "global_step": 370780, "epoch": 2207} {"train_loss": -11.581037521362305, "global_step": 370781, "epoch": 2207} {"train_loss": -11.839000701904297, "global_step": 370782, "epoch": 2207} {"train_loss": -11.770528793334961, "global_step": 370783, "epoch": 2207} {"train_loss": -11.729446411132812, "global_step": 370784, "epoch": 2207} {"train_loss": -11.644229888916016, "global_step": 370785, "epoch": 2207} {"train_loss": -12.03049087524414, "global_step": 370786, "epoch": 2207} {"train_loss": -12.019989967346191, "global_step": 370787, "epoch": 2207} {"train_loss": -11.839227676391602, "global_step": 370788, "epoch": 2207} {"train_loss": -11.961028099060059, "global_step": 370789, "epoch": 2207} {"train_loss": -11.941075325012207, "global_step": 370790, "epoch": 2207} {"train_loss": -11.96507453918457, "global_step": 370791, "epoch": 2207} {"train_loss": -12.275049209594727, "global_step": 370792, "epoch": 2207} {"train_loss": -11.73989486694336, "global_step": 370793, "epoch": 2207} {"train_loss": -12.380125999450684, "global_step": 370794, "epoch": 2207} {"train_loss": -12.14391803741455, "global_step": 370795, "epoch": 2207} {"train_loss": -12.431436538696289, "global_step": 370796, "epoch": 2207} {"train_loss": -11.800567626953125, "global_step": 370797, "epoch": 2207} {"train_loss": -11.96240520477295, "global_step": 370798, "epoch": 2207} {"train_loss": -11.882673263549805, "global_step": 370799, "epoch": 2207} {"train_loss": -12.225563049316406, "global_step": 370800, "epoch": 2207} {"train_loss": -11.876863479614258, "global_step": 370801, "epoch": 2207} {"train_loss": -12.070146560668945, "global_step": 370802, "epoch": 2207} {"train_loss": -12.156587600708008, "global_step": 370803, "epoch": 2207} {"train_loss": -11.615211486816406, "global_step": 370804, "epoch": 2207} {"train_loss": -12.131574630737305, "global_step": 370805, "epoch": 2207} {"train_loss": -11.538389205932617, "global_step": 370806, "epoch": 2207} {"train_loss": -12.20897388458252, "global_step": 370807, "epoch": 2207} {"train_loss": -11.73491382598877, "global_step": 370808, "epoch": 2207} {"train_loss": -11.83140754699707, "global_step": 370809, "epoch": 2207} {"train_loss": -12.064678192138672, "global_step": 370810, "epoch": 2207} {"train_loss": -12.24949836730957, "global_step": 370811, "epoch": 2207} {"train_loss": -11.903701782226562, "global_step": 370812, "epoch": 2207} {"train_loss": -12.033221244812012, "global_step": 370813, "epoch": 2207} {"train_loss": -11.715799331665039, "global_step": 370814, "epoch": 2207} {"train_loss": -12.041985511779785, "global_step": 370815, "epoch": 2207} {"train_loss": -11.885507583618164, "global_step": 370816, "epoch": 2207} {"train_loss": -12.378694534301758, "global_step": 370817, "epoch": 2207} {"train_loss": -12.106009483337402, "global_step": 370818, "epoch": 2207} {"train_loss": -12.138338088989258, "global_step": 370819, "epoch": 2207} {"train_loss": -12.196613311767578, "global_step": 370820, "epoch": 2207} {"train_loss": -12.243843078613281, "global_step": 370821, "epoch": 2207} {"train_loss": -12.320173263549805, "global_step": 370822, "epoch": 2207} {"train_loss": -12.323493957519531, "global_step": 370823, "epoch": 2207} {"train_loss": -12.324541091918945, "global_step": 370824, "epoch": 2207} {"train_loss": -12.253334045410156, "global_step": 370825, "epoch": 2207} {"train_loss": -12.149892807006836, "global_step": 370826, "epoch": 2207} {"train_loss": -12.43338680267334, "global_step": 370827, "epoch": 2207} {"train_loss": -12.357956886291504, "global_step": 370828, "epoch": 2207} {"train_loss": -12.490592956542969, "global_step": 370829, "epoch": 2207} {"train_loss": -12.567596435546875, "global_step": 370830, "epoch": 2207} {"train_loss": -12.314362525939941, "global_step": 370831, "epoch": 2207} {"train_loss": -12.575518608093262, "global_step": 370832, "epoch": 2207} {"train_loss": -12.578957557678223, "global_step": 370833, "epoch": 2207} {"train_loss": -12.525203704833984, "global_step": 370834, "epoch": 2207} {"train_loss": -12.53083324432373, "global_step": 370835, "epoch": 2207} {"train_loss": -12.24119758605957, "global_step": 370836, "epoch": 2207} {"train_loss": -12.446917533874512, "global_step": 370837, "epoch": 2207} {"train_loss": -12.278752326965332, "global_step": 370838, "epoch": 2207} {"train_loss": -12.214431762695312, "global_step": 370839, "epoch": 2207} {"train_loss": -12.167428970336914, "global_step": 370840, "epoch": 2207} {"train_loss": -12.532849311828613, "global_step": 370841, "epoch": 2207} {"train_loss": -12.427202224731445, "global_step": 370842, "epoch": 2207} {"train_loss": -12.417739868164062, "global_step": 370843, "epoch": 2207} {"train_loss": -12.253698348999023, "global_step": 370844, "epoch": 2207} {"train_loss": -12.463659286499023, "global_step": 370845, "epoch": 2207} {"train_loss": -12.447011947631836, "global_step": 370846, "epoch": 2207} {"train_loss": -12.512582778930664, "global_step": 370847, "epoch": 2207} {"train_loss": -12.571551322937012, "global_step": 370848, "epoch": 2207} {"train_loss": -12.610422134399414, "global_step": 370849, "epoch": 2207} {"train_loss": -12.582639694213867, "global_step": 370850, "epoch": 2207} {"train_loss": -12.683067321777344, "global_step": 370851, "epoch": 2207} {"train_loss": -12.412094116210938, "global_step": 370852, "epoch": 2207} {"train_loss": -12.187763214111328, "global_step": 370853, "epoch": 2207} {"train_loss": -12.594277381896973, "global_step": 370854, "epoch": 2207} {"train_loss": -12.527961730957031, "global_step": 370855, "epoch": 2207} {"train_loss": -12.505385398864746, "global_step": 370856, "epoch": 2207} {"train_loss": -12.327686309814453, "global_step": 370857, "epoch": 2207} {"train_loss": -12.383758544921875, "global_step": 370858, "epoch": 2207} {"train_loss": -12.343398094177246, "global_step": 370859, "epoch": 2207} {"train_loss": -12.286953926086426, "global_step": 370860, "epoch": 2207} {"train_loss": -12.551008224487305, "global_step": 370861, "epoch": 2207} {"train_loss": -12.092674255371094, "global_step": 370862, "epoch": 2207} {"train_loss": -12.571346282958984, "global_step": 370863, "epoch": 2207} {"train_loss": -11.746610641479492, "global_step": 370864, "epoch": 2207} {"train_loss": -11.382343292236328, "global_step": 370865, "epoch": 2207} {"train_loss": -11.56644058227539, "global_step": 370866, "epoch": 2207} {"train_loss": -12.196674346923828, "global_step": 370867, "epoch": 2207} {"train_loss": -12.283648490905762, "global_step": 370868, "epoch": 2207} {"train_loss": -11.972447395324707, "global_step": 370869, "epoch": 2207} {"train_loss": -12.543468475341797, "global_step": 370870, "epoch": 2207} {"train_loss": -11.78504753112793, "global_step": 370871, "epoch": 2207} {"train_loss": -11.060089111328125, "global_step": 370872, "epoch": 2207} {"train_loss": -12.538300514221191, "global_step": 370873, "epoch": 2207} {"train_loss": -11.957807540893555, "global_step": 370874, "epoch": 2207} {"train_loss": -11.51108169555664, "global_step": 370875, "epoch": 2207} {"train_loss": -12.490426063537598, "global_step": 370876, "epoch": 2207} {"train_loss": -12.092830657958984, "global_step": 370877, "epoch": 2207} {"train_loss": -11.816404342651367, "global_step": 370878, "epoch": 2207} {"train_loss": -12.628695487976074, "global_step": 370879, "epoch": 2207} {"train_loss": -12.0078125, "global_step": 370880, "epoch": 2207} {"train_loss": -11.336596488952637, "global_step": 370881, "epoch": 2207} {"train_loss": -10.421855926513672, "global_step": 370882, "epoch": 2207} {"train_loss": -12.070489883422852, "global_step": 370883, "epoch": 2207} {"train_loss": -11.57882308959961, "global_step": 370884, "epoch": 2207} {"train_loss": -11.770938873291016, "global_step": 370885, "epoch": 2207} {"train_loss": -10.752355575561523, "global_step": 370886, "epoch": 2207} {"train_loss": -11.947831153869629, "global_step": 370887, "epoch": 2207} {"train_loss": -10.92109489440918, "global_step": 370888, "epoch": 2207} {"train_loss": -12.282342910766602, "global_step": 370889, "epoch": 2207} {"train_loss": -11.204952239990234, "global_step": 370890, "epoch": 2207} {"train_loss": -11.98967170715332, "global_step": 370891, "epoch": 2207} {"train_loss": -11.899858474731445, "global_step": 370892, "epoch": 2207} {"train_loss": -12.040693283081055, "global_step": 370893, "epoch": 2207} {"train_loss": -10.717269897460938, "global_step": 370894, "epoch": 2207} {"train_loss": -10.618180274963379, "global_step": 370895, "epoch": 2207} {"train_loss": -11.941192626953125, "global_step": 370896, "epoch": 2207} {"train_loss": -10.966588020324707, "global_step": 370897, "epoch": 2207} {"train_loss": -10.36959457397461, "global_step": 370898, "epoch": 2207} {"train_loss": -10.850881576538086, "global_step": 370899, "epoch": 2207} {"train_loss": -10.127152442932129, "global_step": 370900, "epoch": 2207} {"train_loss": -10.380741119384766, "global_step": 370901, "epoch": 2207} {"train_loss": -11.129201889038086, "global_step": 370902, "epoch": 2207} {"train_loss": -9.698623657226562, "global_step": 370903, "epoch": 2207} {"train_loss": -11.35464859008789, "global_step": 370904, "epoch": 2207} {"train_loss": -10.604879379272461, "global_step": 370905, "epoch": 2207} {"train_loss": -10.268209457397461, "global_step": 370906, "epoch": 2207} {"train_loss": -11.852348327636719, "global_step": 370907, "epoch": 2207} {"train_loss": -10.73325252532959, "global_step": 370908, "epoch": 2207} {"train_loss": -11.18061637878418, "global_step": 370909, "epoch": 2207} {"train_loss": -11.149991989135742, "global_step": 370910, "epoch": 2207} {"train_loss": -10.984502792358398, "global_step": 370911, "epoch": 2207} {"train_loss": -11.430082321166992, "global_step": 370912, "epoch": 2207} {"train_loss": -10.416544914245605, "global_step": 370913, "epoch": 2207} {"train_loss": -11.244049072265625, "global_step": 370914, "epoch": 2207} {"train_loss": -11.29273509979248, "global_step": 370915, "epoch": 2207} {"train_loss": -11.152793884277344, "global_step": 370916, "epoch": 2207} {"train_loss": -10.486381530761719, "global_step": 370917, "epoch": 2207} {"train_loss": -11.493756294250488, "global_step": 370918, "epoch": 2207} {"train_loss": -10.165216445922852, "global_step": 370919, "epoch": 2207} {"train_loss": -11.959734916687012, "global_step": 370920, "epoch": 2207} {"train_loss": -11.169435501098633, "global_step": 370921, "epoch": 2207} {"train_loss": -11.95042610168457, "global_step": 370922, "epoch": 2207} {"train_loss": -11.065622329711914, "global_step": 370923, "epoch": 2207} {"train_loss": -12.023262023925781, "global_step": 370924, "epoch": 2207} {"train_loss": -11.461139678955078, "global_step": 370925, "epoch": 2207} {"train_loss": -11.642934799194336, "global_step": 370926, "epoch": 2207} {"train_loss": -11.745235443115234, "global_step": 370927, "epoch": 2207} {"train_loss": -11.540254592895508, "global_step": 370928, "epoch": 2207} {"train_loss": -11.919825553894043, "global_step": 370929, "epoch": 2207} {"train_loss": -11.849483489990234, "global_step": 370930, "epoch": 2207} {"train_loss": -11.557416915893555, "global_step": 370931, "epoch": 2207} {"train_loss": -11.651104927062988, "global_step": 370932, "epoch": 2207} {"train_loss": -11.785287857055664, "global_step": 370933, "epoch": 2207} {"train_loss": -11.936826705932617, "global_step": 370934, "epoch": 2207} {"train_loss": -11.99515151977539, "global_step": 370935, "epoch": 2207} {"train_loss": -11.896768569946289, "global_step": 370936, "epoch": 2207} {"train_loss": -11.873485565185547, "global_step": 370937, "epoch": 2207} {"train_loss": -11.830944061279297, "global_step": 370938, "epoch": 2207} {"train_loss": -12.185132026672363, "global_step": 370939, "epoch": 2207} {"train_loss": -12.080204963684082, "global_step": 370940, "epoch": 2207} {"train_loss": -11.889388084411621, "global_step": 370941, "epoch": 2207} {"train_loss": -11.971616744995117, "global_step": 370942, "epoch": 2207} {"train_loss": -11.842395254543849, "global_step": 370943, "epoch": 2207, "val_loss": 290652.3125} {"train_loss": -12.069578170776367, "global_step": 370944, "epoch": 2208} {"train_loss": -12.42641544342041, "global_step": 370945, "epoch": 2208} {"train_loss": -12.161069869995117, "global_step": 370946, "epoch": 2208} {"train_loss": -12.083456039428711, "global_step": 370947, "epoch": 2208} {"train_loss": -12.05548095703125, "global_step": 370948, "epoch": 2208} {"train_loss": -12.137273788452148, "global_step": 370949, "epoch": 2208} {"train_loss": -12.148134231567383, "global_step": 370950, "epoch": 2208} {"train_loss": -12.40097713470459, "global_step": 370951, "epoch": 2208} {"train_loss": -12.148696899414062, "global_step": 370952, "epoch": 2208} {"train_loss": -12.252177238464355, "global_step": 370953, "epoch": 2208} {"train_loss": -12.239608764648438, "global_step": 370954, "epoch": 2208} {"train_loss": -12.268714904785156, "global_step": 370955, "epoch": 2208} {"train_loss": -12.058232307434082, "global_step": 370956, "epoch": 2208} {"train_loss": -12.353925704956055, "global_step": 370957, "epoch": 2208} {"train_loss": -12.34774398803711, "global_step": 370958, "epoch": 2208} {"train_loss": -12.522632598876953, "global_step": 370959, "epoch": 2208} {"train_loss": -12.42823600769043, "global_step": 370960, "epoch": 2208} {"train_loss": -12.155717849731445, "global_step": 370961, "epoch": 2208} {"train_loss": -12.427005767822266, "global_step": 370962, "epoch": 2208} {"train_loss": -12.417901992797852, "global_step": 370963, "epoch": 2208} {"train_loss": -12.443192481994629, "global_step": 370964, "epoch": 2208} {"train_loss": -12.273404121398926, "global_step": 370965, "epoch": 2208} {"train_loss": -12.494778633117676, "global_step": 370966, "epoch": 2208} {"train_loss": -12.423843383789062, "global_step": 370967, "epoch": 2208} {"train_loss": -12.469367980957031, "global_step": 370968, "epoch": 2208} {"train_loss": -12.435436248779297, "global_step": 370969, "epoch": 2208} {"train_loss": -12.557979583740234, "global_step": 370970, "epoch": 2208} {"train_loss": -12.422666549682617, "global_step": 370971, "epoch": 2208} {"train_loss": -12.027142524719238, "global_step": 370972, "epoch": 2208} {"train_loss": -12.474218368530273, "global_step": 370973, "epoch": 2208} {"train_loss": -12.079322814941406, "global_step": 370974, "epoch": 2208} {"train_loss": -12.340521812438965, "global_step": 370975, "epoch": 2208} {"train_loss": -12.337661743164062, "global_step": 370976, "epoch": 2208} {"train_loss": -12.368343353271484, "global_step": 370977, "epoch": 2208} {"train_loss": -12.093687057495117, "global_step": 370978, "epoch": 2208} {"train_loss": -12.428125381469727, "global_step": 370979, "epoch": 2208} {"train_loss": -12.172002792358398, "global_step": 370980, "epoch": 2208} {"train_loss": -12.153223037719727, "global_step": 370981, "epoch": 2208} {"train_loss": -12.51668930053711, "global_step": 370982, "epoch": 2208} {"train_loss": -12.705291748046875, "global_step": 370983, "epoch": 2208} {"train_loss": -11.665538787841797, "global_step": 370984, "epoch": 2208} {"train_loss": -12.333995819091797, "global_step": 370985, "epoch": 2208} {"train_loss": -12.511894226074219, "global_step": 370986, "epoch": 2208} {"train_loss": -12.394369125366211, "global_step": 370987, "epoch": 2208} {"train_loss": -12.606292724609375, "global_step": 370988, "epoch": 2208} {"train_loss": -12.63486099243164, "global_step": 370989, "epoch": 2208} {"train_loss": -12.44502067565918, "global_step": 370990, "epoch": 2208} {"train_loss": -12.700733184814453, "global_step": 370991, "epoch": 2208} {"train_loss": -12.6231689453125, "global_step": 370992, "epoch": 2208} {"train_loss": -12.464526176452637, "global_step": 370993, "epoch": 2208} {"train_loss": -12.648355484008789, "global_step": 370994, "epoch": 2208} {"train_loss": -12.651738166809082, "global_step": 370995, "epoch": 2208} {"train_loss": -12.583895683288574, "global_step": 370996, "epoch": 2208} {"train_loss": -12.467560768127441, "global_step": 370997, "epoch": 2208} {"train_loss": -12.62002182006836, "global_step": 370998, "epoch": 2208} {"train_loss": -12.576519966125488, "global_step": 370999, "epoch": 2208} {"train_loss": -12.187433242797852, "global_step": 371000, "epoch": 2208} {"train_loss": -12.111187934875488, "global_step": 371001, "epoch": 2208} {"train_loss": -12.427631378173828, "global_step": 371002, "epoch": 2208} {"train_loss": -12.470264434814453, "global_step": 371003, "epoch": 2208} {"train_loss": -11.845008850097656, "global_step": 371004, "epoch": 2208} {"train_loss": -11.446413040161133, "global_step": 371005, "epoch": 2208} {"train_loss": -10.723176956176758, "global_step": 371006, "epoch": 2208} {"train_loss": -12.052701950073242, "global_step": 371007, "epoch": 2208} {"train_loss": -12.468954086303711, "global_step": 371008, "epoch": 2208} {"train_loss": -11.773941040039062, "global_step": 371009, "epoch": 2208} {"train_loss": -11.741827964782715, "global_step": 371010, "epoch": 2208} {"train_loss": -12.394006729125977, "global_step": 371011, "epoch": 2208} {"train_loss": -11.946674346923828, "global_step": 371012, "epoch": 2208} {"train_loss": -11.883638381958008, "global_step": 371013, "epoch": 2208} {"train_loss": -12.303539276123047, "global_step": 371014, "epoch": 2208} {"train_loss": -12.281318664550781, "global_step": 371015, "epoch": 2208} {"train_loss": -12.451067924499512, "global_step": 371016, "epoch": 2208} {"train_loss": -12.225664138793945, "global_step": 371017, "epoch": 2208} {"train_loss": -12.444836616516113, "global_step": 371018, "epoch": 2208} {"train_loss": -12.21560001373291, "global_step": 371019, "epoch": 2208} {"train_loss": -12.333013534545898, "global_step": 371020, "epoch": 2208} {"train_loss": -12.240367889404297, "global_step": 371021, "epoch": 2208} {"train_loss": -12.634687423706055, "global_step": 371022, "epoch": 2208} {"train_loss": -12.44502067565918, "global_step": 371023, "epoch": 2208} {"train_loss": -12.496736526489258, "global_step": 371024, "epoch": 2208} {"train_loss": -12.178030967712402, "global_step": 371025, "epoch": 2208} {"train_loss": -12.486655235290527, "global_step": 371026, "epoch": 2208} {"train_loss": -12.150551795959473, "global_step": 371027, "epoch": 2208} {"train_loss": -12.264302253723145, "global_step": 371028, "epoch": 2208} {"train_loss": -12.340543746948242, "global_step": 371029, "epoch": 2208} {"train_loss": -12.070093154907227, "global_step": 371030, "epoch": 2208} {"train_loss": -12.269450187683105, "global_step": 371031, "epoch": 2208} {"train_loss": -11.928247451782227, "global_step": 371032, "epoch": 2208} {"train_loss": -11.430620193481445, "global_step": 371033, "epoch": 2208} {"train_loss": -11.054693222045898, "global_step": 371034, "epoch": 2208} {"train_loss": -11.902864456176758, "global_step": 371035, "epoch": 2208} {"train_loss": -12.076525688171387, "global_step": 371036, "epoch": 2208} {"train_loss": -12.08831787109375, "global_step": 371037, "epoch": 2208} {"train_loss": -12.050466537475586, "global_step": 371038, "epoch": 2208} {"train_loss": -12.056480407714844, "global_step": 371039, "epoch": 2208} {"train_loss": -11.702723503112793, "global_step": 371040, "epoch": 2208} {"train_loss": -11.680503845214844, "global_step": 371041, "epoch": 2208} {"train_loss": -11.934714317321777, "global_step": 371042, "epoch": 2208} {"train_loss": -11.854072570800781, "global_step": 371043, "epoch": 2208} {"train_loss": -11.562795639038086, "global_step": 371044, "epoch": 2208} {"train_loss": -11.466249465942383, "global_step": 371045, "epoch": 2208} {"train_loss": -11.251607894897461, "global_step": 371046, "epoch": 2208} {"train_loss": -11.615678787231445, "global_step": 371047, "epoch": 2208} {"train_loss": -12.415620803833008, "global_step": 371048, "epoch": 2208} {"train_loss": -11.179220199584961, "global_step": 371049, "epoch": 2208} {"train_loss": -12.098816871643066, "global_step": 371050, "epoch": 2208} {"train_loss": -12.189332962036133, "global_step": 371051, "epoch": 2208} {"train_loss": -11.779888153076172, "global_step": 371052, "epoch": 2208} {"train_loss": -11.223563194274902, "global_step": 371053, "epoch": 2208} {"train_loss": -12.391316413879395, "global_step": 371054, "epoch": 2208} {"train_loss": -12.73092269897461, "global_step": 371055, "epoch": 2208} {"train_loss": -11.897784233093262, "global_step": 371056, "epoch": 2208} {"train_loss": -12.25245475769043, "global_step": 371057, "epoch": 2208} {"train_loss": -12.397441864013672, "global_step": 371058, "epoch": 2208} {"train_loss": -12.149213790893555, "global_step": 371059, "epoch": 2208} {"train_loss": -11.941814422607422, "global_step": 371060, "epoch": 2208} {"train_loss": -12.498743057250977, "global_step": 371061, "epoch": 2208} {"train_loss": -12.397850036621094, "global_step": 371062, "epoch": 2208} {"train_loss": -12.511175155639648, "global_step": 371063, "epoch": 2208} {"train_loss": -12.402921676635742, "global_step": 371064, "epoch": 2208} {"train_loss": -12.488306045532227, "global_step": 371065, "epoch": 2208} {"train_loss": -12.388822555541992, "global_step": 371066, "epoch": 2208} {"train_loss": -12.14697265625, "global_step": 371067, "epoch": 2208} {"train_loss": -12.265482902526855, "global_step": 371068, "epoch": 2208} {"train_loss": -12.11596965789795, "global_step": 371069, "epoch": 2208} {"train_loss": -12.51522445678711, "global_step": 371070, "epoch": 2208} {"train_loss": -12.34621810913086, "global_step": 371071, "epoch": 2208} {"train_loss": -12.14389419555664, "global_step": 371072, "epoch": 2208} {"train_loss": -12.418380737304688, "global_step": 371073, "epoch": 2208} {"train_loss": -12.161998748779297, "global_step": 371074, "epoch": 2208} {"train_loss": -12.020991325378418, "global_step": 371075, "epoch": 2208} {"train_loss": -12.177002906799316, "global_step": 371076, "epoch": 2208} {"train_loss": -12.074933052062988, "global_step": 371077, "epoch": 2208} {"train_loss": -12.024669647216797, "global_step": 371078, "epoch": 2208} {"train_loss": -11.951969146728516, "global_step": 371079, "epoch": 2208} {"train_loss": -11.118066787719727, "global_step": 371080, "epoch": 2208} {"train_loss": -11.965826034545898, "global_step": 371081, "epoch": 2208} {"train_loss": -11.807721138000488, "global_step": 371082, "epoch": 2208} {"train_loss": -11.95329761505127, "global_step": 371083, "epoch": 2208} {"train_loss": -11.052874565124512, "global_step": 371084, "epoch": 2208} {"train_loss": -12.566411018371582, "global_step": 371085, "epoch": 2208} {"train_loss": -11.534077644348145, "global_step": 371086, "epoch": 2208} {"train_loss": -12.265449523925781, "global_step": 371087, "epoch": 2208} {"train_loss": -12.098146438598633, "global_step": 371088, "epoch": 2208} {"train_loss": -11.857120513916016, "global_step": 371089, "epoch": 2208} {"train_loss": -12.515233039855957, "global_step": 371090, "epoch": 2208} {"train_loss": -12.473443984985352, "global_step": 371091, "epoch": 2208} {"train_loss": -11.907844543457031, "global_step": 371092, "epoch": 2208} {"train_loss": -12.502163887023926, "global_step": 371093, "epoch": 2208} {"train_loss": -12.003101348876953, "global_step": 371094, "epoch": 2208} {"train_loss": -12.30121898651123, "global_step": 371095, "epoch": 2208} {"train_loss": -11.822153091430664, "global_step": 371096, "epoch": 2208} {"train_loss": -12.147577285766602, "global_step": 371097, "epoch": 2208} {"train_loss": -12.21190071105957, "global_step": 371098, "epoch": 2208} {"train_loss": -11.914554595947266, "global_step": 371099, "epoch": 2208} {"train_loss": -12.57037353515625, "global_step": 371100, "epoch": 2208} {"train_loss": -11.618053436279297, "global_step": 371101, "epoch": 2208} {"train_loss": -11.964533805847168, "global_step": 371102, "epoch": 2208} {"train_loss": -11.927766799926758, "global_step": 371103, "epoch": 2208} {"train_loss": -11.830913543701172, "global_step": 371104, "epoch": 2208} {"train_loss": -12.180829048156738, "global_step": 371105, "epoch": 2208} {"train_loss": -12.270923614501953, "global_step": 371106, "epoch": 2208} {"train_loss": -11.757883071899414, "global_step": 371107, "epoch": 2208} {"train_loss": -12.206804275512695, "global_step": 371108, "epoch": 2208} {"train_loss": -12.160606384277344, "global_step": 371109, "epoch": 2208} {"train_loss": -12.346048355102539, "global_step": 371110, "epoch": 2208} {"train_loss": -12.167180594943819, "global_step": 371111, "epoch": 2208, "val_loss": 290927.03125} {"train_loss": -11.240507125854492, "global_step": 371112, "epoch": 2209} {"train_loss": -11.930604934692383, "global_step": 371113, "epoch": 2209} {"train_loss": -12.252767562866211, "global_step": 371114, "epoch": 2209} {"train_loss": -10.800008773803711, "global_step": 371115, "epoch": 2209} {"train_loss": -12.354081153869629, "global_step": 371116, "epoch": 2209} {"train_loss": -10.760993957519531, "global_step": 371117, "epoch": 2209} {"train_loss": -11.773101806640625, "global_step": 371118, "epoch": 2209} {"train_loss": -11.037278175354004, "global_step": 371119, "epoch": 2209} {"train_loss": -11.941819190979004, "global_step": 371120, "epoch": 2209} {"train_loss": -11.111075401306152, "global_step": 371121, "epoch": 2209} {"train_loss": -11.52468490600586, "global_step": 371122, "epoch": 2209} {"train_loss": -8.976598739624023, "global_step": 371123, "epoch": 2209} {"train_loss": -9.919097900390625, "global_step": 371124, "epoch": 2209} {"train_loss": -11.647247314453125, "global_step": 371125, "epoch": 2209} {"train_loss": -10.17666244506836, "global_step": 371126, "epoch": 2209} {"train_loss": -10.123476028442383, "global_step": 371127, "epoch": 2209} {"train_loss": -10.947887420654297, "global_step": 371128, "epoch": 2209} {"train_loss": -11.163206100463867, "global_step": 371129, "epoch": 2209} {"train_loss": -10.946120262145996, "global_step": 371130, "epoch": 2209} {"train_loss": -10.481648445129395, "global_step": 371131, "epoch": 2209} {"train_loss": -11.480467796325684, "global_step": 371132, "epoch": 2209} {"train_loss": -10.371716499328613, "global_step": 371133, "epoch": 2209} {"train_loss": -11.687015533447266, "global_step": 371134, "epoch": 2209} {"train_loss": -11.105091094970703, "global_step": 371135, "epoch": 2209} {"train_loss": -10.450532913208008, "global_step": 371136, "epoch": 2209} {"train_loss": -11.073038101196289, "global_step": 371137, "epoch": 2209} {"train_loss": -9.90778636932373, "global_step": 371138, "epoch": 2209} {"train_loss": -10.156986236572266, "global_step": 371139, "epoch": 2209} {"train_loss": -10.228399276733398, "global_step": 371140, "epoch": 2209} {"train_loss": -10.258105278015137, "global_step": 371141, "epoch": 2209} {"train_loss": -9.690913200378418, "global_step": 371142, "epoch": 2209} {"train_loss": -11.196767807006836, "global_step": 371143, "epoch": 2209} {"train_loss": -10.718313217163086, "global_step": 371144, "epoch": 2209} {"train_loss": -10.436676979064941, "global_step": 371145, "epoch": 2209} {"train_loss": -11.02786922454834, "global_step": 371146, "epoch": 2209} {"train_loss": -11.632410049438477, "global_step": 371147, "epoch": 2209} {"train_loss": -11.262943267822266, "global_step": 371148, "epoch": 2209} {"train_loss": -11.188321113586426, "global_step": 371149, "epoch": 2209} {"train_loss": -10.491167068481445, "global_step": 371150, "epoch": 2209} {"train_loss": -11.741809844970703, "global_step": 371151, "epoch": 2209} {"train_loss": -10.45932388305664, "global_step": 371152, "epoch": 2209} {"train_loss": -11.93442440032959, "global_step": 371153, "epoch": 2209} {"train_loss": -11.511791229248047, "global_step": 371154, "epoch": 2209} {"train_loss": -11.781434059143066, "global_step": 371155, "epoch": 2209} {"train_loss": -11.606253623962402, "global_step": 371156, "epoch": 2209} {"train_loss": -11.851552963256836, "global_step": 371157, "epoch": 2209} {"train_loss": -11.512805938720703, "global_step": 371158, "epoch": 2209} {"train_loss": -12.180978775024414, "global_step": 371159, "epoch": 2209} {"train_loss": -11.882240295410156, "global_step": 371160, "epoch": 2209} {"train_loss": -12.301070213317871, "global_step": 371161, "epoch": 2209} {"train_loss": -11.834493637084961, "global_step": 371162, "epoch": 2209} {"train_loss": -12.21579360961914, "global_step": 371163, "epoch": 2209} {"train_loss": -11.878152847290039, "global_step": 371164, "epoch": 2209} {"train_loss": -12.012184143066406, "global_step": 371165, "epoch": 2209} {"train_loss": -12.238199234008789, "global_step": 371166, "epoch": 2209} {"train_loss": -11.999519348144531, "global_step": 371167, "epoch": 2209} {"train_loss": -12.011507034301758, "global_step": 371168, "epoch": 2209} {"train_loss": -12.358287811279297, "global_step": 371169, "epoch": 2209} {"train_loss": -12.410306930541992, "global_step": 371170, "epoch": 2209} {"train_loss": -12.185653686523438, "global_step": 371171, "epoch": 2209} {"train_loss": -12.332893371582031, "global_step": 371172, "epoch": 2209} {"train_loss": -12.396657943725586, "global_step": 371173, "epoch": 2209} {"train_loss": -12.319576263427734, "global_step": 371174, "epoch": 2209} {"train_loss": -12.456806182861328, "global_step": 371175, "epoch": 2209} {"train_loss": -12.450540542602539, "global_step": 371176, "epoch": 2209} {"train_loss": -12.319382667541504, "global_step": 371177, "epoch": 2209} {"train_loss": -12.3531494140625, "global_step": 371178, "epoch": 2209} {"train_loss": -12.559860229492188, "global_step": 371179, "epoch": 2209} {"train_loss": -12.467193603515625, "global_step": 371180, "epoch": 2209} {"train_loss": -12.549491882324219, "global_step": 371181, "epoch": 2209} {"train_loss": -12.408199310302734, "global_step": 371182, "epoch": 2209} {"train_loss": -12.567809104919434, "global_step": 371183, "epoch": 2209} {"train_loss": -12.467094421386719, "global_step": 371184, "epoch": 2209} {"train_loss": -12.419668197631836, "global_step": 371185, "epoch": 2209} {"train_loss": -12.52112102508545, "global_step": 371186, "epoch": 2209} {"train_loss": -12.344282150268555, "global_step": 371187, "epoch": 2209} {"train_loss": -12.249876022338867, "global_step": 371188, "epoch": 2209} {"train_loss": -12.400588035583496, "global_step": 371189, "epoch": 2209} {"train_loss": -12.497995376586914, "global_step": 371190, "epoch": 2209} {"train_loss": -12.351263046264648, "global_step": 371191, "epoch": 2209} {"train_loss": -12.396161079406738, "global_step": 371192, "epoch": 2209} {"train_loss": -12.352313041687012, "global_step": 371193, "epoch": 2209} {"train_loss": -12.478867530822754, "global_step": 371194, "epoch": 2209} {"train_loss": -12.4173583984375, "global_step": 371195, "epoch": 2209} {"train_loss": -12.124302864074707, "global_step": 371196, "epoch": 2209} {"train_loss": -12.452835083007812, "global_step": 371197, "epoch": 2209} {"train_loss": -12.286630630493164, "global_step": 371198, "epoch": 2209} {"train_loss": -12.212797164916992, "global_step": 371199, "epoch": 2209} {"train_loss": -12.135442733764648, "global_step": 371200, "epoch": 2209} {"train_loss": -12.373425483703613, "global_step": 371201, "epoch": 2209} {"train_loss": -12.136063575744629, "global_step": 371202, "epoch": 2209} {"train_loss": -12.712970733642578, "global_step": 371203, "epoch": 2209} {"train_loss": -12.225870132446289, "global_step": 371204, "epoch": 2209} {"train_loss": -12.583566665649414, "global_step": 371205, "epoch": 2209} {"train_loss": -12.45565414428711, "global_step": 371206, "epoch": 2209} {"train_loss": -12.454385757446289, "global_step": 371207, "epoch": 2209} {"train_loss": -12.317789077758789, "global_step": 371208, "epoch": 2209} {"train_loss": -12.285221099853516, "global_step": 371209, "epoch": 2209} {"train_loss": -12.435537338256836, "global_step": 371210, "epoch": 2209} {"train_loss": -12.14775562286377, "global_step": 371211, "epoch": 2209} {"train_loss": -12.639059066772461, "global_step": 371212, "epoch": 2209} {"train_loss": -12.090791702270508, "global_step": 371213, "epoch": 2209} {"train_loss": -12.184946060180664, "global_step": 371214, "epoch": 2209} {"train_loss": -12.376237869262695, "global_step": 371215, "epoch": 2209} {"train_loss": -12.29890251159668, "global_step": 371216, "epoch": 2209} {"train_loss": -12.403057098388672, "global_step": 371217, "epoch": 2209} {"train_loss": -12.431178092956543, "global_step": 371218, "epoch": 2209} {"train_loss": -12.458097457885742, "global_step": 371219, "epoch": 2209} {"train_loss": -12.458955764770508, "global_step": 371220, "epoch": 2209} {"train_loss": -12.339704513549805, "global_step": 371221, "epoch": 2209} {"train_loss": -12.673190116882324, "global_step": 371222, "epoch": 2209} {"train_loss": -12.362529754638672, "global_step": 371223, "epoch": 2209} {"train_loss": -12.747344970703125, "global_step": 371224, "epoch": 2209} {"train_loss": -12.222661972045898, "global_step": 371225, "epoch": 2209} {"train_loss": -12.534273147583008, "global_step": 371226, "epoch": 2209} {"train_loss": -12.527040481567383, "global_step": 371227, "epoch": 2209} {"train_loss": -11.676129341125488, "global_step": 371228, "epoch": 2209} {"train_loss": -12.684836387634277, "global_step": 371229, "epoch": 2209} {"train_loss": -12.199216842651367, "global_step": 371230, "epoch": 2209} {"train_loss": -11.781649589538574, "global_step": 371231, "epoch": 2209} {"train_loss": -11.419458389282227, "global_step": 371232, "epoch": 2209} {"train_loss": -11.926342010498047, "global_step": 371233, "epoch": 2209} {"train_loss": -12.537788391113281, "global_step": 371234, "epoch": 2209} {"train_loss": -12.550864219665527, "global_step": 371235, "epoch": 2209} {"train_loss": -11.849270820617676, "global_step": 371236, "epoch": 2209} {"train_loss": -12.129709243774414, "global_step": 371237, "epoch": 2209} {"train_loss": -12.593989372253418, "global_step": 371238, "epoch": 2209} {"train_loss": -12.663476943969727, "global_step": 371239, "epoch": 2209} {"train_loss": -12.450078010559082, "global_step": 371240, "epoch": 2209} {"train_loss": -12.51366901397705, "global_step": 371241, "epoch": 2209} {"train_loss": -12.349398612976074, "global_step": 371242, "epoch": 2209} {"train_loss": -11.8273286819458, "global_step": 371243, "epoch": 2209} {"train_loss": -11.782079696655273, "global_step": 371244, "epoch": 2209} {"train_loss": -12.586870193481445, "global_step": 371245, "epoch": 2209} {"train_loss": -12.107536315917969, "global_step": 371246, "epoch": 2209} {"train_loss": -12.574545860290527, "global_step": 371247, "epoch": 2209} {"train_loss": -12.243104934692383, "global_step": 371248, "epoch": 2209} {"train_loss": -12.580390930175781, "global_step": 371249, "epoch": 2209} {"train_loss": -12.037837028503418, "global_step": 371250, "epoch": 2209} {"train_loss": -12.747209548950195, "global_step": 371251, "epoch": 2209} {"train_loss": -12.486637115478516, "global_step": 371252, "epoch": 2209} {"train_loss": -12.320623397827148, "global_step": 371253, "epoch": 2209} {"train_loss": -12.186042785644531, "global_step": 371254, "epoch": 2209} {"train_loss": -12.538110733032227, "global_step": 371255, "epoch": 2209} {"train_loss": -12.482080459594727, "global_step": 371256, "epoch": 2209} {"train_loss": -12.281013488769531, "global_step": 371257, "epoch": 2209} {"train_loss": -11.911404609680176, "global_step": 371258, "epoch": 2209} {"train_loss": -11.863306999206543, "global_step": 371259, "epoch": 2209} {"train_loss": -12.45029354095459, "global_step": 371260, "epoch": 2209} {"train_loss": -12.082136154174805, "global_step": 371261, "epoch": 2209} {"train_loss": -12.511566162109375, "global_step": 371262, "epoch": 2209} {"train_loss": -12.504839897155762, "global_step": 371263, "epoch": 2209} {"train_loss": -12.35150146484375, "global_step": 371264, "epoch": 2209} {"train_loss": -12.184162139892578, "global_step": 371265, "epoch": 2209} {"train_loss": -12.428494453430176, "global_step": 371266, "epoch": 2209} {"train_loss": -12.662961959838867, "global_step": 371267, "epoch": 2209} {"train_loss": -12.398551940917969, "global_step": 371268, "epoch": 2209} {"train_loss": -12.565649032592773, "global_step": 371269, "epoch": 2209} {"train_loss": -12.410746574401855, "global_step": 371270, "epoch": 2209} {"train_loss": -12.415261268615723, "global_step": 371271, "epoch": 2209} {"train_loss": -12.52574348449707, "global_step": 371272, "epoch": 2209} {"train_loss": -12.605012893676758, "global_step": 371273, "epoch": 2209} {"train_loss": -12.62034797668457, "global_step": 371274, "epoch": 2209} {"train_loss": -12.759891510009766, "global_step": 371275, "epoch": 2209} {"train_loss": -12.093820571899414, "global_step": 371276, "epoch": 2209} {"train_loss": -12.422935485839844, "global_step": 371277, "epoch": 2209} {"train_loss": -12.715316772460938, "global_step": 371278, "epoch": 2209} {"train_loss": -11.967516802606129, "global_step": 371279, "epoch": 2209, "val_loss": 290029.0} {"train_loss": -12.0775146484375, "global_step": 371280, "epoch": 2210} {"train_loss": -12.295007705688477, "global_step": 371281, "epoch": 2210} {"train_loss": -11.79865837097168, "global_step": 371282, "epoch": 2210} {"train_loss": -11.95872974395752, "global_step": 371283, "epoch": 2210} {"train_loss": -11.642441749572754, "global_step": 371284, "epoch": 2210} {"train_loss": -11.796035766601562, "global_step": 371285, "epoch": 2210} {"train_loss": -11.373664855957031, "global_step": 371286, "epoch": 2210} {"train_loss": -8.14193058013916, "global_step": 371287, "epoch": 2210} {"train_loss": -10.942598342895508, "global_step": 371288, "epoch": 2210} {"train_loss": -9.95665168762207, "global_step": 371289, "epoch": 2210} {"train_loss": -10.056913375854492, "global_step": 371290, "epoch": 2210} {"train_loss": -11.016594886779785, "global_step": 371291, "epoch": 2210} {"train_loss": -11.845203399658203, "global_step": 371292, "epoch": 2210} {"train_loss": -11.097525596618652, "global_step": 371293, "epoch": 2210} {"train_loss": -11.202836990356445, "global_step": 371294, "epoch": 2210} {"train_loss": -10.918710708618164, "global_step": 371295, "epoch": 2210} {"train_loss": -12.423507690429688, "global_step": 371296, "epoch": 2210} {"train_loss": -11.231016159057617, "global_step": 371297, "epoch": 2210} {"train_loss": -11.464123725891113, "global_step": 371298, "epoch": 2210} {"train_loss": -11.20570182800293, "global_step": 371299, "epoch": 2210} {"train_loss": -10.877330780029297, "global_step": 371300, "epoch": 2210} {"train_loss": -11.40231990814209, "global_step": 371301, "epoch": 2210} {"train_loss": -11.860652923583984, "global_step": 371302, "epoch": 2210} {"train_loss": -11.499147415161133, "global_step": 371303, "epoch": 2210} {"train_loss": -11.76272964477539, "global_step": 371304, "epoch": 2210} {"train_loss": -10.82481575012207, "global_step": 371305, "epoch": 2210} {"train_loss": -11.437787055969238, "global_step": 371306, "epoch": 2210} {"train_loss": -11.849506378173828, "global_step": 371307, "epoch": 2210} {"train_loss": -11.580061912536621, "global_step": 371308, "epoch": 2210} {"train_loss": -11.735084533691406, "global_step": 371309, "epoch": 2210} {"train_loss": -11.522289276123047, "global_step": 371310, "epoch": 2210} {"train_loss": -11.903162002563477, "global_step": 371311, "epoch": 2210} {"train_loss": -11.532893180847168, "global_step": 371312, "epoch": 2210} {"train_loss": -12.234050750732422, "global_step": 371313, "epoch": 2210} {"train_loss": -11.973241806030273, "global_step": 371314, "epoch": 2210} {"train_loss": -11.894022941589355, "global_step": 371315, "epoch": 2210} {"train_loss": -12.196975708007812, "global_step": 371316, "epoch": 2210} {"train_loss": -12.13193130493164, "global_step": 371317, "epoch": 2210} {"train_loss": -12.177738189697266, "global_step": 371318, "epoch": 2210} {"train_loss": -12.097823143005371, "global_step": 371319, "epoch": 2210} {"train_loss": -11.683362007141113, "global_step": 371320, "epoch": 2210} {"train_loss": -12.112136840820312, "global_step": 371321, "epoch": 2210} {"train_loss": -12.31566333770752, "global_step": 371322, "epoch": 2210} {"train_loss": -11.484110832214355, "global_step": 371323, "epoch": 2210} {"train_loss": -12.155403137207031, "global_step": 371324, "epoch": 2210} {"train_loss": -11.49502182006836, "global_step": 371325, "epoch": 2210} {"train_loss": -11.625699996948242, "global_step": 371326, "epoch": 2210} {"train_loss": -11.662522315979004, "global_step": 371327, "epoch": 2210} {"train_loss": -11.527782440185547, "global_step": 371328, "epoch": 2210} {"train_loss": -11.778541564941406, "global_step": 371329, "epoch": 2210} {"train_loss": -10.547714233398438, "global_step": 371330, "epoch": 2210} {"train_loss": -11.70917797088623, "global_step": 371331, "epoch": 2210} {"train_loss": -11.686386108398438, "global_step": 371332, "epoch": 2210} {"train_loss": -11.141228675842285, "global_step": 371333, "epoch": 2210} {"train_loss": -12.026519775390625, "global_step": 371334, "epoch": 2210} {"train_loss": -10.876775741577148, "global_step": 371335, "epoch": 2210} {"train_loss": -11.985188484191895, "global_step": 371336, "epoch": 2210} {"train_loss": -11.40342903137207, "global_step": 371337, "epoch": 2210} {"train_loss": -11.741622924804688, "global_step": 371338, "epoch": 2210} {"train_loss": -11.40130615234375, "global_step": 371339, "epoch": 2210} {"train_loss": -11.524114608764648, "global_step": 371340, "epoch": 2210} {"train_loss": -10.829862594604492, "global_step": 371341, "epoch": 2210} {"train_loss": -11.263887405395508, "global_step": 371342, "epoch": 2210} {"train_loss": -11.432121276855469, "global_step": 371343, "epoch": 2210} {"train_loss": -11.502803802490234, "global_step": 371344, "epoch": 2210} {"train_loss": -11.26512336730957, "global_step": 371345, "epoch": 2210} {"train_loss": -11.855020523071289, "global_step": 371346, "epoch": 2210} {"train_loss": -11.634498596191406, "global_step": 371347, "epoch": 2210} {"train_loss": -11.245074272155762, "global_step": 371348, "epoch": 2210} {"train_loss": -12.071051597595215, "global_step": 371349, "epoch": 2210} {"train_loss": -11.152386665344238, "global_step": 371350, "epoch": 2210} {"train_loss": -12.250532150268555, "global_step": 371351, "epoch": 2210} {"train_loss": -11.08226203918457, "global_step": 371352, "epoch": 2210} {"train_loss": -11.462663650512695, "global_step": 371353, "epoch": 2210} {"train_loss": -11.529548645019531, "global_step": 371354, "epoch": 2210} {"train_loss": -11.373769760131836, "global_step": 371355, "epoch": 2210} {"train_loss": -11.89521598815918, "global_step": 371356, "epoch": 2210} {"train_loss": -11.328804016113281, "global_step": 371357, "epoch": 2210} {"train_loss": -12.070290565490723, "global_step": 371358, "epoch": 2210} {"train_loss": -11.308778762817383, "global_step": 371359, "epoch": 2210} {"train_loss": -12.270524978637695, "global_step": 371360, "epoch": 2210} {"train_loss": -11.315546989440918, "global_step": 371361, "epoch": 2210} {"train_loss": -12.368186950683594, "global_step": 371362, "epoch": 2210} {"train_loss": -11.623443603515625, "global_step": 371363, "epoch": 2210} {"train_loss": -11.725265502929688, "global_step": 371364, "epoch": 2210} {"train_loss": -11.862699508666992, "global_step": 371365, "epoch": 2210} {"train_loss": -11.9810209274292, "global_step": 371366, "epoch": 2210} {"train_loss": -11.933684349060059, "global_step": 371367, "epoch": 2210} {"train_loss": -12.139446258544922, "global_step": 371368, "epoch": 2210} {"train_loss": -11.860795974731445, "global_step": 371369, "epoch": 2210} {"train_loss": -12.261716842651367, "global_step": 371370, "epoch": 2210} {"train_loss": -11.971839904785156, "global_step": 371371, "epoch": 2210} {"train_loss": -12.335078239440918, "global_step": 371372, "epoch": 2210} {"train_loss": -12.0350341796875, "global_step": 371373, "epoch": 2210} {"train_loss": -12.376956939697266, "global_step": 371374, "epoch": 2210} {"train_loss": -12.418807983398438, "global_step": 371375, "epoch": 2210} {"train_loss": -11.95779037475586, "global_step": 371376, "epoch": 2210} {"train_loss": -12.416213989257812, "global_step": 371377, "epoch": 2210} {"train_loss": -12.31679916381836, "global_step": 371378, "epoch": 2210} {"train_loss": -12.241609573364258, "global_step": 371379, "epoch": 2210} {"train_loss": -12.248367309570312, "global_step": 371380, "epoch": 2210} {"train_loss": -12.490516662597656, "global_step": 371381, "epoch": 2210} {"train_loss": -12.419979095458984, "global_step": 371382, "epoch": 2210} {"train_loss": -12.467642784118652, "global_step": 371383, "epoch": 2210} {"train_loss": -12.6046781539917, "global_step": 371384, "epoch": 2210} {"train_loss": -12.463024139404297, "global_step": 371385, "epoch": 2210} {"train_loss": -12.443246841430664, "global_step": 371386, "epoch": 2210} {"train_loss": -12.275886535644531, "global_step": 371387, "epoch": 2210} {"train_loss": -12.27336311340332, "global_step": 371388, "epoch": 2210} {"train_loss": -12.462173461914062, "global_step": 371389, "epoch": 2210} {"train_loss": -12.466976165771484, "global_step": 371390, "epoch": 2210} {"train_loss": -12.401216506958008, "global_step": 371391, "epoch": 2210} {"train_loss": -12.250611305236816, "global_step": 371392, "epoch": 2210} {"train_loss": -12.375173568725586, "global_step": 371393, "epoch": 2210} {"train_loss": -12.468501091003418, "global_step": 371394, "epoch": 2210} {"train_loss": -12.502998352050781, "global_step": 371395, "epoch": 2210} {"train_loss": -12.173513412475586, "global_step": 371396, "epoch": 2210} {"train_loss": -12.393953323364258, "global_step": 371397, "epoch": 2210} {"train_loss": -12.119841575622559, "global_step": 371398, "epoch": 2210} {"train_loss": -12.52427864074707, "global_step": 371399, "epoch": 2210} {"train_loss": -12.376923561096191, "global_step": 371400, "epoch": 2210} {"train_loss": -12.633891105651855, "global_step": 371401, "epoch": 2210} {"train_loss": -12.316619873046875, "global_step": 371402, "epoch": 2210} {"train_loss": -12.66285514831543, "global_step": 371403, "epoch": 2210} {"train_loss": -12.165531158447266, "global_step": 371404, "epoch": 2210} {"train_loss": -12.665922164916992, "global_step": 371405, "epoch": 2210} {"train_loss": -12.310882568359375, "global_step": 371406, "epoch": 2210} {"train_loss": -12.215936660766602, "global_step": 371407, "epoch": 2210} {"train_loss": -12.30768871307373, "global_step": 371408, "epoch": 2210} {"train_loss": -12.212882995605469, "global_step": 371409, "epoch": 2210} {"train_loss": -12.502862930297852, "global_step": 371410, "epoch": 2210} {"train_loss": -12.205337524414062, "global_step": 371411, "epoch": 2210} {"train_loss": -12.584277153015137, "global_step": 371412, "epoch": 2210} {"train_loss": -12.335247039794922, "global_step": 371413, "epoch": 2210} {"train_loss": -12.080816268920898, "global_step": 371414, "epoch": 2210} {"train_loss": -12.065560340881348, "global_step": 371415, "epoch": 2210} {"train_loss": -11.931357383728027, "global_step": 371416, "epoch": 2210} {"train_loss": -11.866729736328125, "global_step": 371417, "epoch": 2210} {"train_loss": -11.874577522277832, "global_step": 371418, "epoch": 2210} {"train_loss": -12.424711227416992, "global_step": 371419, "epoch": 2210} {"train_loss": -12.39189624786377, "global_step": 371420, "epoch": 2210} {"train_loss": -12.613561630249023, "global_step": 371421, "epoch": 2210} {"train_loss": -12.247920036315918, "global_step": 371422, "epoch": 2210} {"train_loss": -12.742712020874023, "global_step": 371423, "epoch": 2210} {"train_loss": -12.382279396057129, "global_step": 371424, "epoch": 2210} {"train_loss": -12.698840141296387, "global_step": 371425, "epoch": 2210} {"train_loss": -12.431004524230957, "global_step": 371426, "epoch": 2210} {"train_loss": -12.414576530456543, "global_step": 371427, "epoch": 2210} {"train_loss": -12.476042747497559, "global_step": 371428, "epoch": 2210} {"train_loss": -12.426491737365723, "global_step": 371429, "epoch": 2210} {"train_loss": -12.346810340881348, "global_step": 371430, "epoch": 2210} {"train_loss": -12.739075660705566, "global_step": 371431, "epoch": 2210} {"train_loss": -12.48135757446289, "global_step": 371432, "epoch": 2210} {"train_loss": -12.608444213867188, "global_step": 371433, "epoch": 2210} {"train_loss": -12.57076644897461, "global_step": 371434, "epoch": 2210} {"train_loss": -12.228195190429688, "global_step": 371435, "epoch": 2210} {"train_loss": -12.214792251586914, "global_step": 371436, "epoch": 2210} {"train_loss": -11.692840576171875, "global_step": 371437, "epoch": 2210} {"train_loss": -11.285394668579102, "global_step": 371438, "epoch": 2210} {"train_loss": -12.456953048706055, "global_step": 371439, "epoch": 2210} {"train_loss": -11.787867546081543, "global_step": 371440, "epoch": 2210} {"train_loss": -11.372340202331543, "global_step": 371441, "epoch": 2210} {"train_loss": -11.47572135925293, "global_step": 371442, "epoch": 2210} {"train_loss": -11.652661323547363, "global_step": 371443, "epoch": 2210} {"train_loss": -11.794839859008789, "global_step": 371444, "epoch": 2210} {"train_loss": -11.836771965026855, "global_step": 371445, "epoch": 2210} {"train_loss": -11.485906600952148, "global_step": 371446, "epoch": 2210} {"train_loss": -11.888332514535813, "global_step": 371447, "epoch": 2210, "val_loss": 293200.375, "train_action_mse_error": 0.5502168536186218} {"train_loss": -11.74355411529541, "global_step": 371448, "epoch": 2211} {"train_loss": -11.736209869384766, "global_step": 371449, "epoch": 2211} {"train_loss": -11.603591918945312, "global_step": 371450, "epoch": 2211} {"train_loss": -11.808719635009766, "global_step": 371451, "epoch": 2211} {"train_loss": -10.749163627624512, "global_step": 371452, "epoch": 2211} {"train_loss": -11.683727264404297, "global_step": 371453, "epoch": 2211} {"train_loss": -11.350709915161133, "global_step": 371454, "epoch": 2211} {"train_loss": -10.379188537597656, "global_step": 371455, "epoch": 2211} {"train_loss": -11.33155345916748, "global_step": 371456, "epoch": 2211} {"train_loss": -11.076658248901367, "global_step": 371457, "epoch": 2211} {"train_loss": -10.366764068603516, "global_step": 371458, "epoch": 2211} {"train_loss": -10.083642959594727, "global_step": 371459, "epoch": 2211} {"train_loss": -12.00936222076416, "global_step": 371460, "epoch": 2211} {"train_loss": -10.210034370422363, "global_step": 371461, "epoch": 2211} {"train_loss": -9.777242660522461, "global_step": 371462, "epoch": 2211} {"train_loss": -11.330190658569336, "global_step": 371463, "epoch": 2211} {"train_loss": -9.884953498840332, "global_step": 371464, "epoch": 2211} {"train_loss": -10.803794860839844, "global_step": 371465, "epoch": 2211} {"train_loss": -10.256072998046875, "global_step": 371466, "epoch": 2211} {"train_loss": -11.580299377441406, "global_step": 371467, "epoch": 2211} {"train_loss": -10.238832473754883, "global_step": 371468, "epoch": 2211} {"train_loss": -11.344642639160156, "global_step": 371469, "epoch": 2211} {"train_loss": -10.771621704101562, "global_step": 371470, "epoch": 2211} {"train_loss": -11.372901916503906, "global_step": 371471, "epoch": 2211} {"train_loss": -11.108125686645508, "global_step": 371472, "epoch": 2211} {"train_loss": -11.980423927307129, "global_step": 371473, "epoch": 2211} {"train_loss": -11.474191665649414, "global_step": 371474, "epoch": 2211} {"train_loss": -11.729120254516602, "global_step": 371475, "epoch": 2211} {"train_loss": -11.883874893188477, "global_step": 371476, "epoch": 2211} {"train_loss": -11.652690887451172, "global_step": 371477, "epoch": 2211} {"train_loss": -12.064713478088379, "global_step": 371478, "epoch": 2211} {"train_loss": -11.66343879699707, "global_step": 371479, "epoch": 2211} {"train_loss": -11.557579040527344, "global_step": 371480, "epoch": 2211} {"train_loss": -11.984603881835938, "global_step": 371481, "epoch": 2211} {"train_loss": -12.011007308959961, "global_step": 371482, "epoch": 2211} {"train_loss": -12.297286033630371, "global_step": 371483, "epoch": 2211} {"train_loss": -12.113018035888672, "global_step": 371484, "epoch": 2211} {"train_loss": -12.03258991241455, "global_step": 371485, "epoch": 2211} {"train_loss": -12.228633880615234, "global_step": 371486, "epoch": 2211} {"train_loss": -12.36263656616211, "global_step": 371487, "epoch": 2211} {"train_loss": -12.08651351928711, "global_step": 371488, "epoch": 2211} {"train_loss": -12.300858497619629, "global_step": 371489, "epoch": 2211} {"train_loss": -12.275243759155273, "global_step": 371490, "epoch": 2211} {"train_loss": -12.160597801208496, "global_step": 371491, "epoch": 2211} {"train_loss": -12.052431106567383, "global_step": 371492, "epoch": 2211} {"train_loss": -12.433956146240234, "global_step": 371493, "epoch": 2211} {"train_loss": -12.328752517700195, "global_step": 371494, "epoch": 2211} {"train_loss": -12.298648834228516, "global_step": 371495, "epoch": 2211} {"train_loss": -12.375579833984375, "global_step": 371496, "epoch": 2211} {"train_loss": -12.414999008178711, "global_step": 371497, "epoch": 2211} {"train_loss": -12.299047470092773, "global_step": 371498, "epoch": 2211} {"train_loss": -12.561140060424805, "global_step": 371499, "epoch": 2211} {"train_loss": -12.389970779418945, "global_step": 371500, "epoch": 2211} {"train_loss": -12.42242431640625, "global_step": 371501, "epoch": 2211} {"train_loss": -12.24763298034668, "global_step": 371502, "epoch": 2211} {"train_loss": -12.442535400390625, "global_step": 371503, "epoch": 2211} {"train_loss": -12.143952369689941, "global_step": 371504, "epoch": 2211} {"train_loss": -12.540802955627441, "global_step": 371505, "epoch": 2211} {"train_loss": -12.370210647583008, "global_step": 371506, "epoch": 2211} {"train_loss": -12.204192161560059, "global_step": 371507, "epoch": 2211} {"train_loss": -12.283916473388672, "global_step": 371508, "epoch": 2211} {"train_loss": -12.55162239074707, "global_step": 371509, "epoch": 2211} {"train_loss": -12.554740905761719, "global_step": 371510, "epoch": 2211} {"train_loss": -12.578542709350586, "global_step": 371511, "epoch": 2211} {"train_loss": -12.485326766967773, "global_step": 371512, "epoch": 2211} {"train_loss": -12.508806228637695, "global_step": 371513, "epoch": 2211} {"train_loss": -12.476848602294922, "global_step": 371514, "epoch": 2211} {"train_loss": -12.528797149658203, "global_step": 371515, "epoch": 2211} {"train_loss": -12.672590255737305, "global_step": 371516, "epoch": 2211} {"train_loss": -12.371687889099121, "global_step": 371517, "epoch": 2211} {"train_loss": -12.505494117736816, "global_step": 371518, "epoch": 2211} {"train_loss": -12.319863319396973, "global_step": 371519, "epoch": 2211} {"train_loss": -12.441617012023926, "global_step": 371520, "epoch": 2211} {"train_loss": -12.661115646362305, "global_step": 371521, "epoch": 2211} {"train_loss": -12.506376266479492, "global_step": 371522, "epoch": 2211} {"train_loss": -12.71468448638916, "global_step": 371523, "epoch": 2211} {"train_loss": -12.597540855407715, "global_step": 371524, "epoch": 2211} {"train_loss": -12.539639472961426, "global_step": 371525, "epoch": 2211} {"train_loss": -12.609922409057617, "global_step": 371526, "epoch": 2211} {"train_loss": -12.600342750549316, "global_step": 371527, "epoch": 2211} {"train_loss": -12.449732780456543, "global_step": 371528, "epoch": 2211} {"train_loss": -12.634503364562988, "global_step": 371529, "epoch": 2211} {"train_loss": -12.543746948242188, "global_step": 371530, "epoch": 2211} {"train_loss": -12.262121200561523, "global_step": 371531, "epoch": 2211} {"train_loss": -12.794797897338867, "global_step": 371532, "epoch": 2211} {"train_loss": -12.691093444824219, "global_step": 371533, "epoch": 2211} {"train_loss": -12.571406364440918, "global_step": 371534, "epoch": 2211} {"train_loss": -12.820880889892578, "global_step": 371535, "epoch": 2211} {"train_loss": -12.70985221862793, "global_step": 371536, "epoch": 2211} {"train_loss": -12.583868980407715, "global_step": 371537, "epoch": 2211} {"train_loss": -12.640565872192383, "global_step": 371538, "epoch": 2211} {"train_loss": -12.62198257446289, "global_step": 371539, "epoch": 2211} {"train_loss": -12.419532775878906, "global_step": 371540, "epoch": 2211} {"train_loss": -12.600772857666016, "global_step": 371541, "epoch": 2211} {"train_loss": -12.541759490966797, "global_step": 371542, "epoch": 2211} {"train_loss": -12.629755020141602, "global_step": 371543, "epoch": 2211} {"train_loss": -12.788025856018066, "global_step": 371544, "epoch": 2211} {"train_loss": -12.531229019165039, "global_step": 371545, "epoch": 2211} {"train_loss": -12.518070220947266, "global_step": 371546, "epoch": 2211} {"train_loss": -12.582730293273926, "global_step": 371547, "epoch": 2211} {"train_loss": -12.310906410217285, "global_step": 371548, "epoch": 2211} {"train_loss": -12.373022079467773, "global_step": 371549, "epoch": 2211} {"train_loss": -12.595104217529297, "global_step": 371550, "epoch": 2211} {"train_loss": -12.666702270507812, "global_step": 371551, "epoch": 2211} {"train_loss": -12.611800193786621, "global_step": 371552, "epoch": 2211} {"train_loss": -12.609071731567383, "global_step": 371553, "epoch": 2211} {"train_loss": -12.586854934692383, "global_step": 371554, "epoch": 2211} {"train_loss": -12.726482391357422, "global_step": 371555, "epoch": 2211} {"train_loss": -12.270707130432129, "global_step": 371556, "epoch": 2211} {"train_loss": -11.922483444213867, "global_step": 371557, "epoch": 2211} {"train_loss": -12.473750114440918, "global_step": 371558, "epoch": 2211} {"train_loss": -12.801197052001953, "global_step": 371559, "epoch": 2211} {"train_loss": -12.17360782623291, "global_step": 371560, "epoch": 2211} {"train_loss": -11.622297286987305, "global_step": 371561, "epoch": 2211} {"train_loss": -12.309425354003906, "global_step": 371562, "epoch": 2211} {"train_loss": -12.618600845336914, "global_step": 371563, "epoch": 2211} {"train_loss": -12.523880958557129, "global_step": 371564, "epoch": 2211} {"train_loss": -11.555042266845703, "global_step": 371565, "epoch": 2211} {"train_loss": -12.106831550598145, "global_step": 371566, "epoch": 2211} {"train_loss": -13.015005111694336, "global_step": 371567, "epoch": 2211} {"train_loss": -11.985658645629883, "global_step": 371568, "epoch": 2211} {"train_loss": -12.136781692504883, "global_step": 371569, "epoch": 2211} {"train_loss": -12.353880882263184, "global_step": 371570, "epoch": 2211} {"train_loss": -12.438455581665039, "global_step": 371571, "epoch": 2211} {"train_loss": -12.669961929321289, "global_step": 371572, "epoch": 2211} {"train_loss": -12.493459701538086, "global_step": 371573, "epoch": 2211} {"train_loss": -12.535833358764648, "global_step": 371574, "epoch": 2211} {"train_loss": -12.141401290893555, "global_step": 371575, "epoch": 2211} {"train_loss": -12.228596687316895, "global_step": 371576, "epoch": 2211} {"train_loss": -12.56834888458252, "global_step": 371577, "epoch": 2211} {"train_loss": -12.74178695678711, "global_step": 371578, "epoch": 2211} {"train_loss": -12.327672958374023, "global_step": 371579, "epoch": 2211} {"train_loss": -12.13177490234375, "global_step": 371580, "epoch": 2211} {"train_loss": -12.379424095153809, "global_step": 371581, "epoch": 2211} {"train_loss": -12.410825729370117, "global_step": 371582, "epoch": 2211} {"train_loss": -12.540350914001465, "global_step": 371583, "epoch": 2211} {"train_loss": -12.045811653137207, "global_step": 371584, "epoch": 2211} {"train_loss": -12.657133102416992, "global_step": 371585, "epoch": 2211} {"train_loss": -12.34339714050293, "global_step": 371586, "epoch": 2211} {"train_loss": -12.65131664276123, "global_step": 371587, "epoch": 2211} {"train_loss": -12.129590034484863, "global_step": 371588, "epoch": 2211} {"train_loss": -11.564841270446777, "global_step": 371589, "epoch": 2211} {"train_loss": -11.691420555114746, "global_step": 371590, "epoch": 2211} {"train_loss": -12.127767562866211, "global_step": 371591, "epoch": 2211} {"train_loss": -11.26208209991455, "global_step": 371592, "epoch": 2211} {"train_loss": -8.054424285888672, "global_step": 371593, "epoch": 2211} {"train_loss": -10.793827056884766, "global_step": 371594, "epoch": 2211} {"train_loss": -7.268108367919922, "global_step": 371595, "epoch": 2211} {"train_loss": -8.946565628051758, "global_step": 371596, "epoch": 2211} {"train_loss": -8.806039810180664, "global_step": 371597, "epoch": 2211} {"train_loss": -9.755029678344727, "global_step": 371598, "epoch": 2211} {"train_loss": -9.848000526428223, "global_step": 371599, "epoch": 2211} {"train_loss": -9.705923080444336, "global_step": 371600, "epoch": 2211} {"train_loss": -9.250170707702637, "global_step": 371601, "epoch": 2211} {"train_loss": -10.352311134338379, "global_step": 371602, "epoch": 2211} {"train_loss": -10.268433570861816, "global_step": 371603, "epoch": 2211} {"train_loss": -9.89329719543457, "global_step": 371604, "epoch": 2211} {"train_loss": -10.249693870544434, "global_step": 371605, "epoch": 2211} {"train_loss": -10.105352401733398, "global_step": 371606, "epoch": 2211} {"train_loss": -10.351442337036133, "global_step": 371607, "epoch": 2211} {"train_loss": -10.354717254638672, "global_step": 371608, "epoch": 2211} {"train_loss": -11.120771408081055, "global_step": 371609, "epoch": 2211} {"train_loss": -10.725408554077148, "global_step": 371610, "epoch": 2211} {"train_loss": -10.766417503356934, "global_step": 371611, "epoch": 2211} {"train_loss": -11.40456771850586, "global_step": 371612, "epoch": 2211} {"train_loss": -11.168573379516602, "global_step": 371613, "epoch": 2211} {"train_loss": -11.315271377563477, "global_step": 371614, "epoch": 2211} {"train_loss": -11.833508570988974, "global_step": 371615, "epoch": 2211, "val_loss": 281495.25} {"train_loss": -10.148885726928711, "global_step": 371616, "epoch": 2212} {"train_loss": -11.499300956726074, "global_step": 371617, "epoch": 2212} {"train_loss": -10.133848190307617, "global_step": 371618, "epoch": 2212} {"train_loss": -10.956775665283203, "global_step": 371619, "epoch": 2212} {"train_loss": -10.266376495361328, "global_step": 371620, "epoch": 2212} {"train_loss": -10.3988037109375, "global_step": 371621, "epoch": 2212} {"train_loss": -10.2747802734375, "global_step": 371622, "epoch": 2212} {"train_loss": -9.546588897705078, "global_step": 371623, "epoch": 2212} {"train_loss": -10.257790565490723, "global_step": 371624, "epoch": 2212} {"train_loss": -10.50200080871582, "global_step": 371625, "epoch": 2212} {"train_loss": -10.531862258911133, "global_step": 371626, "epoch": 2212} {"train_loss": -10.836624145507812, "global_step": 371627, "epoch": 2212} {"train_loss": -10.221794128417969, "global_step": 371628, "epoch": 2212} {"train_loss": -10.606294631958008, "global_step": 371629, "epoch": 2212} {"train_loss": -10.460929870605469, "global_step": 371630, "epoch": 2212} {"train_loss": -11.397449493408203, "global_step": 371631, "epoch": 2212} {"train_loss": -10.447507858276367, "global_step": 371632, "epoch": 2212} {"train_loss": -10.711441040039062, "global_step": 371633, "epoch": 2212} {"train_loss": -10.681519508361816, "global_step": 371634, "epoch": 2212} {"train_loss": -10.412044525146484, "global_step": 371635, "epoch": 2212} {"train_loss": -10.444700241088867, "global_step": 371636, "epoch": 2212} {"train_loss": -11.498948097229004, "global_step": 371637, "epoch": 2212} {"train_loss": -10.432138442993164, "global_step": 371638, "epoch": 2212} {"train_loss": -11.17538833618164, "global_step": 371639, "epoch": 2212} {"train_loss": -10.938758850097656, "global_step": 371640, "epoch": 2212} {"train_loss": -11.633700370788574, "global_step": 371641, "epoch": 2212} {"train_loss": -10.925522804260254, "global_step": 371642, "epoch": 2212} {"train_loss": -11.631879806518555, "global_step": 371643, "epoch": 2212} {"train_loss": -11.683122634887695, "global_step": 371644, "epoch": 2212} {"train_loss": -11.462981224060059, "global_step": 371645, "epoch": 2212} {"train_loss": -11.581716537475586, "global_step": 371646, "epoch": 2212} {"train_loss": -11.514087677001953, "global_step": 371647, "epoch": 2212} {"train_loss": -11.295276641845703, "global_step": 371648, "epoch": 2212} {"train_loss": -11.984345436096191, "global_step": 371649, "epoch": 2212} {"train_loss": -11.403080940246582, "global_step": 371650, "epoch": 2212} {"train_loss": -11.999417304992676, "global_step": 371651, "epoch": 2212} {"train_loss": -11.44067668914795, "global_step": 371652, "epoch": 2212} {"train_loss": -12.067879676818848, "global_step": 371653, "epoch": 2212} {"train_loss": -12.09089469909668, "global_step": 371654, "epoch": 2212} {"train_loss": -11.906181335449219, "global_step": 371655, "epoch": 2212} {"train_loss": -11.786932945251465, "global_step": 371656, "epoch": 2212} {"train_loss": -11.949009895324707, "global_step": 371657, "epoch": 2212} {"train_loss": -12.053890228271484, "global_step": 371658, "epoch": 2212} {"train_loss": -11.98549747467041, "global_step": 371659, "epoch": 2212} {"train_loss": -12.05841064453125, "global_step": 371660, "epoch": 2212} {"train_loss": -12.09035873413086, "global_step": 371661, "epoch": 2212} {"train_loss": -11.869961738586426, "global_step": 371662, "epoch": 2212} {"train_loss": -12.30755615234375, "global_step": 371663, "epoch": 2212} {"train_loss": -12.064434051513672, "global_step": 371664, "epoch": 2212} {"train_loss": -12.156814575195312, "global_step": 371665, "epoch": 2212} {"train_loss": -11.948101997375488, "global_step": 371666, "epoch": 2212} {"train_loss": -12.114140510559082, "global_step": 371667, "epoch": 2212} {"train_loss": -12.10682487487793, "global_step": 371668, "epoch": 2212} {"train_loss": -12.296914100646973, "global_step": 371669, "epoch": 2212} {"train_loss": -12.082620620727539, "global_step": 371670, "epoch": 2212} {"train_loss": -12.306519508361816, "global_step": 371671, "epoch": 2212} {"train_loss": -12.005146026611328, "global_step": 371672, "epoch": 2212} {"train_loss": -12.386556625366211, "global_step": 371673, "epoch": 2212} {"train_loss": -12.211237907409668, "global_step": 371674, "epoch": 2212} {"train_loss": -12.231952667236328, "global_step": 371675, "epoch": 2212} {"train_loss": -12.145242691040039, "global_step": 371676, "epoch": 2212} {"train_loss": -12.117849349975586, "global_step": 371677, "epoch": 2212} {"train_loss": -12.039608001708984, "global_step": 371678, "epoch": 2212} {"train_loss": -12.24599838256836, "global_step": 371679, "epoch": 2212} {"train_loss": -12.214522361755371, "global_step": 371680, "epoch": 2212} {"train_loss": -12.217710494995117, "global_step": 371681, "epoch": 2212} {"train_loss": -12.171321868896484, "global_step": 371682, "epoch": 2212} {"train_loss": -12.377981185913086, "global_step": 371683, "epoch": 2212} {"train_loss": -12.461490631103516, "global_step": 371684, "epoch": 2212} {"train_loss": -12.56217098236084, "global_step": 371685, "epoch": 2212} {"train_loss": -12.153667449951172, "global_step": 371686, "epoch": 2212} {"train_loss": -12.301499366760254, "global_step": 371687, "epoch": 2212} {"train_loss": -12.487037658691406, "global_step": 371688, "epoch": 2212} {"train_loss": -12.447991371154785, "global_step": 371689, "epoch": 2212} {"train_loss": -12.309295654296875, "global_step": 371690, "epoch": 2212} {"train_loss": -12.351577758789062, "global_step": 371691, "epoch": 2212} {"train_loss": -12.36749267578125, "global_step": 371692, "epoch": 2212} {"train_loss": -12.263795852661133, "global_step": 371693, "epoch": 2212} {"train_loss": -12.607855796813965, "global_step": 371694, "epoch": 2212} {"train_loss": -12.254920959472656, "global_step": 371695, "epoch": 2212} {"train_loss": -12.667684555053711, "global_step": 371696, "epoch": 2212} {"train_loss": -12.374919891357422, "global_step": 371697, "epoch": 2212} {"train_loss": -12.33680534362793, "global_step": 371698, "epoch": 2212} {"train_loss": -12.458480834960938, "global_step": 371699, "epoch": 2212} {"train_loss": -12.365936279296875, "global_step": 371700, "epoch": 2212} {"train_loss": -12.466970443725586, "global_step": 371701, "epoch": 2212} {"train_loss": -12.457093238830566, "global_step": 371702, "epoch": 2212} {"train_loss": -12.353391647338867, "global_step": 371703, "epoch": 2212} {"train_loss": -12.483379364013672, "global_step": 371704, "epoch": 2212} {"train_loss": -12.433069229125977, "global_step": 371705, "epoch": 2212} {"train_loss": -12.38934326171875, "global_step": 371706, "epoch": 2212} {"train_loss": -12.544021606445312, "global_step": 371707, "epoch": 2212} {"train_loss": -12.257047653198242, "global_step": 371708, "epoch": 2212} {"train_loss": -12.506795883178711, "global_step": 371709, "epoch": 2212} {"train_loss": -12.533323287963867, "global_step": 371710, "epoch": 2212} {"train_loss": -12.023748397827148, "global_step": 371711, "epoch": 2212} {"train_loss": -12.620450973510742, "global_step": 371712, "epoch": 2212} {"train_loss": -12.363485336303711, "global_step": 371713, "epoch": 2212} {"train_loss": -12.248391151428223, "global_step": 371714, "epoch": 2212} {"train_loss": -12.65553092956543, "global_step": 371715, "epoch": 2212} {"train_loss": -12.362171173095703, "global_step": 371716, "epoch": 2212} {"train_loss": -12.331924438476562, "global_step": 371717, "epoch": 2212} {"train_loss": -12.205074310302734, "global_step": 371718, "epoch": 2212} {"train_loss": -11.94019603729248, "global_step": 371719, "epoch": 2212} {"train_loss": -12.243989944458008, "global_step": 371720, "epoch": 2212} {"train_loss": -12.174663543701172, "global_step": 371721, "epoch": 2212} {"train_loss": -11.9302978515625, "global_step": 371722, "epoch": 2212} {"train_loss": -12.516111373901367, "global_step": 371723, "epoch": 2212} {"train_loss": -12.00327205657959, "global_step": 371724, "epoch": 2212} {"train_loss": -12.290044784545898, "global_step": 371725, "epoch": 2212} {"train_loss": -12.447330474853516, "global_step": 371726, "epoch": 2212} {"train_loss": -12.184638977050781, "global_step": 371727, "epoch": 2212} {"train_loss": -12.386978149414062, "global_step": 371728, "epoch": 2212} {"train_loss": -12.337514877319336, "global_step": 371729, "epoch": 2212} {"train_loss": -11.979217529296875, "global_step": 371730, "epoch": 2212} {"train_loss": -12.288637161254883, "global_step": 371731, "epoch": 2212} {"train_loss": -12.233480453491211, "global_step": 371732, "epoch": 2212} {"train_loss": -12.27834701538086, "global_step": 371733, "epoch": 2212} {"train_loss": -12.288206100463867, "global_step": 371734, "epoch": 2212} {"train_loss": -11.940441131591797, "global_step": 371735, "epoch": 2212} {"train_loss": -12.021848678588867, "global_step": 371736, "epoch": 2212} {"train_loss": -12.08395767211914, "global_step": 371737, "epoch": 2212} {"train_loss": -11.998326301574707, "global_step": 371738, "epoch": 2212} {"train_loss": -12.331686019897461, "global_step": 371739, "epoch": 2212} {"train_loss": -12.158820152282715, "global_step": 371740, "epoch": 2212} {"train_loss": -12.273098945617676, "global_step": 371741, "epoch": 2212} {"train_loss": -11.8632230758667, "global_step": 371742, "epoch": 2212} {"train_loss": -12.55616569519043, "global_step": 371743, "epoch": 2212} {"train_loss": -12.02000617980957, "global_step": 371744, "epoch": 2212} {"train_loss": -12.53746223449707, "global_step": 371745, "epoch": 2212} {"train_loss": -12.13962173461914, "global_step": 371746, "epoch": 2212} {"train_loss": -12.472049713134766, "global_step": 371747, "epoch": 2212} {"train_loss": -12.196964263916016, "global_step": 371748, "epoch": 2212} {"train_loss": -12.14240837097168, "global_step": 371749, "epoch": 2212} {"train_loss": -12.392838478088379, "global_step": 371750, "epoch": 2212} {"train_loss": -12.30799674987793, "global_step": 371751, "epoch": 2212} {"train_loss": -12.247337341308594, "global_step": 371752, "epoch": 2212} {"train_loss": -12.243547439575195, "global_step": 371753, "epoch": 2212} {"train_loss": -12.456737518310547, "global_step": 371754, "epoch": 2212} {"train_loss": -12.3887939453125, "global_step": 371755, "epoch": 2212} {"train_loss": -12.20445442199707, "global_step": 371756, "epoch": 2212} {"train_loss": -12.481792449951172, "global_step": 371757, "epoch": 2212} {"train_loss": -12.49066162109375, "global_step": 371758, "epoch": 2212} {"train_loss": -12.113971710205078, "global_step": 371759, "epoch": 2212} {"train_loss": -12.185123443603516, "global_step": 371760, "epoch": 2212} {"train_loss": -12.341455459594727, "global_step": 371761, "epoch": 2212} {"train_loss": -10.896261215209961, "global_step": 371762, "epoch": 2212} {"train_loss": -11.657051086425781, "global_step": 371763, "epoch": 2212} {"train_loss": -12.063080787658691, "global_step": 371764, "epoch": 2212} {"train_loss": -11.994855880737305, "global_step": 371765, "epoch": 2212} {"train_loss": -11.737112998962402, "global_step": 371766, "epoch": 2212} {"train_loss": -11.736190795898438, "global_step": 371767, "epoch": 2212} {"train_loss": -12.47105884552002, "global_step": 371768, "epoch": 2212} {"train_loss": -11.889458656311035, "global_step": 371769, "epoch": 2212} {"train_loss": -11.524572372436523, "global_step": 371770, "epoch": 2212} {"train_loss": -11.851934432983398, "global_step": 371771, "epoch": 2212} {"train_loss": -12.246976852416992, "global_step": 371772, "epoch": 2212} {"train_loss": -11.995909690856934, "global_step": 371773, "epoch": 2212} {"train_loss": -11.468782424926758, "global_step": 371774, "epoch": 2212} {"train_loss": -12.444432258605957, "global_step": 371775, "epoch": 2212} {"train_loss": -11.962437629699707, "global_step": 371776, "epoch": 2212} {"train_loss": -11.960319519042969, "global_step": 371777, "epoch": 2212} {"train_loss": -12.16742992401123, "global_step": 371778, "epoch": 2212} {"train_loss": -11.29179573059082, "global_step": 371779, "epoch": 2212} {"train_loss": -11.620901107788086, "global_step": 371780, "epoch": 2212} {"train_loss": -12.693016052246094, "global_step": 371781, "epoch": 2212} {"train_loss": -11.660391807556152, "global_step": 371782, "epoch": 2212} {"train_loss": -11.906869434175038, "global_step": 371783, "epoch": 2212, "val_loss": 289700.15625} {"train_loss": -12.499580383300781, "global_step": 371784, "epoch": 2213} {"train_loss": -12.096956253051758, "global_step": 371785, "epoch": 2213} {"train_loss": -12.431107521057129, "global_step": 371786, "epoch": 2213} {"train_loss": -12.248014450073242, "global_step": 371787, "epoch": 2213} {"train_loss": -12.151926040649414, "global_step": 371788, "epoch": 2213} {"train_loss": -12.152030944824219, "global_step": 371789, "epoch": 2213} {"train_loss": -12.025318145751953, "global_step": 371790, "epoch": 2213} {"train_loss": -12.360376358032227, "global_step": 371791, "epoch": 2213} {"train_loss": -11.84619140625, "global_step": 371792, "epoch": 2213} {"train_loss": -12.463883399963379, "global_step": 371793, "epoch": 2213} {"train_loss": -11.967582702636719, "global_step": 371794, "epoch": 2213} {"train_loss": -12.202733039855957, "global_step": 371795, "epoch": 2213} {"train_loss": -12.001995086669922, "global_step": 371796, "epoch": 2213} {"train_loss": -12.148597717285156, "global_step": 371797, "epoch": 2213} {"train_loss": -12.094791412353516, "global_step": 371798, "epoch": 2213} {"train_loss": -12.48074722290039, "global_step": 371799, "epoch": 2213} {"train_loss": -12.211021423339844, "global_step": 371800, "epoch": 2213} {"train_loss": -12.294764518737793, "global_step": 371801, "epoch": 2213} {"train_loss": -12.342378616333008, "global_step": 371802, "epoch": 2213} {"train_loss": -12.361242294311523, "global_step": 371803, "epoch": 2213} {"train_loss": -12.213807106018066, "global_step": 371804, "epoch": 2213} {"train_loss": -11.518239974975586, "global_step": 371805, "epoch": 2213} {"train_loss": -12.409713745117188, "global_step": 371806, "epoch": 2213} {"train_loss": -11.540592193603516, "global_step": 371807, "epoch": 2213} {"train_loss": -12.375245094299316, "global_step": 371808, "epoch": 2213} {"train_loss": -11.747518539428711, "global_step": 371809, "epoch": 2213} {"train_loss": -12.260287284851074, "global_step": 371810, "epoch": 2213} {"train_loss": -12.376466751098633, "global_step": 371811, "epoch": 2213} {"train_loss": -12.37546443939209, "global_step": 371812, "epoch": 2213} {"train_loss": -12.352909088134766, "global_step": 371813, "epoch": 2213} {"train_loss": -12.485099792480469, "global_step": 371814, "epoch": 2213} {"train_loss": -12.248023986816406, "global_step": 371815, "epoch": 2213} {"train_loss": -12.750988006591797, "global_step": 371816, "epoch": 2213} {"train_loss": -12.008796691894531, "global_step": 371817, "epoch": 2213} {"train_loss": -12.329604148864746, "global_step": 371818, "epoch": 2213} {"train_loss": -12.040945053100586, "global_step": 371819, "epoch": 2213} {"train_loss": -12.44616413116455, "global_step": 371820, "epoch": 2213} {"train_loss": -12.317840576171875, "global_step": 371821, "epoch": 2213} {"train_loss": -12.378049850463867, "global_step": 371822, "epoch": 2213} {"train_loss": -12.371883392333984, "global_step": 371823, "epoch": 2213} {"train_loss": -12.692121505737305, "global_step": 371824, "epoch": 2213} {"train_loss": -12.260652542114258, "global_step": 371825, "epoch": 2213} {"train_loss": -12.75364875793457, "global_step": 371826, "epoch": 2213} {"train_loss": -12.447549819946289, "global_step": 371827, "epoch": 2213} {"train_loss": -12.047224044799805, "global_step": 371828, "epoch": 2213} {"train_loss": -12.26759147644043, "global_step": 371829, "epoch": 2213} {"train_loss": -12.086523056030273, "global_step": 371830, "epoch": 2213} {"train_loss": -12.789358139038086, "global_step": 371831, "epoch": 2213} {"train_loss": -12.568321228027344, "global_step": 371832, "epoch": 2213} {"train_loss": -12.591747283935547, "global_step": 371833, "epoch": 2213} {"train_loss": -12.55949592590332, "global_step": 371834, "epoch": 2213} {"train_loss": -12.328574180603027, "global_step": 371835, "epoch": 2213} {"train_loss": -12.625524520874023, "global_step": 371836, "epoch": 2213} {"train_loss": -12.321176528930664, "global_step": 371837, "epoch": 2213} {"train_loss": -12.608962059020996, "global_step": 371838, "epoch": 2213} {"train_loss": -12.193829536437988, "global_step": 371839, "epoch": 2213} {"train_loss": -12.82778549194336, "global_step": 371840, "epoch": 2213} {"train_loss": -12.321956634521484, "global_step": 371841, "epoch": 2213} {"train_loss": -12.306833267211914, "global_step": 371842, "epoch": 2213} {"train_loss": -12.424348831176758, "global_step": 371843, "epoch": 2213} {"train_loss": -12.2755126953125, "global_step": 371844, "epoch": 2213} {"train_loss": -12.441593170166016, "global_step": 371845, "epoch": 2213} {"train_loss": -12.422975540161133, "global_step": 371846, "epoch": 2213} {"train_loss": -12.074054718017578, "global_step": 371847, "epoch": 2213} {"train_loss": -12.64242172241211, "global_step": 371848, "epoch": 2213} {"train_loss": -12.63366413116455, "global_step": 371849, "epoch": 2213} {"train_loss": -12.757770538330078, "global_step": 371850, "epoch": 2213} {"train_loss": -12.171201705932617, "global_step": 371851, "epoch": 2213} {"train_loss": -12.737909317016602, "global_step": 371852, "epoch": 2213} {"train_loss": -12.59035873413086, "global_step": 371853, "epoch": 2213} {"train_loss": -12.668697357177734, "global_step": 371854, "epoch": 2213} {"train_loss": -12.847942352294922, "global_step": 371855, "epoch": 2213} {"train_loss": -12.757308959960938, "global_step": 371856, "epoch": 2213} {"train_loss": -12.483835220336914, "global_step": 371857, "epoch": 2213} {"train_loss": -12.032146453857422, "global_step": 371858, "epoch": 2213} {"train_loss": -12.518014907836914, "global_step": 371859, "epoch": 2213} {"train_loss": -12.194925308227539, "global_step": 371860, "epoch": 2213} {"train_loss": -12.466289520263672, "global_step": 371861, "epoch": 2213} {"train_loss": -12.162220001220703, "global_step": 371862, "epoch": 2213} {"train_loss": -12.808343887329102, "global_step": 371863, "epoch": 2213} {"train_loss": -11.952507019042969, "global_step": 371864, "epoch": 2213} {"train_loss": -10.877309799194336, "global_step": 371865, "epoch": 2213} {"train_loss": -11.455965042114258, "global_step": 371866, "epoch": 2213} {"train_loss": -11.759648323059082, "global_step": 371867, "epoch": 2213} {"train_loss": -12.025848388671875, "global_step": 371868, "epoch": 2213} {"train_loss": -12.054365158081055, "global_step": 371869, "epoch": 2213} {"train_loss": -12.176225662231445, "global_step": 371870, "epoch": 2213} {"train_loss": -12.130306243896484, "global_step": 371871, "epoch": 2213} {"train_loss": -11.61739730834961, "global_step": 371872, "epoch": 2213} {"train_loss": -11.721048355102539, "global_step": 371873, "epoch": 2213} {"train_loss": -10.648029327392578, "global_step": 371874, "epoch": 2213} {"train_loss": -11.662872314453125, "global_step": 371875, "epoch": 2213} {"train_loss": -12.052591323852539, "global_step": 371876, "epoch": 2213} {"train_loss": -12.156108856201172, "global_step": 371877, "epoch": 2213} {"train_loss": -10.856794357299805, "global_step": 371878, "epoch": 2213} {"train_loss": -11.91626262664795, "global_step": 371879, "epoch": 2213} {"train_loss": -11.781618118286133, "global_step": 371880, "epoch": 2213} {"train_loss": -11.046500205993652, "global_step": 371881, "epoch": 2213} {"train_loss": -11.294404983520508, "global_step": 371882, "epoch": 2213} {"train_loss": -11.93210506439209, "global_step": 371883, "epoch": 2213} {"train_loss": -11.309286117553711, "global_step": 371884, "epoch": 2213} {"train_loss": -11.455625534057617, "global_step": 371885, "epoch": 2213} {"train_loss": -11.2617769241333, "global_step": 371886, "epoch": 2213} {"train_loss": -11.40130615234375, "global_step": 371887, "epoch": 2213} {"train_loss": -11.393330574035645, "global_step": 371888, "epoch": 2213} {"train_loss": -10.34351921081543, "global_step": 371889, "epoch": 2213} {"train_loss": -10.573719024658203, "global_step": 371890, "epoch": 2213} {"train_loss": -11.268434524536133, "global_step": 371891, "epoch": 2213} {"train_loss": -10.40051555633545, "global_step": 371892, "epoch": 2213} {"train_loss": -10.413142204284668, "global_step": 371893, "epoch": 2213} {"train_loss": -11.139577865600586, "global_step": 371894, "epoch": 2213} {"train_loss": -10.93405532836914, "global_step": 371895, "epoch": 2213} {"train_loss": -11.990973472595215, "global_step": 371896, "epoch": 2213} {"train_loss": -11.294134140014648, "global_step": 371897, "epoch": 2213} {"train_loss": -11.739387512207031, "global_step": 371898, "epoch": 2213} {"train_loss": -11.785890579223633, "global_step": 371899, "epoch": 2213} {"train_loss": -11.875662803649902, "global_step": 371900, "epoch": 2213} {"train_loss": -11.73670768737793, "global_step": 371901, "epoch": 2213} {"train_loss": -11.791865348815918, "global_step": 371902, "epoch": 2213} {"train_loss": -12.246438980102539, "global_step": 371903, "epoch": 2213} {"train_loss": -11.987452507019043, "global_step": 371904, "epoch": 2213} {"train_loss": -12.206865310668945, "global_step": 371905, "epoch": 2213} {"train_loss": -11.977903366088867, "global_step": 371906, "epoch": 2213} {"train_loss": -12.254745483398438, "global_step": 371907, "epoch": 2213} {"train_loss": -12.237690925598145, "global_step": 371908, "epoch": 2213} {"train_loss": -12.25032901763916, "global_step": 371909, "epoch": 2213} {"train_loss": -11.753841400146484, "global_step": 371910, "epoch": 2213} {"train_loss": -12.025408744812012, "global_step": 371911, "epoch": 2213} {"train_loss": -12.23756217956543, "global_step": 371912, "epoch": 2213} {"train_loss": -12.188474655151367, "global_step": 371913, "epoch": 2213} {"train_loss": -12.332685470581055, "global_step": 371914, "epoch": 2213} {"train_loss": -12.19117546081543, "global_step": 371915, "epoch": 2213} {"train_loss": -12.242425918579102, "global_step": 371916, "epoch": 2213} {"train_loss": -12.145245552062988, "global_step": 371917, "epoch": 2213} {"train_loss": -12.185534477233887, "global_step": 371918, "epoch": 2213} {"train_loss": -12.068550109863281, "global_step": 371919, "epoch": 2213} {"train_loss": -12.256450653076172, "global_step": 371920, "epoch": 2213} {"train_loss": -12.11176872253418, "global_step": 371921, "epoch": 2213} {"train_loss": -12.272529602050781, "global_step": 371922, "epoch": 2213} {"train_loss": -12.318937301635742, "global_step": 371923, "epoch": 2213} {"train_loss": -12.319328308105469, "global_step": 371924, "epoch": 2213} {"train_loss": -11.915369033813477, "global_step": 371925, "epoch": 2213} {"train_loss": -12.187124252319336, "global_step": 371926, "epoch": 2213} {"train_loss": -12.108238220214844, "global_step": 371927, "epoch": 2213} {"train_loss": -12.533197402954102, "global_step": 371928, "epoch": 2213} {"train_loss": -12.262200355529785, "global_step": 371929, "epoch": 2213} {"train_loss": -12.212244987487793, "global_step": 371930, "epoch": 2213} {"train_loss": -12.044696807861328, "global_step": 371931, "epoch": 2213} {"train_loss": -12.021567344665527, "global_step": 371932, "epoch": 2213} {"train_loss": -12.016729354858398, "global_step": 371933, "epoch": 2213} {"train_loss": -12.138483047485352, "global_step": 371934, "epoch": 2213} {"train_loss": -12.43724250793457, "global_step": 371935, "epoch": 2213} {"train_loss": -12.474536895751953, "global_step": 371936, "epoch": 2213} {"train_loss": -12.334083557128906, "global_step": 371937, "epoch": 2213} {"train_loss": -12.499417304992676, "global_step": 371938, "epoch": 2213} {"train_loss": -12.496007919311523, "global_step": 371939, "epoch": 2213} {"train_loss": -12.639422416687012, "global_step": 371940, "epoch": 2213} {"train_loss": -12.434593200683594, "global_step": 371941, "epoch": 2213} {"train_loss": -12.645936965942383, "global_step": 371942, "epoch": 2213} {"train_loss": -12.595544815063477, "global_step": 371943, "epoch": 2213} {"train_loss": -12.693144798278809, "global_step": 371944, "epoch": 2213} {"train_loss": -12.585183143615723, "global_step": 371945, "epoch": 2213} {"train_loss": -12.335278511047363, "global_step": 371946, "epoch": 2213} {"train_loss": -12.148176193237305, "global_step": 371947, "epoch": 2213} {"train_loss": -12.4078950881958, "global_step": 371948, "epoch": 2213} {"train_loss": -12.400044441223145, "global_step": 371949, "epoch": 2213} {"train_loss": -12.113191604614258, "global_step": 371950, "epoch": 2213} {"train_loss": -12.117578886804127, "global_step": 371951, "epoch": 2213, "val_loss": 292776.53125} {"train_loss": -12.633062362670898, "global_step": 371952, "epoch": 2214} {"train_loss": -12.312350273132324, "global_step": 371953, "epoch": 2214} {"train_loss": -12.582597732543945, "global_step": 371954, "epoch": 2214} {"train_loss": -12.289758682250977, "global_step": 371955, "epoch": 2214} {"train_loss": -12.515727043151855, "global_step": 371956, "epoch": 2214} {"train_loss": -12.209157943725586, "global_step": 371957, "epoch": 2214} {"train_loss": -12.345297813415527, "global_step": 371958, "epoch": 2214} {"train_loss": -11.894640922546387, "global_step": 371959, "epoch": 2214} {"train_loss": -12.161214828491211, "global_step": 371960, "epoch": 2214} {"train_loss": -12.38808822631836, "global_step": 371961, "epoch": 2214} {"train_loss": -11.997722625732422, "global_step": 371962, "epoch": 2214} {"train_loss": -12.349980354309082, "global_step": 371963, "epoch": 2214} {"train_loss": -12.14646053314209, "global_step": 371964, "epoch": 2214} {"train_loss": -11.482772827148438, "global_step": 371965, "epoch": 2214} {"train_loss": -12.141080856323242, "global_step": 371966, "epoch": 2214} {"train_loss": -12.061412811279297, "global_step": 371967, "epoch": 2214} {"train_loss": -11.922526359558105, "global_step": 371968, "epoch": 2214} {"train_loss": -11.274124145507812, "global_step": 371969, "epoch": 2214} {"train_loss": -12.11106014251709, "global_step": 371970, "epoch": 2214} {"train_loss": -12.088602066040039, "global_step": 371971, "epoch": 2214} {"train_loss": -11.983870506286621, "global_step": 371972, "epoch": 2214} {"train_loss": -11.538395881652832, "global_step": 371973, "epoch": 2214} {"train_loss": -12.107955932617188, "global_step": 371974, "epoch": 2214} {"train_loss": -12.376065254211426, "global_step": 371975, "epoch": 2214} {"train_loss": -11.945310592651367, "global_step": 371976, "epoch": 2214} {"train_loss": -12.12397289276123, "global_step": 371977, "epoch": 2214} {"train_loss": -11.958610534667969, "global_step": 371978, "epoch": 2214} {"train_loss": -12.440984725952148, "global_step": 371979, "epoch": 2214} {"train_loss": -11.821784973144531, "global_step": 371980, "epoch": 2214} {"train_loss": -12.408492088317871, "global_step": 371981, "epoch": 2214} {"train_loss": -11.578570365905762, "global_step": 371982, "epoch": 2214} {"train_loss": -12.385896682739258, "global_step": 371983, "epoch": 2214} {"train_loss": -12.25379753112793, "global_step": 371984, "epoch": 2214} {"train_loss": -11.945291519165039, "global_step": 371985, "epoch": 2214} {"train_loss": -11.351789474487305, "global_step": 371986, "epoch": 2214} {"train_loss": -11.382513999938965, "global_step": 371987, "epoch": 2214} {"train_loss": -11.149377822875977, "global_step": 371988, "epoch": 2214} {"train_loss": -12.267410278320312, "global_step": 371989, "epoch": 2214} {"train_loss": -11.349519729614258, "global_step": 371990, "epoch": 2214} {"train_loss": -12.326531410217285, "global_step": 371991, "epoch": 2214} {"train_loss": -11.710793495178223, "global_step": 371992, "epoch": 2214} {"train_loss": -12.253278732299805, "global_step": 371993, "epoch": 2214} {"train_loss": -11.898552894592285, "global_step": 371994, "epoch": 2214} {"train_loss": -11.99168586730957, "global_step": 371995, "epoch": 2214} {"train_loss": -11.124300956726074, "global_step": 371996, "epoch": 2214} {"train_loss": -12.211660385131836, "global_step": 371997, "epoch": 2214} {"train_loss": -11.508644104003906, "global_step": 371998, "epoch": 2214} {"train_loss": -12.301544189453125, "global_step": 371999, "epoch": 2214} {"train_loss": -11.929880142211914, "global_step": 372000, "epoch": 2214} {"train_loss": -11.458455085754395, "global_step": 372001, "epoch": 2214} {"train_loss": -11.889789581298828, "global_step": 372002, "epoch": 2214} {"train_loss": -11.82150650024414, "global_step": 372003, "epoch": 2214} {"train_loss": -12.229681968688965, "global_step": 372004, "epoch": 2214} {"train_loss": -11.48985767364502, "global_step": 372005, "epoch": 2214} {"train_loss": -12.252025604248047, "global_step": 372006, "epoch": 2214} {"train_loss": -11.436205863952637, "global_step": 372007, "epoch": 2214} {"train_loss": -11.905924797058105, "global_step": 372008, "epoch": 2214} {"train_loss": -12.224756240844727, "global_step": 372009, "epoch": 2214} {"train_loss": -12.094953536987305, "global_step": 372010, "epoch": 2214} {"train_loss": -12.419816970825195, "global_step": 372011, "epoch": 2214} {"train_loss": -12.340757369995117, "global_step": 372012, "epoch": 2214} {"train_loss": -12.428853988647461, "global_step": 372013, "epoch": 2214} {"train_loss": -12.009355545043945, "global_step": 372014, "epoch": 2214} {"train_loss": -12.395835876464844, "global_step": 372015, "epoch": 2214} {"train_loss": -12.292584419250488, "global_step": 372016, "epoch": 2214} {"train_loss": -12.29776668548584, "global_step": 372017, "epoch": 2214} {"train_loss": -12.20742416381836, "global_step": 372018, "epoch": 2214} {"train_loss": -12.27332878112793, "global_step": 372019, "epoch": 2214} {"train_loss": -12.139463424682617, "global_step": 372020, "epoch": 2214} {"train_loss": -12.208992958068848, "global_step": 372021, "epoch": 2214} {"train_loss": -12.029733657836914, "global_step": 372022, "epoch": 2214} {"train_loss": -11.9942626953125, "global_step": 372023, "epoch": 2214} {"train_loss": -12.53225040435791, "global_step": 372024, "epoch": 2214} {"train_loss": -12.046810150146484, "global_step": 372025, "epoch": 2214} {"train_loss": -12.085639953613281, "global_step": 372026, "epoch": 2214} {"train_loss": -12.537454605102539, "global_step": 372027, "epoch": 2214} {"train_loss": -12.13293170928955, "global_step": 372028, "epoch": 2214} {"train_loss": -12.22232437133789, "global_step": 372029, "epoch": 2214} {"train_loss": -12.528367042541504, "global_step": 372030, "epoch": 2214} {"train_loss": -12.396907806396484, "global_step": 372031, "epoch": 2214} {"train_loss": -12.179071426391602, "global_step": 372032, "epoch": 2214} {"train_loss": -12.586978912353516, "global_step": 372033, "epoch": 2214} {"train_loss": -12.335530281066895, "global_step": 372034, "epoch": 2214} {"train_loss": -11.098541259765625, "global_step": 372035, "epoch": 2214} {"train_loss": -11.019901275634766, "global_step": 372036, "epoch": 2214} {"train_loss": -12.331958770751953, "global_step": 372037, "epoch": 2214} {"train_loss": -11.671791076660156, "global_step": 372038, "epoch": 2214} {"train_loss": -10.830534934997559, "global_step": 372039, "epoch": 2214} {"train_loss": -12.563698768615723, "global_step": 372040, "epoch": 2214} {"train_loss": -11.423948287963867, "global_step": 372041, "epoch": 2214} {"train_loss": -11.830339431762695, "global_step": 372042, "epoch": 2214} {"train_loss": -11.994298934936523, "global_step": 372043, "epoch": 2214} {"train_loss": -11.420770645141602, "global_step": 372044, "epoch": 2214} {"train_loss": -11.43822193145752, "global_step": 372045, "epoch": 2214} {"train_loss": -11.571977615356445, "global_step": 372046, "epoch": 2214} {"train_loss": -10.711051940917969, "global_step": 372047, "epoch": 2214} {"train_loss": -11.22366714477539, "global_step": 372048, "epoch": 2214} {"train_loss": -11.859429359436035, "global_step": 372049, "epoch": 2214} {"train_loss": -11.079183578491211, "global_step": 372050, "epoch": 2214} {"train_loss": -11.798425674438477, "global_step": 372051, "epoch": 2214} {"train_loss": -11.835128784179688, "global_step": 372052, "epoch": 2214} {"train_loss": -12.314377784729004, "global_step": 372053, "epoch": 2214} {"train_loss": -11.923604965209961, "global_step": 372054, "epoch": 2214} {"train_loss": -12.428909301757812, "global_step": 372055, "epoch": 2214} {"train_loss": -11.749946594238281, "global_step": 372056, "epoch": 2214} {"train_loss": -12.093527793884277, "global_step": 372057, "epoch": 2214} {"train_loss": -11.635733604431152, "global_step": 372058, "epoch": 2214} {"train_loss": -12.245521545410156, "global_step": 372059, "epoch": 2214} {"train_loss": -12.100154876708984, "global_step": 372060, "epoch": 2214} {"train_loss": -12.216766357421875, "global_step": 372061, "epoch": 2214} {"train_loss": -12.008094787597656, "global_step": 372062, "epoch": 2214} {"train_loss": -12.346267700195312, "global_step": 372063, "epoch": 2214} {"train_loss": -12.246747970581055, "global_step": 372064, "epoch": 2214} {"train_loss": -12.06185531616211, "global_step": 372065, "epoch": 2214} {"train_loss": -12.542937278747559, "global_step": 372066, "epoch": 2214} {"train_loss": -12.227078437805176, "global_step": 372067, "epoch": 2214} {"train_loss": -12.2982177734375, "global_step": 372068, "epoch": 2214} {"train_loss": -12.259389877319336, "global_step": 372069, "epoch": 2214} {"train_loss": -12.389963150024414, "global_step": 372070, "epoch": 2214} {"train_loss": -12.034505844116211, "global_step": 372071, "epoch": 2214} {"train_loss": -12.367820739746094, "global_step": 372072, "epoch": 2214} {"train_loss": -12.198274612426758, "global_step": 372073, "epoch": 2214} {"train_loss": -12.39553451538086, "global_step": 372074, "epoch": 2214} {"train_loss": -12.045380592346191, "global_step": 372075, "epoch": 2214} {"train_loss": -11.992197036743164, "global_step": 372076, "epoch": 2214} {"train_loss": -11.907166481018066, "global_step": 372077, "epoch": 2214} {"train_loss": -11.999090194702148, "global_step": 372078, "epoch": 2214} {"train_loss": -11.890159606933594, "global_step": 372079, "epoch": 2214} {"train_loss": -12.127228736877441, "global_step": 372080, "epoch": 2214} {"train_loss": -11.871370315551758, "global_step": 372081, "epoch": 2214} {"train_loss": -11.97431755065918, "global_step": 372082, "epoch": 2214} {"train_loss": -12.456672668457031, "global_step": 372083, "epoch": 2214} {"train_loss": -12.161864280700684, "global_step": 372084, "epoch": 2214} {"train_loss": -12.295618057250977, "global_step": 372085, "epoch": 2214} {"train_loss": -12.27899169921875, "global_step": 372086, "epoch": 2214} {"train_loss": -12.320338249206543, "global_step": 372087, "epoch": 2214} {"train_loss": -12.2282075881958, "global_step": 372088, "epoch": 2214} {"train_loss": -12.481517791748047, "global_step": 372089, "epoch": 2214} {"train_loss": -12.412826538085938, "global_step": 372090, "epoch": 2214} {"train_loss": -12.39897346496582, "global_step": 372091, "epoch": 2214} {"train_loss": -12.46113395690918, "global_step": 372092, "epoch": 2214} {"train_loss": -12.624764442443848, "global_step": 372093, "epoch": 2214} {"train_loss": -12.452356338500977, "global_step": 372094, "epoch": 2214} {"train_loss": -12.544817924499512, "global_step": 372095, "epoch": 2214} {"train_loss": -12.443653106689453, "global_step": 372096, "epoch": 2214} {"train_loss": -12.279810905456543, "global_step": 372097, "epoch": 2214} {"train_loss": -12.529001235961914, "global_step": 372098, "epoch": 2214} {"train_loss": -11.896074295043945, "global_step": 372099, "epoch": 2214} {"train_loss": -11.954803466796875, "global_step": 372100, "epoch": 2214} {"train_loss": -12.115653991699219, "global_step": 372101, "epoch": 2214} {"train_loss": -11.656052589416504, "global_step": 372102, "epoch": 2214} {"train_loss": -12.14417552947998, "global_step": 372103, "epoch": 2214} {"train_loss": -11.394163131713867, "global_step": 372104, "epoch": 2214} {"train_loss": -12.122930526733398, "global_step": 372105, "epoch": 2214} {"train_loss": -12.070795059204102, "global_step": 372106, "epoch": 2214} {"train_loss": -12.240758895874023, "global_step": 372107, "epoch": 2214} {"train_loss": -11.820585250854492, "global_step": 372108, "epoch": 2214} {"train_loss": -11.81059741973877, "global_step": 372109, "epoch": 2214} {"train_loss": -10.895614624023438, "global_step": 372110, "epoch": 2214} {"train_loss": -11.517755508422852, "global_step": 372111, "epoch": 2214} {"train_loss": -11.719860076904297, "global_step": 372112, "epoch": 2214} {"train_loss": -12.301847457885742, "global_step": 372113, "epoch": 2214} {"train_loss": -11.528913497924805, "global_step": 372114, "epoch": 2214} {"train_loss": -12.47203254699707, "global_step": 372115, "epoch": 2214} {"train_loss": -12.027658462524414, "global_step": 372116, "epoch": 2214} {"train_loss": -12.034106254577637, "global_step": 372117, "epoch": 2214} {"train_loss": -12.388479232788086, "global_step": 372118, "epoch": 2214} {"train_loss": -12.037911290214176, "global_step": 372119, "epoch": 2214, "val_loss": 293890.46875} {"train_loss": -12.044055938720703, "global_step": 372120, "epoch": 2215} {"train_loss": -12.27000617980957, "global_step": 372121, "epoch": 2215} {"train_loss": -11.873186111450195, "global_step": 372122, "epoch": 2215} {"train_loss": -12.24324893951416, "global_step": 372123, "epoch": 2215} {"train_loss": -12.429697036743164, "global_step": 372124, "epoch": 2215} {"train_loss": -12.279552459716797, "global_step": 372125, "epoch": 2215} {"train_loss": -11.920920372009277, "global_step": 372126, "epoch": 2215} {"train_loss": -11.482131004333496, "global_step": 372127, "epoch": 2215} {"train_loss": -12.215232849121094, "global_step": 372128, "epoch": 2215} {"train_loss": -12.124968528747559, "global_step": 372129, "epoch": 2215} {"train_loss": -11.924591064453125, "global_step": 372130, "epoch": 2215} {"train_loss": -11.595956802368164, "global_step": 372131, "epoch": 2215} {"train_loss": -10.978628158569336, "global_step": 372132, "epoch": 2215} {"train_loss": -11.927238464355469, "global_step": 372133, "epoch": 2215} {"train_loss": -10.920486450195312, "global_step": 372134, "epoch": 2215} {"train_loss": -11.413557052612305, "global_step": 372135, "epoch": 2215} {"train_loss": -11.948156356811523, "global_step": 372136, "epoch": 2215} {"train_loss": -11.460413932800293, "global_step": 372137, "epoch": 2215} {"train_loss": -11.365011215209961, "global_step": 372138, "epoch": 2215} {"train_loss": -11.86247444152832, "global_step": 372139, "epoch": 2215} {"train_loss": -11.356640815734863, "global_step": 372140, "epoch": 2215} {"train_loss": -12.160924911499023, "global_step": 372141, "epoch": 2215} {"train_loss": -11.921606063842773, "global_step": 372142, "epoch": 2215} {"train_loss": -11.615452766418457, "global_step": 372143, "epoch": 2215} {"train_loss": -11.971054077148438, "global_step": 372144, "epoch": 2215} {"train_loss": -11.866543769836426, "global_step": 372145, "epoch": 2215} {"train_loss": -12.085405349731445, "global_step": 372146, "epoch": 2215} {"train_loss": -12.071250915527344, "global_step": 372147, "epoch": 2215} {"train_loss": -12.534024238586426, "global_step": 372148, "epoch": 2215} {"train_loss": -12.35457992553711, "global_step": 372149, "epoch": 2215} {"train_loss": -12.37019157409668, "global_step": 372150, "epoch": 2215} {"train_loss": -12.288076400756836, "global_step": 372151, "epoch": 2215} {"train_loss": -12.163705825805664, "global_step": 372152, "epoch": 2215} {"train_loss": -12.473543167114258, "global_step": 372153, "epoch": 2215} {"train_loss": -11.988239288330078, "global_step": 372154, "epoch": 2215} {"train_loss": -12.298500061035156, "global_step": 372155, "epoch": 2215} {"train_loss": -12.30335807800293, "global_step": 372156, "epoch": 2215} {"train_loss": -12.38138484954834, "global_step": 372157, "epoch": 2215} {"train_loss": -12.609779357910156, "global_step": 372158, "epoch": 2215} {"train_loss": -12.008764266967773, "global_step": 372159, "epoch": 2215} {"train_loss": -12.609319686889648, "global_step": 372160, "epoch": 2215} {"train_loss": -11.910058975219727, "global_step": 372161, "epoch": 2215} {"train_loss": -12.128083229064941, "global_step": 372162, "epoch": 2215} {"train_loss": -11.871085166931152, "global_step": 372163, "epoch": 2215} {"train_loss": -11.820234298706055, "global_step": 372164, "epoch": 2215} {"train_loss": -12.337675094604492, "global_step": 372165, "epoch": 2215} {"train_loss": -11.75407600402832, "global_step": 372166, "epoch": 2215} {"train_loss": -12.288788795471191, "global_step": 372167, "epoch": 2215} {"train_loss": -12.107080459594727, "global_step": 372168, "epoch": 2215} {"train_loss": -12.100217819213867, "global_step": 372169, "epoch": 2215} {"train_loss": -12.231612205505371, "global_step": 372170, "epoch": 2215} {"train_loss": -11.995654106140137, "global_step": 372171, "epoch": 2215} {"train_loss": -11.936712265014648, "global_step": 372172, "epoch": 2215} {"train_loss": -12.496101379394531, "global_step": 372173, "epoch": 2215} {"train_loss": -11.289151191711426, "global_step": 372174, "epoch": 2215} {"train_loss": -12.323177337646484, "global_step": 372175, "epoch": 2215} {"train_loss": -11.92708969116211, "global_step": 372176, "epoch": 2215} {"train_loss": -12.135963439941406, "global_step": 372177, "epoch": 2215} {"train_loss": -12.229656219482422, "global_step": 372178, "epoch": 2215} {"train_loss": -12.602717399597168, "global_step": 372179, "epoch": 2215} {"train_loss": -12.18288516998291, "global_step": 372180, "epoch": 2215} {"train_loss": -12.354580879211426, "global_step": 372181, "epoch": 2215} {"train_loss": -12.00556755065918, "global_step": 372182, "epoch": 2215} {"train_loss": -12.226215362548828, "global_step": 372183, "epoch": 2215} {"train_loss": -12.41001033782959, "global_step": 372184, "epoch": 2215} {"train_loss": -12.201017379760742, "global_step": 372185, "epoch": 2215} {"train_loss": -11.845834732055664, "global_step": 372186, "epoch": 2215} {"train_loss": -12.401819229125977, "global_step": 372187, "epoch": 2215} {"train_loss": -12.58161735534668, "global_step": 372188, "epoch": 2215} {"train_loss": -11.786994934082031, "global_step": 372189, "epoch": 2215} {"train_loss": -12.302313804626465, "global_step": 372190, "epoch": 2215} {"train_loss": -12.445940017700195, "global_step": 372191, "epoch": 2215} {"train_loss": -12.026429176330566, "global_step": 372192, "epoch": 2215} {"train_loss": -12.095252990722656, "global_step": 372193, "epoch": 2215} {"train_loss": -12.376938819885254, "global_step": 372194, "epoch": 2215} {"train_loss": -11.78130054473877, "global_step": 372195, "epoch": 2215} {"train_loss": -12.328936576843262, "global_step": 372196, "epoch": 2215} {"train_loss": -11.718223571777344, "global_step": 372197, "epoch": 2215} {"train_loss": -10.96384048461914, "global_step": 372198, "epoch": 2215} {"train_loss": -11.710304260253906, "global_step": 372199, "epoch": 2215} {"train_loss": -11.999320983886719, "global_step": 372200, "epoch": 2215} {"train_loss": -10.981292724609375, "global_step": 372201, "epoch": 2215} {"train_loss": -12.095831871032715, "global_step": 372202, "epoch": 2215} {"train_loss": -11.882466316223145, "global_step": 372203, "epoch": 2215} {"train_loss": -12.08510971069336, "global_step": 372204, "epoch": 2215} {"train_loss": -12.323162078857422, "global_step": 372205, "epoch": 2215} {"train_loss": -12.187732696533203, "global_step": 372206, "epoch": 2215} {"train_loss": -12.014369010925293, "global_step": 372207, "epoch": 2215} {"train_loss": -12.175506591796875, "global_step": 372208, "epoch": 2215} {"train_loss": -12.027301788330078, "global_step": 372209, "epoch": 2215} {"train_loss": -11.888808250427246, "global_step": 372210, "epoch": 2215} {"train_loss": -11.826813697814941, "global_step": 372211, "epoch": 2215} {"train_loss": -12.297618865966797, "global_step": 372212, "epoch": 2215} {"train_loss": -12.263940811157227, "global_step": 372213, "epoch": 2215} {"train_loss": -12.174665451049805, "global_step": 372214, "epoch": 2215} {"train_loss": -12.264859199523926, "global_step": 372215, "epoch": 2215} {"train_loss": -12.327276229858398, "global_step": 372216, "epoch": 2215} {"train_loss": -11.391180992126465, "global_step": 372217, "epoch": 2215} {"train_loss": -12.58579158782959, "global_step": 372218, "epoch": 2215} {"train_loss": -11.70755386352539, "global_step": 372219, "epoch": 2215} {"train_loss": -12.192398071289062, "global_step": 372220, "epoch": 2215} {"train_loss": -11.8126220703125, "global_step": 372221, "epoch": 2215} {"train_loss": -11.973907470703125, "global_step": 372222, "epoch": 2215} {"train_loss": -12.322126388549805, "global_step": 372223, "epoch": 2215} {"train_loss": -12.16301155090332, "global_step": 372224, "epoch": 2215} {"train_loss": -12.50418472290039, "global_step": 372225, "epoch": 2215} {"train_loss": -12.328178405761719, "global_step": 372226, "epoch": 2215} {"train_loss": -12.348320007324219, "global_step": 372227, "epoch": 2215} {"train_loss": -12.252753257751465, "global_step": 372228, "epoch": 2215} {"train_loss": -11.952009201049805, "global_step": 372229, "epoch": 2215} {"train_loss": -12.261785507202148, "global_step": 372230, "epoch": 2215} {"train_loss": -12.124765396118164, "global_step": 372231, "epoch": 2215} {"train_loss": -12.434244155883789, "global_step": 372232, "epoch": 2215} {"train_loss": -12.351932525634766, "global_step": 372233, "epoch": 2215} {"train_loss": -12.271389961242676, "global_step": 372234, "epoch": 2215} {"train_loss": -12.53791618347168, "global_step": 372235, "epoch": 2215} {"train_loss": -12.227659225463867, "global_step": 372236, "epoch": 2215} {"train_loss": -12.25852108001709, "global_step": 372237, "epoch": 2215} {"train_loss": -12.334810256958008, "global_step": 372238, "epoch": 2215} {"train_loss": -12.186691284179688, "global_step": 372239, "epoch": 2215} {"train_loss": -12.450776100158691, "global_step": 372240, "epoch": 2215} {"train_loss": -12.340578079223633, "global_step": 372241, "epoch": 2215} {"train_loss": -12.550439834594727, "global_step": 372242, "epoch": 2215} {"train_loss": -12.111194610595703, "global_step": 372243, "epoch": 2215} {"train_loss": -12.288315773010254, "global_step": 372244, "epoch": 2215} {"train_loss": -11.835836410522461, "global_step": 372245, "epoch": 2215} {"train_loss": -12.354358673095703, "global_step": 372246, "epoch": 2215} {"train_loss": -12.278763771057129, "global_step": 372247, "epoch": 2215} {"train_loss": -11.670478820800781, "global_step": 372248, "epoch": 2215} {"train_loss": -12.540027618408203, "global_step": 372249, "epoch": 2215} {"train_loss": -12.21086597442627, "global_step": 372250, "epoch": 2215} {"train_loss": -12.379080772399902, "global_step": 372251, "epoch": 2215} {"train_loss": -12.48089599609375, "global_step": 372252, "epoch": 2215} {"train_loss": -11.716484069824219, "global_step": 372253, "epoch": 2215} {"train_loss": -12.564699172973633, "global_step": 372254, "epoch": 2215} {"train_loss": -12.145753860473633, "global_step": 372255, "epoch": 2215} {"train_loss": -11.832965850830078, "global_step": 372256, "epoch": 2215} {"train_loss": -12.395259857177734, "global_step": 372257, "epoch": 2215} {"train_loss": -11.84451675415039, "global_step": 372258, "epoch": 2215} {"train_loss": -12.557291030883789, "global_step": 372259, "epoch": 2215} {"train_loss": -11.832416534423828, "global_step": 372260, "epoch": 2215} {"train_loss": -12.484339714050293, "global_step": 372261, "epoch": 2215} {"train_loss": -11.622097969055176, "global_step": 372262, "epoch": 2215} {"train_loss": -12.26220703125, "global_step": 372263, "epoch": 2215} {"train_loss": -11.612565994262695, "global_step": 372264, "epoch": 2215} {"train_loss": -11.472356796264648, "global_step": 372265, "epoch": 2215} {"train_loss": -11.680638313293457, "global_step": 372266, "epoch": 2215} {"train_loss": -11.953125953674316, "global_step": 372267, "epoch": 2215} {"train_loss": -12.378543853759766, "global_step": 372268, "epoch": 2215} {"train_loss": -11.61293888092041, "global_step": 372269, "epoch": 2215} {"train_loss": -11.836311340332031, "global_step": 372270, "epoch": 2215} {"train_loss": -11.506932258605957, "global_step": 372271, "epoch": 2215} {"train_loss": -12.13493537902832, "global_step": 372272, "epoch": 2215} {"train_loss": -11.709765434265137, "global_step": 372273, "epoch": 2215} {"train_loss": -11.592907905578613, "global_step": 372274, "epoch": 2215} {"train_loss": -11.654254913330078, "global_step": 372275, "epoch": 2215} {"train_loss": -11.610011100769043, "global_step": 372276, "epoch": 2215} {"train_loss": -12.024567604064941, "global_step": 372277, "epoch": 2215} {"train_loss": -11.750866889953613, "global_step": 372278, "epoch": 2215} {"train_loss": -11.237140655517578, "global_step": 372279, "epoch": 2215} {"train_loss": -12.315481185913086, "global_step": 372280, "epoch": 2215} {"train_loss": -11.166707992553711, "global_step": 372281, "epoch": 2215} {"train_loss": -12.366090774536133, "global_step": 372282, "epoch": 2215} {"train_loss": -11.764241218566895, "global_step": 372283, "epoch": 2215} {"train_loss": -11.985626220703125, "global_step": 372284, "epoch": 2215} {"train_loss": -12.004810333251953, "global_step": 372285, "epoch": 2215} {"train_loss": -11.510137557983398, "global_step": 372286, "epoch": 2215} {"train_loss": -12.04922458103725, "global_step": 372287, "epoch": 2215, "val_loss": 293984.375, "train_action_mse_error": 1.4356403350830078} {"train_loss": -12.003235816955566, "global_step": 372288, "epoch": 2216} {"train_loss": -11.725967407226562, "global_step": 372289, "epoch": 2216} {"train_loss": -12.436761856079102, "global_step": 372290, "epoch": 2216} {"train_loss": -11.744911193847656, "global_step": 372291, "epoch": 2216} {"train_loss": -12.168766021728516, "global_step": 372292, "epoch": 2216} {"train_loss": -12.127821922302246, "global_step": 372293, "epoch": 2216} {"train_loss": -12.135063171386719, "global_step": 372294, "epoch": 2216} {"train_loss": -12.049348831176758, "global_step": 372295, "epoch": 2216} {"train_loss": -11.677057266235352, "global_step": 372296, "epoch": 2216} {"train_loss": -12.013618469238281, "global_step": 372297, "epoch": 2216} {"train_loss": -12.035003662109375, "global_step": 372298, "epoch": 2216} {"train_loss": -12.043123245239258, "global_step": 372299, "epoch": 2216} {"train_loss": -11.11146354675293, "global_step": 372300, "epoch": 2216} {"train_loss": -11.438591957092285, "global_step": 372301, "epoch": 2216} {"train_loss": -11.317291259765625, "global_step": 372302, "epoch": 2216} {"train_loss": -11.775903701782227, "global_step": 372303, "epoch": 2216} {"train_loss": -11.780784606933594, "global_step": 372304, "epoch": 2216} {"train_loss": -11.96823501586914, "global_step": 372305, "epoch": 2216} {"train_loss": -11.546024322509766, "global_step": 372306, "epoch": 2216} {"train_loss": -12.002091407775879, "global_step": 372307, "epoch": 2216} {"train_loss": -11.199996948242188, "global_step": 372308, "epoch": 2216} {"train_loss": -12.392563819885254, "global_step": 372309, "epoch": 2216} {"train_loss": -11.1553955078125, "global_step": 372310, "epoch": 2216} {"train_loss": -11.60761547088623, "global_step": 372311, "epoch": 2216} {"train_loss": -11.094528198242188, "global_step": 372312, "epoch": 2216} {"train_loss": -11.601731300354004, "global_step": 372313, "epoch": 2216} {"train_loss": -11.430879592895508, "global_step": 372314, "epoch": 2216} {"train_loss": -11.277732849121094, "global_step": 372315, "epoch": 2216} {"train_loss": -11.3876371383667, "global_step": 372316, "epoch": 2216} {"train_loss": -10.865707397460938, "global_step": 372317, "epoch": 2216} {"train_loss": -10.707189559936523, "global_step": 372318, "epoch": 2216} {"train_loss": -11.937721252441406, "global_step": 372319, "epoch": 2216} {"train_loss": -11.6732816696167, "global_step": 372320, "epoch": 2216} {"train_loss": -11.19503402709961, "global_step": 372321, "epoch": 2216} {"train_loss": -11.965158462524414, "global_step": 372322, "epoch": 2216} {"train_loss": -11.524917602539062, "global_step": 372323, "epoch": 2216} {"train_loss": -11.285515785217285, "global_step": 372324, "epoch": 2216} {"train_loss": -11.751176834106445, "global_step": 372325, "epoch": 2216} {"train_loss": -9.925895690917969, "global_step": 372326, "epoch": 2216} {"train_loss": -11.851404190063477, "global_step": 372327, "epoch": 2216} {"train_loss": -9.502029418945312, "global_step": 372328, "epoch": 2216} {"train_loss": -11.36190414428711, "global_step": 372329, "epoch": 2216} {"train_loss": -10.921590805053711, "global_step": 372330, "epoch": 2216} {"train_loss": -11.455741882324219, "global_step": 372331, "epoch": 2216} {"train_loss": -11.796401977539062, "global_step": 372332, "epoch": 2216} {"train_loss": -10.996213912963867, "global_step": 372333, "epoch": 2216} {"train_loss": -12.344171524047852, "global_step": 372334, "epoch": 2216} {"train_loss": -10.937711715698242, "global_step": 372335, "epoch": 2216} {"train_loss": -12.041423797607422, "global_step": 372336, "epoch": 2216} {"train_loss": -11.555713653564453, "global_step": 372337, "epoch": 2216} {"train_loss": -12.070405960083008, "global_step": 372338, "epoch": 2216} {"train_loss": -11.91111946105957, "global_step": 372339, "epoch": 2216} {"train_loss": -11.859916687011719, "global_step": 372340, "epoch": 2216} {"train_loss": -11.85468864440918, "global_step": 372341, "epoch": 2216} {"train_loss": -11.459993362426758, "global_step": 372342, "epoch": 2216} {"train_loss": -12.211477279663086, "global_step": 372343, "epoch": 2216} {"train_loss": -12.002222061157227, "global_step": 372344, "epoch": 2216} {"train_loss": -12.232627868652344, "global_step": 372345, "epoch": 2216} {"train_loss": -12.248922348022461, "global_step": 372346, "epoch": 2216} {"train_loss": -12.124889373779297, "global_step": 372347, "epoch": 2216} {"train_loss": -12.28780746459961, "global_step": 372348, "epoch": 2216} {"train_loss": -11.810056686401367, "global_step": 372349, "epoch": 2216} {"train_loss": -12.270577430725098, "global_step": 372350, "epoch": 2216} {"train_loss": -11.868783950805664, "global_step": 372351, "epoch": 2216} {"train_loss": -12.205162048339844, "global_step": 372352, "epoch": 2216} {"train_loss": -11.799895286560059, "global_step": 372353, "epoch": 2216} {"train_loss": -12.36294937133789, "global_step": 372354, "epoch": 2216} {"train_loss": -11.92198657989502, "global_step": 372355, "epoch": 2216} {"train_loss": -12.302915573120117, "global_step": 372356, "epoch": 2216} {"train_loss": -12.18859577178955, "global_step": 372357, "epoch": 2216} {"train_loss": -12.385403633117676, "global_step": 372358, "epoch": 2216} {"train_loss": -12.285719871520996, "global_step": 372359, "epoch": 2216} {"train_loss": -12.237226486206055, "global_step": 372360, "epoch": 2216} {"train_loss": -12.519181251525879, "global_step": 372361, "epoch": 2216} {"train_loss": -11.921358108520508, "global_step": 372362, "epoch": 2216} {"train_loss": -12.463693618774414, "global_step": 372363, "epoch": 2216} {"train_loss": -12.112406730651855, "global_step": 372364, "epoch": 2216} {"train_loss": -12.382593154907227, "global_step": 372365, "epoch": 2216} {"train_loss": -12.131574630737305, "global_step": 372366, "epoch": 2216} {"train_loss": -12.333039283752441, "global_step": 372367, "epoch": 2216} {"train_loss": -12.204292297363281, "global_step": 372368, "epoch": 2216} {"train_loss": -12.300207138061523, "global_step": 372369, "epoch": 2216} {"train_loss": -12.298164367675781, "global_step": 372370, "epoch": 2216} {"train_loss": -12.306953430175781, "global_step": 372371, "epoch": 2216} {"train_loss": -12.260555267333984, "global_step": 372372, "epoch": 2216} {"train_loss": -12.282747268676758, "global_step": 372373, "epoch": 2216} {"train_loss": -12.285940170288086, "global_step": 372374, "epoch": 2216} {"train_loss": -12.646707534790039, "global_step": 372375, "epoch": 2216} {"train_loss": -12.279200553894043, "global_step": 372376, "epoch": 2216} {"train_loss": -12.662345886230469, "global_step": 372377, "epoch": 2216} {"train_loss": -12.508159637451172, "global_step": 372378, "epoch": 2216} {"train_loss": -12.668608665466309, "global_step": 372379, "epoch": 2216} {"train_loss": -12.489208221435547, "global_step": 372380, "epoch": 2216} {"train_loss": -12.686637878417969, "global_step": 372381, "epoch": 2216} {"train_loss": -12.635480880737305, "global_step": 372382, "epoch": 2216} {"train_loss": -12.471960067749023, "global_step": 372383, "epoch": 2216} {"train_loss": -12.537939071655273, "global_step": 372384, "epoch": 2216} {"train_loss": -12.339290618896484, "global_step": 372385, "epoch": 2216} {"train_loss": -12.659546852111816, "global_step": 372386, "epoch": 2216} {"train_loss": -12.504046440124512, "global_step": 372387, "epoch": 2216} {"train_loss": -12.702911376953125, "global_step": 372388, "epoch": 2216} {"train_loss": -12.381423950195312, "global_step": 372389, "epoch": 2216} {"train_loss": -12.465225219726562, "global_step": 372390, "epoch": 2216} {"train_loss": -12.324361801147461, "global_step": 372391, "epoch": 2216} {"train_loss": -12.555495262145996, "global_step": 372392, "epoch": 2216} {"train_loss": -12.499395370483398, "global_step": 372393, "epoch": 2216} {"train_loss": -12.48243236541748, "global_step": 372394, "epoch": 2216} {"train_loss": -12.668018341064453, "global_step": 372395, "epoch": 2216} {"train_loss": -12.818683624267578, "global_step": 372396, "epoch": 2216} {"train_loss": -12.82797622680664, "global_step": 372397, "epoch": 2216} {"train_loss": -12.569711685180664, "global_step": 372398, "epoch": 2216} {"train_loss": -12.536467552185059, "global_step": 372399, "epoch": 2216} {"train_loss": -12.543916702270508, "global_step": 372400, "epoch": 2216} {"train_loss": -12.686349868774414, "global_step": 372401, "epoch": 2216} {"train_loss": -12.806548118591309, "global_step": 372402, "epoch": 2216} {"train_loss": -12.771842956542969, "global_step": 372403, "epoch": 2216} {"train_loss": -12.413808822631836, "global_step": 372404, "epoch": 2216} {"train_loss": -12.606170654296875, "global_step": 372405, "epoch": 2216} {"train_loss": -12.55947208404541, "global_step": 372406, "epoch": 2216} {"train_loss": -12.04736614227295, "global_step": 372407, "epoch": 2216} {"train_loss": -12.331368446350098, "global_step": 372408, "epoch": 2216} {"train_loss": -12.371198654174805, "global_step": 372409, "epoch": 2216} {"train_loss": -12.160377502441406, "global_step": 372410, "epoch": 2216} {"train_loss": -12.459386825561523, "global_step": 372411, "epoch": 2216} {"train_loss": -12.402022361755371, "global_step": 372412, "epoch": 2216} {"train_loss": -12.417903900146484, "global_step": 372413, "epoch": 2216} {"train_loss": -12.15809440612793, "global_step": 372414, "epoch": 2216} {"train_loss": -12.441783905029297, "global_step": 372415, "epoch": 2216} {"train_loss": -12.217506408691406, "global_step": 372416, "epoch": 2216} {"train_loss": -12.615803718566895, "global_step": 372417, "epoch": 2216} {"train_loss": -12.128582000732422, "global_step": 372418, "epoch": 2216} {"train_loss": -12.220787048339844, "global_step": 372419, "epoch": 2216} {"train_loss": -12.417932510375977, "global_step": 372420, "epoch": 2216} {"train_loss": -12.390172004699707, "global_step": 372421, "epoch": 2216} {"train_loss": -12.390571594238281, "global_step": 372422, "epoch": 2216} {"train_loss": -12.386808395385742, "global_step": 372423, "epoch": 2216} {"train_loss": -11.704984664916992, "global_step": 372424, "epoch": 2216} {"train_loss": -11.849294662475586, "global_step": 372425, "epoch": 2216} {"train_loss": -12.198297500610352, "global_step": 372426, "epoch": 2216} {"train_loss": -11.956258773803711, "global_step": 372427, "epoch": 2216} {"train_loss": -11.402807235717773, "global_step": 372428, "epoch": 2216} {"train_loss": -12.167980194091797, "global_step": 372429, "epoch": 2216} {"train_loss": -12.452234268188477, "global_step": 372430, "epoch": 2216} {"train_loss": -11.682121276855469, "global_step": 372431, "epoch": 2216} {"train_loss": -10.630067825317383, "global_step": 372432, "epoch": 2216} {"train_loss": -12.258648872375488, "global_step": 372433, "epoch": 2216} {"train_loss": -11.50665283203125, "global_step": 372434, "epoch": 2216} {"train_loss": -11.193643569946289, "global_step": 372435, "epoch": 2216} {"train_loss": -11.915458679199219, "global_step": 372436, "epoch": 2216} {"train_loss": -11.667367935180664, "global_step": 372437, "epoch": 2216} {"train_loss": -9.894826889038086, "global_step": 372438, "epoch": 2216} {"train_loss": -11.960603713989258, "global_step": 372439, "epoch": 2216} {"train_loss": -11.469358444213867, "global_step": 372440, "epoch": 2216} {"train_loss": -10.351706504821777, "global_step": 372441, "epoch": 2216} {"train_loss": -10.965559005737305, "global_step": 372442, "epoch": 2216} {"train_loss": -11.028884887695312, "global_step": 372443, "epoch": 2216} {"train_loss": -11.181658744812012, "global_step": 372444, "epoch": 2216} {"train_loss": -12.034975051879883, "global_step": 372445, "epoch": 2216} {"train_loss": -10.972371101379395, "global_step": 372446, "epoch": 2216} {"train_loss": -11.897607803344727, "global_step": 372447, "epoch": 2216} {"train_loss": -11.954134941101074, "global_step": 372448, "epoch": 2216} {"train_loss": -11.592296600341797, "global_step": 372449, "epoch": 2216} {"train_loss": -12.106139183044434, "global_step": 372450, "epoch": 2216} {"train_loss": -11.903131484985352, "global_step": 372451, "epoch": 2216} {"train_loss": -12.287315368652344, "global_step": 372452, "epoch": 2216} {"train_loss": -11.960227012634277, "global_step": 372453, "epoch": 2216} {"train_loss": -12.328004837036133, "global_step": 372454, "epoch": 2216} {"train_loss": -11.976939933640617, "global_step": 372455, "epoch": 2216, "val_loss": 290293.71875} {"train_loss": -12.465572357177734, "global_step": 372456, "epoch": 2217} {"train_loss": -11.924115180969238, "global_step": 372457, "epoch": 2217} {"train_loss": -12.632683753967285, "global_step": 372458, "epoch": 2217} {"train_loss": -11.75112247467041, "global_step": 372459, "epoch": 2217} {"train_loss": -12.169098854064941, "global_step": 372460, "epoch": 2217} {"train_loss": -12.272268295288086, "global_step": 372461, "epoch": 2217} {"train_loss": -12.300214767456055, "global_step": 372462, "epoch": 2217} {"train_loss": -12.019238471984863, "global_step": 372463, "epoch": 2217} {"train_loss": -12.475687026977539, "global_step": 372464, "epoch": 2217} {"train_loss": -12.093596458435059, "global_step": 372465, "epoch": 2217} {"train_loss": -12.185738563537598, "global_step": 372466, "epoch": 2217} {"train_loss": -11.903814315795898, "global_step": 372467, "epoch": 2217} {"train_loss": -12.33642864227295, "global_step": 372468, "epoch": 2217} {"train_loss": -11.90223503112793, "global_step": 372469, "epoch": 2217} {"train_loss": -12.177796363830566, "global_step": 372470, "epoch": 2217} {"train_loss": -11.62246036529541, "global_step": 372471, "epoch": 2217} {"train_loss": -11.87993049621582, "global_step": 372472, "epoch": 2217} {"train_loss": -12.347455024719238, "global_step": 372473, "epoch": 2217} {"train_loss": -11.862634658813477, "global_step": 372474, "epoch": 2217} {"train_loss": -12.23320484161377, "global_step": 372475, "epoch": 2217} {"train_loss": -12.04886245727539, "global_step": 372476, "epoch": 2217} {"train_loss": -11.706722259521484, "global_step": 372477, "epoch": 2217} {"train_loss": -11.895155906677246, "global_step": 372478, "epoch": 2217} {"train_loss": -11.651508331298828, "global_step": 372479, "epoch": 2217} {"train_loss": -10.485162734985352, "global_step": 372480, "epoch": 2217} {"train_loss": -12.213979721069336, "global_step": 372481, "epoch": 2217} {"train_loss": -11.076194763183594, "global_step": 372482, "epoch": 2217} {"train_loss": -11.767818450927734, "global_step": 372483, "epoch": 2217} {"train_loss": -10.957258224487305, "global_step": 372484, "epoch": 2217} {"train_loss": -10.738506317138672, "global_step": 372485, "epoch": 2217} {"train_loss": -12.100845336914062, "global_step": 372486, "epoch": 2217} {"train_loss": -10.698395729064941, "global_step": 372487, "epoch": 2217} {"train_loss": -11.944747924804688, "global_step": 372488, "epoch": 2217} {"train_loss": -10.490032196044922, "global_step": 372489, "epoch": 2217} {"train_loss": -11.104473114013672, "global_step": 372490, "epoch": 2217} {"train_loss": -11.784423828125, "global_step": 372491, "epoch": 2217} {"train_loss": -11.208173751831055, "global_step": 372492, "epoch": 2217} {"train_loss": -12.2787504196167, "global_step": 372493, "epoch": 2217} {"train_loss": -11.30291748046875, "global_step": 372494, "epoch": 2217} {"train_loss": -11.588081359863281, "global_step": 372495, "epoch": 2217} {"train_loss": -11.802694320678711, "global_step": 372496, "epoch": 2217} {"train_loss": -11.585884094238281, "global_step": 372497, "epoch": 2217} {"train_loss": -12.024914741516113, "global_step": 372498, "epoch": 2217} {"train_loss": -11.855817794799805, "global_step": 372499, "epoch": 2217} {"train_loss": -11.951513290405273, "global_step": 372500, "epoch": 2217} {"train_loss": -11.441934585571289, "global_step": 372501, "epoch": 2217} {"train_loss": -12.371172904968262, "global_step": 372502, "epoch": 2217} {"train_loss": -11.846183776855469, "global_step": 372503, "epoch": 2217} {"train_loss": -12.206006050109863, "global_step": 372504, "epoch": 2217} {"train_loss": -12.220362663269043, "global_step": 372505, "epoch": 2217} {"train_loss": -11.828537940979004, "global_step": 372506, "epoch": 2217} {"train_loss": -12.137577056884766, "global_step": 372507, "epoch": 2217} {"train_loss": -12.10068130493164, "global_step": 372508, "epoch": 2217} {"train_loss": -12.46839714050293, "global_step": 372509, "epoch": 2217} {"train_loss": -11.800897598266602, "global_step": 372510, "epoch": 2217} {"train_loss": -11.860430717468262, "global_step": 372511, "epoch": 2217} {"train_loss": -11.868330001831055, "global_step": 372512, "epoch": 2217} {"train_loss": -11.670609474182129, "global_step": 372513, "epoch": 2217} {"train_loss": -12.187623977661133, "global_step": 372514, "epoch": 2217} {"train_loss": -11.278512954711914, "global_step": 372515, "epoch": 2217} {"train_loss": -11.936227798461914, "global_step": 372516, "epoch": 2217} {"train_loss": -11.645525932312012, "global_step": 372517, "epoch": 2217} {"train_loss": -11.723522186279297, "global_step": 372518, "epoch": 2217} {"train_loss": -12.01915454864502, "global_step": 372519, "epoch": 2217} {"train_loss": -10.90176773071289, "global_step": 372520, "epoch": 2217} {"train_loss": -11.313774108886719, "global_step": 372521, "epoch": 2217} {"train_loss": -10.759241104125977, "global_step": 372522, "epoch": 2217} {"train_loss": -10.169092178344727, "global_step": 372523, "epoch": 2217} {"train_loss": -9.938678741455078, "global_step": 372524, "epoch": 2217} {"train_loss": -12.011829376220703, "global_step": 372525, "epoch": 2217} {"train_loss": -10.580301284790039, "global_step": 372526, "epoch": 2217} {"train_loss": -10.661006927490234, "global_step": 372527, "epoch": 2217} {"train_loss": -12.012831687927246, "global_step": 372528, "epoch": 2217} {"train_loss": -10.28533935546875, "global_step": 372529, "epoch": 2217} {"train_loss": -10.936238288879395, "global_step": 372530, "epoch": 2217} {"train_loss": -11.002668380737305, "global_step": 372531, "epoch": 2217} {"train_loss": -9.832889556884766, "global_step": 372532, "epoch": 2217} {"train_loss": -11.934921264648438, "global_step": 372533, "epoch": 2217} {"train_loss": -10.581438064575195, "global_step": 372534, "epoch": 2217} {"train_loss": -10.504642486572266, "global_step": 372535, "epoch": 2217} {"train_loss": -10.418055534362793, "global_step": 372536, "epoch": 2217} {"train_loss": -10.895856857299805, "global_step": 372537, "epoch": 2217} {"train_loss": -10.271625518798828, "global_step": 372538, "epoch": 2217} {"train_loss": -12.171761512756348, "global_step": 372539, "epoch": 2217} {"train_loss": -11.04818344116211, "global_step": 372540, "epoch": 2217} {"train_loss": -11.212919235229492, "global_step": 372541, "epoch": 2217} {"train_loss": -11.670112609863281, "global_step": 372542, "epoch": 2217} {"train_loss": -11.629602432250977, "global_step": 372543, "epoch": 2217} {"train_loss": -11.749723434448242, "global_step": 372544, "epoch": 2217} {"train_loss": -11.729989051818848, "global_step": 372545, "epoch": 2217} {"train_loss": -11.799737930297852, "global_step": 372546, "epoch": 2217} {"train_loss": -11.405559539794922, "global_step": 372547, "epoch": 2217} {"train_loss": -11.794011116027832, "global_step": 372548, "epoch": 2217} {"train_loss": -11.73444652557373, "global_step": 372549, "epoch": 2217} {"train_loss": -11.834543228149414, "global_step": 372550, "epoch": 2217} {"train_loss": -11.914703369140625, "global_step": 372551, "epoch": 2217} {"train_loss": -11.859886169433594, "global_step": 372552, "epoch": 2217} {"train_loss": -12.193742752075195, "global_step": 372553, "epoch": 2217} {"train_loss": -11.758386611938477, "global_step": 372554, "epoch": 2217} {"train_loss": -11.729057312011719, "global_step": 372555, "epoch": 2217} {"train_loss": -12.125139236450195, "global_step": 372556, "epoch": 2217} {"train_loss": -11.917420387268066, "global_step": 372557, "epoch": 2217} {"train_loss": -12.100149154663086, "global_step": 372558, "epoch": 2217} {"train_loss": -11.813691139221191, "global_step": 372559, "epoch": 2217} {"train_loss": -12.235063552856445, "global_step": 372560, "epoch": 2217} {"train_loss": -11.94253158569336, "global_step": 372561, "epoch": 2217} {"train_loss": -11.642061233520508, "global_step": 372562, "epoch": 2217} {"train_loss": -12.029386520385742, "global_step": 372563, "epoch": 2217} {"train_loss": -12.050239562988281, "global_step": 372564, "epoch": 2217} {"train_loss": -11.520441055297852, "global_step": 372565, "epoch": 2217} {"train_loss": -12.15379524230957, "global_step": 372566, "epoch": 2217} {"train_loss": -11.984563827514648, "global_step": 372567, "epoch": 2217} {"train_loss": -12.106101989746094, "global_step": 372568, "epoch": 2217} {"train_loss": -12.32780933380127, "global_step": 372569, "epoch": 2217} {"train_loss": -12.0123929977417, "global_step": 372570, "epoch": 2217} {"train_loss": -12.196806907653809, "global_step": 372571, "epoch": 2217} {"train_loss": -12.12021541595459, "global_step": 372572, "epoch": 2217} {"train_loss": -12.470474243164062, "global_step": 372573, "epoch": 2217} {"train_loss": -12.198352813720703, "global_step": 372574, "epoch": 2217} {"train_loss": -12.302591323852539, "global_step": 372575, "epoch": 2217} {"train_loss": -12.28640365600586, "global_step": 372576, "epoch": 2217} {"train_loss": -12.359298706054688, "global_step": 372577, "epoch": 2217} {"train_loss": -12.117561340332031, "global_step": 372578, "epoch": 2217} {"train_loss": -11.890035629272461, "global_step": 372579, "epoch": 2217} {"train_loss": -12.087815284729004, "global_step": 372580, "epoch": 2217} {"train_loss": -12.167839050292969, "global_step": 372581, "epoch": 2217} {"train_loss": -12.241480827331543, "global_step": 372582, "epoch": 2217} {"train_loss": -12.102188110351562, "global_step": 372583, "epoch": 2217} {"train_loss": -12.34874153137207, "global_step": 372584, "epoch": 2217} {"train_loss": -12.30762767791748, "global_step": 372585, "epoch": 2217} {"train_loss": -12.234686851501465, "global_step": 372586, "epoch": 2217} {"train_loss": -12.421335220336914, "global_step": 372587, "epoch": 2217} {"train_loss": -12.468120574951172, "global_step": 372588, "epoch": 2217} {"train_loss": -12.242324829101562, "global_step": 372589, "epoch": 2217} {"train_loss": -12.319849014282227, "global_step": 372590, "epoch": 2217} {"train_loss": -12.287836074829102, "global_step": 372591, "epoch": 2217} {"train_loss": -12.409340858459473, "global_step": 372592, "epoch": 2217} {"train_loss": -12.40592098236084, "global_step": 372593, "epoch": 2217} {"train_loss": -12.50961685180664, "global_step": 372594, "epoch": 2217} {"train_loss": -12.433374404907227, "global_step": 372595, "epoch": 2217} {"train_loss": -12.533209800720215, "global_step": 372596, "epoch": 2217} {"train_loss": -12.18423080444336, "global_step": 372597, "epoch": 2217} {"train_loss": -12.426658630371094, "global_step": 372598, "epoch": 2217} {"train_loss": -12.404704093933105, "global_step": 372599, "epoch": 2217} {"train_loss": -12.723363876342773, "global_step": 372600, "epoch": 2217} {"train_loss": -12.489782333374023, "global_step": 372601, "epoch": 2217} {"train_loss": -12.535446166992188, "global_step": 372602, "epoch": 2217} {"train_loss": -12.416109085083008, "global_step": 372603, "epoch": 2217} {"train_loss": -12.694987297058105, "global_step": 372604, "epoch": 2217} {"train_loss": -12.631576538085938, "global_step": 372605, "epoch": 2217} {"train_loss": -12.61038875579834, "global_step": 372606, "epoch": 2217} {"train_loss": -12.502494812011719, "global_step": 372607, "epoch": 2217} {"train_loss": -12.518108367919922, "global_step": 372608, "epoch": 2217} {"train_loss": -12.560152053833008, "global_step": 372609, "epoch": 2217} {"train_loss": -12.7731351852417, "global_step": 372610, "epoch": 2217} {"train_loss": -12.610382080078125, "global_step": 372611, "epoch": 2217} {"train_loss": -12.541923522949219, "global_step": 372612, "epoch": 2217} {"train_loss": -12.387890815734863, "global_step": 372613, "epoch": 2217} {"train_loss": -12.647579193115234, "global_step": 372614, "epoch": 2217} {"train_loss": -12.663780212402344, "global_step": 372615, "epoch": 2217} {"train_loss": -12.553861618041992, "global_step": 372616, "epoch": 2217} {"train_loss": -12.63516616821289, "global_step": 372617, "epoch": 2217} {"train_loss": -12.354288101196289, "global_step": 372618, "epoch": 2217} {"train_loss": -12.667654037475586, "global_step": 372619, "epoch": 2217} {"train_loss": -12.23105239868164, "global_step": 372620, "epoch": 2217} {"train_loss": -12.759317398071289, "global_step": 372621, "epoch": 2217} {"train_loss": -12.603132247924805, "global_step": 372622, "epoch": 2217} {"train_loss": -11.904210766156515, "global_step": 372623, "epoch": 2217, "val_loss": 293882.15625} {"train_loss": -12.613677024841309, "global_step": 372624, "epoch": 2218} {"train_loss": -12.512996673583984, "global_step": 372625, "epoch": 2218} {"train_loss": -12.523513793945312, "global_step": 372626, "epoch": 2218} {"train_loss": -12.606636047363281, "global_step": 372627, "epoch": 2218} {"train_loss": -12.361053466796875, "global_step": 372628, "epoch": 2218} {"train_loss": -12.51785659790039, "global_step": 372629, "epoch": 2218} {"train_loss": -12.34542465209961, "global_step": 372630, "epoch": 2218} {"train_loss": -11.528816223144531, "global_step": 372631, "epoch": 2218} {"train_loss": -11.91898250579834, "global_step": 372632, "epoch": 2218} {"train_loss": -12.396081924438477, "global_step": 372633, "epoch": 2218} {"train_loss": -11.359664916992188, "global_step": 372634, "epoch": 2218} {"train_loss": -10.553261756896973, "global_step": 372635, "epoch": 2218} {"train_loss": -11.640416145324707, "global_step": 372636, "epoch": 2218} {"train_loss": -12.434847831726074, "global_step": 372637, "epoch": 2218} {"train_loss": -12.148027420043945, "global_step": 372638, "epoch": 2218} {"train_loss": -10.981107711791992, "global_step": 372639, "epoch": 2218} {"train_loss": -11.961915969848633, "global_step": 372640, "epoch": 2218} {"train_loss": -12.426756858825684, "global_step": 372641, "epoch": 2218} {"train_loss": -12.108675956726074, "global_step": 372642, "epoch": 2218} {"train_loss": -11.970352172851562, "global_step": 372643, "epoch": 2218} {"train_loss": -12.166714668273926, "global_step": 372644, "epoch": 2218} {"train_loss": -11.797431945800781, "global_step": 372645, "epoch": 2218} {"train_loss": -12.261751174926758, "global_step": 372646, "epoch": 2218} {"train_loss": -11.873262405395508, "global_step": 372647, "epoch": 2218} {"train_loss": -12.11015796661377, "global_step": 372648, "epoch": 2218} {"train_loss": -11.959912300109863, "global_step": 372649, "epoch": 2218} {"train_loss": -11.146328926086426, "global_step": 372650, "epoch": 2218} {"train_loss": -12.236948013305664, "global_step": 372651, "epoch": 2218} {"train_loss": -11.666772842407227, "global_step": 372652, "epoch": 2218} {"train_loss": -11.08885383605957, "global_step": 372653, "epoch": 2218} {"train_loss": -12.277509689331055, "global_step": 372654, "epoch": 2218} {"train_loss": -11.335329055786133, "global_step": 372655, "epoch": 2218} {"train_loss": -12.017940521240234, "global_step": 372656, "epoch": 2218} {"train_loss": -11.85428237915039, "global_step": 372657, "epoch": 2218} {"train_loss": -12.255403518676758, "global_step": 372658, "epoch": 2218} {"train_loss": -12.10162353515625, "global_step": 372659, "epoch": 2218} {"train_loss": -11.844783782958984, "global_step": 372660, "epoch": 2218} {"train_loss": -12.112604141235352, "global_step": 372661, "epoch": 2218} {"train_loss": -12.035028457641602, "global_step": 372662, "epoch": 2218} {"train_loss": -11.564094543457031, "global_step": 372663, "epoch": 2218} {"train_loss": -11.762687683105469, "global_step": 372664, "epoch": 2218} {"train_loss": -11.779243469238281, "global_step": 372665, "epoch": 2218} {"train_loss": -11.168412208557129, "global_step": 372666, "epoch": 2218} {"train_loss": -11.922628402709961, "global_step": 372667, "epoch": 2218} {"train_loss": -10.570520401000977, "global_step": 372668, "epoch": 2218} {"train_loss": -12.105749130249023, "global_step": 372669, "epoch": 2218} {"train_loss": -11.821856498718262, "global_step": 372670, "epoch": 2218} {"train_loss": -12.481988906860352, "global_step": 372671, "epoch": 2218} {"train_loss": -11.844741821289062, "global_step": 372672, "epoch": 2218} {"train_loss": -12.06144905090332, "global_step": 372673, "epoch": 2218} {"train_loss": -12.046487808227539, "global_step": 372674, "epoch": 2218} {"train_loss": -11.982637405395508, "global_step": 372675, "epoch": 2218} {"train_loss": -12.319293022155762, "global_step": 372676, "epoch": 2218} {"train_loss": -11.76160717010498, "global_step": 372677, "epoch": 2218} {"train_loss": -12.456855773925781, "global_step": 372678, "epoch": 2218} {"train_loss": -11.526908874511719, "global_step": 372679, "epoch": 2218} {"train_loss": -12.1268892288208, "global_step": 372680, "epoch": 2218} {"train_loss": -11.323968887329102, "global_step": 372681, "epoch": 2218} {"train_loss": -12.063665390014648, "global_step": 372682, "epoch": 2218} {"train_loss": -11.511922836303711, "global_step": 372683, "epoch": 2218} {"train_loss": -12.035772323608398, "global_step": 372684, "epoch": 2218} {"train_loss": -11.608419418334961, "global_step": 372685, "epoch": 2218} {"train_loss": -11.62527847290039, "global_step": 372686, "epoch": 2218} {"train_loss": -11.942525863647461, "global_step": 372687, "epoch": 2218} {"train_loss": -11.143167495727539, "global_step": 372688, "epoch": 2218} {"train_loss": -12.01382827758789, "global_step": 372689, "epoch": 2218} {"train_loss": -11.3358793258667, "global_step": 372690, "epoch": 2218} {"train_loss": -11.421304702758789, "global_step": 372691, "epoch": 2218} {"train_loss": -11.853435516357422, "global_step": 372692, "epoch": 2218} {"train_loss": -11.600695610046387, "global_step": 372693, "epoch": 2218} {"train_loss": -11.5629243850708, "global_step": 372694, "epoch": 2218} {"train_loss": -11.632960319519043, "global_step": 372695, "epoch": 2218} {"train_loss": -11.878341674804688, "global_step": 372696, "epoch": 2218} {"train_loss": -11.714994430541992, "global_step": 372697, "epoch": 2218} {"train_loss": -11.732772827148438, "global_step": 372698, "epoch": 2218} {"train_loss": -11.631516456604004, "global_step": 372699, "epoch": 2218} {"train_loss": -11.9409818649292, "global_step": 372700, "epoch": 2218} {"train_loss": -11.382669448852539, "global_step": 372701, "epoch": 2218} {"train_loss": -12.10596752166748, "global_step": 372702, "epoch": 2218} {"train_loss": -11.436050415039062, "global_step": 372703, "epoch": 2218} {"train_loss": -11.581249237060547, "global_step": 372704, "epoch": 2218} {"train_loss": -11.842860221862793, "global_step": 372705, "epoch": 2218} {"train_loss": -11.401472091674805, "global_step": 372706, "epoch": 2218} {"train_loss": -11.939860343933105, "global_step": 372707, "epoch": 2218} {"train_loss": -11.97615909576416, "global_step": 372708, "epoch": 2218} {"train_loss": -11.63937759399414, "global_step": 372709, "epoch": 2218} {"train_loss": -12.034524917602539, "global_step": 372710, "epoch": 2218} {"train_loss": -11.845691680908203, "global_step": 372711, "epoch": 2218} {"train_loss": -11.883868217468262, "global_step": 372712, "epoch": 2218} {"train_loss": -11.510995864868164, "global_step": 372713, "epoch": 2218} {"train_loss": -11.567525863647461, "global_step": 372714, "epoch": 2218} {"train_loss": -12.072408676147461, "global_step": 372715, "epoch": 2218} {"train_loss": -11.67995834350586, "global_step": 372716, "epoch": 2218} {"train_loss": -12.159187316894531, "global_step": 372717, "epoch": 2218} {"train_loss": -11.943589210510254, "global_step": 372718, "epoch": 2218} {"train_loss": -12.076348304748535, "global_step": 372719, "epoch": 2218} {"train_loss": -12.29113483428955, "global_step": 372720, "epoch": 2218} {"train_loss": -12.209909439086914, "global_step": 372721, "epoch": 2218} {"train_loss": -12.235250473022461, "global_step": 372722, "epoch": 2218} {"train_loss": -12.232034683227539, "global_step": 372723, "epoch": 2218} {"train_loss": -12.093229293823242, "global_step": 372724, "epoch": 2218} {"train_loss": -12.079520225524902, "global_step": 372725, "epoch": 2218} {"train_loss": -12.202803611755371, "global_step": 372726, "epoch": 2218} {"train_loss": -12.12966537475586, "global_step": 372727, "epoch": 2218} {"train_loss": -12.024337768554688, "global_step": 372728, "epoch": 2218} {"train_loss": -12.347620010375977, "global_step": 372729, "epoch": 2218} {"train_loss": -12.364823341369629, "global_step": 372730, "epoch": 2218} {"train_loss": -12.009788513183594, "global_step": 372731, "epoch": 2218} {"train_loss": -12.237178802490234, "global_step": 372732, "epoch": 2218} {"train_loss": -12.050811767578125, "global_step": 372733, "epoch": 2218} {"train_loss": -12.517023086547852, "global_step": 372734, "epoch": 2218} {"train_loss": -11.811393737792969, "global_step": 372735, "epoch": 2218} {"train_loss": -12.269826889038086, "global_step": 372736, "epoch": 2218} {"train_loss": -12.210647583007812, "global_step": 372737, "epoch": 2218} {"train_loss": -12.002527236938477, "global_step": 372738, "epoch": 2218} {"train_loss": -12.021645545959473, "global_step": 372739, "epoch": 2218} {"train_loss": -12.24612808227539, "global_step": 372740, "epoch": 2218} {"train_loss": -12.012393951416016, "global_step": 372741, "epoch": 2218} {"train_loss": -12.59615707397461, "global_step": 372742, "epoch": 2218} {"train_loss": -12.159093856811523, "global_step": 372743, "epoch": 2218} {"train_loss": -12.539565086364746, "global_step": 372744, "epoch": 2218} {"train_loss": -12.275206565856934, "global_step": 372745, "epoch": 2218} {"train_loss": -12.280740737915039, "global_step": 372746, "epoch": 2218} {"train_loss": -12.35094165802002, "global_step": 372747, "epoch": 2218} {"train_loss": -11.91948413848877, "global_step": 372748, "epoch": 2218} {"train_loss": -12.698236465454102, "global_step": 372749, "epoch": 2218} {"train_loss": -12.013448715209961, "global_step": 372750, "epoch": 2218} {"train_loss": -12.292802810668945, "global_step": 372751, "epoch": 2218} {"train_loss": -12.146679878234863, "global_step": 372752, "epoch": 2218} {"train_loss": -12.218893051147461, "global_step": 372753, "epoch": 2218} {"train_loss": -12.273387908935547, "global_step": 372754, "epoch": 2218} {"train_loss": -12.229939460754395, "global_step": 372755, "epoch": 2218} {"train_loss": -12.592347145080566, "global_step": 372756, "epoch": 2218} {"train_loss": -12.209354400634766, "global_step": 372757, "epoch": 2218} {"train_loss": -12.428741455078125, "global_step": 372758, "epoch": 2218} {"train_loss": -12.552175521850586, "global_step": 372759, "epoch": 2218} {"train_loss": -12.726669311523438, "global_step": 372760, "epoch": 2218} {"train_loss": -12.478111267089844, "global_step": 372761, "epoch": 2218} {"train_loss": -12.585173606872559, "global_step": 372762, "epoch": 2218} {"train_loss": -12.48023509979248, "global_step": 372763, "epoch": 2218} {"train_loss": -12.686019897460938, "global_step": 372764, "epoch": 2218} {"train_loss": -12.545698165893555, "global_step": 372765, "epoch": 2218} {"train_loss": -12.46941089630127, "global_step": 372766, "epoch": 2218} {"train_loss": -12.644609451293945, "global_step": 372767, "epoch": 2218} {"train_loss": -12.690584182739258, "global_step": 372768, "epoch": 2218} {"train_loss": -12.528969764709473, "global_step": 372769, "epoch": 2218} {"train_loss": -12.651100158691406, "global_step": 372770, "epoch": 2218} {"train_loss": -12.595666885375977, "global_step": 372771, "epoch": 2218} {"train_loss": -12.502609252929688, "global_step": 372772, "epoch": 2218} {"train_loss": -12.663429260253906, "global_step": 372773, "epoch": 2218} {"train_loss": -12.687475204467773, "global_step": 372774, "epoch": 2218} {"train_loss": -12.38347053527832, "global_step": 372775, "epoch": 2218} {"train_loss": -12.638446807861328, "global_step": 372776, "epoch": 2218} {"train_loss": -12.516544342041016, "global_step": 372777, "epoch": 2218} {"train_loss": -12.691701889038086, "global_step": 372778, "epoch": 2218} {"train_loss": -12.718149185180664, "global_step": 372779, "epoch": 2218} {"train_loss": -12.666109085083008, "global_step": 372780, "epoch": 2218} {"train_loss": -12.750865936279297, "global_step": 372781, "epoch": 2218} {"train_loss": -12.87696647644043, "global_step": 372782, "epoch": 2218} {"train_loss": -12.683990478515625, "global_step": 372783, "epoch": 2218} {"train_loss": -12.844796180725098, "global_step": 372784, "epoch": 2218} {"train_loss": -12.734270095825195, "global_step": 372785, "epoch": 2218} {"train_loss": -12.703428268432617, "global_step": 372786, "epoch": 2218} {"train_loss": -12.757186889648438, "global_step": 372787, "epoch": 2218} {"train_loss": -12.641974449157715, "global_step": 372788, "epoch": 2218} {"train_loss": -12.834634780883789, "global_step": 372789, "epoch": 2218} {"train_loss": -13.072126388549805, "global_step": 372790, "epoch": 2218} {"train_loss": -12.09925659497579, "global_step": 372791, "epoch": 2218, "val_loss": 292646.75} {"train_loss": -12.996966361999512, "global_step": 372792, "epoch": 2219} {"train_loss": -12.848498344421387, "global_step": 372793, "epoch": 2219} {"train_loss": -12.651822090148926, "global_step": 372794, "epoch": 2219} {"train_loss": -12.51298999786377, "global_step": 372795, "epoch": 2219} {"train_loss": -12.692802429199219, "global_step": 372796, "epoch": 2219} {"train_loss": -12.597763061523438, "global_step": 372797, "epoch": 2219} {"train_loss": -12.525463104248047, "global_step": 372798, "epoch": 2219} {"train_loss": -12.85782241821289, "global_step": 372799, "epoch": 2219} {"train_loss": -12.484182357788086, "global_step": 372800, "epoch": 2219} {"train_loss": -12.406723022460938, "global_step": 372801, "epoch": 2219} {"train_loss": -12.843910217285156, "global_step": 372802, "epoch": 2219} {"train_loss": -12.71693229675293, "global_step": 372803, "epoch": 2219} {"train_loss": -12.743270874023438, "global_step": 372804, "epoch": 2219} {"train_loss": -12.576428413391113, "global_step": 372805, "epoch": 2219} {"train_loss": -12.428985595703125, "global_step": 372806, "epoch": 2219} {"train_loss": -12.355813980102539, "global_step": 372807, "epoch": 2219} {"train_loss": -12.434396743774414, "global_step": 372808, "epoch": 2219} {"train_loss": -12.018774032592773, "global_step": 372809, "epoch": 2219} {"train_loss": -11.392762184143066, "global_step": 372810, "epoch": 2219} {"train_loss": -11.991633415222168, "global_step": 372811, "epoch": 2219} {"train_loss": -12.648359298706055, "global_step": 372812, "epoch": 2219} {"train_loss": -12.018129348754883, "global_step": 372813, "epoch": 2219} {"train_loss": -10.832961082458496, "global_step": 372814, "epoch": 2219} {"train_loss": -11.641742706298828, "global_step": 372815, "epoch": 2219} {"train_loss": -12.056694984436035, "global_step": 372816, "epoch": 2219} {"train_loss": -11.494664192199707, "global_step": 372817, "epoch": 2219} {"train_loss": -11.714686393737793, "global_step": 372818, "epoch": 2219} {"train_loss": -12.494144439697266, "global_step": 372819, "epoch": 2219} {"train_loss": -11.46667194366455, "global_step": 372820, "epoch": 2219} {"train_loss": -11.99491024017334, "global_step": 372821, "epoch": 2219} {"train_loss": -11.737074851989746, "global_step": 372822, "epoch": 2219} {"train_loss": -12.4466552734375, "global_step": 372823, "epoch": 2219} {"train_loss": -12.404831886291504, "global_step": 372824, "epoch": 2219} {"train_loss": -12.155985832214355, "global_step": 372825, "epoch": 2219} {"train_loss": -12.15477466583252, "global_step": 372826, "epoch": 2219} {"train_loss": -11.765738487243652, "global_step": 372827, "epoch": 2219} {"train_loss": -11.783496856689453, "global_step": 372828, "epoch": 2219} {"train_loss": -11.492815971374512, "global_step": 372829, "epoch": 2219} {"train_loss": -11.930854797363281, "global_step": 372830, "epoch": 2219} {"train_loss": -10.466712951660156, "global_step": 372831, "epoch": 2219} {"train_loss": -12.321149826049805, "global_step": 372832, "epoch": 2219} {"train_loss": -11.137933731079102, "global_step": 372833, "epoch": 2219} {"train_loss": -10.23193359375, "global_step": 372834, "epoch": 2219} {"train_loss": -12.139398574829102, "global_step": 372835, "epoch": 2219} {"train_loss": -10.020147323608398, "global_step": 372836, "epoch": 2219} {"train_loss": -11.019190788269043, "global_step": 372837, "epoch": 2219} {"train_loss": -11.725428581237793, "global_step": 372838, "epoch": 2219} {"train_loss": -11.239286422729492, "global_step": 372839, "epoch": 2219} {"train_loss": -12.30296516418457, "global_step": 372840, "epoch": 2219} {"train_loss": -12.007720947265625, "global_step": 372841, "epoch": 2219} {"train_loss": -11.740071296691895, "global_step": 372842, "epoch": 2219} {"train_loss": -11.837865829467773, "global_step": 372843, "epoch": 2219} {"train_loss": -12.245413780212402, "global_step": 372844, "epoch": 2219} {"train_loss": -11.56070327758789, "global_step": 372845, "epoch": 2219} {"train_loss": -11.829436302185059, "global_step": 372846, "epoch": 2219} {"train_loss": -12.067272186279297, "global_step": 372847, "epoch": 2219} {"train_loss": -12.18862533569336, "global_step": 372848, "epoch": 2219} {"train_loss": -12.326980590820312, "global_step": 372849, "epoch": 2219} {"train_loss": -11.951601028442383, "global_step": 372850, "epoch": 2219} {"train_loss": -11.992331504821777, "global_step": 372851, "epoch": 2219} {"train_loss": -12.460790634155273, "global_step": 372852, "epoch": 2219} {"train_loss": -12.061832427978516, "global_step": 372853, "epoch": 2219} {"train_loss": -12.290512084960938, "global_step": 372854, "epoch": 2219} {"train_loss": -12.190231323242188, "global_step": 372855, "epoch": 2219} {"train_loss": -12.317350387573242, "global_step": 372856, "epoch": 2219} {"train_loss": -12.011380195617676, "global_step": 372857, "epoch": 2219} {"train_loss": -12.407181739807129, "global_step": 372858, "epoch": 2219} {"train_loss": -12.352766036987305, "global_step": 372859, "epoch": 2219} {"train_loss": -12.1520357131958, "global_step": 372860, "epoch": 2219} {"train_loss": -12.504737854003906, "global_step": 372861, "epoch": 2219} {"train_loss": -12.613595008850098, "global_step": 372862, "epoch": 2219} {"train_loss": -12.446306228637695, "global_step": 372863, "epoch": 2219} {"train_loss": -12.666816711425781, "global_step": 372864, "epoch": 2219} {"train_loss": -12.40410041809082, "global_step": 372865, "epoch": 2219} {"train_loss": -12.383378028869629, "global_step": 372866, "epoch": 2219} {"train_loss": -12.555980682373047, "global_step": 372867, "epoch": 2219} {"train_loss": -12.347339630126953, "global_step": 372868, "epoch": 2219} {"train_loss": -12.524505615234375, "global_step": 372869, "epoch": 2219} {"train_loss": -12.426630020141602, "global_step": 372870, "epoch": 2219} {"train_loss": -12.234224319458008, "global_step": 372871, "epoch": 2219} {"train_loss": -12.173391342163086, "global_step": 372872, "epoch": 2219} {"train_loss": -12.719857215881348, "global_step": 372873, "epoch": 2219} {"train_loss": -12.360628128051758, "global_step": 372874, "epoch": 2219} {"train_loss": -12.549084663391113, "global_step": 372875, "epoch": 2219} {"train_loss": -12.5531644821167, "global_step": 372876, "epoch": 2219} {"train_loss": -12.012880325317383, "global_step": 372877, "epoch": 2219} {"train_loss": -12.643945693969727, "global_step": 372878, "epoch": 2219} {"train_loss": -12.318635940551758, "global_step": 372879, "epoch": 2219} {"train_loss": -12.339313507080078, "global_step": 372880, "epoch": 2219} {"train_loss": -12.514095306396484, "global_step": 372881, "epoch": 2219} {"train_loss": -12.446333885192871, "global_step": 372882, "epoch": 2219} {"train_loss": -12.268468856811523, "global_step": 372883, "epoch": 2219} {"train_loss": -12.447242736816406, "global_step": 372884, "epoch": 2219} {"train_loss": -12.429065704345703, "global_step": 372885, "epoch": 2219} {"train_loss": -12.424676895141602, "global_step": 372886, "epoch": 2219} {"train_loss": -12.187820434570312, "global_step": 372887, "epoch": 2219} {"train_loss": -12.486294746398926, "global_step": 372888, "epoch": 2219} {"train_loss": -12.376665115356445, "global_step": 372889, "epoch": 2219} {"train_loss": -12.080223083496094, "global_step": 372890, "epoch": 2219} {"train_loss": -12.224102020263672, "global_step": 372891, "epoch": 2219} {"train_loss": -12.460338592529297, "global_step": 372892, "epoch": 2219} {"train_loss": -11.987707138061523, "global_step": 372893, "epoch": 2219} {"train_loss": -12.06193733215332, "global_step": 372894, "epoch": 2219} {"train_loss": -12.417509078979492, "global_step": 372895, "epoch": 2219} {"train_loss": -12.304200172424316, "global_step": 372896, "epoch": 2219} {"train_loss": -11.881834030151367, "global_step": 372897, "epoch": 2219} {"train_loss": -12.284686088562012, "global_step": 372898, "epoch": 2219} {"train_loss": -12.625635147094727, "global_step": 372899, "epoch": 2219} {"train_loss": -11.800527572631836, "global_step": 372900, "epoch": 2219} {"train_loss": -10.622827529907227, "global_step": 372901, "epoch": 2219} {"train_loss": -12.619983673095703, "global_step": 372902, "epoch": 2219} {"train_loss": -11.606374740600586, "global_step": 372903, "epoch": 2219} {"train_loss": -12.147993087768555, "global_step": 372904, "epoch": 2219} {"train_loss": -11.512913703918457, "global_step": 372905, "epoch": 2219} {"train_loss": -10.787118911743164, "global_step": 372906, "epoch": 2219} {"train_loss": -11.436683654785156, "global_step": 372907, "epoch": 2219} {"train_loss": -11.169228553771973, "global_step": 372908, "epoch": 2219} {"train_loss": -10.388481140136719, "global_step": 372909, "epoch": 2219} {"train_loss": -10.97881031036377, "global_step": 372910, "epoch": 2219} {"train_loss": -11.267065048217773, "global_step": 372911, "epoch": 2219} {"train_loss": -11.191354751586914, "global_step": 372912, "epoch": 2219} {"train_loss": -11.81114387512207, "global_step": 372913, "epoch": 2219} {"train_loss": -11.266246795654297, "global_step": 372914, "epoch": 2219} {"train_loss": -12.276110649108887, "global_step": 372915, "epoch": 2219} {"train_loss": -11.457296371459961, "global_step": 372916, "epoch": 2219} {"train_loss": -12.176980972290039, "global_step": 372917, "epoch": 2219} {"train_loss": -11.699869155883789, "global_step": 372918, "epoch": 2219} {"train_loss": -11.979072570800781, "global_step": 372919, "epoch": 2219} {"train_loss": -9.961129188537598, "global_step": 372920, "epoch": 2219} {"train_loss": -11.804559707641602, "global_step": 372921, "epoch": 2219} {"train_loss": -10.974264144897461, "global_step": 372922, "epoch": 2219} {"train_loss": -10.847126007080078, "global_step": 372923, "epoch": 2219} {"train_loss": -11.404617309570312, "global_step": 372924, "epoch": 2219} {"train_loss": -10.832013130187988, "global_step": 372925, "epoch": 2219} {"train_loss": -12.022571563720703, "global_step": 372926, "epoch": 2219} {"train_loss": -11.183547973632812, "global_step": 372927, "epoch": 2219} {"train_loss": -12.282142639160156, "global_step": 372928, "epoch": 2219} {"train_loss": -11.286500930786133, "global_step": 372929, "epoch": 2219} {"train_loss": -11.987460136413574, "global_step": 372930, "epoch": 2219} {"train_loss": -11.182426452636719, "global_step": 372931, "epoch": 2219} {"train_loss": -11.967830657958984, "global_step": 372932, "epoch": 2219} {"train_loss": -11.8947114944458, "global_step": 372933, "epoch": 2219} {"train_loss": -12.059985160827637, "global_step": 372934, "epoch": 2219} {"train_loss": -11.829170227050781, "global_step": 372935, "epoch": 2219} {"train_loss": -11.920184135437012, "global_step": 372936, "epoch": 2219} {"train_loss": -12.02763557434082, "global_step": 372937, "epoch": 2219} {"train_loss": -12.006449699401855, "global_step": 372938, "epoch": 2219} {"train_loss": -12.110040664672852, "global_step": 372939, "epoch": 2219} {"train_loss": -11.59947395324707, "global_step": 372940, "epoch": 2219} {"train_loss": -12.413419723510742, "global_step": 372941, "epoch": 2219} {"train_loss": -11.521795272827148, "global_step": 372942, "epoch": 2219} {"train_loss": -12.126263618469238, "global_step": 372943, "epoch": 2219} {"train_loss": -12.095449447631836, "global_step": 372944, "epoch": 2219} {"train_loss": -12.187041282653809, "global_step": 372945, "epoch": 2219} {"train_loss": -12.173940658569336, "global_step": 372946, "epoch": 2219} {"train_loss": -12.198945999145508, "global_step": 372947, "epoch": 2219} {"train_loss": -12.496767044067383, "global_step": 372948, "epoch": 2219} {"train_loss": -12.28740119934082, "global_step": 372949, "epoch": 2219} {"train_loss": -12.051509857177734, "global_step": 372950, "epoch": 2219} {"train_loss": -11.945215225219727, "global_step": 372951, "epoch": 2219} {"train_loss": -12.383143424987793, "global_step": 372952, "epoch": 2219} {"train_loss": -12.002052307128906, "global_step": 372953, "epoch": 2219} {"train_loss": -12.277669906616211, "global_step": 372954, "epoch": 2219} {"train_loss": -12.099851608276367, "global_step": 372955, "epoch": 2219} {"train_loss": -12.145486831665039, "global_step": 372956, "epoch": 2219} {"train_loss": -11.693876266479492, "global_step": 372957, "epoch": 2219} {"train_loss": -12.243844032287598, "global_step": 372958, "epoch": 2219} {"train_loss": -12.010714440118699, "global_step": 372959, "epoch": 2219, "val_loss": 291064.5625} {"train_loss": -11.668655395507812, "global_step": 372960, "epoch": 2220} {"train_loss": -12.4994478225708, "global_step": 372961, "epoch": 2220} {"train_loss": -11.894590377807617, "global_step": 372962, "epoch": 2220} {"train_loss": -12.123086929321289, "global_step": 372963, "epoch": 2220} {"train_loss": -11.893294334411621, "global_step": 372964, "epoch": 2220} {"train_loss": -12.364798545837402, "global_step": 372965, "epoch": 2220} {"train_loss": -12.266576766967773, "global_step": 372966, "epoch": 2220} {"train_loss": -12.446310043334961, "global_step": 372967, "epoch": 2220} {"train_loss": -11.959589004516602, "global_step": 372968, "epoch": 2220} {"train_loss": -12.097980499267578, "global_step": 372969, "epoch": 2220} {"train_loss": -12.410802841186523, "global_step": 372970, "epoch": 2220} {"train_loss": -12.308655738830566, "global_step": 372971, "epoch": 2220} {"train_loss": -12.260368347167969, "global_step": 372972, "epoch": 2220} {"train_loss": -12.425546646118164, "global_step": 372973, "epoch": 2220} {"train_loss": -12.193952560424805, "global_step": 372974, "epoch": 2220} {"train_loss": -12.45615005493164, "global_step": 372975, "epoch": 2220} {"train_loss": -12.312994003295898, "global_step": 372976, "epoch": 2220} {"train_loss": -12.218151092529297, "global_step": 372977, "epoch": 2220} {"train_loss": -12.366247177124023, "global_step": 372978, "epoch": 2220} {"train_loss": -12.210702896118164, "global_step": 372979, "epoch": 2220} {"train_loss": -12.456778526306152, "global_step": 372980, "epoch": 2220} {"train_loss": -12.336136817932129, "global_step": 372981, "epoch": 2220} {"train_loss": -12.18486499786377, "global_step": 372982, "epoch": 2220} {"train_loss": -12.009544372558594, "global_step": 372983, "epoch": 2220} {"train_loss": -12.515605926513672, "global_step": 372984, "epoch": 2220} {"train_loss": -12.271347999572754, "global_step": 372985, "epoch": 2220} {"train_loss": -12.360271453857422, "global_step": 372986, "epoch": 2220} {"train_loss": -12.359708786010742, "global_step": 372987, "epoch": 2220} {"train_loss": -12.707674980163574, "global_step": 372988, "epoch": 2220} {"train_loss": -12.466808319091797, "global_step": 372989, "epoch": 2220} {"train_loss": -12.165129661560059, "global_step": 372990, "epoch": 2220} {"train_loss": -12.353363990783691, "global_step": 372991, "epoch": 2220} {"train_loss": -12.019472122192383, "global_step": 372992, "epoch": 2220} {"train_loss": -12.37545394897461, "global_step": 372993, "epoch": 2220} {"train_loss": -12.018234252929688, "global_step": 372994, "epoch": 2220} {"train_loss": -12.196914672851562, "global_step": 372995, "epoch": 2220} {"train_loss": -12.338024139404297, "global_step": 372996, "epoch": 2220} {"train_loss": -12.062761306762695, "global_step": 372997, "epoch": 2220} {"train_loss": -12.27256965637207, "global_step": 372998, "epoch": 2220} {"train_loss": -11.628540992736816, "global_step": 372999, "epoch": 2220} {"train_loss": -12.574820518493652, "global_step": 373000, "epoch": 2220} {"train_loss": -12.435859680175781, "global_step": 373001, "epoch": 2220} {"train_loss": -12.16368293762207, "global_step": 373002, "epoch": 2220} {"train_loss": -12.345270156860352, "global_step": 373003, "epoch": 2220} {"train_loss": -12.527496337890625, "global_step": 373004, "epoch": 2220} {"train_loss": -12.027864456176758, "global_step": 373005, "epoch": 2220} {"train_loss": -11.947284698486328, "global_step": 373006, "epoch": 2220} {"train_loss": -12.20151138305664, "global_step": 373007, "epoch": 2220} {"train_loss": -11.226029396057129, "global_step": 373008, "epoch": 2220} {"train_loss": -12.024555206298828, "global_step": 373009, "epoch": 2220} {"train_loss": -12.247930526733398, "global_step": 373010, "epoch": 2220} {"train_loss": -12.044635772705078, "global_step": 373011, "epoch": 2220} {"train_loss": -12.44122314453125, "global_step": 373012, "epoch": 2220} {"train_loss": -12.127696990966797, "global_step": 373013, "epoch": 2220} {"train_loss": -12.36585807800293, "global_step": 373014, "epoch": 2220} {"train_loss": -11.803829193115234, "global_step": 373015, "epoch": 2220} {"train_loss": -12.197822570800781, "global_step": 373016, "epoch": 2220} {"train_loss": -11.938735961914062, "global_step": 373017, "epoch": 2220} {"train_loss": -11.790081024169922, "global_step": 373018, "epoch": 2220} {"train_loss": -11.885266304016113, "global_step": 373019, "epoch": 2220} {"train_loss": -11.039664268493652, "global_step": 373020, "epoch": 2220} {"train_loss": -10.33962345123291, "global_step": 373021, "epoch": 2220} {"train_loss": -12.12328052520752, "global_step": 373022, "epoch": 2220} {"train_loss": -10.667488098144531, "global_step": 373023, "epoch": 2220} {"train_loss": -10.372647285461426, "global_step": 373024, "epoch": 2220} {"train_loss": -11.499631881713867, "global_step": 373025, "epoch": 2220} {"train_loss": -9.652399063110352, "global_step": 373026, "epoch": 2220} {"train_loss": -11.388011932373047, "global_step": 373027, "epoch": 2220} {"train_loss": -9.107036590576172, "global_step": 373028, "epoch": 2220} {"train_loss": -10.452284812927246, "global_step": 373029, "epoch": 2220} {"train_loss": -9.981462478637695, "global_step": 373030, "epoch": 2220} {"train_loss": -10.513671875, "global_step": 373031, "epoch": 2220} {"train_loss": -10.16869068145752, "global_step": 373032, "epoch": 2220} {"train_loss": -8.355072021484375, "global_step": 373033, "epoch": 2220} {"train_loss": -7.660411834716797, "global_step": 373034, "epoch": 2220} {"train_loss": -7.705959796905518, "global_step": 373035, "epoch": 2220} {"train_loss": -8.35512638092041, "global_step": 373036, "epoch": 2220} {"train_loss": -9.375423431396484, "global_step": 373037, "epoch": 2220} {"train_loss": -9.528966903686523, "global_step": 373038, "epoch": 2220} {"train_loss": -8.787954330444336, "global_step": 373039, "epoch": 2220} {"train_loss": -8.62502384185791, "global_step": 373040, "epoch": 2220} {"train_loss": -9.22553825378418, "global_step": 373041, "epoch": 2220} {"train_loss": -9.075848579406738, "global_step": 373042, "epoch": 2220} {"train_loss": -10.056473731994629, "global_step": 373043, "epoch": 2220} {"train_loss": -9.095331192016602, "global_step": 373044, "epoch": 2220} {"train_loss": -10.08863353729248, "global_step": 373045, "epoch": 2220} {"train_loss": -10.254854202270508, "global_step": 373046, "epoch": 2220} {"train_loss": -8.731496810913086, "global_step": 373047, "epoch": 2220} {"train_loss": -11.258672714233398, "global_step": 373048, "epoch": 2220} {"train_loss": -9.895090103149414, "global_step": 373049, "epoch": 2220} {"train_loss": -9.595905303955078, "global_step": 373050, "epoch": 2220} {"train_loss": -11.045862197875977, "global_step": 373051, "epoch": 2220} {"train_loss": -11.238645553588867, "global_step": 373052, "epoch": 2220} {"train_loss": -10.25415325164795, "global_step": 373053, "epoch": 2220} {"train_loss": -10.397972106933594, "global_step": 373054, "epoch": 2220} {"train_loss": -11.134214401245117, "global_step": 373055, "epoch": 2220} {"train_loss": -10.421197891235352, "global_step": 373056, "epoch": 2220} {"train_loss": -11.452411651611328, "global_step": 373057, "epoch": 2220} {"train_loss": -10.794299125671387, "global_step": 373058, "epoch": 2220} {"train_loss": -10.93553638458252, "global_step": 373059, "epoch": 2220} {"train_loss": -11.596287727355957, "global_step": 373060, "epoch": 2220} {"train_loss": -10.768528938293457, "global_step": 373061, "epoch": 2220} {"train_loss": -11.384592056274414, "global_step": 373062, "epoch": 2220} {"train_loss": -11.828272819519043, "global_step": 373063, "epoch": 2220} {"train_loss": -11.023396492004395, "global_step": 373064, "epoch": 2220} {"train_loss": -11.836435317993164, "global_step": 373065, "epoch": 2220} {"train_loss": -11.691113471984863, "global_step": 373066, "epoch": 2220} {"train_loss": -11.315216064453125, "global_step": 373067, "epoch": 2220} {"train_loss": -12.011177062988281, "global_step": 373068, "epoch": 2220} {"train_loss": -11.663875579833984, "global_step": 373069, "epoch": 2220} {"train_loss": -11.705399513244629, "global_step": 373070, "epoch": 2220} {"train_loss": -12.007887840270996, "global_step": 373071, "epoch": 2220} {"train_loss": -11.78019905090332, "global_step": 373072, "epoch": 2220} {"train_loss": -11.78785228729248, "global_step": 373073, "epoch": 2220} {"train_loss": -11.751775741577148, "global_step": 373074, "epoch": 2220} {"train_loss": -11.593708992004395, "global_step": 373075, "epoch": 2220} {"train_loss": -11.904125213623047, "global_step": 373076, "epoch": 2220} {"train_loss": -12.018863677978516, "global_step": 373077, "epoch": 2220} {"train_loss": -11.713360786437988, "global_step": 373078, "epoch": 2220} {"train_loss": -12.010899543762207, "global_step": 373079, "epoch": 2220} {"train_loss": -11.87744140625, "global_step": 373080, "epoch": 2220} {"train_loss": -11.767663955688477, "global_step": 373081, "epoch": 2220} {"train_loss": -11.815017700195312, "global_step": 373082, "epoch": 2220} {"train_loss": -11.891496658325195, "global_step": 373083, "epoch": 2220} {"train_loss": -12.135595321655273, "global_step": 373084, "epoch": 2220} {"train_loss": -12.079963684082031, "global_step": 373085, "epoch": 2220} {"train_loss": -12.235838890075684, "global_step": 373086, "epoch": 2220} {"train_loss": -12.041574478149414, "global_step": 373087, "epoch": 2220} {"train_loss": -12.312198638916016, "global_step": 373088, "epoch": 2220} {"train_loss": -12.057762145996094, "global_step": 373089, "epoch": 2220} {"train_loss": -12.103008270263672, "global_step": 373090, "epoch": 2220} {"train_loss": -11.948690414428711, "global_step": 373091, "epoch": 2220} {"train_loss": -12.141966819763184, "global_step": 373092, "epoch": 2220} {"train_loss": -12.053542137145996, "global_step": 373093, "epoch": 2220} {"train_loss": -12.088494300842285, "global_step": 373094, "epoch": 2220} {"train_loss": -12.373346328735352, "global_step": 373095, "epoch": 2220} {"train_loss": -12.210744857788086, "global_step": 373096, "epoch": 2220} {"train_loss": -12.345197677612305, "global_step": 373097, "epoch": 2220} {"train_loss": -12.255288124084473, "global_step": 373098, "epoch": 2220} {"train_loss": -12.347087860107422, "global_step": 373099, "epoch": 2220} {"train_loss": -12.261124610900879, "global_step": 373100, "epoch": 2220} {"train_loss": -12.304712295532227, "global_step": 373101, "epoch": 2220} {"train_loss": -12.455060958862305, "global_step": 373102, "epoch": 2220} {"train_loss": -12.262022972106934, "global_step": 373103, "epoch": 2220} {"train_loss": -12.45185661315918, "global_step": 373104, "epoch": 2220} {"train_loss": -12.452432632446289, "global_step": 373105, "epoch": 2220} {"train_loss": -12.36562728881836, "global_step": 373106, "epoch": 2220} {"train_loss": -12.549874305725098, "global_step": 373107, "epoch": 2220} {"train_loss": -12.419408798217773, "global_step": 373108, "epoch": 2220} {"train_loss": -12.32519817352295, "global_step": 373109, "epoch": 2220} {"train_loss": -12.562389373779297, "global_step": 373110, "epoch": 2220} {"train_loss": -12.361639022827148, "global_step": 373111, "epoch": 2220} {"train_loss": -12.455620765686035, "global_step": 373112, "epoch": 2220} {"train_loss": -12.375288009643555, "global_step": 373113, "epoch": 2220} {"train_loss": -12.330945014953613, "global_step": 373114, "epoch": 2220} {"train_loss": -12.47165298461914, "global_step": 373115, "epoch": 2220} {"train_loss": -12.441011428833008, "global_step": 373116, "epoch": 2220} {"train_loss": -12.453588485717773, "global_step": 373117, "epoch": 2220} {"train_loss": -12.598875045776367, "global_step": 373118, "epoch": 2220} {"train_loss": -12.572627067565918, "global_step": 373119, "epoch": 2220} {"train_loss": -12.462793350219727, "global_step": 373120, "epoch": 2220} {"train_loss": -12.506729125976562, "global_step": 373121, "epoch": 2220} {"train_loss": -12.50093936920166, "global_step": 373122, "epoch": 2220} {"train_loss": -12.452018737792969, "global_step": 373123, "epoch": 2220} {"train_loss": -12.400943756103516, "global_step": 373124, "epoch": 2220} {"train_loss": -12.644767761230469, "global_step": 373125, "epoch": 2220} {"train_loss": -12.507402420043945, "global_step": 373126, "epoch": 2220} {"train_loss": -11.647326188428062, "global_step": 373127, "epoch": 2220, "val_loss": 288440.34375, "train_action_mse_error": 0.3284232020378113} {"train_loss": -12.529322624206543, "global_step": 373128, "epoch": 2221} {"train_loss": -12.70442008972168, "global_step": 373129, "epoch": 2221} {"train_loss": -12.53355598449707, "global_step": 373130, "epoch": 2221} {"train_loss": -12.624055862426758, "global_step": 373131, "epoch": 2221} {"train_loss": -12.588898658752441, "global_step": 373132, "epoch": 2221} {"train_loss": -12.615819931030273, "global_step": 373133, "epoch": 2221} {"train_loss": -12.643007278442383, "global_step": 373134, "epoch": 2221} {"train_loss": -12.621307373046875, "global_step": 373135, "epoch": 2221} {"train_loss": -12.5772705078125, "global_step": 373136, "epoch": 2221} {"train_loss": -12.65690803527832, "global_step": 373137, "epoch": 2221} {"train_loss": -12.40843391418457, "global_step": 373138, "epoch": 2221} {"train_loss": -12.375884056091309, "global_step": 373139, "epoch": 2221} {"train_loss": -12.672118186950684, "global_step": 373140, "epoch": 2221} {"train_loss": -12.662490844726562, "global_step": 373141, "epoch": 2221} {"train_loss": -12.679498672485352, "global_step": 373142, "epoch": 2221} {"train_loss": -12.709951400756836, "global_step": 373143, "epoch": 2221} {"train_loss": -12.88888168334961, "global_step": 373144, "epoch": 2221} {"train_loss": -12.500656127929688, "global_step": 373145, "epoch": 2221} {"train_loss": -12.63978385925293, "global_step": 373146, "epoch": 2221} {"train_loss": -12.687232971191406, "global_step": 373147, "epoch": 2221} {"train_loss": -12.669340133666992, "global_step": 373148, "epoch": 2221} {"train_loss": -12.843844413757324, "global_step": 373149, "epoch": 2221} {"train_loss": -12.631675720214844, "global_step": 373150, "epoch": 2221} {"train_loss": -12.693607330322266, "global_step": 373151, "epoch": 2221} {"train_loss": -12.85034465789795, "global_step": 373152, "epoch": 2221} {"train_loss": -12.344686508178711, "global_step": 373153, "epoch": 2221} {"train_loss": -12.638304710388184, "global_step": 373154, "epoch": 2221} {"train_loss": -12.65165901184082, "global_step": 373155, "epoch": 2221} {"train_loss": -12.510641098022461, "global_step": 373156, "epoch": 2221} {"train_loss": -12.428376197814941, "global_step": 373157, "epoch": 2221} {"train_loss": -12.715002059936523, "global_step": 373158, "epoch": 2221} {"train_loss": -12.299485206604004, "global_step": 373159, "epoch": 2221} {"train_loss": -12.372735023498535, "global_step": 373160, "epoch": 2221} {"train_loss": -12.671239852905273, "global_step": 373161, "epoch": 2221} {"train_loss": -12.51239013671875, "global_step": 373162, "epoch": 2221} {"train_loss": -11.192895889282227, "global_step": 373163, "epoch": 2221} {"train_loss": -12.072625160217285, "global_step": 373164, "epoch": 2221} {"train_loss": -12.780421257019043, "global_step": 373165, "epoch": 2221} {"train_loss": -12.138620376586914, "global_step": 373166, "epoch": 2221} {"train_loss": -12.393830299377441, "global_step": 373167, "epoch": 2221} {"train_loss": -12.505693435668945, "global_step": 373168, "epoch": 2221} {"train_loss": -12.478687286376953, "global_step": 373169, "epoch": 2221} {"train_loss": -12.212667465209961, "global_step": 373170, "epoch": 2221} {"train_loss": -12.389473915100098, "global_step": 373171, "epoch": 2221} {"train_loss": -11.741242408752441, "global_step": 373172, "epoch": 2221} {"train_loss": -10.504301071166992, "global_step": 373173, "epoch": 2221} {"train_loss": -11.341135025024414, "global_step": 373174, "epoch": 2221} {"train_loss": -10.346515655517578, "global_step": 373175, "epoch": 2221} {"train_loss": -8.77796745300293, "global_step": 373176, "epoch": 2221} {"train_loss": -7.5109429359436035, "global_step": 373177, "epoch": 2221} {"train_loss": -6.78212833404541, "global_step": 373178, "epoch": 2221} {"train_loss": -8.264610290527344, "global_step": 373179, "epoch": 2221} {"train_loss": -7.714468479156494, "global_step": 373180, "epoch": 2221} {"train_loss": -8.740299224853516, "global_step": 373181, "epoch": 2221} {"train_loss": -8.320924758911133, "global_step": 373182, "epoch": 2221} {"train_loss": -7.778932571411133, "global_step": 373183, "epoch": 2221} {"train_loss": -9.026445388793945, "global_step": 373184, "epoch": 2221} {"train_loss": -8.932737350463867, "global_step": 373185, "epoch": 2221} {"train_loss": -7.764619827270508, "global_step": 373186, "epoch": 2221} {"train_loss": -8.460660934448242, "global_step": 373187, "epoch": 2221} {"train_loss": -9.820741653442383, "global_step": 373188, "epoch": 2221} {"train_loss": -9.022758483886719, "global_step": 373189, "epoch": 2221} {"train_loss": -10.267891883850098, "global_step": 373190, "epoch": 2221} {"train_loss": -8.024565696716309, "global_step": 373191, "epoch": 2221} {"train_loss": -9.708935737609863, "global_step": 373192, "epoch": 2221} {"train_loss": -8.720413208007812, "global_step": 373193, "epoch": 2221} {"train_loss": -10.097423553466797, "global_step": 373194, "epoch": 2221} {"train_loss": -9.303620338439941, "global_step": 373195, "epoch": 2221} {"train_loss": -8.678096771240234, "global_step": 373196, "epoch": 2221} {"train_loss": -9.68789291381836, "global_step": 373197, "epoch": 2221} {"train_loss": -11.116863250732422, "global_step": 373198, "epoch": 2221} {"train_loss": -9.863147735595703, "global_step": 373199, "epoch": 2221} {"train_loss": -10.748761177062988, "global_step": 373200, "epoch": 2221} {"train_loss": -10.480323791503906, "global_step": 373201, "epoch": 2221} {"train_loss": -10.700138092041016, "global_step": 373202, "epoch": 2221} {"train_loss": -11.339395523071289, "global_step": 373203, "epoch": 2221} {"train_loss": -11.040412902832031, "global_step": 373204, "epoch": 2221} {"train_loss": -11.048768997192383, "global_step": 373205, "epoch": 2221} {"train_loss": -11.219348907470703, "global_step": 373206, "epoch": 2221} {"train_loss": -11.147409439086914, "global_step": 373207, "epoch": 2221} {"train_loss": -10.5665283203125, "global_step": 373208, "epoch": 2221} {"train_loss": -11.070056915283203, "global_step": 373209, "epoch": 2221} {"train_loss": -11.013148307800293, "global_step": 373210, "epoch": 2221} {"train_loss": -11.382503509521484, "global_step": 373211, "epoch": 2221} {"train_loss": -11.330531120300293, "global_step": 373212, "epoch": 2221} {"train_loss": -11.689599990844727, "global_step": 373213, "epoch": 2221} {"train_loss": -11.272684097290039, "global_step": 373214, "epoch": 2221} {"train_loss": -11.760369300842285, "global_step": 373215, "epoch": 2221} {"train_loss": -11.18133544921875, "global_step": 373216, "epoch": 2221} {"train_loss": -11.435834884643555, "global_step": 373217, "epoch": 2221} {"train_loss": -11.686187744140625, "global_step": 373218, "epoch": 2221} {"train_loss": -11.26181411743164, "global_step": 373219, "epoch": 2221} {"train_loss": -11.010326385498047, "global_step": 373220, "epoch": 2221} {"train_loss": -10.990639686584473, "global_step": 373221, "epoch": 2221} {"train_loss": -10.96249008178711, "global_step": 373222, "epoch": 2221} {"train_loss": -11.5687894821167, "global_step": 373223, "epoch": 2221} {"train_loss": -11.260955810546875, "global_step": 373224, "epoch": 2221} {"train_loss": -11.267504692077637, "global_step": 373225, "epoch": 2221} {"train_loss": -11.172821044921875, "global_step": 373226, "epoch": 2221} {"train_loss": -11.55291748046875, "global_step": 373227, "epoch": 2221} {"train_loss": -11.466165542602539, "global_step": 373228, "epoch": 2221} {"train_loss": -11.523921966552734, "global_step": 373229, "epoch": 2221} {"train_loss": -11.528921127319336, "global_step": 373230, "epoch": 2221} {"train_loss": -11.539685249328613, "global_step": 373231, "epoch": 2221} {"train_loss": -11.299903869628906, "global_step": 373232, "epoch": 2221} {"train_loss": -12.056411743164062, "global_step": 373233, "epoch": 2221} {"train_loss": -11.284481048583984, "global_step": 373234, "epoch": 2221} {"train_loss": -11.826323509216309, "global_step": 373235, "epoch": 2221} {"train_loss": -11.951635360717773, "global_step": 373236, "epoch": 2221} {"train_loss": -11.633845329284668, "global_step": 373237, "epoch": 2221} {"train_loss": -12.127689361572266, "global_step": 373238, "epoch": 2221} {"train_loss": -11.605466842651367, "global_step": 373239, "epoch": 2221} {"train_loss": -11.911828994750977, "global_step": 373240, "epoch": 2221} {"train_loss": -11.595760345458984, "global_step": 373241, "epoch": 2221} {"train_loss": -11.875558853149414, "global_step": 373242, "epoch": 2221} {"train_loss": -12.053851127624512, "global_step": 373243, "epoch": 2221} {"train_loss": -11.551004409790039, "global_step": 373244, "epoch": 2221} {"train_loss": -12.132555961608887, "global_step": 373245, "epoch": 2221} {"train_loss": -11.729480743408203, "global_step": 373246, "epoch": 2221} {"train_loss": -12.062811851501465, "global_step": 373247, "epoch": 2221} {"train_loss": -12.26217269897461, "global_step": 373248, "epoch": 2221} {"train_loss": -11.918632507324219, "global_step": 373249, "epoch": 2221} {"train_loss": -12.113808631896973, "global_step": 373250, "epoch": 2221} {"train_loss": -12.14168930053711, "global_step": 373251, "epoch": 2221} {"train_loss": -12.231246948242188, "global_step": 373252, "epoch": 2221} {"train_loss": -12.018539428710938, "global_step": 373253, "epoch": 2221} {"train_loss": -12.087879180908203, "global_step": 373254, "epoch": 2221} {"train_loss": -12.472439765930176, "global_step": 373255, "epoch": 2221} {"train_loss": -12.309125900268555, "global_step": 373256, "epoch": 2221} {"train_loss": -12.206445693969727, "global_step": 373257, "epoch": 2221} {"train_loss": -12.284477233886719, "global_step": 373258, "epoch": 2221} {"train_loss": -12.124645233154297, "global_step": 373259, "epoch": 2221} {"train_loss": -12.453563690185547, "global_step": 373260, "epoch": 2221} {"train_loss": -12.093162536621094, "global_step": 373261, "epoch": 2221} {"train_loss": -12.225580215454102, "global_step": 373262, "epoch": 2221} {"train_loss": -12.54625129699707, "global_step": 373263, "epoch": 2221} {"train_loss": -12.22031021118164, "global_step": 373264, "epoch": 2221} {"train_loss": -12.293628692626953, "global_step": 373265, "epoch": 2221} {"train_loss": -11.884740829467773, "global_step": 373266, "epoch": 2221} {"train_loss": -12.258247375488281, "global_step": 373267, "epoch": 2221} {"train_loss": -12.11634635925293, "global_step": 373268, "epoch": 2221} {"train_loss": -12.282937049865723, "global_step": 373269, "epoch": 2221} {"train_loss": -12.422258377075195, "global_step": 373270, "epoch": 2221} {"train_loss": -12.22929573059082, "global_step": 373271, "epoch": 2221} {"train_loss": -12.09088134765625, "global_step": 373272, "epoch": 2221} {"train_loss": -12.427571296691895, "global_step": 373273, "epoch": 2221} {"train_loss": -12.348335266113281, "global_step": 373274, "epoch": 2221} {"train_loss": -12.353811264038086, "global_step": 373275, "epoch": 2221} {"train_loss": -12.348305702209473, "global_step": 373276, "epoch": 2221} {"train_loss": -12.470247268676758, "global_step": 373277, "epoch": 2221} {"train_loss": -12.412890434265137, "global_step": 373278, "epoch": 2221} {"train_loss": -12.422893524169922, "global_step": 373279, "epoch": 2221} {"train_loss": -12.596200942993164, "global_step": 373280, "epoch": 2221} {"train_loss": -12.365574836730957, "global_step": 373281, "epoch": 2221} {"train_loss": -12.525160789489746, "global_step": 373282, "epoch": 2221} {"train_loss": -12.376118659973145, "global_step": 373283, "epoch": 2221} {"train_loss": -12.222890853881836, "global_step": 373284, "epoch": 2221} {"train_loss": -12.520523071289062, "global_step": 373285, "epoch": 2221} {"train_loss": -12.370047569274902, "global_step": 373286, "epoch": 2221} {"train_loss": -12.648405075073242, "global_step": 373287, "epoch": 2221} {"train_loss": -12.475979804992676, "global_step": 373288, "epoch": 2221} {"train_loss": -12.366556167602539, "global_step": 373289, "epoch": 2221} {"train_loss": -12.665205001831055, "global_step": 373290, "epoch": 2221} {"train_loss": -12.590324401855469, "global_step": 373291, "epoch": 2221} {"train_loss": -12.67064094543457, "global_step": 373292, "epoch": 2221} {"train_loss": -12.52142333984375, "global_step": 373293, "epoch": 2221} {"train_loss": -12.676647186279297, "global_step": 373294, "epoch": 2221} {"train_loss": -11.595511379696074, "global_step": 373295, "epoch": 2221, "val_loss": 292155.28125} {"train_loss": -12.598431587219238, "global_step": 373296, "epoch": 2222} {"train_loss": -12.611221313476562, "global_step": 373297, "epoch": 2222} {"train_loss": -12.721710205078125, "global_step": 373298, "epoch": 2222} {"train_loss": -12.452698707580566, "global_step": 373299, "epoch": 2222} {"train_loss": -12.766613006591797, "global_step": 373300, "epoch": 2222} {"train_loss": -12.730551719665527, "global_step": 373301, "epoch": 2222} {"train_loss": -12.755685806274414, "global_step": 373302, "epoch": 2222} {"train_loss": -12.62470817565918, "global_step": 373303, "epoch": 2222} {"train_loss": -12.622081756591797, "global_step": 373304, "epoch": 2222} {"train_loss": -12.631893157958984, "global_step": 373305, "epoch": 2222} {"train_loss": -12.79716968536377, "global_step": 373306, "epoch": 2222} {"train_loss": -12.596332550048828, "global_step": 373307, "epoch": 2222} {"train_loss": -12.735875129699707, "global_step": 373308, "epoch": 2222} {"train_loss": -12.600578308105469, "global_step": 373309, "epoch": 2222} {"train_loss": -12.488537788391113, "global_step": 373310, "epoch": 2222} {"train_loss": -12.54012680053711, "global_step": 373311, "epoch": 2222} {"train_loss": -12.339849472045898, "global_step": 373312, "epoch": 2222} {"train_loss": -12.28575611114502, "global_step": 373313, "epoch": 2222} {"train_loss": -12.53692626953125, "global_step": 373314, "epoch": 2222} {"train_loss": -12.55546760559082, "global_step": 373315, "epoch": 2222} {"train_loss": -12.234079360961914, "global_step": 373316, "epoch": 2222} {"train_loss": -12.300146102905273, "global_step": 373317, "epoch": 2222} {"train_loss": -12.41956901550293, "global_step": 373318, "epoch": 2222} {"train_loss": -12.462223052978516, "global_step": 373319, "epoch": 2222} {"train_loss": -12.602581024169922, "global_step": 373320, "epoch": 2222} {"train_loss": -12.453353881835938, "global_step": 373321, "epoch": 2222} {"train_loss": -12.424042701721191, "global_step": 373322, "epoch": 2222} {"train_loss": -12.570165634155273, "global_step": 373323, "epoch": 2222} {"train_loss": -12.695230484008789, "global_step": 373324, "epoch": 2222} {"train_loss": -12.566261291503906, "global_step": 373325, "epoch": 2222} {"train_loss": -12.845768928527832, "global_step": 373326, "epoch": 2222} {"train_loss": -12.60947322845459, "global_step": 373327, "epoch": 2222} {"train_loss": -12.719704627990723, "global_step": 373328, "epoch": 2222} {"train_loss": -12.453981399536133, "global_step": 373329, "epoch": 2222} {"train_loss": -12.646976470947266, "global_step": 373330, "epoch": 2222} {"train_loss": -12.626304626464844, "global_step": 373331, "epoch": 2222} {"train_loss": -12.012157440185547, "global_step": 373332, "epoch": 2222} {"train_loss": -11.807857513427734, "global_step": 373333, "epoch": 2222} {"train_loss": -12.105729103088379, "global_step": 373334, "epoch": 2222} {"train_loss": -12.07588005065918, "global_step": 373335, "epoch": 2222} {"train_loss": -12.075932502746582, "global_step": 373336, "epoch": 2222} {"train_loss": -12.607914924621582, "global_step": 373337, "epoch": 2222} {"train_loss": -11.447406768798828, "global_step": 373338, "epoch": 2222} {"train_loss": -11.288642883300781, "global_step": 373339, "epoch": 2222} {"train_loss": -12.065911293029785, "global_step": 373340, "epoch": 2222} {"train_loss": -12.12299919128418, "global_step": 373341, "epoch": 2222} {"train_loss": -11.603931427001953, "global_step": 373342, "epoch": 2222} {"train_loss": -12.03286361694336, "global_step": 373343, "epoch": 2222} {"train_loss": -11.40216064453125, "global_step": 373344, "epoch": 2222} {"train_loss": -11.562774658203125, "global_step": 373345, "epoch": 2222} {"train_loss": -12.136906623840332, "global_step": 373346, "epoch": 2222} {"train_loss": -10.1127347946167, "global_step": 373347, "epoch": 2222} {"train_loss": -11.575992584228516, "global_step": 373348, "epoch": 2222} {"train_loss": -12.385943412780762, "global_step": 373349, "epoch": 2222} {"train_loss": -10.86751651763916, "global_step": 373350, "epoch": 2222} {"train_loss": -11.977985382080078, "global_step": 373351, "epoch": 2222} {"train_loss": -12.178412437438965, "global_step": 373352, "epoch": 2222} {"train_loss": -10.746273040771484, "global_step": 373353, "epoch": 2222} {"train_loss": -12.366266250610352, "global_step": 373354, "epoch": 2222} {"train_loss": -11.538093566894531, "global_step": 373355, "epoch": 2222} {"train_loss": -11.88326358795166, "global_step": 373356, "epoch": 2222} {"train_loss": -12.165552139282227, "global_step": 373357, "epoch": 2222} {"train_loss": -12.008240699768066, "global_step": 373358, "epoch": 2222} {"train_loss": -11.862579345703125, "global_step": 373359, "epoch": 2222} {"train_loss": -12.05616569519043, "global_step": 373360, "epoch": 2222} {"train_loss": -10.692129135131836, "global_step": 373361, "epoch": 2222} {"train_loss": -11.973980903625488, "global_step": 373362, "epoch": 2222} {"train_loss": -12.245194435119629, "global_step": 373363, "epoch": 2222} {"train_loss": -10.259705543518066, "global_step": 373364, "epoch": 2222} {"train_loss": -10.543304443359375, "global_step": 373365, "epoch": 2222} {"train_loss": -11.885302543640137, "global_step": 373366, "epoch": 2222} {"train_loss": -10.884218215942383, "global_step": 373367, "epoch": 2222} {"train_loss": -10.736324310302734, "global_step": 373368, "epoch": 2222} {"train_loss": -11.662334442138672, "global_step": 373369, "epoch": 2222} {"train_loss": -12.004194259643555, "global_step": 373370, "epoch": 2222} {"train_loss": -11.727141380310059, "global_step": 373371, "epoch": 2222} {"train_loss": -12.229073524475098, "global_step": 373372, "epoch": 2222} {"train_loss": -11.91696548461914, "global_step": 373373, "epoch": 2222} {"train_loss": -11.983068466186523, "global_step": 373374, "epoch": 2222} {"train_loss": -12.031742095947266, "global_step": 373375, "epoch": 2222} {"train_loss": -12.402571678161621, "global_step": 373376, "epoch": 2222} {"train_loss": -12.276350021362305, "global_step": 373377, "epoch": 2222} {"train_loss": -12.382564544677734, "global_step": 373378, "epoch": 2222} {"train_loss": -12.387092590332031, "global_step": 373379, "epoch": 2222} {"train_loss": -12.46794319152832, "global_step": 373380, "epoch": 2222} {"train_loss": -12.521484375, "global_step": 373381, "epoch": 2222} {"train_loss": -12.427364349365234, "global_step": 373382, "epoch": 2222} {"train_loss": -12.319780349731445, "global_step": 373383, "epoch": 2222} {"train_loss": -12.266594886779785, "global_step": 373384, "epoch": 2222} {"train_loss": -12.465534210205078, "global_step": 373385, "epoch": 2222} {"train_loss": -12.725120544433594, "global_step": 373386, "epoch": 2222} {"train_loss": -12.438993453979492, "global_step": 373387, "epoch": 2222} {"train_loss": -12.609668731689453, "global_step": 373388, "epoch": 2222} {"train_loss": -12.462133407592773, "global_step": 373389, "epoch": 2222} {"train_loss": -12.637100219726562, "global_step": 373390, "epoch": 2222} {"train_loss": -12.466485023498535, "global_step": 373391, "epoch": 2222} {"train_loss": -12.574237823486328, "global_step": 373392, "epoch": 2222} {"train_loss": -12.557302474975586, "global_step": 373393, "epoch": 2222} {"train_loss": -12.622465133666992, "global_step": 373394, "epoch": 2222} {"train_loss": -12.660528182983398, "global_step": 373395, "epoch": 2222} {"train_loss": -12.535467147827148, "global_step": 373396, "epoch": 2222} {"train_loss": -12.683273315429688, "global_step": 373397, "epoch": 2222} {"train_loss": -12.598306655883789, "global_step": 373398, "epoch": 2222} {"train_loss": -12.629670143127441, "global_step": 373399, "epoch": 2222} {"train_loss": -12.576326370239258, "global_step": 373400, "epoch": 2222} {"train_loss": -12.625472068786621, "global_step": 373401, "epoch": 2222} {"train_loss": -12.769861221313477, "global_step": 373402, "epoch": 2222} {"train_loss": -12.387939453125, "global_step": 373403, "epoch": 2222} {"train_loss": -12.608915328979492, "global_step": 373404, "epoch": 2222} {"train_loss": -12.806640625, "global_step": 373405, "epoch": 2222} {"train_loss": -12.709630012512207, "global_step": 373406, "epoch": 2222} {"train_loss": -12.537378311157227, "global_step": 373407, "epoch": 2222} {"train_loss": -12.594758033752441, "global_step": 373408, "epoch": 2222} {"train_loss": -12.549013137817383, "global_step": 373409, "epoch": 2222} {"train_loss": -12.634069442749023, "global_step": 373410, "epoch": 2222} {"train_loss": -12.579957962036133, "global_step": 373411, "epoch": 2222} {"train_loss": -12.481009483337402, "global_step": 373412, "epoch": 2222} {"train_loss": -12.747546195983887, "global_step": 373413, "epoch": 2222} {"train_loss": -12.580257415771484, "global_step": 373414, "epoch": 2222} {"train_loss": -12.741679191589355, "global_step": 373415, "epoch": 2222} {"train_loss": -12.621515274047852, "global_step": 373416, "epoch": 2222} {"train_loss": -12.505302429199219, "global_step": 373417, "epoch": 2222} {"train_loss": -12.35445499420166, "global_step": 373418, "epoch": 2222} {"train_loss": -12.41504955291748, "global_step": 373419, "epoch": 2222} {"train_loss": -12.879781723022461, "global_step": 373420, "epoch": 2222} {"train_loss": -12.673619270324707, "global_step": 373421, "epoch": 2222} {"train_loss": -12.168126106262207, "global_step": 373422, "epoch": 2222} {"train_loss": -12.512417793273926, "global_step": 373423, "epoch": 2222} {"train_loss": -12.42904281616211, "global_step": 373424, "epoch": 2222} {"train_loss": -12.539594650268555, "global_step": 373425, "epoch": 2222} {"train_loss": -12.376115798950195, "global_step": 373426, "epoch": 2222} {"train_loss": -12.59886360168457, "global_step": 373427, "epoch": 2222} {"train_loss": -12.342321395874023, "global_step": 373428, "epoch": 2222} {"train_loss": -12.271485328674316, "global_step": 373429, "epoch": 2222} {"train_loss": -12.493606567382812, "global_step": 373430, "epoch": 2222} {"train_loss": -11.807881355285645, "global_step": 373431, "epoch": 2222} {"train_loss": -12.020000457763672, "global_step": 373432, "epoch": 2222} {"train_loss": -12.285174369812012, "global_step": 373433, "epoch": 2222} {"train_loss": -12.391182899475098, "global_step": 373434, "epoch": 2222} {"train_loss": -12.165099143981934, "global_step": 373435, "epoch": 2222} {"train_loss": -12.596762657165527, "global_step": 373436, "epoch": 2222} {"train_loss": -11.233518600463867, "global_step": 373437, "epoch": 2222} {"train_loss": -10.452890396118164, "global_step": 373438, "epoch": 2222} {"train_loss": -10.844193458557129, "global_step": 373439, "epoch": 2222} {"train_loss": -11.085575103759766, "global_step": 373440, "epoch": 2222} {"train_loss": -7.051990509033203, "global_step": 373441, "epoch": 2222} {"train_loss": -7.115118026733398, "global_step": 373442, "epoch": 2222} {"train_loss": -7.2744855880737305, "global_step": 373443, "epoch": 2222} {"train_loss": -6.508632183074951, "global_step": 373444, "epoch": 2222} {"train_loss": -7.525461196899414, "global_step": 373445, "epoch": 2222} {"train_loss": -7.674165725708008, "global_step": 373446, "epoch": 2222} {"train_loss": -7.545328617095947, "global_step": 373447, "epoch": 2222} {"train_loss": -8.78768539428711, "global_step": 373448, "epoch": 2222} {"train_loss": -7.758965492248535, "global_step": 373449, "epoch": 2222} {"train_loss": -7.659173011779785, "global_step": 373450, "epoch": 2222} {"train_loss": -8.111747741699219, "global_step": 373451, "epoch": 2222} {"train_loss": -7.752608299255371, "global_step": 373452, "epoch": 2222} {"train_loss": -8.816732406616211, "global_step": 373453, "epoch": 2222} {"train_loss": -8.116537094116211, "global_step": 373454, "epoch": 2222} {"train_loss": -8.12502670288086, "global_step": 373455, "epoch": 2222} {"train_loss": -8.630440711975098, "global_step": 373456, "epoch": 2222} {"train_loss": -8.523390769958496, "global_step": 373457, "epoch": 2222} {"train_loss": -10.16455078125, "global_step": 373458, "epoch": 2222} {"train_loss": -8.879743576049805, "global_step": 373459, "epoch": 2222} {"train_loss": -9.593208312988281, "global_step": 373460, "epoch": 2222} {"train_loss": -10.096491813659668, "global_step": 373461, "epoch": 2222} {"train_loss": -9.356101989746094, "global_step": 373462, "epoch": 2222} {"train_loss": -11.698890958513532, "global_step": 373463, "epoch": 2222, "val_loss": 290628.9375} {"train_loss": -9.80958366394043, "global_step": 373464, "epoch": 2223} {"train_loss": -9.729303359985352, "global_step": 373465, "epoch": 2223} {"train_loss": -10.302274703979492, "global_step": 373466, "epoch": 2223} {"train_loss": -9.997342109680176, "global_step": 373467, "epoch": 2223} {"train_loss": -10.395844459533691, "global_step": 373468, "epoch": 2223} {"train_loss": -11.566451072692871, "global_step": 373469, "epoch": 2223} {"train_loss": -11.059078216552734, "global_step": 373470, "epoch": 2223} {"train_loss": -11.791954040527344, "global_step": 373471, "epoch": 2223} {"train_loss": -11.476236343383789, "global_step": 373472, "epoch": 2223} {"train_loss": -11.201302528381348, "global_step": 373473, "epoch": 2223} {"train_loss": -11.422433853149414, "global_step": 373474, "epoch": 2223} {"train_loss": -11.869010925292969, "global_step": 373475, "epoch": 2223} {"train_loss": -11.293961524963379, "global_step": 373476, "epoch": 2223} {"train_loss": -11.595808029174805, "global_step": 373477, "epoch": 2223} {"train_loss": -11.285492897033691, "global_step": 373478, "epoch": 2223} {"train_loss": -11.691717147827148, "global_step": 373479, "epoch": 2223} {"train_loss": -11.551355361938477, "global_step": 373480, "epoch": 2223} {"train_loss": -11.798465728759766, "global_step": 373481, "epoch": 2223} {"train_loss": -11.947613716125488, "global_step": 373482, "epoch": 2223} {"train_loss": -11.757545471191406, "global_step": 373483, "epoch": 2223} {"train_loss": -11.88119125366211, "global_step": 373484, "epoch": 2223} {"train_loss": -12.132174491882324, "global_step": 373485, "epoch": 2223} {"train_loss": -11.942113876342773, "global_step": 373486, "epoch": 2223} {"train_loss": -12.188457489013672, "global_step": 373487, "epoch": 2223} {"train_loss": -11.986479759216309, "global_step": 373488, "epoch": 2223} {"train_loss": -12.487040519714355, "global_step": 373489, "epoch": 2223} {"train_loss": -12.15017318725586, "global_step": 373490, "epoch": 2223} {"train_loss": -12.088990211486816, "global_step": 373491, "epoch": 2223} {"train_loss": -12.064191818237305, "global_step": 373492, "epoch": 2223} {"train_loss": -12.253908157348633, "global_step": 373493, "epoch": 2223} {"train_loss": -12.206390380859375, "global_step": 373494, "epoch": 2223} {"train_loss": -12.239171981811523, "global_step": 373495, "epoch": 2223} {"train_loss": -12.080205917358398, "global_step": 373496, "epoch": 2223} {"train_loss": -12.217662811279297, "global_step": 373497, "epoch": 2223} {"train_loss": -12.267440795898438, "global_step": 373498, "epoch": 2223} {"train_loss": -12.299484252929688, "global_step": 373499, "epoch": 2223} {"train_loss": -12.305658340454102, "global_step": 373500, "epoch": 2223} {"train_loss": -12.332921981811523, "global_step": 373501, "epoch": 2223} {"train_loss": -12.077179908752441, "global_step": 373502, "epoch": 2223} {"train_loss": -12.235201835632324, "global_step": 373503, "epoch": 2223} {"train_loss": -12.511397361755371, "global_step": 373504, "epoch": 2223} {"train_loss": -12.42670726776123, "global_step": 373505, "epoch": 2223} {"train_loss": -12.207014083862305, "global_step": 373506, "epoch": 2223} {"train_loss": -12.620549201965332, "global_step": 373507, "epoch": 2223} {"train_loss": -12.210419654846191, "global_step": 373508, "epoch": 2223} {"train_loss": -12.224876403808594, "global_step": 373509, "epoch": 2223} {"train_loss": -12.391773223876953, "global_step": 373510, "epoch": 2223} {"train_loss": -12.331520080566406, "global_step": 373511, "epoch": 2223} {"train_loss": -12.556203842163086, "global_step": 373512, "epoch": 2223} {"train_loss": -12.406442642211914, "global_step": 373513, "epoch": 2223} {"train_loss": -12.504255294799805, "global_step": 373514, "epoch": 2223} {"train_loss": -12.603921890258789, "global_step": 373515, "epoch": 2223} {"train_loss": -12.393072128295898, "global_step": 373516, "epoch": 2223} {"train_loss": -12.297014236450195, "global_step": 373517, "epoch": 2223} {"train_loss": -12.320398330688477, "global_step": 373518, "epoch": 2223} {"train_loss": -12.540111541748047, "global_step": 373519, "epoch": 2223} {"train_loss": -12.472663879394531, "global_step": 373520, "epoch": 2223} {"train_loss": -12.249778747558594, "global_step": 373521, "epoch": 2223} {"train_loss": -12.55064582824707, "global_step": 373522, "epoch": 2223} {"train_loss": -12.577274322509766, "global_step": 373523, "epoch": 2223} {"train_loss": -12.450298309326172, "global_step": 373524, "epoch": 2223} {"train_loss": -12.758220672607422, "global_step": 373525, "epoch": 2223} {"train_loss": -12.6417236328125, "global_step": 373526, "epoch": 2223} {"train_loss": -12.352720260620117, "global_step": 373527, "epoch": 2223} {"train_loss": -12.600452423095703, "global_step": 373528, "epoch": 2223} {"train_loss": -12.347664833068848, "global_step": 373529, "epoch": 2223} {"train_loss": -12.533556938171387, "global_step": 373530, "epoch": 2223} {"train_loss": -12.518769264221191, "global_step": 373531, "epoch": 2223} {"train_loss": -12.73934555053711, "global_step": 373532, "epoch": 2223} {"train_loss": -12.484764099121094, "global_step": 373533, "epoch": 2223} {"train_loss": -12.643474578857422, "global_step": 373534, "epoch": 2223} {"train_loss": -11.359286308288574, "global_step": 373535, "epoch": 2223} {"train_loss": -11.634109497070312, "global_step": 373536, "epoch": 2223} {"train_loss": -11.849874496459961, "global_step": 373537, "epoch": 2223} {"train_loss": -12.555654525756836, "global_step": 373538, "epoch": 2223} {"train_loss": -12.522976875305176, "global_step": 373539, "epoch": 2223} {"train_loss": -12.464823722839355, "global_step": 373540, "epoch": 2223} {"train_loss": -12.201557159423828, "global_step": 373541, "epoch": 2223} {"train_loss": -12.187578201293945, "global_step": 373542, "epoch": 2223} {"train_loss": -12.302183151245117, "global_step": 373543, "epoch": 2223} {"train_loss": -12.352859497070312, "global_step": 373544, "epoch": 2223} {"train_loss": -12.368684768676758, "global_step": 373545, "epoch": 2223} {"train_loss": -12.741582870483398, "global_step": 373546, "epoch": 2223} {"train_loss": -11.937515258789062, "global_step": 373547, "epoch": 2223} {"train_loss": -11.925443649291992, "global_step": 373548, "epoch": 2223} {"train_loss": -12.062009811401367, "global_step": 373549, "epoch": 2223} {"train_loss": -12.669837951660156, "global_step": 373550, "epoch": 2223} {"train_loss": -12.31714153289795, "global_step": 373551, "epoch": 2223} {"train_loss": -12.576797485351562, "global_step": 373552, "epoch": 2223} {"train_loss": -12.517990112304688, "global_step": 373553, "epoch": 2223} {"train_loss": -12.12346363067627, "global_step": 373554, "epoch": 2223} {"train_loss": -12.425677299499512, "global_step": 373555, "epoch": 2223} {"train_loss": -11.874284744262695, "global_step": 373556, "epoch": 2223} {"train_loss": -11.455110549926758, "global_step": 373557, "epoch": 2223} {"train_loss": -12.177661895751953, "global_step": 373558, "epoch": 2223} {"train_loss": -11.92631721496582, "global_step": 373559, "epoch": 2223} {"train_loss": -11.46074104309082, "global_step": 373560, "epoch": 2223} {"train_loss": -11.349175453186035, "global_step": 373561, "epoch": 2223} {"train_loss": -12.090538024902344, "global_step": 373562, "epoch": 2223} {"train_loss": -11.198675155639648, "global_step": 373563, "epoch": 2223} {"train_loss": -12.341585159301758, "global_step": 373564, "epoch": 2223} {"train_loss": -11.784276962280273, "global_step": 373565, "epoch": 2223} {"train_loss": -12.373272895812988, "global_step": 373566, "epoch": 2223} {"train_loss": -11.784120559692383, "global_step": 373567, "epoch": 2223} {"train_loss": -11.38518238067627, "global_step": 373568, "epoch": 2223} {"train_loss": -11.051980972290039, "global_step": 373569, "epoch": 2223} {"train_loss": -12.148754119873047, "global_step": 373570, "epoch": 2223} {"train_loss": -11.047723770141602, "global_step": 373571, "epoch": 2223} {"train_loss": -11.981562614440918, "global_step": 373572, "epoch": 2223} {"train_loss": -11.080747604370117, "global_step": 373573, "epoch": 2223} {"train_loss": -11.371063232421875, "global_step": 373574, "epoch": 2223} {"train_loss": -11.923585891723633, "global_step": 373575, "epoch": 2223} {"train_loss": -10.972084045410156, "global_step": 373576, "epoch": 2223} {"train_loss": -11.42151165008545, "global_step": 373577, "epoch": 2223} {"train_loss": -10.871773719787598, "global_step": 373578, "epoch": 2223} {"train_loss": -10.665748596191406, "global_step": 373579, "epoch": 2223} {"train_loss": -11.942420959472656, "global_step": 373580, "epoch": 2223} {"train_loss": -11.323331832885742, "global_step": 373581, "epoch": 2223} {"train_loss": -11.96364974975586, "global_step": 373582, "epoch": 2223} {"train_loss": -11.730852127075195, "global_step": 373583, "epoch": 2223} {"train_loss": -11.02424430847168, "global_step": 373584, "epoch": 2223} {"train_loss": -11.508500099182129, "global_step": 373585, "epoch": 2223} {"train_loss": -11.779622077941895, "global_step": 373586, "epoch": 2223} {"train_loss": -10.758404731750488, "global_step": 373587, "epoch": 2223} {"train_loss": -11.826369285583496, "global_step": 373588, "epoch": 2223} {"train_loss": -11.70838451385498, "global_step": 373589, "epoch": 2223} {"train_loss": -11.619867324829102, "global_step": 373590, "epoch": 2223} {"train_loss": -11.452672958374023, "global_step": 373591, "epoch": 2223} {"train_loss": -12.219825744628906, "global_step": 373592, "epoch": 2223} {"train_loss": -11.11606216430664, "global_step": 373593, "epoch": 2223} {"train_loss": -12.016831398010254, "global_step": 373594, "epoch": 2223} {"train_loss": -11.108675003051758, "global_step": 373595, "epoch": 2223} {"train_loss": -11.606229782104492, "global_step": 373596, "epoch": 2223} {"train_loss": -12.014592170715332, "global_step": 373597, "epoch": 2223} {"train_loss": -11.58088493347168, "global_step": 373598, "epoch": 2223} {"train_loss": -12.01492691040039, "global_step": 373599, "epoch": 2223} {"train_loss": -11.90516471862793, "global_step": 373600, "epoch": 2223} {"train_loss": -11.702287673950195, "global_step": 373601, "epoch": 2223} {"train_loss": -12.01751708984375, "global_step": 373602, "epoch": 2223} {"train_loss": -12.03404426574707, "global_step": 373603, "epoch": 2223} {"train_loss": -11.59909439086914, "global_step": 373604, "epoch": 2223} {"train_loss": -12.355123519897461, "global_step": 373605, "epoch": 2223} {"train_loss": -11.406651496887207, "global_step": 373606, "epoch": 2223} {"train_loss": -12.326446533203125, "global_step": 373607, "epoch": 2223} {"train_loss": -12.015949249267578, "global_step": 373608, "epoch": 2223} {"train_loss": -12.321855545043945, "global_step": 373609, "epoch": 2223} {"train_loss": -12.077035903930664, "global_step": 373610, "epoch": 2223} {"train_loss": -11.951499938964844, "global_step": 373611, "epoch": 2223} {"train_loss": -11.978515625, "global_step": 373612, "epoch": 2223} {"train_loss": -11.775192260742188, "global_step": 373613, "epoch": 2223} {"train_loss": -12.25948715209961, "global_step": 373614, "epoch": 2223} {"train_loss": -11.65937614440918, "global_step": 373615, "epoch": 2223} {"train_loss": -11.73997688293457, "global_step": 373616, "epoch": 2223} {"train_loss": -11.658201217651367, "global_step": 373617, "epoch": 2223} {"train_loss": -11.918071746826172, "global_step": 373618, "epoch": 2223} {"train_loss": -11.441339492797852, "global_step": 373619, "epoch": 2223} {"train_loss": -11.424680709838867, "global_step": 373620, "epoch": 2223} {"train_loss": -11.425542831420898, "global_step": 373621, "epoch": 2223} {"train_loss": -11.660745620727539, "global_step": 373622, "epoch": 2223} {"train_loss": -11.435447692871094, "global_step": 373623, "epoch": 2223} {"train_loss": -12.131577491760254, "global_step": 373624, "epoch": 2223} {"train_loss": -11.750192642211914, "global_step": 373625, "epoch": 2223} {"train_loss": -11.430048942565918, "global_step": 373626, "epoch": 2223} {"train_loss": -11.347454071044922, "global_step": 373627, "epoch": 2223} {"train_loss": -12.174148559570312, "global_step": 373628, "epoch": 2223} {"train_loss": -10.48481559753418, "global_step": 373629, "epoch": 2223} {"train_loss": -12.150779724121094, "global_step": 373630, "epoch": 2223} {"train_loss": -11.888625508262997, "global_step": 373631, "epoch": 2223, "val_loss": 295284.65625} {"train_loss": -10.897237777709961, "global_step": 373632, "epoch": 2224} {"train_loss": -10.833761215209961, "global_step": 373633, "epoch": 2224} {"train_loss": -11.809234619140625, "global_step": 373634, "epoch": 2224} {"train_loss": -11.562591552734375, "global_step": 373635, "epoch": 2224} {"train_loss": -10.264181137084961, "global_step": 373636, "epoch": 2224} {"train_loss": -11.801288604736328, "global_step": 373637, "epoch": 2224} {"train_loss": -9.316757202148438, "global_step": 373638, "epoch": 2224} {"train_loss": -11.194887161254883, "global_step": 373639, "epoch": 2224} {"train_loss": -10.148234367370605, "global_step": 373640, "epoch": 2224} {"train_loss": -11.058117866516113, "global_step": 373641, "epoch": 2224} {"train_loss": -9.808343887329102, "global_step": 373642, "epoch": 2224} {"train_loss": -11.021095275878906, "global_step": 373643, "epoch": 2224} {"train_loss": -10.383132934570312, "global_step": 373644, "epoch": 2224} {"train_loss": -11.262445449829102, "global_step": 373645, "epoch": 2224} {"train_loss": -10.631141662597656, "global_step": 373646, "epoch": 2224} {"train_loss": -11.238073348999023, "global_step": 373647, "epoch": 2224} {"train_loss": -11.491043090820312, "global_step": 373648, "epoch": 2224} {"train_loss": -11.314759254455566, "global_step": 373649, "epoch": 2224} {"train_loss": -12.040611267089844, "global_step": 373650, "epoch": 2224} {"train_loss": -11.892754554748535, "global_step": 373651, "epoch": 2224} {"train_loss": -11.718080520629883, "global_step": 373652, "epoch": 2224} {"train_loss": -11.553691864013672, "global_step": 373653, "epoch": 2224} {"train_loss": -12.128937721252441, "global_step": 373654, "epoch": 2224} {"train_loss": -11.794670104980469, "global_step": 373655, "epoch": 2224} {"train_loss": -11.909736633300781, "global_step": 373656, "epoch": 2224} {"train_loss": -12.12408447265625, "global_step": 373657, "epoch": 2224} {"train_loss": -11.991222381591797, "global_step": 373658, "epoch": 2224} {"train_loss": -11.941102981567383, "global_step": 373659, "epoch": 2224} {"train_loss": -11.71378231048584, "global_step": 373660, "epoch": 2224} {"train_loss": -11.850375175476074, "global_step": 373661, "epoch": 2224} {"train_loss": -12.076976776123047, "global_step": 373662, "epoch": 2224} {"train_loss": -11.909271240234375, "global_step": 373663, "epoch": 2224} {"train_loss": -12.247757911682129, "global_step": 373664, "epoch": 2224} {"train_loss": -11.840204238891602, "global_step": 373665, "epoch": 2224} {"train_loss": -12.147976875305176, "global_step": 373666, "epoch": 2224} {"train_loss": -12.326769828796387, "global_step": 373667, "epoch": 2224} {"train_loss": -12.07502555847168, "global_step": 373668, "epoch": 2224} {"train_loss": -11.996667861938477, "global_step": 373669, "epoch": 2224} {"train_loss": -12.343033790588379, "global_step": 373670, "epoch": 2224} {"train_loss": -12.281207084655762, "global_step": 373671, "epoch": 2224} {"train_loss": -12.405862808227539, "global_step": 373672, "epoch": 2224} {"train_loss": -12.355327606201172, "global_step": 373673, "epoch": 2224} {"train_loss": -12.318609237670898, "global_step": 373674, "epoch": 2224} {"train_loss": -12.037313461303711, "global_step": 373675, "epoch": 2224} {"train_loss": -12.342569351196289, "global_step": 373676, "epoch": 2224} {"train_loss": -12.151256561279297, "global_step": 373677, "epoch": 2224} {"train_loss": -12.252673149108887, "global_step": 373678, "epoch": 2224} {"train_loss": -12.301761627197266, "global_step": 373679, "epoch": 2224} {"train_loss": -12.374300003051758, "global_step": 373680, "epoch": 2224} {"train_loss": -12.455101013183594, "global_step": 373681, "epoch": 2224} {"train_loss": -12.42544174194336, "global_step": 373682, "epoch": 2224} {"train_loss": -12.467432022094727, "global_step": 373683, "epoch": 2224} {"train_loss": -12.440406799316406, "global_step": 373684, "epoch": 2224} {"train_loss": -12.258583068847656, "global_step": 373685, "epoch": 2224} {"train_loss": -12.464841842651367, "global_step": 373686, "epoch": 2224} {"train_loss": -12.44932746887207, "global_step": 373687, "epoch": 2224} {"train_loss": -12.576473236083984, "global_step": 373688, "epoch": 2224} {"train_loss": -12.412064552307129, "global_step": 373689, "epoch": 2224} {"train_loss": -12.210824966430664, "global_step": 373690, "epoch": 2224} {"train_loss": -12.358665466308594, "global_step": 373691, "epoch": 2224} {"train_loss": -12.475375175476074, "global_step": 373692, "epoch": 2224} {"train_loss": -12.400911331176758, "global_step": 373693, "epoch": 2224} {"train_loss": -11.791548728942871, "global_step": 373694, "epoch": 2224} {"train_loss": -12.492782592773438, "global_step": 373695, "epoch": 2224} {"train_loss": -12.217586517333984, "global_step": 373696, "epoch": 2224} {"train_loss": -12.533313751220703, "global_step": 373697, "epoch": 2224} {"train_loss": -12.488773345947266, "global_step": 373698, "epoch": 2224} {"train_loss": -12.471647262573242, "global_step": 373699, "epoch": 2224} {"train_loss": -12.576083183288574, "global_step": 373700, "epoch": 2224} {"train_loss": -12.562079429626465, "global_step": 373701, "epoch": 2224} {"train_loss": -12.45783805847168, "global_step": 373702, "epoch": 2224} {"train_loss": -12.248798370361328, "global_step": 373703, "epoch": 2224} {"train_loss": -12.3077392578125, "global_step": 373704, "epoch": 2224} {"train_loss": -12.270269393920898, "global_step": 373705, "epoch": 2224} {"train_loss": -12.329111099243164, "global_step": 373706, "epoch": 2224} {"train_loss": -12.272439956665039, "global_step": 373707, "epoch": 2224} {"train_loss": -12.46712875366211, "global_step": 373708, "epoch": 2224} {"train_loss": -12.474668502807617, "global_step": 373709, "epoch": 2224} {"train_loss": -12.262653350830078, "global_step": 373710, "epoch": 2224} {"train_loss": -12.491503715515137, "global_step": 373711, "epoch": 2224} {"train_loss": -12.336118698120117, "global_step": 373712, "epoch": 2224} {"train_loss": -12.7177095413208, "global_step": 373713, "epoch": 2224} {"train_loss": -12.169994354248047, "global_step": 373714, "epoch": 2224} {"train_loss": -12.527037620544434, "global_step": 373715, "epoch": 2224} {"train_loss": -11.888185501098633, "global_step": 373716, "epoch": 2224} {"train_loss": -12.316946029663086, "global_step": 373717, "epoch": 2224} {"train_loss": -12.541258811950684, "global_step": 373718, "epoch": 2224} {"train_loss": -12.641023635864258, "global_step": 373719, "epoch": 2224} {"train_loss": -12.213813781738281, "global_step": 373720, "epoch": 2224} {"train_loss": -12.3612060546875, "global_step": 373721, "epoch": 2224} {"train_loss": -12.531095504760742, "global_step": 373722, "epoch": 2224} {"train_loss": -12.401763916015625, "global_step": 373723, "epoch": 2224} {"train_loss": -12.399236679077148, "global_step": 373724, "epoch": 2224} {"train_loss": -12.548717498779297, "global_step": 373725, "epoch": 2224} {"train_loss": -12.605489730834961, "global_step": 373726, "epoch": 2224} {"train_loss": -12.56629467010498, "global_step": 373727, "epoch": 2224} {"train_loss": -12.637331008911133, "global_step": 373728, "epoch": 2224} {"train_loss": -12.445104598999023, "global_step": 373729, "epoch": 2224} {"train_loss": -12.487571716308594, "global_step": 373730, "epoch": 2224} {"train_loss": -12.342781066894531, "global_step": 373731, "epoch": 2224} {"train_loss": -12.69929027557373, "global_step": 373732, "epoch": 2224} {"train_loss": -12.45108413696289, "global_step": 373733, "epoch": 2224} {"train_loss": -12.611988067626953, "global_step": 373734, "epoch": 2224} {"train_loss": -12.565423965454102, "global_step": 373735, "epoch": 2224} {"train_loss": -12.664643287658691, "global_step": 373736, "epoch": 2224} {"train_loss": -12.615028381347656, "global_step": 373737, "epoch": 2224} {"train_loss": -12.592321395874023, "global_step": 373738, "epoch": 2224} {"train_loss": -12.674484252929688, "global_step": 373739, "epoch": 2224} {"train_loss": -12.921770095825195, "global_step": 373740, "epoch": 2224} {"train_loss": -12.747879981994629, "global_step": 373741, "epoch": 2224} {"train_loss": -12.422913551330566, "global_step": 373742, "epoch": 2224} {"train_loss": -12.45209789276123, "global_step": 373743, "epoch": 2224} {"train_loss": -12.673019409179688, "global_step": 373744, "epoch": 2224} {"train_loss": -12.349014282226562, "global_step": 373745, "epoch": 2224} {"train_loss": -12.710897445678711, "global_step": 373746, "epoch": 2224} {"train_loss": -12.531517028808594, "global_step": 373747, "epoch": 2224} {"train_loss": -12.033302307128906, "global_step": 373748, "epoch": 2224} {"train_loss": -11.575458526611328, "global_step": 373749, "epoch": 2224} {"train_loss": -12.12100601196289, "global_step": 373750, "epoch": 2224} {"train_loss": -12.51233196258545, "global_step": 373751, "epoch": 2224} {"train_loss": -12.271581649780273, "global_step": 373752, "epoch": 2224} {"train_loss": -11.045833587646484, "global_step": 373753, "epoch": 2224} {"train_loss": -9.21763801574707, "global_step": 373754, "epoch": 2224} {"train_loss": -11.78148078918457, "global_step": 373755, "epoch": 2224} {"train_loss": -10.60139274597168, "global_step": 373756, "epoch": 2224} {"train_loss": -8.043346405029297, "global_step": 373757, "epoch": 2224} {"train_loss": -8.371015548706055, "global_step": 373758, "epoch": 2224} {"train_loss": -10.583012580871582, "global_step": 373759, "epoch": 2224} {"train_loss": -9.769349098205566, "global_step": 373760, "epoch": 2224} {"train_loss": -10.831547737121582, "global_step": 373761, "epoch": 2224} {"train_loss": -10.601531982421875, "global_step": 373762, "epoch": 2224} {"train_loss": -10.851420402526855, "global_step": 373763, "epoch": 2224} {"train_loss": -11.142557144165039, "global_step": 373764, "epoch": 2224} {"train_loss": -11.260848045349121, "global_step": 373765, "epoch": 2224} {"train_loss": -10.610719680786133, "global_step": 373766, "epoch": 2224} {"train_loss": -9.9514741897583, "global_step": 373767, "epoch": 2224} {"train_loss": -10.514846801757812, "global_step": 373768, "epoch": 2224} {"train_loss": -10.904435157775879, "global_step": 373769, "epoch": 2224} {"train_loss": -11.147640228271484, "global_step": 373770, "epoch": 2224} {"train_loss": -11.522817611694336, "global_step": 373771, "epoch": 2224} {"train_loss": -10.27783489227295, "global_step": 373772, "epoch": 2224} {"train_loss": -10.87389087677002, "global_step": 373773, "epoch": 2224} {"train_loss": -11.760875701904297, "global_step": 373774, "epoch": 2224} {"train_loss": -11.95020866394043, "global_step": 373775, "epoch": 2224} {"train_loss": -11.703838348388672, "global_step": 373776, "epoch": 2224} {"train_loss": -11.57041072845459, "global_step": 373777, "epoch": 2224} {"train_loss": -11.236581802368164, "global_step": 373778, "epoch": 2224} {"train_loss": -12.165763854980469, "global_step": 373779, "epoch": 2224} {"train_loss": -12.008587837219238, "global_step": 373780, "epoch": 2224} {"train_loss": -11.794025421142578, "global_step": 373781, "epoch": 2224} {"train_loss": -12.060310363769531, "global_step": 373782, "epoch": 2224} {"train_loss": -12.007883071899414, "global_step": 373783, "epoch": 2224} {"train_loss": -11.366334915161133, "global_step": 373784, "epoch": 2224} {"train_loss": -12.151298522949219, "global_step": 373785, "epoch": 2224} {"train_loss": -11.689611434936523, "global_step": 373786, "epoch": 2224} {"train_loss": -11.504709243774414, "global_step": 373787, "epoch": 2224} {"train_loss": -12.055545806884766, "global_step": 373788, "epoch": 2224} {"train_loss": -11.538379669189453, "global_step": 373789, "epoch": 2224} {"train_loss": -12.043471336364746, "global_step": 373790, "epoch": 2224} {"train_loss": -11.88461685180664, "global_step": 373791, "epoch": 2224} {"train_loss": -11.806943893432617, "global_step": 373792, "epoch": 2224} {"train_loss": -11.785307884216309, "global_step": 373793, "epoch": 2224} {"train_loss": -11.810677528381348, "global_step": 373794, "epoch": 2224} {"train_loss": -12.116056442260742, "global_step": 373795, "epoch": 2224} {"train_loss": -11.83709716796875, "global_step": 373796, "epoch": 2224} {"train_loss": -12.173789024353027, "global_step": 373797, "epoch": 2224} {"train_loss": -11.877655029296875, "global_step": 373798, "epoch": 2224} {"train_loss": -11.866799734887623, "global_step": 373799, "epoch": 2224, "val_loss": 295259.65625} {"train_loss": -12.217988014221191, "global_step": 373800, "epoch": 2225} {"train_loss": -11.834423065185547, "global_step": 373801, "epoch": 2225} {"train_loss": -12.464824676513672, "global_step": 373802, "epoch": 2225} {"train_loss": -11.944180488586426, "global_step": 373803, "epoch": 2225} {"train_loss": -12.127420425415039, "global_step": 373804, "epoch": 2225} {"train_loss": -12.441734313964844, "global_step": 373805, "epoch": 2225} {"train_loss": -12.290302276611328, "global_step": 373806, "epoch": 2225} {"train_loss": -12.295876502990723, "global_step": 373807, "epoch": 2225} {"train_loss": -12.291316986083984, "global_step": 373808, "epoch": 2225} {"train_loss": -12.403741836547852, "global_step": 373809, "epoch": 2225} {"train_loss": -12.099767684936523, "global_step": 373810, "epoch": 2225} {"train_loss": -12.26689624786377, "global_step": 373811, "epoch": 2225} {"train_loss": -12.090401649475098, "global_step": 373812, "epoch": 2225} {"train_loss": -12.245849609375, "global_step": 373813, "epoch": 2225} {"train_loss": -12.165718078613281, "global_step": 373814, "epoch": 2225} {"train_loss": -11.680858612060547, "global_step": 373815, "epoch": 2225} {"train_loss": -12.006258010864258, "global_step": 373816, "epoch": 2225} {"train_loss": -11.980250358581543, "global_step": 373817, "epoch": 2225} {"train_loss": -11.714271545410156, "global_step": 373818, "epoch": 2225} {"train_loss": -12.196171760559082, "global_step": 373819, "epoch": 2225} {"train_loss": -12.203495025634766, "global_step": 373820, "epoch": 2225} {"train_loss": -12.014148712158203, "global_step": 373821, "epoch": 2225} {"train_loss": -12.001298904418945, "global_step": 373822, "epoch": 2225} {"train_loss": -12.210277557373047, "global_step": 373823, "epoch": 2225} {"train_loss": -12.175607681274414, "global_step": 373824, "epoch": 2225} {"train_loss": -11.966758728027344, "global_step": 373825, "epoch": 2225} {"train_loss": -12.362060546875, "global_step": 373826, "epoch": 2225} {"train_loss": -12.00406265258789, "global_step": 373827, "epoch": 2225} {"train_loss": -12.272377967834473, "global_step": 373828, "epoch": 2225} {"train_loss": -11.092530250549316, "global_step": 373829, "epoch": 2225} {"train_loss": -11.983572006225586, "global_step": 373830, "epoch": 2225} {"train_loss": -12.086106300354004, "global_step": 373831, "epoch": 2225} {"train_loss": -12.445375442504883, "global_step": 373832, "epoch": 2225} {"train_loss": -12.382898330688477, "global_step": 373833, "epoch": 2225} {"train_loss": -12.42747974395752, "global_step": 373834, "epoch": 2225} {"train_loss": -12.33685302734375, "global_step": 373835, "epoch": 2225} {"train_loss": -12.313043594360352, "global_step": 373836, "epoch": 2225} {"train_loss": -12.501224517822266, "global_step": 373837, "epoch": 2225} {"train_loss": -12.272797584533691, "global_step": 373838, "epoch": 2225} {"train_loss": -12.034271240234375, "global_step": 373839, "epoch": 2225} {"train_loss": -12.15751838684082, "global_step": 373840, "epoch": 2225} {"train_loss": -12.618316650390625, "global_step": 373841, "epoch": 2225} {"train_loss": -12.455696105957031, "global_step": 373842, "epoch": 2225} {"train_loss": -12.60311222076416, "global_step": 373843, "epoch": 2225} {"train_loss": -12.484798431396484, "global_step": 373844, "epoch": 2225} {"train_loss": -12.243709564208984, "global_step": 373845, "epoch": 2225} {"train_loss": -12.32164192199707, "global_step": 373846, "epoch": 2225} {"train_loss": -12.496448516845703, "global_step": 373847, "epoch": 2225} {"train_loss": -12.297256469726562, "global_step": 373848, "epoch": 2225} {"train_loss": -12.63941764831543, "global_step": 373849, "epoch": 2225} {"train_loss": -12.430948257446289, "global_step": 373850, "epoch": 2225} {"train_loss": -12.359454154968262, "global_step": 373851, "epoch": 2225} {"train_loss": -12.558670043945312, "global_step": 373852, "epoch": 2225} {"train_loss": -11.951862335205078, "global_step": 373853, "epoch": 2225} {"train_loss": -12.288021087646484, "global_step": 373854, "epoch": 2225} {"train_loss": -11.668448448181152, "global_step": 373855, "epoch": 2225} {"train_loss": -11.623730659484863, "global_step": 373856, "epoch": 2225} {"train_loss": -11.881824493408203, "global_step": 373857, "epoch": 2225} {"train_loss": -12.365571975708008, "global_step": 373858, "epoch": 2225} {"train_loss": -11.824222564697266, "global_step": 373859, "epoch": 2225} {"train_loss": -11.768479347229004, "global_step": 373860, "epoch": 2225} {"train_loss": -12.263440132141113, "global_step": 373861, "epoch": 2225} {"train_loss": -12.092327117919922, "global_step": 373862, "epoch": 2225} {"train_loss": -11.928445816040039, "global_step": 373863, "epoch": 2225} {"train_loss": -12.034280776977539, "global_step": 373864, "epoch": 2225} {"train_loss": -12.25295352935791, "global_step": 373865, "epoch": 2225} {"train_loss": -12.143278121948242, "global_step": 373866, "epoch": 2225} {"train_loss": -12.163195610046387, "global_step": 373867, "epoch": 2225} {"train_loss": -12.348902702331543, "global_step": 373868, "epoch": 2225} {"train_loss": -12.202162742614746, "global_step": 373869, "epoch": 2225} {"train_loss": -12.266073226928711, "global_step": 373870, "epoch": 2225} {"train_loss": -12.14819622039795, "global_step": 373871, "epoch": 2225} {"train_loss": -11.918476104736328, "global_step": 373872, "epoch": 2225} {"train_loss": -10.881824493408203, "global_step": 373873, "epoch": 2225} {"train_loss": -12.162744522094727, "global_step": 373874, "epoch": 2225} {"train_loss": -11.916746139526367, "global_step": 373875, "epoch": 2225} {"train_loss": -11.435953140258789, "global_step": 373876, "epoch": 2225} {"train_loss": -12.34579849243164, "global_step": 373877, "epoch": 2225} {"train_loss": -11.164687156677246, "global_step": 373878, "epoch": 2225} {"train_loss": -12.210042953491211, "global_step": 373879, "epoch": 2225} {"train_loss": -11.735923767089844, "global_step": 373880, "epoch": 2225} {"train_loss": -11.91418743133545, "global_step": 373881, "epoch": 2225} {"train_loss": -11.674333572387695, "global_step": 373882, "epoch": 2225} {"train_loss": -10.772909164428711, "global_step": 373883, "epoch": 2225} {"train_loss": -11.44314956665039, "global_step": 373884, "epoch": 2225} {"train_loss": -11.037642478942871, "global_step": 373885, "epoch": 2225} {"train_loss": -9.689738273620605, "global_step": 373886, "epoch": 2225} {"train_loss": -9.467053413391113, "global_step": 373887, "epoch": 2225} {"train_loss": -10.893789291381836, "global_step": 373888, "epoch": 2225} {"train_loss": -10.179252624511719, "global_step": 373889, "epoch": 2225} {"train_loss": -10.673990249633789, "global_step": 373890, "epoch": 2225} {"train_loss": -10.401951789855957, "global_step": 373891, "epoch": 2225} {"train_loss": -9.057767868041992, "global_step": 373892, "epoch": 2225} {"train_loss": -9.116212844848633, "global_step": 373893, "epoch": 2225} {"train_loss": -9.412352561950684, "global_step": 373894, "epoch": 2225} {"train_loss": -9.910770416259766, "global_step": 373895, "epoch": 2225} {"train_loss": -9.333881378173828, "global_step": 373896, "epoch": 2225} {"train_loss": -10.628314971923828, "global_step": 373897, "epoch": 2225} {"train_loss": -11.126354217529297, "global_step": 373898, "epoch": 2225} {"train_loss": -10.429040908813477, "global_step": 373899, "epoch": 2225} {"train_loss": -11.04640007019043, "global_step": 373900, "epoch": 2225} {"train_loss": -11.459047317504883, "global_step": 373901, "epoch": 2225} {"train_loss": -10.348066329956055, "global_step": 373902, "epoch": 2225} {"train_loss": -11.446735382080078, "global_step": 373903, "epoch": 2225} {"train_loss": -10.175057411193848, "global_step": 373904, "epoch": 2225} {"train_loss": -11.249034881591797, "global_step": 373905, "epoch": 2225} {"train_loss": -10.21143913269043, "global_step": 373906, "epoch": 2225} {"train_loss": -10.576493263244629, "global_step": 373907, "epoch": 2225} {"train_loss": -11.234286308288574, "global_step": 373908, "epoch": 2225} {"train_loss": -10.954231262207031, "global_step": 373909, "epoch": 2225} {"train_loss": -11.75843620300293, "global_step": 373910, "epoch": 2225} {"train_loss": -11.051956176757812, "global_step": 373911, "epoch": 2225} {"train_loss": -11.56416130065918, "global_step": 373912, "epoch": 2225} {"train_loss": -11.38613510131836, "global_step": 373913, "epoch": 2225} {"train_loss": -11.469094276428223, "global_step": 373914, "epoch": 2225} {"train_loss": -11.470990180969238, "global_step": 373915, "epoch": 2225} {"train_loss": -11.39285659790039, "global_step": 373916, "epoch": 2225} {"train_loss": -11.6195707321167, "global_step": 373917, "epoch": 2225} {"train_loss": -11.751291275024414, "global_step": 373918, "epoch": 2225} {"train_loss": -11.92654800415039, "global_step": 373919, "epoch": 2225} {"train_loss": -11.327649116516113, "global_step": 373920, "epoch": 2225} {"train_loss": -11.440839767456055, "global_step": 373921, "epoch": 2225} {"train_loss": -12.205337524414062, "global_step": 373922, "epoch": 2225} {"train_loss": -11.361583709716797, "global_step": 373923, "epoch": 2225} {"train_loss": -12.075783729553223, "global_step": 373924, "epoch": 2225} {"train_loss": -12.065143585205078, "global_step": 373925, "epoch": 2225} {"train_loss": -12.190572738647461, "global_step": 373926, "epoch": 2225} {"train_loss": -12.078052520751953, "global_step": 373927, "epoch": 2225} {"train_loss": -12.047540664672852, "global_step": 373928, "epoch": 2225} {"train_loss": -11.868392944335938, "global_step": 373929, "epoch": 2225} {"train_loss": -12.20582103729248, "global_step": 373930, "epoch": 2225} {"train_loss": -11.955979347229004, "global_step": 373931, "epoch": 2225} {"train_loss": -12.408737182617188, "global_step": 373932, "epoch": 2225} {"train_loss": -12.320929527282715, "global_step": 373933, "epoch": 2225} {"train_loss": -12.242319107055664, "global_step": 373934, "epoch": 2225} {"train_loss": -12.407123565673828, "global_step": 373935, "epoch": 2225} {"train_loss": -12.352555274963379, "global_step": 373936, "epoch": 2225} {"train_loss": -12.25671100616455, "global_step": 373937, "epoch": 2225} {"train_loss": -12.238388061523438, "global_step": 373938, "epoch": 2225} {"train_loss": -12.287395477294922, "global_step": 373939, "epoch": 2225} {"train_loss": -12.490629196166992, "global_step": 373940, "epoch": 2225} {"train_loss": -12.361211776733398, "global_step": 373941, "epoch": 2225} {"train_loss": -12.350459098815918, "global_step": 373942, "epoch": 2225} {"train_loss": -12.467117309570312, "global_step": 373943, "epoch": 2225} {"train_loss": -12.351703643798828, "global_step": 373944, "epoch": 2225} {"train_loss": -12.22400188446045, "global_step": 373945, "epoch": 2225} {"train_loss": -12.227277755737305, "global_step": 373946, "epoch": 2225} {"train_loss": -12.453651428222656, "global_step": 373947, "epoch": 2225} {"train_loss": -12.339155197143555, "global_step": 373948, "epoch": 2225} {"train_loss": -12.3011474609375, "global_step": 373949, "epoch": 2225} {"train_loss": -12.568607330322266, "global_step": 373950, "epoch": 2225} {"train_loss": -12.61498737335205, "global_step": 373951, "epoch": 2225} {"train_loss": -12.504420280456543, "global_step": 373952, "epoch": 2225} {"train_loss": -12.56214714050293, "global_step": 373953, "epoch": 2225} {"train_loss": -12.550756454467773, "global_step": 373954, "epoch": 2225} {"train_loss": -12.621110916137695, "global_step": 373955, "epoch": 2225} {"train_loss": -12.653234481811523, "global_step": 373956, "epoch": 2225} {"train_loss": -12.571503639221191, "global_step": 373957, "epoch": 2225} {"train_loss": -12.577527046203613, "global_step": 373958, "epoch": 2225} {"train_loss": -12.654878616333008, "global_step": 373959, "epoch": 2225} {"train_loss": -12.37826156616211, "global_step": 373960, "epoch": 2225} {"train_loss": -12.700662612915039, "global_step": 373961, "epoch": 2225} {"train_loss": -12.553285598754883, "global_step": 373962, "epoch": 2225} {"train_loss": -12.537909507751465, "global_step": 373963, "epoch": 2225} {"train_loss": -12.515527725219727, "global_step": 373964, "epoch": 2225} {"train_loss": -12.301419258117676, "global_step": 373965, "epoch": 2225} {"train_loss": -12.65643310546875, "global_step": 373966, "epoch": 2225} {"train_loss": -11.874508942876544, "global_step": 373967, "epoch": 2225, "val_loss": 295377.75, "train_action_mse_error": 1.387652039527893} {"train_loss": -12.690656661987305, "global_step": 373968, "epoch": 2226} {"train_loss": -12.872883796691895, "global_step": 373969, "epoch": 2226} {"train_loss": -12.626778602600098, "global_step": 373970, "epoch": 2226} {"train_loss": -12.468145370483398, "global_step": 373971, "epoch": 2226} {"train_loss": -12.635687828063965, "global_step": 373972, "epoch": 2226} {"train_loss": -12.719600677490234, "global_step": 373973, "epoch": 2226} {"train_loss": -12.63508415222168, "global_step": 373974, "epoch": 2226} {"train_loss": -12.711078643798828, "global_step": 373975, "epoch": 2226} {"train_loss": -12.887771606445312, "global_step": 373976, "epoch": 2226} {"train_loss": -12.72008991241455, "global_step": 373977, "epoch": 2226} {"train_loss": -12.633362770080566, "global_step": 373978, "epoch": 2226} {"train_loss": -12.737797737121582, "global_step": 373979, "epoch": 2226} {"train_loss": -12.562405586242676, "global_step": 373980, "epoch": 2226} {"train_loss": -12.651939392089844, "global_step": 373981, "epoch": 2226} {"train_loss": -12.706745147705078, "global_step": 373982, "epoch": 2226} {"train_loss": -12.482738494873047, "global_step": 373983, "epoch": 2226} {"train_loss": -12.693367004394531, "global_step": 373984, "epoch": 2226} {"train_loss": -12.772638320922852, "global_step": 373985, "epoch": 2226} {"train_loss": -12.089784622192383, "global_step": 373986, "epoch": 2226} {"train_loss": -11.963249206542969, "global_step": 373987, "epoch": 2226} {"train_loss": -12.413010597229004, "global_step": 373988, "epoch": 2226} {"train_loss": -12.50857925415039, "global_step": 373989, "epoch": 2226} {"train_loss": -12.534461975097656, "global_step": 373990, "epoch": 2226} {"train_loss": -12.174022674560547, "global_step": 373991, "epoch": 2226} {"train_loss": -12.279886245727539, "global_step": 373992, "epoch": 2226} {"train_loss": -12.611909866333008, "global_step": 373993, "epoch": 2226} {"train_loss": -12.649673461914062, "global_step": 373994, "epoch": 2226} {"train_loss": -12.619930267333984, "global_step": 373995, "epoch": 2226} {"train_loss": -12.476470947265625, "global_step": 373996, "epoch": 2226} {"train_loss": -12.768622398376465, "global_step": 373997, "epoch": 2226} {"train_loss": -11.966594696044922, "global_step": 373998, "epoch": 2226} {"train_loss": -12.433370590209961, "global_step": 373999, "epoch": 2226} {"train_loss": -12.600133895874023, "global_step": 374000, "epoch": 2226} {"train_loss": -12.578422546386719, "global_step": 374001, "epoch": 2226} {"train_loss": -12.210744857788086, "global_step": 374002, "epoch": 2226} {"train_loss": -12.279475212097168, "global_step": 374003, "epoch": 2226} {"train_loss": -12.353591918945312, "global_step": 374004, "epoch": 2226} {"train_loss": -12.184818267822266, "global_step": 374005, "epoch": 2226} {"train_loss": -12.3539457321167, "global_step": 374006, "epoch": 2226} {"train_loss": -12.451862335205078, "global_step": 374007, "epoch": 2226} {"train_loss": -12.117660522460938, "global_step": 374008, "epoch": 2226} {"train_loss": -12.233633041381836, "global_step": 374009, "epoch": 2226} {"train_loss": -12.81137466430664, "global_step": 374010, "epoch": 2226} {"train_loss": -11.829233169555664, "global_step": 374011, "epoch": 2226} {"train_loss": -11.718293190002441, "global_step": 374012, "epoch": 2226} {"train_loss": -12.119172096252441, "global_step": 374013, "epoch": 2226} {"train_loss": -12.221185684204102, "global_step": 374014, "epoch": 2226} {"train_loss": -11.730372428894043, "global_step": 374015, "epoch": 2226} {"train_loss": -11.702503204345703, "global_step": 374016, "epoch": 2226} {"train_loss": -11.539657592773438, "global_step": 374017, "epoch": 2226} {"train_loss": -11.542755126953125, "global_step": 374018, "epoch": 2226} {"train_loss": -12.056000709533691, "global_step": 374019, "epoch": 2226} {"train_loss": -11.767810821533203, "global_step": 374020, "epoch": 2226} {"train_loss": -11.769017219543457, "global_step": 374021, "epoch": 2226} {"train_loss": -12.0166654586792, "global_step": 374022, "epoch": 2226} {"train_loss": -12.417570114135742, "global_step": 374023, "epoch": 2226} {"train_loss": -12.260892868041992, "global_step": 374024, "epoch": 2226} {"train_loss": -11.390357971191406, "global_step": 374025, "epoch": 2226} {"train_loss": -12.462909698486328, "global_step": 374026, "epoch": 2226} {"train_loss": -11.1923828125, "global_step": 374027, "epoch": 2226} {"train_loss": -10.370222091674805, "global_step": 374028, "epoch": 2226} {"train_loss": -10.810783386230469, "global_step": 374029, "epoch": 2226} {"train_loss": -11.299031257629395, "global_step": 374030, "epoch": 2226} {"train_loss": -8.822349548339844, "global_step": 374031, "epoch": 2226} {"train_loss": -7.602756500244141, "global_step": 374032, "epoch": 2226} {"train_loss": -7.442939281463623, "global_step": 374033, "epoch": 2226} {"train_loss": -6.944338798522949, "global_step": 374034, "epoch": 2226} {"train_loss": -8.912036895751953, "global_step": 374035, "epoch": 2226} {"train_loss": -7.590854644775391, "global_step": 374036, "epoch": 2226} {"train_loss": -8.060911178588867, "global_step": 374037, "epoch": 2226} {"train_loss": -8.49521255493164, "global_step": 374038, "epoch": 2226} {"train_loss": -8.527894973754883, "global_step": 374039, "epoch": 2226} {"train_loss": -9.055671691894531, "global_step": 374040, "epoch": 2226} {"train_loss": -8.470846176147461, "global_step": 374041, "epoch": 2226} {"train_loss": -9.0241117477417, "global_step": 374042, "epoch": 2226} {"train_loss": -9.09997844696045, "global_step": 374043, "epoch": 2226} {"train_loss": -9.143732070922852, "global_step": 374044, "epoch": 2226} {"train_loss": -11.029556274414062, "global_step": 374045, "epoch": 2226} {"train_loss": -10.623098373413086, "global_step": 374046, "epoch": 2226} {"train_loss": -10.923972129821777, "global_step": 374047, "epoch": 2226} {"train_loss": -9.1806640625, "global_step": 374048, "epoch": 2226} {"train_loss": -9.473876953125, "global_step": 374049, "epoch": 2226} {"train_loss": -9.333599090576172, "global_step": 374050, "epoch": 2226} {"train_loss": -9.950961112976074, "global_step": 374051, "epoch": 2226} {"train_loss": -9.699454307556152, "global_step": 374052, "epoch": 2226} {"train_loss": -8.652734756469727, "global_step": 374053, "epoch": 2226} {"train_loss": -9.862249374389648, "global_step": 374054, "epoch": 2226} {"train_loss": -10.352312088012695, "global_step": 374055, "epoch": 2226} {"train_loss": -10.249717712402344, "global_step": 374056, "epoch": 2226} {"train_loss": -10.457633018493652, "global_step": 374057, "epoch": 2226} {"train_loss": -10.31379508972168, "global_step": 374058, "epoch": 2226} {"train_loss": -10.843477249145508, "global_step": 374059, "epoch": 2226} {"train_loss": -9.988017082214355, "global_step": 374060, "epoch": 2226} {"train_loss": -10.651789665222168, "global_step": 374061, "epoch": 2226} {"train_loss": -10.923833847045898, "global_step": 374062, "epoch": 2226} {"train_loss": -9.4671630859375, "global_step": 374063, "epoch": 2226} {"train_loss": -11.444063186645508, "global_step": 374064, "epoch": 2226} {"train_loss": -9.83087158203125, "global_step": 374065, "epoch": 2226} {"train_loss": -11.604524612426758, "global_step": 374066, "epoch": 2226} {"train_loss": -9.768478393554688, "global_step": 374067, "epoch": 2226} {"train_loss": -11.577943801879883, "global_step": 374068, "epoch": 2226} {"train_loss": -10.886934280395508, "global_step": 374069, "epoch": 2226} {"train_loss": -11.444337844848633, "global_step": 374070, "epoch": 2226} {"train_loss": -10.985823631286621, "global_step": 374071, "epoch": 2226} {"train_loss": -10.669225692749023, "global_step": 374072, "epoch": 2226} {"train_loss": -10.632733345031738, "global_step": 374073, "epoch": 2226} {"train_loss": -11.241118431091309, "global_step": 374074, "epoch": 2226} {"train_loss": -11.023843765258789, "global_step": 374075, "epoch": 2226} {"train_loss": -10.630280494689941, "global_step": 374076, "epoch": 2226} {"train_loss": -11.385828971862793, "global_step": 374077, "epoch": 2226} {"train_loss": -11.249002456665039, "global_step": 374078, "epoch": 2226} {"train_loss": -11.190343856811523, "global_step": 374079, "epoch": 2226} {"train_loss": -11.497699737548828, "global_step": 374080, "epoch": 2226} {"train_loss": -11.046812057495117, "global_step": 374081, "epoch": 2226} {"train_loss": -11.670995712280273, "global_step": 374082, "epoch": 2226} {"train_loss": -11.609174728393555, "global_step": 374083, "epoch": 2226} {"train_loss": -11.825222969055176, "global_step": 374084, "epoch": 2226} {"train_loss": -11.420459747314453, "global_step": 374085, "epoch": 2226} {"train_loss": -12.108219146728516, "global_step": 374086, "epoch": 2226} {"train_loss": -11.387055397033691, "global_step": 374087, "epoch": 2226} {"train_loss": -11.874371528625488, "global_step": 374088, "epoch": 2226} {"train_loss": -11.859813690185547, "global_step": 374089, "epoch": 2226} {"train_loss": -11.65237808227539, "global_step": 374090, "epoch": 2226} {"train_loss": -12.141366958618164, "global_step": 374091, "epoch": 2226} {"train_loss": -11.680316925048828, "global_step": 374092, "epoch": 2226} {"train_loss": -11.789950370788574, "global_step": 374093, "epoch": 2226} {"train_loss": -11.88176155090332, "global_step": 374094, "epoch": 2226} {"train_loss": -11.724299430847168, "global_step": 374095, "epoch": 2226} {"train_loss": -11.926912307739258, "global_step": 374096, "epoch": 2226} {"train_loss": -12.148880004882812, "global_step": 374097, "epoch": 2226} {"train_loss": -11.937992095947266, "global_step": 374098, "epoch": 2226} {"train_loss": -12.177874565124512, "global_step": 374099, "epoch": 2226} {"train_loss": -11.994721412658691, "global_step": 374100, "epoch": 2226} {"train_loss": -12.037694931030273, "global_step": 374101, "epoch": 2226} {"train_loss": -12.230209350585938, "global_step": 374102, "epoch": 2226} {"train_loss": -12.070182800292969, "global_step": 374103, "epoch": 2226} {"train_loss": -12.0699462890625, "global_step": 374104, "epoch": 2226} {"train_loss": -12.119640350341797, "global_step": 374105, "epoch": 2226} {"train_loss": -12.205378532409668, "global_step": 374106, "epoch": 2226} {"train_loss": -11.892297744750977, "global_step": 374107, "epoch": 2226} {"train_loss": -12.265408515930176, "global_step": 374108, "epoch": 2226} {"train_loss": -12.127193450927734, "global_step": 374109, "epoch": 2226} {"train_loss": -12.110527992248535, "global_step": 374110, "epoch": 2226} {"train_loss": -12.179155349731445, "global_step": 374111, "epoch": 2226} {"train_loss": -12.023008346557617, "global_step": 374112, "epoch": 2226} {"train_loss": -12.330126762390137, "global_step": 374113, "epoch": 2226} {"train_loss": -12.018835067749023, "global_step": 374114, "epoch": 2226} {"train_loss": -12.151830673217773, "global_step": 374115, "epoch": 2226} {"train_loss": -12.182879447937012, "global_step": 374116, "epoch": 2226} {"train_loss": -12.16781234741211, "global_step": 374117, "epoch": 2226} {"train_loss": -12.367111206054688, "global_step": 374118, "epoch": 2226} {"train_loss": -12.172532081604004, "global_step": 374119, "epoch": 2226} {"train_loss": -12.282032012939453, "global_step": 374120, "epoch": 2226} {"train_loss": -12.348004341125488, "global_step": 374121, "epoch": 2226} {"train_loss": -12.273534774780273, "global_step": 374122, "epoch": 2226} {"train_loss": -12.280902862548828, "global_step": 374123, "epoch": 2226} {"train_loss": -12.302023887634277, "global_step": 374124, "epoch": 2226} {"train_loss": -12.034090995788574, "global_step": 374125, "epoch": 2226} {"train_loss": -12.378846168518066, "global_step": 374126, "epoch": 2226} {"train_loss": -12.279884338378906, "global_step": 374127, "epoch": 2226} {"train_loss": -12.39033317565918, "global_step": 374128, "epoch": 2226} {"train_loss": -12.126041412353516, "global_step": 374129, "epoch": 2226} {"train_loss": -12.449748039245605, "global_step": 374130, "epoch": 2226} {"train_loss": -12.419271469116211, "global_step": 374131, "epoch": 2226} {"train_loss": -12.35283088684082, "global_step": 374132, "epoch": 2226} {"train_loss": -12.269126892089844, "global_step": 374133, "epoch": 2226} {"train_loss": -12.442872047424316, "global_step": 374134, "epoch": 2226} {"train_loss": -11.499733456543513, "global_step": 374135, "epoch": 2226, "val_loss": 292778.1875} {"train_loss": -12.423786163330078, "global_step": 374136, "epoch": 2227} {"train_loss": -12.537749290466309, "global_step": 374137, "epoch": 2227} {"train_loss": -12.351278305053711, "global_step": 374138, "epoch": 2227} {"train_loss": -12.514060020446777, "global_step": 374139, "epoch": 2227} {"train_loss": -12.394183158874512, "global_step": 374140, "epoch": 2227} {"train_loss": -12.574442863464355, "global_step": 374141, "epoch": 2227} {"train_loss": -12.596202850341797, "global_step": 374142, "epoch": 2227} {"train_loss": -12.363666534423828, "global_step": 374143, "epoch": 2227} {"train_loss": -12.48409652709961, "global_step": 374144, "epoch": 2227} {"train_loss": -12.67935562133789, "global_step": 374145, "epoch": 2227} {"train_loss": -12.584542274475098, "global_step": 374146, "epoch": 2227} {"train_loss": -12.643871307373047, "global_step": 374147, "epoch": 2227} {"train_loss": -12.563201904296875, "global_step": 374148, "epoch": 2227} {"train_loss": -12.172187805175781, "global_step": 374149, "epoch": 2227} {"train_loss": -12.605417251586914, "global_step": 374150, "epoch": 2227} {"train_loss": -12.725738525390625, "global_step": 374151, "epoch": 2227} {"train_loss": -12.645882606506348, "global_step": 374152, "epoch": 2227} {"train_loss": -12.429060935974121, "global_step": 374153, "epoch": 2227} {"train_loss": -12.88455581665039, "global_step": 374154, "epoch": 2227} {"train_loss": -12.762176513671875, "global_step": 374155, "epoch": 2227} {"train_loss": -12.528940200805664, "global_step": 374156, "epoch": 2227} {"train_loss": -12.773578643798828, "global_step": 374157, "epoch": 2227} {"train_loss": -12.768259048461914, "global_step": 374158, "epoch": 2227} {"train_loss": -12.535374641418457, "global_step": 374159, "epoch": 2227} {"train_loss": -12.587616920471191, "global_step": 374160, "epoch": 2227} {"train_loss": -12.769306182861328, "global_step": 374161, "epoch": 2227} {"train_loss": -12.675209045410156, "global_step": 374162, "epoch": 2227} {"train_loss": -12.362913131713867, "global_step": 374163, "epoch": 2227} {"train_loss": -11.913057327270508, "global_step": 374164, "epoch": 2227} {"train_loss": -12.023588180541992, "global_step": 374165, "epoch": 2227} {"train_loss": -12.088057518005371, "global_step": 374166, "epoch": 2227} {"train_loss": -12.395401000976562, "global_step": 374167, "epoch": 2227} {"train_loss": -11.850211143493652, "global_step": 374168, "epoch": 2227} {"train_loss": -12.180042266845703, "global_step": 374169, "epoch": 2227} {"train_loss": -11.718889236450195, "global_step": 374170, "epoch": 2227} {"train_loss": -10.155858039855957, "global_step": 374171, "epoch": 2227} {"train_loss": -9.329174995422363, "global_step": 374172, "epoch": 2227} {"train_loss": -7.57186222076416, "global_step": 374173, "epoch": 2227} {"train_loss": -9.497480392456055, "global_step": 374174, "epoch": 2227} {"train_loss": -8.922784805297852, "global_step": 374175, "epoch": 2227} {"train_loss": -9.509449005126953, "global_step": 374176, "epoch": 2227} {"train_loss": -9.146474838256836, "global_step": 374177, "epoch": 2227} {"train_loss": -8.804593086242676, "global_step": 374178, "epoch": 2227} {"train_loss": -8.667338371276855, "global_step": 374179, "epoch": 2227} {"train_loss": -11.008169174194336, "global_step": 374180, "epoch": 2227} {"train_loss": -8.677480697631836, "global_step": 374181, "epoch": 2227} {"train_loss": -9.692056655883789, "global_step": 374182, "epoch": 2227} {"train_loss": -9.40982437133789, "global_step": 374183, "epoch": 2227} {"train_loss": -10.805900573730469, "global_step": 374184, "epoch": 2227} {"train_loss": -9.452152252197266, "global_step": 374185, "epoch": 2227} {"train_loss": -9.584931373596191, "global_step": 374186, "epoch": 2227} {"train_loss": -10.59823989868164, "global_step": 374187, "epoch": 2227} {"train_loss": -10.721170425415039, "global_step": 374188, "epoch": 2227} {"train_loss": -11.246740341186523, "global_step": 374189, "epoch": 2227} {"train_loss": -10.490464210510254, "global_step": 374190, "epoch": 2227} {"train_loss": -11.136442184448242, "global_step": 374191, "epoch": 2227} {"train_loss": -9.784021377563477, "global_step": 374192, "epoch": 2227} {"train_loss": -11.025547981262207, "global_step": 374193, "epoch": 2227} {"train_loss": -10.720245361328125, "global_step": 374194, "epoch": 2227} {"train_loss": -10.816524505615234, "global_step": 374195, "epoch": 2227} {"train_loss": -11.2730131149292, "global_step": 374196, "epoch": 2227} {"train_loss": -10.310050964355469, "global_step": 374197, "epoch": 2227} {"train_loss": -10.924612045288086, "global_step": 374198, "epoch": 2227} {"train_loss": -11.112054824829102, "global_step": 374199, "epoch": 2227} {"train_loss": -10.576395034790039, "global_step": 374200, "epoch": 2227} {"train_loss": -11.712324142456055, "global_step": 374201, "epoch": 2227} {"train_loss": -10.565267562866211, "global_step": 374202, "epoch": 2227} {"train_loss": -11.573476791381836, "global_step": 374203, "epoch": 2227} {"train_loss": -11.127471923828125, "global_step": 374204, "epoch": 2227} {"train_loss": -11.499401092529297, "global_step": 374205, "epoch": 2227} {"train_loss": -11.5487642288208, "global_step": 374206, "epoch": 2227} {"train_loss": -11.119611740112305, "global_step": 374207, "epoch": 2227} {"train_loss": -10.947970390319824, "global_step": 374208, "epoch": 2227} {"train_loss": -11.840132713317871, "global_step": 374209, "epoch": 2227} {"train_loss": -10.654610633850098, "global_step": 374210, "epoch": 2227} {"train_loss": -11.974650382995605, "global_step": 374211, "epoch": 2227} {"train_loss": -10.948814392089844, "global_step": 374212, "epoch": 2227} {"train_loss": -12.091718673706055, "global_step": 374213, "epoch": 2227} {"train_loss": -11.491277694702148, "global_step": 374214, "epoch": 2227} {"train_loss": -11.445396423339844, "global_step": 374215, "epoch": 2227} {"train_loss": -11.718564987182617, "global_step": 374216, "epoch": 2227} {"train_loss": -11.627798080444336, "global_step": 374217, "epoch": 2227} {"train_loss": -11.859975814819336, "global_step": 374218, "epoch": 2227} {"train_loss": -11.640533447265625, "global_step": 374219, "epoch": 2227} {"train_loss": -11.638262748718262, "global_step": 374220, "epoch": 2227} {"train_loss": -12.000574111938477, "global_step": 374221, "epoch": 2227} {"train_loss": -11.945478439331055, "global_step": 374222, "epoch": 2227} {"train_loss": -11.56252384185791, "global_step": 374223, "epoch": 2227} {"train_loss": -11.983101844787598, "global_step": 374224, "epoch": 2227} {"train_loss": -11.892557144165039, "global_step": 374225, "epoch": 2227} {"train_loss": -12.146219253540039, "global_step": 374226, "epoch": 2227} {"train_loss": -11.951335906982422, "global_step": 374227, "epoch": 2227} {"train_loss": -11.876148223876953, "global_step": 374228, "epoch": 2227} {"train_loss": -11.954835891723633, "global_step": 374229, "epoch": 2227} {"train_loss": -12.113990783691406, "global_step": 374230, "epoch": 2227} {"train_loss": -12.082475662231445, "global_step": 374231, "epoch": 2227} {"train_loss": -12.140579223632812, "global_step": 374232, "epoch": 2227} {"train_loss": -11.951555252075195, "global_step": 374233, "epoch": 2227} {"train_loss": -12.005125045776367, "global_step": 374234, "epoch": 2227} {"train_loss": -12.239359855651855, "global_step": 374235, "epoch": 2227} {"train_loss": -12.130010604858398, "global_step": 374236, "epoch": 2227} {"train_loss": -12.308005332946777, "global_step": 374237, "epoch": 2227} {"train_loss": -12.321301460266113, "global_step": 374238, "epoch": 2227} {"train_loss": -12.332672119140625, "global_step": 374239, "epoch": 2227} {"train_loss": -12.331796646118164, "global_step": 374240, "epoch": 2227} {"train_loss": -12.053998947143555, "global_step": 374241, "epoch": 2227} {"train_loss": -12.3333740234375, "global_step": 374242, "epoch": 2227} {"train_loss": -12.188916206359863, "global_step": 374243, "epoch": 2227} {"train_loss": -12.058683395385742, "global_step": 374244, "epoch": 2227} {"train_loss": -12.396919250488281, "global_step": 374245, "epoch": 2227} {"train_loss": -12.27367877960205, "global_step": 374246, "epoch": 2227} {"train_loss": -12.308635711669922, "global_step": 374247, "epoch": 2227} {"train_loss": -12.262664794921875, "global_step": 374248, "epoch": 2227} {"train_loss": -12.114826202392578, "global_step": 374249, "epoch": 2227} {"train_loss": -12.113210678100586, "global_step": 374250, "epoch": 2227} {"train_loss": -12.400562286376953, "global_step": 374251, "epoch": 2227} {"train_loss": -11.7612943649292, "global_step": 374252, "epoch": 2227} {"train_loss": -12.232189178466797, "global_step": 374253, "epoch": 2227} {"train_loss": -12.291881561279297, "global_step": 374254, "epoch": 2227} {"train_loss": -12.310972213745117, "global_step": 374255, "epoch": 2227} {"train_loss": -12.394251823425293, "global_step": 374256, "epoch": 2227} {"train_loss": -12.295767784118652, "global_step": 374257, "epoch": 2227} {"train_loss": -12.176987648010254, "global_step": 374258, "epoch": 2227} {"train_loss": -12.343884468078613, "global_step": 374259, "epoch": 2227} {"train_loss": -12.409008026123047, "global_step": 374260, "epoch": 2227} {"train_loss": -12.332880973815918, "global_step": 374261, "epoch": 2227} {"train_loss": -12.557465553283691, "global_step": 374262, "epoch": 2227} {"train_loss": -12.368206024169922, "global_step": 374263, "epoch": 2227} {"train_loss": -12.279342651367188, "global_step": 374264, "epoch": 2227} {"train_loss": -12.321830749511719, "global_step": 374265, "epoch": 2227} {"train_loss": -12.296152114868164, "global_step": 374266, "epoch": 2227} {"train_loss": -12.281837463378906, "global_step": 374267, "epoch": 2227} {"train_loss": -12.338605880737305, "global_step": 374268, "epoch": 2227} {"train_loss": -12.217573165893555, "global_step": 374269, "epoch": 2227} {"train_loss": -12.158411979675293, "global_step": 374270, "epoch": 2227} {"train_loss": -12.311158180236816, "global_step": 374271, "epoch": 2227} {"train_loss": -12.293296813964844, "global_step": 374272, "epoch": 2227} {"train_loss": -11.996614456176758, "global_step": 374273, "epoch": 2227} {"train_loss": -12.098634719848633, "global_step": 374274, "epoch": 2227} {"train_loss": -12.122461318969727, "global_step": 374275, "epoch": 2227} {"train_loss": -12.42332649230957, "global_step": 374276, "epoch": 2227} {"train_loss": -12.082801818847656, "global_step": 374277, "epoch": 2227} {"train_loss": -12.415021896362305, "global_step": 374278, "epoch": 2227} {"train_loss": -12.021883010864258, "global_step": 374279, "epoch": 2227} {"train_loss": -12.166502952575684, "global_step": 374280, "epoch": 2227} {"train_loss": -12.417935371398926, "global_step": 374281, "epoch": 2227} {"train_loss": -12.175264358520508, "global_step": 374282, "epoch": 2227} {"train_loss": -12.15779972076416, "global_step": 374283, "epoch": 2227} {"train_loss": -12.250057220458984, "global_step": 374284, "epoch": 2227} {"train_loss": -12.60899829864502, "global_step": 374285, "epoch": 2227} {"train_loss": -12.306964874267578, "global_step": 374286, "epoch": 2227} {"train_loss": -12.490816116333008, "global_step": 374287, "epoch": 2227} {"train_loss": -12.350029945373535, "global_step": 374288, "epoch": 2227} {"train_loss": -12.744863510131836, "global_step": 374289, "epoch": 2227} {"train_loss": -12.215158462524414, "global_step": 374290, "epoch": 2227} {"train_loss": -12.099206924438477, "global_step": 374291, "epoch": 2227} {"train_loss": -12.281436920166016, "global_step": 374292, "epoch": 2227} {"train_loss": -12.573844909667969, "global_step": 374293, "epoch": 2227} {"train_loss": -12.215688705444336, "global_step": 374294, "epoch": 2227} {"train_loss": -12.379478454589844, "global_step": 374295, "epoch": 2227} {"train_loss": -12.537073135375977, "global_step": 374296, "epoch": 2227} {"train_loss": -12.198089599609375, "global_step": 374297, "epoch": 2227} {"train_loss": -12.226499557495117, "global_step": 374298, "epoch": 2227} {"train_loss": -12.45566177368164, "global_step": 374299, "epoch": 2227} {"train_loss": -12.524742126464844, "global_step": 374300, "epoch": 2227} {"train_loss": -12.577466011047363, "global_step": 374301, "epoch": 2227} {"train_loss": -12.528946876525879, "global_step": 374302, "epoch": 2227} {"train_loss": -11.79919535773141, "global_step": 374303, "epoch": 2227, "val_loss": 291656.15625} {"train_loss": -12.484783172607422, "global_step": 374304, "epoch": 2228} {"train_loss": -12.566780090332031, "global_step": 374305, "epoch": 2228} {"train_loss": -12.460667610168457, "global_step": 374306, "epoch": 2228} {"train_loss": -12.850568771362305, "global_step": 374307, "epoch": 2228} {"train_loss": -12.632472038269043, "global_step": 374308, "epoch": 2228} {"train_loss": -12.765663146972656, "global_step": 374309, "epoch": 2228} {"train_loss": -12.371734619140625, "global_step": 374310, "epoch": 2228} {"train_loss": -12.22266960144043, "global_step": 374311, "epoch": 2228} {"train_loss": -12.609728813171387, "global_step": 374312, "epoch": 2228} {"train_loss": -12.32577133178711, "global_step": 374313, "epoch": 2228} {"train_loss": -12.140522956848145, "global_step": 374314, "epoch": 2228} {"train_loss": -11.646398544311523, "global_step": 374315, "epoch": 2228} {"train_loss": -12.660962104797363, "global_step": 374316, "epoch": 2228} {"train_loss": -12.16643238067627, "global_step": 374317, "epoch": 2228} {"train_loss": -11.96455192565918, "global_step": 374318, "epoch": 2228} {"train_loss": -12.504438400268555, "global_step": 374319, "epoch": 2228} {"train_loss": -12.317150115966797, "global_step": 374320, "epoch": 2228} {"train_loss": -12.07067584991455, "global_step": 374321, "epoch": 2228} {"train_loss": -12.499789237976074, "global_step": 374322, "epoch": 2228} {"train_loss": -12.44848918914795, "global_step": 374323, "epoch": 2228} {"train_loss": -12.34906005859375, "global_step": 374324, "epoch": 2228} {"train_loss": -11.55526065826416, "global_step": 374325, "epoch": 2228} {"train_loss": -12.287013053894043, "global_step": 374326, "epoch": 2228} {"train_loss": -12.411457061767578, "global_step": 374327, "epoch": 2228} {"train_loss": -12.431635856628418, "global_step": 374328, "epoch": 2228} {"train_loss": -12.24095344543457, "global_step": 374329, "epoch": 2228} {"train_loss": -12.562312126159668, "global_step": 374330, "epoch": 2228} {"train_loss": -12.439138412475586, "global_step": 374331, "epoch": 2228} {"train_loss": -12.843301773071289, "global_step": 374332, "epoch": 2228} {"train_loss": -12.458398818969727, "global_step": 374333, "epoch": 2228} {"train_loss": -12.469818115234375, "global_step": 374334, "epoch": 2228} {"train_loss": -12.746747970581055, "global_step": 374335, "epoch": 2228} {"train_loss": -12.478018760681152, "global_step": 374336, "epoch": 2228} {"train_loss": -12.367729187011719, "global_step": 374337, "epoch": 2228} {"train_loss": -12.448572158813477, "global_step": 374338, "epoch": 2228} {"train_loss": -12.367620468139648, "global_step": 374339, "epoch": 2228} {"train_loss": -12.313074111938477, "global_step": 374340, "epoch": 2228} {"train_loss": -12.111007690429688, "global_step": 374341, "epoch": 2228} {"train_loss": -11.952794075012207, "global_step": 374342, "epoch": 2228} {"train_loss": -11.603734016418457, "global_step": 374343, "epoch": 2228} {"train_loss": -12.12783145904541, "global_step": 374344, "epoch": 2228} {"train_loss": -11.141521453857422, "global_step": 374345, "epoch": 2228} {"train_loss": -11.57529067993164, "global_step": 374346, "epoch": 2228} {"train_loss": -10.905654907226562, "global_step": 374347, "epoch": 2228} {"train_loss": -11.864452362060547, "global_step": 374348, "epoch": 2228} {"train_loss": -10.946260452270508, "global_step": 374349, "epoch": 2228} {"train_loss": -11.572999954223633, "global_step": 374350, "epoch": 2228} {"train_loss": -10.616857528686523, "global_step": 374351, "epoch": 2228} {"train_loss": -11.532174110412598, "global_step": 374352, "epoch": 2228} {"train_loss": -11.777559280395508, "global_step": 374353, "epoch": 2228} {"train_loss": -11.077529907226562, "global_step": 374354, "epoch": 2228} {"train_loss": -11.373300552368164, "global_step": 374355, "epoch": 2228} {"train_loss": -11.608536720275879, "global_step": 374356, "epoch": 2228} {"train_loss": -12.043392181396484, "global_step": 374357, "epoch": 2228} {"train_loss": -11.087437629699707, "global_step": 374358, "epoch": 2228} {"train_loss": -11.791022300720215, "global_step": 374359, "epoch": 2228} {"train_loss": -12.06233024597168, "global_step": 374360, "epoch": 2228} {"train_loss": -11.524200439453125, "global_step": 374361, "epoch": 2228} {"train_loss": -11.36024284362793, "global_step": 374362, "epoch": 2228} {"train_loss": -11.679567337036133, "global_step": 374363, "epoch": 2228} {"train_loss": -11.704124450683594, "global_step": 374364, "epoch": 2228} {"train_loss": -12.008658409118652, "global_step": 374365, "epoch": 2228} {"train_loss": -12.191627502441406, "global_step": 374366, "epoch": 2228} {"train_loss": -12.057515144348145, "global_step": 374367, "epoch": 2228} {"train_loss": -12.017183303833008, "global_step": 374368, "epoch": 2228} {"train_loss": -11.968183517456055, "global_step": 374369, "epoch": 2228} {"train_loss": -11.069161415100098, "global_step": 374370, "epoch": 2228} {"train_loss": -12.038182258605957, "global_step": 374371, "epoch": 2228} {"train_loss": -12.36056137084961, "global_step": 374372, "epoch": 2228} {"train_loss": -11.102666854858398, "global_step": 374373, "epoch": 2228} {"train_loss": -11.586860656738281, "global_step": 374374, "epoch": 2228} {"train_loss": -12.29164981842041, "global_step": 374375, "epoch": 2228} {"train_loss": -11.417549133300781, "global_step": 374376, "epoch": 2228} {"train_loss": -12.25554370880127, "global_step": 374377, "epoch": 2228} {"train_loss": -11.93277645111084, "global_step": 374378, "epoch": 2228} {"train_loss": -11.778541564941406, "global_step": 374379, "epoch": 2228} {"train_loss": -12.326972007751465, "global_step": 374380, "epoch": 2228} {"train_loss": -11.885693550109863, "global_step": 374381, "epoch": 2228} {"train_loss": -12.039360046386719, "global_step": 374382, "epoch": 2228} {"train_loss": -12.1845703125, "global_step": 374383, "epoch": 2228} {"train_loss": -11.75076675415039, "global_step": 374384, "epoch": 2228} {"train_loss": -12.099010467529297, "global_step": 374385, "epoch": 2228} {"train_loss": -11.810483932495117, "global_step": 374386, "epoch": 2228} {"train_loss": -11.033868789672852, "global_step": 374387, "epoch": 2228} {"train_loss": -12.166763305664062, "global_step": 374388, "epoch": 2228} {"train_loss": -12.435789108276367, "global_step": 374389, "epoch": 2228} {"train_loss": -12.269033432006836, "global_step": 374390, "epoch": 2228} {"train_loss": -12.602346420288086, "global_step": 374391, "epoch": 2228} {"train_loss": -12.313713073730469, "global_step": 374392, "epoch": 2228} {"train_loss": -12.196914672851562, "global_step": 374393, "epoch": 2228} {"train_loss": -12.47085952758789, "global_step": 374394, "epoch": 2228} {"train_loss": -12.020416259765625, "global_step": 374395, "epoch": 2228} {"train_loss": -11.684133529663086, "global_step": 374396, "epoch": 2228} {"train_loss": -12.245458602905273, "global_step": 374397, "epoch": 2228} {"train_loss": -11.895410537719727, "global_step": 374398, "epoch": 2228} {"train_loss": -11.893621444702148, "global_step": 374399, "epoch": 2228} {"train_loss": -11.938650131225586, "global_step": 374400, "epoch": 2228} {"train_loss": -12.194509506225586, "global_step": 374401, "epoch": 2228} {"train_loss": -11.777793884277344, "global_step": 374402, "epoch": 2228} {"train_loss": -12.022994995117188, "global_step": 374403, "epoch": 2228} {"train_loss": -12.36262035369873, "global_step": 374404, "epoch": 2228} {"train_loss": -11.352643013000488, "global_step": 374405, "epoch": 2228} {"train_loss": -11.065706253051758, "global_step": 374406, "epoch": 2228} {"train_loss": -12.251043319702148, "global_step": 374407, "epoch": 2228} {"train_loss": -11.560818672180176, "global_step": 374408, "epoch": 2228} {"train_loss": -11.381792068481445, "global_step": 374409, "epoch": 2228} {"train_loss": -12.05154800415039, "global_step": 374410, "epoch": 2228} {"train_loss": -11.690607070922852, "global_step": 374411, "epoch": 2228} {"train_loss": -11.402569770812988, "global_step": 374412, "epoch": 2228} {"train_loss": -12.144716262817383, "global_step": 374413, "epoch": 2228} {"train_loss": -11.931665420532227, "global_step": 374414, "epoch": 2228} {"train_loss": -11.458147048950195, "global_step": 374415, "epoch": 2228} {"train_loss": -11.795282363891602, "global_step": 374416, "epoch": 2228} {"train_loss": -12.175657272338867, "global_step": 374417, "epoch": 2228} {"train_loss": -11.628727912902832, "global_step": 374418, "epoch": 2228} {"train_loss": -12.5071439743042, "global_step": 374419, "epoch": 2228} {"train_loss": -11.993094444274902, "global_step": 374420, "epoch": 2228} {"train_loss": -11.946533203125, "global_step": 374421, "epoch": 2228} {"train_loss": -12.262327194213867, "global_step": 374422, "epoch": 2228} {"train_loss": -12.045019149780273, "global_step": 374423, "epoch": 2228} {"train_loss": -11.917319297790527, "global_step": 374424, "epoch": 2228} {"train_loss": -12.602113723754883, "global_step": 374425, "epoch": 2228} {"train_loss": -11.995589256286621, "global_step": 374426, "epoch": 2228} {"train_loss": -12.314157485961914, "global_step": 374427, "epoch": 2228} {"train_loss": -12.25640869140625, "global_step": 374428, "epoch": 2228} {"train_loss": -11.99795150756836, "global_step": 374429, "epoch": 2228} {"train_loss": -12.164958953857422, "global_step": 374430, "epoch": 2228} {"train_loss": -12.297325134277344, "global_step": 374431, "epoch": 2228} {"train_loss": -11.427515029907227, "global_step": 374432, "epoch": 2228} {"train_loss": -12.279983520507812, "global_step": 374433, "epoch": 2228} {"train_loss": -11.892729759216309, "global_step": 374434, "epoch": 2228} {"train_loss": -11.898316383361816, "global_step": 374435, "epoch": 2228} {"train_loss": -12.30091667175293, "global_step": 374436, "epoch": 2228} {"train_loss": -11.196491241455078, "global_step": 374437, "epoch": 2228} {"train_loss": -11.770539283752441, "global_step": 374438, "epoch": 2228} {"train_loss": -11.995514869689941, "global_step": 374439, "epoch": 2228} {"train_loss": -10.968610763549805, "global_step": 374440, "epoch": 2228} {"train_loss": -12.499320030212402, "global_step": 374441, "epoch": 2228} {"train_loss": -11.776118278503418, "global_step": 374442, "epoch": 2228} {"train_loss": -12.338081359863281, "global_step": 374443, "epoch": 2228} {"train_loss": -11.881790161132812, "global_step": 374444, "epoch": 2228} {"train_loss": -11.871971130371094, "global_step": 374445, "epoch": 2228} {"train_loss": -12.494959831237793, "global_step": 374446, "epoch": 2228} {"train_loss": -12.077094078063965, "global_step": 374447, "epoch": 2228} {"train_loss": -12.254470825195312, "global_step": 374448, "epoch": 2228} {"train_loss": -12.25997543334961, "global_step": 374449, "epoch": 2228} {"train_loss": -12.158356666564941, "global_step": 374450, "epoch": 2228} {"train_loss": -12.471517562866211, "global_step": 374451, "epoch": 2228} {"train_loss": -11.996612548828125, "global_step": 374452, "epoch": 2228} {"train_loss": -12.204754829406738, "global_step": 374453, "epoch": 2228} {"train_loss": -12.483592987060547, "global_step": 374454, "epoch": 2228} {"train_loss": -12.19096565246582, "global_step": 374455, "epoch": 2228} {"train_loss": -12.418028831481934, "global_step": 374456, "epoch": 2228} {"train_loss": -12.315286636352539, "global_step": 374457, "epoch": 2228} {"train_loss": -12.31783676147461, "global_step": 374458, "epoch": 2228} {"train_loss": -12.453300476074219, "global_step": 374459, "epoch": 2228} {"train_loss": -11.900941848754883, "global_step": 374460, "epoch": 2228} {"train_loss": -12.214788436889648, "global_step": 374461, "epoch": 2228} {"train_loss": -11.824626922607422, "global_step": 374462, "epoch": 2228} {"train_loss": -11.358362197875977, "global_step": 374463, "epoch": 2228} {"train_loss": -12.388753890991211, "global_step": 374464, "epoch": 2228} {"train_loss": -11.42548656463623, "global_step": 374465, "epoch": 2228} {"train_loss": -12.072397232055664, "global_step": 374466, "epoch": 2228} {"train_loss": -12.155056953430176, "global_step": 374467, "epoch": 2228} {"train_loss": -11.426584243774414, "global_step": 374468, "epoch": 2228} {"train_loss": -12.380441665649414, "global_step": 374469, "epoch": 2228} {"train_loss": -11.393320083618164, "global_step": 374470, "epoch": 2228} {"train_loss": -12.013838092486063, "global_step": 374471, "epoch": 2228, "val_loss": 292094.46875} {"train_loss": -11.66864013671875, "global_step": 374472, "epoch": 2229} {"train_loss": -11.430534362792969, "global_step": 374473, "epoch": 2229} {"train_loss": -12.18733024597168, "global_step": 374474, "epoch": 2229} {"train_loss": -11.835466384887695, "global_step": 374475, "epoch": 2229} {"train_loss": -11.466583251953125, "global_step": 374476, "epoch": 2229} {"train_loss": -11.817268371582031, "global_step": 374477, "epoch": 2229} {"train_loss": -10.293198585510254, "global_step": 374478, "epoch": 2229} {"train_loss": -11.767579078674316, "global_step": 374479, "epoch": 2229} {"train_loss": -11.072126388549805, "global_step": 374480, "epoch": 2229} {"train_loss": -11.62973403930664, "global_step": 374481, "epoch": 2229} {"train_loss": -11.05653190612793, "global_step": 374482, "epoch": 2229} {"train_loss": -11.196911811828613, "global_step": 374483, "epoch": 2229} {"train_loss": -11.529236793518066, "global_step": 374484, "epoch": 2229} {"train_loss": -11.470475196838379, "global_step": 374485, "epoch": 2229} {"train_loss": -12.113861083984375, "global_step": 374486, "epoch": 2229} {"train_loss": -11.194784164428711, "global_step": 374487, "epoch": 2229} {"train_loss": -11.203359603881836, "global_step": 374488, "epoch": 2229} {"train_loss": -11.804676055908203, "global_step": 374489, "epoch": 2229} {"train_loss": -10.600442886352539, "global_step": 374490, "epoch": 2229} {"train_loss": -12.1338529586792, "global_step": 374491, "epoch": 2229} {"train_loss": -11.004201889038086, "global_step": 374492, "epoch": 2229} {"train_loss": -11.78542709350586, "global_step": 374493, "epoch": 2229} {"train_loss": -11.617588996887207, "global_step": 374494, "epoch": 2229} {"train_loss": -12.120355606079102, "global_step": 374495, "epoch": 2229} {"train_loss": -11.93392276763916, "global_step": 374496, "epoch": 2229} {"train_loss": -12.19295597076416, "global_step": 374497, "epoch": 2229} {"train_loss": -12.08005142211914, "global_step": 374498, "epoch": 2229} {"train_loss": -12.098764419555664, "global_step": 374499, "epoch": 2229} {"train_loss": -12.213872909545898, "global_step": 374500, "epoch": 2229} {"train_loss": -12.116606712341309, "global_step": 374501, "epoch": 2229} {"train_loss": -12.16320514678955, "global_step": 374502, "epoch": 2229} {"train_loss": -12.155606269836426, "global_step": 374503, "epoch": 2229} {"train_loss": -12.248781204223633, "global_step": 374504, "epoch": 2229} {"train_loss": -11.726736068725586, "global_step": 374505, "epoch": 2229} {"train_loss": -12.636512756347656, "global_step": 374506, "epoch": 2229} {"train_loss": -12.604278564453125, "global_step": 374507, "epoch": 2229} {"train_loss": -12.406214714050293, "global_step": 374508, "epoch": 2229} {"train_loss": -12.222429275512695, "global_step": 374509, "epoch": 2229} {"train_loss": -12.220681190490723, "global_step": 374510, "epoch": 2229} {"train_loss": -12.30258846282959, "global_step": 374511, "epoch": 2229} {"train_loss": -11.749883651733398, "global_step": 374512, "epoch": 2229} {"train_loss": -12.433393478393555, "global_step": 374513, "epoch": 2229} {"train_loss": -12.153039932250977, "global_step": 374514, "epoch": 2229} {"train_loss": -12.348165512084961, "global_step": 374515, "epoch": 2229} {"train_loss": -12.154918670654297, "global_step": 374516, "epoch": 2229} {"train_loss": -12.31540584564209, "global_step": 374517, "epoch": 2229} {"train_loss": -12.180338859558105, "global_step": 374518, "epoch": 2229} {"train_loss": -12.368525505065918, "global_step": 374519, "epoch": 2229} {"train_loss": -12.02423095703125, "global_step": 374520, "epoch": 2229} {"train_loss": -12.274752616882324, "global_step": 374521, "epoch": 2229} {"train_loss": -12.444892883300781, "global_step": 374522, "epoch": 2229} {"train_loss": -12.627634048461914, "global_step": 374523, "epoch": 2229} {"train_loss": -12.179929733276367, "global_step": 374524, "epoch": 2229} {"train_loss": -12.339080810546875, "global_step": 374525, "epoch": 2229} {"train_loss": -11.796100616455078, "global_step": 374526, "epoch": 2229} {"train_loss": -12.028430938720703, "global_step": 374527, "epoch": 2229} {"train_loss": -11.87479305267334, "global_step": 374528, "epoch": 2229} {"train_loss": -12.449710845947266, "global_step": 374529, "epoch": 2229} {"train_loss": -11.784433364868164, "global_step": 374530, "epoch": 2229} {"train_loss": -12.230148315429688, "global_step": 374531, "epoch": 2229} {"train_loss": -12.003097534179688, "global_step": 374532, "epoch": 2229} {"train_loss": -12.297714233398438, "global_step": 374533, "epoch": 2229} {"train_loss": -11.626508712768555, "global_step": 374534, "epoch": 2229} {"train_loss": -12.137462615966797, "global_step": 374535, "epoch": 2229} {"train_loss": -12.481629371643066, "global_step": 374536, "epoch": 2229} {"train_loss": -11.236610412597656, "global_step": 374537, "epoch": 2229} {"train_loss": -12.509342193603516, "global_step": 374538, "epoch": 2229} {"train_loss": -11.536521911621094, "global_step": 374539, "epoch": 2229} {"train_loss": -11.870588302612305, "global_step": 374540, "epoch": 2229} {"train_loss": -12.208221435546875, "global_step": 374541, "epoch": 2229} {"train_loss": -11.797220230102539, "global_step": 374542, "epoch": 2229} {"train_loss": -12.159303665161133, "global_step": 374543, "epoch": 2229} {"train_loss": -11.680899620056152, "global_step": 374544, "epoch": 2229} {"train_loss": -11.778305053710938, "global_step": 374545, "epoch": 2229} {"train_loss": -11.531806945800781, "global_step": 374546, "epoch": 2229} {"train_loss": -11.992973327636719, "global_step": 374547, "epoch": 2229} {"train_loss": -10.54440689086914, "global_step": 374548, "epoch": 2229} {"train_loss": -12.424137115478516, "global_step": 374549, "epoch": 2229} {"train_loss": -11.324499130249023, "global_step": 374550, "epoch": 2229} {"train_loss": -11.398918151855469, "global_step": 374551, "epoch": 2229} {"train_loss": -12.105960845947266, "global_step": 374552, "epoch": 2229} {"train_loss": -11.854836463928223, "global_step": 374553, "epoch": 2229} {"train_loss": -12.320524215698242, "global_step": 374554, "epoch": 2229} {"train_loss": -11.587162017822266, "global_step": 374555, "epoch": 2229} {"train_loss": -12.22024917602539, "global_step": 374556, "epoch": 2229} {"train_loss": -12.060161590576172, "global_step": 374557, "epoch": 2229} {"train_loss": -11.917047500610352, "global_step": 374558, "epoch": 2229} {"train_loss": -11.811641693115234, "global_step": 374559, "epoch": 2229} {"train_loss": -11.852750778198242, "global_step": 374560, "epoch": 2229} {"train_loss": -12.305063247680664, "global_step": 374561, "epoch": 2229} {"train_loss": -12.077642440795898, "global_step": 374562, "epoch": 2229} {"train_loss": -12.181854248046875, "global_step": 374563, "epoch": 2229} {"train_loss": -11.97746753692627, "global_step": 374564, "epoch": 2229} {"train_loss": -11.957719802856445, "global_step": 374565, "epoch": 2229} {"train_loss": -11.911996841430664, "global_step": 374566, "epoch": 2229} {"train_loss": -11.541913986206055, "global_step": 374567, "epoch": 2229} {"train_loss": -11.976000785827637, "global_step": 374568, "epoch": 2229} {"train_loss": -12.148763656616211, "global_step": 374569, "epoch": 2229} {"train_loss": -11.648027420043945, "global_step": 374570, "epoch": 2229} {"train_loss": -12.249410629272461, "global_step": 374571, "epoch": 2229} {"train_loss": -12.12857437133789, "global_step": 374572, "epoch": 2229} {"train_loss": -12.027313232421875, "global_step": 374573, "epoch": 2229} {"train_loss": -12.257829666137695, "global_step": 374574, "epoch": 2229} {"train_loss": -11.737937927246094, "global_step": 374575, "epoch": 2229} {"train_loss": -11.828567504882812, "global_step": 374576, "epoch": 2229} {"train_loss": -12.08863639831543, "global_step": 374577, "epoch": 2229} {"train_loss": -12.311053276062012, "global_step": 374578, "epoch": 2229} {"train_loss": -12.017251968383789, "global_step": 374579, "epoch": 2229} {"train_loss": -12.404258728027344, "global_step": 374580, "epoch": 2229} {"train_loss": -11.945470809936523, "global_step": 374581, "epoch": 2229} {"train_loss": -12.468053817749023, "global_step": 374582, "epoch": 2229} {"train_loss": -11.724392890930176, "global_step": 374583, "epoch": 2229} {"train_loss": -12.220806121826172, "global_step": 374584, "epoch": 2229} {"train_loss": -12.328096389770508, "global_step": 374585, "epoch": 2229} {"train_loss": -12.41168212890625, "global_step": 374586, "epoch": 2229} {"train_loss": -12.40641975402832, "global_step": 374587, "epoch": 2229} {"train_loss": -12.086536407470703, "global_step": 374588, "epoch": 2229} {"train_loss": -12.280599594116211, "global_step": 374589, "epoch": 2229} {"train_loss": -12.272125244140625, "global_step": 374590, "epoch": 2229} {"train_loss": -12.415029525756836, "global_step": 374591, "epoch": 2229} {"train_loss": -12.350045204162598, "global_step": 374592, "epoch": 2229} {"train_loss": -12.576175689697266, "global_step": 374593, "epoch": 2229} {"train_loss": -12.346981048583984, "global_step": 374594, "epoch": 2229} {"train_loss": -12.354707717895508, "global_step": 374595, "epoch": 2229} {"train_loss": -12.119630813598633, "global_step": 374596, "epoch": 2229} {"train_loss": -12.394908905029297, "global_step": 374597, "epoch": 2229} {"train_loss": -12.32042121887207, "global_step": 374598, "epoch": 2229} {"train_loss": -11.888246536254883, "global_step": 374599, "epoch": 2229} {"train_loss": -12.410409927368164, "global_step": 374600, "epoch": 2229} {"train_loss": -11.972381591796875, "global_step": 374601, "epoch": 2229} {"train_loss": -12.481285095214844, "global_step": 374602, "epoch": 2229} {"train_loss": -12.021455764770508, "global_step": 374603, "epoch": 2229} {"train_loss": -10.646589279174805, "global_step": 374604, "epoch": 2229} {"train_loss": -12.000747680664062, "global_step": 374605, "epoch": 2229} {"train_loss": -11.782959938049316, "global_step": 374606, "epoch": 2229} {"train_loss": -10.929418563842773, "global_step": 374607, "epoch": 2229} {"train_loss": -11.934290885925293, "global_step": 374608, "epoch": 2229} {"train_loss": -11.65239429473877, "global_step": 374609, "epoch": 2229} {"train_loss": -11.46514892578125, "global_step": 374610, "epoch": 2229} {"train_loss": -11.76607894897461, "global_step": 374611, "epoch": 2229} {"train_loss": -11.653602600097656, "global_step": 374612, "epoch": 2229} {"train_loss": -11.57584285736084, "global_step": 374613, "epoch": 2229} {"train_loss": -11.430702209472656, "global_step": 374614, "epoch": 2229} {"train_loss": -11.726686477661133, "global_step": 374615, "epoch": 2229} {"train_loss": -11.200490951538086, "global_step": 374616, "epoch": 2229} {"train_loss": -11.751921653747559, "global_step": 374617, "epoch": 2229} {"train_loss": -11.800568580627441, "global_step": 374618, "epoch": 2229} {"train_loss": -11.418503761291504, "global_step": 374619, "epoch": 2229} {"train_loss": -12.170356750488281, "global_step": 374620, "epoch": 2229} {"train_loss": -11.290702819824219, "global_step": 374621, "epoch": 2229} {"train_loss": -12.167240142822266, "global_step": 374622, "epoch": 2229} {"train_loss": -12.036760330200195, "global_step": 374623, "epoch": 2229} {"train_loss": -12.178289413452148, "global_step": 374624, "epoch": 2229} {"train_loss": -12.227606773376465, "global_step": 374625, "epoch": 2229} {"train_loss": -11.877363204956055, "global_step": 374626, "epoch": 2229} {"train_loss": -12.033836364746094, "global_step": 374627, "epoch": 2229} {"train_loss": -12.21837329864502, "global_step": 374628, "epoch": 2229} {"train_loss": -12.321528434753418, "global_step": 374629, "epoch": 2229} {"train_loss": -12.074313163757324, "global_step": 374630, "epoch": 2229} {"train_loss": -12.383362770080566, "global_step": 374631, "epoch": 2229} {"train_loss": -12.073883056640625, "global_step": 374632, "epoch": 2229} {"train_loss": -12.594219207763672, "global_step": 374633, "epoch": 2229} {"train_loss": -12.081855773925781, "global_step": 374634, "epoch": 2229} {"train_loss": -12.22779655456543, "global_step": 374635, "epoch": 2229} {"train_loss": -12.294840812683105, "global_step": 374636, "epoch": 2229} {"train_loss": -12.311800003051758, "global_step": 374637, "epoch": 2229} {"train_loss": -12.663270950317383, "global_step": 374638, "epoch": 2229} {"train_loss": -11.964376773153033, "global_step": 374639, "epoch": 2229, "val_loss": 295371.59375} {"train_loss": -12.526897430419922, "global_step": 374640, "epoch": 2230} {"train_loss": -12.140997886657715, "global_step": 374641, "epoch": 2230} {"train_loss": -12.352615356445312, "global_step": 374642, "epoch": 2230} {"train_loss": -12.296077728271484, "global_step": 374643, "epoch": 2230} {"train_loss": -11.911209106445312, "global_step": 374644, "epoch": 2230} {"train_loss": -12.264297485351562, "global_step": 374645, "epoch": 2230} {"train_loss": -11.861858367919922, "global_step": 374646, "epoch": 2230} {"train_loss": -12.43934440612793, "global_step": 374647, "epoch": 2230} {"train_loss": -11.521614074707031, "global_step": 374648, "epoch": 2230} {"train_loss": -12.18636703491211, "global_step": 374649, "epoch": 2230} {"train_loss": -12.049312591552734, "global_step": 374650, "epoch": 2230} {"train_loss": -11.845491409301758, "global_step": 374651, "epoch": 2230} {"train_loss": -12.478780746459961, "global_step": 374652, "epoch": 2230} {"train_loss": -11.509544372558594, "global_step": 374653, "epoch": 2230} {"train_loss": -11.583126068115234, "global_step": 374654, "epoch": 2230} {"train_loss": -11.17343521118164, "global_step": 374655, "epoch": 2230} {"train_loss": -12.281078338623047, "global_step": 374656, "epoch": 2230} {"train_loss": -11.10713005065918, "global_step": 374657, "epoch": 2230} {"train_loss": -11.182005882263184, "global_step": 374658, "epoch": 2230} {"train_loss": -12.041769027709961, "global_step": 374659, "epoch": 2230} {"train_loss": -12.238046646118164, "global_step": 374660, "epoch": 2230} {"train_loss": -11.400938034057617, "global_step": 374661, "epoch": 2230} {"train_loss": -12.398937225341797, "global_step": 374662, "epoch": 2230} {"train_loss": -11.646860122680664, "global_step": 374663, "epoch": 2230} {"train_loss": -11.843246459960938, "global_step": 374664, "epoch": 2230} {"train_loss": -11.967192649841309, "global_step": 374665, "epoch": 2230} {"train_loss": -12.183141708374023, "global_step": 374666, "epoch": 2230} {"train_loss": -12.055354118347168, "global_step": 374667, "epoch": 2230} {"train_loss": -12.323084831237793, "global_step": 374668, "epoch": 2230} {"train_loss": -12.181241989135742, "global_step": 374669, "epoch": 2230} {"train_loss": -12.324628829956055, "global_step": 374670, "epoch": 2230} {"train_loss": -12.357630729675293, "global_step": 374671, "epoch": 2230} {"train_loss": -12.291461944580078, "global_step": 374672, "epoch": 2230} {"train_loss": -12.418218612670898, "global_step": 374673, "epoch": 2230} {"train_loss": -12.239639282226562, "global_step": 374674, "epoch": 2230} {"train_loss": -12.122002601623535, "global_step": 374675, "epoch": 2230} {"train_loss": -12.284406661987305, "global_step": 374676, "epoch": 2230} {"train_loss": -12.356794357299805, "global_step": 374677, "epoch": 2230} {"train_loss": -12.400870323181152, "global_step": 374678, "epoch": 2230} {"train_loss": -12.328685760498047, "global_step": 374679, "epoch": 2230} {"train_loss": -12.458307266235352, "global_step": 374680, "epoch": 2230} {"train_loss": -12.38905143737793, "global_step": 374681, "epoch": 2230} {"train_loss": -12.502988815307617, "global_step": 374682, "epoch": 2230} {"train_loss": -12.42831802368164, "global_step": 374683, "epoch": 2230} {"train_loss": -12.262262344360352, "global_step": 374684, "epoch": 2230} {"train_loss": -12.591742515563965, "global_step": 374685, "epoch": 2230} {"train_loss": -12.49381160736084, "global_step": 374686, "epoch": 2230} {"train_loss": -12.516075134277344, "global_step": 374687, "epoch": 2230} {"train_loss": -12.434170722961426, "global_step": 374688, "epoch": 2230} {"train_loss": -12.703496932983398, "global_step": 374689, "epoch": 2230} {"train_loss": -12.307001113891602, "global_step": 374690, "epoch": 2230} {"train_loss": -12.634865760803223, "global_step": 374691, "epoch": 2230} {"train_loss": -12.613516807556152, "global_step": 374692, "epoch": 2230} {"train_loss": -12.6647310256958, "global_step": 374693, "epoch": 2230} {"train_loss": -12.621800422668457, "global_step": 374694, "epoch": 2230} {"train_loss": -12.609024047851562, "global_step": 374695, "epoch": 2230} {"train_loss": -12.689390182495117, "global_step": 374696, "epoch": 2230} {"train_loss": -12.814525604248047, "global_step": 374697, "epoch": 2230} {"train_loss": -12.611482620239258, "global_step": 374698, "epoch": 2230} {"train_loss": -12.675764083862305, "global_step": 374699, "epoch": 2230} {"train_loss": -12.919307708740234, "global_step": 374700, "epoch": 2230} {"train_loss": -12.64157485961914, "global_step": 374701, "epoch": 2230} {"train_loss": -12.54880142211914, "global_step": 374702, "epoch": 2230} {"train_loss": -12.846855163574219, "global_step": 374703, "epoch": 2230} {"train_loss": -12.753259658813477, "global_step": 374704, "epoch": 2230} {"train_loss": -12.640092849731445, "global_step": 374705, "epoch": 2230} {"train_loss": -12.564567565917969, "global_step": 374706, "epoch": 2230} {"train_loss": -12.660406112670898, "global_step": 374707, "epoch": 2230} {"train_loss": -12.535600662231445, "global_step": 374708, "epoch": 2230} {"train_loss": -12.602261543273926, "global_step": 374709, "epoch": 2230} {"train_loss": -12.823493003845215, "global_step": 374710, "epoch": 2230} {"train_loss": -12.22213077545166, "global_step": 374711, "epoch": 2230} {"train_loss": -12.611939430236816, "global_step": 374712, "epoch": 2230} {"train_loss": -12.45151138305664, "global_step": 374713, "epoch": 2230} {"train_loss": -11.970492362976074, "global_step": 374714, "epoch": 2230} {"train_loss": -12.26573371887207, "global_step": 374715, "epoch": 2230} {"train_loss": -11.13372802734375, "global_step": 374716, "epoch": 2230} {"train_loss": -12.452999114990234, "global_step": 374717, "epoch": 2230} {"train_loss": -10.438249588012695, "global_step": 374718, "epoch": 2230} {"train_loss": -10.213508605957031, "global_step": 374719, "epoch": 2230} {"train_loss": -9.347206115722656, "global_step": 374720, "epoch": 2230} {"train_loss": -9.664173126220703, "global_step": 374721, "epoch": 2230} {"train_loss": -9.907918930053711, "global_step": 374722, "epoch": 2230} {"train_loss": -9.183781623840332, "global_step": 374723, "epoch": 2230} {"train_loss": -7.576038360595703, "global_step": 374724, "epoch": 2230} {"train_loss": -6.875125408172607, "global_step": 374725, "epoch": 2230} {"train_loss": -8.27629566192627, "global_step": 374726, "epoch": 2230} {"train_loss": -9.107574462890625, "global_step": 374727, "epoch": 2230} {"train_loss": -8.496772766113281, "global_step": 374728, "epoch": 2230} {"train_loss": -8.88808822631836, "global_step": 374729, "epoch": 2230} {"train_loss": -8.946863174438477, "global_step": 374730, "epoch": 2230} {"train_loss": -7.939877510070801, "global_step": 374731, "epoch": 2230} {"train_loss": -7.735706329345703, "global_step": 374732, "epoch": 2230} {"train_loss": -8.134833335876465, "global_step": 374733, "epoch": 2230} {"train_loss": -8.777154922485352, "global_step": 374734, "epoch": 2230} {"train_loss": -10.229766845703125, "global_step": 374735, "epoch": 2230} {"train_loss": -9.078229904174805, "global_step": 374736, "epoch": 2230} {"train_loss": -9.115798950195312, "global_step": 374737, "epoch": 2230} {"train_loss": -10.07233715057373, "global_step": 374738, "epoch": 2230} {"train_loss": -9.127037048339844, "global_step": 374739, "epoch": 2230} {"train_loss": -8.163140296936035, "global_step": 374740, "epoch": 2230} {"train_loss": -9.241193771362305, "global_step": 374741, "epoch": 2230} {"train_loss": -9.672527313232422, "global_step": 374742, "epoch": 2230} {"train_loss": -10.205294609069824, "global_step": 374743, "epoch": 2230} {"train_loss": -9.293601989746094, "global_step": 374744, "epoch": 2230} {"train_loss": -10.767135620117188, "global_step": 374745, "epoch": 2230} {"train_loss": -9.793338775634766, "global_step": 374746, "epoch": 2230} {"train_loss": -10.85621452331543, "global_step": 374747, "epoch": 2230} {"train_loss": -11.322108268737793, "global_step": 374748, "epoch": 2230} {"train_loss": -10.526033401489258, "global_step": 374749, "epoch": 2230} {"train_loss": -11.14820384979248, "global_step": 374750, "epoch": 2230} {"train_loss": -10.870757102966309, "global_step": 374751, "epoch": 2230} {"train_loss": -11.192071914672852, "global_step": 374752, "epoch": 2230} {"train_loss": -11.283459663391113, "global_step": 374753, "epoch": 2230} {"train_loss": -11.662031173706055, "global_step": 374754, "epoch": 2230} {"train_loss": -11.815107345581055, "global_step": 374755, "epoch": 2230} {"train_loss": -11.703376770019531, "global_step": 374756, "epoch": 2230} {"train_loss": -11.499519348144531, "global_step": 374757, "epoch": 2230} {"train_loss": -11.48122787475586, "global_step": 374758, "epoch": 2230} {"train_loss": -11.871856689453125, "global_step": 374759, "epoch": 2230} {"train_loss": -11.76209831237793, "global_step": 374760, "epoch": 2230} {"train_loss": -11.909798622131348, "global_step": 374761, "epoch": 2230} {"train_loss": -11.890214920043945, "global_step": 374762, "epoch": 2230} {"train_loss": -11.775297164916992, "global_step": 374763, "epoch": 2230} {"train_loss": -12.00993824005127, "global_step": 374764, "epoch": 2230} {"train_loss": -11.952324867248535, "global_step": 374765, "epoch": 2230} {"train_loss": -11.83814811706543, "global_step": 374766, "epoch": 2230} {"train_loss": -12.00639820098877, "global_step": 374767, "epoch": 2230} {"train_loss": -11.821111679077148, "global_step": 374768, "epoch": 2230} {"train_loss": -12.116358757019043, "global_step": 374769, "epoch": 2230} {"train_loss": -11.856363296508789, "global_step": 374770, "epoch": 2230} {"train_loss": -12.196815490722656, "global_step": 374771, "epoch": 2230} {"train_loss": -12.151602745056152, "global_step": 374772, "epoch": 2230} {"train_loss": -12.008362770080566, "global_step": 374773, "epoch": 2230} {"train_loss": -12.153730392456055, "global_step": 374774, "epoch": 2230} {"train_loss": -12.324605941772461, "global_step": 374775, "epoch": 2230} {"train_loss": -12.386157989501953, "global_step": 374776, "epoch": 2230} {"train_loss": -12.343870162963867, "global_step": 374777, "epoch": 2230} {"train_loss": -12.190092086791992, "global_step": 374778, "epoch": 2230} {"train_loss": -12.228100776672363, "global_step": 374779, "epoch": 2230} {"train_loss": -12.095161437988281, "global_step": 374780, "epoch": 2230} {"train_loss": -12.458104133605957, "global_step": 374781, "epoch": 2230} {"train_loss": -12.337778091430664, "global_step": 374782, "epoch": 2230} {"train_loss": -12.532405853271484, "global_step": 374783, "epoch": 2230} {"train_loss": -12.560508728027344, "global_step": 374784, "epoch": 2230} {"train_loss": -12.38920783996582, "global_step": 374785, "epoch": 2230} {"train_loss": -12.51854133605957, "global_step": 374786, "epoch": 2230} {"train_loss": -12.415019989013672, "global_step": 374787, "epoch": 2230} {"train_loss": -12.428879737854004, "global_step": 374788, "epoch": 2230} {"train_loss": -12.365336418151855, "global_step": 374789, "epoch": 2230} {"train_loss": -12.53837776184082, "global_step": 374790, "epoch": 2230} {"train_loss": -12.391988754272461, "global_step": 374791, "epoch": 2230} {"train_loss": -12.548587799072266, "global_step": 374792, "epoch": 2230} {"train_loss": -12.535436630249023, "global_step": 374793, "epoch": 2230} {"train_loss": -12.495655059814453, "global_step": 374794, "epoch": 2230} {"train_loss": -12.65974235534668, "global_step": 374795, "epoch": 2230} {"train_loss": -12.486772537231445, "global_step": 374796, "epoch": 2230} {"train_loss": -12.632749557495117, "global_step": 374797, "epoch": 2230} {"train_loss": -12.378007888793945, "global_step": 374798, "epoch": 2230} {"train_loss": -12.412609100341797, "global_step": 374799, "epoch": 2230} {"train_loss": -12.332170486450195, "global_step": 374800, "epoch": 2230} {"train_loss": -12.439452171325684, "global_step": 374801, "epoch": 2230} {"train_loss": -12.626663208007812, "global_step": 374802, "epoch": 2230} {"train_loss": -12.700775146484375, "global_step": 374803, "epoch": 2230} {"train_loss": -12.468488693237305, "global_step": 374804, "epoch": 2230} {"train_loss": -12.728851318359375, "global_step": 374805, "epoch": 2230} {"train_loss": -12.544708251953125, "global_step": 374806, "epoch": 2230} {"train_loss": -11.666630253905343, "global_step": 374807, "epoch": 2230, "val_loss": 292218.90625, "train_action_mse_error": 1.6336913108825684} {"train_loss": -12.61270523071289, "global_step": 374808, "epoch": 2231} {"train_loss": -12.647015571594238, "global_step": 374809, "epoch": 2231} {"train_loss": -12.580013275146484, "global_step": 374810, "epoch": 2231} {"train_loss": -12.79885196685791, "global_step": 374811, "epoch": 2231} {"train_loss": -12.630022048950195, "global_step": 374812, "epoch": 2231} {"train_loss": -12.542276382446289, "global_step": 374813, "epoch": 2231} {"train_loss": -12.684488296508789, "global_step": 374814, "epoch": 2231} {"train_loss": -12.662078857421875, "global_step": 374815, "epoch": 2231} {"train_loss": -12.566123962402344, "global_step": 374816, "epoch": 2231} {"train_loss": -12.57850170135498, "global_step": 374817, "epoch": 2231} {"train_loss": -12.522968292236328, "global_step": 374818, "epoch": 2231} {"train_loss": -12.24887466430664, "global_step": 374819, "epoch": 2231} {"train_loss": -12.786696434020996, "global_step": 374820, "epoch": 2231} {"train_loss": -12.363066673278809, "global_step": 374821, "epoch": 2231} {"train_loss": -12.672770500183105, "global_step": 374822, "epoch": 2231} {"train_loss": -12.506328582763672, "global_step": 374823, "epoch": 2231} {"train_loss": -12.482643127441406, "global_step": 374824, "epoch": 2231} {"train_loss": -12.466594696044922, "global_step": 374825, "epoch": 2231} {"train_loss": -12.686836242675781, "global_step": 374826, "epoch": 2231} {"train_loss": -12.613507270812988, "global_step": 374827, "epoch": 2231} {"train_loss": -12.826021194458008, "global_step": 374828, "epoch": 2231} {"train_loss": -12.539665222167969, "global_step": 374829, "epoch": 2231} {"train_loss": -12.829239845275879, "global_step": 374830, "epoch": 2231} {"train_loss": -12.822505950927734, "global_step": 374831, "epoch": 2231} {"train_loss": -12.980184555053711, "global_step": 374832, "epoch": 2231} {"train_loss": -12.642460823059082, "global_step": 374833, "epoch": 2231} {"train_loss": -12.373063087463379, "global_step": 374834, "epoch": 2231} {"train_loss": -12.58330249786377, "global_step": 374835, "epoch": 2231} {"train_loss": -12.382015228271484, "global_step": 374836, "epoch": 2231} {"train_loss": -12.328259468078613, "global_step": 374837, "epoch": 2231} {"train_loss": -12.743427276611328, "global_step": 374838, "epoch": 2231} {"train_loss": -12.768763542175293, "global_step": 374839, "epoch": 2231} {"train_loss": -12.50350570678711, "global_step": 374840, "epoch": 2231} {"train_loss": -12.541215896606445, "global_step": 374841, "epoch": 2231} {"train_loss": -12.863544464111328, "global_step": 374842, "epoch": 2231} {"train_loss": -12.484175682067871, "global_step": 374843, "epoch": 2231} {"train_loss": -12.725435256958008, "global_step": 374844, "epoch": 2231} {"train_loss": -12.622052192687988, "global_step": 374845, "epoch": 2231} {"train_loss": -11.955849647521973, "global_step": 374846, "epoch": 2231} {"train_loss": -11.667348861694336, "global_step": 374847, "epoch": 2231} {"train_loss": -11.181684494018555, "global_step": 374848, "epoch": 2231} {"train_loss": -11.34732437133789, "global_step": 374849, "epoch": 2231} {"train_loss": -12.242878913879395, "global_step": 374850, "epoch": 2231} {"train_loss": -12.576150894165039, "global_step": 374851, "epoch": 2231} {"train_loss": -11.751751899719238, "global_step": 374852, "epoch": 2231} {"train_loss": -10.004463195800781, "global_step": 374853, "epoch": 2231} {"train_loss": -11.123008728027344, "global_step": 374854, "epoch": 2231} {"train_loss": -11.77780532836914, "global_step": 374855, "epoch": 2231} {"train_loss": -11.224908828735352, "global_step": 374856, "epoch": 2231} {"train_loss": -11.338065147399902, "global_step": 374857, "epoch": 2231} {"train_loss": -12.077937126159668, "global_step": 374858, "epoch": 2231} {"train_loss": -11.27391242980957, "global_step": 374859, "epoch": 2231} {"train_loss": -11.311721801757812, "global_step": 374860, "epoch": 2231} {"train_loss": -11.4810791015625, "global_step": 374861, "epoch": 2231} {"train_loss": -11.370048522949219, "global_step": 374862, "epoch": 2231} {"train_loss": -8.49465274810791, "global_step": 374863, "epoch": 2231} {"train_loss": -9.641389846801758, "global_step": 374864, "epoch": 2231} {"train_loss": -11.757588386535645, "global_step": 374865, "epoch": 2231} {"train_loss": -8.56208610534668, "global_step": 374866, "epoch": 2231} {"train_loss": -10.882194519042969, "global_step": 374867, "epoch": 2231} {"train_loss": -10.367055892944336, "global_step": 374868, "epoch": 2231} {"train_loss": -9.116455078125, "global_step": 374869, "epoch": 2231} {"train_loss": -9.84207534790039, "global_step": 374870, "epoch": 2231} {"train_loss": -10.460546493530273, "global_step": 374871, "epoch": 2231} {"train_loss": -11.372501373291016, "global_step": 374872, "epoch": 2231} {"train_loss": -10.183619499206543, "global_step": 374873, "epoch": 2231} {"train_loss": -10.178881645202637, "global_step": 374874, "epoch": 2231} {"train_loss": -11.592178344726562, "global_step": 374875, "epoch": 2231} {"train_loss": -9.098363876342773, "global_step": 374876, "epoch": 2231} {"train_loss": -11.0958251953125, "global_step": 374877, "epoch": 2231} {"train_loss": -11.296439170837402, "global_step": 374878, "epoch": 2231} {"train_loss": -10.001129150390625, "global_step": 374879, "epoch": 2231} {"train_loss": -11.67770767211914, "global_step": 374880, "epoch": 2231} {"train_loss": -11.165794372558594, "global_step": 374881, "epoch": 2231} {"train_loss": -11.276872634887695, "global_step": 374882, "epoch": 2231} {"train_loss": -11.6029052734375, "global_step": 374883, "epoch": 2231} {"train_loss": -10.729415893554688, "global_step": 374884, "epoch": 2231} {"train_loss": -11.632092475891113, "global_step": 374885, "epoch": 2231} {"train_loss": -10.918875694274902, "global_step": 374886, "epoch": 2231} {"train_loss": -11.377849578857422, "global_step": 374887, "epoch": 2231} {"train_loss": -11.270450592041016, "global_step": 374888, "epoch": 2231} {"train_loss": -11.597354888916016, "global_step": 374889, "epoch": 2231} {"train_loss": -11.115561485290527, "global_step": 374890, "epoch": 2231} {"train_loss": -11.824050903320312, "global_step": 374891, "epoch": 2231} {"train_loss": -11.256551742553711, "global_step": 374892, "epoch": 2231} {"train_loss": -11.077630996704102, "global_step": 374893, "epoch": 2231} {"train_loss": -10.709495544433594, "global_step": 374894, "epoch": 2231} {"train_loss": -11.402542114257812, "global_step": 374895, "epoch": 2231} {"train_loss": -11.637798309326172, "global_step": 374896, "epoch": 2231} {"train_loss": -11.06193733215332, "global_step": 374897, "epoch": 2231} {"train_loss": -11.701406478881836, "global_step": 374898, "epoch": 2231} {"train_loss": -10.95208740234375, "global_step": 374899, "epoch": 2231} {"train_loss": -11.646739959716797, "global_step": 374900, "epoch": 2231} {"train_loss": -11.63399600982666, "global_step": 374901, "epoch": 2231} {"train_loss": -11.819522857666016, "global_step": 374902, "epoch": 2231} {"train_loss": -11.812704086303711, "global_step": 374903, "epoch": 2231} {"train_loss": -11.846792221069336, "global_step": 374904, "epoch": 2231} {"train_loss": -11.888091087341309, "global_step": 374905, "epoch": 2231} {"train_loss": -11.727910995483398, "global_step": 374906, "epoch": 2231} {"train_loss": -11.6597900390625, "global_step": 374907, "epoch": 2231} {"train_loss": -11.858949661254883, "global_step": 374908, "epoch": 2231} {"train_loss": -11.595362663269043, "global_step": 374909, "epoch": 2231} {"train_loss": -11.860587120056152, "global_step": 374910, "epoch": 2231} {"train_loss": -11.498703956604004, "global_step": 374911, "epoch": 2231} {"train_loss": -12.039063453674316, "global_step": 374912, "epoch": 2231} {"train_loss": -11.595314025878906, "global_step": 374913, "epoch": 2231} {"train_loss": -11.755895614624023, "global_step": 374914, "epoch": 2231} {"train_loss": -11.716636657714844, "global_step": 374915, "epoch": 2231} {"train_loss": -11.93203353881836, "global_step": 374916, "epoch": 2231} {"train_loss": -11.497184753417969, "global_step": 374917, "epoch": 2231} {"train_loss": -11.832930564880371, "global_step": 374918, "epoch": 2231} {"train_loss": -12.130972862243652, "global_step": 374919, "epoch": 2231} {"train_loss": -11.845723152160645, "global_step": 374920, "epoch": 2231} {"train_loss": -12.00561809539795, "global_step": 374921, "epoch": 2231} {"train_loss": -12.107076644897461, "global_step": 374922, "epoch": 2231} {"train_loss": -12.061239242553711, "global_step": 374923, "epoch": 2231} {"train_loss": -11.990310668945312, "global_step": 374924, "epoch": 2231} {"train_loss": -12.437627792358398, "global_step": 374925, "epoch": 2231} {"train_loss": -12.043920516967773, "global_step": 374926, "epoch": 2231} {"train_loss": -12.252870559692383, "global_step": 374927, "epoch": 2231} {"train_loss": -12.303443908691406, "global_step": 374928, "epoch": 2231} {"train_loss": -12.29718017578125, "global_step": 374929, "epoch": 2231} {"train_loss": -12.038748741149902, "global_step": 374930, "epoch": 2231} {"train_loss": -12.48546028137207, "global_step": 374931, "epoch": 2231} {"train_loss": -12.262552261352539, "global_step": 374932, "epoch": 2231} {"train_loss": -12.415980339050293, "global_step": 374933, "epoch": 2231} {"train_loss": -12.331697463989258, "global_step": 374934, "epoch": 2231} {"train_loss": -12.077430725097656, "global_step": 374935, "epoch": 2231} {"train_loss": -12.40954875946045, "global_step": 374936, "epoch": 2231} {"train_loss": -12.111394882202148, "global_step": 374937, "epoch": 2231} {"train_loss": -12.503952026367188, "global_step": 374938, "epoch": 2231} {"train_loss": -12.184590339660645, "global_step": 374939, "epoch": 2231} {"train_loss": -12.328208923339844, "global_step": 374940, "epoch": 2231} {"train_loss": -12.32365608215332, "global_step": 374941, "epoch": 2231} {"train_loss": -12.480928421020508, "global_step": 374942, "epoch": 2231} {"train_loss": -12.14865493774414, "global_step": 374943, "epoch": 2231} {"train_loss": -12.059052467346191, "global_step": 374944, "epoch": 2231} {"train_loss": -11.76754379272461, "global_step": 374945, "epoch": 2231} {"train_loss": -11.597046852111816, "global_step": 374946, "epoch": 2231} {"train_loss": -12.326851844787598, "global_step": 374947, "epoch": 2231} {"train_loss": -11.911721229553223, "global_step": 374948, "epoch": 2231} {"train_loss": -12.253053665161133, "global_step": 374949, "epoch": 2231} {"train_loss": -12.349180221557617, "global_step": 374950, "epoch": 2231} {"train_loss": -12.212553977966309, "global_step": 374951, "epoch": 2231} {"train_loss": -12.520371437072754, "global_step": 374952, "epoch": 2231} {"train_loss": -12.39205551147461, "global_step": 374953, "epoch": 2231} {"train_loss": -12.271002769470215, "global_step": 374954, "epoch": 2231} {"train_loss": -12.47622013092041, "global_step": 374955, "epoch": 2231} {"train_loss": -12.107257843017578, "global_step": 374956, "epoch": 2231} {"train_loss": -12.507020950317383, "global_step": 374957, "epoch": 2231} {"train_loss": -12.253124237060547, "global_step": 374958, "epoch": 2231} {"train_loss": -12.423624038696289, "global_step": 374959, "epoch": 2231} {"train_loss": -12.397201538085938, "global_step": 374960, "epoch": 2231} {"train_loss": -12.095856666564941, "global_step": 374961, "epoch": 2231} {"train_loss": -12.526544570922852, "global_step": 374962, "epoch": 2231} {"train_loss": -12.185742378234863, "global_step": 374963, "epoch": 2231} {"train_loss": -12.351911544799805, "global_step": 374964, "epoch": 2231} {"train_loss": -12.118369102478027, "global_step": 374965, "epoch": 2231} {"train_loss": -12.494232177734375, "global_step": 374966, "epoch": 2231} {"train_loss": -12.442951202392578, "global_step": 374967, "epoch": 2231} {"train_loss": -12.427583694458008, "global_step": 374968, "epoch": 2231} {"train_loss": -12.418266296386719, "global_step": 374969, "epoch": 2231} {"train_loss": -12.525569915771484, "global_step": 374970, "epoch": 2231} {"train_loss": -12.462411880493164, "global_step": 374971, "epoch": 2231} {"train_loss": -12.514129638671875, "global_step": 374972, "epoch": 2231} {"train_loss": -12.611309051513672, "global_step": 374973, "epoch": 2231} {"train_loss": -12.379631996154785, "global_step": 374974, "epoch": 2231} {"train_loss": -11.89004833925338, "global_step": 374975, "epoch": 2231, "val_loss": 286316.375} {"train_loss": -12.540814399719238, "global_step": 374976, "epoch": 2232} {"train_loss": -12.455107688903809, "global_step": 374977, "epoch": 2232} {"train_loss": -12.572530746459961, "global_step": 374978, "epoch": 2232} {"train_loss": -12.523089408874512, "global_step": 374979, "epoch": 2232} {"train_loss": -12.44656753540039, "global_step": 374980, "epoch": 2232} {"train_loss": -12.56157112121582, "global_step": 374981, "epoch": 2232} {"train_loss": -12.448558807373047, "global_step": 374982, "epoch": 2232} {"train_loss": -12.479894638061523, "global_step": 374983, "epoch": 2232} {"train_loss": -12.591276168823242, "global_step": 374984, "epoch": 2232} {"train_loss": -12.451622009277344, "global_step": 374985, "epoch": 2232} {"train_loss": -12.602043151855469, "global_step": 374986, "epoch": 2232} {"train_loss": -12.834468841552734, "global_step": 374987, "epoch": 2232} {"train_loss": -12.617077827453613, "global_step": 374988, "epoch": 2232} {"train_loss": -12.697132110595703, "global_step": 374989, "epoch": 2232} {"train_loss": -12.629262924194336, "global_step": 374990, "epoch": 2232} {"train_loss": -12.657939910888672, "global_step": 374991, "epoch": 2232} {"train_loss": -12.470855712890625, "global_step": 374992, "epoch": 2232} {"train_loss": -12.550050735473633, "global_step": 374993, "epoch": 2232} {"train_loss": -12.446874618530273, "global_step": 374994, "epoch": 2232} {"train_loss": -12.656717300415039, "global_step": 374995, "epoch": 2232} {"train_loss": -12.632225036621094, "global_step": 374996, "epoch": 2232} {"train_loss": -12.672563552856445, "global_step": 374997, "epoch": 2232} {"train_loss": -12.762540817260742, "global_step": 374998, "epoch": 2232} {"train_loss": -12.8887939453125, "global_step": 374999, "epoch": 2232} {"train_loss": -12.3721923828125, "global_step": 375000, "epoch": 2232} {"train_loss": -12.699478149414062, "global_step": 375001, "epoch": 2232} {"train_loss": -12.145648956298828, "global_step": 375002, "epoch": 2232} {"train_loss": -12.769291877746582, "global_step": 375003, "epoch": 2232} {"train_loss": -12.150052070617676, "global_step": 375004, "epoch": 2232} {"train_loss": -12.411609649658203, "global_step": 375005, "epoch": 2232} {"train_loss": -12.566631317138672, "global_step": 375006, "epoch": 2232} {"train_loss": -12.444889068603516, "global_step": 375007, "epoch": 2232} {"train_loss": -12.306609153747559, "global_step": 375008, "epoch": 2232} {"train_loss": -11.620372772216797, "global_step": 375009, "epoch": 2232} {"train_loss": -11.056840896606445, "global_step": 375010, "epoch": 2232} {"train_loss": -12.13856029510498, "global_step": 375011, "epoch": 2232} {"train_loss": -12.032439231872559, "global_step": 375012, "epoch": 2232} {"train_loss": -11.383197784423828, "global_step": 375013, "epoch": 2232} {"train_loss": -12.101263046264648, "global_step": 375014, "epoch": 2232} {"train_loss": -11.313918113708496, "global_step": 375015, "epoch": 2232} {"train_loss": -12.57602310180664, "global_step": 375016, "epoch": 2232} {"train_loss": -11.137142181396484, "global_step": 375017, "epoch": 2232} {"train_loss": -12.168723106384277, "global_step": 375018, "epoch": 2232} {"train_loss": -11.318845748901367, "global_step": 375019, "epoch": 2232} {"train_loss": -12.008328437805176, "global_step": 375020, "epoch": 2232} {"train_loss": -10.959968566894531, "global_step": 375021, "epoch": 2232} {"train_loss": -11.964462280273438, "global_step": 375022, "epoch": 2232} {"train_loss": -11.084217071533203, "global_step": 375023, "epoch": 2232} {"train_loss": -12.002158164978027, "global_step": 375024, "epoch": 2232} {"train_loss": -11.224571228027344, "global_step": 375025, "epoch": 2232} {"train_loss": -11.23843002319336, "global_step": 375026, "epoch": 2232} {"train_loss": -11.452170372009277, "global_step": 375027, "epoch": 2232} {"train_loss": -11.905693054199219, "global_step": 375028, "epoch": 2232} {"train_loss": -11.144916534423828, "global_step": 375029, "epoch": 2232} {"train_loss": -12.280344009399414, "global_step": 375030, "epoch": 2232} {"train_loss": -11.591960906982422, "global_step": 375031, "epoch": 2232} {"train_loss": -11.495845794677734, "global_step": 375032, "epoch": 2232} {"train_loss": -11.0853271484375, "global_step": 375033, "epoch": 2232} {"train_loss": -12.172890663146973, "global_step": 375034, "epoch": 2232} {"train_loss": -10.748038291931152, "global_step": 375035, "epoch": 2232} {"train_loss": -12.092662811279297, "global_step": 375036, "epoch": 2232} {"train_loss": -11.63098430633545, "global_step": 375037, "epoch": 2232} {"train_loss": -11.876357078552246, "global_step": 375038, "epoch": 2232} {"train_loss": -11.967327117919922, "global_step": 375039, "epoch": 2232} {"train_loss": -11.137414932250977, "global_step": 375040, "epoch": 2232} {"train_loss": -11.7177734375, "global_step": 375041, "epoch": 2232} {"train_loss": -11.243114471435547, "global_step": 375042, "epoch": 2232} {"train_loss": -9.558734893798828, "global_step": 375043, "epoch": 2232} {"train_loss": -11.11612319946289, "global_step": 375044, "epoch": 2232} {"train_loss": -10.822075843811035, "global_step": 375045, "epoch": 2232} {"train_loss": -11.40414047241211, "global_step": 375046, "epoch": 2232} {"train_loss": -10.943437576293945, "global_step": 375047, "epoch": 2232} {"train_loss": -11.380887985229492, "global_step": 375048, "epoch": 2232} {"train_loss": -10.97781753540039, "global_step": 375049, "epoch": 2232} {"train_loss": -11.028020858764648, "global_step": 375050, "epoch": 2232} {"train_loss": -11.092609405517578, "global_step": 375051, "epoch": 2232} {"train_loss": -11.526418685913086, "global_step": 375052, "epoch": 2232} {"train_loss": -11.416922569274902, "global_step": 375053, "epoch": 2232} {"train_loss": -11.244974136352539, "global_step": 375054, "epoch": 2232} {"train_loss": -12.063817977905273, "global_step": 375055, "epoch": 2232} {"train_loss": -11.401900291442871, "global_step": 375056, "epoch": 2232} {"train_loss": -11.628143310546875, "global_step": 375057, "epoch": 2232} {"train_loss": -11.367741584777832, "global_step": 375058, "epoch": 2232} {"train_loss": -11.450420379638672, "global_step": 375059, "epoch": 2232} {"train_loss": -11.373086929321289, "global_step": 375060, "epoch": 2232} {"train_loss": -11.450052261352539, "global_step": 375061, "epoch": 2232} {"train_loss": -10.972602844238281, "global_step": 375062, "epoch": 2232} {"train_loss": -11.597604751586914, "global_step": 375063, "epoch": 2232} {"train_loss": -11.053735733032227, "global_step": 375064, "epoch": 2232} {"train_loss": -11.504456520080566, "global_step": 375065, "epoch": 2232} {"train_loss": -11.723058700561523, "global_step": 375066, "epoch": 2232} {"train_loss": -11.269157409667969, "global_step": 375067, "epoch": 2232} {"train_loss": -11.973328590393066, "global_step": 375068, "epoch": 2232} {"train_loss": -11.444870948791504, "global_step": 375069, "epoch": 2232} {"train_loss": -11.9797945022583, "global_step": 375070, "epoch": 2232} {"train_loss": -12.04982852935791, "global_step": 375071, "epoch": 2232} {"train_loss": -11.850896835327148, "global_step": 375072, "epoch": 2232} {"train_loss": -12.186551094055176, "global_step": 375073, "epoch": 2232} {"train_loss": -11.943220138549805, "global_step": 375074, "epoch": 2232} {"train_loss": -12.242547988891602, "global_step": 375075, "epoch": 2232} {"train_loss": -12.398433685302734, "global_step": 375076, "epoch": 2232} {"train_loss": -12.096391677856445, "global_step": 375077, "epoch": 2232} {"train_loss": -12.342035293579102, "global_step": 375078, "epoch": 2232} {"train_loss": -12.233804702758789, "global_step": 375079, "epoch": 2232} {"train_loss": -12.175935745239258, "global_step": 375080, "epoch": 2232} {"train_loss": -12.1588134765625, "global_step": 375081, "epoch": 2232} {"train_loss": -11.992443084716797, "global_step": 375082, "epoch": 2232} {"train_loss": -12.226980209350586, "global_step": 375083, "epoch": 2232} {"train_loss": -12.020925521850586, "global_step": 375084, "epoch": 2232} {"train_loss": -12.222911834716797, "global_step": 375085, "epoch": 2232} {"train_loss": -12.1299467086792, "global_step": 375086, "epoch": 2232} {"train_loss": -12.111838340759277, "global_step": 375087, "epoch": 2232} {"train_loss": -12.02212142944336, "global_step": 375088, "epoch": 2232} {"train_loss": -12.206653594970703, "global_step": 375089, "epoch": 2232} {"train_loss": -12.342687606811523, "global_step": 375090, "epoch": 2232} {"train_loss": -11.978671073913574, "global_step": 375091, "epoch": 2232} {"train_loss": -12.246223449707031, "global_step": 375092, "epoch": 2232} {"train_loss": -11.700113296508789, "global_step": 375093, "epoch": 2232} {"train_loss": -12.336103439331055, "global_step": 375094, "epoch": 2232} {"train_loss": -12.209386825561523, "global_step": 375095, "epoch": 2232} {"train_loss": -12.14372444152832, "global_step": 375096, "epoch": 2232} {"train_loss": -12.077220916748047, "global_step": 375097, "epoch": 2232} {"train_loss": -12.199889183044434, "global_step": 375098, "epoch": 2232} {"train_loss": -12.231325149536133, "global_step": 375099, "epoch": 2232} {"train_loss": -12.597923278808594, "global_step": 375100, "epoch": 2232} {"train_loss": -12.001355171203613, "global_step": 375101, "epoch": 2232} {"train_loss": -12.311582565307617, "global_step": 375102, "epoch": 2232} {"train_loss": -12.177620887756348, "global_step": 375103, "epoch": 2232} {"train_loss": -11.63176155090332, "global_step": 375104, "epoch": 2232} {"train_loss": -11.349099159240723, "global_step": 375105, "epoch": 2232} {"train_loss": -11.431365966796875, "global_step": 375106, "epoch": 2232} {"train_loss": -9.696769714355469, "global_step": 375107, "epoch": 2232} {"train_loss": -11.641850471496582, "global_step": 375108, "epoch": 2232} {"train_loss": -10.145552635192871, "global_step": 375109, "epoch": 2232} {"train_loss": -9.311859130859375, "global_step": 375110, "epoch": 2232} {"train_loss": -9.45675277709961, "global_step": 375111, "epoch": 2232} {"train_loss": -10.647493362426758, "global_step": 375112, "epoch": 2232} {"train_loss": -9.491203308105469, "global_step": 375113, "epoch": 2232} {"train_loss": -11.55643081665039, "global_step": 375114, "epoch": 2232} {"train_loss": -11.00497817993164, "global_step": 375115, "epoch": 2232} {"train_loss": -11.362088203430176, "global_step": 375116, "epoch": 2232} {"train_loss": -11.95991325378418, "global_step": 375117, "epoch": 2232} {"train_loss": -11.388678550720215, "global_step": 375118, "epoch": 2232} {"train_loss": -12.014297485351562, "global_step": 375119, "epoch": 2232} {"train_loss": -11.649259567260742, "global_step": 375120, "epoch": 2232} {"train_loss": -11.703598022460938, "global_step": 375121, "epoch": 2232} {"train_loss": -11.512554168701172, "global_step": 375122, "epoch": 2232} {"train_loss": -11.965568542480469, "global_step": 375123, "epoch": 2232} {"train_loss": -11.52957534790039, "global_step": 375124, "epoch": 2232} {"train_loss": -11.90909194946289, "global_step": 375125, "epoch": 2232} {"train_loss": -11.508774757385254, "global_step": 375126, "epoch": 2232} {"train_loss": -11.619235038757324, "global_step": 375127, "epoch": 2232} {"train_loss": -11.774591445922852, "global_step": 375128, "epoch": 2232} {"train_loss": -11.90113639831543, "global_step": 375129, "epoch": 2232} {"train_loss": -11.419015884399414, "global_step": 375130, "epoch": 2232} {"train_loss": -12.240671157836914, "global_step": 375131, "epoch": 2232} {"train_loss": -11.470939636230469, "global_step": 375132, "epoch": 2232} {"train_loss": -11.974369049072266, "global_step": 375133, "epoch": 2232} {"train_loss": -11.464261054992676, "global_step": 375134, "epoch": 2232} {"train_loss": -11.993297576904297, "global_step": 375135, "epoch": 2232} {"train_loss": -11.829795837402344, "global_step": 375136, "epoch": 2232} {"train_loss": -11.685876846313477, "global_step": 375137, "epoch": 2232} {"train_loss": -11.834921836853027, "global_step": 375138, "epoch": 2232} {"train_loss": -11.260984420776367, "global_step": 375139, "epoch": 2232} {"train_loss": -11.743227005004883, "global_step": 375140, "epoch": 2232} {"train_loss": -11.326361656188965, "global_step": 375141, "epoch": 2232} {"train_loss": -11.719754219055176, "global_step": 375142, "epoch": 2232} {"train_loss": -11.792283637183052, "global_step": 375143, "epoch": 2232, "val_loss": 289001.625} {"train_loss": -11.586780548095703, "global_step": 375144, "epoch": 2233} {"train_loss": -11.853536605834961, "global_step": 375145, "epoch": 2233} {"train_loss": -11.353998184204102, "global_step": 375146, "epoch": 2233} {"train_loss": -11.913270950317383, "global_step": 375147, "epoch": 2233} {"train_loss": -11.508810997009277, "global_step": 375148, "epoch": 2233} {"train_loss": -11.945785522460938, "global_step": 375149, "epoch": 2233} {"train_loss": -12.000106811523438, "global_step": 375150, "epoch": 2233} {"train_loss": -11.659141540527344, "global_step": 375151, "epoch": 2233} {"train_loss": -11.893828392028809, "global_step": 375152, "epoch": 2233} {"train_loss": -11.90580940246582, "global_step": 375153, "epoch": 2233} {"train_loss": -11.861167907714844, "global_step": 375154, "epoch": 2233} {"train_loss": -12.11182975769043, "global_step": 375155, "epoch": 2233} {"train_loss": -11.779231071472168, "global_step": 375156, "epoch": 2233} {"train_loss": -12.224393844604492, "global_step": 375157, "epoch": 2233} {"train_loss": -11.931644439697266, "global_step": 375158, "epoch": 2233} {"train_loss": -11.965129852294922, "global_step": 375159, "epoch": 2233} {"train_loss": -12.130058288574219, "global_step": 375160, "epoch": 2233} {"train_loss": -11.77596664428711, "global_step": 375161, "epoch": 2233} {"train_loss": -12.168545722961426, "global_step": 375162, "epoch": 2233} {"train_loss": -12.186103820800781, "global_step": 375163, "epoch": 2233} {"train_loss": -12.45556354522705, "global_step": 375164, "epoch": 2233} {"train_loss": -12.27059555053711, "global_step": 375165, "epoch": 2233} {"train_loss": -12.219541549682617, "global_step": 375166, "epoch": 2233} {"train_loss": -12.308481216430664, "global_step": 375167, "epoch": 2233} {"train_loss": -12.20175552368164, "global_step": 375168, "epoch": 2233} {"train_loss": -12.291786193847656, "global_step": 375169, "epoch": 2233} {"train_loss": -12.237215042114258, "global_step": 375170, "epoch": 2233} {"train_loss": -12.370187759399414, "global_step": 375171, "epoch": 2233} {"train_loss": -12.275849342346191, "global_step": 375172, "epoch": 2233} {"train_loss": -12.244532585144043, "global_step": 375173, "epoch": 2233} {"train_loss": -12.386478424072266, "global_step": 375174, "epoch": 2233} {"train_loss": -12.006980895996094, "global_step": 375175, "epoch": 2233} {"train_loss": -12.05003547668457, "global_step": 375176, "epoch": 2233} {"train_loss": -11.471049308776855, "global_step": 375177, "epoch": 2233} {"train_loss": -12.247637748718262, "global_step": 375178, "epoch": 2233} {"train_loss": -11.706856727600098, "global_step": 375179, "epoch": 2233} {"train_loss": -12.217058181762695, "global_step": 375180, "epoch": 2233} {"train_loss": -11.907928466796875, "global_step": 375181, "epoch": 2233} {"train_loss": -12.374776840209961, "global_step": 375182, "epoch": 2233} {"train_loss": -11.81302261352539, "global_step": 375183, "epoch": 2233} {"train_loss": -12.083978652954102, "global_step": 375184, "epoch": 2233} {"train_loss": -12.111982345581055, "global_step": 375185, "epoch": 2233} {"train_loss": -12.135381698608398, "global_step": 375186, "epoch": 2233} {"train_loss": -12.351824760437012, "global_step": 375187, "epoch": 2233} {"train_loss": -12.320074081420898, "global_step": 375188, "epoch": 2233} {"train_loss": -12.109370231628418, "global_step": 375189, "epoch": 2233} {"train_loss": -12.27291488647461, "global_step": 375190, "epoch": 2233} {"train_loss": -12.429697036743164, "global_step": 375191, "epoch": 2233} {"train_loss": -12.340862274169922, "global_step": 375192, "epoch": 2233} {"train_loss": -12.370723724365234, "global_step": 375193, "epoch": 2233} {"train_loss": -12.503634452819824, "global_step": 375194, "epoch": 2233} {"train_loss": -12.432424545288086, "global_step": 375195, "epoch": 2233} {"train_loss": -12.452509880065918, "global_step": 375196, "epoch": 2233} {"train_loss": -12.661931991577148, "global_step": 375197, "epoch": 2233} {"train_loss": -12.45565414428711, "global_step": 375198, "epoch": 2233} {"train_loss": -12.455642700195312, "global_step": 375199, "epoch": 2233} {"train_loss": -12.694562911987305, "global_step": 375200, "epoch": 2233} {"train_loss": -12.68441390991211, "global_step": 375201, "epoch": 2233} {"train_loss": -12.735762596130371, "global_step": 375202, "epoch": 2233} {"train_loss": -12.57982063293457, "global_step": 375203, "epoch": 2233} {"train_loss": -12.708927154541016, "global_step": 375204, "epoch": 2233} {"train_loss": -12.41805648803711, "global_step": 375205, "epoch": 2233} {"train_loss": -12.624225616455078, "global_step": 375206, "epoch": 2233} {"train_loss": -12.394336700439453, "global_step": 375207, "epoch": 2233} {"train_loss": -12.54552173614502, "global_step": 375208, "epoch": 2233} {"train_loss": -12.812392234802246, "global_step": 375209, "epoch": 2233} {"train_loss": -12.498359680175781, "global_step": 375210, "epoch": 2233} {"train_loss": -12.769346237182617, "global_step": 375211, "epoch": 2233} {"train_loss": -12.608417510986328, "global_step": 375212, "epoch": 2233} {"train_loss": -12.623736381530762, "global_step": 375213, "epoch": 2233} {"train_loss": -12.705039978027344, "global_step": 375214, "epoch": 2233} {"train_loss": -12.533061027526855, "global_step": 375215, "epoch": 2233} {"train_loss": -12.434745788574219, "global_step": 375216, "epoch": 2233} {"train_loss": -12.781596183776855, "global_step": 375217, "epoch": 2233} {"train_loss": -12.569194793701172, "global_step": 375218, "epoch": 2233} {"train_loss": -12.408891677856445, "global_step": 375219, "epoch": 2233} {"train_loss": -12.406294822692871, "global_step": 375220, "epoch": 2233} {"train_loss": -12.459226608276367, "global_step": 375221, "epoch": 2233} {"train_loss": -12.52834701538086, "global_step": 375222, "epoch": 2233} {"train_loss": -12.303391456604004, "global_step": 375223, "epoch": 2233} {"train_loss": -12.853259086608887, "global_step": 375224, "epoch": 2233} {"train_loss": -12.437982559204102, "global_step": 375225, "epoch": 2233} {"train_loss": -12.339411735534668, "global_step": 375226, "epoch": 2233} {"train_loss": -12.685487747192383, "global_step": 375227, "epoch": 2233} {"train_loss": -12.558094024658203, "global_step": 375228, "epoch": 2233} {"train_loss": -12.36881160736084, "global_step": 375229, "epoch": 2233} {"train_loss": -12.276321411132812, "global_step": 375230, "epoch": 2233} {"train_loss": -12.28903579711914, "global_step": 375231, "epoch": 2233} {"train_loss": -12.355443954467773, "global_step": 375232, "epoch": 2233} {"train_loss": -12.222343444824219, "global_step": 375233, "epoch": 2233} {"train_loss": -11.639452934265137, "global_step": 375234, "epoch": 2233} {"train_loss": -12.422294616699219, "global_step": 375235, "epoch": 2233} {"train_loss": -12.249351501464844, "global_step": 375236, "epoch": 2233} {"train_loss": -12.227046012878418, "global_step": 375237, "epoch": 2233} {"train_loss": -12.104813575744629, "global_step": 375238, "epoch": 2233} {"train_loss": -11.939794540405273, "global_step": 375239, "epoch": 2233} {"train_loss": -11.718612670898438, "global_step": 375240, "epoch": 2233} {"train_loss": -11.932077407836914, "global_step": 375241, "epoch": 2233} {"train_loss": -11.651527404785156, "global_step": 375242, "epoch": 2233} {"train_loss": -11.672412872314453, "global_step": 375243, "epoch": 2233} {"train_loss": -12.099128723144531, "global_step": 375244, "epoch": 2233} {"train_loss": -11.666383743286133, "global_step": 375245, "epoch": 2233} {"train_loss": -11.923638343811035, "global_step": 375246, "epoch": 2233} {"train_loss": -11.716695785522461, "global_step": 375247, "epoch": 2233} {"train_loss": -11.67486572265625, "global_step": 375248, "epoch": 2233} {"train_loss": -10.758410453796387, "global_step": 375249, "epoch": 2233} {"train_loss": -11.947381973266602, "global_step": 375250, "epoch": 2233} {"train_loss": -11.271265029907227, "global_step": 375251, "epoch": 2233} {"train_loss": -10.289027214050293, "global_step": 375252, "epoch": 2233} {"train_loss": -11.056777954101562, "global_step": 375253, "epoch": 2233} {"train_loss": -9.664754867553711, "global_step": 375254, "epoch": 2233} {"train_loss": -10.8907470703125, "global_step": 375255, "epoch": 2233} {"train_loss": -9.481308937072754, "global_step": 375256, "epoch": 2233} {"train_loss": -8.129756927490234, "global_step": 375257, "epoch": 2233} {"train_loss": -9.458335876464844, "global_step": 375258, "epoch": 2233} {"train_loss": -9.962358474731445, "global_step": 375259, "epoch": 2233} {"train_loss": -8.803555488586426, "global_step": 375260, "epoch": 2233} {"train_loss": -7.965020656585693, "global_step": 375261, "epoch": 2233} {"train_loss": -8.04654312133789, "global_step": 375262, "epoch": 2233} {"train_loss": -9.749335289001465, "global_step": 375263, "epoch": 2233} {"train_loss": -9.661449432373047, "global_step": 375264, "epoch": 2233} {"train_loss": -9.566847801208496, "global_step": 375265, "epoch": 2233} {"train_loss": -10.26047134399414, "global_step": 375266, "epoch": 2233} {"train_loss": -11.139237403869629, "global_step": 375267, "epoch": 2233} {"train_loss": -11.035163879394531, "global_step": 375268, "epoch": 2233} {"train_loss": -10.209203720092773, "global_step": 375269, "epoch": 2233} {"train_loss": -10.688940048217773, "global_step": 375270, "epoch": 2233} {"train_loss": -10.831199645996094, "global_step": 375271, "epoch": 2233} {"train_loss": -10.82239055633545, "global_step": 375272, "epoch": 2233} {"train_loss": -11.273979187011719, "global_step": 375273, "epoch": 2233} {"train_loss": -11.047513961791992, "global_step": 375274, "epoch": 2233} {"train_loss": -11.832926750183105, "global_step": 375275, "epoch": 2233} {"train_loss": -11.458733558654785, "global_step": 375276, "epoch": 2233} {"train_loss": -11.310343742370605, "global_step": 375277, "epoch": 2233} {"train_loss": -11.240410804748535, "global_step": 375278, "epoch": 2233} {"train_loss": -11.653909683227539, "global_step": 375279, "epoch": 2233} {"train_loss": -11.69648551940918, "global_step": 375280, "epoch": 2233} {"train_loss": -11.409896850585938, "global_step": 375281, "epoch": 2233} {"train_loss": -12.137988090515137, "global_step": 375282, "epoch": 2233} {"train_loss": -11.716161727905273, "global_step": 375283, "epoch": 2233} {"train_loss": -12.074334144592285, "global_step": 375284, "epoch": 2233} {"train_loss": -11.726886749267578, "global_step": 375285, "epoch": 2233} {"train_loss": -11.728771209716797, "global_step": 375286, "epoch": 2233} {"train_loss": -12.026667594909668, "global_step": 375287, "epoch": 2233} {"train_loss": -11.873600006103516, "global_step": 375288, "epoch": 2233} {"train_loss": -12.106078147888184, "global_step": 375289, "epoch": 2233} {"train_loss": -11.664224624633789, "global_step": 375290, "epoch": 2233} {"train_loss": -12.051921844482422, "global_step": 375291, "epoch": 2233} {"train_loss": -11.760374069213867, "global_step": 375292, "epoch": 2233} {"train_loss": -11.887104034423828, "global_step": 375293, "epoch": 2233} {"train_loss": -12.326164245605469, "global_step": 375294, "epoch": 2233} {"train_loss": -11.992353439331055, "global_step": 375295, "epoch": 2233} {"train_loss": -12.386444091796875, "global_step": 375296, "epoch": 2233} {"train_loss": -12.201736450195312, "global_step": 375297, "epoch": 2233} {"train_loss": -12.318105697631836, "global_step": 375298, "epoch": 2233} {"train_loss": -12.238724708557129, "global_step": 375299, "epoch": 2233} {"train_loss": -12.367618560791016, "global_step": 375300, "epoch": 2233} {"train_loss": -12.375922203063965, "global_step": 375301, "epoch": 2233} {"train_loss": -12.364646911621094, "global_step": 375302, "epoch": 2233} {"train_loss": -12.43387508392334, "global_step": 375303, "epoch": 2233} {"train_loss": -12.358503341674805, "global_step": 375304, "epoch": 2233} {"train_loss": -12.285123825073242, "global_step": 375305, "epoch": 2233} {"train_loss": -12.15150260925293, "global_step": 375306, "epoch": 2233} {"train_loss": -12.390045166015625, "global_step": 375307, "epoch": 2233} {"train_loss": -12.161492347717285, "global_step": 375308, "epoch": 2233} {"train_loss": -12.305144309997559, "global_step": 375309, "epoch": 2233} {"train_loss": -12.219568252563477, "global_step": 375310, "epoch": 2233} {"train_loss": -11.85104824531646, "global_step": 375311, "epoch": 2233, "val_loss": 290465.0} {"train_loss": -12.214031219482422, "global_step": 375312, "epoch": 2234} {"train_loss": -12.10209846496582, "global_step": 375313, "epoch": 2234} {"train_loss": -11.616488456726074, "global_step": 375314, "epoch": 2234} {"train_loss": -12.253145217895508, "global_step": 375315, "epoch": 2234} {"train_loss": -11.879096984863281, "global_step": 375316, "epoch": 2234} {"train_loss": -12.183259963989258, "global_step": 375317, "epoch": 2234} {"train_loss": -12.1922607421875, "global_step": 375318, "epoch": 2234} {"train_loss": -11.406896591186523, "global_step": 375319, "epoch": 2234} {"train_loss": -12.544316291809082, "global_step": 375320, "epoch": 2234} {"train_loss": -12.257737159729004, "global_step": 375321, "epoch": 2234} {"train_loss": -12.222417831420898, "global_step": 375322, "epoch": 2234} {"train_loss": -12.427168846130371, "global_step": 375323, "epoch": 2234} {"train_loss": -12.220494270324707, "global_step": 375324, "epoch": 2234} {"train_loss": -12.36153793334961, "global_step": 375325, "epoch": 2234} {"train_loss": -12.302933692932129, "global_step": 375326, "epoch": 2234} {"train_loss": -12.002340316772461, "global_step": 375327, "epoch": 2234} {"train_loss": -12.407594680786133, "global_step": 375328, "epoch": 2234} {"train_loss": -12.376531600952148, "global_step": 375329, "epoch": 2234} {"train_loss": -12.2462158203125, "global_step": 375330, "epoch": 2234} {"train_loss": -12.415909767150879, "global_step": 375331, "epoch": 2234} {"train_loss": -12.264900207519531, "global_step": 375332, "epoch": 2234} {"train_loss": -12.234586715698242, "global_step": 375333, "epoch": 2234} {"train_loss": -12.63908576965332, "global_step": 375334, "epoch": 2234} {"train_loss": -12.322408676147461, "global_step": 375335, "epoch": 2234} {"train_loss": -12.354301452636719, "global_step": 375336, "epoch": 2234} {"train_loss": -12.197900772094727, "global_step": 375337, "epoch": 2234} {"train_loss": -12.40722942352295, "global_step": 375338, "epoch": 2234} {"train_loss": -12.294122695922852, "global_step": 375339, "epoch": 2234} {"train_loss": -12.439212799072266, "global_step": 375340, "epoch": 2234} {"train_loss": -12.527345657348633, "global_step": 375341, "epoch": 2234} {"train_loss": -12.672061920166016, "global_step": 375342, "epoch": 2234} {"train_loss": -12.607868194580078, "global_step": 375343, "epoch": 2234} {"train_loss": -12.78040885925293, "global_step": 375344, "epoch": 2234} {"train_loss": -12.704455375671387, "global_step": 375345, "epoch": 2234} {"train_loss": -12.210951805114746, "global_step": 375346, "epoch": 2234} {"train_loss": -12.46125316619873, "global_step": 375347, "epoch": 2234} {"train_loss": -12.204206466674805, "global_step": 375348, "epoch": 2234} {"train_loss": -12.090608596801758, "global_step": 375349, "epoch": 2234} {"train_loss": -12.491024017333984, "global_step": 375350, "epoch": 2234} {"train_loss": -12.079061508178711, "global_step": 375351, "epoch": 2234} {"train_loss": -12.211063385009766, "global_step": 375352, "epoch": 2234} {"train_loss": -12.125741958618164, "global_step": 375353, "epoch": 2234} {"train_loss": -12.340599060058594, "global_step": 375354, "epoch": 2234} {"train_loss": -11.721962928771973, "global_step": 375355, "epoch": 2234} {"train_loss": -12.113252639770508, "global_step": 375356, "epoch": 2234} {"train_loss": -11.86015510559082, "global_step": 375357, "epoch": 2234} {"train_loss": -12.319527626037598, "global_step": 375358, "epoch": 2234} {"train_loss": -12.16995620727539, "global_step": 375359, "epoch": 2234} {"train_loss": -12.755033493041992, "global_step": 375360, "epoch": 2234} {"train_loss": -12.149707794189453, "global_step": 375361, "epoch": 2234} {"train_loss": -12.647140502929688, "global_step": 375362, "epoch": 2234} {"train_loss": -12.588525772094727, "global_step": 375363, "epoch": 2234} {"train_loss": -12.538759231567383, "global_step": 375364, "epoch": 2234} {"train_loss": -12.46419620513916, "global_step": 375365, "epoch": 2234} {"train_loss": -12.594372749328613, "global_step": 375366, "epoch": 2234} {"train_loss": -12.619930267333984, "global_step": 375367, "epoch": 2234} {"train_loss": -12.426505088806152, "global_step": 375368, "epoch": 2234} {"train_loss": -12.76295280456543, "global_step": 375369, "epoch": 2234} {"train_loss": -12.463098526000977, "global_step": 375370, "epoch": 2234} {"train_loss": -12.26919174194336, "global_step": 375371, "epoch": 2234} {"train_loss": -12.618352890014648, "global_step": 375372, "epoch": 2234} {"train_loss": -12.571189880371094, "global_step": 375373, "epoch": 2234} {"train_loss": -12.322534561157227, "global_step": 375374, "epoch": 2234} {"train_loss": -12.509292602539062, "global_step": 375375, "epoch": 2234} {"train_loss": -12.323533058166504, "global_step": 375376, "epoch": 2234} {"train_loss": -12.002908706665039, "global_step": 375377, "epoch": 2234} {"train_loss": -12.191981315612793, "global_step": 375378, "epoch": 2234} {"train_loss": -12.658178329467773, "global_step": 375379, "epoch": 2234} {"train_loss": -12.343332290649414, "global_step": 375380, "epoch": 2234} {"train_loss": -12.542497634887695, "global_step": 375381, "epoch": 2234} {"train_loss": -12.438146591186523, "global_step": 375382, "epoch": 2234} {"train_loss": -12.399164199829102, "global_step": 375383, "epoch": 2234} {"train_loss": -12.070354461669922, "global_step": 375384, "epoch": 2234} {"train_loss": -12.373674392700195, "global_step": 375385, "epoch": 2234} {"train_loss": -12.445611953735352, "global_step": 375386, "epoch": 2234} {"train_loss": -11.875316619873047, "global_step": 375387, "epoch": 2234} {"train_loss": -12.561107635498047, "global_step": 375388, "epoch": 2234} {"train_loss": -12.140121459960938, "global_step": 375389, "epoch": 2234} {"train_loss": -12.300700187683105, "global_step": 375390, "epoch": 2234} {"train_loss": -12.258383750915527, "global_step": 375391, "epoch": 2234} {"train_loss": -12.37289047241211, "global_step": 375392, "epoch": 2234} {"train_loss": -11.491740226745605, "global_step": 375393, "epoch": 2234} {"train_loss": -12.046361923217773, "global_step": 375394, "epoch": 2234} {"train_loss": -12.211257934570312, "global_step": 375395, "epoch": 2234} {"train_loss": -12.30562973022461, "global_step": 375396, "epoch": 2234} {"train_loss": -11.989116668701172, "global_step": 375397, "epoch": 2234} {"train_loss": -12.148184776306152, "global_step": 375398, "epoch": 2234} {"train_loss": -12.097742080688477, "global_step": 375399, "epoch": 2234} {"train_loss": -12.435785293579102, "global_step": 375400, "epoch": 2234} {"train_loss": -12.258123397827148, "global_step": 375401, "epoch": 2234} {"train_loss": -12.179084777832031, "global_step": 375402, "epoch": 2234} {"train_loss": -12.308469772338867, "global_step": 375403, "epoch": 2234} {"train_loss": -12.253133773803711, "global_step": 375404, "epoch": 2234} {"train_loss": -12.385554313659668, "global_step": 375405, "epoch": 2234} {"train_loss": -12.193340301513672, "global_step": 375406, "epoch": 2234} {"train_loss": -12.064542770385742, "global_step": 375407, "epoch": 2234} {"train_loss": -12.465532302856445, "global_step": 375408, "epoch": 2234} {"train_loss": -11.96041488647461, "global_step": 375409, "epoch": 2234} {"train_loss": -11.664816856384277, "global_step": 375410, "epoch": 2234} {"train_loss": -11.884222030639648, "global_step": 375411, "epoch": 2234} {"train_loss": -12.557845115661621, "global_step": 375412, "epoch": 2234} {"train_loss": -10.533198356628418, "global_step": 375413, "epoch": 2234} {"train_loss": -10.534599304199219, "global_step": 375414, "epoch": 2234} {"train_loss": -12.367269515991211, "global_step": 375415, "epoch": 2234} {"train_loss": -10.555780410766602, "global_step": 375416, "epoch": 2234} {"train_loss": -10.714046478271484, "global_step": 375417, "epoch": 2234} {"train_loss": -10.437482833862305, "global_step": 375418, "epoch": 2234} {"train_loss": -10.215662956237793, "global_step": 375419, "epoch": 2234} {"train_loss": -10.244694709777832, "global_step": 375420, "epoch": 2234} {"train_loss": -10.292832374572754, "global_step": 375421, "epoch": 2234} {"train_loss": -9.288000106811523, "global_step": 375422, "epoch": 2234} {"train_loss": -10.019743919372559, "global_step": 375423, "epoch": 2234} {"train_loss": -10.200977325439453, "global_step": 375424, "epoch": 2234} {"train_loss": -10.971870422363281, "global_step": 375425, "epoch": 2234} {"train_loss": -10.583246231079102, "global_step": 375426, "epoch": 2234} {"train_loss": -9.989969253540039, "global_step": 375427, "epoch": 2234} {"train_loss": -11.495166778564453, "global_step": 375428, "epoch": 2234} {"train_loss": -9.835278511047363, "global_step": 375429, "epoch": 2234} {"train_loss": -10.891084671020508, "global_step": 375430, "epoch": 2234} {"train_loss": -11.190223693847656, "global_step": 375431, "epoch": 2234} {"train_loss": -10.021472930908203, "global_step": 375432, "epoch": 2234} {"train_loss": -11.692670822143555, "global_step": 375433, "epoch": 2234} {"train_loss": -11.764766693115234, "global_step": 375434, "epoch": 2234} {"train_loss": -11.567564010620117, "global_step": 375435, "epoch": 2234} {"train_loss": -12.206514358520508, "global_step": 375436, "epoch": 2234} {"train_loss": -11.752388000488281, "global_step": 375437, "epoch": 2234} {"train_loss": -11.886926651000977, "global_step": 375438, "epoch": 2234} {"train_loss": -11.822455406188965, "global_step": 375439, "epoch": 2234} {"train_loss": -11.930140495300293, "global_step": 375440, "epoch": 2234} {"train_loss": -12.033941268920898, "global_step": 375441, "epoch": 2234} {"train_loss": -12.136279106140137, "global_step": 375442, "epoch": 2234} {"train_loss": -11.990711212158203, "global_step": 375443, "epoch": 2234} {"train_loss": -11.83443832397461, "global_step": 375444, "epoch": 2234} {"train_loss": -12.081798553466797, "global_step": 375445, "epoch": 2234} {"train_loss": -11.983576774597168, "global_step": 375446, "epoch": 2234} {"train_loss": -12.275737762451172, "global_step": 375447, "epoch": 2234} {"train_loss": -12.107076644897461, "global_step": 375448, "epoch": 2234} {"train_loss": -11.795746803283691, "global_step": 375449, "epoch": 2234} {"train_loss": -11.852052688598633, "global_step": 375450, "epoch": 2234} {"train_loss": -11.959233283996582, "global_step": 375451, "epoch": 2234} {"train_loss": -12.205374717712402, "global_step": 375452, "epoch": 2234} {"train_loss": -11.457176208496094, "global_step": 375453, "epoch": 2234} {"train_loss": -12.415645599365234, "global_step": 375454, "epoch": 2234} {"train_loss": -11.654302597045898, "global_step": 375455, "epoch": 2234} {"train_loss": -12.085713386535645, "global_step": 375456, "epoch": 2234} {"train_loss": -11.803318977355957, "global_step": 375457, "epoch": 2234} {"train_loss": -11.633862495422363, "global_step": 375458, "epoch": 2234} {"train_loss": -12.119848251342773, "global_step": 375459, "epoch": 2234} {"train_loss": -12.108060836791992, "global_step": 375460, "epoch": 2234} {"train_loss": -12.197328567504883, "global_step": 375461, "epoch": 2234} {"train_loss": -11.522100448608398, "global_step": 375462, "epoch": 2234} {"train_loss": -12.154738426208496, "global_step": 375463, "epoch": 2234} {"train_loss": -11.916608810424805, "global_step": 375464, "epoch": 2234} {"train_loss": -12.282903671264648, "global_step": 375465, "epoch": 2234} {"train_loss": -11.90807819366455, "global_step": 375466, "epoch": 2234} {"train_loss": -11.923849105834961, "global_step": 375467, "epoch": 2234} {"train_loss": -12.274951934814453, "global_step": 375468, "epoch": 2234} {"train_loss": -12.029031753540039, "global_step": 375469, "epoch": 2234} {"train_loss": -12.241764068603516, "global_step": 375470, "epoch": 2234} {"train_loss": -12.140826225280762, "global_step": 375471, "epoch": 2234} {"train_loss": -12.314313888549805, "global_step": 375472, "epoch": 2234} {"train_loss": -11.562904357910156, "global_step": 375473, "epoch": 2234} {"train_loss": -12.096614837646484, "global_step": 375474, "epoch": 2234} {"train_loss": -12.04792594909668, "global_step": 375475, "epoch": 2234} {"train_loss": -12.006394386291504, "global_step": 375476, "epoch": 2234} {"train_loss": -12.611905097961426, "global_step": 375477, "epoch": 2234} {"train_loss": -11.726319313049316, "global_step": 375478, "epoch": 2234} {"train_loss": -11.993084663436527, "global_step": 375479, "epoch": 2234, "val_loss": 289920.3125} {"train_loss": -12.022735595703125, "global_step": 375480, "epoch": 2235} {"train_loss": -12.461282730102539, "global_step": 375481, "epoch": 2235} {"train_loss": -12.400884628295898, "global_step": 375482, "epoch": 2235} {"train_loss": -12.002019882202148, "global_step": 375483, "epoch": 2235} {"train_loss": -12.248592376708984, "global_step": 375484, "epoch": 2235} {"train_loss": -11.882892608642578, "global_step": 375485, "epoch": 2235} {"train_loss": -11.962373733520508, "global_step": 375486, "epoch": 2235} {"train_loss": -12.282527923583984, "global_step": 375487, "epoch": 2235} {"train_loss": -12.31527328491211, "global_step": 375488, "epoch": 2235} {"train_loss": -12.38418197631836, "global_step": 375489, "epoch": 2235} {"train_loss": -12.193209648132324, "global_step": 375490, "epoch": 2235} {"train_loss": -12.451214790344238, "global_step": 375491, "epoch": 2235} {"train_loss": -12.315347671508789, "global_step": 375492, "epoch": 2235} {"train_loss": -12.304495811462402, "global_step": 375493, "epoch": 2235} {"train_loss": -11.895986557006836, "global_step": 375494, "epoch": 2235} {"train_loss": -12.059549331665039, "global_step": 375495, "epoch": 2235} {"train_loss": -11.673966407775879, "global_step": 375496, "epoch": 2235} {"train_loss": -12.191189765930176, "global_step": 375497, "epoch": 2235} {"train_loss": -12.305074691772461, "global_step": 375498, "epoch": 2235} {"train_loss": -11.343254089355469, "global_step": 375499, "epoch": 2235} {"train_loss": -12.453001022338867, "global_step": 375500, "epoch": 2235} {"train_loss": -12.015083312988281, "global_step": 375501, "epoch": 2235} {"train_loss": -12.32789134979248, "global_step": 375502, "epoch": 2235} {"train_loss": -11.918951034545898, "global_step": 375503, "epoch": 2235} {"train_loss": -12.297972679138184, "global_step": 375504, "epoch": 2235} {"train_loss": -12.390893936157227, "global_step": 375505, "epoch": 2235} {"train_loss": -12.28406810760498, "global_step": 375506, "epoch": 2235} {"train_loss": -12.181239128112793, "global_step": 375507, "epoch": 2235} {"train_loss": -11.5779390335083, "global_step": 375508, "epoch": 2235} {"train_loss": -12.288773536682129, "global_step": 375509, "epoch": 2235} {"train_loss": -12.110101699829102, "global_step": 375510, "epoch": 2235} {"train_loss": -11.978706359863281, "global_step": 375511, "epoch": 2235} {"train_loss": -12.271675109863281, "global_step": 375512, "epoch": 2235} {"train_loss": -12.10347843170166, "global_step": 375513, "epoch": 2235} {"train_loss": -12.382242202758789, "global_step": 375514, "epoch": 2235} {"train_loss": -12.418584823608398, "global_step": 375515, "epoch": 2235} {"train_loss": -12.440828323364258, "global_step": 375516, "epoch": 2235} {"train_loss": -12.001524925231934, "global_step": 375517, "epoch": 2235} {"train_loss": -11.732484817504883, "global_step": 375518, "epoch": 2235} {"train_loss": -12.478848457336426, "global_step": 375519, "epoch": 2235} {"train_loss": -11.878122329711914, "global_step": 375520, "epoch": 2235} {"train_loss": -11.013235092163086, "global_step": 375521, "epoch": 2235} {"train_loss": -11.294417381286621, "global_step": 375522, "epoch": 2235} {"train_loss": -11.07258415222168, "global_step": 375523, "epoch": 2235} {"train_loss": -8.583620071411133, "global_step": 375524, "epoch": 2235} {"train_loss": -11.184898376464844, "global_step": 375525, "epoch": 2235} {"train_loss": -9.607152938842773, "global_step": 375526, "epoch": 2235} {"train_loss": -10.26915168762207, "global_step": 375527, "epoch": 2235} {"train_loss": -10.985376358032227, "global_step": 375528, "epoch": 2235} {"train_loss": -9.4202880859375, "global_step": 375529, "epoch": 2235} {"train_loss": -10.882404327392578, "global_step": 375530, "epoch": 2235} {"train_loss": -9.990758895874023, "global_step": 375531, "epoch": 2235} {"train_loss": -10.850390434265137, "global_step": 375532, "epoch": 2235} {"train_loss": -10.124099731445312, "global_step": 375533, "epoch": 2235} {"train_loss": -11.194156646728516, "global_step": 375534, "epoch": 2235} {"train_loss": -10.289143562316895, "global_step": 375535, "epoch": 2235} {"train_loss": -11.601393699645996, "global_step": 375536, "epoch": 2235} {"train_loss": -10.006874084472656, "global_step": 375537, "epoch": 2235} {"train_loss": -10.707356452941895, "global_step": 375538, "epoch": 2235} {"train_loss": -11.454864501953125, "global_step": 375539, "epoch": 2235} {"train_loss": -10.164407730102539, "global_step": 375540, "epoch": 2235} {"train_loss": -11.87363052368164, "global_step": 375541, "epoch": 2235} {"train_loss": -10.233297348022461, "global_step": 375542, "epoch": 2235} {"train_loss": -11.366680145263672, "global_step": 375543, "epoch": 2235} {"train_loss": -11.479074478149414, "global_step": 375544, "epoch": 2235} {"train_loss": -11.290302276611328, "global_step": 375545, "epoch": 2235} {"train_loss": -11.624077796936035, "global_step": 375546, "epoch": 2235} {"train_loss": -11.129304885864258, "global_step": 375547, "epoch": 2235} {"train_loss": -11.145215034484863, "global_step": 375548, "epoch": 2235} {"train_loss": -11.925552368164062, "global_step": 375549, "epoch": 2235} {"train_loss": -11.744707107543945, "global_step": 375550, "epoch": 2235} {"train_loss": -11.270421981811523, "global_step": 375551, "epoch": 2235} {"train_loss": -11.179999351501465, "global_step": 375552, "epoch": 2235} {"train_loss": -10.835271835327148, "global_step": 375553, "epoch": 2235} {"train_loss": -11.736227035522461, "global_step": 375554, "epoch": 2235} {"train_loss": -10.967269897460938, "global_step": 375555, "epoch": 2235} {"train_loss": -11.012641906738281, "global_step": 375556, "epoch": 2235} {"train_loss": -11.359149932861328, "global_step": 375557, "epoch": 2235} {"train_loss": -11.387487411499023, "global_step": 375558, "epoch": 2235} {"train_loss": -10.80338191986084, "global_step": 375559, "epoch": 2235} {"train_loss": -10.793543815612793, "global_step": 375560, "epoch": 2235} {"train_loss": -9.496681213378906, "global_step": 375561, "epoch": 2235} {"train_loss": -10.38508415222168, "global_step": 375562, "epoch": 2235} {"train_loss": -10.180862426757812, "global_step": 375563, "epoch": 2235} {"train_loss": -10.377644538879395, "global_step": 375564, "epoch": 2235} {"train_loss": -10.632415771484375, "global_step": 375565, "epoch": 2235} {"train_loss": -11.031537055969238, "global_step": 375566, "epoch": 2235} {"train_loss": -11.152191162109375, "global_step": 375567, "epoch": 2235} {"train_loss": -10.765153884887695, "global_step": 375568, "epoch": 2235} {"train_loss": -10.696986198425293, "global_step": 375569, "epoch": 2235} {"train_loss": -10.415884017944336, "global_step": 375570, "epoch": 2235} {"train_loss": -11.92393684387207, "global_step": 375571, "epoch": 2235} {"train_loss": -10.344093322753906, "global_step": 375572, "epoch": 2235} {"train_loss": -11.080869674682617, "global_step": 375573, "epoch": 2235} {"train_loss": -10.682222366333008, "global_step": 375574, "epoch": 2235} {"train_loss": -11.532559394836426, "global_step": 375575, "epoch": 2235} {"train_loss": -10.580979347229004, "global_step": 375576, "epoch": 2235} {"train_loss": -11.498802185058594, "global_step": 375577, "epoch": 2235} {"train_loss": -11.187246322631836, "global_step": 375578, "epoch": 2235} {"train_loss": -11.137236595153809, "global_step": 375579, "epoch": 2235} {"train_loss": -11.9680757522583, "global_step": 375580, "epoch": 2235} {"train_loss": -10.95484447479248, "global_step": 375581, "epoch": 2235} {"train_loss": -11.758516311645508, "global_step": 375582, "epoch": 2235} {"train_loss": -10.93458080291748, "global_step": 375583, "epoch": 2235} {"train_loss": -11.079742431640625, "global_step": 375584, "epoch": 2235} {"train_loss": -11.329193115234375, "global_step": 375585, "epoch": 2235} {"train_loss": -11.059465408325195, "global_step": 375586, "epoch": 2235} {"train_loss": -11.607742309570312, "global_step": 375587, "epoch": 2235} {"train_loss": -11.875629425048828, "global_step": 375588, "epoch": 2235} {"train_loss": -11.407670974731445, "global_step": 375589, "epoch": 2235} {"train_loss": -11.557666778564453, "global_step": 375590, "epoch": 2235} {"train_loss": -11.6782865524292, "global_step": 375591, "epoch": 2235} {"train_loss": -10.882603645324707, "global_step": 375592, "epoch": 2235} {"train_loss": -11.651975631713867, "global_step": 375593, "epoch": 2235} {"train_loss": -11.267288208007812, "global_step": 375594, "epoch": 2235} {"train_loss": -11.149478912353516, "global_step": 375595, "epoch": 2235} {"train_loss": -11.454333305358887, "global_step": 375596, "epoch": 2235} {"train_loss": -11.507284164428711, "global_step": 375597, "epoch": 2235} {"train_loss": -11.547866821289062, "global_step": 375598, "epoch": 2235} {"train_loss": -11.485801696777344, "global_step": 375599, "epoch": 2235} {"train_loss": -11.558448791503906, "global_step": 375600, "epoch": 2235} {"train_loss": -11.578325271606445, "global_step": 375601, "epoch": 2235} {"train_loss": -11.299295425415039, "global_step": 375602, "epoch": 2235} {"train_loss": -11.734984397888184, "global_step": 375603, "epoch": 2235} {"train_loss": -11.383814811706543, "global_step": 375604, "epoch": 2235} {"train_loss": -11.297161102294922, "global_step": 375605, "epoch": 2235} {"train_loss": -11.360958099365234, "global_step": 375606, "epoch": 2235} {"train_loss": -11.742572784423828, "global_step": 375607, "epoch": 2235} {"train_loss": -11.335811614990234, "global_step": 375608, "epoch": 2235} {"train_loss": -11.836462020874023, "global_step": 375609, "epoch": 2235} {"train_loss": -11.905524253845215, "global_step": 375610, "epoch": 2235} {"train_loss": -11.77701473236084, "global_step": 375611, "epoch": 2235} {"train_loss": -11.943893432617188, "global_step": 375612, "epoch": 2235} {"train_loss": -11.949697494506836, "global_step": 375613, "epoch": 2235} {"train_loss": -11.888046264648438, "global_step": 375614, "epoch": 2235} {"train_loss": -12.094881057739258, "global_step": 375615, "epoch": 2235} {"train_loss": -11.760791778564453, "global_step": 375616, "epoch": 2235} {"train_loss": -12.048503875732422, "global_step": 375617, "epoch": 2235} {"train_loss": -12.016207695007324, "global_step": 375618, "epoch": 2235} {"train_loss": -12.283234596252441, "global_step": 375619, "epoch": 2235} {"train_loss": -11.939672470092773, "global_step": 375620, "epoch": 2235} {"train_loss": -11.790332794189453, "global_step": 375621, "epoch": 2235} {"train_loss": -12.226296424865723, "global_step": 375622, "epoch": 2235} {"train_loss": -12.114801406860352, "global_step": 375623, "epoch": 2235} {"train_loss": -12.169349670410156, "global_step": 375624, "epoch": 2235} {"train_loss": -12.206587791442871, "global_step": 375625, "epoch": 2235} {"train_loss": -12.222225189208984, "global_step": 375626, "epoch": 2235} {"train_loss": -12.36800765991211, "global_step": 375627, "epoch": 2235} {"train_loss": -12.05827808380127, "global_step": 375628, "epoch": 2235} {"train_loss": -12.04810905456543, "global_step": 375629, "epoch": 2235} {"train_loss": -12.157306671142578, "global_step": 375630, "epoch": 2235} {"train_loss": -11.888049125671387, "global_step": 375631, "epoch": 2235} {"train_loss": -12.242156982421875, "global_step": 375632, "epoch": 2235} {"train_loss": -12.312752723693848, "global_step": 375633, "epoch": 2235} {"train_loss": -12.079492568969727, "global_step": 375634, "epoch": 2235} {"train_loss": -12.317880630493164, "global_step": 375635, "epoch": 2235} {"train_loss": -12.128456115722656, "global_step": 375636, "epoch": 2235} {"train_loss": -12.067143440246582, "global_step": 375637, "epoch": 2235} {"train_loss": -12.408130645751953, "global_step": 375638, "epoch": 2235} {"train_loss": -12.287267684936523, "global_step": 375639, "epoch": 2235} {"train_loss": -12.264667510986328, "global_step": 375640, "epoch": 2235} {"train_loss": -12.169626235961914, "global_step": 375641, "epoch": 2235} {"train_loss": -12.43536376953125, "global_step": 375642, "epoch": 2235} {"train_loss": -12.566719055175781, "global_step": 375643, "epoch": 2235} {"train_loss": -12.45287036895752, "global_step": 375644, "epoch": 2235} {"train_loss": -12.50956916809082, "global_step": 375645, "epoch": 2235} {"train_loss": -12.486705780029297, "global_step": 375646, "epoch": 2235} {"train_loss": -11.569988381294976, "global_step": 375647, "epoch": 2235, "val_loss": 291971.875, "train_action_mse_error": 1.4420117139816284} {"train_loss": -12.25772762298584, "global_step": 375648, "epoch": 2236} {"train_loss": -12.156846046447754, "global_step": 375649, "epoch": 2236} {"train_loss": -12.388886451721191, "global_step": 375650, "epoch": 2236} {"train_loss": -12.244686126708984, "global_step": 375651, "epoch": 2236} {"train_loss": -12.623080253601074, "global_step": 375652, "epoch": 2236} {"train_loss": -12.311948776245117, "global_step": 375653, "epoch": 2236} {"train_loss": -12.477254867553711, "global_step": 375654, "epoch": 2236} {"train_loss": -12.599838256835938, "global_step": 375655, "epoch": 2236} {"train_loss": -12.316354751586914, "global_step": 375656, "epoch": 2236} {"train_loss": -12.266910552978516, "global_step": 375657, "epoch": 2236} {"train_loss": -12.472289085388184, "global_step": 375658, "epoch": 2236} {"train_loss": -12.652116775512695, "global_step": 375659, "epoch": 2236} {"train_loss": -12.642375946044922, "global_step": 375660, "epoch": 2236} {"train_loss": -12.372051239013672, "global_step": 375661, "epoch": 2236} {"train_loss": -12.397754669189453, "global_step": 375662, "epoch": 2236} {"train_loss": -12.33578109741211, "global_step": 375663, "epoch": 2236} {"train_loss": -12.403063774108887, "global_step": 375664, "epoch": 2236} {"train_loss": -12.568623542785645, "global_step": 375665, "epoch": 2236} {"train_loss": -12.611878395080566, "global_step": 375666, "epoch": 2236} {"train_loss": -12.754552841186523, "global_step": 375667, "epoch": 2236} {"train_loss": -12.434613227844238, "global_step": 375668, "epoch": 2236} {"train_loss": -12.096948623657227, "global_step": 375669, "epoch": 2236} {"train_loss": -12.70121955871582, "global_step": 375670, "epoch": 2236} {"train_loss": -12.559446334838867, "global_step": 375671, "epoch": 2236} {"train_loss": -12.44253921508789, "global_step": 375672, "epoch": 2236} {"train_loss": -12.466672897338867, "global_step": 375673, "epoch": 2236} {"train_loss": -12.644953727722168, "global_step": 375674, "epoch": 2236} {"train_loss": -12.570868492126465, "global_step": 375675, "epoch": 2236} {"train_loss": -12.598760604858398, "global_step": 375676, "epoch": 2236} {"train_loss": -12.717903137207031, "global_step": 375677, "epoch": 2236} {"train_loss": -12.734501838684082, "global_step": 375678, "epoch": 2236} {"train_loss": -12.448492050170898, "global_step": 375679, "epoch": 2236} {"train_loss": -12.151697158813477, "global_step": 375680, "epoch": 2236} {"train_loss": -12.601401329040527, "global_step": 375681, "epoch": 2236} {"train_loss": -12.651426315307617, "global_step": 375682, "epoch": 2236} {"train_loss": -12.432960510253906, "global_step": 375683, "epoch": 2236} {"train_loss": -12.846571922302246, "global_step": 375684, "epoch": 2236} {"train_loss": -12.58144760131836, "global_step": 375685, "epoch": 2236} {"train_loss": -12.485006332397461, "global_step": 375686, "epoch": 2236} {"train_loss": -12.394994735717773, "global_step": 375687, "epoch": 2236} {"train_loss": -12.405773162841797, "global_step": 375688, "epoch": 2236} {"train_loss": -12.340831756591797, "global_step": 375689, "epoch": 2236} {"train_loss": -12.445481300354004, "global_step": 375690, "epoch": 2236} {"train_loss": -12.534753799438477, "global_step": 375691, "epoch": 2236} {"train_loss": -12.673178672790527, "global_step": 375692, "epoch": 2236} {"train_loss": -12.677857398986816, "global_step": 375693, "epoch": 2236} {"train_loss": -12.17756175994873, "global_step": 375694, "epoch": 2236} {"train_loss": -12.258232116699219, "global_step": 375695, "epoch": 2236} {"train_loss": -12.680304527282715, "global_step": 375696, "epoch": 2236} {"train_loss": -12.12339973449707, "global_step": 375697, "epoch": 2236} {"train_loss": -12.492683410644531, "global_step": 375698, "epoch": 2236} {"train_loss": -12.46908187866211, "global_step": 375699, "epoch": 2236} {"train_loss": -12.249122619628906, "global_step": 375700, "epoch": 2236} {"train_loss": -12.64105224609375, "global_step": 375701, "epoch": 2236} {"train_loss": -12.382543563842773, "global_step": 375702, "epoch": 2236} {"train_loss": -12.489171981811523, "global_step": 375703, "epoch": 2236} {"train_loss": -12.515135765075684, "global_step": 375704, "epoch": 2236} {"train_loss": -12.054052352905273, "global_step": 375705, "epoch": 2236} {"train_loss": -12.53817367553711, "global_step": 375706, "epoch": 2236} {"train_loss": -12.336450576782227, "global_step": 375707, "epoch": 2236} {"train_loss": -12.679306030273438, "global_step": 375708, "epoch": 2236} {"train_loss": -12.305041313171387, "global_step": 375709, "epoch": 2236} {"train_loss": -12.220357894897461, "global_step": 375710, "epoch": 2236} {"train_loss": -12.363431930541992, "global_step": 375711, "epoch": 2236} {"train_loss": -12.106624603271484, "global_step": 375712, "epoch": 2236} {"train_loss": -11.982365608215332, "global_step": 375713, "epoch": 2236} {"train_loss": -11.920832633972168, "global_step": 375714, "epoch": 2236} {"train_loss": -12.451227188110352, "global_step": 375715, "epoch": 2236} {"train_loss": -12.20084285736084, "global_step": 375716, "epoch": 2236} {"train_loss": -12.303998947143555, "global_step": 375717, "epoch": 2236} {"train_loss": -12.44649887084961, "global_step": 375718, "epoch": 2236} {"train_loss": -12.357812881469727, "global_step": 375719, "epoch": 2236} {"train_loss": -12.507665634155273, "global_step": 375720, "epoch": 2236} {"train_loss": -12.373696327209473, "global_step": 375721, "epoch": 2236} {"train_loss": -12.23515796661377, "global_step": 375722, "epoch": 2236} {"train_loss": -12.009798049926758, "global_step": 375723, "epoch": 2236} {"train_loss": -12.671244621276855, "global_step": 375724, "epoch": 2236} {"train_loss": -12.451112747192383, "global_step": 375725, "epoch": 2236} {"train_loss": -11.822104454040527, "global_step": 375726, "epoch": 2236} {"train_loss": -11.889159202575684, "global_step": 375727, "epoch": 2236} {"train_loss": -12.02498722076416, "global_step": 375728, "epoch": 2236} {"train_loss": -12.090067863464355, "global_step": 375729, "epoch": 2236} {"train_loss": -12.038673400878906, "global_step": 375730, "epoch": 2236} {"train_loss": -12.319782257080078, "global_step": 375731, "epoch": 2236} {"train_loss": -11.834423065185547, "global_step": 375732, "epoch": 2236} {"train_loss": -11.190200805664062, "global_step": 375733, "epoch": 2236} {"train_loss": -12.081337928771973, "global_step": 375734, "epoch": 2236} {"train_loss": -12.378083229064941, "global_step": 375735, "epoch": 2236} {"train_loss": -12.212663650512695, "global_step": 375736, "epoch": 2236} {"train_loss": -11.24246883392334, "global_step": 375737, "epoch": 2236} {"train_loss": -11.21184253692627, "global_step": 375738, "epoch": 2236} {"train_loss": -12.388509750366211, "global_step": 375739, "epoch": 2236} {"train_loss": -11.26832389831543, "global_step": 375740, "epoch": 2236} {"train_loss": -10.940689086914062, "global_step": 375741, "epoch": 2236} {"train_loss": -11.928070068359375, "global_step": 375742, "epoch": 2236} {"train_loss": -12.521249771118164, "global_step": 375743, "epoch": 2236} {"train_loss": -11.381525993347168, "global_step": 375744, "epoch": 2236} {"train_loss": -11.822702407836914, "global_step": 375745, "epoch": 2236} {"train_loss": -12.000001907348633, "global_step": 375746, "epoch": 2236} {"train_loss": -11.678220748901367, "global_step": 375747, "epoch": 2236} {"train_loss": -12.276508331298828, "global_step": 375748, "epoch": 2236} {"train_loss": -11.39111328125, "global_step": 375749, "epoch": 2236} {"train_loss": -11.591967582702637, "global_step": 375750, "epoch": 2236} {"train_loss": -12.10316276550293, "global_step": 375751, "epoch": 2236} {"train_loss": -11.737451553344727, "global_step": 375752, "epoch": 2236} {"train_loss": -10.918632507324219, "global_step": 375753, "epoch": 2236} {"train_loss": -12.215248107910156, "global_step": 375754, "epoch": 2236} {"train_loss": -11.30113410949707, "global_step": 375755, "epoch": 2236} {"train_loss": -11.110376358032227, "global_step": 375756, "epoch": 2236} {"train_loss": -11.840800285339355, "global_step": 375757, "epoch": 2236} {"train_loss": -11.55830192565918, "global_step": 375758, "epoch": 2236} {"train_loss": -11.243850708007812, "global_step": 375759, "epoch": 2236} {"train_loss": -12.23187255859375, "global_step": 375760, "epoch": 2236} {"train_loss": -11.686239242553711, "global_step": 375761, "epoch": 2236} {"train_loss": -11.345453262329102, "global_step": 375762, "epoch": 2236} {"train_loss": -11.782330513000488, "global_step": 375763, "epoch": 2236} {"train_loss": -12.008479118347168, "global_step": 375764, "epoch": 2236} {"train_loss": -11.2058744430542, "global_step": 375765, "epoch": 2236} {"train_loss": -11.533352851867676, "global_step": 375766, "epoch": 2236} {"train_loss": -11.161157608032227, "global_step": 375767, "epoch": 2236} {"train_loss": -11.454408645629883, "global_step": 375768, "epoch": 2236} {"train_loss": -11.682912826538086, "global_step": 375769, "epoch": 2236} {"train_loss": -11.366717338562012, "global_step": 375770, "epoch": 2236} {"train_loss": -11.866128921508789, "global_step": 375771, "epoch": 2236} {"train_loss": -11.440893173217773, "global_step": 375772, "epoch": 2236} {"train_loss": -11.025585174560547, "global_step": 375773, "epoch": 2236} {"train_loss": -11.852737426757812, "global_step": 375774, "epoch": 2236} {"train_loss": -11.077070236206055, "global_step": 375775, "epoch": 2236} {"train_loss": -12.422134399414062, "global_step": 375776, "epoch": 2236} {"train_loss": -11.32040786743164, "global_step": 375777, "epoch": 2236} {"train_loss": -11.615118026733398, "global_step": 375778, "epoch": 2236} {"train_loss": -12.013175964355469, "global_step": 375779, "epoch": 2236} {"train_loss": -10.803197860717773, "global_step": 375780, "epoch": 2236} {"train_loss": -11.89590072631836, "global_step": 375781, "epoch": 2236} {"train_loss": -11.098098754882812, "global_step": 375782, "epoch": 2236} {"train_loss": -11.624466896057129, "global_step": 375783, "epoch": 2236} {"train_loss": -11.511786460876465, "global_step": 375784, "epoch": 2236} {"train_loss": -11.680977821350098, "global_step": 375785, "epoch": 2236} {"train_loss": -11.326215744018555, "global_step": 375786, "epoch": 2236} {"train_loss": -11.013814926147461, "global_step": 375787, "epoch": 2236} {"train_loss": -10.671737670898438, "global_step": 375788, "epoch": 2236} {"train_loss": -11.411829948425293, "global_step": 375789, "epoch": 2236} {"train_loss": -11.145471572875977, "global_step": 375790, "epoch": 2236} {"train_loss": -11.61468505859375, "global_step": 375791, "epoch": 2236} {"train_loss": -11.507940292358398, "global_step": 375792, "epoch": 2236} {"train_loss": -11.760089874267578, "global_step": 375793, "epoch": 2236} {"train_loss": -10.532392501831055, "global_step": 375794, "epoch": 2236} {"train_loss": -11.441916465759277, "global_step": 375795, "epoch": 2236} {"train_loss": -11.292522430419922, "global_step": 375796, "epoch": 2236} {"train_loss": -11.60562801361084, "global_step": 375797, "epoch": 2236} {"train_loss": -11.439345359802246, "global_step": 375798, "epoch": 2236} {"train_loss": -12.301600456237793, "global_step": 375799, "epoch": 2236} {"train_loss": -10.975492477416992, "global_step": 375800, "epoch": 2236} {"train_loss": -11.955158233642578, "global_step": 375801, "epoch": 2236} {"train_loss": -11.719427108764648, "global_step": 375802, "epoch": 2236} {"train_loss": -11.372161865234375, "global_step": 375803, "epoch": 2236} {"train_loss": -11.741168022155762, "global_step": 375804, "epoch": 2236} {"train_loss": -10.822135925292969, "global_step": 375805, "epoch": 2236} {"train_loss": -11.874404907226562, "global_step": 375806, "epoch": 2236} {"train_loss": -11.730855941772461, "global_step": 375807, "epoch": 2236} {"train_loss": -12.021904945373535, "global_step": 375808, "epoch": 2236} {"train_loss": -11.595130920410156, "global_step": 375809, "epoch": 2236} {"train_loss": -11.952421188354492, "global_step": 375810, "epoch": 2236} {"train_loss": -11.711283683776855, "global_step": 375811, "epoch": 2236} {"train_loss": -12.16236686706543, "global_step": 375812, "epoch": 2236} {"train_loss": -12.198622703552246, "global_step": 375813, "epoch": 2236} {"train_loss": -12.080606460571289, "global_step": 375814, "epoch": 2236} {"train_loss": -12.003150661786398, "global_step": 375815, "epoch": 2236, "val_loss": 293117.3125} {"train_loss": -12.216519355773926, "global_step": 375816, "epoch": 2237} {"train_loss": -11.883158683776855, "global_step": 375817, "epoch": 2237} {"train_loss": -12.257139205932617, "global_step": 375818, "epoch": 2237} {"train_loss": -12.174027442932129, "global_step": 375819, "epoch": 2237} {"train_loss": -12.066360473632812, "global_step": 375820, "epoch": 2237} {"train_loss": -12.220667839050293, "global_step": 375821, "epoch": 2237} {"train_loss": -12.137208938598633, "global_step": 375822, "epoch": 2237} {"train_loss": -12.37059497833252, "global_step": 375823, "epoch": 2237} {"train_loss": -12.27673625946045, "global_step": 375824, "epoch": 2237} {"train_loss": -12.066012382507324, "global_step": 375825, "epoch": 2237} {"train_loss": -12.189510345458984, "global_step": 375826, "epoch": 2237} {"train_loss": -11.94830322265625, "global_step": 375827, "epoch": 2237} {"train_loss": -12.40256118774414, "global_step": 375828, "epoch": 2237} {"train_loss": -11.565587997436523, "global_step": 375829, "epoch": 2237} {"train_loss": -12.468877792358398, "global_step": 375830, "epoch": 2237} {"train_loss": -12.036088943481445, "global_step": 375831, "epoch": 2237} {"train_loss": -12.175036430358887, "global_step": 375832, "epoch": 2237} {"train_loss": -12.151311874389648, "global_step": 375833, "epoch": 2237} {"train_loss": -11.989160537719727, "global_step": 375834, "epoch": 2237} {"train_loss": -12.361370086669922, "global_step": 375835, "epoch": 2237} {"train_loss": -11.857748985290527, "global_step": 375836, "epoch": 2237} {"train_loss": -11.819607734680176, "global_step": 375837, "epoch": 2237} {"train_loss": -11.881294250488281, "global_step": 375838, "epoch": 2237} {"train_loss": -12.270482063293457, "global_step": 375839, "epoch": 2237} {"train_loss": -12.119998931884766, "global_step": 375840, "epoch": 2237} {"train_loss": -12.188837051391602, "global_step": 375841, "epoch": 2237} {"train_loss": -12.390809059143066, "global_step": 375842, "epoch": 2237} {"train_loss": -12.413442611694336, "global_step": 375843, "epoch": 2237} {"train_loss": -12.171487808227539, "global_step": 375844, "epoch": 2237} {"train_loss": -12.444558143615723, "global_step": 375845, "epoch": 2237} {"train_loss": -12.268470764160156, "global_step": 375846, "epoch": 2237} {"train_loss": -12.260053634643555, "global_step": 375847, "epoch": 2237} {"train_loss": -12.186151504516602, "global_step": 375848, "epoch": 2237} {"train_loss": -12.439750671386719, "global_step": 375849, "epoch": 2237} {"train_loss": -12.304311752319336, "global_step": 375850, "epoch": 2237} {"train_loss": -12.23881721496582, "global_step": 375851, "epoch": 2237} {"train_loss": -12.353797912597656, "global_step": 375852, "epoch": 2237} {"train_loss": -12.420673370361328, "global_step": 375853, "epoch": 2237} {"train_loss": -12.014236450195312, "global_step": 375854, "epoch": 2237} {"train_loss": -12.294208526611328, "global_step": 375855, "epoch": 2237} {"train_loss": -11.990121841430664, "global_step": 375856, "epoch": 2237} {"train_loss": -11.443859100341797, "global_step": 375857, "epoch": 2237} {"train_loss": -12.15644359588623, "global_step": 375858, "epoch": 2237} {"train_loss": -11.253721237182617, "global_step": 375859, "epoch": 2237} {"train_loss": -12.624016761779785, "global_step": 375860, "epoch": 2237} {"train_loss": -11.822507858276367, "global_step": 375861, "epoch": 2237} {"train_loss": -11.877578735351562, "global_step": 375862, "epoch": 2237} {"train_loss": -12.22146987915039, "global_step": 375863, "epoch": 2237} {"train_loss": -11.92568588256836, "global_step": 375864, "epoch": 2237} {"train_loss": -12.602632522583008, "global_step": 375865, "epoch": 2237} {"train_loss": -11.917282104492188, "global_step": 375866, "epoch": 2237} {"train_loss": -12.327330589294434, "global_step": 375867, "epoch": 2237} {"train_loss": -12.222982406616211, "global_step": 375868, "epoch": 2237} {"train_loss": -12.145503044128418, "global_step": 375869, "epoch": 2237} {"train_loss": -12.419672966003418, "global_step": 375870, "epoch": 2237} {"train_loss": -12.350957870483398, "global_step": 375871, "epoch": 2237} {"train_loss": -12.721059799194336, "global_step": 375872, "epoch": 2237} {"train_loss": -12.418109893798828, "global_step": 375873, "epoch": 2237} {"train_loss": -12.696952819824219, "global_step": 375874, "epoch": 2237} {"train_loss": -12.460745811462402, "global_step": 375875, "epoch": 2237} {"train_loss": -12.362800598144531, "global_step": 375876, "epoch": 2237} {"train_loss": -12.786397933959961, "global_step": 375877, "epoch": 2237} {"train_loss": -12.309503555297852, "global_step": 375878, "epoch": 2237} {"train_loss": -12.445852279663086, "global_step": 375879, "epoch": 2237} {"train_loss": -12.20644760131836, "global_step": 375880, "epoch": 2237} {"train_loss": -12.37166976928711, "global_step": 375881, "epoch": 2237} {"train_loss": -12.095800399780273, "global_step": 375882, "epoch": 2237} {"train_loss": -12.379009246826172, "global_step": 375883, "epoch": 2237} {"train_loss": -12.477582931518555, "global_step": 375884, "epoch": 2237} {"train_loss": -12.290209770202637, "global_step": 375885, "epoch": 2237} {"train_loss": -12.366739273071289, "global_step": 375886, "epoch": 2237} {"train_loss": -12.490697860717773, "global_step": 375887, "epoch": 2237} {"train_loss": -12.343070983886719, "global_step": 375888, "epoch": 2237} {"train_loss": -12.433843612670898, "global_step": 375889, "epoch": 2237} {"train_loss": -12.310417175292969, "global_step": 375890, "epoch": 2237} {"train_loss": -12.29230785369873, "global_step": 375891, "epoch": 2237} {"train_loss": -11.980606079101562, "global_step": 375892, "epoch": 2237} {"train_loss": -12.019523620605469, "global_step": 375893, "epoch": 2237} {"train_loss": -11.928683280944824, "global_step": 375894, "epoch": 2237} {"train_loss": -10.25500774383545, "global_step": 375895, "epoch": 2237} {"train_loss": -11.867103576660156, "global_step": 375896, "epoch": 2237} {"train_loss": -12.252033233642578, "global_step": 375897, "epoch": 2237} {"train_loss": -10.725105285644531, "global_step": 375898, "epoch": 2237} {"train_loss": -11.083529472351074, "global_step": 375899, "epoch": 2237} {"train_loss": -12.280027389526367, "global_step": 375900, "epoch": 2237} {"train_loss": -10.883323669433594, "global_step": 375901, "epoch": 2237} {"train_loss": -11.43307876586914, "global_step": 375902, "epoch": 2237} {"train_loss": -12.046947479248047, "global_step": 375903, "epoch": 2237} {"train_loss": -9.96762752532959, "global_step": 375904, "epoch": 2237} {"train_loss": -11.13751220703125, "global_step": 375905, "epoch": 2237} {"train_loss": -12.512544631958008, "global_step": 375906, "epoch": 2237} {"train_loss": -11.294050216674805, "global_step": 375907, "epoch": 2237} {"train_loss": -11.512533187866211, "global_step": 375908, "epoch": 2237} {"train_loss": -12.064006805419922, "global_step": 375909, "epoch": 2237} {"train_loss": -11.89516830444336, "global_step": 375910, "epoch": 2237} {"train_loss": -11.655182838439941, "global_step": 375911, "epoch": 2237} {"train_loss": -12.317132949829102, "global_step": 375912, "epoch": 2237} {"train_loss": -12.30748462677002, "global_step": 375913, "epoch": 2237} {"train_loss": -12.14107894897461, "global_step": 375914, "epoch": 2237} {"train_loss": -11.903179168701172, "global_step": 375915, "epoch": 2237} {"train_loss": -12.546758651733398, "global_step": 375916, "epoch": 2237} {"train_loss": -12.452251434326172, "global_step": 375917, "epoch": 2237} {"train_loss": -12.286951065063477, "global_step": 375918, "epoch": 2237} {"train_loss": -12.45545768737793, "global_step": 375919, "epoch": 2237} {"train_loss": -12.616909980773926, "global_step": 375920, "epoch": 2237} {"train_loss": -12.402185440063477, "global_step": 375921, "epoch": 2237} {"train_loss": -12.24264907836914, "global_step": 375922, "epoch": 2237} {"train_loss": -12.04731273651123, "global_step": 375923, "epoch": 2237} {"train_loss": -12.700346946716309, "global_step": 375924, "epoch": 2237} {"train_loss": -12.043083190917969, "global_step": 375925, "epoch": 2237} {"train_loss": -11.599159240722656, "global_step": 375926, "epoch": 2237} {"train_loss": -12.5855712890625, "global_step": 375927, "epoch": 2237} {"train_loss": -11.797039031982422, "global_step": 375928, "epoch": 2237} {"train_loss": -12.043001174926758, "global_step": 375929, "epoch": 2237} {"train_loss": -12.038056373596191, "global_step": 375930, "epoch": 2237} {"train_loss": -12.292427062988281, "global_step": 375931, "epoch": 2237} {"train_loss": -12.245386123657227, "global_step": 375932, "epoch": 2237} {"train_loss": -12.163557052612305, "global_step": 375933, "epoch": 2237} {"train_loss": -12.542920112609863, "global_step": 375934, "epoch": 2237} {"train_loss": -12.43026351928711, "global_step": 375935, "epoch": 2237} {"train_loss": -12.328288078308105, "global_step": 375936, "epoch": 2237} {"train_loss": -12.557328224182129, "global_step": 375937, "epoch": 2237} {"train_loss": -12.279875755310059, "global_step": 375938, "epoch": 2237} {"train_loss": -12.390838623046875, "global_step": 375939, "epoch": 2237} {"train_loss": -11.988618850708008, "global_step": 375940, "epoch": 2237} {"train_loss": -12.487421989440918, "global_step": 375941, "epoch": 2237} {"train_loss": -12.431358337402344, "global_step": 375942, "epoch": 2237} {"train_loss": -12.015210151672363, "global_step": 375943, "epoch": 2237} {"train_loss": -11.58011245727539, "global_step": 375944, "epoch": 2237} {"train_loss": -12.461584091186523, "global_step": 375945, "epoch": 2237} {"train_loss": -11.118561744689941, "global_step": 375946, "epoch": 2237} {"train_loss": -12.384248733520508, "global_step": 375947, "epoch": 2237} {"train_loss": -11.273114204406738, "global_step": 375948, "epoch": 2237} {"train_loss": -11.360298156738281, "global_step": 375949, "epoch": 2237} {"train_loss": -12.135415077209473, "global_step": 375950, "epoch": 2237} {"train_loss": -12.024299621582031, "global_step": 375951, "epoch": 2237} {"train_loss": -11.845863342285156, "global_step": 375952, "epoch": 2237} {"train_loss": -12.385393142700195, "global_step": 375953, "epoch": 2237} {"train_loss": -11.967140197753906, "global_step": 375954, "epoch": 2237} {"train_loss": -12.083209991455078, "global_step": 375955, "epoch": 2237} {"train_loss": -11.876049041748047, "global_step": 375956, "epoch": 2237} {"train_loss": -12.10392951965332, "global_step": 375957, "epoch": 2237} {"train_loss": -12.128028869628906, "global_step": 375958, "epoch": 2237} {"train_loss": -12.083996772766113, "global_step": 375959, "epoch": 2237} {"train_loss": -12.438458442687988, "global_step": 375960, "epoch": 2237} {"train_loss": -11.853875160217285, "global_step": 375961, "epoch": 2237} {"train_loss": -12.199634552001953, "global_step": 375962, "epoch": 2237} {"train_loss": -11.784392356872559, "global_step": 375963, "epoch": 2237} {"train_loss": -11.665671348571777, "global_step": 375964, "epoch": 2237} {"train_loss": -11.933813095092773, "global_step": 375965, "epoch": 2237} {"train_loss": -11.420723915100098, "global_step": 375966, "epoch": 2237} {"train_loss": -11.758927345275879, "global_step": 375967, "epoch": 2237} {"train_loss": -12.419045448303223, "global_step": 375968, "epoch": 2237} {"train_loss": -11.773897171020508, "global_step": 375969, "epoch": 2237} {"train_loss": -12.157413482666016, "global_step": 375970, "epoch": 2237} {"train_loss": -12.187918663024902, "global_step": 375971, "epoch": 2237} {"train_loss": -11.663776397705078, "global_step": 375972, "epoch": 2237} {"train_loss": -11.880500793457031, "global_step": 375973, "epoch": 2237} {"train_loss": -12.579012870788574, "global_step": 375974, "epoch": 2237} {"train_loss": -12.324687957763672, "global_step": 375975, "epoch": 2237} {"train_loss": -12.402153015136719, "global_step": 375976, "epoch": 2237} {"train_loss": -12.297663688659668, "global_step": 375977, "epoch": 2237} {"train_loss": -12.46625804901123, "global_step": 375978, "epoch": 2237} {"train_loss": -12.498058319091797, "global_step": 375979, "epoch": 2237} {"train_loss": -12.464969635009766, "global_step": 375980, "epoch": 2237} {"train_loss": -12.178082466125488, "global_step": 375981, "epoch": 2237} {"train_loss": -12.602031707763672, "global_step": 375982, "epoch": 2237} {"train_loss": -12.110668085870289, "global_step": 375983, "epoch": 2237, "val_loss": 294202.0625} {"train_loss": -12.48957633972168, "global_step": 375984, "epoch": 2238} {"train_loss": -12.529552459716797, "global_step": 375985, "epoch": 2238} {"train_loss": -12.637609481811523, "global_step": 375986, "epoch": 2238} {"train_loss": -12.415077209472656, "global_step": 375987, "epoch": 2238} {"train_loss": -12.580801963806152, "global_step": 375988, "epoch": 2238} {"train_loss": -12.581119537353516, "global_step": 375989, "epoch": 2238} {"train_loss": -12.506689071655273, "global_step": 375990, "epoch": 2238} {"train_loss": -12.477593421936035, "global_step": 375991, "epoch": 2238} {"train_loss": -12.155050277709961, "global_step": 375992, "epoch": 2238} {"train_loss": -12.189803123474121, "global_step": 375993, "epoch": 2238} {"train_loss": -12.45130443572998, "global_step": 375994, "epoch": 2238} {"train_loss": -12.330066680908203, "global_step": 375995, "epoch": 2238} {"train_loss": -12.429582595825195, "global_step": 375996, "epoch": 2238} {"train_loss": -12.071911811828613, "global_step": 375997, "epoch": 2238} {"train_loss": -12.163249969482422, "global_step": 375998, "epoch": 2238} {"train_loss": -12.577938079833984, "global_step": 375999, "epoch": 2238} {"train_loss": -11.85992431640625, "global_step": 376000, "epoch": 2238} {"train_loss": -12.644500732421875, "global_step": 376001, "epoch": 2238} {"train_loss": -11.721189498901367, "global_step": 376002, "epoch": 2238} {"train_loss": -12.623355865478516, "global_step": 376003, "epoch": 2238} {"train_loss": -12.411369323730469, "global_step": 376004, "epoch": 2238} {"train_loss": -12.772113800048828, "global_step": 376005, "epoch": 2238} {"train_loss": -12.37722396850586, "global_step": 376006, "epoch": 2238} {"train_loss": -12.554884910583496, "global_step": 376007, "epoch": 2238} {"train_loss": -12.560449600219727, "global_step": 376008, "epoch": 2238} {"train_loss": -12.328824043273926, "global_step": 376009, "epoch": 2238} {"train_loss": -12.339803695678711, "global_step": 376010, "epoch": 2238} {"train_loss": -12.604369163513184, "global_step": 376011, "epoch": 2238} {"train_loss": -12.620524406433105, "global_step": 376012, "epoch": 2238} {"train_loss": -12.577025413513184, "global_step": 376013, "epoch": 2238} {"train_loss": -12.611272811889648, "global_step": 376014, "epoch": 2238} {"train_loss": -12.716360092163086, "global_step": 376015, "epoch": 2238} {"train_loss": -12.871370315551758, "global_step": 376016, "epoch": 2238} {"train_loss": -12.587688446044922, "global_step": 376017, "epoch": 2238} {"train_loss": -12.612030029296875, "global_step": 376018, "epoch": 2238} {"train_loss": -12.65198802947998, "global_step": 376019, "epoch": 2238} {"train_loss": -12.664908409118652, "global_step": 376020, "epoch": 2238} {"train_loss": -12.37783432006836, "global_step": 376021, "epoch": 2238} {"train_loss": -12.339515686035156, "global_step": 376022, "epoch": 2238} {"train_loss": -12.715030670166016, "global_step": 376023, "epoch": 2238} {"train_loss": -12.358394622802734, "global_step": 376024, "epoch": 2238} {"train_loss": -11.921306610107422, "global_step": 376025, "epoch": 2238} {"train_loss": -12.359018325805664, "global_step": 376026, "epoch": 2238} {"train_loss": -12.776412963867188, "global_step": 376027, "epoch": 2238} {"train_loss": -12.397117614746094, "global_step": 376028, "epoch": 2238} {"train_loss": -12.309696197509766, "global_step": 376029, "epoch": 2238} {"train_loss": -12.41763687133789, "global_step": 376030, "epoch": 2238} {"train_loss": -12.467195510864258, "global_step": 376031, "epoch": 2238} {"train_loss": -12.505624771118164, "global_step": 376032, "epoch": 2238} {"train_loss": -12.000792503356934, "global_step": 376033, "epoch": 2238} {"train_loss": -12.036225318908691, "global_step": 376034, "epoch": 2238} {"train_loss": -11.983160018920898, "global_step": 376035, "epoch": 2238} {"train_loss": -12.26347541809082, "global_step": 376036, "epoch": 2238} {"train_loss": -12.584945678710938, "global_step": 376037, "epoch": 2238} {"train_loss": -12.245185852050781, "global_step": 376038, "epoch": 2238} {"train_loss": -11.966487884521484, "global_step": 376039, "epoch": 2238} {"train_loss": -12.306982040405273, "global_step": 376040, "epoch": 2238} {"train_loss": -11.99582576751709, "global_step": 376041, "epoch": 2238} {"train_loss": -12.019998550415039, "global_step": 376042, "epoch": 2238} {"train_loss": -12.180709838867188, "global_step": 376043, "epoch": 2238} {"train_loss": -10.979777336120605, "global_step": 376044, "epoch": 2238} {"train_loss": -10.34895133972168, "global_step": 376045, "epoch": 2238} {"train_loss": -11.661433219909668, "global_step": 376046, "epoch": 2238} {"train_loss": -9.244771957397461, "global_step": 376047, "epoch": 2238} {"train_loss": -8.167673110961914, "global_step": 376048, "epoch": 2238} {"train_loss": -9.561140060424805, "global_step": 376049, "epoch": 2238} {"train_loss": -10.250345230102539, "global_step": 376050, "epoch": 2238} {"train_loss": -7.5885009765625, "global_step": 376051, "epoch": 2238} {"train_loss": -6.155501842498779, "global_step": 376052, "epoch": 2238} {"train_loss": -7.3670654296875, "global_step": 376053, "epoch": 2238} {"train_loss": -7.039012908935547, "global_step": 376054, "epoch": 2238} {"train_loss": -6.747531414031982, "global_step": 376055, "epoch": 2238} {"train_loss": -7.15413761138916, "global_step": 376056, "epoch": 2238} {"train_loss": -7.318826675415039, "global_step": 376057, "epoch": 2238} {"train_loss": -7.203843116760254, "global_step": 376058, "epoch": 2238} {"train_loss": -8.688587188720703, "global_step": 376059, "epoch": 2238} {"train_loss": -8.603403091430664, "global_step": 376060, "epoch": 2238} {"train_loss": -8.228372573852539, "global_step": 376061, "epoch": 2238} {"train_loss": -7.897556304931641, "global_step": 376062, "epoch": 2238} {"train_loss": -7.844505310058594, "global_step": 376063, "epoch": 2238} {"train_loss": -9.310117721557617, "global_step": 376064, "epoch": 2238} {"train_loss": -8.36444091796875, "global_step": 376065, "epoch": 2238} {"train_loss": -9.1314115524292, "global_step": 376066, "epoch": 2238} {"train_loss": -9.485085487365723, "global_step": 376067, "epoch": 2238} {"train_loss": -9.790464401245117, "global_step": 376068, "epoch": 2238} {"train_loss": -9.771809577941895, "global_step": 376069, "epoch": 2238} {"train_loss": -10.320586204528809, "global_step": 376070, "epoch": 2238} {"train_loss": -10.101648330688477, "global_step": 376071, "epoch": 2238} {"train_loss": -10.041543960571289, "global_step": 376072, "epoch": 2238} {"train_loss": -10.793915748596191, "global_step": 376073, "epoch": 2238} {"train_loss": -10.747629165649414, "global_step": 376074, "epoch": 2238} {"train_loss": -10.445775032043457, "global_step": 376075, "epoch": 2238} {"train_loss": -11.15923023223877, "global_step": 376076, "epoch": 2238} {"train_loss": -10.414663314819336, "global_step": 376077, "epoch": 2238} {"train_loss": -11.209457397460938, "global_step": 376078, "epoch": 2238} {"train_loss": -10.53482437133789, "global_step": 376079, "epoch": 2238} {"train_loss": -10.625194549560547, "global_step": 376080, "epoch": 2238} {"train_loss": -10.221593856811523, "global_step": 376081, "epoch": 2238} {"train_loss": -10.709920883178711, "global_step": 376082, "epoch": 2238} {"train_loss": -10.374046325683594, "global_step": 376083, "epoch": 2238} {"train_loss": -11.04716682434082, "global_step": 376084, "epoch": 2238} {"train_loss": -10.584916114807129, "global_step": 376085, "epoch": 2238} {"train_loss": -11.391389846801758, "global_step": 376086, "epoch": 2238} {"train_loss": -10.511619567871094, "global_step": 376087, "epoch": 2238} {"train_loss": -10.94339656829834, "global_step": 376088, "epoch": 2238} {"train_loss": -10.85593318939209, "global_step": 376089, "epoch": 2238} {"train_loss": -10.77711296081543, "global_step": 376090, "epoch": 2238} {"train_loss": -11.526782035827637, "global_step": 376091, "epoch": 2238} {"train_loss": -10.489290237426758, "global_step": 376092, "epoch": 2238} {"train_loss": -10.944554328918457, "global_step": 376093, "epoch": 2238} {"train_loss": -11.612232208251953, "global_step": 376094, "epoch": 2238} {"train_loss": -10.775869369506836, "global_step": 376095, "epoch": 2238} {"train_loss": -11.08405590057373, "global_step": 376096, "epoch": 2238} {"train_loss": -11.515653610229492, "global_step": 376097, "epoch": 2238} {"train_loss": -11.162623405456543, "global_step": 376098, "epoch": 2238} {"train_loss": -10.953330993652344, "global_step": 376099, "epoch": 2238} {"train_loss": -11.395376205444336, "global_step": 376100, "epoch": 2238} {"train_loss": -11.130332946777344, "global_step": 376101, "epoch": 2238} {"train_loss": -11.931699752807617, "global_step": 376102, "epoch": 2238} {"train_loss": -11.485954284667969, "global_step": 376103, "epoch": 2238} {"train_loss": -11.713848114013672, "global_step": 376104, "epoch": 2238} {"train_loss": -11.817523956298828, "global_step": 376105, "epoch": 2238} {"train_loss": -11.463226318359375, "global_step": 376106, "epoch": 2238} {"train_loss": -11.643180847167969, "global_step": 376107, "epoch": 2238} {"train_loss": -11.95616340637207, "global_step": 376108, "epoch": 2238} {"train_loss": -11.544822692871094, "global_step": 376109, "epoch": 2238} {"train_loss": -11.923596382141113, "global_step": 376110, "epoch": 2238} {"train_loss": -11.629657745361328, "global_step": 376111, "epoch": 2238} {"train_loss": -11.797947883605957, "global_step": 376112, "epoch": 2238} {"train_loss": -11.782123565673828, "global_step": 376113, "epoch": 2238} {"train_loss": -12.084672927856445, "global_step": 376114, "epoch": 2238} {"train_loss": -11.625114440917969, "global_step": 376115, "epoch": 2238} {"train_loss": -12.067525863647461, "global_step": 376116, "epoch": 2238} {"train_loss": -11.714759826660156, "global_step": 376117, "epoch": 2238} {"train_loss": -11.829692840576172, "global_step": 376118, "epoch": 2238} {"train_loss": -12.069046020507812, "global_step": 376119, "epoch": 2238} {"train_loss": -11.767950057983398, "global_step": 376120, "epoch": 2238} {"train_loss": -11.911317825317383, "global_step": 376121, "epoch": 2238} {"train_loss": -11.860044479370117, "global_step": 376122, "epoch": 2238} {"train_loss": -11.911579132080078, "global_step": 376123, "epoch": 2238} {"train_loss": -12.041438102722168, "global_step": 376124, "epoch": 2238} {"train_loss": -12.14042854309082, "global_step": 376125, "epoch": 2238} {"train_loss": -11.890360832214355, "global_step": 376126, "epoch": 2238} {"train_loss": -12.190019607543945, "global_step": 376127, "epoch": 2238} {"train_loss": -11.558185577392578, "global_step": 376128, "epoch": 2238} {"train_loss": -12.260011672973633, "global_step": 376129, "epoch": 2238} {"train_loss": -11.832962989807129, "global_step": 376130, "epoch": 2238} {"train_loss": -12.058633804321289, "global_step": 376131, "epoch": 2238} {"train_loss": -12.196739196777344, "global_step": 376132, "epoch": 2238} {"train_loss": -11.917367935180664, "global_step": 376133, "epoch": 2238} {"train_loss": -12.035001754760742, "global_step": 376134, "epoch": 2238} {"train_loss": -11.657402038574219, "global_step": 376135, "epoch": 2238} {"train_loss": -12.095964431762695, "global_step": 376136, "epoch": 2238} {"train_loss": -12.155460357666016, "global_step": 376137, "epoch": 2238} {"train_loss": -11.968915939331055, "global_step": 376138, "epoch": 2238} {"train_loss": -11.872149467468262, "global_step": 376139, "epoch": 2238} {"train_loss": -12.108185768127441, "global_step": 376140, "epoch": 2238} {"train_loss": -12.50389575958252, "global_step": 376141, "epoch": 2238} {"train_loss": -12.133383750915527, "global_step": 376142, "epoch": 2238} {"train_loss": -12.336858749389648, "global_step": 376143, "epoch": 2238} {"train_loss": -12.363162994384766, "global_step": 376144, "epoch": 2238} {"train_loss": -12.270092010498047, "global_step": 376145, "epoch": 2238} {"train_loss": -12.117181777954102, "global_step": 376146, "epoch": 2238} {"train_loss": -11.921226501464844, "global_step": 376147, "epoch": 2238} {"train_loss": -12.36744499206543, "global_step": 376148, "epoch": 2238} {"train_loss": -12.031156539916992, "global_step": 376149, "epoch": 2238} {"train_loss": -12.481801986694336, "global_step": 376150, "epoch": 2238} {"train_loss": -11.382680552346367, "global_step": 376151, "epoch": 2238, "val_loss": 290273.25} {"train_loss": -12.019033432006836, "global_step": 376152, "epoch": 2239} {"train_loss": -12.549497604370117, "global_step": 376153, "epoch": 2239} {"train_loss": -12.237201690673828, "global_step": 376154, "epoch": 2239} {"train_loss": -12.390880584716797, "global_step": 376155, "epoch": 2239} {"train_loss": -12.31491470336914, "global_step": 376156, "epoch": 2239} {"train_loss": -12.320596694946289, "global_step": 376157, "epoch": 2239} {"train_loss": -12.617341995239258, "global_step": 376158, "epoch": 2239} {"train_loss": -12.208653450012207, "global_step": 376159, "epoch": 2239} {"train_loss": -12.504610061645508, "global_step": 376160, "epoch": 2239} {"train_loss": -12.467679023742676, "global_step": 376161, "epoch": 2239} {"train_loss": -12.248533248901367, "global_step": 376162, "epoch": 2239} {"train_loss": -12.520195007324219, "global_step": 376163, "epoch": 2239} {"train_loss": -12.354114532470703, "global_step": 376164, "epoch": 2239} {"train_loss": -12.602510452270508, "global_step": 376165, "epoch": 2239} {"train_loss": -12.60000991821289, "global_step": 376166, "epoch": 2239} {"train_loss": -12.392889976501465, "global_step": 376167, "epoch": 2239} {"train_loss": -12.379865646362305, "global_step": 376168, "epoch": 2239} {"train_loss": -12.421004295349121, "global_step": 376169, "epoch": 2239} {"train_loss": -12.510763168334961, "global_step": 376170, "epoch": 2239} {"train_loss": -12.403406143188477, "global_step": 376171, "epoch": 2239} {"train_loss": -12.487468719482422, "global_step": 376172, "epoch": 2239} {"train_loss": -12.25230598449707, "global_step": 376173, "epoch": 2239} {"train_loss": -12.392288208007812, "global_step": 376174, "epoch": 2239} {"train_loss": -12.113224029541016, "global_step": 376175, "epoch": 2239} {"train_loss": -12.106124877929688, "global_step": 376176, "epoch": 2239} {"train_loss": -12.563015937805176, "global_step": 376177, "epoch": 2239} {"train_loss": -11.90080738067627, "global_step": 376178, "epoch": 2239} {"train_loss": -12.52389144897461, "global_step": 376179, "epoch": 2239} {"train_loss": -12.39793586730957, "global_step": 376180, "epoch": 2239} {"train_loss": -12.322296142578125, "global_step": 376181, "epoch": 2239} {"train_loss": -12.273648262023926, "global_step": 376182, "epoch": 2239} {"train_loss": -12.629304885864258, "global_step": 376183, "epoch": 2239} {"train_loss": -12.139802932739258, "global_step": 376184, "epoch": 2239} {"train_loss": -12.282123565673828, "global_step": 376185, "epoch": 2239} {"train_loss": -11.896347045898438, "global_step": 376186, "epoch": 2239} {"train_loss": -12.50804328918457, "global_step": 376187, "epoch": 2239} {"train_loss": -12.355262756347656, "global_step": 376188, "epoch": 2239} {"train_loss": -12.368688583374023, "global_step": 376189, "epoch": 2239} {"train_loss": -12.465048789978027, "global_step": 376190, "epoch": 2239} {"train_loss": -12.064687728881836, "global_step": 376191, "epoch": 2239} {"train_loss": -12.70059585571289, "global_step": 376192, "epoch": 2239} {"train_loss": -12.474184036254883, "global_step": 376193, "epoch": 2239} {"train_loss": -12.235345840454102, "global_step": 376194, "epoch": 2239} {"train_loss": -12.541006088256836, "global_step": 376195, "epoch": 2239} {"train_loss": -12.284525871276855, "global_step": 376196, "epoch": 2239} {"train_loss": -11.906160354614258, "global_step": 376197, "epoch": 2239} {"train_loss": -12.321020126342773, "global_step": 376198, "epoch": 2239} {"train_loss": -12.682451248168945, "global_step": 376199, "epoch": 2239} {"train_loss": -12.228869438171387, "global_step": 376200, "epoch": 2239} {"train_loss": -12.293828964233398, "global_step": 376201, "epoch": 2239} {"train_loss": -12.47390365600586, "global_step": 376202, "epoch": 2239} {"train_loss": -12.623817443847656, "global_step": 376203, "epoch": 2239} {"train_loss": -12.344959259033203, "global_step": 376204, "epoch": 2239} {"train_loss": -12.572790145874023, "global_step": 376205, "epoch": 2239} {"train_loss": -12.741144180297852, "global_step": 376206, "epoch": 2239} {"train_loss": -12.144298553466797, "global_step": 376207, "epoch": 2239} {"train_loss": -12.323162078857422, "global_step": 376208, "epoch": 2239} {"train_loss": -12.472249984741211, "global_step": 376209, "epoch": 2239} {"train_loss": -12.107532501220703, "global_step": 376210, "epoch": 2239} {"train_loss": -11.995110511779785, "global_step": 376211, "epoch": 2239} {"train_loss": -12.195451736450195, "global_step": 376212, "epoch": 2239} {"train_loss": -12.15600872039795, "global_step": 376213, "epoch": 2239} {"train_loss": -12.336174011230469, "global_step": 376214, "epoch": 2239} {"train_loss": -12.167062759399414, "global_step": 376215, "epoch": 2239} {"train_loss": -11.967187881469727, "global_step": 376216, "epoch": 2239} {"train_loss": -12.354368209838867, "global_step": 376217, "epoch": 2239} {"train_loss": -11.953550338745117, "global_step": 376218, "epoch": 2239} {"train_loss": -11.892019271850586, "global_step": 376219, "epoch": 2239} {"train_loss": -12.120853424072266, "global_step": 376220, "epoch": 2239} {"train_loss": -12.28239631652832, "global_step": 376221, "epoch": 2239} {"train_loss": -11.39238166809082, "global_step": 376222, "epoch": 2239} {"train_loss": -12.23189640045166, "global_step": 376223, "epoch": 2239} {"train_loss": -11.983293533325195, "global_step": 376224, "epoch": 2239} {"train_loss": -11.839452743530273, "global_step": 376225, "epoch": 2239} {"train_loss": -12.069913864135742, "global_step": 376226, "epoch": 2239} {"train_loss": -12.25008487701416, "global_step": 376227, "epoch": 2239} {"train_loss": -11.434751510620117, "global_step": 376228, "epoch": 2239} {"train_loss": -12.28333854675293, "global_step": 376229, "epoch": 2239} {"train_loss": -11.73719596862793, "global_step": 376230, "epoch": 2239} {"train_loss": -12.117486953735352, "global_step": 376231, "epoch": 2239} {"train_loss": -11.039918899536133, "global_step": 376232, "epoch": 2239} {"train_loss": -11.893009185791016, "global_step": 376233, "epoch": 2239} {"train_loss": -12.276636123657227, "global_step": 376234, "epoch": 2239} {"train_loss": -12.190908432006836, "global_step": 376235, "epoch": 2239} {"train_loss": -11.988775253295898, "global_step": 376236, "epoch": 2239} {"train_loss": -12.158581733703613, "global_step": 376237, "epoch": 2239} {"train_loss": -11.399776458740234, "global_step": 376238, "epoch": 2239} {"train_loss": -12.15708065032959, "global_step": 376239, "epoch": 2239} {"train_loss": -12.251256942749023, "global_step": 376240, "epoch": 2239} {"train_loss": -12.071426391601562, "global_step": 376241, "epoch": 2239} {"train_loss": -12.104231834411621, "global_step": 376242, "epoch": 2239} {"train_loss": -12.163029670715332, "global_step": 376243, "epoch": 2239} {"train_loss": -12.130805015563965, "global_step": 376244, "epoch": 2239} {"train_loss": -12.030359268188477, "global_step": 376245, "epoch": 2239} {"train_loss": -12.06002140045166, "global_step": 376246, "epoch": 2239} {"train_loss": -12.071198463439941, "global_step": 376247, "epoch": 2239} {"train_loss": -12.114388465881348, "global_step": 376248, "epoch": 2239} {"train_loss": -11.818840980529785, "global_step": 376249, "epoch": 2239} {"train_loss": -12.380001068115234, "global_step": 376250, "epoch": 2239} {"train_loss": -12.22280502319336, "global_step": 376251, "epoch": 2239} {"train_loss": -12.103779792785645, "global_step": 376252, "epoch": 2239} {"train_loss": -12.187459945678711, "global_step": 376253, "epoch": 2239} {"train_loss": -12.093084335327148, "global_step": 376254, "epoch": 2239} {"train_loss": -12.390738487243652, "global_step": 376255, "epoch": 2239} {"train_loss": -11.924864768981934, "global_step": 376256, "epoch": 2239} {"train_loss": -12.021699905395508, "global_step": 376257, "epoch": 2239} {"train_loss": -12.115669250488281, "global_step": 376258, "epoch": 2239} {"train_loss": -12.423142433166504, "global_step": 376259, "epoch": 2239} {"train_loss": -11.95448112487793, "global_step": 376260, "epoch": 2239} {"train_loss": -12.454044342041016, "global_step": 376261, "epoch": 2239} {"train_loss": -11.753435134887695, "global_step": 376262, "epoch": 2239} {"train_loss": -11.531801223754883, "global_step": 376263, "epoch": 2239} {"train_loss": -12.25520133972168, "global_step": 376264, "epoch": 2239} {"train_loss": -11.723108291625977, "global_step": 376265, "epoch": 2239} {"train_loss": -9.552499771118164, "global_step": 376266, "epoch": 2239} {"train_loss": -11.830586433410645, "global_step": 376267, "epoch": 2239} {"train_loss": -10.305047988891602, "global_step": 376268, "epoch": 2239} {"train_loss": -9.152328491210938, "global_step": 376269, "epoch": 2239} {"train_loss": -8.34199333190918, "global_step": 376270, "epoch": 2239} {"train_loss": -8.623312950134277, "global_step": 376271, "epoch": 2239} {"train_loss": -9.57303524017334, "global_step": 376272, "epoch": 2239} {"train_loss": -10.515504837036133, "global_step": 376273, "epoch": 2239} {"train_loss": -9.327274322509766, "global_step": 376274, "epoch": 2239} {"train_loss": -8.300067901611328, "global_step": 376275, "epoch": 2239} {"train_loss": -9.706817626953125, "global_step": 376276, "epoch": 2239} {"train_loss": -9.673833847045898, "global_step": 376277, "epoch": 2239} {"train_loss": -9.492919921875, "global_step": 376278, "epoch": 2239} {"train_loss": -10.033105850219727, "global_step": 376279, "epoch": 2239} {"train_loss": -10.011184692382812, "global_step": 376280, "epoch": 2239} {"train_loss": -11.130026817321777, "global_step": 376281, "epoch": 2239} {"train_loss": -10.87460708618164, "global_step": 376282, "epoch": 2239} {"train_loss": -11.787878036499023, "global_step": 376283, "epoch": 2239} {"train_loss": -10.852771759033203, "global_step": 376284, "epoch": 2239} {"train_loss": -10.294330596923828, "global_step": 376285, "epoch": 2239} {"train_loss": -11.148988723754883, "global_step": 376286, "epoch": 2239} {"train_loss": -10.583885192871094, "global_step": 376287, "epoch": 2239} {"train_loss": -11.443135261535645, "global_step": 376288, "epoch": 2239} {"train_loss": -11.020048141479492, "global_step": 376289, "epoch": 2239} {"train_loss": -11.620346069335938, "global_step": 376290, "epoch": 2239} {"train_loss": -11.714062690734863, "global_step": 376291, "epoch": 2239} {"train_loss": -11.521453857421875, "global_step": 376292, "epoch": 2239} {"train_loss": -11.535755157470703, "global_step": 376293, "epoch": 2239} {"train_loss": -11.076639175415039, "global_step": 376294, "epoch": 2239} {"train_loss": -11.42289924621582, "global_step": 376295, "epoch": 2239} {"train_loss": -11.306207656860352, "global_step": 376296, "epoch": 2239} {"train_loss": -11.42087173461914, "global_step": 376297, "epoch": 2239} {"train_loss": -11.514307975769043, "global_step": 376298, "epoch": 2239} {"train_loss": -12.142046928405762, "global_step": 376299, "epoch": 2239} {"train_loss": -11.430990219116211, "global_step": 376300, "epoch": 2239} {"train_loss": -11.954625129699707, "global_step": 376301, "epoch": 2239} {"train_loss": -11.49770736694336, "global_step": 376302, "epoch": 2239} {"train_loss": -11.594892501831055, "global_step": 376303, "epoch": 2239} {"train_loss": -11.91804313659668, "global_step": 376304, "epoch": 2239} {"train_loss": -11.88619613647461, "global_step": 376305, "epoch": 2239} {"train_loss": -11.76648998260498, "global_step": 376306, "epoch": 2239} {"train_loss": -12.31785774230957, "global_step": 376307, "epoch": 2239} {"train_loss": -11.66847038269043, "global_step": 376308, "epoch": 2239} {"train_loss": -12.12472915649414, "global_step": 376309, "epoch": 2239} {"train_loss": -11.817085266113281, "global_step": 376310, "epoch": 2239} {"train_loss": -11.989238739013672, "global_step": 376311, "epoch": 2239} {"train_loss": -11.629169464111328, "global_step": 376312, "epoch": 2239} {"train_loss": -11.70479679107666, "global_step": 376313, "epoch": 2239} {"train_loss": -11.479820251464844, "global_step": 376314, "epoch": 2239} {"train_loss": -11.684907913208008, "global_step": 376315, "epoch": 2239} {"train_loss": -11.187926292419434, "global_step": 376316, "epoch": 2239} {"train_loss": -11.481029510498047, "global_step": 376317, "epoch": 2239} {"train_loss": -11.685290336608887, "global_step": 376318, "epoch": 2239} {"train_loss": -11.814651188396272, "global_step": 376319, "epoch": 2239, "val_loss": 290074.125} {"train_loss": -11.660926818847656, "global_step": 376320, "epoch": 2240} {"train_loss": -11.817666053771973, "global_step": 376321, "epoch": 2240} {"train_loss": -11.885812759399414, "global_step": 376322, "epoch": 2240} {"train_loss": -11.592918395996094, "global_step": 376323, "epoch": 2240} {"train_loss": -12.088025093078613, "global_step": 376324, "epoch": 2240} {"train_loss": -11.750056266784668, "global_step": 376325, "epoch": 2240} {"train_loss": -12.050952911376953, "global_step": 376326, "epoch": 2240} {"train_loss": -12.063782691955566, "global_step": 376327, "epoch": 2240} {"train_loss": -12.145421028137207, "global_step": 376328, "epoch": 2240} {"train_loss": -12.285345077514648, "global_step": 376329, "epoch": 2240} {"train_loss": -12.143264770507812, "global_step": 376330, "epoch": 2240} {"train_loss": -12.328251838684082, "global_step": 376331, "epoch": 2240} {"train_loss": -12.090106964111328, "global_step": 376332, "epoch": 2240} {"train_loss": -12.644726753234863, "global_step": 376333, "epoch": 2240} {"train_loss": -12.240381240844727, "global_step": 376334, "epoch": 2240} {"train_loss": -12.228606224060059, "global_step": 376335, "epoch": 2240} {"train_loss": -12.280512809753418, "global_step": 376336, "epoch": 2240} {"train_loss": -11.990314483642578, "global_step": 376337, "epoch": 2240} {"train_loss": -12.291550636291504, "global_step": 376338, "epoch": 2240} {"train_loss": -12.409260749816895, "global_step": 376339, "epoch": 2240} {"train_loss": -12.103522300720215, "global_step": 376340, "epoch": 2240} {"train_loss": -12.387958526611328, "global_step": 376341, "epoch": 2240} {"train_loss": -12.321529388427734, "global_step": 376342, "epoch": 2240} {"train_loss": -12.245705604553223, "global_step": 376343, "epoch": 2240} {"train_loss": -12.318323135375977, "global_step": 376344, "epoch": 2240} {"train_loss": -12.59028434753418, "global_step": 376345, "epoch": 2240} {"train_loss": -12.257055282592773, "global_step": 376346, "epoch": 2240} {"train_loss": -12.468195915222168, "global_step": 376347, "epoch": 2240} {"train_loss": -12.475393295288086, "global_step": 376348, "epoch": 2240} {"train_loss": -12.578729629516602, "global_step": 376349, "epoch": 2240} {"train_loss": -12.44027042388916, "global_step": 376350, "epoch": 2240} {"train_loss": -12.346723556518555, "global_step": 376351, "epoch": 2240} {"train_loss": -12.54712963104248, "global_step": 376352, "epoch": 2240} {"train_loss": -12.470955848693848, "global_step": 376353, "epoch": 2240} {"train_loss": -12.454710960388184, "global_step": 376354, "epoch": 2240} {"train_loss": -12.392671585083008, "global_step": 376355, "epoch": 2240} {"train_loss": -12.536556243896484, "global_step": 376356, "epoch": 2240} {"train_loss": -12.355121612548828, "global_step": 376357, "epoch": 2240} {"train_loss": -12.382540702819824, "global_step": 376358, "epoch": 2240} {"train_loss": -12.048835754394531, "global_step": 376359, "epoch": 2240} {"train_loss": -12.528007507324219, "global_step": 376360, "epoch": 2240} {"train_loss": -12.274913787841797, "global_step": 376361, "epoch": 2240} {"train_loss": -12.386703491210938, "global_step": 376362, "epoch": 2240} {"train_loss": -12.614891052246094, "global_step": 376363, "epoch": 2240} {"train_loss": -12.487722396850586, "global_step": 376364, "epoch": 2240} {"train_loss": -12.762813568115234, "global_step": 376365, "epoch": 2240} {"train_loss": -12.612895965576172, "global_step": 376366, "epoch": 2240} {"train_loss": -12.679819107055664, "global_step": 376367, "epoch": 2240} {"train_loss": -12.550209045410156, "global_step": 376368, "epoch": 2240} {"train_loss": -12.606369018554688, "global_step": 376369, "epoch": 2240} {"train_loss": -12.350723266601562, "global_step": 376370, "epoch": 2240} {"train_loss": -12.519702911376953, "global_step": 376371, "epoch": 2240} {"train_loss": -12.735179901123047, "global_step": 376372, "epoch": 2240} {"train_loss": -12.380815505981445, "global_step": 376373, "epoch": 2240} {"train_loss": -12.464437484741211, "global_step": 376374, "epoch": 2240} {"train_loss": -12.582891464233398, "global_step": 376375, "epoch": 2240} {"train_loss": -12.440719604492188, "global_step": 376376, "epoch": 2240} {"train_loss": -12.647136688232422, "global_step": 376377, "epoch": 2240} {"train_loss": -12.67141342163086, "global_step": 376378, "epoch": 2240} {"train_loss": -12.765976905822754, "global_step": 376379, "epoch": 2240} {"train_loss": -12.602611541748047, "global_step": 376380, "epoch": 2240} {"train_loss": -12.652152061462402, "global_step": 376381, "epoch": 2240} {"train_loss": -12.507095336914062, "global_step": 376382, "epoch": 2240} {"train_loss": -12.708470344543457, "global_step": 376383, "epoch": 2240} {"train_loss": -12.7421875, "global_step": 376384, "epoch": 2240} {"train_loss": -12.83535099029541, "global_step": 376385, "epoch": 2240} {"train_loss": -12.535725593566895, "global_step": 376386, "epoch": 2240} {"train_loss": -12.753253936767578, "global_step": 376387, "epoch": 2240} {"train_loss": -12.493091583251953, "global_step": 376388, "epoch": 2240} {"train_loss": -12.205411911010742, "global_step": 376389, "epoch": 2240} {"train_loss": -12.195347785949707, "global_step": 376390, "epoch": 2240} {"train_loss": -12.2164306640625, "global_step": 376391, "epoch": 2240} {"train_loss": -11.96542739868164, "global_step": 376392, "epoch": 2240} {"train_loss": -12.227834701538086, "global_step": 376393, "epoch": 2240} {"train_loss": -10.11327075958252, "global_step": 376394, "epoch": 2240} {"train_loss": -9.049531936645508, "global_step": 376395, "epoch": 2240} {"train_loss": -10.332695960998535, "global_step": 376396, "epoch": 2240} {"train_loss": -10.035350799560547, "global_step": 376397, "epoch": 2240} {"train_loss": -10.663387298583984, "global_step": 376398, "epoch": 2240} {"train_loss": -9.110086441040039, "global_step": 376399, "epoch": 2240} {"train_loss": -8.647385597229004, "global_step": 376400, "epoch": 2240} {"train_loss": -9.524856567382812, "global_step": 376401, "epoch": 2240} {"train_loss": -11.095741271972656, "global_step": 376402, "epoch": 2240} {"train_loss": -10.195653915405273, "global_step": 376403, "epoch": 2240} {"train_loss": -10.217449188232422, "global_step": 376404, "epoch": 2240} {"train_loss": -10.885730743408203, "global_step": 376405, "epoch": 2240} {"train_loss": -11.337822914123535, "global_step": 376406, "epoch": 2240} {"train_loss": -11.166706085205078, "global_step": 376407, "epoch": 2240} {"train_loss": -10.51206111907959, "global_step": 376408, "epoch": 2240} {"train_loss": -10.757387161254883, "global_step": 376409, "epoch": 2240} {"train_loss": -11.683161735534668, "global_step": 376410, "epoch": 2240} {"train_loss": -9.837970733642578, "global_step": 376411, "epoch": 2240} {"train_loss": -11.604703903198242, "global_step": 376412, "epoch": 2240} {"train_loss": -11.734770774841309, "global_step": 376413, "epoch": 2240} {"train_loss": -11.202167510986328, "global_step": 376414, "epoch": 2240} {"train_loss": -11.010984420776367, "global_step": 376415, "epoch": 2240} {"train_loss": -11.268558502197266, "global_step": 376416, "epoch": 2240} {"train_loss": -9.864124298095703, "global_step": 376417, "epoch": 2240} {"train_loss": -11.56733226776123, "global_step": 376418, "epoch": 2240} {"train_loss": -10.331026077270508, "global_step": 376419, "epoch": 2240} {"train_loss": -11.394048690795898, "global_step": 376420, "epoch": 2240} {"train_loss": -11.767927169799805, "global_step": 376421, "epoch": 2240} {"train_loss": -11.085410118103027, "global_step": 376422, "epoch": 2240} {"train_loss": -11.911687850952148, "global_step": 376423, "epoch": 2240} {"train_loss": -10.344196319580078, "global_step": 376424, "epoch": 2240} {"train_loss": -11.80801010131836, "global_step": 376425, "epoch": 2240} {"train_loss": -11.162044525146484, "global_step": 376426, "epoch": 2240} {"train_loss": -11.278515815734863, "global_step": 376427, "epoch": 2240} {"train_loss": -11.660902976989746, "global_step": 376428, "epoch": 2240} {"train_loss": -11.42671012878418, "global_step": 376429, "epoch": 2240} {"train_loss": -11.718888282775879, "global_step": 376430, "epoch": 2240} {"train_loss": -11.659107208251953, "global_step": 376431, "epoch": 2240} {"train_loss": -11.862563133239746, "global_step": 376432, "epoch": 2240} {"train_loss": -11.926502227783203, "global_step": 376433, "epoch": 2240} {"train_loss": -11.477069854736328, "global_step": 376434, "epoch": 2240} {"train_loss": -12.203505516052246, "global_step": 376435, "epoch": 2240} {"train_loss": -11.14221477508545, "global_step": 376436, "epoch": 2240} {"train_loss": -12.246991157531738, "global_step": 376437, "epoch": 2240} {"train_loss": -11.313854217529297, "global_step": 376438, "epoch": 2240} {"train_loss": -12.16113567352295, "global_step": 376439, "epoch": 2240} {"train_loss": -11.764785766601562, "global_step": 376440, "epoch": 2240} {"train_loss": -12.098151206970215, "global_step": 376441, "epoch": 2240} {"train_loss": -11.90534782409668, "global_step": 376442, "epoch": 2240} {"train_loss": -12.383235931396484, "global_step": 376443, "epoch": 2240} {"train_loss": -12.193841934204102, "global_step": 376444, "epoch": 2240} {"train_loss": -12.080982208251953, "global_step": 376445, "epoch": 2240} {"train_loss": -12.028753280639648, "global_step": 376446, "epoch": 2240} {"train_loss": -12.192925453186035, "global_step": 376447, "epoch": 2240} {"train_loss": -12.169589042663574, "global_step": 376448, "epoch": 2240} {"train_loss": -11.89407730102539, "global_step": 376449, "epoch": 2240} {"train_loss": -12.344096183776855, "global_step": 376450, "epoch": 2240} {"train_loss": -12.095369338989258, "global_step": 376451, "epoch": 2240} {"train_loss": -12.40890121459961, "global_step": 376452, "epoch": 2240} {"train_loss": -12.18172550201416, "global_step": 376453, "epoch": 2240} {"train_loss": -12.399410247802734, "global_step": 376454, "epoch": 2240} {"train_loss": -12.269124031066895, "global_step": 376455, "epoch": 2240} {"train_loss": -12.170351028442383, "global_step": 376456, "epoch": 2240} {"train_loss": -12.212766647338867, "global_step": 376457, "epoch": 2240} {"train_loss": -12.07616138458252, "global_step": 376458, "epoch": 2240} {"train_loss": -12.493640899658203, "global_step": 376459, "epoch": 2240} {"train_loss": -12.065485000610352, "global_step": 376460, "epoch": 2240} {"train_loss": -12.491060256958008, "global_step": 376461, "epoch": 2240} {"train_loss": -12.07672119140625, "global_step": 376462, "epoch": 2240} {"train_loss": -12.342689514160156, "global_step": 376463, "epoch": 2240} {"train_loss": -12.413349151611328, "global_step": 376464, "epoch": 2240} {"train_loss": -12.379064559936523, "global_step": 376465, "epoch": 2240} {"train_loss": -12.243474006652832, "global_step": 376466, "epoch": 2240} {"train_loss": -12.258143424987793, "global_step": 376467, "epoch": 2240} {"train_loss": -12.349164962768555, "global_step": 376468, "epoch": 2240} {"train_loss": -12.20876407623291, "global_step": 376469, "epoch": 2240} {"train_loss": -12.381475448608398, "global_step": 376470, "epoch": 2240} {"train_loss": -12.275714874267578, "global_step": 376471, "epoch": 2240} {"train_loss": -12.088125228881836, "global_step": 376472, "epoch": 2240} {"train_loss": -11.799276351928711, "global_step": 376473, "epoch": 2240} {"train_loss": -11.844858169555664, "global_step": 376474, "epoch": 2240} {"train_loss": -12.456832885742188, "global_step": 376475, "epoch": 2240} {"train_loss": -11.749065399169922, "global_step": 376476, "epoch": 2240} {"train_loss": -12.458179473876953, "global_step": 376477, "epoch": 2240} {"train_loss": -12.378392219543457, "global_step": 376478, "epoch": 2240} {"train_loss": -11.823241233825684, "global_step": 376479, "epoch": 2240} {"train_loss": -12.443071365356445, "global_step": 376480, "epoch": 2240} {"train_loss": -11.977540969848633, "global_step": 376481, "epoch": 2240} {"train_loss": -12.565258979797363, "global_step": 376482, "epoch": 2240} {"train_loss": -11.850802421569824, "global_step": 376483, "epoch": 2240} {"train_loss": -12.439196586608887, "global_step": 376484, "epoch": 2240} {"train_loss": -12.195043563842773, "global_step": 376485, "epoch": 2240} {"train_loss": -12.58026123046875, "global_step": 376486, "epoch": 2240} {"train_loss": -11.942608560834612, "global_step": 376487, "epoch": 2240, "val_loss": 292393.03125, "train_action_mse_error": 0.36149632930755615} {"train_loss": -12.211055755615234, "global_step": 376488, "epoch": 2241} {"train_loss": -12.448240280151367, "global_step": 376489, "epoch": 2241} {"train_loss": -12.186023712158203, "global_step": 376490, "epoch": 2241} {"train_loss": -12.393938064575195, "global_step": 376491, "epoch": 2241} {"train_loss": -12.493013381958008, "global_step": 376492, "epoch": 2241} {"train_loss": -12.164525985717773, "global_step": 376493, "epoch": 2241} {"train_loss": -12.262611389160156, "global_step": 376494, "epoch": 2241} {"train_loss": -11.905355453491211, "global_step": 376495, "epoch": 2241} {"train_loss": -11.884344100952148, "global_step": 376496, "epoch": 2241} {"train_loss": -11.847673416137695, "global_step": 376497, "epoch": 2241} {"train_loss": -11.164570808410645, "global_step": 376498, "epoch": 2241} {"train_loss": -10.437771797180176, "global_step": 376499, "epoch": 2241} {"train_loss": -10.36227035522461, "global_step": 376500, "epoch": 2241} {"train_loss": -11.507341384887695, "global_step": 376501, "epoch": 2241} {"train_loss": -10.748074531555176, "global_step": 376502, "epoch": 2241} {"train_loss": -11.663827896118164, "global_step": 376503, "epoch": 2241} {"train_loss": -10.87088394165039, "global_step": 376504, "epoch": 2241} {"train_loss": -11.797676086425781, "global_step": 376505, "epoch": 2241} {"train_loss": -11.954751968383789, "global_step": 376506, "epoch": 2241} {"train_loss": -11.593896865844727, "global_step": 376507, "epoch": 2241} {"train_loss": -12.243128776550293, "global_step": 376508, "epoch": 2241} {"train_loss": -10.935077667236328, "global_step": 376509, "epoch": 2241} {"train_loss": -12.175047874450684, "global_step": 376510, "epoch": 2241} {"train_loss": -10.678881645202637, "global_step": 376511, "epoch": 2241} {"train_loss": -11.268184661865234, "global_step": 376512, "epoch": 2241} {"train_loss": -11.353897094726562, "global_step": 376513, "epoch": 2241} {"train_loss": -11.806011199951172, "global_step": 376514, "epoch": 2241} {"train_loss": -12.104137420654297, "global_step": 376515, "epoch": 2241} {"train_loss": -11.353530883789062, "global_step": 376516, "epoch": 2241} {"train_loss": -11.938003540039062, "global_step": 376517, "epoch": 2241} {"train_loss": -11.790931701660156, "global_step": 376518, "epoch": 2241} {"train_loss": -11.766362190246582, "global_step": 376519, "epoch": 2241} {"train_loss": -11.659036636352539, "global_step": 376520, "epoch": 2241} {"train_loss": -11.72494888305664, "global_step": 376521, "epoch": 2241} {"train_loss": -11.846159934997559, "global_step": 376522, "epoch": 2241} {"train_loss": -12.183124542236328, "global_step": 376523, "epoch": 2241} {"train_loss": -12.047140121459961, "global_step": 376524, "epoch": 2241} {"train_loss": -12.130823135375977, "global_step": 376525, "epoch": 2241} {"train_loss": -11.883651733398438, "global_step": 376526, "epoch": 2241} {"train_loss": -12.158677101135254, "global_step": 376527, "epoch": 2241} {"train_loss": -12.024980545043945, "global_step": 376528, "epoch": 2241} {"train_loss": -11.867502212524414, "global_step": 376529, "epoch": 2241} {"train_loss": -12.099013328552246, "global_step": 376530, "epoch": 2241} {"train_loss": -11.862762451171875, "global_step": 376531, "epoch": 2241} {"train_loss": -12.142674446105957, "global_step": 376532, "epoch": 2241} {"train_loss": -11.996338844299316, "global_step": 376533, "epoch": 2241} {"train_loss": -12.021062850952148, "global_step": 376534, "epoch": 2241} {"train_loss": -12.365754127502441, "global_step": 376535, "epoch": 2241} {"train_loss": -11.918600082397461, "global_step": 376536, "epoch": 2241} {"train_loss": -11.508098602294922, "global_step": 376537, "epoch": 2241} {"train_loss": -12.226911544799805, "global_step": 376538, "epoch": 2241} {"train_loss": -11.978771209716797, "global_step": 376539, "epoch": 2241} {"train_loss": -12.308053970336914, "global_step": 376540, "epoch": 2241} {"train_loss": -12.162522315979004, "global_step": 376541, "epoch": 2241} {"train_loss": -12.442829132080078, "global_step": 376542, "epoch": 2241} {"train_loss": -11.960205078125, "global_step": 376543, "epoch": 2241} {"train_loss": -12.415542602539062, "global_step": 376544, "epoch": 2241} {"train_loss": -11.972978591918945, "global_step": 376545, "epoch": 2241} {"train_loss": -12.173009872436523, "global_step": 376546, "epoch": 2241} {"train_loss": -11.825288772583008, "global_step": 376547, "epoch": 2241} {"train_loss": -11.693940162658691, "global_step": 376548, "epoch": 2241} {"train_loss": -12.108848571777344, "global_step": 376549, "epoch": 2241} {"train_loss": -11.881200790405273, "global_step": 376550, "epoch": 2241} {"train_loss": -12.049888610839844, "global_step": 376551, "epoch": 2241} {"train_loss": -11.516998291015625, "global_step": 376552, "epoch": 2241} {"train_loss": -11.839630126953125, "global_step": 376553, "epoch": 2241} {"train_loss": -11.89343547821045, "global_step": 376554, "epoch": 2241} {"train_loss": -11.793503761291504, "global_step": 376555, "epoch": 2241} {"train_loss": -11.893097877502441, "global_step": 376556, "epoch": 2241} {"train_loss": -12.05253791809082, "global_step": 376557, "epoch": 2241} {"train_loss": -11.014237403869629, "global_step": 376558, "epoch": 2241} {"train_loss": -12.015356063842773, "global_step": 376559, "epoch": 2241} {"train_loss": -11.64919662475586, "global_step": 376560, "epoch": 2241} {"train_loss": -12.354280471801758, "global_step": 376561, "epoch": 2241} {"train_loss": -11.828125, "global_step": 376562, "epoch": 2241} {"train_loss": -11.991861343383789, "global_step": 376563, "epoch": 2241} {"train_loss": -12.219293594360352, "global_step": 376564, "epoch": 2241} {"train_loss": -11.984678268432617, "global_step": 376565, "epoch": 2241} {"train_loss": -12.031219482421875, "global_step": 376566, "epoch": 2241} {"train_loss": -12.428818702697754, "global_step": 376567, "epoch": 2241} {"train_loss": -12.174802780151367, "global_step": 376568, "epoch": 2241} {"train_loss": -12.140132904052734, "global_step": 376569, "epoch": 2241} {"train_loss": -12.026555061340332, "global_step": 376570, "epoch": 2241} {"train_loss": -12.198067665100098, "global_step": 376571, "epoch": 2241} {"train_loss": -11.991907119750977, "global_step": 376572, "epoch": 2241} {"train_loss": -11.882274627685547, "global_step": 376573, "epoch": 2241} {"train_loss": -12.174967765808105, "global_step": 376574, "epoch": 2241} {"train_loss": -11.782232284545898, "global_step": 376575, "epoch": 2241} {"train_loss": -11.537104606628418, "global_step": 376576, "epoch": 2241} {"train_loss": -11.979301452636719, "global_step": 376577, "epoch": 2241} {"train_loss": -11.953020095825195, "global_step": 376578, "epoch": 2241} {"train_loss": -12.187287330627441, "global_step": 376579, "epoch": 2241} {"train_loss": -11.785318374633789, "global_step": 376580, "epoch": 2241} {"train_loss": -12.041669845581055, "global_step": 376581, "epoch": 2241} {"train_loss": -11.703935623168945, "global_step": 376582, "epoch": 2241} {"train_loss": -10.967164993286133, "global_step": 376583, "epoch": 2241} {"train_loss": -11.542351722717285, "global_step": 376584, "epoch": 2241} {"train_loss": -9.924901962280273, "global_step": 376585, "epoch": 2241} {"train_loss": -11.083579063415527, "global_step": 376586, "epoch": 2241} {"train_loss": -11.283620834350586, "global_step": 376587, "epoch": 2241} {"train_loss": -10.950019836425781, "global_step": 376588, "epoch": 2241} {"train_loss": -11.93889045715332, "global_step": 376589, "epoch": 2241} {"train_loss": -11.241206169128418, "global_step": 376590, "epoch": 2241} {"train_loss": -11.265864372253418, "global_step": 376591, "epoch": 2241} {"train_loss": -11.605411529541016, "global_step": 376592, "epoch": 2241} {"train_loss": -11.712644577026367, "global_step": 376593, "epoch": 2241} {"train_loss": -11.21953296661377, "global_step": 376594, "epoch": 2241} {"train_loss": -11.64246940612793, "global_step": 376595, "epoch": 2241} {"train_loss": -11.574596405029297, "global_step": 376596, "epoch": 2241} {"train_loss": -11.836542129516602, "global_step": 376597, "epoch": 2241} {"train_loss": -11.47928237915039, "global_step": 376598, "epoch": 2241} {"train_loss": -10.868106842041016, "global_step": 376599, "epoch": 2241} {"train_loss": -11.291147232055664, "global_step": 376600, "epoch": 2241} {"train_loss": -10.346814155578613, "global_step": 376601, "epoch": 2241} {"train_loss": -11.38218879699707, "global_step": 376602, "epoch": 2241} {"train_loss": -11.040048599243164, "global_step": 376603, "epoch": 2241} {"train_loss": -10.816962242126465, "global_step": 376604, "epoch": 2241} {"train_loss": -10.440463066101074, "global_step": 376605, "epoch": 2241} {"train_loss": -11.011697769165039, "global_step": 376606, "epoch": 2241} {"train_loss": -10.34742546081543, "global_step": 376607, "epoch": 2241} {"train_loss": -10.349043846130371, "global_step": 376608, "epoch": 2241} {"train_loss": -11.530776977539062, "global_step": 376609, "epoch": 2241} {"train_loss": -9.809192657470703, "global_step": 376610, "epoch": 2241} {"train_loss": -9.57478141784668, "global_step": 376611, "epoch": 2241} {"train_loss": -10.091309547424316, "global_step": 376612, "epoch": 2241} {"train_loss": -10.903739929199219, "global_step": 376613, "epoch": 2241} {"train_loss": -10.436287879943848, "global_step": 376614, "epoch": 2241} {"train_loss": -10.600265502929688, "global_step": 376615, "epoch": 2241} {"train_loss": -10.42215347290039, "global_step": 376616, "epoch": 2241} {"train_loss": -11.101460456848145, "global_step": 376617, "epoch": 2241} {"train_loss": -10.62088394165039, "global_step": 376618, "epoch": 2241} {"train_loss": -10.7597017288208, "global_step": 376619, "epoch": 2241} {"train_loss": -10.40082836151123, "global_step": 376620, "epoch": 2241} {"train_loss": -10.430049896240234, "global_step": 376621, "epoch": 2241} {"train_loss": -11.170439720153809, "global_step": 376622, "epoch": 2241} {"train_loss": -11.141122817993164, "global_step": 376623, "epoch": 2241} {"train_loss": -11.638668060302734, "global_step": 376624, "epoch": 2241} {"train_loss": -11.912184715270996, "global_step": 376625, "epoch": 2241} {"train_loss": -11.194173812866211, "global_step": 376626, "epoch": 2241} {"train_loss": -11.576786041259766, "global_step": 376627, "epoch": 2241} {"train_loss": -11.692745208740234, "global_step": 376628, "epoch": 2241} {"train_loss": -11.165691375732422, "global_step": 376629, "epoch": 2241} {"train_loss": -11.818124771118164, "global_step": 376630, "epoch": 2241} {"train_loss": -11.803376197814941, "global_step": 376631, "epoch": 2241} {"train_loss": -11.48820686340332, "global_step": 376632, "epoch": 2241} {"train_loss": -11.889673233032227, "global_step": 376633, "epoch": 2241} {"train_loss": -11.175508499145508, "global_step": 376634, "epoch": 2241} {"train_loss": -11.961833953857422, "global_step": 376635, "epoch": 2241} {"train_loss": -11.460845947265625, "global_step": 376636, "epoch": 2241} {"train_loss": -11.826510429382324, "global_step": 376637, "epoch": 2241} {"train_loss": -11.716423034667969, "global_step": 376638, "epoch": 2241} {"train_loss": -11.95927906036377, "global_step": 376639, "epoch": 2241} {"train_loss": -11.457099914550781, "global_step": 376640, "epoch": 2241} {"train_loss": -12.1411714553833, "global_step": 376641, "epoch": 2241} {"train_loss": -11.355846405029297, "global_step": 376642, "epoch": 2241} {"train_loss": -12.248889923095703, "global_step": 376643, "epoch": 2241} {"train_loss": -11.856595039367676, "global_step": 376644, "epoch": 2241} {"train_loss": -12.092916488647461, "global_step": 376645, "epoch": 2241} {"train_loss": -12.250843048095703, "global_step": 376646, "epoch": 2241} {"train_loss": -12.028079986572266, "global_step": 376647, "epoch": 2241} {"train_loss": -12.236408233642578, "global_step": 376648, "epoch": 2241} {"train_loss": -12.12419319152832, "global_step": 376649, "epoch": 2241} {"train_loss": -12.0853910446167, "global_step": 376650, "epoch": 2241} {"train_loss": -12.2132568359375, "global_step": 376651, "epoch": 2241} {"train_loss": -12.075088500976562, "global_step": 376652, "epoch": 2241} {"train_loss": -11.919807434082031, "global_step": 376653, "epoch": 2241} {"train_loss": -12.448707580566406, "global_step": 376654, "epoch": 2241} {"train_loss": -11.637975533803305, "global_step": 376655, "epoch": 2241, "val_loss": 294007.0} {"train_loss": -12.359553337097168, "global_step": 376656, "epoch": 2242} {"train_loss": -12.246371269226074, "global_step": 376657, "epoch": 2242} {"train_loss": -12.174330711364746, "global_step": 376658, "epoch": 2242} {"train_loss": -12.324214935302734, "global_step": 376659, "epoch": 2242} {"train_loss": -12.296993255615234, "global_step": 376660, "epoch": 2242} {"train_loss": -12.339887619018555, "global_step": 376661, "epoch": 2242} {"train_loss": -12.331011772155762, "global_step": 376662, "epoch": 2242} {"train_loss": -12.27985954284668, "global_step": 376663, "epoch": 2242} {"train_loss": -12.403682708740234, "global_step": 376664, "epoch": 2242} {"train_loss": -12.48438835144043, "global_step": 376665, "epoch": 2242} {"train_loss": -12.354802131652832, "global_step": 376666, "epoch": 2242} {"train_loss": -12.351383209228516, "global_step": 376667, "epoch": 2242} {"train_loss": -12.144095420837402, "global_step": 376668, "epoch": 2242} {"train_loss": -12.212711334228516, "global_step": 376669, "epoch": 2242} {"train_loss": -12.429372787475586, "global_step": 376670, "epoch": 2242} {"train_loss": -12.44428539276123, "global_step": 376671, "epoch": 2242} {"train_loss": -12.595931053161621, "global_step": 376672, "epoch": 2242} {"train_loss": -12.291364669799805, "global_step": 376673, "epoch": 2242} {"train_loss": -12.181392669677734, "global_step": 376674, "epoch": 2242} {"train_loss": -12.224639892578125, "global_step": 376675, "epoch": 2242} {"train_loss": -12.368545532226562, "global_step": 376676, "epoch": 2242} {"train_loss": -12.183637619018555, "global_step": 376677, "epoch": 2242} {"train_loss": -12.318717956542969, "global_step": 376678, "epoch": 2242} {"train_loss": -12.211644172668457, "global_step": 376679, "epoch": 2242} {"train_loss": -12.422863960266113, "global_step": 376680, "epoch": 2242} {"train_loss": -12.446932792663574, "global_step": 376681, "epoch": 2242} {"train_loss": -12.15786361694336, "global_step": 376682, "epoch": 2242} {"train_loss": -12.639991760253906, "global_step": 376683, "epoch": 2242} {"train_loss": -12.204330444335938, "global_step": 376684, "epoch": 2242} {"train_loss": -12.421965599060059, "global_step": 376685, "epoch": 2242} {"train_loss": -12.49362564086914, "global_step": 376686, "epoch": 2242} {"train_loss": -12.294306755065918, "global_step": 376687, "epoch": 2242} {"train_loss": -12.630228042602539, "global_step": 376688, "epoch": 2242} {"train_loss": -12.557263374328613, "global_step": 376689, "epoch": 2242} {"train_loss": -12.689470291137695, "global_step": 376690, "epoch": 2242} {"train_loss": -12.453643798828125, "global_step": 376691, "epoch": 2242} {"train_loss": -12.568687438964844, "global_step": 376692, "epoch": 2242} {"train_loss": -12.473335266113281, "global_step": 376693, "epoch": 2242} {"train_loss": -12.73404598236084, "global_step": 376694, "epoch": 2242} {"train_loss": -12.297987937927246, "global_step": 376695, "epoch": 2242} {"train_loss": -12.466032028198242, "global_step": 376696, "epoch": 2242} {"train_loss": -12.717430114746094, "global_step": 376697, "epoch": 2242} {"train_loss": -12.309930801391602, "global_step": 376698, "epoch": 2242} {"train_loss": -12.518403053283691, "global_step": 376699, "epoch": 2242} {"train_loss": -12.499979019165039, "global_step": 376700, "epoch": 2242} {"train_loss": -12.528675079345703, "global_step": 376701, "epoch": 2242} {"train_loss": -12.286523818969727, "global_step": 376702, "epoch": 2242} {"train_loss": -12.752548217773438, "global_step": 376703, "epoch": 2242} {"train_loss": -12.513080596923828, "global_step": 376704, "epoch": 2242} {"train_loss": -12.520075798034668, "global_step": 376705, "epoch": 2242} {"train_loss": -12.606395721435547, "global_step": 376706, "epoch": 2242} {"train_loss": -12.397408485412598, "global_step": 376707, "epoch": 2242} {"train_loss": -12.455692291259766, "global_step": 376708, "epoch": 2242} {"train_loss": -12.368431091308594, "global_step": 376709, "epoch": 2242} {"train_loss": -12.353399276733398, "global_step": 376710, "epoch": 2242} {"train_loss": -12.54116153717041, "global_step": 376711, "epoch": 2242} {"train_loss": -12.52163314819336, "global_step": 376712, "epoch": 2242} {"train_loss": -12.582427978515625, "global_step": 376713, "epoch": 2242} {"train_loss": -12.333816528320312, "global_step": 376714, "epoch": 2242} {"train_loss": -12.667122840881348, "global_step": 376715, "epoch": 2242} {"train_loss": -12.417954444885254, "global_step": 376716, "epoch": 2242} {"train_loss": -12.677000999450684, "global_step": 376717, "epoch": 2242} {"train_loss": -12.719465255737305, "global_step": 376718, "epoch": 2242} {"train_loss": -12.542119026184082, "global_step": 376719, "epoch": 2242} {"train_loss": -12.860441207885742, "global_step": 376720, "epoch": 2242} {"train_loss": -12.798909187316895, "global_step": 376721, "epoch": 2242} {"train_loss": -12.54494857788086, "global_step": 376722, "epoch": 2242} {"train_loss": -12.560428619384766, "global_step": 376723, "epoch": 2242} {"train_loss": -12.547632217407227, "global_step": 376724, "epoch": 2242} {"train_loss": -12.276806831359863, "global_step": 376725, "epoch": 2242} {"train_loss": -12.325908660888672, "global_step": 376726, "epoch": 2242} {"train_loss": -12.54688835144043, "global_step": 376727, "epoch": 2242} {"train_loss": -12.254539489746094, "global_step": 376728, "epoch": 2242} {"train_loss": -12.430545806884766, "global_step": 376729, "epoch": 2242} {"train_loss": -12.51966381072998, "global_step": 376730, "epoch": 2242} {"train_loss": -12.596105575561523, "global_step": 376731, "epoch": 2242} {"train_loss": -12.366241455078125, "global_step": 376732, "epoch": 2242} {"train_loss": -12.258398056030273, "global_step": 376733, "epoch": 2242} {"train_loss": -12.195926666259766, "global_step": 376734, "epoch": 2242} {"train_loss": -11.80341911315918, "global_step": 376735, "epoch": 2242} {"train_loss": -12.245976448059082, "global_step": 376736, "epoch": 2242} {"train_loss": -12.218807220458984, "global_step": 376737, "epoch": 2242} {"train_loss": -12.156641006469727, "global_step": 376738, "epoch": 2242} {"train_loss": -10.650991439819336, "global_step": 376739, "epoch": 2242} {"train_loss": -12.154230117797852, "global_step": 376740, "epoch": 2242} {"train_loss": -11.802970886230469, "global_step": 376741, "epoch": 2242} {"train_loss": -10.226700782775879, "global_step": 376742, "epoch": 2242} {"train_loss": -11.351170539855957, "global_step": 376743, "epoch": 2242} {"train_loss": -11.250877380371094, "global_step": 376744, "epoch": 2242} {"train_loss": -10.151632308959961, "global_step": 376745, "epoch": 2242} {"train_loss": -10.801839828491211, "global_step": 376746, "epoch": 2242} {"train_loss": -9.536375045776367, "global_step": 376747, "epoch": 2242} {"train_loss": -11.280694961547852, "global_step": 376748, "epoch": 2242} {"train_loss": -9.981488227844238, "global_step": 376749, "epoch": 2242} {"train_loss": -11.782069206237793, "global_step": 376750, "epoch": 2242} {"train_loss": -10.1240816116333, "global_step": 376751, "epoch": 2242} {"train_loss": -11.649909019470215, "global_step": 376752, "epoch": 2242} {"train_loss": -11.76162338256836, "global_step": 376753, "epoch": 2242} {"train_loss": -11.4596529006958, "global_step": 376754, "epoch": 2242} {"train_loss": -11.828015327453613, "global_step": 376755, "epoch": 2242} {"train_loss": -11.793169021606445, "global_step": 376756, "epoch": 2242} {"train_loss": -12.16240406036377, "global_step": 376757, "epoch": 2242} {"train_loss": -12.011665344238281, "global_step": 376758, "epoch": 2242} {"train_loss": -11.846485137939453, "global_step": 376759, "epoch": 2242} {"train_loss": -11.942815780639648, "global_step": 376760, "epoch": 2242} {"train_loss": -12.103663444519043, "global_step": 376761, "epoch": 2242} {"train_loss": -12.235005378723145, "global_step": 376762, "epoch": 2242} {"train_loss": -12.191803932189941, "global_step": 376763, "epoch": 2242} {"train_loss": -12.255626678466797, "global_step": 376764, "epoch": 2242} {"train_loss": -11.88676643371582, "global_step": 376765, "epoch": 2242} {"train_loss": -12.383695602416992, "global_step": 376766, "epoch": 2242} {"train_loss": -12.030130386352539, "global_step": 376767, "epoch": 2242} {"train_loss": -11.61398696899414, "global_step": 376768, "epoch": 2242} {"train_loss": -11.974858283996582, "global_step": 376769, "epoch": 2242} {"train_loss": -11.98615837097168, "global_step": 376770, "epoch": 2242} {"train_loss": -11.789888381958008, "global_step": 376771, "epoch": 2242} {"train_loss": -11.83873176574707, "global_step": 376772, "epoch": 2242} {"train_loss": -12.318745613098145, "global_step": 376773, "epoch": 2242} {"train_loss": -12.17076587677002, "global_step": 376774, "epoch": 2242} {"train_loss": -12.02985668182373, "global_step": 376775, "epoch": 2242} {"train_loss": -12.318323135375977, "global_step": 376776, "epoch": 2242} {"train_loss": -12.472801208496094, "global_step": 376777, "epoch": 2242} {"train_loss": -12.340547561645508, "global_step": 376778, "epoch": 2242} {"train_loss": -12.254446029663086, "global_step": 376779, "epoch": 2242} {"train_loss": -12.420869827270508, "global_step": 376780, "epoch": 2242} {"train_loss": -11.963154792785645, "global_step": 376781, "epoch": 2242} {"train_loss": -11.88907241821289, "global_step": 376782, "epoch": 2242} {"train_loss": -12.35270881652832, "global_step": 376783, "epoch": 2242} {"train_loss": -11.49561882019043, "global_step": 376784, "epoch": 2242} {"train_loss": -11.742205619812012, "global_step": 376785, "epoch": 2242} {"train_loss": -12.198861122131348, "global_step": 376786, "epoch": 2242} {"train_loss": -11.226005554199219, "global_step": 376787, "epoch": 2242} {"train_loss": -10.740854263305664, "global_step": 376788, "epoch": 2242} {"train_loss": -12.478267669677734, "global_step": 376789, "epoch": 2242} {"train_loss": -11.2113676071167, "global_step": 376790, "epoch": 2242} {"train_loss": -11.375165939331055, "global_step": 376791, "epoch": 2242} {"train_loss": -12.463878631591797, "global_step": 376792, "epoch": 2242} {"train_loss": -11.154132843017578, "global_step": 376793, "epoch": 2242} {"train_loss": -12.166421890258789, "global_step": 376794, "epoch": 2242} {"train_loss": -11.95874309539795, "global_step": 376795, "epoch": 2242} {"train_loss": -11.922966003417969, "global_step": 376796, "epoch": 2242} {"train_loss": -12.035454750061035, "global_step": 376797, "epoch": 2242} {"train_loss": -11.912080764770508, "global_step": 376798, "epoch": 2242} {"train_loss": -12.036643981933594, "global_step": 376799, "epoch": 2242} {"train_loss": -12.256803512573242, "global_step": 376800, "epoch": 2242} {"train_loss": -11.334895133972168, "global_step": 376801, "epoch": 2242} {"train_loss": -12.191057205200195, "global_step": 376802, "epoch": 2242} {"train_loss": -10.671031951904297, "global_step": 376803, "epoch": 2242} {"train_loss": -12.44719409942627, "global_step": 376804, "epoch": 2242} {"train_loss": -10.936893463134766, "global_step": 376805, "epoch": 2242} {"train_loss": -12.202530860900879, "global_step": 376806, "epoch": 2242} {"train_loss": -12.031904220581055, "global_step": 376807, "epoch": 2242} {"train_loss": -11.656618118286133, "global_step": 376808, "epoch": 2242} {"train_loss": -12.02408218383789, "global_step": 376809, "epoch": 2242} {"train_loss": -12.085982322692871, "global_step": 376810, "epoch": 2242} {"train_loss": -11.96120834350586, "global_step": 376811, "epoch": 2242} {"train_loss": -12.333599090576172, "global_step": 376812, "epoch": 2242} {"train_loss": -11.858359336853027, "global_step": 376813, "epoch": 2242} {"train_loss": -12.427422523498535, "global_step": 376814, "epoch": 2242} {"train_loss": -12.297296524047852, "global_step": 376815, "epoch": 2242} {"train_loss": -12.363338470458984, "global_step": 376816, "epoch": 2242} {"train_loss": -12.675802230834961, "global_step": 376817, "epoch": 2242} {"train_loss": -11.933042526245117, "global_step": 376818, "epoch": 2242} {"train_loss": -12.146354675292969, "global_step": 376819, "epoch": 2242} {"train_loss": -12.256479263305664, "global_step": 376820, "epoch": 2242} {"train_loss": -12.248703002929688, "global_step": 376821, "epoch": 2242} {"train_loss": -12.322970390319824, "global_step": 376822, "epoch": 2242} {"train_loss": -12.108382866496132, "global_step": 376823, "epoch": 2242, "val_loss": 294403.65625} {"train_loss": -12.182506561279297, "global_step": 376824, "epoch": 2243} {"train_loss": -12.373358726501465, "global_step": 376825, "epoch": 2243} {"train_loss": -11.70384693145752, "global_step": 376826, "epoch": 2243} {"train_loss": -12.558719635009766, "global_step": 376827, "epoch": 2243} {"train_loss": -12.455700874328613, "global_step": 376828, "epoch": 2243} {"train_loss": -12.345685005187988, "global_step": 376829, "epoch": 2243} {"train_loss": -12.515237808227539, "global_step": 376830, "epoch": 2243} {"train_loss": -12.154459953308105, "global_step": 376831, "epoch": 2243} {"train_loss": -12.254961967468262, "global_step": 376832, "epoch": 2243} {"train_loss": -12.602487564086914, "global_step": 376833, "epoch": 2243} {"train_loss": -12.430023193359375, "global_step": 376834, "epoch": 2243} {"train_loss": -12.532898902893066, "global_step": 376835, "epoch": 2243} {"train_loss": -12.558279037475586, "global_step": 376836, "epoch": 2243} {"train_loss": -12.525474548339844, "global_step": 376837, "epoch": 2243} {"train_loss": -12.623153686523438, "global_step": 376838, "epoch": 2243} {"train_loss": -12.627976417541504, "global_step": 376839, "epoch": 2243} {"train_loss": -12.527413368225098, "global_step": 376840, "epoch": 2243} {"train_loss": -12.299697875976562, "global_step": 376841, "epoch": 2243} {"train_loss": -12.438085556030273, "global_step": 376842, "epoch": 2243} {"train_loss": -12.350835800170898, "global_step": 376843, "epoch": 2243} {"train_loss": -12.401678085327148, "global_step": 376844, "epoch": 2243} {"train_loss": -12.565235137939453, "global_step": 376845, "epoch": 2243} {"train_loss": -12.750419616699219, "global_step": 376846, "epoch": 2243} {"train_loss": -12.650468826293945, "global_step": 376847, "epoch": 2243} {"train_loss": -12.442057609558105, "global_step": 376848, "epoch": 2243} {"train_loss": -12.555268287658691, "global_step": 376849, "epoch": 2243} {"train_loss": -12.762048721313477, "global_step": 376850, "epoch": 2243} {"train_loss": -12.41655445098877, "global_step": 376851, "epoch": 2243} {"train_loss": -12.505568504333496, "global_step": 376852, "epoch": 2243} {"train_loss": -12.899046897888184, "global_step": 376853, "epoch": 2243} {"train_loss": -12.429448127746582, "global_step": 376854, "epoch": 2243} {"train_loss": -12.572322845458984, "global_step": 376855, "epoch": 2243} {"train_loss": -12.405128479003906, "global_step": 376856, "epoch": 2243} {"train_loss": -12.489818572998047, "global_step": 376857, "epoch": 2243} {"train_loss": -12.753907203674316, "global_step": 376858, "epoch": 2243} {"train_loss": -12.49407958984375, "global_step": 376859, "epoch": 2243} {"train_loss": -12.374105453491211, "global_step": 376860, "epoch": 2243} {"train_loss": -12.479266166687012, "global_step": 376861, "epoch": 2243} {"train_loss": -12.637605667114258, "global_step": 376862, "epoch": 2243} {"train_loss": -11.802669525146484, "global_step": 376863, "epoch": 2243} {"train_loss": -11.732014656066895, "global_step": 376864, "epoch": 2243} {"train_loss": -12.261404037475586, "global_step": 376865, "epoch": 2243} {"train_loss": -12.090777397155762, "global_step": 376866, "epoch": 2243} {"train_loss": -11.389062881469727, "global_step": 376867, "epoch": 2243} {"train_loss": -11.539530754089355, "global_step": 376868, "epoch": 2243} {"train_loss": -12.153064727783203, "global_step": 376869, "epoch": 2243} {"train_loss": -10.906959533691406, "global_step": 376870, "epoch": 2243} {"train_loss": -10.764392852783203, "global_step": 376871, "epoch": 2243} {"train_loss": -11.805864334106445, "global_step": 376872, "epoch": 2243} {"train_loss": -11.190401077270508, "global_step": 376873, "epoch": 2243} {"train_loss": -11.413970947265625, "global_step": 376874, "epoch": 2243} {"train_loss": -11.584823608398438, "global_step": 376875, "epoch": 2243} {"train_loss": -10.598527908325195, "global_step": 376876, "epoch": 2243} {"train_loss": -10.048938751220703, "global_step": 376877, "epoch": 2243} {"train_loss": -12.058710098266602, "global_step": 376878, "epoch": 2243} {"train_loss": -11.295021057128906, "global_step": 376879, "epoch": 2243} {"train_loss": -11.991674423217773, "global_step": 376880, "epoch": 2243} {"train_loss": -10.33331298828125, "global_step": 376881, "epoch": 2243} {"train_loss": -11.351581573486328, "global_step": 376882, "epoch": 2243} {"train_loss": -11.257119178771973, "global_step": 376883, "epoch": 2243} {"train_loss": -10.791259765625, "global_step": 376884, "epoch": 2243} {"train_loss": -11.59917163848877, "global_step": 376885, "epoch": 2243} {"train_loss": -10.819327354431152, "global_step": 376886, "epoch": 2243} {"train_loss": -11.634541511535645, "global_step": 376887, "epoch": 2243} {"train_loss": -11.37204647064209, "global_step": 376888, "epoch": 2243} {"train_loss": -10.914901733398438, "global_step": 376889, "epoch": 2243} {"train_loss": -12.040620803833008, "global_step": 376890, "epoch": 2243} {"train_loss": -10.888256072998047, "global_step": 376891, "epoch": 2243} {"train_loss": -12.16657829284668, "global_step": 376892, "epoch": 2243} {"train_loss": -11.373464584350586, "global_step": 376893, "epoch": 2243} {"train_loss": -11.426006317138672, "global_step": 376894, "epoch": 2243} {"train_loss": -11.384056091308594, "global_step": 376895, "epoch": 2243} {"train_loss": -11.301177978515625, "global_step": 376896, "epoch": 2243} {"train_loss": -11.626585960388184, "global_step": 376897, "epoch": 2243} {"train_loss": -11.204408645629883, "global_step": 376898, "epoch": 2243} {"train_loss": -11.111879348754883, "global_step": 376899, "epoch": 2243} {"train_loss": -12.079817771911621, "global_step": 376900, "epoch": 2243} {"train_loss": -11.454679489135742, "global_step": 376901, "epoch": 2243} {"train_loss": -11.615836143493652, "global_step": 376902, "epoch": 2243} {"train_loss": -11.60811996459961, "global_step": 376903, "epoch": 2243} {"train_loss": -11.005606651306152, "global_step": 376904, "epoch": 2243} {"train_loss": -12.069811820983887, "global_step": 376905, "epoch": 2243} {"train_loss": -11.662188529968262, "global_step": 376906, "epoch": 2243} {"train_loss": -11.559537887573242, "global_step": 376907, "epoch": 2243} {"train_loss": -11.619526863098145, "global_step": 376908, "epoch": 2243} {"train_loss": -10.959848403930664, "global_step": 376909, "epoch": 2243} {"train_loss": -11.392374038696289, "global_step": 376910, "epoch": 2243} {"train_loss": -11.564521789550781, "global_step": 376911, "epoch": 2243} {"train_loss": -11.017084121704102, "global_step": 376912, "epoch": 2243} {"train_loss": -11.641069412231445, "global_step": 376913, "epoch": 2243} {"train_loss": -10.855793952941895, "global_step": 376914, "epoch": 2243} {"train_loss": -11.655595779418945, "global_step": 376915, "epoch": 2243} {"train_loss": -11.655370712280273, "global_step": 376916, "epoch": 2243} {"train_loss": -11.5533447265625, "global_step": 376917, "epoch": 2243} {"train_loss": -12.19435977935791, "global_step": 376918, "epoch": 2243} {"train_loss": -11.622198104858398, "global_step": 376919, "epoch": 2243} {"train_loss": -12.310892105102539, "global_step": 376920, "epoch": 2243} {"train_loss": -11.7964506149292, "global_step": 376921, "epoch": 2243} {"train_loss": -12.260320663452148, "global_step": 376922, "epoch": 2243} {"train_loss": -12.290105819702148, "global_step": 376923, "epoch": 2243} {"train_loss": -12.067889213562012, "global_step": 376924, "epoch": 2243} {"train_loss": -12.244915008544922, "global_step": 376925, "epoch": 2243} {"train_loss": -12.192039489746094, "global_step": 376926, "epoch": 2243} {"train_loss": -12.213214874267578, "global_step": 376927, "epoch": 2243} {"train_loss": -12.14057731628418, "global_step": 376928, "epoch": 2243} {"train_loss": -12.389450073242188, "global_step": 376929, "epoch": 2243} {"train_loss": -12.240069389343262, "global_step": 376930, "epoch": 2243} {"train_loss": -12.457616806030273, "global_step": 376931, "epoch": 2243} {"train_loss": -12.253074645996094, "global_step": 376932, "epoch": 2243} {"train_loss": -12.329985618591309, "global_step": 376933, "epoch": 2243} {"train_loss": -12.275259971618652, "global_step": 376934, "epoch": 2243} {"train_loss": -12.389400482177734, "global_step": 376935, "epoch": 2243} {"train_loss": -12.251729965209961, "global_step": 376936, "epoch": 2243} {"train_loss": -12.162559509277344, "global_step": 376937, "epoch": 2243} {"train_loss": -12.407123565673828, "global_step": 376938, "epoch": 2243} {"train_loss": -12.31246280670166, "global_step": 376939, "epoch": 2243} {"train_loss": -12.346709251403809, "global_step": 376940, "epoch": 2243} {"train_loss": -12.433062553405762, "global_step": 376941, "epoch": 2243} {"train_loss": -11.981473922729492, "global_step": 376942, "epoch": 2243} {"train_loss": -12.551918983459473, "global_step": 376943, "epoch": 2243} {"train_loss": -11.679389953613281, "global_step": 376944, "epoch": 2243} {"train_loss": -12.266183853149414, "global_step": 376945, "epoch": 2243} {"train_loss": -12.273685455322266, "global_step": 376946, "epoch": 2243} {"train_loss": -12.223133087158203, "global_step": 376947, "epoch": 2243} {"train_loss": -12.391094207763672, "global_step": 376948, "epoch": 2243} {"train_loss": -12.14303970336914, "global_step": 376949, "epoch": 2243} {"train_loss": -12.271271705627441, "global_step": 376950, "epoch": 2243} {"train_loss": -12.282537460327148, "global_step": 376951, "epoch": 2243} {"train_loss": -12.175196647644043, "global_step": 376952, "epoch": 2243} {"train_loss": -12.044918060302734, "global_step": 376953, "epoch": 2243} {"train_loss": -12.310670852661133, "global_step": 376954, "epoch": 2243} {"train_loss": -11.973810195922852, "global_step": 376955, "epoch": 2243} {"train_loss": -12.061372756958008, "global_step": 376956, "epoch": 2243} {"train_loss": -12.443280220031738, "global_step": 376957, "epoch": 2243} {"train_loss": -12.186614990234375, "global_step": 376958, "epoch": 2243} {"train_loss": -12.435983657836914, "global_step": 376959, "epoch": 2243} {"train_loss": -12.088371276855469, "global_step": 376960, "epoch": 2243} {"train_loss": -12.652204513549805, "global_step": 376961, "epoch": 2243} {"train_loss": -12.127115249633789, "global_step": 376962, "epoch": 2243} {"train_loss": -12.073898315429688, "global_step": 376963, "epoch": 2243} {"train_loss": -12.183797836303711, "global_step": 376964, "epoch": 2243} {"train_loss": -12.213895797729492, "global_step": 376965, "epoch": 2243} {"train_loss": -12.29412841796875, "global_step": 376966, "epoch": 2243} {"train_loss": -12.270881652832031, "global_step": 376967, "epoch": 2243} {"train_loss": -11.98731803894043, "global_step": 376968, "epoch": 2243} {"train_loss": -11.805219650268555, "global_step": 376969, "epoch": 2243} {"train_loss": -11.95683479309082, "global_step": 376970, "epoch": 2243} {"train_loss": -11.887313842773438, "global_step": 376971, "epoch": 2243} {"train_loss": -12.367274284362793, "global_step": 376972, "epoch": 2243} {"train_loss": -10.953672409057617, "global_step": 376973, "epoch": 2243} {"train_loss": -11.405184745788574, "global_step": 376974, "epoch": 2243} {"train_loss": -12.406753540039062, "global_step": 376975, "epoch": 2243} {"train_loss": -11.97061824798584, "global_step": 376976, "epoch": 2243} {"train_loss": -11.444225311279297, "global_step": 376977, "epoch": 2243} {"train_loss": -12.087605476379395, "global_step": 376978, "epoch": 2243} {"train_loss": -12.363580703735352, "global_step": 376979, "epoch": 2243} {"train_loss": -12.299579620361328, "global_step": 376980, "epoch": 2243} {"train_loss": -12.205381393432617, "global_step": 376981, "epoch": 2243} {"train_loss": -12.431760787963867, "global_step": 376982, "epoch": 2243} {"train_loss": -12.255282402038574, "global_step": 376983, "epoch": 2243} {"train_loss": -11.956015586853027, "global_step": 376984, "epoch": 2243} {"train_loss": -11.969691276550293, "global_step": 376985, "epoch": 2243} {"train_loss": -11.898329734802246, "global_step": 376986, "epoch": 2243} {"train_loss": -12.048223495483398, "global_step": 376987, "epoch": 2243} {"train_loss": -12.36683464050293, "global_step": 376988, "epoch": 2243} {"train_loss": -11.670816421508789, "global_step": 376989, "epoch": 2243} {"train_loss": -11.384149551391602, "global_step": 376990, "epoch": 2243} {"train_loss": -11.981435054824466, "global_step": 376991, "epoch": 2243, "val_loss": 287052.4375} {"train_loss": -11.235017776489258, "global_step": 376992, "epoch": 2244} {"train_loss": -12.034239768981934, "global_step": 376993, "epoch": 2244} {"train_loss": -11.61412239074707, "global_step": 376994, "epoch": 2244} {"train_loss": -11.260343551635742, "global_step": 376995, "epoch": 2244} {"train_loss": -12.349357604980469, "global_step": 376996, "epoch": 2244} {"train_loss": -11.915735244750977, "global_step": 376997, "epoch": 2244} {"train_loss": -11.688957214355469, "global_step": 376998, "epoch": 2244} {"train_loss": -11.79928207397461, "global_step": 376999, "epoch": 2244} {"train_loss": -11.56009292602539, "global_step": 377000, "epoch": 2244} {"train_loss": -11.98341178894043, "global_step": 377001, "epoch": 2244} {"train_loss": -11.474928855895996, "global_step": 377002, "epoch": 2244} {"train_loss": -12.330060958862305, "global_step": 377003, "epoch": 2244} {"train_loss": -11.969050407409668, "global_step": 377004, "epoch": 2244} {"train_loss": -12.31056022644043, "global_step": 377005, "epoch": 2244} {"train_loss": -12.359108924865723, "global_step": 377006, "epoch": 2244} {"train_loss": -12.084277153015137, "global_step": 377007, "epoch": 2244} {"train_loss": -12.251127243041992, "global_step": 377008, "epoch": 2244} {"train_loss": -12.29886245727539, "global_step": 377009, "epoch": 2244} {"train_loss": -12.533441543579102, "global_step": 377010, "epoch": 2244} {"train_loss": -12.13586711883545, "global_step": 377011, "epoch": 2244} {"train_loss": -12.514863967895508, "global_step": 377012, "epoch": 2244} {"train_loss": -12.369367599487305, "global_step": 377013, "epoch": 2244} {"train_loss": -12.568561553955078, "global_step": 377014, "epoch": 2244} {"train_loss": -12.427512168884277, "global_step": 377015, "epoch": 2244} {"train_loss": -12.315340042114258, "global_step": 377016, "epoch": 2244} {"train_loss": -12.42177963256836, "global_step": 377017, "epoch": 2244} {"train_loss": -12.207372665405273, "global_step": 377018, "epoch": 2244} {"train_loss": -12.477893829345703, "global_step": 377019, "epoch": 2244} {"train_loss": -12.261087417602539, "global_step": 377020, "epoch": 2244} {"train_loss": -12.441563606262207, "global_step": 377021, "epoch": 2244} {"train_loss": -12.586867332458496, "global_step": 377022, "epoch": 2244} {"train_loss": -12.390412330627441, "global_step": 377023, "epoch": 2244} {"train_loss": -12.491556167602539, "global_step": 377024, "epoch": 2244} {"train_loss": -12.009004592895508, "global_step": 377025, "epoch": 2244} {"train_loss": -12.422660827636719, "global_step": 377026, "epoch": 2244} {"train_loss": -12.640640258789062, "global_step": 377027, "epoch": 2244} {"train_loss": -12.236105918884277, "global_step": 377028, "epoch": 2244} {"train_loss": -12.312685012817383, "global_step": 377029, "epoch": 2244} {"train_loss": -12.112689971923828, "global_step": 377030, "epoch": 2244} {"train_loss": -11.821916580200195, "global_step": 377031, "epoch": 2244} {"train_loss": -12.519807815551758, "global_step": 377032, "epoch": 2244} {"train_loss": -11.820335388183594, "global_step": 377033, "epoch": 2244} {"train_loss": -12.252859115600586, "global_step": 377034, "epoch": 2244} {"train_loss": -11.830367088317871, "global_step": 377035, "epoch": 2244} {"train_loss": -11.958444595336914, "global_step": 377036, "epoch": 2244} {"train_loss": -11.881860733032227, "global_step": 377037, "epoch": 2244} {"train_loss": -11.331979751586914, "global_step": 377038, "epoch": 2244} {"train_loss": -12.187511444091797, "global_step": 377039, "epoch": 2244} {"train_loss": -11.894477844238281, "global_step": 377040, "epoch": 2244} {"train_loss": -11.551711082458496, "global_step": 377041, "epoch": 2244} {"train_loss": -11.71597671508789, "global_step": 377042, "epoch": 2244} {"train_loss": -11.080666542053223, "global_step": 377043, "epoch": 2244} {"train_loss": -12.089067459106445, "global_step": 377044, "epoch": 2244} {"train_loss": -11.636526107788086, "global_step": 377045, "epoch": 2244} {"train_loss": -12.019302368164062, "global_step": 377046, "epoch": 2244} {"train_loss": -12.217750549316406, "global_step": 377047, "epoch": 2244} {"train_loss": -10.865701675415039, "global_step": 377048, "epoch": 2244} {"train_loss": -12.06471061706543, "global_step": 377049, "epoch": 2244} {"train_loss": -10.783661842346191, "global_step": 377050, "epoch": 2244} {"train_loss": -11.583917617797852, "global_step": 377051, "epoch": 2244} {"train_loss": -12.040609359741211, "global_step": 377052, "epoch": 2244} {"train_loss": -11.109685897827148, "global_step": 377053, "epoch": 2244} {"train_loss": -12.180192947387695, "global_step": 377054, "epoch": 2244} {"train_loss": -11.060675621032715, "global_step": 377055, "epoch": 2244} {"train_loss": -12.329355239868164, "global_step": 377056, "epoch": 2244} {"train_loss": -10.898048400878906, "global_step": 377057, "epoch": 2244} {"train_loss": -11.68466567993164, "global_step": 377058, "epoch": 2244} {"train_loss": -11.75899887084961, "global_step": 377059, "epoch": 2244} {"train_loss": -11.418298721313477, "global_step": 377060, "epoch": 2244} {"train_loss": -11.697721481323242, "global_step": 377061, "epoch": 2244} {"train_loss": -11.078027725219727, "global_step": 377062, "epoch": 2244} {"train_loss": -12.324270248413086, "global_step": 377063, "epoch": 2244} {"train_loss": -11.096163749694824, "global_step": 377064, "epoch": 2244} {"train_loss": -11.857126235961914, "global_step": 377065, "epoch": 2244} {"train_loss": -11.341033935546875, "global_step": 377066, "epoch": 2244} {"train_loss": -11.712924003601074, "global_step": 377067, "epoch": 2244} {"train_loss": -11.54227066040039, "global_step": 377068, "epoch": 2244} {"train_loss": -12.215733528137207, "global_step": 377069, "epoch": 2244} {"train_loss": -12.243325233459473, "global_step": 377070, "epoch": 2244} {"train_loss": -11.954012870788574, "global_step": 377071, "epoch": 2244} {"train_loss": -11.956670761108398, "global_step": 377072, "epoch": 2244} {"train_loss": -11.842641830444336, "global_step": 377073, "epoch": 2244} {"train_loss": -12.358566284179688, "global_step": 377074, "epoch": 2244} {"train_loss": -11.958051681518555, "global_step": 377075, "epoch": 2244} {"train_loss": -12.049110412597656, "global_step": 377076, "epoch": 2244} {"train_loss": -11.760907173156738, "global_step": 377077, "epoch": 2244} {"train_loss": -12.166557312011719, "global_step": 377078, "epoch": 2244} {"train_loss": -11.796419143676758, "global_step": 377079, "epoch": 2244} {"train_loss": -12.450433731079102, "global_step": 377080, "epoch": 2244} {"train_loss": -11.736350059509277, "global_step": 377081, "epoch": 2244} {"train_loss": -12.225381851196289, "global_step": 377082, "epoch": 2244} {"train_loss": -11.742456436157227, "global_step": 377083, "epoch": 2244} {"train_loss": -12.16699504852295, "global_step": 377084, "epoch": 2244} {"train_loss": -11.964754104614258, "global_step": 377085, "epoch": 2244} {"train_loss": -12.358373641967773, "global_step": 377086, "epoch": 2244} {"train_loss": -11.951395034790039, "global_step": 377087, "epoch": 2244} {"train_loss": -12.474885940551758, "global_step": 377088, "epoch": 2244} {"train_loss": -12.155719757080078, "global_step": 377089, "epoch": 2244} {"train_loss": -12.265609741210938, "global_step": 377090, "epoch": 2244} {"train_loss": -12.525306701660156, "global_step": 377091, "epoch": 2244} {"train_loss": -12.201436042785645, "global_step": 377092, "epoch": 2244} {"train_loss": -12.408567428588867, "global_step": 377093, "epoch": 2244} {"train_loss": -12.408631324768066, "global_step": 377094, "epoch": 2244} {"train_loss": -12.25295639038086, "global_step": 377095, "epoch": 2244} {"train_loss": -11.963177680969238, "global_step": 377096, "epoch": 2244} {"train_loss": -12.310686111450195, "global_step": 377097, "epoch": 2244} {"train_loss": -12.310955047607422, "global_step": 377098, "epoch": 2244} {"train_loss": -12.179854393005371, "global_step": 377099, "epoch": 2244} {"train_loss": -12.342845916748047, "global_step": 377100, "epoch": 2244} {"train_loss": -12.195480346679688, "global_step": 377101, "epoch": 2244} {"train_loss": -12.435760498046875, "global_step": 377102, "epoch": 2244} {"train_loss": -12.451559066772461, "global_step": 377103, "epoch": 2244} {"train_loss": -12.087031364440918, "global_step": 377104, "epoch": 2244} {"train_loss": -11.878103256225586, "global_step": 377105, "epoch": 2244} {"train_loss": -12.279520034790039, "global_step": 377106, "epoch": 2244} {"train_loss": -12.534675598144531, "global_step": 377107, "epoch": 2244} {"train_loss": -12.056228637695312, "global_step": 377108, "epoch": 2244} {"train_loss": -12.292547225952148, "global_step": 377109, "epoch": 2244} {"train_loss": -12.541753768920898, "global_step": 377110, "epoch": 2244} {"train_loss": -12.299577713012695, "global_step": 377111, "epoch": 2244} {"train_loss": -12.396636009216309, "global_step": 377112, "epoch": 2244} {"train_loss": -12.390701293945312, "global_step": 377113, "epoch": 2244} {"train_loss": -12.426648139953613, "global_step": 377114, "epoch": 2244} {"train_loss": -12.248272895812988, "global_step": 377115, "epoch": 2244} {"train_loss": -12.542932510375977, "global_step": 377116, "epoch": 2244} {"train_loss": -12.639715194702148, "global_step": 377117, "epoch": 2244} {"train_loss": -12.450183868408203, "global_step": 377118, "epoch": 2244} {"train_loss": -12.432607650756836, "global_step": 377119, "epoch": 2244} {"train_loss": -12.467710494995117, "global_step": 377120, "epoch": 2244} {"train_loss": -12.6591215133667, "global_step": 377121, "epoch": 2244} {"train_loss": -12.328819274902344, "global_step": 377122, "epoch": 2244} {"train_loss": -12.318366050720215, "global_step": 377123, "epoch": 2244} {"train_loss": -12.712528228759766, "global_step": 377124, "epoch": 2244} {"train_loss": -12.331138610839844, "global_step": 377125, "epoch": 2244} {"train_loss": -11.890863418579102, "global_step": 377126, "epoch": 2244} {"train_loss": -12.026695251464844, "global_step": 377127, "epoch": 2244} {"train_loss": -11.991114616394043, "global_step": 377128, "epoch": 2244} {"train_loss": -12.260589599609375, "global_step": 377129, "epoch": 2244} {"train_loss": -11.853622436523438, "global_step": 377130, "epoch": 2244} {"train_loss": -12.378976821899414, "global_step": 377131, "epoch": 2244} {"train_loss": -11.952876091003418, "global_step": 377132, "epoch": 2244} {"train_loss": -12.544705390930176, "global_step": 377133, "epoch": 2244} {"train_loss": -11.703171730041504, "global_step": 377134, "epoch": 2244} {"train_loss": -11.807781219482422, "global_step": 377135, "epoch": 2244} {"train_loss": -11.506227493286133, "global_step": 377136, "epoch": 2244} {"train_loss": -12.342528343200684, "global_step": 377137, "epoch": 2244} {"train_loss": -12.340957641601562, "global_step": 377138, "epoch": 2244} {"train_loss": -12.21278190612793, "global_step": 377139, "epoch": 2244} {"train_loss": -11.960111618041992, "global_step": 377140, "epoch": 2244} {"train_loss": -11.744035720825195, "global_step": 377141, "epoch": 2244} {"train_loss": -12.268428802490234, "global_step": 377142, "epoch": 2244} {"train_loss": -11.920995712280273, "global_step": 377143, "epoch": 2244} {"train_loss": -12.303897857666016, "global_step": 377144, "epoch": 2244} {"train_loss": -12.408735275268555, "global_step": 377145, "epoch": 2244} {"train_loss": -12.509078025817871, "global_step": 377146, "epoch": 2244} {"train_loss": -12.438850402832031, "global_step": 377147, "epoch": 2244} {"train_loss": -12.008814811706543, "global_step": 377148, "epoch": 2244} {"train_loss": -11.944300651550293, "global_step": 377149, "epoch": 2244} {"train_loss": -12.597764015197754, "global_step": 377150, "epoch": 2244} {"train_loss": -11.943622589111328, "global_step": 377151, "epoch": 2244} {"train_loss": -11.978948593139648, "global_step": 377152, "epoch": 2244} {"train_loss": -11.544651985168457, "global_step": 377153, "epoch": 2244} {"train_loss": -11.429752349853516, "global_step": 377154, "epoch": 2244} {"train_loss": -11.680105209350586, "global_step": 377155, "epoch": 2244} {"train_loss": -11.487991333007812, "global_step": 377156, "epoch": 2244} {"train_loss": -11.034149169921875, "global_step": 377157, "epoch": 2244} {"train_loss": -11.666482925415039, "global_step": 377158, "epoch": 2244} {"train_loss": -12.039094595682053, "global_step": 377159, "epoch": 2244, "val_loss": 293004.28125} {"train_loss": -11.460526466369629, "global_step": 377160, "epoch": 2245} {"train_loss": -9.009645462036133, "global_step": 377161, "epoch": 2245} {"train_loss": -10.73479175567627, "global_step": 377162, "epoch": 2245} {"train_loss": -10.289091110229492, "global_step": 377163, "epoch": 2245} {"train_loss": -10.185887336730957, "global_step": 377164, "epoch": 2245} {"train_loss": -10.754003524780273, "global_step": 377165, "epoch": 2245} {"train_loss": -8.819721221923828, "global_step": 377166, "epoch": 2245} {"train_loss": -11.19681453704834, "global_step": 377167, "epoch": 2245} {"train_loss": -9.465855598449707, "global_step": 377168, "epoch": 2245} {"train_loss": -7.89129638671875, "global_step": 377169, "epoch": 2245} {"train_loss": -8.746891021728516, "global_step": 377170, "epoch": 2245} {"train_loss": -10.451751708984375, "global_step": 377171, "epoch": 2245} {"train_loss": -8.77530288696289, "global_step": 377172, "epoch": 2245} {"train_loss": -10.125648498535156, "global_step": 377173, "epoch": 2245} {"train_loss": -9.599189758300781, "global_step": 377174, "epoch": 2245} {"train_loss": -9.302621841430664, "global_step": 377175, "epoch": 2245} {"train_loss": -8.69871711730957, "global_step": 377176, "epoch": 2245} {"train_loss": -11.617156982421875, "global_step": 377177, "epoch": 2245} {"train_loss": -9.006280899047852, "global_step": 377178, "epoch": 2245} {"train_loss": -10.652692794799805, "global_step": 377179, "epoch": 2245} {"train_loss": -11.418875694274902, "global_step": 377180, "epoch": 2245} {"train_loss": -10.248960494995117, "global_step": 377181, "epoch": 2245} {"train_loss": -11.15413761138916, "global_step": 377182, "epoch": 2245} {"train_loss": -11.311466217041016, "global_step": 377183, "epoch": 2245} {"train_loss": -11.091894149780273, "global_step": 377184, "epoch": 2245} {"train_loss": -11.165874481201172, "global_step": 377185, "epoch": 2245} {"train_loss": -11.544136047363281, "global_step": 377186, "epoch": 2245} {"train_loss": -11.279227256774902, "global_step": 377187, "epoch": 2245} {"train_loss": -11.563896179199219, "global_step": 377188, "epoch": 2245} {"train_loss": -11.894466400146484, "global_step": 377189, "epoch": 2245} {"train_loss": -11.749671936035156, "global_step": 377190, "epoch": 2245} {"train_loss": -12.07381534576416, "global_step": 377191, "epoch": 2245} {"train_loss": -11.730876922607422, "global_step": 377192, "epoch": 2245} {"train_loss": -12.028876304626465, "global_step": 377193, "epoch": 2245} {"train_loss": -11.862884521484375, "global_step": 377194, "epoch": 2245} {"train_loss": -11.691998481750488, "global_step": 377195, "epoch": 2245} {"train_loss": -12.22438907623291, "global_step": 377196, "epoch": 2245} {"train_loss": -11.886482238769531, "global_step": 377197, "epoch": 2245} {"train_loss": -12.024335861206055, "global_step": 377198, "epoch": 2245} {"train_loss": -11.80630111694336, "global_step": 377199, "epoch": 2245} {"train_loss": -11.873016357421875, "global_step": 377200, "epoch": 2245} {"train_loss": -12.23548698425293, "global_step": 377201, "epoch": 2245} {"train_loss": -12.07607650756836, "global_step": 377202, "epoch": 2245} {"train_loss": -12.133437156677246, "global_step": 377203, "epoch": 2245} {"train_loss": -12.07888126373291, "global_step": 377204, "epoch": 2245} {"train_loss": -12.257463455200195, "global_step": 377205, "epoch": 2245} {"train_loss": -12.017569541931152, "global_step": 377206, "epoch": 2245} {"train_loss": -12.217479705810547, "global_step": 377207, "epoch": 2245} {"train_loss": -12.153597831726074, "global_step": 377208, "epoch": 2245} {"train_loss": -12.177472114562988, "global_step": 377209, "epoch": 2245} {"train_loss": -12.270719528198242, "global_step": 377210, "epoch": 2245} {"train_loss": -12.213159561157227, "global_step": 377211, "epoch": 2245} {"train_loss": -12.450697898864746, "global_step": 377212, "epoch": 2245} {"train_loss": -12.165695190429688, "global_step": 377213, "epoch": 2245} {"train_loss": -12.32886791229248, "global_step": 377214, "epoch": 2245} {"train_loss": -12.224894523620605, "global_step": 377215, "epoch": 2245} {"train_loss": -12.189294815063477, "global_step": 377216, "epoch": 2245} {"train_loss": -12.409404754638672, "global_step": 377217, "epoch": 2245} {"train_loss": -12.319488525390625, "global_step": 377218, "epoch": 2245} {"train_loss": -12.35345458984375, "global_step": 377219, "epoch": 2245} {"train_loss": -12.15213394165039, "global_step": 377220, "epoch": 2245} {"train_loss": -12.137750625610352, "global_step": 377221, "epoch": 2245} {"train_loss": -12.328203201293945, "global_step": 377222, "epoch": 2245} {"train_loss": -12.448948860168457, "global_step": 377223, "epoch": 2245} {"train_loss": -12.355685234069824, "global_step": 377224, "epoch": 2245} {"train_loss": -12.183307647705078, "global_step": 377225, "epoch": 2245} {"train_loss": -12.601638793945312, "global_step": 377226, "epoch": 2245} {"train_loss": -12.520002365112305, "global_step": 377227, "epoch": 2245} {"train_loss": -12.190364837646484, "global_step": 377228, "epoch": 2245} {"train_loss": -12.445488929748535, "global_step": 377229, "epoch": 2245} {"train_loss": -12.341209411621094, "global_step": 377230, "epoch": 2245} {"train_loss": -12.654338836669922, "global_step": 377231, "epoch": 2245} {"train_loss": -12.384565353393555, "global_step": 377232, "epoch": 2245} {"train_loss": -12.67534351348877, "global_step": 377233, "epoch": 2245} {"train_loss": -12.414777755737305, "global_step": 377234, "epoch": 2245} {"train_loss": -12.442309379577637, "global_step": 377235, "epoch": 2245} {"train_loss": -12.305821418762207, "global_step": 377236, "epoch": 2245} {"train_loss": -12.573612213134766, "global_step": 377237, "epoch": 2245} {"train_loss": -12.386910438537598, "global_step": 377238, "epoch": 2245} {"train_loss": -12.547590255737305, "global_step": 377239, "epoch": 2245} {"train_loss": -12.688488006591797, "global_step": 377240, "epoch": 2245} {"train_loss": -12.277400970458984, "global_step": 377241, "epoch": 2245} {"train_loss": -12.670618057250977, "global_step": 377242, "epoch": 2245} {"train_loss": -12.727184295654297, "global_step": 377243, "epoch": 2245} {"train_loss": -12.68757438659668, "global_step": 377244, "epoch": 2245} {"train_loss": -12.543500900268555, "global_step": 377245, "epoch": 2245} {"train_loss": -12.692025184631348, "global_step": 377246, "epoch": 2245} {"train_loss": -12.679462432861328, "global_step": 377247, "epoch": 2245} {"train_loss": -12.6156587600708, "global_step": 377248, "epoch": 2245} {"train_loss": -12.625507354736328, "global_step": 377249, "epoch": 2245} {"train_loss": -12.554680824279785, "global_step": 377250, "epoch": 2245} {"train_loss": -12.619439125061035, "global_step": 377251, "epoch": 2245} {"train_loss": -12.709847450256348, "global_step": 377252, "epoch": 2245} {"train_loss": -12.641778945922852, "global_step": 377253, "epoch": 2245} {"train_loss": -12.51340103149414, "global_step": 377254, "epoch": 2245} {"train_loss": -12.66835880279541, "global_step": 377255, "epoch": 2245} {"train_loss": -12.49860954284668, "global_step": 377256, "epoch": 2245} {"train_loss": -12.679947853088379, "global_step": 377257, "epoch": 2245} {"train_loss": -12.838363647460938, "global_step": 377258, "epoch": 2245} {"train_loss": -12.446924209594727, "global_step": 377259, "epoch": 2245} {"train_loss": -12.630059242248535, "global_step": 377260, "epoch": 2245} {"train_loss": -12.623058319091797, "global_step": 377261, "epoch": 2245} {"train_loss": -12.619424819946289, "global_step": 377262, "epoch": 2245} {"train_loss": -12.194520950317383, "global_step": 377263, "epoch": 2245} {"train_loss": -12.618898391723633, "global_step": 377264, "epoch": 2245} {"train_loss": -12.407800674438477, "global_step": 377265, "epoch": 2245} {"train_loss": -12.326769828796387, "global_step": 377266, "epoch": 2245} {"train_loss": -12.660882949829102, "global_step": 377267, "epoch": 2245} {"train_loss": -12.12071418762207, "global_step": 377268, "epoch": 2245} {"train_loss": -12.266300201416016, "global_step": 377269, "epoch": 2245} {"train_loss": -12.656330108642578, "global_step": 377270, "epoch": 2245} {"train_loss": -12.173812866210938, "global_step": 377271, "epoch": 2245} {"train_loss": -12.629638671875, "global_step": 377272, "epoch": 2245} {"train_loss": -12.639742851257324, "global_step": 377273, "epoch": 2245} {"train_loss": -12.335506439208984, "global_step": 377274, "epoch": 2245} {"train_loss": -11.933935165405273, "global_step": 377275, "epoch": 2245} {"train_loss": -12.785663604736328, "global_step": 377276, "epoch": 2245} {"train_loss": -12.5048828125, "global_step": 377277, "epoch": 2245} {"train_loss": -12.52581787109375, "global_step": 377278, "epoch": 2245} {"train_loss": -12.293290138244629, "global_step": 377279, "epoch": 2245} {"train_loss": -12.582737922668457, "global_step": 377280, "epoch": 2245} {"train_loss": -12.572661399841309, "global_step": 377281, "epoch": 2245} {"train_loss": -12.5894775390625, "global_step": 377282, "epoch": 2245} {"train_loss": -12.462080001831055, "global_step": 377283, "epoch": 2245} {"train_loss": -12.663711547851562, "global_step": 377284, "epoch": 2245} {"train_loss": -12.436067581176758, "global_step": 377285, "epoch": 2245} {"train_loss": -12.468347549438477, "global_step": 377286, "epoch": 2245} {"train_loss": -12.604689598083496, "global_step": 377287, "epoch": 2245} {"train_loss": -12.782142639160156, "global_step": 377288, "epoch": 2245} {"train_loss": -12.58649730682373, "global_step": 377289, "epoch": 2245} {"train_loss": -12.552762985229492, "global_step": 377290, "epoch": 2245} {"train_loss": -12.511842727661133, "global_step": 377291, "epoch": 2245} {"train_loss": -12.623214721679688, "global_step": 377292, "epoch": 2245} {"train_loss": -12.311809539794922, "global_step": 377293, "epoch": 2245} {"train_loss": -12.584695816040039, "global_step": 377294, "epoch": 2245} {"train_loss": -12.527917861938477, "global_step": 377295, "epoch": 2245} {"train_loss": -12.103325843811035, "global_step": 377296, "epoch": 2245} {"train_loss": -12.235870361328125, "global_step": 377297, "epoch": 2245} {"train_loss": -12.362934112548828, "global_step": 377298, "epoch": 2245} {"train_loss": -12.41787338256836, "global_step": 377299, "epoch": 2245} {"train_loss": -12.809239387512207, "global_step": 377300, "epoch": 2245} {"train_loss": -12.65414810180664, "global_step": 377301, "epoch": 2245} {"train_loss": -12.607053756713867, "global_step": 377302, "epoch": 2245} {"train_loss": -12.51381778717041, "global_step": 377303, "epoch": 2245} {"train_loss": -12.602251052856445, "global_step": 377304, "epoch": 2245} {"train_loss": -12.55145263671875, "global_step": 377305, "epoch": 2245} {"train_loss": -12.283477783203125, "global_step": 377306, "epoch": 2245} {"train_loss": -12.524358749389648, "global_step": 377307, "epoch": 2245} {"train_loss": -12.027830123901367, "global_step": 377308, "epoch": 2245} {"train_loss": -12.172809600830078, "global_step": 377309, "epoch": 2245} {"train_loss": -11.917795181274414, "global_step": 377310, "epoch": 2245} {"train_loss": -12.41983413696289, "global_step": 377311, "epoch": 2245} {"train_loss": -11.23617172241211, "global_step": 377312, "epoch": 2245} {"train_loss": -12.193122863769531, "global_step": 377313, "epoch": 2245} {"train_loss": -11.719382286071777, "global_step": 377314, "epoch": 2245} {"train_loss": -12.32921028137207, "global_step": 377315, "epoch": 2245} {"train_loss": -12.169734954833984, "global_step": 377316, "epoch": 2245} {"train_loss": -12.161426544189453, "global_step": 377317, "epoch": 2245} {"train_loss": -11.613943099975586, "global_step": 377318, "epoch": 2245} {"train_loss": -11.732336044311523, "global_step": 377319, "epoch": 2245} {"train_loss": -11.861054420471191, "global_step": 377320, "epoch": 2245} {"train_loss": -12.224325180053711, "global_step": 377321, "epoch": 2245} {"train_loss": -11.806352615356445, "global_step": 377322, "epoch": 2245} {"train_loss": -11.758930206298828, "global_step": 377323, "epoch": 2245} {"train_loss": -11.203971862792969, "global_step": 377324, "epoch": 2245} {"train_loss": -12.051778793334961, "global_step": 377325, "epoch": 2245} {"train_loss": -11.866455078125, "global_step": 377326, "epoch": 2245} {"train_loss": -11.968510406357902, "global_step": 377327, "epoch": 2245, "val_loss": 293381.5, "train_action_mse_error": 1.4904776811599731} {"train_loss": -11.747568130493164, "global_step": 377328, "epoch": 2246} {"train_loss": -11.89529800415039, "global_step": 377329, "epoch": 2246} {"train_loss": -12.18135929107666, "global_step": 377330, "epoch": 2246} {"train_loss": -11.932671546936035, "global_step": 377331, "epoch": 2246} {"train_loss": -11.457740783691406, "global_step": 377332, "epoch": 2246} {"train_loss": -12.201580047607422, "global_step": 377333, "epoch": 2246} {"train_loss": -12.215734481811523, "global_step": 377334, "epoch": 2246} {"train_loss": -11.963430404663086, "global_step": 377335, "epoch": 2246} {"train_loss": -12.279012680053711, "global_step": 377336, "epoch": 2246} {"train_loss": -12.150440216064453, "global_step": 377337, "epoch": 2246} {"train_loss": -11.276687622070312, "global_step": 377338, "epoch": 2246} {"train_loss": -12.393397331237793, "global_step": 377339, "epoch": 2246} {"train_loss": -11.729558944702148, "global_step": 377340, "epoch": 2246} {"train_loss": -11.99869155883789, "global_step": 377341, "epoch": 2246} {"train_loss": -11.98851203918457, "global_step": 377342, "epoch": 2246} {"train_loss": -11.972225189208984, "global_step": 377343, "epoch": 2246} {"train_loss": -12.29647159576416, "global_step": 377344, "epoch": 2246} {"train_loss": -12.078027725219727, "global_step": 377345, "epoch": 2246} {"train_loss": -12.142298698425293, "global_step": 377346, "epoch": 2246} {"train_loss": -11.745875358581543, "global_step": 377347, "epoch": 2246} {"train_loss": -12.157556533813477, "global_step": 377348, "epoch": 2246} {"train_loss": -12.108644485473633, "global_step": 377349, "epoch": 2246} {"train_loss": -11.920915603637695, "global_step": 377350, "epoch": 2246} {"train_loss": -11.844159126281738, "global_step": 377351, "epoch": 2246} {"train_loss": -10.139270782470703, "global_step": 377352, "epoch": 2246} {"train_loss": -11.206377983093262, "global_step": 377353, "epoch": 2246} {"train_loss": -11.255849838256836, "global_step": 377354, "epoch": 2246} {"train_loss": -10.023167610168457, "global_step": 377355, "epoch": 2246} {"train_loss": -11.978353500366211, "global_step": 377356, "epoch": 2246} {"train_loss": -9.715215682983398, "global_step": 377357, "epoch": 2246} {"train_loss": -12.067798614501953, "global_step": 377358, "epoch": 2246} {"train_loss": -10.584782600402832, "global_step": 377359, "epoch": 2246} {"train_loss": -11.51571273803711, "global_step": 377360, "epoch": 2246} {"train_loss": -11.780258178710938, "global_step": 377361, "epoch": 2246} {"train_loss": -11.667627334594727, "global_step": 377362, "epoch": 2246} {"train_loss": -11.77059555053711, "global_step": 377363, "epoch": 2246} {"train_loss": -12.07651424407959, "global_step": 377364, "epoch": 2246} {"train_loss": -11.911890029907227, "global_step": 377365, "epoch": 2246} {"train_loss": -12.312921524047852, "global_step": 377366, "epoch": 2246} {"train_loss": -11.626676559448242, "global_step": 377367, "epoch": 2246} {"train_loss": -12.221220016479492, "global_step": 377368, "epoch": 2246} {"train_loss": -11.850001335144043, "global_step": 377369, "epoch": 2246} {"train_loss": -11.783082008361816, "global_step": 377370, "epoch": 2246} {"train_loss": -12.101509094238281, "global_step": 377371, "epoch": 2246} {"train_loss": -12.141107559204102, "global_step": 377372, "epoch": 2246} {"train_loss": -12.118782043457031, "global_step": 377373, "epoch": 2246} {"train_loss": -12.198040008544922, "global_step": 377374, "epoch": 2246} {"train_loss": -12.211750984191895, "global_step": 377375, "epoch": 2246} {"train_loss": -12.208780288696289, "global_step": 377376, "epoch": 2246} {"train_loss": -12.170632362365723, "global_step": 377377, "epoch": 2246} {"train_loss": -12.252166748046875, "global_step": 377378, "epoch": 2246} {"train_loss": -12.35301399230957, "global_step": 377379, "epoch": 2246} {"train_loss": -12.435023307800293, "global_step": 377380, "epoch": 2246} {"train_loss": -11.525518417358398, "global_step": 377381, "epoch": 2246} {"train_loss": -12.29630184173584, "global_step": 377382, "epoch": 2246} {"train_loss": -12.026959419250488, "global_step": 377383, "epoch": 2246} {"train_loss": -12.467632293701172, "global_step": 377384, "epoch": 2246} {"train_loss": -11.833039283752441, "global_step": 377385, "epoch": 2246} {"train_loss": -12.38774299621582, "global_step": 377386, "epoch": 2246} {"train_loss": -11.929993629455566, "global_step": 377387, "epoch": 2246} {"train_loss": -12.081223487854004, "global_step": 377388, "epoch": 2246} {"train_loss": -12.249448776245117, "global_step": 377389, "epoch": 2246} {"train_loss": -12.325403213500977, "global_step": 377390, "epoch": 2246} {"train_loss": -11.735700607299805, "global_step": 377391, "epoch": 2246} {"train_loss": -12.163745880126953, "global_step": 377392, "epoch": 2246} {"train_loss": -12.509905815124512, "global_step": 377393, "epoch": 2246} {"train_loss": -11.822037696838379, "global_step": 377394, "epoch": 2246} {"train_loss": -12.035932540893555, "global_step": 377395, "epoch": 2246} {"train_loss": -12.169681549072266, "global_step": 377396, "epoch": 2246} {"train_loss": -11.661657333374023, "global_step": 377397, "epoch": 2246} {"train_loss": -12.021246910095215, "global_step": 377398, "epoch": 2246} {"train_loss": -12.389019012451172, "global_step": 377399, "epoch": 2246} {"train_loss": -12.084234237670898, "global_step": 377400, "epoch": 2246} {"train_loss": -12.214401245117188, "global_step": 377401, "epoch": 2246} {"train_loss": -12.261788368225098, "global_step": 377402, "epoch": 2246} {"train_loss": -12.318641662597656, "global_step": 377403, "epoch": 2246} {"train_loss": -12.326078414916992, "global_step": 377404, "epoch": 2246} {"train_loss": -12.231711387634277, "global_step": 377405, "epoch": 2246} {"train_loss": -12.307730674743652, "global_step": 377406, "epoch": 2246} {"train_loss": -11.762887954711914, "global_step": 377407, "epoch": 2246} {"train_loss": -11.9087495803833, "global_step": 377408, "epoch": 2246} {"train_loss": -11.437169075012207, "global_step": 377409, "epoch": 2246} {"train_loss": -12.062300682067871, "global_step": 377410, "epoch": 2246} {"train_loss": -11.912439346313477, "global_step": 377411, "epoch": 2246} {"train_loss": -12.393020629882812, "global_step": 377412, "epoch": 2246} {"train_loss": -11.89569091796875, "global_step": 377413, "epoch": 2246} {"train_loss": -12.43589973449707, "global_step": 377414, "epoch": 2246} {"train_loss": -11.70223617553711, "global_step": 377415, "epoch": 2246} {"train_loss": -11.261189460754395, "global_step": 377416, "epoch": 2246} {"train_loss": -12.699831008911133, "global_step": 377417, "epoch": 2246} {"train_loss": -11.266658782958984, "global_step": 377418, "epoch": 2246} {"train_loss": -11.836465835571289, "global_step": 377419, "epoch": 2246} {"train_loss": -11.533384323120117, "global_step": 377420, "epoch": 2246} {"train_loss": -12.05927562713623, "global_step": 377421, "epoch": 2246} {"train_loss": -10.797321319580078, "global_step": 377422, "epoch": 2246} {"train_loss": -11.612245559692383, "global_step": 377423, "epoch": 2246} {"train_loss": -11.15073299407959, "global_step": 377424, "epoch": 2246} {"train_loss": -11.890935897827148, "global_step": 377425, "epoch": 2246} {"train_loss": -11.454784393310547, "global_step": 377426, "epoch": 2246} {"train_loss": -11.859188079833984, "global_step": 377427, "epoch": 2246} {"train_loss": -11.34756851196289, "global_step": 377428, "epoch": 2246} {"train_loss": -12.29232120513916, "global_step": 377429, "epoch": 2246} {"train_loss": -11.86166763305664, "global_step": 377430, "epoch": 2246} {"train_loss": -11.884425163269043, "global_step": 377431, "epoch": 2246} {"train_loss": -12.089432716369629, "global_step": 377432, "epoch": 2246} {"train_loss": -12.040409088134766, "global_step": 377433, "epoch": 2246} {"train_loss": -12.148115158081055, "global_step": 377434, "epoch": 2246} {"train_loss": -12.37717056274414, "global_step": 377435, "epoch": 2246} {"train_loss": -11.9811372756958, "global_step": 377436, "epoch": 2246} {"train_loss": -12.077692031860352, "global_step": 377437, "epoch": 2246} {"train_loss": -12.362324714660645, "global_step": 377438, "epoch": 2246} {"train_loss": -12.352811813354492, "global_step": 377439, "epoch": 2246} {"train_loss": -12.538400650024414, "global_step": 377440, "epoch": 2246} {"train_loss": -12.10769271850586, "global_step": 377441, "epoch": 2246} {"train_loss": -12.630430221557617, "global_step": 377442, "epoch": 2246} {"train_loss": -12.173975944519043, "global_step": 377443, "epoch": 2246} {"train_loss": -12.243276596069336, "global_step": 377444, "epoch": 2246} {"train_loss": -12.474079132080078, "global_step": 377445, "epoch": 2246} {"train_loss": -12.030847549438477, "global_step": 377446, "epoch": 2246} {"train_loss": -12.515430450439453, "global_step": 377447, "epoch": 2246} {"train_loss": -11.774452209472656, "global_step": 377448, "epoch": 2246} {"train_loss": -11.962503433227539, "global_step": 377449, "epoch": 2246} {"train_loss": -12.287002563476562, "global_step": 377450, "epoch": 2246} {"train_loss": -12.15853214263916, "global_step": 377451, "epoch": 2246} {"train_loss": -11.823436737060547, "global_step": 377452, "epoch": 2246} {"train_loss": -12.108953475952148, "global_step": 377453, "epoch": 2246} {"train_loss": -11.777417182922363, "global_step": 377454, "epoch": 2246} {"train_loss": -11.995634078979492, "global_step": 377455, "epoch": 2246} {"train_loss": -11.961231231689453, "global_step": 377456, "epoch": 2246} {"train_loss": -11.609720230102539, "global_step": 377457, "epoch": 2246} {"train_loss": -11.54521369934082, "global_step": 377458, "epoch": 2246} {"train_loss": -11.958988189697266, "global_step": 377459, "epoch": 2246} {"train_loss": -10.914281845092773, "global_step": 377460, "epoch": 2246} {"train_loss": -11.471036911010742, "global_step": 377461, "epoch": 2246} {"train_loss": -11.44626235961914, "global_step": 377462, "epoch": 2246} {"train_loss": -10.896280288696289, "global_step": 377463, "epoch": 2246} {"train_loss": -12.308937072753906, "global_step": 377464, "epoch": 2246} {"train_loss": -11.327106475830078, "global_step": 377465, "epoch": 2246} {"train_loss": -12.165736198425293, "global_step": 377466, "epoch": 2246} {"train_loss": -11.667360305786133, "global_step": 377467, "epoch": 2246} {"train_loss": -12.28209114074707, "global_step": 377468, "epoch": 2246} {"train_loss": -11.704681396484375, "global_step": 377469, "epoch": 2246} {"train_loss": -12.157801628112793, "global_step": 377470, "epoch": 2246} {"train_loss": -11.150960922241211, "global_step": 377471, "epoch": 2246} {"train_loss": -11.831193923950195, "global_step": 377472, "epoch": 2246} {"train_loss": -11.979944229125977, "global_step": 377473, "epoch": 2246} {"train_loss": -11.479828834533691, "global_step": 377474, "epoch": 2246} {"train_loss": -12.135254859924316, "global_step": 377475, "epoch": 2246} {"train_loss": -11.582508087158203, "global_step": 377476, "epoch": 2246} {"train_loss": -11.467314720153809, "global_step": 377477, "epoch": 2246} {"train_loss": -12.243120193481445, "global_step": 377478, "epoch": 2246} {"train_loss": -11.409688949584961, "global_step": 377479, "epoch": 2246} {"train_loss": -11.806591033935547, "global_step": 377480, "epoch": 2246} {"train_loss": -12.269733428955078, "global_step": 377481, "epoch": 2246} {"train_loss": -11.745501518249512, "global_step": 377482, "epoch": 2246} {"train_loss": -12.045797348022461, "global_step": 377483, "epoch": 2246} {"train_loss": -11.697978973388672, "global_step": 377484, "epoch": 2246} {"train_loss": -11.980474472045898, "global_step": 377485, "epoch": 2246} {"train_loss": -12.016886711120605, "global_step": 377486, "epoch": 2246} {"train_loss": -12.554913520812988, "global_step": 377487, "epoch": 2246} {"train_loss": -12.033157348632812, "global_step": 377488, "epoch": 2246} {"train_loss": -11.78668212890625, "global_step": 377489, "epoch": 2246} {"train_loss": -12.134248733520508, "global_step": 377490, "epoch": 2246} {"train_loss": -12.10423755645752, "global_step": 377491, "epoch": 2246} {"train_loss": -11.791753768920898, "global_step": 377492, "epoch": 2246} {"train_loss": -11.88215446472168, "global_step": 377493, "epoch": 2246} {"train_loss": -12.323807716369629, "global_step": 377494, "epoch": 2246} {"train_loss": -11.91573220775241, "global_step": 377495, "epoch": 2246, "val_loss": 288767.625} {"train_loss": -11.891944885253906, "global_step": 377496, "epoch": 2247} {"train_loss": -12.181245803833008, "global_step": 377497, "epoch": 2247} {"train_loss": -11.906925201416016, "global_step": 377498, "epoch": 2247} {"train_loss": -12.341651916503906, "global_step": 377499, "epoch": 2247} {"train_loss": -12.127761840820312, "global_step": 377500, "epoch": 2247} {"train_loss": -12.276456832885742, "global_step": 377501, "epoch": 2247} {"train_loss": -12.33568286895752, "global_step": 377502, "epoch": 2247} {"train_loss": -12.035297393798828, "global_step": 377503, "epoch": 2247} {"train_loss": -12.493817329406738, "global_step": 377504, "epoch": 2247} {"train_loss": -12.065929412841797, "global_step": 377505, "epoch": 2247} {"train_loss": -12.421138763427734, "global_step": 377506, "epoch": 2247} {"train_loss": -12.140254974365234, "global_step": 377507, "epoch": 2247} {"train_loss": -12.504960060119629, "global_step": 377508, "epoch": 2247} {"train_loss": -12.484148025512695, "global_step": 377509, "epoch": 2247} {"train_loss": -12.172529220581055, "global_step": 377510, "epoch": 2247} {"train_loss": -12.463631629943848, "global_step": 377511, "epoch": 2247} {"train_loss": -12.226812362670898, "global_step": 377512, "epoch": 2247} {"train_loss": -12.560762405395508, "global_step": 377513, "epoch": 2247} {"train_loss": -12.538389205932617, "global_step": 377514, "epoch": 2247} {"train_loss": -12.20869255065918, "global_step": 377515, "epoch": 2247} {"train_loss": -12.595959663391113, "global_step": 377516, "epoch": 2247} {"train_loss": -12.580766677856445, "global_step": 377517, "epoch": 2247} {"train_loss": -12.289379119873047, "global_step": 377518, "epoch": 2247} {"train_loss": -12.265031814575195, "global_step": 377519, "epoch": 2247} {"train_loss": -12.237796783447266, "global_step": 377520, "epoch": 2247} {"train_loss": -12.529838562011719, "global_step": 377521, "epoch": 2247} {"train_loss": -11.985159873962402, "global_step": 377522, "epoch": 2247} {"train_loss": -12.17007064819336, "global_step": 377523, "epoch": 2247} {"train_loss": -11.848085403442383, "global_step": 377524, "epoch": 2247} {"train_loss": -11.735212326049805, "global_step": 377525, "epoch": 2247} {"train_loss": -11.397663116455078, "global_step": 377526, "epoch": 2247} {"train_loss": -11.748095512390137, "global_step": 377527, "epoch": 2247} {"train_loss": -11.41304874420166, "global_step": 377528, "epoch": 2247} {"train_loss": -12.344371795654297, "global_step": 377529, "epoch": 2247} {"train_loss": -11.172825813293457, "global_step": 377530, "epoch": 2247} {"train_loss": -11.21176528930664, "global_step": 377531, "epoch": 2247} {"train_loss": -12.224102973937988, "global_step": 377532, "epoch": 2247} {"train_loss": -11.775257110595703, "global_step": 377533, "epoch": 2247} {"train_loss": -11.816553115844727, "global_step": 377534, "epoch": 2247} {"train_loss": -11.35732650756836, "global_step": 377535, "epoch": 2247} {"train_loss": -12.227356910705566, "global_step": 377536, "epoch": 2247} {"train_loss": -11.820924758911133, "global_step": 377537, "epoch": 2247} {"train_loss": -11.528657913208008, "global_step": 377538, "epoch": 2247} {"train_loss": -12.323911666870117, "global_step": 377539, "epoch": 2247} {"train_loss": -11.86581802368164, "global_step": 377540, "epoch": 2247} {"train_loss": -12.058767318725586, "global_step": 377541, "epoch": 2247} {"train_loss": -12.175619125366211, "global_step": 377542, "epoch": 2247} {"train_loss": -11.37939453125, "global_step": 377543, "epoch": 2247} {"train_loss": -9.742091178894043, "global_step": 377544, "epoch": 2247} {"train_loss": -12.118640899658203, "global_step": 377545, "epoch": 2247} {"train_loss": -10.986839294433594, "global_step": 377546, "epoch": 2247} {"train_loss": -11.290901184082031, "global_step": 377547, "epoch": 2247} {"train_loss": -11.929770469665527, "global_step": 377548, "epoch": 2247} {"train_loss": -11.899187088012695, "global_step": 377549, "epoch": 2247} {"train_loss": -11.471861839294434, "global_step": 377550, "epoch": 2247} {"train_loss": -11.479593276977539, "global_step": 377551, "epoch": 2247} {"train_loss": -11.534798622131348, "global_step": 377552, "epoch": 2247} {"train_loss": -10.976480484008789, "global_step": 377553, "epoch": 2247} {"train_loss": -11.874201774597168, "global_step": 377554, "epoch": 2247} {"train_loss": -9.77685832977295, "global_step": 377555, "epoch": 2247} {"train_loss": -12.037729263305664, "global_step": 377556, "epoch": 2247} {"train_loss": -11.069733619689941, "global_step": 377557, "epoch": 2247} {"train_loss": -11.641534805297852, "global_step": 377558, "epoch": 2247} {"train_loss": -9.328063011169434, "global_step": 377559, "epoch": 2247} {"train_loss": -9.809549331665039, "global_step": 377560, "epoch": 2247} {"train_loss": -11.397375106811523, "global_step": 377561, "epoch": 2247} {"train_loss": -9.757322311401367, "global_step": 377562, "epoch": 2247} {"train_loss": -11.289327621459961, "global_step": 377563, "epoch": 2247} {"train_loss": -10.029062271118164, "global_step": 377564, "epoch": 2247} {"train_loss": -10.329916000366211, "global_step": 377565, "epoch": 2247} {"train_loss": -10.58643913269043, "global_step": 377566, "epoch": 2247} {"train_loss": -10.716822624206543, "global_step": 377567, "epoch": 2247} {"train_loss": -10.069989204406738, "global_step": 377568, "epoch": 2247} {"train_loss": -11.168094635009766, "global_step": 377569, "epoch": 2247} {"train_loss": -10.296027183532715, "global_step": 377570, "epoch": 2247} {"train_loss": -11.452327728271484, "global_step": 377571, "epoch": 2247} {"train_loss": -11.152595520019531, "global_step": 377572, "epoch": 2247} {"train_loss": -11.581890106201172, "global_step": 377573, "epoch": 2247} {"train_loss": -10.997522354125977, "global_step": 377574, "epoch": 2247} {"train_loss": -11.506587982177734, "global_step": 377575, "epoch": 2247} {"train_loss": -11.19340705871582, "global_step": 377576, "epoch": 2247} {"train_loss": -11.930150032043457, "global_step": 377577, "epoch": 2247} {"train_loss": -11.241897583007812, "global_step": 377578, "epoch": 2247} {"train_loss": -12.007396697998047, "global_step": 377579, "epoch": 2247} {"train_loss": -11.162607192993164, "global_step": 377580, "epoch": 2247} {"train_loss": -11.992595672607422, "global_step": 377581, "epoch": 2247} {"train_loss": -11.091575622558594, "global_step": 377582, "epoch": 2247} {"train_loss": -11.548978805541992, "global_step": 377583, "epoch": 2247} {"train_loss": -11.401910781860352, "global_step": 377584, "epoch": 2247} {"train_loss": -12.028359413146973, "global_step": 377585, "epoch": 2247} {"train_loss": -11.481744766235352, "global_step": 377586, "epoch": 2247} {"train_loss": -12.080735206604004, "global_step": 377587, "epoch": 2247} {"train_loss": -11.126976013183594, "global_step": 377588, "epoch": 2247} {"train_loss": -12.067874908447266, "global_step": 377589, "epoch": 2247} {"train_loss": -11.715057373046875, "global_step": 377590, "epoch": 2247} {"train_loss": -11.830426216125488, "global_step": 377591, "epoch": 2247} {"train_loss": -12.138578414916992, "global_step": 377592, "epoch": 2247} {"train_loss": -11.875869750976562, "global_step": 377593, "epoch": 2247} {"train_loss": -11.792821884155273, "global_step": 377594, "epoch": 2247} {"train_loss": -12.163393020629883, "global_step": 377595, "epoch": 2247} {"train_loss": -11.74775505065918, "global_step": 377596, "epoch": 2247} {"train_loss": -12.385175704956055, "global_step": 377597, "epoch": 2247} {"train_loss": -11.910511016845703, "global_step": 377598, "epoch": 2247} {"train_loss": -12.017354011535645, "global_step": 377599, "epoch": 2247} {"train_loss": -12.077796936035156, "global_step": 377600, "epoch": 2247} {"train_loss": -12.219230651855469, "global_step": 377601, "epoch": 2247} {"train_loss": -12.469468116760254, "global_step": 377602, "epoch": 2247} {"train_loss": -12.472976684570312, "global_step": 377603, "epoch": 2247} {"train_loss": -12.325063705444336, "global_step": 377604, "epoch": 2247} {"train_loss": -12.486323356628418, "global_step": 377605, "epoch": 2247} {"train_loss": -12.280322074890137, "global_step": 377606, "epoch": 2247} {"train_loss": -12.518970489501953, "global_step": 377607, "epoch": 2247} {"train_loss": -12.217948913574219, "global_step": 377608, "epoch": 2247} {"train_loss": -12.3742036819458, "global_step": 377609, "epoch": 2247} {"train_loss": -12.507476806640625, "global_step": 377610, "epoch": 2247} {"train_loss": -11.961127281188965, "global_step": 377611, "epoch": 2247} {"train_loss": -12.420087814331055, "global_step": 377612, "epoch": 2247} {"train_loss": -12.240848541259766, "global_step": 377613, "epoch": 2247} {"train_loss": -12.32190227508545, "global_step": 377614, "epoch": 2247} {"train_loss": -12.308687210083008, "global_step": 377615, "epoch": 2247} {"train_loss": -12.557974815368652, "global_step": 377616, "epoch": 2247} {"train_loss": -12.448902130126953, "global_step": 377617, "epoch": 2247} {"train_loss": -12.459659576416016, "global_step": 377618, "epoch": 2247} {"train_loss": -12.67207145690918, "global_step": 377619, "epoch": 2247} {"train_loss": -12.494050979614258, "global_step": 377620, "epoch": 2247} {"train_loss": -12.379819869995117, "global_step": 377621, "epoch": 2247} {"train_loss": -12.579551696777344, "global_step": 377622, "epoch": 2247} {"train_loss": -12.548681259155273, "global_step": 377623, "epoch": 2247} {"train_loss": -12.595510482788086, "global_step": 377624, "epoch": 2247} {"train_loss": -12.540435791015625, "global_step": 377625, "epoch": 2247} {"train_loss": -12.420233726501465, "global_step": 377626, "epoch": 2247} {"train_loss": -12.63441276550293, "global_step": 377627, "epoch": 2247} {"train_loss": -12.43179702758789, "global_step": 377628, "epoch": 2247} {"train_loss": -12.517951965332031, "global_step": 377629, "epoch": 2247} {"train_loss": -12.445209503173828, "global_step": 377630, "epoch": 2247} {"train_loss": -12.650365829467773, "global_step": 377631, "epoch": 2247} {"train_loss": -12.536088943481445, "global_step": 377632, "epoch": 2247} {"train_loss": -12.35311508178711, "global_step": 377633, "epoch": 2247} {"train_loss": -12.745345115661621, "global_step": 377634, "epoch": 2247} {"train_loss": -12.507530212402344, "global_step": 377635, "epoch": 2247} {"train_loss": -12.568893432617188, "global_step": 377636, "epoch": 2247} {"train_loss": -12.399064064025879, "global_step": 377637, "epoch": 2247} {"train_loss": -12.276223182678223, "global_step": 377638, "epoch": 2247} {"train_loss": -12.728046417236328, "global_step": 377639, "epoch": 2247} {"train_loss": -12.236831665039062, "global_step": 377640, "epoch": 2247} {"train_loss": -12.245718002319336, "global_step": 377641, "epoch": 2247} {"train_loss": -12.681079864501953, "global_step": 377642, "epoch": 2247} {"train_loss": -12.464271545410156, "global_step": 377643, "epoch": 2247} {"train_loss": -12.375415802001953, "global_step": 377644, "epoch": 2247} {"train_loss": -12.72654914855957, "global_step": 377645, "epoch": 2247} {"train_loss": -11.768352508544922, "global_step": 377646, "epoch": 2247} {"train_loss": -12.930696487426758, "global_step": 377647, "epoch": 2247} {"train_loss": -12.272143363952637, "global_step": 377648, "epoch": 2247} {"train_loss": -12.732393264770508, "global_step": 377649, "epoch": 2247} {"train_loss": -12.3922700881958, "global_step": 377650, "epoch": 2247} {"train_loss": -12.328327178955078, "global_step": 377651, "epoch": 2247} {"train_loss": -12.506223678588867, "global_step": 377652, "epoch": 2247} {"train_loss": -12.447933197021484, "global_step": 377653, "epoch": 2247} {"train_loss": -12.483926773071289, "global_step": 377654, "epoch": 2247} {"train_loss": -12.792713165283203, "global_step": 377655, "epoch": 2247} {"train_loss": -12.461869239807129, "global_step": 377656, "epoch": 2247} {"train_loss": -12.329703330993652, "global_step": 377657, "epoch": 2247} {"train_loss": -12.773218154907227, "global_step": 377658, "epoch": 2247} {"train_loss": -12.610588073730469, "global_step": 377659, "epoch": 2247} {"train_loss": -12.521434783935547, "global_step": 377660, "epoch": 2247} {"train_loss": -12.369744300842285, "global_step": 377661, "epoch": 2247} {"train_loss": -12.68276596069336, "global_step": 377662, "epoch": 2247} {"train_loss": -11.964650443622045, "global_step": 377663, "epoch": 2247, "val_loss": 288216.03125} {"train_loss": -12.44853687286377, "global_step": 377664, "epoch": 2248} {"train_loss": -12.568868637084961, "global_step": 377665, "epoch": 2248} {"train_loss": -11.925662994384766, "global_step": 377666, "epoch": 2248} {"train_loss": -11.954204559326172, "global_step": 377667, "epoch": 2248} {"train_loss": -12.610574722290039, "global_step": 377668, "epoch": 2248} {"train_loss": -12.1500883102417, "global_step": 377669, "epoch": 2248} {"train_loss": -11.709831237792969, "global_step": 377670, "epoch": 2248} {"train_loss": -12.214008331298828, "global_step": 377671, "epoch": 2248} {"train_loss": -11.578455924987793, "global_step": 377672, "epoch": 2248} {"train_loss": -12.238637924194336, "global_step": 377673, "epoch": 2248} {"train_loss": -12.146730422973633, "global_step": 377674, "epoch": 2248} {"train_loss": -12.015901565551758, "global_step": 377675, "epoch": 2248} {"train_loss": -11.13569164276123, "global_step": 377676, "epoch": 2248} {"train_loss": -12.302661895751953, "global_step": 377677, "epoch": 2248} {"train_loss": -11.95037841796875, "global_step": 377678, "epoch": 2248} {"train_loss": -11.100980758666992, "global_step": 377679, "epoch": 2248} {"train_loss": -12.103008270263672, "global_step": 377680, "epoch": 2248} {"train_loss": -12.469969749450684, "global_step": 377681, "epoch": 2248} {"train_loss": -11.94495964050293, "global_step": 377682, "epoch": 2248} {"train_loss": -12.232539176940918, "global_step": 377683, "epoch": 2248} {"train_loss": -11.930153846740723, "global_step": 377684, "epoch": 2248} {"train_loss": -12.220827102661133, "global_step": 377685, "epoch": 2248} {"train_loss": -12.223901748657227, "global_step": 377686, "epoch": 2248} {"train_loss": -12.47160530090332, "global_step": 377687, "epoch": 2248} {"train_loss": -11.670372009277344, "global_step": 377688, "epoch": 2248} {"train_loss": -12.441082000732422, "global_step": 377689, "epoch": 2248} {"train_loss": -11.867579460144043, "global_step": 377690, "epoch": 2248} {"train_loss": -12.10816764831543, "global_step": 377691, "epoch": 2248} {"train_loss": -11.501501083374023, "global_step": 377692, "epoch": 2248} {"train_loss": -11.785272598266602, "global_step": 377693, "epoch": 2248} {"train_loss": -12.108407974243164, "global_step": 377694, "epoch": 2248} {"train_loss": -11.624635696411133, "global_step": 377695, "epoch": 2248} {"train_loss": -12.540315628051758, "global_step": 377696, "epoch": 2248} {"train_loss": -11.723151206970215, "global_step": 377697, "epoch": 2248} {"train_loss": -12.426006317138672, "global_step": 377698, "epoch": 2248} {"train_loss": -11.99074935913086, "global_step": 377699, "epoch": 2248} {"train_loss": -11.956878662109375, "global_step": 377700, "epoch": 2248} {"train_loss": -11.926679611206055, "global_step": 377701, "epoch": 2248} {"train_loss": -12.2796049118042, "global_step": 377702, "epoch": 2248} {"train_loss": -12.178483009338379, "global_step": 377703, "epoch": 2248} {"train_loss": -11.285978317260742, "global_step": 377704, "epoch": 2248} {"train_loss": -12.43336296081543, "global_step": 377705, "epoch": 2248} {"train_loss": -11.719571113586426, "global_step": 377706, "epoch": 2248} {"train_loss": -11.228290557861328, "global_step": 377707, "epoch": 2248} {"train_loss": -12.434776306152344, "global_step": 377708, "epoch": 2248} {"train_loss": -11.779472351074219, "global_step": 377709, "epoch": 2248} {"train_loss": -11.095476150512695, "global_step": 377710, "epoch": 2248} {"train_loss": -11.687174797058105, "global_step": 377711, "epoch": 2248} {"train_loss": -11.270959854125977, "global_step": 377712, "epoch": 2248} {"train_loss": -11.06753921508789, "global_step": 377713, "epoch": 2248} {"train_loss": -11.841896057128906, "global_step": 377714, "epoch": 2248} {"train_loss": -10.356225967407227, "global_step": 377715, "epoch": 2248} {"train_loss": -11.8892240524292, "global_step": 377716, "epoch": 2248} {"train_loss": -11.805021286010742, "global_step": 377717, "epoch": 2248} {"train_loss": -10.68380355834961, "global_step": 377718, "epoch": 2248} {"train_loss": -10.934701919555664, "global_step": 377719, "epoch": 2248} {"train_loss": -11.435811996459961, "global_step": 377720, "epoch": 2248} {"train_loss": -10.23125171661377, "global_step": 377721, "epoch": 2248} {"train_loss": -11.74376392364502, "global_step": 377722, "epoch": 2248} {"train_loss": -11.702856063842773, "global_step": 377723, "epoch": 2248} {"train_loss": -11.555587768554688, "global_step": 377724, "epoch": 2248} {"train_loss": -12.307882308959961, "global_step": 377725, "epoch": 2248} {"train_loss": -11.616154670715332, "global_step": 377726, "epoch": 2248} {"train_loss": -11.727678298950195, "global_step": 377727, "epoch": 2248} {"train_loss": -11.616362571716309, "global_step": 377728, "epoch": 2248} {"train_loss": -12.083700180053711, "global_step": 377729, "epoch": 2248} {"train_loss": -12.017656326293945, "global_step": 377730, "epoch": 2248} {"train_loss": -11.224064826965332, "global_step": 377731, "epoch": 2248} {"train_loss": -12.20715045928955, "global_step": 377732, "epoch": 2248} {"train_loss": -11.910808563232422, "global_step": 377733, "epoch": 2248} {"train_loss": -11.995229721069336, "global_step": 377734, "epoch": 2248} {"train_loss": -12.09257698059082, "global_step": 377735, "epoch": 2248} {"train_loss": -12.027231216430664, "global_step": 377736, "epoch": 2248} {"train_loss": -11.992441177368164, "global_step": 377737, "epoch": 2248} {"train_loss": -12.11053466796875, "global_step": 377738, "epoch": 2248} {"train_loss": -12.341785430908203, "global_step": 377739, "epoch": 2248} {"train_loss": -12.182784080505371, "global_step": 377740, "epoch": 2248} {"train_loss": -12.51271915435791, "global_step": 377741, "epoch": 2248} {"train_loss": -12.432621002197266, "global_step": 377742, "epoch": 2248} {"train_loss": -12.390490531921387, "global_step": 377743, "epoch": 2248} {"train_loss": -11.848678588867188, "global_step": 377744, "epoch": 2248} {"train_loss": -12.464704513549805, "global_step": 377745, "epoch": 2248} {"train_loss": -12.213465690612793, "global_step": 377746, "epoch": 2248} {"train_loss": -12.543148040771484, "global_step": 377747, "epoch": 2248} {"train_loss": -12.258934020996094, "global_step": 377748, "epoch": 2248} {"train_loss": -12.479095458984375, "global_step": 377749, "epoch": 2248} {"train_loss": -12.468182563781738, "global_step": 377750, "epoch": 2248} {"train_loss": -12.066092491149902, "global_step": 377751, "epoch": 2248} {"train_loss": -12.25008773803711, "global_step": 377752, "epoch": 2248} {"train_loss": -12.39148235321045, "global_step": 377753, "epoch": 2248} {"train_loss": -12.431224822998047, "global_step": 377754, "epoch": 2248} {"train_loss": -12.339118003845215, "global_step": 377755, "epoch": 2248} {"train_loss": -12.301887512207031, "global_step": 377756, "epoch": 2248} {"train_loss": -12.459379196166992, "global_step": 377757, "epoch": 2248} {"train_loss": -12.293983459472656, "global_step": 377758, "epoch": 2248} {"train_loss": -12.146631240844727, "global_step": 377759, "epoch": 2248} {"train_loss": -12.26791763305664, "global_step": 377760, "epoch": 2248} {"train_loss": -12.401987075805664, "global_step": 377761, "epoch": 2248} {"train_loss": -12.275945663452148, "global_step": 377762, "epoch": 2248} {"train_loss": -12.508481979370117, "global_step": 377763, "epoch": 2248} {"train_loss": -12.071364402770996, "global_step": 377764, "epoch": 2248} {"train_loss": -12.620328903198242, "global_step": 377765, "epoch": 2248} {"train_loss": -12.513483047485352, "global_step": 377766, "epoch": 2248} {"train_loss": -12.068937301635742, "global_step": 377767, "epoch": 2248} {"train_loss": -12.04738998413086, "global_step": 377768, "epoch": 2248} {"train_loss": -12.637994766235352, "global_step": 377769, "epoch": 2248} {"train_loss": -12.131898880004883, "global_step": 377770, "epoch": 2248} {"train_loss": -12.48410701751709, "global_step": 377771, "epoch": 2248} {"train_loss": -12.144234657287598, "global_step": 377772, "epoch": 2248} {"train_loss": -11.801185607910156, "global_step": 377773, "epoch": 2248} {"train_loss": -12.082275390625, "global_step": 377774, "epoch": 2248} {"train_loss": -12.534910202026367, "global_step": 377775, "epoch": 2248} {"train_loss": -11.899827003479004, "global_step": 377776, "epoch": 2248} {"train_loss": -11.64421558380127, "global_step": 377777, "epoch": 2248} {"train_loss": -12.10339641571045, "global_step": 377778, "epoch": 2248} {"train_loss": -11.324614524841309, "global_step": 377779, "epoch": 2248} {"train_loss": -11.834678649902344, "global_step": 377780, "epoch": 2248} {"train_loss": -12.264202117919922, "global_step": 377781, "epoch": 2248} {"train_loss": -11.635339736938477, "global_step": 377782, "epoch": 2248} {"train_loss": -12.461481094360352, "global_step": 377783, "epoch": 2248} {"train_loss": -11.514810562133789, "global_step": 377784, "epoch": 2248} {"train_loss": -12.732353210449219, "global_step": 377785, "epoch": 2248} {"train_loss": -11.615707397460938, "global_step": 377786, "epoch": 2248} {"train_loss": -12.528688430786133, "global_step": 377787, "epoch": 2248} {"train_loss": -11.912731170654297, "global_step": 377788, "epoch": 2248} {"train_loss": -12.438467979431152, "global_step": 377789, "epoch": 2248} {"train_loss": -12.272254943847656, "global_step": 377790, "epoch": 2248} {"train_loss": -12.234487533569336, "global_step": 377791, "epoch": 2248} {"train_loss": -12.211740493774414, "global_step": 377792, "epoch": 2248} {"train_loss": -12.194672584533691, "global_step": 377793, "epoch": 2248} {"train_loss": -11.946210861206055, "global_step": 377794, "epoch": 2248} {"train_loss": -12.290586471557617, "global_step": 377795, "epoch": 2248} {"train_loss": -12.06789493560791, "global_step": 377796, "epoch": 2248} {"train_loss": -12.381041526794434, "global_step": 377797, "epoch": 2248} {"train_loss": -12.501644134521484, "global_step": 377798, "epoch": 2248} {"train_loss": -12.027236938476562, "global_step": 377799, "epoch": 2248} {"train_loss": -11.89371109008789, "global_step": 377800, "epoch": 2248} {"train_loss": -12.204153060913086, "global_step": 377801, "epoch": 2248} {"train_loss": -11.810829162597656, "global_step": 377802, "epoch": 2248} {"train_loss": -10.603842735290527, "global_step": 377803, "epoch": 2248} {"train_loss": -11.53870964050293, "global_step": 377804, "epoch": 2248} {"train_loss": -11.760364532470703, "global_step": 377805, "epoch": 2248} {"train_loss": -9.486042976379395, "global_step": 377806, "epoch": 2248} {"train_loss": -10.688858985900879, "global_step": 377807, "epoch": 2248} {"train_loss": -11.01037883758545, "global_step": 377808, "epoch": 2248} {"train_loss": -10.901895523071289, "global_step": 377809, "epoch": 2248} {"train_loss": -11.421998977661133, "global_step": 377810, "epoch": 2248} {"train_loss": -11.337218284606934, "global_step": 377811, "epoch": 2248} {"train_loss": -11.921113014221191, "global_step": 377812, "epoch": 2248} {"train_loss": -11.786179542541504, "global_step": 377813, "epoch": 2248} {"train_loss": -11.403156280517578, "global_step": 377814, "epoch": 2248} {"train_loss": -11.893428802490234, "global_step": 377815, "epoch": 2248} {"train_loss": -10.526532173156738, "global_step": 377816, "epoch": 2248} {"train_loss": -12.230915069580078, "global_step": 377817, "epoch": 2248} {"train_loss": -10.664712905883789, "global_step": 377818, "epoch": 2248} {"train_loss": -11.631531715393066, "global_step": 377819, "epoch": 2248} {"train_loss": -10.909967422485352, "global_step": 377820, "epoch": 2248} {"train_loss": -11.241338729858398, "global_step": 377821, "epoch": 2248} {"train_loss": -10.804842948913574, "global_step": 377822, "epoch": 2248} {"train_loss": -10.989880561828613, "global_step": 377823, "epoch": 2248} {"train_loss": -11.660947799682617, "global_step": 377824, "epoch": 2248} {"train_loss": -10.75208854675293, "global_step": 377825, "epoch": 2248} {"train_loss": -11.63203239440918, "global_step": 377826, "epoch": 2248} {"train_loss": -11.199833869934082, "global_step": 377827, "epoch": 2248} {"train_loss": -11.223431587219238, "global_step": 377828, "epoch": 2248} {"train_loss": -11.127899169921875, "global_step": 377829, "epoch": 2248} {"train_loss": -11.421911239624023, "global_step": 377830, "epoch": 2248} {"train_loss": -11.875209042004176, "global_step": 377831, "epoch": 2248, "val_loss": 294097.8125} {"train_loss": -11.811508178710938, "global_step": 377832, "epoch": 2249} {"train_loss": -11.674437522888184, "global_step": 377833, "epoch": 2249} {"train_loss": -11.564197540283203, "global_step": 377834, "epoch": 2249} {"train_loss": -11.86397933959961, "global_step": 377835, "epoch": 2249} {"train_loss": -11.161214828491211, "global_step": 377836, "epoch": 2249} {"train_loss": -12.0382719039917, "global_step": 377837, "epoch": 2249} {"train_loss": -11.714994430541992, "global_step": 377838, "epoch": 2249} {"train_loss": -12.251750946044922, "global_step": 377839, "epoch": 2249} {"train_loss": -11.825368881225586, "global_step": 377840, "epoch": 2249} {"train_loss": -11.849454879760742, "global_step": 377841, "epoch": 2249} {"train_loss": -12.08935546875, "global_step": 377842, "epoch": 2249} {"train_loss": -11.559554100036621, "global_step": 377843, "epoch": 2249} {"train_loss": -12.230375289916992, "global_step": 377844, "epoch": 2249} {"train_loss": -11.86629867553711, "global_step": 377845, "epoch": 2249} {"train_loss": -12.179941177368164, "global_step": 377846, "epoch": 2249} {"train_loss": -12.227514266967773, "global_step": 377847, "epoch": 2249} {"train_loss": -12.050636291503906, "global_step": 377848, "epoch": 2249} {"train_loss": -12.209566116333008, "global_step": 377849, "epoch": 2249} {"train_loss": -12.069735527038574, "global_step": 377850, "epoch": 2249} {"train_loss": -12.37839412689209, "global_step": 377851, "epoch": 2249} {"train_loss": -11.879068374633789, "global_step": 377852, "epoch": 2249} {"train_loss": -11.923725128173828, "global_step": 377853, "epoch": 2249} {"train_loss": -11.750940322875977, "global_step": 377854, "epoch": 2249} {"train_loss": -12.11673355102539, "global_step": 377855, "epoch": 2249} {"train_loss": -11.730401992797852, "global_step": 377856, "epoch": 2249} {"train_loss": -12.17539119720459, "global_step": 377857, "epoch": 2249} {"train_loss": -11.784402847290039, "global_step": 377858, "epoch": 2249} {"train_loss": -12.0611572265625, "global_step": 377859, "epoch": 2249} {"train_loss": -11.657979011535645, "global_step": 377860, "epoch": 2249} {"train_loss": -12.100688934326172, "global_step": 377861, "epoch": 2249} {"train_loss": -11.524786949157715, "global_step": 377862, "epoch": 2249} {"train_loss": -12.0536527633667, "global_step": 377863, "epoch": 2249} {"train_loss": -11.996745109558105, "global_step": 377864, "epoch": 2249} {"train_loss": -11.50914192199707, "global_step": 377865, "epoch": 2249} {"train_loss": -12.271085739135742, "global_step": 377866, "epoch": 2249} {"train_loss": -11.823436737060547, "global_step": 377867, "epoch": 2249} {"train_loss": -12.336088180541992, "global_step": 377868, "epoch": 2249} {"train_loss": -12.163614273071289, "global_step": 377869, "epoch": 2249} {"train_loss": -12.191848754882812, "global_step": 377870, "epoch": 2249} {"train_loss": -12.453701972961426, "global_step": 377871, "epoch": 2249} {"train_loss": -12.237152099609375, "global_step": 377872, "epoch": 2249} {"train_loss": -12.494221687316895, "global_step": 377873, "epoch": 2249} {"train_loss": -12.146810531616211, "global_step": 377874, "epoch": 2249} {"train_loss": -12.32368278503418, "global_step": 377875, "epoch": 2249} {"train_loss": -12.58685302734375, "global_step": 377876, "epoch": 2249} {"train_loss": -12.288084030151367, "global_step": 377877, "epoch": 2249} {"train_loss": -12.420909881591797, "global_step": 377878, "epoch": 2249} {"train_loss": -12.41390323638916, "global_step": 377879, "epoch": 2249} {"train_loss": -12.323873519897461, "global_step": 377880, "epoch": 2249} {"train_loss": -12.44820499420166, "global_step": 377881, "epoch": 2249} {"train_loss": -12.599567413330078, "global_step": 377882, "epoch": 2249} {"train_loss": -12.402085304260254, "global_step": 377883, "epoch": 2249} {"train_loss": -12.535045623779297, "global_step": 377884, "epoch": 2249} {"train_loss": -12.38759708404541, "global_step": 377885, "epoch": 2249} {"train_loss": -12.597589492797852, "global_step": 377886, "epoch": 2249} {"train_loss": -12.377766609191895, "global_step": 377887, "epoch": 2249} {"train_loss": -12.720869064331055, "global_step": 377888, "epoch": 2249} {"train_loss": -12.2442626953125, "global_step": 377889, "epoch": 2249} {"train_loss": -12.631832122802734, "global_step": 377890, "epoch": 2249} {"train_loss": -12.613090515136719, "global_step": 377891, "epoch": 2249} {"train_loss": -12.444329261779785, "global_step": 377892, "epoch": 2249} {"train_loss": -12.542423248291016, "global_step": 377893, "epoch": 2249} {"train_loss": -12.552847862243652, "global_step": 377894, "epoch": 2249} {"train_loss": -12.613138198852539, "global_step": 377895, "epoch": 2249} {"train_loss": -12.331460952758789, "global_step": 377896, "epoch": 2249} {"train_loss": -12.403982162475586, "global_step": 377897, "epoch": 2249} {"train_loss": -12.257766723632812, "global_step": 377898, "epoch": 2249} {"train_loss": -11.946329116821289, "global_step": 377899, "epoch": 2249} {"train_loss": -12.31859302520752, "global_step": 377900, "epoch": 2249} {"train_loss": -11.780355453491211, "global_step": 377901, "epoch": 2249} {"train_loss": -12.338231086730957, "global_step": 377902, "epoch": 2249} {"train_loss": -11.991767883300781, "global_step": 377903, "epoch": 2249} {"train_loss": -12.063735961914062, "global_step": 377904, "epoch": 2249} {"train_loss": -10.813615798950195, "global_step": 377905, "epoch": 2249} {"train_loss": -11.8865385055542, "global_step": 377906, "epoch": 2249} {"train_loss": -11.742969512939453, "global_step": 377907, "epoch": 2249} {"train_loss": -11.275510787963867, "global_step": 377908, "epoch": 2249} {"train_loss": -11.465387344360352, "global_step": 377909, "epoch": 2249} {"train_loss": -11.89801025390625, "global_step": 377910, "epoch": 2249} {"train_loss": -10.682271003723145, "global_step": 377911, "epoch": 2249} {"train_loss": -11.492631912231445, "global_step": 377912, "epoch": 2249} {"train_loss": -11.717971801757812, "global_step": 377913, "epoch": 2249} {"train_loss": -10.929943084716797, "global_step": 377914, "epoch": 2249} {"train_loss": -11.387594223022461, "global_step": 377915, "epoch": 2249} {"train_loss": -10.993471145629883, "global_step": 377916, "epoch": 2249} {"train_loss": -11.588506698608398, "global_step": 377917, "epoch": 2249} {"train_loss": -10.82040023803711, "global_step": 377918, "epoch": 2249} {"train_loss": -11.314970016479492, "global_step": 377919, "epoch": 2249} {"train_loss": -11.818697929382324, "global_step": 377920, "epoch": 2249} {"train_loss": -11.187030792236328, "global_step": 377921, "epoch": 2249} {"train_loss": -11.463932037353516, "global_step": 377922, "epoch": 2249} {"train_loss": -11.968881607055664, "global_step": 377923, "epoch": 2249} {"train_loss": -11.498516082763672, "global_step": 377924, "epoch": 2249} {"train_loss": -12.004338264465332, "global_step": 377925, "epoch": 2249} {"train_loss": -11.795928955078125, "global_step": 377926, "epoch": 2249} {"train_loss": -10.802366256713867, "global_step": 377927, "epoch": 2249} {"train_loss": -11.820701599121094, "global_step": 377928, "epoch": 2249} {"train_loss": -11.281280517578125, "global_step": 377929, "epoch": 2249} {"train_loss": -11.325733184814453, "global_step": 377930, "epoch": 2249} {"train_loss": -11.716679573059082, "global_step": 377931, "epoch": 2249} {"train_loss": -11.34854507446289, "global_step": 377932, "epoch": 2249} {"train_loss": -12.209587097167969, "global_step": 377933, "epoch": 2249} {"train_loss": -11.369989395141602, "global_step": 377934, "epoch": 2249} {"train_loss": -11.93834114074707, "global_step": 377935, "epoch": 2249} {"train_loss": -11.622536659240723, "global_step": 377936, "epoch": 2249} {"train_loss": -12.015913963317871, "global_step": 377937, "epoch": 2249} {"train_loss": -11.633686065673828, "global_step": 377938, "epoch": 2249} {"train_loss": -12.128989219665527, "global_step": 377939, "epoch": 2249} {"train_loss": -11.747817993164062, "global_step": 377940, "epoch": 2249} {"train_loss": -12.134790420532227, "global_step": 377941, "epoch": 2249} {"train_loss": -11.712003707885742, "global_step": 377942, "epoch": 2249} {"train_loss": -12.273628234863281, "global_step": 377943, "epoch": 2249} {"train_loss": -12.197985649108887, "global_step": 377944, "epoch": 2249} {"train_loss": -12.03428840637207, "global_step": 377945, "epoch": 2249} {"train_loss": -11.850571632385254, "global_step": 377946, "epoch": 2249} {"train_loss": -11.999856948852539, "global_step": 377947, "epoch": 2249} {"train_loss": -12.171457290649414, "global_step": 377948, "epoch": 2249} {"train_loss": -12.158921241760254, "global_step": 377949, "epoch": 2249} {"train_loss": -12.228486061096191, "global_step": 377950, "epoch": 2249} {"train_loss": -12.211088180541992, "global_step": 377951, "epoch": 2249} {"train_loss": -12.135153770446777, "global_step": 377952, "epoch": 2249} {"train_loss": -12.290358543395996, "global_step": 377953, "epoch": 2249} {"train_loss": -12.057426452636719, "global_step": 377954, "epoch": 2249} {"train_loss": -12.342103004455566, "global_step": 377955, "epoch": 2249} {"train_loss": -11.714345932006836, "global_step": 377956, "epoch": 2249} {"train_loss": -12.171162605285645, "global_step": 377957, "epoch": 2249} {"train_loss": -11.879966735839844, "global_step": 377958, "epoch": 2249} {"train_loss": -12.516571044921875, "global_step": 377959, "epoch": 2249} {"train_loss": -11.685937881469727, "global_step": 377960, "epoch": 2249} {"train_loss": -12.336007118225098, "global_step": 377961, "epoch": 2249} {"train_loss": -12.172464370727539, "global_step": 377962, "epoch": 2249} {"train_loss": -12.059752464294434, "global_step": 377963, "epoch": 2249} {"train_loss": -12.501893997192383, "global_step": 377964, "epoch": 2249} {"train_loss": -12.19076919555664, "global_step": 377965, "epoch": 2249} {"train_loss": -12.488866806030273, "global_step": 377966, "epoch": 2249} {"train_loss": -12.65658187866211, "global_step": 377967, "epoch": 2249} {"train_loss": -12.38884162902832, "global_step": 377968, "epoch": 2249} {"train_loss": -12.33035659790039, "global_step": 377969, "epoch": 2249} {"train_loss": -12.65764045715332, "global_step": 377970, "epoch": 2249} {"train_loss": -12.36761474609375, "global_step": 377971, "epoch": 2249} {"train_loss": -12.496162414550781, "global_step": 377972, "epoch": 2249} {"train_loss": -12.394622802734375, "global_step": 377973, "epoch": 2249} {"train_loss": -12.644857406616211, "global_step": 377974, "epoch": 2249} {"train_loss": -12.456520080566406, "global_step": 377975, "epoch": 2249} {"train_loss": -12.686775207519531, "global_step": 377976, "epoch": 2249} {"train_loss": -12.472759246826172, "global_step": 377977, "epoch": 2249} {"train_loss": -12.574203491210938, "global_step": 377978, "epoch": 2249} {"train_loss": -12.737689971923828, "global_step": 377979, "epoch": 2249} {"train_loss": -12.306808471679688, "global_step": 377980, "epoch": 2249} {"train_loss": -12.653484344482422, "global_step": 377981, "epoch": 2249} {"train_loss": -12.346003532409668, "global_step": 377982, "epoch": 2249} {"train_loss": -12.187384605407715, "global_step": 377983, "epoch": 2249} {"train_loss": -12.58212661743164, "global_step": 377984, "epoch": 2249} {"train_loss": -12.423942565917969, "global_step": 377985, "epoch": 2249} {"train_loss": -12.872438430786133, "global_step": 377986, "epoch": 2249} {"train_loss": -12.527201652526855, "global_step": 377987, "epoch": 2249} {"train_loss": -12.478781700134277, "global_step": 377988, "epoch": 2249} {"train_loss": -12.45765209197998, "global_step": 377989, "epoch": 2249} {"train_loss": -12.45938491821289, "global_step": 377990, "epoch": 2249} {"train_loss": -12.733110427856445, "global_step": 377991, "epoch": 2249} {"train_loss": -12.75261116027832, "global_step": 377992, "epoch": 2249} {"train_loss": -12.586177825927734, "global_step": 377993, "epoch": 2249} {"train_loss": -12.519170761108398, "global_step": 377994, "epoch": 2249} {"train_loss": -12.376734733581543, "global_step": 377995, "epoch": 2249} {"train_loss": -12.617607116699219, "global_step": 377996, "epoch": 2249} {"train_loss": -12.656598091125488, "global_step": 377997, "epoch": 2249} {"train_loss": -12.838582992553711, "global_step": 377998, "epoch": 2249} {"train_loss": -12.086035654658364, "global_step": 377999, "epoch": 2249, "val_loss": 293300.84375} {"train_loss": -12.51561164855957, "global_step": 378000, "epoch": 2250} {"train_loss": -12.248947143554688, "global_step": 378001, "epoch": 2250} {"train_loss": -12.595483779907227, "global_step": 378002, "epoch": 2250} {"train_loss": -12.355974197387695, "global_step": 378003, "epoch": 2250} {"train_loss": -12.212072372436523, "global_step": 378004, "epoch": 2250} {"train_loss": -12.133956909179688, "global_step": 378005, "epoch": 2250} {"train_loss": -12.136180877685547, "global_step": 378006, "epoch": 2250} {"train_loss": -12.072942733764648, "global_step": 378007, "epoch": 2250} {"train_loss": -12.40811824798584, "global_step": 378008, "epoch": 2250} {"train_loss": -12.23437786102295, "global_step": 378009, "epoch": 2250} {"train_loss": -12.55548095703125, "global_step": 378010, "epoch": 2250} {"train_loss": -12.67835807800293, "global_step": 378011, "epoch": 2250} {"train_loss": -12.55047607421875, "global_step": 378012, "epoch": 2250} {"train_loss": -12.137163162231445, "global_step": 378013, "epoch": 2250} {"train_loss": -12.513816833496094, "global_step": 378014, "epoch": 2250} {"train_loss": -12.385512351989746, "global_step": 378015, "epoch": 2250} {"train_loss": -12.445882797241211, "global_step": 378016, "epoch": 2250} {"train_loss": -12.673561096191406, "global_step": 378017, "epoch": 2250} {"train_loss": -12.31922721862793, "global_step": 378018, "epoch": 2250} {"train_loss": -12.101375579833984, "global_step": 378019, "epoch": 2250} {"train_loss": -11.193673133850098, "global_step": 378020, "epoch": 2250} {"train_loss": -12.592342376708984, "global_step": 378021, "epoch": 2250} {"train_loss": -10.963262557983398, "global_step": 378022, "epoch": 2250} {"train_loss": -11.009510040283203, "global_step": 378023, "epoch": 2250} {"train_loss": -11.98316478729248, "global_step": 378024, "epoch": 2250} {"train_loss": -12.08830738067627, "global_step": 378025, "epoch": 2250} {"train_loss": -11.001581192016602, "global_step": 378026, "epoch": 2250} {"train_loss": -11.844442367553711, "global_step": 378027, "epoch": 2250} {"train_loss": -11.594566345214844, "global_step": 378028, "epoch": 2250} {"train_loss": -11.397603988647461, "global_step": 378029, "epoch": 2250} {"train_loss": -12.405340194702148, "global_step": 378030, "epoch": 2250} {"train_loss": -10.675941467285156, "global_step": 378031, "epoch": 2250} {"train_loss": -11.939913749694824, "global_step": 378032, "epoch": 2250} {"train_loss": -11.284482955932617, "global_step": 378033, "epoch": 2250} {"train_loss": -11.967575073242188, "global_step": 378034, "epoch": 2250} {"train_loss": -10.466489791870117, "global_step": 378035, "epoch": 2250} {"train_loss": -11.15374755859375, "global_step": 378036, "epoch": 2250} {"train_loss": -7.871211051940918, "global_step": 378037, "epoch": 2250} {"train_loss": -6.771551132202148, "global_step": 378038, "epoch": 2250} {"train_loss": -7.425868034362793, "global_step": 378039, "epoch": 2250} {"train_loss": -6.504889011383057, "global_step": 378040, "epoch": 2250} {"train_loss": -5.860823631286621, "global_step": 378041, "epoch": 2250} {"train_loss": -6.699676036834717, "global_step": 378042, "epoch": 2250} {"train_loss": -6.8406829833984375, "global_step": 378043, "epoch": 2250} {"train_loss": -7.37200927734375, "global_step": 378044, "epoch": 2250} {"train_loss": -7.410009384155273, "global_step": 378045, "epoch": 2250} {"train_loss": -7.7443084716796875, "global_step": 378046, "epoch": 2250} {"train_loss": -9.470491409301758, "global_step": 378047, "epoch": 2250} {"train_loss": -7.964832782745361, "global_step": 378048, "epoch": 2250} {"train_loss": -8.169792175292969, "global_step": 378049, "epoch": 2250} {"train_loss": -8.54437255859375, "global_step": 378050, "epoch": 2250} {"train_loss": -7.904447078704834, "global_step": 378051, "epoch": 2250} {"train_loss": -8.484877586364746, "global_step": 378052, "epoch": 2250} {"train_loss": -8.736225128173828, "global_step": 378053, "epoch": 2250} {"train_loss": -8.684480667114258, "global_step": 378054, "epoch": 2250} {"train_loss": -8.952507972717285, "global_step": 378055, "epoch": 2250} {"train_loss": -10.256531715393066, "global_step": 378056, "epoch": 2250} {"train_loss": -8.98805046081543, "global_step": 378057, "epoch": 2250} {"train_loss": -9.686848640441895, "global_step": 378058, "epoch": 2250} {"train_loss": -9.749622344970703, "global_step": 378059, "epoch": 2250} {"train_loss": -9.798120498657227, "global_step": 378060, "epoch": 2250} {"train_loss": -10.568609237670898, "global_step": 378061, "epoch": 2250} {"train_loss": -10.360445022583008, "global_step": 378062, "epoch": 2250} {"train_loss": -10.393362045288086, "global_step": 378063, "epoch": 2250} {"train_loss": -10.597515106201172, "global_step": 378064, "epoch": 2250} {"train_loss": -10.926717758178711, "global_step": 378065, "epoch": 2250} {"train_loss": -10.720745086669922, "global_step": 378066, "epoch": 2250} {"train_loss": -11.182929039001465, "global_step": 378067, "epoch": 2250} {"train_loss": -10.61711311340332, "global_step": 378068, "epoch": 2250} {"train_loss": -11.815969467163086, "global_step": 378069, "epoch": 2250} {"train_loss": -11.290006637573242, "global_step": 378070, "epoch": 2250} {"train_loss": -11.582484245300293, "global_step": 378071, "epoch": 2250} {"train_loss": -11.954032897949219, "global_step": 378072, "epoch": 2250} {"train_loss": -11.121145248413086, "global_step": 378073, "epoch": 2250} {"train_loss": -11.46670150756836, "global_step": 378074, "epoch": 2250} {"train_loss": -11.664278030395508, "global_step": 378075, "epoch": 2250} {"train_loss": -11.97091293334961, "global_step": 378076, "epoch": 2250} {"train_loss": -11.819802284240723, "global_step": 378077, "epoch": 2250} {"train_loss": -11.451408386230469, "global_step": 378078, "epoch": 2250} {"train_loss": -11.650371551513672, "global_step": 378079, "epoch": 2250} {"train_loss": -11.677667617797852, "global_step": 378080, "epoch": 2250} {"train_loss": -11.33023452758789, "global_step": 378081, "epoch": 2250} {"train_loss": -11.42082691192627, "global_step": 378082, "epoch": 2250} {"train_loss": -11.5172119140625, "global_step": 378083, "epoch": 2250} {"train_loss": -11.86816120147705, "global_step": 378084, "epoch": 2250} {"train_loss": -12.166993141174316, "global_step": 378085, "epoch": 2250} {"train_loss": -11.918811798095703, "global_step": 378086, "epoch": 2250} {"train_loss": -12.021848678588867, "global_step": 378087, "epoch": 2250} {"train_loss": -12.117179870605469, "global_step": 378088, "epoch": 2250} {"train_loss": -12.299345016479492, "global_step": 378089, "epoch": 2250} {"train_loss": -12.151008605957031, "global_step": 378090, "epoch": 2250} {"train_loss": -12.179131507873535, "global_step": 378091, "epoch": 2250} {"train_loss": -12.430746078491211, "global_step": 378092, "epoch": 2250} {"train_loss": -12.11252212524414, "global_step": 378093, "epoch": 2250} {"train_loss": -12.013090133666992, "global_step": 378094, "epoch": 2250} {"train_loss": -12.257915496826172, "global_step": 378095, "epoch": 2250} {"train_loss": -12.268001556396484, "global_step": 378096, "epoch": 2250} {"train_loss": -12.118534088134766, "global_step": 378097, "epoch": 2250} {"train_loss": -12.29511833190918, "global_step": 378098, "epoch": 2250} {"train_loss": -12.319263458251953, "global_step": 378099, "epoch": 2250} {"train_loss": -12.33039665222168, "global_step": 378100, "epoch": 2250} {"train_loss": -12.368955612182617, "global_step": 378101, "epoch": 2250} {"train_loss": -12.31680679321289, "global_step": 378102, "epoch": 2250} {"train_loss": -12.374959945678711, "global_step": 378103, "epoch": 2250} {"train_loss": -12.497922897338867, "global_step": 378104, "epoch": 2250} {"train_loss": -12.43204402923584, "global_step": 378105, "epoch": 2250} {"train_loss": -12.480301856994629, "global_step": 378106, "epoch": 2250} {"train_loss": -12.346626281738281, "global_step": 378107, "epoch": 2250} {"train_loss": -12.254483222961426, "global_step": 378108, "epoch": 2250} {"train_loss": -12.361189842224121, "global_step": 378109, "epoch": 2250} {"train_loss": -12.663399696350098, "global_step": 378110, "epoch": 2250} {"train_loss": -12.210372924804688, "global_step": 378111, "epoch": 2250} {"train_loss": -12.5070161819458, "global_step": 378112, "epoch": 2250} {"train_loss": -12.495393753051758, "global_step": 378113, "epoch": 2250} {"train_loss": -12.320433616638184, "global_step": 378114, "epoch": 2250} {"train_loss": -12.208869934082031, "global_step": 378115, "epoch": 2250} {"train_loss": -12.434911727905273, "global_step": 378116, "epoch": 2250} {"train_loss": -12.357701301574707, "global_step": 378117, "epoch": 2250} {"train_loss": -12.527755737304688, "global_step": 378118, "epoch": 2250} {"train_loss": -12.534000396728516, "global_step": 378119, "epoch": 2250} {"train_loss": -12.711009979248047, "global_step": 378120, "epoch": 2250} {"train_loss": -12.46207046508789, "global_step": 378121, "epoch": 2250} {"train_loss": -12.487531661987305, "global_step": 378122, "epoch": 2250} {"train_loss": -12.47458267211914, "global_step": 378123, "epoch": 2250} {"train_loss": -12.739217758178711, "global_step": 378124, "epoch": 2250} {"train_loss": -12.48504638671875, "global_step": 378125, "epoch": 2250} {"train_loss": -12.733716011047363, "global_step": 378126, "epoch": 2250} {"train_loss": -12.675466537475586, "global_step": 378127, "epoch": 2250} {"train_loss": -12.411376953125, "global_step": 378128, "epoch": 2250} {"train_loss": -12.685511589050293, "global_step": 378129, "epoch": 2250} {"train_loss": -12.45344066619873, "global_step": 378130, "epoch": 2250} {"train_loss": -12.478840827941895, "global_step": 378131, "epoch": 2250} {"train_loss": -12.494441986083984, "global_step": 378132, "epoch": 2250} {"train_loss": -12.523951530456543, "global_step": 378133, "epoch": 2250} {"train_loss": -12.611772537231445, "global_step": 378134, "epoch": 2250} {"train_loss": -12.589340209960938, "global_step": 378135, "epoch": 2250} {"train_loss": -12.506884574890137, "global_step": 378136, "epoch": 2250} {"train_loss": -12.589347839355469, "global_step": 378137, "epoch": 2250} {"train_loss": -12.721500396728516, "global_step": 378138, "epoch": 2250} {"train_loss": -12.584264755249023, "global_step": 378139, "epoch": 2250} {"train_loss": -12.44709300994873, "global_step": 378140, "epoch": 2250} {"train_loss": -12.768302917480469, "global_step": 378141, "epoch": 2250} {"train_loss": -12.361023902893066, "global_step": 378142, "epoch": 2250} {"train_loss": -12.744590759277344, "global_step": 378143, "epoch": 2250} {"train_loss": -12.052921295166016, "global_step": 378144, "epoch": 2250} {"train_loss": -12.504079818725586, "global_step": 378145, "epoch": 2250} {"train_loss": -12.356968879699707, "global_step": 378146, "epoch": 2250} {"train_loss": -12.25082778930664, "global_step": 378147, "epoch": 2250} {"train_loss": -12.550334930419922, "global_step": 378148, "epoch": 2250} {"train_loss": -12.297719955444336, "global_step": 378149, "epoch": 2250} {"train_loss": -12.289597511291504, "global_step": 378150, "epoch": 2250} {"train_loss": -12.745950698852539, "global_step": 378151, "epoch": 2250} {"train_loss": -12.428739547729492, "global_step": 378152, "epoch": 2250} {"train_loss": -12.253311157226562, "global_step": 378153, "epoch": 2250} {"train_loss": -12.570144653320312, "global_step": 378154, "epoch": 2250} {"train_loss": -12.203744888305664, "global_step": 378155, "epoch": 2250} {"train_loss": -11.93820571899414, "global_step": 378156, "epoch": 2250} {"train_loss": -12.351143836975098, "global_step": 378157, "epoch": 2250} {"train_loss": -12.10006332397461, "global_step": 378158, "epoch": 2250} {"train_loss": -12.308364868164062, "global_step": 378159, "epoch": 2250} {"train_loss": -12.256612777709961, "global_step": 378160, "epoch": 2250} {"train_loss": -12.45834732055664, "global_step": 378161, "epoch": 2250} {"train_loss": -12.52145767211914, "global_step": 378162, "epoch": 2250} {"train_loss": -12.787813186645508, "global_step": 378163, "epoch": 2250} {"train_loss": -12.206021308898926, "global_step": 378164, "epoch": 2250} {"train_loss": -12.532901763916016, "global_step": 378165, "epoch": 2250} {"train_loss": -12.502235412597656, "global_step": 378166, "epoch": 2250} {"train_loss": -11.540957848230997, "global_step": 378167, "epoch": 2250, "train/sim_max_reward_0": 0.6638225781054705, "train/sim_max_reward_1": 0.9452759738142577, "train/sim_max_reward_2": 0.0010936468400468973, "train/sim_max_reward_3": 0.11370081673661497, "train/sim_max_reward_4": 0.9854867012230695, "train/sim_max_reward_5": 0.5102037182723679, "test/sim_max_reward_4400000": 0.9565416738292932, "test/sim_max_reward_4400001": 0.9537649426436413, "test/sim_max_reward_4400002": 0.5691847154803839, "test/sim_max_reward_4400003": 0.8836714693306114, "test/sim_max_reward_4400004": 0.4722329037831755, "test/sim_max_reward_4400005": 0.9614335811650114, "test/sim_max_reward_4400006": 0.2991445229620346, "test/sim_max_reward_4400007": 0.4073457510540723, "test/sim_max_reward_4400008": 0.6115724184566232, "test/sim_max_reward_4400009": 0.02996840917777387, "test/sim_max_reward_4400010": 0.8362881720105907, "test/sim_max_reward_4400011": 0.2943051346332886, "test/sim_max_reward_4400012": 0.4207828732830302, "test/sim_max_reward_4400013": 0.9598566162562066, "test/sim_max_reward_4400014": 0.987014085020581, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.09279930934132405, "test/sim_max_reward_4400018": 0.9152760383110101, "test/sim_max_reward_4400019": 0.489485788332387, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.6011943237904844, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.14020195477439726, "test/sim_max_reward_4400024": 0.9053444589799106, "test/sim_max_reward_4400025": 0.7191115342967913, "test/sim_max_reward_4400026": 0.9672716867671511, "test/sim_max_reward_4400027": 0.4571639043785056, "test/sim_max_reward_4400028": 0.9610944921074356, "test/sim_max_reward_4400029": 0.8809795861152232, "test/sim_max_reward_4400030": 0.9808206902796551, "test/sim_max_reward_4400031": 0.897096095625586, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.4694171306304294, "test/sim_max_reward_4400034": 0.6345285260221284, "test/sim_max_reward_4400035": 0.8738936524435758, "test/sim_max_reward_4400036": 0.3765373390327301, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.32676290586270307, "test/sim_max_reward_4400039": 0.9631683148982346, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.17075643271307875, "test/sim_max_reward_4400042": 0.18118035729053644, "test/sim_max_reward_4400043": 0.02498390151891271, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 0.9971088791402268, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.5365972391653046, "test/mean_score": 0.5533898999469011, "val_loss": 292598.53125, "train_action_mse_error": 1.5994887351989746} {"train_loss": -12.667886734008789, "global_step": 378168, "epoch": 2251} {"train_loss": -12.474406242370605, "global_step": 378169, "epoch": 2251} {"train_loss": -12.254963874816895, "global_step": 378170, "epoch": 2251} {"train_loss": -12.591116905212402, "global_step": 378171, "epoch": 2251} {"train_loss": -12.459705352783203, "global_step": 378172, "epoch": 2251} {"train_loss": -12.01826286315918, "global_step": 378173, "epoch": 2251} {"train_loss": -10.805999755859375, "global_step": 378174, "epoch": 2251} {"train_loss": -10.389822006225586, "global_step": 378175, "epoch": 2251} {"train_loss": -11.502659797668457, "global_step": 378176, "epoch": 2251} {"train_loss": -12.020395278930664, "global_step": 378177, "epoch": 2251} {"train_loss": -10.95374870300293, "global_step": 378178, "epoch": 2251} {"train_loss": -12.145928382873535, "global_step": 378179, "epoch": 2251} {"train_loss": -10.886561393737793, "global_step": 378180, "epoch": 2251} {"train_loss": -11.339847564697266, "global_step": 378181, "epoch": 2251} {"train_loss": -11.542488098144531, "global_step": 378182, "epoch": 2251} {"train_loss": -10.961405754089355, "global_step": 378183, "epoch": 2251} {"train_loss": -11.719795227050781, "global_step": 378184, "epoch": 2251} {"train_loss": -11.939711570739746, "global_step": 378185, "epoch": 2251} {"train_loss": -11.906789779663086, "global_step": 378186, "epoch": 2251} {"train_loss": -11.574699401855469, "global_step": 378187, "epoch": 2251} {"train_loss": -11.114021301269531, "global_step": 378188, "epoch": 2251} {"train_loss": -10.109210968017578, "global_step": 378189, "epoch": 2251} {"train_loss": -9.947117805480957, "global_step": 378190, "epoch": 2251} {"train_loss": -10.381050109863281, "global_step": 378191, "epoch": 2251} {"train_loss": -10.311500549316406, "global_step": 378192, "epoch": 2251} {"train_loss": -11.498699188232422, "global_step": 378193, "epoch": 2251} {"train_loss": -10.772628784179688, "global_step": 378194, "epoch": 2251} {"train_loss": -11.493509292602539, "global_step": 378195, "epoch": 2251} {"train_loss": -11.38327693939209, "global_step": 378196, "epoch": 2251} {"train_loss": -11.554682731628418, "global_step": 378197, "epoch": 2251} {"train_loss": -11.504440307617188, "global_step": 378198, "epoch": 2251} {"train_loss": -11.608983993530273, "global_step": 378199, "epoch": 2251} {"train_loss": -12.005559921264648, "global_step": 378200, "epoch": 2251} {"train_loss": -11.641843795776367, "global_step": 378201, "epoch": 2251} {"train_loss": -11.816356658935547, "global_step": 378202, "epoch": 2251} {"train_loss": -11.922496795654297, "global_step": 378203, "epoch": 2251} {"train_loss": -11.990888595581055, "global_step": 378204, "epoch": 2251} {"train_loss": -12.200600624084473, "global_step": 378205, "epoch": 2251} {"train_loss": -12.425060272216797, "global_step": 378206, "epoch": 2251} {"train_loss": -11.99570083618164, "global_step": 378207, "epoch": 2251} {"train_loss": -12.146256446838379, "global_step": 378208, "epoch": 2251} {"train_loss": -11.93186092376709, "global_step": 378209, "epoch": 2251} {"train_loss": -12.409173011779785, "global_step": 378210, "epoch": 2251} {"train_loss": -12.097041130065918, "global_step": 378211, "epoch": 2251} {"train_loss": -12.350093841552734, "global_step": 378212, "epoch": 2251} {"train_loss": -12.146684646606445, "global_step": 378213, "epoch": 2251} {"train_loss": -12.286819458007812, "global_step": 378214, "epoch": 2251} {"train_loss": -12.012020111083984, "global_step": 378215, "epoch": 2251} {"train_loss": -12.053873062133789, "global_step": 378216, "epoch": 2251} {"train_loss": -12.228361129760742, "global_step": 378217, "epoch": 2251} {"train_loss": -12.30128002166748, "global_step": 378218, "epoch": 2251} {"train_loss": -12.223955154418945, "global_step": 378219, "epoch": 2251} {"train_loss": -12.298940658569336, "global_step": 378220, "epoch": 2251} {"train_loss": -12.277582168579102, "global_step": 378221, "epoch": 2251} {"train_loss": -12.537994384765625, "global_step": 378222, "epoch": 2251} {"train_loss": -12.111605644226074, "global_step": 378223, "epoch": 2251} {"train_loss": -12.317033767700195, "global_step": 378224, "epoch": 2251} {"train_loss": -11.909904479980469, "global_step": 378225, "epoch": 2251} {"train_loss": -12.350414276123047, "global_step": 378226, "epoch": 2251} {"train_loss": -12.11617660522461, "global_step": 378227, "epoch": 2251} {"train_loss": -12.546477317810059, "global_step": 378228, "epoch": 2251} {"train_loss": -12.267365455627441, "global_step": 378229, "epoch": 2251} {"train_loss": -12.122675895690918, "global_step": 378230, "epoch": 2251} {"train_loss": -12.644323348999023, "global_step": 378231, "epoch": 2251} {"train_loss": -11.851577758789062, "global_step": 378232, "epoch": 2251} {"train_loss": -12.34256362915039, "global_step": 378233, "epoch": 2251} {"train_loss": -12.333359718322754, "global_step": 378234, "epoch": 2251} {"train_loss": -11.945489883422852, "global_step": 378235, "epoch": 2251} {"train_loss": -12.29957389831543, "global_step": 378236, "epoch": 2251} {"train_loss": -11.912345886230469, "global_step": 378237, "epoch": 2251} {"train_loss": -11.662897109985352, "global_step": 378238, "epoch": 2251} {"train_loss": -12.470996856689453, "global_step": 378239, "epoch": 2251} {"train_loss": -12.506406784057617, "global_step": 378240, "epoch": 2251} {"train_loss": -12.126773834228516, "global_step": 378241, "epoch": 2251} {"train_loss": -12.504829406738281, "global_step": 378242, "epoch": 2251} {"train_loss": -11.92004680633545, "global_step": 378243, "epoch": 2251} {"train_loss": -12.026073455810547, "global_step": 378244, "epoch": 2251} {"train_loss": -12.352829933166504, "global_step": 378245, "epoch": 2251} {"train_loss": -11.879633903503418, "global_step": 378246, "epoch": 2251} {"train_loss": -12.075818061828613, "global_step": 378247, "epoch": 2251} {"train_loss": -12.258386611938477, "global_step": 378248, "epoch": 2251} {"train_loss": -12.359444618225098, "global_step": 378249, "epoch": 2251} {"train_loss": -12.082091331481934, "global_step": 378250, "epoch": 2251} {"train_loss": -11.906179428100586, "global_step": 378251, "epoch": 2251} {"train_loss": -12.763256072998047, "global_step": 378252, "epoch": 2251} {"train_loss": -12.368387222290039, "global_step": 378253, "epoch": 2251} {"train_loss": -12.532787322998047, "global_step": 378254, "epoch": 2251} {"train_loss": -12.364900588989258, "global_step": 378255, "epoch": 2251} {"train_loss": -12.009587287902832, "global_step": 378256, "epoch": 2251} {"train_loss": -11.943556785583496, "global_step": 378257, "epoch": 2251} {"train_loss": -12.131986618041992, "global_step": 378258, "epoch": 2251} {"train_loss": -12.13361930847168, "global_step": 378259, "epoch": 2251} {"train_loss": -12.435832977294922, "global_step": 378260, "epoch": 2251} {"train_loss": -11.473603248596191, "global_step": 378261, "epoch": 2251} {"train_loss": -12.514299392700195, "global_step": 378262, "epoch": 2251} {"train_loss": -11.89023494720459, "global_step": 378263, "epoch": 2251} {"train_loss": -12.42251968383789, "global_step": 378264, "epoch": 2251} {"train_loss": -12.514822006225586, "global_step": 378265, "epoch": 2251} {"train_loss": -12.216951370239258, "global_step": 378266, "epoch": 2251} {"train_loss": -12.206047058105469, "global_step": 378267, "epoch": 2251} {"train_loss": -12.435030937194824, "global_step": 378268, "epoch": 2251} {"train_loss": -12.204597473144531, "global_step": 378269, "epoch": 2251} {"train_loss": -12.216934204101562, "global_step": 378270, "epoch": 2251} {"train_loss": -12.576400756835938, "global_step": 378271, "epoch": 2251} {"train_loss": -12.42802906036377, "global_step": 378272, "epoch": 2251} {"train_loss": -12.508794784545898, "global_step": 378273, "epoch": 2251} {"train_loss": -11.89332103729248, "global_step": 378274, "epoch": 2251} {"train_loss": -11.734625816345215, "global_step": 378275, "epoch": 2251} {"train_loss": -12.345443725585938, "global_step": 378276, "epoch": 2251} {"train_loss": -12.129148483276367, "global_step": 378277, "epoch": 2251} {"train_loss": -11.866865158081055, "global_step": 378278, "epoch": 2251} {"train_loss": -11.284799575805664, "global_step": 378279, "epoch": 2251} {"train_loss": -12.149020195007324, "global_step": 378280, "epoch": 2251} {"train_loss": -12.011808395385742, "global_step": 378281, "epoch": 2251} {"train_loss": -11.415799140930176, "global_step": 378282, "epoch": 2251} {"train_loss": -11.99233627319336, "global_step": 378283, "epoch": 2251} {"train_loss": -12.165528297424316, "global_step": 378284, "epoch": 2251} {"train_loss": -12.443215370178223, "global_step": 378285, "epoch": 2251} {"train_loss": -12.496539115905762, "global_step": 378286, "epoch": 2251} {"train_loss": -12.54873275756836, "global_step": 378287, "epoch": 2251} {"train_loss": -12.234930992126465, "global_step": 378288, "epoch": 2251} {"train_loss": -12.28506851196289, "global_step": 378289, "epoch": 2251} {"train_loss": -12.357864379882812, "global_step": 378290, "epoch": 2251} {"train_loss": -12.62343978881836, "global_step": 378291, "epoch": 2251} {"train_loss": -12.488365173339844, "global_step": 378292, "epoch": 2251} {"train_loss": -12.510994911193848, "global_step": 378293, "epoch": 2251} {"train_loss": -12.506292343139648, "global_step": 378294, "epoch": 2251} {"train_loss": -12.301840782165527, "global_step": 378295, "epoch": 2251} {"train_loss": -12.23238468170166, "global_step": 378296, "epoch": 2251} {"train_loss": -12.482067108154297, "global_step": 378297, "epoch": 2251} {"train_loss": -12.569631576538086, "global_step": 378298, "epoch": 2251} {"train_loss": -12.499783515930176, "global_step": 378299, "epoch": 2251} {"train_loss": -12.478743553161621, "global_step": 378300, "epoch": 2251} {"train_loss": -12.3323335647583, "global_step": 378301, "epoch": 2251} {"train_loss": -12.46153736114502, "global_step": 378302, "epoch": 2251} {"train_loss": -12.362330436706543, "global_step": 378303, "epoch": 2251} {"train_loss": -12.073619842529297, "global_step": 378304, "epoch": 2251} {"train_loss": -11.94851016998291, "global_step": 378305, "epoch": 2251} {"train_loss": -12.073974609375, "global_step": 378306, "epoch": 2251} {"train_loss": -12.13411808013916, "global_step": 378307, "epoch": 2251} {"train_loss": -11.765960693359375, "global_step": 378308, "epoch": 2251} {"train_loss": -12.373042106628418, "global_step": 378309, "epoch": 2251} {"train_loss": -12.191097259521484, "global_step": 378310, "epoch": 2251} {"train_loss": -12.42391586303711, "global_step": 378311, "epoch": 2251} {"train_loss": -11.773714065551758, "global_step": 378312, "epoch": 2251} {"train_loss": -12.730852127075195, "global_step": 378313, "epoch": 2251} {"train_loss": -11.878039360046387, "global_step": 378314, "epoch": 2251} {"train_loss": -11.660322189331055, "global_step": 378315, "epoch": 2251} {"train_loss": -11.936717987060547, "global_step": 378316, "epoch": 2251} {"train_loss": -11.42873764038086, "global_step": 378317, "epoch": 2251} {"train_loss": -12.159761428833008, "global_step": 378318, "epoch": 2251} {"train_loss": -12.156906127929688, "global_step": 378319, "epoch": 2251} {"train_loss": -11.834518432617188, "global_step": 378320, "epoch": 2251} {"train_loss": -11.71291732788086, "global_step": 378321, "epoch": 2251} {"train_loss": -11.686601638793945, "global_step": 378322, "epoch": 2251} {"train_loss": -10.972793579101562, "global_step": 378323, "epoch": 2251} {"train_loss": -11.527237892150879, "global_step": 378324, "epoch": 2251} {"train_loss": -11.800670623779297, "global_step": 378325, "epoch": 2251} {"train_loss": -12.021343231201172, "global_step": 378326, "epoch": 2251} {"train_loss": -11.80965518951416, "global_step": 378327, "epoch": 2251} {"train_loss": -11.54802417755127, "global_step": 378328, "epoch": 2251} {"train_loss": -11.173192977905273, "global_step": 378329, "epoch": 2251} {"train_loss": -11.783757209777832, "global_step": 378330, "epoch": 2251} {"train_loss": -10.201013565063477, "global_step": 378331, "epoch": 2251} {"train_loss": -11.851146697998047, "global_step": 378332, "epoch": 2251} {"train_loss": -10.977848052978516, "global_step": 378333, "epoch": 2251} {"train_loss": -12.072317123413086, "global_step": 378334, "epoch": 2251} {"train_loss": -11.983377280689421, "global_step": 378335, "epoch": 2251, "val_loss": 293783.40625} {"train_loss": -10.689218521118164, "global_step": 378336, "epoch": 2252} {"train_loss": -11.941542625427246, "global_step": 378337, "epoch": 2252} {"train_loss": -11.53937816619873, "global_step": 378338, "epoch": 2252} {"train_loss": -11.11408805847168, "global_step": 378339, "epoch": 2252} {"train_loss": -12.028632164001465, "global_step": 378340, "epoch": 2252} {"train_loss": -11.929937362670898, "global_step": 378341, "epoch": 2252} {"train_loss": -11.943571090698242, "global_step": 378342, "epoch": 2252} {"train_loss": -11.8441801071167, "global_step": 378343, "epoch": 2252} {"train_loss": -11.950700759887695, "global_step": 378344, "epoch": 2252} {"train_loss": -12.338757514953613, "global_step": 378345, "epoch": 2252} {"train_loss": -11.3258638381958, "global_step": 378346, "epoch": 2252} {"train_loss": -12.179805755615234, "global_step": 378347, "epoch": 2252} {"train_loss": -11.561882019042969, "global_step": 378348, "epoch": 2252} {"train_loss": -12.40227222442627, "global_step": 378349, "epoch": 2252} {"train_loss": -12.172896385192871, "global_step": 378350, "epoch": 2252} {"train_loss": -12.03575325012207, "global_step": 378351, "epoch": 2252} {"train_loss": -11.68832778930664, "global_step": 378352, "epoch": 2252} {"train_loss": -11.995600700378418, "global_step": 378353, "epoch": 2252} {"train_loss": -11.97840690612793, "global_step": 378354, "epoch": 2252} {"train_loss": -11.803772926330566, "global_step": 378355, "epoch": 2252} {"train_loss": -11.824953079223633, "global_step": 378356, "epoch": 2252} {"train_loss": -11.720074653625488, "global_step": 378357, "epoch": 2252} {"train_loss": -12.035326957702637, "global_step": 378358, "epoch": 2252} {"train_loss": -11.780169486999512, "global_step": 378359, "epoch": 2252} {"train_loss": -12.29328727722168, "global_step": 378360, "epoch": 2252} {"train_loss": -11.237512588500977, "global_step": 378361, "epoch": 2252} {"train_loss": -12.038527488708496, "global_step": 378362, "epoch": 2252} {"train_loss": -11.059964179992676, "global_step": 378363, "epoch": 2252} {"train_loss": -11.386110305786133, "global_step": 378364, "epoch": 2252} {"train_loss": -11.081045150756836, "global_step": 378365, "epoch": 2252} {"train_loss": -11.442792892456055, "global_step": 378366, "epoch": 2252} {"train_loss": -11.773136138916016, "global_step": 378367, "epoch": 2252} {"train_loss": -10.152064323425293, "global_step": 378368, "epoch": 2252} {"train_loss": -10.565299987792969, "global_step": 378369, "epoch": 2252} {"train_loss": -10.329887390136719, "global_step": 378370, "epoch": 2252} {"train_loss": -9.952552795410156, "global_step": 378371, "epoch": 2252} {"train_loss": -11.653875350952148, "global_step": 378372, "epoch": 2252} {"train_loss": -8.99702262878418, "global_step": 378373, "epoch": 2252} {"train_loss": -9.774129867553711, "global_step": 378374, "epoch": 2252} {"train_loss": -10.51848316192627, "global_step": 378375, "epoch": 2252} {"train_loss": -10.271157264709473, "global_step": 378376, "epoch": 2252} {"train_loss": -10.40597152709961, "global_step": 378377, "epoch": 2252} {"train_loss": -11.087886810302734, "global_step": 378378, "epoch": 2252} {"train_loss": -10.129712104797363, "global_step": 378379, "epoch": 2252} {"train_loss": -9.925863265991211, "global_step": 378380, "epoch": 2252} {"train_loss": -11.306100845336914, "global_step": 378381, "epoch": 2252} {"train_loss": -9.816884994506836, "global_step": 378382, "epoch": 2252} {"train_loss": -9.70950698852539, "global_step": 378383, "epoch": 2252} {"train_loss": -11.957210540771484, "global_step": 378384, "epoch": 2252} {"train_loss": -10.569931030273438, "global_step": 378385, "epoch": 2252} {"train_loss": -10.076199531555176, "global_step": 378386, "epoch": 2252} {"train_loss": -11.325973510742188, "global_step": 378387, "epoch": 2252} {"train_loss": -10.329052925109863, "global_step": 378388, "epoch": 2252} {"train_loss": -10.76911449432373, "global_step": 378389, "epoch": 2252} {"train_loss": -11.986918449401855, "global_step": 378390, "epoch": 2252} {"train_loss": -11.143560409545898, "global_step": 378391, "epoch": 2252} {"train_loss": -11.560030937194824, "global_step": 378392, "epoch": 2252} {"train_loss": -11.651805877685547, "global_step": 378393, "epoch": 2252} {"train_loss": -11.390237808227539, "global_step": 378394, "epoch": 2252} {"train_loss": -11.351425170898438, "global_step": 378395, "epoch": 2252} {"train_loss": -11.90266227722168, "global_step": 378396, "epoch": 2252} {"train_loss": -11.009557723999023, "global_step": 378397, "epoch": 2252} {"train_loss": -11.797042846679688, "global_step": 378398, "epoch": 2252} {"train_loss": -11.423089981079102, "global_step": 378399, "epoch": 2252} {"train_loss": -10.997112274169922, "global_step": 378400, "epoch": 2252} {"train_loss": -11.728960037231445, "global_step": 378401, "epoch": 2252} {"train_loss": -11.745645523071289, "global_step": 378402, "epoch": 2252} {"train_loss": -11.549178123474121, "global_step": 378403, "epoch": 2252} {"train_loss": -11.522787094116211, "global_step": 378404, "epoch": 2252} {"train_loss": -11.78119945526123, "global_step": 378405, "epoch": 2252} {"train_loss": -11.448948860168457, "global_step": 378406, "epoch": 2252} {"train_loss": -12.061005592346191, "global_step": 378407, "epoch": 2252} {"train_loss": -11.51310920715332, "global_step": 378408, "epoch": 2252} {"train_loss": -12.048568725585938, "global_step": 378409, "epoch": 2252} {"train_loss": -11.828372955322266, "global_step": 378410, "epoch": 2252} {"train_loss": -11.971851348876953, "global_step": 378411, "epoch": 2252} {"train_loss": -12.088171005249023, "global_step": 378412, "epoch": 2252} {"train_loss": -11.91876220703125, "global_step": 378413, "epoch": 2252} {"train_loss": -12.343791961669922, "global_step": 378414, "epoch": 2252} {"train_loss": -11.961408615112305, "global_step": 378415, "epoch": 2252} {"train_loss": -12.211851119995117, "global_step": 378416, "epoch": 2252} {"train_loss": -11.89096736907959, "global_step": 378417, "epoch": 2252} {"train_loss": -12.320775032043457, "global_step": 378418, "epoch": 2252} {"train_loss": -12.081483840942383, "global_step": 378419, "epoch": 2252} {"train_loss": -12.165380477905273, "global_step": 378420, "epoch": 2252} {"train_loss": -12.33682918548584, "global_step": 378421, "epoch": 2252} {"train_loss": -12.134848594665527, "global_step": 378422, "epoch": 2252} {"train_loss": -12.327613830566406, "global_step": 378423, "epoch": 2252} {"train_loss": -12.217004776000977, "global_step": 378424, "epoch": 2252} {"train_loss": -12.475737571716309, "global_step": 378425, "epoch": 2252} {"train_loss": -12.18709945678711, "global_step": 378426, "epoch": 2252} {"train_loss": -12.291415214538574, "global_step": 378427, "epoch": 2252} {"train_loss": -12.264179229736328, "global_step": 378428, "epoch": 2252} {"train_loss": -12.123034477233887, "global_step": 378429, "epoch": 2252} {"train_loss": -12.186067581176758, "global_step": 378430, "epoch": 2252} {"train_loss": -12.274105072021484, "global_step": 378431, "epoch": 2252} {"train_loss": -11.91714859008789, "global_step": 378432, "epoch": 2252} {"train_loss": -12.032360076904297, "global_step": 378433, "epoch": 2252} {"train_loss": -12.262443542480469, "global_step": 378434, "epoch": 2252} {"train_loss": -12.18017864227295, "global_step": 378435, "epoch": 2252} {"train_loss": -12.30029296875, "global_step": 378436, "epoch": 2252} {"train_loss": -12.395609855651855, "global_step": 378437, "epoch": 2252} {"train_loss": -12.418034553527832, "global_step": 378438, "epoch": 2252} {"train_loss": -12.28524112701416, "global_step": 378439, "epoch": 2252} {"train_loss": -12.252593994140625, "global_step": 378440, "epoch": 2252} {"train_loss": -12.530801773071289, "global_step": 378441, "epoch": 2252} {"train_loss": -12.260452270507812, "global_step": 378442, "epoch": 2252} {"train_loss": -12.389432907104492, "global_step": 378443, "epoch": 2252} {"train_loss": -12.437440872192383, "global_step": 378444, "epoch": 2252} {"train_loss": -12.29106330871582, "global_step": 378445, "epoch": 2252} {"train_loss": -12.488090515136719, "global_step": 378446, "epoch": 2252} {"train_loss": -12.279970169067383, "global_step": 378447, "epoch": 2252} {"train_loss": -12.457950592041016, "global_step": 378448, "epoch": 2252} {"train_loss": -12.282247543334961, "global_step": 378449, "epoch": 2252} {"train_loss": -12.622650146484375, "global_step": 378450, "epoch": 2252} {"train_loss": -12.654890060424805, "global_step": 378451, "epoch": 2252} {"train_loss": -12.373022079467773, "global_step": 378452, "epoch": 2252} {"train_loss": -12.424992561340332, "global_step": 378453, "epoch": 2252} {"train_loss": -12.591297149658203, "global_step": 378454, "epoch": 2252} {"train_loss": -12.438741683959961, "global_step": 378455, "epoch": 2252} {"train_loss": -12.5185546875, "global_step": 378456, "epoch": 2252} {"train_loss": -12.521324157714844, "global_step": 378457, "epoch": 2252} {"train_loss": -12.675790786743164, "global_step": 378458, "epoch": 2252} {"train_loss": -12.451455116271973, "global_step": 378459, "epoch": 2252} {"train_loss": -12.420079231262207, "global_step": 378460, "epoch": 2252} {"train_loss": -12.600423812866211, "global_step": 378461, "epoch": 2252} {"train_loss": -12.35267448425293, "global_step": 378462, "epoch": 2252} {"train_loss": -12.658526420593262, "global_step": 378463, "epoch": 2252} {"train_loss": -12.589852333068848, "global_step": 378464, "epoch": 2252} {"train_loss": -12.34900188446045, "global_step": 378465, "epoch": 2252} {"train_loss": -12.62575912475586, "global_step": 378466, "epoch": 2252} {"train_loss": -12.609783172607422, "global_step": 378467, "epoch": 2252} {"train_loss": -12.640968322753906, "global_step": 378468, "epoch": 2252} {"train_loss": -12.569602966308594, "global_step": 378469, "epoch": 2252} {"train_loss": -12.664676666259766, "global_step": 378470, "epoch": 2252} {"train_loss": -12.68870735168457, "global_step": 378471, "epoch": 2252} {"train_loss": -12.651957511901855, "global_step": 378472, "epoch": 2252} {"train_loss": -12.647771835327148, "global_step": 378473, "epoch": 2252} {"train_loss": -12.55629825592041, "global_step": 378474, "epoch": 2252} {"train_loss": -12.773775100708008, "global_step": 378475, "epoch": 2252} {"train_loss": -12.687821388244629, "global_step": 378476, "epoch": 2252} {"train_loss": -12.573966026306152, "global_step": 378477, "epoch": 2252} {"train_loss": -12.894100189208984, "global_step": 378478, "epoch": 2252} {"train_loss": -12.662940979003906, "global_step": 378479, "epoch": 2252} {"train_loss": -12.720047950744629, "global_step": 378480, "epoch": 2252} {"train_loss": -12.686918258666992, "global_step": 378481, "epoch": 2252} {"train_loss": -12.864030838012695, "global_step": 378482, "epoch": 2252} {"train_loss": -12.578304290771484, "global_step": 378483, "epoch": 2252} {"train_loss": -12.297295570373535, "global_step": 378484, "epoch": 2252} {"train_loss": -12.554441452026367, "global_step": 378485, "epoch": 2252} {"train_loss": -12.549650192260742, "global_step": 378486, "epoch": 2252} {"train_loss": -12.422203063964844, "global_step": 378487, "epoch": 2252} {"train_loss": -12.808055877685547, "global_step": 378488, "epoch": 2252} {"train_loss": -12.11723804473877, "global_step": 378489, "epoch": 2252} {"train_loss": -11.994401931762695, "global_step": 378490, "epoch": 2252} {"train_loss": -11.55370044708252, "global_step": 378491, "epoch": 2252} {"train_loss": -10.803464889526367, "global_step": 378492, "epoch": 2252} {"train_loss": -11.756540298461914, "global_step": 378493, "epoch": 2252} {"train_loss": -12.241323471069336, "global_step": 378494, "epoch": 2252} {"train_loss": -10.706463813781738, "global_step": 378495, "epoch": 2252} {"train_loss": -9.364828109741211, "global_step": 378496, "epoch": 2252} {"train_loss": -11.669449806213379, "global_step": 378497, "epoch": 2252} {"train_loss": -10.754196166992188, "global_step": 378498, "epoch": 2252} {"train_loss": -9.339838027954102, "global_step": 378499, "epoch": 2252} {"train_loss": -10.696342468261719, "global_step": 378500, "epoch": 2252} {"train_loss": -10.56791877746582, "global_step": 378501, "epoch": 2252} {"train_loss": -10.580968856811523, "global_step": 378502, "epoch": 2252} {"train_loss": -11.80669561454228, "global_step": 378503, "epoch": 2252, "val_loss": 292221.9375} {"train_loss": -10.657405853271484, "global_step": 378504, "epoch": 2253} {"train_loss": -11.955025672912598, "global_step": 378505, "epoch": 2253} {"train_loss": -10.503375053405762, "global_step": 378506, "epoch": 2253} {"train_loss": -10.787667274475098, "global_step": 378507, "epoch": 2253} {"train_loss": -11.8915433883667, "global_step": 378508, "epoch": 2253} {"train_loss": -9.727155685424805, "global_step": 378509, "epoch": 2253} {"train_loss": -11.628558158874512, "global_step": 378510, "epoch": 2253} {"train_loss": -11.379161834716797, "global_step": 378511, "epoch": 2253} {"train_loss": -11.351532936096191, "global_step": 378512, "epoch": 2253} {"train_loss": -11.832038879394531, "global_step": 378513, "epoch": 2253} {"train_loss": -11.353260040283203, "global_step": 378514, "epoch": 2253} {"train_loss": -11.400619506835938, "global_step": 378515, "epoch": 2253} {"train_loss": -11.744158744812012, "global_step": 378516, "epoch": 2253} {"train_loss": -11.765031814575195, "global_step": 378517, "epoch": 2253} {"train_loss": -12.208390235900879, "global_step": 378518, "epoch": 2253} {"train_loss": -11.842312812805176, "global_step": 378519, "epoch": 2253} {"train_loss": -11.94757080078125, "global_step": 378520, "epoch": 2253} {"train_loss": -11.67906665802002, "global_step": 378521, "epoch": 2253} {"train_loss": -11.91556167602539, "global_step": 378522, "epoch": 2253} {"train_loss": -11.87392807006836, "global_step": 378523, "epoch": 2253} {"train_loss": -12.441591262817383, "global_step": 378524, "epoch": 2253} {"train_loss": -12.00631332397461, "global_step": 378525, "epoch": 2253} {"train_loss": -12.331818580627441, "global_step": 378526, "epoch": 2253} {"train_loss": -11.867913246154785, "global_step": 378527, "epoch": 2253} {"train_loss": -12.19961166381836, "global_step": 378528, "epoch": 2253} {"train_loss": -12.112043380737305, "global_step": 378529, "epoch": 2253} {"train_loss": -12.324223518371582, "global_step": 378530, "epoch": 2253} {"train_loss": -12.272175788879395, "global_step": 378531, "epoch": 2253} {"train_loss": -12.34797477722168, "global_step": 378532, "epoch": 2253} {"train_loss": -12.403907775878906, "global_step": 378533, "epoch": 2253} {"train_loss": -12.573854446411133, "global_step": 378534, "epoch": 2253} {"train_loss": -12.30292797088623, "global_step": 378535, "epoch": 2253} {"train_loss": -12.46750259399414, "global_step": 378536, "epoch": 2253} {"train_loss": -12.225919723510742, "global_step": 378537, "epoch": 2253} {"train_loss": -12.25709342956543, "global_step": 378538, "epoch": 2253} {"train_loss": -12.59666633605957, "global_step": 378539, "epoch": 2253} {"train_loss": -12.162202835083008, "global_step": 378540, "epoch": 2253} {"train_loss": -12.29594612121582, "global_step": 378541, "epoch": 2253} {"train_loss": -12.35548210144043, "global_step": 378542, "epoch": 2253} {"train_loss": -12.731487274169922, "global_step": 378543, "epoch": 2253} {"train_loss": -12.14598560333252, "global_step": 378544, "epoch": 2253} {"train_loss": -12.519247055053711, "global_step": 378545, "epoch": 2253} {"train_loss": -12.498964309692383, "global_step": 378546, "epoch": 2253} {"train_loss": -12.319578170776367, "global_step": 378547, "epoch": 2253} {"train_loss": -12.589111328125, "global_step": 378548, "epoch": 2253} {"train_loss": -12.264131546020508, "global_step": 378549, "epoch": 2253} {"train_loss": -12.360943794250488, "global_step": 378550, "epoch": 2253} {"train_loss": -11.992202758789062, "global_step": 378551, "epoch": 2253} {"train_loss": -12.401602745056152, "global_step": 378552, "epoch": 2253} {"train_loss": -12.10308837890625, "global_step": 378553, "epoch": 2253} {"train_loss": -12.206230163574219, "global_step": 378554, "epoch": 2253} {"train_loss": -12.035229682922363, "global_step": 378555, "epoch": 2253} {"train_loss": -12.217428207397461, "global_step": 378556, "epoch": 2253} {"train_loss": -11.839258193969727, "global_step": 378557, "epoch": 2253} {"train_loss": -12.273287773132324, "global_step": 378558, "epoch": 2253} {"train_loss": -11.985395431518555, "global_step": 378559, "epoch": 2253} {"train_loss": -12.188913345336914, "global_step": 378560, "epoch": 2253} {"train_loss": -11.951799392700195, "global_step": 378561, "epoch": 2253} {"train_loss": -12.184778213500977, "global_step": 378562, "epoch": 2253} {"train_loss": -12.308152198791504, "global_step": 378563, "epoch": 2253} {"train_loss": -12.537399291992188, "global_step": 378564, "epoch": 2253} {"train_loss": -12.150352478027344, "global_step": 378565, "epoch": 2253} {"train_loss": -12.572158813476562, "global_step": 378566, "epoch": 2253} {"train_loss": -12.292083740234375, "global_step": 378567, "epoch": 2253} {"train_loss": -12.510370254516602, "global_step": 378568, "epoch": 2253} {"train_loss": -12.470352172851562, "global_step": 378569, "epoch": 2253} {"train_loss": -12.377274513244629, "global_step": 378570, "epoch": 2253} {"train_loss": -12.303277969360352, "global_step": 378571, "epoch": 2253} {"train_loss": -12.336433410644531, "global_step": 378572, "epoch": 2253} {"train_loss": -12.52074146270752, "global_step": 378573, "epoch": 2253} {"train_loss": -12.548515319824219, "global_step": 378574, "epoch": 2253} {"train_loss": -12.55367660522461, "global_step": 378575, "epoch": 2253} {"train_loss": -12.64737606048584, "global_step": 378576, "epoch": 2253} {"train_loss": -12.307709693908691, "global_step": 378577, "epoch": 2253} {"train_loss": -12.199197769165039, "global_step": 378578, "epoch": 2253} {"train_loss": -12.249208450317383, "global_step": 378579, "epoch": 2253} {"train_loss": -12.334190368652344, "global_step": 378580, "epoch": 2253} {"train_loss": -12.220359802246094, "global_step": 378581, "epoch": 2253} {"train_loss": -12.407491683959961, "global_step": 378582, "epoch": 2253} {"train_loss": -11.967405319213867, "global_step": 378583, "epoch": 2253} {"train_loss": -12.419598579406738, "global_step": 378584, "epoch": 2253} {"train_loss": -12.4241361618042, "global_step": 378585, "epoch": 2253} {"train_loss": -12.405189514160156, "global_step": 378586, "epoch": 2253} {"train_loss": -12.451074600219727, "global_step": 378587, "epoch": 2253} {"train_loss": -12.481817245483398, "global_step": 378588, "epoch": 2253} {"train_loss": -12.447420120239258, "global_step": 378589, "epoch": 2253} {"train_loss": -12.458911895751953, "global_step": 378590, "epoch": 2253} {"train_loss": -12.35319995880127, "global_step": 378591, "epoch": 2253} {"train_loss": -12.39907169342041, "global_step": 378592, "epoch": 2253} {"train_loss": -12.639778137207031, "global_step": 378593, "epoch": 2253} {"train_loss": -12.331537246704102, "global_step": 378594, "epoch": 2253} {"train_loss": -12.412680625915527, "global_step": 378595, "epoch": 2253} {"train_loss": -12.051763534545898, "global_step": 378596, "epoch": 2253} {"train_loss": -12.526191711425781, "global_step": 378597, "epoch": 2253} {"train_loss": -12.770637512207031, "global_step": 378598, "epoch": 2253} {"train_loss": -12.147865295410156, "global_step": 378599, "epoch": 2253} {"train_loss": -11.985505104064941, "global_step": 378600, "epoch": 2253} {"train_loss": -12.138395309448242, "global_step": 378601, "epoch": 2253} {"train_loss": -11.776139259338379, "global_step": 378602, "epoch": 2253} {"train_loss": -12.128724098205566, "global_step": 378603, "epoch": 2253} {"train_loss": -12.407892227172852, "global_step": 378604, "epoch": 2253} {"train_loss": -12.209806442260742, "global_step": 378605, "epoch": 2253} {"train_loss": -12.728901863098145, "global_step": 378606, "epoch": 2253} {"train_loss": -11.969376564025879, "global_step": 378607, "epoch": 2253} {"train_loss": -11.882848739624023, "global_step": 378608, "epoch": 2253} {"train_loss": -12.418166160583496, "global_step": 378609, "epoch": 2253} {"train_loss": -12.447589874267578, "global_step": 378610, "epoch": 2253} {"train_loss": -11.546777725219727, "global_step": 378611, "epoch": 2253} {"train_loss": -11.755746841430664, "global_step": 378612, "epoch": 2253} {"train_loss": -12.24007797241211, "global_step": 378613, "epoch": 2253} {"train_loss": -12.34462833404541, "global_step": 378614, "epoch": 2253} {"train_loss": -12.33935546875, "global_step": 378615, "epoch": 2253} {"train_loss": -12.379484176635742, "global_step": 378616, "epoch": 2253} {"train_loss": -12.507272720336914, "global_step": 378617, "epoch": 2253} {"train_loss": -12.20323371887207, "global_step": 378618, "epoch": 2253} {"train_loss": -12.148646354675293, "global_step": 378619, "epoch": 2253} {"train_loss": -11.960294723510742, "global_step": 378620, "epoch": 2253} {"train_loss": -12.146862983703613, "global_step": 378621, "epoch": 2253} {"train_loss": -12.290517807006836, "global_step": 378622, "epoch": 2253} {"train_loss": -12.440181732177734, "global_step": 378623, "epoch": 2253} {"train_loss": -12.186918258666992, "global_step": 378624, "epoch": 2253} {"train_loss": -12.561120986938477, "global_step": 378625, "epoch": 2253} {"train_loss": -12.201229095458984, "global_step": 378626, "epoch": 2253} {"train_loss": -12.466014862060547, "global_step": 378627, "epoch": 2253} {"train_loss": -12.629772186279297, "global_step": 378628, "epoch": 2253} {"train_loss": -12.102775573730469, "global_step": 378629, "epoch": 2253} {"train_loss": -12.211923599243164, "global_step": 378630, "epoch": 2253} {"train_loss": -11.975112915039062, "global_step": 378631, "epoch": 2253} {"train_loss": -11.91966438293457, "global_step": 378632, "epoch": 2253} {"train_loss": -12.46506118774414, "global_step": 378633, "epoch": 2253} {"train_loss": -12.026498794555664, "global_step": 378634, "epoch": 2253} {"train_loss": -12.008718490600586, "global_step": 378635, "epoch": 2253} {"train_loss": -12.456514358520508, "global_step": 378636, "epoch": 2253} {"train_loss": -12.073060989379883, "global_step": 378637, "epoch": 2253} {"train_loss": -11.628196716308594, "global_step": 378638, "epoch": 2253} {"train_loss": -12.497466087341309, "global_step": 378639, "epoch": 2253} {"train_loss": -11.856647491455078, "global_step": 378640, "epoch": 2253} {"train_loss": -12.151338577270508, "global_step": 378641, "epoch": 2253} {"train_loss": -11.727808952331543, "global_step": 378642, "epoch": 2253} {"train_loss": -12.197023391723633, "global_step": 378643, "epoch": 2253} {"train_loss": -11.66208267211914, "global_step": 378644, "epoch": 2253} {"train_loss": -12.60333251953125, "global_step": 378645, "epoch": 2253} {"train_loss": -11.604097366333008, "global_step": 378646, "epoch": 2253} {"train_loss": -11.722871780395508, "global_step": 378647, "epoch": 2253} {"train_loss": -11.860639572143555, "global_step": 378648, "epoch": 2253} {"train_loss": -11.885520935058594, "global_step": 378649, "epoch": 2253} {"train_loss": -11.544347763061523, "global_step": 378650, "epoch": 2253} {"train_loss": -11.44974136352539, "global_step": 378651, "epoch": 2253} {"train_loss": -12.584959030151367, "global_step": 378652, "epoch": 2253} {"train_loss": -10.879239082336426, "global_step": 378653, "epoch": 2253} {"train_loss": -11.11526870727539, "global_step": 378654, "epoch": 2253} {"train_loss": -10.286116600036621, "global_step": 378655, "epoch": 2253} {"train_loss": -11.880280494689941, "global_step": 378656, "epoch": 2253} {"train_loss": -9.440038681030273, "global_step": 378657, "epoch": 2253} {"train_loss": -10.783798217773438, "global_step": 378658, "epoch": 2253} {"train_loss": -10.894083976745605, "global_step": 378659, "epoch": 2253} {"train_loss": -9.540674209594727, "global_step": 378660, "epoch": 2253} {"train_loss": -10.961688995361328, "global_step": 378661, "epoch": 2253} {"train_loss": -9.596883773803711, "global_step": 378662, "epoch": 2253} {"train_loss": -11.769838333129883, "global_step": 378663, "epoch": 2253} {"train_loss": -9.93522834777832, "global_step": 378664, "epoch": 2253} {"train_loss": -10.311622619628906, "global_step": 378665, "epoch": 2253} {"train_loss": -10.833442687988281, "global_step": 378666, "epoch": 2253} {"train_loss": -9.402612686157227, "global_step": 378667, "epoch": 2253} {"train_loss": -11.849504470825195, "global_step": 378668, "epoch": 2253} {"train_loss": -9.883474349975586, "global_step": 378669, "epoch": 2253} {"train_loss": -11.076091766357422, "global_step": 378670, "epoch": 2253} {"train_loss": -11.96468388466608, "global_step": 378671, "epoch": 2253, "val_loss": 291145.25} {"train_loss": -11.41046142578125, "global_step": 378672, "epoch": 2254} {"train_loss": -10.991878509521484, "global_step": 378673, "epoch": 2254} {"train_loss": -10.636259078979492, "global_step": 378674, "epoch": 2254} {"train_loss": -11.585439682006836, "global_step": 378675, "epoch": 2254} {"train_loss": -11.241722106933594, "global_step": 378676, "epoch": 2254} {"train_loss": -11.378357887268066, "global_step": 378677, "epoch": 2254} {"train_loss": -9.939372062683105, "global_step": 378678, "epoch": 2254} {"train_loss": -9.90135669708252, "global_step": 378679, "epoch": 2254} {"train_loss": -10.772228240966797, "global_step": 378680, "epoch": 2254} {"train_loss": -11.494173049926758, "global_step": 378681, "epoch": 2254} {"train_loss": -9.593080520629883, "global_step": 378682, "epoch": 2254} {"train_loss": -10.069547653198242, "global_step": 378683, "epoch": 2254} {"train_loss": -11.652968406677246, "global_step": 378684, "epoch": 2254} {"train_loss": -9.941177368164062, "global_step": 378685, "epoch": 2254} {"train_loss": -10.794363021850586, "global_step": 378686, "epoch": 2254} {"train_loss": -9.522680282592773, "global_step": 378687, "epoch": 2254} {"train_loss": -10.886659622192383, "global_step": 378688, "epoch": 2254} {"train_loss": -11.053187370300293, "global_step": 378689, "epoch": 2254} {"train_loss": -10.826138496398926, "global_step": 378690, "epoch": 2254} {"train_loss": -10.330133438110352, "global_step": 378691, "epoch": 2254} {"train_loss": -10.565413475036621, "global_step": 378692, "epoch": 2254} {"train_loss": -10.020637512207031, "global_step": 378693, "epoch": 2254} {"train_loss": -8.615779876708984, "global_step": 378694, "epoch": 2254} {"train_loss": -8.820040702819824, "global_step": 378695, "epoch": 2254} {"train_loss": -8.93515396118164, "global_step": 378696, "epoch": 2254} {"train_loss": -10.863430976867676, "global_step": 378697, "epoch": 2254} {"train_loss": -10.059049606323242, "global_step": 378698, "epoch": 2254} {"train_loss": -9.561954498291016, "global_step": 378699, "epoch": 2254} {"train_loss": -10.39161491394043, "global_step": 378700, "epoch": 2254} {"train_loss": -10.436452865600586, "global_step": 378701, "epoch": 2254} {"train_loss": -10.477500915527344, "global_step": 378702, "epoch": 2254} {"train_loss": -9.577079772949219, "global_step": 378703, "epoch": 2254} {"train_loss": -11.483386993408203, "global_step": 378704, "epoch": 2254} {"train_loss": -10.377235412597656, "global_step": 378705, "epoch": 2254} {"train_loss": -10.948051452636719, "global_step": 378706, "epoch": 2254} {"train_loss": -10.65865707397461, "global_step": 378707, "epoch": 2254} {"train_loss": -10.439188003540039, "global_step": 378708, "epoch": 2254} {"train_loss": -10.706639289855957, "global_step": 378709, "epoch": 2254} {"train_loss": -11.040350914001465, "global_step": 378710, "epoch": 2254} {"train_loss": -10.885578155517578, "global_step": 378711, "epoch": 2254} {"train_loss": -10.872105598449707, "global_step": 378712, "epoch": 2254} {"train_loss": -11.638620376586914, "global_step": 378713, "epoch": 2254} {"train_loss": -11.418680191040039, "global_step": 378714, "epoch": 2254} {"train_loss": -11.213621139526367, "global_step": 378715, "epoch": 2254} {"train_loss": -11.303077697753906, "global_step": 378716, "epoch": 2254} {"train_loss": -11.663814544677734, "global_step": 378717, "epoch": 2254} {"train_loss": -10.922365188598633, "global_step": 378718, "epoch": 2254} {"train_loss": -11.757495880126953, "global_step": 378719, "epoch": 2254} {"train_loss": -11.361421585083008, "global_step": 378720, "epoch": 2254} {"train_loss": -11.25167465209961, "global_step": 378721, "epoch": 2254} {"train_loss": -11.963111877441406, "global_step": 378722, "epoch": 2254} {"train_loss": -11.404191017150879, "global_step": 378723, "epoch": 2254} {"train_loss": -11.802818298339844, "global_step": 378724, "epoch": 2254} {"train_loss": -11.97035026550293, "global_step": 378725, "epoch": 2254} {"train_loss": -11.930031776428223, "global_step": 378726, "epoch": 2254} {"train_loss": -11.704017639160156, "global_step": 378727, "epoch": 2254} {"train_loss": -12.0232515335083, "global_step": 378728, "epoch": 2254} {"train_loss": -11.823444366455078, "global_step": 378729, "epoch": 2254} {"train_loss": -11.8368558883667, "global_step": 378730, "epoch": 2254} {"train_loss": -12.046639442443848, "global_step": 378731, "epoch": 2254} {"train_loss": -11.963027954101562, "global_step": 378732, "epoch": 2254} {"train_loss": -11.860698699951172, "global_step": 378733, "epoch": 2254} {"train_loss": -12.07512092590332, "global_step": 378734, "epoch": 2254} {"train_loss": -11.95169448852539, "global_step": 378735, "epoch": 2254} {"train_loss": -11.933175086975098, "global_step": 378736, "epoch": 2254} {"train_loss": -12.03184700012207, "global_step": 378737, "epoch": 2254} {"train_loss": -11.947511672973633, "global_step": 378738, "epoch": 2254} {"train_loss": -12.108925819396973, "global_step": 378739, "epoch": 2254} {"train_loss": -12.044668197631836, "global_step": 378740, "epoch": 2254} {"train_loss": -12.078535079956055, "global_step": 378741, "epoch": 2254} {"train_loss": -11.923933029174805, "global_step": 378742, "epoch": 2254} {"train_loss": -12.295269012451172, "global_step": 378743, "epoch": 2254} {"train_loss": -11.962481498718262, "global_step": 378744, "epoch": 2254} {"train_loss": -12.096043586730957, "global_step": 378745, "epoch": 2254} {"train_loss": -12.166423797607422, "global_step": 378746, "epoch": 2254} {"train_loss": -11.739892959594727, "global_step": 378747, "epoch": 2254} {"train_loss": -12.263635635375977, "global_step": 378748, "epoch": 2254} {"train_loss": -12.144702911376953, "global_step": 378749, "epoch": 2254} {"train_loss": -12.11649227142334, "global_step": 378750, "epoch": 2254} {"train_loss": -11.832632064819336, "global_step": 378751, "epoch": 2254} {"train_loss": -12.306164741516113, "global_step": 378752, "epoch": 2254} {"train_loss": -12.164600372314453, "global_step": 378753, "epoch": 2254} {"train_loss": -12.21783447265625, "global_step": 378754, "epoch": 2254} {"train_loss": -11.609881401062012, "global_step": 378755, "epoch": 2254} {"train_loss": -12.284655570983887, "global_step": 378756, "epoch": 2254} {"train_loss": -12.031783103942871, "global_step": 378757, "epoch": 2254} {"train_loss": -12.175655364990234, "global_step": 378758, "epoch": 2254} {"train_loss": -12.428890228271484, "global_step": 378759, "epoch": 2254} {"train_loss": -12.14642333984375, "global_step": 378760, "epoch": 2254} {"train_loss": -12.294767379760742, "global_step": 378761, "epoch": 2254} {"train_loss": -12.205666542053223, "global_step": 378762, "epoch": 2254} {"train_loss": -12.220633506774902, "global_step": 378763, "epoch": 2254} {"train_loss": -12.224788665771484, "global_step": 378764, "epoch": 2254} {"train_loss": -12.392927169799805, "global_step": 378765, "epoch": 2254} {"train_loss": -12.276938438415527, "global_step": 378766, "epoch": 2254} {"train_loss": -12.411332130432129, "global_step": 378767, "epoch": 2254} {"train_loss": -12.203439712524414, "global_step": 378768, "epoch": 2254} {"train_loss": -12.168120384216309, "global_step": 378769, "epoch": 2254} {"train_loss": -12.379016876220703, "global_step": 378770, "epoch": 2254} {"train_loss": -12.307512283325195, "global_step": 378771, "epoch": 2254} {"train_loss": -12.348939895629883, "global_step": 378772, "epoch": 2254} {"train_loss": -12.175609588623047, "global_step": 378773, "epoch": 2254} {"train_loss": -12.268892288208008, "global_step": 378774, "epoch": 2254} {"train_loss": -12.232624053955078, "global_step": 378775, "epoch": 2254} {"train_loss": -12.37425422668457, "global_step": 378776, "epoch": 2254} {"train_loss": -12.445528030395508, "global_step": 378777, "epoch": 2254} {"train_loss": -12.406469345092773, "global_step": 378778, "epoch": 2254} {"train_loss": -12.389936447143555, "global_step": 378779, "epoch": 2254} {"train_loss": -11.877509117126465, "global_step": 378780, "epoch": 2254} {"train_loss": -12.559470176696777, "global_step": 378781, "epoch": 2254} {"train_loss": -12.522372245788574, "global_step": 378782, "epoch": 2254} {"train_loss": -12.192211151123047, "global_step": 378783, "epoch": 2254} {"train_loss": -12.554484367370605, "global_step": 378784, "epoch": 2254} {"train_loss": -12.512275695800781, "global_step": 378785, "epoch": 2254} {"train_loss": -12.492668151855469, "global_step": 378786, "epoch": 2254} {"train_loss": -12.285327911376953, "global_step": 378787, "epoch": 2254} {"train_loss": -12.352644920349121, "global_step": 378788, "epoch": 2254} {"train_loss": -12.670095443725586, "global_step": 378789, "epoch": 2254} {"train_loss": -12.389436721801758, "global_step": 378790, "epoch": 2254} {"train_loss": -12.477638244628906, "global_step": 378791, "epoch": 2254} {"train_loss": -12.496603965759277, "global_step": 378792, "epoch": 2254} {"train_loss": -12.463499069213867, "global_step": 378793, "epoch": 2254} {"train_loss": -12.353374481201172, "global_step": 378794, "epoch": 2254} {"train_loss": -12.66092586517334, "global_step": 378795, "epoch": 2254} {"train_loss": -12.35973072052002, "global_step": 378796, "epoch": 2254} {"train_loss": -12.22409439086914, "global_step": 378797, "epoch": 2254} {"train_loss": -12.19760513305664, "global_step": 378798, "epoch": 2254} {"train_loss": -12.217489242553711, "global_step": 378799, "epoch": 2254} {"train_loss": -12.582698822021484, "global_step": 378800, "epoch": 2254} {"train_loss": -12.241083145141602, "global_step": 378801, "epoch": 2254} {"train_loss": -12.582767486572266, "global_step": 378802, "epoch": 2254} {"train_loss": -12.012508392333984, "global_step": 378803, "epoch": 2254} {"train_loss": -12.524332046508789, "global_step": 378804, "epoch": 2254} {"train_loss": -11.987777709960938, "global_step": 378805, "epoch": 2254} {"train_loss": -12.420511245727539, "global_step": 378806, "epoch": 2254} {"train_loss": -10.575014114379883, "global_step": 378807, "epoch": 2254} {"train_loss": -12.625518798828125, "global_step": 378808, "epoch": 2254} {"train_loss": -12.352829933166504, "global_step": 378809, "epoch": 2254} {"train_loss": -12.353489875793457, "global_step": 378810, "epoch": 2254} {"train_loss": -12.357078552246094, "global_step": 378811, "epoch": 2254} {"train_loss": -12.154851913452148, "global_step": 378812, "epoch": 2254} {"train_loss": -12.008564949035645, "global_step": 378813, "epoch": 2254} {"train_loss": -12.274620056152344, "global_step": 378814, "epoch": 2254} {"train_loss": -12.344863891601562, "global_step": 378815, "epoch": 2254} {"train_loss": -11.605319023132324, "global_step": 378816, "epoch": 2254} {"train_loss": -12.293724060058594, "global_step": 378817, "epoch": 2254} {"train_loss": -12.477701187133789, "global_step": 378818, "epoch": 2254} {"train_loss": -11.740997314453125, "global_step": 378819, "epoch": 2254} {"train_loss": -11.90739631652832, "global_step": 378820, "epoch": 2254} {"train_loss": -12.083120346069336, "global_step": 378821, "epoch": 2254} {"train_loss": -12.181564331054688, "global_step": 378822, "epoch": 2254} {"train_loss": -12.01144790649414, "global_step": 378823, "epoch": 2254} {"train_loss": -11.930383682250977, "global_step": 378824, "epoch": 2254} {"train_loss": -11.80440902709961, "global_step": 378825, "epoch": 2254} {"train_loss": -12.177485466003418, "global_step": 378826, "epoch": 2254} {"train_loss": -12.042668342590332, "global_step": 378827, "epoch": 2254} {"train_loss": -11.762161254882812, "global_step": 378828, "epoch": 2254} {"train_loss": -11.96615982055664, "global_step": 378829, "epoch": 2254} {"train_loss": -11.589826583862305, "global_step": 378830, "epoch": 2254} {"train_loss": -12.019059181213379, "global_step": 378831, "epoch": 2254} {"train_loss": -12.233503341674805, "global_step": 378832, "epoch": 2254} {"train_loss": -11.79840087890625, "global_step": 378833, "epoch": 2254} {"train_loss": -12.28013801574707, "global_step": 378834, "epoch": 2254} {"train_loss": -12.298852920532227, "global_step": 378835, "epoch": 2254} {"train_loss": -12.325052261352539, "global_step": 378836, "epoch": 2254} {"train_loss": -11.931875228881836, "global_step": 378837, "epoch": 2254} {"train_loss": -12.484195709228516, "global_step": 378838, "epoch": 2254} {"train_loss": -11.7059139808019, "global_step": 378839, "epoch": 2254, "val_loss": 288641.9375} {"train_loss": -12.116886138916016, "global_step": 378840, "epoch": 2255} {"train_loss": -12.464888572692871, "global_step": 378841, "epoch": 2255} {"train_loss": -12.134871482849121, "global_step": 378842, "epoch": 2255} {"train_loss": -11.952535629272461, "global_step": 378843, "epoch": 2255} {"train_loss": -11.612140655517578, "global_step": 378844, "epoch": 2255} {"train_loss": -12.2064208984375, "global_step": 378845, "epoch": 2255} {"train_loss": -12.039061546325684, "global_step": 378846, "epoch": 2255} {"train_loss": -12.108987808227539, "global_step": 378847, "epoch": 2255} {"train_loss": -12.236690521240234, "global_step": 378848, "epoch": 2255} {"train_loss": -11.77864933013916, "global_step": 378849, "epoch": 2255} {"train_loss": -12.404753684997559, "global_step": 378850, "epoch": 2255} {"train_loss": -12.349617958068848, "global_step": 378851, "epoch": 2255} {"train_loss": -12.232728958129883, "global_step": 378852, "epoch": 2255} {"train_loss": -12.465871810913086, "global_step": 378853, "epoch": 2255} {"train_loss": -11.64699935913086, "global_step": 378854, "epoch": 2255} {"train_loss": -12.137948989868164, "global_step": 378855, "epoch": 2255} {"train_loss": -12.162446022033691, "global_step": 378856, "epoch": 2255} {"train_loss": -12.195505142211914, "global_step": 378857, "epoch": 2255} {"train_loss": -12.351581573486328, "global_step": 378858, "epoch": 2255} {"train_loss": -11.871867179870605, "global_step": 378859, "epoch": 2255} {"train_loss": -12.2174072265625, "global_step": 378860, "epoch": 2255} {"train_loss": -12.284246444702148, "global_step": 378861, "epoch": 2255} {"train_loss": -12.563794136047363, "global_step": 378862, "epoch": 2255} {"train_loss": -12.152531623840332, "global_step": 378863, "epoch": 2255} {"train_loss": -12.056358337402344, "global_step": 378864, "epoch": 2255} {"train_loss": -11.405380249023438, "global_step": 378865, "epoch": 2255} {"train_loss": -11.992931365966797, "global_step": 378866, "epoch": 2255} {"train_loss": -11.960601806640625, "global_step": 378867, "epoch": 2255} {"train_loss": -12.289421081542969, "global_step": 378868, "epoch": 2255} {"train_loss": -12.341081619262695, "global_step": 378869, "epoch": 2255} {"train_loss": -12.558675765991211, "global_step": 378870, "epoch": 2255} {"train_loss": -11.71403694152832, "global_step": 378871, "epoch": 2255} {"train_loss": -11.963213920593262, "global_step": 378872, "epoch": 2255} {"train_loss": -12.330473899841309, "global_step": 378873, "epoch": 2255} {"train_loss": -12.257122039794922, "global_step": 378874, "epoch": 2255} {"train_loss": -11.944637298583984, "global_step": 378875, "epoch": 2255} {"train_loss": -12.123932838439941, "global_step": 378876, "epoch": 2255} {"train_loss": -12.22215461730957, "global_step": 378877, "epoch": 2255} {"train_loss": -12.418314933776855, "global_step": 378878, "epoch": 2255} {"train_loss": -11.24005126953125, "global_step": 378879, "epoch": 2255} {"train_loss": -12.082204818725586, "global_step": 378880, "epoch": 2255} {"train_loss": -11.744909286499023, "global_step": 378881, "epoch": 2255} {"train_loss": -12.054559707641602, "global_step": 378882, "epoch": 2255} {"train_loss": -11.565621376037598, "global_step": 378883, "epoch": 2255} {"train_loss": -10.829797744750977, "global_step": 378884, "epoch": 2255} {"train_loss": -11.635719299316406, "global_step": 378885, "epoch": 2255} {"train_loss": -11.569319725036621, "global_step": 378886, "epoch": 2255} {"train_loss": -12.126670837402344, "global_step": 378887, "epoch": 2255} {"train_loss": -11.142969131469727, "global_step": 378888, "epoch": 2255} {"train_loss": -12.186744689941406, "global_step": 378889, "epoch": 2255} {"train_loss": -12.161846160888672, "global_step": 378890, "epoch": 2255} {"train_loss": -11.284564018249512, "global_step": 378891, "epoch": 2255} {"train_loss": -11.568330764770508, "global_step": 378892, "epoch": 2255} {"train_loss": -12.199538230895996, "global_step": 378893, "epoch": 2255} {"train_loss": -11.612805366516113, "global_step": 378894, "epoch": 2255} {"train_loss": -11.196514129638672, "global_step": 378895, "epoch": 2255} {"train_loss": -12.233816146850586, "global_step": 378896, "epoch": 2255} {"train_loss": -11.729543685913086, "global_step": 378897, "epoch": 2255} {"train_loss": -11.715391159057617, "global_step": 378898, "epoch": 2255} {"train_loss": -12.406326293945312, "global_step": 378899, "epoch": 2255} {"train_loss": -11.736634254455566, "global_step": 378900, "epoch": 2255} {"train_loss": -11.301482200622559, "global_step": 378901, "epoch": 2255} {"train_loss": -12.093754768371582, "global_step": 378902, "epoch": 2255} {"train_loss": -11.938745498657227, "global_step": 378903, "epoch": 2255} {"train_loss": -11.426501274108887, "global_step": 378904, "epoch": 2255} {"train_loss": -12.36630916595459, "global_step": 378905, "epoch": 2255} {"train_loss": -11.583480834960938, "global_step": 378906, "epoch": 2255} {"train_loss": -11.162924766540527, "global_step": 378907, "epoch": 2255} {"train_loss": -12.015275955200195, "global_step": 378908, "epoch": 2255} {"train_loss": -11.361006736755371, "global_step": 378909, "epoch": 2255} {"train_loss": -12.16313648223877, "global_step": 378910, "epoch": 2255} {"train_loss": -11.788436889648438, "global_step": 378911, "epoch": 2255} {"train_loss": -11.479342460632324, "global_step": 378912, "epoch": 2255} {"train_loss": -12.27268123626709, "global_step": 378913, "epoch": 2255} {"train_loss": -11.707219123840332, "global_step": 378914, "epoch": 2255} {"train_loss": -11.757981300354004, "global_step": 378915, "epoch": 2255} {"train_loss": -11.757915496826172, "global_step": 378916, "epoch": 2255} {"train_loss": -11.695384979248047, "global_step": 378917, "epoch": 2255} {"train_loss": -11.607982635498047, "global_step": 378918, "epoch": 2255} {"train_loss": -10.91734504699707, "global_step": 378919, "epoch": 2255} {"train_loss": -12.118271827697754, "global_step": 378920, "epoch": 2255} {"train_loss": -11.443731307983398, "global_step": 378921, "epoch": 2255} {"train_loss": -11.341651916503906, "global_step": 378922, "epoch": 2255} {"train_loss": -11.699491500854492, "global_step": 378923, "epoch": 2255} {"train_loss": -11.564011573791504, "global_step": 378924, "epoch": 2255} {"train_loss": -9.937162399291992, "global_step": 378925, "epoch": 2255} {"train_loss": -11.998113632202148, "global_step": 378926, "epoch": 2255} {"train_loss": -11.533449172973633, "global_step": 378927, "epoch": 2255} {"train_loss": -11.822538375854492, "global_step": 378928, "epoch": 2255} {"train_loss": -10.725139617919922, "global_step": 378929, "epoch": 2255} {"train_loss": -11.76809310913086, "global_step": 378930, "epoch": 2255} {"train_loss": -11.165651321411133, "global_step": 378931, "epoch": 2255} {"train_loss": -11.29375171661377, "global_step": 378932, "epoch": 2255} {"train_loss": -10.650703430175781, "global_step": 378933, "epoch": 2255} {"train_loss": -11.246524810791016, "global_step": 378934, "epoch": 2255} {"train_loss": -11.143099784851074, "global_step": 378935, "epoch": 2255} {"train_loss": -11.324350357055664, "global_step": 378936, "epoch": 2255} {"train_loss": -11.8663911819458, "global_step": 378937, "epoch": 2255} {"train_loss": -11.61782455444336, "global_step": 378938, "epoch": 2255} {"train_loss": -11.81071949005127, "global_step": 378939, "epoch": 2255} {"train_loss": -11.772550582885742, "global_step": 378940, "epoch": 2255} {"train_loss": -12.090771675109863, "global_step": 378941, "epoch": 2255} {"train_loss": -11.618278503417969, "global_step": 378942, "epoch": 2255} {"train_loss": -12.019227981567383, "global_step": 378943, "epoch": 2255} {"train_loss": -11.666078567504883, "global_step": 378944, "epoch": 2255} {"train_loss": -11.798846244812012, "global_step": 378945, "epoch": 2255} {"train_loss": -11.92640495300293, "global_step": 378946, "epoch": 2255} {"train_loss": -11.810131072998047, "global_step": 378947, "epoch": 2255} {"train_loss": -11.924482345581055, "global_step": 378948, "epoch": 2255} {"train_loss": -12.13541030883789, "global_step": 378949, "epoch": 2255} {"train_loss": -12.052059173583984, "global_step": 378950, "epoch": 2255} {"train_loss": -12.015447616577148, "global_step": 378951, "epoch": 2255} {"train_loss": -12.183937072753906, "global_step": 378952, "epoch": 2255} {"train_loss": -11.923446655273438, "global_step": 378953, "epoch": 2255} {"train_loss": -12.0155611038208, "global_step": 378954, "epoch": 2255} {"train_loss": -11.672794342041016, "global_step": 378955, "epoch": 2255} {"train_loss": -11.715587615966797, "global_step": 378956, "epoch": 2255} {"train_loss": -12.230757713317871, "global_step": 378957, "epoch": 2255} {"train_loss": -11.820991516113281, "global_step": 378958, "epoch": 2255} {"train_loss": -12.056940078735352, "global_step": 378959, "epoch": 2255} {"train_loss": -11.802366256713867, "global_step": 378960, "epoch": 2255} {"train_loss": -11.969053268432617, "global_step": 378961, "epoch": 2255} {"train_loss": -11.644433975219727, "global_step": 378962, "epoch": 2255} {"train_loss": -11.938913345336914, "global_step": 378963, "epoch": 2255} {"train_loss": -11.443868637084961, "global_step": 378964, "epoch": 2255} {"train_loss": -11.682612419128418, "global_step": 378965, "epoch": 2255} {"train_loss": -11.858661651611328, "global_step": 378966, "epoch": 2255} {"train_loss": -11.563949584960938, "global_step": 378967, "epoch": 2255} {"train_loss": -11.875356674194336, "global_step": 378968, "epoch": 2255} {"train_loss": -12.06342887878418, "global_step": 378969, "epoch": 2255} {"train_loss": -11.666488647460938, "global_step": 378970, "epoch": 2255} {"train_loss": -12.071444511413574, "global_step": 378971, "epoch": 2255} {"train_loss": -11.998685836791992, "global_step": 378972, "epoch": 2255} {"train_loss": -12.199981689453125, "global_step": 378973, "epoch": 2255} {"train_loss": -12.128438949584961, "global_step": 378974, "epoch": 2255} {"train_loss": -12.002944946289062, "global_step": 378975, "epoch": 2255} {"train_loss": -11.643274307250977, "global_step": 378976, "epoch": 2255} {"train_loss": -12.320865631103516, "global_step": 378977, "epoch": 2255} {"train_loss": -11.949201583862305, "global_step": 378978, "epoch": 2255} {"train_loss": -12.109955787658691, "global_step": 378979, "epoch": 2255} {"train_loss": -12.404427528381348, "global_step": 378980, "epoch": 2255} {"train_loss": -11.999691009521484, "global_step": 378981, "epoch": 2255} {"train_loss": -12.37660026550293, "global_step": 378982, "epoch": 2255} {"train_loss": -12.186952590942383, "global_step": 378983, "epoch": 2255} {"train_loss": -12.247383117675781, "global_step": 378984, "epoch": 2255} {"train_loss": -12.314931869506836, "global_step": 378985, "epoch": 2255} {"train_loss": -12.190666198730469, "global_step": 378986, "epoch": 2255} {"train_loss": -12.043903350830078, "global_step": 378987, "epoch": 2255} {"train_loss": -12.330546379089355, "global_step": 378988, "epoch": 2255} {"train_loss": -12.008074760437012, "global_step": 378989, "epoch": 2255} {"train_loss": -12.452478408813477, "global_step": 378990, "epoch": 2255} {"train_loss": -12.25171947479248, "global_step": 378991, "epoch": 2255} {"train_loss": -12.059710502624512, "global_step": 378992, "epoch": 2255} {"train_loss": -12.280109405517578, "global_step": 378993, "epoch": 2255} {"train_loss": -12.008960723876953, "global_step": 378994, "epoch": 2255} {"train_loss": -12.028070449829102, "global_step": 378995, "epoch": 2255} {"train_loss": -12.123563766479492, "global_step": 378996, "epoch": 2255} {"train_loss": -11.634550094604492, "global_step": 378997, "epoch": 2255} {"train_loss": -12.037864685058594, "global_step": 378998, "epoch": 2255} {"train_loss": -12.057525634765625, "global_step": 378999, "epoch": 2255} {"train_loss": -12.255117416381836, "global_step": 379000, "epoch": 2255} {"train_loss": -11.919523239135742, "global_step": 379001, "epoch": 2255} {"train_loss": -12.231327056884766, "global_step": 379002, "epoch": 2255} {"train_loss": -12.178187370300293, "global_step": 379003, "epoch": 2255} {"train_loss": -12.066072463989258, "global_step": 379004, "epoch": 2255} {"train_loss": -12.160913467407227, "global_step": 379005, "epoch": 2255} {"train_loss": -12.198175430297852, "global_step": 379006, "epoch": 2255} {"train_loss": -11.89414089634305, "global_step": 379007, "epoch": 2255, "val_loss": 286083.5, "train_action_mse_error": 1.3361892700195312} {"train_loss": -12.236217498779297, "global_step": 379008, "epoch": 2256} {"train_loss": -11.456928253173828, "global_step": 379009, "epoch": 2256} {"train_loss": -11.906952857971191, "global_step": 379010, "epoch": 2256} {"train_loss": -12.054838180541992, "global_step": 379011, "epoch": 2256} {"train_loss": -11.57026481628418, "global_step": 379012, "epoch": 2256} {"train_loss": -11.862039566040039, "global_step": 379013, "epoch": 2256} {"train_loss": -11.715150833129883, "global_step": 379014, "epoch": 2256} {"train_loss": -12.026676177978516, "global_step": 379015, "epoch": 2256} {"train_loss": -11.737804412841797, "global_step": 379016, "epoch": 2256} {"train_loss": -12.01660442352295, "global_step": 379017, "epoch": 2256} {"train_loss": -12.383055686950684, "global_step": 379018, "epoch": 2256} {"train_loss": -12.201190948486328, "global_step": 379019, "epoch": 2256} {"train_loss": -12.056269645690918, "global_step": 379020, "epoch": 2256} {"train_loss": -12.318989753723145, "global_step": 379021, "epoch": 2256} {"train_loss": -12.021295547485352, "global_step": 379022, "epoch": 2256} {"train_loss": -12.470197677612305, "global_step": 379023, "epoch": 2256} {"train_loss": -12.178879737854004, "global_step": 379024, "epoch": 2256} {"train_loss": -12.206554412841797, "global_step": 379025, "epoch": 2256} {"train_loss": -12.101362228393555, "global_step": 379026, "epoch": 2256} {"train_loss": -12.345304489135742, "global_step": 379027, "epoch": 2256} {"train_loss": -12.012849807739258, "global_step": 379028, "epoch": 2256} {"train_loss": -12.471563339233398, "global_step": 379029, "epoch": 2256} {"train_loss": -12.336332321166992, "global_step": 379030, "epoch": 2256} {"train_loss": -12.111905097961426, "global_step": 379031, "epoch": 2256} {"train_loss": -12.233414649963379, "global_step": 379032, "epoch": 2256} {"train_loss": -11.77318000793457, "global_step": 379033, "epoch": 2256} {"train_loss": -12.140016555786133, "global_step": 379034, "epoch": 2256} {"train_loss": -11.415648460388184, "global_step": 379035, "epoch": 2256} {"train_loss": -12.118692398071289, "global_step": 379036, "epoch": 2256} {"train_loss": -12.079570770263672, "global_step": 379037, "epoch": 2256} {"train_loss": -12.109245300292969, "global_step": 379038, "epoch": 2256} {"train_loss": -12.475007057189941, "global_step": 379039, "epoch": 2256} {"train_loss": -11.9083251953125, "global_step": 379040, "epoch": 2256} {"train_loss": -12.576732635498047, "global_step": 379041, "epoch": 2256} {"train_loss": -12.06246566772461, "global_step": 379042, "epoch": 2256} {"train_loss": -11.132004737854004, "global_step": 379043, "epoch": 2256} {"train_loss": -10.831931114196777, "global_step": 379044, "epoch": 2256} {"train_loss": -11.887360572814941, "global_step": 379045, "epoch": 2256} {"train_loss": -11.152275085449219, "global_step": 379046, "epoch": 2256} {"train_loss": -11.4944486618042, "global_step": 379047, "epoch": 2256} {"train_loss": -11.97638988494873, "global_step": 379048, "epoch": 2256} {"train_loss": -11.08106803894043, "global_step": 379049, "epoch": 2256} {"train_loss": -11.64322566986084, "global_step": 379050, "epoch": 2256} {"train_loss": -10.805322647094727, "global_step": 379051, "epoch": 2256} {"train_loss": -10.668498039245605, "global_step": 379052, "epoch": 2256} {"train_loss": -10.266888618469238, "global_step": 379053, "epoch": 2256} {"train_loss": -10.629417419433594, "global_step": 379054, "epoch": 2256} {"train_loss": -11.343948364257812, "global_step": 379055, "epoch": 2256} {"train_loss": -9.879895210266113, "global_step": 379056, "epoch": 2256} {"train_loss": -9.42398738861084, "global_step": 379057, "epoch": 2256} {"train_loss": -8.018139839172363, "global_step": 379058, "epoch": 2256} {"train_loss": -9.01094913482666, "global_step": 379059, "epoch": 2256} {"train_loss": -9.85586166381836, "global_step": 379060, "epoch": 2256} {"train_loss": -9.560640335083008, "global_step": 379061, "epoch": 2256} {"train_loss": -10.56347370147705, "global_step": 379062, "epoch": 2256} {"train_loss": -10.669877052307129, "global_step": 379063, "epoch": 2256} {"train_loss": -10.386746406555176, "global_step": 379064, "epoch": 2256} {"train_loss": -10.942556381225586, "global_step": 379065, "epoch": 2256} {"train_loss": -11.354798316955566, "global_step": 379066, "epoch": 2256} {"train_loss": -10.681397438049316, "global_step": 379067, "epoch": 2256} {"train_loss": -10.541329383850098, "global_step": 379068, "epoch": 2256} {"train_loss": -11.71978759765625, "global_step": 379069, "epoch": 2256} {"train_loss": -10.452220916748047, "global_step": 379070, "epoch": 2256} {"train_loss": -11.838617324829102, "global_step": 379071, "epoch": 2256} {"train_loss": -11.309795379638672, "global_step": 379072, "epoch": 2256} {"train_loss": -11.789052963256836, "global_step": 379073, "epoch": 2256} {"train_loss": -11.991104125976562, "global_step": 379074, "epoch": 2256} {"train_loss": -11.401102066040039, "global_step": 379075, "epoch": 2256} {"train_loss": -11.914398193359375, "global_step": 379076, "epoch": 2256} {"train_loss": -11.513764381408691, "global_step": 379077, "epoch": 2256} {"train_loss": -11.866031646728516, "global_step": 379078, "epoch": 2256} {"train_loss": -12.283868789672852, "global_step": 379079, "epoch": 2256} {"train_loss": -11.890950202941895, "global_step": 379080, "epoch": 2256} {"train_loss": -12.26003646850586, "global_step": 379081, "epoch": 2256} {"train_loss": -11.8934326171875, "global_step": 379082, "epoch": 2256} {"train_loss": -12.300948143005371, "global_step": 379083, "epoch": 2256} {"train_loss": -12.105000495910645, "global_step": 379084, "epoch": 2256} {"train_loss": -11.954849243164062, "global_step": 379085, "epoch": 2256} {"train_loss": -11.879619598388672, "global_step": 379086, "epoch": 2256} {"train_loss": -12.267610549926758, "global_step": 379087, "epoch": 2256} {"train_loss": -12.083234786987305, "global_step": 379088, "epoch": 2256} {"train_loss": -12.184547424316406, "global_step": 379089, "epoch": 2256} {"train_loss": -12.247262954711914, "global_step": 379090, "epoch": 2256} {"train_loss": -12.396714210510254, "global_step": 379091, "epoch": 2256} {"train_loss": -12.213165283203125, "global_step": 379092, "epoch": 2256} {"train_loss": -11.971833229064941, "global_step": 379093, "epoch": 2256} {"train_loss": -12.14600944519043, "global_step": 379094, "epoch": 2256} {"train_loss": -12.387051582336426, "global_step": 379095, "epoch": 2256} {"train_loss": -12.294755935668945, "global_step": 379096, "epoch": 2256} {"train_loss": -12.345847129821777, "global_step": 379097, "epoch": 2256} {"train_loss": -12.184322357177734, "global_step": 379098, "epoch": 2256} {"train_loss": -12.457966804504395, "global_step": 379099, "epoch": 2256} {"train_loss": -12.43480110168457, "global_step": 379100, "epoch": 2256} {"train_loss": -12.30276107788086, "global_step": 379101, "epoch": 2256} {"train_loss": -12.377150535583496, "global_step": 379102, "epoch": 2256} {"train_loss": -12.154911041259766, "global_step": 379103, "epoch": 2256} {"train_loss": -12.354198455810547, "global_step": 379104, "epoch": 2256} {"train_loss": -12.093765258789062, "global_step": 379105, "epoch": 2256} {"train_loss": -12.124643325805664, "global_step": 379106, "epoch": 2256} {"train_loss": -12.456705093383789, "global_step": 379107, "epoch": 2256} {"train_loss": -12.139823913574219, "global_step": 379108, "epoch": 2256} {"train_loss": -12.326168060302734, "global_step": 379109, "epoch": 2256} {"train_loss": -12.330228805541992, "global_step": 379110, "epoch": 2256} {"train_loss": -12.20419692993164, "global_step": 379111, "epoch": 2256} {"train_loss": -12.390085220336914, "global_step": 379112, "epoch": 2256} {"train_loss": -12.417877197265625, "global_step": 379113, "epoch": 2256} {"train_loss": -12.294595718383789, "global_step": 379114, "epoch": 2256} {"train_loss": -12.547233581542969, "global_step": 379115, "epoch": 2256} {"train_loss": -12.444975852966309, "global_step": 379116, "epoch": 2256} {"train_loss": -12.426919937133789, "global_step": 379117, "epoch": 2256} {"train_loss": -12.565025329589844, "global_step": 379118, "epoch": 2256} {"train_loss": -12.48226547241211, "global_step": 379119, "epoch": 2256} {"train_loss": -12.467340469360352, "global_step": 379120, "epoch": 2256} {"train_loss": -12.39264965057373, "global_step": 379121, "epoch": 2256} {"train_loss": -12.431078910827637, "global_step": 379122, "epoch": 2256} {"train_loss": -12.486780166625977, "global_step": 379123, "epoch": 2256} {"train_loss": -12.324918746948242, "global_step": 379124, "epoch": 2256} {"train_loss": -12.634804725646973, "global_step": 379125, "epoch": 2256} {"train_loss": -12.512666702270508, "global_step": 379126, "epoch": 2256} {"train_loss": -12.61324691772461, "global_step": 379127, "epoch": 2256} {"train_loss": -12.512547492980957, "global_step": 379128, "epoch": 2256} {"train_loss": -12.421220779418945, "global_step": 379129, "epoch": 2256} {"train_loss": -12.77971076965332, "global_step": 379130, "epoch": 2256} {"train_loss": -12.77792739868164, "global_step": 379131, "epoch": 2256} {"train_loss": -12.768881797790527, "global_step": 379132, "epoch": 2256} {"train_loss": -12.612957954406738, "global_step": 379133, "epoch": 2256} {"train_loss": -12.666175842285156, "global_step": 379134, "epoch": 2256} {"train_loss": -12.744492530822754, "global_step": 379135, "epoch": 2256} {"train_loss": -12.660438537597656, "global_step": 379136, "epoch": 2256} {"train_loss": -12.670611381530762, "global_step": 379137, "epoch": 2256} {"train_loss": -12.598249435424805, "global_step": 379138, "epoch": 2256} {"train_loss": -12.671608924865723, "global_step": 379139, "epoch": 2256} {"train_loss": -12.669328689575195, "global_step": 379140, "epoch": 2256} {"train_loss": -12.250469207763672, "global_step": 379141, "epoch": 2256} {"train_loss": -12.69127082824707, "global_step": 379142, "epoch": 2256} {"train_loss": -12.572454452514648, "global_step": 379143, "epoch": 2256} {"train_loss": -12.562262535095215, "global_step": 379144, "epoch": 2256} {"train_loss": -12.530010223388672, "global_step": 379145, "epoch": 2256} {"train_loss": -12.726677894592285, "global_step": 379146, "epoch": 2256} {"train_loss": -12.702644348144531, "global_step": 379147, "epoch": 2256} {"train_loss": -12.580480575561523, "global_step": 379148, "epoch": 2256} {"train_loss": -12.812345504760742, "global_step": 379149, "epoch": 2256} {"train_loss": -12.77724552154541, "global_step": 379150, "epoch": 2256} {"train_loss": -12.80691146850586, "global_step": 379151, "epoch": 2256} {"train_loss": -12.777386665344238, "global_step": 379152, "epoch": 2256} {"train_loss": -12.600380897521973, "global_step": 379153, "epoch": 2256} {"train_loss": -12.534490585327148, "global_step": 379154, "epoch": 2256} {"train_loss": -12.075264930725098, "global_step": 379155, "epoch": 2256} {"train_loss": -12.169788360595703, "global_step": 379156, "epoch": 2256} {"train_loss": -12.493705749511719, "global_step": 379157, "epoch": 2256} {"train_loss": -12.458589553833008, "global_step": 379158, "epoch": 2256} {"train_loss": -12.042537689208984, "global_step": 379159, "epoch": 2256} {"train_loss": -12.4588623046875, "global_step": 379160, "epoch": 2256} {"train_loss": -12.146928787231445, "global_step": 379161, "epoch": 2256} {"train_loss": -11.359025955200195, "global_step": 379162, "epoch": 2256} {"train_loss": -11.830028533935547, "global_step": 379163, "epoch": 2256} {"train_loss": -12.424464225769043, "global_step": 379164, "epoch": 2256} {"train_loss": -11.32243824005127, "global_step": 379165, "epoch": 2256} {"train_loss": -10.430120468139648, "global_step": 379166, "epoch": 2256} {"train_loss": -11.66357135772705, "global_step": 379167, "epoch": 2256} {"train_loss": -7.799165725708008, "global_step": 379168, "epoch": 2256} {"train_loss": -9.50808334350586, "global_step": 379169, "epoch": 2256} {"train_loss": -8.00240421295166, "global_step": 379170, "epoch": 2256} {"train_loss": -8.095293045043945, "global_step": 379171, "epoch": 2256} {"train_loss": -9.580984115600586, "global_step": 379172, "epoch": 2256} {"train_loss": -8.452674865722656, "global_step": 379173, "epoch": 2256} {"train_loss": -7.6103596687316895, "global_step": 379174, "epoch": 2256} {"train_loss": -11.785979211330414, "global_step": 379175, "epoch": 2256, "val_loss": 288167.78125} {"train_loss": -8.736800193786621, "global_step": 379176, "epoch": 2257} {"train_loss": -9.506983757019043, "global_step": 379177, "epoch": 2257} {"train_loss": -8.667236328125, "global_step": 379178, "epoch": 2257} {"train_loss": -7.662319183349609, "global_step": 379179, "epoch": 2257} {"train_loss": -9.64622974395752, "global_step": 379180, "epoch": 2257} {"train_loss": -10.439972877502441, "global_step": 379181, "epoch": 2257} {"train_loss": -8.999466896057129, "global_step": 379182, "epoch": 2257} {"train_loss": -10.535255432128906, "global_step": 379183, "epoch": 2257} {"train_loss": -9.278650283813477, "global_step": 379184, "epoch": 2257} {"train_loss": -8.744388580322266, "global_step": 379185, "epoch": 2257} {"train_loss": -11.071667671203613, "global_step": 379186, "epoch": 2257} {"train_loss": -9.805606842041016, "global_step": 379187, "epoch": 2257} {"train_loss": -10.673484802246094, "global_step": 379188, "epoch": 2257} {"train_loss": -10.387316703796387, "global_step": 379189, "epoch": 2257} {"train_loss": -11.042957305908203, "global_step": 379190, "epoch": 2257} {"train_loss": -10.601005554199219, "global_step": 379191, "epoch": 2257} {"train_loss": -10.589889526367188, "global_step": 379192, "epoch": 2257} {"train_loss": -10.272878646850586, "global_step": 379193, "epoch": 2257} {"train_loss": -10.984947204589844, "global_step": 379194, "epoch": 2257} {"train_loss": -11.163749694824219, "global_step": 379195, "epoch": 2257} {"train_loss": -11.314471244812012, "global_step": 379196, "epoch": 2257} {"train_loss": -11.237537384033203, "global_step": 379197, "epoch": 2257} {"train_loss": -11.84678840637207, "global_step": 379198, "epoch": 2257} {"train_loss": -11.285913467407227, "global_step": 379199, "epoch": 2257} {"train_loss": -11.432586669921875, "global_step": 379200, "epoch": 2257} {"train_loss": -11.146489143371582, "global_step": 379201, "epoch": 2257} {"train_loss": -11.472345352172852, "global_step": 379202, "epoch": 2257} {"train_loss": -11.620046615600586, "global_step": 379203, "epoch": 2257} {"train_loss": -11.303901672363281, "global_step": 379204, "epoch": 2257} {"train_loss": -11.609891891479492, "global_step": 379205, "epoch": 2257} {"train_loss": -11.241108894348145, "global_step": 379206, "epoch": 2257} {"train_loss": -11.336657524108887, "global_step": 379207, "epoch": 2257} {"train_loss": -11.320661544799805, "global_step": 379208, "epoch": 2257} {"train_loss": -11.172433853149414, "global_step": 379209, "epoch": 2257} {"train_loss": -12.062057495117188, "global_step": 379210, "epoch": 2257} {"train_loss": -11.495412826538086, "global_step": 379211, "epoch": 2257} {"train_loss": -11.397645950317383, "global_step": 379212, "epoch": 2257} {"train_loss": -11.786537170410156, "global_step": 379213, "epoch": 2257} {"train_loss": -11.530498504638672, "global_step": 379214, "epoch": 2257} {"train_loss": -12.023109436035156, "global_step": 379215, "epoch": 2257} {"train_loss": -11.491373062133789, "global_step": 379216, "epoch": 2257} {"train_loss": -11.608406066894531, "global_step": 379217, "epoch": 2257} {"train_loss": -11.378717422485352, "global_step": 379218, "epoch": 2257} {"train_loss": -11.809446334838867, "global_step": 379219, "epoch": 2257} {"train_loss": -11.229698181152344, "global_step": 379220, "epoch": 2257} {"train_loss": -12.050049781799316, "global_step": 379221, "epoch": 2257} {"train_loss": -11.607573509216309, "global_step": 379222, "epoch": 2257} {"train_loss": -11.900339126586914, "global_step": 379223, "epoch": 2257} {"train_loss": -11.999776840209961, "global_step": 379224, "epoch": 2257} {"train_loss": -11.45203971862793, "global_step": 379225, "epoch": 2257} {"train_loss": -12.241230010986328, "global_step": 379226, "epoch": 2257} {"train_loss": -11.69890308380127, "global_step": 379227, "epoch": 2257} {"train_loss": -11.851667404174805, "global_step": 379228, "epoch": 2257} {"train_loss": -11.906185150146484, "global_step": 379229, "epoch": 2257} {"train_loss": -11.782523155212402, "global_step": 379230, "epoch": 2257} {"train_loss": -12.2683687210083, "global_step": 379231, "epoch": 2257} {"train_loss": -11.746556282043457, "global_step": 379232, "epoch": 2257} {"train_loss": -11.906360626220703, "global_step": 379233, "epoch": 2257} {"train_loss": -12.26558780670166, "global_step": 379234, "epoch": 2257} {"train_loss": -12.174077987670898, "global_step": 379235, "epoch": 2257} {"train_loss": -12.169816970825195, "global_step": 379236, "epoch": 2257} {"train_loss": -12.233745574951172, "global_step": 379237, "epoch": 2257} {"train_loss": -12.047547340393066, "global_step": 379238, "epoch": 2257} {"train_loss": -12.393548965454102, "global_step": 379239, "epoch": 2257} {"train_loss": -12.060219764709473, "global_step": 379240, "epoch": 2257} {"train_loss": -12.130807876586914, "global_step": 379241, "epoch": 2257} {"train_loss": -12.483606338500977, "global_step": 379242, "epoch": 2257} {"train_loss": -12.049253463745117, "global_step": 379243, "epoch": 2257} {"train_loss": -12.116127014160156, "global_step": 379244, "epoch": 2257} {"train_loss": -12.537374496459961, "global_step": 379245, "epoch": 2257} {"train_loss": -12.211294174194336, "global_step": 379246, "epoch": 2257} {"train_loss": -12.090766906738281, "global_step": 379247, "epoch": 2257} {"train_loss": -12.113526344299316, "global_step": 379248, "epoch": 2257} {"train_loss": -12.473773956298828, "global_step": 379249, "epoch": 2257} {"train_loss": -12.386199951171875, "global_step": 379250, "epoch": 2257} {"train_loss": -12.138769149780273, "global_step": 379251, "epoch": 2257} {"train_loss": -12.484667778015137, "global_step": 379252, "epoch": 2257} {"train_loss": -12.5443115234375, "global_step": 379253, "epoch": 2257} {"train_loss": -12.355754852294922, "global_step": 379254, "epoch": 2257} {"train_loss": -12.245818138122559, "global_step": 379255, "epoch": 2257} {"train_loss": -12.45590591430664, "global_step": 379256, "epoch": 2257} {"train_loss": -12.21621322631836, "global_step": 379257, "epoch": 2257} {"train_loss": -12.216073989868164, "global_step": 379258, "epoch": 2257} {"train_loss": -12.38302993774414, "global_step": 379259, "epoch": 2257} {"train_loss": -12.43671989440918, "global_step": 379260, "epoch": 2257} {"train_loss": -12.472763061523438, "global_step": 379261, "epoch": 2257} {"train_loss": -12.561563491821289, "global_step": 379262, "epoch": 2257} {"train_loss": -12.178723335266113, "global_step": 379263, "epoch": 2257} {"train_loss": -12.298961639404297, "global_step": 379264, "epoch": 2257} {"train_loss": -12.344175338745117, "global_step": 379265, "epoch": 2257} {"train_loss": -12.456573486328125, "global_step": 379266, "epoch": 2257} {"train_loss": -12.710346221923828, "global_step": 379267, "epoch": 2257} {"train_loss": -12.550495147705078, "global_step": 379268, "epoch": 2257} {"train_loss": -12.636038780212402, "global_step": 379269, "epoch": 2257} {"train_loss": -12.548145294189453, "global_step": 379270, "epoch": 2257} {"train_loss": -12.628965377807617, "global_step": 379271, "epoch": 2257} {"train_loss": -12.342639923095703, "global_step": 379272, "epoch": 2257} {"train_loss": -12.499303817749023, "global_step": 379273, "epoch": 2257} {"train_loss": -12.783714294433594, "global_step": 379274, "epoch": 2257} {"train_loss": -12.513603210449219, "global_step": 379275, "epoch": 2257} {"train_loss": -12.33686351776123, "global_step": 379276, "epoch": 2257} {"train_loss": -12.548539161682129, "global_step": 379277, "epoch": 2257} {"train_loss": -12.727117538452148, "global_step": 379278, "epoch": 2257} {"train_loss": -12.63424301147461, "global_step": 379279, "epoch": 2257} {"train_loss": -12.812641143798828, "global_step": 379280, "epoch": 2257} {"train_loss": -12.604942321777344, "global_step": 379281, "epoch": 2257} {"train_loss": -12.754327774047852, "global_step": 379282, "epoch": 2257} {"train_loss": -12.619524955749512, "global_step": 379283, "epoch": 2257} {"train_loss": -12.614116668701172, "global_step": 379284, "epoch": 2257} {"train_loss": -12.401200294494629, "global_step": 379285, "epoch": 2257} {"train_loss": -12.748344421386719, "global_step": 379286, "epoch": 2257} {"train_loss": -12.619729995727539, "global_step": 379287, "epoch": 2257} {"train_loss": -12.381593704223633, "global_step": 379288, "epoch": 2257} {"train_loss": -12.35871696472168, "global_step": 379289, "epoch": 2257} {"train_loss": -12.502415657043457, "global_step": 379290, "epoch": 2257} {"train_loss": -12.741111755371094, "global_step": 379291, "epoch": 2257} {"train_loss": -12.671756744384766, "global_step": 379292, "epoch": 2257} {"train_loss": -12.019485473632812, "global_step": 379293, "epoch": 2257} {"train_loss": -12.301176071166992, "global_step": 379294, "epoch": 2257} {"train_loss": -12.542646408081055, "global_step": 379295, "epoch": 2257} {"train_loss": -12.00803279876709, "global_step": 379296, "epoch": 2257} {"train_loss": -11.76675796508789, "global_step": 379297, "epoch": 2257} {"train_loss": -11.796773910522461, "global_step": 379298, "epoch": 2257} {"train_loss": -11.336925506591797, "global_step": 379299, "epoch": 2257} {"train_loss": -11.501091003417969, "global_step": 379300, "epoch": 2257} {"train_loss": -10.008872985839844, "global_step": 379301, "epoch": 2257} {"train_loss": -10.257793426513672, "global_step": 379302, "epoch": 2257} {"train_loss": -10.493224143981934, "global_step": 379303, "epoch": 2257} {"train_loss": -10.69387149810791, "global_step": 379304, "epoch": 2257} {"train_loss": -10.872255325317383, "global_step": 379305, "epoch": 2257} {"train_loss": -9.95002269744873, "global_step": 379306, "epoch": 2257} {"train_loss": -10.686370849609375, "global_step": 379307, "epoch": 2257} {"train_loss": -10.762842178344727, "global_step": 379308, "epoch": 2257} {"train_loss": -11.457109451293945, "global_step": 379309, "epoch": 2257} {"train_loss": -11.473929405212402, "global_step": 379310, "epoch": 2257} {"train_loss": -10.513261795043945, "global_step": 379311, "epoch": 2257} {"train_loss": -10.755678176879883, "global_step": 379312, "epoch": 2257} {"train_loss": -11.752107620239258, "global_step": 379313, "epoch": 2257} {"train_loss": -11.845566749572754, "global_step": 379314, "epoch": 2257} {"train_loss": -11.745033264160156, "global_step": 379315, "epoch": 2257} {"train_loss": -11.450615882873535, "global_step": 379316, "epoch": 2257} {"train_loss": -12.156755447387695, "global_step": 379317, "epoch": 2257} {"train_loss": -12.065824508666992, "global_step": 379318, "epoch": 2257} {"train_loss": -12.129453659057617, "global_step": 379319, "epoch": 2257} {"train_loss": -11.846556663513184, "global_step": 379320, "epoch": 2257} {"train_loss": -11.646990776062012, "global_step": 379321, "epoch": 2257} {"train_loss": -11.782747268676758, "global_step": 379322, "epoch": 2257} {"train_loss": -12.21353530883789, "global_step": 379323, "epoch": 2257} {"train_loss": -11.817572593688965, "global_step": 379324, "epoch": 2257} {"train_loss": -12.093228340148926, "global_step": 379325, "epoch": 2257} {"train_loss": -12.179585456848145, "global_step": 379326, "epoch": 2257} {"train_loss": -11.939861297607422, "global_step": 379327, "epoch": 2257} {"train_loss": -12.253990173339844, "global_step": 379328, "epoch": 2257} {"train_loss": -12.177943229675293, "global_step": 379329, "epoch": 2257} {"train_loss": -12.387730598449707, "global_step": 379330, "epoch": 2257} {"train_loss": -11.84850025177002, "global_step": 379331, "epoch": 2257} {"train_loss": -12.375175476074219, "global_step": 379332, "epoch": 2257} {"train_loss": -12.00932502746582, "global_step": 379333, "epoch": 2257} {"train_loss": -12.344968795776367, "global_step": 379334, "epoch": 2257} {"train_loss": -12.02772331237793, "global_step": 379335, "epoch": 2257} {"train_loss": -11.497289657592773, "global_step": 379336, "epoch": 2257} {"train_loss": -12.23284912109375, "global_step": 379337, "epoch": 2257} {"train_loss": -12.020467758178711, "global_step": 379338, "epoch": 2257} {"train_loss": -11.879596710205078, "global_step": 379339, "epoch": 2257} {"train_loss": -11.822832107543945, "global_step": 379340, "epoch": 2257} {"train_loss": -12.322858810424805, "global_step": 379341, "epoch": 2257} {"train_loss": -11.874990463256836, "global_step": 379342, "epoch": 2257} {"train_loss": -11.717341655776615, "global_step": 379343, "epoch": 2257, "val_loss": 286964.03125} {"train_loss": -12.110984802246094, "global_step": 379344, "epoch": 2258} {"train_loss": -11.99312973022461, "global_step": 379345, "epoch": 2258} {"train_loss": -12.285423278808594, "global_step": 379346, "epoch": 2258} {"train_loss": -11.93709945678711, "global_step": 379347, "epoch": 2258} {"train_loss": -12.322168350219727, "global_step": 379348, "epoch": 2258} {"train_loss": -12.12060546875, "global_step": 379349, "epoch": 2258} {"train_loss": -12.59305191040039, "global_step": 379350, "epoch": 2258} {"train_loss": -12.062307357788086, "global_step": 379351, "epoch": 2258} {"train_loss": -12.694025039672852, "global_step": 379352, "epoch": 2258} {"train_loss": -11.720052719116211, "global_step": 379353, "epoch": 2258} {"train_loss": -12.291784286499023, "global_step": 379354, "epoch": 2258} {"train_loss": -12.062177658081055, "global_step": 379355, "epoch": 2258} {"train_loss": -12.148019790649414, "global_step": 379356, "epoch": 2258} {"train_loss": -12.387697219848633, "global_step": 379357, "epoch": 2258} {"train_loss": -12.202400207519531, "global_step": 379358, "epoch": 2258} {"train_loss": -12.187870025634766, "global_step": 379359, "epoch": 2258} {"train_loss": -12.444343566894531, "global_step": 379360, "epoch": 2258} {"train_loss": -12.128679275512695, "global_step": 379361, "epoch": 2258} {"train_loss": -12.410825729370117, "global_step": 379362, "epoch": 2258} {"train_loss": -12.505916595458984, "global_step": 379363, "epoch": 2258} {"train_loss": -12.507621765136719, "global_step": 379364, "epoch": 2258} {"train_loss": -12.633465766906738, "global_step": 379365, "epoch": 2258} {"train_loss": -11.618016242980957, "global_step": 379366, "epoch": 2258} {"train_loss": -11.605199813842773, "global_step": 379367, "epoch": 2258} {"train_loss": -12.450484275817871, "global_step": 379368, "epoch": 2258} {"train_loss": -11.228446006774902, "global_step": 379369, "epoch": 2258} {"train_loss": -11.691020011901855, "global_step": 379370, "epoch": 2258} {"train_loss": -11.701130867004395, "global_step": 379371, "epoch": 2258} {"train_loss": -11.866233825683594, "global_step": 379372, "epoch": 2258} {"train_loss": -11.714046478271484, "global_step": 379373, "epoch": 2258} {"train_loss": -11.318702697753906, "global_step": 379374, "epoch": 2258} {"train_loss": -10.564367294311523, "global_step": 379375, "epoch": 2258} {"train_loss": -12.08340072631836, "global_step": 379376, "epoch": 2258} {"train_loss": -11.376579284667969, "global_step": 379377, "epoch": 2258} {"train_loss": -12.339437484741211, "global_step": 379378, "epoch": 2258} {"train_loss": -11.050575256347656, "global_step": 379379, "epoch": 2258} {"train_loss": -12.050217628479004, "global_step": 379380, "epoch": 2258} {"train_loss": -11.115873336791992, "global_step": 379381, "epoch": 2258} {"train_loss": -11.297986030578613, "global_step": 379382, "epoch": 2258} {"train_loss": -12.067516326904297, "global_step": 379383, "epoch": 2258} {"train_loss": -11.685930252075195, "global_step": 379384, "epoch": 2258} {"train_loss": -11.762659072875977, "global_step": 379385, "epoch": 2258} {"train_loss": -12.077482223510742, "global_step": 379386, "epoch": 2258} {"train_loss": -11.738162994384766, "global_step": 379387, "epoch": 2258} {"train_loss": -11.936007499694824, "global_step": 379388, "epoch": 2258} {"train_loss": -12.133722305297852, "global_step": 379389, "epoch": 2258} {"train_loss": -12.302167892456055, "global_step": 379390, "epoch": 2258} {"train_loss": -12.097354888916016, "global_step": 379391, "epoch": 2258} {"train_loss": -12.09154987335205, "global_step": 379392, "epoch": 2258} {"train_loss": -11.749467849731445, "global_step": 379393, "epoch": 2258} {"train_loss": -12.21683406829834, "global_step": 379394, "epoch": 2258} {"train_loss": -11.826935768127441, "global_step": 379395, "epoch": 2258} {"train_loss": -12.105266571044922, "global_step": 379396, "epoch": 2258} {"train_loss": -11.969717025756836, "global_step": 379397, "epoch": 2258} {"train_loss": -12.331844329833984, "global_step": 379398, "epoch": 2258} {"train_loss": -12.001520156860352, "global_step": 379399, "epoch": 2258} {"train_loss": -11.99246883392334, "global_step": 379400, "epoch": 2258} {"train_loss": -12.162799835205078, "global_step": 379401, "epoch": 2258} {"train_loss": -12.198189735412598, "global_step": 379402, "epoch": 2258} {"train_loss": -12.292545318603516, "global_step": 379403, "epoch": 2258} {"train_loss": -12.14263916015625, "global_step": 379404, "epoch": 2258} {"train_loss": -12.448017120361328, "global_step": 379405, "epoch": 2258} {"train_loss": -12.170451164245605, "global_step": 379406, "epoch": 2258} {"train_loss": -12.423157691955566, "global_step": 379407, "epoch": 2258} {"train_loss": -12.319042205810547, "global_step": 379408, "epoch": 2258} {"train_loss": -12.324539184570312, "global_step": 379409, "epoch": 2258} {"train_loss": -12.07821273803711, "global_step": 379410, "epoch": 2258} {"train_loss": -12.311117172241211, "global_step": 379411, "epoch": 2258} {"train_loss": -12.052094459533691, "global_step": 379412, "epoch": 2258} {"train_loss": -12.391057968139648, "global_step": 379413, "epoch": 2258} {"train_loss": -12.200233459472656, "global_step": 379414, "epoch": 2258} {"train_loss": -12.280328750610352, "global_step": 379415, "epoch": 2258} {"train_loss": -12.389545440673828, "global_step": 379416, "epoch": 2258} {"train_loss": -12.408025741577148, "global_step": 379417, "epoch": 2258} {"train_loss": -12.479308128356934, "global_step": 379418, "epoch": 2258} {"train_loss": -12.147904396057129, "global_step": 379419, "epoch": 2258} {"train_loss": -12.394378662109375, "global_step": 379420, "epoch": 2258} {"train_loss": -12.417020797729492, "global_step": 379421, "epoch": 2258} {"train_loss": -12.203750610351562, "global_step": 379422, "epoch": 2258} {"train_loss": -12.566582679748535, "global_step": 379423, "epoch": 2258} {"train_loss": -12.65852165222168, "global_step": 379424, "epoch": 2258} {"train_loss": -12.497270584106445, "global_step": 379425, "epoch": 2258} {"train_loss": -12.571476936340332, "global_step": 379426, "epoch": 2258} {"train_loss": -12.609524726867676, "global_step": 379427, "epoch": 2258} {"train_loss": -12.464179992675781, "global_step": 379428, "epoch": 2258} {"train_loss": -12.32203483581543, "global_step": 379429, "epoch": 2258} {"train_loss": -12.621784210205078, "global_step": 379430, "epoch": 2258} {"train_loss": -12.209046363830566, "global_step": 379431, "epoch": 2258} {"train_loss": -12.368642807006836, "global_step": 379432, "epoch": 2258} {"train_loss": -12.656842231750488, "global_step": 379433, "epoch": 2258} {"train_loss": -12.515483856201172, "global_step": 379434, "epoch": 2258} {"train_loss": -12.388025283813477, "global_step": 379435, "epoch": 2258} {"train_loss": -12.620443344116211, "global_step": 379436, "epoch": 2258} {"train_loss": -11.817005157470703, "global_step": 379437, "epoch": 2258} {"train_loss": -12.184255599975586, "global_step": 379438, "epoch": 2258} {"train_loss": -12.324728012084961, "global_step": 379439, "epoch": 2258} {"train_loss": -12.45751667022705, "global_step": 379440, "epoch": 2258} {"train_loss": -12.132096290588379, "global_step": 379441, "epoch": 2258} {"train_loss": -12.429736137390137, "global_step": 379442, "epoch": 2258} {"train_loss": -12.603805541992188, "global_step": 379443, "epoch": 2258} {"train_loss": -12.053323745727539, "global_step": 379444, "epoch": 2258} {"train_loss": -12.493646621704102, "global_step": 379445, "epoch": 2258} {"train_loss": -12.410754203796387, "global_step": 379446, "epoch": 2258} {"train_loss": -12.700234413146973, "global_step": 379447, "epoch": 2258} {"train_loss": -12.704503059387207, "global_step": 379448, "epoch": 2258} {"train_loss": -12.645545959472656, "global_step": 379449, "epoch": 2258} {"train_loss": -12.426133155822754, "global_step": 379450, "epoch": 2258} {"train_loss": -12.491497039794922, "global_step": 379451, "epoch": 2258} {"train_loss": -11.898957252502441, "global_step": 379452, "epoch": 2258} {"train_loss": -12.751335144042969, "global_step": 379453, "epoch": 2258} {"train_loss": -12.33809757232666, "global_step": 379454, "epoch": 2258} {"train_loss": -12.674878120422363, "global_step": 379455, "epoch": 2258} {"train_loss": -12.468595504760742, "global_step": 379456, "epoch": 2258} {"train_loss": -12.604765892028809, "global_step": 379457, "epoch": 2258} {"train_loss": -12.427227973937988, "global_step": 379458, "epoch": 2258} {"train_loss": -12.578323364257812, "global_step": 379459, "epoch": 2258} {"train_loss": -12.41169261932373, "global_step": 379460, "epoch": 2258} {"train_loss": -12.338539123535156, "global_step": 379461, "epoch": 2258} {"train_loss": -12.29496955871582, "global_step": 379462, "epoch": 2258} {"train_loss": -12.65912914276123, "global_step": 379463, "epoch": 2258} {"train_loss": -12.61179256439209, "global_step": 379464, "epoch": 2258} {"train_loss": -12.393999099731445, "global_step": 379465, "epoch": 2258} {"train_loss": -12.481576919555664, "global_step": 379466, "epoch": 2258} {"train_loss": -12.196906089782715, "global_step": 379467, "epoch": 2258} {"train_loss": -12.288370132446289, "global_step": 379468, "epoch": 2258} {"train_loss": -12.276191711425781, "global_step": 379469, "epoch": 2258} {"train_loss": -12.27613353729248, "global_step": 379470, "epoch": 2258} {"train_loss": -11.933393478393555, "global_step": 379471, "epoch": 2258} {"train_loss": -11.94359302520752, "global_step": 379472, "epoch": 2258} {"train_loss": -12.620662689208984, "global_step": 379473, "epoch": 2258} {"train_loss": -12.60305404663086, "global_step": 379474, "epoch": 2258} {"train_loss": -11.762914657592773, "global_step": 379475, "epoch": 2258} {"train_loss": -12.041374206542969, "global_step": 379476, "epoch": 2258} {"train_loss": -12.155071258544922, "global_step": 379477, "epoch": 2258} {"train_loss": -12.644859313964844, "global_step": 379478, "epoch": 2258} {"train_loss": -11.757654190063477, "global_step": 379479, "epoch": 2258} {"train_loss": -11.26541519165039, "global_step": 379480, "epoch": 2258} {"train_loss": -12.04901123046875, "global_step": 379481, "epoch": 2258} {"train_loss": -12.370416641235352, "global_step": 379482, "epoch": 2258} {"train_loss": -12.400837898254395, "global_step": 379483, "epoch": 2258} {"train_loss": -12.353023529052734, "global_step": 379484, "epoch": 2258} {"train_loss": -12.405352592468262, "global_step": 379485, "epoch": 2258} {"train_loss": -12.104137420654297, "global_step": 379486, "epoch": 2258} {"train_loss": -12.592182159423828, "global_step": 379487, "epoch": 2258} {"train_loss": -11.432820320129395, "global_step": 379488, "epoch": 2258} {"train_loss": -11.236045837402344, "global_step": 379489, "epoch": 2258} {"train_loss": -12.264049530029297, "global_step": 379490, "epoch": 2258} {"train_loss": -12.205345153808594, "global_step": 379491, "epoch": 2258} {"train_loss": -11.169187545776367, "global_step": 379492, "epoch": 2258} {"train_loss": -11.61231803894043, "global_step": 379493, "epoch": 2258} {"train_loss": -11.871712684631348, "global_step": 379494, "epoch": 2258} {"train_loss": -10.10025691986084, "global_step": 379495, "epoch": 2258} {"train_loss": -11.67798900604248, "global_step": 379496, "epoch": 2258} {"train_loss": -11.084579467773438, "global_step": 379497, "epoch": 2258} {"train_loss": -7.965859413146973, "global_step": 379498, "epoch": 2258} {"train_loss": -8.398904800415039, "global_step": 379499, "epoch": 2258} {"train_loss": -9.289795875549316, "global_step": 379500, "epoch": 2258} {"train_loss": -8.267427444458008, "global_step": 379501, "epoch": 2258} {"train_loss": -9.242437362670898, "global_step": 379502, "epoch": 2258} {"train_loss": -8.502922058105469, "global_step": 379503, "epoch": 2258} {"train_loss": -8.779903411865234, "global_step": 379504, "epoch": 2258} {"train_loss": -9.350421905517578, "global_step": 379505, "epoch": 2258} {"train_loss": -9.700182914733887, "global_step": 379506, "epoch": 2258} {"train_loss": -9.438727378845215, "global_step": 379507, "epoch": 2258} {"train_loss": -8.75848388671875, "global_step": 379508, "epoch": 2258} {"train_loss": -8.52665901184082, "global_step": 379509, "epoch": 2258} {"train_loss": -8.51430892944336, "global_step": 379510, "epoch": 2258} {"train_loss": -11.876477678616842, "global_step": 379511, "epoch": 2258, "val_loss": 292306.5} {"train_loss": -10.035192489624023, "global_step": 379512, "epoch": 2259} {"train_loss": -8.609792709350586, "global_step": 379513, "epoch": 2259} {"train_loss": -9.341943740844727, "global_step": 379514, "epoch": 2259} {"train_loss": -9.011699676513672, "global_step": 379515, "epoch": 2259} {"train_loss": -10.94028377532959, "global_step": 379516, "epoch": 2259} {"train_loss": -9.633790969848633, "global_step": 379517, "epoch": 2259} {"train_loss": -10.560687065124512, "global_step": 379518, "epoch": 2259} {"train_loss": -10.46910285949707, "global_step": 379519, "epoch": 2259} {"train_loss": -10.498011589050293, "global_step": 379520, "epoch": 2259} {"train_loss": -9.949246406555176, "global_step": 379521, "epoch": 2259} {"train_loss": -9.940381050109863, "global_step": 379522, "epoch": 2259} {"train_loss": -9.295778274536133, "global_step": 379523, "epoch": 2259} {"train_loss": -11.068904876708984, "global_step": 379524, "epoch": 2259} {"train_loss": -10.837629318237305, "global_step": 379525, "epoch": 2259} {"train_loss": -10.880817413330078, "global_step": 379526, "epoch": 2259} {"train_loss": -10.834600448608398, "global_step": 379527, "epoch": 2259} {"train_loss": -10.717926025390625, "global_step": 379528, "epoch": 2259} {"train_loss": -10.726737976074219, "global_step": 379529, "epoch": 2259} {"train_loss": -11.519532203674316, "global_step": 379530, "epoch": 2259} {"train_loss": -11.074788093566895, "global_step": 379531, "epoch": 2259} {"train_loss": -11.590095520019531, "global_step": 379532, "epoch": 2259} {"train_loss": -11.593490600585938, "global_step": 379533, "epoch": 2259} {"train_loss": -11.416799545288086, "global_step": 379534, "epoch": 2259} {"train_loss": -12.011204719543457, "global_step": 379535, "epoch": 2259} {"train_loss": -11.529312133789062, "global_step": 379536, "epoch": 2259} {"train_loss": -11.502580642700195, "global_step": 379537, "epoch": 2259} {"train_loss": -11.789324760437012, "global_step": 379538, "epoch": 2259} {"train_loss": -11.405731201171875, "global_step": 379539, "epoch": 2259} {"train_loss": -11.08456802368164, "global_step": 379540, "epoch": 2259} {"train_loss": -11.925556182861328, "global_step": 379541, "epoch": 2259} {"train_loss": -11.21091079711914, "global_step": 379542, "epoch": 2259} {"train_loss": -11.83311939239502, "global_step": 379543, "epoch": 2259} {"train_loss": -11.750957489013672, "global_step": 379544, "epoch": 2259} {"train_loss": -11.528482437133789, "global_step": 379545, "epoch": 2259} {"train_loss": -11.952127456665039, "global_step": 379546, "epoch": 2259} {"train_loss": -11.79240894317627, "global_step": 379547, "epoch": 2259} {"train_loss": -11.405131340026855, "global_step": 379548, "epoch": 2259} {"train_loss": -12.067671775817871, "global_step": 379549, "epoch": 2259} {"train_loss": -11.51744556427002, "global_step": 379550, "epoch": 2259} {"train_loss": -11.969487190246582, "global_step": 379551, "epoch": 2259} {"train_loss": -11.942233085632324, "global_step": 379552, "epoch": 2259} {"train_loss": -11.710548400878906, "global_step": 379553, "epoch": 2259} {"train_loss": -11.961767196655273, "global_step": 379554, "epoch": 2259} {"train_loss": -12.033737182617188, "global_step": 379555, "epoch": 2259} {"train_loss": -12.06917667388916, "global_step": 379556, "epoch": 2259} {"train_loss": -12.228313446044922, "global_step": 379557, "epoch": 2259} {"train_loss": -12.207809448242188, "global_step": 379558, "epoch": 2259} {"train_loss": -12.250408172607422, "global_step": 379559, "epoch": 2259} {"train_loss": -12.31527328491211, "global_step": 379560, "epoch": 2259} {"train_loss": -12.093975067138672, "global_step": 379561, "epoch": 2259} {"train_loss": -12.200852394104004, "global_step": 379562, "epoch": 2259} {"train_loss": -12.262186050415039, "global_step": 379563, "epoch": 2259} {"train_loss": -12.303550720214844, "global_step": 379564, "epoch": 2259} {"train_loss": -12.161083221435547, "global_step": 379565, "epoch": 2259} {"train_loss": -12.150932312011719, "global_step": 379566, "epoch": 2259} {"train_loss": -12.28004264831543, "global_step": 379567, "epoch": 2259} {"train_loss": -12.465811729431152, "global_step": 379568, "epoch": 2259} {"train_loss": -12.200370788574219, "global_step": 379569, "epoch": 2259} {"train_loss": -12.261682510375977, "global_step": 379570, "epoch": 2259} {"train_loss": -12.26113510131836, "global_step": 379571, "epoch": 2259} {"train_loss": -12.35338020324707, "global_step": 379572, "epoch": 2259} {"train_loss": -12.382630348205566, "global_step": 379573, "epoch": 2259} {"train_loss": -12.208061218261719, "global_step": 379574, "epoch": 2259} {"train_loss": -12.322668075561523, "global_step": 379575, "epoch": 2259} {"train_loss": -12.529540061950684, "global_step": 379576, "epoch": 2259} {"train_loss": -12.38272476196289, "global_step": 379577, "epoch": 2259} {"train_loss": -12.536447525024414, "global_step": 379578, "epoch": 2259} {"train_loss": -12.476306915283203, "global_step": 379579, "epoch": 2259} {"train_loss": -12.25887680053711, "global_step": 379580, "epoch": 2259} {"train_loss": -12.342033386230469, "global_step": 379581, "epoch": 2259} {"train_loss": -12.18635082244873, "global_step": 379582, "epoch": 2259} {"train_loss": -12.246188163757324, "global_step": 379583, "epoch": 2259} {"train_loss": -12.405517578125, "global_step": 379584, "epoch": 2259} {"train_loss": -12.555302619934082, "global_step": 379585, "epoch": 2259} {"train_loss": -12.521772384643555, "global_step": 379586, "epoch": 2259} {"train_loss": -12.632392883300781, "global_step": 379587, "epoch": 2259} {"train_loss": -12.416473388671875, "global_step": 379588, "epoch": 2259} {"train_loss": -12.497747421264648, "global_step": 379589, "epoch": 2259} {"train_loss": -12.283662796020508, "global_step": 379590, "epoch": 2259} {"train_loss": -12.302192687988281, "global_step": 379591, "epoch": 2259} {"train_loss": -12.507959365844727, "global_step": 379592, "epoch": 2259} {"train_loss": -12.231058120727539, "global_step": 379593, "epoch": 2259} {"train_loss": -12.462028503417969, "global_step": 379594, "epoch": 2259} {"train_loss": -12.23167610168457, "global_step": 379595, "epoch": 2259} {"train_loss": -12.479896545410156, "global_step": 379596, "epoch": 2259} {"train_loss": -12.335205078125, "global_step": 379597, "epoch": 2259} {"train_loss": -12.041040420532227, "global_step": 379598, "epoch": 2259} {"train_loss": -12.643783569335938, "global_step": 379599, "epoch": 2259} {"train_loss": -12.73370361328125, "global_step": 379600, "epoch": 2259} {"train_loss": -12.525688171386719, "global_step": 379601, "epoch": 2259} {"train_loss": -12.32579231262207, "global_step": 379602, "epoch": 2259} {"train_loss": -12.419021606445312, "global_step": 379603, "epoch": 2259} {"train_loss": -12.053869247436523, "global_step": 379604, "epoch": 2259} {"train_loss": -12.592960357666016, "global_step": 379605, "epoch": 2259} {"train_loss": -12.45022201538086, "global_step": 379606, "epoch": 2259} {"train_loss": -12.361090660095215, "global_step": 379607, "epoch": 2259} {"train_loss": -12.648980140686035, "global_step": 379608, "epoch": 2259} {"train_loss": -12.471357345581055, "global_step": 379609, "epoch": 2259} {"train_loss": -12.528493881225586, "global_step": 379610, "epoch": 2259} {"train_loss": -12.59133243560791, "global_step": 379611, "epoch": 2259} {"train_loss": -12.50159740447998, "global_step": 379612, "epoch": 2259} {"train_loss": -12.509236335754395, "global_step": 379613, "epoch": 2259} {"train_loss": -12.675738334655762, "global_step": 379614, "epoch": 2259} {"train_loss": -12.533380508422852, "global_step": 379615, "epoch": 2259} {"train_loss": -12.496461868286133, "global_step": 379616, "epoch": 2259} {"train_loss": -12.52670669555664, "global_step": 379617, "epoch": 2259} {"train_loss": -12.5593900680542, "global_step": 379618, "epoch": 2259} {"train_loss": -12.540864944458008, "global_step": 379619, "epoch": 2259} {"train_loss": -12.601499557495117, "global_step": 379620, "epoch": 2259} {"train_loss": -12.594108581542969, "global_step": 379621, "epoch": 2259} {"train_loss": -12.635808944702148, "global_step": 379622, "epoch": 2259} {"train_loss": -12.410161972045898, "global_step": 379623, "epoch": 2259} {"train_loss": -12.398693084716797, "global_step": 379624, "epoch": 2259} {"train_loss": -12.497671127319336, "global_step": 379625, "epoch": 2259} {"train_loss": -12.343782424926758, "global_step": 379626, "epoch": 2259} {"train_loss": -12.510295867919922, "global_step": 379627, "epoch": 2259} {"train_loss": -11.77823257446289, "global_step": 379628, "epoch": 2259} {"train_loss": -12.485258102416992, "global_step": 379629, "epoch": 2259} {"train_loss": -11.142930030822754, "global_step": 379630, "epoch": 2259} {"train_loss": -12.285880088806152, "global_step": 379631, "epoch": 2259} {"train_loss": -11.97278118133545, "global_step": 379632, "epoch": 2259} {"train_loss": -11.621837615966797, "global_step": 379633, "epoch": 2259} {"train_loss": -11.685173034667969, "global_step": 379634, "epoch": 2259} {"train_loss": -11.198225021362305, "global_step": 379635, "epoch": 2259} {"train_loss": -10.245511054992676, "global_step": 379636, "epoch": 2259} {"train_loss": -10.391603469848633, "global_step": 379637, "epoch": 2259} {"train_loss": -9.826361656188965, "global_step": 379638, "epoch": 2259} {"train_loss": -8.94489860534668, "global_step": 379639, "epoch": 2259} {"train_loss": -9.34653091430664, "global_step": 379640, "epoch": 2259} {"train_loss": -9.928268432617188, "global_step": 379641, "epoch": 2259} {"train_loss": -10.835780143737793, "global_step": 379642, "epoch": 2259} {"train_loss": -10.026931762695312, "global_step": 379643, "epoch": 2259} {"train_loss": -9.345550537109375, "global_step": 379644, "epoch": 2259} {"train_loss": -10.884295463562012, "global_step": 379645, "epoch": 2259} {"train_loss": -9.789661407470703, "global_step": 379646, "epoch": 2259} {"train_loss": -9.492578506469727, "global_step": 379647, "epoch": 2259} {"train_loss": -9.80107307434082, "global_step": 379648, "epoch": 2259} {"train_loss": -10.642805099487305, "global_step": 379649, "epoch": 2259} {"train_loss": -7.95542049407959, "global_step": 379650, "epoch": 2259} {"train_loss": -11.127705574035645, "global_step": 379651, "epoch": 2259} {"train_loss": -10.488656997680664, "global_step": 379652, "epoch": 2259} {"train_loss": -11.336833000183105, "global_step": 379653, "epoch": 2259} {"train_loss": -10.935997009277344, "global_step": 379654, "epoch": 2259} {"train_loss": -10.827991485595703, "global_step": 379655, "epoch": 2259} {"train_loss": -11.426860809326172, "global_step": 379656, "epoch": 2259} {"train_loss": -11.191003799438477, "global_step": 379657, "epoch": 2259} {"train_loss": -10.654007911682129, "global_step": 379658, "epoch": 2259} {"train_loss": -11.691246032714844, "global_step": 379659, "epoch": 2259} {"train_loss": -10.538745880126953, "global_step": 379660, "epoch": 2259} {"train_loss": -11.570494651794434, "global_step": 379661, "epoch": 2259} {"train_loss": -11.24289321899414, "global_step": 379662, "epoch": 2259} {"train_loss": -11.08387565612793, "global_step": 379663, "epoch": 2259} {"train_loss": -11.02731704711914, "global_step": 379664, "epoch": 2259} {"train_loss": -10.977869033813477, "global_step": 379665, "epoch": 2259} {"train_loss": -11.83740234375, "global_step": 379666, "epoch": 2259} {"train_loss": -11.301498413085938, "global_step": 379667, "epoch": 2259} {"train_loss": -11.605222702026367, "global_step": 379668, "epoch": 2259} {"train_loss": -11.090341567993164, "global_step": 379669, "epoch": 2259} {"train_loss": -11.331894874572754, "global_step": 379670, "epoch": 2259} {"train_loss": -12.010534286499023, "global_step": 379671, "epoch": 2259} {"train_loss": -11.504534721374512, "global_step": 379672, "epoch": 2259} {"train_loss": -11.912510871887207, "global_step": 379673, "epoch": 2259} {"train_loss": -11.724946975708008, "global_step": 379674, "epoch": 2259} {"train_loss": -11.788838386535645, "global_step": 379675, "epoch": 2259} {"train_loss": -11.994138717651367, "global_step": 379676, "epoch": 2259} {"train_loss": -11.724143028259277, "global_step": 379677, "epoch": 2259} {"train_loss": -12.096429824829102, "global_step": 379678, "epoch": 2259} {"train_loss": -11.609801411628723, "global_step": 379679, "epoch": 2259, "val_loss": 284691.4375} {"train_loss": -11.939020156860352, "global_step": 379680, "epoch": 2260} {"train_loss": -11.88790512084961, "global_step": 379681, "epoch": 2260} {"train_loss": -12.096874237060547, "global_step": 379682, "epoch": 2260} {"train_loss": -11.776860237121582, "global_step": 379683, "epoch": 2260} {"train_loss": -12.184287071228027, "global_step": 379684, "epoch": 2260} {"train_loss": -11.856706619262695, "global_step": 379685, "epoch": 2260} {"train_loss": -12.145713806152344, "global_step": 379686, "epoch": 2260} {"train_loss": -12.085111618041992, "global_step": 379687, "epoch": 2260} {"train_loss": -11.509023666381836, "global_step": 379688, "epoch": 2260} {"train_loss": -12.10297966003418, "global_step": 379689, "epoch": 2260} {"train_loss": -11.36741828918457, "global_step": 379690, "epoch": 2260} {"train_loss": -12.054433822631836, "global_step": 379691, "epoch": 2260} {"train_loss": -11.519638061523438, "global_step": 379692, "epoch": 2260} {"train_loss": -11.96977424621582, "global_step": 379693, "epoch": 2260} {"train_loss": -11.567703247070312, "global_step": 379694, "epoch": 2260} {"train_loss": -12.043668746948242, "global_step": 379695, "epoch": 2260} {"train_loss": -11.72966194152832, "global_step": 379696, "epoch": 2260} {"train_loss": -11.990755081176758, "global_step": 379697, "epoch": 2260} {"train_loss": -12.217700958251953, "global_step": 379698, "epoch": 2260} {"train_loss": -11.88945198059082, "global_step": 379699, "epoch": 2260} {"train_loss": -12.27595043182373, "global_step": 379700, "epoch": 2260} {"train_loss": -11.972833633422852, "global_step": 379701, "epoch": 2260} {"train_loss": -12.199584007263184, "global_step": 379702, "epoch": 2260} {"train_loss": -11.583028793334961, "global_step": 379703, "epoch": 2260} {"train_loss": -12.155668258666992, "global_step": 379704, "epoch": 2260} {"train_loss": -11.711301803588867, "global_step": 379705, "epoch": 2260} {"train_loss": -11.571083068847656, "global_step": 379706, "epoch": 2260} {"train_loss": -12.392863273620605, "global_step": 379707, "epoch": 2260} {"train_loss": -11.445744514465332, "global_step": 379708, "epoch": 2260} {"train_loss": -12.469099998474121, "global_step": 379709, "epoch": 2260} {"train_loss": -11.758328437805176, "global_step": 379710, "epoch": 2260} {"train_loss": -12.253260612487793, "global_step": 379711, "epoch": 2260} {"train_loss": -11.977932929992676, "global_step": 379712, "epoch": 2260} {"train_loss": -12.21946907043457, "global_step": 379713, "epoch": 2260} {"train_loss": -12.419708251953125, "global_step": 379714, "epoch": 2260} {"train_loss": -12.076299667358398, "global_step": 379715, "epoch": 2260} {"train_loss": -12.372268676757812, "global_step": 379716, "epoch": 2260} {"train_loss": -12.122509002685547, "global_step": 379717, "epoch": 2260} {"train_loss": -12.281350135803223, "global_step": 379718, "epoch": 2260} {"train_loss": -12.207908630371094, "global_step": 379719, "epoch": 2260} {"train_loss": -12.338850975036621, "global_step": 379720, "epoch": 2260} {"train_loss": -12.423494338989258, "global_step": 379721, "epoch": 2260} {"train_loss": -12.20742130279541, "global_step": 379722, "epoch": 2260} {"train_loss": -12.197792053222656, "global_step": 379723, "epoch": 2260} {"train_loss": -12.485969543457031, "global_step": 379724, "epoch": 2260} {"train_loss": -12.274300575256348, "global_step": 379725, "epoch": 2260} {"train_loss": -12.23763370513916, "global_step": 379726, "epoch": 2260} {"train_loss": -12.468155860900879, "global_step": 379727, "epoch": 2260} {"train_loss": -12.431190490722656, "global_step": 379728, "epoch": 2260} {"train_loss": -12.41250228881836, "global_step": 379729, "epoch": 2260} {"train_loss": -12.408612251281738, "global_step": 379730, "epoch": 2260} {"train_loss": -12.395720481872559, "global_step": 379731, "epoch": 2260} {"train_loss": -12.434967041015625, "global_step": 379732, "epoch": 2260} {"train_loss": -12.46504020690918, "global_step": 379733, "epoch": 2260} {"train_loss": -12.596881866455078, "global_step": 379734, "epoch": 2260} {"train_loss": -12.432840347290039, "global_step": 379735, "epoch": 2260} {"train_loss": -12.586787223815918, "global_step": 379736, "epoch": 2260} {"train_loss": -12.584698677062988, "global_step": 379737, "epoch": 2260} {"train_loss": -12.355113983154297, "global_step": 379738, "epoch": 2260} {"train_loss": -12.601680755615234, "global_step": 379739, "epoch": 2260} {"train_loss": -12.65266227722168, "global_step": 379740, "epoch": 2260} {"train_loss": -12.636765480041504, "global_step": 379741, "epoch": 2260} {"train_loss": -12.717988967895508, "global_step": 379742, "epoch": 2260} {"train_loss": -12.40331745147705, "global_step": 379743, "epoch": 2260} {"train_loss": -12.794851303100586, "global_step": 379744, "epoch": 2260} {"train_loss": -12.48984432220459, "global_step": 379745, "epoch": 2260} {"train_loss": -12.695308685302734, "global_step": 379746, "epoch": 2260} {"train_loss": -12.584118843078613, "global_step": 379747, "epoch": 2260} {"train_loss": -12.457109451293945, "global_step": 379748, "epoch": 2260} {"train_loss": -12.575958251953125, "global_step": 379749, "epoch": 2260} {"train_loss": -12.533149719238281, "global_step": 379750, "epoch": 2260} {"train_loss": -12.781085968017578, "global_step": 379751, "epoch": 2260} {"train_loss": -12.5413818359375, "global_step": 379752, "epoch": 2260} {"train_loss": -12.639993667602539, "global_step": 379753, "epoch": 2260} {"train_loss": -12.613880157470703, "global_step": 379754, "epoch": 2260} {"train_loss": -12.674640655517578, "global_step": 379755, "epoch": 2260} {"train_loss": -12.398374557495117, "global_step": 379756, "epoch": 2260} {"train_loss": -12.574128150939941, "global_step": 379757, "epoch": 2260} {"train_loss": -12.677172660827637, "global_step": 379758, "epoch": 2260} {"train_loss": -12.574952125549316, "global_step": 379759, "epoch": 2260} {"train_loss": -12.119915008544922, "global_step": 379760, "epoch": 2260} {"train_loss": -12.286441802978516, "global_step": 379761, "epoch": 2260} {"train_loss": -12.399840354919434, "global_step": 379762, "epoch": 2260} {"train_loss": -11.411346435546875, "global_step": 379763, "epoch": 2260} {"train_loss": -12.338476181030273, "global_step": 379764, "epoch": 2260} {"train_loss": -12.354470252990723, "global_step": 379765, "epoch": 2260} {"train_loss": -11.341880798339844, "global_step": 379766, "epoch": 2260} {"train_loss": -11.806502342224121, "global_step": 379767, "epoch": 2260} {"train_loss": -12.241931915283203, "global_step": 379768, "epoch": 2260} {"train_loss": -11.59051513671875, "global_step": 379769, "epoch": 2260} {"train_loss": -11.215657234191895, "global_step": 379770, "epoch": 2260} {"train_loss": -12.021039962768555, "global_step": 379771, "epoch": 2260} {"train_loss": -12.030713081359863, "global_step": 379772, "epoch": 2260} {"train_loss": -12.289581298828125, "global_step": 379773, "epoch": 2260} {"train_loss": -12.315958023071289, "global_step": 379774, "epoch": 2260} {"train_loss": -11.880353927612305, "global_step": 379775, "epoch": 2260} {"train_loss": -12.392807006835938, "global_step": 379776, "epoch": 2260} {"train_loss": -12.270864486694336, "global_step": 379777, "epoch": 2260} {"train_loss": -12.054956436157227, "global_step": 379778, "epoch": 2260} {"train_loss": -11.90081787109375, "global_step": 379779, "epoch": 2260} {"train_loss": -11.626202583312988, "global_step": 379780, "epoch": 2260} {"train_loss": -12.353883743286133, "global_step": 379781, "epoch": 2260} {"train_loss": -11.97935676574707, "global_step": 379782, "epoch": 2260} {"train_loss": -11.8826904296875, "global_step": 379783, "epoch": 2260} {"train_loss": -12.523477554321289, "global_step": 379784, "epoch": 2260} {"train_loss": -12.118953704833984, "global_step": 379785, "epoch": 2260} {"train_loss": -11.805610656738281, "global_step": 379786, "epoch": 2260} {"train_loss": -12.28761100769043, "global_step": 379787, "epoch": 2260} {"train_loss": -12.168806076049805, "global_step": 379788, "epoch": 2260} {"train_loss": -11.311633110046387, "global_step": 379789, "epoch": 2260} {"train_loss": -12.531152725219727, "global_step": 379790, "epoch": 2260} {"train_loss": -12.38905143737793, "global_step": 379791, "epoch": 2260} {"train_loss": -12.030868530273438, "global_step": 379792, "epoch": 2260} {"train_loss": -12.01583194732666, "global_step": 379793, "epoch": 2260} {"train_loss": -12.626672744750977, "global_step": 379794, "epoch": 2260} {"train_loss": -11.872260093688965, "global_step": 379795, "epoch": 2260} {"train_loss": -12.043794631958008, "global_step": 379796, "epoch": 2260} {"train_loss": -11.780904769897461, "global_step": 379797, "epoch": 2260} {"train_loss": -11.127665519714355, "global_step": 379798, "epoch": 2260} {"train_loss": -11.460390090942383, "global_step": 379799, "epoch": 2260} {"train_loss": -11.768386840820312, "global_step": 379800, "epoch": 2260} {"train_loss": -10.799077987670898, "global_step": 379801, "epoch": 2260} {"train_loss": -11.757760047912598, "global_step": 379802, "epoch": 2260} {"train_loss": -10.686260223388672, "global_step": 379803, "epoch": 2260} {"train_loss": -11.82206916809082, "global_step": 379804, "epoch": 2260} {"train_loss": -11.799781799316406, "global_step": 379805, "epoch": 2260} {"train_loss": -10.222887992858887, "global_step": 379806, "epoch": 2260} {"train_loss": -12.123113632202148, "global_step": 379807, "epoch": 2260} {"train_loss": -10.389028549194336, "global_step": 379808, "epoch": 2260} {"train_loss": -10.583019256591797, "global_step": 379809, "epoch": 2260} {"train_loss": -9.938647270202637, "global_step": 379810, "epoch": 2260} {"train_loss": -10.919412612915039, "global_step": 379811, "epoch": 2260} {"train_loss": -9.374944686889648, "global_step": 379812, "epoch": 2260} {"train_loss": -11.259424209594727, "global_step": 379813, "epoch": 2260} {"train_loss": -10.203214645385742, "global_step": 379814, "epoch": 2260} {"train_loss": -10.701337814331055, "global_step": 379815, "epoch": 2260} {"train_loss": -10.286834716796875, "global_step": 379816, "epoch": 2260} {"train_loss": -10.358678817749023, "global_step": 379817, "epoch": 2260} {"train_loss": -11.4121732711792, "global_step": 379818, "epoch": 2260} {"train_loss": -9.888378143310547, "global_step": 379819, "epoch": 2260} {"train_loss": -12.119497299194336, "global_step": 379820, "epoch": 2260} {"train_loss": -9.946867942810059, "global_step": 379821, "epoch": 2260} {"train_loss": -10.698333740234375, "global_step": 379822, "epoch": 2260} {"train_loss": -10.933204650878906, "global_step": 379823, "epoch": 2260} {"train_loss": -11.06419563293457, "global_step": 379824, "epoch": 2260} {"train_loss": -10.903295516967773, "global_step": 379825, "epoch": 2260} {"train_loss": -11.475889205932617, "global_step": 379826, "epoch": 2260} {"train_loss": -11.39858627319336, "global_step": 379827, "epoch": 2260} {"train_loss": -10.671321868896484, "global_step": 379828, "epoch": 2260} {"train_loss": -11.572097778320312, "global_step": 379829, "epoch": 2260} {"train_loss": -9.925702095031738, "global_step": 379830, "epoch": 2260} {"train_loss": -12.134506225585938, "global_step": 379831, "epoch": 2260} {"train_loss": -10.879905700683594, "global_step": 379832, "epoch": 2260} {"train_loss": -11.702985763549805, "global_step": 379833, "epoch": 2260} {"train_loss": -10.572479248046875, "global_step": 379834, "epoch": 2260} {"train_loss": -11.826536178588867, "global_step": 379835, "epoch": 2260} {"train_loss": -11.70337200164795, "global_step": 379836, "epoch": 2260} {"train_loss": -11.56606674194336, "global_step": 379837, "epoch": 2260} {"train_loss": -11.339181900024414, "global_step": 379838, "epoch": 2260} {"train_loss": -11.644536972045898, "global_step": 379839, "epoch": 2260} {"train_loss": -11.39013671875, "global_step": 379840, "epoch": 2260} {"train_loss": -12.016090393066406, "global_step": 379841, "epoch": 2260} {"train_loss": -11.34829044342041, "global_step": 379842, "epoch": 2260} {"train_loss": -11.712780952453613, "global_step": 379843, "epoch": 2260} {"train_loss": -12.003100395202637, "global_step": 379844, "epoch": 2260} {"train_loss": -11.682581901550293, "global_step": 379845, "epoch": 2260} {"train_loss": -12.089349746704102, "global_step": 379846, "epoch": 2260} {"train_loss": -11.873583634694418, "global_step": 379847, "epoch": 2260, "val_loss": 287798.71875, "train_action_mse_error": 1.2126998901367188} {"train_loss": -12.080366134643555, "global_step": 379848, "epoch": 2261} {"train_loss": -12.07845687866211, "global_step": 379849, "epoch": 2261} {"train_loss": -12.10287094116211, "global_step": 379850, "epoch": 2261} {"train_loss": -11.744427680969238, "global_step": 379851, "epoch": 2261} {"train_loss": -12.165792465209961, "global_step": 379852, "epoch": 2261} {"train_loss": -11.916467666625977, "global_step": 379853, "epoch": 2261} {"train_loss": -11.935157775878906, "global_step": 379854, "epoch": 2261} {"train_loss": -12.178723335266113, "global_step": 379855, "epoch": 2261} {"train_loss": -12.08383560180664, "global_step": 379856, "epoch": 2261} {"train_loss": -12.268356323242188, "global_step": 379857, "epoch": 2261} {"train_loss": -12.00269603729248, "global_step": 379858, "epoch": 2261} {"train_loss": -12.03973388671875, "global_step": 379859, "epoch": 2261} {"train_loss": -12.034130096435547, "global_step": 379860, "epoch": 2261} {"train_loss": -11.837279319763184, "global_step": 379861, "epoch": 2261} {"train_loss": -12.130054473876953, "global_step": 379862, "epoch": 2261} {"train_loss": -12.033462524414062, "global_step": 379863, "epoch": 2261} {"train_loss": -12.166410446166992, "global_step": 379864, "epoch": 2261} {"train_loss": -11.72785758972168, "global_step": 379865, "epoch": 2261} {"train_loss": -12.298093795776367, "global_step": 379866, "epoch": 2261} {"train_loss": -12.160947799682617, "global_step": 379867, "epoch": 2261} {"train_loss": -12.022726058959961, "global_step": 379868, "epoch": 2261} {"train_loss": -12.31574535369873, "global_step": 379869, "epoch": 2261} {"train_loss": -11.959249496459961, "global_step": 379870, "epoch": 2261} {"train_loss": -12.161796569824219, "global_step": 379871, "epoch": 2261} {"train_loss": -11.993597984313965, "global_step": 379872, "epoch": 2261} {"train_loss": -12.013736724853516, "global_step": 379873, "epoch": 2261} {"train_loss": -12.294858932495117, "global_step": 379874, "epoch": 2261} {"train_loss": -12.190238952636719, "global_step": 379875, "epoch": 2261} {"train_loss": -12.092306137084961, "global_step": 379876, "epoch": 2261} {"train_loss": -12.250844955444336, "global_step": 379877, "epoch": 2261} {"train_loss": -12.415667533874512, "global_step": 379878, "epoch": 2261} {"train_loss": -12.146924018859863, "global_step": 379879, "epoch": 2261} {"train_loss": -12.456884384155273, "global_step": 379880, "epoch": 2261} {"train_loss": -12.422843933105469, "global_step": 379881, "epoch": 2261} {"train_loss": -12.374256134033203, "global_step": 379882, "epoch": 2261} {"train_loss": -12.443071365356445, "global_step": 379883, "epoch": 2261} {"train_loss": -12.332633018493652, "global_step": 379884, "epoch": 2261} {"train_loss": -12.2781982421875, "global_step": 379885, "epoch": 2261} {"train_loss": -12.316795349121094, "global_step": 379886, "epoch": 2261} {"train_loss": -12.351326942443848, "global_step": 379887, "epoch": 2261} {"train_loss": -12.396903991699219, "global_step": 379888, "epoch": 2261} {"train_loss": -12.182840347290039, "global_step": 379889, "epoch": 2261} {"train_loss": -12.644038200378418, "global_step": 379890, "epoch": 2261} {"train_loss": -12.456375122070312, "global_step": 379891, "epoch": 2261} {"train_loss": -12.529682159423828, "global_step": 379892, "epoch": 2261} {"train_loss": -12.505794525146484, "global_step": 379893, "epoch": 2261} {"train_loss": -12.420014381408691, "global_step": 379894, "epoch": 2261} {"train_loss": -12.487003326416016, "global_step": 379895, "epoch": 2261} {"train_loss": -12.190337181091309, "global_step": 379896, "epoch": 2261} {"train_loss": -12.3702392578125, "global_step": 379897, "epoch": 2261} {"train_loss": -12.208953857421875, "global_step": 379898, "epoch": 2261} {"train_loss": -12.077929496765137, "global_step": 379899, "epoch": 2261} {"train_loss": -12.420910835266113, "global_step": 379900, "epoch": 2261} {"train_loss": -12.110481262207031, "global_step": 379901, "epoch": 2261} {"train_loss": -12.19007682800293, "global_step": 379902, "epoch": 2261} {"train_loss": -12.734075546264648, "global_step": 379903, "epoch": 2261} {"train_loss": -12.09337043762207, "global_step": 379904, "epoch": 2261} {"train_loss": -12.64587116241455, "global_step": 379905, "epoch": 2261} {"train_loss": -12.090982437133789, "global_step": 379906, "epoch": 2261} {"train_loss": -12.597554206848145, "global_step": 379907, "epoch": 2261} {"train_loss": -12.219793319702148, "global_step": 379908, "epoch": 2261} {"train_loss": -12.64326000213623, "global_step": 379909, "epoch": 2261} {"train_loss": -12.380571365356445, "global_step": 379910, "epoch": 2261} {"train_loss": -12.63650131225586, "global_step": 379911, "epoch": 2261} {"train_loss": -12.537674903869629, "global_step": 379912, "epoch": 2261} {"train_loss": -12.586140632629395, "global_step": 379913, "epoch": 2261} {"train_loss": -12.441398620605469, "global_step": 379914, "epoch": 2261} {"train_loss": -12.660085678100586, "global_step": 379915, "epoch": 2261} {"train_loss": -12.2733154296875, "global_step": 379916, "epoch": 2261} {"train_loss": -12.787225723266602, "global_step": 379917, "epoch": 2261} {"train_loss": -12.420376777648926, "global_step": 379918, "epoch": 2261} {"train_loss": -12.517809867858887, "global_step": 379919, "epoch": 2261} {"train_loss": -12.179234504699707, "global_step": 379920, "epoch": 2261} {"train_loss": -12.627891540527344, "global_step": 379921, "epoch": 2261} {"train_loss": -12.364472389221191, "global_step": 379922, "epoch": 2261} {"train_loss": -12.573324203491211, "global_step": 379923, "epoch": 2261} {"train_loss": -12.535821914672852, "global_step": 379924, "epoch": 2261} {"train_loss": -12.60118293762207, "global_step": 379925, "epoch": 2261} {"train_loss": -12.519964218139648, "global_step": 379926, "epoch": 2261} {"train_loss": -12.25533390045166, "global_step": 379927, "epoch": 2261} {"train_loss": -12.831408500671387, "global_step": 379928, "epoch": 2261} {"train_loss": -12.570419311523438, "global_step": 379929, "epoch": 2261} {"train_loss": -12.599088668823242, "global_step": 379930, "epoch": 2261} {"train_loss": -12.708931922912598, "global_step": 379931, "epoch": 2261} {"train_loss": -12.624177932739258, "global_step": 379932, "epoch": 2261} {"train_loss": -12.308902740478516, "global_step": 379933, "epoch": 2261} {"train_loss": -12.830741882324219, "global_step": 379934, "epoch": 2261} {"train_loss": -12.356785774230957, "global_step": 379935, "epoch": 2261} {"train_loss": -12.733550071716309, "global_step": 379936, "epoch": 2261} {"train_loss": -12.700448036193848, "global_step": 379937, "epoch": 2261} {"train_loss": -12.508408546447754, "global_step": 379938, "epoch": 2261} {"train_loss": -12.543452262878418, "global_step": 379939, "epoch": 2261} {"train_loss": -11.947693824768066, "global_step": 379940, "epoch": 2261} {"train_loss": -12.639521598815918, "global_step": 379941, "epoch": 2261} {"train_loss": -12.549690246582031, "global_step": 379942, "epoch": 2261} {"train_loss": -11.829469680786133, "global_step": 379943, "epoch": 2261} {"train_loss": -11.337132453918457, "global_step": 379944, "epoch": 2261} {"train_loss": -12.399658203125, "global_step": 379945, "epoch": 2261} {"train_loss": -12.472208976745605, "global_step": 379946, "epoch": 2261} {"train_loss": -11.874124526977539, "global_step": 379947, "epoch": 2261} {"train_loss": -12.235666275024414, "global_step": 379948, "epoch": 2261} {"train_loss": -12.364992141723633, "global_step": 379949, "epoch": 2261} {"train_loss": -11.857336044311523, "global_step": 379950, "epoch": 2261} {"train_loss": -12.137422561645508, "global_step": 379951, "epoch": 2261} {"train_loss": -12.61199951171875, "global_step": 379952, "epoch": 2261} {"train_loss": -12.395572662353516, "global_step": 379953, "epoch": 2261} {"train_loss": -12.36087417602539, "global_step": 379954, "epoch": 2261} {"train_loss": -12.086769104003906, "global_step": 379955, "epoch": 2261} {"train_loss": -12.44323444366455, "global_step": 379956, "epoch": 2261} {"train_loss": -12.550710678100586, "global_step": 379957, "epoch": 2261} {"train_loss": -12.50967788696289, "global_step": 379958, "epoch": 2261} {"train_loss": -12.546154022216797, "global_step": 379959, "epoch": 2261} {"train_loss": -12.5338134765625, "global_step": 379960, "epoch": 2261} {"train_loss": -12.464393615722656, "global_step": 379961, "epoch": 2261} {"train_loss": -12.122408866882324, "global_step": 379962, "epoch": 2261} {"train_loss": -12.608625411987305, "global_step": 379963, "epoch": 2261} {"train_loss": -12.009264945983887, "global_step": 379964, "epoch": 2261} {"train_loss": -12.662164688110352, "global_step": 379965, "epoch": 2261} {"train_loss": -11.818750381469727, "global_step": 379966, "epoch": 2261} {"train_loss": -12.701013565063477, "global_step": 379967, "epoch": 2261} {"train_loss": -11.858097076416016, "global_step": 379968, "epoch": 2261} {"train_loss": -11.087368965148926, "global_step": 379969, "epoch": 2261} {"train_loss": -11.517171859741211, "global_step": 379970, "epoch": 2261} {"train_loss": -11.900106430053711, "global_step": 379971, "epoch": 2261} {"train_loss": -11.228612899780273, "global_step": 379972, "epoch": 2261} {"train_loss": -10.741103172302246, "global_step": 379973, "epoch": 2261} {"train_loss": -12.317005157470703, "global_step": 379974, "epoch": 2261} {"train_loss": -12.124147415161133, "global_step": 379975, "epoch": 2261} {"train_loss": -11.612390518188477, "global_step": 379976, "epoch": 2261} {"train_loss": -11.963822364807129, "global_step": 379977, "epoch": 2261} {"train_loss": -11.868833541870117, "global_step": 379978, "epoch": 2261} {"train_loss": -12.152454376220703, "global_step": 379979, "epoch": 2261} {"train_loss": -11.597953796386719, "global_step": 379980, "epoch": 2261} {"train_loss": -11.923794746398926, "global_step": 379981, "epoch": 2261} {"train_loss": -11.654470443725586, "global_step": 379982, "epoch": 2261} {"train_loss": -12.507500648498535, "global_step": 379983, "epoch": 2261} {"train_loss": -12.027313232421875, "global_step": 379984, "epoch": 2261} {"train_loss": -12.071710586547852, "global_step": 379985, "epoch": 2261} {"train_loss": -11.792252540588379, "global_step": 379986, "epoch": 2261} {"train_loss": -11.903045654296875, "global_step": 379987, "epoch": 2261} {"train_loss": -12.602907180786133, "global_step": 379988, "epoch": 2261} {"train_loss": -11.743232727050781, "global_step": 379989, "epoch": 2261} {"train_loss": -12.304449081420898, "global_step": 379990, "epoch": 2261} {"train_loss": -12.038642883300781, "global_step": 379991, "epoch": 2261} {"train_loss": -12.361082077026367, "global_step": 379992, "epoch": 2261} {"train_loss": -12.102503776550293, "global_step": 379993, "epoch": 2261} {"train_loss": -12.509929656982422, "global_step": 379994, "epoch": 2261} {"train_loss": -11.930713653564453, "global_step": 379995, "epoch": 2261} {"train_loss": -12.214645385742188, "global_step": 379996, "epoch": 2261} {"train_loss": -12.211509704589844, "global_step": 379997, "epoch": 2261} {"train_loss": -12.251873970031738, "global_step": 379998, "epoch": 2261} {"train_loss": -12.336772918701172, "global_step": 379999, "epoch": 2261} {"train_loss": -12.320876121520996, "global_step": 380000, "epoch": 2261} {"train_loss": -12.21542739868164, "global_step": 380001, "epoch": 2261} {"train_loss": -12.000256538391113, "global_step": 380002, "epoch": 2261} {"train_loss": -11.776887893676758, "global_step": 380003, "epoch": 2261} {"train_loss": -11.699480056762695, "global_step": 380004, "epoch": 2261} {"train_loss": -12.35630989074707, "global_step": 380005, "epoch": 2261} {"train_loss": -11.873905181884766, "global_step": 380006, "epoch": 2261} {"train_loss": -12.04013729095459, "global_step": 380007, "epoch": 2261} {"train_loss": -12.346024513244629, "global_step": 380008, "epoch": 2261} {"train_loss": -12.13377857208252, "global_step": 380009, "epoch": 2261} {"train_loss": -12.042889595031738, "global_step": 380010, "epoch": 2261} {"train_loss": -11.666520118713379, "global_step": 380011, "epoch": 2261} {"train_loss": -12.038494110107422, "global_step": 380012, "epoch": 2261} {"train_loss": -11.104558944702148, "global_step": 380013, "epoch": 2261} {"train_loss": -12.169065475463867, "global_step": 380014, "epoch": 2261} {"train_loss": -12.21494208063398, "global_step": 380015, "epoch": 2261, "val_loss": 285056.53125} {"train_loss": -11.53136920928955, "global_step": 380016, "epoch": 2262} {"train_loss": -11.835915565490723, "global_step": 380017, "epoch": 2262} {"train_loss": -10.378292083740234, "global_step": 380018, "epoch": 2262} {"train_loss": -11.058420181274414, "global_step": 380019, "epoch": 2262} {"train_loss": -11.160114288330078, "global_step": 380020, "epoch": 2262} {"train_loss": -10.271547317504883, "global_step": 380021, "epoch": 2262} {"train_loss": -10.97130012512207, "global_step": 380022, "epoch": 2262} {"train_loss": -11.668062210083008, "global_step": 380023, "epoch": 2262} {"train_loss": -10.891855239868164, "global_step": 380024, "epoch": 2262} {"train_loss": -11.09276008605957, "global_step": 380025, "epoch": 2262} {"train_loss": -11.509401321411133, "global_step": 380026, "epoch": 2262} {"train_loss": -9.63663101196289, "global_step": 380027, "epoch": 2262} {"train_loss": -11.099605560302734, "global_step": 380028, "epoch": 2262} {"train_loss": -10.72006893157959, "global_step": 380029, "epoch": 2262} {"train_loss": -8.499734878540039, "global_step": 380030, "epoch": 2262} {"train_loss": -10.969650268554688, "global_step": 380031, "epoch": 2262} {"train_loss": -9.297538757324219, "global_step": 380032, "epoch": 2262} {"train_loss": -10.725543022155762, "global_step": 380033, "epoch": 2262} {"train_loss": -9.950037956237793, "global_step": 380034, "epoch": 2262} {"train_loss": -9.64968490600586, "global_step": 380035, "epoch": 2262} {"train_loss": -11.831489562988281, "global_step": 380036, "epoch": 2262} {"train_loss": -10.415060997009277, "global_step": 380037, "epoch": 2262} {"train_loss": -11.353141784667969, "global_step": 380038, "epoch": 2262} {"train_loss": -10.209277153015137, "global_step": 380039, "epoch": 2262} {"train_loss": -11.011117935180664, "global_step": 380040, "epoch": 2262} {"train_loss": -10.322053909301758, "global_step": 380041, "epoch": 2262} {"train_loss": -11.708913803100586, "global_step": 380042, "epoch": 2262} {"train_loss": -10.014668464660645, "global_step": 380043, "epoch": 2262} {"train_loss": -12.053726196289062, "global_step": 380044, "epoch": 2262} {"train_loss": -10.6819486618042, "global_step": 380045, "epoch": 2262} {"train_loss": -11.399468421936035, "global_step": 380046, "epoch": 2262} {"train_loss": -11.293661117553711, "global_step": 380047, "epoch": 2262} {"train_loss": -11.499073028564453, "global_step": 380048, "epoch": 2262} {"train_loss": -10.883916854858398, "global_step": 380049, "epoch": 2262} {"train_loss": -11.664247512817383, "global_step": 380050, "epoch": 2262} {"train_loss": -11.43221378326416, "global_step": 380051, "epoch": 2262} {"train_loss": -11.62177848815918, "global_step": 380052, "epoch": 2262} {"train_loss": -11.756553649902344, "global_step": 380053, "epoch": 2262} {"train_loss": -11.59552001953125, "global_step": 380054, "epoch": 2262} {"train_loss": -11.944975852966309, "global_step": 380055, "epoch": 2262} {"train_loss": -12.03000545501709, "global_step": 380056, "epoch": 2262} {"train_loss": -11.994492530822754, "global_step": 380057, "epoch": 2262} {"train_loss": -12.25657844543457, "global_step": 380058, "epoch": 2262} {"train_loss": -12.10091495513916, "global_step": 380059, "epoch": 2262} {"train_loss": -11.829959869384766, "global_step": 380060, "epoch": 2262} {"train_loss": -12.364704132080078, "global_step": 380061, "epoch": 2262} {"train_loss": -12.178817749023438, "global_step": 380062, "epoch": 2262} {"train_loss": -12.150405883789062, "global_step": 380063, "epoch": 2262} {"train_loss": -12.158458709716797, "global_step": 380064, "epoch": 2262} {"train_loss": -12.13900375366211, "global_step": 380065, "epoch": 2262} {"train_loss": -12.044614791870117, "global_step": 380066, "epoch": 2262} {"train_loss": -12.332447052001953, "global_step": 380067, "epoch": 2262} {"train_loss": -12.41706657409668, "global_step": 380068, "epoch": 2262} {"train_loss": -12.128475189208984, "global_step": 380069, "epoch": 2262} {"train_loss": -12.343088150024414, "global_step": 380070, "epoch": 2262} {"train_loss": -12.164438247680664, "global_step": 380071, "epoch": 2262} {"train_loss": -12.128952026367188, "global_step": 380072, "epoch": 2262} {"train_loss": -12.315719604492188, "global_step": 380073, "epoch": 2262} {"train_loss": -12.225457191467285, "global_step": 380074, "epoch": 2262} {"train_loss": -12.167896270751953, "global_step": 380075, "epoch": 2262} {"train_loss": -12.028406143188477, "global_step": 380076, "epoch": 2262} {"train_loss": -12.008420944213867, "global_step": 380077, "epoch": 2262} {"train_loss": -12.065860748291016, "global_step": 380078, "epoch": 2262} {"train_loss": -12.12476634979248, "global_step": 380079, "epoch": 2262} {"train_loss": -12.029261589050293, "global_step": 380080, "epoch": 2262} {"train_loss": -12.294198989868164, "global_step": 380081, "epoch": 2262} {"train_loss": -11.776798248291016, "global_step": 380082, "epoch": 2262} {"train_loss": -12.490878105163574, "global_step": 380083, "epoch": 2262} {"train_loss": -12.296834945678711, "global_step": 380084, "epoch": 2262} {"train_loss": -12.335075378417969, "global_step": 380085, "epoch": 2262} {"train_loss": -12.323665618896484, "global_step": 380086, "epoch": 2262} {"train_loss": -12.266870498657227, "global_step": 380087, "epoch": 2262} {"train_loss": -12.410901069641113, "global_step": 380088, "epoch": 2262} {"train_loss": -11.975590705871582, "global_step": 380089, "epoch": 2262} {"train_loss": -12.204927444458008, "global_step": 380090, "epoch": 2262} {"train_loss": -12.232827186584473, "global_step": 380091, "epoch": 2262} {"train_loss": -12.33623218536377, "global_step": 380092, "epoch": 2262} {"train_loss": -12.5400390625, "global_step": 380093, "epoch": 2262} {"train_loss": -12.41761589050293, "global_step": 380094, "epoch": 2262} {"train_loss": -12.340225219726562, "global_step": 380095, "epoch": 2262} {"train_loss": -12.53789234161377, "global_step": 380096, "epoch": 2262} {"train_loss": -12.521894454956055, "global_step": 380097, "epoch": 2262} {"train_loss": -12.52798080444336, "global_step": 380098, "epoch": 2262} {"train_loss": -12.419490814208984, "global_step": 380099, "epoch": 2262} {"train_loss": -12.501932144165039, "global_step": 380100, "epoch": 2262} {"train_loss": -12.598386764526367, "global_step": 380101, "epoch": 2262} {"train_loss": -12.496448516845703, "global_step": 380102, "epoch": 2262} {"train_loss": -12.758745193481445, "global_step": 380103, "epoch": 2262} {"train_loss": -12.462709426879883, "global_step": 380104, "epoch": 2262} {"train_loss": -12.724093437194824, "global_step": 380105, "epoch": 2262} {"train_loss": -12.569501876831055, "global_step": 380106, "epoch": 2262} {"train_loss": -12.655013084411621, "global_step": 380107, "epoch": 2262} {"train_loss": -12.746142387390137, "global_step": 380108, "epoch": 2262} {"train_loss": -12.716737747192383, "global_step": 380109, "epoch": 2262} {"train_loss": -12.567140579223633, "global_step": 380110, "epoch": 2262} {"train_loss": -12.589107513427734, "global_step": 380111, "epoch": 2262} {"train_loss": -12.60955810546875, "global_step": 380112, "epoch": 2262} {"train_loss": -12.55620002746582, "global_step": 380113, "epoch": 2262} {"train_loss": -12.650415420532227, "global_step": 380114, "epoch": 2262} {"train_loss": -12.558719635009766, "global_step": 380115, "epoch": 2262} {"train_loss": -12.46451473236084, "global_step": 380116, "epoch": 2262} {"train_loss": -12.649589538574219, "global_step": 380117, "epoch": 2262} {"train_loss": -12.691673278808594, "global_step": 380118, "epoch": 2262} {"train_loss": -12.65579605102539, "global_step": 380119, "epoch": 2262} {"train_loss": -12.682202339172363, "global_step": 380120, "epoch": 2262} {"train_loss": -12.688336372375488, "global_step": 380121, "epoch": 2262} {"train_loss": -12.744758605957031, "global_step": 380122, "epoch": 2262} {"train_loss": -12.67282772064209, "global_step": 380123, "epoch": 2262} {"train_loss": -12.486902236938477, "global_step": 380124, "epoch": 2262} {"train_loss": -12.401510238647461, "global_step": 380125, "epoch": 2262} {"train_loss": -12.684122085571289, "global_step": 380126, "epoch": 2262} {"train_loss": -12.365739822387695, "global_step": 380127, "epoch": 2262} {"train_loss": -12.461750030517578, "global_step": 380128, "epoch": 2262} {"train_loss": -12.662070274353027, "global_step": 380129, "epoch": 2262} {"train_loss": -12.243568420410156, "global_step": 380130, "epoch": 2262} {"train_loss": -12.08480167388916, "global_step": 380131, "epoch": 2262} {"train_loss": -12.777682304382324, "global_step": 380132, "epoch": 2262} {"train_loss": -12.693970680236816, "global_step": 380133, "epoch": 2262} {"train_loss": -12.69900894165039, "global_step": 380134, "epoch": 2262} {"train_loss": -12.558473587036133, "global_step": 380135, "epoch": 2262} {"train_loss": -12.761293411254883, "global_step": 380136, "epoch": 2262} {"train_loss": -12.751677513122559, "global_step": 380137, "epoch": 2262} {"train_loss": -12.697933197021484, "global_step": 380138, "epoch": 2262} {"train_loss": -12.667099952697754, "global_step": 380139, "epoch": 2262} {"train_loss": -12.931596755981445, "global_step": 380140, "epoch": 2262} {"train_loss": -12.824054718017578, "global_step": 380141, "epoch": 2262} {"train_loss": -12.631250381469727, "global_step": 380142, "epoch": 2262} {"train_loss": -12.606778144836426, "global_step": 380143, "epoch": 2262} {"train_loss": -12.569799423217773, "global_step": 380144, "epoch": 2262} {"train_loss": -12.591139793395996, "global_step": 380145, "epoch": 2262} {"train_loss": -12.35885238647461, "global_step": 380146, "epoch": 2262} {"train_loss": -12.65902328491211, "global_step": 380147, "epoch": 2262} {"train_loss": -12.425432205200195, "global_step": 380148, "epoch": 2262} {"train_loss": -12.32320499420166, "global_step": 380149, "epoch": 2262} {"train_loss": -12.765691757202148, "global_step": 380150, "epoch": 2262} {"train_loss": -12.581497192382812, "global_step": 380151, "epoch": 2262} {"train_loss": -12.555667877197266, "global_step": 380152, "epoch": 2262} {"train_loss": -12.49423599243164, "global_step": 380153, "epoch": 2262} {"train_loss": -12.530874252319336, "global_step": 380154, "epoch": 2262} {"train_loss": -12.541401863098145, "global_step": 380155, "epoch": 2262} {"train_loss": -11.825953483581543, "global_step": 380156, "epoch": 2262} {"train_loss": -11.740864753723145, "global_step": 380157, "epoch": 2262} {"train_loss": -11.60609245300293, "global_step": 380158, "epoch": 2262} {"train_loss": -11.508084297180176, "global_step": 380159, "epoch": 2262} {"train_loss": -10.4351806640625, "global_step": 380160, "epoch": 2262} {"train_loss": -12.164730072021484, "global_step": 380161, "epoch": 2262} {"train_loss": -10.836523056030273, "global_step": 380162, "epoch": 2262} {"train_loss": -10.264609336853027, "global_step": 380163, "epoch": 2262} {"train_loss": -11.835124969482422, "global_step": 380164, "epoch": 2262} {"train_loss": -11.727941513061523, "global_step": 380165, "epoch": 2262} {"train_loss": -11.49662971496582, "global_step": 380166, "epoch": 2262} {"train_loss": -10.320808410644531, "global_step": 380167, "epoch": 2262} {"train_loss": -11.199174880981445, "global_step": 380168, "epoch": 2262} {"train_loss": -8.809560775756836, "global_step": 380169, "epoch": 2262} {"train_loss": -10.498388290405273, "global_step": 380170, "epoch": 2262} {"train_loss": -10.7093505859375, "global_step": 380171, "epoch": 2262} {"train_loss": -9.265162467956543, "global_step": 380172, "epoch": 2262} {"train_loss": -9.221467971801758, "global_step": 380173, "epoch": 2262} {"train_loss": -9.28664779663086, "global_step": 380174, "epoch": 2262} {"train_loss": -8.593894958496094, "global_step": 380175, "epoch": 2262} {"train_loss": -9.645241737365723, "global_step": 380176, "epoch": 2262} {"train_loss": -8.998910903930664, "global_step": 380177, "epoch": 2262} {"train_loss": -8.804292678833008, "global_step": 380178, "epoch": 2262} {"train_loss": -9.671611785888672, "global_step": 380179, "epoch": 2262} {"train_loss": -10.069259643554688, "global_step": 380180, "epoch": 2262} {"train_loss": -9.320135116577148, "global_step": 380181, "epoch": 2262} {"train_loss": -11.54757308959961, "global_step": 380182, "epoch": 2262} {"train_loss": -11.737758750007266, "global_step": 380183, "epoch": 2262, "val_loss": 290233.28125} {"train_loss": -9.881441116333008, "global_step": 380184, "epoch": 2263} {"train_loss": -10.886457443237305, "global_step": 380185, "epoch": 2263} {"train_loss": -10.460211753845215, "global_step": 380186, "epoch": 2263} {"train_loss": -11.158937454223633, "global_step": 380187, "epoch": 2263} {"train_loss": -10.867387771606445, "global_step": 380188, "epoch": 2263} {"train_loss": -11.460073471069336, "global_step": 380189, "epoch": 2263} {"train_loss": -10.949553489685059, "global_step": 380190, "epoch": 2263} {"train_loss": -11.543052673339844, "global_step": 380191, "epoch": 2263} {"train_loss": -11.11363697052002, "global_step": 380192, "epoch": 2263} {"train_loss": -11.541749954223633, "global_step": 380193, "epoch": 2263} {"train_loss": -11.80888557434082, "global_step": 380194, "epoch": 2263} {"train_loss": -11.456929206848145, "global_step": 380195, "epoch": 2263} {"train_loss": -11.98065185546875, "global_step": 380196, "epoch": 2263} {"train_loss": -11.655549049377441, "global_step": 380197, "epoch": 2263} {"train_loss": -11.99809455871582, "global_step": 380198, "epoch": 2263} {"train_loss": -11.713329315185547, "global_step": 380199, "epoch": 2263} {"train_loss": -11.682727813720703, "global_step": 380200, "epoch": 2263} {"train_loss": -11.704645156860352, "global_step": 380201, "epoch": 2263} {"train_loss": -11.916437149047852, "global_step": 380202, "epoch": 2263} {"train_loss": -11.859045028686523, "global_step": 380203, "epoch": 2263} {"train_loss": -11.9580078125, "global_step": 380204, "epoch": 2263} {"train_loss": -11.623385429382324, "global_step": 380205, "epoch": 2263} {"train_loss": -11.963558197021484, "global_step": 380206, "epoch": 2263} {"train_loss": -12.017606735229492, "global_step": 380207, "epoch": 2263} {"train_loss": -11.846565246582031, "global_step": 380208, "epoch": 2263} {"train_loss": -12.009052276611328, "global_step": 380209, "epoch": 2263} {"train_loss": -12.076146125793457, "global_step": 380210, "epoch": 2263} {"train_loss": -12.000734329223633, "global_step": 380211, "epoch": 2263} {"train_loss": -11.843121528625488, "global_step": 380212, "epoch": 2263} {"train_loss": -12.222833633422852, "global_step": 380213, "epoch": 2263} {"train_loss": -12.066158294677734, "global_step": 380214, "epoch": 2263} {"train_loss": -12.046834945678711, "global_step": 380215, "epoch": 2263} {"train_loss": -12.27294921875, "global_step": 380216, "epoch": 2263} {"train_loss": -12.12624740600586, "global_step": 380217, "epoch": 2263} {"train_loss": -12.21859073638916, "global_step": 380218, "epoch": 2263} {"train_loss": -12.29392147064209, "global_step": 380219, "epoch": 2263} {"train_loss": -12.252096176147461, "global_step": 380220, "epoch": 2263} {"train_loss": -12.093684196472168, "global_step": 380221, "epoch": 2263} {"train_loss": -12.248967170715332, "global_step": 380222, "epoch": 2263} {"train_loss": -12.267353057861328, "global_step": 380223, "epoch": 2263} {"train_loss": -12.568511962890625, "global_step": 380224, "epoch": 2263} {"train_loss": -12.362588882446289, "global_step": 380225, "epoch": 2263} {"train_loss": -12.30308723449707, "global_step": 380226, "epoch": 2263} {"train_loss": -12.192898750305176, "global_step": 380227, "epoch": 2263} {"train_loss": -12.290016174316406, "global_step": 380228, "epoch": 2263} {"train_loss": -12.288888931274414, "global_step": 380229, "epoch": 2263} {"train_loss": -12.3032808303833, "global_step": 380230, "epoch": 2263} {"train_loss": -12.372506141662598, "global_step": 380231, "epoch": 2263} {"train_loss": -12.310330390930176, "global_step": 380232, "epoch": 2263} {"train_loss": -12.238215446472168, "global_step": 380233, "epoch": 2263} {"train_loss": -12.488576889038086, "global_step": 380234, "epoch": 2263} {"train_loss": -12.31035327911377, "global_step": 380235, "epoch": 2263} {"train_loss": -12.535755157470703, "global_step": 380236, "epoch": 2263} {"train_loss": -12.44282341003418, "global_step": 380237, "epoch": 2263} {"train_loss": -12.534379959106445, "global_step": 380238, "epoch": 2263} {"train_loss": -12.403858184814453, "global_step": 380239, "epoch": 2263} {"train_loss": -12.392807006835938, "global_step": 380240, "epoch": 2263} {"train_loss": -12.360002517700195, "global_step": 380241, "epoch": 2263} {"train_loss": -12.255640029907227, "global_step": 380242, "epoch": 2263} {"train_loss": -12.280078887939453, "global_step": 380243, "epoch": 2263} {"train_loss": -12.394535064697266, "global_step": 380244, "epoch": 2263} {"train_loss": -12.167251586914062, "global_step": 380245, "epoch": 2263} {"train_loss": -12.34262466430664, "global_step": 380246, "epoch": 2263} {"train_loss": -12.504732131958008, "global_step": 380247, "epoch": 2263} {"train_loss": -12.266193389892578, "global_step": 380248, "epoch": 2263} {"train_loss": -12.671831130981445, "global_step": 380249, "epoch": 2263} {"train_loss": -12.431123733520508, "global_step": 380250, "epoch": 2263} {"train_loss": -12.311107635498047, "global_step": 380251, "epoch": 2263} {"train_loss": -12.563440322875977, "global_step": 380252, "epoch": 2263} {"train_loss": -12.340102195739746, "global_step": 380253, "epoch": 2263} {"train_loss": -12.755133628845215, "global_step": 380254, "epoch": 2263} {"train_loss": -12.560380935668945, "global_step": 380255, "epoch": 2263} {"train_loss": -12.290728569030762, "global_step": 380256, "epoch": 2263} {"train_loss": -12.677698135375977, "global_step": 380257, "epoch": 2263} {"train_loss": -11.958633422851562, "global_step": 380258, "epoch": 2263} {"train_loss": -12.587743759155273, "global_step": 380259, "epoch": 2263} {"train_loss": -12.700998306274414, "global_step": 380260, "epoch": 2263} {"train_loss": -12.275760650634766, "global_step": 380261, "epoch": 2263} {"train_loss": -12.67020034790039, "global_step": 380262, "epoch": 2263} {"train_loss": -12.481158256530762, "global_step": 380263, "epoch": 2263} {"train_loss": -12.157140731811523, "global_step": 380264, "epoch": 2263} {"train_loss": -12.369829177856445, "global_step": 380265, "epoch": 2263} {"train_loss": -12.593059539794922, "global_step": 380266, "epoch": 2263} {"train_loss": -12.337691307067871, "global_step": 380267, "epoch": 2263} {"train_loss": -12.310493469238281, "global_step": 380268, "epoch": 2263} {"train_loss": -12.432504653930664, "global_step": 380269, "epoch": 2263} {"train_loss": -12.566444396972656, "global_step": 380270, "epoch": 2263} {"train_loss": -12.71721076965332, "global_step": 380271, "epoch": 2263} {"train_loss": -12.487756729125977, "global_step": 380272, "epoch": 2263} {"train_loss": -12.628667831420898, "global_step": 380273, "epoch": 2263} {"train_loss": -12.759326934814453, "global_step": 380274, "epoch": 2263} {"train_loss": -12.397066116333008, "global_step": 380275, "epoch": 2263} {"train_loss": -12.654793739318848, "global_step": 380276, "epoch": 2263} {"train_loss": -12.420721054077148, "global_step": 380277, "epoch": 2263} {"train_loss": -12.468361854553223, "global_step": 380278, "epoch": 2263} {"train_loss": -12.16971492767334, "global_step": 380279, "epoch": 2263} {"train_loss": -12.808287620544434, "global_step": 380280, "epoch": 2263} {"train_loss": -12.335206985473633, "global_step": 380281, "epoch": 2263} {"train_loss": -12.738117218017578, "global_step": 380282, "epoch": 2263} {"train_loss": -12.341218948364258, "global_step": 380283, "epoch": 2263} {"train_loss": -12.450241088867188, "global_step": 380284, "epoch": 2263} {"train_loss": -12.836952209472656, "global_step": 380285, "epoch": 2263} {"train_loss": -12.57223892211914, "global_step": 380286, "epoch": 2263} {"train_loss": -12.605717658996582, "global_step": 380287, "epoch": 2263} {"train_loss": -12.799586296081543, "global_step": 380288, "epoch": 2263} {"train_loss": -12.595705032348633, "global_step": 380289, "epoch": 2263} {"train_loss": -12.236837387084961, "global_step": 380290, "epoch": 2263} {"train_loss": -12.848008155822754, "global_step": 380291, "epoch": 2263} {"train_loss": -12.34980583190918, "global_step": 380292, "epoch": 2263} {"train_loss": -12.294942855834961, "global_step": 380293, "epoch": 2263} {"train_loss": -12.745122909545898, "global_step": 380294, "epoch": 2263} {"train_loss": -12.43427848815918, "global_step": 380295, "epoch": 2263} {"train_loss": -10.810417175292969, "global_step": 380296, "epoch": 2263} {"train_loss": -10.795711517333984, "global_step": 380297, "epoch": 2263} {"train_loss": -11.544441223144531, "global_step": 380298, "epoch": 2263} {"train_loss": -9.691919326782227, "global_step": 380299, "epoch": 2263} {"train_loss": -11.423977851867676, "global_step": 380300, "epoch": 2263} {"train_loss": -8.975130081176758, "global_step": 380301, "epoch": 2263} {"train_loss": -9.3893404006958, "global_step": 380302, "epoch": 2263} {"train_loss": -8.503303527832031, "global_step": 380303, "epoch": 2263} {"train_loss": -11.017993927001953, "global_step": 380304, "epoch": 2263} {"train_loss": -8.474443435668945, "global_step": 380305, "epoch": 2263} {"train_loss": -7.375060081481934, "global_step": 380306, "epoch": 2263} {"train_loss": -9.498735427856445, "global_step": 380307, "epoch": 2263} {"train_loss": -8.775239944458008, "global_step": 380308, "epoch": 2263} {"train_loss": -9.698343276977539, "global_step": 380309, "epoch": 2263} {"train_loss": -9.43919849395752, "global_step": 380310, "epoch": 2263} {"train_loss": -8.441925048828125, "global_step": 380311, "epoch": 2263} {"train_loss": -9.574341773986816, "global_step": 380312, "epoch": 2263} {"train_loss": -10.141647338867188, "global_step": 380313, "epoch": 2263} {"train_loss": -10.46837043762207, "global_step": 380314, "epoch": 2263} {"train_loss": -10.066719055175781, "global_step": 380315, "epoch": 2263} {"train_loss": -11.347105979919434, "global_step": 380316, "epoch": 2263} {"train_loss": -9.988790512084961, "global_step": 380317, "epoch": 2263} {"train_loss": -11.21833324432373, "global_step": 380318, "epoch": 2263} {"train_loss": -11.249306678771973, "global_step": 380319, "epoch": 2263} {"train_loss": -11.017303466796875, "global_step": 380320, "epoch": 2263} {"train_loss": -11.347803115844727, "global_step": 380321, "epoch": 2263} {"train_loss": -11.440814018249512, "global_step": 380322, "epoch": 2263} {"train_loss": -11.397224426269531, "global_step": 380323, "epoch": 2263} {"train_loss": -12.099690437316895, "global_step": 380324, "epoch": 2263} {"train_loss": -11.332597732543945, "global_step": 380325, "epoch": 2263} {"train_loss": -11.600061416625977, "global_step": 380326, "epoch": 2263} {"train_loss": -11.617332458496094, "global_step": 380327, "epoch": 2263} {"train_loss": -12.235570907592773, "global_step": 380328, "epoch": 2263} {"train_loss": -12.010766983032227, "global_step": 380329, "epoch": 2263} {"train_loss": -11.999613761901855, "global_step": 380330, "epoch": 2263} {"train_loss": -11.772191047668457, "global_step": 380331, "epoch": 2263} {"train_loss": -12.351370811462402, "global_step": 380332, "epoch": 2263} {"train_loss": -11.746837615966797, "global_step": 380333, "epoch": 2263} {"train_loss": -12.169212341308594, "global_step": 380334, "epoch": 2263} {"train_loss": -12.115564346313477, "global_step": 380335, "epoch": 2263} {"train_loss": -12.25326919555664, "global_step": 380336, "epoch": 2263} {"train_loss": -12.032462120056152, "global_step": 380337, "epoch": 2263} {"train_loss": -12.15296745300293, "global_step": 380338, "epoch": 2263} {"train_loss": -12.129900932312012, "global_step": 380339, "epoch": 2263} {"train_loss": -12.156615257263184, "global_step": 380340, "epoch": 2263} {"train_loss": -12.012569427490234, "global_step": 380341, "epoch": 2263} {"train_loss": -12.325847625732422, "global_step": 380342, "epoch": 2263} {"train_loss": -12.17999267578125, "global_step": 380343, "epoch": 2263} {"train_loss": -12.041208267211914, "global_step": 380344, "epoch": 2263} {"train_loss": -12.185525894165039, "global_step": 380345, "epoch": 2263} {"train_loss": -12.000507354736328, "global_step": 380346, "epoch": 2263} {"train_loss": -12.556374549865723, "global_step": 380347, "epoch": 2263} {"train_loss": -12.241716384887695, "global_step": 380348, "epoch": 2263} {"train_loss": -12.478658676147461, "global_step": 380349, "epoch": 2263} {"train_loss": -12.134834289550781, "global_step": 380350, "epoch": 2263} {"train_loss": -11.827167079562233, "global_step": 380351, "epoch": 2263, "val_loss": 284455.625} {"train_loss": -12.264605522155762, "global_step": 380352, "epoch": 2264} {"train_loss": -12.011825561523438, "global_step": 380353, "epoch": 2264} {"train_loss": -12.290243148803711, "global_step": 380354, "epoch": 2264} {"train_loss": -12.416608810424805, "global_step": 380355, "epoch": 2264} {"train_loss": -12.39668083190918, "global_step": 380356, "epoch": 2264} {"train_loss": -12.524721145629883, "global_step": 380357, "epoch": 2264} {"train_loss": -12.401397705078125, "global_step": 380358, "epoch": 2264} {"train_loss": -12.345701217651367, "global_step": 380359, "epoch": 2264} {"train_loss": -12.561970710754395, "global_step": 380360, "epoch": 2264} {"train_loss": -12.2919921875, "global_step": 380361, "epoch": 2264} {"train_loss": -12.334663391113281, "global_step": 380362, "epoch": 2264} {"train_loss": -12.528318405151367, "global_step": 380363, "epoch": 2264} {"train_loss": -12.250518798828125, "global_step": 380364, "epoch": 2264} {"train_loss": -12.42798900604248, "global_step": 380365, "epoch": 2264} {"train_loss": -12.409400939941406, "global_step": 380366, "epoch": 2264} {"train_loss": -12.446388244628906, "global_step": 380367, "epoch": 2264} {"train_loss": -12.477824211120605, "global_step": 380368, "epoch": 2264} {"train_loss": -12.314414978027344, "global_step": 380369, "epoch": 2264} {"train_loss": -12.415190696716309, "global_step": 380370, "epoch": 2264} {"train_loss": -12.461036682128906, "global_step": 380371, "epoch": 2264} {"train_loss": -12.614312171936035, "global_step": 380372, "epoch": 2264} {"train_loss": -12.300291061401367, "global_step": 380373, "epoch": 2264} {"train_loss": -12.67798137664795, "global_step": 380374, "epoch": 2264} {"train_loss": -12.513460159301758, "global_step": 380375, "epoch": 2264} {"train_loss": -11.90034294128418, "global_step": 380376, "epoch": 2264} {"train_loss": -12.391317367553711, "global_step": 380377, "epoch": 2264} {"train_loss": -12.48031234741211, "global_step": 380378, "epoch": 2264} {"train_loss": -12.308652877807617, "global_step": 380379, "epoch": 2264} {"train_loss": -12.413269996643066, "global_step": 380380, "epoch": 2264} {"train_loss": -12.366363525390625, "global_step": 380381, "epoch": 2264} {"train_loss": -12.476133346557617, "global_step": 380382, "epoch": 2264} {"train_loss": -12.431446075439453, "global_step": 380383, "epoch": 2264} {"train_loss": -12.417137145996094, "global_step": 380384, "epoch": 2264} {"train_loss": -12.498982429504395, "global_step": 380385, "epoch": 2264} {"train_loss": -12.33658218383789, "global_step": 380386, "epoch": 2264} {"train_loss": -12.089771270751953, "global_step": 380387, "epoch": 2264} {"train_loss": -12.397623062133789, "global_step": 380388, "epoch": 2264} {"train_loss": -12.448417663574219, "global_step": 380389, "epoch": 2264} {"train_loss": -12.311057090759277, "global_step": 380390, "epoch": 2264} {"train_loss": -12.311979293823242, "global_step": 380391, "epoch": 2264} {"train_loss": -12.421308517456055, "global_step": 380392, "epoch": 2264} {"train_loss": -12.406562805175781, "global_step": 380393, "epoch": 2264} {"train_loss": -12.64000129699707, "global_step": 380394, "epoch": 2264} {"train_loss": -12.524699211120605, "global_step": 380395, "epoch": 2264} {"train_loss": -12.068731307983398, "global_step": 380396, "epoch": 2264} {"train_loss": -12.393228530883789, "global_step": 380397, "epoch": 2264} {"train_loss": -12.68416690826416, "global_step": 380398, "epoch": 2264} {"train_loss": -12.547022819519043, "global_step": 380399, "epoch": 2264} {"train_loss": -12.410795211791992, "global_step": 380400, "epoch": 2264} {"train_loss": -12.417630195617676, "global_step": 380401, "epoch": 2264} {"train_loss": -12.456401824951172, "global_step": 380402, "epoch": 2264} {"train_loss": -12.413936614990234, "global_step": 380403, "epoch": 2264} {"train_loss": -12.331618309020996, "global_step": 380404, "epoch": 2264} {"train_loss": -11.00818157196045, "global_step": 380405, "epoch": 2264} {"train_loss": -11.305352210998535, "global_step": 380406, "epoch": 2264} {"train_loss": -11.851834297180176, "global_step": 380407, "epoch": 2264} {"train_loss": -12.159440040588379, "global_step": 380408, "epoch": 2264} {"train_loss": -11.750696182250977, "global_step": 380409, "epoch": 2264} {"train_loss": -11.363380432128906, "global_step": 380410, "epoch": 2264} {"train_loss": -12.201420783996582, "global_step": 380411, "epoch": 2264} {"train_loss": -11.285730361938477, "global_step": 380412, "epoch": 2264} {"train_loss": -10.977631568908691, "global_step": 380413, "epoch": 2264} {"train_loss": -10.790650367736816, "global_step": 380414, "epoch": 2264} {"train_loss": -10.974996566772461, "global_step": 380415, "epoch": 2264} {"train_loss": -10.84686279296875, "global_step": 380416, "epoch": 2264} {"train_loss": -10.336874961853027, "global_step": 380417, "epoch": 2264} {"train_loss": -10.33896541595459, "global_step": 380418, "epoch": 2264} {"train_loss": -8.619625091552734, "global_step": 380419, "epoch": 2264} {"train_loss": -9.374946594238281, "global_step": 380420, "epoch": 2264} {"train_loss": -10.547223091125488, "global_step": 380421, "epoch": 2264} {"train_loss": -10.079957962036133, "global_step": 380422, "epoch": 2264} {"train_loss": -10.4632568359375, "global_step": 380423, "epoch": 2264} {"train_loss": -9.449729919433594, "global_step": 380424, "epoch": 2264} {"train_loss": -11.526268005371094, "global_step": 380425, "epoch": 2264} {"train_loss": -9.786725997924805, "global_step": 380426, "epoch": 2264} {"train_loss": -10.906892776489258, "global_step": 380427, "epoch": 2264} {"train_loss": -10.507026672363281, "global_step": 380428, "epoch": 2264} {"train_loss": -10.193319320678711, "global_step": 380429, "epoch": 2264} {"train_loss": -10.942351341247559, "global_step": 380430, "epoch": 2264} {"train_loss": -11.16508674621582, "global_step": 380431, "epoch": 2264} {"train_loss": -10.936586380004883, "global_step": 380432, "epoch": 2264} {"train_loss": -11.010324478149414, "global_step": 380433, "epoch": 2264} {"train_loss": -11.66128921508789, "global_step": 380434, "epoch": 2264} {"train_loss": -10.87568473815918, "global_step": 380435, "epoch": 2264} {"train_loss": -11.31904411315918, "global_step": 380436, "epoch": 2264} {"train_loss": -10.731804847717285, "global_step": 380437, "epoch": 2264} {"train_loss": -10.943951606750488, "global_step": 380438, "epoch": 2264} {"train_loss": -11.392545700073242, "global_step": 380439, "epoch": 2264} {"train_loss": -11.001012802124023, "global_step": 380440, "epoch": 2264} {"train_loss": -10.888952255249023, "global_step": 380441, "epoch": 2264} {"train_loss": -11.089728355407715, "global_step": 380442, "epoch": 2264} {"train_loss": -11.863882064819336, "global_step": 380443, "epoch": 2264} {"train_loss": -10.961987495422363, "global_step": 380444, "epoch": 2264} {"train_loss": -11.680421829223633, "global_step": 380445, "epoch": 2264} {"train_loss": -11.780008316040039, "global_step": 380446, "epoch": 2264} {"train_loss": -11.633044242858887, "global_step": 380447, "epoch": 2264} {"train_loss": -12.157011985778809, "global_step": 380448, "epoch": 2264} {"train_loss": -11.528629302978516, "global_step": 380449, "epoch": 2264} {"train_loss": -12.05181884765625, "global_step": 380450, "epoch": 2264} {"train_loss": -11.86274528503418, "global_step": 380451, "epoch": 2264} {"train_loss": -11.955536842346191, "global_step": 380452, "epoch": 2264} {"train_loss": -11.99666976928711, "global_step": 380453, "epoch": 2264} {"train_loss": -12.081478118896484, "global_step": 380454, "epoch": 2264} {"train_loss": -12.111845016479492, "global_step": 380455, "epoch": 2264} {"train_loss": -12.229808807373047, "global_step": 380456, "epoch": 2264} {"train_loss": -12.292655944824219, "global_step": 380457, "epoch": 2264} {"train_loss": -12.272536277770996, "global_step": 380458, "epoch": 2264} {"train_loss": -12.308550834655762, "global_step": 380459, "epoch": 2264} {"train_loss": -12.214605331420898, "global_step": 380460, "epoch": 2264} {"train_loss": -12.317642211914062, "global_step": 380461, "epoch": 2264} {"train_loss": -12.27360725402832, "global_step": 380462, "epoch": 2264} {"train_loss": -12.406312942504883, "global_step": 380463, "epoch": 2264} {"train_loss": -12.353523254394531, "global_step": 380464, "epoch": 2264} {"train_loss": -12.4150390625, "global_step": 380465, "epoch": 2264} {"train_loss": -12.190874099731445, "global_step": 380466, "epoch": 2264} {"train_loss": -12.306414604187012, "global_step": 380467, "epoch": 2264} {"train_loss": -12.452048301696777, "global_step": 380468, "epoch": 2264} {"train_loss": -12.40295124053955, "global_step": 380469, "epoch": 2264} {"train_loss": -12.447620391845703, "global_step": 380470, "epoch": 2264} {"train_loss": -12.581711769104004, "global_step": 380471, "epoch": 2264} {"train_loss": -12.313583374023438, "global_step": 380472, "epoch": 2264} {"train_loss": -12.576875686645508, "global_step": 380473, "epoch": 2264} {"train_loss": -12.243715286254883, "global_step": 380474, "epoch": 2264} {"train_loss": -12.420289993286133, "global_step": 380475, "epoch": 2264} {"train_loss": -12.251649856567383, "global_step": 380476, "epoch": 2264} {"train_loss": -12.458970069885254, "global_step": 380477, "epoch": 2264} {"train_loss": -12.308158874511719, "global_step": 380478, "epoch": 2264} {"train_loss": -12.152393341064453, "global_step": 380479, "epoch": 2264} {"train_loss": -12.459810256958008, "global_step": 380480, "epoch": 2264} {"train_loss": -12.452278137207031, "global_step": 380481, "epoch": 2264} {"train_loss": -12.408014297485352, "global_step": 380482, "epoch": 2264} {"train_loss": -12.266956329345703, "global_step": 380483, "epoch": 2264} {"train_loss": -12.390987396240234, "global_step": 380484, "epoch": 2264} {"train_loss": -12.007457733154297, "global_step": 380485, "epoch": 2264} {"train_loss": -12.418277740478516, "global_step": 380486, "epoch": 2264} {"train_loss": -12.188658714294434, "global_step": 380487, "epoch": 2264} {"train_loss": -12.129648208618164, "global_step": 380488, "epoch": 2264} {"train_loss": -12.267602920532227, "global_step": 380489, "epoch": 2264} {"train_loss": -12.19527530670166, "global_step": 380490, "epoch": 2264} {"train_loss": -12.362751960754395, "global_step": 380491, "epoch": 2264} {"train_loss": -12.010498046875, "global_step": 380492, "epoch": 2264} {"train_loss": -12.398807525634766, "global_step": 380493, "epoch": 2264} {"train_loss": -12.100834846496582, "global_step": 380494, "epoch": 2264} {"train_loss": -12.367660522460938, "global_step": 380495, "epoch": 2264} {"train_loss": -12.252388000488281, "global_step": 380496, "epoch": 2264} {"train_loss": -12.168350219726562, "global_step": 380497, "epoch": 2264} {"train_loss": -12.506204605102539, "global_step": 380498, "epoch": 2264} {"train_loss": -12.074104309082031, "global_step": 380499, "epoch": 2264} {"train_loss": -12.036527633666992, "global_step": 380500, "epoch": 2264} {"train_loss": -12.12120532989502, "global_step": 380501, "epoch": 2264} {"train_loss": -11.936674118041992, "global_step": 380502, "epoch": 2264} {"train_loss": -12.42718505859375, "global_step": 380503, "epoch": 2264} {"train_loss": -11.690452575683594, "global_step": 380504, "epoch": 2264} {"train_loss": -11.94854736328125, "global_step": 380505, "epoch": 2264} {"train_loss": -12.230849266052246, "global_step": 380506, "epoch": 2264} {"train_loss": -11.571149826049805, "global_step": 380507, "epoch": 2264} {"train_loss": -12.628456115722656, "global_step": 380508, "epoch": 2264} {"train_loss": -11.8345947265625, "global_step": 380509, "epoch": 2264} {"train_loss": -12.010871887207031, "global_step": 380510, "epoch": 2264} {"train_loss": -11.938307762145996, "global_step": 380511, "epoch": 2264} {"train_loss": -12.373491287231445, "global_step": 380512, "epoch": 2264} {"train_loss": -11.696425437927246, "global_step": 380513, "epoch": 2264} {"train_loss": -11.80329704284668, "global_step": 380514, "epoch": 2264} {"train_loss": -11.927608489990234, "global_step": 380515, "epoch": 2264} {"train_loss": -12.209250450134277, "global_step": 380516, "epoch": 2264} {"train_loss": -12.51069450378418, "global_step": 380517, "epoch": 2264} {"train_loss": -11.918628692626953, "global_step": 380518, "epoch": 2264} {"train_loss": -11.9400463615145, "global_step": 380519, "epoch": 2264, "val_loss": 288386.09375} {"train_loss": -12.286964416503906, "global_step": 380520, "epoch": 2265} {"train_loss": -12.277303695678711, "global_step": 380521, "epoch": 2265} {"train_loss": -11.806194305419922, "global_step": 380522, "epoch": 2265} {"train_loss": -12.184028625488281, "global_step": 380523, "epoch": 2265} {"train_loss": -12.33346939086914, "global_step": 380524, "epoch": 2265} {"train_loss": -11.923643112182617, "global_step": 380525, "epoch": 2265} {"train_loss": -12.379158020019531, "global_step": 380526, "epoch": 2265} {"train_loss": -11.881916999816895, "global_step": 380527, "epoch": 2265} {"train_loss": -11.677572250366211, "global_step": 380528, "epoch": 2265} {"train_loss": -12.380001068115234, "global_step": 380529, "epoch": 2265} {"train_loss": -11.828909873962402, "global_step": 380530, "epoch": 2265} {"train_loss": -12.406936645507812, "global_step": 380531, "epoch": 2265} {"train_loss": -12.08867359161377, "global_step": 380532, "epoch": 2265} {"train_loss": -12.556943893432617, "global_step": 380533, "epoch": 2265} {"train_loss": -11.84842586517334, "global_step": 380534, "epoch": 2265} {"train_loss": -12.42695140838623, "global_step": 380535, "epoch": 2265} {"train_loss": -12.329095840454102, "global_step": 380536, "epoch": 2265} {"train_loss": -11.910432815551758, "global_step": 380537, "epoch": 2265} {"train_loss": -11.85339641571045, "global_step": 380538, "epoch": 2265} {"train_loss": -12.405433654785156, "global_step": 380539, "epoch": 2265} {"train_loss": -12.02518367767334, "global_step": 380540, "epoch": 2265} {"train_loss": -11.985471725463867, "global_step": 380541, "epoch": 2265} {"train_loss": -12.031739234924316, "global_step": 380542, "epoch": 2265} {"train_loss": -12.106224060058594, "global_step": 380543, "epoch": 2265} {"train_loss": -11.37669563293457, "global_step": 380544, "epoch": 2265} {"train_loss": -11.911409378051758, "global_step": 380545, "epoch": 2265} {"train_loss": -11.717164993286133, "global_step": 380546, "epoch": 2265} {"train_loss": -11.534883499145508, "global_step": 380547, "epoch": 2265} {"train_loss": -11.609813690185547, "global_step": 380548, "epoch": 2265} {"train_loss": -11.206686019897461, "global_step": 380549, "epoch": 2265} {"train_loss": -11.284941673278809, "global_step": 380550, "epoch": 2265} {"train_loss": -11.348101615905762, "global_step": 380551, "epoch": 2265} {"train_loss": -11.634862899780273, "global_step": 380552, "epoch": 2265} {"train_loss": -11.063886642456055, "global_step": 380553, "epoch": 2265} {"train_loss": -11.520648002624512, "global_step": 380554, "epoch": 2265} {"train_loss": -10.484512329101562, "global_step": 380555, "epoch": 2265} {"train_loss": -11.31395149230957, "global_step": 380556, "epoch": 2265} {"train_loss": -11.330707550048828, "global_step": 380557, "epoch": 2265} {"train_loss": -10.683734893798828, "global_step": 380558, "epoch": 2265} {"train_loss": -11.919607162475586, "global_step": 380559, "epoch": 2265} {"train_loss": -11.110581398010254, "global_step": 380560, "epoch": 2265} {"train_loss": -11.813352584838867, "global_step": 380561, "epoch": 2265} {"train_loss": -11.812931060791016, "global_step": 380562, "epoch": 2265} {"train_loss": -11.36088752746582, "global_step": 380563, "epoch": 2265} {"train_loss": -12.634147644042969, "global_step": 380564, "epoch": 2265} {"train_loss": -11.758208274841309, "global_step": 380565, "epoch": 2265} {"train_loss": -12.450542449951172, "global_step": 380566, "epoch": 2265} {"train_loss": -12.071020126342773, "global_step": 380567, "epoch": 2265} {"train_loss": -12.14149284362793, "global_step": 380568, "epoch": 2265} {"train_loss": -11.910390853881836, "global_step": 380569, "epoch": 2265} {"train_loss": -11.841743469238281, "global_step": 380570, "epoch": 2265} {"train_loss": -11.994979858398438, "global_step": 380571, "epoch": 2265} {"train_loss": -12.405082702636719, "global_step": 380572, "epoch": 2265} {"train_loss": -12.126258850097656, "global_step": 380573, "epoch": 2265} {"train_loss": -11.953190803527832, "global_step": 380574, "epoch": 2265} {"train_loss": -12.230124473571777, "global_step": 380575, "epoch": 2265} {"train_loss": -11.66046142578125, "global_step": 380576, "epoch": 2265} {"train_loss": -12.3518705368042, "global_step": 380577, "epoch": 2265} {"train_loss": -11.611343383789062, "global_step": 380578, "epoch": 2265} {"train_loss": -12.289752006530762, "global_step": 380579, "epoch": 2265} {"train_loss": -12.099386215209961, "global_step": 380580, "epoch": 2265} {"train_loss": -12.19014835357666, "global_step": 380581, "epoch": 2265} {"train_loss": -12.186849594116211, "global_step": 380582, "epoch": 2265} {"train_loss": -12.55356502532959, "global_step": 380583, "epoch": 2265} {"train_loss": -12.080023765563965, "global_step": 380584, "epoch": 2265} {"train_loss": -12.33889102935791, "global_step": 380585, "epoch": 2265} {"train_loss": -12.122702598571777, "global_step": 380586, "epoch": 2265} {"train_loss": -12.023384094238281, "global_step": 380587, "epoch": 2265} {"train_loss": -12.360445022583008, "global_step": 380588, "epoch": 2265} {"train_loss": -11.632705688476562, "global_step": 380589, "epoch": 2265} {"train_loss": -12.47677993774414, "global_step": 380590, "epoch": 2265} {"train_loss": -12.04426097869873, "global_step": 380591, "epoch": 2265} {"train_loss": -12.222521781921387, "global_step": 380592, "epoch": 2265} {"train_loss": -11.888586044311523, "global_step": 380593, "epoch": 2265} {"train_loss": -12.398616790771484, "global_step": 380594, "epoch": 2265} {"train_loss": -12.450263977050781, "global_step": 380595, "epoch": 2265} {"train_loss": -12.491275787353516, "global_step": 380596, "epoch": 2265} {"train_loss": -12.455971717834473, "global_step": 380597, "epoch": 2265} {"train_loss": -12.636564254760742, "global_step": 380598, "epoch": 2265} {"train_loss": -12.497304916381836, "global_step": 380599, "epoch": 2265} {"train_loss": -12.538919448852539, "global_step": 380600, "epoch": 2265} {"train_loss": -12.656669616699219, "global_step": 380601, "epoch": 2265} {"train_loss": -12.498160362243652, "global_step": 380602, "epoch": 2265} {"train_loss": -12.554821014404297, "global_step": 380603, "epoch": 2265} {"train_loss": -12.547950744628906, "global_step": 380604, "epoch": 2265} {"train_loss": -12.691019058227539, "global_step": 380605, "epoch": 2265} {"train_loss": -12.35641860961914, "global_step": 380606, "epoch": 2265} {"train_loss": -12.499516487121582, "global_step": 380607, "epoch": 2265} {"train_loss": -12.438373565673828, "global_step": 380608, "epoch": 2265} {"train_loss": -12.687066078186035, "global_step": 380609, "epoch": 2265} {"train_loss": -12.54702091217041, "global_step": 380610, "epoch": 2265} {"train_loss": -12.63067626953125, "global_step": 380611, "epoch": 2265} {"train_loss": -12.498952865600586, "global_step": 380612, "epoch": 2265} {"train_loss": -12.778051376342773, "global_step": 380613, "epoch": 2265} {"train_loss": -12.942819595336914, "global_step": 380614, "epoch": 2265} {"train_loss": -12.598592758178711, "global_step": 380615, "epoch": 2265} {"train_loss": -12.31965160369873, "global_step": 380616, "epoch": 2265} {"train_loss": -12.629671096801758, "global_step": 380617, "epoch": 2265} {"train_loss": -12.785111427307129, "global_step": 380618, "epoch": 2265} {"train_loss": -12.628558158874512, "global_step": 380619, "epoch": 2265} {"train_loss": -12.605857849121094, "global_step": 380620, "epoch": 2265} {"train_loss": -12.502096176147461, "global_step": 380621, "epoch": 2265} {"train_loss": -12.425013542175293, "global_step": 380622, "epoch": 2265} {"train_loss": -12.814876556396484, "global_step": 380623, "epoch": 2265} {"train_loss": -12.411674499511719, "global_step": 380624, "epoch": 2265} {"train_loss": -12.692178726196289, "global_step": 380625, "epoch": 2265} {"train_loss": -12.487348556518555, "global_step": 380626, "epoch": 2265} {"train_loss": -12.267751693725586, "global_step": 380627, "epoch": 2265} {"train_loss": -12.515457153320312, "global_step": 380628, "epoch": 2265} {"train_loss": -12.201421737670898, "global_step": 380629, "epoch": 2265} {"train_loss": -12.231058120727539, "global_step": 380630, "epoch": 2265} {"train_loss": -12.225446701049805, "global_step": 380631, "epoch": 2265} {"train_loss": -12.319406509399414, "global_step": 380632, "epoch": 2265} {"train_loss": -11.752820014953613, "global_step": 380633, "epoch": 2265} {"train_loss": -11.910335540771484, "global_step": 380634, "epoch": 2265} {"train_loss": -11.742742538452148, "global_step": 380635, "epoch": 2265} {"train_loss": -12.452144622802734, "global_step": 380636, "epoch": 2265} {"train_loss": -12.661113739013672, "global_step": 380637, "epoch": 2265} {"train_loss": -12.3431396484375, "global_step": 380638, "epoch": 2265} {"train_loss": -12.155158996582031, "global_step": 380639, "epoch": 2265} {"train_loss": -12.160231590270996, "global_step": 380640, "epoch": 2265} {"train_loss": -12.299712181091309, "global_step": 380641, "epoch": 2265} {"train_loss": -12.418806076049805, "global_step": 380642, "epoch": 2265} {"train_loss": -11.967714309692383, "global_step": 380643, "epoch": 2265} {"train_loss": -11.727324485778809, "global_step": 380644, "epoch": 2265} {"train_loss": -11.897465705871582, "global_step": 380645, "epoch": 2265} {"train_loss": -12.651325225830078, "global_step": 380646, "epoch": 2265} {"train_loss": -12.472596168518066, "global_step": 380647, "epoch": 2265} {"train_loss": -12.00904369354248, "global_step": 380648, "epoch": 2265} {"train_loss": -11.772058486938477, "global_step": 380649, "epoch": 2265} {"train_loss": -12.564067840576172, "global_step": 380650, "epoch": 2265} {"train_loss": -11.948503494262695, "global_step": 380651, "epoch": 2265} {"train_loss": -11.363043785095215, "global_step": 380652, "epoch": 2265} {"train_loss": -11.716659545898438, "global_step": 380653, "epoch": 2265} {"train_loss": -11.672988891601562, "global_step": 380654, "epoch": 2265} {"train_loss": -9.72683334350586, "global_step": 380655, "epoch": 2265} {"train_loss": -10.168392181396484, "global_step": 380656, "epoch": 2265} {"train_loss": -10.231759071350098, "global_step": 380657, "epoch": 2265} {"train_loss": -10.93901538848877, "global_step": 380658, "epoch": 2265} {"train_loss": -10.436714172363281, "global_step": 380659, "epoch": 2265} {"train_loss": -10.537211418151855, "global_step": 380660, "epoch": 2265} {"train_loss": -11.083541870117188, "global_step": 380661, "epoch": 2265} {"train_loss": -11.799412727355957, "global_step": 380662, "epoch": 2265} {"train_loss": -11.031543731689453, "global_step": 380663, "epoch": 2265} {"train_loss": -11.551342010498047, "global_step": 380664, "epoch": 2265} {"train_loss": -8.963232040405273, "global_step": 380665, "epoch": 2265} {"train_loss": -8.008515357971191, "global_step": 380666, "epoch": 2265} {"train_loss": -8.152623176574707, "global_step": 380667, "epoch": 2265} {"train_loss": -7.931828022003174, "global_step": 380668, "epoch": 2265} {"train_loss": -8.312265396118164, "global_step": 380669, "epoch": 2265} {"train_loss": -9.215930938720703, "global_step": 380670, "epoch": 2265} {"train_loss": -8.708526611328125, "global_step": 380671, "epoch": 2265} {"train_loss": -8.939140319824219, "global_step": 380672, "epoch": 2265} {"train_loss": -8.661249160766602, "global_step": 380673, "epoch": 2265} {"train_loss": -8.615066528320312, "global_step": 380674, "epoch": 2265} {"train_loss": -9.266953468322754, "global_step": 380675, "epoch": 2265} {"train_loss": -8.147594451904297, "global_step": 380676, "epoch": 2265} {"train_loss": -9.498929977416992, "global_step": 380677, "epoch": 2265} {"train_loss": -10.001980781555176, "global_step": 380678, "epoch": 2265} {"train_loss": -9.501779556274414, "global_step": 380679, "epoch": 2265} {"train_loss": -9.947502136230469, "global_step": 380680, "epoch": 2265} {"train_loss": -10.216354370117188, "global_step": 380681, "epoch": 2265} {"train_loss": -10.98892593383789, "global_step": 380682, "epoch": 2265} {"train_loss": -10.588600158691406, "global_step": 380683, "epoch": 2265} {"train_loss": -11.204012870788574, "global_step": 380684, "epoch": 2265} {"train_loss": -11.239706039428711, "global_step": 380685, "epoch": 2265} {"train_loss": -10.717527389526367, "global_step": 380686, "epoch": 2265} {"train_loss": -11.669700398331596, "global_step": 380687, "epoch": 2265, "val_loss": 288809.28125, "train_action_mse_error": 1.2912847995758057} {"train_loss": -11.348780632019043, "global_step": 380688, "epoch": 2266} {"train_loss": -9.933446884155273, "global_step": 380689, "epoch": 2266} {"train_loss": -11.354970932006836, "global_step": 380690, "epoch": 2266} {"train_loss": -11.151561737060547, "global_step": 380691, "epoch": 2266} {"train_loss": -11.726943016052246, "global_step": 380692, "epoch": 2266} {"train_loss": -11.578014373779297, "global_step": 380693, "epoch": 2266} {"train_loss": -11.291570663452148, "global_step": 380694, "epoch": 2266} {"train_loss": -11.104043960571289, "global_step": 380695, "epoch": 2266} {"train_loss": -11.194963455200195, "global_step": 380696, "epoch": 2266} {"train_loss": -10.8695650100708, "global_step": 380697, "epoch": 2266} {"train_loss": -11.122442245483398, "global_step": 380698, "epoch": 2266} {"train_loss": -10.690776824951172, "global_step": 380699, "epoch": 2266} {"train_loss": -11.824151992797852, "global_step": 380700, "epoch": 2266} {"train_loss": -11.423066139221191, "global_step": 380701, "epoch": 2266} {"train_loss": -11.521623611450195, "global_step": 380702, "epoch": 2266} {"train_loss": -11.778938293457031, "global_step": 380703, "epoch": 2266} {"train_loss": -11.816974639892578, "global_step": 380704, "epoch": 2266} {"train_loss": -11.53718376159668, "global_step": 380705, "epoch": 2266} {"train_loss": -11.868566513061523, "global_step": 380706, "epoch": 2266} {"train_loss": -11.981056213378906, "global_step": 380707, "epoch": 2266} {"train_loss": -11.679540634155273, "global_step": 380708, "epoch": 2266} {"train_loss": -11.879816055297852, "global_step": 380709, "epoch": 2266} {"train_loss": -11.959508895874023, "global_step": 380710, "epoch": 2266} {"train_loss": -12.008382797241211, "global_step": 380711, "epoch": 2266} {"train_loss": -12.022268295288086, "global_step": 380712, "epoch": 2266} {"train_loss": -12.230605125427246, "global_step": 380713, "epoch": 2266} {"train_loss": -12.130605697631836, "global_step": 380714, "epoch": 2266} {"train_loss": -12.035778045654297, "global_step": 380715, "epoch": 2266} {"train_loss": -11.921932220458984, "global_step": 380716, "epoch": 2266} {"train_loss": -11.876775741577148, "global_step": 380717, "epoch": 2266} {"train_loss": -12.394583702087402, "global_step": 380718, "epoch": 2266} {"train_loss": -12.051389694213867, "global_step": 380719, "epoch": 2266} {"train_loss": -12.142218589782715, "global_step": 380720, "epoch": 2266} {"train_loss": -12.062582015991211, "global_step": 380721, "epoch": 2266} {"train_loss": -12.292400360107422, "global_step": 380722, "epoch": 2266} {"train_loss": -12.25918197631836, "global_step": 380723, "epoch": 2266} {"train_loss": -12.331863403320312, "global_step": 380724, "epoch": 2266} {"train_loss": -12.125587463378906, "global_step": 380725, "epoch": 2266} {"train_loss": -12.321821212768555, "global_step": 380726, "epoch": 2266} {"train_loss": -12.305520057678223, "global_step": 380727, "epoch": 2266} {"train_loss": -12.225749969482422, "global_step": 380728, "epoch": 2266} {"train_loss": -12.363910675048828, "global_step": 380729, "epoch": 2266} {"train_loss": -12.479076385498047, "global_step": 380730, "epoch": 2266} {"train_loss": -12.329404830932617, "global_step": 380731, "epoch": 2266} {"train_loss": -12.157186508178711, "global_step": 380732, "epoch": 2266} {"train_loss": -12.212623596191406, "global_step": 380733, "epoch": 2266} {"train_loss": -12.47467041015625, "global_step": 380734, "epoch": 2266} {"train_loss": -12.296320915222168, "global_step": 380735, "epoch": 2266} {"train_loss": -12.472477912902832, "global_step": 380736, "epoch": 2266} {"train_loss": -12.463140487670898, "global_step": 380737, "epoch": 2266} {"train_loss": -12.424337387084961, "global_step": 380738, "epoch": 2266} {"train_loss": -12.437887191772461, "global_step": 380739, "epoch": 2266} {"train_loss": -12.201667785644531, "global_step": 380740, "epoch": 2266} {"train_loss": -12.34040355682373, "global_step": 380741, "epoch": 2266} {"train_loss": -12.28680419921875, "global_step": 380742, "epoch": 2266} {"train_loss": -12.35525894165039, "global_step": 380743, "epoch": 2266} {"train_loss": -12.220813751220703, "global_step": 380744, "epoch": 2266} {"train_loss": -12.636802673339844, "global_step": 380745, "epoch": 2266} {"train_loss": -12.559002876281738, "global_step": 380746, "epoch": 2266} {"train_loss": -12.472169876098633, "global_step": 380747, "epoch": 2266} {"train_loss": -12.486676216125488, "global_step": 380748, "epoch": 2266} {"train_loss": -12.343704223632812, "global_step": 380749, "epoch": 2266} {"train_loss": -12.337823867797852, "global_step": 380750, "epoch": 2266} {"train_loss": -12.410513877868652, "global_step": 380751, "epoch": 2266} {"train_loss": -12.423881530761719, "global_step": 380752, "epoch": 2266} {"train_loss": -12.564427375793457, "global_step": 380753, "epoch": 2266} {"train_loss": -12.454818725585938, "global_step": 380754, "epoch": 2266} {"train_loss": -12.410292625427246, "global_step": 380755, "epoch": 2266} {"train_loss": -12.60317325592041, "global_step": 380756, "epoch": 2266} {"train_loss": -12.559698104858398, "global_step": 380757, "epoch": 2266} {"train_loss": -12.412900924682617, "global_step": 380758, "epoch": 2266} {"train_loss": -12.70237922668457, "global_step": 380759, "epoch": 2266} {"train_loss": -12.602926254272461, "global_step": 380760, "epoch": 2266} {"train_loss": -12.36410140991211, "global_step": 380761, "epoch": 2266} {"train_loss": -12.541143417358398, "global_step": 380762, "epoch": 2266} {"train_loss": -12.47121810913086, "global_step": 380763, "epoch": 2266} {"train_loss": -12.500799179077148, "global_step": 380764, "epoch": 2266} {"train_loss": -12.75355339050293, "global_step": 380765, "epoch": 2266} {"train_loss": -12.47754192352295, "global_step": 380766, "epoch": 2266} {"train_loss": -12.733762741088867, "global_step": 380767, "epoch": 2266} {"train_loss": -12.32944393157959, "global_step": 380768, "epoch": 2266} {"train_loss": -12.710506439208984, "global_step": 380769, "epoch": 2266} {"train_loss": -12.637094497680664, "global_step": 380770, "epoch": 2266} {"train_loss": -12.74737548828125, "global_step": 380771, "epoch": 2266} {"train_loss": -12.650217056274414, "global_step": 380772, "epoch": 2266} {"train_loss": -12.522656440734863, "global_step": 380773, "epoch": 2266} {"train_loss": -12.420429229736328, "global_step": 380774, "epoch": 2266} {"train_loss": -12.7511625289917, "global_step": 380775, "epoch": 2266} {"train_loss": -12.2855224609375, "global_step": 380776, "epoch": 2266} {"train_loss": -12.72773265838623, "global_step": 380777, "epoch": 2266} {"train_loss": -12.744551658630371, "global_step": 380778, "epoch": 2266} {"train_loss": -12.61972427368164, "global_step": 380779, "epoch": 2266} {"train_loss": -12.846055030822754, "global_step": 380780, "epoch": 2266} {"train_loss": -12.684025764465332, "global_step": 380781, "epoch": 2266} {"train_loss": -12.494688034057617, "global_step": 380782, "epoch": 2266} {"train_loss": -12.587984085083008, "global_step": 380783, "epoch": 2266} {"train_loss": -12.541542053222656, "global_step": 380784, "epoch": 2266} {"train_loss": -12.756732940673828, "global_step": 380785, "epoch": 2266} {"train_loss": -12.817517280578613, "global_step": 380786, "epoch": 2266} {"train_loss": -12.804771423339844, "global_step": 380787, "epoch": 2266} {"train_loss": -12.512006759643555, "global_step": 380788, "epoch": 2266} {"train_loss": -12.247014999389648, "global_step": 380789, "epoch": 2266} {"train_loss": -12.369184494018555, "global_step": 380790, "epoch": 2266} {"train_loss": -12.57850456237793, "global_step": 380791, "epoch": 2266} {"train_loss": -12.634681701660156, "global_step": 380792, "epoch": 2266} {"train_loss": -12.489355087280273, "global_step": 380793, "epoch": 2266} {"train_loss": -12.868725776672363, "global_step": 380794, "epoch": 2266} {"train_loss": -12.08006477355957, "global_step": 380795, "epoch": 2266} {"train_loss": -11.837145805358887, "global_step": 380796, "epoch": 2266} {"train_loss": -12.330299377441406, "global_step": 380797, "epoch": 2266} {"train_loss": -11.769210815429688, "global_step": 380798, "epoch": 2266} {"train_loss": -11.954130172729492, "global_step": 380799, "epoch": 2266} {"train_loss": -11.67499828338623, "global_step": 380800, "epoch": 2266} {"train_loss": -11.396239280700684, "global_step": 380801, "epoch": 2266} {"train_loss": -11.25472640991211, "global_step": 380802, "epoch": 2266} {"train_loss": -11.239315032958984, "global_step": 380803, "epoch": 2266} {"train_loss": -11.036857604980469, "global_step": 380804, "epoch": 2266} {"train_loss": -10.184304237365723, "global_step": 380805, "epoch": 2266} {"train_loss": -11.01974105834961, "global_step": 380806, "epoch": 2266} {"train_loss": -10.174196243286133, "global_step": 380807, "epoch": 2266} {"train_loss": -10.97310733795166, "global_step": 380808, "epoch": 2266} {"train_loss": -11.068843841552734, "global_step": 380809, "epoch": 2266} {"train_loss": -9.542501449584961, "global_step": 380810, "epoch": 2266} {"train_loss": -10.503164291381836, "global_step": 380811, "epoch": 2266} {"train_loss": -10.299379348754883, "global_step": 380812, "epoch": 2266} {"train_loss": -11.345499038696289, "global_step": 380813, "epoch": 2266} {"train_loss": -8.367372512817383, "global_step": 380814, "epoch": 2266} {"train_loss": -11.737381935119629, "global_step": 380815, "epoch": 2266} {"train_loss": -9.367740631103516, "global_step": 380816, "epoch": 2266} {"train_loss": -9.960103988647461, "global_step": 380817, "epoch": 2266} {"train_loss": -9.285282135009766, "global_step": 380818, "epoch": 2266} {"train_loss": -11.377837181091309, "global_step": 380819, "epoch": 2266} {"train_loss": -9.055913925170898, "global_step": 380820, "epoch": 2266} {"train_loss": -9.347515106201172, "global_step": 380821, "epoch": 2266} {"train_loss": -8.447196006774902, "global_step": 380822, "epoch": 2266} {"train_loss": -9.265010833740234, "global_step": 380823, "epoch": 2266} {"train_loss": -10.362661361694336, "global_step": 380824, "epoch": 2266} {"train_loss": -10.21291732788086, "global_step": 380825, "epoch": 2266} {"train_loss": -9.867578506469727, "global_step": 380826, "epoch": 2266} {"train_loss": -9.494218826293945, "global_step": 380827, "epoch": 2266} {"train_loss": -10.413671493530273, "global_step": 380828, "epoch": 2266} {"train_loss": -9.858298301696777, "global_step": 380829, "epoch": 2266} {"train_loss": -10.770889282226562, "global_step": 380830, "epoch": 2266} {"train_loss": -9.079163551330566, "global_step": 380831, "epoch": 2266} {"train_loss": -11.222917556762695, "global_step": 380832, "epoch": 2266} {"train_loss": -9.656599044799805, "global_step": 380833, "epoch": 2266} {"train_loss": -10.645633697509766, "global_step": 380834, "epoch": 2266} {"train_loss": -10.7507905960083, "global_step": 380835, "epoch": 2266} {"train_loss": -10.954973220825195, "global_step": 380836, "epoch": 2266} {"train_loss": -10.904809951782227, "global_step": 380837, "epoch": 2266} {"train_loss": -11.005393028259277, "global_step": 380838, "epoch": 2266} {"train_loss": -9.889060974121094, "global_step": 380839, "epoch": 2266} {"train_loss": -10.446327209472656, "global_step": 380840, "epoch": 2266} {"train_loss": -10.347588539123535, "global_step": 380841, "epoch": 2266} {"train_loss": -10.660048484802246, "global_step": 380842, "epoch": 2266} {"train_loss": -10.736930847167969, "global_step": 380843, "epoch": 2266} {"train_loss": -10.033916473388672, "global_step": 380844, "epoch": 2266} {"train_loss": -11.899212837219238, "global_step": 380845, "epoch": 2266} {"train_loss": -10.785805702209473, "global_step": 380846, "epoch": 2266} {"train_loss": -10.753222465515137, "global_step": 380847, "epoch": 2266} {"train_loss": -11.273521423339844, "global_step": 380848, "epoch": 2266} {"train_loss": -11.266572952270508, "global_step": 380849, "epoch": 2266} {"train_loss": -11.176743507385254, "global_step": 380850, "epoch": 2266} {"train_loss": -11.944913864135742, "global_step": 380851, "epoch": 2266} {"train_loss": -11.781400680541992, "global_step": 380852, "epoch": 2266} {"train_loss": -11.820154190063477, "global_step": 380853, "epoch": 2266} {"train_loss": -11.737318992614746, "global_step": 380854, "epoch": 2266} {"train_loss": -11.658262383370172, "global_step": 380855, "epoch": 2266, "val_loss": 289538.8125} {"train_loss": -11.648101806640625, "global_step": 380856, "epoch": 2267} {"train_loss": -12.086215019226074, "global_step": 380857, "epoch": 2267} {"train_loss": -11.986675262451172, "global_step": 380858, "epoch": 2267} {"train_loss": -11.357331275939941, "global_step": 380859, "epoch": 2267} {"train_loss": -11.899555206298828, "global_step": 380860, "epoch": 2267} {"train_loss": -11.679513931274414, "global_step": 380861, "epoch": 2267} {"train_loss": -11.753389358520508, "global_step": 380862, "epoch": 2267} {"train_loss": -11.972639083862305, "global_step": 380863, "epoch": 2267} {"train_loss": -11.911993026733398, "global_step": 380864, "epoch": 2267} {"train_loss": -11.850093841552734, "global_step": 380865, "epoch": 2267} {"train_loss": -12.068279266357422, "global_step": 380866, "epoch": 2267} {"train_loss": -12.108190536499023, "global_step": 380867, "epoch": 2267} {"train_loss": -12.087892532348633, "global_step": 380868, "epoch": 2267} {"train_loss": -12.016122817993164, "global_step": 380869, "epoch": 2267} {"train_loss": -12.116812705993652, "global_step": 380870, "epoch": 2267} {"train_loss": -11.856985092163086, "global_step": 380871, "epoch": 2267} {"train_loss": -12.042139053344727, "global_step": 380872, "epoch": 2267} {"train_loss": -12.175045013427734, "global_step": 380873, "epoch": 2267} {"train_loss": -11.999397277832031, "global_step": 380874, "epoch": 2267} {"train_loss": -11.961731910705566, "global_step": 380875, "epoch": 2267} {"train_loss": -12.053844451904297, "global_step": 380876, "epoch": 2267} {"train_loss": -12.25151252746582, "global_step": 380877, "epoch": 2267} {"train_loss": -12.155414581298828, "global_step": 380878, "epoch": 2267} {"train_loss": -12.068925857543945, "global_step": 380879, "epoch": 2267} {"train_loss": -12.236310005187988, "global_step": 380880, "epoch": 2267} {"train_loss": -12.143731117248535, "global_step": 380881, "epoch": 2267} {"train_loss": -12.314949989318848, "global_step": 380882, "epoch": 2267} {"train_loss": -12.241891860961914, "global_step": 380883, "epoch": 2267} {"train_loss": -12.333441734313965, "global_step": 380884, "epoch": 2267} {"train_loss": -12.475223541259766, "global_step": 380885, "epoch": 2267} {"train_loss": -12.387972831726074, "global_step": 380886, "epoch": 2267} {"train_loss": -12.317883491516113, "global_step": 380887, "epoch": 2267} {"train_loss": -12.595072746276855, "global_step": 380888, "epoch": 2267} {"train_loss": -12.30350112915039, "global_step": 380889, "epoch": 2267} {"train_loss": -12.288224220275879, "global_step": 380890, "epoch": 2267} {"train_loss": -12.447747230529785, "global_step": 380891, "epoch": 2267} {"train_loss": -12.355566024780273, "global_step": 380892, "epoch": 2267} {"train_loss": -12.51225471496582, "global_step": 380893, "epoch": 2267} {"train_loss": -12.246549606323242, "global_step": 380894, "epoch": 2267} {"train_loss": -12.490912437438965, "global_step": 380895, "epoch": 2267} {"train_loss": -12.412121772766113, "global_step": 380896, "epoch": 2267} {"train_loss": -12.566263198852539, "global_step": 380897, "epoch": 2267} {"train_loss": -12.367276191711426, "global_step": 380898, "epoch": 2267} {"train_loss": -12.548053741455078, "global_step": 380899, "epoch": 2267} {"train_loss": -12.571413040161133, "global_step": 380900, "epoch": 2267} {"train_loss": -12.58005142211914, "global_step": 380901, "epoch": 2267} {"train_loss": -12.58237075805664, "global_step": 380902, "epoch": 2267} {"train_loss": -12.654988288879395, "global_step": 380903, "epoch": 2267} {"train_loss": -12.509223937988281, "global_step": 380904, "epoch": 2267} {"train_loss": -12.5536527633667, "global_step": 380905, "epoch": 2267} {"train_loss": -12.629392623901367, "global_step": 380906, "epoch": 2267} {"train_loss": -12.435840606689453, "global_step": 380907, "epoch": 2267} {"train_loss": -12.498990058898926, "global_step": 380908, "epoch": 2267} {"train_loss": -12.492118835449219, "global_step": 380909, "epoch": 2267} {"train_loss": -12.495248794555664, "global_step": 380910, "epoch": 2267} {"train_loss": -12.680780410766602, "global_step": 380911, "epoch": 2267} {"train_loss": -12.65406608581543, "global_step": 380912, "epoch": 2267} {"train_loss": -12.719281196594238, "global_step": 380913, "epoch": 2267} {"train_loss": -12.499597549438477, "global_step": 380914, "epoch": 2267} {"train_loss": -12.634712219238281, "global_step": 380915, "epoch": 2267} {"train_loss": -12.658443450927734, "global_step": 380916, "epoch": 2267} {"train_loss": -12.849233627319336, "global_step": 380917, "epoch": 2267} {"train_loss": -12.723811149597168, "global_step": 380918, "epoch": 2267} {"train_loss": -12.566043853759766, "global_step": 380919, "epoch": 2267} {"train_loss": -12.578829765319824, "global_step": 380920, "epoch": 2267} {"train_loss": -12.640707015991211, "global_step": 380921, "epoch": 2267} {"train_loss": -12.61785888671875, "global_step": 380922, "epoch": 2267} {"train_loss": -12.60379409790039, "global_step": 380923, "epoch": 2267} {"train_loss": -12.50741958618164, "global_step": 380924, "epoch": 2267} {"train_loss": -12.461014747619629, "global_step": 380925, "epoch": 2267} {"train_loss": -12.587987899780273, "global_step": 380926, "epoch": 2267} {"train_loss": -12.32656192779541, "global_step": 380927, "epoch": 2267} {"train_loss": -12.46173095703125, "global_step": 380928, "epoch": 2267} {"train_loss": -12.792187690734863, "global_step": 380929, "epoch": 2267} {"train_loss": -12.283927917480469, "global_step": 380930, "epoch": 2267} {"train_loss": -12.365257263183594, "global_step": 380931, "epoch": 2267} {"train_loss": -12.241719245910645, "global_step": 380932, "epoch": 2267} {"train_loss": -12.527750968933105, "global_step": 380933, "epoch": 2267} {"train_loss": -12.30410099029541, "global_step": 380934, "epoch": 2267} {"train_loss": -12.405462265014648, "global_step": 380935, "epoch": 2267} {"train_loss": -12.576407432556152, "global_step": 380936, "epoch": 2267} {"train_loss": -12.315441131591797, "global_step": 380937, "epoch": 2267} {"train_loss": -11.677876472473145, "global_step": 380938, "epoch": 2267} {"train_loss": -11.420011520385742, "global_step": 380939, "epoch": 2267} {"train_loss": -12.43226146697998, "global_step": 380940, "epoch": 2267} {"train_loss": -12.070170402526855, "global_step": 380941, "epoch": 2267} {"train_loss": -10.249423027038574, "global_step": 380942, "epoch": 2267} {"train_loss": -10.528742790222168, "global_step": 380943, "epoch": 2267} {"train_loss": -12.343830108642578, "global_step": 380944, "epoch": 2267} {"train_loss": -9.882576942443848, "global_step": 380945, "epoch": 2267} {"train_loss": -11.349675178527832, "global_step": 380946, "epoch": 2267} {"train_loss": -12.184589385986328, "global_step": 380947, "epoch": 2267} {"train_loss": -12.129192352294922, "global_step": 380948, "epoch": 2267} {"train_loss": -10.816265106201172, "global_step": 380949, "epoch": 2267} {"train_loss": -11.226632118225098, "global_step": 380950, "epoch": 2267} {"train_loss": -11.066131591796875, "global_step": 380951, "epoch": 2267} {"train_loss": -10.309646606445312, "global_step": 380952, "epoch": 2267} {"train_loss": -10.452197074890137, "global_step": 380953, "epoch": 2267} {"train_loss": -11.32192611694336, "global_step": 380954, "epoch": 2267} {"train_loss": -9.486579895019531, "global_step": 380955, "epoch": 2267} {"train_loss": -10.02485466003418, "global_step": 380956, "epoch": 2267} {"train_loss": -8.475835800170898, "global_step": 380957, "epoch": 2267} {"train_loss": -9.853691101074219, "global_step": 380958, "epoch": 2267} {"train_loss": -10.195422172546387, "global_step": 380959, "epoch": 2267} {"train_loss": -8.143274307250977, "global_step": 380960, "epoch": 2267} {"train_loss": -9.818058013916016, "global_step": 380961, "epoch": 2267} {"train_loss": -8.242879867553711, "global_step": 380962, "epoch": 2267} {"train_loss": -8.43798828125, "global_step": 380963, "epoch": 2267} {"train_loss": -9.529963493347168, "global_step": 380964, "epoch": 2267} {"train_loss": -8.245682716369629, "global_step": 380965, "epoch": 2267} {"train_loss": -11.075596809387207, "global_step": 380966, "epoch": 2267} {"train_loss": -8.711214065551758, "global_step": 380967, "epoch": 2267} {"train_loss": -8.558685302734375, "global_step": 380968, "epoch": 2267} {"train_loss": -9.297025680541992, "global_step": 380969, "epoch": 2267} {"train_loss": -9.348301887512207, "global_step": 380970, "epoch": 2267} {"train_loss": -9.895034790039062, "global_step": 380971, "epoch": 2267} {"train_loss": -8.506128311157227, "global_step": 380972, "epoch": 2267} {"train_loss": -10.10653018951416, "global_step": 380973, "epoch": 2267} {"train_loss": -8.980566024780273, "global_step": 380974, "epoch": 2267} {"train_loss": -8.661359786987305, "global_step": 380975, "epoch": 2267} {"train_loss": -10.212949752807617, "global_step": 380976, "epoch": 2267} {"train_loss": -7.218918323516846, "global_step": 380977, "epoch": 2267} {"train_loss": -7.738541603088379, "global_step": 380978, "epoch": 2267} {"train_loss": -8.670154571533203, "global_step": 380979, "epoch": 2267} {"train_loss": -8.551222801208496, "global_step": 380980, "epoch": 2267} {"train_loss": -8.628501892089844, "global_step": 380981, "epoch": 2267} {"train_loss": -10.628641128540039, "global_step": 380982, "epoch": 2267} {"train_loss": -9.326763153076172, "global_step": 380983, "epoch": 2267} {"train_loss": -10.157381057739258, "global_step": 380984, "epoch": 2267} {"train_loss": -10.678007125854492, "global_step": 380985, "epoch": 2267} {"train_loss": -10.589170455932617, "global_step": 380986, "epoch": 2267} {"train_loss": -10.095237731933594, "global_step": 380987, "epoch": 2267} {"train_loss": -10.475845336914062, "global_step": 380988, "epoch": 2267} {"train_loss": -11.413963317871094, "global_step": 380989, "epoch": 2267} {"train_loss": -10.148723602294922, "global_step": 380990, "epoch": 2267} {"train_loss": -10.987140655517578, "global_step": 380991, "epoch": 2267} {"train_loss": -11.199289321899414, "global_step": 380992, "epoch": 2267} {"train_loss": -11.039115905761719, "global_step": 380993, "epoch": 2267} {"train_loss": -10.85651683807373, "global_step": 380994, "epoch": 2267} {"train_loss": -11.574052810668945, "global_step": 380995, "epoch": 2267} {"train_loss": -11.247285842895508, "global_step": 380996, "epoch": 2267} {"train_loss": -11.1043701171875, "global_step": 380997, "epoch": 2267} {"train_loss": -11.815545082092285, "global_step": 380998, "epoch": 2267} {"train_loss": -11.488380432128906, "global_step": 380999, "epoch": 2267} {"train_loss": -11.217473983764648, "global_step": 381000, "epoch": 2267} {"train_loss": -11.74451732635498, "global_step": 381001, "epoch": 2267} {"train_loss": -11.710721969604492, "global_step": 381002, "epoch": 2267} {"train_loss": -11.40191650390625, "global_step": 381003, "epoch": 2267} {"train_loss": -11.836485862731934, "global_step": 381004, "epoch": 2267} {"train_loss": -11.887628555297852, "global_step": 381005, "epoch": 2267} {"train_loss": -11.803714752197266, "global_step": 381006, "epoch": 2267} {"train_loss": -11.998634338378906, "global_step": 381007, "epoch": 2267} {"train_loss": -11.756284713745117, "global_step": 381008, "epoch": 2267} {"train_loss": -11.749361991882324, "global_step": 381009, "epoch": 2267} {"train_loss": -11.975332260131836, "global_step": 381010, "epoch": 2267} {"train_loss": -11.935476303100586, "global_step": 381011, "epoch": 2267} {"train_loss": -12.038443565368652, "global_step": 381012, "epoch": 2267} {"train_loss": -11.913326263427734, "global_step": 381013, "epoch": 2267} {"train_loss": -11.940287590026855, "global_step": 381014, "epoch": 2267} {"train_loss": -11.929695129394531, "global_step": 381015, "epoch": 2267} {"train_loss": -11.918133735656738, "global_step": 381016, "epoch": 2267} {"train_loss": -12.149940490722656, "global_step": 381017, "epoch": 2267} {"train_loss": -11.988790512084961, "global_step": 381018, "epoch": 2267} {"train_loss": -11.972002029418945, "global_step": 381019, "epoch": 2267} {"train_loss": -11.978252410888672, "global_step": 381020, "epoch": 2267} {"train_loss": -12.186431884765625, "global_step": 381021, "epoch": 2267} {"train_loss": -12.086852073669434, "global_step": 381022, "epoch": 2267} {"train_loss": -11.473287613618941, "global_step": 381023, "epoch": 2267, "val_loss": 294066.875} {"train_loss": -12.158121109008789, "global_step": 381024, "epoch": 2268} {"train_loss": -11.7879638671875, "global_step": 381025, "epoch": 2268} {"train_loss": -12.313800811767578, "global_step": 381026, "epoch": 2268} {"train_loss": -12.091995239257812, "global_step": 381027, "epoch": 2268} {"train_loss": -12.158903121948242, "global_step": 381028, "epoch": 2268} {"train_loss": -12.1939058303833, "global_step": 381029, "epoch": 2268} {"train_loss": -12.06662368774414, "global_step": 381030, "epoch": 2268} {"train_loss": -12.239419937133789, "global_step": 381031, "epoch": 2268} {"train_loss": -12.182565689086914, "global_step": 381032, "epoch": 2268} {"train_loss": -12.12484359741211, "global_step": 381033, "epoch": 2268} {"train_loss": -12.293380737304688, "global_step": 381034, "epoch": 2268} {"train_loss": -12.435364723205566, "global_step": 381035, "epoch": 2268} {"train_loss": -12.080650329589844, "global_step": 381036, "epoch": 2268} {"train_loss": -12.176589012145996, "global_step": 381037, "epoch": 2268} {"train_loss": -12.374536514282227, "global_step": 381038, "epoch": 2268} {"train_loss": -12.073785781860352, "global_step": 381039, "epoch": 2268} {"train_loss": -12.190674781799316, "global_step": 381040, "epoch": 2268} {"train_loss": -12.244205474853516, "global_step": 381041, "epoch": 2268} {"train_loss": -12.400900840759277, "global_step": 381042, "epoch": 2268} {"train_loss": -12.028902053833008, "global_step": 381043, "epoch": 2268} {"train_loss": -12.340149879455566, "global_step": 381044, "epoch": 2268} {"train_loss": -12.021780014038086, "global_step": 381045, "epoch": 2268} {"train_loss": -12.313688278198242, "global_step": 381046, "epoch": 2268} {"train_loss": -12.195262908935547, "global_step": 381047, "epoch": 2268} {"train_loss": -12.296868324279785, "global_step": 381048, "epoch": 2268} {"train_loss": -12.467477798461914, "global_step": 381049, "epoch": 2268} {"train_loss": -12.295746803283691, "global_step": 381050, "epoch": 2268} {"train_loss": -12.321900367736816, "global_step": 381051, "epoch": 2268} {"train_loss": -12.316384315490723, "global_step": 381052, "epoch": 2268} {"train_loss": -12.256896018981934, "global_step": 381053, "epoch": 2268} {"train_loss": -12.344093322753906, "global_step": 381054, "epoch": 2268} {"train_loss": -12.22616958618164, "global_step": 381055, "epoch": 2268} {"train_loss": -12.37090015411377, "global_step": 381056, "epoch": 2268} {"train_loss": -12.290718078613281, "global_step": 381057, "epoch": 2268} {"train_loss": -12.441638946533203, "global_step": 381058, "epoch": 2268} {"train_loss": -12.418243408203125, "global_step": 381059, "epoch": 2268} {"train_loss": -12.548537254333496, "global_step": 381060, "epoch": 2268} {"train_loss": -12.431025505065918, "global_step": 381061, "epoch": 2268} {"train_loss": -12.395381927490234, "global_step": 381062, "epoch": 2268} {"train_loss": -12.39434814453125, "global_step": 381063, "epoch": 2268} {"train_loss": -12.316518783569336, "global_step": 381064, "epoch": 2268} {"train_loss": -12.688497543334961, "global_step": 381065, "epoch": 2268} {"train_loss": -12.161176681518555, "global_step": 381066, "epoch": 2268} {"train_loss": -12.664410591125488, "global_step": 381067, "epoch": 2268} {"train_loss": -11.993927001953125, "global_step": 381068, "epoch": 2268} {"train_loss": -12.45191764831543, "global_step": 381069, "epoch": 2268} {"train_loss": -12.343524932861328, "global_step": 381070, "epoch": 2268} {"train_loss": -12.381782531738281, "global_step": 381071, "epoch": 2268} {"train_loss": -12.464812278747559, "global_step": 381072, "epoch": 2268} {"train_loss": -12.370509147644043, "global_step": 381073, "epoch": 2268} {"train_loss": -12.479944229125977, "global_step": 381074, "epoch": 2268} {"train_loss": -12.51286506652832, "global_step": 381075, "epoch": 2268} {"train_loss": -12.404233932495117, "global_step": 381076, "epoch": 2268} {"train_loss": -12.675382614135742, "global_step": 381077, "epoch": 2268} {"train_loss": -12.72795295715332, "global_step": 381078, "epoch": 2268} {"train_loss": -12.495981216430664, "global_step": 381079, "epoch": 2268} {"train_loss": -12.38708782196045, "global_step": 381080, "epoch": 2268} {"train_loss": -12.473962783813477, "global_step": 381081, "epoch": 2268} {"train_loss": -12.584575653076172, "global_step": 381082, "epoch": 2268} {"train_loss": -12.739395141601562, "global_step": 381083, "epoch": 2268} {"train_loss": -12.647717475891113, "global_step": 381084, "epoch": 2268} {"train_loss": -12.395029067993164, "global_step": 381085, "epoch": 2268} {"train_loss": -12.42355728149414, "global_step": 381086, "epoch": 2268} {"train_loss": -12.546391487121582, "global_step": 381087, "epoch": 2268} {"train_loss": -12.14755916595459, "global_step": 381088, "epoch": 2268} {"train_loss": -12.675092697143555, "global_step": 381089, "epoch": 2268} {"train_loss": -12.484550476074219, "global_step": 381090, "epoch": 2268} {"train_loss": -12.222440719604492, "global_step": 381091, "epoch": 2268} {"train_loss": -12.400873184204102, "global_step": 381092, "epoch": 2268} {"train_loss": -12.456134796142578, "global_step": 381093, "epoch": 2268} {"train_loss": -12.287273406982422, "global_step": 381094, "epoch": 2268} {"train_loss": -11.505127906799316, "global_step": 381095, "epoch": 2268} {"train_loss": -11.741704940795898, "global_step": 381096, "epoch": 2268} {"train_loss": -12.045248031616211, "global_step": 381097, "epoch": 2268} {"train_loss": -12.014208793640137, "global_step": 381098, "epoch": 2268} {"train_loss": -11.765592575073242, "global_step": 381099, "epoch": 2268} {"train_loss": -11.455377578735352, "global_step": 381100, "epoch": 2268} {"train_loss": -12.453594207763672, "global_step": 381101, "epoch": 2268} {"train_loss": -12.497697830200195, "global_step": 381102, "epoch": 2268} {"train_loss": -12.494743347167969, "global_step": 381103, "epoch": 2268} {"train_loss": -12.57832145690918, "global_step": 381104, "epoch": 2268} {"train_loss": -12.734782218933105, "global_step": 381105, "epoch": 2268} {"train_loss": -12.500442504882812, "global_step": 381106, "epoch": 2268} {"train_loss": -12.63591194152832, "global_step": 381107, "epoch": 2268} {"train_loss": -12.222297668457031, "global_step": 381108, "epoch": 2268} {"train_loss": -12.830696105957031, "global_step": 381109, "epoch": 2268} {"train_loss": -12.453789710998535, "global_step": 381110, "epoch": 2268} {"train_loss": -12.363296508789062, "global_step": 381111, "epoch": 2268} {"train_loss": -12.352544784545898, "global_step": 381112, "epoch": 2268} {"train_loss": -12.505935668945312, "global_step": 381113, "epoch": 2268} {"train_loss": -12.18598747253418, "global_step": 381114, "epoch": 2268} {"train_loss": -12.520415306091309, "global_step": 381115, "epoch": 2268} {"train_loss": -12.591707229614258, "global_step": 381116, "epoch": 2268} {"train_loss": -12.440221786499023, "global_step": 381117, "epoch": 2268} {"train_loss": -12.615947723388672, "global_step": 381118, "epoch": 2268} {"train_loss": -12.458178520202637, "global_step": 381119, "epoch": 2268} {"train_loss": -12.581526756286621, "global_step": 381120, "epoch": 2268} {"train_loss": -12.403393745422363, "global_step": 381121, "epoch": 2268} {"train_loss": -12.644798278808594, "global_step": 381122, "epoch": 2268} {"train_loss": -12.741246223449707, "global_step": 381123, "epoch": 2268} {"train_loss": -12.692863464355469, "global_step": 381124, "epoch": 2268} {"train_loss": -12.680265426635742, "global_step": 381125, "epoch": 2268} {"train_loss": -12.51117992401123, "global_step": 381126, "epoch": 2268} {"train_loss": -12.615617752075195, "global_step": 381127, "epoch": 2268} {"train_loss": -12.618305206298828, "global_step": 381128, "epoch": 2268} {"train_loss": -12.299454689025879, "global_step": 381129, "epoch": 2268} {"train_loss": -12.375751495361328, "global_step": 381130, "epoch": 2268} {"train_loss": -12.26248550415039, "global_step": 381131, "epoch": 2268} {"train_loss": -12.6981782913208, "global_step": 381132, "epoch": 2268} {"train_loss": -12.437630653381348, "global_step": 381133, "epoch": 2268} {"train_loss": -12.639538764953613, "global_step": 381134, "epoch": 2268} {"train_loss": -12.413095474243164, "global_step": 381135, "epoch": 2268} {"train_loss": -12.568170547485352, "global_step": 381136, "epoch": 2268} {"train_loss": -12.582371711730957, "global_step": 381137, "epoch": 2268} {"train_loss": -11.846813201904297, "global_step": 381138, "epoch": 2268} {"train_loss": -12.512118339538574, "global_step": 381139, "epoch": 2268} {"train_loss": -12.223388671875, "global_step": 381140, "epoch": 2268} {"train_loss": -12.485689163208008, "global_step": 381141, "epoch": 2268} {"train_loss": -12.245243072509766, "global_step": 381142, "epoch": 2268} {"train_loss": -11.302213668823242, "global_step": 381143, "epoch": 2268} {"train_loss": -10.393497467041016, "global_step": 381144, "epoch": 2268} {"train_loss": -11.338190078735352, "global_step": 381145, "epoch": 2268} {"train_loss": -11.516727447509766, "global_step": 381146, "epoch": 2268} {"train_loss": -11.242783546447754, "global_step": 381147, "epoch": 2268} {"train_loss": -11.656699180603027, "global_step": 381148, "epoch": 2268} {"train_loss": -12.053847312927246, "global_step": 381149, "epoch": 2268} {"train_loss": -11.362564086914062, "global_step": 381150, "epoch": 2268} {"train_loss": -12.193227767944336, "global_step": 381151, "epoch": 2268} {"train_loss": -11.761314392089844, "global_step": 381152, "epoch": 2268} {"train_loss": -11.383161544799805, "global_step": 381153, "epoch": 2268} {"train_loss": -10.905527114868164, "global_step": 381154, "epoch": 2268} {"train_loss": -12.055336952209473, "global_step": 381155, "epoch": 2268} {"train_loss": -11.23373794555664, "global_step": 381156, "epoch": 2268} {"train_loss": -10.45016860961914, "global_step": 381157, "epoch": 2268} {"train_loss": -11.508943557739258, "global_step": 381158, "epoch": 2268} {"train_loss": -9.543730735778809, "global_step": 381159, "epoch": 2268} {"train_loss": -11.809993743896484, "global_step": 381160, "epoch": 2268} {"train_loss": -8.760140419006348, "global_step": 381161, "epoch": 2268} {"train_loss": -10.438859939575195, "global_step": 381162, "epoch": 2268} {"train_loss": -9.518749237060547, "global_step": 381163, "epoch": 2268} {"train_loss": -9.228687286376953, "global_step": 381164, "epoch": 2268} {"train_loss": -11.282586097717285, "global_step": 381165, "epoch": 2268} {"train_loss": -10.30648422241211, "global_step": 381166, "epoch": 2268} {"train_loss": -10.549294471740723, "global_step": 381167, "epoch": 2268} {"train_loss": -10.256725311279297, "global_step": 381168, "epoch": 2268} {"train_loss": -11.627506256103516, "global_step": 381169, "epoch": 2268} {"train_loss": -10.395856857299805, "global_step": 381170, "epoch": 2268} {"train_loss": -11.531242370605469, "global_step": 381171, "epoch": 2268} {"train_loss": -11.362722396850586, "global_step": 381172, "epoch": 2268} {"train_loss": -10.26371955871582, "global_step": 381173, "epoch": 2268} {"train_loss": -12.287327766418457, "global_step": 381174, "epoch": 2268} {"train_loss": -10.97983169555664, "global_step": 381175, "epoch": 2268} {"train_loss": -11.32145881652832, "global_step": 381176, "epoch": 2268} {"train_loss": -12.156048774719238, "global_step": 381177, "epoch": 2268} {"train_loss": -11.584003448486328, "global_step": 381178, "epoch": 2268} {"train_loss": -11.795341491699219, "global_step": 381179, "epoch": 2268} {"train_loss": -11.703904151916504, "global_step": 381180, "epoch": 2268} {"train_loss": -12.053834915161133, "global_step": 381181, "epoch": 2268} {"train_loss": -11.924211502075195, "global_step": 381182, "epoch": 2268} {"train_loss": -12.172943115234375, "global_step": 381183, "epoch": 2268} {"train_loss": -12.210598945617676, "global_step": 381184, "epoch": 2268} {"train_loss": -12.04461669921875, "global_step": 381185, "epoch": 2268} {"train_loss": -12.104418754577637, "global_step": 381186, "epoch": 2268} {"train_loss": -12.182706832885742, "global_step": 381187, "epoch": 2268} {"train_loss": -12.111181259155273, "global_step": 381188, "epoch": 2268} {"train_loss": -12.16405963897705, "global_step": 381189, "epoch": 2268} {"train_loss": -12.255131721496582, "global_step": 381190, "epoch": 2268} {"train_loss": -12.059099736667815, "global_step": 381191, "epoch": 2268, "val_loss": 290118.0} {"train_loss": -11.84516429901123, "global_step": 381192, "epoch": 2269} {"train_loss": -12.203338623046875, "global_step": 381193, "epoch": 2269} {"train_loss": -12.291938781738281, "global_step": 381194, "epoch": 2269} {"train_loss": -11.836128234863281, "global_step": 381195, "epoch": 2269} {"train_loss": -12.245923042297363, "global_step": 381196, "epoch": 2269} {"train_loss": -12.527999877929688, "global_step": 381197, "epoch": 2269} {"train_loss": -12.419775009155273, "global_step": 381198, "epoch": 2269} {"train_loss": -12.309267044067383, "global_step": 381199, "epoch": 2269} {"train_loss": -12.217491149902344, "global_step": 381200, "epoch": 2269} {"train_loss": -12.13209342956543, "global_step": 381201, "epoch": 2269} {"train_loss": -12.32442855834961, "global_step": 381202, "epoch": 2269} {"train_loss": -12.381529808044434, "global_step": 381203, "epoch": 2269} {"train_loss": -12.5068941116333, "global_step": 381204, "epoch": 2269} {"train_loss": -12.299768447875977, "global_step": 381205, "epoch": 2269} {"train_loss": -12.364806175231934, "global_step": 381206, "epoch": 2269} {"train_loss": -12.291096687316895, "global_step": 381207, "epoch": 2269} {"train_loss": -12.299874305725098, "global_step": 381208, "epoch": 2269} {"train_loss": -12.363470077514648, "global_step": 381209, "epoch": 2269} {"train_loss": -12.027647018432617, "global_step": 381210, "epoch": 2269} {"train_loss": -12.533025741577148, "global_step": 381211, "epoch": 2269} {"train_loss": -12.196280479431152, "global_step": 381212, "epoch": 2269} {"train_loss": -12.098560333251953, "global_step": 381213, "epoch": 2269} {"train_loss": -12.315216064453125, "global_step": 381214, "epoch": 2269} {"train_loss": -11.862870216369629, "global_step": 381215, "epoch": 2269} {"train_loss": -12.226030349731445, "global_step": 381216, "epoch": 2269} {"train_loss": -12.534992218017578, "global_step": 381217, "epoch": 2269} {"train_loss": -11.857917785644531, "global_step": 381218, "epoch": 2269} {"train_loss": -12.185260772705078, "global_step": 381219, "epoch": 2269} {"train_loss": -12.311119079589844, "global_step": 381220, "epoch": 2269} {"train_loss": -11.815824508666992, "global_step": 381221, "epoch": 2269} {"train_loss": -12.025920867919922, "global_step": 381222, "epoch": 2269} {"train_loss": -12.304227828979492, "global_step": 381223, "epoch": 2269} {"train_loss": -12.062323570251465, "global_step": 381224, "epoch": 2269} {"train_loss": -12.458120346069336, "global_step": 381225, "epoch": 2269} {"train_loss": -12.424525260925293, "global_step": 381226, "epoch": 2269} {"train_loss": -12.084983825683594, "global_step": 381227, "epoch": 2269} {"train_loss": -12.01577377319336, "global_step": 381228, "epoch": 2269} {"train_loss": -12.248620986938477, "global_step": 381229, "epoch": 2269} {"train_loss": -11.47869873046875, "global_step": 381230, "epoch": 2269} {"train_loss": -12.354469299316406, "global_step": 381231, "epoch": 2269} {"train_loss": -11.716287612915039, "global_step": 381232, "epoch": 2269} {"train_loss": -12.225160598754883, "global_step": 381233, "epoch": 2269} {"train_loss": -11.770781517028809, "global_step": 381234, "epoch": 2269} {"train_loss": -11.92072868347168, "global_step": 381235, "epoch": 2269} {"train_loss": -12.278383255004883, "global_step": 381236, "epoch": 2269} {"train_loss": -11.792332649230957, "global_step": 381237, "epoch": 2269} {"train_loss": -12.445460319519043, "global_step": 381238, "epoch": 2269} {"train_loss": -11.898567199707031, "global_step": 381239, "epoch": 2269} {"train_loss": -12.794239044189453, "global_step": 381240, "epoch": 2269} {"train_loss": -12.237003326416016, "global_step": 381241, "epoch": 2269} {"train_loss": -12.513691902160645, "global_step": 381242, "epoch": 2269} {"train_loss": -12.123086929321289, "global_step": 381243, "epoch": 2269} {"train_loss": -12.156405448913574, "global_step": 381244, "epoch": 2269} {"train_loss": -12.342020988464355, "global_step": 381245, "epoch": 2269} {"train_loss": -12.204699516296387, "global_step": 381246, "epoch": 2269} {"train_loss": -12.487127304077148, "global_step": 381247, "epoch": 2269} {"train_loss": -12.462190628051758, "global_step": 381248, "epoch": 2269} {"train_loss": -12.38632583618164, "global_step": 381249, "epoch": 2269} {"train_loss": -12.455490112304688, "global_step": 381250, "epoch": 2269} {"train_loss": -12.033696174621582, "global_step": 381251, "epoch": 2269} {"train_loss": -12.672164916992188, "global_step": 381252, "epoch": 2269} {"train_loss": -12.395476341247559, "global_step": 381253, "epoch": 2269} {"train_loss": -12.464634895324707, "global_step": 381254, "epoch": 2269} {"train_loss": -12.424150466918945, "global_step": 381255, "epoch": 2269} {"train_loss": -12.153505325317383, "global_step": 381256, "epoch": 2269} {"train_loss": -12.471227645874023, "global_step": 381257, "epoch": 2269} {"train_loss": -12.544961929321289, "global_step": 381258, "epoch": 2269} {"train_loss": -12.06716251373291, "global_step": 381259, "epoch": 2269} {"train_loss": -12.608342170715332, "global_step": 381260, "epoch": 2269} {"train_loss": -11.7058744430542, "global_step": 381261, "epoch": 2269} {"train_loss": -12.132600784301758, "global_step": 381262, "epoch": 2269} {"train_loss": -12.663186073303223, "global_step": 381263, "epoch": 2269} {"train_loss": -12.073362350463867, "global_step": 381264, "epoch": 2269} {"train_loss": -11.656105995178223, "global_step": 381265, "epoch": 2269} {"train_loss": -12.449026107788086, "global_step": 381266, "epoch": 2269} {"train_loss": -11.613462448120117, "global_step": 381267, "epoch": 2269} {"train_loss": -11.906521797180176, "global_step": 381268, "epoch": 2269} {"train_loss": -11.974771499633789, "global_step": 381269, "epoch": 2269} {"train_loss": -11.51301097869873, "global_step": 381270, "epoch": 2269} {"train_loss": -11.182038307189941, "global_step": 381271, "epoch": 2269} {"train_loss": -12.060453414916992, "global_step": 381272, "epoch": 2269} {"train_loss": -11.561593055725098, "global_step": 381273, "epoch": 2269} {"train_loss": -12.421624183654785, "global_step": 381274, "epoch": 2269} {"train_loss": -12.322877883911133, "global_step": 381275, "epoch": 2269} {"train_loss": -12.338788986206055, "global_step": 381276, "epoch": 2269} {"train_loss": -12.298070907592773, "global_step": 381277, "epoch": 2269} {"train_loss": -12.622177124023438, "global_step": 381278, "epoch": 2269} {"train_loss": -12.568058013916016, "global_step": 381279, "epoch": 2269} {"train_loss": -12.309669494628906, "global_step": 381280, "epoch": 2269} {"train_loss": -11.994958877563477, "global_step": 381281, "epoch": 2269} {"train_loss": -12.501752853393555, "global_step": 381282, "epoch": 2269} {"train_loss": -12.667741775512695, "global_step": 381283, "epoch": 2269} {"train_loss": -12.312442779541016, "global_step": 381284, "epoch": 2269} {"train_loss": -12.417978286743164, "global_step": 381285, "epoch": 2269} {"train_loss": -12.42459487915039, "global_step": 381286, "epoch": 2269} {"train_loss": -12.26655387878418, "global_step": 381287, "epoch": 2269} {"train_loss": -12.093361854553223, "global_step": 381288, "epoch": 2269} {"train_loss": -12.575399398803711, "global_step": 381289, "epoch": 2269} {"train_loss": -11.939149856567383, "global_step": 381290, "epoch": 2269} {"train_loss": -12.395073890686035, "global_step": 381291, "epoch": 2269} {"train_loss": -12.316194534301758, "global_step": 381292, "epoch": 2269} {"train_loss": -12.390512466430664, "global_step": 381293, "epoch": 2269} {"train_loss": -12.44028377532959, "global_step": 381294, "epoch": 2269} {"train_loss": -12.335187911987305, "global_step": 381295, "epoch": 2269} {"train_loss": -12.162464141845703, "global_step": 381296, "epoch": 2269} {"train_loss": -11.882562637329102, "global_step": 381297, "epoch": 2269} {"train_loss": -12.656942367553711, "global_step": 381298, "epoch": 2269} {"train_loss": -12.605239868164062, "global_step": 381299, "epoch": 2269} {"train_loss": -11.950197219848633, "global_step": 381300, "epoch": 2269} {"train_loss": -12.527705192565918, "global_step": 381301, "epoch": 2269} {"train_loss": -12.549600601196289, "global_step": 381302, "epoch": 2269} {"train_loss": -12.629659652709961, "global_step": 381303, "epoch": 2269} {"train_loss": -12.653669357299805, "global_step": 381304, "epoch": 2269} {"train_loss": -12.151283264160156, "global_step": 381305, "epoch": 2269} {"train_loss": -12.460657119750977, "global_step": 381306, "epoch": 2269} {"train_loss": -12.482311248779297, "global_step": 381307, "epoch": 2269} {"train_loss": -12.27920913696289, "global_step": 381308, "epoch": 2269} {"train_loss": -12.535831451416016, "global_step": 381309, "epoch": 2269} {"train_loss": -12.596799850463867, "global_step": 381310, "epoch": 2269} {"train_loss": -12.389167785644531, "global_step": 381311, "epoch": 2269} {"train_loss": -12.771028518676758, "global_step": 381312, "epoch": 2269} {"train_loss": -12.624265670776367, "global_step": 381313, "epoch": 2269} {"train_loss": -12.15488052368164, "global_step": 381314, "epoch": 2269} {"train_loss": -12.166881561279297, "global_step": 381315, "epoch": 2269} {"train_loss": -12.75472640991211, "global_step": 381316, "epoch": 2269} {"train_loss": -12.337616920471191, "global_step": 381317, "epoch": 2269} {"train_loss": -12.120002746582031, "global_step": 381318, "epoch": 2269} {"train_loss": -12.126717567443848, "global_step": 381319, "epoch": 2269} {"train_loss": -12.111490249633789, "global_step": 381320, "epoch": 2269} {"train_loss": -12.230812072753906, "global_step": 381321, "epoch": 2269} {"train_loss": -12.445651054382324, "global_step": 381322, "epoch": 2269} {"train_loss": -11.333982467651367, "global_step": 381323, "epoch": 2269} {"train_loss": -11.457817077636719, "global_step": 381324, "epoch": 2269} {"train_loss": -12.205101013183594, "global_step": 381325, "epoch": 2269} {"train_loss": -10.558483123779297, "global_step": 381326, "epoch": 2269} {"train_loss": -12.024750709533691, "global_step": 381327, "epoch": 2269} {"train_loss": -12.283811569213867, "global_step": 381328, "epoch": 2269} {"train_loss": -11.160542488098145, "global_step": 381329, "epoch": 2269} {"train_loss": -10.952178001403809, "global_step": 381330, "epoch": 2269} {"train_loss": -12.407950401306152, "global_step": 381331, "epoch": 2269} {"train_loss": -11.735454559326172, "global_step": 381332, "epoch": 2269} {"train_loss": -12.00810432434082, "global_step": 381333, "epoch": 2269} {"train_loss": -12.105074882507324, "global_step": 381334, "epoch": 2269} {"train_loss": -11.497522354125977, "global_step": 381335, "epoch": 2269} {"train_loss": -10.619678497314453, "global_step": 381336, "epoch": 2269} {"train_loss": -12.046165466308594, "global_step": 381337, "epoch": 2269} {"train_loss": -9.82385540008545, "global_step": 381338, "epoch": 2269} {"train_loss": -9.39513874053955, "global_step": 381339, "epoch": 2269} {"train_loss": -8.783622741699219, "global_step": 381340, "epoch": 2269} {"train_loss": -10.51624870300293, "global_step": 381341, "epoch": 2269} {"train_loss": -8.508772850036621, "global_step": 381342, "epoch": 2269} {"train_loss": -11.278644561767578, "global_step": 381343, "epoch": 2269} {"train_loss": -8.488411903381348, "global_step": 381344, "epoch": 2269} {"train_loss": -10.363009452819824, "global_step": 381345, "epoch": 2269} {"train_loss": -10.22203540802002, "global_step": 381346, "epoch": 2269} {"train_loss": -11.142718315124512, "global_step": 381347, "epoch": 2269} {"train_loss": -11.476057052612305, "global_step": 381348, "epoch": 2269} {"train_loss": -11.590906143188477, "global_step": 381349, "epoch": 2269} {"train_loss": -11.734450340270996, "global_step": 381350, "epoch": 2269} {"train_loss": -10.83318042755127, "global_step": 381351, "epoch": 2269} {"train_loss": -11.571533203125, "global_step": 381352, "epoch": 2269} {"train_loss": -11.134628295898438, "global_step": 381353, "epoch": 2269} {"train_loss": -11.271207809448242, "global_step": 381354, "epoch": 2269} {"train_loss": -11.81662368774414, "global_step": 381355, "epoch": 2269} {"train_loss": -11.38831615447998, "global_step": 381356, "epoch": 2269} {"train_loss": -12.154210090637207, "global_step": 381357, "epoch": 2269} {"train_loss": -11.324882507324219, "global_step": 381358, "epoch": 2269} {"train_loss": -12.001205745197478, "global_step": 381359, "epoch": 2269, "val_loss": 293285.8125} {"train_loss": -11.828263282775879, "global_step": 381360, "epoch": 2270} {"train_loss": -11.765615463256836, "global_step": 381361, "epoch": 2270} {"train_loss": -11.794428825378418, "global_step": 381362, "epoch": 2270} {"train_loss": -11.728950500488281, "global_step": 381363, "epoch": 2270} {"train_loss": -11.68204116821289, "global_step": 381364, "epoch": 2270} {"train_loss": -11.928030014038086, "global_step": 381365, "epoch": 2270} {"train_loss": -12.315670013427734, "global_step": 381366, "epoch": 2270} {"train_loss": -11.56532096862793, "global_step": 381367, "epoch": 2270} {"train_loss": -12.096406936645508, "global_step": 381368, "epoch": 2270} {"train_loss": -11.842941284179688, "global_step": 381369, "epoch": 2270} {"train_loss": -12.22101879119873, "global_step": 381370, "epoch": 2270} {"train_loss": -12.228964805603027, "global_step": 381371, "epoch": 2270} {"train_loss": -11.859947204589844, "global_step": 381372, "epoch": 2270} {"train_loss": -11.973498344421387, "global_step": 381373, "epoch": 2270} {"train_loss": -11.671178817749023, "global_step": 381374, "epoch": 2270} {"train_loss": -12.197385787963867, "global_step": 381375, "epoch": 2270} {"train_loss": -11.775690078735352, "global_step": 381376, "epoch": 2270} {"train_loss": -12.134782791137695, "global_step": 381377, "epoch": 2270} {"train_loss": -11.926025390625, "global_step": 381378, "epoch": 2270} {"train_loss": -11.915742874145508, "global_step": 381379, "epoch": 2270} {"train_loss": -12.137351989746094, "global_step": 381380, "epoch": 2270} {"train_loss": -12.174500465393066, "global_step": 381381, "epoch": 2270} {"train_loss": -12.101160049438477, "global_step": 381382, "epoch": 2270} {"train_loss": -12.337386131286621, "global_step": 381383, "epoch": 2270} {"train_loss": -11.894861221313477, "global_step": 381384, "epoch": 2270} {"train_loss": -12.158214569091797, "global_step": 381385, "epoch": 2270} {"train_loss": -12.265069961547852, "global_step": 381386, "epoch": 2270} {"train_loss": -12.157888412475586, "global_step": 381387, "epoch": 2270} {"train_loss": -12.40865421295166, "global_step": 381388, "epoch": 2270} {"train_loss": -12.126411437988281, "global_step": 381389, "epoch": 2270} {"train_loss": -12.501729965209961, "global_step": 381390, "epoch": 2270} {"train_loss": -12.167991638183594, "global_step": 381391, "epoch": 2270} {"train_loss": -12.35389518737793, "global_step": 381392, "epoch": 2270} {"train_loss": -12.531113624572754, "global_step": 381393, "epoch": 2270} {"train_loss": -12.282754898071289, "global_step": 381394, "epoch": 2270} {"train_loss": -12.466459274291992, "global_step": 381395, "epoch": 2270} {"train_loss": -12.503244400024414, "global_step": 381396, "epoch": 2270} {"train_loss": -12.537150382995605, "global_step": 381397, "epoch": 2270} {"train_loss": -12.620590209960938, "global_step": 381398, "epoch": 2270} {"train_loss": -12.54698371887207, "global_step": 381399, "epoch": 2270} {"train_loss": -12.625410079956055, "global_step": 381400, "epoch": 2270} {"train_loss": -12.348506927490234, "global_step": 381401, "epoch": 2270} {"train_loss": -12.682821273803711, "global_step": 381402, "epoch": 2270} {"train_loss": -12.633888244628906, "global_step": 381403, "epoch": 2270} {"train_loss": -11.945454597473145, "global_step": 381404, "epoch": 2270} {"train_loss": -12.50389289855957, "global_step": 381405, "epoch": 2270} {"train_loss": -12.313821792602539, "global_step": 381406, "epoch": 2270} {"train_loss": -12.28519058227539, "global_step": 381407, "epoch": 2270} {"train_loss": -12.60472297668457, "global_step": 381408, "epoch": 2270} {"train_loss": -12.08777141571045, "global_step": 381409, "epoch": 2270} {"train_loss": -12.523681640625, "global_step": 381410, "epoch": 2270} {"train_loss": -12.625837326049805, "global_step": 381411, "epoch": 2270} {"train_loss": -12.182764053344727, "global_step": 381412, "epoch": 2270} {"train_loss": -12.306343078613281, "global_step": 381413, "epoch": 2270} {"train_loss": -12.71263599395752, "global_step": 381414, "epoch": 2270} {"train_loss": -12.481273651123047, "global_step": 381415, "epoch": 2270} {"train_loss": -12.470518112182617, "global_step": 381416, "epoch": 2270} {"train_loss": -12.503732681274414, "global_step": 381417, "epoch": 2270} {"train_loss": -12.434670448303223, "global_step": 381418, "epoch": 2270} {"train_loss": -12.4646577835083, "global_step": 381419, "epoch": 2270} {"train_loss": -12.214827537536621, "global_step": 381420, "epoch": 2270} {"train_loss": -12.337388038635254, "global_step": 381421, "epoch": 2270} {"train_loss": -12.183489799499512, "global_step": 381422, "epoch": 2270} {"train_loss": -12.290756225585938, "global_step": 381423, "epoch": 2270} {"train_loss": -11.80841064453125, "global_step": 381424, "epoch": 2270} {"train_loss": -11.58355712890625, "global_step": 381425, "epoch": 2270} {"train_loss": -12.587688446044922, "global_step": 381426, "epoch": 2270} {"train_loss": -12.20181655883789, "global_step": 381427, "epoch": 2270} {"train_loss": -11.911114692687988, "global_step": 381428, "epoch": 2270} {"train_loss": -11.95417594909668, "global_step": 381429, "epoch": 2270} {"train_loss": -12.552434921264648, "global_step": 381430, "epoch": 2270} {"train_loss": -12.246599197387695, "global_step": 381431, "epoch": 2270} {"train_loss": -12.148025512695312, "global_step": 381432, "epoch": 2270} {"train_loss": -12.434170722961426, "global_step": 381433, "epoch": 2270} {"train_loss": -11.593155860900879, "global_step": 381434, "epoch": 2270} {"train_loss": -10.809310913085938, "global_step": 381435, "epoch": 2270} {"train_loss": -11.945169448852539, "global_step": 381436, "epoch": 2270} {"train_loss": -11.42141342163086, "global_step": 381437, "epoch": 2270} {"train_loss": -11.762884140014648, "global_step": 381438, "epoch": 2270} {"train_loss": -11.858922958374023, "global_step": 381439, "epoch": 2270} {"train_loss": -11.377306938171387, "global_step": 381440, "epoch": 2270} {"train_loss": -12.190288543701172, "global_step": 381441, "epoch": 2270} {"train_loss": -11.841571807861328, "global_step": 381442, "epoch": 2270} {"train_loss": -11.439411163330078, "global_step": 381443, "epoch": 2270} {"train_loss": -11.831441879272461, "global_step": 381444, "epoch": 2270} {"train_loss": -11.684051513671875, "global_step": 381445, "epoch": 2270} {"train_loss": -11.985773086547852, "global_step": 381446, "epoch": 2270} {"train_loss": -11.59961223602295, "global_step": 381447, "epoch": 2270} {"train_loss": -11.723653793334961, "global_step": 381448, "epoch": 2270} {"train_loss": -10.58999252319336, "global_step": 381449, "epoch": 2270} {"train_loss": -11.841175079345703, "global_step": 381450, "epoch": 2270} {"train_loss": -11.05698013305664, "global_step": 381451, "epoch": 2270} {"train_loss": -10.90227222442627, "global_step": 381452, "epoch": 2270} {"train_loss": -10.061397552490234, "global_step": 381453, "epoch": 2270} {"train_loss": -10.878137588500977, "global_step": 381454, "epoch": 2270} {"train_loss": -10.067218780517578, "global_step": 381455, "epoch": 2270} {"train_loss": -11.34030532836914, "global_step": 381456, "epoch": 2270} {"train_loss": -10.467208862304688, "global_step": 381457, "epoch": 2270} {"train_loss": -11.627859115600586, "global_step": 381458, "epoch": 2270} {"train_loss": -10.967352867126465, "global_step": 381459, "epoch": 2270} {"train_loss": -11.833904266357422, "global_step": 381460, "epoch": 2270} {"train_loss": -10.809114456176758, "global_step": 381461, "epoch": 2270} {"train_loss": -11.990519523620605, "global_step": 381462, "epoch": 2270} {"train_loss": -11.440461158752441, "global_step": 381463, "epoch": 2270} {"train_loss": -11.673291206359863, "global_step": 381464, "epoch": 2270} {"train_loss": -11.762680053710938, "global_step": 381465, "epoch": 2270} {"train_loss": -11.357183456420898, "global_step": 381466, "epoch": 2270} {"train_loss": -12.309745788574219, "global_step": 381467, "epoch": 2270} {"train_loss": -11.335135459899902, "global_step": 381468, "epoch": 2270} {"train_loss": -12.036552429199219, "global_step": 381469, "epoch": 2270} {"train_loss": -11.679686546325684, "global_step": 381470, "epoch": 2270} {"train_loss": -11.788145065307617, "global_step": 381471, "epoch": 2270} {"train_loss": -12.01608657836914, "global_step": 381472, "epoch": 2270} {"train_loss": -11.858165740966797, "global_step": 381473, "epoch": 2270} {"train_loss": -12.293468475341797, "global_step": 381474, "epoch": 2270} {"train_loss": -11.835897445678711, "global_step": 381475, "epoch": 2270} {"train_loss": -12.341066360473633, "global_step": 381476, "epoch": 2270} {"train_loss": -12.016133308410645, "global_step": 381477, "epoch": 2270} {"train_loss": -12.654642105102539, "global_step": 381478, "epoch": 2270} {"train_loss": -12.277546882629395, "global_step": 381479, "epoch": 2270} {"train_loss": -12.039520263671875, "global_step": 381480, "epoch": 2270} {"train_loss": -12.288667678833008, "global_step": 381481, "epoch": 2270} {"train_loss": -12.16998291015625, "global_step": 381482, "epoch": 2270} {"train_loss": -12.434734344482422, "global_step": 381483, "epoch": 2270} {"train_loss": -12.086188316345215, "global_step": 381484, "epoch": 2270} {"train_loss": -12.463094711303711, "global_step": 381485, "epoch": 2270} {"train_loss": -12.335073471069336, "global_step": 381486, "epoch": 2270} {"train_loss": -12.423097610473633, "global_step": 381487, "epoch": 2270} {"train_loss": -12.2977876663208, "global_step": 381488, "epoch": 2270} {"train_loss": -12.504865646362305, "global_step": 381489, "epoch": 2270} {"train_loss": -12.273064613342285, "global_step": 381490, "epoch": 2270} {"train_loss": -12.433717727661133, "global_step": 381491, "epoch": 2270} {"train_loss": -12.383580207824707, "global_step": 381492, "epoch": 2270} {"train_loss": -12.111753463745117, "global_step": 381493, "epoch": 2270} {"train_loss": -12.544724464416504, "global_step": 381494, "epoch": 2270} {"train_loss": -12.252392768859863, "global_step": 381495, "epoch": 2270} {"train_loss": -12.374841690063477, "global_step": 381496, "epoch": 2270} {"train_loss": -12.39100170135498, "global_step": 381497, "epoch": 2270} {"train_loss": -12.328587532043457, "global_step": 381498, "epoch": 2270} {"train_loss": -12.558134078979492, "global_step": 381499, "epoch": 2270} {"train_loss": -12.405937194824219, "global_step": 381500, "epoch": 2270} {"train_loss": -12.557796478271484, "global_step": 381501, "epoch": 2270} {"train_loss": -12.350360870361328, "global_step": 381502, "epoch": 2270} {"train_loss": -12.486747741699219, "global_step": 381503, "epoch": 2270} {"train_loss": -12.308286666870117, "global_step": 381504, "epoch": 2270} {"train_loss": -11.992232322692871, "global_step": 381505, "epoch": 2270} {"train_loss": -12.553964614868164, "global_step": 381506, "epoch": 2270} {"train_loss": -12.345499038696289, "global_step": 381507, "epoch": 2270} {"train_loss": -12.360580444335938, "global_step": 381508, "epoch": 2270} {"train_loss": -12.273026466369629, "global_step": 381509, "epoch": 2270} {"train_loss": -12.239858627319336, "global_step": 381510, "epoch": 2270} {"train_loss": -12.730647087097168, "global_step": 381511, "epoch": 2270} {"train_loss": -12.21625804901123, "global_step": 381512, "epoch": 2270} {"train_loss": -12.623396873474121, "global_step": 381513, "epoch": 2270} {"train_loss": -12.252774238586426, "global_step": 381514, "epoch": 2270} {"train_loss": -12.484989166259766, "global_step": 381515, "epoch": 2270} {"train_loss": -12.298261642456055, "global_step": 381516, "epoch": 2270} {"train_loss": -12.347396850585938, "global_step": 381517, "epoch": 2270} {"train_loss": -12.167076110839844, "global_step": 381518, "epoch": 2270} {"train_loss": -12.24193000793457, "global_step": 381519, "epoch": 2270} {"train_loss": -12.520735740661621, "global_step": 381520, "epoch": 2270} {"train_loss": -12.406049728393555, "global_step": 381521, "epoch": 2270} {"train_loss": -11.904277801513672, "global_step": 381522, "epoch": 2270} {"train_loss": -11.810951232910156, "global_step": 381523, "epoch": 2270} {"train_loss": -12.731351852416992, "global_step": 381524, "epoch": 2270} {"train_loss": -11.548640251159668, "global_step": 381525, "epoch": 2270} {"train_loss": -11.912128448486328, "global_step": 381526, "epoch": 2270} {"train_loss": -12.062947085925511, "global_step": 381527, "epoch": 2270, "val_loss": 294486.6875, "train_action_mse_error": 1.1872408390045166} {"train_loss": -11.606125831604004, "global_step": 381528, "epoch": 2271} {"train_loss": -11.36204719543457, "global_step": 381529, "epoch": 2271} {"train_loss": -11.822565078735352, "global_step": 381530, "epoch": 2271} {"train_loss": -11.659223556518555, "global_step": 381531, "epoch": 2271} {"train_loss": -11.797606468200684, "global_step": 381532, "epoch": 2271} {"train_loss": -11.192904472351074, "global_step": 381533, "epoch": 2271} {"train_loss": -12.062698364257812, "global_step": 381534, "epoch": 2271} {"train_loss": -11.05109977722168, "global_step": 381535, "epoch": 2271} {"train_loss": -10.50509262084961, "global_step": 381536, "epoch": 2271} {"train_loss": -12.20866870880127, "global_step": 381537, "epoch": 2271} {"train_loss": -10.549467086791992, "global_step": 381538, "epoch": 2271} {"train_loss": -11.955841064453125, "global_step": 381539, "epoch": 2271} {"train_loss": -9.705009460449219, "global_step": 381540, "epoch": 2271} {"train_loss": -11.057219505310059, "global_step": 381541, "epoch": 2271} {"train_loss": -10.057165145874023, "global_step": 381542, "epoch": 2271} {"train_loss": -11.034873962402344, "global_step": 381543, "epoch": 2271} {"train_loss": -10.740489959716797, "global_step": 381544, "epoch": 2271} {"train_loss": -10.02044677734375, "global_step": 381545, "epoch": 2271} {"train_loss": -10.858894348144531, "global_step": 381546, "epoch": 2271} {"train_loss": -10.387648582458496, "global_step": 381547, "epoch": 2271} {"train_loss": -9.978034973144531, "global_step": 381548, "epoch": 2271} {"train_loss": -10.510797500610352, "global_step": 381549, "epoch": 2271} {"train_loss": -10.370140075683594, "global_step": 381550, "epoch": 2271} {"train_loss": -9.850699424743652, "global_step": 381551, "epoch": 2271} {"train_loss": -11.03878402709961, "global_step": 381552, "epoch": 2271} {"train_loss": -10.556743621826172, "global_step": 381553, "epoch": 2271} {"train_loss": -11.120298385620117, "global_step": 381554, "epoch": 2271} {"train_loss": -10.960929870605469, "global_step": 381555, "epoch": 2271} {"train_loss": -11.260411262512207, "global_step": 381556, "epoch": 2271} {"train_loss": -10.547393798828125, "global_step": 381557, "epoch": 2271} {"train_loss": -11.318012237548828, "global_step": 381558, "epoch": 2271} {"train_loss": -11.604753494262695, "global_step": 381559, "epoch": 2271} {"train_loss": -11.532533645629883, "global_step": 381560, "epoch": 2271} {"train_loss": -11.558999061584473, "global_step": 381561, "epoch": 2271} {"train_loss": -11.49325942993164, "global_step": 381562, "epoch": 2271} {"train_loss": -11.696784019470215, "global_step": 381563, "epoch": 2271} {"train_loss": -11.820947647094727, "global_step": 381564, "epoch": 2271} {"train_loss": -11.593219757080078, "global_step": 381565, "epoch": 2271} {"train_loss": -11.326759338378906, "global_step": 381566, "epoch": 2271} {"train_loss": -12.119340896606445, "global_step": 381567, "epoch": 2271} {"train_loss": -11.626599311828613, "global_step": 381568, "epoch": 2271} {"train_loss": -12.023918151855469, "global_step": 381569, "epoch": 2271} {"train_loss": -12.108367919921875, "global_step": 381570, "epoch": 2271} {"train_loss": -12.035009384155273, "global_step": 381571, "epoch": 2271} {"train_loss": -12.064465522766113, "global_step": 381572, "epoch": 2271} {"train_loss": -11.659913063049316, "global_step": 381573, "epoch": 2271} {"train_loss": -12.109016418457031, "global_step": 381574, "epoch": 2271} {"train_loss": -11.32994556427002, "global_step": 381575, "epoch": 2271} {"train_loss": -12.143851280212402, "global_step": 381576, "epoch": 2271} {"train_loss": -11.848335266113281, "global_step": 381577, "epoch": 2271} {"train_loss": -11.692914009094238, "global_step": 381578, "epoch": 2271} {"train_loss": -12.050946235656738, "global_step": 381579, "epoch": 2271} {"train_loss": -11.483945846557617, "global_step": 381580, "epoch": 2271} {"train_loss": -12.174535751342773, "global_step": 381581, "epoch": 2271} {"train_loss": -11.72369384765625, "global_step": 381582, "epoch": 2271} {"train_loss": -12.271745681762695, "global_step": 381583, "epoch": 2271} {"train_loss": -12.032520294189453, "global_step": 381584, "epoch": 2271} {"train_loss": -11.818561553955078, "global_step": 381585, "epoch": 2271} {"train_loss": -12.16920280456543, "global_step": 381586, "epoch": 2271} {"train_loss": -11.833000183105469, "global_step": 381587, "epoch": 2271} {"train_loss": -12.169207572937012, "global_step": 381588, "epoch": 2271} {"train_loss": -11.786768913269043, "global_step": 381589, "epoch": 2271} {"train_loss": -12.43916130065918, "global_step": 381590, "epoch": 2271} {"train_loss": -12.014504432678223, "global_step": 381591, "epoch": 2271} {"train_loss": -12.123929977416992, "global_step": 381592, "epoch": 2271} {"train_loss": -12.289032936096191, "global_step": 381593, "epoch": 2271} {"train_loss": -12.228338241577148, "global_step": 381594, "epoch": 2271} {"train_loss": -12.310088157653809, "global_step": 381595, "epoch": 2271} {"train_loss": -12.272842407226562, "global_step": 381596, "epoch": 2271} {"train_loss": -11.995377540588379, "global_step": 381597, "epoch": 2271} {"train_loss": -12.260927200317383, "global_step": 381598, "epoch": 2271} {"train_loss": -12.032258987426758, "global_step": 381599, "epoch": 2271} {"train_loss": -12.271269798278809, "global_step": 381600, "epoch": 2271} {"train_loss": -12.030038833618164, "global_step": 381601, "epoch": 2271} {"train_loss": -12.149646759033203, "global_step": 381602, "epoch": 2271} {"train_loss": -12.19320297241211, "global_step": 381603, "epoch": 2271} {"train_loss": -11.991189956665039, "global_step": 381604, "epoch": 2271} {"train_loss": -12.323148727416992, "global_step": 381605, "epoch": 2271} {"train_loss": -12.306844711303711, "global_step": 381606, "epoch": 2271} {"train_loss": -12.314886093139648, "global_step": 381607, "epoch": 2271} {"train_loss": -12.475321769714355, "global_step": 381608, "epoch": 2271} {"train_loss": -12.467222213745117, "global_step": 381609, "epoch": 2271} {"train_loss": -12.589577674865723, "global_step": 381610, "epoch": 2271} {"train_loss": -12.410951614379883, "global_step": 381611, "epoch": 2271} {"train_loss": -12.572158813476562, "global_step": 381612, "epoch": 2271} {"train_loss": -12.427759170532227, "global_step": 381613, "epoch": 2271} {"train_loss": -12.24451732635498, "global_step": 381614, "epoch": 2271} {"train_loss": -12.631853103637695, "global_step": 381615, "epoch": 2271} {"train_loss": -12.370342254638672, "global_step": 381616, "epoch": 2271} {"train_loss": -12.342473983764648, "global_step": 381617, "epoch": 2271} {"train_loss": -12.432565689086914, "global_step": 381618, "epoch": 2271} {"train_loss": -12.448620796203613, "global_step": 381619, "epoch": 2271} {"train_loss": -12.342991828918457, "global_step": 381620, "epoch": 2271} {"train_loss": -12.614831924438477, "global_step": 381621, "epoch": 2271} {"train_loss": -12.516517639160156, "global_step": 381622, "epoch": 2271} {"train_loss": -12.493293762207031, "global_step": 381623, "epoch": 2271} {"train_loss": -12.495443344116211, "global_step": 381624, "epoch": 2271} {"train_loss": -12.395875930786133, "global_step": 381625, "epoch": 2271} {"train_loss": -12.510760307312012, "global_step": 381626, "epoch": 2271} {"train_loss": -12.389313697814941, "global_step": 381627, "epoch": 2271} {"train_loss": -12.488046646118164, "global_step": 381628, "epoch": 2271} {"train_loss": -12.458763122558594, "global_step": 381629, "epoch": 2271} {"train_loss": -12.623337745666504, "global_step": 381630, "epoch": 2271} {"train_loss": -12.604402542114258, "global_step": 381631, "epoch": 2271} {"train_loss": -12.591163635253906, "global_step": 381632, "epoch": 2271} {"train_loss": -12.63165283203125, "global_step": 381633, "epoch": 2271} {"train_loss": -12.805879592895508, "global_step": 381634, "epoch": 2271} {"train_loss": -12.804844856262207, "global_step": 381635, "epoch": 2271} {"train_loss": -12.540567398071289, "global_step": 381636, "epoch": 2271} {"train_loss": -12.59147834777832, "global_step": 381637, "epoch": 2271} {"train_loss": -12.59189224243164, "global_step": 381638, "epoch": 2271} {"train_loss": -12.573827743530273, "global_step": 381639, "epoch": 2271} {"train_loss": -12.7889404296875, "global_step": 381640, "epoch": 2271} {"train_loss": -12.528206825256348, "global_step": 381641, "epoch": 2271} {"train_loss": -12.588554382324219, "global_step": 381642, "epoch": 2271} {"train_loss": -12.732418060302734, "global_step": 381643, "epoch": 2271} {"train_loss": -12.696112632751465, "global_step": 381644, "epoch": 2271} {"train_loss": -12.811551094055176, "global_step": 381645, "epoch": 2271} {"train_loss": -12.740245819091797, "global_step": 381646, "epoch": 2271} {"train_loss": -12.803369522094727, "global_step": 381647, "epoch": 2271} {"train_loss": -12.788129806518555, "global_step": 381648, "epoch": 2271} {"train_loss": -12.692346572875977, "global_step": 381649, "epoch": 2271} {"train_loss": -12.79696273803711, "global_step": 381650, "epoch": 2271} {"train_loss": -12.562850952148438, "global_step": 381651, "epoch": 2271} {"train_loss": -12.768199920654297, "global_step": 381652, "epoch": 2271} {"train_loss": -12.59554672241211, "global_step": 381653, "epoch": 2271} {"train_loss": -12.60311508178711, "global_step": 381654, "epoch": 2271} {"train_loss": -12.55899429321289, "global_step": 381655, "epoch": 2271} {"train_loss": -12.705204010009766, "global_step": 381656, "epoch": 2271} {"train_loss": -12.339803695678711, "global_step": 381657, "epoch": 2271} {"train_loss": -12.694744110107422, "global_step": 381658, "epoch": 2271} {"train_loss": -12.95798397064209, "global_step": 381659, "epoch": 2271} {"train_loss": -12.452924728393555, "global_step": 381660, "epoch": 2271} {"train_loss": -12.594317436218262, "global_step": 381661, "epoch": 2271} {"train_loss": -12.807296752929688, "global_step": 381662, "epoch": 2271} {"train_loss": -12.646451950073242, "global_step": 381663, "epoch": 2271} {"train_loss": -12.833453178405762, "global_step": 381664, "epoch": 2271} {"train_loss": -12.265189170837402, "global_step": 381665, "epoch": 2271} {"train_loss": -12.27767276763916, "global_step": 381666, "epoch": 2271} {"train_loss": -12.219778060913086, "global_step": 381667, "epoch": 2271} {"train_loss": -11.793843269348145, "global_step": 381668, "epoch": 2271} {"train_loss": -11.919329643249512, "global_step": 381669, "epoch": 2271} {"train_loss": -12.802494049072266, "global_step": 381670, "epoch": 2271} {"train_loss": -11.726337432861328, "global_step": 381671, "epoch": 2271} {"train_loss": -12.107112884521484, "global_step": 381672, "epoch": 2271} {"train_loss": -11.932756423950195, "global_step": 381673, "epoch": 2271} {"train_loss": -12.654550552368164, "global_step": 381674, "epoch": 2271} {"train_loss": -11.946858406066895, "global_step": 381675, "epoch": 2271} {"train_loss": -11.974380493164062, "global_step": 381676, "epoch": 2271} {"train_loss": -11.425966262817383, "global_step": 381677, "epoch": 2271} {"train_loss": -12.725053787231445, "global_step": 381678, "epoch": 2271} {"train_loss": -11.887348175048828, "global_step": 381679, "epoch": 2271} {"train_loss": -12.722171783447266, "global_step": 381680, "epoch": 2271} {"train_loss": -12.164113998413086, "global_step": 381681, "epoch": 2271} {"train_loss": -12.29229736328125, "global_step": 381682, "epoch": 2271} {"train_loss": -11.867562294006348, "global_step": 381683, "epoch": 2271} {"train_loss": -11.793950080871582, "global_step": 381684, "epoch": 2271} {"train_loss": -12.316953659057617, "global_step": 381685, "epoch": 2271} {"train_loss": -12.410649299621582, "global_step": 381686, "epoch": 2271} {"train_loss": -11.591665267944336, "global_step": 381687, "epoch": 2271} {"train_loss": -11.181293487548828, "global_step": 381688, "epoch": 2271} {"train_loss": -12.60000991821289, "global_step": 381689, "epoch": 2271} {"train_loss": -11.739839553833008, "global_step": 381690, "epoch": 2271} {"train_loss": -12.288954734802246, "global_step": 381691, "epoch": 2271} {"train_loss": -12.023387908935547, "global_step": 381692, "epoch": 2271} {"train_loss": -12.120950698852539, "global_step": 381693, "epoch": 2271} {"train_loss": -11.68027114868164, "global_step": 381694, "epoch": 2271} {"train_loss": -12.0124526932126, "global_step": 381695, "epoch": 2271, "val_loss": 294149.0625} {"train_loss": -12.244556427001953, "global_step": 381696, "epoch": 2272} {"train_loss": -11.75467300415039, "global_step": 381697, "epoch": 2272} {"train_loss": -12.287001609802246, "global_step": 381698, "epoch": 2272} {"train_loss": -12.227865219116211, "global_step": 381699, "epoch": 2272} {"train_loss": -11.451498031616211, "global_step": 381700, "epoch": 2272} {"train_loss": -10.863546371459961, "global_step": 381701, "epoch": 2272} {"train_loss": -11.772865295410156, "global_step": 381702, "epoch": 2272} {"train_loss": -9.745463371276855, "global_step": 381703, "epoch": 2272} {"train_loss": -12.170226097106934, "global_step": 381704, "epoch": 2272} {"train_loss": -7.794018745422363, "global_step": 381705, "epoch": 2272} {"train_loss": -9.132406234741211, "global_step": 381706, "epoch": 2272} {"train_loss": -8.561483383178711, "global_step": 381707, "epoch": 2272} {"train_loss": -8.901752471923828, "global_step": 381708, "epoch": 2272} {"train_loss": -10.166959762573242, "global_step": 381709, "epoch": 2272} {"train_loss": -8.899409294128418, "global_step": 381710, "epoch": 2272} {"train_loss": -10.72765064239502, "global_step": 381711, "epoch": 2272} {"train_loss": -10.871074676513672, "global_step": 381712, "epoch": 2272} {"train_loss": -10.414590835571289, "global_step": 381713, "epoch": 2272} {"train_loss": -11.382548332214355, "global_step": 381714, "epoch": 2272} {"train_loss": -10.766363143920898, "global_step": 381715, "epoch": 2272} {"train_loss": -10.405144691467285, "global_step": 381716, "epoch": 2272} {"train_loss": -10.82676887512207, "global_step": 381717, "epoch": 2272} {"train_loss": -11.205049514770508, "global_step": 381718, "epoch": 2272} {"train_loss": -11.487242698669434, "global_step": 381719, "epoch": 2272} {"train_loss": -11.70804214477539, "global_step": 381720, "epoch": 2272} {"train_loss": -11.802717208862305, "global_step": 381721, "epoch": 2272} {"train_loss": -11.691158294677734, "global_step": 381722, "epoch": 2272} {"train_loss": -11.93846321105957, "global_step": 381723, "epoch": 2272} {"train_loss": -11.402887344360352, "global_step": 381724, "epoch": 2272} {"train_loss": -11.9578857421875, "global_step": 381725, "epoch": 2272} {"train_loss": -11.663089752197266, "global_step": 381726, "epoch": 2272} {"train_loss": -11.52298641204834, "global_step": 381727, "epoch": 2272} {"train_loss": -12.247053146362305, "global_step": 381728, "epoch": 2272} {"train_loss": -11.727437973022461, "global_step": 381729, "epoch": 2272} {"train_loss": -11.993268966674805, "global_step": 381730, "epoch": 2272} {"train_loss": -11.407510757446289, "global_step": 381731, "epoch": 2272} {"train_loss": -11.441781044006348, "global_step": 381732, "epoch": 2272} {"train_loss": -11.85002326965332, "global_step": 381733, "epoch": 2272} {"train_loss": -11.299822807312012, "global_step": 381734, "epoch": 2272} {"train_loss": -11.736736297607422, "global_step": 381735, "epoch": 2272} {"train_loss": -12.222175598144531, "global_step": 381736, "epoch": 2272} {"train_loss": -11.806758880615234, "global_step": 381737, "epoch": 2272} {"train_loss": -11.87984848022461, "global_step": 381738, "epoch": 2272} {"train_loss": -12.00938606262207, "global_step": 381739, "epoch": 2272} {"train_loss": -11.887267112731934, "global_step": 381740, "epoch": 2272} {"train_loss": -12.09528636932373, "global_step": 381741, "epoch": 2272} {"train_loss": -11.71477222442627, "global_step": 381742, "epoch": 2272} {"train_loss": -12.01543140411377, "global_step": 381743, "epoch": 2272} {"train_loss": -12.138322830200195, "global_step": 381744, "epoch": 2272} {"train_loss": -12.150995254516602, "global_step": 381745, "epoch": 2272} {"train_loss": -11.969449996948242, "global_step": 381746, "epoch": 2272} {"train_loss": -11.657539367675781, "global_step": 381747, "epoch": 2272} {"train_loss": -11.807504653930664, "global_step": 381748, "epoch": 2272} {"train_loss": -11.520758628845215, "global_step": 381749, "epoch": 2272} {"train_loss": -11.483840942382812, "global_step": 381750, "epoch": 2272} {"train_loss": -12.107353210449219, "global_step": 381751, "epoch": 2272} {"train_loss": -11.749502182006836, "global_step": 381752, "epoch": 2272} {"train_loss": -12.267701148986816, "global_step": 381753, "epoch": 2272} {"train_loss": -12.219304084777832, "global_step": 381754, "epoch": 2272} {"train_loss": -11.969487190246582, "global_step": 381755, "epoch": 2272} {"train_loss": -12.164039611816406, "global_step": 381756, "epoch": 2272} {"train_loss": -11.886384963989258, "global_step": 381757, "epoch": 2272} {"train_loss": -12.067381858825684, "global_step": 381758, "epoch": 2272} {"train_loss": -11.67373275756836, "global_step": 381759, "epoch": 2272} {"train_loss": -12.251219749450684, "global_step": 381760, "epoch": 2272} {"train_loss": -11.770447731018066, "global_step": 381761, "epoch": 2272} {"train_loss": -12.091798782348633, "global_step": 381762, "epoch": 2272} {"train_loss": -12.063057899475098, "global_step": 381763, "epoch": 2272} {"train_loss": -11.781179428100586, "global_step": 381764, "epoch": 2272} {"train_loss": -12.450833320617676, "global_step": 381765, "epoch": 2272} {"train_loss": -11.752973556518555, "global_step": 381766, "epoch": 2272} {"train_loss": -11.972329139709473, "global_step": 381767, "epoch": 2272} {"train_loss": -11.761699676513672, "global_step": 381768, "epoch": 2272} {"train_loss": -12.06091022491455, "global_step": 381769, "epoch": 2272} {"train_loss": -11.843876838684082, "global_step": 381770, "epoch": 2272} {"train_loss": -11.87299919128418, "global_step": 381771, "epoch": 2272} {"train_loss": -12.329970359802246, "global_step": 381772, "epoch": 2272} {"train_loss": -11.757254600524902, "global_step": 381773, "epoch": 2272} {"train_loss": -12.222824096679688, "global_step": 381774, "epoch": 2272} {"train_loss": -11.973149299621582, "global_step": 381775, "epoch": 2272} {"train_loss": -12.25669002532959, "global_step": 381776, "epoch": 2272} {"train_loss": -11.988138198852539, "global_step": 381777, "epoch": 2272} {"train_loss": -12.35187816619873, "global_step": 381778, "epoch": 2272} {"train_loss": -11.860261917114258, "global_step": 381779, "epoch": 2272} {"train_loss": -12.425105094909668, "global_step": 381780, "epoch": 2272} {"train_loss": -12.352607727050781, "global_step": 381781, "epoch": 2272} {"train_loss": -12.26443862915039, "global_step": 381782, "epoch": 2272} {"train_loss": -12.414487838745117, "global_step": 381783, "epoch": 2272} {"train_loss": -12.182548522949219, "global_step": 381784, "epoch": 2272} {"train_loss": -12.304045677185059, "global_step": 381785, "epoch": 2272} {"train_loss": -12.08568286895752, "global_step": 381786, "epoch": 2272} {"train_loss": -12.409430503845215, "global_step": 381787, "epoch": 2272} {"train_loss": -12.291803359985352, "global_step": 381788, "epoch": 2272} {"train_loss": -12.31933879852295, "global_step": 381789, "epoch": 2272} {"train_loss": -12.323287963867188, "global_step": 381790, "epoch": 2272} {"train_loss": -12.196084976196289, "global_step": 381791, "epoch": 2272} {"train_loss": -12.255916595458984, "global_step": 381792, "epoch": 2272} {"train_loss": -12.28433895111084, "global_step": 381793, "epoch": 2272} {"train_loss": -12.242061614990234, "global_step": 381794, "epoch": 2272} {"train_loss": -12.29334831237793, "global_step": 381795, "epoch": 2272} {"train_loss": -12.14423942565918, "global_step": 381796, "epoch": 2272} {"train_loss": -12.397706031799316, "global_step": 381797, "epoch": 2272} {"train_loss": -12.263282775878906, "global_step": 381798, "epoch": 2272} {"train_loss": -12.337650299072266, "global_step": 381799, "epoch": 2272} {"train_loss": -12.507402420043945, "global_step": 381800, "epoch": 2272} {"train_loss": -12.318193435668945, "global_step": 381801, "epoch": 2272} {"train_loss": -12.316948890686035, "global_step": 381802, "epoch": 2272} {"train_loss": -12.358078002929688, "global_step": 381803, "epoch": 2272} {"train_loss": -12.160242080688477, "global_step": 381804, "epoch": 2272} {"train_loss": -12.345914840698242, "global_step": 381805, "epoch": 2272} {"train_loss": -12.34366512298584, "global_step": 381806, "epoch": 2272} {"train_loss": -12.206043243408203, "global_step": 381807, "epoch": 2272} {"train_loss": -12.180904388427734, "global_step": 381808, "epoch": 2272} {"train_loss": -12.535961151123047, "global_step": 381809, "epoch": 2272} {"train_loss": -11.981084823608398, "global_step": 381810, "epoch": 2272} {"train_loss": -12.080625534057617, "global_step": 381811, "epoch": 2272} {"train_loss": -12.363337516784668, "global_step": 381812, "epoch": 2272} {"train_loss": -12.383037567138672, "global_step": 381813, "epoch": 2272} {"train_loss": -11.76369571685791, "global_step": 381814, "epoch": 2272} {"train_loss": -12.253776550292969, "global_step": 381815, "epoch": 2272} {"train_loss": -12.448491096496582, "global_step": 381816, "epoch": 2272} {"train_loss": -12.228618621826172, "global_step": 381817, "epoch": 2272} {"train_loss": -11.465693473815918, "global_step": 381818, "epoch": 2272} {"train_loss": -12.222953796386719, "global_step": 381819, "epoch": 2272} {"train_loss": -12.288908004760742, "global_step": 381820, "epoch": 2272} {"train_loss": -11.359219551086426, "global_step": 381821, "epoch": 2272} {"train_loss": -11.36880874633789, "global_step": 381822, "epoch": 2272} {"train_loss": -11.627737045288086, "global_step": 381823, "epoch": 2272} {"train_loss": -9.53011417388916, "global_step": 381824, "epoch": 2272} {"train_loss": -10.887290954589844, "global_step": 381825, "epoch": 2272} {"train_loss": -9.979969024658203, "global_step": 381826, "epoch": 2272} {"train_loss": -11.59178352355957, "global_step": 381827, "epoch": 2272} {"train_loss": -10.267765998840332, "global_step": 381828, "epoch": 2272} {"train_loss": -12.169944763183594, "global_step": 381829, "epoch": 2272} {"train_loss": -10.467243194580078, "global_step": 381830, "epoch": 2272} {"train_loss": -11.391093254089355, "global_step": 381831, "epoch": 2272} {"train_loss": -12.138011932373047, "global_step": 381832, "epoch": 2272} {"train_loss": -11.248087882995605, "global_step": 381833, "epoch": 2272} {"train_loss": -11.637737274169922, "global_step": 381834, "epoch": 2272} {"train_loss": -11.301790237426758, "global_step": 381835, "epoch": 2272} {"train_loss": -11.71735954284668, "global_step": 381836, "epoch": 2272} {"train_loss": -11.749404907226562, "global_step": 381837, "epoch": 2272} {"train_loss": -11.383129119873047, "global_step": 381838, "epoch": 2272} {"train_loss": -11.630001068115234, "global_step": 381839, "epoch": 2272} {"train_loss": -11.976154327392578, "global_step": 381840, "epoch": 2272} {"train_loss": -11.962812423706055, "global_step": 381841, "epoch": 2272} {"train_loss": -12.008974075317383, "global_step": 381842, "epoch": 2272} {"train_loss": -12.383888244628906, "global_step": 381843, "epoch": 2272} {"train_loss": -11.887619018554688, "global_step": 381844, "epoch": 2272} {"train_loss": -12.33575439453125, "global_step": 381845, "epoch": 2272} {"train_loss": -11.703835487365723, "global_step": 381846, "epoch": 2272} {"train_loss": -12.057759284973145, "global_step": 381847, "epoch": 2272} {"train_loss": -11.5798921585083, "global_step": 381848, "epoch": 2272} {"train_loss": -11.884998321533203, "global_step": 381849, "epoch": 2272} {"train_loss": -11.357879638671875, "global_step": 381850, "epoch": 2272} {"train_loss": -10.752153396606445, "global_step": 381851, "epoch": 2272} {"train_loss": -12.128421783447266, "global_step": 381852, "epoch": 2272} {"train_loss": -10.777156829833984, "global_step": 381853, "epoch": 2272} {"train_loss": -11.678438186645508, "global_step": 381854, "epoch": 2272} {"train_loss": -10.72165298461914, "global_step": 381855, "epoch": 2272} {"train_loss": -11.923271179199219, "global_step": 381856, "epoch": 2272} {"train_loss": -11.691905975341797, "global_step": 381857, "epoch": 2272} {"train_loss": -12.072761535644531, "global_step": 381858, "epoch": 2272} {"train_loss": -11.338485717773438, "global_step": 381859, "epoch": 2272} {"train_loss": -11.97425651550293, "global_step": 381860, "epoch": 2272} {"train_loss": -11.612914085388184, "global_step": 381861, "epoch": 2272} {"train_loss": -11.951119422912598, "global_step": 381862, "epoch": 2272} {"train_loss": -11.714321681431361, "global_step": 381863, "epoch": 2272, "val_loss": 292152.65625} {"train_loss": -11.723243713378906, "global_step": 381864, "epoch": 2273} {"train_loss": -12.126411437988281, "global_step": 381865, "epoch": 2273} {"train_loss": -11.839171409606934, "global_step": 381866, "epoch": 2273} {"train_loss": -12.044024467468262, "global_step": 381867, "epoch": 2273} {"train_loss": -12.19487190246582, "global_step": 381868, "epoch": 2273} {"train_loss": -12.351743698120117, "global_step": 381869, "epoch": 2273} {"train_loss": -12.478306770324707, "global_step": 381870, "epoch": 2273} {"train_loss": -12.307411193847656, "global_step": 381871, "epoch": 2273} {"train_loss": -12.409950256347656, "global_step": 381872, "epoch": 2273} {"train_loss": -12.4691743850708, "global_step": 381873, "epoch": 2273} {"train_loss": -12.380906105041504, "global_step": 381874, "epoch": 2273} {"train_loss": -12.552436828613281, "global_step": 381875, "epoch": 2273} {"train_loss": -12.407356262207031, "global_step": 381876, "epoch": 2273} {"train_loss": -12.428921699523926, "global_step": 381877, "epoch": 2273} {"train_loss": -12.456636428833008, "global_step": 381878, "epoch": 2273} {"train_loss": -12.29716682434082, "global_step": 381879, "epoch": 2273} {"train_loss": -12.612016677856445, "global_step": 381880, "epoch": 2273} {"train_loss": -12.449134826660156, "global_step": 381881, "epoch": 2273} {"train_loss": -12.67203140258789, "global_step": 381882, "epoch": 2273} {"train_loss": -12.441969871520996, "global_step": 381883, "epoch": 2273} {"train_loss": -12.335805892944336, "global_step": 381884, "epoch": 2273} {"train_loss": -12.478759765625, "global_step": 381885, "epoch": 2273} {"train_loss": -12.298221588134766, "global_step": 381886, "epoch": 2273} {"train_loss": -12.208473205566406, "global_step": 381887, "epoch": 2273} {"train_loss": -12.616484642028809, "global_step": 381888, "epoch": 2273} {"train_loss": -12.0306978225708, "global_step": 381889, "epoch": 2273} {"train_loss": -12.457954406738281, "global_step": 381890, "epoch": 2273} {"train_loss": -12.419276237487793, "global_step": 381891, "epoch": 2273} {"train_loss": -12.28122329711914, "global_step": 381892, "epoch": 2273} {"train_loss": -12.187759399414062, "global_step": 381893, "epoch": 2273} {"train_loss": -12.386539459228516, "global_step": 381894, "epoch": 2273} {"train_loss": -12.55976676940918, "global_step": 381895, "epoch": 2273} {"train_loss": -12.458866119384766, "global_step": 381896, "epoch": 2273} {"train_loss": -12.393011093139648, "global_step": 381897, "epoch": 2273} {"train_loss": -12.557587623596191, "global_step": 381898, "epoch": 2273} {"train_loss": -12.740306854248047, "global_step": 381899, "epoch": 2273} {"train_loss": -12.536975860595703, "global_step": 381900, "epoch": 2273} {"train_loss": -12.747782707214355, "global_step": 381901, "epoch": 2273} {"train_loss": -12.575653076171875, "global_step": 381902, "epoch": 2273} {"train_loss": -12.452279090881348, "global_step": 381903, "epoch": 2273} {"train_loss": -12.671560287475586, "global_step": 381904, "epoch": 2273} {"train_loss": -12.555959701538086, "global_step": 381905, "epoch": 2273} {"train_loss": -12.433789253234863, "global_step": 381906, "epoch": 2273} {"train_loss": -12.387375831604004, "global_step": 381907, "epoch": 2273} {"train_loss": -12.8274507522583, "global_step": 381908, "epoch": 2273} {"train_loss": -12.38753604888916, "global_step": 381909, "epoch": 2273} {"train_loss": -12.376256942749023, "global_step": 381910, "epoch": 2273} {"train_loss": -12.441400527954102, "global_step": 381911, "epoch": 2273} {"train_loss": -12.454415321350098, "global_step": 381912, "epoch": 2273} {"train_loss": -12.571683883666992, "global_step": 381913, "epoch": 2273} {"train_loss": -12.508013725280762, "global_step": 381914, "epoch": 2273} {"train_loss": -12.535024642944336, "global_step": 381915, "epoch": 2273} {"train_loss": -12.530998229980469, "global_step": 381916, "epoch": 2273} {"train_loss": -12.546578407287598, "global_step": 381917, "epoch": 2273} {"train_loss": -12.737561225891113, "global_step": 381918, "epoch": 2273} {"train_loss": -12.520238876342773, "global_step": 381919, "epoch": 2273} {"train_loss": -12.595462799072266, "global_step": 381920, "epoch": 2273} {"train_loss": -12.679441452026367, "global_step": 381921, "epoch": 2273} {"train_loss": -12.45187759399414, "global_step": 381922, "epoch": 2273} {"train_loss": -12.635238647460938, "global_step": 381923, "epoch": 2273} {"train_loss": -12.657430648803711, "global_step": 381924, "epoch": 2273} {"train_loss": -12.72599983215332, "global_step": 381925, "epoch": 2273} {"train_loss": -12.471735000610352, "global_step": 381926, "epoch": 2273} {"train_loss": -12.578882217407227, "global_step": 381927, "epoch": 2273} {"train_loss": -12.634090423583984, "global_step": 381928, "epoch": 2273} {"train_loss": -12.455474853515625, "global_step": 381929, "epoch": 2273} {"train_loss": -12.567911148071289, "global_step": 381930, "epoch": 2273} {"train_loss": -12.542657852172852, "global_step": 381931, "epoch": 2273} {"train_loss": -12.471750259399414, "global_step": 381932, "epoch": 2273} {"train_loss": -12.672750473022461, "global_step": 381933, "epoch": 2273} {"train_loss": -12.570355415344238, "global_step": 381934, "epoch": 2273} {"train_loss": -12.596929550170898, "global_step": 381935, "epoch": 2273} {"train_loss": -12.932634353637695, "global_step": 381936, "epoch": 2273} {"train_loss": -12.69836139678955, "global_step": 381937, "epoch": 2273} {"train_loss": -12.59798526763916, "global_step": 381938, "epoch": 2273} {"train_loss": -12.647603034973145, "global_step": 381939, "epoch": 2273} {"train_loss": -12.926812171936035, "global_step": 381940, "epoch": 2273} {"train_loss": -12.946882247924805, "global_step": 381941, "epoch": 2273} {"train_loss": -12.581377983093262, "global_step": 381942, "epoch": 2273} {"train_loss": -12.80824089050293, "global_step": 381943, "epoch": 2273} {"train_loss": -12.745765686035156, "global_step": 381944, "epoch": 2273} {"train_loss": -12.478372573852539, "global_step": 381945, "epoch": 2273} {"train_loss": -12.28451156616211, "global_step": 381946, "epoch": 2273} {"train_loss": -11.993265151977539, "global_step": 381947, "epoch": 2273} {"train_loss": -12.754693984985352, "global_step": 381948, "epoch": 2273} {"train_loss": -12.158578872680664, "global_step": 381949, "epoch": 2273} {"train_loss": -10.637235641479492, "global_step": 381950, "epoch": 2273} {"train_loss": -9.2980375289917, "global_step": 381951, "epoch": 2273} {"train_loss": -11.06591796875, "global_step": 381952, "epoch": 2273} {"train_loss": -8.107295989990234, "global_step": 381953, "epoch": 2273} {"train_loss": -9.025705337524414, "global_step": 381954, "epoch": 2273} {"train_loss": -8.825640678405762, "global_step": 381955, "epoch": 2273} {"train_loss": -11.079385757446289, "global_step": 381956, "epoch": 2273} {"train_loss": -8.658008575439453, "global_step": 381957, "epoch": 2273} {"train_loss": -8.755952835083008, "global_step": 381958, "epoch": 2273} {"train_loss": -9.06674575805664, "global_step": 381959, "epoch": 2273} {"train_loss": -8.918357849121094, "global_step": 381960, "epoch": 2273} {"train_loss": -8.600250244140625, "global_step": 381961, "epoch": 2273} {"train_loss": -9.200794219970703, "global_step": 381962, "epoch": 2273} {"train_loss": -9.301444053649902, "global_step": 381963, "epoch": 2273} {"train_loss": -8.897884368896484, "global_step": 381964, "epoch": 2273} {"train_loss": -8.190933227539062, "global_step": 381965, "epoch": 2273} {"train_loss": -7.751862525939941, "global_step": 381966, "epoch": 2273} {"train_loss": -8.311346054077148, "global_step": 381967, "epoch": 2273} {"train_loss": -8.66574478149414, "global_step": 381968, "epoch": 2273} {"train_loss": -9.077444076538086, "global_step": 381969, "epoch": 2273} {"train_loss": -8.904630661010742, "global_step": 381970, "epoch": 2273} {"train_loss": -9.59939193725586, "global_step": 381971, "epoch": 2273} {"train_loss": -9.201986312866211, "global_step": 381972, "epoch": 2273} {"train_loss": -10.499649047851562, "global_step": 381973, "epoch": 2273} {"train_loss": -10.235512733459473, "global_step": 381974, "epoch": 2273} {"train_loss": -10.176261901855469, "global_step": 381975, "epoch": 2273} {"train_loss": -11.11562728881836, "global_step": 381976, "epoch": 2273} {"train_loss": -9.730692863464355, "global_step": 381977, "epoch": 2273} {"train_loss": -9.913649559020996, "global_step": 381978, "epoch": 2273} {"train_loss": -11.446257591247559, "global_step": 381979, "epoch": 2273} {"train_loss": -9.712159156799316, "global_step": 381980, "epoch": 2273} {"train_loss": -10.599696159362793, "global_step": 381981, "epoch": 2273} {"train_loss": -10.812211990356445, "global_step": 381982, "epoch": 2273} {"train_loss": -9.982446670532227, "global_step": 381983, "epoch": 2273} {"train_loss": -11.13875675201416, "global_step": 381984, "epoch": 2273} {"train_loss": -10.501555442810059, "global_step": 381985, "epoch": 2273} {"train_loss": -10.287824630737305, "global_step": 381986, "epoch": 2273} {"train_loss": -11.708492279052734, "global_step": 381987, "epoch": 2273} {"train_loss": -11.447883605957031, "global_step": 381988, "epoch": 2273} {"train_loss": -11.585823059082031, "global_step": 381989, "epoch": 2273} {"train_loss": -11.724935531616211, "global_step": 381990, "epoch": 2273} {"train_loss": -10.745838165283203, "global_step": 381991, "epoch": 2273} {"train_loss": -11.541162490844727, "global_step": 381992, "epoch": 2273} {"train_loss": -11.669027328491211, "global_step": 381993, "epoch": 2273} {"train_loss": -10.921883583068848, "global_step": 381994, "epoch": 2273} {"train_loss": -11.574395179748535, "global_step": 381995, "epoch": 2273} {"train_loss": -11.326752662658691, "global_step": 381996, "epoch": 2273} {"train_loss": -11.321242332458496, "global_step": 381997, "epoch": 2273} {"train_loss": -11.382790565490723, "global_step": 381998, "epoch": 2273} {"train_loss": -11.110881805419922, "global_step": 381999, "epoch": 2273} {"train_loss": -11.359907150268555, "global_step": 382000, "epoch": 2273} {"train_loss": -10.969914436340332, "global_step": 382001, "epoch": 2273} {"train_loss": -10.919857025146484, "global_step": 382002, "epoch": 2273} {"train_loss": -11.060562133789062, "global_step": 382003, "epoch": 2273} {"train_loss": -10.963204383850098, "global_step": 382004, "epoch": 2273} {"train_loss": -11.935003280639648, "global_step": 382005, "epoch": 2273} {"train_loss": -10.709463119506836, "global_step": 382006, "epoch": 2273} {"train_loss": -12.102167129516602, "global_step": 382007, "epoch": 2273} {"train_loss": -11.285345077514648, "global_step": 382008, "epoch": 2273} {"train_loss": -11.99098014831543, "global_step": 382009, "epoch": 2273} {"train_loss": -11.911903381347656, "global_step": 382010, "epoch": 2273} {"train_loss": -11.641754150390625, "global_step": 382011, "epoch": 2273} {"train_loss": -11.911852836608887, "global_step": 382012, "epoch": 2273} {"train_loss": -12.076753616333008, "global_step": 382013, "epoch": 2273} {"train_loss": -11.880171775817871, "global_step": 382014, "epoch": 2273} {"train_loss": -12.22591781616211, "global_step": 382015, "epoch": 2273} {"train_loss": -11.902941703796387, "global_step": 382016, "epoch": 2273} {"train_loss": -12.143534660339355, "global_step": 382017, "epoch": 2273} {"train_loss": -12.21568775177002, "global_step": 382018, "epoch": 2273} {"train_loss": -11.714010238647461, "global_step": 382019, "epoch": 2273} {"train_loss": -12.093541145324707, "global_step": 382020, "epoch": 2273} {"train_loss": -11.857475280761719, "global_step": 382021, "epoch": 2273} {"train_loss": -12.110260009765625, "global_step": 382022, "epoch": 2273} {"train_loss": -11.852884292602539, "global_step": 382023, "epoch": 2273} {"train_loss": -11.850053787231445, "global_step": 382024, "epoch": 2273} {"train_loss": -12.233461380004883, "global_step": 382025, "epoch": 2273} {"train_loss": -11.884294509887695, "global_step": 382026, "epoch": 2273} {"train_loss": -11.955202102661133, "global_step": 382027, "epoch": 2273} {"train_loss": -12.110945701599121, "global_step": 382028, "epoch": 2273} {"train_loss": -11.798863410949707, "global_step": 382029, "epoch": 2273} {"train_loss": -12.163509368896484, "global_step": 382030, "epoch": 2273} {"train_loss": -11.629144555046445, "global_step": 382031, "epoch": 2273, "val_loss": 292388.625} {"train_loss": -12.05130386352539, "global_step": 382032, "epoch": 2274} {"train_loss": -11.903108596801758, "global_step": 382033, "epoch": 2274} {"train_loss": -11.953865051269531, "global_step": 382034, "epoch": 2274} {"train_loss": -12.060781478881836, "global_step": 382035, "epoch": 2274} {"train_loss": -11.586288452148438, "global_step": 382036, "epoch": 2274} {"train_loss": -12.194209098815918, "global_step": 382037, "epoch": 2274} {"train_loss": -12.001911163330078, "global_step": 382038, "epoch": 2274} {"train_loss": -12.223579406738281, "global_step": 382039, "epoch": 2274} {"train_loss": -12.027414321899414, "global_step": 382040, "epoch": 2274} {"train_loss": -11.927801132202148, "global_step": 382041, "epoch": 2274} {"train_loss": -12.019454956054688, "global_step": 382042, "epoch": 2274} {"train_loss": -12.148492813110352, "global_step": 382043, "epoch": 2274} {"train_loss": -11.727243423461914, "global_step": 382044, "epoch": 2274} {"train_loss": -12.157983779907227, "global_step": 382045, "epoch": 2274} {"train_loss": -11.926050186157227, "global_step": 382046, "epoch": 2274} {"train_loss": -12.221590042114258, "global_step": 382047, "epoch": 2274} {"train_loss": -12.06254768371582, "global_step": 382048, "epoch": 2274} {"train_loss": -12.085610389709473, "global_step": 382049, "epoch": 2274} {"train_loss": -12.080212593078613, "global_step": 382050, "epoch": 2274} {"train_loss": -12.29305648803711, "global_step": 382051, "epoch": 2274} {"train_loss": -11.927131652832031, "global_step": 382052, "epoch": 2274} {"train_loss": -12.325096130371094, "global_step": 382053, "epoch": 2274} {"train_loss": -12.314233779907227, "global_step": 382054, "epoch": 2274} {"train_loss": -12.304512977600098, "global_step": 382055, "epoch": 2274} {"train_loss": -12.276744842529297, "global_step": 382056, "epoch": 2274} {"train_loss": -12.117162704467773, "global_step": 382057, "epoch": 2274} {"train_loss": -12.199573516845703, "global_step": 382058, "epoch": 2274} {"train_loss": -12.117500305175781, "global_step": 382059, "epoch": 2274} {"train_loss": -12.241694450378418, "global_step": 382060, "epoch": 2274} {"train_loss": -12.428081512451172, "global_step": 382061, "epoch": 2274} {"train_loss": -12.071117401123047, "global_step": 382062, "epoch": 2274} {"train_loss": -12.59212589263916, "global_step": 382063, "epoch": 2274} {"train_loss": -11.912941932678223, "global_step": 382064, "epoch": 2274} {"train_loss": -12.586932182312012, "global_step": 382065, "epoch": 2274} {"train_loss": -12.040271759033203, "global_step": 382066, "epoch": 2274} {"train_loss": -12.32641887664795, "global_step": 382067, "epoch": 2274} {"train_loss": -12.323104858398438, "global_step": 382068, "epoch": 2274} {"train_loss": -12.048299789428711, "global_step": 382069, "epoch": 2274} {"train_loss": -12.42837142944336, "global_step": 382070, "epoch": 2274} {"train_loss": -11.849342346191406, "global_step": 382071, "epoch": 2274} {"train_loss": -12.349832534790039, "global_step": 382072, "epoch": 2274} {"train_loss": -12.132148742675781, "global_step": 382073, "epoch": 2274} {"train_loss": -12.367216110229492, "global_step": 382074, "epoch": 2274} {"train_loss": -12.281919479370117, "global_step": 382075, "epoch": 2274} {"train_loss": -12.069494247436523, "global_step": 382076, "epoch": 2274} {"train_loss": -12.508544921875, "global_step": 382077, "epoch": 2274} {"train_loss": -11.749770164489746, "global_step": 382078, "epoch": 2274} {"train_loss": -12.572033882141113, "global_step": 382079, "epoch": 2274} {"train_loss": -12.03048324584961, "global_step": 382080, "epoch": 2274} {"train_loss": -12.32221794128418, "global_step": 382081, "epoch": 2274} {"train_loss": -12.618316650390625, "global_step": 382082, "epoch": 2274} {"train_loss": -11.897300720214844, "global_step": 382083, "epoch": 2274} {"train_loss": -12.302152633666992, "global_step": 382084, "epoch": 2274} {"train_loss": -12.173989295959473, "global_step": 382085, "epoch": 2274} {"train_loss": -12.2406587600708, "global_step": 382086, "epoch": 2274} {"train_loss": -12.475545883178711, "global_step": 382087, "epoch": 2274} {"train_loss": -12.416107177734375, "global_step": 382088, "epoch": 2274} {"train_loss": -12.531850814819336, "global_step": 382089, "epoch": 2274} {"train_loss": -12.307872772216797, "global_step": 382090, "epoch": 2274} {"train_loss": -12.149392127990723, "global_step": 382091, "epoch": 2274} {"train_loss": -12.536386489868164, "global_step": 382092, "epoch": 2274} {"train_loss": -12.516959190368652, "global_step": 382093, "epoch": 2274} {"train_loss": -12.229594230651855, "global_step": 382094, "epoch": 2274} {"train_loss": -12.388788223266602, "global_step": 382095, "epoch": 2274} {"train_loss": -12.0746488571167, "global_step": 382096, "epoch": 2274} {"train_loss": -12.375635147094727, "global_step": 382097, "epoch": 2274} {"train_loss": -12.551387786865234, "global_step": 382098, "epoch": 2274} {"train_loss": -12.505634307861328, "global_step": 382099, "epoch": 2274} {"train_loss": -12.321723937988281, "global_step": 382100, "epoch": 2274} {"train_loss": -12.305623054504395, "global_step": 382101, "epoch": 2274} {"train_loss": -12.481125831604004, "global_step": 382102, "epoch": 2274} {"train_loss": -12.15468978881836, "global_step": 382103, "epoch": 2274} {"train_loss": -12.404797554016113, "global_step": 382104, "epoch": 2274} {"train_loss": -12.360814094543457, "global_step": 382105, "epoch": 2274} {"train_loss": -12.377630233764648, "global_step": 382106, "epoch": 2274} {"train_loss": -12.03271198272705, "global_step": 382107, "epoch": 2274} {"train_loss": -12.536661148071289, "global_step": 382108, "epoch": 2274} {"train_loss": -11.793170928955078, "global_step": 382109, "epoch": 2274} {"train_loss": -12.155170440673828, "global_step": 382110, "epoch": 2274} {"train_loss": -12.346875190734863, "global_step": 382111, "epoch": 2274} {"train_loss": -11.52509593963623, "global_step": 382112, "epoch": 2274} {"train_loss": -12.346158027648926, "global_step": 382113, "epoch": 2274} {"train_loss": -11.23052978515625, "global_step": 382114, "epoch": 2274} {"train_loss": -12.381120681762695, "global_step": 382115, "epoch": 2274} {"train_loss": -11.801065444946289, "global_step": 382116, "epoch": 2274} {"train_loss": -12.198690414428711, "global_step": 382117, "epoch": 2274} {"train_loss": -11.840641975402832, "global_step": 382118, "epoch": 2274} {"train_loss": -11.999130249023438, "global_step": 382119, "epoch": 2274} {"train_loss": -12.376160621643066, "global_step": 382120, "epoch": 2274} {"train_loss": -12.452329635620117, "global_step": 382121, "epoch": 2274} {"train_loss": -12.353486061096191, "global_step": 382122, "epoch": 2274} {"train_loss": -11.567277908325195, "global_step": 382123, "epoch": 2274} {"train_loss": -11.255791664123535, "global_step": 382124, "epoch": 2274} {"train_loss": -12.037383079528809, "global_step": 382125, "epoch": 2274} {"train_loss": -11.949463844299316, "global_step": 382126, "epoch": 2274} {"train_loss": -11.488524436950684, "global_step": 382127, "epoch": 2274} {"train_loss": -11.92949390411377, "global_step": 382128, "epoch": 2274} {"train_loss": -12.140442848205566, "global_step": 382129, "epoch": 2274} {"train_loss": -11.226881980895996, "global_step": 382130, "epoch": 2274} {"train_loss": -12.089502334594727, "global_step": 382131, "epoch": 2274} {"train_loss": -12.300763130187988, "global_step": 382132, "epoch": 2274} {"train_loss": -12.120394706726074, "global_step": 382133, "epoch": 2274} {"train_loss": -12.224050521850586, "global_step": 382134, "epoch": 2274} {"train_loss": -11.876945495605469, "global_step": 382135, "epoch": 2274} {"train_loss": -12.052386283874512, "global_step": 382136, "epoch": 2274} {"train_loss": -12.101922988891602, "global_step": 382137, "epoch": 2274} {"train_loss": -11.931947708129883, "global_step": 382138, "epoch": 2274} {"train_loss": -12.121800422668457, "global_step": 382139, "epoch": 2274} {"train_loss": -12.175711631774902, "global_step": 382140, "epoch": 2274} {"train_loss": -11.4413423538208, "global_step": 382141, "epoch": 2274} {"train_loss": -11.69914436340332, "global_step": 382142, "epoch": 2274} {"train_loss": -10.996565818786621, "global_step": 382143, "epoch": 2274} {"train_loss": -12.212530136108398, "global_step": 382144, "epoch": 2274} {"train_loss": -11.44216251373291, "global_step": 382145, "epoch": 2274} {"train_loss": -12.006758689880371, "global_step": 382146, "epoch": 2274} {"train_loss": -10.817819595336914, "global_step": 382147, "epoch": 2274} {"train_loss": -11.500421524047852, "global_step": 382148, "epoch": 2274} {"train_loss": -11.538248062133789, "global_step": 382149, "epoch": 2274} {"train_loss": -10.747642517089844, "global_step": 382150, "epoch": 2274} {"train_loss": -11.294349670410156, "global_step": 382151, "epoch": 2274} {"train_loss": -10.815322875976562, "global_step": 382152, "epoch": 2274} {"train_loss": -11.407963752746582, "global_step": 382153, "epoch": 2274} {"train_loss": -11.121965408325195, "global_step": 382154, "epoch": 2274} {"train_loss": -10.750236511230469, "global_step": 382155, "epoch": 2274} {"train_loss": -11.59605884552002, "global_step": 382156, "epoch": 2274} {"train_loss": -11.582818984985352, "global_step": 382157, "epoch": 2274} {"train_loss": -11.408231735229492, "global_step": 382158, "epoch": 2274} {"train_loss": -11.368124961853027, "global_step": 382159, "epoch": 2274} {"train_loss": -11.777043342590332, "global_step": 382160, "epoch": 2274} {"train_loss": -11.938348770141602, "global_step": 382161, "epoch": 2274} {"train_loss": -11.979744911193848, "global_step": 382162, "epoch": 2274} {"train_loss": -11.723664283752441, "global_step": 382163, "epoch": 2274} {"train_loss": -11.557584762573242, "global_step": 382164, "epoch": 2274} {"train_loss": -11.885313034057617, "global_step": 382165, "epoch": 2274} {"train_loss": -11.032883644104004, "global_step": 382166, "epoch": 2274} {"train_loss": -11.660533905029297, "global_step": 382167, "epoch": 2274} {"train_loss": -11.114078521728516, "global_step": 382168, "epoch": 2274} {"train_loss": -10.543777465820312, "global_step": 382169, "epoch": 2274} {"train_loss": -12.020086288452148, "global_step": 382170, "epoch": 2274} {"train_loss": -11.125785827636719, "global_step": 382171, "epoch": 2274} {"train_loss": -11.842779159545898, "global_step": 382172, "epoch": 2274} {"train_loss": -11.123268127441406, "global_step": 382173, "epoch": 2274} {"train_loss": -11.924843788146973, "global_step": 382174, "epoch": 2274} {"train_loss": -11.345534324645996, "global_step": 382175, "epoch": 2274} {"train_loss": -11.815530776977539, "global_step": 382176, "epoch": 2274} {"train_loss": -11.633710861206055, "global_step": 382177, "epoch": 2274} {"train_loss": -12.08266830444336, "global_step": 382178, "epoch": 2274} {"train_loss": -11.580974578857422, "global_step": 382179, "epoch": 2274} {"train_loss": -12.286798477172852, "global_step": 382180, "epoch": 2274} {"train_loss": -11.662814140319824, "global_step": 382181, "epoch": 2274} {"train_loss": -12.275001525878906, "global_step": 382182, "epoch": 2274} {"train_loss": -11.83840560913086, "global_step": 382183, "epoch": 2274} {"train_loss": -12.305974960327148, "global_step": 382184, "epoch": 2274} {"train_loss": -11.475921630859375, "global_step": 382185, "epoch": 2274} {"train_loss": -12.01251220703125, "global_step": 382186, "epoch": 2274} {"train_loss": -11.467967987060547, "global_step": 382187, "epoch": 2274} {"train_loss": -11.893848419189453, "global_step": 382188, "epoch": 2274} {"train_loss": -11.533407211303711, "global_step": 382189, "epoch": 2274} {"train_loss": -12.09114933013916, "global_step": 382190, "epoch": 2274} {"train_loss": -11.597747802734375, "global_step": 382191, "epoch": 2274} {"train_loss": -12.235361099243164, "global_step": 382192, "epoch": 2274} {"train_loss": -11.572669982910156, "global_step": 382193, "epoch": 2274} {"train_loss": -12.176307678222656, "global_step": 382194, "epoch": 2274} {"train_loss": -11.628948211669922, "global_step": 382195, "epoch": 2274} {"train_loss": -12.105199813842773, "global_step": 382196, "epoch": 2274} {"train_loss": -11.49197006225586, "global_step": 382197, "epoch": 2274} {"train_loss": -12.186864852905273, "global_step": 382198, "epoch": 2274} {"train_loss": -11.961178813661848, "global_step": 382199, "epoch": 2274, "val_loss": 294562.78125} {"train_loss": -11.864374160766602, "global_step": 382200, "epoch": 2275} {"train_loss": -11.876213073730469, "global_step": 382201, "epoch": 2275} {"train_loss": -11.803539276123047, "global_step": 382202, "epoch": 2275} {"train_loss": -11.789005279541016, "global_step": 382203, "epoch": 2275} {"train_loss": -12.038301467895508, "global_step": 382204, "epoch": 2275} {"train_loss": -11.488905906677246, "global_step": 382205, "epoch": 2275} {"train_loss": -11.844831466674805, "global_step": 382206, "epoch": 2275} {"train_loss": -11.998834609985352, "global_step": 382207, "epoch": 2275} {"train_loss": -12.215020179748535, "global_step": 382208, "epoch": 2275} {"train_loss": -11.185628890991211, "global_step": 382209, "epoch": 2275} {"train_loss": -11.932963371276855, "global_step": 382210, "epoch": 2275} {"train_loss": -11.932586669921875, "global_step": 382211, "epoch": 2275} {"train_loss": -11.93804931640625, "global_step": 382212, "epoch": 2275} {"train_loss": -11.847234725952148, "global_step": 382213, "epoch": 2275} {"train_loss": -11.90799617767334, "global_step": 382214, "epoch": 2275} {"train_loss": -11.60209846496582, "global_step": 382215, "epoch": 2275} {"train_loss": -11.663471221923828, "global_step": 382216, "epoch": 2275} {"train_loss": -12.308186531066895, "global_step": 382217, "epoch": 2275} {"train_loss": -11.46981430053711, "global_step": 382218, "epoch": 2275} {"train_loss": -12.07697582244873, "global_step": 382219, "epoch": 2275} {"train_loss": -11.472373008728027, "global_step": 382220, "epoch": 2275} {"train_loss": -12.306747436523438, "global_step": 382221, "epoch": 2275} {"train_loss": -11.7316312789917, "global_step": 382222, "epoch": 2275} {"train_loss": -12.455619812011719, "global_step": 382223, "epoch": 2275} {"train_loss": -11.647954940795898, "global_step": 382224, "epoch": 2275} {"train_loss": -12.390644073486328, "global_step": 382225, "epoch": 2275} {"train_loss": -12.032475471496582, "global_step": 382226, "epoch": 2275} {"train_loss": -12.014324188232422, "global_step": 382227, "epoch": 2275} {"train_loss": -12.024877548217773, "global_step": 382228, "epoch": 2275} {"train_loss": -12.24300765991211, "global_step": 382229, "epoch": 2275} {"train_loss": -11.559579849243164, "global_step": 382230, "epoch": 2275} {"train_loss": -12.504365921020508, "global_step": 382231, "epoch": 2275} {"train_loss": -11.950614929199219, "global_step": 382232, "epoch": 2275} {"train_loss": -12.37186050415039, "global_step": 382233, "epoch": 2275} {"train_loss": -12.289510726928711, "global_step": 382234, "epoch": 2275} {"train_loss": -12.133621215820312, "global_step": 382235, "epoch": 2275} {"train_loss": -12.13741683959961, "global_step": 382236, "epoch": 2275} {"train_loss": -11.934846878051758, "global_step": 382237, "epoch": 2275} {"train_loss": -11.238542556762695, "global_step": 382238, "epoch": 2275} {"train_loss": -11.661726951599121, "global_step": 382239, "epoch": 2275} {"train_loss": -12.109612464904785, "global_step": 382240, "epoch": 2275} {"train_loss": -11.762308120727539, "global_step": 382241, "epoch": 2275} {"train_loss": -12.33602523803711, "global_step": 382242, "epoch": 2275} {"train_loss": -12.210502624511719, "global_step": 382243, "epoch": 2275} {"train_loss": -11.882952690124512, "global_step": 382244, "epoch": 2275} {"train_loss": -12.198373794555664, "global_step": 382245, "epoch": 2275} {"train_loss": -11.9996337890625, "global_step": 382246, "epoch": 2275} {"train_loss": -12.234432220458984, "global_step": 382247, "epoch": 2275} {"train_loss": -12.040596008300781, "global_step": 382248, "epoch": 2275} {"train_loss": -11.645303726196289, "global_step": 382249, "epoch": 2275} {"train_loss": -11.793497085571289, "global_step": 382250, "epoch": 2275} {"train_loss": -11.964666366577148, "global_step": 382251, "epoch": 2275} {"train_loss": -11.65151596069336, "global_step": 382252, "epoch": 2275} {"train_loss": -12.023843765258789, "global_step": 382253, "epoch": 2275} {"train_loss": -11.813624382019043, "global_step": 382254, "epoch": 2275} {"train_loss": -12.000283241271973, "global_step": 382255, "epoch": 2275} {"train_loss": -12.529200553894043, "global_step": 382256, "epoch": 2275} {"train_loss": -11.919160842895508, "global_step": 382257, "epoch": 2275} {"train_loss": -12.438074111938477, "global_step": 382258, "epoch": 2275} {"train_loss": -11.814111709594727, "global_step": 382259, "epoch": 2275} {"train_loss": -12.205851554870605, "global_step": 382260, "epoch": 2275} {"train_loss": -12.431937217712402, "global_step": 382261, "epoch": 2275} {"train_loss": -12.266081809997559, "global_step": 382262, "epoch": 2275} {"train_loss": -12.079858779907227, "global_step": 382263, "epoch": 2275} {"train_loss": -12.532337188720703, "global_step": 382264, "epoch": 2275} {"train_loss": -12.162433624267578, "global_step": 382265, "epoch": 2275} {"train_loss": -12.385748863220215, "global_step": 382266, "epoch": 2275} {"train_loss": -12.312381744384766, "global_step": 382267, "epoch": 2275} {"train_loss": -12.376192092895508, "global_step": 382268, "epoch": 2275} {"train_loss": -12.321479797363281, "global_step": 382269, "epoch": 2275} {"train_loss": -12.358076095581055, "global_step": 382270, "epoch": 2275} {"train_loss": -12.359565734863281, "global_step": 382271, "epoch": 2275} {"train_loss": -12.34831714630127, "global_step": 382272, "epoch": 2275} {"train_loss": -12.259000778198242, "global_step": 382273, "epoch": 2275} {"train_loss": -12.460172653198242, "global_step": 382274, "epoch": 2275} {"train_loss": -12.654870986938477, "global_step": 382275, "epoch": 2275} {"train_loss": -12.227691650390625, "global_step": 382276, "epoch": 2275} {"train_loss": -12.57872486114502, "global_step": 382277, "epoch": 2275} {"train_loss": -12.476329803466797, "global_step": 382278, "epoch": 2275} {"train_loss": -12.621312141418457, "global_step": 382279, "epoch": 2275} {"train_loss": -12.635721206665039, "global_step": 382280, "epoch": 2275} {"train_loss": -12.560304641723633, "global_step": 382281, "epoch": 2275} {"train_loss": -12.424495697021484, "global_step": 382282, "epoch": 2275} {"train_loss": -12.597957611083984, "global_step": 382283, "epoch": 2275} {"train_loss": -12.552722930908203, "global_step": 382284, "epoch": 2275} {"train_loss": -12.630489349365234, "global_step": 382285, "epoch": 2275} {"train_loss": -12.374470710754395, "global_step": 382286, "epoch": 2275} {"train_loss": -12.618730545043945, "global_step": 382287, "epoch": 2275} {"train_loss": -12.668853759765625, "global_step": 382288, "epoch": 2275} {"train_loss": -12.779153823852539, "global_step": 382289, "epoch": 2275} {"train_loss": -12.667938232421875, "global_step": 382290, "epoch": 2275} {"train_loss": -12.28236198425293, "global_step": 382291, "epoch": 2275} {"train_loss": -12.300161361694336, "global_step": 382292, "epoch": 2275} {"train_loss": -12.498940467834473, "global_step": 382293, "epoch": 2275} {"train_loss": -12.604649543762207, "global_step": 382294, "epoch": 2275} {"train_loss": -12.385831832885742, "global_step": 382295, "epoch": 2275} {"train_loss": -11.9932861328125, "global_step": 382296, "epoch": 2275} {"train_loss": -12.387126922607422, "global_step": 382297, "epoch": 2275} {"train_loss": -12.275525093078613, "global_step": 382298, "epoch": 2275} {"train_loss": -11.826730728149414, "global_step": 382299, "epoch": 2275} {"train_loss": -12.46005630493164, "global_step": 382300, "epoch": 2275} {"train_loss": -12.179962158203125, "global_step": 382301, "epoch": 2275} {"train_loss": -12.660937309265137, "global_step": 382302, "epoch": 2275} {"train_loss": -11.989426612854004, "global_step": 382303, "epoch": 2275} {"train_loss": -12.422812461853027, "global_step": 382304, "epoch": 2275} {"train_loss": -11.806844711303711, "global_step": 382305, "epoch": 2275} {"train_loss": -11.662163734436035, "global_step": 382306, "epoch": 2275} {"train_loss": -12.290878295898438, "global_step": 382307, "epoch": 2275} {"train_loss": -12.020034790039062, "global_step": 382308, "epoch": 2275} {"train_loss": -11.844131469726562, "global_step": 382309, "epoch": 2275} {"train_loss": -11.408703804016113, "global_step": 382310, "epoch": 2275} {"train_loss": -11.404958724975586, "global_step": 382311, "epoch": 2275} {"train_loss": -11.855489730834961, "global_step": 382312, "epoch": 2275} {"train_loss": -10.570328712463379, "global_step": 382313, "epoch": 2275} {"train_loss": -10.322467803955078, "global_step": 382314, "epoch": 2275} {"train_loss": -10.825359344482422, "global_step": 382315, "epoch": 2275} {"train_loss": -11.310606002807617, "global_step": 382316, "epoch": 2275} {"train_loss": -11.507535934448242, "global_step": 382317, "epoch": 2275} {"train_loss": -11.695772171020508, "global_step": 382318, "epoch": 2275} {"train_loss": -11.346025466918945, "global_step": 382319, "epoch": 2275} {"train_loss": -11.6537446975708, "global_step": 382320, "epoch": 2275} {"train_loss": -11.470788955688477, "global_step": 382321, "epoch": 2275} {"train_loss": -12.022527694702148, "global_step": 382322, "epoch": 2275} {"train_loss": -12.043192863464355, "global_step": 382323, "epoch": 2275} {"train_loss": -11.110754013061523, "global_step": 382324, "epoch": 2275} {"train_loss": -12.30984878540039, "global_step": 382325, "epoch": 2275} {"train_loss": -11.927114486694336, "global_step": 382326, "epoch": 2275} {"train_loss": -11.360552787780762, "global_step": 382327, "epoch": 2275} {"train_loss": -12.208003044128418, "global_step": 382328, "epoch": 2275} {"train_loss": -11.552902221679688, "global_step": 382329, "epoch": 2275} {"train_loss": -11.576652526855469, "global_step": 382330, "epoch": 2275} {"train_loss": -12.311136245727539, "global_step": 382331, "epoch": 2275} {"train_loss": -12.138702392578125, "global_step": 382332, "epoch": 2275} {"train_loss": -11.309157371520996, "global_step": 382333, "epoch": 2275} {"train_loss": -12.220600128173828, "global_step": 382334, "epoch": 2275} {"train_loss": -12.033321380615234, "global_step": 382335, "epoch": 2275} {"train_loss": -12.150537490844727, "global_step": 382336, "epoch": 2275} {"train_loss": -12.245071411132812, "global_step": 382337, "epoch": 2275} {"train_loss": -12.55770492553711, "global_step": 382338, "epoch": 2275} {"train_loss": -12.457908630371094, "global_step": 382339, "epoch": 2275} {"train_loss": -12.309919357299805, "global_step": 382340, "epoch": 2275} {"train_loss": -12.346366882324219, "global_step": 382341, "epoch": 2275} {"train_loss": -12.245019912719727, "global_step": 382342, "epoch": 2275} {"train_loss": -12.428815841674805, "global_step": 382343, "epoch": 2275} {"train_loss": -12.152217864990234, "global_step": 382344, "epoch": 2275} {"train_loss": -12.535069465637207, "global_step": 382345, "epoch": 2275} {"train_loss": -12.19439697265625, "global_step": 382346, "epoch": 2275} {"train_loss": -12.457944869995117, "global_step": 382347, "epoch": 2275} {"train_loss": -12.176485061645508, "global_step": 382348, "epoch": 2275} {"train_loss": -12.254508972167969, "global_step": 382349, "epoch": 2275} {"train_loss": -12.069546699523926, "global_step": 382350, "epoch": 2275} {"train_loss": -12.376405715942383, "global_step": 382351, "epoch": 2275} {"train_loss": -11.314434051513672, "global_step": 382352, "epoch": 2275} {"train_loss": -12.295421600341797, "global_step": 382353, "epoch": 2275} {"train_loss": -11.660711288452148, "global_step": 382354, "epoch": 2275} {"train_loss": -11.400947570800781, "global_step": 382355, "epoch": 2275} {"train_loss": -11.145851135253906, "global_step": 382356, "epoch": 2275} {"train_loss": -11.497207641601562, "global_step": 382357, "epoch": 2275} {"train_loss": -9.724149703979492, "global_step": 382358, "epoch": 2275} {"train_loss": -11.746009826660156, "global_step": 382359, "epoch": 2275} {"train_loss": -10.221362113952637, "global_step": 382360, "epoch": 2275} {"train_loss": -11.462631225585938, "global_step": 382361, "epoch": 2275} {"train_loss": -11.151756286621094, "global_step": 382362, "epoch": 2275} {"train_loss": -10.022916793823242, "global_step": 382363, "epoch": 2275} {"train_loss": -10.664073944091797, "global_step": 382364, "epoch": 2275} {"train_loss": -11.000452995300293, "global_step": 382365, "epoch": 2275} {"train_loss": -11.735016822814941, "global_step": 382366, "epoch": 2275} {"train_loss": -11.972163189025153, "global_step": 382367, "epoch": 2275, "val_loss": 294414.6875, "train_action_mse_error": 1.6034116744995117} {"train_loss": -11.988005638122559, "global_step": 382368, "epoch": 2276} {"train_loss": -10.578787803649902, "global_step": 382369, "epoch": 2276} {"train_loss": -12.173133850097656, "global_step": 382370, "epoch": 2276} {"train_loss": -11.131267547607422, "global_step": 382371, "epoch": 2276} {"train_loss": -11.480981826782227, "global_step": 382372, "epoch": 2276} {"train_loss": -11.962353706359863, "global_step": 382373, "epoch": 2276} {"train_loss": -11.279645919799805, "global_step": 382374, "epoch": 2276} {"train_loss": -12.391511917114258, "global_step": 382375, "epoch": 2276} {"train_loss": -11.259315490722656, "global_step": 382376, "epoch": 2276} {"train_loss": -12.180023193359375, "global_step": 382377, "epoch": 2276} {"train_loss": -10.948780059814453, "global_step": 382378, "epoch": 2276} {"train_loss": -11.905449867248535, "global_step": 382379, "epoch": 2276} {"train_loss": -11.130780220031738, "global_step": 382380, "epoch": 2276} {"train_loss": -12.11668586730957, "global_step": 382381, "epoch": 2276} {"train_loss": -11.307498931884766, "global_step": 382382, "epoch": 2276} {"train_loss": -11.741212844848633, "global_step": 382383, "epoch": 2276} {"train_loss": -11.88467025756836, "global_step": 382384, "epoch": 2276} {"train_loss": -11.755546569824219, "global_step": 382385, "epoch": 2276} {"train_loss": -11.890527725219727, "global_step": 382386, "epoch": 2276} {"train_loss": -11.980728149414062, "global_step": 382387, "epoch": 2276} {"train_loss": -12.015190124511719, "global_step": 382388, "epoch": 2276} {"train_loss": -11.732315063476562, "global_step": 382389, "epoch": 2276} {"train_loss": -12.0238037109375, "global_step": 382390, "epoch": 2276} {"train_loss": -11.972352027893066, "global_step": 382391, "epoch": 2276} {"train_loss": -11.232988357543945, "global_step": 382392, "epoch": 2276} {"train_loss": -12.168529510498047, "global_step": 382393, "epoch": 2276} {"train_loss": -11.621600151062012, "global_step": 382394, "epoch": 2276} {"train_loss": -11.882108688354492, "global_step": 382395, "epoch": 2276} {"train_loss": -12.215872764587402, "global_step": 382396, "epoch": 2276} {"train_loss": -11.83848762512207, "global_step": 382397, "epoch": 2276} {"train_loss": -12.42922592163086, "global_step": 382398, "epoch": 2276} {"train_loss": -11.775583267211914, "global_step": 382399, "epoch": 2276} {"train_loss": -11.977108001708984, "global_step": 382400, "epoch": 2276} {"train_loss": -12.100362777709961, "global_step": 382401, "epoch": 2276} {"train_loss": -11.34637451171875, "global_step": 382402, "epoch": 2276} {"train_loss": -11.979082107543945, "global_step": 382403, "epoch": 2276} {"train_loss": -11.350765228271484, "global_step": 382404, "epoch": 2276} {"train_loss": -12.281630516052246, "global_step": 382405, "epoch": 2276} {"train_loss": -12.115071296691895, "global_step": 382406, "epoch": 2276} {"train_loss": -12.09495735168457, "global_step": 382407, "epoch": 2276} {"train_loss": -12.173412322998047, "global_step": 382408, "epoch": 2276} {"train_loss": -12.34823226928711, "global_step": 382409, "epoch": 2276} {"train_loss": -12.09792423248291, "global_step": 382410, "epoch": 2276} {"train_loss": -12.475824356079102, "global_step": 382411, "epoch": 2276} {"train_loss": -12.257923126220703, "global_step": 382412, "epoch": 2276} {"train_loss": -12.384971618652344, "global_step": 382413, "epoch": 2276} {"train_loss": -12.397536277770996, "global_step": 382414, "epoch": 2276} {"train_loss": -12.283327102661133, "global_step": 382415, "epoch": 2276} {"train_loss": -12.467493057250977, "global_step": 382416, "epoch": 2276} {"train_loss": -12.378782272338867, "global_step": 382417, "epoch": 2276} {"train_loss": -12.532441139221191, "global_step": 382418, "epoch": 2276} {"train_loss": -12.55647087097168, "global_step": 382419, "epoch": 2276} {"train_loss": -12.406890869140625, "global_step": 382420, "epoch": 2276} {"train_loss": -12.273138046264648, "global_step": 382421, "epoch": 2276} {"train_loss": -12.414885520935059, "global_step": 382422, "epoch": 2276} {"train_loss": -12.521066665649414, "global_step": 382423, "epoch": 2276} {"train_loss": -12.559026718139648, "global_step": 382424, "epoch": 2276} {"train_loss": -12.528812408447266, "global_step": 382425, "epoch": 2276} {"train_loss": -12.653501510620117, "global_step": 382426, "epoch": 2276} {"train_loss": -12.512046813964844, "global_step": 382427, "epoch": 2276} {"train_loss": -12.508810997009277, "global_step": 382428, "epoch": 2276} {"train_loss": -12.674873352050781, "global_step": 382429, "epoch": 2276} {"train_loss": -12.408727645874023, "global_step": 382430, "epoch": 2276} {"train_loss": -12.5040922164917, "global_step": 382431, "epoch": 2276} {"train_loss": -12.454923629760742, "global_step": 382432, "epoch": 2276} {"train_loss": -12.403566360473633, "global_step": 382433, "epoch": 2276} {"train_loss": -12.66629409790039, "global_step": 382434, "epoch": 2276} {"train_loss": -12.534286499023438, "global_step": 382435, "epoch": 2276} {"train_loss": -12.675440788269043, "global_step": 382436, "epoch": 2276} {"train_loss": -12.76754379272461, "global_step": 382437, "epoch": 2276} {"train_loss": -12.54969596862793, "global_step": 382438, "epoch": 2276} {"train_loss": -12.669865608215332, "global_step": 382439, "epoch": 2276} {"train_loss": -12.774300575256348, "global_step": 382440, "epoch": 2276} {"train_loss": -12.811210632324219, "global_step": 382441, "epoch": 2276} {"train_loss": -12.685600280761719, "global_step": 382442, "epoch": 2276} {"train_loss": -12.38167953491211, "global_step": 382443, "epoch": 2276} {"train_loss": -12.864173889160156, "global_step": 382444, "epoch": 2276} {"train_loss": -12.621956825256348, "global_step": 382445, "epoch": 2276} {"train_loss": -12.651826858520508, "global_step": 382446, "epoch": 2276} {"train_loss": -12.750570297241211, "global_step": 382447, "epoch": 2276} {"train_loss": -12.526052474975586, "global_step": 382448, "epoch": 2276} {"train_loss": -12.657625198364258, "global_step": 382449, "epoch": 2276} {"train_loss": -12.506803512573242, "global_step": 382450, "epoch": 2276} {"train_loss": -12.360442161560059, "global_step": 382451, "epoch": 2276} {"train_loss": -12.32708740234375, "global_step": 382452, "epoch": 2276} {"train_loss": -12.577940940856934, "global_step": 382453, "epoch": 2276} {"train_loss": -12.570650100708008, "global_step": 382454, "epoch": 2276} {"train_loss": -12.574409484863281, "global_step": 382455, "epoch": 2276} {"train_loss": -12.446556091308594, "global_step": 382456, "epoch": 2276} {"train_loss": -11.823575973510742, "global_step": 382457, "epoch": 2276} {"train_loss": -12.594396591186523, "global_step": 382458, "epoch": 2276} {"train_loss": -12.508731842041016, "global_step": 382459, "epoch": 2276} {"train_loss": -12.52755355834961, "global_step": 382460, "epoch": 2276} {"train_loss": -12.536466598510742, "global_step": 382461, "epoch": 2276} {"train_loss": -12.63222885131836, "global_step": 382462, "epoch": 2276} {"train_loss": -12.560369491577148, "global_step": 382463, "epoch": 2276} {"train_loss": -12.830751419067383, "global_step": 382464, "epoch": 2276} {"train_loss": -12.725603103637695, "global_step": 382465, "epoch": 2276} {"train_loss": -12.857514381408691, "global_step": 382466, "epoch": 2276} {"train_loss": -12.671680450439453, "global_step": 382467, "epoch": 2276} {"train_loss": -12.665287017822266, "global_step": 382468, "epoch": 2276} {"train_loss": -12.481889724731445, "global_step": 382469, "epoch": 2276} {"train_loss": -12.677949905395508, "global_step": 382470, "epoch": 2276} {"train_loss": -12.751890182495117, "global_step": 382471, "epoch": 2276} {"train_loss": -12.674703598022461, "global_step": 382472, "epoch": 2276} {"train_loss": -12.478769302368164, "global_step": 382473, "epoch": 2276} {"train_loss": -12.862826347351074, "global_step": 382474, "epoch": 2276} {"train_loss": -12.260068893432617, "global_step": 382475, "epoch": 2276} {"train_loss": -11.938470840454102, "global_step": 382476, "epoch": 2276} {"train_loss": -11.24513053894043, "global_step": 382477, "epoch": 2276} {"train_loss": -11.641559600830078, "global_step": 382478, "epoch": 2276} {"train_loss": -11.741703987121582, "global_step": 382479, "epoch": 2276} {"train_loss": -11.189297676086426, "global_step": 382480, "epoch": 2276} {"train_loss": -10.404515266418457, "global_step": 382481, "epoch": 2276} {"train_loss": -11.60906982421875, "global_step": 382482, "epoch": 2276} {"train_loss": -12.307607650756836, "global_step": 382483, "epoch": 2276} {"train_loss": -10.630041122436523, "global_step": 382484, "epoch": 2276} {"train_loss": -11.275409698486328, "global_step": 382485, "epoch": 2276} {"train_loss": -10.398069381713867, "global_step": 382486, "epoch": 2276} {"train_loss": -10.434274673461914, "global_step": 382487, "epoch": 2276} {"train_loss": -10.596416473388672, "global_step": 382488, "epoch": 2276} {"train_loss": -10.234529495239258, "global_step": 382489, "epoch": 2276} {"train_loss": -8.254060745239258, "global_step": 382490, "epoch": 2276} {"train_loss": -8.582979202270508, "global_step": 382491, "epoch": 2276} {"train_loss": -10.055298805236816, "global_step": 382492, "epoch": 2276} {"train_loss": -9.873907089233398, "global_step": 382493, "epoch": 2276} {"train_loss": -10.214582443237305, "global_step": 382494, "epoch": 2276} {"train_loss": -9.737909317016602, "global_step": 382495, "epoch": 2276} {"train_loss": -10.703400611877441, "global_step": 382496, "epoch": 2276} {"train_loss": -10.210943222045898, "global_step": 382497, "epoch": 2276} {"train_loss": -10.488517761230469, "global_step": 382498, "epoch": 2276} {"train_loss": -10.090320587158203, "global_step": 382499, "epoch": 2276} {"train_loss": -9.685436248779297, "global_step": 382500, "epoch": 2276} {"train_loss": -9.586225509643555, "global_step": 382501, "epoch": 2276} {"train_loss": -10.161479949951172, "global_step": 382502, "epoch": 2276} {"train_loss": -10.695854187011719, "global_step": 382503, "epoch": 2276} {"train_loss": -11.087156295776367, "global_step": 382504, "epoch": 2276} {"train_loss": -10.263522148132324, "global_step": 382505, "epoch": 2276} {"train_loss": -10.859672546386719, "global_step": 382506, "epoch": 2276} {"train_loss": -10.914445877075195, "global_step": 382507, "epoch": 2276} {"train_loss": -10.495765686035156, "global_step": 382508, "epoch": 2276} {"train_loss": -10.746000289916992, "global_step": 382509, "epoch": 2276} {"train_loss": -11.206416130065918, "global_step": 382510, "epoch": 2276} {"train_loss": -10.338651657104492, "global_step": 382511, "epoch": 2276} {"train_loss": -11.466938972473145, "global_step": 382512, "epoch": 2276} {"train_loss": -10.803129196166992, "global_step": 382513, "epoch": 2276} {"train_loss": -11.364818572998047, "global_step": 382514, "epoch": 2276} {"train_loss": -10.274162292480469, "global_step": 382515, "epoch": 2276} {"train_loss": -11.137584686279297, "global_step": 382516, "epoch": 2276} {"train_loss": -11.528739929199219, "global_step": 382517, "epoch": 2276} {"train_loss": -11.057069778442383, "global_step": 382518, "epoch": 2276} {"train_loss": -11.176365852355957, "global_step": 382519, "epoch": 2276} {"train_loss": -12.047819137573242, "global_step": 382520, "epoch": 2276} {"train_loss": -11.303184509277344, "global_step": 382521, "epoch": 2276} {"train_loss": -11.769851684570312, "global_step": 382522, "epoch": 2276} {"train_loss": -11.80221176147461, "global_step": 382523, "epoch": 2276} {"train_loss": -11.458738327026367, "global_step": 382524, "epoch": 2276} {"train_loss": -11.812891006469727, "global_step": 382525, "epoch": 2276} {"train_loss": -11.735525131225586, "global_step": 382526, "epoch": 2276} {"train_loss": -11.54858112335205, "global_step": 382527, "epoch": 2276} {"train_loss": -11.769258499145508, "global_step": 382528, "epoch": 2276} {"train_loss": -11.850889205932617, "global_step": 382529, "epoch": 2276} {"train_loss": -11.742023468017578, "global_step": 382530, "epoch": 2276} {"train_loss": -11.968931198120117, "global_step": 382531, "epoch": 2276} {"train_loss": -10.924835205078125, "global_step": 382532, "epoch": 2276} {"train_loss": -12.062005996704102, "global_step": 382533, "epoch": 2276} {"train_loss": -11.320795059204102, "global_step": 382534, "epoch": 2276} {"train_loss": -11.782361013548714, "global_step": 382535, "epoch": 2276, "val_loss": 289389.09375} {"train_loss": -11.778346061706543, "global_step": 382536, "epoch": 2277} {"train_loss": -12.016883850097656, "global_step": 382537, "epoch": 2277} {"train_loss": -11.545944213867188, "global_step": 382538, "epoch": 2277} {"train_loss": -12.007099151611328, "global_step": 382539, "epoch": 2277} {"train_loss": -11.926758766174316, "global_step": 382540, "epoch": 2277} {"train_loss": -11.811433792114258, "global_step": 382541, "epoch": 2277} {"train_loss": -11.908668518066406, "global_step": 382542, "epoch": 2277} {"train_loss": -11.709739685058594, "global_step": 382543, "epoch": 2277} {"train_loss": -12.251579284667969, "global_step": 382544, "epoch": 2277} {"train_loss": -11.959579467773438, "global_step": 382545, "epoch": 2277} {"train_loss": -12.218385696411133, "global_step": 382546, "epoch": 2277} {"train_loss": -12.086119651794434, "global_step": 382547, "epoch": 2277} {"train_loss": -11.894783973693848, "global_step": 382548, "epoch": 2277} {"train_loss": -12.221257209777832, "global_step": 382549, "epoch": 2277} {"train_loss": -12.272512435913086, "global_step": 382550, "epoch": 2277} {"train_loss": -12.190139770507812, "global_step": 382551, "epoch": 2277} {"train_loss": -12.263664245605469, "global_step": 382552, "epoch": 2277} {"train_loss": -12.126693725585938, "global_step": 382553, "epoch": 2277} {"train_loss": -12.39514446258545, "global_step": 382554, "epoch": 2277} {"train_loss": -12.356045722961426, "global_step": 382555, "epoch": 2277} {"train_loss": -12.53574275970459, "global_step": 382556, "epoch": 2277} {"train_loss": -12.361334800720215, "global_step": 382557, "epoch": 2277} {"train_loss": -12.404067993164062, "global_step": 382558, "epoch": 2277} {"train_loss": -12.40805435180664, "global_step": 382559, "epoch": 2277} {"train_loss": -12.27165412902832, "global_step": 382560, "epoch": 2277} {"train_loss": -12.450955390930176, "global_step": 382561, "epoch": 2277} {"train_loss": -12.453205108642578, "global_step": 382562, "epoch": 2277} {"train_loss": -12.426986694335938, "global_step": 382563, "epoch": 2277} {"train_loss": -12.50490951538086, "global_step": 382564, "epoch": 2277} {"train_loss": -12.491519927978516, "global_step": 382565, "epoch": 2277} {"train_loss": -12.408085823059082, "global_step": 382566, "epoch": 2277} {"train_loss": -12.265907287597656, "global_step": 382567, "epoch": 2277} {"train_loss": -12.507527351379395, "global_step": 382568, "epoch": 2277} {"train_loss": -12.516758918762207, "global_step": 382569, "epoch": 2277} {"train_loss": -12.630586624145508, "global_step": 382570, "epoch": 2277} {"train_loss": -12.543082237243652, "global_step": 382571, "epoch": 2277} {"train_loss": -12.320789337158203, "global_step": 382572, "epoch": 2277} {"train_loss": -12.427921295166016, "global_step": 382573, "epoch": 2277} {"train_loss": -12.632328033447266, "global_step": 382574, "epoch": 2277} {"train_loss": -12.605409622192383, "global_step": 382575, "epoch": 2277} {"train_loss": -12.482725143432617, "global_step": 382576, "epoch": 2277} {"train_loss": -12.646676063537598, "global_step": 382577, "epoch": 2277} {"train_loss": -12.569944381713867, "global_step": 382578, "epoch": 2277} {"train_loss": -12.584556579589844, "global_step": 382579, "epoch": 2277} {"train_loss": -12.537946701049805, "global_step": 382580, "epoch": 2277} {"train_loss": -12.543012619018555, "global_step": 382581, "epoch": 2277} {"train_loss": -12.525035858154297, "global_step": 382582, "epoch": 2277} {"train_loss": -12.594963073730469, "global_step": 382583, "epoch": 2277} {"train_loss": -12.698406219482422, "global_step": 382584, "epoch": 2277} {"train_loss": -12.590521812438965, "global_step": 382585, "epoch": 2277} {"train_loss": -12.736705780029297, "global_step": 382586, "epoch": 2277} {"train_loss": -12.688064575195312, "global_step": 382587, "epoch": 2277} {"train_loss": -12.537439346313477, "global_step": 382588, "epoch": 2277} {"train_loss": -12.607633590698242, "global_step": 382589, "epoch": 2277} {"train_loss": -12.566719055175781, "global_step": 382590, "epoch": 2277} {"train_loss": -12.815320014953613, "global_step": 382591, "epoch": 2277} {"train_loss": -12.47992992401123, "global_step": 382592, "epoch": 2277} {"train_loss": -12.602907180786133, "global_step": 382593, "epoch": 2277} {"train_loss": -12.809406280517578, "global_step": 382594, "epoch": 2277} {"train_loss": -12.648615837097168, "global_step": 382595, "epoch": 2277} {"train_loss": -12.733208656311035, "global_step": 382596, "epoch": 2277} {"train_loss": -12.568575859069824, "global_step": 382597, "epoch": 2277} {"train_loss": -12.701231956481934, "global_step": 382598, "epoch": 2277} {"train_loss": -12.80827808380127, "global_step": 382599, "epoch": 2277} {"train_loss": -12.827055931091309, "global_step": 382600, "epoch": 2277} {"train_loss": -12.615107536315918, "global_step": 382601, "epoch": 2277} {"train_loss": -12.470939636230469, "global_step": 382602, "epoch": 2277} {"train_loss": -12.705940246582031, "global_step": 382603, "epoch": 2277} {"train_loss": -12.859734535217285, "global_step": 382604, "epoch": 2277} {"train_loss": -12.549654006958008, "global_step": 382605, "epoch": 2277} {"train_loss": -12.824647903442383, "global_step": 382606, "epoch": 2277} {"train_loss": -12.786155700683594, "global_step": 382607, "epoch": 2277} {"train_loss": -12.755261421203613, "global_step": 382608, "epoch": 2277} {"train_loss": -12.112536430358887, "global_step": 382609, "epoch": 2277} {"train_loss": -12.414538383483887, "global_step": 382610, "epoch": 2277} {"train_loss": -12.250089645385742, "global_step": 382611, "epoch": 2277} {"train_loss": -11.942658424377441, "global_step": 382612, "epoch": 2277} {"train_loss": -11.821174621582031, "global_step": 382613, "epoch": 2277} {"train_loss": -11.297689437866211, "global_step": 382614, "epoch": 2277} {"train_loss": -11.913490295410156, "global_step": 382615, "epoch": 2277} {"train_loss": -12.016727447509766, "global_step": 382616, "epoch": 2277} {"train_loss": -12.235884666442871, "global_step": 382617, "epoch": 2277} {"train_loss": -11.954702377319336, "global_step": 382618, "epoch": 2277} {"train_loss": -10.78354549407959, "global_step": 382619, "epoch": 2277} {"train_loss": -9.99040412902832, "global_step": 382620, "epoch": 2277} {"train_loss": -11.432316780090332, "global_step": 382621, "epoch": 2277} {"train_loss": -11.116890907287598, "global_step": 382622, "epoch": 2277} {"train_loss": -11.538444519042969, "global_step": 382623, "epoch": 2277} {"train_loss": -12.09450912475586, "global_step": 382624, "epoch": 2277} {"train_loss": -10.545707702636719, "global_step": 382625, "epoch": 2277} {"train_loss": -11.133550643920898, "global_step": 382626, "epoch": 2277} {"train_loss": -11.919055938720703, "global_step": 382627, "epoch": 2277} {"train_loss": -11.651021957397461, "global_step": 382628, "epoch": 2277} {"train_loss": -12.193304061889648, "global_step": 382629, "epoch": 2277} {"train_loss": -12.272420883178711, "global_step": 382630, "epoch": 2277} {"train_loss": -11.533620834350586, "global_step": 382631, "epoch": 2277} {"train_loss": -11.788900375366211, "global_step": 382632, "epoch": 2277} {"train_loss": -11.955865859985352, "global_step": 382633, "epoch": 2277} {"train_loss": -10.699516296386719, "global_step": 382634, "epoch": 2277} {"train_loss": -10.684701919555664, "global_step": 382635, "epoch": 2277} {"train_loss": -12.392001152038574, "global_step": 382636, "epoch": 2277} {"train_loss": -10.99218463897705, "global_step": 382637, "epoch": 2277} {"train_loss": -11.652870178222656, "global_step": 382638, "epoch": 2277} {"train_loss": -12.487353324890137, "global_step": 382639, "epoch": 2277} {"train_loss": -12.110174179077148, "global_step": 382640, "epoch": 2277} {"train_loss": -11.876747131347656, "global_step": 382641, "epoch": 2277} {"train_loss": -12.213188171386719, "global_step": 382642, "epoch": 2277} {"train_loss": -11.460525512695312, "global_step": 382643, "epoch": 2277} {"train_loss": -12.20798397064209, "global_step": 382644, "epoch": 2277} {"train_loss": -11.150960922241211, "global_step": 382645, "epoch": 2277} {"train_loss": -11.56126880645752, "global_step": 382646, "epoch": 2277} {"train_loss": -12.127806663513184, "global_step": 382647, "epoch": 2277} {"train_loss": -11.700101852416992, "global_step": 382648, "epoch": 2277} {"train_loss": -11.76272201538086, "global_step": 382649, "epoch": 2277} {"train_loss": -11.963138580322266, "global_step": 382650, "epoch": 2277} {"train_loss": -11.684808731079102, "global_step": 382651, "epoch": 2277} {"train_loss": -12.531807899475098, "global_step": 382652, "epoch": 2277} {"train_loss": -11.9064302444458, "global_step": 382653, "epoch": 2277} {"train_loss": -12.117036819458008, "global_step": 382654, "epoch": 2277} {"train_loss": -12.414772033691406, "global_step": 382655, "epoch": 2277} {"train_loss": -12.357843399047852, "global_step": 382656, "epoch": 2277} {"train_loss": -12.190420150756836, "global_step": 382657, "epoch": 2277} {"train_loss": -12.333107948303223, "global_step": 382658, "epoch": 2277} {"train_loss": -12.282485008239746, "global_step": 382659, "epoch": 2277} {"train_loss": -12.12535572052002, "global_step": 382660, "epoch": 2277} {"train_loss": -12.097419738769531, "global_step": 382661, "epoch": 2277} {"train_loss": -12.269283294677734, "global_step": 382662, "epoch": 2277} {"train_loss": -12.153106689453125, "global_step": 382663, "epoch": 2277} {"train_loss": -12.006767272949219, "global_step": 382664, "epoch": 2277} {"train_loss": -12.276145935058594, "global_step": 382665, "epoch": 2277} {"train_loss": -12.268415451049805, "global_step": 382666, "epoch": 2277} {"train_loss": -11.762572288513184, "global_step": 382667, "epoch": 2277} {"train_loss": -12.201904296875, "global_step": 382668, "epoch": 2277} {"train_loss": -12.501389503479004, "global_step": 382669, "epoch": 2277} {"train_loss": -12.014413833618164, "global_step": 382670, "epoch": 2277} {"train_loss": -11.705595016479492, "global_step": 382671, "epoch": 2277} {"train_loss": -12.238548278808594, "global_step": 382672, "epoch": 2277} {"train_loss": -11.964048385620117, "global_step": 382673, "epoch": 2277} {"train_loss": -12.344722747802734, "global_step": 382674, "epoch": 2277} {"train_loss": -12.149198532104492, "global_step": 382675, "epoch": 2277} {"train_loss": -11.886516571044922, "global_step": 382676, "epoch": 2277} {"train_loss": -11.757792472839355, "global_step": 382677, "epoch": 2277} {"train_loss": -12.089266777038574, "global_step": 382678, "epoch": 2277} {"train_loss": -11.126725196838379, "global_step": 382679, "epoch": 2277} {"train_loss": -12.245981216430664, "global_step": 382680, "epoch": 2277} {"train_loss": -11.96221923828125, "global_step": 382681, "epoch": 2277} {"train_loss": -11.615278244018555, "global_step": 382682, "epoch": 2277} {"train_loss": -12.355674743652344, "global_step": 382683, "epoch": 2277} {"train_loss": -11.861257553100586, "global_step": 382684, "epoch": 2277} {"train_loss": -12.149559020996094, "global_step": 382685, "epoch": 2277} {"train_loss": -11.776126861572266, "global_step": 382686, "epoch": 2277} {"train_loss": -10.94189453125, "global_step": 382687, "epoch": 2277} {"train_loss": -12.514795303344727, "global_step": 382688, "epoch": 2277} {"train_loss": -11.266153335571289, "global_step": 382689, "epoch": 2277} {"train_loss": -12.145393371582031, "global_step": 382690, "epoch": 2277} {"train_loss": -11.139169692993164, "global_step": 382691, "epoch": 2277} {"train_loss": -12.176431655883789, "global_step": 382692, "epoch": 2277} {"train_loss": -11.232503890991211, "global_step": 382693, "epoch": 2277} {"train_loss": -11.957721710205078, "global_step": 382694, "epoch": 2277} {"train_loss": -10.38119125366211, "global_step": 382695, "epoch": 2277} {"train_loss": -11.786262512207031, "global_step": 382696, "epoch": 2277} {"train_loss": -10.197620391845703, "global_step": 382697, "epoch": 2277} {"train_loss": -9.558759689331055, "global_step": 382698, "epoch": 2277} {"train_loss": -11.863849639892578, "global_step": 382699, "epoch": 2277} {"train_loss": -10.353752136230469, "global_step": 382700, "epoch": 2277} {"train_loss": -11.365701675415039, "global_step": 382701, "epoch": 2277} {"train_loss": -10.532378196716309, "global_step": 382702, "epoch": 2277} {"train_loss": -12.044001619021097, "global_step": 382703, "epoch": 2277, "val_loss": 290867.625} {"train_loss": -11.124580383300781, "global_step": 382704, "epoch": 2278} {"train_loss": -11.037191390991211, "global_step": 382705, "epoch": 2278} {"train_loss": -11.146103858947754, "global_step": 382706, "epoch": 2278} {"train_loss": -10.58570671081543, "global_step": 382707, "epoch": 2278} {"train_loss": -10.258398056030273, "global_step": 382708, "epoch": 2278} {"train_loss": -11.708454132080078, "global_step": 382709, "epoch": 2278} {"train_loss": -10.234928131103516, "global_step": 382710, "epoch": 2278} {"train_loss": -11.616744041442871, "global_step": 382711, "epoch": 2278} {"train_loss": -10.338308334350586, "global_step": 382712, "epoch": 2278} {"train_loss": -12.101192474365234, "global_step": 382713, "epoch": 2278} {"train_loss": -11.14054012298584, "global_step": 382714, "epoch": 2278} {"train_loss": -11.888776779174805, "global_step": 382715, "epoch": 2278} {"train_loss": -11.331947326660156, "global_step": 382716, "epoch": 2278} {"train_loss": -11.934476852416992, "global_step": 382717, "epoch": 2278} {"train_loss": -11.655052185058594, "global_step": 382718, "epoch": 2278} {"train_loss": -12.132315635681152, "global_step": 382719, "epoch": 2278} {"train_loss": -12.031353950500488, "global_step": 382720, "epoch": 2278} {"train_loss": -12.115039825439453, "global_step": 382721, "epoch": 2278} {"train_loss": -11.679285049438477, "global_step": 382722, "epoch": 2278} {"train_loss": -12.12724781036377, "global_step": 382723, "epoch": 2278} {"train_loss": -11.81635856628418, "global_step": 382724, "epoch": 2278} {"train_loss": -12.358796119689941, "global_step": 382725, "epoch": 2278} {"train_loss": -12.138738632202148, "global_step": 382726, "epoch": 2278} {"train_loss": -12.055608749389648, "global_step": 382727, "epoch": 2278} {"train_loss": -12.102092742919922, "global_step": 382728, "epoch": 2278} {"train_loss": -12.168926239013672, "global_step": 382729, "epoch": 2278} {"train_loss": -12.144572257995605, "global_step": 382730, "epoch": 2278} {"train_loss": -11.861867904663086, "global_step": 382731, "epoch": 2278} {"train_loss": -12.163076400756836, "global_step": 382732, "epoch": 2278} {"train_loss": -12.098747253417969, "global_step": 382733, "epoch": 2278} {"train_loss": -12.166358947753906, "global_step": 382734, "epoch": 2278} {"train_loss": -12.386363983154297, "global_step": 382735, "epoch": 2278} {"train_loss": -11.743986129760742, "global_step": 382736, "epoch": 2278} {"train_loss": -12.138662338256836, "global_step": 382737, "epoch": 2278} {"train_loss": -11.94277286529541, "global_step": 382738, "epoch": 2278} {"train_loss": -12.5433988571167, "global_step": 382739, "epoch": 2278} {"train_loss": -11.877633094787598, "global_step": 382740, "epoch": 2278} {"train_loss": -12.123529434204102, "global_step": 382741, "epoch": 2278} {"train_loss": -12.288403511047363, "global_step": 382742, "epoch": 2278} {"train_loss": -11.744441986083984, "global_step": 382743, "epoch": 2278} {"train_loss": -12.504878997802734, "global_step": 382744, "epoch": 2278} {"train_loss": -12.173625946044922, "global_step": 382745, "epoch": 2278} {"train_loss": -11.711723327636719, "global_step": 382746, "epoch": 2278} {"train_loss": -12.306525230407715, "global_step": 382747, "epoch": 2278} {"train_loss": -11.816343307495117, "global_step": 382748, "epoch": 2278} {"train_loss": -12.31679630279541, "global_step": 382749, "epoch": 2278} {"train_loss": -12.333295822143555, "global_step": 382750, "epoch": 2278} {"train_loss": -12.462838172912598, "global_step": 382751, "epoch": 2278} {"train_loss": -12.515439987182617, "global_step": 382752, "epoch": 2278} {"train_loss": -12.09908390045166, "global_step": 382753, "epoch": 2278} {"train_loss": -12.408591270446777, "global_step": 382754, "epoch": 2278} {"train_loss": -12.389299392700195, "global_step": 382755, "epoch": 2278} {"train_loss": -12.057783126831055, "global_step": 382756, "epoch": 2278} {"train_loss": -12.496587753295898, "global_step": 382757, "epoch": 2278} {"train_loss": -12.40863037109375, "global_step": 382758, "epoch": 2278} {"train_loss": -12.44023609161377, "global_step": 382759, "epoch": 2278} {"train_loss": -12.33401870727539, "global_step": 382760, "epoch": 2278} {"train_loss": -12.380208015441895, "global_step": 382761, "epoch": 2278} {"train_loss": -12.534455299377441, "global_step": 382762, "epoch": 2278} {"train_loss": -12.462711334228516, "global_step": 382763, "epoch": 2278} {"train_loss": -12.52260971069336, "global_step": 382764, "epoch": 2278} {"train_loss": -12.556546211242676, "global_step": 382765, "epoch": 2278} {"train_loss": -12.602023124694824, "global_step": 382766, "epoch": 2278} {"train_loss": -12.452394485473633, "global_step": 382767, "epoch": 2278} {"train_loss": -12.256704330444336, "global_step": 382768, "epoch": 2278} {"train_loss": -12.531357765197754, "global_step": 382769, "epoch": 2278} {"train_loss": -12.478565216064453, "global_step": 382770, "epoch": 2278} {"train_loss": -12.543655395507812, "global_step": 382771, "epoch": 2278} {"train_loss": -12.290472030639648, "global_step": 382772, "epoch": 2278} {"train_loss": -12.562540054321289, "global_step": 382773, "epoch": 2278} {"train_loss": -12.431316375732422, "global_step": 382774, "epoch": 2278} {"train_loss": -12.056363105773926, "global_step": 382775, "epoch": 2278} {"train_loss": -12.417518615722656, "global_step": 382776, "epoch": 2278} {"train_loss": -11.603876113891602, "global_step": 382777, "epoch": 2278} {"train_loss": -12.660425186157227, "global_step": 382778, "epoch": 2278} {"train_loss": -12.591374397277832, "global_step": 382779, "epoch": 2278} {"train_loss": -12.585323333740234, "global_step": 382780, "epoch": 2278} {"train_loss": -12.4464750289917, "global_step": 382781, "epoch": 2278} {"train_loss": -12.702142715454102, "global_step": 382782, "epoch": 2278} {"train_loss": -12.675948143005371, "global_step": 382783, "epoch": 2278} {"train_loss": -12.01041030883789, "global_step": 382784, "epoch": 2278} {"train_loss": -12.64478874206543, "global_step": 382785, "epoch": 2278} {"train_loss": -12.336377143859863, "global_step": 382786, "epoch": 2278} {"train_loss": -12.486445426940918, "global_step": 382787, "epoch": 2278} {"train_loss": -12.31610107421875, "global_step": 382788, "epoch": 2278} {"train_loss": -12.49802017211914, "global_step": 382789, "epoch": 2278} {"train_loss": -12.470821380615234, "global_step": 382790, "epoch": 2278} {"train_loss": -12.516117095947266, "global_step": 382791, "epoch": 2278} {"train_loss": -12.324833869934082, "global_step": 382792, "epoch": 2278} {"train_loss": -12.350593566894531, "global_step": 382793, "epoch": 2278} {"train_loss": -12.344974517822266, "global_step": 382794, "epoch": 2278} {"train_loss": -12.521382331848145, "global_step": 382795, "epoch": 2278} {"train_loss": -12.628671646118164, "global_step": 382796, "epoch": 2278} {"train_loss": -12.265670776367188, "global_step": 382797, "epoch": 2278} {"train_loss": -12.308649063110352, "global_step": 382798, "epoch": 2278} {"train_loss": -12.210991859436035, "global_step": 382799, "epoch": 2278} {"train_loss": -12.733805656433105, "global_step": 382800, "epoch": 2278} {"train_loss": -12.251801490783691, "global_step": 382801, "epoch": 2278} {"train_loss": -11.745058059692383, "global_step": 382802, "epoch": 2278} {"train_loss": -12.000341415405273, "global_step": 382803, "epoch": 2278} {"train_loss": -12.604415893554688, "global_step": 382804, "epoch": 2278} {"train_loss": -12.301778793334961, "global_step": 382805, "epoch": 2278} {"train_loss": -12.215118408203125, "global_step": 382806, "epoch": 2278} {"train_loss": -12.502176284790039, "global_step": 382807, "epoch": 2278} {"train_loss": -12.268728256225586, "global_step": 382808, "epoch": 2278} {"train_loss": -11.807320594787598, "global_step": 382809, "epoch": 2278} {"train_loss": -12.303138732910156, "global_step": 382810, "epoch": 2278} {"train_loss": -10.812061309814453, "global_step": 382811, "epoch": 2278} {"train_loss": -11.763078689575195, "global_step": 382812, "epoch": 2278} {"train_loss": -11.753551483154297, "global_step": 382813, "epoch": 2278} {"train_loss": -11.165674209594727, "global_step": 382814, "epoch": 2278} {"train_loss": -11.41942024230957, "global_step": 382815, "epoch": 2278} {"train_loss": -11.058034896850586, "global_step": 382816, "epoch": 2278} {"train_loss": -9.140204429626465, "global_step": 382817, "epoch": 2278} {"train_loss": -11.35650634765625, "global_step": 382818, "epoch": 2278} {"train_loss": -8.829208374023438, "global_step": 382819, "epoch": 2278} {"train_loss": -8.225835800170898, "global_step": 382820, "epoch": 2278} {"train_loss": -9.191591262817383, "global_step": 382821, "epoch": 2278} {"train_loss": -11.243847846984863, "global_step": 382822, "epoch": 2278} {"train_loss": -9.982110977172852, "global_step": 382823, "epoch": 2278} {"train_loss": -9.700712203979492, "global_step": 382824, "epoch": 2278} {"train_loss": -10.46163558959961, "global_step": 382825, "epoch": 2278} {"train_loss": -10.14427661895752, "global_step": 382826, "epoch": 2278} {"train_loss": -11.065288543701172, "global_step": 382827, "epoch": 2278} {"train_loss": -9.730860710144043, "global_step": 382828, "epoch": 2278} {"train_loss": -9.173774719238281, "global_step": 382829, "epoch": 2278} {"train_loss": -11.141241073608398, "global_step": 382830, "epoch": 2278} {"train_loss": -11.369009017944336, "global_step": 382831, "epoch": 2278} {"train_loss": -11.14625358581543, "global_step": 382832, "epoch": 2278} {"train_loss": -11.733845710754395, "global_step": 382833, "epoch": 2278} {"train_loss": -11.206672668457031, "global_step": 382834, "epoch": 2278} {"train_loss": -11.340570449829102, "global_step": 382835, "epoch": 2278} {"train_loss": -11.771265029907227, "global_step": 382836, "epoch": 2278} {"train_loss": -11.299513816833496, "global_step": 382837, "epoch": 2278} {"train_loss": -11.375813484191895, "global_step": 382838, "epoch": 2278} {"train_loss": -11.662519454956055, "global_step": 382839, "epoch": 2278} {"train_loss": -11.471906661987305, "global_step": 382840, "epoch": 2278} {"train_loss": -11.579188346862793, "global_step": 382841, "epoch": 2278} {"train_loss": -11.068487167358398, "global_step": 382842, "epoch": 2278} {"train_loss": -11.627366065979004, "global_step": 382843, "epoch": 2278} {"train_loss": -11.00982666015625, "global_step": 382844, "epoch": 2278} {"train_loss": -11.337182998657227, "global_step": 382845, "epoch": 2278} {"train_loss": -11.088031768798828, "global_step": 382846, "epoch": 2278} {"train_loss": -10.660978317260742, "global_step": 382847, "epoch": 2278} {"train_loss": -11.864110946655273, "global_step": 382848, "epoch": 2278} {"train_loss": -11.38827133178711, "global_step": 382849, "epoch": 2278} {"train_loss": -12.040449142456055, "global_step": 382850, "epoch": 2278} {"train_loss": -11.679037094116211, "global_step": 382851, "epoch": 2278} {"train_loss": -11.878002166748047, "global_step": 382852, "epoch": 2278} {"train_loss": -11.708065032958984, "global_step": 382853, "epoch": 2278} {"train_loss": -11.93802261352539, "global_step": 382854, "epoch": 2278} {"train_loss": -10.895566940307617, "global_step": 382855, "epoch": 2278} {"train_loss": -10.924213409423828, "global_step": 382856, "epoch": 2278} {"train_loss": -11.987981796264648, "global_step": 382857, "epoch": 2278} {"train_loss": -12.075380325317383, "global_step": 382858, "epoch": 2278} {"train_loss": -10.539332389831543, "global_step": 382859, "epoch": 2278} {"train_loss": -10.924333572387695, "global_step": 382860, "epoch": 2278} {"train_loss": -8.483509063720703, "global_step": 382861, "epoch": 2278} {"train_loss": -10.413055419921875, "global_step": 382862, "epoch": 2278} {"train_loss": -10.888872146606445, "global_step": 382863, "epoch": 2278} {"train_loss": -10.859841346740723, "global_step": 382864, "epoch": 2278} {"train_loss": -11.554034233093262, "global_step": 382865, "epoch": 2278} {"train_loss": -10.837238311767578, "global_step": 382866, "epoch": 2278} {"train_loss": -10.725910186767578, "global_step": 382867, "epoch": 2278} {"train_loss": -11.539084434509277, "global_step": 382868, "epoch": 2278} {"train_loss": -11.753435134887695, "global_step": 382869, "epoch": 2278} {"train_loss": -11.022058486938477, "global_step": 382870, "epoch": 2278} {"train_loss": -11.713317763237725, "global_step": 382871, "epoch": 2278, "val_loss": 307060.40625} {"train_loss": -11.508380889892578, "global_step": 382872, "epoch": 2279} {"train_loss": -11.39398193359375, "global_step": 382873, "epoch": 2279} {"train_loss": -11.524097442626953, "global_step": 382874, "epoch": 2279} {"train_loss": -11.34826374053955, "global_step": 382875, "epoch": 2279} {"train_loss": -11.223214149475098, "global_step": 382876, "epoch": 2279} {"train_loss": -11.25601577758789, "global_step": 382877, "epoch": 2279} {"train_loss": -11.10316276550293, "global_step": 382878, "epoch": 2279} {"train_loss": -11.543978691101074, "global_step": 382879, "epoch": 2279} {"train_loss": -11.589395523071289, "global_step": 382880, "epoch": 2279} {"train_loss": -11.82343864440918, "global_step": 382881, "epoch": 2279} {"train_loss": -11.421741485595703, "global_step": 382882, "epoch": 2279} {"train_loss": -11.729974746704102, "global_step": 382883, "epoch": 2279} {"train_loss": -11.599658012390137, "global_step": 382884, "epoch": 2279} {"train_loss": -11.497547149658203, "global_step": 382885, "epoch": 2279} {"train_loss": -11.670914649963379, "global_step": 382886, "epoch": 2279} {"train_loss": -11.590192794799805, "global_step": 382887, "epoch": 2279} {"train_loss": -11.743236541748047, "global_step": 382888, "epoch": 2279} {"train_loss": -11.758313179016113, "global_step": 382889, "epoch": 2279} {"train_loss": -11.97829532623291, "global_step": 382890, "epoch": 2279} {"train_loss": -11.943683624267578, "global_step": 382891, "epoch": 2279} {"train_loss": -12.12641716003418, "global_step": 382892, "epoch": 2279} {"train_loss": -11.867741584777832, "global_step": 382893, "epoch": 2279} {"train_loss": -12.107889175415039, "global_step": 382894, "epoch": 2279} {"train_loss": -11.616125106811523, "global_step": 382895, "epoch": 2279} {"train_loss": -10.994948387145996, "global_step": 382896, "epoch": 2279} {"train_loss": -11.952421188354492, "global_step": 382897, "epoch": 2279} {"train_loss": -11.87792682647705, "global_step": 382898, "epoch": 2279} {"train_loss": -11.792558670043945, "global_step": 382899, "epoch": 2279} {"train_loss": -11.739190101623535, "global_step": 382900, "epoch": 2279} {"train_loss": -12.008136749267578, "global_step": 382901, "epoch": 2279} {"train_loss": -11.433036804199219, "global_step": 382902, "epoch": 2279} {"train_loss": -12.083005905151367, "global_step": 382903, "epoch": 2279} {"train_loss": -11.51544189453125, "global_step": 382904, "epoch": 2279} {"train_loss": -11.82382583618164, "global_step": 382905, "epoch": 2279} {"train_loss": -11.934919357299805, "global_step": 382906, "epoch": 2279} {"train_loss": -12.205770492553711, "global_step": 382907, "epoch": 2279} {"train_loss": -10.961148262023926, "global_step": 382908, "epoch": 2279} {"train_loss": -11.967071533203125, "global_step": 382909, "epoch": 2279} {"train_loss": -12.101726531982422, "global_step": 382910, "epoch": 2279} {"train_loss": -12.058629989624023, "global_step": 382911, "epoch": 2279} {"train_loss": -11.56260871887207, "global_step": 382912, "epoch": 2279} {"train_loss": -12.365601539611816, "global_step": 382913, "epoch": 2279} {"train_loss": -11.846525192260742, "global_step": 382914, "epoch": 2279} {"train_loss": -12.13898754119873, "global_step": 382915, "epoch": 2279} {"train_loss": -11.499029159545898, "global_step": 382916, "epoch": 2279} {"train_loss": -11.579387664794922, "global_step": 382917, "epoch": 2279} {"train_loss": -12.286985397338867, "global_step": 382918, "epoch": 2279} {"train_loss": -11.88262939453125, "global_step": 382919, "epoch": 2279} {"train_loss": -12.17945671081543, "global_step": 382920, "epoch": 2279} {"train_loss": -11.81218147277832, "global_step": 382921, "epoch": 2279} {"train_loss": -12.186683654785156, "global_step": 382922, "epoch": 2279} {"train_loss": -12.090964317321777, "global_step": 382923, "epoch": 2279} {"train_loss": -11.643564224243164, "global_step": 382924, "epoch": 2279} {"train_loss": -11.965788841247559, "global_step": 382925, "epoch": 2279} {"train_loss": -11.871935844421387, "global_step": 382926, "epoch": 2279} {"train_loss": -11.373065948486328, "global_step": 382927, "epoch": 2279} {"train_loss": -12.281689643859863, "global_step": 382928, "epoch": 2279} {"train_loss": -12.227078437805176, "global_step": 382929, "epoch": 2279} {"train_loss": -12.36023998260498, "global_step": 382930, "epoch": 2279} {"train_loss": -12.517425537109375, "global_step": 382931, "epoch": 2279} {"train_loss": -12.373869895935059, "global_step": 382932, "epoch": 2279} {"train_loss": -12.361948013305664, "global_step": 382933, "epoch": 2279} {"train_loss": -12.335929870605469, "global_step": 382934, "epoch": 2279} {"train_loss": -12.068155288696289, "global_step": 382935, "epoch": 2279} {"train_loss": -12.242372512817383, "global_step": 382936, "epoch": 2279} {"train_loss": -11.881889343261719, "global_step": 382937, "epoch": 2279} {"train_loss": -11.829845428466797, "global_step": 382938, "epoch": 2279} {"train_loss": -12.009223937988281, "global_step": 382939, "epoch": 2279} {"train_loss": -12.409921646118164, "global_step": 382940, "epoch": 2279} {"train_loss": -12.04775619506836, "global_step": 382941, "epoch": 2279} {"train_loss": -11.936967849731445, "global_step": 382942, "epoch": 2279} {"train_loss": -12.641254425048828, "global_step": 382943, "epoch": 2279} {"train_loss": -12.411966323852539, "global_step": 382944, "epoch": 2279} {"train_loss": -12.307225227355957, "global_step": 382945, "epoch": 2279} {"train_loss": -12.181461334228516, "global_step": 382946, "epoch": 2279} {"train_loss": -12.38705062866211, "global_step": 382947, "epoch": 2279} {"train_loss": -12.254276275634766, "global_step": 382948, "epoch": 2279} {"train_loss": -12.452898979187012, "global_step": 382949, "epoch": 2279} {"train_loss": -12.471538543701172, "global_step": 382950, "epoch": 2279} {"train_loss": -12.543436050415039, "global_step": 382951, "epoch": 2279} {"train_loss": -12.473915100097656, "global_step": 382952, "epoch": 2279} {"train_loss": -12.17611312866211, "global_step": 382953, "epoch": 2279} {"train_loss": -12.215370178222656, "global_step": 382954, "epoch": 2279} {"train_loss": -12.432981491088867, "global_step": 382955, "epoch": 2279} {"train_loss": -12.251974105834961, "global_step": 382956, "epoch": 2279} {"train_loss": -12.54958724975586, "global_step": 382957, "epoch": 2279} {"train_loss": -12.149903297424316, "global_step": 382958, "epoch": 2279} {"train_loss": -12.11825180053711, "global_step": 382959, "epoch": 2279} {"train_loss": -12.524517059326172, "global_step": 382960, "epoch": 2279} {"train_loss": -12.420055389404297, "global_step": 382961, "epoch": 2279} {"train_loss": -12.470824241638184, "global_step": 382962, "epoch": 2279} {"train_loss": -12.234201431274414, "global_step": 382963, "epoch": 2279} {"train_loss": -12.497056007385254, "global_step": 382964, "epoch": 2279} {"train_loss": -12.163311004638672, "global_step": 382965, "epoch": 2279} {"train_loss": -12.719442367553711, "global_step": 382966, "epoch": 2279} {"train_loss": -12.277326583862305, "global_step": 382967, "epoch": 2279} {"train_loss": -12.415363311767578, "global_step": 382968, "epoch": 2279} {"train_loss": -12.636810302734375, "global_step": 382969, "epoch": 2279} {"train_loss": -12.069391250610352, "global_step": 382970, "epoch": 2279} {"train_loss": -11.989114761352539, "global_step": 382971, "epoch": 2279} {"train_loss": -12.622575759887695, "global_step": 382972, "epoch": 2279} {"train_loss": -12.408477783203125, "global_step": 382973, "epoch": 2279} {"train_loss": -12.312159538269043, "global_step": 382974, "epoch": 2279} {"train_loss": -12.386852264404297, "global_step": 382975, "epoch": 2279} {"train_loss": -12.110591888427734, "global_step": 382976, "epoch": 2279} {"train_loss": -11.793939590454102, "global_step": 382977, "epoch": 2279} {"train_loss": -11.846342086791992, "global_step": 382978, "epoch": 2279} {"train_loss": -12.277626037597656, "global_step": 382979, "epoch": 2279} {"train_loss": -12.363297462463379, "global_step": 382980, "epoch": 2279} {"train_loss": -11.839069366455078, "global_step": 382981, "epoch": 2279} {"train_loss": -12.080469131469727, "global_step": 382982, "epoch": 2279} {"train_loss": -12.242880821228027, "global_step": 382983, "epoch": 2279} {"train_loss": -12.451096534729004, "global_step": 382984, "epoch": 2279} {"train_loss": -12.104072570800781, "global_step": 382985, "epoch": 2279} {"train_loss": -12.340943336486816, "global_step": 382986, "epoch": 2279} {"train_loss": -12.35740852355957, "global_step": 382987, "epoch": 2279} {"train_loss": -12.241676330566406, "global_step": 382988, "epoch": 2279} {"train_loss": -12.675683975219727, "global_step": 382989, "epoch": 2279} {"train_loss": -12.635387420654297, "global_step": 382990, "epoch": 2279} {"train_loss": -12.448220252990723, "global_step": 382991, "epoch": 2279} {"train_loss": -12.135377883911133, "global_step": 382992, "epoch": 2279} {"train_loss": -12.5928955078125, "global_step": 382993, "epoch": 2279} {"train_loss": -12.215968132019043, "global_step": 382994, "epoch": 2279} {"train_loss": -12.466297149658203, "global_step": 382995, "epoch": 2279} {"train_loss": -12.460227966308594, "global_step": 382996, "epoch": 2279} {"train_loss": -12.876989364624023, "global_step": 382997, "epoch": 2279} {"train_loss": -12.525611877441406, "global_step": 382998, "epoch": 2279} {"train_loss": -12.385818481445312, "global_step": 382999, "epoch": 2279} {"train_loss": -12.480386734008789, "global_step": 383000, "epoch": 2279} {"train_loss": -12.720004081726074, "global_step": 383001, "epoch": 2279} {"train_loss": -12.597127914428711, "global_step": 383002, "epoch": 2279} {"train_loss": -12.602570533752441, "global_step": 383003, "epoch": 2279} {"train_loss": -12.201314926147461, "global_step": 383004, "epoch": 2279} {"train_loss": -12.180707931518555, "global_step": 383005, "epoch": 2279} {"train_loss": -11.97762680053711, "global_step": 383006, "epoch": 2279} {"train_loss": -12.741376876831055, "global_step": 383007, "epoch": 2279} {"train_loss": -12.032623291015625, "global_step": 383008, "epoch": 2279} {"train_loss": -12.163741111755371, "global_step": 383009, "epoch": 2279} {"train_loss": -12.312382698059082, "global_step": 383010, "epoch": 2279} {"train_loss": -12.275795936584473, "global_step": 383011, "epoch": 2279} {"train_loss": -12.612305641174316, "global_step": 383012, "epoch": 2279} {"train_loss": -11.362770080566406, "global_step": 383013, "epoch": 2279} {"train_loss": -10.831100463867188, "global_step": 383014, "epoch": 2279} {"train_loss": -10.964999198913574, "global_step": 383015, "epoch": 2279} {"train_loss": -11.988643646240234, "global_step": 383016, "epoch": 2279} {"train_loss": -11.634695053100586, "global_step": 383017, "epoch": 2279} {"train_loss": -9.943777084350586, "global_step": 383018, "epoch": 2279} {"train_loss": -10.252522468566895, "global_step": 383019, "epoch": 2279} {"train_loss": -11.030012130737305, "global_step": 383020, "epoch": 2279} {"train_loss": -10.537503242492676, "global_step": 383021, "epoch": 2279} {"train_loss": -11.091739654541016, "global_step": 383022, "epoch": 2279} {"train_loss": -10.978466033935547, "global_step": 383023, "epoch": 2279} {"train_loss": -10.790325164794922, "global_step": 383024, "epoch": 2279} {"train_loss": -11.746699333190918, "global_step": 383025, "epoch": 2279} {"train_loss": -10.43459701538086, "global_step": 383026, "epoch": 2279} {"train_loss": -12.001470565795898, "global_step": 383027, "epoch": 2279} {"train_loss": -11.828215599060059, "global_step": 383028, "epoch": 2279} {"train_loss": -10.847526550292969, "global_step": 383029, "epoch": 2279} {"train_loss": -11.371803283691406, "global_step": 383030, "epoch": 2279} {"train_loss": -11.469755172729492, "global_step": 383031, "epoch": 2279} {"train_loss": -11.260417938232422, "global_step": 383032, "epoch": 2279} {"train_loss": -11.697858810424805, "global_step": 383033, "epoch": 2279} {"train_loss": -11.444151878356934, "global_step": 383034, "epoch": 2279} {"train_loss": -11.541732788085938, "global_step": 383035, "epoch": 2279} {"train_loss": -11.162683486938477, "global_step": 383036, "epoch": 2279} {"train_loss": -10.643999099731445, "global_step": 383037, "epoch": 2279} {"train_loss": -11.964092254638672, "global_step": 383038, "epoch": 2279} {"train_loss": -11.941161939076014, "global_step": 383039, "epoch": 2279, "val_loss": 290336.375} {"train_loss": -11.73193359375, "global_step": 383040, "epoch": 2280} {"train_loss": -11.803486824035645, "global_step": 383041, "epoch": 2280} {"train_loss": -11.12971305847168, "global_step": 383042, "epoch": 2280} {"train_loss": -11.390982627868652, "global_step": 383043, "epoch": 2280} {"train_loss": -11.36696720123291, "global_step": 383044, "epoch": 2280} {"train_loss": -10.811052322387695, "global_step": 383045, "epoch": 2280} {"train_loss": -11.292940139770508, "global_step": 383046, "epoch": 2280} {"train_loss": -10.697492599487305, "global_step": 383047, "epoch": 2280} {"train_loss": -11.368416786193848, "global_step": 383048, "epoch": 2280} {"train_loss": -11.31161117553711, "global_step": 383049, "epoch": 2280} {"train_loss": -11.514595031738281, "global_step": 383050, "epoch": 2280} {"train_loss": -11.180665969848633, "global_step": 383051, "epoch": 2280} {"train_loss": -10.983023643493652, "global_step": 383052, "epoch": 2280} {"train_loss": -10.681967735290527, "global_step": 383053, "epoch": 2280} {"train_loss": -10.875057220458984, "global_step": 383054, "epoch": 2280} {"train_loss": -9.293922424316406, "global_step": 383055, "epoch": 2280} {"train_loss": -10.618016242980957, "global_step": 383056, "epoch": 2280} {"train_loss": -10.18563461303711, "global_step": 383057, "epoch": 2280} {"train_loss": -10.735281944274902, "global_step": 383058, "epoch": 2280} {"train_loss": -10.695432662963867, "global_step": 383059, "epoch": 2280} {"train_loss": -10.118724822998047, "global_step": 383060, "epoch": 2280} {"train_loss": -10.311573028564453, "global_step": 383061, "epoch": 2280} {"train_loss": -10.546696662902832, "global_step": 383062, "epoch": 2280} {"train_loss": -10.575018882751465, "global_step": 383063, "epoch": 2280} {"train_loss": -9.723453521728516, "global_step": 383064, "epoch": 2280} {"train_loss": -11.044794082641602, "global_step": 383065, "epoch": 2280} {"train_loss": -11.230798721313477, "global_step": 383066, "epoch": 2280} {"train_loss": -10.803153991699219, "global_step": 383067, "epoch": 2280} {"train_loss": -11.159748077392578, "global_step": 383068, "epoch": 2280} {"train_loss": -10.92685317993164, "global_step": 383069, "epoch": 2280} {"train_loss": -11.574715614318848, "global_step": 383070, "epoch": 2280} {"train_loss": -11.550893783569336, "global_step": 383071, "epoch": 2280} {"train_loss": -11.395528793334961, "global_step": 383072, "epoch": 2280} {"train_loss": -11.953780174255371, "global_step": 383073, "epoch": 2280} {"train_loss": -11.450128555297852, "global_step": 383074, "epoch": 2280} {"train_loss": -11.804832458496094, "global_step": 383075, "epoch": 2280} {"train_loss": -11.598583221435547, "global_step": 383076, "epoch": 2280} {"train_loss": -12.007538795471191, "global_step": 383077, "epoch": 2280} {"train_loss": -12.095276832580566, "global_step": 383078, "epoch": 2280} {"train_loss": -12.063440322875977, "global_step": 383079, "epoch": 2280} {"train_loss": -11.68628978729248, "global_step": 383080, "epoch": 2280} {"train_loss": -11.89480209350586, "global_step": 383081, "epoch": 2280} {"train_loss": -11.371896743774414, "global_step": 383082, "epoch": 2280} {"train_loss": -12.00625228881836, "global_step": 383083, "epoch": 2280} {"train_loss": -11.620048522949219, "global_step": 383084, "epoch": 2280} {"train_loss": -11.87698745727539, "global_step": 383085, "epoch": 2280} {"train_loss": -12.003543853759766, "global_step": 383086, "epoch": 2280} {"train_loss": -11.834370613098145, "global_step": 383087, "epoch": 2280} {"train_loss": -12.203912734985352, "global_step": 383088, "epoch": 2280} {"train_loss": -11.930147171020508, "global_step": 383089, "epoch": 2280} {"train_loss": -12.053655624389648, "global_step": 383090, "epoch": 2280} {"train_loss": -11.915595054626465, "global_step": 383091, "epoch": 2280} {"train_loss": -12.012436866760254, "global_step": 383092, "epoch": 2280} {"train_loss": -11.980413436889648, "global_step": 383093, "epoch": 2280} {"train_loss": -11.953289031982422, "global_step": 383094, "epoch": 2280} {"train_loss": -12.101428985595703, "global_step": 383095, "epoch": 2280} {"train_loss": -11.760906219482422, "global_step": 383096, "epoch": 2280} {"train_loss": -11.832630157470703, "global_step": 383097, "epoch": 2280} {"train_loss": -12.320557594299316, "global_step": 383098, "epoch": 2280} {"train_loss": -11.831876754760742, "global_step": 383099, "epoch": 2280} {"train_loss": -12.25599479675293, "global_step": 383100, "epoch": 2280} {"train_loss": -11.93263053894043, "global_step": 383101, "epoch": 2280} {"train_loss": -12.020038604736328, "global_step": 383102, "epoch": 2280} {"train_loss": -11.966325759887695, "global_step": 383103, "epoch": 2280} {"train_loss": -11.999237060546875, "global_step": 383104, "epoch": 2280} {"train_loss": -12.233061790466309, "global_step": 383105, "epoch": 2280} {"train_loss": -12.053544998168945, "global_step": 383106, "epoch": 2280} {"train_loss": -12.099084854125977, "global_step": 383107, "epoch": 2280} {"train_loss": -12.207509994506836, "global_step": 383108, "epoch": 2280} {"train_loss": -12.21955680847168, "global_step": 383109, "epoch": 2280} {"train_loss": -11.94670295715332, "global_step": 383110, "epoch": 2280} {"train_loss": -12.151594161987305, "global_step": 383111, "epoch": 2280} {"train_loss": -12.187219619750977, "global_step": 383112, "epoch": 2280} {"train_loss": -12.121292114257812, "global_step": 383113, "epoch": 2280} {"train_loss": -12.294140815734863, "global_step": 383114, "epoch": 2280} {"train_loss": -12.468238830566406, "global_step": 383115, "epoch": 2280} {"train_loss": -12.464424133300781, "global_step": 383116, "epoch": 2280} {"train_loss": -12.36212158203125, "global_step": 383117, "epoch": 2280} {"train_loss": -12.414124488830566, "global_step": 383118, "epoch": 2280} {"train_loss": -12.008544921875, "global_step": 383119, "epoch": 2280} {"train_loss": -12.247528076171875, "global_step": 383120, "epoch": 2280} {"train_loss": -12.205663681030273, "global_step": 383121, "epoch": 2280} {"train_loss": -12.39538860321045, "global_step": 383122, "epoch": 2280} {"train_loss": -12.585596084594727, "global_step": 383123, "epoch": 2280} {"train_loss": -12.502188682556152, "global_step": 383124, "epoch": 2280} {"train_loss": -12.63940143585205, "global_step": 383125, "epoch": 2280} {"train_loss": -12.575740814208984, "global_step": 383126, "epoch": 2280} {"train_loss": -12.077644348144531, "global_step": 383127, "epoch": 2280} {"train_loss": -12.622177124023438, "global_step": 383128, "epoch": 2280} {"train_loss": -12.184879302978516, "global_step": 383129, "epoch": 2280} {"train_loss": -12.581928253173828, "global_step": 383130, "epoch": 2280} {"train_loss": -12.579051971435547, "global_step": 383131, "epoch": 2280} {"train_loss": -12.37010669708252, "global_step": 383132, "epoch": 2280} {"train_loss": -12.51902961730957, "global_step": 383133, "epoch": 2280} {"train_loss": -12.36610221862793, "global_step": 383134, "epoch": 2280} {"train_loss": -12.314617156982422, "global_step": 383135, "epoch": 2280} {"train_loss": -12.575194358825684, "global_step": 383136, "epoch": 2280} {"train_loss": -12.397913932800293, "global_step": 383137, "epoch": 2280} {"train_loss": -12.35556411743164, "global_step": 383138, "epoch": 2280} {"train_loss": -12.513566970825195, "global_step": 383139, "epoch": 2280} {"train_loss": -12.4344482421875, "global_step": 383140, "epoch": 2280} {"train_loss": -12.432300567626953, "global_step": 383141, "epoch": 2280} {"train_loss": -12.547252655029297, "global_step": 383142, "epoch": 2280} {"train_loss": -12.486137390136719, "global_step": 383143, "epoch": 2280} {"train_loss": -12.417997360229492, "global_step": 383144, "epoch": 2280} {"train_loss": -12.47970962524414, "global_step": 383145, "epoch": 2280} {"train_loss": -12.457921981811523, "global_step": 383146, "epoch": 2280} {"train_loss": -12.434277534484863, "global_step": 383147, "epoch": 2280} {"train_loss": -12.609901428222656, "global_step": 383148, "epoch": 2280} {"train_loss": -12.406656265258789, "global_step": 383149, "epoch": 2280} {"train_loss": -12.15205192565918, "global_step": 383150, "epoch": 2280} {"train_loss": -12.691149711608887, "global_step": 383151, "epoch": 2280} {"train_loss": -12.611150741577148, "global_step": 383152, "epoch": 2280} {"train_loss": -12.584970474243164, "global_step": 383153, "epoch": 2280} {"train_loss": -12.378986358642578, "global_step": 383154, "epoch": 2280} {"train_loss": -12.629287719726562, "global_step": 383155, "epoch": 2280} {"train_loss": -12.551589965820312, "global_step": 383156, "epoch": 2280} {"train_loss": -12.611421585083008, "global_step": 383157, "epoch": 2280} {"train_loss": -12.402118682861328, "global_step": 383158, "epoch": 2280} {"train_loss": -12.19637680053711, "global_step": 383159, "epoch": 2280} {"train_loss": -12.405390739440918, "global_step": 383160, "epoch": 2280} {"train_loss": -12.405674934387207, "global_step": 383161, "epoch": 2280} {"train_loss": -12.260684967041016, "global_step": 383162, "epoch": 2280} {"train_loss": -11.901708602905273, "global_step": 383163, "epoch": 2280} {"train_loss": -12.72780704498291, "global_step": 383164, "epoch": 2280} {"train_loss": -12.169548034667969, "global_step": 383165, "epoch": 2280} {"train_loss": -12.48250961303711, "global_step": 383166, "epoch": 2280} {"train_loss": -12.77402114868164, "global_step": 383167, "epoch": 2280} {"train_loss": -12.386474609375, "global_step": 383168, "epoch": 2280} {"train_loss": -12.236810684204102, "global_step": 383169, "epoch": 2280} {"train_loss": -12.281505584716797, "global_step": 383170, "epoch": 2280} {"train_loss": -12.58344554901123, "global_step": 383171, "epoch": 2280} {"train_loss": -12.19270133972168, "global_step": 383172, "epoch": 2280} {"train_loss": -12.142339706420898, "global_step": 383173, "epoch": 2280} {"train_loss": -12.00972843170166, "global_step": 383174, "epoch": 2280} {"train_loss": -12.39358139038086, "global_step": 383175, "epoch": 2280} {"train_loss": -12.383890151977539, "global_step": 383176, "epoch": 2280} {"train_loss": -12.724435806274414, "global_step": 383177, "epoch": 2280} {"train_loss": -12.178791046142578, "global_step": 383178, "epoch": 2280} {"train_loss": -12.422849655151367, "global_step": 383179, "epoch": 2280} {"train_loss": -11.996990203857422, "global_step": 383180, "epoch": 2280} {"train_loss": -12.425168991088867, "global_step": 383181, "epoch": 2280} {"train_loss": -12.216181755065918, "global_step": 383182, "epoch": 2280} {"train_loss": -12.763647079467773, "global_step": 383183, "epoch": 2280} {"train_loss": -12.083585739135742, "global_step": 383184, "epoch": 2280} {"train_loss": -12.495491981506348, "global_step": 383185, "epoch": 2280} {"train_loss": -12.167268753051758, "global_step": 383186, "epoch": 2280} {"train_loss": -12.36712646484375, "global_step": 383187, "epoch": 2280} {"train_loss": -12.225109100341797, "global_step": 383188, "epoch": 2280} {"train_loss": -12.523758888244629, "global_step": 383189, "epoch": 2280} {"train_loss": -12.171781539916992, "global_step": 383190, "epoch": 2280} {"train_loss": -12.667799949645996, "global_step": 383191, "epoch": 2280} {"train_loss": -12.553253173828125, "global_step": 383192, "epoch": 2280} {"train_loss": -12.401052474975586, "global_step": 383193, "epoch": 2280} {"train_loss": -12.488831520080566, "global_step": 383194, "epoch": 2280} {"train_loss": -12.105053901672363, "global_step": 383195, "epoch": 2280} {"train_loss": -11.751493453979492, "global_step": 383196, "epoch": 2280} {"train_loss": -11.63619613647461, "global_step": 383197, "epoch": 2280} {"train_loss": -12.171821594238281, "global_step": 383198, "epoch": 2280} {"train_loss": -12.29630184173584, "global_step": 383199, "epoch": 2280} {"train_loss": -11.825349807739258, "global_step": 383200, "epoch": 2280} {"train_loss": -12.035870552062988, "global_step": 383201, "epoch": 2280} {"train_loss": -11.194982528686523, "global_step": 383202, "epoch": 2280} {"train_loss": -10.917350769042969, "global_step": 383203, "epoch": 2280} {"train_loss": -10.37533187866211, "global_step": 383204, "epoch": 2280} {"train_loss": -10.670757293701172, "global_step": 383205, "epoch": 2280} {"train_loss": -12.07297134399414, "global_step": 383206, "epoch": 2280} {"train_loss": -11.935900557608832, "global_step": 383207, "epoch": 2280, "val_loss": 292309.5625, "train_action_mse_error": 1.5155370235443115} {"train_loss": -11.381763458251953, "global_step": 383208, "epoch": 2281} {"train_loss": -10.24378776550293, "global_step": 383209, "epoch": 2281} {"train_loss": -10.387659072875977, "global_step": 383210, "epoch": 2281} {"train_loss": -11.482994079589844, "global_step": 383211, "epoch": 2281} {"train_loss": -10.40833854675293, "global_step": 383212, "epoch": 2281} {"train_loss": -10.088946342468262, "global_step": 383213, "epoch": 2281} {"train_loss": -10.96463394165039, "global_step": 383214, "epoch": 2281} {"train_loss": -11.743870735168457, "global_step": 383215, "epoch": 2281} {"train_loss": -9.62977409362793, "global_step": 383216, "epoch": 2281} {"train_loss": -10.597816467285156, "global_step": 383217, "epoch": 2281} {"train_loss": -10.88802433013916, "global_step": 383218, "epoch": 2281} {"train_loss": -10.460905075073242, "global_step": 383219, "epoch": 2281} {"train_loss": -11.398115158081055, "global_step": 383220, "epoch": 2281} {"train_loss": -9.531280517578125, "global_step": 383221, "epoch": 2281} {"train_loss": -10.788105010986328, "global_step": 383222, "epoch": 2281} {"train_loss": -10.236652374267578, "global_step": 383223, "epoch": 2281} {"train_loss": -10.752551078796387, "global_step": 383224, "epoch": 2281} {"train_loss": -11.287097930908203, "global_step": 383225, "epoch": 2281} {"train_loss": -10.470405578613281, "global_step": 383226, "epoch": 2281} {"train_loss": -11.040407180786133, "global_step": 383227, "epoch": 2281} {"train_loss": -11.446022033691406, "global_step": 383228, "epoch": 2281} {"train_loss": -10.64758014678955, "global_step": 383229, "epoch": 2281} {"train_loss": -11.641061782836914, "global_step": 383230, "epoch": 2281} {"train_loss": -10.207356452941895, "global_step": 383231, "epoch": 2281} {"train_loss": -11.057180404663086, "global_step": 383232, "epoch": 2281} {"train_loss": -11.347518920898438, "global_step": 383233, "epoch": 2281} {"train_loss": -11.285853385925293, "global_step": 383234, "epoch": 2281} {"train_loss": -11.029715538024902, "global_step": 383235, "epoch": 2281} {"train_loss": -11.06025505065918, "global_step": 383236, "epoch": 2281} {"train_loss": -11.368295669555664, "global_step": 383237, "epoch": 2281} {"train_loss": -11.424306869506836, "global_step": 383238, "epoch": 2281} {"train_loss": -11.680086135864258, "global_step": 383239, "epoch": 2281} {"train_loss": -10.767997741699219, "global_step": 383240, "epoch": 2281} {"train_loss": -11.89578628540039, "global_step": 383241, "epoch": 2281} {"train_loss": -10.982131004333496, "global_step": 383242, "epoch": 2281} {"train_loss": -11.742835998535156, "global_step": 383243, "epoch": 2281} {"train_loss": -11.726566314697266, "global_step": 383244, "epoch": 2281} {"train_loss": -11.70228385925293, "global_step": 383245, "epoch": 2281} {"train_loss": -12.153610229492188, "global_step": 383246, "epoch": 2281} {"train_loss": -11.77018928527832, "global_step": 383247, "epoch": 2281} {"train_loss": -11.736488342285156, "global_step": 383248, "epoch": 2281} {"train_loss": -12.0118408203125, "global_step": 383249, "epoch": 2281} {"train_loss": -12.154727935791016, "global_step": 383250, "epoch": 2281} {"train_loss": -11.640358924865723, "global_step": 383251, "epoch": 2281} {"train_loss": -11.95710277557373, "global_step": 383252, "epoch": 2281} {"train_loss": -11.964471817016602, "global_step": 383253, "epoch": 2281} {"train_loss": -12.110595703125, "global_step": 383254, "epoch": 2281} {"train_loss": -11.796039581298828, "global_step": 383255, "epoch": 2281} {"train_loss": -11.974879264831543, "global_step": 383256, "epoch": 2281} {"train_loss": -12.070369720458984, "global_step": 383257, "epoch": 2281} {"train_loss": -11.909479141235352, "global_step": 383258, "epoch": 2281} {"train_loss": -12.081323623657227, "global_step": 383259, "epoch": 2281} {"train_loss": -12.11562728881836, "global_step": 383260, "epoch": 2281} {"train_loss": -12.134011268615723, "global_step": 383261, "epoch": 2281} {"train_loss": -12.003671646118164, "global_step": 383262, "epoch": 2281} {"train_loss": -12.011488914489746, "global_step": 383263, "epoch": 2281} {"train_loss": -12.223261833190918, "global_step": 383264, "epoch": 2281} {"train_loss": -12.234392166137695, "global_step": 383265, "epoch": 2281} {"train_loss": -12.26276683807373, "global_step": 383266, "epoch": 2281} {"train_loss": -12.063542366027832, "global_step": 383267, "epoch": 2281} {"train_loss": -12.328022003173828, "global_step": 383268, "epoch": 2281} {"train_loss": -12.34480094909668, "global_step": 383269, "epoch": 2281} {"train_loss": -12.300105094909668, "global_step": 383270, "epoch": 2281} {"train_loss": -12.22787857055664, "global_step": 383271, "epoch": 2281} {"train_loss": -12.328941345214844, "global_step": 383272, "epoch": 2281} {"train_loss": -12.418367385864258, "global_step": 383273, "epoch": 2281} {"train_loss": -12.465588569641113, "global_step": 383274, "epoch": 2281} {"train_loss": -12.278186798095703, "global_step": 383275, "epoch": 2281} {"train_loss": -12.249032974243164, "global_step": 383276, "epoch": 2281} {"train_loss": -12.507386207580566, "global_step": 383277, "epoch": 2281} {"train_loss": -12.203374862670898, "global_step": 383278, "epoch": 2281} {"train_loss": -12.38403606414795, "global_step": 383279, "epoch": 2281} {"train_loss": -12.410929679870605, "global_step": 383280, "epoch": 2281} {"train_loss": -12.13198471069336, "global_step": 383281, "epoch": 2281} {"train_loss": -12.479143142700195, "global_step": 383282, "epoch": 2281} {"train_loss": -12.477392196655273, "global_step": 383283, "epoch": 2281} {"train_loss": -12.69717025756836, "global_step": 383284, "epoch": 2281} {"train_loss": -12.480892181396484, "global_step": 383285, "epoch": 2281} {"train_loss": -12.638326644897461, "global_step": 383286, "epoch": 2281} {"train_loss": -12.51257038116455, "global_step": 383287, "epoch": 2281} {"train_loss": -12.54078197479248, "global_step": 383288, "epoch": 2281} {"train_loss": -12.291891098022461, "global_step": 383289, "epoch": 2281} {"train_loss": -12.531492233276367, "global_step": 383290, "epoch": 2281} {"train_loss": -12.491354942321777, "global_step": 383291, "epoch": 2281} {"train_loss": -12.521323204040527, "global_step": 383292, "epoch": 2281} {"train_loss": -12.649730682373047, "global_step": 383293, "epoch": 2281} {"train_loss": -12.552547454833984, "global_step": 383294, "epoch": 2281} {"train_loss": -12.626091957092285, "global_step": 383295, "epoch": 2281} {"train_loss": -12.591845512390137, "global_step": 383296, "epoch": 2281} {"train_loss": -12.455330848693848, "global_step": 383297, "epoch": 2281} {"train_loss": -12.625788688659668, "global_step": 383298, "epoch": 2281} {"train_loss": -12.414163589477539, "global_step": 383299, "epoch": 2281} {"train_loss": -12.596458435058594, "global_step": 383300, "epoch": 2281} {"train_loss": -12.236602783203125, "global_step": 383301, "epoch": 2281} {"train_loss": -12.42354965209961, "global_step": 383302, "epoch": 2281} {"train_loss": -12.52214241027832, "global_step": 383303, "epoch": 2281} {"train_loss": -12.544851303100586, "global_step": 383304, "epoch": 2281} {"train_loss": -12.577987670898438, "global_step": 383305, "epoch": 2281} {"train_loss": -12.342926025390625, "global_step": 383306, "epoch": 2281} {"train_loss": -12.72308349609375, "global_step": 383307, "epoch": 2281} {"train_loss": -12.45685863494873, "global_step": 383308, "epoch": 2281} {"train_loss": -12.661822319030762, "global_step": 383309, "epoch": 2281} {"train_loss": -12.591495513916016, "global_step": 383310, "epoch": 2281} {"train_loss": -12.656560897827148, "global_step": 383311, "epoch": 2281} {"train_loss": -12.575315475463867, "global_step": 383312, "epoch": 2281} {"train_loss": -12.781058311462402, "global_step": 383313, "epoch": 2281} {"train_loss": -12.623897552490234, "global_step": 383314, "epoch": 2281} {"train_loss": -12.743155479431152, "global_step": 383315, "epoch": 2281} {"train_loss": -12.709918975830078, "global_step": 383316, "epoch": 2281} {"train_loss": -12.624605178833008, "global_step": 383317, "epoch": 2281} {"train_loss": -12.529522895812988, "global_step": 383318, "epoch": 2281} {"train_loss": -12.744484901428223, "global_step": 383319, "epoch": 2281} {"train_loss": -12.440281867980957, "global_step": 383320, "epoch": 2281} {"train_loss": -12.689064979553223, "global_step": 383321, "epoch": 2281} {"train_loss": -12.385249137878418, "global_step": 383322, "epoch": 2281} {"train_loss": -12.661405563354492, "global_step": 383323, "epoch": 2281} {"train_loss": -12.690010070800781, "global_step": 383324, "epoch": 2281} {"train_loss": -12.262861251831055, "global_step": 383325, "epoch": 2281} {"train_loss": -12.508560180664062, "global_step": 383326, "epoch": 2281} {"train_loss": -12.473758697509766, "global_step": 383327, "epoch": 2281} {"train_loss": -11.741569519042969, "global_step": 383328, "epoch": 2281} {"train_loss": -11.147741317749023, "global_step": 383329, "epoch": 2281} {"train_loss": -11.84815502166748, "global_step": 383330, "epoch": 2281} {"train_loss": -11.475448608398438, "global_step": 383331, "epoch": 2281} {"train_loss": -11.552050590515137, "global_step": 383332, "epoch": 2281} {"train_loss": -12.033930778503418, "global_step": 383333, "epoch": 2281} {"train_loss": -11.449525833129883, "global_step": 383334, "epoch": 2281} {"train_loss": -10.987010955810547, "global_step": 383335, "epoch": 2281} {"train_loss": -11.39199447631836, "global_step": 383336, "epoch": 2281} {"train_loss": -11.868119239807129, "global_step": 383337, "epoch": 2281} {"train_loss": -10.91935920715332, "global_step": 383338, "epoch": 2281} {"train_loss": -12.471725463867188, "global_step": 383339, "epoch": 2281} {"train_loss": -11.188043594360352, "global_step": 383340, "epoch": 2281} {"train_loss": -11.483053207397461, "global_step": 383341, "epoch": 2281} {"train_loss": -12.175046920776367, "global_step": 383342, "epoch": 2281} {"train_loss": -12.218212127685547, "global_step": 383343, "epoch": 2281} {"train_loss": -12.057568550109863, "global_step": 383344, "epoch": 2281} {"train_loss": -12.501982688903809, "global_step": 383345, "epoch": 2281} {"train_loss": -12.019672393798828, "global_step": 383346, "epoch": 2281} {"train_loss": -11.766180038452148, "global_step": 383347, "epoch": 2281} {"train_loss": -12.252296447753906, "global_step": 383348, "epoch": 2281} {"train_loss": -11.647856712341309, "global_step": 383349, "epoch": 2281} {"train_loss": -12.17894458770752, "global_step": 383350, "epoch": 2281} {"train_loss": -12.182987213134766, "global_step": 383351, "epoch": 2281} {"train_loss": -12.185934066772461, "global_step": 383352, "epoch": 2281} {"train_loss": -11.980350494384766, "global_step": 383353, "epoch": 2281} {"train_loss": -12.203944206237793, "global_step": 383354, "epoch": 2281} {"train_loss": -12.018043518066406, "global_step": 383355, "epoch": 2281} {"train_loss": -12.332109451293945, "global_step": 383356, "epoch": 2281} {"train_loss": -11.822946548461914, "global_step": 383357, "epoch": 2281} {"train_loss": -11.765108108520508, "global_step": 383358, "epoch": 2281} {"train_loss": -12.171030044555664, "global_step": 383359, "epoch": 2281} {"train_loss": -12.0859375, "global_step": 383360, "epoch": 2281} {"train_loss": -12.399754524230957, "global_step": 383361, "epoch": 2281} {"train_loss": -11.45971393585205, "global_step": 383362, "epoch": 2281} {"train_loss": -11.646537780761719, "global_step": 383363, "epoch": 2281} {"train_loss": -12.24821662902832, "global_step": 383364, "epoch": 2281} {"train_loss": -11.806618690490723, "global_step": 383365, "epoch": 2281} {"train_loss": -11.374732971191406, "global_step": 383366, "epoch": 2281} {"train_loss": -11.63956069946289, "global_step": 383367, "epoch": 2281} {"train_loss": -11.748388290405273, "global_step": 383368, "epoch": 2281} {"train_loss": -11.065021514892578, "global_step": 383369, "epoch": 2281} {"train_loss": -12.278604507446289, "global_step": 383370, "epoch": 2281} {"train_loss": -11.43496036529541, "global_step": 383371, "epoch": 2281} {"train_loss": -11.57791519165039, "global_step": 383372, "epoch": 2281} {"train_loss": -12.25434684753418, "global_step": 383373, "epoch": 2281} {"train_loss": -11.814590454101562, "global_step": 383374, "epoch": 2281} {"train_loss": -11.8933584690094, "global_step": 383375, "epoch": 2281, "val_loss": 293517.375} {"train_loss": -12.057333946228027, "global_step": 383376, "epoch": 2282} {"train_loss": -11.993263244628906, "global_step": 383377, "epoch": 2282} {"train_loss": -12.026067733764648, "global_step": 383378, "epoch": 2282} {"train_loss": -12.395220756530762, "global_step": 383379, "epoch": 2282} {"train_loss": -12.146345138549805, "global_step": 383380, "epoch": 2282} {"train_loss": -11.857547760009766, "global_step": 383381, "epoch": 2282} {"train_loss": -12.300586700439453, "global_step": 383382, "epoch": 2282} {"train_loss": -12.090303421020508, "global_step": 383383, "epoch": 2282} {"train_loss": -12.103595733642578, "global_step": 383384, "epoch": 2282} {"train_loss": -11.890022277832031, "global_step": 383385, "epoch": 2282} {"train_loss": -12.01346206665039, "global_step": 383386, "epoch": 2282} {"train_loss": -11.880273818969727, "global_step": 383387, "epoch": 2282} {"train_loss": -11.804611206054688, "global_step": 383388, "epoch": 2282} {"train_loss": -11.875617980957031, "global_step": 383389, "epoch": 2282} {"train_loss": -12.022452354431152, "global_step": 383390, "epoch": 2282} {"train_loss": -11.822582244873047, "global_step": 383391, "epoch": 2282} {"train_loss": -11.676714897155762, "global_step": 383392, "epoch": 2282} {"train_loss": -11.517885208129883, "global_step": 383393, "epoch": 2282} {"train_loss": -11.857336044311523, "global_step": 383394, "epoch": 2282} {"train_loss": -11.787774085998535, "global_step": 383395, "epoch": 2282} {"train_loss": -12.001420021057129, "global_step": 383396, "epoch": 2282} {"train_loss": -11.5347318649292, "global_step": 383397, "epoch": 2282} {"train_loss": -11.951011657714844, "global_step": 383398, "epoch": 2282} {"train_loss": -11.700838088989258, "global_step": 383399, "epoch": 2282} {"train_loss": -11.292895317077637, "global_step": 383400, "epoch": 2282} {"train_loss": -11.628353118896484, "global_step": 383401, "epoch": 2282} {"train_loss": -11.194039344787598, "global_step": 383402, "epoch": 2282} {"train_loss": -11.460060119628906, "global_step": 383403, "epoch": 2282} {"train_loss": -11.547019958496094, "global_step": 383404, "epoch": 2282} {"train_loss": -11.112098693847656, "global_step": 383405, "epoch": 2282} {"train_loss": -11.241806030273438, "global_step": 383406, "epoch": 2282} {"train_loss": -11.987010955810547, "global_step": 383407, "epoch": 2282} {"train_loss": -11.208765983581543, "global_step": 383408, "epoch": 2282} {"train_loss": -11.874856948852539, "global_step": 383409, "epoch": 2282} {"train_loss": -11.766404151916504, "global_step": 383410, "epoch": 2282} {"train_loss": -11.073253631591797, "global_step": 383411, "epoch": 2282} {"train_loss": -11.634363174438477, "global_step": 383412, "epoch": 2282} {"train_loss": -10.664349555969238, "global_step": 383413, "epoch": 2282} {"train_loss": -11.87257194519043, "global_step": 383414, "epoch": 2282} {"train_loss": -10.322858810424805, "global_step": 383415, "epoch": 2282} {"train_loss": -11.32665729522705, "global_step": 383416, "epoch": 2282} {"train_loss": -11.17782211303711, "global_step": 383417, "epoch": 2282} {"train_loss": -10.651762008666992, "global_step": 383418, "epoch": 2282} {"train_loss": -10.998367309570312, "global_step": 383419, "epoch": 2282} {"train_loss": -10.659555435180664, "global_step": 383420, "epoch": 2282} {"train_loss": -10.111228942871094, "global_step": 383421, "epoch": 2282} {"train_loss": -11.530726432800293, "global_step": 383422, "epoch": 2282} {"train_loss": -9.8505859375, "global_step": 383423, "epoch": 2282} {"train_loss": -11.109878540039062, "global_step": 383424, "epoch": 2282} {"train_loss": -9.609687805175781, "global_step": 383425, "epoch": 2282} {"train_loss": -10.429147720336914, "global_step": 383426, "epoch": 2282} {"train_loss": -10.774646759033203, "global_step": 383427, "epoch": 2282} {"train_loss": -10.428537368774414, "global_step": 383428, "epoch": 2282} {"train_loss": -10.194526672363281, "global_step": 383429, "epoch": 2282} {"train_loss": -10.970871925354004, "global_step": 383430, "epoch": 2282} {"train_loss": -10.484415054321289, "global_step": 383431, "epoch": 2282} {"train_loss": -10.798345565795898, "global_step": 383432, "epoch": 2282} {"train_loss": -10.717780113220215, "global_step": 383433, "epoch": 2282} {"train_loss": -11.889314651489258, "global_step": 383434, "epoch": 2282} {"train_loss": -10.341660499572754, "global_step": 383435, "epoch": 2282} {"train_loss": -11.998357772827148, "global_step": 383436, "epoch": 2282} {"train_loss": -11.070761680603027, "global_step": 383437, "epoch": 2282} {"train_loss": -11.410655975341797, "global_step": 383438, "epoch": 2282} {"train_loss": -10.707181930541992, "global_step": 383439, "epoch": 2282} {"train_loss": -11.514175415039062, "global_step": 383440, "epoch": 2282} {"train_loss": -10.87495231628418, "global_step": 383441, "epoch": 2282} {"train_loss": -12.08653450012207, "global_step": 383442, "epoch": 2282} {"train_loss": -11.081486701965332, "global_step": 383443, "epoch": 2282} {"train_loss": -11.73417854309082, "global_step": 383444, "epoch": 2282} {"train_loss": -11.64027214050293, "global_step": 383445, "epoch": 2282} {"train_loss": -11.61070442199707, "global_step": 383446, "epoch": 2282} {"train_loss": -11.786336898803711, "global_step": 383447, "epoch": 2282} {"train_loss": -11.546606063842773, "global_step": 383448, "epoch": 2282} {"train_loss": -11.694398880004883, "global_step": 383449, "epoch": 2282} {"train_loss": -12.019430160522461, "global_step": 383450, "epoch": 2282} {"train_loss": -11.520626068115234, "global_step": 383451, "epoch": 2282} {"train_loss": -12.02491283416748, "global_step": 383452, "epoch": 2282} {"train_loss": -11.653977394104004, "global_step": 383453, "epoch": 2282} {"train_loss": -11.764480590820312, "global_step": 383454, "epoch": 2282} {"train_loss": -12.052277565002441, "global_step": 383455, "epoch": 2282} {"train_loss": -11.80770492553711, "global_step": 383456, "epoch": 2282} {"train_loss": -12.157825469970703, "global_step": 383457, "epoch": 2282} {"train_loss": -11.638862609863281, "global_step": 383458, "epoch": 2282} {"train_loss": -12.207159042358398, "global_step": 383459, "epoch": 2282} {"train_loss": -12.182321548461914, "global_step": 383460, "epoch": 2282} {"train_loss": -12.248907089233398, "global_step": 383461, "epoch": 2282} {"train_loss": -12.200641632080078, "global_step": 383462, "epoch": 2282} {"train_loss": -12.22993278503418, "global_step": 383463, "epoch": 2282} {"train_loss": -12.172853469848633, "global_step": 383464, "epoch": 2282} {"train_loss": -12.36251163482666, "global_step": 383465, "epoch": 2282} {"train_loss": -12.446733474731445, "global_step": 383466, "epoch": 2282} {"train_loss": -12.06185245513916, "global_step": 383467, "epoch": 2282} {"train_loss": -12.3513822555542, "global_step": 383468, "epoch": 2282} {"train_loss": -12.293962478637695, "global_step": 383469, "epoch": 2282} {"train_loss": -12.296581268310547, "global_step": 383470, "epoch": 2282} {"train_loss": -12.197454452514648, "global_step": 383471, "epoch": 2282} {"train_loss": -12.30256175994873, "global_step": 383472, "epoch": 2282} {"train_loss": -12.251981735229492, "global_step": 383473, "epoch": 2282} {"train_loss": -12.371047973632812, "global_step": 383474, "epoch": 2282} {"train_loss": -12.313501358032227, "global_step": 383475, "epoch": 2282} {"train_loss": -12.479836463928223, "global_step": 383476, "epoch": 2282} {"train_loss": -12.333513259887695, "global_step": 383477, "epoch": 2282} {"train_loss": -12.271158218383789, "global_step": 383478, "epoch": 2282} {"train_loss": -12.243688583374023, "global_step": 383479, "epoch": 2282} {"train_loss": -12.247934341430664, "global_step": 383480, "epoch": 2282} {"train_loss": -12.271404266357422, "global_step": 383481, "epoch": 2282} {"train_loss": -12.259393692016602, "global_step": 383482, "epoch": 2282} {"train_loss": -12.281536102294922, "global_step": 383483, "epoch": 2282} {"train_loss": -12.415416717529297, "global_step": 383484, "epoch": 2282} {"train_loss": -12.495383262634277, "global_step": 383485, "epoch": 2282} {"train_loss": -12.431562423706055, "global_step": 383486, "epoch": 2282} {"train_loss": -12.31570053100586, "global_step": 383487, "epoch": 2282} {"train_loss": -12.502481460571289, "global_step": 383488, "epoch": 2282} {"train_loss": -12.04609489440918, "global_step": 383489, "epoch": 2282} {"train_loss": -12.541727066040039, "global_step": 383490, "epoch": 2282} {"train_loss": -12.582284927368164, "global_step": 383491, "epoch": 2282} {"train_loss": -12.466423034667969, "global_step": 383492, "epoch": 2282} {"train_loss": -12.662079811096191, "global_step": 383493, "epoch": 2282} {"train_loss": -12.606062889099121, "global_step": 383494, "epoch": 2282} {"train_loss": -12.495317459106445, "global_step": 383495, "epoch": 2282} {"train_loss": -12.454605102539062, "global_step": 383496, "epoch": 2282} {"train_loss": -12.445352554321289, "global_step": 383497, "epoch": 2282} {"train_loss": -12.423479080200195, "global_step": 383498, "epoch": 2282} {"train_loss": -12.482952117919922, "global_step": 383499, "epoch": 2282} {"train_loss": -12.373838424682617, "global_step": 383500, "epoch": 2282} {"train_loss": -12.584953308105469, "global_step": 383501, "epoch": 2282} {"train_loss": -12.489824295043945, "global_step": 383502, "epoch": 2282} {"train_loss": -12.269835472106934, "global_step": 383503, "epoch": 2282} {"train_loss": -12.58624267578125, "global_step": 383504, "epoch": 2282} {"train_loss": -12.604938507080078, "global_step": 383505, "epoch": 2282} {"train_loss": -12.420829772949219, "global_step": 383506, "epoch": 2282} {"train_loss": -12.793675422668457, "global_step": 383507, "epoch": 2282} {"train_loss": -12.618696212768555, "global_step": 383508, "epoch": 2282} {"train_loss": -12.570409774780273, "global_step": 383509, "epoch": 2282} {"train_loss": -12.548667907714844, "global_step": 383510, "epoch": 2282} {"train_loss": -12.512718200683594, "global_step": 383511, "epoch": 2282} {"train_loss": -12.76342487335205, "global_step": 383512, "epoch": 2282} {"train_loss": -12.449893951416016, "global_step": 383513, "epoch": 2282} {"train_loss": -12.73575210571289, "global_step": 383514, "epoch": 2282} {"train_loss": -12.650932312011719, "global_step": 383515, "epoch": 2282} {"train_loss": -12.654521942138672, "global_step": 383516, "epoch": 2282} {"train_loss": -12.64101791381836, "global_step": 383517, "epoch": 2282} {"train_loss": -12.475908279418945, "global_step": 383518, "epoch": 2282} {"train_loss": -12.531630516052246, "global_step": 383519, "epoch": 2282} {"train_loss": -12.297307968139648, "global_step": 383520, "epoch": 2282} {"train_loss": -12.503226280212402, "global_step": 383521, "epoch": 2282} {"train_loss": -12.66057300567627, "global_step": 383522, "epoch": 2282} {"train_loss": -12.155417442321777, "global_step": 383523, "epoch": 2282} {"train_loss": -12.346810340881348, "global_step": 383524, "epoch": 2282} {"train_loss": -12.105223655700684, "global_step": 383525, "epoch": 2282} {"train_loss": -12.25118637084961, "global_step": 383526, "epoch": 2282} {"train_loss": -12.52134895324707, "global_step": 383527, "epoch": 2282} {"train_loss": -12.224100112915039, "global_step": 383528, "epoch": 2282} {"train_loss": -12.784019470214844, "global_step": 383529, "epoch": 2282} {"train_loss": -12.095498085021973, "global_step": 383530, "epoch": 2282} {"train_loss": -12.312553405761719, "global_step": 383531, "epoch": 2282} {"train_loss": -12.537352561950684, "global_step": 383532, "epoch": 2282} {"train_loss": -11.883014678955078, "global_step": 383533, "epoch": 2282} {"train_loss": -12.401294708251953, "global_step": 383534, "epoch": 2282} {"train_loss": -12.503921508789062, "global_step": 383535, "epoch": 2282} {"train_loss": -12.383975982666016, "global_step": 383536, "epoch": 2282} {"train_loss": -12.401596069335938, "global_step": 383537, "epoch": 2282} {"train_loss": -12.055448532104492, "global_step": 383538, "epoch": 2282} {"train_loss": -11.655519485473633, "global_step": 383539, "epoch": 2282} {"train_loss": -12.444892883300781, "global_step": 383540, "epoch": 2282} {"train_loss": -12.130270004272461, "global_step": 383541, "epoch": 2282} {"train_loss": -12.378552436828613, "global_step": 383542, "epoch": 2282} {"train_loss": -11.920894151642209, "global_step": 383543, "epoch": 2282, "val_loss": 294042.8125} {"train_loss": -12.298651695251465, "global_step": 383544, "epoch": 2283} {"train_loss": -12.593849182128906, "global_step": 383545, "epoch": 2283} {"train_loss": -12.451555252075195, "global_step": 383546, "epoch": 2283} {"train_loss": -12.326645851135254, "global_step": 383547, "epoch": 2283} {"train_loss": -12.593372344970703, "global_step": 383548, "epoch": 2283} {"train_loss": -12.614701271057129, "global_step": 383549, "epoch": 2283} {"train_loss": -12.387027740478516, "global_step": 383550, "epoch": 2283} {"train_loss": -12.515368461608887, "global_step": 383551, "epoch": 2283} {"train_loss": -12.672920227050781, "global_step": 383552, "epoch": 2283} {"train_loss": -12.245878219604492, "global_step": 383553, "epoch": 2283} {"train_loss": -12.722223281860352, "global_step": 383554, "epoch": 2283} {"train_loss": -11.875740051269531, "global_step": 383555, "epoch": 2283} {"train_loss": -11.631474494934082, "global_step": 383556, "epoch": 2283} {"train_loss": -12.03890323638916, "global_step": 383557, "epoch": 2283} {"train_loss": -12.120080947875977, "global_step": 383558, "epoch": 2283} {"train_loss": -11.951884269714355, "global_step": 383559, "epoch": 2283} {"train_loss": -11.198174476623535, "global_step": 383560, "epoch": 2283} {"train_loss": -11.700338363647461, "global_step": 383561, "epoch": 2283} {"train_loss": -12.546958923339844, "global_step": 383562, "epoch": 2283} {"train_loss": -11.805726051330566, "global_step": 383563, "epoch": 2283} {"train_loss": -12.173032760620117, "global_step": 383564, "epoch": 2283} {"train_loss": -11.216628074645996, "global_step": 383565, "epoch": 2283} {"train_loss": -11.607743263244629, "global_step": 383566, "epoch": 2283} {"train_loss": -9.18387222290039, "global_step": 383567, "epoch": 2283} {"train_loss": -11.703902244567871, "global_step": 383568, "epoch": 2283} {"train_loss": -9.539328575134277, "global_step": 383569, "epoch": 2283} {"train_loss": -9.121916770935059, "global_step": 383570, "epoch": 2283} {"train_loss": -9.197396278381348, "global_step": 383571, "epoch": 2283} {"train_loss": -10.765384674072266, "global_step": 383572, "epoch": 2283} {"train_loss": -7.429039478302002, "global_step": 383573, "epoch": 2283} {"train_loss": -8.127233505249023, "global_step": 383574, "epoch": 2283} {"train_loss": -8.777472496032715, "global_step": 383575, "epoch": 2283} {"train_loss": -10.23067855834961, "global_step": 383576, "epoch": 2283} {"train_loss": -7.438549041748047, "global_step": 383577, "epoch": 2283} {"train_loss": -9.571925163269043, "global_step": 383578, "epoch": 2283} {"train_loss": -8.285959243774414, "global_step": 383579, "epoch": 2283} {"train_loss": -9.627129554748535, "global_step": 383580, "epoch": 2283} {"train_loss": -9.169185638427734, "global_step": 383581, "epoch": 2283} {"train_loss": -10.410208702087402, "global_step": 383582, "epoch": 2283} {"train_loss": -9.359171867370605, "global_step": 383583, "epoch": 2283} {"train_loss": -11.374555587768555, "global_step": 383584, "epoch": 2283} {"train_loss": -10.283740043640137, "global_step": 383585, "epoch": 2283} {"train_loss": -11.323358535766602, "global_step": 383586, "epoch": 2283} {"train_loss": -10.01272201538086, "global_step": 383587, "epoch": 2283} {"train_loss": -10.9645414352417, "global_step": 383588, "epoch": 2283} {"train_loss": -10.344947814941406, "global_step": 383589, "epoch": 2283} {"train_loss": -10.594743728637695, "global_step": 383590, "epoch": 2283} {"train_loss": -11.191866874694824, "global_step": 383591, "epoch": 2283} {"train_loss": -10.770317077636719, "global_step": 383592, "epoch": 2283} {"train_loss": -10.972485542297363, "global_step": 383593, "epoch": 2283} {"train_loss": -11.722047805786133, "global_step": 383594, "epoch": 2283} {"train_loss": -11.335688591003418, "global_step": 383595, "epoch": 2283} {"train_loss": -11.906900405883789, "global_step": 383596, "epoch": 2283} {"train_loss": -11.625182151794434, "global_step": 383597, "epoch": 2283} {"train_loss": -11.741575241088867, "global_step": 383598, "epoch": 2283} {"train_loss": -11.349311828613281, "global_step": 383599, "epoch": 2283} {"train_loss": -11.854999542236328, "global_step": 383600, "epoch": 2283} {"train_loss": -11.634851455688477, "global_step": 383601, "epoch": 2283} {"train_loss": -11.918464660644531, "global_step": 383602, "epoch": 2283} {"train_loss": -11.982367515563965, "global_step": 383603, "epoch": 2283} {"train_loss": -11.743303298950195, "global_step": 383604, "epoch": 2283} {"train_loss": -11.74613094329834, "global_step": 383605, "epoch": 2283} {"train_loss": -11.807147026062012, "global_step": 383606, "epoch": 2283} {"train_loss": -11.816059112548828, "global_step": 383607, "epoch": 2283} {"train_loss": -11.87131118774414, "global_step": 383608, "epoch": 2283} {"train_loss": -12.056132316589355, "global_step": 383609, "epoch": 2283} {"train_loss": -12.156850814819336, "global_step": 383610, "epoch": 2283} {"train_loss": -12.113218307495117, "global_step": 383611, "epoch": 2283} {"train_loss": -11.990409851074219, "global_step": 383612, "epoch": 2283} {"train_loss": -12.013809204101562, "global_step": 383613, "epoch": 2283} {"train_loss": -12.168913841247559, "global_step": 383614, "epoch": 2283} {"train_loss": -12.1719388961792, "global_step": 383615, "epoch": 2283} {"train_loss": -12.366162300109863, "global_step": 383616, "epoch": 2283} {"train_loss": -12.090476989746094, "global_step": 383617, "epoch": 2283} {"train_loss": -12.169448852539062, "global_step": 383618, "epoch": 2283} {"train_loss": -12.115341186523438, "global_step": 383619, "epoch": 2283} {"train_loss": -12.250076293945312, "global_step": 383620, "epoch": 2283} {"train_loss": -12.21833324432373, "global_step": 383621, "epoch": 2283} {"train_loss": -12.12725830078125, "global_step": 383622, "epoch": 2283} {"train_loss": -12.19141960144043, "global_step": 383623, "epoch": 2283} {"train_loss": -12.280439376831055, "global_step": 383624, "epoch": 2283} {"train_loss": -12.279088020324707, "global_step": 383625, "epoch": 2283} {"train_loss": -12.37257194519043, "global_step": 383626, "epoch": 2283} {"train_loss": -12.213727951049805, "global_step": 383627, "epoch": 2283} {"train_loss": -12.399110794067383, "global_step": 383628, "epoch": 2283} {"train_loss": -12.313821792602539, "global_step": 383629, "epoch": 2283} {"train_loss": -12.340940475463867, "global_step": 383630, "epoch": 2283} {"train_loss": -12.622269630432129, "global_step": 383631, "epoch": 2283} {"train_loss": -12.206136703491211, "global_step": 383632, "epoch": 2283} {"train_loss": -12.551430702209473, "global_step": 383633, "epoch": 2283} {"train_loss": -12.279531478881836, "global_step": 383634, "epoch": 2283} {"train_loss": -12.560997009277344, "global_step": 383635, "epoch": 2283} {"train_loss": -12.550758361816406, "global_step": 383636, "epoch": 2283} {"train_loss": -12.40020751953125, "global_step": 383637, "epoch": 2283} {"train_loss": -12.350581169128418, "global_step": 383638, "epoch": 2283} {"train_loss": -12.17822265625, "global_step": 383639, "epoch": 2283} {"train_loss": -12.39619255065918, "global_step": 383640, "epoch": 2283} {"train_loss": -12.517501831054688, "global_step": 383641, "epoch": 2283} {"train_loss": -12.5581636428833, "global_step": 383642, "epoch": 2283} {"train_loss": -12.306819915771484, "global_step": 383643, "epoch": 2283} {"train_loss": -12.676498413085938, "global_step": 383644, "epoch": 2283} {"train_loss": -12.574396133422852, "global_step": 383645, "epoch": 2283} {"train_loss": -12.44044303894043, "global_step": 383646, "epoch": 2283} {"train_loss": -12.086762428283691, "global_step": 383647, "epoch": 2283} {"train_loss": -12.379348754882812, "global_step": 383648, "epoch": 2283} {"train_loss": -12.50422477722168, "global_step": 383649, "epoch": 2283} {"train_loss": -12.373929977416992, "global_step": 383650, "epoch": 2283} {"train_loss": -12.561117172241211, "global_step": 383651, "epoch": 2283} {"train_loss": -12.338886260986328, "global_step": 383652, "epoch": 2283} {"train_loss": -12.244699478149414, "global_step": 383653, "epoch": 2283} {"train_loss": -12.61406421661377, "global_step": 383654, "epoch": 2283} {"train_loss": -12.294801712036133, "global_step": 383655, "epoch": 2283} {"train_loss": -12.34931468963623, "global_step": 383656, "epoch": 2283} {"train_loss": -12.473060607910156, "global_step": 383657, "epoch": 2283} {"train_loss": -12.458202362060547, "global_step": 383658, "epoch": 2283} {"train_loss": -12.275218963623047, "global_step": 383659, "epoch": 2283} {"train_loss": -12.674057006835938, "global_step": 383660, "epoch": 2283} {"train_loss": -12.441350936889648, "global_step": 383661, "epoch": 2283} {"train_loss": -12.521331787109375, "global_step": 383662, "epoch": 2283} {"train_loss": -12.825138092041016, "global_step": 383663, "epoch": 2283} {"train_loss": -12.561450004577637, "global_step": 383664, "epoch": 2283} {"train_loss": -12.511946678161621, "global_step": 383665, "epoch": 2283} {"train_loss": -12.636938095092773, "global_step": 383666, "epoch": 2283} {"train_loss": -12.715402603149414, "global_step": 383667, "epoch": 2283} {"train_loss": -12.530420303344727, "global_step": 383668, "epoch": 2283} {"train_loss": -12.454814910888672, "global_step": 383669, "epoch": 2283} {"train_loss": -12.66240119934082, "global_step": 383670, "epoch": 2283} {"train_loss": -12.478189468383789, "global_step": 383671, "epoch": 2283} {"train_loss": -12.591571807861328, "global_step": 383672, "epoch": 2283} {"train_loss": -12.564311981201172, "global_step": 383673, "epoch": 2283} {"train_loss": -12.640296936035156, "global_step": 383674, "epoch": 2283} {"train_loss": -12.60163688659668, "global_step": 383675, "epoch": 2283} {"train_loss": -12.53997802734375, "global_step": 383676, "epoch": 2283} {"train_loss": -12.6956787109375, "global_step": 383677, "epoch": 2283} {"train_loss": -12.548242568969727, "global_step": 383678, "epoch": 2283} {"train_loss": -12.778023719787598, "global_step": 383679, "epoch": 2283} {"train_loss": -12.494409561157227, "global_step": 383680, "epoch": 2283} {"train_loss": -12.589585304260254, "global_step": 383681, "epoch": 2283} {"train_loss": -12.793035507202148, "global_step": 383682, "epoch": 2283} {"train_loss": -12.719478607177734, "global_step": 383683, "epoch": 2283} {"train_loss": -12.471885681152344, "global_step": 383684, "epoch": 2283} {"train_loss": -12.2703275680542, "global_step": 383685, "epoch": 2283} {"train_loss": -11.791596412658691, "global_step": 383686, "epoch": 2283} {"train_loss": -12.769490242004395, "global_step": 383687, "epoch": 2283} {"train_loss": -12.103723526000977, "global_step": 383688, "epoch": 2283} {"train_loss": -11.919963836669922, "global_step": 383689, "epoch": 2283} {"train_loss": -11.577381134033203, "global_step": 383690, "epoch": 2283} {"train_loss": -11.665372848510742, "global_step": 383691, "epoch": 2283} {"train_loss": -12.363182067871094, "global_step": 383692, "epoch": 2283} {"train_loss": -12.220626831054688, "global_step": 383693, "epoch": 2283} {"train_loss": -11.997711181640625, "global_step": 383694, "epoch": 2283} {"train_loss": -12.122950553894043, "global_step": 383695, "epoch": 2283} {"train_loss": -11.514840126037598, "global_step": 383696, "epoch": 2283} {"train_loss": -8.818465232849121, "global_step": 383697, "epoch": 2283} {"train_loss": -11.644389152526855, "global_step": 383698, "epoch": 2283} {"train_loss": -9.050886154174805, "global_step": 383699, "epoch": 2283} {"train_loss": -10.317048072814941, "global_step": 383700, "epoch": 2283} {"train_loss": -8.426758766174316, "global_step": 383701, "epoch": 2283} {"train_loss": -8.612493515014648, "global_step": 383702, "epoch": 2283} {"train_loss": -7.209779739379883, "global_step": 383703, "epoch": 2283} {"train_loss": -8.54047966003418, "global_step": 383704, "epoch": 2283} {"train_loss": -7.640440940856934, "global_step": 383705, "epoch": 2283} {"train_loss": -7.702204704284668, "global_step": 383706, "epoch": 2283} {"train_loss": -9.191734313964844, "global_step": 383707, "epoch": 2283} {"train_loss": -9.144525527954102, "global_step": 383708, "epoch": 2283} {"train_loss": -10.112447738647461, "global_step": 383709, "epoch": 2283} {"train_loss": -9.665539741516113, "global_step": 383710, "epoch": 2283} {"train_loss": -11.575954559303465, "global_step": 383711, "epoch": 2283, "val_loss": 286887.15625} {"train_loss": -10.232389450073242, "global_step": 383712, "epoch": 2284} {"train_loss": -9.122770309448242, "global_step": 383713, "epoch": 2284} {"train_loss": -10.696587562561035, "global_step": 383714, "epoch": 2284} {"train_loss": -10.490549087524414, "global_step": 383715, "epoch": 2284} {"train_loss": -11.276185989379883, "global_step": 383716, "epoch": 2284} {"train_loss": -11.368165016174316, "global_step": 383717, "epoch": 2284} {"train_loss": -11.137584686279297, "global_step": 383718, "epoch": 2284} {"train_loss": -11.9772310256958, "global_step": 383719, "epoch": 2284} {"train_loss": -11.507137298583984, "global_step": 383720, "epoch": 2284} {"train_loss": -11.395912170410156, "global_step": 383721, "epoch": 2284} {"train_loss": -11.933713912963867, "global_step": 383722, "epoch": 2284} {"train_loss": -11.766546249389648, "global_step": 383723, "epoch": 2284} {"train_loss": -12.026987075805664, "global_step": 383724, "epoch": 2284} {"train_loss": -11.626490592956543, "global_step": 383725, "epoch": 2284} {"train_loss": -11.684415817260742, "global_step": 383726, "epoch": 2284} {"train_loss": -11.449687004089355, "global_step": 383727, "epoch": 2284} {"train_loss": -11.891986846923828, "global_step": 383728, "epoch": 2284} {"train_loss": -11.939959526062012, "global_step": 383729, "epoch": 2284} {"train_loss": -11.942490577697754, "global_step": 383730, "epoch": 2284} {"train_loss": -12.052499771118164, "global_step": 383731, "epoch": 2284} {"train_loss": -12.117622375488281, "global_step": 383732, "epoch": 2284} {"train_loss": -11.986506462097168, "global_step": 383733, "epoch": 2284} {"train_loss": -11.87918472290039, "global_step": 383734, "epoch": 2284} {"train_loss": -12.080411911010742, "global_step": 383735, "epoch": 2284} {"train_loss": -12.406362533569336, "global_step": 383736, "epoch": 2284} {"train_loss": -12.20840072631836, "global_step": 383737, "epoch": 2284} {"train_loss": -12.222763061523438, "global_step": 383738, "epoch": 2284} {"train_loss": -12.131383895874023, "global_step": 383739, "epoch": 2284} {"train_loss": -12.092504501342773, "global_step": 383740, "epoch": 2284} {"train_loss": -12.196969032287598, "global_step": 383741, "epoch": 2284} {"train_loss": -12.095674514770508, "global_step": 383742, "epoch": 2284} {"train_loss": -12.219307899475098, "global_step": 383743, "epoch": 2284} {"train_loss": -12.437080383300781, "global_step": 383744, "epoch": 2284} {"train_loss": -12.170120239257812, "global_step": 383745, "epoch": 2284} {"train_loss": -12.242273330688477, "global_step": 383746, "epoch": 2284} {"train_loss": -12.203628540039062, "global_step": 383747, "epoch": 2284} {"train_loss": -12.440095901489258, "global_step": 383748, "epoch": 2284} {"train_loss": -12.02546501159668, "global_step": 383749, "epoch": 2284} {"train_loss": -12.36434555053711, "global_step": 383750, "epoch": 2284} {"train_loss": -12.17624282836914, "global_step": 383751, "epoch": 2284} {"train_loss": -12.22213363647461, "global_step": 383752, "epoch": 2284} {"train_loss": -12.233935356140137, "global_step": 383753, "epoch": 2284} {"train_loss": -12.327569007873535, "global_step": 383754, "epoch": 2284} {"train_loss": -12.57083511352539, "global_step": 383755, "epoch": 2284} {"train_loss": -12.526410102844238, "global_step": 383756, "epoch": 2284} {"train_loss": -12.545072555541992, "global_step": 383757, "epoch": 2284} {"train_loss": -12.54293155670166, "global_step": 383758, "epoch": 2284} {"train_loss": -12.75699234008789, "global_step": 383759, "epoch": 2284} {"train_loss": -12.64085578918457, "global_step": 383760, "epoch": 2284} {"train_loss": -12.478761672973633, "global_step": 383761, "epoch": 2284} {"train_loss": -12.589963912963867, "global_step": 383762, "epoch": 2284} {"train_loss": -12.64896297454834, "global_step": 383763, "epoch": 2284} {"train_loss": -12.550237655639648, "global_step": 383764, "epoch": 2284} {"train_loss": -12.365013122558594, "global_step": 383765, "epoch": 2284} {"train_loss": -12.487945556640625, "global_step": 383766, "epoch": 2284} {"train_loss": -12.562337875366211, "global_step": 383767, "epoch": 2284} {"train_loss": -12.531501770019531, "global_step": 383768, "epoch": 2284} {"train_loss": -12.39268684387207, "global_step": 383769, "epoch": 2284} {"train_loss": -12.491146087646484, "global_step": 383770, "epoch": 2284} {"train_loss": -12.260318756103516, "global_step": 383771, "epoch": 2284} {"train_loss": -12.488747596740723, "global_step": 383772, "epoch": 2284} {"train_loss": -12.514997482299805, "global_step": 383773, "epoch": 2284} {"train_loss": -12.227089881896973, "global_step": 383774, "epoch": 2284} {"train_loss": -12.763898849487305, "global_step": 383775, "epoch": 2284} {"train_loss": -12.406288146972656, "global_step": 383776, "epoch": 2284} {"train_loss": -12.368061065673828, "global_step": 383777, "epoch": 2284} {"train_loss": -12.429065704345703, "global_step": 383778, "epoch": 2284} {"train_loss": -12.450508117675781, "global_step": 383779, "epoch": 2284} {"train_loss": -11.828723907470703, "global_step": 383780, "epoch": 2284} {"train_loss": -12.362573623657227, "global_step": 383781, "epoch": 2284} {"train_loss": -12.274770736694336, "global_step": 383782, "epoch": 2284} {"train_loss": -10.92002010345459, "global_step": 383783, "epoch": 2284} {"train_loss": -11.692407608032227, "global_step": 383784, "epoch": 2284} {"train_loss": -12.404668807983398, "global_step": 383785, "epoch": 2284} {"train_loss": -11.108083724975586, "global_step": 383786, "epoch": 2284} {"train_loss": -11.374967575073242, "global_step": 383787, "epoch": 2284} {"train_loss": -12.050817489624023, "global_step": 383788, "epoch": 2284} {"train_loss": -12.243268013000488, "global_step": 383789, "epoch": 2284} {"train_loss": -11.666693687438965, "global_step": 383790, "epoch": 2284} {"train_loss": -12.378146171569824, "global_step": 383791, "epoch": 2284} {"train_loss": -12.260339736938477, "global_step": 383792, "epoch": 2284} {"train_loss": -12.432782173156738, "global_step": 383793, "epoch": 2284} {"train_loss": -12.322362899780273, "global_step": 383794, "epoch": 2284} {"train_loss": -12.525588989257812, "global_step": 383795, "epoch": 2284} {"train_loss": -12.12543773651123, "global_step": 383796, "epoch": 2284} {"train_loss": -12.015264511108398, "global_step": 383797, "epoch": 2284} {"train_loss": -12.006429672241211, "global_step": 383798, "epoch": 2284} {"train_loss": -11.605751037597656, "global_step": 383799, "epoch": 2284} {"train_loss": -11.817941665649414, "global_step": 383800, "epoch": 2284} {"train_loss": -11.040660858154297, "global_step": 383801, "epoch": 2284} {"train_loss": -12.291620254516602, "global_step": 383802, "epoch": 2284} {"train_loss": -10.62612247467041, "global_step": 383803, "epoch": 2284} {"train_loss": -11.877557754516602, "global_step": 383804, "epoch": 2284} {"train_loss": -10.775354385375977, "global_step": 383805, "epoch": 2284} {"train_loss": -10.288344383239746, "global_step": 383806, "epoch": 2284} {"train_loss": -11.498580932617188, "global_step": 383807, "epoch": 2284} {"train_loss": -10.174372673034668, "global_step": 383808, "epoch": 2284} {"train_loss": -11.83401870727539, "global_step": 383809, "epoch": 2284} {"train_loss": -11.590150833129883, "global_step": 383810, "epoch": 2284} {"train_loss": -11.905805587768555, "global_step": 383811, "epoch": 2284} {"train_loss": -12.248444557189941, "global_step": 383812, "epoch": 2284} {"train_loss": -11.925704956054688, "global_step": 383813, "epoch": 2284} {"train_loss": -12.468099594116211, "global_step": 383814, "epoch": 2284} {"train_loss": -12.365789413452148, "global_step": 383815, "epoch": 2284} {"train_loss": -12.298151016235352, "global_step": 383816, "epoch": 2284} {"train_loss": -12.237507820129395, "global_step": 383817, "epoch": 2284} {"train_loss": -12.029925346374512, "global_step": 383818, "epoch": 2284} {"train_loss": -11.625405311584473, "global_step": 383819, "epoch": 2284} {"train_loss": -12.027311325073242, "global_step": 383820, "epoch": 2284} {"train_loss": -11.916555404663086, "global_step": 383821, "epoch": 2284} {"train_loss": -12.038089752197266, "global_step": 383822, "epoch": 2284} {"train_loss": -12.16330623626709, "global_step": 383823, "epoch": 2284} {"train_loss": -12.257616996765137, "global_step": 383824, "epoch": 2284} {"train_loss": -12.26231575012207, "global_step": 383825, "epoch": 2284} {"train_loss": -12.325254440307617, "global_step": 383826, "epoch": 2284} {"train_loss": -12.15673542022705, "global_step": 383827, "epoch": 2284} {"train_loss": -12.268451690673828, "global_step": 383828, "epoch": 2284} {"train_loss": -12.083137512207031, "global_step": 383829, "epoch": 2284} {"train_loss": -12.301850318908691, "global_step": 383830, "epoch": 2284} {"train_loss": -12.349435806274414, "global_step": 383831, "epoch": 2284} {"train_loss": -12.46294116973877, "global_step": 383832, "epoch": 2284} {"train_loss": -12.109325408935547, "global_step": 383833, "epoch": 2284} {"train_loss": -12.424783706665039, "global_step": 383834, "epoch": 2284} {"train_loss": -11.990127563476562, "global_step": 383835, "epoch": 2284} {"train_loss": -12.27151107788086, "global_step": 383836, "epoch": 2284} {"train_loss": -12.004537582397461, "global_step": 383837, "epoch": 2284} {"train_loss": -12.49769115447998, "global_step": 383838, "epoch": 2284} {"train_loss": -12.388641357421875, "global_step": 383839, "epoch": 2284} {"train_loss": -12.495046615600586, "global_step": 383840, "epoch": 2284} {"train_loss": -12.41724967956543, "global_step": 383841, "epoch": 2284} {"train_loss": -12.377218246459961, "global_step": 383842, "epoch": 2284} {"train_loss": -12.365501403808594, "global_step": 383843, "epoch": 2284} {"train_loss": -12.167587280273438, "global_step": 383844, "epoch": 2284} {"train_loss": -12.31972885131836, "global_step": 383845, "epoch": 2284} {"train_loss": -12.176247596740723, "global_step": 383846, "epoch": 2284} {"train_loss": -11.353650093078613, "global_step": 383847, "epoch": 2284} {"train_loss": -11.970232009887695, "global_step": 383848, "epoch": 2284} {"train_loss": -12.1474609375, "global_step": 383849, "epoch": 2284} {"train_loss": -11.207603454589844, "global_step": 383850, "epoch": 2284} {"train_loss": -11.921165466308594, "global_step": 383851, "epoch": 2284} {"train_loss": -12.014566421508789, "global_step": 383852, "epoch": 2284} {"train_loss": -10.98459529876709, "global_step": 383853, "epoch": 2284} {"train_loss": -12.315221786499023, "global_step": 383854, "epoch": 2284} {"train_loss": -12.025986671447754, "global_step": 383855, "epoch": 2284} {"train_loss": -11.81355094909668, "global_step": 383856, "epoch": 2284} {"train_loss": -12.660562515258789, "global_step": 383857, "epoch": 2284} {"train_loss": -11.58820629119873, "global_step": 383858, "epoch": 2284} {"train_loss": -12.293733596801758, "global_step": 383859, "epoch": 2284} {"train_loss": -11.397640228271484, "global_step": 383860, "epoch": 2284} {"train_loss": -12.04731559753418, "global_step": 383861, "epoch": 2284} {"train_loss": -11.963937759399414, "global_step": 383862, "epoch": 2284} {"train_loss": -11.453023910522461, "global_step": 383863, "epoch": 2284} {"train_loss": -11.554947853088379, "global_step": 383864, "epoch": 2284} {"train_loss": -11.453777313232422, "global_step": 383865, "epoch": 2284} {"train_loss": -10.953031539916992, "global_step": 383866, "epoch": 2284} {"train_loss": -11.031350135803223, "global_step": 383867, "epoch": 2284} {"train_loss": -11.74896240234375, "global_step": 383868, "epoch": 2284} {"train_loss": -11.747695922851562, "global_step": 383869, "epoch": 2284} {"train_loss": -10.714061737060547, "global_step": 383870, "epoch": 2284} {"train_loss": -12.094625473022461, "global_step": 383871, "epoch": 2284} {"train_loss": -11.566133499145508, "global_step": 383872, "epoch": 2284} {"train_loss": -12.208013534545898, "global_step": 383873, "epoch": 2284} {"train_loss": -12.023969650268555, "global_step": 383874, "epoch": 2284} {"train_loss": -11.811281204223633, "global_step": 383875, "epoch": 2284} {"train_loss": -11.918834686279297, "global_step": 383876, "epoch": 2284} {"train_loss": -12.18614673614502, "global_step": 383877, "epoch": 2284} {"train_loss": -12.21799087524414, "global_step": 383878, "epoch": 2284} {"train_loss": -11.977434379713875, "global_step": 383879, "epoch": 2284, "val_loss": 293051.375} {"train_loss": -12.223213195800781, "global_step": 383880, "epoch": 2285} {"train_loss": -12.427024841308594, "global_step": 383881, "epoch": 2285} {"train_loss": -12.302472114562988, "global_step": 383882, "epoch": 2285} {"train_loss": -12.342560768127441, "global_step": 383883, "epoch": 2285} {"train_loss": -12.121955871582031, "global_step": 383884, "epoch": 2285} {"train_loss": -12.062896728515625, "global_step": 383885, "epoch": 2285} {"train_loss": -12.149242401123047, "global_step": 383886, "epoch": 2285} {"train_loss": -11.865315437316895, "global_step": 383887, "epoch": 2285} {"train_loss": -12.188919067382812, "global_step": 383888, "epoch": 2285} {"train_loss": -11.975841522216797, "global_step": 383889, "epoch": 2285} {"train_loss": -11.951051712036133, "global_step": 383890, "epoch": 2285} {"train_loss": -12.00860595703125, "global_step": 383891, "epoch": 2285} {"train_loss": -12.41867446899414, "global_step": 383892, "epoch": 2285} {"train_loss": -12.110122680664062, "global_step": 383893, "epoch": 2285} {"train_loss": -12.443251609802246, "global_step": 383894, "epoch": 2285} {"train_loss": -12.167093276977539, "global_step": 383895, "epoch": 2285} {"train_loss": -12.478885650634766, "global_step": 383896, "epoch": 2285} {"train_loss": -11.717681884765625, "global_step": 383897, "epoch": 2285} {"train_loss": -12.318214416503906, "global_step": 383898, "epoch": 2285} {"train_loss": -12.22966194152832, "global_step": 383899, "epoch": 2285} {"train_loss": -11.834888458251953, "global_step": 383900, "epoch": 2285} {"train_loss": -11.696049690246582, "global_step": 383901, "epoch": 2285} {"train_loss": -12.091829299926758, "global_step": 383902, "epoch": 2285} {"train_loss": -11.908037185668945, "global_step": 383903, "epoch": 2285} {"train_loss": -12.345296859741211, "global_step": 383904, "epoch": 2285} {"train_loss": -11.746115684509277, "global_step": 383905, "epoch": 2285} {"train_loss": -12.363842010498047, "global_step": 383906, "epoch": 2285} {"train_loss": -12.16313362121582, "global_step": 383907, "epoch": 2285} {"train_loss": -12.134401321411133, "global_step": 383908, "epoch": 2285} {"train_loss": -12.16645622253418, "global_step": 383909, "epoch": 2285} {"train_loss": -12.10563850402832, "global_step": 383910, "epoch": 2285} {"train_loss": -11.899439811706543, "global_step": 383911, "epoch": 2285} {"train_loss": -12.027095794677734, "global_step": 383912, "epoch": 2285} {"train_loss": -12.00533676147461, "global_step": 383913, "epoch": 2285} {"train_loss": -11.629189491271973, "global_step": 383914, "epoch": 2285} {"train_loss": -12.037740707397461, "global_step": 383915, "epoch": 2285} {"train_loss": -11.683600425720215, "global_step": 383916, "epoch": 2285} {"train_loss": -11.658602714538574, "global_step": 383917, "epoch": 2285} {"train_loss": -11.399208068847656, "global_step": 383918, "epoch": 2285} {"train_loss": -12.197967529296875, "global_step": 383919, "epoch": 2285} {"train_loss": -12.027694702148438, "global_step": 383920, "epoch": 2285} {"train_loss": -11.653152465820312, "global_step": 383921, "epoch": 2285} {"train_loss": -12.496362686157227, "global_step": 383922, "epoch": 2285} {"train_loss": -11.823993682861328, "global_step": 383923, "epoch": 2285} {"train_loss": -12.081511497497559, "global_step": 383924, "epoch": 2285} {"train_loss": -12.164384841918945, "global_step": 383925, "epoch": 2285} {"train_loss": -11.54340934753418, "global_step": 383926, "epoch": 2285} {"train_loss": -11.831937789916992, "global_step": 383927, "epoch": 2285} {"train_loss": -12.096198081970215, "global_step": 383928, "epoch": 2285} {"train_loss": -11.22039794921875, "global_step": 383929, "epoch": 2285} {"train_loss": -12.353228569030762, "global_step": 383930, "epoch": 2285} {"train_loss": -12.256421089172363, "global_step": 383931, "epoch": 2285} {"train_loss": -12.05652141571045, "global_step": 383932, "epoch": 2285} {"train_loss": -12.534364700317383, "global_step": 383933, "epoch": 2285} {"train_loss": -12.114241600036621, "global_step": 383934, "epoch": 2285} {"train_loss": -12.530195236206055, "global_step": 383935, "epoch": 2285} {"train_loss": -12.37348461151123, "global_step": 383936, "epoch": 2285} {"train_loss": -12.374673843383789, "global_step": 383937, "epoch": 2285} {"train_loss": -12.303346633911133, "global_step": 383938, "epoch": 2285} {"train_loss": -12.48520278930664, "global_step": 383939, "epoch": 2285} {"train_loss": -12.399283409118652, "global_step": 383940, "epoch": 2285} {"train_loss": -12.476974487304688, "global_step": 383941, "epoch": 2285} {"train_loss": -12.514646530151367, "global_step": 383942, "epoch": 2285} {"train_loss": -12.492044448852539, "global_step": 383943, "epoch": 2285} {"train_loss": -12.400798797607422, "global_step": 383944, "epoch": 2285} {"train_loss": -12.175415992736816, "global_step": 383945, "epoch": 2285} {"train_loss": -11.992207527160645, "global_step": 383946, "epoch": 2285} {"train_loss": -12.656994819641113, "global_step": 383947, "epoch": 2285} {"train_loss": -12.181836128234863, "global_step": 383948, "epoch": 2285} {"train_loss": -12.635826110839844, "global_step": 383949, "epoch": 2285} {"train_loss": -12.419614791870117, "global_step": 383950, "epoch": 2285} {"train_loss": -12.322809219360352, "global_step": 383951, "epoch": 2285} {"train_loss": -12.685272216796875, "global_step": 383952, "epoch": 2285} {"train_loss": -12.171645164489746, "global_step": 383953, "epoch": 2285} {"train_loss": -12.603325843811035, "global_step": 383954, "epoch": 2285} {"train_loss": -12.508563995361328, "global_step": 383955, "epoch": 2285} {"train_loss": -12.455739974975586, "global_step": 383956, "epoch": 2285} {"train_loss": -12.333544731140137, "global_step": 383957, "epoch": 2285} {"train_loss": -12.796533584594727, "global_step": 383958, "epoch": 2285} {"train_loss": -12.461709976196289, "global_step": 383959, "epoch": 2285} {"train_loss": -12.459840774536133, "global_step": 383960, "epoch": 2285} {"train_loss": -12.332748413085938, "global_step": 383961, "epoch": 2285} {"train_loss": -12.301652908325195, "global_step": 383962, "epoch": 2285} {"train_loss": -12.354684829711914, "global_step": 383963, "epoch": 2285} {"train_loss": -12.27466869354248, "global_step": 383964, "epoch": 2285} {"train_loss": -12.208401679992676, "global_step": 383965, "epoch": 2285} {"train_loss": -12.459033966064453, "global_step": 383966, "epoch": 2285} {"train_loss": -12.475865364074707, "global_step": 383967, "epoch": 2285} {"train_loss": -12.259807586669922, "global_step": 383968, "epoch": 2285} {"train_loss": -12.473119735717773, "global_step": 383969, "epoch": 2285} {"train_loss": -12.21275806427002, "global_step": 383970, "epoch": 2285} {"train_loss": -12.575800895690918, "global_step": 383971, "epoch": 2285} {"train_loss": -12.211408615112305, "global_step": 383972, "epoch": 2285} {"train_loss": -12.276861190795898, "global_step": 383973, "epoch": 2285} {"train_loss": -12.451152801513672, "global_step": 383974, "epoch": 2285} {"train_loss": -12.29815673828125, "global_step": 383975, "epoch": 2285} {"train_loss": -11.641002655029297, "global_step": 383976, "epoch": 2285} {"train_loss": -12.522123336791992, "global_step": 383977, "epoch": 2285} {"train_loss": -11.646440505981445, "global_step": 383978, "epoch": 2285} {"train_loss": -11.795969009399414, "global_step": 383979, "epoch": 2285} {"train_loss": -12.138562202453613, "global_step": 383980, "epoch": 2285} {"train_loss": -11.790492057800293, "global_step": 383981, "epoch": 2285} {"train_loss": -11.499150276184082, "global_step": 383982, "epoch": 2285} {"train_loss": -12.060297012329102, "global_step": 383983, "epoch": 2285} {"train_loss": -11.923246383666992, "global_step": 383984, "epoch": 2285} {"train_loss": -12.684402465820312, "global_step": 383985, "epoch": 2285} {"train_loss": -12.074094772338867, "global_step": 383986, "epoch": 2285} {"train_loss": -11.803991317749023, "global_step": 383987, "epoch": 2285} {"train_loss": -12.560179710388184, "global_step": 383988, "epoch": 2285} {"train_loss": -12.127685546875, "global_step": 383989, "epoch": 2285} {"train_loss": -12.034428596496582, "global_step": 383990, "epoch": 2285} {"train_loss": -11.859672546386719, "global_step": 383991, "epoch": 2285} {"train_loss": -11.678533554077148, "global_step": 383992, "epoch": 2285} {"train_loss": -12.232217788696289, "global_step": 383993, "epoch": 2285} {"train_loss": -11.2611083984375, "global_step": 383994, "epoch": 2285} {"train_loss": -11.878280639648438, "global_step": 383995, "epoch": 2285} {"train_loss": -11.416702270507812, "global_step": 383996, "epoch": 2285} {"train_loss": -12.208484649658203, "global_step": 383997, "epoch": 2285} {"train_loss": -11.979254722595215, "global_step": 383998, "epoch": 2285} {"train_loss": -11.643818855285645, "global_step": 383999, "epoch": 2285} {"train_loss": -11.29738998413086, "global_step": 384000, "epoch": 2285} {"train_loss": -12.14712142944336, "global_step": 384001, "epoch": 2285} {"train_loss": -11.987943649291992, "global_step": 384002, "epoch": 2285} {"train_loss": -11.830137252807617, "global_step": 384003, "epoch": 2285} {"train_loss": -11.28398323059082, "global_step": 384004, "epoch": 2285} {"train_loss": -11.268357276916504, "global_step": 384005, "epoch": 2285} {"train_loss": -12.44930648803711, "global_step": 384006, "epoch": 2285} {"train_loss": -11.409025192260742, "global_step": 384007, "epoch": 2285} {"train_loss": -12.125588417053223, "global_step": 384008, "epoch": 2285} {"train_loss": -11.902486801147461, "global_step": 384009, "epoch": 2285} {"train_loss": -12.14897346496582, "global_step": 384010, "epoch": 2285} {"train_loss": -12.258111953735352, "global_step": 384011, "epoch": 2285} {"train_loss": -12.479812622070312, "global_step": 384012, "epoch": 2285} {"train_loss": -12.186225891113281, "global_step": 384013, "epoch": 2285} {"train_loss": -12.476800918579102, "global_step": 384014, "epoch": 2285} {"train_loss": -12.0816650390625, "global_step": 384015, "epoch": 2285} {"train_loss": -12.11889934539795, "global_step": 384016, "epoch": 2285} {"train_loss": -12.492986679077148, "global_step": 384017, "epoch": 2285} {"train_loss": -12.432218551635742, "global_step": 384018, "epoch": 2285} {"train_loss": -12.203709602355957, "global_step": 384019, "epoch": 2285} {"train_loss": -12.514951705932617, "global_step": 384020, "epoch": 2285} {"train_loss": -12.563146591186523, "global_step": 384021, "epoch": 2285} {"train_loss": -12.451085090637207, "global_step": 384022, "epoch": 2285} {"train_loss": -12.348071098327637, "global_step": 384023, "epoch": 2285} {"train_loss": -12.425042152404785, "global_step": 384024, "epoch": 2285} {"train_loss": -12.553664207458496, "global_step": 384025, "epoch": 2285} {"train_loss": -12.704251289367676, "global_step": 384026, "epoch": 2285} {"train_loss": -12.376553535461426, "global_step": 384027, "epoch": 2285} {"train_loss": -12.424253463745117, "global_step": 384028, "epoch": 2285} {"train_loss": -12.588275909423828, "global_step": 384029, "epoch": 2285} {"train_loss": -12.701403617858887, "global_step": 384030, "epoch": 2285} {"train_loss": -12.73274040222168, "global_step": 384031, "epoch": 2285} {"train_loss": -12.618523597717285, "global_step": 384032, "epoch": 2285} {"train_loss": -12.274683952331543, "global_step": 384033, "epoch": 2285} {"train_loss": -12.43531608581543, "global_step": 384034, "epoch": 2285} {"train_loss": -12.412919044494629, "global_step": 384035, "epoch": 2285} {"train_loss": -12.428380966186523, "global_step": 384036, "epoch": 2285} {"train_loss": -12.354488372802734, "global_step": 384037, "epoch": 2285} {"train_loss": -12.430792808532715, "global_step": 384038, "epoch": 2285} {"train_loss": -12.68099308013916, "global_step": 384039, "epoch": 2285} {"train_loss": -12.4793701171875, "global_step": 384040, "epoch": 2285} {"train_loss": -12.421873092651367, "global_step": 384041, "epoch": 2285} {"train_loss": -12.404623031616211, "global_step": 384042, "epoch": 2285} {"train_loss": -12.682308197021484, "global_step": 384043, "epoch": 2285} {"train_loss": -12.095626831054688, "global_step": 384044, "epoch": 2285} {"train_loss": -12.386675834655762, "global_step": 384045, "epoch": 2285} {"train_loss": -12.708389282226562, "global_step": 384046, "epoch": 2285} {"train_loss": -12.188800709588188, "global_step": 384047, "epoch": 2285, "val_loss": 293652.625, "train_action_mse_error": 1.6905102729797363} {"train_loss": -12.46834945678711, "global_step": 384048, "epoch": 2286} {"train_loss": -12.425731658935547, "global_step": 384049, "epoch": 2286} {"train_loss": -12.445476531982422, "global_step": 384050, "epoch": 2286} {"train_loss": -12.365570068359375, "global_step": 384051, "epoch": 2286} {"train_loss": -12.292957305908203, "global_step": 384052, "epoch": 2286} {"train_loss": -11.799777030944824, "global_step": 384053, "epoch": 2286} {"train_loss": -11.373377799987793, "global_step": 384054, "epoch": 2286} {"train_loss": -12.492018699645996, "global_step": 384055, "epoch": 2286} {"train_loss": -11.295279502868652, "global_step": 384056, "epoch": 2286} {"train_loss": -10.187772750854492, "global_step": 384057, "epoch": 2286} {"train_loss": -11.328185081481934, "global_step": 384058, "epoch": 2286} {"train_loss": -8.81650161743164, "global_step": 384059, "epoch": 2286} {"train_loss": -8.40864372253418, "global_step": 384060, "epoch": 2286} {"train_loss": -8.038263320922852, "global_step": 384061, "epoch": 2286} {"train_loss": -9.483881950378418, "global_step": 384062, "epoch": 2286} {"train_loss": -9.217318534851074, "global_step": 384063, "epoch": 2286} {"train_loss": -9.483463287353516, "global_step": 384064, "epoch": 2286} {"train_loss": -8.619773864746094, "global_step": 384065, "epoch": 2286} {"train_loss": -10.43282699584961, "global_step": 384066, "epoch": 2286} {"train_loss": -10.014808654785156, "global_step": 384067, "epoch": 2286} {"train_loss": -10.602838516235352, "global_step": 384068, "epoch": 2286} {"train_loss": -10.35910415649414, "global_step": 384069, "epoch": 2286} {"train_loss": -9.786479949951172, "global_step": 384070, "epoch": 2286} {"train_loss": -11.057262420654297, "global_step": 384071, "epoch": 2286} {"train_loss": -10.5987548828125, "global_step": 384072, "epoch": 2286} {"train_loss": -9.405244827270508, "global_step": 384073, "epoch": 2286} {"train_loss": -9.977203369140625, "global_step": 384074, "epoch": 2286} {"train_loss": -10.186079025268555, "global_step": 384075, "epoch": 2286} {"train_loss": -10.192159652709961, "global_step": 384076, "epoch": 2286} {"train_loss": -9.678197860717773, "global_step": 384077, "epoch": 2286} {"train_loss": -10.665374755859375, "global_step": 384078, "epoch": 2286} {"train_loss": -10.702759742736816, "global_step": 384079, "epoch": 2286} {"train_loss": -10.069607734680176, "global_step": 384080, "epoch": 2286} {"train_loss": -11.206857681274414, "global_step": 384081, "epoch": 2286} {"train_loss": -10.864163398742676, "global_step": 384082, "epoch": 2286} {"train_loss": -10.972214698791504, "global_step": 384083, "epoch": 2286} {"train_loss": -10.990757942199707, "global_step": 384084, "epoch": 2286} {"train_loss": -10.876710891723633, "global_step": 384085, "epoch": 2286} {"train_loss": -11.370387077331543, "global_step": 384086, "epoch": 2286} {"train_loss": -10.833362579345703, "global_step": 384087, "epoch": 2286} {"train_loss": -11.47480583190918, "global_step": 384088, "epoch": 2286} {"train_loss": -10.836822509765625, "global_step": 384089, "epoch": 2286} {"train_loss": -11.625744819641113, "global_step": 384090, "epoch": 2286} {"train_loss": -11.069228172302246, "global_step": 384091, "epoch": 2286} {"train_loss": -11.535598754882812, "global_step": 384092, "epoch": 2286} {"train_loss": -11.590270042419434, "global_step": 384093, "epoch": 2286} {"train_loss": -11.693115234375, "global_step": 384094, "epoch": 2286} {"train_loss": -11.734663009643555, "global_step": 384095, "epoch": 2286} {"train_loss": -12.008413314819336, "global_step": 384096, "epoch": 2286} {"train_loss": -11.979472160339355, "global_step": 384097, "epoch": 2286} {"train_loss": -11.945564270019531, "global_step": 384098, "epoch": 2286} {"train_loss": -11.761384963989258, "global_step": 384099, "epoch": 2286} {"train_loss": -11.93150520324707, "global_step": 384100, "epoch": 2286} {"train_loss": -11.917481422424316, "global_step": 384101, "epoch": 2286} {"train_loss": -12.112201690673828, "global_step": 384102, "epoch": 2286} {"train_loss": -11.884902954101562, "global_step": 384103, "epoch": 2286} {"train_loss": -12.321020126342773, "global_step": 384104, "epoch": 2286} {"train_loss": -11.769669532775879, "global_step": 384105, "epoch": 2286} {"train_loss": -12.05424976348877, "global_step": 384106, "epoch": 2286} {"train_loss": -11.810239791870117, "global_step": 384107, "epoch": 2286} {"train_loss": -12.197715759277344, "global_step": 384108, "epoch": 2286} {"train_loss": -12.083854675292969, "global_step": 384109, "epoch": 2286} {"train_loss": -12.147453308105469, "global_step": 384110, "epoch": 2286} {"train_loss": -12.410337448120117, "global_step": 384111, "epoch": 2286} {"train_loss": -11.848432540893555, "global_step": 384112, "epoch": 2286} {"train_loss": -12.305455207824707, "global_step": 384113, "epoch": 2286} {"train_loss": -12.327220916748047, "global_step": 384114, "epoch": 2286} {"train_loss": -11.98660945892334, "global_step": 384115, "epoch": 2286} {"train_loss": -12.281288146972656, "global_step": 384116, "epoch": 2286} {"train_loss": -12.129966735839844, "global_step": 384117, "epoch": 2286} {"train_loss": -12.265291213989258, "global_step": 384118, "epoch": 2286} {"train_loss": -12.111892700195312, "global_step": 384119, "epoch": 2286} {"train_loss": -12.061805725097656, "global_step": 384120, "epoch": 2286} {"train_loss": -12.367414474487305, "global_step": 384121, "epoch": 2286} {"train_loss": -11.880672454833984, "global_step": 384122, "epoch": 2286} {"train_loss": -12.271055221557617, "global_step": 384123, "epoch": 2286} {"train_loss": -11.58154296875, "global_step": 384124, "epoch": 2286} {"train_loss": -12.349817276000977, "global_step": 384125, "epoch": 2286} {"train_loss": -11.99039363861084, "global_step": 384126, "epoch": 2286} {"train_loss": -12.067337036132812, "global_step": 384127, "epoch": 2286} {"train_loss": -12.002548217773438, "global_step": 384128, "epoch": 2286} {"train_loss": -12.07771110534668, "global_step": 384129, "epoch": 2286} {"train_loss": -12.151985168457031, "global_step": 384130, "epoch": 2286} {"train_loss": -12.045608520507812, "global_step": 384131, "epoch": 2286} {"train_loss": -12.570928573608398, "global_step": 384132, "epoch": 2286} {"train_loss": -12.148205757141113, "global_step": 384133, "epoch": 2286} {"train_loss": -12.361873626708984, "global_step": 384134, "epoch": 2286} {"train_loss": -12.33336067199707, "global_step": 384135, "epoch": 2286} {"train_loss": -11.822908401489258, "global_step": 384136, "epoch": 2286} {"train_loss": -12.25269603729248, "global_step": 384137, "epoch": 2286} {"train_loss": -12.043619155883789, "global_step": 384138, "epoch": 2286} {"train_loss": -12.42357063293457, "global_step": 384139, "epoch": 2286} {"train_loss": -12.032434463500977, "global_step": 384140, "epoch": 2286} {"train_loss": -12.275671005249023, "global_step": 384141, "epoch": 2286} {"train_loss": -12.187582015991211, "global_step": 384142, "epoch": 2286} {"train_loss": -12.376487731933594, "global_step": 384143, "epoch": 2286} {"train_loss": -12.607789039611816, "global_step": 384144, "epoch": 2286} {"train_loss": -12.274856567382812, "global_step": 384145, "epoch": 2286} {"train_loss": -12.605573654174805, "global_step": 384146, "epoch": 2286} {"train_loss": -12.47850227355957, "global_step": 384147, "epoch": 2286} {"train_loss": -12.483946800231934, "global_step": 384148, "epoch": 2286} {"train_loss": -12.580804824829102, "global_step": 384149, "epoch": 2286} {"train_loss": -12.331241607666016, "global_step": 384150, "epoch": 2286} {"train_loss": -12.307340621948242, "global_step": 384151, "epoch": 2286} {"train_loss": -12.597188949584961, "global_step": 384152, "epoch": 2286} {"train_loss": -12.537874221801758, "global_step": 384153, "epoch": 2286} {"train_loss": -12.554162979125977, "global_step": 384154, "epoch": 2286} {"train_loss": -12.36441421508789, "global_step": 384155, "epoch": 2286} {"train_loss": -12.552586555480957, "global_step": 384156, "epoch": 2286} {"train_loss": -12.510860443115234, "global_step": 384157, "epoch": 2286} {"train_loss": -12.503950119018555, "global_step": 384158, "epoch": 2286} {"train_loss": -12.770791053771973, "global_step": 384159, "epoch": 2286} {"train_loss": -12.525075912475586, "global_step": 384160, "epoch": 2286} {"train_loss": -12.798689842224121, "global_step": 384161, "epoch": 2286} {"train_loss": -12.489355087280273, "global_step": 384162, "epoch": 2286} {"train_loss": -12.655399322509766, "global_step": 384163, "epoch": 2286} {"train_loss": -12.63619613647461, "global_step": 384164, "epoch": 2286} {"train_loss": -12.666833877563477, "global_step": 384165, "epoch": 2286} {"train_loss": -12.93404769897461, "global_step": 384166, "epoch": 2286} {"train_loss": -12.449987411499023, "global_step": 384167, "epoch": 2286} {"train_loss": -11.894877433776855, "global_step": 384168, "epoch": 2286} {"train_loss": -12.424040794372559, "global_step": 384169, "epoch": 2286} {"train_loss": -12.500852584838867, "global_step": 384170, "epoch": 2286} {"train_loss": -12.338150024414062, "global_step": 384171, "epoch": 2286} {"train_loss": -11.904385566711426, "global_step": 384172, "epoch": 2286} {"train_loss": -12.042867660522461, "global_step": 384173, "epoch": 2286} {"train_loss": -12.649626731872559, "global_step": 384174, "epoch": 2286} {"train_loss": -12.008513450622559, "global_step": 384175, "epoch": 2286} {"train_loss": -12.221389770507812, "global_step": 384176, "epoch": 2286} {"train_loss": -12.469184875488281, "global_step": 384177, "epoch": 2286} {"train_loss": -12.384452819824219, "global_step": 384178, "epoch": 2286} {"train_loss": -12.145203590393066, "global_step": 384179, "epoch": 2286} {"train_loss": -12.646201133728027, "global_step": 384180, "epoch": 2286} {"train_loss": -11.786140441894531, "global_step": 384181, "epoch": 2286} {"train_loss": -11.119367599487305, "global_step": 384182, "epoch": 2286} {"train_loss": -12.581613540649414, "global_step": 384183, "epoch": 2286} {"train_loss": -12.317569732666016, "global_step": 384184, "epoch": 2286} {"train_loss": -11.869363784790039, "global_step": 384185, "epoch": 2286} {"train_loss": -12.275453567504883, "global_step": 384186, "epoch": 2286} {"train_loss": -11.536626815795898, "global_step": 384187, "epoch": 2286} {"train_loss": -10.557841300964355, "global_step": 384188, "epoch": 2286} {"train_loss": -12.428266525268555, "global_step": 384189, "epoch": 2286} {"train_loss": -10.802253723144531, "global_step": 384190, "epoch": 2286} {"train_loss": -9.622236251831055, "global_step": 384191, "epoch": 2286} {"train_loss": -11.309367179870605, "global_step": 384192, "epoch": 2286} {"train_loss": -8.440826416015625, "global_step": 384193, "epoch": 2286} {"train_loss": -10.963847160339355, "global_step": 384194, "epoch": 2286} {"train_loss": -8.876565933227539, "global_step": 384195, "epoch": 2286} {"train_loss": -11.055335998535156, "global_step": 384196, "epoch": 2286} {"train_loss": -8.289892196655273, "global_step": 384197, "epoch": 2286} {"train_loss": -8.72134780883789, "global_step": 384198, "epoch": 2286} {"train_loss": -10.940914154052734, "global_step": 384199, "epoch": 2286} {"train_loss": -8.066000938415527, "global_step": 384200, "epoch": 2286} {"train_loss": -9.423605918884277, "global_step": 384201, "epoch": 2286} {"train_loss": -8.03913402557373, "global_step": 384202, "epoch": 2286} {"train_loss": -8.396629333496094, "global_step": 384203, "epoch": 2286} {"train_loss": -8.351222038269043, "global_step": 384204, "epoch": 2286} {"train_loss": -9.099555969238281, "global_step": 384205, "epoch": 2286} {"train_loss": -9.062253952026367, "global_step": 384206, "epoch": 2286} {"train_loss": -8.992141723632812, "global_step": 384207, "epoch": 2286} {"train_loss": -10.269909858703613, "global_step": 384208, "epoch": 2286} {"train_loss": -10.839910507202148, "global_step": 384209, "epoch": 2286} {"train_loss": -9.237948417663574, "global_step": 384210, "epoch": 2286} {"train_loss": -8.68637752532959, "global_step": 384211, "epoch": 2286} {"train_loss": -9.80014419555664, "global_step": 384212, "epoch": 2286} {"train_loss": -10.281693458557129, "global_step": 384213, "epoch": 2286} {"train_loss": -9.033308029174805, "global_step": 384214, "epoch": 2286} {"train_loss": -11.365808611824399, "global_step": 384215, "epoch": 2286, "val_loss": 287676.65625} {"train_loss": -10.141183853149414, "global_step": 384216, "epoch": 2287} {"train_loss": -10.186054229736328, "global_step": 384217, "epoch": 2287} {"train_loss": -10.95455551147461, "global_step": 384218, "epoch": 2287} {"train_loss": -9.855791091918945, "global_step": 384219, "epoch": 2287} {"train_loss": -10.026309967041016, "global_step": 384220, "epoch": 2287} {"train_loss": -11.17712688446045, "global_step": 384221, "epoch": 2287} {"train_loss": -11.033792495727539, "global_step": 384222, "epoch": 2287} {"train_loss": -10.634173393249512, "global_step": 384223, "epoch": 2287} {"train_loss": -10.9359769821167, "global_step": 384224, "epoch": 2287} {"train_loss": -11.121492385864258, "global_step": 384225, "epoch": 2287} {"train_loss": -10.939825057983398, "global_step": 384226, "epoch": 2287} {"train_loss": -11.716399192810059, "global_step": 384227, "epoch": 2287} {"train_loss": -11.780338287353516, "global_step": 384228, "epoch": 2287} {"train_loss": -11.570012092590332, "global_step": 384229, "epoch": 2287} {"train_loss": -11.227604866027832, "global_step": 384230, "epoch": 2287} {"train_loss": -11.719260215759277, "global_step": 384231, "epoch": 2287} {"train_loss": -11.134292602539062, "global_step": 384232, "epoch": 2287} {"train_loss": -11.767023086547852, "global_step": 384233, "epoch": 2287} {"train_loss": -11.573923110961914, "global_step": 384234, "epoch": 2287} {"train_loss": -11.72867202758789, "global_step": 384235, "epoch": 2287} {"train_loss": -11.958345413208008, "global_step": 384236, "epoch": 2287} {"train_loss": -12.033190727233887, "global_step": 384237, "epoch": 2287} {"train_loss": -11.364984512329102, "global_step": 384238, "epoch": 2287} {"train_loss": -11.637356758117676, "global_step": 384239, "epoch": 2287} {"train_loss": -11.89358139038086, "global_step": 384240, "epoch": 2287} {"train_loss": -12.101024627685547, "global_step": 384241, "epoch": 2287} {"train_loss": -12.17306137084961, "global_step": 384242, "epoch": 2287} {"train_loss": -11.642170906066895, "global_step": 384243, "epoch": 2287} {"train_loss": -11.930682182312012, "global_step": 384244, "epoch": 2287} {"train_loss": -11.81075668334961, "global_step": 384245, "epoch": 2287} {"train_loss": -12.179452896118164, "global_step": 384246, "epoch": 2287} {"train_loss": -12.117740631103516, "global_step": 384247, "epoch": 2287} {"train_loss": -12.190980911254883, "global_step": 384248, "epoch": 2287} {"train_loss": -12.181621551513672, "global_step": 384249, "epoch": 2287} {"train_loss": -12.226861953735352, "global_step": 384250, "epoch": 2287} {"train_loss": -12.115615844726562, "global_step": 384251, "epoch": 2287} {"train_loss": -12.195114135742188, "global_step": 384252, "epoch": 2287} {"train_loss": -12.208621978759766, "global_step": 384253, "epoch": 2287} {"train_loss": -12.047956466674805, "global_step": 384254, "epoch": 2287} {"train_loss": -12.213260650634766, "global_step": 384255, "epoch": 2287} {"train_loss": -11.892057418823242, "global_step": 384256, "epoch": 2287} {"train_loss": -12.250560760498047, "global_step": 384257, "epoch": 2287} {"train_loss": -12.363234519958496, "global_step": 384258, "epoch": 2287} {"train_loss": -12.312323570251465, "global_step": 384259, "epoch": 2287} {"train_loss": -12.24189567565918, "global_step": 384260, "epoch": 2287} {"train_loss": -12.499162673950195, "global_step": 384261, "epoch": 2287} {"train_loss": -12.05489444732666, "global_step": 384262, "epoch": 2287} {"train_loss": -12.272735595703125, "global_step": 384263, "epoch": 2287} {"train_loss": -12.462709426879883, "global_step": 384264, "epoch": 2287} {"train_loss": -12.307093620300293, "global_step": 384265, "epoch": 2287} {"train_loss": -12.41220474243164, "global_step": 384266, "epoch": 2287} {"train_loss": -12.25568675994873, "global_step": 384267, "epoch": 2287} {"train_loss": -12.313213348388672, "global_step": 384268, "epoch": 2287} {"train_loss": -12.564483642578125, "global_step": 384269, "epoch": 2287} {"train_loss": -12.384671211242676, "global_step": 384270, "epoch": 2287} {"train_loss": -12.443618774414062, "global_step": 384271, "epoch": 2287} {"train_loss": -12.341054916381836, "global_step": 384272, "epoch": 2287} {"train_loss": -12.511680603027344, "global_step": 384273, "epoch": 2287} {"train_loss": -12.48434829711914, "global_step": 384274, "epoch": 2287} {"train_loss": -12.237466812133789, "global_step": 384275, "epoch": 2287} {"train_loss": -12.46280574798584, "global_step": 384276, "epoch": 2287} {"train_loss": -12.497634887695312, "global_step": 384277, "epoch": 2287} {"train_loss": -12.225142478942871, "global_step": 384278, "epoch": 2287} {"train_loss": -12.464603424072266, "global_step": 384279, "epoch": 2287} {"train_loss": -12.492555618286133, "global_step": 384280, "epoch": 2287} {"train_loss": -12.470419883728027, "global_step": 384281, "epoch": 2287} {"train_loss": -12.532037734985352, "global_step": 384282, "epoch": 2287} {"train_loss": -12.476922988891602, "global_step": 384283, "epoch": 2287} {"train_loss": -12.484644889831543, "global_step": 384284, "epoch": 2287} {"train_loss": -12.408124923706055, "global_step": 384285, "epoch": 2287} {"train_loss": -12.469675064086914, "global_step": 384286, "epoch": 2287} {"train_loss": -12.396096229553223, "global_step": 384287, "epoch": 2287} {"train_loss": -12.570836067199707, "global_step": 384288, "epoch": 2287} {"train_loss": -12.630281448364258, "global_step": 384289, "epoch": 2287} {"train_loss": -12.218318939208984, "global_step": 384290, "epoch": 2287} {"train_loss": -12.543977737426758, "global_step": 384291, "epoch": 2287} {"train_loss": -12.463520050048828, "global_step": 384292, "epoch": 2287} {"train_loss": -12.476678848266602, "global_step": 384293, "epoch": 2287} {"train_loss": -12.423029899597168, "global_step": 384294, "epoch": 2287} {"train_loss": -12.516006469726562, "global_step": 384295, "epoch": 2287} {"train_loss": -12.72739028930664, "global_step": 384296, "epoch": 2287} {"train_loss": -12.473543167114258, "global_step": 384297, "epoch": 2287} {"train_loss": -12.4666109085083, "global_step": 384298, "epoch": 2287} {"train_loss": -12.675084114074707, "global_step": 384299, "epoch": 2287} {"train_loss": -12.570255279541016, "global_step": 384300, "epoch": 2287} {"train_loss": -12.611639022827148, "global_step": 384301, "epoch": 2287} {"train_loss": -12.733643531799316, "global_step": 384302, "epoch": 2287} {"train_loss": -12.503220558166504, "global_step": 384303, "epoch": 2287} {"train_loss": -12.69369888305664, "global_step": 384304, "epoch": 2287} {"train_loss": -12.544261932373047, "global_step": 384305, "epoch": 2287} {"train_loss": -12.384296417236328, "global_step": 384306, "epoch": 2287} {"train_loss": -12.35312271118164, "global_step": 384307, "epoch": 2287} {"train_loss": -11.907831192016602, "global_step": 384308, "epoch": 2287} {"train_loss": -12.309804916381836, "global_step": 384309, "epoch": 2287} {"train_loss": -12.454010963439941, "global_step": 384310, "epoch": 2287} {"train_loss": -11.807121276855469, "global_step": 384311, "epoch": 2287} {"train_loss": -11.581851959228516, "global_step": 384312, "epoch": 2287} {"train_loss": -11.237926483154297, "global_step": 384313, "epoch": 2287} {"train_loss": -10.072912216186523, "global_step": 384314, "epoch": 2287} {"train_loss": -9.017580032348633, "global_step": 384315, "epoch": 2287} {"train_loss": -9.584897994995117, "global_step": 384316, "epoch": 2287} {"train_loss": -9.727194786071777, "global_step": 384317, "epoch": 2287} {"train_loss": -9.761669158935547, "global_step": 384318, "epoch": 2287} {"train_loss": -9.978645324707031, "global_step": 384319, "epoch": 2287} {"train_loss": -10.419575691223145, "global_step": 384320, "epoch": 2287} {"train_loss": -10.120534896850586, "global_step": 384321, "epoch": 2287} {"train_loss": -10.76214599609375, "global_step": 384322, "epoch": 2287} {"train_loss": -10.791707038879395, "global_step": 384323, "epoch": 2287} {"train_loss": -11.28418254852295, "global_step": 384324, "epoch": 2287} {"train_loss": -10.715261459350586, "global_step": 384325, "epoch": 2287} {"train_loss": -11.425093650817871, "global_step": 384326, "epoch": 2287} {"train_loss": -11.00046157836914, "global_step": 384327, "epoch": 2287} {"train_loss": -10.57233715057373, "global_step": 384328, "epoch": 2287} {"train_loss": -12.029749870300293, "global_step": 384329, "epoch": 2287} {"train_loss": -11.305509567260742, "global_step": 384330, "epoch": 2287} {"train_loss": -11.726751327514648, "global_step": 384331, "epoch": 2287} {"train_loss": -11.251635551452637, "global_step": 384332, "epoch": 2287} {"train_loss": -11.699945449829102, "global_step": 384333, "epoch": 2287} {"train_loss": -11.13098430633545, "global_step": 384334, "epoch": 2287} {"train_loss": -11.889533996582031, "global_step": 384335, "epoch": 2287} {"train_loss": -11.377243041992188, "global_step": 384336, "epoch": 2287} {"train_loss": -11.94601058959961, "global_step": 384337, "epoch": 2287} {"train_loss": -11.88532829284668, "global_step": 384338, "epoch": 2287} {"train_loss": -11.759000778198242, "global_step": 384339, "epoch": 2287} {"train_loss": -11.728384971618652, "global_step": 384340, "epoch": 2287} {"train_loss": -11.608612060546875, "global_step": 384341, "epoch": 2287} {"train_loss": -11.657999992370605, "global_step": 384342, "epoch": 2287} {"train_loss": -11.53591537475586, "global_step": 384343, "epoch": 2287} {"train_loss": -12.181377410888672, "global_step": 384344, "epoch": 2287} {"train_loss": -11.325613975524902, "global_step": 384345, "epoch": 2287} {"train_loss": -12.148614883422852, "global_step": 384346, "epoch": 2287} {"train_loss": -11.395267486572266, "global_step": 384347, "epoch": 2287} {"train_loss": -11.707338333129883, "global_step": 384348, "epoch": 2287} {"train_loss": -10.67399787902832, "global_step": 384349, "epoch": 2287} {"train_loss": -11.561050415039062, "global_step": 384350, "epoch": 2287} {"train_loss": -10.987510681152344, "global_step": 384351, "epoch": 2287} {"train_loss": -10.866174697875977, "global_step": 384352, "epoch": 2287} {"train_loss": -10.294426918029785, "global_step": 384353, "epoch": 2287} {"train_loss": -11.146596908569336, "global_step": 384354, "epoch": 2287} {"train_loss": -10.720460891723633, "global_step": 384355, "epoch": 2287} {"train_loss": -10.702184677124023, "global_step": 384356, "epoch": 2287} {"train_loss": -10.727642059326172, "global_step": 384357, "epoch": 2287} {"train_loss": -11.267295837402344, "global_step": 384358, "epoch": 2287} {"train_loss": -11.017749786376953, "global_step": 384359, "epoch": 2287} {"train_loss": -10.463699340820312, "global_step": 384360, "epoch": 2287} {"train_loss": -11.082335472106934, "global_step": 384361, "epoch": 2287} {"train_loss": -10.878569602966309, "global_step": 384362, "epoch": 2287} {"train_loss": -9.930086135864258, "global_step": 384363, "epoch": 2287} {"train_loss": -11.490324020385742, "global_step": 384364, "epoch": 2287} {"train_loss": -10.96034049987793, "global_step": 384365, "epoch": 2287} {"train_loss": -9.872126579284668, "global_step": 384366, "epoch": 2287} {"train_loss": -11.658709526062012, "global_step": 384367, "epoch": 2287} {"train_loss": -11.420631408691406, "global_step": 384368, "epoch": 2287} {"train_loss": -11.024351119995117, "global_step": 384369, "epoch": 2287} {"train_loss": -11.315985679626465, "global_step": 384370, "epoch": 2287} {"train_loss": -11.012310028076172, "global_step": 384371, "epoch": 2287} {"train_loss": -10.900720596313477, "global_step": 384372, "epoch": 2287} {"train_loss": -11.307079315185547, "global_step": 384373, "epoch": 2287} {"train_loss": -11.145631790161133, "global_step": 384374, "epoch": 2287} {"train_loss": -11.280627250671387, "global_step": 384375, "epoch": 2287} {"train_loss": -11.561439514160156, "global_step": 384376, "epoch": 2287} {"train_loss": -11.288667678833008, "global_step": 384377, "epoch": 2287} {"train_loss": -11.169755935668945, "global_step": 384378, "epoch": 2287} {"train_loss": -11.67344856262207, "global_step": 384379, "epoch": 2287} {"train_loss": -10.550981521606445, "global_step": 384380, "epoch": 2287} {"train_loss": -11.428091049194336, "global_step": 384381, "epoch": 2287} {"train_loss": -11.233541488647461, "global_step": 384382, "epoch": 2287} {"train_loss": -11.627140908014207, "global_step": 384383, "epoch": 2287, "val_loss": 291696.09375} {"train_loss": -12.061033248901367, "global_step": 384384, "epoch": 2288} {"train_loss": -11.192188262939453, "global_step": 384385, "epoch": 2288} {"train_loss": -12.015206336975098, "global_step": 384386, "epoch": 2288} {"train_loss": -11.558565139770508, "global_step": 384387, "epoch": 2288} {"train_loss": -11.354902267456055, "global_step": 384388, "epoch": 2288} {"train_loss": -11.366445541381836, "global_step": 384389, "epoch": 2288} {"train_loss": -11.795808792114258, "global_step": 384390, "epoch": 2288} {"train_loss": -11.885501861572266, "global_step": 384391, "epoch": 2288} {"train_loss": -11.215368270874023, "global_step": 384392, "epoch": 2288} {"train_loss": -11.901947021484375, "global_step": 384393, "epoch": 2288} {"train_loss": -11.901346206665039, "global_step": 384394, "epoch": 2288} {"train_loss": -11.017032623291016, "global_step": 384395, "epoch": 2288} {"train_loss": -11.421401977539062, "global_step": 384396, "epoch": 2288} {"train_loss": -11.484976768493652, "global_step": 384397, "epoch": 2288} {"train_loss": -11.411457061767578, "global_step": 384398, "epoch": 2288} {"train_loss": -12.008338928222656, "global_step": 384399, "epoch": 2288} {"train_loss": -11.805732727050781, "global_step": 384400, "epoch": 2288} {"train_loss": -11.920918464660645, "global_step": 384401, "epoch": 2288} {"train_loss": -12.189193725585938, "global_step": 384402, "epoch": 2288} {"train_loss": -12.117302894592285, "global_step": 384403, "epoch": 2288} {"train_loss": -11.842357635498047, "global_step": 384404, "epoch": 2288} {"train_loss": -12.202022552490234, "global_step": 384405, "epoch": 2288} {"train_loss": -11.996698379516602, "global_step": 384406, "epoch": 2288} {"train_loss": -12.153266906738281, "global_step": 384407, "epoch": 2288} {"train_loss": -11.910411834716797, "global_step": 384408, "epoch": 2288} {"train_loss": -12.140438079833984, "global_step": 384409, "epoch": 2288} {"train_loss": -11.866750717163086, "global_step": 384410, "epoch": 2288} {"train_loss": -12.371929168701172, "global_step": 384411, "epoch": 2288} {"train_loss": -11.958269119262695, "global_step": 384412, "epoch": 2288} {"train_loss": -12.130704879760742, "global_step": 384413, "epoch": 2288} {"train_loss": -12.14295768737793, "global_step": 384414, "epoch": 2288} {"train_loss": -12.14555549621582, "global_step": 384415, "epoch": 2288} {"train_loss": -12.135234832763672, "global_step": 384416, "epoch": 2288} {"train_loss": -12.296453475952148, "global_step": 384417, "epoch": 2288} {"train_loss": -12.086398124694824, "global_step": 384418, "epoch": 2288} {"train_loss": -12.133127212524414, "global_step": 384419, "epoch": 2288} {"train_loss": -12.070032119750977, "global_step": 384420, "epoch": 2288} {"train_loss": -12.236601829528809, "global_step": 384421, "epoch": 2288} {"train_loss": -12.24522590637207, "global_step": 384422, "epoch": 2288} {"train_loss": -12.059256553649902, "global_step": 384423, "epoch": 2288} {"train_loss": -12.295555114746094, "global_step": 384424, "epoch": 2288} {"train_loss": -12.358766555786133, "global_step": 384425, "epoch": 2288} {"train_loss": -12.421295166015625, "global_step": 384426, "epoch": 2288} {"train_loss": -12.405207633972168, "global_step": 384427, "epoch": 2288} {"train_loss": -12.384176254272461, "global_step": 384428, "epoch": 2288} {"train_loss": -12.03492546081543, "global_step": 384429, "epoch": 2288} {"train_loss": -12.54580307006836, "global_step": 384430, "epoch": 2288} {"train_loss": -12.312276840209961, "global_step": 384431, "epoch": 2288} {"train_loss": -12.430477142333984, "global_step": 384432, "epoch": 2288} {"train_loss": -12.354155540466309, "global_step": 384433, "epoch": 2288} {"train_loss": -12.513481140136719, "global_step": 384434, "epoch": 2288} {"train_loss": -12.255941390991211, "global_step": 384435, "epoch": 2288} {"train_loss": -12.552902221679688, "global_step": 384436, "epoch": 2288} {"train_loss": -12.333942413330078, "global_step": 384437, "epoch": 2288} {"train_loss": -12.44168758392334, "global_step": 384438, "epoch": 2288} {"train_loss": -12.184457778930664, "global_step": 384439, "epoch": 2288} {"train_loss": -12.601753234863281, "global_step": 384440, "epoch": 2288} {"train_loss": -12.394665718078613, "global_step": 384441, "epoch": 2288} {"train_loss": -12.615610122680664, "global_step": 384442, "epoch": 2288} {"train_loss": -12.264602661132812, "global_step": 384443, "epoch": 2288} {"train_loss": -12.624725341796875, "global_step": 384444, "epoch": 2288} {"train_loss": -12.1527738571167, "global_step": 384445, "epoch": 2288} {"train_loss": -12.407660484313965, "global_step": 384446, "epoch": 2288} {"train_loss": -12.305571556091309, "global_step": 384447, "epoch": 2288} {"train_loss": -12.51414966583252, "global_step": 384448, "epoch": 2288} {"train_loss": -12.501218795776367, "global_step": 384449, "epoch": 2288} {"train_loss": -11.79462718963623, "global_step": 384450, "epoch": 2288} {"train_loss": -12.440720558166504, "global_step": 384451, "epoch": 2288} {"train_loss": -12.155265808105469, "global_step": 384452, "epoch": 2288} {"train_loss": -12.47947883605957, "global_step": 384453, "epoch": 2288} {"train_loss": -12.451769828796387, "global_step": 384454, "epoch": 2288} {"train_loss": -12.464933395385742, "global_step": 384455, "epoch": 2288} {"train_loss": -12.103023529052734, "global_step": 384456, "epoch": 2288} {"train_loss": -12.119149208068848, "global_step": 384457, "epoch": 2288} {"train_loss": -12.347787857055664, "global_step": 384458, "epoch": 2288} {"train_loss": -12.434697151184082, "global_step": 384459, "epoch": 2288} {"train_loss": -12.539016723632812, "global_step": 384460, "epoch": 2288} {"train_loss": -12.714981079101562, "global_step": 384461, "epoch": 2288} {"train_loss": -12.765591621398926, "global_step": 384462, "epoch": 2288} {"train_loss": -12.415302276611328, "global_step": 384463, "epoch": 2288} {"train_loss": -12.729060173034668, "global_step": 384464, "epoch": 2288} {"train_loss": -12.457900047302246, "global_step": 384465, "epoch": 2288} {"train_loss": -12.436275482177734, "global_step": 384466, "epoch": 2288} {"train_loss": -12.757415771484375, "global_step": 384467, "epoch": 2288} {"train_loss": -12.304401397705078, "global_step": 384468, "epoch": 2288} {"train_loss": -12.515755653381348, "global_step": 384469, "epoch": 2288} {"train_loss": -12.598989486694336, "global_step": 384470, "epoch": 2288} {"train_loss": -12.69124984741211, "global_step": 384471, "epoch": 2288} {"train_loss": -12.70456600189209, "global_step": 384472, "epoch": 2288} {"train_loss": -12.520625114440918, "global_step": 384473, "epoch": 2288} {"train_loss": -12.625873565673828, "global_step": 384474, "epoch": 2288} {"train_loss": -12.494513511657715, "global_step": 384475, "epoch": 2288} {"train_loss": -12.794563293457031, "global_step": 384476, "epoch": 2288} {"train_loss": -12.833066940307617, "global_step": 384477, "epoch": 2288} {"train_loss": -12.595430374145508, "global_step": 384478, "epoch": 2288} {"train_loss": -12.749238967895508, "global_step": 384479, "epoch": 2288} {"train_loss": -12.658787727355957, "global_step": 384480, "epoch": 2288} {"train_loss": -12.810243606567383, "global_step": 384481, "epoch": 2288} {"train_loss": -12.78076171875, "global_step": 384482, "epoch": 2288} {"train_loss": -12.757832527160645, "global_step": 384483, "epoch": 2288} {"train_loss": -12.549728393554688, "global_step": 384484, "epoch": 2288} {"train_loss": -12.528802871704102, "global_step": 384485, "epoch": 2288} {"train_loss": -12.538537979125977, "global_step": 384486, "epoch": 2288} {"train_loss": -12.608543395996094, "global_step": 384487, "epoch": 2288} {"train_loss": -12.627595901489258, "global_step": 384488, "epoch": 2288} {"train_loss": -12.534896850585938, "global_step": 384489, "epoch": 2288} {"train_loss": -12.619270324707031, "global_step": 384490, "epoch": 2288} {"train_loss": -12.334314346313477, "global_step": 384491, "epoch": 2288} {"train_loss": -12.100687980651855, "global_step": 384492, "epoch": 2288} {"train_loss": -11.700310707092285, "global_step": 384493, "epoch": 2288} {"train_loss": -11.989276885986328, "global_step": 384494, "epoch": 2288} {"train_loss": -12.394460678100586, "global_step": 384495, "epoch": 2288} {"train_loss": -12.293323516845703, "global_step": 384496, "epoch": 2288} {"train_loss": -12.700737953186035, "global_step": 384497, "epoch": 2288} {"train_loss": -12.515151977539062, "global_step": 384498, "epoch": 2288} {"train_loss": -12.599761009216309, "global_step": 384499, "epoch": 2288} {"train_loss": -12.413976669311523, "global_step": 384500, "epoch": 2288} {"train_loss": -12.211835861206055, "global_step": 384501, "epoch": 2288} {"train_loss": -12.394933700561523, "global_step": 384502, "epoch": 2288} {"train_loss": -11.110481262207031, "global_step": 384503, "epoch": 2288} {"train_loss": -11.80898666381836, "global_step": 384504, "epoch": 2288} {"train_loss": -12.109359741210938, "global_step": 384505, "epoch": 2288} {"train_loss": -12.25633430480957, "global_step": 384506, "epoch": 2288} {"train_loss": -11.892914772033691, "global_step": 384507, "epoch": 2288} {"train_loss": -12.671283721923828, "global_step": 384508, "epoch": 2288} {"train_loss": -12.481388092041016, "global_step": 384509, "epoch": 2288} {"train_loss": -12.317094802856445, "global_step": 384510, "epoch": 2288} {"train_loss": -12.114789009094238, "global_step": 384511, "epoch": 2288} {"train_loss": -12.554576873779297, "global_step": 384512, "epoch": 2288} {"train_loss": -12.343181610107422, "global_step": 384513, "epoch": 2288} {"train_loss": -12.418350219726562, "global_step": 384514, "epoch": 2288} {"train_loss": -12.209997177124023, "global_step": 384515, "epoch": 2288} {"train_loss": -12.721078872680664, "global_step": 384516, "epoch": 2288} {"train_loss": -11.298484802246094, "global_step": 384517, "epoch": 2288} {"train_loss": -11.06777572631836, "global_step": 384518, "epoch": 2288} {"train_loss": -11.173622131347656, "global_step": 384519, "epoch": 2288} {"train_loss": -12.040614128112793, "global_step": 384520, "epoch": 2288} {"train_loss": -11.126827239990234, "global_step": 384521, "epoch": 2288} {"train_loss": -10.900432586669922, "global_step": 384522, "epoch": 2288} {"train_loss": -11.191691398620605, "global_step": 384523, "epoch": 2288} {"train_loss": -9.544885635375977, "global_step": 384524, "epoch": 2288} {"train_loss": -9.78999137878418, "global_step": 384525, "epoch": 2288} {"train_loss": -10.202640533447266, "global_step": 384526, "epoch": 2288} {"train_loss": -11.406217575073242, "global_step": 384527, "epoch": 2288} {"train_loss": -10.166345596313477, "global_step": 384528, "epoch": 2288} {"train_loss": -10.578557968139648, "global_step": 384529, "epoch": 2288} {"train_loss": -11.669453620910645, "global_step": 384530, "epoch": 2288} {"train_loss": -9.968000411987305, "global_step": 384531, "epoch": 2288} {"train_loss": -11.589365005493164, "global_step": 384532, "epoch": 2288} {"train_loss": -11.45810317993164, "global_step": 384533, "epoch": 2288} {"train_loss": -9.775130271911621, "global_step": 384534, "epoch": 2288} {"train_loss": -11.751581192016602, "global_step": 384535, "epoch": 2288} {"train_loss": -10.126420974731445, "global_step": 384536, "epoch": 2288} {"train_loss": -11.736607551574707, "global_step": 384537, "epoch": 2288} {"train_loss": -10.945199966430664, "global_step": 384538, "epoch": 2288} {"train_loss": -11.739192008972168, "global_step": 384539, "epoch": 2288} {"train_loss": -10.858484268188477, "global_step": 384540, "epoch": 2288} {"train_loss": -11.425765037536621, "global_step": 384541, "epoch": 2288} {"train_loss": -11.081425666809082, "global_step": 384542, "epoch": 2288} {"train_loss": -12.297858238220215, "global_step": 384543, "epoch": 2288} {"train_loss": -11.591739654541016, "global_step": 384544, "epoch": 2288} {"train_loss": -12.264076232910156, "global_step": 384545, "epoch": 2288} {"train_loss": -11.699718475341797, "global_step": 384546, "epoch": 2288} {"train_loss": -11.488417625427246, "global_step": 384547, "epoch": 2288} {"train_loss": -11.887146949768066, "global_step": 384548, "epoch": 2288} {"train_loss": -12.085310935974121, "global_step": 384549, "epoch": 2288} {"train_loss": -12.086494445800781, "global_step": 384550, "epoch": 2288} {"train_loss": -12.03780276434762, "global_step": 384551, "epoch": 2288, "val_loss": 289988.09375} {"train_loss": -12.23959732055664, "global_step": 384552, "epoch": 2289} {"train_loss": -11.803598403930664, "global_step": 384553, "epoch": 2289} {"train_loss": -12.181198120117188, "global_step": 384554, "epoch": 2289} {"train_loss": -12.197433471679688, "global_step": 384555, "epoch": 2289} {"train_loss": -12.053833961486816, "global_step": 384556, "epoch": 2289} {"train_loss": -12.370519638061523, "global_step": 384557, "epoch": 2289} {"train_loss": -11.912040710449219, "global_step": 384558, "epoch": 2289} {"train_loss": -12.554064750671387, "global_step": 384559, "epoch": 2289} {"train_loss": -12.32388973236084, "global_step": 384560, "epoch": 2289} {"train_loss": -12.25528621673584, "global_step": 384561, "epoch": 2289} {"train_loss": -12.436530113220215, "global_step": 384562, "epoch": 2289} {"train_loss": -12.298524856567383, "global_step": 384563, "epoch": 2289} {"train_loss": -12.554537773132324, "global_step": 384564, "epoch": 2289} {"train_loss": -12.433866500854492, "global_step": 384565, "epoch": 2289} {"train_loss": -12.415384292602539, "global_step": 384566, "epoch": 2289} {"train_loss": -12.627038955688477, "global_step": 384567, "epoch": 2289} {"train_loss": -12.645292282104492, "global_step": 384568, "epoch": 2289} {"train_loss": -12.571662902832031, "global_step": 384569, "epoch": 2289} {"train_loss": -12.37514591217041, "global_step": 384570, "epoch": 2289} {"train_loss": -12.355487823486328, "global_step": 384571, "epoch": 2289} {"train_loss": -12.486326217651367, "global_step": 384572, "epoch": 2289} {"train_loss": -12.448773384094238, "global_step": 384573, "epoch": 2289} {"train_loss": -12.422950744628906, "global_step": 384574, "epoch": 2289} {"train_loss": -12.519309997558594, "global_step": 384575, "epoch": 2289} {"train_loss": -12.418366432189941, "global_step": 384576, "epoch": 2289} {"train_loss": -12.581714630126953, "global_step": 384577, "epoch": 2289} {"train_loss": -12.638980865478516, "global_step": 384578, "epoch": 2289} {"train_loss": -12.594284057617188, "global_step": 384579, "epoch": 2289} {"train_loss": -12.468151092529297, "global_step": 384580, "epoch": 2289} {"train_loss": -12.374821662902832, "global_step": 384581, "epoch": 2289} {"train_loss": -12.771573066711426, "global_step": 384582, "epoch": 2289} {"train_loss": -12.61333179473877, "global_step": 384583, "epoch": 2289} {"train_loss": -12.358648300170898, "global_step": 384584, "epoch": 2289} {"train_loss": -12.485803604125977, "global_step": 384585, "epoch": 2289} {"train_loss": -12.61644172668457, "global_step": 384586, "epoch": 2289} {"train_loss": -12.472399711608887, "global_step": 384587, "epoch": 2289} {"train_loss": -12.477729797363281, "global_step": 384588, "epoch": 2289} {"train_loss": -12.372209548950195, "global_step": 384589, "epoch": 2289} {"train_loss": -12.273481369018555, "global_step": 384590, "epoch": 2289} {"train_loss": -12.762931823730469, "global_step": 384591, "epoch": 2289} {"train_loss": -12.337212562561035, "global_step": 384592, "epoch": 2289} {"train_loss": -12.539644241333008, "global_step": 384593, "epoch": 2289} {"train_loss": -12.484716415405273, "global_step": 384594, "epoch": 2289} {"train_loss": -12.326085090637207, "global_step": 384595, "epoch": 2289} {"train_loss": -12.496098518371582, "global_step": 384596, "epoch": 2289} {"train_loss": -12.689854621887207, "global_step": 384597, "epoch": 2289} {"train_loss": -12.088983535766602, "global_step": 384598, "epoch": 2289} {"train_loss": -12.51672649383545, "global_step": 384599, "epoch": 2289} {"train_loss": -12.548505783081055, "global_step": 384600, "epoch": 2289} {"train_loss": -12.172110557556152, "global_step": 384601, "epoch": 2289} {"train_loss": -12.45752239227295, "global_step": 384602, "epoch": 2289} {"train_loss": -12.621688842773438, "global_step": 384603, "epoch": 2289} {"train_loss": -12.230347633361816, "global_step": 384604, "epoch": 2289} {"train_loss": -12.125266075134277, "global_step": 384605, "epoch": 2289} {"train_loss": -12.332744598388672, "global_step": 384606, "epoch": 2289} {"train_loss": -11.755102157592773, "global_step": 384607, "epoch": 2289} {"train_loss": -10.709152221679688, "global_step": 384608, "epoch": 2289} {"train_loss": -11.738397598266602, "global_step": 384609, "epoch": 2289} {"train_loss": -9.942682266235352, "global_step": 384610, "epoch": 2289} {"train_loss": -11.617840766906738, "global_step": 384611, "epoch": 2289} {"train_loss": -12.173051834106445, "global_step": 384612, "epoch": 2289} {"train_loss": -11.479854583740234, "global_step": 384613, "epoch": 2289} {"train_loss": -11.987863540649414, "global_step": 384614, "epoch": 2289} {"train_loss": -12.380632400512695, "global_step": 384615, "epoch": 2289} {"train_loss": -11.671680450439453, "global_step": 384616, "epoch": 2289} {"train_loss": -11.963672637939453, "global_step": 384617, "epoch": 2289} {"train_loss": -10.934233665466309, "global_step": 384618, "epoch": 2289} {"train_loss": -10.936599731445312, "global_step": 384619, "epoch": 2289} {"train_loss": -12.126317977905273, "global_step": 384620, "epoch": 2289} {"train_loss": -11.253335952758789, "global_step": 384621, "epoch": 2289} {"train_loss": -11.503824234008789, "global_step": 384622, "epoch": 2289} {"train_loss": -10.408872604370117, "global_step": 384623, "epoch": 2289} {"train_loss": -9.035091400146484, "global_step": 384624, "epoch": 2289} {"train_loss": -8.806660652160645, "global_step": 384625, "epoch": 2289} {"train_loss": -9.328741073608398, "global_step": 384626, "epoch": 2289} {"train_loss": -10.478708267211914, "global_step": 384627, "epoch": 2289} {"train_loss": -9.189228057861328, "global_step": 384628, "epoch": 2289} {"train_loss": -9.28200912475586, "global_step": 384629, "epoch": 2289} {"train_loss": -10.017759323120117, "global_step": 384630, "epoch": 2289} {"train_loss": -9.79539680480957, "global_step": 384631, "epoch": 2289} {"train_loss": -10.758811950683594, "global_step": 384632, "epoch": 2289} {"train_loss": -9.729743957519531, "global_step": 384633, "epoch": 2289} {"train_loss": -11.765813827514648, "global_step": 384634, "epoch": 2289} {"train_loss": -10.772298812866211, "global_step": 384635, "epoch": 2289} {"train_loss": -10.96823501586914, "global_step": 384636, "epoch": 2289} {"train_loss": -10.56814193725586, "global_step": 384637, "epoch": 2289} {"train_loss": -10.89560317993164, "global_step": 384638, "epoch": 2289} {"train_loss": -9.532249450683594, "global_step": 384639, "epoch": 2289} {"train_loss": -10.697427749633789, "global_step": 384640, "epoch": 2289} {"train_loss": -11.046223640441895, "global_step": 384641, "epoch": 2289} {"train_loss": -11.381561279296875, "global_step": 384642, "epoch": 2289} {"train_loss": -10.932218551635742, "global_step": 384643, "epoch": 2289} {"train_loss": -11.157491683959961, "global_step": 384644, "epoch": 2289} {"train_loss": -11.743246078491211, "global_step": 384645, "epoch": 2289} {"train_loss": -10.619146347045898, "global_step": 384646, "epoch": 2289} {"train_loss": -11.905760765075684, "global_step": 384647, "epoch": 2289} {"train_loss": -11.309294700622559, "global_step": 384648, "epoch": 2289} {"train_loss": -11.477924346923828, "global_step": 384649, "epoch": 2289} {"train_loss": -11.681131362915039, "global_step": 384650, "epoch": 2289} {"train_loss": -11.036705017089844, "global_step": 384651, "epoch": 2289} {"train_loss": -11.17307186126709, "global_step": 384652, "epoch": 2289} {"train_loss": -11.818005561828613, "global_step": 384653, "epoch": 2289} {"train_loss": -11.652204513549805, "global_step": 384654, "epoch": 2289} {"train_loss": -11.593318939208984, "global_step": 384655, "epoch": 2289} {"train_loss": -11.82573127746582, "global_step": 384656, "epoch": 2289} {"train_loss": -11.944780349731445, "global_step": 384657, "epoch": 2289} {"train_loss": -12.00182056427002, "global_step": 384658, "epoch": 2289} {"train_loss": -11.413185119628906, "global_step": 384659, "epoch": 2289} {"train_loss": -11.847591400146484, "global_step": 384660, "epoch": 2289} {"train_loss": -11.861104965209961, "global_step": 384661, "epoch": 2289} {"train_loss": -11.948850631713867, "global_step": 384662, "epoch": 2289} {"train_loss": -11.894338607788086, "global_step": 384663, "epoch": 2289} {"train_loss": -12.020734786987305, "global_step": 384664, "epoch": 2289} {"train_loss": -11.953834533691406, "global_step": 384665, "epoch": 2289} {"train_loss": -11.795003890991211, "global_step": 384666, "epoch": 2289} {"train_loss": -11.935401916503906, "global_step": 384667, "epoch": 2289} {"train_loss": -12.115532875061035, "global_step": 384668, "epoch": 2289} {"train_loss": -11.946840286254883, "global_step": 384669, "epoch": 2289} {"train_loss": -12.097211837768555, "global_step": 384670, "epoch": 2289} {"train_loss": -11.993973731994629, "global_step": 384671, "epoch": 2289} {"train_loss": -12.35283088684082, "global_step": 384672, "epoch": 2289} {"train_loss": -12.09483528137207, "global_step": 384673, "epoch": 2289} {"train_loss": -12.206758499145508, "global_step": 384674, "epoch": 2289} {"train_loss": -12.013352394104004, "global_step": 384675, "epoch": 2289} {"train_loss": -12.250899314880371, "global_step": 384676, "epoch": 2289} {"train_loss": -11.896842002868652, "global_step": 384677, "epoch": 2289} {"train_loss": -12.398723602294922, "global_step": 384678, "epoch": 2289} {"train_loss": -12.242919921875, "global_step": 384679, "epoch": 2289} {"train_loss": -12.409518241882324, "global_step": 384680, "epoch": 2289} {"train_loss": -12.554841995239258, "global_step": 384681, "epoch": 2289} {"train_loss": -12.553840637207031, "global_step": 384682, "epoch": 2289} {"train_loss": -12.217813491821289, "global_step": 384683, "epoch": 2289} {"train_loss": -12.431343078613281, "global_step": 384684, "epoch": 2289} {"train_loss": -12.400898933410645, "global_step": 384685, "epoch": 2289} {"train_loss": -12.370195388793945, "global_step": 384686, "epoch": 2289} {"train_loss": -12.318510055541992, "global_step": 384687, "epoch": 2289} {"train_loss": -12.472099304199219, "global_step": 384688, "epoch": 2289} {"train_loss": -12.480401992797852, "global_step": 384689, "epoch": 2289} {"train_loss": -12.498762130737305, "global_step": 384690, "epoch": 2289} {"train_loss": -12.567756652832031, "global_step": 384691, "epoch": 2289} {"train_loss": -12.436515808105469, "global_step": 384692, "epoch": 2289} {"train_loss": -12.552978515625, "global_step": 384693, "epoch": 2289} {"train_loss": -12.513675689697266, "global_step": 384694, "epoch": 2289} {"train_loss": -12.48398494720459, "global_step": 384695, "epoch": 2289} {"train_loss": -12.36446762084961, "global_step": 384696, "epoch": 2289} {"train_loss": -12.50086498260498, "global_step": 384697, "epoch": 2289} {"train_loss": -12.750776290893555, "global_step": 384698, "epoch": 2289} {"train_loss": -12.385151863098145, "global_step": 384699, "epoch": 2289} {"train_loss": -12.530160903930664, "global_step": 384700, "epoch": 2289} {"train_loss": -12.647680282592773, "global_step": 384701, "epoch": 2289} {"train_loss": -12.521760940551758, "global_step": 384702, "epoch": 2289} {"train_loss": -12.719976425170898, "global_step": 384703, "epoch": 2289} {"train_loss": -12.64745807647705, "global_step": 384704, "epoch": 2289} {"train_loss": -12.434120178222656, "global_step": 384705, "epoch": 2289} {"train_loss": -12.77409553527832, "global_step": 384706, "epoch": 2289} {"train_loss": -12.438722610473633, "global_step": 384707, "epoch": 2289} {"train_loss": -12.722271919250488, "global_step": 384708, "epoch": 2289} {"train_loss": -12.462119102478027, "global_step": 384709, "epoch": 2289} {"train_loss": -12.561808586120605, "global_step": 384710, "epoch": 2289} {"train_loss": -12.798995971679688, "global_step": 384711, "epoch": 2289} {"train_loss": -12.67302131652832, "global_step": 384712, "epoch": 2289} {"train_loss": -12.562328338623047, "global_step": 384713, "epoch": 2289} {"train_loss": -12.839641571044922, "global_step": 384714, "epoch": 2289} {"train_loss": -12.769981384277344, "global_step": 384715, "epoch": 2289} {"train_loss": -12.681768417358398, "global_step": 384716, "epoch": 2289} {"train_loss": -12.492584228515625, "global_step": 384717, "epoch": 2289} {"train_loss": -12.551774978637695, "global_step": 384718, "epoch": 2289} {"train_loss": -11.958933699698676, "global_step": 384719, "epoch": 2289, "val_loss": 291471.96875} {"train_loss": -12.747575759887695, "global_step": 384720, "epoch": 2290} {"train_loss": -12.495745658874512, "global_step": 384721, "epoch": 2290} {"train_loss": -12.620223999023438, "global_step": 384722, "epoch": 2290} {"train_loss": -12.644789695739746, "global_step": 384723, "epoch": 2290} {"train_loss": -12.68073558807373, "global_step": 384724, "epoch": 2290} {"train_loss": -12.663705825805664, "global_step": 384725, "epoch": 2290} {"train_loss": -12.518157958984375, "global_step": 384726, "epoch": 2290} {"train_loss": -12.606300354003906, "global_step": 384727, "epoch": 2290} {"train_loss": -12.818277359008789, "global_step": 384728, "epoch": 2290} {"train_loss": -12.807147979736328, "global_step": 384729, "epoch": 2290} {"train_loss": -12.691938400268555, "global_step": 384730, "epoch": 2290} {"train_loss": -11.97413444519043, "global_step": 384731, "epoch": 2290} {"train_loss": -12.440546035766602, "global_step": 384732, "epoch": 2290} {"train_loss": -12.614448547363281, "global_step": 384733, "epoch": 2290} {"train_loss": -12.52660846710205, "global_step": 384734, "epoch": 2290} {"train_loss": -12.837424278259277, "global_step": 384735, "epoch": 2290} {"train_loss": -12.893369674682617, "global_step": 384736, "epoch": 2290} {"train_loss": -12.471901893615723, "global_step": 384737, "epoch": 2290} {"train_loss": -12.494503021240234, "global_step": 384738, "epoch": 2290} {"train_loss": -12.631702423095703, "global_step": 384739, "epoch": 2290} {"train_loss": -12.646112442016602, "global_step": 384740, "epoch": 2290} {"train_loss": -11.346721649169922, "global_step": 384741, "epoch": 2290} {"train_loss": -10.252803802490234, "global_step": 384742, "epoch": 2290} {"train_loss": -10.827369689941406, "global_step": 384743, "epoch": 2290} {"train_loss": -9.333429336547852, "global_step": 384744, "epoch": 2290} {"train_loss": -10.158356666564941, "global_step": 384745, "epoch": 2290} {"train_loss": -11.014243125915527, "global_step": 384746, "epoch": 2290} {"train_loss": -9.380571365356445, "global_step": 384747, "epoch": 2290} {"train_loss": -9.427111625671387, "global_step": 384748, "epoch": 2290} {"train_loss": -10.44157600402832, "global_step": 384749, "epoch": 2290} {"train_loss": -8.74970531463623, "global_step": 384750, "epoch": 2290} {"train_loss": -9.18782901763916, "global_step": 384751, "epoch": 2290} {"train_loss": -8.980104446411133, "global_step": 384752, "epoch": 2290} {"train_loss": -10.400481224060059, "global_step": 384753, "epoch": 2290} {"train_loss": -10.684417724609375, "global_step": 384754, "epoch": 2290} {"train_loss": -9.216222763061523, "global_step": 384755, "epoch": 2290} {"train_loss": -10.618208885192871, "global_step": 384756, "epoch": 2290} {"train_loss": -10.741083145141602, "global_step": 384757, "epoch": 2290} {"train_loss": -10.117657661437988, "global_step": 384758, "epoch": 2290} {"train_loss": -8.618377685546875, "global_step": 384759, "epoch": 2290} {"train_loss": -10.446083068847656, "global_step": 384760, "epoch": 2290} {"train_loss": -10.825538635253906, "global_step": 384761, "epoch": 2290} {"train_loss": -11.152925491333008, "global_step": 384762, "epoch": 2290} {"train_loss": -11.505084037780762, "global_step": 384763, "epoch": 2290} {"train_loss": -10.979840278625488, "global_step": 384764, "epoch": 2290} {"train_loss": -11.031244277954102, "global_step": 384765, "epoch": 2290} {"train_loss": -11.281820297241211, "global_step": 384766, "epoch": 2290} {"train_loss": -11.436868667602539, "global_step": 384767, "epoch": 2290} {"train_loss": -11.499008178710938, "global_step": 384768, "epoch": 2290} {"train_loss": -12.001575469970703, "global_step": 384769, "epoch": 2290} {"train_loss": -11.25217056274414, "global_step": 384770, "epoch": 2290} {"train_loss": -11.551183700561523, "global_step": 384771, "epoch": 2290} {"train_loss": -11.56382942199707, "global_step": 384772, "epoch": 2290} {"train_loss": -11.780817985534668, "global_step": 384773, "epoch": 2290} {"train_loss": -11.660533905029297, "global_step": 384774, "epoch": 2290} {"train_loss": -11.897850036621094, "global_step": 384775, "epoch": 2290} {"train_loss": -11.898920059204102, "global_step": 384776, "epoch": 2290} {"train_loss": -11.74652099609375, "global_step": 384777, "epoch": 2290} {"train_loss": -11.659894943237305, "global_step": 384778, "epoch": 2290} {"train_loss": -12.127106666564941, "global_step": 384779, "epoch": 2290} {"train_loss": -11.811309814453125, "global_step": 384780, "epoch": 2290} {"train_loss": -11.834943771362305, "global_step": 384781, "epoch": 2290} {"train_loss": -11.785299301147461, "global_step": 384782, "epoch": 2290} {"train_loss": -11.962127685546875, "global_step": 384783, "epoch": 2290} {"train_loss": -11.927812576293945, "global_step": 384784, "epoch": 2290} {"train_loss": -12.082378387451172, "global_step": 384785, "epoch": 2290} {"train_loss": -12.079208374023438, "global_step": 384786, "epoch": 2290} {"train_loss": -12.147001266479492, "global_step": 384787, "epoch": 2290} {"train_loss": -12.268457412719727, "global_step": 384788, "epoch": 2290} {"train_loss": -12.018451690673828, "global_step": 384789, "epoch": 2290} {"train_loss": -11.955742835998535, "global_step": 384790, "epoch": 2290} {"train_loss": -11.76496410369873, "global_step": 384791, "epoch": 2290} {"train_loss": -11.878541946411133, "global_step": 384792, "epoch": 2290} {"train_loss": -11.986252784729004, "global_step": 384793, "epoch": 2290} {"train_loss": -12.04364013671875, "global_step": 384794, "epoch": 2290} {"train_loss": -12.37148666381836, "global_step": 384795, "epoch": 2290} {"train_loss": -11.993937492370605, "global_step": 384796, "epoch": 2290} {"train_loss": -12.508838653564453, "global_step": 384797, "epoch": 2290} {"train_loss": -11.903837203979492, "global_step": 384798, "epoch": 2290} {"train_loss": -12.308588981628418, "global_step": 384799, "epoch": 2290} {"train_loss": -12.312898635864258, "global_step": 384800, "epoch": 2290} {"train_loss": -12.352326393127441, "global_step": 384801, "epoch": 2290} {"train_loss": -12.32897663116455, "global_step": 384802, "epoch": 2290} {"train_loss": -11.981809616088867, "global_step": 384803, "epoch": 2290} {"train_loss": -12.274616241455078, "global_step": 384804, "epoch": 2290} {"train_loss": -12.228239059448242, "global_step": 384805, "epoch": 2290} {"train_loss": -12.352816581726074, "global_step": 384806, "epoch": 2290} {"train_loss": -12.291056632995605, "global_step": 384807, "epoch": 2290} {"train_loss": -12.143199920654297, "global_step": 384808, "epoch": 2290} {"train_loss": -12.441686630249023, "global_step": 384809, "epoch": 2290} {"train_loss": -12.05735969543457, "global_step": 384810, "epoch": 2290} {"train_loss": -12.138771057128906, "global_step": 384811, "epoch": 2290} {"train_loss": -12.403987884521484, "global_step": 384812, "epoch": 2290} {"train_loss": -12.061415672302246, "global_step": 384813, "epoch": 2290} {"train_loss": -12.30876350402832, "global_step": 384814, "epoch": 2290} {"train_loss": -12.201580047607422, "global_step": 384815, "epoch": 2290} {"train_loss": -12.48197078704834, "global_step": 384816, "epoch": 2290} {"train_loss": -12.132977485656738, "global_step": 384817, "epoch": 2290} {"train_loss": -12.476499557495117, "global_step": 384818, "epoch": 2290} {"train_loss": -12.392542839050293, "global_step": 384819, "epoch": 2290} {"train_loss": -12.43134880065918, "global_step": 384820, "epoch": 2290} {"train_loss": -12.385522842407227, "global_step": 384821, "epoch": 2290} {"train_loss": -12.529770851135254, "global_step": 384822, "epoch": 2290} {"train_loss": -12.438966751098633, "global_step": 384823, "epoch": 2290} {"train_loss": -12.337574005126953, "global_step": 384824, "epoch": 2290} {"train_loss": -12.209025382995605, "global_step": 384825, "epoch": 2290} {"train_loss": -12.409088134765625, "global_step": 384826, "epoch": 2290} {"train_loss": -12.467735290527344, "global_step": 384827, "epoch": 2290} {"train_loss": -12.186857223510742, "global_step": 384828, "epoch": 2290} {"train_loss": -12.31533432006836, "global_step": 384829, "epoch": 2290} {"train_loss": -12.356034278869629, "global_step": 384830, "epoch": 2290} {"train_loss": -12.6080322265625, "global_step": 384831, "epoch": 2290} {"train_loss": -12.080953598022461, "global_step": 384832, "epoch": 2290} {"train_loss": -12.23757266998291, "global_step": 384833, "epoch": 2290} {"train_loss": -12.465902328491211, "global_step": 384834, "epoch": 2290} {"train_loss": -12.303621292114258, "global_step": 384835, "epoch": 2290} {"train_loss": -12.722265243530273, "global_step": 384836, "epoch": 2290} {"train_loss": -11.804008483886719, "global_step": 384837, "epoch": 2290} {"train_loss": -12.185958862304688, "global_step": 384838, "epoch": 2290} {"train_loss": -12.290304183959961, "global_step": 384839, "epoch": 2290} {"train_loss": -11.844820022583008, "global_step": 384840, "epoch": 2290} {"train_loss": -12.362018585205078, "global_step": 384841, "epoch": 2290} {"train_loss": -11.356571197509766, "global_step": 384842, "epoch": 2290} {"train_loss": -11.584085464477539, "global_step": 384843, "epoch": 2290} {"train_loss": -11.970281600952148, "global_step": 384844, "epoch": 2290} {"train_loss": -11.394352912902832, "global_step": 384845, "epoch": 2290} {"train_loss": -11.856407165527344, "global_step": 384846, "epoch": 2290} {"train_loss": -11.236831665039062, "global_step": 384847, "epoch": 2290} {"train_loss": -11.000865936279297, "global_step": 384848, "epoch": 2290} {"train_loss": -11.131343841552734, "global_step": 384849, "epoch": 2290} {"train_loss": -10.480329513549805, "global_step": 384850, "epoch": 2290} {"train_loss": -11.48826789855957, "global_step": 384851, "epoch": 2290} {"train_loss": -10.548354148864746, "global_step": 384852, "epoch": 2290} {"train_loss": -10.494468688964844, "global_step": 384853, "epoch": 2290} {"train_loss": -11.074686050415039, "global_step": 384854, "epoch": 2290} {"train_loss": -10.00028133392334, "global_step": 384855, "epoch": 2290} {"train_loss": -11.240974426269531, "global_step": 384856, "epoch": 2290} {"train_loss": -10.188020706176758, "global_step": 384857, "epoch": 2290} {"train_loss": -10.032278060913086, "global_step": 384858, "epoch": 2290} {"train_loss": -11.231180191040039, "global_step": 384859, "epoch": 2290} {"train_loss": -11.050493240356445, "global_step": 384860, "epoch": 2290} {"train_loss": -11.073354721069336, "global_step": 384861, "epoch": 2290} {"train_loss": -11.681221008300781, "global_step": 384862, "epoch": 2290} {"train_loss": -11.458547592163086, "global_step": 384863, "epoch": 2290} {"train_loss": -11.614452362060547, "global_step": 384864, "epoch": 2290} {"train_loss": -11.623361587524414, "global_step": 384865, "epoch": 2290} {"train_loss": -11.963434219360352, "global_step": 384866, "epoch": 2290} {"train_loss": -11.00659465789795, "global_step": 384867, "epoch": 2290} {"train_loss": -11.130313873291016, "global_step": 384868, "epoch": 2290} {"train_loss": -11.934532165527344, "global_step": 384869, "epoch": 2290} {"train_loss": -11.550036430358887, "global_step": 384870, "epoch": 2290} {"train_loss": -12.043169021606445, "global_step": 384871, "epoch": 2290} {"train_loss": -11.904611587524414, "global_step": 384872, "epoch": 2290} {"train_loss": -11.779661178588867, "global_step": 384873, "epoch": 2290} {"train_loss": -11.699357986450195, "global_step": 384874, "epoch": 2290} {"train_loss": -12.209230422973633, "global_step": 384875, "epoch": 2290} {"train_loss": -11.935137748718262, "global_step": 384876, "epoch": 2290} {"train_loss": -12.15713119506836, "global_step": 384877, "epoch": 2290} {"train_loss": -11.984724044799805, "global_step": 384878, "epoch": 2290} {"train_loss": -12.269418716430664, "global_step": 384879, "epoch": 2290} {"train_loss": -12.235843658447266, "global_step": 384880, "epoch": 2290} {"train_loss": -11.918208122253418, "global_step": 384881, "epoch": 2290} {"train_loss": -12.187440872192383, "global_step": 384882, "epoch": 2290} {"train_loss": -12.28376579284668, "global_step": 384883, "epoch": 2290} {"train_loss": -12.010729789733887, "global_step": 384884, "epoch": 2290} {"train_loss": -12.333086967468262, "global_step": 384885, "epoch": 2290} {"train_loss": -12.342316627502441, "global_step": 384886, "epoch": 2290} {"train_loss": -11.730566314288549, "global_step": 384887, "epoch": 2290, "val_loss": 293243.375, "train_action_mse_error": 1.5037158727645874} {"train_loss": -12.250960350036621, "global_step": 384888, "epoch": 2291} {"train_loss": -12.303467750549316, "global_step": 384889, "epoch": 2291} {"train_loss": -12.431523323059082, "global_step": 384890, "epoch": 2291} {"train_loss": -12.191534042358398, "global_step": 384891, "epoch": 2291} {"train_loss": -12.389791488647461, "global_step": 384892, "epoch": 2291} {"train_loss": -12.174433708190918, "global_step": 384893, "epoch": 2291} {"train_loss": -12.371353149414062, "global_step": 384894, "epoch": 2291} {"train_loss": -12.144135475158691, "global_step": 384895, "epoch": 2291} {"train_loss": -12.435701370239258, "global_step": 384896, "epoch": 2291} {"train_loss": -12.250042915344238, "global_step": 384897, "epoch": 2291} {"train_loss": -12.22718620300293, "global_step": 384898, "epoch": 2291} {"train_loss": -12.363828659057617, "global_step": 384899, "epoch": 2291} {"train_loss": -12.486180305480957, "global_step": 384900, "epoch": 2291} {"train_loss": -12.279775619506836, "global_step": 384901, "epoch": 2291} {"train_loss": -12.488659858703613, "global_step": 384902, "epoch": 2291} {"train_loss": -12.231213569641113, "global_step": 384903, "epoch": 2291} {"train_loss": -12.428007125854492, "global_step": 384904, "epoch": 2291} {"train_loss": -12.531464576721191, "global_step": 384905, "epoch": 2291} {"train_loss": -12.36822509765625, "global_step": 384906, "epoch": 2291} {"train_loss": -12.438573837280273, "global_step": 384907, "epoch": 2291} {"train_loss": -12.394289016723633, "global_step": 384908, "epoch": 2291} {"train_loss": -12.238616943359375, "global_step": 384909, "epoch": 2291} {"train_loss": -12.552159309387207, "global_step": 384910, "epoch": 2291} {"train_loss": -12.373603820800781, "global_step": 384911, "epoch": 2291} {"train_loss": -12.563250541687012, "global_step": 384912, "epoch": 2291} {"train_loss": -12.138258934020996, "global_step": 384913, "epoch": 2291} {"train_loss": -12.58968448638916, "global_step": 384914, "epoch": 2291} {"train_loss": -12.354230880737305, "global_step": 384915, "epoch": 2291} {"train_loss": -12.005590438842773, "global_step": 384916, "epoch": 2291} {"train_loss": -12.403312683105469, "global_step": 384917, "epoch": 2291} {"train_loss": -12.420391082763672, "global_step": 384918, "epoch": 2291} {"train_loss": -12.414085388183594, "global_step": 384919, "epoch": 2291} {"train_loss": -12.331360816955566, "global_step": 384920, "epoch": 2291} {"train_loss": -12.718555450439453, "global_step": 384921, "epoch": 2291} {"train_loss": -12.461512565612793, "global_step": 384922, "epoch": 2291} {"train_loss": -12.544279098510742, "global_step": 384923, "epoch": 2291} {"train_loss": -12.506103515625, "global_step": 384924, "epoch": 2291} {"train_loss": -12.595966339111328, "global_step": 384925, "epoch": 2291} {"train_loss": -12.494379997253418, "global_step": 384926, "epoch": 2291} {"train_loss": -12.404053688049316, "global_step": 384927, "epoch": 2291} {"train_loss": -12.513050079345703, "global_step": 384928, "epoch": 2291} {"train_loss": -12.595163345336914, "global_step": 384929, "epoch": 2291} {"train_loss": -12.542293548583984, "global_step": 384930, "epoch": 2291} {"train_loss": -12.679004669189453, "global_step": 384931, "epoch": 2291} {"train_loss": -12.4188814163208, "global_step": 384932, "epoch": 2291} {"train_loss": -12.622371673583984, "global_step": 384933, "epoch": 2291} {"train_loss": -12.515596389770508, "global_step": 384934, "epoch": 2291} {"train_loss": -12.617792129516602, "global_step": 384935, "epoch": 2291} {"train_loss": -12.511588096618652, "global_step": 384936, "epoch": 2291} {"train_loss": -12.358613014221191, "global_step": 384937, "epoch": 2291} {"train_loss": -12.655162811279297, "global_step": 384938, "epoch": 2291} {"train_loss": -12.374349594116211, "global_step": 384939, "epoch": 2291} {"train_loss": -12.726425170898438, "global_step": 384940, "epoch": 2291} {"train_loss": -12.804801940917969, "global_step": 384941, "epoch": 2291} {"train_loss": -12.583078384399414, "global_step": 384942, "epoch": 2291} {"train_loss": -12.435956954956055, "global_step": 384943, "epoch": 2291} {"train_loss": -12.682886123657227, "global_step": 384944, "epoch": 2291} {"train_loss": -12.510419845581055, "global_step": 384945, "epoch": 2291} {"train_loss": -12.881721496582031, "global_step": 384946, "epoch": 2291} {"train_loss": -12.687625885009766, "global_step": 384947, "epoch": 2291} {"train_loss": -12.437952995300293, "global_step": 384948, "epoch": 2291} {"train_loss": -12.726557731628418, "global_step": 384949, "epoch": 2291} {"train_loss": -12.591402053833008, "global_step": 384950, "epoch": 2291} {"train_loss": -12.144745826721191, "global_step": 384951, "epoch": 2291} {"train_loss": -11.896139144897461, "global_step": 384952, "epoch": 2291} {"train_loss": -12.672784805297852, "global_step": 384953, "epoch": 2291} {"train_loss": -12.274988174438477, "global_step": 384954, "epoch": 2291} {"train_loss": -11.6483736038208, "global_step": 384955, "epoch": 2291} {"train_loss": -12.597532272338867, "global_step": 384956, "epoch": 2291} {"train_loss": -11.984293937683105, "global_step": 384957, "epoch": 2291} {"train_loss": -11.79869270324707, "global_step": 384958, "epoch": 2291} {"train_loss": -11.530109405517578, "global_step": 384959, "epoch": 2291} {"train_loss": -11.539345741271973, "global_step": 384960, "epoch": 2291} {"train_loss": -12.591297149658203, "global_step": 384961, "epoch": 2291} {"train_loss": -12.50759506225586, "global_step": 384962, "epoch": 2291} {"train_loss": -12.011659622192383, "global_step": 384963, "epoch": 2291} {"train_loss": -11.986146926879883, "global_step": 384964, "epoch": 2291} {"train_loss": -12.510444641113281, "global_step": 384965, "epoch": 2291} {"train_loss": -12.433062553405762, "global_step": 384966, "epoch": 2291} {"train_loss": -12.324186325073242, "global_step": 384967, "epoch": 2291} {"train_loss": -11.676191329956055, "global_step": 384968, "epoch": 2291} {"train_loss": -12.60099983215332, "global_step": 384969, "epoch": 2291} {"train_loss": -10.552684783935547, "global_step": 384970, "epoch": 2291} {"train_loss": -11.369743347167969, "global_step": 384971, "epoch": 2291} {"train_loss": -12.13614273071289, "global_step": 384972, "epoch": 2291} {"train_loss": -11.802717208862305, "global_step": 384973, "epoch": 2291} {"train_loss": -11.754936218261719, "global_step": 384974, "epoch": 2291} {"train_loss": -11.818746566772461, "global_step": 384975, "epoch": 2291} {"train_loss": -10.963830947875977, "global_step": 384976, "epoch": 2291} {"train_loss": -11.62026309967041, "global_step": 384977, "epoch": 2291} {"train_loss": -11.825891494750977, "global_step": 384978, "epoch": 2291} {"train_loss": -10.733972549438477, "global_step": 384979, "epoch": 2291} {"train_loss": -11.396530151367188, "global_step": 384980, "epoch": 2291} {"train_loss": -11.75436782836914, "global_step": 384981, "epoch": 2291} {"train_loss": -10.159233093261719, "global_step": 384982, "epoch": 2291} {"train_loss": -11.732911109924316, "global_step": 384983, "epoch": 2291} {"train_loss": -11.044567108154297, "global_step": 384984, "epoch": 2291} {"train_loss": -11.144549369812012, "global_step": 384985, "epoch": 2291} {"train_loss": -12.196112632751465, "global_step": 384986, "epoch": 2291} {"train_loss": -11.765168190002441, "global_step": 384987, "epoch": 2291} {"train_loss": -11.994548797607422, "global_step": 384988, "epoch": 2291} {"train_loss": -12.00300407409668, "global_step": 384989, "epoch": 2291} {"train_loss": -11.256091117858887, "global_step": 384990, "epoch": 2291} {"train_loss": -12.077737808227539, "global_step": 384991, "epoch": 2291} {"train_loss": -11.126547813415527, "global_step": 384992, "epoch": 2291} {"train_loss": -11.932233810424805, "global_step": 384993, "epoch": 2291} {"train_loss": -11.140636444091797, "global_step": 384994, "epoch": 2291} {"train_loss": -11.648895263671875, "global_step": 384995, "epoch": 2291} {"train_loss": -11.876882553100586, "global_step": 384996, "epoch": 2291} {"train_loss": -12.123990058898926, "global_step": 384997, "epoch": 2291} {"train_loss": -12.064718246459961, "global_step": 384998, "epoch": 2291} {"train_loss": -12.225645065307617, "global_step": 384999, "epoch": 2291} {"train_loss": -11.874480247497559, "global_step": 385000, "epoch": 2291} {"train_loss": -11.836061477661133, "global_step": 385001, "epoch": 2291} {"train_loss": -12.12269401550293, "global_step": 385002, "epoch": 2291} {"train_loss": -11.014208793640137, "global_step": 385003, "epoch": 2291} {"train_loss": -11.737279891967773, "global_step": 385004, "epoch": 2291} {"train_loss": -11.001977920532227, "global_step": 385005, "epoch": 2291} {"train_loss": -11.010122299194336, "global_step": 385006, "epoch": 2291} {"train_loss": -11.981523513793945, "global_step": 385007, "epoch": 2291} {"train_loss": -11.12702751159668, "global_step": 385008, "epoch": 2291} {"train_loss": -12.261598587036133, "global_step": 385009, "epoch": 2291} {"train_loss": -11.369905471801758, "global_step": 385010, "epoch": 2291} {"train_loss": -12.155046463012695, "global_step": 385011, "epoch": 2291} {"train_loss": -12.051920890808105, "global_step": 385012, "epoch": 2291} {"train_loss": -12.038676261901855, "global_step": 385013, "epoch": 2291} {"train_loss": -12.212505340576172, "global_step": 385014, "epoch": 2291} {"train_loss": -12.013069152832031, "global_step": 385015, "epoch": 2291} {"train_loss": -11.801142692565918, "global_step": 385016, "epoch": 2291} {"train_loss": -12.370506286621094, "global_step": 385017, "epoch": 2291} {"train_loss": -12.265392303466797, "global_step": 385018, "epoch": 2291} {"train_loss": -11.927592277526855, "global_step": 385019, "epoch": 2291} {"train_loss": -12.015972137451172, "global_step": 385020, "epoch": 2291} {"train_loss": -12.258142471313477, "global_step": 385021, "epoch": 2291} {"train_loss": -11.85699462890625, "global_step": 385022, "epoch": 2291} {"train_loss": -12.312236785888672, "global_step": 385023, "epoch": 2291} {"train_loss": -11.728228569030762, "global_step": 385024, "epoch": 2291} {"train_loss": -12.604029655456543, "global_step": 385025, "epoch": 2291} {"train_loss": -11.899238586425781, "global_step": 385026, "epoch": 2291} {"train_loss": -12.008504867553711, "global_step": 385027, "epoch": 2291} {"train_loss": -11.93277359008789, "global_step": 385028, "epoch": 2291} {"train_loss": -11.733724594116211, "global_step": 385029, "epoch": 2291} {"train_loss": -12.329509735107422, "global_step": 385030, "epoch": 2291} {"train_loss": -11.893939971923828, "global_step": 385031, "epoch": 2291} {"train_loss": -12.117673873901367, "global_step": 385032, "epoch": 2291} {"train_loss": -11.850143432617188, "global_step": 385033, "epoch": 2291} {"train_loss": -11.71408462524414, "global_step": 385034, "epoch": 2291} {"train_loss": -12.017267227172852, "global_step": 385035, "epoch": 2291} {"train_loss": -12.231804847717285, "global_step": 385036, "epoch": 2291} {"train_loss": -12.062012672424316, "global_step": 385037, "epoch": 2291} {"train_loss": -11.86708927154541, "global_step": 385038, "epoch": 2291} {"train_loss": -11.439130783081055, "global_step": 385039, "epoch": 2291} {"train_loss": -12.225746154785156, "global_step": 385040, "epoch": 2291} {"train_loss": -11.857770919799805, "global_step": 385041, "epoch": 2291} {"train_loss": -12.018426895141602, "global_step": 385042, "epoch": 2291} {"train_loss": -12.21570110321045, "global_step": 385043, "epoch": 2291} {"train_loss": -12.028038024902344, "global_step": 385044, "epoch": 2291} {"train_loss": -11.309109687805176, "global_step": 385045, "epoch": 2291} {"train_loss": -12.0943021774292, "global_step": 385046, "epoch": 2291} {"train_loss": -11.286532402038574, "global_step": 385047, "epoch": 2291} {"train_loss": -11.325753211975098, "global_step": 385048, "epoch": 2291} {"train_loss": -11.498943328857422, "global_step": 385049, "epoch": 2291} {"train_loss": -10.931742668151855, "global_step": 385050, "epoch": 2291} {"train_loss": -11.882641792297363, "global_step": 385051, "epoch": 2291} {"train_loss": -11.365961074829102, "global_step": 385052, "epoch": 2291} {"train_loss": -11.60478687286377, "global_step": 385053, "epoch": 2291} {"train_loss": -11.785036087036133, "global_step": 385054, "epoch": 2291} {"train_loss": -12.059317248208183, "global_step": 385055, "epoch": 2291, "val_loss": 294143.0} {"train_loss": -11.829193115234375, "global_step": 385056, "epoch": 2292} {"train_loss": -11.93411636352539, "global_step": 385057, "epoch": 2292} {"train_loss": -11.688565254211426, "global_step": 385058, "epoch": 2292} {"train_loss": -11.735052108764648, "global_step": 385059, "epoch": 2292} {"train_loss": -11.768730163574219, "global_step": 385060, "epoch": 2292} {"train_loss": -11.676727294921875, "global_step": 385061, "epoch": 2292} {"train_loss": -12.124950408935547, "global_step": 385062, "epoch": 2292} {"train_loss": -11.580777168273926, "global_step": 385063, "epoch": 2292} {"train_loss": -12.414100646972656, "global_step": 385064, "epoch": 2292} {"train_loss": -11.980226516723633, "global_step": 385065, "epoch": 2292} {"train_loss": -12.0233793258667, "global_step": 385066, "epoch": 2292} {"train_loss": -11.914645195007324, "global_step": 385067, "epoch": 2292} {"train_loss": -11.883676528930664, "global_step": 385068, "epoch": 2292} {"train_loss": -12.259904861450195, "global_step": 385069, "epoch": 2292} {"train_loss": -11.162866592407227, "global_step": 385070, "epoch": 2292} {"train_loss": -12.20781135559082, "global_step": 385071, "epoch": 2292} {"train_loss": -11.44399642944336, "global_step": 385072, "epoch": 2292} {"train_loss": -11.75981616973877, "global_step": 385073, "epoch": 2292} {"train_loss": -12.352071762084961, "global_step": 385074, "epoch": 2292} {"train_loss": -11.966071128845215, "global_step": 385075, "epoch": 2292} {"train_loss": -12.020885467529297, "global_step": 385076, "epoch": 2292} {"train_loss": -12.322381973266602, "global_step": 385077, "epoch": 2292} {"train_loss": -12.216545104980469, "global_step": 385078, "epoch": 2292} {"train_loss": -11.989067077636719, "global_step": 385079, "epoch": 2292} {"train_loss": -12.32568645477295, "global_step": 385080, "epoch": 2292} {"train_loss": -12.160754203796387, "global_step": 385081, "epoch": 2292} {"train_loss": -12.088281631469727, "global_step": 385082, "epoch": 2292} {"train_loss": -12.085671424865723, "global_step": 385083, "epoch": 2292} {"train_loss": -11.985530853271484, "global_step": 385084, "epoch": 2292} {"train_loss": -12.07461166381836, "global_step": 385085, "epoch": 2292} {"train_loss": -12.61387825012207, "global_step": 385086, "epoch": 2292} {"train_loss": -12.39295482635498, "global_step": 385087, "epoch": 2292} {"train_loss": -12.480958938598633, "global_step": 385088, "epoch": 2292} {"train_loss": -12.48802661895752, "global_step": 385089, "epoch": 2292} {"train_loss": -12.811870574951172, "global_step": 385090, "epoch": 2292} {"train_loss": -12.459238052368164, "global_step": 385091, "epoch": 2292} {"train_loss": -12.572860717773438, "global_step": 385092, "epoch": 2292} {"train_loss": -12.54340648651123, "global_step": 385093, "epoch": 2292} {"train_loss": -12.493371963500977, "global_step": 385094, "epoch": 2292} {"train_loss": -12.462974548339844, "global_step": 385095, "epoch": 2292} {"train_loss": -12.58035945892334, "global_step": 385096, "epoch": 2292} {"train_loss": -12.545982360839844, "global_step": 385097, "epoch": 2292} {"train_loss": -12.535432815551758, "global_step": 385098, "epoch": 2292} {"train_loss": -12.470650672912598, "global_step": 385099, "epoch": 2292} {"train_loss": -12.560262680053711, "global_step": 385100, "epoch": 2292} {"train_loss": -12.375027656555176, "global_step": 385101, "epoch": 2292} {"train_loss": -12.364625930786133, "global_step": 385102, "epoch": 2292} {"train_loss": -12.370088577270508, "global_step": 385103, "epoch": 2292} {"train_loss": -12.487911224365234, "global_step": 385104, "epoch": 2292} {"train_loss": -12.46246337890625, "global_step": 385105, "epoch": 2292} {"train_loss": -12.497428894042969, "global_step": 385106, "epoch": 2292} {"train_loss": -12.253704071044922, "global_step": 385107, "epoch": 2292} {"train_loss": -12.37435245513916, "global_step": 385108, "epoch": 2292} {"train_loss": -12.597040176391602, "global_step": 385109, "epoch": 2292} {"train_loss": -12.046411514282227, "global_step": 385110, "epoch": 2292} {"train_loss": -12.567500114440918, "global_step": 385111, "epoch": 2292} {"train_loss": -12.143680572509766, "global_step": 385112, "epoch": 2292} {"train_loss": -12.531785011291504, "global_step": 385113, "epoch": 2292} {"train_loss": -12.265430450439453, "global_step": 385114, "epoch": 2292} {"train_loss": -12.584638595581055, "global_step": 385115, "epoch": 2292} {"train_loss": -12.22883415222168, "global_step": 385116, "epoch": 2292} {"train_loss": -12.5968656539917, "global_step": 385117, "epoch": 2292} {"train_loss": -11.705678939819336, "global_step": 385118, "epoch": 2292} {"train_loss": -12.076570510864258, "global_step": 385119, "epoch": 2292} {"train_loss": -10.936210632324219, "global_step": 385120, "epoch": 2292} {"train_loss": -11.29786491394043, "global_step": 385121, "epoch": 2292} {"train_loss": -11.284875869750977, "global_step": 385122, "epoch": 2292} {"train_loss": -11.012035369873047, "global_step": 385123, "epoch": 2292} {"train_loss": -9.558351516723633, "global_step": 385124, "epoch": 2292} {"train_loss": -10.288090705871582, "global_step": 385125, "epoch": 2292} {"train_loss": -11.215021133422852, "global_step": 385126, "epoch": 2292} {"train_loss": -11.2484130859375, "global_step": 385127, "epoch": 2292} {"train_loss": -10.283506393432617, "global_step": 385128, "epoch": 2292} {"train_loss": -11.733039855957031, "global_step": 385129, "epoch": 2292} {"train_loss": -10.47072696685791, "global_step": 385130, "epoch": 2292} {"train_loss": -9.9940185546875, "global_step": 385131, "epoch": 2292} {"train_loss": -11.0162992477417, "global_step": 385132, "epoch": 2292} {"train_loss": -9.925829887390137, "global_step": 385133, "epoch": 2292} {"train_loss": -10.512046813964844, "global_step": 385134, "epoch": 2292} {"train_loss": -9.398580551147461, "global_step": 385135, "epoch": 2292} {"train_loss": -11.444524765014648, "global_step": 385136, "epoch": 2292} {"train_loss": -9.431285858154297, "global_step": 385137, "epoch": 2292} {"train_loss": -9.302718162536621, "global_step": 385138, "epoch": 2292} {"train_loss": -10.339362144470215, "global_step": 385139, "epoch": 2292} {"train_loss": -10.345943450927734, "global_step": 385140, "epoch": 2292} {"train_loss": -9.53938102722168, "global_step": 385141, "epoch": 2292} {"train_loss": -11.360685348510742, "global_step": 385142, "epoch": 2292} {"train_loss": -9.186635971069336, "global_step": 385143, "epoch": 2292} {"train_loss": -9.881839752197266, "global_step": 385144, "epoch": 2292} {"train_loss": -10.384506225585938, "global_step": 385145, "epoch": 2292} {"train_loss": -11.483437538146973, "global_step": 385146, "epoch": 2292} {"train_loss": -10.586091995239258, "global_step": 385147, "epoch": 2292} {"train_loss": -11.185250282287598, "global_step": 385148, "epoch": 2292} {"train_loss": -11.147216796875, "global_step": 385149, "epoch": 2292} {"train_loss": -11.120012283325195, "global_step": 385150, "epoch": 2292} {"train_loss": -11.068049430847168, "global_step": 385151, "epoch": 2292} {"train_loss": -11.332874298095703, "global_step": 385152, "epoch": 2292} {"train_loss": -10.522268295288086, "global_step": 385153, "epoch": 2292} {"train_loss": -11.721207618713379, "global_step": 385154, "epoch": 2292} {"train_loss": -11.470137596130371, "global_step": 385155, "epoch": 2292} {"train_loss": -11.634832382202148, "global_step": 385156, "epoch": 2292} {"train_loss": -11.682907104492188, "global_step": 385157, "epoch": 2292} {"train_loss": -11.32887077331543, "global_step": 385158, "epoch": 2292} {"train_loss": -11.71565055847168, "global_step": 385159, "epoch": 2292} {"train_loss": -11.741911888122559, "global_step": 385160, "epoch": 2292} {"train_loss": -11.611568450927734, "global_step": 385161, "epoch": 2292} {"train_loss": -11.940814971923828, "global_step": 385162, "epoch": 2292} {"train_loss": -11.66301155090332, "global_step": 385163, "epoch": 2292} {"train_loss": -11.934133529663086, "global_step": 385164, "epoch": 2292} {"train_loss": -12.259234428405762, "global_step": 385165, "epoch": 2292} {"train_loss": -11.899245262145996, "global_step": 385166, "epoch": 2292} {"train_loss": -11.990196228027344, "global_step": 385167, "epoch": 2292} {"train_loss": -11.926199913024902, "global_step": 385168, "epoch": 2292} {"train_loss": -11.135313034057617, "global_step": 385169, "epoch": 2292} {"train_loss": -11.977710723876953, "global_step": 385170, "epoch": 2292} {"train_loss": -11.744455337524414, "global_step": 385171, "epoch": 2292} {"train_loss": -12.019181251525879, "global_step": 385172, "epoch": 2292} {"train_loss": -11.916885375976562, "global_step": 385173, "epoch": 2292} {"train_loss": -11.958868026733398, "global_step": 385174, "epoch": 2292} {"train_loss": -11.657380104064941, "global_step": 385175, "epoch": 2292} {"train_loss": -12.286735534667969, "global_step": 385176, "epoch": 2292} {"train_loss": -12.032745361328125, "global_step": 385177, "epoch": 2292} {"train_loss": -12.288982391357422, "global_step": 385178, "epoch": 2292} {"train_loss": -11.631102561950684, "global_step": 385179, "epoch": 2292} {"train_loss": -12.114620208740234, "global_step": 385180, "epoch": 2292} {"train_loss": -12.27670669555664, "global_step": 385181, "epoch": 2292} {"train_loss": -12.266134262084961, "global_step": 385182, "epoch": 2292} {"train_loss": -12.177806854248047, "global_step": 385183, "epoch": 2292} {"train_loss": -12.26467514038086, "global_step": 385184, "epoch": 2292} {"train_loss": -11.96799087524414, "global_step": 385185, "epoch": 2292} {"train_loss": -12.207578659057617, "global_step": 385186, "epoch": 2292} {"train_loss": -12.253030776977539, "global_step": 385187, "epoch": 2292} {"train_loss": -11.84091567993164, "global_step": 385188, "epoch": 2292} {"train_loss": -12.124968528747559, "global_step": 385189, "epoch": 2292} {"train_loss": -12.03286361694336, "global_step": 385190, "epoch": 2292} {"train_loss": -12.116692543029785, "global_step": 385191, "epoch": 2292} {"train_loss": -12.247164726257324, "global_step": 385192, "epoch": 2292} {"train_loss": -12.071444511413574, "global_step": 385193, "epoch": 2292} {"train_loss": -12.033827781677246, "global_step": 385194, "epoch": 2292} {"train_loss": -12.43906021118164, "global_step": 385195, "epoch": 2292} {"train_loss": -12.16341781616211, "global_step": 385196, "epoch": 2292} {"train_loss": -12.233170509338379, "global_step": 385197, "epoch": 2292} {"train_loss": -12.376699447631836, "global_step": 385198, "epoch": 2292} {"train_loss": -12.28333568572998, "global_step": 385199, "epoch": 2292} {"train_loss": -12.224967956542969, "global_step": 385200, "epoch": 2292} {"train_loss": -12.252693176269531, "global_step": 385201, "epoch": 2292} {"train_loss": -12.47195816040039, "global_step": 385202, "epoch": 2292} {"train_loss": -12.567288398742676, "global_step": 385203, "epoch": 2292} {"train_loss": -12.213056564331055, "global_step": 385204, "epoch": 2292} {"train_loss": -12.487748146057129, "global_step": 385205, "epoch": 2292} {"train_loss": -12.078414916992188, "global_step": 385206, "epoch": 2292} {"train_loss": -12.250259399414062, "global_step": 385207, "epoch": 2292} {"train_loss": -11.992732048034668, "global_step": 385208, "epoch": 2292} {"train_loss": -12.418807983398438, "global_step": 385209, "epoch": 2292} {"train_loss": -12.032600402832031, "global_step": 385210, "epoch": 2292} {"train_loss": -12.182941436767578, "global_step": 385211, "epoch": 2292} {"train_loss": -12.252985000610352, "global_step": 385212, "epoch": 2292} {"train_loss": -11.934268951416016, "global_step": 385213, "epoch": 2292} {"train_loss": -12.124261856079102, "global_step": 385214, "epoch": 2292} {"train_loss": -12.0425443649292, "global_step": 385215, "epoch": 2292} {"train_loss": -12.294905662536621, "global_step": 385216, "epoch": 2292} {"train_loss": -11.982640266418457, "global_step": 385217, "epoch": 2292} {"train_loss": -11.900571823120117, "global_step": 385218, "epoch": 2292} {"train_loss": -12.34986686706543, "global_step": 385219, "epoch": 2292} {"train_loss": -11.808006286621094, "global_step": 385220, "epoch": 2292} {"train_loss": -12.12273120880127, "global_step": 385221, "epoch": 2292} {"train_loss": -11.972373962402344, "global_step": 385222, "epoch": 2292} {"train_loss": -11.809299900418235, "global_step": 385223, "epoch": 2292, "val_loss": 294253.3125} {"train_loss": -10.882490158081055, "global_step": 385224, "epoch": 2293} {"train_loss": -11.992647171020508, "global_step": 385225, "epoch": 2293} {"train_loss": -12.255191802978516, "global_step": 385226, "epoch": 2293} {"train_loss": -12.10244083404541, "global_step": 385227, "epoch": 2293} {"train_loss": -12.181317329406738, "global_step": 385228, "epoch": 2293} {"train_loss": -12.115740776062012, "global_step": 385229, "epoch": 2293} {"train_loss": -11.790956497192383, "global_step": 385230, "epoch": 2293} {"train_loss": -12.495393753051758, "global_step": 385231, "epoch": 2293} {"train_loss": -12.051268577575684, "global_step": 385232, "epoch": 2293} {"train_loss": -12.168254852294922, "global_step": 385233, "epoch": 2293} {"train_loss": -12.09478759765625, "global_step": 385234, "epoch": 2293} {"train_loss": -12.247013092041016, "global_step": 385235, "epoch": 2293} {"train_loss": -12.348787307739258, "global_step": 385236, "epoch": 2293} {"train_loss": -12.27480697631836, "global_step": 385237, "epoch": 2293} {"train_loss": -12.537374496459961, "global_step": 385238, "epoch": 2293} {"train_loss": -12.229220390319824, "global_step": 385239, "epoch": 2293} {"train_loss": -12.658188819885254, "global_step": 385240, "epoch": 2293} {"train_loss": -12.506790161132812, "global_step": 385241, "epoch": 2293} {"train_loss": -12.488554000854492, "global_step": 385242, "epoch": 2293} {"train_loss": -12.560579299926758, "global_step": 385243, "epoch": 2293} {"train_loss": -12.571832656860352, "global_step": 385244, "epoch": 2293} {"train_loss": -12.535465240478516, "global_step": 385245, "epoch": 2293} {"train_loss": -12.555350303649902, "global_step": 385246, "epoch": 2293} {"train_loss": -12.750988960266113, "global_step": 385247, "epoch": 2293} {"train_loss": -12.612495422363281, "global_step": 385248, "epoch": 2293} {"train_loss": -12.422114372253418, "global_step": 385249, "epoch": 2293} {"train_loss": -12.63542366027832, "global_step": 385250, "epoch": 2293} {"train_loss": -12.326889038085938, "global_step": 385251, "epoch": 2293} {"train_loss": -12.376007080078125, "global_step": 385252, "epoch": 2293} {"train_loss": -12.35326099395752, "global_step": 385253, "epoch": 2293} {"train_loss": -12.344839096069336, "global_step": 385254, "epoch": 2293} {"train_loss": -12.619607925415039, "global_step": 385255, "epoch": 2293} {"train_loss": -12.434938430786133, "global_step": 385256, "epoch": 2293} {"train_loss": -12.231707572937012, "global_step": 385257, "epoch": 2293} {"train_loss": -12.150989532470703, "global_step": 385258, "epoch": 2293} {"train_loss": -12.242727279663086, "global_step": 385259, "epoch": 2293} {"train_loss": -12.326288223266602, "global_step": 385260, "epoch": 2293} {"train_loss": -12.170525550842285, "global_step": 385261, "epoch": 2293} {"train_loss": -12.205876350402832, "global_step": 385262, "epoch": 2293} {"train_loss": -12.37744426727295, "global_step": 385263, "epoch": 2293} {"train_loss": -11.967391967773438, "global_step": 385264, "epoch": 2293} {"train_loss": -12.621559143066406, "global_step": 385265, "epoch": 2293} {"train_loss": -11.81939697265625, "global_step": 385266, "epoch": 2293} {"train_loss": -12.008875846862793, "global_step": 385267, "epoch": 2293} {"train_loss": -12.535679817199707, "global_step": 385268, "epoch": 2293} {"train_loss": -12.411706924438477, "global_step": 385269, "epoch": 2293} {"train_loss": -12.659049987792969, "global_step": 385270, "epoch": 2293} {"train_loss": -12.459917068481445, "global_step": 385271, "epoch": 2293} {"train_loss": -12.566301345825195, "global_step": 385272, "epoch": 2293} {"train_loss": -12.289462089538574, "global_step": 385273, "epoch": 2293} {"train_loss": -12.19620418548584, "global_step": 385274, "epoch": 2293} {"train_loss": -12.320856094360352, "global_step": 385275, "epoch": 2293} {"train_loss": -12.571887969970703, "global_step": 385276, "epoch": 2293} {"train_loss": -11.990304946899414, "global_step": 385277, "epoch": 2293} {"train_loss": -12.437411308288574, "global_step": 385278, "epoch": 2293} {"train_loss": -11.292516708374023, "global_step": 385279, "epoch": 2293} {"train_loss": -12.349100112915039, "global_step": 385280, "epoch": 2293} {"train_loss": -11.546873092651367, "global_step": 385281, "epoch": 2293} {"train_loss": -12.545234680175781, "global_step": 385282, "epoch": 2293} {"train_loss": -11.891727447509766, "global_step": 385283, "epoch": 2293} {"train_loss": -12.099224090576172, "global_step": 385284, "epoch": 2293} {"train_loss": -11.286410331726074, "global_step": 385285, "epoch": 2293} {"train_loss": -11.851142883300781, "global_step": 385286, "epoch": 2293} {"train_loss": -12.22970962524414, "global_step": 385287, "epoch": 2293} {"train_loss": -10.9653959274292, "global_step": 385288, "epoch": 2293} {"train_loss": -12.35816764831543, "global_step": 385289, "epoch": 2293} {"train_loss": -11.446077346801758, "global_step": 385290, "epoch": 2293} {"train_loss": -11.380059242248535, "global_step": 385291, "epoch": 2293} {"train_loss": -11.940603256225586, "global_step": 385292, "epoch": 2293} {"train_loss": -12.249649047851562, "global_step": 385293, "epoch": 2293} {"train_loss": -11.164138793945312, "global_step": 385294, "epoch": 2293} {"train_loss": -11.72207260131836, "global_step": 385295, "epoch": 2293} {"train_loss": -10.642473220825195, "global_step": 385296, "epoch": 2293} {"train_loss": -10.149005889892578, "global_step": 385297, "epoch": 2293} {"train_loss": -10.75345230102539, "global_step": 385298, "epoch": 2293} {"train_loss": -10.498218536376953, "global_step": 385299, "epoch": 2293} {"train_loss": -11.004085540771484, "global_step": 385300, "epoch": 2293} {"train_loss": -11.105493545532227, "global_step": 385301, "epoch": 2293} {"train_loss": -10.109834671020508, "global_step": 385302, "epoch": 2293} {"train_loss": -9.552690505981445, "global_step": 385303, "epoch": 2293} {"train_loss": -10.142492294311523, "global_step": 385304, "epoch": 2293} {"train_loss": -10.799821853637695, "global_step": 385305, "epoch": 2293} {"train_loss": -9.997590065002441, "global_step": 385306, "epoch": 2293} {"train_loss": -10.201314926147461, "global_step": 385307, "epoch": 2293} {"train_loss": -9.624921798706055, "global_step": 385308, "epoch": 2293} {"train_loss": -11.14066219329834, "global_step": 385309, "epoch": 2293} {"train_loss": -9.954565048217773, "global_step": 385310, "epoch": 2293} {"train_loss": -11.572301864624023, "global_step": 385311, "epoch": 2293} {"train_loss": -9.957508087158203, "global_step": 385312, "epoch": 2293} {"train_loss": -10.070862770080566, "global_step": 385313, "epoch": 2293} {"train_loss": -11.186184883117676, "global_step": 385314, "epoch": 2293} {"train_loss": -9.567573547363281, "global_step": 385315, "epoch": 2293} {"train_loss": -11.752737998962402, "global_step": 385316, "epoch": 2293} {"train_loss": -10.177433967590332, "global_step": 385317, "epoch": 2293} {"train_loss": -10.557872772216797, "global_step": 385318, "epoch": 2293} {"train_loss": -10.876480102539062, "global_step": 385319, "epoch": 2293} {"train_loss": -11.00904655456543, "global_step": 385320, "epoch": 2293} {"train_loss": -11.20602798461914, "global_step": 385321, "epoch": 2293} {"train_loss": -11.548826217651367, "global_step": 385322, "epoch": 2293} {"train_loss": -11.381120681762695, "global_step": 385323, "epoch": 2293} {"train_loss": -11.356245040893555, "global_step": 385324, "epoch": 2293} {"train_loss": -11.215280532836914, "global_step": 385325, "epoch": 2293} {"train_loss": -11.638690948486328, "global_step": 385326, "epoch": 2293} {"train_loss": -11.736404418945312, "global_step": 385327, "epoch": 2293} {"train_loss": -12.024311065673828, "global_step": 385328, "epoch": 2293} {"train_loss": -11.928566932678223, "global_step": 385329, "epoch": 2293} {"train_loss": -11.801037788391113, "global_step": 385330, "epoch": 2293} {"train_loss": -11.844167709350586, "global_step": 385331, "epoch": 2293} {"train_loss": -12.082529067993164, "global_step": 385332, "epoch": 2293} {"train_loss": -11.486787796020508, "global_step": 385333, "epoch": 2293} {"train_loss": -12.299331665039062, "global_step": 385334, "epoch": 2293} {"train_loss": -11.634366989135742, "global_step": 385335, "epoch": 2293} {"train_loss": -11.744351387023926, "global_step": 385336, "epoch": 2293} {"train_loss": -11.912819862365723, "global_step": 385337, "epoch": 2293} {"train_loss": -12.157411575317383, "global_step": 385338, "epoch": 2293} {"train_loss": -11.94383716583252, "global_step": 385339, "epoch": 2293} {"train_loss": -12.131720542907715, "global_step": 385340, "epoch": 2293} {"train_loss": -12.11518669128418, "global_step": 385341, "epoch": 2293} {"train_loss": -11.986881256103516, "global_step": 385342, "epoch": 2293} {"train_loss": -12.392206192016602, "global_step": 385343, "epoch": 2293} {"train_loss": -11.95427417755127, "global_step": 385344, "epoch": 2293} {"train_loss": -12.340195655822754, "global_step": 385345, "epoch": 2293} {"train_loss": -12.219017028808594, "global_step": 385346, "epoch": 2293} {"train_loss": -12.115696907043457, "global_step": 385347, "epoch": 2293} {"train_loss": -12.32680892944336, "global_step": 385348, "epoch": 2293} {"train_loss": -12.265911102294922, "global_step": 385349, "epoch": 2293} {"train_loss": -12.391984939575195, "global_step": 385350, "epoch": 2293} {"train_loss": -12.195615768432617, "global_step": 385351, "epoch": 2293} {"train_loss": -12.412500381469727, "global_step": 385352, "epoch": 2293} {"train_loss": -12.374751091003418, "global_step": 385353, "epoch": 2293} {"train_loss": -12.02253246307373, "global_step": 385354, "epoch": 2293} {"train_loss": -12.267809867858887, "global_step": 385355, "epoch": 2293} {"train_loss": -12.28194808959961, "global_step": 385356, "epoch": 2293} {"train_loss": -12.501340866088867, "global_step": 385357, "epoch": 2293} {"train_loss": -12.267925262451172, "global_step": 385358, "epoch": 2293} {"train_loss": -12.351175308227539, "global_step": 385359, "epoch": 2293} {"train_loss": -12.461294174194336, "global_step": 385360, "epoch": 2293} {"train_loss": -12.458362579345703, "global_step": 385361, "epoch": 2293} {"train_loss": -12.524181365966797, "global_step": 385362, "epoch": 2293} {"train_loss": -12.417141914367676, "global_step": 385363, "epoch": 2293} {"train_loss": -12.349600791931152, "global_step": 385364, "epoch": 2293} {"train_loss": -12.571271896362305, "global_step": 385365, "epoch": 2293} {"train_loss": -12.287555694580078, "global_step": 385366, "epoch": 2293} {"train_loss": -12.352452278137207, "global_step": 385367, "epoch": 2293} {"train_loss": -12.430387496948242, "global_step": 385368, "epoch": 2293} {"train_loss": -12.456169128417969, "global_step": 385369, "epoch": 2293} {"train_loss": -12.27798080444336, "global_step": 385370, "epoch": 2293} {"train_loss": -12.57951545715332, "global_step": 385371, "epoch": 2293} {"train_loss": -12.365795135498047, "global_step": 385372, "epoch": 2293} {"train_loss": -12.510068893432617, "global_step": 385373, "epoch": 2293} {"train_loss": -12.437182426452637, "global_step": 385374, "epoch": 2293} {"train_loss": -12.542518615722656, "global_step": 385375, "epoch": 2293} {"train_loss": -12.302984237670898, "global_step": 385376, "epoch": 2293} {"train_loss": -12.382715225219727, "global_step": 385377, "epoch": 2293} {"train_loss": -12.541557312011719, "global_step": 385378, "epoch": 2293} {"train_loss": -12.288382530212402, "global_step": 385379, "epoch": 2293} {"train_loss": -12.614187240600586, "global_step": 385380, "epoch": 2293} {"train_loss": -12.114690780639648, "global_step": 385381, "epoch": 2293} {"train_loss": -12.369376182556152, "global_step": 385382, "epoch": 2293} {"train_loss": -12.440587997436523, "global_step": 385383, "epoch": 2293} {"train_loss": -12.426687240600586, "global_step": 385384, "epoch": 2293} {"train_loss": -12.410804748535156, "global_step": 385385, "epoch": 2293} {"train_loss": -12.296062469482422, "global_step": 385386, "epoch": 2293} {"train_loss": -12.680610656738281, "global_step": 385387, "epoch": 2293} {"train_loss": -12.522504806518555, "global_step": 385388, "epoch": 2293} {"train_loss": -12.576122283935547, "global_step": 385389, "epoch": 2293} {"train_loss": -12.558015823364258, "global_step": 385390, "epoch": 2293} {"train_loss": -11.937975395293464, "global_step": 385391, "epoch": 2293, "val_loss": 296474.125} {"train_loss": -12.411341667175293, "global_step": 385392, "epoch": 2294} {"train_loss": -12.373043060302734, "global_step": 385393, "epoch": 2294} {"train_loss": -12.253047943115234, "global_step": 385394, "epoch": 2294} {"train_loss": -12.155387878417969, "global_step": 385395, "epoch": 2294} {"train_loss": -12.42265510559082, "global_step": 385396, "epoch": 2294} {"train_loss": -12.070013999938965, "global_step": 385397, "epoch": 2294} {"train_loss": -12.09875774383545, "global_step": 385398, "epoch": 2294} {"train_loss": -12.299232482910156, "global_step": 385399, "epoch": 2294} {"train_loss": -11.91047477722168, "global_step": 385400, "epoch": 2294} {"train_loss": -12.427994728088379, "global_step": 385401, "epoch": 2294} {"train_loss": -11.889566421508789, "global_step": 385402, "epoch": 2294} {"train_loss": -12.048128128051758, "global_step": 385403, "epoch": 2294} {"train_loss": -12.142143249511719, "global_step": 385404, "epoch": 2294} {"train_loss": -12.2493314743042, "global_step": 385405, "epoch": 2294} {"train_loss": -12.377958297729492, "global_step": 385406, "epoch": 2294} {"train_loss": -11.893537521362305, "global_step": 385407, "epoch": 2294} {"train_loss": -12.275409698486328, "global_step": 385408, "epoch": 2294} {"train_loss": -12.297371864318848, "global_step": 385409, "epoch": 2294} {"train_loss": -12.61717414855957, "global_step": 385410, "epoch": 2294} {"train_loss": -12.429788589477539, "global_step": 385411, "epoch": 2294} {"train_loss": -12.246893882751465, "global_step": 385412, "epoch": 2294} {"train_loss": -12.459917068481445, "global_step": 385413, "epoch": 2294} {"train_loss": -12.381095886230469, "global_step": 385414, "epoch": 2294} {"train_loss": -12.425975799560547, "global_step": 385415, "epoch": 2294} {"train_loss": -12.681510925292969, "global_step": 385416, "epoch": 2294} {"train_loss": -12.3964204788208, "global_step": 385417, "epoch": 2294} {"train_loss": -12.502185821533203, "global_step": 385418, "epoch": 2294} {"train_loss": -12.085625648498535, "global_step": 385419, "epoch": 2294} {"train_loss": -12.440102577209473, "global_step": 385420, "epoch": 2294} {"train_loss": -12.464282989501953, "global_step": 385421, "epoch": 2294} {"train_loss": -12.534749984741211, "global_step": 385422, "epoch": 2294} {"train_loss": -12.291175842285156, "global_step": 385423, "epoch": 2294} {"train_loss": -12.615242004394531, "global_step": 385424, "epoch": 2294} {"train_loss": -12.53255558013916, "global_step": 385425, "epoch": 2294} {"train_loss": -12.794805526733398, "global_step": 385426, "epoch": 2294} {"train_loss": -12.377685546875, "global_step": 385427, "epoch": 2294} {"train_loss": -12.57027530670166, "global_step": 385428, "epoch": 2294} {"train_loss": -12.354321479797363, "global_step": 385429, "epoch": 2294} {"train_loss": -12.603535652160645, "global_step": 385430, "epoch": 2294} {"train_loss": -12.398599624633789, "global_step": 385431, "epoch": 2294} {"train_loss": -12.298478126525879, "global_step": 385432, "epoch": 2294} {"train_loss": -12.330774307250977, "global_step": 385433, "epoch": 2294} {"train_loss": -12.410070419311523, "global_step": 385434, "epoch": 2294} {"train_loss": -12.402212142944336, "global_step": 385435, "epoch": 2294} {"train_loss": -12.35244369506836, "global_step": 385436, "epoch": 2294} {"train_loss": -12.306268692016602, "global_step": 385437, "epoch": 2294} {"train_loss": -12.05554485321045, "global_step": 385438, "epoch": 2294} {"train_loss": -12.50033950805664, "global_step": 385439, "epoch": 2294} {"train_loss": -12.427103042602539, "global_step": 385440, "epoch": 2294} {"train_loss": -12.331544876098633, "global_step": 385441, "epoch": 2294} {"train_loss": -11.92929458618164, "global_step": 385442, "epoch": 2294} {"train_loss": -12.400986671447754, "global_step": 385443, "epoch": 2294} {"train_loss": -12.65078353881836, "global_step": 385444, "epoch": 2294} {"train_loss": -12.064613342285156, "global_step": 385445, "epoch": 2294} {"train_loss": -12.582948684692383, "global_step": 385446, "epoch": 2294} {"train_loss": -11.86375617980957, "global_step": 385447, "epoch": 2294} {"train_loss": -11.574803352355957, "global_step": 385448, "epoch": 2294} {"train_loss": -11.34406566619873, "global_step": 385449, "epoch": 2294} {"train_loss": -11.248096466064453, "global_step": 385450, "epoch": 2294} {"train_loss": -10.58120059967041, "global_step": 385451, "epoch": 2294} {"train_loss": -10.288656234741211, "global_step": 385452, "epoch": 2294} {"train_loss": -10.348703384399414, "global_step": 385453, "epoch": 2294} {"train_loss": -10.979011535644531, "global_step": 385454, "epoch": 2294} {"train_loss": -8.528671264648438, "global_step": 385455, "epoch": 2294} {"train_loss": -11.009269714355469, "global_step": 385456, "epoch": 2294} {"train_loss": -10.819013595581055, "global_step": 385457, "epoch": 2294} {"train_loss": -9.297330856323242, "global_step": 385458, "epoch": 2294} {"train_loss": -11.258866310119629, "global_step": 385459, "epoch": 2294} {"train_loss": -9.313982009887695, "global_step": 385460, "epoch": 2294} {"train_loss": -9.909404754638672, "global_step": 385461, "epoch": 2294} {"train_loss": -9.846631050109863, "global_step": 385462, "epoch": 2294} {"train_loss": -9.022775650024414, "global_step": 385463, "epoch": 2294} {"train_loss": -9.57307243347168, "global_step": 385464, "epoch": 2294} {"train_loss": -10.536087036132812, "global_step": 385465, "epoch": 2294} {"train_loss": -8.021284103393555, "global_step": 385466, "epoch": 2294} {"train_loss": -9.748019218444824, "global_step": 385467, "epoch": 2294} {"train_loss": -8.808950424194336, "global_step": 385468, "epoch": 2294} {"train_loss": -9.205355644226074, "global_step": 385469, "epoch": 2294} {"train_loss": -8.8072509765625, "global_step": 385470, "epoch": 2294} {"train_loss": -8.562294006347656, "global_step": 385471, "epoch": 2294} {"train_loss": -9.962197303771973, "global_step": 385472, "epoch": 2294} {"train_loss": -9.86473274230957, "global_step": 385473, "epoch": 2294} {"train_loss": -9.265932083129883, "global_step": 385474, "epoch": 2294} {"train_loss": -9.584285736083984, "global_step": 385475, "epoch": 2294} {"train_loss": -10.135765075683594, "global_step": 385476, "epoch": 2294} {"train_loss": -10.38383674621582, "global_step": 385477, "epoch": 2294} {"train_loss": -10.575021743774414, "global_step": 385478, "epoch": 2294} {"train_loss": -10.557326316833496, "global_step": 385479, "epoch": 2294} {"train_loss": -10.24491024017334, "global_step": 385480, "epoch": 2294} {"train_loss": -10.261383056640625, "global_step": 385481, "epoch": 2294} {"train_loss": -11.333586692810059, "global_step": 385482, "epoch": 2294} {"train_loss": -10.89918327331543, "global_step": 385483, "epoch": 2294} {"train_loss": -11.559703826904297, "global_step": 385484, "epoch": 2294} {"train_loss": -11.088109970092773, "global_step": 385485, "epoch": 2294} {"train_loss": -11.045089721679688, "global_step": 385486, "epoch": 2294} {"train_loss": -11.150030136108398, "global_step": 385487, "epoch": 2294} {"train_loss": -11.15367603302002, "global_step": 385488, "epoch": 2294} {"train_loss": -11.603789329528809, "global_step": 385489, "epoch": 2294} {"train_loss": -11.526368141174316, "global_step": 385490, "epoch": 2294} {"train_loss": -11.546143531799316, "global_step": 385491, "epoch": 2294} {"train_loss": -11.329172134399414, "global_step": 385492, "epoch": 2294} {"train_loss": -11.579305648803711, "global_step": 385493, "epoch": 2294} {"train_loss": -11.40710163116455, "global_step": 385494, "epoch": 2294} {"train_loss": -11.625032424926758, "global_step": 385495, "epoch": 2294} {"train_loss": -11.236413955688477, "global_step": 385496, "epoch": 2294} {"train_loss": -11.68047046661377, "global_step": 385497, "epoch": 2294} {"train_loss": -11.517752647399902, "global_step": 385498, "epoch": 2294} {"train_loss": -11.777278900146484, "global_step": 385499, "epoch": 2294} {"train_loss": -11.872481346130371, "global_step": 385500, "epoch": 2294} {"train_loss": -11.900323867797852, "global_step": 385501, "epoch": 2294} {"train_loss": -11.987419128417969, "global_step": 385502, "epoch": 2294} {"train_loss": -11.520953178405762, "global_step": 385503, "epoch": 2294} {"train_loss": -11.885885238647461, "global_step": 385504, "epoch": 2294} {"train_loss": -12.015263557434082, "global_step": 385505, "epoch": 2294} {"train_loss": -11.823945999145508, "global_step": 385506, "epoch": 2294} {"train_loss": -12.056570053100586, "global_step": 385507, "epoch": 2294} {"train_loss": -11.701619148254395, "global_step": 385508, "epoch": 2294} {"train_loss": -12.003084182739258, "global_step": 385509, "epoch": 2294} {"train_loss": -12.163281440734863, "global_step": 385510, "epoch": 2294} {"train_loss": -11.977235794067383, "global_step": 385511, "epoch": 2294} {"train_loss": -12.019996643066406, "global_step": 385512, "epoch": 2294} {"train_loss": -11.868949890136719, "global_step": 385513, "epoch": 2294} {"train_loss": -11.812235832214355, "global_step": 385514, "epoch": 2294} {"train_loss": -12.165390968322754, "global_step": 385515, "epoch": 2294} {"train_loss": -11.71530818939209, "global_step": 385516, "epoch": 2294} {"train_loss": -12.106837272644043, "global_step": 385517, "epoch": 2294} {"train_loss": -12.051631927490234, "global_step": 385518, "epoch": 2294} {"train_loss": -12.080750465393066, "global_step": 385519, "epoch": 2294} {"train_loss": -12.075193405151367, "global_step": 385520, "epoch": 2294} {"train_loss": -11.898214340209961, "global_step": 385521, "epoch": 2294} {"train_loss": -12.243415832519531, "global_step": 385522, "epoch": 2294} {"train_loss": -12.171012878417969, "global_step": 385523, "epoch": 2294} {"train_loss": -12.259549140930176, "global_step": 385524, "epoch": 2294} {"train_loss": -12.21475887298584, "global_step": 385525, "epoch": 2294} {"train_loss": -12.361804008483887, "global_step": 385526, "epoch": 2294} {"train_loss": -12.296602249145508, "global_step": 385527, "epoch": 2294} {"train_loss": -12.35147762298584, "global_step": 385528, "epoch": 2294} {"train_loss": -12.256852149963379, "global_step": 385529, "epoch": 2294} {"train_loss": -12.289848327636719, "global_step": 385530, "epoch": 2294} {"train_loss": -12.39725112915039, "global_step": 385531, "epoch": 2294} {"train_loss": -12.488197326660156, "global_step": 385532, "epoch": 2294} {"train_loss": -12.540048599243164, "global_step": 385533, "epoch": 2294} {"train_loss": -12.340293884277344, "global_step": 385534, "epoch": 2294} {"train_loss": -12.449858665466309, "global_step": 385535, "epoch": 2294} {"train_loss": -12.344293594360352, "global_step": 385536, "epoch": 2294} {"train_loss": -12.437244415283203, "global_step": 385537, "epoch": 2294} {"train_loss": -12.365511894226074, "global_step": 385538, "epoch": 2294} {"train_loss": -12.361676216125488, "global_step": 385539, "epoch": 2294} {"train_loss": -12.456008911132812, "global_step": 385540, "epoch": 2294} {"train_loss": -12.414321899414062, "global_step": 385541, "epoch": 2294} {"train_loss": -12.59391975402832, "global_step": 385542, "epoch": 2294} {"train_loss": -12.621539115905762, "global_step": 385543, "epoch": 2294} {"train_loss": -12.543980598449707, "global_step": 385544, "epoch": 2294} {"train_loss": -12.402676582336426, "global_step": 385545, "epoch": 2294} {"train_loss": -12.296177864074707, "global_step": 385546, "epoch": 2294} {"train_loss": -12.574405670166016, "global_step": 385547, "epoch": 2294} {"train_loss": -12.61043643951416, "global_step": 385548, "epoch": 2294} {"train_loss": -12.645503997802734, "global_step": 385549, "epoch": 2294} {"train_loss": -12.438762664794922, "global_step": 385550, "epoch": 2294} {"train_loss": -12.481489181518555, "global_step": 385551, "epoch": 2294} {"train_loss": -12.59824275970459, "global_step": 385552, "epoch": 2294} {"train_loss": -12.711618423461914, "global_step": 385553, "epoch": 2294} {"train_loss": -12.867191314697266, "global_step": 385554, "epoch": 2294} {"train_loss": -12.518157958984375, "global_step": 385555, "epoch": 2294} {"train_loss": -12.454972267150879, "global_step": 385556, "epoch": 2294} {"train_loss": -12.432768821716309, "global_step": 385557, "epoch": 2294} {"train_loss": -12.326223373413086, "global_step": 385558, "epoch": 2294} {"train_loss": -11.72916328907013, "global_step": 385559, "epoch": 2294, "val_loss": 295562.4375} {"train_loss": -11.803693771362305, "global_step": 385560, "epoch": 2295} {"train_loss": -11.686999320983887, "global_step": 385561, "epoch": 2295} {"train_loss": -12.726073265075684, "global_step": 385562, "epoch": 2295} {"train_loss": -12.199377059936523, "global_step": 385563, "epoch": 2295} {"train_loss": -12.347404479980469, "global_step": 385564, "epoch": 2295} {"train_loss": -12.434181213378906, "global_step": 385565, "epoch": 2295} {"train_loss": -12.283957481384277, "global_step": 385566, "epoch": 2295} {"train_loss": -11.9296236038208, "global_step": 385567, "epoch": 2295} {"train_loss": -12.525999069213867, "global_step": 385568, "epoch": 2295} {"train_loss": -12.53103256225586, "global_step": 385569, "epoch": 2295} {"train_loss": -12.258974075317383, "global_step": 385570, "epoch": 2295} {"train_loss": -12.171649932861328, "global_step": 385571, "epoch": 2295} {"train_loss": -12.168639183044434, "global_step": 385572, "epoch": 2295} {"train_loss": -12.073027610778809, "global_step": 385573, "epoch": 2295} {"train_loss": -12.502964973449707, "global_step": 385574, "epoch": 2295} {"train_loss": -12.20345401763916, "global_step": 385575, "epoch": 2295} {"train_loss": -12.621712684631348, "global_step": 385576, "epoch": 2295} {"train_loss": -12.745840072631836, "global_step": 385577, "epoch": 2295} {"train_loss": -12.527191162109375, "global_step": 385578, "epoch": 2295} {"train_loss": -12.451667785644531, "global_step": 385579, "epoch": 2295} {"train_loss": -12.484073638916016, "global_step": 385580, "epoch": 2295} {"train_loss": -12.448753356933594, "global_step": 385581, "epoch": 2295} {"train_loss": -12.416635513305664, "global_step": 385582, "epoch": 2295} {"train_loss": -12.332996368408203, "global_step": 385583, "epoch": 2295} {"train_loss": -12.022408485412598, "global_step": 385584, "epoch": 2295} {"train_loss": -11.871271133422852, "global_step": 385585, "epoch": 2295} {"train_loss": -11.46173095703125, "global_step": 385586, "epoch": 2295} {"train_loss": -12.234058380126953, "global_step": 385587, "epoch": 2295} {"train_loss": -11.794208526611328, "global_step": 385588, "epoch": 2295} {"train_loss": -12.11577320098877, "global_step": 385589, "epoch": 2295} {"train_loss": -12.208963394165039, "global_step": 385590, "epoch": 2295} {"train_loss": -11.983041763305664, "global_step": 385591, "epoch": 2295} {"train_loss": -11.714500427246094, "global_step": 385592, "epoch": 2295} {"train_loss": -12.449424743652344, "global_step": 385593, "epoch": 2295} {"train_loss": -11.811877250671387, "global_step": 385594, "epoch": 2295} {"train_loss": -11.237115859985352, "global_step": 385595, "epoch": 2295} {"train_loss": -12.167377471923828, "global_step": 385596, "epoch": 2295} {"train_loss": -11.787933349609375, "global_step": 385597, "epoch": 2295} {"train_loss": -11.895813941955566, "global_step": 385598, "epoch": 2295} {"train_loss": -12.188941955566406, "global_step": 385599, "epoch": 2295} {"train_loss": -11.606281280517578, "global_step": 385600, "epoch": 2295} {"train_loss": -12.233166694641113, "global_step": 385601, "epoch": 2295} {"train_loss": -12.033048629760742, "global_step": 385602, "epoch": 2295} {"train_loss": -12.206836700439453, "global_step": 385603, "epoch": 2295} {"train_loss": -12.145101547241211, "global_step": 385604, "epoch": 2295} {"train_loss": -12.255685806274414, "global_step": 385605, "epoch": 2295} {"train_loss": -12.2979736328125, "global_step": 385606, "epoch": 2295} {"train_loss": -12.233532905578613, "global_step": 385607, "epoch": 2295} {"train_loss": -12.154131889343262, "global_step": 385608, "epoch": 2295} {"train_loss": -12.03070068359375, "global_step": 385609, "epoch": 2295} {"train_loss": -12.16988754272461, "global_step": 385610, "epoch": 2295} {"train_loss": -12.182497024536133, "global_step": 385611, "epoch": 2295} {"train_loss": -12.26148796081543, "global_step": 385612, "epoch": 2295} {"train_loss": -12.325882911682129, "global_step": 385613, "epoch": 2295} {"train_loss": -12.494157791137695, "global_step": 385614, "epoch": 2295} {"train_loss": -12.231155395507812, "global_step": 385615, "epoch": 2295} {"train_loss": -11.810823440551758, "global_step": 385616, "epoch": 2295} {"train_loss": -12.057395935058594, "global_step": 385617, "epoch": 2295} {"train_loss": -12.515726089477539, "global_step": 385618, "epoch": 2295} {"train_loss": -12.386198043823242, "global_step": 385619, "epoch": 2295} {"train_loss": -12.081356048583984, "global_step": 385620, "epoch": 2295} {"train_loss": -12.310397148132324, "global_step": 385621, "epoch": 2295} {"train_loss": -12.025897979736328, "global_step": 385622, "epoch": 2295} {"train_loss": -11.648205757141113, "global_step": 385623, "epoch": 2295} {"train_loss": -12.057722091674805, "global_step": 385624, "epoch": 2295} {"train_loss": -11.714731216430664, "global_step": 385625, "epoch": 2295} {"train_loss": -10.98583698272705, "global_step": 385626, "epoch": 2295} {"train_loss": -11.14145565032959, "global_step": 385627, "epoch": 2295} {"train_loss": -11.515233993530273, "global_step": 385628, "epoch": 2295} {"train_loss": -10.742057800292969, "global_step": 385629, "epoch": 2295} {"train_loss": -11.967926025390625, "global_step": 385630, "epoch": 2295} {"train_loss": -11.73287296295166, "global_step": 385631, "epoch": 2295} {"train_loss": -11.816651344299316, "global_step": 385632, "epoch": 2295} {"train_loss": -11.055566787719727, "global_step": 385633, "epoch": 2295} {"train_loss": -11.533039093017578, "global_step": 385634, "epoch": 2295} {"train_loss": -12.022424697875977, "global_step": 385635, "epoch": 2295} {"train_loss": -10.92681884765625, "global_step": 385636, "epoch": 2295} {"train_loss": -12.379358291625977, "global_step": 385637, "epoch": 2295} {"train_loss": -11.363554000854492, "global_step": 385638, "epoch": 2295} {"train_loss": -11.09323501586914, "global_step": 385639, "epoch": 2295} {"train_loss": -11.357356071472168, "global_step": 385640, "epoch": 2295} {"train_loss": -12.00320816040039, "global_step": 385641, "epoch": 2295} {"train_loss": -11.282902717590332, "global_step": 385642, "epoch": 2295} {"train_loss": -10.635397911071777, "global_step": 385643, "epoch": 2295} {"train_loss": -11.253400802612305, "global_step": 385644, "epoch": 2295} {"train_loss": -9.954867362976074, "global_step": 385645, "epoch": 2295} {"train_loss": -8.768390655517578, "global_step": 385646, "epoch": 2295} {"train_loss": -9.610443115234375, "global_step": 385647, "epoch": 2295} {"train_loss": -9.52662181854248, "global_step": 385648, "epoch": 2295} {"train_loss": -9.59585189819336, "global_step": 385649, "epoch": 2295} {"train_loss": -9.98490047454834, "global_step": 385650, "epoch": 2295} {"train_loss": -10.569162368774414, "global_step": 385651, "epoch": 2295} {"train_loss": -9.081361770629883, "global_step": 385652, "epoch": 2295} {"train_loss": -8.226318359375, "global_step": 385653, "epoch": 2295} {"train_loss": -9.393040657043457, "global_step": 385654, "epoch": 2295} {"train_loss": -10.914451599121094, "global_step": 385655, "epoch": 2295} {"train_loss": -9.876696586608887, "global_step": 385656, "epoch": 2295} {"train_loss": -9.621423721313477, "global_step": 385657, "epoch": 2295} {"train_loss": -10.365591049194336, "global_step": 385658, "epoch": 2295} {"train_loss": -10.424543380737305, "global_step": 385659, "epoch": 2295} {"train_loss": -10.444616317749023, "global_step": 385660, "epoch": 2295} {"train_loss": -10.583309173583984, "global_step": 385661, "epoch": 2295} {"train_loss": -10.80052661895752, "global_step": 385662, "epoch": 2295} {"train_loss": -10.874631881713867, "global_step": 385663, "epoch": 2295} {"train_loss": -10.404195785522461, "global_step": 385664, "epoch": 2295} {"train_loss": -10.720550537109375, "global_step": 385665, "epoch": 2295} {"train_loss": -11.041266441345215, "global_step": 385666, "epoch": 2295} {"train_loss": -11.039972305297852, "global_step": 385667, "epoch": 2295} {"train_loss": -11.282796859741211, "global_step": 385668, "epoch": 2295} {"train_loss": -11.571483612060547, "global_step": 385669, "epoch": 2295} {"train_loss": -10.609905242919922, "global_step": 385670, "epoch": 2295} {"train_loss": -11.917885780334473, "global_step": 385671, "epoch": 2295} {"train_loss": -10.857135772705078, "global_step": 385672, "epoch": 2295} {"train_loss": -11.367490768432617, "global_step": 385673, "epoch": 2295} {"train_loss": -11.426942825317383, "global_step": 385674, "epoch": 2295} {"train_loss": -11.544751167297363, "global_step": 385675, "epoch": 2295} {"train_loss": -11.578567504882812, "global_step": 385676, "epoch": 2295} {"train_loss": -11.67141342163086, "global_step": 385677, "epoch": 2295} {"train_loss": -11.561854362487793, "global_step": 385678, "epoch": 2295} {"train_loss": -11.584258079528809, "global_step": 385679, "epoch": 2295} {"train_loss": -11.670656204223633, "global_step": 385680, "epoch": 2295} {"train_loss": -11.701387405395508, "global_step": 385681, "epoch": 2295} {"train_loss": -11.878338813781738, "global_step": 385682, "epoch": 2295} {"train_loss": -12.040031433105469, "global_step": 385683, "epoch": 2295} {"train_loss": -11.931072235107422, "global_step": 385684, "epoch": 2295} {"train_loss": -12.011838912963867, "global_step": 385685, "epoch": 2295} {"train_loss": -11.695666313171387, "global_step": 385686, "epoch": 2295} {"train_loss": -11.922603607177734, "global_step": 385687, "epoch": 2295} {"train_loss": -11.94442081451416, "global_step": 385688, "epoch": 2295} {"train_loss": -11.579468727111816, "global_step": 385689, "epoch": 2295} {"train_loss": -11.997539520263672, "global_step": 385690, "epoch": 2295} {"train_loss": -12.215883255004883, "global_step": 385691, "epoch": 2295} {"train_loss": -11.957695960998535, "global_step": 385692, "epoch": 2295} {"train_loss": -12.050745010375977, "global_step": 385693, "epoch": 2295} {"train_loss": -11.999698638916016, "global_step": 385694, "epoch": 2295} {"train_loss": -12.036846160888672, "global_step": 385695, "epoch": 2295} {"train_loss": -12.073197364807129, "global_step": 385696, "epoch": 2295} {"train_loss": -12.045367240905762, "global_step": 385697, "epoch": 2295} {"train_loss": -12.052518844604492, "global_step": 385698, "epoch": 2295} {"train_loss": -12.316303253173828, "global_step": 385699, "epoch": 2295} {"train_loss": -11.654794692993164, "global_step": 385700, "epoch": 2295} {"train_loss": -12.462255477905273, "global_step": 385701, "epoch": 2295} {"train_loss": -11.903194427490234, "global_step": 385702, "epoch": 2295} {"train_loss": -12.168729782104492, "global_step": 385703, "epoch": 2295} {"train_loss": -12.299945831298828, "global_step": 385704, "epoch": 2295} {"train_loss": -12.322219848632812, "global_step": 385705, "epoch": 2295} {"train_loss": -12.27833366394043, "global_step": 385706, "epoch": 2295} {"train_loss": -12.37242317199707, "global_step": 385707, "epoch": 2295} {"train_loss": -12.14537239074707, "global_step": 385708, "epoch": 2295} {"train_loss": -12.47445297241211, "global_step": 385709, "epoch": 2295} {"train_loss": -12.071186065673828, "global_step": 385710, "epoch": 2295} {"train_loss": -12.316638946533203, "global_step": 385711, "epoch": 2295} {"train_loss": -12.259543418884277, "global_step": 385712, "epoch": 2295} {"train_loss": -12.284873962402344, "global_step": 385713, "epoch": 2295} {"train_loss": -12.325733184814453, "global_step": 385714, "epoch": 2295} {"train_loss": -12.3231201171875, "global_step": 385715, "epoch": 2295} {"train_loss": -12.2947998046875, "global_step": 385716, "epoch": 2295} {"train_loss": -12.273077011108398, "global_step": 385717, "epoch": 2295} {"train_loss": -12.416159629821777, "global_step": 385718, "epoch": 2295} {"train_loss": -12.418071746826172, "global_step": 385719, "epoch": 2295} {"train_loss": -12.48524284362793, "global_step": 385720, "epoch": 2295} {"train_loss": -12.217857360839844, "global_step": 385721, "epoch": 2295} {"train_loss": -12.413347244262695, "global_step": 385722, "epoch": 2295} {"train_loss": -12.365079879760742, "global_step": 385723, "epoch": 2295} {"train_loss": -12.390649795532227, "global_step": 385724, "epoch": 2295} {"train_loss": -12.520503997802734, "global_step": 385725, "epoch": 2295} {"train_loss": -12.520570755004883, "global_step": 385726, "epoch": 2295} {"train_loss": -11.733775229681106, "global_step": 385727, "epoch": 2295, "val_loss": 291652.03125, "train_action_mse_error": 1.2580903768539429} {"train_loss": -12.534926414489746, "global_step": 385728, "epoch": 2296} {"train_loss": -12.251689910888672, "global_step": 385729, "epoch": 2296} {"train_loss": -12.498692512512207, "global_step": 385730, "epoch": 2296} {"train_loss": -12.094882011413574, "global_step": 385731, "epoch": 2296} {"train_loss": -12.078795433044434, "global_step": 385732, "epoch": 2296} {"train_loss": -12.72079086303711, "global_step": 385733, "epoch": 2296} {"train_loss": -11.965015411376953, "global_step": 385734, "epoch": 2296} {"train_loss": -12.267037391662598, "global_step": 385735, "epoch": 2296} {"train_loss": -12.473811149597168, "global_step": 385736, "epoch": 2296} {"train_loss": -12.471699714660645, "global_step": 385737, "epoch": 2296} {"train_loss": -12.278436660766602, "global_step": 385738, "epoch": 2296} {"train_loss": -12.556787490844727, "global_step": 385739, "epoch": 2296} {"train_loss": -12.60368537902832, "global_step": 385740, "epoch": 2296} {"train_loss": -12.56142807006836, "global_step": 385741, "epoch": 2296} {"train_loss": -12.6177978515625, "global_step": 385742, "epoch": 2296} {"train_loss": -12.496965408325195, "global_step": 385743, "epoch": 2296} {"train_loss": -12.530107498168945, "global_step": 385744, "epoch": 2296} {"train_loss": -12.382339477539062, "global_step": 385745, "epoch": 2296} {"train_loss": -12.56185531616211, "global_step": 385746, "epoch": 2296} {"train_loss": -12.620311737060547, "global_step": 385747, "epoch": 2296} {"train_loss": -12.668323516845703, "global_step": 385748, "epoch": 2296} {"train_loss": -12.730949401855469, "global_step": 385749, "epoch": 2296} {"train_loss": -12.685043334960938, "global_step": 385750, "epoch": 2296} {"train_loss": -12.420008659362793, "global_step": 385751, "epoch": 2296} {"train_loss": -12.688175201416016, "global_step": 385752, "epoch": 2296} {"train_loss": -12.561809539794922, "global_step": 385753, "epoch": 2296} {"train_loss": -12.749588012695312, "global_step": 385754, "epoch": 2296} {"train_loss": -12.610184669494629, "global_step": 385755, "epoch": 2296} {"train_loss": -12.584169387817383, "global_step": 385756, "epoch": 2296} {"train_loss": -12.46726131439209, "global_step": 385757, "epoch": 2296} {"train_loss": -12.710546493530273, "global_step": 385758, "epoch": 2296} {"train_loss": -12.839140892028809, "global_step": 385759, "epoch": 2296} {"train_loss": -12.545666694641113, "global_step": 385760, "epoch": 2296} {"train_loss": -12.340890884399414, "global_step": 385761, "epoch": 2296} {"train_loss": -12.480457305908203, "global_step": 385762, "epoch": 2296} {"train_loss": -12.591787338256836, "global_step": 385763, "epoch": 2296} {"train_loss": -12.213581085205078, "global_step": 385764, "epoch": 2296} {"train_loss": -12.683786392211914, "global_step": 385765, "epoch": 2296} {"train_loss": -12.473129272460938, "global_step": 385766, "epoch": 2296} {"train_loss": -12.553169250488281, "global_step": 385767, "epoch": 2296} {"train_loss": -12.550308227539062, "global_step": 385768, "epoch": 2296} {"train_loss": -12.70506763458252, "global_step": 385769, "epoch": 2296} {"train_loss": -12.542886734008789, "global_step": 385770, "epoch": 2296} {"train_loss": -12.529023170471191, "global_step": 385771, "epoch": 2296} {"train_loss": -12.582080841064453, "global_step": 385772, "epoch": 2296} {"train_loss": -12.454339981079102, "global_step": 385773, "epoch": 2296} {"train_loss": -12.37587833404541, "global_step": 385774, "epoch": 2296} {"train_loss": -12.501031875610352, "global_step": 385775, "epoch": 2296} {"train_loss": -12.38805866241455, "global_step": 385776, "epoch": 2296} {"train_loss": -12.42704963684082, "global_step": 385777, "epoch": 2296} {"train_loss": -12.554784774780273, "global_step": 385778, "epoch": 2296} {"train_loss": -12.342345237731934, "global_step": 385779, "epoch": 2296} {"train_loss": -12.433412551879883, "global_step": 385780, "epoch": 2296} {"train_loss": -12.615682601928711, "global_step": 385781, "epoch": 2296} {"train_loss": -12.380508422851562, "global_step": 385782, "epoch": 2296} {"train_loss": -12.329612731933594, "global_step": 385783, "epoch": 2296} {"train_loss": -12.643150329589844, "global_step": 385784, "epoch": 2296} {"train_loss": -12.484549522399902, "global_step": 385785, "epoch": 2296} {"train_loss": -12.388625144958496, "global_step": 385786, "epoch": 2296} {"train_loss": -12.51351547241211, "global_step": 385787, "epoch": 2296} {"train_loss": -11.968289375305176, "global_step": 385788, "epoch": 2296} {"train_loss": -11.912397384643555, "global_step": 385789, "epoch": 2296} {"train_loss": -12.532027244567871, "global_step": 385790, "epoch": 2296} {"train_loss": -11.695655822753906, "global_step": 385791, "epoch": 2296} {"train_loss": -11.180764198303223, "global_step": 385792, "epoch": 2296} {"train_loss": -11.957712173461914, "global_step": 385793, "epoch": 2296} {"train_loss": -12.31274127960205, "global_step": 385794, "epoch": 2296} {"train_loss": -11.768108367919922, "global_step": 385795, "epoch": 2296} {"train_loss": -12.305534362792969, "global_step": 385796, "epoch": 2296} {"train_loss": -12.313159942626953, "global_step": 385797, "epoch": 2296} {"train_loss": -11.655131340026855, "global_step": 385798, "epoch": 2296} {"train_loss": -11.99812126159668, "global_step": 385799, "epoch": 2296} {"train_loss": -11.705750465393066, "global_step": 385800, "epoch": 2296} {"train_loss": -12.212503433227539, "global_step": 385801, "epoch": 2296} {"train_loss": -11.990987777709961, "global_step": 385802, "epoch": 2296} {"train_loss": -12.093329429626465, "global_step": 385803, "epoch": 2296} {"train_loss": -11.27895736694336, "global_step": 385804, "epoch": 2296} {"train_loss": -11.397231101989746, "global_step": 385805, "epoch": 2296} {"train_loss": -12.029446601867676, "global_step": 385806, "epoch": 2296} {"train_loss": -12.374404907226562, "global_step": 385807, "epoch": 2296} {"train_loss": -12.035955429077148, "global_step": 385808, "epoch": 2296} {"train_loss": -11.755229949951172, "global_step": 385809, "epoch": 2296} {"train_loss": -11.874759674072266, "global_step": 385810, "epoch": 2296} {"train_loss": -11.982316017150879, "global_step": 385811, "epoch": 2296} {"train_loss": -12.189774513244629, "global_step": 385812, "epoch": 2296} {"train_loss": -11.418845176696777, "global_step": 385813, "epoch": 2296} {"train_loss": -11.40468978881836, "global_step": 385814, "epoch": 2296} {"train_loss": -11.637243270874023, "global_step": 385815, "epoch": 2296} {"train_loss": -11.855634689331055, "global_step": 385816, "epoch": 2296} {"train_loss": -11.697576522827148, "global_step": 385817, "epoch": 2296} {"train_loss": -12.157718658447266, "global_step": 385818, "epoch": 2296} {"train_loss": -11.770464897155762, "global_step": 385819, "epoch": 2296} {"train_loss": -12.091521263122559, "global_step": 385820, "epoch": 2296} {"train_loss": -11.574966430664062, "global_step": 385821, "epoch": 2296} {"train_loss": -12.245721817016602, "global_step": 385822, "epoch": 2296} {"train_loss": -11.855257987976074, "global_step": 385823, "epoch": 2296} {"train_loss": -11.747754096984863, "global_step": 385824, "epoch": 2296} {"train_loss": -11.594125747680664, "global_step": 385825, "epoch": 2296} {"train_loss": -11.657415390014648, "global_step": 385826, "epoch": 2296} {"train_loss": -12.007157325744629, "global_step": 385827, "epoch": 2296} {"train_loss": -11.008193969726562, "global_step": 385828, "epoch": 2296} {"train_loss": -11.244239807128906, "global_step": 385829, "epoch": 2296} {"train_loss": -10.720803260803223, "global_step": 385830, "epoch": 2296} {"train_loss": -11.19186782836914, "global_step": 385831, "epoch": 2296} {"train_loss": -11.601057052612305, "global_step": 385832, "epoch": 2296} {"train_loss": -10.270441055297852, "global_step": 385833, "epoch": 2296} {"train_loss": -12.256214141845703, "global_step": 385834, "epoch": 2296} {"train_loss": -9.12173080444336, "global_step": 385835, "epoch": 2296} {"train_loss": -10.975627899169922, "global_step": 385836, "epoch": 2296} {"train_loss": -9.354399681091309, "global_step": 385837, "epoch": 2296} {"train_loss": -9.67852783203125, "global_step": 385838, "epoch": 2296} {"train_loss": -10.255622863769531, "global_step": 385839, "epoch": 2296} {"train_loss": -9.803096771240234, "global_step": 385840, "epoch": 2296} {"train_loss": -10.45950984954834, "global_step": 385841, "epoch": 2296} {"train_loss": -9.856457710266113, "global_step": 385842, "epoch": 2296} {"train_loss": -9.409055709838867, "global_step": 385843, "epoch": 2296} {"train_loss": -10.277376174926758, "global_step": 385844, "epoch": 2296} {"train_loss": -10.727909088134766, "global_step": 385845, "epoch": 2296} {"train_loss": -9.680731773376465, "global_step": 385846, "epoch": 2296} {"train_loss": -9.596851348876953, "global_step": 385847, "epoch": 2296} {"train_loss": -10.295003890991211, "global_step": 385848, "epoch": 2296} {"train_loss": -10.148972511291504, "global_step": 385849, "epoch": 2296} {"train_loss": -11.64754867553711, "global_step": 385850, "epoch": 2296} {"train_loss": -10.47326946258545, "global_step": 385851, "epoch": 2296} {"train_loss": -11.213361740112305, "global_step": 385852, "epoch": 2296} {"train_loss": -11.576211929321289, "global_step": 385853, "epoch": 2296} {"train_loss": -11.007538795471191, "global_step": 385854, "epoch": 2296} {"train_loss": -11.437911987304688, "global_step": 385855, "epoch": 2296} {"train_loss": -11.210537910461426, "global_step": 385856, "epoch": 2296} {"train_loss": -10.107551574707031, "global_step": 385857, "epoch": 2296} {"train_loss": -11.957379341125488, "global_step": 385858, "epoch": 2296} {"train_loss": -10.716087341308594, "global_step": 385859, "epoch": 2296} {"train_loss": -11.648768424987793, "global_step": 385860, "epoch": 2296} {"train_loss": -11.506633758544922, "global_step": 385861, "epoch": 2296} {"train_loss": -11.849689483642578, "global_step": 385862, "epoch": 2296} {"train_loss": -11.918643951416016, "global_step": 385863, "epoch": 2296} {"train_loss": -11.431636810302734, "global_step": 385864, "epoch": 2296} {"train_loss": -12.222524642944336, "global_step": 385865, "epoch": 2296} {"train_loss": -11.85006046295166, "global_step": 385866, "epoch": 2296} {"train_loss": -11.980870246887207, "global_step": 385867, "epoch": 2296} {"train_loss": -11.75275993347168, "global_step": 385868, "epoch": 2296} {"train_loss": -12.138589859008789, "global_step": 385869, "epoch": 2296} {"train_loss": -11.595386505126953, "global_step": 385870, "epoch": 2296} {"train_loss": -11.749958038330078, "global_step": 385871, "epoch": 2296} {"train_loss": -12.130531311035156, "global_step": 385872, "epoch": 2296} {"train_loss": -11.781585693359375, "global_step": 385873, "epoch": 2296} {"train_loss": -12.259206771850586, "global_step": 385874, "epoch": 2296} {"train_loss": -12.125370025634766, "global_step": 385875, "epoch": 2296} {"train_loss": -11.949014663696289, "global_step": 385876, "epoch": 2296} {"train_loss": -11.995901107788086, "global_step": 385877, "epoch": 2296} {"train_loss": -12.278871536254883, "global_step": 385878, "epoch": 2296} {"train_loss": -11.995157241821289, "global_step": 385879, "epoch": 2296} {"train_loss": -12.175420761108398, "global_step": 385880, "epoch": 2296} {"train_loss": -12.253353118896484, "global_step": 385881, "epoch": 2296} {"train_loss": -12.164676666259766, "global_step": 385882, "epoch": 2296} {"train_loss": -12.095795631408691, "global_step": 385883, "epoch": 2296} {"train_loss": -12.325353622436523, "global_step": 385884, "epoch": 2296} {"train_loss": -12.167391777038574, "global_step": 385885, "epoch": 2296} {"train_loss": -12.34390640258789, "global_step": 385886, "epoch": 2296} {"train_loss": -12.410226821899414, "global_step": 385887, "epoch": 2296} {"train_loss": -12.198057174682617, "global_step": 385888, "epoch": 2296} {"train_loss": -12.46721076965332, "global_step": 385889, "epoch": 2296} {"train_loss": -12.315666198730469, "global_step": 385890, "epoch": 2296} {"train_loss": -12.51932430267334, "global_step": 385891, "epoch": 2296} {"train_loss": -12.385293960571289, "global_step": 385892, "epoch": 2296} {"train_loss": -12.503021240234375, "global_step": 385893, "epoch": 2296} {"train_loss": -12.427974700927734, "global_step": 385894, "epoch": 2296} {"train_loss": -11.902112024171013, "global_step": 385895, "epoch": 2296, "val_loss": 294264.625} {"train_loss": -12.317397117614746, "global_step": 385896, "epoch": 2297} {"train_loss": -12.513538360595703, "global_step": 385897, "epoch": 2297} {"train_loss": -12.318962097167969, "global_step": 385898, "epoch": 2297} {"train_loss": -12.391424179077148, "global_step": 385899, "epoch": 2297} {"train_loss": -12.62681770324707, "global_step": 385900, "epoch": 2297} {"train_loss": -12.589113235473633, "global_step": 385901, "epoch": 2297} {"train_loss": -12.447334289550781, "global_step": 385902, "epoch": 2297} {"train_loss": -12.642722129821777, "global_step": 385903, "epoch": 2297} {"train_loss": -12.36136245727539, "global_step": 385904, "epoch": 2297} {"train_loss": -12.655242919921875, "global_step": 385905, "epoch": 2297} {"train_loss": -12.542438507080078, "global_step": 385906, "epoch": 2297} {"train_loss": -12.555562973022461, "global_step": 385907, "epoch": 2297} {"train_loss": -12.487983703613281, "global_step": 385908, "epoch": 2297} {"train_loss": -12.6126708984375, "global_step": 385909, "epoch": 2297} {"train_loss": -12.62641429901123, "global_step": 385910, "epoch": 2297} {"train_loss": -12.354795455932617, "global_step": 385911, "epoch": 2297} {"train_loss": -12.678257942199707, "global_step": 385912, "epoch": 2297} {"train_loss": -12.526344299316406, "global_step": 385913, "epoch": 2297} {"train_loss": -12.588396072387695, "global_step": 385914, "epoch": 2297} {"train_loss": -12.457038879394531, "global_step": 385915, "epoch": 2297} {"train_loss": -12.641557693481445, "global_step": 385916, "epoch": 2297} {"train_loss": -12.706951141357422, "global_step": 385917, "epoch": 2297} {"train_loss": -12.451602935791016, "global_step": 385918, "epoch": 2297} {"train_loss": -12.613567352294922, "global_step": 385919, "epoch": 2297} {"train_loss": -12.550596237182617, "global_step": 385920, "epoch": 2297} {"train_loss": -12.893360137939453, "global_step": 385921, "epoch": 2297} {"train_loss": -12.505867004394531, "global_step": 385922, "epoch": 2297} {"train_loss": -12.793853759765625, "global_step": 385923, "epoch": 2297} {"train_loss": -12.80508804321289, "global_step": 385924, "epoch": 2297} {"train_loss": -12.843571662902832, "global_step": 385925, "epoch": 2297} {"train_loss": -12.687759399414062, "global_step": 385926, "epoch": 2297} {"train_loss": -12.78875732421875, "global_step": 385927, "epoch": 2297} {"train_loss": -12.834309577941895, "global_step": 385928, "epoch": 2297} {"train_loss": -12.57390022277832, "global_step": 385929, "epoch": 2297} {"train_loss": -12.695016860961914, "global_step": 385930, "epoch": 2297} {"train_loss": -12.589895248413086, "global_step": 385931, "epoch": 2297} {"train_loss": -12.818605422973633, "global_step": 385932, "epoch": 2297} {"train_loss": -12.874577522277832, "global_step": 385933, "epoch": 2297} {"train_loss": -12.663908958435059, "global_step": 385934, "epoch": 2297} {"train_loss": -12.75541877746582, "global_step": 385935, "epoch": 2297} {"train_loss": -12.860614776611328, "global_step": 385936, "epoch": 2297} {"train_loss": -12.755159378051758, "global_step": 385937, "epoch": 2297} {"train_loss": -12.658824920654297, "global_step": 385938, "epoch": 2297} {"train_loss": -12.745012283325195, "global_step": 385939, "epoch": 2297} {"train_loss": -12.835944175720215, "global_step": 385940, "epoch": 2297} {"train_loss": -12.629560470581055, "global_step": 385941, "epoch": 2297} {"train_loss": -12.574665069580078, "global_step": 385942, "epoch": 2297} {"train_loss": -12.30447006225586, "global_step": 385943, "epoch": 2297} {"train_loss": -12.386728286743164, "global_step": 385944, "epoch": 2297} {"train_loss": -12.787018775939941, "global_step": 385945, "epoch": 2297} {"train_loss": -12.615391731262207, "global_step": 385946, "epoch": 2297} {"train_loss": -12.293294906616211, "global_step": 385947, "epoch": 2297} {"train_loss": -12.36724853515625, "global_step": 385948, "epoch": 2297} {"train_loss": -12.221776962280273, "global_step": 385949, "epoch": 2297} {"train_loss": -12.56233024597168, "global_step": 385950, "epoch": 2297} {"train_loss": -12.760919570922852, "global_step": 385951, "epoch": 2297} {"train_loss": -12.882251739501953, "global_step": 385952, "epoch": 2297} {"train_loss": -12.76077651977539, "global_step": 385953, "epoch": 2297} {"train_loss": -12.673229217529297, "global_step": 385954, "epoch": 2297} {"train_loss": -12.38016128540039, "global_step": 385955, "epoch": 2297} {"train_loss": -12.595457077026367, "global_step": 385956, "epoch": 2297} {"train_loss": -12.798887252807617, "global_step": 385957, "epoch": 2297} {"train_loss": -12.717485427856445, "global_step": 385958, "epoch": 2297} {"train_loss": -12.691587448120117, "global_step": 385959, "epoch": 2297} {"train_loss": -12.676745414733887, "global_step": 385960, "epoch": 2297} {"train_loss": -12.396211624145508, "global_step": 385961, "epoch": 2297} {"train_loss": -12.272056579589844, "global_step": 385962, "epoch": 2297} {"train_loss": -12.318078994750977, "global_step": 385963, "epoch": 2297} {"train_loss": -12.442577362060547, "global_step": 385964, "epoch": 2297} {"train_loss": -12.162335395812988, "global_step": 385965, "epoch": 2297} {"train_loss": -12.858878135681152, "global_step": 385966, "epoch": 2297} {"train_loss": -12.399940490722656, "global_step": 385967, "epoch": 2297} {"train_loss": -12.577363014221191, "global_step": 385968, "epoch": 2297} {"train_loss": -12.535079956054688, "global_step": 385969, "epoch": 2297} {"train_loss": -12.632987976074219, "global_step": 385970, "epoch": 2297} {"train_loss": -12.340150833129883, "global_step": 385971, "epoch": 2297} {"train_loss": -10.527854919433594, "global_step": 385972, "epoch": 2297} {"train_loss": -10.97475814819336, "global_step": 385973, "epoch": 2297} {"train_loss": -11.338128089904785, "global_step": 385974, "epoch": 2297} {"train_loss": -11.740154266357422, "global_step": 385975, "epoch": 2297} {"train_loss": -11.252429962158203, "global_step": 385976, "epoch": 2297} {"train_loss": -11.407415390014648, "global_step": 385977, "epoch": 2297} {"train_loss": -11.864641189575195, "global_step": 385978, "epoch": 2297} {"train_loss": -11.400009155273438, "global_step": 385979, "epoch": 2297} {"train_loss": -11.834678649902344, "global_step": 385980, "epoch": 2297} {"train_loss": -11.380708694458008, "global_step": 385981, "epoch": 2297} {"train_loss": -11.121167182922363, "global_step": 385982, "epoch": 2297} {"train_loss": -11.492855072021484, "global_step": 385983, "epoch": 2297} {"train_loss": -12.446704864501953, "global_step": 385984, "epoch": 2297} {"train_loss": -11.436860084533691, "global_step": 385985, "epoch": 2297} {"train_loss": -11.601557731628418, "global_step": 385986, "epoch": 2297} {"train_loss": -11.506424903869629, "global_step": 385987, "epoch": 2297} {"train_loss": -11.666086196899414, "global_step": 385988, "epoch": 2297} {"train_loss": -10.871135711669922, "global_step": 385989, "epoch": 2297} {"train_loss": -11.311070442199707, "global_step": 385990, "epoch": 2297} {"train_loss": -11.61294174194336, "global_step": 385991, "epoch": 2297} {"train_loss": -10.419649124145508, "global_step": 385992, "epoch": 2297} {"train_loss": -11.667106628417969, "global_step": 385993, "epoch": 2297} {"train_loss": -10.587007522583008, "global_step": 385994, "epoch": 2297} {"train_loss": -10.740422248840332, "global_step": 385995, "epoch": 2297} {"train_loss": -11.935412406921387, "global_step": 385996, "epoch": 2297} {"train_loss": -11.583047866821289, "global_step": 385997, "epoch": 2297} {"train_loss": -12.298457145690918, "global_step": 385998, "epoch": 2297} {"train_loss": -11.594951629638672, "global_step": 385999, "epoch": 2297} {"train_loss": -11.582380294799805, "global_step": 386000, "epoch": 2297} {"train_loss": -11.63011360168457, "global_step": 386001, "epoch": 2297} {"train_loss": -11.874515533447266, "global_step": 386002, "epoch": 2297} {"train_loss": -12.323561668395996, "global_step": 386003, "epoch": 2297} {"train_loss": -12.066967010498047, "global_step": 386004, "epoch": 2297} {"train_loss": -11.829269409179688, "global_step": 386005, "epoch": 2297} {"train_loss": -12.093351364135742, "global_step": 386006, "epoch": 2297} {"train_loss": -11.861611366271973, "global_step": 386007, "epoch": 2297} {"train_loss": -12.181705474853516, "global_step": 386008, "epoch": 2297} {"train_loss": -11.885116577148438, "global_step": 386009, "epoch": 2297} {"train_loss": -12.25199031829834, "global_step": 386010, "epoch": 2297} {"train_loss": -12.299657821655273, "global_step": 386011, "epoch": 2297} {"train_loss": -12.373233795166016, "global_step": 386012, "epoch": 2297} {"train_loss": -12.063751220703125, "global_step": 386013, "epoch": 2297} {"train_loss": -12.346349716186523, "global_step": 386014, "epoch": 2297} {"train_loss": -12.172150611877441, "global_step": 386015, "epoch": 2297} {"train_loss": -12.150959014892578, "global_step": 386016, "epoch": 2297} {"train_loss": -11.920008659362793, "global_step": 386017, "epoch": 2297} {"train_loss": -12.505159378051758, "global_step": 386018, "epoch": 2297} {"train_loss": -11.76097297668457, "global_step": 386019, "epoch": 2297} {"train_loss": -12.106973648071289, "global_step": 386020, "epoch": 2297} {"train_loss": -12.117010116577148, "global_step": 386021, "epoch": 2297} {"train_loss": -12.197525024414062, "global_step": 386022, "epoch": 2297} {"train_loss": -12.089597702026367, "global_step": 386023, "epoch": 2297} {"train_loss": -12.30803108215332, "global_step": 386024, "epoch": 2297} {"train_loss": -12.445146560668945, "global_step": 386025, "epoch": 2297} {"train_loss": -12.636249542236328, "global_step": 386026, "epoch": 2297} {"train_loss": -12.645469665527344, "global_step": 386027, "epoch": 2297} {"train_loss": -12.312764167785645, "global_step": 386028, "epoch": 2297} {"train_loss": -12.484247207641602, "global_step": 386029, "epoch": 2297} {"train_loss": -12.401792526245117, "global_step": 386030, "epoch": 2297} {"train_loss": -12.020947456359863, "global_step": 386031, "epoch": 2297} {"train_loss": -12.292036056518555, "global_step": 386032, "epoch": 2297} {"train_loss": -12.386528015136719, "global_step": 386033, "epoch": 2297} {"train_loss": -12.567651748657227, "global_step": 386034, "epoch": 2297} {"train_loss": -12.178573608398438, "global_step": 386035, "epoch": 2297} {"train_loss": -12.674063682556152, "global_step": 386036, "epoch": 2297} {"train_loss": -11.994915962219238, "global_step": 386037, "epoch": 2297} {"train_loss": -11.984670639038086, "global_step": 386038, "epoch": 2297} {"train_loss": -11.572553634643555, "global_step": 386039, "epoch": 2297} {"train_loss": -12.266911506652832, "global_step": 386040, "epoch": 2297} {"train_loss": -11.780659675598145, "global_step": 386041, "epoch": 2297} {"train_loss": -11.502084732055664, "global_step": 386042, "epoch": 2297} {"train_loss": -12.298284530639648, "global_step": 386043, "epoch": 2297} {"train_loss": -12.556105613708496, "global_step": 386044, "epoch": 2297} {"train_loss": -12.393621444702148, "global_step": 386045, "epoch": 2297} {"train_loss": -12.536101341247559, "global_step": 386046, "epoch": 2297} {"train_loss": -12.38416862487793, "global_step": 386047, "epoch": 2297} {"train_loss": -11.833044052124023, "global_step": 386048, "epoch": 2297} {"train_loss": -11.687394142150879, "global_step": 386049, "epoch": 2297} {"train_loss": -12.241101264953613, "global_step": 386050, "epoch": 2297} {"train_loss": -11.96227741241455, "global_step": 386051, "epoch": 2297} {"train_loss": -11.843807220458984, "global_step": 386052, "epoch": 2297} {"train_loss": -12.47470760345459, "global_step": 386053, "epoch": 2297} {"train_loss": -12.300863265991211, "global_step": 386054, "epoch": 2297} {"train_loss": -11.932064056396484, "global_step": 386055, "epoch": 2297} {"train_loss": -12.505600929260254, "global_step": 386056, "epoch": 2297} {"train_loss": -12.496058464050293, "global_step": 386057, "epoch": 2297} {"train_loss": -12.486017227172852, "global_step": 386058, "epoch": 2297} {"train_loss": -12.308351516723633, "global_step": 386059, "epoch": 2297} {"train_loss": -11.84627914428711, "global_step": 386060, "epoch": 2297} {"train_loss": -12.472214698791504, "global_step": 386061, "epoch": 2297} {"train_loss": -12.162824630737305, "global_step": 386062, "epoch": 2297} {"train_loss": -12.236594069571723, "global_step": 386063, "epoch": 2297, "val_loss": 296134.4375} {"train_loss": -11.742341995239258, "global_step": 386064, "epoch": 2298} {"train_loss": -12.206405639648438, "global_step": 386065, "epoch": 2298} {"train_loss": -12.35201644897461, "global_step": 386066, "epoch": 2298} {"train_loss": -12.742610931396484, "global_step": 386067, "epoch": 2298} {"train_loss": -12.452692031860352, "global_step": 386068, "epoch": 2298} {"train_loss": -12.442705154418945, "global_step": 386069, "epoch": 2298} {"train_loss": -12.710168838500977, "global_step": 386070, "epoch": 2298} {"train_loss": -12.594890594482422, "global_step": 386071, "epoch": 2298} {"train_loss": -12.593048095703125, "global_step": 386072, "epoch": 2298} {"train_loss": -12.57642936706543, "global_step": 386073, "epoch": 2298} {"train_loss": -12.517648696899414, "global_step": 386074, "epoch": 2298} {"train_loss": -12.661649703979492, "global_step": 386075, "epoch": 2298} {"train_loss": -12.815179824829102, "global_step": 386076, "epoch": 2298} {"train_loss": -12.535303115844727, "global_step": 386077, "epoch": 2298} {"train_loss": -12.516593933105469, "global_step": 386078, "epoch": 2298} {"train_loss": -12.472782135009766, "global_step": 386079, "epoch": 2298} {"train_loss": -12.465346336364746, "global_step": 386080, "epoch": 2298} {"train_loss": -12.418204307556152, "global_step": 386081, "epoch": 2298} {"train_loss": -11.434560775756836, "global_step": 386082, "epoch": 2298} {"train_loss": -12.54619312286377, "global_step": 386083, "epoch": 2298} {"train_loss": -11.072312355041504, "global_step": 386084, "epoch": 2298} {"train_loss": -11.37822437286377, "global_step": 386085, "epoch": 2298} {"train_loss": -11.000602722167969, "global_step": 386086, "epoch": 2298} {"train_loss": -11.636293411254883, "global_step": 386087, "epoch": 2298} {"train_loss": -11.701635360717773, "global_step": 386088, "epoch": 2298} {"train_loss": -11.13078498840332, "global_step": 386089, "epoch": 2298} {"train_loss": -10.570005416870117, "global_step": 386090, "epoch": 2298} {"train_loss": -12.473970413208008, "global_step": 386091, "epoch": 2298} {"train_loss": -11.206241607666016, "global_step": 386092, "epoch": 2298} {"train_loss": -11.317561149597168, "global_step": 386093, "epoch": 2298} {"train_loss": -12.111825942993164, "global_step": 386094, "epoch": 2298} {"train_loss": -10.974773406982422, "global_step": 386095, "epoch": 2298} {"train_loss": -11.103793144226074, "global_step": 386096, "epoch": 2298} {"train_loss": -12.007267951965332, "global_step": 386097, "epoch": 2298} {"train_loss": -11.22675609588623, "global_step": 386098, "epoch": 2298} {"train_loss": -10.253761291503906, "global_step": 386099, "epoch": 2298} {"train_loss": -11.501936912536621, "global_step": 386100, "epoch": 2298} {"train_loss": -10.970428466796875, "global_step": 386101, "epoch": 2298} {"train_loss": -10.307311058044434, "global_step": 386102, "epoch": 2298} {"train_loss": -11.286375999450684, "global_step": 386103, "epoch": 2298} {"train_loss": -9.886521339416504, "global_step": 386104, "epoch": 2298} {"train_loss": -11.413093566894531, "global_step": 386105, "epoch": 2298} {"train_loss": -11.319770812988281, "global_step": 386106, "epoch": 2298} {"train_loss": -11.78449821472168, "global_step": 386107, "epoch": 2298} {"train_loss": -10.642790794372559, "global_step": 386108, "epoch": 2298} {"train_loss": -11.921646118164062, "global_step": 386109, "epoch": 2298} {"train_loss": -10.91402816772461, "global_step": 386110, "epoch": 2298} {"train_loss": -10.290628433227539, "global_step": 386111, "epoch": 2298} {"train_loss": -10.837995529174805, "global_step": 386112, "epoch": 2298} {"train_loss": -10.74888801574707, "global_step": 386113, "epoch": 2298} {"train_loss": -11.390427589416504, "global_step": 386114, "epoch": 2298} {"train_loss": -11.083213806152344, "global_step": 386115, "epoch": 2298} {"train_loss": -11.547441482543945, "global_step": 386116, "epoch": 2298} {"train_loss": -11.017377853393555, "global_step": 386117, "epoch": 2298} {"train_loss": -11.739906311035156, "global_step": 386118, "epoch": 2298} {"train_loss": -11.69843864440918, "global_step": 386119, "epoch": 2298} {"train_loss": -11.914640426635742, "global_step": 386120, "epoch": 2298} {"train_loss": -11.777247428894043, "global_step": 386121, "epoch": 2298} {"train_loss": -11.439193725585938, "global_step": 386122, "epoch": 2298} {"train_loss": -11.929311752319336, "global_step": 386123, "epoch": 2298} {"train_loss": -11.865442276000977, "global_step": 386124, "epoch": 2298} {"train_loss": -11.945884704589844, "global_step": 386125, "epoch": 2298} {"train_loss": -11.886143684387207, "global_step": 386126, "epoch": 2298} {"train_loss": -11.292342185974121, "global_step": 386127, "epoch": 2298} {"train_loss": -11.571057319641113, "global_step": 386128, "epoch": 2298} {"train_loss": -11.938215255737305, "global_step": 386129, "epoch": 2298} {"train_loss": -11.586400985717773, "global_step": 386130, "epoch": 2298} {"train_loss": -12.214802742004395, "global_step": 386131, "epoch": 2298} {"train_loss": -11.524466514587402, "global_step": 386132, "epoch": 2298} {"train_loss": -11.95366096496582, "global_step": 386133, "epoch": 2298} {"train_loss": -11.744555473327637, "global_step": 386134, "epoch": 2298} {"train_loss": -11.870340347290039, "global_step": 386135, "epoch": 2298} {"train_loss": -12.100202560424805, "global_step": 386136, "epoch": 2298} {"train_loss": -12.082635879516602, "global_step": 386137, "epoch": 2298} {"train_loss": -12.122722625732422, "global_step": 386138, "epoch": 2298} {"train_loss": -12.2445707321167, "global_step": 386139, "epoch": 2298} {"train_loss": -12.424955368041992, "global_step": 386140, "epoch": 2298} {"train_loss": -12.363929748535156, "global_step": 386141, "epoch": 2298} {"train_loss": -12.275672912597656, "global_step": 386142, "epoch": 2298} {"train_loss": -12.363670349121094, "global_step": 386143, "epoch": 2298} {"train_loss": -12.245567321777344, "global_step": 386144, "epoch": 2298} {"train_loss": -12.396767616271973, "global_step": 386145, "epoch": 2298} {"train_loss": -12.153430938720703, "global_step": 386146, "epoch": 2298} {"train_loss": -12.271987915039062, "global_step": 386147, "epoch": 2298} {"train_loss": -12.424125671386719, "global_step": 386148, "epoch": 2298} {"train_loss": -12.173856735229492, "global_step": 386149, "epoch": 2298} {"train_loss": -12.520298957824707, "global_step": 386150, "epoch": 2298} {"train_loss": -12.318184852600098, "global_step": 386151, "epoch": 2298} {"train_loss": -12.374580383300781, "global_step": 386152, "epoch": 2298} {"train_loss": -12.248872756958008, "global_step": 386153, "epoch": 2298} {"train_loss": -12.224508285522461, "global_step": 386154, "epoch": 2298} {"train_loss": -12.390697479248047, "global_step": 386155, "epoch": 2298} {"train_loss": -12.120149612426758, "global_step": 386156, "epoch": 2298} {"train_loss": -12.633378982543945, "global_step": 386157, "epoch": 2298} {"train_loss": -12.438087463378906, "global_step": 386158, "epoch": 2298} {"train_loss": -12.414348602294922, "global_step": 386159, "epoch": 2298} {"train_loss": -12.234392166137695, "global_step": 386160, "epoch": 2298} {"train_loss": -12.642290115356445, "global_step": 386161, "epoch": 2298} {"train_loss": -12.216201782226562, "global_step": 386162, "epoch": 2298} {"train_loss": -12.550491333007812, "global_step": 386163, "epoch": 2298} {"train_loss": -12.224191665649414, "global_step": 386164, "epoch": 2298} {"train_loss": -12.338467597961426, "global_step": 386165, "epoch": 2298} {"train_loss": -12.52452278137207, "global_step": 386166, "epoch": 2298} {"train_loss": -11.960162162780762, "global_step": 386167, "epoch": 2298} {"train_loss": -12.369482040405273, "global_step": 386168, "epoch": 2298} {"train_loss": -12.44327449798584, "global_step": 386169, "epoch": 2298} {"train_loss": -12.449302673339844, "global_step": 386170, "epoch": 2298} {"train_loss": -12.563359260559082, "global_step": 386171, "epoch": 2298} {"train_loss": -12.536073684692383, "global_step": 386172, "epoch": 2298} {"train_loss": -12.648717880249023, "global_step": 386173, "epoch": 2298} {"train_loss": -12.664885520935059, "global_step": 386174, "epoch": 2298} {"train_loss": -12.483072280883789, "global_step": 386175, "epoch": 2298} {"train_loss": -12.564179420471191, "global_step": 386176, "epoch": 2298} {"train_loss": -12.569226264953613, "global_step": 386177, "epoch": 2298} {"train_loss": -12.522212028503418, "global_step": 386178, "epoch": 2298} {"train_loss": -12.613001823425293, "global_step": 386179, "epoch": 2298} {"train_loss": -12.370519638061523, "global_step": 386180, "epoch": 2298} {"train_loss": -12.728137969970703, "global_step": 386181, "epoch": 2298} {"train_loss": -12.894279479980469, "global_step": 386182, "epoch": 2298} {"train_loss": -12.638845443725586, "global_step": 386183, "epoch": 2298} {"train_loss": -12.877907752990723, "global_step": 386184, "epoch": 2298} {"train_loss": -12.5930757522583, "global_step": 386185, "epoch": 2298} {"train_loss": -12.599167823791504, "global_step": 386186, "epoch": 2298} {"train_loss": -12.600784301757812, "global_step": 386187, "epoch": 2298} {"train_loss": -12.394350051879883, "global_step": 386188, "epoch": 2298} {"train_loss": -12.608312606811523, "global_step": 386189, "epoch": 2298} {"train_loss": -12.411493301391602, "global_step": 386190, "epoch": 2298} {"train_loss": -12.461071968078613, "global_step": 386191, "epoch": 2298} {"train_loss": -11.354158401489258, "global_step": 386192, "epoch": 2298} {"train_loss": -12.457587242126465, "global_step": 386193, "epoch": 2298} {"train_loss": -11.768494606018066, "global_step": 386194, "epoch": 2298} {"train_loss": -11.07502555847168, "global_step": 386195, "epoch": 2298} {"train_loss": -12.468095779418945, "global_step": 386196, "epoch": 2298} {"train_loss": -12.221992492675781, "global_step": 386197, "epoch": 2298} {"train_loss": -11.288647651672363, "global_step": 386198, "epoch": 2298} {"train_loss": -11.469655990600586, "global_step": 386199, "epoch": 2298} {"train_loss": -12.369522094726562, "global_step": 386200, "epoch": 2298} {"train_loss": -11.269177436828613, "global_step": 386201, "epoch": 2298} {"train_loss": -12.134669303894043, "global_step": 386202, "epoch": 2298} {"train_loss": -11.468297004699707, "global_step": 386203, "epoch": 2298} {"train_loss": -11.272150039672852, "global_step": 386204, "epoch": 2298} {"train_loss": -12.26365852355957, "global_step": 386205, "epoch": 2298} {"train_loss": -10.657928466796875, "global_step": 386206, "epoch": 2298} {"train_loss": -12.226032257080078, "global_step": 386207, "epoch": 2298} {"train_loss": -11.67418384552002, "global_step": 386208, "epoch": 2298} {"train_loss": -10.473390579223633, "global_step": 386209, "epoch": 2298} {"train_loss": -12.023181915283203, "global_step": 386210, "epoch": 2298} {"train_loss": -11.243942260742188, "global_step": 386211, "epoch": 2298} {"train_loss": -10.677393913269043, "global_step": 386212, "epoch": 2298} {"train_loss": -10.651219367980957, "global_step": 386213, "epoch": 2298} {"train_loss": -10.871037483215332, "global_step": 386214, "epoch": 2298} {"train_loss": -10.836246490478516, "global_step": 386215, "epoch": 2298} {"train_loss": -9.002021789550781, "global_step": 386216, "epoch": 2298} {"train_loss": -11.300825119018555, "global_step": 386217, "epoch": 2298} {"train_loss": -10.021970748901367, "global_step": 386218, "epoch": 2298} {"train_loss": -9.021405220031738, "global_step": 386219, "epoch": 2298} {"train_loss": -10.060622215270996, "global_step": 386220, "epoch": 2298} {"train_loss": -10.058389663696289, "global_step": 386221, "epoch": 2298} {"train_loss": -10.077937126159668, "global_step": 386222, "epoch": 2298} {"train_loss": -10.153205871582031, "global_step": 386223, "epoch": 2298} {"train_loss": -11.050349235534668, "global_step": 386224, "epoch": 2298} {"train_loss": -11.536091804504395, "global_step": 386225, "epoch": 2298} {"train_loss": -9.100225448608398, "global_step": 386226, "epoch": 2298} {"train_loss": -11.097474098205566, "global_step": 386227, "epoch": 2298} {"train_loss": -11.349519729614258, "global_step": 386228, "epoch": 2298} {"train_loss": -10.79777717590332, "global_step": 386229, "epoch": 2298} {"train_loss": -11.621582984924316, "global_step": 386230, "epoch": 2298} {"train_loss": -11.784266545659019, "global_step": 386231, "epoch": 2298, "val_loss": 289731.0} {"train_loss": -12.189653396606445, "global_step": 386232, "epoch": 2299} {"train_loss": -11.314669609069824, "global_step": 386233, "epoch": 2299} {"train_loss": -11.398645401000977, "global_step": 386234, "epoch": 2299} {"train_loss": -12.011372566223145, "global_step": 386235, "epoch": 2299} {"train_loss": -11.007282257080078, "global_step": 386236, "epoch": 2299} {"train_loss": -12.004100799560547, "global_step": 386237, "epoch": 2299} {"train_loss": -11.737424850463867, "global_step": 386238, "epoch": 2299} {"train_loss": -11.62276840209961, "global_step": 386239, "epoch": 2299} {"train_loss": -12.056903839111328, "global_step": 386240, "epoch": 2299} {"train_loss": -11.486522674560547, "global_step": 386241, "epoch": 2299} {"train_loss": -11.95020866394043, "global_step": 386242, "epoch": 2299} {"train_loss": -11.948346138000488, "global_step": 386243, "epoch": 2299} {"train_loss": -11.654972076416016, "global_step": 386244, "epoch": 2299} {"train_loss": -11.803112030029297, "global_step": 386245, "epoch": 2299} {"train_loss": -11.913736343383789, "global_step": 386246, "epoch": 2299} {"train_loss": -11.846695899963379, "global_step": 386247, "epoch": 2299} {"train_loss": -11.675846099853516, "global_step": 386248, "epoch": 2299} {"train_loss": -11.474093437194824, "global_step": 386249, "epoch": 2299} {"train_loss": -12.10441780090332, "global_step": 386250, "epoch": 2299} {"train_loss": -11.673799514770508, "global_step": 386251, "epoch": 2299} {"train_loss": -11.57310676574707, "global_step": 386252, "epoch": 2299} {"train_loss": -12.218470573425293, "global_step": 386253, "epoch": 2299} {"train_loss": -11.800333023071289, "global_step": 386254, "epoch": 2299} {"train_loss": -11.450536727905273, "global_step": 386255, "epoch": 2299} {"train_loss": -11.995041847229004, "global_step": 386256, "epoch": 2299} {"train_loss": -11.774147033691406, "global_step": 386257, "epoch": 2299} {"train_loss": -11.769723892211914, "global_step": 386258, "epoch": 2299} {"train_loss": -12.207042694091797, "global_step": 386259, "epoch": 2299} {"train_loss": -11.686788558959961, "global_step": 386260, "epoch": 2299} {"train_loss": -12.325078964233398, "global_step": 386261, "epoch": 2299} {"train_loss": -12.023569107055664, "global_step": 386262, "epoch": 2299} {"train_loss": -12.336647033691406, "global_step": 386263, "epoch": 2299} {"train_loss": -12.427321434020996, "global_step": 386264, "epoch": 2299} {"train_loss": -12.26657772064209, "global_step": 386265, "epoch": 2299} {"train_loss": -12.305055618286133, "global_step": 386266, "epoch": 2299} {"train_loss": -12.250894546508789, "global_step": 386267, "epoch": 2299} {"train_loss": -12.39055347442627, "global_step": 386268, "epoch": 2299} {"train_loss": -12.118997573852539, "global_step": 386269, "epoch": 2299} {"train_loss": -12.468629837036133, "global_step": 386270, "epoch": 2299} {"train_loss": -12.22458267211914, "global_step": 386271, "epoch": 2299} {"train_loss": -12.20004653930664, "global_step": 386272, "epoch": 2299} {"train_loss": -12.257671356201172, "global_step": 386273, "epoch": 2299} {"train_loss": -12.629730224609375, "global_step": 386274, "epoch": 2299} {"train_loss": -12.437540054321289, "global_step": 386275, "epoch": 2299} {"train_loss": -12.311643600463867, "global_step": 386276, "epoch": 2299} {"train_loss": -12.308348655700684, "global_step": 386277, "epoch": 2299} {"train_loss": -12.460420608520508, "global_step": 386278, "epoch": 2299} {"train_loss": -12.60719108581543, "global_step": 386279, "epoch": 2299} {"train_loss": -12.612180709838867, "global_step": 386280, "epoch": 2299} {"train_loss": -12.519786834716797, "global_step": 386281, "epoch": 2299} {"train_loss": -12.709156036376953, "global_step": 386282, "epoch": 2299} {"train_loss": -12.673513412475586, "global_step": 386283, "epoch": 2299} {"train_loss": -12.623897552490234, "global_step": 386284, "epoch": 2299} {"train_loss": -12.53805160522461, "global_step": 386285, "epoch": 2299} {"train_loss": -12.470117568969727, "global_step": 386286, "epoch": 2299} {"train_loss": -12.470726013183594, "global_step": 386287, "epoch": 2299} {"train_loss": -12.651359558105469, "global_step": 386288, "epoch": 2299} {"train_loss": -12.559141159057617, "global_step": 386289, "epoch": 2299} {"train_loss": -12.353271484375, "global_step": 386290, "epoch": 2299} {"train_loss": -12.49641227722168, "global_step": 386291, "epoch": 2299} {"train_loss": -12.573006629943848, "global_step": 386292, "epoch": 2299} {"train_loss": -12.555929183959961, "global_step": 386293, "epoch": 2299} {"train_loss": -12.234427452087402, "global_step": 386294, "epoch": 2299} {"train_loss": -12.211348533630371, "global_step": 386295, "epoch": 2299} {"train_loss": -12.491506576538086, "global_step": 386296, "epoch": 2299} {"train_loss": -12.188572883605957, "global_step": 386297, "epoch": 2299} {"train_loss": -12.442159652709961, "global_step": 386298, "epoch": 2299} {"train_loss": -12.414278030395508, "global_step": 386299, "epoch": 2299} {"train_loss": -12.541221618652344, "global_step": 386300, "epoch": 2299} {"train_loss": -12.430265426635742, "global_step": 386301, "epoch": 2299} {"train_loss": -12.272043228149414, "global_step": 386302, "epoch": 2299} {"train_loss": -11.459736824035645, "global_step": 386303, "epoch": 2299} {"train_loss": -12.1013765335083, "global_step": 386304, "epoch": 2299} {"train_loss": -12.275362014770508, "global_step": 386305, "epoch": 2299} {"train_loss": -11.655052185058594, "global_step": 386306, "epoch": 2299} {"train_loss": -11.105297088623047, "global_step": 386307, "epoch": 2299} {"train_loss": -12.171414375305176, "global_step": 386308, "epoch": 2299} {"train_loss": -10.55656909942627, "global_step": 386309, "epoch": 2299} {"train_loss": -11.419507026672363, "global_step": 386310, "epoch": 2299} {"train_loss": -12.219922065734863, "global_step": 386311, "epoch": 2299} {"train_loss": -10.838560104370117, "global_step": 386312, "epoch": 2299} {"train_loss": -11.081878662109375, "global_step": 386313, "epoch": 2299} {"train_loss": -10.695219993591309, "global_step": 386314, "epoch": 2299} {"train_loss": -11.013481140136719, "global_step": 386315, "epoch": 2299} {"train_loss": -11.951677322387695, "global_step": 386316, "epoch": 2299} {"train_loss": -11.627588272094727, "global_step": 386317, "epoch": 2299} {"train_loss": -11.38175106048584, "global_step": 386318, "epoch": 2299} {"train_loss": -11.612071990966797, "global_step": 386319, "epoch": 2299} {"train_loss": -11.109834671020508, "global_step": 386320, "epoch": 2299} {"train_loss": -10.870124816894531, "global_step": 386321, "epoch": 2299} {"train_loss": -10.659772872924805, "global_step": 386322, "epoch": 2299} {"train_loss": -12.221893310546875, "global_step": 386323, "epoch": 2299} {"train_loss": -11.109355926513672, "global_step": 386324, "epoch": 2299} {"train_loss": -11.38341236114502, "global_step": 386325, "epoch": 2299} {"train_loss": -11.249719619750977, "global_step": 386326, "epoch": 2299} {"train_loss": -11.149601936340332, "global_step": 386327, "epoch": 2299} {"train_loss": -10.741645812988281, "global_step": 386328, "epoch": 2299} {"train_loss": -11.630231857299805, "global_step": 386329, "epoch": 2299} {"train_loss": -10.674884796142578, "global_step": 386330, "epoch": 2299} {"train_loss": -11.00369930267334, "global_step": 386331, "epoch": 2299} {"train_loss": -11.78322982788086, "global_step": 386332, "epoch": 2299} {"train_loss": -11.11075210571289, "global_step": 386333, "epoch": 2299} {"train_loss": -11.243452072143555, "global_step": 386334, "epoch": 2299} {"train_loss": -11.088112831115723, "global_step": 386335, "epoch": 2299} {"train_loss": -10.216584205627441, "global_step": 386336, "epoch": 2299} {"train_loss": -9.82696533203125, "global_step": 386337, "epoch": 2299} {"train_loss": -10.456937789916992, "global_step": 386338, "epoch": 2299} {"train_loss": -11.746999740600586, "global_step": 386339, "epoch": 2299} {"train_loss": -10.41324234008789, "global_step": 386340, "epoch": 2299} {"train_loss": -10.925859451293945, "global_step": 386341, "epoch": 2299} {"train_loss": -11.399118423461914, "global_step": 386342, "epoch": 2299} {"train_loss": -11.490507125854492, "global_step": 386343, "epoch": 2299} {"train_loss": -10.875898361206055, "global_step": 386344, "epoch": 2299} {"train_loss": -11.927536010742188, "global_step": 386345, "epoch": 2299} {"train_loss": -10.911224365234375, "global_step": 386346, "epoch": 2299} {"train_loss": -11.41651725769043, "global_step": 386347, "epoch": 2299} {"train_loss": -11.518942832946777, "global_step": 386348, "epoch": 2299} {"train_loss": -11.356302261352539, "global_step": 386349, "epoch": 2299} {"train_loss": -11.95022964477539, "global_step": 386350, "epoch": 2299} {"train_loss": -11.833368301391602, "global_step": 386351, "epoch": 2299} {"train_loss": -11.689330101013184, "global_step": 386352, "epoch": 2299} {"train_loss": -11.801027297973633, "global_step": 386353, "epoch": 2299} {"train_loss": -12.072225570678711, "global_step": 386354, "epoch": 2299} {"train_loss": -11.693317413330078, "global_step": 386355, "epoch": 2299} {"train_loss": -12.076820373535156, "global_step": 386356, "epoch": 2299} {"train_loss": -11.449969291687012, "global_step": 386357, "epoch": 2299} {"train_loss": -11.82863998413086, "global_step": 386358, "epoch": 2299} {"train_loss": -11.96851921081543, "global_step": 386359, "epoch": 2299} {"train_loss": -11.708478927612305, "global_step": 386360, "epoch": 2299} {"train_loss": -12.04578685760498, "global_step": 386361, "epoch": 2299} {"train_loss": -12.10458755493164, "global_step": 386362, "epoch": 2299} {"train_loss": -11.920677185058594, "global_step": 386363, "epoch": 2299} {"train_loss": -12.341184616088867, "global_step": 386364, "epoch": 2299} {"train_loss": -12.010397911071777, "global_step": 386365, "epoch": 2299} {"train_loss": -12.04848861694336, "global_step": 386366, "epoch": 2299} {"train_loss": -12.063709259033203, "global_step": 386367, "epoch": 2299} {"train_loss": -11.866809844970703, "global_step": 386368, "epoch": 2299} {"train_loss": -12.26645565032959, "global_step": 386369, "epoch": 2299} {"train_loss": -12.047462463378906, "global_step": 386370, "epoch": 2299} {"train_loss": -12.093027114868164, "global_step": 386371, "epoch": 2299} {"train_loss": -12.161308288574219, "global_step": 386372, "epoch": 2299} {"train_loss": -12.169671058654785, "global_step": 386373, "epoch": 2299} {"train_loss": -12.235883712768555, "global_step": 386374, "epoch": 2299} {"train_loss": -12.213932991027832, "global_step": 386375, "epoch": 2299} {"train_loss": -12.311540603637695, "global_step": 386376, "epoch": 2299} {"train_loss": -12.150253295898438, "global_step": 386377, "epoch": 2299} {"train_loss": -12.32503890991211, "global_step": 386378, "epoch": 2299} {"train_loss": -12.168375015258789, "global_step": 386379, "epoch": 2299} {"train_loss": -12.446245193481445, "global_step": 386380, "epoch": 2299} {"train_loss": -12.358823776245117, "global_step": 386381, "epoch": 2299} {"train_loss": -12.336143493652344, "global_step": 386382, "epoch": 2299} {"train_loss": -12.263103485107422, "global_step": 386383, "epoch": 2299} {"train_loss": -12.176519393920898, "global_step": 386384, "epoch": 2299} {"train_loss": -12.109331130981445, "global_step": 386385, "epoch": 2299} {"train_loss": -12.457460403442383, "global_step": 386386, "epoch": 2299} {"train_loss": -12.377690315246582, "global_step": 386387, "epoch": 2299} {"train_loss": -12.452455520629883, "global_step": 386388, "epoch": 2299} {"train_loss": -12.62525749206543, "global_step": 386389, "epoch": 2299} {"train_loss": -12.239395141601562, "global_step": 386390, "epoch": 2299} {"train_loss": -12.492128372192383, "global_step": 386391, "epoch": 2299} {"train_loss": -12.444332122802734, "global_step": 386392, "epoch": 2299} {"train_loss": -12.497101783752441, "global_step": 386393, "epoch": 2299} {"train_loss": -12.483711242675781, "global_step": 386394, "epoch": 2299} {"train_loss": -12.464909553527832, "global_step": 386395, "epoch": 2299} {"train_loss": -12.565196990966797, "global_step": 386396, "epoch": 2299} {"train_loss": -12.562929153442383, "global_step": 386397, "epoch": 2299} {"train_loss": -12.58806324005127, "global_step": 386398, "epoch": 2299} {"train_loss": -11.90791240192595, "global_step": 386399, "epoch": 2299, "val_loss": 297233.96875} {"train_loss": -12.664493560791016, "global_step": 386400, "epoch": 2300} {"train_loss": -12.485244750976562, "global_step": 386401, "epoch": 2300} {"train_loss": -12.715831756591797, "global_step": 386402, "epoch": 2300} {"train_loss": -12.557130813598633, "global_step": 386403, "epoch": 2300} {"train_loss": -12.635354995727539, "global_step": 386404, "epoch": 2300} {"train_loss": -12.540407180786133, "global_step": 386405, "epoch": 2300} {"train_loss": -12.541218757629395, "global_step": 386406, "epoch": 2300} {"train_loss": -12.581899642944336, "global_step": 386407, "epoch": 2300} {"train_loss": -12.487771987915039, "global_step": 386408, "epoch": 2300} {"train_loss": -12.50737190246582, "global_step": 386409, "epoch": 2300} {"train_loss": -12.384256362915039, "global_step": 386410, "epoch": 2300} {"train_loss": -12.083264350891113, "global_step": 386411, "epoch": 2300} {"train_loss": -11.93293571472168, "global_step": 386412, "epoch": 2300} {"train_loss": -12.217833518981934, "global_step": 386413, "epoch": 2300} {"train_loss": -11.316277503967285, "global_step": 386414, "epoch": 2300} {"train_loss": -12.066577911376953, "global_step": 386415, "epoch": 2300} {"train_loss": -11.893752098083496, "global_step": 386416, "epoch": 2300} {"train_loss": -12.221956253051758, "global_step": 386417, "epoch": 2300} {"train_loss": -11.058965682983398, "global_step": 386418, "epoch": 2300} {"train_loss": -12.726007461547852, "global_step": 386419, "epoch": 2300} {"train_loss": -11.473767280578613, "global_step": 386420, "epoch": 2300} {"train_loss": -12.227363586425781, "global_step": 386421, "epoch": 2300} {"train_loss": -12.173835754394531, "global_step": 386422, "epoch": 2300} {"train_loss": -12.066530227661133, "global_step": 386423, "epoch": 2300} {"train_loss": -12.013895034790039, "global_step": 386424, "epoch": 2300} {"train_loss": -12.44392204284668, "global_step": 386425, "epoch": 2300} {"train_loss": -11.430612564086914, "global_step": 386426, "epoch": 2300} {"train_loss": -12.536697387695312, "global_step": 386427, "epoch": 2300} {"train_loss": -12.26198673248291, "global_step": 386428, "epoch": 2300} {"train_loss": -11.078009605407715, "global_step": 386429, "epoch": 2300} {"train_loss": -11.121317863464355, "global_step": 386430, "epoch": 2300} {"train_loss": -11.392845153808594, "global_step": 386431, "epoch": 2300} {"train_loss": -9.013022422790527, "global_step": 386432, "epoch": 2300} {"train_loss": -9.822250366210938, "global_step": 386433, "epoch": 2300} {"train_loss": -9.774620056152344, "global_step": 386434, "epoch": 2300} {"train_loss": -11.414072036743164, "global_step": 386435, "epoch": 2300} {"train_loss": -11.106866836547852, "global_step": 386436, "epoch": 2300} {"train_loss": -10.745401382446289, "global_step": 386437, "epoch": 2300} {"train_loss": -11.199357032775879, "global_step": 386438, "epoch": 2300} {"train_loss": -11.108663558959961, "global_step": 386439, "epoch": 2300} {"train_loss": -11.49630069732666, "global_step": 386440, "epoch": 2300} {"train_loss": -11.689865112304688, "global_step": 386441, "epoch": 2300} {"train_loss": -11.697771072387695, "global_step": 386442, "epoch": 2300} {"train_loss": -11.82961654663086, "global_step": 386443, "epoch": 2300} {"train_loss": -11.646954536437988, "global_step": 386444, "epoch": 2300} {"train_loss": -12.275774955749512, "global_step": 386445, "epoch": 2300} {"train_loss": -11.723478317260742, "global_step": 386446, "epoch": 2300} {"train_loss": -12.285444259643555, "global_step": 386447, "epoch": 2300} {"train_loss": -11.496307373046875, "global_step": 386448, "epoch": 2300} {"train_loss": -12.154752731323242, "global_step": 386449, "epoch": 2300} {"train_loss": -11.69792366027832, "global_step": 386450, "epoch": 2300} {"train_loss": -11.952767372131348, "global_step": 386451, "epoch": 2300} {"train_loss": -11.958751678466797, "global_step": 386452, "epoch": 2300} {"train_loss": -12.318559646606445, "global_step": 386453, "epoch": 2300} {"train_loss": -12.353212356567383, "global_step": 386454, "epoch": 2300} {"train_loss": -12.014945983886719, "global_step": 386455, "epoch": 2300} {"train_loss": -11.80328369140625, "global_step": 386456, "epoch": 2300} {"train_loss": -12.063358306884766, "global_step": 386457, "epoch": 2300} {"train_loss": -11.86967945098877, "global_step": 386458, "epoch": 2300} {"train_loss": -12.025816917419434, "global_step": 386459, "epoch": 2300} {"train_loss": -12.014463424682617, "global_step": 386460, "epoch": 2300} {"train_loss": -12.309610366821289, "global_step": 386461, "epoch": 2300} {"train_loss": -12.287399291992188, "global_step": 386462, "epoch": 2300} {"train_loss": -12.393614768981934, "global_step": 386463, "epoch": 2300} {"train_loss": -12.40291690826416, "global_step": 386464, "epoch": 2300} {"train_loss": -12.173248291015625, "global_step": 386465, "epoch": 2300} {"train_loss": -12.293622970581055, "global_step": 386466, "epoch": 2300} {"train_loss": -12.35179615020752, "global_step": 386467, "epoch": 2300} {"train_loss": -12.32286262512207, "global_step": 386468, "epoch": 2300} {"train_loss": -12.006669998168945, "global_step": 386469, "epoch": 2300} {"train_loss": -12.295318603515625, "global_step": 386470, "epoch": 2300} {"train_loss": -12.11449146270752, "global_step": 386471, "epoch": 2300} {"train_loss": -12.614505767822266, "global_step": 386472, "epoch": 2300} {"train_loss": -12.191576957702637, "global_step": 386473, "epoch": 2300} {"train_loss": -12.694539070129395, "global_step": 386474, "epoch": 2300} {"train_loss": -12.560222625732422, "global_step": 386475, "epoch": 2300} {"train_loss": -12.423359870910645, "global_step": 386476, "epoch": 2300} {"train_loss": -12.250070571899414, "global_step": 386477, "epoch": 2300} {"train_loss": -12.464681625366211, "global_step": 386478, "epoch": 2300} {"train_loss": -12.307167053222656, "global_step": 386479, "epoch": 2300} {"train_loss": -12.567062377929688, "global_step": 386480, "epoch": 2300} {"train_loss": -12.4966402053833, "global_step": 386481, "epoch": 2300} {"train_loss": -12.592174530029297, "global_step": 386482, "epoch": 2300} {"train_loss": -12.777449607849121, "global_step": 386483, "epoch": 2300} {"train_loss": -12.55227279663086, "global_step": 386484, "epoch": 2300} {"train_loss": -12.620109558105469, "global_step": 386485, "epoch": 2300} {"train_loss": -12.698711395263672, "global_step": 386486, "epoch": 2300} {"train_loss": -12.573197364807129, "global_step": 386487, "epoch": 2300} {"train_loss": -12.485980033874512, "global_step": 386488, "epoch": 2300} {"train_loss": -12.7383451461792, "global_step": 386489, "epoch": 2300} {"train_loss": -12.646422386169434, "global_step": 386490, "epoch": 2300} {"train_loss": -12.414862632751465, "global_step": 386491, "epoch": 2300} {"train_loss": -12.633321762084961, "global_step": 386492, "epoch": 2300} {"train_loss": -12.511397361755371, "global_step": 386493, "epoch": 2300} {"train_loss": -12.64961051940918, "global_step": 386494, "epoch": 2300} {"train_loss": -12.508430480957031, "global_step": 386495, "epoch": 2300} {"train_loss": -12.618985176086426, "global_step": 386496, "epoch": 2300} {"train_loss": -12.506516456604004, "global_step": 386497, "epoch": 2300} {"train_loss": -12.506406784057617, "global_step": 386498, "epoch": 2300} {"train_loss": -12.647891998291016, "global_step": 386499, "epoch": 2300} {"train_loss": -12.61180305480957, "global_step": 386500, "epoch": 2300} {"train_loss": -12.692805290222168, "global_step": 386501, "epoch": 2300} {"train_loss": -12.620834350585938, "global_step": 386502, "epoch": 2300} {"train_loss": -12.462407112121582, "global_step": 386503, "epoch": 2300} {"train_loss": -12.465287208557129, "global_step": 386504, "epoch": 2300} {"train_loss": -12.450994491577148, "global_step": 386505, "epoch": 2300} {"train_loss": -12.285993576049805, "global_step": 386506, "epoch": 2300} {"train_loss": -11.517767906188965, "global_step": 386507, "epoch": 2300} {"train_loss": -11.584493637084961, "global_step": 386508, "epoch": 2300} {"train_loss": -12.511131286621094, "global_step": 386509, "epoch": 2300} {"train_loss": -12.251928329467773, "global_step": 386510, "epoch": 2300} {"train_loss": -11.7335844039917, "global_step": 386511, "epoch": 2300} {"train_loss": -12.558633804321289, "global_step": 386512, "epoch": 2300} {"train_loss": -12.109166145324707, "global_step": 386513, "epoch": 2300} {"train_loss": -11.796802520751953, "global_step": 386514, "epoch": 2300} {"train_loss": -11.605672836303711, "global_step": 386515, "epoch": 2300} {"train_loss": -12.001558303833008, "global_step": 386516, "epoch": 2300} {"train_loss": -11.061086654663086, "global_step": 386517, "epoch": 2300} {"train_loss": -11.628813743591309, "global_step": 386518, "epoch": 2300} {"train_loss": -11.564958572387695, "global_step": 386519, "epoch": 2300} {"train_loss": -11.749452590942383, "global_step": 386520, "epoch": 2300} {"train_loss": -11.358834266662598, "global_step": 386521, "epoch": 2300} {"train_loss": -11.82713794708252, "global_step": 386522, "epoch": 2300} {"train_loss": -10.941997528076172, "global_step": 386523, "epoch": 2300} {"train_loss": -11.97147274017334, "global_step": 386524, "epoch": 2300} {"train_loss": -12.15918254852295, "global_step": 386525, "epoch": 2300} {"train_loss": -10.8504056930542, "global_step": 386526, "epoch": 2300} {"train_loss": -12.044793128967285, "global_step": 386527, "epoch": 2300} {"train_loss": -11.67559814453125, "global_step": 386528, "epoch": 2300} {"train_loss": -10.261343002319336, "global_step": 386529, "epoch": 2300} {"train_loss": -12.450860977172852, "global_step": 386530, "epoch": 2300} {"train_loss": -10.431262969970703, "global_step": 386531, "epoch": 2300} {"train_loss": -12.348142623901367, "global_step": 386532, "epoch": 2300} {"train_loss": -10.841096878051758, "global_step": 386533, "epoch": 2300} {"train_loss": -11.306431770324707, "global_step": 386534, "epoch": 2300} {"train_loss": -12.274412155151367, "global_step": 386535, "epoch": 2300} {"train_loss": -11.313258171081543, "global_step": 386536, "epoch": 2300} {"train_loss": -12.404321670532227, "global_step": 386537, "epoch": 2300} {"train_loss": -12.01087760925293, "global_step": 386538, "epoch": 2300} {"train_loss": -12.316354751586914, "global_step": 386539, "epoch": 2300} {"train_loss": -12.191709518432617, "global_step": 386540, "epoch": 2300} {"train_loss": -11.791620254516602, "global_step": 386541, "epoch": 2300} {"train_loss": -11.996929168701172, "global_step": 386542, "epoch": 2300} {"train_loss": -12.114672660827637, "global_step": 386543, "epoch": 2300} {"train_loss": -12.01489543914795, "global_step": 386544, "epoch": 2300} {"train_loss": -12.031578063964844, "global_step": 386545, "epoch": 2300} {"train_loss": -12.124126434326172, "global_step": 386546, "epoch": 2300} {"train_loss": -12.401874542236328, "global_step": 386547, "epoch": 2300} {"train_loss": -11.822738647460938, "global_step": 386548, "epoch": 2300} {"train_loss": -12.044968605041504, "global_step": 386549, "epoch": 2300} {"train_loss": -12.12375259399414, "global_step": 386550, "epoch": 2300} {"train_loss": -12.122478485107422, "global_step": 386551, "epoch": 2300} {"train_loss": -11.885419845581055, "global_step": 386552, "epoch": 2300} {"train_loss": -11.876630783081055, "global_step": 386553, "epoch": 2300} {"train_loss": -11.942205429077148, "global_step": 386554, "epoch": 2300} {"train_loss": -11.878148078918457, "global_step": 386555, "epoch": 2300} {"train_loss": -11.96929931640625, "global_step": 386556, "epoch": 2300} {"train_loss": -12.029632568359375, "global_step": 386557, "epoch": 2300} {"train_loss": -11.601570129394531, "global_step": 386558, "epoch": 2300} {"train_loss": -11.848712921142578, "global_step": 386559, "epoch": 2300} {"train_loss": -12.37579345703125, "global_step": 386560, "epoch": 2300} {"train_loss": -11.792692184448242, "global_step": 386561, "epoch": 2300} {"train_loss": -11.808018684387207, "global_step": 386562, "epoch": 2300} {"train_loss": -12.323724746704102, "global_step": 386563, "epoch": 2300} {"train_loss": -12.011275291442871, "global_step": 386564, "epoch": 2300} {"train_loss": -12.049671173095703, "global_step": 386565, "epoch": 2300} {"train_loss": -11.78293514251709, "global_step": 386566, "epoch": 2300} {"train_loss": -12.015919129053751, "global_step": 386567, "epoch": 2300, "train/sim_max_reward_0": 0.683677704004205, "train/sim_max_reward_1": 0.8959805632768335, "train/sim_max_reward_2": 5.303654020526609e-05, "train/sim_max_reward_3": 0.6655686718193841, "train/sim_max_reward_4": 0.45229488000164697, "train/sim_max_reward_5": 0.5499730424968906, "test/sim_max_reward_4400000": 0.9468209078506928, "test/sim_max_reward_4400001": 0.3638475643798245, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.9487067595650626, "test/sim_max_reward_4400004": 0.4069682016378368, "test/sim_max_reward_4400005": 0.9270606996113476, "test/sim_max_reward_4400006": 0.3756535110670371, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 0.6444208367034167, "test/sim_max_reward_4400009": 0.0333636889040716, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 0.4750234729989518, "test/sim_max_reward_4400012": 0.14110722128947978, "test/sim_max_reward_4400013": 0.7937637061321189, "test/sim_max_reward_4400014": 0.986484379615761, "test/sim_max_reward_4400015": 0.5447137904625938, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.1074825047126136, "test/sim_max_reward_4400018": 0.8939665149820997, "test/sim_max_reward_4400019": 0.2148067508137076, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.5641322648306876, "test/sim_max_reward_4400022": 0.9440506566331061, "test/sim_max_reward_4400023": 0.13915375615497833, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.5827151234965887, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.6110996371944036, "test/sim_max_reward_4400028": 0.6941769219756768, "test/sim_max_reward_4400029": 0.9299885800059209, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.5441387956356492, "test/sim_max_reward_4400032": 0.3711108672348018, "test/sim_max_reward_4400033": 0.6322382404916689, "test/sim_max_reward_4400034": 0.9765365859420722, "test/sim_max_reward_4400035": 0.9512654244096939, "test/sim_max_reward_4400036": 0.9733109019926889, "test/sim_max_reward_4400037": 0.9777717955645067, "test/sim_max_reward_4400038": 0.3242372328862331, "test/sim_max_reward_4400039": 0.41280283836350484, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.25319885860027985, "test/sim_max_reward_4400042": 0.1348852069507808, "test/sim_max_reward_4400043": 0.031910024575954904, "test/sim_max_reward_4400044": 0.7853795216103272, "test/sim_max_reward_4400045": 0.08270613487675807, "test/sim_max_reward_4400046": 0.9501636491308668, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.5412579830231942, "test/mean_score": 0.5353894035221082, "val_loss": 295148.5, "train_action_mse_error": 2.371251344680786} {"train_loss": -10.982059478759766, "global_step": 386568, "epoch": 2301} {"train_loss": -11.325811386108398, "global_step": 386569, "epoch": 2301} {"train_loss": -11.566875457763672, "global_step": 386570, "epoch": 2301} {"train_loss": -11.8329439163208, "global_step": 386571, "epoch": 2301} {"train_loss": -11.157907485961914, "global_step": 386572, "epoch": 2301} {"train_loss": -11.036062240600586, "global_step": 386573, "epoch": 2301} {"train_loss": -11.870787620544434, "global_step": 386574, "epoch": 2301} {"train_loss": -11.431251525878906, "global_step": 386575, "epoch": 2301} {"train_loss": -11.702808380126953, "global_step": 386576, "epoch": 2301} {"train_loss": -11.083122253417969, "global_step": 386577, "epoch": 2301} {"train_loss": -11.89124584197998, "global_step": 386578, "epoch": 2301} {"train_loss": -11.43769645690918, "global_step": 386579, "epoch": 2301} {"train_loss": -11.90875244140625, "global_step": 386580, "epoch": 2301} {"train_loss": -11.128891944885254, "global_step": 386581, "epoch": 2301} {"train_loss": -11.753567695617676, "global_step": 386582, "epoch": 2301} {"train_loss": -11.699867248535156, "global_step": 386583, "epoch": 2301} {"train_loss": -11.966026306152344, "global_step": 386584, "epoch": 2301} {"train_loss": -12.327919006347656, "global_step": 386585, "epoch": 2301} {"train_loss": -11.763178825378418, "global_step": 386586, "epoch": 2301} {"train_loss": -12.214798927307129, "global_step": 386587, "epoch": 2301} {"train_loss": -11.81389045715332, "global_step": 386588, "epoch": 2301} {"train_loss": -12.245940208435059, "global_step": 386589, "epoch": 2301} {"train_loss": -11.380826950073242, "global_step": 386590, "epoch": 2301} {"train_loss": -12.142284393310547, "global_step": 386591, "epoch": 2301} {"train_loss": -11.848280906677246, "global_step": 386592, "epoch": 2301} {"train_loss": -12.104211807250977, "global_step": 386593, "epoch": 2301} {"train_loss": -12.23942756652832, "global_step": 386594, "epoch": 2301} {"train_loss": -12.111577987670898, "global_step": 386595, "epoch": 2301} {"train_loss": -12.10642147064209, "global_step": 386596, "epoch": 2301} {"train_loss": -11.889119148254395, "global_step": 386597, "epoch": 2301} {"train_loss": -12.285980224609375, "global_step": 386598, "epoch": 2301} {"train_loss": -11.953649520874023, "global_step": 386599, "epoch": 2301} {"train_loss": -11.842442512512207, "global_step": 386600, "epoch": 2301} {"train_loss": -11.946250915527344, "global_step": 386601, "epoch": 2301} {"train_loss": -11.458951950073242, "global_step": 386602, "epoch": 2301} {"train_loss": -11.562154769897461, "global_step": 386603, "epoch": 2301} {"train_loss": -11.431506156921387, "global_step": 386604, "epoch": 2301} {"train_loss": -11.020950317382812, "global_step": 386605, "epoch": 2301} {"train_loss": -11.850707054138184, "global_step": 386606, "epoch": 2301} {"train_loss": -10.81673812866211, "global_step": 386607, "epoch": 2301} {"train_loss": -11.995755195617676, "global_step": 386608, "epoch": 2301} {"train_loss": -11.752923965454102, "global_step": 386609, "epoch": 2301} {"train_loss": -11.478961944580078, "global_step": 386610, "epoch": 2301} {"train_loss": -11.573495864868164, "global_step": 386611, "epoch": 2301} {"train_loss": -12.030200958251953, "global_step": 386612, "epoch": 2301} {"train_loss": -11.114309310913086, "global_step": 386613, "epoch": 2301} {"train_loss": -12.05555534362793, "global_step": 386614, "epoch": 2301} {"train_loss": -11.526866912841797, "global_step": 386615, "epoch": 2301} {"train_loss": -12.129300117492676, "global_step": 386616, "epoch": 2301} {"train_loss": -11.912208557128906, "global_step": 386617, "epoch": 2301} {"train_loss": -12.159875869750977, "global_step": 386618, "epoch": 2301} {"train_loss": -11.750680923461914, "global_step": 386619, "epoch": 2301} {"train_loss": -12.139606475830078, "global_step": 386620, "epoch": 2301} {"train_loss": -12.192081451416016, "global_step": 386621, "epoch": 2301} {"train_loss": -12.236710548400879, "global_step": 386622, "epoch": 2301} {"train_loss": -12.149508476257324, "global_step": 386623, "epoch": 2301} {"train_loss": -12.080282211303711, "global_step": 386624, "epoch": 2301} {"train_loss": -12.225271224975586, "global_step": 386625, "epoch": 2301} {"train_loss": -12.507125854492188, "global_step": 386626, "epoch": 2301} {"train_loss": -12.227813720703125, "global_step": 386627, "epoch": 2301} {"train_loss": -12.51456069946289, "global_step": 386628, "epoch": 2301} {"train_loss": -12.418712615966797, "global_step": 386629, "epoch": 2301} {"train_loss": -12.27847671508789, "global_step": 386630, "epoch": 2301} {"train_loss": -12.39126205444336, "global_step": 386631, "epoch": 2301} {"train_loss": -12.374552726745605, "global_step": 386632, "epoch": 2301} {"train_loss": -12.4884672164917, "global_step": 386633, "epoch": 2301} {"train_loss": -12.445528984069824, "global_step": 386634, "epoch": 2301} {"train_loss": -12.270462989807129, "global_step": 386635, "epoch": 2301} {"train_loss": -12.416685104370117, "global_step": 386636, "epoch": 2301} {"train_loss": -12.35750961303711, "global_step": 386637, "epoch": 2301} {"train_loss": -12.292856216430664, "global_step": 386638, "epoch": 2301} {"train_loss": -12.395992279052734, "global_step": 386639, "epoch": 2301} {"train_loss": -12.234291076660156, "global_step": 386640, "epoch": 2301} {"train_loss": -12.265890121459961, "global_step": 386641, "epoch": 2301} {"train_loss": -12.42296028137207, "global_step": 386642, "epoch": 2301} {"train_loss": -12.257837295532227, "global_step": 386643, "epoch": 2301} {"train_loss": -12.412906646728516, "global_step": 386644, "epoch": 2301} {"train_loss": -12.297691345214844, "global_step": 386645, "epoch": 2301} {"train_loss": -11.987669944763184, "global_step": 386646, "epoch": 2301} {"train_loss": -12.364095687866211, "global_step": 386647, "epoch": 2301} {"train_loss": -12.179276466369629, "global_step": 386648, "epoch": 2301} {"train_loss": -11.944085121154785, "global_step": 386649, "epoch": 2301} {"train_loss": -12.083391189575195, "global_step": 386650, "epoch": 2301} {"train_loss": -11.865201950073242, "global_step": 386651, "epoch": 2301} {"train_loss": -12.127521514892578, "global_step": 386652, "epoch": 2301} {"train_loss": -11.838434219360352, "global_step": 386653, "epoch": 2301} {"train_loss": -12.297256469726562, "global_step": 386654, "epoch": 2301} {"train_loss": -11.976094245910645, "global_step": 386655, "epoch": 2301} {"train_loss": -12.135168075561523, "global_step": 386656, "epoch": 2301} {"train_loss": -12.409879684448242, "global_step": 386657, "epoch": 2301} {"train_loss": -12.17715072631836, "global_step": 386658, "epoch": 2301} {"train_loss": -12.485481262207031, "global_step": 386659, "epoch": 2301} {"train_loss": -12.169266700744629, "global_step": 386660, "epoch": 2301} {"train_loss": -12.361227989196777, "global_step": 386661, "epoch": 2301} {"train_loss": -12.289237976074219, "global_step": 386662, "epoch": 2301} {"train_loss": -12.406410217285156, "global_step": 386663, "epoch": 2301} {"train_loss": -12.325065612792969, "global_step": 386664, "epoch": 2301} {"train_loss": -11.94167423248291, "global_step": 386665, "epoch": 2301} {"train_loss": -12.415576934814453, "global_step": 386666, "epoch": 2301} {"train_loss": -11.978708267211914, "global_step": 386667, "epoch": 2301} {"train_loss": -12.089179039001465, "global_step": 386668, "epoch": 2301} {"train_loss": -11.698580741882324, "global_step": 386669, "epoch": 2301} {"train_loss": -11.94092082977295, "global_step": 386670, "epoch": 2301} {"train_loss": -12.54825496673584, "global_step": 386671, "epoch": 2301} {"train_loss": -11.907256126403809, "global_step": 386672, "epoch": 2301} {"train_loss": -12.349825859069824, "global_step": 386673, "epoch": 2301} {"train_loss": -11.50997543334961, "global_step": 386674, "epoch": 2301} {"train_loss": -12.476613998413086, "global_step": 386675, "epoch": 2301} {"train_loss": -11.33094596862793, "global_step": 386676, "epoch": 2301} {"train_loss": -12.27865982055664, "global_step": 386677, "epoch": 2301} {"train_loss": -11.00027084350586, "global_step": 386678, "epoch": 2301} {"train_loss": -12.460733413696289, "global_step": 386679, "epoch": 2301} {"train_loss": -10.875578880310059, "global_step": 386680, "epoch": 2301} {"train_loss": -11.491216659545898, "global_step": 386681, "epoch": 2301} {"train_loss": -11.26333999633789, "global_step": 386682, "epoch": 2301} {"train_loss": -11.673998832702637, "global_step": 386683, "epoch": 2301} {"train_loss": -11.293233871459961, "global_step": 386684, "epoch": 2301} {"train_loss": -11.80691909790039, "global_step": 386685, "epoch": 2301} {"train_loss": -11.182988166809082, "global_step": 386686, "epoch": 2301} {"train_loss": -11.98336124420166, "global_step": 386687, "epoch": 2301} {"train_loss": -11.99638557434082, "global_step": 386688, "epoch": 2301} {"train_loss": -11.658709526062012, "global_step": 386689, "epoch": 2301} {"train_loss": -11.615577697753906, "global_step": 386690, "epoch": 2301} {"train_loss": -12.23457145690918, "global_step": 386691, "epoch": 2301} {"train_loss": -12.057167053222656, "global_step": 386692, "epoch": 2301} {"train_loss": -12.598739624023438, "global_step": 386693, "epoch": 2301} {"train_loss": -12.22293472290039, "global_step": 386694, "epoch": 2301} {"train_loss": -12.337736129760742, "global_step": 386695, "epoch": 2301} {"train_loss": -11.79014778137207, "global_step": 386696, "epoch": 2301} {"train_loss": -11.581855773925781, "global_step": 386697, "epoch": 2301} {"train_loss": -12.361520767211914, "global_step": 386698, "epoch": 2301} {"train_loss": -11.752424240112305, "global_step": 386699, "epoch": 2301} {"train_loss": -12.202738761901855, "global_step": 386700, "epoch": 2301} {"train_loss": -11.904581069946289, "global_step": 386701, "epoch": 2301} {"train_loss": -11.866002082824707, "global_step": 386702, "epoch": 2301} {"train_loss": -12.232524871826172, "global_step": 386703, "epoch": 2301} {"train_loss": -12.055215835571289, "global_step": 386704, "epoch": 2301} {"train_loss": -12.107343673706055, "global_step": 386705, "epoch": 2301} {"train_loss": -12.211318969726562, "global_step": 386706, "epoch": 2301} {"train_loss": -12.071579933166504, "global_step": 386707, "epoch": 2301} {"train_loss": -11.962655067443848, "global_step": 386708, "epoch": 2301} {"train_loss": -11.713170051574707, "global_step": 386709, "epoch": 2301} {"train_loss": -12.341165542602539, "global_step": 386710, "epoch": 2301} {"train_loss": -11.947790145874023, "global_step": 386711, "epoch": 2301} {"train_loss": -12.32536506652832, "global_step": 386712, "epoch": 2301} {"train_loss": -12.184671401977539, "global_step": 386713, "epoch": 2301} {"train_loss": -12.050203323364258, "global_step": 386714, "epoch": 2301} {"train_loss": -12.370290756225586, "global_step": 386715, "epoch": 2301} {"train_loss": -12.342686653137207, "global_step": 386716, "epoch": 2301} {"train_loss": -12.323408126831055, "global_step": 386717, "epoch": 2301} {"train_loss": -12.585886001586914, "global_step": 386718, "epoch": 2301} {"train_loss": -12.595272064208984, "global_step": 386719, "epoch": 2301} {"train_loss": -12.568334579467773, "global_step": 386720, "epoch": 2301} {"train_loss": -12.58102798461914, "global_step": 386721, "epoch": 2301} {"train_loss": -12.536865234375, "global_step": 386722, "epoch": 2301} {"train_loss": -12.66825008392334, "global_step": 386723, "epoch": 2301} {"train_loss": -12.213141441345215, "global_step": 386724, "epoch": 2301} {"train_loss": -12.573734283447266, "global_step": 386725, "epoch": 2301} {"train_loss": -12.327320098876953, "global_step": 386726, "epoch": 2301} {"train_loss": -12.326093673706055, "global_step": 386727, "epoch": 2301} {"train_loss": -12.312540054321289, "global_step": 386728, "epoch": 2301} {"train_loss": -12.394611358642578, "global_step": 386729, "epoch": 2301} {"train_loss": -12.348591804504395, "global_step": 386730, "epoch": 2301} {"train_loss": -12.49026870727539, "global_step": 386731, "epoch": 2301} {"train_loss": -12.256762504577637, "global_step": 386732, "epoch": 2301} {"train_loss": -12.18688678741455, "global_step": 386733, "epoch": 2301} {"train_loss": -12.233634948730469, "global_step": 386734, "epoch": 2301} {"train_loss": -12.017995607285272, "global_step": 386735, "epoch": 2301, "val_loss": 295528.59375} {"train_loss": -12.237091064453125, "global_step": 386736, "epoch": 2302} {"train_loss": -12.220908164978027, "global_step": 386737, "epoch": 2302} {"train_loss": -12.560677528381348, "global_step": 386738, "epoch": 2302} {"train_loss": -12.11503791809082, "global_step": 386739, "epoch": 2302} {"train_loss": -12.312240600585938, "global_step": 386740, "epoch": 2302} {"train_loss": -11.893335342407227, "global_step": 386741, "epoch": 2302} {"train_loss": -11.968292236328125, "global_step": 386742, "epoch": 2302} {"train_loss": -12.279427528381348, "global_step": 386743, "epoch": 2302} {"train_loss": -12.471588134765625, "global_step": 386744, "epoch": 2302} {"train_loss": -12.309858322143555, "global_step": 386745, "epoch": 2302} {"train_loss": -12.511343955993652, "global_step": 386746, "epoch": 2302} {"train_loss": -12.496733665466309, "global_step": 386747, "epoch": 2302} {"train_loss": -12.623353004455566, "global_step": 386748, "epoch": 2302} {"train_loss": -12.78073787689209, "global_step": 386749, "epoch": 2302} {"train_loss": -12.338027000427246, "global_step": 386750, "epoch": 2302} {"train_loss": -12.364097595214844, "global_step": 386751, "epoch": 2302} {"train_loss": -12.526519775390625, "global_step": 386752, "epoch": 2302} {"train_loss": -12.628124237060547, "global_step": 386753, "epoch": 2302} {"train_loss": -12.550688743591309, "global_step": 386754, "epoch": 2302} {"train_loss": -12.638320922851562, "global_step": 386755, "epoch": 2302} {"train_loss": -12.503669738769531, "global_step": 386756, "epoch": 2302} {"train_loss": -12.300470352172852, "global_step": 386757, "epoch": 2302} {"train_loss": -12.270512580871582, "global_step": 386758, "epoch": 2302} {"train_loss": -12.607490539550781, "global_step": 386759, "epoch": 2302} {"train_loss": -12.501590728759766, "global_step": 386760, "epoch": 2302} {"train_loss": -12.194860458374023, "global_step": 386761, "epoch": 2302} {"train_loss": -12.14192008972168, "global_step": 386762, "epoch": 2302} {"train_loss": -12.341601371765137, "global_step": 386763, "epoch": 2302} {"train_loss": -12.05184268951416, "global_step": 386764, "epoch": 2302} {"train_loss": -12.433884620666504, "global_step": 386765, "epoch": 2302} {"train_loss": -12.509044647216797, "global_step": 386766, "epoch": 2302} {"train_loss": -12.504313468933105, "global_step": 386767, "epoch": 2302} {"train_loss": -11.694190979003906, "global_step": 386768, "epoch": 2302} {"train_loss": -11.710868835449219, "global_step": 386769, "epoch": 2302} {"train_loss": -11.98006820678711, "global_step": 386770, "epoch": 2302} {"train_loss": -12.44345474243164, "global_step": 386771, "epoch": 2302} {"train_loss": -11.71761703491211, "global_step": 386772, "epoch": 2302} {"train_loss": -11.772090911865234, "global_step": 386773, "epoch": 2302} {"train_loss": -11.861148834228516, "global_step": 386774, "epoch": 2302} {"train_loss": -12.220365524291992, "global_step": 386775, "epoch": 2302} {"train_loss": -11.543582916259766, "global_step": 386776, "epoch": 2302} {"train_loss": -12.381887435913086, "global_step": 386777, "epoch": 2302} {"train_loss": -11.764577865600586, "global_step": 386778, "epoch": 2302} {"train_loss": -11.73733901977539, "global_step": 386779, "epoch": 2302} {"train_loss": -12.246179580688477, "global_step": 386780, "epoch": 2302} {"train_loss": -12.288078308105469, "global_step": 386781, "epoch": 2302} {"train_loss": -12.023012161254883, "global_step": 386782, "epoch": 2302} {"train_loss": -11.666610717773438, "global_step": 386783, "epoch": 2302} {"train_loss": -11.898181915283203, "global_step": 386784, "epoch": 2302} {"train_loss": -11.919965744018555, "global_step": 386785, "epoch": 2302} {"train_loss": -11.235404968261719, "global_step": 386786, "epoch": 2302} {"train_loss": -12.389951705932617, "global_step": 386787, "epoch": 2302} {"train_loss": -12.051331520080566, "global_step": 386788, "epoch": 2302} {"train_loss": -12.237436294555664, "global_step": 386789, "epoch": 2302} {"train_loss": -12.37462043762207, "global_step": 386790, "epoch": 2302} {"train_loss": -12.44349479675293, "global_step": 386791, "epoch": 2302} {"train_loss": -11.976263046264648, "global_step": 386792, "epoch": 2302} {"train_loss": -12.224727630615234, "global_step": 386793, "epoch": 2302} {"train_loss": -12.205402374267578, "global_step": 386794, "epoch": 2302} {"train_loss": -12.167832374572754, "global_step": 386795, "epoch": 2302} {"train_loss": -12.33822250366211, "global_step": 386796, "epoch": 2302} {"train_loss": -12.216419219970703, "global_step": 386797, "epoch": 2302} {"train_loss": -12.32120418548584, "global_step": 386798, "epoch": 2302} {"train_loss": -12.362918853759766, "global_step": 386799, "epoch": 2302} {"train_loss": -11.934377670288086, "global_step": 386800, "epoch": 2302} {"train_loss": -12.225027084350586, "global_step": 386801, "epoch": 2302} {"train_loss": -11.122696876525879, "global_step": 386802, "epoch": 2302} {"train_loss": -10.989862442016602, "global_step": 386803, "epoch": 2302} {"train_loss": -11.342207908630371, "global_step": 386804, "epoch": 2302} {"train_loss": -11.944096565246582, "global_step": 386805, "epoch": 2302} {"train_loss": -11.45075511932373, "global_step": 386806, "epoch": 2302} {"train_loss": -10.58299732208252, "global_step": 386807, "epoch": 2302} {"train_loss": -12.191781997680664, "global_step": 386808, "epoch": 2302} {"train_loss": -9.716780662536621, "global_step": 386809, "epoch": 2302} {"train_loss": -11.8254976272583, "global_step": 386810, "epoch": 2302} {"train_loss": -10.36648941040039, "global_step": 386811, "epoch": 2302} {"train_loss": -11.239455223083496, "global_step": 386812, "epoch": 2302} {"train_loss": -11.965536117553711, "global_step": 386813, "epoch": 2302} {"train_loss": -9.788180351257324, "global_step": 386814, "epoch": 2302} {"train_loss": -12.12535285949707, "global_step": 386815, "epoch": 2302} {"train_loss": -10.488264083862305, "global_step": 386816, "epoch": 2302} {"train_loss": -12.00454330444336, "global_step": 386817, "epoch": 2302} {"train_loss": -11.43882942199707, "global_step": 386818, "epoch": 2302} {"train_loss": -10.746366500854492, "global_step": 386819, "epoch": 2302} {"train_loss": -11.993812561035156, "global_step": 386820, "epoch": 2302} {"train_loss": -11.120881080627441, "global_step": 386821, "epoch": 2302} {"train_loss": -11.276535034179688, "global_step": 386822, "epoch": 2302} {"train_loss": -12.214728355407715, "global_step": 386823, "epoch": 2302} {"train_loss": -11.740678787231445, "global_step": 386824, "epoch": 2302} {"train_loss": -11.830717086791992, "global_step": 386825, "epoch": 2302} {"train_loss": -12.098557472229004, "global_step": 386826, "epoch": 2302} {"train_loss": -11.800508499145508, "global_step": 386827, "epoch": 2302} {"train_loss": -11.95811653137207, "global_step": 386828, "epoch": 2302} {"train_loss": -11.813347816467285, "global_step": 386829, "epoch": 2302} {"train_loss": -11.842050552368164, "global_step": 386830, "epoch": 2302} {"train_loss": -11.946319580078125, "global_step": 386831, "epoch": 2302} {"train_loss": -12.110532760620117, "global_step": 386832, "epoch": 2302} {"train_loss": -12.118806838989258, "global_step": 386833, "epoch": 2302} {"train_loss": -12.280872344970703, "global_step": 386834, "epoch": 2302} {"train_loss": -11.998641967773438, "global_step": 386835, "epoch": 2302} {"train_loss": -12.296754837036133, "global_step": 386836, "epoch": 2302} {"train_loss": -11.914114952087402, "global_step": 386837, "epoch": 2302} {"train_loss": -11.711041450500488, "global_step": 386838, "epoch": 2302} {"train_loss": -12.011192321777344, "global_step": 386839, "epoch": 2302} {"train_loss": -11.936397552490234, "global_step": 386840, "epoch": 2302} {"train_loss": -11.718982696533203, "global_step": 386841, "epoch": 2302} {"train_loss": -12.075892448425293, "global_step": 386842, "epoch": 2302} {"train_loss": -11.543047904968262, "global_step": 386843, "epoch": 2302} {"train_loss": -12.031420707702637, "global_step": 386844, "epoch": 2302} {"train_loss": -12.277948379516602, "global_step": 386845, "epoch": 2302} {"train_loss": -12.196252822875977, "global_step": 386846, "epoch": 2302} {"train_loss": -11.958678245544434, "global_step": 386847, "epoch": 2302} {"train_loss": -11.85359001159668, "global_step": 386848, "epoch": 2302} {"train_loss": -12.230780601501465, "global_step": 386849, "epoch": 2302} {"train_loss": -12.299196243286133, "global_step": 386850, "epoch": 2302} {"train_loss": -12.24557113647461, "global_step": 386851, "epoch": 2302} {"train_loss": -12.124135971069336, "global_step": 386852, "epoch": 2302} {"train_loss": -12.200029373168945, "global_step": 386853, "epoch": 2302} {"train_loss": -12.084716796875, "global_step": 386854, "epoch": 2302} {"train_loss": -12.155096054077148, "global_step": 386855, "epoch": 2302} {"train_loss": -11.60562801361084, "global_step": 386856, "epoch": 2302} {"train_loss": -12.365253448486328, "global_step": 386857, "epoch": 2302} {"train_loss": -11.815744400024414, "global_step": 386858, "epoch": 2302} {"train_loss": -12.26560115814209, "global_step": 386859, "epoch": 2302} {"train_loss": -12.186834335327148, "global_step": 386860, "epoch": 2302} {"train_loss": -11.936262130737305, "global_step": 386861, "epoch": 2302} {"train_loss": -11.854391098022461, "global_step": 386862, "epoch": 2302} {"train_loss": -11.40119743347168, "global_step": 386863, "epoch": 2302} {"train_loss": -12.339522361755371, "global_step": 386864, "epoch": 2302} {"train_loss": -12.20032024383545, "global_step": 386865, "epoch": 2302} {"train_loss": -11.869575500488281, "global_step": 386866, "epoch": 2302} {"train_loss": -12.365073204040527, "global_step": 386867, "epoch": 2302} {"train_loss": -11.635059356689453, "global_step": 386868, "epoch": 2302} {"train_loss": -12.209516525268555, "global_step": 386869, "epoch": 2302} {"train_loss": -11.994941711425781, "global_step": 386870, "epoch": 2302} {"train_loss": -12.496072769165039, "global_step": 386871, "epoch": 2302} {"train_loss": -12.086736679077148, "global_step": 386872, "epoch": 2302} {"train_loss": -12.596901893615723, "global_step": 386873, "epoch": 2302} {"train_loss": -12.355104446411133, "global_step": 386874, "epoch": 2302} {"train_loss": -12.407352447509766, "global_step": 386875, "epoch": 2302} {"train_loss": -12.515668869018555, "global_step": 386876, "epoch": 2302} {"train_loss": -12.299994468688965, "global_step": 386877, "epoch": 2302} {"train_loss": -12.51167106628418, "global_step": 386878, "epoch": 2302} {"train_loss": -12.393125534057617, "global_step": 386879, "epoch": 2302} {"train_loss": -12.691110610961914, "global_step": 386880, "epoch": 2302} {"train_loss": -12.518549919128418, "global_step": 386881, "epoch": 2302} {"train_loss": -12.275566101074219, "global_step": 386882, "epoch": 2302} {"train_loss": -12.335492134094238, "global_step": 386883, "epoch": 2302} {"train_loss": -12.351846694946289, "global_step": 386884, "epoch": 2302} {"train_loss": -11.359084129333496, "global_step": 386885, "epoch": 2302} {"train_loss": -12.247715950012207, "global_step": 386886, "epoch": 2302} {"train_loss": -12.41719913482666, "global_step": 386887, "epoch": 2302} {"train_loss": -12.462486267089844, "global_step": 386888, "epoch": 2302} {"train_loss": -12.447108268737793, "global_step": 386889, "epoch": 2302} {"train_loss": -12.114980697631836, "global_step": 386890, "epoch": 2302} {"train_loss": -12.52684211730957, "global_step": 386891, "epoch": 2302} {"train_loss": -12.207215309143066, "global_step": 386892, "epoch": 2302} {"train_loss": -12.10122013092041, "global_step": 386893, "epoch": 2302} {"train_loss": -12.529598236083984, "global_step": 386894, "epoch": 2302} {"train_loss": -12.538190841674805, "global_step": 386895, "epoch": 2302} {"train_loss": -12.419645309448242, "global_step": 386896, "epoch": 2302} {"train_loss": -12.39474105834961, "global_step": 386897, "epoch": 2302} {"train_loss": -12.575057983398438, "global_step": 386898, "epoch": 2302} {"train_loss": -12.901693344116211, "global_step": 386899, "epoch": 2302} {"train_loss": -12.298622131347656, "global_step": 386900, "epoch": 2302} {"train_loss": -12.735746383666992, "global_step": 386901, "epoch": 2302} {"train_loss": -12.453512191772461, "global_step": 386902, "epoch": 2302} {"train_loss": -12.068494649160476, "global_step": 386903, "epoch": 2302, "val_loss": 296401.9375} {"train_loss": -12.658414840698242, "global_step": 386904, "epoch": 2303} {"train_loss": -12.573310852050781, "global_step": 386905, "epoch": 2303} {"train_loss": -12.495384216308594, "global_step": 386906, "epoch": 2303} {"train_loss": -12.617116928100586, "global_step": 386907, "epoch": 2303} {"train_loss": -12.39193058013916, "global_step": 386908, "epoch": 2303} {"train_loss": -12.038406372070312, "global_step": 386909, "epoch": 2303} {"train_loss": -12.526235580444336, "global_step": 386910, "epoch": 2303} {"train_loss": -12.382394790649414, "global_step": 386911, "epoch": 2303} {"train_loss": -12.136346817016602, "global_step": 386912, "epoch": 2303} {"train_loss": -11.926143646240234, "global_step": 386913, "epoch": 2303} {"train_loss": -12.667821884155273, "global_step": 386914, "epoch": 2303} {"train_loss": -11.402926445007324, "global_step": 386915, "epoch": 2303} {"train_loss": -11.236162185668945, "global_step": 386916, "epoch": 2303} {"train_loss": -12.007498741149902, "global_step": 386917, "epoch": 2303} {"train_loss": -12.196943283081055, "global_step": 386918, "epoch": 2303} {"train_loss": -10.743764877319336, "global_step": 386919, "epoch": 2303} {"train_loss": -11.318390846252441, "global_step": 386920, "epoch": 2303} {"train_loss": -11.79967212677002, "global_step": 386921, "epoch": 2303} {"train_loss": -11.643661499023438, "global_step": 386922, "epoch": 2303} {"train_loss": -12.013452529907227, "global_step": 386923, "epoch": 2303} {"train_loss": -12.185417175292969, "global_step": 386924, "epoch": 2303} {"train_loss": -12.031187057495117, "global_step": 386925, "epoch": 2303} {"train_loss": -12.227837562561035, "global_step": 386926, "epoch": 2303} {"train_loss": -12.014479637145996, "global_step": 386927, "epoch": 2303} {"train_loss": -12.150136947631836, "global_step": 386928, "epoch": 2303} {"train_loss": -12.110152244567871, "global_step": 386929, "epoch": 2303} {"train_loss": -12.467910766601562, "global_step": 386930, "epoch": 2303} {"train_loss": -12.03449535369873, "global_step": 386931, "epoch": 2303} {"train_loss": -11.645689964294434, "global_step": 386932, "epoch": 2303} {"train_loss": -12.279918670654297, "global_step": 386933, "epoch": 2303} {"train_loss": -10.997359275817871, "global_step": 386934, "epoch": 2303} {"train_loss": -11.785985946655273, "global_step": 386935, "epoch": 2303} {"train_loss": -12.259204864501953, "global_step": 386936, "epoch": 2303} {"train_loss": -10.897579193115234, "global_step": 386937, "epoch": 2303} {"train_loss": -11.662386894226074, "global_step": 386938, "epoch": 2303} {"train_loss": -9.504929542541504, "global_step": 386939, "epoch": 2303} {"train_loss": -10.540207862854004, "global_step": 386940, "epoch": 2303} {"train_loss": -11.048765182495117, "global_step": 386941, "epoch": 2303} {"train_loss": -11.351755142211914, "global_step": 386942, "epoch": 2303} {"train_loss": -11.115297317504883, "global_step": 386943, "epoch": 2303} {"train_loss": -11.474565505981445, "global_step": 386944, "epoch": 2303} {"train_loss": -11.468536376953125, "global_step": 386945, "epoch": 2303} {"train_loss": -11.814847946166992, "global_step": 386946, "epoch": 2303} {"train_loss": -11.706319808959961, "global_step": 386947, "epoch": 2303} {"train_loss": -12.358686447143555, "global_step": 386948, "epoch": 2303} {"train_loss": -11.63723373413086, "global_step": 386949, "epoch": 2303} {"train_loss": -12.442493438720703, "global_step": 386950, "epoch": 2303} {"train_loss": -11.757148742675781, "global_step": 386951, "epoch": 2303} {"train_loss": -12.05866813659668, "global_step": 386952, "epoch": 2303} {"train_loss": -12.30615234375, "global_step": 386953, "epoch": 2303} {"train_loss": -11.435559272766113, "global_step": 386954, "epoch": 2303} {"train_loss": -12.326690673828125, "global_step": 386955, "epoch": 2303} {"train_loss": -12.075480461120605, "global_step": 386956, "epoch": 2303} {"train_loss": -12.141709327697754, "global_step": 386957, "epoch": 2303} {"train_loss": -12.288227081298828, "global_step": 386958, "epoch": 2303} {"train_loss": -12.121236801147461, "global_step": 386959, "epoch": 2303} {"train_loss": -12.094436645507812, "global_step": 386960, "epoch": 2303} {"train_loss": -12.3775634765625, "global_step": 386961, "epoch": 2303} {"train_loss": -11.976253509521484, "global_step": 386962, "epoch": 2303} {"train_loss": -12.152091026306152, "global_step": 386963, "epoch": 2303} {"train_loss": -12.194026947021484, "global_step": 386964, "epoch": 2303} {"train_loss": -12.169448852539062, "global_step": 386965, "epoch": 2303} {"train_loss": -12.153338432312012, "global_step": 386966, "epoch": 2303} {"train_loss": -12.29833984375, "global_step": 386967, "epoch": 2303} {"train_loss": -11.64301872253418, "global_step": 386968, "epoch": 2303} {"train_loss": -12.428909301757812, "global_step": 386969, "epoch": 2303} {"train_loss": -12.019312858581543, "global_step": 386970, "epoch": 2303} {"train_loss": -12.387351989746094, "global_step": 386971, "epoch": 2303} {"train_loss": -12.184287071228027, "global_step": 386972, "epoch": 2303} {"train_loss": -12.403238296508789, "global_step": 386973, "epoch": 2303} {"train_loss": -12.351095199584961, "global_step": 386974, "epoch": 2303} {"train_loss": -12.35875129699707, "global_step": 386975, "epoch": 2303} {"train_loss": -12.11338996887207, "global_step": 386976, "epoch": 2303} {"train_loss": -11.806279182434082, "global_step": 386977, "epoch": 2303} {"train_loss": -12.316816329956055, "global_step": 386978, "epoch": 2303} {"train_loss": -11.667844772338867, "global_step": 386979, "epoch": 2303} {"train_loss": -12.178641319274902, "global_step": 386980, "epoch": 2303} {"train_loss": -12.140020370483398, "global_step": 386981, "epoch": 2303} {"train_loss": -12.105766296386719, "global_step": 386982, "epoch": 2303} {"train_loss": -12.312243461608887, "global_step": 386983, "epoch": 2303} {"train_loss": -11.804443359375, "global_step": 386984, "epoch": 2303} {"train_loss": -12.55258846282959, "global_step": 386985, "epoch": 2303} {"train_loss": -11.872940063476562, "global_step": 386986, "epoch": 2303} {"train_loss": -12.499591827392578, "global_step": 386987, "epoch": 2303} {"train_loss": -12.417715072631836, "global_step": 386988, "epoch": 2303} {"train_loss": -12.45510482788086, "global_step": 386989, "epoch": 2303} {"train_loss": -12.346904754638672, "global_step": 386990, "epoch": 2303} {"train_loss": -12.041236877441406, "global_step": 386991, "epoch": 2303} {"train_loss": -12.43529987335205, "global_step": 386992, "epoch": 2303} {"train_loss": -12.057071685791016, "global_step": 386993, "epoch": 2303} {"train_loss": -12.467244148254395, "global_step": 386994, "epoch": 2303} {"train_loss": -12.280345916748047, "global_step": 386995, "epoch": 2303} {"train_loss": -12.510540008544922, "global_step": 386996, "epoch": 2303} {"train_loss": -12.437871932983398, "global_step": 386997, "epoch": 2303} {"train_loss": -11.978998184204102, "global_step": 386998, "epoch": 2303} {"train_loss": -12.13194751739502, "global_step": 386999, "epoch": 2303} {"train_loss": -11.497385025024414, "global_step": 387000, "epoch": 2303} {"train_loss": -12.498635292053223, "global_step": 387001, "epoch": 2303} {"train_loss": -10.948866844177246, "global_step": 387002, "epoch": 2303} {"train_loss": -12.110357284545898, "global_step": 387003, "epoch": 2303} {"train_loss": -11.245857238769531, "global_step": 387004, "epoch": 2303} {"train_loss": -12.293268203735352, "global_step": 387005, "epoch": 2303} {"train_loss": -11.74567985534668, "global_step": 387006, "epoch": 2303} {"train_loss": -11.232748031616211, "global_step": 387007, "epoch": 2303} {"train_loss": -11.464179992675781, "global_step": 387008, "epoch": 2303} {"train_loss": -11.629161834716797, "global_step": 387009, "epoch": 2303} {"train_loss": -11.478494644165039, "global_step": 387010, "epoch": 2303} {"train_loss": -11.29624080657959, "global_step": 387011, "epoch": 2303} {"train_loss": -12.116680145263672, "global_step": 387012, "epoch": 2303} {"train_loss": -11.067763328552246, "global_step": 387013, "epoch": 2303} {"train_loss": -11.368183135986328, "global_step": 387014, "epoch": 2303} {"train_loss": -12.259807586669922, "global_step": 387015, "epoch": 2303} {"train_loss": -10.321367263793945, "global_step": 387016, "epoch": 2303} {"train_loss": -11.046083450317383, "global_step": 387017, "epoch": 2303} {"train_loss": -9.43795108795166, "global_step": 387018, "epoch": 2303} {"train_loss": -8.438474655151367, "global_step": 387019, "epoch": 2303} {"train_loss": -9.298068046569824, "global_step": 387020, "epoch": 2303} {"train_loss": -8.873607635498047, "global_step": 387021, "epoch": 2303} {"train_loss": -9.36030387878418, "global_step": 387022, "epoch": 2303} {"train_loss": -9.208744049072266, "global_step": 387023, "epoch": 2303} {"train_loss": -9.093135833740234, "global_step": 387024, "epoch": 2303} {"train_loss": -10.236822128295898, "global_step": 387025, "epoch": 2303} {"train_loss": -8.31673812866211, "global_step": 387026, "epoch": 2303} {"train_loss": -9.32470703125, "global_step": 387027, "epoch": 2303} {"train_loss": -10.111466407775879, "global_step": 387028, "epoch": 2303} {"train_loss": -8.564542770385742, "global_step": 387029, "epoch": 2303} {"train_loss": -11.339942932128906, "global_step": 387030, "epoch": 2303} {"train_loss": -8.685773849487305, "global_step": 387031, "epoch": 2303} {"train_loss": -9.0362548828125, "global_step": 387032, "epoch": 2303} {"train_loss": -10.245744705200195, "global_step": 387033, "epoch": 2303} {"train_loss": -10.695856094360352, "global_step": 387034, "epoch": 2303} {"train_loss": -10.484807968139648, "global_step": 387035, "epoch": 2303} {"train_loss": -9.27845573425293, "global_step": 387036, "epoch": 2303} {"train_loss": -9.601950645446777, "global_step": 387037, "epoch": 2303} {"train_loss": -11.294198989868164, "global_step": 387038, "epoch": 2303} {"train_loss": -11.120710372924805, "global_step": 387039, "epoch": 2303} {"train_loss": -11.193833351135254, "global_step": 387040, "epoch": 2303} {"train_loss": -11.614740371704102, "global_step": 387041, "epoch": 2303} {"train_loss": -11.56424331665039, "global_step": 387042, "epoch": 2303} {"train_loss": -11.936607360839844, "global_step": 387043, "epoch": 2303} {"train_loss": -11.674280166625977, "global_step": 387044, "epoch": 2303} {"train_loss": -11.629751205444336, "global_step": 387045, "epoch": 2303} {"train_loss": -11.675399780273438, "global_step": 387046, "epoch": 2303} {"train_loss": -11.611310958862305, "global_step": 387047, "epoch": 2303} {"train_loss": -11.699934005737305, "global_step": 387048, "epoch": 2303} {"train_loss": -11.872142791748047, "global_step": 387049, "epoch": 2303} {"train_loss": -11.465121269226074, "global_step": 387050, "epoch": 2303} {"train_loss": -12.294071197509766, "global_step": 387051, "epoch": 2303} {"train_loss": -11.78480339050293, "global_step": 387052, "epoch": 2303} {"train_loss": -12.007031440734863, "global_step": 387053, "epoch": 2303} {"train_loss": -12.051416397094727, "global_step": 387054, "epoch": 2303} {"train_loss": -11.67249584197998, "global_step": 387055, "epoch": 2303} {"train_loss": -11.989701271057129, "global_step": 387056, "epoch": 2303} {"train_loss": -12.12086009979248, "global_step": 387057, "epoch": 2303} {"train_loss": -11.64556884765625, "global_step": 387058, "epoch": 2303} {"train_loss": -12.187685012817383, "global_step": 387059, "epoch": 2303} {"train_loss": -11.531479835510254, "global_step": 387060, "epoch": 2303} {"train_loss": -12.255277633666992, "global_step": 387061, "epoch": 2303} {"train_loss": -11.873172760009766, "global_step": 387062, "epoch": 2303} {"train_loss": -11.716564178466797, "global_step": 387063, "epoch": 2303} {"train_loss": -12.054887771606445, "global_step": 387064, "epoch": 2303} {"train_loss": -11.964219093322754, "global_step": 387065, "epoch": 2303} {"train_loss": -11.955761909484863, "global_step": 387066, "epoch": 2303} {"train_loss": -12.070516586303711, "global_step": 387067, "epoch": 2303} {"train_loss": -12.044248580932617, "global_step": 387068, "epoch": 2303} {"train_loss": -12.274784088134766, "global_step": 387069, "epoch": 2303} {"train_loss": -12.08579158782959, "global_step": 387070, "epoch": 2303} {"train_loss": -11.619667263258071, "global_step": 387071, "epoch": 2303, "val_loss": 291040.03125} {"train_loss": -12.292097091674805, "global_step": 387072, "epoch": 2304} {"train_loss": -12.285751342773438, "global_step": 387073, "epoch": 2304} {"train_loss": -12.213587760925293, "global_step": 387074, "epoch": 2304} {"train_loss": -12.164140701293945, "global_step": 387075, "epoch": 2304} {"train_loss": -12.146766662597656, "global_step": 387076, "epoch": 2304} {"train_loss": -12.392232894897461, "global_step": 387077, "epoch": 2304} {"train_loss": -12.315625190734863, "global_step": 387078, "epoch": 2304} {"train_loss": -12.143257141113281, "global_step": 387079, "epoch": 2304} {"train_loss": -12.270910263061523, "global_step": 387080, "epoch": 2304} {"train_loss": -12.303662300109863, "global_step": 387081, "epoch": 2304} {"train_loss": -12.37602424621582, "global_step": 387082, "epoch": 2304} {"train_loss": -12.260833740234375, "global_step": 387083, "epoch": 2304} {"train_loss": -12.366556167602539, "global_step": 387084, "epoch": 2304} {"train_loss": -12.29660415649414, "global_step": 387085, "epoch": 2304} {"train_loss": -12.352170944213867, "global_step": 387086, "epoch": 2304} {"train_loss": -12.37026596069336, "global_step": 387087, "epoch": 2304} {"train_loss": -12.510119438171387, "global_step": 387088, "epoch": 2304} {"train_loss": -12.501972198486328, "global_step": 387089, "epoch": 2304} {"train_loss": -12.610834121704102, "global_step": 387090, "epoch": 2304} {"train_loss": -12.43234634399414, "global_step": 387091, "epoch": 2304} {"train_loss": -12.47636604309082, "global_step": 387092, "epoch": 2304} {"train_loss": -12.502935409545898, "global_step": 387093, "epoch": 2304} {"train_loss": -12.420347213745117, "global_step": 387094, "epoch": 2304} {"train_loss": -12.513633728027344, "global_step": 387095, "epoch": 2304} {"train_loss": -12.412739753723145, "global_step": 387096, "epoch": 2304} {"train_loss": -12.654966354370117, "global_step": 387097, "epoch": 2304} {"train_loss": -12.411563873291016, "global_step": 387098, "epoch": 2304} {"train_loss": -12.436445236206055, "global_step": 387099, "epoch": 2304} {"train_loss": -12.529272079467773, "global_step": 387100, "epoch": 2304} {"train_loss": -12.656455993652344, "global_step": 387101, "epoch": 2304} {"train_loss": -12.474699974060059, "global_step": 387102, "epoch": 2304} {"train_loss": -12.541596412658691, "global_step": 387103, "epoch": 2304} {"train_loss": -12.48751449584961, "global_step": 387104, "epoch": 2304} {"train_loss": -12.24858570098877, "global_step": 387105, "epoch": 2304} {"train_loss": -12.389278411865234, "global_step": 387106, "epoch": 2304} {"train_loss": -12.453178405761719, "global_step": 387107, "epoch": 2304} {"train_loss": -12.652084350585938, "global_step": 387108, "epoch": 2304} {"train_loss": -12.366827964782715, "global_step": 387109, "epoch": 2304} {"train_loss": -12.551021575927734, "global_step": 387110, "epoch": 2304} {"train_loss": -12.77686882019043, "global_step": 387111, "epoch": 2304} {"train_loss": -12.625321388244629, "global_step": 387112, "epoch": 2304} {"train_loss": -12.765703201293945, "global_step": 387113, "epoch": 2304} {"train_loss": -12.50230598449707, "global_step": 387114, "epoch": 2304} {"train_loss": -12.732269287109375, "global_step": 387115, "epoch": 2304} {"train_loss": -12.225061416625977, "global_step": 387116, "epoch": 2304} {"train_loss": -12.736520767211914, "global_step": 387117, "epoch": 2304} {"train_loss": -12.374237060546875, "global_step": 387118, "epoch": 2304} {"train_loss": -12.337173461914062, "global_step": 387119, "epoch": 2304} {"train_loss": -12.557170867919922, "global_step": 387120, "epoch": 2304} {"train_loss": -12.337200164794922, "global_step": 387121, "epoch": 2304} {"train_loss": -12.385478019714355, "global_step": 387122, "epoch": 2304} {"train_loss": -12.750585556030273, "global_step": 387123, "epoch": 2304} {"train_loss": -12.50473403930664, "global_step": 387124, "epoch": 2304} {"train_loss": -12.565799713134766, "global_step": 387125, "epoch": 2304} {"train_loss": -12.518704414367676, "global_step": 387126, "epoch": 2304} {"train_loss": -12.549666404724121, "global_step": 387127, "epoch": 2304} {"train_loss": -12.661460876464844, "global_step": 387128, "epoch": 2304} {"train_loss": -12.447586059570312, "global_step": 387129, "epoch": 2304} {"train_loss": -12.69082260131836, "global_step": 387130, "epoch": 2304} {"train_loss": -12.422826766967773, "global_step": 387131, "epoch": 2304} {"train_loss": -12.36832046508789, "global_step": 387132, "epoch": 2304} {"train_loss": -12.621402740478516, "global_step": 387133, "epoch": 2304} {"train_loss": -12.415714263916016, "global_step": 387134, "epoch": 2304} {"train_loss": -12.161109924316406, "global_step": 387135, "epoch": 2304} {"train_loss": -12.180668830871582, "global_step": 387136, "epoch": 2304} {"train_loss": -11.923028945922852, "global_step": 387137, "epoch": 2304} {"train_loss": -11.863161087036133, "global_step": 387138, "epoch": 2304} {"train_loss": -12.209127426147461, "global_step": 387139, "epoch": 2304} {"train_loss": -11.913707733154297, "global_step": 387140, "epoch": 2304} {"train_loss": -11.887187957763672, "global_step": 387141, "epoch": 2304} {"train_loss": -11.596456527709961, "global_step": 387142, "epoch": 2304} {"train_loss": -11.927986145019531, "global_step": 387143, "epoch": 2304} {"train_loss": -12.240182876586914, "global_step": 387144, "epoch": 2304} {"train_loss": -12.142273902893066, "global_step": 387145, "epoch": 2304} {"train_loss": -12.065567016601562, "global_step": 387146, "epoch": 2304} {"train_loss": -12.155799865722656, "global_step": 387147, "epoch": 2304} {"train_loss": -12.105457305908203, "global_step": 387148, "epoch": 2304} {"train_loss": -11.810760498046875, "global_step": 387149, "epoch": 2304} {"train_loss": -12.260278701782227, "global_step": 387150, "epoch": 2304} {"train_loss": -11.626220703125, "global_step": 387151, "epoch": 2304} {"train_loss": -12.253149032592773, "global_step": 387152, "epoch": 2304} {"train_loss": -11.719135284423828, "global_step": 387153, "epoch": 2304} {"train_loss": -11.528486251831055, "global_step": 387154, "epoch": 2304} {"train_loss": -10.873970031738281, "global_step": 387155, "epoch": 2304} {"train_loss": -11.981074333190918, "global_step": 387156, "epoch": 2304} {"train_loss": -9.333208084106445, "global_step": 387157, "epoch": 2304} {"train_loss": -9.995723724365234, "global_step": 387158, "epoch": 2304} {"train_loss": -11.847810745239258, "global_step": 387159, "epoch": 2304} {"train_loss": -10.101518630981445, "global_step": 387160, "epoch": 2304} {"train_loss": -9.298684120178223, "global_step": 387161, "epoch": 2304} {"train_loss": -10.57120418548584, "global_step": 387162, "epoch": 2304} {"train_loss": -10.661438941955566, "global_step": 387163, "epoch": 2304} {"train_loss": -11.1629056930542, "global_step": 387164, "epoch": 2304} {"train_loss": -10.120490074157715, "global_step": 387165, "epoch": 2304} {"train_loss": -10.369756698608398, "global_step": 387166, "epoch": 2304} {"train_loss": -11.063213348388672, "global_step": 387167, "epoch": 2304} {"train_loss": -10.658945083618164, "global_step": 387168, "epoch": 2304} {"train_loss": -11.450265884399414, "global_step": 387169, "epoch": 2304} {"train_loss": -10.05299186706543, "global_step": 387170, "epoch": 2304} {"train_loss": -10.152388572692871, "global_step": 387171, "epoch": 2304} {"train_loss": -10.897272109985352, "global_step": 387172, "epoch": 2304} {"train_loss": -9.724004745483398, "global_step": 387173, "epoch": 2304} {"train_loss": -11.154769897460938, "global_step": 387174, "epoch": 2304} {"train_loss": -9.724141120910645, "global_step": 387175, "epoch": 2304} {"train_loss": -10.58144760131836, "global_step": 387176, "epoch": 2304} {"train_loss": -10.232135772705078, "global_step": 387177, "epoch": 2304} {"train_loss": -11.146682739257812, "global_step": 387178, "epoch": 2304} {"train_loss": -9.876453399658203, "global_step": 387179, "epoch": 2304} {"train_loss": -10.743995666503906, "global_step": 387180, "epoch": 2304} {"train_loss": -9.732675552368164, "global_step": 387181, "epoch": 2304} {"train_loss": -10.301023483276367, "global_step": 387182, "epoch": 2304} {"train_loss": -10.312286376953125, "global_step": 387183, "epoch": 2304} {"train_loss": -10.40788745880127, "global_step": 387184, "epoch": 2304} {"train_loss": -11.017814636230469, "global_step": 387185, "epoch": 2304} {"train_loss": -11.676813125610352, "global_step": 387186, "epoch": 2304} {"train_loss": -11.573469161987305, "global_step": 387187, "epoch": 2304} {"train_loss": -11.286325454711914, "global_step": 387188, "epoch": 2304} {"train_loss": -11.821050643920898, "global_step": 387189, "epoch": 2304} {"train_loss": -11.799179077148438, "global_step": 387190, "epoch": 2304} {"train_loss": -11.695175170898438, "global_step": 387191, "epoch": 2304} {"train_loss": -11.840283393859863, "global_step": 387192, "epoch": 2304} {"train_loss": -11.497430801391602, "global_step": 387193, "epoch": 2304} {"train_loss": -11.94393539428711, "global_step": 387194, "epoch": 2304} {"train_loss": -11.840781211853027, "global_step": 387195, "epoch": 2304} {"train_loss": -11.715755462646484, "global_step": 387196, "epoch": 2304} {"train_loss": -12.046463012695312, "global_step": 387197, "epoch": 2304} {"train_loss": -11.796865463256836, "global_step": 387198, "epoch": 2304} {"train_loss": -11.953290939331055, "global_step": 387199, "epoch": 2304} {"train_loss": -12.170980453491211, "global_step": 387200, "epoch": 2304} {"train_loss": -11.539528846740723, "global_step": 387201, "epoch": 2304} {"train_loss": -12.026262283325195, "global_step": 387202, "epoch": 2304} {"train_loss": -11.92239761352539, "global_step": 387203, "epoch": 2304} {"train_loss": -11.93838882446289, "global_step": 387204, "epoch": 2304} {"train_loss": -12.190183639526367, "global_step": 387205, "epoch": 2304} {"train_loss": -12.062070846557617, "global_step": 387206, "epoch": 2304} {"train_loss": -12.01738452911377, "global_step": 387207, "epoch": 2304} {"train_loss": -12.12679672241211, "global_step": 387208, "epoch": 2304} {"train_loss": -11.888656616210938, "global_step": 387209, "epoch": 2304} {"train_loss": -12.303119659423828, "global_step": 387210, "epoch": 2304} {"train_loss": -11.826738357543945, "global_step": 387211, "epoch": 2304} {"train_loss": -12.094554901123047, "global_step": 387212, "epoch": 2304} {"train_loss": -12.263866424560547, "global_step": 387213, "epoch": 2304} {"train_loss": -12.054688453674316, "global_step": 387214, "epoch": 2304} {"train_loss": -12.337662696838379, "global_step": 387215, "epoch": 2304} {"train_loss": -12.117652893066406, "global_step": 387216, "epoch": 2304} {"train_loss": -12.314698219299316, "global_step": 387217, "epoch": 2304} {"train_loss": -12.203126907348633, "global_step": 387218, "epoch": 2304} {"train_loss": -12.262544631958008, "global_step": 387219, "epoch": 2304} {"train_loss": -12.32594108581543, "global_step": 387220, "epoch": 2304} {"train_loss": -12.167156219482422, "global_step": 387221, "epoch": 2304} {"train_loss": -12.284737586975098, "global_step": 387222, "epoch": 2304} {"train_loss": -12.454333305358887, "global_step": 387223, "epoch": 2304} {"train_loss": -12.410740852355957, "global_step": 387224, "epoch": 2304} {"train_loss": -12.190675735473633, "global_step": 387225, "epoch": 2304} {"train_loss": -11.97497272491455, "global_step": 387226, "epoch": 2304} {"train_loss": -12.15141487121582, "global_step": 387227, "epoch": 2304} {"train_loss": -12.12627124786377, "global_step": 387228, "epoch": 2304} {"train_loss": -12.51023006439209, "global_step": 387229, "epoch": 2304} {"train_loss": -12.41945743560791, "global_step": 387230, "epoch": 2304} {"train_loss": -12.372621536254883, "global_step": 387231, "epoch": 2304} {"train_loss": -12.330678939819336, "global_step": 387232, "epoch": 2304} {"train_loss": -12.43039321899414, "global_step": 387233, "epoch": 2304} {"train_loss": -12.425922393798828, "global_step": 387234, "epoch": 2304} {"train_loss": -12.390989303588867, "global_step": 387235, "epoch": 2304} {"train_loss": -12.406970977783203, "global_step": 387236, "epoch": 2304} {"train_loss": -12.09210205078125, "global_step": 387237, "epoch": 2304} {"train_loss": -12.21430492401123, "global_step": 387238, "epoch": 2304} {"train_loss": -11.915998839196705, "global_step": 387239, "epoch": 2304, "val_loss": 294653.3125} {"train_loss": -12.07158374786377, "global_step": 387240, "epoch": 2305} {"train_loss": -12.413936614990234, "global_step": 387241, "epoch": 2305} {"train_loss": -12.12075424194336, "global_step": 387242, "epoch": 2305} {"train_loss": -12.248798370361328, "global_step": 387243, "epoch": 2305} {"train_loss": -12.445630073547363, "global_step": 387244, "epoch": 2305} {"train_loss": -12.235089302062988, "global_step": 387245, "epoch": 2305} {"train_loss": -12.213623046875, "global_step": 387246, "epoch": 2305} {"train_loss": -12.005630493164062, "global_step": 387247, "epoch": 2305} {"train_loss": -12.48145866394043, "global_step": 387248, "epoch": 2305} {"train_loss": -11.8299560546875, "global_step": 387249, "epoch": 2305} {"train_loss": -12.452664375305176, "global_step": 387250, "epoch": 2305} {"train_loss": -12.144997596740723, "global_step": 387251, "epoch": 2305} {"train_loss": -12.347978591918945, "global_step": 387252, "epoch": 2305} {"train_loss": -11.950571060180664, "global_step": 387253, "epoch": 2305} {"train_loss": -12.154918670654297, "global_step": 387254, "epoch": 2305} {"train_loss": -12.161653518676758, "global_step": 387255, "epoch": 2305} {"train_loss": -12.165512084960938, "global_step": 387256, "epoch": 2305} {"train_loss": -12.503143310546875, "global_step": 387257, "epoch": 2305} {"train_loss": -11.998802185058594, "global_step": 387258, "epoch": 2305} {"train_loss": -12.224623680114746, "global_step": 387259, "epoch": 2305} {"train_loss": -11.857593536376953, "global_step": 387260, "epoch": 2305} {"train_loss": -12.367286682128906, "global_step": 387261, "epoch": 2305} {"train_loss": -12.249341011047363, "global_step": 387262, "epoch": 2305} {"train_loss": -12.144006729125977, "global_step": 387263, "epoch": 2305} {"train_loss": -12.094673156738281, "global_step": 387264, "epoch": 2305} {"train_loss": -12.241579055786133, "global_step": 387265, "epoch": 2305} {"train_loss": -12.583916664123535, "global_step": 387266, "epoch": 2305} {"train_loss": -12.224864959716797, "global_step": 387267, "epoch": 2305} {"train_loss": -12.489476203918457, "global_step": 387268, "epoch": 2305} {"train_loss": -12.120769500732422, "global_step": 387269, "epoch": 2305} {"train_loss": -12.608153343200684, "global_step": 387270, "epoch": 2305} {"train_loss": -12.188658714294434, "global_step": 387271, "epoch": 2305} {"train_loss": -12.34168815612793, "global_step": 387272, "epoch": 2305} {"train_loss": -12.458507537841797, "global_step": 387273, "epoch": 2305} {"train_loss": -12.404775619506836, "global_step": 387274, "epoch": 2305} {"train_loss": -12.466583251953125, "global_step": 387275, "epoch": 2305} {"train_loss": -12.216768264770508, "global_step": 387276, "epoch": 2305} {"train_loss": -12.431846618652344, "global_step": 387277, "epoch": 2305} {"train_loss": -12.376906394958496, "global_step": 387278, "epoch": 2305} {"train_loss": -12.478231430053711, "global_step": 387279, "epoch": 2305} {"train_loss": -11.997188568115234, "global_step": 387280, "epoch": 2305} {"train_loss": -12.391261100769043, "global_step": 387281, "epoch": 2305} {"train_loss": -12.449448585510254, "global_step": 387282, "epoch": 2305} {"train_loss": -12.499263763427734, "global_step": 387283, "epoch": 2305} {"train_loss": -12.419178009033203, "global_step": 387284, "epoch": 2305} {"train_loss": -12.567219734191895, "global_step": 387285, "epoch": 2305} {"train_loss": -12.55195426940918, "global_step": 387286, "epoch": 2305} {"train_loss": -12.729842185974121, "global_step": 387287, "epoch": 2305} {"train_loss": -12.826014518737793, "global_step": 387288, "epoch": 2305} {"train_loss": -12.729679107666016, "global_step": 387289, "epoch": 2305} {"train_loss": -12.028438568115234, "global_step": 387290, "epoch": 2305} {"train_loss": -12.218755722045898, "global_step": 387291, "epoch": 2305} {"train_loss": -12.559761047363281, "global_step": 387292, "epoch": 2305} {"train_loss": -12.2382230758667, "global_step": 387293, "epoch": 2305} {"train_loss": -11.609189987182617, "global_step": 387294, "epoch": 2305} {"train_loss": -12.178656578063965, "global_step": 387295, "epoch": 2305} {"train_loss": -12.443339347839355, "global_step": 387296, "epoch": 2305} {"train_loss": -12.021294593811035, "global_step": 387297, "epoch": 2305} {"train_loss": -12.096481323242188, "global_step": 387298, "epoch": 2305} {"train_loss": -12.490091323852539, "global_step": 387299, "epoch": 2305} {"train_loss": -11.458772659301758, "global_step": 387300, "epoch": 2305} {"train_loss": -12.442198753356934, "global_step": 387301, "epoch": 2305} {"train_loss": -12.601011276245117, "global_step": 387302, "epoch": 2305} {"train_loss": -12.231084823608398, "global_step": 387303, "epoch": 2305} {"train_loss": -12.300107955932617, "global_step": 387304, "epoch": 2305} {"train_loss": -12.119085311889648, "global_step": 387305, "epoch": 2305} {"train_loss": -12.230398178100586, "global_step": 387306, "epoch": 2305} {"train_loss": -12.387052536010742, "global_step": 387307, "epoch": 2305} {"train_loss": -11.86022663116455, "global_step": 387308, "epoch": 2305} {"train_loss": -11.726730346679688, "global_step": 387309, "epoch": 2305} {"train_loss": -12.627246856689453, "global_step": 387310, "epoch": 2305} {"train_loss": -12.162637710571289, "global_step": 387311, "epoch": 2305} {"train_loss": -12.34107494354248, "global_step": 387312, "epoch": 2305} {"train_loss": -12.461700439453125, "global_step": 387313, "epoch": 2305} {"train_loss": -12.329965591430664, "global_step": 387314, "epoch": 2305} {"train_loss": -12.170555114746094, "global_step": 387315, "epoch": 2305} {"train_loss": -12.224843978881836, "global_step": 387316, "epoch": 2305} {"train_loss": -12.58519172668457, "global_step": 387317, "epoch": 2305} {"train_loss": -12.151597023010254, "global_step": 387318, "epoch": 2305} {"train_loss": -12.391351699829102, "global_step": 387319, "epoch": 2305} {"train_loss": -12.398420333862305, "global_step": 387320, "epoch": 2305} {"train_loss": -12.38927936553955, "global_step": 387321, "epoch": 2305} {"train_loss": -11.72796630859375, "global_step": 387322, "epoch": 2305} {"train_loss": -12.065006256103516, "global_step": 387323, "epoch": 2305} {"train_loss": -12.123979568481445, "global_step": 387324, "epoch": 2305} {"train_loss": -11.017577171325684, "global_step": 387325, "epoch": 2305} {"train_loss": -11.670805931091309, "global_step": 387326, "epoch": 2305} {"train_loss": -12.184002876281738, "global_step": 387327, "epoch": 2305} {"train_loss": -11.64670467376709, "global_step": 387328, "epoch": 2305} {"train_loss": -9.710200309753418, "global_step": 387329, "epoch": 2305} {"train_loss": -11.397965431213379, "global_step": 387330, "epoch": 2305} {"train_loss": -8.947613716125488, "global_step": 387331, "epoch": 2305} {"train_loss": -10.595812797546387, "global_step": 387332, "epoch": 2305} {"train_loss": -8.543885231018066, "global_step": 387333, "epoch": 2305} {"train_loss": -9.841546058654785, "global_step": 387334, "epoch": 2305} {"train_loss": -9.128133773803711, "global_step": 387335, "epoch": 2305} {"train_loss": -9.997060775756836, "global_step": 387336, "epoch": 2305} {"train_loss": -9.228117942810059, "global_step": 387337, "epoch": 2305} {"train_loss": -10.091544151306152, "global_step": 387338, "epoch": 2305} {"train_loss": -9.082864761352539, "global_step": 387339, "epoch": 2305} {"train_loss": -9.112663269042969, "global_step": 387340, "epoch": 2305} {"train_loss": -11.211126327514648, "global_step": 387341, "epoch": 2305} {"train_loss": -9.547595977783203, "global_step": 387342, "epoch": 2305} {"train_loss": -11.129898071289062, "global_step": 387343, "epoch": 2305} {"train_loss": -10.469991683959961, "global_step": 387344, "epoch": 2305} {"train_loss": -10.478721618652344, "global_step": 387345, "epoch": 2305} {"train_loss": -11.141899108886719, "global_step": 387346, "epoch": 2305} {"train_loss": -10.764175415039062, "global_step": 387347, "epoch": 2305} {"train_loss": -11.896933555603027, "global_step": 387348, "epoch": 2305} {"train_loss": -11.607786178588867, "global_step": 387349, "epoch": 2305} {"train_loss": -12.081916809082031, "global_step": 387350, "epoch": 2305} {"train_loss": -11.814668655395508, "global_step": 387351, "epoch": 2305} {"train_loss": -12.037090301513672, "global_step": 387352, "epoch": 2305} {"train_loss": -11.828164100646973, "global_step": 387353, "epoch": 2305} {"train_loss": -11.477535247802734, "global_step": 387354, "epoch": 2305} {"train_loss": -11.866065979003906, "global_step": 387355, "epoch": 2305} {"train_loss": -11.923805236816406, "global_step": 387356, "epoch": 2305} {"train_loss": -11.867104530334473, "global_step": 387357, "epoch": 2305} {"train_loss": -11.699909210205078, "global_step": 387358, "epoch": 2305} {"train_loss": -11.87687873840332, "global_step": 387359, "epoch": 2305} {"train_loss": -11.67388916015625, "global_step": 387360, "epoch": 2305} {"train_loss": -11.859016418457031, "global_step": 387361, "epoch": 2305} {"train_loss": -11.773828506469727, "global_step": 387362, "epoch": 2305} {"train_loss": -11.949746131896973, "global_step": 387363, "epoch": 2305} {"train_loss": -12.138131141662598, "global_step": 387364, "epoch": 2305} {"train_loss": -11.899139404296875, "global_step": 387365, "epoch": 2305} {"train_loss": -12.175762176513672, "global_step": 387366, "epoch": 2305} {"train_loss": -12.108987808227539, "global_step": 387367, "epoch": 2305} {"train_loss": -12.169755935668945, "global_step": 387368, "epoch": 2305} {"train_loss": -12.191675186157227, "global_step": 387369, "epoch": 2305} {"train_loss": -12.050586700439453, "global_step": 387370, "epoch": 2305} {"train_loss": -12.227006912231445, "global_step": 387371, "epoch": 2305} {"train_loss": -12.26268196105957, "global_step": 387372, "epoch": 2305} {"train_loss": -12.341348648071289, "global_step": 387373, "epoch": 2305} {"train_loss": -12.297564506530762, "global_step": 387374, "epoch": 2305} {"train_loss": -12.264514923095703, "global_step": 387375, "epoch": 2305} {"train_loss": -12.325199127197266, "global_step": 387376, "epoch": 2305} {"train_loss": -12.340063095092773, "global_step": 387377, "epoch": 2305} {"train_loss": -12.510747909545898, "global_step": 387378, "epoch": 2305} {"train_loss": -12.366962432861328, "global_step": 387379, "epoch": 2305} {"train_loss": -12.371805191040039, "global_step": 387380, "epoch": 2305} {"train_loss": -12.6107177734375, "global_step": 387381, "epoch": 2305} {"train_loss": -12.24919319152832, "global_step": 387382, "epoch": 2305} {"train_loss": -12.44111442565918, "global_step": 387383, "epoch": 2305} {"train_loss": -12.415138244628906, "global_step": 387384, "epoch": 2305} {"train_loss": -12.370163917541504, "global_step": 387385, "epoch": 2305} {"train_loss": -12.371719360351562, "global_step": 387386, "epoch": 2305} {"train_loss": -12.551204681396484, "global_step": 387387, "epoch": 2305} {"train_loss": -12.346403121948242, "global_step": 387388, "epoch": 2305} {"train_loss": -12.39643669128418, "global_step": 387389, "epoch": 2305} {"train_loss": -12.47167682647705, "global_step": 387390, "epoch": 2305} {"train_loss": -12.55844783782959, "global_step": 387391, "epoch": 2305} {"train_loss": -12.606575012207031, "global_step": 387392, "epoch": 2305} {"train_loss": -12.40485668182373, "global_step": 387393, "epoch": 2305} {"train_loss": -12.623861312866211, "global_step": 387394, "epoch": 2305} {"train_loss": -12.198969841003418, "global_step": 387395, "epoch": 2305} {"train_loss": -12.504995346069336, "global_step": 387396, "epoch": 2305} {"train_loss": -12.511701583862305, "global_step": 387397, "epoch": 2305} {"train_loss": -12.465938568115234, "global_step": 387398, "epoch": 2305} {"train_loss": -12.41249942779541, "global_step": 387399, "epoch": 2305} {"train_loss": -12.599878311157227, "global_step": 387400, "epoch": 2305} {"train_loss": -12.610295295715332, "global_step": 387401, "epoch": 2305} {"train_loss": -12.675565719604492, "global_step": 387402, "epoch": 2305} {"train_loss": -12.299389839172363, "global_step": 387403, "epoch": 2305} {"train_loss": -12.589944839477539, "global_step": 387404, "epoch": 2305} {"train_loss": -12.597136497497559, "global_step": 387405, "epoch": 2305} {"train_loss": -12.642292022705078, "global_step": 387406, "epoch": 2305} {"train_loss": -11.990703525997343, "global_step": 387407, "epoch": 2305, "val_loss": 292267.5625, "train_action_mse_error": 1.6907442808151245} {"train_loss": -12.470891952514648, "global_step": 387408, "epoch": 2306} {"train_loss": -12.51861572265625, "global_step": 387409, "epoch": 2306} {"train_loss": -12.59737777709961, "global_step": 387410, "epoch": 2306} {"train_loss": -12.553184509277344, "global_step": 387411, "epoch": 2306} {"train_loss": -12.403165817260742, "global_step": 387412, "epoch": 2306} {"train_loss": -12.657468795776367, "global_step": 387413, "epoch": 2306} {"train_loss": -12.74872875213623, "global_step": 387414, "epoch": 2306} {"train_loss": -12.796455383300781, "global_step": 387415, "epoch": 2306} {"train_loss": -12.636857986450195, "global_step": 387416, "epoch": 2306} {"train_loss": -12.473930358886719, "global_step": 387417, "epoch": 2306} {"train_loss": -12.794224739074707, "global_step": 387418, "epoch": 2306} {"train_loss": -12.584148406982422, "global_step": 387419, "epoch": 2306} {"train_loss": -12.522407531738281, "global_step": 387420, "epoch": 2306} {"train_loss": -12.631274223327637, "global_step": 387421, "epoch": 2306} {"train_loss": -12.623802185058594, "global_step": 387422, "epoch": 2306} {"train_loss": -12.702153205871582, "global_step": 387423, "epoch": 2306} {"train_loss": -12.664358139038086, "global_step": 387424, "epoch": 2306} {"train_loss": -12.682682037353516, "global_step": 387425, "epoch": 2306} {"train_loss": -12.681293487548828, "global_step": 387426, "epoch": 2306} {"train_loss": -12.63399887084961, "global_step": 387427, "epoch": 2306} {"train_loss": -12.643994331359863, "global_step": 387428, "epoch": 2306} {"train_loss": -12.519994735717773, "global_step": 387429, "epoch": 2306} {"train_loss": -12.630037307739258, "global_step": 387430, "epoch": 2306} {"train_loss": -12.158829689025879, "global_step": 387431, "epoch": 2306} {"train_loss": -12.5982666015625, "global_step": 387432, "epoch": 2306} {"train_loss": -12.519330024719238, "global_step": 387433, "epoch": 2306} {"train_loss": -12.120611190795898, "global_step": 387434, "epoch": 2306} {"train_loss": -12.597164154052734, "global_step": 387435, "epoch": 2306} {"train_loss": -11.850833892822266, "global_step": 387436, "epoch": 2306} {"train_loss": -12.393274307250977, "global_step": 387437, "epoch": 2306} {"train_loss": -11.889106750488281, "global_step": 387438, "epoch": 2306} {"train_loss": -12.612405776977539, "global_step": 387439, "epoch": 2306} {"train_loss": -12.293008804321289, "global_step": 387440, "epoch": 2306} {"train_loss": -12.424163818359375, "global_step": 387441, "epoch": 2306} {"train_loss": -12.517170906066895, "global_step": 387442, "epoch": 2306} {"train_loss": -12.711944580078125, "global_step": 387443, "epoch": 2306} {"train_loss": -12.337118148803711, "global_step": 387444, "epoch": 2306} {"train_loss": -12.30247688293457, "global_step": 387445, "epoch": 2306} {"train_loss": -12.404772758483887, "global_step": 387446, "epoch": 2306} {"train_loss": -12.406787872314453, "global_step": 387447, "epoch": 2306} {"train_loss": -12.341330528259277, "global_step": 387448, "epoch": 2306} {"train_loss": -12.434305191040039, "global_step": 387449, "epoch": 2306} {"train_loss": -11.788908004760742, "global_step": 387450, "epoch": 2306} {"train_loss": -12.073540687561035, "global_step": 387451, "epoch": 2306} {"train_loss": -11.45556926727295, "global_step": 387452, "epoch": 2306} {"train_loss": -12.654558181762695, "global_step": 387453, "epoch": 2306} {"train_loss": -11.063353538513184, "global_step": 387454, "epoch": 2306} {"train_loss": -10.029464721679688, "global_step": 387455, "epoch": 2306} {"train_loss": -10.254705429077148, "global_step": 387456, "epoch": 2306} {"train_loss": -12.617657661437988, "global_step": 387457, "epoch": 2306} {"train_loss": -11.821069717407227, "global_step": 387458, "epoch": 2306} {"train_loss": -11.63961124420166, "global_step": 387459, "epoch": 2306} {"train_loss": -10.937814712524414, "global_step": 387460, "epoch": 2306} {"train_loss": -11.221134185791016, "global_step": 387461, "epoch": 2306} {"train_loss": -10.394445419311523, "global_step": 387462, "epoch": 2306} {"train_loss": -10.832469940185547, "global_step": 387463, "epoch": 2306} {"train_loss": -9.692853927612305, "global_step": 387464, "epoch": 2306} {"train_loss": -10.386046409606934, "global_step": 387465, "epoch": 2306} {"train_loss": -10.618277549743652, "global_step": 387466, "epoch": 2306} {"train_loss": -10.98029899597168, "global_step": 387467, "epoch": 2306} {"train_loss": -10.572115898132324, "global_step": 387468, "epoch": 2306} {"train_loss": -10.82630729675293, "global_step": 387469, "epoch": 2306} {"train_loss": -12.208572387695312, "global_step": 387470, "epoch": 2306} {"train_loss": -10.505538940429688, "global_step": 387471, "epoch": 2306} {"train_loss": -12.273862838745117, "global_step": 387472, "epoch": 2306} {"train_loss": -11.153409957885742, "global_step": 387473, "epoch": 2306} {"train_loss": -11.7878999710083, "global_step": 387474, "epoch": 2306} {"train_loss": -11.975131034851074, "global_step": 387475, "epoch": 2306} {"train_loss": -11.636356353759766, "global_step": 387476, "epoch": 2306} {"train_loss": -11.82802963256836, "global_step": 387477, "epoch": 2306} {"train_loss": -11.200726509094238, "global_step": 387478, "epoch": 2306} {"train_loss": -11.846569061279297, "global_step": 387479, "epoch": 2306} {"train_loss": -11.520020484924316, "global_step": 387480, "epoch": 2306} {"train_loss": -11.494455337524414, "global_step": 387481, "epoch": 2306} {"train_loss": -11.762447357177734, "global_step": 387482, "epoch": 2306} {"train_loss": -11.890810012817383, "global_step": 387483, "epoch": 2306} {"train_loss": -11.352548599243164, "global_step": 387484, "epoch": 2306} {"train_loss": -11.999605178833008, "global_step": 387485, "epoch": 2306} {"train_loss": -10.669729232788086, "global_step": 387486, "epoch": 2306} {"train_loss": -12.190729141235352, "global_step": 387487, "epoch": 2306} {"train_loss": -11.576894760131836, "global_step": 387488, "epoch": 2306} {"train_loss": -11.872537612915039, "global_step": 387489, "epoch": 2306} {"train_loss": -10.6777925491333, "global_step": 387490, "epoch": 2306} {"train_loss": -11.266420364379883, "global_step": 387491, "epoch": 2306} {"train_loss": -9.833375930786133, "global_step": 387492, "epoch": 2306} {"train_loss": -10.833044052124023, "global_step": 387493, "epoch": 2306} {"train_loss": -10.441490173339844, "global_step": 387494, "epoch": 2306} {"train_loss": -10.096416473388672, "global_step": 387495, "epoch": 2306} {"train_loss": -10.394830703735352, "global_step": 387496, "epoch": 2306} {"train_loss": -11.612299919128418, "global_step": 387497, "epoch": 2306} {"train_loss": -10.684925079345703, "global_step": 387498, "epoch": 2306} {"train_loss": -11.292181968688965, "global_step": 387499, "epoch": 2306} {"train_loss": -11.260147094726562, "global_step": 387500, "epoch": 2306} {"train_loss": -11.05711841583252, "global_step": 387501, "epoch": 2306} {"train_loss": -11.915328979492188, "global_step": 387502, "epoch": 2306} {"train_loss": -11.835525512695312, "global_step": 387503, "epoch": 2306} {"train_loss": -11.881839752197266, "global_step": 387504, "epoch": 2306} {"train_loss": -11.835609436035156, "global_step": 387505, "epoch": 2306} {"train_loss": -11.981273651123047, "global_step": 387506, "epoch": 2306} {"train_loss": -11.974382400512695, "global_step": 387507, "epoch": 2306} {"train_loss": -11.997357368469238, "global_step": 387508, "epoch": 2306} {"train_loss": -12.26266860961914, "global_step": 387509, "epoch": 2306} {"train_loss": -12.235976219177246, "global_step": 387510, "epoch": 2306} {"train_loss": -11.917110443115234, "global_step": 387511, "epoch": 2306} {"train_loss": -12.403072357177734, "global_step": 387512, "epoch": 2306} {"train_loss": -11.962878227233887, "global_step": 387513, "epoch": 2306} {"train_loss": -12.281851768493652, "global_step": 387514, "epoch": 2306} {"train_loss": -12.07679557800293, "global_step": 387515, "epoch": 2306} {"train_loss": -12.192648887634277, "global_step": 387516, "epoch": 2306} {"train_loss": -12.227020263671875, "global_step": 387517, "epoch": 2306} {"train_loss": -12.308000564575195, "global_step": 387518, "epoch": 2306} {"train_loss": -12.489898681640625, "global_step": 387519, "epoch": 2306} {"train_loss": -12.48109245300293, "global_step": 387520, "epoch": 2306} {"train_loss": -12.332950592041016, "global_step": 387521, "epoch": 2306} {"train_loss": -12.418563842773438, "global_step": 387522, "epoch": 2306} {"train_loss": -12.40800666809082, "global_step": 387523, "epoch": 2306} {"train_loss": -12.657015800476074, "global_step": 387524, "epoch": 2306} {"train_loss": -12.28034782409668, "global_step": 387525, "epoch": 2306} {"train_loss": -12.358993530273438, "global_step": 387526, "epoch": 2306} {"train_loss": -12.124441146850586, "global_step": 387527, "epoch": 2306} {"train_loss": -12.056451797485352, "global_step": 387528, "epoch": 2306} {"train_loss": -12.192623138427734, "global_step": 387529, "epoch": 2306} {"train_loss": -12.189400672912598, "global_step": 387530, "epoch": 2306} {"train_loss": -12.49641227722168, "global_step": 387531, "epoch": 2306} {"train_loss": -12.351251602172852, "global_step": 387532, "epoch": 2306} {"train_loss": -12.616153717041016, "global_step": 387533, "epoch": 2306} {"train_loss": -12.525020599365234, "global_step": 387534, "epoch": 2306} {"train_loss": -12.425010681152344, "global_step": 387535, "epoch": 2306} {"train_loss": -12.456584930419922, "global_step": 387536, "epoch": 2306} {"train_loss": -12.609301567077637, "global_step": 387537, "epoch": 2306} {"train_loss": -12.526419639587402, "global_step": 387538, "epoch": 2306} {"train_loss": -12.439205169677734, "global_step": 387539, "epoch": 2306} {"train_loss": -12.566612243652344, "global_step": 387540, "epoch": 2306} {"train_loss": -12.511194229125977, "global_step": 387541, "epoch": 2306} {"train_loss": -12.178974151611328, "global_step": 387542, "epoch": 2306} {"train_loss": -12.535472869873047, "global_step": 387543, "epoch": 2306} {"train_loss": -12.269588470458984, "global_step": 387544, "epoch": 2306} {"train_loss": -12.332611083984375, "global_step": 387545, "epoch": 2306} {"train_loss": -12.478033065795898, "global_step": 387546, "epoch": 2306} {"train_loss": -11.880159378051758, "global_step": 387547, "epoch": 2306} {"train_loss": -11.107437133789062, "global_step": 387548, "epoch": 2306} {"train_loss": -12.059196472167969, "global_step": 387549, "epoch": 2306} {"train_loss": -9.7786865234375, "global_step": 387550, "epoch": 2306} {"train_loss": -11.76763916015625, "global_step": 387551, "epoch": 2306} {"train_loss": -11.090869903564453, "global_step": 387552, "epoch": 2306} {"train_loss": -10.630972862243652, "global_step": 387553, "epoch": 2306} {"train_loss": -11.736114501953125, "global_step": 387554, "epoch": 2306} {"train_loss": -10.909404754638672, "global_step": 387555, "epoch": 2306} {"train_loss": -10.710674285888672, "global_step": 387556, "epoch": 2306} {"train_loss": -10.90073013305664, "global_step": 387557, "epoch": 2306} {"train_loss": -10.537012100219727, "global_step": 387558, "epoch": 2306} {"train_loss": -11.829547882080078, "global_step": 387559, "epoch": 2306} {"train_loss": -10.304184913635254, "global_step": 387560, "epoch": 2306} {"train_loss": -11.423563003540039, "global_step": 387561, "epoch": 2306} {"train_loss": -9.620367050170898, "global_step": 387562, "epoch": 2306} {"train_loss": -11.066256523132324, "global_step": 387563, "epoch": 2306} {"train_loss": -11.882055282592773, "global_step": 387564, "epoch": 2306} {"train_loss": -10.275789260864258, "global_step": 387565, "epoch": 2306} {"train_loss": -11.682126998901367, "global_step": 387566, "epoch": 2306} {"train_loss": -9.94885540008545, "global_step": 387567, "epoch": 2306} {"train_loss": -10.311715126037598, "global_step": 387568, "epoch": 2306} {"train_loss": -11.239522933959961, "global_step": 387569, "epoch": 2306} {"train_loss": -10.869434356689453, "global_step": 387570, "epoch": 2306} {"train_loss": -11.41285514831543, "global_step": 387571, "epoch": 2306} {"train_loss": -11.572587966918945, "global_step": 387572, "epoch": 2306} {"train_loss": -11.523262977600098, "global_step": 387573, "epoch": 2306} {"train_loss": -11.725807189941406, "global_step": 387574, "epoch": 2306} {"train_loss": -11.805054227511087, "global_step": 387575, "epoch": 2306, "val_loss": 296673.59375} {"train_loss": -11.57703971862793, "global_step": 387576, "epoch": 2307} {"train_loss": -11.790319442749023, "global_step": 387577, "epoch": 2307} {"train_loss": -11.496986389160156, "global_step": 387578, "epoch": 2307} {"train_loss": -11.359471321105957, "global_step": 387579, "epoch": 2307} {"train_loss": -11.88157844543457, "global_step": 387580, "epoch": 2307} {"train_loss": -11.620896339416504, "global_step": 387581, "epoch": 2307} {"train_loss": -11.736942291259766, "global_step": 387582, "epoch": 2307} {"train_loss": -11.954107284545898, "global_step": 387583, "epoch": 2307} {"train_loss": -11.814191818237305, "global_step": 387584, "epoch": 2307} {"train_loss": -12.099305152893066, "global_step": 387585, "epoch": 2307} {"train_loss": -12.099664688110352, "global_step": 387586, "epoch": 2307} {"train_loss": -11.675405502319336, "global_step": 387587, "epoch": 2307} {"train_loss": -11.972677230834961, "global_step": 387588, "epoch": 2307} {"train_loss": -11.597543716430664, "global_step": 387589, "epoch": 2307} {"train_loss": -12.065103530883789, "global_step": 387590, "epoch": 2307} {"train_loss": -12.094388961791992, "global_step": 387591, "epoch": 2307} {"train_loss": -11.733155250549316, "global_step": 387592, "epoch": 2307} {"train_loss": -12.003290176391602, "global_step": 387593, "epoch": 2307} {"train_loss": -11.735997200012207, "global_step": 387594, "epoch": 2307} {"train_loss": -12.126225471496582, "global_step": 387595, "epoch": 2307} {"train_loss": -12.074121475219727, "global_step": 387596, "epoch": 2307} {"train_loss": -12.211097717285156, "global_step": 387597, "epoch": 2307} {"train_loss": -11.983936309814453, "global_step": 387598, "epoch": 2307} {"train_loss": -11.806098937988281, "global_step": 387599, "epoch": 2307} {"train_loss": -12.381219863891602, "global_step": 387600, "epoch": 2307} {"train_loss": -11.80295181274414, "global_step": 387601, "epoch": 2307} {"train_loss": -12.214433670043945, "global_step": 387602, "epoch": 2307} {"train_loss": -11.983119010925293, "global_step": 387603, "epoch": 2307} {"train_loss": -11.958794593811035, "global_step": 387604, "epoch": 2307} {"train_loss": -12.491615295410156, "global_step": 387605, "epoch": 2307} {"train_loss": -11.800849914550781, "global_step": 387606, "epoch": 2307} {"train_loss": -12.321075439453125, "global_step": 387607, "epoch": 2307} {"train_loss": -11.989727020263672, "global_step": 387608, "epoch": 2307} {"train_loss": -12.374547958374023, "global_step": 387609, "epoch": 2307} {"train_loss": -12.19327163696289, "global_step": 387610, "epoch": 2307} {"train_loss": -12.270679473876953, "global_step": 387611, "epoch": 2307} {"train_loss": -12.487218856811523, "global_step": 387612, "epoch": 2307} {"train_loss": -12.12478256225586, "global_step": 387613, "epoch": 2307} {"train_loss": -12.379216194152832, "global_step": 387614, "epoch": 2307} {"train_loss": -11.889528274536133, "global_step": 387615, "epoch": 2307} {"train_loss": -12.126398086547852, "global_step": 387616, "epoch": 2307} {"train_loss": -12.404230117797852, "global_step": 387617, "epoch": 2307} {"train_loss": -12.113322257995605, "global_step": 387618, "epoch": 2307} {"train_loss": -12.252862930297852, "global_step": 387619, "epoch": 2307} {"train_loss": -12.19625186920166, "global_step": 387620, "epoch": 2307} {"train_loss": -12.404367446899414, "global_step": 387621, "epoch": 2307} {"train_loss": -12.310150146484375, "global_step": 387622, "epoch": 2307} {"train_loss": -12.467824935913086, "global_step": 387623, "epoch": 2307} {"train_loss": -12.26922607421875, "global_step": 387624, "epoch": 2307} {"train_loss": -12.357747077941895, "global_step": 387625, "epoch": 2307} {"train_loss": -12.339214324951172, "global_step": 387626, "epoch": 2307} {"train_loss": -12.252342224121094, "global_step": 387627, "epoch": 2307} {"train_loss": -12.542984008789062, "global_step": 387628, "epoch": 2307} {"train_loss": -12.36660385131836, "global_step": 387629, "epoch": 2307} {"train_loss": -12.531238555908203, "global_step": 387630, "epoch": 2307} {"train_loss": -12.469725608825684, "global_step": 387631, "epoch": 2307} {"train_loss": -12.490429878234863, "global_step": 387632, "epoch": 2307} {"train_loss": -12.319595336914062, "global_step": 387633, "epoch": 2307} {"train_loss": -12.574359893798828, "global_step": 387634, "epoch": 2307} {"train_loss": -12.618664741516113, "global_step": 387635, "epoch": 2307} {"train_loss": -12.561716079711914, "global_step": 387636, "epoch": 2307} {"train_loss": -12.51275634765625, "global_step": 387637, "epoch": 2307} {"train_loss": -12.55571460723877, "global_step": 387638, "epoch": 2307} {"train_loss": -12.685857772827148, "global_step": 387639, "epoch": 2307} {"train_loss": -12.526079177856445, "global_step": 387640, "epoch": 2307} {"train_loss": -12.502693176269531, "global_step": 387641, "epoch": 2307} {"train_loss": -12.63303279876709, "global_step": 387642, "epoch": 2307} {"train_loss": -12.59123420715332, "global_step": 387643, "epoch": 2307} {"train_loss": -12.614019393920898, "global_step": 387644, "epoch": 2307} {"train_loss": -12.649402618408203, "global_step": 387645, "epoch": 2307} {"train_loss": -12.51379108428955, "global_step": 387646, "epoch": 2307} {"train_loss": -12.681989669799805, "global_step": 387647, "epoch": 2307} {"train_loss": -12.640706062316895, "global_step": 387648, "epoch": 2307} {"train_loss": -12.354913711547852, "global_step": 387649, "epoch": 2307} {"train_loss": -12.431356430053711, "global_step": 387650, "epoch": 2307} {"train_loss": -12.600059509277344, "global_step": 387651, "epoch": 2307} {"train_loss": -12.647513389587402, "global_step": 387652, "epoch": 2307} {"train_loss": -12.391203880310059, "global_step": 387653, "epoch": 2307} {"train_loss": -12.553866386413574, "global_step": 387654, "epoch": 2307} {"train_loss": -12.342530250549316, "global_step": 387655, "epoch": 2307} {"train_loss": -12.305464744567871, "global_step": 387656, "epoch": 2307} {"train_loss": -12.63111400604248, "global_step": 387657, "epoch": 2307} {"train_loss": -12.082742691040039, "global_step": 387658, "epoch": 2307} {"train_loss": -11.141968727111816, "global_step": 387659, "epoch": 2307} {"train_loss": -11.948789596557617, "global_step": 387660, "epoch": 2307} {"train_loss": -11.596681594848633, "global_step": 387661, "epoch": 2307} {"train_loss": -11.540133476257324, "global_step": 387662, "epoch": 2307} {"train_loss": -12.198620796203613, "global_step": 387663, "epoch": 2307} {"train_loss": -11.723812103271484, "global_step": 387664, "epoch": 2307} {"train_loss": -11.939456939697266, "global_step": 387665, "epoch": 2307} {"train_loss": -11.909416198730469, "global_step": 387666, "epoch": 2307} {"train_loss": -12.357521057128906, "global_step": 387667, "epoch": 2307} {"train_loss": -12.376188278198242, "global_step": 387668, "epoch": 2307} {"train_loss": -11.664655685424805, "global_step": 387669, "epoch": 2307} {"train_loss": -11.46809196472168, "global_step": 387670, "epoch": 2307} {"train_loss": -12.517090797424316, "global_step": 387671, "epoch": 2307} {"train_loss": -11.761652946472168, "global_step": 387672, "epoch": 2307} {"train_loss": -11.986848831176758, "global_step": 387673, "epoch": 2307} {"train_loss": -12.440702438354492, "global_step": 387674, "epoch": 2307} {"train_loss": -12.603736877441406, "global_step": 387675, "epoch": 2307} {"train_loss": -12.457496643066406, "global_step": 387676, "epoch": 2307} {"train_loss": -12.450638771057129, "global_step": 387677, "epoch": 2307} {"train_loss": -12.46043872833252, "global_step": 387678, "epoch": 2307} {"train_loss": -12.587434768676758, "global_step": 387679, "epoch": 2307} {"train_loss": -12.493232727050781, "global_step": 387680, "epoch": 2307} {"train_loss": -12.574981689453125, "global_step": 387681, "epoch": 2307} {"train_loss": -12.622193336486816, "global_step": 387682, "epoch": 2307} {"train_loss": -12.387632369995117, "global_step": 387683, "epoch": 2307} {"train_loss": -12.419927597045898, "global_step": 387684, "epoch": 2307} {"train_loss": -12.36050033569336, "global_step": 387685, "epoch": 2307} {"train_loss": -12.564923286437988, "global_step": 387686, "epoch": 2307} {"train_loss": -12.431488037109375, "global_step": 387687, "epoch": 2307} {"train_loss": -12.031819343566895, "global_step": 387688, "epoch": 2307} {"train_loss": -11.866378784179688, "global_step": 387689, "epoch": 2307} {"train_loss": -12.542510986328125, "global_step": 387690, "epoch": 2307} {"train_loss": -12.093781471252441, "global_step": 387691, "epoch": 2307} {"train_loss": -12.04879379272461, "global_step": 387692, "epoch": 2307} {"train_loss": -12.244455337524414, "global_step": 387693, "epoch": 2307} {"train_loss": -11.870777130126953, "global_step": 387694, "epoch": 2307} {"train_loss": -12.393267631530762, "global_step": 387695, "epoch": 2307} {"train_loss": -12.136452674865723, "global_step": 387696, "epoch": 2307} {"train_loss": -12.132331848144531, "global_step": 387697, "epoch": 2307} {"train_loss": -12.383478164672852, "global_step": 387698, "epoch": 2307} {"train_loss": -11.87212085723877, "global_step": 387699, "epoch": 2307} {"train_loss": -12.120973587036133, "global_step": 387700, "epoch": 2307} {"train_loss": -12.078506469726562, "global_step": 387701, "epoch": 2307} {"train_loss": -11.82461166381836, "global_step": 387702, "epoch": 2307} {"train_loss": -11.937560081481934, "global_step": 387703, "epoch": 2307} {"train_loss": -12.54330062866211, "global_step": 387704, "epoch": 2307} {"train_loss": -12.327150344848633, "global_step": 387705, "epoch": 2307} {"train_loss": -12.13775634765625, "global_step": 387706, "epoch": 2307} {"train_loss": -11.393753051757812, "global_step": 387707, "epoch": 2307} {"train_loss": -11.651336669921875, "global_step": 387708, "epoch": 2307} {"train_loss": -11.566110610961914, "global_step": 387709, "epoch": 2307} {"train_loss": -10.183903694152832, "global_step": 387710, "epoch": 2307} {"train_loss": -11.99869155883789, "global_step": 387711, "epoch": 2307} {"train_loss": -9.316508293151855, "global_step": 387712, "epoch": 2307} {"train_loss": -10.612979888916016, "global_step": 387713, "epoch": 2307} {"train_loss": -8.388206481933594, "global_step": 387714, "epoch": 2307} {"train_loss": -9.731836318969727, "global_step": 387715, "epoch": 2307} {"train_loss": -10.145612716674805, "global_step": 387716, "epoch": 2307} {"train_loss": -10.31163215637207, "global_step": 387717, "epoch": 2307} {"train_loss": -9.693883895874023, "global_step": 387718, "epoch": 2307} {"train_loss": -10.451947212219238, "global_step": 387719, "epoch": 2307} {"train_loss": -10.107405662536621, "global_step": 387720, "epoch": 2307} {"train_loss": -9.40925407409668, "global_step": 387721, "epoch": 2307} {"train_loss": -9.028871536254883, "global_step": 387722, "epoch": 2307} {"train_loss": -10.379861831665039, "global_step": 387723, "epoch": 2307} {"train_loss": -10.795941352844238, "global_step": 387724, "epoch": 2307} {"train_loss": -10.440441131591797, "global_step": 387725, "epoch": 2307} {"train_loss": -10.584495544433594, "global_step": 387726, "epoch": 2307} {"train_loss": -10.996866226196289, "global_step": 387727, "epoch": 2307} {"train_loss": -9.676959991455078, "global_step": 387728, "epoch": 2307} {"train_loss": -10.01773452758789, "global_step": 387729, "epoch": 2307} {"train_loss": -10.27276611328125, "global_step": 387730, "epoch": 2307} {"train_loss": -10.307025909423828, "global_step": 387731, "epoch": 2307} {"train_loss": -9.816827774047852, "global_step": 387732, "epoch": 2307} {"train_loss": -9.437915802001953, "global_step": 387733, "epoch": 2307} {"train_loss": -11.17584228515625, "global_step": 387734, "epoch": 2307} {"train_loss": -10.535637855529785, "global_step": 387735, "epoch": 2307} {"train_loss": -10.86603832244873, "global_step": 387736, "epoch": 2307} {"train_loss": -10.697393417358398, "global_step": 387737, "epoch": 2307} {"train_loss": -11.56136417388916, "global_step": 387738, "epoch": 2307} {"train_loss": -10.968616485595703, "global_step": 387739, "epoch": 2307} {"train_loss": -10.55352783203125, "global_step": 387740, "epoch": 2307} {"train_loss": -11.385276794433594, "global_step": 387741, "epoch": 2307} {"train_loss": -11.021268844604492, "global_step": 387742, "epoch": 2307} {"train_loss": -11.816299869900657, "global_step": 387743, "epoch": 2307, "val_loss": 293594.34375} {"train_loss": -11.687362670898438, "global_step": 387744, "epoch": 2308} {"train_loss": -10.731649398803711, "global_step": 387745, "epoch": 2308} {"train_loss": -11.161359786987305, "global_step": 387746, "epoch": 2308} {"train_loss": -11.66899299621582, "global_step": 387747, "epoch": 2308} {"train_loss": -11.164373397827148, "global_step": 387748, "epoch": 2308} {"train_loss": -11.532184600830078, "global_step": 387749, "epoch": 2308} {"train_loss": -12.004339218139648, "global_step": 387750, "epoch": 2308} {"train_loss": -10.931892395019531, "global_step": 387751, "epoch": 2308} {"train_loss": -11.555013656616211, "global_step": 387752, "epoch": 2308} {"train_loss": -11.451123237609863, "global_step": 387753, "epoch": 2308} {"train_loss": -11.413148880004883, "global_step": 387754, "epoch": 2308} {"train_loss": -11.53972053527832, "global_step": 387755, "epoch": 2308} {"train_loss": -12.101560592651367, "global_step": 387756, "epoch": 2308} {"train_loss": -11.17003345489502, "global_step": 387757, "epoch": 2308} {"train_loss": -11.444732666015625, "global_step": 387758, "epoch": 2308} {"train_loss": -11.468534469604492, "global_step": 387759, "epoch": 2308} {"train_loss": -10.931354522705078, "global_step": 387760, "epoch": 2308} {"train_loss": -11.712393760681152, "global_step": 387761, "epoch": 2308} {"train_loss": -10.834774017333984, "global_step": 387762, "epoch": 2308} {"train_loss": -11.678094863891602, "global_step": 387763, "epoch": 2308} {"train_loss": -11.933149337768555, "global_step": 387764, "epoch": 2308} {"train_loss": -11.630972862243652, "global_step": 387765, "epoch": 2308} {"train_loss": -11.665844917297363, "global_step": 387766, "epoch": 2308} {"train_loss": -12.049797058105469, "global_step": 387767, "epoch": 2308} {"train_loss": -11.478357315063477, "global_step": 387768, "epoch": 2308} {"train_loss": -12.07937240600586, "global_step": 387769, "epoch": 2308} {"train_loss": -11.854736328125, "global_step": 387770, "epoch": 2308} {"train_loss": -11.725503921508789, "global_step": 387771, "epoch": 2308} {"train_loss": -11.928948402404785, "global_step": 387772, "epoch": 2308} {"train_loss": -11.99284553527832, "global_step": 387773, "epoch": 2308} {"train_loss": -12.141082763671875, "global_step": 387774, "epoch": 2308} {"train_loss": -12.243856430053711, "global_step": 387775, "epoch": 2308} {"train_loss": -12.029515266418457, "global_step": 387776, "epoch": 2308} {"train_loss": -12.34764289855957, "global_step": 387777, "epoch": 2308} {"train_loss": -12.299964904785156, "global_step": 387778, "epoch": 2308} {"train_loss": -11.975759506225586, "global_step": 387779, "epoch": 2308} {"train_loss": -12.318304061889648, "global_step": 387780, "epoch": 2308} {"train_loss": -11.937938690185547, "global_step": 387781, "epoch": 2308} {"train_loss": -12.213927268981934, "global_step": 387782, "epoch": 2308} {"train_loss": -12.028278350830078, "global_step": 387783, "epoch": 2308} {"train_loss": -12.265970230102539, "global_step": 387784, "epoch": 2308} {"train_loss": -11.956927299499512, "global_step": 387785, "epoch": 2308} {"train_loss": -12.286478996276855, "global_step": 387786, "epoch": 2308} {"train_loss": -12.107786178588867, "global_step": 387787, "epoch": 2308} {"train_loss": -12.272927284240723, "global_step": 387788, "epoch": 2308} {"train_loss": -11.55947208404541, "global_step": 387789, "epoch": 2308} {"train_loss": -12.377391815185547, "global_step": 387790, "epoch": 2308} {"train_loss": -12.284168243408203, "global_step": 387791, "epoch": 2308} {"train_loss": -12.405762672424316, "global_step": 387792, "epoch": 2308} {"train_loss": -12.289091110229492, "global_step": 387793, "epoch": 2308} {"train_loss": -12.29991626739502, "global_step": 387794, "epoch": 2308} {"train_loss": -11.061595916748047, "global_step": 387795, "epoch": 2308} {"train_loss": -12.092435836791992, "global_step": 387796, "epoch": 2308} {"train_loss": -11.348579406738281, "global_step": 387797, "epoch": 2308} {"train_loss": -12.156412124633789, "global_step": 387798, "epoch": 2308} {"train_loss": -11.913629531860352, "global_step": 387799, "epoch": 2308} {"train_loss": -11.767651557922363, "global_step": 387800, "epoch": 2308} {"train_loss": -12.060792922973633, "global_step": 387801, "epoch": 2308} {"train_loss": -12.004257202148438, "global_step": 387802, "epoch": 2308} {"train_loss": -12.323728561401367, "global_step": 387803, "epoch": 2308} {"train_loss": -12.120872497558594, "global_step": 387804, "epoch": 2308} {"train_loss": -12.13061809539795, "global_step": 387805, "epoch": 2308} {"train_loss": -12.312335968017578, "global_step": 387806, "epoch": 2308} {"train_loss": -12.174517631530762, "global_step": 387807, "epoch": 2308} {"train_loss": -12.239749908447266, "global_step": 387808, "epoch": 2308} {"train_loss": -12.326835632324219, "global_step": 387809, "epoch": 2308} {"train_loss": -12.075511932373047, "global_step": 387810, "epoch": 2308} {"train_loss": -12.236260414123535, "global_step": 387811, "epoch": 2308} {"train_loss": -12.471434593200684, "global_step": 387812, "epoch": 2308} {"train_loss": -12.257585525512695, "global_step": 387813, "epoch": 2308} {"train_loss": -12.345794677734375, "global_step": 387814, "epoch": 2308} {"train_loss": -12.23905086517334, "global_step": 387815, "epoch": 2308} {"train_loss": -12.179977416992188, "global_step": 387816, "epoch": 2308} {"train_loss": -12.415159225463867, "global_step": 387817, "epoch": 2308} {"train_loss": -12.604375839233398, "global_step": 387818, "epoch": 2308} {"train_loss": -12.223325729370117, "global_step": 387819, "epoch": 2308} {"train_loss": -12.398313522338867, "global_step": 387820, "epoch": 2308} {"train_loss": -12.276169776916504, "global_step": 387821, "epoch": 2308} {"train_loss": -12.333505630493164, "global_step": 387822, "epoch": 2308} {"train_loss": -12.25555419921875, "global_step": 387823, "epoch": 2308} {"train_loss": -12.479334831237793, "global_step": 387824, "epoch": 2308} {"train_loss": -12.636800765991211, "global_step": 387825, "epoch": 2308} {"train_loss": -12.563057899475098, "global_step": 387826, "epoch": 2308} {"train_loss": -12.551775932312012, "global_step": 387827, "epoch": 2308} {"train_loss": -12.468420028686523, "global_step": 387828, "epoch": 2308} {"train_loss": -12.635021209716797, "global_step": 387829, "epoch": 2308} {"train_loss": -12.729095458984375, "global_step": 387830, "epoch": 2308} {"train_loss": -12.545854568481445, "global_step": 387831, "epoch": 2308} {"train_loss": -12.407342910766602, "global_step": 387832, "epoch": 2308} {"train_loss": -12.610974311828613, "global_step": 387833, "epoch": 2308} {"train_loss": -12.352375030517578, "global_step": 387834, "epoch": 2308} {"train_loss": -12.321630477905273, "global_step": 387835, "epoch": 2308} {"train_loss": -12.608942985534668, "global_step": 387836, "epoch": 2308} {"train_loss": -12.333824157714844, "global_step": 387837, "epoch": 2308} {"train_loss": -12.015985488891602, "global_step": 387838, "epoch": 2308} {"train_loss": -12.23527717590332, "global_step": 387839, "epoch": 2308} {"train_loss": -12.44062614440918, "global_step": 387840, "epoch": 2308} {"train_loss": -12.712224960327148, "global_step": 387841, "epoch": 2308} {"train_loss": -12.05579948425293, "global_step": 387842, "epoch": 2308} {"train_loss": -12.198125839233398, "global_step": 387843, "epoch": 2308} {"train_loss": -12.246780395507812, "global_step": 387844, "epoch": 2308} {"train_loss": -12.201639175415039, "global_step": 387845, "epoch": 2308} {"train_loss": -12.038458824157715, "global_step": 387846, "epoch": 2308} {"train_loss": -12.297700881958008, "global_step": 387847, "epoch": 2308} {"train_loss": -12.334665298461914, "global_step": 387848, "epoch": 2308} {"train_loss": -12.047014236450195, "global_step": 387849, "epoch": 2308} {"train_loss": -12.284550666809082, "global_step": 387850, "epoch": 2308} {"train_loss": -12.413926124572754, "global_step": 387851, "epoch": 2308} {"train_loss": -12.665365219116211, "global_step": 387852, "epoch": 2308} {"train_loss": -12.12940788269043, "global_step": 387853, "epoch": 2308} {"train_loss": -12.032991409301758, "global_step": 387854, "epoch": 2308} {"train_loss": -12.18121337890625, "global_step": 387855, "epoch": 2308} {"train_loss": -12.551813125610352, "global_step": 387856, "epoch": 2308} {"train_loss": -12.226343154907227, "global_step": 387857, "epoch": 2308} {"train_loss": -11.974386215209961, "global_step": 387858, "epoch": 2308} {"train_loss": -12.63192367553711, "global_step": 387859, "epoch": 2308} {"train_loss": -12.609151840209961, "global_step": 387860, "epoch": 2308} {"train_loss": -12.521181106567383, "global_step": 387861, "epoch": 2308} {"train_loss": -12.509550094604492, "global_step": 387862, "epoch": 2308} {"train_loss": -12.089106559753418, "global_step": 387863, "epoch": 2308} {"train_loss": -12.209142684936523, "global_step": 387864, "epoch": 2308} {"train_loss": -12.564400672912598, "global_step": 387865, "epoch": 2308} {"train_loss": -12.369101524353027, "global_step": 387866, "epoch": 2308} {"train_loss": -12.313217163085938, "global_step": 387867, "epoch": 2308} {"train_loss": -12.202640533447266, "global_step": 387868, "epoch": 2308} {"train_loss": -11.720720291137695, "global_step": 387869, "epoch": 2308} {"train_loss": -12.29776382446289, "global_step": 387870, "epoch": 2308} {"train_loss": -12.287267684936523, "global_step": 387871, "epoch": 2308} {"train_loss": -12.49631118774414, "global_step": 387872, "epoch": 2308} {"train_loss": -12.405824661254883, "global_step": 387873, "epoch": 2308} {"train_loss": -12.461483001708984, "global_step": 387874, "epoch": 2308} {"train_loss": -12.450750350952148, "global_step": 387875, "epoch": 2308} {"train_loss": -12.022777557373047, "global_step": 387876, "epoch": 2308} {"train_loss": -12.344099044799805, "global_step": 387877, "epoch": 2308} {"train_loss": -12.594112396240234, "global_step": 387878, "epoch": 2308} {"train_loss": -12.329035758972168, "global_step": 387879, "epoch": 2308} {"train_loss": -11.947128295898438, "global_step": 387880, "epoch": 2308} {"train_loss": -10.42315673828125, "global_step": 387881, "epoch": 2308} {"train_loss": -10.181417465209961, "global_step": 387882, "epoch": 2308} {"train_loss": -11.684329986572266, "global_step": 387883, "epoch": 2308} {"train_loss": -11.958694458007812, "global_step": 387884, "epoch": 2308} {"train_loss": -11.965381622314453, "global_step": 387885, "epoch": 2308} {"train_loss": -11.236005783081055, "global_step": 387886, "epoch": 2308} {"train_loss": -11.596944808959961, "global_step": 387887, "epoch": 2308} {"train_loss": -10.598003387451172, "global_step": 387888, "epoch": 2308} {"train_loss": -10.383678436279297, "global_step": 387889, "epoch": 2308} {"train_loss": -8.65213680267334, "global_step": 387890, "epoch": 2308} {"train_loss": -8.585367202758789, "global_step": 387891, "epoch": 2308} {"train_loss": -10.360715866088867, "global_step": 387892, "epoch": 2308} {"train_loss": -8.156667709350586, "global_step": 387893, "epoch": 2308} {"train_loss": -9.652294158935547, "global_step": 387894, "epoch": 2308} {"train_loss": -8.10329818725586, "global_step": 387895, "epoch": 2308} {"train_loss": -8.310354232788086, "global_step": 387896, "epoch": 2308} {"train_loss": -8.820280075073242, "global_step": 387897, "epoch": 2308} {"train_loss": -9.726634979248047, "global_step": 387898, "epoch": 2308} {"train_loss": -8.684221267700195, "global_step": 387899, "epoch": 2308} {"train_loss": -8.670650482177734, "global_step": 387900, "epoch": 2308} {"train_loss": -7.796853065490723, "global_step": 387901, "epoch": 2308} {"train_loss": -7.769561767578125, "global_step": 387902, "epoch": 2308} {"train_loss": -7.874166488647461, "global_step": 387903, "epoch": 2308} {"train_loss": -8.617053985595703, "global_step": 387904, "epoch": 2308} {"train_loss": -9.245979309082031, "global_step": 387905, "epoch": 2308} {"train_loss": -8.90394401550293, "global_step": 387906, "epoch": 2308} {"train_loss": -10.466461181640625, "global_step": 387907, "epoch": 2308} {"train_loss": -9.097795486450195, "global_step": 387908, "epoch": 2308} {"train_loss": -9.51257038116455, "global_step": 387909, "epoch": 2308} {"train_loss": -10.379600524902344, "global_step": 387910, "epoch": 2308} {"train_loss": -11.646590357735043, "global_step": 387911, "epoch": 2308, "val_loss": 293943.15625} {"train_loss": -10.539384841918945, "global_step": 387912, "epoch": 2309} {"train_loss": -10.714890480041504, "global_step": 387913, "epoch": 2309} {"train_loss": -11.531573295593262, "global_step": 387914, "epoch": 2309} {"train_loss": -10.50100326538086, "global_step": 387915, "epoch": 2309} {"train_loss": -10.904287338256836, "global_step": 387916, "epoch": 2309} {"train_loss": -11.022195816040039, "global_step": 387917, "epoch": 2309} {"train_loss": -10.198103904724121, "global_step": 387918, "epoch": 2309} {"train_loss": -10.668924331665039, "global_step": 387919, "epoch": 2309} {"train_loss": -11.338062286376953, "global_step": 387920, "epoch": 2309} {"train_loss": -11.010492324829102, "global_step": 387921, "epoch": 2309} {"train_loss": -11.627975463867188, "global_step": 387922, "epoch": 2309} {"train_loss": -10.616230964660645, "global_step": 387923, "epoch": 2309} {"train_loss": -11.142342567443848, "global_step": 387924, "epoch": 2309} {"train_loss": -11.678040504455566, "global_step": 387925, "epoch": 2309} {"train_loss": -11.650564193725586, "global_step": 387926, "epoch": 2309} {"train_loss": -11.415623664855957, "global_step": 387927, "epoch": 2309} {"train_loss": -11.881538391113281, "global_step": 387928, "epoch": 2309} {"train_loss": -11.316644668579102, "global_step": 387929, "epoch": 2309} {"train_loss": -11.537906646728516, "global_step": 387930, "epoch": 2309} {"train_loss": -11.893418312072754, "global_step": 387931, "epoch": 2309} {"train_loss": -11.517862319946289, "global_step": 387932, "epoch": 2309} {"train_loss": -11.819293975830078, "global_step": 387933, "epoch": 2309} {"train_loss": -11.831013679504395, "global_step": 387934, "epoch": 2309} {"train_loss": -11.405435562133789, "global_step": 387935, "epoch": 2309} {"train_loss": -12.105759620666504, "global_step": 387936, "epoch": 2309} {"train_loss": -11.940350532531738, "global_step": 387937, "epoch": 2309} {"train_loss": -11.92798137664795, "global_step": 387938, "epoch": 2309} {"train_loss": -12.18995189666748, "global_step": 387939, "epoch": 2309} {"train_loss": -11.65049934387207, "global_step": 387940, "epoch": 2309} {"train_loss": -11.983602523803711, "global_step": 387941, "epoch": 2309} {"train_loss": -12.20694351196289, "global_step": 387942, "epoch": 2309} {"train_loss": -12.050681114196777, "global_step": 387943, "epoch": 2309} {"train_loss": -12.03520393371582, "global_step": 387944, "epoch": 2309} {"train_loss": -12.211145401000977, "global_step": 387945, "epoch": 2309} {"train_loss": -11.874356269836426, "global_step": 387946, "epoch": 2309} {"train_loss": -12.20787525177002, "global_step": 387947, "epoch": 2309} {"train_loss": -11.970550537109375, "global_step": 387948, "epoch": 2309} {"train_loss": -12.169992446899414, "global_step": 387949, "epoch": 2309} {"train_loss": -12.10250473022461, "global_step": 387950, "epoch": 2309} {"train_loss": -12.365995407104492, "global_step": 387951, "epoch": 2309} {"train_loss": -12.395174980163574, "global_step": 387952, "epoch": 2309} {"train_loss": -12.298959732055664, "global_step": 387953, "epoch": 2309} {"train_loss": -12.270406723022461, "global_step": 387954, "epoch": 2309} {"train_loss": -12.486610412597656, "global_step": 387955, "epoch": 2309} {"train_loss": -12.280887603759766, "global_step": 387956, "epoch": 2309} {"train_loss": -12.440738677978516, "global_step": 387957, "epoch": 2309} {"train_loss": -12.325650215148926, "global_step": 387958, "epoch": 2309} {"train_loss": -12.342330932617188, "global_step": 387959, "epoch": 2309} {"train_loss": -12.17288589477539, "global_step": 387960, "epoch": 2309} {"train_loss": -12.526471138000488, "global_step": 387961, "epoch": 2309} {"train_loss": -12.192864418029785, "global_step": 387962, "epoch": 2309} {"train_loss": -12.352945327758789, "global_step": 387963, "epoch": 2309} {"train_loss": -12.07027816772461, "global_step": 387964, "epoch": 2309} {"train_loss": -12.47278881072998, "global_step": 387965, "epoch": 2309} {"train_loss": -11.880499839782715, "global_step": 387966, "epoch": 2309} {"train_loss": -12.50097370147705, "global_step": 387967, "epoch": 2309} {"train_loss": -12.347917556762695, "global_step": 387968, "epoch": 2309} {"train_loss": -12.160384178161621, "global_step": 387969, "epoch": 2309} {"train_loss": -12.237448692321777, "global_step": 387970, "epoch": 2309} {"train_loss": -12.124448776245117, "global_step": 387971, "epoch": 2309} {"train_loss": -12.188640594482422, "global_step": 387972, "epoch": 2309} {"train_loss": -12.069110870361328, "global_step": 387973, "epoch": 2309} {"train_loss": -12.483077049255371, "global_step": 387974, "epoch": 2309} {"train_loss": -11.949691772460938, "global_step": 387975, "epoch": 2309} {"train_loss": -12.530807495117188, "global_step": 387976, "epoch": 2309} {"train_loss": -11.826850891113281, "global_step": 387977, "epoch": 2309} {"train_loss": -12.066238403320312, "global_step": 387978, "epoch": 2309} {"train_loss": -12.250299453735352, "global_step": 387979, "epoch": 2309} {"train_loss": -12.130426406860352, "global_step": 387980, "epoch": 2309} {"train_loss": -12.050710678100586, "global_step": 387981, "epoch": 2309} {"train_loss": -12.063522338867188, "global_step": 387982, "epoch": 2309} {"train_loss": -12.357142448425293, "global_step": 387983, "epoch": 2309} {"train_loss": -12.328847885131836, "global_step": 387984, "epoch": 2309} {"train_loss": -12.050972938537598, "global_step": 387985, "epoch": 2309} {"train_loss": -12.240407943725586, "global_step": 387986, "epoch": 2309} {"train_loss": -12.037818908691406, "global_step": 387987, "epoch": 2309} {"train_loss": -12.220721244812012, "global_step": 387988, "epoch": 2309} {"train_loss": -12.027027130126953, "global_step": 387989, "epoch": 2309} {"train_loss": -12.388473510742188, "global_step": 387990, "epoch": 2309} {"train_loss": -12.164257049560547, "global_step": 387991, "epoch": 2309} {"train_loss": -12.231550216674805, "global_step": 387992, "epoch": 2309} {"train_loss": -12.26887035369873, "global_step": 387993, "epoch": 2309} {"train_loss": -12.162939071655273, "global_step": 387994, "epoch": 2309} {"train_loss": -12.513826370239258, "global_step": 387995, "epoch": 2309} {"train_loss": -12.191922187805176, "global_step": 387996, "epoch": 2309} {"train_loss": -12.351057052612305, "global_step": 387997, "epoch": 2309} {"train_loss": -12.126506805419922, "global_step": 387998, "epoch": 2309} {"train_loss": -11.804342269897461, "global_step": 387999, "epoch": 2309} {"train_loss": -12.281408309936523, "global_step": 388000, "epoch": 2309} {"train_loss": -11.615983963012695, "global_step": 388001, "epoch": 2309} {"train_loss": -12.128471374511719, "global_step": 388002, "epoch": 2309} {"train_loss": -11.979652404785156, "global_step": 388003, "epoch": 2309} {"train_loss": -12.173290252685547, "global_step": 388004, "epoch": 2309} {"train_loss": -11.826860427856445, "global_step": 388005, "epoch": 2309} {"train_loss": -12.018304824829102, "global_step": 388006, "epoch": 2309} {"train_loss": -12.051926612854004, "global_step": 388007, "epoch": 2309} {"train_loss": -12.002422332763672, "global_step": 388008, "epoch": 2309} {"train_loss": -12.351476669311523, "global_step": 388009, "epoch": 2309} {"train_loss": -11.69504451751709, "global_step": 388010, "epoch": 2309} {"train_loss": -12.224499702453613, "global_step": 388011, "epoch": 2309} {"train_loss": -12.012312889099121, "global_step": 388012, "epoch": 2309} {"train_loss": -11.948665618896484, "global_step": 388013, "epoch": 2309} {"train_loss": -12.241872787475586, "global_step": 388014, "epoch": 2309} {"train_loss": -12.195917129516602, "global_step": 388015, "epoch": 2309} {"train_loss": -12.336292266845703, "global_step": 388016, "epoch": 2309} {"train_loss": -12.23681640625, "global_step": 388017, "epoch": 2309} {"train_loss": -12.383853912353516, "global_step": 388018, "epoch": 2309} {"train_loss": -12.032505989074707, "global_step": 388019, "epoch": 2309} {"train_loss": -11.573883056640625, "global_step": 388020, "epoch": 2309} {"train_loss": -12.333826065063477, "global_step": 388021, "epoch": 2309} {"train_loss": -12.243226051330566, "global_step": 388022, "epoch": 2309} {"train_loss": -11.602928161621094, "global_step": 388023, "epoch": 2309} {"train_loss": -12.148757934570312, "global_step": 388024, "epoch": 2309} {"train_loss": -12.268441200256348, "global_step": 388025, "epoch": 2309} {"train_loss": -12.00804615020752, "global_step": 388026, "epoch": 2309} {"train_loss": -12.028116226196289, "global_step": 388027, "epoch": 2309} {"train_loss": -11.857072830200195, "global_step": 388028, "epoch": 2309} {"train_loss": -12.477261543273926, "global_step": 388029, "epoch": 2309} {"train_loss": -12.2461519241333, "global_step": 388030, "epoch": 2309} {"train_loss": -12.196233749389648, "global_step": 388031, "epoch": 2309} {"train_loss": -12.43211841583252, "global_step": 388032, "epoch": 2309} {"train_loss": -12.375513076782227, "global_step": 388033, "epoch": 2309} {"train_loss": -12.396299362182617, "global_step": 388034, "epoch": 2309} {"train_loss": -12.335267066955566, "global_step": 388035, "epoch": 2309} {"train_loss": -12.620584487915039, "global_step": 388036, "epoch": 2309} {"train_loss": -12.073723793029785, "global_step": 388037, "epoch": 2309} {"train_loss": -12.484116554260254, "global_step": 388038, "epoch": 2309} {"train_loss": -12.467170715332031, "global_step": 388039, "epoch": 2309} {"train_loss": -12.545211791992188, "global_step": 388040, "epoch": 2309} {"train_loss": -12.363767623901367, "global_step": 388041, "epoch": 2309} {"train_loss": -12.53376579284668, "global_step": 388042, "epoch": 2309} {"train_loss": -12.600055694580078, "global_step": 388043, "epoch": 2309} {"train_loss": -12.536602973937988, "global_step": 388044, "epoch": 2309} {"train_loss": -12.519838333129883, "global_step": 388045, "epoch": 2309} {"train_loss": -12.479839324951172, "global_step": 388046, "epoch": 2309} {"train_loss": -12.50092887878418, "global_step": 388047, "epoch": 2309} {"train_loss": -12.569963455200195, "global_step": 388048, "epoch": 2309} {"train_loss": -12.717119216918945, "global_step": 388049, "epoch": 2309} {"train_loss": -12.786219596862793, "global_step": 388050, "epoch": 2309} {"train_loss": -12.529537200927734, "global_step": 388051, "epoch": 2309} {"train_loss": -12.540782928466797, "global_step": 388052, "epoch": 2309} {"train_loss": -12.226221084594727, "global_step": 388053, "epoch": 2309} {"train_loss": -12.341971397399902, "global_step": 388054, "epoch": 2309} {"train_loss": -12.487686157226562, "global_step": 388055, "epoch": 2309} {"train_loss": -12.26922607421875, "global_step": 388056, "epoch": 2309} {"train_loss": -12.176984786987305, "global_step": 388057, "epoch": 2309} {"train_loss": -12.435075759887695, "global_step": 388058, "epoch": 2309} {"train_loss": -12.268645286560059, "global_step": 388059, "epoch": 2309} {"train_loss": -11.548019409179688, "global_step": 388060, "epoch": 2309} {"train_loss": -12.524188995361328, "global_step": 388061, "epoch": 2309} {"train_loss": -12.2548189163208, "global_step": 388062, "epoch": 2309} {"train_loss": -12.019954681396484, "global_step": 388063, "epoch": 2309} {"train_loss": -12.406562805175781, "global_step": 388064, "epoch": 2309} {"train_loss": -12.387935638427734, "global_step": 388065, "epoch": 2309} {"train_loss": -12.598660469055176, "global_step": 388066, "epoch": 2309} {"train_loss": -12.364201545715332, "global_step": 388067, "epoch": 2309} {"train_loss": -12.607158660888672, "global_step": 388068, "epoch": 2309} {"train_loss": -12.535233497619629, "global_step": 388069, "epoch": 2309} {"train_loss": -12.405793190002441, "global_step": 388070, "epoch": 2309} {"train_loss": -11.920158386230469, "global_step": 388071, "epoch": 2309} {"train_loss": -12.672386169433594, "global_step": 388072, "epoch": 2309} {"train_loss": -12.564312934875488, "global_step": 388073, "epoch": 2309} {"train_loss": -12.599724769592285, "global_step": 388074, "epoch": 2309} {"train_loss": -11.964454650878906, "global_step": 388075, "epoch": 2309} {"train_loss": -12.07026481628418, "global_step": 388076, "epoch": 2309} {"train_loss": -12.263671875, "global_step": 388077, "epoch": 2309} {"train_loss": -11.624563217163086, "global_step": 388078, "epoch": 2309} {"train_loss": -12.083760658899942, "global_step": 388079, "epoch": 2309, "val_loss": 294593.71875} {"train_loss": -11.121620178222656, "global_step": 388080, "epoch": 2310} {"train_loss": -12.509132385253906, "global_step": 388081, "epoch": 2310} {"train_loss": -11.383228302001953, "global_step": 388082, "epoch": 2310} {"train_loss": -11.65999984741211, "global_step": 388083, "epoch": 2310} {"train_loss": -10.972099304199219, "global_step": 388084, "epoch": 2310} {"train_loss": -11.833246231079102, "global_step": 388085, "epoch": 2310} {"train_loss": -11.759542465209961, "global_step": 388086, "epoch": 2310} {"train_loss": -11.24233627319336, "global_step": 388087, "epoch": 2310} {"train_loss": -11.060676574707031, "global_step": 388088, "epoch": 2310} {"train_loss": -11.412846565246582, "global_step": 388089, "epoch": 2310} {"train_loss": -12.097515106201172, "global_step": 388090, "epoch": 2310} {"train_loss": -11.815765380859375, "global_step": 388091, "epoch": 2310} {"train_loss": -11.538599014282227, "global_step": 388092, "epoch": 2310} {"train_loss": -12.089208602905273, "global_step": 388093, "epoch": 2310} {"train_loss": -11.91002082824707, "global_step": 388094, "epoch": 2310} {"train_loss": -12.274702072143555, "global_step": 388095, "epoch": 2310} {"train_loss": -11.482572555541992, "global_step": 388096, "epoch": 2310} {"train_loss": -11.616484642028809, "global_step": 388097, "epoch": 2310} {"train_loss": -12.188085556030273, "global_step": 388098, "epoch": 2310} {"train_loss": -11.325420379638672, "global_step": 388099, "epoch": 2310} {"train_loss": -11.861654281616211, "global_step": 388100, "epoch": 2310} {"train_loss": -11.865904808044434, "global_step": 388101, "epoch": 2310} {"train_loss": -12.12882137298584, "global_step": 388102, "epoch": 2310} {"train_loss": -11.50942325592041, "global_step": 388103, "epoch": 2310} {"train_loss": -11.926868438720703, "global_step": 388104, "epoch": 2310} {"train_loss": -12.318422317504883, "global_step": 388105, "epoch": 2310} {"train_loss": -12.192392349243164, "global_step": 388106, "epoch": 2310} {"train_loss": -12.373435974121094, "global_step": 388107, "epoch": 2310} {"train_loss": -12.046772003173828, "global_step": 388108, "epoch": 2310} {"train_loss": -11.766104698181152, "global_step": 388109, "epoch": 2310} {"train_loss": -12.349563598632812, "global_step": 388110, "epoch": 2310} {"train_loss": -12.402721405029297, "global_step": 388111, "epoch": 2310} {"train_loss": -12.185379028320312, "global_step": 388112, "epoch": 2310} {"train_loss": -12.108890533447266, "global_step": 388113, "epoch": 2310} {"train_loss": -12.451400756835938, "global_step": 388114, "epoch": 2310} {"train_loss": -12.108534812927246, "global_step": 388115, "epoch": 2310} {"train_loss": -12.247684478759766, "global_step": 388116, "epoch": 2310} {"train_loss": -12.177807807922363, "global_step": 388117, "epoch": 2310} {"train_loss": -12.388368606567383, "global_step": 388118, "epoch": 2310} {"train_loss": -12.224814414978027, "global_step": 388119, "epoch": 2310} {"train_loss": -12.169410705566406, "global_step": 388120, "epoch": 2310} {"train_loss": -12.054889678955078, "global_step": 388121, "epoch": 2310} {"train_loss": -12.457845687866211, "global_step": 388122, "epoch": 2310} {"train_loss": -12.082706451416016, "global_step": 388123, "epoch": 2310} {"train_loss": -12.244354248046875, "global_step": 388124, "epoch": 2310} {"train_loss": -12.172897338867188, "global_step": 388125, "epoch": 2310} {"train_loss": -12.365550994873047, "global_step": 388126, "epoch": 2310} {"train_loss": -12.425714492797852, "global_step": 388127, "epoch": 2310} {"train_loss": -12.516059875488281, "global_step": 388128, "epoch": 2310} {"train_loss": -11.997688293457031, "global_step": 388129, "epoch": 2310} {"train_loss": -12.444436073303223, "global_step": 388130, "epoch": 2310} {"train_loss": -11.922660827636719, "global_step": 388131, "epoch": 2310} {"train_loss": -12.122359275817871, "global_step": 388132, "epoch": 2310} {"train_loss": -12.55513858795166, "global_step": 388133, "epoch": 2310} {"train_loss": -11.874027252197266, "global_step": 388134, "epoch": 2310} {"train_loss": -10.801213264465332, "global_step": 388135, "epoch": 2310} {"train_loss": -12.492048263549805, "global_step": 388136, "epoch": 2310} {"train_loss": -11.791238784790039, "global_step": 388137, "epoch": 2310} {"train_loss": -10.81423568725586, "global_step": 388138, "epoch": 2310} {"train_loss": -12.07547378540039, "global_step": 388139, "epoch": 2310} {"train_loss": -11.94237995147705, "global_step": 388140, "epoch": 2310} {"train_loss": -11.581405639648438, "global_step": 388141, "epoch": 2310} {"train_loss": -12.091354370117188, "global_step": 388142, "epoch": 2310} {"train_loss": -12.45850944519043, "global_step": 388143, "epoch": 2310} {"train_loss": -11.864459991455078, "global_step": 388144, "epoch": 2310} {"train_loss": -12.075661659240723, "global_step": 388145, "epoch": 2310} {"train_loss": -12.387767791748047, "global_step": 388146, "epoch": 2310} {"train_loss": -12.075002670288086, "global_step": 388147, "epoch": 2310} {"train_loss": -11.352531433105469, "global_step": 388148, "epoch": 2310} {"train_loss": -11.869331359863281, "global_step": 388149, "epoch": 2310} {"train_loss": -12.143692016601562, "global_step": 388150, "epoch": 2310} {"train_loss": -11.108025550842285, "global_step": 388151, "epoch": 2310} {"train_loss": -11.50171184539795, "global_step": 388152, "epoch": 2310} {"train_loss": -12.344249725341797, "global_step": 388153, "epoch": 2310} {"train_loss": -11.819801330566406, "global_step": 388154, "epoch": 2310} {"train_loss": -12.016355514526367, "global_step": 388155, "epoch": 2310} {"train_loss": -11.551002502441406, "global_step": 388156, "epoch": 2310} {"train_loss": -12.167851448059082, "global_step": 388157, "epoch": 2310} {"train_loss": -11.329584121704102, "global_step": 388158, "epoch": 2310} {"train_loss": -11.789443969726562, "global_step": 388159, "epoch": 2310} {"train_loss": -11.67051887512207, "global_step": 388160, "epoch": 2310} {"train_loss": -12.16954231262207, "global_step": 388161, "epoch": 2310} {"train_loss": -11.862598419189453, "global_step": 388162, "epoch": 2310} {"train_loss": -11.495192527770996, "global_step": 388163, "epoch": 2310} {"train_loss": -11.772624969482422, "global_step": 388164, "epoch": 2310} {"train_loss": -11.587440490722656, "global_step": 388165, "epoch": 2310} {"train_loss": -11.283519744873047, "global_step": 388166, "epoch": 2310} {"train_loss": -11.416595458984375, "global_step": 388167, "epoch": 2310} {"train_loss": -11.055328369140625, "global_step": 388168, "epoch": 2310} {"train_loss": -12.337038040161133, "global_step": 388169, "epoch": 2310} {"train_loss": -11.405674934387207, "global_step": 388170, "epoch": 2310} {"train_loss": -12.057790756225586, "global_step": 388171, "epoch": 2310} {"train_loss": -12.06634521484375, "global_step": 388172, "epoch": 2310} {"train_loss": -11.337403297424316, "global_step": 388173, "epoch": 2310} {"train_loss": -11.899338722229004, "global_step": 388174, "epoch": 2310} {"train_loss": -12.498062133789062, "global_step": 388175, "epoch": 2310} {"train_loss": -11.846992492675781, "global_step": 388176, "epoch": 2310} {"train_loss": -12.051095962524414, "global_step": 388177, "epoch": 2310} {"train_loss": -12.028684616088867, "global_step": 388178, "epoch": 2310} {"train_loss": -12.232093811035156, "global_step": 388179, "epoch": 2310} {"train_loss": -12.212272644042969, "global_step": 388180, "epoch": 2310} {"train_loss": -12.311491966247559, "global_step": 388181, "epoch": 2310} {"train_loss": -12.191394805908203, "global_step": 388182, "epoch": 2310} {"train_loss": -12.253521919250488, "global_step": 388183, "epoch": 2310} {"train_loss": -12.063699722290039, "global_step": 388184, "epoch": 2310} {"train_loss": -11.990957260131836, "global_step": 388185, "epoch": 2310} {"train_loss": -12.286126136779785, "global_step": 388186, "epoch": 2310} {"train_loss": -12.377958297729492, "global_step": 388187, "epoch": 2310} {"train_loss": -12.176633834838867, "global_step": 388188, "epoch": 2310} {"train_loss": -12.344955444335938, "global_step": 388189, "epoch": 2310} {"train_loss": -12.340161323547363, "global_step": 388190, "epoch": 2310} {"train_loss": -11.839542388916016, "global_step": 388191, "epoch": 2310} {"train_loss": -12.219606399536133, "global_step": 388192, "epoch": 2310} {"train_loss": -12.321877479553223, "global_step": 388193, "epoch": 2310} {"train_loss": -12.29830551147461, "global_step": 388194, "epoch": 2310} {"train_loss": -12.425230026245117, "global_step": 388195, "epoch": 2310} {"train_loss": -11.959623336791992, "global_step": 388196, "epoch": 2310} {"train_loss": -12.582487106323242, "global_step": 388197, "epoch": 2310} {"train_loss": -12.29901123046875, "global_step": 388198, "epoch": 2310} {"train_loss": -12.243465423583984, "global_step": 388199, "epoch": 2310} {"train_loss": -12.567420959472656, "global_step": 388200, "epoch": 2310} {"train_loss": -12.561349868774414, "global_step": 388201, "epoch": 2310} {"train_loss": -12.680896759033203, "global_step": 388202, "epoch": 2310} {"train_loss": -12.776044845581055, "global_step": 388203, "epoch": 2310} {"train_loss": -12.431151390075684, "global_step": 388204, "epoch": 2310} {"train_loss": -12.531892776489258, "global_step": 388205, "epoch": 2310} {"train_loss": -12.477249145507812, "global_step": 388206, "epoch": 2310} {"train_loss": -12.6520357131958, "global_step": 388207, "epoch": 2310} {"train_loss": -12.631863594055176, "global_step": 388208, "epoch": 2310} {"train_loss": -12.347562789916992, "global_step": 388209, "epoch": 2310} {"train_loss": -12.151812553405762, "global_step": 388210, "epoch": 2310} {"train_loss": -12.608648300170898, "global_step": 388211, "epoch": 2310} {"train_loss": -12.409524917602539, "global_step": 388212, "epoch": 2310} {"train_loss": -12.579649925231934, "global_step": 388213, "epoch": 2310} {"train_loss": -12.51628303527832, "global_step": 388214, "epoch": 2310} {"train_loss": -11.765851020812988, "global_step": 388215, "epoch": 2310} {"train_loss": -11.855809211730957, "global_step": 388216, "epoch": 2310} {"train_loss": -12.521814346313477, "global_step": 388217, "epoch": 2310} {"train_loss": -12.31990909576416, "global_step": 388218, "epoch": 2310} {"train_loss": -11.933971405029297, "global_step": 388219, "epoch": 2310} {"train_loss": -12.346845626831055, "global_step": 388220, "epoch": 2310} {"train_loss": -12.752166748046875, "global_step": 388221, "epoch": 2310} {"train_loss": -12.463523864746094, "global_step": 388222, "epoch": 2310} {"train_loss": -12.4256010055542, "global_step": 388223, "epoch": 2310} {"train_loss": -12.539814949035645, "global_step": 388224, "epoch": 2310} {"train_loss": -11.968358993530273, "global_step": 388225, "epoch": 2310} {"train_loss": -12.127681732177734, "global_step": 388226, "epoch": 2310} {"train_loss": -12.504791259765625, "global_step": 388227, "epoch": 2310} {"train_loss": -12.153069496154785, "global_step": 388228, "epoch": 2310} {"train_loss": -12.455971717834473, "global_step": 388229, "epoch": 2310} {"train_loss": -12.218345642089844, "global_step": 388230, "epoch": 2310} {"train_loss": -12.32647705078125, "global_step": 388231, "epoch": 2310} {"train_loss": -12.40070915222168, "global_step": 388232, "epoch": 2310} {"train_loss": -12.519464492797852, "global_step": 388233, "epoch": 2310} {"train_loss": -12.032922744750977, "global_step": 388234, "epoch": 2310} {"train_loss": -12.529169082641602, "global_step": 388235, "epoch": 2310} {"train_loss": -12.353172302246094, "global_step": 388236, "epoch": 2310} {"train_loss": -11.407466888427734, "global_step": 388237, "epoch": 2310} {"train_loss": -11.515300750732422, "global_step": 388238, "epoch": 2310} {"train_loss": -11.615938186645508, "global_step": 388239, "epoch": 2310} {"train_loss": -10.46613883972168, "global_step": 388240, "epoch": 2310} {"train_loss": -11.065003395080566, "global_step": 388241, "epoch": 2310} {"train_loss": -12.238853454589844, "global_step": 388242, "epoch": 2310} {"train_loss": -11.144960403442383, "global_step": 388243, "epoch": 2310} {"train_loss": -11.843076705932617, "global_step": 388244, "epoch": 2310} {"train_loss": -9.590583801269531, "global_step": 388245, "epoch": 2310} {"train_loss": -9.71713924407959, "global_step": 388246, "epoch": 2310} {"train_loss": -11.980886510440282, "global_step": 388247, "epoch": 2310, "val_loss": 298559.84375, "train_action_mse_error": 1.2529696226119995} {"train_loss": -8.409294128417969, "global_step": 388248, "epoch": 2311} {"train_loss": -9.335090637207031, "global_step": 388249, "epoch": 2311} {"train_loss": -8.905399322509766, "global_step": 388250, "epoch": 2311} {"train_loss": -8.892909049987793, "global_step": 388251, "epoch": 2311} {"train_loss": -7.325290679931641, "global_step": 388252, "epoch": 2311} {"train_loss": -7.333558082580566, "global_step": 388253, "epoch": 2311} {"train_loss": -9.155489921569824, "global_step": 388254, "epoch": 2311} {"train_loss": -8.706501960754395, "global_step": 388255, "epoch": 2311} {"train_loss": -8.850229263305664, "global_step": 388256, "epoch": 2311} {"train_loss": -9.03194808959961, "global_step": 388257, "epoch": 2311} {"train_loss": -10.672713279724121, "global_step": 388258, "epoch": 2311} {"train_loss": -10.216438293457031, "global_step": 388259, "epoch": 2311} {"train_loss": -11.168285369873047, "global_step": 388260, "epoch": 2311} {"train_loss": -10.69495964050293, "global_step": 388261, "epoch": 2311} {"train_loss": -10.784411430358887, "global_step": 388262, "epoch": 2311} {"train_loss": -10.66560173034668, "global_step": 388263, "epoch": 2311} {"train_loss": -10.854503631591797, "global_step": 388264, "epoch": 2311} {"train_loss": -10.284126281738281, "global_step": 388265, "epoch": 2311} {"train_loss": -11.094742774963379, "global_step": 388266, "epoch": 2311} {"train_loss": -10.350924491882324, "global_step": 388267, "epoch": 2311} {"train_loss": -10.954730987548828, "global_step": 388268, "epoch": 2311} {"train_loss": -11.557279586791992, "global_step": 388269, "epoch": 2311} {"train_loss": -11.169578552246094, "global_step": 388270, "epoch": 2311} {"train_loss": -11.136356353759766, "global_step": 388271, "epoch": 2311} {"train_loss": -10.962675094604492, "global_step": 388272, "epoch": 2311} {"train_loss": -11.659231185913086, "global_step": 388273, "epoch": 2311} {"train_loss": -11.661280632019043, "global_step": 388274, "epoch": 2311} {"train_loss": -11.708165168762207, "global_step": 388275, "epoch": 2311} {"train_loss": -11.60795783996582, "global_step": 388276, "epoch": 2311} {"train_loss": -11.681514739990234, "global_step": 388277, "epoch": 2311} {"train_loss": -11.452127456665039, "global_step": 388278, "epoch": 2311} {"train_loss": -11.725133895874023, "global_step": 388279, "epoch": 2311} {"train_loss": -11.332757949829102, "global_step": 388280, "epoch": 2311} {"train_loss": -11.825390815734863, "global_step": 388281, "epoch": 2311} {"train_loss": -11.281820297241211, "global_step": 388282, "epoch": 2311} {"train_loss": -11.908374786376953, "global_step": 388283, "epoch": 2311} {"train_loss": -11.821023941040039, "global_step": 388284, "epoch": 2311} {"train_loss": -12.034418106079102, "global_step": 388285, "epoch": 2311} {"train_loss": -11.955110549926758, "global_step": 388286, "epoch": 2311} {"train_loss": -11.889399528503418, "global_step": 388287, "epoch": 2311} {"train_loss": -12.089832305908203, "global_step": 388288, "epoch": 2311} {"train_loss": -11.991024017333984, "global_step": 388289, "epoch": 2311} {"train_loss": -12.137350082397461, "global_step": 388290, "epoch": 2311} {"train_loss": -12.225634574890137, "global_step": 388291, "epoch": 2311} {"train_loss": -11.996904373168945, "global_step": 388292, "epoch": 2311} {"train_loss": -12.318696975708008, "global_step": 388293, "epoch": 2311} {"train_loss": -12.036245346069336, "global_step": 388294, "epoch": 2311} {"train_loss": -12.140098571777344, "global_step": 388295, "epoch": 2311} {"train_loss": -12.192221641540527, "global_step": 388296, "epoch": 2311} {"train_loss": -12.034833908081055, "global_step": 388297, "epoch": 2311} {"train_loss": -12.035109519958496, "global_step": 388298, "epoch": 2311} {"train_loss": -12.089742660522461, "global_step": 388299, "epoch": 2311} {"train_loss": -11.98638916015625, "global_step": 388300, "epoch": 2311} {"train_loss": -12.009567260742188, "global_step": 388301, "epoch": 2311} {"train_loss": -12.223600387573242, "global_step": 388302, "epoch": 2311} {"train_loss": -11.873424530029297, "global_step": 388303, "epoch": 2311} {"train_loss": -11.985288619995117, "global_step": 388304, "epoch": 2311} {"train_loss": -12.320331573486328, "global_step": 388305, "epoch": 2311} {"train_loss": -12.068483352661133, "global_step": 388306, "epoch": 2311} {"train_loss": -12.36377239227295, "global_step": 388307, "epoch": 2311} {"train_loss": -12.014174461364746, "global_step": 388308, "epoch": 2311} {"train_loss": -12.236349105834961, "global_step": 388309, "epoch": 2311} {"train_loss": -11.950057983398438, "global_step": 388310, "epoch": 2311} {"train_loss": -12.293598175048828, "global_step": 388311, "epoch": 2311} {"train_loss": -12.100397109985352, "global_step": 388312, "epoch": 2311} {"train_loss": -12.131141662597656, "global_step": 388313, "epoch": 2311} {"train_loss": -12.221794128417969, "global_step": 388314, "epoch": 2311} {"train_loss": -12.173288345336914, "global_step": 388315, "epoch": 2311} {"train_loss": -12.23086166381836, "global_step": 388316, "epoch": 2311} {"train_loss": -12.361021995544434, "global_step": 388317, "epoch": 2311} {"train_loss": -12.156013488769531, "global_step": 388318, "epoch": 2311} {"train_loss": -12.229808807373047, "global_step": 388319, "epoch": 2311} {"train_loss": -11.677480697631836, "global_step": 388320, "epoch": 2311} {"train_loss": -12.543567657470703, "global_step": 388321, "epoch": 2311} {"train_loss": -11.670089721679688, "global_step": 388322, "epoch": 2311} {"train_loss": -12.353097915649414, "global_step": 388323, "epoch": 2311} {"train_loss": -12.177494049072266, "global_step": 388324, "epoch": 2311} {"train_loss": -11.927313804626465, "global_step": 388325, "epoch": 2311} {"train_loss": -12.442913055419922, "global_step": 388326, "epoch": 2311} {"train_loss": -12.344125747680664, "global_step": 388327, "epoch": 2311} {"train_loss": -12.391058921813965, "global_step": 388328, "epoch": 2311} {"train_loss": -12.340754508972168, "global_step": 388329, "epoch": 2311} {"train_loss": -12.216436386108398, "global_step": 388330, "epoch": 2311} {"train_loss": -12.326045989990234, "global_step": 388331, "epoch": 2311} {"train_loss": -11.934565544128418, "global_step": 388332, "epoch": 2311} {"train_loss": -12.06845474243164, "global_step": 388333, "epoch": 2311} {"train_loss": -12.095742225646973, "global_step": 388334, "epoch": 2311} {"train_loss": -11.463262557983398, "global_step": 388335, "epoch": 2311} {"train_loss": -12.363015174865723, "global_step": 388336, "epoch": 2311} {"train_loss": -11.210386276245117, "global_step": 388337, "epoch": 2311} {"train_loss": -11.845449447631836, "global_step": 388338, "epoch": 2311} {"train_loss": -11.999868392944336, "global_step": 388339, "epoch": 2311} {"train_loss": -10.375564575195312, "global_step": 388340, "epoch": 2311} {"train_loss": -12.092317581176758, "global_step": 388341, "epoch": 2311} {"train_loss": -11.562206268310547, "global_step": 388342, "epoch": 2311} {"train_loss": -10.73681926727295, "global_step": 388343, "epoch": 2311} {"train_loss": -12.284423828125, "global_step": 388344, "epoch": 2311} {"train_loss": -11.571904182434082, "global_step": 388345, "epoch": 2311} {"train_loss": -12.349431991577148, "global_step": 388346, "epoch": 2311} {"train_loss": -11.267362594604492, "global_step": 388347, "epoch": 2311} {"train_loss": -11.792236328125, "global_step": 388348, "epoch": 2311} {"train_loss": -11.08917236328125, "global_step": 388349, "epoch": 2311} {"train_loss": -11.487288475036621, "global_step": 388350, "epoch": 2311} {"train_loss": -11.322797775268555, "global_step": 388351, "epoch": 2311} {"train_loss": -11.268207550048828, "global_step": 388352, "epoch": 2311} {"train_loss": -11.788646697998047, "global_step": 388353, "epoch": 2311} {"train_loss": -11.330068588256836, "global_step": 388354, "epoch": 2311} {"train_loss": -10.499370574951172, "global_step": 388355, "epoch": 2311} {"train_loss": -10.227466583251953, "global_step": 388356, "epoch": 2311} {"train_loss": -11.456512451171875, "global_step": 388357, "epoch": 2311} {"train_loss": -9.744170188903809, "global_step": 388358, "epoch": 2311} {"train_loss": -11.465304374694824, "global_step": 388359, "epoch": 2311} {"train_loss": -10.11446475982666, "global_step": 388360, "epoch": 2311} {"train_loss": -10.446441650390625, "global_step": 388361, "epoch": 2311} {"train_loss": -11.233936309814453, "global_step": 388362, "epoch": 2311} {"train_loss": -11.351924896240234, "global_step": 388363, "epoch": 2311} {"train_loss": -11.510791778564453, "global_step": 388364, "epoch": 2311} {"train_loss": -11.971944808959961, "global_step": 388365, "epoch": 2311} {"train_loss": -11.43464469909668, "global_step": 388366, "epoch": 2311} {"train_loss": -11.910050392150879, "global_step": 388367, "epoch": 2311} {"train_loss": -11.63632869720459, "global_step": 388368, "epoch": 2311} {"train_loss": -12.259145736694336, "global_step": 388369, "epoch": 2311} {"train_loss": -11.749075889587402, "global_step": 388370, "epoch": 2311} {"train_loss": -11.985400199890137, "global_step": 388371, "epoch": 2311} {"train_loss": -11.907413482666016, "global_step": 388372, "epoch": 2311} {"train_loss": -12.140480041503906, "global_step": 388373, "epoch": 2311} {"train_loss": -11.592848777770996, "global_step": 388374, "epoch": 2311} {"train_loss": -12.07336711883545, "global_step": 388375, "epoch": 2311} {"train_loss": -11.764955520629883, "global_step": 388376, "epoch": 2311} {"train_loss": -12.25493049621582, "global_step": 388377, "epoch": 2311} {"train_loss": -11.810890197753906, "global_step": 388378, "epoch": 2311} {"train_loss": -12.295404434204102, "global_step": 388379, "epoch": 2311} {"train_loss": -12.075716018676758, "global_step": 388380, "epoch": 2311} {"train_loss": -12.29427719116211, "global_step": 388381, "epoch": 2311} {"train_loss": -12.366962432861328, "global_step": 388382, "epoch": 2311} {"train_loss": -12.289846420288086, "global_step": 388383, "epoch": 2311} {"train_loss": -12.383243560791016, "global_step": 388384, "epoch": 2311} {"train_loss": -12.337644577026367, "global_step": 388385, "epoch": 2311} {"train_loss": -12.312790870666504, "global_step": 388386, "epoch": 2311} {"train_loss": -12.519857406616211, "global_step": 388387, "epoch": 2311} {"train_loss": -12.569416046142578, "global_step": 388388, "epoch": 2311} {"train_loss": -12.182851791381836, "global_step": 388389, "epoch": 2311} {"train_loss": -12.199480056762695, "global_step": 388390, "epoch": 2311} {"train_loss": -11.966155052185059, "global_step": 388391, "epoch": 2311} {"train_loss": -12.176592826843262, "global_step": 388392, "epoch": 2311} {"train_loss": -12.02739143371582, "global_step": 388393, "epoch": 2311} {"train_loss": -12.282350540161133, "global_step": 388394, "epoch": 2311} {"train_loss": -11.763267517089844, "global_step": 388395, "epoch": 2311} {"train_loss": -12.406339645385742, "global_step": 388396, "epoch": 2311} {"train_loss": -11.622190475463867, "global_step": 388397, "epoch": 2311} {"train_loss": -12.083619117736816, "global_step": 388398, "epoch": 2311} {"train_loss": -11.995735168457031, "global_step": 388399, "epoch": 2311} {"train_loss": -12.016571998596191, "global_step": 388400, "epoch": 2311} {"train_loss": -11.80958366394043, "global_step": 388401, "epoch": 2311} {"train_loss": -11.890008926391602, "global_step": 388402, "epoch": 2311} {"train_loss": -11.750804901123047, "global_step": 388403, "epoch": 2311} {"train_loss": -11.878957748413086, "global_step": 388404, "epoch": 2311} {"train_loss": -11.637275695800781, "global_step": 388405, "epoch": 2311} {"train_loss": -12.071310043334961, "global_step": 388406, "epoch": 2311} {"train_loss": -11.60947036743164, "global_step": 388407, "epoch": 2311} {"train_loss": -11.574799537658691, "global_step": 388408, "epoch": 2311} {"train_loss": -11.88549518585205, "global_step": 388409, "epoch": 2311} {"train_loss": -12.049848556518555, "global_step": 388410, "epoch": 2311} {"train_loss": -12.33388614654541, "global_step": 388411, "epoch": 2311} {"train_loss": -11.87517261505127, "global_step": 388412, "epoch": 2311} {"train_loss": -12.62549114227295, "global_step": 388413, "epoch": 2311} {"train_loss": -12.026300430297852, "global_step": 388414, "epoch": 2311} {"train_loss": -11.596346974372864, "global_step": 388415, "epoch": 2311, "val_loss": 295446.5} {"train_loss": -11.969011306762695, "global_step": 388416, "epoch": 2312} {"train_loss": -12.234231948852539, "global_step": 388417, "epoch": 2312} {"train_loss": -12.124279022216797, "global_step": 388418, "epoch": 2312} {"train_loss": -12.211484909057617, "global_step": 388419, "epoch": 2312} {"train_loss": -12.212091445922852, "global_step": 388420, "epoch": 2312} {"train_loss": -12.241740226745605, "global_step": 388421, "epoch": 2312} {"train_loss": -12.163530349731445, "global_step": 388422, "epoch": 2312} {"train_loss": -12.474496841430664, "global_step": 388423, "epoch": 2312} {"train_loss": -12.213228225708008, "global_step": 388424, "epoch": 2312} {"train_loss": -12.337121963500977, "global_step": 388425, "epoch": 2312} {"train_loss": -12.592095375061035, "global_step": 388426, "epoch": 2312} {"train_loss": -12.411064147949219, "global_step": 388427, "epoch": 2312} {"train_loss": -12.709566116333008, "global_step": 388428, "epoch": 2312} {"train_loss": -12.421939849853516, "global_step": 388429, "epoch": 2312} {"train_loss": -12.297515869140625, "global_step": 388430, "epoch": 2312} {"train_loss": -12.392366409301758, "global_step": 388431, "epoch": 2312} {"train_loss": -12.379350662231445, "global_step": 388432, "epoch": 2312} {"train_loss": -12.583383560180664, "global_step": 388433, "epoch": 2312} {"train_loss": -12.377758979797363, "global_step": 388434, "epoch": 2312} {"train_loss": -12.560070037841797, "global_step": 388435, "epoch": 2312} {"train_loss": -12.657792091369629, "global_step": 388436, "epoch": 2312} {"train_loss": -12.132808685302734, "global_step": 388437, "epoch": 2312} {"train_loss": -12.507089614868164, "global_step": 388438, "epoch": 2312} {"train_loss": -12.332096099853516, "global_step": 388439, "epoch": 2312} {"train_loss": -11.654997825622559, "global_step": 388440, "epoch": 2312} {"train_loss": -12.606185913085938, "global_step": 388441, "epoch": 2312} {"train_loss": -12.26826286315918, "global_step": 388442, "epoch": 2312} {"train_loss": -12.16270923614502, "global_step": 388443, "epoch": 2312} {"train_loss": -12.292034149169922, "global_step": 388444, "epoch": 2312} {"train_loss": -11.731708526611328, "global_step": 388445, "epoch": 2312} {"train_loss": -12.41406536102295, "global_step": 388446, "epoch": 2312} {"train_loss": -11.368577003479004, "global_step": 388447, "epoch": 2312} {"train_loss": -12.505475044250488, "global_step": 388448, "epoch": 2312} {"train_loss": -11.84347152709961, "global_step": 388449, "epoch": 2312} {"train_loss": -11.462930679321289, "global_step": 388450, "epoch": 2312} {"train_loss": -11.633487701416016, "global_step": 388451, "epoch": 2312} {"train_loss": -12.366470336914062, "global_step": 388452, "epoch": 2312} {"train_loss": -11.859554290771484, "global_step": 388453, "epoch": 2312} {"train_loss": -11.765108108520508, "global_step": 388454, "epoch": 2312} {"train_loss": -12.29710865020752, "global_step": 388455, "epoch": 2312} {"train_loss": -11.900428771972656, "global_step": 388456, "epoch": 2312} {"train_loss": -12.550697326660156, "global_step": 388457, "epoch": 2312} {"train_loss": -12.002466201782227, "global_step": 388458, "epoch": 2312} {"train_loss": -12.231222152709961, "global_step": 388459, "epoch": 2312} {"train_loss": -11.909207344055176, "global_step": 388460, "epoch": 2312} {"train_loss": -11.75984001159668, "global_step": 388461, "epoch": 2312} {"train_loss": -11.785781860351562, "global_step": 388462, "epoch": 2312} {"train_loss": -11.900594711303711, "global_step": 388463, "epoch": 2312} {"train_loss": -11.705063819885254, "global_step": 388464, "epoch": 2312} {"train_loss": -12.24724292755127, "global_step": 388465, "epoch": 2312} {"train_loss": -11.362508773803711, "global_step": 388466, "epoch": 2312} {"train_loss": -11.853023529052734, "global_step": 388467, "epoch": 2312} {"train_loss": -11.87794303894043, "global_step": 388468, "epoch": 2312} {"train_loss": -11.17351245880127, "global_step": 388469, "epoch": 2312} {"train_loss": -12.443137168884277, "global_step": 388470, "epoch": 2312} {"train_loss": -10.950820922851562, "global_step": 388471, "epoch": 2312} {"train_loss": -11.919633865356445, "global_step": 388472, "epoch": 2312} {"train_loss": -12.046576499938965, "global_step": 388473, "epoch": 2312} {"train_loss": -11.687283515930176, "global_step": 388474, "epoch": 2312} {"train_loss": -11.605113983154297, "global_step": 388475, "epoch": 2312} {"train_loss": -11.423736572265625, "global_step": 388476, "epoch": 2312} {"train_loss": -10.72822093963623, "global_step": 388477, "epoch": 2312} {"train_loss": -11.364814758300781, "global_step": 388478, "epoch": 2312} {"train_loss": -11.096941947937012, "global_step": 388479, "epoch": 2312} {"train_loss": -10.29355525970459, "global_step": 388480, "epoch": 2312} {"train_loss": -10.891374588012695, "global_step": 388481, "epoch": 2312} {"train_loss": -10.671659469604492, "global_step": 388482, "epoch": 2312} {"train_loss": -10.736538887023926, "global_step": 388483, "epoch": 2312} {"train_loss": -11.329591751098633, "global_step": 388484, "epoch": 2312} {"train_loss": -11.455718994140625, "global_step": 388485, "epoch": 2312} {"train_loss": -11.657992362976074, "global_step": 388486, "epoch": 2312} {"train_loss": -12.229816436767578, "global_step": 388487, "epoch": 2312} {"train_loss": -11.142549514770508, "global_step": 388488, "epoch": 2312} {"train_loss": -12.277236938476562, "global_step": 388489, "epoch": 2312} {"train_loss": -11.49785041809082, "global_step": 388490, "epoch": 2312} {"train_loss": -12.152141571044922, "global_step": 388491, "epoch": 2312} {"train_loss": -11.831841468811035, "global_step": 388492, "epoch": 2312} {"train_loss": -11.921119689941406, "global_step": 388493, "epoch": 2312} {"train_loss": -12.313671112060547, "global_step": 388494, "epoch": 2312} {"train_loss": -11.74641227722168, "global_step": 388495, "epoch": 2312} {"train_loss": -12.157502174377441, "global_step": 388496, "epoch": 2312} {"train_loss": -12.145538330078125, "global_step": 388497, "epoch": 2312} {"train_loss": -11.922226905822754, "global_step": 388498, "epoch": 2312} {"train_loss": -11.992035865783691, "global_step": 388499, "epoch": 2312} {"train_loss": -12.04554271697998, "global_step": 388500, "epoch": 2312} {"train_loss": -12.229394912719727, "global_step": 388501, "epoch": 2312} {"train_loss": -11.847454071044922, "global_step": 388502, "epoch": 2312} {"train_loss": -11.630434036254883, "global_step": 388503, "epoch": 2312} {"train_loss": -11.961570739746094, "global_step": 388504, "epoch": 2312} {"train_loss": -11.878280639648438, "global_step": 388505, "epoch": 2312} {"train_loss": -11.960153579711914, "global_step": 388506, "epoch": 2312} {"train_loss": -12.127069473266602, "global_step": 388507, "epoch": 2312} {"train_loss": -11.875526428222656, "global_step": 388508, "epoch": 2312} {"train_loss": -12.125871658325195, "global_step": 388509, "epoch": 2312} {"train_loss": -11.628084182739258, "global_step": 388510, "epoch": 2312} {"train_loss": -11.815194129943848, "global_step": 388511, "epoch": 2312} {"train_loss": -11.906213760375977, "global_step": 388512, "epoch": 2312} {"train_loss": -11.584444046020508, "global_step": 388513, "epoch": 2312} {"train_loss": -12.340646743774414, "global_step": 388514, "epoch": 2312} {"train_loss": -11.678683280944824, "global_step": 388515, "epoch": 2312} {"train_loss": -12.440685272216797, "global_step": 388516, "epoch": 2312} {"train_loss": -12.149270057678223, "global_step": 388517, "epoch": 2312} {"train_loss": -12.24295425415039, "global_step": 388518, "epoch": 2312} {"train_loss": -12.282920837402344, "global_step": 388519, "epoch": 2312} {"train_loss": -12.129924774169922, "global_step": 388520, "epoch": 2312} {"train_loss": -12.153470993041992, "global_step": 388521, "epoch": 2312} {"train_loss": -12.419456481933594, "global_step": 388522, "epoch": 2312} {"train_loss": -12.372209548950195, "global_step": 388523, "epoch": 2312} {"train_loss": -12.378070831298828, "global_step": 388524, "epoch": 2312} {"train_loss": -12.430557250976562, "global_step": 388525, "epoch": 2312} {"train_loss": -12.060691833496094, "global_step": 388526, "epoch": 2312} {"train_loss": -12.622602462768555, "global_step": 388527, "epoch": 2312} {"train_loss": -12.355294227600098, "global_step": 388528, "epoch": 2312} {"train_loss": -12.53131103515625, "global_step": 388529, "epoch": 2312} {"train_loss": -12.425037384033203, "global_step": 388530, "epoch": 2312} {"train_loss": -12.555723190307617, "global_step": 388531, "epoch": 2312} {"train_loss": -12.336822509765625, "global_step": 388532, "epoch": 2312} {"train_loss": -12.226054191589355, "global_step": 388533, "epoch": 2312} {"train_loss": -12.589529037475586, "global_step": 388534, "epoch": 2312} {"train_loss": -12.479939460754395, "global_step": 388535, "epoch": 2312} {"train_loss": -12.619148254394531, "global_step": 388536, "epoch": 2312} {"train_loss": -12.599466323852539, "global_step": 388537, "epoch": 2312} {"train_loss": -12.583065032958984, "global_step": 388538, "epoch": 2312} {"train_loss": -12.595968246459961, "global_step": 388539, "epoch": 2312} {"train_loss": -12.647825241088867, "global_step": 388540, "epoch": 2312} {"train_loss": -12.386695861816406, "global_step": 388541, "epoch": 2312} {"train_loss": -12.535379409790039, "global_step": 388542, "epoch": 2312} {"train_loss": -12.635415077209473, "global_step": 388543, "epoch": 2312} {"train_loss": -12.573113441467285, "global_step": 388544, "epoch": 2312} {"train_loss": -12.48790454864502, "global_step": 388545, "epoch": 2312} {"train_loss": -12.56083869934082, "global_step": 388546, "epoch": 2312} {"train_loss": -12.682537078857422, "global_step": 388547, "epoch": 2312} {"train_loss": -12.331392288208008, "global_step": 388548, "epoch": 2312} {"train_loss": -12.579030990600586, "global_step": 388549, "epoch": 2312} {"train_loss": -12.564022064208984, "global_step": 388550, "epoch": 2312} {"train_loss": -12.563959121704102, "global_step": 388551, "epoch": 2312} {"train_loss": -12.734382629394531, "global_step": 388552, "epoch": 2312} {"train_loss": -12.693839073181152, "global_step": 388553, "epoch": 2312} {"train_loss": -12.46116828918457, "global_step": 388554, "epoch": 2312} {"train_loss": -12.720542907714844, "global_step": 388555, "epoch": 2312} {"train_loss": -12.539844512939453, "global_step": 388556, "epoch": 2312} {"train_loss": -12.561738014221191, "global_step": 388557, "epoch": 2312} {"train_loss": -12.532425880432129, "global_step": 388558, "epoch": 2312} {"train_loss": -12.5116548538208, "global_step": 388559, "epoch": 2312} {"train_loss": -12.533477783203125, "global_step": 388560, "epoch": 2312} {"train_loss": -12.787694931030273, "global_step": 388561, "epoch": 2312} {"train_loss": -11.975976943969727, "global_step": 388562, "epoch": 2312} {"train_loss": -12.674901962280273, "global_step": 388563, "epoch": 2312} {"train_loss": -12.488815307617188, "global_step": 388564, "epoch": 2312} {"train_loss": -12.34803581237793, "global_step": 388565, "epoch": 2312} {"train_loss": -12.528961181640625, "global_step": 388566, "epoch": 2312} {"train_loss": -12.76356315612793, "global_step": 388567, "epoch": 2312} {"train_loss": -12.296051025390625, "global_step": 388568, "epoch": 2312} {"train_loss": -12.591093063354492, "global_step": 388569, "epoch": 2312} {"train_loss": -12.473987579345703, "global_step": 388570, "epoch": 2312} {"train_loss": -12.275763511657715, "global_step": 388571, "epoch": 2312} {"train_loss": -12.377962112426758, "global_step": 388572, "epoch": 2312} {"train_loss": -12.223858833312988, "global_step": 388573, "epoch": 2312} {"train_loss": -11.818771362304688, "global_step": 388574, "epoch": 2312} {"train_loss": -12.145378112792969, "global_step": 388575, "epoch": 2312} {"train_loss": -12.059608459472656, "global_step": 388576, "epoch": 2312} {"train_loss": -11.437484741210938, "global_step": 388577, "epoch": 2312} {"train_loss": -12.045863151550293, "global_step": 388578, "epoch": 2312} {"train_loss": -11.584589004516602, "global_step": 388579, "epoch": 2312} {"train_loss": -11.177510261535645, "global_step": 388580, "epoch": 2312} {"train_loss": -11.75036907196045, "global_step": 388581, "epoch": 2312} {"train_loss": -10.277586936950684, "global_step": 388582, "epoch": 2312} {"train_loss": -12.101163262412662, "global_step": 388583, "epoch": 2312, "val_loss": 298526.84375} {"train_loss": -10.556741714477539, "global_step": 388584, "epoch": 2313} {"train_loss": -12.1029052734375, "global_step": 388585, "epoch": 2313} {"train_loss": -10.362605094909668, "global_step": 388586, "epoch": 2313} {"train_loss": -10.55137825012207, "global_step": 388587, "epoch": 2313} {"train_loss": -11.180144309997559, "global_step": 388588, "epoch": 2313} {"train_loss": -10.815446853637695, "global_step": 388589, "epoch": 2313} {"train_loss": -10.92503547668457, "global_step": 388590, "epoch": 2313} {"train_loss": -8.79536247253418, "global_step": 388591, "epoch": 2313} {"train_loss": -10.119657516479492, "global_step": 388592, "epoch": 2313} {"train_loss": -10.900411605834961, "global_step": 388593, "epoch": 2313} {"train_loss": -10.581660270690918, "global_step": 388594, "epoch": 2313} {"train_loss": -10.872060775756836, "global_step": 388595, "epoch": 2313} {"train_loss": -11.389971733093262, "global_step": 388596, "epoch": 2313} {"train_loss": -10.802667617797852, "global_step": 388597, "epoch": 2313} {"train_loss": -12.32083511352539, "global_step": 388598, "epoch": 2313} {"train_loss": -11.674203872680664, "global_step": 388599, "epoch": 2313} {"train_loss": -11.430493354797363, "global_step": 388600, "epoch": 2313} {"train_loss": -11.685016632080078, "global_step": 388601, "epoch": 2313} {"train_loss": -11.536447525024414, "global_step": 388602, "epoch": 2313} {"train_loss": -12.335359573364258, "global_step": 388603, "epoch": 2313} {"train_loss": -11.930180549621582, "global_step": 388604, "epoch": 2313} {"train_loss": -11.94173526763916, "global_step": 388605, "epoch": 2313} {"train_loss": -12.235417366027832, "global_step": 388606, "epoch": 2313} {"train_loss": -11.521334648132324, "global_step": 388607, "epoch": 2313} {"train_loss": -11.97094440460205, "global_step": 388608, "epoch": 2313} {"train_loss": -12.133295059204102, "global_step": 388609, "epoch": 2313} {"train_loss": -12.356721878051758, "global_step": 388610, "epoch": 2313} {"train_loss": -12.354364395141602, "global_step": 388611, "epoch": 2313} {"train_loss": -12.295173645019531, "global_step": 388612, "epoch": 2313} {"train_loss": -12.019615173339844, "global_step": 388613, "epoch": 2313} {"train_loss": -12.185083389282227, "global_step": 388614, "epoch": 2313} {"train_loss": -12.36941146850586, "global_step": 388615, "epoch": 2313} {"train_loss": -11.970308303833008, "global_step": 388616, "epoch": 2313} {"train_loss": -12.294282913208008, "global_step": 388617, "epoch": 2313} {"train_loss": -12.029622077941895, "global_step": 388618, "epoch": 2313} {"train_loss": -12.345573425292969, "global_step": 388619, "epoch": 2313} {"train_loss": -12.107866287231445, "global_step": 388620, "epoch": 2313} {"train_loss": -11.603535652160645, "global_step": 388621, "epoch": 2313} {"train_loss": -12.082534790039062, "global_step": 388622, "epoch": 2313} {"train_loss": -12.17866325378418, "global_step": 388623, "epoch": 2313} {"train_loss": -11.36946964263916, "global_step": 388624, "epoch": 2313} {"train_loss": -12.291617393493652, "global_step": 388625, "epoch": 2313} {"train_loss": -11.699249267578125, "global_step": 388626, "epoch": 2313} {"train_loss": -11.686159133911133, "global_step": 388627, "epoch": 2313} {"train_loss": -12.312541961669922, "global_step": 388628, "epoch": 2313} {"train_loss": -11.283271789550781, "global_step": 388629, "epoch": 2313} {"train_loss": -12.43617057800293, "global_step": 388630, "epoch": 2313} {"train_loss": -12.085134506225586, "global_step": 388631, "epoch": 2313} {"train_loss": -11.768177032470703, "global_step": 388632, "epoch": 2313} {"train_loss": -12.614997863769531, "global_step": 388633, "epoch": 2313} {"train_loss": -11.937746047973633, "global_step": 388634, "epoch": 2313} {"train_loss": -12.18309211730957, "global_step": 388635, "epoch": 2313} {"train_loss": -12.091769218444824, "global_step": 388636, "epoch": 2313} {"train_loss": -11.721418380737305, "global_step": 388637, "epoch": 2313} {"train_loss": -12.46799087524414, "global_step": 388638, "epoch": 2313} {"train_loss": -11.974053382873535, "global_step": 388639, "epoch": 2313} {"train_loss": -12.151877403259277, "global_step": 388640, "epoch": 2313} {"train_loss": -12.40481948852539, "global_step": 388641, "epoch": 2313} {"train_loss": -12.174301147460938, "global_step": 388642, "epoch": 2313} {"train_loss": -12.480846405029297, "global_step": 388643, "epoch": 2313} {"train_loss": -12.252920150756836, "global_step": 388644, "epoch": 2313} {"train_loss": -12.45730972290039, "global_step": 388645, "epoch": 2313} {"train_loss": -12.364950180053711, "global_step": 388646, "epoch": 2313} {"train_loss": -12.555502891540527, "global_step": 388647, "epoch": 2313} {"train_loss": -12.509441375732422, "global_step": 388648, "epoch": 2313} {"train_loss": -12.58780288696289, "global_step": 388649, "epoch": 2313} {"train_loss": -12.52194595336914, "global_step": 388650, "epoch": 2313} {"train_loss": -12.410942077636719, "global_step": 388651, "epoch": 2313} {"train_loss": -11.958341598510742, "global_step": 388652, "epoch": 2313} {"train_loss": -12.526315689086914, "global_step": 388653, "epoch": 2313} {"train_loss": -11.982538223266602, "global_step": 388654, "epoch": 2313} {"train_loss": -12.441096305847168, "global_step": 388655, "epoch": 2313} {"train_loss": -12.024839401245117, "global_step": 388656, "epoch": 2313} {"train_loss": -12.414408683776855, "global_step": 388657, "epoch": 2313} {"train_loss": -12.70281982421875, "global_step": 388658, "epoch": 2313} {"train_loss": -12.473370552062988, "global_step": 388659, "epoch": 2313} {"train_loss": -12.4571533203125, "global_step": 388660, "epoch": 2313} {"train_loss": -12.41874885559082, "global_step": 388661, "epoch": 2313} {"train_loss": -12.647899627685547, "global_step": 388662, "epoch": 2313} {"train_loss": -12.644659042358398, "global_step": 388663, "epoch": 2313} {"train_loss": -12.156561851501465, "global_step": 388664, "epoch": 2313} {"train_loss": -12.379940032958984, "global_step": 388665, "epoch": 2313} {"train_loss": -12.733602523803711, "global_step": 388666, "epoch": 2313} {"train_loss": -12.19095230102539, "global_step": 388667, "epoch": 2313} {"train_loss": -12.545108795166016, "global_step": 388668, "epoch": 2313} {"train_loss": -12.539202690124512, "global_step": 388669, "epoch": 2313} {"train_loss": -12.598600387573242, "global_step": 388670, "epoch": 2313} {"train_loss": -12.66079330444336, "global_step": 388671, "epoch": 2313} {"train_loss": -12.296899795532227, "global_step": 388672, "epoch": 2313} {"train_loss": -12.40888786315918, "global_step": 388673, "epoch": 2313} {"train_loss": -12.413087844848633, "global_step": 388674, "epoch": 2313} {"train_loss": -11.950319290161133, "global_step": 388675, "epoch": 2313} {"train_loss": -12.430273056030273, "global_step": 388676, "epoch": 2313} {"train_loss": -12.232095718383789, "global_step": 388677, "epoch": 2313} {"train_loss": -12.106061935424805, "global_step": 388678, "epoch": 2313} {"train_loss": -12.813554763793945, "global_step": 388679, "epoch": 2313} {"train_loss": -12.412765502929688, "global_step": 388680, "epoch": 2313} {"train_loss": -12.329099655151367, "global_step": 388681, "epoch": 2313} {"train_loss": -12.694015502929688, "global_step": 388682, "epoch": 2313} {"train_loss": -12.876153945922852, "global_step": 388683, "epoch": 2313} {"train_loss": -12.5780611038208, "global_step": 388684, "epoch": 2313} {"train_loss": -12.557360649108887, "global_step": 388685, "epoch": 2313} {"train_loss": -12.54200553894043, "global_step": 388686, "epoch": 2313} {"train_loss": -12.537869453430176, "global_step": 388687, "epoch": 2313} {"train_loss": -12.001096725463867, "global_step": 388688, "epoch": 2313} {"train_loss": -12.582853317260742, "global_step": 388689, "epoch": 2313} {"train_loss": -11.811857223510742, "global_step": 388690, "epoch": 2313} {"train_loss": -11.736650466918945, "global_step": 388691, "epoch": 2313} {"train_loss": -12.481532096862793, "global_step": 388692, "epoch": 2313} {"train_loss": -11.997520446777344, "global_step": 388693, "epoch": 2313} {"train_loss": -11.879171371459961, "global_step": 388694, "epoch": 2313} {"train_loss": -12.204931259155273, "global_step": 388695, "epoch": 2313} {"train_loss": -12.038360595703125, "global_step": 388696, "epoch": 2313} {"train_loss": -11.551519393920898, "global_step": 388697, "epoch": 2313} {"train_loss": -12.266969680786133, "global_step": 388698, "epoch": 2313} {"train_loss": -11.314142227172852, "global_step": 388699, "epoch": 2313} {"train_loss": -11.942700386047363, "global_step": 388700, "epoch": 2313} {"train_loss": -10.54919719696045, "global_step": 388701, "epoch": 2313} {"train_loss": -12.300381660461426, "global_step": 388702, "epoch": 2313} {"train_loss": -11.584249496459961, "global_step": 388703, "epoch": 2313} {"train_loss": -12.271520614624023, "global_step": 388704, "epoch": 2313} {"train_loss": -10.377392768859863, "global_step": 388705, "epoch": 2313} {"train_loss": -10.57674789428711, "global_step": 388706, "epoch": 2313} {"train_loss": -11.632822036743164, "global_step": 388707, "epoch": 2313} {"train_loss": -10.655584335327148, "global_step": 388708, "epoch": 2313} {"train_loss": -10.967501640319824, "global_step": 388709, "epoch": 2313} {"train_loss": -11.281201362609863, "global_step": 388710, "epoch": 2313} {"train_loss": -10.932079315185547, "global_step": 388711, "epoch": 2313} {"train_loss": -10.629858016967773, "global_step": 388712, "epoch": 2313} {"train_loss": -11.689157485961914, "global_step": 388713, "epoch": 2313} {"train_loss": -10.005514144897461, "global_step": 388714, "epoch": 2313} {"train_loss": -12.377071380615234, "global_step": 388715, "epoch": 2313} {"train_loss": -10.74893569946289, "global_step": 388716, "epoch": 2313} {"train_loss": -11.547487258911133, "global_step": 388717, "epoch": 2313} {"train_loss": -12.041820526123047, "global_step": 388718, "epoch": 2313} {"train_loss": -11.106178283691406, "global_step": 388719, "epoch": 2313} {"train_loss": -11.813756942749023, "global_step": 388720, "epoch": 2313} {"train_loss": -11.670001983642578, "global_step": 388721, "epoch": 2313} {"train_loss": -11.02680492401123, "global_step": 388722, "epoch": 2313} {"train_loss": -11.692533493041992, "global_step": 388723, "epoch": 2313} {"train_loss": -11.634449005126953, "global_step": 388724, "epoch": 2313} {"train_loss": -11.20970344543457, "global_step": 388725, "epoch": 2313} {"train_loss": -11.690320014953613, "global_step": 388726, "epoch": 2313} {"train_loss": -12.113004684448242, "global_step": 388727, "epoch": 2313} {"train_loss": -11.21609115600586, "global_step": 388728, "epoch": 2313} {"train_loss": -11.656167030334473, "global_step": 388729, "epoch": 2313} {"train_loss": -11.551695823669434, "global_step": 388730, "epoch": 2313} {"train_loss": -11.76417064666748, "global_step": 388731, "epoch": 2313} {"train_loss": -12.104713439941406, "global_step": 388732, "epoch": 2313} {"train_loss": -11.774545669555664, "global_step": 388733, "epoch": 2313} {"train_loss": -12.191499710083008, "global_step": 388734, "epoch": 2313} {"train_loss": -11.678913116455078, "global_step": 388735, "epoch": 2313} {"train_loss": -12.140787124633789, "global_step": 388736, "epoch": 2313} {"train_loss": -11.972764015197754, "global_step": 388737, "epoch": 2313} {"train_loss": -12.271255493164062, "global_step": 388738, "epoch": 2313} {"train_loss": -12.107845306396484, "global_step": 388739, "epoch": 2313} {"train_loss": -12.05866527557373, "global_step": 388740, "epoch": 2313} {"train_loss": -12.336711883544922, "global_step": 388741, "epoch": 2313} {"train_loss": -11.66446304321289, "global_step": 388742, "epoch": 2313} {"train_loss": -12.12662410736084, "global_step": 388743, "epoch": 2313} {"train_loss": -12.166755676269531, "global_step": 388744, "epoch": 2313} {"train_loss": -11.768350601196289, "global_step": 388745, "epoch": 2313} {"train_loss": -12.221887588500977, "global_step": 388746, "epoch": 2313} {"train_loss": -11.945123672485352, "global_step": 388747, "epoch": 2313} {"train_loss": -11.97108268737793, "global_step": 388748, "epoch": 2313} {"train_loss": -12.018482208251953, "global_step": 388749, "epoch": 2313} {"train_loss": -12.275360107421875, "global_step": 388750, "epoch": 2313} {"train_loss": -11.906111785343715, "global_step": 388751, "epoch": 2313, "val_loss": 297158.4375} {"train_loss": -12.399198532104492, "global_step": 388752, "epoch": 2314} {"train_loss": -11.699440956115723, "global_step": 388753, "epoch": 2314} {"train_loss": -11.999074935913086, "global_step": 388754, "epoch": 2314} {"train_loss": -12.006305694580078, "global_step": 388755, "epoch": 2314} {"train_loss": -11.761016845703125, "global_step": 388756, "epoch": 2314} {"train_loss": -11.844423294067383, "global_step": 388757, "epoch": 2314} {"train_loss": -11.219528198242188, "global_step": 388758, "epoch": 2314} {"train_loss": -12.001578330993652, "global_step": 388759, "epoch": 2314} {"train_loss": -11.482905387878418, "global_step": 388760, "epoch": 2314} {"train_loss": -12.170713424682617, "global_step": 388761, "epoch": 2314} {"train_loss": -11.24111270904541, "global_step": 388762, "epoch": 2314} {"train_loss": -12.337469100952148, "global_step": 388763, "epoch": 2314} {"train_loss": -11.277050971984863, "global_step": 388764, "epoch": 2314} {"train_loss": -12.140057563781738, "global_step": 388765, "epoch": 2314} {"train_loss": -12.094881057739258, "global_step": 388766, "epoch": 2314} {"train_loss": -12.344005584716797, "global_step": 388767, "epoch": 2314} {"train_loss": -11.86906623840332, "global_step": 388768, "epoch": 2314} {"train_loss": -11.487408638000488, "global_step": 388769, "epoch": 2314} {"train_loss": -12.033685684204102, "global_step": 388770, "epoch": 2314} {"train_loss": -11.564311981201172, "global_step": 388771, "epoch": 2314} {"train_loss": -11.394943237304688, "global_step": 388772, "epoch": 2314} {"train_loss": -11.415823936462402, "global_step": 388773, "epoch": 2314} {"train_loss": -11.474517822265625, "global_step": 388774, "epoch": 2314} {"train_loss": -11.737607955932617, "global_step": 388775, "epoch": 2314} {"train_loss": -11.654043197631836, "global_step": 388776, "epoch": 2314} {"train_loss": -11.600933074951172, "global_step": 388777, "epoch": 2314} {"train_loss": -11.651281356811523, "global_step": 388778, "epoch": 2314} {"train_loss": -11.840761184692383, "global_step": 388779, "epoch": 2314} {"train_loss": -11.890522956848145, "global_step": 388780, "epoch": 2314} {"train_loss": -12.366935729980469, "global_step": 388781, "epoch": 2314} {"train_loss": -11.978466033935547, "global_step": 388782, "epoch": 2314} {"train_loss": -11.945022583007812, "global_step": 388783, "epoch": 2314} {"train_loss": -12.043384552001953, "global_step": 388784, "epoch": 2314} {"train_loss": -12.408820152282715, "global_step": 388785, "epoch": 2314} {"train_loss": -11.960016250610352, "global_step": 388786, "epoch": 2314} {"train_loss": -12.561994552612305, "global_step": 388787, "epoch": 2314} {"train_loss": -12.127260208129883, "global_step": 388788, "epoch": 2314} {"train_loss": -12.315742492675781, "global_step": 388789, "epoch": 2314} {"train_loss": -11.789310455322266, "global_step": 388790, "epoch": 2314} {"train_loss": -12.468329429626465, "global_step": 388791, "epoch": 2314} {"train_loss": -12.248785972595215, "global_step": 388792, "epoch": 2314} {"train_loss": -12.315112113952637, "global_step": 388793, "epoch": 2314} {"train_loss": -12.008434295654297, "global_step": 388794, "epoch": 2314} {"train_loss": -12.35738754272461, "global_step": 388795, "epoch": 2314} {"train_loss": -12.178674697875977, "global_step": 388796, "epoch": 2314} {"train_loss": -12.24732780456543, "global_step": 388797, "epoch": 2314} {"train_loss": -12.470367431640625, "global_step": 388798, "epoch": 2314} {"train_loss": -12.305353164672852, "global_step": 388799, "epoch": 2314} {"train_loss": -12.491830825805664, "global_step": 388800, "epoch": 2314} {"train_loss": -12.504663467407227, "global_step": 388801, "epoch": 2314} {"train_loss": -12.60230827331543, "global_step": 388802, "epoch": 2314} {"train_loss": -12.62369155883789, "global_step": 388803, "epoch": 2314} {"train_loss": -12.596366882324219, "global_step": 388804, "epoch": 2314} {"train_loss": -12.620098114013672, "global_step": 388805, "epoch": 2314} {"train_loss": -12.748921394348145, "global_step": 388806, "epoch": 2314} {"train_loss": -12.357982635498047, "global_step": 388807, "epoch": 2314} {"train_loss": -12.575033187866211, "global_step": 388808, "epoch": 2314} {"train_loss": -12.248329162597656, "global_step": 388809, "epoch": 2314} {"train_loss": -12.680411338806152, "global_step": 388810, "epoch": 2314} {"train_loss": -12.223623275756836, "global_step": 388811, "epoch": 2314} {"train_loss": -12.609500885009766, "global_step": 388812, "epoch": 2314} {"train_loss": -12.411120414733887, "global_step": 388813, "epoch": 2314} {"train_loss": -12.480754852294922, "global_step": 388814, "epoch": 2314} {"train_loss": -12.670110702514648, "global_step": 388815, "epoch": 2314} {"train_loss": -12.408120155334473, "global_step": 388816, "epoch": 2314} {"train_loss": -12.627277374267578, "global_step": 388817, "epoch": 2314} {"train_loss": -12.466894149780273, "global_step": 388818, "epoch": 2314} {"train_loss": -12.202142715454102, "global_step": 388819, "epoch": 2314} {"train_loss": -12.669522285461426, "global_step": 388820, "epoch": 2314} {"train_loss": -12.178464889526367, "global_step": 388821, "epoch": 2314} {"train_loss": -12.427802085876465, "global_step": 388822, "epoch": 2314} {"train_loss": -12.691705703735352, "global_step": 388823, "epoch": 2314} {"train_loss": -12.185853958129883, "global_step": 388824, "epoch": 2314} {"train_loss": -12.304031372070312, "global_step": 388825, "epoch": 2314} {"train_loss": -12.327814102172852, "global_step": 388826, "epoch": 2314} {"train_loss": -12.2887544631958, "global_step": 388827, "epoch": 2314} {"train_loss": -12.38825511932373, "global_step": 388828, "epoch": 2314} {"train_loss": -12.526388168334961, "global_step": 388829, "epoch": 2314} {"train_loss": -12.45226001739502, "global_step": 388830, "epoch": 2314} {"train_loss": -12.38131332397461, "global_step": 388831, "epoch": 2314} {"train_loss": -12.530588150024414, "global_step": 388832, "epoch": 2314} {"train_loss": -12.672887802124023, "global_step": 388833, "epoch": 2314} {"train_loss": -12.426039695739746, "global_step": 388834, "epoch": 2314} {"train_loss": -12.525382995605469, "global_step": 388835, "epoch": 2314} {"train_loss": -12.192633628845215, "global_step": 388836, "epoch": 2314} {"train_loss": -12.573514938354492, "global_step": 388837, "epoch": 2314} {"train_loss": -12.025214195251465, "global_step": 388838, "epoch": 2314} {"train_loss": -12.602090835571289, "global_step": 388839, "epoch": 2314} {"train_loss": -12.218117713928223, "global_step": 388840, "epoch": 2314} {"train_loss": -12.678824424743652, "global_step": 388841, "epoch": 2314} {"train_loss": -12.094242095947266, "global_step": 388842, "epoch": 2314} {"train_loss": -12.473140716552734, "global_step": 388843, "epoch": 2314} {"train_loss": -12.318506240844727, "global_step": 388844, "epoch": 2314} {"train_loss": -12.146723747253418, "global_step": 388845, "epoch": 2314} {"train_loss": -11.95938491821289, "global_step": 388846, "epoch": 2314} {"train_loss": -12.544106483459473, "global_step": 388847, "epoch": 2314} {"train_loss": -11.589941024780273, "global_step": 388848, "epoch": 2314} {"train_loss": -11.736377716064453, "global_step": 388849, "epoch": 2314} {"train_loss": -12.669963836669922, "global_step": 388850, "epoch": 2314} {"train_loss": -12.3507080078125, "global_step": 388851, "epoch": 2314} {"train_loss": -12.404964447021484, "global_step": 388852, "epoch": 2314} {"train_loss": -12.393135070800781, "global_step": 388853, "epoch": 2314} {"train_loss": -12.530502319335938, "global_step": 388854, "epoch": 2314} {"train_loss": -12.32064437866211, "global_step": 388855, "epoch": 2314} {"train_loss": -12.600339889526367, "global_step": 388856, "epoch": 2314} {"train_loss": -12.617012023925781, "global_step": 388857, "epoch": 2314} {"train_loss": -12.633466720581055, "global_step": 388858, "epoch": 2314} {"train_loss": -12.699562072753906, "global_step": 388859, "epoch": 2314} {"train_loss": -12.582026481628418, "global_step": 388860, "epoch": 2314} {"train_loss": -12.658605575561523, "global_step": 388861, "epoch": 2314} {"train_loss": -12.623929977416992, "global_step": 388862, "epoch": 2314} {"train_loss": -12.721231460571289, "global_step": 388863, "epoch": 2314} {"train_loss": -12.605012893676758, "global_step": 388864, "epoch": 2314} {"train_loss": -12.856945991516113, "global_step": 388865, "epoch": 2314} {"train_loss": -12.48077392578125, "global_step": 388866, "epoch": 2314} {"train_loss": -12.775918006896973, "global_step": 388867, "epoch": 2314} {"train_loss": -12.461909294128418, "global_step": 388868, "epoch": 2314} {"train_loss": -12.116086959838867, "global_step": 388869, "epoch": 2314} {"train_loss": -12.203703880310059, "global_step": 388870, "epoch": 2314} {"train_loss": -12.37112808227539, "global_step": 388871, "epoch": 2314} {"train_loss": -12.779393196105957, "global_step": 388872, "epoch": 2314} {"train_loss": -12.307106971740723, "global_step": 388873, "epoch": 2314} {"train_loss": -12.450623512268066, "global_step": 388874, "epoch": 2314} {"train_loss": -12.515727996826172, "global_step": 388875, "epoch": 2314} {"train_loss": -12.763959884643555, "global_step": 388876, "epoch": 2314} {"train_loss": -12.592235565185547, "global_step": 388877, "epoch": 2314} {"train_loss": -12.23135757446289, "global_step": 388878, "epoch": 2314} {"train_loss": -12.560094833374023, "global_step": 388879, "epoch": 2314} {"train_loss": -12.376723289489746, "global_step": 388880, "epoch": 2314} {"train_loss": -12.893686294555664, "global_step": 388881, "epoch": 2314} {"train_loss": -12.471904754638672, "global_step": 388882, "epoch": 2314} {"train_loss": -12.48320198059082, "global_step": 388883, "epoch": 2314} {"train_loss": -12.197698593139648, "global_step": 388884, "epoch": 2314} {"train_loss": -12.303775787353516, "global_step": 388885, "epoch": 2314} {"train_loss": -12.239110946655273, "global_step": 388886, "epoch": 2314} {"train_loss": -10.77833080291748, "global_step": 388887, "epoch": 2314} {"train_loss": -12.627774238586426, "global_step": 388888, "epoch": 2314} {"train_loss": -11.67585563659668, "global_step": 388889, "epoch": 2314} {"train_loss": -11.024940490722656, "global_step": 388890, "epoch": 2314} {"train_loss": -10.877422332763672, "global_step": 388891, "epoch": 2314} {"train_loss": -10.7754545211792, "global_step": 388892, "epoch": 2314} {"train_loss": -11.911548614501953, "global_step": 388893, "epoch": 2314} {"train_loss": -10.384411811828613, "global_step": 388894, "epoch": 2314} {"train_loss": -10.607637405395508, "global_step": 388895, "epoch": 2314} {"train_loss": -12.191072463989258, "global_step": 388896, "epoch": 2314} {"train_loss": -11.374147415161133, "global_step": 388897, "epoch": 2314} {"train_loss": -11.63302993774414, "global_step": 388898, "epoch": 2314} {"train_loss": -11.903635025024414, "global_step": 388899, "epoch": 2314} {"train_loss": -9.693472862243652, "global_step": 388900, "epoch": 2314} {"train_loss": -10.511228561401367, "global_step": 388901, "epoch": 2314} {"train_loss": -10.414106369018555, "global_step": 388902, "epoch": 2314} {"train_loss": -9.514362335205078, "global_step": 388903, "epoch": 2314} {"train_loss": -7.745262622833252, "global_step": 388904, "epoch": 2314} {"train_loss": -7.846625328063965, "global_step": 388905, "epoch": 2314} {"train_loss": -8.432028770446777, "global_step": 388906, "epoch": 2314} {"train_loss": -7.782149314880371, "global_step": 388907, "epoch": 2314} {"train_loss": -8.163591384887695, "global_step": 388908, "epoch": 2314} {"train_loss": -8.962747573852539, "global_step": 388909, "epoch": 2314} {"train_loss": -8.027395248413086, "global_step": 388910, "epoch": 2314} {"train_loss": -8.904098510742188, "global_step": 388911, "epoch": 2314} {"train_loss": -8.406076431274414, "global_step": 388912, "epoch": 2314} {"train_loss": -8.784038543701172, "global_step": 388913, "epoch": 2314} {"train_loss": -8.535964965820312, "global_step": 388914, "epoch": 2314} {"train_loss": -9.010482788085938, "global_step": 388915, "epoch": 2314} {"train_loss": -8.897520065307617, "global_step": 388916, "epoch": 2314} {"train_loss": -9.932731628417969, "global_step": 388917, "epoch": 2314} {"train_loss": -9.790897369384766, "global_step": 388918, "epoch": 2314} {"train_loss": -11.814978704566048, "global_step": 388919, "epoch": 2314, "val_loss": 295074.28125} {"train_loss": -11.318689346313477, "global_step": 388920, "epoch": 2315} {"train_loss": -11.107315063476562, "global_step": 388921, "epoch": 2315} {"train_loss": -10.572761535644531, "global_step": 388922, "epoch": 2315} {"train_loss": -10.115128517150879, "global_step": 388923, "epoch": 2315} {"train_loss": -10.359381675720215, "global_step": 388924, "epoch": 2315} {"train_loss": -10.31166934967041, "global_step": 388925, "epoch": 2315} {"train_loss": -10.857337951660156, "global_step": 388926, "epoch": 2315} {"train_loss": -10.155057907104492, "global_step": 388927, "epoch": 2315} {"train_loss": -11.12914752960205, "global_step": 388928, "epoch": 2315} {"train_loss": -10.591217041015625, "global_step": 388929, "epoch": 2315} {"train_loss": -10.849515914916992, "global_step": 388930, "epoch": 2315} {"train_loss": -10.827228546142578, "global_step": 388931, "epoch": 2315} {"train_loss": -10.631168365478516, "global_step": 388932, "epoch": 2315} {"train_loss": -11.083011627197266, "global_step": 388933, "epoch": 2315} {"train_loss": -10.604180335998535, "global_step": 388934, "epoch": 2315} {"train_loss": -11.138607025146484, "global_step": 388935, "epoch": 2315} {"train_loss": -11.248409271240234, "global_step": 388936, "epoch": 2315} {"train_loss": -11.384288787841797, "global_step": 388937, "epoch": 2315} {"train_loss": -11.313262939453125, "global_step": 388938, "epoch": 2315} {"train_loss": -11.625471115112305, "global_step": 388939, "epoch": 2315} {"train_loss": -11.729220390319824, "global_step": 388940, "epoch": 2315} {"train_loss": -11.60062026977539, "global_step": 388941, "epoch": 2315} {"train_loss": -11.816549301147461, "global_step": 388942, "epoch": 2315} {"train_loss": -11.680590629577637, "global_step": 388943, "epoch": 2315} {"train_loss": -11.823759078979492, "global_step": 388944, "epoch": 2315} {"train_loss": -11.871137619018555, "global_step": 388945, "epoch": 2315} {"train_loss": -12.046207427978516, "global_step": 388946, "epoch": 2315} {"train_loss": -12.167123794555664, "global_step": 388947, "epoch": 2315} {"train_loss": -11.924764633178711, "global_step": 388948, "epoch": 2315} {"train_loss": -11.97005844116211, "global_step": 388949, "epoch": 2315} {"train_loss": -11.841421127319336, "global_step": 388950, "epoch": 2315} {"train_loss": -11.934553146362305, "global_step": 388951, "epoch": 2315} {"train_loss": -12.100987434387207, "global_step": 388952, "epoch": 2315} {"train_loss": -12.038667678833008, "global_step": 388953, "epoch": 2315} {"train_loss": -12.032930374145508, "global_step": 388954, "epoch": 2315} {"train_loss": -12.268928527832031, "global_step": 388955, "epoch": 2315} {"train_loss": -12.061576843261719, "global_step": 388956, "epoch": 2315} {"train_loss": -11.978588104248047, "global_step": 388957, "epoch": 2315} {"train_loss": -12.236257553100586, "global_step": 388958, "epoch": 2315} {"train_loss": -12.171035766601562, "global_step": 388959, "epoch": 2315} {"train_loss": -12.119447708129883, "global_step": 388960, "epoch": 2315} {"train_loss": -12.205584526062012, "global_step": 388961, "epoch": 2315} {"train_loss": -12.195286750793457, "global_step": 388962, "epoch": 2315} {"train_loss": -12.133674621582031, "global_step": 388963, "epoch": 2315} {"train_loss": -12.37936019897461, "global_step": 388964, "epoch": 2315} {"train_loss": -12.228501319885254, "global_step": 388965, "epoch": 2315} {"train_loss": -12.405237197875977, "global_step": 388966, "epoch": 2315} {"train_loss": -12.310967445373535, "global_step": 388967, "epoch": 2315} {"train_loss": -12.29790210723877, "global_step": 388968, "epoch": 2315} {"train_loss": -12.646788597106934, "global_step": 388969, "epoch": 2315} {"train_loss": -12.354793548583984, "global_step": 388970, "epoch": 2315} {"train_loss": -12.254335403442383, "global_step": 388971, "epoch": 2315} {"train_loss": -12.606072425842285, "global_step": 388972, "epoch": 2315} {"train_loss": -12.436976432800293, "global_step": 388973, "epoch": 2315} {"train_loss": -12.285459518432617, "global_step": 388974, "epoch": 2315} {"train_loss": -12.54859733581543, "global_step": 388975, "epoch": 2315} {"train_loss": -12.362329483032227, "global_step": 388976, "epoch": 2315} {"train_loss": -12.630751609802246, "global_step": 388977, "epoch": 2315} {"train_loss": -12.566426277160645, "global_step": 388978, "epoch": 2315} {"train_loss": -12.688457489013672, "global_step": 388979, "epoch": 2315} {"train_loss": -12.717456817626953, "global_step": 388980, "epoch": 2315} {"train_loss": -12.448457717895508, "global_step": 388981, "epoch": 2315} {"train_loss": -12.406679153442383, "global_step": 388982, "epoch": 2315} {"train_loss": -12.754376411437988, "global_step": 388983, "epoch": 2315} {"train_loss": -12.570258140563965, "global_step": 388984, "epoch": 2315} {"train_loss": -12.585941314697266, "global_step": 388985, "epoch": 2315} {"train_loss": -12.655101776123047, "global_step": 388986, "epoch": 2315} {"train_loss": -12.479109764099121, "global_step": 388987, "epoch": 2315} {"train_loss": -12.672761917114258, "global_step": 388988, "epoch": 2315} {"train_loss": -12.782445907592773, "global_step": 388989, "epoch": 2315} {"train_loss": -12.348892211914062, "global_step": 388990, "epoch": 2315} {"train_loss": -12.633604049682617, "global_step": 388991, "epoch": 2315} {"train_loss": -12.603614807128906, "global_step": 388992, "epoch": 2315} {"train_loss": -12.527946472167969, "global_step": 388993, "epoch": 2315} {"train_loss": -12.628877639770508, "global_step": 388994, "epoch": 2315} {"train_loss": -12.72525405883789, "global_step": 388995, "epoch": 2315} {"train_loss": -12.53100299835205, "global_step": 388996, "epoch": 2315} {"train_loss": -12.859718322753906, "global_step": 388997, "epoch": 2315} {"train_loss": -12.546483039855957, "global_step": 388998, "epoch": 2315} {"train_loss": -12.75562858581543, "global_step": 388999, "epoch": 2315} {"train_loss": -12.253684043884277, "global_step": 389000, "epoch": 2315} {"train_loss": -12.537750244140625, "global_step": 389001, "epoch": 2315} {"train_loss": -12.421138763427734, "global_step": 389002, "epoch": 2315} {"train_loss": -12.810221672058105, "global_step": 389003, "epoch": 2315} {"train_loss": -12.672365188598633, "global_step": 389004, "epoch": 2315} {"train_loss": -12.751340866088867, "global_step": 389005, "epoch": 2315} {"train_loss": -12.657294273376465, "global_step": 389006, "epoch": 2315} {"train_loss": -12.663846969604492, "global_step": 389007, "epoch": 2315} {"train_loss": -12.81147575378418, "global_step": 389008, "epoch": 2315} {"train_loss": -12.620870590209961, "global_step": 389009, "epoch": 2315} {"train_loss": -12.610028266906738, "global_step": 389010, "epoch": 2315} {"train_loss": -12.542572021484375, "global_step": 389011, "epoch": 2315} {"train_loss": -12.9064359664917, "global_step": 389012, "epoch": 2315} {"train_loss": -12.687252044677734, "global_step": 389013, "epoch": 2315} {"train_loss": -12.5812406539917, "global_step": 389014, "epoch": 2315} {"train_loss": -12.543588638305664, "global_step": 389015, "epoch": 2315} {"train_loss": -12.73149585723877, "global_step": 389016, "epoch": 2315} {"train_loss": -12.761797904968262, "global_step": 389017, "epoch": 2315} {"train_loss": -12.649581909179688, "global_step": 389018, "epoch": 2315} {"train_loss": -12.663393020629883, "global_step": 389019, "epoch": 2315} {"train_loss": -12.795520782470703, "global_step": 389020, "epoch": 2315} {"train_loss": -12.924480438232422, "global_step": 389021, "epoch": 2315} {"train_loss": -12.635169982910156, "global_step": 389022, "epoch": 2315} {"train_loss": -12.740506172180176, "global_step": 389023, "epoch": 2315} {"train_loss": -12.839478492736816, "global_step": 389024, "epoch": 2315} {"train_loss": -12.873685836791992, "global_step": 389025, "epoch": 2315} {"train_loss": -12.825210571289062, "global_step": 389026, "epoch": 2315} {"train_loss": -12.718022346496582, "global_step": 389027, "epoch": 2315} {"train_loss": -12.664259910583496, "global_step": 389028, "epoch": 2315} {"train_loss": -12.265937805175781, "global_step": 389029, "epoch": 2315} {"train_loss": -12.064327239990234, "global_step": 389030, "epoch": 2315} {"train_loss": -11.284387588500977, "global_step": 389031, "epoch": 2315} {"train_loss": -11.523850440979004, "global_step": 389032, "epoch": 2315} {"train_loss": -12.099967956542969, "global_step": 389033, "epoch": 2315} {"train_loss": -11.497440338134766, "global_step": 389034, "epoch": 2315} {"train_loss": -11.235203742980957, "global_step": 389035, "epoch": 2315} {"train_loss": -11.018431663513184, "global_step": 389036, "epoch": 2315} {"train_loss": -9.996789932250977, "global_step": 389037, "epoch": 2315} {"train_loss": -8.908012390136719, "global_step": 389038, "epoch": 2315} {"train_loss": -8.098830223083496, "global_step": 389039, "epoch": 2315} {"train_loss": -8.25503921508789, "global_step": 389040, "epoch": 2315} {"train_loss": -7.561119079589844, "global_step": 389041, "epoch": 2315} {"train_loss": -7.77143669128418, "global_step": 389042, "epoch": 2315} {"train_loss": -8.530981063842773, "global_step": 389043, "epoch": 2315} {"train_loss": -8.172771453857422, "global_step": 389044, "epoch": 2315} {"train_loss": -8.088665962219238, "global_step": 389045, "epoch": 2315} {"train_loss": -8.181266784667969, "global_step": 389046, "epoch": 2315} {"train_loss": -8.108262062072754, "global_step": 389047, "epoch": 2315} {"train_loss": -8.622605323791504, "global_step": 389048, "epoch": 2315} {"train_loss": -8.742120742797852, "global_step": 389049, "epoch": 2315} {"train_loss": -8.76007080078125, "global_step": 389050, "epoch": 2315} {"train_loss": -9.417436599731445, "global_step": 389051, "epoch": 2315} {"train_loss": -9.691587448120117, "global_step": 389052, "epoch": 2315} {"train_loss": -10.640095710754395, "global_step": 389053, "epoch": 2315} {"train_loss": -10.253458976745605, "global_step": 389054, "epoch": 2315} {"train_loss": -10.850286483764648, "global_step": 389055, "epoch": 2315} {"train_loss": -10.404748916625977, "global_step": 389056, "epoch": 2315} {"train_loss": -10.325263977050781, "global_step": 389057, "epoch": 2315} {"train_loss": -10.599702835083008, "global_step": 389058, "epoch": 2315} {"train_loss": -10.151268005371094, "global_step": 389059, "epoch": 2315} {"train_loss": -11.018623352050781, "global_step": 389060, "epoch": 2315} {"train_loss": -11.162057876586914, "global_step": 389061, "epoch": 2315} {"train_loss": -11.003730773925781, "global_step": 389062, "epoch": 2315} {"train_loss": -11.369243621826172, "global_step": 389063, "epoch": 2315} {"train_loss": -11.134872436523438, "global_step": 389064, "epoch": 2315} {"train_loss": -11.652584075927734, "global_step": 389065, "epoch": 2315} {"train_loss": -11.312776565551758, "global_step": 389066, "epoch": 2315} {"train_loss": -11.331550598144531, "global_step": 389067, "epoch": 2315} {"train_loss": -11.307323455810547, "global_step": 389068, "epoch": 2315} {"train_loss": -11.362959861755371, "global_step": 389069, "epoch": 2315} {"train_loss": -12.213455200195312, "global_step": 389070, "epoch": 2315} {"train_loss": -11.503805160522461, "global_step": 389071, "epoch": 2315} {"train_loss": -12.14368724822998, "global_step": 389072, "epoch": 2315} {"train_loss": -11.5725679397583, "global_step": 389073, "epoch": 2315} {"train_loss": -11.792647361755371, "global_step": 389074, "epoch": 2315} {"train_loss": -11.63230037689209, "global_step": 389075, "epoch": 2315} {"train_loss": -11.797686576843262, "global_step": 389076, "epoch": 2315} {"train_loss": -12.045164108276367, "global_step": 389077, "epoch": 2315} {"train_loss": -12.127182006835938, "global_step": 389078, "epoch": 2315} {"train_loss": -11.498559951782227, "global_step": 389079, "epoch": 2315} {"train_loss": -12.153926849365234, "global_step": 389080, "epoch": 2315} {"train_loss": -11.60633659362793, "global_step": 389081, "epoch": 2315} {"train_loss": -12.167387962341309, "global_step": 389082, "epoch": 2315} {"train_loss": -11.977535247802734, "global_step": 389083, "epoch": 2315} {"train_loss": -12.365543365478516, "global_step": 389084, "epoch": 2315} {"train_loss": -12.136975288391113, "global_step": 389085, "epoch": 2315} {"train_loss": -12.327064514160156, "global_step": 389086, "epoch": 2315} {"train_loss": -11.639445770354499, "global_step": 389087, "epoch": 2315, "val_loss": 296156.40625, "train_action_mse_error": 1.2143456935882568} {"train_loss": -12.000944137573242, "global_step": 389088, "epoch": 2316} {"train_loss": -12.284963607788086, "global_step": 389089, "epoch": 2316} {"train_loss": -11.940618515014648, "global_step": 389090, "epoch": 2316} {"train_loss": -12.383079528808594, "global_step": 389091, "epoch": 2316} {"train_loss": -12.030434608459473, "global_step": 389092, "epoch": 2316} {"train_loss": -12.108992576599121, "global_step": 389093, "epoch": 2316} {"train_loss": -12.10094928741455, "global_step": 389094, "epoch": 2316} {"train_loss": -11.788463592529297, "global_step": 389095, "epoch": 2316} {"train_loss": -12.235912322998047, "global_step": 389096, "epoch": 2316} {"train_loss": -12.230216979980469, "global_step": 389097, "epoch": 2316} {"train_loss": -12.009622573852539, "global_step": 389098, "epoch": 2316} {"train_loss": -12.312694549560547, "global_step": 389099, "epoch": 2316} {"train_loss": -12.012792587280273, "global_step": 389100, "epoch": 2316} {"train_loss": -12.217521667480469, "global_step": 389101, "epoch": 2316} {"train_loss": -12.353790283203125, "global_step": 389102, "epoch": 2316} {"train_loss": -12.362470626831055, "global_step": 389103, "epoch": 2316} {"train_loss": -12.439422607421875, "global_step": 389104, "epoch": 2316} {"train_loss": -12.450316429138184, "global_step": 389105, "epoch": 2316} {"train_loss": -12.32994270324707, "global_step": 389106, "epoch": 2316} {"train_loss": -12.194257736206055, "global_step": 389107, "epoch": 2316} {"train_loss": -12.572996139526367, "global_step": 389108, "epoch": 2316} {"train_loss": -12.123516082763672, "global_step": 389109, "epoch": 2316} {"train_loss": -12.451471328735352, "global_step": 389110, "epoch": 2316} {"train_loss": -11.432437896728516, "global_step": 389111, "epoch": 2316} {"train_loss": -12.27452278137207, "global_step": 389112, "epoch": 2316} {"train_loss": -11.28715705871582, "global_step": 389113, "epoch": 2316} {"train_loss": -12.034175872802734, "global_step": 389114, "epoch": 2316} {"train_loss": -10.867959022521973, "global_step": 389115, "epoch": 2316} {"train_loss": -11.73819351196289, "global_step": 389116, "epoch": 2316} {"train_loss": -10.978083610534668, "global_step": 389117, "epoch": 2316} {"train_loss": -11.619111061096191, "global_step": 389118, "epoch": 2316} {"train_loss": -11.388639450073242, "global_step": 389119, "epoch": 2316} {"train_loss": -10.788036346435547, "global_step": 389120, "epoch": 2316} {"train_loss": -11.418523788452148, "global_step": 389121, "epoch": 2316} {"train_loss": -10.833213806152344, "global_step": 389122, "epoch": 2316} {"train_loss": -12.101670265197754, "global_step": 389123, "epoch": 2316} {"train_loss": -11.616752624511719, "global_step": 389124, "epoch": 2316} {"train_loss": -11.917009353637695, "global_step": 389125, "epoch": 2316} {"train_loss": -11.806892395019531, "global_step": 389126, "epoch": 2316} {"train_loss": -11.441242218017578, "global_step": 389127, "epoch": 2316} {"train_loss": -11.830159187316895, "global_step": 389128, "epoch": 2316} {"train_loss": -9.875468254089355, "global_step": 389129, "epoch": 2316} {"train_loss": -10.862775802612305, "global_step": 389130, "epoch": 2316} {"train_loss": -10.840103149414062, "global_step": 389131, "epoch": 2316} {"train_loss": -11.315954208374023, "global_step": 389132, "epoch": 2316} {"train_loss": -11.156965255737305, "global_step": 389133, "epoch": 2316} {"train_loss": -12.253140449523926, "global_step": 389134, "epoch": 2316} {"train_loss": -11.346776962280273, "global_step": 389135, "epoch": 2316} {"train_loss": -12.185311317443848, "global_step": 389136, "epoch": 2316} {"train_loss": -11.456957817077637, "global_step": 389137, "epoch": 2316} {"train_loss": -11.6162748336792, "global_step": 389138, "epoch": 2316} {"train_loss": -11.752264022827148, "global_step": 389139, "epoch": 2316} {"train_loss": -12.131881713867188, "global_step": 389140, "epoch": 2316} {"train_loss": -11.728382110595703, "global_step": 389141, "epoch": 2316} {"train_loss": -12.013564109802246, "global_step": 389142, "epoch": 2316} {"train_loss": -11.601495742797852, "global_step": 389143, "epoch": 2316} {"train_loss": -12.033834457397461, "global_step": 389144, "epoch": 2316} {"train_loss": -12.268550872802734, "global_step": 389145, "epoch": 2316} {"train_loss": -11.504983901977539, "global_step": 389146, "epoch": 2316} {"train_loss": -11.904672622680664, "global_step": 389147, "epoch": 2316} {"train_loss": -11.930154800415039, "global_step": 389148, "epoch": 2316} {"train_loss": -12.353971481323242, "global_step": 389149, "epoch": 2316} {"train_loss": -12.211483001708984, "global_step": 389150, "epoch": 2316} {"train_loss": -12.41165542602539, "global_step": 389151, "epoch": 2316} {"train_loss": -12.237699508666992, "global_step": 389152, "epoch": 2316} {"train_loss": -12.485321998596191, "global_step": 389153, "epoch": 2316} {"train_loss": -12.288543701171875, "global_step": 389154, "epoch": 2316} {"train_loss": -12.488919258117676, "global_step": 389155, "epoch": 2316} {"train_loss": -12.28652572631836, "global_step": 389156, "epoch": 2316} {"train_loss": -12.483207702636719, "global_step": 389157, "epoch": 2316} {"train_loss": -12.269850730895996, "global_step": 389158, "epoch": 2316} {"train_loss": -12.44845199584961, "global_step": 389159, "epoch": 2316} {"train_loss": -12.212666511535645, "global_step": 389160, "epoch": 2316} {"train_loss": -12.408136367797852, "global_step": 389161, "epoch": 2316} {"train_loss": -12.337075233459473, "global_step": 389162, "epoch": 2316} {"train_loss": -12.432857513427734, "global_step": 389163, "epoch": 2316} {"train_loss": -12.491805076599121, "global_step": 389164, "epoch": 2316} {"train_loss": -12.474930763244629, "global_step": 389165, "epoch": 2316} {"train_loss": -12.396718978881836, "global_step": 389166, "epoch": 2316} {"train_loss": -12.295805931091309, "global_step": 389167, "epoch": 2316} {"train_loss": -12.434379577636719, "global_step": 389168, "epoch": 2316} {"train_loss": -12.080789566040039, "global_step": 389169, "epoch": 2316} {"train_loss": -12.31547737121582, "global_step": 389170, "epoch": 2316} {"train_loss": -12.334519386291504, "global_step": 389171, "epoch": 2316} {"train_loss": -11.832213401794434, "global_step": 389172, "epoch": 2316} {"train_loss": -12.392425537109375, "global_step": 389173, "epoch": 2316} {"train_loss": -12.194112777709961, "global_step": 389174, "epoch": 2316} {"train_loss": -12.382312774658203, "global_step": 389175, "epoch": 2316} {"train_loss": -12.209068298339844, "global_step": 389176, "epoch": 2316} {"train_loss": -12.230661392211914, "global_step": 389177, "epoch": 2316} {"train_loss": -12.497440338134766, "global_step": 389178, "epoch": 2316} {"train_loss": -12.074579238891602, "global_step": 389179, "epoch": 2316} {"train_loss": -12.623823165893555, "global_step": 389180, "epoch": 2316} {"train_loss": -11.992623329162598, "global_step": 389181, "epoch": 2316} {"train_loss": -11.923219680786133, "global_step": 389182, "epoch": 2316} {"train_loss": -11.997723579406738, "global_step": 389183, "epoch": 2316} {"train_loss": -11.979555130004883, "global_step": 389184, "epoch": 2316} {"train_loss": -12.035833358764648, "global_step": 389185, "epoch": 2316} {"train_loss": -12.05959701538086, "global_step": 389186, "epoch": 2316} {"train_loss": -12.152530670166016, "global_step": 389187, "epoch": 2316} {"train_loss": -12.355648040771484, "global_step": 389188, "epoch": 2316} {"train_loss": -12.3643798828125, "global_step": 389189, "epoch": 2316} {"train_loss": -12.237007141113281, "global_step": 389190, "epoch": 2316} {"train_loss": -12.094522476196289, "global_step": 389191, "epoch": 2316} {"train_loss": -12.340371131896973, "global_step": 389192, "epoch": 2316} {"train_loss": -11.915731430053711, "global_step": 389193, "epoch": 2316} {"train_loss": -12.46255874633789, "global_step": 389194, "epoch": 2316} {"train_loss": -12.192314147949219, "global_step": 389195, "epoch": 2316} {"train_loss": -12.251312255859375, "global_step": 389196, "epoch": 2316} {"train_loss": -12.241214752197266, "global_step": 389197, "epoch": 2316} {"train_loss": -12.262357711791992, "global_step": 389198, "epoch": 2316} {"train_loss": -12.378327369689941, "global_step": 389199, "epoch": 2316} {"train_loss": -11.790055274963379, "global_step": 389200, "epoch": 2316} {"train_loss": -11.581439018249512, "global_step": 389201, "epoch": 2316} {"train_loss": -11.786760330200195, "global_step": 389202, "epoch": 2316} {"train_loss": -11.472614288330078, "global_step": 389203, "epoch": 2316} {"train_loss": -12.016387939453125, "global_step": 389204, "epoch": 2316} {"train_loss": -11.613840103149414, "global_step": 389205, "epoch": 2316} {"train_loss": -11.844533920288086, "global_step": 389206, "epoch": 2316} {"train_loss": -12.15777587890625, "global_step": 389207, "epoch": 2316} {"train_loss": -12.009794235229492, "global_step": 389208, "epoch": 2316} {"train_loss": -12.040887832641602, "global_step": 389209, "epoch": 2316} {"train_loss": -11.969379425048828, "global_step": 389210, "epoch": 2316} {"train_loss": -12.425820350646973, "global_step": 389211, "epoch": 2316} {"train_loss": -11.948015213012695, "global_step": 389212, "epoch": 2316} {"train_loss": -12.16340446472168, "global_step": 389213, "epoch": 2316} {"train_loss": -12.07952880859375, "global_step": 389214, "epoch": 2316} {"train_loss": -11.980082511901855, "global_step": 389215, "epoch": 2316} {"train_loss": -12.49111557006836, "global_step": 389216, "epoch": 2316} {"train_loss": -12.347575187683105, "global_step": 389217, "epoch": 2316} {"train_loss": -12.146585464477539, "global_step": 389218, "epoch": 2316} {"train_loss": -12.101198196411133, "global_step": 389219, "epoch": 2316} {"train_loss": -12.578109741210938, "global_step": 389220, "epoch": 2316} {"train_loss": -12.062606811523438, "global_step": 389221, "epoch": 2316} {"train_loss": -12.45325756072998, "global_step": 389222, "epoch": 2316} {"train_loss": -12.07282543182373, "global_step": 389223, "epoch": 2316} {"train_loss": -12.32750129699707, "global_step": 389224, "epoch": 2316} {"train_loss": -12.415088653564453, "global_step": 389225, "epoch": 2316} {"train_loss": -12.049690246582031, "global_step": 389226, "epoch": 2316} {"train_loss": -12.52790641784668, "global_step": 389227, "epoch": 2316} {"train_loss": -12.246478080749512, "global_step": 389228, "epoch": 2316} {"train_loss": -12.387239456176758, "global_step": 389229, "epoch": 2316} {"train_loss": -12.128010749816895, "global_step": 389230, "epoch": 2316} {"train_loss": -12.515727996826172, "global_step": 389231, "epoch": 2316} {"train_loss": -12.514778137207031, "global_step": 389232, "epoch": 2316} {"train_loss": -12.318239212036133, "global_step": 389233, "epoch": 2316} {"train_loss": -12.293737411499023, "global_step": 389234, "epoch": 2316} {"train_loss": -12.158370971679688, "global_step": 389235, "epoch": 2316} {"train_loss": -11.927877426147461, "global_step": 389236, "epoch": 2316} {"train_loss": -12.144559860229492, "global_step": 389237, "epoch": 2316} {"train_loss": -12.357664108276367, "global_step": 389238, "epoch": 2316} {"train_loss": -12.29693603515625, "global_step": 389239, "epoch": 2316} {"train_loss": -12.340603828430176, "global_step": 389240, "epoch": 2316} {"train_loss": -12.516609191894531, "global_step": 389241, "epoch": 2316} {"train_loss": -12.132644653320312, "global_step": 389242, "epoch": 2316} {"train_loss": -12.027124404907227, "global_step": 389243, "epoch": 2316} {"train_loss": -11.98395824432373, "global_step": 389244, "epoch": 2316} {"train_loss": -11.754143714904785, "global_step": 389245, "epoch": 2316} {"train_loss": -12.122472763061523, "global_step": 389246, "epoch": 2316} {"train_loss": -11.990872383117676, "global_step": 389247, "epoch": 2316} {"train_loss": -11.528369903564453, "global_step": 389248, "epoch": 2316} {"train_loss": -11.95502758026123, "global_step": 389249, "epoch": 2316} {"train_loss": -12.242822647094727, "global_step": 389250, "epoch": 2316} {"train_loss": -12.21927261352539, "global_step": 389251, "epoch": 2316} {"train_loss": -12.020833015441895, "global_step": 389252, "epoch": 2316} {"train_loss": -12.265624046325684, "global_step": 389253, "epoch": 2316} {"train_loss": -12.300531387329102, "global_step": 389254, "epoch": 2316} {"train_loss": -12.053586937132335, "global_step": 389255, "epoch": 2316, "val_loss": 298919.21875} {"train_loss": -12.433815002441406, "global_step": 389256, "epoch": 2317} {"train_loss": -12.334426879882812, "global_step": 389257, "epoch": 2317} {"train_loss": -12.378105163574219, "global_step": 389258, "epoch": 2317} {"train_loss": -12.385958671569824, "global_step": 389259, "epoch": 2317} {"train_loss": -12.118547439575195, "global_step": 389260, "epoch": 2317} {"train_loss": -12.34248161315918, "global_step": 389261, "epoch": 2317} {"train_loss": -11.780241012573242, "global_step": 389262, "epoch": 2317} {"train_loss": -11.422746658325195, "global_step": 389263, "epoch": 2317} {"train_loss": -11.821187019348145, "global_step": 389264, "epoch": 2317} {"train_loss": -12.144388198852539, "global_step": 389265, "epoch": 2317} {"train_loss": -11.947352409362793, "global_step": 389266, "epoch": 2317} {"train_loss": -11.586005210876465, "global_step": 389267, "epoch": 2317} {"train_loss": -12.198607444763184, "global_step": 389268, "epoch": 2317} {"train_loss": -11.858097076416016, "global_step": 389269, "epoch": 2317} {"train_loss": -12.523176193237305, "global_step": 389270, "epoch": 2317} {"train_loss": -12.438230514526367, "global_step": 389271, "epoch": 2317} {"train_loss": -12.3759183883667, "global_step": 389272, "epoch": 2317} {"train_loss": -12.398564338684082, "global_step": 389273, "epoch": 2317} {"train_loss": -12.30294418334961, "global_step": 389274, "epoch": 2317} {"train_loss": -12.471126556396484, "global_step": 389275, "epoch": 2317} {"train_loss": -12.444879531860352, "global_step": 389276, "epoch": 2317} {"train_loss": -12.401796340942383, "global_step": 389277, "epoch": 2317} {"train_loss": -12.027885437011719, "global_step": 389278, "epoch": 2317} {"train_loss": -12.278373718261719, "global_step": 389279, "epoch": 2317} {"train_loss": -12.348339080810547, "global_step": 389280, "epoch": 2317} {"train_loss": -12.119939804077148, "global_step": 389281, "epoch": 2317} {"train_loss": -12.085371017456055, "global_step": 389282, "epoch": 2317} {"train_loss": -12.282134056091309, "global_step": 389283, "epoch": 2317} {"train_loss": -12.338048934936523, "global_step": 389284, "epoch": 2317} {"train_loss": -12.515083312988281, "global_step": 389285, "epoch": 2317} {"train_loss": -12.348162651062012, "global_step": 389286, "epoch": 2317} {"train_loss": -12.080110549926758, "global_step": 389287, "epoch": 2317} {"train_loss": -12.341880798339844, "global_step": 389288, "epoch": 2317} {"train_loss": -12.481155395507812, "global_step": 389289, "epoch": 2317} {"train_loss": -12.114529609680176, "global_step": 389290, "epoch": 2317} {"train_loss": -12.354880332946777, "global_step": 389291, "epoch": 2317} {"train_loss": -11.772298812866211, "global_step": 389292, "epoch": 2317} {"train_loss": -11.608898162841797, "global_step": 389293, "epoch": 2317} {"train_loss": -12.060995101928711, "global_step": 389294, "epoch": 2317} {"train_loss": -12.063194274902344, "global_step": 389295, "epoch": 2317} {"train_loss": -12.183353424072266, "global_step": 389296, "epoch": 2317} {"train_loss": -12.18838882446289, "global_step": 389297, "epoch": 2317} {"train_loss": -12.320719718933105, "global_step": 389298, "epoch": 2317} {"train_loss": -11.274219512939453, "global_step": 389299, "epoch": 2317} {"train_loss": -10.397790908813477, "global_step": 389300, "epoch": 2317} {"train_loss": -12.035524368286133, "global_step": 389301, "epoch": 2317} {"train_loss": -11.569211959838867, "global_step": 389302, "epoch": 2317} {"train_loss": -9.718719482421875, "global_step": 389303, "epoch": 2317} {"train_loss": -12.238792419433594, "global_step": 389304, "epoch": 2317} {"train_loss": -11.33951187133789, "global_step": 389305, "epoch": 2317} {"train_loss": -10.588988304138184, "global_step": 389306, "epoch": 2317} {"train_loss": -12.287355422973633, "global_step": 389307, "epoch": 2317} {"train_loss": -11.388104438781738, "global_step": 389308, "epoch": 2317} {"train_loss": -10.179831504821777, "global_step": 389309, "epoch": 2317} {"train_loss": -10.175527572631836, "global_step": 389310, "epoch": 2317} {"train_loss": -11.940292358398438, "global_step": 389311, "epoch": 2317} {"train_loss": -11.09648609161377, "global_step": 389312, "epoch": 2317} {"train_loss": -9.760753631591797, "global_step": 389313, "epoch": 2317} {"train_loss": -10.101428031921387, "global_step": 389314, "epoch": 2317} {"train_loss": -10.0509033203125, "global_step": 389315, "epoch": 2317} {"train_loss": -10.076964378356934, "global_step": 389316, "epoch": 2317} {"train_loss": -10.558473587036133, "global_step": 389317, "epoch": 2317} {"train_loss": -10.708452224731445, "global_step": 389318, "epoch": 2317} {"train_loss": -9.094815254211426, "global_step": 389319, "epoch": 2317} {"train_loss": -10.686169624328613, "global_step": 389320, "epoch": 2317} {"train_loss": -9.845832824707031, "global_step": 389321, "epoch": 2317} {"train_loss": -11.153308868408203, "global_step": 389322, "epoch": 2317} {"train_loss": -10.214668273925781, "global_step": 389323, "epoch": 2317} {"train_loss": -10.01171875, "global_step": 389324, "epoch": 2317} {"train_loss": -11.01137924194336, "global_step": 389325, "epoch": 2317} {"train_loss": -10.686023712158203, "global_step": 389326, "epoch": 2317} {"train_loss": -11.473893165588379, "global_step": 389327, "epoch": 2317} {"train_loss": -10.997247695922852, "global_step": 389328, "epoch": 2317} {"train_loss": -12.041296005249023, "global_step": 389329, "epoch": 2317} {"train_loss": -11.653194427490234, "global_step": 389330, "epoch": 2317} {"train_loss": -12.326964378356934, "global_step": 389331, "epoch": 2317} {"train_loss": -11.54572868347168, "global_step": 389332, "epoch": 2317} {"train_loss": -12.194647789001465, "global_step": 389333, "epoch": 2317} {"train_loss": -11.83989143371582, "global_step": 389334, "epoch": 2317} {"train_loss": -11.697488784790039, "global_step": 389335, "epoch": 2317} {"train_loss": -11.943713188171387, "global_step": 389336, "epoch": 2317} {"train_loss": -12.006107330322266, "global_step": 389337, "epoch": 2317} {"train_loss": -11.833931922912598, "global_step": 389338, "epoch": 2317} {"train_loss": -12.185789108276367, "global_step": 389339, "epoch": 2317} {"train_loss": -11.674160957336426, "global_step": 389340, "epoch": 2317} {"train_loss": -11.89706802368164, "global_step": 389341, "epoch": 2317} {"train_loss": -12.30186653137207, "global_step": 389342, "epoch": 2317} {"train_loss": -11.973247528076172, "global_step": 389343, "epoch": 2317} {"train_loss": -12.055907249450684, "global_step": 389344, "epoch": 2317} {"train_loss": -11.857131004333496, "global_step": 389345, "epoch": 2317} {"train_loss": -11.720949172973633, "global_step": 389346, "epoch": 2317} {"train_loss": -12.163623809814453, "global_step": 389347, "epoch": 2317} {"train_loss": -11.73023796081543, "global_step": 389348, "epoch": 2317} {"train_loss": -12.052734375, "global_step": 389349, "epoch": 2317} {"train_loss": -12.116901397705078, "global_step": 389350, "epoch": 2317} {"train_loss": -11.763982772827148, "global_step": 389351, "epoch": 2317} {"train_loss": -11.96908950805664, "global_step": 389352, "epoch": 2317} {"train_loss": -11.812763214111328, "global_step": 389353, "epoch": 2317} {"train_loss": -11.974912643432617, "global_step": 389354, "epoch": 2317} {"train_loss": -11.501901626586914, "global_step": 389355, "epoch": 2317} {"train_loss": -12.092578887939453, "global_step": 389356, "epoch": 2317} {"train_loss": -11.985483169555664, "global_step": 389357, "epoch": 2317} {"train_loss": -12.146722793579102, "global_step": 389358, "epoch": 2317} {"train_loss": -12.007566452026367, "global_step": 389359, "epoch": 2317} {"train_loss": -12.042610168457031, "global_step": 389360, "epoch": 2317} {"train_loss": -12.367290496826172, "global_step": 389361, "epoch": 2317} {"train_loss": -12.317584991455078, "global_step": 389362, "epoch": 2317} {"train_loss": -12.006172180175781, "global_step": 389363, "epoch": 2317} {"train_loss": -12.26380729675293, "global_step": 389364, "epoch": 2317} {"train_loss": -11.961718559265137, "global_step": 389365, "epoch": 2317} {"train_loss": -12.063645362854004, "global_step": 389366, "epoch": 2317} {"train_loss": -11.997148513793945, "global_step": 389367, "epoch": 2317} {"train_loss": -11.663718223571777, "global_step": 389368, "epoch": 2317} {"train_loss": -12.329204559326172, "global_step": 389369, "epoch": 2317} {"train_loss": -11.849653244018555, "global_step": 389370, "epoch": 2317} {"train_loss": -11.89200210571289, "global_step": 389371, "epoch": 2317} {"train_loss": -12.09332275390625, "global_step": 389372, "epoch": 2317} {"train_loss": -11.91649055480957, "global_step": 389373, "epoch": 2317} {"train_loss": -12.15634822845459, "global_step": 389374, "epoch": 2317} {"train_loss": -12.011703491210938, "global_step": 389375, "epoch": 2317} {"train_loss": -12.409432411193848, "global_step": 389376, "epoch": 2317} {"train_loss": -11.786613464355469, "global_step": 389377, "epoch": 2317} {"train_loss": -11.694750785827637, "global_step": 389378, "epoch": 2317} {"train_loss": -11.901247024536133, "global_step": 389379, "epoch": 2317} {"train_loss": -11.388702392578125, "global_step": 389380, "epoch": 2317} {"train_loss": -12.046764373779297, "global_step": 389381, "epoch": 2317} {"train_loss": -12.152223587036133, "global_step": 389382, "epoch": 2317} {"train_loss": -11.964794158935547, "global_step": 389383, "epoch": 2317} {"train_loss": -12.249113082885742, "global_step": 389384, "epoch": 2317} {"train_loss": -12.248844146728516, "global_step": 389385, "epoch": 2317} {"train_loss": -12.182741165161133, "global_step": 389386, "epoch": 2317} {"train_loss": -12.126964569091797, "global_step": 389387, "epoch": 2317} {"train_loss": -11.771768569946289, "global_step": 389388, "epoch": 2317} {"train_loss": -12.099717140197754, "global_step": 389389, "epoch": 2317} {"train_loss": -11.961165428161621, "global_step": 389390, "epoch": 2317} {"train_loss": -12.200685501098633, "global_step": 389391, "epoch": 2317} {"train_loss": -12.270082473754883, "global_step": 389392, "epoch": 2317} {"train_loss": -12.44550895690918, "global_step": 389393, "epoch": 2317} {"train_loss": -12.015889167785645, "global_step": 389394, "epoch": 2317} {"train_loss": -12.462667465209961, "global_step": 389395, "epoch": 2317} {"train_loss": -12.03592300415039, "global_step": 389396, "epoch": 2317} {"train_loss": -12.153467178344727, "global_step": 389397, "epoch": 2317} {"train_loss": -12.438854217529297, "global_step": 389398, "epoch": 2317} {"train_loss": -12.398601531982422, "global_step": 389399, "epoch": 2317} {"train_loss": -12.280776023864746, "global_step": 389400, "epoch": 2317} {"train_loss": -12.617475509643555, "global_step": 389401, "epoch": 2317} {"train_loss": -12.135209083557129, "global_step": 389402, "epoch": 2317} {"train_loss": -12.4445219039917, "global_step": 389403, "epoch": 2317} {"train_loss": -12.025588989257812, "global_step": 389404, "epoch": 2317} {"train_loss": -12.483039855957031, "global_step": 389405, "epoch": 2317} {"train_loss": -12.335124969482422, "global_step": 389406, "epoch": 2317} {"train_loss": -12.512572288513184, "global_step": 389407, "epoch": 2317} {"train_loss": -12.600564956665039, "global_step": 389408, "epoch": 2317} {"train_loss": -12.275211334228516, "global_step": 389409, "epoch": 2317} {"train_loss": -12.532894134521484, "global_step": 389410, "epoch": 2317} {"train_loss": -12.583845138549805, "global_step": 389411, "epoch": 2317} {"train_loss": -12.506847381591797, "global_step": 389412, "epoch": 2317} {"train_loss": -12.562795639038086, "global_step": 389413, "epoch": 2317} {"train_loss": -12.736047744750977, "global_step": 389414, "epoch": 2317} {"train_loss": -12.566593170166016, "global_step": 389415, "epoch": 2317} {"train_loss": -12.330589294433594, "global_step": 389416, "epoch": 2317} {"train_loss": -12.790085792541504, "global_step": 389417, "epoch": 2317} {"train_loss": -12.313047409057617, "global_step": 389418, "epoch": 2317} {"train_loss": -12.59396743774414, "global_step": 389419, "epoch": 2317} {"train_loss": -12.228839874267578, "global_step": 389420, "epoch": 2317} {"train_loss": -12.33770751953125, "global_step": 389421, "epoch": 2317} {"train_loss": -12.631875991821289, "global_step": 389422, "epoch": 2317} {"train_loss": -11.895853258314586, "global_step": 389423, "epoch": 2317, "val_loss": 295868.96875} {"train_loss": -12.611769676208496, "global_step": 389424, "epoch": 2318} {"train_loss": -12.41784954071045, "global_step": 389425, "epoch": 2318} {"train_loss": -11.693232536315918, "global_step": 389426, "epoch": 2318} {"train_loss": -12.583686828613281, "global_step": 389427, "epoch": 2318} {"train_loss": -12.027832984924316, "global_step": 389428, "epoch": 2318} {"train_loss": -12.228154182434082, "global_step": 389429, "epoch": 2318} {"train_loss": -12.333412170410156, "global_step": 389430, "epoch": 2318} {"train_loss": -12.250990867614746, "global_step": 389431, "epoch": 2318} {"train_loss": -12.488354682922363, "global_step": 389432, "epoch": 2318} {"train_loss": -12.335227966308594, "global_step": 389433, "epoch": 2318} {"train_loss": -12.40042495727539, "global_step": 389434, "epoch": 2318} {"train_loss": -11.997143745422363, "global_step": 389435, "epoch": 2318} {"train_loss": -12.17056655883789, "global_step": 389436, "epoch": 2318} {"train_loss": -11.166282653808594, "global_step": 389437, "epoch": 2318} {"train_loss": -11.91362190246582, "global_step": 389438, "epoch": 2318} {"train_loss": -12.191131591796875, "global_step": 389439, "epoch": 2318} {"train_loss": -10.820924758911133, "global_step": 389440, "epoch": 2318} {"train_loss": -12.519917488098145, "global_step": 389441, "epoch": 2318} {"train_loss": -11.238635063171387, "global_step": 389442, "epoch": 2318} {"train_loss": -10.817895889282227, "global_step": 389443, "epoch": 2318} {"train_loss": -12.139181137084961, "global_step": 389444, "epoch": 2318} {"train_loss": -10.427454948425293, "global_step": 389445, "epoch": 2318} {"train_loss": -10.41580581665039, "global_step": 389446, "epoch": 2318} {"train_loss": -11.99827766418457, "global_step": 389447, "epoch": 2318} {"train_loss": -10.902875900268555, "global_step": 389448, "epoch": 2318} {"train_loss": -11.786316871643066, "global_step": 389449, "epoch": 2318} {"train_loss": -11.249834060668945, "global_step": 389450, "epoch": 2318} {"train_loss": -11.715669631958008, "global_step": 389451, "epoch": 2318} {"train_loss": -12.22616958618164, "global_step": 389452, "epoch": 2318} {"train_loss": -11.691816329956055, "global_step": 389453, "epoch": 2318} {"train_loss": -12.366514205932617, "global_step": 389454, "epoch": 2318} {"train_loss": -11.760359764099121, "global_step": 389455, "epoch": 2318} {"train_loss": -12.37994384765625, "global_step": 389456, "epoch": 2318} {"train_loss": -12.093132972717285, "global_step": 389457, "epoch": 2318} {"train_loss": -12.269365310668945, "global_step": 389458, "epoch": 2318} {"train_loss": -12.179378509521484, "global_step": 389459, "epoch": 2318} {"train_loss": -12.289382934570312, "global_step": 389460, "epoch": 2318} {"train_loss": -12.488532066345215, "global_step": 389461, "epoch": 2318} {"train_loss": -12.241620063781738, "global_step": 389462, "epoch": 2318} {"train_loss": -12.457977294921875, "global_step": 389463, "epoch": 2318} {"train_loss": -12.048758506774902, "global_step": 389464, "epoch": 2318} {"train_loss": -12.169533729553223, "global_step": 389465, "epoch": 2318} {"train_loss": -11.827999114990234, "global_step": 389466, "epoch": 2318} {"train_loss": -11.732282638549805, "global_step": 389467, "epoch": 2318} {"train_loss": -11.973569869995117, "global_step": 389468, "epoch": 2318} {"train_loss": -11.8921537399292, "global_step": 389469, "epoch": 2318} {"train_loss": -12.130607604980469, "global_step": 389470, "epoch": 2318} {"train_loss": -12.18620777130127, "global_step": 389471, "epoch": 2318} {"train_loss": -12.010553359985352, "global_step": 389472, "epoch": 2318} {"train_loss": -11.879388809204102, "global_step": 389473, "epoch": 2318} {"train_loss": -12.284765243530273, "global_step": 389474, "epoch": 2318} {"train_loss": -11.738964080810547, "global_step": 389475, "epoch": 2318} {"train_loss": -12.316240310668945, "global_step": 389476, "epoch": 2318} {"train_loss": -11.968352317810059, "global_step": 389477, "epoch": 2318} {"train_loss": -12.101139068603516, "global_step": 389478, "epoch": 2318} {"train_loss": -12.530465126037598, "global_step": 389479, "epoch": 2318} {"train_loss": -11.997734069824219, "global_step": 389480, "epoch": 2318} {"train_loss": -12.5311279296875, "global_step": 389481, "epoch": 2318} {"train_loss": -12.040523529052734, "global_step": 389482, "epoch": 2318} {"train_loss": -12.47681713104248, "global_step": 389483, "epoch": 2318} {"train_loss": -12.060816764831543, "global_step": 389484, "epoch": 2318} {"train_loss": -12.527115821838379, "global_step": 389485, "epoch": 2318} {"train_loss": -11.957866668701172, "global_step": 389486, "epoch": 2318} {"train_loss": -12.317938804626465, "global_step": 389487, "epoch": 2318} {"train_loss": -11.327011108398438, "global_step": 389488, "epoch": 2318} {"train_loss": -12.36227798461914, "global_step": 389489, "epoch": 2318} {"train_loss": -11.822321891784668, "global_step": 389490, "epoch": 2318} {"train_loss": -11.876705169677734, "global_step": 389491, "epoch": 2318} {"train_loss": -12.48880386352539, "global_step": 389492, "epoch": 2318} {"train_loss": -11.551589965820312, "global_step": 389493, "epoch": 2318} {"train_loss": -12.429357528686523, "global_step": 389494, "epoch": 2318} {"train_loss": -11.472475051879883, "global_step": 389495, "epoch": 2318} {"train_loss": -11.915780067443848, "global_step": 389496, "epoch": 2318} {"train_loss": -11.997785568237305, "global_step": 389497, "epoch": 2318} {"train_loss": -11.803325653076172, "global_step": 389498, "epoch": 2318} {"train_loss": -11.505205154418945, "global_step": 389499, "epoch": 2318} {"train_loss": -11.326263427734375, "global_step": 389500, "epoch": 2318} {"train_loss": -11.40729808807373, "global_step": 389501, "epoch": 2318} {"train_loss": -11.612602233886719, "global_step": 389502, "epoch": 2318} {"train_loss": -11.420156478881836, "global_step": 389503, "epoch": 2318} {"train_loss": -11.619795799255371, "global_step": 389504, "epoch": 2318} {"train_loss": -11.29047966003418, "global_step": 389505, "epoch": 2318} {"train_loss": -11.502768516540527, "global_step": 389506, "epoch": 2318} {"train_loss": -10.653656005859375, "global_step": 389507, "epoch": 2318} {"train_loss": -11.008771896362305, "global_step": 389508, "epoch": 2318} {"train_loss": -9.935047149658203, "global_step": 389509, "epoch": 2318} {"train_loss": -10.304437637329102, "global_step": 389510, "epoch": 2318} {"train_loss": -10.084559440612793, "global_step": 389511, "epoch": 2318} {"train_loss": -11.389511108398438, "global_step": 389512, "epoch": 2318} {"train_loss": -10.20434856414795, "global_step": 389513, "epoch": 2318} {"train_loss": -11.902850151062012, "global_step": 389514, "epoch": 2318} {"train_loss": -10.396515846252441, "global_step": 389515, "epoch": 2318} {"train_loss": -11.282970428466797, "global_step": 389516, "epoch": 2318} {"train_loss": -11.273527145385742, "global_step": 389517, "epoch": 2318} {"train_loss": -10.952821731567383, "global_step": 389518, "epoch": 2318} {"train_loss": -12.068216323852539, "global_step": 389519, "epoch": 2318} {"train_loss": -11.199674606323242, "global_step": 389520, "epoch": 2318} {"train_loss": -10.899620056152344, "global_step": 389521, "epoch": 2318} {"train_loss": -12.002921104431152, "global_step": 389522, "epoch": 2318} {"train_loss": -10.76179313659668, "global_step": 389523, "epoch": 2318} {"train_loss": -11.516623497009277, "global_step": 389524, "epoch": 2318} {"train_loss": -11.527853965759277, "global_step": 389525, "epoch": 2318} {"train_loss": -11.656829833984375, "global_step": 389526, "epoch": 2318} {"train_loss": -11.697900772094727, "global_step": 389527, "epoch": 2318} {"train_loss": -12.088348388671875, "global_step": 389528, "epoch": 2318} {"train_loss": -11.97528076171875, "global_step": 389529, "epoch": 2318} {"train_loss": -11.921012878417969, "global_step": 389530, "epoch": 2318} {"train_loss": -12.177882194519043, "global_step": 389531, "epoch": 2318} {"train_loss": -11.590248107910156, "global_step": 389532, "epoch": 2318} {"train_loss": -12.075803756713867, "global_step": 389533, "epoch": 2318} {"train_loss": -11.555702209472656, "global_step": 389534, "epoch": 2318} {"train_loss": -11.996110916137695, "global_step": 389535, "epoch": 2318} {"train_loss": -12.040380477905273, "global_step": 389536, "epoch": 2318} {"train_loss": -11.87083625793457, "global_step": 389537, "epoch": 2318} {"train_loss": -12.473402976989746, "global_step": 389538, "epoch": 2318} {"train_loss": -12.086080551147461, "global_step": 389539, "epoch": 2318} {"train_loss": -11.917086601257324, "global_step": 389540, "epoch": 2318} {"train_loss": -12.265649795532227, "global_step": 389541, "epoch": 2318} {"train_loss": -12.036479949951172, "global_step": 389542, "epoch": 2318} {"train_loss": -12.27029800415039, "global_step": 389543, "epoch": 2318} {"train_loss": -12.276656150817871, "global_step": 389544, "epoch": 2318} {"train_loss": -11.976885795593262, "global_step": 389545, "epoch": 2318} {"train_loss": -12.44819450378418, "global_step": 389546, "epoch": 2318} {"train_loss": -12.006067276000977, "global_step": 389547, "epoch": 2318} {"train_loss": -12.190351486206055, "global_step": 389548, "epoch": 2318} {"train_loss": -12.325971603393555, "global_step": 389549, "epoch": 2318} {"train_loss": -12.256734848022461, "global_step": 389550, "epoch": 2318} {"train_loss": -12.339958190917969, "global_step": 389551, "epoch": 2318} {"train_loss": -12.557710647583008, "global_step": 389552, "epoch": 2318} {"train_loss": -12.263188362121582, "global_step": 389553, "epoch": 2318} {"train_loss": -12.468761444091797, "global_step": 389554, "epoch": 2318} {"train_loss": -12.487268447875977, "global_step": 389555, "epoch": 2318} {"train_loss": -12.580456733703613, "global_step": 389556, "epoch": 2318} {"train_loss": -12.585851669311523, "global_step": 389557, "epoch": 2318} {"train_loss": -12.515971183776855, "global_step": 389558, "epoch": 2318} {"train_loss": -12.440149307250977, "global_step": 389559, "epoch": 2318} {"train_loss": -12.193876266479492, "global_step": 389560, "epoch": 2318} {"train_loss": -12.524188995361328, "global_step": 389561, "epoch": 2318} {"train_loss": -12.560286521911621, "global_step": 389562, "epoch": 2318} {"train_loss": -12.612228393554688, "global_step": 389563, "epoch": 2318} {"train_loss": -12.515203475952148, "global_step": 389564, "epoch": 2318} {"train_loss": -12.580694198608398, "global_step": 389565, "epoch": 2318} {"train_loss": -12.335458755493164, "global_step": 389566, "epoch": 2318} {"train_loss": -12.654874801635742, "global_step": 389567, "epoch": 2318} {"train_loss": -12.566546440124512, "global_step": 389568, "epoch": 2318} {"train_loss": -12.349042892456055, "global_step": 389569, "epoch": 2318} {"train_loss": -12.565858840942383, "global_step": 389570, "epoch": 2318} {"train_loss": -12.602408409118652, "global_step": 389571, "epoch": 2318} {"train_loss": -12.759057998657227, "global_step": 389572, "epoch": 2318} {"train_loss": -12.625846862792969, "global_step": 389573, "epoch": 2318} {"train_loss": -12.68449592590332, "global_step": 389574, "epoch": 2318} {"train_loss": -12.541814804077148, "global_step": 389575, "epoch": 2318} {"train_loss": -12.50279426574707, "global_step": 389576, "epoch": 2318} {"train_loss": -12.607736587524414, "global_step": 389577, "epoch": 2318} {"train_loss": -12.546989440917969, "global_step": 389578, "epoch": 2318} {"train_loss": -12.854765892028809, "global_step": 389579, "epoch": 2318} {"train_loss": -12.700552940368652, "global_step": 389580, "epoch": 2318} {"train_loss": -12.604289054870605, "global_step": 389581, "epoch": 2318} {"train_loss": -12.787126541137695, "global_step": 389582, "epoch": 2318} {"train_loss": -12.78646469116211, "global_step": 389583, "epoch": 2318} {"train_loss": -12.65684700012207, "global_step": 389584, "epoch": 2318} {"train_loss": -12.92601203918457, "global_step": 389585, "epoch": 2318} {"train_loss": -12.674561500549316, "global_step": 389586, "epoch": 2318} {"train_loss": -12.59732437133789, "global_step": 389587, "epoch": 2318} {"train_loss": -12.627948760986328, "global_step": 389588, "epoch": 2318} {"train_loss": -12.736884117126465, "global_step": 389589, "epoch": 2318} {"train_loss": -12.504779815673828, "global_step": 389590, "epoch": 2318} {"train_loss": -12.004396682693844, "global_step": 389591, "epoch": 2318, "val_loss": 300036.21875} {"train_loss": -12.768416404724121, "global_step": 389592, "epoch": 2319} {"train_loss": -12.380542755126953, "global_step": 389593, "epoch": 2319} {"train_loss": -12.488602638244629, "global_step": 389594, "epoch": 2319} {"train_loss": -12.549419403076172, "global_step": 389595, "epoch": 2319} {"train_loss": -11.704320907592773, "global_step": 389596, "epoch": 2319} {"train_loss": -12.35879135131836, "global_step": 389597, "epoch": 2319} {"train_loss": -12.553817749023438, "global_step": 389598, "epoch": 2319} {"train_loss": -11.666227340698242, "global_step": 389599, "epoch": 2319} {"train_loss": -11.542037963867188, "global_step": 389600, "epoch": 2319} {"train_loss": -12.14599323272705, "global_step": 389601, "epoch": 2319} {"train_loss": -11.859220504760742, "global_step": 389602, "epoch": 2319} {"train_loss": -11.273964881896973, "global_step": 389603, "epoch": 2319} {"train_loss": -9.98177719116211, "global_step": 389604, "epoch": 2319} {"train_loss": -12.267602920532227, "global_step": 389605, "epoch": 2319} {"train_loss": -10.597475051879883, "global_step": 389606, "epoch": 2319} {"train_loss": -10.724210739135742, "global_step": 389607, "epoch": 2319} {"train_loss": -10.523143768310547, "global_step": 389608, "epoch": 2319} {"train_loss": -10.827888488769531, "global_step": 389609, "epoch": 2319} {"train_loss": -11.401872634887695, "global_step": 389610, "epoch": 2319} {"train_loss": -12.00209903717041, "global_step": 389611, "epoch": 2319} {"train_loss": -10.138108253479004, "global_step": 389612, "epoch": 2319} {"train_loss": -11.482905387878418, "global_step": 389613, "epoch": 2319} {"train_loss": -11.765789985656738, "global_step": 389614, "epoch": 2319} {"train_loss": -11.09134292602539, "global_step": 389615, "epoch": 2319} {"train_loss": -11.322059631347656, "global_step": 389616, "epoch": 2319} {"train_loss": -11.46839427947998, "global_step": 389617, "epoch": 2319} {"train_loss": -10.822126388549805, "global_step": 389618, "epoch": 2319} {"train_loss": -11.458970069885254, "global_step": 389619, "epoch": 2319} {"train_loss": -11.160591125488281, "global_step": 389620, "epoch": 2319} {"train_loss": -11.064915657043457, "global_step": 389621, "epoch": 2319} {"train_loss": -11.896655082702637, "global_step": 389622, "epoch": 2319} {"train_loss": -11.194839477539062, "global_step": 389623, "epoch": 2319} {"train_loss": -10.963488578796387, "global_step": 389624, "epoch": 2319} {"train_loss": -10.10108470916748, "global_step": 389625, "epoch": 2319} {"train_loss": -11.000720977783203, "global_step": 389626, "epoch": 2319} {"train_loss": -11.862446784973145, "global_step": 389627, "epoch": 2319} {"train_loss": -11.094097137451172, "global_step": 389628, "epoch": 2319} {"train_loss": -11.761903762817383, "global_step": 389629, "epoch": 2319} {"train_loss": -11.343284606933594, "global_step": 389630, "epoch": 2319} {"train_loss": -11.680299758911133, "global_step": 389631, "epoch": 2319} {"train_loss": -11.402475357055664, "global_step": 389632, "epoch": 2319} {"train_loss": -11.611000061035156, "global_step": 389633, "epoch": 2319} {"train_loss": -11.555902481079102, "global_step": 389634, "epoch": 2319} {"train_loss": -11.462729454040527, "global_step": 389635, "epoch": 2319} {"train_loss": -12.121393203735352, "global_step": 389636, "epoch": 2319} {"train_loss": -11.781537055969238, "global_step": 389637, "epoch": 2319} {"train_loss": -11.715462684631348, "global_step": 389638, "epoch": 2319} {"train_loss": -11.806753158569336, "global_step": 389639, "epoch": 2319} {"train_loss": -12.030099868774414, "global_step": 389640, "epoch": 2319} {"train_loss": -11.430233001708984, "global_step": 389641, "epoch": 2319} {"train_loss": -11.39365291595459, "global_step": 389642, "epoch": 2319} {"train_loss": -11.873737335205078, "global_step": 389643, "epoch": 2319} {"train_loss": -11.886716842651367, "global_step": 389644, "epoch": 2319} {"train_loss": -11.71317195892334, "global_step": 389645, "epoch": 2319} {"train_loss": -12.055145263671875, "global_step": 389646, "epoch": 2319} {"train_loss": -12.06383991241455, "global_step": 389647, "epoch": 2319} {"train_loss": -11.832356452941895, "global_step": 389648, "epoch": 2319} {"train_loss": -11.589249610900879, "global_step": 389649, "epoch": 2319} {"train_loss": -11.899978637695312, "global_step": 389650, "epoch": 2319} {"train_loss": -12.104759216308594, "global_step": 389651, "epoch": 2319} {"train_loss": -12.270856857299805, "global_step": 389652, "epoch": 2319} {"train_loss": -12.009475708007812, "global_step": 389653, "epoch": 2319} {"train_loss": -12.429047584533691, "global_step": 389654, "epoch": 2319} {"train_loss": -12.372640609741211, "global_step": 389655, "epoch": 2319} {"train_loss": -12.439834594726562, "global_step": 389656, "epoch": 2319} {"train_loss": -12.248997688293457, "global_step": 389657, "epoch": 2319} {"train_loss": -12.402793884277344, "global_step": 389658, "epoch": 2319} {"train_loss": -12.220438957214355, "global_step": 389659, "epoch": 2319} {"train_loss": -12.320907592773438, "global_step": 389660, "epoch": 2319} {"train_loss": -12.4339017868042, "global_step": 389661, "epoch": 2319} {"train_loss": -12.5191650390625, "global_step": 389662, "epoch": 2319} {"train_loss": -12.550814628601074, "global_step": 389663, "epoch": 2319} {"train_loss": -12.417243957519531, "global_step": 389664, "epoch": 2319} {"train_loss": -12.508628845214844, "global_step": 389665, "epoch": 2319} {"train_loss": -12.149163246154785, "global_step": 389666, "epoch": 2319} {"train_loss": -12.520509719848633, "global_step": 389667, "epoch": 2319} {"train_loss": -12.597030639648438, "global_step": 389668, "epoch": 2319} {"train_loss": -12.523526191711426, "global_step": 389669, "epoch": 2319} {"train_loss": -12.436883926391602, "global_step": 389670, "epoch": 2319} {"train_loss": -12.484691619873047, "global_step": 389671, "epoch": 2319} {"train_loss": -12.45673942565918, "global_step": 389672, "epoch": 2319} {"train_loss": -12.329230308532715, "global_step": 389673, "epoch": 2319} {"train_loss": -12.527264595031738, "global_step": 389674, "epoch": 2319} {"train_loss": -12.585725784301758, "global_step": 389675, "epoch": 2319} {"train_loss": -12.466255187988281, "global_step": 389676, "epoch": 2319} {"train_loss": -12.126958847045898, "global_step": 389677, "epoch": 2319} {"train_loss": -12.548811912536621, "global_step": 389678, "epoch": 2319} {"train_loss": -12.518974304199219, "global_step": 389679, "epoch": 2319} {"train_loss": -12.644266128540039, "global_step": 389680, "epoch": 2319} {"train_loss": -12.203634262084961, "global_step": 389681, "epoch": 2319} {"train_loss": -12.493098258972168, "global_step": 389682, "epoch": 2319} {"train_loss": -12.495162963867188, "global_step": 389683, "epoch": 2319} {"train_loss": -12.595998764038086, "global_step": 389684, "epoch": 2319} {"train_loss": -12.19588851928711, "global_step": 389685, "epoch": 2319} {"train_loss": -12.368505477905273, "global_step": 389686, "epoch": 2319} {"train_loss": -12.445977210998535, "global_step": 389687, "epoch": 2319} {"train_loss": -12.682376861572266, "global_step": 389688, "epoch": 2319} {"train_loss": -12.428125381469727, "global_step": 389689, "epoch": 2319} {"train_loss": -12.664426803588867, "global_step": 389690, "epoch": 2319} {"train_loss": -12.79716682434082, "global_step": 389691, "epoch": 2319} {"train_loss": -12.329363822937012, "global_step": 389692, "epoch": 2319} {"train_loss": -12.45873737335205, "global_step": 389693, "epoch": 2319} {"train_loss": -12.51875114440918, "global_step": 389694, "epoch": 2319} {"train_loss": -12.448756217956543, "global_step": 389695, "epoch": 2319} {"train_loss": -12.653305053710938, "global_step": 389696, "epoch": 2319} {"train_loss": -12.41106128692627, "global_step": 389697, "epoch": 2319} {"train_loss": -12.361894607543945, "global_step": 389698, "epoch": 2319} {"train_loss": -12.692070007324219, "global_step": 389699, "epoch": 2319} {"train_loss": -12.6959867477417, "global_step": 389700, "epoch": 2319} {"train_loss": -12.574621200561523, "global_step": 389701, "epoch": 2319} {"train_loss": -12.12204360961914, "global_step": 389702, "epoch": 2319} {"train_loss": -12.502572059631348, "global_step": 389703, "epoch": 2319} {"train_loss": -12.623760223388672, "global_step": 389704, "epoch": 2319} {"train_loss": -12.450647354125977, "global_step": 389705, "epoch": 2319} {"train_loss": -12.532126426696777, "global_step": 389706, "epoch": 2319} {"train_loss": -12.530553817749023, "global_step": 389707, "epoch": 2319} {"train_loss": -12.672435760498047, "global_step": 389708, "epoch": 2319} {"train_loss": -12.79846477508545, "global_step": 389709, "epoch": 2319} {"train_loss": -12.298763275146484, "global_step": 389710, "epoch": 2319} {"train_loss": -12.206148147583008, "global_step": 389711, "epoch": 2319} {"train_loss": -12.739995956420898, "global_step": 389712, "epoch": 2319} {"train_loss": -12.114595413208008, "global_step": 389713, "epoch": 2319} {"train_loss": -11.923107147216797, "global_step": 389714, "epoch": 2319} {"train_loss": -12.482247352600098, "global_step": 389715, "epoch": 2319} {"train_loss": -12.64310073852539, "global_step": 389716, "epoch": 2319} {"train_loss": -11.505499839782715, "global_step": 389717, "epoch": 2319} {"train_loss": -11.193683624267578, "global_step": 389718, "epoch": 2319} {"train_loss": -12.565694808959961, "global_step": 389719, "epoch": 2319} {"train_loss": -11.630773544311523, "global_step": 389720, "epoch": 2319} {"train_loss": -11.331473350524902, "global_step": 389721, "epoch": 2319} {"train_loss": -11.985130310058594, "global_step": 389722, "epoch": 2319} {"train_loss": -10.938530921936035, "global_step": 389723, "epoch": 2319} {"train_loss": -11.652654647827148, "global_step": 389724, "epoch": 2319} {"train_loss": -11.950756072998047, "global_step": 389725, "epoch": 2319} {"train_loss": -10.605681419372559, "global_step": 389726, "epoch": 2319} {"train_loss": -11.965677261352539, "global_step": 389727, "epoch": 2319} {"train_loss": -11.541106224060059, "global_step": 389728, "epoch": 2319} {"train_loss": -10.910310745239258, "global_step": 389729, "epoch": 2319} {"train_loss": -11.348039627075195, "global_step": 389730, "epoch": 2319} {"train_loss": -11.174752235412598, "global_step": 389731, "epoch": 2319} {"train_loss": -11.205236434936523, "global_step": 389732, "epoch": 2319} {"train_loss": -11.084989547729492, "global_step": 389733, "epoch": 2319} {"train_loss": -10.94693374633789, "global_step": 389734, "epoch": 2319} {"train_loss": -11.293191909790039, "global_step": 389735, "epoch": 2319} {"train_loss": -11.32706069946289, "global_step": 389736, "epoch": 2319} {"train_loss": -11.611580848693848, "global_step": 389737, "epoch": 2319} {"train_loss": -12.00610065460205, "global_step": 389738, "epoch": 2319} {"train_loss": -11.613183975219727, "global_step": 389739, "epoch": 2319} {"train_loss": -11.822173118591309, "global_step": 389740, "epoch": 2319} {"train_loss": -11.156471252441406, "global_step": 389741, "epoch": 2319} {"train_loss": -12.079858779907227, "global_step": 389742, "epoch": 2319} {"train_loss": -10.791784286499023, "global_step": 389743, "epoch": 2319} {"train_loss": -11.23457145690918, "global_step": 389744, "epoch": 2319} {"train_loss": -11.454450607299805, "global_step": 389745, "epoch": 2319} {"train_loss": -12.029524803161621, "global_step": 389746, "epoch": 2319} {"train_loss": -11.706320762634277, "global_step": 389747, "epoch": 2319} {"train_loss": -11.718432426452637, "global_step": 389748, "epoch": 2319} {"train_loss": -11.414083480834961, "global_step": 389749, "epoch": 2319} {"train_loss": -11.980463027954102, "global_step": 389750, "epoch": 2319} {"train_loss": -11.396228790283203, "global_step": 389751, "epoch": 2319} {"train_loss": -12.126544952392578, "global_step": 389752, "epoch": 2319} {"train_loss": -12.051770210266113, "global_step": 389753, "epoch": 2319} {"train_loss": -11.771097183227539, "global_step": 389754, "epoch": 2319} {"train_loss": -12.040878295898438, "global_step": 389755, "epoch": 2319} {"train_loss": -11.691596031188965, "global_step": 389756, "epoch": 2319} {"train_loss": -12.034751892089844, "global_step": 389757, "epoch": 2319} {"train_loss": -11.998922348022461, "global_step": 389758, "epoch": 2319} {"train_loss": -11.906652881985618, "global_step": 389759, "epoch": 2319, "val_loss": 300760.40625} {"train_loss": -11.954648971557617, "global_step": 389760, "epoch": 2320} {"train_loss": -11.451622009277344, "global_step": 389761, "epoch": 2320} {"train_loss": -11.960761070251465, "global_step": 389762, "epoch": 2320} {"train_loss": -11.805870056152344, "global_step": 389763, "epoch": 2320} {"train_loss": -11.766237258911133, "global_step": 389764, "epoch": 2320} {"train_loss": -11.49433708190918, "global_step": 389765, "epoch": 2320} {"train_loss": -12.000975608825684, "global_step": 389766, "epoch": 2320} {"train_loss": -12.014842987060547, "global_step": 389767, "epoch": 2320} {"train_loss": -12.073278427124023, "global_step": 389768, "epoch": 2320} {"train_loss": -12.121192932128906, "global_step": 389769, "epoch": 2320} {"train_loss": -12.18716049194336, "global_step": 389770, "epoch": 2320} {"train_loss": -12.310174942016602, "global_step": 389771, "epoch": 2320} {"train_loss": -12.351007461547852, "global_step": 389772, "epoch": 2320} {"train_loss": -12.281736373901367, "global_step": 389773, "epoch": 2320} {"train_loss": -12.048379898071289, "global_step": 389774, "epoch": 2320} {"train_loss": -12.013197898864746, "global_step": 389775, "epoch": 2320} {"train_loss": -12.165779113769531, "global_step": 389776, "epoch": 2320} {"train_loss": -12.095224380493164, "global_step": 389777, "epoch": 2320} {"train_loss": -11.87169075012207, "global_step": 389778, "epoch": 2320} {"train_loss": -11.7465238571167, "global_step": 389779, "epoch": 2320} {"train_loss": -12.367959022521973, "global_step": 389780, "epoch": 2320} {"train_loss": -11.960153579711914, "global_step": 389781, "epoch": 2320} {"train_loss": -11.925725936889648, "global_step": 389782, "epoch": 2320} {"train_loss": -11.956260681152344, "global_step": 389783, "epoch": 2320} {"train_loss": -12.017751693725586, "global_step": 389784, "epoch": 2320} {"train_loss": -12.013986587524414, "global_step": 389785, "epoch": 2320} {"train_loss": -12.231897354125977, "global_step": 389786, "epoch": 2320} {"train_loss": -11.909602165222168, "global_step": 389787, "epoch": 2320} {"train_loss": -11.889631271362305, "global_step": 389788, "epoch": 2320} {"train_loss": -12.359628677368164, "global_step": 389789, "epoch": 2320} {"train_loss": -12.13083267211914, "global_step": 389790, "epoch": 2320} {"train_loss": -12.200092315673828, "global_step": 389791, "epoch": 2320} {"train_loss": -12.405126571655273, "global_step": 389792, "epoch": 2320} {"train_loss": -12.162909507751465, "global_step": 389793, "epoch": 2320} {"train_loss": -12.223987579345703, "global_step": 389794, "epoch": 2320} {"train_loss": -12.264524459838867, "global_step": 389795, "epoch": 2320} {"train_loss": -12.045830726623535, "global_step": 389796, "epoch": 2320} {"train_loss": -12.261608123779297, "global_step": 389797, "epoch": 2320} {"train_loss": -12.117708206176758, "global_step": 389798, "epoch": 2320} {"train_loss": -12.650778770446777, "global_step": 389799, "epoch": 2320} {"train_loss": -12.217479705810547, "global_step": 389800, "epoch": 2320} {"train_loss": -12.250417709350586, "global_step": 389801, "epoch": 2320} {"train_loss": -12.368581771850586, "global_step": 389802, "epoch": 2320} {"train_loss": -12.401495933532715, "global_step": 389803, "epoch": 2320} {"train_loss": -12.541694641113281, "global_step": 389804, "epoch": 2320} {"train_loss": -12.3073091506958, "global_step": 389805, "epoch": 2320} {"train_loss": -12.26336669921875, "global_step": 389806, "epoch": 2320} {"train_loss": -12.532550811767578, "global_step": 389807, "epoch": 2320} {"train_loss": -12.326093673706055, "global_step": 389808, "epoch": 2320} {"train_loss": -12.482626914978027, "global_step": 389809, "epoch": 2320} {"train_loss": -12.42797565460205, "global_step": 389810, "epoch": 2320} {"train_loss": -12.543795585632324, "global_step": 389811, "epoch": 2320} {"train_loss": -12.387687683105469, "global_step": 389812, "epoch": 2320} {"train_loss": -12.131608963012695, "global_step": 389813, "epoch": 2320} {"train_loss": -12.238542556762695, "global_step": 389814, "epoch": 2320} {"train_loss": -12.05709171295166, "global_step": 389815, "epoch": 2320} {"train_loss": -11.06962776184082, "global_step": 389816, "epoch": 2320} {"train_loss": -12.363343238830566, "global_step": 389817, "epoch": 2320} {"train_loss": -11.671552658081055, "global_step": 389818, "epoch": 2320} {"train_loss": -12.217195510864258, "global_step": 389819, "epoch": 2320} {"train_loss": -11.508007049560547, "global_step": 389820, "epoch": 2320} {"train_loss": -11.833986282348633, "global_step": 389821, "epoch": 2320} {"train_loss": -12.110462188720703, "global_step": 389822, "epoch": 2320} {"train_loss": -12.290485382080078, "global_step": 389823, "epoch": 2320} {"train_loss": -10.927261352539062, "global_step": 389824, "epoch": 2320} {"train_loss": -12.543182373046875, "global_step": 389825, "epoch": 2320} {"train_loss": -11.20083236694336, "global_step": 389826, "epoch": 2320} {"train_loss": -11.905885696411133, "global_step": 389827, "epoch": 2320} {"train_loss": -12.01021957397461, "global_step": 389828, "epoch": 2320} {"train_loss": -11.28609848022461, "global_step": 389829, "epoch": 2320} {"train_loss": -11.8017578125, "global_step": 389830, "epoch": 2320} {"train_loss": -12.382368087768555, "global_step": 389831, "epoch": 2320} {"train_loss": -11.323675155639648, "global_step": 389832, "epoch": 2320} {"train_loss": -10.773898124694824, "global_step": 389833, "epoch": 2320} {"train_loss": -12.110738754272461, "global_step": 389834, "epoch": 2320} {"train_loss": -11.20228385925293, "global_step": 389835, "epoch": 2320} {"train_loss": -11.73013687133789, "global_step": 389836, "epoch": 2320} {"train_loss": -11.503049850463867, "global_step": 389837, "epoch": 2320} {"train_loss": -11.650564193725586, "global_step": 389838, "epoch": 2320} {"train_loss": -11.760113716125488, "global_step": 389839, "epoch": 2320} {"train_loss": -12.002338409423828, "global_step": 389840, "epoch": 2320} {"train_loss": -11.417088508605957, "global_step": 389841, "epoch": 2320} {"train_loss": -11.546806335449219, "global_step": 389842, "epoch": 2320} {"train_loss": -11.57335090637207, "global_step": 389843, "epoch": 2320} {"train_loss": -10.888725280761719, "global_step": 389844, "epoch": 2320} {"train_loss": -12.164176940917969, "global_step": 389845, "epoch": 2320} {"train_loss": -11.451475143432617, "global_step": 389846, "epoch": 2320} {"train_loss": -10.310800552368164, "global_step": 389847, "epoch": 2320} {"train_loss": -11.01144790649414, "global_step": 389848, "epoch": 2320} {"train_loss": -10.339423179626465, "global_step": 389849, "epoch": 2320} {"train_loss": -10.26113224029541, "global_step": 389850, "epoch": 2320} {"train_loss": -10.337164878845215, "global_step": 389851, "epoch": 2320} {"train_loss": -11.246870040893555, "global_step": 389852, "epoch": 2320} {"train_loss": -11.146778106689453, "global_step": 389853, "epoch": 2320} {"train_loss": -11.926924705505371, "global_step": 389854, "epoch": 2320} {"train_loss": -10.690936088562012, "global_step": 389855, "epoch": 2320} {"train_loss": -11.523189544677734, "global_step": 389856, "epoch": 2320} {"train_loss": -10.88672924041748, "global_step": 389857, "epoch": 2320} {"train_loss": -11.078099250793457, "global_step": 389858, "epoch": 2320} {"train_loss": -11.677298545837402, "global_step": 389859, "epoch": 2320} {"train_loss": -11.660134315490723, "global_step": 389860, "epoch": 2320} {"train_loss": -11.771073341369629, "global_step": 389861, "epoch": 2320} {"train_loss": -11.95068359375, "global_step": 389862, "epoch": 2320} {"train_loss": -11.349438667297363, "global_step": 389863, "epoch": 2320} {"train_loss": -11.835756301879883, "global_step": 389864, "epoch": 2320} {"train_loss": -11.610225677490234, "global_step": 389865, "epoch": 2320} {"train_loss": -11.532966613769531, "global_step": 389866, "epoch": 2320} {"train_loss": -11.926140785217285, "global_step": 389867, "epoch": 2320} {"train_loss": -11.070962905883789, "global_step": 389868, "epoch": 2320} {"train_loss": -12.047806739807129, "global_step": 389869, "epoch": 2320} {"train_loss": -11.294401168823242, "global_step": 389870, "epoch": 2320} {"train_loss": -11.879194259643555, "global_step": 389871, "epoch": 2320} {"train_loss": -11.773058891296387, "global_step": 389872, "epoch": 2320} {"train_loss": -11.790046691894531, "global_step": 389873, "epoch": 2320} {"train_loss": -11.605592727661133, "global_step": 389874, "epoch": 2320} {"train_loss": -12.084159851074219, "global_step": 389875, "epoch": 2320} {"train_loss": -11.595277786254883, "global_step": 389876, "epoch": 2320} {"train_loss": -12.174617767333984, "global_step": 389877, "epoch": 2320} {"train_loss": -11.440802574157715, "global_step": 389878, "epoch": 2320} {"train_loss": -12.132936477661133, "global_step": 389879, "epoch": 2320} {"train_loss": -11.682026863098145, "global_step": 389880, "epoch": 2320} {"train_loss": -12.151798248291016, "global_step": 389881, "epoch": 2320} {"train_loss": -11.99882698059082, "global_step": 389882, "epoch": 2320} {"train_loss": -12.152490615844727, "global_step": 389883, "epoch": 2320} {"train_loss": -11.595088005065918, "global_step": 389884, "epoch": 2320} {"train_loss": -12.337080001831055, "global_step": 389885, "epoch": 2320} {"train_loss": -11.906004905700684, "global_step": 389886, "epoch": 2320} {"train_loss": -12.285987854003906, "global_step": 389887, "epoch": 2320} {"train_loss": -12.154134750366211, "global_step": 389888, "epoch": 2320} {"train_loss": -12.16943359375, "global_step": 389889, "epoch": 2320} {"train_loss": -12.181807518005371, "global_step": 389890, "epoch": 2320} {"train_loss": -11.967924118041992, "global_step": 389891, "epoch": 2320} {"train_loss": -12.274007797241211, "global_step": 389892, "epoch": 2320} {"train_loss": -12.187665939331055, "global_step": 389893, "epoch": 2320} {"train_loss": -12.12303352355957, "global_step": 389894, "epoch": 2320} {"train_loss": -12.615030288696289, "global_step": 389895, "epoch": 2320} {"train_loss": -12.229103088378906, "global_step": 389896, "epoch": 2320} {"train_loss": -12.539716720581055, "global_step": 389897, "epoch": 2320} {"train_loss": -12.100902557373047, "global_step": 389898, "epoch": 2320} {"train_loss": -12.211507797241211, "global_step": 389899, "epoch": 2320} {"train_loss": -12.262032508850098, "global_step": 389900, "epoch": 2320} {"train_loss": -12.11049747467041, "global_step": 389901, "epoch": 2320} {"train_loss": -12.298542022705078, "global_step": 389902, "epoch": 2320} {"train_loss": -12.21169662475586, "global_step": 389903, "epoch": 2320} {"train_loss": -12.417795181274414, "global_step": 389904, "epoch": 2320} {"train_loss": -12.403063774108887, "global_step": 389905, "epoch": 2320} {"train_loss": -12.343701362609863, "global_step": 389906, "epoch": 2320} {"train_loss": -12.575604438781738, "global_step": 389907, "epoch": 2320} {"train_loss": -12.407353401184082, "global_step": 389908, "epoch": 2320} {"train_loss": -12.51224422454834, "global_step": 389909, "epoch": 2320} {"train_loss": -12.677108764648438, "global_step": 389910, "epoch": 2320} {"train_loss": -12.469257354736328, "global_step": 389911, "epoch": 2320} {"train_loss": -12.709381103515625, "global_step": 389912, "epoch": 2320} {"train_loss": -12.611642837524414, "global_step": 389913, "epoch": 2320} {"train_loss": -12.437997817993164, "global_step": 389914, "epoch": 2320} {"train_loss": -12.685696601867676, "global_step": 389915, "epoch": 2320} {"train_loss": -12.596059799194336, "global_step": 389916, "epoch": 2320} {"train_loss": -12.762304306030273, "global_step": 389917, "epoch": 2320} {"train_loss": -12.828530311584473, "global_step": 389918, "epoch": 2320} {"train_loss": -12.52095890045166, "global_step": 389919, "epoch": 2320} {"train_loss": -12.608855247497559, "global_step": 389920, "epoch": 2320} {"train_loss": -12.36334228515625, "global_step": 389921, "epoch": 2320} {"train_loss": -12.524707794189453, "global_step": 389922, "epoch": 2320} {"train_loss": -12.489593505859375, "global_step": 389923, "epoch": 2320} {"train_loss": -12.646458625793457, "global_step": 389924, "epoch": 2320} {"train_loss": -12.535089492797852, "global_step": 389925, "epoch": 2320} {"train_loss": -12.599964141845703, "global_step": 389926, "epoch": 2320} {"train_loss": -11.97610898812612, "global_step": 389927, "epoch": 2320, "val_loss": 298084.03125, "train_action_mse_error": 1.2155797481536865} {"train_loss": -12.418403625488281, "global_step": 389928, "epoch": 2321} {"train_loss": -12.65541934967041, "global_step": 389929, "epoch": 2321} {"train_loss": -12.664194107055664, "global_step": 389930, "epoch": 2321} {"train_loss": -12.445259094238281, "global_step": 389931, "epoch": 2321} {"train_loss": -12.65603256225586, "global_step": 389932, "epoch": 2321} {"train_loss": -12.679909706115723, "global_step": 389933, "epoch": 2321} {"train_loss": -12.390467643737793, "global_step": 389934, "epoch": 2321} {"train_loss": -12.71410846710205, "global_step": 389935, "epoch": 2321} {"train_loss": -12.267312049865723, "global_step": 389936, "epoch": 2321} {"train_loss": -12.43156623840332, "global_step": 389937, "epoch": 2321} {"train_loss": -12.157268524169922, "global_step": 389938, "epoch": 2321} {"train_loss": -12.520105361938477, "global_step": 389939, "epoch": 2321} {"train_loss": -12.605141639709473, "global_step": 389940, "epoch": 2321} {"train_loss": -11.822235107421875, "global_step": 389941, "epoch": 2321} {"train_loss": -12.21347427368164, "global_step": 389942, "epoch": 2321} {"train_loss": -12.297529220581055, "global_step": 389943, "epoch": 2321} {"train_loss": -12.464426040649414, "global_step": 389944, "epoch": 2321} {"train_loss": -12.265253067016602, "global_step": 389945, "epoch": 2321} {"train_loss": -12.260793685913086, "global_step": 389946, "epoch": 2321} {"train_loss": -12.640681266784668, "global_step": 389947, "epoch": 2321} {"train_loss": -12.352959632873535, "global_step": 389948, "epoch": 2321} {"train_loss": -12.485174179077148, "global_step": 389949, "epoch": 2321} {"train_loss": -12.598970413208008, "global_step": 389950, "epoch": 2321} {"train_loss": -12.155630111694336, "global_step": 389951, "epoch": 2321} {"train_loss": -12.470094680786133, "global_step": 389952, "epoch": 2321} {"train_loss": -12.315410614013672, "global_step": 389953, "epoch": 2321} {"train_loss": -12.439363479614258, "global_step": 389954, "epoch": 2321} {"train_loss": -12.231489181518555, "global_step": 389955, "epoch": 2321} {"train_loss": -12.244073867797852, "global_step": 389956, "epoch": 2321} {"train_loss": -12.155318260192871, "global_step": 389957, "epoch": 2321} {"train_loss": -11.950189590454102, "global_step": 389958, "epoch": 2321} {"train_loss": -12.414228439331055, "global_step": 389959, "epoch": 2321} {"train_loss": -12.377148628234863, "global_step": 389960, "epoch": 2321} {"train_loss": -12.297283172607422, "global_step": 389961, "epoch": 2321} {"train_loss": -12.230917930603027, "global_step": 389962, "epoch": 2321} {"train_loss": -12.134023666381836, "global_step": 389963, "epoch": 2321} {"train_loss": -12.242189407348633, "global_step": 389964, "epoch": 2321} {"train_loss": -12.033519744873047, "global_step": 389965, "epoch": 2321} {"train_loss": -11.683045387268066, "global_step": 389966, "epoch": 2321} {"train_loss": -10.979349136352539, "global_step": 389967, "epoch": 2321} {"train_loss": -11.950742721557617, "global_step": 389968, "epoch": 2321} {"train_loss": -11.358091354370117, "global_step": 389969, "epoch": 2321} {"train_loss": -12.290578842163086, "global_step": 389970, "epoch": 2321} {"train_loss": -11.671825408935547, "global_step": 389971, "epoch": 2321} {"train_loss": -12.290854454040527, "global_step": 389972, "epoch": 2321} {"train_loss": -11.567374229431152, "global_step": 389973, "epoch": 2321} {"train_loss": -11.663926124572754, "global_step": 389974, "epoch": 2321} {"train_loss": -11.697708129882812, "global_step": 389975, "epoch": 2321} {"train_loss": -11.967269897460938, "global_step": 389976, "epoch": 2321} {"train_loss": -10.831899642944336, "global_step": 389977, "epoch": 2321} {"train_loss": -11.852439880371094, "global_step": 389978, "epoch": 2321} {"train_loss": -11.026810646057129, "global_step": 389979, "epoch": 2321} {"train_loss": -11.224390983581543, "global_step": 389980, "epoch": 2321} {"train_loss": -10.944801330566406, "global_step": 389981, "epoch": 2321} {"train_loss": -11.77419662475586, "global_step": 389982, "epoch": 2321} {"train_loss": -11.011672019958496, "global_step": 389983, "epoch": 2321} {"train_loss": -10.796320915222168, "global_step": 389984, "epoch": 2321} {"train_loss": -8.96219253540039, "global_step": 389985, "epoch": 2321} {"train_loss": -9.407365798950195, "global_step": 389986, "epoch": 2321} {"train_loss": -10.156755447387695, "global_step": 389987, "epoch": 2321} {"train_loss": -11.281673431396484, "global_step": 389988, "epoch": 2321} {"train_loss": -10.418703079223633, "global_step": 389989, "epoch": 2321} {"train_loss": -10.990364074707031, "global_step": 389990, "epoch": 2321} {"train_loss": -11.824609756469727, "global_step": 389991, "epoch": 2321} {"train_loss": -11.347155570983887, "global_step": 389992, "epoch": 2321} {"train_loss": -11.771621704101562, "global_step": 389993, "epoch": 2321} {"train_loss": -11.729330062866211, "global_step": 389994, "epoch": 2321} {"train_loss": -11.481107711791992, "global_step": 389995, "epoch": 2321} {"train_loss": -11.87248706817627, "global_step": 389996, "epoch": 2321} {"train_loss": -12.064800262451172, "global_step": 389997, "epoch": 2321} {"train_loss": -11.960466384887695, "global_step": 389998, "epoch": 2321} {"train_loss": -11.898752212524414, "global_step": 389999, "epoch": 2321} {"train_loss": -11.686914443969727, "global_step": 390000, "epoch": 2321} {"train_loss": -11.952398300170898, "global_step": 390001, "epoch": 2321} {"train_loss": -11.87478256225586, "global_step": 390002, "epoch": 2321} {"train_loss": -11.690080642700195, "global_step": 390003, "epoch": 2321} {"train_loss": -12.244943618774414, "global_step": 390004, "epoch": 2321} {"train_loss": -11.910575866699219, "global_step": 390005, "epoch": 2321} {"train_loss": -11.97693920135498, "global_step": 390006, "epoch": 2321} {"train_loss": -12.151189804077148, "global_step": 390007, "epoch": 2321} {"train_loss": -12.182828903198242, "global_step": 390008, "epoch": 2321} {"train_loss": -12.322184562683105, "global_step": 390009, "epoch": 2321} {"train_loss": -11.619439125061035, "global_step": 390010, "epoch": 2321} {"train_loss": -12.14312744140625, "global_step": 390011, "epoch": 2321} {"train_loss": -11.990459442138672, "global_step": 390012, "epoch": 2321} {"train_loss": -12.04460620880127, "global_step": 390013, "epoch": 2321} {"train_loss": -12.152336120605469, "global_step": 390014, "epoch": 2321} {"train_loss": -12.238508224487305, "global_step": 390015, "epoch": 2321} {"train_loss": -12.069077491760254, "global_step": 390016, "epoch": 2321} {"train_loss": -12.116850852966309, "global_step": 390017, "epoch": 2321} {"train_loss": -12.39234733581543, "global_step": 390018, "epoch": 2321} {"train_loss": -12.326576232910156, "global_step": 390019, "epoch": 2321} {"train_loss": -12.120786666870117, "global_step": 390020, "epoch": 2321} {"train_loss": -11.94698429107666, "global_step": 390021, "epoch": 2321} {"train_loss": -12.316085815429688, "global_step": 390022, "epoch": 2321} {"train_loss": -12.204744338989258, "global_step": 390023, "epoch": 2321} {"train_loss": -12.124284744262695, "global_step": 390024, "epoch": 2321} {"train_loss": -12.301980972290039, "global_step": 390025, "epoch": 2321} {"train_loss": -12.366706848144531, "global_step": 390026, "epoch": 2321} {"train_loss": -12.214618682861328, "global_step": 390027, "epoch": 2321} {"train_loss": -12.303528785705566, "global_step": 390028, "epoch": 2321} {"train_loss": -12.334195137023926, "global_step": 390029, "epoch": 2321} {"train_loss": -12.41860580444336, "global_step": 390030, "epoch": 2321} {"train_loss": -12.151707649230957, "global_step": 390031, "epoch": 2321} {"train_loss": -12.348916053771973, "global_step": 390032, "epoch": 2321} {"train_loss": -12.41646957397461, "global_step": 390033, "epoch": 2321} {"train_loss": -12.356109619140625, "global_step": 390034, "epoch": 2321} {"train_loss": -12.839495658874512, "global_step": 390035, "epoch": 2321} {"train_loss": -12.170355796813965, "global_step": 390036, "epoch": 2321} {"train_loss": -12.612467765808105, "global_step": 390037, "epoch": 2321} {"train_loss": -12.513657569885254, "global_step": 390038, "epoch": 2321} {"train_loss": -12.43120002746582, "global_step": 390039, "epoch": 2321} {"train_loss": -12.567142486572266, "global_step": 390040, "epoch": 2321} {"train_loss": -12.52906608581543, "global_step": 390041, "epoch": 2321} {"train_loss": -12.523979187011719, "global_step": 390042, "epoch": 2321} {"train_loss": -12.263729095458984, "global_step": 390043, "epoch": 2321} {"train_loss": -12.545614242553711, "global_step": 390044, "epoch": 2321} {"train_loss": -12.522865295410156, "global_step": 390045, "epoch": 2321} {"train_loss": -12.581605911254883, "global_step": 390046, "epoch": 2321} {"train_loss": -12.736156463623047, "global_step": 390047, "epoch": 2321} {"train_loss": -12.61215877532959, "global_step": 390048, "epoch": 2321} {"train_loss": -12.728384017944336, "global_step": 390049, "epoch": 2321} {"train_loss": -12.719621658325195, "global_step": 390050, "epoch": 2321} {"train_loss": -12.717733383178711, "global_step": 390051, "epoch": 2321} {"train_loss": -12.694355010986328, "global_step": 390052, "epoch": 2321} {"train_loss": -12.57296085357666, "global_step": 390053, "epoch": 2321} {"train_loss": -12.757705688476562, "global_step": 390054, "epoch": 2321} {"train_loss": -12.573782920837402, "global_step": 390055, "epoch": 2321} {"train_loss": -12.676231384277344, "global_step": 390056, "epoch": 2321} {"train_loss": -12.497554779052734, "global_step": 390057, "epoch": 2321} {"train_loss": -12.572124481201172, "global_step": 390058, "epoch": 2321} {"train_loss": -11.93111515045166, "global_step": 390059, "epoch": 2321} {"train_loss": -12.262996673583984, "global_step": 390060, "epoch": 2321} {"train_loss": -11.56257438659668, "global_step": 390061, "epoch": 2321} {"train_loss": -11.69426155090332, "global_step": 390062, "epoch": 2321} {"train_loss": -12.249533653259277, "global_step": 390063, "epoch": 2321} {"train_loss": -11.897923469543457, "global_step": 390064, "epoch": 2321} {"train_loss": -12.798205375671387, "global_step": 390065, "epoch": 2321} {"train_loss": -12.151639938354492, "global_step": 390066, "epoch": 2321} {"train_loss": -12.461724281311035, "global_step": 390067, "epoch": 2321} {"train_loss": -12.33753776550293, "global_step": 390068, "epoch": 2321} {"train_loss": -11.873245239257812, "global_step": 390069, "epoch": 2321} {"train_loss": -11.78386402130127, "global_step": 390070, "epoch": 2321} {"train_loss": -12.38540267944336, "global_step": 390071, "epoch": 2321} {"train_loss": -12.10494327545166, "global_step": 390072, "epoch": 2321} {"train_loss": -12.147624969482422, "global_step": 390073, "epoch": 2321} {"train_loss": -12.60352611541748, "global_step": 390074, "epoch": 2321} {"train_loss": -12.203460693359375, "global_step": 390075, "epoch": 2321} {"train_loss": -12.320981979370117, "global_step": 390076, "epoch": 2321} {"train_loss": -12.420949935913086, "global_step": 390077, "epoch": 2321} {"train_loss": -11.97562313079834, "global_step": 390078, "epoch": 2321} {"train_loss": -12.513276100158691, "global_step": 390079, "epoch": 2321} {"train_loss": -12.265739440917969, "global_step": 390080, "epoch": 2321} {"train_loss": -11.70541000366211, "global_step": 390081, "epoch": 2321} {"train_loss": -12.590636253356934, "global_step": 390082, "epoch": 2321} {"train_loss": -12.136581420898438, "global_step": 390083, "epoch": 2321} {"train_loss": -11.574727058410645, "global_step": 390084, "epoch": 2321} {"train_loss": -12.218162536621094, "global_step": 390085, "epoch": 2321} {"train_loss": -11.933977127075195, "global_step": 390086, "epoch": 2321} {"train_loss": -10.9058837890625, "global_step": 390087, "epoch": 2321} {"train_loss": -12.104081153869629, "global_step": 390088, "epoch": 2321} {"train_loss": -11.881441116333008, "global_step": 390089, "epoch": 2321} {"train_loss": -11.660333633422852, "global_step": 390090, "epoch": 2321} {"train_loss": -11.93004322052002, "global_step": 390091, "epoch": 2321} {"train_loss": -11.401750564575195, "global_step": 390092, "epoch": 2321} {"train_loss": -12.052260398864746, "global_step": 390093, "epoch": 2321} {"train_loss": -11.844329833984375, "global_step": 390094, "epoch": 2321} {"train_loss": -12.074607514199757, "global_step": 390095, "epoch": 2321, "val_loss": 299495.40625} {"train_loss": -11.327859878540039, "global_step": 390096, "epoch": 2322} {"train_loss": -11.64808464050293, "global_step": 390097, "epoch": 2322} {"train_loss": -10.860907554626465, "global_step": 390098, "epoch": 2322} {"train_loss": -12.301229476928711, "global_step": 390099, "epoch": 2322} {"train_loss": -10.656607627868652, "global_step": 390100, "epoch": 2322} {"train_loss": -12.147051811218262, "global_step": 390101, "epoch": 2322} {"train_loss": -11.14610767364502, "global_step": 390102, "epoch": 2322} {"train_loss": -11.957088470458984, "global_step": 390103, "epoch": 2322} {"train_loss": -11.138782501220703, "global_step": 390104, "epoch": 2322} {"train_loss": -11.554374694824219, "global_step": 390105, "epoch": 2322} {"train_loss": -11.277974128723145, "global_step": 390106, "epoch": 2322} {"train_loss": -10.805013656616211, "global_step": 390107, "epoch": 2322} {"train_loss": -11.80870246887207, "global_step": 390108, "epoch": 2322} {"train_loss": -11.489148139953613, "global_step": 390109, "epoch": 2322} {"train_loss": -11.983356475830078, "global_step": 390110, "epoch": 2322} {"train_loss": -11.343465805053711, "global_step": 390111, "epoch": 2322} {"train_loss": -12.022965431213379, "global_step": 390112, "epoch": 2322} {"train_loss": -12.283294677734375, "global_step": 390113, "epoch": 2322} {"train_loss": -11.923256874084473, "global_step": 390114, "epoch": 2322} {"train_loss": -11.394932746887207, "global_step": 390115, "epoch": 2322} {"train_loss": -12.422547340393066, "global_step": 390116, "epoch": 2322} {"train_loss": -11.532655715942383, "global_step": 390117, "epoch": 2322} {"train_loss": -12.025790214538574, "global_step": 390118, "epoch": 2322} {"train_loss": -11.886428833007812, "global_step": 390119, "epoch": 2322} {"train_loss": -12.500402450561523, "global_step": 390120, "epoch": 2322} {"train_loss": -11.76382827758789, "global_step": 390121, "epoch": 2322} {"train_loss": -11.962583541870117, "global_step": 390122, "epoch": 2322} {"train_loss": -11.787075996398926, "global_step": 390123, "epoch": 2322} {"train_loss": -11.6486234664917, "global_step": 390124, "epoch": 2322} {"train_loss": -11.507128715515137, "global_step": 390125, "epoch": 2322} {"train_loss": -11.970909118652344, "global_step": 390126, "epoch": 2322} {"train_loss": -10.787083625793457, "global_step": 390127, "epoch": 2322} {"train_loss": -11.675704956054688, "global_step": 390128, "epoch": 2322} {"train_loss": -10.177671432495117, "global_step": 390129, "epoch": 2322} {"train_loss": -11.018091201782227, "global_step": 390130, "epoch": 2322} {"train_loss": -10.408879280090332, "global_step": 390131, "epoch": 2322} {"train_loss": -12.234230995178223, "global_step": 390132, "epoch": 2322} {"train_loss": -10.037117004394531, "global_step": 390133, "epoch": 2322} {"train_loss": -11.13383674621582, "global_step": 390134, "epoch": 2322} {"train_loss": -10.83192253112793, "global_step": 390135, "epoch": 2322} {"train_loss": -10.766576766967773, "global_step": 390136, "epoch": 2322} {"train_loss": -11.643112182617188, "global_step": 390137, "epoch": 2322} {"train_loss": -10.592605590820312, "global_step": 390138, "epoch": 2322} {"train_loss": -11.74764633178711, "global_step": 390139, "epoch": 2322} {"train_loss": -10.622262954711914, "global_step": 390140, "epoch": 2322} {"train_loss": -11.41939640045166, "global_step": 390141, "epoch": 2322} {"train_loss": -10.943422317504883, "global_step": 390142, "epoch": 2322} {"train_loss": -11.883337020874023, "global_step": 390143, "epoch": 2322} {"train_loss": -11.292069435119629, "global_step": 390144, "epoch": 2322} {"train_loss": -11.59264087677002, "global_step": 390145, "epoch": 2322} {"train_loss": -11.70064926147461, "global_step": 390146, "epoch": 2322} {"train_loss": -11.582674026489258, "global_step": 390147, "epoch": 2322} {"train_loss": -12.032072067260742, "global_step": 390148, "epoch": 2322} {"train_loss": -11.870109558105469, "global_step": 390149, "epoch": 2322} {"train_loss": -11.508249282836914, "global_step": 390150, "epoch": 2322} {"train_loss": -11.268622398376465, "global_step": 390151, "epoch": 2322} {"train_loss": -11.097259521484375, "global_step": 390152, "epoch": 2322} {"train_loss": -10.768604278564453, "global_step": 390153, "epoch": 2322} {"train_loss": -11.81074333190918, "global_step": 390154, "epoch": 2322} {"train_loss": -11.055736541748047, "global_step": 390155, "epoch": 2322} {"train_loss": -11.839113235473633, "global_step": 390156, "epoch": 2322} {"train_loss": -11.205009460449219, "global_step": 390157, "epoch": 2322} {"train_loss": -11.80579662322998, "global_step": 390158, "epoch": 2322} {"train_loss": -11.345218658447266, "global_step": 390159, "epoch": 2322} {"train_loss": -11.120210647583008, "global_step": 390160, "epoch": 2322} {"train_loss": -11.757816314697266, "global_step": 390161, "epoch": 2322} {"train_loss": -10.913097381591797, "global_step": 390162, "epoch": 2322} {"train_loss": -11.888486862182617, "global_step": 390163, "epoch": 2322} {"train_loss": -11.708300590515137, "global_step": 390164, "epoch": 2322} {"train_loss": -11.721484184265137, "global_step": 390165, "epoch": 2322} {"train_loss": -11.72877025604248, "global_step": 390166, "epoch": 2322} {"train_loss": -11.82361125946045, "global_step": 390167, "epoch": 2322} {"train_loss": -11.840397834777832, "global_step": 390168, "epoch": 2322} {"train_loss": -12.257554054260254, "global_step": 390169, "epoch": 2322} {"train_loss": -11.998846054077148, "global_step": 390170, "epoch": 2322} {"train_loss": -12.046905517578125, "global_step": 390171, "epoch": 2322} {"train_loss": -11.960861206054688, "global_step": 390172, "epoch": 2322} {"train_loss": -12.36955451965332, "global_step": 390173, "epoch": 2322} {"train_loss": -12.032387733459473, "global_step": 390174, "epoch": 2322} {"train_loss": -12.232388496398926, "global_step": 390175, "epoch": 2322} {"train_loss": -12.042438507080078, "global_step": 390176, "epoch": 2322} {"train_loss": -12.053672790527344, "global_step": 390177, "epoch": 2322} {"train_loss": -12.204617500305176, "global_step": 390178, "epoch": 2322} {"train_loss": -12.005035400390625, "global_step": 390179, "epoch": 2322} {"train_loss": -12.415714263916016, "global_step": 390180, "epoch": 2322} {"train_loss": -12.127277374267578, "global_step": 390181, "epoch": 2322} {"train_loss": -12.359253883361816, "global_step": 390182, "epoch": 2322} {"train_loss": -12.165635108947754, "global_step": 390183, "epoch": 2322} {"train_loss": -12.167580604553223, "global_step": 390184, "epoch": 2322} {"train_loss": -12.28256607055664, "global_step": 390185, "epoch": 2322} {"train_loss": -12.09909439086914, "global_step": 390186, "epoch": 2322} {"train_loss": -12.100469589233398, "global_step": 390187, "epoch": 2322} {"train_loss": -12.55360221862793, "global_step": 390188, "epoch": 2322} {"train_loss": -12.1358642578125, "global_step": 390189, "epoch": 2322} {"train_loss": -12.533662796020508, "global_step": 390190, "epoch": 2322} {"train_loss": -12.313551902770996, "global_step": 390191, "epoch": 2322} {"train_loss": -12.336888313293457, "global_step": 390192, "epoch": 2322} {"train_loss": -12.56893539428711, "global_step": 390193, "epoch": 2322} {"train_loss": -12.137096405029297, "global_step": 390194, "epoch": 2322} {"train_loss": -12.465605735778809, "global_step": 390195, "epoch": 2322} {"train_loss": -12.46481990814209, "global_step": 390196, "epoch": 2322} {"train_loss": -12.197855949401855, "global_step": 390197, "epoch": 2322} {"train_loss": -12.484026908874512, "global_step": 390198, "epoch": 2322} {"train_loss": -12.396318435668945, "global_step": 390199, "epoch": 2322} {"train_loss": -12.552751541137695, "global_step": 390200, "epoch": 2322} {"train_loss": -12.376032829284668, "global_step": 390201, "epoch": 2322} {"train_loss": -12.53473949432373, "global_step": 390202, "epoch": 2322} {"train_loss": -12.536367416381836, "global_step": 390203, "epoch": 2322} {"train_loss": -12.310901641845703, "global_step": 390204, "epoch": 2322} {"train_loss": -12.563340187072754, "global_step": 390205, "epoch": 2322} {"train_loss": -12.185562133789062, "global_step": 390206, "epoch": 2322} {"train_loss": -12.619288444519043, "global_step": 390207, "epoch": 2322} {"train_loss": -12.186738967895508, "global_step": 390208, "epoch": 2322} {"train_loss": -12.355951309204102, "global_step": 390209, "epoch": 2322} {"train_loss": -12.565622329711914, "global_step": 390210, "epoch": 2322} {"train_loss": -12.152742385864258, "global_step": 390211, "epoch": 2322} {"train_loss": -12.372852325439453, "global_step": 390212, "epoch": 2322} {"train_loss": -11.945517539978027, "global_step": 390213, "epoch": 2322} {"train_loss": -12.226310729980469, "global_step": 390214, "epoch": 2322} {"train_loss": -12.04434585571289, "global_step": 390215, "epoch": 2322} {"train_loss": -12.237913131713867, "global_step": 390216, "epoch": 2322} {"train_loss": -12.499972343444824, "global_step": 390217, "epoch": 2322} {"train_loss": -11.993443489074707, "global_step": 390218, "epoch": 2322} {"train_loss": -12.522920608520508, "global_step": 390219, "epoch": 2322} {"train_loss": -12.015754699707031, "global_step": 390220, "epoch": 2322} {"train_loss": -12.49379825592041, "global_step": 390221, "epoch": 2322} {"train_loss": -12.697408676147461, "global_step": 390222, "epoch": 2322} {"train_loss": -12.381979942321777, "global_step": 390223, "epoch": 2322} {"train_loss": -12.615837097167969, "global_step": 390224, "epoch": 2322} {"train_loss": -12.404752731323242, "global_step": 390225, "epoch": 2322} {"train_loss": -12.613997459411621, "global_step": 390226, "epoch": 2322} {"train_loss": -12.628812789916992, "global_step": 390227, "epoch": 2322} {"train_loss": -12.63438606262207, "global_step": 390228, "epoch": 2322} {"train_loss": -12.423648834228516, "global_step": 390229, "epoch": 2322} {"train_loss": -12.681267738342285, "global_step": 390230, "epoch": 2322} {"train_loss": -12.528623580932617, "global_step": 390231, "epoch": 2322} {"train_loss": -12.560285568237305, "global_step": 390232, "epoch": 2322} {"train_loss": -12.656839370727539, "global_step": 390233, "epoch": 2322} {"train_loss": -12.397415161132812, "global_step": 390234, "epoch": 2322} {"train_loss": -12.242971420288086, "global_step": 390235, "epoch": 2322} {"train_loss": -12.569515228271484, "global_step": 390236, "epoch": 2322} {"train_loss": -12.109748840332031, "global_step": 390237, "epoch": 2322} {"train_loss": -12.001195907592773, "global_step": 390238, "epoch": 2322} {"train_loss": -12.523545265197754, "global_step": 390239, "epoch": 2322} {"train_loss": -12.270264625549316, "global_step": 390240, "epoch": 2322} {"train_loss": -12.285893440246582, "global_step": 390241, "epoch": 2322} {"train_loss": -12.283422470092773, "global_step": 390242, "epoch": 2322} {"train_loss": -12.340879440307617, "global_step": 390243, "epoch": 2322} {"train_loss": -12.441726684570312, "global_step": 390244, "epoch": 2322} {"train_loss": -12.541645050048828, "global_step": 390245, "epoch": 2322} {"train_loss": -12.462828636169434, "global_step": 390246, "epoch": 2322} {"train_loss": -12.410563468933105, "global_step": 390247, "epoch": 2322} {"train_loss": -12.183876991271973, "global_step": 390248, "epoch": 2322} {"train_loss": -12.402502059936523, "global_step": 390249, "epoch": 2322} {"train_loss": -12.124923706054688, "global_step": 390250, "epoch": 2322} {"train_loss": -12.05435848236084, "global_step": 390251, "epoch": 2322} {"train_loss": -12.496853828430176, "global_step": 390252, "epoch": 2322} {"train_loss": -12.451739311218262, "global_step": 390253, "epoch": 2322} {"train_loss": -10.745540618896484, "global_step": 390254, "epoch": 2322} {"train_loss": -12.603961944580078, "global_step": 390255, "epoch": 2322} {"train_loss": -11.177314758300781, "global_step": 390256, "epoch": 2322} {"train_loss": -10.762134552001953, "global_step": 390257, "epoch": 2322} {"train_loss": -12.365653991699219, "global_step": 390258, "epoch": 2322} {"train_loss": -10.654403686523438, "global_step": 390259, "epoch": 2322} {"train_loss": -11.214264869689941, "global_step": 390260, "epoch": 2322} {"train_loss": -12.440775871276855, "global_step": 390261, "epoch": 2322} {"train_loss": -11.105636596679688, "global_step": 390262, "epoch": 2322} {"train_loss": -11.907419380687532, "global_step": 390263, "epoch": 2322, "val_loss": 300206.125} {"train_loss": -11.07876968383789, "global_step": 390264, "epoch": 2323} {"train_loss": -9.822078704833984, "global_step": 390265, "epoch": 2323} {"train_loss": -8.976451873779297, "global_step": 390266, "epoch": 2323} {"train_loss": -11.967637062072754, "global_step": 390267, "epoch": 2323} {"train_loss": -8.242464065551758, "global_step": 390268, "epoch": 2323} {"train_loss": -11.829212188720703, "global_step": 390269, "epoch": 2323} {"train_loss": -9.678447723388672, "global_step": 390270, "epoch": 2323} {"train_loss": -10.284564971923828, "global_step": 390271, "epoch": 2323} {"train_loss": -9.634842872619629, "global_step": 390272, "epoch": 2323} {"train_loss": -11.768162727355957, "global_step": 390273, "epoch": 2323} {"train_loss": -11.012792587280273, "global_step": 390274, "epoch": 2323} {"train_loss": -12.241193771362305, "global_step": 390275, "epoch": 2323} {"train_loss": -11.112470626831055, "global_step": 390276, "epoch": 2323} {"train_loss": -12.305194854736328, "global_step": 390277, "epoch": 2323} {"train_loss": -11.573309898376465, "global_step": 390278, "epoch": 2323} {"train_loss": -11.272430419921875, "global_step": 390279, "epoch": 2323} {"train_loss": -11.765485763549805, "global_step": 390280, "epoch": 2323} {"train_loss": -11.327396392822266, "global_step": 390281, "epoch": 2323} {"train_loss": -11.721769332885742, "global_step": 390282, "epoch": 2323} {"train_loss": -10.24809455871582, "global_step": 390283, "epoch": 2323} {"train_loss": -11.840410232543945, "global_step": 390284, "epoch": 2323} {"train_loss": -10.982139587402344, "global_step": 390285, "epoch": 2323} {"train_loss": -12.168668746948242, "global_step": 390286, "epoch": 2323} {"train_loss": -11.622249603271484, "global_step": 390287, "epoch": 2323} {"train_loss": -12.041411399841309, "global_step": 390288, "epoch": 2323} {"train_loss": -11.89425277709961, "global_step": 390289, "epoch": 2323} {"train_loss": -12.025327682495117, "global_step": 390290, "epoch": 2323} {"train_loss": -11.823563575744629, "global_step": 390291, "epoch": 2323} {"train_loss": -11.829080581665039, "global_step": 390292, "epoch": 2323} {"train_loss": -11.543280601501465, "global_step": 390293, "epoch": 2323} {"train_loss": -11.765731811523438, "global_step": 390294, "epoch": 2323} {"train_loss": -11.91970443725586, "global_step": 390295, "epoch": 2323} {"train_loss": -12.165884017944336, "global_step": 390296, "epoch": 2323} {"train_loss": -11.461938858032227, "global_step": 390297, "epoch": 2323} {"train_loss": -12.246467590332031, "global_step": 390298, "epoch": 2323} {"train_loss": -11.571146011352539, "global_step": 390299, "epoch": 2323} {"train_loss": -12.091550827026367, "global_step": 390300, "epoch": 2323} {"train_loss": -11.71826171875, "global_step": 390301, "epoch": 2323} {"train_loss": -12.247936248779297, "global_step": 390302, "epoch": 2323} {"train_loss": -11.557828903198242, "global_step": 390303, "epoch": 2323} {"train_loss": -12.267724990844727, "global_step": 390304, "epoch": 2323} {"train_loss": -12.026241302490234, "global_step": 390305, "epoch": 2323} {"train_loss": -12.021434783935547, "global_step": 390306, "epoch": 2323} {"train_loss": -11.938539505004883, "global_step": 390307, "epoch": 2323} {"train_loss": -12.015204429626465, "global_step": 390308, "epoch": 2323} {"train_loss": -12.233719825744629, "global_step": 390309, "epoch": 2323} {"train_loss": -12.151847839355469, "global_step": 390310, "epoch": 2323} {"train_loss": -12.111279487609863, "global_step": 390311, "epoch": 2323} {"train_loss": -12.31203842163086, "global_step": 390312, "epoch": 2323} {"train_loss": -12.152294158935547, "global_step": 390313, "epoch": 2323} {"train_loss": -12.18073558807373, "global_step": 390314, "epoch": 2323} {"train_loss": -12.229751586914062, "global_step": 390315, "epoch": 2323} {"train_loss": -12.431486129760742, "global_step": 390316, "epoch": 2323} {"train_loss": -12.065908432006836, "global_step": 390317, "epoch": 2323} {"train_loss": -12.380621910095215, "global_step": 390318, "epoch": 2323} {"train_loss": -11.984968185424805, "global_step": 390319, "epoch": 2323} {"train_loss": -12.231969833374023, "global_step": 390320, "epoch": 2323} {"train_loss": -12.123172760009766, "global_step": 390321, "epoch": 2323} {"train_loss": -11.887845993041992, "global_step": 390322, "epoch": 2323} {"train_loss": -12.320903778076172, "global_step": 390323, "epoch": 2323} {"train_loss": -12.010251998901367, "global_step": 390324, "epoch": 2323} {"train_loss": -12.242788314819336, "global_step": 390325, "epoch": 2323} {"train_loss": -12.366823196411133, "global_step": 390326, "epoch": 2323} {"train_loss": -12.47531795501709, "global_step": 390327, "epoch": 2323} {"train_loss": -12.356765747070312, "global_step": 390328, "epoch": 2323} {"train_loss": -12.131706237792969, "global_step": 390329, "epoch": 2323} {"train_loss": -12.383376121520996, "global_step": 390330, "epoch": 2323} {"train_loss": -11.481008529663086, "global_step": 390331, "epoch": 2323} {"train_loss": -10.916954040527344, "global_step": 390332, "epoch": 2323} {"train_loss": -12.13962173461914, "global_step": 390333, "epoch": 2323} {"train_loss": -11.46850872039795, "global_step": 390334, "epoch": 2323} {"train_loss": -11.794788360595703, "global_step": 390335, "epoch": 2323} {"train_loss": -11.787873268127441, "global_step": 390336, "epoch": 2323} {"train_loss": -11.843618392944336, "global_step": 390337, "epoch": 2323} {"train_loss": -11.976278305053711, "global_step": 390338, "epoch": 2323} {"train_loss": -11.329996109008789, "global_step": 390339, "epoch": 2323} {"train_loss": -12.157356262207031, "global_step": 390340, "epoch": 2323} {"train_loss": -10.797536849975586, "global_step": 390341, "epoch": 2323} {"train_loss": -11.409951210021973, "global_step": 390342, "epoch": 2323} {"train_loss": -11.70737361907959, "global_step": 390343, "epoch": 2323} {"train_loss": -10.894784927368164, "global_step": 390344, "epoch": 2323} {"train_loss": -12.119136810302734, "global_step": 390345, "epoch": 2323} {"train_loss": -10.991296768188477, "global_step": 390346, "epoch": 2323} {"train_loss": -11.887977600097656, "global_step": 390347, "epoch": 2323} {"train_loss": -12.07641315460205, "global_step": 390348, "epoch": 2323} {"train_loss": -11.45872688293457, "global_step": 390349, "epoch": 2323} {"train_loss": -12.500224113464355, "global_step": 390350, "epoch": 2323} {"train_loss": -11.714332580566406, "global_step": 390351, "epoch": 2323} {"train_loss": -12.174473762512207, "global_step": 390352, "epoch": 2323} {"train_loss": -11.970333099365234, "global_step": 390353, "epoch": 2323} {"train_loss": -11.999773979187012, "global_step": 390354, "epoch": 2323} {"train_loss": -12.102280616760254, "global_step": 390355, "epoch": 2323} {"train_loss": -11.73779010772705, "global_step": 390356, "epoch": 2323} {"train_loss": -12.253655433654785, "global_step": 390357, "epoch": 2323} {"train_loss": -11.806845664978027, "global_step": 390358, "epoch": 2323} {"train_loss": -12.226171493530273, "global_step": 390359, "epoch": 2323} {"train_loss": -11.658738136291504, "global_step": 390360, "epoch": 2323} {"train_loss": -12.02596664428711, "global_step": 390361, "epoch": 2323} {"train_loss": -11.747408866882324, "global_step": 390362, "epoch": 2323} {"train_loss": -12.029277801513672, "global_step": 390363, "epoch": 2323} {"train_loss": -11.5698823928833, "global_step": 390364, "epoch": 2323} {"train_loss": -11.7989501953125, "global_step": 390365, "epoch": 2323} {"train_loss": -10.896374702453613, "global_step": 390366, "epoch": 2323} {"train_loss": -12.136503219604492, "global_step": 390367, "epoch": 2323} {"train_loss": -11.423628807067871, "global_step": 390368, "epoch": 2323} {"train_loss": -12.029108047485352, "global_step": 390369, "epoch": 2323} {"train_loss": -11.528088569641113, "global_step": 390370, "epoch": 2323} {"train_loss": -11.860509872436523, "global_step": 390371, "epoch": 2323} {"train_loss": -12.215784072875977, "global_step": 390372, "epoch": 2323} {"train_loss": -11.668938636779785, "global_step": 390373, "epoch": 2323} {"train_loss": -11.954743385314941, "global_step": 390374, "epoch": 2323} {"train_loss": -12.099260330200195, "global_step": 390375, "epoch": 2323} {"train_loss": -11.549417495727539, "global_step": 390376, "epoch": 2323} {"train_loss": -12.123381614685059, "global_step": 390377, "epoch": 2323} {"train_loss": -11.547734260559082, "global_step": 390378, "epoch": 2323} {"train_loss": -10.973745346069336, "global_step": 390379, "epoch": 2323} {"train_loss": -12.058765411376953, "global_step": 390380, "epoch": 2323} {"train_loss": -10.21463394165039, "global_step": 390381, "epoch": 2323} {"train_loss": -11.291131973266602, "global_step": 390382, "epoch": 2323} {"train_loss": -11.307334899902344, "global_step": 390383, "epoch": 2323} {"train_loss": -10.84919548034668, "global_step": 390384, "epoch": 2323} {"train_loss": -10.90904426574707, "global_step": 390385, "epoch": 2323} {"train_loss": -11.467479705810547, "global_step": 390386, "epoch": 2323} {"train_loss": -10.885615348815918, "global_step": 390387, "epoch": 2323} {"train_loss": -11.898755073547363, "global_step": 390388, "epoch": 2323} {"train_loss": -10.867117881774902, "global_step": 390389, "epoch": 2323} {"train_loss": -11.38253402709961, "global_step": 390390, "epoch": 2323} {"train_loss": -11.305665969848633, "global_step": 390391, "epoch": 2323} {"train_loss": -10.57559585571289, "global_step": 390392, "epoch": 2323} {"train_loss": -12.051755905151367, "global_step": 390393, "epoch": 2323} {"train_loss": -11.546351432800293, "global_step": 390394, "epoch": 2323} {"train_loss": -11.395341873168945, "global_step": 390395, "epoch": 2323} {"train_loss": -12.384221076965332, "global_step": 390396, "epoch": 2323} {"train_loss": -11.77936840057373, "global_step": 390397, "epoch": 2323} {"train_loss": -11.48715877532959, "global_step": 390398, "epoch": 2323} {"train_loss": -12.221309661865234, "global_step": 390399, "epoch": 2323} {"train_loss": -11.541082382202148, "global_step": 390400, "epoch": 2323} {"train_loss": -12.02114486694336, "global_step": 390401, "epoch": 2323} {"train_loss": -11.93739128112793, "global_step": 390402, "epoch": 2323} {"train_loss": -11.948155403137207, "global_step": 390403, "epoch": 2323} {"train_loss": -11.756904602050781, "global_step": 390404, "epoch": 2323} {"train_loss": -11.8519868850708, "global_step": 390405, "epoch": 2323} {"train_loss": -11.919607162475586, "global_step": 390406, "epoch": 2323} {"train_loss": -12.13312816619873, "global_step": 390407, "epoch": 2323} {"train_loss": -11.685041427612305, "global_step": 390408, "epoch": 2323} {"train_loss": -12.148048400878906, "global_step": 390409, "epoch": 2323} {"train_loss": -11.786937713623047, "global_step": 390410, "epoch": 2323} {"train_loss": -12.264881134033203, "global_step": 390411, "epoch": 2323} {"train_loss": -11.970810890197754, "global_step": 390412, "epoch": 2323} {"train_loss": -12.248634338378906, "global_step": 390413, "epoch": 2323} {"train_loss": -12.191810607910156, "global_step": 390414, "epoch": 2323} {"train_loss": -12.38839340209961, "global_step": 390415, "epoch": 2323} {"train_loss": -12.100669860839844, "global_step": 390416, "epoch": 2323} {"train_loss": -11.896358489990234, "global_step": 390417, "epoch": 2323} {"train_loss": -12.021200180053711, "global_step": 390418, "epoch": 2323} {"train_loss": -12.206947326660156, "global_step": 390419, "epoch": 2323} {"train_loss": -11.719808578491211, "global_step": 390420, "epoch": 2323} {"train_loss": -12.21119213104248, "global_step": 390421, "epoch": 2323} {"train_loss": -12.13516616821289, "global_step": 390422, "epoch": 2323} {"train_loss": -12.243926048278809, "global_step": 390423, "epoch": 2323} {"train_loss": -12.272174835205078, "global_step": 390424, "epoch": 2323} {"train_loss": -12.013716697692871, "global_step": 390425, "epoch": 2323} {"train_loss": -12.369648933410645, "global_step": 390426, "epoch": 2323} {"train_loss": -12.053939819335938, "global_step": 390427, "epoch": 2323} {"train_loss": -12.432455062866211, "global_step": 390428, "epoch": 2323} {"train_loss": -12.227835655212402, "global_step": 390429, "epoch": 2323} {"train_loss": -12.288662910461426, "global_step": 390430, "epoch": 2323} {"train_loss": -11.746115917251224, "global_step": 390431, "epoch": 2323, "val_loss": 294139.53125} {"train_loss": -12.439924240112305, "global_step": 390432, "epoch": 2324} {"train_loss": -12.46994400024414, "global_step": 390433, "epoch": 2324} {"train_loss": -12.371078491210938, "global_step": 390434, "epoch": 2324} {"train_loss": -12.406719207763672, "global_step": 390435, "epoch": 2324} {"train_loss": -12.63294506072998, "global_step": 390436, "epoch": 2324} {"train_loss": -12.230186462402344, "global_step": 390437, "epoch": 2324} {"train_loss": -12.281110763549805, "global_step": 390438, "epoch": 2324} {"train_loss": -12.409217834472656, "global_step": 390439, "epoch": 2324} {"train_loss": -12.57809066772461, "global_step": 390440, "epoch": 2324} {"train_loss": -12.520818710327148, "global_step": 390441, "epoch": 2324} {"train_loss": -12.663121223449707, "global_step": 390442, "epoch": 2324} {"train_loss": -12.810066223144531, "global_step": 390443, "epoch": 2324} {"train_loss": -12.620992660522461, "global_step": 390444, "epoch": 2324} {"train_loss": -12.595123291015625, "global_step": 390445, "epoch": 2324} {"train_loss": -12.611881256103516, "global_step": 390446, "epoch": 2324} {"train_loss": -12.299970626831055, "global_step": 390447, "epoch": 2324} {"train_loss": -12.721739768981934, "global_step": 390448, "epoch": 2324} {"train_loss": -12.674314498901367, "global_step": 390449, "epoch": 2324} {"train_loss": -12.45885944366455, "global_step": 390450, "epoch": 2324} {"train_loss": -12.660904884338379, "global_step": 390451, "epoch": 2324} {"train_loss": -12.673016548156738, "global_step": 390452, "epoch": 2324} {"train_loss": -12.599287986755371, "global_step": 390453, "epoch": 2324} {"train_loss": -12.07533073425293, "global_step": 390454, "epoch": 2324} {"train_loss": -12.759420394897461, "global_step": 390455, "epoch": 2324} {"train_loss": -12.328962326049805, "global_step": 390456, "epoch": 2324} {"train_loss": -12.401866912841797, "global_step": 390457, "epoch": 2324} {"train_loss": -12.668740272521973, "global_step": 390458, "epoch": 2324} {"train_loss": -11.948487281799316, "global_step": 390459, "epoch": 2324} {"train_loss": -12.384712219238281, "global_step": 390460, "epoch": 2324} {"train_loss": -12.666396141052246, "global_step": 390461, "epoch": 2324} {"train_loss": -12.453922271728516, "global_step": 390462, "epoch": 2324} {"train_loss": -12.579817771911621, "global_step": 390463, "epoch": 2324} {"train_loss": -12.64675521850586, "global_step": 390464, "epoch": 2324} {"train_loss": -12.774829864501953, "global_step": 390465, "epoch": 2324} {"train_loss": -12.701504707336426, "global_step": 390466, "epoch": 2324} {"train_loss": -12.645471572875977, "global_step": 390467, "epoch": 2324} {"train_loss": -12.69573974609375, "global_step": 390468, "epoch": 2324} {"train_loss": -12.600822448730469, "global_step": 390469, "epoch": 2324} {"train_loss": -12.778814315795898, "global_step": 390470, "epoch": 2324} {"train_loss": -12.738641738891602, "global_step": 390471, "epoch": 2324} {"train_loss": -12.536582946777344, "global_step": 390472, "epoch": 2324} {"train_loss": -12.767285346984863, "global_step": 390473, "epoch": 2324} {"train_loss": -12.33928394317627, "global_step": 390474, "epoch": 2324} {"train_loss": -12.842215538024902, "global_step": 390475, "epoch": 2324} {"train_loss": -11.776784896850586, "global_step": 390476, "epoch": 2324} {"train_loss": -12.057320594787598, "global_step": 390477, "epoch": 2324} {"train_loss": -12.293319702148438, "global_step": 390478, "epoch": 2324} {"train_loss": -12.804126739501953, "global_step": 390479, "epoch": 2324} {"train_loss": -12.369359016418457, "global_step": 390480, "epoch": 2324} {"train_loss": -12.675704002380371, "global_step": 390481, "epoch": 2324} {"train_loss": -12.622468948364258, "global_step": 390482, "epoch": 2324} {"train_loss": -12.81687068939209, "global_step": 390483, "epoch": 2324} {"train_loss": -12.541217803955078, "global_step": 390484, "epoch": 2324} {"train_loss": -12.262821197509766, "global_step": 390485, "epoch": 2324} {"train_loss": -11.57860279083252, "global_step": 390486, "epoch": 2324} {"train_loss": -12.486884117126465, "global_step": 390487, "epoch": 2324} {"train_loss": -12.244160652160645, "global_step": 390488, "epoch": 2324} {"train_loss": -11.67181396484375, "global_step": 390489, "epoch": 2324} {"train_loss": -11.25693130493164, "global_step": 390490, "epoch": 2324} {"train_loss": -12.117528915405273, "global_step": 390491, "epoch": 2324} {"train_loss": -12.64207649230957, "global_step": 390492, "epoch": 2324} {"train_loss": -11.872955322265625, "global_step": 390493, "epoch": 2324} {"train_loss": -12.543161392211914, "global_step": 390494, "epoch": 2324} {"train_loss": -11.656264305114746, "global_step": 390495, "epoch": 2324} {"train_loss": -11.890045166015625, "global_step": 390496, "epoch": 2324} {"train_loss": -12.021989822387695, "global_step": 390497, "epoch": 2324} {"train_loss": -11.675063133239746, "global_step": 390498, "epoch": 2324} {"train_loss": -12.593827247619629, "global_step": 390499, "epoch": 2324} {"train_loss": -12.135564804077148, "global_step": 390500, "epoch": 2324} {"train_loss": -12.10679817199707, "global_step": 390501, "epoch": 2324} {"train_loss": -12.51527214050293, "global_step": 390502, "epoch": 2324} {"train_loss": -12.386609077453613, "global_step": 390503, "epoch": 2324} {"train_loss": -12.006246566772461, "global_step": 390504, "epoch": 2324} {"train_loss": -12.162452697753906, "global_step": 390505, "epoch": 2324} {"train_loss": -11.990165710449219, "global_step": 390506, "epoch": 2324} {"train_loss": -11.24222183227539, "global_step": 390507, "epoch": 2324} {"train_loss": -12.293319702148438, "global_step": 390508, "epoch": 2324} {"train_loss": -11.628213882446289, "global_step": 390509, "epoch": 2324} {"train_loss": -11.666979789733887, "global_step": 390510, "epoch": 2324} {"train_loss": -12.044563293457031, "global_step": 390511, "epoch": 2324} {"train_loss": -10.255743980407715, "global_step": 390512, "epoch": 2324} {"train_loss": -12.764883041381836, "global_step": 390513, "epoch": 2324} {"train_loss": -10.88193130493164, "global_step": 390514, "epoch": 2324} {"train_loss": -11.919792175292969, "global_step": 390515, "epoch": 2324} {"train_loss": -12.03740119934082, "global_step": 390516, "epoch": 2324} {"train_loss": -11.833648681640625, "global_step": 390517, "epoch": 2324} {"train_loss": -12.28763198852539, "global_step": 390518, "epoch": 2324} {"train_loss": -11.510281562805176, "global_step": 390519, "epoch": 2324} {"train_loss": -12.387751579284668, "global_step": 390520, "epoch": 2324} {"train_loss": -11.642080307006836, "global_step": 390521, "epoch": 2324} {"train_loss": -12.354999542236328, "global_step": 390522, "epoch": 2324} {"train_loss": -12.106537818908691, "global_step": 390523, "epoch": 2324} {"train_loss": -11.84616470336914, "global_step": 390524, "epoch": 2324} {"train_loss": -11.903058052062988, "global_step": 390525, "epoch": 2324} {"train_loss": -12.069305419921875, "global_step": 390526, "epoch": 2324} {"train_loss": -11.96505355834961, "global_step": 390527, "epoch": 2324} {"train_loss": -11.598834991455078, "global_step": 390528, "epoch": 2324} {"train_loss": -12.057989120483398, "global_step": 390529, "epoch": 2324} {"train_loss": -12.239911079406738, "global_step": 390530, "epoch": 2324} {"train_loss": -12.080883979797363, "global_step": 390531, "epoch": 2324} {"train_loss": -11.831953048706055, "global_step": 390532, "epoch": 2324} {"train_loss": -11.940927505493164, "global_step": 390533, "epoch": 2324} {"train_loss": -12.322233200073242, "global_step": 390534, "epoch": 2324} {"train_loss": -12.216526985168457, "global_step": 390535, "epoch": 2324} {"train_loss": -12.469803810119629, "global_step": 390536, "epoch": 2324} {"train_loss": -12.168206214904785, "global_step": 390537, "epoch": 2324} {"train_loss": -12.093633651733398, "global_step": 390538, "epoch": 2324} {"train_loss": -12.332191467285156, "global_step": 390539, "epoch": 2324} {"train_loss": -12.496208190917969, "global_step": 390540, "epoch": 2324} {"train_loss": -12.185108184814453, "global_step": 390541, "epoch": 2324} {"train_loss": -12.581636428833008, "global_step": 390542, "epoch": 2324} {"train_loss": -12.337418556213379, "global_step": 390543, "epoch": 2324} {"train_loss": -12.341348648071289, "global_step": 390544, "epoch": 2324} {"train_loss": -12.350813865661621, "global_step": 390545, "epoch": 2324} {"train_loss": -12.021541595458984, "global_step": 390546, "epoch": 2324} {"train_loss": -11.70418643951416, "global_step": 390547, "epoch": 2324} {"train_loss": -12.384685516357422, "global_step": 390548, "epoch": 2324} {"train_loss": -11.65304946899414, "global_step": 390549, "epoch": 2324} {"train_loss": -10.884883880615234, "global_step": 390550, "epoch": 2324} {"train_loss": -12.086068153381348, "global_step": 390551, "epoch": 2324} {"train_loss": -11.995800018310547, "global_step": 390552, "epoch": 2324} {"train_loss": -11.142324447631836, "global_step": 390553, "epoch": 2324} {"train_loss": -11.107900619506836, "global_step": 390554, "epoch": 2324} {"train_loss": -12.27425765991211, "global_step": 390555, "epoch": 2324} {"train_loss": -9.918448448181152, "global_step": 390556, "epoch": 2324} {"train_loss": -9.165633201599121, "global_step": 390557, "epoch": 2324} {"train_loss": -10.338773727416992, "global_step": 390558, "epoch": 2324} {"train_loss": -9.327116012573242, "global_step": 390559, "epoch": 2324} {"train_loss": -9.51181411743164, "global_step": 390560, "epoch": 2324} {"train_loss": -11.47611141204834, "global_step": 390561, "epoch": 2324} {"train_loss": -11.06867504119873, "global_step": 390562, "epoch": 2324} {"train_loss": -11.614615440368652, "global_step": 390563, "epoch": 2324} {"train_loss": -11.296958923339844, "global_step": 390564, "epoch": 2324} {"train_loss": -10.644001007080078, "global_step": 390565, "epoch": 2324} {"train_loss": -11.778624534606934, "global_step": 390566, "epoch": 2324} {"train_loss": -11.448431968688965, "global_step": 390567, "epoch": 2324} {"train_loss": -11.731401443481445, "global_step": 390568, "epoch": 2324} {"train_loss": -11.421571731567383, "global_step": 390569, "epoch": 2324} {"train_loss": -11.479055404663086, "global_step": 390570, "epoch": 2324} {"train_loss": -11.032588958740234, "global_step": 390571, "epoch": 2324} {"train_loss": -11.620112419128418, "global_step": 390572, "epoch": 2324} {"train_loss": -11.709006309509277, "global_step": 390573, "epoch": 2324} {"train_loss": -10.682984352111816, "global_step": 390574, "epoch": 2324} {"train_loss": -11.613449096679688, "global_step": 390575, "epoch": 2324} {"train_loss": -11.511871337890625, "global_step": 390576, "epoch": 2324} {"train_loss": -11.567695617675781, "global_step": 390577, "epoch": 2324} {"train_loss": -11.609024047851562, "global_step": 390578, "epoch": 2324} {"train_loss": -12.081872940063477, "global_step": 390579, "epoch": 2324} {"train_loss": -11.80770492553711, "global_step": 390580, "epoch": 2324} {"train_loss": -12.118099212646484, "global_step": 390581, "epoch": 2324} {"train_loss": -11.386760711669922, "global_step": 390582, "epoch": 2324} {"train_loss": -11.881345748901367, "global_step": 390583, "epoch": 2324} {"train_loss": -11.527740478515625, "global_step": 390584, "epoch": 2324} {"train_loss": -12.134550094604492, "global_step": 390585, "epoch": 2324} {"train_loss": -12.168096542358398, "global_step": 390586, "epoch": 2324} {"train_loss": -11.926612854003906, "global_step": 390587, "epoch": 2324} {"train_loss": -12.270071983337402, "global_step": 390588, "epoch": 2324} {"train_loss": -12.134723663330078, "global_step": 390589, "epoch": 2324} {"train_loss": -11.8942289352417, "global_step": 390590, "epoch": 2324} {"train_loss": -12.26222038269043, "global_step": 390591, "epoch": 2324} {"train_loss": -12.212793350219727, "global_step": 390592, "epoch": 2324} {"train_loss": -12.141401290893555, "global_step": 390593, "epoch": 2324} {"train_loss": -12.297134399414062, "global_step": 390594, "epoch": 2324} {"train_loss": -12.149070739746094, "global_step": 390595, "epoch": 2324} {"train_loss": -12.544273376464844, "global_step": 390596, "epoch": 2324} {"train_loss": -12.11916732788086, "global_step": 390597, "epoch": 2324} {"train_loss": -12.18600845336914, "global_step": 390598, "epoch": 2324} {"train_loss": -12.039652710869198, "global_step": 390599, "epoch": 2324, "val_loss": 299559.84375} {"train_loss": -12.344266891479492, "global_step": 390600, "epoch": 2325} {"train_loss": -12.497139930725098, "global_step": 390601, "epoch": 2325} {"train_loss": -12.41379165649414, "global_step": 390602, "epoch": 2325} {"train_loss": -12.44870376586914, "global_step": 390603, "epoch": 2325} {"train_loss": -12.569929122924805, "global_step": 390604, "epoch": 2325} {"train_loss": -12.344988822937012, "global_step": 390605, "epoch": 2325} {"train_loss": -12.58418083190918, "global_step": 390606, "epoch": 2325} {"train_loss": -12.644414901733398, "global_step": 390607, "epoch": 2325} {"train_loss": -12.561775207519531, "global_step": 390608, "epoch": 2325} {"train_loss": -12.50218391418457, "global_step": 390609, "epoch": 2325} {"train_loss": -12.523228645324707, "global_step": 390610, "epoch": 2325} {"train_loss": -12.539558410644531, "global_step": 390611, "epoch": 2325} {"train_loss": -12.574804306030273, "global_step": 390612, "epoch": 2325} {"train_loss": -12.316682815551758, "global_step": 390613, "epoch": 2325} {"train_loss": -12.412859916687012, "global_step": 390614, "epoch": 2325} {"train_loss": -12.265049934387207, "global_step": 390615, "epoch": 2325} {"train_loss": -12.430830001831055, "global_step": 390616, "epoch": 2325} {"train_loss": -12.371461868286133, "global_step": 390617, "epoch": 2325} {"train_loss": -12.474384307861328, "global_step": 390618, "epoch": 2325} {"train_loss": -12.260072708129883, "global_step": 390619, "epoch": 2325} {"train_loss": -12.494661331176758, "global_step": 390620, "epoch": 2325} {"train_loss": -12.430580139160156, "global_step": 390621, "epoch": 2325} {"train_loss": -12.74917221069336, "global_step": 390622, "epoch": 2325} {"train_loss": -12.497772216796875, "global_step": 390623, "epoch": 2325} {"train_loss": -12.276300430297852, "global_step": 390624, "epoch": 2325} {"train_loss": -12.5684814453125, "global_step": 390625, "epoch": 2325} {"train_loss": -12.357335090637207, "global_step": 390626, "epoch": 2325} {"train_loss": -12.319465637207031, "global_step": 390627, "epoch": 2325} {"train_loss": -12.334613800048828, "global_step": 390628, "epoch": 2325} {"train_loss": -12.143558502197266, "global_step": 390629, "epoch": 2325} {"train_loss": -12.668899536132812, "global_step": 390630, "epoch": 2325} {"train_loss": -11.99393367767334, "global_step": 390631, "epoch": 2325} {"train_loss": -12.300950050354004, "global_step": 390632, "epoch": 2325} {"train_loss": -12.268290519714355, "global_step": 390633, "epoch": 2325} {"train_loss": -12.5576810836792, "global_step": 390634, "epoch": 2325} {"train_loss": -12.78166389465332, "global_step": 390635, "epoch": 2325} {"train_loss": -12.667531967163086, "global_step": 390636, "epoch": 2325} {"train_loss": -12.635943412780762, "global_step": 390637, "epoch": 2325} {"train_loss": -12.73396110534668, "global_step": 390638, "epoch": 2325} {"train_loss": -12.710121154785156, "global_step": 390639, "epoch": 2325} {"train_loss": -12.82962417602539, "global_step": 390640, "epoch": 2325} {"train_loss": -12.654876708984375, "global_step": 390641, "epoch": 2325} {"train_loss": -12.796796798706055, "global_step": 390642, "epoch": 2325} {"train_loss": -12.700244903564453, "global_step": 390643, "epoch": 2325} {"train_loss": -12.923917770385742, "global_step": 390644, "epoch": 2325} {"train_loss": -12.866180419921875, "global_step": 390645, "epoch": 2325} {"train_loss": -12.627668380737305, "global_step": 390646, "epoch": 2325} {"train_loss": -12.680334091186523, "global_step": 390647, "epoch": 2325} {"train_loss": -12.833049774169922, "global_step": 390648, "epoch": 2325} {"train_loss": -12.47408676147461, "global_step": 390649, "epoch": 2325} {"train_loss": -12.53114128112793, "global_step": 390650, "epoch": 2325} {"train_loss": -12.689104080200195, "global_step": 390651, "epoch": 2325} {"train_loss": -12.64710807800293, "global_step": 390652, "epoch": 2325} {"train_loss": -12.3787841796875, "global_step": 390653, "epoch": 2325} {"train_loss": -12.885346412658691, "global_step": 390654, "epoch": 2325} {"train_loss": -12.829118728637695, "global_step": 390655, "epoch": 2325} {"train_loss": -12.580763816833496, "global_step": 390656, "epoch": 2325} {"train_loss": -12.223526000976562, "global_step": 390657, "epoch": 2325} {"train_loss": -12.4373779296875, "global_step": 390658, "epoch": 2325} {"train_loss": -12.551258087158203, "global_step": 390659, "epoch": 2325} {"train_loss": -12.894747734069824, "global_step": 390660, "epoch": 2325} {"train_loss": -12.712706565856934, "global_step": 390661, "epoch": 2325} {"train_loss": -12.347488403320312, "global_step": 390662, "epoch": 2325} {"train_loss": -12.559813499450684, "global_step": 390663, "epoch": 2325} {"train_loss": -12.375811576843262, "global_step": 390664, "epoch": 2325} {"train_loss": -12.386383056640625, "global_step": 390665, "epoch": 2325} {"train_loss": -12.097722053527832, "global_step": 390666, "epoch": 2325} {"train_loss": -12.159843444824219, "global_step": 390667, "epoch": 2325} {"train_loss": -12.076932907104492, "global_step": 390668, "epoch": 2325} {"train_loss": -12.463438034057617, "global_step": 390669, "epoch": 2325} {"train_loss": -12.236729621887207, "global_step": 390670, "epoch": 2325} {"train_loss": -12.067785263061523, "global_step": 390671, "epoch": 2325} {"train_loss": -12.094120979309082, "global_step": 390672, "epoch": 2325} {"train_loss": -11.399198532104492, "global_step": 390673, "epoch": 2325} {"train_loss": -11.817298889160156, "global_step": 390674, "epoch": 2325} {"train_loss": -11.580517768859863, "global_step": 390675, "epoch": 2325} {"train_loss": -11.729592323303223, "global_step": 390676, "epoch": 2325} {"train_loss": -11.998509407043457, "global_step": 390677, "epoch": 2325} {"train_loss": -11.478118896484375, "global_step": 390678, "epoch": 2325} {"train_loss": -12.35629653930664, "global_step": 390679, "epoch": 2325} {"train_loss": -11.401254653930664, "global_step": 390680, "epoch": 2325} {"train_loss": -12.299375534057617, "global_step": 390681, "epoch": 2325} {"train_loss": -11.892181396484375, "global_step": 390682, "epoch": 2325} {"train_loss": -11.563112258911133, "global_step": 390683, "epoch": 2325} {"train_loss": -11.501770973205566, "global_step": 390684, "epoch": 2325} {"train_loss": -12.167398452758789, "global_step": 390685, "epoch": 2325} {"train_loss": -12.05345344543457, "global_step": 390686, "epoch": 2325} {"train_loss": -12.004961967468262, "global_step": 390687, "epoch": 2325} {"train_loss": -11.765387535095215, "global_step": 390688, "epoch": 2325} {"train_loss": -11.312108993530273, "global_step": 390689, "epoch": 2325} {"train_loss": -12.37852954864502, "global_step": 390690, "epoch": 2325} {"train_loss": -11.181497573852539, "global_step": 390691, "epoch": 2325} {"train_loss": -11.828377723693848, "global_step": 390692, "epoch": 2325} {"train_loss": -12.224237442016602, "global_step": 390693, "epoch": 2325} {"train_loss": -11.56233024597168, "global_step": 390694, "epoch": 2325} {"train_loss": -12.283175468444824, "global_step": 390695, "epoch": 2325} {"train_loss": -12.174124717712402, "global_step": 390696, "epoch": 2325} {"train_loss": -11.187963485717773, "global_step": 390697, "epoch": 2325} {"train_loss": -12.363723754882812, "global_step": 390698, "epoch": 2325} {"train_loss": -11.385839462280273, "global_step": 390699, "epoch": 2325} {"train_loss": -11.165279388427734, "global_step": 390700, "epoch": 2325} {"train_loss": -11.859140396118164, "global_step": 390701, "epoch": 2325} {"train_loss": -12.128069877624512, "global_step": 390702, "epoch": 2325} {"train_loss": -11.82795524597168, "global_step": 390703, "epoch": 2325} {"train_loss": -12.192167282104492, "global_step": 390704, "epoch": 2325} {"train_loss": -9.837621688842773, "global_step": 390705, "epoch": 2325} {"train_loss": -11.88753604888916, "global_step": 390706, "epoch": 2325} {"train_loss": -9.928436279296875, "global_step": 390707, "epoch": 2325} {"train_loss": -10.378303527832031, "global_step": 390708, "epoch": 2325} {"train_loss": -9.707966804504395, "global_step": 390709, "epoch": 2325} {"train_loss": -10.32043743133545, "global_step": 390710, "epoch": 2325} {"train_loss": -8.674125671386719, "global_step": 390711, "epoch": 2325} {"train_loss": -10.532546997070312, "global_step": 390712, "epoch": 2325} {"train_loss": -8.344451904296875, "global_step": 390713, "epoch": 2325} {"train_loss": -11.333059310913086, "global_step": 390714, "epoch": 2325} {"train_loss": -8.562339782714844, "global_step": 390715, "epoch": 2325} {"train_loss": -8.294326782226562, "global_step": 390716, "epoch": 2325} {"train_loss": -11.372945785522461, "global_step": 390717, "epoch": 2325} {"train_loss": -7.230562210083008, "global_step": 390718, "epoch": 2325} {"train_loss": -9.60278606414795, "global_step": 390719, "epoch": 2325} {"train_loss": -9.120203971862793, "global_step": 390720, "epoch": 2325} {"train_loss": -9.463767051696777, "global_step": 390721, "epoch": 2325} {"train_loss": -9.134031295776367, "global_step": 390722, "epoch": 2325} {"train_loss": -7.9199652671813965, "global_step": 390723, "epoch": 2325} {"train_loss": -9.748210906982422, "global_step": 390724, "epoch": 2325} {"train_loss": -10.586071014404297, "global_step": 390725, "epoch": 2325} {"train_loss": -9.25071907043457, "global_step": 390726, "epoch": 2325} {"train_loss": -10.654900550842285, "global_step": 390727, "epoch": 2325} {"train_loss": -9.144979476928711, "global_step": 390728, "epoch": 2325} {"train_loss": -10.752901077270508, "global_step": 390729, "epoch": 2325} {"train_loss": -10.961528778076172, "global_step": 390730, "epoch": 2325} {"train_loss": -11.331275939941406, "global_step": 390731, "epoch": 2325} {"train_loss": -10.585370063781738, "global_step": 390732, "epoch": 2325} {"train_loss": -11.34060287475586, "global_step": 390733, "epoch": 2325} {"train_loss": -10.22021770477295, "global_step": 390734, "epoch": 2325} {"train_loss": -10.499853134155273, "global_step": 390735, "epoch": 2325} {"train_loss": -11.266571998596191, "global_step": 390736, "epoch": 2325} {"train_loss": -11.277728080749512, "global_step": 390737, "epoch": 2325} {"train_loss": -11.725793838500977, "global_step": 390738, "epoch": 2325} {"train_loss": -11.341670989990234, "global_step": 390739, "epoch": 2325} {"train_loss": -11.335445404052734, "global_step": 390740, "epoch": 2325} {"train_loss": -11.497310638427734, "global_step": 390741, "epoch": 2325} {"train_loss": -11.834571838378906, "global_step": 390742, "epoch": 2325} {"train_loss": -11.050947189331055, "global_step": 390743, "epoch": 2325} {"train_loss": -12.012969970703125, "global_step": 390744, "epoch": 2325} {"train_loss": -11.421876907348633, "global_step": 390745, "epoch": 2325} {"train_loss": -10.923952102661133, "global_step": 390746, "epoch": 2325} {"train_loss": -11.947432518005371, "global_step": 390747, "epoch": 2325} {"train_loss": -11.161520957946777, "global_step": 390748, "epoch": 2325} {"train_loss": -11.45855712890625, "global_step": 390749, "epoch": 2325} {"train_loss": -11.686049461364746, "global_step": 390750, "epoch": 2325} {"train_loss": -11.702415466308594, "global_step": 390751, "epoch": 2325} {"train_loss": -11.709259033203125, "global_step": 390752, "epoch": 2325} {"train_loss": -11.84951400756836, "global_step": 390753, "epoch": 2325} {"train_loss": -11.790266990661621, "global_step": 390754, "epoch": 2325} {"train_loss": -11.157232284545898, "global_step": 390755, "epoch": 2325} {"train_loss": -12.222160339355469, "global_step": 390756, "epoch": 2325} {"train_loss": -11.634866714477539, "global_step": 390757, "epoch": 2325} {"train_loss": -11.950300216674805, "global_step": 390758, "epoch": 2325} {"train_loss": -12.105485916137695, "global_step": 390759, "epoch": 2325} {"train_loss": -11.635857582092285, "global_step": 390760, "epoch": 2325} {"train_loss": -12.000743865966797, "global_step": 390761, "epoch": 2325} {"train_loss": -12.00529670715332, "global_step": 390762, "epoch": 2325} {"train_loss": -11.799248695373535, "global_step": 390763, "epoch": 2325} {"train_loss": -12.315454483032227, "global_step": 390764, "epoch": 2325} {"train_loss": -12.172159194946289, "global_step": 390765, "epoch": 2325} {"train_loss": -12.198266983032227, "global_step": 390766, "epoch": 2325} {"train_loss": -11.733939554010119, "global_step": 390767, "epoch": 2325, "val_loss": 292755.75, "train_action_mse_error": 1.7504234313964844} {"train_loss": -12.025391578674316, "global_step": 390768, "epoch": 2326} {"train_loss": -11.973067283630371, "global_step": 390769, "epoch": 2326} {"train_loss": -11.653558731079102, "global_step": 390770, "epoch": 2326} {"train_loss": -12.167190551757812, "global_step": 390771, "epoch": 2326} {"train_loss": -12.082773208618164, "global_step": 390772, "epoch": 2326} {"train_loss": -12.197113990783691, "global_step": 390773, "epoch": 2326} {"train_loss": -12.476160049438477, "global_step": 390774, "epoch": 2326} {"train_loss": -12.210380554199219, "global_step": 390775, "epoch": 2326} {"train_loss": -12.128988265991211, "global_step": 390776, "epoch": 2326} {"train_loss": -12.014968872070312, "global_step": 390777, "epoch": 2326} {"train_loss": -12.064502716064453, "global_step": 390778, "epoch": 2326} {"train_loss": -12.27581787109375, "global_step": 390779, "epoch": 2326} {"train_loss": -12.278465270996094, "global_step": 390780, "epoch": 2326} {"train_loss": -12.40013313293457, "global_step": 390781, "epoch": 2326} {"train_loss": -12.297135353088379, "global_step": 390782, "epoch": 2326} {"train_loss": -12.339445114135742, "global_step": 390783, "epoch": 2326} {"train_loss": -12.190670013427734, "global_step": 390784, "epoch": 2326} {"train_loss": -12.254142761230469, "global_step": 390785, "epoch": 2326} {"train_loss": -12.394725799560547, "global_step": 390786, "epoch": 2326} {"train_loss": -12.279781341552734, "global_step": 390787, "epoch": 2326} {"train_loss": -12.521086692810059, "global_step": 390788, "epoch": 2326} {"train_loss": -12.131891250610352, "global_step": 390789, "epoch": 2326} {"train_loss": -12.402898788452148, "global_step": 390790, "epoch": 2326} {"train_loss": -12.21876335144043, "global_step": 390791, "epoch": 2326} {"train_loss": -12.539203643798828, "global_step": 390792, "epoch": 2326} {"train_loss": -12.191459655761719, "global_step": 390793, "epoch": 2326} {"train_loss": -12.51915454864502, "global_step": 390794, "epoch": 2326} {"train_loss": -12.095898628234863, "global_step": 390795, "epoch": 2326} {"train_loss": -12.463174819946289, "global_step": 390796, "epoch": 2326} {"train_loss": -12.118085861206055, "global_step": 390797, "epoch": 2326} {"train_loss": -12.371257781982422, "global_step": 390798, "epoch": 2326} {"train_loss": -12.44394302368164, "global_step": 390799, "epoch": 2326} {"train_loss": -12.450884819030762, "global_step": 390800, "epoch": 2326} {"train_loss": -12.20704460144043, "global_step": 390801, "epoch": 2326} {"train_loss": -12.33108139038086, "global_step": 390802, "epoch": 2326} {"train_loss": -12.328886032104492, "global_step": 390803, "epoch": 2326} {"train_loss": -12.613813400268555, "global_step": 390804, "epoch": 2326} {"train_loss": -12.300949096679688, "global_step": 390805, "epoch": 2326} {"train_loss": -12.275899887084961, "global_step": 390806, "epoch": 2326} {"train_loss": -12.590897560119629, "global_step": 390807, "epoch": 2326} {"train_loss": -12.609477996826172, "global_step": 390808, "epoch": 2326} {"train_loss": -12.602441787719727, "global_step": 390809, "epoch": 2326} {"train_loss": -12.336454391479492, "global_step": 390810, "epoch": 2326} {"train_loss": -12.662360191345215, "global_step": 390811, "epoch": 2326} {"train_loss": -12.696965217590332, "global_step": 390812, "epoch": 2326} {"train_loss": -12.647464752197266, "global_step": 390813, "epoch": 2326} {"train_loss": -12.356090545654297, "global_step": 390814, "epoch": 2326} {"train_loss": -12.343971252441406, "global_step": 390815, "epoch": 2326} {"train_loss": -12.0618896484375, "global_step": 390816, "epoch": 2326} {"train_loss": -12.247747421264648, "global_step": 390817, "epoch": 2326} {"train_loss": -12.284398078918457, "global_step": 390818, "epoch": 2326} {"train_loss": -12.453880310058594, "global_step": 390819, "epoch": 2326} {"train_loss": -12.60928726196289, "global_step": 390820, "epoch": 2326} {"train_loss": -12.532480239868164, "global_step": 390821, "epoch": 2326} {"train_loss": -12.661584854125977, "global_step": 390822, "epoch": 2326} {"train_loss": -12.513264656066895, "global_step": 390823, "epoch": 2326} {"train_loss": -12.725064277648926, "global_step": 390824, "epoch": 2326} {"train_loss": -12.284061431884766, "global_step": 390825, "epoch": 2326} {"train_loss": -12.537516593933105, "global_step": 390826, "epoch": 2326} {"train_loss": -12.540477752685547, "global_step": 390827, "epoch": 2326} {"train_loss": -12.459449768066406, "global_step": 390828, "epoch": 2326} {"train_loss": -12.720137596130371, "global_step": 390829, "epoch": 2326} {"train_loss": -12.593799591064453, "global_step": 390830, "epoch": 2326} {"train_loss": -12.620278358459473, "global_step": 390831, "epoch": 2326} {"train_loss": -12.82164192199707, "global_step": 390832, "epoch": 2326} {"train_loss": -12.667509078979492, "global_step": 390833, "epoch": 2326} {"train_loss": -12.544212341308594, "global_step": 390834, "epoch": 2326} {"train_loss": -11.754657745361328, "global_step": 390835, "epoch": 2326} {"train_loss": -12.772130966186523, "global_step": 390836, "epoch": 2326} {"train_loss": -12.072836875915527, "global_step": 390837, "epoch": 2326} {"train_loss": -11.924171447753906, "global_step": 390838, "epoch": 2326} {"train_loss": -12.591983795166016, "global_step": 390839, "epoch": 2326} {"train_loss": -12.397994995117188, "global_step": 390840, "epoch": 2326} {"train_loss": -11.510600090026855, "global_step": 390841, "epoch": 2326} {"train_loss": -11.565214157104492, "global_step": 390842, "epoch": 2326} {"train_loss": -12.098722457885742, "global_step": 390843, "epoch": 2326} {"train_loss": -12.484777450561523, "global_step": 390844, "epoch": 2326} {"train_loss": -12.100175857543945, "global_step": 390845, "epoch": 2326} {"train_loss": -11.880127906799316, "global_step": 390846, "epoch": 2326} {"train_loss": -11.792041778564453, "global_step": 390847, "epoch": 2326} {"train_loss": -12.38742446899414, "global_step": 390848, "epoch": 2326} {"train_loss": -12.619291305541992, "global_step": 390849, "epoch": 2326} {"train_loss": -12.240195274353027, "global_step": 390850, "epoch": 2326} {"train_loss": -12.382612228393555, "global_step": 390851, "epoch": 2326} {"train_loss": -12.296348571777344, "global_step": 390852, "epoch": 2326} {"train_loss": -11.72920036315918, "global_step": 390853, "epoch": 2326} {"train_loss": -12.29789924621582, "global_step": 390854, "epoch": 2326} {"train_loss": -12.571310043334961, "global_step": 390855, "epoch": 2326} {"train_loss": -12.567423820495605, "global_step": 390856, "epoch": 2326} {"train_loss": -12.358125686645508, "global_step": 390857, "epoch": 2326} {"train_loss": -11.682150840759277, "global_step": 390858, "epoch": 2326} {"train_loss": -11.902997970581055, "global_step": 390859, "epoch": 2326} {"train_loss": -12.201998710632324, "global_step": 390860, "epoch": 2326} {"train_loss": -12.045208930969238, "global_step": 390861, "epoch": 2326} {"train_loss": -12.501303672790527, "global_step": 390862, "epoch": 2326} {"train_loss": -11.953805923461914, "global_step": 390863, "epoch": 2326} {"train_loss": -12.314395904541016, "global_step": 390864, "epoch": 2326} {"train_loss": -11.672547340393066, "global_step": 390865, "epoch": 2326} {"train_loss": -12.231178283691406, "global_step": 390866, "epoch": 2326} {"train_loss": -11.696505546569824, "global_step": 390867, "epoch": 2326} {"train_loss": -11.155426025390625, "global_step": 390868, "epoch": 2326} {"train_loss": -11.387451171875, "global_step": 390869, "epoch": 2326} {"train_loss": -12.314391136169434, "global_step": 390870, "epoch": 2326} {"train_loss": -11.45582389831543, "global_step": 390871, "epoch": 2326} {"train_loss": -10.219186782836914, "global_step": 390872, "epoch": 2326} {"train_loss": -12.068133354187012, "global_step": 390873, "epoch": 2326} {"train_loss": -11.190781593322754, "global_step": 390874, "epoch": 2326} {"train_loss": -11.040355682373047, "global_step": 390875, "epoch": 2326} {"train_loss": -11.26014232635498, "global_step": 390876, "epoch": 2326} {"train_loss": -12.139595985412598, "global_step": 390877, "epoch": 2326} {"train_loss": -11.040048599243164, "global_step": 390878, "epoch": 2326} {"train_loss": -11.879453659057617, "global_step": 390879, "epoch": 2326} {"train_loss": -11.587711334228516, "global_step": 390880, "epoch": 2326} {"train_loss": -11.915552139282227, "global_step": 390881, "epoch": 2326} {"train_loss": -11.544134140014648, "global_step": 390882, "epoch": 2326} {"train_loss": -12.54054069519043, "global_step": 390883, "epoch": 2326} {"train_loss": -11.681529998779297, "global_step": 390884, "epoch": 2326} {"train_loss": -11.895807266235352, "global_step": 390885, "epoch": 2326} {"train_loss": -12.059563636779785, "global_step": 390886, "epoch": 2326} {"train_loss": -11.411463737487793, "global_step": 390887, "epoch": 2326} {"train_loss": -11.64383316040039, "global_step": 390888, "epoch": 2326} {"train_loss": -11.426111221313477, "global_step": 390889, "epoch": 2326} {"train_loss": -12.071327209472656, "global_step": 390890, "epoch": 2326} {"train_loss": -11.544065475463867, "global_step": 390891, "epoch": 2326} {"train_loss": -12.181188583374023, "global_step": 390892, "epoch": 2326} {"train_loss": -11.550621032714844, "global_step": 390893, "epoch": 2326} {"train_loss": -11.980234146118164, "global_step": 390894, "epoch": 2326} {"train_loss": -11.33709716796875, "global_step": 390895, "epoch": 2326} {"train_loss": -11.462645530700684, "global_step": 390896, "epoch": 2326} {"train_loss": -11.528526306152344, "global_step": 390897, "epoch": 2326} {"train_loss": -11.896324157714844, "global_step": 390898, "epoch": 2326} {"train_loss": -11.906171798706055, "global_step": 390899, "epoch": 2326} {"train_loss": -12.08889102935791, "global_step": 390900, "epoch": 2326} {"train_loss": -11.887014389038086, "global_step": 390901, "epoch": 2326} {"train_loss": -11.963525772094727, "global_step": 390902, "epoch": 2326} {"train_loss": -12.024456977844238, "global_step": 390903, "epoch": 2326} {"train_loss": -12.328252792358398, "global_step": 390904, "epoch": 2326} {"train_loss": -12.085800170898438, "global_step": 390905, "epoch": 2326} {"train_loss": -12.136468887329102, "global_step": 390906, "epoch": 2326} {"train_loss": -12.08900260925293, "global_step": 390907, "epoch": 2326} {"train_loss": -11.901829719543457, "global_step": 390908, "epoch": 2326} {"train_loss": -12.363033294677734, "global_step": 390909, "epoch": 2326} {"train_loss": -12.163915634155273, "global_step": 390910, "epoch": 2326} {"train_loss": -12.62142562866211, "global_step": 390911, "epoch": 2326} {"train_loss": -12.35694694519043, "global_step": 390912, "epoch": 2326} {"train_loss": -12.185145378112793, "global_step": 390913, "epoch": 2326} {"train_loss": -12.630005836486816, "global_step": 390914, "epoch": 2326} {"train_loss": -12.405607223510742, "global_step": 390915, "epoch": 2326} {"train_loss": -12.191566467285156, "global_step": 390916, "epoch": 2326} {"train_loss": -12.398160934448242, "global_step": 390917, "epoch": 2326} {"train_loss": -12.393838882446289, "global_step": 390918, "epoch": 2326} {"train_loss": -12.024295806884766, "global_step": 390919, "epoch": 2326} {"train_loss": -12.645393371582031, "global_step": 390920, "epoch": 2326} {"train_loss": -11.983175277709961, "global_step": 390921, "epoch": 2326} {"train_loss": -12.049397468566895, "global_step": 390922, "epoch": 2326} {"train_loss": -12.200499534606934, "global_step": 390923, "epoch": 2326} {"train_loss": -12.070225715637207, "global_step": 390924, "epoch": 2326} {"train_loss": -11.794018745422363, "global_step": 390925, "epoch": 2326} {"train_loss": -12.257979393005371, "global_step": 390926, "epoch": 2326} {"train_loss": -12.122312545776367, "global_step": 390927, "epoch": 2326} {"train_loss": -11.424786567687988, "global_step": 390928, "epoch": 2326} {"train_loss": -11.874984741210938, "global_step": 390929, "epoch": 2326} {"train_loss": -11.912497520446777, "global_step": 390930, "epoch": 2326} {"train_loss": -12.139986991882324, "global_step": 390931, "epoch": 2326} {"train_loss": -12.190630912780762, "global_step": 390932, "epoch": 2326} {"train_loss": -12.67863941192627, "global_step": 390933, "epoch": 2326} {"train_loss": -12.212279319763184, "global_step": 390934, "epoch": 2326} {"train_loss": -12.142831666128975, "global_step": 390935, "epoch": 2326, "val_loss": 295151.75} {"train_loss": -12.486620903015137, "global_step": 390936, "epoch": 2327} {"train_loss": -12.362831115722656, "global_step": 390937, "epoch": 2327} {"train_loss": -12.122130393981934, "global_step": 390938, "epoch": 2327} {"train_loss": -12.362464904785156, "global_step": 390939, "epoch": 2327} {"train_loss": -12.380643844604492, "global_step": 390940, "epoch": 2327} {"train_loss": -12.543496131896973, "global_step": 390941, "epoch": 2327} {"train_loss": -12.40572738647461, "global_step": 390942, "epoch": 2327} {"train_loss": -12.628471374511719, "global_step": 390943, "epoch": 2327} {"train_loss": -12.41225528717041, "global_step": 390944, "epoch": 2327} {"train_loss": -12.482097625732422, "global_step": 390945, "epoch": 2327} {"train_loss": -12.364029884338379, "global_step": 390946, "epoch": 2327} {"train_loss": -11.990739822387695, "global_step": 390947, "epoch": 2327} {"train_loss": -12.273785591125488, "global_step": 390948, "epoch": 2327} {"train_loss": -12.447663307189941, "global_step": 390949, "epoch": 2327} {"train_loss": -12.105114936828613, "global_step": 390950, "epoch": 2327} {"train_loss": -12.388641357421875, "global_step": 390951, "epoch": 2327} {"train_loss": -12.490287780761719, "global_step": 390952, "epoch": 2327} {"train_loss": -12.650251388549805, "global_step": 390953, "epoch": 2327} {"train_loss": -12.006460189819336, "global_step": 390954, "epoch": 2327} {"train_loss": -12.396200180053711, "global_step": 390955, "epoch": 2327} {"train_loss": -12.201363563537598, "global_step": 390956, "epoch": 2327} {"train_loss": -12.474303245544434, "global_step": 390957, "epoch": 2327} {"train_loss": -12.511431694030762, "global_step": 390958, "epoch": 2327} {"train_loss": -12.613832473754883, "global_step": 390959, "epoch": 2327} {"train_loss": -12.258392333984375, "global_step": 390960, "epoch": 2327} {"train_loss": -12.672801971435547, "global_step": 390961, "epoch": 2327} {"train_loss": -12.274306297302246, "global_step": 390962, "epoch": 2327} {"train_loss": -12.328648567199707, "global_step": 390963, "epoch": 2327} {"train_loss": -11.998312950134277, "global_step": 390964, "epoch": 2327} {"train_loss": -12.364251136779785, "global_step": 390965, "epoch": 2327} {"train_loss": -12.34840202331543, "global_step": 390966, "epoch": 2327} {"train_loss": -12.25607681274414, "global_step": 390967, "epoch": 2327} {"train_loss": -12.506803512573242, "global_step": 390968, "epoch": 2327} {"train_loss": -12.406187057495117, "global_step": 390969, "epoch": 2327} {"train_loss": -12.045738220214844, "global_step": 390970, "epoch": 2327} {"train_loss": -12.632364273071289, "global_step": 390971, "epoch": 2327} {"train_loss": -12.245656967163086, "global_step": 390972, "epoch": 2327} {"train_loss": -12.49760627746582, "global_step": 390973, "epoch": 2327} {"train_loss": -12.637447357177734, "global_step": 390974, "epoch": 2327} {"train_loss": -12.09213924407959, "global_step": 390975, "epoch": 2327} {"train_loss": -12.681938171386719, "global_step": 390976, "epoch": 2327} {"train_loss": -12.432538986206055, "global_step": 390977, "epoch": 2327} {"train_loss": -12.580070495605469, "global_step": 390978, "epoch": 2327} {"train_loss": -12.250818252563477, "global_step": 390979, "epoch": 2327} {"train_loss": -12.626668930053711, "global_step": 390980, "epoch": 2327} {"train_loss": -11.727134704589844, "global_step": 390981, "epoch": 2327} {"train_loss": -12.882223129272461, "global_step": 390982, "epoch": 2327} {"train_loss": -12.409369468688965, "global_step": 390983, "epoch": 2327} {"train_loss": -12.686622619628906, "global_step": 390984, "epoch": 2327} {"train_loss": -12.596770286560059, "global_step": 390985, "epoch": 2327} {"train_loss": -12.567071914672852, "global_step": 390986, "epoch": 2327} {"train_loss": -12.0830078125, "global_step": 390987, "epoch": 2327} {"train_loss": -12.478111267089844, "global_step": 390988, "epoch": 2327} {"train_loss": -11.969093322753906, "global_step": 390989, "epoch": 2327} {"train_loss": -12.596879959106445, "global_step": 390990, "epoch": 2327} {"train_loss": -12.151546478271484, "global_step": 390991, "epoch": 2327} {"train_loss": -12.224870681762695, "global_step": 390992, "epoch": 2327} {"train_loss": -11.407422065734863, "global_step": 390993, "epoch": 2327} {"train_loss": -11.20077133178711, "global_step": 390994, "epoch": 2327} {"train_loss": -12.073698043823242, "global_step": 390995, "epoch": 2327} {"train_loss": -11.115333557128906, "global_step": 390996, "epoch": 2327} {"train_loss": -11.38780403137207, "global_step": 390997, "epoch": 2327} {"train_loss": -12.214781761169434, "global_step": 390998, "epoch": 2327} {"train_loss": -12.018369674682617, "global_step": 390999, "epoch": 2327} {"train_loss": -11.007153511047363, "global_step": 391000, "epoch": 2327} {"train_loss": -11.327311515808105, "global_step": 391001, "epoch": 2327} {"train_loss": -11.591920852661133, "global_step": 391002, "epoch": 2327} {"train_loss": -11.072041511535645, "global_step": 391003, "epoch": 2327} {"train_loss": -10.707889556884766, "global_step": 391004, "epoch": 2327} {"train_loss": -11.54476547241211, "global_step": 391005, "epoch": 2327} {"train_loss": -11.012502670288086, "global_step": 391006, "epoch": 2327} {"train_loss": -11.62432861328125, "global_step": 391007, "epoch": 2327} {"train_loss": -10.972675323486328, "global_step": 391008, "epoch": 2327} {"train_loss": -11.866901397705078, "global_step": 391009, "epoch": 2327} {"train_loss": -12.271875381469727, "global_step": 391010, "epoch": 2327} {"train_loss": -11.78071117401123, "global_step": 391011, "epoch": 2327} {"train_loss": -11.889954566955566, "global_step": 391012, "epoch": 2327} {"train_loss": -12.077613830566406, "global_step": 391013, "epoch": 2327} {"train_loss": -11.519506454467773, "global_step": 391014, "epoch": 2327} {"train_loss": -12.0734224319458, "global_step": 391015, "epoch": 2327} {"train_loss": -11.047526359558105, "global_step": 391016, "epoch": 2327} {"train_loss": -11.245574951171875, "global_step": 391017, "epoch": 2327} {"train_loss": -11.125898361206055, "global_step": 391018, "epoch": 2327} {"train_loss": -11.665193557739258, "global_step": 391019, "epoch": 2327} {"train_loss": -11.099143981933594, "global_step": 391020, "epoch": 2327} {"train_loss": -12.021125793457031, "global_step": 391021, "epoch": 2327} {"train_loss": -11.677582740783691, "global_step": 391022, "epoch": 2327} {"train_loss": -12.050586700439453, "global_step": 391023, "epoch": 2327} {"train_loss": -11.713968276977539, "global_step": 391024, "epoch": 2327} {"train_loss": -12.182594299316406, "global_step": 391025, "epoch": 2327} {"train_loss": -12.056255340576172, "global_step": 391026, "epoch": 2327} {"train_loss": -11.996477127075195, "global_step": 391027, "epoch": 2327} {"train_loss": -12.39065170288086, "global_step": 391028, "epoch": 2327} {"train_loss": -12.207503318786621, "global_step": 391029, "epoch": 2327} {"train_loss": -12.366687774658203, "global_step": 391030, "epoch": 2327} {"train_loss": -12.223636627197266, "global_step": 391031, "epoch": 2327} {"train_loss": -12.568634033203125, "global_step": 391032, "epoch": 2327} {"train_loss": -12.316336631774902, "global_step": 391033, "epoch": 2327} {"train_loss": -12.546600341796875, "global_step": 391034, "epoch": 2327} {"train_loss": -12.101081848144531, "global_step": 391035, "epoch": 2327} {"train_loss": -12.246488571166992, "global_step": 391036, "epoch": 2327} {"train_loss": -12.458646774291992, "global_step": 391037, "epoch": 2327} {"train_loss": -11.885068893432617, "global_step": 391038, "epoch": 2327} {"train_loss": -12.635398864746094, "global_step": 391039, "epoch": 2327} {"train_loss": -12.3147611618042, "global_step": 391040, "epoch": 2327} {"train_loss": -12.404214859008789, "global_step": 391041, "epoch": 2327} {"train_loss": -12.276643753051758, "global_step": 391042, "epoch": 2327} {"train_loss": -12.651053428649902, "global_step": 391043, "epoch": 2327} {"train_loss": -12.452241897583008, "global_step": 391044, "epoch": 2327} {"train_loss": -12.411176681518555, "global_step": 391045, "epoch": 2327} {"train_loss": -12.038599967956543, "global_step": 391046, "epoch": 2327} {"train_loss": -12.284546852111816, "global_step": 391047, "epoch": 2327} {"train_loss": -12.294230461120605, "global_step": 391048, "epoch": 2327} {"train_loss": -11.63403606414795, "global_step": 391049, "epoch": 2327} {"train_loss": -12.28139877319336, "global_step": 391050, "epoch": 2327} {"train_loss": -11.801229476928711, "global_step": 391051, "epoch": 2327} {"train_loss": -12.381160736083984, "global_step": 391052, "epoch": 2327} {"train_loss": -12.106201171875, "global_step": 391053, "epoch": 2327} {"train_loss": -12.2991943359375, "global_step": 391054, "epoch": 2327} {"train_loss": -11.703888893127441, "global_step": 391055, "epoch": 2327} {"train_loss": -12.144303321838379, "global_step": 391056, "epoch": 2327} {"train_loss": -11.231154441833496, "global_step": 391057, "epoch": 2327} {"train_loss": -12.244575500488281, "global_step": 391058, "epoch": 2327} {"train_loss": -11.841766357421875, "global_step": 391059, "epoch": 2327} {"train_loss": -12.38000202178955, "global_step": 391060, "epoch": 2327} {"train_loss": -12.007156372070312, "global_step": 391061, "epoch": 2327} {"train_loss": -12.235535621643066, "global_step": 391062, "epoch": 2327} {"train_loss": -12.206205368041992, "global_step": 391063, "epoch": 2327} {"train_loss": -12.149190902709961, "global_step": 391064, "epoch": 2327} {"train_loss": -12.391357421875, "global_step": 391065, "epoch": 2327} {"train_loss": -12.265260696411133, "global_step": 391066, "epoch": 2327} {"train_loss": -12.32347297668457, "global_step": 391067, "epoch": 2327} {"train_loss": -12.414311408996582, "global_step": 391068, "epoch": 2327} {"train_loss": -12.15544605255127, "global_step": 391069, "epoch": 2327} {"train_loss": -12.337199211120605, "global_step": 391070, "epoch": 2327} {"train_loss": -11.69540786743164, "global_step": 391071, "epoch": 2327} {"train_loss": -12.033124923706055, "global_step": 391072, "epoch": 2327} {"train_loss": -11.91983413696289, "global_step": 391073, "epoch": 2327} {"train_loss": -12.05717658996582, "global_step": 391074, "epoch": 2327} {"train_loss": -11.508231163024902, "global_step": 391075, "epoch": 2327} {"train_loss": -12.052854537963867, "global_step": 391076, "epoch": 2327} {"train_loss": -11.63143539428711, "global_step": 391077, "epoch": 2327} {"train_loss": -12.212442398071289, "global_step": 391078, "epoch": 2327} {"train_loss": -11.78057861328125, "global_step": 391079, "epoch": 2327} {"train_loss": -10.975775718688965, "global_step": 391080, "epoch": 2327} {"train_loss": -11.981941223144531, "global_step": 391081, "epoch": 2327} {"train_loss": -11.100116729736328, "global_step": 391082, "epoch": 2327} {"train_loss": -10.833219528198242, "global_step": 391083, "epoch": 2327} {"train_loss": -10.828678131103516, "global_step": 391084, "epoch": 2327} {"train_loss": -8.954090118408203, "global_step": 391085, "epoch": 2327} {"train_loss": -8.443626403808594, "global_step": 391086, "epoch": 2327} {"train_loss": -7.94807767868042, "global_step": 391087, "epoch": 2327} {"train_loss": -9.2681884765625, "global_step": 391088, "epoch": 2327} {"train_loss": -10.109162330627441, "global_step": 391089, "epoch": 2327} {"train_loss": -10.981823921203613, "global_step": 391090, "epoch": 2327} {"train_loss": -9.262447357177734, "global_step": 391091, "epoch": 2327} {"train_loss": -9.74909782409668, "global_step": 391092, "epoch": 2327} {"train_loss": -8.766731262207031, "global_step": 391093, "epoch": 2327} {"train_loss": -10.086234092712402, "global_step": 391094, "epoch": 2327} {"train_loss": -9.737475395202637, "global_step": 391095, "epoch": 2327} {"train_loss": -10.131422996520996, "global_step": 391096, "epoch": 2327} {"train_loss": -9.80079460144043, "global_step": 391097, "epoch": 2327} {"train_loss": -8.565568923950195, "global_step": 391098, "epoch": 2327} {"train_loss": -8.716331481933594, "global_step": 391099, "epoch": 2327} {"train_loss": -9.10450267791748, "global_step": 391100, "epoch": 2327} {"train_loss": -8.197919845581055, "global_step": 391101, "epoch": 2327} {"train_loss": -9.635887145996094, "global_step": 391102, "epoch": 2327} {"train_loss": -11.763850572563353, "global_step": 391103, "epoch": 2327, "val_loss": 291448.0625} {"train_loss": -9.22583293914795, "global_step": 391104, "epoch": 2328} {"train_loss": -10.123578071594238, "global_step": 391105, "epoch": 2328} {"train_loss": -10.210630416870117, "global_step": 391106, "epoch": 2328} {"train_loss": -10.077253341674805, "global_step": 391107, "epoch": 2328} {"train_loss": -10.038644790649414, "global_step": 391108, "epoch": 2328} {"train_loss": -11.324625015258789, "global_step": 391109, "epoch": 2328} {"train_loss": -10.744056701660156, "global_step": 391110, "epoch": 2328} {"train_loss": -10.561426162719727, "global_step": 391111, "epoch": 2328} {"train_loss": -11.038556098937988, "global_step": 391112, "epoch": 2328} {"train_loss": -10.836393356323242, "global_step": 391113, "epoch": 2328} {"train_loss": -10.918797492980957, "global_step": 391114, "epoch": 2328} {"train_loss": -11.661613464355469, "global_step": 391115, "epoch": 2328} {"train_loss": -10.736248016357422, "global_step": 391116, "epoch": 2328} {"train_loss": -10.94741153717041, "global_step": 391117, "epoch": 2328} {"train_loss": -11.369813919067383, "global_step": 391118, "epoch": 2328} {"train_loss": -11.186864852905273, "global_step": 391119, "epoch": 2328} {"train_loss": -11.714320182800293, "global_step": 391120, "epoch": 2328} {"train_loss": -11.725762367248535, "global_step": 391121, "epoch": 2328} {"train_loss": -11.494803428649902, "global_step": 391122, "epoch": 2328} {"train_loss": -11.796499252319336, "global_step": 391123, "epoch": 2328} {"train_loss": -11.51647663116455, "global_step": 391124, "epoch": 2328} {"train_loss": -11.347089767456055, "global_step": 391125, "epoch": 2328} {"train_loss": -11.608125686645508, "global_step": 391126, "epoch": 2328} {"train_loss": -11.66208267211914, "global_step": 391127, "epoch": 2328} {"train_loss": -11.670069694519043, "global_step": 391128, "epoch": 2328} {"train_loss": -11.669454574584961, "global_step": 391129, "epoch": 2328} {"train_loss": -11.637160301208496, "global_step": 391130, "epoch": 2328} {"train_loss": -11.623699188232422, "global_step": 391131, "epoch": 2328} {"train_loss": -12.083351135253906, "global_step": 391132, "epoch": 2328} {"train_loss": -11.92282485961914, "global_step": 391133, "epoch": 2328} {"train_loss": -11.702762603759766, "global_step": 391134, "epoch": 2328} {"train_loss": -12.19146728515625, "global_step": 391135, "epoch": 2328} {"train_loss": -11.788768768310547, "global_step": 391136, "epoch": 2328} {"train_loss": -12.084721565246582, "global_step": 391137, "epoch": 2328} {"train_loss": -11.509157180786133, "global_step": 391138, "epoch": 2328} {"train_loss": -11.714967727661133, "global_step": 391139, "epoch": 2328} {"train_loss": -11.972626686096191, "global_step": 391140, "epoch": 2328} {"train_loss": -12.277986526489258, "global_step": 391141, "epoch": 2328} {"train_loss": -11.83970832824707, "global_step": 391142, "epoch": 2328} {"train_loss": -12.349225044250488, "global_step": 391143, "epoch": 2328} {"train_loss": -12.038064956665039, "global_step": 391144, "epoch": 2328} {"train_loss": -12.146710395812988, "global_step": 391145, "epoch": 2328} {"train_loss": -12.190617561340332, "global_step": 391146, "epoch": 2328} {"train_loss": -12.296521186828613, "global_step": 391147, "epoch": 2328} {"train_loss": -12.132272720336914, "global_step": 391148, "epoch": 2328} {"train_loss": -12.052467346191406, "global_step": 391149, "epoch": 2328} {"train_loss": -12.063810348510742, "global_step": 391150, "epoch": 2328} {"train_loss": -12.265130996704102, "global_step": 391151, "epoch": 2328} {"train_loss": -12.349613189697266, "global_step": 391152, "epoch": 2328} {"train_loss": -12.36244010925293, "global_step": 391153, "epoch": 2328} {"train_loss": -12.332016944885254, "global_step": 391154, "epoch": 2328} {"train_loss": -12.237510681152344, "global_step": 391155, "epoch": 2328} {"train_loss": -12.41812801361084, "global_step": 391156, "epoch": 2328} {"train_loss": -11.874616622924805, "global_step": 391157, "epoch": 2328} {"train_loss": -12.311751365661621, "global_step": 391158, "epoch": 2328} {"train_loss": -12.125800132751465, "global_step": 391159, "epoch": 2328} {"train_loss": -12.229524612426758, "global_step": 391160, "epoch": 2328} {"train_loss": -12.074577331542969, "global_step": 391161, "epoch": 2328} {"train_loss": -12.13779067993164, "global_step": 391162, "epoch": 2328} {"train_loss": -11.961926460266113, "global_step": 391163, "epoch": 2328} {"train_loss": -11.986949920654297, "global_step": 391164, "epoch": 2328} {"train_loss": -11.957645416259766, "global_step": 391165, "epoch": 2328} {"train_loss": -12.317867279052734, "global_step": 391166, "epoch": 2328} {"train_loss": -11.74024486541748, "global_step": 391167, "epoch": 2328} {"train_loss": -12.333700180053711, "global_step": 391168, "epoch": 2328} {"train_loss": -11.788774490356445, "global_step": 391169, "epoch": 2328} {"train_loss": -12.244089126586914, "global_step": 391170, "epoch": 2328} {"train_loss": -11.997095108032227, "global_step": 391171, "epoch": 2328} {"train_loss": -12.297576904296875, "global_step": 391172, "epoch": 2328} {"train_loss": -11.538639068603516, "global_step": 391173, "epoch": 2328} {"train_loss": -12.120240211486816, "global_step": 391174, "epoch": 2328} {"train_loss": -11.64043140411377, "global_step": 391175, "epoch": 2328} {"train_loss": -11.919989585876465, "global_step": 391176, "epoch": 2328} {"train_loss": -12.028726577758789, "global_step": 391177, "epoch": 2328} {"train_loss": -11.82918930053711, "global_step": 391178, "epoch": 2328} {"train_loss": -12.361801147460938, "global_step": 391179, "epoch": 2328} {"train_loss": -11.569833755493164, "global_step": 391180, "epoch": 2328} {"train_loss": -12.36599349975586, "global_step": 391181, "epoch": 2328} {"train_loss": -11.815413475036621, "global_step": 391182, "epoch": 2328} {"train_loss": -12.54135513305664, "global_step": 391183, "epoch": 2328} {"train_loss": -11.656099319458008, "global_step": 391184, "epoch": 2328} {"train_loss": -12.433961868286133, "global_step": 391185, "epoch": 2328} {"train_loss": -12.003986358642578, "global_step": 391186, "epoch": 2328} {"train_loss": -12.155309677124023, "global_step": 391187, "epoch": 2328} {"train_loss": -12.021312713623047, "global_step": 391188, "epoch": 2328} {"train_loss": -12.186882019042969, "global_step": 391189, "epoch": 2328} {"train_loss": -12.248861312866211, "global_step": 391190, "epoch": 2328} {"train_loss": -11.902565002441406, "global_step": 391191, "epoch": 2328} {"train_loss": -11.94140625, "global_step": 391192, "epoch": 2328} {"train_loss": -11.986170768737793, "global_step": 391193, "epoch": 2328} {"train_loss": -12.145503997802734, "global_step": 391194, "epoch": 2328} {"train_loss": -12.478964805603027, "global_step": 391195, "epoch": 2328} {"train_loss": -12.16600227355957, "global_step": 391196, "epoch": 2328} {"train_loss": -12.321870803833008, "global_step": 391197, "epoch": 2328} {"train_loss": -12.294201850891113, "global_step": 391198, "epoch": 2328} {"train_loss": -12.538822174072266, "global_step": 391199, "epoch": 2328} {"train_loss": -12.52258014678955, "global_step": 391200, "epoch": 2328} {"train_loss": -12.36735725402832, "global_step": 391201, "epoch": 2328} {"train_loss": -12.628625869750977, "global_step": 391202, "epoch": 2328} {"train_loss": -12.420695304870605, "global_step": 391203, "epoch": 2328} {"train_loss": -12.616177558898926, "global_step": 391204, "epoch": 2328} {"train_loss": -12.419771194458008, "global_step": 391205, "epoch": 2328} {"train_loss": -12.523090362548828, "global_step": 391206, "epoch": 2328} {"train_loss": -12.35110855102539, "global_step": 391207, "epoch": 2328} {"train_loss": -12.688325881958008, "global_step": 391208, "epoch": 2328} {"train_loss": -12.512327194213867, "global_step": 391209, "epoch": 2328} {"train_loss": -12.651853561401367, "global_step": 391210, "epoch": 2328} {"train_loss": -12.215689659118652, "global_step": 391211, "epoch": 2328} {"train_loss": -12.396202087402344, "global_step": 391212, "epoch": 2328} {"train_loss": -12.617576599121094, "global_step": 391213, "epoch": 2328} {"train_loss": -12.233085632324219, "global_step": 391214, "epoch": 2328} {"train_loss": -12.640016555786133, "global_step": 391215, "epoch": 2328} {"train_loss": -12.430703163146973, "global_step": 391216, "epoch": 2328} {"train_loss": -12.517489433288574, "global_step": 391217, "epoch": 2328} {"train_loss": -12.79435920715332, "global_step": 391218, "epoch": 2328} {"train_loss": -12.410144805908203, "global_step": 391219, "epoch": 2328} {"train_loss": -12.525579452514648, "global_step": 391220, "epoch": 2328} {"train_loss": -12.30936050415039, "global_step": 391221, "epoch": 2328} {"train_loss": -12.356563568115234, "global_step": 391222, "epoch": 2328} {"train_loss": -12.268159866333008, "global_step": 391223, "epoch": 2328} {"train_loss": -12.316899299621582, "global_step": 391224, "epoch": 2328} {"train_loss": -12.596891403198242, "global_step": 391225, "epoch": 2328} {"train_loss": -12.364858627319336, "global_step": 391226, "epoch": 2328} {"train_loss": -12.157621383666992, "global_step": 391227, "epoch": 2328} {"train_loss": -12.348716735839844, "global_step": 391228, "epoch": 2328} {"train_loss": -12.323347091674805, "global_step": 391229, "epoch": 2328} {"train_loss": -11.751372337341309, "global_step": 391230, "epoch": 2328} {"train_loss": -12.754777908325195, "global_step": 391231, "epoch": 2328} {"train_loss": -12.004779815673828, "global_step": 391232, "epoch": 2328} {"train_loss": -12.346094131469727, "global_step": 391233, "epoch": 2328} {"train_loss": -12.098596572875977, "global_step": 391234, "epoch": 2328} {"train_loss": -12.203285217285156, "global_step": 391235, "epoch": 2328} {"train_loss": -12.426424026489258, "global_step": 391236, "epoch": 2328} {"train_loss": -12.228116035461426, "global_step": 391237, "epoch": 2328} {"train_loss": -12.243586540222168, "global_step": 391238, "epoch": 2328} {"train_loss": -12.210352897644043, "global_step": 391239, "epoch": 2328} {"train_loss": -12.417722702026367, "global_step": 391240, "epoch": 2328} {"train_loss": -12.252192497253418, "global_step": 391241, "epoch": 2328} {"train_loss": -12.529630661010742, "global_step": 391242, "epoch": 2328} {"train_loss": -12.383580207824707, "global_step": 391243, "epoch": 2328} {"train_loss": -12.333334922790527, "global_step": 391244, "epoch": 2328} {"train_loss": -12.689784049987793, "global_step": 391245, "epoch": 2328} {"train_loss": -12.210111618041992, "global_step": 391246, "epoch": 2328} {"train_loss": -12.261733055114746, "global_step": 391247, "epoch": 2328} {"train_loss": -12.777029037475586, "global_step": 391248, "epoch": 2328} {"train_loss": -12.194950103759766, "global_step": 391249, "epoch": 2328} {"train_loss": -12.055606842041016, "global_step": 391250, "epoch": 2328} {"train_loss": -12.73648452758789, "global_step": 391251, "epoch": 2328} {"train_loss": -12.361566543579102, "global_step": 391252, "epoch": 2328} {"train_loss": -11.743274688720703, "global_step": 391253, "epoch": 2328} {"train_loss": -11.885621070861816, "global_step": 391254, "epoch": 2328} {"train_loss": -12.203006744384766, "global_step": 391255, "epoch": 2328} {"train_loss": -12.218633651733398, "global_step": 391256, "epoch": 2328} {"train_loss": -12.03218936920166, "global_step": 391257, "epoch": 2328} {"train_loss": -12.116044998168945, "global_step": 391258, "epoch": 2328} {"train_loss": -12.460201263427734, "global_step": 391259, "epoch": 2328} {"train_loss": -12.370899200439453, "global_step": 391260, "epoch": 2328} {"train_loss": -12.137652397155762, "global_step": 391261, "epoch": 2328} {"train_loss": -12.164488792419434, "global_step": 391262, "epoch": 2328} {"train_loss": -12.128129959106445, "global_step": 391263, "epoch": 2328} {"train_loss": -12.06490707397461, "global_step": 391264, "epoch": 2328} {"train_loss": -11.670164108276367, "global_step": 391265, "epoch": 2328} {"train_loss": -11.916326522827148, "global_step": 391266, "epoch": 2328} {"train_loss": -11.06690788269043, "global_step": 391267, "epoch": 2328} {"train_loss": -12.220766067504883, "global_step": 391268, "epoch": 2328} {"train_loss": -11.924175262451172, "global_step": 391269, "epoch": 2328} {"train_loss": -11.505899429321289, "global_step": 391270, "epoch": 2328} {"train_loss": -12.003607670466105, "global_step": 391271, "epoch": 2328, "val_loss": 293202.0625} {"train_loss": -12.245121002197266, "global_step": 391272, "epoch": 2329} {"train_loss": -11.67497444152832, "global_step": 391273, "epoch": 2329} {"train_loss": -12.43136978149414, "global_step": 391274, "epoch": 2329} {"train_loss": -11.493703842163086, "global_step": 391275, "epoch": 2329} {"train_loss": -11.730456352233887, "global_step": 391276, "epoch": 2329} {"train_loss": -11.83859634399414, "global_step": 391277, "epoch": 2329} {"train_loss": -11.896408081054688, "global_step": 391278, "epoch": 2329} {"train_loss": -11.483072280883789, "global_step": 391279, "epoch": 2329} {"train_loss": -11.744388580322266, "global_step": 391280, "epoch": 2329} {"train_loss": -11.60977554321289, "global_step": 391281, "epoch": 2329} {"train_loss": -11.88748550415039, "global_step": 391282, "epoch": 2329} {"train_loss": -12.365060806274414, "global_step": 391283, "epoch": 2329} {"train_loss": -11.71381950378418, "global_step": 391284, "epoch": 2329} {"train_loss": -12.53378677368164, "global_step": 391285, "epoch": 2329} {"train_loss": -11.519363403320312, "global_step": 391286, "epoch": 2329} {"train_loss": -11.510315895080566, "global_step": 391287, "epoch": 2329} {"train_loss": -11.99056625366211, "global_step": 391288, "epoch": 2329} {"train_loss": -12.232122421264648, "global_step": 391289, "epoch": 2329} {"train_loss": -12.024105072021484, "global_step": 391290, "epoch": 2329} {"train_loss": -12.27761173248291, "global_step": 391291, "epoch": 2329} {"train_loss": -11.823088645935059, "global_step": 391292, "epoch": 2329} {"train_loss": -11.913323402404785, "global_step": 391293, "epoch": 2329} {"train_loss": -11.46490478515625, "global_step": 391294, "epoch": 2329} {"train_loss": -11.909996032714844, "global_step": 391295, "epoch": 2329} {"train_loss": -11.629636764526367, "global_step": 391296, "epoch": 2329} {"train_loss": -12.06130313873291, "global_step": 391297, "epoch": 2329} {"train_loss": -12.000442504882812, "global_step": 391298, "epoch": 2329} {"train_loss": -12.110264778137207, "global_step": 391299, "epoch": 2329} {"train_loss": -12.136215209960938, "global_step": 391300, "epoch": 2329} {"train_loss": -12.33411693572998, "global_step": 391301, "epoch": 2329} {"train_loss": -11.450019836425781, "global_step": 391302, "epoch": 2329} {"train_loss": -12.242975234985352, "global_step": 391303, "epoch": 2329} {"train_loss": -12.184466361999512, "global_step": 391304, "epoch": 2329} {"train_loss": -12.301525115966797, "global_step": 391305, "epoch": 2329} {"train_loss": -11.97264289855957, "global_step": 391306, "epoch": 2329} {"train_loss": -12.254922866821289, "global_step": 391307, "epoch": 2329} {"train_loss": -12.012142181396484, "global_step": 391308, "epoch": 2329} {"train_loss": -12.671966552734375, "global_step": 391309, "epoch": 2329} {"train_loss": -11.515933990478516, "global_step": 391310, "epoch": 2329} {"train_loss": -11.953750610351562, "global_step": 391311, "epoch": 2329} {"train_loss": -12.080039978027344, "global_step": 391312, "epoch": 2329} {"train_loss": -12.275327682495117, "global_step": 391313, "epoch": 2329} {"train_loss": -12.011777877807617, "global_step": 391314, "epoch": 2329} {"train_loss": -12.373884201049805, "global_step": 391315, "epoch": 2329} {"train_loss": -11.905540466308594, "global_step": 391316, "epoch": 2329} {"train_loss": -12.049588203430176, "global_step": 391317, "epoch": 2329} {"train_loss": -11.67286491394043, "global_step": 391318, "epoch": 2329} {"train_loss": -11.912158966064453, "global_step": 391319, "epoch": 2329} {"train_loss": -12.201632499694824, "global_step": 391320, "epoch": 2329} {"train_loss": -11.802935600280762, "global_step": 391321, "epoch": 2329} {"train_loss": -12.496529579162598, "global_step": 391322, "epoch": 2329} {"train_loss": -11.656782150268555, "global_step": 391323, "epoch": 2329} {"train_loss": -12.501317024230957, "global_step": 391324, "epoch": 2329} {"train_loss": -12.283748626708984, "global_step": 391325, "epoch": 2329} {"train_loss": -12.198723793029785, "global_step": 391326, "epoch": 2329} {"train_loss": -11.755298614501953, "global_step": 391327, "epoch": 2329} {"train_loss": -12.352673530578613, "global_step": 391328, "epoch": 2329} {"train_loss": -12.438213348388672, "global_step": 391329, "epoch": 2329} {"train_loss": -12.33523941040039, "global_step": 391330, "epoch": 2329} {"train_loss": -12.519216537475586, "global_step": 391331, "epoch": 2329} {"train_loss": -12.021031379699707, "global_step": 391332, "epoch": 2329} {"train_loss": -12.623043060302734, "global_step": 391333, "epoch": 2329} {"train_loss": -12.521354675292969, "global_step": 391334, "epoch": 2329} {"train_loss": -12.434977531433105, "global_step": 391335, "epoch": 2329} {"train_loss": -12.288753509521484, "global_step": 391336, "epoch": 2329} {"train_loss": -12.078451156616211, "global_step": 391337, "epoch": 2329} {"train_loss": -12.462201118469238, "global_step": 391338, "epoch": 2329} {"train_loss": -12.253762245178223, "global_step": 391339, "epoch": 2329} {"train_loss": -12.475128173828125, "global_step": 391340, "epoch": 2329} {"train_loss": -12.442726135253906, "global_step": 391341, "epoch": 2329} {"train_loss": -11.728509902954102, "global_step": 391342, "epoch": 2329} {"train_loss": -12.215181350708008, "global_step": 391343, "epoch": 2329} {"train_loss": -11.832067489624023, "global_step": 391344, "epoch": 2329} {"train_loss": -12.001044273376465, "global_step": 391345, "epoch": 2329} {"train_loss": -11.905518531799316, "global_step": 391346, "epoch": 2329} {"train_loss": -11.91370964050293, "global_step": 391347, "epoch": 2329} {"train_loss": -10.825096130371094, "global_step": 391348, "epoch": 2329} {"train_loss": -11.809809684753418, "global_step": 391349, "epoch": 2329} {"train_loss": -11.36679744720459, "global_step": 391350, "epoch": 2329} {"train_loss": -12.4278564453125, "global_step": 391351, "epoch": 2329} {"train_loss": -12.01850700378418, "global_step": 391352, "epoch": 2329} {"train_loss": -12.490829467773438, "global_step": 391353, "epoch": 2329} {"train_loss": -12.196789741516113, "global_step": 391354, "epoch": 2329} {"train_loss": -12.301828384399414, "global_step": 391355, "epoch": 2329} {"train_loss": -12.214254379272461, "global_step": 391356, "epoch": 2329} {"train_loss": -12.133572578430176, "global_step": 391357, "epoch": 2329} {"train_loss": -12.2718505859375, "global_step": 391358, "epoch": 2329} {"train_loss": -11.754263877868652, "global_step": 391359, "epoch": 2329} {"train_loss": -12.252835273742676, "global_step": 391360, "epoch": 2329} {"train_loss": -11.748150825500488, "global_step": 391361, "epoch": 2329} {"train_loss": -11.800647735595703, "global_step": 391362, "epoch": 2329} {"train_loss": -12.483756065368652, "global_step": 391363, "epoch": 2329} {"train_loss": -12.271106719970703, "global_step": 391364, "epoch": 2329} {"train_loss": -12.131577491760254, "global_step": 391365, "epoch": 2329} {"train_loss": -12.213235855102539, "global_step": 391366, "epoch": 2329} {"train_loss": -12.200995445251465, "global_step": 391367, "epoch": 2329} {"train_loss": -11.877843856811523, "global_step": 391368, "epoch": 2329} {"train_loss": -12.271377563476562, "global_step": 391369, "epoch": 2329} {"train_loss": -11.902318954467773, "global_step": 391370, "epoch": 2329} {"train_loss": -11.457764625549316, "global_step": 391371, "epoch": 2329} {"train_loss": -11.455799102783203, "global_step": 391372, "epoch": 2329} {"train_loss": -12.105743408203125, "global_step": 391373, "epoch": 2329} {"train_loss": -11.350753784179688, "global_step": 391374, "epoch": 2329} {"train_loss": -11.713260650634766, "global_step": 391375, "epoch": 2329} {"train_loss": -11.829545021057129, "global_step": 391376, "epoch": 2329} {"train_loss": -11.918375015258789, "global_step": 391377, "epoch": 2329} {"train_loss": -12.203333854675293, "global_step": 391378, "epoch": 2329} {"train_loss": -12.026037216186523, "global_step": 391379, "epoch": 2329} {"train_loss": -12.694969177246094, "global_step": 391380, "epoch": 2329} {"train_loss": -11.723651885986328, "global_step": 391381, "epoch": 2329} {"train_loss": -12.507829666137695, "global_step": 391382, "epoch": 2329} {"train_loss": -11.843817710876465, "global_step": 391383, "epoch": 2329} {"train_loss": -12.426998138427734, "global_step": 391384, "epoch": 2329} {"train_loss": -11.702630043029785, "global_step": 391385, "epoch": 2329} {"train_loss": -12.416413307189941, "global_step": 391386, "epoch": 2329} {"train_loss": -11.71114730834961, "global_step": 391387, "epoch": 2329} {"train_loss": -11.860204696655273, "global_step": 391388, "epoch": 2329} {"train_loss": -12.069419860839844, "global_step": 391389, "epoch": 2329} {"train_loss": -12.448541641235352, "global_step": 391390, "epoch": 2329} {"train_loss": -12.46715259552002, "global_step": 391391, "epoch": 2329} {"train_loss": -12.313761711120605, "global_step": 391392, "epoch": 2329} {"train_loss": -12.349115371704102, "global_step": 391393, "epoch": 2329} {"train_loss": -11.716169357299805, "global_step": 391394, "epoch": 2329} {"train_loss": -12.324445724487305, "global_step": 391395, "epoch": 2329} {"train_loss": -12.345129013061523, "global_step": 391396, "epoch": 2329} {"train_loss": -12.123016357421875, "global_step": 391397, "epoch": 2329} {"train_loss": -12.43228530883789, "global_step": 391398, "epoch": 2329} {"train_loss": -12.477666854858398, "global_step": 391399, "epoch": 2329} {"train_loss": -12.326582908630371, "global_step": 391400, "epoch": 2329} {"train_loss": -12.627717971801758, "global_step": 391401, "epoch": 2329} {"train_loss": -12.608930587768555, "global_step": 391402, "epoch": 2329} {"train_loss": -12.465826034545898, "global_step": 391403, "epoch": 2329} {"train_loss": -12.286991119384766, "global_step": 391404, "epoch": 2329} {"train_loss": -12.496063232421875, "global_step": 391405, "epoch": 2329} {"train_loss": -12.297880172729492, "global_step": 391406, "epoch": 2329} {"train_loss": -12.65610408782959, "global_step": 391407, "epoch": 2329} {"train_loss": -12.591346740722656, "global_step": 391408, "epoch": 2329} {"train_loss": -12.700681686401367, "global_step": 391409, "epoch": 2329} {"train_loss": -12.578561782836914, "global_step": 391410, "epoch": 2329} {"train_loss": -12.42026138305664, "global_step": 391411, "epoch": 2329} {"train_loss": -12.630328178405762, "global_step": 391412, "epoch": 2329} {"train_loss": -12.470739364624023, "global_step": 391413, "epoch": 2329} {"train_loss": -12.376739501953125, "global_step": 391414, "epoch": 2329} {"train_loss": -12.680538177490234, "global_step": 391415, "epoch": 2329} {"train_loss": -12.494119644165039, "global_step": 391416, "epoch": 2329} {"train_loss": -12.204862594604492, "global_step": 391417, "epoch": 2329} {"train_loss": -12.220453262329102, "global_step": 391418, "epoch": 2329} {"train_loss": -12.428424835205078, "global_step": 391419, "epoch": 2329} {"train_loss": -11.192572593688965, "global_step": 391420, "epoch": 2329} {"train_loss": -12.021406173706055, "global_step": 391421, "epoch": 2329} {"train_loss": -12.006682395935059, "global_step": 391422, "epoch": 2329} {"train_loss": -11.642805099487305, "global_step": 391423, "epoch": 2329} {"train_loss": -12.094427108764648, "global_step": 391424, "epoch": 2329} {"train_loss": -11.803083419799805, "global_step": 391425, "epoch": 2329} {"train_loss": -10.17518138885498, "global_step": 391426, "epoch": 2329} {"train_loss": -10.911663055419922, "global_step": 391427, "epoch": 2329} {"train_loss": -10.743478775024414, "global_step": 391428, "epoch": 2329} {"train_loss": -10.419095993041992, "global_step": 391429, "epoch": 2329} {"train_loss": -10.729795455932617, "global_step": 391430, "epoch": 2329} {"train_loss": -9.955257415771484, "global_step": 391431, "epoch": 2329} {"train_loss": -11.286227226257324, "global_step": 391432, "epoch": 2329} {"train_loss": -10.810876846313477, "global_step": 391433, "epoch": 2329} {"train_loss": -10.695098876953125, "global_step": 391434, "epoch": 2329} {"train_loss": -9.990490913391113, "global_step": 391435, "epoch": 2329} {"train_loss": -10.170083045959473, "global_step": 391436, "epoch": 2329} {"train_loss": -11.176109313964844, "global_step": 391437, "epoch": 2329} {"train_loss": -9.457494735717773, "global_step": 391438, "epoch": 2329} {"train_loss": -11.957889006251381, "global_step": 391439, "epoch": 2329, "val_loss": 292462.875} {"train_loss": -9.61883544921875, "global_step": 391440, "epoch": 2330} {"train_loss": -9.748808860778809, "global_step": 391441, "epoch": 2330} {"train_loss": -10.082084655761719, "global_step": 391442, "epoch": 2330} {"train_loss": -9.628573417663574, "global_step": 391443, "epoch": 2330} {"train_loss": -9.49620246887207, "global_step": 391444, "epoch": 2330} {"train_loss": -10.45296859741211, "global_step": 391445, "epoch": 2330} {"train_loss": -10.6619291305542, "global_step": 391446, "epoch": 2330} {"train_loss": -11.423239707946777, "global_step": 391447, "epoch": 2330} {"train_loss": -9.675012588500977, "global_step": 391448, "epoch": 2330} {"train_loss": -11.118123054504395, "global_step": 391449, "epoch": 2330} {"train_loss": -11.270118713378906, "global_step": 391450, "epoch": 2330} {"train_loss": -10.898508071899414, "global_step": 391451, "epoch": 2330} {"train_loss": -10.04532241821289, "global_step": 391452, "epoch": 2330} {"train_loss": -11.43193244934082, "global_step": 391453, "epoch": 2330} {"train_loss": -10.595008850097656, "global_step": 391454, "epoch": 2330} {"train_loss": -11.509624481201172, "global_step": 391455, "epoch": 2330} {"train_loss": -11.313566207885742, "global_step": 391456, "epoch": 2330} {"train_loss": -10.488351821899414, "global_step": 391457, "epoch": 2330} {"train_loss": -11.47591495513916, "global_step": 391458, "epoch": 2330} {"train_loss": -11.388486862182617, "global_step": 391459, "epoch": 2330} {"train_loss": -10.241229057312012, "global_step": 391460, "epoch": 2330} {"train_loss": -10.891485214233398, "global_step": 391461, "epoch": 2330} {"train_loss": -10.690896034240723, "global_step": 391462, "epoch": 2330} {"train_loss": -11.146099090576172, "global_step": 391463, "epoch": 2330} {"train_loss": -11.797578811645508, "global_step": 391464, "epoch": 2330} {"train_loss": -11.623852729797363, "global_step": 391465, "epoch": 2330} {"train_loss": -10.67827033996582, "global_step": 391466, "epoch": 2330} {"train_loss": -11.684745788574219, "global_step": 391467, "epoch": 2330} {"train_loss": -10.469408988952637, "global_step": 391468, "epoch": 2330} {"train_loss": -12.04345703125, "global_step": 391469, "epoch": 2330} {"train_loss": -11.493881225585938, "global_step": 391470, "epoch": 2330} {"train_loss": -11.355648040771484, "global_step": 391471, "epoch": 2330} {"train_loss": -11.556118965148926, "global_step": 391472, "epoch": 2330} {"train_loss": -11.697357177734375, "global_step": 391473, "epoch": 2330} {"train_loss": -11.26656723022461, "global_step": 391474, "epoch": 2330} {"train_loss": -11.603638648986816, "global_step": 391475, "epoch": 2330} {"train_loss": -12.124137878417969, "global_step": 391476, "epoch": 2330} {"train_loss": -11.203075408935547, "global_step": 391477, "epoch": 2330} {"train_loss": -12.073149681091309, "global_step": 391478, "epoch": 2330} {"train_loss": -11.824913024902344, "global_step": 391479, "epoch": 2330} {"train_loss": -11.720157623291016, "global_step": 391480, "epoch": 2330} {"train_loss": -11.883679389953613, "global_step": 391481, "epoch": 2330} {"train_loss": -11.929274559020996, "global_step": 391482, "epoch": 2330} {"train_loss": -12.065502166748047, "global_step": 391483, "epoch": 2330} {"train_loss": -11.808837890625, "global_step": 391484, "epoch": 2330} {"train_loss": -12.162938117980957, "global_step": 391485, "epoch": 2330} {"train_loss": -12.223760604858398, "global_step": 391486, "epoch": 2330} {"train_loss": -12.262672424316406, "global_step": 391487, "epoch": 2330} {"train_loss": -12.302146911621094, "global_step": 391488, "epoch": 2330} {"train_loss": -12.199828147888184, "global_step": 391489, "epoch": 2330} {"train_loss": -11.97694206237793, "global_step": 391490, "epoch": 2330} {"train_loss": -12.43549919128418, "global_step": 391491, "epoch": 2330} {"train_loss": -12.093717575073242, "global_step": 391492, "epoch": 2330} {"train_loss": -12.288747787475586, "global_step": 391493, "epoch": 2330} {"train_loss": -12.186175346374512, "global_step": 391494, "epoch": 2330} {"train_loss": -12.184682846069336, "global_step": 391495, "epoch": 2330} {"train_loss": -12.378416061401367, "global_step": 391496, "epoch": 2330} {"train_loss": -12.531286239624023, "global_step": 391497, "epoch": 2330} {"train_loss": -12.214508056640625, "global_step": 391498, "epoch": 2330} {"train_loss": -12.430912017822266, "global_step": 391499, "epoch": 2330} {"train_loss": -12.510967254638672, "global_step": 391500, "epoch": 2330} {"train_loss": -12.520689010620117, "global_step": 391501, "epoch": 2330} {"train_loss": -12.383272171020508, "global_step": 391502, "epoch": 2330} {"train_loss": -12.331345558166504, "global_step": 391503, "epoch": 2330} {"train_loss": -12.414048194885254, "global_step": 391504, "epoch": 2330} {"train_loss": -12.50515365600586, "global_step": 391505, "epoch": 2330} {"train_loss": -12.469659805297852, "global_step": 391506, "epoch": 2330} {"train_loss": -12.494745254516602, "global_step": 391507, "epoch": 2330} {"train_loss": -12.324548721313477, "global_step": 391508, "epoch": 2330} {"train_loss": -12.515290260314941, "global_step": 391509, "epoch": 2330} {"train_loss": -12.543343544006348, "global_step": 391510, "epoch": 2330} {"train_loss": -12.453618049621582, "global_step": 391511, "epoch": 2330} {"train_loss": -12.514748573303223, "global_step": 391512, "epoch": 2330} {"train_loss": -12.46152114868164, "global_step": 391513, "epoch": 2330} {"train_loss": -12.42320442199707, "global_step": 391514, "epoch": 2330} {"train_loss": -12.659146308898926, "global_step": 391515, "epoch": 2330} {"train_loss": -12.661613464355469, "global_step": 391516, "epoch": 2330} {"train_loss": -12.451379776000977, "global_step": 391517, "epoch": 2330} {"train_loss": -12.594771385192871, "global_step": 391518, "epoch": 2330} {"train_loss": -12.507503509521484, "global_step": 391519, "epoch": 2330} {"train_loss": -12.613569259643555, "global_step": 391520, "epoch": 2330} {"train_loss": -12.483081817626953, "global_step": 391521, "epoch": 2330} {"train_loss": -12.569110870361328, "global_step": 391522, "epoch": 2330} {"train_loss": -12.580150604248047, "global_step": 391523, "epoch": 2330} {"train_loss": -12.863980293273926, "global_step": 391524, "epoch": 2330} {"train_loss": -12.647775650024414, "global_step": 391525, "epoch": 2330} {"train_loss": -12.691572189331055, "global_step": 391526, "epoch": 2330} {"train_loss": -12.679423332214355, "global_step": 391527, "epoch": 2330} {"train_loss": -12.44552993774414, "global_step": 391528, "epoch": 2330} {"train_loss": -12.837165832519531, "global_step": 391529, "epoch": 2330} {"train_loss": -12.469395637512207, "global_step": 391530, "epoch": 2330} {"train_loss": -12.676743507385254, "global_step": 391531, "epoch": 2330} {"train_loss": -12.454813957214355, "global_step": 391532, "epoch": 2330} {"train_loss": -12.682912826538086, "global_step": 391533, "epoch": 2330} {"train_loss": -12.517233848571777, "global_step": 391534, "epoch": 2330} {"train_loss": -12.529559135437012, "global_step": 391535, "epoch": 2330} {"train_loss": -12.491908073425293, "global_step": 391536, "epoch": 2330} {"train_loss": -12.350791931152344, "global_step": 391537, "epoch": 2330} {"train_loss": -12.715391159057617, "global_step": 391538, "epoch": 2330} {"train_loss": -12.584213256835938, "global_step": 391539, "epoch": 2330} {"train_loss": -12.586038589477539, "global_step": 391540, "epoch": 2330} {"train_loss": -12.5755615234375, "global_step": 391541, "epoch": 2330} {"train_loss": -12.706366539001465, "global_step": 391542, "epoch": 2330} {"train_loss": -12.553775787353516, "global_step": 391543, "epoch": 2330} {"train_loss": -12.766892433166504, "global_step": 391544, "epoch": 2330} {"train_loss": -12.451225280761719, "global_step": 391545, "epoch": 2330} {"train_loss": -12.53149127960205, "global_step": 391546, "epoch": 2330} {"train_loss": -12.581343650817871, "global_step": 391547, "epoch": 2330} {"train_loss": -12.666444778442383, "global_step": 391548, "epoch": 2330} {"train_loss": -12.658893585205078, "global_step": 391549, "epoch": 2330} {"train_loss": -12.430929183959961, "global_step": 391550, "epoch": 2330} {"train_loss": -12.338068008422852, "global_step": 391551, "epoch": 2330} {"train_loss": -12.518438339233398, "global_step": 391552, "epoch": 2330} {"train_loss": -11.228350639343262, "global_step": 391553, "epoch": 2330} {"train_loss": -10.632508277893066, "global_step": 391554, "epoch": 2330} {"train_loss": -11.878499031066895, "global_step": 391555, "epoch": 2330} {"train_loss": -11.946828842163086, "global_step": 391556, "epoch": 2330} {"train_loss": -9.634872436523438, "global_step": 391557, "epoch": 2330} {"train_loss": -9.533419609069824, "global_step": 391558, "epoch": 2330} {"train_loss": -11.090042114257812, "global_step": 391559, "epoch": 2330} {"train_loss": -7.231376647949219, "global_step": 391560, "epoch": 2330} {"train_loss": -7.195451736450195, "global_step": 391561, "epoch": 2330} {"train_loss": -8.5421781539917, "global_step": 391562, "epoch": 2330} {"train_loss": -7.674412250518799, "global_step": 391563, "epoch": 2330} {"train_loss": -8.419088363647461, "global_step": 391564, "epoch": 2330} {"train_loss": -7.049147129058838, "global_step": 391565, "epoch": 2330} {"train_loss": -8.719621658325195, "global_step": 391566, "epoch": 2330} {"train_loss": -7.818304061889648, "global_step": 391567, "epoch": 2330} {"train_loss": -9.206287384033203, "global_step": 391568, "epoch": 2330} {"train_loss": -7.682642936706543, "global_step": 391569, "epoch": 2330} {"train_loss": -8.385196685791016, "global_step": 391570, "epoch": 2330} {"train_loss": -8.671815872192383, "global_step": 391571, "epoch": 2330} {"train_loss": -8.027632713317871, "global_step": 391572, "epoch": 2330} {"train_loss": -7.96388053894043, "global_step": 391573, "epoch": 2330} {"train_loss": -7.287557601928711, "global_step": 391574, "epoch": 2330} {"train_loss": -8.298657417297363, "global_step": 391575, "epoch": 2330} {"train_loss": -7.133203029632568, "global_step": 391576, "epoch": 2330} {"train_loss": -7.899632930755615, "global_step": 391577, "epoch": 2330} {"train_loss": -9.122241020202637, "global_step": 391578, "epoch": 2330} {"train_loss": -8.816977500915527, "global_step": 391579, "epoch": 2330} {"train_loss": -10.053717613220215, "global_step": 391580, "epoch": 2330} {"train_loss": -9.180675506591797, "global_step": 391581, "epoch": 2330} {"train_loss": -9.295125961303711, "global_step": 391582, "epoch": 2330} {"train_loss": -9.85365104675293, "global_step": 391583, "epoch": 2330} {"train_loss": -9.594461441040039, "global_step": 391584, "epoch": 2330} {"train_loss": -10.567386627197266, "global_step": 391585, "epoch": 2330} {"train_loss": -10.41415023803711, "global_step": 391586, "epoch": 2330} {"train_loss": -11.031160354614258, "global_step": 391587, "epoch": 2330} {"train_loss": -10.764342308044434, "global_step": 391588, "epoch": 2330} {"train_loss": -11.352458953857422, "global_step": 391589, "epoch": 2330} {"train_loss": -11.143281936645508, "global_step": 391590, "epoch": 2330} {"train_loss": -11.41000747680664, "global_step": 391591, "epoch": 2330} {"train_loss": -11.567258834838867, "global_step": 391592, "epoch": 2330} {"train_loss": -11.690153121948242, "global_step": 391593, "epoch": 2330} {"train_loss": -11.756963729858398, "global_step": 391594, "epoch": 2330} {"train_loss": -11.568378448486328, "global_step": 391595, "epoch": 2330} {"train_loss": -11.41267204284668, "global_step": 391596, "epoch": 2330} {"train_loss": -12.071471214294434, "global_step": 391597, "epoch": 2330} {"train_loss": -11.42094612121582, "global_step": 391598, "epoch": 2330} {"train_loss": -11.794792175292969, "global_step": 391599, "epoch": 2330} {"train_loss": -11.359501838684082, "global_step": 391600, "epoch": 2330} {"train_loss": -11.49933910369873, "global_step": 391601, "epoch": 2330} {"train_loss": -11.403304100036621, "global_step": 391602, "epoch": 2330} {"train_loss": -11.86501693725586, "global_step": 391603, "epoch": 2330} {"train_loss": -11.91181468963623, "global_step": 391604, "epoch": 2330} {"train_loss": -11.23179817199707, "global_step": 391605, "epoch": 2330} {"train_loss": -12.01598834991455, "global_step": 391606, "epoch": 2330} {"train_loss": -11.284035949479966, "global_step": 391607, "epoch": 2330, "val_loss": 296841.125, "train_action_mse_error": 1.059748888015747} {"train_loss": -11.75230598449707, "global_step": 391608, "epoch": 2331} {"train_loss": -11.877035140991211, "global_step": 391609, "epoch": 2331} {"train_loss": -11.451122283935547, "global_step": 391610, "epoch": 2331} {"train_loss": -11.958473205566406, "global_step": 391611, "epoch": 2331} {"train_loss": -11.633406639099121, "global_step": 391612, "epoch": 2331} {"train_loss": -11.941417694091797, "global_step": 391613, "epoch": 2331} {"train_loss": -12.240718841552734, "global_step": 391614, "epoch": 2331} {"train_loss": -11.979328155517578, "global_step": 391615, "epoch": 2331} {"train_loss": -12.303220748901367, "global_step": 391616, "epoch": 2331} {"train_loss": -12.218976020812988, "global_step": 391617, "epoch": 2331} {"train_loss": -11.890432357788086, "global_step": 391618, "epoch": 2331} {"train_loss": -12.344268798828125, "global_step": 391619, "epoch": 2331} {"train_loss": -12.143777847290039, "global_step": 391620, "epoch": 2331} {"train_loss": -12.389404296875, "global_step": 391621, "epoch": 2331} {"train_loss": -11.874015808105469, "global_step": 391622, "epoch": 2331} {"train_loss": -12.093667030334473, "global_step": 391623, "epoch": 2331} {"train_loss": -12.146215438842773, "global_step": 391624, "epoch": 2331} {"train_loss": -12.152854919433594, "global_step": 391625, "epoch": 2331} {"train_loss": -12.324617385864258, "global_step": 391626, "epoch": 2331} {"train_loss": -12.372797012329102, "global_step": 391627, "epoch": 2331} {"train_loss": -12.176000595092773, "global_step": 391628, "epoch": 2331} {"train_loss": -12.102323532104492, "global_step": 391629, "epoch": 2331} {"train_loss": -12.348159790039062, "global_step": 391630, "epoch": 2331} {"train_loss": -12.457420349121094, "global_step": 391631, "epoch": 2331} {"train_loss": -12.23849105834961, "global_step": 391632, "epoch": 2331} {"train_loss": -11.874900817871094, "global_step": 391633, "epoch": 2331} {"train_loss": -12.304142951965332, "global_step": 391634, "epoch": 2331} {"train_loss": -11.970409393310547, "global_step": 391635, "epoch": 2331} {"train_loss": -12.286537170410156, "global_step": 391636, "epoch": 2331} {"train_loss": -12.197739601135254, "global_step": 391637, "epoch": 2331} {"train_loss": -12.554328918457031, "global_step": 391638, "epoch": 2331} {"train_loss": -12.369905471801758, "global_step": 391639, "epoch": 2331} {"train_loss": -12.059353828430176, "global_step": 391640, "epoch": 2331} {"train_loss": -12.516380310058594, "global_step": 391641, "epoch": 2331} {"train_loss": -11.933506965637207, "global_step": 391642, "epoch": 2331} {"train_loss": -12.054545402526855, "global_step": 391643, "epoch": 2331} {"train_loss": -11.854032516479492, "global_step": 391644, "epoch": 2331} {"train_loss": -12.281808853149414, "global_step": 391645, "epoch": 2331} {"train_loss": -12.01990032196045, "global_step": 391646, "epoch": 2331} {"train_loss": -12.451218605041504, "global_step": 391647, "epoch": 2331} {"train_loss": -12.280509948730469, "global_step": 391648, "epoch": 2331} {"train_loss": -12.390087127685547, "global_step": 391649, "epoch": 2331} {"train_loss": -12.62736701965332, "global_step": 391650, "epoch": 2331} {"train_loss": -12.497411727905273, "global_step": 391651, "epoch": 2331} {"train_loss": -12.362605094909668, "global_step": 391652, "epoch": 2331} {"train_loss": -12.457684516906738, "global_step": 391653, "epoch": 2331} {"train_loss": -12.383594512939453, "global_step": 391654, "epoch": 2331} {"train_loss": -12.51987075805664, "global_step": 391655, "epoch": 2331} {"train_loss": -12.604393005371094, "global_step": 391656, "epoch": 2331} {"train_loss": -12.634819984436035, "global_step": 391657, "epoch": 2331} {"train_loss": -12.556761741638184, "global_step": 391658, "epoch": 2331} {"train_loss": -12.382610321044922, "global_step": 391659, "epoch": 2331} {"train_loss": -12.410757064819336, "global_step": 391660, "epoch": 2331} {"train_loss": -12.558183670043945, "global_step": 391661, "epoch": 2331} {"train_loss": -12.62457275390625, "global_step": 391662, "epoch": 2331} {"train_loss": -12.61772346496582, "global_step": 391663, "epoch": 2331} {"train_loss": -12.733675003051758, "global_step": 391664, "epoch": 2331} {"train_loss": -12.289529800415039, "global_step": 391665, "epoch": 2331} {"train_loss": -12.51828670501709, "global_step": 391666, "epoch": 2331} {"train_loss": -12.697014808654785, "global_step": 391667, "epoch": 2331} {"train_loss": -12.68132209777832, "global_step": 391668, "epoch": 2331} {"train_loss": -12.538548469543457, "global_step": 391669, "epoch": 2331} {"train_loss": -12.52750015258789, "global_step": 391670, "epoch": 2331} {"train_loss": -12.6957426071167, "global_step": 391671, "epoch": 2331} {"train_loss": -11.839361190795898, "global_step": 391672, "epoch": 2331} {"train_loss": -12.171891212463379, "global_step": 391673, "epoch": 2331} {"train_loss": -12.489104270935059, "global_step": 391674, "epoch": 2331} {"train_loss": -12.158926963806152, "global_step": 391675, "epoch": 2331} {"train_loss": -12.278364181518555, "global_step": 391676, "epoch": 2331} {"train_loss": -12.529979705810547, "global_step": 391677, "epoch": 2331} {"train_loss": -12.168272018432617, "global_step": 391678, "epoch": 2331} {"train_loss": -12.422658920288086, "global_step": 391679, "epoch": 2331} {"train_loss": -12.596149444580078, "global_step": 391680, "epoch": 2331} {"train_loss": -12.222784042358398, "global_step": 391681, "epoch": 2331} {"train_loss": -12.330678939819336, "global_step": 391682, "epoch": 2331} {"train_loss": -12.394662857055664, "global_step": 391683, "epoch": 2331} {"train_loss": -12.69207763671875, "global_step": 391684, "epoch": 2331} {"train_loss": -12.549558639526367, "global_step": 391685, "epoch": 2331} {"train_loss": -12.628767013549805, "global_step": 391686, "epoch": 2331} {"train_loss": -12.33320426940918, "global_step": 391687, "epoch": 2331} {"train_loss": -12.536015510559082, "global_step": 391688, "epoch": 2331} {"train_loss": -12.251709938049316, "global_step": 391689, "epoch": 2331} {"train_loss": -12.191068649291992, "global_step": 391690, "epoch": 2331} {"train_loss": -11.820460319519043, "global_step": 391691, "epoch": 2331} {"train_loss": -10.460114479064941, "global_step": 391692, "epoch": 2331} {"train_loss": -9.87622356414795, "global_step": 391693, "epoch": 2331} {"train_loss": -11.943902015686035, "global_step": 391694, "epoch": 2331} {"train_loss": -9.283223152160645, "global_step": 391695, "epoch": 2331} {"train_loss": -10.61237621307373, "global_step": 391696, "epoch": 2331} {"train_loss": -7.661916732788086, "global_step": 391697, "epoch": 2331} {"train_loss": -8.629533767700195, "global_step": 391698, "epoch": 2331} {"train_loss": -9.653451919555664, "global_step": 391699, "epoch": 2331} {"train_loss": -8.597232818603516, "global_step": 391700, "epoch": 2331} {"train_loss": -10.401126861572266, "global_step": 391701, "epoch": 2331} {"train_loss": -9.305109024047852, "global_step": 391702, "epoch": 2331} {"train_loss": -10.559951782226562, "global_step": 391703, "epoch": 2331} {"train_loss": -10.57160758972168, "global_step": 391704, "epoch": 2331} {"train_loss": -11.447732925415039, "global_step": 391705, "epoch": 2331} {"train_loss": -9.696622848510742, "global_step": 391706, "epoch": 2331} {"train_loss": -11.643050193786621, "global_step": 391707, "epoch": 2331} {"train_loss": -10.859962463378906, "global_step": 391708, "epoch": 2331} {"train_loss": -11.543620109558105, "global_step": 391709, "epoch": 2331} {"train_loss": -10.93476676940918, "global_step": 391710, "epoch": 2331} {"train_loss": -10.428442001342773, "global_step": 391711, "epoch": 2331} {"train_loss": -11.668566703796387, "global_step": 391712, "epoch": 2331} {"train_loss": -11.035861015319824, "global_step": 391713, "epoch": 2331} {"train_loss": -10.960238456726074, "global_step": 391714, "epoch": 2331} {"train_loss": -10.950468063354492, "global_step": 391715, "epoch": 2331} {"train_loss": -10.036810874938965, "global_step": 391716, "epoch": 2331} {"train_loss": -9.999908447265625, "global_step": 391717, "epoch": 2331} {"train_loss": -11.649092674255371, "global_step": 391718, "epoch": 2331} {"train_loss": -10.402048110961914, "global_step": 391719, "epoch": 2331} {"train_loss": -11.474084854125977, "global_step": 391720, "epoch": 2331} {"train_loss": -10.8223876953125, "global_step": 391721, "epoch": 2331} {"train_loss": -11.405318260192871, "global_step": 391722, "epoch": 2331} {"train_loss": -11.305702209472656, "global_step": 391723, "epoch": 2331} {"train_loss": -11.749174118041992, "global_step": 391724, "epoch": 2331} {"train_loss": -11.701133728027344, "global_step": 391725, "epoch": 2331} {"train_loss": -11.519245147705078, "global_step": 391726, "epoch": 2331} {"train_loss": -11.817009925842285, "global_step": 391727, "epoch": 2331} {"train_loss": -11.421330451965332, "global_step": 391728, "epoch": 2331} {"train_loss": -11.994470596313477, "global_step": 391729, "epoch": 2331} {"train_loss": -11.534042358398438, "global_step": 391730, "epoch": 2331} {"train_loss": -11.699287414550781, "global_step": 391731, "epoch": 2331} {"train_loss": -11.409902572631836, "global_step": 391732, "epoch": 2331} {"train_loss": -11.574459075927734, "global_step": 391733, "epoch": 2331} {"train_loss": -11.396835327148438, "global_step": 391734, "epoch": 2331} {"train_loss": -12.05305004119873, "global_step": 391735, "epoch": 2331} {"train_loss": -10.942078590393066, "global_step": 391736, "epoch": 2331} {"train_loss": -11.914161682128906, "global_step": 391737, "epoch": 2331} {"train_loss": -11.001165390014648, "global_step": 391738, "epoch": 2331} {"train_loss": -11.566263198852539, "global_step": 391739, "epoch": 2331} {"train_loss": -11.659782409667969, "global_step": 391740, "epoch": 2331} {"train_loss": -11.682357788085938, "global_step": 391741, "epoch": 2331} {"train_loss": -11.905418395996094, "global_step": 391742, "epoch": 2331} {"train_loss": -12.132030487060547, "global_step": 391743, "epoch": 2331} {"train_loss": -11.417668342590332, "global_step": 391744, "epoch": 2331} {"train_loss": -11.834280014038086, "global_step": 391745, "epoch": 2331} {"train_loss": -11.655607223510742, "global_step": 391746, "epoch": 2331} {"train_loss": -11.945974349975586, "global_step": 391747, "epoch": 2331} {"train_loss": -11.912445068359375, "global_step": 391748, "epoch": 2331} {"train_loss": -11.928877830505371, "global_step": 391749, "epoch": 2331} {"train_loss": -12.153217315673828, "global_step": 391750, "epoch": 2331} {"train_loss": -12.331390380859375, "global_step": 391751, "epoch": 2331} {"train_loss": -11.830124855041504, "global_step": 391752, "epoch": 2331} {"train_loss": -11.889007568359375, "global_step": 391753, "epoch": 2331} {"train_loss": -11.980445861816406, "global_step": 391754, "epoch": 2331} {"train_loss": -11.945119857788086, "global_step": 391755, "epoch": 2331} {"train_loss": -12.120126724243164, "global_step": 391756, "epoch": 2331} {"train_loss": -12.143917083740234, "global_step": 391757, "epoch": 2331} {"train_loss": -12.082919120788574, "global_step": 391758, "epoch": 2331} {"train_loss": -11.934749603271484, "global_step": 391759, "epoch": 2331} {"train_loss": -12.103523254394531, "global_step": 391760, "epoch": 2331} {"train_loss": -11.930707931518555, "global_step": 391761, "epoch": 2331} {"train_loss": -12.203282356262207, "global_step": 391762, "epoch": 2331} {"train_loss": -12.137809753417969, "global_step": 391763, "epoch": 2331} {"train_loss": -12.420242309570312, "global_step": 391764, "epoch": 2331} {"train_loss": -12.128826141357422, "global_step": 391765, "epoch": 2331} {"train_loss": -12.176682472229004, "global_step": 391766, "epoch": 2331} {"train_loss": -12.356051445007324, "global_step": 391767, "epoch": 2331} {"train_loss": -12.15744400024414, "global_step": 391768, "epoch": 2331} {"train_loss": -12.204154014587402, "global_step": 391769, "epoch": 2331} {"train_loss": -12.46749496459961, "global_step": 391770, "epoch": 2331} {"train_loss": -12.384982109069824, "global_step": 391771, "epoch": 2331} {"train_loss": -12.394742965698242, "global_step": 391772, "epoch": 2331} {"train_loss": -12.371393203735352, "global_step": 391773, "epoch": 2331} {"train_loss": -12.300905227661133, "global_step": 391774, "epoch": 2331} {"train_loss": -11.833635165577842, "global_step": 391775, "epoch": 2331, "val_loss": 300209.84375} {"train_loss": -12.422985076904297, "global_step": 391776, "epoch": 2332} {"train_loss": -12.306979179382324, "global_step": 391777, "epoch": 2332} {"train_loss": -12.302396774291992, "global_step": 391778, "epoch": 2332} {"train_loss": -12.295385360717773, "global_step": 391779, "epoch": 2332} {"train_loss": -12.371417999267578, "global_step": 391780, "epoch": 2332} {"train_loss": -12.394760131835938, "global_step": 391781, "epoch": 2332} {"train_loss": -12.187045097351074, "global_step": 391782, "epoch": 2332} {"train_loss": -12.412724494934082, "global_step": 391783, "epoch": 2332} {"train_loss": -12.019026756286621, "global_step": 391784, "epoch": 2332} {"train_loss": -12.251559257507324, "global_step": 391785, "epoch": 2332} {"train_loss": -12.286824226379395, "global_step": 391786, "epoch": 2332} {"train_loss": -12.109623908996582, "global_step": 391787, "epoch": 2332} {"train_loss": -12.28049087524414, "global_step": 391788, "epoch": 2332} {"train_loss": -11.850473403930664, "global_step": 391789, "epoch": 2332} {"train_loss": -12.057262420654297, "global_step": 391790, "epoch": 2332} {"train_loss": -12.181081771850586, "global_step": 391791, "epoch": 2332} {"train_loss": -11.985380172729492, "global_step": 391792, "epoch": 2332} {"train_loss": -12.347095489501953, "global_step": 391793, "epoch": 2332} {"train_loss": -12.373647689819336, "global_step": 391794, "epoch": 2332} {"train_loss": -12.134254455566406, "global_step": 391795, "epoch": 2332} {"train_loss": -12.694705963134766, "global_step": 391796, "epoch": 2332} {"train_loss": -12.459562301635742, "global_step": 391797, "epoch": 2332} {"train_loss": -12.518970489501953, "global_step": 391798, "epoch": 2332} {"train_loss": -12.763338088989258, "global_step": 391799, "epoch": 2332} {"train_loss": -12.33481216430664, "global_step": 391800, "epoch": 2332} {"train_loss": -12.676915168762207, "global_step": 391801, "epoch": 2332} {"train_loss": -12.492528915405273, "global_step": 391802, "epoch": 2332} {"train_loss": -12.264788627624512, "global_step": 391803, "epoch": 2332} {"train_loss": -12.6079683303833, "global_step": 391804, "epoch": 2332} {"train_loss": -11.710210800170898, "global_step": 391805, "epoch": 2332} {"train_loss": -12.0006103515625, "global_step": 391806, "epoch": 2332} {"train_loss": -12.444753646850586, "global_step": 391807, "epoch": 2332} {"train_loss": -11.746109008789062, "global_step": 391808, "epoch": 2332} {"train_loss": -12.30324649810791, "global_step": 391809, "epoch": 2332} {"train_loss": -12.106910705566406, "global_step": 391810, "epoch": 2332} {"train_loss": -12.00662612915039, "global_step": 391811, "epoch": 2332} {"train_loss": -11.879103660583496, "global_step": 391812, "epoch": 2332} {"train_loss": -12.46757698059082, "global_step": 391813, "epoch": 2332} {"train_loss": -12.074355125427246, "global_step": 391814, "epoch": 2332} {"train_loss": -11.747480392456055, "global_step": 391815, "epoch": 2332} {"train_loss": -12.497507095336914, "global_step": 391816, "epoch": 2332} {"train_loss": -12.218709945678711, "global_step": 391817, "epoch": 2332} {"train_loss": -12.599040985107422, "global_step": 391818, "epoch": 2332} {"train_loss": -12.408706665039062, "global_step": 391819, "epoch": 2332} {"train_loss": -12.507728576660156, "global_step": 391820, "epoch": 2332} {"train_loss": -11.979666709899902, "global_step": 391821, "epoch": 2332} {"train_loss": -12.810430526733398, "global_step": 391822, "epoch": 2332} {"train_loss": -11.773561477661133, "global_step": 391823, "epoch": 2332} {"train_loss": -12.092714309692383, "global_step": 391824, "epoch": 2332} {"train_loss": -12.395669937133789, "global_step": 391825, "epoch": 2332} {"train_loss": -11.995564460754395, "global_step": 391826, "epoch": 2332} {"train_loss": -12.013606071472168, "global_step": 391827, "epoch": 2332} {"train_loss": -12.55400276184082, "global_step": 391828, "epoch": 2332} {"train_loss": -11.978273391723633, "global_step": 391829, "epoch": 2332} {"train_loss": -12.380611419677734, "global_step": 391830, "epoch": 2332} {"train_loss": -12.410202026367188, "global_step": 391831, "epoch": 2332} {"train_loss": -12.495589256286621, "global_step": 391832, "epoch": 2332} {"train_loss": -12.120871543884277, "global_step": 391833, "epoch": 2332} {"train_loss": -12.28963565826416, "global_step": 391834, "epoch": 2332} {"train_loss": -12.14654541015625, "global_step": 391835, "epoch": 2332} {"train_loss": -12.043021202087402, "global_step": 391836, "epoch": 2332} {"train_loss": -12.475382804870605, "global_step": 391837, "epoch": 2332} {"train_loss": -12.043048858642578, "global_step": 391838, "epoch": 2332} {"train_loss": -12.303239822387695, "global_step": 391839, "epoch": 2332} {"train_loss": -12.36825180053711, "global_step": 391840, "epoch": 2332} {"train_loss": -12.093973159790039, "global_step": 391841, "epoch": 2332} {"train_loss": -12.684463500976562, "global_step": 391842, "epoch": 2332} {"train_loss": -12.295169830322266, "global_step": 391843, "epoch": 2332} {"train_loss": -12.221497535705566, "global_step": 391844, "epoch": 2332} {"train_loss": -12.413808822631836, "global_step": 391845, "epoch": 2332} {"train_loss": -12.141149520874023, "global_step": 391846, "epoch": 2332} {"train_loss": -12.19518756866455, "global_step": 391847, "epoch": 2332} {"train_loss": -12.471305847167969, "global_step": 391848, "epoch": 2332} {"train_loss": -11.728721618652344, "global_step": 391849, "epoch": 2332} {"train_loss": -12.48762321472168, "global_step": 391850, "epoch": 2332} {"train_loss": -12.187338829040527, "global_step": 391851, "epoch": 2332} {"train_loss": -12.08791732788086, "global_step": 391852, "epoch": 2332} {"train_loss": -12.163047790527344, "global_step": 391853, "epoch": 2332} {"train_loss": -12.378434181213379, "global_step": 391854, "epoch": 2332} {"train_loss": -12.191814422607422, "global_step": 391855, "epoch": 2332} {"train_loss": -12.29660415649414, "global_step": 391856, "epoch": 2332} {"train_loss": -12.184926986694336, "global_step": 391857, "epoch": 2332} {"train_loss": -12.283363342285156, "global_step": 391858, "epoch": 2332} {"train_loss": -12.765554428100586, "global_step": 391859, "epoch": 2332} {"train_loss": -12.471254348754883, "global_step": 391860, "epoch": 2332} {"train_loss": -12.575787544250488, "global_step": 391861, "epoch": 2332} {"train_loss": -12.623239517211914, "global_step": 391862, "epoch": 2332} {"train_loss": -12.383528709411621, "global_step": 391863, "epoch": 2332} {"train_loss": -11.624798774719238, "global_step": 391864, "epoch": 2332} {"train_loss": -12.230607032775879, "global_step": 391865, "epoch": 2332} {"train_loss": -12.31037712097168, "global_step": 391866, "epoch": 2332} {"train_loss": -12.399085998535156, "global_step": 391867, "epoch": 2332} {"train_loss": -12.319726943969727, "global_step": 391868, "epoch": 2332} {"train_loss": -12.606551170349121, "global_step": 391869, "epoch": 2332} {"train_loss": -12.509773254394531, "global_step": 391870, "epoch": 2332} {"train_loss": -12.18051815032959, "global_step": 391871, "epoch": 2332} {"train_loss": -12.658012390136719, "global_step": 391872, "epoch": 2332} {"train_loss": -12.031875610351562, "global_step": 391873, "epoch": 2332} {"train_loss": -12.244075775146484, "global_step": 391874, "epoch": 2332} {"train_loss": -12.47854232788086, "global_step": 391875, "epoch": 2332} {"train_loss": -11.881590843200684, "global_step": 391876, "epoch": 2332} {"train_loss": -12.227618217468262, "global_step": 391877, "epoch": 2332} {"train_loss": -12.365060806274414, "global_step": 391878, "epoch": 2332} {"train_loss": -11.716243743896484, "global_step": 391879, "epoch": 2332} {"train_loss": -11.909833908081055, "global_step": 391880, "epoch": 2332} {"train_loss": -11.770726203918457, "global_step": 391881, "epoch": 2332} {"train_loss": -12.064349174499512, "global_step": 391882, "epoch": 2332} {"train_loss": -11.43832015991211, "global_step": 391883, "epoch": 2332} {"train_loss": -11.372530937194824, "global_step": 391884, "epoch": 2332} {"train_loss": -11.592809677124023, "global_step": 391885, "epoch": 2332} {"train_loss": -10.189262390136719, "global_step": 391886, "epoch": 2332} {"train_loss": -10.919584274291992, "global_step": 391887, "epoch": 2332} {"train_loss": -11.21004867553711, "global_step": 391888, "epoch": 2332} {"train_loss": -9.682127952575684, "global_step": 391889, "epoch": 2332} {"train_loss": -8.918768882751465, "global_step": 391890, "epoch": 2332} {"train_loss": -11.773943901062012, "global_step": 391891, "epoch": 2332} {"train_loss": -7.360297203063965, "global_step": 391892, "epoch": 2332} {"train_loss": -7.446992874145508, "global_step": 391893, "epoch": 2332} {"train_loss": -10.638005256652832, "global_step": 391894, "epoch": 2332} {"train_loss": -6.0492682456970215, "global_step": 391895, "epoch": 2332} {"train_loss": -7.254641056060791, "global_step": 391896, "epoch": 2332} {"train_loss": -6.049957275390625, "global_step": 391897, "epoch": 2332} {"train_loss": -5.9990363121032715, "global_step": 391898, "epoch": 2332} {"train_loss": -5.691308498382568, "global_step": 391899, "epoch": 2332} {"train_loss": -5.857817649841309, "global_step": 391900, "epoch": 2332} {"train_loss": -6.784500598907471, "global_step": 391901, "epoch": 2332} {"train_loss": -7.735964298248291, "global_step": 391902, "epoch": 2332} {"train_loss": -7.122204303741455, "global_step": 391903, "epoch": 2332} {"train_loss": -7.165876388549805, "global_step": 391904, "epoch": 2332} {"train_loss": -7.675078392028809, "global_step": 391905, "epoch": 2332} {"train_loss": -7.765287399291992, "global_step": 391906, "epoch": 2332} {"train_loss": -8.169973373413086, "global_step": 391907, "epoch": 2332} {"train_loss": -8.44200325012207, "global_step": 391908, "epoch": 2332} {"train_loss": -8.720295906066895, "global_step": 391909, "epoch": 2332} {"train_loss": -8.712300300598145, "global_step": 391910, "epoch": 2332} {"train_loss": -8.718921661376953, "global_step": 391911, "epoch": 2332} {"train_loss": -7.89883279800415, "global_step": 391912, "epoch": 2332} {"train_loss": -9.112361907958984, "global_step": 391913, "epoch": 2332} {"train_loss": -9.479612350463867, "global_step": 391914, "epoch": 2332} {"train_loss": -9.803561210632324, "global_step": 391915, "epoch": 2332} {"train_loss": -9.107763290405273, "global_step": 391916, "epoch": 2332} {"train_loss": -8.883230209350586, "global_step": 391917, "epoch": 2332} {"train_loss": -8.422647476196289, "global_step": 391918, "epoch": 2332} {"train_loss": -9.793609619140625, "global_step": 391919, "epoch": 2332} {"train_loss": -9.575315475463867, "global_step": 391920, "epoch": 2332} {"train_loss": -8.27000904083252, "global_step": 391921, "epoch": 2332} {"train_loss": -8.878475189208984, "global_step": 391922, "epoch": 2332} {"train_loss": -9.122812271118164, "global_step": 391923, "epoch": 2332} {"train_loss": -9.953237533569336, "global_step": 391924, "epoch": 2332} {"train_loss": -9.9086275100708, "global_step": 391925, "epoch": 2332} {"train_loss": -9.67755126953125, "global_step": 391926, "epoch": 2332} {"train_loss": -9.62060546875, "global_step": 391927, "epoch": 2332} {"train_loss": -10.436461448669434, "global_step": 391928, "epoch": 2332} {"train_loss": -11.007806777954102, "global_step": 391929, "epoch": 2332} {"train_loss": -10.327840805053711, "global_step": 391930, "epoch": 2332} {"train_loss": -11.610857009887695, "global_step": 391931, "epoch": 2332} {"train_loss": -10.392548561096191, "global_step": 391932, "epoch": 2332} {"train_loss": -11.387577056884766, "global_step": 391933, "epoch": 2332} {"train_loss": -11.139885902404785, "global_step": 391934, "epoch": 2332} {"train_loss": -11.108055114746094, "global_step": 391935, "epoch": 2332} {"train_loss": -11.167994499206543, "global_step": 391936, "epoch": 2332} {"train_loss": -11.39876651763916, "global_step": 391937, "epoch": 2332} {"train_loss": -11.439152717590332, "global_step": 391938, "epoch": 2332} {"train_loss": -11.095016479492188, "global_step": 391939, "epoch": 2332} {"train_loss": -11.867984771728516, "global_step": 391940, "epoch": 2332} {"train_loss": -11.312972068786621, "global_step": 391941, "epoch": 2332} {"train_loss": -11.737373352050781, "global_step": 391942, "epoch": 2332} {"train_loss": -11.218679944674173, "global_step": 391943, "epoch": 2332, "val_loss": 299004.5} {"train_loss": -11.801105499267578, "global_step": 391944, "epoch": 2333} {"train_loss": -11.844284057617188, "global_step": 391945, "epoch": 2333} {"train_loss": -11.740142822265625, "global_step": 391946, "epoch": 2333} {"train_loss": -11.64200210571289, "global_step": 391947, "epoch": 2333} {"train_loss": -11.593210220336914, "global_step": 391948, "epoch": 2333} {"train_loss": -11.743684768676758, "global_step": 391949, "epoch": 2333} {"train_loss": -11.568218231201172, "global_step": 391950, "epoch": 2333} {"train_loss": -11.788403511047363, "global_step": 391951, "epoch": 2333} {"train_loss": -12.123784065246582, "global_step": 391952, "epoch": 2333} {"train_loss": -11.871840476989746, "global_step": 391953, "epoch": 2333} {"train_loss": -12.0629243850708, "global_step": 391954, "epoch": 2333} {"train_loss": -11.965850830078125, "global_step": 391955, "epoch": 2333} {"train_loss": -11.711544036865234, "global_step": 391956, "epoch": 2333} {"train_loss": -12.266783714294434, "global_step": 391957, "epoch": 2333} {"train_loss": -12.004182815551758, "global_step": 391958, "epoch": 2333} {"train_loss": -12.150981903076172, "global_step": 391959, "epoch": 2333} {"train_loss": -12.298442840576172, "global_step": 391960, "epoch": 2333} {"train_loss": -12.147477149963379, "global_step": 391961, "epoch": 2333} {"train_loss": -12.07133674621582, "global_step": 391962, "epoch": 2333} {"train_loss": -12.01962661743164, "global_step": 391963, "epoch": 2333} {"train_loss": -12.001407623291016, "global_step": 391964, "epoch": 2333} {"train_loss": -12.114700317382812, "global_step": 391965, "epoch": 2333} {"train_loss": -12.294733047485352, "global_step": 391966, "epoch": 2333} {"train_loss": -12.327386856079102, "global_step": 391967, "epoch": 2333} {"train_loss": -12.153223037719727, "global_step": 391968, "epoch": 2333} {"train_loss": -12.206274032592773, "global_step": 391969, "epoch": 2333} {"train_loss": -12.210885047912598, "global_step": 391970, "epoch": 2333} {"train_loss": -12.327839851379395, "global_step": 391971, "epoch": 2333} {"train_loss": -12.292706489562988, "global_step": 391972, "epoch": 2333} {"train_loss": -12.184675216674805, "global_step": 391973, "epoch": 2333} {"train_loss": -12.475765228271484, "global_step": 391974, "epoch": 2333} {"train_loss": -12.16653060913086, "global_step": 391975, "epoch": 2333} {"train_loss": -12.295084953308105, "global_step": 391976, "epoch": 2333} {"train_loss": -12.359097480773926, "global_step": 391977, "epoch": 2333} {"train_loss": -12.23865795135498, "global_step": 391978, "epoch": 2333} {"train_loss": -12.338136672973633, "global_step": 391979, "epoch": 2333} {"train_loss": -12.395919799804688, "global_step": 391980, "epoch": 2333} {"train_loss": -12.325135231018066, "global_step": 391981, "epoch": 2333} {"train_loss": -12.380534172058105, "global_step": 391982, "epoch": 2333} {"train_loss": -11.861082077026367, "global_step": 391983, "epoch": 2333} {"train_loss": -12.471923828125, "global_step": 391984, "epoch": 2333} {"train_loss": -12.512227058410645, "global_step": 391985, "epoch": 2333} {"train_loss": -12.563752174377441, "global_step": 391986, "epoch": 2333} {"train_loss": -12.489895820617676, "global_step": 391987, "epoch": 2333} {"train_loss": -12.42991828918457, "global_step": 391988, "epoch": 2333} {"train_loss": -12.619999885559082, "global_step": 391989, "epoch": 2333} {"train_loss": -12.536520004272461, "global_step": 391990, "epoch": 2333} {"train_loss": -12.600959777832031, "global_step": 391991, "epoch": 2333} {"train_loss": -12.504344940185547, "global_step": 391992, "epoch": 2333} {"train_loss": -12.578628540039062, "global_step": 391993, "epoch": 2333} {"train_loss": -12.653483390808105, "global_step": 391994, "epoch": 2333} {"train_loss": -12.559647560119629, "global_step": 391995, "epoch": 2333} {"train_loss": -12.483223915100098, "global_step": 391996, "epoch": 2333} {"train_loss": -12.577518463134766, "global_step": 391997, "epoch": 2333} {"train_loss": -12.590721130371094, "global_step": 391998, "epoch": 2333} {"train_loss": -12.680476188659668, "global_step": 391999, "epoch": 2333} {"train_loss": -12.471281051635742, "global_step": 392000, "epoch": 2333} {"train_loss": -12.622687339782715, "global_step": 392001, "epoch": 2333} {"train_loss": -12.713624954223633, "global_step": 392002, "epoch": 2333} {"train_loss": -12.409600257873535, "global_step": 392003, "epoch": 2333} {"train_loss": -12.597776412963867, "global_step": 392004, "epoch": 2333} {"train_loss": -12.470109939575195, "global_step": 392005, "epoch": 2333} {"train_loss": -12.62022590637207, "global_step": 392006, "epoch": 2333} {"train_loss": -12.371530532836914, "global_step": 392007, "epoch": 2333} {"train_loss": -12.518826484680176, "global_step": 392008, "epoch": 2333} {"train_loss": -12.61557388305664, "global_step": 392009, "epoch": 2333} {"train_loss": -12.508318901062012, "global_step": 392010, "epoch": 2333} {"train_loss": -12.402326583862305, "global_step": 392011, "epoch": 2333} {"train_loss": -12.493693351745605, "global_step": 392012, "epoch": 2333} {"train_loss": -12.750114440917969, "global_step": 392013, "epoch": 2333} {"train_loss": -12.342744827270508, "global_step": 392014, "epoch": 2333} {"train_loss": -12.717337608337402, "global_step": 392015, "epoch": 2333} {"train_loss": -12.578192710876465, "global_step": 392016, "epoch": 2333} {"train_loss": -12.693435668945312, "global_step": 392017, "epoch": 2333} {"train_loss": -12.309502601623535, "global_step": 392018, "epoch": 2333} {"train_loss": -12.66874885559082, "global_step": 392019, "epoch": 2333} {"train_loss": -12.476318359375, "global_step": 392020, "epoch": 2333} {"train_loss": -12.537856101989746, "global_step": 392021, "epoch": 2333} {"train_loss": -12.675235748291016, "global_step": 392022, "epoch": 2333} {"train_loss": -12.543322563171387, "global_step": 392023, "epoch": 2333} {"train_loss": -12.677116394042969, "global_step": 392024, "epoch": 2333} {"train_loss": -12.106891632080078, "global_step": 392025, "epoch": 2333} {"train_loss": -12.334137916564941, "global_step": 392026, "epoch": 2333} {"train_loss": -12.319091796875, "global_step": 392027, "epoch": 2333} {"train_loss": -12.051605224609375, "global_step": 392028, "epoch": 2333} {"train_loss": -12.660017967224121, "global_step": 392029, "epoch": 2333} {"train_loss": -12.522909164428711, "global_step": 392030, "epoch": 2333} {"train_loss": -11.494569778442383, "global_step": 392031, "epoch": 2333} {"train_loss": -12.48819351196289, "global_step": 392032, "epoch": 2333} {"train_loss": -12.225422859191895, "global_step": 392033, "epoch": 2333} {"train_loss": -12.035801887512207, "global_step": 392034, "epoch": 2333} {"train_loss": -12.362983703613281, "global_step": 392035, "epoch": 2333} {"train_loss": -12.25146198272705, "global_step": 392036, "epoch": 2333} {"train_loss": -12.161974906921387, "global_step": 392037, "epoch": 2333} {"train_loss": -12.422319412231445, "global_step": 392038, "epoch": 2333} {"train_loss": -11.333220481872559, "global_step": 392039, "epoch": 2333} {"train_loss": -12.049744606018066, "global_step": 392040, "epoch": 2333} {"train_loss": -11.954181671142578, "global_step": 392041, "epoch": 2333} {"train_loss": -10.91716194152832, "global_step": 392042, "epoch": 2333} {"train_loss": -11.649616241455078, "global_step": 392043, "epoch": 2333} {"train_loss": -10.758609771728516, "global_step": 392044, "epoch": 2333} {"train_loss": -11.278322219848633, "global_step": 392045, "epoch": 2333} {"train_loss": -12.228031158447266, "global_step": 392046, "epoch": 2333} {"train_loss": -11.666373252868652, "global_step": 392047, "epoch": 2333} {"train_loss": -11.852518081665039, "global_step": 392048, "epoch": 2333} {"train_loss": -11.78381061553955, "global_step": 392049, "epoch": 2333} {"train_loss": -12.220505714416504, "global_step": 392050, "epoch": 2333} {"train_loss": -12.202237129211426, "global_step": 392051, "epoch": 2333} {"train_loss": -12.288151741027832, "global_step": 392052, "epoch": 2333} {"train_loss": -11.791568756103516, "global_step": 392053, "epoch": 2333} {"train_loss": -12.250232696533203, "global_step": 392054, "epoch": 2333} {"train_loss": -12.076810836791992, "global_step": 392055, "epoch": 2333} {"train_loss": -12.510411262512207, "global_step": 392056, "epoch": 2333} {"train_loss": -11.608987808227539, "global_step": 392057, "epoch": 2333} {"train_loss": -12.319388389587402, "global_step": 392058, "epoch": 2333} {"train_loss": -11.953676223754883, "global_step": 392059, "epoch": 2333} {"train_loss": -11.998374938964844, "global_step": 392060, "epoch": 2333} {"train_loss": -11.43617057800293, "global_step": 392061, "epoch": 2333} {"train_loss": -11.87964916229248, "global_step": 392062, "epoch": 2333} {"train_loss": -11.94346809387207, "global_step": 392063, "epoch": 2333} {"train_loss": -12.537805557250977, "global_step": 392064, "epoch": 2333} {"train_loss": -12.213767051696777, "global_step": 392065, "epoch": 2333} {"train_loss": -12.148690223693848, "global_step": 392066, "epoch": 2333} {"train_loss": -12.127386093139648, "global_step": 392067, "epoch": 2333} {"train_loss": -12.26760482788086, "global_step": 392068, "epoch": 2333} {"train_loss": -12.551492691040039, "global_step": 392069, "epoch": 2333} {"train_loss": -12.01502513885498, "global_step": 392070, "epoch": 2333} {"train_loss": -12.045342445373535, "global_step": 392071, "epoch": 2333} {"train_loss": -11.8075590133667, "global_step": 392072, "epoch": 2333} {"train_loss": -12.021312713623047, "global_step": 392073, "epoch": 2333} {"train_loss": -11.791340827941895, "global_step": 392074, "epoch": 2333} {"train_loss": -11.536596298217773, "global_step": 392075, "epoch": 2333} {"train_loss": -12.415935516357422, "global_step": 392076, "epoch": 2333} {"train_loss": -11.490307807922363, "global_step": 392077, "epoch": 2333} {"train_loss": -12.320669174194336, "global_step": 392078, "epoch": 2333} {"train_loss": -11.768655776977539, "global_step": 392079, "epoch": 2333} {"train_loss": -12.607484817504883, "global_step": 392080, "epoch": 2333} {"train_loss": -12.25208568572998, "global_step": 392081, "epoch": 2333} {"train_loss": -12.06460952758789, "global_step": 392082, "epoch": 2333} {"train_loss": -12.366453170776367, "global_step": 392083, "epoch": 2333} {"train_loss": -11.699739456176758, "global_step": 392084, "epoch": 2333} {"train_loss": -12.349376678466797, "global_step": 392085, "epoch": 2333} {"train_loss": -11.43893814086914, "global_step": 392086, "epoch": 2333} {"train_loss": -11.372501373291016, "global_step": 392087, "epoch": 2333} {"train_loss": -11.961994171142578, "global_step": 392088, "epoch": 2333} {"train_loss": -11.497642517089844, "global_step": 392089, "epoch": 2333} {"train_loss": -11.939620971679688, "global_step": 392090, "epoch": 2333} {"train_loss": -11.943136215209961, "global_step": 392091, "epoch": 2333} {"train_loss": -12.054073333740234, "global_step": 392092, "epoch": 2333} {"train_loss": -11.555587768554688, "global_step": 392093, "epoch": 2333} {"train_loss": -12.2347993850708, "global_step": 392094, "epoch": 2333} {"train_loss": -11.869649887084961, "global_step": 392095, "epoch": 2333} {"train_loss": -12.101179122924805, "global_step": 392096, "epoch": 2333} {"train_loss": -11.382499694824219, "global_step": 392097, "epoch": 2333} {"train_loss": -12.180095672607422, "global_step": 392098, "epoch": 2333} {"train_loss": -12.095462799072266, "global_step": 392099, "epoch": 2333} {"train_loss": -12.050745964050293, "global_step": 392100, "epoch": 2333} {"train_loss": -12.019267082214355, "global_step": 392101, "epoch": 2333} {"train_loss": -11.977470397949219, "global_step": 392102, "epoch": 2333} {"train_loss": -11.956108093261719, "global_step": 392103, "epoch": 2333} {"train_loss": -11.907881736755371, "global_step": 392104, "epoch": 2333} {"train_loss": -12.31822681427002, "global_step": 392105, "epoch": 2333} {"train_loss": -12.231477737426758, "global_step": 392106, "epoch": 2333} {"train_loss": -11.648069381713867, "global_step": 392107, "epoch": 2333} {"train_loss": -11.965686798095703, "global_step": 392108, "epoch": 2333} {"train_loss": -12.126876831054688, "global_step": 392109, "epoch": 2333} {"train_loss": -12.256792068481445, "global_step": 392110, "epoch": 2333} {"train_loss": -12.15262912568592, "global_step": 392111, "epoch": 2333, "val_loss": 298485.28125} {"train_loss": -12.010110855102539, "global_step": 392112, "epoch": 2334} {"train_loss": -11.729206085205078, "global_step": 392113, "epoch": 2334} {"train_loss": -12.246301651000977, "global_step": 392114, "epoch": 2334} {"train_loss": -11.384288787841797, "global_step": 392115, "epoch": 2334} {"train_loss": -12.168802261352539, "global_step": 392116, "epoch": 2334} {"train_loss": -11.991806030273438, "global_step": 392117, "epoch": 2334} {"train_loss": -12.231853485107422, "global_step": 392118, "epoch": 2334} {"train_loss": -12.17082691192627, "global_step": 392119, "epoch": 2334} {"train_loss": -12.292403221130371, "global_step": 392120, "epoch": 2334} {"train_loss": -12.278013229370117, "global_step": 392121, "epoch": 2334} {"train_loss": -12.032381057739258, "global_step": 392122, "epoch": 2334} {"train_loss": -12.08385944366455, "global_step": 392123, "epoch": 2334} {"train_loss": -11.830001831054688, "global_step": 392124, "epoch": 2334} {"train_loss": -12.066308975219727, "global_step": 392125, "epoch": 2334} {"train_loss": -12.115750312805176, "global_step": 392126, "epoch": 2334} {"train_loss": -11.92599868774414, "global_step": 392127, "epoch": 2334} {"train_loss": -11.106514930725098, "global_step": 392128, "epoch": 2334} {"train_loss": -11.705049514770508, "global_step": 392129, "epoch": 2334} {"train_loss": -12.14941692352295, "global_step": 392130, "epoch": 2334} {"train_loss": -11.82929515838623, "global_step": 392131, "epoch": 2334} {"train_loss": -12.215370178222656, "global_step": 392132, "epoch": 2334} {"train_loss": -11.433664321899414, "global_step": 392133, "epoch": 2334} {"train_loss": -12.243818283081055, "global_step": 392134, "epoch": 2334} {"train_loss": -11.6579008102417, "global_step": 392135, "epoch": 2334} {"train_loss": -12.467621803283691, "global_step": 392136, "epoch": 2334} {"train_loss": -11.713966369628906, "global_step": 392137, "epoch": 2334} {"train_loss": -11.841633796691895, "global_step": 392138, "epoch": 2334} {"train_loss": -12.181598663330078, "global_step": 392139, "epoch": 2334} {"train_loss": -11.901351928710938, "global_step": 392140, "epoch": 2334} {"train_loss": -12.171989440917969, "global_step": 392141, "epoch": 2334} {"train_loss": -12.007465362548828, "global_step": 392142, "epoch": 2334} {"train_loss": -12.404874801635742, "global_step": 392143, "epoch": 2334} {"train_loss": -11.746086120605469, "global_step": 392144, "epoch": 2334} {"train_loss": -12.284290313720703, "global_step": 392145, "epoch": 2334} {"train_loss": -11.797140121459961, "global_step": 392146, "epoch": 2334} {"train_loss": -11.921290397644043, "global_step": 392147, "epoch": 2334} {"train_loss": -11.790241241455078, "global_step": 392148, "epoch": 2334} {"train_loss": -11.954798698425293, "global_step": 392149, "epoch": 2334} {"train_loss": -12.035106658935547, "global_step": 392150, "epoch": 2334} {"train_loss": -12.048613548278809, "global_step": 392151, "epoch": 2334} {"train_loss": -12.518024444580078, "global_step": 392152, "epoch": 2334} {"train_loss": -12.014179229736328, "global_step": 392153, "epoch": 2334} {"train_loss": -12.435718536376953, "global_step": 392154, "epoch": 2334} {"train_loss": -12.310832977294922, "global_step": 392155, "epoch": 2334} {"train_loss": -12.42740535736084, "global_step": 392156, "epoch": 2334} {"train_loss": -12.289268493652344, "global_step": 392157, "epoch": 2334} {"train_loss": -12.244224548339844, "global_step": 392158, "epoch": 2334} {"train_loss": -12.423879623413086, "global_step": 392159, "epoch": 2334} {"train_loss": -12.44659423828125, "global_step": 392160, "epoch": 2334} {"train_loss": -12.267715454101562, "global_step": 392161, "epoch": 2334} {"train_loss": -12.496192932128906, "global_step": 392162, "epoch": 2334} {"train_loss": -12.524374008178711, "global_step": 392163, "epoch": 2334} {"train_loss": -12.68753433227539, "global_step": 392164, "epoch": 2334} {"train_loss": -12.25977611541748, "global_step": 392165, "epoch": 2334} {"train_loss": -12.21431827545166, "global_step": 392166, "epoch": 2334} {"train_loss": -12.043201446533203, "global_step": 392167, "epoch": 2334} {"train_loss": -12.45073413848877, "global_step": 392168, "epoch": 2334} {"train_loss": -12.009387969970703, "global_step": 392169, "epoch": 2334} {"train_loss": -12.370293617248535, "global_step": 392170, "epoch": 2334} {"train_loss": -12.40774917602539, "global_step": 392171, "epoch": 2334} {"train_loss": -12.349479675292969, "global_step": 392172, "epoch": 2334} {"train_loss": -11.751964569091797, "global_step": 392173, "epoch": 2334} {"train_loss": -12.631795883178711, "global_step": 392174, "epoch": 2334} {"train_loss": -12.240915298461914, "global_step": 392175, "epoch": 2334} {"train_loss": -12.23678207397461, "global_step": 392176, "epoch": 2334} {"train_loss": -12.46361255645752, "global_step": 392177, "epoch": 2334} {"train_loss": -12.277570724487305, "global_step": 392178, "epoch": 2334} {"train_loss": -12.362245559692383, "global_step": 392179, "epoch": 2334} {"train_loss": -12.271942138671875, "global_step": 392180, "epoch": 2334} {"train_loss": -12.294471740722656, "global_step": 392181, "epoch": 2334} {"train_loss": -12.68881893157959, "global_step": 392182, "epoch": 2334} {"train_loss": -12.046167373657227, "global_step": 392183, "epoch": 2334} {"train_loss": -12.132280349731445, "global_step": 392184, "epoch": 2334} {"train_loss": -12.191953659057617, "global_step": 392185, "epoch": 2334} {"train_loss": -12.358777046203613, "global_step": 392186, "epoch": 2334} {"train_loss": -11.817607879638672, "global_step": 392187, "epoch": 2334} {"train_loss": -12.03251838684082, "global_step": 392188, "epoch": 2334} {"train_loss": -12.523423194885254, "global_step": 392189, "epoch": 2334} {"train_loss": -11.797938346862793, "global_step": 392190, "epoch": 2334} {"train_loss": -10.929855346679688, "global_step": 392191, "epoch": 2334} {"train_loss": -10.841289520263672, "global_step": 392192, "epoch": 2334} {"train_loss": -12.521998405456543, "global_step": 392193, "epoch": 2334} {"train_loss": -11.458623886108398, "global_step": 392194, "epoch": 2334} {"train_loss": -10.035346984863281, "global_step": 392195, "epoch": 2334} {"train_loss": -12.293421745300293, "global_step": 392196, "epoch": 2334} {"train_loss": -8.796131134033203, "global_step": 392197, "epoch": 2334} {"train_loss": -9.867984771728516, "global_step": 392198, "epoch": 2334} {"train_loss": -8.838926315307617, "global_step": 392199, "epoch": 2334} {"train_loss": -8.32769775390625, "global_step": 392200, "epoch": 2334} {"train_loss": -8.22979736328125, "global_step": 392201, "epoch": 2334} {"train_loss": -8.933984756469727, "global_step": 392202, "epoch": 2334} {"train_loss": -10.804033279418945, "global_step": 392203, "epoch": 2334} {"train_loss": -10.08565902709961, "global_step": 392204, "epoch": 2334} {"train_loss": -10.25786018371582, "global_step": 392205, "epoch": 2334} {"train_loss": -11.623079299926758, "global_step": 392206, "epoch": 2334} {"train_loss": -10.768784523010254, "global_step": 392207, "epoch": 2334} {"train_loss": -10.388250350952148, "global_step": 392208, "epoch": 2334} {"train_loss": -10.707534790039062, "global_step": 392209, "epoch": 2334} {"train_loss": -10.722167015075684, "global_step": 392210, "epoch": 2334} {"train_loss": -11.235504150390625, "global_step": 392211, "epoch": 2334} {"train_loss": -10.539753913879395, "global_step": 392212, "epoch": 2334} {"train_loss": -10.665977478027344, "global_step": 392213, "epoch": 2334} {"train_loss": -10.238740921020508, "global_step": 392214, "epoch": 2334} {"train_loss": -10.652505874633789, "global_step": 392215, "epoch": 2334} {"train_loss": -11.723173141479492, "global_step": 392216, "epoch": 2334} {"train_loss": -10.458301544189453, "global_step": 392217, "epoch": 2334} {"train_loss": -11.493268966674805, "global_step": 392218, "epoch": 2334} {"train_loss": -11.212471008300781, "global_step": 392219, "epoch": 2334} {"train_loss": -10.941287994384766, "global_step": 392220, "epoch": 2334} {"train_loss": -11.557075500488281, "global_step": 392221, "epoch": 2334} {"train_loss": -10.8948974609375, "global_step": 392222, "epoch": 2334} {"train_loss": -11.677571296691895, "global_step": 392223, "epoch": 2334} {"train_loss": -11.138497352600098, "global_step": 392224, "epoch": 2334} {"train_loss": -11.142815589904785, "global_step": 392225, "epoch": 2334} {"train_loss": -11.682896614074707, "global_step": 392226, "epoch": 2334} {"train_loss": -11.522478103637695, "global_step": 392227, "epoch": 2334} {"train_loss": -11.8575439453125, "global_step": 392228, "epoch": 2334} {"train_loss": -11.715072631835938, "global_step": 392229, "epoch": 2334} {"train_loss": -11.196419715881348, "global_step": 392230, "epoch": 2334} {"train_loss": -12.106587409973145, "global_step": 392231, "epoch": 2334} {"train_loss": -11.175762176513672, "global_step": 392232, "epoch": 2334} {"train_loss": -11.972406387329102, "global_step": 392233, "epoch": 2334} {"train_loss": -11.734184265136719, "global_step": 392234, "epoch": 2334} {"train_loss": -11.083965301513672, "global_step": 392235, "epoch": 2334} {"train_loss": -12.107414245605469, "global_step": 392236, "epoch": 2334} {"train_loss": -11.212455749511719, "global_step": 392237, "epoch": 2334} {"train_loss": -12.084197998046875, "global_step": 392238, "epoch": 2334} {"train_loss": -11.611440658569336, "global_step": 392239, "epoch": 2334} {"train_loss": -11.379646301269531, "global_step": 392240, "epoch": 2334} {"train_loss": -11.895516395568848, "global_step": 392241, "epoch": 2334} {"train_loss": -11.401552200317383, "global_step": 392242, "epoch": 2334} {"train_loss": -12.356013298034668, "global_step": 392243, "epoch": 2334} {"train_loss": -11.816779136657715, "global_step": 392244, "epoch": 2334} {"train_loss": -12.201101303100586, "global_step": 392245, "epoch": 2334} {"train_loss": -11.96074390411377, "global_step": 392246, "epoch": 2334} {"train_loss": -12.049772262573242, "global_step": 392247, "epoch": 2334} {"train_loss": -12.013094902038574, "global_step": 392248, "epoch": 2334} {"train_loss": -12.173908233642578, "global_step": 392249, "epoch": 2334} {"train_loss": -12.393115043640137, "global_step": 392250, "epoch": 2334} {"train_loss": -12.403968811035156, "global_step": 392251, "epoch": 2334} {"train_loss": -12.431769371032715, "global_step": 392252, "epoch": 2334} {"train_loss": -12.370312690734863, "global_step": 392253, "epoch": 2334} {"train_loss": -12.219797134399414, "global_step": 392254, "epoch": 2334} {"train_loss": -12.188102722167969, "global_step": 392255, "epoch": 2334} {"train_loss": -12.468969345092773, "global_step": 392256, "epoch": 2334} {"train_loss": -12.407270431518555, "global_step": 392257, "epoch": 2334} {"train_loss": -12.414971351623535, "global_step": 392258, "epoch": 2334} {"train_loss": -12.561101913452148, "global_step": 392259, "epoch": 2334} {"train_loss": -12.349668502807617, "global_step": 392260, "epoch": 2334} {"train_loss": -12.331223487854004, "global_step": 392261, "epoch": 2334} {"train_loss": -12.470697402954102, "global_step": 392262, "epoch": 2334} {"train_loss": -12.506507873535156, "global_step": 392263, "epoch": 2334} {"train_loss": -12.532376289367676, "global_step": 392264, "epoch": 2334} {"train_loss": -12.713417053222656, "global_step": 392265, "epoch": 2334} {"train_loss": -12.513718605041504, "global_step": 392266, "epoch": 2334} {"train_loss": -12.405138969421387, "global_step": 392267, "epoch": 2334} {"train_loss": -12.610982894897461, "global_step": 392268, "epoch": 2334} {"train_loss": -12.446259498596191, "global_step": 392269, "epoch": 2334} {"train_loss": -12.681407928466797, "global_step": 392270, "epoch": 2334} {"train_loss": -12.410812377929688, "global_step": 392271, "epoch": 2334} {"train_loss": -12.697613716125488, "global_step": 392272, "epoch": 2334} {"train_loss": -12.498479843139648, "global_step": 392273, "epoch": 2334} {"train_loss": -12.608976364135742, "global_step": 392274, "epoch": 2334} {"train_loss": -12.739387512207031, "global_step": 392275, "epoch": 2334} {"train_loss": -12.660992622375488, "global_step": 392276, "epoch": 2334} {"train_loss": -12.744050979614258, "global_step": 392277, "epoch": 2334} {"train_loss": -12.381651878356934, "global_step": 392278, "epoch": 2334} {"train_loss": -11.8295753740129, "global_step": 392279, "epoch": 2334, "val_loss": 296623.65625} {"train_loss": -12.435022354125977, "global_step": 392280, "epoch": 2335} {"train_loss": -12.356466293334961, "global_step": 392281, "epoch": 2335} {"train_loss": -12.370111465454102, "global_step": 392282, "epoch": 2335} {"train_loss": -12.034481048583984, "global_step": 392283, "epoch": 2335} {"train_loss": -12.194005966186523, "global_step": 392284, "epoch": 2335} {"train_loss": -12.516059875488281, "global_step": 392285, "epoch": 2335} {"train_loss": -12.42841625213623, "global_step": 392286, "epoch": 2335} {"train_loss": -12.471750259399414, "global_step": 392287, "epoch": 2335} {"train_loss": -12.256843566894531, "global_step": 392288, "epoch": 2335} {"train_loss": -12.356819152832031, "global_step": 392289, "epoch": 2335} {"train_loss": -12.457645416259766, "global_step": 392290, "epoch": 2335} {"train_loss": -12.42648983001709, "global_step": 392291, "epoch": 2335} {"train_loss": -12.405200958251953, "global_step": 392292, "epoch": 2335} {"train_loss": -12.00691032409668, "global_step": 392293, "epoch": 2335} {"train_loss": -12.256353378295898, "global_step": 392294, "epoch": 2335} {"train_loss": -12.296464920043945, "global_step": 392295, "epoch": 2335} {"train_loss": -12.213020324707031, "global_step": 392296, "epoch": 2335} {"train_loss": -12.02834701538086, "global_step": 392297, "epoch": 2335} {"train_loss": -12.632636070251465, "global_step": 392298, "epoch": 2335} {"train_loss": -10.633638381958008, "global_step": 392299, "epoch": 2335} {"train_loss": -12.218871116638184, "global_step": 392300, "epoch": 2335} {"train_loss": -11.115991592407227, "global_step": 392301, "epoch": 2335} {"train_loss": -11.000886917114258, "global_step": 392302, "epoch": 2335} {"train_loss": -10.668278694152832, "global_step": 392303, "epoch": 2335} {"train_loss": -10.383265495300293, "global_step": 392304, "epoch": 2335} {"train_loss": -11.692098617553711, "global_step": 392305, "epoch": 2335} {"train_loss": -12.133541107177734, "global_step": 392306, "epoch": 2335} {"train_loss": -11.36333179473877, "global_step": 392307, "epoch": 2335} {"train_loss": -12.294503211975098, "global_step": 392308, "epoch": 2335} {"train_loss": -11.801836967468262, "global_step": 392309, "epoch": 2335} {"train_loss": -12.017099380493164, "global_step": 392310, "epoch": 2335} {"train_loss": -12.009918212890625, "global_step": 392311, "epoch": 2335} {"train_loss": -12.267619132995605, "global_step": 392312, "epoch": 2335} {"train_loss": -11.523996353149414, "global_step": 392313, "epoch": 2335} {"train_loss": -12.243596076965332, "global_step": 392314, "epoch": 2335} {"train_loss": -12.218181610107422, "global_step": 392315, "epoch": 2335} {"train_loss": -11.996274948120117, "global_step": 392316, "epoch": 2335} {"train_loss": -11.599350929260254, "global_step": 392317, "epoch": 2335} {"train_loss": -11.90218734741211, "global_step": 392318, "epoch": 2335} {"train_loss": -12.24189567565918, "global_step": 392319, "epoch": 2335} {"train_loss": -12.29017448425293, "global_step": 392320, "epoch": 2335} {"train_loss": -12.173025131225586, "global_step": 392321, "epoch": 2335} {"train_loss": -12.31246280670166, "global_step": 392322, "epoch": 2335} {"train_loss": -12.394425392150879, "global_step": 392323, "epoch": 2335} {"train_loss": -11.98253345489502, "global_step": 392324, "epoch": 2335} {"train_loss": -12.37499713897705, "global_step": 392325, "epoch": 2335} {"train_loss": -12.191774368286133, "global_step": 392326, "epoch": 2335} {"train_loss": -12.120195388793945, "global_step": 392327, "epoch": 2335} {"train_loss": -12.443763732910156, "global_step": 392328, "epoch": 2335} {"train_loss": -12.535083770751953, "global_step": 392329, "epoch": 2335} {"train_loss": -12.25097942352295, "global_step": 392330, "epoch": 2335} {"train_loss": -11.980259895324707, "global_step": 392331, "epoch": 2335} {"train_loss": -12.453250885009766, "global_step": 392332, "epoch": 2335} {"train_loss": -12.350912094116211, "global_step": 392333, "epoch": 2335} {"train_loss": -11.931822776794434, "global_step": 392334, "epoch": 2335} {"train_loss": -12.766080856323242, "global_step": 392335, "epoch": 2335} {"train_loss": -12.044720649719238, "global_step": 392336, "epoch": 2335} {"train_loss": -11.983550071716309, "global_step": 392337, "epoch": 2335} {"train_loss": -12.47950553894043, "global_step": 392338, "epoch": 2335} {"train_loss": -12.385236740112305, "global_step": 392339, "epoch": 2335} {"train_loss": -12.222026824951172, "global_step": 392340, "epoch": 2335} {"train_loss": -12.67886734008789, "global_step": 392341, "epoch": 2335} {"train_loss": -12.085314750671387, "global_step": 392342, "epoch": 2335} {"train_loss": -12.105096817016602, "global_step": 392343, "epoch": 2335} {"train_loss": -12.441988945007324, "global_step": 392344, "epoch": 2335} {"train_loss": -11.961299896240234, "global_step": 392345, "epoch": 2335} {"train_loss": -12.681400299072266, "global_step": 392346, "epoch": 2335} {"train_loss": -12.208412170410156, "global_step": 392347, "epoch": 2335} {"train_loss": -12.1688232421875, "global_step": 392348, "epoch": 2335} {"train_loss": -12.605648040771484, "global_step": 392349, "epoch": 2335} {"train_loss": -12.568593978881836, "global_step": 392350, "epoch": 2335} {"train_loss": -12.503665924072266, "global_step": 392351, "epoch": 2335} {"train_loss": -12.320683479309082, "global_step": 392352, "epoch": 2335} {"train_loss": -12.064447402954102, "global_step": 392353, "epoch": 2335} {"train_loss": -11.87674331665039, "global_step": 392354, "epoch": 2335} {"train_loss": -12.84885025024414, "global_step": 392355, "epoch": 2335} {"train_loss": -11.985036849975586, "global_step": 392356, "epoch": 2335} {"train_loss": -11.687110900878906, "global_step": 392357, "epoch": 2335} {"train_loss": -12.444313049316406, "global_step": 392358, "epoch": 2335} {"train_loss": -12.66692066192627, "global_step": 392359, "epoch": 2335} {"train_loss": -12.05274772644043, "global_step": 392360, "epoch": 2335} {"train_loss": -12.287434577941895, "global_step": 392361, "epoch": 2335} {"train_loss": -12.398704528808594, "global_step": 392362, "epoch": 2335} {"train_loss": -12.598894119262695, "global_step": 392363, "epoch": 2335} {"train_loss": -11.954717636108398, "global_step": 392364, "epoch": 2335} {"train_loss": -12.040250778198242, "global_step": 392365, "epoch": 2335} {"train_loss": -12.902936935424805, "global_step": 392366, "epoch": 2335} {"train_loss": -12.41211986541748, "global_step": 392367, "epoch": 2335} {"train_loss": -12.270387649536133, "global_step": 392368, "epoch": 2335} {"train_loss": -12.116106986999512, "global_step": 392369, "epoch": 2335} {"train_loss": -12.469533920288086, "global_step": 392370, "epoch": 2335} {"train_loss": -12.209484100341797, "global_step": 392371, "epoch": 2335} {"train_loss": -12.167062759399414, "global_step": 392372, "epoch": 2335} {"train_loss": -12.273828506469727, "global_step": 392373, "epoch": 2335} {"train_loss": -11.654401779174805, "global_step": 392374, "epoch": 2335} {"train_loss": -12.487674713134766, "global_step": 392375, "epoch": 2335} {"train_loss": -11.849326133728027, "global_step": 392376, "epoch": 2335} {"train_loss": -12.375480651855469, "global_step": 392377, "epoch": 2335} {"train_loss": -11.775729179382324, "global_step": 392378, "epoch": 2335} {"train_loss": -12.315122604370117, "global_step": 392379, "epoch": 2335} {"train_loss": -11.197684288024902, "global_step": 392380, "epoch": 2335} {"train_loss": -12.16492748260498, "global_step": 392381, "epoch": 2335} {"train_loss": -11.199761390686035, "global_step": 392382, "epoch": 2335} {"train_loss": -12.508493423461914, "global_step": 392383, "epoch": 2335} {"train_loss": -11.274202346801758, "global_step": 392384, "epoch": 2335} {"train_loss": -11.818187713623047, "global_step": 392385, "epoch": 2335} {"train_loss": -12.111357688903809, "global_step": 392386, "epoch": 2335} {"train_loss": -11.54774284362793, "global_step": 392387, "epoch": 2335} {"train_loss": -11.41978931427002, "global_step": 392388, "epoch": 2335} {"train_loss": -11.476318359375, "global_step": 392389, "epoch": 2335} {"train_loss": -11.17949104309082, "global_step": 392390, "epoch": 2335} {"train_loss": -11.426042556762695, "global_step": 392391, "epoch": 2335} {"train_loss": -12.461210250854492, "global_step": 392392, "epoch": 2335} {"train_loss": -11.327461242675781, "global_step": 392393, "epoch": 2335} {"train_loss": -11.851998329162598, "global_step": 392394, "epoch": 2335} {"train_loss": -10.801994323730469, "global_step": 392395, "epoch": 2335} {"train_loss": -11.073169708251953, "global_step": 392396, "epoch": 2335} {"train_loss": -11.921432495117188, "global_step": 392397, "epoch": 2335} {"train_loss": -11.37791919708252, "global_step": 392398, "epoch": 2335} {"train_loss": -11.64055347442627, "global_step": 392399, "epoch": 2335} {"train_loss": -11.896613121032715, "global_step": 392400, "epoch": 2335} {"train_loss": -11.718720436096191, "global_step": 392401, "epoch": 2335} {"train_loss": -11.369054794311523, "global_step": 392402, "epoch": 2335} {"train_loss": -12.256305694580078, "global_step": 392403, "epoch": 2335} {"train_loss": -11.71551513671875, "global_step": 392404, "epoch": 2335} {"train_loss": -12.267370223999023, "global_step": 392405, "epoch": 2335} {"train_loss": -11.202017784118652, "global_step": 392406, "epoch": 2335} {"train_loss": -11.717966079711914, "global_step": 392407, "epoch": 2335} {"train_loss": -11.371648788452148, "global_step": 392408, "epoch": 2335} {"train_loss": -11.092450141906738, "global_step": 392409, "epoch": 2335} {"train_loss": -11.590777397155762, "global_step": 392410, "epoch": 2335} {"train_loss": -11.69332504272461, "global_step": 392411, "epoch": 2335} {"train_loss": -11.718873977661133, "global_step": 392412, "epoch": 2335} {"train_loss": -12.042071342468262, "global_step": 392413, "epoch": 2335} {"train_loss": -11.839146614074707, "global_step": 392414, "epoch": 2335} {"train_loss": -11.81297492980957, "global_step": 392415, "epoch": 2335} {"train_loss": -11.28958511352539, "global_step": 392416, "epoch": 2335} {"train_loss": -11.71609878540039, "global_step": 392417, "epoch": 2335} {"train_loss": -11.132158279418945, "global_step": 392418, "epoch": 2335} {"train_loss": -11.846623420715332, "global_step": 392419, "epoch": 2335} {"train_loss": -11.611472129821777, "global_step": 392420, "epoch": 2335} {"train_loss": -11.43095874786377, "global_step": 392421, "epoch": 2335} {"train_loss": -12.136256217956543, "global_step": 392422, "epoch": 2335} {"train_loss": -11.079000473022461, "global_step": 392423, "epoch": 2335} {"train_loss": -11.776126861572266, "global_step": 392424, "epoch": 2335} {"train_loss": -12.034004211425781, "global_step": 392425, "epoch": 2335} {"train_loss": -11.478841781616211, "global_step": 392426, "epoch": 2335} {"train_loss": -12.248893737792969, "global_step": 392427, "epoch": 2335} {"train_loss": -11.584806442260742, "global_step": 392428, "epoch": 2335} {"train_loss": -11.87083625793457, "global_step": 392429, "epoch": 2335} {"train_loss": -12.284902572631836, "global_step": 392430, "epoch": 2335} {"train_loss": -11.763547897338867, "global_step": 392431, "epoch": 2335} {"train_loss": -12.207402229309082, "global_step": 392432, "epoch": 2335} {"train_loss": -12.185585021972656, "global_step": 392433, "epoch": 2335} {"train_loss": -12.083402633666992, "global_step": 392434, "epoch": 2335} {"train_loss": -12.430946350097656, "global_step": 392435, "epoch": 2335} {"train_loss": -11.914188385009766, "global_step": 392436, "epoch": 2335} {"train_loss": -12.479432106018066, "global_step": 392437, "epoch": 2335} {"train_loss": -12.09954833984375, "global_step": 392438, "epoch": 2335} {"train_loss": -12.370691299438477, "global_step": 392439, "epoch": 2335} {"train_loss": -12.45343017578125, "global_step": 392440, "epoch": 2335} {"train_loss": -12.388445854187012, "global_step": 392441, "epoch": 2335} {"train_loss": -11.987753868103027, "global_step": 392442, "epoch": 2335} {"train_loss": -12.473756790161133, "global_step": 392443, "epoch": 2335} {"train_loss": -12.014309883117676, "global_step": 392444, "epoch": 2335} {"train_loss": -12.593420028686523, "global_step": 392445, "epoch": 2335} {"train_loss": -12.370227813720703, "global_step": 392446, "epoch": 2335} {"train_loss": -12.01351735705421, "global_step": 392447, "epoch": 2335, "val_loss": 297103.9375, "train_action_mse_error": 1.5690428018569946} {"train_loss": -12.27364730834961, "global_step": 392448, "epoch": 2336} {"train_loss": -12.51007080078125, "global_step": 392449, "epoch": 2336} {"train_loss": -12.16012191772461, "global_step": 392450, "epoch": 2336} {"train_loss": -12.175943374633789, "global_step": 392451, "epoch": 2336} {"train_loss": -12.347198486328125, "global_step": 392452, "epoch": 2336} {"train_loss": -12.477402687072754, "global_step": 392453, "epoch": 2336} {"train_loss": -12.398764610290527, "global_step": 392454, "epoch": 2336} {"train_loss": -12.367680549621582, "global_step": 392455, "epoch": 2336} {"train_loss": -12.199569702148438, "global_step": 392456, "epoch": 2336} {"train_loss": -12.544360160827637, "global_step": 392457, "epoch": 2336} {"train_loss": -11.987503051757812, "global_step": 392458, "epoch": 2336} {"train_loss": -12.44437313079834, "global_step": 392459, "epoch": 2336} {"train_loss": -12.525602340698242, "global_step": 392460, "epoch": 2336} {"train_loss": -12.421793937683105, "global_step": 392461, "epoch": 2336} {"train_loss": -12.536508560180664, "global_step": 392462, "epoch": 2336} {"train_loss": -12.571868896484375, "global_step": 392463, "epoch": 2336} {"train_loss": -12.41914176940918, "global_step": 392464, "epoch": 2336} {"train_loss": -12.656853675842285, "global_step": 392465, "epoch": 2336} {"train_loss": -12.726174354553223, "global_step": 392466, "epoch": 2336} {"train_loss": -12.751450538635254, "global_step": 392467, "epoch": 2336} {"train_loss": -12.534146308898926, "global_step": 392468, "epoch": 2336} {"train_loss": -12.814862251281738, "global_step": 392469, "epoch": 2336} {"train_loss": -12.52436637878418, "global_step": 392470, "epoch": 2336} {"train_loss": -12.582260131835938, "global_step": 392471, "epoch": 2336} {"train_loss": -12.545888900756836, "global_step": 392472, "epoch": 2336} {"train_loss": -12.564021110534668, "global_step": 392473, "epoch": 2336} {"train_loss": -12.536640167236328, "global_step": 392474, "epoch": 2336} {"train_loss": -12.678726196289062, "global_step": 392475, "epoch": 2336} {"train_loss": -12.464131355285645, "global_step": 392476, "epoch": 2336} {"train_loss": -12.711541175842285, "global_step": 392477, "epoch": 2336} {"train_loss": -12.482053756713867, "global_step": 392478, "epoch": 2336} {"train_loss": -12.330779075622559, "global_step": 392479, "epoch": 2336} {"train_loss": -11.890037536621094, "global_step": 392480, "epoch": 2336} {"train_loss": -12.714699745178223, "global_step": 392481, "epoch": 2336} {"train_loss": -12.126928329467773, "global_step": 392482, "epoch": 2336} {"train_loss": -11.393381118774414, "global_step": 392483, "epoch": 2336} {"train_loss": -11.435344696044922, "global_step": 392484, "epoch": 2336} {"train_loss": -11.970491409301758, "global_step": 392485, "epoch": 2336} {"train_loss": -8.574443817138672, "global_step": 392486, "epoch": 2336} {"train_loss": -8.951422691345215, "global_step": 392487, "epoch": 2336} {"train_loss": -10.83881950378418, "global_step": 392488, "epoch": 2336} {"train_loss": -9.134750366210938, "global_step": 392489, "epoch": 2336} {"train_loss": -11.068914413452148, "global_step": 392490, "epoch": 2336} {"train_loss": -11.40966796875, "global_step": 392491, "epoch": 2336} {"train_loss": -10.540007591247559, "global_step": 392492, "epoch": 2336} {"train_loss": -11.85799789428711, "global_step": 392493, "epoch": 2336} {"train_loss": -9.492977142333984, "global_step": 392494, "epoch": 2336} {"train_loss": -9.74089527130127, "global_step": 392495, "epoch": 2336} {"train_loss": -10.609332084655762, "global_step": 392496, "epoch": 2336} {"train_loss": -11.946743965148926, "global_step": 392497, "epoch": 2336} {"train_loss": -9.6900053024292, "global_step": 392498, "epoch": 2336} {"train_loss": -10.417326927185059, "global_step": 392499, "epoch": 2336} {"train_loss": -10.749324798583984, "global_step": 392500, "epoch": 2336} {"train_loss": -10.884815216064453, "global_step": 392501, "epoch": 2336} {"train_loss": -11.46195125579834, "global_step": 392502, "epoch": 2336} {"train_loss": -9.696285247802734, "global_step": 392503, "epoch": 2336} {"train_loss": -11.23036003112793, "global_step": 392504, "epoch": 2336} {"train_loss": -11.553665161132812, "global_step": 392505, "epoch": 2336} {"train_loss": -11.189474105834961, "global_step": 392506, "epoch": 2336} {"train_loss": -9.937358856201172, "global_step": 392507, "epoch": 2336} {"train_loss": -11.71879768371582, "global_step": 392508, "epoch": 2336} {"train_loss": -10.602496147155762, "global_step": 392509, "epoch": 2336} {"train_loss": -10.34942626953125, "global_step": 392510, "epoch": 2336} {"train_loss": -9.829292297363281, "global_step": 392511, "epoch": 2336} {"train_loss": -10.174988746643066, "global_step": 392512, "epoch": 2336} {"train_loss": -9.69825267791748, "global_step": 392513, "epoch": 2336} {"train_loss": -11.395515441894531, "global_step": 392514, "epoch": 2336} {"train_loss": -10.965312957763672, "global_step": 392515, "epoch": 2336} {"train_loss": -10.83861255645752, "global_step": 392516, "epoch": 2336} {"train_loss": -11.18419075012207, "global_step": 392517, "epoch": 2336} {"train_loss": -11.55451774597168, "global_step": 392518, "epoch": 2336} {"train_loss": -10.59634780883789, "global_step": 392519, "epoch": 2336} {"train_loss": -11.602516174316406, "global_step": 392520, "epoch": 2336} {"train_loss": -10.579045295715332, "global_step": 392521, "epoch": 2336} {"train_loss": -11.817547798156738, "global_step": 392522, "epoch": 2336} {"train_loss": -11.247689247131348, "global_step": 392523, "epoch": 2336} {"train_loss": -11.87533950805664, "global_step": 392524, "epoch": 2336} {"train_loss": -11.641075134277344, "global_step": 392525, "epoch": 2336} {"train_loss": -11.93598747253418, "global_step": 392526, "epoch": 2336} {"train_loss": -11.382369995117188, "global_step": 392527, "epoch": 2336} {"train_loss": -11.902172088623047, "global_step": 392528, "epoch": 2336} {"train_loss": -11.64258098602295, "global_step": 392529, "epoch": 2336} {"train_loss": -11.718168258666992, "global_step": 392530, "epoch": 2336} {"train_loss": -11.834897994995117, "global_step": 392531, "epoch": 2336} {"train_loss": -11.774876594543457, "global_step": 392532, "epoch": 2336} {"train_loss": -12.099886894226074, "global_step": 392533, "epoch": 2336} {"train_loss": -12.079380989074707, "global_step": 392534, "epoch": 2336} {"train_loss": -12.027702331542969, "global_step": 392535, "epoch": 2336} {"train_loss": -12.210405349731445, "global_step": 392536, "epoch": 2336} {"train_loss": -11.783331871032715, "global_step": 392537, "epoch": 2336} {"train_loss": -12.293025016784668, "global_step": 392538, "epoch": 2336} {"train_loss": -12.063604354858398, "global_step": 392539, "epoch": 2336} {"train_loss": -12.298995018005371, "global_step": 392540, "epoch": 2336} {"train_loss": -11.9703369140625, "global_step": 392541, "epoch": 2336} {"train_loss": -12.247785568237305, "global_step": 392542, "epoch": 2336} {"train_loss": -12.119195938110352, "global_step": 392543, "epoch": 2336} {"train_loss": -12.281841278076172, "global_step": 392544, "epoch": 2336} {"train_loss": -12.143034934997559, "global_step": 392545, "epoch": 2336} {"train_loss": -12.302909851074219, "global_step": 392546, "epoch": 2336} {"train_loss": -12.397501945495605, "global_step": 392547, "epoch": 2336} {"train_loss": -12.303712844848633, "global_step": 392548, "epoch": 2336} {"train_loss": -12.162117004394531, "global_step": 392549, "epoch": 2336} {"train_loss": -12.295494079589844, "global_step": 392550, "epoch": 2336} {"train_loss": -11.999404907226562, "global_step": 392551, "epoch": 2336} {"train_loss": -12.25669002532959, "global_step": 392552, "epoch": 2336} {"train_loss": -12.511165618896484, "global_step": 392553, "epoch": 2336} {"train_loss": -12.241178512573242, "global_step": 392554, "epoch": 2336} {"train_loss": -12.417353630065918, "global_step": 392555, "epoch": 2336} {"train_loss": -12.269060134887695, "global_step": 392556, "epoch": 2336} {"train_loss": -12.418878555297852, "global_step": 392557, "epoch": 2336} {"train_loss": -12.305261611938477, "global_step": 392558, "epoch": 2336} {"train_loss": -12.081341743469238, "global_step": 392559, "epoch": 2336} {"train_loss": -12.207588195800781, "global_step": 392560, "epoch": 2336} {"train_loss": -12.266839981079102, "global_step": 392561, "epoch": 2336} {"train_loss": -12.339288711547852, "global_step": 392562, "epoch": 2336} {"train_loss": -12.256715774536133, "global_step": 392563, "epoch": 2336} {"train_loss": -12.542926788330078, "global_step": 392564, "epoch": 2336} {"train_loss": -12.421272277832031, "global_step": 392565, "epoch": 2336} {"train_loss": -12.432357788085938, "global_step": 392566, "epoch": 2336} {"train_loss": -12.546428680419922, "global_step": 392567, "epoch": 2336} {"train_loss": -12.313593864440918, "global_step": 392568, "epoch": 2336} {"train_loss": -12.563831329345703, "global_step": 392569, "epoch": 2336} {"train_loss": -12.257182121276855, "global_step": 392570, "epoch": 2336} {"train_loss": -12.50277042388916, "global_step": 392571, "epoch": 2336} {"train_loss": -12.434148788452148, "global_step": 392572, "epoch": 2336} {"train_loss": -12.258527755737305, "global_step": 392573, "epoch": 2336} {"train_loss": -12.337890625, "global_step": 392574, "epoch": 2336} {"train_loss": -12.001323699951172, "global_step": 392575, "epoch": 2336} {"train_loss": -12.583734512329102, "global_step": 392576, "epoch": 2336} {"train_loss": -12.524154663085938, "global_step": 392577, "epoch": 2336} {"train_loss": -12.56680965423584, "global_step": 392578, "epoch": 2336} {"train_loss": -12.599916458129883, "global_step": 392579, "epoch": 2336} {"train_loss": -12.477901458740234, "global_step": 392580, "epoch": 2336} {"train_loss": -12.751750946044922, "global_step": 392581, "epoch": 2336} {"train_loss": -12.403592109680176, "global_step": 392582, "epoch": 2336} {"train_loss": -12.620597839355469, "global_step": 392583, "epoch": 2336} {"train_loss": -12.578513145446777, "global_step": 392584, "epoch": 2336} {"train_loss": -12.555492401123047, "global_step": 392585, "epoch": 2336} {"train_loss": -12.570517539978027, "global_step": 392586, "epoch": 2336} {"train_loss": -12.263751983642578, "global_step": 392587, "epoch": 2336} {"train_loss": -12.64286994934082, "global_step": 392588, "epoch": 2336} {"train_loss": -12.375420570373535, "global_step": 392589, "epoch": 2336} {"train_loss": -12.458915710449219, "global_step": 392590, "epoch": 2336} {"train_loss": -12.666894912719727, "global_step": 392591, "epoch": 2336} {"train_loss": -12.4886474609375, "global_step": 392592, "epoch": 2336} {"train_loss": -12.462267875671387, "global_step": 392593, "epoch": 2336} {"train_loss": -12.565895080566406, "global_step": 392594, "epoch": 2336} {"train_loss": -12.396001815795898, "global_step": 392595, "epoch": 2336} {"train_loss": -12.722735404968262, "global_step": 392596, "epoch": 2336} {"train_loss": -12.752878189086914, "global_step": 392597, "epoch": 2336} {"train_loss": -12.451676368713379, "global_step": 392598, "epoch": 2336} {"train_loss": -12.521117210388184, "global_step": 392599, "epoch": 2336} {"train_loss": -12.449031829833984, "global_step": 392600, "epoch": 2336} {"train_loss": -12.492231369018555, "global_step": 392601, "epoch": 2336} {"train_loss": -12.590596199035645, "global_step": 392602, "epoch": 2336} {"train_loss": -12.60545539855957, "global_step": 392603, "epoch": 2336} {"train_loss": -12.58675765991211, "global_step": 392604, "epoch": 2336} {"train_loss": -12.547563552856445, "global_step": 392605, "epoch": 2336} {"train_loss": -12.757400512695312, "global_step": 392606, "epoch": 2336} {"train_loss": -12.811235427856445, "global_step": 392607, "epoch": 2336} {"train_loss": -12.621526718139648, "global_step": 392608, "epoch": 2336} {"train_loss": -12.415369033813477, "global_step": 392609, "epoch": 2336} {"train_loss": -12.717367172241211, "global_step": 392610, "epoch": 2336} {"train_loss": -12.726788520812988, "global_step": 392611, "epoch": 2336} {"train_loss": -12.526280403137207, "global_step": 392612, "epoch": 2336} {"train_loss": -12.065366744995117, "global_step": 392613, "epoch": 2336} {"train_loss": -12.048705101013184, "global_step": 392614, "epoch": 2336} {"train_loss": -11.961859669004168, "global_step": 392615, "epoch": 2336, "val_loss": 295695.625} {"train_loss": -12.339146614074707, "global_step": 392616, "epoch": 2337} {"train_loss": -12.55156135559082, "global_step": 392617, "epoch": 2337} {"train_loss": -12.658733367919922, "global_step": 392618, "epoch": 2337} {"train_loss": -12.235238075256348, "global_step": 392619, "epoch": 2337} {"train_loss": -12.30534839630127, "global_step": 392620, "epoch": 2337} {"train_loss": -11.782434463500977, "global_step": 392621, "epoch": 2337} {"train_loss": -11.725662231445312, "global_step": 392622, "epoch": 2337} {"train_loss": -10.683218955993652, "global_step": 392623, "epoch": 2337} {"train_loss": -11.993169784545898, "global_step": 392624, "epoch": 2337} {"train_loss": -11.303657531738281, "global_step": 392625, "epoch": 2337} {"train_loss": -9.96487045288086, "global_step": 392626, "epoch": 2337} {"train_loss": -9.89959716796875, "global_step": 392627, "epoch": 2337} {"train_loss": -10.278131484985352, "global_step": 392628, "epoch": 2337} {"train_loss": -10.728318214416504, "global_step": 392629, "epoch": 2337} {"train_loss": -9.868368148803711, "global_step": 392630, "epoch": 2337} {"train_loss": -10.714614868164062, "global_step": 392631, "epoch": 2337} {"train_loss": -10.200165748596191, "global_step": 392632, "epoch": 2337} {"train_loss": -10.754678726196289, "global_step": 392633, "epoch": 2337} {"train_loss": -9.591194152832031, "global_step": 392634, "epoch": 2337} {"train_loss": -10.976676940917969, "global_step": 392635, "epoch": 2337} {"train_loss": -11.599771499633789, "global_step": 392636, "epoch": 2337} {"train_loss": -9.794637680053711, "global_step": 392637, "epoch": 2337} {"train_loss": -10.64498519897461, "global_step": 392638, "epoch": 2337} {"train_loss": -9.683562278747559, "global_step": 392639, "epoch": 2337} {"train_loss": -10.397937774658203, "global_step": 392640, "epoch": 2337} {"train_loss": -10.25223445892334, "global_step": 392641, "epoch": 2337} {"train_loss": -10.911578178405762, "global_step": 392642, "epoch": 2337} {"train_loss": -9.831438064575195, "global_step": 392643, "epoch": 2337} {"train_loss": -10.863256454467773, "global_step": 392644, "epoch": 2337} {"train_loss": -10.964937210083008, "global_step": 392645, "epoch": 2337} {"train_loss": -10.412409782409668, "global_step": 392646, "epoch": 2337} {"train_loss": -10.666580200195312, "global_step": 392647, "epoch": 2337} {"train_loss": -10.353082656860352, "global_step": 392648, "epoch": 2337} {"train_loss": -9.796854972839355, "global_step": 392649, "epoch": 2337} {"train_loss": -11.301176071166992, "global_step": 392650, "epoch": 2337} {"train_loss": -10.751480102539062, "global_step": 392651, "epoch": 2337} {"train_loss": -11.023588180541992, "global_step": 392652, "epoch": 2337} {"train_loss": -11.313753128051758, "global_step": 392653, "epoch": 2337} {"train_loss": -10.772725105285645, "global_step": 392654, "epoch": 2337} {"train_loss": -10.241983413696289, "global_step": 392655, "epoch": 2337} {"train_loss": -11.362218856811523, "global_step": 392656, "epoch": 2337} {"train_loss": -10.432585716247559, "global_step": 392657, "epoch": 2337} {"train_loss": -10.272584915161133, "global_step": 392658, "epoch": 2337} {"train_loss": -11.196592330932617, "global_step": 392659, "epoch": 2337} {"train_loss": -10.979513168334961, "global_step": 392660, "epoch": 2337} {"train_loss": -11.177261352539062, "global_step": 392661, "epoch": 2337} {"train_loss": -11.659956932067871, "global_step": 392662, "epoch": 2337} {"train_loss": -11.275309562683105, "global_step": 392663, "epoch": 2337} {"train_loss": -11.351118087768555, "global_step": 392664, "epoch": 2337} {"train_loss": -11.669539451599121, "global_step": 392665, "epoch": 2337} {"train_loss": -11.157464027404785, "global_step": 392666, "epoch": 2337} {"train_loss": -10.940887451171875, "global_step": 392667, "epoch": 2337} {"train_loss": -12.097854614257812, "global_step": 392668, "epoch": 2337} {"train_loss": -11.08137321472168, "global_step": 392669, "epoch": 2337} {"train_loss": -12.00235366821289, "global_step": 392670, "epoch": 2337} {"train_loss": -11.87289810180664, "global_step": 392671, "epoch": 2337} {"train_loss": -11.779505729675293, "global_step": 392672, "epoch": 2337} {"train_loss": -11.918020248413086, "global_step": 392673, "epoch": 2337} {"train_loss": -11.624545097351074, "global_step": 392674, "epoch": 2337} {"train_loss": -11.550058364868164, "global_step": 392675, "epoch": 2337} {"train_loss": -12.185604095458984, "global_step": 392676, "epoch": 2337} {"train_loss": -11.751090049743652, "global_step": 392677, "epoch": 2337} {"train_loss": -11.98727798461914, "global_step": 392678, "epoch": 2337} {"train_loss": -12.201271057128906, "global_step": 392679, "epoch": 2337} {"train_loss": -11.947697639465332, "global_step": 392680, "epoch": 2337} {"train_loss": -11.989895820617676, "global_step": 392681, "epoch": 2337} {"train_loss": -12.07583236694336, "global_step": 392682, "epoch": 2337} {"train_loss": -12.125853538513184, "global_step": 392683, "epoch": 2337} {"train_loss": -12.060325622558594, "global_step": 392684, "epoch": 2337} {"train_loss": -12.043405532836914, "global_step": 392685, "epoch": 2337} {"train_loss": -11.75588607788086, "global_step": 392686, "epoch": 2337} {"train_loss": -12.04741096496582, "global_step": 392687, "epoch": 2337} {"train_loss": -11.839408874511719, "global_step": 392688, "epoch": 2337} {"train_loss": -12.253403663635254, "global_step": 392689, "epoch": 2337} {"train_loss": -12.414569854736328, "global_step": 392690, "epoch": 2337} {"train_loss": -12.168105125427246, "global_step": 392691, "epoch": 2337} {"train_loss": -12.264832496643066, "global_step": 392692, "epoch": 2337} {"train_loss": -12.363353729248047, "global_step": 392693, "epoch": 2337} {"train_loss": -12.04566764831543, "global_step": 392694, "epoch": 2337} {"train_loss": -12.230342864990234, "global_step": 392695, "epoch": 2337} {"train_loss": -12.267866134643555, "global_step": 392696, "epoch": 2337} {"train_loss": -12.033011436462402, "global_step": 392697, "epoch": 2337} {"train_loss": -12.543757438659668, "global_step": 392698, "epoch": 2337} {"train_loss": -12.333778381347656, "global_step": 392699, "epoch": 2337} {"train_loss": -12.19287395477295, "global_step": 392700, "epoch": 2337} {"train_loss": -12.427389144897461, "global_step": 392701, "epoch": 2337} {"train_loss": -12.339356422424316, "global_step": 392702, "epoch": 2337} {"train_loss": -12.401228904724121, "global_step": 392703, "epoch": 2337} {"train_loss": -12.260077476501465, "global_step": 392704, "epoch": 2337} {"train_loss": -12.451784133911133, "global_step": 392705, "epoch": 2337} {"train_loss": -12.274690628051758, "global_step": 392706, "epoch": 2337} {"train_loss": -12.634507179260254, "global_step": 392707, "epoch": 2337} {"train_loss": -12.500041961669922, "global_step": 392708, "epoch": 2337} {"train_loss": -12.704702377319336, "global_step": 392709, "epoch": 2337} {"train_loss": -12.319524765014648, "global_step": 392710, "epoch": 2337} {"train_loss": -12.427650451660156, "global_step": 392711, "epoch": 2337} {"train_loss": -12.362627029418945, "global_step": 392712, "epoch": 2337} {"train_loss": -12.391845703125, "global_step": 392713, "epoch": 2337} {"train_loss": -12.409433364868164, "global_step": 392714, "epoch": 2337} {"train_loss": -12.358235359191895, "global_step": 392715, "epoch": 2337} {"train_loss": -12.446941375732422, "global_step": 392716, "epoch": 2337} {"train_loss": -12.494731903076172, "global_step": 392717, "epoch": 2337} {"train_loss": -12.419452667236328, "global_step": 392718, "epoch": 2337} {"train_loss": -12.48301887512207, "global_step": 392719, "epoch": 2337} {"train_loss": -12.441734313964844, "global_step": 392720, "epoch": 2337} {"train_loss": -12.350776672363281, "global_step": 392721, "epoch": 2337} {"train_loss": -12.554044723510742, "global_step": 392722, "epoch": 2337} {"train_loss": -12.640802383422852, "global_step": 392723, "epoch": 2337} {"train_loss": -12.300355911254883, "global_step": 392724, "epoch": 2337} {"train_loss": -12.411539077758789, "global_step": 392725, "epoch": 2337} {"train_loss": -12.581130981445312, "global_step": 392726, "epoch": 2337} {"train_loss": -12.551590919494629, "global_step": 392727, "epoch": 2337} {"train_loss": -12.133842468261719, "global_step": 392728, "epoch": 2337} {"train_loss": -12.049636840820312, "global_step": 392729, "epoch": 2337} {"train_loss": -12.735169410705566, "global_step": 392730, "epoch": 2337} {"train_loss": -12.572598457336426, "global_step": 392731, "epoch": 2337} {"train_loss": -12.57359504699707, "global_step": 392732, "epoch": 2337} {"train_loss": -12.449353218078613, "global_step": 392733, "epoch": 2337} {"train_loss": -12.827058792114258, "global_step": 392734, "epoch": 2337} {"train_loss": -12.594816207885742, "global_step": 392735, "epoch": 2337} {"train_loss": -12.56597900390625, "global_step": 392736, "epoch": 2337} {"train_loss": -12.674346923828125, "global_step": 392737, "epoch": 2337} {"train_loss": -12.619742393493652, "global_step": 392738, "epoch": 2337} {"train_loss": -12.560667991638184, "global_step": 392739, "epoch": 2337} {"train_loss": -12.643404006958008, "global_step": 392740, "epoch": 2337} {"train_loss": -12.760455131530762, "global_step": 392741, "epoch": 2337} {"train_loss": -12.594192504882812, "global_step": 392742, "epoch": 2337} {"train_loss": -12.828700065612793, "global_step": 392743, "epoch": 2337} {"train_loss": -12.76453685760498, "global_step": 392744, "epoch": 2337} {"train_loss": -12.694761276245117, "global_step": 392745, "epoch": 2337} {"train_loss": -12.675172805786133, "global_step": 392746, "epoch": 2337} {"train_loss": -12.793529510498047, "global_step": 392747, "epoch": 2337} {"train_loss": -12.72827434539795, "global_step": 392748, "epoch": 2337} {"train_loss": -12.637565612792969, "global_step": 392749, "epoch": 2337} {"train_loss": -12.910425186157227, "global_step": 392750, "epoch": 2337} {"train_loss": -12.578498840332031, "global_step": 392751, "epoch": 2337} {"train_loss": -12.38253402709961, "global_step": 392752, "epoch": 2337} {"train_loss": -12.598275184631348, "global_step": 392753, "epoch": 2337} {"train_loss": -12.706003189086914, "global_step": 392754, "epoch": 2337} {"train_loss": -11.978228569030762, "global_step": 392755, "epoch": 2337} {"train_loss": -11.804126739501953, "global_step": 392756, "epoch": 2337} {"train_loss": -11.670860290527344, "global_step": 392757, "epoch": 2337} {"train_loss": -12.505638122558594, "global_step": 392758, "epoch": 2337} {"train_loss": -11.856571197509766, "global_step": 392759, "epoch": 2337} {"train_loss": -11.327373504638672, "global_step": 392760, "epoch": 2337} {"train_loss": -11.79012680053711, "global_step": 392761, "epoch": 2337} {"train_loss": -12.143686294555664, "global_step": 392762, "epoch": 2337} {"train_loss": -11.532732009887695, "global_step": 392763, "epoch": 2337} {"train_loss": -9.928426742553711, "global_step": 392764, "epoch": 2337} {"train_loss": -10.868143081665039, "global_step": 392765, "epoch": 2337} {"train_loss": -9.748420715332031, "global_step": 392766, "epoch": 2337} {"train_loss": -10.88680648803711, "global_step": 392767, "epoch": 2337} {"train_loss": -10.608695983886719, "global_step": 392768, "epoch": 2337} {"train_loss": -10.923506736755371, "global_step": 392769, "epoch": 2337} {"train_loss": -11.127326011657715, "global_step": 392770, "epoch": 2337} {"train_loss": -11.179717063903809, "global_step": 392771, "epoch": 2337} {"train_loss": -12.193597793579102, "global_step": 392772, "epoch": 2337} {"train_loss": -10.62060260772705, "global_step": 392773, "epoch": 2337} {"train_loss": -11.6762113571167, "global_step": 392774, "epoch": 2337} {"train_loss": -11.259021759033203, "global_step": 392775, "epoch": 2337} {"train_loss": -11.773698806762695, "global_step": 392776, "epoch": 2337} {"train_loss": -10.777117729187012, "global_step": 392777, "epoch": 2337} {"train_loss": -10.728721618652344, "global_step": 392778, "epoch": 2337} {"train_loss": -11.311872482299805, "global_step": 392779, "epoch": 2337} {"train_loss": -10.670585632324219, "global_step": 392780, "epoch": 2337} {"train_loss": -10.898039817810059, "global_step": 392781, "epoch": 2337} {"train_loss": -11.318662643432617, "global_step": 392782, "epoch": 2337} {"train_loss": -11.71106701805478, "global_step": 392783, "epoch": 2337, "val_loss": 296179.875} {"train_loss": -11.158976554870605, "global_step": 392784, "epoch": 2338} {"train_loss": -11.558548927307129, "global_step": 392785, "epoch": 2338} {"train_loss": -11.915472030639648, "global_step": 392786, "epoch": 2338} {"train_loss": -11.863180160522461, "global_step": 392787, "epoch": 2338} {"train_loss": -11.878934860229492, "global_step": 392788, "epoch": 2338} {"train_loss": -12.198477745056152, "global_step": 392789, "epoch": 2338} {"train_loss": -11.61239242553711, "global_step": 392790, "epoch": 2338} {"train_loss": -12.297845840454102, "global_step": 392791, "epoch": 2338} {"train_loss": -11.736995697021484, "global_step": 392792, "epoch": 2338} {"train_loss": -11.855016708374023, "global_step": 392793, "epoch": 2338} {"train_loss": -12.3041353225708, "global_step": 392794, "epoch": 2338} {"train_loss": -11.656966209411621, "global_step": 392795, "epoch": 2338} {"train_loss": -11.798534393310547, "global_step": 392796, "epoch": 2338} {"train_loss": -11.750589370727539, "global_step": 392797, "epoch": 2338} {"train_loss": -11.917264938354492, "global_step": 392798, "epoch": 2338} {"train_loss": -11.9671630859375, "global_step": 392799, "epoch": 2338} {"train_loss": -12.234857559204102, "global_step": 392800, "epoch": 2338} {"train_loss": -12.294586181640625, "global_step": 392801, "epoch": 2338} {"train_loss": -12.265605926513672, "global_step": 392802, "epoch": 2338} {"train_loss": -12.078044891357422, "global_step": 392803, "epoch": 2338} {"train_loss": -11.965261459350586, "global_step": 392804, "epoch": 2338} {"train_loss": -12.273192405700684, "global_step": 392805, "epoch": 2338} {"train_loss": -12.483389854431152, "global_step": 392806, "epoch": 2338} {"train_loss": -12.330766677856445, "global_step": 392807, "epoch": 2338} {"train_loss": -12.167536735534668, "global_step": 392808, "epoch": 2338} {"train_loss": -12.184723854064941, "global_step": 392809, "epoch": 2338} {"train_loss": -12.335680961608887, "global_step": 392810, "epoch": 2338} {"train_loss": -12.049787521362305, "global_step": 392811, "epoch": 2338} {"train_loss": -12.258025169372559, "global_step": 392812, "epoch": 2338} {"train_loss": -12.20541763305664, "global_step": 392813, "epoch": 2338} {"train_loss": -12.208993911743164, "global_step": 392814, "epoch": 2338} {"train_loss": -12.2628812789917, "global_step": 392815, "epoch": 2338} {"train_loss": -11.93073558807373, "global_step": 392816, "epoch": 2338} {"train_loss": -12.160067558288574, "global_step": 392817, "epoch": 2338} {"train_loss": -12.323308944702148, "global_step": 392818, "epoch": 2338} {"train_loss": -12.224081039428711, "global_step": 392819, "epoch": 2338} {"train_loss": -12.48280143737793, "global_step": 392820, "epoch": 2338} {"train_loss": -12.208658218383789, "global_step": 392821, "epoch": 2338} {"train_loss": -12.191542625427246, "global_step": 392822, "epoch": 2338} {"train_loss": -12.353334426879883, "global_step": 392823, "epoch": 2338} {"train_loss": -12.298498153686523, "global_step": 392824, "epoch": 2338} {"train_loss": -12.369770050048828, "global_step": 392825, "epoch": 2338} {"train_loss": -12.159954071044922, "global_step": 392826, "epoch": 2338} {"train_loss": -12.485113143920898, "global_step": 392827, "epoch": 2338} {"train_loss": -12.128220558166504, "global_step": 392828, "epoch": 2338} {"train_loss": -12.401022911071777, "global_step": 392829, "epoch": 2338} {"train_loss": -12.047779083251953, "global_step": 392830, "epoch": 2338} {"train_loss": -12.390155792236328, "global_step": 392831, "epoch": 2338} {"train_loss": -12.38827133178711, "global_step": 392832, "epoch": 2338} {"train_loss": -12.16181755065918, "global_step": 392833, "epoch": 2338} {"train_loss": -12.048805236816406, "global_step": 392834, "epoch": 2338} {"train_loss": -12.35289478302002, "global_step": 392835, "epoch": 2338} {"train_loss": -12.525049209594727, "global_step": 392836, "epoch": 2338} {"train_loss": -12.452766418457031, "global_step": 392837, "epoch": 2338} {"train_loss": -12.298933982849121, "global_step": 392838, "epoch": 2338} {"train_loss": -12.622358322143555, "global_step": 392839, "epoch": 2338} {"train_loss": -12.279987335205078, "global_step": 392840, "epoch": 2338} {"train_loss": -12.280339241027832, "global_step": 392841, "epoch": 2338} {"train_loss": -12.392215728759766, "global_step": 392842, "epoch": 2338} {"train_loss": -12.484685897827148, "global_step": 392843, "epoch": 2338} {"train_loss": -12.535652160644531, "global_step": 392844, "epoch": 2338} {"train_loss": -12.402750015258789, "global_step": 392845, "epoch": 2338} {"train_loss": -12.690043449401855, "global_step": 392846, "epoch": 2338} {"train_loss": -12.495418548583984, "global_step": 392847, "epoch": 2338} {"train_loss": -12.481772422790527, "global_step": 392848, "epoch": 2338} {"train_loss": -12.413516998291016, "global_step": 392849, "epoch": 2338} {"train_loss": -12.08195686340332, "global_step": 392850, "epoch": 2338} {"train_loss": -12.342069625854492, "global_step": 392851, "epoch": 2338} {"train_loss": -12.548544883728027, "global_step": 392852, "epoch": 2338} {"train_loss": -12.28802490234375, "global_step": 392853, "epoch": 2338} {"train_loss": -12.675926208496094, "global_step": 392854, "epoch": 2338} {"train_loss": -12.596519470214844, "global_step": 392855, "epoch": 2338} {"train_loss": -12.67482852935791, "global_step": 392856, "epoch": 2338} {"train_loss": -12.296152114868164, "global_step": 392857, "epoch": 2338} {"train_loss": -12.358576774597168, "global_step": 392858, "epoch": 2338} {"train_loss": -12.337420463562012, "global_step": 392859, "epoch": 2338} {"train_loss": -12.546432495117188, "global_step": 392860, "epoch": 2338} {"train_loss": -12.290477752685547, "global_step": 392861, "epoch": 2338} {"train_loss": -12.680039405822754, "global_step": 392862, "epoch": 2338} {"train_loss": -12.180527687072754, "global_step": 392863, "epoch": 2338} {"train_loss": -12.341682434082031, "global_step": 392864, "epoch": 2338} {"train_loss": -12.37203311920166, "global_step": 392865, "epoch": 2338} {"train_loss": -12.407591819763184, "global_step": 392866, "epoch": 2338} {"train_loss": -12.122686386108398, "global_step": 392867, "epoch": 2338} {"train_loss": -11.235028266906738, "global_step": 392868, "epoch": 2338} {"train_loss": -12.532742500305176, "global_step": 392869, "epoch": 2338} {"train_loss": -11.943145751953125, "global_step": 392870, "epoch": 2338} {"train_loss": -12.597051620483398, "global_step": 392871, "epoch": 2338} {"train_loss": -12.07803726196289, "global_step": 392872, "epoch": 2338} {"train_loss": -11.23507308959961, "global_step": 392873, "epoch": 2338} {"train_loss": -11.333015441894531, "global_step": 392874, "epoch": 2338} {"train_loss": -11.575358390808105, "global_step": 392875, "epoch": 2338} {"train_loss": -12.121822357177734, "global_step": 392876, "epoch": 2338} {"train_loss": -11.551448822021484, "global_step": 392877, "epoch": 2338} {"train_loss": -11.661731719970703, "global_step": 392878, "epoch": 2338} {"train_loss": -12.117700576782227, "global_step": 392879, "epoch": 2338} {"train_loss": -11.862003326416016, "global_step": 392880, "epoch": 2338} {"train_loss": -11.82383918762207, "global_step": 392881, "epoch": 2338} {"train_loss": -11.975446701049805, "global_step": 392882, "epoch": 2338} {"train_loss": -11.915800094604492, "global_step": 392883, "epoch": 2338} {"train_loss": -11.823238372802734, "global_step": 392884, "epoch": 2338} {"train_loss": -11.180633544921875, "global_step": 392885, "epoch": 2338} {"train_loss": -10.531182289123535, "global_step": 392886, "epoch": 2338} {"train_loss": -11.79415225982666, "global_step": 392887, "epoch": 2338} {"train_loss": -12.340270042419434, "global_step": 392888, "epoch": 2338} {"train_loss": -11.915787696838379, "global_step": 392889, "epoch": 2338} {"train_loss": -11.619460105895996, "global_step": 392890, "epoch": 2338} {"train_loss": -12.46097469329834, "global_step": 392891, "epoch": 2338} {"train_loss": -11.954862594604492, "global_step": 392892, "epoch": 2338} {"train_loss": -12.32895565032959, "global_step": 392893, "epoch": 2338} {"train_loss": -11.48000717163086, "global_step": 392894, "epoch": 2338} {"train_loss": -11.638948440551758, "global_step": 392895, "epoch": 2338} {"train_loss": -12.750738143920898, "global_step": 392896, "epoch": 2338} {"train_loss": -11.496749877929688, "global_step": 392897, "epoch": 2338} {"train_loss": -12.291147232055664, "global_step": 392898, "epoch": 2338} {"train_loss": -11.930131912231445, "global_step": 392899, "epoch": 2338} {"train_loss": -11.949263572692871, "global_step": 392900, "epoch": 2338} {"train_loss": -12.373611450195312, "global_step": 392901, "epoch": 2338} {"train_loss": -11.187383651733398, "global_step": 392902, "epoch": 2338} {"train_loss": -11.493968963623047, "global_step": 392903, "epoch": 2338} {"train_loss": -12.135534286499023, "global_step": 392904, "epoch": 2338} {"train_loss": -12.527143478393555, "global_step": 392905, "epoch": 2338} {"train_loss": -11.972638130187988, "global_step": 392906, "epoch": 2338} {"train_loss": -12.015340805053711, "global_step": 392907, "epoch": 2338} {"train_loss": -12.378543853759766, "global_step": 392908, "epoch": 2338} {"train_loss": -12.164103507995605, "global_step": 392909, "epoch": 2338} {"train_loss": -12.033101081848145, "global_step": 392910, "epoch": 2338} {"train_loss": -12.313268661499023, "global_step": 392911, "epoch": 2338} {"train_loss": -11.84097671508789, "global_step": 392912, "epoch": 2338} {"train_loss": -12.003662109375, "global_step": 392913, "epoch": 2338} {"train_loss": -12.112855911254883, "global_step": 392914, "epoch": 2338} {"train_loss": -11.954471588134766, "global_step": 392915, "epoch": 2338} {"train_loss": -12.250783920288086, "global_step": 392916, "epoch": 2338} {"train_loss": -12.05539321899414, "global_step": 392917, "epoch": 2338} {"train_loss": -11.876712799072266, "global_step": 392918, "epoch": 2338} {"train_loss": -12.583430290222168, "global_step": 392919, "epoch": 2338} {"train_loss": -12.632205963134766, "global_step": 392920, "epoch": 2338} {"train_loss": -12.427946090698242, "global_step": 392921, "epoch": 2338} {"train_loss": -12.531230926513672, "global_step": 392922, "epoch": 2338} {"train_loss": -12.234116554260254, "global_step": 392923, "epoch": 2338} {"train_loss": -12.2117919921875, "global_step": 392924, "epoch": 2338} {"train_loss": -12.3070650100708, "global_step": 392925, "epoch": 2338} {"train_loss": -12.414752006530762, "global_step": 392926, "epoch": 2338} {"train_loss": -12.011043548583984, "global_step": 392927, "epoch": 2338} {"train_loss": -12.387989044189453, "global_step": 392928, "epoch": 2338} {"train_loss": -11.85389518737793, "global_step": 392929, "epoch": 2338} {"train_loss": -12.032114028930664, "global_step": 392930, "epoch": 2338} {"train_loss": -11.933725357055664, "global_step": 392931, "epoch": 2338} {"train_loss": -11.970928192138672, "global_step": 392932, "epoch": 2338} {"train_loss": -11.816892623901367, "global_step": 392933, "epoch": 2338} {"train_loss": -12.342666625976562, "global_step": 392934, "epoch": 2338} {"train_loss": -12.040929794311523, "global_step": 392935, "epoch": 2338} {"train_loss": -12.364181518554688, "global_step": 392936, "epoch": 2338} {"train_loss": -12.069524765014648, "global_step": 392937, "epoch": 2338} {"train_loss": -12.461368560791016, "global_step": 392938, "epoch": 2338} {"train_loss": -12.229157447814941, "global_step": 392939, "epoch": 2338} {"train_loss": -12.33258056640625, "global_step": 392940, "epoch": 2338} {"train_loss": -12.065406799316406, "global_step": 392941, "epoch": 2338} {"train_loss": -12.490812301635742, "global_step": 392942, "epoch": 2338} {"train_loss": -12.148086547851562, "global_step": 392943, "epoch": 2338} {"train_loss": -12.291975021362305, "global_step": 392944, "epoch": 2338} {"train_loss": -12.316137313842773, "global_step": 392945, "epoch": 2338} {"train_loss": -12.161702156066895, "global_step": 392946, "epoch": 2338} {"train_loss": -12.30921745300293, "global_step": 392947, "epoch": 2338} {"train_loss": -12.230521202087402, "global_step": 392948, "epoch": 2338} {"train_loss": -11.768065452575684, "global_step": 392949, "epoch": 2338} {"train_loss": -11.53506851196289, "global_step": 392950, "epoch": 2338} {"train_loss": -12.131729466574532, "global_step": 392951, "epoch": 2338, "val_loss": 298299.1875} {"train_loss": -11.844743728637695, "global_step": 392952, "epoch": 2339} {"train_loss": -12.162899017333984, "global_step": 392953, "epoch": 2339} {"train_loss": -12.076807975769043, "global_step": 392954, "epoch": 2339} {"train_loss": -11.274238586425781, "global_step": 392955, "epoch": 2339} {"train_loss": -11.52330207824707, "global_step": 392956, "epoch": 2339} {"train_loss": -11.923440933227539, "global_step": 392957, "epoch": 2339} {"train_loss": -12.177261352539062, "global_step": 392958, "epoch": 2339} {"train_loss": -11.771272659301758, "global_step": 392959, "epoch": 2339} {"train_loss": -12.651692390441895, "global_step": 392960, "epoch": 2339} {"train_loss": -11.932546615600586, "global_step": 392961, "epoch": 2339} {"train_loss": -12.335943222045898, "global_step": 392962, "epoch": 2339} {"train_loss": -11.981752395629883, "global_step": 392963, "epoch": 2339} {"train_loss": -12.497198104858398, "global_step": 392964, "epoch": 2339} {"train_loss": -11.775633811950684, "global_step": 392965, "epoch": 2339} {"train_loss": -12.344757080078125, "global_step": 392966, "epoch": 2339} {"train_loss": -12.085758209228516, "global_step": 392967, "epoch": 2339} {"train_loss": -12.335533142089844, "global_step": 392968, "epoch": 2339} {"train_loss": -12.071206092834473, "global_step": 392969, "epoch": 2339} {"train_loss": -12.358390808105469, "global_step": 392970, "epoch": 2339} {"train_loss": -12.3221435546875, "global_step": 392971, "epoch": 2339} {"train_loss": -12.333477020263672, "global_step": 392972, "epoch": 2339} {"train_loss": -12.522281646728516, "global_step": 392973, "epoch": 2339} {"train_loss": -12.615318298339844, "global_step": 392974, "epoch": 2339} {"train_loss": -12.519942283630371, "global_step": 392975, "epoch": 2339} {"train_loss": -12.323419570922852, "global_step": 392976, "epoch": 2339} {"train_loss": -12.63772201538086, "global_step": 392977, "epoch": 2339} {"train_loss": -12.301148414611816, "global_step": 392978, "epoch": 2339} {"train_loss": -11.478767395019531, "global_step": 392979, "epoch": 2339} {"train_loss": -12.272520065307617, "global_step": 392980, "epoch": 2339} {"train_loss": -11.787254333496094, "global_step": 392981, "epoch": 2339} {"train_loss": -11.015436172485352, "global_step": 392982, "epoch": 2339} {"train_loss": -12.385385513305664, "global_step": 392983, "epoch": 2339} {"train_loss": -12.400825500488281, "global_step": 392984, "epoch": 2339} {"train_loss": -11.55215072631836, "global_step": 392985, "epoch": 2339} {"train_loss": -12.156167030334473, "global_step": 392986, "epoch": 2339} {"train_loss": -12.245450973510742, "global_step": 392987, "epoch": 2339} {"train_loss": -11.001490592956543, "global_step": 392988, "epoch": 2339} {"train_loss": -12.063544273376465, "global_step": 392989, "epoch": 2339} {"train_loss": -12.333192825317383, "global_step": 392990, "epoch": 2339} {"train_loss": -11.90382194519043, "global_step": 392991, "epoch": 2339} {"train_loss": -12.481523513793945, "global_step": 392992, "epoch": 2339} {"train_loss": -11.808481216430664, "global_step": 392993, "epoch": 2339} {"train_loss": -11.992740631103516, "global_step": 392994, "epoch": 2339} {"train_loss": -12.207858085632324, "global_step": 392995, "epoch": 2339} {"train_loss": -12.223970413208008, "global_step": 392996, "epoch": 2339} {"train_loss": -11.698020935058594, "global_step": 392997, "epoch": 2339} {"train_loss": -12.013837814331055, "global_step": 392998, "epoch": 2339} {"train_loss": -12.036911010742188, "global_step": 392999, "epoch": 2339} {"train_loss": -12.122926712036133, "global_step": 393000, "epoch": 2339} {"train_loss": -12.275310516357422, "global_step": 393001, "epoch": 2339} {"train_loss": -12.449729919433594, "global_step": 393002, "epoch": 2339} {"train_loss": -11.938629150390625, "global_step": 393003, "epoch": 2339} {"train_loss": -12.290589332580566, "global_step": 393004, "epoch": 2339} {"train_loss": -12.148611068725586, "global_step": 393005, "epoch": 2339} {"train_loss": -11.864347457885742, "global_step": 393006, "epoch": 2339} {"train_loss": -12.371036529541016, "global_step": 393007, "epoch": 2339} {"train_loss": -12.323663711547852, "global_step": 393008, "epoch": 2339} {"train_loss": -12.584152221679688, "global_step": 393009, "epoch": 2339} {"train_loss": -12.129094123840332, "global_step": 393010, "epoch": 2339} {"train_loss": -12.048030853271484, "global_step": 393011, "epoch": 2339} {"train_loss": -11.87462329864502, "global_step": 393012, "epoch": 2339} {"train_loss": -12.251245498657227, "global_step": 393013, "epoch": 2339} {"train_loss": -11.44421672821045, "global_step": 393014, "epoch": 2339} {"train_loss": -12.385351181030273, "global_step": 393015, "epoch": 2339} {"train_loss": -11.353982925415039, "global_step": 393016, "epoch": 2339} {"train_loss": -12.42465591430664, "global_step": 393017, "epoch": 2339} {"train_loss": -11.191452980041504, "global_step": 393018, "epoch": 2339} {"train_loss": -11.699899673461914, "global_step": 393019, "epoch": 2339} {"train_loss": -11.050806045532227, "global_step": 393020, "epoch": 2339} {"train_loss": -11.927963256835938, "global_step": 393021, "epoch": 2339} {"train_loss": -11.526392936706543, "global_step": 393022, "epoch": 2339} {"train_loss": -12.218481063842773, "global_step": 393023, "epoch": 2339} {"train_loss": -11.461908340454102, "global_step": 393024, "epoch": 2339} {"train_loss": -11.657123565673828, "global_step": 393025, "epoch": 2339} {"train_loss": -11.061101913452148, "global_step": 393026, "epoch": 2339} {"train_loss": -11.358488082885742, "global_step": 393027, "epoch": 2339} {"train_loss": -11.274134635925293, "global_step": 393028, "epoch": 2339} {"train_loss": -11.264106750488281, "global_step": 393029, "epoch": 2339} {"train_loss": -11.122971534729004, "global_step": 393030, "epoch": 2339} {"train_loss": -10.889790534973145, "global_step": 393031, "epoch": 2339} {"train_loss": -11.444896697998047, "global_step": 393032, "epoch": 2339} {"train_loss": -9.799407958984375, "global_step": 393033, "epoch": 2339} {"train_loss": -11.36036491394043, "global_step": 393034, "epoch": 2339} {"train_loss": -11.54408073425293, "global_step": 393035, "epoch": 2339} {"train_loss": -11.207483291625977, "global_step": 393036, "epoch": 2339} {"train_loss": -11.569282531738281, "global_step": 393037, "epoch": 2339} {"train_loss": -11.243889808654785, "global_step": 393038, "epoch": 2339} {"train_loss": -11.48841381072998, "global_step": 393039, "epoch": 2339} {"train_loss": -11.336506843566895, "global_step": 393040, "epoch": 2339} {"train_loss": -11.427014350891113, "global_step": 393041, "epoch": 2339} {"train_loss": -11.95821762084961, "global_step": 393042, "epoch": 2339} {"train_loss": -11.275175094604492, "global_step": 393043, "epoch": 2339} {"train_loss": -11.725506782531738, "global_step": 393044, "epoch": 2339} {"train_loss": -11.416145324707031, "global_step": 393045, "epoch": 2339} {"train_loss": -11.895784378051758, "global_step": 393046, "epoch": 2339} {"train_loss": -11.988777160644531, "global_step": 393047, "epoch": 2339} {"train_loss": -11.557623863220215, "global_step": 393048, "epoch": 2339} {"train_loss": -11.742637634277344, "global_step": 393049, "epoch": 2339} {"train_loss": -11.157590866088867, "global_step": 393050, "epoch": 2339} {"train_loss": -11.546298027038574, "global_step": 393051, "epoch": 2339} {"train_loss": -11.978641510009766, "global_step": 393052, "epoch": 2339} {"train_loss": -11.114151000976562, "global_step": 393053, "epoch": 2339} {"train_loss": -12.010629653930664, "global_step": 393054, "epoch": 2339} {"train_loss": -11.079452514648438, "global_step": 393055, "epoch": 2339} {"train_loss": -11.548765182495117, "global_step": 393056, "epoch": 2339} {"train_loss": -11.112411499023438, "global_step": 393057, "epoch": 2339} {"train_loss": -10.899312973022461, "global_step": 393058, "epoch": 2339} {"train_loss": -11.497987747192383, "global_step": 393059, "epoch": 2339} {"train_loss": -10.703669548034668, "global_step": 393060, "epoch": 2339} {"train_loss": -10.981301307678223, "global_step": 393061, "epoch": 2339} {"train_loss": -10.899999618530273, "global_step": 393062, "epoch": 2339} {"train_loss": -11.467538833618164, "global_step": 393063, "epoch": 2339} {"train_loss": -11.066771507263184, "global_step": 393064, "epoch": 2339} {"train_loss": -11.856125831604004, "global_step": 393065, "epoch": 2339} {"train_loss": -11.300105094909668, "global_step": 393066, "epoch": 2339} {"train_loss": -11.635904312133789, "global_step": 393067, "epoch": 2339} {"train_loss": -11.224260330200195, "global_step": 393068, "epoch": 2339} {"train_loss": -11.857681274414062, "global_step": 393069, "epoch": 2339} {"train_loss": -11.982746124267578, "global_step": 393070, "epoch": 2339} {"train_loss": -12.073930740356445, "global_step": 393071, "epoch": 2339} {"train_loss": -12.025152206420898, "global_step": 393072, "epoch": 2339} {"train_loss": -12.062933921813965, "global_step": 393073, "epoch": 2339} {"train_loss": -11.86376953125, "global_step": 393074, "epoch": 2339} {"train_loss": -12.096675872802734, "global_step": 393075, "epoch": 2339} {"train_loss": -12.036752700805664, "global_step": 393076, "epoch": 2339} {"train_loss": -11.837284088134766, "global_step": 393077, "epoch": 2339} {"train_loss": -11.908288955688477, "global_step": 393078, "epoch": 2339} {"train_loss": -12.095069885253906, "global_step": 393079, "epoch": 2339} {"train_loss": -12.071590423583984, "global_step": 393080, "epoch": 2339} {"train_loss": -12.26108169555664, "global_step": 393081, "epoch": 2339} {"train_loss": -12.36618709564209, "global_step": 393082, "epoch": 2339} {"train_loss": -12.223686218261719, "global_step": 393083, "epoch": 2339} {"train_loss": -12.205707550048828, "global_step": 393084, "epoch": 2339} {"train_loss": -12.298216819763184, "global_step": 393085, "epoch": 2339} {"train_loss": -12.207115173339844, "global_step": 393086, "epoch": 2339} {"train_loss": -12.29910659790039, "global_step": 393087, "epoch": 2339} {"train_loss": -12.147382736206055, "global_step": 393088, "epoch": 2339} {"train_loss": -12.484326362609863, "global_step": 393089, "epoch": 2339} {"train_loss": -12.249177932739258, "global_step": 393090, "epoch": 2339} {"train_loss": -12.304956436157227, "global_step": 393091, "epoch": 2339} {"train_loss": -12.327003479003906, "global_step": 393092, "epoch": 2339} {"train_loss": -12.15235424041748, "global_step": 393093, "epoch": 2339} {"train_loss": -12.274267196655273, "global_step": 393094, "epoch": 2339} {"train_loss": -12.367887496948242, "global_step": 393095, "epoch": 2339} {"train_loss": -12.271173477172852, "global_step": 393096, "epoch": 2339} {"train_loss": -12.28909683227539, "global_step": 393097, "epoch": 2339} {"train_loss": -12.143914222717285, "global_step": 393098, "epoch": 2339} {"train_loss": -12.58273696899414, "global_step": 393099, "epoch": 2339} {"train_loss": -11.93216323852539, "global_step": 393100, "epoch": 2339} {"train_loss": -12.558131217956543, "global_step": 393101, "epoch": 2339} {"train_loss": -12.208630561828613, "global_step": 393102, "epoch": 2339} {"train_loss": -12.566436767578125, "global_step": 393103, "epoch": 2339} {"train_loss": -12.511584281921387, "global_step": 393104, "epoch": 2339} {"train_loss": -12.435184478759766, "global_step": 393105, "epoch": 2339} {"train_loss": -12.281744956970215, "global_step": 393106, "epoch": 2339} {"train_loss": -12.501020431518555, "global_step": 393107, "epoch": 2339} {"train_loss": -12.575727462768555, "global_step": 393108, "epoch": 2339} {"train_loss": -12.368051528930664, "global_step": 393109, "epoch": 2339} {"train_loss": -12.43045425415039, "global_step": 393110, "epoch": 2339} {"train_loss": -12.419557571411133, "global_step": 393111, "epoch": 2339} {"train_loss": -12.627326011657715, "global_step": 393112, "epoch": 2339} {"train_loss": -12.359954833984375, "global_step": 393113, "epoch": 2339} {"train_loss": -12.430185317993164, "global_step": 393114, "epoch": 2339} {"train_loss": -12.694631576538086, "global_step": 393115, "epoch": 2339} {"train_loss": -12.252111434936523, "global_step": 393116, "epoch": 2339} {"train_loss": -12.399234771728516, "global_step": 393117, "epoch": 2339} {"train_loss": -12.57139778137207, "global_step": 393118, "epoch": 2339} {"train_loss": -11.933288869403658, "global_step": 393119, "epoch": 2339, "val_loss": 298594.34375} {"train_loss": -12.55876636505127, "global_step": 393120, "epoch": 2340} {"train_loss": -12.728878021240234, "global_step": 393121, "epoch": 2340} {"train_loss": -12.678804397583008, "global_step": 393122, "epoch": 2340} {"train_loss": -12.538834571838379, "global_step": 393123, "epoch": 2340} {"train_loss": -12.38112735748291, "global_step": 393124, "epoch": 2340} {"train_loss": -12.454894065856934, "global_step": 393125, "epoch": 2340} {"train_loss": -12.858318328857422, "global_step": 393126, "epoch": 2340} {"train_loss": -12.182903289794922, "global_step": 393127, "epoch": 2340} {"train_loss": -12.268342971801758, "global_step": 393128, "epoch": 2340} {"train_loss": -12.414737701416016, "global_step": 393129, "epoch": 2340} {"train_loss": -12.455904006958008, "global_step": 393130, "epoch": 2340} {"train_loss": -12.240860939025879, "global_step": 393131, "epoch": 2340} {"train_loss": -12.432374000549316, "global_step": 393132, "epoch": 2340} {"train_loss": -12.34375286102295, "global_step": 393133, "epoch": 2340} {"train_loss": -11.84553337097168, "global_step": 393134, "epoch": 2340} {"train_loss": -12.547760963439941, "global_step": 393135, "epoch": 2340} {"train_loss": -12.259407043457031, "global_step": 393136, "epoch": 2340} {"train_loss": -12.064680099487305, "global_step": 393137, "epoch": 2340} {"train_loss": -12.042642593383789, "global_step": 393138, "epoch": 2340} {"train_loss": -12.557719230651855, "global_step": 393139, "epoch": 2340} {"train_loss": -11.684025764465332, "global_step": 393140, "epoch": 2340} {"train_loss": -12.23122501373291, "global_step": 393141, "epoch": 2340} {"train_loss": -12.34780502319336, "global_step": 393142, "epoch": 2340} {"train_loss": -12.029867172241211, "global_step": 393143, "epoch": 2340} {"train_loss": -12.412492752075195, "global_step": 393144, "epoch": 2340} {"train_loss": -12.796415328979492, "global_step": 393145, "epoch": 2340} {"train_loss": -12.365495681762695, "global_step": 393146, "epoch": 2340} {"train_loss": -12.304596900939941, "global_step": 393147, "epoch": 2340} {"train_loss": -12.664434432983398, "global_step": 393148, "epoch": 2340} {"train_loss": -12.724088668823242, "global_step": 393149, "epoch": 2340} {"train_loss": -12.77225112915039, "global_step": 393150, "epoch": 2340} {"train_loss": -12.680463790893555, "global_step": 393151, "epoch": 2340} {"train_loss": -12.587179183959961, "global_step": 393152, "epoch": 2340} {"train_loss": -12.602472305297852, "global_step": 393153, "epoch": 2340} {"train_loss": -12.696548461914062, "global_step": 393154, "epoch": 2340} {"train_loss": -12.738164901733398, "global_step": 393155, "epoch": 2340} {"train_loss": -12.653748512268066, "global_step": 393156, "epoch": 2340} {"train_loss": -12.755502700805664, "global_step": 393157, "epoch": 2340} {"train_loss": -12.491106033325195, "global_step": 393158, "epoch": 2340} {"train_loss": -12.636573791503906, "global_step": 393159, "epoch": 2340} {"train_loss": -12.703497886657715, "global_step": 393160, "epoch": 2340} {"train_loss": -12.722455978393555, "global_step": 393161, "epoch": 2340} {"train_loss": -12.339256286621094, "global_step": 393162, "epoch": 2340} {"train_loss": -12.575484275817871, "global_step": 393163, "epoch": 2340} {"train_loss": -12.619392395019531, "global_step": 393164, "epoch": 2340} {"train_loss": -12.26959228515625, "global_step": 393165, "epoch": 2340} {"train_loss": -12.667793273925781, "global_step": 393166, "epoch": 2340} {"train_loss": -12.63277816772461, "global_step": 393167, "epoch": 2340} {"train_loss": -12.379915237426758, "global_step": 393168, "epoch": 2340} {"train_loss": -12.294140815734863, "global_step": 393169, "epoch": 2340} {"train_loss": -12.589444160461426, "global_step": 393170, "epoch": 2340} {"train_loss": -12.432621002197266, "global_step": 393171, "epoch": 2340} {"train_loss": -12.46197509765625, "global_step": 393172, "epoch": 2340} {"train_loss": -12.665958404541016, "global_step": 393173, "epoch": 2340} {"train_loss": -12.635255813598633, "global_step": 393174, "epoch": 2340} {"train_loss": -12.251569747924805, "global_step": 393175, "epoch": 2340} {"train_loss": -12.440908432006836, "global_step": 393176, "epoch": 2340} {"train_loss": -12.556341171264648, "global_step": 393177, "epoch": 2340} {"train_loss": -12.652881622314453, "global_step": 393178, "epoch": 2340} {"train_loss": -11.770660400390625, "global_step": 393179, "epoch": 2340} {"train_loss": -10.7645263671875, "global_step": 393180, "epoch": 2340} {"train_loss": -11.24946117401123, "global_step": 393181, "epoch": 2340} {"train_loss": -12.114468574523926, "global_step": 393182, "epoch": 2340} {"train_loss": -11.021023750305176, "global_step": 393183, "epoch": 2340} {"train_loss": -11.63697624206543, "global_step": 393184, "epoch": 2340} {"train_loss": -10.728927612304688, "global_step": 393185, "epoch": 2340} {"train_loss": -9.623468399047852, "global_step": 393186, "epoch": 2340} {"train_loss": -11.572183609008789, "global_step": 393187, "epoch": 2340} {"train_loss": -7.300419807434082, "global_step": 393188, "epoch": 2340} {"train_loss": -8.77951431274414, "global_step": 393189, "epoch": 2340} {"train_loss": -8.699508666992188, "global_step": 393190, "epoch": 2340} {"train_loss": -7.240233898162842, "global_step": 393191, "epoch": 2340} {"train_loss": -8.319881439208984, "global_step": 393192, "epoch": 2340} {"train_loss": -9.528570175170898, "global_step": 393193, "epoch": 2340} {"train_loss": -9.171943664550781, "global_step": 393194, "epoch": 2340} {"train_loss": -9.651652336120605, "global_step": 393195, "epoch": 2340} {"train_loss": -10.803956031799316, "global_step": 393196, "epoch": 2340} {"train_loss": -10.498370170593262, "global_step": 393197, "epoch": 2340} {"train_loss": -10.837160110473633, "global_step": 393198, "epoch": 2340} {"train_loss": -10.464272499084473, "global_step": 393199, "epoch": 2340} {"train_loss": -11.43751335144043, "global_step": 393200, "epoch": 2340} {"train_loss": -10.032171249389648, "global_step": 393201, "epoch": 2340} {"train_loss": -10.978050231933594, "global_step": 393202, "epoch": 2340} {"train_loss": -10.944999694824219, "global_step": 393203, "epoch": 2340} {"train_loss": -9.957837104797363, "global_step": 393204, "epoch": 2340} {"train_loss": -11.385435104370117, "global_step": 393205, "epoch": 2340} {"train_loss": -11.168697357177734, "global_step": 393206, "epoch": 2340} {"train_loss": -10.675293922424316, "global_step": 393207, "epoch": 2340} {"train_loss": -11.84842300415039, "global_step": 393208, "epoch": 2340} {"train_loss": -10.726241111755371, "global_step": 393209, "epoch": 2340} {"train_loss": -11.702716827392578, "global_step": 393210, "epoch": 2340} {"train_loss": -11.361618995666504, "global_step": 393211, "epoch": 2340} {"train_loss": -11.640844345092773, "global_step": 393212, "epoch": 2340} {"train_loss": -11.686331748962402, "global_step": 393213, "epoch": 2340} {"train_loss": -11.683274269104004, "global_step": 393214, "epoch": 2340} {"train_loss": -11.920697212219238, "global_step": 393215, "epoch": 2340} {"train_loss": -11.332700729370117, "global_step": 393216, "epoch": 2340} {"train_loss": -11.350507736206055, "global_step": 393217, "epoch": 2340} {"train_loss": -11.634810447692871, "global_step": 393218, "epoch": 2340} {"train_loss": -11.380271911621094, "global_step": 393219, "epoch": 2340} {"train_loss": -11.699600219726562, "global_step": 393220, "epoch": 2340} {"train_loss": -11.559276580810547, "global_step": 393221, "epoch": 2340} {"train_loss": -11.23377799987793, "global_step": 393222, "epoch": 2340} {"train_loss": -12.132608413696289, "global_step": 393223, "epoch": 2340} {"train_loss": -11.327118873596191, "global_step": 393224, "epoch": 2340} {"train_loss": -11.686970710754395, "global_step": 393225, "epoch": 2340} {"train_loss": -11.735091209411621, "global_step": 393226, "epoch": 2340} {"train_loss": -11.312782287597656, "global_step": 393227, "epoch": 2340} {"train_loss": -12.126022338867188, "global_step": 393228, "epoch": 2340} {"train_loss": -10.824378967285156, "global_step": 393229, "epoch": 2340} {"train_loss": -12.31167221069336, "global_step": 393230, "epoch": 2340} {"train_loss": -11.386579513549805, "global_step": 393231, "epoch": 2340} {"train_loss": -11.883328437805176, "global_step": 393232, "epoch": 2340} {"train_loss": -11.778031349182129, "global_step": 393233, "epoch": 2340} {"train_loss": -11.766200065612793, "global_step": 393234, "epoch": 2340} {"train_loss": -12.009222030639648, "global_step": 393235, "epoch": 2340} {"train_loss": -11.694256782531738, "global_step": 393236, "epoch": 2340} {"train_loss": -12.213569641113281, "global_step": 393237, "epoch": 2340} {"train_loss": -12.119763374328613, "global_step": 393238, "epoch": 2340} {"train_loss": -12.115119934082031, "global_step": 393239, "epoch": 2340} {"train_loss": -12.103265762329102, "global_step": 393240, "epoch": 2340} {"train_loss": -12.487878799438477, "global_step": 393241, "epoch": 2340} {"train_loss": -11.91501235961914, "global_step": 393242, "epoch": 2340} {"train_loss": -12.216839790344238, "global_step": 393243, "epoch": 2340} {"train_loss": -12.39095687866211, "global_step": 393244, "epoch": 2340} {"train_loss": -12.142816543579102, "global_step": 393245, "epoch": 2340} {"train_loss": -12.442312240600586, "global_step": 393246, "epoch": 2340} {"train_loss": -12.376336097717285, "global_step": 393247, "epoch": 2340} {"train_loss": -12.389548301696777, "global_step": 393248, "epoch": 2340} {"train_loss": -12.332120895385742, "global_step": 393249, "epoch": 2340} {"train_loss": -12.411174774169922, "global_step": 393250, "epoch": 2340} {"train_loss": -12.570068359375, "global_step": 393251, "epoch": 2340} {"train_loss": -12.491300582885742, "global_step": 393252, "epoch": 2340} {"train_loss": -12.553717613220215, "global_step": 393253, "epoch": 2340} {"train_loss": -12.257841110229492, "global_step": 393254, "epoch": 2340} {"train_loss": -12.414022445678711, "global_step": 393255, "epoch": 2340} {"train_loss": -12.334397315979004, "global_step": 393256, "epoch": 2340} {"train_loss": -12.585902214050293, "global_step": 393257, "epoch": 2340} {"train_loss": -12.487375259399414, "global_step": 393258, "epoch": 2340} {"train_loss": -12.334091186523438, "global_step": 393259, "epoch": 2340} {"train_loss": -12.244462013244629, "global_step": 393260, "epoch": 2340} {"train_loss": -12.423791885375977, "global_step": 393261, "epoch": 2340} {"train_loss": -12.172245979309082, "global_step": 393262, "epoch": 2340} {"train_loss": -12.369938850402832, "global_step": 393263, "epoch": 2340} {"train_loss": -12.331389427185059, "global_step": 393264, "epoch": 2340} {"train_loss": -12.227845191955566, "global_step": 393265, "epoch": 2340} {"train_loss": -12.062127113342285, "global_step": 393266, "epoch": 2340} {"train_loss": -12.003355026245117, "global_step": 393267, "epoch": 2340} {"train_loss": -12.226436614990234, "global_step": 393268, "epoch": 2340} {"train_loss": -11.660066604614258, "global_step": 393269, "epoch": 2340} {"train_loss": -12.35643196105957, "global_step": 393270, "epoch": 2340} {"train_loss": -12.036453247070312, "global_step": 393271, "epoch": 2340} {"train_loss": -12.191429138183594, "global_step": 393272, "epoch": 2340} {"train_loss": -12.336115837097168, "global_step": 393273, "epoch": 2340} {"train_loss": -11.85512638092041, "global_step": 393274, "epoch": 2340} {"train_loss": -12.530019760131836, "global_step": 393275, "epoch": 2340} {"train_loss": -11.833749771118164, "global_step": 393276, "epoch": 2340} {"train_loss": -12.56787395477295, "global_step": 393277, "epoch": 2340} {"train_loss": -12.160463333129883, "global_step": 393278, "epoch": 2340} {"train_loss": -11.88677978515625, "global_step": 393279, "epoch": 2340} {"train_loss": -12.546470642089844, "global_step": 393280, "epoch": 2340} {"train_loss": -11.893828392028809, "global_step": 393281, "epoch": 2340} {"train_loss": -12.273618698120117, "global_step": 393282, "epoch": 2340} {"train_loss": -11.990642547607422, "global_step": 393283, "epoch": 2340} {"train_loss": -12.585182189941406, "global_step": 393284, "epoch": 2340} {"train_loss": -12.24459171295166, "global_step": 393285, "epoch": 2340} {"train_loss": -12.155156135559082, "global_step": 393286, "epoch": 2340} {"train_loss": -11.883381925878071, "global_step": 393287, "epoch": 2340, "val_loss": 296398.78125, "train_action_mse_error": 2.107079267501831} {"train_loss": -12.600214958190918, "global_step": 393288, "epoch": 2341} {"train_loss": -12.432985305786133, "global_step": 393289, "epoch": 2341} {"train_loss": -12.389680862426758, "global_step": 393290, "epoch": 2341} {"train_loss": -12.567524909973145, "global_step": 393291, "epoch": 2341} {"train_loss": -12.28533935546875, "global_step": 393292, "epoch": 2341} {"train_loss": -12.052177429199219, "global_step": 393293, "epoch": 2341} {"train_loss": -12.644001007080078, "global_step": 393294, "epoch": 2341} {"train_loss": -12.36872386932373, "global_step": 393295, "epoch": 2341} {"train_loss": -12.470206260681152, "global_step": 393296, "epoch": 2341} {"train_loss": -12.198639869689941, "global_step": 393297, "epoch": 2341} {"train_loss": -12.240935325622559, "global_step": 393298, "epoch": 2341} {"train_loss": -12.242595672607422, "global_step": 393299, "epoch": 2341} {"train_loss": -12.280003547668457, "global_step": 393300, "epoch": 2341} {"train_loss": -12.558927536010742, "global_step": 393301, "epoch": 2341} {"train_loss": -12.177315711975098, "global_step": 393302, "epoch": 2341} {"train_loss": -12.544801712036133, "global_step": 393303, "epoch": 2341} {"train_loss": -12.430985450744629, "global_step": 393304, "epoch": 2341} {"train_loss": -12.175292015075684, "global_step": 393305, "epoch": 2341} {"train_loss": -12.486971855163574, "global_step": 393306, "epoch": 2341} {"train_loss": -12.492074966430664, "global_step": 393307, "epoch": 2341} {"train_loss": -12.377771377563477, "global_step": 393308, "epoch": 2341} {"train_loss": -12.450326919555664, "global_step": 393309, "epoch": 2341} {"train_loss": -12.404468536376953, "global_step": 393310, "epoch": 2341} {"train_loss": -12.360055923461914, "global_step": 393311, "epoch": 2341} {"train_loss": -12.508220672607422, "global_step": 393312, "epoch": 2341} {"train_loss": -11.782673835754395, "global_step": 393313, "epoch": 2341} {"train_loss": -12.562032699584961, "global_step": 393314, "epoch": 2341} {"train_loss": -12.247766494750977, "global_step": 393315, "epoch": 2341} {"train_loss": -11.78933334350586, "global_step": 393316, "epoch": 2341} {"train_loss": -12.46520709991455, "global_step": 393317, "epoch": 2341} {"train_loss": -11.895597457885742, "global_step": 393318, "epoch": 2341} {"train_loss": -12.428091049194336, "global_step": 393319, "epoch": 2341} {"train_loss": -11.662416458129883, "global_step": 393320, "epoch": 2341} {"train_loss": -11.438369750976562, "global_step": 393321, "epoch": 2341} {"train_loss": -12.125418663024902, "global_step": 393322, "epoch": 2341} {"train_loss": -12.302289962768555, "global_step": 393323, "epoch": 2341} {"train_loss": -12.404608726501465, "global_step": 393324, "epoch": 2341} {"train_loss": -12.798173904418945, "global_step": 393325, "epoch": 2341} {"train_loss": -12.218897819519043, "global_step": 393326, "epoch": 2341} {"train_loss": -12.720710754394531, "global_step": 393327, "epoch": 2341} {"train_loss": -12.526315689086914, "global_step": 393328, "epoch": 2341} {"train_loss": -12.392731666564941, "global_step": 393329, "epoch": 2341} {"train_loss": -12.268295288085938, "global_step": 393330, "epoch": 2341} {"train_loss": -12.321136474609375, "global_step": 393331, "epoch": 2341} {"train_loss": -12.041006088256836, "global_step": 393332, "epoch": 2341} {"train_loss": -12.556068420410156, "global_step": 393333, "epoch": 2341} {"train_loss": -12.309057235717773, "global_step": 393334, "epoch": 2341} {"train_loss": -12.170226097106934, "global_step": 393335, "epoch": 2341} {"train_loss": -12.526948928833008, "global_step": 393336, "epoch": 2341} {"train_loss": -12.515788078308105, "global_step": 393337, "epoch": 2341} {"train_loss": -12.458662033081055, "global_step": 393338, "epoch": 2341} {"train_loss": -12.402763366699219, "global_step": 393339, "epoch": 2341} {"train_loss": -12.343942642211914, "global_step": 393340, "epoch": 2341} {"train_loss": -12.421432495117188, "global_step": 393341, "epoch": 2341} {"train_loss": -12.208131790161133, "global_step": 393342, "epoch": 2341} {"train_loss": -12.164716720581055, "global_step": 393343, "epoch": 2341} {"train_loss": -12.58622932434082, "global_step": 393344, "epoch": 2341} {"train_loss": -12.530324935913086, "global_step": 393345, "epoch": 2341} {"train_loss": -12.295191764831543, "global_step": 393346, "epoch": 2341} {"train_loss": -11.948585510253906, "global_step": 393347, "epoch": 2341} {"train_loss": -11.533307075500488, "global_step": 393348, "epoch": 2341} {"train_loss": -12.435115814208984, "global_step": 393349, "epoch": 2341} {"train_loss": -11.701766967773438, "global_step": 393350, "epoch": 2341} {"train_loss": -10.369197845458984, "global_step": 393351, "epoch": 2341} {"train_loss": -11.042547225952148, "global_step": 393352, "epoch": 2341} {"train_loss": -12.059746742248535, "global_step": 393353, "epoch": 2341} {"train_loss": -9.459043502807617, "global_step": 393354, "epoch": 2341} {"train_loss": -11.419650077819824, "global_step": 393355, "epoch": 2341} {"train_loss": -10.10419750213623, "global_step": 393356, "epoch": 2341} {"train_loss": -9.508593559265137, "global_step": 393357, "epoch": 2341} {"train_loss": -12.251070022583008, "global_step": 393358, "epoch": 2341} {"train_loss": -9.737833976745605, "global_step": 393359, "epoch": 2341} {"train_loss": -11.063841819763184, "global_step": 393360, "epoch": 2341} {"train_loss": -7.85560417175293, "global_step": 393361, "epoch": 2341} {"train_loss": -8.307472229003906, "global_step": 393362, "epoch": 2341} {"train_loss": -8.128854751586914, "global_step": 393363, "epoch": 2341} {"train_loss": -8.173920631408691, "global_step": 393364, "epoch": 2341} {"train_loss": -7.597179412841797, "global_step": 393365, "epoch": 2341} {"train_loss": -9.295626640319824, "global_step": 393366, "epoch": 2341} {"train_loss": -8.388538360595703, "global_step": 393367, "epoch": 2341} {"train_loss": -8.744097709655762, "global_step": 393368, "epoch": 2341} {"train_loss": -9.443257331848145, "global_step": 393369, "epoch": 2341} {"train_loss": -8.629164695739746, "global_step": 393370, "epoch": 2341} {"train_loss": -10.117535591125488, "global_step": 393371, "epoch": 2341} {"train_loss": -9.969754219055176, "global_step": 393372, "epoch": 2341} {"train_loss": -10.714234352111816, "global_step": 393373, "epoch": 2341} {"train_loss": -10.389278411865234, "global_step": 393374, "epoch": 2341} {"train_loss": -11.186880111694336, "global_step": 393375, "epoch": 2341} {"train_loss": -10.29550552368164, "global_step": 393376, "epoch": 2341} {"train_loss": -10.864649772644043, "global_step": 393377, "epoch": 2341} {"train_loss": -10.149826049804688, "global_step": 393378, "epoch": 2341} {"train_loss": -9.405149459838867, "global_step": 393379, "epoch": 2341} {"train_loss": -10.7385835647583, "global_step": 393380, "epoch": 2341} {"train_loss": -9.954587936401367, "global_step": 393381, "epoch": 2341} {"train_loss": -11.231860160827637, "global_step": 393382, "epoch": 2341} {"train_loss": -10.907144546508789, "global_step": 393383, "epoch": 2341} {"train_loss": -11.127735137939453, "global_step": 393384, "epoch": 2341} {"train_loss": -11.277559280395508, "global_step": 393385, "epoch": 2341} {"train_loss": -11.565448760986328, "global_step": 393386, "epoch": 2341} {"train_loss": -11.43791389465332, "global_step": 393387, "epoch": 2341} {"train_loss": -11.78255844116211, "global_step": 393388, "epoch": 2341} {"train_loss": -11.641691207885742, "global_step": 393389, "epoch": 2341} {"train_loss": -11.867830276489258, "global_step": 393390, "epoch": 2341} {"train_loss": -11.839578628540039, "global_step": 393391, "epoch": 2341} {"train_loss": -12.074520111083984, "global_step": 393392, "epoch": 2341} {"train_loss": -11.776345252990723, "global_step": 393393, "epoch": 2341} {"train_loss": -12.057631492614746, "global_step": 393394, "epoch": 2341} {"train_loss": -12.048364639282227, "global_step": 393395, "epoch": 2341} {"train_loss": -12.104747772216797, "global_step": 393396, "epoch": 2341} {"train_loss": -11.840099334716797, "global_step": 393397, "epoch": 2341} {"train_loss": -12.210274696350098, "global_step": 393398, "epoch": 2341} {"train_loss": -12.101844787597656, "global_step": 393399, "epoch": 2341} {"train_loss": -11.964248657226562, "global_step": 393400, "epoch": 2341} {"train_loss": -12.153529167175293, "global_step": 393401, "epoch": 2341} {"train_loss": -11.756246566772461, "global_step": 393402, "epoch": 2341} {"train_loss": -12.194242477416992, "global_step": 393403, "epoch": 2341} {"train_loss": -11.729106903076172, "global_step": 393404, "epoch": 2341} {"train_loss": -12.187959671020508, "global_step": 393405, "epoch": 2341} {"train_loss": -12.042749404907227, "global_step": 393406, "epoch": 2341} {"train_loss": -12.12582015991211, "global_step": 393407, "epoch": 2341} {"train_loss": -12.033069610595703, "global_step": 393408, "epoch": 2341} {"train_loss": -12.401638984680176, "global_step": 393409, "epoch": 2341} {"train_loss": -12.236472129821777, "global_step": 393410, "epoch": 2341} {"train_loss": -12.368250846862793, "global_step": 393411, "epoch": 2341} {"train_loss": -12.159161567687988, "global_step": 393412, "epoch": 2341} {"train_loss": -12.432331085205078, "global_step": 393413, "epoch": 2341} {"train_loss": -12.364604949951172, "global_step": 393414, "epoch": 2341} {"train_loss": -12.459554672241211, "global_step": 393415, "epoch": 2341} {"train_loss": -12.416573524475098, "global_step": 393416, "epoch": 2341} {"train_loss": -12.305469512939453, "global_step": 393417, "epoch": 2341} {"train_loss": -12.436202049255371, "global_step": 393418, "epoch": 2341} {"train_loss": -12.195164680480957, "global_step": 393419, "epoch": 2341} {"train_loss": -12.522650718688965, "global_step": 393420, "epoch": 2341} {"train_loss": -12.283770561218262, "global_step": 393421, "epoch": 2341} {"train_loss": -12.164180755615234, "global_step": 393422, "epoch": 2341} {"train_loss": -12.347940444946289, "global_step": 393423, "epoch": 2341} {"train_loss": -12.459790229797363, "global_step": 393424, "epoch": 2341} {"train_loss": -12.498332977294922, "global_step": 393425, "epoch": 2341} {"train_loss": -12.42180061340332, "global_step": 393426, "epoch": 2341} {"train_loss": -12.548460960388184, "global_step": 393427, "epoch": 2341} {"train_loss": -12.597358703613281, "global_step": 393428, "epoch": 2341} {"train_loss": -12.719398498535156, "global_step": 393429, "epoch": 2341} {"train_loss": -12.520511627197266, "global_step": 393430, "epoch": 2341} {"train_loss": -12.67182731628418, "global_step": 393431, "epoch": 2341} {"train_loss": -12.446048736572266, "global_step": 393432, "epoch": 2341} {"train_loss": -12.631760597229004, "global_step": 393433, "epoch": 2341} {"train_loss": -12.444536209106445, "global_step": 393434, "epoch": 2341} {"train_loss": -12.521350860595703, "global_step": 393435, "epoch": 2341} {"train_loss": -12.628257751464844, "global_step": 393436, "epoch": 2341} {"train_loss": -12.708118438720703, "global_step": 393437, "epoch": 2341} {"train_loss": -12.558303833007812, "global_step": 393438, "epoch": 2341} {"train_loss": -12.656767845153809, "global_step": 393439, "epoch": 2341} {"train_loss": -12.706199645996094, "global_step": 393440, "epoch": 2341} {"train_loss": -12.53498363494873, "global_step": 393441, "epoch": 2341} {"train_loss": -12.577892303466797, "global_step": 393442, "epoch": 2341} {"train_loss": -12.700061798095703, "global_step": 393443, "epoch": 2341} {"train_loss": -12.781521797180176, "global_step": 393444, "epoch": 2341} {"train_loss": -12.632579803466797, "global_step": 393445, "epoch": 2341} {"train_loss": -12.452484130859375, "global_step": 393446, "epoch": 2341} {"train_loss": -12.643821716308594, "global_step": 393447, "epoch": 2341} {"train_loss": -12.662359237670898, "global_step": 393448, "epoch": 2341} {"train_loss": -12.765459060668945, "global_step": 393449, "epoch": 2341} {"train_loss": -12.53198528289795, "global_step": 393450, "epoch": 2341} {"train_loss": -12.837841987609863, "global_step": 393451, "epoch": 2341} {"train_loss": -12.939168930053711, "global_step": 393452, "epoch": 2341} {"train_loss": -12.733083724975586, "global_step": 393453, "epoch": 2341} {"train_loss": -12.779961585998535, "global_step": 393454, "epoch": 2341} {"train_loss": -11.83862202508109, "global_step": 393455, "epoch": 2341, "val_loss": 299194.28125} {"train_loss": -12.819120407104492, "global_step": 393456, "epoch": 2342} {"train_loss": -12.809886932373047, "global_step": 393457, "epoch": 2342} {"train_loss": -12.774030685424805, "global_step": 393458, "epoch": 2342} {"train_loss": -12.812334060668945, "global_step": 393459, "epoch": 2342} {"train_loss": -12.726279258728027, "global_step": 393460, "epoch": 2342} {"train_loss": -12.76852798461914, "global_step": 393461, "epoch": 2342} {"train_loss": -12.727508544921875, "global_step": 393462, "epoch": 2342} {"train_loss": -12.641866683959961, "global_step": 393463, "epoch": 2342} {"train_loss": -12.648146629333496, "global_step": 393464, "epoch": 2342} {"train_loss": -12.460943222045898, "global_step": 393465, "epoch": 2342} {"train_loss": -11.756080627441406, "global_step": 393466, "epoch": 2342} {"train_loss": -11.70008659362793, "global_step": 393467, "epoch": 2342} {"train_loss": -11.73133659362793, "global_step": 393468, "epoch": 2342} {"train_loss": -12.01445198059082, "global_step": 393469, "epoch": 2342} {"train_loss": -11.85757827758789, "global_step": 393470, "epoch": 2342} {"train_loss": -11.953490257263184, "global_step": 393471, "epoch": 2342} {"train_loss": -12.241781234741211, "global_step": 393472, "epoch": 2342} {"train_loss": -12.28383731842041, "global_step": 393473, "epoch": 2342} {"train_loss": -12.177591323852539, "global_step": 393474, "epoch": 2342} {"train_loss": -11.875706672668457, "global_step": 393475, "epoch": 2342} {"train_loss": -10.2190580368042, "global_step": 393476, "epoch": 2342} {"train_loss": -11.019707679748535, "global_step": 393477, "epoch": 2342} {"train_loss": -11.801777839660645, "global_step": 393478, "epoch": 2342} {"train_loss": -9.090496063232422, "global_step": 393479, "epoch": 2342} {"train_loss": -6.818912029266357, "global_step": 393480, "epoch": 2342} {"train_loss": -8.318001747131348, "global_step": 393481, "epoch": 2342} {"train_loss": -7.24108362197876, "global_step": 393482, "epoch": 2342} {"train_loss": -7.379956245422363, "global_step": 393483, "epoch": 2342} {"train_loss": -6.931200981140137, "global_step": 393484, "epoch": 2342} {"train_loss": -7.83186149597168, "global_step": 393485, "epoch": 2342} {"train_loss": -8.230621337890625, "global_step": 393486, "epoch": 2342} {"train_loss": -8.109490394592285, "global_step": 393487, "epoch": 2342} {"train_loss": -8.397553443908691, "global_step": 393488, "epoch": 2342} {"train_loss": -8.503643035888672, "global_step": 393489, "epoch": 2342} {"train_loss": -8.634254455566406, "global_step": 393490, "epoch": 2342} {"train_loss": -8.701478958129883, "global_step": 393491, "epoch": 2342} {"train_loss": -7.890761375427246, "global_step": 393492, "epoch": 2342} {"train_loss": -8.565876007080078, "global_step": 393493, "epoch": 2342} {"train_loss": -8.966854095458984, "global_step": 393494, "epoch": 2342} {"train_loss": -8.666179656982422, "global_step": 393495, "epoch": 2342} {"train_loss": -9.296296119689941, "global_step": 393496, "epoch": 2342} {"train_loss": -9.1842622756958, "global_step": 393497, "epoch": 2342} {"train_loss": -9.303057670593262, "global_step": 393498, "epoch": 2342} {"train_loss": -9.788063049316406, "global_step": 393499, "epoch": 2342} {"train_loss": -9.55221939086914, "global_step": 393500, "epoch": 2342} {"train_loss": -10.000146865844727, "global_step": 393501, "epoch": 2342} {"train_loss": -10.231805801391602, "global_step": 393502, "epoch": 2342} {"train_loss": -9.832353591918945, "global_step": 393503, "epoch": 2342} {"train_loss": -10.31529426574707, "global_step": 393504, "epoch": 2342} {"train_loss": -10.389518737792969, "global_step": 393505, "epoch": 2342} {"train_loss": -10.316561698913574, "global_step": 393506, "epoch": 2342} {"train_loss": -10.605249404907227, "global_step": 393507, "epoch": 2342} {"train_loss": -10.994877815246582, "global_step": 393508, "epoch": 2342} {"train_loss": -10.33315372467041, "global_step": 393509, "epoch": 2342} {"train_loss": -10.834498405456543, "global_step": 393510, "epoch": 2342} {"train_loss": -10.729837417602539, "global_step": 393511, "epoch": 2342} {"train_loss": -11.072542190551758, "global_step": 393512, "epoch": 2342} {"train_loss": -11.083831787109375, "global_step": 393513, "epoch": 2342} {"train_loss": -10.980829238891602, "global_step": 393514, "epoch": 2342} {"train_loss": -11.41518783569336, "global_step": 393515, "epoch": 2342} {"train_loss": -11.221715927124023, "global_step": 393516, "epoch": 2342} {"train_loss": -11.080495834350586, "global_step": 393517, "epoch": 2342} {"train_loss": -11.063252449035645, "global_step": 393518, "epoch": 2342} {"train_loss": -10.974535942077637, "global_step": 393519, "epoch": 2342} {"train_loss": -11.650182723999023, "global_step": 393520, "epoch": 2342} {"train_loss": -11.392807960510254, "global_step": 393521, "epoch": 2342} {"train_loss": -11.483175277709961, "global_step": 393522, "epoch": 2342} {"train_loss": -11.44246768951416, "global_step": 393523, "epoch": 2342} {"train_loss": -11.420063972473145, "global_step": 393524, "epoch": 2342} {"train_loss": -11.397721290588379, "global_step": 393525, "epoch": 2342} {"train_loss": -11.868834495544434, "global_step": 393526, "epoch": 2342} {"train_loss": -11.6375093460083, "global_step": 393527, "epoch": 2342} {"train_loss": -11.999547958374023, "global_step": 393528, "epoch": 2342} {"train_loss": -11.789226531982422, "global_step": 393529, "epoch": 2342} {"train_loss": -11.875884056091309, "global_step": 393530, "epoch": 2342} {"train_loss": -11.828573226928711, "global_step": 393531, "epoch": 2342} {"train_loss": -12.084321975708008, "global_step": 393532, "epoch": 2342} {"train_loss": -11.230579376220703, "global_step": 393533, "epoch": 2342} {"train_loss": -11.590996742248535, "global_step": 393534, "epoch": 2342} {"train_loss": -11.634575843811035, "global_step": 393535, "epoch": 2342} {"train_loss": -11.67124080657959, "global_step": 393536, "epoch": 2342} {"train_loss": -11.949563980102539, "global_step": 393537, "epoch": 2342} {"train_loss": -11.888278007507324, "global_step": 393538, "epoch": 2342} {"train_loss": -11.669168472290039, "global_step": 393539, "epoch": 2342} {"train_loss": -11.990488052368164, "global_step": 393540, "epoch": 2342} {"train_loss": -12.197441101074219, "global_step": 393541, "epoch": 2342} {"train_loss": -11.939094543457031, "global_step": 393542, "epoch": 2342} {"train_loss": -12.302456855773926, "global_step": 393543, "epoch": 2342} {"train_loss": -11.737653732299805, "global_step": 393544, "epoch": 2342} {"train_loss": -11.972452163696289, "global_step": 393545, "epoch": 2342} {"train_loss": -12.01738166809082, "global_step": 393546, "epoch": 2342} {"train_loss": -12.251044273376465, "global_step": 393547, "epoch": 2342} {"train_loss": -11.634172439575195, "global_step": 393548, "epoch": 2342} {"train_loss": -11.933809280395508, "global_step": 393549, "epoch": 2342} {"train_loss": -11.489574432373047, "global_step": 393550, "epoch": 2342} {"train_loss": -11.815685272216797, "global_step": 393551, "epoch": 2342} {"train_loss": -12.098126411437988, "global_step": 393552, "epoch": 2342} {"train_loss": -11.682101249694824, "global_step": 393553, "epoch": 2342} {"train_loss": -11.735803604125977, "global_step": 393554, "epoch": 2342} {"train_loss": -11.983377456665039, "global_step": 393555, "epoch": 2342} {"train_loss": -11.813187599182129, "global_step": 393556, "epoch": 2342} {"train_loss": -11.346370697021484, "global_step": 393557, "epoch": 2342} {"train_loss": -11.64130973815918, "global_step": 393558, "epoch": 2342} {"train_loss": -11.948115348815918, "global_step": 393559, "epoch": 2342} {"train_loss": -11.934049606323242, "global_step": 393560, "epoch": 2342} {"train_loss": -11.999835014343262, "global_step": 393561, "epoch": 2342} {"train_loss": -12.011812210083008, "global_step": 393562, "epoch": 2342} {"train_loss": -12.135793685913086, "global_step": 393563, "epoch": 2342} {"train_loss": -12.047109603881836, "global_step": 393564, "epoch": 2342} {"train_loss": -11.335830688476562, "global_step": 393565, "epoch": 2342} {"train_loss": -12.053994178771973, "global_step": 393566, "epoch": 2342} {"train_loss": -11.576662063598633, "global_step": 393567, "epoch": 2342} {"train_loss": -11.679798126220703, "global_step": 393568, "epoch": 2342} {"train_loss": -12.253637313842773, "global_step": 393569, "epoch": 2342} {"train_loss": -11.581352233886719, "global_step": 393570, "epoch": 2342} {"train_loss": -12.333709716796875, "global_step": 393571, "epoch": 2342} {"train_loss": -12.297704696655273, "global_step": 393572, "epoch": 2342} {"train_loss": -12.20498275756836, "global_step": 393573, "epoch": 2342} {"train_loss": -12.235895156860352, "global_step": 393574, "epoch": 2342} {"train_loss": -11.69666862487793, "global_step": 393575, "epoch": 2342} {"train_loss": -11.956548690795898, "global_step": 393576, "epoch": 2342} {"train_loss": -11.71274185180664, "global_step": 393577, "epoch": 2342} {"train_loss": -12.026765823364258, "global_step": 393578, "epoch": 2342} {"train_loss": -11.755407333374023, "global_step": 393579, "epoch": 2342} {"train_loss": -11.491294860839844, "global_step": 393580, "epoch": 2342} {"train_loss": -12.036149978637695, "global_step": 393581, "epoch": 2342} {"train_loss": -11.61413288116455, "global_step": 393582, "epoch": 2342} {"train_loss": -12.487176895141602, "global_step": 393583, "epoch": 2342} {"train_loss": -11.54216194152832, "global_step": 393584, "epoch": 2342} {"train_loss": -12.203828811645508, "global_step": 393585, "epoch": 2342} {"train_loss": -11.888692855834961, "global_step": 393586, "epoch": 2342} {"train_loss": -11.748912811279297, "global_step": 393587, "epoch": 2342} {"train_loss": -12.082415580749512, "global_step": 393588, "epoch": 2342} {"train_loss": -11.772789001464844, "global_step": 393589, "epoch": 2342} {"train_loss": -11.589265823364258, "global_step": 393590, "epoch": 2342} {"train_loss": -12.41694164276123, "global_step": 393591, "epoch": 2342} {"train_loss": -12.031967163085938, "global_step": 393592, "epoch": 2342} {"train_loss": -11.442449569702148, "global_step": 393593, "epoch": 2342} {"train_loss": -11.898195266723633, "global_step": 393594, "epoch": 2342} {"train_loss": -12.156007766723633, "global_step": 393595, "epoch": 2342} {"train_loss": -11.051508903503418, "global_step": 393596, "epoch": 2342} {"train_loss": -11.405576705932617, "global_step": 393597, "epoch": 2342} {"train_loss": -11.377202987670898, "global_step": 393598, "epoch": 2342} {"train_loss": -11.304509162902832, "global_step": 393599, "epoch": 2342} {"train_loss": -11.985700607299805, "global_step": 393600, "epoch": 2342} {"train_loss": -11.857362747192383, "global_step": 393601, "epoch": 2342} {"train_loss": -12.063215255737305, "global_step": 393602, "epoch": 2342} {"train_loss": -11.994817733764648, "global_step": 393603, "epoch": 2342} {"train_loss": -12.025371551513672, "global_step": 393604, "epoch": 2342} {"train_loss": -12.020059585571289, "global_step": 393605, "epoch": 2342} {"train_loss": -12.33823013305664, "global_step": 393606, "epoch": 2342} {"train_loss": -12.01934814453125, "global_step": 393607, "epoch": 2342} {"train_loss": -12.168915748596191, "global_step": 393608, "epoch": 2342} {"train_loss": -12.159765243530273, "global_step": 393609, "epoch": 2342} {"train_loss": -11.824777603149414, "global_step": 393610, "epoch": 2342} {"train_loss": -11.63951301574707, "global_step": 393611, "epoch": 2342} {"train_loss": -12.179122924804688, "global_step": 393612, "epoch": 2342} {"train_loss": -11.831905364990234, "global_step": 393613, "epoch": 2342} {"train_loss": -12.505541801452637, "global_step": 393614, "epoch": 2342} {"train_loss": -12.115851402282715, "global_step": 393615, "epoch": 2342} {"train_loss": -12.301981925964355, "global_step": 393616, "epoch": 2342} {"train_loss": -12.218749046325684, "global_step": 393617, "epoch": 2342} {"train_loss": -12.389938354492188, "global_step": 393618, "epoch": 2342} {"train_loss": -11.914108276367188, "global_step": 393619, "epoch": 2342} {"train_loss": -12.174596786499023, "global_step": 393620, "epoch": 2342} {"train_loss": -12.213763236999512, "global_step": 393621, "epoch": 2342} {"train_loss": -12.169954299926758, "global_step": 393622, "epoch": 2342} {"train_loss": -11.337067002341861, "global_step": 393623, "epoch": 2342, "val_loss": 297841.84375} {"train_loss": -12.241279602050781, "global_step": 393624, "epoch": 2343} {"train_loss": -11.905021667480469, "global_step": 393625, "epoch": 2343} {"train_loss": -12.490842819213867, "global_step": 393626, "epoch": 2343} {"train_loss": -11.938209533691406, "global_step": 393627, "epoch": 2343} {"train_loss": -11.866046905517578, "global_step": 393628, "epoch": 2343} {"train_loss": -12.55921745300293, "global_step": 393629, "epoch": 2343} {"train_loss": -12.348509788513184, "global_step": 393630, "epoch": 2343} {"train_loss": -12.321615219116211, "global_step": 393631, "epoch": 2343} {"train_loss": -12.737810134887695, "global_step": 393632, "epoch": 2343} {"train_loss": -12.341751098632812, "global_step": 393633, "epoch": 2343} {"train_loss": -12.58856201171875, "global_step": 393634, "epoch": 2343} {"train_loss": -12.3523530960083, "global_step": 393635, "epoch": 2343} {"train_loss": -12.712543487548828, "global_step": 393636, "epoch": 2343} {"train_loss": -12.485930442810059, "global_step": 393637, "epoch": 2343} {"train_loss": -12.25230598449707, "global_step": 393638, "epoch": 2343} {"train_loss": -12.880526542663574, "global_step": 393639, "epoch": 2343} {"train_loss": -12.372308731079102, "global_step": 393640, "epoch": 2343} {"train_loss": -12.389167785644531, "global_step": 393641, "epoch": 2343} {"train_loss": -12.521759033203125, "global_step": 393642, "epoch": 2343} {"train_loss": -12.397772789001465, "global_step": 393643, "epoch": 2343} {"train_loss": -12.272622108459473, "global_step": 393644, "epoch": 2343} {"train_loss": -12.45498275756836, "global_step": 393645, "epoch": 2343} {"train_loss": -12.435235023498535, "global_step": 393646, "epoch": 2343} {"train_loss": -12.402477264404297, "global_step": 393647, "epoch": 2343} {"train_loss": -12.474653244018555, "global_step": 393648, "epoch": 2343} {"train_loss": -11.910760879516602, "global_step": 393649, "epoch": 2343} {"train_loss": -12.29193115234375, "global_step": 393650, "epoch": 2343} {"train_loss": -12.281717300415039, "global_step": 393651, "epoch": 2343} {"train_loss": -11.434919357299805, "global_step": 393652, "epoch": 2343} {"train_loss": -11.897735595703125, "global_step": 393653, "epoch": 2343} {"train_loss": -12.442831039428711, "global_step": 393654, "epoch": 2343} {"train_loss": -11.959686279296875, "global_step": 393655, "epoch": 2343} {"train_loss": -11.693751335144043, "global_step": 393656, "epoch": 2343} {"train_loss": -12.187450408935547, "global_step": 393657, "epoch": 2343} {"train_loss": -11.774242401123047, "global_step": 393658, "epoch": 2343} {"train_loss": -11.597236633300781, "global_step": 393659, "epoch": 2343} {"train_loss": -11.201637268066406, "global_step": 393660, "epoch": 2343} {"train_loss": -10.629988670349121, "global_step": 393661, "epoch": 2343} {"train_loss": -11.767035484313965, "global_step": 393662, "epoch": 2343} {"train_loss": -10.98846435546875, "global_step": 393663, "epoch": 2343} {"train_loss": -10.31694221496582, "global_step": 393664, "epoch": 2343} {"train_loss": -10.684276580810547, "global_step": 393665, "epoch": 2343} {"train_loss": -10.682544708251953, "global_step": 393666, "epoch": 2343} {"train_loss": -9.358741760253906, "global_step": 393667, "epoch": 2343} {"train_loss": -8.630825996398926, "global_step": 393668, "epoch": 2343} {"train_loss": -9.721961975097656, "global_step": 393669, "epoch": 2343} {"train_loss": -9.673095703125, "global_step": 393670, "epoch": 2343} {"train_loss": -9.806981086730957, "global_step": 393671, "epoch": 2343} {"train_loss": -9.078756332397461, "global_step": 393672, "epoch": 2343} {"train_loss": -10.069380760192871, "global_step": 393673, "epoch": 2343} {"train_loss": -8.480264663696289, "global_step": 393674, "epoch": 2343} {"train_loss": -10.237842559814453, "global_step": 393675, "epoch": 2343} {"train_loss": -10.162862777709961, "global_step": 393676, "epoch": 2343} {"train_loss": -9.522340774536133, "global_step": 393677, "epoch": 2343} {"train_loss": -9.66712760925293, "global_step": 393678, "epoch": 2343} {"train_loss": -10.811563491821289, "global_step": 393679, "epoch": 2343} {"train_loss": -10.5079984664917, "global_step": 393680, "epoch": 2343} {"train_loss": -11.75752067565918, "global_step": 393681, "epoch": 2343} {"train_loss": -10.123289108276367, "global_step": 393682, "epoch": 2343} {"train_loss": -10.897172927856445, "global_step": 393683, "epoch": 2343} {"train_loss": -10.292289733886719, "global_step": 393684, "epoch": 2343} {"train_loss": -11.380167961120605, "global_step": 393685, "epoch": 2343} {"train_loss": -10.377245903015137, "global_step": 393686, "epoch": 2343} {"train_loss": -11.00283432006836, "global_step": 393687, "epoch": 2343} {"train_loss": -10.426368713378906, "global_step": 393688, "epoch": 2343} {"train_loss": -9.727001190185547, "global_step": 393689, "epoch": 2343} {"train_loss": -9.34201431274414, "global_step": 393690, "epoch": 2343} {"train_loss": -10.180793762207031, "global_step": 393691, "epoch": 2343} {"train_loss": -10.5784330368042, "global_step": 393692, "epoch": 2343} {"train_loss": -11.176835060119629, "global_step": 393693, "epoch": 2343} {"train_loss": -10.554533004760742, "global_step": 393694, "epoch": 2343} {"train_loss": -10.880596160888672, "global_step": 393695, "epoch": 2343} {"train_loss": -10.424079895019531, "global_step": 393696, "epoch": 2343} {"train_loss": -10.837052345275879, "global_step": 393697, "epoch": 2343} {"train_loss": -10.277206420898438, "global_step": 393698, "epoch": 2343} {"train_loss": -10.920875549316406, "global_step": 393699, "epoch": 2343} {"train_loss": -11.035234451293945, "global_step": 393700, "epoch": 2343} {"train_loss": -10.70594596862793, "global_step": 393701, "epoch": 2343} {"train_loss": -10.860313415527344, "global_step": 393702, "epoch": 2343} {"train_loss": -11.35666275024414, "global_step": 393703, "epoch": 2343} {"train_loss": -11.512112617492676, "global_step": 393704, "epoch": 2343} {"train_loss": -11.114706039428711, "global_step": 393705, "epoch": 2343} {"train_loss": -11.273760795593262, "global_step": 393706, "epoch": 2343} {"train_loss": -11.594352722167969, "global_step": 393707, "epoch": 2343} {"train_loss": -11.13257122039795, "global_step": 393708, "epoch": 2343} {"train_loss": -11.73513126373291, "global_step": 393709, "epoch": 2343} {"train_loss": -11.457329750061035, "global_step": 393710, "epoch": 2343} {"train_loss": -11.60824966430664, "global_step": 393711, "epoch": 2343} {"train_loss": -11.782973289489746, "global_step": 393712, "epoch": 2343} {"train_loss": -11.580965042114258, "global_step": 393713, "epoch": 2343} {"train_loss": -11.791023254394531, "global_step": 393714, "epoch": 2343} {"train_loss": -11.73538589477539, "global_step": 393715, "epoch": 2343} {"train_loss": -11.623187065124512, "global_step": 393716, "epoch": 2343} {"train_loss": -11.755218505859375, "global_step": 393717, "epoch": 2343} {"train_loss": -12.035470962524414, "global_step": 393718, "epoch": 2343} {"train_loss": -11.76599407196045, "global_step": 393719, "epoch": 2343} {"train_loss": -12.11212158203125, "global_step": 393720, "epoch": 2343} {"train_loss": -11.542621612548828, "global_step": 393721, "epoch": 2343} {"train_loss": -11.991205215454102, "global_step": 393722, "epoch": 2343} {"train_loss": -11.71671199798584, "global_step": 393723, "epoch": 2343} {"train_loss": -11.869842529296875, "global_step": 393724, "epoch": 2343} {"train_loss": -11.74445915222168, "global_step": 393725, "epoch": 2343} {"train_loss": -11.987366676330566, "global_step": 393726, "epoch": 2343} {"train_loss": -11.11459732055664, "global_step": 393727, "epoch": 2343} {"train_loss": -12.036969184875488, "global_step": 393728, "epoch": 2343} {"train_loss": -11.700555801391602, "global_step": 393729, "epoch": 2343} {"train_loss": -11.803291320800781, "global_step": 393730, "epoch": 2343} {"train_loss": -11.191410064697266, "global_step": 393731, "epoch": 2343} {"train_loss": -12.059085845947266, "global_step": 393732, "epoch": 2343} {"train_loss": -11.555845260620117, "global_step": 393733, "epoch": 2343} {"train_loss": -11.966967582702637, "global_step": 393734, "epoch": 2343} {"train_loss": -11.755525588989258, "global_step": 393735, "epoch": 2343} {"train_loss": -12.000482559204102, "global_step": 393736, "epoch": 2343} {"train_loss": -11.79775333404541, "global_step": 393737, "epoch": 2343} {"train_loss": -12.183859825134277, "global_step": 393738, "epoch": 2343} {"train_loss": -11.746448516845703, "global_step": 393739, "epoch": 2343} {"train_loss": -12.355815887451172, "global_step": 393740, "epoch": 2343} {"train_loss": -11.841480255126953, "global_step": 393741, "epoch": 2343} {"train_loss": -12.224395751953125, "global_step": 393742, "epoch": 2343} {"train_loss": -11.887031555175781, "global_step": 393743, "epoch": 2343} {"train_loss": -12.195487022399902, "global_step": 393744, "epoch": 2343} {"train_loss": -11.990313529968262, "global_step": 393745, "epoch": 2343} {"train_loss": -12.309444427490234, "global_step": 393746, "epoch": 2343} {"train_loss": -11.985074996948242, "global_step": 393747, "epoch": 2343} {"train_loss": -12.309892654418945, "global_step": 393748, "epoch": 2343} {"train_loss": -12.170024871826172, "global_step": 393749, "epoch": 2343} {"train_loss": -12.360335350036621, "global_step": 393750, "epoch": 2343} {"train_loss": -12.043718338012695, "global_step": 393751, "epoch": 2343} {"train_loss": -12.116836547851562, "global_step": 393752, "epoch": 2343} {"train_loss": -12.162271499633789, "global_step": 393753, "epoch": 2343} {"train_loss": -12.274002075195312, "global_step": 393754, "epoch": 2343} {"train_loss": -12.312832832336426, "global_step": 393755, "epoch": 2343} {"train_loss": -12.369986534118652, "global_step": 393756, "epoch": 2343} {"train_loss": -12.038414001464844, "global_step": 393757, "epoch": 2343} {"train_loss": -12.196603775024414, "global_step": 393758, "epoch": 2343} {"train_loss": -12.427689552307129, "global_step": 393759, "epoch": 2343} {"train_loss": -12.365297317504883, "global_step": 393760, "epoch": 2343} {"train_loss": -12.663710594177246, "global_step": 393761, "epoch": 2343} {"train_loss": -12.56801700592041, "global_step": 393762, "epoch": 2343} {"train_loss": -12.562725067138672, "global_step": 393763, "epoch": 2343} {"train_loss": -12.524001121520996, "global_step": 393764, "epoch": 2343} {"train_loss": -12.482953071594238, "global_step": 393765, "epoch": 2343} {"train_loss": -12.517011642456055, "global_step": 393766, "epoch": 2343} {"train_loss": -12.320361137390137, "global_step": 393767, "epoch": 2343} {"train_loss": -12.532361030578613, "global_step": 393768, "epoch": 2343} {"train_loss": -12.554019927978516, "global_step": 393769, "epoch": 2343} {"train_loss": -12.517608642578125, "global_step": 393770, "epoch": 2343} {"train_loss": -12.563185691833496, "global_step": 393771, "epoch": 2343} {"train_loss": -12.604682922363281, "global_step": 393772, "epoch": 2343} {"train_loss": -12.389907836914062, "global_step": 393773, "epoch": 2343} {"train_loss": -12.440864562988281, "global_step": 393774, "epoch": 2343} {"train_loss": -12.58255386352539, "global_step": 393775, "epoch": 2343} {"train_loss": -12.602712631225586, "global_step": 393776, "epoch": 2343} {"train_loss": -12.657572746276855, "global_step": 393777, "epoch": 2343} {"train_loss": -12.575729370117188, "global_step": 393778, "epoch": 2343} {"train_loss": -12.630395889282227, "global_step": 393779, "epoch": 2343} {"train_loss": -12.366744041442871, "global_step": 393780, "epoch": 2343} {"train_loss": -12.350299835205078, "global_step": 393781, "epoch": 2343} {"train_loss": -12.63265609741211, "global_step": 393782, "epoch": 2343} {"train_loss": -12.721884727478027, "global_step": 393783, "epoch": 2343} {"train_loss": -12.651264190673828, "global_step": 393784, "epoch": 2343} {"train_loss": -12.443544387817383, "global_step": 393785, "epoch": 2343} {"train_loss": -12.767271041870117, "global_step": 393786, "epoch": 2343} {"train_loss": -12.723268508911133, "global_step": 393787, "epoch": 2343} {"train_loss": -12.586198806762695, "global_step": 393788, "epoch": 2343} {"train_loss": -12.502065658569336, "global_step": 393789, "epoch": 2343} {"train_loss": -12.674311637878418, "global_step": 393790, "epoch": 2343} {"train_loss": -11.696880970682416, "global_step": 393791, "epoch": 2343, "val_loss": 300492.78125} {"train_loss": -12.440488815307617, "global_step": 393792, "epoch": 2344} {"train_loss": -12.639503479003906, "global_step": 393793, "epoch": 2344} {"train_loss": -12.461281776428223, "global_step": 393794, "epoch": 2344} {"train_loss": -12.682589530944824, "global_step": 393795, "epoch": 2344} {"train_loss": -12.502398490905762, "global_step": 393796, "epoch": 2344} {"train_loss": -12.84330940246582, "global_step": 393797, "epoch": 2344} {"train_loss": -12.64675521850586, "global_step": 393798, "epoch": 2344} {"train_loss": -12.782485961914062, "global_step": 393799, "epoch": 2344} {"train_loss": -12.550985336303711, "global_step": 393800, "epoch": 2344} {"train_loss": -12.578634262084961, "global_step": 393801, "epoch": 2344} {"train_loss": -12.555144309997559, "global_step": 393802, "epoch": 2344} {"train_loss": -12.685236930847168, "global_step": 393803, "epoch": 2344} {"train_loss": -12.354333877563477, "global_step": 393804, "epoch": 2344} {"train_loss": -12.591416358947754, "global_step": 393805, "epoch": 2344} {"train_loss": -12.586498260498047, "global_step": 393806, "epoch": 2344} {"train_loss": -12.412386894226074, "global_step": 393807, "epoch": 2344} {"train_loss": -12.601810455322266, "global_step": 393808, "epoch": 2344} {"train_loss": -12.465837478637695, "global_step": 393809, "epoch": 2344} {"train_loss": -11.856464385986328, "global_step": 393810, "epoch": 2344} {"train_loss": -11.49191665649414, "global_step": 393811, "epoch": 2344} {"train_loss": -11.179465293884277, "global_step": 393812, "epoch": 2344} {"train_loss": -12.1134614944458, "global_step": 393813, "epoch": 2344} {"train_loss": -12.753555297851562, "global_step": 393814, "epoch": 2344} {"train_loss": -12.285199165344238, "global_step": 393815, "epoch": 2344} {"train_loss": -12.133180618286133, "global_step": 393816, "epoch": 2344} {"train_loss": -11.133137702941895, "global_step": 393817, "epoch": 2344} {"train_loss": -11.697492599487305, "global_step": 393818, "epoch": 2344} {"train_loss": -12.214139938354492, "global_step": 393819, "epoch": 2344} {"train_loss": -12.640811920166016, "global_step": 393820, "epoch": 2344} {"train_loss": -11.672743797302246, "global_step": 393821, "epoch": 2344} {"train_loss": -12.290606498718262, "global_step": 393822, "epoch": 2344} {"train_loss": -12.241082191467285, "global_step": 393823, "epoch": 2344} {"train_loss": -12.19863510131836, "global_step": 393824, "epoch": 2344} {"train_loss": -11.51327133178711, "global_step": 393825, "epoch": 2344} {"train_loss": -11.191835403442383, "global_step": 393826, "epoch": 2344} {"train_loss": -12.215839385986328, "global_step": 393827, "epoch": 2344} {"train_loss": -10.95100212097168, "global_step": 393828, "epoch": 2344} {"train_loss": -11.688728332519531, "global_step": 393829, "epoch": 2344} {"train_loss": -9.154741287231445, "global_step": 393830, "epoch": 2344} {"train_loss": -9.407384872436523, "global_step": 393831, "epoch": 2344} {"train_loss": -10.546489715576172, "global_step": 393832, "epoch": 2344} {"train_loss": -10.80712890625, "global_step": 393833, "epoch": 2344} {"train_loss": -9.73452377319336, "global_step": 393834, "epoch": 2344} {"train_loss": -9.956793785095215, "global_step": 393835, "epoch": 2344} {"train_loss": -11.04738998413086, "global_step": 393836, "epoch": 2344} {"train_loss": -11.534273147583008, "global_step": 393837, "epoch": 2344} {"train_loss": -10.478023529052734, "global_step": 393838, "epoch": 2344} {"train_loss": -11.625076293945312, "global_step": 393839, "epoch": 2344} {"train_loss": -10.728801727294922, "global_step": 393840, "epoch": 2344} {"train_loss": -12.130820274353027, "global_step": 393841, "epoch": 2344} {"train_loss": -11.540178298950195, "global_step": 393842, "epoch": 2344} {"train_loss": -11.799388885498047, "global_step": 393843, "epoch": 2344} {"train_loss": -11.80893325805664, "global_step": 393844, "epoch": 2344} {"train_loss": -11.836710929870605, "global_step": 393845, "epoch": 2344} {"train_loss": -11.730140686035156, "global_step": 393846, "epoch": 2344} {"train_loss": -11.918560981750488, "global_step": 393847, "epoch": 2344} {"train_loss": -12.146759033203125, "global_step": 393848, "epoch": 2344} {"train_loss": -12.094083786010742, "global_step": 393849, "epoch": 2344} {"train_loss": -12.298646926879883, "global_step": 393850, "epoch": 2344} {"train_loss": -12.0649995803833, "global_step": 393851, "epoch": 2344} {"train_loss": -12.445812225341797, "global_step": 393852, "epoch": 2344} {"train_loss": -11.873682022094727, "global_step": 393853, "epoch": 2344} {"train_loss": -12.228415489196777, "global_step": 393854, "epoch": 2344} {"train_loss": -12.157526969909668, "global_step": 393855, "epoch": 2344} {"train_loss": -12.142766952514648, "global_step": 393856, "epoch": 2344} {"train_loss": -12.37808895111084, "global_step": 393857, "epoch": 2344} {"train_loss": -11.92593002319336, "global_step": 393858, "epoch": 2344} {"train_loss": -12.446271896362305, "global_step": 393859, "epoch": 2344} {"train_loss": -12.410576820373535, "global_step": 393860, "epoch": 2344} {"train_loss": -12.335037231445312, "global_step": 393861, "epoch": 2344} {"train_loss": -12.329084396362305, "global_step": 393862, "epoch": 2344} {"train_loss": -12.712836265563965, "global_step": 393863, "epoch": 2344} {"train_loss": -12.11291790008545, "global_step": 393864, "epoch": 2344} {"train_loss": -12.21932601928711, "global_step": 393865, "epoch": 2344} {"train_loss": -12.290929794311523, "global_step": 393866, "epoch": 2344} {"train_loss": -12.172231674194336, "global_step": 393867, "epoch": 2344} {"train_loss": -12.602804183959961, "global_step": 393868, "epoch": 2344} {"train_loss": -12.559733390808105, "global_step": 393869, "epoch": 2344} {"train_loss": -12.642958641052246, "global_step": 393870, "epoch": 2344} {"train_loss": -12.360635757446289, "global_step": 393871, "epoch": 2344} {"train_loss": -12.1672945022583, "global_step": 393872, "epoch": 2344} {"train_loss": -12.565500259399414, "global_step": 393873, "epoch": 2344} {"train_loss": -12.406756401062012, "global_step": 393874, "epoch": 2344} {"train_loss": -12.368406295776367, "global_step": 393875, "epoch": 2344} {"train_loss": -12.43065071105957, "global_step": 393876, "epoch": 2344} {"train_loss": -12.65927505493164, "global_step": 393877, "epoch": 2344} {"train_loss": -12.459595680236816, "global_step": 393878, "epoch": 2344} {"train_loss": -12.475878715515137, "global_step": 393879, "epoch": 2344} {"train_loss": -12.351733207702637, "global_step": 393880, "epoch": 2344} {"train_loss": -12.377649307250977, "global_step": 393881, "epoch": 2344} {"train_loss": -12.27973461151123, "global_step": 393882, "epoch": 2344} {"train_loss": -12.472099304199219, "global_step": 393883, "epoch": 2344} {"train_loss": -12.730875015258789, "global_step": 393884, "epoch": 2344} {"train_loss": -12.711420059204102, "global_step": 393885, "epoch": 2344} {"train_loss": -12.149478912353516, "global_step": 393886, "epoch": 2344} {"train_loss": -12.173517227172852, "global_step": 393887, "epoch": 2344} {"train_loss": -12.043831825256348, "global_step": 393888, "epoch": 2344} {"train_loss": -12.128089904785156, "global_step": 393889, "epoch": 2344} {"train_loss": -12.023155212402344, "global_step": 393890, "epoch": 2344} {"train_loss": -12.490584373474121, "global_step": 393891, "epoch": 2344} {"train_loss": -12.503046989440918, "global_step": 393892, "epoch": 2344} {"train_loss": -12.411645889282227, "global_step": 393893, "epoch": 2344} {"train_loss": -12.678611755371094, "global_step": 393894, "epoch": 2344} {"train_loss": -12.453272819519043, "global_step": 393895, "epoch": 2344} {"train_loss": -12.310210227966309, "global_step": 393896, "epoch": 2344} {"train_loss": -12.044632911682129, "global_step": 393897, "epoch": 2344} {"train_loss": -12.259611129760742, "global_step": 393898, "epoch": 2344} {"train_loss": -11.691447257995605, "global_step": 393899, "epoch": 2344} {"train_loss": -12.54932975769043, "global_step": 393900, "epoch": 2344} {"train_loss": -11.755224227905273, "global_step": 393901, "epoch": 2344} {"train_loss": -12.198588371276855, "global_step": 393902, "epoch": 2344} {"train_loss": -12.15445327758789, "global_step": 393903, "epoch": 2344} {"train_loss": -12.546686172485352, "global_step": 393904, "epoch": 2344} {"train_loss": -12.095512390136719, "global_step": 393905, "epoch": 2344} {"train_loss": -12.387727737426758, "global_step": 393906, "epoch": 2344} {"train_loss": -11.89632797241211, "global_step": 393907, "epoch": 2344} {"train_loss": -12.42203140258789, "global_step": 393908, "epoch": 2344} {"train_loss": -12.247446060180664, "global_step": 393909, "epoch": 2344} {"train_loss": -12.367510795593262, "global_step": 393910, "epoch": 2344} {"train_loss": -12.064160346984863, "global_step": 393911, "epoch": 2344} {"train_loss": -11.175522804260254, "global_step": 393912, "epoch": 2344} {"train_loss": -11.849807739257812, "global_step": 393913, "epoch": 2344} {"train_loss": -11.61968994140625, "global_step": 393914, "epoch": 2344} {"train_loss": -11.196037292480469, "global_step": 393915, "epoch": 2344} {"train_loss": -10.052250862121582, "global_step": 393916, "epoch": 2344} {"train_loss": -10.701728820800781, "global_step": 393917, "epoch": 2344} {"train_loss": -10.89468002319336, "global_step": 393918, "epoch": 2344} {"train_loss": -9.716168403625488, "global_step": 393919, "epoch": 2344} {"train_loss": -9.397093772888184, "global_step": 393920, "epoch": 2344} {"train_loss": -10.469158172607422, "global_step": 393921, "epoch": 2344} {"train_loss": -10.432573318481445, "global_step": 393922, "epoch": 2344} {"train_loss": -10.955816268920898, "global_step": 393923, "epoch": 2344} {"train_loss": -9.443551063537598, "global_step": 393924, "epoch": 2344} {"train_loss": -8.798690795898438, "global_step": 393925, "epoch": 2344} {"train_loss": -8.883553504943848, "global_step": 393926, "epoch": 2344} {"train_loss": -9.622568130493164, "global_step": 393927, "epoch": 2344} {"train_loss": -10.568132400512695, "global_step": 393928, "epoch": 2344} {"train_loss": -9.919044494628906, "global_step": 393929, "epoch": 2344} {"train_loss": -9.445524215698242, "global_step": 393930, "epoch": 2344} {"train_loss": -10.43197250366211, "global_step": 393931, "epoch": 2344} {"train_loss": -11.324606895446777, "global_step": 393932, "epoch": 2344} {"train_loss": -10.486799240112305, "global_step": 393933, "epoch": 2344} {"train_loss": -9.3527193069458, "global_step": 393934, "epoch": 2344} {"train_loss": -10.046722412109375, "global_step": 393935, "epoch": 2344} {"train_loss": -10.92988395690918, "global_step": 393936, "epoch": 2344} {"train_loss": -10.635465621948242, "global_step": 393937, "epoch": 2344} {"train_loss": -10.389907836914062, "global_step": 393938, "epoch": 2344} {"train_loss": -11.011041641235352, "global_step": 393939, "epoch": 2344} {"train_loss": -11.309457778930664, "global_step": 393940, "epoch": 2344} {"train_loss": -10.61021900177002, "global_step": 393941, "epoch": 2344} {"train_loss": -10.711152076721191, "global_step": 393942, "epoch": 2344} {"train_loss": -10.521700859069824, "global_step": 393943, "epoch": 2344} {"train_loss": -10.479536056518555, "global_step": 393944, "epoch": 2344} {"train_loss": -11.170904159545898, "global_step": 393945, "epoch": 2344} {"train_loss": -10.896486282348633, "global_step": 393946, "epoch": 2344} {"train_loss": -10.983275413513184, "global_step": 393947, "epoch": 2344} {"train_loss": -11.398309707641602, "global_step": 393948, "epoch": 2344} {"train_loss": -10.809698104858398, "global_step": 393949, "epoch": 2344} {"train_loss": -11.509475708007812, "global_step": 393950, "epoch": 2344} {"train_loss": -11.241764068603516, "global_step": 393951, "epoch": 2344} {"train_loss": -11.312577247619629, "global_step": 393952, "epoch": 2344} {"train_loss": -11.464546203613281, "global_step": 393953, "epoch": 2344} {"train_loss": -10.933477401733398, "global_step": 393954, "epoch": 2344} {"train_loss": -11.947380065917969, "global_step": 393955, "epoch": 2344} {"train_loss": -11.463125228881836, "global_step": 393956, "epoch": 2344} {"train_loss": -11.605215072631836, "global_step": 393957, "epoch": 2344} {"train_loss": -11.86180305480957, "global_step": 393958, "epoch": 2344} {"train_loss": -11.685712768917991, "global_step": 393959, "epoch": 2344, "val_loss": 297785.46875} {"train_loss": -12.108976364135742, "global_step": 393960, "epoch": 2345} {"train_loss": -11.837322235107422, "global_step": 393961, "epoch": 2345} {"train_loss": -12.044029235839844, "global_step": 393962, "epoch": 2345} {"train_loss": -11.76603889465332, "global_step": 393963, "epoch": 2345} {"train_loss": -11.960599899291992, "global_step": 393964, "epoch": 2345} {"train_loss": -11.807395935058594, "global_step": 393965, "epoch": 2345} {"train_loss": -12.19261360168457, "global_step": 393966, "epoch": 2345} {"train_loss": -11.844232559204102, "global_step": 393967, "epoch": 2345} {"train_loss": -12.125875473022461, "global_step": 393968, "epoch": 2345} {"train_loss": -12.093438148498535, "global_step": 393969, "epoch": 2345} {"train_loss": -12.1915922164917, "global_step": 393970, "epoch": 2345} {"train_loss": -12.290943145751953, "global_step": 393971, "epoch": 2345} {"train_loss": -12.188936233520508, "global_step": 393972, "epoch": 2345} {"train_loss": -12.144267082214355, "global_step": 393973, "epoch": 2345} {"train_loss": -12.18096923828125, "global_step": 393974, "epoch": 2345} {"train_loss": -11.948356628417969, "global_step": 393975, "epoch": 2345} {"train_loss": -12.123390197753906, "global_step": 393976, "epoch": 2345} {"train_loss": -12.272319793701172, "global_step": 393977, "epoch": 2345} {"train_loss": -12.251452445983887, "global_step": 393978, "epoch": 2345} {"train_loss": -12.194524765014648, "global_step": 393979, "epoch": 2345} {"train_loss": -12.334868431091309, "global_step": 393980, "epoch": 2345} {"train_loss": -12.381169319152832, "global_step": 393981, "epoch": 2345} {"train_loss": -12.049911499023438, "global_step": 393982, "epoch": 2345} {"train_loss": -12.281133651733398, "global_step": 393983, "epoch": 2345} {"train_loss": -12.448159217834473, "global_step": 393984, "epoch": 2345} {"train_loss": -12.30989933013916, "global_step": 393985, "epoch": 2345} {"train_loss": -12.129426956176758, "global_step": 393986, "epoch": 2345} {"train_loss": -12.326332092285156, "global_step": 393987, "epoch": 2345} {"train_loss": -12.298970222473145, "global_step": 393988, "epoch": 2345} {"train_loss": -12.30300521850586, "global_step": 393989, "epoch": 2345} {"train_loss": -12.146097183227539, "global_step": 393990, "epoch": 2345} {"train_loss": -12.39551067352295, "global_step": 393991, "epoch": 2345} {"train_loss": -12.317482948303223, "global_step": 393992, "epoch": 2345} {"train_loss": -12.229787826538086, "global_step": 393993, "epoch": 2345} {"train_loss": -12.325318336486816, "global_step": 393994, "epoch": 2345} {"train_loss": -12.487993240356445, "global_step": 393995, "epoch": 2345} {"train_loss": -12.369017601013184, "global_step": 393996, "epoch": 2345} {"train_loss": -12.437265396118164, "global_step": 393997, "epoch": 2345} {"train_loss": -12.215254783630371, "global_step": 393998, "epoch": 2345} {"train_loss": -12.554871559143066, "global_step": 393999, "epoch": 2345} {"train_loss": -12.467239379882812, "global_step": 394000, "epoch": 2345} {"train_loss": -12.48322582244873, "global_step": 394001, "epoch": 2345} {"train_loss": -12.568168640136719, "global_step": 394002, "epoch": 2345} {"train_loss": -12.244247436523438, "global_step": 394003, "epoch": 2345} {"train_loss": -12.483168601989746, "global_step": 394004, "epoch": 2345} {"train_loss": -12.386404991149902, "global_step": 394005, "epoch": 2345} {"train_loss": -12.276212692260742, "global_step": 394006, "epoch": 2345} {"train_loss": -12.277252197265625, "global_step": 394007, "epoch": 2345} {"train_loss": -12.30200481414795, "global_step": 394008, "epoch": 2345} {"train_loss": -12.080883026123047, "global_step": 394009, "epoch": 2345} {"train_loss": -12.552478790283203, "global_step": 394010, "epoch": 2345} {"train_loss": -12.340641021728516, "global_step": 394011, "epoch": 2345} {"train_loss": -12.320563316345215, "global_step": 394012, "epoch": 2345} {"train_loss": -12.42818832397461, "global_step": 394013, "epoch": 2345} {"train_loss": -12.380661010742188, "global_step": 394014, "epoch": 2345} {"train_loss": -12.563404083251953, "global_step": 394015, "epoch": 2345} {"train_loss": -12.526333808898926, "global_step": 394016, "epoch": 2345} {"train_loss": -12.297039031982422, "global_step": 394017, "epoch": 2345} {"train_loss": -12.45715045928955, "global_step": 394018, "epoch": 2345} {"train_loss": -12.32744312286377, "global_step": 394019, "epoch": 2345} {"train_loss": -12.275047302246094, "global_step": 394020, "epoch": 2345} {"train_loss": -12.388206481933594, "global_step": 394021, "epoch": 2345} {"train_loss": -12.334667205810547, "global_step": 394022, "epoch": 2345} {"train_loss": -12.647452354431152, "global_step": 394023, "epoch": 2345} {"train_loss": -12.46330451965332, "global_step": 394024, "epoch": 2345} {"train_loss": -12.193862915039062, "global_step": 394025, "epoch": 2345} {"train_loss": -11.771589279174805, "global_step": 394026, "epoch": 2345} {"train_loss": -12.508819580078125, "global_step": 394027, "epoch": 2345} {"train_loss": -11.272453308105469, "global_step": 394028, "epoch": 2345} {"train_loss": -11.599578857421875, "global_step": 394029, "epoch": 2345} {"train_loss": -12.122295379638672, "global_step": 394030, "epoch": 2345} {"train_loss": -12.382274627685547, "global_step": 394031, "epoch": 2345} {"train_loss": -11.68640422821045, "global_step": 394032, "epoch": 2345} {"train_loss": -11.516114234924316, "global_step": 394033, "epoch": 2345} {"train_loss": -11.348562240600586, "global_step": 394034, "epoch": 2345} {"train_loss": -11.875316619873047, "global_step": 394035, "epoch": 2345} {"train_loss": -12.322132110595703, "global_step": 394036, "epoch": 2345} {"train_loss": -11.939804077148438, "global_step": 394037, "epoch": 2345} {"train_loss": -11.046043395996094, "global_step": 394038, "epoch": 2345} {"train_loss": -12.139155387878418, "global_step": 394039, "epoch": 2345} {"train_loss": -12.013371467590332, "global_step": 394040, "epoch": 2345} {"train_loss": -12.361400604248047, "global_step": 394041, "epoch": 2345} {"train_loss": -11.801319122314453, "global_step": 394042, "epoch": 2345} {"train_loss": -12.034854888916016, "global_step": 394043, "epoch": 2345} {"train_loss": -12.028051376342773, "global_step": 394044, "epoch": 2345} {"train_loss": -12.081740379333496, "global_step": 394045, "epoch": 2345} {"train_loss": -11.794905662536621, "global_step": 394046, "epoch": 2345} {"train_loss": -11.581523895263672, "global_step": 394047, "epoch": 2345} {"train_loss": -10.05615234375, "global_step": 394048, "epoch": 2345} {"train_loss": -10.758553504943848, "global_step": 394049, "epoch": 2345} {"train_loss": -9.929838180541992, "global_step": 394050, "epoch": 2345} {"train_loss": -11.124791145324707, "global_step": 394051, "epoch": 2345} {"train_loss": -10.318267822265625, "global_step": 394052, "epoch": 2345} {"train_loss": -9.914831161499023, "global_step": 394053, "epoch": 2345} {"train_loss": -9.941551208496094, "global_step": 394054, "epoch": 2345} {"train_loss": -11.001958847045898, "global_step": 394055, "epoch": 2345} {"train_loss": -10.380638122558594, "global_step": 394056, "epoch": 2345} {"train_loss": -10.146947860717773, "global_step": 394057, "epoch": 2345} {"train_loss": -11.077859878540039, "global_step": 394058, "epoch": 2345} {"train_loss": -11.424412727355957, "global_step": 394059, "epoch": 2345} {"train_loss": -10.243514060974121, "global_step": 394060, "epoch": 2345} {"train_loss": -10.290887832641602, "global_step": 394061, "epoch": 2345} {"train_loss": -11.170071601867676, "global_step": 394062, "epoch": 2345} {"train_loss": -9.995216369628906, "global_step": 394063, "epoch": 2345} {"train_loss": -9.751307487487793, "global_step": 394064, "epoch": 2345} {"train_loss": -9.483190536499023, "global_step": 394065, "epoch": 2345} {"train_loss": -10.765312194824219, "global_step": 394066, "epoch": 2345} {"train_loss": -11.111101150512695, "global_step": 394067, "epoch": 2345} {"train_loss": -11.24803352355957, "global_step": 394068, "epoch": 2345} {"train_loss": -11.107481002807617, "global_step": 394069, "epoch": 2345} {"train_loss": -10.012035369873047, "global_step": 394070, "epoch": 2345} {"train_loss": -11.606332778930664, "global_step": 394071, "epoch": 2345} {"train_loss": -10.652599334716797, "global_step": 394072, "epoch": 2345} {"train_loss": -11.455463409423828, "global_step": 394073, "epoch": 2345} {"train_loss": -11.21700668334961, "global_step": 394074, "epoch": 2345} {"train_loss": -10.122047424316406, "global_step": 394075, "epoch": 2345} {"train_loss": -10.344776153564453, "global_step": 394076, "epoch": 2345} {"train_loss": -10.616840362548828, "global_step": 394077, "epoch": 2345} {"train_loss": -10.036297798156738, "global_step": 394078, "epoch": 2345} {"train_loss": -10.526097297668457, "global_step": 394079, "epoch": 2345} {"train_loss": -11.178119659423828, "global_step": 394080, "epoch": 2345} {"train_loss": -10.766522407531738, "global_step": 394081, "epoch": 2345} {"train_loss": -10.691442489624023, "global_step": 394082, "epoch": 2345} {"train_loss": -11.664375305175781, "global_step": 394083, "epoch": 2345} {"train_loss": -11.010276794433594, "global_step": 394084, "epoch": 2345} {"train_loss": -11.331128120422363, "global_step": 394085, "epoch": 2345} {"train_loss": -11.90762710571289, "global_step": 394086, "epoch": 2345} {"train_loss": -11.317995071411133, "global_step": 394087, "epoch": 2345} {"train_loss": -11.602470397949219, "global_step": 394088, "epoch": 2345} {"train_loss": -12.08498764038086, "global_step": 394089, "epoch": 2345} {"train_loss": -11.630914688110352, "global_step": 394090, "epoch": 2345} {"train_loss": -12.018623352050781, "global_step": 394091, "epoch": 2345} {"train_loss": -12.170217514038086, "global_step": 394092, "epoch": 2345} {"train_loss": -11.954418182373047, "global_step": 394093, "epoch": 2345} {"train_loss": -11.969711303710938, "global_step": 394094, "epoch": 2345} {"train_loss": -11.940611839294434, "global_step": 394095, "epoch": 2345} {"train_loss": -12.25672721862793, "global_step": 394096, "epoch": 2345} {"train_loss": -12.157801628112793, "global_step": 394097, "epoch": 2345} {"train_loss": -11.908747673034668, "global_step": 394098, "epoch": 2345} {"train_loss": -12.063583374023438, "global_step": 394099, "epoch": 2345} {"train_loss": -11.883454322814941, "global_step": 394100, "epoch": 2345} {"train_loss": -12.308772087097168, "global_step": 394101, "epoch": 2345} {"train_loss": -11.769041061401367, "global_step": 394102, "epoch": 2345} {"train_loss": -11.949759483337402, "global_step": 394103, "epoch": 2345} {"train_loss": -11.941034317016602, "global_step": 394104, "epoch": 2345} {"train_loss": -11.841141700744629, "global_step": 394105, "epoch": 2345} {"train_loss": -12.158838272094727, "global_step": 394106, "epoch": 2345} {"train_loss": -12.14133358001709, "global_step": 394107, "epoch": 2345} {"train_loss": -12.039840698242188, "global_step": 394108, "epoch": 2345} {"train_loss": -12.217982292175293, "global_step": 394109, "epoch": 2345} {"train_loss": -12.428239822387695, "global_step": 394110, "epoch": 2345} {"train_loss": -12.246941566467285, "global_step": 394111, "epoch": 2345} {"train_loss": -12.41571044921875, "global_step": 394112, "epoch": 2345} {"train_loss": -12.060784339904785, "global_step": 394113, "epoch": 2345} {"train_loss": -12.218780517578125, "global_step": 394114, "epoch": 2345} {"train_loss": -12.090877532958984, "global_step": 394115, "epoch": 2345} {"train_loss": -12.03605842590332, "global_step": 394116, "epoch": 2345} {"train_loss": -11.98653793334961, "global_step": 394117, "epoch": 2345} {"train_loss": -12.433771133422852, "global_step": 394118, "epoch": 2345} {"train_loss": -12.225561141967773, "global_step": 394119, "epoch": 2345} {"train_loss": -12.422876358032227, "global_step": 394120, "epoch": 2345} {"train_loss": -12.019672393798828, "global_step": 394121, "epoch": 2345} {"train_loss": -12.292113304138184, "global_step": 394122, "epoch": 2345} {"train_loss": -12.174242973327637, "global_step": 394123, "epoch": 2345} {"train_loss": -12.440177917480469, "global_step": 394124, "epoch": 2345} {"train_loss": -12.490716934204102, "global_step": 394125, "epoch": 2345} {"train_loss": -12.347902297973633, "global_step": 394126, "epoch": 2345} {"train_loss": -11.806862314542135, "global_step": 394127, "epoch": 2345, "val_loss": 298553.8125, "train_action_mse_error": 0.3901573419570923} {"train_loss": -11.932235717773438, "global_step": 394128, "epoch": 2346} {"train_loss": -12.00416374206543, "global_step": 394129, "epoch": 2346} {"train_loss": -11.789484024047852, "global_step": 394130, "epoch": 2346} {"train_loss": -11.718021392822266, "global_step": 394131, "epoch": 2346} {"train_loss": -12.030557632446289, "global_step": 394132, "epoch": 2346} {"train_loss": -11.794981002807617, "global_step": 394133, "epoch": 2346} {"train_loss": -11.27188491821289, "global_step": 394134, "epoch": 2346} {"train_loss": -12.023983001708984, "global_step": 394135, "epoch": 2346} {"train_loss": -11.885970115661621, "global_step": 394136, "epoch": 2346} {"train_loss": -11.63878345489502, "global_step": 394137, "epoch": 2346} {"train_loss": -11.933404922485352, "global_step": 394138, "epoch": 2346} {"train_loss": -12.003118515014648, "global_step": 394139, "epoch": 2346} {"train_loss": -11.406919479370117, "global_step": 394140, "epoch": 2346} {"train_loss": -12.41369915008545, "global_step": 394141, "epoch": 2346} {"train_loss": -11.90987777709961, "global_step": 394142, "epoch": 2346} {"train_loss": -12.242986679077148, "global_step": 394143, "epoch": 2346} {"train_loss": -12.347625732421875, "global_step": 394144, "epoch": 2346} {"train_loss": -12.26632308959961, "global_step": 394145, "epoch": 2346} {"train_loss": -12.342925071716309, "global_step": 394146, "epoch": 2346} {"train_loss": -12.3184175491333, "global_step": 394147, "epoch": 2346} {"train_loss": -12.419700622558594, "global_step": 394148, "epoch": 2346} {"train_loss": -12.294105529785156, "global_step": 394149, "epoch": 2346} {"train_loss": -12.486360549926758, "global_step": 394150, "epoch": 2346} {"train_loss": -12.24128532409668, "global_step": 394151, "epoch": 2346} {"train_loss": -12.356446266174316, "global_step": 394152, "epoch": 2346} {"train_loss": -12.419356346130371, "global_step": 394153, "epoch": 2346} {"train_loss": -12.614311218261719, "global_step": 394154, "epoch": 2346} {"train_loss": -12.546003341674805, "global_step": 394155, "epoch": 2346} {"train_loss": -12.436437606811523, "global_step": 394156, "epoch": 2346} {"train_loss": -12.533147811889648, "global_step": 394157, "epoch": 2346} {"train_loss": -12.351448059082031, "global_step": 394158, "epoch": 2346} {"train_loss": -12.46277904510498, "global_step": 394159, "epoch": 2346} {"train_loss": -12.323549270629883, "global_step": 394160, "epoch": 2346} {"train_loss": -12.026538848876953, "global_step": 394161, "epoch": 2346} {"train_loss": -12.732255935668945, "global_step": 394162, "epoch": 2346} {"train_loss": -12.087750434875488, "global_step": 394163, "epoch": 2346} {"train_loss": -12.430828094482422, "global_step": 394164, "epoch": 2346} {"train_loss": -12.277122497558594, "global_step": 394165, "epoch": 2346} {"train_loss": -12.28314208984375, "global_step": 394166, "epoch": 2346} {"train_loss": -12.41622257232666, "global_step": 394167, "epoch": 2346} {"train_loss": -12.243531227111816, "global_step": 394168, "epoch": 2346} {"train_loss": -12.599408149719238, "global_step": 394169, "epoch": 2346} {"train_loss": -12.188847541809082, "global_step": 394170, "epoch": 2346} {"train_loss": -12.097606658935547, "global_step": 394171, "epoch": 2346} {"train_loss": -12.292007446289062, "global_step": 394172, "epoch": 2346} {"train_loss": -12.283367156982422, "global_step": 394173, "epoch": 2346} {"train_loss": -12.589489936828613, "global_step": 394174, "epoch": 2346} {"train_loss": -12.167356491088867, "global_step": 394175, "epoch": 2346} {"train_loss": -11.880891799926758, "global_step": 394176, "epoch": 2346} {"train_loss": -12.555339813232422, "global_step": 394177, "epoch": 2346} {"train_loss": -12.358075141906738, "global_step": 394178, "epoch": 2346} {"train_loss": -12.058762550354004, "global_step": 394179, "epoch": 2346} {"train_loss": -12.373984336853027, "global_step": 394180, "epoch": 2346} {"train_loss": -11.977849960327148, "global_step": 394181, "epoch": 2346} {"train_loss": -12.292455673217773, "global_step": 394182, "epoch": 2346} {"train_loss": -12.104219436645508, "global_step": 394183, "epoch": 2346} {"train_loss": -12.562332153320312, "global_step": 394184, "epoch": 2346} {"train_loss": -12.396875381469727, "global_step": 394185, "epoch": 2346} {"train_loss": -12.586395263671875, "global_step": 394186, "epoch": 2346} {"train_loss": -12.452768325805664, "global_step": 394187, "epoch": 2346} {"train_loss": -12.718270301818848, "global_step": 394188, "epoch": 2346} {"train_loss": -12.369492530822754, "global_step": 394189, "epoch": 2346} {"train_loss": -11.964923858642578, "global_step": 394190, "epoch": 2346} {"train_loss": -12.582889556884766, "global_step": 394191, "epoch": 2346} {"train_loss": -12.4384126663208, "global_step": 394192, "epoch": 2346} {"train_loss": -11.620241165161133, "global_step": 394193, "epoch": 2346} {"train_loss": -11.529399871826172, "global_step": 394194, "epoch": 2346} {"train_loss": -12.174189567565918, "global_step": 394195, "epoch": 2346} {"train_loss": -12.315444946289062, "global_step": 394196, "epoch": 2346} {"train_loss": -10.885106086730957, "global_step": 394197, "epoch": 2346} {"train_loss": -11.820941925048828, "global_step": 394198, "epoch": 2346} {"train_loss": -12.358074188232422, "global_step": 394199, "epoch": 2346} {"train_loss": -10.987715721130371, "global_step": 394200, "epoch": 2346} {"train_loss": -12.195680618286133, "global_step": 394201, "epoch": 2346} {"train_loss": -11.364714622497559, "global_step": 394202, "epoch": 2346} {"train_loss": -11.785211563110352, "global_step": 394203, "epoch": 2346} {"train_loss": -11.750802040100098, "global_step": 394204, "epoch": 2346} {"train_loss": -11.888906478881836, "global_step": 394205, "epoch": 2346} {"train_loss": -12.070194244384766, "global_step": 394206, "epoch": 2346} {"train_loss": -11.845205307006836, "global_step": 394207, "epoch": 2346} {"train_loss": -11.539045333862305, "global_step": 394208, "epoch": 2346} {"train_loss": -12.070779800415039, "global_step": 394209, "epoch": 2346} {"train_loss": -10.893362998962402, "global_step": 394210, "epoch": 2346} {"train_loss": -11.746297836303711, "global_step": 394211, "epoch": 2346} {"train_loss": -11.783943176269531, "global_step": 394212, "epoch": 2346} {"train_loss": -11.514564514160156, "global_step": 394213, "epoch": 2346} {"train_loss": -12.14628791809082, "global_step": 394214, "epoch": 2346} {"train_loss": -11.585037231445312, "global_step": 394215, "epoch": 2346} {"train_loss": -10.826706886291504, "global_step": 394216, "epoch": 2346} {"train_loss": -12.25028133392334, "global_step": 394217, "epoch": 2346} {"train_loss": -10.722113609313965, "global_step": 394218, "epoch": 2346} {"train_loss": -11.979153633117676, "global_step": 394219, "epoch": 2346} {"train_loss": -11.170271873474121, "global_step": 394220, "epoch": 2346} {"train_loss": -10.240006446838379, "global_step": 394221, "epoch": 2346} {"train_loss": -12.411796569824219, "global_step": 394222, "epoch": 2346} {"train_loss": -10.324872970581055, "global_step": 394223, "epoch": 2346} {"train_loss": -12.012836456298828, "global_step": 394224, "epoch": 2346} {"train_loss": -11.644755363464355, "global_step": 394225, "epoch": 2346} {"train_loss": -11.73786735534668, "global_step": 394226, "epoch": 2346} {"train_loss": -12.137603759765625, "global_step": 394227, "epoch": 2346} {"train_loss": -12.265247344970703, "global_step": 394228, "epoch": 2346} {"train_loss": -12.232205390930176, "global_step": 394229, "epoch": 2346} {"train_loss": -12.178411483764648, "global_step": 394230, "epoch": 2346} {"train_loss": -12.049570083618164, "global_step": 394231, "epoch": 2346} {"train_loss": -12.325470924377441, "global_step": 394232, "epoch": 2346} {"train_loss": -11.904361724853516, "global_step": 394233, "epoch": 2346} {"train_loss": -11.945842742919922, "global_step": 394234, "epoch": 2346} {"train_loss": -12.169854164123535, "global_step": 394235, "epoch": 2346} {"train_loss": -11.926822662353516, "global_step": 394236, "epoch": 2346} {"train_loss": -12.236152648925781, "global_step": 394237, "epoch": 2346} {"train_loss": -12.19681167602539, "global_step": 394238, "epoch": 2346} {"train_loss": -12.360157012939453, "global_step": 394239, "epoch": 2346} {"train_loss": -12.163650512695312, "global_step": 394240, "epoch": 2346} {"train_loss": -12.39358139038086, "global_step": 394241, "epoch": 2346} {"train_loss": -11.967985153198242, "global_step": 394242, "epoch": 2346} {"train_loss": -12.170209884643555, "global_step": 394243, "epoch": 2346} {"train_loss": -12.033706665039062, "global_step": 394244, "epoch": 2346} {"train_loss": -11.975343704223633, "global_step": 394245, "epoch": 2346} {"train_loss": -12.254219055175781, "global_step": 394246, "epoch": 2346} {"train_loss": -12.004682540893555, "global_step": 394247, "epoch": 2346} {"train_loss": -12.24291706085205, "global_step": 394248, "epoch": 2346} {"train_loss": -11.529074668884277, "global_step": 394249, "epoch": 2346} {"train_loss": -12.006996154785156, "global_step": 394250, "epoch": 2346} {"train_loss": -11.919185638427734, "global_step": 394251, "epoch": 2346} {"train_loss": -11.2488431930542, "global_step": 394252, "epoch": 2346} {"train_loss": -12.120218276977539, "global_step": 394253, "epoch": 2346} {"train_loss": -11.909798622131348, "global_step": 394254, "epoch": 2346} {"train_loss": -10.850427627563477, "global_step": 394255, "epoch": 2346} {"train_loss": -12.137683868408203, "global_step": 394256, "epoch": 2346} {"train_loss": -11.344844818115234, "global_step": 394257, "epoch": 2346} {"train_loss": -11.679844856262207, "global_step": 394258, "epoch": 2346} {"train_loss": -11.923698425292969, "global_step": 394259, "epoch": 2346} {"train_loss": -11.41651439666748, "global_step": 394260, "epoch": 2346} {"train_loss": -11.059614181518555, "global_step": 394261, "epoch": 2346} {"train_loss": -11.972315788269043, "global_step": 394262, "epoch": 2346} {"train_loss": -10.556550979614258, "global_step": 394263, "epoch": 2346} {"train_loss": -11.91596794128418, "global_step": 394264, "epoch": 2346} {"train_loss": -10.978693008422852, "global_step": 394265, "epoch": 2346} {"train_loss": -12.025869369506836, "global_step": 394266, "epoch": 2346} {"train_loss": -10.31826114654541, "global_step": 394267, "epoch": 2346} {"train_loss": -11.288371086120605, "global_step": 394268, "epoch": 2346} {"train_loss": -10.351675987243652, "global_step": 394269, "epoch": 2346} {"train_loss": -12.103071212768555, "global_step": 394270, "epoch": 2346} {"train_loss": -10.468866348266602, "global_step": 394271, "epoch": 2346} {"train_loss": -12.25244140625, "global_step": 394272, "epoch": 2346} {"train_loss": -11.041028022766113, "global_step": 394273, "epoch": 2346} {"train_loss": -12.30886459350586, "global_step": 394274, "epoch": 2346} {"train_loss": -11.36854362487793, "global_step": 394275, "epoch": 2346} {"train_loss": -12.320443153381348, "global_step": 394276, "epoch": 2346} {"train_loss": -11.815887451171875, "global_step": 394277, "epoch": 2346} {"train_loss": -12.021495819091797, "global_step": 394278, "epoch": 2346} {"train_loss": -11.786951065063477, "global_step": 394279, "epoch": 2346} {"train_loss": -12.224231719970703, "global_step": 394280, "epoch": 2346} {"train_loss": -11.765467643737793, "global_step": 394281, "epoch": 2346} {"train_loss": -11.601400375366211, "global_step": 394282, "epoch": 2346} {"train_loss": -11.976509094238281, "global_step": 394283, "epoch": 2346} {"train_loss": -11.815887451171875, "global_step": 394284, "epoch": 2346} {"train_loss": -12.283187866210938, "global_step": 394285, "epoch": 2346} {"train_loss": -11.511592864990234, "global_step": 394286, "epoch": 2346} {"train_loss": -11.681561470031738, "global_step": 394287, "epoch": 2346} {"train_loss": -12.030668258666992, "global_step": 394288, "epoch": 2346} {"train_loss": -11.576704025268555, "global_step": 394289, "epoch": 2346} {"train_loss": -11.790397644042969, "global_step": 394290, "epoch": 2346} {"train_loss": -12.106558799743652, "global_step": 394291, "epoch": 2346} {"train_loss": -11.410886764526367, "global_step": 394292, "epoch": 2346} {"train_loss": -11.952582359313965, "global_step": 394293, "epoch": 2346} {"train_loss": -12.12962532043457, "global_step": 394294, "epoch": 2346} {"train_loss": -11.936895376160031, "global_step": 394295, "epoch": 2346, "val_loss": 300043.71875} {"train_loss": -12.247119903564453, "global_step": 394296, "epoch": 2347} {"train_loss": -11.812200546264648, "global_step": 394297, "epoch": 2347} {"train_loss": -12.139280319213867, "global_step": 394298, "epoch": 2347} {"train_loss": -11.824871063232422, "global_step": 394299, "epoch": 2347} {"train_loss": -12.325931549072266, "global_step": 394300, "epoch": 2347} {"train_loss": -12.148466110229492, "global_step": 394301, "epoch": 2347} {"train_loss": -12.395458221435547, "global_step": 394302, "epoch": 2347} {"train_loss": -12.25217056274414, "global_step": 394303, "epoch": 2347} {"train_loss": -12.283363342285156, "global_step": 394304, "epoch": 2347} {"train_loss": -12.114051818847656, "global_step": 394305, "epoch": 2347} {"train_loss": -11.7000732421875, "global_step": 394306, "epoch": 2347} {"train_loss": -11.6395263671875, "global_step": 394307, "epoch": 2347} {"train_loss": -11.96816635131836, "global_step": 394308, "epoch": 2347} {"train_loss": -11.086366653442383, "global_step": 394309, "epoch": 2347} {"train_loss": -12.112906455993652, "global_step": 394310, "epoch": 2347} {"train_loss": -11.52273941040039, "global_step": 394311, "epoch": 2347} {"train_loss": -11.5306978225708, "global_step": 394312, "epoch": 2347} {"train_loss": -11.827012062072754, "global_step": 394313, "epoch": 2347} {"train_loss": -11.479069709777832, "global_step": 394314, "epoch": 2347} {"train_loss": -11.680903434753418, "global_step": 394315, "epoch": 2347} {"train_loss": -11.677592277526855, "global_step": 394316, "epoch": 2347} {"train_loss": -11.474053382873535, "global_step": 394317, "epoch": 2347} {"train_loss": -12.264898300170898, "global_step": 394318, "epoch": 2347} {"train_loss": -11.218127250671387, "global_step": 394319, "epoch": 2347} {"train_loss": -11.46911907196045, "global_step": 394320, "epoch": 2347} {"train_loss": -11.999418258666992, "global_step": 394321, "epoch": 2347} {"train_loss": -10.97415828704834, "global_step": 394322, "epoch": 2347} {"train_loss": -11.834003448486328, "global_step": 394323, "epoch": 2347} {"train_loss": -11.845466613769531, "global_step": 394324, "epoch": 2347} {"train_loss": -11.962459564208984, "global_step": 394325, "epoch": 2347} {"train_loss": -12.193538665771484, "global_step": 394326, "epoch": 2347} {"train_loss": -12.139701843261719, "global_step": 394327, "epoch": 2347} {"train_loss": -12.239975929260254, "global_step": 394328, "epoch": 2347} {"train_loss": -12.035011291503906, "global_step": 394329, "epoch": 2347} {"train_loss": -12.24594783782959, "global_step": 394330, "epoch": 2347} {"train_loss": -11.915102005004883, "global_step": 394331, "epoch": 2347} {"train_loss": -11.85268783569336, "global_step": 394332, "epoch": 2347} {"train_loss": -12.347137451171875, "global_step": 394333, "epoch": 2347} {"train_loss": -11.673260688781738, "global_step": 394334, "epoch": 2347} {"train_loss": -12.18215560913086, "global_step": 394335, "epoch": 2347} {"train_loss": -11.95571231842041, "global_step": 394336, "epoch": 2347} {"train_loss": -11.147001266479492, "global_step": 394337, "epoch": 2347} {"train_loss": -12.051051139831543, "global_step": 394338, "epoch": 2347} {"train_loss": -12.060636520385742, "global_step": 394339, "epoch": 2347} {"train_loss": -11.57162857055664, "global_step": 394340, "epoch": 2347} {"train_loss": -12.114473342895508, "global_step": 394341, "epoch": 2347} {"train_loss": -11.664057731628418, "global_step": 394342, "epoch": 2347} {"train_loss": -11.823933601379395, "global_step": 394343, "epoch": 2347} {"train_loss": -11.947616577148438, "global_step": 394344, "epoch": 2347} {"train_loss": -11.888298034667969, "global_step": 394345, "epoch": 2347} {"train_loss": -11.971227645874023, "global_step": 394346, "epoch": 2347} {"train_loss": -12.077398300170898, "global_step": 394347, "epoch": 2347} {"train_loss": -11.901191711425781, "global_step": 394348, "epoch": 2347} {"train_loss": -12.085932731628418, "global_step": 394349, "epoch": 2347} {"train_loss": -11.87899398803711, "global_step": 394350, "epoch": 2347} {"train_loss": -10.891130447387695, "global_step": 394351, "epoch": 2347} {"train_loss": -11.941520690917969, "global_step": 394352, "epoch": 2347} {"train_loss": -11.61338996887207, "global_step": 394353, "epoch": 2347} {"train_loss": -11.491403579711914, "global_step": 394354, "epoch": 2347} {"train_loss": -12.191822052001953, "global_step": 394355, "epoch": 2347} {"train_loss": -11.434374809265137, "global_step": 394356, "epoch": 2347} {"train_loss": -12.245024681091309, "global_step": 394357, "epoch": 2347} {"train_loss": -11.986080169677734, "global_step": 394358, "epoch": 2347} {"train_loss": -12.071968078613281, "global_step": 394359, "epoch": 2347} {"train_loss": -12.157337188720703, "global_step": 394360, "epoch": 2347} {"train_loss": -11.830739974975586, "global_step": 394361, "epoch": 2347} {"train_loss": -12.53176498413086, "global_step": 394362, "epoch": 2347} {"train_loss": -12.410137176513672, "global_step": 394363, "epoch": 2347} {"train_loss": -12.353985786437988, "global_step": 394364, "epoch": 2347} {"train_loss": -12.163674354553223, "global_step": 394365, "epoch": 2347} {"train_loss": -12.343734741210938, "global_step": 394366, "epoch": 2347} {"train_loss": -12.387741088867188, "global_step": 394367, "epoch": 2347} {"train_loss": -12.335508346557617, "global_step": 394368, "epoch": 2347} {"train_loss": -12.166411399841309, "global_step": 394369, "epoch": 2347} {"train_loss": -12.185830116271973, "global_step": 394370, "epoch": 2347} {"train_loss": -12.28149700164795, "global_step": 394371, "epoch": 2347} {"train_loss": -12.275197982788086, "global_step": 394372, "epoch": 2347} {"train_loss": -12.583903312683105, "global_step": 394373, "epoch": 2347} {"train_loss": -12.500629425048828, "global_step": 394374, "epoch": 2347} {"train_loss": -12.485101699829102, "global_step": 394375, "epoch": 2347} {"train_loss": -12.194905281066895, "global_step": 394376, "epoch": 2347} {"train_loss": -12.371683120727539, "global_step": 394377, "epoch": 2347} {"train_loss": -12.345438003540039, "global_step": 394378, "epoch": 2347} {"train_loss": -12.243365287780762, "global_step": 394379, "epoch": 2347} {"train_loss": -12.595494270324707, "global_step": 394380, "epoch": 2347} {"train_loss": -12.306262969970703, "global_step": 394381, "epoch": 2347} {"train_loss": -12.661109924316406, "global_step": 394382, "epoch": 2347} {"train_loss": -12.375762939453125, "global_step": 394383, "epoch": 2347} {"train_loss": -12.610215187072754, "global_step": 394384, "epoch": 2347} {"train_loss": -12.505661010742188, "global_step": 394385, "epoch": 2347} {"train_loss": -12.432782173156738, "global_step": 394386, "epoch": 2347} {"train_loss": -12.501259803771973, "global_step": 394387, "epoch": 2347} {"train_loss": -12.24178695678711, "global_step": 394388, "epoch": 2347} {"train_loss": -12.623870849609375, "global_step": 394389, "epoch": 2347} {"train_loss": -12.307316780090332, "global_step": 394390, "epoch": 2347} {"train_loss": -12.662659645080566, "global_step": 394391, "epoch": 2347} {"train_loss": -12.507984161376953, "global_step": 394392, "epoch": 2347} {"train_loss": -12.444559097290039, "global_step": 394393, "epoch": 2347} {"train_loss": -12.46104621887207, "global_step": 394394, "epoch": 2347} {"train_loss": -12.370628356933594, "global_step": 394395, "epoch": 2347} {"train_loss": -12.491086959838867, "global_step": 394396, "epoch": 2347} {"train_loss": -12.425711631774902, "global_step": 394397, "epoch": 2347} {"train_loss": -12.445375442504883, "global_step": 394398, "epoch": 2347} {"train_loss": -12.713878631591797, "global_step": 394399, "epoch": 2347} {"train_loss": -12.714398384094238, "global_step": 394400, "epoch": 2347} {"train_loss": -12.588927268981934, "global_step": 394401, "epoch": 2347} {"train_loss": -12.187800407409668, "global_step": 394402, "epoch": 2347} {"train_loss": -12.602737426757812, "global_step": 394403, "epoch": 2347} {"train_loss": -12.434354782104492, "global_step": 394404, "epoch": 2347} {"train_loss": -12.212589263916016, "global_step": 394405, "epoch": 2347} {"train_loss": -12.553059577941895, "global_step": 394406, "epoch": 2347} {"train_loss": -12.095054626464844, "global_step": 394407, "epoch": 2347} {"train_loss": -11.9108247756958, "global_step": 394408, "epoch": 2347} {"train_loss": -12.708642959594727, "global_step": 394409, "epoch": 2347} {"train_loss": -12.674412727355957, "global_step": 394410, "epoch": 2347} {"train_loss": -11.767135620117188, "global_step": 394411, "epoch": 2347} {"train_loss": -12.574666976928711, "global_step": 394412, "epoch": 2347} {"train_loss": -12.089107513427734, "global_step": 394413, "epoch": 2347} {"train_loss": -12.376659393310547, "global_step": 394414, "epoch": 2347} {"train_loss": -12.258649826049805, "global_step": 394415, "epoch": 2347} {"train_loss": -12.347228050231934, "global_step": 394416, "epoch": 2347} {"train_loss": -12.179671287536621, "global_step": 394417, "epoch": 2347} {"train_loss": -12.485568046569824, "global_step": 394418, "epoch": 2347} {"train_loss": -12.48447036743164, "global_step": 394419, "epoch": 2347} {"train_loss": -12.55119514465332, "global_step": 394420, "epoch": 2347} {"train_loss": -12.300832748413086, "global_step": 394421, "epoch": 2347} {"train_loss": -12.510054588317871, "global_step": 394422, "epoch": 2347} {"train_loss": -12.50377082824707, "global_step": 394423, "epoch": 2347} {"train_loss": -12.02475357055664, "global_step": 394424, "epoch": 2347} {"train_loss": -11.69143295288086, "global_step": 394425, "epoch": 2347} {"train_loss": -12.32005500793457, "global_step": 394426, "epoch": 2347} {"train_loss": -12.516555786132812, "global_step": 394427, "epoch": 2347} {"train_loss": -12.26225757598877, "global_step": 394428, "epoch": 2347} {"train_loss": -12.194744110107422, "global_step": 394429, "epoch": 2347} {"train_loss": -12.616525650024414, "global_step": 394430, "epoch": 2347} {"train_loss": -12.34178352355957, "global_step": 394431, "epoch": 2347} {"train_loss": -11.939682006835938, "global_step": 394432, "epoch": 2347} {"train_loss": -12.158526420593262, "global_step": 394433, "epoch": 2347} {"train_loss": -12.479228973388672, "global_step": 394434, "epoch": 2347} {"train_loss": -12.31301498413086, "global_step": 394435, "epoch": 2347} {"train_loss": -12.075776100158691, "global_step": 394436, "epoch": 2347} {"train_loss": -12.094158172607422, "global_step": 394437, "epoch": 2347} {"train_loss": -12.531132698059082, "global_step": 394438, "epoch": 2347} {"train_loss": -12.425066947937012, "global_step": 394439, "epoch": 2347} {"train_loss": -12.624853134155273, "global_step": 394440, "epoch": 2347} {"train_loss": -12.567716598510742, "global_step": 394441, "epoch": 2347} {"train_loss": -12.602195739746094, "global_step": 394442, "epoch": 2347} {"train_loss": -12.633487701416016, "global_step": 394443, "epoch": 2347} {"train_loss": -12.310384750366211, "global_step": 394444, "epoch": 2347} {"train_loss": -11.914979934692383, "global_step": 394445, "epoch": 2347} {"train_loss": -12.479557037353516, "global_step": 394446, "epoch": 2347} {"train_loss": -12.035833358764648, "global_step": 394447, "epoch": 2347} {"train_loss": -12.593402862548828, "global_step": 394448, "epoch": 2347} {"train_loss": -12.472923278808594, "global_step": 394449, "epoch": 2347} {"train_loss": -12.0957612991333, "global_step": 394450, "epoch": 2347} {"train_loss": -12.397308349609375, "global_step": 394451, "epoch": 2347} {"train_loss": -12.207616806030273, "global_step": 394452, "epoch": 2347} {"train_loss": -12.418328285217285, "global_step": 394453, "epoch": 2347} {"train_loss": -11.674871444702148, "global_step": 394454, "epoch": 2347} {"train_loss": -11.533601760864258, "global_step": 394455, "epoch": 2347} {"train_loss": -11.897104263305664, "global_step": 394456, "epoch": 2347} {"train_loss": -11.505972862243652, "global_step": 394457, "epoch": 2347} {"train_loss": -11.521230697631836, "global_step": 394458, "epoch": 2347} {"train_loss": -10.268775939941406, "global_step": 394459, "epoch": 2347} {"train_loss": -11.570808410644531, "global_step": 394460, "epoch": 2347} {"train_loss": -11.708673477172852, "global_step": 394461, "epoch": 2347} {"train_loss": -9.611383438110352, "global_step": 394462, "epoch": 2347} {"train_loss": -12.113161887441363, "global_step": 394463, "epoch": 2347, "val_loss": 300368.875} {"train_loss": -10.970046997070312, "global_step": 394464, "epoch": 2348} {"train_loss": -9.730716705322266, "global_step": 394465, "epoch": 2348} {"train_loss": -11.211559295654297, "global_step": 394466, "epoch": 2348} {"train_loss": -9.861384391784668, "global_step": 394467, "epoch": 2348} {"train_loss": -10.267744064331055, "global_step": 394468, "epoch": 2348} {"train_loss": -11.060997009277344, "global_step": 394469, "epoch": 2348} {"train_loss": -9.610719680786133, "global_step": 394470, "epoch": 2348} {"train_loss": -11.250356674194336, "global_step": 394471, "epoch": 2348} {"train_loss": -10.202146530151367, "global_step": 394472, "epoch": 2348} {"train_loss": -10.663451194763184, "global_step": 394473, "epoch": 2348} {"train_loss": -11.100627899169922, "global_step": 394474, "epoch": 2348} {"train_loss": -10.812568664550781, "global_step": 394475, "epoch": 2348} {"train_loss": -11.117424011230469, "global_step": 394476, "epoch": 2348} {"train_loss": -10.166598320007324, "global_step": 394477, "epoch": 2348} {"train_loss": -11.794990539550781, "global_step": 394478, "epoch": 2348} {"train_loss": -10.727834701538086, "global_step": 394479, "epoch": 2348} {"train_loss": -11.03764533996582, "global_step": 394480, "epoch": 2348} {"train_loss": -11.462158203125, "global_step": 394481, "epoch": 2348} {"train_loss": -11.3811674118042, "global_step": 394482, "epoch": 2348} {"train_loss": -11.986732482910156, "global_step": 394483, "epoch": 2348} {"train_loss": -11.68203067779541, "global_step": 394484, "epoch": 2348} {"train_loss": -12.033466339111328, "global_step": 394485, "epoch": 2348} {"train_loss": -12.001019477844238, "global_step": 394486, "epoch": 2348} {"train_loss": -11.706319808959961, "global_step": 394487, "epoch": 2348} {"train_loss": -12.105533599853516, "global_step": 394488, "epoch": 2348} {"train_loss": -11.656820297241211, "global_step": 394489, "epoch": 2348} {"train_loss": -12.059040069580078, "global_step": 394490, "epoch": 2348} {"train_loss": -11.786066055297852, "global_step": 394491, "epoch": 2348} {"train_loss": -12.01148509979248, "global_step": 394492, "epoch": 2348} {"train_loss": -11.517199516296387, "global_step": 394493, "epoch": 2348} {"train_loss": -11.958398818969727, "global_step": 394494, "epoch": 2348} {"train_loss": -12.349065780639648, "global_step": 394495, "epoch": 2348} {"train_loss": -11.676826477050781, "global_step": 394496, "epoch": 2348} {"train_loss": -12.348363876342773, "global_step": 394497, "epoch": 2348} {"train_loss": -11.452838897705078, "global_step": 394498, "epoch": 2348} {"train_loss": -11.854804992675781, "global_step": 394499, "epoch": 2348} {"train_loss": -11.835941314697266, "global_step": 394500, "epoch": 2348} {"train_loss": -11.428531646728516, "global_step": 394501, "epoch": 2348} {"train_loss": -11.613486289978027, "global_step": 394502, "epoch": 2348} {"train_loss": -11.839935302734375, "global_step": 394503, "epoch": 2348} {"train_loss": -11.75709342956543, "global_step": 394504, "epoch": 2348} {"train_loss": -11.66775131225586, "global_step": 394505, "epoch": 2348} {"train_loss": -10.366284370422363, "global_step": 394506, "epoch": 2348} {"train_loss": -11.901412963867188, "global_step": 394507, "epoch": 2348} {"train_loss": -10.764334678649902, "global_step": 394508, "epoch": 2348} {"train_loss": -10.01738166809082, "global_step": 394509, "epoch": 2348} {"train_loss": -11.098302841186523, "global_step": 394510, "epoch": 2348} {"train_loss": -11.162565231323242, "global_step": 394511, "epoch": 2348} {"train_loss": -11.55418586730957, "global_step": 394512, "epoch": 2348} {"train_loss": -11.664876937866211, "global_step": 394513, "epoch": 2348} {"train_loss": -11.581657409667969, "global_step": 394514, "epoch": 2348} {"train_loss": -11.28934097290039, "global_step": 394515, "epoch": 2348} {"train_loss": -12.28079891204834, "global_step": 394516, "epoch": 2348} {"train_loss": -11.338607788085938, "global_step": 394517, "epoch": 2348} {"train_loss": -11.811084747314453, "global_step": 394518, "epoch": 2348} {"train_loss": -11.418601989746094, "global_step": 394519, "epoch": 2348} {"train_loss": -10.914974212646484, "global_step": 394520, "epoch": 2348} {"train_loss": -11.676578521728516, "global_step": 394521, "epoch": 2348} {"train_loss": -11.192462921142578, "global_step": 394522, "epoch": 2348} {"train_loss": -11.472770690917969, "global_step": 394523, "epoch": 2348} {"train_loss": -11.691900253295898, "global_step": 394524, "epoch": 2348} {"train_loss": -11.222793579101562, "global_step": 394525, "epoch": 2348} {"train_loss": -12.006824493408203, "global_step": 394526, "epoch": 2348} {"train_loss": -11.515029907226562, "global_step": 394527, "epoch": 2348} {"train_loss": -11.790224075317383, "global_step": 394528, "epoch": 2348} {"train_loss": -11.585376739501953, "global_step": 394529, "epoch": 2348} {"train_loss": -11.744270324707031, "global_step": 394530, "epoch": 2348} {"train_loss": -11.980154037475586, "global_step": 394531, "epoch": 2348} {"train_loss": -11.89678955078125, "global_step": 394532, "epoch": 2348} {"train_loss": -11.938302993774414, "global_step": 394533, "epoch": 2348} {"train_loss": -11.670492172241211, "global_step": 394534, "epoch": 2348} {"train_loss": -11.36767292022705, "global_step": 394535, "epoch": 2348} {"train_loss": -11.925176620483398, "global_step": 394536, "epoch": 2348} {"train_loss": -11.58297348022461, "global_step": 394537, "epoch": 2348} {"train_loss": -11.93697738647461, "global_step": 394538, "epoch": 2348} {"train_loss": -11.149614334106445, "global_step": 394539, "epoch": 2348} {"train_loss": -11.707083702087402, "global_step": 394540, "epoch": 2348} {"train_loss": -11.457029342651367, "global_step": 394541, "epoch": 2348} {"train_loss": -11.09786319732666, "global_step": 394542, "epoch": 2348} {"train_loss": -11.624316215515137, "global_step": 394543, "epoch": 2348} {"train_loss": -11.527231216430664, "global_step": 394544, "epoch": 2348} {"train_loss": -11.28432846069336, "global_step": 394545, "epoch": 2348} {"train_loss": -12.055464744567871, "global_step": 394546, "epoch": 2348} {"train_loss": -11.541546821594238, "global_step": 394547, "epoch": 2348} {"train_loss": -11.741992950439453, "global_step": 394548, "epoch": 2348} {"train_loss": -12.1837158203125, "global_step": 394549, "epoch": 2348} {"train_loss": -11.856521606445312, "global_step": 394550, "epoch": 2348} {"train_loss": -12.440001487731934, "global_step": 394551, "epoch": 2348} {"train_loss": -12.065631866455078, "global_step": 394552, "epoch": 2348} {"train_loss": -12.291094779968262, "global_step": 394553, "epoch": 2348} {"train_loss": -12.199867248535156, "global_step": 394554, "epoch": 2348} {"train_loss": -12.016473770141602, "global_step": 394555, "epoch": 2348} {"train_loss": -12.316169738769531, "global_step": 394556, "epoch": 2348} {"train_loss": -12.059700965881348, "global_step": 394557, "epoch": 2348} {"train_loss": -11.86771011352539, "global_step": 394558, "epoch": 2348} {"train_loss": -12.173760414123535, "global_step": 394559, "epoch": 2348} {"train_loss": -12.370015144348145, "global_step": 394560, "epoch": 2348} {"train_loss": -12.141709327697754, "global_step": 394561, "epoch": 2348} {"train_loss": -12.378668785095215, "global_step": 394562, "epoch": 2348} {"train_loss": -12.407805442810059, "global_step": 394563, "epoch": 2348} {"train_loss": -12.160853385925293, "global_step": 394564, "epoch": 2348} {"train_loss": -12.131078720092773, "global_step": 394565, "epoch": 2348} {"train_loss": -11.960309982299805, "global_step": 394566, "epoch": 2348} {"train_loss": -12.27536678314209, "global_step": 394567, "epoch": 2348} {"train_loss": -12.527481079101562, "global_step": 394568, "epoch": 2348} {"train_loss": -12.211831092834473, "global_step": 394569, "epoch": 2348} {"train_loss": -12.173768997192383, "global_step": 394570, "epoch": 2348} {"train_loss": -12.202564239501953, "global_step": 394571, "epoch": 2348} {"train_loss": -12.090906143188477, "global_step": 394572, "epoch": 2348} {"train_loss": -12.612602233886719, "global_step": 394573, "epoch": 2348} {"train_loss": -12.225727081298828, "global_step": 394574, "epoch": 2348} {"train_loss": -12.242271423339844, "global_step": 394575, "epoch": 2348} {"train_loss": -12.522920608520508, "global_step": 394576, "epoch": 2348} {"train_loss": -12.151863098144531, "global_step": 394577, "epoch": 2348} {"train_loss": -12.491034507751465, "global_step": 394578, "epoch": 2348} {"train_loss": -12.399413108825684, "global_step": 394579, "epoch": 2348} {"train_loss": -12.316892623901367, "global_step": 394580, "epoch": 2348} {"train_loss": -12.398306846618652, "global_step": 394581, "epoch": 2348} {"train_loss": -12.604379653930664, "global_step": 394582, "epoch": 2348} {"train_loss": -12.417862892150879, "global_step": 394583, "epoch": 2348} {"train_loss": -12.30638313293457, "global_step": 394584, "epoch": 2348} {"train_loss": -12.196484565734863, "global_step": 394585, "epoch": 2348} {"train_loss": -12.173469543457031, "global_step": 394586, "epoch": 2348} {"train_loss": -12.194863319396973, "global_step": 394587, "epoch": 2348} {"train_loss": -12.476431846618652, "global_step": 394588, "epoch": 2348} {"train_loss": -11.9472074508667, "global_step": 394589, "epoch": 2348} {"train_loss": -11.860816955566406, "global_step": 394590, "epoch": 2348} {"train_loss": -11.96096420288086, "global_step": 394591, "epoch": 2348} {"train_loss": -11.861652374267578, "global_step": 394592, "epoch": 2348} {"train_loss": -12.258007049560547, "global_step": 394593, "epoch": 2348} {"train_loss": -11.92379379272461, "global_step": 394594, "epoch": 2348} {"train_loss": -12.312881469726562, "global_step": 394595, "epoch": 2348} {"train_loss": -12.396642684936523, "global_step": 394596, "epoch": 2348} {"train_loss": -12.395133972167969, "global_step": 394597, "epoch": 2348} {"train_loss": -12.35560131072998, "global_step": 394598, "epoch": 2348} {"train_loss": -12.381402969360352, "global_step": 394599, "epoch": 2348} {"train_loss": -12.449761390686035, "global_step": 394600, "epoch": 2348} {"train_loss": -12.612401962280273, "global_step": 394601, "epoch": 2348} {"train_loss": -12.415290832519531, "global_step": 394602, "epoch": 2348} {"train_loss": -12.467361450195312, "global_step": 394603, "epoch": 2348} {"train_loss": -12.354780197143555, "global_step": 394604, "epoch": 2348} {"train_loss": -12.72039794921875, "global_step": 394605, "epoch": 2348} {"train_loss": -12.313087463378906, "global_step": 394606, "epoch": 2348} {"train_loss": -12.696396827697754, "global_step": 394607, "epoch": 2348} {"train_loss": -12.388202667236328, "global_step": 394608, "epoch": 2348} {"train_loss": -12.301389694213867, "global_step": 394609, "epoch": 2348} {"train_loss": -12.47503662109375, "global_step": 394610, "epoch": 2348} {"train_loss": -12.401683807373047, "global_step": 394611, "epoch": 2348} {"train_loss": -12.333724021911621, "global_step": 394612, "epoch": 2348} {"train_loss": -12.691141128540039, "global_step": 394613, "epoch": 2348} {"train_loss": -12.175384521484375, "global_step": 394614, "epoch": 2348} {"train_loss": -12.009702682495117, "global_step": 394615, "epoch": 2348} {"train_loss": -12.46064567565918, "global_step": 394616, "epoch": 2348} {"train_loss": -12.448491096496582, "global_step": 394617, "epoch": 2348} {"train_loss": -12.705885887145996, "global_step": 394618, "epoch": 2348} {"train_loss": -11.833597183227539, "global_step": 394619, "epoch": 2348} {"train_loss": -12.347528457641602, "global_step": 394620, "epoch": 2348} {"train_loss": -12.283317565917969, "global_step": 394621, "epoch": 2348} {"train_loss": -12.04306411743164, "global_step": 394622, "epoch": 2348} {"train_loss": -12.372920989990234, "global_step": 394623, "epoch": 2348} {"train_loss": -12.159770965576172, "global_step": 394624, "epoch": 2348} {"train_loss": -12.518292427062988, "global_step": 394625, "epoch": 2348} {"train_loss": -12.374702453613281, "global_step": 394626, "epoch": 2348} {"train_loss": -12.126331329345703, "global_step": 394627, "epoch": 2348} {"train_loss": -12.15945816040039, "global_step": 394628, "epoch": 2348} {"train_loss": -12.063207626342773, "global_step": 394629, "epoch": 2348} {"train_loss": -11.237509727478027, "global_step": 394630, "epoch": 2348} {"train_loss": -11.8437344062896, "global_step": 394631, "epoch": 2348, "val_loss": 299869.40625} {"train_loss": -12.273246765136719, "global_step": 394632, "epoch": 2349} {"train_loss": -12.733429908752441, "global_step": 394633, "epoch": 2349} {"train_loss": -12.331247329711914, "global_step": 394634, "epoch": 2349} {"train_loss": -12.37996768951416, "global_step": 394635, "epoch": 2349} {"train_loss": -12.225157737731934, "global_step": 394636, "epoch": 2349} {"train_loss": -11.691149711608887, "global_step": 394637, "epoch": 2349} {"train_loss": -11.586860656738281, "global_step": 394638, "epoch": 2349} {"train_loss": -11.859162330627441, "global_step": 394639, "epoch": 2349} {"train_loss": -11.976566314697266, "global_step": 394640, "epoch": 2349} {"train_loss": -12.193230628967285, "global_step": 394641, "epoch": 2349} {"train_loss": -11.95496940612793, "global_step": 394642, "epoch": 2349} {"train_loss": -12.312694549560547, "global_step": 394643, "epoch": 2349} {"train_loss": -11.938911437988281, "global_step": 394644, "epoch": 2349} {"train_loss": -11.486577033996582, "global_step": 394645, "epoch": 2349} {"train_loss": -11.233872413635254, "global_step": 394646, "epoch": 2349} {"train_loss": -11.967121124267578, "global_step": 394647, "epoch": 2349} {"train_loss": -11.669036865234375, "global_step": 394648, "epoch": 2349} {"train_loss": -10.630277633666992, "global_step": 394649, "epoch": 2349} {"train_loss": -12.09794807434082, "global_step": 394650, "epoch": 2349} {"train_loss": -10.597755432128906, "global_step": 394651, "epoch": 2349} {"train_loss": -11.334182739257812, "global_step": 394652, "epoch": 2349} {"train_loss": -11.544260025024414, "global_step": 394653, "epoch": 2349} {"train_loss": -9.365283966064453, "global_step": 394654, "epoch": 2349} {"train_loss": -11.09943675994873, "global_step": 394655, "epoch": 2349} {"train_loss": -8.813997268676758, "global_step": 394656, "epoch": 2349} {"train_loss": -8.102594375610352, "global_step": 394657, "epoch": 2349} {"train_loss": -7.880051136016846, "global_step": 394658, "epoch": 2349} {"train_loss": -7.383605003356934, "global_step": 394659, "epoch": 2349} {"train_loss": -8.21306037902832, "global_step": 394660, "epoch": 2349} {"train_loss": -8.200292587280273, "global_step": 394661, "epoch": 2349} {"train_loss": -9.370765686035156, "global_step": 394662, "epoch": 2349} {"train_loss": -10.558332443237305, "global_step": 394663, "epoch": 2349} {"train_loss": -9.972152709960938, "global_step": 394664, "epoch": 2349} {"train_loss": -8.995055198669434, "global_step": 394665, "epoch": 2349} {"train_loss": -9.189872741699219, "global_step": 394666, "epoch": 2349} {"train_loss": -10.127760887145996, "global_step": 394667, "epoch": 2349} {"train_loss": -10.851438522338867, "global_step": 394668, "epoch": 2349} {"train_loss": -9.766170501708984, "global_step": 394669, "epoch": 2349} {"train_loss": -9.925562858581543, "global_step": 394670, "epoch": 2349} {"train_loss": -10.720949172973633, "global_step": 394671, "epoch": 2349} {"train_loss": -11.281580924987793, "global_step": 394672, "epoch": 2349} {"train_loss": -9.917243957519531, "global_step": 394673, "epoch": 2349} {"train_loss": -10.73182201385498, "global_step": 394674, "epoch": 2349} {"train_loss": -11.073830604553223, "global_step": 394675, "epoch": 2349} {"train_loss": -11.371072769165039, "global_step": 394676, "epoch": 2349} {"train_loss": -10.548552513122559, "global_step": 394677, "epoch": 2349} {"train_loss": -11.843616485595703, "global_step": 394678, "epoch": 2349} {"train_loss": -11.265058517456055, "global_step": 394679, "epoch": 2349} {"train_loss": -11.738239288330078, "global_step": 394680, "epoch": 2349} {"train_loss": -10.258275985717773, "global_step": 394681, "epoch": 2349} {"train_loss": -11.260107040405273, "global_step": 394682, "epoch": 2349} {"train_loss": -10.472665786743164, "global_step": 394683, "epoch": 2349} {"train_loss": -11.377164840698242, "global_step": 394684, "epoch": 2349} {"train_loss": -10.719008445739746, "global_step": 394685, "epoch": 2349} {"train_loss": -11.016522407531738, "global_step": 394686, "epoch": 2349} {"train_loss": -11.186214447021484, "global_step": 394687, "epoch": 2349} {"train_loss": -11.051127433776855, "global_step": 394688, "epoch": 2349} {"train_loss": -11.644396781921387, "global_step": 394689, "epoch": 2349} {"train_loss": -11.069112777709961, "global_step": 394690, "epoch": 2349} {"train_loss": -12.089211463928223, "global_step": 394691, "epoch": 2349} {"train_loss": -11.349937438964844, "global_step": 394692, "epoch": 2349} {"train_loss": -11.899182319641113, "global_step": 394693, "epoch": 2349} {"train_loss": -11.844779968261719, "global_step": 394694, "epoch": 2349} {"train_loss": -11.773849487304688, "global_step": 394695, "epoch": 2349} {"train_loss": -11.815251350402832, "global_step": 394696, "epoch": 2349} {"train_loss": -12.0433349609375, "global_step": 394697, "epoch": 2349} {"train_loss": -11.924741744995117, "global_step": 394698, "epoch": 2349} {"train_loss": -12.061426162719727, "global_step": 394699, "epoch": 2349} {"train_loss": -11.964975357055664, "global_step": 394700, "epoch": 2349} {"train_loss": -12.055742263793945, "global_step": 394701, "epoch": 2349} {"train_loss": -12.185981750488281, "global_step": 394702, "epoch": 2349} {"train_loss": -12.057456970214844, "global_step": 394703, "epoch": 2349} {"train_loss": -12.283653259277344, "global_step": 394704, "epoch": 2349} {"train_loss": -12.055170059204102, "global_step": 394705, "epoch": 2349} {"train_loss": -11.919357299804688, "global_step": 394706, "epoch": 2349} {"train_loss": -11.985870361328125, "global_step": 394707, "epoch": 2349} {"train_loss": -12.01819896697998, "global_step": 394708, "epoch": 2349} {"train_loss": -12.437368392944336, "global_step": 394709, "epoch": 2349} {"train_loss": -12.227606773376465, "global_step": 394710, "epoch": 2349} {"train_loss": -11.970710754394531, "global_step": 394711, "epoch": 2349} {"train_loss": -12.319756507873535, "global_step": 394712, "epoch": 2349} {"train_loss": -12.078824996948242, "global_step": 394713, "epoch": 2349} {"train_loss": -12.477296829223633, "global_step": 394714, "epoch": 2349} {"train_loss": -12.442649841308594, "global_step": 394715, "epoch": 2349} {"train_loss": -12.273176193237305, "global_step": 394716, "epoch": 2349} {"train_loss": -12.432775497436523, "global_step": 394717, "epoch": 2349} {"train_loss": -12.274116516113281, "global_step": 394718, "epoch": 2349} {"train_loss": -12.358091354370117, "global_step": 394719, "epoch": 2349} {"train_loss": -12.252103805541992, "global_step": 394720, "epoch": 2349} {"train_loss": -12.292013168334961, "global_step": 394721, "epoch": 2349} {"train_loss": -12.380803108215332, "global_step": 394722, "epoch": 2349} {"train_loss": -12.480892181396484, "global_step": 394723, "epoch": 2349} {"train_loss": -12.37952709197998, "global_step": 394724, "epoch": 2349} {"train_loss": -12.706778526306152, "global_step": 394725, "epoch": 2349} {"train_loss": -12.42143440246582, "global_step": 394726, "epoch": 2349} {"train_loss": -12.19887924194336, "global_step": 394727, "epoch": 2349} {"train_loss": -12.424779891967773, "global_step": 394728, "epoch": 2349} {"train_loss": -12.336713790893555, "global_step": 394729, "epoch": 2349} {"train_loss": -12.466497421264648, "global_step": 394730, "epoch": 2349} {"train_loss": -12.433545112609863, "global_step": 394731, "epoch": 2349} {"train_loss": -12.251298904418945, "global_step": 394732, "epoch": 2349} {"train_loss": -12.734997749328613, "global_step": 394733, "epoch": 2349} {"train_loss": -12.382026672363281, "global_step": 394734, "epoch": 2349} {"train_loss": -12.585165023803711, "global_step": 394735, "epoch": 2349} {"train_loss": -12.194940567016602, "global_step": 394736, "epoch": 2349} {"train_loss": -12.567026138305664, "global_step": 394737, "epoch": 2349} {"train_loss": -12.311684608459473, "global_step": 394738, "epoch": 2349} {"train_loss": -12.544340133666992, "global_step": 394739, "epoch": 2349} {"train_loss": -12.695671081542969, "global_step": 394740, "epoch": 2349} {"train_loss": -12.620243072509766, "global_step": 394741, "epoch": 2349} {"train_loss": -12.424674987792969, "global_step": 394742, "epoch": 2349} {"train_loss": -12.486682891845703, "global_step": 394743, "epoch": 2349} {"train_loss": -12.827437400817871, "global_step": 394744, "epoch": 2349} {"train_loss": -12.41611099243164, "global_step": 394745, "epoch": 2349} {"train_loss": -12.616265296936035, "global_step": 394746, "epoch": 2349} {"train_loss": -12.583955764770508, "global_step": 394747, "epoch": 2349} {"train_loss": -12.70233154296875, "global_step": 394748, "epoch": 2349} {"train_loss": -12.608255386352539, "global_step": 394749, "epoch": 2349} {"train_loss": -12.674633979797363, "global_step": 394750, "epoch": 2349} {"train_loss": -12.692339897155762, "global_step": 394751, "epoch": 2349} {"train_loss": -12.575216293334961, "global_step": 394752, "epoch": 2349} {"train_loss": -12.760226249694824, "global_step": 394753, "epoch": 2349} {"train_loss": -12.688455581665039, "global_step": 394754, "epoch": 2349} {"train_loss": -12.684430122375488, "global_step": 394755, "epoch": 2349} {"train_loss": -12.738619804382324, "global_step": 394756, "epoch": 2349} {"train_loss": -12.509567260742188, "global_step": 394757, "epoch": 2349} {"train_loss": -12.666982650756836, "global_step": 394758, "epoch": 2349} {"train_loss": -12.818644523620605, "global_step": 394759, "epoch": 2349} {"train_loss": -12.634187698364258, "global_step": 394760, "epoch": 2349} {"train_loss": -12.608877182006836, "global_step": 394761, "epoch": 2349} {"train_loss": -12.980079650878906, "global_step": 394762, "epoch": 2349} {"train_loss": -12.774662017822266, "global_step": 394763, "epoch": 2349} {"train_loss": -12.7547025680542, "global_step": 394764, "epoch": 2349} {"train_loss": -12.52646541595459, "global_step": 394765, "epoch": 2349} {"train_loss": -12.757338523864746, "global_step": 394766, "epoch": 2349} {"train_loss": -12.904943466186523, "global_step": 394767, "epoch": 2349} {"train_loss": -12.721884727478027, "global_step": 394768, "epoch": 2349} {"train_loss": -12.719027519226074, "global_step": 394769, "epoch": 2349} {"train_loss": -13.069411277770996, "global_step": 394770, "epoch": 2349} {"train_loss": -12.962573051452637, "global_step": 394771, "epoch": 2349} {"train_loss": -12.826567649841309, "global_step": 394772, "epoch": 2349} {"train_loss": -12.912171363830566, "global_step": 394773, "epoch": 2349} {"train_loss": -12.844200134277344, "global_step": 394774, "epoch": 2349} {"train_loss": -12.692034721374512, "global_step": 394775, "epoch": 2349} {"train_loss": -12.943130493164062, "global_step": 394776, "epoch": 2349} {"train_loss": -12.804180145263672, "global_step": 394777, "epoch": 2349} {"train_loss": -12.848844528198242, "global_step": 394778, "epoch": 2349} {"train_loss": -12.655006408691406, "global_step": 394779, "epoch": 2349} {"train_loss": -12.591896057128906, "global_step": 394780, "epoch": 2349} {"train_loss": -12.723945617675781, "global_step": 394781, "epoch": 2349} {"train_loss": -12.441790580749512, "global_step": 394782, "epoch": 2349} {"train_loss": -12.309703826904297, "global_step": 394783, "epoch": 2349} {"train_loss": -12.591775894165039, "global_step": 394784, "epoch": 2349} {"train_loss": -12.597378730773926, "global_step": 394785, "epoch": 2349} {"train_loss": -12.783209800720215, "global_step": 394786, "epoch": 2349} {"train_loss": -12.12887191772461, "global_step": 394787, "epoch": 2349} {"train_loss": -11.50225830078125, "global_step": 394788, "epoch": 2349} {"train_loss": -12.131662368774414, "global_step": 394789, "epoch": 2349} {"train_loss": -12.543047904968262, "global_step": 394790, "epoch": 2349} {"train_loss": -11.408843994140625, "global_step": 394791, "epoch": 2349} {"train_loss": -10.960713386535645, "global_step": 394792, "epoch": 2349} {"train_loss": -11.253862380981445, "global_step": 394793, "epoch": 2349} {"train_loss": -11.992891311645508, "global_step": 394794, "epoch": 2349} {"train_loss": -10.433931350708008, "global_step": 394795, "epoch": 2349} {"train_loss": -10.679187774658203, "global_step": 394796, "epoch": 2349} {"train_loss": -10.14932632446289, "global_step": 394797, "epoch": 2349} {"train_loss": -10.40079116821289, "global_step": 394798, "epoch": 2349} {"train_loss": -11.786406803698767, "global_step": 394799, "epoch": 2349, "val_loss": 300974.84375} {"train_loss": -11.970100402832031, "global_step": 394800, "epoch": 2350} {"train_loss": -10.07693862915039, "global_step": 394801, "epoch": 2350} {"train_loss": -9.113567352294922, "global_step": 394802, "epoch": 2350} {"train_loss": -11.069032669067383, "global_step": 394803, "epoch": 2350} {"train_loss": -10.47945499420166, "global_step": 394804, "epoch": 2350} {"train_loss": -10.1841402053833, "global_step": 394805, "epoch": 2350} {"train_loss": -11.082626342773438, "global_step": 394806, "epoch": 2350} {"train_loss": -10.145767211914062, "global_step": 394807, "epoch": 2350} {"train_loss": -10.928852081298828, "global_step": 394808, "epoch": 2350} {"train_loss": -10.883773803710938, "global_step": 394809, "epoch": 2350} {"train_loss": -11.59627914428711, "global_step": 394810, "epoch": 2350} {"train_loss": -11.216917037963867, "global_step": 394811, "epoch": 2350} {"train_loss": -11.08001708984375, "global_step": 394812, "epoch": 2350} {"train_loss": -11.290632247924805, "global_step": 394813, "epoch": 2350} {"train_loss": -11.533384323120117, "global_step": 394814, "epoch": 2350} {"train_loss": -11.015088081359863, "global_step": 394815, "epoch": 2350} {"train_loss": -11.170763969421387, "global_step": 394816, "epoch": 2350} {"train_loss": -9.51501750946045, "global_step": 394817, "epoch": 2350} {"train_loss": -9.574451446533203, "global_step": 394818, "epoch": 2350} {"train_loss": -11.406845092773438, "global_step": 394819, "epoch": 2350} {"train_loss": -8.979720115661621, "global_step": 394820, "epoch": 2350} {"train_loss": -9.49303150177002, "global_step": 394821, "epoch": 2350} {"train_loss": -9.162847518920898, "global_step": 394822, "epoch": 2350} {"train_loss": -10.122110366821289, "global_step": 394823, "epoch": 2350} {"train_loss": -10.965346336364746, "global_step": 394824, "epoch": 2350} {"train_loss": -8.844438552856445, "global_step": 394825, "epoch": 2350} {"train_loss": -10.740388870239258, "global_step": 394826, "epoch": 2350} {"train_loss": -10.733211517333984, "global_step": 394827, "epoch": 2350} {"train_loss": -10.656577110290527, "global_step": 394828, "epoch": 2350} {"train_loss": -10.994611740112305, "global_step": 394829, "epoch": 2350} {"train_loss": -10.56004524230957, "global_step": 394830, "epoch": 2350} {"train_loss": -11.219602584838867, "global_step": 394831, "epoch": 2350} {"train_loss": -10.745683670043945, "global_step": 394832, "epoch": 2350} {"train_loss": -10.107741355895996, "global_step": 394833, "epoch": 2350} {"train_loss": -11.680526733398438, "global_step": 394834, "epoch": 2350} {"train_loss": -10.242865562438965, "global_step": 394835, "epoch": 2350} {"train_loss": -10.946995735168457, "global_step": 394836, "epoch": 2350} {"train_loss": -11.702072143554688, "global_step": 394837, "epoch": 2350} {"train_loss": -10.90268325805664, "global_step": 394838, "epoch": 2350} {"train_loss": -11.216968536376953, "global_step": 394839, "epoch": 2350} {"train_loss": -11.44758415222168, "global_step": 394840, "epoch": 2350} {"train_loss": -11.444585800170898, "global_step": 394841, "epoch": 2350} {"train_loss": -11.525617599487305, "global_step": 394842, "epoch": 2350} {"train_loss": -10.990331649780273, "global_step": 394843, "epoch": 2350} {"train_loss": -11.74105453491211, "global_step": 394844, "epoch": 2350} {"train_loss": -11.553546905517578, "global_step": 394845, "epoch": 2350} {"train_loss": -10.254863739013672, "global_step": 394846, "epoch": 2350} {"train_loss": -11.47339153289795, "global_step": 394847, "epoch": 2350} {"train_loss": -10.889885902404785, "global_step": 394848, "epoch": 2350} {"train_loss": -11.043981552124023, "global_step": 394849, "epoch": 2350} {"train_loss": -12.141243934631348, "global_step": 394850, "epoch": 2350} {"train_loss": -11.189733505249023, "global_step": 394851, "epoch": 2350} {"train_loss": -11.824000358581543, "global_step": 394852, "epoch": 2350} {"train_loss": -11.596817016601562, "global_step": 394853, "epoch": 2350} {"train_loss": -11.519996643066406, "global_step": 394854, "epoch": 2350} {"train_loss": -12.039432525634766, "global_step": 394855, "epoch": 2350} {"train_loss": -11.956897735595703, "global_step": 394856, "epoch": 2350} {"train_loss": -11.801640510559082, "global_step": 394857, "epoch": 2350} {"train_loss": -11.757261276245117, "global_step": 394858, "epoch": 2350} {"train_loss": -11.613645553588867, "global_step": 394859, "epoch": 2350} {"train_loss": -11.773588180541992, "global_step": 394860, "epoch": 2350} {"train_loss": -12.192980766296387, "global_step": 394861, "epoch": 2350} {"train_loss": -11.81783676147461, "global_step": 394862, "epoch": 2350} {"train_loss": -12.084357261657715, "global_step": 394863, "epoch": 2350} {"train_loss": -12.146951675415039, "global_step": 394864, "epoch": 2350} {"train_loss": -11.834210395812988, "global_step": 394865, "epoch": 2350} {"train_loss": -12.111505508422852, "global_step": 394866, "epoch": 2350} {"train_loss": -12.255043029785156, "global_step": 394867, "epoch": 2350} {"train_loss": -11.787141799926758, "global_step": 394868, "epoch": 2350} {"train_loss": -12.37451171875, "global_step": 394869, "epoch": 2350} {"train_loss": -12.133687973022461, "global_step": 394870, "epoch": 2350} {"train_loss": -12.23669719696045, "global_step": 394871, "epoch": 2350} {"train_loss": -12.255951881408691, "global_step": 394872, "epoch": 2350} {"train_loss": -12.128074645996094, "global_step": 394873, "epoch": 2350} {"train_loss": -12.275007247924805, "global_step": 394874, "epoch": 2350} {"train_loss": -12.203125953674316, "global_step": 394875, "epoch": 2350} {"train_loss": -12.164220809936523, "global_step": 394876, "epoch": 2350} {"train_loss": -12.163148880004883, "global_step": 394877, "epoch": 2350} {"train_loss": -12.23478889465332, "global_step": 394878, "epoch": 2350} {"train_loss": -12.414153099060059, "global_step": 394879, "epoch": 2350} {"train_loss": -12.127433776855469, "global_step": 394880, "epoch": 2350} {"train_loss": -12.362476348876953, "global_step": 394881, "epoch": 2350} {"train_loss": -12.502787590026855, "global_step": 394882, "epoch": 2350} {"train_loss": -12.385190963745117, "global_step": 394883, "epoch": 2350} {"train_loss": -12.512940406799316, "global_step": 394884, "epoch": 2350} {"train_loss": -12.373847007751465, "global_step": 394885, "epoch": 2350} {"train_loss": -12.36866283416748, "global_step": 394886, "epoch": 2350} {"train_loss": -12.465587615966797, "global_step": 394887, "epoch": 2350} {"train_loss": -12.59532356262207, "global_step": 394888, "epoch": 2350} {"train_loss": -12.488265037536621, "global_step": 394889, "epoch": 2350} {"train_loss": -12.349013328552246, "global_step": 394890, "epoch": 2350} {"train_loss": -12.543585777282715, "global_step": 394891, "epoch": 2350} {"train_loss": -12.556411743164062, "global_step": 394892, "epoch": 2350} {"train_loss": -12.692095756530762, "global_step": 394893, "epoch": 2350} {"train_loss": -12.551135063171387, "global_step": 394894, "epoch": 2350} {"train_loss": -12.482210159301758, "global_step": 394895, "epoch": 2350} {"train_loss": -12.410600662231445, "global_step": 394896, "epoch": 2350} {"train_loss": -12.62030029296875, "global_step": 394897, "epoch": 2350} {"train_loss": -12.67357063293457, "global_step": 394898, "epoch": 2350} {"train_loss": -12.565391540527344, "global_step": 394899, "epoch": 2350} {"train_loss": -12.517278671264648, "global_step": 394900, "epoch": 2350} {"train_loss": -12.546394348144531, "global_step": 394901, "epoch": 2350} {"train_loss": -12.592483520507812, "global_step": 394902, "epoch": 2350} {"train_loss": -12.533540725708008, "global_step": 394903, "epoch": 2350} {"train_loss": -12.658927917480469, "global_step": 394904, "epoch": 2350} {"train_loss": -12.525455474853516, "global_step": 394905, "epoch": 2350} {"train_loss": -12.541448593139648, "global_step": 394906, "epoch": 2350} {"train_loss": -12.886570930480957, "global_step": 394907, "epoch": 2350} {"train_loss": -12.655900955200195, "global_step": 394908, "epoch": 2350} {"train_loss": -12.67100715637207, "global_step": 394909, "epoch": 2350} {"train_loss": -12.612775802612305, "global_step": 394910, "epoch": 2350} {"train_loss": -12.486652374267578, "global_step": 394911, "epoch": 2350} {"train_loss": -12.361310958862305, "global_step": 394912, "epoch": 2350} {"train_loss": -12.40477180480957, "global_step": 394913, "epoch": 2350} {"train_loss": -12.723093032836914, "global_step": 394914, "epoch": 2350} {"train_loss": -12.755958557128906, "global_step": 394915, "epoch": 2350} {"train_loss": -12.724629402160645, "global_step": 394916, "epoch": 2350} {"train_loss": -12.731124877929688, "global_step": 394917, "epoch": 2350} {"train_loss": -12.57476806640625, "global_step": 394918, "epoch": 2350} {"train_loss": -12.592662811279297, "global_step": 394919, "epoch": 2350} {"train_loss": -12.349431991577148, "global_step": 394920, "epoch": 2350} {"train_loss": -12.636810302734375, "global_step": 394921, "epoch": 2350} {"train_loss": -12.550464630126953, "global_step": 394922, "epoch": 2350} {"train_loss": -12.333683013916016, "global_step": 394923, "epoch": 2350} {"train_loss": -12.60307502746582, "global_step": 394924, "epoch": 2350} {"train_loss": -12.79300308227539, "global_step": 394925, "epoch": 2350} {"train_loss": -12.381189346313477, "global_step": 394926, "epoch": 2350} {"train_loss": -12.941224098205566, "global_step": 394927, "epoch": 2350} {"train_loss": -12.361191749572754, "global_step": 394928, "epoch": 2350} {"train_loss": -12.24333381652832, "global_step": 394929, "epoch": 2350} {"train_loss": -12.351364135742188, "global_step": 394930, "epoch": 2350} {"train_loss": -12.628510475158691, "global_step": 394931, "epoch": 2350} {"train_loss": -12.284517288208008, "global_step": 394932, "epoch": 2350} {"train_loss": -12.242066383361816, "global_step": 394933, "epoch": 2350} {"train_loss": -12.823902130126953, "global_step": 394934, "epoch": 2350} {"train_loss": -12.334600448608398, "global_step": 394935, "epoch": 2350} {"train_loss": -11.970100402832031, "global_step": 394936, "epoch": 2350} {"train_loss": -12.037154197692871, "global_step": 394937, "epoch": 2350} {"train_loss": -12.487262725830078, "global_step": 394938, "epoch": 2350} {"train_loss": -12.034480094909668, "global_step": 394939, "epoch": 2350} {"train_loss": -11.448650360107422, "global_step": 394940, "epoch": 2350} {"train_loss": -12.247583389282227, "global_step": 394941, "epoch": 2350} {"train_loss": -12.044662475585938, "global_step": 394942, "epoch": 2350} {"train_loss": -11.220294952392578, "global_step": 394943, "epoch": 2350} {"train_loss": -11.948883056640625, "global_step": 394944, "epoch": 2350} {"train_loss": -12.351561546325684, "global_step": 394945, "epoch": 2350} {"train_loss": -12.195281982421875, "global_step": 394946, "epoch": 2350} {"train_loss": -11.887474060058594, "global_step": 394947, "epoch": 2350} {"train_loss": -12.478981018066406, "global_step": 394948, "epoch": 2350} {"train_loss": -10.836118698120117, "global_step": 394949, "epoch": 2350} {"train_loss": -11.279577255249023, "global_step": 394950, "epoch": 2350} {"train_loss": -12.301214218139648, "global_step": 394951, "epoch": 2350} {"train_loss": -11.47574234008789, "global_step": 394952, "epoch": 2350} {"train_loss": -11.314388275146484, "global_step": 394953, "epoch": 2350} {"train_loss": -12.094732284545898, "global_step": 394954, "epoch": 2350} {"train_loss": -10.850287437438965, "global_step": 394955, "epoch": 2350} {"train_loss": -11.667333602905273, "global_step": 394956, "epoch": 2350} {"train_loss": -10.103395462036133, "global_step": 394957, "epoch": 2350} {"train_loss": -11.890262603759766, "global_step": 394958, "epoch": 2350} {"train_loss": -9.028543472290039, "global_step": 394959, "epoch": 2350} {"train_loss": -8.106521606445312, "global_step": 394960, "epoch": 2350} {"train_loss": -7.821544170379639, "global_step": 394961, "epoch": 2350} {"train_loss": -8.54319953918457, "global_step": 394962, "epoch": 2350} {"train_loss": -9.181785583496094, "global_step": 394963, "epoch": 2350} {"train_loss": -10.128267288208008, "global_step": 394964, "epoch": 2350} {"train_loss": -10.28342056274414, "global_step": 394965, "epoch": 2350} {"train_loss": -9.448253631591797, "global_step": 394966, "epoch": 2350} {"train_loss": -11.616085418633052, "global_step": 394967, "epoch": 2350, "train/sim_max_reward_0": 0.5398483433127375, "train/sim_max_reward_1": 0.9831212926553724, "train/sim_max_reward_2": 0.02426523822607819, "train/sim_max_reward_3": 0.6871045922935591, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.5702213923999667, "test/sim_max_reward_4400000": 0.9334778562128172, "test/sim_max_reward_4400001": 0.3665064065951535, "test/sim_max_reward_4400002": 0.9887945803690582, "test/sim_max_reward_4400003": 0.31065726995056253, "test/sim_max_reward_4400004": 0.42197642794114065, "test/sim_max_reward_4400005": 0.9946026887662817, "test/sim_max_reward_4400006": 0.2427612862300619, "test/sim_max_reward_4400007": 0.4968644791900039, "test/sim_max_reward_4400008": 0.6151923974090718, "test/sim_max_reward_4400009": 0.327070173309846, "test/sim_max_reward_4400010": 0.9511553880574776, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 0.40213123705826387, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.5097764407160443, "test/sim_max_reward_4400015": 0.9351938550500094, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.10066088376342504, "test/sim_max_reward_4400018": 0.9723760010230038, "test/sim_max_reward_4400019": 0.17432400277136204, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.6601571711556772, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.00589689348845146, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.5745908022996311, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.17760751167823602, "test/sim_max_reward_4400028": 1.0, "test/sim_max_reward_4400029": 0.7633105548945774, "test/sim_max_reward_4400030": 0.9739887914983975, "test/sim_max_reward_4400031": 0.9952147139584151, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.5735201819241221, "test/sim_max_reward_4400034": 0.9687088595702805, "test/sim_max_reward_4400035": 0.5881600729164378, "test/sim_max_reward_4400036": 1.0, "test/sim_max_reward_4400037": 0.8731126058714227, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.18312466488557821, "test/sim_max_reward_4400042": 1.0, "test/sim_max_reward_4400043": 0.019913828622171705, "test/sim_max_reward_4400044": 0.5448608863423449, "test/sim_max_reward_4400045": 0.9226327221337729, "test/sim_max_reward_4400046": 0.33216884204376057, "test/sim_max_reward_4400047": 0.9862705179372189, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6340934764812857, "test/mean_score": 0.5597055613612408, "val_loss": 300810.40625, "train_action_mse_error": 0.8468916416168213} {"train_loss": -9.949065208435059, "global_step": 394968, "epoch": 2351} {"train_loss": -9.104145050048828, "global_step": 394969, "epoch": 2351} {"train_loss": -10.936220169067383, "global_step": 394970, "epoch": 2351} {"train_loss": -10.088495254516602, "global_step": 394971, "epoch": 2351} {"train_loss": -11.105888366699219, "global_step": 394972, "epoch": 2351} {"train_loss": -10.773021697998047, "global_step": 394973, "epoch": 2351} {"train_loss": -10.354730606079102, "global_step": 394974, "epoch": 2351} {"train_loss": -10.261801719665527, "global_step": 394975, "epoch": 2351} {"train_loss": -10.557560920715332, "global_step": 394976, "epoch": 2351} {"train_loss": -10.663660049438477, "global_step": 394977, "epoch": 2351} {"train_loss": -11.578695297241211, "global_step": 394978, "epoch": 2351} {"train_loss": -11.052696228027344, "global_step": 394979, "epoch": 2351} {"train_loss": -10.602540969848633, "global_step": 394980, "epoch": 2351} {"train_loss": -11.287620544433594, "global_step": 394981, "epoch": 2351} {"train_loss": -10.53272533416748, "global_step": 394982, "epoch": 2351} {"train_loss": -11.452153205871582, "global_step": 394983, "epoch": 2351} {"train_loss": -11.620260238647461, "global_step": 394984, "epoch": 2351} {"train_loss": -11.843201637268066, "global_step": 394985, "epoch": 2351} {"train_loss": -11.34533977508545, "global_step": 394986, "epoch": 2351} {"train_loss": -11.344736099243164, "global_step": 394987, "epoch": 2351} {"train_loss": -11.284189224243164, "global_step": 394988, "epoch": 2351} {"train_loss": -11.617673873901367, "global_step": 394989, "epoch": 2351} {"train_loss": -11.420865058898926, "global_step": 394990, "epoch": 2351} {"train_loss": -11.67564582824707, "global_step": 394991, "epoch": 2351} {"train_loss": -11.592126846313477, "global_step": 394992, "epoch": 2351} {"train_loss": -12.011262893676758, "global_step": 394993, "epoch": 2351} {"train_loss": -11.762149810791016, "global_step": 394994, "epoch": 2351} {"train_loss": -11.899139404296875, "global_step": 394995, "epoch": 2351} {"train_loss": -11.721654891967773, "global_step": 394996, "epoch": 2351} {"train_loss": -11.6443452835083, "global_step": 394997, "epoch": 2351} {"train_loss": -11.604930877685547, "global_step": 394998, "epoch": 2351} {"train_loss": -11.92308235168457, "global_step": 394999, "epoch": 2351} {"train_loss": -11.843997955322266, "global_step": 395000, "epoch": 2351} {"train_loss": -11.773107528686523, "global_step": 395001, "epoch": 2351} {"train_loss": -11.829710006713867, "global_step": 395002, "epoch": 2351} {"train_loss": -11.728736877441406, "global_step": 395003, "epoch": 2351} {"train_loss": -11.919659614562988, "global_step": 395004, "epoch": 2351} {"train_loss": -12.111250877380371, "global_step": 395005, "epoch": 2351} {"train_loss": -12.127914428710938, "global_step": 395006, "epoch": 2351} {"train_loss": -12.268725395202637, "global_step": 395007, "epoch": 2351} {"train_loss": -11.668652534484863, "global_step": 395008, "epoch": 2351} {"train_loss": -12.005906105041504, "global_step": 395009, "epoch": 2351} {"train_loss": -12.008606910705566, "global_step": 395010, "epoch": 2351} {"train_loss": -12.067831993103027, "global_step": 395011, "epoch": 2351} {"train_loss": -12.254722595214844, "global_step": 395012, "epoch": 2351} {"train_loss": -12.31572151184082, "global_step": 395013, "epoch": 2351} {"train_loss": -12.431659698486328, "global_step": 395014, "epoch": 2351} {"train_loss": -11.91531753540039, "global_step": 395015, "epoch": 2351} {"train_loss": -12.180902481079102, "global_step": 395016, "epoch": 2351} {"train_loss": -12.103801727294922, "global_step": 395017, "epoch": 2351} {"train_loss": -12.295724868774414, "global_step": 395018, "epoch": 2351} {"train_loss": -11.983393669128418, "global_step": 395019, "epoch": 2351} {"train_loss": -12.14062213897705, "global_step": 395020, "epoch": 2351} {"train_loss": -12.322977066040039, "global_step": 395021, "epoch": 2351} {"train_loss": -12.208024978637695, "global_step": 395022, "epoch": 2351} {"train_loss": -12.086017608642578, "global_step": 395023, "epoch": 2351} {"train_loss": -11.963454246520996, "global_step": 395024, "epoch": 2351} {"train_loss": -11.925735473632812, "global_step": 395025, "epoch": 2351} {"train_loss": -12.346002578735352, "global_step": 395026, "epoch": 2351} {"train_loss": -11.84909439086914, "global_step": 395027, "epoch": 2351} {"train_loss": -12.153276443481445, "global_step": 395028, "epoch": 2351} {"train_loss": -12.18794059753418, "global_step": 395029, "epoch": 2351} {"train_loss": -12.007296562194824, "global_step": 395030, "epoch": 2351} {"train_loss": -12.462082862854004, "global_step": 395031, "epoch": 2351} {"train_loss": -12.292057037353516, "global_step": 395032, "epoch": 2351} {"train_loss": -12.476762771606445, "global_step": 395033, "epoch": 2351} {"train_loss": -12.073914527893066, "global_step": 395034, "epoch": 2351} {"train_loss": -12.321266174316406, "global_step": 395035, "epoch": 2351} {"train_loss": -12.44327163696289, "global_step": 395036, "epoch": 2351} {"train_loss": -12.226261138916016, "global_step": 395037, "epoch": 2351} {"train_loss": -12.513463973999023, "global_step": 395038, "epoch": 2351} {"train_loss": -12.108830451965332, "global_step": 395039, "epoch": 2351} {"train_loss": -12.605084419250488, "global_step": 395040, "epoch": 2351} {"train_loss": -12.366491317749023, "global_step": 395041, "epoch": 2351} {"train_loss": -12.346491813659668, "global_step": 395042, "epoch": 2351} {"train_loss": -12.360636711120605, "global_step": 395043, "epoch": 2351} {"train_loss": -12.371532440185547, "global_step": 395044, "epoch": 2351} {"train_loss": -12.26388931274414, "global_step": 395045, "epoch": 2351} {"train_loss": -12.53408432006836, "global_step": 395046, "epoch": 2351} {"train_loss": -12.670263290405273, "global_step": 395047, "epoch": 2351} {"train_loss": -12.474101066589355, "global_step": 395048, "epoch": 2351} {"train_loss": -12.460733413696289, "global_step": 395049, "epoch": 2351} {"train_loss": -12.490667343139648, "global_step": 395050, "epoch": 2351} {"train_loss": -12.604060173034668, "global_step": 395051, "epoch": 2351} {"train_loss": -12.41083812713623, "global_step": 395052, "epoch": 2351} {"train_loss": -12.715621948242188, "global_step": 395053, "epoch": 2351} {"train_loss": -12.552816390991211, "global_step": 395054, "epoch": 2351} {"train_loss": -12.495647430419922, "global_step": 395055, "epoch": 2351} {"train_loss": -12.43780517578125, "global_step": 395056, "epoch": 2351} {"train_loss": -12.219100952148438, "global_step": 395057, "epoch": 2351} {"train_loss": -12.574317932128906, "global_step": 395058, "epoch": 2351} {"train_loss": -12.3923921585083, "global_step": 395059, "epoch": 2351} {"train_loss": -12.568460464477539, "global_step": 395060, "epoch": 2351} {"train_loss": -12.437283515930176, "global_step": 395061, "epoch": 2351} {"train_loss": -12.599508285522461, "global_step": 395062, "epoch": 2351} {"train_loss": -12.64114761352539, "global_step": 395063, "epoch": 2351} {"train_loss": -12.475105285644531, "global_step": 395064, "epoch": 2351} {"train_loss": -12.473224639892578, "global_step": 395065, "epoch": 2351} {"train_loss": -12.554021835327148, "global_step": 395066, "epoch": 2351} {"train_loss": -12.504878997802734, "global_step": 395067, "epoch": 2351} {"train_loss": -12.54374885559082, "global_step": 395068, "epoch": 2351} {"train_loss": -12.596908569335938, "global_step": 395069, "epoch": 2351} {"train_loss": -12.605931282043457, "global_step": 395070, "epoch": 2351} {"train_loss": -12.522247314453125, "global_step": 395071, "epoch": 2351} {"train_loss": -12.430584907531738, "global_step": 395072, "epoch": 2351} {"train_loss": -12.63742446899414, "global_step": 395073, "epoch": 2351} {"train_loss": -12.214361190795898, "global_step": 395074, "epoch": 2351} {"train_loss": -12.167257308959961, "global_step": 395075, "epoch": 2351} {"train_loss": -12.639047622680664, "global_step": 395076, "epoch": 2351} {"train_loss": -12.699836730957031, "global_step": 395077, "epoch": 2351} {"train_loss": -12.639331817626953, "global_step": 395078, "epoch": 2351} {"train_loss": -12.470842361450195, "global_step": 395079, "epoch": 2351} {"train_loss": -12.525145530700684, "global_step": 395080, "epoch": 2351} {"train_loss": -11.73431396484375, "global_step": 395081, "epoch": 2351} {"train_loss": -11.652863502502441, "global_step": 395082, "epoch": 2351} {"train_loss": -12.205257415771484, "global_step": 395083, "epoch": 2351} {"train_loss": -11.36929702758789, "global_step": 395084, "epoch": 2351} {"train_loss": -11.876846313476562, "global_step": 395085, "epoch": 2351} {"train_loss": -11.987665176391602, "global_step": 395086, "epoch": 2351} {"train_loss": -11.406027793884277, "global_step": 395087, "epoch": 2351} {"train_loss": -12.375285148620605, "global_step": 395088, "epoch": 2351} {"train_loss": -12.09172248840332, "global_step": 395089, "epoch": 2351} {"train_loss": -12.373479843139648, "global_step": 395090, "epoch": 2351} {"train_loss": -12.099283218383789, "global_step": 395091, "epoch": 2351} {"train_loss": -12.4946928024292, "global_step": 395092, "epoch": 2351} {"train_loss": -12.277473449707031, "global_step": 395093, "epoch": 2351} {"train_loss": -12.140314102172852, "global_step": 395094, "epoch": 2351} {"train_loss": -12.187214851379395, "global_step": 395095, "epoch": 2351} {"train_loss": -11.324414253234863, "global_step": 395096, "epoch": 2351} {"train_loss": -12.207771301269531, "global_step": 395097, "epoch": 2351} {"train_loss": -11.441293716430664, "global_step": 395098, "epoch": 2351} {"train_loss": -11.746339797973633, "global_step": 395099, "epoch": 2351} {"train_loss": -11.264424324035645, "global_step": 395100, "epoch": 2351} {"train_loss": -10.34957504272461, "global_step": 395101, "epoch": 2351} {"train_loss": -11.126869201660156, "global_step": 395102, "epoch": 2351} {"train_loss": -11.119464874267578, "global_step": 395103, "epoch": 2351} {"train_loss": -11.258644104003906, "global_step": 395104, "epoch": 2351} {"train_loss": -9.671062469482422, "global_step": 395105, "epoch": 2351} {"train_loss": -9.316400527954102, "global_step": 395106, "epoch": 2351} {"train_loss": -10.782917022705078, "global_step": 395107, "epoch": 2351} {"train_loss": -10.617134094238281, "global_step": 395108, "epoch": 2351} {"train_loss": -10.76789379119873, "global_step": 395109, "epoch": 2351} {"train_loss": -11.126379013061523, "global_step": 395110, "epoch": 2351} {"train_loss": -11.719198226928711, "global_step": 395111, "epoch": 2351} {"train_loss": -10.51112174987793, "global_step": 395112, "epoch": 2351} {"train_loss": -11.009843826293945, "global_step": 395113, "epoch": 2351} {"train_loss": -11.909543991088867, "global_step": 395114, "epoch": 2351} {"train_loss": -10.541597366333008, "global_step": 395115, "epoch": 2351} {"train_loss": -12.054191589355469, "global_step": 395116, "epoch": 2351} {"train_loss": -11.294116973876953, "global_step": 395117, "epoch": 2351} {"train_loss": -11.749382019042969, "global_step": 395118, "epoch": 2351} {"train_loss": -12.070274353027344, "global_step": 395119, "epoch": 2351} {"train_loss": -11.567777633666992, "global_step": 395120, "epoch": 2351} {"train_loss": -12.175714492797852, "global_step": 395121, "epoch": 2351} {"train_loss": -11.934637069702148, "global_step": 395122, "epoch": 2351} {"train_loss": -11.601030349731445, "global_step": 395123, "epoch": 2351} {"train_loss": -12.258935928344727, "global_step": 395124, "epoch": 2351} {"train_loss": -12.164530754089355, "global_step": 395125, "epoch": 2351} {"train_loss": -12.450996398925781, "global_step": 395126, "epoch": 2351} {"train_loss": -11.537065505981445, "global_step": 395127, "epoch": 2351} {"train_loss": -12.101885795593262, "global_step": 395128, "epoch": 2351} {"train_loss": -11.837682723999023, "global_step": 395129, "epoch": 2351} {"train_loss": -12.252506256103516, "global_step": 395130, "epoch": 2351} {"train_loss": -11.998022079467773, "global_step": 395131, "epoch": 2351} {"train_loss": -12.138172149658203, "global_step": 395132, "epoch": 2351} {"train_loss": -12.043546676635742, "global_step": 395133, "epoch": 2351} {"train_loss": -12.363580703735352, "global_step": 395134, "epoch": 2351} {"train_loss": -11.867653290430704, "global_step": 395135, "epoch": 2351, "val_loss": 299591.96875} {"train_loss": -12.251643180847168, "global_step": 395136, "epoch": 2352} {"train_loss": -12.241012573242188, "global_step": 395137, "epoch": 2352} {"train_loss": -12.284034729003906, "global_step": 395138, "epoch": 2352} {"train_loss": -12.077186584472656, "global_step": 395139, "epoch": 2352} {"train_loss": -12.195588111877441, "global_step": 395140, "epoch": 2352} {"train_loss": -12.075166702270508, "global_step": 395141, "epoch": 2352} {"train_loss": -12.245765686035156, "global_step": 395142, "epoch": 2352} {"train_loss": -12.450254440307617, "global_step": 395143, "epoch": 2352} {"train_loss": -12.12969970703125, "global_step": 395144, "epoch": 2352} {"train_loss": -12.32335090637207, "global_step": 395145, "epoch": 2352} {"train_loss": -12.395851135253906, "global_step": 395146, "epoch": 2352} {"train_loss": -12.51296329498291, "global_step": 395147, "epoch": 2352} {"train_loss": -12.543760299682617, "global_step": 395148, "epoch": 2352} {"train_loss": -12.347625732421875, "global_step": 395149, "epoch": 2352} {"train_loss": -12.274087905883789, "global_step": 395150, "epoch": 2352} {"train_loss": -12.610855102539062, "global_step": 395151, "epoch": 2352} {"train_loss": -12.367176055908203, "global_step": 395152, "epoch": 2352} {"train_loss": -12.81136703491211, "global_step": 395153, "epoch": 2352} {"train_loss": -12.57379150390625, "global_step": 395154, "epoch": 2352} {"train_loss": -12.58980655670166, "global_step": 395155, "epoch": 2352} {"train_loss": -12.528904914855957, "global_step": 395156, "epoch": 2352} {"train_loss": -12.58215618133545, "global_step": 395157, "epoch": 2352} {"train_loss": -12.712200164794922, "global_step": 395158, "epoch": 2352} {"train_loss": -12.686848640441895, "global_step": 395159, "epoch": 2352} {"train_loss": -12.461009979248047, "global_step": 395160, "epoch": 2352} {"train_loss": -12.501235961914062, "global_step": 395161, "epoch": 2352} {"train_loss": -12.473919868469238, "global_step": 395162, "epoch": 2352} {"train_loss": -12.452396392822266, "global_step": 395163, "epoch": 2352} {"train_loss": -12.2286376953125, "global_step": 395164, "epoch": 2352} {"train_loss": -12.622570037841797, "global_step": 395165, "epoch": 2352} {"train_loss": -12.460393905639648, "global_step": 395166, "epoch": 2352} {"train_loss": -12.584097862243652, "global_step": 395167, "epoch": 2352} {"train_loss": -12.44183349609375, "global_step": 395168, "epoch": 2352} {"train_loss": -12.802262306213379, "global_step": 395169, "epoch": 2352} {"train_loss": -12.64400863647461, "global_step": 395170, "epoch": 2352} {"train_loss": -12.60367202758789, "global_step": 395171, "epoch": 2352} {"train_loss": -12.60987663269043, "global_step": 395172, "epoch": 2352} {"train_loss": -12.602226257324219, "global_step": 395173, "epoch": 2352} {"train_loss": -12.652345657348633, "global_step": 395174, "epoch": 2352} {"train_loss": -12.359273910522461, "global_step": 395175, "epoch": 2352} {"train_loss": -12.142966270446777, "global_step": 395176, "epoch": 2352} {"train_loss": -12.60787582397461, "global_step": 395177, "epoch": 2352} {"train_loss": -12.068376541137695, "global_step": 395178, "epoch": 2352} {"train_loss": -12.201828002929688, "global_step": 395179, "epoch": 2352} {"train_loss": -11.888607025146484, "global_step": 395180, "epoch": 2352} {"train_loss": -11.650487899780273, "global_step": 395181, "epoch": 2352} {"train_loss": -12.551783561706543, "global_step": 395182, "epoch": 2352} {"train_loss": -11.702869415283203, "global_step": 395183, "epoch": 2352} {"train_loss": -10.6535005569458, "global_step": 395184, "epoch": 2352} {"train_loss": -12.552356719970703, "global_step": 395185, "epoch": 2352} {"train_loss": -11.772205352783203, "global_step": 395186, "epoch": 2352} {"train_loss": -11.37246036529541, "global_step": 395187, "epoch": 2352} {"train_loss": -11.406219482421875, "global_step": 395188, "epoch": 2352} {"train_loss": -10.85293197631836, "global_step": 395189, "epoch": 2352} {"train_loss": -12.010885238647461, "global_step": 395190, "epoch": 2352} {"train_loss": -10.581884384155273, "global_step": 395191, "epoch": 2352} {"train_loss": -12.067441940307617, "global_step": 395192, "epoch": 2352} {"train_loss": -9.895242691040039, "global_step": 395193, "epoch": 2352} {"train_loss": -11.845550537109375, "global_step": 395194, "epoch": 2352} {"train_loss": -10.770408630371094, "global_step": 395195, "epoch": 2352} {"train_loss": -10.925806999206543, "global_step": 395196, "epoch": 2352} {"train_loss": -11.876703262329102, "global_step": 395197, "epoch": 2352} {"train_loss": -10.410537719726562, "global_step": 395198, "epoch": 2352} {"train_loss": -12.146663665771484, "global_step": 395199, "epoch": 2352} {"train_loss": -10.942116737365723, "global_step": 395200, "epoch": 2352} {"train_loss": -11.529613494873047, "global_step": 395201, "epoch": 2352} {"train_loss": -10.791500091552734, "global_step": 395202, "epoch": 2352} {"train_loss": -11.763121604919434, "global_step": 395203, "epoch": 2352} {"train_loss": -10.711725234985352, "global_step": 395204, "epoch": 2352} {"train_loss": -9.20499324798584, "global_step": 395205, "epoch": 2352} {"train_loss": -12.063068389892578, "global_step": 395206, "epoch": 2352} {"train_loss": -9.788970947265625, "global_step": 395207, "epoch": 2352} {"train_loss": -11.075605392456055, "global_step": 395208, "epoch": 2352} {"train_loss": -10.924403190612793, "global_step": 395209, "epoch": 2352} {"train_loss": -11.948989868164062, "global_step": 395210, "epoch": 2352} {"train_loss": -10.026968002319336, "global_step": 395211, "epoch": 2352} {"train_loss": -10.741400718688965, "global_step": 395212, "epoch": 2352} {"train_loss": -10.860244750976562, "global_step": 395213, "epoch": 2352} {"train_loss": -10.419103622436523, "global_step": 395214, "epoch": 2352} {"train_loss": -9.965143203735352, "global_step": 395215, "epoch": 2352} {"train_loss": -10.432699203491211, "global_step": 395216, "epoch": 2352} {"train_loss": -10.4993896484375, "global_step": 395217, "epoch": 2352} {"train_loss": -10.61088752746582, "global_step": 395218, "epoch": 2352} {"train_loss": -10.819692611694336, "global_step": 395219, "epoch": 2352} {"train_loss": -11.2466402053833, "global_step": 395220, "epoch": 2352} {"train_loss": -10.873065948486328, "global_step": 395221, "epoch": 2352} {"train_loss": -11.16530990600586, "global_step": 395222, "epoch": 2352} {"train_loss": -11.581060409545898, "global_step": 395223, "epoch": 2352} {"train_loss": -11.249887466430664, "global_step": 395224, "epoch": 2352} {"train_loss": -11.845974922180176, "global_step": 395225, "epoch": 2352} {"train_loss": -11.496505737304688, "global_step": 395226, "epoch": 2352} {"train_loss": -11.853370666503906, "global_step": 395227, "epoch": 2352} {"train_loss": -11.678180694580078, "global_step": 395228, "epoch": 2352} {"train_loss": -11.81593132019043, "global_step": 395229, "epoch": 2352} {"train_loss": -11.680826187133789, "global_step": 395230, "epoch": 2352} {"train_loss": -12.050501823425293, "global_step": 395231, "epoch": 2352} {"train_loss": -11.707006454467773, "global_step": 395232, "epoch": 2352} {"train_loss": -11.933652877807617, "global_step": 395233, "epoch": 2352} {"train_loss": -12.010126113891602, "global_step": 395234, "epoch": 2352} {"train_loss": -11.835775375366211, "global_step": 395235, "epoch": 2352} {"train_loss": -12.268876075744629, "global_step": 395236, "epoch": 2352} {"train_loss": -12.155571937561035, "global_step": 395237, "epoch": 2352} {"train_loss": -12.030435562133789, "global_step": 395238, "epoch": 2352} {"train_loss": -12.233009338378906, "global_step": 395239, "epoch": 2352} {"train_loss": -12.285310745239258, "global_step": 395240, "epoch": 2352} {"train_loss": -12.500423431396484, "global_step": 395241, "epoch": 2352} {"train_loss": -12.098161697387695, "global_step": 395242, "epoch": 2352} {"train_loss": -12.230690002441406, "global_step": 395243, "epoch": 2352} {"train_loss": -12.293155670166016, "global_step": 395244, "epoch": 2352} {"train_loss": -11.888429641723633, "global_step": 395245, "epoch": 2352} {"train_loss": -12.196471214294434, "global_step": 395246, "epoch": 2352} {"train_loss": -12.33453369140625, "global_step": 395247, "epoch": 2352} {"train_loss": -12.399066925048828, "global_step": 395248, "epoch": 2352} {"train_loss": -12.184846878051758, "global_step": 395249, "epoch": 2352} {"train_loss": -12.280876159667969, "global_step": 395250, "epoch": 2352} {"train_loss": -12.402860641479492, "global_step": 395251, "epoch": 2352} {"train_loss": -12.068922996520996, "global_step": 395252, "epoch": 2352} {"train_loss": -12.248733520507812, "global_step": 395253, "epoch": 2352} {"train_loss": -12.187421798706055, "global_step": 395254, "epoch": 2352} {"train_loss": -12.409955024719238, "global_step": 395255, "epoch": 2352} {"train_loss": -12.482975006103516, "global_step": 395256, "epoch": 2352} {"train_loss": -12.11643123626709, "global_step": 395257, "epoch": 2352} {"train_loss": -12.585538864135742, "global_step": 395258, "epoch": 2352} {"train_loss": -12.153375625610352, "global_step": 395259, "epoch": 2352} {"train_loss": -12.549357414245605, "global_step": 395260, "epoch": 2352} {"train_loss": -12.532075881958008, "global_step": 395261, "epoch": 2352} {"train_loss": -12.26759147644043, "global_step": 395262, "epoch": 2352} {"train_loss": -12.376354217529297, "global_step": 395263, "epoch": 2352} {"train_loss": -12.370026588439941, "global_step": 395264, "epoch": 2352} {"train_loss": -12.547151565551758, "global_step": 395265, "epoch": 2352} {"train_loss": -12.501124382019043, "global_step": 395266, "epoch": 2352} {"train_loss": -12.495991706848145, "global_step": 395267, "epoch": 2352} {"train_loss": -12.242246627807617, "global_step": 395268, "epoch": 2352} {"train_loss": -12.555546760559082, "global_step": 395269, "epoch": 2352} {"train_loss": -12.771442413330078, "global_step": 395270, "epoch": 2352} {"train_loss": -12.399813652038574, "global_step": 395271, "epoch": 2352} {"train_loss": -12.377528190612793, "global_step": 395272, "epoch": 2352} {"train_loss": -12.592355728149414, "global_step": 395273, "epoch": 2352} {"train_loss": -12.566191673278809, "global_step": 395274, "epoch": 2352} {"train_loss": -12.526222229003906, "global_step": 395275, "epoch": 2352} {"train_loss": -12.416406631469727, "global_step": 395276, "epoch": 2352} {"train_loss": -12.51350212097168, "global_step": 395277, "epoch": 2352} {"train_loss": -12.72076416015625, "global_step": 395278, "epoch": 2352} {"train_loss": -12.70372200012207, "global_step": 395279, "epoch": 2352} {"train_loss": -12.403440475463867, "global_step": 395280, "epoch": 2352} {"train_loss": -12.614107131958008, "global_step": 395281, "epoch": 2352} {"train_loss": -12.648350715637207, "global_step": 395282, "epoch": 2352} {"train_loss": -12.666217803955078, "global_step": 395283, "epoch": 2352} {"train_loss": -12.3511962890625, "global_step": 395284, "epoch": 2352} {"train_loss": -12.481460571289062, "global_step": 395285, "epoch": 2352} {"train_loss": -12.710031509399414, "global_step": 395286, "epoch": 2352} {"train_loss": -12.551860809326172, "global_step": 395287, "epoch": 2352} {"train_loss": -12.683197975158691, "global_step": 395288, "epoch": 2352} {"train_loss": -12.565855026245117, "global_step": 395289, "epoch": 2352} {"train_loss": -12.530728340148926, "global_step": 395290, "epoch": 2352} {"train_loss": -12.647723197937012, "global_step": 395291, "epoch": 2352} {"train_loss": -12.576864242553711, "global_step": 395292, "epoch": 2352} {"train_loss": -12.815478324890137, "global_step": 395293, "epoch": 2352} {"train_loss": -12.43093490600586, "global_step": 395294, "epoch": 2352} {"train_loss": -12.768983840942383, "global_step": 395295, "epoch": 2352} {"train_loss": -12.868583679199219, "global_step": 395296, "epoch": 2352} {"train_loss": -12.525053024291992, "global_step": 395297, "epoch": 2352} {"train_loss": -12.723796844482422, "global_step": 395298, "epoch": 2352} {"train_loss": -12.916468620300293, "global_step": 395299, "epoch": 2352} {"train_loss": -12.77073860168457, "global_step": 395300, "epoch": 2352} {"train_loss": -12.940762519836426, "global_step": 395301, "epoch": 2352} {"train_loss": -12.453596115112305, "global_step": 395302, "epoch": 2352} {"train_loss": -12.053529029800778, "global_step": 395303, "epoch": 2352, "val_loss": 300452.5625} {"train_loss": -12.542571067810059, "global_step": 395304, "epoch": 2353} {"train_loss": -12.772768020629883, "global_step": 395305, "epoch": 2353} {"train_loss": -12.721556663513184, "global_step": 395306, "epoch": 2353} {"train_loss": -12.74925422668457, "global_step": 395307, "epoch": 2353} {"train_loss": -12.79772663116455, "global_step": 395308, "epoch": 2353} {"train_loss": -12.42448616027832, "global_step": 395309, "epoch": 2353} {"train_loss": -12.695103645324707, "global_step": 395310, "epoch": 2353} {"train_loss": -12.488513946533203, "global_step": 395311, "epoch": 2353} {"train_loss": -12.917442321777344, "global_step": 395312, "epoch": 2353} {"train_loss": -12.734087944030762, "global_step": 395313, "epoch": 2353} {"train_loss": -12.554496765136719, "global_step": 395314, "epoch": 2353} {"train_loss": -12.581711769104004, "global_step": 395315, "epoch": 2353} {"train_loss": -12.284934997558594, "global_step": 395316, "epoch": 2353} {"train_loss": -12.088971138000488, "global_step": 395317, "epoch": 2353} {"train_loss": -12.006091117858887, "global_step": 395318, "epoch": 2353} {"train_loss": -11.070796966552734, "global_step": 395319, "epoch": 2353} {"train_loss": -12.10154914855957, "global_step": 395320, "epoch": 2353} {"train_loss": -11.076530456542969, "global_step": 395321, "epoch": 2353} {"train_loss": -10.949136734008789, "global_step": 395322, "epoch": 2353} {"train_loss": -12.173093795776367, "global_step": 395323, "epoch": 2353} {"train_loss": -10.58582878112793, "global_step": 395324, "epoch": 2353} {"train_loss": -9.595108032226562, "global_step": 395325, "epoch": 2353} {"train_loss": -9.774664878845215, "global_step": 395326, "epoch": 2353} {"train_loss": -10.764759063720703, "global_step": 395327, "epoch": 2353} {"train_loss": -7.703665733337402, "global_step": 395328, "epoch": 2353} {"train_loss": -8.158426284790039, "global_step": 395329, "epoch": 2353} {"train_loss": -7.3827714920043945, "global_step": 395330, "epoch": 2353} {"train_loss": -7.774679183959961, "global_step": 395331, "epoch": 2353} {"train_loss": -7.765403747558594, "global_step": 395332, "epoch": 2353} {"train_loss": -7.514036178588867, "global_step": 395333, "epoch": 2353} {"train_loss": -8.591796875, "global_step": 395334, "epoch": 2353} {"train_loss": -6.4154052734375, "global_step": 395335, "epoch": 2353} {"train_loss": -9.30327033996582, "global_step": 395336, "epoch": 2353} {"train_loss": -7.92523717880249, "global_step": 395337, "epoch": 2353} {"train_loss": -7.019882678985596, "global_step": 395338, "epoch": 2353} {"train_loss": -6.917305946350098, "global_step": 395339, "epoch": 2353} {"train_loss": -7.268180847167969, "global_step": 395340, "epoch": 2353} {"train_loss": -7.658730983734131, "global_step": 395341, "epoch": 2353} {"train_loss": -7.79331111907959, "global_step": 395342, "epoch": 2353} {"train_loss": -8.207160949707031, "global_step": 395343, "epoch": 2353} {"train_loss": -8.29669189453125, "global_step": 395344, "epoch": 2353} {"train_loss": -8.009944915771484, "global_step": 395345, "epoch": 2353} {"train_loss": -8.734138488769531, "global_step": 395346, "epoch": 2353} {"train_loss": -9.11024284362793, "global_step": 395347, "epoch": 2353} {"train_loss": -9.011392593383789, "global_step": 395348, "epoch": 2353} {"train_loss": -8.464935302734375, "global_step": 395349, "epoch": 2353} {"train_loss": -9.13829517364502, "global_step": 395350, "epoch": 2353} {"train_loss": -9.686330795288086, "global_step": 395351, "epoch": 2353} {"train_loss": -9.565473556518555, "global_step": 395352, "epoch": 2353} {"train_loss": -9.64961051940918, "global_step": 395353, "epoch": 2353} {"train_loss": -9.96160888671875, "global_step": 395354, "epoch": 2353} {"train_loss": -10.025705337524414, "global_step": 395355, "epoch": 2353} {"train_loss": -10.607444763183594, "global_step": 395356, "epoch": 2353} {"train_loss": -10.878252029418945, "global_step": 395357, "epoch": 2353} {"train_loss": -10.583152770996094, "global_step": 395358, "epoch": 2353} {"train_loss": -10.633516311645508, "global_step": 395359, "epoch": 2353} {"train_loss": -10.939849853515625, "global_step": 395360, "epoch": 2353} {"train_loss": -11.020514488220215, "global_step": 395361, "epoch": 2353} {"train_loss": -11.23600959777832, "global_step": 395362, "epoch": 2353} {"train_loss": -11.116969108581543, "global_step": 395363, "epoch": 2353} {"train_loss": -11.562067031860352, "global_step": 395364, "epoch": 2353} {"train_loss": -11.354330062866211, "global_step": 395365, "epoch": 2353} {"train_loss": -11.660704612731934, "global_step": 395366, "epoch": 2353} {"train_loss": -11.331470489501953, "global_step": 395367, "epoch": 2353} {"train_loss": -11.862744331359863, "global_step": 395368, "epoch": 2353} {"train_loss": -11.557931900024414, "global_step": 395369, "epoch": 2353} {"train_loss": -12.109125137329102, "global_step": 395370, "epoch": 2353} {"train_loss": -11.381128311157227, "global_step": 395371, "epoch": 2353} {"train_loss": -11.969780921936035, "global_step": 395372, "epoch": 2353} {"train_loss": -11.576486587524414, "global_step": 395373, "epoch": 2353} {"train_loss": -11.93035888671875, "global_step": 395374, "epoch": 2353} {"train_loss": -11.545791625976562, "global_step": 395375, "epoch": 2353} {"train_loss": -11.81143569946289, "global_step": 395376, "epoch": 2353} {"train_loss": -11.52031135559082, "global_step": 395377, "epoch": 2353} {"train_loss": -11.578372955322266, "global_step": 395378, "epoch": 2353} {"train_loss": -11.057088851928711, "global_step": 395379, "epoch": 2353} {"train_loss": -10.982359886169434, "global_step": 395380, "epoch": 2353} {"train_loss": -11.68149185180664, "global_step": 395381, "epoch": 2353} {"train_loss": -11.653596878051758, "global_step": 395382, "epoch": 2353} {"train_loss": -11.925451278686523, "global_step": 395383, "epoch": 2353} {"train_loss": -11.833377838134766, "global_step": 395384, "epoch": 2353} {"train_loss": -11.771594047546387, "global_step": 395385, "epoch": 2353} {"train_loss": -12.067122459411621, "global_step": 395386, "epoch": 2353} {"train_loss": -11.824260711669922, "global_step": 395387, "epoch": 2353} {"train_loss": -12.28253173828125, "global_step": 395388, "epoch": 2353} {"train_loss": -11.748991012573242, "global_step": 395389, "epoch": 2353} {"train_loss": -11.967105865478516, "global_step": 395390, "epoch": 2353} {"train_loss": -11.756991386413574, "global_step": 395391, "epoch": 2353} {"train_loss": -12.047660827636719, "global_step": 395392, "epoch": 2353} {"train_loss": -12.077414512634277, "global_step": 395393, "epoch": 2353} {"train_loss": -12.128595352172852, "global_step": 395394, "epoch": 2353} {"train_loss": -12.080814361572266, "global_step": 395395, "epoch": 2353} {"train_loss": -12.308253288269043, "global_step": 395396, "epoch": 2353} {"train_loss": -12.041000366210938, "global_step": 395397, "epoch": 2353} {"train_loss": -12.262273788452148, "global_step": 395398, "epoch": 2353} {"train_loss": -12.296499252319336, "global_step": 395399, "epoch": 2353} {"train_loss": -12.194355010986328, "global_step": 395400, "epoch": 2353} {"train_loss": -12.160253524780273, "global_step": 395401, "epoch": 2353} {"train_loss": -12.067497253417969, "global_step": 395402, "epoch": 2353} {"train_loss": -12.414710998535156, "global_step": 395403, "epoch": 2353} {"train_loss": -12.047648429870605, "global_step": 395404, "epoch": 2353} {"train_loss": -12.361078262329102, "global_step": 395405, "epoch": 2353} {"train_loss": -11.880422592163086, "global_step": 395406, "epoch": 2353} {"train_loss": -12.11670207977295, "global_step": 395407, "epoch": 2353} {"train_loss": -11.97110366821289, "global_step": 395408, "epoch": 2353} {"train_loss": -12.168542861938477, "global_step": 395409, "epoch": 2353} {"train_loss": -12.279539108276367, "global_step": 395410, "epoch": 2353} {"train_loss": -12.301253318786621, "global_step": 395411, "epoch": 2353} {"train_loss": -12.27596664428711, "global_step": 395412, "epoch": 2353} {"train_loss": -12.524615287780762, "global_step": 395413, "epoch": 2353} {"train_loss": -12.392154693603516, "global_step": 395414, "epoch": 2353} {"train_loss": -12.28889274597168, "global_step": 395415, "epoch": 2353} {"train_loss": -12.42057991027832, "global_step": 395416, "epoch": 2353} {"train_loss": -12.49830436706543, "global_step": 395417, "epoch": 2353} {"train_loss": -12.549829483032227, "global_step": 395418, "epoch": 2353} {"train_loss": -12.581449508666992, "global_step": 395419, "epoch": 2353} {"train_loss": -12.520158767700195, "global_step": 395420, "epoch": 2353} {"train_loss": -12.41435432434082, "global_step": 395421, "epoch": 2353} {"train_loss": -12.542266845703125, "global_step": 395422, "epoch": 2353} {"train_loss": -12.499879837036133, "global_step": 395423, "epoch": 2353} {"train_loss": -12.514501571655273, "global_step": 395424, "epoch": 2353} {"train_loss": -12.644889831542969, "global_step": 395425, "epoch": 2353} {"train_loss": -12.486954689025879, "global_step": 395426, "epoch": 2353} {"train_loss": -12.703937530517578, "global_step": 395427, "epoch": 2353} {"train_loss": -12.386585235595703, "global_step": 395428, "epoch": 2353} {"train_loss": -12.456299781799316, "global_step": 395429, "epoch": 2353} {"train_loss": -12.673834800720215, "global_step": 395430, "epoch": 2353} {"train_loss": -12.310243606567383, "global_step": 395431, "epoch": 2353} {"train_loss": -12.717694282531738, "global_step": 395432, "epoch": 2353} {"train_loss": -12.56603717803955, "global_step": 395433, "epoch": 2353} {"train_loss": -12.801267623901367, "global_step": 395434, "epoch": 2353} {"train_loss": -12.561555862426758, "global_step": 395435, "epoch": 2353} {"train_loss": -12.645668029785156, "global_step": 395436, "epoch": 2353} {"train_loss": -12.792377471923828, "global_step": 395437, "epoch": 2353} {"train_loss": -12.537351608276367, "global_step": 395438, "epoch": 2353} {"train_loss": -12.652595520019531, "global_step": 395439, "epoch": 2353} {"train_loss": -12.498950958251953, "global_step": 395440, "epoch": 2353} {"train_loss": -12.508684158325195, "global_step": 395441, "epoch": 2353} {"train_loss": -12.577787399291992, "global_step": 395442, "epoch": 2353} {"train_loss": -12.68794059753418, "global_step": 395443, "epoch": 2353} {"train_loss": -12.640533447265625, "global_step": 395444, "epoch": 2353} {"train_loss": -12.434289932250977, "global_step": 395445, "epoch": 2353} {"train_loss": -12.618621826171875, "global_step": 395446, "epoch": 2353} {"train_loss": -12.91543960571289, "global_step": 395447, "epoch": 2353} {"train_loss": -12.680891036987305, "global_step": 395448, "epoch": 2353} {"train_loss": -12.45855712890625, "global_step": 395449, "epoch": 2353} {"train_loss": -12.774744033813477, "global_step": 395450, "epoch": 2353} {"train_loss": -12.641254425048828, "global_step": 395451, "epoch": 2353} {"train_loss": -12.439040184020996, "global_step": 395452, "epoch": 2353} {"train_loss": -12.515396118164062, "global_step": 395453, "epoch": 2353} {"train_loss": -12.407280921936035, "global_step": 395454, "epoch": 2353} {"train_loss": -12.51130485534668, "global_step": 395455, "epoch": 2353} {"train_loss": -12.268698692321777, "global_step": 395456, "epoch": 2353} {"train_loss": -12.483695983886719, "global_step": 395457, "epoch": 2353} {"train_loss": -12.462135314941406, "global_step": 395458, "epoch": 2353} {"train_loss": -12.2091064453125, "global_step": 395459, "epoch": 2353} {"train_loss": -11.644047737121582, "global_step": 395460, "epoch": 2353} {"train_loss": -11.285017013549805, "global_step": 395461, "epoch": 2353} {"train_loss": -11.742643356323242, "global_step": 395462, "epoch": 2353} {"train_loss": -12.019197463989258, "global_step": 395463, "epoch": 2353} {"train_loss": -11.120553970336914, "global_step": 395464, "epoch": 2353} {"train_loss": -11.976770401000977, "global_step": 395465, "epoch": 2353} {"train_loss": -11.492085456848145, "global_step": 395466, "epoch": 2353} {"train_loss": -11.48949146270752, "global_step": 395467, "epoch": 2353} {"train_loss": -10.43867015838623, "global_step": 395468, "epoch": 2353} {"train_loss": -11.701322555541992, "global_step": 395469, "epoch": 2353} {"train_loss": -9.010543823242188, "global_step": 395470, "epoch": 2353} {"train_loss": -11.384205945900508, "global_step": 395471, "epoch": 2353, "val_loss": 297783.78125} {"train_loss": -9.280563354492188, "global_step": 395472, "epoch": 2354} {"train_loss": -10.923176765441895, "global_step": 395473, "epoch": 2354} {"train_loss": -10.875985145568848, "global_step": 395474, "epoch": 2354} {"train_loss": -10.880575180053711, "global_step": 395475, "epoch": 2354} {"train_loss": -11.689128875732422, "global_step": 395476, "epoch": 2354} {"train_loss": -10.37668228149414, "global_step": 395477, "epoch": 2354} {"train_loss": -11.504894256591797, "global_step": 395478, "epoch": 2354} {"train_loss": -11.749184608459473, "global_step": 395479, "epoch": 2354} {"train_loss": -11.518184661865234, "global_step": 395480, "epoch": 2354} {"train_loss": -11.942841529846191, "global_step": 395481, "epoch": 2354} {"train_loss": -11.875527381896973, "global_step": 395482, "epoch": 2354} {"train_loss": -11.865999221801758, "global_step": 395483, "epoch": 2354} {"train_loss": -11.920686721801758, "global_step": 395484, "epoch": 2354} {"train_loss": -12.367368698120117, "global_step": 395485, "epoch": 2354} {"train_loss": -11.766607284545898, "global_step": 395486, "epoch": 2354} {"train_loss": -11.909221649169922, "global_step": 395487, "epoch": 2354} {"train_loss": -11.679389953613281, "global_step": 395488, "epoch": 2354} {"train_loss": -11.890260696411133, "global_step": 395489, "epoch": 2354} {"train_loss": -12.324944496154785, "global_step": 395490, "epoch": 2354} {"train_loss": -11.719252586364746, "global_step": 395491, "epoch": 2354} {"train_loss": -11.702583312988281, "global_step": 395492, "epoch": 2354} {"train_loss": -11.868121147155762, "global_step": 395493, "epoch": 2354} {"train_loss": -11.829089164733887, "global_step": 395494, "epoch": 2354} {"train_loss": -12.103355407714844, "global_step": 395495, "epoch": 2354} {"train_loss": -11.914749145507812, "global_step": 395496, "epoch": 2354} {"train_loss": -11.799824714660645, "global_step": 395497, "epoch": 2354} {"train_loss": -12.124160766601562, "global_step": 395498, "epoch": 2354} {"train_loss": -11.65172290802002, "global_step": 395499, "epoch": 2354} {"train_loss": -12.046801567077637, "global_step": 395500, "epoch": 2354} {"train_loss": -11.846390724182129, "global_step": 395501, "epoch": 2354} {"train_loss": -12.0374116897583, "global_step": 395502, "epoch": 2354} {"train_loss": -11.676891326904297, "global_step": 395503, "epoch": 2354} {"train_loss": -12.183612823486328, "global_step": 395504, "epoch": 2354} {"train_loss": -11.693445205688477, "global_step": 395505, "epoch": 2354} {"train_loss": -12.348808288574219, "global_step": 395506, "epoch": 2354} {"train_loss": -11.477624893188477, "global_step": 395507, "epoch": 2354} {"train_loss": -11.697471618652344, "global_step": 395508, "epoch": 2354} {"train_loss": -12.192005157470703, "global_step": 395509, "epoch": 2354} {"train_loss": -11.18073844909668, "global_step": 395510, "epoch": 2354} {"train_loss": -11.154328346252441, "global_step": 395511, "epoch": 2354} {"train_loss": -11.299083709716797, "global_step": 395512, "epoch": 2354} {"train_loss": -12.19705867767334, "global_step": 395513, "epoch": 2354} {"train_loss": -10.56252384185791, "global_step": 395514, "epoch": 2354} {"train_loss": -12.008209228515625, "global_step": 395515, "epoch": 2354} {"train_loss": -10.73869514465332, "global_step": 395516, "epoch": 2354} {"train_loss": -11.564013481140137, "global_step": 395517, "epoch": 2354} {"train_loss": -11.360323905944824, "global_step": 395518, "epoch": 2354} {"train_loss": -11.651338577270508, "global_step": 395519, "epoch": 2354} {"train_loss": -11.874473571777344, "global_step": 395520, "epoch": 2354} {"train_loss": -11.908341407775879, "global_step": 395521, "epoch": 2354} {"train_loss": -12.028226852416992, "global_step": 395522, "epoch": 2354} {"train_loss": -11.586614608764648, "global_step": 395523, "epoch": 2354} {"train_loss": -11.495399475097656, "global_step": 395524, "epoch": 2354} {"train_loss": -12.19074821472168, "global_step": 395525, "epoch": 2354} {"train_loss": -11.47713851928711, "global_step": 395526, "epoch": 2354} {"train_loss": -12.115736961364746, "global_step": 395527, "epoch": 2354} {"train_loss": -11.682157516479492, "global_step": 395528, "epoch": 2354} {"train_loss": -11.907190322875977, "global_step": 395529, "epoch": 2354} {"train_loss": -11.973583221435547, "global_step": 395530, "epoch": 2354} {"train_loss": -11.591270446777344, "global_step": 395531, "epoch": 2354} {"train_loss": -12.188668251037598, "global_step": 395532, "epoch": 2354} {"train_loss": -11.22146987915039, "global_step": 395533, "epoch": 2354} {"train_loss": -12.080045700073242, "global_step": 395534, "epoch": 2354} {"train_loss": -11.264787673950195, "global_step": 395535, "epoch": 2354} {"train_loss": -12.102943420410156, "global_step": 395536, "epoch": 2354} {"train_loss": -11.47219181060791, "global_step": 395537, "epoch": 2354} {"train_loss": -11.588969230651855, "global_step": 395538, "epoch": 2354} {"train_loss": -11.222467422485352, "global_step": 395539, "epoch": 2354} {"train_loss": -11.55604076385498, "global_step": 395540, "epoch": 2354} {"train_loss": -11.405125617980957, "global_step": 395541, "epoch": 2354} {"train_loss": -11.917778015136719, "global_step": 395542, "epoch": 2354} {"train_loss": -11.618630409240723, "global_step": 395543, "epoch": 2354} {"train_loss": -11.591705322265625, "global_step": 395544, "epoch": 2354} {"train_loss": -11.941130638122559, "global_step": 395545, "epoch": 2354} {"train_loss": -11.380586624145508, "global_step": 395546, "epoch": 2354} {"train_loss": -12.330997467041016, "global_step": 395547, "epoch": 2354} {"train_loss": -11.524590492248535, "global_step": 395548, "epoch": 2354} {"train_loss": -12.247360229492188, "global_step": 395549, "epoch": 2354} {"train_loss": -11.754514694213867, "global_step": 395550, "epoch": 2354} {"train_loss": -12.09956169128418, "global_step": 395551, "epoch": 2354} {"train_loss": -12.110025405883789, "global_step": 395552, "epoch": 2354} {"train_loss": -12.123916625976562, "global_step": 395553, "epoch": 2354} {"train_loss": -11.926047325134277, "global_step": 395554, "epoch": 2354} {"train_loss": -12.311849594116211, "global_step": 395555, "epoch": 2354} {"train_loss": -12.40550422668457, "global_step": 395556, "epoch": 2354} {"train_loss": -12.211215019226074, "global_step": 395557, "epoch": 2354} {"train_loss": -12.455092430114746, "global_step": 395558, "epoch": 2354} {"train_loss": -12.393278121948242, "global_step": 395559, "epoch": 2354} {"train_loss": -12.278681755065918, "global_step": 395560, "epoch": 2354} {"train_loss": -12.429849624633789, "global_step": 395561, "epoch": 2354} {"train_loss": -12.535560607910156, "global_step": 395562, "epoch": 2354} {"train_loss": -12.603106498718262, "global_step": 395563, "epoch": 2354} {"train_loss": -12.309085845947266, "global_step": 395564, "epoch": 2354} {"train_loss": -12.114838600158691, "global_step": 395565, "epoch": 2354} {"train_loss": -12.373528480529785, "global_step": 395566, "epoch": 2354} {"train_loss": -12.245841979980469, "global_step": 395567, "epoch": 2354} {"train_loss": -12.529870986938477, "global_step": 395568, "epoch": 2354} {"train_loss": -12.333358764648438, "global_step": 395569, "epoch": 2354} {"train_loss": -12.647369384765625, "global_step": 395570, "epoch": 2354} {"train_loss": -12.319368362426758, "global_step": 395571, "epoch": 2354} {"train_loss": -12.458375930786133, "global_step": 395572, "epoch": 2354} {"train_loss": -12.147393226623535, "global_step": 395573, "epoch": 2354} {"train_loss": -12.508941650390625, "global_step": 395574, "epoch": 2354} {"train_loss": -12.295879364013672, "global_step": 395575, "epoch": 2354} {"train_loss": -12.45669174194336, "global_step": 395576, "epoch": 2354} {"train_loss": -12.51144027709961, "global_step": 395577, "epoch": 2354} {"train_loss": -12.579317092895508, "global_step": 395578, "epoch": 2354} {"train_loss": -12.46631145477295, "global_step": 395579, "epoch": 2354} {"train_loss": -12.137415885925293, "global_step": 395580, "epoch": 2354} {"train_loss": -12.59166145324707, "global_step": 395581, "epoch": 2354} {"train_loss": -12.381978988647461, "global_step": 395582, "epoch": 2354} {"train_loss": -12.253110885620117, "global_step": 395583, "epoch": 2354} {"train_loss": -12.694133758544922, "global_step": 395584, "epoch": 2354} {"train_loss": -12.462736129760742, "global_step": 395585, "epoch": 2354} {"train_loss": -12.24079418182373, "global_step": 395586, "epoch": 2354} {"train_loss": -12.8573579788208, "global_step": 395587, "epoch": 2354} {"train_loss": -12.232004165649414, "global_step": 395588, "epoch": 2354} {"train_loss": -11.851534843444824, "global_step": 395589, "epoch": 2354} {"train_loss": -12.419830322265625, "global_step": 395590, "epoch": 2354} {"train_loss": -12.144774436950684, "global_step": 395591, "epoch": 2354} {"train_loss": -11.975016593933105, "global_step": 395592, "epoch": 2354} {"train_loss": -12.03396224975586, "global_step": 395593, "epoch": 2354} {"train_loss": -12.534940719604492, "global_step": 395594, "epoch": 2354} {"train_loss": -11.338582992553711, "global_step": 395595, "epoch": 2354} {"train_loss": -11.655960083007812, "global_step": 395596, "epoch": 2354} {"train_loss": -12.214747428894043, "global_step": 395597, "epoch": 2354} {"train_loss": -11.469137191772461, "global_step": 395598, "epoch": 2354} {"train_loss": -11.152519226074219, "global_step": 395599, "epoch": 2354} {"train_loss": -12.328420639038086, "global_step": 395600, "epoch": 2354} {"train_loss": -11.420612335205078, "global_step": 395601, "epoch": 2354} {"train_loss": -11.98802375793457, "global_step": 395602, "epoch": 2354} {"train_loss": -12.293794631958008, "global_step": 395603, "epoch": 2354} {"train_loss": -12.204582214355469, "global_step": 395604, "epoch": 2354} {"train_loss": -12.507332801818848, "global_step": 395605, "epoch": 2354} {"train_loss": -12.379892349243164, "global_step": 395606, "epoch": 2354} {"train_loss": -12.508993148803711, "global_step": 395607, "epoch": 2354} {"train_loss": -12.430139541625977, "global_step": 395608, "epoch": 2354} {"train_loss": -12.567560195922852, "global_step": 395609, "epoch": 2354} {"train_loss": -12.328523635864258, "global_step": 395610, "epoch": 2354} {"train_loss": -12.378314971923828, "global_step": 395611, "epoch": 2354} {"train_loss": -12.195619583129883, "global_step": 395612, "epoch": 2354} {"train_loss": -12.238190650939941, "global_step": 395613, "epoch": 2354} {"train_loss": -12.56623363494873, "global_step": 395614, "epoch": 2354} {"train_loss": -12.58367919921875, "global_step": 395615, "epoch": 2354} {"train_loss": -12.456883430480957, "global_step": 395616, "epoch": 2354} {"train_loss": -12.5469331741333, "global_step": 395617, "epoch": 2354} {"train_loss": -12.4765625, "global_step": 395618, "epoch": 2354} {"train_loss": -12.604541778564453, "global_step": 395619, "epoch": 2354} {"train_loss": -12.531193733215332, "global_step": 395620, "epoch": 2354} {"train_loss": -12.475908279418945, "global_step": 395621, "epoch": 2354} {"train_loss": -12.319150924682617, "global_step": 395622, "epoch": 2354} {"train_loss": -12.496223449707031, "global_step": 395623, "epoch": 2354} {"train_loss": -12.323429107666016, "global_step": 395624, "epoch": 2354} {"train_loss": -12.101055145263672, "global_step": 395625, "epoch": 2354} {"train_loss": -12.652318954467773, "global_step": 395626, "epoch": 2354} {"train_loss": -12.362833023071289, "global_step": 395627, "epoch": 2354} {"train_loss": -12.05677604675293, "global_step": 395628, "epoch": 2354} {"train_loss": -11.74879264831543, "global_step": 395629, "epoch": 2354} {"train_loss": -11.874704360961914, "global_step": 395630, "epoch": 2354} {"train_loss": -12.225374221801758, "global_step": 395631, "epoch": 2354} {"train_loss": -11.689678192138672, "global_step": 395632, "epoch": 2354} {"train_loss": -12.45660400390625, "global_step": 395633, "epoch": 2354} {"train_loss": -11.832907676696777, "global_step": 395634, "epoch": 2354} {"train_loss": -12.037322998046875, "global_step": 395635, "epoch": 2354} {"train_loss": -11.251304626464844, "global_step": 395636, "epoch": 2354} {"train_loss": -12.317181587219238, "global_step": 395637, "epoch": 2354} {"train_loss": -11.114217758178711, "global_step": 395638, "epoch": 2354} {"train_loss": -11.97664559455145, "global_step": 395639, "epoch": 2354, "val_loss": 300477.71875} {"train_loss": -11.371562004089355, "global_step": 395640, "epoch": 2355} {"train_loss": -12.320883750915527, "global_step": 395641, "epoch": 2355} {"train_loss": -11.674044609069824, "global_step": 395642, "epoch": 2355} {"train_loss": -11.395637512207031, "global_step": 395643, "epoch": 2355} {"train_loss": -12.088545799255371, "global_step": 395644, "epoch": 2355} {"train_loss": -12.218072891235352, "global_step": 395645, "epoch": 2355} {"train_loss": -11.531208038330078, "global_step": 395646, "epoch": 2355} {"train_loss": -12.260218620300293, "global_step": 395647, "epoch": 2355} {"train_loss": -12.095882415771484, "global_step": 395648, "epoch": 2355} {"train_loss": -11.968210220336914, "global_step": 395649, "epoch": 2355} {"train_loss": -11.844745635986328, "global_step": 395650, "epoch": 2355} {"train_loss": -11.317956924438477, "global_step": 395651, "epoch": 2355} {"train_loss": -11.963687896728516, "global_step": 395652, "epoch": 2355} {"train_loss": -11.630916595458984, "global_step": 395653, "epoch": 2355} {"train_loss": -12.367258071899414, "global_step": 395654, "epoch": 2355} {"train_loss": -11.879446983337402, "global_step": 395655, "epoch": 2355} {"train_loss": -12.37578296661377, "global_step": 395656, "epoch": 2355} {"train_loss": -11.988639831542969, "global_step": 395657, "epoch": 2355} {"train_loss": -11.29681396484375, "global_step": 395658, "epoch": 2355} {"train_loss": -10.449651718139648, "global_step": 395659, "epoch": 2355} {"train_loss": -11.853654861450195, "global_step": 395660, "epoch": 2355} {"train_loss": -10.114452362060547, "global_step": 395661, "epoch": 2355} {"train_loss": -10.054313659667969, "global_step": 395662, "epoch": 2355} {"train_loss": -9.987602233886719, "global_step": 395663, "epoch": 2355} {"train_loss": -11.929776191711426, "global_step": 395664, "epoch": 2355} {"train_loss": -9.875673294067383, "global_step": 395665, "epoch": 2355} {"train_loss": -9.778236389160156, "global_step": 395666, "epoch": 2355} {"train_loss": -11.234670639038086, "global_step": 395667, "epoch": 2355} {"train_loss": -9.998113632202148, "global_step": 395668, "epoch": 2355} {"train_loss": -10.39315128326416, "global_step": 395669, "epoch": 2355} {"train_loss": -10.70648193359375, "global_step": 395670, "epoch": 2355} {"train_loss": -10.492839813232422, "global_step": 395671, "epoch": 2355} {"train_loss": -11.647114753723145, "global_step": 395672, "epoch": 2355} {"train_loss": -11.253393173217773, "global_step": 395673, "epoch": 2355} {"train_loss": -11.631248474121094, "global_step": 395674, "epoch": 2355} {"train_loss": -12.014485359191895, "global_step": 395675, "epoch": 2355} {"train_loss": -11.854008674621582, "global_step": 395676, "epoch": 2355} {"train_loss": -11.956443786621094, "global_step": 395677, "epoch": 2355} {"train_loss": -11.908346176147461, "global_step": 395678, "epoch": 2355} {"train_loss": -11.794595718383789, "global_step": 395679, "epoch": 2355} {"train_loss": -11.277013778686523, "global_step": 395680, "epoch": 2355} {"train_loss": -12.191876411437988, "global_step": 395681, "epoch": 2355} {"train_loss": -11.379626274108887, "global_step": 395682, "epoch": 2355} {"train_loss": -12.081138610839844, "global_step": 395683, "epoch": 2355} {"train_loss": -11.804649353027344, "global_step": 395684, "epoch": 2355} {"train_loss": -11.879753112792969, "global_step": 395685, "epoch": 2355} {"train_loss": -12.423839569091797, "global_step": 395686, "epoch": 2355} {"train_loss": -11.995776176452637, "global_step": 395687, "epoch": 2355} {"train_loss": -12.393580436706543, "global_step": 395688, "epoch": 2355} {"train_loss": -12.310694694519043, "global_step": 395689, "epoch": 2355} {"train_loss": -12.251813888549805, "global_step": 395690, "epoch": 2355} {"train_loss": -12.325236320495605, "global_step": 395691, "epoch": 2355} {"train_loss": -12.218941688537598, "global_step": 395692, "epoch": 2355} {"train_loss": -12.339849472045898, "global_step": 395693, "epoch": 2355} {"train_loss": -12.293807983398438, "global_step": 395694, "epoch": 2355} {"train_loss": -12.390869140625, "global_step": 395695, "epoch": 2355} {"train_loss": -12.302465438842773, "global_step": 395696, "epoch": 2355} {"train_loss": -12.732141494750977, "global_step": 395697, "epoch": 2355} {"train_loss": -12.27072525024414, "global_step": 395698, "epoch": 2355} {"train_loss": -12.573932647705078, "global_step": 395699, "epoch": 2355} {"train_loss": -12.45616340637207, "global_step": 395700, "epoch": 2355} {"train_loss": -12.203078269958496, "global_step": 395701, "epoch": 2355} {"train_loss": -12.398165702819824, "global_step": 395702, "epoch": 2355} {"train_loss": -12.20060920715332, "global_step": 395703, "epoch": 2355} {"train_loss": -12.27279281616211, "global_step": 395704, "epoch": 2355} {"train_loss": -12.475170135498047, "global_step": 395705, "epoch": 2355} {"train_loss": -12.343003273010254, "global_step": 395706, "epoch": 2355} {"train_loss": -12.356542587280273, "global_step": 395707, "epoch": 2355} {"train_loss": -12.263204574584961, "global_step": 395708, "epoch": 2355} {"train_loss": -12.653895378112793, "global_step": 395709, "epoch": 2355} {"train_loss": -12.264949798583984, "global_step": 395710, "epoch": 2355} {"train_loss": -12.442176818847656, "global_step": 395711, "epoch": 2355} {"train_loss": -12.160362243652344, "global_step": 395712, "epoch": 2355} {"train_loss": -12.397636413574219, "global_step": 395713, "epoch": 2355} {"train_loss": -12.571366310119629, "global_step": 395714, "epoch": 2355} {"train_loss": -12.637911796569824, "global_step": 395715, "epoch": 2355} {"train_loss": -12.398024559020996, "global_step": 395716, "epoch": 2355} {"train_loss": -12.439925193786621, "global_step": 395717, "epoch": 2355} {"train_loss": -12.662172317504883, "global_step": 395718, "epoch": 2355} {"train_loss": -12.478461265563965, "global_step": 395719, "epoch": 2355} {"train_loss": -12.706623077392578, "global_step": 395720, "epoch": 2355} {"train_loss": -12.716910362243652, "global_step": 395721, "epoch": 2355} {"train_loss": -12.574712753295898, "global_step": 395722, "epoch": 2355} {"train_loss": -12.633623123168945, "global_step": 395723, "epoch": 2355} {"train_loss": -12.425918579101562, "global_step": 395724, "epoch": 2355} {"train_loss": -12.526152610778809, "global_step": 395725, "epoch": 2355} {"train_loss": -12.641895294189453, "global_step": 395726, "epoch": 2355} {"train_loss": -12.723026275634766, "global_step": 395727, "epoch": 2355} {"train_loss": -12.779565811157227, "global_step": 395728, "epoch": 2355} {"train_loss": -12.6708984375, "global_step": 395729, "epoch": 2355} {"train_loss": -12.567008018493652, "global_step": 395730, "epoch": 2355} {"train_loss": -12.294939994812012, "global_step": 395731, "epoch": 2355} {"train_loss": -12.512711524963379, "global_step": 395732, "epoch": 2355} {"train_loss": -12.663471221923828, "global_step": 395733, "epoch": 2355} {"train_loss": -12.311628341674805, "global_step": 395734, "epoch": 2355} {"train_loss": -12.130115509033203, "global_step": 395735, "epoch": 2355} {"train_loss": -12.149789810180664, "global_step": 395736, "epoch": 2355} {"train_loss": -12.386043548583984, "global_step": 395737, "epoch": 2355} {"train_loss": -12.082694053649902, "global_step": 395738, "epoch": 2355} {"train_loss": -12.189254760742188, "global_step": 395739, "epoch": 2355} {"train_loss": -12.096138954162598, "global_step": 395740, "epoch": 2355} {"train_loss": -11.936141967773438, "global_step": 395741, "epoch": 2355} {"train_loss": -12.016136169433594, "global_step": 395742, "epoch": 2355} {"train_loss": -11.504283905029297, "global_step": 395743, "epoch": 2355} {"train_loss": -11.086536407470703, "global_step": 395744, "epoch": 2355} {"train_loss": -12.081194877624512, "global_step": 395745, "epoch": 2355} {"train_loss": -11.830172538757324, "global_step": 395746, "epoch": 2355} {"train_loss": -10.899150848388672, "global_step": 395747, "epoch": 2355} {"train_loss": -11.690189361572266, "global_step": 395748, "epoch": 2355} {"train_loss": -12.087295532226562, "global_step": 395749, "epoch": 2355} {"train_loss": -11.42758846282959, "global_step": 395750, "epoch": 2355} {"train_loss": -12.195356369018555, "global_step": 395751, "epoch": 2355} {"train_loss": -11.582204818725586, "global_step": 395752, "epoch": 2355} {"train_loss": -11.439675331115723, "global_step": 395753, "epoch": 2355} {"train_loss": -12.146437644958496, "global_step": 395754, "epoch": 2355} {"train_loss": -12.159802436828613, "global_step": 395755, "epoch": 2355} {"train_loss": -12.127090454101562, "global_step": 395756, "epoch": 2355} {"train_loss": -12.320600509643555, "global_step": 395757, "epoch": 2355} {"train_loss": -11.883496284484863, "global_step": 395758, "epoch": 2355} {"train_loss": -12.098152160644531, "global_step": 395759, "epoch": 2355} {"train_loss": -12.394248962402344, "global_step": 395760, "epoch": 2355} {"train_loss": -12.207891464233398, "global_step": 395761, "epoch": 2355} {"train_loss": -12.259723663330078, "global_step": 395762, "epoch": 2355} {"train_loss": -12.217390060424805, "global_step": 395763, "epoch": 2355} {"train_loss": -12.362594604492188, "global_step": 395764, "epoch": 2355} {"train_loss": -12.650979042053223, "global_step": 395765, "epoch": 2355} {"train_loss": -12.37332534790039, "global_step": 395766, "epoch": 2355} {"train_loss": -12.320638656616211, "global_step": 395767, "epoch": 2355} {"train_loss": -12.317983627319336, "global_step": 395768, "epoch": 2355} {"train_loss": -12.506589889526367, "global_step": 395769, "epoch": 2355} {"train_loss": -12.112052917480469, "global_step": 395770, "epoch": 2355} {"train_loss": -12.381474494934082, "global_step": 395771, "epoch": 2355} {"train_loss": -11.943552017211914, "global_step": 395772, "epoch": 2355} {"train_loss": -12.171649932861328, "global_step": 395773, "epoch": 2355} {"train_loss": -11.90945053100586, "global_step": 395774, "epoch": 2355} {"train_loss": -12.05331039428711, "global_step": 395775, "epoch": 2355} {"train_loss": -11.462559700012207, "global_step": 395776, "epoch": 2355} {"train_loss": -11.773162841796875, "global_step": 395777, "epoch": 2355} {"train_loss": -11.224634170532227, "global_step": 395778, "epoch": 2355} {"train_loss": -12.13438892364502, "global_step": 395779, "epoch": 2355} {"train_loss": -12.099815368652344, "global_step": 395780, "epoch": 2355} {"train_loss": -11.369973182678223, "global_step": 395781, "epoch": 2355} {"train_loss": -10.813950538635254, "global_step": 395782, "epoch": 2355} {"train_loss": -10.342353820800781, "global_step": 395783, "epoch": 2355} {"train_loss": -12.200414657592773, "global_step": 395784, "epoch": 2355} {"train_loss": -10.82468318939209, "global_step": 395785, "epoch": 2355} {"train_loss": -10.993906021118164, "global_step": 395786, "epoch": 2355} {"train_loss": -10.502033233642578, "global_step": 395787, "epoch": 2355} {"train_loss": -10.371149063110352, "global_step": 395788, "epoch": 2355} {"train_loss": -11.518322944641113, "global_step": 395789, "epoch": 2355} {"train_loss": -10.617044448852539, "global_step": 395790, "epoch": 2355} {"train_loss": -11.475016593933105, "global_step": 395791, "epoch": 2355} {"train_loss": -11.537040710449219, "global_step": 395792, "epoch": 2355} {"train_loss": -11.878929138183594, "global_step": 395793, "epoch": 2355} {"train_loss": -11.796083450317383, "global_step": 395794, "epoch": 2355} {"train_loss": -11.829248428344727, "global_step": 395795, "epoch": 2355} {"train_loss": -10.983050346374512, "global_step": 395796, "epoch": 2355} {"train_loss": -11.965051651000977, "global_step": 395797, "epoch": 2355} {"train_loss": -11.90060806274414, "global_step": 395798, "epoch": 2355} {"train_loss": -12.010894775390625, "global_step": 395799, "epoch": 2355} {"train_loss": -12.171771049499512, "global_step": 395800, "epoch": 2355} {"train_loss": -11.668232917785645, "global_step": 395801, "epoch": 2355} {"train_loss": -12.0974760055542, "global_step": 395802, "epoch": 2355} {"train_loss": -12.078385353088379, "global_step": 395803, "epoch": 2355} {"train_loss": -11.928492546081543, "global_step": 395804, "epoch": 2355} {"train_loss": -12.349985122680664, "global_step": 395805, "epoch": 2355} {"train_loss": -11.853379249572754, "global_step": 395806, "epoch": 2355} {"train_loss": -11.906605413981847, "global_step": 395807, "epoch": 2355, "val_loss": 296995.71875, "train_action_mse_error": 1.5186090469360352} {"train_loss": -12.246933937072754, "global_step": 395808, "epoch": 2356} {"train_loss": -12.285028457641602, "global_step": 395809, "epoch": 2356} {"train_loss": -12.169206619262695, "global_step": 395810, "epoch": 2356} {"train_loss": -12.008806228637695, "global_step": 395811, "epoch": 2356} {"train_loss": -12.115412712097168, "global_step": 395812, "epoch": 2356} {"train_loss": -12.205804824829102, "global_step": 395813, "epoch": 2356} {"train_loss": -12.305521011352539, "global_step": 395814, "epoch": 2356} {"train_loss": -12.354423522949219, "global_step": 395815, "epoch": 2356} {"train_loss": -12.489952087402344, "global_step": 395816, "epoch": 2356} {"train_loss": -12.518865585327148, "global_step": 395817, "epoch": 2356} {"train_loss": -12.513567924499512, "global_step": 395818, "epoch": 2356} {"train_loss": -12.539169311523438, "global_step": 395819, "epoch": 2356} {"train_loss": -12.425195693969727, "global_step": 395820, "epoch": 2356} {"train_loss": -12.387744903564453, "global_step": 395821, "epoch": 2356} {"train_loss": -12.076390266418457, "global_step": 395822, "epoch": 2356} {"train_loss": -12.581838607788086, "global_step": 395823, "epoch": 2356} {"train_loss": -12.366044998168945, "global_step": 395824, "epoch": 2356} {"train_loss": -12.488397598266602, "global_step": 395825, "epoch": 2356} {"train_loss": -12.308494567871094, "global_step": 395826, "epoch": 2356} {"train_loss": -12.394781112670898, "global_step": 395827, "epoch": 2356} {"train_loss": -12.102012634277344, "global_step": 395828, "epoch": 2356} {"train_loss": -12.599583625793457, "global_step": 395829, "epoch": 2356} {"train_loss": -12.183208465576172, "global_step": 395830, "epoch": 2356} {"train_loss": -12.667119979858398, "global_step": 395831, "epoch": 2356} {"train_loss": -12.29429817199707, "global_step": 395832, "epoch": 2356} {"train_loss": -12.609986305236816, "global_step": 395833, "epoch": 2356} {"train_loss": -12.561437606811523, "global_step": 395834, "epoch": 2356} {"train_loss": -12.503231048583984, "global_step": 395835, "epoch": 2356} {"train_loss": -12.66283893585205, "global_step": 395836, "epoch": 2356} {"train_loss": -12.49209976196289, "global_step": 395837, "epoch": 2356} {"train_loss": -12.34375, "global_step": 395838, "epoch": 2356} {"train_loss": -12.482671737670898, "global_step": 395839, "epoch": 2356} {"train_loss": -12.436178207397461, "global_step": 395840, "epoch": 2356} {"train_loss": -12.335124969482422, "global_step": 395841, "epoch": 2356} {"train_loss": -12.245732307434082, "global_step": 395842, "epoch": 2356} {"train_loss": -12.449037551879883, "global_step": 395843, "epoch": 2356} {"train_loss": -12.000980377197266, "global_step": 395844, "epoch": 2356} {"train_loss": -11.952119827270508, "global_step": 395845, "epoch": 2356} {"train_loss": -12.173568725585938, "global_step": 395846, "epoch": 2356} {"train_loss": -11.734114646911621, "global_step": 395847, "epoch": 2356} {"train_loss": -11.890497207641602, "global_step": 395848, "epoch": 2356} {"train_loss": -12.198768615722656, "global_step": 395849, "epoch": 2356} {"train_loss": -11.90960693359375, "global_step": 395850, "epoch": 2356} {"train_loss": -11.63078498840332, "global_step": 395851, "epoch": 2356} {"train_loss": -12.400226593017578, "global_step": 395852, "epoch": 2356} {"train_loss": -11.236410140991211, "global_step": 395853, "epoch": 2356} {"train_loss": -11.827754020690918, "global_step": 395854, "epoch": 2356} {"train_loss": -12.062291145324707, "global_step": 395855, "epoch": 2356} {"train_loss": -11.742467880249023, "global_step": 395856, "epoch": 2356} {"train_loss": -11.481260299682617, "global_step": 395857, "epoch": 2356} {"train_loss": -12.071942329406738, "global_step": 395858, "epoch": 2356} {"train_loss": -11.669906616210938, "global_step": 395859, "epoch": 2356} {"train_loss": -12.087843894958496, "global_step": 395860, "epoch": 2356} {"train_loss": -11.69033432006836, "global_step": 395861, "epoch": 2356} {"train_loss": -12.399953842163086, "global_step": 395862, "epoch": 2356} {"train_loss": -11.853744506835938, "global_step": 395863, "epoch": 2356} {"train_loss": -12.410239219665527, "global_step": 395864, "epoch": 2356} {"train_loss": -11.224649429321289, "global_step": 395865, "epoch": 2356} {"train_loss": -12.10725212097168, "global_step": 395866, "epoch": 2356} {"train_loss": -12.206562995910645, "global_step": 395867, "epoch": 2356} {"train_loss": -12.310492515563965, "global_step": 395868, "epoch": 2356} {"train_loss": -12.225241661071777, "global_step": 395869, "epoch": 2356} {"train_loss": -12.37999153137207, "global_step": 395870, "epoch": 2356} {"train_loss": -12.120757102966309, "global_step": 395871, "epoch": 2356} {"train_loss": -11.873249053955078, "global_step": 395872, "epoch": 2356} {"train_loss": -12.133321762084961, "global_step": 395873, "epoch": 2356} {"train_loss": -12.290653228759766, "global_step": 395874, "epoch": 2356} {"train_loss": -12.435188293457031, "global_step": 395875, "epoch": 2356} {"train_loss": -12.175710678100586, "global_step": 395876, "epoch": 2356} {"train_loss": -12.367431640625, "global_step": 395877, "epoch": 2356} {"train_loss": -12.460997581481934, "global_step": 395878, "epoch": 2356} {"train_loss": -12.502570152282715, "global_step": 395879, "epoch": 2356} {"train_loss": -12.473419189453125, "global_step": 395880, "epoch": 2356} {"train_loss": -12.387064933776855, "global_step": 395881, "epoch": 2356} {"train_loss": -12.386711120605469, "global_step": 395882, "epoch": 2356} {"train_loss": -12.451716423034668, "global_step": 395883, "epoch": 2356} {"train_loss": -12.739415168762207, "global_step": 395884, "epoch": 2356} {"train_loss": -12.409764289855957, "global_step": 395885, "epoch": 2356} {"train_loss": -12.554573059082031, "global_step": 395886, "epoch": 2356} {"train_loss": -12.585371017456055, "global_step": 395887, "epoch": 2356} {"train_loss": -12.345091819763184, "global_step": 395888, "epoch": 2356} {"train_loss": -12.291366577148438, "global_step": 395889, "epoch": 2356} {"train_loss": -12.482928276062012, "global_step": 395890, "epoch": 2356} {"train_loss": -12.500873565673828, "global_step": 395891, "epoch": 2356} {"train_loss": -12.637025833129883, "global_step": 395892, "epoch": 2356} {"train_loss": -12.496161460876465, "global_step": 395893, "epoch": 2356} {"train_loss": -11.996559143066406, "global_step": 395894, "epoch": 2356} {"train_loss": -12.456745147705078, "global_step": 395895, "epoch": 2356} {"train_loss": -12.451981544494629, "global_step": 395896, "epoch": 2356} {"train_loss": -12.561906814575195, "global_step": 395897, "epoch": 2356} {"train_loss": -12.175904273986816, "global_step": 395898, "epoch": 2356} {"train_loss": -12.018363952636719, "global_step": 395899, "epoch": 2356} {"train_loss": -12.041425704956055, "global_step": 395900, "epoch": 2356} {"train_loss": -12.359018325805664, "global_step": 395901, "epoch": 2356} {"train_loss": -11.776508331298828, "global_step": 395902, "epoch": 2356} {"train_loss": -11.527969360351562, "global_step": 395903, "epoch": 2356} {"train_loss": -12.00897216796875, "global_step": 395904, "epoch": 2356} {"train_loss": -12.068294525146484, "global_step": 395905, "epoch": 2356} {"train_loss": -11.7656888961792, "global_step": 395906, "epoch": 2356} {"train_loss": -12.639060974121094, "global_step": 395907, "epoch": 2356} {"train_loss": -12.303129196166992, "global_step": 395908, "epoch": 2356} {"train_loss": -11.857020378112793, "global_step": 395909, "epoch": 2356} {"train_loss": -12.241870880126953, "global_step": 395910, "epoch": 2356} {"train_loss": -11.730122566223145, "global_step": 395911, "epoch": 2356} {"train_loss": -12.039911270141602, "global_step": 395912, "epoch": 2356} {"train_loss": -12.34526252746582, "global_step": 395913, "epoch": 2356} {"train_loss": -12.445060729980469, "global_step": 395914, "epoch": 2356} {"train_loss": -11.385931015014648, "global_step": 395915, "epoch": 2356} {"train_loss": -11.562458038330078, "global_step": 395916, "epoch": 2356} {"train_loss": -11.95663070678711, "global_step": 395917, "epoch": 2356} {"train_loss": -12.180763244628906, "global_step": 395918, "epoch": 2356} {"train_loss": -11.216808319091797, "global_step": 395919, "epoch": 2356} {"train_loss": -12.347461700439453, "global_step": 395920, "epoch": 2356} {"train_loss": -11.081676483154297, "global_step": 395921, "epoch": 2356} {"train_loss": -11.768067359924316, "global_step": 395922, "epoch": 2356} {"train_loss": -11.512710571289062, "global_step": 395923, "epoch": 2356} {"train_loss": -11.523326873779297, "global_step": 395924, "epoch": 2356} {"train_loss": -11.015707969665527, "global_step": 395925, "epoch": 2356} {"train_loss": -11.724644660949707, "global_step": 395926, "epoch": 2356} {"train_loss": -11.27742862701416, "global_step": 395927, "epoch": 2356} {"train_loss": -11.295014381408691, "global_step": 395928, "epoch": 2356} {"train_loss": -10.937931060791016, "global_step": 395929, "epoch": 2356} {"train_loss": -11.262396812438965, "global_step": 395930, "epoch": 2356} {"train_loss": -11.431745529174805, "global_step": 395931, "epoch": 2356} {"train_loss": -10.858039855957031, "global_step": 395932, "epoch": 2356} {"train_loss": -11.622541427612305, "global_step": 395933, "epoch": 2356} {"train_loss": -10.553230285644531, "global_step": 395934, "epoch": 2356} {"train_loss": -10.736238479614258, "global_step": 395935, "epoch": 2356} {"train_loss": -11.496614456176758, "global_step": 395936, "epoch": 2356} {"train_loss": -10.438185691833496, "global_step": 395937, "epoch": 2356} {"train_loss": -11.627531051635742, "global_step": 395938, "epoch": 2356} {"train_loss": -10.858939170837402, "global_step": 395939, "epoch": 2356} {"train_loss": -11.402313232421875, "global_step": 395940, "epoch": 2356} {"train_loss": -11.482139587402344, "global_step": 395941, "epoch": 2356} {"train_loss": -11.19023323059082, "global_step": 395942, "epoch": 2356} {"train_loss": -9.934102058410645, "global_step": 395943, "epoch": 2356} {"train_loss": -11.707727432250977, "global_step": 395944, "epoch": 2356} {"train_loss": -10.90804672241211, "global_step": 395945, "epoch": 2356} {"train_loss": -12.063055038452148, "global_step": 395946, "epoch": 2356} {"train_loss": -11.554859161376953, "global_step": 395947, "epoch": 2356} {"train_loss": -11.994829177856445, "global_step": 395948, "epoch": 2356} {"train_loss": -11.825067520141602, "global_step": 395949, "epoch": 2356} {"train_loss": -11.631858825683594, "global_step": 395950, "epoch": 2356} {"train_loss": -12.153945922851562, "global_step": 395951, "epoch": 2356} {"train_loss": -11.567163467407227, "global_step": 395952, "epoch": 2356} {"train_loss": -11.606159210205078, "global_step": 395953, "epoch": 2356} {"train_loss": -12.027902603149414, "global_step": 395954, "epoch": 2356} {"train_loss": -11.90072250366211, "global_step": 395955, "epoch": 2356} {"train_loss": -12.436747550964355, "global_step": 395956, "epoch": 2356} {"train_loss": -11.867120742797852, "global_step": 395957, "epoch": 2356} {"train_loss": -12.21512222290039, "global_step": 395958, "epoch": 2356} {"train_loss": -11.776633262634277, "global_step": 395959, "epoch": 2356} {"train_loss": -12.0130615234375, "global_step": 395960, "epoch": 2356} {"train_loss": -12.000997543334961, "global_step": 395961, "epoch": 2356} {"train_loss": -12.132696151733398, "global_step": 395962, "epoch": 2356} {"train_loss": -12.271505355834961, "global_step": 395963, "epoch": 2356} {"train_loss": -12.142557144165039, "global_step": 395964, "epoch": 2356} {"train_loss": -12.414003372192383, "global_step": 395965, "epoch": 2356} {"train_loss": -12.010926246643066, "global_step": 395966, "epoch": 2356} {"train_loss": -11.959329605102539, "global_step": 395967, "epoch": 2356} {"train_loss": -12.211482048034668, "global_step": 395968, "epoch": 2356} {"train_loss": -12.36843204498291, "global_step": 395969, "epoch": 2356} {"train_loss": -12.318136215209961, "global_step": 395970, "epoch": 2356} {"train_loss": -12.509575843811035, "global_step": 395971, "epoch": 2356} {"train_loss": -12.118223190307617, "global_step": 395972, "epoch": 2356} {"train_loss": -12.273810386657715, "global_step": 395973, "epoch": 2356} {"train_loss": -12.279327392578125, "global_step": 395974, "epoch": 2356} {"train_loss": -12.029855614616757, "global_step": 395975, "epoch": 2356, "val_loss": 302365.84375} {"train_loss": -12.310720443725586, "global_step": 395976, "epoch": 2357} {"train_loss": -12.203845977783203, "global_step": 395977, "epoch": 2357} {"train_loss": -12.559650421142578, "global_step": 395978, "epoch": 2357} {"train_loss": -12.095000267028809, "global_step": 395979, "epoch": 2357} {"train_loss": -12.31471061706543, "global_step": 395980, "epoch": 2357} {"train_loss": -12.373613357543945, "global_step": 395981, "epoch": 2357} {"train_loss": -12.447568893432617, "global_step": 395982, "epoch": 2357} {"train_loss": -12.555562019348145, "global_step": 395983, "epoch": 2357} {"train_loss": -12.535248756408691, "global_step": 395984, "epoch": 2357} {"train_loss": -12.253726959228516, "global_step": 395985, "epoch": 2357} {"train_loss": -12.674201965332031, "global_step": 395986, "epoch": 2357} {"train_loss": -12.450050354003906, "global_step": 395987, "epoch": 2357} {"train_loss": -12.335256576538086, "global_step": 395988, "epoch": 2357} {"train_loss": -12.538220405578613, "global_step": 395989, "epoch": 2357} {"train_loss": -12.286670684814453, "global_step": 395990, "epoch": 2357} {"train_loss": -12.801437377929688, "global_step": 395991, "epoch": 2357} {"train_loss": -12.163534164428711, "global_step": 395992, "epoch": 2357} {"train_loss": -12.599994659423828, "global_step": 395993, "epoch": 2357} {"train_loss": -12.497342109680176, "global_step": 395994, "epoch": 2357} {"train_loss": -12.350441932678223, "global_step": 395995, "epoch": 2357} {"train_loss": -12.627306938171387, "global_step": 395996, "epoch": 2357} {"train_loss": -12.592517852783203, "global_step": 395997, "epoch": 2357} {"train_loss": -12.576122283935547, "global_step": 395998, "epoch": 2357} {"train_loss": -12.70285415649414, "global_step": 395999, "epoch": 2357} {"train_loss": -12.594841957092285, "global_step": 396000, "epoch": 2357} {"train_loss": -12.487266540527344, "global_step": 396001, "epoch": 2357} {"train_loss": -12.433645248413086, "global_step": 396002, "epoch": 2357} {"train_loss": -12.666961669921875, "global_step": 396003, "epoch": 2357} {"train_loss": -12.213251113891602, "global_step": 396004, "epoch": 2357} {"train_loss": -12.259998321533203, "global_step": 396005, "epoch": 2357} {"train_loss": -12.670055389404297, "global_step": 396006, "epoch": 2357} {"train_loss": -12.153225898742676, "global_step": 396007, "epoch": 2357} {"train_loss": -12.353511810302734, "global_step": 396008, "epoch": 2357} {"train_loss": -12.60075855255127, "global_step": 396009, "epoch": 2357} {"train_loss": -12.862494468688965, "global_step": 396010, "epoch": 2357} {"train_loss": -12.52086067199707, "global_step": 396011, "epoch": 2357} {"train_loss": -12.308847427368164, "global_step": 396012, "epoch": 2357} {"train_loss": -12.867982864379883, "global_step": 396013, "epoch": 2357} {"train_loss": -12.556076049804688, "global_step": 396014, "epoch": 2357} {"train_loss": -12.5920991897583, "global_step": 396015, "epoch": 2357} {"train_loss": -12.310310363769531, "global_step": 396016, "epoch": 2357} {"train_loss": -12.50495433807373, "global_step": 396017, "epoch": 2357} {"train_loss": -12.247636795043945, "global_step": 396018, "epoch": 2357} {"train_loss": -12.570906639099121, "global_step": 396019, "epoch": 2357} {"train_loss": -12.320718765258789, "global_step": 396020, "epoch": 2357} {"train_loss": -11.937763214111328, "global_step": 396021, "epoch": 2357} {"train_loss": -11.854942321777344, "global_step": 396022, "epoch": 2357} {"train_loss": -11.09262752532959, "global_step": 396023, "epoch": 2357} {"train_loss": -11.400347709655762, "global_step": 396024, "epoch": 2357} {"train_loss": -11.639681816101074, "global_step": 396025, "epoch": 2357} {"train_loss": -11.27577018737793, "global_step": 396026, "epoch": 2357} {"train_loss": -11.442940711975098, "global_step": 396027, "epoch": 2357} {"train_loss": -11.835275650024414, "global_step": 396028, "epoch": 2357} {"train_loss": -10.470056533813477, "global_step": 396029, "epoch": 2357} {"train_loss": -11.656695365905762, "global_step": 396030, "epoch": 2357} {"train_loss": -10.401272773742676, "global_step": 396031, "epoch": 2357} {"train_loss": -9.770479202270508, "global_step": 396032, "epoch": 2357} {"train_loss": -11.168712615966797, "global_step": 396033, "epoch": 2357} {"train_loss": -9.779008865356445, "global_step": 396034, "epoch": 2357} {"train_loss": -9.959611892700195, "global_step": 396035, "epoch": 2357} {"train_loss": -9.970467567443848, "global_step": 396036, "epoch": 2357} {"train_loss": -10.468300819396973, "global_step": 396037, "epoch": 2357} {"train_loss": -10.910581588745117, "global_step": 396038, "epoch": 2357} {"train_loss": -10.832342147827148, "global_step": 396039, "epoch": 2357} {"train_loss": -10.38192367553711, "global_step": 396040, "epoch": 2357} {"train_loss": -10.672118186950684, "global_step": 396041, "epoch": 2357} {"train_loss": -10.069934844970703, "global_step": 396042, "epoch": 2357} {"train_loss": -9.233041763305664, "global_step": 396043, "epoch": 2357} {"train_loss": -10.333483695983887, "global_step": 396044, "epoch": 2357} {"train_loss": -11.394866943359375, "global_step": 396045, "epoch": 2357} {"train_loss": -9.61142635345459, "global_step": 396046, "epoch": 2357} {"train_loss": -9.599000930786133, "global_step": 396047, "epoch": 2357} {"train_loss": -9.793057441711426, "global_step": 396048, "epoch": 2357} {"train_loss": -10.881489753723145, "global_step": 396049, "epoch": 2357} {"train_loss": -10.40557861328125, "global_step": 396050, "epoch": 2357} {"train_loss": -9.77197265625, "global_step": 396051, "epoch": 2357} {"train_loss": -11.022638320922852, "global_step": 396052, "epoch": 2357} {"train_loss": -9.809868812561035, "global_step": 396053, "epoch": 2357} {"train_loss": -10.83122444152832, "global_step": 396054, "epoch": 2357} {"train_loss": -10.908807754516602, "global_step": 396055, "epoch": 2357} {"train_loss": -11.517965316772461, "global_step": 396056, "epoch": 2357} {"train_loss": -11.705718994140625, "global_step": 396057, "epoch": 2357} {"train_loss": -11.938420295715332, "global_step": 396058, "epoch": 2357} {"train_loss": -11.46603775024414, "global_step": 396059, "epoch": 2357} {"train_loss": -11.925107955932617, "global_step": 396060, "epoch": 2357} {"train_loss": -11.803632736206055, "global_step": 396061, "epoch": 2357} {"train_loss": -12.07870864868164, "global_step": 396062, "epoch": 2357} {"train_loss": -11.877552032470703, "global_step": 396063, "epoch": 2357} {"train_loss": -12.014114379882812, "global_step": 396064, "epoch": 2357} {"train_loss": -11.503689765930176, "global_step": 396065, "epoch": 2357} {"train_loss": -12.132844924926758, "global_step": 396066, "epoch": 2357} {"train_loss": -12.088373184204102, "global_step": 396067, "epoch": 2357} {"train_loss": -12.036941528320312, "global_step": 396068, "epoch": 2357} {"train_loss": -12.07725715637207, "global_step": 396069, "epoch": 2357} {"train_loss": -12.085172653198242, "global_step": 396070, "epoch": 2357} {"train_loss": -12.262308120727539, "global_step": 396071, "epoch": 2357} {"train_loss": -12.154475212097168, "global_step": 396072, "epoch": 2357} {"train_loss": -12.314347267150879, "global_step": 396073, "epoch": 2357} {"train_loss": -12.460830688476562, "global_step": 396074, "epoch": 2357} {"train_loss": -12.394344329833984, "global_step": 396075, "epoch": 2357} {"train_loss": -12.338865280151367, "global_step": 396076, "epoch": 2357} {"train_loss": -12.536449432373047, "global_step": 396077, "epoch": 2357} {"train_loss": -12.413753509521484, "global_step": 396078, "epoch": 2357} {"train_loss": -12.451082229614258, "global_step": 396079, "epoch": 2357} {"train_loss": -12.313636779785156, "global_step": 396080, "epoch": 2357} {"train_loss": -12.3627290725708, "global_step": 396081, "epoch": 2357} {"train_loss": -12.503325462341309, "global_step": 396082, "epoch": 2357} {"train_loss": -12.040361404418945, "global_step": 396083, "epoch": 2357} {"train_loss": -12.536384582519531, "global_step": 396084, "epoch": 2357} {"train_loss": -12.30772590637207, "global_step": 396085, "epoch": 2357} {"train_loss": -12.40596866607666, "global_step": 396086, "epoch": 2357} {"train_loss": -12.217971801757812, "global_step": 396087, "epoch": 2357} {"train_loss": -12.378680229187012, "global_step": 396088, "epoch": 2357} {"train_loss": -12.462409973144531, "global_step": 396089, "epoch": 2357} {"train_loss": -12.35892105102539, "global_step": 396090, "epoch": 2357} {"train_loss": -12.310043334960938, "global_step": 396091, "epoch": 2357} {"train_loss": -12.489822387695312, "global_step": 396092, "epoch": 2357} {"train_loss": -12.381239891052246, "global_step": 396093, "epoch": 2357} {"train_loss": -12.395731925964355, "global_step": 396094, "epoch": 2357} {"train_loss": -12.262993812561035, "global_step": 396095, "epoch": 2357} {"train_loss": -12.473878860473633, "global_step": 396096, "epoch": 2357} {"train_loss": -12.594487190246582, "global_step": 396097, "epoch": 2357} {"train_loss": -12.295827865600586, "global_step": 396098, "epoch": 2357} {"train_loss": -12.683412551879883, "global_step": 396099, "epoch": 2357} {"train_loss": -12.390205383300781, "global_step": 396100, "epoch": 2357} {"train_loss": -12.663595199584961, "global_step": 396101, "epoch": 2357} {"train_loss": -12.332489013671875, "global_step": 396102, "epoch": 2357} {"train_loss": -12.54736328125, "global_step": 396103, "epoch": 2357} {"train_loss": -12.385271072387695, "global_step": 396104, "epoch": 2357} {"train_loss": -12.515451431274414, "global_step": 396105, "epoch": 2357} {"train_loss": -12.72769832611084, "global_step": 396106, "epoch": 2357} {"train_loss": -12.432256698608398, "global_step": 396107, "epoch": 2357} {"train_loss": -12.63485336303711, "global_step": 396108, "epoch": 2357} {"train_loss": -12.6173095703125, "global_step": 396109, "epoch": 2357} {"train_loss": -12.477782249450684, "global_step": 396110, "epoch": 2357} {"train_loss": -12.748377799987793, "global_step": 396111, "epoch": 2357} {"train_loss": -12.528976440429688, "global_step": 396112, "epoch": 2357} {"train_loss": -12.491046905517578, "global_step": 396113, "epoch": 2357} {"train_loss": -12.617826461791992, "global_step": 396114, "epoch": 2357} {"train_loss": -12.798423767089844, "global_step": 396115, "epoch": 2357} {"train_loss": -12.543099403381348, "global_step": 396116, "epoch": 2357} {"train_loss": -12.457979202270508, "global_step": 396117, "epoch": 2357} {"train_loss": -12.68552017211914, "global_step": 396118, "epoch": 2357} {"train_loss": -12.64326286315918, "global_step": 396119, "epoch": 2357} {"train_loss": -12.733171463012695, "global_step": 396120, "epoch": 2357} {"train_loss": -12.332755088806152, "global_step": 396121, "epoch": 2357} {"train_loss": -12.591113090515137, "global_step": 396122, "epoch": 2357} {"train_loss": -12.414905548095703, "global_step": 396123, "epoch": 2357} {"train_loss": -12.413238525390625, "global_step": 396124, "epoch": 2357} {"train_loss": -12.61094856262207, "global_step": 396125, "epoch": 2357} {"train_loss": -12.22343635559082, "global_step": 396126, "epoch": 2357} {"train_loss": -11.875877380371094, "global_step": 396127, "epoch": 2357} {"train_loss": -12.0023193359375, "global_step": 396128, "epoch": 2357} {"train_loss": -11.859759330749512, "global_step": 396129, "epoch": 2357} {"train_loss": -11.70998477935791, "global_step": 396130, "epoch": 2357} {"train_loss": -11.819208145141602, "global_step": 396131, "epoch": 2357} {"train_loss": -11.55881118774414, "global_step": 396132, "epoch": 2357} {"train_loss": -12.117696762084961, "global_step": 396133, "epoch": 2357} {"train_loss": -12.058164596557617, "global_step": 396134, "epoch": 2357} {"train_loss": -11.282524108886719, "global_step": 396135, "epoch": 2357} {"train_loss": -12.664177894592285, "global_step": 396136, "epoch": 2357} {"train_loss": -11.631755828857422, "global_step": 396137, "epoch": 2357} {"train_loss": -11.246613502502441, "global_step": 396138, "epoch": 2357} {"train_loss": -11.875926971435547, "global_step": 396139, "epoch": 2357} {"train_loss": -11.890586853027344, "global_step": 396140, "epoch": 2357} {"train_loss": -12.907824516296387, "global_step": 396141, "epoch": 2357} {"train_loss": -12.18011474609375, "global_step": 396142, "epoch": 2357} {"train_loss": -11.979475055422101, "global_step": 396143, "epoch": 2357, "val_loss": 299027.625} {"train_loss": -12.074668884277344, "global_step": 396144, "epoch": 2358} {"train_loss": -12.495196342468262, "global_step": 396145, "epoch": 2358} {"train_loss": -12.221925735473633, "global_step": 396146, "epoch": 2358} {"train_loss": -12.686941146850586, "global_step": 396147, "epoch": 2358} {"train_loss": -12.547126770019531, "global_step": 396148, "epoch": 2358} {"train_loss": -12.466577529907227, "global_step": 396149, "epoch": 2358} {"train_loss": -12.500906944274902, "global_step": 396150, "epoch": 2358} {"train_loss": -12.650917053222656, "global_step": 396151, "epoch": 2358} {"train_loss": -12.25088119506836, "global_step": 396152, "epoch": 2358} {"train_loss": -12.095046043395996, "global_step": 396153, "epoch": 2358} {"train_loss": -12.516483306884766, "global_step": 396154, "epoch": 2358} {"train_loss": -11.964816093444824, "global_step": 396155, "epoch": 2358} {"train_loss": -12.459151268005371, "global_step": 396156, "epoch": 2358} {"train_loss": -12.458548545837402, "global_step": 396157, "epoch": 2358} {"train_loss": -12.660415649414062, "global_step": 396158, "epoch": 2358} {"train_loss": -12.329813957214355, "global_step": 396159, "epoch": 2358} {"train_loss": -12.880739212036133, "global_step": 396160, "epoch": 2358} {"train_loss": -12.517593383789062, "global_step": 396161, "epoch": 2358} {"train_loss": -12.290952682495117, "global_step": 396162, "epoch": 2358} {"train_loss": -12.57325553894043, "global_step": 396163, "epoch": 2358} {"train_loss": -11.997526168823242, "global_step": 396164, "epoch": 2358} {"train_loss": -11.987494468688965, "global_step": 396165, "epoch": 2358} {"train_loss": -12.393095016479492, "global_step": 396166, "epoch": 2358} {"train_loss": -12.631643295288086, "global_step": 396167, "epoch": 2358} {"train_loss": -12.05781364440918, "global_step": 396168, "epoch": 2358} {"train_loss": -12.193180084228516, "global_step": 396169, "epoch": 2358} {"train_loss": -12.43814468383789, "global_step": 396170, "epoch": 2358} {"train_loss": -11.668444633483887, "global_step": 396171, "epoch": 2358} {"train_loss": -11.681933403015137, "global_step": 396172, "epoch": 2358} {"train_loss": -11.432482719421387, "global_step": 396173, "epoch": 2358} {"train_loss": -11.746723175048828, "global_step": 396174, "epoch": 2358} {"train_loss": -12.383907318115234, "global_step": 396175, "epoch": 2358} {"train_loss": -12.400606155395508, "global_step": 396176, "epoch": 2358} {"train_loss": -11.888177871704102, "global_step": 396177, "epoch": 2358} {"train_loss": -12.178852081298828, "global_step": 396178, "epoch": 2358} {"train_loss": -11.806621551513672, "global_step": 396179, "epoch": 2358} {"train_loss": -11.738906860351562, "global_step": 396180, "epoch": 2358} {"train_loss": -12.21617317199707, "global_step": 396181, "epoch": 2358} {"train_loss": -11.797202110290527, "global_step": 396182, "epoch": 2358} {"train_loss": -11.753266334533691, "global_step": 396183, "epoch": 2358} {"train_loss": -12.511919975280762, "global_step": 396184, "epoch": 2358} {"train_loss": -12.117326736450195, "global_step": 396185, "epoch": 2358} {"train_loss": -11.653907775878906, "global_step": 396186, "epoch": 2358} {"train_loss": -11.968109130859375, "global_step": 396187, "epoch": 2358} {"train_loss": -12.448919296264648, "global_step": 396188, "epoch": 2358} {"train_loss": -11.88029670715332, "global_step": 396189, "epoch": 2358} {"train_loss": -11.906858444213867, "global_step": 396190, "epoch": 2358} {"train_loss": -12.313164710998535, "global_step": 396191, "epoch": 2358} {"train_loss": -12.376173973083496, "global_step": 396192, "epoch": 2358} {"train_loss": -12.14126968383789, "global_step": 396193, "epoch": 2358} {"train_loss": -12.284530639648438, "global_step": 396194, "epoch": 2358} {"train_loss": -11.891776084899902, "global_step": 396195, "epoch": 2358} {"train_loss": -12.413202285766602, "global_step": 396196, "epoch": 2358} {"train_loss": -12.342459678649902, "global_step": 396197, "epoch": 2358} {"train_loss": -12.11294937133789, "global_step": 396198, "epoch": 2358} {"train_loss": -12.521636962890625, "global_step": 396199, "epoch": 2358} {"train_loss": -12.307016372680664, "global_step": 396200, "epoch": 2358} {"train_loss": -12.420170783996582, "global_step": 396201, "epoch": 2358} {"train_loss": -12.377452850341797, "global_step": 396202, "epoch": 2358} {"train_loss": -12.641199111938477, "global_step": 396203, "epoch": 2358} {"train_loss": -12.259485244750977, "global_step": 396204, "epoch": 2358} {"train_loss": -12.442798614501953, "global_step": 396205, "epoch": 2358} {"train_loss": -12.46902847290039, "global_step": 396206, "epoch": 2358} {"train_loss": -12.551549911499023, "global_step": 396207, "epoch": 2358} {"train_loss": -12.239818572998047, "global_step": 396208, "epoch": 2358} {"train_loss": -11.761873245239258, "global_step": 396209, "epoch": 2358} {"train_loss": -12.22925090789795, "global_step": 396210, "epoch": 2358} {"train_loss": -12.127290725708008, "global_step": 396211, "epoch": 2358} {"train_loss": -12.772340774536133, "global_step": 396212, "epoch": 2358} {"train_loss": -12.215179443359375, "global_step": 396213, "epoch": 2358} {"train_loss": -12.666743278503418, "global_step": 396214, "epoch": 2358} {"train_loss": -12.283721923828125, "global_step": 396215, "epoch": 2358} {"train_loss": -12.71537971496582, "global_step": 396216, "epoch": 2358} {"train_loss": -12.412212371826172, "global_step": 396217, "epoch": 2358} {"train_loss": -12.74749755859375, "global_step": 396218, "epoch": 2358} {"train_loss": -12.507702827453613, "global_step": 396219, "epoch": 2358} {"train_loss": -12.444753646850586, "global_step": 396220, "epoch": 2358} {"train_loss": -12.155618667602539, "global_step": 396221, "epoch": 2358} {"train_loss": -12.122509002685547, "global_step": 396222, "epoch": 2358} {"train_loss": -12.202601432800293, "global_step": 396223, "epoch": 2358} {"train_loss": -12.349130630493164, "global_step": 396224, "epoch": 2358} {"train_loss": -12.200623512268066, "global_step": 396225, "epoch": 2358} {"train_loss": -11.880842208862305, "global_step": 396226, "epoch": 2358} {"train_loss": -12.16175651550293, "global_step": 396227, "epoch": 2358} {"train_loss": -10.287635803222656, "global_step": 396228, "epoch": 2358} {"train_loss": -11.818952560424805, "global_step": 396229, "epoch": 2358} {"train_loss": -11.352065086364746, "global_step": 396230, "epoch": 2358} {"train_loss": -11.460311889648438, "global_step": 396231, "epoch": 2358} {"train_loss": -11.67604923248291, "global_step": 396232, "epoch": 2358} {"train_loss": -11.425085067749023, "global_step": 396233, "epoch": 2358} {"train_loss": -12.290756225585938, "global_step": 396234, "epoch": 2358} {"train_loss": -10.90793228149414, "global_step": 396235, "epoch": 2358} {"train_loss": -11.77526569366455, "global_step": 396236, "epoch": 2358} {"train_loss": -11.731204986572266, "global_step": 396237, "epoch": 2358} {"train_loss": -11.30430793762207, "global_step": 396238, "epoch": 2358} {"train_loss": -9.716168403625488, "global_step": 396239, "epoch": 2358} {"train_loss": -11.97620677947998, "global_step": 396240, "epoch": 2358} {"train_loss": -11.741508483886719, "global_step": 396241, "epoch": 2358} {"train_loss": -11.132906913757324, "global_step": 396242, "epoch": 2358} {"train_loss": -11.141618728637695, "global_step": 396243, "epoch": 2358} {"train_loss": -11.679277420043945, "global_step": 396244, "epoch": 2358} {"train_loss": -11.296401977539062, "global_step": 396245, "epoch": 2358} {"train_loss": -11.552492141723633, "global_step": 396246, "epoch": 2358} {"train_loss": -11.679052352905273, "global_step": 396247, "epoch": 2358} {"train_loss": -11.864099502563477, "global_step": 396248, "epoch": 2358} {"train_loss": -10.23293685913086, "global_step": 396249, "epoch": 2358} {"train_loss": -11.41947078704834, "global_step": 396250, "epoch": 2358} {"train_loss": -8.766731262207031, "global_step": 396251, "epoch": 2358} {"train_loss": -8.070134162902832, "global_step": 396252, "epoch": 2358} {"train_loss": -8.143463134765625, "global_step": 396253, "epoch": 2358} {"train_loss": -8.987642288208008, "global_step": 396254, "epoch": 2358} {"train_loss": -10.026630401611328, "global_step": 396255, "epoch": 2358} {"train_loss": -9.035394668579102, "global_step": 396256, "epoch": 2358} {"train_loss": -9.083588600158691, "global_step": 396257, "epoch": 2358} {"train_loss": -8.366189956665039, "global_step": 396258, "epoch": 2358} {"train_loss": -9.823457717895508, "global_step": 396259, "epoch": 2358} {"train_loss": -9.888426780700684, "global_step": 396260, "epoch": 2358} {"train_loss": -9.917308807373047, "global_step": 396261, "epoch": 2358} {"train_loss": -9.0394287109375, "global_step": 396262, "epoch": 2358} {"train_loss": -10.582257270812988, "global_step": 396263, "epoch": 2358} {"train_loss": -11.304815292358398, "global_step": 396264, "epoch": 2358} {"train_loss": -10.429924011230469, "global_step": 396265, "epoch": 2358} {"train_loss": -11.093671798706055, "global_step": 396266, "epoch": 2358} {"train_loss": -10.51382064819336, "global_step": 396267, "epoch": 2358} {"train_loss": -11.344231605529785, "global_step": 396268, "epoch": 2358} {"train_loss": -11.25760555267334, "global_step": 396269, "epoch": 2358} {"train_loss": -11.601720809936523, "global_step": 396270, "epoch": 2358} {"train_loss": -11.464933395385742, "global_step": 396271, "epoch": 2358} {"train_loss": -11.831894874572754, "global_step": 396272, "epoch": 2358} {"train_loss": -11.18594741821289, "global_step": 396273, "epoch": 2358} {"train_loss": -11.78015422821045, "global_step": 396274, "epoch": 2358} {"train_loss": -11.42438793182373, "global_step": 396275, "epoch": 2358} {"train_loss": -11.599163055419922, "global_step": 396276, "epoch": 2358} {"train_loss": -12.083671569824219, "global_step": 396277, "epoch": 2358} {"train_loss": -11.177955627441406, "global_step": 396278, "epoch": 2358} {"train_loss": -11.988306045532227, "global_step": 396279, "epoch": 2358} {"train_loss": -11.758014678955078, "global_step": 396280, "epoch": 2358} {"train_loss": -11.672024726867676, "global_step": 396281, "epoch": 2358} {"train_loss": -11.45864200592041, "global_step": 396282, "epoch": 2358} {"train_loss": -11.368196487426758, "global_step": 396283, "epoch": 2358} {"train_loss": -11.51226806640625, "global_step": 396284, "epoch": 2358} {"train_loss": -11.690526008605957, "global_step": 396285, "epoch": 2358} {"train_loss": -11.31055736541748, "global_step": 396286, "epoch": 2358} {"train_loss": -11.49977970123291, "global_step": 396287, "epoch": 2358} {"train_loss": -11.516965866088867, "global_step": 396288, "epoch": 2358} {"train_loss": -11.426254272460938, "global_step": 396289, "epoch": 2358} {"train_loss": -12.068578720092773, "global_step": 396290, "epoch": 2358} {"train_loss": -11.606815338134766, "global_step": 396291, "epoch": 2358} {"train_loss": -11.58895492553711, "global_step": 396292, "epoch": 2358} {"train_loss": -12.038580894470215, "global_step": 396293, "epoch": 2358} {"train_loss": -11.939310073852539, "global_step": 396294, "epoch": 2358} {"train_loss": -12.235410690307617, "global_step": 396295, "epoch": 2358} {"train_loss": -11.976089477539062, "global_step": 396296, "epoch": 2358} {"train_loss": -12.07988166809082, "global_step": 396297, "epoch": 2358} {"train_loss": -12.097452163696289, "global_step": 396298, "epoch": 2358} {"train_loss": -12.009271621704102, "global_step": 396299, "epoch": 2358} {"train_loss": -12.075105667114258, "global_step": 396300, "epoch": 2358} {"train_loss": -12.095926284790039, "global_step": 396301, "epoch": 2358} {"train_loss": -12.079376220703125, "global_step": 396302, "epoch": 2358} {"train_loss": -11.985077857971191, "global_step": 396303, "epoch": 2358} {"train_loss": -12.256937026977539, "global_step": 396304, "epoch": 2358} {"train_loss": -12.038084030151367, "global_step": 396305, "epoch": 2358} {"train_loss": -12.00306510925293, "global_step": 396306, "epoch": 2358} {"train_loss": -12.082321166992188, "global_step": 396307, "epoch": 2358} {"train_loss": -12.203123092651367, "global_step": 396308, "epoch": 2358} {"train_loss": -12.2570219039917, "global_step": 396309, "epoch": 2358} {"train_loss": -12.301716804504395, "global_step": 396310, "epoch": 2358} {"train_loss": -11.746245179857526, "global_step": 396311, "epoch": 2358, "val_loss": 289649.625} {"train_loss": -12.343353271484375, "global_step": 396312, "epoch": 2359} {"train_loss": -12.235383987426758, "global_step": 396313, "epoch": 2359} {"train_loss": -12.325807571411133, "global_step": 396314, "epoch": 2359} {"train_loss": -12.420537948608398, "global_step": 396315, "epoch": 2359} {"train_loss": -12.406946182250977, "global_step": 396316, "epoch": 2359} {"train_loss": -12.453458786010742, "global_step": 396317, "epoch": 2359} {"train_loss": -12.237817764282227, "global_step": 396318, "epoch": 2359} {"train_loss": -12.464018821716309, "global_step": 396319, "epoch": 2359} {"train_loss": -12.25313949584961, "global_step": 396320, "epoch": 2359} {"train_loss": -12.420480728149414, "global_step": 396321, "epoch": 2359} {"train_loss": -12.246238708496094, "global_step": 396322, "epoch": 2359} {"train_loss": -12.32255744934082, "global_step": 396323, "epoch": 2359} {"train_loss": -12.155545234680176, "global_step": 396324, "epoch": 2359} {"train_loss": -12.396829605102539, "global_step": 396325, "epoch": 2359} {"train_loss": -12.459619522094727, "global_step": 396326, "epoch": 2359} {"train_loss": -12.430174827575684, "global_step": 396327, "epoch": 2359} {"train_loss": -12.492767333984375, "global_step": 396328, "epoch": 2359} {"train_loss": -12.266805648803711, "global_step": 396329, "epoch": 2359} {"train_loss": -12.61949634552002, "global_step": 396330, "epoch": 2359} {"train_loss": -12.469928741455078, "global_step": 396331, "epoch": 2359} {"train_loss": -12.456708908081055, "global_step": 396332, "epoch": 2359} {"train_loss": -12.284797668457031, "global_step": 396333, "epoch": 2359} {"train_loss": -12.201150894165039, "global_step": 396334, "epoch": 2359} {"train_loss": -12.330779075622559, "global_step": 396335, "epoch": 2359} {"train_loss": -12.586968421936035, "global_step": 396336, "epoch": 2359} {"train_loss": -12.295711517333984, "global_step": 396337, "epoch": 2359} {"train_loss": -12.457371711730957, "global_step": 396338, "epoch": 2359} {"train_loss": -12.588027954101562, "global_step": 396339, "epoch": 2359} {"train_loss": -12.381290435791016, "global_step": 396340, "epoch": 2359} {"train_loss": -12.834218978881836, "global_step": 396341, "epoch": 2359} {"train_loss": -12.419322967529297, "global_step": 396342, "epoch": 2359} {"train_loss": -12.39017105102539, "global_step": 396343, "epoch": 2359} {"train_loss": -12.3821439743042, "global_step": 396344, "epoch": 2359} {"train_loss": -12.402891159057617, "global_step": 396345, "epoch": 2359} {"train_loss": -12.41191577911377, "global_step": 396346, "epoch": 2359} {"train_loss": -12.306777954101562, "global_step": 396347, "epoch": 2359} {"train_loss": -12.41909122467041, "global_step": 396348, "epoch": 2359} {"train_loss": -12.587631225585938, "global_step": 396349, "epoch": 2359} {"train_loss": -12.60623550415039, "global_step": 396350, "epoch": 2359} {"train_loss": -12.402104377746582, "global_step": 396351, "epoch": 2359} {"train_loss": -12.645538330078125, "global_step": 396352, "epoch": 2359} {"train_loss": -12.541217803955078, "global_step": 396353, "epoch": 2359} {"train_loss": -12.78177261352539, "global_step": 396354, "epoch": 2359} {"train_loss": -12.578751564025879, "global_step": 396355, "epoch": 2359} {"train_loss": -12.891623497009277, "global_step": 396356, "epoch": 2359} {"train_loss": -12.422523498535156, "global_step": 396357, "epoch": 2359} {"train_loss": -12.726707458496094, "global_step": 396358, "epoch": 2359} {"train_loss": -12.557037353515625, "global_step": 396359, "epoch": 2359} {"train_loss": -12.617340087890625, "global_step": 396360, "epoch": 2359} {"train_loss": -12.55150032043457, "global_step": 396361, "epoch": 2359} {"train_loss": -12.615191459655762, "global_step": 396362, "epoch": 2359} {"train_loss": -12.480382919311523, "global_step": 396363, "epoch": 2359} {"train_loss": -12.241608619689941, "global_step": 396364, "epoch": 2359} {"train_loss": -11.911993026733398, "global_step": 396365, "epoch": 2359} {"train_loss": -12.28882884979248, "global_step": 396366, "epoch": 2359} {"train_loss": -12.527348518371582, "global_step": 396367, "epoch": 2359} {"train_loss": -12.222496032714844, "global_step": 396368, "epoch": 2359} {"train_loss": -12.519194602966309, "global_step": 396369, "epoch": 2359} {"train_loss": -12.378787994384766, "global_step": 396370, "epoch": 2359} {"train_loss": -12.39510440826416, "global_step": 396371, "epoch": 2359} {"train_loss": -10.746610641479492, "global_step": 396372, "epoch": 2359} {"train_loss": -10.817855834960938, "global_step": 396373, "epoch": 2359} {"train_loss": -11.656993865966797, "global_step": 396374, "epoch": 2359} {"train_loss": -11.888819694519043, "global_step": 396375, "epoch": 2359} {"train_loss": -10.755182266235352, "global_step": 396376, "epoch": 2359} {"train_loss": -11.666495323181152, "global_step": 396377, "epoch": 2359} {"train_loss": -11.73069953918457, "global_step": 396378, "epoch": 2359} {"train_loss": -9.867105484008789, "global_step": 396379, "epoch": 2359} {"train_loss": -11.733918190002441, "global_step": 396380, "epoch": 2359} {"train_loss": -11.168152809143066, "global_step": 396381, "epoch": 2359} {"train_loss": -9.631576538085938, "global_step": 396382, "epoch": 2359} {"train_loss": -9.269477844238281, "global_step": 396383, "epoch": 2359} {"train_loss": -9.41478443145752, "global_step": 396384, "epoch": 2359} {"train_loss": -9.752835273742676, "global_step": 396385, "epoch": 2359} {"train_loss": -10.138199806213379, "global_step": 396386, "epoch": 2359} {"train_loss": -9.530941009521484, "global_step": 396387, "epoch": 2359} {"train_loss": -10.938121795654297, "global_step": 396388, "epoch": 2359} {"train_loss": -9.957189559936523, "global_step": 396389, "epoch": 2359} {"train_loss": -10.921545028686523, "global_step": 396390, "epoch": 2359} {"train_loss": -10.00143051147461, "global_step": 396391, "epoch": 2359} {"train_loss": -11.37442398071289, "global_step": 396392, "epoch": 2359} {"train_loss": -9.94239330291748, "global_step": 396393, "epoch": 2359} {"train_loss": -11.54339599609375, "global_step": 396394, "epoch": 2359} {"train_loss": -10.919461250305176, "global_step": 396395, "epoch": 2359} {"train_loss": -11.664785385131836, "global_step": 396396, "epoch": 2359} {"train_loss": -11.036834716796875, "global_step": 396397, "epoch": 2359} {"train_loss": -11.057650566101074, "global_step": 396398, "epoch": 2359} {"train_loss": -11.656850814819336, "global_step": 396399, "epoch": 2359} {"train_loss": -11.492140769958496, "global_step": 396400, "epoch": 2359} {"train_loss": -12.08459186553955, "global_step": 396401, "epoch": 2359} {"train_loss": -11.544090270996094, "global_step": 396402, "epoch": 2359} {"train_loss": -12.242530822753906, "global_step": 396403, "epoch": 2359} {"train_loss": -11.562545776367188, "global_step": 396404, "epoch": 2359} {"train_loss": -11.610380172729492, "global_step": 396405, "epoch": 2359} {"train_loss": -11.662784576416016, "global_step": 396406, "epoch": 2359} {"train_loss": -11.851043701171875, "global_step": 396407, "epoch": 2359} {"train_loss": -12.290313720703125, "global_step": 396408, "epoch": 2359} {"train_loss": -11.91950511932373, "global_step": 396409, "epoch": 2359} {"train_loss": -11.852200508117676, "global_step": 396410, "epoch": 2359} {"train_loss": -11.919673919677734, "global_step": 396411, "epoch": 2359} {"train_loss": -12.120058059692383, "global_step": 396412, "epoch": 2359} {"train_loss": -12.069053649902344, "global_step": 396413, "epoch": 2359} {"train_loss": -12.16895866394043, "global_step": 396414, "epoch": 2359} {"train_loss": -12.069480895996094, "global_step": 396415, "epoch": 2359} {"train_loss": -12.055715560913086, "global_step": 396416, "epoch": 2359} {"train_loss": -11.889745712280273, "global_step": 396417, "epoch": 2359} {"train_loss": -12.212876319885254, "global_step": 396418, "epoch": 2359} {"train_loss": -11.704435348510742, "global_step": 396419, "epoch": 2359} {"train_loss": -12.236595153808594, "global_step": 396420, "epoch": 2359} {"train_loss": -11.64175796508789, "global_step": 396421, "epoch": 2359} {"train_loss": -11.913676261901855, "global_step": 396422, "epoch": 2359} {"train_loss": -11.996515274047852, "global_step": 396423, "epoch": 2359} {"train_loss": -12.067142486572266, "global_step": 396424, "epoch": 2359} {"train_loss": -12.024419784545898, "global_step": 396425, "epoch": 2359} {"train_loss": -12.1163911819458, "global_step": 396426, "epoch": 2359} {"train_loss": -11.937417030334473, "global_step": 396427, "epoch": 2359} {"train_loss": -11.713226318359375, "global_step": 396428, "epoch": 2359} {"train_loss": -12.298617362976074, "global_step": 396429, "epoch": 2359} {"train_loss": -12.19615364074707, "global_step": 396430, "epoch": 2359} {"train_loss": -12.253567695617676, "global_step": 396431, "epoch": 2359} {"train_loss": -12.201200485229492, "global_step": 396432, "epoch": 2359} {"train_loss": -12.312823295593262, "global_step": 396433, "epoch": 2359} {"train_loss": -12.278217315673828, "global_step": 396434, "epoch": 2359} {"train_loss": -12.126352310180664, "global_step": 396435, "epoch": 2359} {"train_loss": -11.722406387329102, "global_step": 396436, "epoch": 2359} {"train_loss": -12.061115264892578, "global_step": 396437, "epoch": 2359} {"train_loss": -11.331158638000488, "global_step": 396438, "epoch": 2359} {"train_loss": -12.342050552368164, "global_step": 396439, "epoch": 2359} {"train_loss": -11.750663757324219, "global_step": 396440, "epoch": 2359} {"train_loss": -12.48353099822998, "global_step": 396441, "epoch": 2359} {"train_loss": -12.114070892333984, "global_step": 396442, "epoch": 2359} {"train_loss": -12.660673141479492, "global_step": 396443, "epoch": 2359} {"train_loss": -12.349142074584961, "global_step": 396444, "epoch": 2359} {"train_loss": -12.334683418273926, "global_step": 396445, "epoch": 2359} {"train_loss": -12.532480239868164, "global_step": 396446, "epoch": 2359} {"train_loss": -12.372783660888672, "global_step": 396447, "epoch": 2359} {"train_loss": -12.36686897277832, "global_step": 396448, "epoch": 2359} {"train_loss": -12.272750854492188, "global_step": 396449, "epoch": 2359} {"train_loss": -12.604124069213867, "global_step": 396450, "epoch": 2359} {"train_loss": -12.265625953674316, "global_step": 396451, "epoch": 2359} {"train_loss": -12.357275009155273, "global_step": 396452, "epoch": 2359} {"train_loss": -12.43559455871582, "global_step": 396453, "epoch": 2359} {"train_loss": -12.117441177368164, "global_step": 396454, "epoch": 2359} {"train_loss": -12.320112228393555, "global_step": 396455, "epoch": 2359} {"train_loss": -12.225470542907715, "global_step": 396456, "epoch": 2359} {"train_loss": -12.005887985229492, "global_step": 396457, "epoch": 2359} {"train_loss": -12.302380561828613, "global_step": 396458, "epoch": 2359} {"train_loss": -12.120262145996094, "global_step": 396459, "epoch": 2359} {"train_loss": -12.398822784423828, "global_step": 396460, "epoch": 2359} {"train_loss": -12.281604766845703, "global_step": 396461, "epoch": 2359} {"train_loss": -12.046161651611328, "global_step": 396462, "epoch": 2359} {"train_loss": -11.89561939239502, "global_step": 396463, "epoch": 2359} {"train_loss": -12.54914665222168, "global_step": 396464, "epoch": 2359} {"train_loss": -11.74498176574707, "global_step": 396465, "epoch": 2359} {"train_loss": -11.672243118286133, "global_step": 396466, "epoch": 2359} {"train_loss": -12.34691333770752, "global_step": 396467, "epoch": 2359} {"train_loss": -11.555070877075195, "global_step": 396468, "epoch": 2359} {"train_loss": -11.312894821166992, "global_step": 396469, "epoch": 2359} {"train_loss": -12.228055953979492, "global_step": 396470, "epoch": 2359} {"train_loss": -11.49783706665039, "global_step": 396471, "epoch": 2359} {"train_loss": -11.886711120605469, "global_step": 396472, "epoch": 2359} {"train_loss": -12.352341651916504, "global_step": 396473, "epoch": 2359} {"train_loss": -12.430584907531738, "global_step": 396474, "epoch": 2359} {"train_loss": -12.190752983093262, "global_step": 396475, "epoch": 2359} {"train_loss": -12.247980117797852, "global_step": 396476, "epoch": 2359} {"train_loss": -11.74647331237793, "global_step": 396477, "epoch": 2359} {"train_loss": -12.366060256958008, "global_step": 396478, "epoch": 2359} {"train_loss": -11.979022434779576, "global_step": 396479, "epoch": 2359, "val_loss": 290241.3125} {"train_loss": -12.05534553527832, "global_step": 396480, "epoch": 2360} {"train_loss": -11.821512222290039, "global_step": 396481, "epoch": 2360} {"train_loss": -12.233806610107422, "global_step": 396482, "epoch": 2360} {"train_loss": -11.901514053344727, "global_step": 396483, "epoch": 2360} {"train_loss": -11.987764358520508, "global_step": 396484, "epoch": 2360} {"train_loss": -12.177594184875488, "global_step": 396485, "epoch": 2360} {"train_loss": -11.644412994384766, "global_step": 396486, "epoch": 2360} {"train_loss": -11.33852767944336, "global_step": 396487, "epoch": 2360} {"train_loss": -12.539360046386719, "global_step": 396488, "epoch": 2360} {"train_loss": -11.166851043701172, "global_step": 396489, "epoch": 2360} {"train_loss": -10.927152633666992, "global_step": 396490, "epoch": 2360} {"train_loss": -12.472213745117188, "global_step": 396491, "epoch": 2360} {"train_loss": -11.647727966308594, "global_step": 396492, "epoch": 2360} {"train_loss": -11.985505104064941, "global_step": 396493, "epoch": 2360} {"train_loss": -11.748662948608398, "global_step": 396494, "epoch": 2360} {"train_loss": -11.349441528320312, "global_step": 396495, "epoch": 2360} {"train_loss": -11.025449752807617, "global_step": 396496, "epoch": 2360} {"train_loss": -9.777688980102539, "global_step": 396497, "epoch": 2360} {"train_loss": -10.511171340942383, "global_step": 396498, "epoch": 2360} {"train_loss": -11.382346153259277, "global_step": 396499, "epoch": 2360} {"train_loss": -10.384110450744629, "global_step": 396500, "epoch": 2360} {"train_loss": -10.263626098632812, "global_step": 396501, "epoch": 2360} {"train_loss": -11.45016860961914, "global_step": 396502, "epoch": 2360} {"train_loss": -10.766561508178711, "global_step": 396503, "epoch": 2360} {"train_loss": -12.097089767456055, "global_step": 396504, "epoch": 2360} {"train_loss": -11.078471183776855, "global_step": 396505, "epoch": 2360} {"train_loss": -10.957221984863281, "global_step": 396506, "epoch": 2360} {"train_loss": -11.673080444335938, "global_step": 396507, "epoch": 2360} {"train_loss": -10.38161849975586, "global_step": 396508, "epoch": 2360} {"train_loss": -11.406917572021484, "global_step": 396509, "epoch": 2360} {"train_loss": -10.928701400756836, "global_step": 396510, "epoch": 2360} {"train_loss": -11.087224960327148, "global_step": 396511, "epoch": 2360} {"train_loss": -11.684000015258789, "global_step": 396512, "epoch": 2360} {"train_loss": -12.011629104614258, "global_step": 396513, "epoch": 2360} {"train_loss": -11.277017593383789, "global_step": 396514, "epoch": 2360} {"train_loss": -11.234954833984375, "global_step": 396515, "epoch": 2360} {"train_loss": -11.478409767150879, "global_step": 396516, "epoch": 2360} {"train_loss": -11.769416809082031, "global_step": 396517, "epoch": 2360} {"train_loss": -11.739218711853027, "global_step": 396518, "epoch": 2360} {"train_loss": -11.889313697814941, "global_step": 396519, "epoch": 2360} {"train_loss": -11.843896865844727, "global_step": 396520, "epoch": 2360} {"train_loss": -11.947001457214355, "global_step": 396521, "epoch": 2360} {"train_loss": -12.021390914916992, "global_step": 396522, "epoch": 2360} {"train_loss": -12.068461418151855, "global_step": 396523, "epoch": 2360} {"train_loss": -11.591142654418945, "global_step": 396524, "epoch": 2360} {"train_loss": -11.95872688293457, "global_step": 396525, "epoch": 2360} {"train_loss": -11.785467147827148, "global_step": 396526, "epoch": 2360} {"train_loss": -12.002903938293457, "global_step": 396527, "epoch": 2360} {"train_loss": -11.504049301147461, "global_step": 396528, "epoch": 2360} {"train_loss": -12.20669174194336, "global_step": 396529, "epoch": 2360} {"train_loss": -12.015959739685059, "global_step": 396530, "epoch": 2360} {"train_loss": -11.68093490600586, "global_step": 396531, "epoch": 2360} {"train_loss": -11.980405807495117, "global_step": 396532, "epoch": 2360} {"train_loss": -12.165970802307129, "global_step": 396533, "epoch": 2360} {"train_loss": -11.506031036376953, "global_step": 396534, "epoch": 2360} {"train_loss": -11.956550598144531, "global_step": 396535, "epoch": 2360} {"train_loss": -11.784509658813477, "global_step": 396536, "epoch": 2360} {"train_loss": -11.876764297485352, "global_step": 396537, "epoch": 2360} {"train_loss": -11.850040435791016, "global_step": 396538, "epoch": 2360} {"train_loss": -11.629242897033691, "global_step": 396539, "epoch": 2360} {"train_loss": -11.559253692626953, "global_step": 396540, "epoch": 2360} {"train_loss": -12.06867790222168, "global_step": 396541, "epoch": 2360} {"train_loss": -11.44648551940918, "global_step": 396542, "epoch": 2360} {"train_loss": -11.968875885009766, "global_step": 396543, "epoch": 2360} {"train_loss": -12.244338035583496, "global_step": 396544, "epoch": 2360} {"train_loss": -11.282029151916504, "global_step": 396545, "epoch": 2360} {"train_loss": -12.051769256591797, "global_step": 396546, "epoch": 2360} {"train_loss": -11.014132499694824, "global_step": 396547, "epoch": 2360} {"train_loss": -11.766698837280273, "global_step": 396548, "epoch": 2360} {"train_loss": -11.636591911315918, "global_step": 396549, "epoch": 2360} {"train_loss": -10.430892944335938, "global_step": 396550, "epoch": 2360} {"train_loss": -12.025352478027344, "global_step": 396551, "epoch": 2360} {"train_loss": -11.193944931030273, "global_step": 396552, "epoch": 2360} {"train_loss": -11.355283737182617, "global_step": 396553, "epoch": 2360} {"train_loss": -11.418891906738281, "global_step": 396554, "epoch": 2360} {"train_loss": -11.127796173095703, "global_step": 396555, "epoch": 2360} {"train_loss": -11.683523178100586, "global_step": 396556, "epoch": 2360} {"train_loss": -11.614486694335938, "global_step": 396557, "epoch": 2360} {"train_loss": -11.494996070861816, "global_step": 396558, "epoch": 2360} {"train_loss": -11.478108406066895, "global_step": 396559, "epoch": 2360} {"train_loss": -11.516826629638672, "global_step": 396560, "epoch": 2360} {"train_loss": -11.425201416015625, "global_step": 396561, "epoch": 2360} {"train_loss": -11.203585624694824, "global_step": 396562, "epoch": 2360} {"train_loss": -11.872102737426758, "global_step": 396563, "epoch": 2360} {"train_loss": -10.98246955871582, "global_step": 396564, "epoch": 2360} {"train_loss": -11.713827133178711, "global_step": 396565, "epoch": 2360} {"train_loss": -11.810115814208984, "global_step": 396566, "epoch": 2360} {"train_loss": -10.862101554870605, "global_step": 396567, "epoch": 2360} {"train_loss": -12.457182884216309, "global_step": 396568, "epoch": 2360} {"train_loss": -11.311534881591797, "global_step": 396569, "epoch": 2360} {"train_loss": -11.482553482055664, "global_step": 396570, "epoch": 2360} {"train_loss": -12.248109817504883, "global_step": 396571, "epoch": 2360} {"train_loss": -11.287971496582031, "global_step": 396572, "epoch": 2360} {"train_loss": -11.554269790649414, "global_step": 396573, "epoch": 2360} {"train_loss": -11.866100311279297, "global_step": 396574, "epoch": 2360} {"train_loss": -11.714725494384766, "global_step": 396575, "epoch": 2360} {"train_loss": -12.090396881103516, "global_step": 396576, "epoch": 2360} {"train_loss": -11.718632698059082, "global_step": 396577, "epoch": 2360} {"train_loss": -11.987173080444336, "global_step": 396578, "epoch": 2360} {"train_loss": -11.657304763793945, "global_step": 396579, "epoch": 2360} {"train_loss": -11.961465835571289, "global_step": 396580, "epoch": 2360} {"train_loss": -11.757840156555176, "global_step": 396581, "epoch": 2360} {"train_loss": -11.244879722595215, "global_step": 396582, "epoch": 2360} {"train_loss": -11.717784881591797, "global_step": 396583, "epoch": 2360} {"train_loss": -11.14522933959961, "global_step": 396584, "epoch": 2360} {"train_loss": -11.91175651550293, "global_step": 396585, "epoch": 2360} {"train_loss": -11.856858253479004, "global_step": 396586, "epoch": 2360} {"train_loss": -11.500626564025879, "global_step": 396587, "epoch": 2360} {"train_loss": -11.537640571594238, "global_step": 396588, "epoch": 2360} {"train_loss": -11.586213111877441, "global_step": 396589, "epoch": 2360} {"train_loss": -11.11075210571289, "global_step": 396590, "epoch": 2360} {"train_loss": -11.63095474243164, "global_step": 396591, "epoch": 2360} {"train_loss": -11.208793640136719, "global_step": 396592, "epoch": 2360} {"train_loss": -11.610443115234375, "global_step": 396593, "epoch": 2360} {"train_loss": -12.078856468200684, "global_step": 396594, "epoch": 2360} {"train_loss": -11.176136016845703, "global_step": 396595, "epoch": 2360} {"train_loss": -12.069519996643066, "global_step": 396596, "epoch": 2360} {"train_loss": -11.461771011352539, "global_step": 396597, "epoch": 2360} {"train_loss": -11.978135108947754, "global_step": 396598, "epoch": 2360} {"train_loss": -11.766763687133789, "global_step": 396599, "epoch": 2360} {"train_loss": -11.892675399780273, "global_step": 396600, "epoch": 2360} {"train_loss": -12.263021469116211, "global_step": 396601, "epoch": 2360} {"train_loss": -11.79932975769043, "global_step": 396602, "epoch": 2360} {"train_loss": -12.36893367767334, "global_step": 396603, "epoch": 2360} {"train_loss": -11.613161087036133, "global_step": 396604, "epoch": 2360} {"train_loss": -12.099916458129883, "global_step": 396605, "epoch": 2360} {"train_loss": -12.184224128723145, "global_step": 396606, "epoch": 2360} {"train_loss": -11.920342445373535, "global_step": 396607, "epoch": 2360} {"train_loss": -12.206238746643066, "global_step": 396608, "epoch": 2360} {"train_loss": -12.153225898742676, "global_step": 396609, "epoch": 2360} {"train_loss": -12.042320251464844, "global_step": 396610, "epoch": 2360} {"train_loss": -12.15866470336914, "global_step": 396611, "epoch": 2360} {"train_loss": -12.17759895324707, "global_step": 396612, "epoch": 2360} {"train_loss": -12.009844779968262, "global_step": 396613, "epoch": 2360} {"train_loss": -12.239716529846191, "global_step": 396614, "epoch": 2360} {"train_loss": -12.36549186706543, "global_step": 396615, "epoch": 2360} {"train_loss": -12.169949531555176, "global_step": 396616, "epoch": 2360} {"train_loss": -12.432785034179688, "global_step": 396617, "epoch": 2360} {"train_loss": -12.403518676757812, "global_step": 396618, "epoch": 2360} {"train_loss": -12.347320556640625, "global_step": 396619, "epoch": 2360} {"train_loss": -12.257087707519531, "global_step": 396620, "epoch": 2360} {"train_loss": -12.26092529296875, "global_step": 396621, "epoch": 2360} {"train_loss": -12.2759370803833, "global_step": 396622, "epoch": 2360} {"train_loss": -12.271615028381348, "global_step": 396623, "epoch": 2360} {"train_loss": -12.479114532470703, "global_step": 396624, "epoch": 2360} {"train_loss": -12.436262130737305, "global_step": 396625, "epoch": 2360} {"train_loss": -12.269001007080078, "global_step": 396626, "epoch": 2360} {"train_loss": -12.384450912475586, "global_step": 396627, "epoch": 2360} {"train_loss": -12.203438758850098, "global_step": 396628, "epoch": 2360} {"train_loss": -12.509735107421875, "global_step": 396629, "epoch": 2360} {"train_loss": -12.008014678955078, "global_step": 396630, "epoch": 2360} {"train_loss": -12.139230728149414, "global_step": 396631, "epoch": 2360} {"train_loss": -12.611708641052246, "global_step": 396632, "epoch": 2360} {"train_loss": -11.64626693725586, "global_step": 396633, "epoch": 2360} {"train_loss": -12.479316711425781, "global_step": 396634, "epoch": 2360} {"train_loss": -12.139209747314453, "global_step": 396635, "epoch": 2360} {"train_loss": -12.679313659667969, "global_step": 396636, "epoch": 2360} {"train_loss": -12.300203323364258, "global_step": 396637, "epoch": 2360} {"train_loss": -12.14024543762207, "global_step": 396638, "epoch": 2360} {"train_loss": -12.482048034667969, "global_step": 396639, "epoch": 2360} {"train_loss": -11.97201919555664, "global_step": 396640, "epoch": 2360} {"train_loss": -12.281536102294922, "global_step": 396641, "epoch": 2360} {"train_loss": -12.111382484436035, "global_step": 396642, "epoch": 2360} {"train_loss": -12.651850700378418, "global_step": 396643, "epoch": 2360} {"train_loss": -12.187862396240234, "global_step": 396644, "epoch": 2360} {"train_loss": -12.237569808959961, "global_step": 396645, "epoch": 2360} {"train_loss": -12.390713691711426, "global_step": 396646, "epoch": 2360} {"train_loss": -11.77075910000574, "global_step": 396647, "epoch": 2360, "val_loss": 291461.53125, "train_action_mse_error": 0.12398657202720642} {"train_loss": -12.260319709777832, "global_step": 396648, "epoch": 2361} {"train_loss": -12.142505645751953, "global_step": 396649, "epoch": 2361} {"train_loss": -12.252070426940918, "global_step": 396650, "epoch": 2361} {"train_loss": -11.833229064941406, "global_step": 396651, "epoch": 2361} {"train_loss": -12.012163162231445, "global_step": 396652, "epoch": 2361} {"train_loss": -11.556329727172852, "global_step": 396653, "epoch": 2361} {"train_loss": -11.900003433227539, "global_step": 396654, "epoch": 2361} {"train_loss": -11.633134841918945, "global_step": 396655, "epoch": 2361} {"train_loss": -11.266071319580078, "global_step": 396656, "epoch": 2361} {"train_loss": -11.977402687072754, "global_step": 396657, "epoch": 2361} {"train_loss": -11.13983154296875, "global_step": 396658, "epoch": 2361} {"train_loss": -11.497904777526855, "global_step": 396659, "epoch": 2361} {"train_loss": -10.514764785766602, "global_step": 396660, "epoch": 2361} {"train_loss": -11.796594619750977, "global_step": 396661, "epoch": 2361} {"train_loss": -10.52206802368164, "global_step": 396662, "epoch": 2361} {"train_loss": -11.84857177734375, "global_step": 396663, "epoch": 2361} {"train_loss": -9.99527359008789, "global_step": 396664, "epoch": 2361} {"train_loss": -10.598831176757812, "global_step": 396665, "epoch": 2361} {"train_loss": -11.958166122436523, "global_step": 396666, "epoch": 2361} {"train_loss": -10.530401229858398, "global_step": 396667, "epoch": 2361} {"train_loss": -11.806312561035156, "global_step": 396668, "epoch": 2361} {"train_loss": -11.98457145690918, "global_step": 396669, "epoch": 2361} {"train_loss": -12.086886405944824, "global_step": 396670, "epoch": 2361} {"train_loss": -11.547077178955078, "global_step": 396671, "epoch": 2361} {"train_loss": -11.936267852783203, "global_step": 396672, "epoch": 2361} {"train_loss": -12.187232971191406, "global_step": 396673, "epoch": 2361} {"train_loss": -12.235177993774414, "global_step": 396674, "epoch": 2361} {"train_loss": -12.610859870910645, "global_step": 396675, "epoch": 2361} {"train_loss": -11.668149948120117, "global_step": 396676, "epoch": 2361} {"train_loss": -12.10804271697998, "global_step": 396677, "epoch": 2361} {"train_loss": -12.14184284210205, "global_step": 396678, "epoch": 2361} {"train_loss": -11.932918548583984, "global_step": 396679, "epoch": 2361} {"train_loss": -12.46554946899414, "global_step": 396680, "epoch": 2361} {"train_loss": -11.989152908325195, "global_step": 396681, "epoch": 2361} {"train_loss": -12.258322715759277, "global_step": 396682, "epoch": 2361} {"train_loss": -12.096338272094727, "global_step": 396683, "epoch": 2361} {"train_loss": -12.52089786529541, "global_step": 396684, "epoch": 2361} {"train_loss": -12.131668090820312, "global_step": 396685, "epoch": 2361} {"train_loss": -12.53872299194336, "global_step": 396686, "epoch": 2361} {"train_loss": -12.242583274841309, "global_step": 396687, "epoch": 2361} {"train_loss": -12.41270637512207, "global_step": 396688, "epoch": 2361} {"train_loss": -12.226736068725586, "global_step": 396689, "epoch": 2361} {"train_loss": -12.221914291381836, "global_step": 396690, "epoch": 2361} {"train_loss": -12.22964859008789, "global_step": 396691, "epoch": 2361} {"train_loss": -12.146438598632812, "global_step": 396692, "epoch": 2361} {"train_loss": -12.295991897583008, "global_step": 396693, "epoch": 2361} {"train_loss": -12.13038444519043, "global_step": 396694, "epoch": 2361} {"train_loss": -12.26041030883789, "global_step": 396695, "epoch": 2361} {"train_loss": -12.133102416992188, "global_step": 396696, "epoch": 2361} {"train_loss": -12.510163307189941, "global_step": 396697, "epoch": 2361} {"train_loss": -12.370475769042969, "global_step": 396698, "epoch": 2361} {"train_loss": -12.3803071975708, "global_step": 396699, "epoch": 2361} {"train_loss": -12.08336353302002, "global_step": 396700, "epoch": 2361} {"train_loss": -12.530223846435547, "global_step": 396701, "epoch": 2361} {"train_loss": -12.388959884643555, "global_step": 396702, "epoch": 2361} {"train_loss": -12.421260833740234, "global_step": 396703, "epoch": 2361} {"train_loss": -12.373095512390137, "global_step": 396704, "epoch": 2361} {"train_loss": -12.401308059692383, "global_step": 396705, "epoch": 2361} {"train_loss": -12.049481391906738, "global_step": 396706, "epoch": 2361} {"train_loss": -11.536734580993652, "global_step": 396707, "epoch": 2361} {"train_loss": -12.293368339538574, "global_step": 396708, "epoch": 2361} {"train_loss": -12.005008697509766, "global_step": 396709, "epoch": 2361} {"train_loss": -12.212096214294434, "global_step": 396710, "epoch": 2361} {"train_loss": -11.709156036376953, "global_step": 396711, "epoch": 2361} {"train_loss": -12.256951332092285, "global_step": 396712, "epoch": 2361} {"train_loss": -11.938085556030273, "global_step": 396713, "epoch": 2361} {"train_loss": -12.103883743286133, "global_step": 396714, "epoch": 2361} {"train_loss": -12.466451644897461, "global_step": 396715, "epoch": 2361} {"train_loss": -11.481878280639648, "global_step": 396716, "epoch": 2361} {"train_loss": -11.96094036102295, "global_step": 396717, "epoch": 2361} {"train_loss": -12.118436813354492, "global_step": 396718, "epoch": 2361} {"train_loss": -12.227222442626953, "global_step": 396719, "epoch": 2361} {"train_loss": -10.825923919677734, "global_step": 396720, "epoch": 2361} {"train_loss": -11.79653263092041, "global_step": 396721, "epoch": 2361} {"train_loss": -12.359613418579102, "global_step": 396722, "epoch": 2361} {"train_loss": -10.003152847290039, "global_step": 396723, "epoch": 2361} {"train_loss": -11.165956497192383, "global_step": 396724, "epoch": 2361} {"train_loss": -11.862215042114258, "global_step": 396725, "epoch": 2361} {"train_loss": -10.457998275756836, "global_step": 396726, "epoch": 2361} {"train_loss": -10.337665557861328, "global_step": 396727, "epoch": 2361} {"train_loss": -11.914487838745117, "global_step": 396728, "epoch": 2361} {"train_loss": -11.152345657348633, "global_step": 396729, "epoch": 2361} {"train_loss": -10.025151252746582, "global_step": 396730, "epoch": 2361} {"train_loss": -10.890275955200195, "global_step": 396731, "epoch": 2361} {"train_loss": -10.855667114257812, "global_step": 396732, "epoch": 2361} {"train_loss": -10.824507713317871, "global_step": 396733, "epoch": 2361} {"train_loss": -10.557676315307617, "global_step": 396734, "epoch": 2361} {"train_loss": -11.074831008911133, "global_step": 396735, "epoch": 2361} {"train_loss": -11.690966606140137, "global_step": 396736, "epoch": 2361} {"train_loss": -11.354286193847656, "global_step": 396737, "epoch": 2361} {"train_loss": -11.796417236328125, "global_step": 396738, "epoch": 2361} {"train_loss": -11.33832836151123, "global_step": 396739, "epoch": 2361} {"train_loss": -11.856428146362305, "global_step": 396740, "epoch": 2361} {"train_loss": -11.71362590789795, "global_step": 396741, "epoch": 2361} {"train_loss": -12.02029037475586, "global_step": 396742, "epoch": 2361} {"train_loss": -12.252974510192871, "global_step": 396743, "epoch": 2361} {"train_loss": -12.04871654510498, "global_step": 396744, "epoch": 2361} {"train_loss": -12.02424430847168, "global_step": 396745, "epoch": 2361} {"train_loss": -12.0601806640625, "global_step": 396746, "epoch": 2361} {"train_loss": -12.493931770324707, "global_step": 396747, "epoch": 2361} {"train_loss": -12.440545082092285, "global_step": 396748, "epoch": 2361} {"train_loss": -12.22836685180664, "global_step": 396749, "epoch": 2361} {"train_loss": -12.265388488769531, "global_step": 396750, "epoch": 2361} {"train_loss": -12.048466682434082, "global_step": 396751, "epoch": 2361} {"train_loss": -12.049907684326172, "global_step": 396752, "epoch": 2361} {"train_loss": -12.342108726501465, "global_step": 396753, "epoch": 2361} {"train_loss": -12.237062454223633, "global_step": 396754, "epoch": 2361} {"train_loss": -12.334186553955078, "global_step": 396755, "epoch": 2361} {"train_loss": -12.178221702575684, "global_step": 396756, "epoch": 2361} {"train_loss": -12.133219718933105, "global_step": 396757, "epoch": 2361} {"train_loss": -12.216700553894043, "global_step": 396758, "epoch": 2361} {"train_loss": -12.416847229003906, "global_step": 396759, "epoch": 2361} {"train_loss": -12.132450103759766, "global_step": 396760, "epoch": 2361} {"train_loss": -12.13943099975586, "global_step": 396761, "epoch": 2361} {"train_loss": -12.307939529418945, "global_step": 396762, "epoch": 2361} {"train_loss": -11.986651420593262, "global_step": 396763, "epoch": 2361} {"train_loss": -12.234513282775879, "global_step": 396764, "epoch": 2361} {"train_loss": -12.370315551757812, "global_step": 396765, "epoch": 2361} {"train_loss": -12.29348373413086, "global_step": 396766, "epoch": 2361} {"train_loss": -12.507867813110352, "global_step": 396767, "epoch": 2361} {"train_loss": -12.06235122680664, "global_step": 396768, "epoch": 2361} {"train_loss": -12.206953048706055, "global_step": 396769, "epoch": 2361} {"train_loss": -12.351886749267578, "global_step": 396770, "epoch": 2361} {"train_loss": -12.136002540588379, "global_step": 396771, "epoch": 2361} {"train_loss": -12.14321517944336, "global_step": 396772, "epoch": 2361} {"train_loss": -12.059138298034668, "global_step": 396773, "epoch": 2361} {"train_loss": -12.214248657226562, "global_step": 396774, "epoch": 2361} {"train_loss": -12.255899429321289, "global_step": 396775, "epoch": 2361} {"train_loss": -12.065534591674805, "global_step": 396776, "epoch": 2361} {"train_loss": -12.340737342834473, "global_step": 396777, "epoch": 2361} {"train_loss": -12.185003280639648, "global_step": 396778, "epoch": 2361} {"train_loss": -12.234869003295898, "global_step": 396779, "epoch": 2361} {"train_loss": -12.311334609985352, "global_step": 396780, "epoch": 2361} {"train_loss": -12.303698539733887, "global_step": 396781, "epoch": 2361} {"train_loss": -12.343242645263672, "global_step": 396782, "epoch": 2361} {"train_loss": -12.145328521728516, "global_step": 396783, "epoch": 2361} {"train_loss": -12.459214210510254, "global_step": 396784, "epoch": 2361} {"train_loss": -11.929438591003418, "global_step": 396785, "epoch": 2361} {"train_loss": -12.40500545501709, "global_step": 396786, "epoch": 2361} {"train_loss": -12.058233261108398, "global_step": 396787, "epoch": 2361} {"train_loss": -11.779254913330078, "global_step": 396788, "epoch": 2361} {"train_loss": -12.108017921447754, "global_step": 396789, "epoch": 2361} {"train_loss": -12.32720947265625, "global_step": 396790, "epoch": 2361} {"train_loss": -12.443502426147461, "global_step": 396791, "epoch": 2361} {"train_loss": -12.402812957763672, "global_step": 396792, "epoch": 2361} {"train_loss": -12.606376647949219, "global_step": 396793, "epoch": 2361} {"train_loss": -12.56937313079834, "global_step": 396794, "epoch": 2361} {"train_loss": -12.531780242919922, "global_step": 396795, "epoch": 2361} {"train_loss": -12.624666213989258, "global_step": 396796, "epoch": 2361} {"train_loss": -12.670772552490234, "global_step": 396797, "epoch": 2361} {"train_loss": -12.390015602111816, "global_step": 396798, "epoch": 2361} {"train_loss": -12.494720458984375, "global_step": 396799, "epoch": 2361} {"train_loss": -12.649532318115234, "global_step": 396800, "epoch": 2361} {"train_loss": -12.34900188446045, "global_step": 396801, "epoch": 2361} {"train_loss": -12.368877410888672, "global_step": 396802, "epoch": 2361} {"train_loss": -12.457072257995605, "global_step": 396803, "epoch": 2361} {"train_loss": -12.642059326171875, "global_step": 396804, "epoch": 2361} {"train_loss": -12.556071281433105, "global_step": 396805, "epoch": 2361} {"train_loss": -12.601768493652344, "global_step": 396806, "epoch": 2361} {"train_loss": -12.11458969116211, "global_step": 396807, "epoch": 2361} {"train_loss": -12.224420547485352, "global_step": 396808, "epoch": 2361} {"train_loss": -12.506087303161621, "global_step": 396809, "epoch": 2361} {"train_loss": -11.865520477294922, "global_step": 396810, "epoch": 2361} {"train_loss": -12.512877464294434, "global_step": 396811, "epoch": 2361} {"train_loss": -11.948346138000488, "global_step": 396812, "epoch": 2361} {"train_loss": -10.740278244018555, "global_step": 396813, "epoch": 2361} {"train_loss": -12.577531814575195, "global_step": 396814, "epoch": 2361} {"train_loss": -11.986056015605019, "global_step": 396815, "epoch": 2361, "val_loss": 293089.0} {"train_loss": -10.312822341918945, "global_step": 396816, "epoch": 2362} {"train_loss": -11.082228660583496, "global_step": 396817, "epoch": 2362} {"train_loss": -9.342560768127441, "global_step": 396818, "epoch": 2362} {"train_loss": -11.139512062072754, "global_step": 396819, "epoch": 2362} {"train_loss": -9.560558319091797, "global_step": 396820, "epoch": 2362} {"train_loss": -11.324645042419434, "global_step": 396821, "epoch": 2362} {"train_loss": -8.904050827026367, "global_step": 396822, "epoch": 2362} {"train_loss": -9.6315279006958, "global_step": 396823, "epoch": 2362} {"train_loss": -7.335254669189453, "global_step": 396824, "epoch": 2362} {"train_loss": -10.11463737487793, "global_step": 396825, "epoch": 2362} {"train_loss": -8.527915954589844, "global_step": 396826, "epoch": 2362} {"train_loss": -8.370096206665039, "global_step": 396827, "epoch": 2362} {"train_loss": -10.03184986114502, "global_step": 396828, "epoch": 2362} {"train_loss": -10.04299259185791, "global_step": 396829, "epoch": 2362} {"train_loss": -8.886889457702637, "global_step": 396830, "epoch": 2362} {"train_loss": -10.406624794006348, "global_step": 396831, "epoch": 2362} {"train_loss": -11.456413269042969, "global_step": 396832, "epoch": 2362} {"train_loss": -9.601813316345215, "global_step": 396833, "epoch": 2362} {"train_loss": -9.769548416137695, "global_step": 396834, "epoch": 2362} {"train_loss": -10.560065269470215, "global_step": 396835, "epoch": 2362} {"train_loss": -10.982027053833008, "global_step": 396836, "epoch": 2362} {"train_loss": -10.44843864440918, "global_step": 396837, "epoch": 2362} {"train_loss": -11.27174186706543, "global_step": 396838, "epoch": 2362} {"train_loss": -9.812625885009766, "global_step": 396839, "epoch": 2362} {"train_loss": -9.319156646728516, "global_step": 396840, "epoch": 2362} {"train_loss": -11.342041015625, "global_step": 396841, "epoch": 2362} {"train_loss": -9.982895851135254, "global_step": 396842, "epoch": 2362} {"train_loss": -8.850698471069336, "global_step": 396843, "epoch": 2362} {"train_loss": -10.331789016723633, "global_step": 396844, "epoch": 2362} {"train_loss": -10.19820785522461, "global_step": 396845, "epoch": 2362} {"train_loss": -10.65695858001709, "global_step": 396846, "epoch": 2362} {"train_loss": -9.550224304199219, "global_step": 396847, "epoch": 2362} {"train_loss": -9.709957122802734, "global_step": 396848, "epoch": 2362} {"train_loss": -10.808879852294922, "global_step": 396849, "epoch": 2362} {"train_loss": -10.396211624145508, "global_step": 396850, "epoch": 2362} {"train_loss": -9.55229663848877, "global_step": 396851, "epoch": 2362} {"train_loss": -10.865300178527832, "global_step": 396852, "epoch": 2362} {"train_loss": -11.3897705078125, "global_step": 396853, "epoch": 2362} {"train_loss": -11.088238716125488, "global_step": 396854, "epoch": 2362} {"train_loss": -11.084686279296875, "global_step": 396855, "epoch": 2362} {"train_loss": -11.396284103393555, "global_step": 396856, "epoch": 2362} {"train_loss": -10.621578216552734, "global_step": 396857, "epoch": 2362} {"train_loss": -11.0050630569458, "global_step": 396858, "epoch": 2362} {"train_loss": -11.694272994995117, "global_step": 396859, "epoch": 2362} {"train_loss": -11.481377601623535, "global_step": 396860, "epoch": 2362} {"train_loss": -11.397672653198242, "global_step": 396861, "epoch": 2362} {"train_loss": -11.837789535522461, "global_step": 396862, "epoch": 2362} {"train_loss": -11.771080017089844, "global_step": 396863, "epoch": 2362} {"train_loss": -11.613748550415039, "global_step": 396864, "epoch": 2362} {"train_loss": -11.551633834838867, "global_step": 396865, "epoch": 2362} {"train_loss": -11.79106330871582, "global_step": 396866, "epoch": 2362} {"train_loss": -11.59501838684082, "global_step": 396867, "epoch": 2362} {"train_loss": -11.726774215698242, "global_step": 396868, "epoch": 2362} {"train_loss": -11.816359519958496, "global_step": 396869, "epoch": 2362} {"train_loss": -11.790433883666992, "global_step": 396870, "epoch": 2362} {"train_loss": -11.816061019897461, "global_step": 396871, "epoch": 2362} {"train_loss": -11.874961853027344, "global_step": 396872, "epoch": 2362} {"train_loss": -11.722183227539062, "global_step": 396873, "epoch": 2362} {"train_loss": -11.909664154052734, "global_step": 396874, "epoch": 2362} {"train_loss": -12.014537811279297, "global_step": 396875, "epoch": 2362} {"train_loss": -11.881970405578613, "global_step": 396876, "epoch": 2362} {"train_loss": -12.192848205566406, "global_step": 396877, "epoch": 2362} {"train_loss": -11.970606803894043, "global_step": 396878, "epoch": 2362} {"train_loss": -11.906027793884277, "global_step": 396879, "epoch": 2362} {"train_loss": -12.200989723205566, "global_step": 396880, "epoch": 2362} {"train_loss": -12.05177116394043, "global_step": 396881, "epoch": 2362} {"train_loss": -12.12623405456543, "global_step": 396882, "epoch": 2362} {"train_loss": -12.000956535339355, "global_step": 396883, "epoch": 2362} {"train_loss": -11.94132137298584, "global_step": 396884, "epoch": 2362} {"train_loss": -11.963228225708008, "global_step": 396885, "epoch": 2362} {"train_loss": -12.140106201171875, "global_step": 396886, "epoch": 2362} {"train_loss": -12.293598175048828, "global_step": 396887, "epoch": 2362} {"train_loss": -12.414346694946289, "global_step": 396888, "epoch": 2362} {"train_loss": -12.37037467956543, "global_step": 396889, "epoch": 2362} {"train_loss": -12.247315406799316, "global_step": 396890, "epoch": 2362} {"train_loss": -12.215044021606445, "global_step": 396891, "epoch": 2362} {"train_loss": -12.365713119506836, "global_step": 396892, "epoch": 2362} {"train_loss": -12.446939468383789, "global_step": 396893, "epoch": 2362} {"train_loss": -12.323482513427734, "global_step": 396894, "epoch": 2362} {"train_loss": -12.16761589050293, "global_step": 396895, "epoch": 2362} {"train_loss": -12.380857467651367, "global_step": 396896, "epoch": 2362} {"train_loss": -12.246707916259766, "global_step": 396897, "epoch": 2362} {"train_loss": -12.33961296081543, "global_step": 396898, "epoch": 2362} {"train_loss": -12.151206016540527, "global_step": 396899, "epoch": 2362} {"train_loss": -12.352139472961426, "global_step": 396900, "epoch": 2362} {"train_loss": -12.244551658630371, "global_step": 396901, "epoch": 2362} {"train_loss": -12.455639839172363, "global_step": 396902, "epoch": 2362} {"train_loss": -12.165127754211426, "global_step": 396903, "epoch": 2362} {"train_loss": -12.528189659118652, "global_step": 396904, "epoch": 2362} {"train_loss": -12.351970672607422, "global_step": 396905, "epoch": 2362} {"train_loss": -12.588424682617188, "global_step": 396906, "epoch": 2362} {"train_loss": -12.361013412475586, "global_step": 396907, "epoch": 2362} {"train_loss": -12.391318321228027, "global_step": 396908, "epoch": 2362} {"train_loss": -12.43971061706543, "global_step": 396909, "epoch": 2362} {"train_loss": -12.368461608886719, "global_step": 396910, "epoch": 2362} {"train_loss": -12.276275634765625, "global_step": 396911, "epoch": 2362} {"train_loss": -12.282699584960938, "global_step": 396912, "epoch": 2362} {"train_loss": -12.598531723022461, "global_step": 396913, "epoch": 2362} {"train_loss": -12.428528785705566, "global_step": 396914, "epoch": 2362} {"train_loss": -12.444618225097656, "global_step": 396915, "epoch": 2362} {"train_loss": -12.36783218383789, "global_step": 396916, "epoch": 2362} {"train_loss": -12.398139953613281, "global_step": 396917, "epoch": 2362} {"train_loss": -12.513679504394531, "global_step": 396918, "epoch": 2362} {"train_loss": -12.56640625, "global_step": 396919, "epoch": 2362} {"train_loss": -12.58677864074707, "global_step": 396920, "epoch": 2362} {"train_loss": -12.345014572143555, "global_step": 396921, "epoch": 2362} {"train_loss": -12.530033111572266, "global_step": 396922, "epoch": 2362} {"train_loss": -12.551806449890137, "global_step": 396923, "epoch": 2362} {"train_loss": -12.085107803344727, "global_step": 396924, "epoch": 2362} {"train_loss": -12.063720703125, "global_step": 396925, "epoch": 2362} {"train_loss": -12.698251724243164, "global_step": 396926, "epoch": 2362} {"train_loss": -12.286859512329102, "global_step": 396927, "epoch": 2362} {"train_loss": -12.423866271972656, "global_step": 396928, "epoch": 2362} {"train_loss": -12.139092445373535, "global_step": 396929, "epoch": 2362} {"train_loss": -11.694646835327148, "global_step": 396930, "epoch": 2362} {"train_loss": -11.965553283691406, "global_step": 396931, "epoch": 2362} {"train_loss": -12.280871391296387, "global_step": 396932, "epoch": 2362} {"train_loss": -12.020960807800293, "global_step": 396933, "epoch": 2362} {"train_loss": -11.629093170166016, "global_step": 396934, "epoch": 2362} {"train_loss": -12.001462936401367, "global_step": 396935, "epoch": 2362} {"train_loss": -10.394760131835938, "global_step": 396936, "epoch": 2362} {"train_loss": -10.35753059387207, "global_step": 396937, "epoch": 2362} {"train_loss": -12.523849487304688, "global_step": 396938, "epoch": 2362} {"train_loss": -9.994645118713379, "global_step": 396939, "epoch": 2362} {"train_loss": -12.140168190002441, "global_step": 396940, "epoch": 2362} {"train_loss": -11.003959655761719, "global_step": 396941, "epoch": 2362} {"train_loss": -10.150909423828125, "global_step": 396942, "epoch": 2362} {"train_loss": -11.874984741210938, "global_step": 396943, "epoch": 2362} {"train_loss": -10.762325286865234, "global_step": 396944, "epoch": 2362} {"train_loss": -11.82867431640625, "global_step": 396945, "epoch": 2362} {"train_loss": -12.194334030151367, "global_step": 396946, "epoch": 2362} {"train_loss": -11.30309772491455, "global_step": 396947, "epoch": 2362} {"train_loss": -12.366182327270508, "global_step": 396948, "epoch": 2362} {"train_loss": -11.351517677307129, "global_step": 396949, "epoch": 2362} {"train_loss": -12.061958312988281, "global_step": 396950, "epoch": 2362} {"train_loss": -11.951169967651367, "global_step": 396951, "epoch": 2362} {"train_loss": -11.93183422088623, "global_step": 396952, "epoch": 2362} {"train_loss": -12.055309295654297, "global_step": 396953, "epoch": 2362} {"train_loss": -11.930484771728516, "global_step": 396954, "epoch": 2362} {"train_loss": -11.816707611083984, "global_step": 396955, "epoch": 2362} {"train_loss": -11.895397186279297, "global_step": 396956, "epoch": 2362} {"train_loss": -11.40043830871582, "global_step": 396957, "epoch": 2362} {"train_loss": -12.299858093261719, "global_step": 396958, "epoch": 2362} {"train_loss": -11.356891632080078, "global_step": 396959, "epoch": 2362} {"train_loss": -12.379179000854492, "global_step": 396960, "epoch": 2362} {"train_loss": -11.67520523071289, "global_step": 396961, "epoch": 2362} {"train_loss": -12.120418548583984, "global_step": 396962, "epoch": 2362} {"train_loss": -11.441699981689453, "global_step": 396963, "epoch": 2362} {"train_loss": -11.445316314697266, "global_step": 396964, "epoch": 2362} {"train_loss": -11.711639404296875, "global_step": 396965, "epoch": 2362} {"train_loss": -11.475116729736328, "global_step": 396966, "epoch": 2362} {"train_loss": -11.834981918334961, "global_step": 396967, "epoch": 2362} {"train_loss": -12.350000381469727, "global_step": 396968, "epoch": 2362} {"train_loss": -12.074355125427246, "global_step": 396969, "epoch": 2362} {"train_loss": -12.075873374938965, "global_step": 396970, "epoch": 2362} {"train_loss": -12.208285331726074, "global_step": 396971, "epoch": 2362} {"train_loss": -12.286638259887695, "global_step": 396972, "epoch": 2362} {"train_loss": -12.03146743774414, "global_step": 396973, "epoch": 2362} {"train_loss": -12.21996784210205, "global_step": 396974, "epoch": 2362} {"train_loss": -12.219144821166992, "global_step": 396975, "epoch": 2362} {"train_loss": -11.707916259765625, "global_step": 396976, "epoch": 2362} {"train_loss": -12.11310863494873, "global_step": 396977, "epoch": 2362} {"train_loss": -12.10835075378418, "global_step": 396978, "epoch": 2362} {"train_loss": -12.224526405334473, "global_step": 396979, "epoch": 2362} {"train_loss": -12.418071746826172, "global_step": 396980, "epoch": 2362} {"train_loss": -12.427050590515137, "global_step": 396981, "epoch": 2362} {"train_loss": -12.013223648071289, "global_step": 396982, "epoch": 2362} {"train_loss": -11.53494838305882, "global_step": 396983, "epoch": 2362, "val_loss": 292613.6875} {"train_loss": -12.037444114685059, "global_step": 396984, "epoch": 2363} {"train_loss": -12.354174613952637, "global_step": 396985, "epoch": 2363} {"train_loss": -12.003179550170898, "global_step": 396986, "epoch": 2363} {"train_loss": -12.349891662597656, "global_step": 396987, "epoch": 2363} {"train_loss": -12.319395065307617, "global_step": 396988, "epoch": 2363} {"train_loss": -11.918563842773438, "global_step": 396989, "epoch": 2363} {"train_loss": -12.239656448364258, "global_step": 396990, "epoch": 2363} {"train_loss": -12.093374252319336, "global_step": 396991, "epoch": 2363} {"train_loss": -12.081418991088867, "global_step": 396992, "epoch": 2363} {"train_loss": -12.238157272338867, "global_step": 396993, "epoch": 2363} {"train_loss": -11.950180053710938, "global_step": 396994, "epoch": 2363} {"train_loss": -11.855987548828125, "global_step": 396995, "epoch": 2363} {"train_loss": -12.75956916809082, "global_step": 396996, "epoch": 2363} {"train_loss": -11.946300506591797, "global_step": 396997, "epoch": 2363} {"train_loss": -12.378782272338867, "global_step": 396998, "epoch": 2363} {"train_loss": -11.661648750305176, "global_step": 396999, "epoch": 2363} {"train_loss": -11.475847244262695, "global_step": 397000, "epoch": 2363} {"train_loss": -12.182088851928711, "global_step": 397001, "epoch": 2363} {"train_loss": -10.866418838500977, "global_step": 397002, "epoch": 2363} {"train_loss": -11.572577476501465, "global_step": 397003, "epoch": 2363} {"train_loss": -12.453479766845703, "global_step": 397004, "epoch": 2363} {"train_loss": -11.570446014404297, "global_step": 397005, "epoch": 2363} {"train_loss": -12.275032043457031, "global_step": 397006, "epoch": 2363} {"train_loss": -12.117023468017578, "global_step": 397007, "epoch": 2363} {"train_loss": -12.50366497039795, "global_step": 397008, "epoch": 2363} {"train_loss": -12.522432327270508, "global_step": 397009, "epoch": 2363} {"train_loss": -12.081611633300781, "global_step": 397010, "epoch": 2363} {"train_loss": -12.4447021484375, "global_step": 397011, "epoch": 2363} {"train_loss": -12.2667875289917, "global_step": 397012, "epoch": 2363} {"train_loss": -12.181703567504883, "global_step": 397013, "epoch": 2363} {"train_loss": -12.658035278320312, "global_step": 397014, "epoch": 2363} {"train_loss": -12.446853637695312, "global_step": 397015, "epoch": 2363} {"train_loss": -12.450868606567383, "global_step": 397016, "epoch": 2363} {"train_loss": -12.42121696472168, "global_step": 397017, "epoch": 2363} {"train_loss": -12.244102478027344, "global_step": 397018, "epoch": 2363} {"train_loss": -12.634174346923828, "global_step": 397019, "epoch": 2363} {"train_loss": -12.08615493774414, "global_step": 397020, "epoch": 2363} {"train_loss": -12.416816711425781, "global_step": 397021, "epoch": 2363} {"train_loss": -12.515539169311523, "global_step": 397022, "epoch": 2363} {"train_loss": -12.223029136657715, "global_step": 397023, "epoch": 2363} {"train_loss": -12.39918327331543, "global_step": 397024, "epoch": 2363} {"train_loss": -12.364180564880371, "global_step": 397025, "epoch": 2363} {"train_loss": -12.658812522888184, "global_step": 397026, "epoch": 2363} {"train_loss": -12.436132431030273, "global_step": 397027, "epoch": 2363} {"train_loss": -12.524267196655273, "global_step": 397028, "epoch": 2363} {"train_loss": -12.48948860168457, "global_step": 397029, "epoch": 2363} {"train_loss": -12.68666934967041, "global_step": 397030, "epoch": 2363} {"train_loss": -12.524173736572266, "global_step": 397031, "epoch": 2363} {"train_loss": -12.606212615966797, "global_step": 397032, "epoch": 2363} {"train_loss": -12.510092735290527, "global_step": 397033, "epoch": 2363} {"train_loss": -12.536008834838867, "global_step": 397034, "epoch": 2363} {"train_loss": -12.38064956665039, "global_step": 397035, "epoch": 2363} {"train_loss": -12.78480339050293, "global_step": 397036, "epoch": 2363} {"train_loss": -12.213175773620605, "global_step": 397037, "epoch": 2363} {"train_loss": -12.593098640441895, "global_step": 397038, "epoch": 2363} {"train_loss": -12.518569946289062, "global_step": 397039, "epoch": 2363} {"train_loss": -12.433370590209961, "global_step": 397040, "epoch": 2363} {"train_loss": -12.440631866455078, "global_step": 397041, "epoch": 2363} {"train_loss": -12.459896087646484, "global_step": 397042, "epoch": 2363} {"train_loss": -12.67198657989502, "global_step": 397043, "epoch": 2363} {"train_loss": -12.42103385925293, "global_step": 397044, "epoch": 2363} {"train_loss": -12.485628128051758, "global_step": 397045, "epoch": 2363} {"train_loss": -12.699414253234863, "global_step": 397046, "epoch": 2363} {"train_loss": -12.461384773254395, "global_step": 397047, "epoch": 2363} {"train_loss": -12.509459495544434, "global_step": 397048, "epoch": 2363} {"train_loss": -12.811527252197266, "global_step": 397049, "epoch": 2363} {"train_loss": -12.080399513244629, "global_step": 397050, "epoch": 2363} {"train_loss": -12.641841888427734, "global_step": 397051, "epoch": 2363} {"train_loss": -12.307794570922852, "global_step": 397052, "epoch": 2363} {"train_loss": -11.89294147491455, "global_step": 397053, "epoch": 2363} {"train_loss": -12.714717864990234, "global_step": 397054, "epoch": 2363} {"train_loss": -12.20541000366211, "global_step": 397055, "epoch": 2363} {"train_loss": -10.811095237731934, "global_step": 397056, "epoch": 2363} {"train_loss": -10.568416595458984, "global_step": 397057, "epoch": 2363} {"train_loss": -12.134359359741211, "global_step": 397058, "epoch": 2363} {"train_loss": -12.21316909790039, "global_step": 397059, "epoch": 2363} {"train_loss": -12.42428970336914, "global_step": 397060, "epoch": 2363} {"train_loss": -12.422203063964844, "global_step": 397061, "epoch": 2363} {"train_loss": -12.497903823852539, "global_step": 397062, "epoch": 2363} {"train_loss": -12.35311508178711, "global_step": 397063, "epoch": 2363} {"train_loss": -12.197715759277344, "global_step": 397064, "epoch": 2363} {"train_loss": -11.853097915649414, "global_step": 397065, "epoch": 2363} {"train_loss": -12.92596435546875, "global_step": 397066, "epoch": 2363} {"train_loss": -12.341880798339844, "global_step": 397067, "epoch": 2363} {"train_loss": -12.559343338012695, "global_step": 397068, "epoch": 2363} {"train_loss": -12.707562446594238, "global_step": 397069, "epoch": 2363} {"train_loss": -12.408222198486328, "global_step": 397070, "epoch": 2363} {"train_loss": -12.274504661560059, "global_step": 397071, "epoch": 2363} {"train_loss": -12.698044776916504, "global_step": 397072, "epoch": 2363} {"train_loss": -12.5291166305542, "global_step": 397073, "epoch": 2363} {"train_loss": -12.286905288696289, "global_step": 397074, "epoch": 2363} {"train_loss": -12.401488304138184, "global_step": 397075, "epoch": 2363} {"train_loss": -12.440738677978516, "global_step": 397076, "epoch": 2363} {"train_loss": -12.382832527160645, "global_step": 397077, "epoch": 2363} {"train_loss": -12.380406379699707, "global_step": 397078, "epoch": 2363} {"train_loss": -12.336849212646484, "global_step": 397079, "epoch": 2363} {"train_loss": -12.163423538208008, "global_step": 397080, "epoch": 2363} {"train_loss": -12.091747283935547, "global_step": 397081, "epoch": 2363} {"train_loss": -12.108307838439941, "global_step": 397082, "epoch": 2363} {"train_loss": -12.497014045715332, "global_step": 397083, "epoch": 2363} {"train_loss": -12.019579887390137, "global_step": 397084, "epoch": 2363} {"train_loss": -11.414306640625, "global_step": 397085, "epoch": 2363} {"train_loss": -11.939824104309082, "global_step": 397086, "epoch": 2363} {"train_loss": -11.978363037109375, "global_step": 397087, "epoch": 2363} {"train_loss": -9.983755111694336, "global_step": 397088, "epoch": 2363} {"train_loss": -12.226896286010742, "global_step": 397089, "epoch": 2363} {"train_loss": -12.013174057006836, "global_step": 397090, "epoch": 2363} {"train_loss": -12.006468772888184, "global_step": 397091, "epoch": 2363} {"train_loss": -12.326360702514648, "global_step": 397092, "epoch": 2363} {"train_loss": -11.901906967163086, "global_step": 397093, "epoch": 2363} {"train_loss": -12.013797760009766, "global_step": 397094, "epoch": 2363} {"train_loss": -12.003419876098633, "global_step": 397095, "epoch": 2363} {"train_loss": -12.028520584106445, "global_step": 397096, "epoch": 2363} {"train_loss": -11.634819984436035, "global_step": 397097, "epoch": 2363} {"train_loss": -11.6946382522583, "global_step": 397098, "epoch": 2363} {"train_loss": -12.518563270568848, "global_step": 397099, "epoch": 2363} {"train_loss": -11.583816528320312, "global_step": 397100, "epoch": 2363} {"train_loss": -11.129900932312012, "global_step": 397101, "epoch": 2363} {"train_loss": -11.838004112243652, "global_step": 397102, "epoch": 2363} {"train_loss": -11.739713668823242, "global_step": 397103, "epoch": 2363} {"train_loss": -10.560502052307129, "global_step": 397104, "epoch": 2363} {"train_loss": -12.118492126464844, "global_step": 397105, "epoch": 2363} {"train_loss": -10.541339874267578, "global_step": 397106, "epoch": 2363} {"train_loss": -11.143099784851074, "global_step": 397107, "epoch": 2363} {"train_loss": -12.107282638549805, "global_step": 397108, "epoch": 2363} {"train_loss": -10.272714614868164, "global_step": 397109, "epoch": 2363} {"train_loss": -12.02976131439209, "global_step": 397110, "epoch": 2363} {"train_loss": -10.925422668457031, "global_step": 397111, "epoch": 2363} {"train_loss": -10.25340747833252, "global_step": 397112, "epoch": 2363} {"train_loss": -11.852952003479004, "global_step": 397113, "epoch": 2363} {"train_loss": -11.105329513549805, "global_step": 397114, "epoch": 2363} {"train_loss": -12.076213836669922, "global_step": 397115, "epoch": 2363} {"train_loss": -11.41530990600586, "global_step": 397116, "epoch": 2363} {"train_loss": -12.373059272766113, "global_step": 397117, "epoch": 2363} {"train_loss": -11.332109451293945, "global_step": 397118, "epoch": 2363} {"train_loss": -12.13874626159668, "global_step": 397119, "epoch": 2363} {"train_loss": -11.199480056762695, "global_step": 397120, "epoch": 2363} {"train_loss": -11.817161560058594, "global_step": 397121, "epoch": 2363} {"train_loss": -11.880426406860352, "global_step": 397122, "epoch": 2363} {"train_loss": -11.672941207885742, "global_step": 397123, "epoch": 2363} {"train_loss": -11.814056396484375, "global_step": 397124, "epoch": 2363} {"train_loss": -11.727243423461914, "global_step": 397125, "epoch": 2363} {"train_loss": -12.052206039428711, "global_step": 397126, "epoch": 2363} {"train_loss": -11.812788009643555, "global_step": 397127, "epoch": 2363} {"train_loss": -11.94206428527832, "global_step": 397128, "epoch": 2363} {"train_loss": -12.017651557922363, "global_step": 397129, "epoch": 2363} {"train_loss": -11.525701522827148, "global_step": 397130, "epoch": 2363} {"train_loss": -11.632299423217773, "global_step": 397131, "epoch": 2363} {"train_loss": -11.734598159790039, "global_step": 397132, "epoch": 2363} {"train_loss": -11.65842056274414, "global_step": 397133, "epoch": 2363} {"train_loss": -11.841455459594727, "global_step": 397134, "epoch": 2363} {"train_loss": -11.775554656982422, "global_step": 397135, "epoch": 2363} {"train_loss": -11.9092378616333, "global_step": 397136, "epoch": 2363} {"train_loss": -12.113039016723633, "global_step": 397137, "epoch": 2363} {"train_loss": -11.933664321899414, "global_step": 397138, "epoch": 2363} {"train_loss": -12.273977279663086, "global_step": 397139, "epoch": 2363} {"train_loss": -12.234881401062012, "global_step": 397140, "epoch": 2363} {"train_loss": -11.967555046081543, "global_step": 397141, "epoch": 2363} {"train_loss": -11.935209274291992, "global_step": 397142, "epoch": 2363} {"train_loss": -12.156160354614258, "global_step": 397143, "epoch": 2363} {"train_loss": -12.27386474609375, "global_step": 397144, "epoch": 2363} {"train_loss": -12.220352172851562, "global_step": 397145, "epoch": 2363} {"train_loss": -11.566949844360352, "global_step": 397146, "epoch": 2363} {"train_loss": -12.447879791259766, "global_step": 397147, "epoch": 2363} {"train_loss": -11.649539947509766, "global_step": 397148, "epoch": 2363} {"train_loss": -12.025081634521484, "global_step": 397149, "epoch": 2363} {"train_loss": -11.823958396911621, "global_step": 397150, "epoch": 2363} {"train_loss": -12.068258796419416, "global_step": 397151, "epoch": 2363, "val_loss": 292728.65625} {"train_loss": -11.885797500610352, "global_step": 397152, "epoch": 2364} {"train_loss": -11.825887680053711, "global_step": 397153, "epoch": 2364} {"train_loss": -11.855644226074219, "global_step": 397154, "epoch": 2364} {"train_loss": -11.579472541809082, "global_step": 397155, "epoch": 2364} {"train_loss": -11.460963249206543, "global_step": 397156, "epoch": 2364} {"train_loss": -11.727556228637695, "global_step": 397157, "epoch": 2364} {"train_loss": -11.948224067687988, "global_step": 397158, "epoch": 2364} {"train_loss": -11.952156066894531, "global_step": 397159, "epoch": 2364} {"train_loss": -11.84201431274414, "global_step": 397160, "epoch": 2364} {"train_loss": -12.042570114135742, "global_step": 397161, "epoch": 2364} {"train_loss": -12.074800491333008, "global_step": 397162, "epoch": 2364} {"train_loss": -11.782648086547852, "global_step": 397163, "epoch": 2364} {"train_loss": -11.937959671020508, "global_step": 397164, "epoch": 2364} {"train_loss": -12.04564380645752, "global_step": 397165, "epoch": 2364} {"train_loss": -11.912278175354004, "global_step": 397166, "epoch": 2364} {"train_loss": -12.332239151000977, "global_step": 397167, "epoch": 2364} {"train_loss": -12.084080696105957, "global_step": 397168, "epoch": 2364} {"train_loss": -12.330526351928711, "global_step": 397169, "epoch": 2364} {"train_loss": -12.182165145874023, "global_step": 397170, "epoch": 2364} {"train_loss": -11.868438720703125, "global_step": 397171, "epoch": 2364} {"train_loss": -12.270288467407227, "global_step": 397172, "epoch": 2364} {"train_loss": -12.25373363494873, "global_step": 397173, "epoch": 2364} {"train_loss": -12.141942024230957, "global_step": 397174, "epoch": 2364} {"train_loss": -12.27245044708252, "global_step": 397175, "epoch": 2364} {"train_loss": -11.638145446777344, "global_step": 397176, "epoch": 2364} {"train_loss": -12.427268981933594, "global_step": 397177, "epoch": 2364} {"train_loss": -11.781615257263184, "global_step": 397178, "epoch": 2364} {"train_loss": -12.436046600341797, "global_step": 397179, "epoch": 2364} {"train_loss": -12.008491516113281, "global_step": 397180, "epoch": 2364} {"train_loss": -11.913390159606934, "global_step": 397181, "epoch": 2364} {"train_loss": -11.937332153320312, "global_step": 397182, "epoch": 2364} {"train_loss": -11.400704383850098, "global_step": 397183, "epoch": 2364} {"train_loss": -11.701740264892578, "global_step": 397184, "epoch": 2364} {"train_loss": -11.807642936706543, "global_step": 397185, "epoch": 2364} {"train_loss": -11.104158401489258, "global_step": 397186, "epoch": 2364} {"train_loss": -12.12293529510498, "global_step": 397187, "epoch": 2364} {"train_loss": -11.454895973205566, "global_step": 397188, "epoch": 2364} {"train_loss": -11.469730377197266, "global_step": 397189, "epoch": 2364} {"train_loss": -12.010501861572266, "global_step": 397190, "epoch": 2364} {"train_loss": -11.638057708740234, "global_step": 397191, "epoch": 2364} {"train_loss": -11.4784574508667, "global_step": 397192, "epoch": 2364} {"train_loss": -11.634352684020996, "global_step": 397193, "epoch": 2364} {"train_loss": -11.859620094299316, "global_step": 397194, "epoch": 2364} {"train_loss": -11.546342849731445, "global_step": 397195, "epoch": 2364} {"train_loss": -11.58839225769043, "global_step": 397196, "epoch": 2364} {"train_loss": -12.308747291564941, "global_step": 397197, "epoch": 2364} {"train_loss": -11.749460220336914, "global_step": 397198, "epoch": 2364} {"train_loss": -12.43096923828125, "global_step": 397199, "epoch": 2364} {"train_loss": -10.929939270019531, "global_step": 397200, "epoch": 2364} {"train_loss": -12.372873306274414, "global_step": 397201, "epoch": 2364} {"train_loss": -11.079498291015625, "global_step": 397202, "epoch": 2364} {"train_loss": -11.906290054321289, "global_step": 397203, "epoch": 2364} {"train_loss": -11.79261589050293, "global_step": 397204, "epoch": 2364} {"train_loss": -11.040371894836426, "global_step": 397205, "epoch": 2364} {"train_loss": -11.83842945098877, "global_step": 397206, "epoch": 2364} {"train_loss": -10.281573295593262, "global_step": 397207, "epoch": 2364} {"train_loss": -11.119827270507812, "global_step": 397208, "epoch": 2364} {"train_loss": -11.799553871154785, "global_step": 397209, "epoch": 2364} {"train_loss": -11.194524765014648, "global_step": 397210, "epoch": 2364} {"train_loss": -11.763313293457031, "global_step": 397211, "epoch": 2364} {"train_loss": -11.786858558654785, "global_step": 397212, "epoch": 2364} {"train_loss": -11.348997116088867, "global_step": 397213, "epoch": 2364} {"train_loss": -12.20603084564209, "global_step": 397214, "epoch": 2364} {"train_loss": -10.851662635803223, "global_step": 397215, "epoch": 2364} {"train_loss": -10.789632797241211, "global_step": 397216, "epoch": 2364} {"train_loss": -11.796783447265625, "global_step": 397217, "epoch": 2364} {"train_loss": -11.083148956298828, "global_step": 397218, "epoch": 2364} {"train_loss": -12.073747634887695, "global_step": 397219, "epoch": 2364} {"train_loss": -11.82031536102295, "global_step": 397220, "epoch": 2364} {"train_loss": -11.870683670043945, "global_step": 397221, "epoch": 2364} {"train_loss": -11.709630966186523, "global_step": 397222, "epoch": 2364} {"train_loss": -12.053525924682617, "global_step": 397223, "epoch": 2364} {"train_loss": -11.536714553833008, "global_step": 397224, "epoch": 2364} {"train_loss": -11.739295959472656, "global_step": 397225, "epoch": 2364} {"train_loss": -12.291170120239258, "global_step": 397226, "epoch": 2364} {"train_loss": -12.027544021606445, "global_step": 397227, "epoch": 2364} {"train_loss": -12.226530075073242, "global_step": 397228, "epoch": 2364} {"train_loss": -11.746259689331055, "global_step": 397229, "epoch": 2364} {"train_loss": -12.179778099060059, "global_step": 397230, "epoch": 2364} {"train_loss": -11.931924819946289, "global_step": 397231, "epoch": 2364} {"train_loss": -12.043233871459961, "global_step": 397232, "epoch": 2364} {"train_loss": -11.893187522888184, "global_step": 397233, "epoch": 2364} {"train_loss": -11.937711715698242, "global_step": 397234, "epoch": 2364} {"train_loss": -12.068086624145508, "global_step": 397235, "epoch": 2364} {"train_loss": -11.8629789352417, "global_step": 397236, "epoch": 2364} {"train_loss": -11.822795867919922, "global_step": 397237, "epoch": 2364} {"train_loss": -11.633208274841309, "global_step": 397238, "epoch": 2364} {"train_loss": -12.355781555175781, "global_step": 397239, "epoch": 2364} {"train_loss": -12.146743774414062, "global_step": 397240, "epoch": 2364} {"train_loss": -12.060107231140137, "global_step": 397241, "epoch": 2364} {"train_loss": -12.250057220458984, "global_step": 397242, "epoch": 2364} {"train_loss": -12.225462913513184, "global_step": 397243, "epoch": 2364} {"train_loss": -12.119239807128906, "global_step": 397244, "epoch": 2364} {"train_loss": -11.821429252624512, "global_step": 397245, "epoch": 2364} {"train_loss": -12.015546798706055, "global_step": 397246, "epoch": 2364} {"train_loss": -11.811318397521973, "global_step": 397247, "epoch": 2364} {"train_loss": -12.242085456848145, "global_step": 397248, "epoch": 2364} {"train_loss": -12.167259216308594, "global_step": 397249, "epoch": 2364} {"train_loss": -12.134065628051758, "global_step": 397250, "epoch": 2364} {"train_loss": -12.01922607421875, "global_step": 397251, "epoch": 2364} {"train_loss": -12.236249923706055, "global_step": 397252, "epoch": 2364} {"train_loss": -12.083868026733398, "global_step": 397253, "epoch": 2364} {"train_loss": -12.371147155761719, "global_step": 397254, "epoch": 2364} {"train_loss": -11.990867614746094, "global_step": 397255, "epoch": 2364} {"train_loss": -12.250099182128906, "global_step": 397256, "epoch": 2364} {"train_loss": -12.17953109741211, "global_step": 397257, "epoch": 2364} {"train_loss": -12.068931579589844, "global_step": 397258, "epoch": 2364} {"train_loss": -11.890312194824219, "global_step": 397259, "epoch": 2364} {"train_loss": -11.914461135864258, "global_step": 397260, "epoch": 2364} {"train_loss": -12.297739028930664, "global_step": 397261, "epoch": 2364} {"train_loss": -12.372797966003418, "global_step": 397262, "epoch": 2364} {"train_loss": -12.34715747833252, "global_step": 397263, "epoch": 2364} {"train_loss": -12.289717674255371, "global_step": 397264, "epoch": 2364} {"train_loss": -12.722463607788086, "global_step": 397265, "epoch": 2364} {"train_loss": -12.222654342651367, "global_step": 397266, "epoch": 2364} {"train_loss": -12.375082969665527, "global_step": 397267, "epoch": 2364} {"train_loss": -12.507173538208008, "global_step": 397268, "epoch": 2364} {"train_loss": -12.274572372436523, "global_step": 397269, "epoch": 2364} {"train_loss": -11.99220085144043, "global_step": 397270, "epoch": 2364} {"train_loss": -12.020074844360352, "global_step": 397271, "epoch": 2364} {"train_loss": -12.215780258178711, "global_step": 397272, "epoch": 2364} {"train_loss": -12.235958099365234, "global_step": 397273, "epoch": 2364} {"train_loss": -12.37752628326416, "global_step": 397274, "epoch": 2364} {"train_loss": -12.161211013793945, "global_step": 397275, "epoch": 2364} {"train_loss": -12.3381986618042, "global_step": 397276, "epoch": 2364} {"train_loss": -12.030523300170898, "global_step": 397277, "epoch": 2364} {"train_loss": -12.208528518676758, "global_step": 397278, "epoch": 2364} {"train_loss": -12.103586196899414, "global_step": 397279, "epoch": 2364} {"train_loss": -12.439090728759766, "global_step": 397280, "epoch": 2364} {"train_loss": -12.177885055541992, "global_step": 397281, "epoch": 2364} {"train_loss": -12.340103149414062, "global_step": 397282, "epoch": 2364} {"train_loss": -12.172149658203125, "global_step": 397283, "epoch": 2364} {"train_loss": -12.439414978027344, "global_step": 397284, "epoch": 2364} {"train_loss": -12.335784912109375, "global_step": 397285, "epoch": 2364} {"train_loss": -12.188965797424316, "global_step": 397286, "epoch": 2364} {"train_loss": -12.233872413635254, "global_step": 397287, "epoch": 2364} {"train_loss": -12.818958282470703, "global_step": 397288, "epoch": 2364} {"train_loss": -12.238663673400879, "global_step": 397289, "epoch": 2364} {"train_loss": -12.20828914642334, "global_step": 397290, "epoch": 2364} {"train_loss": -12.476470947265625, "global_step": 397291, "epoch": 2364} {"train_loss": -12.47252082824707, "global_step": 397292, "epoch": 2364} {"train_loss": -12.347086906433105, "global_step": 397293, "epoch": 2364} {"train_loss": -12.727014541625977, "global_step": 397294, "epoch": 2364} {"train_loss": -12.491788864135742, "global_step": 397295, "epoch": 2364} {"train_loss": -12.739442825317383, "global_step": 397296, "epoch": 2364} {"train_loss": -12.232048034667969, "global_step": 397297, "epoch": 2364} {"train_loss": -12.21531867980957, "global_step": 397298, "epoch": 2364} {"train_loss": -12.648553848266602, "global_step": 397299, "epoch": 2364} {"train_loss": -12.515953063964844, "global_step": 397300, "epoch": 2364} {"train_loss": -12.306464195251465, "global_step": 397301, "epoch": 2364} {"train_loss": -12.708759307861328, "global_step": 397302, "epoch": 2364} {"train_loss": -12.47560977935791, "global_step": 397303, "epoch": 2364} {"train_loss": -12.417083740234375, "global_step": 397304, "epoch": 2364} {"train_loss": -12.124349594116211, "global_step": 397305, "epoch": 2364} {"train_loss": -12.59286117553711, "global_step": 397306, "epoch": 2364} {"train_loss": -12.293365478515625, "global_step": 397307, "epoch": 2364} {"train_loss": -12.252111434936523, "global_step": 397308, "epoch": 2364} {"train_loss": -12.378682136535645, "global_step": 397309, "epoch": 2364} {"train_loss": -12.38979721069336, "global_step": 397310, "epoch": 2364} {"train_loss": -12.432920455932617, "global_step": 397311, "epoch": 2364} {"train_loss": -12.40273666381836, "global_step": 397312, "epoch": 2364} {"train_loss": -12.048620223999023, "global_step": 397313, "epoch": 2364} {"train_loss": -12.063315391540527, "global_step": 397314, "epoch": 2364} {"train_loss": -12.231557846069336, "global_step": 397315, "epoch": 2364} {"train_loss": -12.446627616882324, "global_step": 397316, "epoch": 2364} {"train_loss": -12.626263618469238, "global_step": 397317, "epoch": 2364} {"train_loss": -12.367639541625977, "global_step": 397318, "epoch": 2364} {"train_loss": -12.0330787726811, "global_step": 397319, "epoch": 2364, "val_loss": 297829.1875} {"train_loss": -12.466642379760742, "global_step": 397320, "epoch": 2365} {"train_loss": -12.275468826293945, "global_step": 397321, "epoch": 2365} {"train_loss": -12.594679832458496, "global_step": 397322, "epoch": 2365} {"train_loss": -12.157590866088867, "global_step": 397323, "epoch": 2365} {"train_loss": -12.587034225463867, "global_step": 397324, "epoch": 2365} {"train_loss": -12.16381549835205, "global_step": 397325, "epoch": 2365} {"train_loss": -11.888519287109375, "global_step": 397326, "epoch": 2365} {"train_loss": -12.50265121459961, "global_step": 397327, "epoch": 2365} {"train_loss": -12.602945327758789, "global_step": 397328, "epoch": 2365} {"train_loss": -12.335372924804688, "global_step": 397329, "epoch": 2365} {"train_loss": -11.947294235229492, "global_step": 397330, "epoch": 2365} {"train_loss": -12.315607070922852, "global_step": 397331, "epoch": 2365} {"train_loss": -11.535714149475098, "global_step": 397332, "epoch": 2365} {"train_loss": -10.117035865783691, "global_step": 397333, "epoch": 2365} {"train_loss": -11.577714920043945, "global_step": 397334, "epoch": 2365} {"train_loss": -11.591361999511719, "global_step": 397335, "epoch": 2365} {"train_loss": -11.628231048583984, "global_step": 397336, "epoch": 2365} {"train_loss": -12.132745742797852, "global_step": 397337, "epoch": 2365} {"train_loss": -11.607709884643555, "global_step": 397338, "epoch": 2365} {"train_loss": -11.992919921875, "global_step": 397339, "epoch": 2365} {"train_loss": -12.240338325500488, "global_step": 397340, "epoch": 2365} {"train_loss": -11.868854522705078, "global_step": 397341, "epoch": 2365} {"train_loss": -12.04680061340332, "global_step": 397342, "epoch": 2365} {"train_loss": -11.4974365234375, "global_step": 397343, "epoch": 2365} {"train_loss": -10.945332527160645, "global_step": 397344, "epoch": 2365} {"train_loss": -12.090080261230469, "global_step": 397345, "epoch": 2365} {"train_loss": -12.003938674926758, "global_step": 397346, "epoch": 2365} {"train_loss": -11.497001647949219, "global_step": 397347, "epoch": 2365} {"train_loss": -12.414163589477539, "global_step": 397348, "epoch": 2365} {"train_loss": -11.75931453704834, "global_step": 397349, "epoch": 2365} {"train_loss": -11.932775497436523, "global_step": 397350, "epoch": 2365} {"train_loss": -12.235894203186035, "global_step": 397351, "epoch": 2365} {"train_loss": -11.507144927978516, "global_step": 397352, "epoch": 2365} {"train_loss": -11.741636276245117, "global_step": 397353, "epoch": 2365} {"train_loss": -11.874627113342285, "global_step": 397354, "epoch": 2365} {"train_loss": -11.387295722961426, "global_step": 397355, "epoch": 2365} {"train_loss": -11.817451477050781, "global_step": 397356, "epoch": 2365} {"train_loss": -11.873212814331055, "global_step": 397357, "epoch": 2365} {"train_loss": -11.920391082763672, "global_step": 397358, "epoch": 2365} {"train_loss": -12.333053588867188, "global_step": 397359, "epoch": 2365} {"train_loss": -11.816841125488281, "global_step": 397360, "epoch": 2365} {"train_loss": -12.270889282226562, "global_step": 397361, "epoch": 2365} {"train_loss": -12.013988494873047, "global_step": 397362, "epoch": 2365} {"train_loss": -12.250654220581055, "global_step": 397363, "epoch": 2365} {"train_loss": -12.082260131835938, "global_step": 397364, "epoch": 2365} {"train_loss": -11.712583541870117, "global_step": 397365, "epoch": 2365} {"train_loss": -11.506290435791016, "global_step": 397366, "epoch": 2365} {"train_loss": -12.53299331665039, "global_step": 397367, "epoch": 2365} {"train_loss": -11.315290451049805, "global_step": 397368, "epoch": 2365} {"train_loss": -12.209840774536133, "global_step": 397369, "epoch": 2365} {"train_loss": -12.023186683654785, "global_step": 397370, "epoch": 2365} {"train_loss": -11.648534774780273, "global_step": 397371, "epoch": 2365} {"train_loss": -12.037673950195312, "global_step": 397372, "epoch": 2365} {"train_loss": -11.509095191955566, "global_step": 397373, "epoch": 2365} {"train_loss": -11.853524208068848, "global_step": 397374, "epoch": 2365} {"train_loss": -10.89316177368164, "global_step": 397375, "epoch": 2365} {"train_loss": -11.851890563964844, "global_step": 397376, "epoch": 2365} {"train_loss": -11.124984741210938, "global_step": 397377, "epoch": 2365} {"train_loss": -11.13232421875, "global_step": 397378, "epoch": 2365} {"train_loss": -11.842247009277344, "global_step": 397379, "epoch": 2365} {"train_loss": -10.921880722045898, "global_step": 397380, "epoch": 2365} {"train_loss": -11.650919914245605, "global_step": 397381, "epoch": 2365} {"train_loss": -10.473983764648438, "global_step": 397382, "epoch": 2365} {"train_loss": -11.909711837768555, "global_step": 397383, "epoch": 2365} {"train_loss": -10.732292175292969, "global_step": 397384, "epoch": 2365} {"train_loss": -11.599637985229492, "global_step": 397385, "epoch": 2365} {"train_loss": -10.505744934082031, "global_step": 397386, "epoch": 2365} {"train_loss": -11.234268188476562, "global_step": 397387, "epoch": 2365} {"train_loss": -11.483692169189453, "global_step": 397388, "epoch": 2365} {"train_loss": -11.813262939453125, "global_step": 397389, "epoch": 2365} {"train_loss": -12.06174373626709, "global_step": 397390, "epoch": 2365} {"train_loss": -11.994372367858887, "global_step": 397391, "epoch": 2365} {"train_loss": -12.414497375488281, "global_step": 397392, "epoch": 2365} {"train_loss": -12.166112899780273, "global_step": 397393, "epoch": 2365} {"train_loss": -12.37704086303711, "global_step": 397394, "epoch": 2365} {"train_loss": -12.152976036071777, "global_step": 397395, "epoch": 2365} {"train_loss": -12.053018569946289, "global_step": 397396, "epoch": 2365} {"train_loss": -12.094202041625977, "global_step": 397397, "epoch": 2365} {"train_loss": -12.058815002441406, "global_step": 397398, "epoch": 2365} {"train_loss": -12.354877471923828, "global_step": 397399, "epoch": 2365} {"train_loss": -12.266357421875, "global_step": 397400, "epoch": 2365} {"train_loss": -11.719396591186523, "global_step": 397401, "epoch": 2365} {"train_loss": -11.909967422485352, "global_step": 397402, "epoch": 2365} {"train_loss": -11.92125129699707, "global_step": 397403, "epoch": 2365} {"train_loss": -11.89361572265625, "global_step": 397404, "epoch": 2365} {"train_loss": -12.238032341003418, "global_step": 397405, "epoch": 2365} {"train_loss": -12.006958961486816, "global_step": 397406, "epoch": 2365} {"train_loss": -11.820491790771484, "global_step": 397407, "epoch": 2365} {"train_loss": -12.65439224243164, "global_step": 397408, "epoch": 2365} {"train_loss": -12.03078842163086, "global_step": 397409, "epoch": 2365} {"train_loss": -12.209596633911133, "global_step": 397410, "epoch": 2365} {"train_loss": -11.709365844726562, "global_step": 397411, "epoch": 2365} {"train_loss": -12.093186378479004, "global_step": 397412, "epoch": 2365} {"train_loss": -11.921092987060547, "global_step": 397413, "epoch": 2365} {"train_loss": -11.87113094329834, "global_step": 397414, "epoch": 2365} {"train_loss": -11.825584411621094, "global_step": 397415, "epoch": 2365} {"train_loss": -12.170636177062988, "global_step": 397416, "epoch": 2365} {"train_loss": -12.118728637695312, "global_step": 397417, "epoch": 2365} {"train_loss": -11.857444763183594, "global_step": 397418, "epoch": 2365} {"train_loss": -12.222846031188965, "global_step": 397419, "epoch": 2365} {"train_loss": -11.564264297485352, "global_step": 397420, "epoch": 2365} {"train_loss": -12.345993041992188, "global_step": 397421, "epoch": 2365} {"train_loss": -11.935165405273438, "global_step": 397422, "epoch": 2365} {"train_loss": -12.255754470825195, "global_step": 397423, "epoch": 2365} {"train_loss": -12.201870918273926, "global_step": 397424, "epoch": 2365} {"train_loss": -12.430156707763672, "global_step": 397425, "epoch": 2365} {"train_loss": -12.329991340637207, "global_step": 397426, "epoch": 2365} {"train_loss": -12.473655700683594, "global_step": 397427, "epoch": 2365} {"train_loss": -12.11927318572998, "global_step": 397428, "epoch": 2365} {"train_loss": -12.381790161132812, "global_step": 397429, "epoch": 2365} {"train_loss": -12.532672882080078, "global_step": 397430, "epoch": 2365} {"train_loss": -12.028212547302246, "global_step": 397431, "epoch": 2365} {"train_loss": -12.421939849853516, "global_step": 397432, "epoch": 2365} {"train_loss": -12.209006309509277, "global_step": 397433, "epoch": 2365} {"train_loss": -12.614835739135742, "global_step": 397434, "epoch": 2365} {"train_loss": -12.780128479003906, "global_step": 397435, "epoch": 2365} {"train_loss": -12.593786239624023, "global_step": 397436, "epoch": 2365} {"train_loss": -12.515536308288574, "global_step": 397437, "epoch": 2365} {"train_loss": -12.42343521118164, "global_step": 397438, "epoch": 2365} {"train_loss": -12.575462341308594, "global_step": 397439, "epoch": 2365} {"train_loss": -12.454370498657227, "global_step": 397440, "epoch": 2365} {"train_loss": -12.414628982543945, "global_step": 397441, "epoch": 2365} {"train_loss": -12.469182968139648, "global_step": 397442, "epoch": 2365} {"train_loss": -12.557857513427734, "global_step": 397443, "epoch": 2365} {"train_loss": -12.20293140411377, "global_step": 397444, "epoch": 2365} {"train_loss": -12.544241905212402, "global_step": 397445, "epoch": 2365} {"train_loss": -12.346412658691406, "global_step": 397446, "epoch": 2365} {"train_loss": -12.552434921264648, "global_step": 397447, "epoch": 2365} {"train_loss": -12.55126953125, "global_step": 397448, "epoch": 2365} {"train_loss": -12.58281135559082, "global_step": 397449, "epoch": 2365} {"train_loss": -12.46479606628418, "global_step": 397450, "epoch": 2365} {"train_loss": -12.636022567749023, "global_step": 397451, "epoch": 2365} {"train_loss": -12.509323120117188, "global_step": 397452, "epoch": 2365} {"train_loss": -12.70340347290039, "global_step": 397453, "epoch": 2365} {"train_loss": -11.884336471557617, "global_step": 397454, "epoch": 2365} {"train_loss": -12.385847091674805, "global_step": 397455, "epoch": 2365} {"train_loss": -12.315624237060547, "global_step": 397456, "epoch": 2365} {"train_loss": -10.644969940185547, "global_step": 397457, "epoch": 2365} {"train_loss": -11.384077072143555, "global_step": 397458, "epoch": 2365} {"train_loss": -12.444940567016602, "global_step": 397459, "epoch": 2365} {"train_loss": -11.634231567382812, "global_step": 397460, "epoch": 2365} {"train_loss": -11.569074630737305, "global_step": 397461, "epoch": 2365} {"train_loss": -12.533210754394531, "global_step": 397462, "epoch": 2365} {"train_loss": -12.053261756896973, "global_step": 397463, "epoch": 2365} {"train_loss": -12.20041275024414, "global_step": 397464, "epoch": 2365} {"train_loss": -12.132265090942383, "global_step": 397465, "epoch": 2365} {"train_loss": -11.956388473510742, "global_step": 397466, "epoch": 2365} {"train_loss": -11.688220977783203, "global_step": 397467, "epoch": 2365} {"train_loss": -11.980351448059082, "global_step": 397468, "epoch": 2365} {"train_loss": -10.533099174499512, "global_step": 397469, "epoch": 2365} {"train_loss": -12.102428436279297, "global_step": 397470, "epoch": 2365} {"train_loss": -11.373197555541992, "global_step": 397471, "epoch": 2365} {"train_loss": -11.13783073425293, "global_step": 397472, "epoch": 2365} {"train_loss": -11.461580276489258, "global_step": 397473, "epoch": 2365} {"train_loss": -11.298973083496094, "global_step": 397474, "epoch": 2365} {"train_loss": -11.36721420288086, "global_step": 397475, "epoch": 2365} {"train_loss": -10.147716522216797, "global_step": 397476, "epoch": 2365} {"train_loss": -11.784429550170898, "global_step": 397477, "epoch": 2365} {"train_loss": -10.260218620300293, "global_step": 397478, "epoch": 2365} {"train_loss": -9.885774612426758, "global_step": 397479, "epoch": 2365} {"train_loss": -12.282228469848633, "global_step": 397480, "epoch": 2365} {"train_loss": -10.180925369262695, "global_step": 397481, "epoch": 2365} {"train_loss": -11.805412292480469, "global_step": 397482, "epoch": 2365} {"train_loss": -10.660137176513672, "global_step": 397483, "epoch": 2365} {"train_loss": -11.014986038208008, "global_step": 397484, "epoch": 2365} {"train_loss": -11.853311538696289, "global_step": 397485, "epoch": 2365} {"train_loss": -11.076628684997559, "global_step": 397486, "epoch": 2365} {"train_loss": -11.90341187658764, "global_step": 397487, "epoch": 2365, "val_loss": 298457.28125, "train_action_mse_error": 0.42288631200790405} {"train_loss": -11.46932601928711, "global_step": 397488, "epoch": 2366} {"train_loss": -11.274847030639648, "global_step": 397489, "epoch": 2366} {"train_loss": -12.190811157226562, "global_step": 397490, "epoch": 2366} {"train_loss": -11.097476959228516, "global_step": 397491, "epoch": 2366} {"train_loss": -12.431978225708008, "global_step": 397492, "epoch": 2366} {"train_loss": -11.917455673217773, "global_step": 397493, "epoch": 2366} {"train_loss": -11.6787748336792, "global_step": 397494, "epoch": 2366} {"train_loss": -11.905409812927246, "global_step": 397495, "epoch": 2366} {"train_loss": -11.289474487304688, "global_step": 397496, "epoch": 2366} {"train_loss": -12.064037322998047, "global_step": 397497, "epoch": 2366} {"train_loss": -12.265122413635254, "global_step": 397498, "epoch": 2366} {"train_loss": -11.44059944152832, "global_step": 397499, "epoch": 2366} {"train_loss": -12.165199279785156, "global_step": 397500, "epoch": 2366} {"train_loss": -11.21781063079834, "global_step": 397501, "epoch": 2366} {"train_loss": -11.38550090789795, "global_step": 397502, "epoch": 2366} {"train_loss": -11.541552543640137, "global_step": 397503, "epoch": 2366} {"train_loss": -11.189859390258789, "global_step": 397504, "epoch": 2366} {"train_loss": -10.670992851257324, "global_step": 397505, "epoch": 2366} {"train_loss": -12.079547882080078, "global_step": 397506, "epoch": 2366} {"train_loss": -10.628689765930176, "global_step": 397507, "epoch": 2366} {"train_loss": -11.562460899353027, "global_step": 397508, "epoch": 2366} {"train_loss": -11.373215675354004, "global_step": 397509, "epoch": 2366} {"train_loss": -11.274748802185059, "global_step": 397510, "epoch": 2366} {"train_loss": -11.67816162109375, "global_step": 397511, "epoch": 2366} {"train_loss": -11.490799903869629, "global_step": 397512, "epoch": 2366} {"train_loss": -11.910146713256836, "global_step": 397513, "epoch": 2366} {"train_loss": -11.963064193725586, "global_step": 397514, "epoch": 2366} {"train_loss": -12.024287223815918, "global_step": 397515, "epoch": 2366} {"train_loss": -11.901498794555664, "global_step": 397516, "epoch": 2366} {"train_loss": -11.99296760559082, "global_step": 397517, "epoch": 2366} {"train_loss": -11.561136245727539, "global_step": 397518, "epoch": 2366} {"train_loss": -12.086833953857422, "global_step": 397519, "epoch": 2366} {"train_loss": -11.996687889099121, "global_step": 397520, "epoch": 2366} {"train_loss": -12.243526458740234, "global_step": 397521, "epoch": 2366} {"train_loss": -12.157238960266113, "global_step": 397522, "epoch": 2366} {"train_loss": -11.359442710876465, "global_step": 397523, "epoch": 2366} {"train_loss": -12.036280632019043, "global_step": 397524, "epoch": 2366} {"train_loss": -10.984928131103516, "global_step": 397525, "epoch": 2366} {"train_loss": -12.065544128417969, "global_step": 397526, "epoch": 2366} {"train_loss": -11.753815650939941, "global_step": 397527, "epoch": 2366} {"train_loss": -11.783514022827148, "global_step": 397528, "epoch": 2366} {"train_loss": -11.783945083618164, "global_step": 397529, "epoch": 2366} {"train_loss": -11.590046882629395, "global_step": 397530, "epoch": 2366} {"train_loss": -11.801522254943848, "global_step": 397531, "epoch": 2366} {"train_loss": -12.017786026000977, "global_step": 397532, "epoch": 2366} {"train_loss": -12.028275489807129, "global_step": 397533, "epoch": 2366} {"train_loss": -12.182653427124023, "global_step": 397534, "epoch": 2366} {"train_loss": -12.275004386901855, "global_step": 397535, "epoch": 2366} {"train_loss": -12.116643905639648, "global_step": 397536, "epoch": 2366} {"train_loss": -12.260866165161133, "global_step": 397537, "epoch": 2366} {"train_loss": -11.844734191894531, "global_step": 397538, "epoch": 2366} {"train_loss": -12.13476848602295, "global_step": 397539, "epoch": 2366} {"train_loss": -11.950746536254883, "global_step": 397540, "epoch": 2366} {"train_loss": -12.097628593444824, "global_step": 397541, "epoch": 2366} {"train_loss": -12.032279968261719, "global_step": 397542, "epoch": 2366} {"train_loss": -12.23458480834961, "global_step": 397543, "epoch": 2366} {"train_loss": -11.865028381347656, "global_step": 397544, "epoch": 2366} {"train_loss": -11.800464630126953, "global_step": 397545, "epoch": 2366} {"train_loss": -12.230335235595703, "global_step": 397546, "epoch": 2366} {"train_loss": -11.877429962158203, "global_step": 397547, "epoch": 2366} {"train_loss": -12.32478141784668, "global_step": 397548, "epoch": 2366} {"train_loss": -12.02505111694336, "global_step": 397549, "epoch": 2366} {"train_loss": -12.382490158081055, "global_step": 397550, "epoch": 2366} {"train_loss": -11.974380493164062, "global_step": 397551, "epoch": 2366} {"train_loss": -12.308745384216309, "global_step": 397552, "epoch": 2366} {"train_loss": -11.97581672668457, "global_step": 397553, "epoch": 2366} {"train_loss": -12.297842025756836, "global_step": 397554, "epoch": 2366} {"train_loss": -12.098867416381836, "global_step": 397555, "epoch": 2366} {"train_loss": -12.31633186340332, "global_step": 397556, "epoch": 2366} {"train_loss": -12.161128044128418, "global_step": 397557, "epoch": 2366} {"train_loss": -12.377778053283691, "global_step": 397558, "epoch": 2366} {"train_loss": -12.240030288696289, "global_step": 397559, "epoch": 2366} {"train_loss": -12.557437896728516, "global_step": 397560, "epoch": 2366} {"train_loss": -12.54908561706543, "global_step": 397561, "epoch": 2366} {"train_loss": -12.665851593017578, "global_step": 397562, "epoch": 2366} {"train_loss": -12.485137939453125, "global_step": 397563, "epoch": 2366} {"train_loss": -12.415568351745605, "global_step": 397564, "epoch": 2366} {"train_loss": -12.497716903686523, "global_step": 397565, "epoch": 2366} {"train_loss": -12.573801040649414, "global_step": 397566, "epoch": 2366} {"train_loss": -12.621272087097168, "global_step": 397567, "epoch": 2366} {"train_loss": -12.270004272460938, "global_step": 397568, "epoch": 2366} {"train_loss": -12.550920486450195, "global_step": 397569, "epoch": 2366} {"train_loss": -12.38926887512207, "global_step": 397570, "epoch": 2366} {"train_loss": -12.605043411254883, "global_step": 397571, "epoch": 2366} {"train_loss": -12.41469955444336, "global_step": 397572, "epoch": 2366} {"train_loss": -12.578636169433594, "global_step": 397573, "epoch": 2366} {"train_loss": -12.54007339477539, "global_step": 397574, "epoch": 2366} {"train_loss": -12.432315826416016, "global_step": 397575, "epoch": 2366} {"train_loss": -12.660358428955078, "global_step": 397576, "epoch": 2366} {"train_loss": -12.18470573425293, "global_step": 397577, "epoch": 2366} {"train_loss": -12.683893203735352, "global_step": 397578, "epoch": 2366} {"train_loss": -12.606493949890137, "global_step": 397579, "epoch": 2366} {"train_loss": -12.31222915649414, "global_step": 397580, "epoch": 2366} {"train_loss": -12.3074312210083, "global_step": 397581, "epoch": 2366} {"train_loss": -12.538164138793945, "global_step": 397582, "epoch": 2366} {"train_loss": -12.10987663269043, "global_step": 397583, "epoch": 2366} {"train_loss": -12.559135437011719, "global_step": 397584, "epoch": 2366} {"train_loss": -12.11518383026123, "global_step": 397585, "epoch": 2366} {"train_loss": -12.209966659545898, "global_step": 397586, "epoch": 2366} {"train_loss": -12.51591682434082, "global_step": 397587, "epoch": 2366} {"train_loss": -11.17306900024414, "global_step": 397588, "epoch": 2366} {"train_loss": -11.31737995147705, "global_step": 397589, "epoch": 2366} {"train_loss": -12.202834129333496, "global_step": 397590, "epoch": 2366} {"train_loss": -11.934259414672852, "global_step": 397591, "epoch": 2366} {"train_loss": -11.959567070007324, "global_step": 397592, "epoch": 2366} {"train_loss": -11.960160255432129, "global_step": 397593, "epoch": 2366} {"train_loss": -11.65726375579834, "global_step": 397594, "epoch": 2366} {"train_loss": -11.522308349609375, "global_step": 397595, "epoch": 2366} {"train_loss": -11.52353286743164, "global_step": 397596, "epoch": 2366} {"train_loss": -10.675617218017578, "global_step": 397597, "epoch": 2366} {"train_loss": -12.416508674621582, "global_step": 397598, "epoch": 2366} {"train_loss": -11.649843215942383, "global_step": 397599, "epoch": 2366} {"train_loss": -11.135637283325195, "global_step": 397600, "epoch": 2366} {"train_loss": -12.396156311035156, "global_step": 397601, "epoch": 2366} {"train_loss": -10.527473449707031, "global_step": 397602, "epoch": 2366} {"train_loss": -11.024782180786133, "global_step": 397603, "epoch": 2366} {"train_loss": -12.221109390258789, "global_step": 397604, "epoch": 2366} {"train_loss": -10.61884880065918, "global_step": 397605, "epoch": 2366} {"train_loss": -11.58665657043457, "global_step": 397606, "epoch": 2366} {"train_loss": -10.883235931396484, "global_step": 397607, "epoch": 2366} {"train_loss": -10.953886985778809, "global_step": 397608, "epoch": 2366} {"train_loss": -11.658031463623047, "global_step": 397609, "epoch": 2366} {"train_loss": -11.028762817382812, "global_step": 397610, "epoch": 2366} {"train_loss": -11.777242660522461, "global_step": 397611, "epoch": 2366} {"train_loss": -10.698127746582031, "global_step": 397612, "epoch": 2366} {"train_loss": -11.596677780151367, "global_step": 397613, "epoch": 2366} {"train_loss": -10.856630325317383, "global_step": 397614, "epoch": 2366} {"train_loss": -11.432082176208496, "global_step": 397615, "epoch": 2366} {"train_loss": -11.586711883544922, "global_step": 397616, "epoch": 2366} {"train_loss": -11.593883514404297, "global_step": 397617, "epoch": 2366} {"train_loss": -11.42324161529541, "global_step": 397618, "epoch": 2366} {"train_loss": -12.275510787963867, "global_step": 397619, "epoch": 2366} {"train_loss": -11.474491119384766, "global_step": 397620, "epoch": 2366} {"train_loss": -11.834769248962402, "global_step": 397621, "epoch": 2366} {"train_loss": -12.06665325164795, "global_step": 397622, "epoch": 2366} {"train_loss": -11.957387924194336, "global_step": 397623, "epoch": 2366} {"train_loss": -12.154321670532227, "global_step": 397624, "epoch": 2366} {"train_loss": -11.762869834899902, "global_step": 397625, "epoch": 2366} {"train_loss": -11.981376647949219, "global_step": 397626, "epoch": 2366} {"train_loss": -12.043498992919922, "global_step": 397627, "epoch": 2366} {"train_loss": -12.273933410644531, "global_step": 397628, "epoch": 2366} {"train_loss": -11.782306671142578, "global_step": 397629, "epoch": 2366} {"train_loss": -12.24972915649414, "global_step": 397630, "epoch": 2366} {"train_loss": -11.91022777557373, "global_step": 397631, "epoch": 2366} {"train_loss": -12.187200546264648, "global_step": 397632, "epoch": 2366} {"train_loss": -12.116409301757812, "global_step": 397633, "epoch": 2366} {"train_loss": -12.237832069396973, "global_step": 397634, "epoch": 2366} {"train_loss": -12.28436279296875, "global_step": 397635, "epoch": 2366} {"train_loss": -12.03681468963623, "global_step": 397636, "epoch": 2366} {"train_loss": -12.049633026123047, "global_step": 397637, "epoch": 2366} {"train_loss": -11.95482063293457, "global_step": 397638, "epoch": 2366} {"train_loss": -11.869878768920898, "global_step": 397639, "epoch": 2366} {"train_loss": -12.147242546081543, "global_step": 397640, "epoch": 2366} {"train_loss": -12.243644714355469, "global_step": 397641, "epoch": 2366} {"train_loss": -12.206809997558594, "global_step": 397642, "epoch": 2366} {"train_loss": -12.313238143920898, "global_step": 397643, "epoch": 2366} {"train_loss": -12.351690292358398, "global_step": 397644, "epoch": 2366} {"train_loss": -12.358223915100098, "global_step": 397645, "epoch": 2366} {"train_loss": -12.521774291992188, "global_step": 397646, "epoch": 2366} {"train_loss": -12.372058868408203, "global_step": 397647, "epoch": 2366} {"train_loss": -12.152435302734375, "global_step": 397648, "epoch": 2366} {"train_loss": -12.38017463684082, "global_step": 397649, "epoch": 2366} {"train_loss": -12.28869915008545, "global_step": 397650, "epoch": 2366} {"train_loss": -12.052169799804688, "global_step": 397651, "epoch": 2366} {"train_loss": -11.962667465209961, "global_step": 397652, "epoch": 2366} {"train_loss": -11.699329376220703, "global_step": 397653, "epoch": 2366} {"train_loss": -11.835596084594727, "global_step": 397654, "epoch": 2366} {"train_loss": -11.935693014235724, "global_step": 397655, "epoch": 2366, "val_loss": 296572.65625} {"train_loss": -12.061833381652832, "global_step": 397656, "epoch": 2367} {"train_loss": -11.950919151306152, "global_step": 397657, "epoch": 2367} {"train_loss": -12.370908737182617, "global_step": 397658, "epoch": 2367} {"train_loss": -11.52301025390625, "global_step": 397659, "epoch": 2367} {"train_loss": -11.831798553466797, "global_step": 397660, "epoch": 2367} {"train_loss": -12.260398864746094, "global_step": 397661, "epoch": 2367} {"train_loss": -11.82526969909668, "global_step": 397662, "epoch": 2367} {"train_loss": -12.152732849121094, "global_step": 397663, "epoch": 2367} {"train_loss": -12.245388984680176, "global_step": 397664, "epoch": 2367} {"train_loss": -12.465572357177734, "global_step": 397665, "epoch": 2367} {"train_loss": -12.548023223876953, "global_step": 397666, "epoch": 2367} {"train_loss": -12.20792007446289, "global_step": 397667, "epoch": 2367} {"train_loss": -12.394564628601074, "global_step": 397668, "epoch": 2367} {"train_loss": -12.270587921142578, "global_step": 397669, "epoch": 2367} {"train_loss": -12.455221176147461, "global_step": 397670, "epoch": 2367} {"train_loss": -12.51982307434082, "global_step": 397671, "epoch": 2367} {"train_loss": -12.398856163024902, "global_step": 397672, "epoch": 2367} {"train_loss": -12.498724937438965, "global_step": 397673, "epoch": 2367} {"train_loss": -12.179268836975098, "global_step": 397674, "epoch": 2367} {"train_loss": -12.459003448486328, "global_step": 397675, "epoch": 2367} {"train_loss": -12.02228832244873, "global_step": 397676, "epoch": 2367} {"train_loss": -12.274636268615723, "global_step": 397677, "epoch": 2367} {"train_loss": -12.363736152648926, "global_step": 397678, "epoch": 2367} {"train_loss": -12.281906127929688, "global_step": 397679, "epoch": 2367} {"train_loss": -12.26128101348877, "global_step": 397680, "epoch": 2367} {"train_loss": -12.284872055053711, "global_step": 397681, "epoch": 2367} {"train_loss": -12.124582290649414, "global_step": 397682, "epoch": 2367} {"train_loss": -12.657269477844238, "global_step": 397683, "epoch": 2367} {"train_loss": -12.371776580810547, "global_step": 397684, "epoch": 2367} {"train_loss": -12.391987800598145, "global_step": 397685, "epoch": 2367} {"train_loss": -12.257930755615234, "global_step": 397686, "epoch": 2367} {"train_loss": -11.87423324584961, "global_step": 397687, "epoch": 2367} {"train_loss": -12.371607780456543, "global_step": 397688, "epoch": 2367} {"train_loss": -11.742267608642578, "global_step": 397689, "epoch": 2367} {"train_loss": -11.102466583251953, "global_step": 397690, "epoch": 2367} {"train_loss": -12.720712661743164, "global_step": 397691, "epoch": 2367} {"train_loss": -11.226177215576172, "global_step": 397692, "epoch": 2367} {"train_loss": -12.036124229431152, "global_step": 397693, "epoch": 2367} {"train_loss": -10.712675094604492, "global_step": 397694, "epoch": 2367} {"train_loss": -11.356600761413574, "global_step": 397695, "epoch": 2367} {"train_loss": -11.7886962890625, "global_step": 397696, "epoch": 2367} {"train_loss": -9.613046646118164, "global_step": 397697, "epoch": 2367} {"train_loss": -10.572919845581055, "global_step": 397698, "epoch": 2367} {"train_loss": -10.489602088928223, "global_step": 397699, "epoch": 2367} {"train_loss": -11.43011474609375, "global_step": 397700, "epoch": 2367} {"train_loss": -9.415632247924805, "global_step": 397701, "epoch": 2367} {"train_loss": -10.55311393737793, "global_step": 397702, "epoch": 2367} {"train_loss": -10.14854621887207, "global_step": 397703, "epoch": 2367} {"train_loss": -11.648868560791016, "global_step": 397704, "epoch": 2367} {"train_loss": -10.209901809692383, "global_step": 397705, "epoch": 2367} {"train_loss": -11.053325653076172, "global_step": 397706, "epoch": 2367} {"train_loss": -11.434818267822266, "global_step": 397707, "epoch": 2367} {"train_loss": -10.582550048828125, "global_step": 397708, "epoch": 2367} {"train_loss": -11.628686904907227, "global_step": 397709, "epoch": 2367} {"train_loss": -11.191651344299316, "global_step": 397710, "epoch": 2367} {"train_loss": -11.403543472290039, "global_step": 397711, "epoch": 2367} {"train_loss": -11.783879280090332, "global_step": 397712, "epoch": 2367} {"train_loss": -11.700427055358887, "global_step": 397713, "epoch": 2367} {"train_loss": -11.552122116088867, "global_step": 397714, "epoch": 2367} {"train_loss": -11.691511154174805, "global_step": 397715, "epoch": 2367} {"train_loss": -11.879169464111328, "global_step": 397716, "epoch": 2367} {"train_loss": -11.783843040466309, "global_step": 397717, "epoch": 2367} {"train_loss": -11.877150535583496, "global_step": 397718, "epoch": 2367} {"train_loss": -11.572086334228516, "global_step": 397719, "epoch": 2367} {"train_loss": -11.37177562713623, "global_step": 397720, "epoch": 2367} {"train_loss": -11.328889846801758, "global_step": 397721, "epoch": 2367} {"train_loss": -11.141138076782227, "global_step": 397722, "epoch": 2367} {"train_loss": -10.895730972290039, "global_step": 397723, "epoch": 2367} {"train_loss": -11.700733184814453, "global_step": 397724, "epoch": 2367} {"train_loss": -11.297589302062988, "global_step": 397725, "epoch": 2367} {"train_loss": -11.931748390197754, "global_step": 397726, "epoch": 2367} {"train_loss": -11.652839660644531, "global_step": 397727, "epoch": 2367} {"train_loss": -11.536928176879883, "global_step": 397728, "epoch": 2367} {"train_loss": -11.95668888092041, "global_step": 397729, "epoch": 2367} {"train_loss": -12.06060791015625, "global_step": 397730, "epoch": 2367} {"train_loss": -11.551386833190918, "global_step": 397731, "epoch": 2367} {"train_loss": -11.932378768920898, "global_step": 397732, "epoch": 2367} {"train_loss": -11.54745101928711, "global_step": 397733, "epoch": 2367} {"train_loss": -12.185136795043945, "global_step": 397734, "epoch": 2367} {"train_loss": -11.374698638916016, "global_step": 397735, "epoch": 2367} {"train_loss": -12.158952713012695, "global_step": 397736, "epoch": 2367} {"train_loss": -11.836759567260742, "global_step": 397737, "epoch": 2367} {"train_loss": -11.954628944396973, "global_step": 397738, "epoch": 2367} {"train_loss": -12.06808090209961, "global_step": 397739, "epoch": 2367} {"train_loss": -11.970829010009766, "global_step": 397740, "epoch": 2367} {"train_loss": -11.717761993408203, "global_step": 397741, "epoch": 2367} {"train_loss": -12.096172332763672, "global_step": 397742, "epoch": 2367} {"train_loss": -11.687555313110352, "global_step": 397743, "epoch": 2367} {"train_loss": -12.003533363342285, "global_step": 397744, "epoch": 2367} {"train_loss": -11.745354652404785, "global_step": 397745, "epoch": 2367} {"train_loss": -12.368972778320312, "global_step": 397746, "epoch": 2367} {"train_loss": -11.983070373535156, "global_step": 397747, "epoch": 2367} {"train_loss": -12.33541488647461, "global_step": 397748, "epoch": 2367} {"train_loss": -12.275959968566895, "global_step": 397749, "epoch": 2367} {"train_loss": -12.1435546875, "global_step": 397750, "epoch": 2367} {"train_loss": -12.207210540771484, "global_step": 397751, "epoch": 2367} {"train_loss": -12.082807540893555, "global_step": 397752, "epoch": 2367} {"train_loss": -12.20806884765625, "global_step": 397753, "epoch": 2367} {"train_loss": -12.282264709472656, "global_step": 397754, "epoch": 2367} {"train_loss": -11.975173950195312, "global_step": 397755, "epoch": 2367} {"train_loss": -12.28929328918457, "global_step": 397756, "epoch": 2367} {"train_loss": -11.637039184570312, "global_step": 397757, "epoch": 2367} {"train_loss": -12.310809135437012, "global_step": 397758, "epoch": 2367} {"train_loss": -11.884323120117188, "global_step": 397759, "epoch": 2367} {"train_loss": -12.079109191894531, "global_step": 397760, "epoch": 2367} {"train_loss": -12.322053909301758, "global_step": 397761, "epoch": 2367} {"train_loss": -12.207027435302734, "global_step": 397762, "epoch": 2367} {"train_loss": -12.30243968963623, "global_step": 397763, "epoch": 2367} {"train_loss": -12.174190521240234, "global_step": 397764, "epoch": 2367} {"train_loss": -12.333486557006836, "global_step": 397765, "epoch": 2367} {"train_loss": -12.453683853149414, "global_step": 397766, "epoch": 2367} {"train_loss": -12.010109901428223, "global_step": 397767, "epoch": 2367} {"train_loss": -12.523293495178223, "global_step": 397768, "epoch": 2367} {"train_loss": -11.773530006408691, "global_step": 397769, "epoch": 2367} {"train_loss": -12.397283554077148, "global_step": 397770, "epoch": 2367} {"train_loss": -12.062495231628418, "global_step": 397771, "epoch": 2367} {"train_loss": -12.13651180267334, "global_step": 397772, "epoch": 2367} {"train_loss": -12.309711456298828, "global_step": 397773, "epoch": 2367} {"train_loss": -12.224095344543457, "global_step": 397774, "epoch": 2367} {"train_loss": -12.401981353759766, "global_step": 397775, "epoch": 2367} {"train_loss": -12.436419486999512, "global_step": 397776, "epoch": 2367} {"train_loss": -12.362454414367676, "global_step": 397777, "epoch": 2367} {"train_loss": -12.383200645446777, "global_step": 397778, "epoch": 2367} {"train_loss": -12.634931564331055, "global_step": 397779, "epoch": 2367} {"train_loss": -12.156489372253418, "global_step": 397780, "epoch": 2367} {"train_loss": -12.322702407836914, "global_step": 397781, "epoch": 2367} {"train_loss": -12.646953582763672, "global_step": 397782, "epoch": 2367} {"train_loss": -12.094725608825684, "global_step": 397783, "epoch": 2367} {"train_loss": -12.122638702392578, "global_step": 397784, "epoch": 2367} {"train_loss": -12.374049186706543, "global_step": 397785, "epoch": 2367} {"train_loss": -12.202215194702148, "global_step": 397786, "epoch": 2367} {"train_loss": -12.552831649780273, "global_step": 397787, "epoch": 2367} {"train_loss": -12.1815185546875, "global_step": 397788, "epoch": 2367} {"train_loss": -12.488645553588867, "global_step": 397789, "epoch": 2367} {"train_loss": -12.38819408416748, "global_step": 397790, "epoch": 2367} {"train_loss": -12.273418426513672, "global_step": 397791, "epoch": 2367} {"train_loss": -12.274239540100098, "global_step": 397792, "epoch": 2367} {"train_loss": -12.553790092468262, "global_step": 397793, "epoch": 2367} {"train_loss": -11.978311538696289, "global_step": 397794, "epoch": 2367} {"train_loss": -12.567166328430176, "global_step": 397795, "epoch": 2367} {"train_loss": -12.408382415771484, "global_step": 397796, "epoch": 2367} {"train_loss": -12.695466995239258, "global_step": 397797, "epoch": 2367} {"train_loss": -12.398893356323242, "global_step": 397798, "epoch": 2367} {"train_loss": -12.4529447555542, "global_step": 397799, "epoch": 2367} {"train_loss": -12.637893676757812, "global_step": 397800, "epoch": 2367} {"train_loss": -12.568523406982422, "global_step": 397801, "epoch": 2367} {"train_loss": -12.390459060668945, "global_step": 397802, "epoch": 2367} {"train_loss": -12.399381637573242, "global_step": 397803, "epoch": 2367} {"train_loss": -12.320357322692871, "global_step": 397804, "epoch": 2367} {"train_loss": -12.381756782531738, "global_step": 397805, "epoch": 2367} {"train_loss": -12.600448608398438, "global_step": 397806, "epoch": 2367} {"train_loss": -12.708375930786133, "global_step": 397807, "epoch": 2367} {"train_loss": -12.336830139160156, "global_step": 397808, "epoch": 2367} {"train_loss": -12.247830390930176, "global_step": 397809, "epoch": 2367} {"train_loss": -12.21360969543457, "global_step": 397810, "epoch": 2367} {"train_loss": -12.38289737701416, "global_step": 397811, "epoch": 2367} {"train_loss": -12.558670043945312, "global_step": 397812, "epoch": 2367} {"train_loss": -12.251016616821289, "global_step": 397813, "epoch": 2367} {"train_loss": -12.678677558898926, "global_step": 397814, "epoch": 2367} {"train_loss": -12.360784530639648, "global_step": 397815, "epoch": 2367} {"train_loss": -12.456297874450684, "global_step": 397816, "epoch": 2367} {"train_loss": -12.627899169921875, "global_step": 397817, "epoch": 2367} {"train_loss": -12.480095863342285, "global_step": 397818, "epoch": 2367} {"train_loss": -12.210517883300781, "global_step": 397819, "epoch": 2367} {"train_loss": -12.429133415222168, "global_step": 397820, "epoch": 2367} {"train_loss": -12.567968368530273, "global_step": 397821, "epoch": 2367} {"train_loss": -12.606603622436523, "global_step": 397822, "epoch": 2367} {"train_loss": -12.016340976669674, "global_step": 397823, "epoch": 2367, "val_loss": 295280.46875} {"train_loss": -12.034640312194824, "global_step": 397824, "epoch": 2368} {"train_loss": -12.565023422241211, "global_step": 397825, "epoch": 2368} {"train_loss": -12.675484657287598, "global_step": 397826, "epoch": 2368} {"train_loss": -12.489938735961914, "global_step": 397827, "epoch": 2368} {"train_loss": -12.295646667480469, "global_step": 397828, "epoch": 2368} {"train_loss": -12.6363525390625, "global_step": 397829, "epoch": 2368} {"train_loss": -12.112701416015625, "global_step": 397830, "epoch": 2368} {"train_loss": -12.473881721496582, "global_step": 397831, "epoch": 2368} {"train_loss": -12.755931854248047, "global_step": 397832, "epoch": 2368} {"train_loss": -12.289819717407227, "global_step": 397833, "epoch": 2368} {"train_loss": -12.458146095275879, "global_step": 397834, "epoch": 2368} {"train_loss": -12.575239181518555, "global_step": 397835, "epoch": 2368} {"train_loss": -12.66026782989502, "global_step": 397836, "epoch": 2368} {"train_loss": -12.405654907226562, "global_step": 397837, "epoch": 2368} {"train_loss": -12.439668655395508, "global_step": 397838, "epoch": 2368} {"train_loss": -12.59414291381836, "global_step": 397839, "epoch": 2368} {"train_loss": -12.779778480529785, "global_step": 397840, "epoch": 2368} {"train_loss": -12.478218078613281, "global_step": 397841, "epoch": 2368} {"train_loss": -12.65544319152832, "global_step": 397842, "epoch": 2368} {"train_loss": -12.558961868286133, "global_step": 397843, "epoch": 2368} {"train_loss": -12.151632308959961, "global_step": 397844, "epoch": 2368} {"train_loss": -12.439349174499512, "global_step": 397845, "epoch": 2368} {"train_loss": -12.295464515686035, "global_step": 397846, "epoch": 2368} {"train_loss": -12.588245391845703, "global_step": 397847, "epoch": 2368} {"train_loss": -12.305830001831055, "global_step": 397848, "epoch": 2368} {"train_loss": -12.634206771850586, "global_step": 397849, "epoch": 2368} {"train_loss": -12.616255760192871, "global_step": 397850, "epoch": 2368} {"train_loss": -12.451122283935547, "global_step": 397851, "epoch": 2368} {"train_loss": -12.623010635375977, "global_step": 397852, "epoch": 2368} {"train_loss": -12.555802345275879, "global_step": 397853, "epoch": 2368} {"train_loss": -12.049236297607422, "global_step": 397854, "epoch": 2368} {"train_loss": -11.925687789916992, "global_step": 397855, "epoch": 2368} {"train_loss": -11.584946632385254, "global_step": 397856, "epoch": 2368} {"train_loss": -9.575252532958984, "global_step": 397857, "epoch": 2368} {"train_loss": -8.824968338012695, "global_step": 397858, "epoch": 2368} {"train_loss": -11.665910720825195, "global_step": 397859, "epoch": 2368} {"train_loss": -10.547257423400879, "global_step": 397860, "epoch": 2368} {"train_loss": -10.793228149414062, "global_step": 397861, "epoch": 2368} {"train_loss": -10.034457206726074, "global_step": 397862, "epoch": 2368} {"train_loss": -10.930852890014648, "global_step": 397863, "epoch": 2368} {"train_loss": -9.407112121582031, "global_step": 397864, "epoch": 2368} {"train_loss": -10.004817962646484, "global_step": 397865, "epoch": 2368} {"train_loss": -10.165567398071289, "global_step": 397866, "epoch": 2368} {"train_loss": -9.498584747314453, "global_step": 397867, "epoch": 2368} {"train_loss": -10.319175720214844, "global_step": 397868, "epoch": 2368} {"train_loss": -8.225807189941406, "global_step": 397869, "epoch": 2368} {"train_loss": -9.604486465454102, "global_step": 397870, "epoch": 2368} {"train_loss": -9.68121337890625, "global_step": 397871, "epoch": 2368} {"train_loss": -8.590141296386719, "global_step": 397872, "epoch": 2368} {"train_loss": -7.921880722045898, "global_step": 397873, "epoch": 2368} {"train_loss": -8.92853832244873, "global_step": 397874, "epoch": 2368} {"train_loss": -8.760381698608398, "global_step": 397875, "epoch": 2368} {"train_loss": -8.878751754760742, "global_step": 397876, "epoch": 2368} {"train_loss": -8.571798324584961, "global_step": 397877, "epoch": 2368} {"train_loss": -8.739013671875, "global_step": 397878, "epoch": 2368} {"train_loss": -9.971963882446289, "global_step": 397879, "epoch": 2368} {"train_loss": -10.31558895111084, "global_step": 397880, "epoch": 2368} {"train_loss": -10.76464557647705, "global_step": 397881, "epoch": 2368} {"train_loss": -11.008806228637695, "global_step": 397882, "epoch": 2368} {"train_loss": -10.284423828125, "global_step": 397883, "epoch": 2368} {"train_loss": -10.151910781860352, "global_step": 397884, "epoch": 2368} {"train_loss": -10.172612190246582, "global_step": 397885, "epoch": 2368} {"train_loss": -10.862430572509766, "global_step": 397886, "epoch": 2368} {"train_loss": -10.777580261230469, "global_step": 397887, "epoch": 2368} {"train_loss": -11.114943504333496, "global_step": 397888, "epoch": 2368} {"train_loss": -11.439798355102539, "global_step": 397889, "epoch": 2368} {"train_loss": -11.313982009887695, "global_step": 397890, "epoch": 2368} {"train_loss": -10.969522476196289, "global_step": 397891, "epoch": 2368} {"train_loss": -11.158282279968262, "global_step": 397892, "epoch": 2368} {"train_loss": -11.118459701538086, "global_step": 397893, "epoch": 2368} {"train_loss": -11.155116081237793, "global_step": 397894, "epoch": 2368} {"train_loss": -11.211877822875977, "global_step": 397895, "epoch": 2368} {"train_loss": -11.102529525756836, "global_step": 397896, "epoch": 2368} {"train_loss": -11.536459922790527, "global_step": 397897, "epoch": 2368} {"train_loss": -11.243642807006836, "global_step": 397898, "epoch": 2368} {"train_loss": -11.240736961364746, "global_step": 397899, "epoch": 2368} {"train_loss": -11.877605438232422, "global_step": 397900, "epoch": 2368} {"train_loss": -11.347367286682129, "global_step": 397901, "epoch": 2368} {"train_loss": -11.438328742980957, "global_step": 397902, "epoch": 2368} {"train_loss": -11.180099487304688, "global_step": 397903, "epoch": 2368} {"train_loss": -11.76119613647461, "global_step": 397904, "epoch": 2368} {"train_loss": -11.733305931091309, "global_step": 397905, "epoch": 2368} {"train_loss": -12.165373802185059, "global_step": 397906, "epoch": 2368} {"train_loss": -11.865989685058594, "global_step": 397907, "epoch": 2368} {"train_loss": -11.78664779663086, "global_step": 397908, "epoch": 2368} {"train_loss": -12.12968635559082, "global_step": 397909, "epoch": 2368} {"train_loss": -11.910723686218262, "global_step": 397910, "epoch": 2368} {"train_loss": -11.78958511352539, "global_step": 397911, "epoch": 2368} {"train_loss": -12.184492111206055, "global_step": 397912, "epoch": 2368} {"train_loss": -12.026545524597168, "global_step": 397913, "epoch": 2368} {"train_loss": -12.122035026550293, "global_step": 397914, "epoch": 2368} {"train_loss": -12.194901466369629, "global_step": 397915, "epoch": 2368} {"train_loss": -12.388839721679688, "global_step": 397916, "epoch": 2368} {"train_loss": -11.776130676269531, "global_step": 397917, "epoch": 2368} {"train_loss": -12.525879859924316, "global_step": 397918, "epoch": 2368} {"train_loss": -12.193049430847168, "global_step": 397919, "epoch": 2368} {"train_loss": -12.443517684936523, "global_step": 397920, "epoch": 2368} {"train_loss": -12.271706581115723, "global_step": 397921, "epoch": 2368} {"train_loss": -12.243316650390625, "global_step": 397922, "epoch": 2368} {"train_loss": -12.12054443359375, "global_step": 397923, "epoch": 2368} {"train_loss": -12.149709701538086, "global_step": 397924, "epoch": 2368} {"train_loss": -12.464786529541016, "global_step": 397925, "epoch": 2368} {"train_loss": -12.126628875732422, "global_step": 397926, "epoch": 2368} {"train_loss": -12.37773323059082, "global_step": 397927, "epoch": 2368} {"train_loss": -12.41124153137207, "global_step": 397928, "epoch": 2368} {"train_loss": -12.298656463623047, "global_step": 397929, "epoch": 2368} {"train_loss": -12.34347152709961, "global_step": 397930, "epoch": 2368} {"train_loss": -12.266270637512207, "global_step": 397931, "epoch": 2368} {"train_loss": -12.299248695373535, "global_step": 397932, "epoch": 2368} {"train_loss": -12.337140083312988, "global_step": 397933, "epoch": 2368} {"train_loss": -12.392766952514648, "global_step": 397934, "epoch": 2368} {"train_loss": -12.396236419677734, "global_step": 397935, "epoch": 2368} {"train_loss": -12.37367057800293, "global_step": 397936, "epoch": 2368} {"train_loss": -12.164804458618164, "global_step": 397937, "epoch": 2368} {"train_loss": -12.422480583190918, "global_step": 397938, "epoch": 2368} {"train_loss": -11.994302749633789, "global_step": 397939, "epoch": 2368} {"train_loss": -12.501216888427734, "global_step": 397940, "epoch": 2368} {"train_loss": -12.067787170410156, "global_step": 397941, "epoch": 2368} {"train_loss": -12.152633666992188, "global_step": 397942, "epoch": 2368} {"train_loss": -12.330005645751953, "global_step": 397943, "epoch": 2368} {"train_loss": -12.117086410522461, "global_step": 397944, "epoch": 2368} {"train_loss": -12.172557830810547, "global_step": 397945, "epoch": 2368} {"train_loss": -12.297664642333984, "global_step": 397946, "epoch": 2368} {"train_loss": -12.315232276916504, "global_step": 397947, "epoch": 2368} {"train_loss": -11.894401550292969, "global_step": 397948, "epoch": 2368} {"train_loss": -12.47693920135498, "global_step": 397949, "epoch": 2368} {"train_loss": -11.783130645751953, "global_step": 397950, "epoch": 2368} {"train_loss": -12.130507469177246, "global_step": 397951, "epoch": 2368} {"train_loss": -12.470343589782715, "global_step": 397952, "epoch": 2368} {"train_loss": -12.35368537902832, "global_step": 397953, "epoch": 2368} {"train_loss": -12.248876571655273, "global_step": 397954, "epoch": 2368} {"train_loss": -12.354229927062988, "global_step": 397955, "epoch": 2368} {"train_loss": -12.203470230102539, "global_step": 397956, "epoch": 2368} {"train_loss": -12.595993995666504, "global_step": 397957, "epoch": 2368} {"train_loss": -12.371282577514648, "global_step": 397958, "epoch": 2368} {"train_loss": -12.087218284606934, "global_step": 397959, "epoch": 2368} {"train_loss": -12.311169624328613, "global_step": 397960, "epoch": 2368} {"train_loss": -11.374160766601562, "global_step": 397961, "epoch": 2368} {"train_loss": -11.393614768981934, "global_step": 397962, "epoch": 2368} {"train_loss": -12.100692749023438, "global_step": 397963, "epoch": 2368} {"train_loss": -12.282129287719727, "global_step": 397964, "epoch": 2368} {"train_loss": -11.97989273071289, "global_step": 397965, "epoch": 2368} {"train_loss": -12.362869262695312, "global_step": 397966, "epoch": 2368} {"train_loss": -12.236722946166992, "global_step": 397967, "epoch": 2368} {"train_loss": -12.075506210327148, "global_step": 397968, "epoch": 2368} {"train_loss": -12.326242446899414, "global_step": 397969, "epoch": 2368} {"train_loss": -12.538212776184082, "global_step": 397970, "epoch": 2368} {"train_loss": -12.091643333435059, "global_step": 397971, "epoch": 2368} {"train_loss": -12.52566909790039, "global_step": 397972, "epoch": 2368} {"train_loss": -12.485763549804688, "global_step": 397973, "epoch": 2368} {"train_loss": -12.162554740905762, "global_step": 397974, "epoch": 2368} {"train_loss": -12.712924003601074, "global_step": 397975, "epoch": 2368} {"train_loss": -12.398212432861328, "global_step": 397976, "epoch": 2368} {"train_loss": -12.495499610900879, "global_step": 397977, "epoch": 2368} {"train_loss": -12.618728637695312, "global_step": 397978, "epoch": 2368} {"train_loss": -12.270923614501953, "global_step": 397979, "epoch": 2368} {"train_loss": -12.562997817993164, "global_step": 397980, "epoch": 2368} {"train_loss": -12.743563652038574, "global_step": 397981, "epoch": 2368} {"train_loss": -12.57400131225586, "global_step": 397982, "epoch": 2368} {"train_loss": -12.597049713134766, "global_step": 397983, "epoch": 2368} {"train_loss": -12.563756942749023, "global_step": 397984, "epoch": 2368} {"train_loss": -12.708084106445312, "global_step": 397985, "epoch": 2368} {"train_loss": -12.266339302062988, "global_step": 397986, "epoch": 2368} {"train_loss": -12.456136703491211, "global_step": 397987, "epoch": 2368} {"train_loss": -12.250986099243164, "global_step": 397988, "epoch": 2368} {"train_loss": -12.471782684326172, "global_step": 397989, "epoch": 2368} {"train_loss": -12.193044662475586, "global_step": 397990, "epoch": 2368} {"train_loss": -11.739524046579996, "global_step": 397991, "epoch": 2368, "val_loss": 293949.15625} {"train_loss": -12.14936637878418, "global_step": 397992, "epoch": 2369} {"train_loss": -12.313737869262695, "global_step": 397993, "epoch": 2369} {"train_loss": -12.59080696105957, "global_step": 397994, "epoch": 2369} {"train_loss": -12.105964660644531, "global_step": 397995, "epoch": 2369} {"train_loss": -11.8515043258667, "global_step": 397996, "epoch": 2369} {"train_loss": -11.925594329833984, "global_step": 397997, "epoch": 2369} {"train_loss": -12.267356872558594, "global_step": 397998, "epoch": 2369} {"train_loss": -11.684026718139648, "global_step": 397999, "epoch": 2369} {"train_loss": -11.138534545898438, "global_step": 398000, "epoch": 2369} {"train_loss": -11.62867546081543, "global_step": 398001, "epoch": 2369} {"train_loss": -12.328052520751953, "global_step": 398002, "epoch": 2369} {"train_loss": -11.717889785766602, "global_step": 398003, "epoch": 2369} {"train_loss": -11.927705764770508, "global_step": 398004, "epoch": 2369} {"train_loss": -12.021048545837402, "global_step": 398005, "epoch": 2369} {"train_loss": -12.307969093322754, "global_step": 398006, "epoch": 2369} {"train_loss": -11.999013900756836, "global_step": 398007, "epoch": 2369} {"train_loss": -12.347036361694336, "global_step": 398008, "epoch": 2369} {"train_loss": -12.404097557067871, "global_step": 398009, "epoch": 2369} {"train_loss": -11.797450065612793, "global_step": 398010, "epoch": 2369} {"train_loss": -12.217031478881836, "global_step": 398011, "epoch": 2369} {"train_loss": -12.574169158935547, "global_step": 398012, "epoch": 2369} {"train_loss": -11.803354263305664, "global_step": 398013, "epoch": 2369} {"train_loss": -11.833248138427734, "global_step": 398014, "epoch": 2369} {"train_loss": -12.2047700881958, "global_step": 398015, "epoch": 2369} {"train_loss": -11.016585350036621, "global_step": 398016, "epoch": 2369} {"train_loss": -11.72043228149414, "global_step": 398017, "epoch": 2369} {"train_loss": -12.008773803710938, "global_step": 398018, "epoch": 2369} {"train_loss": -10.986640930175781, "global_step": 398019, "epoch": 2369} {"train_loss": -11.084184646606445, "global_step": 398020, "epoch": 2369} {"train_loss": -11.845388412475586, "global_step": 398021, "epoch": 2369} {"train_loss": -9.874004364013672, "global_step": 398022, "epoch": 2369} {"train_loss": -12.192806243896484, "global_step": 398023, "epoch": 2369} {"train_loss": -10.779960632324219, "global_step": 398024, "epoch": 2369} {"train_loss": -11.247711181640625, "global_step": 398025, "epoch": 2369} {"train_loss": -11.922698974609375, "global_step": 398026, "epoch": 2369} {"train_loss": -11.147933959960938, "global_step": 398027, "epoch": 2369} {"train_loss": -10.815680503845215, "global_step": 398028, "epoch": 2369} {"train_loss": -11.022625923156738, "global_step": 398029, "epoch": 2369} {"train_loss": -11.59954833984375, "global_step": 398030, "epoch": 2369} {"train_loss": -11.459735870361328, "global_step": 398031, "epoch": 2369} {"train_loss": -11.480124473571777, "global_step": 398032, "epoch": 2369} {"train_loss": -12.28193473815918, "global_step": 398033, "epoch": 2369} {"train_loss": -11.666303634643555, "global_step": 398034, "epoch": 2369} {"train_loss": -12.020957946777344, "global_step": 398035, "epoch": 2369} {"train_loss": -11.50688362121582, "global_step": 398036, "epoch": 2369} {"train_loss": -11.824492454528809, "global_step": 398037, "epoch": 2369} {"train_loss": -12.044089317321777, "global_step": 398038, "epoch": 2369} {"train_loss": -11.523069381713867, "global_step": 398039, "epoch": 2369} {"train_loss": -12.229071617126465, "global_step": 398040, "epoch": 2369} {"train_loss": -11.842245101928711, "global_step": 398041, "epoch": 2369} {"train_loss": -11.7760009765625, "global_step": 398042, "epoch": 2369} {"train_loss": -11.934187889099121, "global_step": 398043, "epoch": 2369} {"train_loss": -11.847829818725586, "global_step": 398044, "epoch": 2369} {"train_loss": -11.38740348815918, "global_step": 398045, "epoch": 2369} {"train_loss": -11.98284912109375, "global_step": 398046, "epoch": 2369} {"train_loss": -11.765945434570312, "global_step": 398047, "epoch": 2369} {"train_loss": -12.17749309539795, "global_step": 398048, "epoch": 2369} {"train_loss": -12.158756256103516, "global_step": 398049, "epoch": 2369} {"train_loss": -11.801029205322266, "global_step": 398050, "epoch": 2369} {"train_loss": -12.39863395690918, "global_step": 398051, "epoch": 2369} {"train_loss": -11.099166870117188, "global_step": 398052, "epoch": 2369} {"train_loss": -11.83426570892334, "global_step": 398053, "epoch": 2369} {"train_loss": -11.886831283569336, "global_step": 398054, "epoch": 2369} {"train_loss": -11.887578964233398, "global_step": 398055, "epoch": 2369} {"train_loss": -12.226991653442383, "global_step": 398056, "epoch": 2369} {"train_loss": -11.502935409545898, "global_step": 398057, "epoch": 2369} {"train_loss": -12.343818664550781, "global_step": 398058, "epoch": 2369} {"train_loss": -11.38870906829834, "global_step": 398059, "epoch": 2369} {"train_loss": -11.97935676574707, "global_step": 398060, "epoch": 2369} {"train_loss": -11.498261451721191, "global_step": 398061, "epoch": 2369} {"train_loss": -11.223295211791992, "global_step": 398062, "epoch": 2369} {"train_loss": -11.97420597076416, "global_step": 398063, "epoch": 2369} {"train_loss": -11.624128341674805, "global_step": 398064, "epoch": 2369} {"train_loss": -11.743539810180664, "global_step": 398065, "epoch": 2369} {"train_loss": -11.721638679504395, "global_step": 398066, "epoch": 2369} {"train_loss": -11.72972297668457, "global_step": 398067, "epoch": 2369} {"train_loss": -11.298734664916992, "global_step": 398068, "epoch": 2369} {"train_loss": -11.540144920349121, "global_step": 398069, "epoch": 2369} {"train_loss": -11.624463081359863, "global_step": 398070, "epoch": 2369} {"train_loss": -11.915823936462402, "global_step": 398071, "epoch": 2369} {"train_loss": -11.691939353942871, "global_step": 398072, "epoch": 2369} {"train_loss": -12.426549911499023, "global_step": 398073, "epoch": 2369} {"train_loss": -11.315896034240723, "global_step": 398074, "epoch": 2369} {"train_loss": -12.357734680175781, "global_step": 398075, "epoch": 2369} {"train_loss": -12.104288101196289, "global_step": 398076, "epoch": 2369} {"train_loss": -12.185232162475586, "global_step": 398077, "epoch": 2369} {"train_loss": -11.957478523254395, "global_step": 398078, "epoch": 2369} {"train_loss": -11.589807510375977, "global_step": 398079, "epoch": 2369} {"train_loss": -12.22787857055664, "global_step": 398080, "epoch": 2369} {"train_loss": -12.191438674926758, "global_step": 398081, "epoch": 2369} {"train_loss": -12.226435661315918, "global_step": 398082, "epoch": 2369} {"train_loss": -12.09895133972168, "global_step": 398083, "epoch": 2369} {"train_loss": -12.33511734008789, "global_step": 398084, "epoch": 2369} {"train_loss": -12.288620948791504, "global_step": 398085, "epoch": 2369} {"train_loss": -12.222155570983887, "global_step": 398086, "epoch": 2369} {"train_loss": -12.574014663696289, "global_step": 398087, "epoch": 2369} {"train_loss": -12.197205543518066, "global_step": 398088, "epoch": 2369} {"train_loss": -12.323951721191406, "global_step": 398089, "epoch": 2369} {"train_loss": -12.196895599365234, "global_step": 398090, "epoch": 2369} {"train_loss": -12.107873916625977, "global_step": 398091, "epoch": 2369} {"train_loss": -12.353394508361816, "global_step": 398092, "epoch": 2369} {"train_loss": -12.479284286499023, "global_step": 398093, "epoch": 2369} {"train_loss": -12.375188827514648, "global_step": 398094, "epoch": 2369} {"train_loss": -12.59732437133789, "global_step": 398095, "epoch": 2369} {"train_loss": -12.312938690185547, "global_step": 398096, "epoch": 2369} {"train_loss": -12.237963676452637, "global_step": 398097, "epoch": 2369} {"train_loss": -12.412981033325195, "global_step": 398098, "epoch": 2369} {"train_loss": -12.269815444946289, "global_step": 398099, "epoch": 2369} {"train_loss": -12.381595611572266, "global_step": 398100, "epoch": 2369} {"train_loss": -12.449806213378906, "global_step": 398101, "epoch": 2369} {"train_loss": -12.493247985839844, "global_step": 398102, "epoch": 2369} {"train_loss": -12.636741638183594, "global_step": 398103, "epoch": 2369} {"train_loss": -12.69373607635498, "global_step": 398104, "epoch": 2369} {"train_loss": -12.46048355102539, "global_step": 398105, "epoch": 2369} {"train_loss": -12.567323684692383, "global_step": 398106, "epoch": 2369} {"train_loss": -12.395809173583984, "global_step": 398107, "epoch": 2369} {"train_loss": -12.590449333190918, "global_step": 398108, "epoch": 2369} {"train_loss": -12.409832000732422, "global_step": 398109, "epoch": 2369} {"train_loss": -12.626787185668945, "global_step": 398110, "epoch": 2369} {"train_loss": -12.272214889526367, "global_step": 398111, "epoch": 2369} {"train_loss": -12.64337158203125, "global_step": 398112, "epoch": 2369} {"train_loss": -12.415811538696289, "global_step": 398113, "epoch": 2369} {"train_loss": -12.739768028259277, "global_step": 398114, "epoch": 2369} {"train_loss": -12.433161735534668, "global_step": 398115, "epoch": 2369} {"train_loss": -12.671358108520508, "global_step": 398116, "epoch": 2369} {"train_loss": -12.170930862426758, "global_step": 398117, "epoch": 2369} {"train_loss": -12.69537353515625, "global_step": 398118, "epoch": 2369} {"train_loss": -12.54010009765625, "global_step": 398119, "epoch": 2369} {"train_loss": -12.683103561401367, "global_step": 398120, "epoch": 2369} {"train_loss": -12.336337089538574, "global_step": 398121, "epoch": 2369} {"train_loss": -12.704496383666992, "global_step": 398122, "epoch": 2369} {"train_loss": -12.28782844543457, "global_step": 398123, "epoch": 2369} {"train_loss": -12.22000503540039, "global_step": 398124, "epoch": 2369} {"train_loss": -12.538436889648438, "global_step": 398125, "epoch": 2369} {"train_loss": -12.556490898132324, "global_step": 398126, "epoch": 2369} {"train_loss": -12.656330108642578, "global_step": 398127, "epoch": 2369} {"train_loss": -12.645910263061523, "global_step": 398128, "epoch": 2369} {"train_loss": -12.621026039123535, "global_step": 398129, "epoch": 2369} {"train_loss": -12.839502334594727, "global_step": 398130, "epoch": 2369} {"train_loss": -11.99513053894043, "global_step": 398131, "epoch": 2369} {"train_loss": -12.356592178344727, "global_step": 398132, "epoch": 2369} {"train_loss": -12.0228271484375, "global_step": 398133, "epoch": 2369} {"train_loss": -12.420251846313477, "global_step": 398134, "epoch": 2369} {"train_loss": -12.630471229553223, "global_step": 398135, "epoch": 2369} {"train_loss": -12.580718994140625, "global_step": 398136, "epoch": 2369} {"train_loss": -12.47735595703125, "global_step": 398137, "epoch": 2369} {"train_loss": -12.727386474609375, "global_step": 398138, "epoch": 2369} {"train_loss": -12.652629852294922, "global_step": 398139, "epoch": 2369} {"train_loss": -12.611337661743164, "global_step": 398140, "epoch": 2369} {"train_loss": -12.471332550048828, "global_step": 398141, "epoch": 2369} {"train_loss": -12.703179359436035, "global_step": 398142, "epoch": 2369} {"train_loss": -12.113086700439453, "global_step": 398143, "epoch": 2369} {"train_loss": -12.220088958740234, "global_step": 398144, "epoch": 2369} {"train_loss": -12.489531517028809, "global_step": 398145, "epoch": 2369} {"train_loss": -12.332897186279297, "global_step": 398146, "epoch": 2369} {"train_loss": -12.150145530700684, "global_step": 398147, "epoch": 2369} {"train_loss": -12.295648574829102, "global_step": 398148, "epoch": 2369} {"train_loss": -12.31848430633545, "global_step": 398149, "epoch": 2369} {"train_loss": -12.705785751342773, "global_step": 398150, "epoch": 2369} {"train_loss": -11.404269218444824, "global_step": 398151, "epoch": 2369} {"train_loss": -12.539642333984375, "global_step": 398152, "epoch": 2369} {"train_loss": -11.916743278503418, "global_step": 398153, "epoch": 2369} {"train_loss": -12.296916007995605, "global_step": 398154, "epoch": 2369} {"train_loss": -11.837006568908691, "global_step": 398155, "epoch": 2369} {"train_loss": -11.899839401245117, "global_step": 398156, "epoch": 2369} {"train_loss": -12.121073722839355, "global_step": 398157, "epoch": 2369} {"train_loss": -11.534982681274414, "global_step": 398158, "epoch": 2369} {"train_loss": -12.056380646569389, "global_step": 398159, "epoch": 2369, "val_loss": 293026.53125} {"train_loss": -11.72983455657959, "global_step": 398160, "epoch": 2370} {"train_loss": -9.426507949829102, "global_step": 398161, "epoch": 2370} {"train_loss": -11.01242446899414, "global_step": 398162, "epoch": 2370} {"train_loss": -7.23621940612793, "global_step": 398163, "epoch": 2370} {"train_loss": -6.943350791931152, "global_step": 398164, "epoch": 2370} {"train_loss": -6.464265823364258, "global_step": 398165, "epoch": 2370} {"train_loss": -5.7801103591918945, "global_step": 398166, "epoch": 2370} {"train_loss": -6.382733345031738, "global_step": 398167, "epoch": 2370} {"train_loss": -7.0081048011779785, "global_step": 398168, "epoch": 2370} {"train_loss": -6.944548606872559, "global_step": 398169, "epoch": 2370} {"train_loss": -6.646455764770508, "global_step": 398170, "epoch": 2370} {"train_loss": -7.461852073669434, "global_step": 398171, "epoch": 2370} {"train_loss": -7.080509662628174, "global_step": 398172, "epoch": 2370} {"train_loss": -6.947566509246826, "global_step": 398173, "epoch": 2370} {"train_loss": -8.085647583007812, "global_step": 398174, "epoch": 2370} {"train_loss": -7.815122604370117, "global_step": 398175, "epoch": 2370} {"train_loss": -7.183545112609863, "global_step": 398176, "epoch": 2370} {"train_loss": -7.537357330322266, "global_step": 398177, "epoch": 2370} {"train_loss": -8.404438018798828, "global_step": 398178, "epoch": 2370} {"train_loss": -8.164819717407227, "global_step": 398179, "epoch": 2370} {"train_loss": -7.55001163482666, "global_step": 398180, "epoch": 2370} {"train_loss": -8.482137680053711, "global_step": 398181, "epoch": 2370} {"train_loss": -7.872468948364258, "global_step": 398182, "epoch": 2370} {"train_loss": -8.729086875915527, "global_step": 398183, "epoch": 2370} {"train_loss": -8.82229232788086, "global_step": 398184, "epoch": 2370} {"train_loss": -8.74557113647461, "global_step": 398185, "epoch": 2370} {"train_loss": -9.087018966674805, "global_step": 398186, "epoch": 2370} {"train_loss": -9.564332962036133, "global_step": 398187, "epoch": 2370} {"train_loss": -9.577685356140137, "global_step": 398188, "epoch": 2370} {"train_loss": -9.293632507324219, "global_step": 398189, "epoch": 2370} {"train_loss": -9.828007698059082, "global_step": 398190, "epoch": 2370} {"train_loss": -10.245146751403809, "global_step": 398191, "epoch": 2370} {"train_loss": -10.199840545654297, "global_step": 398192, "epoch": 2370} {"train_loss": -9.483220100402832, "global_step": 398193, "epoch": 2370} {"train_loss": -10.251861572265625, "global_step": 398194, "epoch": 2370} {"train_loss": -10.852277755737305, "global_step": 398195, "epoch": 2370} {"train_loss": -10.246541976928711, "global_step": 398196, "epoch": 2370} {"train_loss": -10.967306137084961, "global_step": 398197, "epoch": 2370} {"train_loss": -10.098135948181152, "global_step": 398198, "epoch": 2370} {"train_loss": -11.481693267822266, "global_step": 398199, "epoch": 2370} {"train_loss": -10.451904296875, "global_step": 398200, "epoch": 2370} {"train_loss": -10.037983894348145, "global_step": 398201, "epoch": 2370} {"train_loss": -11.441474914550781, "global_step": 398202, "epoch": 2370} {"train_loss": -10.263311386108398, "global_step": 398203, "epoch": 2370} {"train_loss": -10.497800827026367, "global_step": 398204, "epoch": 2370} {"train_loss": -11.081673622131348, "global_step": 398205, "epoch": 2370} {"train_loss": -11.144242286682129, "global_step": 398206, "epoch": 2370} {"train_loss": -11.006590843200684, "global_step": 398207, "epoch": 2370} {"train_loss": -10.963194847106934, "global_step": 398208, "epoch": 2370} {"train_loss": -11.018451690673828, "global_step": 398209, "epoch": 2370} {"train_loss": -11.077262878417969, "global_step": 398210, "epoch": 2370} {"train_loss": -10.82781982421875, "global_step": 398211, "epoch": 2370} {"train_loss": -10.885566711425781, "global_step": 398212, "epoch": 2370} {"train_loss": -11.158041954040527, "global_step": 398213, "epoch": 2370} {"train_loss": -11.453965187072754, "global_step": 398214, "epoch": 2370} {"train_loss": -11.080377578735352, "global_step": 398215, "epoch": 2370} {"train_loss": -11.84027099609375, "global_step": 398216, "epoch": 2370} {"train_loss": -11.193334579467773, "global_step": 398217, "epoch": 2370} {"train_loss": -11.88418960571289, "global_step": 398218, "epoch": 2370} {"train_loss": -11.85894775390625, "global_step": 398219, "epoch": 2370} {"train_loss": -11.209434509277344, "global_step": 398220, "epoch": 2370} {"train_loss": -11.9951171875, "global_step": 398221, "epoch": 2370} {"train_loss": -11.845199584960938, "global_step": 398222, "epoch": 2370} {"train_loss": -12.070852279663086, "global_step": 398223, "epoch": 2370} {"train_loss": -11.821206092834473, "global_step": 398224, "epoch": 2370} {"train_loss": -11.803057670593262, "global_step": 398225, "epoch": 2370} {"train_loss": -11.473848342895508, "global_step": 398226, "epoch": 2370} {"train_loss": -11.625044822692871, "global_step": 398227, "epoch": 2370} {"train_loss": -11.930524826049805, "global_step": 398228, "epoch": 2370} {"train_loss": -11.580228805541992, "global_step": 398229, "epoch": 2370} {"train_loss": -12.184820175170898, "global_step": 398230, "epoch": 2370} {"train_loss": -11.954771041870117, "global_step": 398231, "epoch": 2370} {"train_loss": -11.852569580078125, "global_step": 398232, "epoch": 2370} {"train_loss": -11.898961067199707, "global_step": 398233, "epoch": 2370} {"train_loss": -12.18364429473877, "global_step": 398234, "epoch": 2370} {"train_loss": -11.71095085144043, "global_step": 398235, "epoch": 2370} {"train_loss": -12.220788955688477, "global_step": 398236, "epoch": 2370} {"train_loss": -11.88490104675293, "global_step": 398237, "epoch": 2370} {"train_loss": -12.078496932983398, "global_step": 398238, "epoch": 2370} {"train_loss": -12.144121170043945, "global_step": 398239, "epoch": 2370} {"train_loss": -12.148733139038086, "global_step": 398240, "epoch": 2370} {"train_loss": -12.009977340698242, "global_step": 398241, "epoch": 2370} {"train_loss": -12.003377914428711, "global_step": 398242, "epoch": 2370} {"train_loss": -12.147140502929688, "global_step": 398243, "epoch": 2370} {"train_loss": -11.921324729919434, "global_step": 398244, "epoch": 2370} {"train_loss": -12.284698486328125, "global_step": 398245, "epoch": 2370} {"train_loss": -11.763893127441406, "global_step": 398246, "epoch": 2370} {"train_loss": -12.374748229980469, "global_step": 398247, "epoch": 2370} {"train_loss": -11.95296859741211, "global_step": 398248, "epoch": 2370} {"train_loss": -12.361388206481934, "global_step": 398249, "epoch": 2370} {"train_loss": -12.117443084716797, "global_step": 398250, "epoch": 2370} {"train_loss": -12.362539291381836, "global_step": 398251, "epoch": 2370} {"train_loss": -12.110950469970703, "global_step": 398252, "epoch": 2370} {"train_loss": -11.728141784667969, "global_step": 398253, "epoch": 2370} {"train_loss": -12.381532669067383, "global_step": 398254, "epoch": 2370} {"train_loss": -11.661499977111816, "global_step": 398255, "epoch": 2370} {"train_loss": -12.145637512207031, "global_step": 398256, "epoch": 2370} {"train_loss": -12.383902549743652, "global_step": 398257, "epoch": 2370} {"train_loss": -12.26380729675293, "global_step": 398258, "epoch": 2370} {"train_loss": -11.976984977722168, "global_step": 398259, "epoch": 2370} {"train_loss": -12.088842391967773, "global_step": 398260, "epoch": 2370} {"train_loss": -12.277063369750977, "global_step": 398261, "epoch": 2370} {"train_loss": -12.129677772521973, "global_step": 398262, "epoch": 2370} {"train_loss": -12.259085655212402, "global_step": 398263, "epoch": 2370} {"train_loss": -12.277267456054688, "global_step": 398264, "epoch": 2370} {"train_loss": -12.222484588623047, "global_step": 398265, "epoch": 2370} {"train_loss": -12.103767395019531, "global_step": 398266, "epoch": 2370} {"train_loss": -12.229185104370117, "global_step": 398267, "epoch": 2370} {"train_loss": -12.390652656555176, "global_step": 398268, "epoch": 2370} {"train_loss": -12.218208312988281, "global_step": 398269, "epoch": 2370} {"train_loss": -12.336532592773438, "global_step": 398270, "epoch": 2370} {"train_loss": -12.238812446594238, "global_step": 398271, "epoch": 2370} {"train_loss": -12.365327835083008, "global_step": 398272, "epoch": 2370} {"train_loss": -12.583141326904297, "global_step": 398273, "epoch": 2370} {"train_loss": -12.305374145507812, "global_step": 398274, "epoch": 2370} {"train_loss": -12.461819648742676, "global_step": 398275, "epoch": 2370} {"train_loss": -12.051248550415039, "global_step": 398276, "epoch": 2370} {"train_loss": -12.177755355834961, "global_step": 398277, "epoch": 2370} {"train_loss": -12.428117752075195, "global_step": 398278, "epoch": 2370} {"train_loss": -12.137114524841309, "global_step": 398279, "epoch": 2370} {"train_loss": -12.080944061279297, "global_step": 398280, "epoch": 2370} {"train_loss": -12.324884414672852, "global_step": 398281, "epoch": 2370} {"train_loss": -11.829132080078125, "global_step": 398282, "epoch": 2370} {"train_loss": -12.114278793334961, "global_step": 398283, "epoch": 2370} {"train_loss": -12.350507736206055, "global_step": 398284, "epoch": 2370} {"train_loss": -11.551918029785156, "global_step": 398285, "epoch": 2370} {"train_loss": -12.306864738464355, "global_step": 398286, "epoch": 2370} {"train_loss": -11.958125114440918, "global_step": 398287, "epoch": 2370} {"train_loss": -12.41326904296875, "global_step": 398288, "epoch": 2370} {"train_loss": -12.45372200012207, "global_step": 398289, "epoch": 2370} {"train_loss": -12.206575393676758, "global_step": 398290, "epoch": 2370} {"train_loss": -12.305761337280273, "global_step": 398291, "epoch": 2370} {"train_loss": -12.134622573852539, "global_step": 398292, "epoch": 2370} {"train_loss": -12.062309265136719, "global_step": 398293, "epoch": 2370} {"train_loss": -12.24440860748291, "global_step": 398294, "epoch": 2370} {"train_loss": -12.301835060119629, "global_step": 398295, "epoch": 2370} {"train_loss": -12.338094711303711, "global_step": 398296, "epoch": 2370} {"train_loss": -12.233257293701172, "global_step": 398297, "epoch": 2370} {"train_loss": -12.565338134765625, "global_step": 398298, "epoch": 2370} {"train_loss": -12.065229415893555, "global_step": 398299, "epoch": 2370} {"train_loss": -12.415672302246094, "global_step": 398300, "epoch": 2370} {"train_loss": -12.44804859161377, "global_step": 398301, "epoch": 2370} {"train_loss": -12.371004104614258, "global_step": 398302, "epoch": 2370} {"train_loss": -12.404058456420898, "global_step": 398303, "epoch": 2370} {"train_loss": -12.348472595214844, "global_step": 398304, "epoch": 2370} {"train_loss": -12.530160903930664, "global_step": 398305, "epoch": 2370} {"train_loss": -12.512065887451172, "global_step": 398306, "epoch": 2370} {"train_loss": -12.661882400512695, "global_step": 398307, "epoch": 2370} {"train_loss": -12.637943267822266, "global_step": 398308, "epoch": 2370} {"train_loss": -12.490043640136719, "global_step": 398309, "epoch": 2370} {"train_loss": -12.782065391540527, "global_step": 398310, "epoch": 2370} {"train_loss": -12.54318618774414, "global_step": 398311, "epoch": 2370} {"train_loss": -12.592880249023438, "global_step": 398312, "epoch": 2370} {"train_loss": -12.574006080627441, "global_step": 398313, "epoch": 2370} {"train_loss": -12.56277847290039, "global_step": 398314, "epoch": 2370} {"train_loss": -12.637447357177734, "global_step": 398315, "epoch": 2370} {"train_loss": -12.563690185546875, "global_step": 398316, "epoch": 2370} {"train_loss": -12.733391761779785, "global_step": 398317, "epoch": 2370} {"train_loss": -12.78751277923584, "global_step": 398318, "epoch": 2370} {"train_loss": -12.681636810302734, "global_step": 398319, "epoch": 2370} {"train_loss": -12.771299362182617, "global_step": 398320, "epoch": 2370} {"train_loss": -12.541393280029297, "global_step": 398321, "epoch": 2370} {"train_loss": -12.78054428100586, "global_step": 398322, "epoch": 2370} {"train_loss": -12.70368766784668, "global_step": 398323, "epoch": 2370} {"train_loss": -12.361042022705078, "global_step": 398324, "epoch": 2370} {"train_loss": -12.55362319946289, "global_step": 398325, "epoch": 2370} {"train_loss": -12.721293449401855, "global_step": 398326, "epoch": 2370} {"train_loss": -11.236997828597115, "global_step": 398327, "epoch": 2370, "val_loss": 296142.25, "train_action_mse_error": 1.145097255706787} {"train_loss": -12.508249282836914, "global_step": 398328, "epoch": 2371} {"train_loss": -12.369643211364746, "global_step": 398329, "epoch": 2371} {"train_loss": -12.465424537658691, "global_step": 398330, "epoch": 2371} {"train_loss": -11.615141868591309, "global_step": 398331, "epoch": 2371} {"train_loss": -11.362462997436523, "global_step": 398332, "epoch": 2371} {"train_loss": -11.936670303344727, "global_step": 398333, "epoch": 2371} {"train_loss": -12.223684310913086, "global_step": 398334, "epoch": 2371} {"train_loss": -11.498485565185547, "global_step": 398335, "epoch": 2371} {"train_loss": -12.319453239440918, "global_step": 398336, "epoch": 2371} {"train_loss": -12.007966995239258, "global_step": 398337, "epoch": 2371} {"train_loss": -11.519257545471191, "global_step": 398338, "epoch": 2371} {"train_loss": -11.925507545471191, "global_step": 398339, "epoch": 2371} {"train_loss": -12.476516723632812, "global_step": 398340, "epoch": 2371} {"train_loss": -11.320863723754883, "global_step": 398341, "epoch": 2371} {"train_loss": -11.868511199951172, "global_step": 398342, "epoch": 2371} {"train_loss": -12.209819793701172, "global_step": 398343, "epoch": 2371} {"train_loss": -12.607274055480957, "global_step": 398344, "epoch": 2371} {"train_loss": -11.716711044311523, "global_step": 398345, "epoch": 2371} {"train_loss": -12.406820297241211, "global_step": 398346, "epoch": 2371} {"train_loss": -12.436456680297852, "global_step": 398347, "epoch": 2371} {"train_loss": -12.406231880187988, "global_step": 398348, "epoch": 2371} {"train_loss": -12.546195030212402, "global_step": 398349, "epoch": 2371} {"train_loss": -12.102523803710938, "global_step": 398350, "epoch": 2371} {"train_loss": -12.159435272216797, "global_step": 398351, "epoch": 2371} {"train_loss": -11.895286560058594, "global_step": 398352, "epoch": 2371} {"train_loss": -12.380922317504883, "global_step": 398353, "epoch": 2371} {"train_loss": -12.151479721069336, "global_step": 398354, "epoch": 2371} {"train_loss": -12.260982513427734, "global_step": 398355, "epoch": 2371} {"train_loss": -12.058541297912598, "global_step": 398356, "epoch": 2371} {"train_loss": -12.243976593017578, "global_step": 398357, "epoch": 2371} {"train_loss": -12.268342018127441, "global_step": 398358, "epoch": 2371} {"train_loss": -12.800912857055664, "global_step": 398359, "epoch": 2371} {"train_loss": -12.02102279663086, "global_step": 398360, "epoch": 2371} {"train_loss": -12.601248741149902, "global_step": 398361, "epoch": 2371} {"train_loss": -11.993278503417969, "global_step": 398362, "epoch": 2371} {"train_loss": -11.714570999145508, "global_step": 398363, "epoch": 2371} {"train_loss": -11.713425636291504, "global_step": 398364, "epoch": 2371} {"train_loss": -12.392524719238281, "global_step": 398365, "epoch": 2371} {"train_loss": -11.81273365020752, "global_step": 398366, "epoch": 2371} {"train_loss": -11.147464752197266, "global_step": 398367, "epoch": 2371} {"train_loss": -9.860092163085938, "global_step": 398368, "epoch": 2371} {"train_loss": -11.129390716552734, "global_step": 398369, "epoch": 2371} {"train_loss": -11.326436996459961, "global_step": 398370, "epoch": 2371} {"train_loss": -9.75438117980957, "global_step": 398371, "epoch": 2371} {"train_loss": -10.19553279876709, "global_step": 398372, "epoch": 2371} {"train_loss": -8.327388763427734, "global_step": 398373, "epoch": 2371} {"train_loss": -7.495204448699951, "global_step": 398374, "epoch": 2371} {"train_loss": -7.796194076538086, "global_step": 398375, "epoch": 2371} {"train_loss": -8.205848693847656, "global_step": 398376, "epoch": 2371} {"train_loss": -7.8417253494262695, "global_step": 398377, "epoch": 2371} {"train_loss": -7.463507175445557, "global_step": 398378, "epoch": 2371} {"train_loss": -7.128123760223389, "global_step": 398379, "epoch": 2371} {"train_loss": -8.461444854736328, "global_step": 398380, "epoch": 2371} {"train_loss": -8.261890411376953, "global_step": 398381, "epoch": 2371} {"train_loss": -8.213242530822754, "global_step": 398382, "epoch": 2371} {"train_loss": -8.050117492675781, "global_step": 398383, "epoch": 2371} {"train_loss": -7.870073318481445, "global_step": 398384, "epoch": 2371} {"train_loss": -8.537498474121094, "global_step": 398385, "epoch": 2371} {"train_loss": -8.19678783416748, "global_step": 398386, "epoch": 2371} {"train_loss": -8.725680351257324, "global_step": 398387, "epoch": 2371} {"train_loss": -8.34829330444336, "global_step": 398388, "epoch": 2371} {"train_loss": -8.548016548156738, "global_step": 398389, "epoch": 2371} {"train_loss": -8.470830917358398, "global_step": 398390, "epoch": 2371} {"train_loss": -9.493758201599121, "global_step": 398391, "epoch": 2371} {"train_loss": -8.981948852539062, "global_step": 398392, "epoch": 2371} {"train_loss": -8.96725845336914, "global_step": 398393, "epoch": 2371} {"train_loss": -9.31496810913086, "global_step": 398394, "epoch": 2371} {"train_loss": -9.642929077148438, "global_step": 398395, "epoch": 2371} {"train_loss": -9.898223876953125, "global_step": 398396, "epoch": 2371} {"train_loss": -9.510553359985352, "global_step": 398397, "epoch": 2371} {"train_loss": -9.224584579467773, "global_step": 398398, "epoch": 2371} {"train_loss": -10.604913711547852, "global_step": 398399, "epoch": 2371} {"train_loss": -10.454309463500977, "global_step": 398400, "epoch": 2371} {"train_loss": -10.856988906860352, "global_step": 398401, "epoch": 2371} {"train_loss": -10.568378448486328, "global_step": 398402, "epoch": 2371} {"train_loss": -10.547300338745117, "global_step": 398403, "epoch": 2371} {"train_loss": -10.649724006652832, "global_step": 398404, "epoch": 2371} {"train_loss": -11.290790557861328, "global_step": 398405, "epoch": 2371} {"train_loss": -11.059558868408203, "global_step": 398406, "epoch": 2371} {"train_loss": -11.019661903381348, "global_step": 398407, "epoch": 2371} {"train_loss": -11.39661693572998, "global_step": 398408, "epoch": 2371} {"train_loss": -11.272831916809082, "global_step": 398409, "epoch": 2371} {"train_loss": -11.179523468017578, "global_step": 398410, "epoch": 2371} {"train_loss": -11.231245994567871, "global_step": 398411, "epoch": 2371} {"train_loss": -11.236539840698242, "global_step": 398412, "epoch": 2371} {"train_loss": -11.523887634277344, "global_step": 398413, "epoch": 2371} {"train_loss": -11.658016204833984, "global_step": 398414, "epoch": 2371} {"train_loss": -11.813108444213867, "global_step": 398415, "epoch": 2371} {"train_loss": -11.550873756408691, "global_step": 398416, "epoch": 2371} {"train_loss": -11.983034133911133, "global_step": 398417, "epoch": 2371} {"train_loss": -11.677757263183594, "global_step": 398418, "epoch": 2371} {"train_loss": -11.988898277282715, "global_step": 398419, "epoch": 2371} {"train_loss": -11.811222076416016, "global_step": 398420, "epoch": 2371} {"train_loss": -11.280049324035645, "global_step": 398421, "epoch": 2371} {"train_loss": -12.045289993286133, "global_step": 398422, "epoch": 2371} {"train_loss": -12.092547416687012, "global_step": 398423, "epoch": 2371} {"train_loss": -12.050270080566406, "global_step": 398424, "epoch": 2371} {"train_loss": -11.954110145568848, "global_step": 398425, "epoch": 2371} {"train_loss": -12.1521635055542, "global_step": 398426, "epoch": 2371} {"train_loss": -11.807123184204102, "global_step": 398427, "epoch": 2371} {"train_loss": -12.181057929992676, "global_step": 398428, "epoch": 2371} {"train_loss": -11.91552448272705, "global_step": 398429, "epoch": 2371} {"train_loss": -11.309188842773438, "global_step": 398430, "epoch": 2371} {"train_loss": -12.153968811035156, "global_step": 398431, "epoch": 2371} {"train_loss": -12.019486427307129, "global_step": 398432, "epoch": 2371} {"train_loss": -12.017877578735352, "global_step": 398433, "epoch": 2371} {"train_loss": -12.057077407836914, "global_step": 398434, "epoch": 2371} {"train_loss": -11.957735061645508, "global_step": 398435, "epoch": 2371} {"train_loss": -11.839508056640625, "global_step": 398436, "epoch": 2371} {"train_loss": -12.07844352722168, "global_step": 398437, "epoch": 2371} {"train_loss": -12.117362976074219, "global_step": 398438, "epoch": 2371} {"train_loss": -12.236026763916016, "global_step": 398439, "epoch": 2371} {"train_loss": -11.982039451599121, "global_step": 398440, "epoch": 2371} {"train_loss": -12.241927146911621, "global_step": 398441, "epoch": 2371} {"train_loss": -11.947070121765137, "global_step": 398442, "epoch": 2371} {"train_loss": -12.455305099487305, "global_step": 398443, "epoch": 2371} {"train_loss": -12.027369499206543, "global_step": 398444, "epoch": 2371} {"train_loss": -12.481842994689941, "global_step": 398445, "epoch": 2371} {"train_loss": -12.370347023010254, "global_step": 398446, "epoch": 2371} {"train_loss": -12.283902168273926, "global_step": 398447, "epoch": 2371} {"train_loss": -12.10722827911377, "global_step": 398448, "epoch": 2371} {"train_loss": -12.151926040649414, "global_step": 398449, "epoch": 2371} {"train_loss": -12.516660690307617, "global_step": 398450, "epoch": 2371} {"train_loss": -12.470504760742188, "global_step": 398451, "epoch": 2371} {"train_loss": -12.282715797424316, "global_step": 398452, "epoch": 2371} {"train_loss": -11.956040382385254, "global_step": 398453, "epoch": 2371} {"train_loss": -12.266677856445312, "global_step": 398454, "epoch": 2371} {"train_loss": -11.9677095413208, "global_step": 398455, "epoch": 2371} {"train_loss": -12.202193260192871, "global_step": 398456, "epoch": 2371} {"train_loss": -12.443198204040527, "global_step": 398457, "epoch": 2371} {"train_loss": -12.470624923706055, "global_step": 398458, "epoch": 2371} {"train_loss": -12.460350036621094, "global_step": 398459, "epoch": 2371} {"train_loss": -12.341691970825195, "global_step": 398460, "epoch": 2371} {"train_loss": -12.50649642944336, "global_step": 398461, "epoch": 2371} {"train_loss": -12.233806610107422, "global_step": 398462, "epoch": 2371} {"train_loss": -12.40478515625, "global_step": 398463, "epoch": 2371} {"train_loss": -12.291851997375488, "global_step": 398464, "epoch": 2371} {"train_loss": -12.39950180053711, "global_step": 398465, "epoch": 2371} {"train_loss": -12.434513092041016, "global_step": 398466, "epoch": 2371} {"train_loss": -12.283493041992188, "global_step": 398467, "epoch": 2371} {"train_loss": -11.92253303527832, "global_step": 398468, "epoch": 2371} {"train_loss": -12.390673637390137, "global_step": 398469, "epoch": 2371} {"train_loss": -11.864351272583008, "global_step": 398470, "epoch": 2371} {"train_loss": -11.82131576538086, "global_step": 398471, "epoch": 2371} {"train_loss": -12.081220626831055, "global_step": 398472, "epoch": 2371} {"train_loss": -12.250208854675293, "global_step": 398473, "epoch": 2371} {"train_loss": -11.896394729614258, "global_step": 398474, "epoch": 2371} {"train_loss": -11.786117553710938, "global_step": 398475, "epoch": 2371} {"train_loss": -12.416606903076172, "global_step": 398476, "epoch": 2371} {"train_loss": -12.46480941772461, "global_step": 398477, "epoch": 2371} {"train_loss": -12.240522384643555, "global_step": 398478, "epoch": 2371} {"train_loss": -12.621295928955078, "global_step": 398479, "epoch": 2371} {"train_loss": -12.21450424194336, "global_step": 398480, "epoch": 2371} {"train_loss": -12.444790840148926, "global_step": 398481, "epoch": 2371} {"train_loss": -12.237921714782715, "global_step": 398482, "epoch": 2371} {"train_loss": -12.207645416259766, "global_step": 398483, "epoch": 2371} {"train_loss": -12.326131820678711, "global_step": 398484, "epoch": 2371} {"train_loss": -11.688308715820312, "global_step": 398485, "epoch": 2371} {"train_loss": -12.17856502532959, "global_step": 398486, "epoch": 2371} {"train_loss": -12.060420989990234, "global_step": 398487, "epoch": 2371} {"train_loss": -11.737737655639648, "global_step": 398488, "epoch": 2371} {"train_loss": -12.277552604675293, "global_step": 398489, "epoch": 2371} {"train_loss": -11.880050659179688, "global_step": 398490, "epoch": 2371} {"train_loss": -11.122180938720703, "global_step": 398491, "epoch": 2371} {"train_loss": -12.346500396728516, "global_step": 398492, "epoch": 2371} {"train_loss": -12.268386840820312, "global_step": 398493, "epoch": 2371} {"train_loss": -12.375494003295898, "global_step": 398494, "epoch": 2371} {"train_loss": -11.395354739257268, "global_step": 398495, "epoch": 2371, "val_loss": 304357.0625} {"train_loss": -12.251141548156738, "global_step": 398496, "epoch": 2372} {"train_loss": -12.259265899658203, "global_step": 398497, "epoch": 2372} {"train_loss": -12.452255249023438, "global_step": 398498, "epoch": 2372} {"train_loss": -12.41639232635498, "global_step": 398499, "epoch": 2372} {"train_loss": -12.55830192565918, "global_step": 398500, "epoch": 2372} {"train_loss": -12.143117904663086, "global_step": 398501, "epoch": 2372} {"train_loss": -12.705677032470703, "global_step": 398502, "epoch": 2372} {"train_loss": -11.956019401550293, "global_step": 398503, "epoch": 2372} {"train_loss": -12.351306915283203, "global_step": 398504, "epoch": 2372} {"train_loss": -12.523879051208496, "global_step": 398505, "epoch": 2372} {"train_loss": -11.902555465698242, "global_step": 398506, "epoch": 2372} {"train_loss": -11.593790054321289, "global_step": 398507, "epoch": 2372} {"train_loss": -12.311939239501953, "global_step": 398508, "epoch": 2372} {"train_loss": -12.246837615966797, "global_step": 398509, "epoch": 2372} {"train_loss": -11.985572814941406, "global_step": 398510, "epoch": 2372} {"train_loss": -12.217321395874023, "global_step": 398511, "epoch": 2372} {"train_loss": -12.492612838745117, "global_step": 398512, "epoch": 2372} {"train_loss": -12.055326461791992, "global_step": 398513, "epoch": 2372} {"train_loss": -12.079442977905273, "global_step": 398514, "epoch": 2372} {"train_loss": -12.706180572509766, "global_step": 398515, "epoch": 2372} {"train_loss": -12.187021255493164, "global_step": 398516, "epoch": 2372} {"train_loss": -12.376237869262695, "global_step": 398517, "epoch": 2372} {"train_loss": -12.53890323638916, "global_step": 398518, "epoch": 2372} {"train_loss": -12.339120864868164, "global_step": 398519, "epoch": 2372} {"train_loss": -12.333271026611328, "global_step": 398520, "epoch": 2372} {"train_loss": -12.755138397216797, "global_step": 398521, "epoch": 2372} {"train_loss": -12.541735649108887, "global_step": 398522, "epoch": 2372} {"train_loss": -12.463479042053223, "global_step": 398523, "epoch": 2372} {"train_loss": -12.747095108032227, "global_step": 398524, "epoch": 2372} {"train_loss": -12.322561264038086, "global_step": 398525, "epoch": 2372} {"train_loss": -12.657588005065918, "global_step": 398526, "epoch": 2372} {"train_loss": -12.190685272216797, "global_step": 398527, "epoch": 2372} {"train_loss": -12.400690078735352, "global_step": 398528, "epoch": 2372} {"train_loss": -12.569963455200195, "global_step": 398529, "epoch": 2372} {"train_loss": -12.192049026489258, "global_step": 398530, "epoch": 2372} {"train_loss": -12.152852058410645, "global_step": 398531, "epoch": 2372} {"train_loss": -12.451539993286133, "global_step": 398532, "epoch": 2372} {"train_loss": -12.038507461547852, "global_step": 398533, "epoch": 2372} {"train_loss": -11.792378425598145, "global_step": 398534, "epoch": 2372} {"train_loss": -11.775211334228516, "global_step": 398535, "epoch": 2372} {"train_loss": -11.869802474975586, "global_step": 398536, "epoch": 2372} {"train_loss": -12.070541381835938, "global_step": 398537, "epoch": 2372} {"train_loss": -11.856367111206055, "global_step": 398538, "epoch": 2372} {"train_loss": -11.624831199645996, "global_step": 398539, "epoch": 2372} {"train_loss": -11.483009338378906, "global_step": 398540, "epoch": 2372} {"train_loss": -11.34614372253418, "global_step": 398541, "epoch": 2372} {"train_loss": -11.45211410522461, "global_step": 398542, "epoch": 2372} {"train_loss": -11.134297370910645, "global_step": 398543, "epoch": 2372} {"train_loss": -12.372873306274414, "global_step": 398544, "epoch": 2372} {"train_loss": -10.699213027954102, "global_step": 398545, "epoch": 2372} {"train_loss": -11.543184280395508, "global_step": 398546, "epoch": 2372} {"train_loss": -11.3932466506958, "global_step": 398547, "epoch": 2372} {"train_loss": -12.009599685668945, "global_step": 398548, "epoch": 2372} {"train_loss": -11.026013374328613, "global_step": 398549, "epoch": 2372} {"train_loss": -11.89200210571289, "global_step": 398550, "epoch": 2372} {"train_loss": -11.687562942504883, "global_step": 398551, "epoch": 2372} {"train_loss": -11.814092636108398, "global_step": 398552, "epoch": 2372} {"train_loss": -11.924049377441406, "global_step": 398553, "epoch": 2372} {"train_loss": -12.305804252624512, "global_step": 398554, "epoch": 2372} {"train_loss": -11.721674919128418, "global_step": 398555, "epoch": 2372} {"train_loss": -11.669036865234375, "global_step": 398556, "epoch": 2372} {"train_loss": -12.154170989990234, "global_step": 398557, "epoch": 2372} {"train_loss": -12.200719833374023, "global_step": 398558, "epoch": 2372} {"train_loss": -12.336324691772461, "global_step": 398559, "epoch": 2372} {"train_loss": -12.006317138671875, "global_step": 398560, "epoch": 2372} {"train_loss": -12.09184741973877, "global_step": 398561, "epoch": 2372} {"train_loss": -12.318758010864258, "global_step": 398562, "epoch": 2372} {"train_loss": -12.179292678833008, "global_step": 398563, "epoch": 2372} {"train_loss": -11.896387100219727, "global_step": 398564, "epoch": 2372} {"train_loss": -12.50940990447998, "global_step": 398565, "epoch": 2372} {"train_loss": -12.288575172424316, "global_step": 398566, "epoch": 2372} {"train_loss": -12.1908540725708, "global_step": 398567, "epoch": 2372} {"train_loss": -11.95455551147461, "global_step": 398568, "epoch": 2372} {"train_loss": -11.790888786315918, "global_step": 398569, "epoch": 2372} {"train_loss": -11.259214401245117, "global_step": 398570, "epoch": 2372} {"train_loss": -12.355620384216309, "global_step": 398571, "epoch": 2372} {"train_loss": -11.44245719909668, "global_step": 398572, "epoch": 2372} {"train_loss": -11.922492980957031, "global_step": 398573, "epoch": 2372} {"train_loss": -12.04066276550293, "global_step": 398574, "epoch": 2372} {"train_loss": -11.866008758544922, "global_step": 398575, "epoch": 2372} {"train_loss": -12.417882919311523, "global_step": 398576, "epoch": 2372} {"train_loss": -11.350652694702148, "global_step": 398577, "epoch": 2372} {"train_loss": -12.12195873260498, "global_step": 398578, "epoch": 2372} {"train_loss": -11.664474487304688, "global_step": 398579, "epoch": 2372} {"train_loss": -11.052282333374023, "global_step": 398580, "epoch": 2372} {"train_loss": -11.290753364562988, "global_step": 398581, "epoch": 2372} {"train_loss": -10.869039535522461, "global_step": 398582, "epoch": 2372} {"train_loss": -11.734630584716797, "global_step": 398583, "epoch": 2372} {"train_loss": -10.710906028747559, "global_step": 398584, "epoch": 2372} {"train_loss": -12.001529693603516, "global_step": 398585, "epoch": 2372} {"train_loss": -10.914937973022461, "global_step": 398586, "epoch": 2372} {"train_loss": -11.632345199584961, "global_step": 398587, "epoch": 2372} {"train_loss": -11.79214859008789, "global_step": 398588, "epoch": 2372} {"train_loss": -10.912893295288086, "global_step": 398589, "epoch": 2372} {"train_loss": -11.956892013549805, "global_step": 398590, "epoch": 2372} {"train_loss": -10.825221061706543, "global_step": 398591, "epoch": 2372} {"train_loss": -11.719691276550293, "global_step": 398592, "epoch": 2372} {"train_loss": -11.444698333740234, "global_step": 398593, "epoch": 2372} {"train_loss": -11.60639762878418, "global_step": 398594, "epoch": 2372} {"train_loss": -12.193509101867676, "global_step": 398595, "epoch": 2372} {"train_loss": -11.442861557006836, "global_step": 398596, "epoch": 2372} {"train_loss": -11.905838012695312, "global_step": 398597, "epoch": 2372} {"train_loss": -11.56522274017334, "global_step": 398598, "epoch": 2372} {"train_loss": -11.354061126708984, "global_step": 398599, "epoch": 2372} {"train_loss": -12.249587059020996, "global_step": 398600, "epoch": 2372} {"train_loss": -11.28256607055664, "global_step": 398601, "epoch": 2372} {"train_loss": -12.268186569213867, "global_step": 398602, "epoch": 2372} {"train_loss": -11.38996696472168, "global_step": 398603, "epoch": 2372} {"train_loss": -11.853214263916016, "global_step": 398604, "epoch": 2372} {"train_loss": -12.241914749145508, "global_step": 398605, "epoch": 2372} {"train_loss": -11.731209754943848, "global_step": 398606, "epoch": 2372} {"train_loss": -12.054168701171875, "global_step": 398607, "epoch": 2372} {"train_loss": -11.488469123840332, "global_step": 398608, "epoch": 2372} {"train_loss": -11.93067741394043, "global_step": 398609, "epoch": 2372} {"train_loss": -11.502038955688477, "global_step": 398610, "epoch": 2372} {"train_loss": -12.296485900878906, "global_step": 398611, "epoch": 2372} {"train_loss": -12.116043090820312, "global_step": 398612, "epoch": 2372} {"train_loss": -12.240240097045898, "global_step": 398613, "epoch": 2372} {"train_loss": -12.142616271972656, "global_step": 398614, "epoch": 2372} {"train_loss": -12.153497695922852, "global_step": 398615, "epoch": 2372} {"train_loss": -12.101249694824219, "global_step": 398616, "epoch": 2372} {"train_loss": -12.229907989501953, "global_step": 398617, "epoch": 2372} {"train_loss": -12.200092315673828, "global_step": 398618, "epoch": 2372} {"train_loss": -12.350982666015625, "global_step": 398619, "epoch": 2372} {"train_loss": -11.839115142822266, "global_step": 398620, "epoch": 2372} {"train_loss": -12.010366439819336, "global_step": 398621, "epoch": 2372} {"train_loss": -12.25239372253418, "global_step": 398622, "epoch": 2372} {"train_loss": -11.721100807189941, "global_step": 398623, "epoch": 2372} {"train_loss": -12.326014518737793, "global_step": 398624, "epoch": 2372} {"train_loss": -11.918883323669434, "global_step": 398625, "epoch": 2372} {"train_loss": -12.0223970413208, "global_step": 398626, "epoch": 2372} {"train_loss": -12.189496994018555, "global_step": 398627, "epoch": 2372} {"train_loss": -12.204421997070312, "global_step": 398628, "epoch": 2372} {"train_loss": -12.099185943603516, "global_step": 398629, "epoch": 2372} {"train_loss": -12.302812576293945, "global_step": 398630, "epoch": 2372} {"train_loss": -12.343717575073242, "global_step": 398631, "epoch": 2372} {"train_loss": -12.01885986328125, "global_step": 398632, "epoch": 2372} {"train_loss": -12.216632843017578, "global_step": 398633, "epoch": 2372} {"train_loss": -12.208691596984863, "global_step": 398634, "epoch": 2372} {"train_loss": -12.298534393310547, "global_step": 398635, "epoch": 2372} {"train_loss": -12.461953163146973, "global_step": 398636, "epoch": 2372} {"train_loss": -12.289791107177734, "global_step": 398637, "epoch": 2372} {"train_loss": -11.660100936889648, "global_step": 398638, "epoch": 2372} {"train_loss": -12.007452011108398, "global_step": 398639, "epoch": 2372} {"train_loss": -12.08128833770752, "global_step": 398640, "epoch": 2372} {"train_loss": -12.255867004394531, "global_step": 398641, "epoch": 2372} {"train_loss": -11.91975212097168, "global_step": 398642, "epoch": 2372} {"train_loss": -11.705392837524414, "global_step": 398643, "epoch": 2372} {"train_loss": -11.502033233642578, "global_step": 398644, "epoch": 2372} {"train_loss": -11.191795349121094, "global_step": 398645, "epoch": 2372} {"train_loss": -11.694262504577637, "global_step": 398646, "epoch": 2372} {"train_loss": -11.515844345092773, "global_step": 398647, "epoch": 2372} {"train_loss": -11.738036155700684, "global_step": 398648, "epoch": 2372} {"train_loss": -11.624916076660156, "global_step": 398649, "epoch": 2372} {"train_loss": -11.59835433959961, "global_step": 398650, "epoch": 2372} {"train_loss": -11.940655708312988, "global_step": 398651, "epoch": 2372} {"train_loss": -11.894702911376953, "global_step": 398652, "epoch": 2372} {"train_loss": -11.987783432006836, "global_step": 398653, "epoch": 2372} {"train_loss": -11.952377319335938, "global_step": 398654, "epoch": 2372} {"train_loss": -12.184429168701172, "global_step": 398655, "epoch": 2372} {"train_loss": -11.351978302001953, "global_step": 398656, "epoch": 2372} {"train_loss": -12.04963493347168, "global_step": 398657, "epoch": 2372} {"train_loss": -11.600275039672852, "global_step": 398658, "epoch": 2372} {"train_loss": -11.606411933898926, "global_step": 398659, "epoch": 2372} {"train_loss": -12.35556411743164, "global_step": 398660, "epoch": 2372} {"train_loss": -11.364103317260742, "global_step": 398661, "epoch": 2372} {"train_loss": -12.101452827453613, "global_step": 398662, "epoch": 2372} {"train_loss": -11.95102876708621, "global_step": 398663, "epoch": 2372, "val_loss": 301529.53125} {"train_loss": -11.957886695861816, "global_step": 398664, "epoch": 2373} {"train_loss": -12.215071678161621, "global_step": 398665, "epoch": 2373} {"train_loss": -12.293586730957031, "global_step": 398666, "epoch": 2373} {"train_loss": -12.06689453125, "global_step": 398667, "epoch": 2373} {"train_loss": -12.105743408203125, "global_step": 398668, "epoch": 2373} {"train_loss": -12.182815551757812, "global_step": 398669, "epoch": 2373} {"train_loss": -12.190120697021484, "global_step": 398670, "epoch": 2373} {"train_loss": -11.809540748596191, "global_step": 398671, "epoch": 2373} {"train_loss": -12.335298538208008, "global_step": 398672, "epoch": 2373} {"train_loss": -12.05080795288086, "global_step": 398673, "epoch": 2373} {"train_loss": -11.836795806884766, "global_step": 398674, "epoch": 2373} {"train_loss": -12.09322738647461, "global_step": 398675, "epoch": 2373} {"train_loss": -12.153395652770996, "global_step": 398676, "epoch": 2373} {"train_loss": -12.189458847045898, "global_step": 398677, "epoch": 2373} {"train_loss": -12.209522247314453, "global_step": 398678, "epoch": 2373} {"train_loss": -12.356616973876953, "global_step": 398679, "epoch": 2373} {"train_loss": -12.01419448852539, "global_step": 398680, "epoch": 2373} {"train_loss": -12.380763053894043, "global_step": 398681, "epoch": 2373} {"train_loss": -12.20748233795166, "global_step": 398682, "epoch": 2373} {"train_loss": -12.529389381408691, "global_step": 398683, "epoch": 2373} {"train_loss": -12.621271133422852, "global_step": 398684, "epoch": 2373} {"train_loss": -12.457348823547363, "global_step": 398685, "epoch": 2373} {"train_loss": -12.473869323730469, "global_step": 398686, "epoch": 2373} {"train_loss": -12.444764137268066, "global_step": 398687, "epoch": 2373} {"train_loss": -12.274543762207031, "global_step": 398688, "epoch": 2373} {"train_loss": -12.664182662963867, "global_step": 398689, "epoch": 2373} {"train_loss": -12.631671905517578, "global_step": 398690, "epoch": 2373} {"train_loss": -12.59024715423584, "global_step": 398691, "epoch": 2373} {"train_loss": -12.536052703857422, "global_step": 398692, "epoch": 2373} {"train_loss": -12.477063179016113, "global_step": 398693, "epoch": 2373} {"train_loss": -12.460338592529297, "global_step": 398694, "epoch": 2373} {"train_loss": -12.73295783996582, "global_step": 398695, "epoch": 2373} {"train_loss": -12.442752838134766, "global_step": 398696, "epoch": 2373} {"train_loss": -12.531360626220703, "global_step": 398697, "epoch": 2373} {"train_loss": -12.508111953735352, "global_step": 398698, "epoch": 2373} {"train_loss": -12.217609405517578, "global_step": 398699, "epoch": 2373} {"train_loss": -12.511301040649414, "global_step": 398700, "epoch": 2373} {"train_loss": -12.401226997375488, "global_step": 398701, "epoch": 2373} {"train_loss": -12.558366775512695, "global_step": 398702, "epoch": 2373} {"train_loss": -12.24070930480957, "global_step": 398703, "epoch": 2373} {"train_loss": -12.550773620605469, "global_step": 398704, "epoch": 2373} {"train_loss": -12.488798141479492, "global_step": 398705, "epoch": 2373} {"train_loss": -12.629312515258789, "global_step": 398706, "epoch": 2373} {"train_loss": -12.430907249450684, "global_step": 398707, "epoch": 2373} {"train_loss": -12.684000015258789, "global_step": 398708, "epoch": 2373} {"train_loss": -12.583589553833008, "global_step": 398709, "epoch": 2373} {"train_loss": -12.567426681518555, "global_step": 398710, "epoch": 2373} {"train_loss": -12.709022521972656, "global_step": 398711, "epoch": 2373} {"train_loss": -12.652023315429688, "global_step": 398712, "epoch": 2373} {"train_loss": -12.43274211883545, "global_step": 398713, "epoch": 2373} {"train_loss": -12.618951797485352, "global_step": 398714, "epoch": 2373} {"train_loss": -12.62646484375, "global_step": 398715, "epoch": 2373} {"train_loss": -12.537956237792969, "global_step": 398716, "epoch": 2373} {"train_loss": -12.776989936828613, "global_step": 398717, "epoch": 2373} {"train_loss": -12.644347190856934, "global_step": 398718, "epoch": 2373} {"train_loss": -12.674101829528809, "global_step": 398719, "epoch": 2373} {"train_loss": -12.15561580657959, "global_step": 398720, "epoch": 2373} {"train_loss": -12.464244842529297, "global_step": 398721, "epoch": 2373} {"train_loss": -12.45945930480957, "global_step": 398722, "epoch": 2373} {"train_loss": -12.961944580078125, "global_step": 398723, "epoch": 2373} {"train_loss": -12.312626838684082, "global_step": 398724, "epoch": 2373} {"train_loss": -11.764888763427734, "global_step": 398725, "epoch": 2373} {"train_loss": -11.79360580444336, "global_step": 398726, "epoch": 2373} {"train_loss": -10.545150756835938, "global_step": 398727, "epoch": 2373} {"train_loss": -10.926192283630371, "global_step": 398728, "epoch": 2373} {"train_loss": -12.12257194519043, "global_step": 398729, "epoch": 2373} {"train_loss": -11.400436401367188, "global_step": 398730, "epoch": 2373} {"train_loss": -12.359100341796875, "global_step": 398731, "epoch": 2373} {"train_loss": -11.38310432434082, "global_step": 398732, "epoch": 2373} {"train_loss": -11.74668025970459, "global_step": 398733, "epoch": 2373} {"train_loss": -12.301856994628906, "global_step": 398734, "epoch": 2373} {"train_loss": -11.501985549926758, "global_step": 398735, "epoch": 2373} {"train_loss": -11.603303909301758, "global_step": 398736, "epoch": 2373} {"train_loss": -12.143213272094727, "global_step": 398737, "epoch": 2373} {"train_loss": -10.941566467285156, "global_step": 398738, "epoch": 2373} {"train_loss": -11.994912147521973, "global_step": 398739, "epoch": 2373} {"train_loss": -12.088228225708008, "global_step": 398740, "epoch": 2373} {"train_loss": -11.040179252624512, "global_step": 398741, "epoch": 2373} {"train_loss": -12.244013786315918, "global_step": 398742, "epoch": 2373} {"train_loss": -11.784036636352539, "global_step": 398743, "epoch": 2373} {"train_loss": -11.554027557373047, "global_step": 398744, "epoch": 2373} {"train_loss": -11.754250526428223, "global_step": 398745, "epoch": 2373} {"train_loss": -11.953707695007324, "global_step": 398746, "epoch": 2373} {"train_loss": -11.562601089477539, "global_step": 398747, "epoch": 2373} {"train_loss": -12.062568664550781, "global_step": 398748, "epoch": 2373} {"train_loss": -11.964059829711914, "global_step": 398749, "epoch": 2373} {"train_loss": -11.84991455078125, "global_step": 398750, "epoch": 2373} {"train_loss": -12.534645080566406, "global_step": 398751, "epoch": 2373} {"train_loss": -11.717108726501465, "global_step": 398752, "epoch": 2373} {"train_loss": -12.312971115112305, "global_step": 398753, "epoch": 2373} {"train_loss": -11.962182998657227, "global_step": 398754, "epoch": 2373} {"train_loss": -12.294533729553223, "global_step": 398755, "epoch": 2373} {"train_loss": -12.08693790435791, "global_step": 398756, "epoch": 2373} {"train_loss": -12.3428316116333, "global_step": 398757, "epoch": 2373} {"train_loss": -12.296609878540039, "global_step": 398758, "epoch": 2373} {"train_loss": -12.220558166503906, "global_step": 398759, "epoch": 2373} {"train_loss": -12.578760147094727, "global_step": 398760, "epoch": 2373} {"train_loss": -12.05825138092041, "global_step": 398761, "epoch": 2373} {"train_loss": -12.437051773071289, "global_step": 398762, "epoch": 2373} {"train_loss": -12.406503677368164, "global_step": 398763, "epoch": 2373} {"train_loss": -12.327421188354492, "global_step": 398764, "epoch": 2373} {"train_loss": -12.452880859375, "global_step": 398765, "epoch": 2373} {"train_loss": -12.48347282409668, "global_step": 398766, "epoch": 2373} {"train_loss": -12.385196685791016, "global_step": 398767, "epoch": 2373} {"train_loss": -11.739093780517578, "global_step": 398768, "epoch": 2373} {"train_loss": -12.052584648132324, "global_step": 398769, "epoch": 2373} {"train_loss": -12.39002513885498, "global_step": 398770, "epoch": 2373} {"train_loss": -12.301145553588867, "global_step": 398771, "epoch": 2373} {"train_loss": -12.215558052062988, "global_step": 398772, "epoch": 2373} {"train_loss": -12.024253845214844, "global_step": 398773, "epoch": 2373} {"train_loss": -12.28268051147461, "global_step": 398774, "epoch": 2373} {"train_loss": -12.451799392700195, "global_step": 398775, "epoch": 2373} {"train_loss": -12.015958786010742, "global_step": 398776, "epoch": 2373} {"train_loss": -11.575684547424316, "global_step": 398777, "epoch": 2373} {"train_loss": -11.940962791442871, "global_step": 398778, "epoch": 2373} {"train_loss": -12.378084182739258, "global_step": 398779, "epoch": 2373} {"train_loss": -12.16859245300293, "global_step": 398780, "epoch": 2373} {"train_loss": -12.529205322265625, "global_step": 398781, "epoch": 2373} {"train_loss": -11.833517074584961, "global_step": 398782, "epoch": 2373} {"train_loss": -11.730072021484375, "global_step": 398783, "epoch": 2373} {"train_loss": -11.97899055480957, "global_step": 398784, "epoch": 2373} {"train_loss": -12.033977508544922, "global_step": 398785, "epoch": 2373} {"train_loss": -12.054584503173828, "global_step": 398786, "epoch": 2373} {"train_loss": -11.665460586547852, "global_step": 398787, "epoch": 2373} {"train_loss": -11.851417541503906, "global_step": 398788, "epoch": 2373} {"train_loss": -11.750933647155762, "global_step": 398789, "epoch": 2373} {"train_loss": -11.985357284545898, "global_step": 398790, "epoch": 2373} {"train_loss": -12.369546890258789, "global_step": 398791, "epoch": 2373} {"train_loss": -11.625076293945312, "global_step": 398792, "epoch": 2373} {"train_loss": -11.501081466674805, "global_step": 398793, "epoch": 2373} {"train_loss": -12.2517728805542, "global_step": 398794, "epoch": 2373} {"train_loss": -10.863046646118164, "global_step": 398795, "epoch": 2373} {"train_loss": -11.191804885864258, "global_step": 398796, "epoch": 2373} {"train_loss": -11.890686988830566, "global_step": 398797, "epoch": 2373} {"train_loss": -11.544920921325684, "global_step": 398798, "epoch": 2373} {"train_loss": -11.255239486694336, "global_step": 398799, "epoch": 2373} {"train_loss": -11.062909126281738, "global_step": 398800, "epoch": 2373} {"train_loss": -12.254898071289062, "global_step": 398801, "epoch": 2373} {"train_loss": -11.718002319335938, "global_step": 398802, "epoch": 2373} {"train_loss": -12.189245223999023, "global_step": 398803, "epoch": 2373} {"train_loss": -11.815284729003906, "global_step": 398804, "epoch": 2373} {"train_loss": -12.482261657714844, "global_step": 398805, "epoch": 2373} {"train_loss": -11.843001365661621, "global_step": 398806, "epoch": 2373} {"train_loss": -11.896469116210938, "global_step": 398807, "epoch": 2373} {"train_loss": -12.470426559448242, "global_step": 398808, "epoch": 2373} {"train_loss": -11.897905349731445, "global_step": 398809, "epoch": 2373} {"train_loss": -12.11186408996582, "global_step": 398810, "epoch": 2373} {"train_loss": -12.131889343261719, "global_step": 398811, "epoch": 2373} {"train_loss": -12.10771369934082, "global_step": 398812, "epoch": 2373} {"train_loss": -12.156770706176758, "global_step": 398813, "epoch": 2373} {"train_loss": -12.123021125793457, "global_step": 398814, "epoch": 2373} {"train_loss": -11.950998306274414, "global_step": 398815, "epoch": 2373} {"train_loss": -12.305268287658691, "global_step": 398816, "epoch": 2373} {"train_loss": -12.138313293457031, "global_step": 398817, "epoch": 2373} {"train_loss": -12.104171752929688, "global_step": 398818, "epoch": 2373} {"train_loss": -12.429794311523438, "global_step": 398819, "epoch": 2373} {"train_loss": -11.475061416625977, "global_step": 398820, "epoch": 2373} {"train_loss": -12.385883331298828, "global_step": 398821, "epoch": 2373} {"train_loss": -11.820815086364746, "global_step": 398822, "epoch": 2373} {"train_loss": -11.866621971130371, "global_step": 398823, "epoch": 2373} {"train_loss": -12.159688949584961, "global_step": 398824, "epoch": 2373} {"train_loss": -12.491838455200195, "global_step": 398825, "epoch": 2373} {"train_loss": -11.591585159301758, "global_step": 398826, "epoch": 2373} {"train_loss": -12.177849769592285, "global_step": 398827, "epoch": 2373} {"train_loss": -11.470602989196777, "global_step": 398828, "epoch": 2373} {"train_loss": -12.332334518432617, "global_step": 398829, "epoch": 2373} {"train_loss": -11.977495193481445, "global_step": 398830, "epoch": 2373} {"train_loss": -12.124627277964638, "global_step": 398831, "epoch": 2373, "val_loss": 303677.40625} {"train_loss": -12.354869842529297, "global_step": 398832, "epoch": 2374} {"train_loss": -11.823856353759766, "global_step": 398833, "epoch": 2374} {"train_loss": -12.530104637145996, "global_step": 398834, "epoch": 2374} {"train_loss": -11.920092582702637, "global_step": 398835, "epoch": 2374} {"train_loss": -12.53994083404541, "global_step": 398836, "epoch": 2374} {"train_loss": -12.257387161254883, "global_step": 398837, "epoch": 2374} {"train_loss": -12.401998519897461, "global_step": 398838, "epoch": 2374} {"train_loss": -12.16110610961914, "global_step": 398839, "epoch": 2374} {"train_loss": -12.165769577026367, "global_step": 398840, "epoch": 2374} {"train_loss": -12.10969066619873, "global_step": 398841, "epoch": 2374} {"train_loss": -12.067747116088867, "global_step": 398842, "epoch": 2374} {"train_loss": -12.004051208496094, "global_step": 398843, "epoch": 2374} {"train_loss": -12.496952056884766, "global_step": 398844, "epoch": 2374} {"train_loss": -12.20883560180664, "global_step": 398845, "epoch": 2374} {"train_loss": -12.015003204345703, "global_step": 398846, "epoch": 2374} {"train_loss": -12.45065689086914, "global_step": 398847, "epoch": 2374} {"train_loss": -12.416324615478516, "global_step": 398848, "epoch": 2374} {"train_loss": -12.58724594116211, "global_step": 398849, "epoch": 2374} {"train_loss": -12.251230239868164, "global_step": 398850, "epoch": 2374} {"train_loss": -12.039121627807617, "global_step": 398851, "epoch": 2374} {"train_loss": -11.934100151062012, "global_step": 398852, "epoch": 2374} {"train_loss": -12.305074691772461, "global_step": 398853, "epoch": 2374} {"train_loss": -12.381458282470703, "global_step": 398854, "epoch": 2374} {"train_loss": -12.273509979248047, "global_step": 398855, "epoch": 2374} {"train_loss": -11.752323150634766, "global_step": 398856, "epoch": 2374} {"train_loss": -12.490397453308105, "global_step": 398857, "epoch": 2374} {"train_loss": -12.398683547973633, "global_step": 398858, "epoch": 2374} {"train_loss": -12.484224319458008, "global_step": 398859, "epoch": 2374} {"train_loss": -12.423604011535645, "global_step": 398860, "epoch": 2374} {"train_loss": -12.500051498413086, "global_step": 398861, "epoch": 2374} {"train_loss": -12.491010665893555, "global_step": 398862, "epoch": 2374} {"train_loss": -12.66873550415039, "global_step": 398863, "epoch": 2374} {"train_loss": -12.469230651855469, "global_step": 398864, "epoch": 2374} {"train_loss": -12.381301879882812, "global_step": 398865, "epoch": 2374} {"train_loss": -12.742837905883789, "global_step": 398866, "epoch": 2374} {"train_loss": -12.779223442077637, "global_step": 398867, "epoch": 2374} {"train_loss": -12.254944801330566, "global_step": 398868, "epoch": 2374} {"train_loss": -12.58461856842041, "global_step": 398869, "epoch": 2374} {"train_loss": -12.513409614562988, "global_step": 398870, "epoch": 2374} {"train_loss": -12.225412368774414, "global_step": 398871, "epoch": 2374} {"train_loss": -12.332586288452148, "global_step": 398872, "epoch": 2374} {"train_loss": -12.719632148742676, "global_step": 398873, "epoch": 2374} {"train_loss": -12.169867515563965, "global_step": 398874, "epoch": 2374} {"train_loss": -11.99927043914795, "global_step": 398875, "epoch": 2374} {"train_loss": -12.297935485839844, "global_step": 398876, "epoch": 2374} {"train_loss": -12.520172119140625, "global_step": 398877, "epoch": 2374} {"train_loss": -11.834867477416992, "global_step": 398878, "epoch": 2374} {"train_loss": -11.616573333740234, "global_step": 398879, "epoch": 2374} {"train_loss": -11.96966552734375, "global_step": 398880, "epoch": 2374} {"train_loss": -11.079075813293457, "global_step": 398881, "epoch": 2374} {"train_loss": -10.806404113769531, "global_step": 398882, "epoch": 2374} {"train_loss": -11.557428359985352, "global_step": 398883, "epoch": 2374} {"train_loss": -11.536199569702148, "global_step": 398884, "epoch": 2374} {"train_loss": -11.37255859375, "global_step": 398885, "epoch": 2374} {"train_loss": -11.653197288513184, "global_step": 398886, "epoch": 2374} {"train_loss": -11.993659973144531, "global_step": 398887, "epoch": 2374} {"train_loss": -11.441287994384766, "global_step": 398888, "epoch": 2374} {"train_loss": -11.736852645874023, "global_step": 398889, "epoch": 2374} {"train_loss": -11.61609172821045, "global_step": 398890, "epoch": 2374} {"train_loss": -12.194962501525879, "global_step": 398891, "epoch": 2374} {"train_loss": -11.374618530273438, "global_step": 398892, "epoch": 2374} {"train_loss": -11.2337007522583, "global_step": 398893, "epoch": 2374} {"train_loss": -11.407133102416992, "global_step": 398894, "epoch": 2374} {"train_loss": -12.174062728881836, "global_step": 398895, "epoch": 2374} {"train_loss": -11.55904769897461, "global_step": 398896, "epoch": 2374} {"train_loss": -12.224342346191406, "global_step": 398897, "epoch": 2374} {"train_loss": -11.792644500732422, "global_step": 398898, "epoch": 2374} {"train_loss": -11.883264541625977, "global_step": 398899, "epoch": 2374} {"train_loss": -11.192278861999512, "global_step": 398900, "epoch": 2374} {"train_loss": -12.202832221984863, "global_step": 398901, "epoch": 2374} {"train_loss": -10.796329498291016, "global_step": 398902, "epoch": 2374} {"train_loss": -11.7196044921875, "global_step": 398903, "epoch": 2374} {"train_loss": -10.966991424560547, "global_step": 398904, "epoch": 2374} {"train_loss": -11.159385681152344, "global_step": 398905, "epoch": 2374} {"train_loss": -11.835027694702148, "global_step": 398906, "epoch": 2374} {"train_loss": -10.439537048339844, "global_step": 398907, "epoch": 2374} {"train_loss": -11.211230278015137, "global_step": 398908, "epoch": 2374} {"train_loss": -11.260470390319824, "global_step": 398909, "epoch": 2374} {"train_loss": -10.462299346923828, "global_step": 398910, "epoch": 2374} {"train_loss": -11.145893096923828, "global_step": 398911, "epoch": 2374} {"train_loss": -10.13853931427002, "global_step": 398912, "epoch": 2374} {"train_loss": -11.171443939208984, "global_step": 398913, "epoch": 2374} {"train_loss": -10.607772827148438, "global_step": 398914, "epoch": 2374} {"train_loss": -10.537696838378906, "global_step": 398915, "epoch": 2374} {"train_loss": -11.537419319152832, "global_step": 398916, "epoch": 2374} {"train_loss": -10.627021789550781, "global_step": 398917, "epoch": 2374} {"train_loss": -10.808547973632812, "global_step": 398918, "epoch": 2374} {"train_loss": -11.687013626098633, "global_step": 398919, "epoch": 2374} {"train_loss": -11.547018051147461, "global_step": 398920, "epoch": 2374} {"train_loss": -11.778104782104492, "global_step": 398921, "epoch": 2374} {"train_loss": -11.675901412963867, "global_step": 398922, "epoch": 2374} {"train_loss": -11.385334968566895, "global_step": 398923, "epoch": 2374} {"train_loss": -11.8406982421875, "global_step": 398924, "epoch": 2374} {"train_loss": -11.659122467041016, "global_step": 398925, "epoch": 2374} {"train_loss": -12.084428787231445, "global_step": 398926, "epoch": 2374} {"train_loss": -11.844545364379883, "global_step": 398927, "epoch": 2374} {"train_loss": -11.678899765014648, "global_step": 398928, "epoch": 2374} {"train_loss": -12.237822532653809, "global_step": 398929, "epoch": 2374} {"train_loss": -11.921757698059082, "global_step": 398930, "epoch": 2374} {"train_loss": -12.118476867675781, "global_step": 398931, "epoch": 2374} {"train_loss": -11.631976127624512, "global_step": 398932, "epoch": 2374} {"train_loss": -11.626964569091797, "global_step": 398933, "epoch": 2374} {"train_loss": -11.738205909729004, "global_step": 398934, "epoch": 2374} {"train_loss": -11.631576538085938, "global_step": 398935, "epoch": 2374} {"train_loss": -12.151091575622559, "global_step": 398936, "epoch": 2374} {"train_loss": -11.566829681396484, "global_step": 398937, "epoch": 2374} {"train_loss": -12.187597274780273, "global_step": 398938, "epoch": 2374} {"train_loss": -11.78931999206543, "global_step": 398939, "epoch": 2374} {"train_loss": -12.199140548706055, "global_step": 398940, "epoch": 2374} {"train_loss": -12.170628547668457, "global_step": 398941, "epoch": 2374} {"train_loss": -12.134517669677734, "global_step": 398942, "epoch": 2374} {"train_loss": -12.545198440551758, "global_step": 398943, "epoch": 2374} {"train_loss": -12.230531692504883, "global_step": 398944, "epoch": 2374} {"train_loss": -12.218393325805664, "global_step": 398945, "epoch": 2374} {"train_loss": -12.275056838989258, "global_step": 398946, "epoch": 2374} {"train_loss": -12.256158828735352, "global_step": 398947, "epoch": 2374} {"train_loss": -12.128849983215332, "global_step": 398948, "epoch": 2374} {"train_loss": -12.59646224975586, "global_step": 398949, "epoch": 2374} {"train_loss": -12.110237121582031, "global_step": 398950, "epoch": 2374} {"train_loss": -12.57594108581543, "global_step": 398951, "epoch": 2374} {"train_loss": -12.284521102905273, "global_step": 398952, "epoch": 2374} {"train_loss": -12.228887557983398, "global_step": 398953, "epoch": 2374} {"train_loss": -12.497459411621094, "global_step": 398954, "epoch": 2374} {"train_loss": -12.342169761657715, "global_step": 398955, "epoch": 2374} {"train_loss": -12.621252059936523, "global_step": 398956, "epoch": 2374} {"train_loss": -12.439075469970703, "global_step": 398957, "epoch": 2374} {"train_loss": -12.616364479064941, "global_step": 398958, "epoch": 2374} {"train_loss": -12.666362762451172, "global_step": 398959, "epoch": 2374} {"train_loss": -12.568796157836914, "global_step": 398960, "epoch": 2374} {"train_loss": -12.520007133483887, "global_step": 398961, "epoch": 2374} {"train_loss": -12.415060043334961, "global_step": 398962, "epoch": 2374} {"train_loss": -12.484278678894043, "global_step": 398963, "epoch": 2374} {"train_loss": -12.221356391906738, "global_step": 398964, "epoch": 2374} {"train_loss": -12.491235733032227, "global_step": 398965, "epoch": 2374} {"train_loss": -12.55439281463623, "global_step": 398966, "epoch": 2374} {"train_loss": -12.334980010986328, "global_step": 398967, "epoch": 2374} {"train_loss": -12.161787033081055, "global_step": 398968, "epoch": 2374} {"train_loss": -12.274595260620117, "global_step": 398969, "epoch": 2374} {"train_loss": -12.496817588806152, "global_step": 398970, "epoch": 2374} {"train_loss": -12.233404159545898, "global_step": 398971, "epoch": 2374} {"train_loss": -12.76171588897705, "global_step": 398972, "epoch": 2374} {"train_loss": -12.352033615112305, "global_step": 398973, "epoch": 2374} {"train_loss": -12.387426376342773, "global_step": 398974, "epoch": 2374} {"train_loss": -12.260406494140625, "global_step": 398975, "epoch": 2374} {"train_loss": -12.605748176574707, "global_step": 398976, "epoch": 2374} {"train_loss": -12.38199234008789, "global_step": 398977, "epoch": 2374} {"train_loss": -12.39152717590332, "global_step": 398978, "epoch": 2374} {"train_loss": -12.540803909301758, "global_step": 398979, "epoch": 2374} {"train_loss": -12.4471435546875, "global_step": 398980, "epoch": 2374} {"train_loss": -12.229286193847656, "global_step": 398981, "epoch": 2374} {"train_loss": -12.216263771057129, "global_step": 398982, "epoch": 2374} {"train_loss": -12.276748657226562, "global_step": 398983, "epoch": 2374} {"train_loss": -11.986852645874023, "global_step": 398984, "epoch": 2374} {"train_loss": -11.979957580566406, "global_step": 398985, "epoch": 2374} {"train_loss": -12.399892807006836, "global_step": 398986, "epoch": 2374} {"train_loss": -11.844461441040039, "global_step": 398987, "epoch": 2374} {"train_loss": -12.242260932922363, "global_step": 398988, "epoch": 2374} {"train_loss": -12.055940628051758, "global_step": 398989, "epoch": 2374} {"train_loss": -12.104007720947266, "global_step": 398990, "epoch": 2374} {"train_loss": -12.433279037475586, "global_step": 398991, "epoch": 2374} {"train_loss": -12.356199264526367, "global_step": 398992, "epoch": 2374} {"train_loss": -12.363910675048828, "global_step": 398993, "epoch": 2374} {"train_loss": -12.483749389648438, "global_step": 398994, "epoch": 2374} {"train_loss": -12.555364608764648, "global_step": 398995, "epoch": 2374} {"train_loss": -12.4241361618042, "global_step": 398996, "epoch": 2374} {"train_loss": -12.26787281036377, "global_step": 398997, "epoch": 2374} {"train_loss": -12.308492660522461, "global_step": 398998, "epoch": 2374} {"train_loss": -12.035180602754865, "global_step": 398999, "epoch": 2374, "val_loss": 305219.15625} {"train_loss": -12.578722953796387, "global_step": 399000, "epoch": 2375} {"train_loss": -12.589302062988281, "global_step": 399001, "epoch": 2375} {"train_loss": -11.69110107421875, "global_step": 399002, "epoch": 2375} {"train_loss": -12.223955154418945, "global_step": 399003, "epoch": 2375} {"train_loss": -12.315862655639648, "global_step": 399004, "epoch": 2375} {"train_loss": -12.354243278503418, "global_step": 399005, "epoch": 2375} {"train_loss": -11.939913749694824, "global_step": 399006, "epoch": 2375} {"train_loss": -11.913829803466797, "global_step": 399007, "epoch": 2375} {"train_loss": -12.360849380493164, "global_step": 399008, "epoch": 2375} {"train_loss": -12.62955093383789, "global_step": 399009, "epoch": 2375} {"train_loss": -12.340620040893555, "global_step": 399010, "epoch": 2375} {"train_loss": -11.913236618041992, "global_step": 399011, "epoch": 2375} {"train_loss": -12.712944984436035, "global_step": 399012, "epoch": 2375} {"train_loss": -12.247495651245117, "global_step": 399013, "epoch": 2375} {"train_loss": -11.681026458740234, "global_step": 399014, "epoch": 2375} {"train_loss": -12.220256805419922, "global_step": 399015, "epoch": 2375} {"train_loss": -12.288541793823242, "global_step": 399016, "epoch": 2375} {"train_loss": -11.686965942382812, "global_step": 399017, "epoch": 2375} {"train_loss": -12.337449073791504, "global_step": 399018, "epoch": 2375} {"train_loss": -12.10934066772461, "global_step": 399019, "epoch": 2375} {"train_loss": -11.89887809753418, "global_step": 399020, "epoch": 2375} {"train_loss": -12.39218521118164, "global_step": 399021, "epoch": 2375} {"train_loss": -10.809467315673828, "global_step": 399022, "epoch": 2375} {"train_loss": -11.725067138671875, "global_step": 399023, "epoch": 2375} {"train_loss": -11.72875690460205, "global_step": 399024, "epoch": 2375} {"train_loss": -10.545123100280762, "global_step": 399025, "epoch": 2375} {"train_loss": -11.046854019165039, "global_step": 399026, "epoch": 2375} {"train_loss": -10.189619064331055, "global_step": 399027, "epoch": 2375} {"train_loss": -10.232650756835938, "global_step": 399028, "epoch": 2375} {"train_loss": -8.756172180175781, "global_step": 399029, "epoch": 2375} {"train_loss": -10.832416534423828, "global_step": 399030, "epoch": 2375} {"train_loss": -10.121725082397461, "global_step": 399031, "epoch": 2375} {"train_loss": -11.149030685424805, "global_step": 399032, "epoch": 2375} {"train_loss": -9.332061767578125, "global_step": 399033, "epoch": 2375} {"train_loss": -10.730561256408691, "global_step": 399034, "epoch": 2375} {"train_loss": -9.789190292358398, "global_step": 399035, "epoch": 2375} {"train_loss": -9.64846420288086, "global_step": 399036, "epoch": 2375} {"train_loss": -9.526554107666016, "global_step": 399037, "epoch": 2375} {"train_loss": -10.216793060302734, "global_step": 399038, "epoch": 2375} {"train_loss": -9.013580322265625, "global_step": 399039, "epoch": 2375} {"train_loss": -11.140517234802246, "global_step": 399040, "epoch": 2375} {"train_loss": -10.334989547729492, "global_step": 399041, "epoch": 2375} {"train_loss": -10.028895378112793, "global_step": 399042, "epoch": 2375} {"train_loss": -10.3431396484375, "global_step": 399043, "epoch": 2375} {"train_loss": -10.88785457611084, "global_step": 399044, "epoch": 2375} {"train_loss": -10.319665908813477, "global_step": 399045, "epoch": 2375} {"train_loss": -10.113197326660156, "global_step": 399046, "epoch": 2375} {"train_loss": -12.106090545654297, "global_step": 399047, "epoch": 2375} {"train_loss": -10.497300148010254, "global_step": 399048, "epoch": 2375} {"train_loss": -11.330398559570312, "global_step": 399049, "epoch": 2375} {"train_loss": -11.655266761779785, "global_step": 399050, "epoch": 2375} {"train_loss": -11.333930969238281, "global_step": 399051, "epoch": 2375} {"train_loss": -11.693997383117676, "global_step": 399052, "epoch": 2375} {"train_loss": -11.759395599365234, "global_step": 399053, "epoch": 2375} {"train_loss": -11.111647605895996, "global_step": 399054, "epoch": 2375} {"train_loss": -12.166830062866211, "global_step": 399055, "epoch": 2375} {"train_loss": -11.696413040161133, "global_step": 399056, "epoch": 2375} {"train_loss": -11.821249008178711, "global_step": 399057, "epoch": 2375} {"train_loss": -12.033361434936523, "global_step": 399058, "epoch": 2375} {"train_loss": -11.47938346862793, "global_step": 399059, "epoch": 2375} {"train_loss": -11.977020263671875, "global_step": 399060, "epoch": 2375} {"train_loss": -11.84278678894043, "global_step": 399061, "epoch": 2375} {"train_loss": -11.899933815002441, "global_step": 399062, "epoch": 2375} {"train_loss": -11.558042526245117, "global_step": 399063, "epoch": 2375} {"train_loss": -12.0548734664917, "global_step": 399064, "epoch": 2375} {"train_loss": -11.798763275146484, "global_step": 399065, "epoch": 2375} {"train_loss": -11.87814998626709, "global_step": 399066, "epoch": 2375} {"train_loss": -12.013620376586914, "global_step": 399067, "epoch": 2375} {"train_loss": -11.820476531982422, "global_step": 399068, "epoch": 2375} {"train_loss": -11.880487442016602, "global_step": 399069, "epoch": 2375} {"train_loss": -12.307040214538574, "global_step": 399070, "epoch": 2375} {"train_loss": -11.937261581420898, "global_step": 399071, "epoch": 2375} {"train_loss": -12.212669372558594, "global_step": 399072, "epoch": 2375} {"train_loss": -12.239969253540039, "global_step": 399073, "epoch": 2375} {"train_loss": -12.175158500671387, "global_step": 399074, "epoch": 2375} {"train_loss": -12.118646621704102, "global_step": 399075, "epoch": 2375} {"train_loss": -11.966445922851562, "global_step": 399076, "epoch": 2375} {"train_loss": -12.100835800170898, "global_step": 399077, "epoch": 2375} {"train_loss": -11.955890655517578, "global_step": 399078, "epoch": 2375} {"train_loss": -11.547225952148438, "global_step": 399079, "epoch": 2375} {"train_loss": -12.301840782165527, "global_step": 399080, "epoch": 2375} {"train_loss": -11.869807243347168, "global_step": 399081, "epoch": 2375} {"train_loss": -12.153022766113281, "global_step": 399082, "epoch": 2375} {"train_loss": -12.134138107299805, "global_step": 399083, "epoch": 2375} {"train_loss": -12.07214641571045, "global_step": 399084, "epoch": 2375} {"train_loss": -12.293794631958008, "global_step": 399085, "epoch": 2375} {"train_loss": -12.40460205078125, "global_step": 399086, "epoch": 2375} {"train_loss": -12.31944751739502, "global_step": 399087, "epoch": 2375} {"train_loss": -12.449831008911133, "global_step": 399088, "epoch": 2375} {"train_loss": -12.067546844482422, "global_step": 399089, "epoch": 2375} {"train_loss": -12.55104923248291, "global_step": 399090, "epoch": 2375} {"train_loss": -12.34788703918457, "global_step": 399091, "epoch": 2375} {"train_loss": -12.256999015808105, "global_step": 399092, "epoch": 2375} {"train_loss": -12.486091613769531, "global_step": 399093, "epoch": 2375} {"train_loss": -12.604164123535156, "global_step": 399094, "epoch": 2375} {"train_loss": -12.59663200378418, "global_step": 399095, "epoch": 2375} {"train_loss": -12.574481010437012, "global_step": 399096, "epoch": 2375} {"train_loss": -12.50074577331543, "global_step": 399097, "epoch": 2375} {"train_loss": -12.340435981750488, "global_step": 399098, "epoch": 2375} {"train_loss": -12.515970230102539, "global_step": 399099, "epoch": 2375} {"train_loss": -12.344043731689453, "global_step": 399100, "epoch": 2375} {"train_loss": -12.45147705078125, "global_step": 399101, "epoch": 2375} {"train_loss": -12.391791343688965, "global_step": 399102, "epoch": 2375} {"train_loss": -12.586526870727539, "global_step": 399103, "epoch": 2375} {"train_loss": -12.624242782592773, "global_step": 399104, "epoch": 2375} {"train_loss": -12.437986373901367, "global_step": 399105, "epoch": 2375} {"train_loss": -12.511180877685547, "global_step": 399106, "epoch": 2375} {"train_loss": -12.601829528808594, "global_step": 399107, "epoch": 2375} {"train_loss": -12.63017463684082, "global_step": 399108, "epoch": 2375} {"train_loss": -12.84391975402832, "global_step": 399109, "epoch": 2375} {"train_loss": -12.533767700195312, "global_step": 399110, "epoch": 2375} {"train_loss": -12.692981719970703, "global_step": 399111, "epoch": 2375} {"train_loss": -12.659002304077148, "global_step": 399112, "epoch": 2375} {"train_loss": -12.618675231933594, "global_step": 399113, "epoch": 2375} {"train_loss": -12.725114822387695, "global_step": 399114, "epoch": 2375} {"train_loss": -12.558924674987793, "global_step": 399115, "epoch": 2375} {"train_loss": -12.48046875, "global_step": 399116, "epoch": 2375} {"train_loss": -12.77231216430664, "global_step": 399117, "epoch": 2375} {"train_loss": -12.796440124511719, "global_step": 399118, "epoch": 2375} {"train_loss": -12.855916976928711, "global_step": 399119, "epoch": 2375} {"train_loss": -12.595508575439453, "global_step": 399120, "epoch": 2375} {"train_loss": -12.653825759887695, "global_step": 399121, "epoch": 2375} {"train_loss": -12.723380088806152, "global_step": 399122, "epoch": 2375} {"train_loss": -12.671432495117188, "global_step": 399123, "epoch": 2375} {"train_loss": -12.247117042541504, "global_step": 399124, "epoch": 2375} {"train_loss": -12.599458694458008, "global_step": 399125, "epoch": 2375} {"train_loss": -12.905430793762207, "global_step": 399126, "epoch": 2375} {"train_loss": -12.60537338256836, "global_step": 399127, "epoch": 2375} {"train_loss": -12.47762393951416, "global_step": 399128, "epoch": 2375} {"train_loss": -12.65227222442627, "global_step": 399129, "epoch": 2375} {"train_loss": -12.474681854248047, "global_step": 399130, "epoch": 2375} {"train_loss": -12.205497741699219, "global_step": 399131, "epoch": 2375} {"train_loss": -12.046285629272461, "global_step": 399132, "epoch": 2375} {"train_loss": -12.803260803222656, "global_step": 399133, "epoch": 2375} {"train_loss": -12.096318244934082, "global_step": 399134, "epoch": 2375} {"train_loss": -11.876813888549805, "global_step": 399135, "epoch": 2375} {"train_loss": -12.335029602050781, "global_step": 399136, "epoch": 2375} {"train_loss": -12.40376091003418, "global_step": 399137, "epoch": 2375} {"train_loss": -12.727900505065918, "global_step": 399138, "epoch": 2375} {"train_loss": -12.537313461303711, "global_step": 399139, "epoch": 2375} {"train_loss": -12.54254150390625, "global_step": 399140, "epoch": 2375} {"train_loss": -12.31035041809082, "global_step": 399141, "epoch": 2375} {"train_loss": -12.48678207397461, "global_step": 399142, "epoch": 2375} {"train_loss": -11.175957679748535, "global_step": 399143, "epoch": 2375} {"train_loss": -10.41652774810791, "global_step": 399144, "epoch": 2375} {"train_loss": -10.660550117492676, "global_step": 399145, "epoch": 2375} {"train_loss": -10.473871231079102, "global_step": 399146, "epoch": 2375} {"train_loss": -8.293058395385742, "global_step": 399147, "epoch": 2375} {"train_loss": -11.161434173583984, "global_step": 399148, "epoch": 2375} {"train_loss": -7.09068489074707, "global_step": 399149, "epoch": 2375} {"train_loss": -7.2015533447265625, "global_step": 399150, "epoch": 2375} {"train_loss": -9.27713680267334, "global_step": 399151, "epoch": 2375} {"train_loss": -9.185029983520508, "global_step": 399152, "epoch": 2375} {"train_loss": -10.346038818359375, "global_step": 399153, "epoch": 2375} {"train_loss": -8.782682418823242, "global_step": 399154, "epoch": 2375} {"train_loss": -10.491682052612305, "global_step": 399155, "epoch": 2375} {"train_loss": -9.284053802490234, "global_step": 399156, "epoch": 2375} {"train_loss": -9.371918678283691, "global_step": 399157, "epoch": 2375} {"train_loss": -11.378755569458008, "global_step": 399158, "epoch": 2375} {"train_loss": -8.714971542358398, "global_step": 399159, "epoch": 2375} {"train_loss": -9.603645324707031, "global_step": 399160, "epoch": 2375} {"train_loss": -9.394636154174805, "global_step": 399161, "epoch": 2375} {"train_loss": -10.693997383117676, "global_step": 399162, "epoch": 2375} {"train_loss": -9.536869049072266, "global_step": 399163, "epoch": 2375} {"train_loss": -8.274513244628906, "global_step": 399164, "epoch": 2375} {"train_loss": -10.573015213012695, "global_step": 399165, "epoch": 2375} {"train_loss": -10.625592231750488, "global_step": 399166, "epoch": 2375} {"train_loss": -11.575905277615501, "global_step": 399167, "epoch": 2375, "val_loss": 294087.21875, "train_action_mse_error": 1.4670192003250122} {"train_loss": -10.396703720092773, "global_step": 399168, "epoch": 2376} {"train_loss": -10.993940353393555, "global_step": 399169, "epoch": 2376} {"train_loss": -10.982132911682129, "global_step": 399170, "epoch": 2376} {"train_loss": -11.12293815612793, "global_step": 399171, "epoch": 2376} {"train_loss": -10.8157958984375, "global_step": 399172, "epoch": 2376} {"train_loss": -10.037740707397461, "global_step": 399173, "epoch": 2376} {"train_loss": -10.867488861083984, "global_step": 399174, "epoch": 2376} {"train_loss": -10.992674827575684, "global_step": 399175, "epoch": 2376} {"train_loss": -10.783109664916992, "global_step": 399176, "epoch": 2376} {"train_loss": -11.204469680786133, "global_step": 399177, "epoch": 2376} {"train_loss": -11.364496231079102, "global_step": 399178, "epoch": 2376} {"train_loss": -11.203187942504883, "global_step": 399179, "epoch": 2376} {"train_loss": -12.084798812866211, "global_step": 399180, "epoch": 2376} {"train_loss": -11.292572021484375, "global_step": 399181, "epoch": 2376} {"train_loss": -11.902631759643555, "global_step": 399182, "epoch": 2376} {"train_loss": -11.902873039245605, "global_step": 399183, "epoch": 2376} {"train_loss": -11.4252347946167, "global_step": 399184, "epoch": 2376} {"train_loss": -11.80721664428711, "global_step": 399185, "epoch": 2376} {"train_loss": -11.916645050048828, "global_step": 399186, "epoch": 2376} {"train_loss": -11.768823623657227, "global_step": 399187, "epoch": 2376} {"train_loss": -12.275047302246094, "global_step": 399188, "epoch": 2376} {"train_loss": -12.160624504089355, "global_step": 399189, "epoch": 2376} {"train_loss": -12.151323318481445, "global_step": 399190, "epoch": 2376} {"train_loss": -12.063652992248535, "global_step": 399191, "epoch": 2376} {"train_loss": -12.252264022827148, "global_step": 399192, "epoch": 2376} {"train_loss": -12.11320972442627, "global_step": 399193, "epoch": 2376} {"train_loss": -12.0604887008667, "global_step": 399194, "epoch": 2376} {"train_loss": -12.27828311920166, "global_step": 399195, "epoch": 2376} {"train_loss": -12.254718780517578, "global_step": 399196, "epoch": 2376} {"train_loss": -12.226539611816406, "global_step": 399197, "epoch": 2376} {"train_loss": -12.195558547973633, "global_step": 399198, "epoch": 2376} {"train_loss": -12.21138858795166, "global_step": 399199, "epoch": 2376} {"train_loss": -12.121023178100586, "global_step": 399200, "epoch": 2376} {"train_loss": -12.431146621704102, "global_step": 399201, "epoch": 2376} {"train_loss": -12.206029891967773, "global_step": 399202, "epoch": 2376} {"train_loss": -12.454500198364258, "global_step": 399203, "epoch": 2376} {"train_loss": -12.559610366821289, "global_step": 399204, "epoch": 2376} {"train_loss": -12.560708999633789, "global_step": 399205, "epoch": 2376} {"train_loss": -12.325509071350098, "global_step": 399206, "epoch": 2376} {"train_loss": -12.30303955078125, "global_step": 399207, "epoch": 2376} {"train_loss": -12.073678970336914, "global_step": 399208, "epoch": 2376} {"train_loss": -12.518646240234375, "global_step": 399209, "epoch": 2376} {"train_loss": -12.289239883422852, "global_step": 399210, "epoch": 2376} {"train_loss": -12.246713638305664, "global_step": 399211, "epoch": 2376} {"train_loss": -12.134706497192383, "global_step": 399212, "epoch": 2376} {"train_loss": -12.309551239013672, "global_step": 399213, "epoch": 2376} {"train_loss": -12.428550720214844, "global_step": 399214, "epoch": 2376} {"train_loss": -12.422012329101562, "global_step": 399215, "epoch": 2376} {"train_loss": -12.502248764038086, "global_step": 399216, "epoch": 2376} {"train_loss": -12.39431381225586, "global_step": 399217, "epoch": 2376} {"train_loss": -12.466421127319336, "global_step": 399218, "epoch": 2376} {"train_loss": -12.481395721435547, "global_step": 399219, "epoch": 2376} {"train_loss": -12.059901237487793, "global_step": 399220, "epoch": 2376} {"train_loss": -12.473073959350586, "global_step": 399221, "epoch": 2376} {"train_loss": -12.65478515625, "global_step": 399222, "epoch": 2376} {"train_loss": -12.334576606750488, "global_step": 399223, "epoch": 2376} {"train_loss": -12.491188049316406, "global_step": 399224, "epoch": 2376} {"train_loss": -12.515082359313965, "global_step": 399225, "epoch": 2376} {"train_loss": -12.529406547546387, "global_step": 399226, "epoch": 2376} {"train_loss": -12.533674240112305, "global_step": 399227, "epoch": 2376} {"train_loss": -12.512491226196289, "global_step": 399228, "epoch": 2376} {"train_loss": -12.317288398742676, "global_step": 399229, "epoch": 2376} {"train_loss": -12.540712356567383, "global_step": 399230, "epoch": 2376} {"train_loss": -12.56908893585205, "global_step": 399231, "epoch": 2376} {"train_loss": -12.647378921508789, "global_step": 399232, "epoch": 2376} {"train_loss": -12.572854995727539, "global_step": 399233, "epoch": 2376} {"train_loss": -12.595972061157227, "global_step": 399234, "epoch": 2376} {"train_loss": -12.668307304382324, "global_step": 399235, "epoch": 2376} {"train_loss": -12.536371231079102, "global_step": 399236, "epoch": 2376} {"train_loss": -12.671806335449219, "global_step": 399237, "epoch": 2376} {"train_loss": -12.560279846191406, "global_step": 399238, "epoch": 2376} {"train_loss": -12.669659614562988, "global_step": 399239, "epoch": 2376} {"train_loss": -12.662932395935059, "global_step": 399240, "epoch": 2376} {"train_loss": -12.659818649291992, "global_step": 399241, "epoch": 2376} {"train_loss": -12.701837539672852, "global_step": 399242, "epoch": 2376} {"train_loss": -12.698829650878906, "global_step": 399243, "epoch": 2376} {"train_loss": -12.768518447875977, "global_step": 399244, "epoch": 2376} {"train_loss": -12.626025199890137, "global_step": 399245, "epoch": 2376} {"train_loss": -12.597197532653809, "global_step": 399246, "epoch": 2376} {"train_loss": -12.602581977844238, "global_step": 399247, "epoch": 2376} {"train_loss": -12.701811790466309, "global_step": 399248, "epoch": 2376} {"train_loss": -12.642850875854492, "global_step": 399249, "epoch": 2376} {"train_loss": -12.385428428649902, "global_step": 399250, "epoch": 2376} {"train_loss": -12.709890365600586, "global_step": 399251, "epoch": 2376} {"train_loss": -12.404014587402344, "global_step": 399252, "epoch": 2376} {"train_loss": -12.924212455749512, "global_step": 399253, "epoch": 2376} {"train_loss": -12.72887897491455, "global_step": 399254, "epoch": 2376} {"train_loss": -12.556990623474121, "global_step": 399255, "epoch": 2376} {"train_loss": -12.663443565368652, "global_step": 399256, "epoch": 2376} {"train_loss": -12.534451484680176, "global_step": 399257, "epoch": 2376} {"train_loss": -12.601516723632812, "global_step": 399258, "epoch": 2376} {"train_loss": -12.813085556030273, "global_step": 399259, "epoch": 2376} {"train_loss": -12.659189224243164, "global_step": 399260, "epoch": 2376} {"train_loss": -12.53931999206543, "global_step": 399261, "epoch": 2376} {"train_loss": -12.590448379516602, "global_step": 399262, "epoch": 2376} {"train_loss": -12.63060474395752, "global_step": 399263, "epoch": 2376} {"train_loss": -12.428743362426758, "global_step": 399264, "epoch": 2376} {"train_loss": -12.672372817993164, "global_step": 399265, "epoch": 2376} {"train_loss": -12.894158363342285, "global_step": 399266, "epoch": 2376} {"train_loss": -12.769891738891602, "global_step": 399267, "epoch": 2376} {"train_loss": -12.624414443969727, "global_step": 399268, "epoch": 2376} {"train_loss": -12.68448257446289, "global_step": 399269, "epoch": 2376} {"train_loss": -12.838576316833496, "global_step": 399270, "epoch": 2376} {"train_loss": -12.27514934539795, "global_step": 399271, "epoch": 2376} {"train_loss": -11.85263729095459, "global_step": 399272, "epoch": 2376} {"train_loss": -10.933011054992676, "global_step": 399273, "epoch": 2376} {"train_loss": -12.732085227966309, "global_step": 399274, "epoch": 2376} {"train_loss": -12.442643165588379, "global_step": 399275, "epoch": 2376} {"train_loss": -11.595744132995605, "global_step": 399276, "epoch": 2376} {"train_loss": -11.987464904785156, "global_step": 399277, "epoch": 2376} {"train_loss": -12.600738525390625, "global_step": 399278, "epoch": 2376} {"train_loss": -12.18449592590332, "global_step": 399279, "epoch": 2376} {"train_loss": -11.085273742675781, "global_step": 399280, "epoch": 2376} {"train_loss": -12.270950317382812, "global_step": 399281, "epoch": 2376} {"train_loss": -12.324967384338379, "global_step": 399282, "epoch": 2376} {"train_loss": -11.300044059753418, "global_step": 399283, "epoch": 2376} {"train_loss": -12.518054962158203, "global_step": 399284, "epoch": 2376} {"train_loss": -12.344134330749512, "global_step": 399285, "epoch": 2376} {"train_loss": -11.509064674377441, "global_step": 399286, "epoch": 2376} {"train_loss": -11.479755401611328, "global_step": 399287, "epoch": 2376} {"train_loss": -12.565110206604004, "global_step": 399288, "epoch": 2376} {"train_loss": -10.948205947875977, "global_step": 399289, "epoch": 2376} {"train_loss": -11.626630783081055, "global_step": 399290, "epoch": 2376} {"train_loss": -12.387758255004883, "global_step": 399291, "epoch": 2376} {"train_loss": -12.000652313232422, "global_step": 399292, "epoch": 2376} {"train_loss": -11.750804901123047, "global_step": 399293, "epoch": 2376} {"train_loss": -12.35484504699707, "global_step": 399294, "epoch": 2376} {"train_loss": -11.470477104187012, "global_step": 399295, "epoch": 2376} {"train_loss": -11.814749717712402, "global_step": 399296, "epoch": 2376} {"train_loss": -12.004990577697754, "global_step": 399297, "epoch": 2376} {"train_loss": -11.998010635375977, "global_step": 399298, "epoch": 2376} {"train_loss": -11.174638748168945, "global_step": 399299, "epoch": 2376} {"train_loss": -11.893842697143555, "global_step": 399300, "epoch": 2376} {"train_loss": -11.62352180480957, "global_step": 399301, "epoch": 2376} {"train_loss": -11.588337898254395, "global_step": 399302, "epoch": 2376} {"train_loss": -11.575931549072266, "global_step": 399303, "epoch": 2376} {"train_loss": -11.371683120727539, "global_step": 399304, "epoch": 2376} {"train_loss": -12.029212951660156, "global_step": 399305, "epoch": 2376} {"train_loss": -12.13394832611084, "global_step": 399306, "epoch": 2376} {"train_loss": -12.084066390991211, "global_step": 399307, "epoch": 2376} {"train_loss": -12.445865631103516, "global_step": 399308, "epoch": 2376} {"train_loss": -11.992351531982422, "global_step": 399309, "epoch": 2376} {"train_loss": -12.355775833129883, "global_step": 399310, "epoch": 2376} {"train_loss": -11.816176414489746, "global_step": 399311, "epoch": 2376} {"train_loss": -12.39830207824707, "global_step": 399312, "epoch": 2376} {"train_loss": -12.09408950805664, "global_step": 399313, "epoch": 2376} {"train_loss": -12.142410278320312, "global_step": 399314, "epoch": 2376} {"train_loss": -12.032304763793945, "global_step": 399315, "epoch": 2376} {"train_loss": -12.29755973815918, "global_step": 399316, "epoch": 2376} {"train_loss": -11.77255630493164, "global_step": 399317, "epoch": 2376} {"train_loss": -11.551640510559082, "global_step": 399318, "epoch": 2376} {"train_loss": -11.98436164855957, "global_step": 399319, "epoch": 2376} {"train_loss": -11.557859420776367, "global_step": 399320, "epoch": 2376} {"train_loss": -11.198285102844238, "global_step": 399321, "epoch": 2376} {"train_loss": -12.024419784545898, "global_step": 399322, "epoch": 2376} {"train_loss": -12.328773498535156, "global_step": 399323, "epoch": 2376} {"train_loss": -12.126201629638672, "global_step": 399324, "epoch": 2376} {"train_loss": -12.35300064086914, "global_step": 399325, "epoch": 2376} {"train_loss": -11.956215858459473, "global_step": 399326, "epoch": 2376} {"train_loss": -12.123440742492676, "global_step": 399327, "epoch": 2376} {"train_loss": -12.150991439819336, "global_step": 399328, "epoch": 2376} {"train_loss": -11.966291427612305, "global_step": 399329, "epoch": 2376} {"train_loss": -11.883438110351562, "global_step": 399330, "epoch": 2376} {"train_loss": -12.247833251953125, "global_step": 399331, "epoch": 2376} {"train_loss": -11.565712928771973, "global_step": 399332, "epoch": 2376} {"train_loss": -11.802671432495117, "global_step": 399333, "epoch": 2376} {"train_loss": -12.290725708007812, "global_step": 399334, "epoch": 2376} {"train_loss": -12.12667339188712, "global_step": 399335, "epoch": 2376, "val_loss": 299937.53125} {"train_loss": -11.626134872436523, "global_step": 399336, "epoch": 2377} {"train_loss": -11.89635944366455, "global_step": 399337, "epoch": 2377} {"train_loss": -12.168298721313477, "global_step": 399338, "epoch": 2377} {"train_loss": -11.789290428161621, "global_step": 399339, "epoch": 2377} {"train_loss": -11.771507263183594, "global_step": 399340, "epoch": 2377} {"train_loss": -11.562868118286133, "global_step": 399341, "epoch": 2377} {"train_loss": -11.652786254882812, "global_step": 399342, "epoch": 2377} {"train_loss": -12.028512954711914, "global_step": 399343, "epoch": 2377} {"train_loss": -12.505777359008789, "global_step": 399344, "epoch": 2377} {"train_loss": -11.719961166381836, "global_step": 399345, "epoch": 2377} {"train_loss": -12.222589492797852, "global_step": 399346, "epoch": 2377} {"train_loss": -11.293144226074219, "global_step": 399347, "epoch": 2377} {"train_loss": -12.36136531829834, "global_step": 399348, "epoch": 2377} {"train_loss": -11.743760108947754, "global_step": 399349, "epoch": 2377} {"train_loss": -12.391373634338379, "global_step": 399350, "epoch": 2377} {"train_loss": -11.94272518157959, "global_step": 399351, "epoch": 2377} {"train_loss": -12.292613983154297, "global_step": 399352, "epoch": 2377} {"train_loss": -12.23459529876709, "global_step": 399353, "epoch": 2377} {"train_loss": -12.367271423339844, "global_step": 399354, "epoch": 2377} {"train_loss": -12.574795722961426, "global_step": 399355, "epoch": 2377} {"train_loss": -12.211037635803223, "global_step": 399356, "epoch": 2377} {"train_loss": -12.545528411865234, "global_step": 399357, "epoch": 2377} {"train_loss": -11.914678573608398, "global_step": 399358, "epoch": 2377} {"train_loss": -12.692635536193848, "global_step": 399359, "epoch": 2377} {"train_loss": -12.084428787231445, "global_step": 399360, "epoch": 2377} {"train_loss": -12.41411304473877, "global_step": 399361, "epoch": 2377} {"train_loss": -12.439839363098145, "global_step": 399362, "epoch": 2377} {"train_loss": -12.355436325073242, "global_step": 399363, "epoch": 2377} {"train_loss": -12.554594039916992, "global_step": 399364, "epoch": 2377} {"train_loss": -12.151607513427734, "global_step": 399365, "epoch": 2377} {"train_loss": -12.647138595581055, "global_step": 399366, "epoch": 2377} {"train_loss": -12.287461280822754, "global_step": 399367, "epoch": 2377} {"train_loss": -12.283905029296875, "global_step": 399368, "epoch": 2377} {"train_loss": -12.400278091430664, "global_step": 399369, "epoch": 2377} {"train_loss": -12.428438186645508, "global_step": 399370, "epoch": 2377} {"train_loss": -12.646551132202148, "global_step": 399371, "epoch": 2377} {"train_loss": -12.538086891174316, "global_step": 399372, "epoch": 2377} {"train_loss": -12.094359397888184, "global_step": 399373, "epoch": 2377} {"train_loss": -12.288511276245117, "global_step": 399374, "epoch": 2377} {"train_loss": -11.956432342529297, "global_step": 399375, "epoch": 2377} {"train_loss": -11.9544677734375, "global_step": 399376, "epoch": 2377} {"train_loss": -12.43137264251709, "global_step": 399377, "epoch": 2377} {"train_loss": -12.573419570922852, "global_step": 399378, "epoch": 2377} {"train_loss": -12.6094388961792, "global_step": 399379, "epoch": 2377} {"train_loss": -12.646393775939941, "global_step": 399380, "epoch": 2377} {"train_loss": -12.55607795715332, "global_step": 399381, "epoch": 2377} {"train_loss": -12.433393478393555, "global_step": 399382, "epoch": 2377} {"train_loss": -12.37878131866455, "global_step": 399383, "epoch": 2377} {"train_loss": -12.327007293701172, "global_step": 399384, "epoch": 2377} {"train_loss": -12.543008804321289, "global_step": 399385, "epoch": 2377} {"train_loss": -12.540288925170898, "global_step": 399386, "epoch": 2377} {"train_loss": -11.885116577148438, "global_step": 399387, "epoch": 2377} {"train_loss": -12.074739456176758, "global_step": 399388, "epoch": 2377} {"train_loss": -12.133455276489258, "global_step": 399389, "epoch": 2377} {"train_loss": -12.326276779174805, "global_step": 399390, "epoch": 2377} {"train_loss": -11.432263374328613, "global_step": 399391, "epoch": 2377} {"train_loss": -12.079231262207031, "global_step": 399392, "epoch": 2377} {"train_loss": -12.30352783203125, "global_step": 399393, "epoch": 2377} {"train_loss": -12.147645950317383, "global_step": 399394, "epoch": 2377} {"train_loss": -10.70606803894043, "global_step": 399395, "epoch": 2377} {"train_loss": -12.584247589111328, "global_step": 399396, "epoch": 2377} {"train_loss": -11.30060863494873, "global_step": 399397, "epoch": 2377} {"train_loss": -9.78840446472168, "global_step": 399398, "epoch": 2377} {"train_loss": -11.328535079956055, "global_step": 399399, "epoch": 2377} {"train_loss": -11.863594055175781, "global_step": 399400, "epoch": 2377} {"train_loss": -11.028690338134766, "global_step": 399401, "epoch": 2377} {"train_loss": -11.767594337463379, "global_step": 399402, "epoch": 2377} {"train_loss": -10.217214584350586, "global_step": 399403, "epoch": 2377} {"train_loss": -12.207883834838867, "global_step": 399404, "epoch": 2377} {"train_loss": -11.331243515014648, "global_step": 399405, "epoch": 2377} {"train_loss": -11.408706665039062, "global_step": 399406, "epoch": 2377} {"train_loss": -11.54641056060791, "global_step": 399407, "epoch": 2377} {"train_loss": -11.618753433227539, "global_step": 399408, "epoch": 2377} {"train_loss": -12.098685264587402, "global_step": 399409, "epoch": 2377} {"train_loss": -11.637693405151367, "global_step": 399410, "epoch": 2377} {"train_loss": -11.180620193481445, "global_step": 399411, "epoch": 2377} {"train_loss": -11.950905799865723, "global_step": 399412, "epoch": 2377} {"train_loss": -11.371445655822754, "global_step": 399413, "epoch": 2377} {"train_loss": -10.154146194458008, "global_step": 399414, "epoch": 2377} {"train_loss": -11.107080459594727, "global_step": 399415, "epoch": 2377} {"train_loss": -10.222501754760742, "global_step": 399416, "epoch": 2377} {"train_loss": -11.582559585571289, "global_step": 399417, "epoch": 2377} {"train_loss": -11.28593635559082, "global_step": 399418, "epoch": 2377} {"train_loss": -11.870166778564453, "global_step": 399419, "epoch": 2377} {"train_loss": -10.998086929321289, "global_step": 399420, "epoch": 2377} {"train_loss": -11.44599723815918, "global_step": 399421, "epoch": 2377} {"train_loss": -11.499359130859375, "global_step": 399422, "epoch": 2377} {"train_loss": -11.192619323730469, "global_step": 399423, "epoch": 2377} {"train_loss": -11.131478309631348, "global_step": 399424, "epoch": 2377} {"train_loss": -11.14169692993164, "global_step": 399425, "epoch": 2377} {"train_loss": -11.459875106811523, "global_step": 399426, "epoch": 2377} {"train_loss": -11.246726989746094, "global_step": 399427, "epoch": 2377} {"train_loss": -11.73398494720459, "global_step": 399428, "epoch": 2377} {"train_loss": -10.932441711425781, "global_step": 399429, "epoch": 2377} {"train_loss": -11.777433395385742, "global_step": 399430, "epoch": 2377} {"train_loss": -11.648712158203125, "global_step": 399431, "epoch": 2377} {"train_loss": -10.932353973388672, "global_step": 399432, "epoch": 2377} {"train_loss": -12.071876525878906, "global_step": 399433, "epoch": 2377} {"train_loss": -11.480683326721191, "global_step": 399434, "epoch": 2377} {"train_loss": -11.458314895629883, "global_step": 399435, "epoch": 2377} {"train_loss": -12.10118293762207, "global_step": 399436, "epoch": 2377} {"train_loss": -11.519919395446777, "global_step": 399437, "epoch": 2377} {"train_loss": -12.134733200073242, "global_step": 399438, "epoch": 2377} {"train_loss": -12.016912460327148, "global_step": 399439, "epoch": 2377} {"train_loss": -11.726729393005371, "global_step": 399440, "epoch": 2377} {"train_loss": -12.108955383300781, "global_step": 399441, "epoch": 2377} {"train_loss": -11.883456230163574, "global_step": 399442, "epoch": 2377} {"train_loss": -11.884378433227539, "global_step": 399443, "epoch": 2377} {"train_loss": -11.705808639526367, "global_step": 399444, "epoch": 2377} {"train_loss": -12.016143798828125, "global_step": 399445, "epoch": 2377} {"train_loss": -11.738920211791992, "global_step": 399446, "epoch": 2377} {"train_loss": -12.290630340576172, "global_step": 399447, "epoch": 2377} {"train_loss": -11.596967697143555, "global_step": 399448, "epoch": 2377} {"train_loss": -12.528141021728516, "global_step": 399449, "epoch": 2377} {"train_loss": -11.96667194366455, "global_step": 399450, "epoch": 2377} {"train_loss": -12.236428260803223, "global_step": 399451, "epoch": 2377} {"train_loss": -12.211687088012695, "global_step": 399452, "epoch": 2377} {"train_loss": -12.026543617248535, "global_step": 399453, "epoch": 2377} {"train_loss": -12.138179779052734, "global_step": 399454, "epoch": 2377} {"train_loss": -12.123716354370117, "global_step": 399455, "epoch": 2377} {"train_loss": -12.233981132507324, "global_step": 399456, "epoch": 2377} {"train_loss": -12.064208984375, "global_step": 399457, "epoch": 2377} {"train_loss": -12.220622062683105, "global_step": 399458, "epoch": 2377} {"train_loss": -12.220011711120605, "global_step": 399459, "epoch": 2377} {"train_loss": -12.26550006866455, "global_step": 399460, "epoch": 2377} {"train_loss": -12.445028305053711, "global_step": 399461, "epoch": 2377} {"train_loss": -12.204095840454102, "global_step": 399462, "epoch": 2377} {"train_loss": -12.289031028747559, "global_step": 399463, "epoch": 2377} {"train_loss": -12.275802612304688, "global_step": 399464, "epoch": 2377} {"train_loss": -12.253521919250488, "global_step": 399465, "epoch": 2377} {"train_loss": -12.427526473999023, "global_step": 399466, "epoch": 2377} {"train_loss": -12.34742546081543, "global_step": 399467, "epoch": 2377} {"train_loss": -12.309389114379883, "global_step": 399468, "epoch": 2377} {"train_loss": -12.634856224060059, "global_step": 399469, "epoch": 2377} {"train_loss": -12.192290306091309, "global_step": 399470, "epoch": 2377} {"train_loss": -12.278426170349121, "global_step": 399471, "epoch": 2377} {"train_loss": -12.386890411376953, "global_step": 399472, "epoch": 2377} {"train_loss": -12.265869140625, "global_step": 399473, "epoch": 2377} {"train_loss": -12.436117172241211, "global_step": 399474, "epoch": 2377} {"train_loss": -12.091154098510742, "global_step": 399475, "epoch": 2377} {"train_loss": -12.761503219604492, "global_step": 399476, "epoch": 2377} {"train_loss": -12.37950325012207, "global_step": 399477, "epoch": 2377} {"train_loss": -12.384042739868164, "global_step": 399478, "epoch": 2377} {"train_loss": -12.273946762084961, "global_step": 399479, "epoch": 2377} {"train_loss": -12.184986114501953, "global_step": 399480, "epoch": 2377} {"train_loss": -12.539201736450195, "global_step": 399481, "epoch": 2377} {"train_loss": -12.327737808227539, "global_step": 399482, "epoch": 2377} {"train_loss": -12.570898056030273, "global_step": 399483, "epoch": 2377} {"train_loss": -12.57708740234375, "global_step": 399484, "epoch": 2377} {"train_loss": -12.456451416015625, "global_step": 399485, "epoch": 2377} {"train_loss": -12.62987232208252, "global_step": 399486, "epoch": 2377} {"train_loss": -12.704591751098633, "global_step": 399487, "epoch": 2377} {"train_loss": -12.488658905029297, "global_step": 399488, "epoch": 2377} {"train_loss": -12.527408599853516, "global_step": 399489, "epoch": 2377} {"train_loss": -12.300695419311523, "global_step": 399490, "epoch": 2377} {"train_loss": -12.139471054077148, "global_step": 399491, "epoch": 2377} {"train_loss": -11.927430152893066, "global_step": 399492, "epoch": 2377} {"train_loss": -12.411617279052734, "global_step": 399493, "epoch": 2377} {"train_loss": -12.37255573272705, "global_step": 399494, "epoch": 2377} {"train_loss": -12.24083137512207, "global_step": 399495, "epoch": 2377} {"train_loss": -12.088580131530762, "global_step": 399496, "epoch": 2377} {"train_loss": -12.485499382019043, "global_step": 399497, "epoch": 2377} {"train_loss": -11.963423728942871, "global_step": 399498, "epoch": 2377} {"train_loss": -12.331222534179688, "global_step": 399499, "epoch": 2377} {"train_loss": -12.319112777709961, "global_step": 399500, "epoch": 2377} {"train_loss": -11.590475082397461, "global_step": 399501, "epoch": 2377} {"train_loss": -12.041635513305664, "global_step": 399502, "epoch": 2377} {"train_loss": -12.004321944145929, "global_step": 399503, "epoch": 2377, "val_loss": 303194.0} {"train_loss": -11.799827575683594, "global_step": 399504, "epoch": 2378} {"train_loss": -11.977560043334961, "global_step": 399505, "epoch": 2378} {"train_loss": -11.982498168945312, "global_step": 399506, "epoch": 2378} {"train_loss": -12.020566940307617, "global_step": 399507, "epoch": 2378} {"train_loss": -11.652645111083984, "global_step": 399508, "epoch": 2378} {"train_loss": -11.759239196777344, "global_step": 399509, "epoch": 2378} {"train_loss": -12.334107398986816, "global_step": 399510, "epoch": 2378} {"train_loss": -11.691049575805664, "global_step": 399511, "epoch": 2378} {"train_loss": -12.083772659301758, "global_step": 399512, "epoch": 2378} {"train_loss": -12.28182601928711, "global_step": 399513, "epoch": 2378} {"train_loss": -12.14556884765625, "global_step": 399514, "epoch": 2378} {"train_loss": -11.553119659423828, "global_step": 399515, "epoch": 2378} {"train_loss": -12.260586738586426, "global_step": 399516, "epoch": 2378} {"train_loss": -11.873652458190918, "global_step": 399517, "epoch": 2378} {"train_loss": -12.010580062866211, "global_step": 399518, "epoch": 2378} {"train_loss": -12.13663101196289, "global_step": 399519, "epoch": 2378} {"train_loss": -11.91535758972168, "global_step": 399520, "epoch": 2378} {"train_loss": -12.203397750854492, "global_step": 399521, "epoch": 2378} {"train_loss": -12.504897117614746, "global_step": 399522, "epoch": 2378} {"train_loss": -12.345263481140137, "global_step": 399523, "epoch": 2378} {"train_loss": -12.347026824951172, "global_step": 399524, "epoch": 2378} {"train_loss": -12.542455673217773, "global_step": 399525, "epoch": 2378} {"train_loss": -12.550192832946777, "global_step": 399526, "epoch": 2378} {"train_loss": -12.576868057250977, "global_step": 399527, "epoch": 2378} {"train_loss": -12.41341495513916, "global_step": 399528, "epoch": 2378} {"train_loss": -12.554174423217773, "global_step": 399529, "epoch": 2378} {"train_loss": -12.388189315795898, "global_step": 399530, "epoch": 2378} {"train_loss": -12.307696342468262, "global_step": 399531, "epoch": 2378} {"train_loss": -12.012357711791992, "global_step": 399532, "epoch": 2378} {"train_loss": -11.933197021484375, "global_step": 399533, "epoch": 2378} {"train_loss": -12.08860969543457, "global_step": 399534, "epoch": 2378} {"train_loss": -12.305179595947266, "global_step": 399535, "epoch": 2378} {"train_loss": -12.448348045349121, "global_step": 399536, "epoch": 2378} {"train_loss": -11.982234001159668, "global_step": 399537, "epoch": 2378} {"train_loss": -11.773386001586914, "global_step": 399538, "epoch": 2378} {"train_loss": -11.27591323852539, "global_step": 399539, "epoch": 2378} {"train_loss": -11.867704391479492, "global_step": 399540, "epoch": 2378} {"train_loss": -11.415143966674805, "global_step": 399541, "epoch": 2378} {"train_loss": -12.238956451416016, "global_step": 399542, "epoch": 2378} {"train_loss": -11.446174621582031, "global_step": 399543, "epoch": 2378} {"train_loss": -11.684329986572266, "global_step": 399544, "epoch": 2378} {"train_loss": -12.485048294067383, "global_step": 399545, "epoch": 2378} {"train_loss": -11.61125373840332, "global_step": 399546, "epoch": 2378} {"train_loss": -11.838233947753906, "global_step": 399547, "epoch": 2378} {"train_loss": -12.352537155151367, "global_step": 399548, "epoch": 2378} {"train_loss": -12.261075973510742, "global_step": 399549, "epoch": 2378} {"train_loss": -12.250244140625, "global_step": 399550, "epoch": 2378} {"train_loss": -12.429878234863281, "global_step": 399551, "epoch": 2378} {"train_loss": -12.171003341674805, "global_step": 399552, "epoch": 2378} {"train_loss": -12.31036376953125, "global_step": 399553, "epoch": 2378} {"train_loss": -12.282697677612305, "global_step": 399554, "epoch": 2378} {"train_loss": -12.37800407409668, "global_step": 399555, "epoch": 2378} {"train_loss": -12.274696350097656, "global_step": 399556, "epoch": 2378} {"train_loss": -12.071439743041992, "global_step": 399557, "epoch": 2378} {"train_loss": -12.31369400024414, "global_step": 399558, "epoch": 2378} {"train_loss": -12.187759399414062, "global_step": 399559, "epoch": 2378} {"train_loss": -12.684576988220215, "global_step": 399560, "epoch": 2378} {"train_loss": -12.123161315917969, "global_step": 399561, "epoch": 2378} {"train_loss": -12.411266326904297, "global_step": 399562, "epoch": 2378} {"train_loss": -12.309661865234375, "global_step": 399563, "epoch": 2378} {"train_loss": -12.198570251464844, "global_step": 399564, "epoch": 2378} {"train_loss": -12.339326858520508, "global_step": 399565, "epoch": 2378} {"train_loss": -11.596212387084961, "global_step": 399566, "epoch": 2378} {"train_loss": -12.072906494140625, "global_step": 399567, "epoch": 2378} {"train_loss": -11.888406753540039, "global_step": 399568, "epoch": 2378} {"train_loss": -12.524799346923828, "global_step": 399569, "epoch": 2378} {"train_loss": -11.907468795776367, "global_step": 399570, "epoch": 2378} {"train_loss": -11.495840072631836, "global_step": 399571, "epoch": 2378} {"train_loss": -11.839662551879883, "global_step": 399572, "epoch": 2378} {"train_loss": -12.30970573425293, "global_step": 399573, "epoch": 2378} {"train_loss": -11.277321815490723, "global_step": 399574, "epoch": 2378} {"train_loss": -12.443849563598633, "global_step": 399575, "epoch": 2378} {"train_loss": -12.703386306762695, "global_step": 399576, "epoch": 2378} {"train_loss": -12.15645980834961, "global_step": 399577, "epoch": 2378} {"train_loss": -12.727306365966797, "global_step": 399578, "epoch": 2378} {"train_loss": -12.099090576171875, "global_step": 399579, "epoch": 2378} {"train_loss": -11.83339786529541, "global_step": 399580, "epoch": 2378} {"train_loss": -12.41893196105957, "global_step": 399581, "epoch": 2378} {"train_loss": -11.930879592895508, "global_step": 399582, "epoch": 2378} {"train_loss": -11.824707984924316, "global_step": 399583, "epoch": 2378} {"train_loss": -12.332155227661133, "global_step": 399584, "epoch": 2378} {"train_loss": -12.167547225952148, "global_step": 399585, "epoch": 2378} {"train_loss": -12.333576202392578, "global_step": 399586, "epoch": 2378} {"train_loss": -12.579181671142578, "global_step": 399587, "epoch": 2378} {"train_loss": -12.481657981872559, "global_step": 399588, "epoch": 2378} {"train_loss": -12.372919082641602, "global_step": 399589, "epoch": 2378} {"train_loss": -12.497861862182617, "global_step": 399590, "epoch": 2378} {"train_loss": -12.486478805541992, "global_step": 399591, "epoch": 2378} {"train_loss": -12.28370475769043, "global_step": 399592, "epoch": 2378} {"train_loss": -12.128118515014648, "global_step": 399593, "epoch": 2378} {"train_loss": -12.69576644897461, "global_step": 399594, "epoch": 2378} {"train_loss": -12.54748249053955, "global_step": 399595, "epoch": 2378} {"train_loss": -12.507039070129395, "global_step": 399596, "epoch": 2378} {"train_loss": -12.466215133666992, "global_step": 399597, "epoch": 2378} {"train_loss": -12.560510635375977, "global_step": 399598, "epoch": 2378} {"train_loss": -12.769754409790039, "global_step": 399599, "epoch": 2378} {"train_loss": -12.5183744430542, "global_step": 399600, "epoch": 2378} {"train_loss": -12.635684967041016, "global_step": 399601, "epoch": 2378} {"train_loss": -12.504639625549316, "global_step": 399602, "epoch": 2378} {"train_loss": -12.479684829711914, "global_step": 399603, "epoch": 2378} {"train_loss": -12.613350868225098, "global_step": 399604, "epoch": 2378} {"train_loss": -12.403032302856445, "global_step": 399605, "epoch": 2378} {"train_loss": -12.44530200958252, "global_step": 399606, "epoch": 2378} {"train_loss": -12.42156982421875, "global_step": 399607, "epoch": 2378} {"train_loss": -12.506143569946289, "global_step": 399608, "epoch": 2378} {"train_loss": -12.471181869506836, "global_step": 399609, "epoch": 2378} {"train_loss": -12.292152404785156, "global_step": 399610, "epoch": 2378} {"train_loss": -12.220283508300781, "global_step": 399611, "epoch": 2378} {"train_loss": -12.16463851928711, "global_step": 399612, "epoch": 2378} {"train_loss": -11.937744140625, "global_step": 399613, "epoch": 2378} {"train_loss": -12.383512496948242, "global_step": 399614, "epoch": 2378} {"train_loss": -12.239604949951172, "global_step": 399615, "epoch": 2378} {"train_loss": -11.792123794555664, "global_step": 399616, "epoch": 2378} {"train_loss": -11.883979797363281, "global_step": 399617, "epoch": 2378} {"train_loss": -12.376517295837402, "global_step": 399618, "epoch": 2378} {"train_loss": -11.915077209472656, "global_step": 399619, "epoch": 2378} {"train_loss": -12.0774564743042, "global_step": 399620, "epoch": 2378} {"train_loss": -11.916545867919922, "global_step": 399621, "epoch": 2378} {"train_loss": -12.174407958984375, "global_step": 399622, "epoch": 2378} {"train_loss": -11.278465270996094, "global_step": 399623, "epoch": 2378} {"train_loss": -11.9010009765625, "global_step": 399624, "epoch": 2378} {"train_loss": -12.419685363769531, "global_step": 399625, "epoch": 2378} {"train_loss": -12.067510604858398, "global_step": 399626, "epoch": 2378} {"train_loss": -10.989702224731445, "global_step": 399627, "epoch": 2378} {"train_loss": -11.383962631225586, "global_step": 399628, "epoch": 2378} {"train_loss": -11.38086986541748, "global_step": 399629, "epoch": 2378} {"train_loss": -10.038639068603516, "global_step": 399630, "epoch": 2378} {"train_loss": -10.893396377563477, "global_step": 399631, "epoch": 2378} {"train_loss": -10.247150421142578, "global_step": 399632, "epoch": 2378} {"train_loss": -9.99671459197998, "global_step": 399633, "epoch": 2378} {"train_loss": -10.824893951416016, "global_step": 399634, "epoch": 2378} {"train_loss": -10.646454811096191, "global_step": 399635, "epoch": 2378} {"train_loss": -11.598770141601562, "global_step": 399636, "epoch": 2378} {"train_loss": -10.737447738647461, "global_step": 399637, "epoch": 2378} {"train_loss": -11.813814163208008, "global_step": 399638, "epoch": 2378} {"train_loss": -11.389845848083496, "global_step": 399639, "epoch": 2378} {"train_loss": -11.220308303833008, "global_step": 399640, "epoch": 2378} {"train_loss": -11.266780853271484, "global_step": 399641, "epoch": 2378} {"train_loss": -10.689228057861328, "global_step": 399642, "epoch": 2378} {"train_loss": -10.210226058959961, "global_step": 399643, "epoch": 2378} {"train_loss": -11.359037399291992, "global_step": 399644, "epoch": 2378} {"train_loss": -10.516626358032227, "global_step": 399645, "epoch": 2378} {"train_loss": -11.217046737670898, "global_step": 399646, "epoch": 2378} {"train_loss": -10.757555961608887, "global_step": 399647, "epoch": 2378} {"train_loss": -10.731098175048828, "global_step": 399648, "epoch": 2378} {"train_loss": -11.347945213317871, "global_step": 399649, "epoch": 2378} {"train_loss": -10.721637725830078, "global_step": 399650, "epoch": 2378} {"train_loss": -11.875387191772461, "global_step": 399651, "epoch": 2378} {"train_loss": -11.163225173950195, "global_step": 399652, "epoch": 2378} {"train_loss": -12.214219093322754, "global_step": 399653, "epoch": 2378} {"train_loss": -11.660690307617188, "global_step": 399654, "epoch": 2378} {"train_loss": -11.665862083435059, "global_step": 399655, "epoch": 2378} {"train_loss": -11.724878311157227, "global_step": 399656, "epoch": 2378} {"train_loss": -11.15045166015625, "global_step": 399657, "epoch": 2378} {"train_loss": -12.308038711547852, "global_step": 399658, "epoch": 2378} {"train_loss": -11.409006118774414, "global_step": 399659, "epoch": 2378} {"train_loss": -11.909459114074707, "global_step": 399660, "epoch": 2378} {"train_loss": -11.749214172363281, "global_step": 399661, "epoch": 2378} {"train_loss": -11.676915168762207, "global_step": 399662, "epoch": 2378} {"train_loss": -11.912860870361328, "global_step": 399663, "epoch": 2378} {"train_loss": -11.645450592041016, "global_step": 399664, "epoch": 2378} {"train_loss": -12.278829574584961, "global_step": 399665, "epoch": 2378} {"train_loss": -12.057308197021484, "global_step": 399666, "epoch": 2378} {"train_loss": -11.791121482849121, "global_step": 399667, "epoch": 2378} {"train_loss": -12.228106498718262, "global_step": 399668, "epoch": 2378} {"train_loss": -12.090801239013672, "global_step": 399669, "epoch": 2378} {"train_loss": -12.46931266784668, "global_step": 399670, "epoch": 2378} {"train_loss": -11.959115658487592, "global_step": 399671, "epoch": 2378, "val_loss": 304662.90625} {"train_loss": -12.351724624633789, "global_step": 399672, "epoch": 2379} {"train_loss": -12.344121932983398, "global_step": 399673, "epoch": 2379} {"train_loss": -11.971017837524414, "global_step": 399674, "epoch": 2379} {"train_loss": -12.120562553405762, "global_step": 399675, "epoch": 2379} {"train_loss": -11.804086685180664, "global_step": 399676, "epoch": 2379} {"train_loss": -12.144229888916016, "global_step": 399677, "epoch": 2379} {"train_loss": -12.072770118713379, "global_step": 399678, "epoch": 2379} {"train_loss": -12.120006561279297, "global_step": 399679, "epoch": 2379} {"train_loss": -12.336323738098145, "global_step": 399680, "epoch": 2379} {"train_loss": -12.305458068847656, "global_step": 399681, "epoch": 2379} {"train_loss": -12.336633682250977, "global_step": 399682, "epoch": 2379} {"train_loss": -12.305185317993164, "global_step": 399683, "epoch": 2379} {"train_loss": -12.408639907836914, "global_step": 399684, "epoch": 2379} {"train_loss": -12.355398178100586, "global_step": 399685, "epoch": 2379} {"train_loss": -12.537818908691406, "global_step": 399686, "epoch": 2379} {"train_loss": -12.50220012664795, "global_step": 399687, "epoch": 2379} {"train_loss": -12.462114334106445, "global_step": 399688, "epoch": 2379} {"train_loss": -12.406819343566895, "global_step": 399689, "epoch": 2379} {"train_loss": -12.607006072998047, "global_step": 399690, "epoch": 2379} {"train_loss": -12.63260269165039, "global_step": 399691, "epoch": 2379} {"train_loss": -12.628110885620117, "global_step": 399692, "epoch": 2379} {"train_loss": -12.467131614685059, "global_step": 399693, "epoch": 2379} {"train_loss": -12.277848243713379, "global_step": 399694, "epoch": 2379} {"train_loss": -12.386435508728027, "global_step": 399695, "epoch": 2379} {"train_loss": -12.463887214660645, "global_step": 399696, "epoch": 2379} {"train_loss": -12.371566772460938, "global_step": 399697, "epoch": 2379} {"train_loss": -12.215965270996094, "global_step": 399698, "epoch": 2379} {"train_loss": -12.600566864013672, "global_step": 399699, "epoch": 2379} {"train_loss": -12.329768180847168, "global_step": 399700, "epoch": 2379} {"train_loss": -12.504945755004883, "global_step": 399701, "epoch": 2379} {"train_loss": -12.497533798217773, "global_step": 399702, "epoch": 2379} {"train_loss": -12.246149063110352, "global_step": 399703, "epoch": 2379} {"train_loss": -12.501823425292969, "global_step": 399704, "epoch": 2379} {"train_loss": -12.408039093017578, "global_step": 399705, "epoch": 2379} {"train_loss": -11.791900634765625, "global_step": 399706, "epoch": 2379} {"train_loss": -12.657896041870117, "global_step": 399707, "epoch": 2379} {"train_loss": -12.104820251464844, "global_step": 399708, "epoch": 2379} {"train_loss": -12.405811309814453, "global_step": 399709, "epoch": 2379} {"train_loss": -12.385887145996094, "global_step": 399710, "epoch": 2379} {"train_loss": -12.073935508728027, "global_step": 399711, "epoch": 2379} {"train_loss": -12.307680130004883, "global_step": 399712, "epoch": 2379} {"train_loss": -12.35911750793457, "global_step": 399713, "epoch": 2379} {"train_loss": -12.497337341308594, "global_step": 399714, "epoch": 2379} {"train_loss": -12.137467384338379, "global_step": 399715, "epoch": 2379} {"train_loss": -12.497520446777344, "global_step": 399716, "epoch": 2379} {"train_loss": -12.582897186279297, "global_step": 399717, "epoch": 2379} {"train_loss": -12.558558464050293, "global_step": 399718, "epoch": 2379} {"train_loss": -12.632403373718262, "global_step": 399719, "epoch": 2379} {"train_loss": -12.812450408935547, "global_step": 399720, "epoch": 2379} {"train_loss": -12.573768615722656, "global_step": 399721, "epoch": 2379} {"train_loss": -12.778447151184082, "global_step": 399722, "epoch": 2379} {"train_loss": -12.687652587890625, "global_step": 399723, "epoch": 2379} {"train_loss": -12.24853515625, "global_step": 399724, "epoch": 2379} {"train_loss": -12.5438232421875, "global_step": 399725, "epoch": 2379} {"train_loss": -12.783141136169434, "global_step": 399726, "epoch": 2379} {"train_loss": -12.434659957885742, "global_step": 399727, "epoch": 2379} {"train_loss": -12.308820724487305, "global_step": 399728, "epoch": 2379} {"train_loss": -12.416621208190918, "global_step": 399729, "epoch": 2379} {"train_loss": -12.479726791381836, "global_step": 399730, "epoch": 2379} {"train_loss": -12.405807495117188, "global_step": 399731, "epoch": 2379} {"train_loss": -12.749649047851562, "global_step": 399732, "epoch": 2379} {"train_loss": -12.058717727661133, "global_step": 399733, "epoch": 2379} {"train_loss": -12.255634307861328, "global_step": 399734, "epoch": 2379} {"train_loss": -12.814589500427246, "global_step": 399735, "epoch": 2379} {"train_loss": -12.664301872253418, "global_step": 399736, "epoch": 2379} {"train_loss": -12.526150703430176, "global_step": 399737, "epoch": 2379} {"train_loss": -12.611967086791992, "global_step": 399738, "epoch": 2379} {"train_loss": -12.598280906677246, "global_step": 399739, "epoch": 2379} {"train_loss": -12.697969436645508, "global_step": 399740, "epoch": 2379} {"train_loss": -12.671878814697266, "global_step": 399741, "epoch": 2379} {"train_loss": -12.598922729492188, "global_step": 399742, "epoch": 2379} {"train_loss": -12.294947624206543, "global_step": 399743, "epoch": 2379} {"train_loss": -11.878873825073242, "global_step": 399744, "epoch": 2379} {"train_loss": -12.118670463562012, "global_step": 399745, "epoch": 2379} {"train_loss": -12.449262619018555, "global_step": 399746, "epoch": 2379} {"train_loss": -11.957741737365723, "global_step": 399747, "epoch": 2379} {"train_loss": -12.247572898864746, "global_step": 399748, "epoch": 2379} {"train_loss": -12.668033599853516, "global_step": 399749, "epoch": 2379} {"train_loss": -11.818439483642578, "global_step": 399750, "epoch": 2379} {"train_loss": -11.750531196594238, "global_step": 399751, "epoch": 2379} {"train_loss": -13.074289321899414, "global_step": 399752, "epoch": 2379} {"train_loss": -11.678807258605957, "global_step": 399753, "epoch": 2379} {"train_loss": -12.162822723388672, "global_step": 399754, "epoch": 2379} {"train_loss": -12.017542839050293, "global_step": 399755, "epoch": 2379} {"train_loss": -11.808097839355469, "global_step": 399756, "epoch": 2379} {"train_loss": -11.240448951721191, "global_step": 399757, "epoch": 2379} {"train_loss": -12.617631912231445, "global_step": 399758, "epoch": 2379} {"train_loss": -10.613600730895996, "global_step": 399759, "epoch": 2379} {"train_loss": -12.133193969726562, "global_step": 399760, "epoch": 2379} {"train_loss": -10.833133697509766, "global_step": 399761, "epoch": 2379} {"train_loss": -10.863490104675293, "global_step": 399762, "epoch": 2379} {"train_loss": -12.113357543945312, "global_step": 399763, "epoch": 2379} {"train_loss": -11.111726760864258, "global_step": 399764, "epoch": 2379} {"train_loss": -12.380615234375, "global_step": 399765, "epoch": 2379} {"train_loss": -12.216001510620117, "global_step": 399766, "epoch": 2379} {"train_loss": -11.995134353637695, "global_step": 399767, "epoch": 2379} {"train_loss": -12.635741233825684, "global_step": 399768, "epoch": 2379} {"train_loss": -11.935985565185547, "global_step": 399769, "epoch": 2379} {"train_loss": -12.654688835144043, "global_step": 399770, "epoch": 2379} {"train_loss": -12.117108345031738, "global_step": 399771, "epoch": 2379} {"train_loss": -12.00943374633789, "global_step": 399772, "epoch": 2379} {"train_loss": -12.410178184509277, "global_step": 399773, "epoch": 2379} {"train_loss": -12.347365379333496, "global_step": 399774, "epoch": 2379} {"train_loss": -12.214603424072266, "global_step": 399775, "epoch": 2379} {"train_loss": -12.360637664794922, "global_step": 399776, "epoch": 2379} {"train_loss": -12.064291954040527, "global_step": 399777, "epoch": 2379} {"train_loss": -11.574789047241211, "global_step": 399778, "epoch": 2379} {"train_loss": -12.28786849975586, "global_step": 399779, "epoch": 2379} {"train_loss": -12.523517608642578, "global_step": 399780, "epoch": 2379} {"train_loss": -11.755516052246094, "global_step": 399781, "epoch": 2379} {"train_loss": -12.38563060760498, "global_step": 399782, "epoch": 2379} {"train_loss": -11.949179649353027, "global_step": 399783, "epoch": 2379} {"train_loss": -11.702288627624512, "global_step": 399784, "epoch": 2379} {"train_loss": -12.033122062683105, "global_step": 399785, "epoch": 2379} {"train_loss": -11.666726112365723, "global_step": 399786, "epoch": 2379} {"train_loss": -11.951101303100586, "global_step": 399787, "epoch": 2379} {"train_loss": -12.151529312133789, "global_step": 399788, "epoch": 2379} {"train_loss": -11.712923049926758, "global_step": 399789, "epoch": 2379} {"train_loss": -12.293209075927734, "global_step": 399790, "epoch": 2379} {"train_loss": -11.78516960144043, "global_step": 399791, "epoch": 2379} {"train_loss": -12.242902755737305, "global_step": 399792, "epoch": 2379} {"train_loss": -12.633142471313477, "global_step": 399793, "epoch": 2379} {"train_loss": -12.39710807800293, "global_step": 399794, "epoch": 2379} {"train_loss": -12.567753791809082, "global_step": 399795, "epoch": 2379} {"train_loss": -12.292398452758789, "global_step": 399796, "epoch": 2379} {"train_loss": -12.289291381835938, "global_step": 399797, "epoch": 2379} {"train_loss": -12.046072006225586, "global_step": 399798, "epoch": 2379} {"train_loss": -12.76832389831543, "global_step": 399799, "epoch": 2379} {"train_loss": -12.215997695922852, "global_step": 399800, "epoch": 2379} {"train_loss": -12.556831359863281, "global_step": 399801, "epoch": 2379} {"train_loss": -12.30243968963623, "global_step": 399802, "epoch": 2379} {"train_loss": -12.445000648498535, "global_step": 399803, "epoch": 2379} {"train_loss": -12.363351821899414, "global_step": 399804, "epoch": 2379} {"train_loss": -12.323795318603516, "global_step": 399805, "epoch": 2379} {"train_loss": -12.56078052520752, "global_step": 399806, "epoch": 2379} {"train_loss": -12.340377807617188, "global_step": 399807, "epoch": 2379} {"train_loss": -12.502567291259766, "global_step": 399808, "epoch": 2379} {"train_loss": -12.338132858276367, "global_step": 399809, "epoch": 2379} {"train_loss": -12.561723709106445, "global_step": 399810, "epoch": 2379} {"train_loss": -12.677945137023926, "global_step": 399811, "epoch": 2379} {"train_loss": -12.466379165649414, "global_step": 399812, "epoch": 2379} {"train_loss": -12.27841854095459, "global_step": 399813, "epoch": 2379} {"train_loss": -12.587864875793457, "global_step": 399814, "epoch": 2379} {"train_loss": -12.523515701293945, "global_step": 399815, "epoch": 2379} {"train_loss": -12.16702651977539, "global_step": 399816, "epoch": 2379} {"train_loss": -12.444551467895508, "global_step": 399817, "epoch": 2379} {"train_loss": -12.339153289794922, "global_step": 399818, "epoch": 2379} {"train_loss": -12.304634094238281, "global_step": 399819, "epoch": 2379} {"train_loss": -11.930999755859375, "global_step": 399820, "epoch": 2379} {"train_loss": -12.63266372680664, "global_step": 399821, "epoch": 2379} {"train_loss": -12.380637168884277, "global_step": 399822, "epoch": 2379} {"train_loss": -12.39953327178955, "global_step": 399823, "epoch": 2379} {"train_loss": -12.527772903442383, "global_step": 399824, "epoch": 2379} {"train_loss": -12.21535873413086, "global_step": 399825, "epoch": 2379} {"train_loss": -12.535246849060059, "global_step": 399826, "epoch": 2379} {"train_loss": -12.678647994995117, "global_step": 399827, "epoch": 2379} {"train_loss": -12.278081893920898, "global_step": 399828, "epoch": 2379} {"train_loss": -12.331518173217773, "global_step": 399829, "epoch": 2379} {"train_loss": -12.59022331237793, "global_step": 399830, "epoch": 2379} {"train_loss": -12.7120361328125, "global_step": 399831, "epoch": 2379} {"train_loss": -12.440916061401367, "global_step": 399832, "epoch": 2379} {"train_loss": -12.483438491821289, "global_step": 399833, "epoch": 2379} {"train_loss": -12.618792533874512, "global_step": 399834, "epoch": 2379} {"train_loss": -12.21061897277832, "global_step": 399835, "epoch": 2379} {"train_loss": -12.110088348388672, "global_step": 399836, "epoch": 2379} {"train_loss": -12.01794719696045, "global_step": 399837, "epoch": 2379} {"train_loss": -12.061868667602539, "global_step": 399838, "epoch": 2379} {"train_loss": -12.288044356164479, "global_step": 399839, "epoch": 2379, "val_loss": 299981.8125} {"train_loss": -11.21267318725586, "global_step": 399840, "epoch": 2380} {"train_loss": -12.267200469970703, "global_step": 399841, "epoch": 2380} {"train_loss": -10.417023658752441, "global_step": 399842, "epoch": 2380} {"train_loss": -10.904958724975586, "global_step": 399843, "epoch": 2380} {"train_loss": -11.652597427368164, "global_step": 399844, "epoch": 2380} {"train_loss": -11.153697967529297, "global_step": 399845, "epoch": 2380} {"train_loss": -10.930419921875, "global_step": 399846, "epoch": 2380} {"train_loss": -10.690494537353516, "global_step": 399847, "epoch": 2380} {"train_loss": -10.552398681640625, "global_step": 399848, "epoch": 2380} {"train_loss": -12.016315460205078, "global_step": 399849, "epoch": 2380} {"train_loss": -10.702796936035156, "global_step": 399850, "epoch": 2380} {"train_loss": -12.029153823852539, "global_step": 399851, "epoch": 2380} {"train_loss": -11.296116828918457, "global_step": 399852, "epoch": 2380} {"train_loss": -11.604269027709961, "global_step": 399853, "epoch": 2380} {"train_loss": -11.393932342529297, "global_step": 399854, "epoch": 2380} {"train_loss": -11.871688842773438, "global_step": 399855, "epoch": 2380} {"train_loss": -11.21563720703125, "global_step": 399856, "epoch": 2380} {"train_loss": -11.977652549743652, "global_step": 399857, "epoch": 2380} {"train_loss": -12.158839225769043, "global_step": 399858, "epoch": 2380} {"train_loss": -11.623968124389648, "global_step": 399859, "epoch": 2380} {"train_loss": -11.639581680297852, "global_step": 399860, "epoch": 2380} {"train_loss": -12.307381629943848, "global_step": 399861, "epoch": 2380} {"train_loss": -11.659494400024414, "global_step": 399862, "epoch": 2380} {"train_loss": -12.377955436706543, "global_step": 399863, "epoch": 2380} {"train_loss": -11.830055236816406, "global_step": 399864, "epoch": 2380} {"train_loss": -11.54153823852539, "global_step": 399865, "epoch": 2380} {"train_loss": -12.377911567687988, "global_step": 399866, "epoch": 2380} {"train_loss": -11.707376480102539, "global_step": 399867, "epoch": 2380} {"train_loss": -12.3731689453125, "global_step": 399868, "epoch": 2380} {"train_loss": -12.409549713134766, "global_step": 399869, "epoch": 2380} {"train_loss": -11.946157455444336, "global_step": 399870, "epoch": 2380} {"train_loss": -12.41574478149414, "global_step": 399871, "epoch": 2380} {"train_loss": -12.380982398986816, "global_step": 399872, "epoch": 2380} {"train_loss": -12.29642105102539, "global_step": 399873, "epoch": 2380} {"train_loss": -12.419678688049316, "global_step": 399874, "epoch": 2380} {"train_loss": -11.892154693603516, "global_step": 399875, "epoch": 2380} {"train_loss": -12.36740493774414, "global_step": 399876, "epoch": 2380} {"train_loss": -11.847936630249023, "global_step": 399877, "epoch": 2380} {"train_loss": -10.200479507446289, "global_step": 399878, "epoch": 2380} {"train_loss": -12.507108688354492, "global_step": 399879, "epoch": 2380} {"train_loss": -11.210418701171875, "global_step": 399880, "epoch": 2380} {"train_loss": -11.06943130493164, "global_step": 399881, "epoch": 2380} {"train_loss": -12.03359317779541, "global_step": 399882, "epoch": 2380} {"train_loss": -11.071130752563477, "global_step": 399883, "epoch": 2380} {"train_loss": -12.034300804138184, "global_step": 399884, "epoch": 2380} {"train_loss": -11.259773254394531, "global_step": 399885, "epoch": 2380} {"train_loss": -12.230499267578125, "global_step": 399886, "epoch": 2380} {"train_loss": -11.503708839416504, "global_step": 399887, "epoch": 2380} {"train_loss": -11.736557006835938, "global_step": 399888, "epoch": 2380} {"train_loss": -12.24545669555664, "global_step": 399889, "epoch": 2380} {"train_loss": -11.198366165161133, "global_step": 399890, "epoch": 2380} {"train_loss": -12.038115501403809, "global_step": 399891, "epoch": 2380} {"train_loss": -11.762107849121094, "global_step": 399892, "epoch": 2380} {"train_loss": -11.551416397094727, "global_step": 399893, "epoch": 2380} {"train_loss": -12.183238983154297, "global_step": 399894, "epoch": 2380} {"train_loss": -10.991504669189453, "global_step": 399895, "epoch": 2380} {"train_loss": -12.155754089355469, "global_step": 399896, "epoch": 2380} {"train_loss": -11.222596168518066, "global_step": 399897, "epoch": 2380} {"train_loss": -12.07919692993164, "global_step": 399898, "epoch": 2380} {"train_loss": -11.63007926940918, "global_step": 399899, "epoch": 2380} {"train_loss": -11.746874809265137, "global_step": 399900, "epoch": 2380} {"train_loss": -12.019254684448242, "global_step": 399901, "epoch": 2380} {"train_loss": -11.604418754577637, "global_step": 399902, "epoch": 2380} {"train_loss": -12.451471328735352, "global_step": 399903, "epoch": 2380} {"train_loss": -11.267890930175781, "global_step": 399904, "epoch": 2380} {"train_loss": -12.37278938293457, "global_step": 399905, "epoch": 2380} {"train_loss": -11.741193771362305, "global_step": 399906, "epoch": 2380} {"train_loss": -11.577644348144531, "global_step": 399907, "epoch": 2380} {"train_loss": -12.537210464477539, "global_step": 399908, "epoch": 2380} {"train_loss": -11.797708511352539, "global_step": 399909, "epoch": 2380} {"train_loss": -12.37977123260498, "global_step": 399910, "epoch": 2380} {"train_loss": -12.227836608886719, "global_step": 399911, "epoch": 2380} {"train_loss": -12.418834686279297, "global_step": 399912, "epoch": 2380} {"train_loss": -12.389967918395996, "global_step": 399913, "epoch": 2380} {"train_loss": -12.4036865234375, "global_step": 399914, "epoch": 2380} {"train_loss": -12.234589576721191, "global_step": 399915, "epoch": 2380} {"train_loss": -12.081986427307129, "global_step": 399916, "epoch": 2380} {"train_loss": -12.157097816467285, "global_step": 399917, "epoch": 2380} {"train_loss": -12.094396591186523, "global_step": 399918, "epoch": 2380} {"train_loss": -12.451168060302734, "global_step": 399919, "epoch": 2380} {"train_loss": -12.141413688659668, "global_step": 399920, "epoch": 2380} {"train_loss": -12.262660026550293, "global_step": 399921, "epoch": 2380} {"train_loss": -11.883514404296875, "global_step": 399922, "epoch": 2380} {"train_loss": -12.278139114379883, "global_step": 399923, "epoch": 2380} {"train_loss": -11.782705307006836, "global_step": 399924, "epoch": 2380} {"train_loss": -11.71871280670166, "global_step": 399925, "epoch": 2380} {"train_loss": -11.718725204467773, "global_step": 399926, "epoch": 2380} {"train_loss": -11.456721305847168, "global_step": 399927, "epoch": 2380} {"train_loss": -11.937782287597656, "global_step": 399928, "epoch": 2380} {"train_loss": -11.163426399230957, "global_step": 399929, "epoch": 2380} {"train_loss": -11.576713562011719, "global_step": 399930, "epoch": 2380} {"train_loss": -10.765497207641602, "global_step": 399931, "epoch": 2380} {"train_loss": -10.951904296875, "global_step": 399932, "epoch": 2380} {"train_loss": -11.956253051757812, "global_step": 399933, "epoch": 2380} {"train_loss": -11.311628341674805, "global_step": 399934, "epoch": 2380} {"train_loss": -11.328149795532227, "global_step": 399935, "epoch": 2380} {"train_loss": -10.700965881347656, "global_step": 399936, "epoch": 2380} {"train_loss": -10.223804473876953, "global_step": 399937, "epoch": 2380} {"train_loss": -10.838006973266602, "global_step": 399938, "epoch": 2380} {"train_loss": -11.602706909179688, "global_step": 399939, "epoch": 2380} {"train_loss": -9.957597732543945, "global_step": 399940, "epoch": 2380} {"train_loss": -11.25323486328125, "global_step": 399941, "epoch": 2380} {"train_loss": -12.035091400146484, "global_step": 399942, "epoch": 2380} {"train_loss": -10.85563850402832, "global_step": 399943, "epoch": 2380} {"train_loss": -11.008766174316406, "global_step": 399944, "epoch": 2380} {"train_loss": -11.6578369140625, "global_step": 399945, "epoch": 2380} {"train_loss": -10.254066467285156, "global_step": 399946, "epoch": 2380} {"train_loss": -11.514049530029297, "global_step": 399947, "epoch": 2380} {"train_loss": -10.841692924499512, "global_step": 399948, "epoch": 2380} {"train_loss": -11.304332733154297, "global_step": 399949, "epoch": 2380} {"train_loss": -11.401430130004883, "global_step": 399950, "epoch": 2380} {"train_loss": -12.144649505615234, "global_step": 399951, "epoch": 2380} {"train_loss": -11.365917205810547, "global_step": 399952, "epoch": 2380} {"train_loss": -12.20857048034668, "global_step": 399953, "epoch": 2380} {"train_loss": -10.931377410888672, "global_step": 399954, "epoch": 2380} {"train_loss": -12.069513320922852, "global_step": 399955, "epoch": 2380} {"train_loss": -11.869054794311523, "global_step": 399956, "epoch": 2380} {"train_loss": -11.938407897949219, "global_step": 399957, "epoch": 2380} {"train_loss": -11.840896606445312, "global_step": 399958, "epoch": 2380} {"train_loss": -12.238558769226074, "global_step": 399959, "epoch": 2380} {"train_loss": -11.62449836730957, "global_step": 399960, "epoch": 2380} {"train_loss": -12.188563346862793, "global_step": 399961, "epoch": 2380} {"train_loss": -11.642080307006836, "global_step": 399962, "epoch": 2380} {"train_loss": -12.328695297241211, "global_step": 399963, "epoch": 2380} {"train_loss": -11.696083068847656, "global_step": 399964, "epoch": 2380} {"train_loss": -12.388708114624023, "global_step": 399965, "epoch": 2380} {"train_loss": -11.90831184387207, "global_step": 399966, "epoch": 2380} {"train_loss": -12.050559997558594, "global_step": 399967, "epoch": 2380} {"train_loss": -12.427778244018555, "global_step": 399968, "epoch": 2380} {"train_loss": -12.355875015258789, "global_step": 399969, "epoch": 2380} {"train_loss": -12.399490356445312, "global_step": 399970, "epoch": 2380} {"train_loss": -12.492753028869629, "global_step": 399971, "epoch": 2380} {"train_loss": -12.27811050415039, "global_step": 399972, "epoch": 2380} {"train_loss": -12.645034790039062, "global_step": 399973, "epoch": 2380} {"train_loss": -12.272554397583008, "global_step": 399974, "epoch": 2380} {"train_loss": -12.347915649414062, "global_step": 399975, "epoch": 2380} {"train_loss": -12.380707740783691, "global_step": 399976, "epoch": 2380} {"train_loss": -12.20461654663086, "global_step": 399977, "epoch": 2380} {"train_loss": -12.22359848022461, "global_step": 399978, "epoch": 2380} {"train_loss": -12.274433135986328, "global_step": 399979, "epoch": 2380} {"train_loss": -12.394498825073242, "global_step": 399980, "epoch": 2380} {"train_loss": -12.309125900268555, "global_step": 399981, "epoch": 2380} {"train_loss": -12.446649551391602, "global_step": 399982, "epoch": 2380} {"train_loss": -12.308887481689453, "global_step": 399983, "epoch": 2380} {"train_loss": -12.220924377441406, "global_step": 399984, "epoch": 2380} {"train_loss": -12.304849624633789, "global_step": 399985, "epoch": 2380} {"train_loss": -12.415843963623047, "global_step": 399986, "epoch": 2380} {"train_loss": -12.521345138549805, "global_step": 399987, "epoch": 2380} {"train_loss": -12.203636169433594, "global_step": 399988, "epoch": 2380} {"train_loss": -12.170883178710938, "global_step": 399989, "epoch": 2380} {"train_loss": -12.243385314941406, "global_step": 399990, "epoch": 2380} {"train_loss": -11.91104507446289, "global_step": 399991, "epoch": 2380} {"train_loss": -12.516881942749023, "global_step": 399992, "epoch": 2380} {"train_loss": -12.226083755493164, "global_step": 399993, "epoch": 2380} {"train_loss": -12.304328918457031, "global_step": 399994, "epoch": 2380} {"train_loss": -12.448373794555664, "global_step": 399995, "epoch": 2380} {"train_loss": -12.676595687866211, "global_step": 399996, "epoch": 2380} {"train_loss": -12.376526832580566, "global_step": 399997, "epoch": 2380} {"train_loss": -12.56808853149414, "global_step": 399998, "epoch": 2380} {"train_loss": -12.589942932128906, "global_step": 399999, "epoch": 2380} {"train_loss": -12.696503639221191, "global_step": 400000, "epoch": 2380} {"train_loss": -12.273208618164062, "global_step": 400001, "epoch": 2380} {"train_loss": -12.401859283447266, "global_step": 400002, "epoch": 2380} {"train_loss": -12.502557754516602, "global_step": 400003, "epoch": 2380} {"train_loss": -12.443098068237305, "global_step": 400004, "epoch": 2380} {"train_loss": -12.682063102722168, "global_step": 400005, "epoch": 2380} {"train_loss": -12.269609451293945, "global_step": 400006, "epoch": 2380} {"train_loss": -11.862777023088364, "global_step": 400007, "epoch": 2380, "val_loss": 304904.65625, "train_action_mse_error": 0.3225623667240143} {"train_loss": -12.49005126953125, "global_step": 400008, "epoch": 2381} {"train_loss": -12.750781059265137, "global_step": 400009, "epoch": 2381} {"train_loss": -12.449350357055664, "global_step": 400010, "epoch": 2381} {"train_loss": -12.668466567993164, "global_step": 400011, "epoch": 2381} {"train_loss": -12.443078994750977, "global_step": 400012, "epoch": 2381} {"train_loss": -12.517518997192383, "global_step": 400013, "epoch": 2381} {"train_loss": -12.434305191040039, "global_step": 400014, "epoch": 2381} {"train_loss": -12.556015968322754, "global_step": 400015, "epoch": 2381} {"train_loss": -12.494914054870605, "global_step": 400016, "epoch": 2381} {"train_loss": -12.52642822265625, "global_step": 400017, "epoch": 2381} {"train_loss": -12.777458190917969, "global_step": 400018, "epoch": 2381} {"train_loss": -12.755170822143555, "global_step": 400019, "epoch": 2381} {"train_loss": -12.72783088684082, "global_step": 400020, "epoch": 2381} {"train_loss": -12.653144836425781, "global_step": 400021, "epoch": 2381} {"train_loss": -12.75715160369873, "global_step": 400022, "epoch": 2381} {"train_loss": -12.31093692779541, "global_step": 400023, "epoch": 2381} {"train_loss": -12.856972694396973, "global_step": 400024, "epoch": 2381} {"train_loss": -12.760028839111328, "global_step": 400025, "epoch": 2381} {"train_loss": -12.53613567352295, "global_step": 400026, "epoch": 2381} {"train_loss": -12.548983573913574, "global_step": 400027, "epoch": 2381} {"train_loss": -12.995628356933594, "global_step": 400028, "epoch": 2381} {"train_loss": -12.395201683044434, "global_step": 400029, "epoch": 2381} {"train_loss": -12.655618667602539, "global_step": 400030, "epoch": 2381} {"train_loss": -12.864635467529297, "global_step": 400031, "epoch": 2381} {"train_loss": -12.594470977783203, "global_step": 400032, "epoch": 2381} {"train_loss": -12.335153579711914, "global_step": 400033, "epoch": 2381} {"train_loss": -12.767341613769531, "global_step": 400034, "epoch": 2381} {"train_loss": -12.171867370605469, "global_step": 400035, "epoch": 2381} {"train_loss": -12.011585235595703, "global_step": 400036, "epoch": 2381} {"train_loss": -12.701723098754883, "global_step": 400037, "epoch": 2381} {"train_loss": -12.597978591918945, "global_step": 400038, "epoch": 2381} {"train_loss": -12.727031707763672, "global_step": 400039, "epoch": 2381} {"train_loss": -12.798332214355469, "global_step": 400040, "epoch": 2381} {"train_loss": -12.873031616210938, "global_step": 400041, "epoch": 2381} {"train_loss": -12.758086204528809, "global_step": 400042, "epoch": 2381} {"train_loss": -12.59589958190918, "global_step": 400043, "epoch": 2381} {"train_loss": -12.758979797363281, "global_step": 400044, "epoch": 2381} {"train_loss": -12.18936538696289, "global_step": 400045, "epoch": 2381} {"train_loss": -11.782858848571777, "global_step": 400046, "epoch": 2381} {"train_loss": -12.33005428314209, "global_step": 400047, "epoch": 2381} {"train_loss": -12.818290710449219, "global_step": 400048, "epoch": 2381} {"train_loss": -12.253610610961914, "global_step": 400049, "epoch": 2381} {"train_loss": -12.542112350463867, "global_step": 400050, "epoch": 2381} {"train_loss": -12.760581970214844, "global_step": 400051, "epoch": 2381} {"train_loss": -12.425802230834961, "global_step": 400052, "epoch": 2381} {"train_loss": -12.199176788330078, "global_step": 400053, "epoch": 2381} {"train_loss": -11.574009895324707, "global_step": 400054, "epoch": 2381} {"train_loss": -12.168231964111328, "global_step": 400055, "epoch": 2381} {"train_loss": -12.754812240600586, "global_step": 400056, "epoch": 2381} {"train_loss": -12.763883590698242, "global_step": 400057, "epoch": 2381} {"train_loss": -12.312506675720215, "global_step": 400058, "epoch": 2381} {"train_loss": -12.73791790008545, "global_step": 400059, "epoch": 2381} {"train_loss": -12.50378131866455, "global_step": 400060, "epoch": 2381} {"train_loss": -12.885015487670898, "global_step": 400061, "epoch": 2381} {"train_loss": -12.494136810302734, "global_step": 400062, "epoch": 2381} {"train_loss": -12.707290649414062, "global_step": 400063, "epoch": 2381} {"train_loss": -12.751455307006836, "global_step": 400064, "epoch": 2381} {"train_loss": -12.574834823608398, "global_step": 400065, "epoch": 2381} {"train_loss": -12.508581161499023, "global_step": 400066, "epoch": 2381} {"train_loss": -12.727299690246582, "global_step": 400067, "epoch": 2381} {"train_loss": -12.711275100708008, "global_step": 400068, "epoch": 2381} {"train_loss": -12.534619331359863, "global_step": 400069, "epoch": 2381} {"train_loss": -12.729272842407227, "global_step": 400070, "epoch": 2381} {"train_loss": -12.493474006652832, "global_step": 400071, "epoch": 2381} {"train_loss": -12.436027526855469, "global_step": 400072, "epoch": 2381} {"train_loss": -12.777419090270996, "global_step": 400073, "epoch": 2381} {"train_loss": -12.383017539978027, "global_step": 400074, "epoch": 2381} {"train_loss": -11.634050369262695, "global_step": 400075, "epoch": 2381} {"train_loss": -12.201547622680664, "global_step": 400076, "epoch": 2381} {"train_loss": -12.500946998596191, "global_step": 400077, "epoch": 2381} {"train_loss": -11.935615539550781, "global_step": 400078, "epoch": 2381} {"train_loss": -10.90000057220459, "global_step": 400079, "epoch": 2381} {"train_loss": -11.75389289855957, "global_step": 400080, "epoch": 2381} {"train_loss": -9.628301620483398, "global_step": 400081, "epoch": 2381} {"train_loss": -9.917635917663574, "global_step": 400082, "epoch": 2381} {"train_loss": -10.999529838562012, "global_step": 400083, "epoch": 2381} {"train_loss": -8.914878845214844, "global_step": 400084, "epoch": 2381} {"train_loss": -10.16286849975586, "global_step": 400085, "epoch": 2381} {"train_loss": -10.388132095336914, "global_step": 400086, "epoch": 2381} {"train_loss": -10.599939346313477, "global_step": 400087, "epoch": 2381} {"train_loss": -10.760448455810547, "global_step": 400088, "epoch": 2381} {"train_loss": -10.162732124328613, "global_step": 400089, "epoch": 2381} {"train_loss": -9.675529479980469, "global_step": 400090, "epoch": 2381} {"train_loss": -11.333887100219727, "global_step": 400091, "epoch": 2381} {"train_loss": -10.412199020385742, "global_step": 400092, "epoch": 2381} {"train_loss": -10.736650466918945, "global_step": 400093, "epoch": 2381} {"train_loss": -10.839245796203613, "global_step": 400094, "epoch": 2381} {"train_loss": -10.113985061645508, "global_step": 400095, "epoch": 2381} {"train_loss": -11.21122932434082, "global_step": 400096, "epoch": 2381} {"train_loss": -11.187593460083008, "global_step": 400097, "epoch": 2381} {"train_loss": -11.244769096374512, "global_step": 400098, "epoch": 2381} {"train_loss": -11.315537452697754, "global_step": 400099, "epoch": 2381} {"train_loss": -11.439624786376953, "global_step": 400100, "epoch": 2381} {"train_loss": -11.095016479492188, "global_step": 400101, "epoch": 2381} {"train_loss": -12.09487533569336, "global_step": 400102, "epoch": 2381} {"train_loss": -11.683448791503906, "global_step": 400103, "epoch": 2381} {"train_loss": -11.976970672607422, "global_step": 400104, "epoch": 2381} {"train_loss": -11.913700103759766, "global_step": 400105, "epoch": 2381} {"train_loss": -11.7239990234375, "global_step": 400106, "epoch": 2381} {"train_loss": -11.87344741821289, "global_step": 400107, "epoch": 2381} {"train_loss": -10.786928176879883, "global_step": 400108, "epoch": 2381} {"train_loss": -12.29932975769043, "global_step": 400109, "epoch": 2381} {"train_loss": -10.896356582641602, "global_step": 400110, "epoch": 2381} {"train_loss": -11.732240676879883, "global_step": 400111, "epoch": 2381} {"train_loss": -10.783864974975586, "global_step": 400112, "epoch": 2381} {"train_loss": -11.166659355163574, "global_step": 400113, "epoch": 2381} {"train_loss": -11.500371932983398, "global_step": 400114, "epoch": 2381} {"train_loss": -11.326684951782227, "global_step": 400115, "epoch": 2381} {"train_loss": -11.138657569885254, "global_step": 400116, "epoch": 2381} {"train_loss": -11.589820861816406, "global_step": 400117, "epoch": 2381} {"train_loss": -11.610628128051758, "global_step": 400118, "epoch": 2381} {"train_loss": -11.71096420288086, "global_step": 400119, "epoch": 2381} {"train_loss": -11.795395851135254, "global_step": 400120, "epoch": 2381} {"train_loss": -11.533623695373535, "global_step": 400121, "epoch": 2381} {"train_loss": -11.714338302612305, "global_step": 400122, "epoch": 2381} {"train_loss": -11.737635612487793, "global_step": 400123, "epoch": 2381} {"train_loss": -12.165515899658203, "global_step": 400124, "epoch": 2381} {"train_loss": -11.070905685424805, "global_step": 400125, "epoch": 2381} {"train_loss": -12.177521705627441, "global_step": 400126, "epoch": 2381} {"train_loss": -11.332032203674316, "global_step": 400127, "epoch": 2381} {"train_loss": -12.18374252319336, "global_step": 400128, "epoch": 2381} {"train_loss": -11.732627868652344, "global_step": 400129, "epoch": 2381} {"train_loss": -11.89881706237793, "global_step": 400130, "epoch": 2381} {"train_loss": -11.915103912353516, "global_step": 400131, "epoch": 2381} {"train_loss": -12.072548866271973, "global_step": 400132, "epoch": 2381} {"train_loss": -12.068093299865723, "global_step": 400133, "epoch": 2381} {"train_loss": -12.004858016967773, "global_step": 400134, "epoch": 2381} {"train_loss": -12.10107421875, "global_step": 400135, "epoch": 2381} {"train_loss": -11.981054306030273, "global_step": 400136, "epoch": 2381} {"train_loss": -12.108755111694336, "global_step": 400137, "epoch": 2381} {"train_loss": -11.861690521240234, "global_step": 400138, "epoch": 2381} {"train_loss": -11.614830017089844, "global_step": 400139, "epoch": 2381} {"train_loss": -11.243305206298828, "global_step": 400140, "epoch": 2381} {"train_loss": -12.019621849060059, "global_step": 400141, "epoch": 2381} {"train_loss": -11.308357238769531, "global_step": 400142, "epoch": 2381} {"train_loss": -12.400131225585938, "global_step": 400143, "epoch": 2381} {"train_loss": -11.761821746826172, "global_step": 400144, "epoch": 2381} {"train_loss": -12.090261459350586, "global_step": 400145, "epoch": 2381} {"train_loss": -11.873894691467285, "global_step": 400146, "epoch": 2381} {"train_loss": -11.915685653686523, "global_step": 400147, "epoch": 2381} {"train_loss": -12.081954002380371, "global_step": 400148, "epoch": 2381} {"train_loss": -11.932106971740723, "global_step": 400149, "epoch": 2381} {"train_loss": -12.074095726013184, "global_step": 400150, "epoch": 2381} {"train_loss": -12.049174308776855, "global_step": 400151, "epoch": 2381} {"train_loss": -11.82278060913086, "global_step": 400152, "epoch": 2381} {"train_loss": -11.843572616577148, "global_step": 400153, "epoch": 2381} {"train_loss": -11.225695610046387, "global_step": 400154, "epoch": 2381} {"train_loss": -12.045720100402832, "global_step": 400155, "epoch": 2381} {"train_loss": -11.394497871398926, "global_step": 400156, "epoch": 2381} {"train_loss": -12.107749938964844, "global_step": 400157, "epoch": 2381} {"train_loss": -11.915658950805664, "global_step": 400158, "epoch": 2381} {"train_loss": -11.862494468688965, "global_step": 400159, "epoch": 2381} {"train_loss": -11.962642669677734, "global_step": 400160, "epoch": 2381} {"train_loss": -11.948786735534668, "global_step": 400161, "epoch": 2381} {"train_loss": -11.591653823852539, "global_step": 400162, "epoch": 2381} {"train_loss": -11.914712905883789, "global_step": 400163, "epoch": 2381} {"train_loss": -11.81631088256836, "global_step": 400164, "epoch": 2381} {"train_loss": -11.711944580078125, "global_step": 400165, "epoch": 2381} {"train_loss": -12.357047080993652, "global_step": 400166, "epoch": 2381} {"train_loss": -11.750822067260742, "global_step": 400167, "epoch": 2381} {"train_loss": -12.46705436706543, "global_step": 400168, "epoch": 2381} {"train_loss": -12.160748481750488, "global_step": 400169, "epoch": 2381} {"train_loss": -12.18736457824707, "global_step": 400170, "epoch": 2381} {"train_loss": -12.330965042114258, "global_step": 400171, "epoch": 2381} {"train_loss": -12.344991683959961, "global_step": 400172, "epoch": 2381} {"train_loss": -12.246797561645508, "global_step": 400173, "epoch": 2381} {"train_loss": -12.443875312805176, "global_step": 400174, "epoch": 2381} {"train_loss": -11.963319557053703, "global_step": 400175, "epoch": 2381, "val_loss": 303994.1875} {"train_loss": -12.154825210571289, "global_step": 400176, "epoch": 2382} {"train_loss": -12.432256698608398, "global_step": 400177, "epoch": 2382} {"train_loss": -12.064844131469727, "global_step": 400178, "epoch": 2382} {"train_loss": -12.32616901397705, "global_step": 400179, "epoch": 2382} {"train_loss": -12.27924633026123, "global_step": 400180, "epoch": 2382} {"train_loss": -12.102394104003906, "global_step": 400181, "epoch": 2382} {"train_loss": -12.52375602722168, "global_step": 400182, "epoch": 2382} {"train_loss": -12.344966888427734, "global_step": 400183, "epoch": 2382} {"train_loss": -12.22673225402832, "global_step": 400184, "epoch": 2382} {"train_loss": -12.478757858276367, "global_step": 400185, "epoch": 2382} {"train_loss": -12.536675453186035, "global_step": 400186, "epoch": 2382} {"train_loss": -12.445825576782227, "global_step": 400187, "epoch": 2382} {"train_loss": -12.21819019317627, "global_step": 400188, "epoch": 2382} {"train_loss": -12.28614616394043, "global_step": 400189, "epoch": 2382} {"train_loss": -12.590862274169922, "global_step": 400190, "epoch": 2382} {"train_loss": -12.296679496765137, "global_step": 400191, "epoch": 2382} {"train_loss": -12.368940353393555, "global_step": 400192, "epoch": 2382} {"train_loss": -12.57561206817627, "global_step": 400193, "epoch": 2382} {"train_loss": -12.183202743530273, "global_step": 400194, "epoch": 2382} {"train_loss": -12.720727920532227, "global_step": 400195, "epoch": 2382} {"train_loss": -12.692992210388184, "global_step": 400196, "epoch": 2382} {"train_loss": -12.487340927124023, "global_step": 400197, "epoch": 2382} {"train_loss": -12.549888610839844, "global_step": 400198, "epoch": 2382} {"train_loss": -12.417274475097656, "global_step": 400199, "epoch": 2382} {"train_loss": -12.541657447814941, "global_step": 400200, "epoch": 2382} {"train_loss": -12.25629997253418, "global_step": 400201, "epoch": 2382} {"train_loss": -12.535416603088379, "global_step": 400202, "epoch": 2382} {"train_loss": -12.188516616821289, "global_step": 400203, "epoch": 2382} {"train_loss": -12.126646041870117, "global_step": 400204, "epoch": 2382} {"train_loss": -12.299052238464355, "global_step": 400205, "epoch": 2382} {"train_loss": -12.220526695251465, "global_step": 400206, "epoch": 2382} {"train_loss": -11.993807792663574, "global_step": 400207, "epoch": 2382} {"train_loss": -12.190463066101074, "global_step": 400208, "epoch": 2382} {"train_loss": -12.523265838623047, "global_step": 400209, "epoch": 2382} {"train_loss": -11.90129280090332, "global_step": 400210, "epoch": 2382} {"train_loss": -12.439176559448242, "global_step": 400211, "epoch": 2382} {"train_loss": -12.181447982788086, "global_step": 400212, "epoch": 2382} {"train_loss": -12.252768516540527, "global_step": 400213, "epoch": 2382} {"train_loss": -12.075976371765137, "global_step": 400214, "epoch": 2382} {"train_loss": -11.498926162719727, "global_step": 400215, "epoch": 2382} {"train_loss": -12.188441276550293, "global_step": 400216, "epoch": 2382} {"train_loss": -11.678190231323242, "global_step": 400217, "epoch": 2382} {"train_loss": -11.927101135253906, "global_step": 400218, "epoch": 2382} {"train_loss": -12.29885482788086, "global_step": 400219, "epoch": 2382} {"train_loss": -12.505736351013184, "global_step": 400220, "epoch": 2382} {"train_loss": -12.458353042602539, "global_step": 400221, "epoch": 2382} {"train_loss": -12.2890625, "global_step": 400222, "epoch": 2382} {"train_loss": -12.294571876525879, "global_step": 400223, "epoch": 2382} {"train_loss": -12.306232452392578, "global_step": 400224, "epoch": 2382} {"train_loss": -12.407083511352539, "global_step": 400225, "epoch": 2382} {"train_loss": -11.840087890625, "global_step": 400226, "epoch": 2382} {"train_loss": -12.310859680175781, "global_step": 400227, "epoch": 2382} {"train_loss": -11.238662719726562, "global_step": 400228, "epoch": 2382} {"train_loss": -12.32547664642334, "global_step": 400229, "epoch": 2382} {"train_loss": -10.892354965209961, "global_step": 400230, "epoch": 2382} {"train_loss": -12.495697021484375, "global_step": 400231, "epoch": 2382} {"train_loss": -11.764636039733887, "global_step": 400232, "epoch": 2382} {"train_loss": -10.917516708374023, "global_step": 400233, "epoch": 2382} {"train_loss": -12.118423461914062, "global_step": 400234, "epoch": 2382} {"train_loss": -11.180723190307617, "global_step": 400235, "epoch": 2382} {"train_loss": -12.585634231567383, "global_step": 400236, "epoch": 2382} {"train_loss": -11.143585205078125, "global_step": 400237, "epoch": 2382} {"train_loss": -11.805971145629883, "global_step": 400238, "epoch": 2382} {"train_loss": -11.975857734680176, "global_step": 400239, "epoch": 2382} {"train_loss": -10.876143455505371, "global_step": 400240, "epoch": 2382} {"train_loss": -11.74365234375, "global_step": 400241, "epoch": 2382} {"train_loss": -11.692901611328125, "global_step": 400242, "epoch": 2382} {"train_loss": -11.349956512451172, "global_step": 400243, "epoch": 2382} {"train_loss": -12.10987663269043, "global_step": 400244, "epoch": 2382} {"train_loss": -11.163708686828613, "global_step": 400245, "epoch": 2382} {"train_loss": -11.95576286315918, "global_step": 400246, "epoch": 2382} {"train_loss": -11.793574333190918, "global_step": 400247, "epoch": 2382} {"train_loss": -11.646207809448242, "global_step": 400248, "epoch": 2382} {"train_loss": -12.141058921813965, "global_step": 400249, "epoch": 2382} {"train_loss": -11.097450256347656, "global_step": 400250, "epoch": 2382} {"train_loss": -12.547351837158203, "global_step": 400251, "epoch": 2382} {"train_loss": -11.846380233764648, "global_step": 400252, "epoch": 2382} {"train_loss": -11.451875686645508, "global_step": 400253, "epoch": 2382} {"train_loss": -11.663054466247559, "global_step": 400254, "epoch": 2382} {"train_loss": -11.772201538085938, "global_step": 400255, "epoch": 2382} {"train_loss": -12.196404457092285, "global_step": 400256, "epoch": 2382} {"train_loss": -11.134830474853516, "global_step": 400257, "epoch": 2382} {"train_loss": -12.1183500289917, "global_step": 400258, "epoch": 2382} {"train_loss": -11.468778610229492, "global_step": 400259, "epoch": 2382} {"train_loss": -12.044557571411133, "global_step": 400260, "epoch": 2382} {"train_loss": -12.111333847045898, "global_step": 400261, "epoch": 2382} {"train_loss": -12.050687789916992, "global_step": 400262, "epoch": 2382} {"train_loss": -12.02219295501709, "global_step": 400263, "epoch": 2382} {"train_loss": -11.890122413635254, "global_step": 400264, "epoch": 2382} {"train_loss": -11.911455154418945, "global_step": 400265, "epoch": 2382} {"train_loss": -12.221124649047852, "global_step": 400266, "epoch": 2382} {"train_loss": -12.291399002075195, "global_step": 400267, "epoch": 2382} {"train_loss": -12.270471572875977, "global_step": 400268, "epoch": 2382} {"train_loss": -11.950639724731445, "global_step": 400269, "epoch": 2382} {"train_loss": -12.396232604980469, "global_step": 400270, "epoch": 2382} {"train_loss": -12.18022346496582, "global_step": 400271, "epoch": 2382} {"train_loss": -12.111825942993164, "global_step": 400272, "epoch": 2382} {"train_loss": -12.312686920166016, "global_step": 400273, "epoch": 2382} {"train_loss": -12.325843811035156, "global_step": 400274, "epoch": 2382} {"train_loss": -12.460946083068848, "global_step": 400275, "epoch": 2382} {"train_loss": -12.232030868530273, "global_step": 400276, "epoch": 2382} {"train_loss": -12.286134719848633, "global_step": 400277, "epoch": 2382} {"train_loss": -12.077751159667969, "global_step": 400278, "epoch": 2382} {"train_loss": -12.739787101745605, "global_step": 400279, "epoch": 2382} {"train_loss": -12.264482498168945, "global_step": 400280, "epoch": 2382} {"train_loss": -12.31656551361084, "global_step": 400281, "epoch": 2382} {"train_loss": -12.180475234985352, "global_step": 400282, "epoch": 2382} {"train_loss": -12.378368377685547, "global_step": 400283, "epoch": 2382} {"train_loss": -12.469893455505371, "global_step": 400284, "epoch": 2382} {"train_loss": -12.345890998840332, "global_step": 400285, "epoch": 2382} {"train_loss": -12.586410522460938, "global_step": 400286, "epoch": 2382} {"train_loss": -12.130537033081055, "global_step": 400287, "epoch": 2382} {"train_loss": -12.271394729614258, "global_step": 400288, "epoch": 2382} {"train_loss": -12.082365036010742, "global_step": 400289, "epoch": 2382} {"train_loss": -11.44232177734375, "global_step": 400290, "epoch": 2382} {"train_loss": -12.581562995910645, "global_step": 400291, "epoch": 2382} {"train_loss": -12.005829811096191, "global_step": 400292, "epoch": 2382} {"train_loss": -12.053705215454102, "global_step": 400293, "epoch": 2382} {"train_loss": -12.208623886108398, "global_step": 400294, "epoch": 2382} {"train_loss": -11.611603736877441, "global_step": 400295, "epoch": 2382} {"train_loss": -12.55571174621582, "global_step": 400296, "epoch": 2382} {"train_loss": -12.052360534667969, "global_step": 400297, "epoch": 2382} {"train_loss": -12.058853149414062, "global_step": 400298, "epoch": 2382} {"train_loss": -12.327668190002441, "global_step": 400299, "epoch": 2382} {"train_loss": -12.571281433105469, "global_step": 400300, "epoch": 2382} {"train_loss": -12.448795318603516, "global_step": 400301, "epoch": 2382} {"train_loss": -12.651222229003906, "global_step": 400302, "epoch": 2382} {"train_loss": -12.501331329345703, "global_step": 400303, "epoch": 2382} {"train_loss": -12.549065589904785, "global_step": 400304, "epoch": 2382} {"train_loss": -12.580778121948242, "global_step": 400305, "epoch": 2382} {"train_loss": -12.489599227905273, "global_step": 400306, "epoch": 2382} {"train_loss": -12.716279983520508, "global_step": 400307, "epoch": 2382} {"train_loss": -12.481882095336914, "global_step": 400308, "epoch": 2382} {"train_loss": -12.721358299255371, "global_step": 400309, "epoch": 2382} {"train_loss": -12.596946716308594, "global_step": 400310, "epoch": 2382} {"train_loss": -12.549564361572266, "global_step": 400311, "epoch": 2382} {"train_loss": -12.306876182556152, "global_step": 400312, "epoch": 2382} {"train_loss": -12.624029159545898, "global_step": 400313, "epoch": 2382} {"train_loss": -12.581121444702148, "global_step": 400314, "epoch": 2382} {"train_loss": -12.749279975891113, "global_step": 400315, "epoch": 2382} {"train_loss": -12.619860649108887, "global_step": 400316, "epoch": 2382} {"train_loss": -12.70600700378418, "global_step": 400317, "epoch": 2382} {"train_loss": -12.487100601196289, "global_step": 400318, "epoch": 2382} {"train_loss": -12.639045715332031, "global_step": 400319, "epoch": 2382} {"train_loss": -12.41645336151123, "global_step": 400320, "epoch": 2382} {"train_loss": -12.819445610046387, "global_step": 400321, "epoch": 2382} {"train_loss": -12.832550048828125, "global_step": 400322, "epoch": 2382} {"train_loss": -12.62690544128418, "global_step": 400323, "epoch": 2382} {"train_loss": -12.843446731567383, "global_step": 400324, "epoch": 2382} {"train_loss": -12.611833572387695, "global_step": 400325, "epoch": 2382} {"train_loss": -12.768081665039062, "global_step": 400326, "epoch": 2382} {"train_loss": -12.842571258544922, "global_step": 400327, "epoch": 2382} {"train_loss": -12.53273868560791, "global_step": 400328, "epoch": 2382} {"train_loss": -12.403430938720703, "global_step": 400329, "epoch": 2382} {"train_loss": -12.524169921875, "global_step": 400330, "epoch": 2382} {"train_loss": -12.968017578125, "global_step": 400331, "epoch": 2382} {"train_loss": -12.552299499511719, "global_step": 400332, "epoch": 2382} {"train_loss": -12.153711318969727, "global_step": 400333, "epoch": 2382} {"train_loss": -11.709745407104492, "global_step": 400334, "epoch": 2382} {"train_loss": -12.29996109008789, "global_step": 400335, "epoch": 2382} {"train_loss": -12.342522621154785, "global_step": 400336, "epoch": 2382} {"train_loss": -11.437958717346191, "global_step": 400337, "epoch": 2382} {"train_loss": -12.124295234680176, "global_step": 400338, "epoch": 2382} {"train_loss": -12.323158264160156, "global_step": 400339, "epoch": 2382} {"train_loss": -12.567794799804688, "global_step": 400340, "epoch": 2382} {"train_loss": -12.738910675048828, "global_step": 400341, "epoch": 2382} {"train_loss": -12.423662185668945, "global_step": 400342, "epoch": 2382} {"train_loss": -12.21569770290738, "global_step": 400343, "epoch": 2382, "val_loss": 305020.3125} {"train_loss": -11.955034255981445, "global_step": 400344, "epoch": 2383} {"train_loss": -11.873273849487305, "global_step": 400345, "epoch": 2383} {"train_loss": -12.692390441894531, "global_step": 400346, "epoch": 2383} {"train_loss": -12.238728523254395, "global_step": 400347, "epoch": 2383} {"train_loss": -11.840742111206055, "global_step": 400348, "epoch": 2383} {"train_loss": -12.454509735107422, "global_step": 400349, "epoch": 2383} {"train_loss": -12.425537109375, "global_step": 400350, "epoch": 2383} {"train_loss": -11.673834800720215, "global_step": 400351, "epoch": 2383} {"train_loss": -12.489537239074707, "global_step": 400352, "epoch": 2383} {"train_loss": -12.022862434387207, "global_step": 400353, "epoch": 2383} {"train_loss": -12.308921813964844, "global_step": 400354, "epoch": 2383} {"train_loss": -12.13766860961914, "global_step": 400355, "epoch": 2383} {"train_loss": -12.039291381835938, "global_step": 400356, "epoch": 2383} {"train_loss": -11.101631164550781, "global_step": 400357, "epoch": 2383} {"train_loss": -12.355382919311523, "global_step": 400358, "epoch": 2383} {"train_loss": -11.215858459472656, "global_step": 400359, "epoch": 2383} {"train_loss": -11.469194412231445, "global_step": 400360, "epoch": 2383} {"train_loss": -11.850347518920898, "global_step": 400361, "epoch": 2383} {"train_loss": -11.542387008666992, "global_step": 400362, "epoch": 2383} {"train_loss": -11.892462730407715, "global_step": 400363, "epoch": 2383} {"train_loss": -11.828011512756348, "global_step": 400364, "epoch": 2383} {"train_loss": -11.996025085449219, "global_step": 400365, "epoch": 2383} {"train_loss": -11.938265800476074, "global_step": 400366, "epoch": 2383} {"train_loss": -12.214302062988281, "global_step": 400367, "epoch": 2383} {"train_loss": -11.896598815917969, "global_step": 400368, "epoch": 2383} {"train_loss": -12.30790901184082, "global_step": 400369, "epoch": 2383} {"train_loss": -11.84726619720459, "global_step": 400370, "epoch": 2383} {"train_loss": -12.010801315307617, "global_step": 400371, "epoch": 2383} {"train_loss": -12.428232192993164, "global_step": 400372, "epoch": 2383} {"train_loss": -11.996603012084961, "global_step": 400373, "epoch": 2383} {"train_loss": -12.561429977416992, "global_step": 400374, "epoch": 2383} {"train_loss": -12.059042930603027, "global_step": 400375, "epoch": 2383} {"train_loss": -12.43023681640625, "global_step": 400376, "epoch": 2383} {"train_loss": -12.661310195922852, "global_step": 400377, "epoch": 2383} {"train_loss": -12.042221069335938, "global_step": 400378, "epoch": 2383} {"train_loss": -11.827766418457031, "global_step": 400379, "epoch": 2383} {"train_loss": -11.722660064697266, "global_step": 400380, "epoch": 2383} {"train_loss": -12.499823570251465, "global_step": 400381, "epoch": 2383} {"train_loss": -12.013189315795898, "global_step": 400382, "epoch": 2383} {"train_loss": -12.19343090057373, "global_step": 400383, "epoch": 2383} {"train_loss": -12.488744735717773, "global_step": 400384, "epoch": 2383} {"train_loss": -12.313098907470703, "global_step": 400385, "epoch": 2383} {"train_loss": -11.517992973327637, "global_step": 400386, "epoch": 2383} {"train_loss": -11.732820510864258, "global_step": 400387, "epoch": 2383} {"train_loss": -12.060733795166016, "global_step": 400388, "epoch": 2383} {"train_loss": -12.11046028137207, "global_step": 400389, "epoch": 2383} {"train_loss": -11.754786491394043, "global_step": 400390, "epoch": 2383} {"train_loss": -11.96059799194336, "global_step": 400391, "epoch": 2383} {"train_loss": -12.208314895629883, "global_step": 400392, "epoch": 2383} {"train_loss": -12.047195434570312, "global_step": 400393, "epoch": 2383} {"train_loss": -11.910604476928711, "global_step": 400394, "epoch": 2383} {"train_loss": -12.293257713317871, "global_step": 400395, "epoch": 2383} {"train_loss": -11.739263534545898, "global_step": 400396, "epoch": 2383} {"train_loss": -11.686323165893555, "global_step": 400397, "epoch": 2383} {"train_loss": -11.7430419921875, "global_step": 400398, "epoch": 2383} {"train_loss": -12.12368392944336, "global_step": 400399, "epoch": 2383} {"train_loss": -11.808185577392578, "global_step": 400400, "epoch": 2383} {"train_loss": -11.944753646850586, "global_step": 400401, "epoch": 2383} {"train_loss": -11.010196685791016, "global_step": 400402, "epoch": 2383} {"train_loss": -12.395743370056152, "global_step": 400403, "epoch": 2383} {"train_loss": -10.964600563049316, "global_step": 400404, "epoch": 2383} {"train_loss": -10.405838966369629, "global_step": 400405, "epoch": 2383} {"train_loss": -12.236987113952637, "global_step": 400406, "epoch": 2383} {"train_loss": -11.459753036499023, "global_step": 400407, "epoch": 2383} {"train_loss": -11.127963066101074, "global_step": 400408, "epoch": 2383} {"train_loss": -11.730645179748535, "global_step": 400409, "epoch": 2383} {"train_loss": -10.937040328979492, "global_step": 400410, "epoch": 2383} {"train_loss": -10.965252876281738, "global_step": 400411, "epoch": 2383} {"train_loss": -12.000846862792969, "global_step": 400412, "epoch": 2383} {"train_loss": -10.959388732910156, "global_step": 400413, "epoch": 2383} {"train_loss": -11.737398147583008, "global_step": 400414, "epoch": 2383} {"train_loss": -11.861732482910156, "global_step": 400415, "epoch": 2383} {"train_loss": -11.582975387573242, "global_step": 400416, "epoch": 2383} {"train_loss": -11.697504043579102, "global_step": 400417, "epoch": 2383} {"train_loss": -10.757074356079102, "global_step": 400418, "epoch": 2383} {"train_loss": -10.870840072631836, "global_step": 400419, "epoch": 2383} {"train_loss": -11.837251663208008, "global_step": 400420, "epoch": 2383} {"train_loss": -10.922855377197266, "global_step": 400421, "epoch": 2383} {"train_loss": -11.668285369873047, "global_step": 400422, "epoch": 2383} {"train_loss": -11.920913696289062, "global_step": 400423, "epoch": 2383} {"train_loss": -11.990065574645996, "global_step": 400424, "epoch": 2383} {"train_loss": -12.08304214477539, "global_step": 400425, "epoch": 2383} {"train_loss": -12.11117935180664, "global_step": 400426, "epoch": 2383} {"train_loss": -12.135534286499023, "global_step": 400427, "epoch": 2383} {"train_loss": -11.46670913696289, "global_step": 400428, "epoch": 2383} {"train_loss": -11.99484634399414, "global_step": 400429, "epoch": 2383} {"train_loss": -11.915794372558594, "global_step": 400430, "epoch": 2383} {"train_loss": -12.072266578674316, "global_step": 400431, "epoch": 2383} {"train_loss": -11.786758422851562, "global_step": 400432, "epoch": 2383} {"train_loss": -11.657866477966309, "global_step": 400433, "epoch": 2383} {"train_loss": -11.732481956481934, "global_step": 400434, "epoch": 2383} {"train_loss": -11.685880661010742, "global_step": 400435, "epoch": 2383} {"train_loss": -12.018789291381836, "global_step": 400436, "epoch": 2383} {"train_loss": -11.430416107177734, "global_step": 400437, "epoch": 2383} {"train_loss": -11.961437225341797, "global_step": 400438, "epoch": 2383} {"train_loss": -11.771507263183594, "global_step": 400439, "epoch": 2383} {"train_loss": -12.132929801940918, "global_step": 400440, "epoch": 2383} {"train_loss": -12.04318618774414, "global_step": 400441, "epoch": 2383} {"train_loss": -12.018476486206055, "global_step": 400442, "epoch": 2383} {"train_loss": -12.152143478393555, "global_step": 400443, "epoch": 2383} {"train_loss": -11.647134780883789, "global_step": 400444, "epoch": 2383} {"train_loss": -12.11735725402832, "global_step": 400445, "epoch": 2383} {"train_loss": -12.234720230102539, "global_step": 400446, "epoch": 2383} {"train_loss": -12.081778526306152, "global_step": 400447, "epoch": 2383} {"train_loss": -12.26902961730957, "global_step": 400448, "epoch": 2383} {"train_loss": -12.519004821777344, "global_step": 400449, "epoch": 2383} {"train_loss": -12.164657592773438, "global_step": 400450, "epoch": 2383} {"train_loss": -12.152589797973633, "global_step": 400451, "epoch": 2383} {"train_loss": -12.392033576965332, "global_step": 400452, "epoch": 2383} {"train_loss": -12.294761657714844, "global_step": 400453, "epoch": 2383} {"train_loss": -12.712696075439453, "global_step": 400454, "epoch": 2383} {"train_loss": -12.411852836608887, "global_step": 400455, "epoch": 2383} {"train_loss": -12.402507781982422, "global_step": 400456, "epoch": 2383} {"train_loss": -12.565841674804688, "global_step": 400457, "epoch": 2383} {"train_loss": -12.59191608428955, "global_step": 400458, "epoch": 2383} {"train_loss": -12.388148307800293, "global_step": 400459, "epoch": 2383} {"train_loss": -12.550708770751953, "global_step": 400460, "epoch": 2383} {"train_loss": -12.562958717346191, "global_step": 400461, "epoch": 2383} {"train_loss": -12.489934921264648, "global_step": 400462, "epoch": 2383} {"train_loss": -12.617910385131836, "global_step": 400463, "epoch": 2383} {"train_loss": -12.631643295288086, "global_step": 400464, "epoch": 2383} {"train_loss": -12.38763427734375, "global_step": 400465, "epoch": 2383} {"train_loss": -12.774811744689941, "global_step": 400466, "epoch": 2383} {"train_loss": -12.59341812133789, "global_step": 400467, "epoch": 2383} {"train_loss": -12.486948013305664, "global_step": 400468, "epoch": 2383} {"train_loss": -12.716100692749023, "global_step": 400469, "epoch": 2383} {"train_loss": -12.579706192016602, "global_step": 400470, "epoch": 2383} {"train_loss": -12.532037734985352, "global_step": 400471, "epoch": 2383} {"train_loss": -12.669346809387207, "global_step": 400472, "epoch": 2383} {"train_loss": -12.539103507995605, "global_step": 400473, "epoch": 2383} {"train_loss": -12.640286445617676, "global_step": 400474, "epoch": 2383} {"train_loss": -12.60448932647705, "global_step": 400475, "epoch": 2383} {"train_loss": -12.646659851074219, "global_step": 400476, "epoch": 2383} {"train_loss": -12.615097999572754, "global_step": 400477, "epoch": 2383} {"train_loss": -12.604944229125977, "global_step": 400478, "epoch": 2383} {"train_loss": -12.721235275268555, "global_step": 400479, "epoch": 2383} {"train_loss": -12.807461738586426, "global_step": 400480, "epoch": 2383} {"train_loss": -12.804879188537598, "global_step": 400481, "epoch": 2383} {"train_loss": -12.735799789428711, "global_step": 400482, "epoch": 2383} {"train_loss": -12.6529541015625, "global_step": 400483, "epoch": 2383} {"train_loss": -12.558855056762695, "global_step": 400484, "epoch": 2383} {"train_loss": -12.69861888885498, "global_step": 400485, "epoch": 2383} {"train_loss": -12.480291366577148, "global_step": 400486, "epoch": 2383} {"train_loss": -12.770769119262695, "global_step": 400487, "epoch": 2383} {"train_loss": -12.614786148071289, "global_step": 400488, "epoch": 2383} {"train_loss": -12.641947746276855, "global_step": 400489, "epoch": 2383} {"train_loss": -12.652883529663086, "global_step": 400490, "epoch": 2383} {"train_loss": -12.519405364990234, "global_step": 400491, "epoch": 2383} {"train_loss": -12.502925872802734, "global_step": 400492, "epoch": 2383} {"train_loss": -12.341355323791504, "global_step": 400493, "epoch": 2383} {"train_loss": -12.807550430297852, "global_step": 400494, "epoch": 2383} {"train_loss": -12.354158401489258, "global_step": 400495, "epoch": 2383} {"train_loss": -12.272124290466309, "global_step": 400496, "epoch": 2383} {"train_loss": -12.656082153320312, "global_step": 400497, "epoch": 2383} {"train_loss": -12.333311080932617, "global_step": 400498, "epoch": 2383} {"train_loss": -12.521109580993652, "global_step": 400499, "epoch": 2383} {"train_loss": -12.329381942749023, "global_step": 400500, "epoch": 2383} {"train_loss": -12.42109489440918, "global_step": 400501, "epoch": 2383} {"train_loss": -12.46255111694336, "global_step": 400502, "epoch": 2383} {"train_loss": -12.638250350952148, "global_step": 400503, "epoch": 2383} {"train_loss": -12.670793533325195, "global_step": 400504, "epoch": 2383} {"train_loss": -12.807258605957031, "global_step": 400505, "epoch": 2383} {"train_loss": -12.845640182495117, "global_step": 400506, "epoch": 2383} {"train_loss": -12.8714599609375, "global_step": 400507, "epoch": 2383} {"train_loss": -12.643113136291504, "global_step": 400508, "epoch": 2383} {"train_loss": -13.041427612304688, "global_step": 400509, "epoch": 2383} {"train_loss": -12.381359100341797, "global_step": 400510, "epoch": 2383} {"train_loss": -12.137438331331525, "global_step": 400511, "epoch": 2383, "val_loss": 304158.15625} {"train_loss": -12.284727096557617, "global_step": 400512, "epoch": 2384} {"train_loss": -12.174443244934082, "global_step": 400513, "epoch": 2384} {"train_loss": -12.473137855529785, "global_step": 400514, "epoch": 2384} {"train_loss": -11.944244384765625, "global_step": 400515, "epoch": 2384} {"train_loss": -11.704854965209961, "global_step": 400516, "epoch": 2384} {"train_loss": -12.091388702392578, "global_step": 400517, "epoch": 2384} {"train_loss": -12.418634414672852, "global_step": 400518, "epoch": 2384} {"train_loss": -12.398807525634766, "global_step": 400519, "epoch": 2384} {"train_loss": -11.684575080871582, "global_step": 400520, "epoch": 2384} {"train_loss": -10.185108184814453, "global_step": 400521, "epoch": 2384} {"train_loss": -10.775032043457031, "global_step": 400522, "epoch": 2384} {"train_loss": -11.915165901184082, "global_step": 400523, "epoch": 2384} {"train_loss": -11.618602752685547, "global_step": 400524, "epoch": 2384} {"train_loss": -11.066808700561523, "global_step": 400525, "epoch": 2384} {"train_loss": -12.023447036743164, "global_step": 400526, "epoch": 2384} {"train_loss": -11.206096649169922, "global_step": 400527, "epoch": 2384} {"train_loss": -12.137138366699219, "global_step": 400528, "epoch": 2384} {"train_loss": -11.551352500915527, "global_step": 400529, "epoch": 2384} {"train_loss": -11.41482162475586, "global_step": 400530, "epoch": 2384} {"train_loss": -11.040771484375, "global_step": 400531, "epoch": 2384} {"train_loss": -10.17568302154541, "global_step": 400532, "epoch": 2384} {"train_loss": -11.558807373046875, "global_step": 400533, "epoch": 2384} {"train_loss": -12.21401596069336, "global_step": 400534, "epoch": 2384} {"train_loss": -10.788398742675781, "global_step": 400535, "epoch": 2384} {"train_loss": -11.177250862121582, "global_step": 400536, "epoch": 2384} {"train_loss": -11.911459922790527, "global_step": 400537, "epoch": 2384} {"train_loss": -11.11613655090332, "global_step": 400538, "epoch": 2384} {"train_loss": -11.138347625732422, "global_step": 400539, "epoch": 2384} {"train_loss": -11.03587532043457, "global_step": 400540, "epoch": 2384} {"train_loss": -11.041336059570312, "global_step": 400541, "epoch": 2384} {"train_loss": -11.35906982421875, "global_step": 400542, "epoch": 2384} {"train_loss": -11.969245910644531, "global_step": 400543, "epoch": 2384} {"train_loss": -11.853334426879883, "global_step": 400544, "epoch": 2384} {"train_loss": -11.46493148803711, "global_step": 400545, "epoch": 2384} {"train_loss": -12.089563369750977, "global_step": 400546, "epoch": 2384} {"train_loss": -12.27791976928711, "global_step": 400547, "epoch": 2384} {"train_loss": -11.687475204467773, "global_step": 400548, "epoch": 2384} {"train_loss": -12.322135925292969, "global_step": 400549, "epoch": 2384} {"train_loss": -11.68821907043457, "global_step": 400550, "epoch": 2384} {"train_loss": -12.043059349060059, "global_step": 400551, "epoch": 2384} {"train_loss": -11.795145034790039, "global_step": 400552, "epoch": 2384} {"train_loss": -12.199070930480957, "global_step": 400553, "epoch": 2384} {"train_loss": -11.954020500183105, "global_step": 400554, "epoch": 2384} {"train_loss": -12.155795097351074, "global_step": 400555, "epoch": 2384} {"train_loss": -12.175983428955078, "global_step": 400556, "epoch": 2384} {"train_loss": -12.038554191589355, "global_step": 400557, "epoch": 2384} {"train_loss": -12.48861312866211, "global_step": 400558, "epoch": 2384} {"train_loss": -12.211349487304688, "global_step": 400559, "epoch": 2384} {"train_loss": -11.999792098999023, "global_step": 400560, "epoch": 2384} {"train_loss": -12.437614440917969, "global_step": 400561, "epoch": 2384} {"train_loss": -12.240217208862305, "global_step": 400562, "epoch": 2384} {"train_loss": -12.161530494689941, "global_step": 400563, "epoch": 2384} {"train_loss": -12.420012474060059, "global_step": 400564, "epoch": 2384} {"train_loss": -12.127118110656738, "global_step": 400565, "epoch": 2384} {"train_loss": -12.601062774658203, "global_step": 400566, "epoch": 2384} {"train_loss": -12.005693435668945, "global_step": 400567, "epoch": 2384} {"train_loss": -12.508304595947266, "global_step": 400568, "epoch": 2384} {"train_loss": -12.184623718261719, "global_step": 400569, "epoch": 2384} {"train_loss": -12.034576416015625, "global_step": 400570, "epoch": 2384} {"train_loss": -12.717122077941895, "global_step": 400571, "epoch": 2384} {"train_loss": -12.209701538085938, "global_step": 400572, "epoch": 2384} {"train_loss": -12.494793891906738, "global_step": 400573, "epoch": 2384} {"train_loss": -12.438623428344727, "global_step": 400574, "epoch": 2384} {"train_loss": -12.497686386108398, "global_step": 400575, "epoch": 2384} {"train_loss": -12.271577835083008, "global_step": 400576, "epoch": 2384} {"train_loss": -12.454429626464844, "global_step": 400577, "epoch": 2384} {"train_loss": -12.576589584350586, "global_step": 400578, "epoch": 2384} {"train_loss": -12.043585777282715, "global_step": 400579, "epoch": 2384} {"train_loss": -12.209554672241211, "global_step": 400580, "epoch": 2384} {"train_loss": -12.000722885131836, "global_step": 400581, "epoch": 2384} {"train_loss": -12.361080169677734, "global_step": 400582, "epoch": 2384} {"train_loss": -12.467721939086914, "global_step": 400583, "epoch": 2384} {"train_loss": -12.097604751586914, "global_step": 400584, "epoch": 2384} {"train_loss": -12.103570938110352, "global_step": 400585, "epoch": 2384} {"train_loss": -11.459012985229492, "global_step": 400586, "epoch": 2384} {"train_loss": -12.310325622558594, "global_step": 400587, "epoch": 2384} {"train_loss": -12.074808120727539, "global_step": 400588, "epoch": 2384} {"train_loss": -11.380197525024414, "global_step": 400589, "epoch": 2384} {"train_loss": -12.20517349243164, "global_step": 400590, "epoch": 2384} {"train_loss": -11.433578491210938, "global_step": 400591, "epoch": 2384} {"train_loss": -12.437995910644531, "global_step": 400592, "epoch": 2384} {"train_loss": -11.666633605957031, "global_step": 400593, "epoch": 2384} {"train_loss": -11.797130584716797, "global_step": 400594, "epoch": 2384} {"train_loss": -12.279230117797852, "global_step": 400595, "epoch": 2384} {"train_loss": -11.762796401977539, "global_step": 400596, "epoch": 2384} {"train_loss": -11.559813499450684, "global_step": 400597, "epoch": 2384} {"train_loss": -11.995314598083496, "global_step": 400598, "epoch": 2384} {"train_loss": -11.491442680358887, "global_step": 400599, "epoch": 2384} {"train_loss": -12.067487716674805, "global_step": 400600, "epoch": 2384} {"train_loss": -11.702680587768555, "global_step": 400601, "epoch": 2384} {"train_loss": -11.959037780761719, "global_step": 400602, "epoch": 2384} {"train_loss": -11.9048490524292, "global_step": 400603, "epoch": 2384} {"train_loss": -12.183849334716797, "global_step": 400604, "epoch": 2384} {"train_loss": -12.270275115966797, "global_step": 400605, "epoch": 2384} {"train_loss": -12.14877986907959, "global_step": 400606, "epoch": 2384} {"train_loss": -12.029579162597656, "global_step": 400607, "epoch": 2384} {"train_loss": -12.516780853271484, "global_step": 400608, "epoch": 2384} {"train_loss": -12.208917617797852, "global_step": 400609, "epoch": 2384} {"train_loss": -12.581201553344727, "global_step": 400610, "epoch": 2384} {"train_loss": -11.986478805541992, "global_step": 400611, "epoch": 2384} {"train_loss": -12.080812454223633, "global_step": 400612, "epoch": 2384} {"train_loss": -12.146550178527832, "global_step": 400613, "epoch": 2384} {"train_loss": -11.6770601272583, "global_step": 400614, "epoch": 2384} {"train_loss": -12.300138473510742, "global_step": 400615, "epoch": 2384} {"train_loss": -11.249946594238281, "global_step": 400616, "epoch": 2384} {"train_loss": -12.500387191772461, "global_step": 400617, "epoch": 2384} {"train_loss": -11.070211410522461, "global_step": 400618, "epoch": 2384} {"train_loss": -11.982428550720215, "global_step": 400619, "epoch": 2384} {"train_loss": -11.623678207397461, "global_step": 400620, "epoch": 2384} {"train_loss": -12.054695129394531, "global_step": 400621, "epoch": 2384} {"train_loss": -12.411601066589355, "global_step": 400622, "epoch": 2384} {"train_loss": -12.011021614074707, "global_step": 400623, "epoch": 2384} {"train_loss": -12.558858871459961, "global_step": 400624, "epoch": 2384} {"train_loss": -12.114336967468262, "global_step": 400625, "epoch": 2384} {"train_loss": -12.48324203491211, "global_step": 400626, "epoch": 2384} {"train_loss": -11.977472305297852, "global_step": 400627, "epoch": 2384} {"train_loss": -12.412025451660156, "global_step": 400628, "epoch": 2384} {"train_loss": -12.186269760131836, "global_step": 400629, "epoch": 2384} {"train_loss": -12.234161376953125, "global_step": 400630, "epoch": 2384} {"train_loss": -12.3731689453125, "global_step": 400631, "epoch": 2384} {"train_loss": -12.009977340698242, "global_step": 400632, "epoch": 2384} {"train_loss": -12.351764678955078, "global_step": 400633, "epoch": 2384} {"train_loss": -12.209243774414062, "global_step": 400634, "epoch": 2384} {"train_loss": -12.154157638549805, "global_step": 400635, "epoch": 2384} {"train_loss": -12.34764289855957, "global_step": 400636, "epoch": 2384} {"train_loss": -12.32580852508545, "global_step": 400637, "epoch": 2384} {"train_loss": -12.429342269897461, "global_step": 400638, "epoch": 2384} {"train_loss": -12.354124069213867, "global_step": 400639, "epoch": 2384} {"train_loss": -12.316264152526855, "global_step": 400640, "epoch": 2384} {"train_loss": -12.257484436035156, "global_step": 400641, "epoch": 2384} {"train_loss": -11.759332656860352, "global_step": 400642, "epoch": 2384} {"train_loss": -12.286715507507324, "global_step": 400643, "epoch": 2384} {"train_loss": -11.929841041564941, "global_step": 400644, "epoch": 2384} {"train_loss": -11.64786148071289, "global_step": 400645, "epoch": 2384} {"train_loss": -11.818140029907227, "global_step": 400646, "epoch": 2384} {"train_loss": -12.087310791015625, "global_step": 400647, "epoch": 2384} {"train_loss": -11.31812858581543, "global_step": 400648, "epoch": 2384} {"train_loss": -11.68037223815918, "global_step": 400649, "epoch": 2384} {"train_loss": -11.512619018554688, "global_step": 400650, "epoch": 2384} {"train_loss": -11.48177719116211, "global_step": 400651, "epoch": 2384} {"train_loss": -11.669963836669922, "global_step": 400652, "epoch": 2384} {"train_loss": -11.739425659179688, "global_step": 400653, "epoch": 2384} {"train_loss": -11.577571868896484, "global_step": 400654, "epoch": 2384} {"train_loss": -11.926584243774414, "global_step": 400655, "epoch": 2384} {"train_loss": -11.711216926574707, "global_step": 400656, "epoch": 2384} {"train_loss": -12.33941650390625, "global_step": 400657, "epoch": 2384} {"train_loss": -11.524094581604004, "global_step": 400658, "epoch": 2384} {"train_loss": -11.973381996154785, "global_step": 400659, "epoch": 2384} {"train_loss": -11.559017181396484, "global_step": 400660, "epoch": 2384} {"train_loss": -12.190570831298828, "global_step": 400661, "epoch": 2384} {"train_loss": -11.738727569580078, "global_step": 400662, "epoch": 2384} {"train_loss": -12.457318305969238, "global_step": 400663, "epoch": 2384} {"train_loss": -11.849245071411133, "global_step": 400664, "epoch": 2384} {"train_loss": -12.191207885742188, "global_step": 400665, "epoch": 2384} {"train_loss": -11.877538681030273, "global_step": 400666, "epoch": 2384} {"train_loss": -12.424751281738281, "global_step": 400667, "epoch": 2384} {"train_loss": -12.179492950439453, "global_step": 400668, "epoch": 2384} {"train_loss": -11.925636291503906, "global_step": 400669, "epoch": 2384} {"train_loss": -12.339790344238281, "global_step": 400670, "epoch": 2384} {"train_loss": -11.96927261352539, "global_step": 400671, "epoch": 2384} {"train_loss": -12.361841201782227, "global_step": 400672, "epoch": 2384} {"train_loss": -12.589594841003418, "global_step": 400673, "epoch": 2384} {"train_loss": -12.38273811340332, "global_step": 400674, "epoch": 2384} {"train_loss": -12.253632545471191, "global_step": 400675, "epoch": 2384} {"train_loss": -12.713225364685059, "global_step": 400676, "epoch": 2384} {"train_loss": -12.408416748046875, "global_step": 400677, "epoch": 2384} {"train_loss": -12.408130645751953, "global_step": 400678, "epoch": 2384} {"train_loss": -11.986530406134468, "global_step": 400679, "epoch": 2384, "val_loss": 303762.09375} {"train_loss": -12.252555847167969, "global_step": 400680, "epoch": 2385} {"train_loss": -12.504159927368164, "global_step": 400681, "epoch": 2385} {"train_loss": -12.131893157958984, "global_step": 400682, "epoch": 2385} {"train_loss": -12.44618034362793, "global_step": 400683, "epoch": 2385} {"train_loss": -12.233736038208008, "global_step": 400684, "epoch": 2385} {"train_loss": -12.120307922363281, "global_step": 400685, "epoch": 2385} {"train_loss": -12.39437198638916, "global_step": 400686, "epoch": 2385} {"train_loss": -12.211441040039062, "global_step": 400687, "epoch": 2385} {"train_loss": -12.318286895751953, "global_step": 400688, "epoch": 2385} {"train_loss": -12.516237258911133, "global_step": 400689, "epoch": 2385} {"train_loss": -12.355005264282227, "global_step": 400690, "epoch": 2385} {"train_loss": -12.199262619018555, "global_step": 400691, "epoch": 2385} {"train_loss": -12.068037986755371, "global_step": 400692, "epoch": 2385} {"train_loss": -12.846891403198242, "global_step": 400693, "epoch": 2385} {"train_loss": -12.108915328979492, "global_step": 400694, "epoch": 2385} {"train_loss": -12.624090194702148, "global_step": 400695, "epoch": 2385} {"train_loss": -12.365045547485352, "global_step": 400696, "epoch": 2385} {"train_loss": -12.50368595123291, "global_step": 400697, "epoch": 2385} {"train_loss": -12.658239364624023, "global_step": 400698, "epoch": 2385} {"train_loss": -12.56556224822998, "global_step": 400699, "epoch": 2385} {"train_loss": -12.446802139282227, "global_step": 400700, "epoch": 2385} {"train_loss": -12.724939346313477, "global_step": 400701, "epoch": 2385} {"train_loss": -12.468888282775879, "global_step": 400702, "epoch": 2385} {"train_loss": -12.355079650878906, "global_step": 400703, "epoch": 2385} {"train_loss": -12.496137619018555, "global_step": 400704, "epoch": 2385} {"train_loss": -12.519500732421875, "global_step": 400705, "epoch": 2385} {"train_loss": -12.681013107299805, "global_step": 400706, "epoch": 2385} {"train_loss": -12.92522144317627, "global_step": 400707, "epoch": 2385} {"train_loss": -12.771858215332031, "global_step": 400708, "epoch": 2385} {"train_loss": -12.652668952941895, "global_step": 400709, "epoch": 2385} {"train_loss": -12.558526992797852, "global_step": 400710, "epoch": 2385} {"train_loss": -12.752490997314453, "global_step": 400711, "epoch": 2385} {"train_loss": -12.580080032348633, "global_step": 400712, "epoch": 2385} {"train_loss": -12.746343612670898, "global_step": 400713, "epoch": 2385} {"train_loss": -12.730684280395508, "global_step": 400714, "epoch": 2385} {"train_loss": -12.736305236816406, "global_step": 400715, "epoch": 2385} {"train_loss": -12.587871551513672, "global_step": 400716, "epoch": 2385} {"train_loss": -12.735115051269531, "global_step": 400717, "epoch": 2385} {"train_loss": -12.667272567749023, "global_step": 400718, "epoch": 2385} {"train_loss": -12.709859848022461, "global_step": 400719, "epoch": 2385} {"train_loss": -12.715224266052246, "global_step": 400720, "epoch": 2385} {"train_loss": -12.353034019470215, "global_step": 400721, "epoch": 2385} {"train_loss": -12.344467163085938, "global_step": 400722, "epoch": 2385} {"train_loss": -12.443344116210938, "global_step": 400723, "epoch": 2385} {"train_loss": -12.365472793579102, "global_step": 400724, "epoch": 2385} {"train_loss": -12.370980262756348, "global_step": 400725, "epoch": 2385} {"train_loss": -11.352212905883789, "global_step": 400726, "epoch": 2385} {"train_loss": -10.508829116821289, "global_step": 400727, "epoch": 2385} {"train_loss": -11.493313789367676, "global_step": 400728, "epoch": 2385} {"train_loss": -10.532577514648438, "global_step": 400729, "epoch": 2385} {"train_loss": -9.989595413208008, "global_step": 400730, "epoch": 2385} {"train_loss": -11.835699081420898, "global_step": 400731, "epoch": 2385} {"train_loss": -8.20230484008789, "global_step": 400732, "epoch": 2385} {"train_loss": -10.658174514770508, "global_step": 400733, "epoch": 2385} {"train_loss": -9.521873474121094, "global_step": 400734, "epoch": 2385} {"train_loss": -11.183753967285156, "global_step": 400735, "epoch": 2385} {"train_loss": -9.02036190032959, "global_step": 400736, "epoch": 2385} {"train_loss": -10.022573471069336, "global_step": 400737, "epoch": 2385} {"train_loss": -10.775464057922363, "global_step": 400738, "epoch": 2385} {"train_loss": -10.742918014526367, "global_step": 400739, "epoch": 2385} {"train_loss": -8.693302154541016, "global_step": 400740, "epoch": 2385} {"train_loss": -11.706125259399414, "global_step": 400741, "epoch": 2385} {"train_loss": -8.576142311096191, "global_step": 400742, "epoch": 2385} {"train_loss": -11.695423126220703, "global_step": 400743, "epoch": 2385} {"train_loss": -10.719084739685059, "global_step": 400744, "epoch": 2385} {"train_loss": -11.167478561401367, "global_step": 400745, "epoch": 2385} {"train_loss": -10.520463943481445, "global_step": 400746, "epoch": 2385} {"train_loss": -10.670753479003906, "global_step": 400747, "epoch": 2385} {"train_loss": -11.216732025146484, "global_step": 400748, "epoch": 2385} {"train_loss": -11.457098007202148, "global_step": 400749, "epoch": 2385} {"train_loss": -11.490737915039062, "global_step": 400750, "epoch": 2385} {"train_loss": -11.860849380493164, "global_step": 400751, "epoch": 2385} {"train_loss": -11.933860778808594, "global_step": 400752, "epoch": 2385} {"train_loss": -11.553272247314453, "global_step": 400753, "epoch": 2385} {"train_loss": -12.034566879272461, "global_step": 400754, "epoch": 2385} {"train_loss": -11.624231338500977, "global_step": 400755, "epoch": 2385} {"train_loss": -12.192081451416016, "global_step": 400756, "epoch": 2385} {"train_loss": -11.873509407043457, "global_step": 400757, "epoch": 2385} {"train_loss": -12.25366497039795, "global_step": 400758, "epoch": 2385} {"train_loss": -11.955097198486328, "global_step": 400759, "epoch": 2385} {"train_loss": -11.619030952453613, "global_step": 400760, "epoch": 2385} {"train_loss": -12.149589538574219, "global_step": 400761, "epoch": 2385} {"train_loss": -12.04025650024414, "global_step": 400762, "epoch": 2385} {"train_loss": -12.261438369750977, "global_step": 400763, "epoch": 2385} {"train_loss": -12.326774597167969, "global_step": 400764, "epoch": 2385} {"train_loss": -12.131175994873047, "global_step": 400765, "epoch": 2385} {"train_loss": -11.871926307678223, "global_step": 400766, "epoch": 2385} {"train_loss": -12.190664291381836, "global_step": 400767, "epoch": 2385} {"train_loss": -12.552127838134766, "global_step": 400768, "epoch": 2385} {"train_loss": -12.29659366607666, "global_step": 400769, "epoch": 2385} {"train_loss": -12.442089080810547, "global_step": 400770, "epoch": 2385} {"train_loss": -12.227782249450684, "global_step": 400771, "epoch": 2385} {"train_loss": -12.093622207641602, "global_step": 400772, "epoch": 2385} {"train_loss": -12.439863204956055, "global_step": 400773, "epoch": 2385} {"train_loss": -12.474739074707031, "global_step": 400774, "epoch": 2385} {"train_loss": -12.540653228759766, "global_step": 400775, "epoch": 2385} {"train_loss": -12.52910041809082, "global_step": 400776, "epoch": 2385} {"train_loss": -12.40506362915039, "global_step": 400777, "epoch": 2385} {"train_loss": -12.458454132080078, "global_step": 400778, "epoch": 2385} {"train_loss": -12.528995513916016, "global_step": 400779, "epoch": 2385} {"train_loss": -12.286080360412598, "global_step": 400780, "epoch": 2385} {"train_loss": -12.690265655517578, "global_step": 400781, "epoch": 2385} {"train_loss": -12.451164245605469, "global_step": 400782, "epoch": 2385} {"train_loss": -12.76453971862793, "global_step": 400783, "epoch": 2385} {"train_loss": -12.101119995117188, "global_step": 400784, "epoch": 2385} {"train_loss": -12.610137939453125, "global_step": 400785, "epoch": 2385} {"train_loss": -12.45457935333252, "global_step": 400786, "epoch": 2385} {"train_loss": -12.56355094909668, "global_step": 400787, "epoch": 2385} {"train_loss": -12.655430793762207, "global_step": 400788, "epoch": 2385} {"train_loss": -12.521678924560547, "global_step": 400789, "epoch": 2385} {"train_loss": -12.537223815917969, "global_step": 400790, "epoch": 2385} {"train_loss": -12.618058204650879, "global_step": 400791, "epoch": 2385} {"train_loss": -12.500537872314453, "global_step": 400792, "epoch": 2385} {"train_loss": -12.724984169006348, "global_step": 400793, "epoch": 2385} {"train_loss": -12.619623184204102, "global_step": 400794, "epoch": 2385} {"train_loss": -12.256695747375488, "global_step": 400795, "epoch": 2385} {"train_loss": -12.707529067993164, "global_step": 400796, "epoch": 2385} {"train_loss": -12.504854202270508, "global_step": 400797, "epoch": 2385} {"train_loss": -12.579270362854004, "global_step": 400798, "epoch": 2385} {"train_loss": -12.70107650756836, "global_step": 400799, "epoch": 2385} {"train_loss": -12.764795303344727, "global_step": 400800, "epoch": 2385} {"train_loss": -12.700557708740234, "global_step": 400801, "epoch": 2385} {"train_loss": -12.580343246459961, "global_step": 400802, "epoch": 2385} {"train_loss": -12.544252395629883, "global_step": 400803, "epoch": 2385} {"train_loss": -12.898541450500488, "global_step": 400804, "epoch": 2385} {"train_loss": -12.51211929321289, "global_step": 400805, "epoch": 2385} {"train_loss": -12.731935501098633, "global_step": 400806, "epoch": 2385} {"train_loss": -12.683584213256836, "global_step": 400807, "epoch": 2385} {"train_loss": -12.610745429992676, "global_step": 400808, "epoch": 2385} {"train_loss": -12.889354705810547, "global_step": 400809, "epoch": 2385} {"train_loss": -12.77676773071289, "global_step": 400810, "epoch": 2385} {"train_loss": -12.794455528259277, "global_step": 400811, "epoch": 2385} {"train_loss": -12.622757911682129, "global_step": 400812, "epoch": 2385} {"train_loss": -12.50820541381836, "global_step": 400813, "epoch": 2385} {"train_loss": -12.388202667236328, "global_step": 400814, "epoch": 2385} {"train_loss": -12.823042869567871, "global_step": 400815, "epoch": 2385} {"train_loss": -12.48143482208252, "global_step": 400816, "epoch": 2385} {"train_loss": -12.688919067382812, "global_step": 400817, "epoch": 2385} {"train_loss": -12.510737419128418, "global_step": 400818, "epoch": 2385} {"train_loss": -12.922370910644531, "global_step": 400819, "epoch": 2385} {"train_loss": -12.195716857910156, "global_step": 400820, "epoch": 2385} {"train_loss": -12.688326835632324, "global_step": 400821, "epoch": 2385} {"train_loss": -12.943915367126465, "global_step": 400822, "epoch": 2385} {"train_loss": -13.09104061126709, "global_step": 400823, "epoch": 2385} {"train_loss": -12.599292755126953, "global_step": 400824, "epoch": 2385} {"train_loss": -12.915093421936035, "global_step": 400825, "epoch": 2385} {"train_loss": -12.684103965759277, "global_step": 400826, "epoch": 2385} {"train_loss": -12.68678092956543, "global_step": 400827, "epoch": 2385} {"train_loss": -12.827088356018066, "global_step": 400828, "epoch": 2385} {"train_loss": -12.833559036254883, "global_step": 400829, "epoch": 2385} {"train_loss": -12.774499893188477, "global_step": 400830, "epoch": 2385} {"train_loss": -12.656649589538574, "global_step": 400831, "epoch": 2385} {"train_loss": -12.650941848754883, "global_step": 400832, "epoch": 2385} {"train_loss": -12.437135696411133, "global_step": 400833, "epoch": 2385} {"train_loss": -12.821297645568848, "global_step": 400834, "epoch": 2385} {"train_loss": -12.806783676147461, "global_step": 400835, "epoch": 2385} {"train_loss": -12.832589149475098, "global_step": 400836, "epoch": 2385} {"train_loss": -12.198722839355469, "global_step": 400837, "epoch": 2385} {"train_loss": -12.38607120513916, "global_step": 400838, "epoch": 2385} {"train_loss": -12.740172386169434, "global_step": 400839, "epoch": 2385} {"train_loss": -12.237292289733887, "global_step": 400840, "epoch": 2385} {"train_loss": -12.389427185058594, "global_step": 400841, "epoch": 2385} {"train_loss": -12.376723289489746, "global_step": 400842, "epoch": 2385} {"train_loss": -12.25953483581543, "global_step": 400843, "epoch": 2385} {"train_loss": -11.590292930603027, "global_step": 400844, "epoch": 2385} {"train_loss": -12.073413848876953, "global_step": 400845, "epoch": 2385} {"train_loss": -12.148301124572754, "global_step": 400846, "epoch": 2385} {"train_loss": -12.170941517466591, "global_step": 400847, "epoch": 2385, "val_loss": 301908.46875, "train_action_mse_error": 1.284547209739685} {"train_loss": -11.94212818145752, "global_step": 400848, "epoch": 2386} {"train_loss": -11.920761108398438, "global_step": 400849, "epoch": 2386} {"train_loss": -10.640898704528809, "global_step": 400850, "epoch": 2386} {"train_loss": -12.269587516784668, "global_step": 400851, "epoch": 2386} {"train_loss": -12.075420379638672, "global_step": 400852, "epoch": 2386} {"train_loss": -11.210691452026367, "global_step": 400853, "epoch": 2386} {"train_loss": -11.58489990234375, "global_step": 400854, "epoch": 2386} {"train_loss": -11.591914176940918, "global_step": 400855, "epoch": 2386} {"train_loss": -11.453598022460938, "global_step": 400856, "epoch": 2386} {"train_loss": -12.177229881286621, "global_step": 400857, "epoch": 2386} {"train_loss": -12.06224536895752, "global_step": 400858, "epoch": 2386} {"train_loss": -11.493476867675781, "global_step": 400859, "epoch": 2386} {"train_loss": -11.635149002075195, "global_step": 400860, "epoch": 2386} {"train_loss": -11.865543365478516, "global_step": 400861, "epoch": 2386} {"train_loss": -11.936595916748047, "global_step": 400862, "epoch": 2386} {"train_loss": -11.513944625854492, "global_step": 400863, "epoch": 2386} {"train_loss": -11.110532760620117, "global_step": 400864, "epoch": 2386} {"train_loss": -11.209810256958008, "global_step": 400865, "epoch": 2386} {"train_loss": -11.861255645751953, "global_step": 400866, "epoch": 2386} {"train_loss": -10.683290481567383, "global_step": 400867, "epoch": 2386} {"train_loss": -11.702458381652832, "global_step": 400868, "epoch": 2386} {"train_loss": -11.402145385742188, "global_step": 400869, "epoch": 2386} {"train_loss": -11.4148530960083, "global_step": 400870, "epoch": 2386} {"train_loss": -12.028703689575195, "global_step": 400871, "epoch": 2386} {"train_loss": -12.043817520141602, "global_step": 400872, "epoch": 2386} {"train_loss": -11.34977912902832, "global_step": 400873, "epoch": 2386} {"train_loss": -12.163305282592773, "global_step": 400874, "epoch": 2386} {"train_loss": -11.702774047851562, "global_step": 400875, "epoch": 2386} {"train_loss": -11.185307502746582, "global_step": 400876, "epoch": 2386} {"train_loss": -10.6136474609375, "global_step": 400877, "epoch": 2386} {"train_loss": -12.392024040222168, "global_step": 400878, "epoch": 2386} {"train_loss": -10.825084686279297, "global_step": 400879, "epoch": 2386} {"train_loss": -12.172402381896973, "global_step": 400880, "epoch": 2386} {"train_loss": -11.293968200683594, "global_step": 400881, "epoch": 2386} {"train_loss": -11.687307357788086, "global_step": 400882, "epoch": 2386} {"train_loss": -12.329890251159668, "global_step": 400883, "epoch": 2386} {"train_loss": -11.018465995788574, "global_step": 400884, "epoch": 2386} {"train_loss": -12.127130508422852, "global_step": 400885, "epoch": 2386} {"train_loss": -11.605813980102539, "global_step": 400886, "epoch": 2386} {"train_loss": -11.499002456665039, "global_step": 400887, "epoch": 2386} {"train_loss": -11.627079963684082, "global_step": 400888, "epoch": 2386} {"train_loss": -11.876493453979492, "global_step": 400889, "epoch": 2386} {"train_loss": -11.291083335876465, "global_step": 400890, "epoch": 2386} {"train_loss": -11.070000648498535, "global_step": 400891, "epoch": 2386} {"train_loss": -10.90972900390625, "global_step": 400892, "epoch": 2386} {"train_loss": -11.258904457092285, "global_step": 400893, "epoch": 2386} {"train_loss": -10.656582832336426, "global_step": 400894, "epoch": 2386} {"train_loss": -11.342864990234375, "global_step": 400895, "epoch": 2386} {"train_loss": -10.843076705932617, "global_step": 400896, "epoch": 2386} {"train_loss": -12.208504676818848, "global_step": 400897, "epoch": 2386} {"train_loss": -11.089765548706055, "global_step": 400898, "epoch": 2386} {"train_loss": -11.937994003295898, "global_step": 400899, "epoch": 2386} {"train_loss": -11.266134262084961, "global_step": 400900, "epoch": 2386} {"train_loss": -12.101736068725586, "global_step": 400901, "epoch": 2386} {"train_loss": -11.748432159423828, "global_step": 400902, "epoch": 2386} {"train_loss": -11.8656587600708, "global_step": 400903, "epoch": 2386} {"train_loss": -11.724326133728027, "global_step": 400904, "epoch": 2386} {"train_loss": -12.42882251739502, "global_step": 400905, "epoch": 2386} {"train_loss": -11.814048767089844, "global_step": 400906, "epoch": 2386} {"train_loss": -12.001100540161133, "global_step": 400907, "epoch": 2386} {"train_loss": -11.049528121948242, "global_step": 400908, "epoch": 2386} {"train_loss": -11.980585098266602, "global_step": 400909, "epoch": 2386} {"train_loss": -11.832724571228027, "global_step": 400910, "epoch": 2386} {"train_loss": -11.621668815612793, "global_step": 400911, "epoch": 2386} {"train_loss": -12.121936798095703, "global_step": 400912, "epoch": 2386} {"train_loss": -11.949816703796387, "global_step": 400913, "epoch": 2386} {"train_loss": -12.157598495483398, "global_step": 400914, "epoch": 2386} {"train_loss": -12.193876266479492, "global_step": 400915, "epoch": 2386} {"train_loss": -12.286303520202637, "global_step": 400916, "epoch": 2386} {"train_loss": -12.423036575317383, "global_step": 400917, "epoch": 2386} {"train_loss": -12.155320167541504, "global_step": 400918, "epoch": 2386} {"train_loss": -12.447793006896973, "global_step": 400919, "epoch": 2386} {"train_loss": -12.42291259765625, "global_step": 400920, "epoch": 2386} {"train_loss": -12.209970474243164, "global_step": 400921, "epoch": 2386} {"train_loss": -12.2578125, "global_step": 400922, "epoch": 2386} {"train_loss": -12.323116302490234, "global_step": 400923, "epoch": 2386} {"train_loss": -12.19412612915039, "global_step": 400924, "epoch": 2386} {"train_loss": -12.483359336853027, "global_step": 400925, "epoch": 2386} {"train_loss": -12.282737731933594, "global_step": 400926, "epoch": 2386} {"train_loss": -12.110342025756836, "global_step": 400927, "epoch": 2386} {"train_loss": -12.420117378234863, "global_step": 400928, "epoch": 2386} {"train_loss": -12.647510528564453, "global_step": 400929, "epoch": 2386} {"train_loss": -12.133434295654297, "global_step": 400930, "epoch": 2386} {"train_loss": -11.980113983154297, "global_step": 400931, "epoch": 2386} {"train_loss": -12.150407791137695, "global_step": 400932, "epoch": 2386} {"train_loss": -12.34912395477295, "global_step": 400933, "epoch": 2386} {"train_loss": -11.85065746307373, "global_step": 400934, "epoch": 2386} {"train_loss": -12.15762996673584, "global_step": 400935, "epoch": 2386} {"train_loss": -12.195762634277344, "global_step": 400936, "epoch": 2386} {"train_loss": -11.971590042114258, "global_step": 400937, "epoch": 2386} {"train_loss": -12.064390182495117, "global_step": 400938, "epoch": 2386} {"train_loss": -11.937273025512695, "global_step": 400939, "epoch": 2386} {"train_loss": -12.387042045593262, "global_step": 400940, "epoch": 2386} {"train_loss": -12.233115196228027, "global_step": 400941, "epoch": 2386} {"train_loss": -12.174888610839844, "global_step": 400942, "epoch": 2386} {"train_loss": -12.231057167053223, "global_step": 400943, "epoch": 2386} {"train_loss": -12.10698127746582, "global_step": 400944, "epoch": 2386} {"train_loss": -12.541574478149414, "global_step": 400945, "epoch": 2386} {"train_loss": -12.368890762329102, "global_step": 400946, "epoch": 2386} {"train_loss": -12.649353981018066, "global_step": 400947, "epoch": 2386} {"train_loss": -12.30729866027832, "global_step": 400948, "epoch": 2386} {"train_loss": -12.36593246459961, "global_step": 400949, "epoch": 2386} {"train_loss": -12.447737693786621, "global_step": 400950, "epoch": 2386} {"train_loss": -12.185426712036133, "global_step": 400951, "epoch": 2386} {"train_loss": -12.200553894042969, "global_step": 400952, "epoch": 2386} {"train_loss": -12.07461929321289, "global_step": 400953, "epoch": 2386} {"train_loss": -11.709268569946289, "global_step": 400954, "epoch": 2386} {"train_loss": -12.380904197692871, "global_step": 400955, "epoch": 2386} {"train_loss": -12.129938125610352, "global_step": 400956, "epoch": 2386} {"train_loss": -12.279687881469727, "global_step": 400957, "epoch": 2386} {"train_loss": -12.224912643432617, "global_step": 400958, "epoch": 2386} {"train_loss": -11.473457336425781, "global_step": 400959, "epoch": 2386} {"train_loss": -11.883285522460938, "global_step": 400960, "epoch": 2386} {"train_loss": -12.398849487304688, "global_step": 400961, "epoch": 2386} {"train_loss": -11.841302871704102, "global_step": 400962, "epoch": 2386} {"train_loss": -12.327064514160156, "global_step": 400963, "epoch": 2386} {"train_loss": -11.703712463378906, "global_step": 400964, "epoch": 2386} {"train_loss": -11.89134407043457, "global_step": 400965, "epoch": 2386} {"train_loss": -11.510734558105469, "global_step": 400966, "epoch": 2386} {"train_loss": -12.276237487792969, "global_step": 400967, "epoch": 2386} {"train_loss": -11.607885360717773, "global_step": 400968, "epoch": 2386} {"train_loss": -12.296162605285645, "global_step": 400969, "epoch": 2386} {"train_loss": -11.94546127319336, "global_step": 400970, "epoch": 2386} {"train_loss": -11.686763763427734, "global_step": 400971, "epoch": 2386} {"train_loss": -12.739105224609375, "global_step": 400972, "epoch": 2386} {"train_loss": -12.127206802368164, "global_step": 400973, "epoch": 2386} {"train_loss": -12.051163673400879, "global_step": 400974, "epoch": 2386} {"train_loss": -12.240087509155273, "global_step": 400975, "epoch": 2386} {"train_loss": -12.170495986938477, "global_step": 400976, "epoch": 2386} {"train_loss": -11.82612133026123, "global_step": 400977, "epoch": 2386} {"train_loss": -12.626391410827637, "global_step": 400978, "epoch": 2386} {"train_loss": -12.124250411987305, "global_step": 400979, "epoch": 2386} {"train_loss": -12.610912322998047, "global_step": 400980, "epoch": 2386} {"train_loss": -11.850762367248535, "global_step": 400981, "epoch": 2386} {"train_loss": -12.302152633666992, "global_step": 400982, "epoch": 2386} {"train_loss": -12.395777702331543, "global_step": 400983, "epoch": 2386} {"train_loss": -12.196598052978516, "global_step": 400984, "epoch": 2386} {"train_loss": -12.308375358581543, "global_step": 400985, "epoch": 2386} {"train_loss": -11.988312721252441, "global_step": 400986, "epoch": 2386} {"train_loss": -12.009021759033203, "global_step": 400987, "epoch": 2386} {"train_loss": -12.472894668579102, "global_step": 400988, "epoch": 2386} {"train_loss": -11.817808151245117, "global_step": 400989, "epoch": 2386} {"train_loss": -12.264881134033203, "global_step": 400990, "epoch": 2386} {"train_loss": -11.976680755615234, "global_step": 400991, "epoch": 2386} {"train_loss": -12.496236801147461, "global_step": 400992, "epoch": 2386} {"train_loss": -12.288432121276855, "global_step": 400993, "epoch": 2386} {"train_loss": -12.196611404418945, "global_step": 400994, "epoch": 2386} {"train_loss": -12.061336517333984, "global_step": 400995, "epoch": 2386} {"train_loss": -12.442179679870605, "global_step": 400996, "epoch": 2386} {"train_loss": -12.116065979003906, "global_step": 400997, "epoch": 2386} {"train_loss": -12.534723281860352, "global_step": 400998, "epoch": 2386} {"train_loss": -12.18602180480957, "global_step": 400999, "epoch": 2386} {"train_loss": -12.515913963317871, "global_step": 401000, "epoch": 2386} {"train_loss": -11.960590362548828, "global_step": 401001, "epoch": 2386} {"train_loss": -12.773345947265625, "global_step": 401002, "epoch": 2386} {"train_loss": -12.324653625488281, "global_step": 401003, "epoch": 2386} {"train_loss": -12.613008499145508, "global_step": 401004, "epoch": 2386} {"train_loss": -12.408893585205078, "global_step": 401005, "epoch": 2386} {"train_loss": -12.499898910522461, "global_step": 401006, "epoch": 2386} {"train_loss": -12.190441131591797, "global_step": 401007, "epoch": 2386} {"train_loss": -12.37138843536377, "global_step": 401008, "epoch": 2386} {"train_loss": -12.297572135925293, "global_step": 401009, "epoch": 2386} {"train_loss": -12.389275550842285, "global_step": 401010, "epoch": 2386} {"train_loss": -12.301082611083984, "global_step": 401011, "epoch": 2386} {"train_loss": -12.816692352294922, "global_step": 401012, "epoch": 2386} {"train_loss": -12.544637680053711, "global_step": 401013, "epoch": 2386} {"train_loss": -12.625103950500488, "global_step": 401014, "epoch": 2386} {"train_loss": -11.984893543379647, "global_step": 401015, "epoch": 2386, "val_loss": 299453.8125} {"train_loss": -12.491745948791504, "global_step": 401016, "epoch": 2387} {"train_loss": -12.752653121948242, "global_step": 401017, "epoch": 2387} {"train_loss": -12.619068145751953, "global_step": 401018, "epoch": 2387} {"train_loss": -12.289888381958008, "global_step": 401019, "epoch": 2387} {"train_loss": -12.398290634155273, "global_step": 401020, "epoch": 2387} {"train_loss": -12.480934143066406, "global_step": 401021, "epoch": 2387} {"train_loss": -12.58230972290039, "global_step": 401022, "epoch": 2387} {"train_loss": -12.300329208374023, "global_step": 401023, "epoch": 2387} {"train_loss": -12.329672813415527, "global_step": 401024, "epoch": 2387} {"train_loss": -12.419960021972656, "global_step": 401025, "epoch": 2387} {"train_loss": -12.253839492797852, "global_step": 401026, "epoch": 2387} {"train_loss": -12.52025318145752, "global_step": 401027, "epoch": 2387} {"train_loss": -12.569746017456055, "global_step": 401028, "epoch": 2387} {"train_loss": -12.473665237426758, "global_step": 401029, "epoch": 2387} {"train_loss": -12.453902244567871, "global_step": 401030, "epoch": 2387} {"train_loss": -12.550687789916992, "global_step": 401031, "epoch": 2387} {"train_loss": -12.484495162963867, "global_step": 401032, "epoch": 2387} {"train_loss": -12.60953426361084, "global_step": 401033, "epoch": 2387} {"train_loss": -12.410516738891602, "global_step": 401034, "epoch": 2387} {"train_loss": -12.676273345947266, "global_step": 401035, "epoch": 2387} {"train_loss": -12.571765899658203, "global_step": 401036, "epoch": 2387} {"train_loss": -12.683290481567383, "global_step": 401037, "epoch": 2387} {"train_loss": -12.252944946289062, "global_step": 401038, "epoch": 2387} {"train_loss": -12.491645812988281, "global_step": 401039, "epoch": 2387} {"train_loss": -12.55300521850586, "global_step": 401040, "epoch": 2387} {"train_loss": -12.294755935668945, "global_step": 401041, "epoch": 2387} {"train_loss": -11.983697891235352, "global_step": 401042, "epoch": 2387} {"train_loss": -12.131903648376465, "global_step": 401043, "epoch": 2387} {"train_loss": -12.295413970947266, "global_step": 401044, "epoch": 2387} {"train_loss": -11.285664558410645, "global_step": 401045, "epoch": 2387} {"train_loss": -12.338396072387695, "global_step": 401046, "epoch": 2387} {"train_loss": -9.96863079071045, "global_step": 401047, "epoch": 2387} {"train_loss": -11.649038314819336, "global_step": 401048, "epoch": 2387} {"train_loss": -11.725767135620117, "global_step": 401049, "epoch": 2387} {"train_loss": -10.243446350097656, "global_step": 401050, "epoch": 2387} {"train_loss": -11.930458068847656, "global_step": 401051, "epoch": 2387} {"train_loss": -9.685942649841309, "global_step": 401052, "epoch": 2387} {"train_loss": -12.117701530456543, "global_step": 401053, "epoch": 2387} {"train_loss": -9.525141716003418, "global_step": 401054, "epoch": 2387} {"train_loss": -11.834732055664062, "global_step": 401055, "epoch": 2387} {"train_loss": -10.122685432434082, "global_step": 401056, "epoch": 2387} {"train_loss": -11.448058128356934, "global_step": 401057, "epoch": 2387} {"train_loss": -11.04928207397461, "global_step": 401058, "epoch": 2387} {"train_loss": -11.490659713745117, "global_step": 401059, "epoch": 2387} {"train_loss": -11.233386039733887, "global_step": 401060, "epoch": 2387} {"train_loss": -11.198151588439941, "global_step": 401061, "epoch": 2387} {"train_loss": -11.743157386779785, "global_step": 401062, "epoch": 2387} {"train_loss": -10.93712329864502, "global_step": 401063, "epoch": 2387} {"train_loss": -11.233747482299805, "global_step": 401064, "epoch": 2387} {"train_loss": -10.958176612854004, "global_step": 401065, "epoch": 2387} {"train_loss": -11.538208961486816, "global_step": 401066, "epoch": 2387} {"train_loss": -11.725958824157715, "global_step": 401067, "epoch": 2387} {"train_loss": -10.857818603515625, "global_step": 401068, "epoch": 2387} {"train_loss": -12.099185943603516, "global_step": 401069, "epoch": 2387} {"train_loss": -11.272453308105469, "global_step": 401070, "epoch": 2387} {"train_loss": -11.661754608154297, "global_step": 401071, "epoch": 2387} {"train_loss": -11.724356651306152, "global_step": 401072, "epoch": 2387} {"train_loss": -11.476726531982422, "global_step": 401073, "epoch": 2387} {"train_loss": -11.626429557800293, "global_step": 401074, "epoch": 2387} {"train_loss": -11.861324310302734, "global_step": 401075, "epoch": 2387} {"train_loss": -11.13371467590332, "global_step": 401076, "epoch": 2387} {"train_loss": -11.675151824951172, "global_step": 401077, "epoch": 2387} {"train_loss": -10.950161933898926, "global_step": 401078, "epoch": 2387} {"train_loss": -11.342313766479492, "global_step": 401079, "epoch": 2387} {"train_loss": -10.420902252197266, "global_step": 401080, "epoch": 2387} {"train_loss": -10.79265022277832, "global_step": 401081, "epoch": 2387} {"train_loss": -10.919723510742188, "global_step": 401082, "epoch": 2387} {"train_loss": -10.205556869506836, "global_step": 401083, "epoch": 2387} {"train_loss": -10.188421249389648, "global_step": 401084, "epoch": 2387} {"train_loss": -11.121285438537598, "global_step": 401085, "epoch": 2387} {"train_loss": -11.548645973205566, "global_step": 401086, "epoch": 2387} {"train_loss": -10.64406967163086, "global_step": 401087, "epoch": 2387} {"train_loss": -11.677865028381348, "global_step": 401088, "epoch": 2387} {"train_loss": -10.004368782043457, "global_step": 401089, "epoch": 2387} {"train_loss": -11.511908531188965, "global_step": 401090, "epoch": 2387} {"train_loss": -10.334709167480469, "global_step": 401091, "epoch": 2387} {"train_loss": -11.228446960449219, "global_step": 401092, "epoch": 2387} {"train_loss": -12.036625862121582, "global_step": 401093, "epoch": 2387} {"train_loss": -11.436538696289062, "global_step": 401094, "epoch": 2387} {"train_loss": -12.063804626464844, "global_step": 401095, "epoch": 2387} {"train_loss": -11.84005069732666, "global_step": 401096, "epoch": 2387} {"train_loss": -11.937307357788086, "global_step": 401097, "epoch": 2387} {"train_loss": -12.157510757446289, "global_step": 401098, "epoch": 2387} {"train_loss": -12.013751983642578, "global_step": 401099, "epoch": 2387} {"train_loss": -12.0006103515625, "global_step": 401100, "epoch": 2387} {"train_loss": -12.05204963684082, "global_step": 401101, "epoch": 2387} {"train_loss": -12.334578514099121, "global_step": 401102, "epoch": 2387} {"train_loss": -12.01140308380127, "global_step": 401103, "epoch": 2387} {"train_loss": -12.388143539428711, "global_step": 401104, "epoch": 2387} {"train_loss": -12.023416519165039, "global_step": 401105, "epoch": 2387} {"train_loss": -12.32973861694336, "global_step": 401106, "epoch": 2387} {"train_loss": -11.886825561523438, "global_step": 401107, "epoch": 2387} {"train_loss": -12.177440643310547, "global_step": 401108, "epoch": 2387} {"train_loss": -12.185755729675293, "global_step": 401109, "epoch": 2387} {"train_loss": -12.389446258544922, "global_step": 401110, "epoch": 2387} {"train_loss": -12.144417762756348, "global_step": 401111, "epoch": 2387} {"train_loss": -12.460729598999023, "global_step": 401112, "epoch": 2387} {"train_loss": -12.266307830810547, "global_step": 401113, "epoch": 2387} {"train_loss": -12.580647468566895, "global_step": 401114, "epoch": 2387} {"train_loss": -12.456558227539062, "global_step": 401115, "epoch": 2387} {"train_loss": -12.473713874816895, "global_step": 401116, "epoch": 2387} {"train_loss": -12.327938079833984, "global_step": 401117, "epoch": 2387} {"train_loss": -12.301231384277344, "global_step": 401118, "epoch": 2387} {"train_loss": -12.452518463134766, "global_step": 401119, "epoch": 2387} {"train_loss": -12.425080299377441, "global_step": 401120, "epoch": 2387} {"train_loss": -12.601263046264648, "global_step": 401121, "epoch": 2387} {"train_loss": -12.264854431152344, "global_step": 401122, "epoch": 2387} {"train_loss": -12.297758102416992, "global_step": 401123, "epoch": 2387} {"train_loss": -12.416522979736328, "global_step": 401124, "epoch": 2387} {"train_loss": -12.47885799407959, "global_step": 401125, "epoch": 2387} {"train_loss": -12.69146728515625, "global_step": 401126, "epoch": 2387} {"train_loss": -12.760366439819336, "global_step": 401127, "epoch": 2387} {"train_loss": -12.497543334960938, "global_step": 401128, "epoch": 2387} {"train_loss": -12.434029579162598, "global_step": 401129, "epoch": 2387} {"train_loss": -12.43377685546875, "global_step": 401130, "epoch": 2387} {"train_loss": -12.639050483703613, "global_step": 401131, "epoch": 2387} {"train_loss": -12.610466003417969, "global_step": 401132, "epoch": 2387} {"train_loss": -12.697209358215332, "global_step": 401133, "epoch": 2387} {"train_loss": -12.753093719482422, "global_step": 401134, "epoch": 2387} {"train_loss": -12.6051664352417, "global_step": 401135, "epoch": 2387} {"train_loss": -12.622062683105469, "global_step": 401136, "epoch": 2387} {"train_loss": -12.688443183898926, "global_step": 401137, "epoch": 2387} {"train_loss": -12.791019439697266, "global_step": 401138, "epoch": 2387} {"train_loss": -12.509952545166016, "global_step": 401139, "epoch": 2387} {"train_loss": -12.622451782226562, "global_step": 401140, "epoch": 2387} {"train_loss": -12.532129287719727, "global_step": 401141, "epoch": 2387} {"train_loss": -12.864224433898926, "global_step": 401142, "epoch": 2387} {"train_loss": -12.68553352355957, "global_step": 401143, "epoch": 2387} {"train_loss": -12.740161895751953, "global_step": 401144, "epoch": 2387} {"train_loss": -12.760597229003906, "global_step": 401145, "epoch": 2387} {"train_loss": -12.761293411254883, "global_step": 401146, "epoch": 2387} {"train_loss": -12.880062103271484, "global_step": 401147, "epoch": 2387} {"train_loss": -12.734654426574707, "global_step": 401148, "epoch": 2387} {"train_loss": -12.745779037475586, "global_step": 401149, "epoch": 2387} {"train_loss": -12.610340118408203, "global_step": 401150, "epoch": 2387} {"train_loss": -12.74066162109375, "global_step": 401151, "epoch": 2387} {"train_loss": -12.497758865356445, "global_step": 401152, "epoch": 2387} {"train_loss": -12.781244277954102, "global_step": 401153, "epoch": 2387} {"train_loss": -12.731449127197266, "global_step": 401154, "epoch": 2387} {"train_loss": -12.59353256225586, "global_step": 401155, "epoch": 2387} {"train_loss": -12.672828674316406, "global_step": 401156, "epoch": 2387} {"train_loss": -12.647634506225586, "global_step": 401157, "epoch": 2387} {"train_loss": -12.966802597045898, "global_step": 401158, "epoch": 2387} {"train_loss": -12.8397216796875, "global_step": 401159, "epoch": 2387} {"train_loss": -12.744215965270996, "global_step": 401160, "epoch": 2387} {"train_loss": -12.585653305053711, "global_step": 401161, "epoch": 2387} {"train_loss": -12.774169921875, "global_step": 401162, "epoch": 2387} {"train_loss": -12.795722961425781, "global_step": 401163, "epoch": 2387} {"train_loss": -12.615396499633789, "global_step": 401164, "epoch": 2387} {"train_loss": -12.601034164428711, "global_step": 401165, "epoch": 2387} {"train_loss": -12.78817367553711, "global_step": 401166, "epoch": 2387} {"train_loss": -12.72517204284668, "global_step": 401167, "epoch": 2387} {"train_loss": -12.477846145629883, "global_step": 401168, "epoch": 2387} {"train_loss": -12.492195129394531, "global_step": 401169, "epoch": 2387} {"train_loss": -12.680895805358887, "global_step": 401170, "epoch": 2387} {"train_loss": -12.637508392333984, "global_step": 401171, "epoch": 2387} {"train_loss": -12.57155990600586, "global_step": 401172, "epoch": 2387} {"train_loss": -12.784966468811035, "global_step": 401173, "epoch": 2387} {"train_loss": -12.507494926452637, "global_step": 401174, "epoch": 2387} {"train_loss": -12.785965919494629, "global_step": 401175, "epoch": 2387} {"train_loss": -12.75670051574707, "global_step": 401176, "epoch": 2387} {"train_loss": -12.785160064697266, "global_step": 401177, "epoch": 2387} {"train_loss": -12.845049858093262, "global_step": 401178, "epoch": 2387} {"train_loss": -13.113473892211914, "global_step": 401179, "epoch": 2387} {"train_loss": -12.68684196472168, "global_step": 401180, "epoch": 2387} {"train_loss": -12.877067565917969, "global_step": 401181, "epoch": 2387} {"train_loss": -12.761409759521484, "global_step": 401182, "epoch": 2387} {"train_loss": -12.118832253274464, "global_step": 401183, "epoch": 2387, "val_loss": 300635.15625} {"train_loss": -12.791515350341797, "global_step": 401184, "epoch": 2388} {"train_loss": -12.59701919555664, "global_step": 401185, "epoch": 2388} {"train_loss": -12.622998237609863, "global_step": 401186, "epoch": 2388} {"train_loss": -12.656188011169434, "global_step": 401187, "epoch": 2388} {"train_loss": -12.968050003051758, "global_step": 401188, "epoch": 2388} {"train_loss": -12.823163032531738, "global_step": 401189, "epoch": 2388} {"train_loss": -12.781793594360352, "global_step": 401190, "epoch": 2388} {"train_loss": -12.176665306091309, "global_step": 401191, "epoch": 2388} {"train_loss": -12.393259048461914, "global_step": 401192, "epoch": 2388} {"train_loss": -12.785429000854492, "global_step": 401193, "epoch": 2388} {"train_loss": -12.237066268920898, "global_step": 401194, "epoch": 2388} {"train_loss": -12.331043243408203, "global_step": 401195, "epoch": 2388} {"train_loss": -12.720230102539062, "global_step": 401196, "epoch": 2388} {"train_loss": -12.130069732666016, "global_step": 401197, "epoch": 2388} {"train_loss": -12.313621520996094, "global_step": 401198, "epoch": 2388} {"train_loss": -12.329571723937988, "global_step": 401199, "epoch": 2388} {"train_loss": -12.673956871032715, "global_step": 401200, "epoch": 2388} {"train_loss": -12.43303394317627, "global_step": 401201, "epoch": 2388} {"train_loss": -12.149075508117676, "global_step": 401202, "epoch": 2388} {"train_loss": -10.757256507873535, "global_step": 401203, "epoch": 2388} {"train_loss": -11.402618408203125, "global_step": 401204, "epoch": 2388} {"train_loss": -12.22501277923584, "global_step": 401205, "epoch": 2388} {"train_loss": -12.312637329101562, "global_step": 401206, "epoch": 2388} {"train_loss": -12.213499069213867, "global_step": 401207, "epoch": 2388} {"train_loss": -12.001572608947754, "global_step": 401208, "epoch": 2388} {"train_loss": -12.089327812194824, "global_step": 401209, "epoch": 2388} {"train_loss": -11.902101516723633, "global_step": 401210, "epoch": 2388} {"train_loss": -10.706777572631836, "global_step": 401211, "epoch": 2388} {"train_loss": -11.70107650756836, "global_step": 401212, "epoch": 2388} {"train_loss": -11.914974212646484, "global_step": 401213, "epoch": 2388} {"train_loss": -11.015533447265625, "global_step": 401214, "epoch": 2388} {"train_loss": -9.430517196655273, "global_step": 401215, "epoch": 2388} {"train_loss": -11.091418266296387, "global_step": 401216, "epoch": 2388} {"train_loss": -10.692302703857422, "global_step": 401217, "epoch": 2388} {"train_loss": -9.949861526489258, "global_step": 401218, "epoch": 2388} {"train_loss": -10.255712509155273, "global_step": 401219, "epoch": 2388} {"train_loss": -11.390495300292969, "global_step": 401220, "epoch": 2388} {"train_loss": -11.232248306274414, "global_step": 401221, "epoch": 2388} {"train_loss": -11.299661636352539, "global_step": 401222, "epoch": 2388} {"train_loss": -10.78122329711914, "global_step": 401223, "epoch": 2388} {"train_loss": -10.912633895874023, "global_step": 401224, "epoch": 2388} {"train_loss": -9.45551872253418, "global_step": 401225, "epoch": 2388} {"train_loss": -10.876826286315918, "global_step": 401226, "epoch": 2388} {"train_loss": -10.456239700317383, "global_step": 401227, "epoch": 2388} {"train_loss": -10.578775405883789, "global_step": 401228, "epoch": 2388} {"train_loss": -10.523348808288574, "global_step": 401229, "epoch": 2388} {"train_loss": -10.704519271850586, "global_step": 401230, "epoch": 2388} {"train_loss": -11.40065860748291, "global_step": 401231, "epoch": 2388} {"train_loss": -10.569547653198242, "global_step": 401232, "epoch": 2388} {"train_loss": -11.49024486541748, "global_step": 401233, "epoch": 2388} {"train_loss": -10.887454986572266, "global_step": 401234, "epoch": 2388} {"train_loss": -10.592462539672852, "global_step": 401235, "epoch": 2388} {"train_loss": -10.865273475646973, "global_step": 401236, "epoch": 2388} {"train_loss": -11.271646499633789, "global_step": 401237, "epoch": 2388} {"train_loss": -10.790351867675781, "global_step": 401238, "epoch": 2388} {"train_loss": -11.350007057189941, "global_step": 401239, "epoch": 2388} {"train_loss": -11.354127883911133, "global_step": 401240, "epoch": 2388} {"train_loss": -12.001585006713867, "global_step": 401241, "epoch": 2388} {"train_loss": -11.443268775939941, "global_step": 401242, "epoch": 2388} {"train_loss": -11.939407348632812, "global_step": 401243, "epoch": 2388} {"train_loss": -11.672499656677246, "global_step": 401244, "epoch": 2388} {"train_loss": -11.868242263793945, "global_step": 401245, "epoch": 2388} {"train_loss": -11.975406646728516, "global_step": 401246, "epoch": 2388} {"train_loss": -11.550423622131348, "global_step": 401247, "epoch": 2388} {"train_loss": -11.790107727050781, "global_step": 401248, "epoch": 2388} {"train_loss": -11.343011856079102, "global_step": 401249, "epoch": 2388} {"train_loss": -11.764307022094727, "global_step": 401250, "epoch": 2388} {"train_loss": -11.880319595336914, "global_step": 401251, "epoch": 2388} {"train_loss": -11.663799285888672, "global_step": 401252, "epoch": 2388} {"train_loss": -11.971887588500977, "global_step": 401253, "epoch": 2388} {"train_loss": -11.489856719970703, "global_step": 401254, "epoch": 2388} {"train_loss": -11.744365692138672, "global_step": 401255, "epoch": 2388} {"train_loss": -11.937615394592285, "global_step": 401256, "epoch": 2388} {"train_loss": -11.737710952758789, "global_step": 401257, "epoch": 2388} {"train_loss": -11.938936233520508, "global_step": 401258, "epoch": 2388} {"train_loss": -12.18393325805664, "global_step": 401259, "epoch": 2388} {"train_loss": -11.615215301513672, "global_step": 401260, "epoch": 2388} {"train_loss": -11.993168830871582, "global_step": 401261, "epoch": 2388} {"train_loss": -12.248927116394043, "global_step": 401262, "epoch": 2388} {"train_loss": -11.979904174804688, "global_step": 401263, "epoch": 2388} {"train_loss": -12.151830673217773, "global_step": 401264, "epoch": 2388} {"train_loss": -12.130963325500488, "global_step": 401265, "epoch": 2388} {"train_loss": -12.195789337158203, "global_step": 401266, "epoch": 2388} {"train_loss": -12.18087387084961, "global_step": 401267, "epoch": 2388} {"train_loss": -12.414154052734375, "global_step": 401268, "epoch": 2388} {"train_loss": -12.100339889526367, "global_step": 401269, "epoch": 2388} {"train_loss": -11.875505447387695, "global_step": 401270, "epoch": 2388} {"train_loss": -12.210929870605469, "global_step": 401271, "epoch": 2388} {"train_loss": -11.792093276977539, "global_step": 401272, "epoch": 2388} {"train_loss": -12.187751770019531, "global_step": 401273, "epoch": 2388} {"train_loss": -11.850028991699219, "global_step": 401274, "epoch": 2388} {"train_loss": -12.051905632019043, "global_step": 401275, "epoch": 2388} {"train_loss": -12.186891555786133, "global_step": 401276, "epoch": 2388} {"train_loss": -11.990468978881836, "global_step": 401277, "epoch": 2388} {"train_loss": -12.136247634887695, "global_step": 401278, "epoch": 2388} {"train_loss": -11.825571060180664, "global_step": 401279, "epoch": 2388} {"train_loss": -12.147132873535156, "global_step": 401280, "epoch": 2388} {"train_loss": -12.212550163269043, "global_step": 401281, "epoch": 2388} {"train_loss": -12.150175094604492, "global_step": 401282, "epoch": 2388} {"train_loss": -12.427705764770508, "global_step": 401283, "epoch": 2388} {"train_loss": -12.225282669067383, "global_step": 401284, "epoch": 2388} {"train_loss": -12.38936996459961, "global_step": 401285, "epoch": 2388} {"train_loss": -12.27511215209961, "global_step": 401286, "epoch": 2388} {"train_loss": -12.426959991455078, "global_step": 401287, "epoch": 2388} {"train_loss": -12.346672058105469, "global_step": 401288, "epoch": 2388} {"train_loss": -12.34553337097168, "global_step": 401289, "epoch": 2388} {"train_loss": -12.523157119750977, "global_step": 401290, "epoch": 2388} {"train_loss": -12.430343627929688, "global_step": 401291, "epoch": 2388} {"train_loss": -12.331050872802734, "global_step": 401292, "epoch": 2388} {"train_loss": -12.327658653259277, "global_step": 401293, "epoch": 2388} {"train_loss": -12.577486991882324, "global_step": 401294, "epoch": 2388} {"train_loss": -12.425331115722656, "global_step": 401295, "epoch": 2388} {"train_loss": -12.488531112670898, "global_step": 401296, "epoch": 2388} {"train_loss": -12.506935119628906, "global_step": 401297, "epoch": 2388} {"train_loss": -12.503250122070312, "global_step": 401298, "epoch": 2388} {"train_loss": -12.448860168457031, "global_step": 401299, "epoch": 2388} {"train_loss": -12.501274108886719, "global_step": 401300, "epoch": 2388} {"train_loss": -12.668416023254395, "global_step": 401301, "epoch": 2388} {"train_loss": -12.714203834533691, "global_step": 401302, "epoch": 2388} {"train_loss": -12.712093353271484, "global_step": 401303, "epoch": 2388} {"train_loss": -12.791975021362305, "global_step": 401304, "epoch": 2388} {"train_loss": -12.604574203491211, "global_step": 401305, "epoch": 2388} {"train_loss": -12.666380882263184, "global_step": 401306, "epoch": 2388} {"train_loss": -12.608442306518555, "global_step": 401307, "epoch": 2388} {"train_loss": -12.751420021057129, "global_step": 401308, "epoch": 2388} {"train_loss": -12.610066413879395, "global_step": 401309, "epoch": 2388} {"train_loss": -12.682353973388672, "global_step": 401310, "epoch": 2388} {"train_loss": -12.620500564575195, "global_step": 401311, "epoch": 2388} {"train_loss": -12.645322799682617, "global_step": 401312, "epoch": 2388} {"train_loss": -12.69443130493164, "global_step": 401313, "epoch": 2388} {"train_loss": -12.706596374511719, "global_step": 401314, "epoch": 2388} {"train_loss": -12.52439022064209, "global_step": 401315, "epoch": 2388} {"train_loss": -12.726839065551758, "global_step": 401316, "epoch": 2388} {"train_loss": -12.60456657409668, "global_step": 401317, "epoch": 2388} {"train_loss": -12.511106491088867, "global_step": 401318, "epoch": 2388} {"train_loss": -12.678383827209473, "global_step": 401319, "epoch": 2388} {"train_loss": -12.710920333862305, "global_step": 401320, "epoch": 2388} {"train_loss": -12.64402961730957, "global_step": 401321, "epoch": 2388} {"train_loss": -12.298948287963867, "global_step": 401322, "epoch": 2388} {"train_loss": -12.755136489868164, "global_step": 401323, "epoch": 2388} {"train_loss": -12.646787643432617, "global_step": 401324, "epoch": 2388} {"train_loss": -12.440585136413574, "global_step": 401325, "epoch": 2388} {"train_loss": -12.515869140625, "global_step": 401326, "epoch": 2388} {"train_loss": -12.582768440246582, "global_step": 401327, "epoch": 2388} {"train_loss": -12.636603355407715, "global_step": 401328, "epoch": 2388} {"train_loss": -12.826967239379883, "global_step": 401329, "epoch": 2388} {"train_loss": -12.68580436706543, "global_step": 401330, "epoch": 2388} {"train_loss": -12.081461906433105, "global_step": 401331, "epoch": 2388} {"train_loss": -12.174881935119629, "global_step": 401332, "epoch": 2388} {"train_loss": -12.502435684204102, "global_step": 401333, "epoch": 2388} {"train_loss": -12.16700553894043, "global_step": 401334, "epoch": 2388} {"train_loss": -11.911748886108398, "global_step": 401335, "epoch": 2388} {"train_loss": -10.379616737365723, "global_step": 401336, "epoch": 2388} {"train_loss": -10.387598037719727, "global_step": 401337, "epoch": 2388} {"train_loss": -11.73759651184082, "global_step": 401338, "epoch": 2388} {"train_loss": -9.746698379516602, "global_step": 401339, "epoch": 2388} {"train_loss": -10.767180442810059, "global_step": 401340, "epoch": 2388} {"train_loss": -9.851327896118164, "global_step": 401341, "epoch": 2388} {"train_loss": -10.279946327209473, "global_step": 401342, "epoch": 2388} {"train_loss": -8.653913497924805, "global_step": 401343, "epoch": 2388} {"train_loss": -11.466815948486328, "global_step": 401344, "epoch": 2388} {"train_loss": -8.699808120727539, "global_step": 401345, "epoch": 2388} {"train_loss": -11.412933349609375, "global_step": 401346, "epoch": 2388} {"train_loss": -8.568380355834961, "global_step": 401347, "epoch": 2388} {"train_loss": -9.169938087463379, "global_step": 401348, "epoch": 2388} {"train_loss": -8.401294708251953, "global_step": 401349, "epoch": 2388} {"train_loss": -8.662208557128906, "global_step": 401350, "epoch": 2388} {"train_loss": -11.785862479891096, "global_step": 401351, "epoch": 2388, "val_loss": 299851.78125} {"train_loss": -8.952083587646484, "global_step": 401352, "epoch": 2389} {"train_loss": -10.572234153747559, "global_step": 401353, "epoch": 2389} {"train_loss": -9.631752014160156, "global_step": 401354, "epoch": 2389} {"train_loss": -9.78834342956543, "global_step": 401355, "epoch": 2389} {"train_loss": -10.475954055786133, "global_step": 401356, "epoch": 2389} {"train_loss": -10.193168640136719, "global_step": 401357, "epoch": 2389} {"train_loss": -10.9191255569458, "global_step": 401358, "epoch": 2389} {"train_loss": -11.053977966308594, "global_step": 401359, "epoch": 2389} {"train_loss": -10.536680221557617, "global_step": 401360, "epoch": 2389} {"train_loss": -10.362604141235352, "global_step": 401361, "epoch": 2389} {"train_loss": -10.63332748413086, "global_step": 401362, "epoch": 2389} {"train_loss": -11.1722412109375, "global_step": 401363, "epoch": 2389} {"train_loss": -11.723411560058594, "global_step": 401364, "epoch": 2389} {"train_loss": -11.789125442504883, "global_step": 401365, "epoch": 2389} {"train_loss": -11.21511459350586, "global_step": 401366, "epoch": 2389} {"train_loss": -11.583621978759766, "global_step": 401367, "epoch": 2389} {"train_loss": -11.169286727905273, "global_step": 401368, "epoch": 2389} {"train_loss": -11.54763126373291, "global_step": 401369, "epoch": 2389} {"train_loss": -12.015344619750977, "global_step": 401370, "epoch": 2389} {"train_loss": -11.80651569366455, "global_step": 401371, "epoch": 2389} {"train_loss": -11.977211952209473, "global_step": 401372, "epoch": 2389} {"train_loss": -11.771079063415527, "global_step": 401373, "epoch": 2389} {"train_loss": -12.1936616897583, "global_step": 401374, "epoch": 2389} {"train_loss": -12.125434875488281, "global_step": 401375, "epoch": 2389} {"train_loss": -11.976736068725586, "global_step": 401376, "epoch": 2389} {"train_loss": -12.115459442138672, "global_step": 401377, "epoch": 2389} {"train_loss": -11.671466827392578, "global_step": 401378, "epoch": 2389} {"train_loss": -12.003009796142578, "global_step": 401379, "epoch": 2389} {"train_loss": -11.989057540893555, "global_step": 401380, "epoch": 2389} {"train_loss": -12.100631713867188, "global_step": 401381, "epoch": 2389} {"train_loss": -11.931917190551758, "global_step": 401382, "epoch": 2389} {"train_loss": -12.17612075805664, "global_step": 401383, "epoch": 2389} {"train_loss": -12.110401153564453, "global_step": 401384, "epoch": 2389} {"train_loss": -11.842537879943848, "global_step": 401385, "epoch": 2389} {"train_loss": -11.932268142700195, "global_step": 401386, "epoch": 2389} {"train_loss": -11.76927375793457, "global_step": 401387, "epoch": 2389} {"train_loss": -12.030900001525879, "global_step": 401388, "epoch": 2389} {"train_loss": -11.921538352966309, "global_step": 401389, "epoch": 2389} {"train_loss": -12.428934097290039, "global_step": 401390, "epoch": 2389} {"train_loss": -11.698169708251953, "global_step": 401391, "epoch": 2389} {"train_loss": -12.31290054321289, "global_step": 401392, "epoch": 2389} {"train_loss": -11.78969669342041, "global_step": 401393, "epoch": 2389} {"train_loss": -12.415287017822266, "global_step": 401394, "epoch": 2389} {"train_loss": -12.167594909667969, "global_step": 401395, "epoch": 2389} {"train_loss": -12.306025505065918, "global_step": 401396, "epoch": 2389} {"train_loss": -12.25197982788086, "global_step": 401397, "epoch": 2389} {"train_loss": -12.133647918701172, "global_step": 401398, "epoch": 2389} {"train_loss": -12.188883781433105, "global_step": 401399, "epoch": 2389} {"train_loss": -12.168318748474121, "global_step": 401400, "epoch": 2389} {"train_loss": -12.259092330932617, "global_step": 401401, "epoch": 2389} {"train_loss": -12.18086051940918, "global_step": 401402, "epoch": 2389} {"train_loss": -12.004878044128418, "global_step": 401403, "epoch": 2389} {"train_loss": -12.480850219726562, "global_step": 401404, "epoch": 2389} {"train_loss": -12.410883903503418, "global_step": 401405, "epoch": 2389} {"train_loss": -12.368734359741211, "global_step": 401406, "epoch": 2389} {"train_loss": -12.36227798461914, "global_step": 401407, "epoch": 2389} {"train_loss": -12.470849990844727, "global_step": 401408, "epoch": 2389} {"train_loss": -12.34679126739502, "global_step": 401409, "epoch": 2389} {"train_loss": -12.40597915649414, "global_step": 401410, "epoch": 2389} {"train_loss": -12.492729187011719, "global_step": 401411, "epoch": 2389} {"train_loss": -12.344293594360352, "global_step": 401412, "epoch": 2389} {"train_loss": -12.537696838378906, "global_step": 401413, "epoch": 2389} {"train_loss": -12.435945510864258, "global_step": 401414, "epoch": 2389} {"train_loss": -12.637984275817871, "global_step": 401415, "epoch": 2389} {"train_loss": -12.427144050598145, "global_step": 401416, "epoch": 2389} {"train_loss": -12.472299575805664, "global_step": 401417, "epoch": 2389} {"train_loss": -12.308404922485352, "global_step": 401418, "epoch": 2389} {"train_loss": -12.462209701538086, "global_step": 401419, "epoch": 2389} {"train_loss": -12.082075119018555, "global_step": 401420, "epoch": 2389} {"train_loss": -12.479774475097656, "global_step": 401421, "epoch": 2389} {"train_loss": -12.0492525100708, "global_step": 401422, "epoch": 2389} {"train_loss": -12.550322532653809, "global_step": 401423, "epoch": 2389} {"train_loss": -12.315851211547852, "global_step": 401424, "epoch": 2389} {"train_loss": -12.662481307983398, "global_step": 401425, "epoch": 2389} {"train_loss": -12.293333053588867, "global_step": 401426, "epoch": 2389} {"train_loss": -12.827567100524902, "global_step": 401427, "epoch": 2389} {"train_loss": -12.514653205871582, "global_step": 401428, "epoch": 2389} {"train_loss": -12.718465805053711, "global_step": 401429, "epoch": 2389} {"train_loss": -12.587369918823242, "global_step": 401430, "epoch": 2389} {"train_loss": -12.65926456451416, "global_step": 401431, "epoch": 2389} {"train_loss": -12.668828964233398, "global_step": 401432, "epoch": 2389} {"train_loss": -12.655561447143555, "global_step": 401433, "epoch": 2389} {"train_loss": -12.673809051513672, "global_step": 401434, "epoch": 2389} {"train_loss": -12.788172721862793, "global_step": 401435, "epoch": 2389} {"train_loss": -12.713998794555664, "global_step": 401436, "epoch": 2389} {"train_loss": -12.750726699829102, "global_step": 401437, "epoch": 2389} {"train_loss": -12.617183685302734, "global_step": 401438, "epoch": 2389} {"train_loss": -12.525012969970703, "global_step": 401439, "epoch": 2389} {"train_loss": -12.317228317260742, "global_step": 401440, "epoch": 2389} {"train_loss": -12.738771438598633, "global_step": 401441, "epoch": 2389} {"train_loss": -12.64139175415039, "global_step": 401442, "epoch": 2389} {"train_loss": -12.670351028442383, "global_step": 401443, "epoch": 2389} {"train_loss": -12.633816719055176, "global_step": 401444, "epoch": 2389} {"train_loss": -12.655673027038574, "global_step": 401445, "epoch": 2389} {"train_loss": -12.490869522094727, "global_step": 401446, "epoch": 2389} {"train_loss": -12.586828231811523, "global_step": 401447, "epoch": 2389} {"train_loss": -12.264996528625488, "global_step": 401448, "epoch": 2389} {"train_loss": -12.111296653747559, "global_step": 401449, "epoch": 2389} {"train_loss": -12.47362232208252, "global_step": 401450, "epoch": 2389} {"train_loss": -12.876409530639648, "global_step": 401451, "epoch": 2389} {"train_loss": -12.116006851196289, "global_step": 401452, "epoch": 2389} {"train_loss": -12.488241195678711, "global_step": 401453, "epoch": 2389} {"train_loss": -12.022314071655273, "global_step": 401454, "epoch": 2389} {"train_loss": -12.701346397399902, "global_step": 401455, "epoch": 2389} {"train_loss": -12.140256881713867, "global_step": 401456, "epoch": 2389} {"train_loss": -12.641908645629883, "global_step": 401457, "epoch": 2389} {"train_loss": -12.132024765014648, "global_step": 401458, "epoch": 2389} {"train_loss": -12.373346328735352, "global_step": 401459, "epoch": 2389} {"train_loss": -12.409327507019043, "global_step": 401460, "epoch": 2389} {"train_loss": -12.31747055053711, "global_step": 401461, "epoch": 2389} {"train_loss": -11.088592529296875, "global_step": 401462, "epoch": 2389} {"train_loss": -12.454185485839844, "global_step": 401463, "epoch": 2389} {"train_loss": -12.115575790405273, "global_step": 401464, "epoch": 2389} {"train_loss": -12.154239654541016, "global_step": 401465, "epoch": 2389} {"train_loss": -11.581462860107422, "global_step": 401466, "epoch": 2389} {"train_loss": -12.171900749206543, "global_step": 401467, "epoch": 2389} {"train_loss": -12.414273262023926, "global_step": 401468, "epoch": 2389} {"train_loss": -11.818845748901367, "global_step": 401469, "epoch": 2389} {"train_loss": -11.37399673461914, "global_step": 401470, "epoch": 2389} {"train_loss": -12.173036575317383, "global_step": 401471, "epoch": 2389} {"train_loss": -12.700211524963379, "global_step": 401472, "epoch": 2389} {"train_loss": -12.212738037109375, "global_step": 401473, "epoch": 2389} {"train_loss": -12.457826614379883, "global_step": 401474, "epoch": 2389} {"train_loss": -12.776092529296875, "global_step": 401475, "epoch": 2389} {"train_loss": -12.519742965698242, "global_step": 401476, "epoch": 2389} {"train_loss": -12.478893280029297, "global_step": 401477, "epoch": 2389} {"train_loss": -12.125337600708008, "global_step": 401478, "epoch": 2389} {"train_loss": -12.919000625610352, "global_step": 401479, "epoch": 2389} {"train_loss": -12.5244722366333, "global_step": 401480, "epoch": 2389} {"train_loss": -12.592430114746094, "global_step": 401481, "epoch": 2389} {"train_loss": -12.69066047668457, "global_step": 401482, "epoch": 2389} {"train_loss": -12.42786979675293, "global_step": 401483, "epoch": 2389} {"train_loss": -12.404094696044922, "global_step": 401484, "epoch": 2389} {"train_loss": -12.64620304107666, "global_step": 401485, "epoch": 2389} {"train_loss": -12.794711112976074, "global_step": 401486, "epoch": 2389} {"train_loss": -12.46549129486084, "global_step": 401487, "epoch": 2389} {"train_loss": -12.681764602661133, "global_step": 401488, "epoch": 2389} {"train_loss": -12.103311538696289, "global_step": 401489, "epoch": 2389} {"train_loss": -12.410806655883789, "global_step": 401490, "epoch": 2389} {"train_loss": -12.06134033203125, "global_step": 401491, "epoch": 2389} {"train_loss": -12.440146446228027, "global_step": 401492, "epoch": 2389} {"train_loss": -12.580202102661133, "global_step": 401493, "epoch": 2389} {"train_loss": -12.64069938659668, "global_step": 401494, "epoch": 2389} {"train_loss": -12.39471435546875, "global_step": 401495, "epoch": 2389} {"train_loss": -12.511602401733398, "global_step": 401496, "epoch": 2389} {"train_loss": -12.178852081298828, "global_step": 401497, "epoch": 2389} {"train_loss": -11.060184478759766, "global_step": 401498, "epoch": 2389} {"train_loss": -11.551372528076172, "global_step": 401499, "epoch": 2389} {"train_loss": -11.970743179321289, "global_step": 401500, "epoch": 2389} {"train_loss": -11.132148742675781, "global_step": 401501, "epoch": 2389} {"train_loss": -10.46463394165039, "global_step": 401502, "epoch": 2389} {"train_loss": -11.281349182128906, "global_step": 401503, "epoch": 2389} {"train_loss": -10.654659271240234, "global_step": 401504, "epoch": 2389} {"train_loss": -10.659188270568848, "global_step": 401505, "epoch": 2389} {"train_loss": -9.640913009643555, "global_step": 401506, "epoch": 2389} {"train_loss": -10.587236404418945, "global_step": 401507, "epoch": 2389} {"train_loss": -10.056264877319336, "global_step": 401508, "epoch": 2389} {"train_loss": -10.035675048828125, "global_step": 401509, "epoch": 2389} {"train_loss": -9.752819061279297, "global_step": 401510, "epoch": 2389} {"train_loss": -12.113752365112305, "global_step": 401511, "epoch": 2389} {"train_loss": -10.571535110473633, "global_step": 401512, "epoch": 2389} {"train_loss": -11.101934432983398, "global_step": 401513, "epoch": 2389} {"train_loss": -11.111204147338867, "global_step": 401514, "epoch": 2389} {"train_loss": -11.819254875183105, "global_step": 401515, "epoch": 2389} {"train_loss": -10.783756256103516, "global_step": 401516, "epoch": 2389} {"train_loss": -11.343830108642578, "global_step": 401517, "epoch": 2389} {"train_loss": -11.961503982543945, "global_step": 401518, "epoch": 2389} {"train_loss": -11.973604230653672, "global_step": 401519, "epoch": 2389, "val_loss": 297850.875} {"train_loss": -12.105680465698242, "global_step": 401520, "epoch": 2390} {"train_loss": -11.066679000854492, "global_step": 401521, "epoch": 2390} {"train_loss": -11.898265838623047, "global_step": 401522, "epoch": 2390} {"train_loss": -11.368608474731445, "global_step": 401523, "epoch": 2390} {"train_loss": -11.753101348876953, "global_step": 401524, "epoch": 2390} {"train_loss": -11.557952880859375, "global_step": 401525, "epoch": 2390} {"train_loss": -11.519227027893066, "global_step": 401526, "epoch": 2390} {"train_loss": -11.102334022521973, "global_step": 401527, "epoch": 2390} {"train_loss": -11.190324783325195, "global_step": 401528, "epoch": 2390} {"train_loss": -12.021766662597656, "global_step": 401529, "epoch": 2390} {"train_loss": -11.758100509643555, "global_step": 401530, "epoch": 2390} {"train_loss": -11.823138236999512, "global_step": 401531, "epoch": 2390} {"train_loss": -10.585086822509766, "global_step": 401532, "epoch": 2390} {"train_loss": -11.976364135742188, "global_step": 401533, "epoch": 2390} {"train_loss": -10.854928970336914, "global_step": 401534, "epoch": 2390} {"train_loss": -12.386232376098633, "global_step": 401535, "epoch": 2390} {"train_loss": -11.695182800292969, "global_step": 401536, "epoch": 2390} {"train_loss": -12.15955924987793, "global_step": 401537, "epoch": 2390} {"train_loss": -11.70804214477539, "global_step": 401538, "epoch": 2390} {"train_loss": -12.320735931396484, "global_step": 401539, "epoch": 2390} {"train_loss": -12.065621376037598, "global_step": 401540, "epoch": 2390} {"train_loss": -11.888422012329102, "global_step": 401541, "epoch": 2390} {"train_loss": -12.060966491699219, "global_step": 401542, "epoch": 2390} {"train_loss": -12.077129364013672, "global_step": 401543, "epoch": 2390} {"train_loss": -12.36945629119873, "global_step": 401544, "epoch": 2390} {"train_loss": -12.262821197509766, "global_step": 401545, "epoch": 2390} {"train_loss": -12.2915678024292, "global_step": 401546, "epoch": 2390} {"train_loss": -12.579241752624512, "global_step": 401547, "epoch": 2390} {"train_loss": -12.39786148071289, "global_step": 401548, "epoch": 2390} {"train_loss": -12.41018009185791, "global_step": 401549, "epoch": 2390} {"train_loss": -12.545175552368164, "global_step": 401550, "epoch": 2390} {"train_loss": -12.095268249511719, "global_step": 401551, "epoch": 2390} {"train_loss": -12.294235229492188, "global_step": 401552, "epoch": 2390} {"train_loss": -12.270248413085938, "global_step": 401553, "epoch": 2390} {"train_loss": -12.584003448486328, "global_step": 401554, "epoch": 2390} {"train_loss": -12.381979942321777, "global_step": 401555, "epoch": 2390} {"train_loss": -12.309263229370117, "global_step": 401556, "epoch": 2390} {"train_loss": -12.5188570022583, "global_step": 401557, "epoch": 2390} {"train_loss": -12.400951385498047, "global_step": 401558, "epoch": 2390} {"train_loss": -12.640798568725586, "global_step": 401559, "epoch": 2390} {"train_loss": -12.300468444824219, "global_step": 401560, "epoch": 2390} {"train_loss": -12.639838218688965, "global_step": 401561, "epoch": 2390} {"train_loss": -12.659936904907227, "global_step": 401562, "epoch": 2390} {"train_loss": -12.63866901397705, "global_step": 401563, "epoch": 2390} {"train_loss": -12.725341796875, "global_step": 401564, "epoch": 2390} {"train_loss": -12.7220458984375, "global_step": 401565, "epoch": 2390} {"train_loss": -12.621922492980957, "global_step": 401566, "epoch": 2390} {"train_loss": -12.460419654846191, "global_step": 401567, "epoch": 2390} {"train_loss": -12.785667419433594, "global_step": 401568, "epoch": 2390} {"train_loss": -12.746408462524414, "global_step": 401569, "epoch": 2390} {"train_loss": -12.739486694335938, "global_step": 401570, "epoch": 2390} {"train_loss": -12.738709449768066, "global_step": 401571, "epoch": 2390} {"train_loss": -12.696725845336914, "global_step": 401572, "epoch": 2390} {"train_loss": -12.702249526977539, "global_step": 401573, "epoch": 2390} {"train_loss": -12.686813354492188, "global_step": 401574, "epoch": 2390} {"train_loss": -12.590211868286133, "global_step": 401575, "epoch": 2390} {"train_loss": -12.699264526367188, "global_step": 401576, "epoch": 2390} {"train_loss": -12.453132629394531, "global_step": 401577, "epoch": 2390} {"train_loss": -12.183385848999023, "global_step": 401578, "epoch": 2390} {"train_loss": -12.38695240020752, "global_step": 401579, "epoch": 2390} {"train_loss": -12.338227272033691, "global_step": 401580, "epoch": 2390} {"train_loss": -12.650964736938477, "global_step": 401581, "epoch": 2390} {"train_loss": -12.692461967468262, "global_step": 401582, "epoch": 2390} {"train_loss": -12.553448677062988, "global_step": 401583, "epoch": 2390} {"train_loss": -12.497798919677734, "global_step": 401584, "epoch": 2390} {"train_loss": -12.429462432861328, "global_step": 401585, "epoch": 2390} {"train_loss": -12.368526458740234, "global_step": 401586, "epoch": 2390} {"train_loss": -11.96743392944336, "global_step": 401587, "epoch": 2390} {"train_loss": -12.320622444152832, "global_step": 401588, "epoch": 2390} {"train_loss": -12.156675338745117, "global_step": 401589, "epoch": 2390} {"train_loss": -11.69846248626709, "global_step": 401590, "epoch": 2390} {"train_loss": -11.833105087280273, "global_step": 401591, "epoch": 2390} {"train_loss": -12.069275856018066, "global_step": 401592, "epoch": 2390} {"train_loss": -12.597579956054688, "global_step": 401593, "epoch": 2390} {"train_loss": -11.645879745483398, "global_step": 401594, "epoch": 2390} {"train_loss": -11.660934448242188, "global_step": 401595, "epoch": 2390} {"train_loss": -10.847892761230469, "global_step": 401596, "epoch": 2390} {"train_loss": -10.523902893066406, "global_step": 401597, "epoch": 2390} {"train_loss": -10.235136985778809, "global_step": 401598, "epoch": 2390} {"train_loss": -9.779083251953125, "global_step": 401599, "epoch": 2390} {"train_loss": -9.977913856506348, "global_step": 401600, "epoch": 2390} {"train_loss": -11.69445514678955, "global_step": 401601, "epoch": 2390} {"train_loss": -8.136338233947754, "global_step": 401602, "epoch": 2390} {"train_loss": -10.405355453491211, "global_step": 401603, "epoch": 2390} {"train_loss": -6.535252571105957, "global_step": 401604, "epoch": 2390} {"train_loss": -6.665147304534912, "global_step": 401605, "epoch": 2390} {"train_loss": -6.800082206726074, "global_step": 401606, "epoch": 2390} {"train_loss": -7.005365371704102, "global_step": 401607, "epoch": 2390} {"train_loss": -7.010682106018066, "global_step": 401608, "epoch": 2390} {"train_loss": -7.913908004760742, "global_step": 401609, "epoch": 2390} {"train_loss": -7.208693981170654, "global_step": 401610, "epoch": 2390} {"train_loss": -7.675596237182617, "global_step": 401611, "epoch": 2390} {"train_loss": -7.280859470367432, "global_step": 401612, "epoch": 2390} {"train_loss": -7.660416126251221, "global_step": 401613, "epoch": 2390} {"train_loss": -7.9970808029174805, "global_step": 401614, "epoch": 2390} {"train_loss": -8.074844360351562, "global_step": 401615, "epoch": 2390} {"train_loss": -8.50595474243164, "global_step": 401616, "epoch": 2390} {"train_loss": -8.288176536560059, "global_step": 401617, "epoch": 2390} {"train_loss": -7.932878494262695, "global_step": 401618, "epoch": 2390} {"train_loss": -8.198805809020996, "global_step": 401619, "epoch": 2390} {"train_loss": -8.603120803833008, "global_step": 401620, "epoch": 2390} {"train_loss": -8.829351425170898, "global_step": 401621, "epoch": 2390} {"train_loss": -8.832468032836914, "global_step": 401622, "epoch": 2390} {"train_loss": -8.632832527160645, "global_step": 401623, "epoch": 2390} {"train_loss": -9.212352752685547, "global_step": 401624, "epoch": 2390} {"train_loss": -9.076603889465332, "global_step": 401625, "epoch": 2390} {"train_loss": -9.364635467529297, "global_step": 401626, "epoch": 2390} {"train_loss": -9.53642463684082, "global_step": 401627, "epoch": 2390} {"train_loss": -9.434618949890137, "global_step": 401628, "epoch": 2390} {"train_loss": -9.429640769958496, "global_step": 401629, "epoch": 2390} {"train_loss": -9.41282844543457, "global_step": 401630, "epoch": 2390} {"train_loss": -10.13878345489502, "global_step": 401631, "epoch": 2390} {"train_loss": -10.41763687133789, "global_step": 401632, "epoch": 2390} {"train_loss": -10.242332458496094, "global_step": 401633, "epoch": 2390} {"train_loss": -10.654630661010742, "global_step": 401634, "epoch": 2390} {"train_loss": -10.651382446289062, "global_step": 401635, "epoch": 2390} {"train_loss": -10.309103012084961, "global_step": 401636, "epoch": 2390} {"train_loss": -10.522319793701172, "global_step": 401637, "epoch": 2390} {"train_loss": -10.78276252746582, "global_step": 401638, "epoch": 2390} {"train_loss": -11.108481407165527, "global_step": 401639, "epoch": 2390} {"train_loss": -10.347644805908203, "global_step": 401640, "epoch": 2390} {"train_loss": -10.548593521118164, "global_step": 401641, "epoch": 2390} {"train_loss": -11.151440620422363, "global_step": 401642, "epoch": 2390} {"train_loss": -10.900863647460938, "global_step": 401643, "epoch": 2390} {"train_loss": -9.942815780639648, "global_step": 401644, "epoch": 2390} {"train_loss": -11.073114395141602, "global_step": 401645, "epoch": 2390} {"train_loss": -11.130992889404297, "global_step": 401646, "epoch": 2390} {"train_loss": -11.071918487548828, "global_step": 401647, "epoch": 2390} {"train_loss": -11.037591934204102, "global_step": 401648, "epoch": 2390} {"train_loss": -11.512163162231445, "global_step": 401649, "epoch": 2390} {"train_loss": -10.82520866394043, "global_step": 401650, "epoch": 2390} {"train_loss": -11.044048309326172, "global_step": 401651, "epoch": 2390} {"train_loss": -11.537745475769043, "global_step": 401652, "epoch": 2390} {"train_loss": -11.55484390258789, "global_step": 401653, "epoch": 2390} {"train_loss": -11.59204387664795, "global_step": 401654, "epoch": 2390} {"train_loss": -11.356731414794922, "global_step": 401655, "epoch": 2390} {"train_loss": -10.829730033874512, "global_step": 401656, "epoch": 2390} {"train_loss": -11.705188751220703, "global_step": 401657, "epoch": 2390} {"train_loss": -11.337410926818848, "global_step": 401658, "epoch": 2390} {"train_loss": -11.650568008422852, "global_step": 401659, "epoch": 2390} {"train_loss": -11.561406135559082, "global_step": 401660, "epoch": 2390} {"train_loss": -11.537904739379883, "global_step": 401661, "epoch": 2390} {"train_loss": -11.7159423828125, "global_step": 401662, "epoch": 2390} {"train_loss": -11.610147476196289, "global_step": 401663, "epoch": 2390} {"train_loss": -11.744718551635742, "global_step": 401664, "epoch": 2390} {"train_loss": -11.575454711914062, "global_step": 401665, "epoch": 2390} {"train_loss": -11.671295166015625, "global_step": 401666, "epoch": 2390} {"train_loss": -11.600915908813477, "global_step": 401667, "epoch": 2390} {"train_loss": -11.866935729980469, "global_step": 401668, "epoch": 2390} {"train_loss": -11.962366104125977, "global_step": 401669, "epoch": 2390} {"train_loss": -12.412578582763672, "global_step": 401670, "epoch": 2390} {"train_loss": -11.7398681640625, "global_step": 401671, "epoch": 2390} {"train_loss": -12.368692398071289, "global_step": 401672, "epoch": 2390} {"train_loss": -12.176654815673828, "global_step": 401673, "epoch": 2390} {"train_loss": -11.889158248901367, "global_step": 401674, "epoch": 2390} {"train_loss": -12.225257873535156, "global_step": 401675, "epoch": 2390} {"train_loss": -12.386138916015625, "global_step": 401676, "epoch": 2390} {"train_loss": -11.962137222290039, "global_step": 401677, "epoch": 2390} {"train_loss": -12.2474946975708, "global_step": 401678, "epoch": 2390} {"train_loss": -12.30828857421875, "global_step": 401679, "epoch": 2390} {"train_loss": -12.374495506286621, "global_step": 401680, "epoch": 2390} {"train_loss": -12.589883804321289, "global_step": 401681, "epoch": 2390} {"train_loss": -12.172727584838867, "global_step": 401682, "epoch": 2390} {"train_loss": -12.242006301879883, "global_step": 401683, "epoch": 2390} {"train_loss": -12.484720230102539, "global_step": 401684, "epoch": 2390} {"train_loss": -12.39525032043457, "global_step": 401685, "epoch": 2390} {"train_loss": -12.556291580200195, "global_step": 401686, "epoch": 2390} {"train_loss": -11.217012093180703, "global_step": 401687, "epoch": 2390, "val_loss": 300717.0, "train_action_mse_error": 1.754096269607544} {"train_loss": -12.446065902709961, "global_step": 401688, "epoch": 2391} {"train_loss": -12.628321647644043, "global_step": 401689, "epoch": 2391} {"train_loss": -12.360936164855957, "global_step": 401690, "epoch": 2391} {"train_loss": -12.400785446166992, "global_step": 401691, "epoch": 2391} {"train_loss": -12.466032028198242, "global_step": 401692, "epoch": 2391} {"train_loss": -12.557785987854004, "global_step": 401693, "epoch": 2391} {"train_loss": -12.60887336730957, "global_step": 401694, "epoch": 2391} {"train_loss": -12.323040008544922, "global_step": 401695, "epoch": 2391} {"train_loss": -12.33823013305664, "global_step": 401696, "epoch": 2391} {"train_loss": -12.336448669433594, "global_step": 401697, "epoch": 2391} {"train_loss": -12.394886016845703, "global_step": 401698, "epoch": 2391} {"train_loss": -12.41706657409668, "global_step": 401699, "epoch": 2391} {"train_loss": -12.464132308959961, "global_step": 401700, "epoch": 2391} {"train_loss": -12.089644432067871, "global_step": 401701, "epoch": 2391} {"train_loss": -12.644287109375, "global_step": 401702, "epoch": 2391} {"train_loss": -12.381004333496094, "global_step": 401703, "epoch": 2391} {"train_loss": -12.574017524719238, "global_step": 401704, "epoch": 2391} {"train_loss": -12.543935775756836, "global_step": 401705, "epoch": 2391} {"train_loss": -12.50584602355957, "global_step": 401706, "epoch": 2391} {"train_loss": -12.623213768005371, "global_step": 401707, "epoch": 2391} {"train_loss": -12.721335411071777, "global_step": 401708, "epoch": 2391} {"train_loss": -12.645306587219238, "global_step": 401709, "epoch": 2391} {"train_loss": -12.28896713256836, "global_step": 401710, "epoch": 2391} {"train_loss": -12.80605697631836, "global_step": 401711, "epoch": 2391} {"train_loss": -12.76022720336914, "global_step": 401712, "epoch": 2391} {"train_loss": -12.593358993530273, "global_step": 401713, "epoch": 2391} {"train_loss": -12.630334854125977, "global_step": 401714, "epoch": 2391} {"train_loss": -12.600476264953613, "global_step": 401715, "epoch": 2391} {"train_loss": -12.378296852111816, "global_step": 401716, "epoch": 2391} {"train_loss": -12.641380310058594, "global_step": 401717, "epoch": 2391} {"train_loss": -12.249418258666992, "global_step": 401718, "epoch": 2391} {"train_loss": -12.279905319213867, "global_step": 401719, "epoch": 2391} {"train_loss": -12.098812103271484, "global_step": 401720, "epoch": 2391} {"train_loss": -11.940189361572266, "global_step": 401721, "epoch": 2391} {"train_loss": -12.56854248046875, "global_step": 401722, "epoch": 2391} {"train_loss": -11.774153709411621, "global_step": 401723, "epoch": 2391} {"train_loss": -11.752119064331055, "global_step": 401724, "epoch": 2391} {"train_loss": -11.888757705688477, "global_step": 401725, "epoch": 2391} {"train_loss": -11.027599334716797, "global_step": 401726, "epoch": 2391} {"train_loss": -11.948814392089844, "global_step": 401727, "epoch": 2391} {"train_loss": -11.606648445129395, "global_step": 401728, "epoch": 2391} {"train_loss": -12.393838882446289, "global_step": 401729, "epoch": 2391} {"train_loss": -12.397903442382812, "global_step": 401730, "epoch": 2391} {"train_loss": -12.118642807006836, "global_step": 401731, "epoch": 2391} {"train_loss": -12.61458969116211, "global_step": 401732, "epoch": 2391} {"train_loss": -11.755462646484375, "global_step": 401733, "epoch": 2391} {"train_loss": -11.588908195495605, "global_step": 401734, "epoch": 2391} {"train_loss": -12.648797035217285, "global_step": 401735, "epoch": 2391} {"train_loss": -11.095222473144531, "global_step": 401736, "epoch": 2391} {"train_loss": -12.002685546875, "global_step": 401737, "epoch": 2391} {"train_loss": -11.000728607177734, "global_step": 401738, "epoch": 2391} {"train_loss": -11.295223236083984, "global_step": 401739, "epoch": 2391} {"train_loss": -11.527488708496094, "global_step": 401740, "epoch": 2391} {"train_loss": -11.455142974853516, "global_step": 401741, "epoch": 2391} {"train_loss": -11.94147777557373, "global_step": 401742, "epoch": 2391} {"train_loss": -11.810697555541992, "global_step": 401743, "epoch": 2391} {"train_loss": -11.51449203491211, "global_step": 401744, "epoch": 2391} {"train_loss": -11.558612823486328, "global_step": 401745, "epoch": 2391} {"train_loss": -10.896828651428223, "global_step": 401746, "epoch": 2391} {"train_loss": -11.51624870300293, "global_step": 401747, "epoch": 2391} {"train_loss": -11.670536041259766, "global_step": 401748, "epoch": 2391} {"train_loss": -11.969352722167969, "global_step": 401749, "epoch": 2391} {"train_loss": -11.771491050720215, "global_step": 401750, "epoch": 2391} {"train_loss": -11.49341106414795, "global_step": 401751, "epoch": 2391} {"train_loss": -11.909255981445312, "global_step": 401752, "epoch": 2391} {"train_loss": -11.496395111083984, "global_step": 401753, "epoch": 2391} {"train_loss": -12.346353530883789, "global_step": 401754, "epoch": 2391} {"train_loss": -11.673299789428711, "global_step": 401755, "epoch": 2391} {"train_loss": -11.750540733337402, "global_step": 401756, "epoch": 2391} {"train_loss": -11.742271423339844, "global_step": 401757, "epoch": 2391} {"train_loss": -11.746603012084961, "global_step": 401758, "epoch": 2391} {"train_loss": -11.500886917114258, "global_step": 401759, "epoch": 2391} {"train_loss": -11.422937393188477, "global_step": 401760, "epoch": 2391} {"train_loss": -11.772119522094727, "global_step": 401761, "epoch": 2391} {"train_loss": -11.68137264251709, "global_step": 401762, "epoch": 2391} {"train_loss": -11.195761680603027, "global_step": 401763, "epoch": 2391} {"train_loss": -12.156414985656738, "global_step": 401764, "epoch": 2391} {"train_loss": -11.7371826171875, "global_step": 401765, "epoch": 2391} {"train_loss": -11.937324523925781, "global_step": 401766, "epoch": 2391} {"train_loss": -11.892361640930176, "global_step": 401767, "epoch": 2391} {"train_loss": -11.377616882324219, "global_step": 401768, "epoch": 2391} {"train_loss": -12.292863845825195, "global_step": 401769, "epoch": 2391} {"train_loss": -12.023445129394531, "global_step": 401770, "epoch": 2391} {"train_loss": -12.024789810180664, "global_step": 401771, "epoch": 2391} {"train_loss": -11.985933303833008, "global_step": 401772, "epoch": 2391} {"train_loss": -11.896783828735352, "global_step": 401773, "epoch": 2391} {"train_loss": -11.868220329284668, "global_step": 401774, "epoch": 2391} {"train_loss": -11.75792121887207, "global_step": 401775, "epoch": 2391} {"train_loss": -12.095298767089844, "global_step": 401776, "epoch": 2391} {"train_loss": -12.15892505645752, "global_step": 401777, "epoch": 2391} {"train_loss": -11.917400360107422, "global_step": 401778, "epoch": 2391} {"train_loss": -12.480733871459961, "global_step": 401779, "epoch": 2391} {"train_loss": -12.107808113098145, "global_step": 401780, "epoch": 2391} {"train_loss": -12.292510032653809, "global_step": 401781, "epoch": 2391} {"train_loss": -12.25074291229248, "global_step": 401782, "epoch": 2391} {"train_loss": -12.267770767211914, "global_step": 401783, "epoch": 2391} {"train_loss": -12.345071792602539, "global_step": 401784, "epoch": 2391} {"train_loss": -12.348793029785156, "global_step": 401785, "epoch": 2391} {"train_loss": -11.988548278808594, "global_step": 401786, "epoch": 2391} {"train_loss": -12.07729721069336, "global_step": 401787, "epoch": 2391} {"train_loss": -12.118000030517578, "global_step": 401788, "epoch": 2391} {"train_loss": -11.92348861694336, "global_step": 401789, "epoch": 2391} {"train_loss": -12.470523834228516, "global_step": 401790, "epoch": 2391} {"train_loss": -11.73652458190918, "global_step": 401791, "epoch": 2391} {"train_loss": -12.395515441894531, "global_step": 401792, "epoch": 2391} {"train_loss": -12.09522533416748, "global_step": 401793, "epoch": 2391} {"train_loss": -11.959905624389648, "global_step": 401794, "epoch": 2391} {"train_loss": -12.39999008178711, "global_step": 401795, "epoch": 2391} {"train_loss": -12.190811157226562, "global_step": 401796, "epoch": 2391} {"train_loss": -12.65545654296875, "global_step": 401797, "epoch": 2391} {"train_loss": -11.885374069213867, "global_step": 401798, "epoch": 2391} {"train_loss": -12.495687484741211, "global_step": 401799, "epoch": 2391} {"train_loss": -12.106308937072754, "global_step": 401800, "epoch": 2391} {"train_loss": -12.350889205932617, "global_step": 401801, "epoch": 2391} {"train_loss": -12.440561294555664, "global_step": 401802, "epoch": 2391} {"train_loss": -12.264714241027832, "global_step": 401803, "epoch": 2391} {"train_loss": -12.418136596679688, "global_step": 401804, "epoch": 2391} {"train_loss": -12.397025108337402, "global_step": 401805, "epoch": 2391} {"train_loss": -12.466373443603516, "global_step": 401806, "epoch": 2391} {"train_loss": -12.437154769897461, "global_step": 401807, "epoch": 2391} {"train_loss": -12.48971176147461, "global_step": 401808, "epoch": 2391} {"train_loss": -12.46681022644043, "global_step": 401809, "epoch": 2391} {"train_loss": -12.512601852416992, "global_step": 401810, "epoch": 2391} {"train_loss": -12.652487754821777, "global_step": 401811, "epoch": 2391} {"train_loss": -12.481240272521973, "global_step": 401812, "epoch": 2391} {"train_loss": -12.444694519042969, "global_step": 401813, "epoch": 2391} {"train_loss": -12.431193351745605, "global_step": 401814, "epoch": 2391} {"train_loss": -12.451410293579102, "global_step": 401815, "epoch": 2391} {"train_loss": -12.657731056213379, "global_step": 401816, "epoch": 2391} {"train_loss": -12.577295303344727, "global_step": 401817, "epoch": 2391} {"train_loss": -12.072978973388672, "global_step": 401818, "epoch": 2391} {"train_loss": -12.66720962524414, "global_step": 401819, "epoch": 2391} {"train_loss": -12.722492218017578, "global_step": 401820, "epoch": 2391} {"train_loss": -12.778576850891113, "global_step": 401821, "epoch": 2391} {"train_loss": -12.41572380065918, "global_step": 401822, "epoch": 2391} {"train_loss": -12.563997268676758, "global_step": 401823, "epoch": 2391} {"train_loss": -12.835027694702148, "global_step": 401824, "epoch": 2391} {"train_loss": -12.519306182861328, "global_step": 401825, "epoch": 2391} {"train_loss": -12.649667739868164, "global_step": 401826, "epoch": 2391} {"train_loss": -12.551088333129883, "global_step": 401827, "epoch": 2391} {"train_loss": -12.22423267364502, "global_step": 401828, "epoch": 2391} {"train_loss": -12.366641998291016, "global_step": 401829, "epoch": 2391} {"train_loss": -12.470272064208984, "global_step": 401830, "epoch": 2391} {"train_loss": -12.705522537231445, "global_step": 401831, "epoch": 2391} {"train_loss": -12.410218238830566, "global_step": 401832, "epoch": 2391} {"train_loss": -11.932806968688965, "global_step": 401833, "epoch": 2391} {"train_loss": -12.300763130187988, "global_step": 401834, "epoch": 2391} {"train_loss": -12.68115234375, "global_step": 401835, "epoch": 2391} {"train_loss": -12.486895561218262, "global_step": 401836, "epoch": 2391} {"train_loss": -12.282491683959961, "global_step": 401837, "epoch": 2391} {"train_loss": -12.495361328125, "global_step": 401838, "epoch": 2391} {"train_loss": -12.659696578979492, "global_step": 401839, "epoch": 2391} {"train_loss": -12.059998512268066, "global_step": 401840, "epoch": 2391} {"train_loss": -12.4555082321167, "global_step": 401841, "epoch": 2391} {"train_loss": -12.426979064941406, "global_step": 401842, "epoch": 2391} {"train_loss": -12.460277557373047, "global_step": 401843, "epoch": 2391} {"train_loss": -12.35203742980957, "global_step": 401844, "epoch": 2391} {"train_loss": -12.721930503845215, "global_step": 401845, "epoch": 2391} {"train_loss": -12.61149787902832, "global_step": 401846, "epoch": 2391} {"train_loss": -12.206742286682129, "global_step": 401847, "epoch": 2391} {"train_loss": -12.101217269897461, "global_step": 401848, "epoch": 2391} {"train_loss": -12.360452651977539, "global_step": 401849, "epoch": 2391} {"train_loss": -12.26952075958252, "global_step": 401850, "epoch": 2391} {"train_loss": -12.284461975097656, "global_step": 401851, "epoch": 2391} {"train_loss": -12.350395202636719, "global_step": 401852, "epoch": 2391} {"train_loss": -12.134294509887695, "global_step": 401853, "epoch": 2391} {"train_loss": -12.251890182495117, "global_step": 401854, "epoch": 2391} {"train_loss": -12.193458000818888, "global_step": 401855, "epoch": 2391, "val_loss": 304059.53125} {"train_loss": -11.284374237060547, "global_step": 401856, "epoch": 2392} {"train_loss": -12.280315399169922, "global_step": 401857, "epoch": 2392} {"train_loss": -12.772577285766602, "global_step": 401858, "epoch": 2392} {"train_loss": -11.9759521484375, "global_step": 401859, "epoch": 2392} {"train_loss": -12.085345268249512, "global_step": 401860, "epoch": 2392} {"train_loss": -11.831260681152344, "global_step": 401861, "epoch": 2392} {"train_loss": -11.874106407165527, "global_step": 401862, "epoch": 2392} {"train_loss": -12.406149864196777, "global_step": 401863, "epoch": 2392} {"train_loss": -12.399415016174316, "global_step": 401864, "epoch": 2392} {"train_loss": -12.595013618469238, "global_step": 401865, "epoch": 2392} {"train_loss": -12.124971389770508, "global_step": 401866, "epoch": 2392} {"train_loss": -12.772122383117676, "global_step": 401867, "epoch": 2392} {"train_loss": -12.32977294921875, "global_step": 401868, "epoch": 2392} {"train_loss": -12.574271202087402, "global_step": 401869, "epoch": 2392} {"train_loss": -12.35958194732666, "global_step": 401870, "epoch": 2392} {"train_loss": -12.494071960449219, "global_step": 401871, "epoch": 2392} {"train_loss": -12.575474739074707, "global_step": 401872, "epoch": 2392} {"train_loss": -12.649307250976562, "global_step": 401873, "epoch": 2392} {"train_loss": -12.431307792663574, "global_step": 401874, "epoch": 2392} {"train_loss": -12.467113494873047, "global_step": 401875, "epoch": 2392} {"train_loss": -12.287996292114258, "global_step": 401876, "epoch": 2392} {"train_loss": -12.019954681396484, "global_step": 401877, "epoch": 2392} {"train_loss": -11.624290466308594, "global_step": 401878, "epoch": 2392} {"train_loss": -11.745410919189453, "global_step": 401879, "epoch": 2392} {"train_loss": -11.846210479736328, "global_step": 401880, "epoch": 2392} {"train_loss": -10.225189208984375, "global_step": 401881, "epoch": 2392} {"train_loss": -11.997231483459473, "global_step": 401882, "epoch": 2392} {"train_loss": -11.785501480102539, "global_step": 401883, "epoch": 2392} {"train_loss": -10.665594100952148, "global_step": 401884, "epoch": 2392} {"train_loss": -10.50478458404541, "global_step": 401885, "epoch": 2392} {"train_loss": -10.792101860046387, "global_step": 401886, "epoch": 2392} {"train_loss": -11.959770202636719, "global_step": 401887, "epoch": 2392} {"train_loss": -11.393858909606934, "global_step": 401888, "epoch": 2392} {"train_loss": -11.246886253356934, "global_step": 401889, "epoch": 2392} {"train_loss": -11.073406219482422, "global_step": 401890, "epoch": 2392} {"train_loss": -11.037908554077148, "global_step": 401891, "epoch": 2392} {"train_loss": -10.071592330932617, "global_step": 401892, "epoch": 2392} {"train_loss": -11.537307739257812, "global_step": 401893, "epoch": 2392} {"train_loss": -11.46928596496582, "global_step": 401894, "epoch": 2392} {"train_loss": -11.926366806030273, "global_step": 401895, "epoch": 2392} {"train_loss": -10.927309036254883, "global_step": 401896, "epoch": 2392} {"train_loss": -11.722362518310547, "global_step": 401897, "epoch": 2392} {"train_loss": -11.662039756774902, "global_step": 401898, "epoch": 2392} {"train_loss": -11.271937370300293, "global_step": 401899, "epoch": 2392} {"train_loss": -11.919380187988281, "global_step": 401900, "epoch": 2392} {"train_loss": -11.074044227600098, "global_step": 401901, "epoch": 2392} {"train_loss": -11.99382209777832, "global_step": 401902, "epoch": 2392} {"train_loss": -10.887423515319824, "global_step": 401903, "epoch": 2392} {"train_loss": -11.962810516357422, "global_step": 401904, "epoch": 2392} {"train_loss": -11.464515686035156, "global_step": 401905, "epoch": 2392} {"train_loss": -11.351705551147461, "global_step": 401906, "epoch": 2392} {"train_loss": -11.860807418823242, "global_step": 401907, "epoch": 2392} {"train_loss": -11.451286315917969, "global_step": 401908, "epoch": 2392} {"train_loss": -12.080652236938477, "global_step": 401909, "epoch": 2392} {"train_loss": -11.68875503540039, "global_step": 401910, "epoch": 2392} {"train_loss": -11.966710090637207, "global_step": 401911, "epoch": 2392} {"train_loss": -11.41069221496582, "global_step": 401912, "epoch": 2392} {"train_loss": -11.418325424194336, "global_step": 401913, "epoch": 2392} {"train_loss": -11.85142707824707, "global_step": 401914, "epoch": 2392} {"train_loss": -11.858217239379883, "global_step": 401915, "epoch": 2392} {"train_loss": -12.029253005981445, "global_step": 401916, "epoch": 2392} {"train_loss": -11.415645599365234, "global_step": 401917, "epoch": 2392} {"train_loss": -11.600173950195312, "global_step": 401918, "epoch": 2392} {"train_loss": -12.256136894226074, "global_step": 401919, "epoch": 2392} {"train_loss": -11.503644943237305, "global_step": 401920, "epoch": 2392} {"train_loss": -12.292128562927246, "global_step": 401921, "epoch": 2392} {"train_loss": -11.672011375427246, "global_step": 401922, "epoch": 2392} {"train_loss": -11.958562850952148, "global_step": 401923, "epoch": 2392} {"train_loss": -12.171952247619629, "global_step": 401924, "epoch": 2392} {"train_loss": -11.587800979614258, "global_step": 401925, "epoch": 2392} {"train_loss": -12.534866333007812, "global_step": 401926, "epoch": 2392} {"train_loss": -12.064943313598633, "global_step": 401927, "epoch": 2392} {"train_loss": -12.21473503112793, "global_step": 401928, "epoch": 2392} {"train_loss": -12.380951881408691, "global_step": 401929, "epoch": 2392} {"train_loss": -11.972051620483398, "global_step": 401930, "epoch": 2392} {"train_loss": -12.07724380493164, "global_step": 401931, "epoch": 2392} {"train_loss": -12.315689086914062, "global_step": 401932, "epoch": 2392} {"train_loss": -12.206283569335938, "global_step": 401933, "epoch": 2392} {"train_loss": -12.49604606628418, "global_step": 401934, "epoch": 2392} {"train_loss": -12.315079689025879, "global_step": 401935, "epoch": 2392} {"train_loss": -12.450785636901855, "global_step": 401936, "epoch": 2392} {"train_loss": -12.335540771484375, "global_step": 401937, "epoch": 2392} {"train_loss": -12.369806289672852, "global_step": 401938, "epoch": 2392} {"train_loss": -12.32752513885498, "global_step": 401939, "epoch": 2392} {"train_loss": -12.618857383728027, "global_step": 401940, "epoch": 2392} {"train_loss": -12.539999008178711, "global_step": 401941, "epoch": 2392} {"train_loss": -12.495803833007812, "global_step": 401942, "epoch": 2392} {"train_loss": -12.395658493041992, "global_step": 401943, "epoch": 2392} {"train_loss": -12.480785369873047, "global_step": 401944, "epoch": 2392} {"train_loss": -12.667738914489746, "global_step": 401945, "epoch": 2392} {"train_loss": -12.45580768585205, "global_step": 401946, "epoch": 2392} {"train_loss": -12.522001266479492, "global_step": 401947, "epoch": 2392} {"train_loss": -12.362417221069336, "global_step": 401948, "epoch": 2392} {"train_loss": -12.363593101501465, "global_step": 401949, "epoch": 2392} {"train_loss": -12.588769912719727, "global_step": 401950, "epoch": 2392} {"train_loss": -12.308467864990234, "global_step": 401951, "epoch": 2392} {"train_loss": -12.534872055053711, "global_step": 401952, "epoch": 2392} {"train_loss": -12.407988548278809, "global_step": 401953, "epoch": 2392} {"train_loss": -12.7859525680542, "global_step": 401954, "epoch": 2392} {"train_loss": -12.607096672058105, "global_step": 401955, "epoch": 2392} {"train_loss": -12.529887199401855, "global_step": 401956, "epoch": 2392} {"train_loss": -12.537343978881836, "global_step": 401957, "epoch": 2392} {"train_loss": -12.391786575317383, "global_step": 401958, "epoch": 2392} {"train_loss": -12.115516662597656, "global_step": 401959, "epoch": 2392} {"train_loss": -12.420492172241211, "global_step": 401960, "epoch": 2392} {"train_loss": -12.543798446655273, "global_step": 401961, "epoch": 2392} {"train_loss": -12.447271347045898, "global_step": 401962, "epoch": 2392} {"train_loss": -12.158992767333984, "global_step": 401963, "epoch": 2392} {"train_loss": -12.243603706359863, "global_step": 401964, "epoch": 2392} {"train_loss": -12.60400390625, "global_step": 401965, "epoch": 2392} {"train_loss": -11.891229629516602, "global_step": 401966, "epoch": 2392} {"train_loss": -12.261480331420898, "global_step": 401967, "epoch": 2392} {"train_loss": -12.5842924118042, "global_step": 401968, "epoch": 2392} {"train_loss": -11.696868896484375, "global_step": 401969, "epoch": 2392} {"train_loss": -11.4846773147583, "global_step": 401970, "epoch": 2392} {"train_loss": -12.26375675201416, "global_step": 401971, "epoch": 2392} {"train_loss": -11.55846118927002, "global_step": 401972, "epoch": 2392} {"train_loss": -10.420782089233398, "global_step": 401973, "epoch": 2392} {"train_loss": -10.53176498413086, "global_step": 401974, "epoch": 2392} {"train_loss": -10.530109405517578, "global_step": 401975, "epoch": 2392} {"train_loss": -10.741312026977539, "global_step": 401976, "epoch": 2392} {"train_loss": -10.023006439208984, "global_step": 401977, "epoch": 2392} {"train_loss": -9.805797576904297, "global_step": 401978, "epoch": 2392} {"train_loss": -11.224252700805664, "global_step": 401979, "epoch": 2392} {"train_loss": -10.260150909423828, "global_step": 401980, "epoch": 2392} {"train_loss": -10.884794235229492, "global_step": 401981, "epoch": 2392} {"train_loss": -11.164451599121094, "global_step": 401982, "epoch": 2392} {"train_loss": -10.422261238098145, "global_step": 401983, "epoch": 2392} {"train_loss": -11.91202163696289, "global_step": 401984, "epoch": 2392} {"train_loss": -10.443992614746094, "global_step": 401985, "epoch": 2392} {"train_loss": -11.790679931640625, "global_step": 401986, "epoch": 2392} {"train_loss": -11.431724548339844, "global_step": 401987, "epoch": 2392} {"train_loss": -11.792661666870117, "global_step": 401988, "epoch": 2392} {"train_loss": -11.967794418334961, "global_step": 401989, "epoch": 2392} {"train_loss": -11.660629272460938, "global_step": 401990, "epoch": 2392} {"train_loss": -11.993613243103027, "global_step": 401991, "epoch": 2392} {"train_loss": -12.18014907836914, "global_step": 401992, "epoch": 2392} {"train_loss": -11.470212936401367, "global_step": 401993, "epoch": 2392} {"train_loss": -12.034212112426758, "global_step": 401994, "epoch": 2392} {"train_loss": -11.92564582824707, "global_step": 401995, "epoch": 2392} {"train_loss": -11.362224578857422, "global_step": 401996, "epoch": 2392} {"train_loss": -11.92362117767334, "global_step": 401997, "epoch": 2392} {"train_loss": -11.428329467773438, "global_step": 401998, "epoch": 2392} {"train_loss": -11.819236755371094, "global_step": 401999, "epoch": 2392} {"train_loss": -12.295068740844727, "global_step": 402000, "epoch": 2392} {"train_loss": -10.968971252441406, "global_step": 402001, "epoch": 2392} {"train_loss": -11.452713012695312, "global_step": 402002, "epoch": 2392} {"train_loss": -11.733680725097656, "global_step": 402003, "epoch": 2392} {"train_loss": -11.37648868560791, "global_step": 402004, "epoch": 2392} {"train_loss": -11.285907745361328, "global_step": 402005, "epoch": 2392} {"train_loss": -11.977256774902344, "global_step": 402006, "epoch": 2392} {"train_loss": -10.801361083984375, "global_step": 402007, "epoch": 2392} {"train_loss": -12.240251541137695, "global_step": 402008, "epoch": 2392} {"train_loss": -11.678665161132812, "global_step": 402009, "epoch": 2392} {"train_loss": -12.307792663574219, "global_step": 402010, "epoch": 2392} {"train_loss": -12.005146026611328, "global_step": 402011, "epoch": 2392} {"train_loss": -11.554512023925781, "global_step": 402012, "epoch": 2392} {"train_loss": -11.898456573486328, "global_step": 402013, "epoch": 2392} {"train_loss": -12.212518692016602, "global_step": 402014, "epoch": 2392} {"train_loss": -11.983804702758789, "global_step": 402015, "epoch": 2392} {"train_loss": -11.777934074401855, "global_step": 402016, "epoch": 2392} {"train_loss": -11.996007919311523, "global_step": 402017, "epoch": 2392} {"train_loss": -11.968667984008789, "global_step": 402018, "epoch": 2392} {"train_loss": -11.845359802246094, "global_step": 402019, "epoch": 2392} {"train_loss": -11.847321510314941, "global_step": 402020, "epoch": 2392} {"train_loss": -11.960519790649414, "global_step": 402021, "epoch": 2392} {"train_loss": -11.910070419311523, "global_step": 402022, "epoch": 2392} {"train_loss": -11.843574892906915, "global_step": 402023, "epoch": 2392, "val_loss": 304279.59375} {"train_loss": -11.579407691955566, "global_step": 402024, "epoch": 2393} {"train_loss": -11.30274772644043, "global_step": 402025, "epoch": 2393} {"train_loss": -10.909141540527344, "global_step": 402026, "epoch": 2393} {"train_loss": -10.434232711791992, "global_step": 402027, "epoch": 2393} {"train_loss": -10.275599479675293, "global_step": 402028, "epoch": 2393} {"train_loss": -10.288841247558594, "global_step": 402029, "epoch": 2393} {"train_loss": -11.287059783935547, "global_step": 402030, "epoch": 2393} {"train_loss": -9.81574821472168, "global_step": 402031, "epoch": 2393} {"train_loss": -11.168185234069824, "global_step": 402032, "epoch": 2393} {"train_loss": -10.602218627929688, "global_step": 402033, "epoch": 2393} {"train_loss": -10.901464462280273, "global_step": 402034, "epoch": 2393} {"train_loss": -10.655003547668457, "global_step": 402035, "epoch": 2393} {"train_loss": -11.940427780151367, "global_step": 402036, "epoch": 2393} {"train_loss": -10.984527587890625, "global_step": 402037, "epoch": 2393} {"train_loss": -11.5369873046875, "global_step": 402038, "epoch": 2393} {"train_loss": -11.728887557983398, "global_step": 402039, "epoch": 2393} {"train_loss": -11.7470703125, "global_step": 402040, "epoch": 2393} {"train_loss": -11.69912338256836, "global_step": 402041, "epoch": 2393} {"train_loss": -11.709338188171387, "global_step": 402042, "epoch": 2393} {"train_loss": -11.70279598236084, "global_step": 402043, "epoch": 2393} {"train_loss": -11.504118919372559, "global_step": 402044, "epoch": 2393} {"train_loss": -12.099395751953125, "global_step": 402045, "epoch": 2393} {"train_loss": -11.897652626037598, "global_step": 402046, "epoch": 2393} {"train_loss": -12.07822036743164, "global_step": 402047, "epoch": 2393} {"train_loss": -11.988153457641602, "global_step": 402048, "epoch": 2393} {"train_loss": -12.374242782592773, "global_step": 402049, "epoch": 2393} {"train_loss": -12.162162780761719, "global_step": 402050, "epoch": 2393} {"train_loss": -12.08491039276123, "global_step": 402051, "epoch": 2393} {"train_loss": -12.159141540527344, "global_step": 402052, "epoch": 2393} {"train_loss": -12.1753568649292, "global_step": 402053, "epoch": 2393} {"train_loss": -12.305667877197266, "global_step": 402054, "epoch": 2393} {"train_loss": -12.167060852050781, "global_step": 402055, "epoch": 2393} {"train_loss": -12.191866874694824, "global_step": 402056, "epoch": 2393} {"train_loss": -12.175037384033203, "global_step": 402057, "epoch": 2393} {"train_loss": -12.46225357055664, "global_step": 402058, "epoch": 2393} {"train_loss": -12.065755844116211, "global_step": 402059, "epoch": 2393} {"train_loss": -12.285249710083008, "global_step": 402060, "epoch": 2393} {"train_loss": -12.431522369384766, "global_step": 402061, "epoch": 2393} {"train_loss": -11.847692489624023, "global_step": 402062, "epoch": 2393} {"train_loss": -12.37264633178711, "global_step": 402063, "epoch": 2393} {"train_loss": -12.2853422164917, "global_step": 402064, "epoch": 2393} {"train_loss": -12.168723106384277, "global_step": 402065, "epoch": 2393} {"train_loss": -12.454479217529297, "global_step": 402066, "epoch": 2393} {"train_loss": -12.353118896484375, "global_step": 402067, "epoch": 2393} {"train_loss": -12.463470458984375, "global_step": 402068, "epoch": 2393} {"train_loss": -12.10416030883789, "global_step": 402069, "epoch": 2393} {"train_loss": -12.494647979736328, "global_step": 402070, "epoch": 2393} {"train_loss": -12.417224884033203, "global_step": 402071, "epoch": 2393} {"train_loss": -12.19858455657959, "global_step": 402072, "epoch": 2393} {"train_loss": -12.355856895446777, "global_step": 402073, "epoch": 2393} {"train_loss": -12.023502349853516, "global_step": 402074, "epoch": 2393} {"train_loss": -12.354459762573242, "global_step": 402075, "epoch": 2393} {"train_loss": -12.269660949707031, "global_step": 402076, "epoch": 2393} {"train_loss": -11.945350646972656, "global_step": 402077, "epoch": 2393} {"train_loss": -12.320050239562988, "global_step": 402078, "epoch": 2393} {"train_loss": -12.340120315551758, "global_step": 402079, "epoch": 2393} {"train_loss": -12.052578926086426, "global_step": 402080, "epoch": 2393} {"train_loss": -12.574501037597656, "global_step": 402081, "epoch": 2393} {"train_loss": -12.113774299621582, "global_step": 402082, "epoch": 2393} {"train_loss": -12.164846420288086, "global_step": 402083, "epoch": 2393} {"train_loss": -12.273088455200195, "global_step": 402084, "epoch": 2393} {"train_loss": -12.325662612915039, "global_step": 402085, "epoch": 2393} {"train_loss": -12.588239669799805, "global_step": 402086, "epoch": 2393} {"train_loss": -12.507866859436035, "global_step": 402087, "epoch": 2393} {"train_loss": -12.42459487915039, "global_step": 402088, "epoch": 2393} {"train_loss": -12.387104034423828, "global_step": 402089, "epoch": 2393} {"train_loss": -12.741704940795898, "global_step": 402090, "epoch": 2393} {"train_loss": -12.261442184448242, "global_step": 402091, "epoch": 2393} {"train_loss": -12.327829360961914, "global_step": 402092, "epoch": 2393} {"train_loss": -11.903934478759766, "global_step": 402093, "epoch": 2393} {"train_loss": -12.567581176757812, "global_step": 402094, "epoch": 2393} {"train_loss": -12.138542175292969, "global_step": 402095, "epoch": 2393} {"train_loss": -12.663694381713867, "global_step": 402096, "epoch": 2393} {"train_loss": -12.357656478881836, "global_step": 402097, "epoch": 2393} {"train_loss": -12.356681823730469, "global_step": 402098, "epoch": 2393} {"train_loss": -12.431928634643555, "global_step": 402099, "epoch": 2393} {"train_loss": -12.54970932006836, "global_step": 402100, "epoch": 2393} {"train_loss": -12.457423210144043, "global_step": 402101, "epoch": 2393} {"train_loss": -12.463642120361328, "global_step": 402102, "epoch": 2393} {"train_loss": -12.559883117675781, "global_step": 402103, "epoch": 2393} {"train_loss": -12.419183731079102, "global_step": 402104, "epoch": 2393} {"train_loss": -12.556056022644043, "global_step": 402105, "epoch": 2393} {"train_loss": -12.493060111999512, "global_step": 402106, "epoch": 2393} {"train_loss": -12.802112579345703, "global_step": 402107, "epoch": 2393} {"train_loss": -12.250083923339844, "global_step": 402108, "epoch": 2393} {"train_loss": -12.530366897583008, "global_step": 402109, "epoch": 2393} {"train_loss": -12.751312255859375, "global_step": 402110, "epoch": 2393} {"train_loss": -12.567026138305664, "global_step": 402111, "epoch": 2393} {"train_loss": -12.687686920166016, "global_step": 402112, "epoch": 2393} {"train_loss": -12.651310920715332, "global_step": 402113, "epoch": 2393} {"train_loss": -12.694852828979492, "global_step": 402114, "epoch": 2393} {"train_loss": -12.754840850830078, "global_step": 402115, "epoch": 2393} {"train_loss": -12.506816864013672, "global_step": 402116, "epoch": 2393} {"train_loss": -12.978689193725586, "global_step": 402117, "epoch": 2393} {"train_loss": -12.653770446777344, "global_step": 402118, "epoch": 2393} {"train_loss": -12.402955055236816, "global_step": 402119, "epoch": 2393} {"train_loss": -12.6317720413208, "global_step": 402120, "epoch": 2393} {"train_loss": -12.516756057739258, "global_step": 402121, "epoch": 2393} {"train_loss": -12.649336814880371, "global_step": 402122, "epoch": 2393} {"train_loss": -12.651391983032227, "global_step": 402123, "epoch": 2393} {"train_loss": -12.815980911254883, "global_step": 402124, "epoch": 2393} {"train_loss": -12.252015113830566, "global_step": 402125, "epoch": 2393} {"train_loss": -12.376925468444824, "global_step": 402126, "epoch": 2393} {"train_loss": -12.123763084411621, "global_step": 402127, "epoch": 2393} {"train_loss": -12.820869445800781, "global_step": 402128, "epoch": 2393} {"train_loss": -12.56527328491211, "global_step": 402129, "epoch": 2393} {"train_loss": -12.86246109008789, "global_step": 402130, "epoch": 2393} {"train_loss": -12.729763984680176, "global_step": 402131, "epoch": 2393} {"train_loss": -12.999101638793945, "global_step": 402132, "epoch": 2393} {"train_loss": -12.600955963134766, "global_step": 402133, "epoch": 2393} {"train_loss": -12.791731834411621, "global_step": 402134, "epoch": 2393} {"train_loss": -12.60896110534668, "global_step": 402135, "epoch": 2393} {"train_loss": -12.74263858795166, "global_step": 402136, "epoch": 2393} {"train_loss": -12.52371597290039, "global_step": 402137, "epoch": 2393} {"train_loss": -12.619911193847656, "global_step": 402138, "epoch": 2393} {"train_loss": -13.028303146362305, "global_step": 402139, "epoch": 2393} {"train_loss": -12.49875545501709, "global_step": 402140, "epoch": 2393} {"train_loss": -11.826547622680664, "global_step": 402141, "epoch": 2393} {"train_loss": -11.823873519897461, "global_step": 402142, "epoch": 2393} {"train_loss": -12.169865608215332, "global_step": 402143, "epoch": 2393} {"train_loss": -12.167207717895508, "global_step": 402144, "epoch": 2393} {"train_loss": -12.215459823608398, "global_step": 402145, "epoch": 2393} {"train_loss": -11.80455493927002, "global_step": 402146, "epoch": 2393} {"train_loss": -11.819480895996094, "global_step": 402147, "epoch": 2393} {"train_loss": -11.893795013427734, "global_step": 402148, "epoch": 2393} {"train_loss": -12.126009941101074, "global_step": 402149, "epoch": 2393} {"train_loss": -12.133188247680664, "global_step": 402150, "epoch": 2393} {"train_loss": -11.577924728393555, "global_step": 402151, "epoch": 2393} {"train_loss": -12.005889892578125, "global_step": 402152, "epoch": 2393} {"train_loss": -11.61845588684082, "global_step": 402153, "epoch": 2393} {"train_loss": -12.048771858215332, "global_step": 402154, "epoch": 2393} {"train_loss": -11.838359832763672, "global_step": 402155, "epoch": 2393} {"train_loss": -11.182707786560059, "global_step": 402156, "epoch": 2393} {"train_loss": -12.188688278198242, "global_step": 402157, "epoch": 2393} {"train_loss": -10.71550464630127, "global_step": 402158, "epoch": 2393} {"train_loss": -10.805770874023438, "global_step": 402159, "epoch": 2393} {"train_loss": -11.58326530456543, "global_step": 402160, "epoch": 2393} {"train_loss": -10.791976928710938, "global_step": 402161, "epoch": 2393} {"train_loss": -10.35606575012207, "global_step": 402162, "epoch": 2393} {"train_loss": -11.668909072875977, "global_step": 402163, "epoch": 2393} {"train_loss": -10.951303482055664, "global_step": 402164, "epoch": 2393} {"train_loss": -10.271596908569336, "global_step": 402165, "epoch": 2393} {"train_loss": -11.582439422607422, "global_step": 402166, "epoch": 2393} {"train_loss": -10.231280326843262, "global_step": 402167, "epoch": 2393} {"train_loss": -10.552228927612305, "global_step": 402168, "epoch": 2393} {"train_loss": -9.572809219360352, "global_step": 402169, "epoch": 2393} {"train_loss": -10.683124542236328, "global_step": 402170, "epoch": 2393} {"train_loss": -7.807100772857666, "global_step": 402171, "epoch": 2393} {"train_loss": -9.431804656982422, "global_step": 402172, "epoch": 2393} {"train_loss": -8.420660972595215, "global_step": 402173, "epoch": 2393} {"train_loss": -8.772198677062988, "global_step": 402174, "epoch": 2393} {"train_loss": -9.500970840454102, "global_step": 402175, "epoch": 2393} {"train_loss": -10.883825302124023, "global_step": 402176, "epoch": 2393} {"train_loss": -8.764183044433594, "global_step": 402177, "epoch": 2393} {"train_loss": -10.134528160095215, "global_step": 402178, "epoch": 2393} {"train_loss": -9.878496170043945, "global_step": 402179, "epoch": 2393} {"train_loss": -9.868029594421387, "global_step": 402180, "epoch": 2393} {"train_loss": -9.633031845092773, "global_step": 402181, "epoch": 2393} {"train_loss": -10.088271141052246, "global_step": 402182, "epoch": 2393} {"train_loss": -11.578364372253418, "global_step": 402183, "epoch": 2393} {"train_loss": -9.982559204101562, "global_step": 402184, "epoch": 2393} {"train_loss": -10.550041198730469, "global_step": 402185, "epoch": 2393} {"train_loss": -10.076393127441406, "global_step": 402186, "epoch": 2393} {"train_loss": -11.206438064575195, "global_step": 402187, "epoch": 2393} {"train_loss": -9.897960662841797, "global_step": 402188, "epoch": 2393} {"train_loss": -11.716535568237305, "global_step": 402189, "epoch": 2393} {"train_loss": -10.673477172851562, "global_step": 402190, "epoch": 2393} {"train_loss": -11.775014812038059, "global_step": 402191, "epoch": 2393, "val_loss": 300568.65625} {"train_loss": -10.527759552001953, "global_step": 402192, "epoch": 2394} {"train_loss": -11.522293090820312, "global_step": 402193, "epoch": 2394} {"train_loss": -10.298202514648438, "global_step": 402194, "epoch": 2394} {"train_loss": -11.47304630279541, "global_step": 402195, "epoch": 2394} {"train_loss": -11.38749885559082, "global_step": 402196, "epoch": 2394} {"train_loss": -10.7147216796875, "global_step": 402197, "epoch": 2394} {"train_loss": -11.81959342956543, "global_step": 402198, "epoch": 2394} {"train_loss": -11.027673721313477, "global_step": 402199, "epoch": 2394} {"train_loss": -11.317090034484863, "global_step": 402200, "epoch": 2394} {"train_loss": -11.404439926147461, "global_step": 402201, "epoch": 2394} {"train_loss": -11.267282485961914, "global_step": 402202, "epoch": 2394} {"train_loss": -11.655983924865723, "global_step": 402203, "epoch": 2394} {"train_loss": -12.076882362365723, "global_step": 402204, "epoch": 2394} {"train_loss": -11.741959571838379, "global_step": 402205, "epoch": 2394} {"train_loss": -11.802980422973633, "global_step": 402206, "epoch": 2394} {"train_loss": -12.097494125366211, "global_step": 402207, "epoch": 2394} {"train_loss": -11.520503997802734, "global_step": 402208, "epoch": 2394} {"train_loss": -11.846799850463867, "global_step": 402209, "epoch": 2394} {"train_loss": -11.831266403198242, "global_step": 402210, "epoch": 2394} {"train_loss": -11.821051597595215, "global_step": 402211, "epoch": 2394} {"train_loss": -12.110570907592773, "global_step": 402212, "epoch": 2394} {"train_loss": -12.11373519897461, "global_step": 402213, "epoch": 2394} {"train_loss": -12.101441383361816, "global_step": 402214, "epoch": 2394} {"train_loss": -12.037786483764648, "global_step": 402215, "epoch": 2394} {"train_loss": -12.240793228149414, "global_step": 402216, "epoch": 2394} {"train_loss": -12.21532154083252, "global_step": 402217, "epoch": 2394} {"train_loss": -12.210611343383789, "global_step": 402218, "epoch": 2394} {"train_loss": -12.378055572509766, "global_step": 402219, "epoch": 2394} {"train_loss": -12.500381469726562, "global_step": 402220, "epoch": 2394} {"train_loss": -12.33470344543457, "global_step": 402221, "epoch": 2394} {"train_loss": -12.031045913696289, "global_step": 402222, "epoch": 2394} {"train_loss": -12.32249641418457, "global_step": 402223, "epoch": 2394} {"train_loss": -12.11919116973877, "global_step": 402224, "epoch": 2394} {"train_loss": -12.27769660949707, "global_step": 402225, "epoch": 2394} {"train_loss": -12.218887329101562, "global_step": 402226, "epoch": 2394} {"train_loss": -12.089092254638672, "global_step": 402227, "epoch": 2394} {"train_loss": -12.269524574279785, "global_step": 402228, "epoch": 2394} {"train_loss": -12.187158584594727, "global_step": 402229, "epoch": 2394} {"train_loss": -12.240370750427246, "global_step": 402230, "epoch": 2394} {"train_loss": -12.536482810974121, "global_step": 402231, "epoch": 2394} {"train_loss": -12.319269180297852, "global_step": 402232, "epoch": 2394} {"train_loss": -12.227046966552734, "global_step": 402233, "epoch": 2394} {"train_loss": -12.463691711425781, "global_step": 402234, "epoch": 2394} {"train_loss": -12.394010543823242, "global_step": 402235, "epoch": 2394} {"train_loss": -12.338481903076172, "global_step": 402236, "epoch": 2394} {"train_loss": -12.430286407470703, "global_step": 402237, "epoch": 2394} {"train_loss": -12.50390625, "global_step": 402238, "epoch": 2394} {"train_loss": -12.243722915649414, "global_step": 402239, "epoch": 2394} {"train_loss": -12.619434356689453, "global_step": 402240, "epoch": 2394} {"train_loss": -12.469071388244629, "global_step": 402241, "epoch": 2394} {"train_loss": -12.372869491577148, "global_step": 402242, "epoch": 2394} {"train_loss": -12.461073875427246, "global_step": 402243, "epoch": 2394} {"train_loss": -12.513285636901855, "global_step": 402244, "epoch": 2394} {"train_loss": -12.224078178405762, "global_step": 402245, "epoch": 2394} {"train_loss": -12.427125930786133, "global_step": 402246, "epoch": 2394} {"train_loss": -12.322288513183594, "global_step": 402247, "epoch": 2394} {"train_loss": -12.669939041137695, "global_step": 402248, "epoch": 2394} {"train_loss": -12.377503395080566, "global_step": 402249, "epoch": 2394} {"train_loss": -12.47384262084961, "global_step": 402250, "epoch": 2394} {"train_loss": -12.353912353515625, "global_step": 402251, "epoch": 2394} {"train_loss": -12.451122283935547, "global_step": 402252, "epoch": 2394} {"train_loss": -12.43136215209961, "global_step": 402253, "epoch": 2394} {"train_loss": -12.487910270690918, "global_step": 402254, "epoch": 2394} {"train_loss": -12.345757484436035, "global_step": 402255, "epoch": 2394} {"train_loss": -12.647911071777344, "global_step": 402256, "epoch": 2394} {"train_loss": -12.213214874267578, "global_step": 402257, "epoch": 2394} {"train_loss": -12.690513610839844, "global_step": 402258, "epoch": 2394} {"train_loss": -12.020100593566895, "global_step": 402259, "epoch": 2394} {"train_loss": -12.298599243164062, "global_step": 402260, "epoch": 2394} {"train_loss": -12.521893501281738, "global_step": 402261, "epoch": 2394} {"train_loss": -12.593270301818848, "global_step": 402262, "epoch": 2394} {"train_loss": -12.460254669189453, "global_step": 402263, "epoch": 2394} {"train_loss": -12.822834014892578, "global_step": 402264, "epoch": 2394} {"train_loss": -12.33328628540039, "global_step": 402265, "epoch": 2394} {"train_loss": -12.679218292236328, "global_step": 402266, "epoch": 2394} {"train_loss": -12.481258392333984, "global_step": 402267, "epoch": 2394} {"train_loss": -12.643306732177734, "global_step": 402268, "epoch": 2394} {"train_loss": -12.642108917236328, "global_step": 402269, "epoch": 2394} {"train_loss": -12.500194549560547, "global_step": 402270, "epoch": 2394} {"train_loss": -12.286676406860352, "global_step": 402271, "epoch": 2394} {"train_loss": -12.487173080444336, "global_step": 402272, "epoch": 2394} {"train_loss": -12.27020263671875, "global_step": 402273, "epoch": 2394} {"train_loss": -11.502824783325195, "global_step": 402274, "epoch": 2394} {"train_loss": -12.28118896484375, "global_step": 402275, "epoch": 2394} {"train_loss": -12.183340072631836, "global_step": 402276, "epoch": 2394} {"train_loss": -11.36711311340332, "global_step": 402277, "epoch": 2394} {"train_loss": -11.650962829589844, "global_step": 402278, "epoch": 2394} {"train_loss": -10.20716381072998, "global_step": 402279, "epoch": 2394} {"train_loss": -10.757875442504883, "global_step": 402280, "epoch": 2394} {"train_loss": -12.16620922088623, "global_step": 402281, "epoch": 2394} {"train_loss": -11.059164047241211, "global_step": 402282, "epoch": 2394} {"train_loss": -12.262491226196289, "global_step": 402283, "epoch": 2394} {"train_loss": -11.71938705444336, "global_step": 402284, "epoch": 2394} {"train_loss": -11.575387954711914, "global_step": 402285, "epoch": 2394} {"train_loss": -12.453741073608398, "global_step": 402286, "epoch": 2394} {"train_loss": -11.358107566833496, "global_step": 402287, "epoch": 2394} {"train_loss": -11.140666961669922, "global_step": 402288, "epoch": 2394} {"train_loss": -12.32420539855957, "global_step": 402289, "epoch": 2394} {"train_loss": -11.927851676940918, "global_step": 402290, "epoch": 2394} {"train_loss": -11.985213279724121, "global_step": 402291, "epoch": 2394} {"train_loss": -12.345064163208008, "global_step": 402292, "epoch": 2394} {"train_loss": -11.423172950744629, "global_step": 402293, "epoch": 2394} {"train_loss": -12.124273300170898, "global_step": 402294, "epoch": 2394} {"train_loss": -11.771917343139648, "global_step": 402295, "epoch": 2394} {"train_loss": -12.025094985961914, "global_step": 402296, "epoch": 2394} {"train_loss": -11.460174560546875, "global_step": 402297, "epoch": 2394} {"train_loss": -12.076786041259766, "global_step": 402298, "epoch": 2394} {"train_loss": -11.445587158203125, "global_step": 402299, "epoch": 2394} {"train_loss": -11.27464485168457, "global_step": 402300, "epoch": 2394} {"train_loss": -11.656638145446777, "global_step": 402301, "epoch": 2394} {"train_loss": -11.586624145507812, "global_step": 402302, "epoch": 2394} {"train_loss": -11.476980209350586, "global_step": 402303, "epoch": 2394} {"train_loss": -12.019695281982422, "global_step": 402304, "epoch": 2394} {"train_loss": -10.654651641845703, "global_step": 402305, "epoch": 2394} {"train_loss": -11.969625473022461, "global_step": 402306, "epoch": 2394} {"train_loss": -11.957767486572266, "global_step": 402307, "epoch": 2394} {"train_loss": -11.47632884979248, "global_step": 402308, "epoch": 2394} {"train_loss": -12.345392227172852, "global_step": 402309, "epoch": 2394} {"train_loss": -11.77939224243164, "global_step": 402310, "epoch": 2394} {"train_loss": -12.308748245239258, "global_step": 402311, "epoch": 2394} {"train_loss": -12.004798889160156, "global_step": 402312, "epoch": 2394} {"train_loss": -12.1315279006958, "global_step": 402313, "epoch": 2394} {"train_loss": -11.838634490966797, "global_step": 402314, "epoch": 2394} {"train_loss": -11.688064575195312, "global_step": 402315, "epoch": 2394} {"train_loss": -12.200571060180664, "global_step": 402316, "epoch": 2394} {"train_loss": -12.148886680603027, "global_step": 402317, "epoch": 2394} {"train_loss": -12.05229377746582, "global_step": 402318, "epoch": 2394} {"train_loss": -12.20089340209961, "global_step": 402319, "epoch": 2394} {"train_loss": -12.128055572509766, "global_step": 402320, "epoch": 2394} {"train_loss": -12.26160717010498, "global_step": 402321, "epoch": 2394} {"train_loss": -12.287590026855469, "global_step": 402322, "epoch": 2394} {"train_loss": -12.237314224243164, "global_step": 402323, "epoch": 2394} {"train_loss": -12.264900207519531, "global_step": 402324, "epoch": 2394} {"train_loss": -12.210160255432129, "global_step": 402325, "epoch": 2394} {"train_loss": -12.023940086364746, "global_step": 402326, "epoch": 2394} {"train_loss": -12.160901069641113, "global_step": 402327, "epoch": 2394} {"train_loss": -12.076099395751953, "global_step": 402328, "epoch": 2394} {"train_loss": -12.337760925292969, "global_step": 402329, "epoch": 2394} {"train_loss": -11.461666107177734, "global_step": 402330, "epoch": 2394} {"train_loss": -12.042501449584961, "global_step": 402331, "epoch": 2394} {"train_loss": -11.49899673461914, "global_step": 402332, "epoch": 2394} {"train_loss": -12.062509536743164, "global_step": 402333, "epoch": 2394} {"train_loss": -11.614076614379883, "global_step": 402334, "epoch": 2394} {"train_loss": -12.04327392578125, "global_step": 402335, "epoch": 2394} {"train_loss": -12.338669776916504, "global_step": 402336, "epoch": 2394} {"train_loss": -12.166333198547363, "global_step": 402337, "epoch": 2394} {"train_loss": -12.58580493927002, "global_step": 402338, "epoch": 2394} {"train_loss": -12.005661010742188, "global_step": 402339, "epoch": 2394} {"train_loss": -12.309900283813477, "global_step": 402340, "epoch": 2394} {"train_loss": -12.384027481079102, "global_step": 402341, "epoch": 2394} {"train_loss": -12.195613861083984, "global_step": 402342, "epoch": 2394} {"train_loss": -12.460830688476562, "global_step": 402343, "epoch": 2394} {"train_loss": -12.277719497680664, "global_step": 402344, "epoch": 2394} {"train_loss": -12.376846313476562, "global_step": 402345, "epoch": 2394} {"train_loss": -12.58957576751709, "global_step": 402346, "epoch": 2394} {"train_loss": -12.447967529296875, "global_step": 402347, "epoch": 2394} {"train_loss": -12.4087553024292, "global_step": 402348, "epoch": 2394} {"train_loss": -12.307141304016113, "global_step": 402349, "epoch": 2394} {"train_loss": -12.405187606811523, "global_step": 402350, "epoch": 2394} {"train_loss": -12.552324295043945, "global_step": 402351, "epoch": 2394} {"train_loss": -12.325013160705566, "global_step": 402352, "epoch": 2394} {"train_loss": -12.311717987060547, "global_step": 402353, "epoch": 2394} {"train_loss": -12.424201011657715, "global_step": 402354, "epoch": 2394} {"train_loss": -12.653844833374023, "global_step": 402355, "epoch": 2394} {"train_loss": -12.331546783447266, "global_step": 402356, "epoch": 2394} {"train_loss": -12.53508186340332, "global_step": 402357, "epoch": 2394} {"train_loss": -12.097941398620605, "global_step": 402358, "epoch": 2394} {"train_loss": -12.067255905696324, "global_step": 402359, "epoch": 2394, "val_loss": 301481.59375} {"train_loss": -11.763833999633789, "global_step": 402360, "epoch": 2395} {"train_loss": -12.325166702270508, "global_step": 402361, "epoch": 2395} {"train_loss": -11.558256149291992, "global_step": 402362, "epoch": 2395} {"train_loss": -11.990317344665527, "global_step": 402363, "epoch": 2395} {"train_loss": -11.836067199707031, "global_step": 402364, "epoch": 2395} {"train_loss": -11.948983192443848, "global_step": 402365, "epoch": 2395} {"train_loss": -11.92587661743164, "global_step": 402366, "epoch": 2395} {"train_loss": -12.102642059326172, "global_step": 402367, "epoch": 2395} {"train_loss": -12.336181640625, "global_step": 402368, "epoch": 2395} {"train_loss": -12.140275955200195, "global_step": 402369, "epoch": 2395} {"train_loss": -12.377558708190918, "global_step": 402370, "epoch": 2395} {"train_loss": -12.144462585449219, "global_step": 402371, "epoch": 2395} {"train_loss": -11.52113151550293, "global_step": 402372, "epoch": 2395} {"train_loss": -12.262418746948242, "global_step": 402373, "epoch": 2395} {"train_loss": -11.552064895629883, "global_step": 402374, "epoch": 2395} {"train_loss": -12.496044158935547, "global_step": 402375, "epoch": 2395} {"train_loss": -11.937725067138672, "global_step": 402376, "epoch": 2395} {"train_loss": -12.240896224975586, "global_step": 402377, "epoch": 2395} {"train_loss": -12.572315216064453, "global_step": 402378, "epoch": 2395} {"train_loss": -12.33456802368164, "global_step": 402379, "epoch": 2395} {"train_loss": -12.267030715942383, "global_step": 402380, "epoch": 2395} {"train_loss": -12.237285614013672, "global_step": 402381, "epoch": 2395} {"train_loss": -12.325237274169922, "global_step": 402382, "epoch": 2395} {"train_loss": -12.341048240661621, "global_step": 402383, "epoch": 2395} {"train_loss": -12.636337280273438, "global_step": 402384, "epoch": 2395} {"train_loss": -12.622386932373047, "global_step": 402385, "epoch": 2395} {"train_loss": -12.723799705505371, "global_step": 402386, "epoch": 2395} {"train_loss": -12.410862922668457, "global_step": 402387, "epoch": 2395} {"train_loss": -12.641180038452148, "global_step": 402388, "epoch": 2395} {"train_loss": -12.490330696105957, "global_step": 402389, "epoch": 2395} {"train_loss": -12.560792922973633, "global_step": 402390, "epoch": 2395} {"train_loss": -12.74030876159668, "global_step": 402391, "epoch": 2395} {"train_loss": -12.585531234741211, "global_step": 402392, "epoch": 2395} {"train_loss": -12.4561767578125, "global_step": 402393, "epoch": 2395} {"train_loss": -12.468164443969727, "global_step": 402394, "epoch": 2395} {"train_loss": -12.659076690673828, "global_step": 402395, "epoch": 2395} {"train_loss": -12.475401878356934, "global_step": 402396, "epoch": 2395} {"train_loss": -12.750219345092773, "global_step": 402397, "epoch": 2395} {"train_loss": -12.391731262207031, "global_step": 402398, "epoch": 2395} {"train_loss": -12.66019058227539, "global_step": 402399, "epoch": 2395} {"train_loss": -11.968656539916992, "global_step": 402400, "epoch": 2395} {"train_loss": -11.737549781799316, "global_step": 402401, "epoch": 2395} {"train_loss": -12.500479698181152, "global_step": 402402, "epoch": 2395} {"train_loss": -11.607795715332031, "global_step": 402403, "epoch": 2395} {"train_loss": -11.052330017089844, "global_step": 402404, "epoch": 2395} {"train_loss": -12.26934814453125, "global_step": 402405, "epoch": 2395} {"train_loss": -11.955514907836914, "global_step": 402406, "epoch": 2395} {"train_loss": -11.352400779724121, "global_step": 402407, "epoch": 2395} {"train_loss": -12.145012855529785, "global_step": 402408, "epoch": 2395} {"train_loss": -12.264699935913086, "global_step": 402409, "epoch": 2395} {"train_loss": -11.852702140808105, "global_step": 402410, "epoch": 2395} {"train_loss": -10.926259994506836, "global_step": 402411, "epoch": 2395} {"train_loss": -12.086260795593262, "global_step": 402412, "epoch": 2395} {"train_loss": -11.509601593017578, "global_step": 402413, "epoch": 2395} {"train_loss": -10.872451782226562, "global_step": 402414, "epoch": 2395} {"train_loss": -12.063570022583008, "global_step": 402415, "epoch": 2395} {"train_loss": -11.2275390625, "global_step": 402416, "epoch": 2395} {"train_loss": -12.537296295166016, "global_step": 402417, "epoch": 2395} {"train_loss": -11.476131439208984, "global_step": 402418, "epoch": 2395} {"train_loss": -12.108787536621094, "global_step": 402419, "epoch": 2395} {"train_loss": -11.49670124053955, "global_step": 402420, "epoch": 2395} {"train_loss": -12.405447006225586, "global_step": 402421, "epoch": 2395} {"train_loss": -11.217000961303711, "global_step": 402422, "epoch": 2395} {"train_loss": -12.25890064239502, "global_step": 402423, "epoch": 2395} {"train_loss": -11.522878646850586, "global_step": 402424, "epoch": 2395} {"train_loss": -11.327213287353516, "global_step": 402425, "epoch": 2395} {"train_loss": -11.750276565551758, "global_step": 402426, "epoch": 2395} {"train_loss": -11.262578964233398, "global_step": 402427, "epoch": 2395} {"train_loss": -11.8157320022583, "global_step": 402428, "epoch": 2395} {"train_loss": -11.369301795959473, "global_step": 402429, "epoch": 2395} {"train_loss": -10.815208435058594, "global_step": 402430, "epoch": 2395} {"train_loss": -10.337233543395996, "global_step": 402431, "epoch": 2395} {"train_loss": -10.236698150634766, "global_step": 402432, "epoch": 2395} {"train_loss": -11.786094665527344, "global_step": 402433, "epoch": 2395} {"train_loss": -10.746992111206055, "global_step": 402434, "epoch": 2395} {"train_loss": -10.047080993652344, "global_step": 402435, "epoch": 2395} {"train_loss": -11.703845977783203, "global_step": 402436, "epoch": 2395} {"train_loss": -10.629009246826172, "global_step": 402437, "epoch": 2395} {"train_loss": -11.704588890075684, "global_step": 402438, "epoch": 2395} {"train_loss": -10.778071403503418, "global_step": 402439, "epoch": 2395} {"train_loss": -11.033163070678711, "global_step": 402440, "epoch": 2395} {"train_loss": -11.229949951171875, "global_step": 402441, "epoch": 2395} {"train_loss": -10.895480155944824, "global_step": 402442, "epoch": 2395} {"train_loss": -11.532550811767578, "global_step": 402443, "epoch": 2395} {"train_loss": -11.265247344970703, "global_step": 402444, "epoch": 2395} {"train_loss": -11.418205261230469, "global_step": 402445, "epoch": 2395} {"train_loss": -9.488059997558594, "global_step": 402446, "epoch": 2395} {"train_loss": -10.546710968017578, "global_step": 402447, "epoch": 2395} {"train_loss": -11.001736640930176, "global_step": 402448, "epoch": 2395} {"train_loss": -9.401022911071777, "global_step": 402449, "epoch": 2395} {"train_loss": -11.441978454589844, "global_step": 402450, "epoch": 2395} {"train_loss": -10.03398323059082, "global_step": 402451, "epoch": 2395} {"train_loss": -11.472004890441895, "global_step": 402452, "epoch": 2395} {"train_loss": -10.462485313415527, "global_step": 402453, "epoch": 2395} {"train_loss": -11.526477813720703, "global_step": 402454, "epoch": 2395} {"train_loss": -10.428316116333008, "global_step": 402455, "epoch": 2395} {"train_loss": -11.345059394836426, "global_step": 402456, "epoch": 2395} {"train_loss": -10.867135047912598, "global_step": 402457, "epoch": 2395} {"train_loss": -11.103914260864258, "global_step": 402458, "epoch": 2395} {"train_loss": -10.58755874633789, "global_step": 402459, "epoch": 2395} {"train_loss": -11.644315719604492, "global_step": 402460, "epoch": 2395} {"train_loss": -11.106986999511719, "global_step": 402461, "epoch": 2395} {"train_loss": -11.40357494354248, "global_step": 402462, "epoch": 2395} {"train_loss": -11.566123962402344, "global_step": 402463, "epoch": 2395} {"train_loss": -10.46115779876709, "global_step": 402464, "epoch": 2395} {"train_loss": -11.329313278198242, "global_step": 402465, "epoch": 2395} {"train_loss": -11.795913696289062, "global_step": 402466, "epoch": 2395} {"train_loss": -11.117444038391113, "global_step": 402467, "epoch": 2395} {"train_loss": -11.875507354736328, "global_step": 402468, "epoch": 2395} {"train_loss": -12.127852439880371, "global_step": 402469, "epoch": 2395} {"train_loss": -11.337286949157715, "global_step": 402470, "epoch": 2395} {"train_loss": -12.054657936096191, "global_step": 402471, "epoch": 2395} {"train_loss": -11.807162284851074, "global_step": 402472, "epoch": 2395} {"train_loss": -11.639949798583984, "global_step": 402473, "epoch": 2395} {"train_loss": -12.129953384399414, "global_step": 402474, "epoch": 2395} {"train_loss": -11.885889053344727, "global_step": 402475, "epoch": 2395} {"train_loss": -11.523308753967285, "global_step": 402476, "epoch": 2395} {"train_loss": -12.277839660644531, "global_step": 402477, "epoch": 2395} {"train_loss": -11.777551651000977, "global_step": 402478, "epoch": 2395} {"train_loss": -11.668878555297852, "global_step": 402479, "epoch": 2395} {"train_loss": -11.921051025390625, "global_step": 402480, "epoch": 2395} {"train_loss": -12.05582046508789, "global_step": 402481, "epoch": 2395} {"train_loss": -11.918643951416016, "global_step": 402482, "epoch": 2395} {"train_loss": -12.216631889343262, "global_step": 402483, "epoch": 2395} {"train_loss": -11.720340728759766, "global_step": 402484, "epoch": 2395} {"train_loss": -12.082653045654297, "global_step": 402485, "epoch": 2395} {"train_loss": -11.981599807739258, "global_step": 402486, "epoch": 2395} {"train_loss": -12.179057121276855, "global_step": 402487, "epoch": 2395} {"train_loss": -12.348828315734863, "global_step": 402488, "epoch": 2395} {"train_loss": -12.049247741699219, "global_step": 402489, "epoch": 2395} {"train_loss": -12.313674926757812, "global_step": 402490, "epoch": 2395} {"train_loss": -12.16440200805664, "global_step": 402491, "epoch": 2395} {"train_loss": -12.20083999633789, "global_step": 402492, "epoch": 2395} {"train_loss": -12.356110572814941, "global_step": 402493, "epoch": 2395} {"train_loss": -12.239362716674805, "global_step": 402494, "epoch": 2395} {"train_loss": -12.469844818115234, "global_step": 402495, "epoch": 2395} {"train_loss": -12.275552749633789, "global_step": 402496, "epoch": 2395} {"train_loss": -12.498289108276367, "global_step": 402497, "epoch": 2395} {"train_loss": -12.344022750854492, "global_step": 402498, "epoch": 2395} {"train_loss": -12.617425918579102, "global_step": 402499, "epoch": 2395} {"train_loss": -12.271774291992188, "global_step": 402500, "epoch": 2395} {"train_loss": -12.387758255004883, "global_step": 402501, "epoch": 2395} {"train_loss": -12.4332857131958, "global_step": 402502, "epoch": 2395} {"train_loss": -12.410551071166992, "global_step": 402503, "epoch": 2395} {"train_loss": -12.457797050476074, "global_step": 402504, "epoch": 2395} {"train_loss": -12.487369537353516, "global_step": 402505, "epoch": 2395} {"train_loss": -12.513289451599121, "global_step": 402506, "epoch": 2395} {"train_loss": -12.322023391723633, "global_step": 402507, "epoch": 2395} {"train_loss": -12.593635559082031, "global_step": 402508, "epoch": 2395} {"train_loss": -12.42249870300293, "global_step": 402509, "epoch": 2395} {"train_loss": -12.63988208770752, "global_step": 402510, "epoch": 2395} {"train_loss": -12.441537857055664, "global_step": 402511, "epoch": 2395} {"train_loss": -12.611572265625, "global_step": 402512, "epoch": 2395} {"train_loss": -12.411171913146973, "global_step": 402513, "epoch": 2395} {"train_loss": -12.211877822875977, "global_step": 402514, "epoch": 2395} {"train_loss": -12.395403861999512, "global_step": 402515, "epoch": 2395} {"train_loss": -12.157074928283691, "global_step": 402516, "epoch": 2395} {"train_loss": -12.3917875289917, "global_step": 402517, "epoch": 2395} {"train_loss": -12.243146896362305, "global_step": 402518, "epoch": 2395} {"train_loss": -12.261697769165039, "global_step": 402519, "epoch": 2395} {"train_loss": -12.620893478393555, "global_step": 402520, "epoch": 2395} {"train_loss": -12.328718185424805, "global_step": 402521, "epoch": 2395} {"train_loss": -12.70077896118164, "global_step": 402522, "epoch": 2395} {"train_loss": -12.319616317749023, "global_step": 402523, "epoch": 2395} {"train_loss": -12.486089706420898, "global_step": 402524, "epoch": 2395} {"train_loss": -12.42922306060791, "global_step": 402525, "epoch": 2395} {"train_loss": -12.12228775024414, "global_step": 402526, "epoch": 2395} {"train_loss": -11.867641182172866, "global_step": 402527, "epoch": 2395, "val_loss": 301677.34375, "train_action_mse_error": 1.490630865097046} {"train_loss": -11.848392486572266, "global_step": 402528, "epoch": 2396} {"train_loss": -12.034370422363281, "global_step": 402529, "epoch": 2396} {"train_loss": -12.42496109008789, "global_step": 402530, "epoch": 2396} {"train_loss": -12.262170791625977, "global_step": 402531, "epoch": 2396} {"train_loss": -12.338705062866211, "global_step": 402532, "epoch": 2396} {"train_loss": -12.251537322998047, "global_step": 402533, "epoch": 2396} {"train_loss": -12.218225479125977, "global_step": 402534, "epoch": 2396} {"train_loss": -12.414213180541992, "global_step": 402535, "epoch": 2396} {"train_loss": -12.28427791595459, "global_step": 402536, "epoch": 2396} {"train_loss": -12.094586372375488, "global_step": 402537, "epoch": 2396} {"train_loss": -12.55274486541748, "global_step": 402538, "epoch": 2396} {"train_loss": -12.202470779418945, "global_step": 402539, "epoch": 2396} {"train_loss": -12.749341011047363, "global_step": 402540, "epoch": 2396} {"train_loss": -12.396696090698242, "global_step": 402541, "epoch": 2396} {"train_loss": -12.327690124511719, "global_step": 402542, "epoch": 2396} {"train_loss": -12.275445938110352, "global_step": 402543, "epoch": 2396} {"train_loss": -12.415637016296387, "global_step": 402544, "epoch": 2396} {"train_loss": -12.513784408569336, "global_step": 402545, "epoch": 2396} {"train_loss": -12.515654563903809, "global_step": 402546, "epoch": 2396} {"train_loss": -12.534358978271484, "global_step": 402547, "epoch": 2396} {"train_loss": -12.384754180908203, "global_step": 402548, "epoch": 2396} {"train_loss": -12.127408981323242, "global_step": 402549, "epoch": 2396} {"train_loss": -12.339473724365234, "global_step": 402550, "epoch": 2396} {"train_loss": -11.94949722290039, "global_step": 402551, "epoch": 2396} {"train_loss": -11.586308479309082, "global_step": 402552, "epoch": 2396} {"train_loss": -11.981071472167969, "global_step": 402553, "epoch": 2396} {"train_loss": -11.580618858337402, "global_step": 402554, "epoch": 2396} {"train_loss": -11.516129493713379, "global_step": 402555, "epoch": 2396} {"train_loss": -12.015508651733398, "global_step": 402556, "epoch": 2396} {"train_loss": -11.366426467895508, "global_step": 402557, "epoch": 2396} {"train_loss": -12.310476303100586, "global_step": 402558, "epoch": 2396} {"train_loss": -11.86818790435791, "global_step": 402559, "epoch": 2396} {"train_loss": -10.98391342163086, "global_step": 402560, "epoch": 2396} {"train_loss": -11.374733924865723, "global_step": 402561, "epoch": 2396} {"train_loss": -9.908302307128906, "global_step": 402562, "epoch": 2396} {"train_loss": -11.692451477050781, "global_step": 402563, "epoch": 2396} {"train_loss": -9.63172721862793, "global_step": 402564, "epoch": 2396} {"train_loss": -11.158919334411621, "global_step": 402565, "epoch": 2396} {"train_loss": -10.107932090759277, "global_step": 402566, "epoch": 2396} {"train_loss": -11.506824493408203, "global_step": 402567, "epoch": 2396} {"train_loss": -9.452899932861328, "global_step": 402568, "epoch": 2396} {"train_loss": -10.46585464477539, "global_step": 402569, "epoch": 2396} {"train_loss": -10.856793403625488, "global_step": 402570, "epoch": 2396} {"train_loss": -11.15640640258789, "global_step": 402571, "epoch": 2396} {"train_loss": -10.436666488647461, "global_step": 402572, "epoch": 2396} {"train_loss": -11.093326568603516, "global_step": 402573, "epoch": 2396} {"train_loss": -10.519868850708008, "global_step": 402574, "epoch": 2396} {"train_loss": -10.92692756652832, "global_step": 402575, "epoch": 2396} {"train_loss": -10.665731430053711, "global_step": 402576, "epoch": 2396} {"train_loss": -11.239566802978516, "global_step": 402577, "epoch": 2396} {"train_loss": -10.795587539672852, "global_step": 402578, "epoch": 2396} {"train_loss": -11.918750762939453, "global_step": 402579, "epoch": 2396} {"train_loss": -11.322229385375977, "global_step": 402580, "epoch": 2396} {"train_loss": -11.785785675048828, "global_step": 402581, "epoch": 2396} {"train_loss": -11.735522270202637, "global_step": 402582, "epoch": 2396} {"train_loss": -11.640789985656738, "global_step": 402583, "epoch": 2396} {"train_loss": -11.32657527923584, "global_step": 402584, "epoch": 2396} {"train_loss": -11.230074882507324, "global_step": 402585, "epoch": 2396} {"train_loss": -11.700347900390625, "global_step": 402586, "epoch": 2396} {"train_loss": -11.63392162322998, "global_step": 402587, "epoch": 2396} {"train_loss": -11.780569076538086, "global_step": 402588, "epoch": 2396} {"train_loss": -12.155138969421387, "global_step": 402589, "epoch": 2396} {"train_loss": -11.704524040222168, "global_step": 402590, "epoch": 2396} {"train_loss": -11.543427467346191, "global_step": 402591, "epoch": 2396} {"train_loss": -11.896442413330078, "global_step": 402592, "epoch": 2396} {"train_loss": -11.958409309387207, "global_step": 402593, "epoch": 2396} {"train_loss": -12.362624168395996, "global_step": 402594, "epoch": 2396} {"train_loss": -11.92024040222168, "global_step": 402595, "epoch": 2396} {"train_loss": -12.021728515625, "global_step": 402596, "epoch": 2396} {"train_loss": -12.328166007995605, "global_step": 402597, "epoch": 2396} {"train_loss": -12.073451042175293, "global_step": 402598, "epoch": 2396} {"train_loss": -12.444425582885742, "global_step": 402599, "epoch": 2396} {"train_loss": -12.173194885253906, "global_step": 402600, "epoch": 2396} {"train_loss": -12.177101135253906, "global_step": 402601, "epoch": 2396} {"train_loss": -12.249122619628906, "global_step": 402602, "epoch": 2396} {"train_loss": -12.220996856689453, "global_step": 402603, "epoch": 2396} {"train_loss": -12.548758506774902, "global_step": 402604, "epoch": 2396} {"train_loss": -12.055334091186523, "global_step": 402605, "epoch": 2396} {"train_loss": -12.165428161621094, "global_step": 402606, "epoch": 2396} {"train_loss": -12.192032814025879, "global_step": 402607, "epoch": 2396} {"train_loss": -12.310747146606445, "global_step": 402608, "epoch": 2396} {"train_loss": -11.955052375793457, "global_step": 402609, "epoch": 2396} {"train_loss": -12.4522066116333, "global_step": 402610, "epoch": 2396} {"train_loss": -12.207721710205078, "global_step": 402611, "epoch": 2396} {"train_loss": -12.285825729370117, "global_step": 402612, "epoch": 2396} {"train_loss": -12.157709121704102, "global_step": 402613, "epoch": 2396} {"train_loss": -12.36678695678711, "global_step": 402614, "epoch": 2396} {"train_loss": -12.54884147644043, "global_step": 402615, "epoch": 2396} {"train_loss": -12.45739459991455, "global_step": 402616, "epoch": 2396} {"train_loss": -12.334671974182129, "global_step": 402617, "epoch": 2396} {"train_loss": -12.35118293762207, "global_step": 402618, "epoch": 2396} {"train_loss": -12.334599494934082, "global_step": 402619, "epoch": 2396} {"train_loss": -12.538156509399414, "global_step": 402620, "epoch": 2396} {"train_loss": -12.562522888183594, "global_step": 402621, "epoch": 2396} {"train_loss": -12.451118469238281, "global_step": 402622, "epoch": 2396} {"train_loss": -12.498308181762695, "global_step": 402623, "epoch": 2396} {"train_loss": -12.309358596801758, "global_step": 402624, "epoch": 2396} {"train_loss": -12.648448944091797, "global_step": 402625, "epoch": 2396} {"train_loss": -12.569537162780762, "global_step": 402626, "epoch": 2396} {"train_loss": -12.74617862701416, "global_step": 402627, "epoch": 2396} {"train_loss": -12.457087516784668, "global_step": 402628, "epoch": 2396} {"train_loss": -12.679088592529297, "global_step": 402629, "epoch": 2396} {"train_loss": -12.481337547302246, "global_step": 402630, "epoch": 2396} {"train_loss": -12.556639671325684, "global_step": 402631, "epoch": 2396} {"train_loss": -12.527145385742188, "global_step": 402632, "epoch": 2396} {"train_loss": -12.465551376342773, "global_step": 402633, "epoch": 2396} {"train_loss": -12.583115577697754, "global_step": 402634, "epoch": 2396} {"train_loss": -12.632113456726074, "global_step": 402635, "epoch": 2396} {"train_loss": -12.597475051879883, "global_step": 402636, "epoch": 2396} {"train_loss": -12.263051986694336, "global_step": 402637, "epoch": 2396} {"train_loss": -12.422119140625, "global_step": 402638, "epoch": 2396} {"train_loss": -12.580187797546387, "global_step": 402639, "epoch": 2396} {"train_loss": -12.432328224182129, "global_step": 402640, "epoch": 2396} {"train_loss": -12.542719841003418, "global_step": 402641, "epoch": 2396} {"train_loss": -12.42254638671875, "global_step": 402642, "epoch": 2396} {"train_loss": -12.548131942749023, "global_step": 402643, "epoch": 2396} {"train_loss": -12.23802375793457, "global_step": 402644, "epoch": 2396} {"train_loss": -12.685274124145508, "global_step": 402645, "epoch": 2396} {"train_loss": -12.127894401550293, "global_step": 402646, "epoch": 2396} {"train_loss": -12.095001220703125, "global_step": 402647, "epoch": 2396} {"train_loss": -12.690921783447266, "global_step": 402648, "epoch": 2396} {"train_loss": -11.813899993896484, "global_step": 402649, "epoch": 2396} {"train_loss": -12.37213134765625, "global_step": 402650, "epoch": 2396} {"train_loss": -12.35897445678711, "global_step": 402651, "epoch": 2396} {"train_loss": -12.031764030456543, "global_step": 402652, "epoch": 2396} {"train_loss": -12.342514991760254, "global_step": 402653, "epoch": 2396} {"train_loss": -12.49134349822998, "global_step": 402654, "epoch": 2396} {"train_loss": -12.00102424621582, "global_step": 402655, "epoch": 2396} {"train_loss": -12.129915237426758, "global_step": 402656, "epoch": 2396} {"train_loss": -12.231781005859375, "global_step": 402657, "epoch": 2396} {"train_loss": -12.407445907592773, "global_step": 402658, "epoch": 2396} {"train_loss": -12.468295097351074, "global_step": 402659, "epoch": 2396} {"train_loss": -12.47581672668457, "global_step": 402660, "epoch": 2396} {"train_loss": -12.364998817443848, "global_step": 402661, "epoch": 2396} {"train_loss": -12.378668785095215, "global_step": 402662, "epoch": 2396} {"train_loss": -12.595304489135742, "global_step": 402663, "epoch": 2396} {"train_loss": -12.200502395629883, "global_step": 402664, "epoch": 2396} {"train_loss": -12.202066421508789, "global_step": 402665, "epoch": 2396} {"train_loss": -12.354759216308594, "global_step": 402666, "epoch": 2396} {"train_loss": -12.55935287475586, "global_step": 402667, "epoch": 2396} {"train_loss": -12.463296890258789, "global_step": 402668, "epoch": 2396} {"train_loss": -12.400742530822754, "global_step": 402669, "epoch": 2396} {"train_loss": -12.367555618286133, "global_step": 402670, "epoch": 2396} {"train_loss": -12.448827743530273, "global_step": 402671, "epoch": 2396} {"train_loss": -12.358938217163086, "global_step": 402672, "epoch": 2396} {"train_loss": -12.345373153686523, "global_step": 402673, "epoch": 2396} {"train_loss": -12.010242462158203, "global_step": 402674, "epoch": 2396} {"train_loss": -11.98878288269043, "global_step": 402675, "epoch": 2396} {"train_loss": -11.062637329101562, "global_step": 402676, "epoch": 2396} {"train_loss": -11.925971031188965, "global_step": 402677, "epoch": 2396} {"train_loss": -10.863277435302734, "global_step": 402678, "epoch": 2396} {"train_loss": -11.464211463928223, "global_step": 402679, "epoch": 2396} {"train_loss": -8.93317985534668, "global_step": 402680, "epoch": 2396} {"train_loss": -8.184836387634277, "global_step": 402681, "epoch": 2396} {"train_loss": -8.364861488342285, "global_step": 402682, "epoch": 2396} {"train_loss": -8.710551261901855, "global_step": 402683, "epoch": 2396} {"train_loss": -9.910730361938477, "global_step": 402684, "epoch": 2396} {"train_loss": -10.181009292602539, "global_step": 402685, "epoch": 2396} {"train_loss": -9.142097473144531, "global_step": 402686, "epoch": 2396} {"train_loss": -11.23428726196289, "global_step": 402687, "epoch": 2396} {"train_loss": -11.095769882202148, "global_step": 402688, "epoch": 2396} {"train_loss": -10.851024627685547, "global_step": 402689, "epoch": 2396} {"train_loss": -11.726991653442383, "global_step": 402690, "epoch": 2396} {"train_loss": -10.015572547912598, "global_step": 402691, "epoch": 2396} {"train_loss": -11.787799835205078, "global_step": 402692, "epoch": 2396} {"train_loss": -10.37129020690918, "global_step": 402693, "epoch": 2396} {"train_loss": -11.648269653320312, "global_step": 402694, "epoch": 2396} {"train_loss": -11.848705484753562, "global_step": 402695, "epoch": 2396, "val_loss": 296544.0} {"train_loss": -11.42396068572998, "global_step": 402696, "epoch": 2397} {"train_loss": -10.381721496582031, "global_step": 402697, "epoch": 2397} {"train_loss": -11.080635070800781, "global_step": 402698, "epoch": 2397} {"train_loss": -11.367071151733398, "global_step": 402699, "epoch": 2397} {"train_loss": -11.532663345336914, "global_step": 402700, "epoch": 2397} {"train_loss": -11.291617393493652, "global_step": 402701, "epoch": 2397} {"train_loss": -10.498605728149414, "global_step": 402702, "epoch": 2397} {"train_loss": -10.949441909790039, "global_step": 402703, "epoch": 2397} {"train_loss": -11.079839706420898, "global_step": 402704, "epoch": 2397} {"train_loss": -11.186603546142578, "global_step": 402705, "epoch": 2397} {"train_loss": -10.959159851074219, "global_step": 402706, "epoch": 2397} {"train_loss": -10.847246170043945, "global_step": 402707, "epoch": 2397} {"train_loss": -11.271728515625, "global_step": 402708, "epoch": 2397} {"train_loss": -11.67388916015625, "global_step": 402709, "epoch": 2397} {"train_loss": -11.263449668884277, "global_step": 402710, "epoch": 2397} {"train_loss": -11.766009330749512, "global_step": 402711, "epoch": 2397} {"train_loss": -10.771997451782227, "global_step": 402712, "epoch": 2397} {"train_loss": -11.600286483764648, "global_step": 402713, "epoch": 2397} {"train_loss": -10.924160957336426, "global_step": 402714, "epoch": 2397} {"train_loss": -11.31613540649414, "global_step": 402715, "epoch": 2397} {"train_loss": -11.439590454101562, "global_step": 402716, "epoch": 2397} {"train_loss": -11.723299980163574, "global_step": 402717, "epoch": 2397} {"train_loss": -11.718486785888672, "global_step": 402718, "epoch": 2397} {"train_loss": -11.653846740722656, "global_step": 402719, "epoch": 2397} {"train_loss": -11.963468551635742, "global_step": 402720, "epoch": 2397} {"train_loss": -11.47661018371582, "global_step": 402721, "epoch": 2397} {"train_loss": -11.845836639404297, "global_step": 402722, "epoch": 2397} {"train_loss": -11.872108459472656, "global_step": 402723, "epoch": 2397} {"train_loss": -11.118654251098633, "global_step": 402724, "epoch": 2397} {"train_loss": -12.111936569213867, "global_step": 402725, "epoch": 2397} {"train_loss": -11.665895462036133, "global_step": 402726, "epoch": 2397} {"train_loss": -12.071195602416992, "global_step": 402727, "epoch": 2397} {"train_loss": -12.123360633850098, "global_step": 402728, "epoch": 2397} {"train_loss": -11.796791076660156, "global_step": 402729, "epoch": 2397} {"train_loss": -12.324746131896973, "global_step": 402730, "epoch": 2397} {"train_loss": -11.981856346130371, "global_step": 402731, "epoch": 2397} {"train_loss": -12.392918586730957, "global_step": 402732, "epoch": 2397} {"train_loss": -11.945917129516602, "global_step": 402733, "epoch": 2397} {"train_loss": -11.784608840942383, "global_step": 402734, "epoch": 2397} {"train_loss": -12.058727264404297, "global_step": 402735, "epoch": 2397} {"train_loss": -11.856340408325195, "global_step": 402736, "epoch": 2397} {"train_loss": -12.013690948486328, "global_step": 402737, "epoch": 2397} {"train_loss": -11.733870506286621, "global_step": 402738, "epoch": 2397} {"train_loss": -11.91196060180664, "global_step": 402739, "epoch": 2397} {"train_loss": -12.035874366760254, "global_step": 402740, "epoch": 2397} {"train_loss": -12.511951446533203, "global_step": 402741, "epoch": 2397} {"train_loss": -11.96051025390625, "global_step": 402742, "epoch": 2397} {"train_loss": -12.073774337768555, "global_step": 402743, "epoch": 2397} {"train_loss": -12.325517654418945, "global_step": 402744, "epoch": 2397} {"train_loss": -11.970671653747559, "global_step": 402745, "epoch": 2397} {"train_loss": -12.352723121643066, "global_step": 402746, "epoch": 2397} {"train_loss": -11.886913299560547, "global_step": 402747, "epoch": 2397} {"train_loss": -12.234100341796875, "global_step": 402748, "epoch": 2397} {"train_loss": -11.957740783691406, "global_step": 402749, "epoch": 2397} {"train_loss": -12.364251136779785, "global_step": 402750, "epoch": 2397} {"train_loss": -12.211624145507812, "global_step": 402751, "epoch": 2397} {"train_loss": -12.341421127319336, "global_step": 402752, "epoch": 2397} {"train_loss": -12.20051383972168, "global_step": 402753, "epoch": 2397} {"train_loss": -12.270904541015625, "global_step": 402754, "epoch": 2397} {"train_loss": -12.327716827392578, "global_step": 402755, "epoch": 2397} {"train_loss": -11.901744842529297, "global_step": 402756, "epoch": 2397} {"train_loss": -12.498115539550781, "global_step": 402757, "epoch": 2397} {"train_loss": -12.008922576904297, "global_step": 402758, "epoch": 2397} {"train_loss": -12.403817176818848, "global_step": 402759, "epoch": 2397} {"train_loss": -12.304615020751953, "global_step": 402760, "epoch": 2397} {"train_loss": -11.799073219299316, "global_step": 402761, "epoch": 2397} {"train_loss": -12.429588317871094, "global_step": 402762, "epoch": 2397} {"train_loss": -11.988502502441406, "global_step": 402763, "epoch": 2397} {"train_loss": -12.459957122802734, "global_step": 402764, "epoch": 2397} {"train_loss": -12.564871788024902, "global_step": 402765, "epoch": 2397} {"train_loss": -12.105325698852539, "global_step": 402766, "epoch": 2397} {"train_loss": -12.569928169250488, "global_step": 402767, "epoch": 2397} {"train_loss": -12.450637817382812, "global_step": 402768, "epoch": 2397} {"train_loss": -12.623416900634766, "global_step": 402769, "epoch": 2397} {"train_loss": -12.54419231414795, "global_step": 402770, "epoch": 2397} {"train_loss": -12.449651718139648, "global_step": 402771, "epoch": 2397} {"train_loss": -12.4822998046875, "global_step": 402772, "epoch": 2397} {"train_loss": -12.37492847442627, "global_step": 402773, "epoch": 2397} {"train_loss": -12.20988655090332, "global_step": 402774, "epoch": 2397} {"train_loss": -12.38460922241211, "global_step": 402775, "epoch": 2397} {"train_loss": -12.355554580688477, "global_step": 402776, "epoch": 2397} {"train_loss": -12.077836036682129, "global_step": 402777, "epoch": 2397} {"train_loss": -11.488750457763672, "global_step": 402778, "epoch": 2397} {"train_loss": -11.573501586914062, "global_step": 402779, "epoch": 2397} {"train_loss": -12.124778747558594, "global_step": 402780, "epoch": 2397} {"train_loss": -12.153189659118652, "global_step": 402781, "epoch": 2397} {"train_loss": -12.486675262451172, "global_step": 402782, "epoch": 2397} {"train_loss": -11.686351776123047, "global_step": 402783, "epoch": 2397} {"train_loss": -12.749454498291016, "global_step": 402784, "epoch": 2397} {"train_loss": -12.090683937072754, "global_step": 402785, "epoch": 2397} {"train_loss": -12.482847213745117, "global_step": 402786, "epoch": 2397} {"train_loss": -11.669402122497559, "global_step": 402787, "epoch": 2397} {"train_loss": -12.51728630065918, "global_step": 402788, "epoch": 2397} {"train_loss": -12.054673194885254, "global_step": 402789, "epoch": 2397} {"train_loss": -12.09604263305664, "global_step": 402790, "epoch": 2397} {"train_loss": -12.180520057678223, "global_step": 402791, "epoch": 2397} {"train_loss": -12.08999252319336, "global_step": 402792, "epoch": 2397} {"train_loss": -12.467082023620605, "global_step": 402793, "epoch": 2397} {"train_loss": -12.001452445983887, "global_step": 402794, "epoch": 2397} {"train_loss": -12.09276008605957, "global_step": 402795, "epoch": 2397} {"train_loss": -12.377861022949219, "global_step": 402796, "epoch": 2397} {"train_loss": -12.122102737426758, "global_step": 402797, "epoch": 2397} {"train_loss": -12.262847900390625, "global_step": 402798, "epoch": 2397} {"train_loss": -12.137992858886719, "global_step": 402799, "epoch": 2397} {"train_loss": -12.50128173828125, "global_step": 402800, "epoch": 2397} {"train_loss": -11.906760215759277, "global_step": 402801, "epoch": 2397} {"train_loss": -12.35594654083252, "global_step": 402802, "epoch": 2397} {"train_loss": -12.233803749084473, "global_step": 402803, "epoch": 2397} {"train_loss": -12.57768440246582, "global_step": 402804, "epoch": 2397} {"train_loss": -12.136761665344238, "global_step": 402805, "epoch": 2397} {"train_loss": -12.652711868286133, "global_step": 402806, "epoch": 2397} {"train_loss": -11.996810913085938, "global_step": 402807, "epoch": 2397} {"train_loss": -12.009688377380371, "global_step": 402808, "epoch": 2397} {"train_loss": -12.637076377868652, "global_step": 402809, "epoch": 2397} {"train_loss": -12.357110977172852, "global_step": 402810, "epoch": 2397} {"train_loss": -12.098573684692383, "global_step": 402811, "epoch": 2397} {"train_loss": -12.415395736694336, "global_step": 402812, "epoch": 2397} {"train_loss": -12.239236831665039, "global_step": 402813, "epoch": 2397} {"train_loss": -11.802188873291016, "global_step": 402814, "epoch": 2397} {"train_loss": -12.391890525817871, "global_step": 402815, "epoch": 2397} {"train_loss": -11.386207580566406, "global_step": 402816, "epoch": 2397} {"train_loss": -12.398735046386719, "global_step": 402817, "epoch": 2397} {"train_loss": -12.167608261108398, "global_step": 402818, "epoch": 2397} {"train_loss": -11.78428840637207, "global_step": 402819, "epoch": 2397} {"train_loss": -12.34769058227539, "global_step": 402820, "epoch": 2397} {"train_loss": -12.14729118347168, "global_step": 402821, "epoch": 2397} {"train_loss": -11.342255592346191, "global_step": 402822, "epoch": 2397} {"train_loss": -12.617568969726562, "global_step": 402823, "epoch": 2397} {"train_loss": -11.751463890075684, "global_step": 402824, "epoch": 2397} {"train_loss": -11.684511184692383, "global_step": 402825, "epoch": 2397} {"train_loss": -12.303049087524414, "global_step": 402826, "epoch": 2397} {"train_loss": -11.664067268371582, "global_step": 402827, "epoch": 2397} {"train_loss": -12.171360969543457, "global_step": 402828, "epoch": 2397} {"train_loss": -11.514806747436523, "global_step": 402829, "epoch": 2397} {"train_loss": -11.263187408447266, "global_step": 402830, "epoch": 2397} {"train_loss": -11.63227653503418, "global_step": 402831, "epoch": 2397} {"train_loss": -11.986270904541016, "global_step": 402832, "epoch": 2397} {"train_loss": -11.738065719604492, "global_step": 402833, "epoch": 2397} {"train_loss": -11.777040481567383, "global_step": 402834, "epoch": 2397} {"train_loss": -11.330138206481934, "global_step": 402835, "epoch": 2397} {"train_loss": -11.998088836669922, "global_step": 402836, "epoch": 2397} {"train_loss": -11.0951509475708, "global_step": 402837, "epoch": 2397} {"train_loss": -11.836276054382324, "global_step": 402838, "epoch": 2397} {"train_loss": -12.204534530639648, "global_step": 402839, "epoch": 2397} {"train_loss": -11.609596252441406, "global_step": 402840, "epoch": 2397} {"train_loss": -12.203782081604004, "global_step": 402841, "epoch": 2397} {"train_loss": -11.469151496887207, "global_step": 402842, "epoch": 2397} {"train_loss": -12.19119644165039, "global_step": 402843, "epoch": 2397} {"train_loss": -12.398027420043945, "global_step": 402844, "epoch": 2397} {"train_loss": -12.30282211303711, "global_step": 402845, "epoch": 2397} {"train_loss": -12.27680778503418, "global_step": 402846, "epoch": 2397} {"train_loss": -11.933761596679688, "global_step": 402847, "epoch": 2397} {"train_loss": -11.93795394897461, "global_step": 402848, "epoch": 2397} {"train_loss": -12.376688957214355, "global_step": 402849, "epoch": 2397} {"train_loss": -12.204023361206055, "global_step": 402850, "epoch": 2397} {"train_loss": -11.791895866394043, "global_step": 402851, "epoch": 2397} {"train_loss": -12.432679176330566, "global_step": 402852, "epoch": 2397} {"train_loss": -12.182235717773438, "global_step": 402853, "epoch": 2397} {"train_loss": -12.294729232788086, "global_step": 402854, "epoch": 2397} {"train_loss": -12.171618461608887, "global_step": 402855, "epoch": 2397} {"train_loss": -12.104827880859375, "global_step": 402856, "epoch": 2397} {"train_loss": -12.132442474365234, "global_step": 402857, "epoch": 2397} {"train_loss": -12.238723754882812, "global_step": 402858, "epoch": 2397} {"train_loss": -12.106943130493164, "global_step": 402859, "epoch": 2397} {"train_loss": -12.286075592041016, "global_step": 402860, "epoch": 2397} {"train_loss": -12.22153091430664, "global_step": 402861, "epoch": 2397} {"train_loss": -12.181295394897461, "global_step": 402862, "epoch": 2397} {"train_loss": -11.979213271822248, "global_step": 402863, "epoch": 2397, "val_loss": 302568.15625} {"train_loss": -11.999246597290039, "global_step": 402864, "epoch": 2398} {"train_loss": -10.783906936645508, "global_step": 402865, "epoch": 2398} {"train_loss": -12.106701850891113, "global_step": 402866, "epoch": 2398} {"train_loss": -11.668298721313477, "global_step": 402867, "epoch": 2398} {"train_loss": -11.382951736450195, "global_step": 402868, "epoch": 2398} {"train_loss": -11.328275680541992, "global_step": 402869, "epoch": 2398} {"train_loss": -12.34720230102539, "global_step": 402870, "epoch": 2398} {"train_loss": -10.797651290893555, "global_step": 402871, "epoch": 2398} {"train_loss": -12.051128387451172, "global_step": 402872, "epoch": 2398} {"train_loss": -11.537853240966797, "global_step": 402873, "epoch": 2398} {"train_loss": -12.048900604248047, "global_step": 402874, "epoch": 2398} {"train_loss": -11.98621654510498, "global_step": 402875, "epoch": 2398} {"train_loss": -11.54143238067627, "global_step": 402876, "epoch": 2398} {"train_loss": -12.038864135742188, "global_step": 402877, "epoch": 2398} {"train_loss": -12.093995094299316, "global_step": 402878, "epoch": 2398} {"train_loss": -10.951287269592285, "global_step": 402879, "epoch": 2398} {"train_loss": -11.719392776489258, "global_step": 402880, "epoch": 2398} {"train_loss": -10.921406745910645, "global_step": 402881, "epoch": 2398} {"train_loss": -12.087904930114746, "global_step": 402882, "epoch": 2398} {"train_loss": -11.251879692077637, "global_step": 402883, "epoch": 2398} {"train_loss": -11.281717300415039, "global_step": 402884, "epoch": 2398} {"train_loss": -11.357160568237305, "global_step": 402885, "epoch": 2398} {"train_loss": -10.661609649658203, "global_step": 402886, "epoch": 2398} {"train_loss": -11.81576156616211, "global_step": 402887, "epoch": 2398} {"train_loss": -10.929693222045898, "global_step": 402888, "epoch": 2398} {"train_loss": -10.990784645080566, "global_step": 402889, "epoch": 2398} {"train_loss": -10.682588577270508, "global_step": 402890, "epoch": 2398} {"train_loss": -11.312095642089844, "global_step": 402891, "epoch": 2398} {"train_loss": -11.775237083435059, "global_step": 402892, "epoch": 2398} {"train_loss": -11.576689720153809, "global_step": 402893, "epoch": 2398} {"train_loss": -11.783533096313477, "global_step": 402894, "epoch": 2398} {"train_loss": -11.664806365966797, "global_step": 402895, "epoch": 2398} {"train_loss": -11.442867279052734, "global_step": 402896, "epoch": 2398} {"train_loss": -11.993754386901855, "global_step": 402897, "epoch": 2398} {"train_loss": -11.412176132202148, "global_step": 402898, "epoch": 2398} {"train_loss": -11.582767486572266, "global_step": 402899, "epoch": 2398} {"train_loss": -11.938247680664062, "global_step": 402900, "epoch": 2398} {"train_loss": -11.48702621459961, "global_step": 402901, "epoch": 2398} {"train_loss": -11.901649475097656, "global_step": 402902, "epoch": 2398} {"train_loss": -12.048105239868164, "global_step": 402903, "epoch": 2398} {"train_loss": -11.441673278808594, "global_step": 402904, "epoch": 2398} {"train_loss": -12.266891479492188, "global_step": 402905, "epoch": 2398} {"train_loss": -11.408347129821777, "global_step": 402906, "epoch": 2398} {"train_loss": -12.493770599365234, "global_step": 402907, "epoch": 2398} {"train_loss": -12.097574234008789, "global_step": 402908, "epoch": 2398} {"train_loss": -12.085606575012207, "global_step": 402909, "epoch": 2398} {"train_loss": -12.234786987304688, "global_step": 402910, "epoch": 2398} {"train_loss": -11.66322135925293, "global_step": 402911, "epoch": 2398} {"train_loss": -12.20626163482666, "global_step": 402912, "epoch": 2398} {"train_loss": -11.989120483398438, "global_step": 402913, "epoch": 2398} {"train_loss": -12.074374198913574, "global_step": 402914, "epoch": 2398} {"train_loss": -12.460016250610352, "global_step": 402915, "epoch": 2398} {"train_loss": -12.43624496459961, "global_step": 402916, "epoch": 2398} {"train_loss": -11.984834671020508, "global_step": 402917, "epoch": 2398} {"train_loss": -12.329132080078125, "global_step": 402918, "epoch": 2398} {"train_loss": -12.001395225524902, "global_step": 402919, "epoch": 2398} {"train_loss": -12.42225170135498, "global_step": 402920, "epoch": 2398} {"train_loss": -12.266446113586426, "global_step": 402921, "epoch": 2398} {"train_loss": -12.44439697265625, "global_step": 402922, "epoch": 2398} {"train_loss": -12.299505233764648, "global_step": 402923, "epoch": 2398} {"train_loss": -12.54916763305664, "global_step": 402924, "epoch": 2398} {"train_loss": -12.217955589294434, "global_step": 402925, "epoch": 2398} {"train_loss": -12.468780517578125, "global_step": 402926, "epoch": 2398} {"train_loss": -12.150989532470703, "global_step": 402927, "epoch": 2398} {"train_loss": -12.437573432922363, "global_step": 402928, "epoch": 2398} {"train_loss": -12.460391998291016, "global_step": 402929, "epoch": 2398} {"train_loss": -12.606134414672852, "global_step": 402930, "epoch": 2398} {"train_loss": -12.60459041595459, "global_step": 402931, "epoch": 2398} {"train_loss": -12.43658447265625, "global_step": 402932, "epoch": 2398} {"train_loss": -12.717499732971191, "global_step": 402933, "epoch": 2398} {"train_loss": -12.4912109375, "global_step": 402934, "epoch": 2398} {"train_loss": -12.16771125793457, "global_step": 402935, "epoch": 2398} {"train_loss": -12.568021774291992, "global_step": 402936, "epoch": 2398} {"train_loss": -12.33902645111084, "global_step": 402937, "epoch": 2398} {"train_loss": -12.473007202148438, "global_step": 402938, "epoch": 2398} {"train_loss": -12.62718677520752, "global_step": 402939, "epoch": 2398} {"train_loss": -12.514784812927246, "global_step": 402940, "epoch": 2398} {"train_loss": -12.56264591217041, "global_step": 402941, "epoch": 2398} {"train_loss": -12.703136444091797, "global_step": 402942, "epoch": 2398} {"train_loss": -12.428398132324219, "global_step": 402943, "epoch": 2398} {"train_loss": -12.75509262084961, "global_step": 402944, "epoch": 2398} {"train_loss": -12.417964935302734, "global_step": 402945, "epoch": 2398} {"train_loss": -12.431842803955078, "global_step": 402946, "epoch": 2398} {"train_loss": -12.729832649230957, "global_step": 402947, "epoch": 2398} {"train_loss": -12.488097190856934, "global_step": 402948, "epoch": 2398} {"train_loss": -12.513442993164062, "global_step": 402949, "epoch": 2398} {"train_loss": -12.590616226196289, "global_step": 402950, "epoch": 2398} {"train_loss": -12.198834419250488, "global_step": 402951, "epoch": 2398} {"train_loss": -11.718818664550781, "global_step": 402952, "epoch": 2398} {"train_loss": -12.47489070892334, "global_step": 402953, "epoch": 2398} {"train_loss": -12.180195808410645, "global_step": 402954, "epoch": 2398} {"train_loss": -12.355751991271973, "global_step": 402955, "epoch": 2398} {"train_loss": -12.278377532958984, "global_step": 402956, "epoch": 2398} {"train_loss": -12.146553039550781, "global_step": 402957, "epoch": 2398} {"train_loss": -12.519540786743164, "global_step": 402958, "epoch": 2398} {"train_loss": -11.593513488769531, "global_step": 402959, "epoch": 2398} {"train_loss": -11.849874496459961, "global_step": 402960, "epoch": 2398} {"train_loss": -12.481317520141602, "global_step": 402961, "epoch": 2398} {"train_loss": -12.190705299377441, "global_step": 402962, "epoch": 2398} {"train_loss": -12.420913696289062, "global_step": 402963, "epoch": 2398} {"train_loss": -12.423407554626465, "global_step": 402964, "epoch": 2398} {"train_loss": -12.185115814208984, "global_step": 402965, "epoch": 2398} {"train_loss": -12.349205017089844, "global_step": 402966, "epoch": 2398} {"train_loss": -12.120626449584961, "global_step": 402967, "epoch": 2398} {"train_loss": -12.135396957397461, "global_step": 402968, "epoch": 2398} {"train_loss": -11.45881175994873, "global_step": 402969, "epoch": 2398} {"train_loss": -11.25429916381836, "global_step": 402970, "epoch": 2398} {"train_loss": -12.458154678344727, "global_step": 402971, "epoch": 2398} {"train_loss": -11.159954071044922, "global_step": 402972, "epoch": 2398} {"train_loss": -12.423730850219727, "global_step": 402973, "epoch": 2398} {"train_loss": -10.687061309814453, "global_step": 402974, "epoch": 2398} {"train_loss": -11.05707836151123, "global_step": 402975, "epoch": 2398} {"train_loss": -10.877729415893555, "global_step": 402976, "epoch": 2398} {"train_loss": -10.63140869140625, "global_step": 402977, "epoch": 2398} {"train_loss": -11.984701156616211, "global_step": 402978, "epoch": 2398} {"train_loss": -11.675942420959473, "global_step": 402979, "epoch": 2398} {"train_loss": -11.72154426574707, "global_step": 402980, "epoch": 2398} {"train_loss": -12.03923511505127, "global_step": 402981, "epoch": 2398} {"train_loss": -11.751153945922852, "global_step": 402982, "epoch": 2398} {"train_loss": -12.171258926391602, "global_step": 402983, "epoch": 2398} {"train_loss": -11.573606491088867, "global_step": 402984, "epoch": 2398} {"train_loss": -12.157690048217773, "global_step": 402985, "epoch": 2398} {"train_loss": -11.820781707763672, "global_step": 402986, "epoch": 2398} {"train_loss": -11.645323753356934, "global_step": 402987, "epoch": 2398} {"train_loss": -12.540143013000488, "global_step": 402988, "epoch": 2398} {"train_loss": -12.1806640625, "global_step": 402989, "epoch": 2398} {"train_loss": -12.506845474243164, "global_step": 402990, "epoch": 2398} {"train_loss": -12.019186019897461, "global_step": 402991, "epoch": 2398} {"train_loss": -12.160172462463379, "global_step": 402992, "epoch": 2398} {"train_loss": -12.357823371887207, "global_step": 402993, "epoch": 2398} {"train_loss": -12.314237594604492, "global_step": 402994, "epoch": 2398} {"train_loss": -12.356769561767578, "global_step": 402995, "epoch": 2398} {"train_loss": -12.348226547241211, "global_step": 402996, "epoch": 2398} {"train_loss": -12.06278133392334, "global_step": 402997, "epoch": 2398} {"train_loss": -12.378750801086426, "global_step": 402998, "epoch": 2398} {"train_loss": -12.33678913116455, "global_step": 402999, "epoch": 2398} {"train_loss": -11.78358268737793, "global_step": 403000, "epoch": 2398} {"train_loss": -11.774772644042969, "global_step": 403001, "epoch": 2398} {"train_loss": -11.861188888549805, "global_step": 403002, "epoch": 2398} {"train_loss": -9.908537864685059, "global_step": 403003, "epoch": 2398} {"train_loss": -12.003610610961914, "global_step": 403004, "epoch": 2398} {"train_loss": -11.907440185546875, "global_step": 403005, "epoch": 2398} {"train_loss": -11.777849197387695, "global_step": 403006, "epoch": 2398} {"train_loss": -12.347861289978027, "global_step": 403007, "epoch": 2398} {"train_loss": -12.18826675415039, "global_step": 403008, "epoch": 2398} {"train_loss": -11.811716079711914, "global_step": 403009, "epoch": 2398} {"train_loss": -12.592940330505371, "global_step": 403010, "epoch": 2398} {"train_loss": -11.74604320526123, "global_step": 403011, "epoch": 2398} {"train_loss": -12.337947845458984, "global_step": 403012, "epoch": 2398} {"train_loss": -12.494180679321289, "global_step": 403013, "epoch": 2398} {"train_loss": -12.333727836608887, "global_step": 403014, "epoch": 2398} {"train_loss": -12.093111991882324, "global_step": 403015, "epoch": 2398} {"train_loss": -12.184915542602539, "global_step": 403016, "epoch": 2398} {"train_loss": -12.167118072509766, "global_step": 403017, "epoch": 2398} {"train_loss": -12.327872276306152, "global_step": 403018, "epoch": 2398} {"train_loss": -12.356987953186035, "global_step": 403019, "epoch": 2398} {"train_loss": -12.4058256149292, "global_step": 403020, "epoch": 2398} {"train_loss": -12.347341537475586, "global_step": 403021, "epoch": 2398} {"train_loss": -12.531179428100586, "global_step": 403022, "epoch": 2398} {"train_loss": -12.770596504211426, "global_step": 403023, "epoch": 2398} {"train_loss": -12.69900131225586, "global_step": 403024, "epoch": 2398} {"train_loss": -12.507410049438477, "global_step": 403025, "epoch": 2398} {"train_loss": -12.680047988891602, "global_step": 403026, "epoch": 2398} {"train_loss": -12.359429359436035, "global_step": 403027, "epoch": 2398} {"train_loss": -12.549460411071777, "global_step": 403028, "epoch": 2398} {"train_loss": -12.906636238098145, "global_step": 403029, "epoch": 2398} {"train_loss": -12.385820388793945, "global_step": 403030, "epoch": 2398} {"train_loss": -12.02943662234715, "global_step": 403031, "epoch": 2398, "val_loss": 303401.75} {"train_loss": -12.642843246459961, "global_step": 403032, "epoch": 2399} {"train_loss": -12.11164379119873, "global_step": 403033, "epoch": 2399} {"train_loss": -12.729117393493652, "global_step": 403034, "epoch": 2399} {"train_loss": -12.718215942382812, "global_step": 403035, "epoch": 2399} {"train_loss": -12.752904891967773, "global_step": 403036, "epoch": 2399} {"train_loss": -12.560209274291992, "global_step": 403037, "epoch": 2399} {"train_loss": -12.211307525634766, "global_step": 403038, "epoch": 2399} {"train_loss": -12.512127876281738, "global_step": 403039, "epoch": 2399} {"train_loss": -12.862773895263672, "global_step": 403040, "epoch": 2399} {"train_loss": -12.351188659667969, "global_step": 403041, "epoch": 2399} {"train_loss": -12.476531982421875, "global_step": 403042, "epoch": 2399} {"train_loss": -12.37956714630127, "global_step": 403043, "epoch": 2399} {"train_loss": -12.050361633300781, "global_step": 403044, "epoch": 2399} {"train_loss": -11.818687438964844, "global_step": 403045, "epoch": 2399} {"train_loss": -11.894548416137695, "global_step": 403046, "epoch": 2399} {"train_loss": -12.115523338317871, "global_step": 403047, "epoch": 2399} {"train_loss": -12.067041397094727, "global_step": 403048, "epoch": 2399} {"train_loss": -12.057879447937012, "global_step": 403049, "epoch": 2399} {"train_loss": -12.416299819946289, "global_step": 403050, "epoch": 2399} {"train_loss": -11.995264053344727, "global_step": 403051, "epoch": 2399} {"train_loss": -12.136861801147461, "global_step": 403052, "epoch": 2399} {"train_loss": -11.720016479492188, "global_step": 403053, "epoch": 2399} {"train_loss": -11.605735778808594, "global_step": 403054, "epoch": 2399} {"train_loss": -11.823802947998047, "global_step": 403055, "epoch": 2399} {"train_loss": -12.057123184204102, "global_step": 403056, "epoch": 2399} {"train_loss": -11.826175689697266, "global_step": 403057, "epoch": 2399} {"train_loss": -12.096902847290039, "global_step": 403058, "epoch": 2399} {"train_loss": -12.378437995910645, "global_step": 403059, "epoch": 2399} {"train_loss": -12.255719184875488, "global_step": 403060, "epoch": 2399} {"train_loss": -12.030981063842773, "global_step": 403061, "epoch": 2399} {"train_loss": -12.032063484191895, "global_step": 403062, "epoch": 2399} {"train_loss": -12.040329933166504, "global_step": 403063, "epoch": 2399} {"train_loss": -12.043923377990723, "global_step": 403064, "epoch": 2399} {"train_loss": -11.851600646972656, "global_step": 403065, "epoch": 2399} {"train_loss": -11.735809326171875, "global_step": 403066, "epoch": 2399} {"train_loss": -12.057129859924316, "global_step": 403067, "epoch": 2399} {"train_loss": -11.958452224731445, "global_step": 403068, "epoch": 2399} {"train_loss": -11.509455680847168, "global_step": 403069, "epoch": 2399} {"train_loss": -12.473287582397461, "global_step": 403070, "epoch": 2399} {"train_loss": -11.907804489135742, "global_step": 403071, "epoch": 2399} {"train_loss": -11.90461254119873, "global_step": 403072, "epoch": 2399} {"train_loss": -11.788562774658203, "global_step": 403073, "epoch": 2399} {"train_loss": -11.884057998657227, "global_step": 403074, "epoch": 2399} {"train_loss": -11.719791412353516, "global_step": 403075, "epoch": 2399} {"train_loss": -11.968463897705078, "global_step": 403076, "epoch": 2399} {"train_loss": -12.570024490356445, "global_step": 403077, "epoch": 2399} {"train_loss": -12.053866386413574, "global_step": 403078, "epoch": 2399} {"train_loss": -11.83285903930664, "global_step": 403079, "epoch": 2399} {"train_loss": -12.185369491577148, "global_step": 403080, "epoch": 2399} {"train_loss": -12.336196899414062, "global_step": 403081, "epoch": 2399} {"train_loss": -11.078619956970215, "global_step": 403082, "epoch": 2399} {"train_loss": -12.341273307800293, "global_step": 403083, "epoch": 2399} {"train_loss": -12.101157188415527, "global_step": 403084, "epoch": 2399} {"train_loss": -11.215977668762207, "global_step": 403085, "epoch": 2399} {"train_loss": -11.418882369995117, "global_step": 403086, "epoch": 2399} {"train_loss": -12.056102752685547, "global_step": 403087, "epoch": 2399} {"train_loss": -11.701842308044434, "global_step": 403088, "epoch": 2399} {"train_loss": -11.730951309204102, "global_step": 403089, "epoch": 2399} {"train_loss": -12.13151741027832, "global_step": 403090, "epoch": 2399} {"train_loss": -11.002601623535156, "global_step": 403091, "epoch": 2399} {"train_loss": -11.861703872680664, "global_step": 403092, "epoch": 2399} {"train_loss": -12.179174423217773, "global_step": 403093, "epoch": 2399} {"train_loss": -11.882330894470215, "global_step": 403094, "epoch": 2399} {"train_loss": -11.692840576171875, "global_step": 403095, "epoch": 2399} {"train_loss": -12.323273658752441, "global_step": 403096, "epoch": 2399} {"train_loss": -11.517520904541016, "global_step": 403097, "epoch": 2399} {"train_loss": -12.605268478393555, "global_step": 403098, "epoch": 2399} {"train_loss": -11.760954856872559, "global_step": 403099, "epoch": 2399} {"train_loss": -12.392298698425293, "global_step": 403100, "epoch": 2399} {"train_loss": -12.248003005981445, "global_step": 403101, "epoch": 2399} {"train_loss": -12.330368041992188, "global_step": 403102, "epoch": 2399} {"train_loss": -12.122542381286621, "global_step": 403103, "epoch": 2399} {"train_loss": -12.065652847290039, "global_step": 403104, "epoch": 2399} {"train_loss": -12.006551742553711, "global_step": 403105, "epoch": 2399} {"train_loss": -12.11733627319336, "global_step": 403106, "epoch": 2399} {"train_loss": -12.16969108581543, "global_step": 403107, "epoch": 2399} {"train_loss": -12.170517921447754, "global_step": 403108, "epoch": 2399} {"train_loss": -12.043777465820312, "global_step": 403109, "epoch": 2399} {"train_loss": -12.195545196533203, "global_step": 403110, "epoch": 2399} {"train_loss": -12.277780532836914, "global_step": 403111, "epoch": 2399} {"train_loss": -12.395115852355957, "global_step": 403112, "epoch": 2399} {"train_loss": -12.104413032531738, "global_step": 403113, "epoch": 2399} {"train_loss": -12.272791862487793, "global_step": 403114, "epoch": 2399} {"train_loss": -12.456563949584961, "global_step": 403115, "epoch": 2399} {"train_loss": -12.009588241577148, "global_step": 403116, "epoch": 2399} {"train_loss": -12.199710845947266, "global_step": 403117, "epoch": 2399} {"train_loss": -12.508195877075195, "global_step": 403118, "epoch": 2399} {"train_loss": -12.500097274780273, "global_step": 403119, "epoch": 2399} {"train_loss": -12.371210098266602, "global_step": 403120, "epoch": 2399} {"train_loss": -12.496393203735352, "global_step": 403121, "epoch": 2399} {"train_loss": -12.692870140075684, "global_step": 403122, "epoch": 2399} {"train_loss": -12.555824279785156, "global_step": 403123, "epoch": 2399} {"train_loss": -12.042983055114746, "global_step": 403124, "epoch": 2399} {"train_loss": -12.149028778076172, "global_step": 403125, "epoch": 2399} {"train_loss": -12.7727689743042, "global_step": 403126, "epoch": 2399} {"train_loss": -12.235298156738281, "global_step": 403127, "epoch": 2399} {"train_loss": -12.583512306213379, "global_step": 403128, "epoch": 2399} {"train_loss": -12.283945083618164, "global_step": 403129, "epoch": 2399} {"train_loss": -12.787165641784668, "global_step": 403130, "epoch": 2399} {"train_loss": -12.339162826538086, "global_step": 403131, "epoch": 2399} {"train_loss": -12.551780700683594, "global_step": 403132, "epoch": 2399} {"train_loss": -12.588235855102539, "global_step": 403133, "epoch": 2399} {"train_loss": -12.687921524047852, "global_step": 403134, "epoch": 2399} {"train_loss": -12.77160930633545, "global_step": 403135, "epoch": 2399} {"train_loss": -12.567915916442871, "global_step": 403136, "epoch": 2399} {"train_loss": -12.538644790649414, "global_step": 403137, "epoch": 2399} {"train_loss": -12.662673950195312, "global_step": 403138, "epoch": 2399} {"train_loss": -12.694253921508789, "global_step": 403139, "epoch": 2399} {"train_loss": -12.848760604858398, "global_step": 403140, "epoch": 2399} {"train_loss": -12.51230239868164, "global_step": 403141, "epoch": 2399} {"train_loss": -12.608089447021484, "global_step": 403142, "epoch": 2399} {"train_loss": -12.500561714172363, "global_step": 403143, "epoch": 2399} {"train_loss": -12.720966339111328, "global_step": 403144, "epoch": 2399} {"train_loss": -12.656408309936523, "global_step": 403145, "epoch": 2399} {"train_loss": -12.536612510681152, "global_step": 403146, "epoch": 2399} {"train_loss": -12.744209289550781, "global_step": 403147, "epoch": 2399} {"train_loss": -12.620514869689941, "global_step": 403148, "epoch": 2399} {"train_loss": -12.40888500213623, "global_step": 403149, "epoch": 2399} {"train_loss": -12.311407089233398, "global_step": 403150, "epoch": 2399} {"train_loss": -12.629766464233398, "global_step": 403151, "epoch": 2399} {"train_loss": -12.476442337036133, "global_step": 403152, "epoch": 2399} {"train_loss": -11.633708953857422, "global_step": 403153, "epoch": 2399} {"train_loss": -11.58620548248291, "global_step": 403154, "epoch": 2399} {"train_loss": -11.822840690612793, "global_step": 403155, "epoch": 2399} {"train_loss": -11.796208381652832, "global_step": 403156, "epoch": 2399} {"train_loss": -12.162313461303711, "global_step": 403157, "epoch": 2399} {"train_loss": -11.890946388244629, "global_step": 403158, "epoch": 2399} {"train_loss": -11.107915878295898, "global_step": 403159, "epoch": 2399} {"train_loss": -12.32159423828125, "global_step": 403160, "epoch": 2399} {"train_loss": -11.236625671386719, "global_step": 403161, "epoch": 2399} {"train_loss": -11.747453689575195, "global_step": 403162, "epoch": 2399} {"train_loss": -12.169246673583984, "global_step": 403163, "epoch": 2399} {"train_loss": -11.773393630981445, "global_step": 403164, "epoch": 2399} {"train_loss": -11.342484474182129, "global_step": 403165, "epoch": 2399} {"train_loss": -12.48978042602539, "global_step": 403166, "epoch": 2399} {"train_loss": -11.968340873718262, "global_step": 403167, "epoch": 2399} {"train_loss": -11.567874908447266, "global_step": 403168, "epoch": 2399} {"train_loss": -12.224227905273438, "global_step": 403169, "epoch": 2399} {"train_loss": -12.502573013305664, "global_step": 403170, "epoch": 2399} {"train_loss": -11.80655288696289, "global_step": 403171, "epoch": 2399} {"train_loss": -11.935115814208984, "global_step": 403172, "epoch": 2399} {"train_loss": -12.289460182189941, "global_step": 403173, "epoch": 2399} {"train_loss": -12.377156257629395, "global_step": 403174, "epoch": 2399} {"train_loss": -12.126508712768555, "global_step": 403175, "epoch": 2399} {"train_loss": -11.889059066772461, "global_step": 403176, "epoch": 2399} {"train_loss": -12.01794719696045, "global_step": 403177, "epoch": 2399} {"train_loss": -11.558143615722656, "global_step": 403178, "epoch": 2399} {"train_loss": -12.044754028320312, "global_step": 403179, "epoch": 2399} {"train_loss": -11.006653785705566, "global_step": 403180, "epoch": 2399} {"train_loss": -12.325777053833008, "global_step": 403181, "epoch": 2399} {"train_loss": -11.251387596130371, "global_step": 403182, "epoch": 2399} {"train_loss": -11.308338165283203, "global_step": 403183, "epoch": 2399} {"train_loss": -11.364479064941406, "global_step": 403184, "epoch": 2399} {"train_loss": -11.281932830810547, "global_step": 403185, "epoch": 2399} {"train_loss": -10.707805633544922, "global_step": 403186, "epoch": 2399} {"train_loss": -11.676995277404785, "global_step": 403187, "epoch": 2399} {"train_loss": -11.628369331359863, "global_step": 403188, "epoch": 2399} {"train_loss": -11.436874389648438, "global_step": 403189, "epoch": 2399} {"train_loss": -12.038248062133789, "global_step": 403190, "epoch": 2399} {"train_loss": -11.344249725341797, "global_step": 403191, "epoch": 2399} {"train_loss": -11.282242774963379, "global_step": 403192, "epoch": 2399} {"train_loss": -11.127544403076172, "global_step": 403193, "epoch": 2399} {"train_loss": -10.841147422790527, "global_step": 403194, "epoch": 2399} {"train_loss": -11.054821014404297, "global_step": 403195, "epoch": 2399} {"train_loss": -10.890104293823242, "global_step": 403196, "epoch": 2399} {"train_loss": -10.906725883483887, "global_step": 403197, "epoch": 2399} {"train_loss": -11.439263343811035, "global_step": 403198, "epoch": 2399} {"train_loss": -12.04949646904355, "global_step": 403199, "epoch": 2399, "val_loss": 303332.59375} {"train_loss": -11.724958419799805, "global_step": 403200, "epoch": 2400} {"train_loss": -10.942893981933594, "global_step": 403201, "epoch": 2400} {"train_loss": -11.096059799194336, "global_step": 403202, "epoch": 2400} {"train_loss": -10.371532440185547, "global_step": 403203, "epoch": 2400} {"train_loss": -11.207383155822754, "global_step": 403204, "epoch": 2400} {"train_loss": -10.716538429260254, "global_step": 403205, "epoch": 2400} {"train_loss": -10.767011642456055, "global_step": 403206, "epoch": 2400} {"train_loss": -10.383020401000977, "global_step": 403207, "epoch": 2400} {"train_loss": -10.399805068969727, "global_step": 403208, "epoch": 2400} {"train_loss": -11.304527282714844, "global_step": 403209, "epoch": 2400} {"train_loss": -11.073725700378418, "global_step": 403210, "epoch": 2400} {"train_loss": -10.880577087402344, "global_step": 403211, "epoch": 2400} {"train_loss": -11.62971305847168, "global_step": 403212, "epoch": 2400} {"train_loss": -10.842693328857422, "global_step": 403213, "epoch": 2400} {"train_loss": -10.609956741333008, "global_step": 403214, "epoch": 2400} {"train_loss": -11.734827995300293, "global_step": 403215, "epoch": 2400} {"train_loss": -11.11166763305664, "global_step": 403216, "epoch": 2400} {"train_loss": -11.226755142211914, "global_step": 403217, "epoch": 2400} {"train_loss": -11.324319839477539, "global_step": 403218, "epoch": 2400} {"train_loss": -10.93661880493164, "global_step": 403219, "epoch": 2400} {"train_loss": -11.319709777832031, "global_step": 403220, "epoch": 2400} {"train_loss": -11.589284896850586, "global_step": 403221, "epoch": 2400} {"train_loss": -11.65158748626709, "global_step": 403222, "epoch": 2400} {"train_loss": -11.641508102416992, "global_step": 403223, "epoch": 2400} {"train_loss": -11.609697341918945, "global_step": 403224, "epoch": 2400} {"train_loss": -12.08761978149414, "global_step": 403225, "epoch": 2400} {"train_loss": -12.018514633178711, "global_step": 403226, "epoch": 2400} {"train_loss": -11.766019821166992, "global_step": 403227, "epoch": 2400} {"train_loss": -12.012060165405273, "global_step": 403228, "epoch": 2400} {"train_loss": -11.899177551269531, "global_step": 403229, "epoch": 2400} {"train_loss": -12.228771209716797, "global_step": 403230, "epoch": 2400} {"train_loss": -12.137848854064941, "global_step": 403231, "epoch": 2400} {"train_loss": -12.348275184631348, "global_step": 403232, "epoch": 2400} {"train_loss": -11.917215347290039, "global_step": 403233, "epoch": 2400} {"train_loss": -12.075175285339355, "global_step": 403234, "epoch": 2400} {"train_loss": -12.363387107849121, "global_step": 403235, "epoch": 2400} {"train_loss": -12.384943008422852, "global_step": 403236, "epoch": 2400} {"train_loss": -12.290715217590332, "global_step": 403237, "epoch": 2400} {"train_loss": -12.190120697021484, "global_step": 403238, "epoch": 2400} {"train_loss": -12.122632026672363, "global_step": 403239, "epoch": 2400} {"train_loss": -12.217784881591797, "global_step": 403240, "epoch": 2400} {"train_loss": -12.021368980407715, "global_step": 403241, "epoch": 2400} {"train_loss": -11.86611557006836, "global_step": 403242, "epoch": 2400} {"train_loss": -12.372873306274414, "global_step": 403243, "epoch": 2400} {"train_loss": -11.851480484008789, "global_step": 403244, "epoch": 2400} {"train_loss": -12.115241050720215, "global_step": 403245, "epoch": 2400} {"train_loss": -12.30473804473877, "global_step": 403246, "epoch": 2400} {"train_loss": -11.969619750976562, "global_step": 403247, "epoch": 2400} {"train_loss": -12.430436134338379, "global_step": 403248, "epoch": 2400} {"train_loss": -12.235486030578613, "global_step": 403249, "epoch": 2400} {"train_loss": -12.639242172241211, "global_step": 403250, "epoch": 2400} {"train_loss": -12.289414405822754, "global_step": 403251, "epoch": 2400} {"train_loss": -12.594346046447754, "global_step": 403252, "epoch": 2400} {"train_loss": -12.095327377319336, "global_step": 403253, "epoch": 2400} {"train_loss": -12.431754112243652, "global_step": 403254, "epoch": 2400} {"train_loss": -12.363458633422852, "global_step": 403255, "epoch": 2400} {"train_loss": -12.42974853515625, "global_step": 403256, "epoch": 2400} {"train_loss": -12.079901695251465, "global_step": 403257, "epoch": 2400} {"train_loss": -12.295509338378906, "global_step": 403258, "epoch": 2400} {"train_loss": -12.211202621459961, "global_step": 403259, "epoch": 2400} {"train_loss": -12.329997062683105, "global_step": 403260, "epoch": 2400} {"train_loss": -12.443565368652344, "global_step": 403261, "epoch": 2400} {"train_loss": -12.420281410217285, "global_step": 403262, "epoch": 2400} {"train_loss": -12.361652374267578, "global_step": 403263, "epoch": 2400} {"train_loss": -12.109416007995605, "global_step": 403264, "epoch": 2400} {"train_loss": -12.394522666931152, "global_step": 403265, "epoch": 2400} {"train_loss": -12.197637557983398, "global_step": 403266, "epoch": 2400} {"train_loss": -12.598370552062988, "global_step": 403267, "epoch": 2400} {"train_loss": -12.031102180480957, "global_step": 403268, "epoch": 2400} {"train_loss": -12.255365371704102, "global_step": 403269, "epoch": 2400} {"train_loss": -12.261966705322266, "global_step": 403270, "epoch": 2400} {"train_loss": -12.42948055267334, "global_step": 403271, "epoch": 2400} {"train_loss": -12.421087265014648, "global_step": 403272, "epoch": 2400} {"train_loss": -12.495590209960938, "global_step": 403273, "epoch": 2400} {"train_loss": -12.551992416381836, "global_step": 403274, "epoch": 2400} {"train_loss": -12.450376510620117, "global_step": 403275, "epoch": 2400} {"train_loss": -12.677350044250488, "global_step": 403276, "epoch": 2400} {"train_loss": -12.631248474121094, "global_step": 403277, "epoch": 2400} {"train_loss": -12.570062637329102, "global_step": 403278, "epoch": 2400} {"train_loss": -12.37574291229248, "global_step": 403279, "epoch": 2400} {"train_loss": -12.673227310180664, "global_step": 403280, "epoch": 2400} {"train_loss": -12.664641380310059, "global_step": 403281, "epoch": 2400} {"train_loss": -12.728155136108398, "global_step": 403282, "epoch": 2400} {"train_loss": -12.605424880981445, "global_step": 403283, "epoch": 2400} {"train_loss": -12.602706909179688, "global_step": 403284, "epoch": 2400} {"train_loss": -12.442534446716309, "global_step": 403285, "epoch": 2400} {"train_loss": -12.613481521606445, "global_step": 403286, "epoch": 2400} {"train_loss": -12.734663009643555, "global_step": 403287, "epoch": 2400} {"train_loss": -12.637560844421387, "global_step": 403288, "epoch": 2400} {"train_loss": -12.743289947509766, "global_step": 403289, "epoch": 2400} {"train_loss": -12.731161117553711, "global_step": 403290, "epoch": 2400} {"train_loss": -12.815670013427734, "global_step": 403291, "epoch": 2400} {"train_loss": -12.76418685913086, "global_step": 403292, "epoch": 2400} {"train_loss": -12.821592330932617, "global_step": 403293, "epoch": 2400} {"train_loss": -12.707784652709961, "global_step": 403294, "epoch": 2400} {"train_loss": -12.676029205322266, "global_step": 403295, "epoch": 2400} {"train_loss": -12.637280464172363, "global_step": 403296, "epoch": 2400} {"train_loss": -12.805413246154785, "global_step": 403297, "epoch": 2400} {"train_loss": -12.155338287353516, "global_step": 403298, "epoch": 2400} {"train_loss": -12.726383209228516, "global_step": 403299, "epoch": 2400} {"train_loss": -12.71238899230957, "global_step": 403300, "epoch": 2400} {"train_loss": -12.414168357849121, "global_step": 403301, "epoch": 2400} {"train_loss": -12.830825805664062, "global_step": 403302, "epoch": 2400} {"train_loss": -12.716035842895508, "global_step": 403303, "epoch": 2400} {"train_loss": -12.270668029785156, "global_step": 403304, "epoch": 2400} {"train_loss": -12.63710880279541, "global_step": 403305, "epoch": 2400} {"train_loss": -12.829364776611328, "global_step": 403306, "epoch": 2400} {"train_loss": -12.529653549194336, "global_step": 403307, "epoch": 2400} {"train_loss": -12.8619966506958, "global_step": 403308, "epoch": 2400} {"train_loss": -12.66598129272461, "global_step": 403309, "epoch": 2400} {"train_loss": -12.396458625793457, "global_step": 403310, "epoch": 2400} {"train_loss": -12.295462608337402, "global_step": 403311, "epoch": 2400} {"train_loss": -12.818464279174805, "global_step": 403312, "epoch": 2400} {"train_loss": -12.482379913330078, "global_step": 403313, "epoch": 2400} {"train_loss": -12.189886093139648, "global_step": 403314, "epoch": 2400} {"train_loss": -12.06454086303711, "global_step": 403315, "epoch": 2400} {"train_loss": -12.103263854980469, "global_step": 403316, "epoch": 2400} {"train_loss": -12.597484588623047, "global_step": 403317, "epoch": 2400} {"train_loss": -11.79407787322998, "global_step": 403318, "epoch": 2400} {"train_loss": -12.516615867614746, "global_step": 403319, "epoch": 2400} {"train_loss": -11.919744491577148, "global_step": 403320, "epoch": 2400} {"train_loss": -11.627262115478516, "global_step": 403321, "epoch": 2400} {"train_loss": -12.308624267578125, "global_step": 403322, "epoch": 2400} {"train_loss": -12.188871383666992, "global_step": 403323, "epoch": 2400} {"train_loss": -12.307092666625977, "global_step": 403324, "epoch": 2400} {"train_loss": -12.396097183227539, "global_step": 403325, "epoch": 2400} {"train_loss": -11.740789413452148, "global_step": 403326, "epoch": 2400} {"train_loss": -11.82568359375, "global_step": 403327, "epoch": 2400} {"train_loss": -12.539337158203125, "global_step": 403328, "epoch": 2400} {"train_loss": -12.220267295837402, "global_step": 403329, "epoch": 2400} {"train_loss": -11.667909622192383, "global_step": 403330, "epoch": 2400} {"train_loss": -12.636360168457031, "global_step": 403331, "epoch": 2400} {"train_loss": -12.065873146057129, "global_step": 403332, "epoch": 2400} {"train_loss": -11.638452529907227, "global_step": 403333, "epoch": 2400} {"train_loss": -12.311037063598633, "global_step": 403334, "epoch": 2400} {"train_loss": -11.875585556030273, "global_step": 403335, "epoch": 2400} {"train_loss": -11.602043151855469, "global_step": 403336, "epoch": 2400} {"train_loss": -11.398123741149902, "global_step": 403337, "epoch": 2400} {"train_loss": -12.630643844604492, "global_step": 403338, "epoch": 2400} {"train_loss": -12.268182754516602, "global_step": 403339, "epoch": 2400} {"train_loss": -12.03295612335205, "global_step": 403340, "epoch": 2400} {"train_loss": -12.4478759765625, "global_step": 403341, "epoch": 2400} {"train_loss": -12.481422424316406, "global_step": 403342, "epoch": 2400} {"train_loss": -12.314502716064453, "global_step": 403343, "epoch": 2400} {"train_loss": -12.358475685119629, "global_step": 403344, "epoch": 2400} {"train_loss": -12.235641479492188, "global_step": 403345, "epoch": 2400} {"train_loss": -11.685769081115723, "global_step": 403346, "epoch": 2400} {"train_loss": -12.366020202636719, "global_step": 403347, "epoch": 2400} {"train_loss": -11.97701644897461, "global_step": 403348, "epoch": 2400} {"train_loss": -12.07893180847168, "global_step": 403349, "epoch": 2400} {"train_loss": -11.503738403320312, "global_step": 403350, "epoch": 2400} {"train_loss": -11.901670455932617, "global_step": 403351, "epoch": 2400} {"train_loss": -11.854938507080078, "global_step": 403352, "epoch": 2400} {"train_loss": -11.712604522705078, "global_step": 403353, "epoch": 2400} {"train_loss": -11.993408203125, "global_step": 403354, "epoch": 2400} {"train_loss": -11.60447883605957, "global_step": 403355, "epoch": 2400} {"train_loss": -12.009047508239746, "global_step": 403356, "epoch": 2400} {"train_loss": -11.995139122009277, "global_step": 403357, "epoch": 2400} {"train_loss": -11.635919570922852, "global_step": 403358, "epoch": 2400} {"train_loss": -11.841629981994629, "global_step": 403359, "epoch": 2400} {"train_loss": -11.864320755004883, "global_step": 403360, "epoch": 2400} {"train_loss": -12.103189468383789, "global_step": 403361, "epoch": 2400} {"train_loss": -11.665800094604492, "global_step": 403362, "epoch": 2400} {"train_loss": -12.436836242675781, "global_step": 403363, "epoch": 2400} {"train_loss": -11.748052597045898, "global_step": 403364, "epoch": 2400} {"train_loss": -12.275986671447754, "global_step": 403365, "epoch": 2400} {"train_loss": -11.861855506896973, "global_step": 403366, "epoch": 2400} {"train_loss": -12.097919560614086, "global_step": 403367, "epoch": 2400, "train/sim_max_reward_0": 0.674566708098209, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.007585626074249171, "train/sim_max_reward_3": 0.4048965186251678, "train/sim_max_reward_4": 0.8831745799095715, "train/sim_max_reward_5": 0.5684579692489425, "test/sim_max_reward_4400000": 0.971529967009936, "test/sim_max_reward_4400001": 0.7529029140728101, "test/sim_max_reward_4400002": 0.07830791392510501, "test/sim_max_reward_4400003": 0.8882405032329562, "test/sim_max_reward_4400004": 0.5999011418801956, "test/sim_max_reward_4400005": 0.03900616693239641, "test/sim_max_reward_4400006": 0.3034593917176817, "test/sim_max_reward_4400007": 0.6689949019254953, "test/sim_max_reward_4400008": 0.5668306432651796, "test/sim_max_reward_4400009": 0.029693625424042854, "test/sim_max_reward_4400010": 0.690156210835135, "test/sim_max_reward_4400011": 0.9640951133196908, "test/sim_max_reward_4400012": 0.14110722128947978, "test/sim_max_reward_4400013": 0.9933163167385652, "test/sim_max_reward_4400014": 0.397179568986547, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9808890809863519, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.25994404375736196, "test/sim_max_reward_4400021": 0.9275697954701642, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.13078886843092458, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6356908972708494, "test/sim_max_reward_4400026": 0.02010448566171279, "test/sim_max_reward_4400027": 0.9704702783506685, "test/sim_max_reward_4400028": 0.9327406403375611, "test/sim_max_reward_4400029": 0.46426577569612126, "test/sim_max_reward_4400030": 0.9780966221224072, "test/sim_max_reward_4400031": 0.5182408144453418, "test/sim_max_reward_4400032": 0.3959487644558136, "test/sim_max_reward_4400033": 0.7112808133226209, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.45816674048700046, "test/sim_max_reward_4400036": 0.3741265124688523, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.9944335882826177, "test/sim_max_reward_4400039": 0.963374907252079, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.1666485177583387, "test/sim_max_reward_4400042": 0.9589468483696809, "test/sim_max_reward_4400043": 0.04457726332474153, "test/sim_max_reward_4400044": 0.9784268951453845, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 0.3147671341171592, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.5897802336593566, "test/mean_score": 0.5072505506978122, "val_loss": 302166.28125, "train_action_mse_error": 0.9282330274581909} {"train_loss": -11.793428421020508, "global_step": 403368, "epoch": 2401} {"train_loss": -11.667987823486328, "global_step": 403369, "epoch": 2401} {"train_loss": -11.927770614624023, "global_step": 403370, "epoch": 2401} {"train_loss": -12.130311965942383, "global_step": 403371, "epoch": 2401} {"train_loss": -11.637089729309082, "global_step": 403372, "epoch": 2401} {"train_loss": -12.266254425048828, "global_step": 403373, "epoch": 2401} {"train_loss": -12.051050186157227, "global_step": 403374, "epoch": 2401} {"train_loss": -11.761240005493164, "global_step": 403375, "epoch": 2401} {"train_loss": -11.98614501953125, "global_step": 403376, "epoch": 2401} {"train_loss": -11.807052612304688, "global_step": 403377, "epoch": 2401} {"train_loss": -11.898247718811035, "global_step": 403378, "epoch": 2401} {"train_loss": -11.734737396240234, "global_step": 403379, "epoch": 2401} {"train_loss": -11.434467315673828, "global_step": 403380, "epoch": 2401} {"train_loss": -11.485559463500977, "global_step": 403381, "epoch": 2401} {"train_loss": -12.488298416137695, "global_step": 403382, "epoch": 2401} {"train_loss": -11.30327320098877, "global_step": 403383, "epoch": 2401} {"train_loss": -11.682940483093262, "global_step": 403384, "epoch": 2401} {"train_loss": -11.406816482543945, "global_step": 403385, "epoch": 2401} {"train_loss": -11.398384094238281, "global_step": 403386, "epoch": 2401} {"train_loss": -11.539435386657715, "global_step": 403387, "epoch": 2401} {"train_loss": -11.402585983276367, "global_step": 403388, "epoch": 2401} {"train_loss": -11.9207763671875, "global_step": 403389, "epoch": 2401} {"train_loss": -12.208009719848633, "global_step": 403390, "epoch": 2401} {"train_loss": -11.58195686340332, "global_step": 403391, "epoch": 2401} {"train_loss": -11.982156753540039, "global_step": 403392, "epoch": 2401} {"train_loss": -11.67162036895752, "global_step": 403393, "epoch": 2401} {"train_loss": -11.627723693847656, "global_step": 403394, "epoch": 2401} {"train_loss": -11.664077758789062, "global_step": 403395, "epoch": 2401} {"train_loss": -12.137226104736328, "global_step": 403396, "epoch": 2401} {"train_loss": -11.763622283935547, "global_step": 403397, "epoch": 2401} {"train_loss": -11.722004890441895, "global_step": 403398, "epoch": 2401} {"train_loss": -11.375130653381348, "global_step": 403399, "epoch": 2401} {"train_loss": -12.044790267944336, "global_step": 403400, "epoch": 2401} {"train_loss": -11.383974075317383, "global_step": 403401, "epoch": 2401} {"train_loss": -11.692020416259766, "global_step": 403402, "epoch": 2401} {"train_loss": -11.638326644897461, "global_step": 403403, "epoch": 2401} {"train_loss": -11.604137420654297, "global_step": 403404, "epoch": 2401} {"train_loss": -12.540399551391602, "global_step": 403405, "epoch": 2401} {"train_loss": -11.138788223266602, "global_step": 403406, "epoch": 2401} {"train_loss": -11.941703796386719, "global_step": 403407, "epoch": 2401} {"train_loss": -11.775989532470703, "global_step": 403408, "epoch": 2401} {"train_loss": -11.979745864868164, "global_step": 403409, "epoch": 2401} {"train_loss": -12.330350875854492, "global_step": 403410, "epoch": 2401} {"train_loss": -12.045768737792969, "global_step": 403411, "epoch": 2401} {"train_loss": -12.404308319091797, "global_step": 403412, "epoch": 2401} {"train_loss": -11.955717086791992, "global_step": 403413, "epoch": 2401} {"train_loss": -12.05009651184082, "global_step": 403414, "epoch": 2401} {"train_loss": -12.341057777404785, "global_step": 403415, "epoch": 2401} {"train_loss": -12.300151824951172, "global_step": 403416, "epoch": 2401} {"train_loss": -12.277795791625977, "global_step": 403417, "epoch": 2401} {"train_loss": -12.198768615722656, "global_step": 403418, "epoch": 2401} {"train_loss": -12.277185440063477, "global_step": 403419, "epoch": 2401} {"train_loss": -12.27734088897705, "global_step": 403420, "epoch": 2401} {"train_loss": -12.171581268310547, "global_step": 403421, "epoch": 2401} {"train_loss": -12.469371795654297, "global_step": 403422, "epoch": 2401} {"train_loss": -11.815271377563477, "global_step": 403423, "epoch": 2401} {"train_loss": -12.53573226928711, "global_step": 403424, "epoch": 2401} {"train_loss": -12.423834800720215, "global_step": 403425, "epoch": 2401} {"train_loss": -12.176651000976562, "global_step": 403426, "epoch": 2401} {"train_loss": -12.390538215637207, "global_step": 403427, "epoch": 2401} {"train_loss": -12.497057914733887, "global_step": 403428, "epoch": 2401} {"train_loss": -12.207188606262207, "global_step": 403429, "epoch": 2401} {"train_loss": -12.474321365356445, "global_step": 403430, "epoch": 2401} {"train_loss": -12.20077896118164, "global_step": 403431, "epoch": 2401} {"train_loss": -12.545366287231445, "global_step": 403432, "epoch": 2401} {"train_loss": -12.468395233154297, "global_step": 403433, "epoch": 2401} {"train_loss": -12.561028480529785, "global_step": 403434, "epoch": 2401} {"train_loss": -12.720019340515137, "global_step": 403435, "epoch": 2401} {"train_loss": -12.246391296386719, "global_step": 403436, "epoch": 2401} {"train_loss": -12.686861038208008, "global_step": 403437, "epoch": 2401} {"train_loss": -12.677639961242676, "global_step": 403438, "epoch": 2401} {"train_loss": -12.564155578613281, "global_step": 403439, "epoch": 2401} {"train_loss": -12.73320198059082, "global_step": 403440, "epoch": 2401} {"train_loss": -12.360475540161133, "global_step": 403441, "epoch": 2401} {"train_loss": -12.237405776977539, "global_step": 403442, "epoch": 2401} {"train_loss": -12.419407844543457, "global_step": 403443, "epoch": 2401} {"train_loss": -12.426958084106445, "global_step": 403444, "epoch": 2401} {"train_loss": -12.429813385009766, "global_step": 403445, "epoch": 2401} {"train_loss": -12.773111343383789, "global_step": 403446, "epoch": 2401} {"train_loss": -12.333934783935547, "global_step": 403447, "epoch": 2401} {"train_loss": -12.369424819946289, "global_step": 403448, "epoch": 2401} {"train_loss": -12.549636840820312, "global_step": 403449, "epoch": 2401} {"train_loss": -12.536518096923828, "global_step": 403450, "epoch": 2401} {"train_loss": -12.472614288330078, "global_step": 403451, "epoch": 2401} {"train_loss": -12.544952392578125, "global_step": 403452, "epoch": 2401} {"train_loss": -12.365240097045898, "global_step": 403453, "epoch": 2401} {"train_loss": -12.213528633117676, "global_step": 403454, "epoch": 2401} {"train_loss": -12.242120742797852, "global_step": 403455, "epoch": 2401} {"train_loss": -12.242894172668457, "global_step": 403456, "epoch": 2401} {"train_loss": -12.067475318908691, "global_step": 403457, "epoch": 2401} {"train_loss": -12.006343841552734, "global_step": 403458, "epoch": 2401} {"train_loss": -10.589313507080078, "global_step": 403459, "epoch": 2401} {"train_loss": -12.531465530395508, "global_step": 403460, "epoch": 2401} {"train_loss": -11.153850555419922, "global_step": 403461, "epoch": 2401} {"train_loss": -12.1317138671875, "global_step": 403462, "epoch": 2401} {"train_loss": -12.17953109741211, "global_step": 403463, "epoch": 2401} {"train_loss": -12.245185852050781, "global_step": 403464, "epoch": 2401} {"train_loss": -12.551692962646484, "global_step": 403465, "epoch": 2401} {"train_loss": -12.324508666992188, "global_step": 403466, "epoch": 2401} {"train_loss": -12.47932243347168, "global_step": 403467, "epoch": 2401} {"train_loss": -12.0458984375, "global_step": 403468, "epoch": 2401} {"train_loss": -12.219144821166992, "global_step": 403469, "epoch": 2401} {"train_loss": -12.672724723815918, "global_step": 403470, "epoch": 2401} {"train_loss": -12.36439323425293, "global_step": 403471, "epoch": 2401} {"train_loss": -12.010690689086914, "global_step": 403472, "epoch": 2401} {"train_loss": -12.367998123168945, "global_step": 403473, "epoch": 2401} {"train_loss": -12.708385467529297, "global_step": 403474, "epoch": 2401} {"train_loss": -12.458549499511719, "global_step": 403475, "epoch": 2401} {"train_loss": -12.17410659790039, "global_step": 403476, "epoch": 2401} {"train_loss": -12.55056095123291, "global_step": 403477, "epoch": 2401} {"train_loss": -12.291630744934082, "global_step": 403478, "epoch": 2401} {"train_loss": -12.344005584716797, "global_step": 403479, "epoch": 2401} {"train_loss": -12.494026184082031, "global_step": 403480, "epoch": 2401} {"train_loss": -12.140215873718262, "global_step": 403481, "epoch": 2401} {"train_loss": -12.431955337524414, "global_step": 403482, "epoch": 2401} {"train_loss": -12.268611907958984, "global_step": 403483, "epoch": 2401} {"train_loss": -12.488577842712402, "global_step": 403484, "epoch": 2401} {"train_loss": -12.556775093078613, "global_step": 403485, "epoch": 2401} {"train_loss": -12.541614532470703, "global_step": 403486, "epoch": 2401} {"train_loss": -12.239843368530273, "global_step": 403487, "epoch": 2401} {"train_loss": -12.24923324584961, "global_step": 403488, "epoch": 2401} {"train_loss": -12.633161544799805, "global_step": 403489, "epoch": 2401} {"train_loss": -12.152517318725586, "global_step": 403490, "epoch": 2401} {"train_loss": -12.310110092163086, "global_step": 403491, "epoch": 2401} {"train_loss": -12.41168212890625, "global_step": 403492, "epoch": 2401} {"train_loss": -12.698394775390625, "global_step": 403493, "epoch": 2401} {"train_loss": -12.11309814453125, "global_step": 403494, "epoch": 2401} {"train_loss": -12.4786376953125, "global_step": 403495, "epoch": 2401} {"train_loss": -11.669862747192383, "global_step": 403496, "epoch": 2401} {"train_loss": -12.37800407409668, "global_step": 403497, "epoch": 2401} {"train_loss": -12.30337142944336, "global_step": 403498, "epoch": 2401} {"train_loss": -12.184442520141602, "global_step": 403499, "epoch": 2401} {"train_loss": -12.22336196899414, "global_step": 403500, "epoch": 2401} {"train_loss": -12.401341438293457, "global_step": 403501, "epoch": 2401} {"train_loss": -12.593341827392578, "global_step": 403502, "epoch": 2401} {"train_loss": -12.722909927368164, "global_step": 403503, "epoch": 2401} {"train_loss": -12.646129608154297, "global_step": 403504, "epoch": 2401} {"train_loss": -12.404698371887207, "global_step": 403505, "epoch": 2401} {"train_loss": -12.719205856323242, "global_step": 403506, "epoch": 2401} {"train_loss": -12.255619049072266, "global_step": 403507, "epoch": 2401} {"train_loss": -12.600475311279297, "global_step": 403508, "epoch": 2401} {"train_loss": -12.536944389343262, "global_step": 403509, "epoch": 2401} {"train_loss": -12.662954330444336, "global_step": 403510, "epoch": 2401} {"train_loss": -12.658720970153809, "global_step": 403511, "epoch": 2401} {"train_loss": -12.660784721374512, "global_step": 403512, "epoch": 2401} {"train_loss": -12.498414993286133, "global_step": 403513, "epoch": 2401} {"train_loss": -12.718415260314941, "global_step": 403514, "epoch": 2401} {"train_loss": -12.413698196411133, "global_step": 403515, "epoch": 2401} {"train_loss": -11.833723068237305, "global_step": 403516, "epoch": 2401} {"train_loss": -12.005504608154297, "global_step": 403517, "epoch": 2401} {"train_loss": -12.602310180664062, "global_step": 403518, "epoch": 2401} {"train_loss": -12.18490219116211, "global_step": 403519, "epoch": 2401} {"train_loss": -11.84128475189209, "global_step": 403520, "epoch": 2401} {"train_loss": -11.619588851928711, "global_step": 403521, "epoch": 2401} {"train_loss": -11.659128189086914, "global_step": 403522, "epoch": 2401} {"train_loss": -12.351574897766113, "global_step": 403523, "epoch": 2401} {"train_loss": -11.231728553771973, "global_step": 403524, "epoch": 2401} {"train_loss": -10.145994186401367, "global_step": 403525, "epoch": 2401} {"train_loss": -10.458381652832031, "global_step": 403526, "epoch": 2401} {"train_loss": -11.57199478149414, "global_step": 403527, "epoch": 2401} {"train_loss": -9.94875431060791, "global_step": 403528, "epoch": 2401} {"train_loss": -11.956665992736816, "global_step": 403529, "epoch": 2401} {"train_loss": -10.49185562133789, "global_step": 403530, "epoch": 2401} {"train_loss": -11.416563987731934, "global_step": 403531, "epoch": 2401} {"train_loss": -10.7234525680542, "global_step": 403532, "epoch": 2401} {"train_loss": -9.993017196655273, "global_step": 403533, "epoch": 2401} {"train_loss": -10.037132263183594, "global_step": 403534, "epoch": 2401} {"train_loss": -12.076171602521624, "global_step": 403535, "epoch": 2401, "val_loss": 303578.625} {"train_loss": -8.286312103271484, "global_step": 403536, "epoch": 2402} {"train_loss": -9.548337936401367, "global_step": 403537, "epoch": 2402} {"train_loss": -10.339411735534668, "global_step": 403538, "epoch": 2402} {"train_loss": -9.612388610839844, "global_step": 403539, "epoch": 2402} {"train_loss": -9.021995544433594, "global_step": 403540, "epoch": 2402} {"train_loss": -10.983211517333984, "global_step": 403541, "epoch": 2402} {"train_loss": -9.086503982543945, "global_step": 403542, "epoch": 2402} {"train_loss": -11.070392608642578, "global_step": 403543, "epoch": 2402} {"train_loss": -9.640176773071289, "global_step": 403544, "epoch": 2402} {"train_loss": -11.525879859924316, "global_step": 403545, "epoch": 2402} {"train_loss": -9.576327323913574, "global_step": 403546, "epoch": 2402} {"train_loss": -11.510736465454102, "global_step": 403547, "epoch": 2402} {"train_loss": -11.195094108581543, "global_step": 403548, "epoch": 2402} {"train_loss": -11.179815292358398, "global_step": 403549, "epoch": 2402} {"train_loss": -11.437234878540039, "global_step": 403550, "epoch": 2402} {"train_loss": -11.110475540161133, "global_step": 403551, "epoch": 2402} {"train_loss": -11.7909574508667, "global_step": 403552, "epoch": 2402} {"train_loss": -11.730223655700684, "global_step": 403553, "epoch": 2402} {"train_loss": -12.060348510742188, "global_step": 403554, "epoch": 2402} {"train_loss": -11.79601764678955, "global_step": 403555, "epoch": 2402} {"train_loss": -11.58110237121582, "global_step": 403556, "epoch": 2402} {"train_loss": -11.927165985107422, "global_step": 403557, "epoch": 2402} {"train_loss": -11.894830703735352, "global_step": 403558, "epoch": 2402} {"train_loss": -12.050293922424316, "global_step": 403559, "epoch": 2402} {"train_loss": -12.133832931518555, "global_step": 403560, "epoch": 2402} {"train_loss": -12.239501953125, "global_step": 403561, "epoch": 2402} {"train_loss": -11.908029556274414, "global_step": 403562, "epoch": 2402} {"train_loss": -12.166864395141602, "global_step": 403563, "epoch": 2402} {"train_loss": -12.142688751220703, "global_step": 403564, "epoch": 2402} {"train_loss": -12.28753662109375, "global_step": 403565, "epoch": 2402} {"train_loss": -12.369389533996582, "global_step": 403566, "epoch": 2402} {"train_loss": -12.29379653930664, "global_step": 403567, "epoch": 2402} {"train_loss": -12.672178268432617, "global_step": 403568, "epoch": 2402} {"train_loss": -12.485387802124023, "global_step": 403569, "epoch": 2402} {"train_loss": -12.443344116210938, "global_step": 403570, "epoch": 2402} {"train_loss": -12.284100532531738, "global_step": 403571, "epoch": 2402} {"train_loss": -12.366867065429688, "global_step": 403572, "epoch": 2402} {"train_loss": -12.318052291870117, "global_step": 403573, "epoch": 2402} {"train_loss": -12.262843132019043, "global_step": 403574, "epoch": 2402} {"train_loss": -12.387524604797363, "global_step": 403575, "epoch": 2402} {"train_loss": -12.531501770019531, "global_step": 403576, "epoch": 2402} {"train_loss": -12.418452262878418, "global_step": 403577, "epoch": 2402} {"train_loss": -12.165760040283203, "global_step": 403578, "epoch": 2402} {"train_loss": -12.744738578796387, "global_step": 403579, "epoch": 2402} {"train_loss": -12.460431098937988, "global_step": 403580, "epoch": 2402} {"train_loss": -12.529485702514648, "global_step": 403581, "epoch": 2402} {"train_loss": -12.477666854858398, "global_step": 403582, "epoch": 2402} {"train_loss": -12.633026123046875, "global_step": 403583, "epoch": 2402} {"train_loss": -12.649026870727539, "global_step": 403584, "epoch": 2402} {"train_loss": -12.413673400878906, "global_step": 403585, "epoch": 2402} {"train_loss": -12.436911582946777, "global_step": 403586, "epoch": 2402} {"train_loss": -12.459053993225098, "global_step": 403587, "epoch": 2402} {"train_loss": -12.817573547363281, "global_step": 403588, "epoch": 2402} {"train_loss": -12.477020263671875, "global_step": 403589, "epoch": 2402} {"train_loss": -12.305503845214844, "global_step": 403590, "epoch": 2402} {"train_loss": -12.459136009216309, "global_step": 403591, "epoch": 2402} {"train_loss": -11.950309753417969, "global_step": 403592, "epoch": 2402} {"train_loss": -12.561058044433594, "global_step": 403593, "epoch": 2402} {"train_loss": -11.853422164916992, "global_step": 403594, "epoch": 2402} {"train_loss": -12.109476089477539, "global_step": 403595, "epoch": 2402} {"train_loss": -12.37045669555664, "global_step": 403596, "epoch": 2402} {"train_loss": -11.513642311096191, "global_step": 403597, "epoch": 2402} {"train_loss": -12.686600685119629, "global_step": 403598, "epoch": 2402} {"train_loss": -10.902305603027344, "global_step": 403599, "epoch": 2402} {"train_loss": -12.038434028625488, "global_step": 403600, "epoch": 2402} {"train_loss": -12.162168502807617, "global_step": 403601, "epoch": 2402} {"train_loss": -11.315183639526367, "global_step": 403602, "epoch": 2402} {"train_loss": -12.389158248901367, "global_step": 403603, "epoch": 2402} {"train_loss": -12.078627586364746, "global_step": 403604, "epoch": 2402} {"train_loss": -11.862812995910645, "global_step": 403605, "epoch": 2402} {"train_loss": -12.747515678405762, "global_step": 403606, "epoch": 2402} {"train_loss": -12.035326957702637, "global_step": 403607, "epoch": 2402} {"train_loss": -12.470224380493164, "global_step": 403608, "epoch": 2402} {"train_loss": -12.486783981323242, "global_step": 403609, "epoch": 2402} {"train_loss": -12.55343246459961, "global_step": 403610, "epoch": 2402} {"train_loss": -12.49738597869873, "global_step": 403611, "epoch": 2402} {"train_loss": -12.513915061950684, "global_step": 403612, "epoch": 2402} {"train_loss": -12.685373306274414, "global_step": 403613, "epoch": 2402} {"train_loss": -12.216669082641602, "global_step": 403614, "epoch": 2402} {"train_loss": -12.667325973510742, "global_step": 403615, "epoch": 2402} {"train_loss": -12.492631912231445, "global_step": 403616, "epoch": 2402} {"train_loss": -12.369909286499023, "global_step": 403617, "epoch": 2402} {"train_loss": -12.385658264160156, "global_step": 403618, "epoch": 2402} {"train_loss": -12.486343383789062, "global_step": 403619, "epoch": 2402} {"train_loss": -12.28561019897461, "global_step": 403620, "epoch": 2402} {"train_loss": -12.356914520263672, "global_step": 403621, "epoch": 2402} {"train_loss": -12.610442161560059, "global_step": 403622, "epoch": 2402} {"train_loss": -12.397485733032227, "global_step": 403623, "epoch": 2402} {"train_loss": -12.611199378967285, "global_step": 403624, "epoch": 2402} {"train_loss": -12.270750045776367, "global_step": 403625, "epoch": 2402} {"train_loss": -12.482549667358398, "global_step": 403626, "epoch": 2402} {"train_loss": -12.38497543334961, "global_step": 403627, "epoch": 2402} {"train_loss": -12.438850402832031, "global_step": 403628, "epoch": 2402} {"train_loss": -12.077354431152344, "global_step": 403629, "epoch": 2402} {"train_loss": -12.481340408325195, "global_step": 403630, "epoch": 2402} {"train_loss": -11.920685768127441, "global_step": 403631, "epoch": 2402} {"train_loss": -12.135527610778809, "global_step": 403632, "epoch": 2402} {"train_loss": -12.348993301391602, "global_step": 403633, "epoch": 2402} {"train_loss": -11.904302597045898, "global_step": 403634, "epoch": 2402} {"train_loss": -11.809906959533691, "global_step": 403635, "epoch": 2402} {"train_loss": -12.32720947265625, "global_step": 403636, "epoch": 2402} {"train_loss": -11.413351058959961, "global_step": 403637, "epoch": 2402} {"train_loss": -11.115029335021973, "global_step": 403638, "epoch": 2402} {"train_loss": -12.358559608459473, "global_step": 403639, "epoch": 2402} {"train_loss": -12.272236824035645, "global_step": 403640, "epoch": 2402} {"train_loss": -11.946357727050781, "global_step": 403641, "epoch": 2402} {"train_loss": -12.140624046325684, "global_step": 403642, "epoch": 2402} {"train_loss": -12.81800365447998, "global_step": 403643, "epoch": 2402} {"train_loss": -11.903047561645508, "global_step": 403644, "epoch": 2402} {"train_loss": -12.218769073486328, "global_step": 403645, "epoch": 2402} {"train_loss": -12.231861114501953, "global_step": 403646, "epoch": 2402} {"train_loss": -12.07053279876709, "global_step": 403647, "epoch": 2402} {"train_loss": -12.30781364440918, "global_step": 403648, "epoch": 2402} {"train_loss": -12.652569770812988, "global_step": 403649, "epoch": 2402} {"train_loss": -12.107213973999023, "global_step": 403650, "epoch": 2402} {"train_loss": -12.547712326049805, "global_step": 403651, "epoch": 2402} {"train_loss": -12.112537384033203, "global_step": 403652, "epoch": 2402} {"train_loss": -12.04397201538086, "global_step": 403653, "epoch": 2402} {"train_loss": -12.17831039428711, "global_step": 403654, "epoch": 2402} {"train_loss": -12.282042503356934, "global_step": 403655, "epoch": 2402} {"train_loss": -11.983579635620117, "global_step": 403656, "epoch": 2402} {"train_loss": -12.307838439941406, "global_step": 403657, "epoch": 2402} {"train_loss": -12.411762237548828, "global_step": 403658, "epoch": 2402} {"train_loss": -11.95483684539795, "global_step": 403659, "epoch": 2402} {"train_loss": -12.271836280822754, "global_step": 403660, "epoch": 2402} {"train_loss": -12.512574195861816, "global_step": 403661, "epoch": 2402} {"train_loss": -12.307771682739258, "global_step": 403662, "epoch": 2402} {"train_loss": -12.738840103149414, "global_step": 403663, "epoch": 2402} {"train_loss": -12.393733978271484, "global_step": 403664, "epoch": 2402} {"train_loss": -12.655679702758789, "global_step": 403665, "epoch": 2402} {"train_loss": -12.589071273803711, "global_step": 403666, "epoch": 2402} {"train_loss": -12.486466407775879, "global_step": 403667, "epoch": 2402} {"train_loss": -12.53054428100586, "global_step": 403668, "epoch": 2402} {"train_loss": -12.656798362731934, "global_step": 403669, "epoch": 2402} {"train_loss": -12.664937019348145, "global_step": 403670, "epoch": 2402} {"train_loss": -12.546822547912598, "global_step": 403671, "epoch": 2402} {"train_loss": -12.393135070800781, "global_step": 403672, "epoch": 2402} {"train_loss": -12.485189437866211, "global_step": 403673, "epoch": 2402} {"train_loss": -12.68077564239502, "global_step": 403674, "epoch": 2402} {"train_loss": -12.691583633422852, "global_step": 403675, "epoch": 2402} {"train_loss": -12.495023727416992, "global_step": 403676, "epoch": 2402} {"train_loss": -12.80738353729248, "global_step": 403677, "epoch": 2402} {"train_loss": -12.677265167236328, "global_step": 403678, "epoch": 2402} {"train_loss": -12.776719093322754, "global_step": 403679, "epoch": 2402} {"train_loss": -12.544769287109375, "global_step": 403680, "epoch": 2402} {"train_loss": -12.575732231140137, "global_step": 403681, "epoch": 2402} {"train_loss": -12.55007266998291, "global_step": 403682, "epoch": 2402} {"train_loss": -12.784130096435547, "global_step": 403683, "epoch": 2402} {"train_loss": -12.5516939163208, "global_step": 403684, "epoch": 2402} {"train_loss": -12.645336151123047, "global_step": 403685, "epoch": 2402} {"train_loss": -12.569835662841797, "global_step": 403686, "epoch": 2402} {"train_loss": -12.464754104614258, "global_step": 403687, "epoch": 2402} {"train_loss": -12.372528076171875, "global_step": 403688, "epoch": 2402} {"train_loss": -12.801139831542969, "global_step": 403689, "epoch": 2402} {"train_loss": -12.424121856689453, "global_step": 403690, "epoch": 2402} {"train_loss": -12.742951393127441, "global_step": 403691, "epoch": 2402} {"train_loss": -12.672715187072754, "global_step": 403692, "epoch": 2402} {"train_loss": -12.424030303955078, "global_step": 403693, "epoch": 2402} {"train_loss": -12.617613792419434, "global_step": 403694, "epoch": 2402} {"train_loss": -12.854904174804688, "global_step": 403695, "epoch": 2402} {"train_loss": -12.483985900878906, "global_step": 403696, "epoch": 2402} {"train_loss": -12.636696815490723, "global_step": 403697, "epoch": 2402} {"train_loss": -12.471236228942871, "global_step": 403698, "epoch": 2402} {"train_loss": -12.54580307006836, "global_step": 403699, "epoch": 2402} {"train_loss": -12.680543899536133, "global_step": 403700, "epoch": 2402} {"train_loss": -12.588674545288086, "global_step": 403701, "epoch": 2402} {"train_loss": -12.436151504516602, "global_step": 403702, "epoch": 2402} {"train_loss": -12.146261340095883, "global_step": 403703, "epoch": 2402, "val_loss": 303099.25} {"train_loss": -12.699836730957031, "global_step": 403704, "epoch": 2403} {"train_loss": -12.716033935546875, "global_step": 403705, "epoch": 2403} {"train_loss": -12.525010108947754, "global_step": 403706, "epoch": 2403} {"train_loss": -11.805468559265137, "global_step": 403707, "epoch": 2403} {"train_loss": -11.533822059631348, "global_step": 403708, "epoch": 2403} {"train_loss": -12.39804744720459, "global_step": 403709, "epoch": 2403} {"train_loss": -12.40219497680664, "global_step": 403710, "epoch": 2403} {"train_loss": -10.004951477050781, "global_step": 403711, "epoch": 2403} {"train_loss": -11.12026309967041, "global_step": 403712, "epoch": 2403} {"train_loss": -9.549139022827148, "global_step": 403713, "epoch": 2403} {"train_loss": -8.01176643371582, "global_step": 403714, "epoch": 2403} {"train_loss": -7.650012493133545, "global_step": 403715, "epoch": 2403} {"train_loss": -8.414928436279297, "global_step": 403716, "epoch": 2403} {"train_loss": -7.577942848205566, "global_step": 403717, "epoch": 2403} {"train_loss": -8.396394729614258, "global_step": 403718, "epoch": 2403} {"train_loss": -8.848834991455078, "global_step": 403719, "epoch": 2403} {"train_loss": -9.17140007019043, "global_step": 403720, "epoch": 2403} {"train_loss": -9.07285213470459, "global_step": 403721, "epoch": 2403} {"train_loss": -8.322662353515625, "global_step": 403722, "epoch": 2403} {"train_loss": -8.286028861999512, "global_step": 403723, "epoch": 2403} {"train_loss": -9.071686744689941, "global_step": 403724, "epoch": 2403} {"train_loss": -8.827884674072266, "global_step": 403725, "epoch": 2403} {"train_loss": -9.147761344909668, "global_step": 403726, "epoch": 2403} {"train_loss": -9.069504737854004, "global_step": 403727, "epoch": 2403} {"train_loss": -9.353168487548828, "global_step": 403728, "epoch": 2403} {"train_loss": -9.431594848632812, "global_step": 403729, "epoch": 2403} {"train_loss": -9.796465873718262, "global_step": 403730, "epoch": 2403} {"train_loss": -9.6331787109375, "global_step": 403731, "epoch": 2403} {"train_loss": -10.351069450378418, "global_step": 403732, "epoch": 2403} {"train_loss": -10.738000869750977, "global_step": 403733, "epoch": 2403} {"train_loss": -11.267711639404297, "global_step": 403734, "epoch": 2403} {"train_loss": -11.141770362854004, "global_step": 403735, "epoch": 2403} {"train_loss": -11.308783531188965, "global_step": 403736, "epoch": 2403} {"train_loss": -11.640804290771484, "global_step": 403737, "epoch": 2403} {"train_loss": -11.129182815551758, "global_step": 403738, "epoch": 2403} {"train_loss": -11.316328048706055, "global_step": 403739, "epoch": 2403} {"train_loss": -11.718338012695312, "global_step": 403740, "epoch": 2403} {"train_loss": -11.720706939697266, "global_step": 403741, "epoch": 2403} {"train_loss": -11.417217254638672, "global_step": 403742, "epoch": 2403} {"train_loss": -11.714395523071289, "global_step": 403743, "epoch": 2403} {"train_loss": -11.57423210144043, "global_step": 403744, "epoch": 2403} {"train_loss": -11.736024856567383, "global_step": 403745, "epoch": 2403} {"train_loss": -11.112699508666992, "global_step": 403746, "epoch": 2403} {"train_loss": -11.515230178833008, "global_step": 403747, "epoch": 2403} {"train_loss": -11.80101203918457, "global_step": 403748, "epoch": 2403} {"train_loss": -11.648038864135742, "global_step": 403749, "epoch": 2403} {"train_loss": -11.398504257202148, "global_step": 403750, "epoch": 2403} {"train_loss": -11.887117385864258, "global_step": 403751, "epoch": 2403} {"train_loss": -11.285440444946289, "global_step": 403752, "epoch": 2403} {"train_loss": -11.641958236694336, "global_step": 403753, "epoch": 2403} {"train_loss": -10.848816871643066, "global_step": 403754, "epoch": 2403} {"train_loss": -11.416475296020508, "global_step": 403755, "epoch": 2403} {"train_loss": -11.238101959228516, "global_step": 403756, "epoch": 2403} {"train_loss": -10.449337005615234, "global_step": 403757, "epoch": 2403} {"train_loss": -11.356321334838867, "global_step": 403758, "epoch": 2403} {"train_loss": -10.773674011230469, "global_step": 403759, "epoch": 2403} {"train_loss": -9.85554313659668, "global_step": 403760, "epoch": 2403} {"train_loss": -9.909144401550293, "global_step": 403761, "epoch": 2403} {"train_loss": -10.0225830078125, "global_step": 403762, "epoch": 2403} {"train_loss": -10.72221565246582, "global_step": 403763, "epoch": 2403} {"train_loss": -10.406538009643555, "global_step": 403764, "epoch": 2403} {"train_loss": -10.588541030883789, "global_step": 403765, "epoch": 2403} {"train_loss": -11.277120590209961, "global_step": 403766, "epoch": 2403} {"train_loss": -11.662858963012695, "global_step": 403767, "epoch": 2403} {"train_loss": -11.299564361572266, "global_step": 403768, "epoch": 2403} {"train_loss": -11.02433967590332, "global_step": 403769, "epoch": 2403} {"train_loss": -11.811287879943848, "global_step": 403770, "epoch": 2403} {"train_loss": -11.072004318237305, "global_step": 403771, "epoch": 2403} {"train_loss": -11.122029304504395, "global_step": 403772, "epoch": 2403} {"train_loss": -10.807650566101074, "global_step": 403773, "epoch": 2403} {"train_loss": -11.36016845703125, "global_step": 403774, "epoch": 2403} {"train_loss": -11.478878021240234, "global_step": 403775, "epoch": 2403} {"train_loss": -11.287227630615234, "global_step": 403776, "epoch": 2403} {"train_loss": -11.453996658325195, "global_step": 403777, "epoch": 2403} {"train_loss": -11.736186981201172, "global_step": 403778, "epoch": 2403} {"train_loss": -11.343437194824219, "global_step": 403779, "epoch": 2403} {"train_loss": -12.21011734008789, "global_step": 403780, "epoch": 2403} {"train_loss": -11.3121337890625, "global_step": 403781, "epoch": 2403} {"train_loss": -12.01188850402832, "global_step": 403782, "epoch": 2403} {"train_loss": -11.438167572021484, "global_step": 403783, "epoch": 2403} {"train_loss": -11.282001495361328, "global_step": 403784, "epoch": 2403} {"train_loss": -11.739152908325195, "global_step": 403785, "epoch": 2403} {"train_loss": -11.729063034057617, "global_step": 403786, "epoch": 2403} {"train_loss": -11.485557556152344, "global_step": 403787, "epoch": 2403} {"train_loss": -12.126551628112793, "global_step": 403788, "epoch": 2403} {"train_loss": -11.67049789428711, "global_step": 403789, "epoch": 2403} {"train_loss": -11.349058151245117, "global_step": 403790, "epoch": 2403} {"train_loss": -11.675796508789062, "global_step": 403791, "epoch": 2403} {"train_loss": -11.753185272216797, "global_step": 403792, "epoch": 2403} {"train_loss": -11.808405876159668, "global_step": 403793, "epoch": 2403} {"train_loss": -11.680963516235352, "global_step": 403794, "epoch": 2403} {"train_loss": -11.37948226928711, "global_step": 403795, "epoch": 2403} {"train_loss": -12.11594009399414, "global_step": 403796, "epoch": 2403} {"train_loss": -11.649955749511719, "global_step": 403797, "epoch": 2403} {"train_loss": -12.03414535522461, "global_step": 403798, "epoch": 2403} {"train_loss": -11.88007640838623, "global_step": 403799, "epoch": 2403} {"train_loss": -12.135466575622559, "global_step": 403800, "epoch": 2403} {"train_loss": -12.320047378540039, "global_step": 403801, "epoch": 2403} {"train_loss": -12.035465240478516, "global_step": 403802, "epoch": 2403} {"train_loss": -12.059022903442383, "global_step": 403803, "epoch": 2403} {"train_loss": -12.374367713928223, "global_step": 403804, "epoch": 2403} {"train_loss": -12.354791641235352, "global_step": 403805, "epoch": 2403} {"train_loss": -12.120628356933594, "global_step": 403806, "epoch": 2403} {"train_loss": -12.33974838256836, "global_step": 403807, "epoch": 2403} {"train_loss": -12.083858489990234, "global_step": 403808, "epoch": 2403} {"train_loss": -12.221176147460938, "global_step": 403809, "epoch": 2403} {"train_loss": -12.27774429321289, "global_step": 403810, "epoch": 2403} {"train_loss": -12.275771141052246, "global_step": 403811, "epoch": 2403} {"train_loss": -12.325126647949219, "global_step": 403812, "epoch": 2403} {"train_loss": -12.132100105285645, "global_step": 403813, "epoch": 2403} {"train_loss": -12.172599792480469, "global_step": 403814, "epoch": 2403} {"train_loss": -12.3563814163208, "global_step": 403815, "epoch": 2403} {"train_loss": -12.306326866149902, "global_step": 403816, "epoch": 2403} {"train_loss": -12.405864715576172, "global_step": 403817, "epoch": 2403} {"train_loss": -12.28070068359375, "global_step": 403818, "epoch": 2403} {"train_loss": -12.349128723144531, "global_step": 403819, "epoch": 2403} {"train_loss": -12.448648452758789, "global_step": 403820, "epoch": 2403} {"train_loss": -12.39767837524414, "global_step": 403821, "epoch": 2403} {"train_loss": -12.584580421447754, "global_step": 403822, "epoch": 2403} {"train_loss": -12.309274673461914, "global_step": 403823, "epoch": 2403} {"train_loss": -12.700913429260254, "global_step": 403824, "epoch": 2403} {"train_loss": -12.533864974975586, "global_step": 403825, "epoch": 2403} {"train_loss": -12.485188484191895, "global_step": 403826, "epoch": 2403} {"train_loss": -12.5402250289917, "global_step": 403827, "epoch": 2403} {"train_loss": -12.54514217376709, "global_step": 403828, "epoch": 2403} {"train_loss": -12.418209075927734, "global_step": 403829, "epoch": 2403} {"train_loss": -12.57607650756836, "global_step": 403830, "epoch": 2403} {"train_loss": -12.676769256591797, "global_step": 403831, "epoch": 2403} {"train_loss": -12.632503509521484, "global_step": 403832, "epoch": 2403} {"train_loss": -12.702505111694336, "global_step": 403833, "epoch": 2403} {"train_loss": -12.630154609680176, "global_step": 403834, "epoch": 2403} {"train_loss": -12.63595962524414, "global_step": 403835, "epoch": 2403} {"train_loss": -12.658894538879395, "global_step": 403836, "epoch": 2403} {"train_loss": -12.49831771850586, "global_step": 403837, "epoch": 2403} {"train_loss": -12.66088581085205, "global_step": 403838, "epoch": 2403} {"train_loss": -12.443593978881836, "global_step": 403839, "epoch": 2403} {"train_loss": -12.43191909790039, "global_step": 403840, "epoch": 2403} {"train_loss": -12.477753639221191, "global_step": 403841, "epoch": 2403} {"train_loss": -12.675420761108398, "global_step": 403842, "epoch": 2403} {"train_loss": -12.747671127319336, "global_step": 403843, "epoch": 2403} {"train_loss": -12.381624221801758, "global_step": 403844, "epoch": 2403} {"train_loss": -12.449957847595215, "global_step": 403845, "epoch": 2403} {"train_loss": -12.366569519042969, "global_step": 403846, "epoch": 2403} {"train_loss": -12.480480194091797, "global_step": 403847, "epoch": 2403} {"train_loss": -12.349623680114746, "global_step": 403848, "epoch": 2403} {"train_loss": -12.610668182373047, "global_step": 403849, "epoch": 2403} {"train_loss": -12.454351425170898, "global_step": 403850, "epoch": 2403} {"train_loss": -12.711421966552734, "global_step": 403851, "epoch": 2403} {"train_loss": -12.662252426147461, "global_step": 403852, "epoch": 2403} {"train_loss": -12.462990760803223, "global_step": 403853, "epoch": 2403} {"train_loss": -12.653079986572266, "global_step": 403854, "epoch": 2403} {"train_loss": -12.311525344848633, "global_step": 403855, "epoch": 2403} {"train_loss": -11.942282676696777, "global_step": 403856, "epoch": 2403} {"train_loss": -12.6442232131958, "global_step": 403857, "epoch": 2403} {"train_loss": -12.889047622680664, "global_step": 403858, "epoch": 2403} {"train_loss": -12.066253662109375, "global_step": 403859, "epoch": 2403} {"train_loss": -11.913497924804688, "global_step": 403860, "epoch": 2403} {"train_loss": -12.427875518798828, "global_step": 403861, "epoch": 2403} {"train_loss": -12.496702194213867, "global_step": 403862, "epoch": 2403} {"train_loss": -12.360658645629883, "global_step": 403863, "epoch": 2403} {"train_loss": -12.460718154907227, "global_step": 403864, "epoch": 2403} {"train_loss": -12.446456909179688, "global_step": 403865, "epoch": 2403} {"train_loss": -12.619621276855469, "global_step": 403866, "epoch": 2403} {"train_loss": -12.736286163330078, "global_step": 403867, "epoch": 2403} {"train_loss": -12.718564987182617, "global_step": 403868, "epoch": 2403} {"train_loss": -12.437337875366211, "global_step": 403869, "epoch": 2403} {"train_loss": -12.240862846374512, "global_step": 403870, "epoch": 2403} {"train_loss": -11.56022034656434, "global_step": 403871, "epoch": 2403, "val_loss": 301895.5625} {"train_loss": -12.707246780395508, "global_step": 403872, "epoch": 2404} {"train_loss": -12.445751190185547, "global_step": 403873, "epoch": 2404} {"train_loss": -12.465126991271973, "global_step": 403874, "epoch": 2404} {"train_loss": -12.970351219177246, "global_step": 403875, "epoch": 2404} {"train_loss": -12.551409721374512, "global_step": 403876, "epoch": 2404} {"train_loss": -12.447240829467773, "global_step": 403877, "epoch": 2404} {"train_loss": -12.320219993591309, "global_step": 403878, "epoch": 2404} {"train_loss": -12.01659870147705, "global_step": 403879, "epoch": 2404} {"train_loss": -12.591383934020996, "global_step": 403880, "epoch": 2404} {"train_loss": -12.46834659576416, "global_step": 403881, "epoch": 2404} {"train_loss": -12.55413818359375, "global_step": 403882, "epoch": 2404} {"train_loss": -12.547374725341797, "global_step": 403883, "epoch": 2404} {"train_loss": -12.534109115600586, "global_step": 403884, "epoch": 2404} {"train_loss": -12.581238746643066, "global_step": 403885, "epoch": 2404} {"train_loss": -11.79757308959961, "global_step": 403886, "epoch": 2404} {"train_loss": -12.24250602722168, "global_step": 403887, "epoch": 2404} {"train_loss": -12.06108283996582, "global_step": 403888, "epoch": 2404} {"train_loss": -12.628241539001465, "global_step": 403889, "epoch": 2404} {"train_loss": -12.051912307739258, "global_step": 403890, "epoch": 2404} {"train_loss": -11.449172973632812, "global_step": 403891, "epoch": 2404} {"train_loss": -12.232332229614258, "global_step": 403892, "epoch": 2404} {"train_loss": -11.887283325195312, "global_step": 403893, "epoch": 2404} {"train_loss": -10.669914245605469, "global_step": 403894, "epoch": 2404} {"train_loss": -12.27239990234375, "global_step": 403895, "epoch": 2404} {"train_loss": -9.515558242797852, "global_step": 403896, "epoch": 2404} {"train_loss": -10.832680702209473, "global_step": 403897, "epoch": 2404} {"train_loss": -10.584992408752441, "global_step": 403898, "epoch": 2404} {"train_loss": -9.879942893981934, "global_step": 403899, "epoch": 2404} {"train_loss": -9.1927490234375, "global_step": 403900, "epoch": 2404} {"train_loss": -9.58521556854248, "global_step": 403901, "epoch": 2404} {"train_loss": -9.76779556274414, "global_step": 403902, "epoch": 2404} {"train_loss": -10.461601257324219, "global_step": 403903, "epoch": 2404} {"train_loss": -10.528791427612305, "global_step": 403904, "epoch": 2404} {"train_loss": -11.740633010864258, "global_step": 403905, "epoch": 2404} {"train_loss": -9.967246055603027, "global_step": 403906, "epoch": 2404} {"train_loss": -12.144355773925781, "global_step": 403907, "epoch": 2404} {"train_loss": -10.755289077758789, "global_step": 403908, "epoch": 2404} {"train_loss": -11.519817352294922, "global_step": 403909, "epoch": 2404} {"train_loss": -11.027938842773438, "global_step": 403910, "epoch": 2404} {"train_loss": -11.558880805969238, "global_step": 403911, "epoch": 2404} {"train_loss": -11.981410026550293, "global_step": 403912, "epoch": 2404} {"train_loss": -10.609823226928711, "global_step": 403913, "epoch": 2404} {"train_loss": -12.095325469970703, "global_step": 403914, "epoch": 2404} {"train_loss": -10.048727989196777, "global_step": 403915, "epoch": 2404} {"train_loss": -11.071650505065918, "global_step": 403916, "epoch": 2404} {"train_loss": -9.655540466308594, "global_step": 403917, "epoch": 2404} {"train_loss": -12.112617492675781, "global_step": 403918, "epoch": 2404} {"train_loss": -10.985105514526367, "global_step": 403919, "epoch": 2404} {"train_loss": -11.724035263061523, "global_step": 403920, "epoch": 2404} {"train_loss": -11.573638916015625, "global_step": 403921, "epoch": 2404} {"train_loss": -11.394895553588867, "global_step": 403922, "epoch": 2404} {"train_loss": -11.878297805786133, "global_step": 403923, "epoch": 2404} {"train_loss": -11.736244201660156, "global_step": 403924, "epoch": 2404} {"train_loss": -11.891898155212402, "global_step": 403925, "epoch": 2404} {"train_loss": -12.017072677612305, "global_step": 403926, "epoch": 2404} {"train_loss": -12.135468482971191, "global_step": 403927, "epoch": 2404} {"train_loss": -12.08212661743164, "global_step": 403928, "epoch": 2404} {"train_loss": -11.985942840576172, "global_step": 403929, "epoch": 2404} {"train_loss": -11.812162399291992, "global_step": 403930, "epoch": 2404} {"train_loss": -12.232285499572754, "global_step": 403931, "epoch": 2404} {"train_loss": -12.25811767578125, "global_step": 403932, "epoch": 2404} {"train_loss": -12.225744247436523, "global_step": 403933, "epoch": 2404} {"train_loss": -12.195840835571289, "global_step": 403934, "epoch": 2404} {"train_loss": -12.338769912719727, "global_step": 403935, "epoch": 2404} {"train_loss": -12.221363067626953, "global_step": 403936, "epoch": 2404} {"train_loss": -12.373289108276367, "global_step": 403937, "epoch": 2404} {"train_loss": -12.314745903015137, "global_step": 403938, "epoch": 2404} {"train_loss": -12.519147872924805, "global_step": 403939, "epoch": 2404} {"train_loss": -12.392362594604492, "global_step": 403940, "epoch": 2404} {"train_loss": -12.446791648864746, "global_step": 403941, "epoch": 2404} {"train_loss": -12.415236473083496, "global_step": 403942, "epoch": 2404} {"train_loss": -12.676288604736328, "global_step": 403943, "epoch": 2404} {"train_loss": -12.402002334594727, "global_step": 403944, "epoch": 2404} {"train_loss": -12.591695785522461, "global_step": 403945, "epoch": 2404} {"train_loss": -12.359039306640625, "global_step": 403946, "epoch": 2404} {"train_loss": -12.320777893066406, "global_step": 403947, "epoch": 2404} {"train_loss": -12.6487455368042, "global_step": 403948, "epoch": 2404} {"train_loss": -12.351306915283203, "global_step": 403949, "epoch": 2404} {"train_loss": -12.483463287353516, "global_step": 403950, "epoch": 2404} {"train_loss": -12.373932838439941, "global_step": 403951, "epoch": 2404} {"train_loss": -12.095735549926758, "global_step": 403952, "epoch": 2404} {"train_loss": -12.370065689086914, "global_step": 403953, "epoch": 2404} {"train_loss": -11.608075141906738, "global_step": 403954, "epoch": 2404} {"train_loss": -12.121899604797363, "global_step": 403955, "epoch": 2404} {"train_loss": -11.69179630279541, "global_step": 403956, "epoch": 2404} {"train_loss": -12.487298965454102, "global_step": 403957, "epoch": 2404} {"train_loss": -11.735227584838867, "global_step": 403958, "epoch": 2404} {"train_loss": -12.494217872619629, "global_step": 403959, "epoch": 2404} {"train_loss": -11.700782775878906, "global_step": 403960, "epoch": 2404} {"train_loss": -12.22996711730957, "global_step": 403961, "epoch": 2404} {"train_loss": -11.83416748046875, "global_step": 403962, "epoch": 2404} {"train_loss": -12.411441802978516, "global_step": 403963, "epoch": 2404} {"train_loss": -11.936553955078125, "global_step": 403964, "epoch": 2404} {"train_loss": -11.784024238586426, "global_step": 403965, "epoch": 2404} {"train_loss": -11.748030662536621, "global_step": 403966, "epoch": 2404} {"train_loss": -12.201749801635742, "global_step": 403967, "epoch": 2404} {"train_loss": -11.641610145568848, "global_step": 403968, "epoch": 2404} {"train_loss": -12.32264232635498, "global_step": 403969, "epoch": 2404} {"train_loss": -11.966875076293945, "global_step": 403970, "epoch": 2404} {"train_loss": -11.875486373901367, "global_step": 403971, "epoch": 2404} {"train_loss": -12.141399383544922, "global_step": 403972, "epoch": 2404} {"train_loss": -12.121822357177734, "global_step": 403973, "epoch": 2404} {"train_loss": -12.41610336303711, "global_step": 403974, "epoch": 2404} {"train_loss": -12.176153182983398, "global_step": 403975, "epoch": 2404} {"train_loss": -12.377397537231445, "global_step": 403976, "epoch": 2404} {"train_loss": -12.30765151977539, "global_step": 403977, "epoch": 2404} {"train_loss": -12.080732345581055, "global_step": 403978, "epoch": 2404} {"train_loss": -11.957213401794434, "global_step": 403979, "epoch": 2404} {"train_loss": -12.454116821289062, "global_step": 403980, "epoch": 2404} {"train_loss": -11.872635841369629, "global_step": 403981, "epoch": 2404} {"train_loss": -12.047616958618164, "global_step": 403982, "epoch": 2404} {"train_loss": -12.542495727539062, "global_step": 403983, "epoch": 2404} {"train_loss": -11.978240013122559, "global_step": 403984, "epoch": 2404} {"train_loss": -11.988412857055664, "global_step": 403985, "epoch": 2404} {"train_loss": -12.372334480285645, "global_step": 403986, "epoch": 2404} {"train_loss": -12.424808502197266, "global_step": 403987, "epoch": 2404} {"train_loss": -12.185060501098633, "global_step": 403988, "epoch": 2404} {"train_loss": -12.336071014404297, "global_step": 403989, "epoch": 2404} {"train_loss": -12.03154182434082, "global_step": 403990, "epoch": 2404} {"train_loss": -12.139769554138184, "global_step": 403991, "epoch": 2404} {"train_loss": -11.992258071899414, "global_step": 403992, "epoch": 2404} {"train_loss": -11.80478286743164, "global_step": 403993, "epoch": 2404} {"train_loss": -12.294929504394531, "global_step": 403994, "epoch": 2404} {"train_loss": -11.715208053588867, "global_step": 403995, "epoch": 2404} {"train_loss": -12.131757736206055, "global_step": 403996, "epoch": 2404} {"train_loss": -12.308879852294922, "global_step": 403997, "epoch": 2404} {"train_loss": -11.81717586517334, "global_step": 403998, "epoch": 2404} {"train_loss": -12.171672821044922, "global_step": 403999, "epoch": 2404} {"train_loss": -11.77206039428711, "global_step": 404000, "epoch": 2404} {"train_loss": -12.08018684387207, "global_step": 404001, "epoch": 2404} {"train_loss": -12.257956504821777, "global_step": 404002, "epoch": 2404} {"train_loss": -11.898605346679688, "global_step": 404003, "epoch": 2404} {"train_loss": -11.856626510620117, "global_step": 404004, "epoch": 2404} {"train_loss": -12.23338508605957, "global_step": 404005, "epoch": 2404} {"train_loss": -12.291853904724121, "global_step": 404006, "epoch": 2404} {"train_loss": -12.29554557800293, "global_step": 404007, "epoch": 2404} {"train_loss": -12.54500961303711, "global_step": 404008, "epoch": 2404} {"train_loss": -11.916500091552734, "global_step": 404009, "epoch": 2404} {"train_loss": -12.626688957214355, "global_step": 404010, "epoch": 2404} {"train_loss": -11.644147872924805, "global_step": 404011, "epoch": 2404} {"train_loss": -12.345626831054688, "global_step": 404012, "epoch": 2404} {"train_loss": -12.175785064697266, "global_step": 404013, "epoch": 2404} {"train_loss": -12.202165603637695, "global_step": 404014, "epoch": 2404} {"train_loss": -12.371648788452148, "global_step": 404015, "epoch": 2404} {"train_loss": -11.901162147521973, "global_step": 404016, "epoch": 2404} {"train_loss": -12.436912536621094, "global_step": 404017, "epoch": 2404} {"train_loss": -11.951443672180176, "global_step": 404018, "epoch": 2404} {"train_loss": -12.00030517578125, "global_step": 404019, "epoch": 2404} {"train_loss": -12.236663818359375, "global_step": 404020, "epoch": 2404} {"train_loss": -12.343696594238281, "global_step": 404021, "epoch": 2404} {"train_loss": -12.256097793579102, "global_step": 404022, "epoch": 2404} {"train_loss": -12.179893493652344, "global_step": 404023, "epoch": 2404} {"train_loss": -11.622448921203613, "global_step": 404024, "epoch": 2404} {"train_loss": -12.439833641052246, "global_step": 404025, "epoch": 2404} {"train_loss": -11.390277862548828, "global_step": 404026, "epoch": 2404} {"train_loss": -12.31146240234375, "global_step": 404027, "epoch": 2404} {"train_loss": -11.474444389343262, "global_step": 404028, "epoch": 2404} {"train_loss": -11.118406295776367, "global_step": 404029, "epoch": 2404} {"train_loss": -12.166646957397461, "global_step": 404030, "epoch": 2404} {"train_loss": -12.155776977539062, "global_step": 404031, "epoch": 2404} {"train_loss": -11.846281051635742, "global_step": 404032, "epoch": 2404} {"train_loss": -11.890762329101562, "global_step": 404033, "epoch": 2404} {"train_loss": -11.993103981018066, "global_step": 404034, "epoch": 2404} {"train_loss": -11.99636459350586, "global_step": 404035, "epoch": 2404} {"train_loss": -11.71963119506836, "global_step": 404036, "epoch": 2404} {"train_loss": -12.272310256958008, "global_step": 404037, "epoch": 2404} {"train_loss": -11.95992374420166, "global_step": 404038, "epoch": 2404} {"train_loss": -11.93956648735773, "global_step": 404039, "epoch": 2404, "val_loss": 304933.5} {"train_loss": -12.11796760559082, "global_step": 404040, "epoch": 2405} {"train_loss": -12.247722625732422, "global_step": 404041, "epoch": 2405} {"train_loss": -11.843522071838379, "global_step": 404042, "epoch": 2405} {"train_loss": -12.020004272460938, "global_step": 404043, "epoch": 2405} {"train_loss": -12.639394760131836, "global_step": 404044, "epoch": 2405} {"train_loss": -11.521774291992188, "global_step": 404045, "epoch": 2405} {"train_loss": -12.259997367858887, "global_step": 404046, "epoch": 2405} {"train_loss": -12.108048439025879, "global_step": 404047, "epoch": 2405} {"train_loss": -11.967887878417969, "global_step": 404048, "epoch": 2405} {"train_loss": -12.28570556640625, "global_step": 404049, "epoch": 2405} {"train_loss": -12.079029083251953, "global_step": 404050, "epoch": 2405} {"train_loss": -12.594293594360352, "global_step": 404051, "epoch": 2405} {"train_loss": -12.259659767150879, "global_step": 404052, "epoch": 2405} {"train_loss": -12.137577056884766, "global_step": 404053, "epoch": 2405} {"train_loss": -12.660480499267578, "global_step": 404054, "epoch": 2405} {"train_loss": -11.657222747802734, "global_step": 404055, "epoch": 2405} {"train_loss": -12.396636009216309, "global_step": 404056, "epoch": 2405} {"train_loss": -12.433576583862305, "global_step": 404057, "epoch": 2405} {"train_loss": -11.913836479187012, "global_step": 404058, "epoch": 2405} {"train_loss": -12.507051467895508, "global_step": 404059, "epoch": 2405} {"train_loss": -12.093701362609863, "global_step": 404060, "epoch": 2405} {"train_loss": -12.112570762634277, "global_step": 404061, "epoch": 2405} {"train_loss": -11.975542068481445, "global_step": 404062, "epoch": 2405} {"train_loss": -12.353008270263672, "global_step": 404063, "epoch": 2405} {"train_loss": -12.471295356750488, "global_step": 404064, "epoch": 2405} {"train_loss": -11.63134479522705, "global_step": 404065, "epoch": 2405} {"train_loss": -12.4599609375, "global_step": 404066, "epoch": 2405} {"train_loss": -12.206537246704102, "global_step": 404067, "epoch": 2405} {"train_loss": -11.75646686553955, "global_step": 404068, "epoch": 2405} {"train_loss": -12.327162742614746, "global_step": 404069, "epoch": 2405} {"train_loss": -12.569326400756836, "global_step": 404070, "epoch": 2405} {"train_loss": -12.414398193359375, "global_step": 404071, "epoch": 2405} {"train_loss": -12.39216423034668, "global_step": 404072, "epoch": 2405} {"train_loss": -12.316454887390137, "global_step": 404073, "epoch": 2405} {"train_loss": -12.532726287841797, "global_step": 404074, "epoch": 2405} {"train_loss": -12.455009460449219, "global_step": 404075, "epoch": 2405} {"train_loss": -12.378381729125977, "global_step": 404076, "epoch": 2405} {"train_loss": -12.694450378417969, "global_step": 404077, "epoch": 2405} {"train_loss": -12.235835075378418, "global_step": 404078, "epoch": 2405} {"train_loss": -12.211012840270996, "global_step": 404079, "epoch": 2405} {"train_loss": -12.642146110534668, "global_step": 404080, "epoch": 2405} {"train_loss": -12.359647750854492, "global_step": 404081, "epoch": 2405} {"train_loss": -12.570884704589844, "global_step": 404082, "epoch": 2405} {"train_loss": -12.277742385864258, "global_step": 404083, "epoch": 2405} {"train_loss": -12.219755172729492, "global_step": 404084, "epoch": 2405} {"train_loss": -11.930630683898926, "global_step": 404085, "epoch": 2405} {"train_loss": -12.513873100280762, "global_step": 404086, "epoch": 2405} {"train_loss": -11.125885009765625, "global_step": 404087, "epoch": 2405} {"train_loss": -11.261350631713867, "global_step": 404088, "epoch": 2405} {"train_loss": -12.055407524108887, "global_step": 404089, "epoch": 2405} {"train_loss": -11.641803741455078, "global_step": 404090, "epoch": 2405} {"train_loss": -12.111387252807617, "global_step": 404091, "epoch": 2405} {"train_loss": -11.971268653869629, "global_step": 404092, "epoch": 2405} {"train_loss": -12.299516677856445, "global_step": 404093, "epoch": 2405} {"train_loss": -12.30587387084961, "global_step": 404094, "epoch": 2405} {"train_loss": -11.34588623046875, "global_step": 404095, "epoch": 2405} {"train_loss": -11.508045196533203, "global_step": 404096, "epoch": 2405} {"train_loss": -12.13743782043457, "global_step": 404097, "epoch": 2405} {"train_loss": -11.313158988952637, "global_step": 404098, "epoch": 2405} {"train_loss": -12.300926208496094, "global_step": 404099, "epoch": 2405} {"train_loss": -12.132436752319336, "global_step": 404100, "epoch": 2405} {"train_loss": -10.958597183227539, "global_step": 404101, "epoch": 2405} {"train_loss": -12.001787185668945, "global_step": 404102, "epoch": 2405} {"train_loss": -12.008578300476074, "global_step": 404103, "epoch": 2405} {"train_loss": -11.339862823486328, "global_step": 404104, "epoch": 2405} {"train_loss": -11.00712776184082, "global_step": 404105, "epoch": 2405} {"train_loss": -12.536844253540039, "global_step": 404106, "epoch": 2405} {"train_loss": -10.872376441955566, "global_step": 404107, "epoch": 2405} {"train_loss": -11.808977127075195, "global_step": 404108, "epoch": 2405} {"train_loss": -11.491990089416504, "global_step": 404109, "epoch": 2405} {"train_loss": -12.047027587890625, "global_step": 404110, "epoch": 2405} {"train_loss": -12.122201919555664, "global_step": 404111, "epoch": 2405} {"train_loss": -11.953779220581055, "global_step": 404112, "epoch": 2405} {"train_loss": -12.01439094543457, "global_step": 404113, "epoch": 2405} {"train_loss": -11.761950492858887, "global_step": 404114, "epoch": 2405} {"train_loss": -12.13197135925293, "global_step": 404115, "epoch": 2405} {"train_loss": -11.738080978393555, "global_step": 404116, "epoch": 2405} {"train_loss": -11.858758926391602, "global_step": 404117, "epoch": 2405} {"train_loss": -11.88492488861084, "global_step": 404118, "epoch": 2405} {"train_loss": -10.410401344299316, "global_step": 404119, "epoch": 2405} {"train_loss": -11.794967651367188, "global_step": 404120, "epoch": 2405} {"train_loss": -10.37912368774414, "global_step": 404121, "epoch": 2405} {"train_loss": -11.923368453979492, "global_step": 404122, "epoch": 2405} {"train_loss": -10.787240028381348, "global_step": 404123, "epoch": 2405} {"train_loss": -12.222028732299805, "global_step": 404124, "epoch": 2405} {"train_loss": -11.183874130249023, "global_step": 404125, "epoch": 2405} {"train_loss": -11.202146530151367, "global_step": 404126, "epoch": 2405} {"train_loss": -11.602505683898926, "global_step": 404127, "epoch": 2405} {"train_loss": -10.975711822509766, "global_step": 404128, "epoch": 2405} {"train_loss": -12.039587020874023, "global_step": 404129, "epoch": 2405} {"train_loss": -10.524617195129395, "global_step": 404130, "epoch": 2405} {"train_loss": -12.117582321166992, "global_step": 404131, "epoch": 2405} {"train_loss": -11.484642028808594, "global_step": 404132, "epoch": 2405} {"train_loss": -11.494338035583496, "global_step": 404133, "epoch": 2405} {"train_loss": -11.718716621398926, "global_step": 404134, "epoch": 2405} {"train_loss": -11.637109756469727, "global_step": 404135, "epoch": 2405} {"train_loss": -12.09205436706543, "global_step": 404136, "epoch": 2405} {"train_loss": -10.206266403198242, "global_step": 404137, "epoch": 2405} {"train_loss": -11.821050643920898, "global_step": 404138, "epoch": 2405} {"train_loss": -10.894838333129883, "global_step": 404139, "epoch": 2405} {"train_loss": -11.752278327941895, "global_step": 404140, "epoch": 2405} {"train_loss": -11.109662055969238, "global_step": 404141, "epoch": 2405} {"train_loss": -12.208564758300781, "global_step": 404142, "epoch": 2405} {"train_loss": -11.425076484680176, "global_step": 404143, "epoch": 2405} {"train_loss": -12.264850616455078, "global_step": 404144, "epoch": 2405} {"train_loss": -11.942188262939453, "global_step": 404145, "epoch": 2405} {"train_loss": -12.191434860229492, "global_step": 404146, "epoch": 2405} {"train_loss": -11.99528694152832, "global_step": 404147, "epoch": 2405} {"train_loss": -11.73525619506836, "global_step": 404148, "epoch": 2405} {"train_loss": -12.247861862182617, "global_step": 404149, "epoch": 2405} {"train_loss": -11.962813377380371, "global_step": 404150, "epoch": 2405} {"train_loss": -12.331337928771973, "global_step": 404151, "epoch": 2405} {"train_loss": -11.847162246704102, "global_step": 404152, "epoch": 2405} {"train_loss": -12.450550079345703, "global_step": 404153, "epoch": 2405} {"train_loss": -11.946357727050781, "global_step": 404154, "epoch": 2405} {"train_loss": -12.29531478881836, "global_step": 404155, "epoch": 2405} {"train_loss": -12.244926452636719, "global_step": 404156, "epoch": 2405} {"train_loss": -12.187275886535645, "global_step": 404157, "epoch": 2405} {"train_loss": -12.098991394042969, "global_step": 404158, "epoch": 2405} {"train_loss": -12.312469482421875, "global_step": 404159, "epoch": 2405} {"train_loss": -12.118610382080078, "global_step": 404160, "epoch": 2405} {"train_loss": -12.179920196533203, "global_step": 404161, "epoch": 2405} {"train_loss": -12.379451751708984, "global_step": 404162, "epoch": 2405} {"train_loss": -12.187820434570312, "global_step": 404163, "epoch": 2405} {"train_loss": -12.373799324035645, "global_step": 404164, "epoch": 2405} {"train_loss": -12.251226425170898, "global_step": 404165, "epoch": 2405} {"train_loss": -12.403656959533691, "global_step": 404166, "epoch": 2405} {"train_loss": -12.35740852355957, "global_step": 404167, "epoch": 2405} {"train_loss": -12.482635498046875, "global_step": 404168, "epoch": 2405} {"train_loss": -12.366825103759766, "global_step": 404169, "epoch": 2405} {"train_loss": -12.29578971862793, "global_step": 404170, "epoch": 2405} {"train_loss": -12.570823669433594, "global_step": 404171, "epoch": 2405} {"train_loss": -12.402915954589844, "global_step": 404172, "epoch": 2405} {"train_loss": -12.499106407165527, "global_step": 404173, "epoch": 2405} {"train_loss": -12.497459411621094, "global_step": 404174, "epoch": 2405} {"train_loss": -12.758703231811523, "global_step": 404175, "epoch": 2405} {"train_loss": -12.701353073120117, "global_step": 404176, "epoch": 2405} {"train_loss": -12.628482818603516, "global_step": 404177, "epoch": 2405} {"train_loss": -12.602935791015625, "global_step": 404178, "epoch": 2405} {"train_loss": -12.694622993469238, "global_step": 404179, "epoch": 2405} {"train_loss": -12.483234405517578, "global_step": 404180, "epoch": 2405} {"train_loss": -12.593441009521484, "global_step": 404181, "epoch": 2405} {"train_loss": -12.71365737915039, "global_step": 404182, "epoch": 2405} {"train_loss": -12.860130310058594, "global_step": 404183, "epoch": 2405} {"train_loss": -12.389942169189453, "global_step": 404184, "epoch": 2405} {"train_loss": -12.282970428466797, "global_step": 404185, "epoch": 2405} {"train_loss": -12.66534423828125, "global_step": 404186, "epoch": 2405} {"train_loss": -12.363153457641602, "global_step": 404187, "epoch": 2405} {"train_loss": -12.457130432128906, "global_step": 404188, "epoch": 2405} {"train_loss": -12.854436874389648, "global_step": 404189, "epoch": 2405} {"train_loss": -12.405099868774414, "global_step": 404190, "epoch": 2405} {"train_loss": -12.490084648132324, "global_step": 404191, "epoch": 2405} {"train_loss": -12.522911071777344, "global_step": 404192, "epoch": 2405} {"train_loss": -12.420900344848633, "global_step": 404193, "epoch": 2405} {"train_loss": -12.453716278076172, "global_step": 404194, "epoch": 2405} {"train_loss": -12.445636749267578, "global_step": 404195, "epoch": 2405} {"train_loss": -12.6947021484375, "global_step": 404196, "epoch": 2405} {"train_loss": -12.531124114990234, "global_step": 404197, "epoch": 2405} {"train_loss": -12.55418872833252, "global_step": 404198, "epoch": 2405} {"train_loss": -12.679414749145508, "global_step": 404199, "epoch": 2405} {"train_loss": -12.8388671875, "global_step": 404200, "epoch": 2405} {"train_loss": -12.725004196166992, "global_step": 404201, "epoch": 2405} {"train_loss": -12.853801727294922, "global_step": 404202, "epoch": 2405} {"train_loss": -12.809196472167969, "global_step": 404203, "epoch": 2405} {"train_loss": -12.837472915649414, "global_step": 404204, "epoch": 2405} {"train_loss": -12.596471786499023, "global_step": 404205, "epoch": 2405} {"train_loss": -12.617414474487305, "global_step": 404206, "epoch": 2405} {"train_loss": -12.10255978220985, "global_step": 404207, "epoch": 2405, "val_loss": 305063.09375, "train_action_mse_error": 0.37092840671539307} {"train_loss": -12.752790451049805, "global_step": 404208, "epoch": 2406} {"train_loss": -12.383095741271973, "global_step": 404209, "epoch": 2406} {"train_loss": -12.24795150756836, "global_step": 404210, "epoch": 2406} {"train_loss": -12.984842300415039, "global_step": 404211, "epoch": 2406} {"train_loss": -12.544824600219727, "global_step": 404212, "epoch": 2406} {"train_loss": -12.351118087768555, "global_step": 404213, "epoch": 2406} {"train_loss": -12.778517723083496, "global_step": 404214, "epoch": 2406} {"train_loss": -12.51041030883789, "global_step": 404215, "epoch": 2406} {"train_loss": -12.795483589172363, "global_step": 404216, "epoch": 2406} {"train_loss": -12.455074310302734, "global_step": 404217, "epoch": 2406} {"train_loss": -12.760883331298828, "global_step": 404218, "epoch": 2406} {"train_loss": -12.686361312866211, "global_step": 404219, "epoch": 2406} {"train_loss": -12.782698631286621, "global_step": 404220, "epoch": 2406} {"train_loss": -12.080663681030273, "global_step": 404221, "epoch": 2406} {"train_loss": -12.167424201965332, "global_step": 404222, "epoch": 2406} {"train_loss": -12.431121826171875, "global_step": 404223, "epoch": 2406} {"train_loss": -12.304940223693848, "global_step": 404224, "epoch": 2406} {"train_loss": -12.402894973754883, "global_step": 404225, "epoch": 2406} {"train_loss": -12.012310028076172, "global_step": 404226, "epoch": 2406} {"train_loss": -12.229852676391602, "global_step": 404227, "epoch": 2406} {"train_loss": -12.301628112792969, "global_step": 404228, "epoch": 2406} {"train_loss": -12.733959197998047, "global_step": 404229, "epoch": 2406} {"train_loss": -12.752704620361328, "global_step": 404230, "epoch": 2406} {"train_loss": -12.329839706420898, "global_step": 404231, "epoch": 2406} {"train_loss": -11.758529663085938, "global_step": 404232, "epoch": 2406} {"train_loss": -12.574516296386719, "global_step": 404233, "epoch": 2406} {"train_loss": -12.156953811645508, "global_step": 404234, "epoch": 2406} {"train_loss": -12.356012344360352, "global_step": 404235, "epoch": 2406} {"train_loss": -12.183570861816406, "global_step": 404236, "epoch": 2406} {"train_loss": -12.432775497436523, "global_step": 404237, "epoch": 2406} {"train_loss": -11.99244499206543, "global_step": 404238, "epoch": 2406} {"train_loss": -12.180119514465332, "global_step": 404239, "epoch": 2406} {"train_loss": -12.32366943359375, "global_step": 404240, "epoch": 2406} {"train_loss": -10.7020263671875, "global_step": 404241, "epoch": 2406} {"train_loss": -12.321407318115234, "global_step": 404242, "epoch": 2406} {"train_loss": -11.656582832336426, "global_step": 404243, "epoch": 2406} {"train_loss": -11.987584114074707, "global_step": 404244, "epoch": 2406} {"train_loss": -12.241799354553223, "global_step": 404245, "epoch": 2406} {"train_loss": -12.688321113586426, "global_step": 404246, "epoch": 2406} {"train_loss": -11.643046379089355, "global_step": 404247, "epoch": 2406} {"train_loss": -11.216737747192383, "global_step": 404248, "epoch": 2406} {"train_loss": -12.516336441040039, "global_step": 404249, "epoch": 2406} {"train_loss": -11.544170379638672, "global_step": 404250, "epoch": 2406} {"train_loss": -10.764884948730469, "global_step": 404251, "epoch": 2406} {"train_loss": -12.44305419921875, "global_step": 404252, "epoch": 2406} {"train_loss": -11.39394760131836, "global_step": 404253, "epoch": 2406} {"train_loss": -11.102490425109863, "global_step": 404254, "epoch": 2406} {"train_loss": -11.806741714477539, "global_step": 404255, "epoch": 2406} {"train_loss": -11.95475959777832, "global_step": 404256, "epoch": 2406} {"train_loss": -11.436662673950195, "global_step": 404257, "epoch": 2406} {"train_loss": -11.542118072509766, "global_step": 404258, "epoch": 2406} {"train_loss": -12.336809158325195, "global_step": 404259, "epoch": 2406} {"train_loss": -11.793935775756836, "global_step": 404260, "epoch": 2406} {"train_loss": -11.672356605529785, "global_step": 404261, "epoch": 2406} {"train_loss": -12.440037727355957, "global_step": 404262, "epoch": 2406} {"train_loss": -11.890178680419922, "global_step": 404263, "epoch": 2406} {"train_loss": -11.865791320800781, "global_step": 404264, "epoch": 2406} {"train_loss": -12.560790061950684, "global_step": 404265, "epoch": 2406} {"train_loss": -11.966257095336914, "global_step": 404266, "epoch": 2406} {"train_loss": -11.841379165649414, "global_step": 404267, "epoch": 2406} {"train_loss": -12.163589477539062, "global_step": 404268, "epoch": 2406} {"train_loss": -11.989672660827637, "global_step": 404269, "epoch": 2406} {"train_loss": -12.159339904785156, "global_step": 404270, "epoch": 2406} {"train_loss": -11.704439163208008, "global_step": 404271, "epoch": 2406} {"train_loss": -12.085590362548828, "global_step": 404272, "epoch": 2406} {"train_loss": -11.264799118041992, "global_step": 404273, "epoch": 2406} {"train_loss": -12.076054573059082, "global_step": 404274, "epoch": 2406} {"train_loss": -11.514265060424805, "global_step": 404275, "epoch": 2406} {"train_loss": -12.005837440490723, "global_step": 404276, "epoch": 2406} {"train_loss": -12.063488006591797, "global_step": 404277, "epoch": 2406} {"train_loss": -11.817977905273438, "global_step": 404278, "epoch": 2406} {"train_loss": -11.60903263092041, "global_step": 404279, "epoch": 2406} {"train_loss": -12.4428129196167, "global_step": 404280, "epoch": 2406} {"train_loss": -11.619938850402832, "global_step": 404281, "epoch": 2406} {"train_loss": -12.329349517822266, "global_step": 404282, "epoch": 2406} {"train_loss": -11.807333946228027, "global_step": 404283, "epoch": 2406} {"train_loss": -12.081533432006836, "global_step": 404284, "epoch": 2406} {"train_loss": -12.053364753723145, "global_step": 404285, "epoch": 2406} {"train_loss": -12.134343147277832, "global_step": 404286, "epoch": 2406} {"train_loss": -11.888840675354004, "global_step": 404287, "epoch": 2406} {"train_loss": -11.546623229980469, "global_step": 404288, "epoch": 2406} {"train_loss": -11.872734069824219, "global_step": 404289, "epoch": 2406} {"train_loss": -11.570215225219727, "global_step": 404290, "epoch": 2406} {"train_loss": -11.35295295715332, "global_step": 404291, "epoch": 2406} {"train_loss": -12.051475524902344, "global_step": 404292, "epoch": 2406} {"train_loss": -11.768176078796387, "global_step": 404293, "epoch": 2406} {"train_loss": -11.575181007385254, "global_step": 404294, "epoch": 2406} {"train_loss": -11.96938419342041, "global_step": 404295, "epoch": 2406} {"train_loss": -12.205358505249023, "global_step": 404296, "epoch": 2406} {"train_loss": -12.1161470413208, "global_step": 404297, "epoch": 2406} {"train_loss": -11.711809158325195, "global_step": 404298, "epoch": 2406} {"train_loss": -12.333358764648438, "global_step": 404299, "epoch": 2406} {"train_loss": -11.688915252685547, "global_step": 404300, "epoch": 2406} {"train_loss": -12.339792251586914, "global_step": 404301, "epoch": 2406} {"train_loss": -11.945581436157227, "global_step": 404302, "epoch": 2406} {"train_loss": -12.093857765197754, "global_step": 404303, "epoch": 2406} {"train_loss": -11.946863174438477, "global_step": 404304, "epoch": 2406} {"train_loss": -11.736467361450195, "global_step": 404305, "epoch": 2406} {"train_loss": -12.214722633361816, "global_step": 404306, "epoch": 2406} {"train_loss": -11.417631149291992, "global_step": 404307, "epoch": 2406} {"train_loss": -12.429719924926758, "global_step": 404308, "epoch": 2406} {"train_loss": -11.719551086425781, "global_step": 404309, "epoch": 2406} {"train_loss": -12.060543060302734, "global_step": 404310, "epoch": 2406} {"train_loss": -11.78207778930664, "global_step": 404311, "epoch": 2406} {"train_loss": -12.436750411987305, "global_step": 404312, "epoch": 2406} {"train_loss": -11.697914123535156, "global_step": 404313, "epoch": 2406} {"train_loss": -12.124115943908691, "global_step": 404314, "epoch": 2406} {"train_loss": -12.451545715332031, "global_step": 404315, "epoch": 2406} {"train_loss": -11.569894790649414, "global_step": 404316, "epoch": 2406} {"train_loss": -12.099499702453613, "global_step": 404317, "epoch": 2406} {"train_loss": -12.23434829711914, "global_step": 404318, "epoch": 2406} {"train_loss": -11.684100151062012, "global_step": 404319, "epoch": 2406} {"train_loss": -12.473155975341797, "global_step": 404320, "epoch": 2406} {"train_loss": -11.884111404418945, "global_step": 404321, "epoch": 2406} {"train_loss": -12.215194702148438, "global_step": 404322, "epoch": 2406} {"train_loss": -11.87869930267334, "global_step": 404323, "epoch": 2406} {"train_loss": -12.211959838867188, "global_step": 404324, "epoch": 2406} {"train_loss": -11.858562469482422, "global_step": 404325, "epoch": 2406} {"train_loss": -12.491657257080078, "global_step": 404326, "epoch": 2406} {"train_loss": -12.104032516479492, "global_step": 404327, "epoch": 2406} {"train_loss": -12.28852653503418, "global_step": 404328, "epoch": 2406} {"train_loss": -11.991077423095703, "global_step": 404329, "epoch": 2406} {"train_loss": -12.076995849609375, "global_step": 404330, "epoch": 2406} {"train_loss": -12.357917785644531, "global_step": 404331, "epoch": 2406} {"train_loss": -12.35854434967041, "global_step": 404332, "epoch": 2406} {"train_loss": -12.414494514465332, "global_step": 404333, "epoch": 2406} {"train_loss": -12.301677703857422, "global_step": 404334, "epoch": 2406} {"train_loss": -11.838769912719727, "global_step": 404335, "epoch": 2406} {"train_loss": -12.705343246459961, "global_step": 404336, "epoch": 2406} {"train_loss": -12.220951080322266, "global_step": 404337, "epoch": 2406} {"train_loss": -12.470640182495117, "global_step": 404338, "epoch": 2406} {"train_loss": -12.351922988891602, "global_step": 404339, "epoch": 2406} {"train_loss": -12.025154113769531, "global_step": 404340, "epoch": 2406} {"train_loss": -12.292009353637695, "global_step": 404341, "epoch": 2406} {"train_loss": -12.306661605834961, "global_step": 404342, "epoch": 2406} {"train_loss": -12.18643856048584, "global_step": 404343, "epoch": 2406} {"train_loss": -12.630874633789062, "global_step": 404344, "epoch": 2406} {"train_loss": -12.560307502746582, "global_step": 404345, "epoch": 2406} {"train_loss": -12.330784797668457, "global_step": 404346, "epoch": 2406} {"train_loss": -12.49346923828125, "global_step": 404347, "epoch": 2406} {"train_loss": -12.54896354675293, "global_step": 404348, "epoch": 2406} {"train_loss": -12.437358856201172, "global_step": 404349, "epoch": 2406} {"train_loss": -12.380627632141113, "global_step": 404350, "epoch": 2406} {"train_loss": -12.637845993041992, "global_step": 404351, "epoch": 2406} {"train_loss": -11.901212692260742, "global_step": 404352, "epoch": 2406} {"train_loss": -12.413091659545898, "global_step": 404353, "epoch": 2406} {"train_loss": -12.33145523071289, "global_step": 404354, "epoch": 2406} {"train_loss": -12.286565780639648, "global_step": 404355, "epoch": 2406} {"train_loss": -12.176422119140625, "global_step": 404356, "epoch": 2406} {"train_loss": -12.595071792602539, "global_step": 404357, "epoch": 2406} {"train_loss": -11.957749366760254, "global_step": 404358, "epoch": 2406} {"train_loss": -12.188407897949219, "global_step": 404359, "epoch": 2406} {"train_loss": -12.35329818725586, "global_step": 404360, "epoch": 2406} {"train_loss": -12.580217361450195, "global_step": 404361, "epoch": 2406} {"train_loss": -12.210055351257324, "global_step": 404362, "epoch": 2406} {"train_loss": -12.378108978271484, "global_step": 404363, "epoch": 2406} {"train_loss": -12.345361709594727, "global_step": 404364, "epoch": 2406} {"train_loss": -12.49290657043457, "global_step": 404365, "epoch": 2406} {"train_loss": -12.40793228149414, "global_step": 404366, "epoch": 2406} {"train_loss": -12.619451522827148, "global_step": 404367, "epoch": 2406} {"train_loss": -12.310192108154297, "global_step": 404368, "epoch": 2406} {"train_loss": -12.46818733215332, "global_step": 404369, "epoch": 2406} {"train_loss": -12.824312210083008, "global_step": 404370, "epoch": 2406} {"train_loss": -12.584495544433594, "global_step": 404371, "epoch": 2406} {"train_loss": -12.695363998413086, "global_step": 404372, "epoch": 2406} {"train_loss": -12.519477844238281, "global_step": 404373, "epoch": 2406} {"train_loss": -12.581551551818848, "global_step": 404374, "epoch": 2406} {"train_loss": -12.147734636352176, "global_step": 404375, "epoch": 2406, "val_loss": 302815.5} {"train_loss": -12.756444931030273, "global_step": 404376, "epoch": 2407} {"train_loss": -12.61985969543457, "global_step": 404377, "epoch": 2407} {"train_loss": -12.33875846862793, "global_step": 404378, "epoch": 2407} {"train_loss": -12.668319702148438, "global_step": 404379, "epoch": 2407} {"train_loss": -12.306501388549805, "global_step": 404380, "epoch": 2407} {"train_loss": -12.590167045593262, "global_step": 404381, "epoch": 2407} {"train_loss": -12.768524169921875, "global_step": 404382, "epoch": 2407} {"train_loss": -12.480682373046875, "global_step": 404383, "epoch": 2407} {"train_loss": -12.493230819702148, "global_step": 404384, "epoch": 2407} {"train_loss": -12.684041976928711, "global_step": 404385, "epoch": 2407} {"train_loss": -12.460151672363281, "global_step": 404386, "epoch": 2407} {"train_loss": -12.3208646774292, "global_step": 404387, "epoch": 2407} {"train_loss": -12.554122924804688, "global_step": 404388, "epoch": 2407} {"train_loss": -12.032391548156738, "global_step": 404389, "epoch": 2407} {"train_loss": -12.205976486206055, "global_step": 404390, "epoch": 2407} {"train_loss": -12.213598251342773, "global_step": 404391, "epoch": 2407} {"train_loss": -12.618142127990723, "global_step": 404392, "epoch": 2407} {"train_loss": -12.007913589477539, "global_step": 404393, "epoch": 2407} {"train_loss": -12.417957305908203, "global_step": 404394, "epoch": 2407} {"train_loss": -12.009916305541992, "global_step": 404395, "epoch": 2407} {"train_loss": -12.52182674407959, "global_step": 404396, "epoch": 2407} {"train_loss": -12.334371566772461, "global_step": 404397, "epoch": 2407} {"train_loss": -11.514090538024902, "global_step": 404398, "epoch": 2407} {"train_loss": -11.6553955078125, "global_step": 404399, "epoch": 2407} {"train_loss": -12.659029006958008, "global_step": 404400, "epoch": 2407} {"train_loss": -11.267801284790039, "global_step": 404401, "epoch": 2407} {"train_loss": -10.871240615844727, "global_step": 404402, "epoch": 2407} {"train_loss": -12.13309097290039, "global_step": 404403, "epoch": 2407} {"train_loss": -11.859432220458984, "global_step": 404404, "epoch": 2407} {"train_loss": -10.084674835205078, "global_step": 404405, "epoch": 2407} {"train_loss": -11.627985000610352, "global_step": 404406, "epoch": 2407} {"train_loss": -10.659919738769531, "global_step": 404407, "epoch": 2407} {"train_loss": -10.312519073486328, "global_step": 404408, "epoch": 2407} {"train_loss": -11.828278541564941, "global_step": 404409, "epoch": 2407} {"train_loss": -8.673969268798828, "global_step": 404410, "epoch": 2407} {"train_loss": -11.603960037231445, "global_step": 404411, "epoch": 2407} {"train_loss": -10.697012901306152, "global_step": 404412, "epoch": 2407} {"train_loss": -10.895522117614746, "global_step": 404413, "epoch": 2407} {"train_loss": -11.5172758102417, "global_step": 404414, "epoch": 2407} {"train_loss": -11.347577095031738, "global_step": 404415, "epoch": 2407} {"train_loss": -11.471822738647461, "global_step": 404416, "epoch": 2407} {"train_loss": -11.714746475219727, "global_step": 404417, "epoch": 2407} {"train_loss": -11.546433448791504, "global_step": 404418, "epoch": 2407} {"train_loss": -11.464805603027344, "global_step": 404419, "epoch": 2407} {"train_loss": -11.112798690795898, "global_step": 404420, "epoch": 2407} {"train_loss": -9.91220760345459, "global_step": 404421, "epoch": 2407} {"train_loss": -11.726484298706055, "global_step": 404422, "epoch": 2407} {"train_loss": -10.769001960754395, "global_step": 404423, "epoch": 2407} {"train_loss": -11.612469673156738, "global_step": 404424, "epoch": 2407} {"train_loss": -10.524349212646484, "global_step": 404425, "epoch": 2407} {"train_loss": -11.199728012084961, "global_step": 404426, "epoch": 2407} {"train_loss": -11.24563217163086, "global_step": 404427, "epoch": 2407} {"train_loss": -11.671945571899414, "global_step": 404428, "epoch": 2407} {"train_loss": -11.705113410949707, "global_step": 404429, "epoch": 2407} {"train_loss": -11.481164932250977, "global_step": 404430, "epoch": 2407} {"train_loss": -12.145377159118652, "global_step": 404431, "epoch": 2407} {"train_loss": -11.217437744140625, "global_step": 404432, "epoch": 2407} {"train_loss": -12.17651653289795, "global_step": 404433, "epoch": 2407} {"train_loss": -11.551624298095703, "global_step": 404434, "epoch": 2407} {"train_loss": -11.366231918334961, "global_step": 404435, "epoch": 2407} {"train_loss": -11.83271598815918, "global_step": 404436, "epoch": 2407} {"train_loss": -11.731385231018066, "global_step": 404437, "epoch": 2407} {"train_loss": -11.875028610229492, "global_step": 404438, "epoch": 2407} {"train_loss": -12.020517349243164, "global_step": 404439, "epoch": 2407} {"train_loss": -12.032718658447266, "global_step": 404440, "epoch": 2407} {"train_loss": -12.152302742004395, "global_step": 404441, "epoch": 2407} {"train_loss": -12.031278610229492, "global_step": 404442, "epoch": 2407} {"train_loss": -12.119284629821777, "global_step": 404443, "epoch": 2407} {"train_loss": -12.069751739501953, "global_step": 404444, "epoch": 2407} {"train_loss": -11.962870597839355, "global_step": 404445, "epoch": 2407} {"train_loss": -11.820366859436035, "global_step": 404446, "epoch": 2407} {"train_loss": -11.921781539916992, "global_step": 404447, "epoch": 2407} {"train_loss": -11.952938079833984, "global_step": 404448, "epoch": 2407} {"train_loss": -11.709295272827148, "global_step": 404449, "epoch": 2407} {"train_loss": -11.844328880310059, "global_step": 404450, "epoch": 2407} {"train_loss": -11.73569107055664, "global_step": 404451, "epoch": 2407} {"train_loss": -11.916231155395508, "global_step": 404452, "epoch": 2407} {"train_loss": -11.852486610412598, "global_step": 404453, "epoch": 2407} {"train_loss": -11.931411743164062, "global_step": 404454, "epoch": 2407} {"train_loss": -12.007840156555176, "global_step": 404455, "epoch": 2407} {"train_loss": -12.151687622070312, "global_step": 404456, "epoch": 2407} {"train_loss": -12.065940856933594, "global_step": 404457, "epoch": 2407} {"train_loss": -11.995403289794922, "global_step": 404458, "epoch": 2407} {"train_loss": -12.183478355407715, "global_step": 404459, "epoch": 2407} {"train_loss": -12.05849838256836, "global_step": 404460, "epoch": 2407} {"train_loss": -12.020955085754395, "global_step": 404461, "epoch": 2407} {"train_loss": -12.551370620727539, "global_step": 404462, "epoch": 2407} {"train_loss": -11.963726043701172, "global_step": 404463, "epoch": 2407} {"train_loss": -12.490254402160645, "global_step": 404464, "epoch": 2407} {"train_loss": -12.197894096374512, "global_step": 404465, "epoch": 2407} {"train_loss": -12.330221176147461, "global_step": 404466, "epoch": 2407} {"train_loss": -12.486507415771484, "global_step": 404467, "epoch": 2407} {"train_loss": -12.408716201782227, "global_step": 404468, "epoch": 2407} {"train_loss": -12.335387229919434, "global_step": 404469, "epoch": 2407} {"train_loss": -12.373385429382324, "global_step": 404470, "epoch": 2407} {"train_loss": -12.434469223022461, "global_step": 404471, "epoch": 2407} {"train_loss": -12.382490158081055, "global_step": 404472, "epoch": 2407} {"train_loss": -12.358647346496582, "global_step": 404473, "epoch": 2407} {"train_loss": -12.219923973083496, "global_step": 404474, "epoch": 2407} {"train_loss": -12.64896011352539, "global_step": 404475, "epoch": 2407} {"train_loss": -12.451614379882812, "global_step": 404476, "epoch": 2407} {"train_loss": -12.630597114562988, "global_step": 404477, "epoch": 2407} {"train_loss": -12.247407913208008, "global_step": 404478, "epoch": 2407} {"train_loss": -12.301651000976562, "global_step": 404479, "epoch": 2407} {"train_loss": -12.503933906555176, "global_step": 404480, "epoch": 2407} {"train_loss": -12.469870567321777, "global_step": 404481, "epoch": 2407} {"train_loss": -12.322319030761719, "global_step": 404482, "epoch": 2407} {"train_loss": -12.454689979553223, "global_step": 404483, "epoch": 2407} {"train_loss": -12.692703247070312, "global_step": 404484, "epoch": 2407} {"train_loss": -12.399322509765625, "global_step": 404485, "epoch": 2407} {"train_loss": -12.497701644897461, "global_step": 404486, "epoch": 2407} {"train_loss": -12.515494346618652, "global_step": 404487, "epoch": 2407} {"train_loss": -12.325233459472656, "global_step": 404488, "epoch": 2407} {"train_loss": -12.576711654663086, "global_step": 404489, "epoch": 2407} {"train_loss": -12.394227027893066, "global_step": 404490, "epoch": 2407} {"train_loss": -12.5887451171875, "global_step": 404491, "epoch": 2407} {"train_loss": -12.458417892456055, "global_step": 404492, "epoch": 2407} {"train_loss": -12.772635459899902, "global_step": 404493, "epoch": 2407} {"train_loss": -11.91421890258789, "global_step": 404494, "epoch": 2407} {"train_loss": -12.600616455078125, "global_step": 404495, "epoch": 2407} {"train_loss": -12.515274047851562, "global_step": 404496, "epoch": 2407} {"train_loss": -12.678686141967773, "global_step": 404497, "epoch": 2407} {"train_loss": -12.778111457824707, "global_step": 404498, "epoch": 2407} {"train_loss": -12.836240768432617, "global_step": 404499, "epoch": 2407} {"train_loss": -12.760147094726562, "global_step": 404500, "epoch": 2407} {"train_loss": -12.60273551940918, "global_step": 404501, "epoch": 2407} {"train_loss": -12.592541694641113, "global_step": 404502, "epoch": 2407} {"train_loss": -12.772939682006836, "global_step": 404503, "epoch": 2407} {"train_loss": -12.40880012512207, "global_step": 404504, "epoch": 2407} {"train_loss": -12.808988571166992, "global_step": 404505, "epoch": 2407} {"train_loss": -12.75959587097168, "global_step": 404506, "epoch": 2407} {"train_loss": -12.793190002441406, "global_step": 404507, "epoch": 2407} {"train_loss": -12.715680122375488, "global_step": 404508, "epoch": 2407} {"train_loss": -12.888006210327148, "global_step": 404509, "epoch": 2407} {"train_loss": -12.701888084411621, "global_step": 404510, "epoch": 2407} {"train_loss": -12.740999221801758, "global_step": 404511, "epoch": 2407} {"train_loss": -12.427258491516113, "global_step": 404512, "epoch": 2407} {"train_loss": -12.626581192016602, "global_step": 404513, "epoch": 2407} {"train_loss": -12.495792388916016, "global_step": 404514, "epoch": 2407} {"train_loss": -12.761439323425293, "global_step": 404515, "epoch": 2407} {"train_loss": -12.149962425231934, "global_step": 404516, "epoch": 2407} {"train_loss": -12.345026016235352, "global_step": 404517, "epoch": 2407} {"train_loss": -12.408744812011719, "global_step": 404518, "epoch": 2407} {"train_loss": -12.364026069641113, "global_step": 404519, "epoch": 2407} {"train_loss": -10.477714538574219, "global_step": 404520, "epoch": 2407} {"train_loss": -11.435211181640625, "global_step": 404521, "epoch": 2407} {"train_loss": -9.68227767944336, "global_step": 404522, "epoch": 2407} {"train_loss": -9.66568374633789, "global_step": 404523, "epoch": 2407} {"train_loss": -10.045928001403809, "global_step": 404524, "epoch": 2407} {"train_loss": -8.304925918579102, "global_step": 404525, "epoch": 2407} {"train_loss": -8.375925064086914, "global_step": 404526, "epoch": 2407} {"train_loss": -9.157427787780762, "global_step": 404527, "epoch": 2407} {"train_loss": -10.652408599853516, "global_step": 404528, "epoch": 2407} {"train_loss": -10.332636833190918, "global_step": 404529, "epoch": 2407} {"train_loss": -10.129783630371094, "global_step": 404530, "epoch": 2407} {"train_loss": -10.40904426574707, "global_step": 404531, "epoch": 2407} {"train_loss": -8.605141639709473, "global_step": 404532, "epoch": 2407} {"train_loss": -9.493431091308594, "global_step": 404533, "epoch": 2407} {"train_loss": -11.051349639892578, "global_step": 404534, "epoch": 2407} {"train_loss": -9.314462661743164, "global_step": 404535, "epoch": 2407} {"train_loss": -10.606715202331543, "global_step": 404536, "epoch": 2407} {"train_loss": -9.873771667480469, "global_step": 404537, "epoch": 2407} {"train_loss": -9.131256103515625, "global_step": 404538, "epoch": 2407} {"train_loss": -10.559871673583984, "global_step": 404539, "epoch": 2407} {"train_loss": -11.537109375, "global_step": 404540, "epoch": 2407} {"train_loss": -10.3416166305542, "global_step": 404541, "epoch": 2407} {"train_loss": -11.356082916259766, "global_step": 404542, "epoch": 2407} {"train_loss": -11.781894910903205, "global_step": 404543, "epoch": 2407, "val_loss": 295967.34375} {"train_loss": -11.756233215332031, "global_step": 404544, "epoch": 2408} {"train_loss": -10.700468063354492, "global_step": 404545, "epoch": 2408} {"train_loss": -10.533140182495117, "global_step": 404546, "epoch": 2408} {"train_loss": -11.648124694824219, "global_step": 404547, "epoch": 2408} {"train_loss": -11.356626510620117, "global_step": 404548, "epoch": 2408} {"train_loss": -11.169326782226562, "global_step": 404549, "epoch": 2408} {"train_loss": -11.646707534790039, "global_step": 404550, "epoch": 2408} {"train_loss": -11.384210586547852, "global_step": 404551, "epoch": 2408} {"train_loss": -11.629292488098145, "global_step": 404552, "epoch": 2408} {"train_loss": -11.905855178833008, "global_step": 404553, "epoch": 2408} {"train_loss": -12.033907890319824, "global_step": 404554, "epoch": 2408} {"train_loss": -11.123941421508789, "global_step": 404555, "epoch": 2408} {"train_loss": -11.38642692565918, "global_step": 404556, "epoch": 2408} {"train_loss": -11.628002166748047, "global_step": 404557, "epoch": 2408} {"train_loss": -11.75036334991455, "global_step": 404558, "epoch": 2408} {"train_loss": -11.65927791595459, "global_step": 404559, "epoch": 2408} {"train_loss": -11.592854499816895, "global_step": 404560, "epoch": 2408} {"train_loss": -11.337118148803711, "global_step": 404561, "epoch": 2408} {"train_loss": -12.003376007080078, "global_step": 404562, "epoch": 2408} {"train_loss": -11.764801979064941, "global_step": 404563, "epoch": 2408} {"train_loss": -11.91127872467041, "global_step": 404564, "epoch": 2408} {"train_loss": -11.88679313659668, "global_step": 404565, "epoch": 2408} {"train_loss": -12.29170036315918, "global_step": 404566, "epoch": 2408} {"train_loss": -11.874238014221191, "global_step": 404567, "epoch": 2408} {"train_loss": -12.363679885864258, "global_step": 404568, "epoch": 2408} {"train_loss": -12.093526840209961, "global_step": 404569, "epoch": 2408} {"train_loss": -12.132390975952148, "global_step": 404570, "epoch": 2408} {"train_loss": -12.361404418945312, "global_step": 404571, "epoch": 2408} {"train_loss": -12.344554901123047, "global_step": 404572, "epoch": 2408} {"train_loss": -12.302461624145508, "global_step": 404573, "epoch": 2408} {"train_loss": -12.284049034118652, "global_step": 404574, "epoch": 2408} {"train_loss": -12.204914093017578, "global_step": 404575, "epoch": 2408} {"train_loss": -12.301980972290039, "global_step": 404576, "epoch": 2408} {"train_loss": -12.373383522033691, "global_step": 404577, "epoch": 2408} {"train_loss": -12.268552780151367, "global_step": 404578, "epoch": 2408} {"train_loss": -12.335856437683105, "global_step": 404579, "epoch": 2408} {"train_loss": -12.462446212768555, "global_step": 404580, "epoch": 2408} {"train_loss": -12.509306907653809, "global_step": 404581, "epoch": 2408} {"train_loss": -12.462329864501953, "global_step": 404582, "epoch": 2408} {"train_loss": -12.479528427124023, "global_step": 404583, "epoch": 2408} {"train_loss": -12.450491905212402, "global_step": 404584, "epoch": 2408} {"train_loss": -12.541301727294922, "global_step": 404585, "epoch": 2408} {"train_loss": -12.388145446777344, "global_step": 404586, "epoch": 2408} {"train_loss": -12.500298500061035, "global_step": 404587, "epoch": 2408} {"train_loss": -12.362374305725098, "global_step": 404588, "epoch": 2408} {"train_loss": -12.385339736938477, "global_step": 404589, "epoch": 2408} {"train_loss": -12.104870796203613, "global_step": 404590, "epoch": 2408} {"train_loss": -12.415406227111816, "global_step": 404591, "epoch": 2408} {"train_loss": -12.607765197753906, "global_step": 404592, "epoch": 2408} {"train_loss": -12.31283950805664, "global_step": 404593, "epoch": 2408} {"train_loss": -12.345959663391113, "global_step": 404594, "epoch": 2408} {"train_loss": -12.555733680725098, "global_step": 404595, "epoch": 2408} {"train_loss": -12.061915397644043, "global_step": 404596, "epoch": 2408} {"train_loss": -12.380069732666016, "global_step": 404597, "epoch": 2408} {"train_loss": -12.651865005493164, "global_step": 404598, "epoch": 2408} {"train_loss": -12.477875709533691, "global_step": 404599, "epoch": 2408} {"train_loss": -12.286450386047363, "global_step": 404600, "epoch": 2408} {"train_loss": -12.447006225585938, "global_step": 404601, "epoch": 2408} {"train_loss": -12.119821548461914, "global_step": 404602, "epoch": 2408} {"train_loss": -12.423771858215332, "global_step": 404603, "epoch": 2408} {"train_loss": -12.238452911376953, "global_step": 404604, "epoch": 2408} {"train_loss": -11.72821044921875, "global_step": 404605, "epoch": 2408} {"train_loss": -12.310206413269043, "global_step": 404606, "epoch": 2408} {"train_loss": -12.274163246154785, "global_step": 404607, "epoch": 2408} {"train_loss": -11.963800430297852, "global_step": 404608, "epoch": 2408} {"train_loss": -12.407453536987305, "global_step": 404609, "epoch": 2408} {"train_loss": -11.973207473754883, "global_step": 404610, "epoch": 2408} {"train_loss": -12.659914016723633, "global_step": 404611, "epoch": 2408} {"train_loss": -11.93048095703125, "global_step": 404612, "epoch": 2408} {"train_loss": -12.716686248779297, "global_step": 404613, "epoch": 2408} {"train_loss": -12.135408401489258, "global_step": 404614, "epoch": 2408} {"train_loss": -12.443537712097168, "global_step": 404615, "epoch": 2408} {"train_loss": -11.969110488891602, "global_step": 404616, "epoch": 2408} {"train_loss": -12.115606307983398, "global_step": 404617, "epoch": 2408} {"train_loss": -12.113554954528809, "global_step": 404618, "epoch": 2408} {"train_loss": -11.566919326782227, "global_step": 404619, "epoch": 2408} {"train_loss": -11.691566467285156, "global_step": 404620, "epoch": 2408} {"train_loss": -11.332380294799805, "global_step": 404621, "epoch": 2408} {"train_loss": -12.162979125976562, "global_step": 404622, "epoch": 2408} {"train_loss": -10.854180335998535, "global_step": 404623, "epoch": 2408} {"train_loss": -12.037118911743164, "global_step": 404624, "epoch": 2408} {"train_loss": -10.585330963134766, "global_step": 404625, "epoch": 2408} {"train_loss": -11.408028602600098, "global_step": 404626, "epoch": 2408} {"train_loss": -11.323076248168945, "global_step": 404627, "epoch": 2408} {"train_loss": -10.13244342803955, "global_step": 404628, "epoch": 2408} {"train_loss": -10.33418083190918, "global_step": 404629, "epoch": 2408} {"train_loss": -10.092397689819336, "global_step": 404630, "epoch": 2408} {"train_loss": -10.567072868347168, "global_step": 404631, "epoch": 2408} {"train_loss": -10.944475173950195, "global_step": 404632, "epoch": 2408} {"train_loss": -11.536123275756836, "global_step": 404633, "epoch": 2408} {"train_loss": -9.497808456420898, "global_step": 404634, "epoch": 2408} {"train_loss": -10.989047050476074, "global_step": 404635, "epoch": 2408} {"train_loss": -10.148344039916992, "global_step": 404636, "epoch": 2408} {"train_loss": -9.023750305175781, "global_step": 404637, "epoch": 2408} {"train_loss": -9.250589370727539, "global_step": 404638, "epoch": 2408} {"train_loss": -10.210046768188477, "global_step": 404639, "epoch": 2408} {"train_loss": -10.812660217285156, "global_step": 404640, "epoch": 2408} {"train_loss": -10.801029205322266, "global_step": 404641, "epoch": 2408} {"train_loss": -9.837111473083496, "global_step": 404642, "epoch": 2408} {"train_loss": -10.899272918701172, "global_step": 404643, "epoch": 2408} {"train_loss": -11.09664535522461, "global_step": 404644, "epoch": 2408} {"train_loss": -11.127934455871582, "global_step": 404645, "epoch": 2408} {"train_loss": -10.728965759277344, "global_step": 404646, "epoch": 2408} {"train_loss": -11.996240615844727, "global_step": 404647, "epoch": 2408} {"train_loss": -10.848628044128418, "global_step": 404648, "epoch": 2408} {"train_loss": -12.04724407196045, "global_step": 404649, "epoch": 2408} {"train_loss": -11.704774856567383, "global_step": 404650, "epoch": 2408} {"train_loss": -10.769681930541992, "global_step": 404651, "epoch": 2408} {"train_loss": -11.52827262878418, "global_step": 404652, "epoch": 2408} {"train_loss": -10.912927627563477, "global_step": 404653, "epoch": 2408} {"train_loss": -10.568007469177246, "global_step": 404654, "epoch": 2408} {"train_loss": -11.589552879333496, "global_step": 404655, "epoch": 2408} {"train_loss": -10.870851516723633, "global_step": 404656, "epoch": 2408} {"train_loss": -10.920219421386719, "global_step": 404657, "epoch": 2408} {"train_loss": -11.350221633911133, "global_step": 404658, "epoch": 2408} {"train_loss": -11.346990585327148, "global_step": 404659, "epoch": 2408} {"train_loss": -11.299176216125488, "global_step": 404660, "epoch": 2408} {"train_loss": -11.841119766235352, "global_step": 404661, "epoch": 2408} {"train_loss": -11.709028244018555, "global_step": 404662, "epoch": 2408} {"train_loss": -11.244874954223633, "global_step": 404663, "epoch": 2408} {"train_loss": -11.362815856933594, "global_step": 404664, "epoch": 2408} {"train_loss": -11.571617126464844, "global_step": 404665, "epoch": 2408} {"train_loss": -11.51057243347168, "global_step": 404666, "epoch": 2408} {"train_loss": -11.070894241333008, "global_step": 404667, "epoch": 2408} {"train_loss": -11.537190437316895, "global_step": 404668, "epoch": 2408} {"train_loss": -10.816629409790039, "global_step": 404669, "epoch": 2408} {"train_loss": -11.761272430419922, "global_step": 404670, "epoch": 2408} {"train_loss": -11.722776412963867, "global_step": 404671, "epoch": 2408} {"train_loss": -11.266097068786621, "global_step": 404672, "epoch": 2408} {"train_loss": -11.802996635437012, "global_step": 404673, "epoch": 2408} {"train_loss": -11.334978103637695, "global_step": 404674, "epoch": 2408} {"train_loss": -11.686933517456055, "global_step": 404675, "epoch": 2408} {"train_loss": -11.986150741577148, "global_step": 404676, "epoch": 2408} {"train_loss": -11.868860244750977, "global_step": 404677, "epoch": 2408} {"train_loss": -12.127313613891602, "global_step": 404678, "epoch": 2408} {"train_loss": -12.244422912597656, "global_step": 404679, "epoch": 2408} {"train_loss": -11.85299301147461, "global_step": 404680, "epoch": 2408} {"train_loss": -12.121109008789062, "global_step": 404681, "epoch": 2408} {"train_loss": -12.141307830810547, "global_step": 404682, "epoch": 2408} {"train_loss": -12.08496379852295, "global_step": 404683, "epoch": 2408} {"train_loss": -12.217607498168945, "global_step": 404684, "epoch": 2408} {"train_loss": -11.985906600952148, "global_step": 404685, "epoch": 2408} {"train_loss": -12.217327117919922, "global_step": 404686, "epoch": 2408} {"train_loss": -12.107132911682129, "global_step": 404687, "epoch": 2408} {"train_loss": -12.386544227600098, "global_step": 404688, "epoch": 2408} {"train_loss": -12.282413482666016, "global_step": 404689, "epoch": 2408} {"train_loss": -12.341794967651367, "global_step": 404690, "epoch": 2408} {"train_loss": -12.275432586669922, "global_step": 404691, "epoch": 2408} {"train_loss": -12.05555534362793, "global_step": 404692, "epoch": 2408} {"train_loss": -12.46377182006836, "global_step": 404693, "epoch": 2408} {"train_loss": -12.34627914428711, "global_step": 404694, "epoch": 2408} {"train_loss": -12.516279220581055, "global_step": 404695, "epoch": 2408} {"train_loss": -12.19942855834961, "global_step": 404696, "epoch": 2408} {"train_loss": -12.309630393981934, "global_step": 404697, "epoch": 2408} {"train_loss": -12.354825973510742, "global_step": 404698, "epoch": 2408} {"train_loss": -12.332868576049805, "global_step": 404699, "epoch": 2408} {"train_loss": -12.376490592956543, "global_step": 404700, "epoch": 2408} {"train_loss": -12.547378540039062, "global_step": 404701, "epoch": 2408} {"train_loss": -12.401347160339355, "global_step": 404702, "epoch": 2408} {"train_loss": -12.402609825134277, "global_step": 404703, "epoch": 2408} {"train_loss": -12.564199447631836, "global_step": 404704, "epoch": 2408} {"train_loss": -12.163618087768555, "global_step": 404705, "epoch": 2408} {"train_loss": -12.491839408874512, "global_step": 404706, "epoch": 2408} {"train_loss": -12.087779998779297, "global_step": 404707, "epoch": 2408} {"train_loss": -12.373392105102539, "global_step": 404708, "epoch": 2408} {"train_loss": -12.600116729736328, "global_step": 404709, "epoch": 2408} {"train_loss": -12.557302474975586, "global_step": 404710, "epoch": 2408} {"train_loss": -11.777539661952428, "global_step": 404711, "epoch": 2408, "val_loss": 302107.625} {"train_loss": -12.36826229095459, "global_step": 404712, "epoch": 2409} {"train_loss": -12.495861053466797, "global_step": 404713, "epoch": 2409} {"train_loss": -12.307209014892578, "global_step": 404714, "epoch": 2409} {"train_loss": -12.623384475708008, "global_step": 404715, "epoch": 2409} {"train_loss": -12.451227188110352, "global_step": 404716, "epoch": 2409} {"train_loss": -12.547262191772461, "global_step": 404717, "epoch": 2409} {"train_loss": -12.656490325927734, "global_step": 404718, "epoch": 2409} {"train_loss": -12.508403778076172, "global_step": 404719, "epoch": 2409} {"train_loss": -12.586525917053223, "global_step": 404720, "epoch": 2409} {"train_loss": -12.463561058044434, "global_step": 404721, "epoch": 2409} {"train_loss": -12.37906551361084, "global_step": 404722, "epoch": 2409} {"train_loss": -12.435359954833984, "global_step": 404723, "epoch": 2409} {"train_loss": -12.478153228759766, "global_step": 404724, "epoch": 2409} {"train_loss": -12.633227348327637, "global_step": 404725, "epoch": 2409} {"train_loss": -12.47861099243164, "global_step": 404726, "epoch": 2409} {"train_loss": -12.34896183013916, "global_step": 404727, "epoch": 2409} {"train_loss": -12.64578628540039, "global_step": 404728, "epoch": 2409} {"train_loss": -12.637094497680664, "global_step": 404729, "epoch": 2409} {"train_loss": -12.75840950012207, "global_step": 404730, "epoch": 2409} {"train_loss": -12.251672744750977, "global_step": 404731, "epoch": 2409} {"train_loss": -12.623502731323242, "global_step": 404732, "epoch": 2409} {"train_loss": -12.849031448364258, "global_step": 404733, "epoch": 2409} {"train_loss": -12.727729797363281, "global_step": 404734, "epoch": 2409} {"train_loss": -12.819185256958008, "global_step": 404735, "epoch": 2409} {"train_loss": -13.069753646850586, "global_step": 404736, "epoch": 2409} {"train_loss": -12.808624267578125, "global_step": 404737, "epoch": 2409} {"train_loss": -12.742213249206543, "global_step": 404738, "epoch": 2409} {"train_loss": -12.870521545410156, "global_step": 404739, "epoch": 2409} {"train_loss": -12.739195823669434, "global_step": 404740, "epoch": 2409} {"train_loss": -12.711944580078125, "global_step": 404741, "epoch": 2409} {"train_loss": -12.481719970703125, "global_step": 404742, "epoch": 2409} {"train_loss": -12.788039207458496, "global_step": 404743, "epoch": 2409} {"train_loss": -12.789514541625977, "global_step": 404744, "epoch": 2409} {"train_loss": -12.782936096191406, "global_step": 404745, "epoch": 2409} {"train_loss": -12.756455421447754, "global_step": 404746, "epoch": 2409} {"train_loss": -12.895528793334961, "global_step": 404747, "epoch": 2409} {"train_loss": -12.892708778381348, "global_step": 404748, "epoch": 2409} {"train_loss": -12.83532428741455, "global_step": 404749, "epoch": 2409} {"train_loss": -12.717588424682617, "global_step": 404750, "epoch": 2409} {"train_loss": -12.66464900970459, "global_step": 404751, "epoch": 2409} {"train_loss": -12.763420104980469, "global_step": 404752, "epoch": 2409} {"train_loss": -12.89981746673584, "global_step": 404753, "epoch": 2409} {"train_loss": -12.853906631469727, "global_step": 404754, "epoch": 2409} {"train_loss": -12.773250579833984, "global_step": 404755, "epoch": 2409} {"train_loss": -12.615270614624023, "global_step": 404756, "epoch": 2409} {"train_loss": -12.837833404541016, "global_step": 404757, "epoch": 2409} {"train_loss": -12.446709632873535, "global_step": 404758, "epoch": 2409} {"train_loss": -12.631893157958984, "global_step": 404759, "epoch": 2409} {"train_loss": -12.572927474975586, "global_step": 404760, "epoch": 2409} {"train_loss": -12.922086715698242, "global_step": 404761, "epoch": 2409} {"train_loss": -12.368874549865723, "global_step": 404762, "epoch": 2409} {"train_loss": -12.620264053344727, "global_step": 404763, "epoch": 2409} {"train_loss": -12.189473152160645, "global_step": 404764, "epoch": 2409} {"train_loss": -12.574745178222656, "global_step": 404765, "epoch": 2409} {"train_loss": -12.721978187561035, "global_step": 404766, "epoch": 2409} {"train_loss": -12.758350372314453, "global_step": 404767, "epoch": 2409} {"train_loss": -12.595579147338867, "global_step": 404768, "epoch": 2409} {"train_loss": -12.753181457519531, "global_step": 404769, "epoch": 2409} {"train_loss": -12.553295135498047, "global_step": 404770, "epoch": 2409} {"train_loss": -12.369461059570312, "global_step": 404771, "epoch": 2409} {"train_loss": -12.39102554321289, "global_step": 404772, "epoch": 2409} {"train_loss": -12.3624267578125, "global_step": 404773, "epoch": 2409} {"train_loss": -12.423359870910645, "global_step": 404774, "epoch": 2409} {"train_loss": -12.364294052124023, "global_step": 404775, "epoch": 2409} {"train_loss": -12.765605926513672, "global_step": 404776, "epoch": 2409} {"train_loss": -12.124486923217773, "global_step": 404777, "epoch": 2409} {"train_loss": -12.564071655273438, "global_step": 404778, "epoch": 2409} {"train_loss": -12.383459091186523, "global_step": 404779, "epoch": 2409} {"train_loss": -12.553014755249023, "global_step": 404780, "epoch": 2409} {"train_loss": -12.780092239379883, "global_step": 404781, "epoch": 2409} {"train_loss": -12.524190902709961, "global_step": 404782, "epoch": 2409} {"train_loss": -12.228586196899414, "global_step": 404783, "epoch": 2409} {"train_loss": -11.691511154174805, "global_step": 404784, "epoch": 2409} {"train_loss": -11.360610961914062, "global_step": 404785, "epoch": 2409} {"train_loss": -11.905586242675781, "global_step": 404786, "epoch": 2409} {"train_loss": -12.08285903930664, "global_step": 404787, "epoch": 2409} {"train_loss": -11.425182342529297, "global_step": 404788, "epoch": 2409} {"train_loss": -10.133462905883789, "global_step": 404789, "epoch": 2409} {"train_loss": -12.391940116882324, "global_step": 404790, "epoch": 2409} {"train_loss": -11.104835510253906, "global_step": 404791, "epoch": 2409} {"train_loss": -11.40639877319336, "global_step": 404792, "epoch": 2409} {"train_loss": -12.315040588378906, "global_step": 404793, "epoch": 2409} {"train_loss": -11.724629402160645, "global_step": 404794, "epoch": 2409} {"train_loss": -11.263687133789062, "global_step": 404795, "epoch": 2409} {"train_loss": -11.619359970092773, "global_step": 404796, "epoch": 2409} {"train_loss": -12.090713500976562, "global_step": 404797, "epoch": 2409} {"train_loss": -12.108219146728516, "global_step": 404798, "epoch": 2409} {"train_loss": -10.706527709960938, "global_step": 404799, "epoch": 2409} {"train_loss": -12.246548652648926, "global_step": 404800, "epoch": 2409} {"train_loss": -10.462782859802246, "global_step": 404801, "epoch": 2409} {"train_loss": -11.579137802124023, "global_step": 404802, "epoch": 2409} {"train_loss": -11.116012573242188, "global_step": 404803, "epoch": 2409} {"train_loss": -11.378061294555664, "global_step": 404804, "epoch": 2409} {"train_loss": -10.97004508972168, "global_step": 404805, "epoch": 2409} {"train_loss": -10.681493759155273, "global_step": 404806, "epoch": 2409} {"train_loss": -11.819608688354492, "global_step": 404807, "epoch": 2409} {"train_loss": -9.969568252563477, "global_step": 404808, "epoch": 2409} {"train_loss": -12.047165870666504, "global_step": 404809, "epoch": 2409} {"train_loss": -10.916784286499023, "global_step": 404810, "epoch": 2409} {"train_loss": -12.057132720947266, "global_step": 404811, "epoch": 2409} {"train_loss": -10.675973892211914, "global_step": 404812, "epoch": 2409} {"train_loss": -12.057673454284668, "global_step": 404813, "epoch": 2409} {"train_loss": -11.663907051086426, "global_step": 404814, "epoch": 2409} {"train_loss": -11.809784889221191, "global_step": 404815, "epoch": 2409} {"train_loss": -11.663436889648438, "global_step": 404816, "epoch": 2409} {"train_loss": -11.750875473022461, "global_step": 404817, "epoch": 2409} {"train_loss": -11.738080978393555, "global_step": 404818, "epoch": 2409} {"train_loss": -11.979496955871582, "global_step": 404819, "epoch": 2409} {"train_loss": -11.8950777053833, "global_step": 404820, "epoch": 2409} {"train_loss": -11.904083251953125, "global_step": 404821, "epoch": 2409} {"train_loss": -12.24796199798584, "global_step": 404822, "epoch": 2409} {"train_loss": -11.924165725708008, "global_step": 404823, "epoch": 2409} {"train_loss": -11.938250541687012, "global_step": 404824, "epoch": 2409} {"train_loss": -12.017849922180176, "global_step": 404825, "epoch": 2409} {"train_loss": -11.964397430419922, "global_step": 404826, "epoch": 2409} {"train_loss": -12.297995567321777, "global_step": 404827, "epoch": 2409} {"train_loss": -12.376873016357422, "global_step": 404828, "epoch": 2409} {"train_loss": -11.997751235961914, "global_step": 404829, "epoch": 2409} {"train_loss": -11.969743728637695, "global_step": 404830, "epoch": 2409} {"train_loss": -12.020292282104492, "global_step": 404831, "epoch": 2409} {"train_loss": -11.927072525024414, "global_step": 404832, "epoch": 2409} {"train_loss": -12.051424026489258, "global_step": 404833, "epoch": 2409} {"train_loss": -12.088155746459961, "global_step": 404834, "epoch": 2409} {"train_loss": -12.119683265686035, "global_step": 404835, "epoch": 2409} {"train_loss": -12.102338790893555, "global_step": 404836, "epoch": 2409} {"train_loss": -12.088157653808594, "global_step": 404837, "epoch": 2409} {"train_loss": -12.03253173828125, "global_step": 404838, "epoch": 2409} {"train_loss": -12.076830863952637, "global_step": 404839, "epoch": 2409} {"train_loss": -11.55229377746582, "global_step": 404840, "epoch": 2409} {"train_loss": -12.031292915344238, "global_step": 404841, "epoch": 2409} {"train_loss": -11.49485969543457, "global_step": 404842, "epoch": 2409} {"train_loss": -11.768449783325195, "global_step": 404843, "epoch": 2409} {"train_loss": -12.171083450317383, "global_step": 404844, "epoch": 2409} {"train_loss": -11.649106979370117, "global_step": 404845, "epoch": 2409} {"train_loss": -11.2769775390625, "global_step": 404846, "epoch": 2409} {"train_loss": -11.70320987701416, "global_step": 404847, "epoch": 2409} {"train_loss": -11.035526275634766, "global_step": 404848, "epoch": 2409} {"train_loss": -11.208015441894531, "global_step": 404849, "epoch": 2409} {"train_loss": -12.126381874084473, "global_step": 404850, "epoch": 2409} {"train_loss": -11.38204574584961, "global_step": 404851, "epoch": 2409} {"train_loss": -10.857168197631836, "global_step": 404852, "epoch": 2409} {"train_loss": -11.715392112731934, "global_step": 404853, "epoch": 2409} {"train_loss": -11.664972305297852, "global_step": 404854, "epoch": 2409} {"train_loss": -11.128396034240723, "global_step": 404855, "epoch": 2409} {"train_loss": -11.496387481689453, "global_step": 404856, "epoch": 2409} {"train_loss": -12.207658767700195, "global_step": 404857, "epoch": 2409} {"train_loss": -11.029115676879883, "global_step": 404858, "epoch": 2409} {"train_loss": -11.701955795288086, "global_step": 404859, "epoch": 2409} {"train_loss": -11.392387390136719, "global_step": 404860, "epoch": 2409} {"train_loss": -11.802630424499512, "global_step": 404861, "epoch": 2409} {"train_loss": -11.870763778686523, "global_step": 404862, "epoch": 2409} {"train_loss": -11.27038288116455, "global_step": 404863, "epoch": 2409} {"train_loss": -12.271224975585938, "global_step": 404864, "epoch": 2409} {"train_loss": -11.644735336303711, "global_step": 404865, "epoch": 2409} {"train_loss": -11.346420288085938, "global_step": 404866, "epoch": 2409} {"train_loss": -12.166282653808594, "global_step": 404867, "epoch": 2409} {"train_loss": -12.094017028808594, "global_step": 404868, "epoch": 2409} {"train_loss": -11.55715274810791, "global_step": 404869, "epoch": 2409} {"train_loss": -12.070396423339844, "global_step": 404870, "epoch": 2409} {"train_loss": -11.97156810760498, "global_step": 404871, "epoch": 2409} {"train_loss": -12.262012481689453, "global_step": 404872, "epoch": 2409} {"train_loss": -12.064629554748535, "global_step": 404873, "epoch": 2409} {"train_loss": -12.155531883239746, "global_step": 404874, "epoch": 2409} {"train_loss": -12.402885437011719, "global_step": 404875, "epoch": 2409} {"train_loss": -11.676025390625, "global_step": 404876, "epoch": 2409} {"train_loss": -12.448299407958984, "global_step": 404877, "epoch": 2409} {"train_loss": -11.657309532165527, "global_step": 404878, "epoch": 2409} {"train_loss": -12.097943277586074, "global_step": 404879, "epoch": 2409, "val_loss": 299279.75} {"train_loss": -11.77491569519043, "global_step": 404880, "epoch": 2410} {"train_loss": -11.743555068969727, "global_step": 404881, "epoch": 2410} {"train_loss": -12.2620849609375, "global_step": 404882, "epoch": 2410} {"train_loss": -10.924969673156738, "global_step": 404883, "epoch": 2410} {"train_loss": -11.620701789855957, "global_step": 404884, "epoch": 2410} {"train_loss": -11.255819320678711, "global_step": 404885, "epoch": 2410} {"train_loss": -11.410259246826172, "global_step": 404886, "epoch": 2410} {"train_loss": -11.545038223266602, "global_step": 404887, "epoch": 2410} {"train_loss": -11.98149299621582, "global_step": 404888, "epoch": 2410} {"train_loss": -11.533105850219727, "global_step": 404889, "epoch": 2410} {"train_loss": -12.144285202026367, "global_step": 404890, "epoch": 2410} {"train_loss": -11.716611862182617, "global_step": 404891, "epoch": 2410} {"train_loss": -12.038528442382812, "global_step": 404892, "epoch": 2410} {"train_loss": -11.708498001098633, "global_step": 404893, "epoch": 2410} {"train_loss": -12.338661193847656, "global_step": 404894, "epoch": 2410} {"train_loss": -11.862558364868164, "global_step": 404895, "epoch": 2410} {"train_loss": -12.116429328918457, "global_step": 404896, "epoch": 2410} {"train_loss": -11.226795196533203, "global_step": 404897, "epoch": 2410} {"train_loss": -11.718339920043945, "global_step": 404898, "epoch": 2410} {"train_loss": -12.083928108215332, "global_step": 404899, "epoch": 2410} {"train_loss": -11.760200500488281, "global_step": 404900, "epoch": 2410} {"train_loss": -12.344844818115234, "global_step": 404901, "epoch": 2410} {"train_loss": -12.058576583862305, "global_step": 404902, "epoch": 2410} {"train_loss": -11.98759651184082, "global_step": 404903, "epoch": 2410} {"train_loss": -12.092968940734863, "global_step": 404904, "epoch": 2410} {"train_loss": -11.901509284973145, "global_step": 404905, "epoch": 2410} {"train_loss": -12.185134887695312, "global_step": 404906, "epoch": 2410} {"train_loss": -11.89743423461914, "global_step": 404907, "epoch": 2410} {"train_loss": -12.09675121307373, "global_step": 404908, "epoch": 2410} {"train_loss": -11.768518447875977, "global_step": 404909, "epoch": 2410} {"train_loss": -12.352437973022461, "global_step": 404910, "epoch": 2410} {"train_loss": -11.985343933105469, "global_step": 404911, "epoch": 2410} {"train_loss": -12.331038475036621, "global_step": 404912, "epoch": 2410} {"train_loss": -12.03976058959961, "global_step": 404913, "epoch": 2410} {"train_loss": -11.850096702575684, "global_step": 404914, "epoch": 2410} {"train_loss": -12.036697387695312, "global_step": 404915, "epoch": 2410} {"train_loss": -11.949132919311523, "global_step": 404916, "epoch": 2410} {"train_loss": -12.525209426879883, "global_step": 404917, "epoch": 2410} {"train_loss": -12.133931159973145, "global_step": 404918, "epoch": 2410} {"train_loss": -12.227484703063965, "global_step": 404919, "epoch": 2410} {"train_loss": -12.345708847045898, "global_step": 404920, "epoch": 2410} {"train_loss": -12.184547424316406, "global_step": 404921, "epoch": 2410} {"train_loss": -12.582756042480469, "global_step": 404922, "epoch": 2410} {"train_loss": -12.132131576538086, "global_step": 404923, "epoch": 2410} {"train_loss": -12.606115341186523, "global_step": 404924, "epoch": 2410} {"train_loss": -12.0455904006958, "global_step": 404925, "epoch": 2410} {"train_loss": -12.36060905456543, "global_step": 404926, "epoch": 2410} {"train_loss": -12.32598876953125, "global_step": 404927, "epoch": 2410} {"train_loss": -12.143157958984375, "global_step": 404928, "epoch": 2410} {"train_loss": -12.532491683959961, "global_step": 404929, "epoch": 2410} {"train_loss": -12.44384479522705, "global_step": 404930, "epoch": 2410} {"train_loss": -12.295960426330566, "global_step": 404931, "epoch": 2410} {"train_loss": -12.13131332397461, "global_step": 404932, "epoch": 2410} {"train_loss": -12.445995330810547, "global_step": 404933, "epoch": 2410} {"train_loss": -12.754916191101074, "global_step": 404934, "epoch": 2410} {"train_loss": -12.363218307495117, "global_step": 404935, "epoch": 2410} {"train_loss": -12.678903579711914, "global_step": 404936, "epoch": 2410} {"train_loss": -12.37752914428711, "global_step": 404937, "epoch": 2410} {"train_loss": -12.291747093200684, "global_step": 404938, "epoch": 2410} {"train_loss": -12.481078147888184, "global_step": 404939, "epoch": 2410} {"train_loss": -12.302011489868164, "global_step": 404940, "epoch": 2410} {"train_loss": -12.597391128540039, "global_step": 404941, "epoch": 2410} {"train_loss": -12.660751342773438, "global_step": 404942, "epoch": 2410} {"train_loss": -12.389937400817871, "global_step": 404943, "epoch": 2410} {"train_loss": -12.55422592163086, "global_step": 404944, "epoch": 2410} {"train_loss": -12.07416820526123, "global_step": 404945, "epoch": 2410} {"train_loss": -12.419865608215332, "global_step": 404946, "epoch": 2410} {"train_loss": -12.564419746398926, "global_step": 404947, "epoch": 2410} {"train_loss": -12.717903137207031, "global_step": 404948, "epoch": 2410} {"train_loss": -12.554887771606445, "global_step": 404949, "epoch": 2410} {"train_loss": -12.557016372680664, "global_step": 404950, "epoch": 2410} {"train_loss": -12.445029258728027, "global_step": 404951, "epoch": 2410} {"train_loss": -12.653411865234375, "global_step": 404952, "epoch": 2410} {"train_loss": -12.30200481414795, "global_step": 404953, "epoch": 2410} {"train_loss": -12.623361587524414, "global_step": 404954, "epoch": 2410} {"train_loss": -12.655658721923828, "global_step": 404955, "epoch": 2410} {"train_loss": -12.528388977050781, "global_step": 404956, "epoch": 2410} {"train_loss": -12.99727725982666, "global_step": 404957, "epoch": 2410} {"train_loss": -12.355673789978027, "global_step": 404958, "epoch": 2410} {"train_loss": -12.571885108947754, "global_step": 404959, "epoch": 2410} {"train_loss": -12.646339416503906, "global_step": 404960, "epoch": 2410} {"train_loss": -12.30437183380127, "global_step": 404961, "epoch": 2410} {"train_loss": -12.565996170043945, "global_step": 404962, "epoch": 2410} {"train_loss": -12.431934356689453, "global_step": 404963, "epoch": 2410} {"train_loss": -12.221399307250977, "global_step": 404964, "epoch": 2410} {"train_loss": -12.843135833740234, "global_step": 404965, "epoch": 2410} {"train_loss": -12.368746757507324, "global_step": 404966, "epoch": 2410} {"train_loss": -12.366494178771973, "global_step": 404967, "epoch": 2410} {"train_loss": -12.544984817504883, "global_step": 404968, "epoch": 2410} {"train_loss": -12.2169771194458, "global_step": 404969, "epoch": 2410} {"train_loss": -11.974479675292969, "global_step": 404970, "epoch": 2410} {"train_loss": -12.711912155151367, "global_step": 404971, "epoch": 2410} {"train_loss": -12.064528465270996, "global_step": 404972, "epoch": 2410} {"train_loss": -12.516587257385254, "global_step": 404973, "epoch": 2410} {"train_loss": -11.570287704467773, "global_step": 404974, "epoch": 2410} {"train_loss": -12.019515037536621, "global_step": 404975, "epoch": 2410} {"train_loss": -12.3519926071167, "global_step": 404976, "epoch": 2410} {"train_loss": -12.077926635742188, "global_step": 404977, "epoch": 2410} {"train_loss": -11.890209197998047, "global_step": 404978, "epoch": 2410} {"train_loss": -12.584732055664062, "global_step": 404979, "epoch": 2410} {"train_loss": -11.734457015991211, "global_step": 404980, "epoch": 2410} {"train_loss": -12.105659484863281, "global_step": 404981, "epoch": 2410} {"train_loss": -12.306228637695312, "global_step": 404982, "epoch": 2410} {"train_loss": -12.311483383178711, "global_step": 404983, "epoch": 2410} {"train_loss": -12.106780052185059, "global_step": 404984, "epoch": 2410} {"train_loss": -12.583487510681152, "global_step": 404985, "epoch": 2410} {"train_loss": -11.881759643554688, "global_step": 404986, "epoch": 2410} {"train_loss": -12.309111595153809, "global_step": 404987, "epoch": 2410} {"train_loss": -12.45713996887207, "global_step": 404988, "epoch": 2410} {"train_loss": -12.103553771972656, "global_step": 404989, "epoch": 2410} {"train_loss": -12.215641021728516, "global_step": 404990, "epoch": 2410} {"train_loss": -12.66148567199707, "global_step": 404991, "epoch": 2410} {"train_loss": -12.396343231201172, "global_step": 404992, "epoch": 2410} {"train_loss": -11.90362548828125, "global_step": 404993, "epoch": 2410} {"train_loss": -12.626893043518066, "global_step": 404994, "epoch": 2410} {"train_loss": -12.387382507324219, "global_step": 404995, "epoch": 2410} {"train_loss": -11.877477645874023, "global_step": 404996, "epoch": 2410} {"train_loss": -12.299026489257812, "global_step": 404997, "epoch": 2410} {"train_loss": -12.106741905212402, "global_step": 404998, "epoch": 2410} {"train_loss": -12.48723030090332, "global_step": 404999, "epoch": 2410} {"train_loss": -12.400032043457031, "global_step": 405000, "epoch": 2410} {"train_loss": -12.513578414916992, "global_step": 405001, "epoch": 2410} {"train_loss": -12.472309112548828, "global_step": 405002, "epoch": 2410} {"train_loss": -12.65113353729248, "global_step": 405003, "epoch": 2410} {"train_loss": -12.460540771484375, "global_step": 405004, "epoch": 2410} {"train_loss": -12.83344841003418, "global_step": 405005, "epoch": 2410} {"train_loss": -12.463820457458496, "global_step": 405006, "epoch": 2410} {"train_loss": -12.5489501953125, "global_step": 405007, "epoch": 2410} {"train_loss": -12.393150329589844, "global_step": 405008, "epoch": 2410} {"train_loss": -12.65259075164795, "global_step": 405009, "epoch": 2410} {"train_loss": -12.407157897949219, "global_step": 405010, "epoch": 2410} {"train_loss": -12.489572525024414, "global_step": 405011, "epoch": 2410} {"train_loss": -12.421655654907227, "global_step": 405012, "epoch": 2410} {"train_loss": -12.105325698852539, "global_step": 405013, "epoch": 2410} {"train_loss": -12.548044204711914, "global_step": 405014, "epoch": 2410} {"train_loss": -12.327081680297852, "global_step": 405015, "epoch": 2410} {"train_loss": -12.297369003295898, "global_step": 405016, "epoch": 2410} {"train_loss": -12.454578399658203, "global_step": 405017, "epoch": 2410} {"train_loss": -11.833404541015625, "global_step": 405018, "epoch": 2410} {"train_loss": -12.09402084350586, "global_step": 405019, "epoch": 2410} {"train_loss": -11.609827041625977, "global_step": 405020, "epoch": 2410} {"train_loss": -11.021456718444824, "global_step": 405021, "epoch": 2410} {"train_loss": -12.309438705444336, "global_step": 405022, "epoch": 2410} {"train_loss": -11.374786376953125, "global_step": 405023, "epoch": 2410} {"train_loss": -11.079729080200195, "global_step": 405024, "epoch": 2410} {"train_loss": -12.053309440612793, "global_step": 405025, "epoch": 2410} {"train_loss": -11.24618148803711, "global_step": 405026, "epoch": 2410} {"train_loss": -10.584357261657715, "global_step": 405027, "epoch": 2410} {"train_loss": -11.306129455566406, "global_step": 405028, "epoch": 2410} {"train_loss": -12.157451629638672, "global_step": 405029, "epoch": 2410} {"train_loss": -11.58674144744873, "global_step": 405030, "epoch": 2410} {"train_loss": -11.831472396850586, "global_step": 405031, "epoch": 2410} {"train_loss": -11.186652183532715, "global_step": 405032, "epoch": 2410} {"train_loss": -11.978979110717773, "global_step": 405033, "epoch": 2410} {"train_loss": -11.277303695678711, "global_step": 405034, "epoch": 2410} {"train_loss": -11.85739517211914, "global_step": 405035, "epoch": 2410} {"train_loss": -11.483477592468262, "global_step": 405036, "epoch": 2410} {"train_loss": -10.997641563415527, "global_step": 405037, "epoch": 2410} {"train_loss": -12.384790420532227, "global_step": 405038, "epoch": 2410} {"train_loss": -11.453023910522461, "global_step": 405039, "epoch": 2410} {"train_loss": -11.759504318237305, "global_step": 405040, "epoch": 2410} {"train_loss": -11.914202690124512, "global_step": 405041, "epoch": 2410} {"train_loss": -10.694567680358887, "global_step": 405042, "epoch": 2410} {"train_loss": -11.481714248657227, "global_step": 405043, "epoch": 2410} {"train_loss": -11.209050178527832, "global_step": 405044, "epoch": 2410} {"train_loss": -11.974197387695312, "global_step": 405045, "epoch": 2410} {"train_loss": -11.716817855834961, "global_step": 405046, "epoch": 2410} {"train_loss": -12.11909141994658, "global_step": 405047, "epoch": 2410, "val_loss": 300496.3125, "train_action_mse_error": 1.2338289022445679} {"train_loss": -11.677362442016602, "global_step": 405048, "epoch": 2411} {"train_loss": -11.074289321899414, "global_step": 405049, "epoch": 2411} {"train_loss": -11.319416046142578, "global_step": 405050, "epoch": 2411} {"train_loss": -11.923357009887695, "global_step": 405051, "epoch": 2411} {"train_loss": -10.86751937866211, "global_step": 405052, "epoch": 2411} {"train_loss": -12.021038055419922, "global_step": 405053, "epoch": 2411} {"train_loss": -11.392589569091797, "global_step": 405054, "epoch": 2411} {"train_loss": -11.761602401733398, "global_step": 405055, "epoch": 2411} {"train_loss": -11.954483032226562, "global_step": 405056, "epoch": 2411} {"train_loss": -11.768366813659668, "global_step": 405057, "epoch": 2411} {"train_loss": -11.406850814819336, "global_step": 405058, "epoch": 2411} {"train_loss": -11.906405448913574, "global_step": 405059, "epoch": 2411} {"train_loss": -11.204453468322754, "global_step": 405060, "epoch": 2411} {"train_loss": -10.70704460144043, "global_step": 405061, "epoch": 2411} {"train_loss": -11.119104385375977, "global_step": 405062, "epoch": 2411} {"train_loss": -10.421197891235352, "global_step": 405063, "epoch": 2411} {"train_loss": -11.11467170715332, "global_step": 405064, "epoch": 2411} {"train_loss": -11.59826374053955, "global_step": 405065, "epoch": 2411} {"train_loss": -10.93104362487793, "global_step": 405066, "epoch": 2411} {"train_loss": -11.608233451843262, "global_step": 405067, "epoch": 2411} {"train_loss": -11.699895858764648, "global_step": 405068, "epoch": 2411} {"train_loss": -10.473227500915527, "global_step": 405069, "epoch": 2411} {"train_loss": -12.112106323242188, "global_step": 405070, "epoch": 2411} {"train_loss": -11.312288284301758, "global_step": 405071, "epoch": 2411} {"train_loss": -11.50047779083252, "global_step": 405072, "epoch": 2411} {"train_loss": -11.866808891296387, "global_step": 405073, "epoch": 2411} {"train_loss": -11.233508110046387, "global_step": 405074, "epoch": 2411} {"train_loss": -11.88552474975586, "global_step": 405075, "epoch": 2411} {"train_loss": -11.519274711608887, "global_step": 405076, "epoch": 2411} {"train_loss": -11.755830764770508, "global_step": 405077, "epoch": 2411} {"train_loss": -11.795682907104492, "global_step": 405078, "epoch": 2411} {"train_loss": -11.381591796875, "global_step": 405079, "epoch": 2411} {"train_loss": -11.685215950012207, "global_step": 405080, "epoch": 2411} {"train_loss": -11.833330154418945, "global_step": 405081, "epoch": 2411} {"train_loss": -11.381160736083984, "global_step": 405082, "epoch": 2411} {"train_loss": -11.883870124816895, "global_step": 405083, "epoch": 2411} {"train_loss": -11.584951400756836, "global_step": 405084, "epoch": 2411} {"train_loss": -11.650415420532227, "global_step": 405085, "epoch": 2411} {"train_loss": -11.303680419921875, "global_step": 405086, "epoch": 2411} {"train_loss": -11.20064926147461, "global_step": 405087, "epoch": 2411} {"train_loss": -11.479487419128418, "global_step": 405088, "epoch": 2411} {"train_loss": -11.52708625793457, "global_step": 405089, "epoch": 2411} {"train_loss": -12.04438591003418, "global_step": 405090, "epoch": 2411} {"train_loss": -11.382450103759766, "global_step": 405091, "epoch": 2411} {"train_loss": -12.200567245483398, "global_step": 405092, "epoch": 2411} {"train_loss": -11.816267013549805, "global_step": 405093, "epoch": 2411} {"train_loss": -11.562128067016602, "global_step": 405094, "epoch": 2411} {"train_loss": -11.642776489257812, "global_step": 405095, "epoch": 2411} {"train_loss": -11.831961631774902, "global_step": 405096, "epoch": 2411} {"train_loss": -12.319890975952148, "global_step": 405097, "epoch": 2411} {"train_loss": -11.986221313476562, "global_step": 405098, "epoch": 2411} {"train_loss": -12.27890396118164, "global_step": 405099, "epoch": 2411} {"train_loss": -12.153276443481445, "global_step": 405100, "epoch": 2411} {"train_loss": -12.037625312805176, "global_step": 405101, "epoch": 2411} {"train_loss": -12.18019962310791, "global_step": 405102, "epoch": 2411} {"train_loss": -12.391995429992676, "global_step": 405103, "epoch": 2411} {"train_loss": -12.20474624633789, "global_step": 405104, "epoch": 2411} {"train_loss": -11.814321517944336, "global_step": 405105, "epoch": 2411} {"train_loss": -12.027250289916992, "global_step": 405106, "epoch": 2411} {"train_loss": -11.816871643066406, "global_step": 405107, "epoch": 2411} {"train_loss": -12.372513771057129, "global_step": 405108, "epoch": 2411} {"train_loss": -12.143074035644531, "global_step": 405109, "epoch": 2411} {"train_loss": -12.4231538772583, "global_step": 405110, "epoch": 2411} {"train_loss": -12.076045989990234, "global_step": 405111, "epoch": 2411} {"train_loss": -12.149333953857422, "global_step": 405112, "epoch": 2411} {"train_loss": -12.41495132446289, "global_step": 405113, "epoch": 2411} {"train_loss": -12.242100715637207, "global_step": 405114, "epoch": 2411} {"train_loss": -12.33946418762207, "global_step": 405115, "epoch": 2411} {"train_loss": -12.042043685913086, "global_step": 405116, "epoch": 2411} {"train_loss": -12.384086608886719, "global_step": 405117, "epoch": 2411} {"train_loss": -12.019559860229492, "global_step": 405118, "epoch": 2411} {"train_loss": -12.362192153930664, "global_step": 405119, "epoch": 2411} {"train_loss": -11.957429885864258, "global_step": 405120, "epoch": 2411} {"train_loss": -12.48927116394043, "global_step": 405121, "epoch": 2411} {"train_loss": -12.055784225463867, "global_step": 405122, "epoch": 2411} {"train_loss": -12.032322883605957, "global_step": 405123, "epoch": 2411} {"train_loss": -12.270631790161133, "global_step": 405124, "epoch": 2411} {"train_loss": -12.325576782226562, "global_step": 405125, "epoch": 2411} {"train_loss": -12.083795547485352, "global_step": 405126, "epoch": 2411} {"train_loss": -12.579259872436523, "global_step": 405127, "epoch": 2411} {"train_loss": -12.009500503540039, "global_step": 405128, "epoch": 2411} {"train_loss": -12.298118591308594, "global_step": 405129, "epoch": 2411} {"train_loss": -11.88156509399414, "global_step": 405130, "epoch": 2411} {"train_loss": -12.597757339477539, "global_step": 405131, "epoch": 2411} {"train_loss": -11.94052791595459, "global_step": 405132, "epoch": 2411} {"train_loss": -12.356485366821289, "global_step": 405133, "epoch": 2411} {"train_loss": -12.480470657348633, "global_step": 405134, "epoch": 2411} {"train_loss": -12.3135347366333, "global_step": 405135, "epoch": 2411} {"train_loss": -12.478255271911621, "global_step": 405136, "epoch": 2411} {"train_loss": -12.386987686157227, "global_step": 405137, "epoch": 2411} {"train_loss": -12.3375244140625, "global_step": 405138, "epoch": 2411} {"train_loss": -12.338808059692383, "global_step": 405139, "epoch": 2411} {"train_loss": -12.503875732421875, "global_step": 405140, "epoch": 2411} {"train_loss": -12.308655738830566, "global_step": 405141, "epoch": 2411} {"train_loss": -12.342536926269531, "global_step": 405142, "epoch": 2411} {"train_loss": -12.423927307128906, "global_step": 405143, "epoch": 2411} {"train_loss": -12.45291519165039, "global_step": 405144, "epoch": 2411} {"train_loss": -12.180492401123047, "global_step": 405145, "epoch": 2411} {"train_loss": -12.39221477508545, "global_step": 405146, "epoch": 2411} {"train_loss": -12.228013038635254, "global_step": 405147, "epoch": 2411} {"train_loss": -12.509401321411133, "global_step": 405148, "epoch": 2411} {"train_loss": -12.390275001525879, "global_step": 405149, "epoch": 2411} {"train_loss": -12.418193817138672, "global_step": 405150, "epoch": 2411} {"train_loss": -12.299880981445312, "global_step": 405151, "epoch": 2411} {"train_loss": -12.128107070922852, "global_step": 405152, "epoch": 2411} {"train_loss": -12.171320915222168, "global_step": 405153, "epoch": 2411} {"train_loss": -11.761062622070312, "global_step": 405154, "epoch": 2411} {"train_loss": -12.563922882080078, "global_step": 405155, "epoch": 2411} {"train_loss": -11.635780334472656, "global_step": 405156, "epoch": 2411} {"train_loss": -12.093470573425293, "global_step": 405157, "epoch": 2411} {"train_loss": -12.434855461120605, "global_step": 405158, "epoch": 2411} {"train_loss": -12.073006629943848, "global_step": 405159, "epoch": 2411} {"train_loss": -12.147808074951172, "global_step": 405160, "epoch": 2411} {"train_loss": -12.319841384887695, "global_step": 405161, "epoch": 2411} {"train_loss": -11.900546073913574, "global_step": 405162, "epoch": 2411} {"train_loss": -12.79237174987793, "global_step": 405163, "epoch": 2411} {"train_loss": -12.065990447998047, "global_step": 405164, "epoch": 2411} {"train_loss": -11.890504837036133, "global_step": 405165, "epoch": 2411} {"train_loss": -12.784664154052734, "global_step": 405166, "epoch": 2411} {"train_loss": -11.625201225280762, "global_step": 405167, "epoch": 2411} {"train_loss": -11.520294189453125, "global_step": 405168, "epoch": 2411} {"train_loss": -12.379720687866211, "global_step": 405169, "epoch": 2411} {"train_loss": -12.013052940368652, "global_step": 405170, "epoch": 2411} {"train_loss": -11.889738082885742, "global_step": 405171, "epoch": 2411} {"train_loss": -11.447242736816406, "global_step": 405172, "epoch": 2411} {"train_loss": -11.2921781539917, "global_step": 405173, "epoch": 2411} {"train_loss": -11.343852996826172, "global_step": 405174, "epoch": 2411} {"train_loss": -11.05053424835205, "global_step": 405175, "epoch": 2411} {"train_loss": -11.938390731811523, "global_step": 405176, "epoch": 2411} {"train_loss": -11.06903076171875, "global_step": 405177, "epoch": 2411} {"train_loss": -11.527276992797852, "global_step": 405178, "epoch": 2411} {"train_loss": -11.68200969696045, "global_step": 405179, "epoch": 2411} {"train_loss": -10.548192977905273, "global_step": 405180, "epoch": 2411} {"train_loss": -12.076658248901367, "global_step": 405181, "epoch": 2411} {"train_loss": -11.134904861450195, "global_step": 405182, "epoch": 2411} {"train_loss": -11.052337646484375, "global_step": 405183, "epoch": 2411} {"train_loss": -11.659137725830078, "global_step": 405184, "epoch": 2411} {"train_loss": -11.752510070800781, "global_step": 405185, "epoch": 2411} {"train_loss": -11.94679069519043, "global_step": 405186, "epoch": 2411} {"train_loss": -11.680620193481445, "global_step": 405187, "epoch": 2411} {"train_loss": -11.9198579788208, "global_step": 405188, "epoch": 2411} {"train_loss": -11.6082124710083, "global_step": 405189, "epoch": 2411} {"train_loss": -11.418142318725586, "global_step": 405190, "epoch": 2411} {"train_loss": -11.834150314331055, "global_step": 405191, "epoch": 2411} {"train_loss": -12.106809616088867, "global_step": 405192, "epoch": 2411} {"train_loss": -11.541259765625, "global_step": 405193, "epoch": 2411} {"train_loss": -11.624543190002441, "global_step": 405194, "epoch": 2411} {"train_loss": -11.938186645507812, "global_step": 405195, "epoch": 2411} {"train_loss": -11.754011154174805, "global_step": 405196, "epoch": 2411} {"train_loss": -12.226503372192383, "global_step": 405197, "epoch": 2411} {"train_loss": -11.252544403076172, "global_step": 405198, "epoch": 2411} {"train_loss": -12.116954803466797, "global_step": 405199, "epoch": 2411} {"train_loss": -11.951913833618164, "global_step": 405200, "epoch": 2411} {"train_loss": -11.930439949035645, "global_step": 405201, "epoch": 2411} {"train_loss": -11.842958450317383, "global_step": 405202, "epoch": 2411} {"train_loss": -12.168546676635742, "global_step": 405203, "epoch": 2411} {"train_loss": -12.00910758972168, "global_step": 405204, "epoch": 2411} {"train_loss": -12.268203735351562, "global_step": 405205, "epoch": 2411} {"train_loss": -11.927215576171875, "global_step": 405206, "epoch": 2411} {"train_loss": -12.46977424621582, "global_step": 405207, "epoch": 2411} {"train_loss": -11.985136032104492, "global_step": 405208, "epoch": 2411} {"train_loss": -12.158266067504883, "global_step": 405209, "epoch": 2411} {"train_loss": -12.522102355957031, "global_step": 405210, "epoch": 2411} {"train_loss": -12.077905654907227, "global_step": 405211, "epoch": 2411} {"train_loss": -12.320737838745117, "global_step": 405212, "epoch": 2411} {"train_loss": -12.263492584228516, "global_step": 405213, "epoch": 2411} {"train_loss": -12.328685760498047, "global_step": 405214, "epoch": 2411} {"train_loss": -11.901243124689374, "global_step": 405215, "epoch": 2411, "val_loss": 302276.65625} {"train_loss": -12.264829635620117, "global_step": 405216, "epoch": 2412} {"train_loss": -12.122941970825195, "global_step": 405217, "epoch": 2412} {"train_loss": -12.171256065368652, "global_step": 405218, "epoch": 2412} {"train_loss": -11.8851957321167, "global_step": 405219, "epoch": 2412} {"train_loss": -12.14204216003418, "global_step": 405220, "epoch": 2412} {"train_loss": -12.329157829284668, "global_step": 405221, "epoch": 2412} {"train_loss": -12.168222427368164, "global_step": 405222, "epoch": 2412} {"train_loss": -12.04115104675293, "global_step": 405223, "epoch": 2412} {"train_loss": -11.949803352355957, "global_step": 405224, "epoch": 2412} {"train_loss": -12.403470039367676, "global_step": 405225, "epoch": 2412} {"train_loss": -12.03608512878418, "global_step": 405226, "epoch": 2412} {"train_loss": -12.183177947998047, "global_step": 405227, "epoch": 2412} {"train_loss": -12.280439376831055, "global_step": 405228, "epoch": 2412} {"train_loss": -11.987520217895508, "global_step": 405229, "epoch": 2412} {"train_loss": -12.28437614440918, "global_step": 405230, "epoch": 2412} {"train_loss": -11.79248332977295, "global_step": 405231, "epoch": 2412} {"train_loss": -12.205831527709961, "global_step": 405232, "epoch": 2412} {"train_loss": -11.795425415039062, "global_step": 405233, "epoch": 2412} {"train_loss": -12.258240699768066, "global_step": 405234, "epoch": 2412} {"train_loss": -12.15510368347168, "global_step": 405235, "epoch": 2412} {"train_loss": -12.436196327209473, "global_step": 405236, "epoch": 2412} {"train_loss": -12.523553848266602, "global_step": 405237, "epoch": 2412} {"train_loss": -12.561992645263672, "global_step": 405238, "epoch": 2412} {"train_loss": -12.461993217468262, "global_step": 405239, "epoch": 2412} {"train_loss": -12.442418098449707, "global_step": 405240, "epoch": 2412} {"train_loss": -12.483403205871582, "global_step": 405241, "epoch": 2412} {"train_loss": -12.382560729980469, "global_step": 405242, "epoch": 2412} {"train_loss": -12.366201400756836, "global_step": 405243, "epoch": 2412} {"train_loss": -12.648050308227539, "global_step": 405244, "epoch": 2412} {"train_loss": -12.296380996704102, "global_step": 405245, "epoch": 2412} {"train_loss": -12.566152572631836, "global_step": 405246, "epoch": 2412} {"train_loss": -12.561144828796387, "global_step": 405247, "epoch": 2412} {"train_loss": -12.409976959228516, "global_step": 405248, "epoch": 2412} {"train_loss": -12.665138244628906, "global_step": 405249, "epoch": 2412} {"train_loss": -12.536581039428711, "global_step": 405250, "epoch": 2412} {"train_loss": -12.343074798583984, "global_step": 405251, "epoch": 2412} {"train_loss": -12.59773063659668, "global_step": 405252, "epoch": 2412} {"train_loss": -12.614219665527344, "global_step": 405253, "epoch": 2412} {"train_loss": -12.858098983764648, "global_step": 405254, "epoch": 2412} {"train_loss": -12.64521598815918, "global_step": 405255, "epoch": 2412} {"train_loss": -12.74209976196289, "global_step": 405256, "epoch": 2412} {"train_loss": -12.481422424316406, "global_step": 405257, "epoch": 2412} {"train_loss": -12.530012130737305, "global_step": 405258, "epoch": 2412} {"train_loss": -12.775344848632812, "global_step": 405259, "epoch": 2412} {"train_loss": -12.631697654724121, "global_step": 405260, "epoch": 2412} {"train_loss": -12.722017288208008, "global_step": 405261, "epoch": 2412} {"train_loss": -12.529176712036133, "global_step": 405262, "epoch": 2412} {"train_loss": -12.658205032348633, "global_step": 405263, "epoch": 2412} {"train_loss": -12.744275093078613, "global_step": 405264, "epoch": 2412} {"train_loss": -12.337417602539062, "global_step": 405265, "epoch": 2412} {"train_loss": -12.827848434448242, "global_step": 405266, "epoch": 2412} {"train_loss": -12.764341354370117, "global_step": 405267, "epoch": 2412} {"train_loss": -12.636265754699707, "global_step": 405268, "epoch": 2412} {"train_loss": -12.632743835449219, "global_step": 405269, "epoch": 2412} {"train_loss": -12.059316635131836, "global_step": 405270, "epoch": 2412} {"train_loss": -12.569528579711914, "global_step": 405271, "epoch": 2412} {"train_loss": -12.661949157714844, "global_step": 405272, "epoch": 2412} {"train_loss": -12.267987251281738, "global_step": 405273, "epoch": 2412} {"train_loss": -12.860747337341309, "global_step": 405274, "epoch": 2412} {"train_loss": -12.253665924072266, "global_step": 405275, "epoch": 2412} {"train_loss": -12.508078575134277, "global_step": 405276, "epoch": 2412} {"train_loss": -12.614219665527344, "global_step": 405277, "epoch": 2412} {"train_loss": -12.346114158630371, "global_step": 405278, "epoch": 2412} {"train_loss": -12.684293746948242, "global_step": 405279, "epoch": 2412} {"train_loss": -12.111488342285156, "global_step": 405280, "epoch": 2412} {"train_loss": -11.44632339477539, "global_step": 405281, "epoch": 2412} {"train_loss": -12.440229415893555, "global_step": 405282, "epoch": 2412} {"train_loss": -12.272789001464844, "global_step": 405283, "epoch": 2412} {"train_loss": -12.191579818725586, "global_step": 405284, "epoch": 2412} {"train_loss": -12.357776641845703, "global_step": 405285, "epoch": 2412} {"train_loss": -12.156572341918945, "global_step": 405286, "epoch": 2412} {"train_loss": -12.425515174865723, "global_step": 405287, "epoch": 2412} {"train_loss": -12.429449081420898, "global_step": 405288, "epoch": 2412} {"train_loss": -11.74966049194336, "global_step": 405289, "epoch": 2412} {"train_loss": -12.449697494506836, "global_step": 405290, "epoch": 2412} {"train_loss": -12.079923629760742, "global_step": 405291, "epoch": 2412} {"train_loss": -11.462991714477539, "global_step": 405292, "epoch": 2412} {"train_loss": -10.94256591796875, "global_step": 405293, "epoch": 2412} {"train_loss": -12.260074615478516, "global_step": 405294, "epoch": 2412} {"train_loss": -11.1404447555542, "global_step": 405295, "epoch": 2412} {"train_loss": -11.635418891906738, "global_step": 405296, "epoch": 2412} {"train_loss": -12.060239791870117, "global_step": 405297, "epoch": 2412} {"train_loss": -10.353898048400879, "global_step": 405298, "epoch": 2412} {"train_loss": -11.97990608215332, "global_step": 405299, "epoch": 2412} {"train_loss": -11.831647872924805, "global_step": 405300, "epoch": 2412} {"train_loss": -11.29562759399414, "global_step": 405301, "epoch": 2412} {"train_loss": -11.946523666381836, "global_step": 405302, "epoch": 2412} {"train_loss": -12.208464622497559, "global_step": 405303, "epoch": 2412} {"train_loss": -11.194713592529297, "global_step": 405304, "epoch": 2412} {"train_loss": -10.920387268066406, "global_step": 405305, "epoch": 2412} {"train_loss": -12.209606170654297, "global_step": 405306, "epoch": 2412} {"train_loss": -11.631513595581055, "global_step": 405307, "epoch": 2412} {"train_loss": -11.392356872558594, "global_step": 405308, "epoch": 2412} {"train_loss": -12.027467727661133, "global_step": 405309, "epoch": 2412} {"train_loss": -11.963926315307617, "global_step": 405310, "epoch": 2412} {"train_loss": -12.157232284545898, "global_step": 405311, "epoch": 2412} {"train_loss": -12.102069854736328, "global_step": 405312, "epoch": 2412} {"train_loss": -11.933584213256836, "global_step": 405313, "epoch": 2412} {"train_loss": -12.059183120727539, "global_step": 405314, "epoch": 2412} {"train_loss": -12.589544296264648, "global_step": 405315, "epoch": 2412} {"train_loss": -12.01388931274414, "global_step": 405316, "epoch": 2412} {"train_loss": -12.258047103881836, "global_step": 405317, "epoch": 2412} {"train_loss": -12.118209838867188, "global_step": 405318, "epoch": 2412} {"train_loss": -12.267961502075195, "global_step": 405319, "epoch": 2412} {"train_loss": -11.966073989868164, "global_step": 405320, "epoch": 2412} {"train_loss": -11.824028015136719, "global_step": 405321, "epoch": 2412} {"train_loss": -11.582857131958008, "global_step": 405322, "epoch": 2412} {"train_loss": -12.522236824035645, "global_step": 405323, "epoch": 2412} {"train_loss": -11.9345703125, "global_step": 405324, "epoch": 2412} {"train_loss": -11.94538688659668, "global_step": 405325, "epoch": 2412} {"train_loss": -11.224663734436035, "global_step": 405326, "epoch": 2412} {"train_loss": -12.604225158691406, "global_step": 405327, "epoch": 2412} {"train_loss": -11.350234985351562, "global_step": 405328, "epoch": 2412} {"train_loss": -12.240976333618164, "global_step": 405329, "epoch": 2412} {"train_loss": -12.437678337097168, "global_step": 405330, "epoch": 2412} {"train_loss": -11.866548538208008, "global_step": 405331, "epoch": 2412} {"train_loss": -12.367448806762695, "global_step": 405332, "epoch": 2412} {"train_loss": -12.445030212402344, "global_step": 405333, "epoch": 2412} {"train_loss": -11.98190689086914, "global_step": 405334, "epoch": 2412} {"train_loss": -12.543336868286133, "global_step": 405335, "epoch": 2412} {"train_loss": -12.108882904052734, "global_step": 405336, "epoch": 2412} {"train_loss": -12.387971878051758, "global_step": 405337, "epoch": 2412} {"train_loss": -12.071678161621094, "global_step": 405338, "epoch": 2412} {"train_loss": -11.814726829528809, "global_step": 405339, "epoch": 2412} {"train_loss": -11.719158172607422, "global_step": 405340, "epoch": 2412} {"train_loss": -11.153881072998047, "global_step": 405341, "epoch": 2412} {"train_loss": -11.879505157470703, "global_step": 405342, "epoch": 2412} {"train_loss": -11.668928146362305, "global_step": 405343, "epoch": 2412} {"train_loss": -10.182975769042969, "global_step": 405344, "epoch": 2412} {"train_loss": -11.445648193359375, "global_step": 405345, "epoch": 2412} {"train_loss": -10.316534042358398, "global_step": 405346, "epoch": 2412} {"train_loss": -11.058409690856934, "global_step": 405347, "epoch": 2412} {"train_loss": -11.276484489440918, "global_step": 405348, "epoch": 2412} {"train_loss": -10.978523254394531, "global_step": 405349, "epoch": 2412} {"train_loss": -11.52389144897461, "global_step": 405350, "epoch": 2412} {"train_loss": -10.962645530700684, "global_step": 405351, "epoch": 2412} {"train_loss": -10.883594512939453, "global_step": 405352, "epoch": 2412} {"train_loss": -10.681417465209961, "global_step": 405353, "epoch": 2412} {"train_loss": -10.626768112182617, "global_step": 405354, "epoch": 2412} {"train_loss": -11.241973876953125, "global_step": 405355, "epoch": 2412} {"train_loss": -10.919060707092285, "global_step": 405356, "epoch": 2412} {"train_loss": -10.783422470092773, "global_step": 405357, "epoch": 2412} {"train_loss": -11.043724060058594, "global_step": 405358, "epoch": 2412} {"train_loss": -10.118409156799316, "global_step": 405359, "epoch": 2412} {"train_loss": -11.260214805603027, "global_step": 405360, "epoch": 2412} {"train_loss": -10.037649154663086, "global_step": 405361, "epoch": 2412} {"train_loss": -10.288080215454102, "global_step": 405362, "epoch": 2412} {"train_loss": -12.047163009643555, "global_step": 405363, "epoch": 2412} {"train_loss": -10.8849458694458, "global_step": 405364, "epoch": 2412} {"train_loss": -11.303007125854492, "global_step": 405365, "epoch": 2412} {"train_loss": -11.457172393798828, "global_step": 405366, "epoch": 2412} {"train_loss": -11.556324005126953, "global_step": 405367, "epoch": 2412} {"train_loss": -11.43680477142334, "global_step": 405368, "epoch": 2412} {"train_loss": -12.117046356201172, "global_step": 405369, "epoch": 2412} {"train_loss": -10.96308708190918, "global_step": 405370, "epoch": 2412} {"train_loss": -12.195514678955078, "global_step": 405371, "epoch": 2412} {"train_loss": -11.136747360229492, "global_step": 405372, "epoch": 2412} {"train_loss": -11.932511329650879, "global_step": 405373, "epoch": 2412} {"train_loss": -11.955193519592285, "global_step": 405374, "epoch": 2412} {"train_loss": -11.734842300415039, "global_step": 405375, "epoch": 2412} {"train_loss": -12.166044235229492, "global_step": 405376, "epoch": 2412} {"train_loss": -11.701737403869629, "global_step": 405377, "epoch": 2412} {"train_loss": -11.823986053466797, "global_step": 405378, "epoch": 2412} {"train_loss": -12.017265319824219, "global_step": 405379, "epoch": 2412} {"train_loss": -11.988859176635742, "global_step": 405380, "epoch": 2412} {"train_loss": -12.222872734069824, "global_step": 405381, "epoch": 2412} {"train_loss": -12.27471923828125, "global_step": 405382, "epoch": 2412} {"train_loss": -11.969797083309718, "global_step": 405383, "epoch": 2412, "val_loss": 301213.4375} {"train_loss": -12.351177215576172, "global_step": 405384, "epoch": 2413} {"train_loss": -12.133235931396484, "global_step": 405385, "epoch": 2413} {"train_loss": -12.026079177856445, "global_step": 405386, "epoch": 2413} {"train_loss": -12.267988204956055, "global_step": 405387, "epoch": 2413} {"train_loss": -12.035033226013184, "global_step": 405388, "epoch": 2413} {"train_loss": -12.380743026733398, "global_step": 405389, "epoch": 2413} {"train_loss": -12.11252212524414, "global_step": 405390, "epoch": 2413} {"train_loss": -12.324653625488281, "global_step": 405391, "epoch": 2413} {"train_loss": -12.422823905944824, "global_step": 405392, "epoch": 2413} {"train_loss": -12.19137954711914, "global_step": 405393, "epoch": 2413} {"train_loss": -12.45761489868164, "global_step": 405394, "epoch": 2413} {"train_loss": -12.539249420166016, "global_step": 405395, "epoch": 2413} {"train_loss": -12.295021057128906, "global_step": 405396, "epoch": 2413} {"train_loss": -12.639148712158203, "global_step": 405397, "epoch": 2413} {"train_loss": -12.163253784179688, "global_step": 405398, "epoch": 2413} {"train_loss": -12.388973236083984, "global_step": 405399, "epoch": 2413} {"train_loss": -12.03742790222168, "global_step": 405400, "epoch": 2413} {"train_loss": -12.403992652893066, "global_step": 405401, "epoch": 2413} {"train_loss": -12.395389556884766, "global_step": 405402, "epoch": 2413} {"train_loss": -12.55244255065918, "global_step": 405403, "epoch": 2413} {"train_loss": -12.489227294921875, "global_step": 405404, "epoch": 2413} {"train_loss": -12.352031707763672, "global_step": 405405, "epoch": 2413} {"train_loss": -12.315210342407227, "global_step": 405406, "epoch": 2413} {"train_loss": -12.314430236816406, "global_step": 405407, "epoch": 2413} {"train_loss": -11.975330352783203, "global_step": 405408, "epoch": 2413} {"train_loss": -12.108280181884766, "global_step": 405409, "epoch": 2413} {"train_loss": -12.354326248168945, "global_step": 405410, "epoch": 2413} {"train_loss": -12.157629013061523, "global_step": 405411, "epoch": 2413} {"train_loss": -12.477265357971191, "global_step": 405412, "epoch": 2413} {"train_loss": -12.1145658493042, "global_step": 405413, "epoch": 2413} {"train_loss": -12.175500869750977, "global_step": 405414, "epoch": 2413} {"train_loss": -12.090898513793945, "global_step": 405415, "epoch": 2413} {"train_loss": -12.26021957397461, "global_step": 405416, "epoch": 2413} {"train_loss": -12.087165832519531, "global_step": 405417, "epoch": 2413} {"train_loss": -12.213020324707031, "global_step": 405418, "epoch": 2413} {"train_loss": -11.978126525878906, "global_step": 405419, "epoch": 2413} {"train_loss": -12.122142791748047, "global_step": 405420, "epoch": 2413} {"train_loss": -12.469034194946289, "global_step": 405421, "epoch": 2413} {"train_loss": -12.182316780090332, "global_step": 405422, "epoch": 2413} {"train_loss": -12.371110916137695, "global_step": 405423, "epoch": 2413} {"train_loss": -12.07125186920166, "global_step": 405424, "epoch": 2413} {"train_loss": -11.890283584594727, "global_step": 405425, "epoch": 2413} {"train_loss": -12.468953132629395, "global_step": 405426, "epoch": 2413} {"train_loss": -12.132266998291016, "global_step": 405427, "epoch": 2413} {"train_loss": -12.527785301208496, "global_step": 405428, "epoch": 2413} {"train_loss": -12.205184936523438, "global_step": 405429, "epoch": 2413} {"train_loss": -12.177906036376953, "global_step": 405430, "epoch": 2413} {"train_loss": -12.294173240661621, "global_step": 405431, "epoch": 2413} {"train_loss": -12.544767379760742, "global_step": 405432, "epoch": 2413} {"train_loss": -12.253177642822266, "global_step": 405433, "epoch": 2413} {"train_loss": -12.252962112426758, "global_step": 405434, "epoch": 2413} {"train_loss": -12.38765811920166, "global_step": 405435, "epoch": 2413} {"train_loss": -12.540454864501953, "global_step": 405436, "epoch": 2413} {"train_loss": -12.559502601623535, "global_step": 405437, "epoch": 2413} {"train_loss": -12.513958930969238, "global_step": 405438, "epoch": 2413} {"train_loss": -12.599396705627441, "global_step": 405439, "epoch": 2413} {"train_loss": -12.322446823120117, "global_step": 405440, "epoch": 2413} {"train_loss": -12.566072463989258, "global_step": 405441, "epoch": 2413} {"train_loss": -12.647113800048828, "global_step": 405442, "epoch": 2413} {"train_loss": -12.683025360107422, "global_step": 405443, "epoch": 2413} {"train_loss": -12.674818992614746, "global_step": 405444, "epoch": 2413} {"train_loss": -12.595016479492188, "global_step": 405445, "epoch": 2413} {"train_loss": -12.59119987487793, "global_step": 405446, "epoch": 2413} {"train_loss": -12.820789337158203, "global_step": 405447, "epoch": 2413} {"train_loss": -12.673757553100586, "global_step": 405448, "epoch": 2413} {"train_loss": -12.677925109863281, "global_step": 405449, "epoch": 2413} {"train_loss": -12.710769653320312, "global_step": 405450, "epoch": 2413} {"train_loss": -12.775203704833984, "global_step": 405451, "epoch": 2413} {"train_loss": -12.554277420043945, "global_step": 405452, "epoch": 2413} {"train_loss": -12.623455047607422, "global_step": 405453, "epoch": 2413} {"train_loss": -12.52916431427002, "global_step": 405454, "epoch": 2413} {"train_loss": -12.690049171447754, "global_step": 405455, "epoch": 2413} {"train_loss": -12.741621017456055, "global_step": 405456, "epoch": 2413} {"train_loss": -12.232895851135254, "global_step": 405457, "epoch": 2413} {"train_loss": -12.043234825134277, "global_step": 405458, "epoch": 2413} {"train_loss": -12.565286636352539, "global_step": 405459, "epoch": 2413} {"train_loss": -12.410961151123047, "global_step": 405460, "epoch": 2413} {"train_loss": -12.219942092895508, "global_step": 405461, "epoch": 2413} {"train_loss": -12.772464752197266, "global_step": 405462, "epoch": 2413} {"train_loss": -12.22812557220459, "global_step": 405463, "epoch": 2413} {"train_loss": -11.025045394897461, "global_step": 405464, "epoch": 2413} {"train_loss": -12.376129150390625, "global_step": 405465, "epoch": 2413} {"train_loss": -11.715822219848633, "global_step": 405466, "epoch": 2413} {"train_loss": -12.01118278503418, "global_step": 405467, "epoch": 2413} {"train_loss": -11.7754487991333, "global_step": 405468, "epoch": 2413} {"train_loss": -12.59682846069336, "global_step": 405469, "epoch": 2413} {"train_loss": -12.242788314819336, "global_step": 405470, "epoch": 2413} {"train_loss": -12.356142044067383, "global_step": 405471, "epoch": 2413} {"train_loss": -12.117161750793457, "global_step": 405472, "epoch": 2413} {"train_loss": -12.159585952758789, "global_step": 405473, "epoch": 2413} {"train_loss": -11.867948532104492, "global_step": 405474, "epoch": 2413} {"train_loss": -12.271430015563965, "global_step": 405475, "epoch": 2413} {"train_loss": -11.787851333618164, "global_step": 405476, "epoch": 2413} {"train_loss": -12.259814262390137, "global_step": 405477, "epoch": 2413} {"train_loss": -12.024704933166504, "global_step": 405478, "epoch": 2413} {"train_loss": -11.504964828491211, "global_step": 405479, "epoch": 2413} {"train_loss": -11.58763599395752, "global_step": 405480, "epoch": 2413} {"train_loss": -12.063562393188477, "global_step": 405481, "epoch": 2413} {"train_loss": -11.552068710327148, "global_step": 405482, "epoch": 2413} {"train_loss": -11.415298461914062, "global_step": 405483, "epoch": 2413} {"train_loss": -10.845945358276367, "global_step": 405484, "epoch": 2413} {"train_loss": -11.936653137207031, "global_step": 405485, "epoch": 2413} {"train_loss": -10.777427673339844, "global_step": 405486, "epoch": 2413} {"train_loss": -11.428166389465332, "global_step": 405487, "epoch": 2413} {"train_loss": -12.132011413574219, "global_step": 405488, "epoch": 2413} {"train_loss": -10.651183128356934, "global_step": 405489, "epoch": 2413} {"train_loss": -12.049938201904297, "global_step": 405490, "epoch": 2413} {"train_loss": -10.901652336120605, "global_step": 405491, "epoch": 2413} {"train_loss": -11.93265151977539, "global_step": 405492, "epoch": 2413} {"train_loss": -10.987349510192871, "global_step": 405493, "epoch": 2413} {"train_loss": -11.95881462097168, "global_step": 405494, "epoch": 2413} {"train_loss": -11.629390716552734, "global_step": 405495, "epoch": 2413} {"train_loss": -12.017587661743164, "global_step": 405496, "epoch": 2413} {"train_loss": -10.980396270751953, "global_step": 405497, "epoch": 2413} {"train_loss": -12.025609970092773, "global_step": 405498, "epoch": 2413} {"train_loss": -11.007669448852539, "global_step": 405499, "epoch": 2413} {"train_loss": -11.54835319519043, "global_step": 405500, "epoch": 2413} {"train_loss": -11.376291275024414, "global_step": 405501, "epoch": 2413} {"train_loss": -11.427297592163086, "global_step": 405502, "epoch": 2413} {"train_loss": -12.135305404663086, "global_step": 405503, "epoch": 2413} {"train_loss": -11.548635482788086, "global_step": 405504, "epoch": 2413} {"train_loss": -12.017427444458008, "global_step": 405505, "epoch": 2413} {"train_loss": -11.798478126525879, "global_step": 405506, "epoch": 2413} {"train_loss": -11.697604179382324, "global_step": 405507, "epoch": 2413} {"train_loss": -11.869405746459961, "global_step": 405508, "epoch": 2413} {"train_loss": -11.95222282409668, "global_step": 405509, "epoch": 2413} {"train_loss": -12.34996223449707, "global_step": 405510, "epoch": 2413} {"train_loss": -12.039533615112305, "global_step": 405511, "epoch": 2413} {"train_loss": -12.071979522705078, "global_step": 405512, "epoch": 2413} {"train_loss": -12.411870956420898, "global_step": 405513, "epoch": 2413} {"train_loss": -12.177881240844727, "global_step": 405514, "epoch": 2413} {"train_loss": -12.473682403564453, "global_step": 405515, "epoch": 2413} {"train_loss": -12.130691528320312, "global_step": 405516, "epoch": 2413} {"train_loss": -12.355707168579102, "global_step": 405517, "epoch": 2413} {"train_loss": -12.431459426879883, "global_step": 405518, "epoch": 2413} {"train_loss": -12.595406532287598, "global_step": 405519, "epoch": 2413} {"train_loss": -12.248648643493652, "global_step": 405520, "epoch": 2413} {"train_loss": -12.064286231994629, "global_step": 405521, "epoch": 2413} {"train_loss": -11.982366561889648, "global_step": 405522, "epoch": 2413} {"train_loss": -12.349540710449219, "global_step": 405523, "epoch": 2413} {"train_loss": -12.043673515319824, "global_step": 405524, "epoch": 2413} {"train_loss": -12.277963638305664, "global_step": 405525, "epoch": 2413} {"train_loss": -12.546297073364258, "global_step": 405526, "epoch": 2413} {"train_loss": -12.441818237304688, "global_step": 405527, "epoch": 2413} {"train_loss": -12.313498497009277, "global_step": 405528, "epoch": 2413} {"train_loss": -12.101646423339844, "global_step": 405529, "epoch": 2413} {"train_loss": -12.612943649291992, "global_step": 405530, "epoch": 2413} {"train_loss": -12.302059173583984, "global_step": 405531, "epoch": 2413} {"train_loss": -12.42835807800293, "global_step": 405532, "epoch": 2413} {"train_loss": -12.49230670928955, "global_step": 405533, "epoch": 2413} {"train_loss": -12.084705352783203, "global_step": 405534, "epoch": 2413} {"train_loss": -12.184408187866211, "global_step": 405535, "epoch": 2413} {"train_loss": -12.243402481079102, "global_step": 405536, "epoch": 2413} {"train_loss": -12.146417617797852, "global_step": 405537, "epoch": 2413} {"train_loss": -12.08889389038086, "global_step": 405538, "epoch": 2413} {"train_loss": -12.521892547607422, "global_step": 405539, "epoch": 2413} {"train_loss": -11.928750991821289, "global_step": 405540, "epoch": 2413} {"train_loss": -12.475232124328613, "global_step": 405541, "epoch": 2413} {"train_loss": -12.183775901794434, "global_step": 405542, "epoch": 2413} {"train_loss": -12.463350296020508, "global_step": 405543, "epoch": 2413} {"train_loss": -12.366249084472656, "global_step": 405544, "epoch": 2413} {"train_loss": -12.26889419555664, "global_step": 405545, "epoch": 2413} {"train_loss": -11.807123184204102, "global_step": 405546, "epoch": 2413} {"train_loss": -12.69930648803711, "global_step": 405547, "epoch": 2413} {"train_loss": -12.168949127197266, "global_step": 405548, "epoch": 2413} {"train_loss": -12.638731002807617, "global_step": 405549, "epoch": 2413} {"train_loss": -12.338251113891602, "global_step": 405550, "epoch": 2413} {"train_loss": -12.172786848885673, "global_step": 405551, "epoch": 2413, "val_loss": 301141.5} {"train_loss": -12.372426986694336, "global_step": 405552, "epoch": 2414} {"train_loss": -12.59280776977539, "global_step": 405553, "epoch": 2414} {"train_loss": -12.610576629638672, "global_step": 405554, "epoch": 2414} {"train_loss": -12.632551193237305, "global_step": 405555, "epoch": 2414} {"train_loss": -12.621047973632812, "global_step": 405556, "epoch": 2414} {"train_loss": -12.518325805664062, "global_step": 405557, "epoch": 2414} {"train_loss": -12.299246788024902, "global_step": 405558, "epoch": 2414} {"train_loss": -12.557124137878418, "global_step": 405559, "epoch": 2414} {"train_loss": -12.690876007080078, "global_step": 405560, "epoch": 2414} {"train_loss": -12.734859466552734, "global_step": 405561, "epoch": 2414} {"train_loss": -12.500191688537598, "global_step": 405562, "epoch": 2414} {"train_loss": -12.696338653564453, "global_step": 405563, "epoch": 2414} {"train_loss": -12.409473419189453, "global_step": 405564, "epoch": 2414} {"train_loss": -12.562736511230469, "global_step": 405565, "epoch": 2414} {"train_loss": -12.669371604919434, "global_step": 405566, "epoch": 2414} {"train_loss": -11.944002151489258, "global_step": 405567, "epoch": 2414} {"train_loss": -12.669748306274414, "global_step": 405568, "epoch": 2414} {"train_loss": -11.786952018737793, "global_step": 405569, "epoch": 2414} {"train_loss": -12.089204788208008, "global_step": 405570, "epoch": 2414} {"train_loss": -12.592304229736328, "global_step": 405571, "epoch": 2414} {"train_loss": -12.250303268432617, "global_step": 405572, "epoch": 2414} {"train_loss": -12.040512084960938, "global_step": 405573, "epoch": 2414} {"train_loss": -12.310293197631836, "global_step": 405574, "epoch": 2414} {"train_loss": -12.113424301147461, "global_step": 405575, "epoch": 2414} {"train_loss": -11.542552947998047, "global_step": 405576, "epoch": 2414} {"train_loss": -10.535146713256836, "global_step": 405577, "epoch": 2414} {"train_loss": -12.315814018249512, "global_step": 405578, "epoch": 2414} {"train_loss": -10.667400360107422, "global_step": 405579, "epoch": 2414} {"train_loss": -11.364945411682129, "global_step": 405580, "epoch": 2414} {"train_loss": -12.023614883422852, "global_step": 405581, "epoch": 2414} {"train_loss": -11.493463516235352, "global_step": 405582, "epoch": 2414} {"train_loss": -12.062287330627441, "global_step": 405583, "epoch": 2414} {"train_loss": -11.847923278808594, "global_step": 405584, "epoch": 2414} {"train_loss": -12.337529182434082, "global_step": 405585, "epoch": 2414} {"train_loss": -11.415022850036621, "global_step": 405586, "epoch": 2414} {"train_loss": -11.78205394744873, "global_step": 405587, "epoch": 2414} {"train_loss": -12.015045166015625, "global_step": 405588, "epoch": 2414} {"train_loss": -10.966131210327148, "global_step": 405589, "epoch": 2414} {"train_loss": -12.00081729888916, "global_step": 405590, "epoch": 2414} {"train_loss": -11.58639907836914, "global_step": 405591, "epoch": 2414} {"train_loss": -11.837875366210938, "global_step": 405592, "epoch": 2414} {"train_loss": -12.142468452453613, "global_step": 405593, "epoch": 2414} {"train_loss": -11.570785522460938, "global_step": 405594, "epoch": 2414} {"train_loss": -11.768997192382812, "global_step": 405595, "epoch": 2414} {"train_loss": -11.851968765258789, "global_step": 405596, "epoch": 2414} {"train_loss": -11.85494613647461, "global_step": 405597, "epoch": 2414} {"train_loss": -12.142267227172852, "global_step": 405598, "epoch": 2414} {"train_loss": -11.35394287109375, "global_step": 405599, "epoch": 2414} {"train_loss": -12.000497817993164, "global_step": 405600, "epoch": 2414} {"train_loss": -12.276223182678223, "global_step": 405601, "epoch": 2414} {"train_loss": -11.389545440673828, "global_step": 405602, "epoch": 2414} {"train_loss": -12.078113555908203, "global_step": 405603, "epoch": 2414} {"train_loss": -11.914243698120117, "global_step": 405604, "epoch": 2414} {"train_loss": -12.019309997558594, "global_step": 405605, "epoch": 2414} {"train_loss": -12.29310417175293, "global_step": 405606, "epoch": 2414} {"train_loss": -11.734977722167969, "global_step": 405607, "epoch": 2414} {"train_loss": -11.960801124572754, "global_step": 405608, "epoch": 2414} {"train_loss": -12.318395614624023, "global_step": 405609, "epoch": 2414} {"train_loss": -11.899968147277832, "global_step": 405610, "epoch": 2414} {"train_loss": -12.398012161254883, "global_step": 405611, "epoch": 2414} {"train_loss": -11.181344985961914, "global_step": 405612, "epoch": 2414} {"train_loss": -12.45572566986084, "global_step": 405613, "epoch": 2414} {"train_loss": -11.794651985168457, "global_step": 405614, "epoch": 2414} {"train_loss": -12.293914794921875, "global_step": 405615, "epoch": 2414} {"train_loss": -12.218204498291016, "global_step": 405616, "epoch": 2414} {"train_loss": -12.425932884216309, "global_step": 405617, "epoch": 2414} {"train_loss": -12.53851318359375, "global_step": 405618, "epoch": 2414} {"train_loss": -12.31277847290039, "global_step": 405619, "epoch": 2414} {"train_loss": -12.462532043457031, "global_step": 405620, "epoch": 2414} {"train_loss": -12.391670227050781, "global_step": 405621, "epoch": 2414} {"train_loss": -12.455209732055664, "global_step": 405622, "epoch": 2414} {"train_loss": -12.6373929977417, "global_step": 405623, "epoch": 2414} {"train_loss": -12.345495223999023, "global_step": 405624, "epoch": 2414} {"train_loss": -12.381221771240234, "global_step": 405625, "epoch": 2414} {"train_loss": -12.344961166381836, "global_step": 405626, "epoch": 2414} {"train_loss": -12.53868579864502, "global_step": 405627, "epoch": 2414} {"train_loss": -12.260501861572266, "global_step": 405628, "epoch": 2414} {"train_loss": -11.886524200439453, "global_step": 405629, "epoch": 2414} {"train_loss": -12.319934844970703, "global_step": 405630, "epoch": 2414} {"train_loss": -12.087909698486328, "global_step": 405631, "epoch": 2414} {"train_loss": -12.376129150390625, "global_step": 405632, "epoch": 2414} {"train_loss": -12.39535140991211, "global_step": 405633, "epoch": 2414} {"train_loss": -12.575292587280273, "global_step": 405634, "epoch": 2414} {"train_loss": -11.815666198730469, "global_step": 405635, "epoch": 2414} {"train_loss": -12.641376495361328, "global_step": 405636, "epoch": 2414} {"train_loss": -12.47800064086914, "global_step": 405637, "epoch": 2414} {"train_loss": -12.452275276184082, "global_step": 405638, "epoch": 2414} {"train_loss": -12.313361167907715, "global_step": 405639, "epoch": 2414} {"train_loss": -12.487129211425781, "global_step": 405640, "epoch": 2414} {"train_loss": -12.084010124206543, "global_step": 405641, "epoch": 2414} {"train_loss": -12.023405075073242, "global_step": 405642, "epoch": 2414} {"train_loss": -12.384321212768555, "global_step": 405643, "epoch": 2414} {"train_loss": -11.875066757202148, "global_step": 405644, "epoch": 2414} {"train_loss": -12.529793739318848, "global_step": 405645, "epoch": 2414} {"train_loss": -11.975380897521973, "global_step": 405646, "epoch": 2414} {"train_loss": -12.094099044799805, "global_step": 405647, "epoch": 2414} {"train_loss": -12.417257308959961, "global_step": 405648, "epoch": 2414} {"train_loss": -11.935613632202148, "global_step": 405649, "epoch": 2414} {"train_loss": -12.051271438598633, "global_step": 405650, "epoch": 2414} {"train_loss": -12.249605178833008, "global_step": 405651, "epoch": 2414} {"train_loss": -12.014927864074707, "global_step": 405652, "epoch": 2414} {"train_loss": -12.625173568725586, "global_step": 405653, "epoch": 2414} {"train_loss": -12.22323226928711, "global_step": 405654, "epoch": 2414} {"train_loss": -11.922842979431152, "global_step": 405655, "epoch": 2414} {"train_loss": -12.292376518249512, "global_step": 405656, "epoch": 2414} {"train_loss": -11.937840461730957, "global_step": 405657, "epoch": 2414} {"train_loss": -12.08175277709961, "global_step": 405658, "epoch": 2414} {"train_loss": -12.375385284423828, "global_step": 405659, "epoch": 2414} {"train_loss": -12.145870208740234, "global_step": 405660, "epoch": 2414} {"train_loss": -12.178397178649902, "global_step": 405661, "epoch": 2414} {"train_loss": -12.078329086303711, "global_step": 405662, "epoch": 2414} {"train_loss": -11.752817153930664, "global_step": 405663, "epoch": 2414} {"train_loss": -11.359882354736328, "global_step": 405664, "epoch": 2414} {"train_loss": -12.097053527832031, "global_step": 405665, "epoch": 2414} {"train_loss": -11.948898315429688, "global_step": 405666, "epoch": 2414} {"train_loss": -11.926366806030273, "global_step": 405667, "epoch": 2414} {"train_loss": -11.718180656433105, "global_step": 405668, "epoch": 2414} {"train_loss": -11.790082931518555, "global_step": 405669, "epoch": 2414} {"train_loss": -11.637029647827148, "global_step": 405670, "epoch": 2414} {"train_loss": -11.471466064453125, "global_step": 405671, "epoch": 2414} {"train_loss": -11.292546272277832, "global_step": 405672, "epoch": 2414} {"train_loss": -12.109978675842285, "global_step": 405673, "epoch": 2414} {"train_loss": -10.690670013427734, "global_step": 405674, "epoch": 2414} {"train_loss": -12.607343673706055, "global_step": 405675, "epoch": 2414} {"train_loss": -11.380243301391602, "global_step": 405676, "epoch": 2414} {"train_loss": -11.848848342895508, "global_step": 405677, "epoch": 2414} {"train_loss": -11.086979866027832, "global_step": 405678, "epoch": 2414} {"train_loss": -11.981460571289062, "global_step": 405679, "epoch": 2414} {"train_loss": -11.554462432861328, "global_step": 405680, "epoch": 2414} {"train_loss": -11.835195541381836, "global_step": 405681, "epoch": 2414} {"train_loss": -11.682930946350098, "global_step": 405682, "epoch": 2414} {"train_loss": -11.733991622924805, "global_step": 405683, "epoch": 2414} {"train_loss": -11.931415557861328, "global_step": 405684, "epoch": 2414} {"train_loss": -11.192281723022461, "global_step": 405685, "epoch": 2414} {"train_loss": -12.136920928955078, "global_step": 405686, "epoch": 2414} {"train_loss": -11.731932640075684, "global_step": 405687, "epoch": 2414} {"train_loss": -12.091100692749023, "global_step": 405688, "epoch": 2414} {"train_loss": -11.673835754394531, "global_step": 405689, "epoch": 2414} {"train_loss": -12.324905395507812, "global_step": 405690, "epoch": 2414} {"train_loss": -11.462766647338867, "global_step": 405691, "epoch": 2414} {"train_loss": -11.939536094665527, "global_step": 405692, "epoch": 2414} {"train_loss": -11.135683059692383, "global_step": 405693, "epoch": 2414} {"train_loss": -11.956092834472656, "global_step": 405694, "epoch": 2414} {"train_loss": -11.330451011657715, "global_step": 405695, "epoch": 2414} {"train_loss": -11.383485794067383, "global_step": 405696, "epoch": 2414} {"train_loss": -11.4744234085083, "global_step": 405697, "epoch": 2414} {"train_loss": -11.703880310058594, "global_step": 405698, "epoch": 2414} {"train_loss": -10.818613052368164, "global_step": 405699, "epoch": 2414} {"train_loss": -12.381108283996582, "global_step": 405700, "epoch": 2414} {"train_loss": -11.03996467590332, "global_step": 405701, "epoch": 2414} {"train_loss": -12.038463592529297, "global_step": 405702, "epoch": 2414} {"train_loss": -11.355820655822754, "global_step": 405703, "epoch": 2414} {"train_loss": -12.212318420410156, "global_step": 405704, "epoch": 2414} {"train_loss": -11.378341674804688, "global_step": 405705, "epoch": 2414} {"train_loss": -12.135496139526367, "global_step": 405706, "epoch": 2414} {"train_loss": -11.052803039550781, "global_step": 405707, "epoch": 2414} {"train_loss": -12.334528923034668, "global_step": 405708, "epoch": 2414} {"train_loss": -11.370637893676758, "global_step": 405709, "epoch": 2414} {"train_loss": -12.273737907409668, "global_step": 405710, "epoch": 2414} {"train_loss": -11.25649642944336, "global_step": 405711, "epoch": 2414} {"train_loss": -12.092514991760254, "global_step": 405712, "epoch": 2414} {"train_loss": -11.269998550415039, "global_step": 405713, "epoch": 2414} {"train_loss": -12.251670837402344, "global_step": 405714, "epoch": 2414} {"train_loss": -11.417488098144531, "global_step": 405715, "epoch": 2414} {"train_loss": -12.15902328491211, "global_step": 405716, "epoch": 2414} {"train_loss": -11.65298080444336, "global_step": 405717, "epoch": 2414} {"train_loss": -12.420909881591797, "global_step": 405718, "epoch": 2414} {"train_loss": -11.9949612844558, "global_step": 405719, "epoch": 2414, "val_loss": 303660.3125} {"train_loss": -12.428167343139648, "global_step": 405720, "epoch": 2415} {"train_loss": -11.96977424621582, "global_step": 405721, "epoch": 2415} {"train_loss": -12.532833099365234, "global_step": 405722, "epoch": 2415} {"train_loss": -12.294509887695312, "global_step": 405723, "epoch": 2415} {"train_loss": -12.54916763305664, "global_step": 405724, "epoch": 2415} {"train_loss": -12.303884506225586, "global_step": 405725, "epoch": 2415} {"train_loss": -12.606475830078125, "global_step": 405726, "epoch": 2415} {"train_loss": -12.022502899169922, "global_step": 405727, "epoch": 2415} {"train_loss": -12.369743347167969, "global_step": 405728, "epoch": 2415} {"train_loss": -12.607645034790039, "global_step": 405729, "epoch": 2415} {"train_loss": -12.442075729370117, "global_step": 405730, "epoch": 2415} {"train_loss": -12.61551284790039, "global_step": 405731, "epoch": 2415} {"train_loss": -12.2210054397583, "global_step": 405732, "epoch": 2415} {"train_loss": -12.381180763244629, "global_step": 405733, "epoch": 2415} {"train_loss": -12.353599548339844, "global_step": 405734, "epoch": 2415} {"train_loss": -12.475662231445312, "global_step": 405735, "epoch": 2415} {"train_loss": -12.528264999389648, "global_step": 405736, "epoch": 2415} {"train_loss": -12.37017822265625, "global_step": 405737, "epoch": 2415} {"train_loss": -12.417373657226562, "global_step": 405738, "epoch": 2415} {"train_loss": -12.391973495483398, "global_step": 405739, "epoch": 2415} {"train_loss": -12.311058044433594, "global_step": 405740, "epoch": 2415} {"train_loss": -12.470855712890625, "global_step": 405741, "epoch": 2415} {"train_loss": -12.379592895507812, "global_step": 405742, "epoch": 2415} {"train_loss": -12.472748756408691, "global_step": 405743, "epoch": 2415} {"train_loss": -12.538496017456055, "global_step": 405744, "epoch": 2415} {"train_loss": -12.393024444580078, "global_step": 405745, "epoch": 2415} {"train_loss": -12.596480369567871, "global_step": 405746, "epoch": 2415} {"train_loss": -12.592596054077148, "global_step": 405747, "epoch": 2415} {"train_loss": -12.653477668762207, "global_step": 405748, "epoch": 2415} {"train_loss": -12.328482627868652, "global_step": 405749, "epoch": 2415} {"train_loss": -12.561697006225586, "global_step": 405750, "epoch": 2415} {"train_loss": -12.7116060256958, "global_step": 405751, "epoch": 2415} {"train_loss": -12.540802001953125, "global_step": 405752, "epoch": 2415} {"train_loss": -12.68990707397461, "global_step": 405753, "epoch": 2415} {"train_loss": -12.680305480957031, "global_step": 405754, "epoch": 2415} {"train_loss": -12.577861785888672, "global_step": 405755, "epoch": 2415} {"train_loss": -12.803813934326172, "global_step": 405756, "epoch": 2415} {"train_loss": -12.460175514221191, "global_step": 405757, "epoch": 2415} {"train_loss": -12.331323623657227, "global_step": 405758, "epoch": 2415} {"train_loss": -12.33186149597168, "global_step": 405759, "epoch": 2415} {"train_loss": -12.675745964050293, "global_step": 405760, "epoch": 2415} {"train_loss": -12.687724113464355, "global_step": 405761, "epoch": 2415} {"train_loss": -12.307788848876953, "global_step": 405762, "epoch": 2415} {"train_loss": -11.566728591918945, "global_step": 405763, "epoch": 2415} {"train_loss": -11.242968559265137, "global_step": 405764, "epoch": 2415} {"train_loss": -12.103574752807617, "global_step": 405765, "epoch": 2415} {"train_loss": -9.049320220947266, "global_step": 405766, "epoch": 2415} {"train_loss": -8.411383628845215, "global_step": 405767, "epoch": 2415} {"train_loss": -10.162668228149414, "global_step": 405768, "epoch": 2415} {"train_loss": -9.597372055053711, "global_step": 405769, "epoch": 2415} {"train_loss": -10.402748107910156, "global_step": 405770, "epoch": 2415} {"train_loss": -10.220603942871094, "global_step": 405771, "epoch": 2415} {"train_loss": -10.736648559570312, "global_step": 405772, "epoch": 2415} {"train_loss": -12.0853910446167, "global_step": 405773, "epoch": 2415} {"train_loss": -11.819257736206055, "global_step": 405774, "epoch": 2415} {"train_loss": -11.053939819335938, "global_step": 405775, "epoch": 2415} {"train_loss": -11.05081558227539, "global_step": 405776, "epoch": 2415} {"train_loss": -10.73713207244873, "global_step": 405777, "epoch": 2415} {"train_loss": -11.52216911315918, "global_step": 405778, "epoch": 2415} {"train_loss": -10.42286205291748, "global_step": 405779, "epoch": 2415} {"train_loss": -11.30067253112793, "global_step": 405780, "epoch": 2415} {"train_loss": -10.63664436340332, "global_step": 405781, "epoch": 2415} {"train_loss": -11.586024284362793, "global_step": 405782, "epoch": 2415} {"train_loss": -10.98143196105957, "global_step": 405783, "epoch": 2415} {"train_loss": -11.19039535522461, "global_step": 405784, "epoch": 2415} {"train_loss": -12.044269561767578, "global_step": 405785, "epoch": 2415} {"train_loss": -10.802696228027344, "global_step": 405786, "epoch": 2415} {"train_loss": -12.334513664245605, "global_step": 405787, "epoch": 2415} {"train_loss": -11.60879898071289, "global_step": 405788, "epoch": 2415} {"train_loss": -12.091691970825195, "global_step": 405789, "epoch": 2415} {"train_loss": -11.493342399597168, "global_step": 405790, "epoch": 2415} {"train_loss": -12.010246276855469, "global_step": 405791, "epoch": 2415} {"train_loss": -12.125375747680664, "global_step": 405792, "epoch": 2415} {"train_loss": -11.901580810546875, "global_step": 405793, "epoch": 2415} {"train_loss": -12.18597412109375, "global_step": 405794, "epoch": 2415} {"train_loss": -11.768736839294434, "global_step": 405795, "epoch": 2415} {"train_loss": -12.067201614379883, "global_step": 405796, "epoch": 2415} {"train_loss": -11.601948738098145, "global_step": 405797, "epoch": 2415} {"train_loss": -11.465349197387695, "global_step": 405798, "epoch": 2415} {"train_loss": -12.182619094848633, "global_step": 405799, "epoch": 2415} {"train_loss": -11.602001190185547, "global_step": 405800, "epoch": 2415} {"train_loss": -12.381689071655273, "global_step": 405801, "epoch": 2415} {"train_loss": -10.59010124206543, "global_step": 405802, "epoch": 2415} {"train_loss": -11.555695533752441, "global_step": 405803, "epoch": 2415} {"train_loss": -11.546545028686523, "global_step": 405804, "epoch": 2415} {"train_loss": -10.018003463745117, "global_step": 405805, "epoch": 2415} {"train_loss": -11.999837875366211, "global_step": 405806, "epoch": 2415} {"train_loss": -10.880992889404297, "global_step": 405807, "epoch": 2415} {"train_loss": -11.627813339233398, "global_step": 405808, "epoch": 2415} {"train_loss": -11.20688533782959, "global_step": 405809, "epoch": 2415} {"train_loss": -10.77797794342041, "global_step": 405810, "epoch": 2415} {"train_loss": -11.220285415649414, "global_step": 405811, "epoch": 2415} {"train_loss": -11.477761268615723, "global_step": 405812, "epoch": 2415} {"train_loss": -11.1704740524292, "global_step": 405813, "epoch": 2415} {"train_loss": -11.325468063354492, "global_step": 405814, "epoch": 2415} {"train_loss": -11.548980712890625, "global_step": 405815, "epoch": 2415} {"train_loss": -12.015955924987793, "global_step": 405816, "epoch": 2415} {"train_loss": -12.142154693603516, "global_step": 405817, "epoch": 2415} {"train_loss": -11.568543434143066, "global_step": 405818, "epoch": 2415} {"train_loss": -11.961851119995117, "global_step": 405819, "epoch": 2415} {"train_loss": -11.854597091674805, "global_step": 405820, "epoch": 2415} {"train_loss": -12.166297912597656, "global_step": 405821, "epoch": 2415} {"train_loss": -11.883939743041992, "global_step": 405822, "epoch": 2415} {"train_loss": -12.103967666625977, "global_step": 405823, "epoch": 2415} {"train_loss": -12.25008773803711, "global_step": 405824, "epoch": 2415} {"train_loss": -12.025348663330078, "global_step": 405825, "epoch": 2415} {"train_loss": -12.335027694702148, "global_step": 405826, "epoch": 2415} {"train_loss": -11.92951774597168, "global_step": 405827, "epoch": 2415} {"train_loss": -12.31485366821289, "global_step": 405828, "epoch": 2415} {"train_loss": -12.020227432250977, "global_step": 405829, "epoch": 2415} {"train_loss": -12.394453048706055, "global_step": 405830, "epoch": 2415} {"train_loss": -12.2708158493042, "global_step": 405831, "epoch": 2415} {"train_loss": -12.29718017578125, "global_step": 405832, "epoch": 2415} {"train_loss": -12.418448448181152, "global_step": 405833, "epoch": 2415} {"train_loss": -12.332578659057617, "global_step": 405834, "epoch": 2415} {"train_loss": -12.470998764038086, "global_step": 405835, "epoch": 2415} {"train_loss": -12.411252975463867, "global_step": 405836, "epoch": 2415} {"train_loss": -12.457316398620605, "global_step": 405837, "epoch": 2415} {"train_loss": -12.429779052734375, "global_step": 405838, "epoch": 2415} {"train_loss": -12.12416934967041, "global_step": 405839, "epoch": 2415} {"train_loss": -12.370777130126953, "global_step": 405840, "epoch": 2415} {"train_loss": -12.372739791870117, "global_step": 405841, "epoch": 2415} {"train_loss": -12.60175609588623, "global_step": 405842, "epoch": 2415} {"train_loss": -12.589912414550781, "global_step": 405843, "epoch": 2415} {"train_loss": -12.323685646057129, "global_step": 405844, "epoch": 2415} {"train_loss": -12.526439666748047, "global_step": 405845, "epoch": 2415} {"train_loss": -12.408622741699219, "global_step": 405846, "epoch": 2415} {"train_loss": -12.749160766601562, "global_step": 405847, "epoch": 2415} {"train_loss": -12.43049430847168, "global_step": 405848, "epoch": 2415} {"train_loss": -12.537192344665527, "global_step": 405849, "epoch": 2415} {"train_loss": -12.482279777526855, "global_step": 405850, "epoch": 2415} {"train_loss": -12.322540283203125, "global_step": 405851, "epoch": 2415} {"train_loss": -12.686233520507812, "global_step": 405852, "epoch": 2415} {"train_loss": -12.454626083374023, "global_step": 405853, "epoch": 2415} {"train_loss": -12.30203628540039, "global_step": 405854, "epoch": 2415} {"train_loss": -12.410469055175781, "global_step": 405855, "epoch": 2415} {"train_loss": -12.51759147644043, "global_step": 405856, "epoch": 2415} {"train_loss": -12.46010684967041, "global_step": 405857, "epoch": 2415} {"train_loss": -12.611129760742188, "global_step": 405858, "epoch": 2415} {"train_loss": -12.538341522216797, "global_step": 405859, "epoch": 2415} {"train_loss": -12.502634048461914, "global_step": 405860, "epoch": 2415} {"train_loss": -12.392328262329102, "global_step": 405861, "epoch": 2415} {"train_loss": -12.568792343139648, "global_step": 405862, "epoch": 2415} {"train_loss": -12.271989822387695, "global_step": 405863, "epoch": 2415} {"train_loss": -12.501433372497559, "global_step": 405864, "epoch": 2415} {"train_loss": -12.427308082580566, "global_step": 405865, "epoch": 2415} {"train_loss": -12.396913528442383, "global_step": 405866, "epoch": 2415} {"train_loss": -12.345457077026367, "global_step": 405867, "epoch": 2415} {"train_loss": -12.638465881347656, "global_step": 405868, "epoch": 2415} {"train_loss": -12.515756607055664, "global_step": 405869, "epoch": 2415} {"train_loss": -12.414674758911133, "global_step": 405870, "epoch": 2415} {"train_loss": -12.565694808959961, "global_step": 405871, "epoch": 2415} {"train_loss": -12.373881340026855, "global_step": 405872, "epoch": 2415} {"train_loss": -12.675512313842773, "global_step": 405873, "epoch": 2415} {"train_loss": -12.473503112792969, "global_step": 405874, "epoch": 2415} {"train_loss": -12.213371276855469, "global_step": 405875, "epoch": 2415} {"train_loss": -12.565925598144531, "global_step": 405876, "epoch": 2415} {"train_loss": -12.513643264770508, "global_step": 405877, "epoch": 2415} {"train_loss": -12.844900131225586, "global_step": 405878, "epoch": 2415} {"train_loss": -12.545769691467285, "global_step": 405879, "epoch": 2415} {"train_loss": -12.755279541015625, "global_step": 405880, "epoch": 2415} {"train_loss": -12.805903434753418, "global_step": 405881, "epoch": 2415} {"train_loss": -12.659989356994629, "global_step": 405882, "epoch": 2415} {"train_loss": -12.785927772521973, "global_step": 405883, "epoch": 2415} {"train_loss": -12.791994094848633, "global_step": 405884, "epoch": 2415} {"train_loss": -12.749855995178223, "global_step": 405885, "epoch": 2415} {"train_loss": -12.814079284667969, "global_step": 405886, "epoch": 2415} {"train_loss": -12.059390964962187, "global_step": 405887, "epoch": 2415, "val_loss": 300763.875, "train_action_mse_error": 1.690124750137329} {"train_loss": -12.504841804504395, "global_step": 405888, "epoch": 2416} {"train_loss": -12.514110565185547, "global_step": 405889, "epoch": 2416} {"train_loss": -12.63701057434082, "global_step": 405890, "epoch": 2416} {"train_loss": -12.54976749420166, "global_step": 405891, "epoch": 2416} {"train_loss": -12.351840019226074, "global_step": 405892, "epoch": 2416} {"train_loss": -12.706680297851562, "global_step": 405893, "epoch": 2416} {"train_loss": -12.456817626953125, "global_step": 405894, "epoch": 2416} {"train_loss": -12.110459327697754, "global_step": 405895, "epoch": 2416} {"train_loss": -12.422122955322266, "global_step": 405896, "epoch": 2416} {"train_loss": -12.706046104431152, "global_step": 405897, "epoch": 2416} {"train_loss": -12.583267211914062, "global_step": 405898, "epoch": 2416} {"train_loss": -12.58780574798584, "global_step": 405899, "epoch": 2416} {"train_loss": -12.784613609313965, "global_step": 405900, "epoch": 2416} {"train_loss": -12.284116744995117, "global_step": 405901, "epoch": 2416} {"train_loss": -11.73867416381836, "global_step": 405902, "epoch": 2416} {"train_loss": -12.540635108947754, "global_step": 405903, "epoch": 2416} {"train_loss": -11.749361038208008, "global_step": 405904, "epoch": 2416} {"train_loss": -12.477060317993164, "global_step": 405905, "epoch": 2416} {"train_loss": -11.90188980102539, "global_step": 405906, "epoch": 2416} {"train_loss": -12.744210243225098, "global_step": 405907, "epoch": 2416} {"train_loss": -11.552802085876465, "global_step": 405908, "epoch": 2416} {"train_loss": -12.231269836425781, "global_step": 405909, "epoch": 2416} {"train_loss": -11.799385070800781, "global_step": 405910, "epoch": 2416} {"train_loss": -12.374771118164062, "global_step": 405911, "epoch": 2416} {"train_loss": -11.721656799316406, "global_step": 405912, "epoch": 2416} {"train_loss": -12.059370040893555, "global_step": 405913, "epoch": 2416} {"train_loss": -11.683952331542969, "global_step": 405914, "epoch": 2416} {"train_loss": -12.183333396911621, "global_step": 405915, "epoch": 2416} {"train_loss": -12.023859977722168, "global_step": 405916, "epoch": 2416} {"train_loss": -11.99656867980957, "global_step": 405917, "epoch": 2416} {"train_loss": -12.402115821838379, "global_step": 405918, "epoch": 2416} {"train_loss": -12.185585975646973, "global_step": 405919, "epoch": 2416} {"train_loss": -12.579195022583008, "global_step": 405920, "epoch": 2416} {"train_loss": -12.495105743408203, "global_step": 405921, "epoch": 2416} {"train_loss": -12.584596633911133, "global_step": 405922, "epoch": 2416} {"train_loss": -12.42056655883789, "global_step": 405923, "epoch": 2416} {"train_loss": -12.637754440307617, "global_step": 405924, "epoch": 2416} {"train_loss": -12.507017135620117, "global_step": 405925, "epoch": 2416} {"train_loss": -12.766656875610352, "global_step": 405926, "epoch": 2416} {"train_loss": -12.130539894104004, "global_step": 405927, "epoch": 2416} {"train_loss": -12.701214790344238, "global_step": 405928, "epoch": 2416} {"train_loss": -12.491079330444336, "global_step": 405929, "epoch": 2416} {"train_loss": -12.217742919921875, "global_step": 405930, "epoch": 2416} {"train_loss": -12.602267265319824, "global_step": 405931, "epoch": 2416} {"train_loss": -12.279083251953125, "global_step": 405932, "epoch": 2416} {"train_loss": -11.820043563842773, "global_step": 405933, "epoch": 2416} {"train_loss": -12.358311653137207, "global_step": 405934, "epoch": 2416} {"train_loss": -11.835714340209961, "global_step": 405935, "epoch": 2416} {"train_loss": -10.936334609985352, "global_step": 405936, "epoch": 2416} {"train_loss": -11.725716590881348, "global_step": 405937, "epoch": 2416} {"train_loss": -11.923564910888672, "global_step": 405938, "epoch": 2416} {"train_loss": -12.473947525024414, "global_step": 405939, "epoch": 2416} {"train_loss": -12.238571166992188, "global_step": 405940, "epoch": 2416} {"train_loss": -12.124856948852539, "global_step": 405941, "epoch": 2416} {"train_loss": -11.26693058013916, "global_step": 405942, "epoch": 2416} {"train_loss": -12.262001991271973, "global_step": 405943, "epoch": 2416} {"train_loss": -12.178470611572266, "global_step": 405944, "epoch": 2416} {"train_loss": -12.48842716217041, "global_step": 405945, "epoch": 2416} {"train_loss": -12.180932998657227, "global_step": 405946, "epoch": 2416} {"train_loss": -12.52685546875, "global_step": 405947, "epoch": 2416} {"train_loss": -11.29216194152832, "global_step": 405948, "epoch": 2416} {"train_loss": -11.63636589050293, "global_step": 405949, "epoch": 2416} {"train_loss": -12.030550003051758, "global_step": 405950, "epoch": 2416} {"train_loss": -11.313653945922852, "global_step": 405951, "epoch": 2416} {"train_loss": -11.701103210449219, "global_step": 405952, "epoch": 2416} {"train_loss": -12.578364372253418, "global_step": 405953, "epoch": 2416} {"train_loss": -12.191095352172852, "global_step": 405954, "epoch": 2416} {"train_loss": -12.19287109375, "global_step": 405955, "epoch": 2416} {"train_loss": -12.034225463867188, "global_step": 405956, "epoch": 2416} {"train_loss": -11.173126220703125, "global_step": 405957, "epoch": 2416} {"train_loss": -11.591306686401367, "global_step": 405958, "epoch": 2416} {"train_loss": -11.999663352966309, "global_step": 405959, "epoch": 2416} {"train_loss": -11.635420799255371, "global_step": 405960, "epoch": 2416} {"train_loss": -11.704507827758789, "global_step": 405961, "epoch": 2416} {"train_loss": -11.896425247192383, "global_step": 405962, "epoch": 2416} {"train_loss": -11.616767883300781, "global_step": 405963, "epoch": 2416} {"train_loss": -11.092363357543945, "global_step": 405964, "epoch": 2416} {"train_loss": -12.31848430633545, "global_step": 405965, "epoch": 2416} {"train_loss": -9.813199996948242, "global_step": 405966, "epoch": 2416} {"train_loss": -11.68935489654541, "global_step": 405967, "epoch": 2416} {"train_loss": -11.275888442993164, "global_step": 405968, "epoch": 2416} {"train_loss": -10.626672744750977, "global_step": 405969, "epoch": 2416} {"train_loss": -11.023269653320312, "global_step": 405970, "epoch": 2416} {"train_loss": -11.859991073608398, "global_step": 405971, "epoch": 2416} {"train_loss": -11.083946228027344, "global_step": 405972, "epoch": 2416} {"train_loss": -11.05899429321289, "global_step": 405973, "epoch": 2416} {"train_loss": -11.583669662475586, "global_step": 405974, "epoch": 2416} {"train_loss": -10.59453010559082, "global_step": 405975, "epoch": 2416} {"train_loss": -11.601058959960938, "global_step": 405976, "epoch": 2416} {"train_loss": -11.326416969299316, "global_step": 405977, "epoch": 2416} {"train_loss": -11.765850067138672, "global_step": 405978, "epoch": 2416} {"train_loss": -11.200056076049805, "global_step": 405979, "epoch": 2416} {"train_loss": -12.522505760192871, "global_step": 405980, "epoch": 2416} {"train_loss": -11.63388442993164, "global_step": 405981, "epoch": 2416} {"train_loss": -11.976175308227539, "global_step": 405982, "epoch": 2416} {"train_loss": -12.0604829788208, "global_step": 405983, "epoch": 2416} {"train_loss": -11.767786026000977, "global_step": 405984, "epoch": 2416} {"train_loss": -12.257604598999023, "global_step": 405985, "epoch": 2416} {"train_loss": -12.117307662963867, "global_step": 405986, "epoch": 2416} {"train_loss": -12.288195610046387, "global_step": 405987, "epoch": 2416} {"train_loss": -11.8668851852417, "global_step": 405988, "epoch": 2416} {"train_loss": -12.159348487854004, "global_step": 405989, "epoch": 2416} {"train_loss": -12.148529052734375, "global_step": 405990, "epoch": 2416} {"train_loss": -12.14682388305664, "global_step": 405991, "epoch": 2416} {"train_loss": -12.202399253845215, "global_step": 405992, "epoch": 2416} {"train_loss": -12.141436576843262, "global_step": 405993, "epoch": 2416} {"train_loss": -12.454245567321777, "global_step": 405994, "epoch": 2416} {"train_loss": -12.176337242126465, "global_step": 405995, "epoch": 2416} {"train_loss": -12.423894882202148, "global_step": 405996, "epoch": 2416} {"train_loss": -12.311083793640137, "global_step": 405997, "epoch": 2416} {"train_loss": -11.936290740966797, "global_step": 405998, "epoch": 2416} {"train_loss": -12.003437995910645, "global_step": 405999, "epoch": 2416} {"train_loss": -12.136466979980469, "global_step": 406000, "epoch": 2416} {"train_loss": -11.825170516967773, "global_step": 406001, "epoch": 2416} {"train_loss": -12.04465103149414, "global_step": 406002, "epoch": 2416} {"train_loss": -12.170112609863281, "global_step": 406003, "epoch": 2416} {"train_loss": -11.215757369995117, "global_step": 406004, "epoch": 2416} {"train_loss": -11.757625579833984, "global_step": 406005, "epoch": 2416} {"train_loss": -11.688068389892578, "global_step": 406006, "epoch": 2416} {"train_loss": -11.561148643493652, "global_step": 406007, "epoch": 2416} {"train_loss": -11.679143905639648, "global_step": 406008, "epoch": 2416} {"train_loss": -12.408485412597656, "global_step": 406009, "epoch": 2416} {"train_loss": -12.153644561767578, "global_step": 406010, "epoch": 2416} {"train_loss": -11.99051284790039, "global_step": 406011, "epoch": 2416} {"train_loss": -12.186253547668457, "global_step": 406012, "epoch": 2416} {"train_loss": -12.289519309997559, "global_step": 406013, "epoch": 2416} {"train_loss": -12.30449104309082, "global_step": 406014, "epoch": 2416} {"train_loss": -12.413410186767578, "global_step": 406015, "epoch": 2416} {"train_loss": -12.389076232910156, "global_step": 406016, "epoch": 2416} {"train_loss": -12.54592514038086, "global_step": 406017, "epoch": 2416} {"train_loss": -12.41826057434082, "global_step": 406018, "epoch": 2416} {"train_loss": -12.582353591918945, "global_step": 406019, "epoch": 2416} {"train_loss": -12.373315811157227, "global_step": 406020, "epoch": 2416} {"train_loss": -12.315363883972168, "global_step": 406021, "epoch": 2416} {"train_loss": -12.50313949584961, "global_step": 406022, "epoch": 2416} {"train_loss": -12.406742095947266, "global_step": 406023, "epoch": 2416} {"train_loss": -12.279631614685059, "global_step": 406024, "epoch": 2416} {"train_loss": -12.570558547973633, "global_step": 406025, "epoch": 2416} {"train_loss": -12.369939804077148, "global_step": 406026, "epoch": 2416} {"train_loss": -12.424248695373535, "global_step": 406027, "epoch": 2416} {"train_loss": -12.333353042602539, "global_step": 406028, "epoch": 2416} {"train_loss": -12.339790344238281, "global_step": 406029, "epoch": 2416} {"train_loss": -12.297660827636719, "global_step": 406030, "epoch": 2416} {"train_loss": -12.206125259399414, "global_step": 406031, "epoch": 2416} {"train_loss": -12.731345176696777, "global_step": 406032, "epoch": 2416} {"train_loss": -12.399521827697754, "global_step": 406033, "epoch": 2416} {"train_loss": -12.708356857299805, "global_step": 406034, "epoch": 2416} {"train_loss": -12.531207084655762, "global_step": 406035, "epoch": 2416} {"train_loss": -12.482370376586914, "global_step": 406036, "epoch": 2416} {"train_loss": -12.36354923248291, "global_step": 406037, "epoch": 2416} {"train_loss": -12.700889587402344, "global_step": 406038, "epoch": 2416} {"train_loss": -12.349079132080078, "global_step": 406039, "epoch": 2416} {"train_loss": -12.718280792236328, "global_step": 406040, "epoch": 2416} {"train_loss": -12.548617362976074, "global_step": 406041, "epoch": 2416} {"train_loss": -12.804816246032715, "global_step": 406042, "epoch": 2416} {"train_loss": -12.589405059814453, "global_step": 406043, "epoch": 2416} {"train_loss": -12.651954650878906, "global_step": 406044, "epoch": 2416} {"train_loss": -12.620002746582031, "global_step": 406045, "epoch": 2416} {"train_loss": -12.40493106842041, "global_step": 406046, "epoch": 2416} {"train_loss": -12.669790267944336, "global_step": 406047, "epoch": 2416} {"train_loss": -12.750715255737305, "global_step": 406048, "epoch": 2416} {"train_loss": -12.732505798339844, "global_step": 406049, "epoch": 2416} {"train_loss": -12.632926940917969, "global_step": 406050, "epoch": 2416} {"train_loss": -12.557013511657715, "global_step": 406051, "epoch": 2416} {"train_loss": -13.01953411102295, "global_step": 406052, "epoch": 2416} {"train_loss": -12.513418197631836, "global_step": 406053, "epoch": 2416} {"train_loss": -12.910356521606445, "global_step": 406054, "epoch": 2416} {"train_loss": -12.140740428652082, "global_step": 406055, "epoch": 2416, "val_loss": 300977.8125} {"train_loss": -12.736589431762695, "global_step": 406056, "epoch": 2417} {"train_loss": -12.714634895324707, "global_step": 406057, "epoch": 2417} {"train_loss": -12.848644256591797, "global_step": 406058, "epoch": 2417} {"train_loss": -12.656576156616211, "global_step": 406059, "epoch": 2417} {"train_loss": -12.699766159057617, "global_step": 406060, "epoch": 2417} {"train_loss": -12.566535949707031, "global_step": 406061, "epoch": 2417} {"train_loss": -12.177742004394531, "global_step": 406062, "epoch": 2417} {"train_loss": -12.642748832702637, "global_step": 406063, "epoch": 2417} {"train_loss": -12.709514617919922, "global_step": 406064, "epoch": 2417} {"train_loss": -12.168320655822754, "global_step": 406065, "epoch": 2417} {"train_loss": -12.591854095458984, "global_step": 406066, "epoch": 2417} {"train_loss": -12.708751678466797, "global_step": 406067, "epoch": 2417} {"train_loss": -12.450325012207031, "global_step": 406068, "epoch": 2417} {"train_loss": -12.491748809814453, "global_step": 406069, "epoch": 2417} {"train_loss": -12.568443298339844, "global_step": 406070, "epoch": 2417} {"train_loss": -11.975030899047852, "global_step": 406071, "epoch": 2417} {"train_loss": -12.066427230834961, "global_step": 406072, "epoch": 2417} {"train_loss": -12.869930267333984, "global_step": 406073, "epoch": 2417} {"train_loss": -12.18275260925293, "global_step": 406074, "epoch": 2417} {"train_loss": -12.202467918395996, "global_step": 406075, "epoch": 2417} {"train_loss": -11.921653747558594, "global_step": 406076, "epoch": 2417} {"train_loss": -11.848288536071777, "global_step": 406077, "epoch": 2417} {"train_loss": -12.254884719848633, "global_step": 406078, "epoch": 2417} {"train_loss": -11.196833610534668, "global_step": 406079, "epoch": 2417} {"train_loss": -11.884613990783691, "global_step": 406080, "epoch": 2417} {"train_loss": -11.189695358276367, "global_step": 406081, "epoch": 2417} {"train_loss": -11.42287826538086, "global_step": 406082, "epoch": 2417} {"train_loss": -10.460464477539062, "global_step": 406083, "epoch": 2417} {"train_loss": -11.316656112670898, "global_step": 406084, "epoch": 2417} {"train_loss": -10.706724166870117, "global_step": 406085, "epoch": 2417} {"train_loss": -9.821545600891113, "global_step": 406086, "epoch": 2417} {"train_loss": -9.721150398254395, "global_step": 406087, "epoch": 2417} {"train_loss": -9.4384765625, "global_step": 406088, "epoch": 2417} {"train_loss": -10.377490997314453, "global_step": 406089, "epoch": 2417} {"train_loss": -10.747808456420898, "global_step": 406090, "epoch": 2417} {"train_loss": -9.979156494140625, "global_step": 406091, "epoch": 2417} {"train_loss": -10.377416610717773, "global_step": 406092, "epoch": 2417} {"train_loss": -11.030035972595215, "global_step": 406093, "epoch": 2417} {"train_loss": -11.354503631591797, "global_step": 406094, "epoch": 2417} {"train_loss": -9.788671493530273, "global_step": 406095, "epoch": 2417} {"train_loss": -11.063544273376465, "global_step": 406096, "epoch": 2417} {"train_loss": -10.376258850097656, "global_step": 406097, "epoch": 2417} {"train_loss": -11.868481636047363, "global_step": 406098, "epoch": 2417} {"train_loss": -11.441261291503906, "global_step": 406099, "epoch": 2417} {"train_loss": -11.852715492248535, "global_step": 406100, "epoch": 2417} {"train_loss": -11.731866836547852, "global_step": 406101, "epoch": 2417} {"train_loss": -11.787622451782227, "global_step": 406102, "epoch": 2417} {"train_loss": -11.644338607788086, "global_step": 406103, "epoch": 2417} {"train_loss": -12.23524284362793, "global_step": 406104, "epoch": 2417} {"train_loss": -11.73915958404541, "global_step": 406105, "epoch": 2417} {"train_loss": -11.999513626098633, "global_step": 406106, "epoch": 2417} {"train_loss": -12.103582382202148, "global_step": 406107, "epoch": 2417} {"train_loss": -11.71701431274414, "global_step": 406108, "epoch": 2417} {"train_loss": -12.199511528015137, "global_step": 406109, "epoch": 2417} {"train_loss": -12.113018989562988, "global_step": 406110, "epoch": 2417} {"train_loss": -11.934776306152344, "global_step": 406111, "epoch": 2417} {"train_loss": -12.202439308166504, "global_step": 406112, "epoch": 2417} {"train_loss": -12.226059913635254, "global_step": 406113, "epoch": 2417} {"train_loss": -12.064275741577148, "global_step": 406114, "epoch": 2417} {"train_loss": -12.02243423461914, "global_step": 406115, "epoch": 2417} {"train_loss": -12.061498641967773, "global_step": 406116, "epoch": 2417} {"train_loss": -12.201576232910156, "global_step": 406117, "epoch": 2417} {"train_loss": -12.094987869262695, "global_step": 406118, "epoch": 2417} {"train_loss": -12.112117767333984, "global_step": 406119, "epoch": 2417} {"train_loss": -12.011337280273438, "global_step": 406120, "epoch": 2417} {"train_loss": -11.703019142150879, "global_step": 406121, "epoch": 2417} {"train_loss": -12.293368339538574, "global_step": 406122, "epoch": 2417} {"train_loss": -12.329957962036133, "global_step": 406123, "epoch": 2417} {"train_loss": -12.163599014282227, "global_step": 406124, "epoch": 2417} {"train_loss": -11.712931632995605, "global_step": 406125, "epoch": 2417} {"train_loss": -12.31434440612793, "global_step": 406126, "epoch": 2417} {"train_loss": -12.460959434509277, "global_step": 406127, "epoch": 2417} {"train_loss": -12.482927322387695, "global_step": 406128, "epoch": 2417} {"train_loss": -12.065841674804688, "global_step": 406129, "epoch": 2417} {"train_loss": -12.689396858215332, "global_step": 406130, "epoch": 2417} {"train_loss": -12.235416412353516, "global_step": 406131, "epoch": 2417} {"train_loss": -12.228536605834961, "global_step": 406132, "epoch": 2417} {"train_loss": -12.253373146057129, "global_step": 406133, "epoch": 2417} {"train_loss": -12.384132385253906, "global_step": 406134, "epoch": 2417} {"train_loss": -12.333099365234375, "global_step": 406135, "epoch": 2417} {"train_loss": -12.413573265075684, "global_step": 406136, "epoch": 2417} {"train_loss": -12.530263900756836, "global_step": 406137, "epoch": 2417} {"train_loss": -12.450307846069336, "global_step": 406138, "epoch": 2417} {"train_loss": -12.416620254516602, "global_step": 406139, "epoch": 2417} {"train_loss": -12.392986297607422, "global_step": 406140, "epoch": 2417} {"train_loss": -12.628607749938965, "global_step": 406141, "epoch": 2417} {"train_loss": -12.516825675964355, "global_step": 406142, "epoch": 2417} {"train_loss": -12.499797821044922, "global_step": 406143, "epoch": 2417} {"train_loss": -12.583805084228516, "global_step": 406144, "epoch": 2417} {"train_loss": -12.578824996948242, "global_step": 406145, "epoch": 2417} {"train_loss": -12.505863189697266, "global_step": 406146, "epoch": 2417} {"train_loss": -12.610822677612305, "global_step": 406147, "epoch": 2417} {"train_loss": -12.613733291625977, "global_step": 406148, "epoch": 2417} {"train_loss": -12.643041610717773, "global_step": 406149, "epoch": 2417} {"train_loss": -12.377410888671875, "global_step": 406150, "epoch": 2417} {"train_loss": -12.773213386535645, "global_step": 406151, "epoch": 2417} {"train_loss": -12.453245162963867, "global_step": 406152, "epoch": 2417} {"train_loss": -12.611780166625977, "global_step": 406153, "epoch": 2417} {"train_loss": -12.627073287963867, "global_step": 406154, "epoch": 2417} {"train_loss": -12.500720024108887, "global_step": 406155, "epoch": 2417} {"train_loss": -12.677918434143066, "global_step": 406156, "epoch": 2417} {"train_loss": -12.736605644226074, "global_step": 406157, "epoch": 2417} {"train_loss": -12.731786727905273, "global_step": 406158, "epoch": 2417} {"train_loss": -12.701257705688477, "global_step": 406159, "epoch": 2417} {"train_loss": -12.731301307678223, "global_step": 406160, "epoch": 2417} {"train_loss": -12.706863403320312, "global_step": 406161, "epoch": 2417} {"train_loss": -12.752668380737305, "global_step": 406162, "epoch": 2417} {"train_loss": -12.791099548339844, "global_step": 406163, "epoch": 2417} {"train_loss": -12.727544784545898, "global_step": 406164, "epoch": 2417} {"train_loss": -12.710464477539062, "global_step": 406165, "epoch": 2417} {"train_loss": -12.727131843566895, "global_step": 406166, "epoch": 2417} {"train_loss": -12.591474533081055, "global_step": 406167, "epoch": 2417} {"train_loss": -12.909622192382812, "global_step": 406168, "epoch": 2417} {"train_loss": -12.844892501831055, "global_step": 406169, "epoch": 2417} {"train_loss": -12.857933044433594, "global_step": 406170, "epoch": 2417} {"train_loss": -12.753294944763184, "global_step": 406171, "epoch": 2417} {"train_loss": -12.478249549865723, "global_step": 406172, "epoch": 2417} {"train_loss": -12.503637313842773, "global_step": 406173, "epoch": 2417} {"train_loss": -12.642050743103027, "global_step": 406174, "epoch": 2417} {"train_loss": -12.725506782531738, "global_step": 406175, "epoch": 2417} {"train_loss": -12.790017127990723, "global_step": 406176, "epoch": 2417} {"train_loss": -12.668038368225098, "global_step": 406177, "epoch": 2417} {"train_loss": -12.900629043579102, "global_step": 406178, "epoch": 2417} {"train_loss": -12.626256942749023, "global_step": 406179, "epoch": 2417} {"train_loss": -12.616410255432129, "global_step": 406180, "epoch": 2417} {"train_loss": -12.335010528564453, "global_step": 406181, "epoch": 2417} {"train_loss": -12.418235778808594, "global_step": 406182, "epoch": 2417} {"train_loss": -11.972234725952148, "global_step": 406183, "epoch": 2417} {"train_loss": -12.139602661132812, "global_step": 406184, "epoch": 2417} {"train_loss": -12.409194946289062, "global_step": 406185, "epoch": 2417} {"train_loss": -12.592500686645508, "global_step": 406186, "epoch": 2417} {"train_loss": -11.819833755493164, "global_step": 406187, "epoch": 2417} {"train_loss": -11.29615592956543, "global_step": 406188, "epoch": 2417} {"train_loss": -11.355106353759766, "global_step": 406189, "epoch": 2417} {"train_loss": -12.561140060424805, "global_step": 406190, "epoch": 2417} {"train_loss": -11.974615097045898, "global_step": 406191, "epoch": 2417} {"train_loss": -11.06110954284668, "global_step": 406192, "epoch": 2417} {"train_loss": -10.806894302368164, "global_step": 406193, "epoch": 2417} {"train_loss": -12.445064544677734, "global_step": 406194, "epoch": 2417} {"train_loss": -10.64824104309082, "global_step": 406195, "epoch": 2417} {"train_loss": -11.184491157531738, "global_step": 406196, "epoch": 2417} {"train_loss": -9.894433975219727, "global_step": 406197, "epoch": 2417} {"train_loss": -10.354419708251953, "global_step": 406198, "epoch": 2417} {"train_loss": -9.35301399230957, "global_step": 406199, "epoch": 2417} {"train_loss": -10.768234252929688, "global_step": 406200, "epoch": 2417} {"train_loss": -10.098487854003906, "global_step": 406201, "epoch": 2417} {"train_loss": -10.442273139953613, "global_step": 406202, "epoch": 2417} {"train_loss": -8.778661727905273, "global_step": 406203, "epoch": 2417} {"train_loss": -11.179919242858887, "global_step": 406204, "epoch": 2417} {"train_loss": -10.478706359863281, "global_step": 406205, "epoch": 2417} {"train_loss": -9.445479393005371, "global_step": 406206, "epoch": 2417} {"train_loss": -10.967792510986328, "global_step": 406207, "epoch": 2417} {"train_loss": -9.12507438659668, "global_step": 406208, "epoch": 2417} {"train_loss": -11.643465042114258, "global_step": 406209, "epoch": 2417} {"train_loss": -9.281356811523438, "global_step": 406210, "epoch": 2417} {"train_loss": -11.360118865966797, "global_step": 406211, "epoch": 2417} {"train_loss": -10.917978286743164, "global_step": 406212, "epoch": 2417} {"train_loss": -11.248741149902344, "global_step": 406213, "epoch": 2417} {"train_loss": -11.588727951049805, "global_step": 406214, "epoch": 2417} {"train_loss": -11.572211265563965, "global_step": 406215, "epoch": 2417} {"train_loss": -11.545734405517578, "global_step": 406216, "epoch": 2417} {"train_loss": -10.509078979492188, "global_step": 406217, "epoch": 2417} {"train_loss": -12.125450134277344, "global_step": 406218, "epoch": 2417} {"train_loss": -10.55085563659668, "global_step": 406219, "epoch": 2417} {"train_loss": -11.921022415161133, "global_step": 406220, "epoch": 2417} {"train_loss": -11.411867141723633, "global_step": 406221, "epoch": 2417} {"train_loss": -11.90080451965332, "global_step": 406222, "epoch": 2417} {"train_loss": -11.875447523026239, "global_step": 406223, "epoch": 2417, "val_loss": 307249.21875} {"train_loss": -12.02746295928955, "global_step": 406224, "epoch": 2418} {"train_loss": -11.78721809387207, "global_step": 406225, "epoch": 2418} {"train_loss": -11.97602367401123, "global_step": 406226, "epoch": 2418} {"train_loss": -12.00933837890625, "global_step": 406227, "epoch": 2418} {"train_loss": -12.02978515625, "global_step": 406228, "epoch": 2418} {"train_loss": -11.810237884521484, "global_step": 406229, "epoch": 2418} {"train_loss": -11.622417449951172, "global_step": 406230, "epoch": 2418} {"train_loss": -12.032949447631836, "global_step": 406231, "epoch": 2418} {"train_loss": -11.85713005065918, "global_step": 406232, "epoch": 2418} {"train_loss": -11.989675521850586, "global_step": 406233, "epoch": 2418} {"train_loss": -11.9310941696167, "global_step": 406234, "epoch": 2418} {"train_loss": -12.208284378051758, "global_step": 406235, "epoch": 2418} {"train_loss": -11.97972297668457, "global_step": 406236, "epoch": 2418} {"train_loss": -12.242615699768066, "global_step": 406237, "epoch": 2418} {"train_loss": -12.125009536743164, "global_step": 406238, "epoch": 2418} {"train_loss": -11.998212814331055, "global_step": 406239, "epoch": 2418} {"train_loss": -12.32493782043457, "global_step": 406240, "epoch": 2418} {"train_loss": -12.077436447143555, "global_step": 406241, "epoch": 2418} {"train_loss": -12.318136215209961, "global_step": 406242, "epoch": 2418} {"train_loss": -12.441816329956055, "global_step": 406243, "epoch": 2418} {"train_loss": -12.365167617797852, "global_step": 406244, "epoch": 2418} {"train_loss": -12.358492851257324, "global_step": 406245, "epoch": 2418} {"train_loss": -12.156543731689453, "global_step": 406246, "epoch": 2418} {"train_loss": -12.324707984924316, "global_step": 406247, "epoch": 2418} {"train_loss": -12.19459342956543, "global_step": 406248, "epoch": 2418} {"train_loss": -12.429990768432617, "global_step": 406249, "epoch": 2418} {"train_loss": -12.103679656982422, "global_step": 406250, "epoch": 2418} {"train_loss": -12.370203018188477, "global_step": 406251, "epoch": 2418} {"train_loss": -12.106204986572266, "global_step": 406252, "epoch": 2418} {"train_loss": -12.43470573425293, "global_step": 406253, "epoch": 2418} {"train_loss": -12.41675853729248, "global_step": 406254, "epoch": 2418} {"train_loss": -12.50737190246582, "global_step": 406255, "epoch": 2418} {"train_loss": -12.445256233215332, "global_step": 406256, "epoch": 2418} {"train_loss": -12.185159683227539, "global_step": 406257, "epoch": 2418} {"train_loss": -12.270076751708984, "global_step": 406258, "epoch": 2418} {"train_loss": -12.196491241455078, "global_step": 406259, "epoch": 2418} {"train_loss": -11.957944869995117, "global_step": 406260, "epoch": 2418} {"train_loss": -12.592401504516602, "global_step": 406261, "epoch": 2418} {"train_loss": -12.009119033813477, "global_step": 406262, "epoch": 2418} {"train_loss": -12.309843063354492, "global_step": 406263, "epoch": 2418} {"train_loss": -12.107728958129883, "global_step": 406264, "epoch": 2418} {"train_loss": -12.137908935546875, "global_step": 406265, "epoch": 2418} {"train_loss": -12.157257080078125, "global_step": 406266, "epoch": 2418} {"train_loss": -12.251378059387207, "global_step": 406267, "epoch": 2418} {"train_loss": -11.808019638061523, "global_step": 406268, "epoch": 2418} {"train_loss": -12.17586898803711, "global_step": 406269, "epoch": 2418} {"train_loss": -11.905755996704102, "global_step": 406270, "epoch": 2418} {"train_loss": -12.256123542785645, "global_step": 406271, "epoch": 2418} {"train_loss": -12.130903244018555, "global_step": 406272, "epoch": 2418} {"train_loss": -12.112985610961914, "global_step": 406273, "epoch": 2418} {"train_loss": -12.432686805725098, "global_step": 406274, "epoch": 2418} {"train_loss": -11.674639701843262, "global_step": 406275, "epoch": 2418} {"train_loss": -12.565834999084473, "global_step": 406276, "epoch": 2418} {"train_loss": -11.77139663696289, "global_step": 406277, "epoch": 2418} {"train_loss": -12.61165714263916, "global_step": 406278, "epoch": 2418} {"train_loss": -11.940269470214844, "global_step": 406279, "epoch": 2418} {"train_loss": -12.515342712402344, "global_step": 406280, "epoch": 2418} {"train_loss": -12.244207382202148, "global_step": 406281, "epoch": 2418} {"train_loss": -12.416220664978027, "global_step": 406282, "epoch": 2418} {"train_loss": -12.452110290527344, "global_step": 406283, "epoch": 2418} {"train_loss": -12.552957534790039, "global_step": 406284, "epoch": 2418} {"train_loss": -12.56144905090332, "global_step": 406285, "epoch": 2418} {"train_loss": -12.41227912902832, "global_step": 406286, "epoch": 2418} {"train_loss": -12.455568313598633, "global_step": 406287, "epoch": 2418} {"train_loss": -12.449341773986816, "global_step": 406288, "epoch": 2418} {"train_loss": -12.51507568359375, "global_step": 406289, "epoch": 2418} {"train_loss": -12.329254150390625, "global_step": 406290, "epoch": 2418} {"train_loss": -12.813338279724121, "global_step": 406291, "epoch": 2418} {"train_loss": -12.377687454223633, "global_step": 406292, "epoch": 2418} {"train_loss": -12.581981658935547, "global_step": 406293, "epoch": 2418} {"train_loss": -12.653989791870117, "global_step": 406294, "epoch": 2418} {"train_loss": -12.59144401550293, "global_step": 406295, "epoch": 2418} {"train_loss": -12.631759643554688, "global_step": 406296, "epoch": 2418} {"train_loss": -12.528536796569824, "global_step": 406297, "epoch": 2418} {"train_loss": -12.56766128540039, "global_step": 406298, "epoch": 2418} {"train_loss": -12.592215538024902, "global_step": 406299, "epoch": 2418} {"train_loss": -12.403177261352539, "global_step": 406300, "epoch": 2418} {"train_loss": -12.42766284942627, "global_step": 406301, "epoch": 2418} {"train_loss": -12.52291488647461, "global_step": 406302, "epoch": 2418} {"train_loss": -12.486291885375977, "global_step": 406303, "epoch": 2418} {"train_loss": -12.102622985839844, "global_step": 406304, "epoch": 2418} {"train_loss": -12.56895637512207, "global_step": 406305, "epoch": 2418} {"train_loss": -12.242389678955078, "global_step": 406306, "epoch": 2418} {"train_loss": -11.890022277832031, "global_step": 406307, "epoch": 2418} {"train_loss": -12.636804580688477, "global_step": 406308, "epoch": 2418} {"train_loss": -12.501184463500977, "global_step": 406309, "epoch": 2418} {"train_loss": -12.783985137939453, "global_step": 406310, "epoch": 2418} {"train_loss": -12.676498413085938, "global_step": 406311, "epoch": 2418} {"train_loss": -12.7213716506958, "global_step": 406312, "epoch": 2418} {"train_loss": -12.635965347290039, "global_step": 406313, "epoch": 2418} {"train_loss": -12.703935623168945, "global_step": 406314, "epoch": 2418} {"train_loss": -12.322209358215332, "global_step": 406315, "epoch": 2418} {"train_loss": -12.551318168640137, "global_step": 406316, "epoch": 2418} {"train_loss": -12.42599868774414, "global_step": 406317, "epoch": 2418} {"train_loss": -12.21348762512207, "global_step": 406318, "epoch": 2418} {"train_loss": -12.356019973754883, "global_step": 406319, "epoch": 2418} {"train_loss": -12.609399795532227, "global_step": 406320, "epoch": 2418} {"train_loss": -11.895791053771973, "global_step": 406321, "epoch": 2418} {"train_loss": -11.91480827331543, "global_step": 406322, "epoch": 2418} {"train_loss": -12.619707107543945, "global_step": 406323, "epoch": 2418} {"train_loss": -11.8783597946167, "global_step": 406324, "epoch": 2418} {"train_loss": -12.207113265991211, "global_step": 406325, "epoch": 2418} {"train_loss": -11.892329216003418, "global_step": 406326, "epoch": 2418} {"train_loss": -11.397409439086914, "global_step": 406327, "epoch": 2418} {"train_loss": -12.086043357849121, "global_step": 406328, "epoch": 2418} {"train_loss": -11.137632369995117, "global_step": 406329, "epoch": 2418} {"train_loss": -11.759119033813477, "global_step": 406330, "epoch": 2418} {"train_loss": -12.175956726074219, "global_step": 406331, "epoch": 2418} {"train_loss": -10.504438400268555, "global_step": 406332, "epoch": 2418} {"train_loss": -9.78596305847168, "global_step": 406333, "epoch": 2418} {"train_loss": -12.296862602233887, "global_step": 406334, "epoch": 2418} {"train_loss": -11.045674324035645, "global_step": 406335, "epoch": 2418} {"train_loss": -12.120330810546875, "global_step": 406336, "epoch": 2418} {"train_loss": -11.088293075561523, "global_step": 406337, "epoch": 2418} {"train_loss": -12.333108901977539, "global_step": 406338, "epoch": 2418} {"train_loss": -11.897453308105469, "global_step": 406339, "epoch": 2418} {"train_loss": -11.61937141418457, "global_step": 406340, "epoch": 2418} {"train_loss": -11.751489639282227, "global_step": 406341, "epoch": 2418} {"train_loss": -10.108991622924805, "global_step": 406342, "epoch": 2418} {"train_loss": -12.29345417022705, "global_step": 406343, "epoch": 2418} {"train_loss": -10.865094184875488, "global_step": 406344, "epoch": 2418} {"train_loss": -11.682405471801758, "global_step": 406345, "epoch": 2418} {"train_loss": -12.078641891479492, "global_step": 406346, "epoch": 2418} {"train_loss": -10.885099411010742, "global_step": 406347, "epoch": 2418} {"train_loss": -12.246879577636719, "global_step": 406348, "epoch": 2418} {"train_loss": -11.301703453063965, "global_step": 406349, "epoch": 2418} {"train_loss": -12.039562225341797, "global_step": 406350, "epoch": 2418} {"train_loss": -11.769214630126953, "global_step": 406351, "epoch": 2418} {"train_loss": -11.73679256439209, "global_step": 406352, "epoch": 2418} {"train_loss": -11.999122619628906, "global_step": 406353, "epoch": 2418} {"train_loss": -11.541168212890625, "global_step": 406354, "epoch": 2418} {"train_loss": -11.787724494934082, "global_step": 406355, "epoch": 2418} {"train_loss": -11.221341133117676, "global_step": 406356, "epoch": 2418} {"train_loss": -11.903846740722656, "global_step": 406357, "epoch": 2418} {"train_loss": -11.780771255493164, "global_step": 406358, "epoch": 2418} {"train_loss": -12.119122505187988, "global_step": 406359, "epoch": 2418} {"train_loss": -11.868324279785156, "global_step": 406360, "epoch": 2418} {"train_loss": -12.040802001953125, "global_step": 406361, "epoch": 2418} {"train_loss": -11.870992660522461, "global_step": 406362, "epoch": 2418} {"train_loss": -12.072318077087402, "global_step": 406363, "epoch": 2418} {"train_loss": -12.242182731628418, "global_step": 406364, "epoch": 2418} {"train_loss": -11.971319198608398, "global_step": 406365, "epoch": 2418} {"train_loss": -12.262758255004883, "global_step": 406366, "epoch": 2418} {"train_loss": -12.275941848754883, "global_step": 406367, "epoch": 2418} {"train_loss": -11.956905364990234, "global_step": 406368, "epoch": 2418} {"train_loss": -12.119071960449219, "global_step": 406369, "epoch": 2418} {"train_loss": -11.758750915527344, "global_step": 406370, "epoch": 2418} {"train_loss": -12.515230178833008, "global_step": 406371, "epoch": 2418} {"train_loss": -11.90250301361084, "global_step": 406372, "epoch": 2418} {"train_loss": -12.479204177856445, "global_step": 406373, "epoch": 2418} {"train_loss": -11.844037055969238, "global_step": 406374, "epoch": 2418} {"train_loss": -12.134395599365234, "global_step": 406375, "epoch": 2418} {"train_loss": -11.92013931274414, "global_step": 406376, "epoch": 2418} {"train_loss": -11.679691314697266, "global_step": 406377, "epoch": 2418} {"train_loss": -12.432231903076172, "global_step": 406378, "epoch": 2418} {"train_loss": -12.127584457397461, "global_step": 406379, "epoch": 2418} {"train_loss": -11.435040473937988, "global_step": 406380, "epoch": 2418} {"train_loss": -12.297760963439941, "global_step": 406381, "epoch": 2418} {"train_loss": -11.667266845703125, "global_step": 406382, "epoch": 2418} {"train_loss": -12.027060508728027, "global_step": 406383, "epoch": 2418} {"train_loss": -12.008892059326172, "global_step": 406384, "epoch": 2418} {"train_loss": -11.296611785888672, "global_step": 406385, "epoch": 2418} {"train_loss": -12.118049621582031, "global_step": 406386, "epoch": 2418} {"train_loss": -11.992626190185547, "global_step": 406387, "epoch": 2418} {"train_loss": -12.582487106323242, "global_step": 406388, "epoch": 2418} {"train_loss": -12.204549789428711, "global_step": 406389, "epoch": 2418} {"train_loss": -12.41997241973877, "global_step": 406390, "epoch": 2418} {"train_loss": -12.100866260982695, "global_step": 406391, "epoch": 2418, "val_loss": 305409.84375} {"train_loss": -12.133943557739258, "global_step": 406392, "epoch": 2419} {"train_loss": -12.632231712341309, "global_step": 406393, "epoch": 2419} {"train_loss": -11.931710243225098, "global_step": 406394, "epoch": 2419} {"train_loss": -12.315262794494629, "global_step": 406395, "epoch": 2419} {"train_loss": -12.472240447998047, "global_step": 406396, "epoch": 2419} {"train_loss": -12.571268081665039, "global_step": 406397, "epoch": 2419} {"train_loss": -12.381118774414062, "global_step": 406398, "epoch": 2419} {"train_loss": -12.549488067626953, "global_step": 406399, "epoch": 2419} {"train_loss": -12.452449798583984, "global_step": 406400, "epoch": 2419} {"train_loss": -12.76718521118164, "global_step": 406401, "epoch": 2419} {"train_loss": -12.131325721740723, "global_step": 406402, "epoch": 2419} {"train_loss": -11.883983612060547, "global_step": 406403, "epoch": 2419} {"train_loss": -12.62971305847168, "global_step": 406404, "epoch": 2419} {"train_loss": -11.56618881225586, "global_step": 406405, "epoch": 2419} {"train_loss": -12.551735877990723, "global_step": 406406, "epoch": 2419} {"train_loss": -11.794687271118164, "global_step": 406407, "epoch": 2419} {"train_loss": -12.13508415222168, "global_step": 406408, "epoch": 2419} {"train_loss": -12.567678451538086, "global_step": 406409, "epoch": 2419} {"train_loss": -12.462255477905273, "global_step": 406410, "epoch": 2419} {"train_loss": -12.601886749267578, "global_step": 406411, "epoch": 2419} {"train_loss": -12.570818901062012, "global_step": 406412, "epoch": 2419} {"train_loss": -12.659112930297852, "global_step": 406413, "epoch": 2419} {"train_loss": -12.469854354858398, "global_step": 406414, "epoch": 2419} {"train_loss": -12.516997337341309, "global_step": 406415, "epoch": 2419} {"train_loss": -12.617494583129883, "global_step": 406416, "epoch": 2419} {"train_loss": -12.522473335266113, "global_step": 406417, "epoch": 2419} {"train_loss": -12.647136688232422, "global_step": 406418, "epoch": 2419} {"train_loss": -12.448149681091309, "global_step": 406419, "epoch": 2419} {"train_loss": -12.60787582397461, "global_step": 406420, "epoch": 2419} {"train_loss": -12.637142181396484, "global_step": 406421, "epoch": 2419} {"train_loss": -12.548881530761719, "global_step": 406422, "epoch": 2419} {"train_loss": -12.765811920166016, "global_step": 406423, "epoch": 2419} {"train_loss": -12.662220001220703, "global_step": 406424, "epoch": 2419} {"train_loss": -12.47087287902832, "global_step": 406425, "epoch": 2419} {"train_loss": -12.717742919921875, "global_step": 406426, "epoch": 2419} {"train_loss": -12.54146957397461, "global_step": 406427, "epoch": 2419} {"train_loss": -12.767724990844727, "global_step": 406428, "epoch": 2419} {"train_loss": -12.682367324829102, "global_step": 406429, "epoch": 2419} {"train_loss": -12.067022323608398, "global_step": 406430, "epoch": 2419} {"train_loss": -12.739360809326172, "global_step": 406431, "epoch": 2419} {"train_loss": -12.570895195007324, "global_step": 406432, "epoch": 2419} {"train_loss": -12.31436538696289, "global_step": 406433, "epoch": 2419} {"train_loss": -12.733787536621094, "global_step": 406434, "epoch": 2419} {"train_loss": -12.557615280151367, "global_step": 406435, "epoch": 2419} {"train_loss": -12.380306243896484, "global_step": 406436, "epoch": 2419} {"train_loss": -12.64004898071289, "global_step": 406437, "epoch": 2419} {"train_loss": -12.520051956176758, "global_step": 406438, "epoch": 2419} {"train_loss": -12.262807846069336, "global_step": 406439, "epoch": 2419} {"train_loss": -12.476141929626465, "global_step": 406440, "epoch": 2419} {"train_loss": -12.682519912719727, "global_step": 406441, "epoch": 2419} {"train_loss": -12.351481437683105, "global_step": 406442, "epoch": 2419} {"train_loss": -12.683683395385742, "global_step": 406443, "epoch": 2419} {"train_loss": -12.618309020996094, "global_step": 406444, "epoch": 2419} {"train_loss": -12.131935119628906, "global_step": 406445, "epoch": 2419} {"train_loss": -12.728586196899414, "global_step": 406446, "epoch": 2419} {"train_loss": -11.422616958618164, "global_step": 406447, "epoch": 2419} {"train_loss": -11.922676086425781, "global_step": 406448, "epoch": 2419} {"train_loss": -12.389601707458496, "global_step": 406449, "epoch": 2419} {"train_loss": -11.91663932800293, "global_step": 406450, "epoch": 2419} {"train_loss": -11.767510414123535, "global_step": 406451, "epoch": 2419} {"train_loss": -12.402502059936523, "global_step": 406452, "epoch": 2419} {"train_loss": -12.102547645568848, "global_step": 406453, "epoch": 2419} {"train_loss": -12.628036499023438, "global_step": 406454, "epoch": 2419} {"train_loss": -12.16879653930664, "global_step": 406455, "epoch": 2419} {"train_loss": -12.202315330505371, "global_step": 406456, "epoch": 2419} {"train_loss": -12.185441970825195, "global_step": 406457, "epoch": 2419} {"train_loss": -12.394341468811035, "global_step": 406458, "epoch": 2419} {"train_loss": -12.415377616882324, "global_step": 406459, "epoch": 2419} {"train_loss": -12.224915504455566, "global_step": 406460, "epoch": 2419} {"train_loss": -12.853212356567383, "global_step": 406461, "epoch": 2419} {"train_loss": -12.32756233215332, "global_step": 406462, "epoch": 2419} {"train_loss": -12.700216293334961, "global_step": 406463, "epoch": 2419} {"train_loss": -12.209551811218262, "global_step": 406464, "epoch": 2419} {"train_loss": -12.572671890258789, "global_step": 406465, "epoch": 2419} {"train_loss": -11.164979934692383, "global_step": 406466, "epoch": 2419} {"train_loss": -11.390254974365234, "global_step": 406467, "epoch": 2419} {"train_loss": -10.766538619995117, "global_step": 406468, "epoch": 2419} {"train_loss": -12.207738876342773, "global_step": 406469, "epoch": 2419} {"train_loss": -10.597299575805664, "global_step": 406470, "epoch": 2419} {"train_loss": -12.160310745239258, "global_step": 406471, "epoch": 2419} {"train_loss": -11.124529838562012, "global_step": 406472, "epoch": 2419} {"train_loss": -11.422661781311035, "global_step": 406473, "epoch": 2419} {"train_loss": -11.299266815185547, "global_step": 406474, "epoch": 2419} {"train_loss": -8.668785095214844, "global_step": 406475, "epoch": 2419} {"train_loss": -11.428633689880371, "global_step": 406476, "epoch": 2419} {"train_loss": -10.508295059204102, "global_step": 406477, "epoch": 2419} {"train_loss": -11.57082462310791, "global_step": 406478, "epoch": 2419} {"train_loss": -10.215605735778809, "global_step": 406479, "epoch": 2419} {"train_loss": -10.430776596069336, "global_step": 406480, "epoch": 2419} {"train_loss": -11.325225830078125, "global_step": 406481, "epoch": 2419} {"train_loss": -9.875972747802734, "global_step": 406482, "epoch": 2419} {"train_loss": -10.667779922485352, "global_step": 406483, "epoch": 2419} {"train_loss": -9.437603950500488, "global_step": 406484, "epoch": 2419} {"train_loss": -10.362850189208984, "global_step": 406485, "epoch": 2419} {"train_loss": -9.707271575927734, "global_step": 406486, "epoch": 2419} {"train_loss": -10.280566215515137, "global_step": 406487, "epoch": 2419} {"train_loss": -10.493570327758789, "global_step": 406488, "epoch": 2419} {"train_loss": -10.368213653564453, "global_step": 406489, "epoch": 2419} {"train_loss": -10.390256881713867, "global_step": 406490, "epoch": 2419} {"train_loss": -10.885892868041992, "global_step": 406491, "epoch": 2419} {"train_loss": -11.056177139282227, "global_step": 406492, "epoch": 2419} {"train_loss": -11.193920135498047, "global_step": 406493, "epoch": 2419} {"train_loss": -10.989280700683594, "global_step": 406494, "epoch": 2419} {"train_loss": -11.31592082977295, "global_step": 406495, "epoch": 2419} {"train_loss": -11.690900802612305, "global_step": 406496, "epoch": 2419} {"train_loss": -11.169756889343262, "global_step": 406497, "epoch": 2419} {"train_loss": -11.308448791503906, "global_step": 406498, "epoch": 2419} {"train_loss": -11.543478012084961, "global_step": 406499, "epoch": 2419} {"train_loss": -11.966424942016602, "global_step": 406500, "epoch": 2419} {"train_loss": -11.850180625915527, "global_step": 406501, "epoch": 2419} {"train_loss": -11.628416061401367, "global_step": 406502, "epoch": 2419} {"train_loss": -12.02110481262207, "global_step": 406503, "epoch": 2419} {"train_loss": -11.799287796020508, "global_step": 406504, "epoch": 2419} {"train_loss": -12.218353271484375, "global_step": 406505, "epoch": 2419} {"train_loss": -11.895852088928223, "global_step": 406506, "epoch": 2419} {"train_loss": -12.208978652954102, "global_step": 406507, "epoch": 2419} {"train_loss": -11.966809272766113, "global_step": 406508, "epoch": 2419} {"train_loss": -12.178204536437988, "global_step": 406509, "epoch": 2419} {"train_loss": -12.05278205871582, "global_step": 406510, "epoch": 2419} {"train_loss": -12.171977996826172, "global_step": 406511, "epoch": 2419} {"train_loss": -12.052225112915039, "global_step": 406512, "epoch": 2419} {"train_loss": -12.113160133361816, "global_step": 406513, "epoch": 2419} {"train_loss": -12.324592590332031, "global_step": 406514, "epoch": 2419} {"train_loss": -12.022998809814453, "global_step": 406515, "epoch": 2419} {"train_loss": -12.111392974853516, "global_step": 406516, "epoch": 2419} {"train_loss": -12.168176651000977, "global_step": 406517, "epoch": 2419} {"train_loss": -11.894805908203125, "global_step": 406518, "epoch": 2419} {"train_loss": -12.474064826965332, "global_step": 406519, "epoch": 2419} {"train_loss": -12.069509506225586, "global_step": 406520, "epoch": 2419} {"train_loss": -12.470001220703125, "global_step": 406521, "epoch": 2419} {"train_loss": -12.36854362487793, "global_step": 406522, "epoch": 2419} {"train_loss": -12.247268676757812, "global_step": 406523, "epoch": 2419} {"train_loss": -12.586089134216309, "global_step": 406524, "epoch": 2419} {"train_loss": -12.386133193969727, "global_step": 406525, "epoch": 2419} {"train_loss": -12.495536804199219, "global_step": 406526, "epoch": 2419} {"train_loss": -12.35348129272461, "global_step": 406527, "epoch": 2419} {"train_loss": -12.289371490478516, "global_step": 406528, "epoch": 2419} {"train_loss": -12.388336181640625, "global_step": 406529, "epoch": 2419} {"train_loss": -12.397643089294434, "global_step": 406530, "epoch": 2419} {"train_loss": -12.239961624145508, "global_step": 406531, "epoch": 2419} {"train_loss": -12.325311660766602, "global_step": 406532, "epoch": 2419} {"train_loss": -12.325451850891113, "global_step": 406533, "epoch": 2419} {"train_loss": -12.626962661743164, "global_step": 406534, "epoch": 2419} {"train_loss": -12.317178726196289, "global_step": 406535, "epoch": 2419} {"train_loss": -12.533881187438965, "global_step": 406536, "epoch": 2419} {"train_loss": -12.308683395385742, "global_step": 406537, "epoch": 2419} {"train_loss": -12.589818954467773, "global_step": 406538, "epoch": 2419} {"train_loss": -12.378128051757812, "global_step": 406539, "epoch": 2419} {"train_loss": -12.582352638244629, "global_step": 406540, "epoch": 2419} {"train_loss": -12.24233627319336, "global_step": 406541, "epoch": 2419} {"train_loss": -12.590314865112305, "global_step": 406542, "epoch": 2419} {"train_loss": -12.390170097351074, "global_step": 406543, "epoch": 2419} {"train_loss": -12.532602310180664, "global_step": 406544, "epoch": 2419} {"train_loss": -12.385994911193848, "global_step": 406545, "epoch": 2419} {"train_loss": -12.564339637756348, "global_step": 406546, "epoch": 2419} {"train_loss": -12.541484832763672, "global_step": 406547, "epoch": 2419} {"train_loss": -12.603442192077637, "global_step": 406548, "epoch": 2419} {"train_loss": -12.500814437866211, "global_step": 406549, "epoch": 2419} {"train_loss": -12.374635696411133, "global_step": 406550, "epoch": 2419} {"train_loss": -12.557304382324219, "global_step": 406551, "epoch": 2419} {"train_loss": -12.284618377685547, "global_step": 406552, "epoch": 2419} {"train_loss": -12.411214828491211, "global_step": 406553, "epoch": 2419} {"train_loss": -12.4845609664917, "global_step": 406554, "epoch": 2419} {"train_loss": -12.398468017578125, "global_step": 406555, "epoch": 2419} {"train_loss": -12.432905197143555, "global_step": 406556, "epoch": 2419} {"train_loss": -12.423420906066895, "global_step": 406557, "epoch": 2419} {"train_loss": -12.61288833618164, "global_step": 406558, "epoch": 2419} {"train_loss": -12.059203766641163, "global_step": 406559, "epoch": 2419, "val_loss": 305403.5} {"train_loss": -12.662081718444824, "global_step": 406560, "epoch": 2420} {"train_loss": -12.467704772949219, "global_step": 406561, "epoch": 2420} {"train_loss": -12.60150146484375, "global_step": 406562, "epoch": 2420} {"train_loss": -12.449291229248047, "global_step": 406563, "epoch": 2420} {"train_loss": -12.933794021606445, "global_step": 406564, "epoch": 2420} {"train_loss": -12.846525192260742, "global_step": 406565, "epoch": 2420} {"train_loss": -12.880316734313965, "global_step": 406566, "epoch": 2420} {"train_loss": -12.735179901123047, "global_step": 406567, "epoch": 2420} {"train_loss": -12.74918270111084, "global_step": 406568, "epoch": 2420} {"train_loss": -12.932140350341797, "global_step": 406569, "epoch": 2420} {"train_loss": -12.795190811157227, "global_step": 406570, "epoch": 2420} {"train_loss": -12.703751564025879, "global_step": 406571, "epoch": 2420} {"train_loss": -12.69144058227539, "global_step": 406572, "epoch": 2420} {"train_loss": -12.70933723449707, "global_step": 406573, "epoch": 2420} {"train_loss": -12.65424919128418, "global_step": 406574, "epoch": 2420} {"train_loss": -12.690319061279297, "global_step": 406575, "epoch": 2420} {"train_loss": -12.911945343017578, "global_step": 406576, "epoch": 2420} {"train_loss": -12.640382766723633, "global_step": 406577, "epoch": 2420} {"train_loss": -12.858270645141602, "global_step": 406578, "epoch": 2420} {"train_loss": -12.63894271850586, "global_step": 406579, "epoch": 2420} {"train_loss": -12.38869857788086, "global_step": 406580, "epoch": 2420} {"train_loss": -12.716363906860352, "global_step": 406581, "epoch": 2420} {"train_loss": -12.508468627929688, "global_step": 406582, "epoch": 2420} {"train_loss": -12.625880241394043, "global_step": 406583, "epoch": 2420} {"train_loss": -12.613153457641602, "global_step": 406584, "epoch": 2420} {"train_loss": -12.425971984863281, "global_step": 406585, "epoch": 2420} {"train_loss": -12.688661575317383, "global_step": 406586, "epoch": 2420} {"train_loss": -12.772597312927246, "global_step": 406587, "epoch": 2420} {"train_loss": -12.220718383789062, "global_step": 406588, "epoch": 2420} {"train_loss": -12.481657028198242, "global_step": 406589, "epoch": 2420} {"train_loss": -12.721556663513184, "global_step": 406590, "epoch": 2420} {"train_loss": -12.295463562011719, "global_step": 406591, "epoch": 2420} {"train_loss": -12.42413330078125, "global_step": 406592, "epoch": 2420} {"train_loss": -12.545894622802734, "global_step": 406593, "epoch": 2420} {"train_loss": -12.218506813049316, "global_step": 406594, "epoch": 2420} {"train_loss": -12.315810203552246, "global_step": 406595, "epoch": 2420} {"train_loss": -12.587448120117188, "global_step": 406596, "epoch": 2420} {"train_loss": -12.196578025817871, "global_step": 406597, "epoch": 2420} {"train_loss": -12.01457405090332, "global_step": 406598, "epoch": 2420} {"train_loss": -12.303763389587402, "global_step": 406599, "epoch": 2420} {"train_loss": -12.70820426940918, "global_step": 406600, "epoch": 2420} {"train_loss": -12.355999946594238, "global_step": 406601, "epoch": 2420} {"train_loss": -12.70693588256836, "global_step": 406602, "epoch": 2420} {"train_loss": -12.266487121582031, "global_step": 406603, "epoch": 2420} {"train_loss": -12.547187805175781, "global_step": 406604, "epoch": 2420} {"train_loss": -12.207296371459961, "global_step": 406605, "epoch": 2420} {"train_loss": -12.68591594696045, "global_step": 406606, "epoch": 2420} {"train_loss": -11.76008415222168, "global_step": 406607, "epoch": 2420} {"train_loss": -9.597371101379395, "global_step": 406608, "epoch": 2420} {"train_loss": -10.693693161010742, "global_step": 406609, "epoch": 2420} {"train_loss": -12.35726261138916, "global_step": 406610, "epoch": 2420} {"train_loss": -11.868978500366211, "global_step": 406611, "epoch": 2420} {"train_loss": -12.062298774719238, "global_step": 406612, "epoch": 2420} {"train_loss": -10.811715126037598, "global_step": 406613, "epoch": 2420} {"train_loss": -12.262463569641113, "global_step": 406614, "epoch": 2420} {"train_loss": -10.794120788574219, "global_step": 406615, "epoch": 2420} {"train_loss": -12.077495574951172, "global_step": 406616, "epoch": 2420} {"train_loss": -10.648331642150879, "global_step": 406617, "epoch": 2420} {"train_loss": -12.565299987792969, "global_step": 406618, "epoch": 2420} {"train_loss": -10.791259765625, "global_step": 406619, "epoch": 2420} {"train_loss": -12.196102142333984, "global_step": 406620, "epoch": 2420} {"train_loss": -12.1664400100708, "global_step": 406621, "epoch": 2420} {"train_loss": -11.582858085632324, "global_step": 406622, "epoch": 2420} {"train_loss": -12.113970756530762, "global_step": 406623, "epoch": 2420} {"train_loss": -11.516714096069336, "global_step": 406624, "epoch": 2420} {"train_loss": -12.649288177490234, "global_step": 406625, "epoch": 2420} {"train_loss": -11.979870796203613, "global_step": 406626, "epoch": 2420} {"train_loss": -12.480413436889648, "global_step": 406627, "epoch": 2420} {"train_loss": -12.051685333251953, "global_step": 406628, "epoch": 2420} {"train_loss": -12.299518585205078, "global_step": 406629, "epoch": 2420} {"train_loss": -12.33541202545166, "global_step": 406630, "epoch": 2420} {"train_loss": -11.90646743774414, "global_step": 406631, "epoch": 2420} {"train_loss": -11.93515396118164, "global_step": 406632, "epoch": 2420} {"train_loss": -12.62324333190918, "global_step": 406633, "epoch": 2420} {"train_loss": -12.087712287902832, "global_step": 406634, "epoch": 2420} {"train_loss": -11.994123458862305, "global_step": 406635, "epoch": 2420} {"train_loss": -12.132526397705078, "global_step": 406636, "epoch": 2420} {"train_loss": -11.981992721557617, "global_step": 406637, "epoch": 2420} {"train_loss": -11.982694625854492, "global_step": 406638, "epoch": 2420} {"train_loss": -12.077385902404785, "global_step": 406639, "epoch": 2420} {"train_loss": -11.545845031738281, "global_step": 406640, "epoch": 2420} {"train_loss": -12.593141555786133, "global_step": 406641, "epoch": 2420} {"train_loss": -12.00484848022461, "global_step": 406642, "epoch": 2420} {"train_loss": -12.421640396118164, "global_step": 406643, "epoch": 2420} {"train_loss": -12.277881622314453, "global_step": 406644, "epoch": 2420} {"train_loss": -12.048802375793457, "global_step": 406645, "epoch": 2420} {"train_loss": -11.342000007629395, "global_step": 406646, "epoch": 2420} {"train_loss": -12.23597240447998, "global_step": 406647, "epoch": 2420} {"train_loss": -11.97970962524414, "global_step": 406648, "epoch": 2420} {"train_loss": -11.419177055358887, "global_step": 406649, "epoch": 2420} {"train_loss": -12.10264778137207, "global_step": 406650, "epoch": 2420} {"train_loss": -11.860573768615723, "global_step": 406651, "epoch": 2420} {"train_loss": -11.910202026367188, "global_step": 406652, "epoch": 2420} {"train_loss": -12.206890106201172, "global_step": 406653, "epoch": 2420} {"train_loss": -11.343579292297363, "global_step": 406654, "epoch": 2420} {"train_loss": -12.087518692016602, "global_step": 406655, "epoch": 2420} {"train_loss": -11.98992919921875, "global_step": 406656, "epoch": 2420} {"train_loss": -10.834394454956055, "global_step": 406657, "epoch": 2420} {"train_loss": -11.679000854492188, "global_step": 406658, "epoch": 2420} {"train_loss": -10.492715835571289, "global_step": 406659, "epoch": 2420} {"train_loss": -12.15510082244873, "global_step": 406660, "epoch": 2420} {"train_loss": -10.684049606323242, "global_step": 406661, "epoch": 2420} {"train_loss": -11.084753036499023, "global_step": 406662, "epoch": 2420} {"train_loss": -10.800884246826172, "global_step": 406663, "epoch": 2420} {"train_loss": -11.599443435668945, "global_step": 406664, "epoch": 2420} {"train_loss": -10.937837600708008, "global_step": 406665, "epoch": 2420} {"train_loss": -12.102827072143555, "global_step": 406666, "epoch": 2420} {"train_loss": -11.845664978027344, "global_step": 406667, "epoch": 2420} {"train_loss": -11.451881408691406, "global_step": 406668, "epoch": 2420} {"train_loss": -12.116205215454102, "global_step": 406669, "epoch": 2420} {"train_loss": -11.454015731811523, "global_step": 406670, "epoch": 2420} {"train_loss": -12.053184509277344, "global_step": 406671, "epoch": 2420} {"train_loss": -11.930696487426758, "global_step": 406672, "epoch": 2420} {"train_loss": -12.191697120666504, "global_step": 406673, "epoch": 2420} {"train_loss": -11.956415176391602, "global_step": 406674, "epoch": 2420} {"train_loss": -12.243035316467285, "global_step": 406675, "epoch": 2420} {"train_loss": -12.3897123336792, "global_step": 406676, "epoch": 2420} {"train_loss": -12.25822925567627, "global_step": 406677, "epoch": 2420} {"train_loss": -12.455188751220703, "global_step": 406678, "epoch": 2420} {"train_loss": -12.309259414672852, "global_step": 406679, "epoch": 2420} {"train_loss": -12.093719482421875, "global_step": 406680, "epoch": 2420} {"train_loss": -11.964292526245117, "global_step": 406681, "epoch": 2420} {"train_loss": -12.470318794250488, "global_step": 406682, "epoch": 2420} {"train_loss": -11.929496765136719, "global_step": 406683, "epoch": 2420} {"train_loss": -11.793237686157227, "global_step": 406684, "epoch": 2420} {"train_loss": -12.237754821777344, "global_step": 406685, "epoch": 2420} {"train_loss": -12.164558410644531, "global_step": 406686, "epoch": 2420} {"train_loss": -12.197553634643555, "global_step": 406687, "epoch": 2420} {"train_loss": -12.22334098815918, "global_step": 406688, "epoch": 2420} {"train_loss": -12.224634170532227, "global_step": 406689, "epoch": 2420} {"train_loss": -12.027681350708008, "global_step": 406690, "epoch": 2420} {"train_loss": -11.862737655639648, "global_step": 406691, "epoch": 2420} {"train_loss": -11.508447647094727, "global_step": 406692, "epoch": 2420} {"train_loss": -12.406940460205078, "global_step": 406693, "epoch": 2420} {"train_loss": -11.8203125, "global_step": 406694, "epoch": 2420} {"train_loss": -12.007221221923828, "global_step": 406695, "epoch": 2420} {"train_loss": -11.939844131469727, "global_step": 406696, "epoch": 2420} {"train_loss": -11.891204833984375, "global_step": 406697, "epoch": 2420} {"train_loss": -12.188699722290039, "global_step": 406698, "epoch": 2420} {"train_loss": -12.183006286621094, "global_step": 406699, "epoch": 2420} {"train_loss": -11.631425857543945, "global_step": 406700, "epoch": 2420} {"train_loss": -11.773072242736816, "global_step": 406701, "epoch": 2420} {"train_loss": -11.573643684387207, "global_step": 406702, "epoch": 2420} {"train_loss": -11.23546028137207, "global_step": 406703, "epoch": 2420} {"train_loss": -10.820168495178223, "global_step": 406704, "epoch": 2420} {"train_loss": -11.51382827758789, "global_step": 406705, "epoch": 2420} {"train_loss": -9.896336555480957, "global_step": 406706, "epoch": 2420} {"train_loss": -8.553661346435547, "global_step": 406707, "epoch": 2420} {"train_loss": -8.53597354888916, "global_step": 406708, "epoch": 2420} {"train_loss": -9.000846862792969, "global_step": 406709, "epoch": 2420} {"train_loss": -9.343104362487793, "global_step": 406710, "epoch": 2420} {"train_loss": -8.860786437988281, "global_step": 406711, "epoch": 2420} {"train_loss": -9.256942749023438, "global_step": 406712, "epoch": 2420} {"train_loss": -9.032859802246094, "global_step": 406713, "epoch": 2420} {"train_loss": -9.046194076538086, "global_step": 406714, "epoch": 2420} {"train_loss": -9.359048843383789, "global_step": 406715, "epoch": 2420} {"train_loss": -9.872878074645996, "global_step": 406716, "epoch": 2420} {"train_loss": -10.166963577270508, "global_step": 406717, "epoch": 2420} {"train_loss": -10.288220405578613, "global_step": 406718, "epoch": 2420} {"train_loss": -10.062162399291992, "global_step": 406719, "epoch": 2420} {"train_loss": -10.415338516235352, "global_step": 406720, "epoch": 2420} {"train_loss": -10.931282997131348, "global_step": 406721, "epoch": 2420} {"train_loss": -11.067184448242188, "global_step": 406722, "epoch": 2420} {"train_loss": -9.829536437988281, "global_step": 406723, "epoch": 2420} {"train_loss": -10.123246192932129, "global_step": 406724, "epoch": 2420} {"train_loss": -9.890704154968262, "global_step": 406725, "epoch": 2420} {"train_loss": -9.62242317199707, "global_step": 406726, "epoch": 2420} {"train_loss": -11.764215804281688, "global_step": 406727, "epoch": 2420, "val_loss": 298599.46875, "train_action_mse_error": 1.1209540367126465} {"train_loss": -10.28524398803711, "global_step": 406728, "epoch": 2421} {"train_loss": -11.460647583007812, "global_step": 406729, "epoch": 2421} {"train_loss": -10.320429801940918, "global_step": 406730, "epoch": 2421} {"train_loss": -10.947466850280762, "global_step": 406731, "epoch": 2421} {"train_loss": -11.19064712524414, "global_step": 406732, "epoch": 2421} {"train_loss": -10.41897201538086, "global_step": 406733, "epoch": 2421} {"train_loss": -11.445591926574707, "global_step": 406734, "epoch": 2421} {"train_loss": -11.32498836517334, "global_step": 406735, "epoch": 2421} {"train_loss": -10.716007232666016, "global_step": 406736, "epoch": 2421} {"train_loss": -11.465874671936035, "global_step": 406737, "epoch": 2421} {"train_loss": -11.23998737335205, "global_step": 406738, "epoch": 2421} {"train_loss": -10.971353530883789, "global_step": 406739, "epoch": 2421} {"train_loss": -12.053703308105469, "global_step": 406740, "epoch": 2421} {"train_loss": -11.31479263305664, "global_step": 406741, "epoch": 2421} {"train_loss": -11.466336250305176, "global_step": 406742, "epoch": 2421} {"train_loss": -11.803625106811523, "global_step": 406743, "epoch": 2421} {"train_loss": -11.23300838470459, "global_step": 406744, "epoch": 2421} {"train_loss": -12.019457817077637, "global_step": 406745, "epoch": 2421} {"train_loss": -11.947134017944336, "global_step": 406746, "epoch": 2421} {"train_loss": -11.802966117858887, "global_step": 406747, "epoch": 2421} {"train_loss": -11.64742660522461, "global_step": 406748, "epoch": 2421} {"train_loss": -11.755629539489746, "global_step": 406749, "epoch": 2421} {"train_loss": -12.160703659057617, "global_step": 406750, "epoch": 2421} {"train_loss": -12.224649429321289, "global_step": 406751, "epoch": 2421} {"train_loss": -11.922538757324219, "global_step": 406752, "epoch": 2421} {"train_loss": -12.110820770263672, "global_step": 406753, "epoch": 2421} {"train_loss": -12.226672172546387, "global_step": 406754, "epoch": 2421} {"train_loss": -12.195646286010742, "global_step": 406755, "epoch": 2421} {"train_loss": -12.023953437805176, "global_step": 406756, "epoch": 2421} {"train_loss": -12.530471801757812, "global_step": 406757, "epoch": 2421} {"train_loss": -12.133630752563477, "global_step": 406758, "epoch": 2421} {"train_loss": -12.157408714294434, "global_step": 406759, "epoch": 2421} {"train_loss": -11.913881301879883, "global_step": 406760, "epoch": 2421} {"train_loss": -12.079887390136719, "global_step": 406761, "epoch": 2421} {"train_loss": -11.784597396850586, "global_step": 406762, "epoch": 2421} {"train_loss": -12.375133514404297, "global_step": 406763, "epoch": 2421} {"train_loss": -11.865877151489258, "global_step": 406764, "epoch": 2421} {"train_loss": -12.39648151397705, "global_step": 406765, "epoch": 2421} {"train_loss": -11.89566421508789, "global_step": 406766, "epoch": 2421} {"train_loss": -12.118572235107422, "global_step": 406767, "epoch": 2421} {"train_loss": -11.8964262008667, "global_step": 406768, "epoch": 2421} {"train_loss": -11.928342819213867, "global_step": 406769, "epoch": 2421} {"train_loss": -12.165300369262695, "global_step": 406770, "epoch": 2421} {"train_loss": -12.297284126281738, "global_step": 406771, "epoch": 2421} {"train_loss": -12.136697769165039, "global_step": 406772, "epoch": 2421} {"train_loss": -12.436904907226562, "global_step": 406773, "epoch": 2421} {"train_loss": -12.150970458984375, "global_step": 406774, "epoch": 2421} {"train_loss": -11.878256797790527, "global_step": 406775, "epoch": 2421} {"train_loss": -11.931623458862305, "global_step": 406776, "epoch": 2421} {"train_loss": -11.936513900756836, "global_step": 406777, "epoch": 2421} {"train_loss": -11.912132263183594, "global_step": 406778, "epoch": 2421} {"train_loss": -12.288030624389648, "global_step": 406779, "epoch": 2421} {"train_loss": -11.981175422668457, "global_step": 406780, "epoch": 2421} {"train_loss": -12.265619277954102, "global_step": 406781, "epoch": 2421} {"train_loss": -11.964847564697266, "global_step": 406782, "epoch": 2421} {"train_loss": -12.27490234375, "global_step": 406783, "epoch": 2421} {"train_loss": -12.32349967956543, "global_step": 406784, "epoch": 2421} {"train_loss": -12.324458122253418, "global_step": 406785, "epoch": 2421} {"train_loss": -12.577667236328125, "global_step": 406786, "epoch": 2421} {"train_loss": -12.243829727172852, "global_step": 406787, "epoch": 2421} {"train_loss": -12.239835739135742, "global_step": 406788, "epoch": 2421} {"train_loss": -12.326560974121094, "global_step": 406789, "epoch": 2421} {"train_loss": -12.468825340270996, "global_step": 406790, "epoch": 2421} {"train_loss": -12.066173553466797, "global_step": 406791, "epoch": 2421} {"train_loss": -12.369911193847656, "global_step": 406792, "epoch": 2421} {"train_loss": -12.13508129119873, "global_step": 406793, "epoch": 2421} {"train_loss": -12.29214859008789, "global_step": 406794, "epoch": 2421} {"train_loss": -12.429389953613281, "global_step": 406795, "epoch": 2421} {"train_loss": -12.10564136505127, "global_step": 406796, "epoch": 2421} {"train_loss": -12.392616271972656, "global_step": 406797, "epoch": 2421} {"train_loss": -12.343827247619629, "global_step": 406798, "epoch": 2421} {"train_loss": -12.263721466064453, "global_step": 406799, "epoch": 2421} {"train_loss": -12.263372421264648, "global_step": 406800, "epoch": 2421} {"train_loss": -12.070047378540039, "global_step": 406801, "epoch": 2421} {"train_loss": -12.130477905273438, "global_step": 406802, "epoch": 2421} {"train_loss": -12.324405670166016, "global_step": 406803, "epoch": 2421} {"train_loss": -12.177361488342285, "global_step": 406804, "epoch": 2421} {"train_loss": -12.40719985961914, "global_step": 406805, "epoch": 2421} {"train_loss": -11.994258880615234, "global_step": 406806, "epoch": 2421} {"train_loss": -12.322688102722168, "global_step": 406807, "epoch": 2421} {"train_loss": -12.268816947937012, "global_step": 406808, "epoch": 2421} {"train_loss": -12.296725273132324, "global_step": 406809, "epoch": 2421} {"train_loss": -12.699871063232422, "global_step": 406810, "epoch": 2421} {"train_loss": -12.362601280212402, "global_step": 406811, "epoch": 2421} {"train_loss": -12.72665023803711, "global_step": 406812, "epoch": 2421} {"train_loss": -12.291755676269531, "global_step": 406813, "epoch": 2421} {"train_loss": -12.493268966674805, "global_step": 406814, "epoch": 2421} {"train_loss": -12.553445816040039, "global_step": 406815, "epoch": 2421} {"train_loss": -12.396127700805664, "global_step": 406816, "epoch": 2421} {"train_loss": -12.52800178527832, "global_step": 406817, "epoch": 2421} {"train_loss": -12.31198501586914, "global_step": 406818, "epoch": 2421} {"train_loss": -12.215461730957031, "global_step": 406819, "epoch": 2421} {"train_loss": -12.466693878173828, "global_step": 406820, "epoch": 2421} {"train_loss": -12.28947925567627, "global_step": 406821, "epoch": 2421} {"train_loss": -12.086854934692383, "global_step": 406822, "epoch": 2421} {"train_loss": -12.450434684753418, "global_step": 406823, "epoch": 2421} {"train_loss": -12.049705505371094, "global_step": 406824, "epoch": 2421} {"train_loss": -12.349512100219727, "global_step": 406825, "epoch": 2421} {"train_loss": -12.04245662689209, "global_step": 406826, "epoch": 2421} {"train_loss": -12.409732818603516, "global_step": 406827, "epoch": 2421} {"train_loss": -12.250484466552734, "global_step": 406828, "epoch": 2421} {"train_loss": -12.430625915527344, "global_step": 406829, "epoch": 2421} {"train_loss": -12.468631744384766, "global_step": 406830, "epoch": 2421} {"train_loss": -12.497915267944336, "global_step": 406831, "epoch": 2421} {"train_loss": -12.342066764831543, "global_step": 406832, "epoch": 2421} {"train_loss": -12.79770278930664, "global_step": 406833, "epoch": 2421} {"train_loss": -12.328154563903809, "global_step": 406834, "epoch": 2421} {"train_loss": -12.320087432861328, "global_step": 406835, "epoch": 2421} {"train_loss": -12.414190292358398, "global_step": 406836, "epoch": 2421} {"train_loss": -11.933708190917969, "global_step": 406837, "epoch": 2421} {"train_loss": -12.318982124328613, "global_step": 406838, "epoch": 2421} {"train_loss": -12.205730438232422, "global_step": 406839, "epoch": 2421} {"train_loss": -12.409111022949219, "global_step": 406840, "epoch": 2421} {"train_loss": -12.676840782165527, "global_step": 406841, "epoch": 2421} {"train_loss": -12.442537307739258, "global_step": 406842, "epoch": 2421} {"train_loss": -12.700017929077148, "global_step": 406843, "epoch": 2421} {"train_loss": -12.347725868225098, "global_step": 406844, "epoch": 2421} {"train_loss": -11.862192153930664, "global_step": 406845, "epoch": 2421} {"train_loss": -12.251659393310547, "global_step": 406846, "epoch": 2421} {"train_loss": -11.723089218139648, "global_step": 406847, "epoch": 2421} {"train_loss": -12.606317520141602, "global_step": 406848, "epoch": 2421} {"train_loss": -12.104068756103516, "global_step": 406849, "epoch": 2421} {"train_loss": -12.304046630859375, "global_step": 406850, "epoch": 2421} {"train_loss": -12.512514114379883, "global_step": 406851, "epoch": 2421} {"train_loss": -12.305875778198242, "global_step": 406852, "epoch": 2421} {"train_loss": -12.621431350708008, "global_step": 406853, "epoch": 2421} {"train_loss": -11.897722244262695, "global_step": 406854, "epoch": 2421} {"train_loss": -11.830217361450195, "global_step": 406855, "epoch": 2421} {"train_loss": -12.048301696777344, "global_step": 406856, "epoch": 2421} {"train_loss": -11.826722145080566, "global_step": 406857, "epoch": 2421} {"train_loss": -12.253498077392578, "global_step": 406858, "epoch": 2421} {"train_loss": -10.774736404418945, "global_step": 406859, "epoch": 2421} {"train_loss": -12.078691482543945, "global_step": 406860, "epoch": 2421} {"train_loss": -11.281304359436035, "global_step": 406861, "epoch": 2421} {"train_loss": -11.6566162109375, "global_step": 406862, "epoch": 2421} {"train_loss": -11.41061019897461, "global_step": 406863, "epoch": 2421} {"train_loss": -12.04896354675293, "global_step": 406864, "epoch": 2421} {"train_loss": -11.572161674499512, "global_step": 406865, "epoch": 2421} {"train_loss": -12.06620979309082, "global_step": 406866, "epoch": 2421} {"train_loss": -11.473556518554688, "global_step": 406867, "epoch": 2421} {"train_loss": -12.254854202270508, "global_step": 406868, "epoch": 2421} {"train_loss": -11.667874336242676, "global_step": 406869, "epoch": 2421} {"train_loss": -11.934741973876953, "global_step": 406870, "epoch": 2421} {"train_loss": -11.944618225097656, "global_step": 406871, "epoch": 2421} {"train_loss": -12.272817611694336, "global_step": 406872, "epoch": 2421} {"train_loss": -12.177215576171875, "global_step": 406873, "epoch": 2421} {"train_loss": -11.637653350830078, "global_step": 406874, "epoch": 2421} {"train_loss": -12.31784439086914, "global_step": 406875, "epoch": 2421} {"train_loss": -11.366339683532715, "global_step": 406876, "epoch": 2421} {"train_loss": -12.227339744567871, "global_step": 406877, "epoch": 2421} {"train_loss": -11.081073760986328, "global_step": 406878, "epoch": 2421} {"train_loss": -12.326713562011719, "global_step": 406879, "epoch": 2421} {"train_loss": -11.396777153015137, "global_step": 406880, "epoch": 2421} {"train_loss": -12.056147575378418, "global_step": 406881, "epoch": 2421} {"train_loss": -11.452381134033203, "global_step": 406882, "epoch": 2421} {"train_loss": -12.292034149169922, "global_step": 406883, "epoch": 2421} {"train_loss": -11.487544059753418, "global_step": 406884, "epoch": 2421} {"train_loss": -11.927228927612305, "global_step": 406885, "epoch": 2421} {"train_loss": -11.25137710571289, "global_step": 406886, "epoch": 2421} {"train_loss": -11.529411315917969, "global_step": 406887, "epoch": 2421} {"train_loss": -11.068449974060059, "global_step": 406888, "epoch": 2421} {"train_loss": -11.373285293579102, "global_step": 406889, "epoch": 2421} {"train_loss": -11.598810195922852, "global_step": 406890, "epoch": 2421} {"train_loss": -11.229903221130371, "global_step": 406891, "epoch": 2421} {"train_loss": -11.615459442138672, "global_step": 406892, "epoch": 2421} {"train_loss": -11.915907859802246, "global_step": 406893, "epoch": 2421} {"train_loss": -11.266810417175293, "global_step": 406894, "epoch": 2421} {"train_loss": -11.999048868815104, "global_step": 406895, "epoch": 2421, "val_loss": 306904.125} {"train_loss": -11.940322875976562, "global_step": 406896, "epoch": 2422} {"train_loss": -11.216296195983887, "global_step": 406897, "epoch": 2422} {"train_loss": -11.961389541625977, "global_step": 406898, "epoch": 2422} {"train_loss": -11.844551086425781, "global_step": 406899, "epoch": 2422} {"train_loss": -11.311203002929688, "global_step": 406900, "epoch": 2422} {"train_loss": -11.622005462646484, "global_step": 406901, "epoch": 2422} {"train_loss": -12.047381401062012, "global_step": 406902, "epoch": 2422} {"train_loss": -11.248231887817383, "global_step": 406903, "epoch": 2422} {"train_loss": -11.964006423950195, "global_step": 406904, "epoch": 2422} {"train_loss": -9.766237258911133, "global_step": 406905, "epoch": 2422} {"train_loss": -10.809306144714355, "global_step": 406906, "epoch": 2422} {"train_loss": -10.176868438720703, "global_step": 406907, "epoch": 2422} {"train_loss": -10.419942855834961, "global_step": 406908, "epoch": 2422} {"train_loss": -8.910057067871094, "global_step": 406909, "epoch": 2422} {"train_loss": -10.166553497314453, "global_step": 406910, "epoch": 2422} {"train_loss": -9.181930541992188, "global_step": 406911, "epoch": 2422} {"train_loss": -9.894478797912598, "global_step": 406912, "epoch": 2422} {"train_loss": -10.767111778259277, "global_step": 406913, "epoch": 2422} {"train_loss": -10.43587589263916, "global_step": 406914, "epoch": 2422} {"train_loss": -10.752893447875977, "global_step": 406915, "epoch": 2422} {"train_loss": -10.904766082763672, "global_step": 406916, "epoch": 2422} {"train_loss": -9.572132110595703, "global_step": 406917, "epoch": 2422} {"train_loss": -10.629119873046875, "global_step": 406918, "epoch": 2422} {"train_loss": -10.051620483398438, "global_step": 406919, "epoch": 2422} {"train_loss": -10.798613548278809, "global_step": 406920, "epoch": 2422} {"train_loss": -9.24650764465332, "global_step": 406921, "epoch": 2422} {"train_loss": -9.538215637207031, "global_step": 406922, "epoch": 2422} {"train_loss": -11.47149658203125, "global_step": 406923, "epoch": 2422} {"train_loss": -9.713643074035645, "global_step": 406924, "epoch": 2422} {"train_loss": -10.971412658691406, "global_step": 406925, "epoch": 2422} {"train_loss": -10.776517868041992, "global_step": 406926, "epoch": 2422} {"train_loss": -11.279491424560547, "global_step": 406927, "epoch": 2422} {"train_loss": -11.060232162475586, "global_step": 406928, "epoch": 2422} {"train_loss": -11.548563957214355, "global_step": 406929, "epoch": 2422} {"train_loss": -11.312507629394531, "global_step": 406930, "epoch": 2422} {"train_loss": -11.003948211669922, "global_step": 406931, "epoch": 2422} {"train_loss": -11.82411003112793, "global_step": 406932, "epoch": 2422} {"train_loss": -11.7901611328125, "global_step": 406933, "epoch": 2422} {"train_loss": -11.872289657592773, "global_step": 406934, "epoch": 2422} {"train_loss": -11.819421768188477, "global_step": 406935, "epoch": 2422} {"train_loss": -11.962919235229492, "global_step": 406936, "epoch": 2422} {"train_loss": -12.131808280944824, "global_step": 406937, "epoch": 2422} {"train_loss": -12.00202751159668, "global_step": 406938, "epoch": 2422} {"train_loss": -11.211585998535156, "global_step": 406939, "epoch": 2422} {"train_loss": -11.830806732177734, "global_step": 406940, "epoch": 2422} {"train_loss": -11.27989673614502, "global_step": 406941, "epoch": 2422} {"train_loss": -11.87959098815918, "global_step": 406942, "epoch": 2422} {"train_loss": -10.976133346557617, "global_step": 406943, "epoch": 2422} {"train_loss": -11.426584243774414, "global_step": 406944, "epoch": 2422} {"train_loss": -11.928770065307617, "global_step": 406945, "epoch": 2422} {"train_loss": -11.752294540405273, "global_step": 406946, "epoch": 2422} {"train_loss": -11.489569664001465, "global_step": 406947, "epoch": 2422} {"train_loss": -12.181289672851562, "global_step": 406948, "epoch": 2422} {"train_loss": -11.308538436889648, "global_step": 406949, "epoch": 2422} {"train_loss": -11.422347068786621, "global_step": 406950, "epoch": 2422} {"train_loss": -11.798359870910645, "global_step": 406951, "epoch": 2422} {"train_loss": -12.007171630859375, "global_step": 406952, "epoch": 2422} {"train_loss": -11.610111236572266, "global_step": 406953, "epoch": 2422} {"train_loss": -12.110298156738281, "global_step": 406954, "epoch": 2422} {"train_loss": -11.535091400146484, "global_step": 406955, "epoch": 2422} {"train_loss": -12.26319694519043, "global_step": 406956, "epoch": 2422} {"train_loss": -11.931958198547363, "global_step": 406957, "epoch": 2422} {"train_loss": -12.296338081359863, "global_step": 406958, "epoch": 2422} {"train_loss": -11.798528671264648, "global_step": 406959, "epoch": 2422} {"train_loss": -12.305054664611816, "global_step": 406960, "epoch": 2422} {"train_loss": -12.023903846740723, "global_step": 406961, "epoch": 2422} {"train_loss": -12.131265640258789, "global_step": 406962, "epoch": 2422} {"train_loss": -12.372268676757812, "global_step": 406963, "epoch": 2422} {"train_loss": -12.30996036529541, "global_step": 406964, "epoch": 2422} {"train_loss": -12.130683898925781, "global_step": 406965, "epoch": 2422} {"train_loss": -12.202280044555664, "global_step": 406966, "epoch": 2422} {"train_loss": -12.390510559082031, "global_step": 406967, "epoch": 2422} {"train_loss": -11.97647476196289, "global_step": 406968, "epoch": 2422} {"train_loss": -12.336736679077148, "global_step": 406969, "epoch": 2422} {"train_loss": -12.366106986999512, "global_step": 406970, "epoch": 2422} {"train_loss": -12.327048301696777, "global_step": 406971, "epoch": 2422} {"train_loss": -12.333351135253906, "global_step": 406972, "epoch": 2422} {"train_loss": -12.504520416259766, "global_step": 406973, "epoch": 2422} {"train_loss": -12.472137451171875, "global_step": 406974, "epoch": 2422} {"train_loss": -12.460552215576172, "global_step": 406975, "epoch": 2422} {"train_loss": -12.377692222595215, "global_step": 406976, "epoch": 2422} {"train_loss": -12.616294860839844, "global_step": 406977, "epoch": 2422} {"train_loss": -12.338493347167969, "global_step": 406978, "epoch": 2422} {"train_loss": -12.430761337280273, "global_step": 406979, "epoch": 2422} {"train_loss": -12.397214889526367, "global_step": 406980, "epoch": 2422} {"train_loss": -12.400419235229492, "global_step": 406981, "epoch": 2422} {"train_loss": -12.615339279174805, "global_step": 406982, "epoch": 2422} {"train_loss": -12.474541664123535, "global_step": 406983, "epoch": 2422} {"train_loss": -12.519469261169434, "global_step": 406984, "epoch": 2422} {"train_loss": -12.571487426757812, "global_step": 406985, "epoch": 2422} {"train_loss": -12.482481002807617, "global_step": 406986, "epoch": 2422} {"train_loss": -12.484343528747559, "global_step": 406987, "epoch": 2422} {"train_loss": -12.32457447052002, "global_step": 406988, "epoch": 2422} {"train_loss": -12.340961456298828, "global_step": 406989, "epoch": 2422} {"train_loss": -12.756574630737305, "global_step": 406990, "epoch": 2422} {"train_loss": -12.62083911895752, "global_step": 406991, "epoch": 2422} {"train_loss": -12.660980224609375, "global_step": 406992, "epoch": 2422} {"train_loss": -12.634147644042969, "global_step": 406993, "epoch": 2422} {"train_loss": -12.493419647216797, "global_step": 406994, "epoch": 2422} {"train_loss": -12.745138168334961, "global_step": 406995, "epoch": 2422} {"train_loss": -12.47871208190918, "global_step": 406996, "epoch": 2422} {"train_loss": -12.617693901062012, "global_step": 406997, "epoch": 2422} {"train_loss": -12.68333625793457, "global_step": 406998, "epoch": 2422} {"train_loss": -12.604660987854004, "global_step": 406999, "epoch": 2422} {"train_loss": -12.527223587036133, "global_step": 407000, "epoch": 2422} {"train_loss": -12.79179573059082, "global_step": 407001, "epoch": 2422} {"train_loss": -12.771685600280762, "global_step": 407002, "epoch": 2422} {"train_loss": -12.553108215332031, "global_step": 407003, "epoch": 2422} {"train_loss": -12.73318099975586, "global_step": 407004, "epoch": 2422} {"train_loss": -12.789665222167969, "global_step": 407005, "epoch": 2422} {"train_loss": -12.412515640258789, "global_step": 407006, "epoch": 2422} {"train_loss": -12.651366233825684, "global_step": 407007, "epoch": 2422} {"train_loss": -12.521565437316895, "global_step": 407008, "epoch": 2422} {"train_loss": -12.642363548278809, "global_step": 407009, "epoch": 2422} {"train_loss": -12.55373764038086, "global_step": 407010, "epoch": 2422} {"train_loss": -12.58509635925293, "global_step": 407011, "epoch": 2422} {"train_loss": -12.763252258300781, "global_step": 407012, "epoch": 2422} {"train_loss": -12.439493179321289, "global_step": 407013, "epoch": 2422} {"train_loss": -12.5106201171875, "global_step": 407014, "epoch": 2422} {"train_loss": -12.690084457397461, "global_step": 407015, "epoch": 2422} {"train_loss": -12.755476951599121, "global_step": 407016, "epoch": 2422} {"train_loss": -12.48408317565918, "global_step": 407017, "epoch": 2422} {"train_loss": -12.8419189453125, "global_step": 407018, "epoch": 2422} {"train_loss": -12.197237968444824, "global_step": 407019, "epoch": 2422} {"train_loss": -12.071887969970703, "global_step": 407020, "epoch": 2422} {"train_loss": -12.478036880493164, "global_step": 407021, "epoch": 2422} {"train_loss": -12.744789123535156, "global_step": 407022, "epoch": 2422} {"train_loss": -12.17464828491211, "global_step": 407023, "epoch": 2422} {"train_loss": -12.587347030639648, "global_step": 407024, "epoch": 2422} {"train_loss": -12.33095932006836, "global_step": 407025, "epoch": 2422} {"train_loss": -12.274468421936035, "global_step": 407026, "epoch": 2422} {"train_loss": -12.305644989013672, "global_step": 407027, "epoch": 2422} {"train_loss": -12.634078025817871, "global_step": 407028, "epoch": 2422} {"train_loss": -12.366393089294434, "global_step": 407029, "epoch": 2422} {"train_loss": -12.678994178771973, "global_step": 407030, "epoch": 2422} {"train_loss": -12.213794708251953, "global_step": 407031, "epoch": 2422} {"train_loss": -12.269735336303711, "global_step": 407032, "epoch": 2422} {"train_loss": -12.670634269714355, "global_step": 407033, "epoch": 2422} {"train_loss": -12.605937004089355, "global_step": 407034, "epoch": 2422} {"train_loss": -12.449810028076172, "global_step": 407035, "epoch": 2422} {"train_loss": -12.442083358764648, "global_step": 407036, "epoch": 2422} {"train_loss": -12.11379623413086, "global_step": 407037, "epoch": 2422} {"train_loss": -12.593929290771484, "global_step": 407038, "epoch": 2422} {"train_loss": -12.29423713684082, "global_step": 407039, "epoch": 2422} {"train_loss": -12.532724380493164, "global_step": 407040, "epoch": 2422} {"train_loss": -12.613943099975586, "global_step": 407041, "epoch": 2422} {"train_loss": -12.797672271728516, "global_step": 407042, "epoch": 2422} {"train_loss": -12.64089584350586, "global_step": 407043, "epoch": 2422} {"train_loss": -12.507448196411133, "global_step": 407044, "epoch": 2422} {"train_loss": -12.463748931884766, "global_step": 407045, "epoch": 2422} {"train_loss": -12.188248634338379, "global_step": 407046, "epoch": 2422} {"train_loss": -12.498215675354004, "global_step": 407047, "epoch": 2422} {"train_loss": -12.197260856628418, "global_step": 407048, "epoch": 2422} {"train_loss": -12.710329055786133, "global_step": 407049, "epoch": 2422} {"train_loss": -12.386479377746582, "global_step": 407050, "epoch": 2422} {"train_loss": -12.040070533752441, "global_step": 407051, "epoch": 2422} {"train_loss": -12.627817153930664, "global_step": 407052, "epoch": 2422} {"train_loss": -12.796686172485352, "global_step": 407053, "epoch": 2422} {"train_loss": -12.276756286621094, "global_step": 407054, "epoch": 2422} {"train_loss": -12.368038177490234, "global_step": 407055, "epoch": 2422} {"train_loss": -12.343199729919434, "global_step": 407056, "epoch": 2422} {"train_loss": -12.350305557250977, "global_step": 407057, "epoch": 2422} {"train_loss": -12.17910385131836, "global_step": 407058, "epoch": 2422} {"train_loss": -12.714029312133789, "global_step": 407059, "epoch": 2422} {"train_loss": -12.09338092803955, "global_step": 407060, "epoch": 2422} {"train_loss": -11.100096702575684, "global_step": 407061, "epoch": 2422} {"train_loss": -11.023457527160645, "global_step": 407062, "epoch": 2422} {"train_loss": -11.959191651571365, "global_step": 407063, "epoch": 2422, "val_loss": 303672.5625} {"train_loss": -12.030292510986328, "global_step": 407064, "epoch": 2423} {"train_loss": -11.288259506225586, "global_step": 407065, "epoch": 2423} {"train_loss": -11.775857925415039, "global_step": 407066, "epoch": 2423} {"train_loss": -11.774907112121582, "global_step": 407067, "epoch": 2423} {"train_loss": -11.458549499511719, "global_step": 407068, "epoch": 2423} {"train_loss": -12.167316436767578, "global_step": 407069, "epoch": 2423} {"train_loss": -11.893482208251953, "global_step": 407070, "epoch": 2423} {"train_loss": -11.582910537719727, "global_step": 407071, "epoch": 2423} {"train_loss": -11.879389762878418, "global_step": 407072, "epoch": 2423} {"train_loss": -11.920321464538574, "global_step": 407073, "epoch": 2423} {"train_loss": -12.474504470825195, "global_step": 407074, "epoch": 2423} {"train_loss": -12.265260696411133, "global_step": 407075, "epoch": 2423} {"train_loss": -11.927966117858887, "global_step": 407076, "epoch": 2423} {"train_loss": -11.682012557983398, "global_step": 407077, "epoch": 2423} {"train_loss": -12.020811080932617, "global_step": 407078, "epoch": 2423} {"train_loss": -11.190189361572266, "global_step": 407079, "epoch": 2423} {"train_loss": -12.091398239135742, "global_step": 407080, "epoch": 2423} {"train_loss": -11.380013465881348, "global_step": 407081, "epoch": 2423} {"train_loss": -10.219533920288086, "global_step": 407082, "epoch": 2423} {"train_loss": -11.060328483581543, "global_step": 407083, "epoch": 2423} {"train_loss": -10.226849555969238, "global_step": 407084, "epoch": 2423} {"train_loss": -11.14749526977539, "global_step": 407085, "epoch": 2423} {"train_loss": -8.944263458251953, "global_step": 407086, "epoch": 2423} {"train_loss": -10.669820785522461, "global_step": 407087, "epoch": 2423} {"train_loss": -9.010576248168945, "global_step": 407088, "epoch": 2423} {"train_loss": -10.600890159606934, "global_step": 407089, "epoch": 2423} {"train_loss": -9.037397384643555, "global_step": 407090, "epoch": 2423} {"train_loss": -11.382946968078613, "global_step": 407091, "epoch": 2423} {"train_loss": -9.324783325195312, "global_step": 407092, "epoch": 2423} {"train_loss": -11.204940795898438, "global_step": 407093, "epoch": 2423} {"train_loss": -10.441781997680664, "global_step": 407094, "epoch": 2423} {"train_loss": -10.645393371582031, "global_step": 407095, "epoch": 2423} {"train_loss": -10.533512115478516, "global_step": 407096, "epoch": 2423} {"train_loss": -11.356057167053223, "global_step": 407097, "epoch": 2423} {"train_loss": -11.315101623535156, "global_step": 407098, "epoch": 2423} {"train_loss": -12.04151725769043, "global_step": 407099, "epoch": 2423} {"train_loss": -11.036138534545898, "global_step": 407100, "epoch": 2423} {"train_loss": -11.608253479003906, "global_step": 407101, "epoch": 2423} {"train_loss": -11.467428207397461, "global_step": 407102, "epoch": 2423} {"train_loss": -11.826433181762695, "global_step": 407103, "epoch": 2423} {"train_loss": -11.657485008239746, "global_step": 407104, "epoch": 2423} {"train_loss": -11.42793083190918, "global_step": 407105, "epoch": 2423} {"train_loss": -11.401399612426758, "global_step": 407106, "epoch": 2423} {"train_loss": -11.884062767028809, "global_step": 407107, "epoch": 2423} {"train_loss": -12.11713981628418, "global_step": 407108, "epoch": 2423} {"train_loss": -12.148963928222656, "global_step": 407109, "epoch": 2423} {"train_loss": -11.551067352294922, "global_step": 407110, "epoch": 2423} {"train_loss": -11.792181015014648, "global_step": 407111, "epoch": 2423} {"train_loss": -11.930793762207031, "global_step": 407112, "epoch": 2423} {"train_loss": -11.630813598632812, "global_step": 407113, "epoch": 2423} {"train_loss": -11.64302921295166, "global_step": 407114, "epoch": 2423} {"train_loss": -11.907742500305176, "global_step": 407115, "epoch": 2423} {"train_loss": -11.937904357910156, "global_step": 407116, "epoch": 2423} {"train_loss": -11.915849685668945, "global_step": 407117, "epoch": 2423} {"train_loss": -11.751716613769531, "global_step": 407118, "epoch": 2423} {"train_loss": -12.204279899597168, "global_step": 407119, "epoch": 2423} {"train_loss": -11.946981430053711, "global_step": 407120, "epoch": 2423} {"train_loss": -12.029016494750977, "global_step": 407121, "epoch": 2423} {"train_loss": -11.741161346435547, "global_step": 407122, "epoch": 2423} {"train_loss": -12.346780776977539, "global_step": 407123, "epoch": 2423} {"train_loss": -12.069210052490234, "global_step": 407124, "epoch": 2423} {"train_loss": -12.347440719604492, "global_step": 407125, "epoch": 2423} {"train_loss": -12.198433876037598, "global_step": 407126, "epoch": 2423} {"train_loss": -12.58825397491455, "global_step": 407127, "epoch": 2423} {"train_loss": -12.357620239257812, "global_step": 407128, "epoch": 2423} {"train_loss": -12.40783405303955, "global_step": 407129, "epoch": 2423} {"train_loss": -12.352483749389648, "global_step": 407130, "epoch": 2423} {"train_loss": -12.682621002197266, "global_step": 407131, "epoch": 2423} {"train_loss": -12.066323280334473, "global_step": 407132, "epoch": 2423} {"train_loss": -12.313652038574219, "global_step": 407133, "epoch": 2423} {"train_loss": -12.426236152648926, "global_step": 407134, "epoch": 2423} {"train_loss": -12.569100379943848, "global_step": 407135, "epoch": 2423} {"train_loss": -12.465694427490234, "global_step": 407136, "epoch": 2423} {"train_loss": -12.365321159362793, "global_step": 407137, "epoch": 2423} {"train_loss": -12.4751615524292, "global_step": 407138, "epoch": 2423} {"train_loss": -12.500086784362793, "global_step": 407139, "epoch": 2423} {"train_loss": -12.2596435546875, "global_step": 407140, "epoch": 2423} {"train_loss": -12.599859237670898, "global_step": 407141, "epoch": 2423} {"train_loss": -12.497108459472656, "global_step": 407142, "epoch": 2423} {"train_loss": -12.34131145477295, "global_step": 407143, "epoch": 2423} {"train_loss": -12.525609970092773, "global_step": 407144, "epoch": 2423} {"train_loss": -12.644725799560547, "global_step": 407145, "epoch": 2423} {"train_loss": -12.250439643859863, "global_step": 407146, "epoch": 2423} {"train_loss": -12.78609848022461, "global_step": 407147, "epoch": 2423} {"train_loss": -11.895736694335938, "global_step": 407148, "epoch": 2423} {"train_loss": -12.731748580932617, "global_step": 407149, "epoch": 2423} {"train_loss": -12.318856239318848, "global_step": 407150, "epoch": 2423} {"train_loss": -12.505193710327148, "global_step": 407151, "epoch": 2423} {"train_loss": -12.547568321228027, "global_step": 407152, "epoch": 2423} {"train_loss": -12.417051315307617, "global_step": 407153, "epoch": 2423} {"train_loss": -12.448152542114258, "global_step": 407154, "epoch": 2423} {"train_loss": -12.70307731628418, "global_step": 407155, "epoch": 2423} {"train_loss": -12.675796508789062, "global_step": 407156, "epoch": 2423} {"train_loss": -12.553625106811523, "global_step": 407157, "epoch": 2423} {"train_loss": -12.5110502243042, "global_step": 407158, "epoch": 2423} {"train_loss": -12.639996528625488, "global_step": 407159, "epoch": 2423} {"train_loss": -12.519050598144531, "global_step": 407160, "epoch": 2423} {"train_loss": -12.587392807006836, "global_step": 407161, "epoch": 2423} {"train_loss": -12.696361541748047, "global_step": 407162, "epoch": 2423} {"train_loss": -12.781763076782227, "global_step": 407163, "epoch": 2423} {"train_loss": -12.655496597290039, "global_step": 407164, "epoch": 2423} {"train_loss": -12.460723876953125, "global_step": 407165, "epoch": 2423} {"train_loss": -12.501853942871094, "global_step": 407166, "epoch": 2423} {"train_loss": -12.73691177368164, "global_step": 407167, "epoch": 2423} {"train_loss": -12.556872367858887, "global_step": 407168, "epoch": 2423} {"train_loss": -12.660320281982422, "global_step": 407169, "epoch": 2423} {"train_loss": -12.557622909545898, "global_step": 407170, "epoch": 2423} {"train_loss": -12.624391555786133, "global_step": 407171, "epoch": 2423} {"train_loss": -12.578147888183594, "global_step": 407172, "epoch": 2423} {"train_loss": -12.521745681762695, "global_step": 407173, "epoch": 2423} {"train_loss": -12.44901180267334, "global_step": 407174, "epoch": 2423} {"train_loss": -12.050472259521484, "global_step": 407175, "epoch": 2423} {"train_loss": -12.390085220336914, "global_step": 407176, "epoch": 2423} {"train_loss": -12.4039306640625, "global_step": 407177, "epoch": 2423} {"train_loss": -12.675689697265625, "global_step": 407178, "epoch": 2423} {"train_loss": -12.511823654174805, "global_step": 407179, "epoch": 2423} {"train_loss": -12.721834182739258, "global_step": 407180, "epoch": 2423} {"train_loss": -12.140482902526855, "global_step": 407181, "epoch": 2423} {"train_loss": -12.654489517211914, "global_step": 407182, "epoch": 2423} {"train_loss": -11.868486404418945, "global_step": 407183, "epoch": 2423} {"train_loss": -12.826513290405273, "global_step": 407184, "epoch": 2423} {"train_loss": -12.45365047454834, "global_step": 407185, "epoch": 2423} {"train_loss": -12.271028518676758, "global_step": 407186, "epoch": 2423} {"train_loss": -12.786685943603516, "global_step": 407187, "epoch": 2423} {"train_loss": -12.891819953918457, "global_step": 407188, "epoch": 2423} {"train_loss": -12.622888565063477, "global_step": 407189, "epoch": 2423} {"train_loss": -12.441579818725586, "global_step": 407190, "epoch": 2423} {"train_loss": -12.767534255981445, "global_step": 407191, "epoch": 2423} {"train_loss": -12.194936752319336, "global_step": 407192, "epoch": 2423} {"train_loss": -12.782854080200195, "global_step": 407193, "epoch": 2423} {"train_loss": -12.588362693786621, "global_step": 407194, "epoch": 2423} {"train_loss": -12.122974395751953, "global_step": 407195, "epoch": 2423} {"train_loss": -12.104766845703125, "global_step": 407196, "epoch": 2423} {"train_loss": -12.607772827148438, "global_step": 407197, "epoch": 2423} {"train_loss": -12.476561546325684, "global_step": 407198, "epoch": 2423} {"train_loss": -11.70332145690918, "global_step": 407199, "epoch": 2423} {"train_loss": -12.529111862182617, "global_step": 407200, "epoch": 2423} {"train_loss": -12.637344360351562, "global_step": 407201, "epoch": 2423} {"train_loss": -12.647651672363281, "global_step": 407202, "epoch": 2423} {"train_loss": -12.263883590698242, "global_step": 407203, "epoch": 2423} {"train_loss": -12.714542388916016, "global_step": 407204, "epoch": 2423} {"train_loss": -12.316167831420898, "global_step": 407205, "epoch": 2423} {"train_loss": -11.963860511779785, "global_step": 407206, "epoch": 2423} {"train_loss": -11.86386489868164, "global_step": 407207, "epoch": 2423} {"train_loss": -12.560579299926758, "global_step": 407208, "epoch": 2423} {"train_loss": -11.65022087097168, "global_step": 407209, "epoch": 2423} {"train_loss": -12.332681655883789, "global_step": 407210, "epoch": 2423} {"train_loss": -11.868721008300781, "global_step": 407211, "epoch": 2423} {"train_loss": -10.615131378173828, "global_step": 407212, "epoch": 2423} {"train_loss": -11.191280364990234, "global_step": 407213, "epoch": 2423} {"train_loss": -11.078348159790039, "global_step": 407214, "epoch": 2423} {"train_loss": -9.84444808959961, "global_step": 407215, "epoch": 2423} {"train_loss": -10.04833984375, "global_step": 407216, "epoch": 2423} {"train_loss": -10.582352638244629, "global_step": 407217, "epoch": 2423} {"train_loss": -9.867067337036133, "global_step": 407218, "epoch": 2423} {"train_loss": -9.923694610595703, "global_step": 407219, "epoch": 2423} {"train_loss": -9.427144050598145, "global_step": 407220, "epoch": 2423} {"train_loss": -10.850871086120605, "global_step": 407221, "epoch": 2423} {"train_loss": -10.118353843688965, "global_step": 407222, "epoch": 2423} {"train_loss": -9.055365562438965, "global_step": 407223, "epoch": 2423} {"train_loss": -11.609943389892578, "global_step": 407224, "epoch": 2423} {"train_loss": -8.839512825012207, "global_step": 407225, "epoch": 2423} {"train_loss": -10.326118469238281, "global_step": 407226, "epoch": 2423} {"train_loss": -10.774826049804688, "global_step": 407227, "epoch": 2423} {"train_loss": -10.240943908691406, "global_step": 407228, "epoch": 2423} {"train_loss": -11.210816383361816, "global_step": 407229, "epoch": 2423} {"train_loss": -11.450652122497559, "global_step": 407230, "epoch": 2423} {"train_loss": -11.837486403329033, "global_step": 407231, "epoch": 2423, "val_loss": 298707.875} {"train_loss": -10.590599060058594, "global_step": 407232, "epoch": 2424} {"train_loss": -11.30398941040039, "global_step": 407233, "epoch": 2424} {"train_loss": -10.701948165893555, "global_step": 407234, "epoch": 2424} {"train_loss": -10.942523956298828, "global_step": 407235, "epoch": 2424} {"train_loss": -10.743829727172852, "global_step": 407236, "epoch": 2424} {"train_loss": -11.478300094604492, "global_step": 407237, "epoch": 2424} {"train_loss": -11.208723068237305, "global_step": 407238, "epoch": 2424} {"train_loss": -10.896620750427246, "global_step": 407239, "epoch": 2424} {"train_loss": -11.541534423828125, "global_step": 407240, "epoch": 2424} {"train_loss": -11.324748992919922, "global_step": 407241, "epoch": 2424} {"train_loss": -11.650157928466797, "global_step": 407242, "epoch": 2424} {"train_loss": -11.06982707977295, "global_step": 407243, "epoch": 2424} {"train_loss": -10.938150405883789, "global_step": 407244, "epoch": 2424} {"train_loss": -11.739053726196289, "global_step": 407245, "epoch": 2424} {"train_loss": -10.535523414611816, "global_step": 407246, "epoch": 2424} {"train_loss": -11.69990062713623, "global_step": 407247, "epoch": 2424} {"train_loss": -10.899898529052734, "global_step": 407248, "epoch": 2424} {"train_loss": -11.94192886352539, "global_step": 407249, "epoch": 2424} {"train_loss": -9.850812911987305, "global_step": 407250, "epoch": 2424} {"train_loss": -12.010531425476074, "global_step": 407251, "epoch": 2424} {"train_loss": -10.624277114868164, "global_step": 407252, "epoch": 2424} {"train_loss": -11.620330810546875, "global_step": 407253, "epoch": 2424} {"train_loss": -11.921255111694336, "global_step": 407254, "epoch": 2424} {"train_loss": -11.277462005615234, "global_step": 407255, "epoch": 2424} {"train_loss": -12.193357467651367, "global_step": 407256, "epoch": 2424} {"train_loss": -11.502668380737305, "global_step": 407257, "epoch": 2424} {"train_loss": -11.456157684326172, "global_step": 407258, "epoch": 2424} {"train_loss": -11.807973861694336, "global_step": 407259, "epoch": 2424} {"train_loss": -11.009319305419922, "global_step": 407260, "epoch": 2424} {"train_loss": -11.939092636108398, "global_step": 407261, "epoch": 2424} {"train_loss": -11.39175033569336, "global_step": 407262, "epoch": 2424} {"train_loss": -11.290555953979492, "global_step": 407263, "epoch": 2424} {"train_loss": -11.257596015930176, "global_step": 407264, "epoch": 2424} {"train_loss": -11.73554801940918, "global_step": 407265, "epoch": 2424} {"train_loss": -11.165210723876953, "global_step": 407266, "epoch": 2424} {"train_loss": -11.501952171325684, "global_step": 407267, "epoch": 2424} {"train_loss": -11.185775756835938, "global_step": 407268, "epoch": 2424} {"train_loss": -11.589409828186035, "global_step": 407269, "epoch": 2424} {"train_loss": -11.57455825805664, "global_step": 407270, "epoch": 2424} {"train_loss": -11.519163131713867, "global_step": 407271, "epoch": 2424} {"train_loss": -11.489482879638672, "global_step": 407272, "epoch": 2424} {"train_loss": -11.500490188598633, "global_step": 407273, "epoch": 2424} {"train_loss": -11.578399658203125, "global_step": 407274, "epoch": 2424} {"train_loss": -11.66545581817627, "global_step": 407275, "epoch": 2424} {"train_loss": -11.60877799987793, "global_step": 407276, "epoch": 2424} {"train_loss": -11.934794425964355, "global_step": 407277, "epoch": 2424} {"train_loss": -11.75417423248291, "global_step": 407278, "epoch": 2424} {"train_loss": -11.905828475952148, "global_step": 407279, "epoch": 2424} {"train_loss": -11.77103328704834, "global_step": 407280, "epoch": 2424} {"train_loss": -12.098793983459473, "global_step": 407281, "epoch": 2424} {"train_loss": -11.937759399414062, "global_step": 407282, "epoch": 2424} {"train_loss": -12.139068603515625, "global_step": 407283, "epoch": 2424} {"train_loss": -11.946358680725098, "global_step": 407284, "epoch": 2424} {"train_loss": -12.120757102966309, "global_step": 407285, "epoch": 2424} {"train_loss": -12.299773216247559, "global_step": 407286, "epoch": 2424} {"train_loss": -11.942394256591797, "global_step": 407287, "epoch": 2424} {"train_loss": -12.052156448364258, "global_step": 407288, "epoch": 2424} {"train_loss": -12.023857116699219, "global_step": 407289, "epoch": 2424} {"train_loss": -12.164897918701172, "global_step": 407290, "epoch": 2424} {"train_loss": -12.077089309692383, "global_step": 407291, "epoch": 2424} {"train_loss": -12.3551664352417, "global_step": 407292, "epoch": 2424} {"train_loss": -12.01764965057373, "global_step": 407293, "epoch": 2424} {"train_loss": -12.172060012817383, "global_step": 407294, "epoch": 2424} {"train_loss": -12.289459228515625, "global_step": 407295, "epoch": 2424} {"train_loss": -12.152690887451172, "global_step": 407296, "epoch": 2424} {"train_loss": -12.15003776550293, "global_step": 407297, "epoch": 2424} {"train_loss": -12.459325790405273, "global_step": 407298, "epoch": 2424} {"train_loss": -12.088094711303711, "global_step": 407299, "epoch": 2424} {"train_loss": -12.415607452392578, "global_step": 407300, "epoch": 2424} {"train_loss": -12.294004440307617, "global_step": 407301, "epoch": 2424} {"train_loss": -12.389033317565918, "global_step": 407302, "epoch": 2424} {"train_loss": -12.273042678833008, "global_step": 407303, "epoch": 2424} {"train_loss": -12.104429244995117, "global_step": 407304, "epoch": 2424} {"train_loss": -12.340036392211914, "global_step": 407305, "epoch": 2424} {"train_loss": -12.246662139892578, "global_step": 407306, "epoch": 2424} {"train_loss": -12.329117774963379, "global_step": 407307, "epoch": 2424} {"train_loss": -12.027737617492676, "global_step": 407308, "epoch": 2424} {"train_loss": -12.300832748413086, "global_step": 407309, "epoch": 2424} {"train_loss": -12.271810531616211, "global_step": 407310, "epoch": 2424} {"train_loss": -12.432770729064941, "global_step": 407311, "epoch": 2424} {"train_loss": -12.144886016845703, "global_step": 407312, "epoch": 2424} {"train_loss": -12.013313293457031, "global_step": 407313, "epoch": 2424} {"train_loss": -12.12968921661377, "global_step": 407314, "epoch": 2424} {"train_loss": -12.375865936279297, "global_step": 407315, "epoch": 2424} {"train_loss": -12.28862190246582, "global_step": 407316, "epoch": 2424} {"train_loss": -12.42642593383789, "global_step": 407317, "epoch": 2424} {"train_loss": -12.25663948059082, "global_step": 407318, "epoch": 2424} {"train_loss": -12.640868186950684, "global_step": 407319, "epoch": 2424} {"train_loss": -12.216005325317383, "global_step": 407320, "epoch": 2424} {"train_loss": -12.460293769836426, "global_step": 407321, "epoch": 2424} {"train_loss": -12.260438919067383, "global_step": 407322, "epoch": 2424} {"train_loss": -12.478200912475586, "global_step": 407323, "epoch": 2424} {"train_loss": -12.560209274291992, "global_step": 407324, "epoch": 2424} {"train_loss": -12.48542594909668, "global_step": 407325, "epoch": 2424} {"train_loss": -12.339938163757324, "global_step": 407326, "epoch": 2424} {"train_loss": -12.427118301391602, "global_step": 407327, "epoch": 2424} {"train_loss": -12.543388366699219, "global_step": 407328, "epoch": 2424} {"train_loss": -12.482307434082031, "global_step": 407329, "epoch": 2424} {"train_loss": -12.451544761657715, "global_step": 407330, "epoch": 2424} {"train_loss": -12.710159301757812, "global_step": 407331, "epoch": 2424} {"train_loss": -12.456012725830078, "global_step": 407332, "epoch": 2424} {"train_loss": -12.658913612365723, "global_step": 407333, "epoch": 2424} {"train_loss": -12.663850784301758, "global_step": 407334, "epoch": 2424} {"train_loss": -12.81755256652832, "global_step": 407335, "epoch": 2424} {"train_loss": -12.6206636428833, "global_step": 407336, "epoch": 2424} {"train_loss": -12.642643928527832, "global_step": 407337, "epoch": 2424} {"train_loss": -12.789036750793457, "global_step": 407338, "epoch": 2424} {"train_loss": -12.752583503723145, "global_step": 407339, "epoch": 2424} {"train_loss": -12.766382217407227, "global_step": 407340, "epoch": 2424} {"train_loss": -12.539148330688477, "global_step": 407341, "epoch": 2424} {"train_loss": -12.447571754455566, "global_step": 407342, "epoch": 2424} {"train_loss": -12.626358985900879, "global_step": 407343, "epoch": 2424} {"train_loss": -12.7008638381958, "global_step": 407344, "epoch": 2424} {"train_loss": -12.725509643554688, "global_step": 407345, "epoch": 2424} {"train_loss": -12.70948600769043, "global_step": 407346, "epoch": 2424} {"train_loss": -12.56244945526123, "global_step": 407347, "epoch": 2424} {"train_loss": -12.706558227539062, "global_step": 407348, "epoch": 2424} {"train_loss": -12.602733612060547, "global_step": 407349, "epoch": 2424} {"train_loss": -12.584014892578125, "global_step": 407350, "epoch": 2424} {"train_loss": -12.526233673095703, "global_step": 407351, "epoch": 2424} {"train_loss": -12.731409072875977, "global_step": 407352, "epoch": 2424} {"train_loss": -12.634732246398926, "global_step": 407353, "epoch": 2424} {"train_loss": -12.506343841552734, "global_step": 407354, "epoch": 2424} {"train_loss": -12.760622024536133, "global_step": 407355, "epoch": 2424} {"train_loss": -12.606435775756836, "global_step": 407356, "epoch": 2424} {"train_loss": -12.642797470092773, "global_step": 407357, "epoch": 2424} {"train_loss": -12.879534721374512, "global_step": 407358, "epoch": 2424} {"train_loss": -12.765097618103027, "global_step": 407359, "epoch": 2424} {"train_loss": -12.760387420654297, "global_step": 407360, "epoch": 2424} {"train_loss": -12.640495300292969, "global_step": 407361, "epoch": 2424} {"train_loss": -12.749916076660156, "global_step": 407362, "epoch": 2424} {"train_loss": -12.59939193725586, "global_step": 407363, "epoch": 2424} {"train_loss": -12.868936538696289, "global_step": 407364, "epoch": 2424} {"train_loss": -12.262776374816895, "global_step": 407365, "epoch": 2424} {"train_loss": -12.0621976852417, "global_step": 407366, "epoch": 2424} {"train_loss": -12.69648551940918, "global_step": 407367, "epoch": 2424} {"train_loss": -10.612958908081055, "global_step": 407368, "epoch": 2424} {"train_loss": -11.905362129211426, "global_step": 407369, "epoch": 2424} {"train_loss": -12.459263801574707, "global_step": 407370, "epoch": 2424} {"train_loss": -11.610309600830078, "global_step": 407371, "epoch": 2424} {"train_loss": -12.07168960571289, "global_step": 407372, "epoch": 2424} {"train_loss": -11.994277954101562, "global_step": 407373, "epoch": 2424} {"train_loss": -11.362630844116211, "global_step": 407374, "epoch": 2424} {"train_loss": -11.938133239746094, "global_step": 407375, "epoch": 2424} {"train_loss": -12.538495063781738, "global_step": 407376, "epoch": 2424} {"train_loss": -11.41727352142334, "global_step": 407377, "epoch": 2424} {"train_loss": -12.148758888244629, "global_step": 407378, "epoch": 2424} {"train_loss": -11.276622772216797, "global_step": 407379, "epoch": 2424} {"train_loss": -10.856975555419922, "global_step": 407380, "epoch": 2424} {"train_loss": -11.222320556640625, "global_step": 407381, "epoch": 2424} {"train_loss": -11.755516052246094, "global_step": 407382, "epoch": 2424} {"train_loss": -11.543695449829102, "global_step": 407383, "epoch": 2424} {"train_loss": -11.893409729003906, "global_step": 407384, "epoch": 2424} {"train_loss": -11.681875228881836, "global_step": 407385, "epoch": 2424} {"train_loss": -12.144081115722656, "global_step": 407386, "epoch": 2424} {"train_loss": -12.146707534790039, "global_step": 407387, "epoch": 2424} {"train_loss": -11.743205070495605, "global_step": 407388, "epoch": 2424} {"train_loss": -11.913623809814453, "global_step": 407389, "epoch": 2424} {"train_loss": -12.176643371582031, "global_step": 407390, "epoch": 2424} {"train_loss": -11.96310043334961, "global_step": 407391, "epoch": 2424} {"train_loss": -11.918509483337402, "global_step": 407392, "epoch": 2424} {"train_loss": -11.93699836730957, "global_step": 407393, "epoch": 2424} {"train_loss": -11.279986381530762, "global_step": 407394, "epoch": 2424} {"train_loss": -11.981985092163086, "global_step": 407395, "epoch": 2424} {"train_loss": -11.792001724243164, "global_step": 407396, "epoch": 2424} {"train_loss": -10.605854034423828, "global_step": 407397, "epoch": 2424} {"train_loss": -11.233421325683594, "global_step": 407398, "epoch": 2424} {"train_loss": -11.981465197744823, "global_step": 407399, "epoch": 2424, "val_loss": 297920.0} {"train_loss": -11.210613250732422, "global_step": 407400, "epoch": 2425} {"train_loss": -10.734271049499512, "global_step": 407401, "epoch": 2425} {"train_loss": -11.78373908996582, "global_step": 407402, "epoch": 2425} {"train_loss": -10.102888107299805, "global_step": 407403, "epoch": 2425} {"train_loss": -11.68595027923584, "global_step": 407404, "epoch": 2425} {"train_loss": -11.100317001342773, "global_step": 407405, "epoch": 2425} {"train_loss": -12.006490707397461, "global_step": 407406, "epoch": 2425} {"train_loss": -11.175108909606934, "global_step": 407407, "epoch": 2425} {"train_loss": -11.175056457519531, "global_step": 407408, "epoch": 2425} {"train_loss": -11.15507698059082, "global_step": 407409, "epoch": 2425} {"train_loss": -10.843137741088867, "global_step": 407410, "epoch": 2425} {"train_loss": -11.154788970947266, "global_step": 407411, "epoch": 2425} {"train_loss": -11.219331741333008, "global_step": 407412, "epoch": 2425} {"train_loss": -11.359755516052246, "global_step": 407413, "epoch": 2425} {"train_loss": -11.81259822845459, "global_step": 407414, "epoch": 2425} {"train_loss": -11.329935073852539, "global_step": 407415, "epoch": 2425} {"train_loss": -11.504085540771484, "global_step": 407416, "epoch": 2425} {"train_loss": -11.117847442626953, "global_step": 407417, "epoch": 2425} {"train_loss": -11.233349800109863, "global_step": 407418, "epoch": 2425} {"train_loss": -11.614513397216797, "global_step": 407419, "epoch": 2425} {"train_loss": -10.837093353271484, "global_step": 407420, "epoch": 2425} {"train_loss": -11.601197242736816, "global_step": 407421, "epoch": 2425} {"train_loss": -11.466747283935547, "global_step": 407422, "epoch": 2425} {"train_loss": -11.549600601196289, "global_step": 407423, "epoch": 2425} {"train_loss": -11.3826322555542, "global_step": 407424, "epoch": 2425} {"train_loss": -11.50617790222168, "global_step": 407425, "epoch": 2425} {"train_loss": -11.672977447509766, "global_step": 407426, "epoch": 2425} {"train_loss": -11.411635398864746, "global_step": 407427, "epoch": 2425} {"train_loss": -12.008638381958008, "global_step": 407428, "epoch": 2425} {"train_loss": -12.084877967834473, "global_step": 407429, "epoch": 2425} {"train_loss": -12.019928932189941, "global_step": 407430, "epoch": 2425} {"train_loss": -11.812543869018555, "global_step": 407431, "epoch": 2425} {"train_loss": -11.988791465759277, "global_step": 407432, "epoch": 2425} {"train_loss": -11.706253051757812, "global_step": 407433, "epoch": 2425} {"train_loss": -11.814990997314453, "global_step": 407434, "epoch": 2425} {"train_loss": -11.66893196105957, "global_step": 407435, "epoch": 2425} {"train_loss": -11.781288146972656, "global_step": 407436, "epoch": 2425} {"train_loss": -11.597774505615234, "global_step": 407437, "epoch": 2425} {"train_loss": -11.350279808044434, "global_step": 407438, "epoch": 2425} {"train_loss": -11.66108512878418, "global_step": 407439, "epoch": 2425} {"train_loss": -11.462356567382812, "global_step": 407440, "epoch": 2425} {"train_loss": -11.730510711669922, "global_step": 407441, "epoch": 2425} {"train_loss": -11.632899284362793, "global_step": 407442, "epoch": 2425} {"train_loss": -11.990646362304688, "global_step": 407443, "epoch": 2425} {"train_loss": -11.712424278259277, "global_step": 407444, "epoch": 2425} {"train_loss": -11.921575546264648, "global_step": 407445, "epoch": 2425} {"train_loss": -11.395423889160156, "global_step": 407446, "epoch": 2425} {"train_loss": -11.810935020446777, "global_step": 407447, "epoch": 2425} {"train_loss": -11.652913093566895, "global_step": 407448, "epoch": 2425} {"train_loss": -11.841888427734375, "global_step": 407449, "epoch": 2425} {"train_loss": -11.95180606842041, "global_step": 407450, "epoch": 2425} {"train_loss": -11.84526252746582, "global_step": 407451, "epoch": 2425} {"train_loss": -12.428586959838867, "global_step": 407452, "epoch": 2425} {"train_loss": -12.166383743286133, "global_step": 407453, "epoch": 2425} {"train_loss": -12.130032539367676, "global_step": 407454, "epoch": 2425} {"train_loss": -11.942480087280273, "global_step": 407455, "epoch": 2425} {"train_loss": -12.277253150939941, "global_step": 407456, "epoch": 2425} {"train_loss": -11.838054656982422, "global_step": 407457, "epoch": 2425} {"train_loss": -12.420351028442383, "global_step": 407458, "epoch": 2425} {"train_loss": -12.005245208740234, "global_step": 407459, "epoch": 2425} {"train_loss": -12.387750625610352, "global_step": 407460, "epoch": 2425} {"train_loss": -11.8762788772583, "global_step": 407461, "epoch": 2425} {"train_loss": -12.126961708068848, "global_step": 407462, "epoch": 2425} {"train_loss": -12.184564590454102, "global_step": 407463, "epoch": 2425} {"train_loss": -12.06428050994873, "global_step": 407464, "epoch": 2425} {"train_loss": -12.499061584472656, "global_step": 407465, "epoch": 2425} {"train_loss": -12.122032165527344, "global_step": 407466, "epoch": 2425} {"train_loss": -12.440511703491211, "global_step": 407467, "epoch": 2425} {"train_loss": -12.363396644592285, "global_step": 407468, "epoch": 2425} {"train_loss": -12.159744262695312, "global_step": 407469, "epoch": 2425} {"train_loss": -12.282773971557617, "global_step": 407470, "epoch": 2425} {"train_loss": -12.354662895202637, "global_step": 407471, "epoch": 2425} {"train_loss": -12.381868362426758, "global_step": 407472, "epoch": 2425} {"train_loss": -12.309242248535156, "global_step": 407473, "epoch": 2425} {"train_loss": -12.145404815673828, "global_step": 407474, "epoch": 2425} {"train_loss": -12.25190544128418, "global_step": 407475, "epoch": 2425} {"train_loss": -12.161014556884766, "global_step": 407476, "epoch": 2425} {"train_loss": -12.60932731628418, "global_step": 407477, "epoch": 2425} {"train_loss": -12.079885482788086, "global_step": 407478, "epoch": 2425} {"train_loss": -12.515810012817383, "global_step": 407479, "epoch": 2425} {"train_loss": -12.300365447998047, "global_step": 407480, "epoch": 2425} {"train_loss": -12.17507266998291, "global_step": 407481, "epoch": 2425} {"train_loss": -12.453622817993164, "global_step": 407482, "epoch": 2425} {"train_loss": -12.50035285949707, "global_step": 407483, "epoch": 2425} {"train_loss": -12.531797409057617, "global_step": 407484, "epoch": 2425} {"train_loss": -12.353986740112305, "global_step": 407485, "epoch": 2425} {"train_loss": -12.269994735717773, "global_step": 407486, "epoch": 2425} {"train_loss": -12.301942825317383, "global_step": 407487, "epoch": 2425} {"train_loss": -12.43317985534668, "global_step": 407488, "epoch": 2425} {"train_loss": -12.54648494720459, "global_step": 407489, "epoch": 2425} {"train_loss": -12.30986213684082, "global_step": 407490, "epoch": 2425} {"train_loss": -12.58874225616455, "global_step": 407491, "epoch": 2425} {"train_loss": -12.465370178222656, "global_step": 407492, "epoch": 2425} {"train_loss": -12.258066177368164, "global_step": 407493, "epoch": 2425} {"train_loss": -12.516305923461914, "global_step": 407494, "epoch": 2425} {"train_loss": -12.418148040771484, "global_step": 407495, "epoch": 2425} {"train_loss": -12.588970184326172, "global_step": 407496, "epoch": 2425} {"train_loss": -12.808870315551758, "global_step": 407497, "epoch": 2425} {"train_loss": -12.24488353729248, "global_step": 407498, "epoch": 2425} {"train_loss": -12.412919998168945, "global_step": 407499, "epoch": 2425} {"train_loss": -12.639081954956055, "global_step": 407500, "epoch": 2425} {"train_loss": -12.45010757446289, "global_step": 407501, "epoch": 2425} {"train_loss": -12.577899932861328, "global_step": 407502, "epoch": 2425} {"train_loss": -12.559865951538086, "global_step": 407503, "epoch": 2425} {"train_loss": -12.704345703125, "global_step": 407504, "epoch": 2425} {"train_loss": -12.560771942138672, "global_step": 407505, "epoch": 2425} {"train_loss": -12.604647636413574, "global_step": 407506, "epoch": 2425} {"train_loss": -12.759020805358887, "global_step": 407507, "epoch": 2425} {"train_loss": -12.538612365722656, "global_step": 407508, "epoch": 2425} {"train_loss": -12.658527374267578, "global_step": 407509, "epoch": 2425} {"train_loss": -12.493474960327148, "global_step": 407510, "epoch": 2425} {"train_loss": -12.364229202270508, "global_step": 407511, "epoch": 2425} {"train_loss": -12.569412231445312, "global_step": 407512, "epoch": 2425} {"train_loss": -12.368043899536133, "global_step": 407513, "epoch": 2425} {"train_loss": -12.58739948272705, "global_step": 407514, "epoch": 2425} {"train_loss": -12.599769592285156, "global_step": 407515, "epoch": 2425} {"train_loss": -12.68648910522461, "global_step": 407516, "epoch": 2425} {"train_loss": -12.758333206176758, "global_step": 407517, "epoch": 2425} {"train_loss": -12.8667573928833, "global_step": 407518, "epoch": 2425} {"train_loss": -12.571043014526367, "global_step": 407519, "epoch": 2425} {"train_loss": -12.702651023864746, "global_step": 407520, "epoch": 2425} {"train_loss": -12.638788223266602, "global_step": 407521, "epoch": 2425} {"train_loss": -12.618720054626465, "global_step": 407522, "epoch": 2425} {"train_loss": -12.965802192687988, "global_step": 407523, "epoch": 2425} {"train_loss": -12.289770126342773, "global_step": 407524, "epoch": 2425} {"train_loss": -12.41171646118164, "global_step": 407525, "epoch": 2425} {"train_loss": -12.300821304321289, "global_step": 407526, "epoch": 2425} {"train_loss": -12.641233444213867, "global_step": 407527, "epoch": 2425} {"train_loss": -12.329423904418945, "global_step": 407528, "epoch": 2425} {"train_loss": -12.84207534790039, "global_step": 407529, "epoch": 2425} {"train_loss": -12.141825675964355, "global_step": 407530, "epoch": 2425} {"train_loss": -12.769757270812988, "global_step": 407531, "epoch": 2425} {"train_loss": -11.967535018920898, "global_step": 407532, "epoch": 2425} {"train_loss": -11.782079696655273, "global_step": 407533, "epoch": 2425} {"train_loss": -12.577919960021973, "global_step": 407534, "epoch": 2425} {"train_loss": -12.596673965454102, "global_step": 407535, "epoch": 2425} {"train_loss": -11.635169982910156, "global_step": 407536, "epoch": 2425} {"train_loss": -11.802427291870117, "global_step": 407537, "epoch": 2425} {"train_loss": -11.607955932617188, "global_step": 407538, "epoch": 2425} {"train_loss": -11.394247055053711, "global_step": 407539, "epoch": 2425} {"train_loss": -11.341772079467773, "global_step": 407540, "epoch": 2425} {"train_loss": -11.032419204711914, "global_step": 407541, "epoch": 2425} {"train_loss": -9.068443298339844, "global_step": 407542, "epoch": 2425} {"train_loss": -10.508602142333984, "global_step": 407543, "epoch": 2425} {"train_loss": -9.109947204589844, "global_step": 407544, "epoch": 2425} {"train_loss": -8.526531219482422, "global_step": 407545, "epoch": 2425} {"train_loss": -8.088605880737305, "global_step": 407546, "epoch": 2425} {"train_loss": -11.43223762512207, "global_step": 407547, "epoch": 2425} {"train_loss": -9.655707359313965, "global_step": 407548, "epoch": 2425} {"train_loss": -8.69282341003418, "global_step": 407549, "epoch": 2425} {"train_loss": -10.505561828613281, "global_step": 407550, "epoch": 2425} {"train_loss": -7.573125839233398, "global_step": 407551, "epoch": 2425} {"train_loss": -7.758319854736328, "global_step": 407552, "epoch": 2425} {"train_loss": -8.5724515914917, "global_step": 407553, "epoch": 2425} {"train_loss": -6.549071788787842, "global_step": 407554, "epoch": 2425} {"train_loss": -6.359426498413086, "global_step": 407555, "epoch": 2425} {"train_loss": -8.010051727294922, "global_step": 407556, "epoch": 2425} {"train_loss": -7.035365104675293, "global_step": 407557, "epoch": 2425} {"train_loss": -8.83238410949707, "global_step": 407558, "epoch": 2425} {"train_loss": -9.385271072387695, "global_step": 407559, "epoch": 2425} {"train_loss": -10.025184631347656, "global_step": 407560, "epoch": 2425} {"train_loss": -10.023557662963867, "global_step": 407561, "epoch": 2425} {"train_loss": -10.510065078735352, "global_step": 407562, "epoch": 2425} {"train_loss": -9.996173858642578, "global_step": 407563, "epoch": 2425} {"train_loss": -10.616560935974121, "global_step": 407564, "epoch": 2425} {"train_loss": -9.915157318115234, "global_step": 407565, "epoch": 2425} {"train_loss": -10.736247062683105, "global_step": 407566, "epoch": 2425} {"train_loss": -11.599140516349248, "global_step": 407567, "epoch": 2425, "val_loss": 297949.3125, "train_action_mse_error": 0.9022328853607178} {"train_loss": -9.38469123840332, "global_step": 407568, "epoch": 2426} {"train_loss": -10.715991020202637, "global_step": 407569, "epoch": 2426} {"train_loss": -10.177553176879883, "global_step": 407570, "epoch": 2426} {"train_loss": -11.15383529663086, "global_step": 407571, "epoch": 2426} {"train_loss": -10.419754028320312, "global_step": 407572, "epoch": 2426} {"train_loss": -11.071839332580566, "global_step": 407573, "epoch": 2426} {"train_loss": -10.811805725097656, "global_step": 407574, "epoch": 2426} {"train_loss": -10.493507385253906, "global_step": 407575, "epoch": 2426} {"train_loss": -11.592665672302246, "global_step": 407576, "epoch": 2426} {"train_loss": -10.586915016174316, "global_step": 407577, "epoch": 2426} {"train_loss": -11.907997131347656, "global_step": 407578, "epoch": 2426} {"train_loss": -10.917879104614258, "global_step": 407579, "epoch": 2426} {"train_loss": -11.459237098693848, "global_step": 407580, "epoch": 2426} {"train_loss": -11.48487663269043, "global_step": 407581, "epoch": 2426} {"train_loss": -11.294042587280273, "global_step": 407582, "epoch": 2426} {"train_loss": -10.98886489868164, "global_step": 407583, "epoch": 2426} {"train_loss": -11.403953552246094, "global_step": 407584, "epoch": 2426} {"train_loss": -11.251798629760742, "global_step": 407585, "epoch": 2426} {"train_loss": -11.366096496582031, "global_step": 407586, "epoch": 2426} {"train_loss": -11.300374031066895, "global_step": 407587, "epoch": 2426} {"train_loss": -11.077775955200195, "global_step": 407588, "epoch": 2426} {"train_loss": -11.641853332519531, "global_step": 407589, "epoch": 2426} {"train_loss": -11.079368591308594, "global_step": 407590, "epoch": 2426} {"train_loss": -11.779716491699219, "global_step": 407591, "epoch": 2426} {"train_loss": -11.23624038696289, "global_step": 407592, "epoch": 2426} {"train_loss": -11.989835739135742, "global_step": 407593, "epoch": 2426} {"train_loss": -11.692500114440918, "global_step": 407594, "epoch": 2426} {"train_loss": -11.938934326171875, "global_step": 407595, "epoch": 2426} {"train_loss": -11.114886283874512, "global_step": 407596, "epoch": 2426} {"train_loss": -11.696247100830078, "global_step": 407597, "epoch": 2426} {"train_loss": -12.245410919189453, "global_step": 407598, "epoch": 2426} {"train_loss": -11.628864288330078, "global_step": 407599, "epoch": 2426} {"train_loss": -12.006797790527344, "global_step": 407600, "epoch": 2426} {"train_loss": -11.49219036102295, "global_step": 407601, "epoch": 2426} {"train_loss": -11.97843074798584, "global_step": 407602, "epoch": 2426} {"train_loss": -11.601957321166992, "global_step": 407603, "epoch": 2426} {"train_loss": -11.987201690673828, "global_step": 407604, "epoch": 2426} {"train_loss": -11.69127082824707, "global_step": 407605, "epoch": 2426} {"train_loss": -11.975935935974121, "global_step": 407606, "epoch": 2426} {"train_loss": -11.517339706420898, "global_step": 407607, "epoch": 2426} {"train_loss": -11.867844581604004, "global_step": 407608, "epoch": 2426} {"train_loss": -11.812185287475586, "global_step": 407609, "epoch": 2426} {"train_loss": -11.70697021484375, "global_step": 407610, "epoch": 2426} {"train_loss": -11.909416198730469, "global_step": 407611, "epoch": 2426} {"train_loss": -11.577404022216797, "global_step": 407612, "epoch": 2426} {"train_loss": -11.578298568725586, "global_step": 407613, "epoch": 2426} {"train_loss": -11.906089782714844, "global_step": 407614, "epoch": 2426} {"train_loss": -11.911192893981934, "global_step": 407615, "epoch": 2426} {"train_loss": -11.883261680603027, "global_step": 407616, "epoch": 2426} {"train_loss": -12.031913757324219, "global_step": 407617, "epoch": 2426} {"train_loss": -11.905258178710938, "global_step": 407618, "epoch": 2426} {"train_loss": -11.733558654785156, "global_step": 407619, "epoch": 2426} {"train_loss": -12.169050216674805, "global_step": 407620, "epoch": 2426} {"train_loss": -11.58874225616455, "global_step": 407621, "epoch": 2426} {"train_loss": -11.90273380279541, "global_step": 407622, "epoch": 2426} {"train_loss": -12.060608863830566, "global_step": 407623, "epoch": 2426} {"train_loss": -12.110270500183105, "global_step": 407624, "epoch": 2426} {"train_loss": -11.997390747070312, "global_step": 407625, "epoch": 2426} {"train_loss": -12.259881019592285, "global_step": 407626, "epoch": 2426} {"train_loss": -12.012964248657227, "global_step": 407627, "epoch": 2426} {"train_loss": -11.894014358520508, "global_step": 407628, "epoch": 2426} {"train_loss": -12.107775688171387, "global_step": 407629, "epoch": 2426} {"train_loss": -11.97978687286377, "global_step": 407630, "epoch": 2426} {"train_loss": -12.0569429397583, "global_step": 407631, "epoch": 2426} {"train_loss": -12.265413284301758, "global_step": 407632, "epoch": 2426} {"train_loss": -11.909324645996094, "global_step": 407633, "epoch": 2426} {"train_loss": -12.463133811950684, "global_step": 407634, "epoch": 2426} {"train_loss": -12.1160249710083, "global_step": 407635, "epoch": 2426} {"train_loss": -12.102184295654297, "global_step": 407636, "epoch": 2426} {"train_loss": -12.384695053100586, "global_step": 407637, "epoch": 2426} {"train_loss": -12.12624454498291, "global_step": 407638, "epoch": 2426} {"train_loss": -12.29287338256836, "global_step": 407639, "epoch": 2426} {"train_loss": -12.4214448928833, "global_step": 407640, "epoch": 2426} {"train_loss": -12.252004623413086, "global_step": 407641, "epoch": 2426} {"train_loss": -12.409293174743652, "global_step": 407642, "epoch": 2426} {"train_loss": -12.379734992980957, "global_step": 407643, "epoch": 2426} {"train_loss": -12.193836212158203, "global_step": 407644, "epoch": 2426} {"train_loss": -12.40538215637207, "global_step": 407645, "epoch": 2426} {"train_loss": -12.266155242919922, "global_step": 407646, "epoch": 2426} {"train_loss": -12.505727767944336, "global_step": 407647, "epoch": 2426} {"train_loss": -12.172038078308105, "global_step": 407648, "epoch": 2426} {"train_loss": -12.508362770080566, "global_step": 407649, "epoch": 2426} {"train_loss": -12.423885345458984, "global_step": 407650, "epoch": 2426} {"train_loss": -12.365387916564941, "global_step": 407651, "epoch": 2426} {"train_loss": -12.263501167297363, "global_step": 407652, "epoch": 2426} {"train_loss": -12.384662628173828, "global_step": 407653, "epoch": 2426} {"train_loss": -12.389714241027832, "global_step": 407654, "epoch": 2426} {"train_loss": -12.406877517700195, "global_step": 407655, "epoch": 2426} {"train_loss": -12.284425735473633, "global_step": 407656, "epoch": 2426} {"train_loss": -12.454404830932617, "global_step": 407657, "epoch": 2426} {"train_loss": -12.393959045410156, "global_step": 407658, "epoch": 2426} {"train_loss": -12.413402557373047, "global_step": 407659, "epoch": 2426} {"train_loss": -12.540523529052734, "global_step": 407660, "epoch": 2426} {"train_loss": -12.677038192749023, "global_step": 407661, "epoch": 2426} {"train_loss": -12.473394393920898, "global_step": 407662, "epoch": 2426} {"train_loss": -12.631830215454102, "global_step": 407663, "epoch": 2426} {"train_loss": -12.557591438293457, "global_step": 407664, "epoch": 2426} {"train_loss": -12.437673568725586, "global_step": 407665, "epoch": 2426} {"train_loss": -12.35517692565918, "global_step": 407666, "epoch": 2426} {"train_loss": -12.38463020324707, "global_step": 407667, "epoch": 2426} {"train_loss": -12.591201782226562, "global_step": 407668, "epoch": 2426} {"train_loss": -12.614667892456055, "global_step": 407669, "epoch": 2426} {"train_loss": -12.497175216674805, "global_step": 407670, "epoch": 2426} {"train_loss": -12.665252685546875, "global_step": 407671, "epoch": 2426} {"train_loss": -12.718162536621094, "global_step": 407672, "epoch": 2426} {"train_loss": -12.577129364013672, "global_step": 407673, "epoch": 2426} {"train_loss": -12.656028747558594, "global_step": 407674, "epoch": 2426} {"train_loss": -12.472538948059082, "global_step": 407675, "epoch": 2426} {"train_loss": -12.672160148620605, "global_step": 407676, "epoch": 2426} {"train_loss": -12.583391189575195, "global_step": 407677, "epoch": 2426} {"train_loss": -12.489309310913086, "global_step": 407678, "epoch": 2426} {"train_loss": -12.856678009033203, "global_step": 407679, "epoch": 2426} {"train_loss": -12.650554656982422, "global_step": 407680, "epoch": 2426} {"train_loss": -12.766210556030273, "global_step": 407681, "epoch": 2426} {"train_loss": -12.796274185180664, "global_step": 407682, "epoch": 2426} {"train_loss": -12.529767990112305, "global_step": 407683, "epoch": 2426} {"train_loss": -12.673177719116211, "global_step": 407684, "epoch": 2426} {"train_loss": -12.711404800415039, "global_step": 407685, "epoch": 2426} {"train_loss": -12.791009902954102, "global_step": 407686, "epoch": 2426} {"train_loss": -12.741376876831055, "global_step": 407687, "epoch": 2426} {"train_loss": -12.775634765625, "global_step": 407688, "epoch": 2426} {"train_loss": -12.60924243927002, "global_step": 407689, "epoch": 2426} {"train_loss": -12.675176620483398, "global_step": 407690, "epoch": 2426} {"train_loss": -12.696585655212402, "global_step": 407691, "epoch": 2426} {"train_loss": -12.816034317016602, "global_step": 407692, "epoch": 2426} {"train_loss": -12.807872772216797, "global_step": 407693, "epoch": 2426} {"train_loss": -12.83126449584961, "global_step": 407694, "epoch": 2426} {"train_loss": -12.731819152832031, "global_step": 407695, "epoch": 2426} {"train_loss": -12.79411506652832, "global_step": 407696, "epoch": 2426} {"train_loss": -12.870246887207031, "global_step": 407697, "epoch": 2426} {"train_loss": -12.939587593078613, "global_step": 407698, "epoch": 2426} {"train_loss": -12.700479507446289, "global_step": 407699, "epoch": 2426} {"train_loss": -12.561197280883789, "global_step": 407700, "epoch": 2426} {"train_loss": -12.571952819824219, "global_step": 407701, "epoch": 2426} {"train_loss": -12.942325592041016, "global_step": 407702, "epoch": 2426} {"train_loss": -12.913588523864746, "global_step": 407703, "epoch": 2426} {"train_loss": -12.805496215820312, "global_step": 407704, "epoch": 2426} {"train_loss": -12.914779663085938, "global_step": 407705, "epoch": 2426} {"train_loss": -12.546701431274414, "global_step": 407706, "epoch": 2426} {"train_loss": -12.742116928100586, "global_step": 407707, "epoch": 2426} {"train_loss": -12.8284912109375, "global_step": 407708, "epoch": 2426} {"train_loss": -12.453216552734375, "global_step": 407709, "epoch": 2426} {"train_loss": -12.285482406616211, "global_step": 407710, "epoch": 2426} {"train_loss": -12.626043319702148, "global_step": 407711, "epoch": 2426} {"train_loss": -12.573854446411133, "global_step": 407712, "epoch": 2426} {"train_loss": -12.631489753723145, "global_step": 407713, "epoch": 2426} {"train_loss": -12.114191055297852, "global_step": 407714, "epoch": 2426} {"train_loss": -11.806038856506348, "global_step": 407715, "epoch": 2426} {"train_loss": -11.858803749084473, "global_step": 407716, "epoch": 2426} {"train_loss": -12.615673065185547, "global_step": 407717, "epoch": 2426} {"train_loss": -11.998724937438965, "global_step": 407718, "epoch": 2426} {"train_loss": -12.669214248657227, "global_step": 407719, "epoch": 2426} {"train_loss": -11.76730728149414, "global_step": 407720, "epoch": 2426} {"train_loss": -12.075238227844238, "global_step": 407721, "epoch": 2426} {"train_loss": -12.33053970336914, "global_step": 407722, "epoch": 2426} {"train_loss": -11.607101440429688, "global_step": 407723, "epoch": 2426} {"train_loss": -9.904579162597656, "global_step": 407724, "epoch": 2426} {"train_loss": -12.17564582824707, "global_step": 407725, "epoch": 2426} {"train_loss": -11.392101287841797, "global_step": 407726, "epoch": 2426} {"train_loss": -11.318519592285156, "global_step": 407727, "epoch": 2426} {"train_loss": -12.490478515625, "global_step": 407728, "epoch": 2426} {"train_loss": -11.381940841674805, "global_step": 407729, "epoch": 2426} {"train_loss": -11.071094512939453, "global_step": 407730, "epoch": 2426} {"train_loss": -12.415059089660645, "global_step": 407731, "epoch": 2426} {"train_loss": -12.014744758605957, "global_step": 407732, "epoch": 2426} {"train_loss": -11.827855110168457, "global_step": 407733, "epoch": 2426} {"train_loss": -12.291345596313477, "global_step": 407734, "epoch": 2426} {"train_loss": -12.076249519983927, "global_step": 407735, "epoch": 2426, "val_loss": 299015.40625} {"train_loss": -12.328461647033691, "global_step": 407736, "epoch": 2427} {"train_loss": -11.520374298095703, "global_step": 407737, "epoch": 2427} {"train_loss": -12.308340072631836, "global_step": 407738, "epoch": 2427} {"train_loss": -12.310267448425293, "global_step": 407739, "epoch": 2427} {"train_loss": -12.557409286499023, "global_step": 407740, "epoch": 2427} {"train_loss": -12.03225326538086, "global_step": 407741, "epoch": 2427} {"train_loss": -12.251197814941406, "global_step": 407742, "epoch": 2427} {"train_loss": -12.098572731018066, "global_step": 407743, "epoch": 2427} {"train_loss": -12.128738403320312, "global_step": 407744, "epoch": 2427} {"train_loss": -12.117603302001953, "global_step": 407745, "epoch": 2427} {"train_loss": -11.981200218200684, "global_step": 407746, "epoch": 2427} {"train_loss": -12.334211349487305, "global_step": 407747, "epoch": 2427} {"train_loss": -12.42318344116211, "global_step": 407748, "epoch": 2427} {"train_loss": -12.279220581054688, "global_step": 407749, "epoch": 2427} {"train_loss": -12.389781951904297, "global_step": 407750, "epoch": 2427} {"train_loss": -12.631114959716797, "global_step": 407751, "epoch": 2427} {"train_loss": -12.498323440551758, "global_step": 407752, "epoch": 2427} {"train_loss": -12.632617950439453, "global_step": 407753, "epoch": 2427} {"train_loss": -12.653904914855957, "global_step": 407754, "epoch": 2427} {"train_loss": -12.00478458404541, "global_step": 407755, "epoch": 2427} {"train_loss": -12.724645614624023, "global_step": 407756, "epoch": 2427} {"train_loss": -11.946174621582031, "global_step": 407757, "epoch": 2427} {"train_loss": -11.48347282409668, "global_step": 407758, "epoch": 2427} {"train_loss": -12.311359405517578, "global_step": 407759, "epoch": 2427} {"train_loss": -11.8182373046875, "global_step": 407760, "epoch": 2427} {"train_loss": -11.80086898803711, "global_step": 407761, "epoch": 2427} {"train_loss": -11.162598609924316, "global_step": 407762, "epoch": 2427} {"train_loss": -12.097415924072266, "global_step": 407763, "epoch": 2427} {"train_loss": -11.989995956420898, "global_step": 407764, "epoch": 2427} {"train_loss": -12.135974884033203, "global_step": 407765, "epoch": 2427} {"train_loss": -12.170059204101562, "global_step": 407766, "epoch": 2427} {"train_loss": -12.39008617401123, "global_step": 407767, "epoch": 2427} {"train_loss": -12.354623794555664, "global_step": 407768, "epoch": 2427} {"train_loss": -11.965705871582031, "global_step": 407769, "epoch": 2427} {"train_loss": -12.42134952545166, "global_step": 407770, "epoch": 2427} {"train_loss": -12.399919509887695, "global_step": 407771, "epoch": 2427} {"train_loss": -11.913544654846191, "global_step": 407772, "epoch": 2427} {"train_loss": -11.862794876098633, "global_step": 407773, "epoch": 2427} {"train_loss": -12.353976249694824, "global_step": 407774, "epoch": 2427} {"train_loss": -11.478853225708008, "global_step": 407775, "epoch": 2427} {"train_loss": -12.536564826965332, "global_step": 407776, "epoch": 2427} {"train_loss": -12.516005516052246, "global_step": 407777, "epoch": 2427} {"train_loss": -12.318092346191406, "global_step": 407778, "epoch": 2427} {"train_loss": -12.06096363067627, "global_step": 407779, "epoch": 2427} {"train_loss": -12.462180137634277, "global_step": 407780, "epoch": 2427} {"train_loss": -12.336567878723145, "global_step": 407781, "epoch": 2427} {"train_loss": -12.376592636108398, "global_step": 407782, "epoch": 2427} {"train_loss": -12.342893600463867, "global_step": 407783, "epoch": 2427} {"train_loss": -12.31480884552002, "global_step": 407784, "epoch": 2427} {"train_loss": -12.518564224243164, "global_step": 407785, "epoch": 2427} {"train_loss": -12.294439315795898, "global_step": 407786, "epoch": 2427} {"train_loss": -11.892095565795898, "global_step": 407787, "epoch": 2427} {"train_loss": -12.686760902404785, "global_step": 407788, "epoch": 2427} {"train_loss": -12.169710159301758, "global_step": 407789, "epoch": 2427} {"train_loss": -12.507637977600098, "global_step": 407790, "epoch": 2427} {"train_loss": -12.466632843017578, "global_step": 407791, "epoch": 2427} {"train_loss": -12.263187408447266, "global_step": 407792, "epoch": 2427} {"train_loss": -12.332914352416992, "global_step": 407793, "epoch": 2427} {"train_loss": -12.367599487304688, "global_step": 407794, "epoch": 2427} {"train_loss": -12.448481559753418, "global_step": 407795, "epoch": 2427} {"train_loss": -12.409639358520508, "global_step": 407796, "epoch": 2427} {"train_loss": -12.284026145935059, "global_step": 407797, "epoch": 2427} {"train_loss": -12.723750114440918, "global_step": 407798, "epoch": 2427} {"train_loss": -12.57721996307373, "global_step": 407799, "epoch": 2427} {"train_loss": -12.514568328857422, "global_step": 407800, "epoch": 2427} {"train_loss": -12.415499687194824, "global_step": 407801, "epoch": 2427} {"train_loss": -12.688779830932617, "global_step": 407802, "epoch": 2427} {"train_loss": -11.85995101928711, "global_step": 407803, "epoch": 2427} {"train_loss": -12.086898803710938, "global_step": 407804, "epoch": 2427} {"train_loss": -12.525217056274414, "global_step": 407805, "epoch": 2427} {"train_loss": -12.048179626464844, "global_step": 407806, "epoch": 2427} {"train_loss": -11.838617324829102, "global_step": 407807, "epoch": 2427} {"train_loss": -12.617368698120117, "global_step": 407808, "epoch": 2427} {"train_loss": -11.522327423095703, "global_step": 407809, "epoch": 2427} {"train_loss": -11.137860298156738, "global_step": 407810, "epoch": 2427} {"train_loss": -11.877466201782227, "global_step": 407811, "epoch": 2427} {"train_loss": -11.814840316772461, "global_step": 407812, "epoch": 2427} {"train_loss": -11.3843994140625, "global_step": 407813, "epoch": 2427} {"train_loss": -11.749212265014648, "global_step": 407814, "epoch": 2427} {"train_loss": -11.569013595581055, "global_step": 407815, "epoch": 2427} {"train_loss": -10.67057991027832, "global_step": 407816, "epoch": 2427} {"train_loss": -12.365161895751953, "global_step": 407817, "epoch": 2427} {"train_loss": -11.673334121704102, "global_step": 407818, "epoch": 2427} {"train_loss": -11.733695983886719, "global_step": 407819, "epoch": 2427} {"train_loss": -11.926454544067383, "global_step": 407820, "epoch": 2427} {"train_loss": -10.488363265991211, "global_step": 407821, "epoch": 2427} {"train_loss": -11.393899917602539, "global_step": 407822, "epoch": 2427} {"train_loss": -11.579672813415527, "global_step": 407823, "epoch": 2427} {"train_loss": -10.147170066833496, "global_step": 407824, "epoch": 2427} {"train_loss": -10.094330787658691, "global_step": 407825, "epoch": 2427} {"train_loss": -10.322697639465332, "global_step": 407826, "epoch": 2427} {"train_loss": -10.064362525939941, "global_step": 407827, "epoch": 2427} {"train_loss": -9.850503921508789, "global_step": 407828, "epoch": 2427} {"train_loss": -9.30549430847168, "global_step": 407829, "epoch": 2427} {"train_loss": -9.706918716430664, "global_step": 407830, "epoch": 2427} {"train_loss": -9.523504257202148, "global_step": 407831, "epoch": 2427} {"train_loss": -9.47292423248291, "global_step": 407832, "epoch": 2427} {"train_loss": -10.64315414428711, "global_step": 407833, "epoch": 2427} {"train_loss": -10.470560073852539, "global_step": 407834, "epoch": 2427} {"train_loss": -10.708709716796875, "global_step": 407835, "epoch": 2427} {"train_loss": -10.302828788757324, "global_step": 407836, "epoch": 2427} {"train_loss": -9.888252258300781, "global_step": 407837, "epoch": 2427} {"train_loss": -9.887274742126465, "global_step": 407838, "epoch": 2427} {"train_loss": -10.102219581604004, "global_step": 407839, "epoch": 2427} {"train_loss": -9.907588958740234, "global_step": 407840, "epoch": 2427} {"train_loss": -10.336612701416016, "global_step": 407841, "epoch": 2427} {"train_loss": -9.784196853637695, "global_step": 407842, "epoch": 2427} {"train_loss": -10.174930572509766, "global_step": 407843, "epoch": 2427} {"train_loss": -10.264701843261719, "global_step": 407844, "epoch": 2427} {"train_loss": -9.448040008544922, "global_step": 407845, "epoch": 2427} {"train_loss": -9.337381362915039, "global_step": 407846, "epoch": 2427} {"train_loss": -10.454843521118164, "global_step": 407847, "epoch": 2427} {"train_loss": -10.040313720703125, "global_step": 407848, "epoch": 2427} {"train_loss": -10.348095893859863, "global_step": 407849, "epoch": 2427} {"train_loss": -11.121894836425781, "global_step": 407850, "epoch": 2427} {"train_loss": -10.746358871459961, "global_step": 407851, "epoch": 2427} {"train_loss": -11.349485397338867, "global_step": 407852, "epoch": 2427} {"train_loss": -10.299322128295898, "global_step": 407853, "epoch": 2427} {"train_loss": -11.267229080200195, "global_step": 407854, "epoch": 2427} {"train_loss": -10.924816131591797, "global_step": 407855, "epoch": 2427} {"train_loss": -11.332679748535156, "global_step": 407856, "epoch": 2427} {"train_loss": -11.042295455932617, "global_step": 407857, "epoch": 2427} {"train_loss": -10.976188659667969, "global_step": 407858, "epoch": 2427} {"train_loss": -10.879484176635742, "global_step": 407859, "epoch": 2427} {"train_loss": -10.306642532348633, "global_step": 407860, "epoch": 2427} {"train_loss": -11.306992530822754, "global_step": 407861, "epoch": 2427} {"train_loss": -10.92040729522705, "global_step": 407862, "epoch": 2427} {"train_loss": -11.608949661254883, "global_step": 407863, "epoch": 2427} {"train_loss": -10.810012817382812, "global_step": 407864, "epoch": 2427} {"train_loss": -11.499765396118164, "global_step": 407865, "epoch": 2427} {"train_loss": -11.096883773803711, "global_step": 407866, "epoch": 2427} {"train_loss": -11.594263076782227, "global_step": 407867, "epoch": 2427} {"train_loss": -10.980559349060059, "global_step": 407868, "epoch": 2427} {"train_loss": -11.920516967773438, "global_step": 407869, "epoch": 2427} {"train_loss": -11.087108612060547, "global_step": 407870, "epoch": 2427} {"train_loss": -12.126601219177246, "global_step": 407871, "epoch": 2427} {"train_loss": -11.232959747314453, "global_step": 407872, "epoch": 2427} {"train_loss": -11.720390319824219, "global_step": 407873, "epoch": 2427} {"train_loss": -11.62765121459961, "global_step": 407874, "epoch": 2427} {"train_loss": -11.835400581359863, "global_step": 407875, "epoch": 2427} {"train_loss": -11.726146697998047, "global_step": 407876, "epoch": 2427} {"train_loss": -11.856553077697754, "global_step": 407877, "epoch": 2427} {"train_loss": -11.557817459106445, "global_step": 407878, "epoch": 2427} {"train_loss": -11.964374542236328, "global_step": 407879, "epoch": 2427} {"train_loss": -12.07815170288086, "global_step": 407880, "epoch": 2427} {"train_loss": -12.100751876831055, "global_step": 407881, "epoch": 2427} {"train_loss": -12.045671463012695, "global_step": 407882, "epoch": 2427} {"train_loss": -11.868579864501953, "global_step": 407883, "epoch": 2427} {"train_loss": -11.916292190551758, "global_step": 407884, "epoch": 2427} {"train_loss": -12.125625610351562, "global_step": 407885, "epoch": 2427} {"train_loss": -11.808074951171875, "global_step": 407886, "epoch": 2427} {"train_loss": -12.050212860107422, "global_step": 407887, "epoch": 2427} {"train_loss": -11.979421615600586, "global_step": 407888, "epoch": 2427} {"train_loss": -12.013239860534668, "global_step": 407889, "epoch": 2427} {"train_loss": -12.209419250488281, "global_step": 407890, "epoch": 2427} {"train_loss": -12.25869369506836, "global_step": 407891, "epoch": 2427} {"train_loss": -12.249300003051758, "global_step": 407892, "epoch": 2427} {"train_loss": -11.904359817504883, "global_step": 407893, "epoch": 2427} {"train_loss": -12.45699405670166, "global_step": 407894, "epoch": 2427} {"train_loss": -11.991783142089844, "global_step": 407895, "epoch": 2427} {"train_loss": -12.055425643920898, "global_step": 407896, "epoch": 2427} {"train_loss": -12.065652847290039, "global_step": 407897, "epoch": 2427} {"train_loss": -12.307047843933105, "global_step": 407898, "epoch": 2427} {"train_loss": -12.06842041015625, "global_step": 407899, "epoch": 2427} {"train_loss": -12.185290336608887, "global_step": 407900, "epoch": 2427} {"train_loss": -12.220365524291992, "global_step": 407901, "epoch": 2427} {"train_loss": -12.106851577758789, "global_step": 407902, "epoch": 2427} {"train_loss": -11.646693377267747, "global_step": 407903, "epoch": 2427, "val_loss": 301078.0625} {"train_loss": -12.090292930603027, "global_step": 407904, "epoch": 2428} {"train_loss": -12.265569686889648, "global_step": 407905, "epoch": 2428} {"train_loss": -12.263866424560547, "global_step": 407906, "epoch": 2428} {"train_loss": -12.339280128479004, "global_step": 407907, "epoch": 2428} {"train_loss": -12.292163848876953, "global_step": 407908, "epoch": 2428} {"train_loss": -12.34228515625, "global_step": 407909, "epoch": 2428} {"train_loss": -12.250846862792969, "global_step": 407910, "epoch": 2428} {"train_loss": -12.330161094665527, "global_step": 407911, "epoch": 2428} {"train_loss": -12.362594604492188, "global_step": 407912, "epoch": 2428} {"train_loss": -12.264718055725098, "global_step": 407913, "epoch": 2428} {"train_loss": -12.292671203613281, "global_step": 407914, "epoch": 2428} {"train_loss": -12.415013313293457, "global_step": 407915, "epoch": 2428} {"train_loss": -12.170683860778809, "global_step": 407916, "epoch": 2428} {"train_loss": -12.303997039794922, "global_step": 407917, "epoch": 2428} {"train_loss": -12.425300598144531, "global_step": 407918, "epoch": 2428} {"train_loss": -12.402097702026367, "global_step": 407919, "epoch": 2428} {"train_loss": -12.340633392333984, "global_step": 407920, "epoch": 2428} {"train_loss": -12.314521789550781, "global_step": 407921, "epoch": 2428} {"train_loss": -12.366654396057129, "global_step": 407922, "epoch": 2428} {"train_loss": -12.541582107543945, "global_step": 407923, "epoch": 2428} {"train_loss": -12.15528678894043, "global_step": 407924, "epoch": 2428} {"train_loss": -12.242878913879395, "global_step": 407925, "epoch": 2428} {"train_loss": -12.666326522827148, "global_step": 407926, "epoch": 2428} {"train_loss": -12.363174438476562, "global_step": 407927, "epoch": 2428} {"train_loss": -12.521430015563965, "global_step": 407928, "epoch": 2428} {"train_loss": -12.55411148071289, "global_step": 407929, "epoch": 2428} {"train_loss": -12.311213493347168, "global_step": 407930, "epoch": 2428} {"train_loss": -12.476036071777344, "global_step": 407931, "epoch": 2428} {"train_loss": -12.470632553100586, "global_step": 407932, "epoch": 2428} {"train_loss": -12.375039100646973, "global_step": 407933, "epoch": 2428} {"train_loss": -12.516212463378906, "global_step": 407934, "epoch": 2428} {"train_loss": -12.528783798217773, "global_step": 407935, "epoch": 2428} {"train_loss": -12.522008895874023, "global_step": 407936, "epoch": 2428} {"train_loss": -12.505258560180664, "global_step": 407937, "epoch": 2428} {"train_loss": -12.456539154052734, "global_step": 407938, "epoch": 2428} {"train_loss": -12.521875381469727, "global_step": 407939, "epoch": 2428} {"train_loss": -12.416849136352539, "global_step": 407940, "epoch": 2428} {"train_loss": -12.385917663574219, "global_step": 407941, "epoch": 2428} {"train_loss": -12.016349792480469, "global_step": 407942, "epoch": 2428} {"train_loss": -12.448752403259277, "global_step": 407943, "epoch": 2428} {"train_loss": -12.261649131774902, "global_step": 407944, "epoch": 2428} {"train_loss": -12.093170166015625, "global_step": 407945, "epoch": 2428} {"train_loss": -12.661712646484375, "global_step": 407946, "epoch": 2428} {"train_loss": -12.303030967712402, "global_step": 407947, "epoch": 2428} {"train_loss": -12.36581802368164, "global_step": 407948, "epoch": 2428} {"train_loss": -12.590392112731934, "global_step": 407949, "epoch": 2428} {"train_loss": -12.544639587402344, "global_step": 407950, "epoch": 2428} {"train_loss": -12.343692779541016, "global_step": 407951, "epoch": 2428} {"train_loss": -12.596868515014648, "global_step": 407952, "epoch": 2428} {"train_loss": -12.589834213256836, "global_step": 407953, "epoch": 2428} {"train_loss": -12.430967330932617, "global_step": 407954, "epoch": 2428} {"train_loss": -12.748523712158203, "global_step": 407955, "epoch": 2428} {"train_loss": -12.752843856811523, "global_step": 407956, "epoch": 2428} {"train_loss": -12.545707702636719, "global_step": 407957, "epoch": 2428} {"train_loss": -12.827174186706543, "global_step": 407958, "epoch": 2428} {"train_loss": -12.396895408630371, "global_step": 407959, "epoch": 2428} {"train_loss": -12.234987258911133, "global_step": 407960, "epoch": 2428} {"train_loss": -12.57290267944336, "global_step": 407961, "epoch": 2428} {"train_loss": -12.282848358154297, "global_step": 407962, "epoch": 2428} {"train_loss": -12.461919784545898, "global_step": 407963, "epoch": 2428} {"train_loss": -12.491607666015625, "global_step": 407964, "epoch": 2428} {"train_loss": -12.132116317749023, "global_step": 407965, "epoch": 2428} {"train_loss": -12.444791793823242, "global_step": 407966, "epoch": 2428} {"train_loss": -12.317235946655273, "global_step": 407967, "epoch": 2428} {"train_loss": -12.415992736816406, "global_step": 407968, "epoch": 2428} {"train_loss": -12.452506065368652, "global_step": 407969, "epoch": 2428} {"train_loss": -12.80376148223877, "global_step": 407970, "epoch": 2428} {"train_loss": -12.230213165283203, "global_step": 407971, "epoch": 2428} {"train_loss": -12.54038143157959, "global_step": 407972, "epoch": 2428} {"train_loss": -12.12539291381836, "global_step": 407973, "epoch": 2428} {"train_loss": -12.4052152633667, "global_step": 407974, "epoch": 2428} {"train_loss": -12.27194595336914, "global_step": 407975, "epoch": 2428} {"train_loss": -12.529611587524414, "global_step": 407976, "epoch": 2428} {"train_loss": -11.736011505126953, "global_step": 407977, "epoch": 2428} {"train_loss": -11.63339614868164, "global_step": 407978, "epoch": 2428} {"train_loss": -12.334650039672852, "global_step": 407979, "epoch": 2428} {"train_loss": -11.945810317993164, "global_step": 407980, "epoch": 2428} {"train_loss": -11.337945938110352, "global_step": 407981, "epoch": 2428} {"train_loss": -12.166452407836914, "global_step": 407982, "epoch": 2428} {"train_loss": -12.242323875427246, "global_step": 407983, "epoch": 2428} {"train_loss": -11.32552433013916, "global_step": 407984, "epoch": 2428} {"train_loss": -12.047500610351562, "global_step": 407985, "epoch": 2428} {"train_loss": -12.04239273071289, "global_step": 407986, "epoch": 2428} {"train_loss": -11.902109146118164, "global_step": 407987, "epoch": 2428} {"train_loss": -12.413068771362305, "global_step": 407988, "epoch": 2428} {"train_loss": -12.06131362915039, "global_step": 407989, "epoch": 2428} {"train_loss": -11.662246704101562, "global_step": 407990, "epoch": 2428} {"train_loss": -12.30006217956543, "global_step": 407991, "epoch": 2428} {"train_loss": -12.2439546585083, "global_step": 407992, "epoch": 2428} {"train_loss": -11.710336685180664, "global_step": 407993, "epoch": 2428} {"train_loss": -12.218510627746582, "global_step": 407994, "epoch": 2428} {"train_loss": -12.491783142089844, "global_step": 407995, "epoch": 2428} {"train_loss": -12.136675834655762, "global_step": 407996, "epoch": 2428} {"train_loss": -12.372793197631836, "global_step": 407997, "epoch": 2428} {"train_loss": -12.108182907104492, "global_step": 407998, "epoch": 2428} {"train_loss": -12.068880081176758, "global_step": 407999, "epoch": 2428} {"train_loss": -12.438955307006836, "global_step": 408000, "epoch": 2428} {"train_loss": -12.24919319152832, "global_step": 408001, "epoch": 2428} {"train_loss": -12.504611015319824, "global_step": 408002, "epoch": 2428} {"train_loss": -12.11067008972168, "global_step": 408003, "epoch": 2428} {"train_loss": -12.164762496948242, "global_step": 408004, "epoch": 2428} {"train_loss": -12.438034057617188, "global_step": 408005, "epoch": 2428} {"train_loss": -12.10552978515625, "global_step": 408006, "epoch": 2428} {"train_loss": -12.292434692382812, "global_step": 408007, "epoch": 2428} {"train_loss": -11.817632675170898, "global_step": 408008, "epoch": 2428} {"train_loss": -12.668943405151367, "global_step": 408009, "epoch": 2428} {"train_loss": -12.077203750610352, "global_step": 408010, "epoch": 2428} {"train_loss": -12.41860294342041, "global_step": 408011, "epoch": 2428} {"train_loss": -12.42461109161377, "global_step": 408012, "epoch": 2428} {"train_loss": -12.385332107543945, "global_step": 408013, "epoch": 2428} {"train_loss": -12.59864330291748, "global_step": 408014, "epoch": 2428} {"train_loss": -12.251736640930176, "global_step": 408015, "epoch": 2428} {"train_loss": -12.452959060668945, "global_step": 408016, "epoch": 2428} {"train_loss": -12.623703956604004, "global_step": 408017, "epoch": 2428} {"train_loss": -12.387011528015137, "global_step": 408018, "epoch": 2428} {"train_loss": -12.275197982788086, "global_step": 408019, "epoch": 2428} {"train_loss": -12.40871810913086, "global_step": 408020, "epoch": 2428} {"train_loss": -12.322568893432617, "global_step": 408021, "epoch": 2428} {"train_loss": -12.612045288085938, "global_step": 408022, "epoch": 2428} {"train_loss": -12.407512664794922, "global_step": 408023, "epoch": 2428} {"train_loss": -12.705888748168945, "global_step": 408024, "epoch": 2428} {"train_loss": -12.480388641357422, "global_step": 408025, "epoch": 2428} {"train_loss": -12.618619918823242, "global_step": 408026, "epoch": 2428} {"train_loss": -12.602487564086914, "global_step": 408027, "epoch": 2428} {"train_loss": -12.821930885314941, "global_step": 408028, "epoch": 2428} {"train_loss": -12.324129104614258, "global_step": 408029, "epoch": 2428} {"train_loss": -12.537010192871094, "global_step": 408030, "epoch": 2428} {"train_loss": -12.640419006347656, "global_step": 408031, "epoch": 2428} {"train_loss": -12.582141876220703, "global_step": 408032, "epoch": 2428} {"train_loss": -12.371191024780273, "global_step": 408033, "epoch": 2428} {"train_loss": -12.467981338500977, "global_step": 408034, "epoch": 2428} {"train_loss": -12.662384033203125, "global_step": 408035, "epoch": 2428} {"train_loss": -12.5646390914917, "global_step": 408036, "epoch": 2428} {"train_loss": -12.543538093566895, "global_step": 408037, "epoch": 2428} {"train_loss": -12.698270797729492, "global_step": 408038, "epoch": 2428} {"train_loss": -12.766372680664062, "global_step": 408039, "epoch": 2428} {"train_loss": -12.361604690551758, "global_step": 408040, "epoch": 2428} {"train_loss": -12.504241943359375, "global_step": 408041, "epoch": 2428} {"train_loss": -12.568804740905762, "global_step": 408042, "epoch": 2428} {"train_loss": -12.216426849365234, "global_step": 408043, "epoch": 2428} {"train_loss": -12.644600868225098, "global_step": 408044, "epoch": 2428} {"train_loss": -12.4603271484375, "global_step": 408045, "epoch": 2428} {"train_loss": -12.477405548095703, "global_step": 408046, "epoch": 2428} {"train_loss": -12.6939697265625, "global_step": 408047, "epoch": 2428} {"train_loss": -12.563780784606934, "global_step": 408048, "epoch": 2428} {"train_loss": -12.151426315307617, "global_step": 408049, "epoch": 2428} {"train_loss": -12.236589431762695, "global_step": 408050, "epoch": 2428} {"train_loss": -12.8616304397583, "global_step": 408051, "epoch": 2428} {"train_loss": -12.551048278808594, "global_step": 408052, "epoch": 2428} {"train_loss": -11.653630256652832, "global_step": 408053, "epoch": 2428} {"train_loss": -12.282289505004883, "global_step": 408054, "epoch": 2428} {"train_loss": -12.743568420410156, "global_step": 408055, "epoch": 2428} {"train_loss": -12.098319053649902, "global_step": 408056, "epoch": 2428} {"train_loss": -11.402626037597656, "global_step": 408057, "epoch": 2428} {"train_loss": -11.973146438598633, "global_step": 408058, "epoch": 2428} {"train_loss": -12.53591537475586, "global_step": 408059, "epoch": 2428} {"train_loss": -12.444681167602539, "global_step": 408060, "epoch": 2428} {"train_loss": -11.409168243408203, "global_step": 408061, "epoch": 2428} {"train_loss": -12.268084526062012, "global_step": 408062, "epoch": 2428} {"train_loss": -12.381922721862793, "global_step": 408063, "epoch": 2428} {"train_loss": -12.145988464355469, "global_step": 408064, "epoch": 2428} {"train_loss": -12.365242004394531, "global_step": 408065, "epoch": 2428} {"train_loss": -12.061525344848633, "global_step": 408066, "epoch": 2428} {"train_loss": -12.501710891723633, "global_step": 408067, "epoch": 2428} {"train_loss": -12.261974334716797, "global_step": 408068, "epoch": 2428} {"train_loss": -12.505977630615234, "global_step": 408069, "epoch": 2428} {"train_loss": -12.250503540039062, "global_step": 408070, "epoch": 2428} {"train_loss": -12.345371831031073, "global_step": 408071, "epoch": 2428, "val_loss": 298240.6875} {"train_loss": -12.710405349731445, "global_step": 408072, "epoch": 2429} {"train_loss": -12.611013412475586, "global_step": 408073, "epoch": 2429} {"train_loss": -12.614330291748047, "global_step": 408074, "epoch": 2429} {"train_loss": -12.704049110412598, "global_step": 408075, "epoch": 2429} {"train_loss": -12.596115112304688, "global_step": 408076, "epoch": 2429} {"train_loss": -12.368653297424316, "global_step": 408077, "epoch": 2429} {"train_loss": -12.669048309326172, "global_step": 408078, "epoch": 2429} {"train_loss": -12.369461059570312, "global_step": 408079, "epoch": 2429} {"train_loss": -12.231710433959961, "global_step": 408080, "epoch": 2429} {"train_loss": -12.777962684631348, "global_step": 408081, "epoch": 2429} {"train_loss": -12.74557113647461, "global_step": 408082, "epoch": 2429} {"train_loss": -12.860888481140137, "global_step": 408083, "epoch": 2429} {"train_loss": -12.259103775024414, "global_step": 408084, "epoch": 2429} {"train_loss": -12.614852905273438, "global_step": 408085, "epoch": 2429} {"train_loss": -12.588762283325195, "global_step": 408086, "epoch": 2429} {"train_loss": -12.584756851196289, "global_step": 408087, "epoch": 2429} {"train_loss": -12.301725387573242, "global_step": 408088, "epoch": 2429} {"train_loss": -12.289783477783203, "global_step": 408089, "epoch": 2429} {"train_loss": -12.32706069946289, "global_step": 408090, "epoch": 2429} {"train_loss": -11.815031051635742, "global_step": 408091, "epoch": 2429} {"train_loss": -11.480535507202148, "global_step": 408092, "epoch": 2429} {"train_loss": -11.077423095703125, "global_step": 408093, "epoch": 2429} {"train_loss": -12.57882022857666, "global_step": 408094, "epoch": 2429} {"train_loss": -11.840032577514648, "global_step": 408095, "epoch": 2429} {"train_loss": -11.037744522094727, "global_step": 408096, "epoch": 2429} {"train_loss": -12.241029739379883, "global_step": 408097, "epoch": 2429} {"train_loss": -12.007913589477539, "global_step": 408098, "epoch": 2429} {"train_loss": -12.094358444213867, "global_step": 408099, "epoch": 2429} {"train_loss": -12.120963096618652, "global_step": 408100, "epoch": 2429} {"train_loss": -11.602644920349121, "global_step": 408101, "epoch": 2429} {"train_loss": -11.720293045043945, "global_step": 408102, "epoch": 2429} {"train_loss": -11.824607849121094, "global_step": 408103, "epoch": 2429} {"train_loss": -12.512700080871582, "global_step": 408104, "epoch": 2429} {"train_loss": -11.409174919128418, "global_step": 408105, "epoch": 2429} {"train_loss": -12.090591430664062, "global_step": 408106, "epoch": 2429} {"train_loss": -11.784198760986328, "global_step": 408107, "epoch": 2429} {"train_loss": -11.228363990783691, "global_step": 408108, "epoch": 2429} {"train_loss": -10.84433650970459, "global_step": 408109, "epoch": 2429} {"train_loss": -11.704639434814453, "global_step": 408110, "epoch": 2429} {"train_loss": -11.960196495056152, "global_step": 408111, "epoch": 2429} {"train_loss": -12.424800872802734, "global_step": 408112, "epoch": 2429} {"train_loss": -12.078184127807617, "global_step": 408113, "epoch": 2429} {"train_loss": -12.479141235351562, "global_step": 408114, "epoch": 2429} {"train_loss": -11.683424949645996, "global_step": 408115, "epoch": 2429} {"train_loss": -12.426103591918945, "global_step": 408116, "epoch": 2429} {"train_loss": -11.910127639770508, "global_step": 408117, "epoch": 2429} {"train_loss": -11.471601486206055, "global_step": 408118, "epoch": 2429} {"train_loss": -12.623556137084961, "global_step": 408119, "epoch": 2429} {"train_loss": -11.89337158203125, "global_step": 408120, "epoch": 2429} {"train_loss": -11.988334655761719, "global_step": 408121, "epoch": 2429} {"train_loss": -11.76650333404541, "global_step": 408122, "epoch": 2429} {"train_loss": -12.100954055786133, "global_step": 408123, "epoch": 2429} {"train_loss": -12.121423721313477, "global_step": 408124, "epoch": 2429} {"train_loss": -11.782480239868164, "global_step": 408125, "epoch": 2429} {"train_loss": -12.44878101348877, "global_step": 408126, "epoch": 2429} {"train_loss": -12.503049850463867, "global_step": 408127, "epoch": 2429} {"train_loss": -11.84649658203125, "global_step": 408128, "epoch": 2429} {"train_loss": -12.279499053955078, "global_step": 408129, "epoch": 2429} {"train_loss": -12.257770538330078, "global_step": 408130, "epoch": 2429} {"train_loss": -12.049556732177734, "global_step": 408131, "epoch": 2429} {"train_loss": -12.526910781860352, "global_step": 408132, "epoch": 2429} {"train_loss": -12.376225471496582, "global_step": 408133, "epoch": 2429} {"train_loss": -11.60628604888916, "global_step": 408134, "epoch": 2429} {"train_loss": -11.989486694335938, "global_step": 408135, "epoch": 2429} {"train_loss": -12.69869327545166, "global_step": 408136, "epoch": 2429} {"train_loss": -12.138449668884277, "global_step": 408137, "epoch": 2429} {"train_loss": -12.034442901611328, "global_step": 408138, "epoch": 2429} {"train_loss": -12.187763214111328, "global_step": 408139, "epoch": 2429} {"train_loss": -12.382648468017578, "global_step": 408140, "epoch": 2429} {"train_loss": -12.170238494873047, "global_step": 408141, "epoch": 2429} {"train_loss": -12.431680679321289, "global_step": 408142, "epoch": 2429} {"train_loss": -12.2068452835083, "global_step": 408143, "epoch": 2429} {"train_loss": -12.079025268554688, "global_step": 408144, "epoch": 2429} {"train_loss": -12.168094635009766, "global_step": 408145, "epoch": 2429} {"train_loss": -12.587207794189453, "global_step": 408146, "epoch": 2429} {"train_loss": -12.104756355285645, "global_step": 408147, "epoch": 2429} {"train_loss": -12.619386672973633, "global_step": 408148, "epoch": 2429} {"train_loss": -11.79061508178711, "global_step": 408149, "epoch": 2429} {"train_loss": -12.027708053588867, "global_step": 408150, "epoch": 2429} {"train_loss": -9.457294464111328, "global_step": 408151, "epoch": 2429} {"train_loss": -11.516141891479492, "global_step": 408152, "epoch": 2429} {"train_loss": -9.545368194580078, "global_step": 408153, "epoch": 2429} {"train_loss": -8.54970932006836, "global_step": 408154, "epoch": 2429} {"train_loss": -8.936113357543945, "global_step": 408155, "epoch": 2429} {"train_loss": -9.820053100585938, "global_step": 408156, "epoch": 2429} {"train_loss": -9.497675895690918, "global_step": 408157, "epoch": 2429} {"train_loss": -8.51295280456543, "global_step": 408158, "epoch": 2429} {"train_loss": -8.193735122680664, "global_step": 408159, "epoch": 2429} {"train_loss": -9.7913818359375, "global_step": 408160, "epoch": 2429} {"train_loss": -10.094141006469727, "global_step": 408161, "epoch": 2429} {"train_loss": -9.916720390319824, "global_step": 408162, "epoch": 2429} {"train_loss": -10.147073745727539, "global_step": 408163, "epoch": 2429} {"train_loss": -9.925122261047363, "global_step": 408164, "epoch": 2429} {"train_loss": -9.375083923339844, "global_step": 408165, "epoch": 2429} {"train_loss": -11.047154426574707, "global_step": 408166, "epoch": 2429} {"train_loss": -9.5235595703125, "global_step": 408167, "epoch": 2429} {"train_loss": -8.887350082397461, "global_step": 408168, "epoch": 2429} {"train_loss": -10.12553596496582, "global_step": 408169, "epoch": 2429} {"train_loss": -10.67215347290039, "global_step": 408170, "epoch": 2429} {"train_loss": -10.287656784057617, "global_step": 408171, "epoch": 2429} {"train_loss": -10.349050521850586, "global_step": 408172, "epoch": 2429} {"train_loss": -11.33311653137207, "global_step": 408173, "epoch": 2429} {"train_loss": -10.97303295135498, "global_step": 408174, "epoch": 2429} {"train_loss": -10.738780975341797, "global_step": 408175, "epoch": 2429} {"train_loss": -11.434783935546875, "global_step": 408176, "epoch": 2429} {"train_loss": -10.853886604309082, "global_step": 408177, "epoch": 2429} {"train_loss": -11.730977058410645, "global_step": 408178, "epoch": 2429} {"train_loss": -11.903276443481445, "global_step": 408179, "epoch": 2429} {"train_loss": -11.707508087158203, "global_step": 408180, "epoch": 2429} {"train_loss": -11.93542766571045, "global_step": 408181, "epoch": 2429} {"train_loss": -11.55341911315918, "global_step": 408182, "epoch": 2429} {"train_loss": -11.770484924316406, "global_step": 408183, "epoch": 2429} {"train_loss": -11.645334243774414, "global_step": 408184, "epoch": 2429} {"train_loss": -11.724160194396973, "global_step": 408185, "epoch": 2429} {"train_loss": -12.042015075683594, "global_step": 408186, "epoch": 2429} {"train_loss": -11.941826820373535, "global_step": 408187, "epoch": 2429} {"train_loss": -12.087026596069336, "global_step": 408188, "epoch": 2429} {"train_loss": -12.132009506225586, "global_step": 408189, "epoch": 2429} {"train_loss": -11.78851318359375, "global_step": 408190, "epoch": 2429} {"train_loss": -11.951224327087402, "global_step": 408191, "epoch": 2429} {"train_loss": -11.831642150878906, "global_step": 408192, "epoch": 2429} {"train_loss": -12.34900188446045, "global_step": 408193, "epoch": 2429} {"train_loss": -12.217265129089355, "global_step": 408194, "epoch": 2429} {"train_loss": -11.943109512329102, "global_step": 408195, "epoch": 2429} {"train_loss": -12.170660018920898, "global_step": 408196, "epoch": 2429} {"train_loss": -11.886957168579102, "global_step": 408197, "epoch": 2429} {"train_loss": -12.379302024841309, "global_step": 408198, "epoch": 2429} {"train_loss": -12.152505874633789, "global_step": 408199, "epoch": 2429} {"train_loss": -12.249759674072266, "global_step": 408200, "epoch": 2429} {"train_loss": -12.044424057006836, "global_step": 408201, "epoch": 2429} {"train_loss": -12.114014625549316, "global_step": 408202, "epoch": 2429} {"train_loss": -12.167871475219727, "global_step": 408203, "epoch": 2429} {"train_loss": -12.050283432006836, "global_step": 408204, "epoch": 2429} {"train_loss": -12.136658668518066, "global_step": 408205, "epoch": 2429} {"train_loss": -12.127036094665527, "global_step": 408206, "epoch": 2429} {"train_loss": -12.220247268676758, "global_step": 408207, "epoch": 2429} {"train_loss": -12.210735321044922, "global_step": 408208, "epoch": 2429} {"train_loss": -12.301148414611816, "global_step": 408209, "epoch": 2429} {"train_loss": -12.331716537475586, "global_step": 408210, "epoch": 2429} {"train_loss": -12.115631103515625, "global_step": 408211, "epoch": 2429} {"train_loss": -12.236234664916992, "global_step": 408212, "epoch": 2429} {"train_loss": -11.947161674499512, "global_step": 408213, "epoch": 2429} {"train_loss": -12.026700973510742, "global_step": 408214, "epoch": 2429} {"train_loss": -12.152539253234863, "global_step": 408215, "epoch": 2429} {"train_loss": -12.409232139587402, "global_step": 408216, "epoch": 2429} {"train_loss": -12.115440368652344, "global_step": 408217, "epoch": 2429} {"train_loss": -12.500954627990723, "global_step": 408218, "epoch": 2429} {"train_loss": -12.422219276428223, "global_step": 408219, "epoch": 2429} {"train_loss": -12.34449577331543, "global_step": 408220, "epoch": 2429} {"train_loss": -12.28606128692627, "global_step": 408221, "epoch": 2429} {"train_loss": -12.465256690979004, "global_step": 408222, "epoch": 2429} {"train_loss": -12.158177375793457, "global_step": 408223, "epoch": 2429} {"train_loss": -12.448076248168945, "global_step": 408224, "epoch": 2429} {"train_loss": -12.49740982055664, "global_step": 408225, "epoch": 2429} {"train_loss": -12.691095352172852, "global_step": 408226, "epoch": 2429} {"train_loss": -12.55432415008545, "global_step": 408227, "epoch": 2429} {"train_loss": -12.51667594909668, "global_step": 408228, "epoch": 2429} {"train_loss": -12.517812728881836, "global_step": 408229, "epoch": 2429} {"train_loss": -12.744306564331055, "global_step": 408230, "epoch": 2429} {"train_loss": -12.500038146972656, "global_step": 408231, "epoch": 2429} {"train_loss": -12.706133842468262, "global_step": 408232, "epoch": 2429} {"train_loss": -12.482995986938477, "global_step": 408233, "epoch": 2429} {"train_loss": -12.487102508544922, "global_step": 408234, "epoch": 2429} {"train_loss": -12.41728401184082, "global_step": 408235, "epoch": 2429} {"train_loss": -12.497413635253906, "global_step": 408236, "epoch": 2429} {"train_loss": -12.410054206848145, "global_step": 408237, "epoch": 2429} {"train_loss": -12.47691822052002, "global_step": 408238, "epoch": 2429} {"train_loss": -11.816649556159973, "global_step": 408239, "epoch": 2429, "val_loss": 295950.6875} {"train_loss": -12.691010475158691, "global_step": 408240, "epoch": 2430} {"train_loss": -12.489316940307617, "global_step": 408241, "epoch": 2430} {"train_loss": -12.112252235412598, "global_step": 408242, "epoch": 2430} {"train_loss": -12.62820053100586, "global_step": 408243, "epoch": 2430} {"train_loss": -12.41592788696289, "global_step": 408244, "epoch": 2430} {"train_loss": -12.22903823852539, "global_step": 408245, "epoch": 2430} {"train_loss": -12.363458633422852, "global_step": 408246, "epoch": 2430} {"train_loss": -12.475461959838867, "global_step": 408247, "epoch": 2430} {"train_loss": -12.430158615112305, "global_step": 408248, "epoch": 2430} {"train_loss": -12.429243087768555, "global_step": 408249, "epoch": 2430} {"train_loss": -12.556543350219727, "global_step": 408250, "epoch": 2430} {"train_loss": -12.25986099243164, "global_step": 408251, "epoch": 2430} {"train_loss": -12.729207038879395, "global_step": 408252, "epoch": 2430} {"train_loss": -12.606830596923828, "global_step": 408253, "epoch": 2430} {"train_loss": -12.400310516357422, "global_step": 408254, "epoch": 2430} {"train_loss": -12.292903900146484, "global_step": 408255, "epoch": 2430} {"train_loss": -12.553569793701172, "global_step": 408256, "epoch": 2430} {"train_loss": -12.407586097717285, "global_step": 408257, "epoch": 2430} {"train_loss": -11.954201698303223, "global_step": 408258, "epoch": 2430} {"train_loss": -12.156932830810547, "global_step": 408259, "epoch": 2430} {"train_loss": -11.894292831420898, "global_step": 408260, "epoch": 2430} {"train_loss": -12.48314380645752, "global_step": 408261, "epoch": 2430} {"train_loss": -12.372088432312012, "global_step": 408262, "epoch": 2430} {"train_loss": -12.164636611938477, "global_step": 408263, "epoch": 2430} {"train_loss": -12.564212799072266, "global_step": 408264, "epoch": 2430} {"train_loss": -11.818364143371582, "global_step": 408265, "epoch": 2430} {"train_loss": -12.161893844604492, "global_step": 408266, "epoch": 2430} {"train_loss": -12.086777687072754, "global_step": 408267, "epoch": 2430} {"train_loss": -12.738042831420898, "global_step": 408268, "epoch": 2430} {"train_loss": -12.486944198608398, "global_step": 408269, "epoch": 2430} {"train_loss": -12.483906745910645, "global_step": 408270, "epoch": 2430} {"train_loss": -12.383954048156738, "global_step": 408271, "epoch": 2430} {"train_loss": -12.43032455444336, "global_step": 408272, "epoch": 2430} {"train_loss": -12.279098510742188, "global_step": 408273, "epoch": 2430} {"train_loss": -12.2854585647583, "global_step": 408274, "epoch": 2430} {"train_loss": -12.598804473876953, "global_step": 408275, "epoch": 2430} {"train_loss": -12.454513549804688, "global_step": 408276, "epoch": 2430} {"train_loss": -12.485677719116211, "global_step": 408277, "epoch": 2430} {"train_loss": -11.851003646850586, "global_step": 408278, "epoch": 2430} {"train_loss": -12.631348609924316, "global_step": 408279, "epoch": 2430} {"train_loss": -12.522279739379883, "global_step": 408280, "epoch": 2430} {"train_loss": -12.144891738891602, "global_step": 408281, "epoch": 2430} {"train_loss": -12.275073051452637, "global_step": 408282, "epoch": 2430} {"train_loss": -11.981367111206055, "global_step": 408283, "epoch": 2430} {"train_loss": -11.435970306396484, "global_step": 408284, "epoch": 2430} {"train_loss": -11.787677764892578, "global_step": 408285, "epoch": 2430} {"train_loss": -12.635986328125, "global_step": 408286, "epoch": 2430} {"train_loss": -12.226612091064453, "global_step": 408287, "epoch": 2430} {"train_loss": -11.97734546661377, "global_step": 408288, "epoch": 2430} {"train_loss": -12.163530349731445, "global_step": 408289, "epoch": 2430} {"train_loss": -12.28343677520752, "global_step": 408290, "epoch": 2430} {"train_loss": -12.11181640625, "global_step": 408291, "epoch": 2430} {"train_loss": -12.33753776550293, "global_step": 408292, "epoch": 2430} {"train_loss": -12.391824722290039, "global_step": 408293, "epoch": 2430} {"train_loss": -12.314336776733398, "global_step": 408294, "epoch": 2430} {"train_loss": -11.809564590454102, "global_step": 408295, "epoch": 2430} {"train_loss": -12.501656532287598, "global_step": 408296, "epoch": 2430} {"train_loss": -12.420671463012695, "global_step": 408297, "epoch": 2430} {"train_loss": -12.410551071166992, "global_step": 408298, "epoch": 2430} {"train_loss": -12.255138397216797, "global_step": 408299, "epoch": 2430} {"train_loss": -12.01701545715332, "global_step": 408300, "epoch": 2430} {"train_loss": -11.91897201538086, "global_step": 408301, "epoch": 2430} {"train_loss": -11.95466423034668, "global_step": 408302, "epoch": 2430} {"train_loss": -11.772804260253906, "global_step": 408303, "epoch": 2430} {"train_loss": -11.096992492675781, "global_step": 408304, "epoch": 2430} {"train_loss": -10.31643295288086, "global_step": 408305, "epoch": 2430} {"train_loss": -11.013459205627441, "global_step": 408306, "epoch": 2430} {"train_loss": -11.302173614501953, "global_step": 408307, "epoch": 2430} {"train_loss": -10.40561294555664, "global_step": 408308, "epoch": 2430} {"train_loss": -10.907539367675781, "global_step": 408309, "epoch": 2430} {"train_loss": -10.343254089355469, "global_step": 408310, "epoch": 2430} {"train_loss": -10.180810928344727, "global_step": 408311, "epoch": 2430} {"train_loss": -11.196966171264648, "global_step": 408312, "epoch": 2430} {"train_loss": -10.896522521972656, "global_step": 408313, "epoch": 2430} {"train_loss": -11.353763580322266, "global_step": 408314, "epoch": 2430} {"train_loss": -11.06462287902832, "global_step": 408315, "epoch": 2430} {"train_loss": -12.178863525390625, "global_step": 408316, "epoch": 2430} {"train_loss": -11.442726135253906, "global_step": 408317, "epoch": 2430} {"train_loss": -11.668031692504883, "global_step": 408318, "epoch": 2430} {"train_loss": -11.508907318115234, "global_step": 408319, "epoch": 2430} {"train_loss": -11.0888090133667, "global_step": 408320, "epoch": 2430} {"train_loss": -11.153430938720703, "global_step": 408321, "epoch": 2430} {"train_loss": -10.986557006835938, "global_step": 408322, "epoch": 2430} {"train_loss": -11.349177360534668, "global_step": 408323, "epoch": 2430} {"train_loss": -11.250578880310059, "global_step": 408324, "epoch": 2430} {"train_loss": -11.26192855834961, "global_step": 408325, "epoch": 2430} {"train_loss": -11.425065040588379, "global_step": 408326, "epoch": 2430} {"train_loss": -10.720381736755371, "global_step": 408327, "epoch": 2430} {"train_loss": -11.943584442138672, "global_step": 408328, "epoch": 2430} {"train_loss": -10.576986312866211, "global_step": 408329, "epoch": 2430} {"train_loss": -11.176252365112305, "global_step": 408330, "epoch": 2430} {"train_loss": -11.108747482299805, "global_step": 408331, "epoch": 2430} {"train_loss": -10.996435165405273, "global_step": 408332, "epoch": 2430} {"train_loss": -10.751029014587402, "global_step": 408333, "epoch": 2430} {"train_loss": -11.195079803466797, "global_step": 408334, "epoch": 2430} {"train_loss": -10.696932792663574, "global_step": 408335, "epoch": 2430} {"train_loss": -11.401398658752441, "global_step": 408336, "epoch": 2430} {"train_loss": -10.797242164611816, "global_step": 408337, "epoch": 2430} {"train_loss": -11.90768814086914, "global_step": 408338, "epoch": 2430} {"train_loss": -10.72249698638916, "global_step": 408339, "epoch": 2430} {"train_loss": -11.911483764648438, "global_step": 408340, "epoch": 2430} {"train_loss": -11.367996215820312, "global_step": 408341, "epoch": 2430} {"train_loss": -11.993825912475586, "global_step": 408342, "epoch": 2430} {"train_loss": -11.462855339050293, "global_step": 408343, "epoch": 2430} {"train_loss": -11.539508819580078, "global_step": 408344, "epoch": 2430} {"train_loss": -12.000280380249023, "global_step": 408345, "epoch": 2430} {"train_loss": -11.936800956726074, "global_step": 408346, "epoch": 2430} {"train_loss": -11.782563209533691, "global_step": 408347, "epoch": 2430} {"train_loss": -12.353731155395508, "global_step": 408348, "epoch": 2430} {"train_loss": -11.669628143310547, "global_step": 408349, "epoch": 2430} {"train_loss": -12.098783493041992, "global_step": 408350, "epoch": 2430} {"train_loss": -11.376410484313965, "global_step": 408351, "epoch": 2430} {"train_loss": -11.926599502563477, "global_step": 408352, "epoch": 2430} {"train_loss": -11.39151382446289, "global_step": 408353, "epoch": 2430} {"train_loss": -12.245088577270508, "global_step": 408354, "epoch": 2430} {"train_loss": -11.693046569824219, "global_step": 408355, "epoch": 2430} {"train_loss": -11.68590259552002, "global_step": 408356, "epoch": 2430} {"train_loss": -11.91574478149414, "global_step": 408357, "epoch": 2430} {"train_loss": -11.9771728515625, "global_step": 408358, "epoch": 2430} {"train_loss": -12.070075988769531, "global_step": 408359, "epoch": 2430} {"train_loss": -12.17711067199707, "global_step": 408360, "epoch": 2430} {"train_loss": -12.326594352722168, "global_step": 408361, "epoch": 2430} {"train_loss": -12.218562126159668, "global_step": 408362, "epoch": 2430} {"train_loss": -12.255019187927246, "global_step": 408363, "epoch": 2430} {"train_loss": -12.152582168579102, "global_step": 408364, "epoch": 2430} {"train_loss": -12.345075607299805, "global_step": 408365, "epoch": 2430} {"train_loss": -12.092601776123047, "global_step": 408366, "epoch": 2430} {"train_loss": -12.46847152709961, "global_step": 408367, "epoch": 2430} {"train_loss": -12.147754669189453, "global_step": 408368, "epoch": 2430} {"train_loss": -12.479206085205078, "global_step": 408369, "epoch": 2430} {"train_loss": -12.098429679870605, "global_step": 408370, "epoch": 2430} {"train_loss": -12.494148254394531, "global_step": 408371, "epoch": 2430} {"train_loss": -12.270439147949219, "global_step": 408372, "epoch": 2430} {"train_loss": -12.466915130615234, "global_step": 408373, "epoch": 2430} {"train_loss": -12.287633895874023, "global_step": 408374, "epoch": 2430} {"train_loss": -12.173015594482422, "global_step": 408375, "epoch": 2430} {"train_loss": -12.61697769165039, "global_step": 408376, "epoch": 2430} {"train_loss": -12.288715362548828, "global_step": 408377, "epoch": 2430} {"train_loss": -12.532999038696289, "global_step": 408378, "epoch": 2430} {"train_loss": -12.530350685119629, "global_step": 408379, "epoch": 2430} {"train_loss": -12.457477569580078, "global_step": 408380, "epoch": 2430} {"train_loss": -12.52415657043457, "global_step": 408381, "epoch": 2430} {"train_loss": -12.48550033569336, "global_step": 408382, "epoch": 2430} {"train_loss": -12.433897018432617, "global_step": 408383, "epoch": 2430} {"train_loss": -12.377802848815918, "global_step": 408384, "epoch": 2430} {"train_loss": -12.535747528076172, "global_step": 408385, "epoch": 2430} {"train_loss": -12.412946701049805, "global_step": 408386, "epoch": 2430} {"train_loss": -11.851625442504883, "global_step": 408387, "epoch": 2430} {"train_loss": -12.519501686096191, "global_step": 408388, "epoch": 2430} {"train_loss": -12.078109741210938, "global_step": 408389, "epoch": 2430} {"train_loss": -12.478738784790039, "global_step": 408390, "epoch": 2430} {"train_loss": -12.38829231262207, "global_step": 408391, "epoch": 2430} {"train_loss": -11.866287231445312, "global_step": 408392, "epoch": 2430} {"train_loss": -12.240202903747559, "global_step": 408393, "epoch": 2430} {"train_loss": -12.285866737365723, "global_step": 408394, "epoch": 2430} {"train_loss": -12.34468936920166, "global_step": 408395, "epoch": 2430} {"train_loss": -12.464588165283203, "global_step": 408396, "epoch": 2430} {"train_loss": -12.440324783325195, "global_step": 408397, "epoch": 2430} {"train_loss": -12.195189476013184, "global_step": 408398, "epoch": 2430} {"train_loss": -12.299848556518555, "global_step": 408399, "epoch": 2430} {"train_loss": -11.917213439941406, "global_step": 408400, "epoch": 2430} {"train_loss": -12.269426345825195, "global_step": 408401, "epoch": 2430} {"train_loss": -12.440446853637695, "global_step": 408402, "epoch": 2430} {"train_loss": -12.35507583618164, "global_step": 408403, "epoch": 2430} {"train_loss": -12.182409286499023, "global_step": 408404, "epoch": 2430} {"train_loss": -12.494348526000977, "global_step": 408405, "epoch": 2430} {"train_loss": -12.45421314239502, "global_step": 408406, "epoch": 2430} {"train_loss": -11.986739067804246, "global_step": 408407, "epoch": 2430, "val_loss": 296444.78125, "train_action_mse_error": 1.41829514503479} {"train_loss": -12.385188102722168, "global_step": 408408, "epoch": 2431} {"train_loss": -12.300518035888672, "global_step": 408409, "epoch": 2431} {"train_loss": -12.653270721435547, "global_step": 408410, "epoch": 2431} {"train_loss": -12.247203826904297, "global_step": 408411, "epoch": 2431} {"train_loss": -12.453299522399902, "global_step": 408412, "epoch": 2431} {"train_loss": -12.16097354888916, "global_step": 408413, "epoch": 2431} {"train_loss": -11.6547269821167, "global_step": 408414, "epoch": 2431} {"train_loss": -12.481292724609375, "global_step": 408415, "epoch": 2431} {"train_loss": -11.674335479736328, "global_step": 408416, "epoch": 2431} {"train_loss": -11.253250122070312, "global_step": 408417, "epoch": 2431} {"train_loss": -12.555593490600586, "global_step": 408418, "epoch": 2431} {"train_loss": -11.819281578063965, "global_step": 408419, "epoch": 2431} {"train_loss": -12.28091049194336, "global_step": 408420, "epoch": 2431} {"train_loss": -12.275400161743164, "global_step": 408421, "epoch": 2431} {"train_loss": -11.785589218139648, "global_step": 408422, "epoch": 2431} {"train_loss": -11.66128158569336, "global_step": 408423, "epoch": 2431} {"train_loss": -12.244462966918945, "global_step": 408424, "epoch": 2431} {"train_loss": -12.043773651123047, "global_step": 408425, "epoch": 2431} {"train_loss": -11.437057495117188, "global_step": 408426, "epoch": 2431} {"train_loss": -11.940756797790527, "global_step": 408427, "epoch": 2431} {"train_loss": -11.984920501708984, "global_step": 408428, "epoch": 2431} {"train_loss": -11.343891143798828, "global_step": 408429, "epoch": 2431} {"train_loss": -12.079303741455078, "global_step": 408430, "epoch": 2431} {"train_loss": -11.566638946533203, "global_step": 408431, "epoch": 2431} {"train_loss": -12.173917770385742, "global_step": 408432, "epoch": 2431} {"train_loss": -11.839418411254883, "global_step": 408433, "epoch": 2431} {"train_loss": -11.686347961425781, "global_step": 408434, "epoch": 2431} {"train_loss": -12.028188705444336, "global_step": 408435, "epoch": 2431} {"train_loss": -12.567512512207031, "global_step": 408436, "epoch": 2431} {"train_loss": -11.963617324829102, "global_step": 408437, "epoch": 2431} {"train_loss": -12.153512954711914, "global_step": 408438, "epoch": 2431} {"train_loss": -12.282491683959961, "global_step": 408439, "epoch": 2431} {"train_loss": -12.493189811706543, "global_step": 408440, "epoch": 2431} {"train_loss": -12.003986358642578, "global_step": 408441, "epoch": 2431} {"train_loss": -12.564361572265625, "global_step": 408442, "epoch": 2431} {"train_loss": -12.224411010742188, "global_step": 408443, "epoch": 2431} {"train_loss": -12.297538757324219, "global_step": 408444, "epoch": 2431} {"train_loss": -12.228918075561523, "global_step": 408445, "epoch": 2431} {"train_loss": -12.368803024291992, "global_step": 408446, "epoch": 2431} {"train_loss": -12.185380935668945, "global_step": 408447, "epoch": 2431} {"train_loss": -12.357646942138672, "global_step": 408448, "epoch": 2431} {"train_loss": -12.127826690673828, "global_step": 408449, "epoch": 2431} {"train_loss": -11.92899227142334, "global_step": 408450, "epoch": 2431} {"train_loss": -12.152250289916992, "global_step": 408451, "epoch": 2431} {"train_loss": -12.162294387817383, "global_step": 408452, "epoch": 2431} {"train_loss": -12.186639785766602, "global_step": 408453, "epoch": 2431} {"train_loss": -11.879222869873047, "global_step": 408454, "epoch": 2431} {"train_loss": -11.493704795837402, "global_step": 408455, "epoch": 2431} {"train_loss": -12.383366584777832, "global_step": 408456, "epoch": 2431} {"train_loss": -11.676424980163574, "global_step": 408457, "epoch": 2431} {"train_loss": -12.203095436096191, "global_step": 408458, "epoch": 2431} {"train_loss": -11.626152038574219, "global_step": 408459, "epoch": 2431} {"train_loss": -12.055563926696777, "global_step": 408460, "epoch": 2431} {"train_loss": -11.901266098022461, "global_step": 408461, "epoch": 2431} {"train_loss": -11.999069213867188, "global_step": 408462, "epoch": 2431} {"train_loss": -11.426567077636719, "global_step": 408463, "epoch": 2431} {"train_loss": -12.061718940734863, "global_step": 408464, "epoch": 2431} {"train_loss": -11.540838241577148, "global_step": 408465, "epoch": 2431} {"train_loss": -11.885515213012695, "global_step": 408466, "epoch": 2431} {"train_loss": -12.114023208618164, "global_step": 408467, "epoch": 2431} {"train_loss": -11.039926528930664, "global_step": 408468, "epoch": 2431} {"train_loss": -12.10274600982666, "global_step": 408469, "epoch": 2431} {"train_loss": -11.308504104614258, "global_step": 408470, "epoch": 2431} {"train_loss": -12.200335502624512, "global_step": 408471, "epoch": 2431} {"train_loss": -11.702472686767578, "global_step": 408472, "epoch": 2431} {"train_loss": -12.103971481323242, "global_step": 408473, "epoch": 2431} {"train_loss": -11.941902160644531, "global_step": 408474, "epoch": 2431} {"train_loss": -12.052175521850586, "global_step": 408475, "epoch": 2431} {"train_loss": -10.533856391906738, "global_step": 408476, "epoch": 2431} {"train_loss": -11.937150001525879, "global_step": 408477, "epoch": 2431} {"train_loss": -9.032569885253906, "global_step": 408478, "epoch": 2431} {"train_loss": -11.895401954650879, "global_step": 408479, "epoch": 2431} {"train_loss": -7.912051200866699, "global_step": 408480, "epoch": 2431} {"train_loss": -10.662981033325195, "global_step": 408481, "epoch": 2431} {"train_loss": -7.3302202224731445, "global_step": 408482, "epoch": 2431} {"train_loss": -7.573721885681152, "global_step": 408483, "epoch": 2431} {"train_loss": -7.333807468414307, "global_step": 408484, "epoch": 2431} {"train_loss": -7.802950859069824, "global_step": 408485, "epoch": 2431} {"train_loss": -8.701227188110352, "global_step": 408486, "epoch": 2431} {"train_loss": -8.771599769592285, "global_step": 408487, "epoch": 2431} {"train_loss": -10.914217948913574, "global_step": 408488, "epoch": 2431} {"train_loss": -7.3674774169921875, "global_step": 408489, "epoch": 2431} {"train_loss": -10.027482986450195, "global_step": 408490, "epoch": 2431} {"train_loss": -8.912002563476562, "global_step": 408491, "epoch": 2431} {"train_loss": -9.234039306640625, "global_step": 408492, "epoch": 2431} {"train_loss": -9.26911735534668, "global_step": 408493, "epoch": 2431} {"train_loss": -9.889986038208008, "global_step": 408494, "epoch": 2431} {"train_loss": -11.562782287597656, "global_step": 408495, "epoch": 2431} {"train_loss": -10.111981391906738, "global_step": 408496, "epoch": 2431} {"train_loss": -11.409346580505371, "global_step": 408497, "epoch": 2431} {"train_loss": -10.791231155395508, "global_step": 408498, "epoch": 2431} {"train_loss": -11.389094352722168, "global_step": 408499, "epoch": 2431} {"train_loss": -11.133264541625977, "global_step": 408500, "epoch": 2431} {"train_loss": -11.44936466217041, "global_step": 408501, "epoch": 2431} {"train_loss": -11.31793212890625, "global_step": 408502, "epoch": 2431} {"train_loss": -11.831275939941406, "global_step": 408503, "epoch": 2431} {"train_loss": -10.986745834350586, "global_step": 408504, "epoch": 2431} {"train_loss": -11.5538969039917, "global_step": 408505, "epoch": 2431} {"train_loss": -11.448312759399414, "global_step": 408506, "epoch": 2431} {"train_loss": -11.170536041259766, "global_step": 408507, "epoch": 2431} {"train_loss": -11.768465042114258, "global_step": 408508, "epoch": 2431} {"train_loss": -10.970279693603516, "global_step": 408509, "epoch": 2431} {"train_loss": -11.711795806884766, "global_step": 408510, "epoch": 2431} {"train_loss": -11.37813949584961, "global_step": 408511, "epoch": 2431} {"train_loss": -11.693929672241211, "global_step": 408512, "epoch": 2431} {"train_loss": -11.582496643066406, "global_step": 408513, "epoch": 2431} {"train_loss": -11.683259010314941, "global_step": 408514, "epoch": 2431} {"train_loss": -11.431161880493164, "global_step": 408515, "epoch": 2431} {"train_loss": -11.615890502929688, "global_step": 408516, "epoch": 2431} {"train_loss": -11.609292984008789, "global_step": 408517, "epoch": 2431} {"train_loss": -11.781883239746094, "global_step": 408518, "epoch": 2431} {"train_loss": -11.455216407775879, "global_step": 408519, "epoch": 2431} {"train_loss": -11.8751220703125, "global_step": 408520, "epoch": 2431} {"train_loss": -11.849977493286133, "global_step": 408521, "epoch": 2431} {"train_loss": -12.001214027404785, "global_step": 408522, "epoch": 2431} {"train_loss": -11.91468334197998, "global_step": 408523, "epoch": 2431} {"train_loss": -11.49738883972168, "global_step": 408524, "epoch": 2431} {"train_loss": -11.977827072143555, "global_step": 408525, "epoch": 2431} {"train_loss": -11.858888626098633, "global_step": 408526, "epoch": 2431} {"train_loss": -11.788646697998047, "global_step": 408527, "epoch": 2431} {"train_loss": -11.791651725769043, "global_step": 408528, "epoch": 2431} {"train_loss": -12.052886962890625, "global_step": 408529, "epoch": 2431} {"train_loss": -11.992525100708008, "global_step": 408530, "epoch": 2431} {"train_loss": -12.228212356567383, "global_step": 408531, "epoch": 2431} {"train_loss": -11.997944831848145, "global_step": 408532, "epoch": 2431} {"train_loss": -11.87235164642334, "global_step": 408533, "epoch": 2431} {"train_loss": -12.364033699035645, "global_step": 408534, "epoch": 2431} {"train_loss": -11.9518404006958, "global_step": 408535, "epoch": 2431} {"train_loss": -12.312714576721191, "global_step": 408536, "epoch": 2431} {"train_loss": -12.10351276397705, "global_step": 408537, "epoch": 2431} {"train_loss": -12.083288192749023, "global_step": 408538, "epoch": 2431} {"train_loss": -12.343372344970703, "global_step": 408539, "epoch": 2431} {"train_loss": -12.306699752807617, "global_step": 408540, "epoch": 2431} {"train_loss": -12.10875129699707, "global_step": 408541, "epoch": 2431} {"train_loss": -12.205475807189941, "global_step": 408542, "epoch": 2431} {"train_loss": -12.186054229736328, "global_step": 408543, "epoch": 2431} {"train_loss": -12.5460205078125, "global_step": 408544, "epoch": 2431} {"train_loss": -12.044631958007812, "global_step": 408545, "epoch": 2431} {"train_loss": -12.295661926269531, "global_step": 408546, "epoch": 2431} {"train_loss": -12.116463661193848, "global_step": 408547, "epoch": 2431} {"train_loss": -12.24421501159668, "global_step": 408548, "epoch": 2431} {"train_loss": -12.441214561462402, "global_step": 408549, "epoch": 2431} {"train_loss": -12.489151000976562, "global_step": 408550, "epoch": 2431} {"train_loss": -12.439589500427246, "global_step": 408551, "epoch": 2431} {"train_loss": -12.569046020507812, "global_step": 408552, "epoch": 2431} {"train_loss": -12.609582901000977, "global_step": 408553, "epoch": 2431} {"train_loss": -12.414051055908203, "global_step": 408554, "epoch": 2431} {"train_loss": -12.347576141357422, "global_step": 408555, "epoch": 2431} {"train_loss": -12.415876388549805, "global_step": 408556, "epoch": 2431} {"train_loss": -12.380453109741211, "global_step": 408557, "epoch": 2431} {"train_loss": -12.38877010345459, "global_step": 408558, "epoch": 2431} {"train_loss": -12.390769958496094, "global_step": 408559, "epoch": 2431} {"train_loss": -12.318997383117676, "global_step": 408560, "epoch": 2431} {"train_loss": -12.329556465148926, "global_step": 408561, "epoch": 2431} {"train_loss": -12.285415649414062, "global_step": 408562, "epoch": 2431} {"train_loss": -12.29383659362793, "global_step": 408563, "epoch": 2431} {"train_loss": -12.425078392028809, "global_step": 408564, "epoch": 2431} {"train_loss": -12.579797744750977, "global_step": 408565, "epoch": 2431} {"train_loss": -12.453300476074219, "global_step": 408566, "epoch": 2431} {"train_loss": -12.464765548706055, "global_step": 408567, "epoch": 2431} {"train_loss": -12.551647186279297, "global_step": 408568, "epoch": 2431} {"train_loss": -12.504742622375488, "global_step": 408569, "epoch": 2431} {"train_loss": -12.477520942687988, "global_step": 408570, "epoch": 2431} {"train_loss": -12.313579559326172, "global_step": 408571, "epoch": 2431} {"train_loss": -12.541936874389648, "global_step": 408572, "epoch": 2431} {"train_loss": -12.503133773803711, "global_step": 408573, "epoch": 2431} {"train_loss": -12.447662353515625, "global_step": 408574, "epoch": 2431} {"train_loss": -11.6809536360559, "global_step": 408575, "epoch": 2431, "val_loss": 298669.0625} {"train_loss": -12.383323669433594, "global_step": 408576, "epoch": 2432} {"train_loss": -12.549072265625, "global_step": 408577, "epoch": 2432} {"train_loss": -12.63809585571289, "global_step": 408578, "epoch": 2432} {"train_loss": -12.500100135803223, "global_step": 408579, "epoch": 2432} {"train_loss": -12.604991912841797, "global_step": 408580, "epoch": 2432} {"train_loss": -12.612201690673828, "global_step": 408581, "epoch": 2432} {"train_loss": -12.608705520629883, "global_step": 408582, "epoch": 2432} {"train_loss": -12.34714126586914, "global_step": 408583, "epoch": 2432} {"train_loss": -11.780606269836426, "global_step": 408584, "epoch": 2432} {"train_loss": -12.284366607666016, "global_step": 408585, "epoch": 2432} {"train_loss": -12.262162208557129, "global_step": 408586, "epoch": 2432} {"train_loss": -12.484457969665527, "global_step": 408587, "epoch": 2432} {"train_loss": -12.36890983581543, "global_step": 408588, "epoch": 2432} {"train_loss": -12.42444133758545, "global_step": 408589, "epoch": 2432} {"train_loss": -11.781930923461914, "global_step": 408590, "epoch": 2432} {"train_loss": -12.320935249328613, "global_step": 408591, "epoch": 2432} {"train_loss": -12.342317581176758, "global_step": 408592, "epoch": 2432} {"train_loss": -12.3406982421875, "global_step": 408593, "epoch": 2432} {"train_loss": -11.956932067871094, "global_step": 408594, "epoch": 2432} {"train_loss": -12.364931106567383, "global_step": 408595, "epoch": 2432} {"train_loss": -12.358524322509766, "global_step": 408596, "epoch": 2432} {"train_loss": -11.841787338256836, "global_step": 408597, "epoch": 2432} {"train_loss": -12.726591110229492, "global_step": 408598, "epoch": 2432} {"train_loss": -11.890491485595703, "global_step": 408599, "epoch": 2432} {"train_loss": -12.591607093811035, "global_step": 408600, "epoch": 2432} {"train_loss": -11.899971008300781, "global_step": 408601, "epoch": 2432} {"train_loss": -12.189018249511719, "global_step": 408602, "epoch": 2432} {"train_loss": -11.844684600830078, "global_step": 408603, "epoch": 2432} {"train_loss": -12.529260635375977, "global_step": 408604, "epoch": 2432} {"train_loss": -11.633467674255371, "global_step": 408605, "epoch": 2432} {"train_loss": -12.487268447875977, "global_step": 408606, "epoch": 2432} {"train_loss": -12.480511665344238, "global_step": 408607, "epoch": 2432} {"train_loss": -12.224586486816406, "global_step": 408608, "epoch": 2432} {"train_loss": -12.193937301635742, "global_step": 408609, "epoch": 2432} {"train_loss": -12.585260391235352, "global_step": 408610, "epoch": 2432} {"train_loss": -12.166205406188965, "global_step": 408611, "epoch": 2432} {"train_loss": -12.633514404296875, "global_step": 408612, "epoch": 2432} {"train_loss": -12.503376007080078, "global_step": 408613, "epoch": 2432} {"train_loss": -12.369635581970215, "global_step": 408614, "epoch": 2432} {"train_loss": -12.479108810424805, "global_step": 408615, "epoch": 2432} {"train_loss": -11.810768127441406, "global_step": 408616, "epoch": 2432} {"train_loss": -12.104724884033203, "global_step": 408617, "epoch": 2432} {"train_loss": -11.759794235229492, "global_step": 408618, "epoch": 2432} {"train_loss": -12.242169380187988, "global_step": 408619, "epoch": 2432} {"train_loss": -10.352940559387207, "global_step": 408620, "epoch": 2432} {"train_loss": -10.585692405700684, "global_step": 408621, "epoch": 2432} {"train_loss": -11.030098915100098, "global_step": 408622, "epoch": 2432} {"train_loss": -11.010839462280273, "global_step": 408623, "epoch": 2432} {"train_loss": -11.895553588867188, "global_step": 408624, "epoch": 2432} {"train_loss": -11.546598434448242, "global_step": 408625, "epoch": 2432} {"train_loss": -12.354227066040039, "global_step": 408626, "epoch": 2432} {"train_loss": -11.410225868225098, "global_step": 408627, "epoch": 2432} {"train_loss": -12.376049041748047, "global_step": 408628, "epoch": 2432} {"train_loss": -12.03353500366211, "global_step": 408629, "epoch": 2432} {"train_loss": -12.136414527893066, "global_step": 408630, "epoch": 2432} {"train_loss": -12.182246208190918, "global_step": 408631, "epoch": 2432} {"train_loss": -11.966835021972656, "global_step": 408632, "epoch": 2432} {"train_loss": -12.143295288085938, "global_step": 408633, "epoch": 2432} {"train_loss": -12.216926574707031, "global_step": 408634, "epoch": 2432} {"train_loss": -11.530460357666016, "global_step": 408635, "epoch": 2432} {"train_loss": -11.78628921508789, "global_step": 408636, "epoch": 2432} {"train_loss": -11.844964027404785, "global_step": 408637, "epoch": 2432} {"train_loss": -11.91147232055664, "global_step": 408638, "epoch": 2432} {"train_loss": -12.094881057739258, "global_step": 408639, "epoch": 2432} {"train_loss": -12.433764457702637, "global_step": 408640, "epoch": 2432} {"train_loss": -12.137188911437988, "global_step": 408641, "epoch": 2432} {"train_loss": -12.47638988494873, "global_step": 408642, "epoch": 2432} {"train_loss": -12.390820503234863, "global_step": 408643, "epoch": 2432} {"train_loss": -12.284567832946777, "global_step": 408644, "epoch": 2432} {"train_loss": -11.935230255126953, "global_step": 408645, "epoch": 2432} {"train_loss": -12.359585762023926, "global_step": 408646, "epoch": 2432} {"train_loss": -12.310408592224121, "global_step": 408647, "epoch": 2432} {"train_loss": -12.564157485961914, "global_step": 408648, "epoch": 2432} {"train_loss": -12.416679382324219, "global_step": 408649, "epoch": 2432} {"train_loss": -12.360610961914062, "global_step": 408650, "epoch": 2432} {"train_loss": -12.059661865234375, "global_step": 408651, "epoch": 2432} {"train_loss": -12.135639190673828, "global_step": 408652, "epoch": 2432} {"train_loss": -11.916258811950684, "global_step": 408653, "epoch": 2432} {"train_loss": -12.521903991699219, "global_step": 408654, "epoch": 2432} {"train_loss": -11.582914352416992, "global_step": 408655, "epoch": 2432} {"train_loss": -12.166532516479492, "global_step": 408656, "epoch": 2432} {"train_loss": -12.30677604675293, "global_step": 408657, "epoch": 2432} {"train_loss": -11.832120895385742, "global_step": 408658, "epoch": 2432} {"train_loss": -12.385974884033203, "global_step": 408659, "epoch": 2432} {"train_loss": -12.472709655761719, "global_step": 408660, "epoch": 2432} {"train_loss": -12.421175956726074, "global_step": 408661, "epoch": 2432} {"train_loss": -12.349876403808594, "global_step": 408662, "epoch": 2432} {"train_loss": -12.279037475585938, "global_step": 408663, "epoch": 2432} {"train_loss": -12.212779998779297, "global_step": 408664, "epoch": 2432} {"train_loss": -11.45525074005127, "global_step": 408665, "epoch": 2432} {"train_loss": -12.408687591552734, "global_step": 408666, "epoch": 2432} {"train_loss": -11.667089462280273, "global_step": 408667, "epoch": 2432} {"train_loss": -12.218221664428711, "global_step": 408668, "epoch": 2432} {"train_loss": -12.180133819580078, "global_step": 408669, "epoch": 2432} {"train_loss": -12.107505798339844, "global_step": 408670, "epoch": 2432} {"train_loss": -12.495240211486816, "global_step": 408671, "epoch": 2432} {"train_loss": -12.46030330657959, "global_step": 408672, "epoch": 2432} {"train_loss": -11.867571830749512, "global_step": 408673, "epoch": 2432} {"train_loss": -12.680887222290039, "global_step": 408674, "epoch": 2432} {"train_loss": -12.120177268981934, "global_step": 408675, "epoch": 2432} {"train_loss": -12.575156211853027, "global_step": 408676, "epoch": 2432} {"train_loss": -12.430950164794922, "global_step": 408677, "epoch": 2432} {"train_loss": -12.470537185668945, "global_step": 408678, "epoch": 2432} {"train_loss": -12.55025577545166, "global_step": 408679, "epoch": 2432} {"train_loss": -12.579258918762207, "global_step": 408680, "epoch": 2432} {"train_loss": -12.370849609375, "global_step": 408681, "epoch": 2432} {"train_loss": -12.546802520751953, "global_step": 408682, "epoch": 2432} {"train_loss": -12.463628768920898, "global_step": 408683, "epoch": 2432} {"train_loss": -12.39142894744873, "global_step": 408684, "epoch": 2432} {"train_loss": -12.554025650024414, "global_step": 408685, "epoch": 2432} {"train_loss": -12.161694526672363, "global_step": 408686, "epoch": 2432} {"train_loss": -12.400079727172852, "global_step": 408687, "epoch": 2432} {"train_loss": -12.428302764892578, "global_step": 408688, "epoch": 2432} {"train_loss": -12.282427787780762, "global_step": 408689, "epoch": 2432} {"train_loss": -12.40184211730957, "global_step": 408690, "epoch": 2432} {"train_loss": -12.619338989257812, "global_step": 408691, "epoch": 2432} {"train_loss": -12.181642532348633, "global_step": 408692, "epoch": 2432} {"train_loss": -12.303276062011719, "global_step": 408693, "epoch": 2432} {"train_loss": -12.25585651397705, "global_step": 408694, "epoch": 2432} {"train_loss": -11.903403282165527, "global_step": 408695, "epoch": 2432} {"train_loss": -11.588027954101562, "global_step": 408696, "epoch": 2432} {"train_loss": -11.54289436340332, "global_step": 408697, "epoch": 2432} {"train_loss": -11.379704475402832, "global_step": 408698, "epoch": 2432} {"train_loss": -11.416614532470703, "global_step": 408699, "epoch": 2432} {"train_loss": -10.695512771606445, "global_step": 408700, "epoch": 2432} {"train_loss": -11.828283309936523, "global_step": 408701, "epoch": 2432} {"train_loss": -10.344690322875977, "global_step": 408702, "epoch": 2432} {"train_loss": -11.467527389526367, "global_step": 408703, "epoch": 2432} {"train_loss": -11.744027137756348, "global_step": 408704, "epoch": 2432} {"train_loss": -11.65925121307373, "global_step": 408705, "epoch": 2432} {"train_loss": -11.117757797241211, "global_step": 408706, "epoch": 2432} {"train_loss": -11.981902122497559, "global_step": 408707, "epoch": 2432} {"train_loss": -11.80921459197998, "global_step": 408708, "epoch": 2432} {"train_loss": -12.041357040405273, "global_step": 408709, "epoch": 2432} {"train_loss": -12.039508819580078, "global_step": 408710, "epoch": 2432} {"train_loss": -11.642894744873047, "global_step": 408711, "epoch": 2432} {"train_loss": -12.202202796936035, "global_step": 408712, "epoch": 2432} {"train_loss": -11.865628242492676, "global_step": 408713, "epoch": 2432} {"train_loss": -11.747557640075684, "global_step": 408714, "epoch": 2432} {"train_loss": -12.019144058227539, "global_step": 408715, "epoch": 2432} {"train_loss": -12.056709289550781, "global_step": 408716, "epoch": 2432} {"train_loss": -11.912005424499512, "global_step": 408717, "epoch": 2432} {"train_loss": -12.5464448928833, "global_step": 408718, "epoch": 2432} {"train_loss": -12.178910255432129, "global_step": 408719, "epoch": 2432} {"train_loss": -12.469795227050781, "global_step": 408720, "epoch": 2432} {"train_loss": -12.039617538452148, "global_step": 408721, "epoch": 2432} {"train_loss": -12.453130722045898, "global_step": 408722, "epoch": 2432} {"train_loss": -12.263474464416504, "global_step": 408723, "epoch": 2432} {"train_loss": -12.378583908081055, "global_step": 408724, "epoch": 2432} {"train_loss": -12.17648983001709, "global_step": 408725, "epoch": 2432} {"train_loss": -12.263338088989258, "global_step": 408726, "epoch": 2432} {"train_loss": -12.415810585021973, "global_step": 408727, "epoch": 2432} {"train_loss": -12.217954635620117, "global_step": 408728, "epoch": 2432} {"train_loss": -12.57080078125, "global_step": 408729, "epoch": 2432} {"train_loss": -12.372273445129395, "global_step": 408730, "epoch": 2432} {"train_loss": -12.533260345458984, "global_step": 408731, "epoch": 2432} {"train_loss": -12.643606185913086, "global_step": 408732, "epoch": 2432} {"train_loss": -12.51756763458252, "global_step": 408733, "epoch": 2432} {"train_loss": -12.596431732177734, "global_step": 408734, "epoch": 2432} {"train_loss": -12.506872177124023, "global_step": 408735, "epoch": 2432} {"train_loss": -12.670592308044434, "global_step": 408736, "epoch": 2432} {"train_loss": -12.657726287841797, "global_step": 408737, "epoch": 2432} {"train_loss": -12.570423126220703, "global_step": 408738, "epoch": 2432} {"train_loss": -12.449100494384766, "global_step": 408739, "epoch": 2432} {"train_loss": -12.606260299682617, "global_step": 408740, "epoch": 2432} {"train_loss": -12.778836250305176, "global_step": 408741, "epoch": 2432} {"train_loss": -12.83879280090332, "global_step": 408742, "epoch": 2432} {"train_loss": -12.162366293725514, "global_step": 408743, "epoch": 2432, "val_loss": 300629.53125} {"train_loss": -12.567976951599121, "global_step": 408744, "epoch": 2433} {"train_loss": -12.513114929199219, "global_step": 408745, "epoch": 2433} {"train_loss": -12.58420181274414, "global_step": 408746, "epoch": 2433} {"train_loss": -12.759769439697266, "global_step": 408747, "epoch": 2433} {"train_loss": -12.694175720214844, "global_step": 408748, "epoch": 2433} {"train_loss": -12.886248588562012, "global_step": 408749, "epoch": 2433} {"train_loss": -12.653114318847656, "global_step": 408750, "epoch": 2433} {"train_loss": -12.580371856689453, "global_step": 408751, "epoch": 2433} {"train_loss": -12.818502426147461, "global_step": 408752, "epoch": 2433} {"train_loss": -12.846841812133789, "global_step": 408753, "epoch": 2433} {"train_loss": -12.794898986816406, "global_step": 408754, "epoch": 2433} {"train_loss": -12.904661178588867, "global_step": 408755, "epoch": 2433} {"train_loss": -12.79074478149414, "global_step": 408756, "epoch": 2433} {"train_loss": -12.94976806640625, "global_step": 408757, "epoch": 2433} {"train_loss": -12.777605056762695, "global_step": 408758, "epoch": 2433} {"train_loss": -12.78277587890625, "global_step": 408759, "epoch": 2433} {"train_loss": -12.928668975830078, "global_step": 408760, "epoch": 2433} {"train_loss": -12.628273010253906, "global_step": 408761, "epoch": 2433} {"train_loss": -12.633252143859863, "global_step": 408762, "epoch": 2433} {"train_loss": -12.69176959991455, "global_step": 408763, "epoch": 2433} {"train_loss": -12.460552215576172, "global_step": 408764, "epoch": 2433} {"train_loss": -12.085777282714844, "global_step": 408765, "epoch": 2433} {"train_loss": -12.59543228149414, "global_step": 408766, "epoch": 2433} {"train_loss": -12.505077362060547, "global_step": 408767, "epoch": 2433} {"train_loss": -12.474199295043945, "global_step": 408768, "epoch": 2433} {"train_loss": -12.177865982055664, "global_step": 408769, "epoch": 2433} {"train_loss": -11.811246871948242, "global_step": 408770, "epoch": 2433} {"train_loss": -12.486464500427246, "global_step": 408771, "epoch": 2433} {"train_loss": -12.637260437011719, "global_step": 408772, "epoch": 2433} {"train_loss": -11.703420639038086, "global_step": 408773, "epoch": 2433} {"train_loss": -12.414321899414062, "global_step": 408774, "epoch": 2433} {"train_loss": -11.938482284545898, "global_step": 408775, "epoch": 2433} {"train_loss": -11.783161163330078, "global_step": 408776, "epoch": 2433} {"train_loss": -12.367722511291504, "global_step": 408777, "epoch": 2433} {"train_loss": -12.44905948638916, "global_step": 408778, "epoch": 2433} {"train_loss": -11.722858428955078, "global_step": 408779, "epoch": 2433} {"train_loss": -12.325422286987305, "global_step": 408780, "epoch": 2433} {"train_loss": -12.09343147277832, "global_step": 408781, "epoch": 2433} {"train_loss": -11.583427429199219, "global_step": 408782, "epoch": 2433} {"train_loss": -12.160930633544922, "global_step": 408783, "epoch": 2433} {"train_loss": -11.374030113220215, "global_step": 408784, "epoch": 2433} {"train_loss": -11.860360145568848, "global_step": 408785, "epoch": 2433} {"train_loss": -11.799341201782227, "global_step": 408786, "epoch": 2433} {"train_loss": -12.061356544494629, "global_step": 408787, "epoch": 2433} {"train_loss": -11.975122451782227, "global_step": 408788, "epoch": 2433} {"train_loss": -11.939759254455566, "global_step": 408789, "epoch": 2433} {"train_loss": -10.882486343383789, "global_step": 408790, "epoch": 2433} {"train_loss": -11.846683502197266, "global_step": 408791, "epoch": 2433} {"train_loss": -11.756738662719727, "global_step": 408792, "epoch": 2433} {"train_loss": -12.58247184753418, "global_step": 408793, "epoch": 2433} {"train_loss": -12.01055908203125, "global_step": 408794, "epoch": 2433} {"train_loss": -12.17730712890625, "global_step": 408795, "epoch": 2433} {"train_loss": -11.717065811157227, "global_step": 408796, "epoch": 2433} {"train_loss": -11.949392318725586, "global_step": 408797, "epoch": 2433} {"train_loss": -11.05571174621582, "global_step": 408798, "epoch": 2433} {"train_loss": -11.27147102355957, "global_step": 408799, "epoch": 2433} {"train_loss": -10.555826187133789, "global_step": 408800, "epoch": 2433} {"train_loss": -9.158914566040039, "global_step": 408801, "epoch": 2433} {"train_loss": -10.826345443725586, "global_step": 408802, "epoch": 2433} {"train_loss": -10.647433280944824, "global_step": 408803, "epoch": 2433} {"train_loss": -10.543434143066406, "global_step": 408804, "epoch": 2433} {"train_loss": -9.286983489990234, "global_step": 408805, "epoch": 2433} {"train_loss": -9.567008972167969, "global_step": 408806, "epoch": 2433} {"train_loss": -11.136211395263672, "global_step": 408807, "epoch": 2433} {"train_loss": -8.335411071777344, "global_step": 408808, "epoch": 2433} {"train_loss": -8.933605194091797, "global_step": 408809, "epoch": 2433} {"train_loss": -8.680127143859863, "global_step": 408810, "epoch": 2433} {"train_loss": -11.277474403381348, "global_step": 408811, "epoch": 2433} {"train_loss": -9.37736701965332, "global_step": 408812, "epoch": 2433} {"train_loss": -9.392911911010742, "global_step": 408813, "epoch": 2433} {"train_loss": -9.265228271484375, "global_step": 408814, "epoch": 2433} {"train_loss": -10.202234268188477, "global_step": 408815, "epoch": 2433} {"train_loss": -9.499399185180664, "global_step": 408816, "epoch": 2433} {"train_loss": -9.712445259094238, "global_step": 408817, "epoch": 2433} {"train_loss": -10.289234161376953, "global_step": 408818, "epoch": 2433} {"train_loss": -11.67547607421875, "global_step": 408819, "epoch": 2433} {"train_loss": -8.850017547607422, "global_step": 408820, "epoch": 2433} {"train_loss": -10.193443298339844, "global_step": 408821, "epoch": 2433} {"train_loss": -10.16376781463623, "global_step": 408822, "epoch": 2433} {"train_loss": -9.747610092163086, "global_step": 408823, "epoch": 2433} {"train_loss": -10.188156127929688, "global_step": 408824, "epoch": 2433} {"train_loss": -11.253564834594727, "global_step": 408825, "epoch": 2433} {"train_loss": -10.68832778930664, "global_step": 408826, "epoch": 2433} {"train_loss": -10.096309661865234, "global_step": 408827, "epoch": 2433} {"train_loss": -11.172382354736328, "global_step": 408828, "epoch": 2433} {"train_loss": -11.157793045043945, "global_step": 408829, "epoch": 2433} {"train_loss": -10.707117080688477, "global_step": 408830, "epoch": 2433} {"train_loss": -11.989696502685547, "global_step": 408831, "epoch": 2433} {"train_loss": -11.760228157043457, "global_step": 408832, "epoch": 2433} {"train_loss": -11.226743698120117, "global_step": 408833, "epoch": 2433} {"train_loss": -10.904617309570312, "global_step": 408834, "epoch": 2433} {"train_loss": -11.573100090026855, "global_step": 408835, "epoch": 2433} {"train_loss": -11.17540168762207, "global_step": 408836, "epoch": 2433} {"train_loss": -11.923517227172852, "global_step": 408837, "epoch": 2433} {"train_loss": -12.053844451904297, "global_step": 408838, "epoch": 2433} {"train_loss": -11.600255966186523, "global_step": 408839, "epoch": 2433} {"train_loss": -12.032679557800293, "global_step": 408840, "epoch": 2433} {"train_loss": -12.29133415222168, "global_step": 408841, "epoch": 2433} {"train_loss": -11.536373138427734, "global_step": 408842, "epoch": 2433} {"train_loss": -12.004532814025879, "global_step": 408843, "epoch": 2433} {"train_loss": -12.247023582458496, "global_step": 408844, "epoch": 2433} {"train_loss": -11.59221076965332, "global_step": 408845, "epoch": 2433} {"train_loss": -12.060368537902832, "global_step": 408846, "epoch": 2433} {"train_loss": -11.748764991760254, "global_step": 408847, "epoch": 2433} {"train_loss": -11.979329109191895, "global_step": 408848, "epoch": 2433} {"train_loss": -12.082036972045898, "global_step": 408849, "epoch": 2433} {"train_loss": -12.137704849243164, "global_step": 408850, "epoch": 2433} {"train_loss": -11.75991439819336, "global_step": 408851, "epoch": 2433} {"train_loss": -12.204885482788086, "global_step": 408852, "epoch": 2433} {"train_loss": -11.861915588378906, "global_step": 408853, "epoch": 2433} {"train_loss": -12.079533576965332, "global_step": 408854, "epoch": 2433} {"train_loss": -12.240272521972656, "global_step": 408855, "epoch": 2433} {"train_loss": -12.037631034851074, "global_step": 408856, "epoch": 2433} {"train_loss": -12.162562370300293, "global_step": 408857, "epoch": 2433} {"train_loss": -12.065206527709961, "global_step": 408858, "epoch": 2433} {"train_loss": -12.222541809082031, "global_step": 408859, "epoch": 2433} {"train_loss": -12.021169662475586, "global_step": 408860, "epoch": 2433} {"train_loss": -12.2011137008667, "global_step": 408861, "epoch": 2433} {"train_loss": -11.810759544372559, "global_step": 408862, "epoch": 2433} {"train_loss": -12.168832778930664, "global_step": 408863, "epoch": 2433} {"train_loss": -11.923498153686523, "global_step": 408864, "epoch": 2433} {"train_loss": -12.259124755859375, "global_step": 408865, "epoch": 2433} {"train_loss": -12.043557167053223, "global_step": 408866, "epoch": 2433} {"train_loss": -12.143632888793945, "global_step": 408867, "epoch": 2433} {"train_loss": -12.291913986206055, "global_step": 408868, "epoch": 2433} {"train_loss": -11.828653335571289, "global_step": 408869, "epoch": 2433} {"train_loss": -12.362871170043945, "global_step": 408870, "epoch": 2433} {"train_loss": -12.085506439208984, "global_step": 408871, "epoch": 2433} {"train_loss": -12.209310531616211, "global_step": 408872, "epoch": 2433} {"train_loss": -11.810354232788086, "global_step": 408873, "epoch": 2433} {"train_loss": -11.564847946166992, "global_step": 408874, "epoch": 2433} {"train_loss": -12.283966064453125, "global_step": 408875, "epoch": 2433} {"train_loss": -11.530350685119629, "global_step": 408876, "epoch": 2433} {"train_loss": -11.900958061218262, "global_step": 408877, "epoch": 2433} {"train_loss": -12.053817749023438, "global_step": 408878, "epoch": 2433} {"train_loss": -11.638130187988281, "global_step": 408879, "epoch": 2433} {"train_loss": -12.180272102355957, "global_step": 408880, "epoch": 2433} {"train_loss": -11.740983963012695, "global_step": 408881, "epoch": 2433} {"train_loss": -12.368635177612305, "global_step": 408882, "epoch": 2433} {"train_loss": -11.492700576782227, "global_step": 408883, "epoch": 2433} {"train_loss": -12.421157836914062, "global_step": 408884, "epoch": 2433} {"train_loss": -12.008118629455566, "global_step": 408885, "epoch": 2433} {"train_loss": -12.521170616149902, "global_step": 408886, "epoch": 2433} {"train_loss": -12.063751220703125, "global_step": 408887, "epoch": 2433} {"train_loss": -12.350830078125, "global_step": 408888, "epoch": 2433} {"train_loss": -12.238435745239258, "global_step": 408889, "epoch": 2433} {"train_loss": -12.516422271728516, "global_step": 408890, "epoch": 2433} {"train_loss": -12.443010330200195, "global_step": 408891, "epoch": 2433} {"train_loss": -12.09837818145752, "global_step": 408892, "epoch": 2433} {"train_loss": -12.044010162353516, "global_step": 408893, "epoch": 2433} {"train_loss": -12.047698974609375, "global_step": 408894, "epoch": 2433} {"train_loss": -12.053049087524414, "global_step": 408895, "epoch": 2433} {"train_loss": -12.367073059082031, "global_step": 408896, "epoch": 2433} {"train_loss": -11.811894416809082, "global_step": 408897, "epoch": 2433} {"train_loss": -12.183506965637207, "global_step": 408898, "epoch": 2433} {"train_loss": -12.118522644042969, "global_step": 408899, "epoch": 2433} {"train_loss": -12.118205070495605, "global_step": 408900, "epoch": 2433} {"train_loss": -12.319350242614746, "global_step": 408901, "epoch": 2433} {"train_loss": -12.179230690002441, "global_step": 408902, "epoch": 2433} {"train_loss": -12.344367980957031, "global_step": 408903, "epoch": 2433} {"train_loss": -12.37944507598877, "global_step": 408904, "epoch": 2433} {"train_loss": -12.435300827026367, "global_step": 408905, "epoch": 2433} {"train_loss": -12.466194152832031, "global_step": 408906, "epoch": 2433} {"train_loss": -12.11496353149414, "global_step": 408907, "epoch": 2433} {"train_loss": -12.469524383544922, "global_step": 408908, "epoch": 2433} {"train_loss": -12.242463111877441, "global_step": 408909, "epoch": 2433} {"train_loss": -11.975101470947266, "global_step": 408910, "epoch": 2433} {"train_loss": -11.754287969498407, "global_step": 408911, "epoch": 2433, "val_loss": 305273.28125} {"train_loss": -11.903731346130371, "global_step": 408912, "epoch": 2434} {"train_loss": -12.299094200134277, "global_step": 408913, "epoch": 2434} {"train_loss": -11.879974365234375, "global_step": 408914, "epoch": 2434} {"train_loss": -12.189756393432617, "global_step": 408915, "epoch": 2434} {"train_loss": -12.017172813415527, "global_step": 408916, "epoch": 2434} {"train_loss": -12.111006736755371, "global_step": 408917, "epoch": 2434} {"train_loss": -12.030884742736816, "global_step": 408918, "epoch": 2434} {"train_loss": -12.61005687713623, "global_step": 408919, "epoch": 2434} {"train_loss": -11.485180854797363, "global_step": 408920, "epoch": 2434} {"train_loss": -11.706396102905273, "global_step": 408921, "epoch": 2434} {"train_loss": -12.272997856140137, "global_step": 408922, "epoch": 2434} {"train_loss": -11.860088348388672, "global_step": 408923, "epoch": 2434} {"train_loss": -11.869455337524414, "global_step": 408924, "epoch": 2434} {"train_loss": -12.437562942504883, "global_step": 408925, "epoch": 2434} {"train_loss": -12.27790355682373, "global_step": 408926, "epoch": 2434} {"train_loss": -12.304723739624023, "global_step": 408927, "epoch": 2434} {"train_loss": -12.34011459350586, "global_step": 408928, "epoch": 2434} {"train_loss": -12.19029426574707, "global_step": 408929, "epoch": 2434} {"train_loss": -12.443283081054688, "global_step": 408930, "epoch": 2434} {"train_loss": -12.521907806396484, "global_step": 408931, "epoch": 2434} {"train_loss": -12.481294631958008, "global_step": 408932, "epoch": 2434} {"train_loss": -12.549227714538574, "global_step": 408933, "epoch": 2434} {"train_loss": -12.466175079345703, "global_step": 408934, "epoch": 2434} {"train_loss": -12.587964057922363, "global_step": 408935, "epoch": 2434} {"train_loss": -12.582637786865234, "global_step": 408936, "epoch": 2434} {"train_loss": -12.526263236999512, "global_step": 408937, "epoch": 2434} {"train_loss": -12.692059516906738, "global_step": 408938, "epoch": 2434} {"train_loss": -12.291881561279297, "global_step": 408939, "epoch": 2434} {"train_loss": -12.63320255279541, "global_step": 408940, "epoch": 2434} {"train_loss": -12.547916412353516, "global_step": 408941, "epoch": 2434} {"train_loss": -12.560420036315918, "global_step": 408942, "epoch": 2434} {"train_loss": -12.727287292480469, "global_step": 408943, "epoch": 2434} {"train_loss": -12.744675636291504, "global_step": 408944, "epoch": 2434} {"train_loss": -12.61529541015625, "global_step": 408945, "epoch": 2434} {"train_loss": -12.40349006652832, "global_step": 408946, "epoch": 2434} {"train_loss": -12.709080696105957, "global_step": 408947, "epoch": 2434} {"train_loss": -12.769430160522461, "global_step": 408948, "epoch": 2434} {"train_loss": -12.601963996887207, "global_step": 408949, "epoch": 2434} {"train_loss": -12.803654670715332, "global_step": 408950, "epoch": 2434} {"train_loss": -12.627792358398438, "global_step": 408951, "epoch": 2434} {"train_loss": -12.415029525756836, "global_step": 408952, "epoch": 2434} {"train_loss": -12.71280288696289, "global_step": 408953, "epoch": 2434} {"train_loss": -12.684328079223633, "global_step": 408954, "epoch": 2434} {"train_loss": -12.460848808288574, "global_step": 408955, "epoch": 2434} {"train_loss": -12.533456802368164, "global_step": 408956, "epoch": 2434} {"train_loss": -12.526498794555664, "global_step": 408957, "epoch": 2434} {"train_loss": -11.761394500732422, "global_step": 408958, "epoch": 2434} {"train_loss": -12.770380020141602, "global_step": 408959, "epoch": 2434} {"train_loss": -12.058554649353027, "global_step": 408960, "epoch": 2434} {"train_loss": -11.475912094116211, "global_step": 408961, "epoch": 2434} {"train_loss": -11.164352416992188, "global_step": 408962, "epoch": 2434} {"train_loss": -12.795833587646484, "global_step": 408963, "epoch": 2434} {"train_loss": -11.535666465759277, "global_step": 408964, "epoch": 2434} {"train_loss": -12.180410385131836, "global_step": 408965, "epoch": 2434} {"train_loss": -11.968337059020996, "global_step": 408966, "epoch": 2434} {"train_loss": -12.506513595581055, "global_step": 408967, "epoch": 2434} {"train_loss": -11.471260070800781, "global_step": 408968, "epoch": 2434} {"train_loss": -11.949366569519043, "global_step": 408969, "epoch": 2434} {"train_loss": -12.03504467010498, "global_step": 408970, "epoch": 2434} {"train_loss": -10.999631881713867, "global_step": 408971, "epoch": 2434} {"train_loss": -11.536226272583008, "global_step": 408972, "epoch": 2434} {"train_loss": -12.585880279541016, "global_step": 408973, "epoch": 2434} {"train_loss": -10.7172269821167, "global_step": 408974, "epoch": 2434} {"train_loss": -11.281466484069824, "global_step": 408975, "epoch": 2434} {"train_loss": -10.851475715637207, "global_step": 408976, "epoch": 2434} {"train_loss": -11.883085250854492, "global_step": 408977, "epoch": 2434} {"train_loss": -9.71279525756836, "global_step": 408978, "epoch": 2434} {"train_loss": -11.809813499450684, "global_step": 408979, "epoch": 2434} {"train_loss": -10.961831092834473, "global_step": 408980, "epoch": 2434} {"train_loss": -10.487524032592773, "global_step": 408981, "epoch": 2434} {"train_loss": -10.201302528381348, "global_step": 408982, "epoch": 2434} {"train_loss": -11.666967391967773, "global_step": 408983, "epoch": 2434} {"train_loss": -10.41882610321045, "global_step": 408984, "epoch": 2434} {"train_loss": -8.865501403808594, "global_step": 408985, "epoch": 2434} {"train_loss": -9.88924503326416, "global_step": 408986, "epoch": 2434} {"train_loss": -11.528238296508789, "global_step": 408987, "epoch": 2434} {"train_loss": -8.713907241821289, "global_step": 408988, "epoch": 2434} {"train_loss": -10.862222671508789, "global_step": 408989, "epoch": 2434} {"train_loss": -10.64146900177002, "global_step": 408990, "epoch": 2434} {"train_loss": -10.03807258605957, "global_step": 408991, "epoch": 2434} {"train_loss": -10.78209400177002, "global_step": 408992, "epoch": 2434} {"train_loss": -10.827259063720703, "global_step": 408993, "epoch": 2434} {"train_loss": -10.05362319946289, "global_step": 408994, "epoch": 2434} {"train_loss": -10.887521743774414, "global_step": 408995, "epoch": 2434} {"train_loss": -11.477029800415039, "global_step": 408996, "epoch": 2434} {"train_loss": -11.025056838989258, "global_step": 408997, "epoch": 2434} {"train_loss": -11.92273998260498, "global_step": 408998, "epoch": 2434} {"train_loss": -11.305814743041992, "global_step": 408999, "epoch": 2434} {"train_loss": -11.1758394241333, "global_step": 409000, "epoch": 2434} {"train_loss": -11.164205551147461, "global_step": 409001, "epoch": 2434} {"train_loss": -10.73274040222168, "global_step": 409002, "epoch": 2434} {"train_loss": -10.244490623474121, "global_step": 409003, "epoch": 2434} {"train_loss": -10.645890235900879, "global_step": 409004, "epoch": 2434} {"train_loss": -11.631623268127441, "global_step": 409005, "epoch": 2434} {"train_loss": -10.674077987670898, "global_step": 409006, "epoch": 2434} {"train_loss": -11.367171287536621, "global_step": 409007, "epoch": 2434} {"train_loss": -12.149450302124023, "global_step": 409008, "epoch": 2434} {"train_loss": -11.498699188232422, "global_step": 409009, "epoch": 2434} {"train_loss": -11.826056480407715, "global_step": 409010, "epoch": 2434} {"train_loss": -11.527450561523438, "global_step": 409011, "epoch": 2434} {"train_loss": -11.815695762634277, "global_step": 409012, "epoch": 2434} {"train_loss": -12.001930236816406, "global_step": 409013, "epoch": 2434} {"train_loss": -11.984809875488281, "global_step": 409014, "epoch": 2434} {"train_loss": -12.2066068649292, "global_step": 409015, "epoch": 2434} {"train_loss": -12.271951675415039, "global_step": 409016, "epoch": 2434} {"train_loss": -12.074859619140625, "global_step": 409017, "epoch": 2434} {"train_loss": -12.334793090820312, "global_step": 409018, "epoch": 2434} {"train_loss": -12.046510696411133, "global_step": 409019, "epoch": 2434} {"train_loss": -12.34766960144043, "global_step": 409020, "epoch": 2434} {"train_loss": -12.05997371673584, "global_step": 409021, "epoch": 2434} {"train_loss": -12.235931396484375, "global_step": 409022, "epoch": 2434} {"train_loss": -12.189451217651367, "global_step": 409023, "epoch": 2434} {"train_loss": -12.19106674194336, "global_step": 409024, "epoch": 2434} {"train_loss": -12.397059440612793, "global_step": 409025, "epoch": 2434} {"train_loss": -12.229572296142578, "global_step": 409026, "epoch": 2434} {"train_loss": -11.906047821044922, "global_step": 409027, "epoch": 2434} {"train_loss": -12.269454956054688, "global_step": 409028, "epoch": 2434} {"train_loss": -12.032279968261719, "global_step": 409029, "epoch": 2434} {"train_loss": -12.067852020263672, "global_step": 409030, "epoch": 2434} {"train_loss": -12.008177757263184, "global_step": 409031, "epoch": 2434} {"train_loss": -12.17674446105957, "global_step": 409032, "epoch": 2434} {"train_loss": -12.346321105957031, "global_step": 409033, "epoch": 2434} {"train_loss": -12.12733268737793, "global_step": 409034, "epoch": 2434} {"train_loss": -12.227126121520996, "global_step": 409035, "epoch": 2434} {"train_loss": -12.076959609985352, "global_step": 409036, "epoch": 2434} {"train_loss": -12.309152603149414, "global_step": 409037, "epoch": 2434} {"train_loss": -12.159049987792969, "global_step": 409038, "epoch": 2434} {"train_loss": -12.21174430847168, "global_step": 409039, "epoch": 2434} {"train_loss": -12.464031219482422, "global_step": 409040, "epoch": 2434} {"train_loss": -12.250864028930664, "global_step": 409041, "epoch": 2434} {"train_loss": -12.281684875488281, "global_step": 409042, "epoch": 2434} {"train_loss": -12.240626335144043, "global_step": 409043, "epoch": 2434} {"train_loss": -12.175430297851562, "global_step": 409044, "epoch": 2434} {"train_loss": -12.34942626953125, "global_step": 409045, "epoch": 2434} {"train_loss": -11.9956693649292, "global_step": 409046, "epoch": 2434} {"train_loss": -12.552257537841797, "global_step": 409047, "epoch": 2434} {"train_loss": -12.118361473083496, "global_step": 409048, "epoch": 2434} {"train_loss": -12.507119178771973, "global_step": 409049, "epoch": 2434} {"train_loss": -12.455621719360352, "global_step": 409050, "epoch": 2434} {"train_loss": -12.048264503479004, "global_step": 409051, "epoch": 2434} {"train_loss": -12.550556182861328, "global_step": 409052, "epoch": 2434} {"train_loss": -12.11707878112793, "global_step": 409053, "epoch": 2434} {"train_loss": -12.493056297302246, "global_step": 409054, "epoch": 2434} {"train_loss": -12.26099967956543, "global_step": 409055, "epoch": 2434} {"train_loss": -12.501020431518555, "global_step": 409056, "epoch": 2434} {"train_loss": -12.457409858703613, "global_step": 409057, "epoch": 2434} {"train_loss": -12.27348518371582, "global_step": 409058, "epoch": 2434} {"train_loss": -12.510926246643066, "global_step": 409059, "epoch": 2434} {"train_loss": -12.257743835449219, "global_step": 409060, "epoch": 2434} {"train_loss": -12.422836303710938, "global_step": 409061, "epoch": 2434} {"train_loss": -12.331591606140137, "global_step": 409062, "epoch": 2434} {"train_loss": -12.23715877532959, "global_step": 409063, "epoch": 2434} {"train_loss": -12.556839942932129, "global_step": 409064, "epoch": 2434} {"train_loss": -12.238482475280762, "global_step": 409065, "epoch": 2434} {"train_loss": -12.387532234191895, "global_step": 409066, "epoch": 2434} {"train_loss": -12.322391510009766, "global_step": 409067, "epoch": 2434} {"train_loss": -12.441869735717773, "global_step": 409068, "epoch": 2434} {"train_loss": -12.394988059997559, "global_step": 409069, "epoch": 2434} {"train_loss": -12.050273895263672, "global_step": 409070, "epoch": 2434} {"train_loss": -12.392197608947754, "global_step": 409071, "epoch": 2434} {"train_loss": -12.161840438842773, "global_step": 409072, "epoch": 2434} {"train_loss": -12.272636413574219, "global_step": 409073, "epoch": 2434} {"train_loss": -12.750932693481445, "global_step": 409074, "epoch": 2434} {"train_loss": -12.044417381286621, "global_step": 409075, "epoch": 2434} {"train_loss": -12.099052429199219, "global_step": 409076, "epoch": 2434} {"train_loss": -12.761499404907227, "global_step": 409077, "epoch": 2434} {"train_loss": -12.578259468078613, "global_step": 409078, "epoch": 2434} {"train_loss": -11.95231328691755, "global_step": 409079, "epoch": 2434, "val_loss": 300564.84375} {"train_loss": -12.763291358947754, "global_step": 409080, "epoch": 2435} {"train_loss": -12.530542373657227, "global_step": 409081, "epoch": 2435} {"train_loss": -12.439576148986816, "global_step": 409082, "epoch": 2435} {"train_loss": -12.62044906616211, "global_step": 409083, "epoch": 2435} {"train_loss": -12.47108268737793, "global_step": 409084, "epoch": 2435} {"train_loss": -12.546651840209961, "global_step": 409085, "epoch": 2435} {"train_loss": -12.652713775634766, "global_step": 409086, "epoch": 2435} {"train_loss": -12.320220947265625, "global_step": 409087, "epoch": 2435} {"train_loss": -11.794099807739258, "global_step": 409088, "epoch": 2435} {"train_loss": -12.536672592163086, "global_step": 409089, "epoch": 2435} {"train_loss": -12.348470687866211, "global_step": 409090, "epoch": 2435} {"train_loss": -12.04793930053711, "global_step": 409091, "epoch": 2435} {"train_loss": -12.49683952331543, "global_step": 409092, "epoch": 2435} {"train_loss": -12.210602760314941, "global_step": 409093, "epoch": 2435} {"train_loss": -12.495734214782715, "global_step": 409094, "epoch": 2435} {"train_loss": -12.495340347290039, "global_step": 409095, "epoch": 2435} {"train_loss": -12.498659133911133, "global_step": 409096, "epoch": 2435} {"train_loss": -12.004522323608398, "global_step": 409097, "epoch": 2435} {"train_loss": -12.36302375793457, "global_step": 409098, "epoch": 2435} {"train_loss": -12.512626647949219, "global_step": 409099, "epoch": 2435} {"train_loss": -12.389497756958008, "global_step": 409100, "epoch": 2435} {"train_loss": -12.593667030334473, "global_step": 409101, "epoch": 2435} {"train_loss": -12.294288635253906, "global_step": 409102, "epoch": 2435} {"train_loss": -12.56650161743164, "global_step": 409103, "epoch": 2435} {"train_loss": -12.569175720214844, "global_step": 409104, "epoch": 2435} {"train_loss": -12.642162322998047, "global_step": 409105, "epoch": 2435} {"train_loss": -12.472026824951172, "global_step": 409106, "epoch": 2435} {"train_loss": -12.302684783935547, "global_step": 409107, "epoch": 2435} {"train_loss": -12.179010391235352, "global_step": 409108, "epoch": 2435} {"train_loss": -12.276334762573242, "global_step": 409109, "epoch": 2435} {"train_loss": -12.535065650939941, "global_step": 409110, "epoch": 2435} {"train_loss": -12.410125732421875, "global_step": 409111, "epoch": 2435} {"train_loss": -12.465187072753906, "global_step": 409112, "epoch": 2435} {"train_loss": -12.081449508666992, "global_step": 409113, "epoch": 2435} {"train_loss": -12.377647399902344, "global_step": 409114, "epoch": 2435} {"train_loss": -10.988882064819336, "global_step": 409115, "epoch": 2435} {"train_loss": -11.2898588180542, "global_step": 409116, "epoch": 2435} {"train_loss": -12.146102905273438, "global_step": 409117, "epoch": 2435} {"train_loss": -11.550504684448242, "global_step": 409118, "epoch": 2435} {"train_loss": -11.559627532958984, "global_step": 409119, "epoch": 2435} {"train_loss": -12.074203491210938, "global_step": 409120, "epoch": 2435} {"train_loss": -10.646101951599121, "global_step": 409121, "epoch": 2435} {"train_loss": -9.864996910095215, "global_step": 409122, "epoch": 2435} {"train_loss": -9.85240364074707, "global_step": 409123, "epoch": 2435} {"train_loss": -7.255234241485596, "global_step": 409124, "epoch": 2435} {"train_loss": -8.144189834594727, "global_step": 409125, "epoch": 2435} {"train_loss": -7.120309352874756, "global_step": 409126, "epoch": 2435} {"train_loss": -7.338603496551514, "global_step": 409127, "epoch": 2435} {"train_loss": -6.938333034515381, "global_step": 409128, "epoch": 2435} {"train_loss": -6.840946674346924, "global_step": 409129, "epoch": 2435} {"train_loss": -6.958090782165527, "global_step": 409130, "epoch": 2435} {"train_loss": -6.345441818237305, "global_step": 409131, "epoch": 2435} {"train_loss": -7.86969518661499, "global_step": 409132, "epoch": 2435} {"train_loss": -7.871029853820801, "global_step": 409133, "epoch": 2435} {"train_loss": -8.424198150634766, "global_step": 409134, "epoch": 2435} {"train_loss": -8.484060287475586, "global_step": 409135, "epoch": 2435} {"train_loss": -8.273758888244629, "global_step": 409136, "epoch": 2435} {"train_loss": -8.198351860046387, "global_step": 409137, "epoch": 2435} {"train_loss": -7.7848992347717285, "global_step": 409138, "epoch": 2435} {"train_loss": -8.351245880126953, "global_step": 409139, "epoch": 2435} {"train_loss": -8.910847663879395, "global_step": 409140, "epoch": 2435} {"train_loss": -9.150960922241211, "global_step": 409141, "epoch": 2435} {"train_loss": -9.372580528259277, "global_step": 409142, "epoch": 2435} {"train_loss": -8.587350845336914, "global_step": 409143, "epoch": 2435} {"train_loss": -8.772628784179688, "global_step": 409144, "epoch": 2435} {"train_loss": -9.03061294555664, "global_step": 409145, "epoch": 2435} {"train_loss": -9.408953666687012, "global_step": 409146, "epoch": 2435} {"train_loss": -9.499565124511719, "global_step": 409147, "epoch": 2435} {"train_loss": -10.032934188842773, "global_step": 409148, "epoch": 2435} {"train_loss": -9.865795135498047, "global_step": 409149, "epoch": 2435} {"train_loss": -10.217899322509766, "global_step": 409150, "epoch": 2435} {"train_loss": -10.029077529907227, "global_step": 409151, "epoch": 2435} {"train_loss": -10.041706085205078, "global_step": 409152, "epoch": 2435} {"train_loss": -10.182923316955566, "global_step": 409153, "epoch": 2435} {"train_loss": -10.710577011108398, "global_step": 409154, "epoch": 2435} {"train_loss": -10.2412109375, "global_step": 409155, "epoch": 2435} {"train_loss": -10.772993087768555, "global_step": 409156, "epoch": 2435} {"train_loss": -10.3367919921875, "global_step": 409157, "epoch": 2435} {"train_loss": -10.292852401733398, "global_step": 409158, "epoch": 2435} {"train_loss": -10.557910919189453, "global_step": 409159, "epoch": 2435} {"train_loss": -10.16296100616455, "global_step": 409160, "epoch": 2435} {"train_loss": -10.528298377990723, "global_step": 409161, "epoch": 2435} {"train_loss": -10.419898986816406, "global_step": 409162, "epoch": 2435} {"train_loss": -11.143401145935059, "global_step": 409163, "epoch": 2435} {"train_loss": -10.95734977722168, "global_step": 409164, "epoch": 2435} {"train_loss": -11.231575012207031, "global_step": 409165, "epoch": 2435} {"train_loss": -11.18828296661377, "global_step": 409166, "epoch": 2435} {"train_loss": -10.732460021972656, "global_step": 409167, "epoch": 2435} {"train_loss": -11.505880355834961, "global_step": 409168, "epoch": 2435} {"train_loss": -11.207623481750488, "global_step": 409169, "epoch": 2435} {"train_loss": -11.279669761657715, "global_step": 409170, "epoch": 2435} {"train_loss": -11.191993713378906, "global_step": 409171, "epoch": 2435} {"train_loss": -11.74209213256836, "global_step": 409172, "epoch": 2435} {"train_loss": -11.456990242004395, "global_step": 409173, "epoch": 2435} {"train_loss": -11.783281326293945, "global_step": 409174, "epoch": 2435} {"train_loss": -11.270609855651855, "global_step": 409175, "epoch": 2435} {"train_loss": -11.683137893676758, "global_step": 409176, "epoch": 2435} {"train_loss": -11.335779190063477, "global_step": 409177, "epoch": 2435} {"train_loss": -11.53443431854248, "global_step": 409178, "epoch": 2435} {"train_loss": -11.319562911987305, "global_step": 409179, "epoch": 2435} {"train_loss": -11.6376953125, "global_step": 409180, "epoch": 2435} {"train_loss": -11.720187187194824, "global_step": 409181, "epoch": 2435} {"train_loss": -11.443760871887207, "global_step": 409182, "epoch": 2435} {"train_loss": -12.011144638061523, "global_step": 409183, "epoch": 2435} {"train_loss": -11.840471267700195, "global_step": 409184, "epoch": 2435} {"train_loss": -11.83088493347168, "global_step": 409185, "epoch": 2435} {"train_loss": -11.759180068969727, "global_step": 409186, "epoch": 2435} {"train_loss": -11.789560317993164, "global_step": 409187, "epoch": 2435} {"train_loss": -12.066848754882812, "global_step": 409188, "epoch": 2435} {"train_loss": -11.881021499633789, "global_step": 409189, "epoch": 2435} {"train_loss": -12.050453186035156, "global_step": 409190, "epoch": 2435} {"train_loss": -11.755024909973145, "global_step": 409191, "epoch": 2435} {"train_loss": -11.787590026855469, "global_step": 409192, "epoch": 2435} {"train_loss": -12.104276657104492, "global_step": 409193, "epoch": 2435} {"train_loss": -12.085465431213379, "global_step": 409194, "epoch": 2435} {"train_loss": -11.98770809173584, "global_step": 409195, "epoch": 2435} {"train_loss": -12.289022445678711, "global_step": 409196, "epoch": 2435} {"train_loss": -11.812637329101562, "global_step": 409197, "epoch": 2435} {"train_loss": -12.186613082885742, "global_step": 409198, "epoch": 2435} {"train_loss": -12.158358573913574, "global_step": 409199, "epoch": 2435} {"train_loss": -11.781867980957031, "global_step": 409200, "epoch": 2435} {"train_loss": -12.074155807495117, "global_step": 409201, "epoch": 2435} {"train_loss": -11.769981384277344, "global_step": 409202, "epoch": 2435} {"train_loss": -11.733631134033203, "global_step": 409203, "epoch": 2435} {"train_loss": -11.991907119750977, "global_step": 409204, "epoch": 2435} {"train_loss": -12.443056106567383, "global_step": 409205, "epoch": 2435} {"train_loss": -11.769067764282227, "global_step": 409206, "epoch": 2435} {"train_loss": -12.491838455200195, "global_step": 409207, "epoch": 2435} {"train_loss": -12.300970077514648, "global_step": 409208, "epoch": 2435} {"train_loss": -12.467214584350586, "global_step": 409209, "epoch": 2435} {"train_loss": -12.422622680664062, "global_step": 409210, "epoch": 2435} {"train_loss": -12.267475128173828, "global_step": 409211, "epoch": 2435} {"train_loss": -12.454265594482422, "global_step": 409212, "epoch": 2435} {"train_loss": -12.205350875854492, "global_step": 409213, "epoch": 2435} {"train_loss": -12.417426109313965, "global_step": 409214, "epoch": 2435} {"train_loss": -12.086387634277344, "global_step": 409215, "epoch": 2435} {"train_loss": -12.483135223388672, "global_step": 409216, "epoch": 2435} {"train_loss": -12.104209899902344, "global_step": 409217, "epoch": 2435} {"train_loss": -12.424960136413574, "global_step": 409218, "epoch": 2435} {"train_loss": -12.404422760009766, "global_step": 409219, "epoch": 2435} {"train_loss": -12.397370338439941, "global_step": 409220, "epoch": 2435} {"train_loss": -12.579811096191406, "global_step": 409221, "epoch": 2435} {"train_loss": -12.535011291503906, "global_step": 409222, "epoch": 2435} {"train_loss": -12.403202056884766, "global_step": 409223, "epoch": 2435} {"train_loss": -12.389969825744629, "global_step": 409224, "epoch": 2435} {"train_loss": -12.482093811035156, "global_step": 409225, "epoch": 2435} {"train_loss": -12.558666229248047, "global_step": 409226, "epoch": 2435} {"train_loss": -12.510702133178711, "global_step": 409227, "epoch": 2435} {"train_loss": -12.435165405273438, "global_step": 409228, "epoch": 2435} {"train_loss": -12.624029159545898, "global_step": 409229, "epoch": 2435} {"train_loss": -12.38336181640625, "global_step": 409230, "epoch": 2435} {"train_loss": -12.711328506469727, "global_step": 409231, "epoch": 2435} {"train_loss": -12.634805679321289, "global_step": 409232, "epoch": 2435} {"train_loss": -12.286142349243164, "global_step": 409233, "epoch": 2435} {"train_loss": -12.46021842956543, "global_step": 409234, "epoch": 2435} {"train_loss": -12.63319206237793, "global_step": 409235, "epoch": 2435} {"train_loss": -12.617995262145996, "global_step": 409236, "epoch": 2435} {"train_loss": -12.789119720458984, "global_step": 409237, "epoch": 2435} {"train_loss": -12.683908462524414, "global_step": 409238, "epoch": 2435} {"train_loss": -12.728988647460938, "global_step": 409239, "epoch": 2435} {"train_loss": -12.6701078414917, "global_step": 409240, "epoch": 2435} {"train_loss": -12.710328102111816, "global_step": 409241, "epoch": 2435} {"train_loss": -12.68460464477539, "global_step": 409242, "epoch": 2435} {"train_loss": -12.807607650756836, "global_step": 409243, "epoch": 2435} {"train_loss": -12.555578231811523, "global_step": 409244, "epoch": 2435} {"train_loss": -12.717241287231445, "global_step": 409245, "epoch": 2435} {"train_loss": -12.834755897521973, "global_step": 409246, "epoch": 2435} {"train_loss": -11.37491523368018, "global_step": 409247, "epoch": 2435, "val_loss": 306816.40625, "train_action_mse_error": 1.7775928974151611} {"train_loss": -12.819404602050781, "global_step": 409248, "epoch": 2436} {"train_loss": -12.738778114318848, "global_step": 409249, "epoch": 2436} {"train_loss": -12.638053894042969, "global_step": 409250, "epoch": 2436} {"train_loss": -12.615087509155273, "global_step": 409251, "epoch": 2436} {"train_loss": -12.757031440734863, "global_step": 409252, "epoch": 2436} {"train_loss": -12.842655181884766, "global_step": 409253, "epoch": 2436} {"train_loss": -12.72894287109375, "global_step": 409254, "epoch": 2436} {"train_loss": -12.347180366516113, "global_step": 409255, "epoch": 2436} {"train_loss": -12.793956756591797, "global_step": 409256, "epoch": 2436} {"train_loss": -11.4437255859375, "global_step": 409257, "epoch": 2436} {"train_loss": -12.034855842590332, "global_step": 409258, "epoch": 2436} {"train_loss": -12.655438423156738, "global_step": 409259, "epoch": 2436} {"train_loss": -11.476317405700684, "global_step": 409260, "epoch": 2436} {"train_loss": -11.585418701171875, "global_step": 409261, "epoch": 2436} {"train_loss": -11.994729995727539, "global_step": 409262, "epoch": 2436} {"train_loss": -11.185205459594727, "global_step": 409263, "epoch": 2436} {"train_loss": -11.451032638549805, "global_step": 409264, "epoch": 2436} {"train_loss": -11.7240629196167, "global_step": 409265, "epoch": 2436} {"train_loss": -11.611124038696289, "global_step": 409266, "epoch": 2436} {"train_loss": -11.676268577575684, "global_step": 409267, "epoch": 2436} {"train_loss": -11.63775634765625, "global_step": 409268, "epoch": 2436} {"train_loss": -11.528984069824219, "global_step": 409269, "epoch": 2436} {"train_loss": -11.717992782592773, "global_step": 409270, "epoch": 2436} {"train_loss": -11.60409927368164, "global_step": 409271, "epoch": 2436} {"train_loss": -12.171980857849121, "global_step": 409272, "epoch": 2436} {"train_loss": -11.103860855102539, "global_step": 409273, "epoch": 2436} {"train_loss": -12.206897735595703, "global_step": 409274, "epoch": 2436} {"train_loss": -11.352566719055176, "global_step": 409275, "epoch": 2436} {"train_loss": -12.137643814086914, "global_step": 409276, "epoch": 2436} {"train_loss": -11.382072448730469, "global_step": 409277, "epoch": 2436} {"train_loss": -12.037763595581055, "global_step": 409278, "epoch": 2436} {"train_loss": -11.312192916870117, "global_step": 409279, "epoch": 2436} {"train_loss": -10.758011817932129, "global_step": 409280, "epoch": 2436} {"train_loss": -11.567750930786133, "global_step": 409281, "epoch": 2436} {"train_loss": -10.33256721496582, "global_step": 409282, "epoch": 2436} {"train_loss": -9.386557579040527, "global_step": 409283, "epoch": 2436} {"train_loss": -10.359121322631836, "global_step": 409284, "epoch": 2436} {"train_loss": -11.239452362060547, "global_step": 409285, "epoch": 2436} {"train_loss": -11.45544147491455, "global_step": 409286, "epoch": 2436} {"train_loss": -11.065153121948242, "global_step": 409287, "epoch": 2436} {"train_loss": -11.368159294128418, "global_step": 409288, "epoch": 2436} {"train_loss": -10.806472778320312, "global_step": 409289, "epoch": 2436} {"train_loss": -11.810107231140137, "global_step": 409290, "epoch": 2436} {"train_loss": -10.345255851745605, "global_step": 409291, "epoch": 2436} {"train_loss": -11.647334098815918, "global_step": 409292, "epoch": 2436} {"train_loss": -11.08854866027832, "global_step": 409293, "epoch": 2436} {"train_loss": -11.382978439331055, "global_step": 409294, "epoch": 2436} {"train_loss": -11.485552787780762, "global_step": 409295, "epoch": 2436} {"train_loss": -10.974311828613281, "global_step": 409296, "epoch": 2436} {"train_loss": -11.477044105529785, "global_step": 409297, "epoch": 2436} {"train_loss": -11.460257530212402, "global_step": 409298, "epoch": 2436} {"train_loss": -12.136103630065918, "global_step": 409299, "epoch": 2436} {"train_loss": -10.669427871704102, "global_step": 409300, "epoch": 2436} {"train_loss": -11.694639205932617, "global_step": 409301, "epoch": 2436} {"train_loss": -10.61784553527832, "global_step": 409302, "epoch": 2436} {"train_loss": -11.346870422363281, "global_step": 409303, "epoch": 2436} {"train_loss": -11.179479598999023, "global_step": 409304, "epoch": 2436} {"train_loss": -10.468164443969727, "global_step": 409305, "epoch": 2436} {"train_loss": -11.930073738098145, "global_step": 409306, "epoch": 2436} {"train_loss": -9.707794189453125, "global_step": 409307, "epoch": 2436} {"train_loss": -9.631336212158203, "global_step": 409308, "epoch": 2436} {"train_loss": -9.86265754699707, "global_step": 409309, "epoch": 2436} {"train_loss": -11.259166717529297, "global_step": 409310, "epoch": 2436} {"train_loss": -10.72788143157959, "global_step": 409311, "epoch": 2436} {"train_loss": -9.430793762207031, "global_step": 409312, "epoch": 2436} {"train_loss": -11.04723072052002, "global_step": 409313, "epoch": 2436} {"train_loss": -11.129037857055664, "global_step": 409314, "epoch": 2436} {"train_loss": -10.551837921142578, "global_step": 409315, "epoch": 2436} {"train_loss": -11.582684516906738, "global_step": 409316, "epoch": 2436} {"train_loss": -11.168509483337402, "global_step": 409317, "epoch": 2436} {"train_loss": -11.570155143737793, "global_step": 409318, "epoch": 2436} {"train_loss": -11.246635437011719, "global_step": 409319, "epoch": 2436} {"train_loss": -11.558177947998047, "global_step": 409320, "epoch": 2436} {"train_loss": -11.714883804321289, "global_step": 409321, "epoch": 2436} {"train_loss": -10.80922794342041, "global_step": 409322, "epoch": 2436} {"train_loss": -11.987507820129395, "global_step": 409323, "epoch": 2436} {"train_loss": -11.30740737915039, "global_step": 409324, "epoch": 2436} {"train_loss": -12.052452087402344, "global_step": 409325, "epoch": 2436} {"train_loss": -11.79065990447998, "global_step": 409326, "epoch": 2436} {"train_loss": -12.08057689666748, "global_step": 409327, "epoch": 2436} {"train_loss": -12.125639915466309, "global_step": 409328, "epoch": 2436} {"train_loss": -11.992076873779297, "global_step": 409329, "epoch": 2436} {"train_loss": -12.249689102172852, "global_step": 409330, "epoch": 2436} {"train_loss": -11.964700698852539, "global_step": 409331, "epoch": 2436} {"train_loss": -12.40814208984375, "global_step": 409332, "epoch": 2436} {"train_loss": -12.303443908691406, "global_step": 409333, "epoch": 2436} {"train_loss": -12.429489135742188, "global_step": 409334, "epoch": 2436} {"train_loss": -12.273042678833008, "global_step": 409335, "epoch": 2436} {"train_loss": -12.090557098388672, "global_step": 409336, "epoch": 2436} {"train_loss": -12.214853286743164, "global_step": 409337, "epoch": 2436} {"train_loss": -12.38790512084961, "global_step": 409338, "epoch": 2436} {"train_loss": -12.217482566833496, "global_step": 409339, "epoch": 2436} {"train_loss": -12.265718460083008, "global_step": 409340, "epoch": 2436} {"train_loss": -12.454967498779297, "global_step": 409341, "epoch": 2436} {"train_loss": -12.37898063659668, "global_step": 409342, "epoch": 2436} {"train_loss": -12.35824203491211, "global_step": 409343, "epoch": 2436} {"train_loss": -12.501643180847168, "global_step": 409344, "epoch": 2436} {"train_loss": -12.194950103759766, "global_step": 409345, "epoch": 2436} {"train_loss": -12.473503112792969, "global_step": 409346, "epoch": 2436} {"train_loss": -12.517852783203125, "global_step": 409347, "epoch": 2436} {"train_loss": -12.402488708496094, "global_step": 409348, "epoch": 2436} {"train_loss": -12.544366836547852, "global_step": 409349, "epoch": 2436} {"train_loss": -12.202401161193848, "global_step": 409350, "epoch": 2436} {"train_loss": -12.642004013061523, "global_step": 409351, "epoch": 2436} {"train_loss": -12.493642807006836, "global_step": 409352, "epoch": 2436} {"train_loss": -12.463375091552734, "global_step": 409353, "epoch": 2436} {"train_loss": -12.557334899902344, "global_step": 409354, "epoch": 2436} {"train_loss": -12.62724494934082, "global_step": 409355, "epoch": 2436} {"train_loss": -12.53429889678955, "global_step": 409356, "epoch": 2436} {"train_loss": -12.624524116516113, "global_step": 409357, "epoch": 2436} {"train_loss": -12.527467727661133, "global_step": 409358, "epoch": 2436} {"train_loss": -12.591009140014648, "global_step": 409359, "epoch": 2436} {"train_loss": -12.542695999145508, "global_step": 409360, "epoch": 2436} {"train_loss": -12.780088424682617, "global_step": 409361, "epoch": 2436} {"train_loss": -12.707475662231445, "global_step": 409362, "epoch": 2436} {"train_loss": -12.708187103271484, "global_step": 409363, "epoch": 2436} {"train_loss": -12.810904502868652, "global_step": 409364, "epoch": 2436} {"train_loss": -12.710908889770508, "global_step": 409365, "epoch": 2436} {"train_loss": -12.828659057617188, "global_step": 409366, "epoch": 2436} {"train_loss": -12.777250289916992, "global_step": 409367, "epoch": 2436} {"train_loss": -12.900121688842773, "global_step": 409368, "epoch": 2436} {"train_loss": -12.868288040161133, "global_step": 409369, "epoch": 2436} {"train_loss": -12.77972412109375, "global_step": 409370, "epoch": 2436} {"train_loss": -12.77949047088623, "global_step": 409371, "epoch": 2436} {"train_loss": -12.883140563964844, "global_step": 409372, "epoch": 2436} {"train_loss": -12.702716827392578, "global_step": 409373, "epoch": 2436} {"train_loss": -12.659444808959961, "global_step": 409374, "epoch": 2436} {"train_loss": -12.894176483154297, "global_step": 409375, "epoch": 2436} {"train_loss": -12.636147499084473, "global_step": 409376, "epoch": 2436} {"train_loss": -12.781842231750488, "global_step": 409377, "epoch": 2436} {"train_loss": -12.792014122009277, "global_step": 409378, "epoch": 2436} {"train_loss": -12.807977676391602, "global_step": 409379, "epoch": 2436} {"train_loss": -12.715850830078125, "global_step": 409380, "epoch": 2436} {"train_loss": -12.868674278259277, "global_step": 409381, "epoch": 2436} {"train_loss": -12.841283798217773, "global_step": 409382, "epoch": 2436} {"train_loss": -12.697365760803223, "global_step": 409383, "epoch": 2436} {"train_loss": -12.87956714630127, "global_step": 409384, "epoch": 2436} {"train_loss": -12.944042205810547, "global_step": 409385, "epoch": 2436} {"train_loss": -12.632850646972656, "global_step": 409386, "epoch": 2436} {"train_loss": -12.889577865600586, "global_step": 409387, "epoch": 2436} {"train_loss": -12.647209167480469, "global_step": 409388, "epoch": 2436} {"train_loss": -12.833854675292969, "global_step": 409389, "epoch": 2436} {"train_loss": -12.595731735229492, "global_step": 409390, "epoch": 2436} {"train_loss": -12.130674362182617, "global_step": 409391, "epoch": 2436} {"train_loss": -12.179293632507324, "global_step": 409392, "epoch": 2436} {"train_loss": -12.849748611450195, "global_step": 409393, "epoch": 2436} {"train_loss": -12.691193580627441, "global_step": 409394, "epoch": 2436} {"train_loss": -12.600563049316406, "global_step": 409395, "epoch": 2436} {"train_loss": -12.607840538024902, "global_step": 409396, "epoch": 2436} {"train_loss": -13.061378479003906, "global_step": 409397, "epoch": 2436} {"train_loss": -12.182415008544922, "global_step": 409398, "epoch": 2436} {"train_loss": -12.650371551513672, "global_step": 409399, "epoch": 2436} {"train_loss": -12.284825325012207, "global_step": 409400, "epoch": 2436} {"train_loss": -12.246261596679688, "global_step": 409401, "epoch": 2436} {"train_loss": -12.410680770874023, "global_step": 409402, "epoch": 2436} {"train_loss": -12.766092300415039, "global_step": 409403, "epoch": 2436} {"train_loss": -12.233829498291016, "global_step": 409404, "epoch": 2436} {"train_loss": -12.549051284790039, "global_step": 409405, "epoch": 2436} {"train_loss": -12.12335205078125, "global_step": 409406, "epoch": 2436} {"train_loss": -12.106815338134766, "global_step": 409407, "epoch": 2436} {"train_loss": -12.563568115234375, "global_step": 409408, "epoch": 2436} {"train_loss": -12.461315155029297, "global_step": 409409, "epoch": 2436} {"train_loss": -12.50461483001709, "global_step": 409410, "epoch": 2436} {"train_loss": -12.148656845092773, "global_step": 409411, "epoch": 2436} {"train_loss": -12.218588829040527, "global_step": 409412, "epoch": 2436} {"train_loss": -11.71129035949707, "global_step": 409413, "epoch": 2436} {"train_loss": -12.596577644348145, "global_step": 409414, "epoch": 2436} {"train_loss": -12.008522487822033, "global_step": 409415, "epoch": 2436, "val_loss": 303156.21875} {"train_loss": -11.924285888671875, "global_step": 409416, "epoch": 2437} {"train_loss": -11.29180908203125, "global_step": 409417, "epoch": 2437} {"train_loss": -12.338570594787598, "global_step": 409418, "epoch": 2437} {"train_loss": -12.195344924926758, "global_step": 409419, "epoch": 2437} {"train_loss": -10.039738655090332, "global_step": 409420, "epoch": 2437} {"train_loss": -11.144624710083008, "global_step": 409421, "epoch": 2437} {"train_loss": -9.775578498840332, "global_step": 409422, "epoch": 2437} {"train_loss": -9.972846984863281, "global_step": 409423, "epoch": 2437} {"train_loss": -10.937387466430664, "global_step": 409424, "epoch": 2437} {"train_loss": -9.585602760314941, "global_step": 409425, "epoch": 2437} {"train_loss": -11.674858093261719, "global_step": 409426, "epoch": 2437} {"train_loss": -9.542311668395996, "global_step": 409427, "epoch": 2437} {"train_loss": -9.608219146728516, "global_step": 409428, "epoch": 2437} {"train_loss": -8.10606575012207, "global_step": 409429, "epoch": 2437} {"train_loss": -8.516700744628906, "global_step": 409430, "epoch": 2437} {"train_loss": -10.347606658935547, "global_step": 409431, "epoch": 2437} {"train_loss": -8.930886268615723, "global_step": 409432, "epoch": 2437} {"train_loss": -9.132882118225098, "global_step": 409433, "epoch": 2437} {"train_loss": -8.435501098632812, "global_step": 409434, "epoch": 2437} {"train_loss": -9.162270545959473, "global_step": 409435, "epoch": 2437} {"train_loss": -9.39029598236084, "global_step": 409436, "epoch": 2437} {"train_loss": -9.544229507446289, "global_step": 409437, "epoch": 2437} {"train_loss": -9.27154541015625, "global_step": 409438, "epoch": 2437} {"train_loss": -9.613094329833984, "global_step": 409439, "epoch": 2437} {"train_loss": -9.469228744506836, "global_step": 409440, "epoch": 2437} {"train_loss": -10.14971923828125, "global_step": 409441, "epoch": 2437} {"train_loss": -10.571788787841797, "global_step": 409442, "epoch": 2437} {"train_loss": -10.137651443481445, "global_step": 409443, "epoch": 2437} {"train_loss": -10.387261390686035, "global_step": 409444, "epoch": 2437} {"train_loss": -9.559709548950195, "global_step": 409445, "epoch": 2437} {"train_loss": -9.485292434692383, "global_step": 409446, "epoch": 2437} {"train_loss": -10.042975425720215, "global_step": 409447, "epoch": 2437} {"train_loss": -10.63045883178711, "global_step": 409448, "epoch": 2437} {"train_loss": -10.213651657104492, "global_step": 409449, "epoch": 2437} {"train_loss": -10.863364219665527, "global_step": 409450, "epoch": 2437} {"train_loss": -10.989104270935059, "global_step": 409451, "epoch": 2437} {"train_loss": -10.807867050170898, "global_step": 409452, "epoch": 2437} {"train_loss": -11.521166801452637, "global_step": 409453, "epoch": 2437} {"train_loss": -11.38111686706543, "global_step": 409454, "epoch": 2437} {"train_loss": -11.619216918945312, "global_step": 409455, "epoch": 2437} {"train_loss": -11.382623672485352, "global_step": 409456, "epoch": 2437} {"train_loss": -11.476444244384766, "global_step": 409457, "epoch": 2437} {"train_loss": -11.362709045410156, "global_step": 409458, "epoch": 2437} {"train_loss": -12.1506986618042, "global_step": 409459, "epoch": 2437} {"train_loss": -11.243250846862793, "global_step": 409460, "epoch": 2437} {"train_loss": -11.64645004272461, "global_step": 409461, "epoch": 2437} {"train_loss": -11.865758895874023, "global_step": 409462, "epoch": 2437} {"train_loss": -11.457643508911133, "global_step": 409463, "epoch": 2437} {"train_loss": -11.627026557922363, "global_step": 409464, "epoch": 2437} {"train_loss": -11.614481925964355, "global_step": 409465, "epoch": 2437} {"train_loss": -11.086929321289062, "global_step": 409466, "epoch": 2437} {"train_loss": -12.011133193969727, "global_step": 409467, "epoch": 2437} {"train_loss": -11.016324043273926, "global_step": 409468, "epoch": 2437} {"train_loss": -11.372537612915039, "global_step": 409469, "epoch": 2437} {"train_loss": -11.776468276977539, "global_step": 409470, "epoch": 2437} {"train_loss": -11.62584114074707, "global_step": 409471, "epoch": 2437} {"train_loss": -11.587101936340332, "global_step": 409472, "epoch": 2437} {"train_loss": -12.005125045776367, "global_step": 409473, "epoch": 2437} {"train_loss": -11.720733642578125, "global_step": 409474, "epoch": 2437} {"train_loss": -11.66112232208252, "global_step": 409475, "epoch": 2437} {"train_loss": -11.927324295043945, "global_step": 409476, "epoch": 2437} {"train_loss": -11.818449020385742, "global_step": 409477, "epoch": 2437} {"train_loss": -12.278139114379883, "global_step": 409478, "epoch": 2437} {"train_loss": -11.67736530303955, "global_step": 409479, "epoch": 2437} {"train_loss": -12.209312438964844, "global_step": 409480, "epoch": 2437} {"train_loss": -11.77908992767334, "global_step": 409481, "epoch": 2437} {"train_loss": -12.01669692993164, "global_step": 409482, "epoch": 2437} {"train_loss": -11.737276077270508, "global_step": 409483, "epoch": 2437} {"train_loss": -11.53724479675293, "global_step": 409484, "epoch": 2437} {"train_loss": -11.766244888305664, "global_step": 409485, "epoch": 2437} {"train_loss": -11.251203536987305, "global_step": 409486, "epoch": 2437} {"train_loss": -12.222366333007812, "global_step": 409487, "epoch": 2437} {"train_loss": -11.579604148864746, "global_step": 409488, "epoch": 2437} {"train_loss": -12.173604965209961, "global_step": 409489, "epoch": 2437} {"train_loss": -12.116964340209961, "global_step": 409490, "epoch": 2437} {"train_loss": -12.182459831237793, "global_step": 409491, "epoch": 2437} {"train_loss": -12.27200698852539, "global_step": 409492, "epoch": 2437} {"train_loss": -12.04174518585205, "global_step": 409493, "epoch": 2437} {"train_loss": -12.203897476196289, "global_step": 409494, "epoch": 2437} {"train_loss": -12.276226043701172, "global_step": 409495, "epoch": 2437} {"train_loss": -12.254572868347168, "global_step": 409496, "epoch": 2437} {"train_loss": -12.185885429382324, "global_step": 409497, "epoch": 2437} {"train_loss": -12.420516014099121, "global_step": 409498, "epoch": 2437} {"train_loss": -12.217708587646484, "global_step": 409499, "epoch": 2437} {"train_loss": -12.394044876098633, "global_step": 409500, "epoch": 2437} {"train_loss": -12.398761749267578, "global_step": 409501, "epoch": 2437} {"train_loss": -12.437420845031738, "global_step": 409502, "epoch": 2437} {"train_loss": -12.547759056091309, "global_step": 409503, "epoch": 2437} {"train_loss": -12.4595308303833, "global_step": 409504, "epoch": 2437} {"train_loss": -12.310335159301758, "global_step": 409505, "epoch": 2437} {"train_loss": -12.230778694152832, "global_step": 409506, "epoch": 2437} {"train_loss": -12.76577377319336, "global_step": 409507, "epoch": 2437} {"train_loss": -12.323406219482422, "global_step": 409508, "epoch": 2437} {"train_loss": -12.577483177185059, "global_step": 409509, "epoch": 2437} {"train_loss": -12.46132755279541, "global_step": 409510, "epoch": 2437} {"train_loss": -12.46628189086914, "global_step": 409511, "epoch": 2437} {"train_loss": -12.410686492919922, "global_step": 409512, "epoch": 2437} {"train_loss": -12.476869583129883, "global_step": 409513, "epoch": 2437} {"train_loss": -12.624671936035156, "global_step": 409514, "epoch": 2437} {"train_loss": -12.560676574707031, "global_step": 409515, "epoch": 2437} {"train_loss": -12.474987030029297, "global_step": 409516, "epoch": 2437} {"train_loss": -12.511058807373047, "global_step": 409517, "epoch": 2437} {"train_loss": -12.569647789001465, "global_step": 409518, "epoch": 2437} {"train_loss": -12.8475923538208, "global_step": 409519, "epoch": 2437} {"train_loss": -12.624909400939941, "global_step": 409520, "epoch": 2437} {"train_loss": -12.54611873626709, "global_step": 409521, "epoch": 2437} {"train_loss": -12.889365196228027, "global_step": 409522, "epoch": 2437} {"train_loss": -12.447953224182129, "global_step": 409523, "epoch": 2437} {"train_loss": -12.528312683105469, "global_step": 409524, "epoch": 2437} {"train_loss": -12.911741256713867, "global_step": 409525, "epoch": 2437} {"train_loss": -12.592172622680664, "global_step": 409526, "epoch": 2437} {"train_loss": -12.717958450317383, "global_step": 409527, "epoch": 2437} {"train_loss": -12.782768249511719, "global_step": 409528, "epoch": 2437} {"train_loss": -12.722493171691895, "global_step": 409529, "epoch": 2437} {"train_loss": -12.661943435668945, "global_step": 409530, "epoch": 2437} {"train_loss": -12.53616714477539, "global_step": 409531, "epoch": 2437} {"train_loss": -12.700411796569824, "global_step": 409532, "epoch": 2437} {"train_loss": -12.745328903198242, "global_step": 409533, "epoch": 2437} {"train_loss": -12.705892562866211, "global_step": 409534, "epoch": 2437} {"train_loss": -12.59933090209961, "global_step": 409535, "epoch": 2437} {"train_loss": -12.823163986206055, "global_step": 409536, "epoch": 2437} {"train_loss": -12.925844192504883, "global_step": 409537, "epoch": 2437} {"train_loss": -12.337589263916016, "global_step": 409538, "epoch": 2437} {"train_loss": -12.879607200622559, "global_step": 409539, "epoch": 2437} {"train_loss": -12.626153945922852, "global_step": 409540, "epoch": 2437} {"train_loss": -12.738851547241211, "global_step": 409541, "epoch": 2437} {"train_loss": -12.83033561706543, "global_step": 409542, "epoch": 2437} {"train_loss": -13.005373001098633, "global_step": 409543, "epoch": 2437} {"train_loss": -12.612587928771973, "global_step": 409544, "epoch": 2437} {"train_loss": -12.842519760131836, "global_step": 409545, "epoch": 2437} {"train_loss": -12.828880310058594, "global_step": 409546, "epoch": 2437} {"train_loss": -12.884930610656738, "global_step": 409547, "epoch": 2437} {"train_loss": -12.577383041381836, "global_step": 409548, "epoch": 2437} {"train_loss": -12.47500991821289, "global_step": 409549, "epoch": 2437} {"train_loss": -12.746358871459961, "global_step": 409550, "epoch": 2437} {"train_loss": -12.847146987915039, "global_step": 409551, "epoch": 2437} {"train_loss": -12.528034210205078, "global_step": 409552, "epoch": 2437} {"train_loss": -12.656702995300293, "global_step": 409553, "epoch": 2437} {"train_loss": -12.803094863891602, "global_step": 409554, "epoch": 2437} {"train_loss": -12.629331588745117, "global_step": 409555, "epoch": 2437} {"train_loss": -12.428915977478027, "global_step": 409556, "epoch": 2437} {"train_loss": -12.57447624206543, "global_step": 409557, "epoch": 2437} {"train_loss": -12.470672607421875, "global_step": 409558, "epoch": 2437} {"train_loss": -12.706380844116211, "global_step": 409559, "epoch": 2437} {"train_loss": -11.89320182800293, "global_step": 409560, "epoch": 2437} {"train_loss": -10.546087265014648, "global_step": 409561, "epoch": 2437} {"train_loss": -10.848400115966797, "global_step": 409562, "epoch": 2437} {"train_loss": -11.277018547058105, "global_step": 409563, "epoch": 2437} {"train_loss": -10.188054084777832, "global_step": 409564, "epoch": 2437} {"train_loss": -11.830306053161621, "global_step": 409565, "epoch": 2437} {"train_loss": -11.255094528198242, "global_step": 409566, "epoch": 2437} {"train_loss": -10.428183555603027, "global_step": 409567, "epoch": 2437} {"train_loss": -12.452783584594727, "global_step": 409568, "epoch": 2437} {"train_loss": -10.656915664672852, "global_step": 409569, "epoch": 2437} {"train_loss": -10.5193452835083, "global_step": 409570, "epoch": 2437} {"train_loss": -10.311786651611328, "global_step": 409571, "epoch": 2437} {"train_loss": -8.8969144821167, "global_step": 409572, "epoch": 2437} {"train_loss": -8.637808799743652, "global_step": 409573, "epoch": 2437} {"train_loss": -7.706085205078125, "global_step": 409574, "epoch": 2437} {"train_loss": -8.338201522827148, "global_step": 409575, "epoch": 2437} {"train_loss": -8.81087875366211, "global_step": 409576, "epoch": 2437} {"train_loss": -8.487566947937012, "global_step": 409577, "epoch": 2437} {"train_loss": -8.499336242675781, "global_step": 409578, "epoch": 2437} {"train_loss": -8.98692512512207, "global_step": 409579, "epoch": 2437} {"train_loss": -9.038717269897461, "global_step": 409580, "epoch": 2437} {"train_loss": -9.534247398376465, "global_step": 409581, "epoch": 2437} {"train_loss": -9.724504470825195, "global_step": 409582, "epoch": 2437} {"train_loss": -11.450737130074273, "global_step": 409583, "epoch": 2437, "val_loss": 303013.1875} {"train_loss": -8.594223022460938, "global_step": 409584, "epoch": 2438} {"train_loss": -8.449239730834961, "global_step": 409585, "epoch": 2438} {"train_loss": -7.6001296043396, "global_step": 409586, "epoch": 2438} {"train_loss": -10.266425132751465, "global_step": 409587, "epoch": 2438} {"train_loss": -9.037723541259766, "global_step": 409588, "epoch": 2438} {"train_loss": -10.202364921569824, "global_step": 409589, "epoch": 2438} {"train_loss": -10.500022888183594, "global_step": 409590, "epoch": 2438} {"train_loss": -9.542764663696289, "global_step": 409591, "epoch": 2438} {"train_loss": -10.346622467041016, "global_step": 409592, "epoch": 2438} {"train_loss": -10.785703659057617, "global_step": 409593, "epoch": 2438} {"train_loss": -9.578872680664062, "global_step": 409594, "epoch": 2438} {"train_loss": -10.560752868652344, "global_step": 409595, "epoch": 2438} {"train_loss": -9.259099960327148, "global_step": 409596, "epoch": 2438} {"train_loss": -8.824199676513672, "global_step": 409597, "epoch": 2438} {"train_loss": -9.469396591186523, "global_step": 409598, "epoch": 2438} {"train_loss": -10.2418851852417, "global_step": 409599, "epoch": 2438} {"train_loss": -11.494613647460938, "global_step": 409600, "epoch": 2438} {"train_loss": -9.770574569702148, "global_step": 409601, "epoch": 2438} {"train_loss": -10.3643159866333, "global_step": 409602, "epoch": 2438} {"train_loss": -10.38407039642334, "global_step": 409603, "epoch": 2438} {"train_loss": -11.073450088500977, "global_step": 409604, "epoch": 2438} {"train_loss": -10.503296852111816, "global_step": 409605, "epoch": 2438} {"train_loss": -10.510977745056152, "global_step": 409606, "epoch": 2438} {"train_loss": -11.309005737304688, "global_step": 409607, "epoch": 2438} {"train_loss": -11.326944351196289, "global_step": 409608, "epoch": 2438} {"train_loss": -10.360113143920898, "global_step": 409609, "epoch": 2438} {"train_loss": -11.076242446899414, "global_step": 409610, "epoch": 2438} {"train_loss": -11.689416885375977, "global_step": 409611, "epoch": 2438} {"train_loss": -11.290122985839844, "global_step": 409612, "epoch": 2438} {"train_loss": -11.746002197265625, "global_step": 409613, "epoch": 2438} {"train_loss": -11.627222061157227, "global_step": 409614, "epoch": 2438} {"train_loss": -11.769537925720215, "global_step": 409615, "epoch": 2438} {"train_loss": -11.651209831237793, "global_step": 409616, "epoch": 2438} {"train_loss": -11.575340270996094, "global_step": 409617, "epoch": 2438} {"train_loss": -12.099180221557617, "global_step": 409618, "epoch": 2438} {"train_loss": -12.1022367477417, "global_step": 409619, "epoch": 2438} {"train_loss": -11.843942642211914, "global_step": 409620, "epoch": 2438} {"train_loss": -12.306753158569336, "global_step": 409621, "epoch": 2438} {"train_loss": -11.953670501708984, "global_step": 409622, "epoch": 2438} {"train_loss": -11.884148597717285, "global_step": 409623, "epoch": 2438} {"train_loss": -12.034198760986328, "global_step": 409624, "epoch": 2438} {"train_loss": -11.817377090454102, "global_step": 409625, "epoch": 2438} {"train_loss": -12.097100257873535, "global_step": 409626, "epoch": 2438} {"train_loss": -12.22354507446289, "global_step": 409627, "epoch": 2438} {"train_loss": -11.949756622314453, "global_step": 409628, "epoch": 2438} {"train_loss": -12.242453575134277, "global_step": 409629, "epoch": 2438} {"train_loss": -12.01767349243164, "global_step": 409630, "epoch": 2438} {"train_loss": -12.345281600952148, "global_step": 409631, "epoch": 2438} {"train_loss": -12.123526573181152, "global_step": 409632, "epoch": 2438} {"train_loss": -11.996174812316895, "global_step": 409633, "epoch": 2438} {"train_loss": -12.074127197265625, "global_step": 409634, "epoch": 2438} {"train_loss": -12.159806251525879, "global_step": 409635, "epoch": 2438} {"train_loss": -12.198921203613281, "global_step": 409636, "epoch": 2438} {"train_loss": -12.377803802490234, "global_step": 409637, "epoch": 2438} {"train_loss": -12.030986785888672, "global_step": 409638, "epoch": 2438} {"train_loss": -12.12635612487793, "global_step": 409639, "epoch": 2438} {"train_loss": -12.024309158325195, "global_step": 409640, "epoch": 2438} {"train_loss": -12.346242904663086, "global_step": 409641, "epoch": 2438} {"train_loss": -11.946540832519531, "global_step": 409642, "epoch": 2438} {"train_loss": -12.388014793395996, "global_step": 409643, "epoch": 2438} {"train_loss": -12.260248184204102, "global_step": 409644, "epoch": 2438} {"train_loss": -12.518491744995117, "global_step": 409645, "epoch": 2438} {"train_loss": -12.451824188232422, "global_step": 409646, "epoch": 2438} {"train_loss": -12.194568634033203, "global_step": 409647, "epoch": 2438} {"train_loss": -12.417006492614746, "global_step": 409648, "epoch": 2438} {"train_loss": -12.425683975219727, "global_step": 409649, "epoch": 2438} {"train_loss": -12.3245267868042, "global_step": 409650, "epoch": 2438} {"train_loss": -12.640549659729004, "global_step": 409651, "epoch": 2438} {"train_loss": -12.45360279083252, "global_step": 409652, "epoch": 2438} {"train_loss": -12.358238220214844, "global_step": 409653, "epoch": 2438} {"train_loss": -12.24993896484375, "global_step": 409654, "epoch": 2438} {"train_loss": -12.466235160827637, "global_step": 409655, "epoch": 2438} {"train_loss": -12.223308563232422, "global_step": 409656, "epoch": 2438} {"train_loss": -12.408967971801758, "global_step": 409657, "epoch": 2438} {"train_loss": -12.278335571289062, "global_step": 409658, "epoch": 2438} {"train_loss": -12.312310218811035, "global_step": 409659, "epoch": 2438} {"train_loss": -12.332296371459961, "global_step": 409660, "epoch": 2438} {"train_loss": -12.249444007873535, "global_step": 409661, "epoch": 2438} {"train_loss": -12.274858474731445, "global_step": 409662, "epoch": 2438} {"train_loss": -12.209005355834961, "global_step": 409663, "epoch": 2438} {"train_loss": -12.401455879211426, "global_step": 409664, "epoch": 2438} {"train_loss": -12.31888198852539, "global_step": 409665, "epoch": 2438} {"train_loss": -12.27094841003418, "global_step": 409666, "epoch": 2438} {"train_loss": -12.114461898803711, "global_step": 409667, "epoch": 2438} {"train_loss": -12.579655647277832, "global_step": 409668, "epoch": 2438} {"train_loss": -11.745309829711914, "global_step": 409669, "epoch": 2438} {"train_loss": -12.410614013671875, "global_step": 409670, "epoch": 2438} {"train_loss": -12.394457817077637, "global_step": 409671, "epoch": 2438} {"train_loss": -12.227644920349121, "global_step": 409672, "epoch": 2438} {"train_loss": -12.174477577209473, "global_step": 409673, "epoch": 2438} {"train_loss": -12.0748872756958, "global_step": 409674, "epoch": 2438} {"train_loss": -12.521160125732422, "global_step": 409675, "epoch": 2438} {"train_loss": -11.783733367919922, "global_step": 409676, "epoch": 2438} {"train_loss": -12.475996017456055, "global_step": 409677, "epoch": 2438} {"train_loss": -12.113981246948242, "global_step": 409678, "epoch": 2438} {"train_loss": -12.482139587402344, "global_step": 409679, "epoch": 2438} {"train_loss": -12.163702011108398, "global_step": 409680, "epoch": 2438} {"train_loss": -11.907081604003906, "global_step": 409681, "epoch": 2438} {"train_loss": -11.2557373046875, "global_step": 409682, "epoch": 2438} {"train_loss": -12.173776626586914, "global_step": 409683, "epoch": 2438} {"train_loss": -11.482287406921387, "global_step": 409684, "epoch": 2438} {"train_loss": -10.913361549377441, "global_step": 409685, "epoch": 2438} {"train_loss": -12.207296371459961, "global_step": 409686, "epoch": 2438} {"train_loss": -11.558856964111328, "global_step": 409687, "epoch": 2438} {"train_loss": -9.584465980529785, "global_step": 409688, "epoch": 2438} {"train_loss": -9.071468353271484, "global_step": 409689, "epoch": 2438} {"train_loss": -9.958328247070312, "global_step": 409690, "epoch": 2438} {"train_loss": -9.128822326660156, "global_step": 409691, "epoch": 2438} {"train_loss": -10.262533187866211, "global_step": 409692, "epoch": 2438} {"train_loss": -10.90761947631836, "global_step": 409693, "epoch": 2438} {"train_loss": -10.848015785217285, "global_step": 409694, "epoch": 2438} {"train_loss": -10.358353614807129, "global_step": 409695, "epoch": 2438} {"train_loss": -11.116416931152344, "global_step": 409696, "epoch": 2438} {"train_loss": -10.833040237426758, "global_step": 409697, "epoch": 2438} {"train_loss": -11.55459213256836, "global_step": 409698, "epoch": 2438} {"train_loss": -11.791849136352539, "global_step": 409699, "epoch": 2438} {"train_loss": -11.60636043548584, "global_step": 409700, "epoch": 2438} {"train_loss": -11.206291198730469, "global_step": 409701, "epoch": 2438} {"train_loss": -11.497455596923828, "global_step": 409702, "epoch": 2438} {"train_loss": -11.896966934204102, "global_step": 409703, "epoch": 2438} {"train_loss": -11.447340965270996, "global_step": 409704, "epoch": 2438} {"train_loss": -12.113268852233887, "global_step": 409705, "epoch": 2438} {"train_loss": -11.330493927001953, "global_step": 409706, "epoch": 2438} {"train_loss": -11.65695571899414, "global_step": 409707, "epoch": 2438} {"train_loss": -11.72575855255127, "global_step": 409708, "epoch": 2438} {"train_loss": -11.765018463134766, "global_step": 409709, "epoch": 2438} {"train_loss": -11.556411743164062, "global_step": 409710, "epoch": 2438} {"train_loss": -12.070405960083008, "global_step": 409711, "epoch": 2438} {"train_loss": -11.807723999023438, "global_step": 409712, "epoch": 2438} {"train_loss": -11.997400283813477, "global_step": 409713, "epoch": 2438} {"train_loss": -11.519020080566406, "global_step": 409714, "epoch": 2438} {"train_loss": -12.076480865478516, "global_step": 409715, "epoch": 2438} {"train_loss": -12.27394962310791, "global_step": 409716, "epoch": 2438} {"train_loss": -12.257301330566406, "global_step": 409717, "epoch": 2438} {"train_loss": -12.215176582336426, "global_step": 409718, "epoch": 2438} {"train_loss": -12.067987442016602, "global_step": 409719, "epoch": 2438} {"train_loss": -12.124360084533691, "global_step": 409720, "epoch": 2438} {"train_loss": -12.367998123168945, "global_step": 409721, "epoch": 2438} {"train_loss": -12.164299011230469, "global_step": 409722, "epoch": 2438} {"train_loss": -12.311392784118652, "global_step": 409723, "epoch": 2438} {"train_loss": -12.432029724121094, "global_step": 409724, "epoch": 2438} {"train_loss": -12.07869815826416, "global_step": 409725, "epoch": 2438} {"train_loss": -12.459214210510254, "global_step": 409726, "epoch": 2438} {"train_loss": -12.183441162109375, "global_step": 409727, "epoch": 2438} {"train_loss": -12.327577590942383, "global_step": 409728, "epoch": 2438} {"train_loss": -12.228759765625, "global_step": 409729, "epoch": 2438} {"train_loss": -12.386870384216309, "global_step": 409730, "epoch": 2438} {"train_loss": -12.482927322387695, "global_step": 409731, "epoch": 2438} {"train_loss": -12.177713394165039, "global_step": 409732, "epoch": 2438} {"train_loss": -12.28492546081543, "global_step": 409733, "epoch": 2438} {"train_loss": -12.163182258605957, "global_step": 409734, "epoch": 2438} {"train_loss": -12.569265365600586, "global_step": 409735, "epoch": 2438} {"train_loss": -12.134744644165039, "global_step": 409736, "epoch": 2438} {"train_loss": -12.181724548339844, "global_step": 409737, "epoch": 2438} {"train_loss": -12.343433380126953, "global_step": 409738, "epoch": 2438} {"train_loss": -12.141298294067383, "global_step": 409739, "epoch": 2438} {"train_loss": -12.348512649536133, "global_step": 409740, "epoch": 2438} {"train_loss": -12.696761131286621, "global_step": 409741, "epoch": 2438} {"train_loss": -12.032968521118164, "global_step": 409742, "epoch": 2438} {"train_loss": -12.587181091308594, "global_step": 409743, "epoch": 2438} {"train_loss": -12.256431579589844, "global_step": 409744, "epoch": 2438} {"train_loss": -12.50368881225586, "global_step": 409745, "epoch": 2438} {"train_loss": -12.366971015930176, "global_step": 409746, "epoch": 2438} {"train_loss": -12.113277435302734, "global_step": 409747, "epoch": 2438} {"train_loss": -12.233999252319336, "global_step": 409748, "epoch": 2438} {"train_loss": -12.322893142700195, "global_step": 409749, "epoch": 2438} {"train_loss": -11.97706413269043, "global_step": 409750, "epoch": 2438} {"train_loss": -11.663163874830518, "global_step": 409751, "epoch": 2438, "val_loss": 301490.34375} {"train_loss": -12.133991241455078, "global_step": 409752, "epoch": 2439} {"train_loss": -12.417245864868164, "global_step": 409753, "epoch": 2439} {"train_loss": -12.245672225952148, "global_step": 409754, "epoch": 2439} {"train_loss": -12.439220428466797, "global_step": 409755, "epoch": 2439} {"train_loss": -12.581809997558594, "global_step": 409756, "epoch": 2439} {"train_loss": -12.257991790771484, "global_step": 409757, "epoch": 2439} {"train_loss": -12.508636474609375, "global_step": 409758, "epoch": 2439} {"train_loss": -12.717580795288086, "global_step": 409759, "epoch": 2439} {"train_loss": -12.492362976074219, "global_step": 409760, "epoch": 2439} {"train_loss": -12.71847915649414, "global_step": 409761, "epoch": 2439} {"train_loss": -12.661662101745605, "global_step": 409762, "epoch": 2439} {"train_loss": -12.296297073364258, "global_step": 409763, "epoch": 2439} {"train_loss": -12.377254486083984, "global_step": 409764, "epoch": 2439} {"train_loss": -12.14560604095459, "global_step": 409765, "epoch": 2439} {"train_loss": -12.040342330932617, "global_step": 409766, "epoch": 2439} {"train_loss": -12.399425506591797, "global_step": 409767, "epoch": 2439} {"train_loss": -12.306512832641602, "global_step": 409768, "epoch": 2439} {"train_loss": -12.217007637023926, "global_step": 409769, "epoch": 2439} {"train_loss": -12.79788875579834, "global_step": 409770, "epoch": 2439} {"train_loss": -12.453010559082031, "global_step": 409771, "epoch": 2439} {"train_loss": -12.528182983398438, "global_step": 409772, "epoch": 2439} {"train_loss": -12.164756774902344, "global_step": 409773, "epoch": 2439} {"train_loss": -12.261131286621094, "global_step": 409774, "epoch": 2439} {"train_loss": -12.290473937988281, "global_step": 409775, "epoch": 2439} {"train_loss": -12.24725341796875, "global_step": 409776, "epoch": 2439} {"train_loss": -10.615201950073242, "global_step": 409777, "epoch": 2439} {"train_loss": -11.929574966430664, "global_step": 409778, "epoch": 2439} {"train_loss": -12.084976196289062, "global_step": 409779, "epoch": 2439} {"train_loss": -10.928796768188477, "global_step": 409780, "epoch": 2439} {"train_loss": -12.391087532043457, "global_step": 409781, "epoch": 2439} {"train_loss": -11.51762580871582, "global_step": 409782, "epoch": 2439} {"train_loss": -11.517401695251465, "global_step": 409783, "epoch": 2439} {"train_loss": -12.204575538635254, "global_step": 409784, "epoch": 2439} {"train_loss": -10.560218811035156, "global_step": 409785, "epoch": 2439} {"train_loss": -11.680685043334961, "global_step": 409786, "epoch": 2439} {"train_loss": -11.251076698303223, "global_step": 409787, "epoch": 2439} {"train_loss": -10.7836332321167, "global_step": 409788, "epoch": 2439} {"train_loss": -11.620323181152344, "global_step": 409789, "epoch": 2439} {"train_loss": -10.525867462158203, "global_step": 409790, "epoch": 2439} {"train_loss": -12.138093948364258, "global_step": 409791, "epoch": 2439} {"train_loss": -10.590392112731934, "global_step": 409792, "epoch": 2439} {"train_loss": -12.265521049499512, "global_step": 409793, "epoch": 2439} {"train_loss": -11.33010482788086, "global_step": 409794, "epoch": 2439} {"train_loss": -11.327736854553223, "global_step": 409795, "epoch": 2439} {"train_loss": -11.949220657348633, "global_step": 409796, "epoch": 2439} {"train_loss": -10.626763343811035, "global_step": 409797, "epoch": 2439} {"train_loss": -11.83213996887207, "global_step": 409798, "epoch": 2439} {"train_loss": -11.064406394958496, "global_step": 409799, "epoch": 2439} {"train_loss": -11.270198822021484, "global_step": 409800, "epoch": 2439} {"train_loss": -11.523079872131348, "global_step": 409801, "epoch": 2439} {"train_loss": -10.492905616760254, "global_step": 409802, "epoch": 2439} {"train_loss": -10.860326766967773, "global_step": 409803, "epoch": 2439} {"train_loss": -10.012510299682617, "global_step": 409804, "epoch": 2439} {"train_loss": -11.474137306213379, "global_step": 409805, "epoch": 2439} {"train_loss": -10.354717254638672, "global_step": 409806, "epoch": 2439} {"train_loss": -10.816801071166992, "global_step": 409807, "epoch": 2439} {"train_loss": -10.234108924865723, "global_step": 409808, "epoch": 2439} {"train_loss": -11.24643611907959, "global_step": 409809, "epoch": 2439} {"train_loss": -9.472455024719238, "global_step": 409810, "epoch": 2439} {"train_loss": -10.868560791015625, "global_step": 409811, "epoch": 2439} {"train_loss": -10.504520416259766, "global_step": 409812, "epoch": 2439} {"train_loss": -10.842992782592773, "global_step": 409813, "epoch": 2439} {"train_loss": -11.322311401367188, "global_step": 409814, "epoch": 2439} {"train_loss": -11.16695785522461, "global_step": 409815, "epoch": 2439} {"train_loss": -11.086874008178711, "global_step": 409816, "epoch": 2439} {"train_loss": -11.70675277709961, "global_step": 409817, "epoch": 2439} {"train_loss": -10.512478828430176, "global_step": 409818, "epoch": 2439} {"train_loss": -11.931053161621094, "global_step": 409819, "epoch": 2439} {"train_loss": -10.763086318969727, "global_step": 409820, "epoch": 2439} {"train_loss": -11.892590522766113, "global_step": 409821, "epoch": 2439} {"train_loss": -10.693864822387695, "global_step": 409822, "epoch": 2439} {"train_loss": -11.931109428405762, "global_step": 409823, "epoch": 2439} {"train_loss": -9.928935050964355, "global_step": 409824, "epoch": 2439} {"train_loss": -12.024576187133789, "global_step": 409825, "epoch": 2439} {"train_loss": -9.941328048706055, "global_step": 409826, "epoch": 2439} {"train_loss": -12.060869216918945, "global_step": 409827, "epoch": 2439} {"train_loss": -10.684637069702148, "global_step": 409828, "epoch": 2439} {"train_loss": -11.83637523651123, "global_step": 409829, "epoch": 2439} {"train_loss": -10.844221115112305, "global_step": 409830, "epoch": 2439} {"train_loss": -11.914558410644531, "global_step": 409831, "epoch": 2439} {"train_loss": -10.964387893676758, "global_step": 409832, "epoch": 2439} {"train_loss": -11.963844299316406, "global_step": 409833, "epoch": 2439} {"train_loss": -11.303424835205078, "global_step": 409834, "epoch": 2439} {"train_loss": -12.127252578735352, "global_step": 409835, "epoch": 2439} {"train_loss": -11.632061004638672, "global_step": 409836, "epoch": 2439} {"train_loss": -11.853687286376953, "global_step": 409837, "epoch": 2439} {"train_loss": -11.92898941040039, "global_step": 409838, "epoch": 2439} {"train_loss": -11.900690078735352, "global_step": 409839, "epoch": 2439} {"train_loss": -11.803829193115234, "global_step": 409840, "epoch": 2439} {"train_loss": -11.846956253051758, "global_step": 409841, "epoch": 2439} {"train_loss": -11.869972229003906, "global_step": 409842, "epoch": 2439} {"train_loss": -12.160157203674316, "global_step": 409843, "epoch": 2439} {"train_loss": -11.66904354095459, "global_step": 409844, "epoch": 2439} {"train_loss": -11.99161148071289, "global_step": 409845, "epoch": 2439} {"train_loss": -11.889885902404785, "global_step": 409846, "epoch": 2439} {"train_loss": -12.060782432556152, "global_step": 409847, "epoch": 2439} {"train_loss": -11.986748695373535, "global_step": 409848, "epoch": 2439} {"train_loss": -12.3466215133667, "global_step": 409849, "epoch": 2439} {"train_loss": -11.9197998046875, "global_step": 409850, "epoch": 2439} {"train_loss": -12.270143508911133, "global_step": 409851, "epoch": 2439} {"train_loss": -12.092360496520996, "global_step": 409852, "epoch": 2439} {"train_loss": -12.227418899536133, "global_step": 409853, "epoch": 2439} {"train_loss": -12.020483016967773, "global_step": 409854, "epoch": 2439} {"train_loss": -11.94967269897461, "global_step": 409855, "epoch": 2439} {"train_loss": -12.340974807739258, "global_step": 409856, "epoch": 2439} {"train_loss": -12.285360336303711, "global_step": 409857, "epoch": 2439} {"train_loss": -12.559478759765625, "global_step": 409858, "epoch": 2439} {"train_loss": -12.309442520141602, "global_step": 409859, "epoch": 2439} {"train_loss": -12.344474792480469, "global_step": 409860, "epoch": 2439} {"train_loss": -12.37893295288086, "global_step": 409861, "epoch": 2439} {"train_loss": -12.288537979125977, "global_step": 409862, "epoch": 2439} {"train_loss": -12.138166427612305, "global_step": 409863, "epoch": 2439} {"train_loss": -12.414459228515625, "global_step": 409864, "epoch": 2439} {"train_loss": -12.376134872436523, "global_step": 409865, "epoch": 2439} {"train_loss": -12.410446166992188, "global_step": 409866, "epoch": 2439} {"train_loss": -12.515182495117188, "global_step": 409867, "epoch": 2439} {"train_loss": -12.477279663085938, "global_step": 409868, "epoch": 2439} {"train_loss": -12.21104621887207, "global_step": 409869, "epoch": 2439} {"train_loss": -12.636951446533203, "global_step": 409870, "epoch": 2439} {"train_loss": -12.483390808105469, "global_step": 409871, "epoch": 2439} {"train_loss": -12.542719841003418, "global_step": 409872, "epoch": 2439} {"train_loss": -12.221410751342773, "global_step": 409873, "epoch": 2439} {"train_loss": -12.459774017333984, "global_step": 409874, "epoch": 2439} {"train_loss": -12.344392776489258, "global_step": 409875, "epoch": 2439} {"train_loss": -12.380025863647461, "global_step": 409876, "epoch": 2439} {"train_loss": -12.439282417297363, "global_step": 409877, "epoch": 2439} {"train_loss": -12.505473136901855, "global_step": 409878, "epoch": 2439} {"train_loss": -12.576213836669922, "global_step": 409879, "epoch": 2439} {"train_loss": -12.106887817382812, "global_step": 409880, "epoch": 2439} {"train_loss": -12.411409378051758, "global_step": 409881, "epoch": 2439} {"train_loss": -12.242059707641602, "global_step": 409882, "epoch": 2439} {"train_loss": -12.35028076171875, "global_step": 409883, "epoch": 2439} {"train_loss": -12.03066635131836, "global_step": 409884, "epoch": 2439} {"train_loss": -11.787896156311035, "global_step": 409885, "epoch": 2439} {"train_loss": -12.065555572509766, "global_step": 409886, "epoch": 2439} {"train_loss": -11.587944030761719, "global_step": 409887, "epoch": 2439} {"train_loss": -12.323480606079102, "global_step": 409888, "epoch": 2439} {"train_loss": -11.60866928100586, "global_step": 409889, "epoch": 2439} {"train_loss": -12.516653060913086, "global_step": 409890, "epoch": 2439} {"train_loss": -11.44000244140625, "global_step": 409891, "epoch": 2439} {"train_loss": -12.279112815856934, "global_step": 409892, "epoch": 2439} {"train_loss": -11.665170669555664, "global_step": 409893, "epoch": 2439} {"train_loss": -11.730849266052246, "global_step": 409894, "epoch": 2439} {"train_loss": -11.832448959350586, "global_step": 409895, "epoch": 2439} {"train_loss": -11.534265518188477, "global_step": 409896, "epoch": 2439} {"train_loss": -11.764625549316406, "global_step": 409897, "epoch": 2439} {"train_loss": -11.609301567077637, "global_step": 409898, "epoch": 2439} {"train_loss": -12.469502449035645, "global_step": 409899, "epoch": 2439} {"train_loss": -11.65683364868164, "global_step": 409900, "epoch": 2439} {"train_loss": -12.30197525024414, "global_step": 409901, "epoch": 2439} {"train_loss": -12.105217933654785, "global_step": 409902, "epoch": 2439} {"train_loss": -12.37216567993164, "global_step": 409903, "epoch": 2439} {"train_loss": -12.654522895812988, "global_step": 409904, "epoch": 2439} {"train_loss": -11.776908874511719, "global_step": 409905, "epoch": 2439} {"train_loss": -12.478357315063477, "global_step": 409906, "epoch": 2439} {"train_loss": -12.266350746154785, "global_step": 409907, "epoch": 2439} {"train_loss": -12.805408477783203, "global_step": 409908, "epoch": 2439} {"train_loss": -12.008430480957031, "global_step": 409909, "epoch": 2439} {"train_loss": -12.650932312011719, "global_step": 409910, "epoch": 2439} {"train_loss": -12.198617935180664, "global_step": 409911, "epoch": 2439} {"train_loss": -12.514062881469727, "global_step": 409912, "epoch": 2439} {"train_loss": -12.411286354064941, "global_step": 409913, "epoch": 2439} {"train_loss": -12.305414199829102, "global_step": 409914, "epoch": 2439} {"train_loss": -12.414274215698242, "global_step": 409915, "epoch": 2439} {"train_loss": -12.242515563964844, "global_step": 409916, "epoch": 2439} {"train_loss": -12.373627662658691, "global_step": 409917, "epoch": 2439} {"train_loss": -12.394797325134277, "global_step": 409918, "epoch": 2439} {"train_loss": -11.865316351254782, "global_step": 409919, "epoch": 2439, "val_loss": 302795.46875} {"train_loss": -12.498016357421875, "global_step": 409920, "epoch": 2440} {"train_loss": -12.229146003723145, "global_step": 409921, "epoch": 2440} {"train_loss": -12.202325820922852, "global_step": 409922, "epoch": 2440} {"train_loss": -12.541240692138672, "global_step": 409923, "epoch": 2440} {"train_loss": -12.295735359191895, "global_step": 409924, "epoch": 2440} {"train_loss": -12.608797073364258, "global_step": 409925, "epoch": 2440} {"train_loss": -12.666419982910156, "global_step": 409926, "epoch": 2440} {"train_loss": -12.495874404907227, "global_step": 409927, "epoch": 2440} {"train_loss": -12.431299209594727, "global_step": 409928, "epoch": 2440} {"train_loss": -12.583340644836426, "global_step": 409929, "epoch": 2440} {"train_loss": -12.636137008666992, "global_step": 409930, "epoch": 2440} {"train_loss": -12.48564624786377, "global_step": 409931, "epoch": 2440} {"train_loss": -12.440266609191895, "global_step": 409932, "epoch": 2440} {"train_loss": -12.51214599609375, "global_step": 409933, "epoch": 2440} {"train_loss": -12.37653636932373, "global_step": 409934, "epoch": 2440} {"train_loss": -12.642274856567383, "global_step": 409935, "epoch": 2440} {"train_loss": -12.487324714660645, "global_step": 409936, "epoch": 2440} {"train_loss": -12.1898832321167, "global_step": 409937, "epoch": 2440} {"train_loss": -12.750450134277344, "global_step": 409938, "epoch": 2440} {"train_loss": -12.488821029663086, "global_step": 409939, "epoch": 2440} {"train_loss": -12.514286041259766, "global_step": 409940, "epoch": 2440} {"train_loss": -12.375727653503418, "global_step": 409941, "epoch": 2440} {"train_loss": -12.7189359664917, "global_step": 409942, "epoch": 2440} {"train_loss": -12.661775588989258, "global_step": 409943, "epoch": 2440} {"train_loss": -12.315549850463867, "global_step": 409944, "epoch": 2440} {"train_loss": -12.223832130432129, "global_step": 409945, "epoch": 2440} {"train_loss": -12.325727462768555, "global_step": 409946, "epoch": 2440} {"train_loss": -12.463016510009766, "global_step": 409947, "epoch": 2440} {"train_loss": -11.138069152832031, "global_step": 409948, "epoch": 2440} {"train_loss": -12.207376480102539, "global_step": 409949, "epoch": 2440} {"train_loss": -11.922931671142578, "global_step": 409950, "epoch": 2440} {"train_loss": -12.39986515045166, "global_step": 409951, "epoch": 2440} {"train_loss": -11.311875343322754, "global_step": 409952, "epoch": 2440} {"train_loss": -12.30019760131836, "global_step": 409953, "epoch": 2440} {"train_loss": -12.717328071594238, "global_step": 409954, "epoch": 2440} {"train_loss": -11.783008575439453, "global_step": 409955, "epoch": 2440} {"train_loss": -11.550056457519531, "global_step": 409956, "epoch": 2440} {"train_loss": -12.21480655670166, "global_step": 409957, "epoch": 2440} {"train_loss": -12.177315711975098, "global_step": 409958, "epoch": 2440} {"train_loss": -11.38145637512207, "global_step": 409959, "epoch": 2440} {"train_loss": -11.377985954284668, "global_step": 409960, "epoch": 2440} {"train_loss": -12.73265552520752, "global_step": 409961, "epoch": 2440} {"train_loss": -11.731710433959961, "global_step": 409962, "epoch": 2440} {"train_loss": -11.625701904296875, "global_step": 409963, "epoch": 2440} {"train_loss": -12.264130592346191, "global_step": 409964, "epoch": 2440} {"train_loss": -12.187049865722656, "global_step": 409965, "epoch": 2440} {"train_loss": -12.084771156311035, "global_step": 409966, "epoch": 2440} {"train_loss": -12.52208137512207, "global_step": 409967, "epoch": 2440} {"train_loss": -11.859417915344238, "global_step": 409968, "epoch": 2440} {"train_loss": -11.468364715576172, "global_step": 409969, "epoch": 2440} {"train_loss": -12.457864761352539, "global_step": 409970, "epoch": 2440} {"train_loss": -12.627975463867188, "global_step": 409971, "epoch": 2440} {"train_loss": -12.081766128540039, "global_step": 409972, "epoch": 2440} {"train_loss": -11.964897155761719, "global_step": 409973, "epoch": 2440} {"train_loss": -12.268348693847656, "global_step": 409974, "epoch": 2440} {"train_loss": -12.10959243774414, "global_step": 409975, "epoch": 2440} {"train_loss": -12.323067665100098, "global_step": 409976, "epoch": 2440} {"train_loss": -12.503013610839844, "global_step": 409977, "epoch": 2440} {"train_loss": -11.922073364257812, "global_step": 409978, "epoch": 2440} {"train_loss": -11.923210144042969, "global_step": 409979, "epoch": 2440} {"train_loss": -11.761116027832031, "global_step": 409980, "epoch": 2440} {"train_loss": -10.274877548217773, "global_step": 409981, "epoch": 2440} {"train_loss": -10.913198471069336, "global_step": 409982, "epoch": 2440} {"train_loss": -11.231588363647461, "global_step": 409983, "epoch": 2440} {"train_loss": -10.952301979064941, "global_step": 409984, "epoch": 2440} {"train_loss": -10.091547966003418, "global_step": 409985, "epoch": 2440} {"train_loss": -11.412074089050293, "global_step": 409986, "epoch": 2440} {"train_loss": -10.596231460571289, "global_step": 409987, "epoch": 2440} {"train_loss": -11.33107852935791, "global_step": 409988, "epoch": 2440} {"train_loss": -10.225990295410156, "global_step": 409989, "epoch": 2440} {"train_loss": -12.073055267333984, "global_step": 409990, "epoch": 2440} {"train_loss": -9.973551750183105, "global_step": 409991, "epoch": 2440} {"train_loss": -11.307388305664062, "global_step": 409992, "epoch": 2440} {"train_loss": -11.596369743347168, "global_step": 409993, "epoch": 2440} {"train_loss": -11.785070419311523, "global_step": 409994, "epoch": 2440} {"train_loss": -12.229286193847656, "global_step": 409995, "epoch": 2440} {"train_loss": -11.764802932739258, "global_step": 409996, "epoch": 2440} {"train_loss": -12.182733535766602, "global_step": 409997, "epoch": 2440} {"train_loss": -12.128299713134766, "global_step": 409998, "epoch": 2440} {"train_loss": -11.942956924438477, "global_step": 409999, "epoch": 2440} {"train_loss": -12.3250732421875, "global_step": 410000, "epoch": 2440} {"train_loss": -11.982169151306152, "global_step": 410001, "epoch": 2440} {"train_loss": -12.312837600708008, "global_step": 410002, "epoch": 2440} {"train_loss": -12.001564025878906, "global_step": 410003, "epoch": 2440} {"train_loss": -12.287848472595215, "global_step": 410004, "epoch": 2440} {"train_loss": -11.96253776550293, "global_step": 410005, "epoch": 2440} {"train_loss": -11.802602767944336, "global_step": 410006, "epoch": 2440} {"train_loss": -12.063624382019043, "global_step": 410007, "epoch": 2440} {"train_loss": -11.857946395874023, "global_step": 410008, "epoch": 2440} {"train_loss": -12.38538932800293, "global_step": 410009, "epoch": 2440} {"train_loss": -12.128535270690918, "global_step": 410010, "epoch": 2440} {"train_loss": -12.136934280395508, "global_step": 410011, "epoch": 2440} {"train_loss": -12.013591766357422, "global_step": 410012, "epoch": 2440} {"train_loss": -12.41405200958252, "global_step": 410013, "epoch": 2440} {"train_loss": -11.734663009643555, "global_step": 410014, "epoch": 2440} {"train_loss": -11.947577476501465, "global_step": 410015, "epoch": 2440} {"train_loss": -11.879438400268555, "global_step": 410016, "epoch": 2440} {"train_loss": -11.709732055664062, "global_step": 410017, "epoch": 2440} {"train_loss": -12.281648635864258, "global_step": 410018, "epoch": 2440} {"train_loss": -12.126745223999023, "global_step": 410019, "epoch": 2440} {"train_loss": -11.979512214660645, "global_step": 410020, "epoch": 2440} {"train_loss": -11.587060928344727, "global_step": 410021, "epoch": 2440} {"train_loss": -12.150651931762695, "global_step": 410022, "epoch": 2440} {"train_loss": -12.024659156799316, "global_step": 410023, "epoch": 2440} {"train_loss": -12.172740936279297, "global_step": 410024, "epoch": 2440} {"train_loss": -12.576253890991211, "global_step": 410025, "epoch": 2440} {"train_loss": -12.433602333068848, "global_step": 410026, "epoch": 2440} {"train_loss": -12.336030960083008, "global_step": 410027, "epoch": 2440} {"train_loss": -12.62615966796875, "global_step": 410028, "epoch": 2440} {"train_loss": -12.518503189086914, "global_step": 410029, "epoch": 2440} {"train_loss": -12.584785461425781, "global_step": 410030, "epoch": 2440} {"train_loss": -12.50544548034668, "global_step": 410031, "epoch": 2440} {"train_loss": -12.444305419921875, "global_step": 410032, "epoch": 2440} {"train_loss": -12.158821105957031, "global_step": 410033, "epoch": 2440} {"train_loss": -12.445623397827148, "global_step": 410034, "epoch": 2440} {"train_loss": -12.299331665039062, "global_step": 410035, "epoch": 2440} {"train_loss": -12.29440689086914, "global_step": 410036, "epoch": 2440} {"train_loss": -12.50052261352539, "global_step": 410037, "epoch": 2440} {"train_loss": -12.00584602355957, "global_step": 410038, "epoch": 2440} {"train_loss": -12.32357406616211, "global_step": 410039, "epoch": 2440} {"train_loss": -12.270988464355469, "global_step": 410040, "epoch": 2440} {"train_loss": -12.03952407836914, "global_step": 410041, "epoch": 2440} {"train_loss": -12.21989631652832, "global_step": 410042, "epoch": 2440} {"train_loss": -12.574101448059082, "global_step": 410043, "epoch": 2440} {"train_loss": -12.055974006652832, "global_step": 410044, "epoch": 2440} {"train_loss": -12.247234344482422, "global_step": 410045, "epoch": 2440} {"train_loss": -12.389357566833496, "global_step": 410046, "epoch": 2440} {"train_loss": -12.493561744689941, "global_step": 410047, "epoch": 2440} {"train_loss": -12.489625930786133, "global_step": 410048, "epoch": 2440} {"train_loss": -12.411312103271484, "global_step": 410049, "epoch": 2440} {"train_loss": -12.474482536315918, "global_step": 410050, "epoch": 2440} {"train_loss": -12.345327377319336, "global_step": 410051, "epoch": 2440} {"train_loss": -12.686595916748047, "global_step": 410052, "epoch": 2440} {"train_loss": -12.045122146606445, "global_step": 410053, "epoch": 2440} {"train_loss": -12.206710815429688, "global_step": 410054, "epoch": 2440} {"train_loss": -12.500033378601074, "global_step": 410055, "epoch": 2440} {"train_loss": -12.2001371383667, "global_step": 410056, "epoch": 2440} {"train_loss": -12.425846099853516, "global_step": 410057, "epoch": 2440} {"train_loss": -12.4681978225708, "global_step": 410058, "epoch": 2440} {"train_loss": -11.65878677368164, "global_step": 410059, "epoch": 2440} {"train_loss": -12.40157699584961, "global_step": 410060, "epoch": 2440} {"train_loss": -12.355962753295898, "global_step": 410061, "epoch": 2440} {"train_loss": -12.081517219543457, "global_step": 410062, "epoch": 2440} {"train_loss": -12.513970375061035, "global_step": 410063, "epoch": 2440} {"train_loss": -12.523359298706055, "global_step": 410064, "epoch": 2440} {"train_loss": -12.234294891357422, "global_step": 410065, "epoch": 2440} {"train_loss": -12.007429122924805, "global_step": 410066, "epoch": 2440} {"train_loss": -12.72079849243164, "global_step": 410067, "epoch": 2440} {"train_loss": -12.339994430541992, "global_step": 410068, "epoch": 2440} {"train_loss": -12.639640808105469, "global_step": 410069, "epoch": 2440} {"train_loss": -12.156105995178223, "global_step": 410070, "epoch": 2440} {"train_loss": -12.271677017211914, "global_step": 410071, "epoch": 2440} {"train_loss": -12.44906234741211, "global_step": 410072, "epoch": 2440} {"train_loss": -12.434730529785156, "global_step": 410073, "epoch": 2440} {"train_loss": -11.697759628295898, "global_step": 410074, "epoch": 2440} {"train_loss": -12.376598358154297, "global_step": 410075, "epoch": 2440} {"train_loss": -12.185660362243652, "global_step": 410076, "epoch": 2440} {"train_loss": -11.923416137695312, "global_step": 410077, "epoch": 2440} {"train_loss": -12.173843383789062, "global_step": 410078, "epoch": 2440} {"train_loss": -12.383630752563477, "global_step": 410079, "epoch": 2440} {"train_loss": -12.395271301269531, "global_step": 410080, "epoch": 2440} {"train_loss": -12.745656967163086, "global_step": 410081, "epoch": 2440} {"train_loss": -12.280610084533691, "global_step": 410082, "epoch": 2440} {"train_loss": -12.606800079345703, "global_step": 410083, "epoch": 2440} {"train_loss": -12.093116760253906, "global_step": 410084, "epoch": 2440} {"train_loss": -12.595704078674316, "global_step": 410085, "epoch": 2440} {"train_loss": -12.459025382995605, "global_step": 410086, "epoch": 2440} {"train_loss": -12.135719719387236, "global_step": 410087, "epoch": 2440, "val_loss": 304328.625, "train_action_mse_error": 0.16264109313488007} {"train_loss": -12.184501647949219, "global_step": 410088, "epoch": 2441} {"train_loss": -12.426881790161133, "global_step": 410089, "epoch": 2441} {"train_loss": -12.657979965209961, "global_step": 410090, "epoch": 2441} {"train_loss": -12.185696601867676, "global_step": 410091, "epoch": 2441} {"train_loss": -12.680215835571289, "global_step": 410092, "epoch": 2441} {"train_loss": -12.207174301147461, "global_step": 410093, "epoch": 2441} {"train_loss": -12.326547622680664, "global_step": 410094, "epoch": 2441} {"train_loss": -12.025531768798828, "global_step": 410095, "epoch": 2441} {"train_loss": -12.340420722961426, "global_step": 410096, "epoch": 2441} {"train_loss": -12.072624206542969, "global_step": 410097, "epoch": 2441} {"train_loss": -12.686477661132812, "global_step": 410098, "epoch": 2441} {"train_loss": -12.16451644897461, "global_step": 410099, "epoch": 2441} {"train_loss": -12.070175170898438, "global_step": 410100, "epoch": 2441} {"train_loss": -12.485992431640625, "global_step": 410101, "epoch": 2441} {"train_loss": -12.694269180297852, "global_step": 410102, "epoch": 2441} {"train_loss": -12.164027214050293, "global_step": 410103, "epoch": 2441} {"train_loss": -11.669382095336914, "global_step": 410104, "epoch": 2441} {"train_loss": -11.914115905761719, "global_step": 410105, "epoch": 2441} {"train_loss": -12.238102912902832, "global_step": 410106, "epoch": 2441} {"train_loss": -11.376657485961914, "global_step": 410107, "epoch": 2441} {"train_loss": -11.214163780212402, "global_step": 410108, "epoch": 2441} {"train_loss": -11.903653144836426, "global_step": 410109, "epoch": 2441} {"train_loss": -10.744004249572754, "global_step": 410110, "epoch": 2441} {"train_loss": -11.015695571899414, "global_step": 410111, "epoch": 2441} {"train_loss": -11.605145454406738, "global_step": 410112, "epoch": 2441} {"train_loss": -11.533283233642578, "global_step": 410113, "epoch": 2441} {"train_loss": -11.231181144714355, "global_step": 410114, "epoch": 2441} {"train_loss": -11.69685173034668, "global_step": 410115, "epoch": 2441} {"train_loss": -11.64494514465332, "global_step": 410116, "epoch": 2441} {"train_loss": -11.444639205932617, "global_step": 410117, "epoch": 2441} {"train_loss": -11.300741195678711, "global_step": 410118, "epoch": 2441} {"train_loss": -12.349358558654785, "global_step": 410119, "epoch": 2441} {"train_loss": -11.263115882873535, "global_step": 410120, "epoch": 2441} {"train_loss": -11.395484924316406, "global_step": 410121, "epoch": 2441} {"train_loss": -12.045987129211426, "global_step": 410122, "epoch": 2441} {"train_loss": -10.763471603393555, "global_step": 410123, "epoch": 2441} {"train_loss": -12.172141075134277, "global_step": 410124, "epoch": 2441} {"train_loss": -11.237409591674805, "global_step": 410125, "epoch": 2441} {"train_loss": -11.847136497497559, "global_step": 410126, "epoch": 2441} {"train_loss": -11.665046691894531, "global_step": 410127, "epoch": 2441} {"train_loss": -12.216070175170898, "global_step": 410128, "epoch": 2441} {"train_loss": -11.471789360046387, "global_step": 410129, "epoch": 2441} {"train_loss": -12.06678581237793, "global_step": 410130, "epoch": 2441} {"train_loss": -11.747426986694336, "global_step": 410131, "epoch": 2441} {"train_loss": -11.830278396606445, "global_step": 410132, "epoch": 2441} {"train_loss": -11.470460891723633, "global_step": 410133, "epoch": 2441} {"train_loss": -11.898195266723633, "global_step": 410134, "epoch": 2441} {"train_loss": -11.581544876098633, "global_step": 410135, "epoch": 2441} {"train_loss": -11.064776420593262, "global_step": 410136, "epoch": 2441} {"train_loss": -11.309226989746094, "global_step": 410137, "epoch": 2441} {"train_loss": -11.278066635131836, "global_step": 410138, "epoch": 2441} {"train_loss": -11.651167869567871, "global_step": 410139, "epoch": 2441} {"train_loss": -11.661123275756836, "global_step": 410140, "epoch": 2441} {"train_loss": -12.019551277160645, "global_step": 410141, "epoch": 2441} {"train_loss": -10.336806297302246, "global_step": 410142, "epoch": 2441} {"train_loss": -11.648405075073242, "global_step": 410143, "epoch": 2441} {"train_loss": -10.216058731079102, "global_step": 410144, "epoch": 2441} {"train_loss": -11.911102294921875, "global_step": 410145, "epoch": 2441} {"train_loss": -10.692707061767578, "global_step": 410146, "epoch": 2441} {"train_loss": -11.070205688476562, "global_step": 410147, "epoch": 2441} {"train_loss": -11.461270332336426, "global_step": 410148, "epoch": 2441} {"train_loss": -11.159531593322754, "global_step": 410149, "epoch": 2441} {"train_loss": -10.817590713500977, "global_step": 410150, "epoch": 2441} {"train_loss": -11.127237319946289, "global_step": 410151, "epoch": 2441} {"train_loss": -11.61831283569336, "global_step": 410152, "epoch": 2441} {"train_loss": -11.069100379943848, "global_step": 410153, "epoch": 2441} {"train_loss": -12.172136306762695, "global_step": 410154, "epoch": 2441} {"train_loss": -11.976625442504883, "global_step": 410155, "epoch": 2441} {"train_loss": -11.578410148620605, "global_step": 410156, "epoch": 2441} {"train_loss": -12.170883178710938, "global_step": 410157, "epoch": 2441} {"train_loss": -11.93815803527832, "global_step": 410158, "epoch": 2441} {"train_loss": -12.35325813293457, "global_step": 410159, "epoch": 2441} {"train_loss": -12.116562843322754, "global_step": 410160, "epoch": 2441} {"train_loss": -12.137801170349121, "global_step": 410161, "epoch": 2441} {"train_loss": -12.402501106262207, "global_step": 410162, "epoch": 2441} {"train_loss": -12.255176544189453, "global_step": 410163, "epoch": 2441} {"train_loss": -12.450411796569824, "global_step": 410164, "epoch": 2441} {"train_loss": -12.284619331359863, "global_step": 410165, "epoch": 2441} {"train_loss": -12.280250549316406, "global_step": 410166, "epoch": 2441} {"train_loss": -12.411603927612305, "global_step": 410167, "epoch": 2441} {"train_loss": -12.113614082336426, "global_step": 410168, "epoch": 2441} {"train_loss": -12.304813385009766, "global_step": 410169, "epoch": 2441} {"train_loss": -12.211845397949219, "global_step": 410170, "epoch": 2441} {"train_loss": -12.512280464172363, "global_step": 410171, "epoch": 2441} {"train_loss": -12.38663387298584, "global_step": 410172, "epoch": 2441} {"train_loss": -12.323028564453125, "global_step": 410173, "epoch": 2441} {"train_loss": -12.627225875854492, "global_step": 410174, "epoch": 2441} {"train_loss": -12.419910430908203, "global_step": 410175, "epoch": 2441} {"train_loss": -12.396313667297363, "global_step": 410176, "epoch": 2441} {"train_loss": -12.409812927246094, "global_step": 410177, "epoch": 2441} {"train_loss": -12.221981048583984, "global_step": 410178, "epoch": 2441} {"train_loss": -11.90818977355957, "global_step": 410179, "epoch": 2441} {"train_loss": -12.43362808227539, "global_step": 410180, "epoch": 2441} {"train_loss": -11.841557502746582, "global_step": 410181, "epoch": 2441} {"train_loss": -12.32322883605957, "global_step": 410182, "epoch": 2441} {"train_loss": -11.908379554748535, "global_step": 410183, "epoch": 2441} {"train_loss": -12.379380226135254, "global_step": 410184, "epoch": 2441} {"train_loss": -12.019649505615234, "global_step": 410185, "epoch": 2441} {"train_loss": -12.427345275878906, "global_step": 410186, "epoch": 2441} {"train_loss": -11.941034317016602, "global_step": 410187, "epoch": 2441} {"train_loss": -11.993621826171875, "global_step": 410188, "epoch": 2441} {"train_loss": -12.164953231811523, "global_step": 410189, "epoch": 2441} {"train_loss": -12.454139709472656, "global_step": 410190, "epoch": 2441} {"train_loss": -12.212014198303223, "global_step": 410191, "epoch": 2441} {"train_loss": -12.311002731323242, "global_step": 410192, "epoch": 2441} {"train_loss": -12.215429306030273, "global_step": 410193, "epoch": 2441} {"train_loss": -11.997289657592773, "global_step": 410194, "epoch": 2441} {"train_loss": -12.400708198547363, "global_step": 410195, "epoch": 2441} {"train_loss": -12.385345458984375, "global_step": 410196, "epoch": 2441} {"train_loss": -12.526667594909668, "global_step": 410197, "epoch": 2441} {"train_loss": -12.281526565551758, "global_step": 410198, "epoch": 2441} {"train_loss": -12.524284362792969, "global_step": 410199, "epoch": 2441} {"train_loss": -12.443744659423828, "global_step": 410200, "epoch": 2441} {"train_loss": -12.375653266906738, "global_step": 410201, "epoch": 2441} {"train_loss": -12.571203231811523, "global_step": 410202, "epoch": 2441} {"train_loss": -12.585840225219727, "global_step": 410203, "epoch": 2441} {"train_loss": -12.145261764526367, "global_step": 410204, "epoch": 2441} {"train_loss": -12.228099822998047, "global_step": 410205, "epoch": 2441} {"train_loss": -12.301599502563477, "global_step": 410206, "epoch": 2441} {"train_loss": -12.228635787963867, "global_step": 410207, "epoch": 2441} {"train_loss": -12.621639251708984, "global_step": 410208, "epoch": 2441} {"train_loss": -12.402042388916016, "global_step": 410209, "epoch": 2441} {"train_loss": -12.575136184692383, "global_step": 410210, "epoch": 2441} {"train_loss": -12.332351684570312, "global_step": 410211, "epoch": 2441} {"train_loss": -12.50904369354248, "global_step": 410212, "epoch": 2441} {"train_loss": -12.39680290222168, "global_step": 410213, "epoch": 2441} {"train_loss": -12.34070110321045, "global_step": 410214, "epoch": 2441} {"train_loss": -12.560482025146484, "global_step": 410215, "epoch": 2441} {"train_loss": -12.484441757202148, "global_step": 410216, "epoch": 2441} {"train_loss": -12.612075805664062, "global_step": 410217, "epoch": 2441} {"train_loss": -12.331453323364258, "global_step": 410218, "epoch": 2441} {"train_loss": -12.761859893798828, "global_step": 410219, "epoch": 2441} {"train_loss": -12.431131362915039, "global_step": 410220, "epoch": 2441} {"train_loss": -12.572954177856445, "global_step": 410221, "epoch": 2441} {"train_loss": -12.668676376342773, "global_step": 410222, "epoch": 2441} {"train_loss": -12.757568359375, "global_step": 410223, "epoch": 2441} {"train_loss": -12.537666320800781, "global_step": 410224, "epoch": 2441} {"train_loss": -12.815065383911133, "global_step": 410225, "epoch": 2441} {"train_loss": -12.659106254577637, "global_step": 410226, "epoch": 2441} {"train_loss": -12.701469421386719, "global_step": 410227, "epoch": 2441} {"train_loss": -12.664640426635742, "global_step": 410228, "epoch": 2441} {"train_loss": -12.562908172607422, "global_step": 410229, "epoch": 2441} {"train_loss": -12.800422668457031, "global_step": 410230, "epoch": 2441} {"train_loss": -12.599275588989258, "global_step": 410231, "epoch": 2441} {"train_loss": -11.991432189941406, "global_step": 410232, "epoch": 2441} {"train_loss": -12.267927169799805, "global_step": 410233, "epoch": 2441} {"train_loss": -12.593225479125977, "global_step": 410234, "epoch": 2441} {"train_loss": -12.385671615600586, "global_step": 410235, "epoch": 2441} {"train_loss": -12.215787887573242, "global_step": 410236, "epoch": 2441} {"train_loss": -11.951870918273926, "global_step": 410237, "epoch": 2441} {"train_loss": -12.63096809387207, "global_step": 410238, "epoch": 2441} {"train_loss": -12.39875602722168, "global_step": 410239, "epoch": 2441} {"train_loss": -12.90980052947998, "global_step": 410240, "epoch": 2441} {"train_loss": -12.649560928344727, "global_step": 410241, "epoch": 2441} {"train_loss": -12.630489349365234, "global_step": 410242, "epoch": 2441} {"train_loss": -12.498249053955078, "global_step": 410243, "epoch": 2441} {"train_loss": -12.6607084274292, "global_step": 410244, "epoch": 2441} {"train_loss": -12.408760070800781, "global_step": 410245, "epoch": 2441} {"train_loss": -12.81263542175293, "global_step": 410246, "epoch": 2441} {"train_loss": -12.477042198181152, "global_step": 410247, "epoch": 2441} {"train_loss": -12.591497421264648, "global_step": 410248, "epoch": 2441} {"train_loss": -12.532613754272461, "global_step": 410249, "epoch": 2441} {"train_loss": -12.392656326293945, "global_step": 410250, "epoch": 2441} {"train_loss": -12.752933502197266, "global_step": 410251, "epoch": 2441} {"train_loss": -12.487298965454102, "global_step": 410252, "epoch": 2441} {"train_loss": -12.302698135375977, "global_step": 410253, "epoch": 2441} {"train_loss": -12.383952140808105, "global_step": 410254, "epoch": 2441} {"train_loss": -12.107896333649045, "global_step": 410255, "epoch": 2441, "val_loss": 304770.8125} {"train_loss": -11.878929138183594, "global_step": 410256, "epoch": 2442} {"train_loss": -12.725776672363281, "global_step": 410257, "epoch": 2442} {"train_loss": -12.177650451660156, "global_step": 410258, "epoch": 2442} {"train_loss": -12.247203826904297, "global_step": 410259, "epoch": 2442} {"train_loss": -12.126216888427734, "global_step": 410260, "epoch": 2442} {"train_loss": -12.340885162353516, "global_step": 410261, "epoch": 2442} {"train_loss": -11.696706771850586, "global_step": 410262, "epoch": 2442} {"train_loss": -12.329177856445312, "global_step": 410263, "epoch": 2442} {"train_loss": -11.902027130126953, "global_step": 410264, "epoch": 2442} {"train_loss": -12.500268936157227, "global_step": 410265, "epoch": 2442} {"train_loss": -11.648748397827148, "global_step": 410266, "epoch": 2442} {"train_loss": -12.009087562561035, "global_step": 410267, "epoch": 2442} {"train_loss": -11.705357551574707, "global_step": 410268, "epoch": 2442} {"train_loss": -12.083121299743652, "global_step": 410269, "epoch": 2442} {"train_loss": -11.218864440917969, "global_step": 410270, "epoch": 2442} {"train_loss": -11.806380271911621, "global_step": 410271, "epoch": 2442} {"train_loss": -11.592097282409668, "global_step": 410272, "epoch": 2442} {"train_loss": -11.799571990966797, "global_step": 410273, "epoch": 2442} {"train_loss": -11.687746047973633, "global_step": 410274, "epoch": 2442} {"train_loss": -11.50084400177002, "global_step": 410275, "epoch": 2442} {"train_loss": -11.238224983215332, "global_step": 410276, "epoch": 2442} {"train_loss": -11.570544242858887, "global_step": 410277, "epoch": 2442} {"train_loss": -9.356239318847656, "global_step": 410278, "epoch": 2442} {"train_loss": -9.732329368591309, "global_step": 410279, "epoch": 2442} {"train_loss": -10.774030685424805, "global_step": 410280, "epoch": 2442} {"train_loss": -10.08517074584961, "global_step": 410281, "epoch": 2442} {"train_loss": -9.614204406738281, "global_step": 410282, "epoch": 2442} {"train_loss": -9.70169448852539, "global_step": 410283, "epoch": 2442} {"train_loss": -11.073217391967773, "global_step": 410284, "epoch": 2442} {"train_loss": -9.873695373535156, "global_step": 410285, "epoch": 2442} {"train_loss": -10.808226585388184, "global_step": 410286, "epoch": 2442} {"train_loss": -10.581165313720703, "global_step": 410287, "epoch": 2442} {"train_loss": -11.159778594970703, "global_step": 410288, "epoch": 2442} {"train_loss": -11.320877075195312, "global_step": 410289, "epoch": 2442} {"train_loss": -11.124112129211426, "global_step": 410290, "epoch": 2442} {"train_loss": -11.597169876098633, "global_step": 410291, "epoch": 2442} {"train_loss": -10.567774772644043, "global_step": 410292, "epoch": 2442} {"train_loss": -10.71572494506836, "global_step": 410293, "epoch": 2442} {"train_loss": -11.023947715759277, "global_step": 410294, "epoch": 2442} {"train_loss": -10.837553024291992, "global_step": 410295, "epoch": 2442} {"train_loss": -11.991024017333984, "global_step": 410296, "epoch": 2442} {"train_loss": -11.215519905090332, "global_step": 410297, "epoch": 2442} {"train_loss": -11.332862854003906, "global_step": 410298, "epoch": 2442} {"train_loss": -11.297219276428223, "global_step": 410299, "epoch": 2442} {"train_loss": -11.246338844299316, "global_step": 410300, "epoch": 2442} {"train_loss": -11.727838516235352, "global_step": 410301, "epoch": 2442} {"train_loss": -11.443912506103516, "global_step": 410302, "epoch": 2442} {"train_loss": -10.451492309570312, "global_step": 410303, "epoch": 2442} {"train_loss": -12.24215316772461, "global_step": 410304, "epoch": 2442} {"train_loss": -10.76750373840332, "global_step": 410305, "epoch": 2442} {"train_loss": -11.881292343139648, "global_step": 410306, "epoch": 2442} {"train_loss": -11.563705444335938, "global_step": 410307, "epoch": 2442} {"train_loss": -11.411870956420898, "global_step": 410308, "epoch": 2442} {"train_loss": -11.945273399353027, "global_step": 410309, "epoch": 2442} {"train_loss": -11.190412521362305, "global_step": 410310, "epoch": 2442} {"train_loss": -12.165525436401367, "global_step": 410311, "epoch": 2442} {"train_loss": -11.913864135742188, "global_step": 410312, "epoch": 2442} {"train_loss": -11.696584701538086, "global_step": 410313, "epoch": 2442} {"train_loss": -12.26580810546875, "global_step": 410314, "epoch": 2442} {"train_loss": -11.966564178466797, "global_step": 410315, "epoch": 2442} {"train_loss": -12.215351104736328, "global_step": 410316, "epoch": 2442} {"train_loss": -12.235827445983887, "global_step": 410317, "epoch": 2442} {"train_loss": -12.058319091796875, "global_step": 410318, "epoch": 2442} {"train_loss": -12.277323722839355, "global_step": 410319, "epoch": 2442} {"train_loss": -12.046123504638672, "global_step": 410320, "epoch": 2442} {"train_loss": -12.336883544921875, "global_step": 410321, "epoch": 2442} {"train_loss": -11.945104598999023, "global_step": 410322, "epoch": 2442} {"train_loss": -12.06450080871582, "global_step": 410323, "epoch": 2442} {"train_loss": -12.125358581542969, "global_step": 410324, "epoch": 2442} {"train_loss": -11.562238693237305, "global_step": 410325, "epoch": 2442} {"train_loss": -12.134651184082031, "global_step": 410326, "epoch": 2442} {"train_loss": -12.09942626953125, "global_step": 410327, "epoch": 2442} {"train_loss": -11.978530883789062, "global_step": 410328, "epoch": 2442} {"train_loss": -12.313536643981934, "global_step": 410329, "epoch": 2442} {"train_loss": -12.062193870544434, "global_step": 410330, "epoch": 2442} {"train_loss": -11.967638969421387, "global_step": 410331, "epoch": 2442} {"train_loss": -11.8975830078125, "global_step": 410332, "epoch": 2442} {"train_loss": -12.021890640258789, "global_step": 410333, "epoch": 2442} {"train_loss": -12.310808181762695, "global_step": 410334, "epoch": 2442} {"train_loss": -12.097643852233887, "global_step": 410335, "epoch": 2442} {"train_loss": -12.433174133300781, "global_step": 410336, "epoch": 2442} {"train_loss": -12.465988159179688, "global_step": 410337, "epoch": 2442} {"train_loss": -12.582950592041016, "global_step": 410338, "epoch": 2442} {"train_loss": -12.53715705871582, "global_step": 410339, "epoch": 2442} {"train_loss": -12.457389831542969, "global_step": 410340, "epoch": 2442} {"train_loss": -12.457524299621582, "global_step": 410341, "epoch": 2442} {"train_loss": -12.304530143737793, "global_step": 410342, "epoch": 2442} {"train_loss": -12.437599182128906, "global_step": 410343, "epoch": 2442} {"train_loss": -12.463362693786621, "global_step": 410344, "epoch": 2442} {"train_loss": -12.362666130065918, "global_step": 410345, "epoch": 2442} {"train_loss": -12.452619552612305, "global_step": 410346, "epoch": 2442} {"train_loss": -12.416549682617188, "global_step": 410347, "epoch": 2442} {"train_loss": -12.282002449035645, "global_step": 410348, "epoch": 2442} {"train_loss": -12.358601570129395, "global_step": 410349, "epoch": 2442} {"train_loss": -12.480640411376953, "global_step": 410350, "epoch": 2442} {"train_loss": -12.406268119812012, "global_step": 410351, "epoch": 2442} {"train_loss": -12.052119255065918, "global_step": 410352, "epoch": 2442} {"train_loss": -12.40804672241211, "global_step": 410353, "epoch": 2442} {"train_loss": -12.467164039611816, "global_step": 410354, "epoch": 2442} {"train_loss": -12.521339416503906, "global_step": 410355, "epoch": 2442} {"train_loss": -12.303177833557129, "global_step": 410356, "epoch": 2442} {"train_loss": -12.397882461547852, "global_step": 410357, "epoch": 2442} {"train_loss": -11.364751815795898, "global_step": 410358, "epoch": 2442} {"train_loss": -12.48162841796875, "global_step": 410359, "epoch": 2442} {"train_loss": -11.26432991027832, "global_step": 410360, "epoch": 2442} {"train_loss": -12.425339698791504, "global_step": 410361, "epoch": 2442} {"train_loss": -12.135860443115234, "global_step": 410362, "epoch": 2442} {"train_loss": -12.177717208862305, "global_step": 410363, "epoch": 2442} {"train_loss": -12.119359970092773, "global_step": 410364, "epoch": 2442} {"train_loss": -12.630059242248535, "global_step": 410365, "epoch": 2442} {"train_loss": -12.435957908630371, "global_step": 410366, "epoch": 2442} {"train_loss": -12.329612731933594, "global_step": 410367, "epoch": 2442} {"train_loss": -12.526342391967773, "global_step": 410368, "epoch": 2442} {"train_loss": -12.222322463989258, "global_step": 410369, "epoch": 2442} {"train_loss": -12.414985656738281, "global_step": 410370, "epoch": 2442} {"train_loss": -12.199577331542969, "global_step": 410371, "epoch": 2442} {"train_loss": -12.261404037475586, "global_step": 410372, "epoch": 2442} {"train_loss": -12.096647262573242, "global_step": 410373, "epoch": 2442} {"train_loss": -12.499996185302734, "global_step": 410374, "epoch": 2442} {"train_loss": -12.26165771484375, "global_step": 410375, "epoch": 2442} {"train_loss": -12.521576881408691, "global_step": 410376, "epoch": 2442} {"train_loss": -12.335883140563965, "global_step": 410377, "epoch": 2442} {"train_loss": -12.494865417480469, "global_step": 410378, "epoch": 2442} {"train_loss": -12.466039657592773, "global_step": 410379, "epoch": 2442} {"train_loss": -12.44993782043457, "global_step": 410380, "epoch": 2442} {"train_loss": -12.569503784179688, "global_step": 410381, "epoch": 2442} {"train_loss": -12.82255744934082, "global_step": 410382, "epoch": 2442} {"train_loss": -12.361950874328613, "global_step": 410383, "epoch": 2442} {"train_loss": -12.764205932617188, "global_step": 410384, "epoch": 2442} {"train_loss": -12.238170623779297, "global_step": 410385, "epoch": 2442} {"train_loss": -12.423311233520508, "global_step": 410386, "epoch": 2442} {"train_loss": -12.597290992736816, "global_step": 410387, "epoch": 2442} {"train_loss": -12.433475494384766, "global_step": 410388, "epoch": 2442} {"train_loss": -12.625411033630371, "global_step": 410389, "epoch": 2442} {"train_loss": -12.77566909790039, "global_step": 410390, "epoch": 2442} {"train_loss": -12.469125747680664, "global_step": 410391, "epoch": 2442} {"train_loss": -12.586861610412598, "global_step": 410392, "epoch": 2442} {"train_loss": -12.479427337646484, "global_step": 410393, "epoch": 2442} {"train_loss": -12.598413467407227, "global_step": 410394, "epoch": 2442} {"train_loss": -12.319540023803711, "global_step": 410395, "epoch": 2442} {"train_loss": -12.616912841796875, "global_step": 410396, "epoch": 2442} {"train_loss": -12.416146278381348, "global_step": 410397, "epoch": 2442} {"train_loss": -12.33414363861084, "global_step": 410398, "epoch": 2442} {"train_loss": -11.104551315307617, "global_step": 410399, "epoch": 2442} {"train_loss": -11.667831420898438, "global_step": 410400, "epoch": 2442} {"train_loss": -12.17408561706543, "global_step": 410401, "epoch": 2442} {"train_loss": -12.175830841064453, "global_step": 410402, "epoch": 2442} {"train_loss": -11.153879165649414, "global_step": 410403, "epoch": 2442} {"train_loss": -12.287483215332031, "global_step": 410404, "epoch": 2442} {"train_loss": -10.70135498046875, "global_step": 410405, "epoch": 2442} {"train_loss": -11.472251892089844, "global_step": 410406, "epoch": 2442} {"train_loss": -12.0038423538208, "global_step": 410407, "epoch": 2442} {"train_loss": -11.885761260986328, "global_step": 410408, "epoch": 2442} {"train_loss": -11.566739082336426, "global_step": 410409, "epoch": 2442} {"train_loss": -12.257073402404785, "global_step": 410410, "epoch": 2442} {"train_loss": -11.295548439025879, "global_step": 410411, "epoch": 2442} {"train_loss": -10.689872741699219, "global_step": 410412, "epoch": 2442} {"train_loss": -12.404212951660156, "global_step": 410413, "epoch": 2442} {"train_loss": -11.897340774536133, "global_step": 410414, "epoch": 2442} {"train_loss": -9.65455436706543, "global_step": 410415, "epoch": 2442} {"train_loss": -12.090719223022461, "global_step": 410416, "epoch": 2442} {"train_loss": -10.126920700073242, "global_step": 410417, "epoch": 2442} {"train_loss": -10.800484657287598, "global_step": 410418, "epoch": 2442} {"train_loss": -11.50885009765625, "global_step": 410419, "epoch": 2442} {"train_loss": -10.123689651489258, "global_step": 410420, "epoch": 2442} {"train_loss": -9.74363899230957, "global_step": 410421, "epoch": 2442} {"train_loss": -10.222513198852539, "global_step": 410422, "epoch": 2442} {"train_loss": -11.83547822634379, "global_step": 410423, "epoch": 2442, "val_loss": 307213.8125} {"train_loss": -9.761377334594727, "global_step": 410424, "epoch": 2443} {"train_loss": -11.414390563964844, "global_step": 410425, "epoch": 2443} {"train_loss": -9.999695777893066, "global_step": 410426, "epoch": 2443} {"train_loss": -10.347969055175781, "global_step": 410427, "epoch": 2443} {"train_loss": -11.723077774047852, "global_step": 410428, "epoch": 2443} {"train_loss": -11.316652297973633, "global_step": 410429, "epoch": 2443} {"train_loss": -11.879585266113281, "global_step": 410430, "epoch": 2443} {"train_loss": -11.231843948364258, "global_step": 410431, "epoch": 2443} {"train_loss": -11.969371795654297, "global_step": 410432, "epoch": 2443} {"train_loss": -11.718544006347656, "global_step": 410433, "epoch": 2443} {"train_loss": -11.870282173156738, "global_step": 410434, "epoch": 2443} {"train_loss": -11.65578842163086, "global_step": 410435, "epoch": 2443} {"train_loss": -11.460214614868164, "global_step": 410436, "epoch": 2443} {"train_loss": -11.993034362792969, "global_step": 410437, "epoch": 2443} {"train_loss": -11.882711410522461, "global_step": 410438, "epoch": 2443} {"train_loss": -12.073004722595215, "global_step": 410439, "epoch": 2443} {"train_loss": -12.23259162902832, "global_step": 410440, "epoch": 2443} {"train_loss": -11.886832237243652, "global_step": 410441, "epoch": 2443} {"train_loss": -12.222566604614258, "global_step": 410442, "epoch": 2443} {"train_loss": -12.085460662841797, "global_step": 410443, "epoch": 2443} {"train_loss": -11.916179656982422, "global_step": 410444, "epoch": 2443} {"train_loss": -12.19300651550293, "global_step": 410445, "epoch": 2443} {"train_loss": -12.062870979309082, "global_step": 410446, "epoch": 2443} {"train_loss": -12.032804489135742, "global_step": 410447, "epoch": 2443} {"train_loss": -12.285160064697266, "global_step": 410448, "epoch": 2443} {"train_loss": -12.26093864440918, "global_step": 410449, "epoch": 2443} {"train_loss": -12.115951538085938, "global_step": 410450, "epoch": 2443} {"train_loss": -12.177502632141113, "global_step": 410451, "epoch": 2443} {"train_loss": -11.908650398254395, "global_step": 410452, "epoch": 2443} {"train_loss": -11.973315238952637, "global_step": 410453, "epoch": 2443} {"train_loss": -12.195211410522461, "global_step": 410454, "epoch": 2443} {"train_loss": -12.335917472839355, "global_step": 410455, "epoch": 2443} {"train_loss": -11.731794357299805, "global_step": 410456, "epoch": 2443} {"train_loss": -12.313889503479004, "global_step": 410457, "epoch": 2443} {"train_loss": -11.569942474365234, "global_step": 410458, "epoch": 2443} {"train_loss": -12.27741813659668, "global_step": 410459, "epoch": 2443} {"train_loss": -12.099031448364258, "global_step": 410460, "epoch": 2443} {"train_loss": -12.415803909301758, "global_step": 410461, "epoch": 2443} {"train_loss": -12.043668746948242, "global_step": 410462, "epoch": 2443} {"train_loss": -12.16535758972168, "global_step": 410463, "epoch": 2443} {"train_loss": -11.93319034576416, "global_step": 410464, "epoch": 2443} {"train_loss": -12.35583209991455, "global_step": 410465, "epoch": 2443} {"train_loss": -11.78617000579834, "global_step": 410466, "epoch": 2443} {"train_loss": -11.404195785522461, "global_step": 410467, "epoch": 2443} {"train_loss": -11.068073272705078, "global_step": 410468, "epoch": 2443} {"train_loss": -12.12247085571289, "global_step": 410469, "epoch": 2443} {"train_loss": -11.391620635986328, "global_step": 410470, "epoch": 2443} {"train_loss": -12.422542572021484, "global_step": 410471, "epoch": 2443} {"train_loss": -11.916899681091309, "global_step": 410472, "epoch": 2443} {"train_loss": -11.924795150756836, "global_step": 410473, "epoch": 2443} {"train_loss": -11.791338920593262, "global_step": 410474, "epoch": 2443} {"train_loss": -12.140508651733398, "global_step": 410475, "epoch": 2443} {"train_loss": -12.39326286315918, "global_step": 410476, "epoch": 2443} {"train_loss": -12.034780502319336, "global_step": 410477, "epoch": 2443} {"train_loss": -12.41166877746582, "global_step": 410478, "epoch": 2443} {"train_loss": -11.937671661376953, "global_step": 410479, "epoch": 2443} {"train_loss": -12.20811939239502, "global_step": 410480, "epoch": 2443} {"train_loss": -12.416322708129883, "global_step": 410481, "epoch": 2443} {"train_loss": -12.301532745361328, "global_step": 410482, "epoch": 2443} {"train_loss": -12.3509521484375, "global_step": 410483, "epoch": 2443} {"train_loss": -12.0722074508667, "global_step": 410484, "epoch": 2443} {"train_loss": -12.428250312805176, "global_step": 410485, "epoch": 2443} {"train_loss": -12.309272766113281, "global_step": 410486, "epoch": 2443} {"train_loss": -12.416655540466309, "global_step": 410487, "epoch": 2443} {"train_loss": -11.784086227416992, "global_step": 410488, "epoch": 2443} {"train_loss": -12.236510276794434, "global_step": 410489, "epoch": 2443} {"train_loss": -11.52775764465332, "global_step": 410490, "epoch": 2443} {"train_loss": -11.749055862426758, "global_step": 410491, "epoch": 2443} {"train_loss": -11.017401695251465, "global_step": 410492, "epoch": 2443} {"train_loss": -11.293654441833496, "global_step": 410493, "epoch": 2443} {"train_loss": -10.50506591796875, "global_step": 410494, "epoch": 2443} {"train_loss": -10.071232795715332, "global_step": 410495, "epoch": 2443} {"train_loss": -10.106168746948242, "global_step": 410496, "epoch": 2443} {"train_loss": -11.423551559448242, "global_step": 410497, "epoch": 2443} {"train_loss": -10.90615177154541, "global_step": 410498, "epoch": 2443} {"train_loss": -11.46000862121582, "global_step": 410499, "epoch": 2443} {"train_loss": -11.784660339355469, "global_step": 410500, "epoch": 2443} {"train_loss": -11.586196899414062, "global_step": 410501, "epoch": 2443} {"train_loss": -11.938263893127441, "global_step": 410502, "epoch": 2443} {"train_loss": -11.199823379516602, "global_step": 410503, "epoch": 2443} {"train_loss": -12.154684066772461, "global_step": 410504, "epoch": 2443} {"train_loss": -11.711902618408203, "global_step": 410505, "epoch": 2443} {"train_loss": -12.017847061157227, "global_step": 410506, "epoch": 2443} {"train_loss": -11.890434265136719, "global_step": 410507, "epoch": 2443} {"train_loss": -12.01517105102539, "global_step": 410508, "epoch": 2443} {"train_loss": -12.120513916015625, "global_step": 410509, "epoch": 2443} {"train_loss": -11.930880546569824, "global_step": 410510, "epoch": 2443} {"train_loss": -12.173589706420898, "global_step": 410511, "epoch": 2443} {"train_loss": -11.789810180664062, "global_step": 410512, "epoch": 2443} {"train_loss": -11.793558120727539, "global_step": 410513, "epoch": 2443} {"train_loss": -12.064263343811035, "global_step": 410514, "epoch": 2443} {"train_loss": -12.005927085876465, "global_step": 410515, "epoch": 2443} {"train_loss": -11.99083137512207, "global_step": 410516, "epoch": 2443} {"train_loss": -12.088041305541992, "global_step": 410517, "epoch": 2443} {"train_loss": -11.95361328125, "global_step": 410518, "epoch": 2443} {"train_loss": -11.882661819458008, "global_step": 410519, "epoch": 2443} {"train_loss": -11.86976432800293, "global_step": 410520, "epoch": 2443} {"train_loss": -12.107732772827148, "global_step": 410521, "epoch": 2443} {"train_loss": -12.126983642578125, "global_step": 410522, "epoch": 2443} {"train_loss": -12.058599472045898, "global_step": 410523, "epoch": 2443} {"train_loss": -12.241299629211426, "global_step": 410524, "epoch": 2443} {"train_loss": -11.984197616577148, "global_step": 410525, "epoch": 2443} {"train_loss": -12.265043258666992, "global_step": 410526, "epoch": 2443} {"train_loss": -11.98741626739502, "global_step": 410527, "epoch": 2443} {"train_loss": -12.451150894165039, "global_step": 410528, "epoch": 2443} {"train_loss": -12.170970916748047, "global_step": 410529, "epoch": 2443} {"train_loss": -12.217529296875, "global_step": 410530, "epoch": 2443} {"train_loss": -12.202052116394043, "global_step": 410531, "epoch": 2443} {"train_loss": -12.343183517456055, "global_step": 410532, "epoch": 2443} {"train_loss": -12.347874641418457, "global_step": 410533, "epoch": 2443} {"train_loss": -12.478048324584961, "global_step": 410534, "epoch": 2443} {"train_loss": -12.323923110961914, "global_step": 410535, "epoch": 2443} {"train_loss": -12.471240997314453, "global_step": 410536, "epoch": 2443} {"train_loss": -12.434450149536133, "global_step": 410537, "epoch": 2443} {"train_loss": -12.229536056518555, "global_step": 410538, "epoch": 2443} {"train_loss": -12.339197158813477, "global_step": 410539, "epoch": 2443} {"train_loss": -12.279747009277344, "global_step": 410540, "epoch": 2443} {"train_loss": -12.438517570495605, "global_step": 410541, "epoch": 2443} {"train_loss": -12.50282096862793, "global_step": 410542, "epoch": 2443} {"train_loss": -12.260750770568848, "global_step": 410543, "epoch": 2443} {"train_loss": -12.516166687011719, "global_step": 410544, "epoch": 2443} {"train_loss": -12.364054679870605, "global_step": 410545, "epoch": 2443} {"train_loss": -12.629426956176758, "global_step": 410546, "epoch": 2443} {"train_loss": -12.369582176208496, "global_step": 410547, "epoch": 2443} {"train_loss": -12.502716064453125, "global_step": 410548, "epoch": 2443} {"train_loss": -12.44249153137207, "global_step": 410549, "epoch": 2443} {"train_loss": -12.545101165771484, "global_step": 410550, "epoch": 2443} {"train_loss": -12.601103782653809, "global_step": 410551, "epoch": 2443} {"train_loss": -12.478809356689453, "global_step": 410552, "epoch": 2443} {"train_loss": -12.711523056030273, "global_step": 410553, "epoch": 2443} {"train_loss": -12.634689331054688, "global_step": 410554, "epoch": 2443} {"train_loss": -12.434247016906738, "global_step": 410555, "epoch": 2443} {"train_loss": -11.910001754760742, "global_step": 410556, "epoch": 2443} {"train_loss": -12.242645263671875, "global_step": 410557, "epoch": 2443} {"train_loss": -12.654867172241211, "global_step": 410558, "epoch": 2443} {"train_loss": -12.335172653198242, "global_step": 410559, "epoch": 2443} {"train_loss": -12.448246002197266, "global_step": 410560, "epoch": 2443} {"train_loss": -12.724550247192383, "global_step": 410561, "epoch": 2443} {"train_loss": -12.374645233154297, "global_step": 410562, "epoch": 2443} {"train_loss": -12.487932205200195, "global_step": 410563, "epoch": 2443} {"train_loss": -12.702131271362305, "global_step": 410564, "epoch": 2443} {"train_loss": -12.384700775146484, "global_step": 410565, "epoch": 2443} {"train_loss": -11.887545585632324, "global_step": 410566, "epoch": 2443} {"train_loss": -12.330205917358398, "global_step": 410567, "epoch": 2443} {"train_loss": -12.329263687133789, "global_step": 410568, "epoch": 2443} {"train_loss": -11.803997039794922, "global_step": 410569, "epoch": 2443} {"train_loss": -12.726016998291016, "global_step": 410570, "epoch": 2443} {"train_loss": -11.995574951171875, "global_step": 410571, "epoch": 2443} {"train_loss": -12.573524475097656, "global_step": 410572, "epoch": 2443} {"train_loss": -12.3232421875, "global_step": 410573, "epoch": 2443} {"train_loss": -11.551847457885742, "global_step": 410574, "epoch": 2443} {"train_loss": -11.946582794189453, "global_step": 410575, "epoch": 2443} {"train_loss": -12.290578842163086, "global_step": 410576, "epoch": 2443} {"train_loss": -10.65350341796875, "global_step": 410577, "epoch": 2443} {"train_loss": -9.221685409545898, "global_step": 410578, "epoch": 2443} {"train_loss": -12.243988037109375, "global_step": 410579, "epoch": 2443} {"train_loss": -10.046770095825195, "global_step": 410580, "epoch": 2443} {"train_loss": -11.455934524536133, "global_step": 410581, "epoch": 2443} {"train_loss": -11.83223819732666, "global_step": 410582, "epoch": 2443} {"train_loss": -10.260160446166992, "global_step": 410583, "epoch": 2443} {"train_loss": -10.807685852050781, "global_step": 410584, "epoch": 2443} {"train_loss": -11.00654411315918, "global_step": 410585, "epoch": 2443} {"train_loss": -10.454643249511719, "global_step": 410586, "epoch": 2443} {"train_loss": -11.317686080932617, "global_step": 410587, "epoch": 2443} {"train_loss": -11.70933723449707, "global_step": 410588, "epoch": 2443} {"train_loss": -9.118606567382812, "global_step": 410589, "epoch": 2443} {"train_loss": -11.384053230285645, "global_step": 410590, "epoch": 2443} {"train_loss": -11.896250838325138, "global_step": 410591, "epoch": 2443, "val_loss": 302803.71875} {"train_loss": -10.68692398071289, "global_step": 410592, "epoch": 2444} {"train_loss": -11.345165252685547, "global_step": 410593, "epoch": 2444} {"train_loss": -9.893265724182129, "global_step": 410594, "epoch": 2444} {"train_loss": -11.07307243347168, "global_step": 410595, "epoch": 2444} {"train_loss": -10.22646427154541, "global_step": 410596, "epoch": 2444} {"train_loss": -11.619354248046875, "global_step": 410597, "epoch": 2444} {"train_loss": -10.038444519042969, "global_step": 410598, "epoch": 2444} {"train_loss": -11.57811164855957, "global_step": 410599, "epoch": 2444} {"train_loss": -10.761970520019531, "global_step": 410600, "epoch": 2444} {"train_loss": -11.69921875, "global_step": 410601, "epoch": 2444} {"train_loss": -10.97866439819336, "global_step": 410602, "epoch": 2444} {"train_loss": -11.488433837890625, "global_step": 410603, "epoch": 2444} {"train_loss": -11.189168930053711, "global_step": 410604, "epoch": 2444} {"train_loss": -11.937650680541992, "global_step": 410605, "epoch": 2444} {"train_loss": -11.773992538452148, "global_step": 410606, "epoch": 2444} {"train_loss": -11.812625885009766, "global_step": 410607, "epoch": 2444} {"train_loss": -11.261163711547852, "global_step": 410608, "epoch": 2444} {"train_loss": -11.63187026977539, "global_step": 410609, "epoch": 2444} {"train_loss": -11.93172836303711, "global_step": 410610, "epoch": 2444} {"train_loss": -11.552129745483398, "global_step": 410611, "epoch": 2444} {"train_loss": -12.300503730773926, "global_step": 410612, "epoch": 2444} {"train_loss": -11.84764575958252, "global_step": 410613, "epoch": 2444} {"train_loss": -12.213835716247559, "global_step": 410614, "epoch": 2444} {"train_loss": -12.134400367736816, "global_step": 410615, "epoch": 2444} {"train_loss": -12.100013732910156, "global_step": 410616, "epoch": 2444} {"train_loss": -12.186371803283691, "global_step": 410617, "epoch": 2444} {"train_loss": -12.044021606445312, "global_step": 410618, "epoch": 2444} {"train_loss": -12.340692520141602, "global_step": 410619, "epoch": 2444} {"train_loss": -12.219416618347168, "global_step": 410620, "epoch": 2444} {"train_loss": -12.196192741394043, "global_step": 410621, "epoch": 2444} {"train_loss": -11.980062484741211, "global_step": 410622, "epoch": 2444} {"train_loss": -12.157963752746582, "global_step": 410623, "epoch": 2444} {"train_loss": -12.320691108703613, "global_step": 410624, "epoch": 2444} {"train_loss": -12.297558784484863, "global_step": 410625, "epoch": 2444} {"train_loss": -12.365884780883789, "global_step": 410626, "epoch": 2444} {"train_loss": -12.361736297607422, "global_step": 410627, "epoch": 2444} {"train_loss": -12.394657135009766, "global_step": 410628, "epoch": 2444} {"train_loss": -12.360188484191895, "global_step": 410629, "epoch": 2444} {"train_loss": -12.091594696044922, "global_step": 410630, "epoch": 2444} {"train_loss": -12.495570182800293, "global_step": 410631, "epoch": 2444} {"train_loss": -12.38718318939209, "global_step": 410632, "epoch": 2444} {"train_loss": -12.465442657470703, "global_step": 410633, "epoch": 2444} {"train_loss": -12.344282150268555, "global_step": 410634, "epoch": 2444} {"train_loss": -12.275690078735352, "global_step": 410635, "epoch": 2444} {"train_loss": -12.279409408569336, "global_step": 410636, "epoch": 2444} {"train_loss": -12.259531021118164, "global_step": 410637, "epoch": 2444} {"train_loss": -12.278152465820312, "global_step": 410638, "epoch": 2444} {"train_loss": -12.399195671081543, "global_step": 410639, "epoch": 2444} {"train_loss": -12.17776870727539, "global_step": 410640, "epoch": 2444} {"train_loss": -12.444485664367676, "global_step": 410641, "epoch": 2444} {"train_loss": -12.23658561706543, "global_step": 410642, "epoch": 2444} {"train_loss": -12.466384887695312, "global_step": 410643, "epoch": 2444} {"train_loss": -12.28133773803711, "global_step": 410644, "epoch": 2444} {"train_loss": -12.112129211425781, "global_step": 410645, "epoch": 2444} {"train_loss": -12.515153884887695, "global_step": 410646, "epoch": 2444} {"train_loss": -11.944865226745605, "global_step": 410647, "epoch": 2444} {"train_loss": -12.532380104064941, "global_step": 410648, "epoch": 2444} {"train_loss": -12.24136734008789, "global_step": 410649, "epoch": 2444} {"train_loss": -12.163846969604492, "global_step": 410650, "epoch": 2444} {"train_loss": -12.79472541809082, "global_step": 410651, "epoch": 2444} {"train_loss": -12.130378723144531, "global_step": 410652, "epoch": 2444} {"train_loss": -12.637299537658691, "global_step": 410653, "epoch": 2444} {"train_loss": -12.216571807861328, "global_step": 410654, "epoch": 2444} {"train_loss": -12.315926551818848, "global_step": 410655, "epoch": 2444} {"train_loss": -12.369061470031738, "global_step": 410656, "epoch": 2444} {"train_loss": -12.215852737426758, "global_step": 410657, "epoch": 2444} {"train_loss": -12.5709228515625, "global_step": 410658, "epoch": 2444} {"train_loss": -12.160778045654297, "global_step": 410659, "epoch": 2444} {"train_loss": -12.322430610656738, "global_step": 410660, "epoch": 2444} {"train_loss": -12.23476791381836, "global_step": 410661, "epoch": 2444} {"train_loss": -12.246906280517578, "global_step": 410662, "epoch": 2444} {"train_loss": -11.95533275604248, "global_step": 410663, "epoch": 2444} {"train_loss": -12.539722442626953, "global_step": 410664, "epoch": 2444} {"train_loss": -12.302734375, "global_step": 410665, "epoch": 2444} {"train_loss": -12.188660621643066, "global_step": 410666, "epoch": 2444} {"train_loss": -12.109411239624023, "global_step": 410667, "epoch": 2444} {"train_loss": -11.693900108337402, "global_step": 410668, "epoch": 2444} {"train_loss": -11.961977005004883, "global_step": 410669, "epoch": 2444} {"train_loss": -11.690181732177734, "global_step": 410670, "epoch": 2444} {"train_loss": -12.339478492736816, "global_step": 410671, "epoch": 2444} {"train_loss": -11.855438232421875, "global_step": 410672, "epoch": 2444} {"train_loss": -11.45214557647705, "global_step": 410673, "epoch": 2444} {"train_loss": -10.74460506439209, "global_step": 410674, "epoch": 2444} {"train_loss": -11.295852661132812, "global_step": 410675, "epoch": 2444} {"train_loss": -9.994522094726562, "global_step": 410676, "epoch": 2444} {"train_loss": -11.964908599853516, "global_step": 410677, "epoch": 2444} {"train_loss": -9.743481636047363, "global_step": 410678, "epoch": 2444} {"train_loss": -11.993473052978516, "global_step": 410679, "epoch": 2444} {"train_loss": -10.350616455078125, "global_step": 410680, "epoch": 2444} {"train_loss": -12.323343276977539, "global_step": 410681, "epoch": 2444} {"train_loss": -11.704975128173828, "global_step": 410682, "epoch": 2444} {"train_loss": -11.503278732299805, "global_step": 410683, "epoch": 2444} {"train_loss": -11.190711975097656, "global_step": 410684, "epoch": 2444} {"train_loss": -11.567380905151367, "global_step": 410685, "epoch": 2444} {"train_loss": -11.432646751403809, "global_step": 410686, "epoch": 2444} {"train_loss": -11.970083236694336, "global_step": 410687, "epoch": 2444} {"train_loss": -9.880977630615234, "global_step": 410688, "epoch": 2444} {"train_loss": -10.110122680664062, "global_step": 410689, "epoch": 2444} {"train_loss": -11.483160018920898, "global_step": 410690, "epoch": 2444} {"train_loss": -11.328638076782227, "global_step": 410691, "epoch": 2444} {"train_loss": -12.034666061401367, "global_step": 410692, "epoch": 2444} {"train_loss": -11.381425857543945, "global_step": 410693, "epoch": 2444} {"train_loss": -12.017631530761719, "global_step": 410694, "epoch": 2444} {"train_loss": -11.7838773727417, "global_step": 410695, "epoch": 2444} {"train_loss": -12.159490585327148, "global_step": 410696, "epoch": 2444} {"train_loss": -11.429998397827148, "global_step": 410697, "epoch": 2444} {"train_loss": -11.967533111572266, "global_step": 410698, "epoch": 2444} {"train_loss": -11.681856155395508, "global_step": 410699, "epoch": 2444} {"train_loss": -11.910575866699219, "global_step": 410700, "epoch": 2444} {"train_loss": -11.674616813659668, "global_step": 410701, "epoch": 2444} {"train_loss": -11.979037284851074, "global_step": 410702, "epoch": 2444} {"train_loss": -11.284865379333496, "global_step": 410703, "epoch": 2444} {"train_loss": -12.213554382324219, "global_step": 410704, "epoch": 2444} {"train_loss": -12.146904945373535, "global_step": 410705, "epoch": 2444} {"train_loss": -11.973701477050781, "global_step": 410706, "epoch": 2444} {"train_loss": -11.958574295043945, "global_step": 410707, "epoch": 2444} {"train_loss": -12.413352012634277, "global_step": 410708, "epoch": 2444} {"train_loss": -10.975187301635742, "global_step": 410709, "epoch": 2444} {"train_loss": -12.454353332519531, "global_step": 410710, "epoch": 2444} {"train_loss": -11.191763877868652, "global_step": 410711, "epoch": 2444} {"train_loss": -12.445610046386719, "global_step": 410712, "epoch": 2444} {"train_loss": -11.592053413391113, "global_step": 410713, "epoch": 2444} {"train_loss": -12.258255004882812, "global_step": 410714, "epoch": 2444} {"train_loss": -11.766496658325195, "global_step": 410715, "epoch": 2444} {"train_loss": -11.940332412719727, "global_step": 410716, "epoch": 2444} {"train_loss": -11.424027442932129, "global_step": 410717, "epoch": 2444} {"train_loss": -12.054754257202148, "global_step": 410718, "epoch": 2444} {"train_loss": -11.692726135253906, "global_step": 410719, "epoch": 2444} {"train_loss": -12.083335876464844, "global_step": 410720, "epoch": 2444} {"train_loss": -12.29906940460205, "global_step": 410721, "epoch": 2444} {"train_loss": -11.989721298217773, "global_step": 410722, "epoch": 2444} {"train_loss": -12.301298141479492, "global_step": 410723, "epoch": 2444} {"train_loss": -11.90530014038086, "global_step": 410724, "epoch": 2444} {"train_loss": -12.21323013305664, "global_step": 410725, "epoch": 2444} {"train_loss": -12.222600936889648, "global_step": 410726, "epoch": 2444} {"train_loss": -12.130298614501953, "global_step": 410727, "epoch": 2444} {"train_loss": -12.099681854248047, "global_step": 410728, "epoch": 2444} {"train_loss": -12.403621673583984, "global_step": 410729, "epoch": 2444} {"train_loss": -12.136173248291016, "global_step": 410730, "epoch": 2444} {"train_loss": -12.465478897094727, "global_step": 410731, "epoch": 2444} {"train_loss": -12.158501625061035, "global_step": 410732, "epoch": 2444} {"train_loss": -12.3212308883667, "global_step": 410733, "epoch": 2444} {"train_loss": -12.342230796813965, "global_step": 410734, "epoch": 2444} {"train_loss": -12.181205749511719, "global_step": 410735, "epoch": 2444} {"train_loss": -12.309314727783203, "global_step": 410736, "epoch": 2444} {"train_loss": -12.56072998046875, "global_step": 410737, "epoch": 2444} {"train_loss": -12.332635879516602, "global_step": 410738, "epoch": 2444} {"train_loss": -12.640426635742188, "global_step": 410739, "epoch": 2444} {"train_loss": -12.235579490661621, "global_step": 410740, "epoch": 2444} {"train_loss": -12.541449546813965, "global_step": 410741, "epoch": 2444} {"train_loss": -12.427180290222168, "global_step": 410742, "epoch": 2444} {"train_loss": -12.603277206420898, "global_step": 410743, "epoch": 2444} {"train_loss": -12.741974830627441, "global_step": 410744, "epoch": 2444} {"train_loss": -12.368387222290039, "global_step": 410745, "epoch": 2444} {"train_loss": -12.31564712524414, "global_step": 410746, "epoch": 2444} {"train_loss": -12.596853256225586, "global_step": 410747, "epoch": 2444} {"train_loss": -12.412496566772461, "global_step": 410748, "epoch": 2444} {"train_loss": -12.719083786010742, "global_step": 410749, "epoch": 2444} {"train_loss": -12.478141784667969, "global_step": 410750, "epoch": 2444} {"train_loss": -12.542165756225586, "global_step": 410751, "epoch": 2444} {"train_loss": -12.684211730957031, "global_step": 410752, "epoch": 2444} {"train_loss": -12.353885650634766, "global_step": 410753, "epoch": 2444} {"train_loss": -12.412689208984375, "global_step": 410754, "epoch": 2444} {"train_loss": -12.603143692016602, "global_step": 410755, "epoch": 2444} {"train_loss": -12.533489227294922, "global_step": 410756, "epoch": 2444} {"train_loss": -12.44509506225586, "global_step": 410757, "epoch": 2444} {"train_loss": -12.585908889770508, "global_step": 410758, "epoch": 2444} {"train_loss": -11.966166802815028, "global_step": 410759, "epoch": 2444, "val_loss": 303250.09375} {"train_loss": -12.262968063354492, "global_step": 410760, "epoch": 2445} {"train_loss": -12.394453048706055, "global_step": 410761, "epoch": 2445} {"train_loss": -12.44930362701416, "global_step": 410762, "epoch": 2445} {"train_loss": -12.293328285217285, "global_step": 410763, "epoch": 2445} {"train_loss": -12.62087345123291, "global_step": 410764, "epoch": 2445} {"train_loss": -12.532075881958008, "global_step": 410765, "epoch": 2445} {"train_loss": -12.167171478271484, "global_step": 410766, "epoch": 2445} {"train_loss": -12.108168601989746, "global_step": 410767, "epoch": 2445} {"train_loss": -12.269891738891602, "global_step": 410768, "epoch": 2445} {"train_loss": -11.999937057495117, "global_step": 410769, "epoch": 2445} {"train_loss": -11.868999481201172, "global_step": 410770, "epoch": 2445} {"train_loss": -10.937820434570312, "global_step": 410771, "epoch": 2445} {"train_loss": -12.482011795043945, "global_step": 410772, "epoch": 2445} {"train_loss": -10.194826126098633, "global_step": 410773, "epoch": 2445} {"train_loss": -11.158096313476562, "global_step": 410774, "epoch": 2445} {"train_loss": -11.081936836242676, "global_step": 410775, "epoch": 2445} {"train_loss": -10.915879249572754, "global_step": 410776, "epoch": 2445} {"train_loss": -12.005447387695312, "global_step": 410777, "epoch": 2445} {"train_loss": -11.033658981323242, "global_step": 410778, "epoch": 2445} {"train_loss": -10.213563919067383, "global_step": 410779, "epoch": 2445} {"train_loss": -11.44401741027832, "global_step": 410780, "epoch": 2445} {"train_loss": -10.641650199890137, "global_step": 410781, "epoch": 2445} {"train_loss": -10.450185775756836, "global_step": 410782, "epoch": 2445} {"train_loss": -11.701345443725586, "global_step": 410783, "epoch": 2445} {"train_loss": -10.950872421264648, "global_step": 410784, "epoch": 2445} {"train_loss": -10.971940994262695, "global_step": 410785, "epoch": 2445} {"train_loss": -11.476908683776855, "global_step": 410786, "epoch": 2445} {"train_loss": -10.409904479980469, "global_step": 410787, "epoch": 2445} {"train_loss": -11.332711219787598, "global_step": 410788, "epoch": 2445} {"train_loss": -9.748743057250977, "global_step": 410789, "epoch": 2445} {"train_loss": -10.868423461914062, "global_step": 410790, "epoch": 2445} {"train_loss": -10.133567810058594, "global_step": 410791, "epoch": 2445} {"train_loss": -11.799479484558105, "global_step": 410792, "epoch": 2445} {"train_loss": -10.72010326385498, "global_step": 410793, "epoch": 2445} {"train_loss": -11.654884338378906, "global_step": 410794, "epoch": 2445} {"train_loss": -11.328119277954102, "global_step": 410795, "epoch": 2445} {"train_loss": -10.080723762512207, "global_step": 410796, "epoch": 2445} {"train_loss": -11.57518196105957, "global_step": 410797, "epoch": 2445} {"train_loss": -9.159770965576172, "global_step": 410798, "epoch": 2445} {"train_loss": -9.97425365447998, "global_step": 410799, "epoch": 2445} {"train_loss": -10.187897682189941, "global_step": 410800, "epoch": 2445} {"train_loss": -10.255653381347656, "global_step": 410801, "epoch": 2445} {"train_loss": -11.23115348815918, "global_step": 410802, "epoch": 2445} {"train_loss": -10.101619720458984, "global_step": 410803, "epoch": 2445} {"train_loss": -10.599180221557617, "global_step": 410804, "epoch": 2445} {"train_loss": -11.376367568969727, "global_step": 410805, "epoch": 2445} {"train_loss": -11.362359046936035, "global_step": 410806, "epoch": 2445} {"train_loss": -10.298416137695312, "global_step": 410807, "epoch": 2445} {"train_loss": -11.63654613494873, "global_step": 410808, "epoch": 2445} {"train_loss": -10.78466796875, "global_step": 410809, "epoch": 2445} {"train_loss": -11.734891891479492, "global_step": 410810, "epoch": 2445} {"train_loss": -10.750509262084961, "global_step": 410811, "epoch": 2445} {"train_loss": -11.196416854858398, "global_step": 410812, "epoch": 2445} {"train_loss": -11.521100044250488, "global_step": 410813, "epoch": 2445} {"train_loss": -11.383570671081543, "global_step": 410814, "epoch": 2445} {"train_loss": -11.805253982543945, "global_step": 410815, "epoch": 2445} {"train_loss": -11.303207397460938, "global_step": 410816, "epoch": 2445} {"train_loss": -11.8643217086792, "global_step": 410817, "epoch": 2445} {"train_loss": -11.407888412475586, "global_step": 410818, "epoch": 2445} {"train_loss": -12.018270492553711, "global_step": 410819, "epoch": 2445} {"train_loss": -11.708342552185059, "global_step": 410820, "epoch": 2445} {"train_loss": -11.821512222290039, "global_step": 410821, "epoch": 2445} {"train_loss": -11.693510055541992, "global_step": 410822, "epoch": 2445} {"train_loss": -12.274177551269531, "global_step": 410823, "epoch": 2445} {"train_loss": -11.867744445800781, "global_step": 410824, "epoch": 2445} {"train_loss": -12.314790725708008, "global_step": 410825, "epoch": 2445} {"train_loss": -11.869159698486328, "global_step": 410826, "epoch": 2445} {"train_loss": -11.78950309753418, "global_step": 410827, "epoch": 2445} {"train_loss": -11.867228507995605, "global_step": 410828, "epoch": 2445} {"train_loss": -11.735273361206055, "global_step": 410829, "epoch": 2445} {"train_loss": -11.928668975830078, "global_step": 410830, "epoch": 2445} {"train_loss": -11.83907413482666, "global_step": 410831, "epoch": 2445} {"train_loss": -12.064550399780273, "global_step": 410832, "epoch": 2445} {"train_loss": -12.143104553222656, "global_step": 410833, "epoch": 2445} {"train_loss": -12.20671272277832, "global_step": 410834, "epoch": 2445} {"train_loss": -12.011006355285645, "global_step": 410835, "epoch": 2445} {"train_loss": -12.009082794189453, "global_step": 410836, "epoch": 2445} {"train_loss": -12.345014572143555, "global_step": 410837, "epoch": 2445} {"train_loss": -12.149208068847656, "global_step": 410838, "epoch": 2445} {"train_loss": -12.34250545501709, "global_step": 410839, "epoch": 2445} {"train_loss": -12.045524597167969, "global_step": 410840, "epoch": 2445} {"train_loss": -12.346415519714355, "global_step": 410841, "epoch": 2445} {"train_loss": -12.172313690185547, "global_step": 410842, "epoch": 2445} {"train_loss": -12.209112167358398, "global_step": 410843, "epoch": 2445} {"train_loss": -12.092307090759277, "global_step": 410844, "epoch": 2445} {"train_loss": -12.219046592712402, "global_step": 410845, "epoch": 2445} {"train_loss": -12.111934661865234, "global_step": 410846, "epoch": 2445} {"train_loss": -12.496203422546387, "global_step": 410847, "epoch": 2445} {"train_loss": -12.351604461669922, "global_step": 410848, "epoch": 2445} {"train_loss": -12.15426254272461, "global_step": 410849, "epoch": 2445} {"train_loss": -12.535171508789062, "global_step": 410850, "epoch": 2445} {"train_loss": -12.26345443725586, "global_step": 410851, "epoch": 2445} {"train_loss": -12.489938735961914, "global_step": 410852, "epoch": 2445} {"train_loss": -12.33909797668457, "global_step": 410853, "epoch": 2445} {"train_loss": -12.017141342163086, "global_step": 410854, "epoch": 2445} {"train_loss": -12.501226425170898, "global_step": 410855, "epoch": 2445} {"train_loss": -12.318517684936523, "global_step": 410856, "epoch": 2445} {"train_loss": -12.368755340576172, "global_step": 410857, "epoch": 2445} {"train_loss": -12.400711059570312, "global_step": 410858, "epoch": 2445} {"train_loss": -12.384340286254883, "global_step": 410859, "epoch": 2445} {"train_loss": -12.360139846801758, "global_step": 410860, "epoch": 2445} {"train_loss": -12.403829574584961, "global_step": 410861, "epoch": 2445} {"train_loss": -12.454751968383789, "global_step": 410862, "epoch": 2445} {"train_loss": -12.404375076293945, "global_step": 410863, "epoch": 2445} {"train_loss": -12.137697219848633, "global_step": 410864, "epoch": 2445} {"train_loss": -12.398962020874023, "global_step": 410865, "epoch": 2445} {"train_loss": -12.338493347167969, "global_step": 410866, "epoch": 2445} {"train_loss": -12.568490028381348, "global_step": 410867, "epoch": 2445} {"train_loss": -12.481973648071289, "global_step": 410868, "epoch": 2445} {"train_loss": -12.429704666137695, "global_step": 410869, "epoch": 2445} {"train_loss": -12.401071548461914, "global_step": 410870, "epoch": 2445} {"train_loss": -12.242825508117676, "global_step": 410871, "epoch": 2445} {"train_loss": -12.50428581237793, "global_step": 410872, "epoch": 2445} {"train_loss": -12.771984100341797, "global_step": 410873, "epoch": 2445} {"train_loss": -12.33275318145752, "global_step": 410874, "epoch": 2445} {"train_loss": -12.599990844726562, "global_step": 410875, "epoch": 2445} {"train_loss": -12.575300216674805, "global_step": 410876, "epoch": 2445} {"train_loss": -12.608470916748047, "global_step": 410877, "epoch": 2445} {"train_loss": -12.549602508544922, "global_step": 410878, "epoch": 2445} {"train_loss": -12.70602035522461, "global_step": 410879, "epoch": 2445} {"train_loss": -12.56875228881836, "global_step": 410880, "epoch": 2445} {"train_loss": -12.815766334533691, "global_step": 410881, "epoch": 2445} {"train_loss": -12.767072677612305, "global_step": 410882, "epoch": 2445} {"train_loss": -12.590814590454102, "global_step": 410883, "epoch": 2445} {"train_loss": -12.783674240112305, "global_step": 410884, "epoch": 2445} {"train_loss": -12.577005386352539, "global_step": 410885, "epoch": 2445} {"train_loss": -12.770163536071777, "global_step": 410886, "epoch": 2445} {"train_loss": -12.738815307617188, "global_step": 410887, "epoch": 2445} {"train_loss": -12.71142578125, "global_step": 410888, "epoch": 2445} {"train_loss": -12.634809494018555, "global_step": 410889, "epoch": 2445} {"train_loss": -12.750945091247559, "global_step": 410890, "epoch": 2445} {"train_loss": -12.676156997680664, "global_step": 410891, "epoch": 2445} {"train_loss": -12.834787368774414, "global_step": 410892, "epoch": 2445} {"train_loss": -12.762571334838867, "global_step": 410893, "epoch": 2445} {"train_loss": -12.727179527282715, "global_step": 410894, "epoch": 2445} {"train_loss": -12.89349365234375, "global_step": 410895, "epoch": 2445} {"train_loss": -12.850057601928711, "global_step": 410896, "epoch": 2445} {"train_loss": -12.883764266967773, "global_step": 410897, "epoch": 2445} {"train_loss": -12.498261451721191, "global_step": 410898, "epoch": 2445} {"train_loss": -12.396495819091797, "global_step": 410899, "epoch": 2445} {"train_loss": -12.679449081420898, "global_step": 410900, "epoch": 2445} {"train_loss": -12.35274887084961, "global_step": 410901, "epoch": 2445} {"train_loss": -12.053035736083984, "global_step": 410902, "epoch": 2445} {"train_loss": -12.292622566223145, "global_step": 410903, "epoch": 2445} {"train_loss": -12.589818954467773, "global_step": 410904, "epoch": 2445} {"train_loss": -12.310528755187988, "global_step": 410905, "epoch": 2445} {"train_loss": -12.155901908874512, "global_step": 410906, "epoch": 2445} {"train_loss": -12.815141677856445, "global_step": 410907, "epoch": 2445} {"train_loss": -12.503820419311523, "global_step": 410908, "epoch": 2445} {"train_loss": -12.312582969665527, "global_step": 410909, "epoch": 2445} {"train_loss": -12.856942176818848, "global_step": 410910, "epoch": 2445} {"train_loss": -11.987360000610352, "global_step": 410911, "epoch": 2445} {"train_loss": -11.604537963867188, "global_step": 410912, "epoch": 2445} {"train_loss": -12.245505332946777, "global_step": 410913, "epoch": 2445} {"train_loss": -12.703775405883789, "global_step": 410914, "epoch": 2445} {"train_loss": -11.602865219116211, "global_step": 410915, "epoch": 2445} {"train_loss": -10.544038772583008, "global_step": 410916, "epoch": 2445} {"train_loss": -12.0626802444458, "global_step": 410917, "epoch": 2445} {"train_loss": -10.47722053527832, "global_step": 410918, "epoch": 2445} {"train_loss": -11.210027694702148, "global_step": 410919, "epoch": 2445} {"train_loss": -11.438241958618164, "global_step": 410920, "epoch": 2445} {"train_loss": -11.751864433288574, "global_step": 410921, "epoch": 2445} {"train_loss": -11.913548469543457, "global_step": 410922, "epoch": 2445} {"train_loss": -11.471504211425781, "global_step": 410923, "epoch": 2445} {"train_loss": -11.42270278930664, "global_step": 410924, "epoch": 2445} {"train_loss": -10.633753776550293, "global_step": 410925, "epoch": 2445} {"train_loss": -10.849199295043945, "global_step": 410926, "epoch": 2445} {"train_loss": -11.869277301288786, "global_step": 410927, "epoch": 2445, "val_loss": 304346.96875, "train_action_mse_error": 1.897428035736084} {"train_loss": -11.354082107543945, "global_step": 410928, "epoch": 2446} {"train_loss": -11.139820098876953, "global_step": 410929, "epoch": 2446} {"train_loss": -10.57638168334961, "global_step": 410930, "epoch": 2446} {"train_loss": -11.930408477783203, "global_step": 410931, "epoch": 2446} {"train_loss": -10.695117950439453, "global_step": 410932, "epoch": 2446} {"train_loss": -10.675365447998047, "global_step": 410933, "epoch": 2446} {"train_loss": -11.474452018737793, "global_step": 410934, "epoch": 2446} {"train_loss": -10.892024993896484, "global_step": 410935, "epoch": 2446} {"train_loss": -11.993303298950195, "global_step": 410936, "epoch": 2446} {"train_loss": -11.24453353881836, "global_step": 410937, "epoch": 2446} {"train_loss": -10.586668968200684, "global_step": 410938, "epoch": 2446} {"train_loss": -11.937366485595703, "global_step": 410939, "epoch": 2446} {"train_loss": -11.119039535522461, "global_step": 410940, "epoch": 2446} {"train_loss": -11.936399459838867, "global_step": 410941, "epoch": 2446} {"train_loss": -11.676370620727539, "global_step": 410942, "epoch": 2446} {"train_loss": -11.890905380249023, "global_step": 410943, "epoch": 2446} {"train_loss": -11.81801986694336, "global_step": 410944, "epoch": 2446} {"train_loss": -11.774368286132812, "global_step": 410945, "epoch": 2446} {"train_loss": -11.201471328735352, "global_step": 410946, "epoch": 2446} {"train_loss": -11.639636993408203, "global_step": 410947, "epoch": 2446} {"train_loss": -11.478748321533203, "global_step": 410948, "epoch": 2446} {"train_loss": -11.901826858520508, "global_step": 410949, "epoch": 2446} {"train_loss": -11.668060302734375, "global_step": 410950, "epoch": 2446} {"train_loss": -12.07056999206543, "global_step": 410951, "epoch": 2446} {"train_loss": -11.859560012817383, "global_step": 410952, "epoch": 2446} {"train_loss": -12.252016067504883, "global_step": 410953, "epoch": 2446} {"train_loss": -11.727163314819336, "global_step": 410954, "epoch": 2446} {"train_loss": -12.000778198242188, "global_step": 410955, "epoch": 2446} {"train_loss": -11.753182411193848, "global_step": 410956, "epoch": 2446} {"train_loss": -12.146402359008789, "global_step": 410957, "epoch": 2446} {"train_loss": -11.857688903808594, "global_step": 410958, "epoch": 2446} {"train_loss": -11.965007781982422, "global_step": 410959, "epoch": 2446} {"train_loss": -12.023035049438477, "global_step": 410960, "epoch": 2446} {"train_loss": -12.167987823486328, "global_step": 410961, "epoch": 2446} {"train_loss": -12.03018569946289, "global_step": 410962, "epoch": 2446} {"train_loss": -12.045217514038086, "global_step": 410963, "epoch": 2446} {"train_loss": -11.955522537231445, "global_step": 410964, "epoch": 2446} {"train_loss": -11.988353729248047, "global_step": 410965, "epoch": 2446} {"train_loss": -11.745412826538086, "global_step": 410966, "epoch": 2446} {"train_loss": -11.983100891113281, "global_step": 410967, "epoch": 2446} {"train_loss": -11.574811935424805, "global_step": 410968, "epoch": 2446} {"train_loss": -11.802964210510254, "global_step": 410969, "epoch": 2446} {"train_loss": -12.396394729614258, "global_step": 410970, "epoch": 2446} {"train_loss": -11.795706748962402, "global_step": 410971, "epoch": 2446} {"train_loss": -12.010652542114258, "global_step": 410972, "epoch": 2446} {"train_loss": -11.896760940551758, "global_step": 410973, "epoch": 2446} {"train_loss": -12.128816604614258, "global_step": 410974, "epoch": 2446} {"train_loss": -11.628609657287598, "global_step": 410975, "epoch": 2446} {"train_loss": -11.934995651245117, "global_step": 410976, "epoch": 2446} {"train_loss": -12.272034645080566, "global_step": 410977, "epoch": 2446} {"train_loss": -12.167984008789062, "global_step": 410978, "epoch": 2446} {"train_loss": -12.248749732971191, "global_step": 410979, "epoch": 2446} {"train_loss": -12.462587356567383, "global_step": 410980, "epoch": 2446} {"train_loss": -12.48672103881836, "global_step": 410981, "epoch": 2446} {"train_loss": -12.169573783874512, "global_step": 410982, "epoch": 2446} {"train_loss": -12.318812370300293, "global_step": 410983, "epoch": 2446} {"train_loss": -12.342988967895508, "global_step": 410984, "epoch": 2446} {"train_loss": -12.426450729370117, "global_step": 410985, "epoch": 2446} {"train_loss": -12.446855545043945, "global_step": 410986, "epoch": 2446} {"train_loss": -12.164731979370117, "global_step": 410987, "epoch": 2446} {"train_loss": -12.707890510559082, "global_step": 410988, "epoch": 2446} {"train_loss": -12.075437545776367, "global_step": 410989, "epoch": 2446} {"train_loss": -12.254440307617188, "global_step": 410990, "epoch": 2446} {"train_loss": -12.17003059387207, "global_step": 410991, "epoch": 2446} {"train_loss": -12.390443801879883, "global_step": 410992, "epoch": 2446} {"train_loss": -12.409416198730469, "global_step": 410993, "epoch": 2446} {"train_loss": -12.30024242401123, "global_step": 410994, "epoch": 2446} {"train_loss": -12.413389205932617, "global_step": 410995, "epoch": 2446} {"train_loss": -12.338027954101562, "global_step": 410996, "epoch": 2446} {"train_loss": -12.409021377563477, "global_step": 410997, "epoch": 2446} {"train_loss": -12.428516387939453, "global_step": 410998, "epoch": 2446} {"train_loss": -12.45003890991211, "global_step": 410999, "epoch": 2446} {"train_loss": -12.480022430419922, "global_step": 411000, "epoch": 2446} {"train_loss": -12.50424575805664, "global_step": 411001, "epoch": 2446} {"train_loss": -12.52376937866211, "global_step": 411002, "epoch": 2446} {"train_loss": -12.60659122467041, "global_step": 411003, "epoch": 2446} {"train_loss": -12.357205390930176, "global_step": 411004, "epoch": 2446} {"train_loss": -12.562768936157227, "global_step": 411005, "epoch": 2446} {"train_loss": -12.682258605957031, "global_step": 411006, "epoch": 2446} {"train_loss": -12.483320236206055, "global_step": 411007, "epoch": 2446} {"train_loss": -12.672104835510254, "global_step": 411008, "epoch": 2446} {"train_loss": -12.091531753540039, "global_step": 411009, "epoch": 2446} {"train_loss": -12.481425285339355, "global_step": 411010, "epoch": 2446} {"train_loss": -12.501858711242676, "global_step": 411011, "epoch": 2446} {"train_loss": -12.36203384399414, "global_step": 411012, "epoch": 2446} {"train_loss": -12.719840049743652, "global_step": 411013, "epoch": 2446} {"train_loss": -12.556434631347656, "global_step": 411014, "epoch": 2446} {"train_loss": -11.964248657226562, "global_step": 411015, "epoch": 2446} {"train_loss": -12.26968002319336, "global_step": 411016, "epoch": 2446} {"train_loss": -12.801155090332031, "global_step": 411017, "epoch": 2446} {"train_loss": -12.497718811035156, "global_step": 411018, "epoch": 2446} {"train_loss": -12.627229690551758, "global_step": 411019, "epoch": 2446} {"train_loss": -12.583327293395996, "global_step": 411020, "epoch": 2446} {"train_loss": -12.69074821472168, "global_step": 411021, "epoch": 2446} {"train_loss": -12.428218841552734, "global_step": 411022, "epoch": 2446} {"train_loss": -12.766645431518555, "global_step": 411023, "epoch": 2446} {"train_loss": -12.416877746582031, "global_step": 411024, "epoch": 2446} {"train_loss": -12.681571960449219, "global_step": 411025, "epoch": 2446} {"train_loss": -12.636750221252441, "global_step": 411026, "epoch": 2446} {"train_loss": -12.471128463745117, "global_step": 411027, "epoch": 2446} {"train_loss": -12.45557975769043, "global_step": 411028, "epoch": 2446} {"train_loss": -12.553958892822266, "global_step": 411029, "epoch": 2446} {"train_loss": -12.161787033081055, "global_step": 411030, "epoch": 2446} {"train_loss": -12.343414306640625, "global_step": 411031, "epoch": 2446} {"train_loss": -12.537803649902344, "global_step": 411032, "epoch": 2446} {"train_loss": -12.234687805175781, "global_step": 411033, "epoch": 2446} {"train_loss": -12.071874618530273, "global_step": 411034, "epoch": 2446} {"train_loss": -12.50770092010498, "global_step": 411035, "epoch": 2446} {"train_loss": -12.77721881866455, "global_step": 411036, "epoch": 2446} {"train_loss": -12.356082916259766, "global_step": 411037, "epoch": 2446} {"train_loss": -12.672684669494629, "global_step": 411038, "epoch": 2446} {"train_loss": -12.29279899597168, "global_step": 411039, "epoch": 2446} {"train_loss": -12.590877532958984, "global_step": 411040, "epoch": 2446} {"train_loss": -12.472112655639648, "global_step": 411041, "epoch": 2446} {"train_loss": -12.637248992919922, "global_step": 411042, "epoch": 2446} {"train_loss": -11.96927261352539, "global_step": 411043, "epoch": 2446} {"train_loss": -11.530096054077148, "global_step": 411044, "epoch": 2446} {"train_loss": -12.334309577941895, "global_step": 411045, "epoch": 2446} {"train_loss": -12.476408958435059, "global_step": 411046, "epoch": 2446} {"train_loss": -11.714561462402344, "global_step": 411047, "epoch": 2446} {"train_loss": -12.526826858520508, "global_step": 411048, "epoch": 2446} {"train_loss": -11.565224647521973, "global_step": 411049, "epoch": 2446} {"train_loss": -11.958327293395996, "global_step": 411050, "epoch": 2446} {"train_loss": -11.935516357421875, "global_step": 411051, "epoch": 2446} {"train_loss": -11.799121856689453, "global_step": 411052, "epoch": 2446} {"train_loss": -11.40776252746582, "global_step": 411053, "epoch": 2446} {"train_loss": -11.896921157836914, "global_step": 411054, "epoch": 2446} {"train_loss": -9.781042098999023, "global_step": 411055, "epoch": 2446} {"train_loss": -12.78852653503418, "global_step": 411056, "epoch": 2446} {"train_loss": -10.19388198852539, "global_step": 411057, "epoch": 2446} {"train_loss": -10.710893630981445, "global_step": 411058, "epoch": 2446} {"train_loss": -11.202507019042969, "global_step": 411059, "epoch": 2446} {"train_loss": -8.484023094177246, "global_step": 411060, "epoch": 2446} {"train_loss": -9.397683143615723, "global_step": 411061, "epoch": 2446} {"train_loss": -10.054506301879883, "global_step": 411062, "epoch": 2446} {"train_loss": -10.127891540527344, "global_step": 411063, "epoch": 2446} {"train_loss": -10.649717330932617, "global_step": 411064, "epoch": 2446} {"train_loss": -7.824946403503418, "global_step": 411065, "epoch": 2446} {"train_loss": -9.88753890991211, "global_step": 411066, "epoch": 2446} {"train_loss": -8.657732009887695, "global_step": 411067, "epoch": 2446} {"train_loss": -10.532832145690918, "global_step": 411068, "epoch": 2446} {"train_loss": -8.753372192382812, "global_step": 411069, "epoch": 2446} {"train_loss": -9.877408981323242, "global_step": 411070, "epoch": 2446} {"train_loss": -9.806007385253906, "global_step": 411071, "epoch": 2446} {"train_loss": -9.14478874206543, "global_step": 411072, "epoch": 2446} {"train_loss": -9.840389251708984, "global_step": 411073, "epoch": 2446} {"train_loss": -10.600663185119629, "global_step": 411074, "epoch": 2446} {"train_loss": -9.962553024291992, "global_step": 411075, "epoch": 2446} {"train_loss": -10.736754417419434, "global_step": 411076, "epoch": 2446} {"train_loss": -10.772656440734863, "global_step": 411077, "epoch": 2446} {"train_loss": -11.487236976623535, "global_step": 411078, "epoch": 2446} {"train_loss": -11.207326889038086, "global_step": 411079, "epoch": 2446} {"train_loss": -11.215391159057617, "global_step": 411080, "epoch": 2446} {"train_loss": -10.781723976135254, "global_step": 411081, "epoch": 2446} {"train_loss": -11.562395095825195, "global_step": 411082, "epoch": 2446} {"train_loss": -11.380725860595703, "global_step": 411083, "epoch": 2446} {"train_loss": -11.543268203735352, "global_step": 411084, "epoch": 2446} {"train_loss": -11.41940689086914, "global_step": 411085, "epoch": 2446} {"train_loss": -11.98225212097168, "global_step": 411086, "epoch": 2446} {"train_loss": -11.523241996765137, "global_step": 411087, "epoch": 2446} {"train_loss": -11.52751350402832, "global_step": 411088, "epoch": 2446} {"train_loss": -11.332019805908203, "global_step": 411089, "epoch": 2446} {"train_loss": -11.704875946044922, "global_step": 411090, "epoch": 2446} {"train_loss": -11.430994033813477, "global_step": 411091, "epoch": 2446} {"train_loss": -12.191863059997559, "global_step": 411092, "epoch": 2446} {"train_loss": -11.87177848815918, "global_step": 411093, "epoch": 2446} {"train_loss": -11.405876159667969, "global_step": 411094, "epoch": 2446} {"train_loss": -11.752342031115578, "global_step": 411095, "epoch": 2446, "val_loss": 301259.03125} {"train_loss": -11.771957397460938, "global_step": 411096, "epoch": 2447} {"train_loss": -11.710039138793945, "global_step": 411097, "epoch": 2447} {"train_loss": -11.940186500549316, "global_step": 411098, "epoch": 2447} {"train_loss": -11.720285415649414, "global_step": 411099, "epoch": 2447} {"train_loss": -11.893339157104492, "global_step": 411100, "epoch": 2447} {"train_loss": -11.744342803955078, "global_step": 411101, "epoch": 2447} {"train_loss": -12.02789306640625, "global_step": 411102, "epoch": 2447} {"train_loss": -12.011775016784668, "global_step": 411103, "epoch": 2447} {"train_loss": -11.78264045715332, "global_step": 411104, "epoch": 2447} {"train_loss": -11.819435119628906, "global_step": 411105, "epoch": 2447} {"train_loss": -12.2149658203125, "global_step": 411106, "epoch": 2447} {"train_loss": -12.045328140258789, "global_step": 411107, "epoch": 2447} {"train_loss": -12.145214080810547, "global_step": 411108, "epoch": 2447} {"train_loss": -12.047086715698242, "global_step": 411109, "epoch": 2447} {"train_loss": -11.721481323242188, "global_step": 411110, "epoch": 2447} {"train_loss": -12.071294784545898, "global_step": 411111, "epoch": 2447} {"train_loss": -11.421478271484375, "global_step": 411112, "epoch": 2447} {"train_loss": -11.61918830871582, "global_step": 411113, "epoch": 2447} {"train_loss": -11.716422080993652, "global_step": 411114, "epoch": 2447} {"train_loss": -11.516195297241211, "global_step": 411115, "epoch": 2447} {"train_loss": -11.924009323120117, "global_step": 411116, "epoch": 2447} {"train_loss": -11.699106216430664, "global_step": 411117, "epoch": 2447} {"train_loss": -11.99893569946289, "global_step": 411118, "epoch": 2447} {"train_loss": -11.508453369140625, "global_step": 411119, "epoch": 2447} {"train_loss": -11.971762657165527, "global_step": 411120, "epoch": 2447} {"train_loss": -12.192420959472656, "global_step": 411121, "epoch": 2447} {"train_loss": -11.836697578430176, "global_step": 411122, "epoch": 2447} {"train_loss": -12.101175308227539, "global_step": 411123, "epoch": 2447} {"train_loss": -11.625356674194336, "global_step": 411124, "epoch": 2447} {"train_loss": -12.216296195983887, "global_step": 411125, "epoch": 2447} {"train_loss": -11.821382522583008, "global_step": 411126, "epoch": 2447} {"train_loss": -12.325904846191406, "global_step": 411127, "epoch": 2447} {"train_loss": -11.764720916748047, "global_step": 411128, "epoch": 2447} {"train_loss": -12.210578918457031, "global_step": 411129, "epoch": 2447} {"train_loss": -11.792694091796875, "global_step": 411130, "epoch": 2447} {"train_loss": -12.117247581481934, "global_step": 411131, "epoch": 2447} {"train_loss": -12.13679313659668, "global_step": 411132, "epoch": 2447} {"train_loss": -11.758697509765625, "global_step": 411133, "epoch": 2447} {"train_loss": -12.35307502746582, "global_step": 411134, "epoch": 2447} {"train_loss": -11.950788497924805, "global_step": 411135, "epoch": 2447} {"train_loss": -11.943769454956055, "global_step": 411136, "epoch": 2447} {"train_loss": -11.86964225769043, "global_step": 411137, "epoch": 2447} {"train_loss": -11.680620193481445, "global_step": 411138, "epoch": 2447} {"train_loss": -12.38350772857666, "global_step": 411139, "epoch": 2447} {"train_loss": -12.035934448242188, "global_step": 411140, "epoch": 2447} {"train_loss": -12.148172378540039, "global_step": 411141, "epoch": 2447} {"train_loss": -12.15462875366211, "global_step": 411142, "epoch": 2447} {"train_loss": -11.487606048583984, "global_step": 411143, "epoch": 2447} {"train_loss": -12.383672714233398, "global_step": 411144, "epoch": 2447} {"train_loss": -11.38666820526123, "global_step": 411145, "epoch": 2447} {"train_loss": -11.937776565551758, "global_step": 411146, "epoch": 2447} {"train_loss": -11.796537399291992, "global_step": 411147, "epoch": 2447} {"train_loss": -11.795320510864258, "global_step": 411148, "epoch": 2447} {"train_loss": -12.125347137451172, "global_step": 411149, "epoch": 2447} {"train_loss": -11.355335235595703, "global_step": 411150, "epoch": 2447} {"train_loss": -11.935575485229492, "global_step": 411151, "epoch": 2447} {"train_loss": -12.142478942871094, "global_step": 411152, "epoch": 2447} {"train_loss": -11.765922546386719, "global_step": 411153, "epoch": 2447} {"train_loss": -12.233976364135742, "global_step": 411154, "epoch": 2447} {"train_loss": -11.977483749389648, "global_step": 411155, "epoch": 2447} {"train_loss": -12.111621856689453, "global_step": 411156, "epoch": 2447} {"train_loss": -12.410642623901367, "global_step": 411157, "epoch": 2447} {"train_loss": -11.736005783081055, "global_step": 411158, "epoch": 2447} {"train_loss": -12.411017417907715, "global_step": 411159, "epoch": 2447} {"train_loss": -11.626508712768555, "global_step": 411160, "epoch": 2447} {"train_loss": -11.98587703704834, "global_step": 411161, "epoch": 2447} {"train_loss": -11.156356811523438, "global_step": 411162, "epoch": 2447} {"train_loss": -11.787532806396484, "global_step": 411163, "epoch": 2447} {"train_loss": -11.71059799194336, "global_step": 411164, "epoch": 2447} {"train_loss": -11.644649505615234, "global_step": 411165, "epoch": 2447} {"train_loss": -12.114688873291016, "global_step": 411166, "epoch": 2447} {"train_loss": -11.214376449584961, "global_step": 411167, "epoch": 2447} {"train_loss": -12.163875579833984, "global_step": 411168, "epoch": 2447} {"train_loss": -12.09267807006836, "global_step": 411169, "epoch": 2447} {"train_loss": -12.065281867980957, "global_step": 411170, "epoch": 2447} {"train_loss": -12.082073211669922, "global_step": 411171, "epoch": 2447} {"train_loss": -12.364574432373047, "global_step": 411172, "epoch": 2447} {"train_loss": -12.217367172241211, "global_step": 411173, "epoch": 2447} {"train_loss": -11.735666275024414, "global_step": 411174, "epoch": 2447} {"train_loss": -12.516407012939453, "global_step": 411175, "epoch": 2447} {"train_loss": -11.873638153076172, "global_step": 411176, "epoch": 2447} {"train_loss": -12.554864883422852, "global_step": 411177, "epoch": 2447} {"train_loss": -12.003318786621094, "global_step": 411178, "epoch": 2447} {"train_loss": -12.549066543579102, "global_step": 411179, "epoch": 2447} {"train_loss": -12.350325584411621, "global_step": 411180, "epoch": 2447} {"train_loss": -12.436254501342773, "global_step": 411181, "epoch": 2447} {"train_loss": -12.627130508422852, "global_step": 411182, "epoch": 2447} {"train_loss": -12.486095428466797, "global_step": 411183, "epoch": 2447} {"train_loss": -12.206571578979492, "global_step": 411184, "epoch": 2447} {"train_loss": -12.421371459960938, "global_step": 411185, "epoch": 2447} {"train_loss": -12.290939331054688, "global_step": 411186, "epoch": 2447} {"train_loss": -12.608024597167969, "global_step": 411187, "epoch": 2447} {"train_loss": -12.216911315917969, "global_step": 411188, "epoch": 2447} {"train_loss": -12.46898078918457, "global_step": 411189, "epoch": 2447} {"train_loss": -12.325498580932617, "global_step": 411190, "epoch": 2447} {"train_loss": -12.68893814086914, "global_step": 411191, "epoch": 2447} {"train_loss": -12.360143661499023, "global_step": 411192, "epoch": 2447} {"train_loss": -11.891469955444336, "global_step": 411193, "epoch": 2447} {"train_loss": -12.483756065368652, "global_step": 411194, "epoch": 2447} {"train_loss": -11.851852416992188, "global_step": 411195, "epoch": 2447} {"train_loss": -12.148402214050293, "global_step": 411196, "epoch": 2447} {"train_loss": -12.382431030273438, "global_step": 411197, "epoch": 2447} {"train_loss": -12.420849800109863, "global_step": 411198, "epoch": 2447} {"train_loss": -12.511234283447266, "global_step": 411199, "epoch": 2447} {"train_loss": -12.380648612976074, "global_step": 411200, "epoch": 2447} {"train_loss": -12.23040771484375, "global_step": 411201, "epoch": 2447} {"train_loss": -12.465274810791016, "global_step": 411202, "epoch": 2447} {"train_loss": -12.19554328918457, "global_step": 411203, "epoch": 2447} {"train_loss": -12.420822143554688, "global_step": 411204, "epoch": 2447} {"train_loss": -12.32404899597168, "global_step": 411205, "epoch": 2447} {"train_loss": -12.601999282836914, "global_step": 411206, "epoch": 2447} {"train_loss": -12.137002944946289, "global_step": 411207, "epoch": 2447} {"train_loss": -12.167880058288574, "global_step": 411208, "epoch": 2447} {"train_loss": -12.386433601379395, "global_step": 411209, "epoch": 2447} {"train_loss": -12.397674560546875, "global_step": 411210, "epoch": 2447} {"train_loss": -12.531394958496094, "global_step": 411211, "epoch": 2447} {"train_loss": -12.601789474487305, "global_step": 411212, "epoch": 2447} {"train_loss": -12.352828979492188, "global_step": 411213, "epoch": 2447} {"train_loss": -12.534805297851562, "global_step": 411214, "epoch": 2447} {"train_loss": -12.559610366821289, "global_step": 411215, "epoch": 2447} {"train_loss": -12.302850723266602, "global_step": 411216, "epoch": 2447} {"train_loss": -12.108319282531738, "global_step": 411217, "epoch": 2447} {"train_loss": -12.745915412902832, "global_step": 411218, "epoch": 2447} {"train_loss": -12.388790130615234, "global_step": 411219, "epoch": 2447} {"train_loss": -12.566944122314453, "global_step": 411220, "epoch": 2447} {"train_loss": -12.312739372253418, "global_step": 411221, "epoch": 2447} {"train_loss": -12.59775447845459, "global_step": 411222, "epoch": 2447} {"train_loss": -11.898066520690918, "global_step": 411223, "epoch": 2447} {"train_loss": -12.6070556640625, "global_step": 411224, "epoch": 2447} {"train_loss": -12.019261360168457, "global_step": 411225, "epoch": 2447} {"train_loss": -12.611953735351562, "global_step": 411226, "epoch": 2447} {"train_loss": -11.949139595031738, "global_step": 411227, "epoch": 2447} {"train_loss": -12.061187744140625, "global_step": 411228, "epoch": 2447} {"train_loss": -11.769057273864746, "global_step": 411229, "epoch": 2447} {"train_loss": -11.300378799438477, "global_step": 411230, "epoch": 2447} {"train_loss": -12.206609725952148, "global_step": 411231, "epoch": 2447} {"train_loss": -11.812040328979492, "global_step": 411232, "epoch": 2447} {"train_loss": -11.042838096618652, "global_step": 411233, "epoch": 2447} {"train_loss": -11.985487937927246, "global_step": 411234, "epoch": 2447} {"train_loss": -12.263636589050293, "global_step": 411235, "epoch": 2447} {"train_loss": -11.68847370147705, "global_step": 411236, "epoch": 2447} {"train_loss": -12.077710151672363, "global_step": 411237, "epoch": 2447} {"train_loss": -12.354212760925293, "global_step": 411238, "epoch": 2447} {"train_loss": -12.37711238861084, "global_step": 411239, "epoch": 2447} {"train_loss": -11.912126541137695, "global_step": 411240, "epoch": 2447} {"train_loss": -12.485523223876953, "global_step": 411241, "epoch": 2447} {"train_loss": -11.693185806274414, "global_step": 411242, "epoch": 2447} {"train_loss": -12.044811248779297, "global_step": 411243, "epoch": 2447} {"train_loss": -11.970766067504883, "global_step": 411244, "epoch": 2447} {"train_loss": -12.23442554473877, "global_step": 411245, "epoch": 2447} {"train_loss": -11.92492961883545, "global_step": 411246, "epoch": 2447} {"train_loss": -12.094497680664062, "global_step": 411247, "epoch": 2447} {"train_loss": -12.045589447021484, "global_step": 411248, "epoch": 2447} {"train_loss": -12.43265151977539, "global_step": 411249, "epoch": 2447} {"train_loss": -11.830524444580078, "global_step": 411250, "epoch": 2447} {"train_loss": -12.365723609924316, "global_step": 411251, "epoch": 2447} {"train_loss": -11.83670711517334, "global_step": 411252, "epoch": 2447} {"train_loss": -12.40980339050293, "global_step": 411253, "epoch": 2447} {"train_loss": -11.855669021606445, "global_step": 411254, "epoch": 2447} {"train_loss": -12.27475357055664, "global_step": 411255, "epoch": 2447} {"train_loss": -12.289953231811523, "global_step": 411256, "epoch": 2447} {"train_loss": -12.24502182006836, "global_step": 411257, "epoch": 2447} {"train_loss": -12.318056106567383, "global_step": 411258, "epoch": 2447} {"train_loss": -12.701379776000977, "global_step": 411259, "epoch": 2447} {"train_loss": -11.88753890991211, "global_step": 411260, "epoch": 2447} {"train_loss": -12.68117618560791, "global_step": 411261, "epoch": 2447} {"train_loss": -12.175657272338867, "global_step": 411262, "epoch": 2447} {"train_loss": -12.087927290371486, "global_step": 411263, "epoch": 2447, "val_loss": 308445.59375} {"train_loss": -12.673471450805664, "global_step": 411264, "epoch": 2448} {"train_loss": -12.31016731262207, "global_step": 411265, "epoch": 2448} {"train_loss": -12.423650741577148, "global_step": 411266, "epoch": 2448} {"train_loss": -12.413700103759766, "global_step": 411267, "epoch": 2448} {"train_loss": -12.046930313110352, "global_step": 411268, "epoch": 2448} {"train_loss": -12.110366821289062, "global_step": 411269, "epoch": 2448} {"train_loss": -12.617883682250977, "global_step": 411270, "epoch": 2448} {"train_loss": -12.223257064819336, "global_step": 411271, "epoch": 2448} {"train_loss": -12.497039794921875, "global_step": 411272, "epoch": 2448} {"train_loss": -12.425607681274414, "global_step": 411273, "epoch": 2448} {"train_loss": -12.566463470458984, "global_step": 411274, "epoch": 2448} {"train_loss": -12.539762496948242, "global_step": 411275, "epoch": 2448} {"train_loss": -12.008155822753906, "global_step": 411276, "epoch": 2448} {"train_loss": -12.431528091430664, "global_step": 411277, "epoch": 2448} {"train_loss": -12.25560188293457, "global_step": 411278, "epoch": 2448} {"train_loss": -12.622505187988281, "global_step": 411279, "epoch": 2448} {"train_loss": -12.230388641357422, "global_step": 411280, "epoch": 2448} {"train_loss": -12.315635681152344, "global_step": 411281, "epoch": 2448} {"train_loss": -12.381759643554688, "global_step": 411282, "epoch": 2448} {"train_loss": -12.428694725036621, "global_step": 411283, "epoch": 2448} {"train_loss": -12.700965881347656, "global_step": 411284, "epoch": 2448} {"train_loss": -12.255666732788086, "global_step": 411285, "epoch": 2448} {"train_loss": -12.628141403198242, "global_step": 411286, "epoch": 2448} {"train_loss": -12.493446350097656, "global_step": 411287, "epoch": 2448} {"train_loss": -12.242239952087402, "global_step": 411288, "epoch": 2448} {"train_loss": -12.59627914428711, "global_step": 411289, "epoch": 2448} {"train_loss": -11.954456329345703, "global_step": 411290, "epoch": 2448} {"train_loss": -12.304887771606445, "global_step": 411291, "epoch": 2448} {"train_loss": -12.306329727172852, "global_step": 411292, "epoch": 2448} {"train_loss": -12.121709823608398, "global_step": 411293, "epoch": 2448} {"train_loss": -12.555731773376465, "global_step": 411294, "epoch": 2448} {"train_loss": -12.386984825134277, "global_step": 411295, "epoch": 2448} {"train_loss": -11.837727546691895, "global_step": 411296, "epoch": 2448} {"train_loss": -12.030192375183105, "global_step": 411297, "epoch": 2448} {"train_loss": -12.52584457397461, "global_step": 411298, "epoch": 2448} {"train_loss": -11.912203788757324, "global_step": 411299, "epoch": 2448} {"train_loss": -12.281194686889648, "global_step": 411300, "epoch": 2448} {"train_loss": -12.433361053466797, "global_step": 411301, "epoch": 2448} {"train_loss": -12.14210033416748, "global_step": 411302, "epoch": 2448} {"train_loss": -12.161096572875977, "global_step": 411303, "epoch": 2448} {"train_loss": -12.357715606689453, "global_step": 411304, "epoch": 2448} {"train_loss": -11.810617446899414, "global_step": 411305, "epoch": 2448} {"train_loss": -12.500889778137207, "global_step": 411306, "epoch": 2448} {"train_loss": -11.869425773620605, "global_step": 411307, "epoch": 2448} {"train_loss": -11.440980911254883, "global_step": 411308, "epoch": 2448} {"train_loss": -12.023980140686035, "global_step": 411309, "epoch": 2448} {"train_loss": -12.03840446472168, "global_step": 411310, "epoch": 2448} {"train_loss": -11.818178176879883, "global_step": 411311, "epoch": 2448} {"train_loss": -12.346341133117676, "global_step": 411312, "epoch": 2448} {"train_loss": -11.59890079498291, "global_step": 411313, "epoch": 2448} {"train_loss": -12.17892837524414, "global_step": 411314, "epoch": 2448} {"train_loss": -11.984047889709473, "global_step": 411315, "epoch": 2448} {"train_loss": -11.422733306884766, "global_step": 411316, "epoch": 2448} {"train_loss": -12.267618179321289, "global_step": 411317, "epoch": 2448} {"train_loss": -11.71291732788086, "global_step": 411318, "epoch": 2448} {"train_loss": -12.209716796875, "global_step": 411319, "epoch": 2448} {"train_loss": -11.814132690429688, "global_step": 411320, "epoch": 2448} {"train_loss": -11.52894401550293, "global_step": 411321, "epoch": 2448} {"train_loss": -12.252788543701172, "global_step": 411322, "epoch": 2448} {"train_loss": -11.952980041503906, "global_step": 411323, "epoch": 2448} {"train_loss": -12.207839965820312, "global_step": 411324, "epoch": 2448} {"train_loss": -12.307649612426758, "global_step": 411325, "epoch": 2448} {"train_loss": -12.288545608520508, "global_step": 411326, "epoch": 2448} {"train_loss": -12.252264976501465, "global_step": 411327, "epoch": 2448} {"train_loss": -11.930501937866211, "global_step": 411328, "epoch": 2448} {"train_loss": -12.124889373779297, "global_step": 411329, "epoch": 2448} {"train_loss": -12.573711395263672, "global_step": 411330, "epoch": 2448} {"train_loss": -12.143043518066406, "global_step": 411331, "epoch": 2448} {"train_loss": -12.315340042114258, "global_step": 411332, "epoch": 2448} {"train_loss": -12.668792724609375, "global_step": 411333, "epoch": 2448} {"train_loss": -12.236157417297363, "global_step": 411334, "epoch": 2448} {"train_loss": -12.040757179260254, "global_step": 411335, "epoch": 2448} {"train_loss": -12.002402305603027, "global_step": 411336, "epoch": 2448} {"train_loss": -11.582865715026855, "global_step": 411337, "epoch": 2448} {"train_loss": -12.253633499145508, "global_step": 411338, "epoch": 2448} {"train_loss": -12.182586669921875, "global_step": 411339, "epoch": 2448} {"train_loss": -9.461015701293945, "global_step": 411340, "epoch": 2448} {"train_loss": -11.632339477539062, "global_step": 411341, "epoch": 2448} {"train_loss": -9.954254150390625, "global_step": 411342, "epoch": 2448} {"train_loss": -9.956300735473633, "global_step": 411343, "epoch": 2448} {"train_loss": -8.622669219970703, "global_step": 411344, "epoch": 2448} {"train_loss": -11.112951278686523, "global_step": 411345, "epoch": 2448} {"train_loss": -7.600009918212891, "global_step": 411346, "epoch": 2448} {"train_loss": -7.3589324951171875, "global_step": 411347, "epoch": 2448} {"train_loss": -8.360321044921875, "global_step": 411348, "epoch": 2448} {"train_loss": -8.664877891540527, "global_step": 411349, "epoch": 2448} {"train_loss": -9.093668937683105, "global_step": 411350, "epoch": 2448} {"train_loss": -9.689009666442871, "global_step": 411351, "epoch": 2448} {"train_loss": -10.74026870727539, "global_step": 411352, "epoch": 2448} {"train_loss": -8.750167846679688, "global_step": 411353, "epoch": 2448} {"train_loss": -9.773143768310547, "global_step": 411354, "epoch": 2448} {"train_loss": -9.73634147644043, "global_step": 411355, "epoch": 2448} {"train_loss": -9.228679656982422, "global_step": 411356, "epoch": 2448} {"train_loss": -9.761683464050293, "global_step": 411357, "epoch": 2448} {"train_loss": -11.180140495300293, "global_step": 411358, "epoch": 2448} {"train_loss": -8.98514175415039, "global_step": 411359, "epoch": 2448} {"train_loss": -8.133914947509766, "global_step": 411360, "epoch": 2448} {"train_loss": -8.963855743408203, "global_step": 411361, "epoch": 2448} {"train_loss": -9.666437149047852, "global_step": 411362, "epoch": 2448} {"train_loss": -9.003782272338867, "global_step": 411363, "epoch": 2448} {"train_loss": -9.717504501342773, "global_step": 411364, "epoch": 2448} {"train_loss": -10.250572204589844, "global_step": 411365, "epoch": 2448} {"train_loss": -10.435871124267578, "global_step": 411366, "epoch": 2448} {"train_loss": -10.008932113647461, "global_step": 411367, "epoch": 2448} {"train_loss": -11.013646125793457, "global_step": 411368, "epoch": 2448} {"train_loss": -11.653497695922852, "global_step": 411369, "epoch": 2448} {"train_loss": -10.57010555267334, "global_step": 411370, "epoch": 2448} {"train_loss": -11.609331130981445, "global_step": 411371, "epoch": 2448} {"train_loss": -11.20096206665039, "global_step": 411372, "epoch": 2448} {"train_loss": -10.644365310668945, "global_step": 411373, "epoch": 2448} {"train_loss": -11.754542350769043, "global_step": 411374, "epoch": 2448} {"train_loss": -11.31014633178711, "global_step": 411375, "epoch": 2448} {"train_loss": -11.875664710998535, "global_step": 411376, "epoch": 2448} {"train_loss": -11.168983459472656, "global_step": 411377, "epoch": 2448} {"train_loss": -11.566703796386719, "global_step": 411378, "epoch": 2448} {"train_loss": -11.448553085327148, "global_step": 411379, "epoch": 2448} {"train_loss": -11.60566234588623, "global_step": 411380, "epoch": 2448} {"train_loss": -11.429985046386719, "global_step": 411381, "epoch": 2448} {"train_loss": -11.67791748046875, "global_step": 411382, "epoch": 2448} {"train_loss": -11.613798141479492, "global_step": 411383, "epoch": 2448} {"train_loss": -12.194585800170898, "global_step": 411384, "epoch": 2448} {"train_loss": -11.962251663208008, "global_step": 411385, "epoch": 2448} {"train_loss": -12.0892333984375, "global_step": 411386, "epoch": 2448} {"train_loss": -11.879352569580078, "global_step": 411387, "epoch": 2448} {"train_loss": -11.929960250854492, "global_step": 411388, "epoch": 2448} {"train_loss": -12.13949203491211, "global_step": 411389, "epoch": 2448} {"train_loss": -11.677566528320312, "global_step": 411390, "epoch": 2448} {"train_loss": -12.075803756713867, "global_step": 411391, "epoch": 2448} {"train_loss": -11.948721885681152, "global_step": 411392, "epoch": 2448} {"train_loss": -12.360039710998535, "global_step": 411393, "epoch": 2448} {"train_loss": -12.041732788085938, "global_step": 411394, "epoch": 2448} {"train_loss": -11.979036331176758, "global_step": 411395, "epoch": 2448} {"train_loss": -12.203313827514648, "global_step": 411396, "epoch": 2448} {"train_loss": -11.987478256225586, "global_step": 411397, "epoch": 2448} {"train_loss": -11.952001571655273, "global_step": 411398, "epoch": 2448} {"train_loss": -12.231619834899902, "global_step": 411399, "epoch": 2448} {"train_loss": -11.781129837036133, "global_step": 411400, "epoch": 2448} {"train_loss": -12.21281623840332, "global_step": 411401, "epoch": 2448} {"train_loss": -12.384392738342285, "global_step": 411402, "epoch": 2448} {"train_loss": -11.907365798950195, "global_step": 411403, "epoch": 2448} {"train_loss": -12.248099327087402, "global_step": 411404, "epoch": 2448} {"train_loss": -12.235176086425781, "global_step": 411405, "epoch": 2448} {"train_loss": -12.30431842803955, "global_step": 411406, "epoch": 2448} {"train_loss": -12.190780639648438, "global_step": 411407, "epoch": 2448} {"train_loss": -12.11206340789795, "global_step": 411408, "epoch": 2448} {"train_loss": -12.012508392333984, "global_step": 411409, "epoch": 2448} {"train_loss": -12.330594062805176, "global_step": 411410, "epoch": 2448} {"train_loss": -12.010108947753906, "global_step": 411411, "epoch": 2448} {"train_loss": -12.111597061157227, "global_step": 411412, "epoch": 2448} {"train_loss": -12.156686782836914, "global_step": 411413, "epoch": 2448} {"train_loss": -12.531885147094727, "global_step": 411414, "epoch": 2448} {"train_loss": -12.403648376464844, "global_step": 411415, "epoch": 2448} {"train_loss": -12.30558967590332, "global_step": 411416, "epoch": 2448} {"train_loss": -12.120588302612305, "global_step": 411417, "epoch": 2448} {"train_loss": -12.412689208984375, "global_step": 411418, "epoch": 2448} {"train_loss": -12.212203979492188, "global_step": 411419, "epoch": 2448} {"train_loss": -12.490619659423828, "global_step": 411420, "epoch": 2448} {"train_loss": -12.243408203125, "global_step": 411421, "epoch": 2448} {"train_loss": -12.365160942077637, "global_step": 411422, "epoch": 2448} {"train_loss": -12.262618064880371, "global_step": 411423, "epoch": 2448} {"train_loss": -12.534109115600586, "global_step": 411424, "epoch": 2448} {"train_loss": -12.305177688598633, "global_step": 411425, "epoch": 2448} {"train_loss": -12.43138313293457, "global_step": 411426, "epoch": 2448} {"train_loss": -12.538415908813477, "global_step": 411427, "epoch": 2448} {"train_loss": -12.50349235534668, "global_step": 411428, "epoch": 2448} {"train_loss": -12.461187362670898, "global_step": 411429, "epoch": 2448} {"train_loss": -12.654256820678711, "global_step": 411430, "epoch": 2448} {"train_loss": -11.67515967005775, "global_step": 411431, "epoch": 2448, "val_loss": 302986.03125} {"train_loss": -12.507312774658203, "global_step": 411432, "epoch": 2449} {"train_loss": -12.60313606262207, "global_step": 411433, "epoch": 2449} {"train_loss": -12.530652046203613, "global_step": 411434, "epoch": 2449} {"train_loss": -12.460792541503906, "global_step": 411435, "epoch": 2449} {"train_loss": -12.67024040222168, "global_step": 411436, "epoch": 2449} {"train_loss": -12.269391059875488, "global_step": 411437, "epoch": 2449} {"train_loss": -12.616247177124023, "global_step": 411438, "epoch": 2449} {"train_loss": -12.379830360412598, "global_step": 411439, "epoch": 2449} {"train_loss": -12.551092147827148, "global_step": 411440, "epoch": 2449} {"train_loss": -12.562520980834961, "global_step": 411441, "epoch": 2449} {"train_loss": -12.500190734863281, "global_step": 411442, "epoch": 2449} {"train_loss": -12.52003002166748, "global_step": 411443, "epoch": 2449} {"train_loss": -12.52004623413086, "global_step": 411444, "epoch": 2449} {"train_loss": -12.251375198364258, "global_step": 411445, "epoch": 2449} {"train_loss": -12.797338485717773, "global_step": 411446, "epoch": 2449} {"train_loss": -12.245296478271484, "global_step": 411447, "epoch": 2449} {"train_loss": -12.65342903137207, "global_step": 411448, "epoch": 2449} {"train_loss": -12.423669815063477, "global_step": 411449, "epoch": 2449} {"train_loss": -12.577059745788574, "global_step": 411450, "epoch": 2449} {"train_loss": -12.024762153625488, "global_step": 411451, "epoch": 2449} {"train_loss": -12.560032844543457, "global_step": 411452, "epoch": 2449} {"train_loss": -12.561110496520996, "global_step": 411453, "epoch": 2449} {"train_loss": -12.488179206848145, "global_step": 411454, "epoch": 2449} {"train_loss": -12.69716739654541, "global_step": 411455, "epoch": 2449} {"train_loss": -12.407478332519531, "global_step": 411456, "epoch": 2449} {"train_loss": -12.539434432983398, "global_step": 411457, "epoch": 2449} {"train_loss": -12.460790634155273, "global_step": 411458, "epoch": 2449} {"train_loss": -12.660138130187988, "global_step": 411459, "epoch": 2449} {"train_loss": -12.195334434509277, "global_step": 411460, "epoch": 2449} {"train_loss": -12.271856307983398, "global_step": 411461, "epoch": 2449} {"train_loss": -12.641737937927246, "global_step": 411462, "epoch": 2449} {"train_loss": -12.698894500732422, "global_step": 411463, "epoch": 2449} {"train_loss": -11.937911987304688, "global_step": 411464, "epoch": 2449} {"train_loss": -12.184236526489258, "global_step": 411465, "epoch": 2449} {"train_loss": -12.470723152160645, "global_step": 411466, "epoch": 2449} {"train_loss": -11.674346923828125, "global_step": 411467, "epoch": 2449} {"train_loss": -10.961838722229004, "global_step": 411468, "epoch": 2449} {"train_loss": -11.798585891723633, "global_step": 411469, "epoch": 2449} {"train_loss": -12.482133865356445, "global_step": 411470, "epoch": 2449} {"train_loss": -12.032442092895508, "global_step": 411471, "epoch": 2449} {"train_loss": -12.726913452148438, "global_step": 411472, "epoch": 2449} {"train_loss": -11.980813026428223, "global_step": 411473, "epoch": 2449} {"train_loss": -11.269875526428223, "global_step": 411474, "epoch": 2449} {"train_loss": -12.369377136230469, "global_step": 411475, "epoch": 2449} {"train_loss": -11.871088981628418, "global_step": 411476, "epoch": 2449} {"train_loss": -10.592498779296875, "global_step": 411477, "epoch": 2449} {"train_loss": -12.135024070739746, "global_step": 411478, "epoch": 2449} {"train_loss": -12.287306785583496, "global_step": 411479, "epoch": 2449} {"train_loss": -11.705817222595215, "global_step": 411480, "epoch": 2449} {"train_loss": -12.384220123291016, "global_step": 411481, "epoch": 2449} {"train_loss": -12.400240898132324, "global_step": 411482, "epoch": 2449} {"train_loss": -11.860183715820312, "global_step": 411483, "epoch": 2449} {"train_loss": -12.103132247924805, "global_step": 411484, "epoch": 2449} {"train_loss": -12.500127792358398, "global_step": 411485, "epoch": 2449} {"train_loss": -12.359148979187012, "global_step": 411486, "epoch": 2449} {"train_loss": -11.67140007019043, "global_step": 411487, "epoch": 2449} {"train_loss": -11.610737800598145, "global_step": 411488, "epoch": 2449} {"train_loss": -12.629389762878418, "global_step": 411489, "epoch": 2449} {"train_loss": -11.652303695678711, "global_step": 411490, "epoch": 2449} {"train_loss": -12.393026351928711, "global_step": 411491, "epoch": 2449} {"train_loss": -11.957271575927734, "global_step": 411492, "epoch": 2449} {"train_loss": -11.47376823425293, "global_step": 411493, "epoch": 2449} {"train_loss": -12.2548828125, "global_step": 411494, "epoch": 2449} {"train_loss": -11.513246536254883, "global_step": 411495, "epoch": 2449} {"train_loss": -12.075210571289062, "global_step": 411496, "epoch": 2449} {"train_loss": -12.117267608642578, "global_step": 411497, "epoch": 2449} {"train_loss": -12.532407760620117, "global_step": 411498, "epoch": 2449} {"train_loss": -11.980295181274414, "global_step": 411499, "epoch": 2449} {"train_loss": -11.761676788330078, "global_step": 411500, "epoch": 2449} {"train_loss": -12.460248947143555, "global_step": 411501, "epoch": 2449} {"train_loss": -11.670276641845703, "global_step": 411502, "epoch": 2449} {"train_loss": -12.373588562011719, "global_step": 411503, "epoch": 2449} {"train_loss": -12.373976707458496, "global_step": 411504, "epoch": 2449} {"train_loss": -12.363227844238281, "global_step": 411505, "epoch": 2449} {"train_loss": -12.122491836547852, "global_step": 411506, "epoch": 2449} {"train_loss": -12.346086502075195, "global_step": 411507, "epoch": 2449} {"train_loss": -11.441153526306152, "global_step": 411508, "epoch": 2449} {"train_loss": -12.423856735229492, "global_step": 411509, "epoch": 2449} {"train_loss": -12.076699256896973, "global_step": 411510, "epoch": 2449} {"train_loss": -12.379776000976562, "global_step": 411511, "epoch": 2449} {"train_loss": -12.27637004852295, "global_step": 411512, "epoch": 2449} {"train_loss": -12.502994537353516, "global_step": 411513, "epoch": 2449} {"train_loss": -12.195590019226074, "global_step": 411514, "epoch": 2449} {"train_loss": -11.803182601928711, "global_step": 411515, "epoch": 2449} {"train_loss": -12.239311218261719, "global_step": 411516, "epoch": 2449} {"train_loss": -11.997912406921387, "global_step": 411517, "epoch": 2449} {"train_loss": -12.063163757324219, "global_step": 411518, "epoch": 2449} {"train_loss": -12.536741256713867, "global_step": 411519, "epoch": 2449} {"train_loss": -11.772214889526367, "global_step": 411520, "epoch": 2449} {"train_loss": -12.28422737121582, "global_step": 411521, "epoch": 2449} {"train_loss": -12.015707015991211, "global_step": 411522, "epoch": 2449} {"train_loss": -11.612430572509766, "global_step": 411523, "epoch": 2449} {"train_loss": -12.09372329711914, "global_step": 411524, "epoch": 2449} {"train_loss": -11.104089736938477, "global_step": 411525, "epoch": 2449} {"train_loss": -12.2749662399292, "global_step": 411526, "epoch": 2449} {"train_loss": -12.468656539916992, "global_step": 411527, "epoch": 2449} {"train_loss": -11.67751407623291, "global_step": 411528, "epoch": 2449} {"train_loss": -12.278871536254883, "global_step": 411529, "epoch": 2449} {"train_loss": -11.215606689453125, "global_step": 411530, "epoch": 2449} {"train_loss": -12.07536506652832, "global_step": 411531, "epoch": 2449} {"train_loss": -11.774885177612305, "global_step": 411532, "epoch": 2449} {"train_loss": -11.574508666992188, "global_step": 411533, "epoch": 2449} {"train_loss": -11.785948753356934, "global_step": 411534, "epoch": 2449} {"train_loss": -11.871341705322266, "global_step": 411535, "epoch": 2449} {"train_loss": -11.00613784790039, "global_step": 411536, "epoch": 2449} {"train_loss": -12.273937225341797, "global_step": 411537, "epoch": 2449} {"train_loss": -10.537026405334473, "global_step": 411538, "epoch": 2449} {"train_loss": -12.218961715698242, "global_step": 411539, "epoch": 2449} {"train_loss": -12.091623306274414, "global_step": 411540, "epoch": 2449} {"train_loss": -11.68163776397705, "global_step": 411541, "epoch": 2449} {"train_loss": -12.290192604064941, "global_step": 411542, "epoch": 2449} {"train_loss": -10.656845092773438, "global_step": 411543, "epoch": 2449} {"train_loss": -12.410764694213867, "global_step": 411544, "epoch": 2449} {"train_loss": -11.12364673614502, "global_step": 411545, "epoch": 2449} {"train_loss": -12.44293212890625, "global_step": 411546, "epoch": 2449} {"train_loss": -11.622997283935547, "global_step": 411547, "epoch": 2449} {"train_loss": -11.871631622314453, "global_step": 411548, "epoch": 2449} {"train_loss": -11.994791984558105, "global_step": 411549, "epoch": 2449} {"train_loss": -11.7130708694458, "global_step": 411550, "epoch": 2449} {"train_loss": -12.047260284423828, "global_step": 411551, "epoch": 2449} {"train_loss": -11.559589385986328, "global_step": 411552, "epoch": 2449} {"train_loss": -12.181982040405273, "global_step": 411553, "epoch": 2449} {"train_loss": -11.30196762084961, "global_step": 411554, "epoch": 2449} {"train_loss": -11.844667434692383, "global_step": 411555, "epoch": 2449} {"train_loss": -11.92232608795166, "global_step": 411556, "epoch": 2449} {"train_loss": -11.716835021972656, "global_step": 411557, "epoch": 2449} {"train_loss": -12.620391845703125, "global_step": 411558, "epoch": 2449} {"train_loss": -12.132264137268066, "global_step": 411559, "epoch": 2449} {"train_loss": -12.580021858215332, "global_step": 411560, "epoch": 2449} {"train_loss": -12.141305923461914, "global_step": 411561, "epoch": 2449} {"train_loss": -12.126035690307617, "global_step": 411562, "epoch": 2449} {"train_loss": -12.530912399291992, "global_step": 411563, "epoch": 2449} {"train_loss": -11.770975112915039, "global_step": 411564, "epoch": 2449} {"train_loss": -12.685286521911621, "global_step": 411565, "epoch": 2449} {"train_loss": -12.10118293762207, "global_step": 411566, "epoch": 2449} {"train_loss": -12.334814071655273, "global_step": 411567, "epoch": 2449} {"train_loss": -12.076805114746094, "global_step": 411568, "epoch": 2449} {"train_loss": -12.39961051940918, "global_step": 411569, "epoch": 2449} {"train_loss": -12.39764404296875, "global_step": 411570, "epoch": 2449} {"train_loss": -11.816339492797852, "global_step": 411571, "epoch": 2449} {"train_loss": -12.579164505004883, "global_step": 411572, "epoch": 2449} {"train_loss": -12.114004135131836, "global_step": 411573, "epoch": 2449} {"train_loss": -12.492321014404297, "global_step": 411574, "epoch": 2449} {"train_loss": -12.238619804382324, "global_step": 411575, "epoch": 2449} {"train_loss": -12.041226387023926, "global_step": 411576, "epoch": 2449} {"train_loss": -12.402281761169434, "global_step": 411577, "epoch": 2449} {"train_loss": -12.268547058105469, "global_step": 411578, "epoch": 2449} {"train_loss": -12.051759719848633, "global_step": 411579, "epoch": 2449} {"train_loss": -12.473718643188477, "global_step": 411580, "epoch": 2449} {"train_loss": -11.839370727539062, "global_step": 411581, "epoch": 2449} {"train_loss": -12.148504257202148, "global_step": 411582, "epoch": 2449} {"train_loss": -12.146474838256836, "global_step": 411583, "epoch": 2449} {"train_loss": -12.25910472869873, "global_step": 411584, "epoch": 2449} {"train_loss": -12.240715980529785, "global_step": 411585, "epoch": 2449} {"train_loss": -12.273881912231445, "global_step": 411586, "epoch": 2449} {"train_loss": -12.220524787902832, "global_step": 411587, "epoch": 2449} {"train_loss": -12.6793851852417, "global_step": 411588, "epoch": 2449} {"train_loss": -12.033796310424805, "global_step": 411589, "epoch": 2449} {"train_loss": -12.636107444763184, "global_step": 411590, "epoch": 2449} {"train_loss": -11.928387641906738, "global_step": 411591, "epoch": 2449} {"train_loss": -12.518562316894531, "global_step": 411592, "epoch": 2449} {"train_loss": -11.931397438049316, "global_step": 411593, "epoch": 2449} {"train_loss": -12.338184356689453, "global_step": 411594, "epoch": 2449} {"train_loss": -12.025020599365234, "global_step": 411595, "epoch": 2449} {"train_loss": -12.458499908447266, "global_step": 411596, "epoch": 2449} {"train_loss": -12.622072219848633, "global_step": 411597, "epoch": 2449} {"train_loss": -11.591729164123535, "global_step": 411598, "epoch": 2449} {"train_loss": -12.125502126557487, "global_step": 411599, "epoch": 2449, "val_loss": 303334.34375} {"train_loss": -12.076955795288086, "global_step": 411600, "epoch": 2450} {"train_loss": -12.165135383605957, "global_step": 411601, "epoch": 2450} {"train_loss": -11.167218208312988, "global_step": 411602, "epoch": 2450} {"train_loss": -11.053045272827148, "global_step": 411603, "epoch": 2450} {"train_loss": -11.02694320678711, "global_step": 411604, "epoch": 2450} {"train_loss": -10.62673282623291, "global_step": 411605, "epoch": 2450} {"train_loss": -10.064523696899414, "global_step": 411606, "epoch": 2450} {"train_loss": -9.317317962646484, "global_step": 411607, "epoch": 2450} {"train_loss": -11.199918746948242, "global_step": 411608, "epoch": 2450} {"train_loss": -10.370499610900879, "global_step": 411609, "epoch": 2450} {"train_loss": -9.943008422851562, "global_step": 411610, "epoch": 2450} {"train_loss": -11.117637634277344, "global_step": 411611, "epoch": 2450} {"train_loss": -9.748258590698242, "global_step": 411612, "epoch": 2450} {"train_loss": -10.450931549072266, "global_step": 411613, "epoch": 2450} {"train_loss": -11.168923377990723, "global_step": 411614, "epoch": 2450} {"train_loss": -10.697484016418457, "global_step": 411615, "epoch": 2450} {"train_loss": -11.133417129516602, "global_step": 411616, "epoch": 2450} {"train_loss": -11.64404296875, "global_step": 411617, "epoch": 2450} {"train_loss": -11.214164733886719, "global_step": 411618, "epoch": 2450} {"train_loss": -11.406177520751953, "global_step": 411619, "epoch": 2450} {"train_loss": -11.565164566040039, "global_step": 411620, "epoch": 2450} {"train_loss": -11.860681533813477, "global_step": 411621, "epoch": 2450} {"train_loss": -11.355230331420898, "global_step": 411622, "epoch": 2450} {"train_loss": -12.17253589630127, "global_step": 411623, "epoch": 2450} {"train_loss": -11.396629333496094, "global_step": 411624, "epoch": 2450} {"train_loss": -11.92794132232666, "global_step": 411625, "epoch": 2450} {"train_loss": -12.005544662475586, "global_step": 411626, "epoch": 2450} {"train_loss": -11.645898818969727, "global_step": 411627, "epoch": 2450} {"train_loss": -11.587420463562012, "global_step": 411628, "epoch": 2450} {"train_loss": -11.5960693359375, "global_step": 411629, "epoch": 2450} {"train_loss": -11.444265365600586, "global_step": 411630, "epoch": 2450} {"train_loss": -11.309524536132812, "global_step": 411631, "epoch": 2450} {"train_loss": -12.414997100830078, "global_step": 411632, "epoch": 2450} {"train_loss": -11.499095916748047, "global_step": 411633, "epoch": 2450} {"train_loss": -11.745071411132812, "global_step": 411634, "epoch": 2450} {"train_loss": -12.210461616516113, "global_step": 411635, "epoch": 2450} {"train_loss": -11.602289199829102, "global_step": 411636, "epoch": 2450} {"train_loss": -12.052104949951172, "global_step": 411637, "epoch": 2450} {"train_loss": -11.53435230255127, "global_step": 411638, "epoch": 2450} {"train_loss": -12.016949653625488, "global_step": 411639, "epoch": 2450} {"train_loss": -11.979762077331543, "global_step": 411640, "epoch": 2450} {"train_loss": -11.890027046203613, "global_step": 411641, "epoch": 2450} {"train_loss": -12.229736328125, "global_step": 411642, "epoch": 2450} {"train_loss": -11.94775676727295, "global_step": 411643, "epoch": 2450} {"train_loss": -12.16059398651123, "global_step": 411644, "epoch": 2450} {"train_loss": -12.26974105834961, "global_step": 411645, "epoch": 2450} {"train_loss": -11.959752082824707, "global_step": 411646, "epoch": 2450} {"train_loss": -12.503458023071289, "global_step": 411647, "epoch": 2450} {"train_loss": -11.945505142211914, "global_step": 411648, "epoch": 2450} {"train_loss": -12.321874618530273, "global_step": 411649, "epoch": 2450} {"train_loss": -12.396662712097168, "global_step": 411650, "epoch": 2450} {"train_loss": -12.395610809326172, "global_step": 411651, "epoch": 2450} {"train_loss": -12.334291458129883, "global_step": 411652, "epoch": 2450} {"train_loss": -12.135537147521973, "global_step": 411653, "epoch": 2450} {"train_loss": -12.310940742492676, "global_step": 411654, "epoch": 2450} {"train_loss": -12.503595352172852, "global_step": 411655, "epoch": 2450} {"train_loss": -12.3294677734375, "global_step": 411656, "epoch": 2450} {"train_loss": -12.594913482666016, "global_step": 411657, "epoch": 2450} {"train_loss": -12.422516822814941, "global_step": 411658, "epoch": 2450} {"train_loss": -12.32950496673584, "global_step": 411659, "epoch": 2450} {"train_loss": -12.421847343444824, "global_step": 411660, "epoch": 2450} {"train_loss": -12.241530418395996, "global_step": 411661, "epoch": 2450} {"train_loss": -12.596960067749023, "global_step": 411662, "epoch": 2450} {"train_loss": -12.612066268920898, "global_step": 411663, "epoch": 2450} {"train_loss": -12.357552528381348, "global_step": 411664, "epoch": 2450} {"train_loss": -12.335936546325684, "global_step": 411665, "epoch": 2450} {"train_loss": -12.40326976776123, "global_step": 411666, "epoch": 2450} {"train_loss": -12.357511520385742, "global_step": 411667, "epoch": 2450} {"train_loss": -12.269147872924805, "global_step": 411668, "epoch": 2450} {"train_loss": -12.369510650634766, "global_step": 411669, "epoch": 2450} {"train_loss": -12.481742858886719, "global_step": 411670, "epoch": 2450} {"train_loss": -12.167106628417969, "global_step": 411671, "epoch": 2450} {"train_loss": -12.762566566467285, "global_step": 411672, "epoch": 2450} {"train_loss": -12.65102767944336, "global_step": 411673, "epoch": 2450} {"train_loss": -12.419855117797852, "global_step": 411674, "epoch": 2450} {"train_loss": -12.619354248046875, "global_step": 411675, "epoch": 2450} {"train_loss": -12.357513427734375, "global_step": 411676, "epoch": 2450} {"train_loss": -12.551958084106445, "global_step": 411677, "epoch": 2450} {"train_loss": -12.703880310058594, "global_step": 411678, "epoch": 2450} {"train_loss": -12.57925796508789, "global_step": 411679, "epoch": 2450} {"train_loss": -12.549959182739258, "global_step": 411680, "epoch": 2450} {"train_loss": -12.53682804107666, "global_step": 411681, "epoch": 2450} {"train_loss": -12.311431884765625, "global_step": 411682, "epoch": 2450} {"train_loss": -12.463048934936523, "global_step": 411683, "epoch": 2450} {"train_loss": -12.485733032226562, "global_step": 411684, "epoch": 2450} {"train_loss": -12.812657356262207, "global_step": 411685, "epoch": 2450} {"train_loss": -12.215065002441406, "global_step": 411686, "epoch": 2450} {"train_loss": -11.687702178955078, "global_step": 411687, "epoch": 2450} {"train_loss": -12.406095504760742, "global_step": 411688, "epoch": 2450} {"train_loss": -12.00468635559082, "global_step": 411689, "epoch": 2450} {"train_loss": -12.377279281616211, "global_step": 411690, "epoch": 2450} {"train_loss": -12.268049240112305, "global_step": 411691, "epoch": 2450} {"train_loss": -12.517486572265625, "global_step": 411692, "epoch": 2450} {"train_loss": -12.642784118652344, "global_step": 411693, "epoch": 2450} {"train_loss": -12.421821594238281, "global_step": 411694, "epoch": 2450} {"train_loss": -12.562337875366211, "global_step": 411695, "epoch": 2450} {"train_loss": -12.294454574584961, "global_step": 411696, "epoch": 2450} {"train_loss": -12.253149032592773, "global_step": 411697, "epoch": 2450} {"train_loss": -12.112579345703125, "global_step": 411698, "epoch": 2450} {"train_loss": -12.26198673248291, "global_step": 411699, "epoch": 2450} {"train_loss": -12.384851455688477, "global_step": 411700, "epoch": 2450} {"train_loss": -12.677738189697266, "global_step": 411701, "epoch": 2450} {"train_loss": -12.386981964111328, "global_step": 411702, "epoch": 2450} {"train_loss": -12.499906539916992, "global_step": 411703, "epoch": 2450} {"train_loss": -12.68189811706543, "global_step": 411704, "epoch": 2450} {"train_loss": -12.786627769470215, "global_step": 411705, "epoch": 2450} {"train_loss": -12.606306076049805, "global_step": 411706, "epoch": 2450} {"train_loss": -12.776191711425781, "global_step": 411707, "epoch": 2450} {"train_loss": -12.723352432250977, "global_step": 411708, "epoch": 2450} {"train_loss": -12.479669570922852, "global_step": 411709, "epoch": 2450} {"train_loss": -12.564483642578125, "global_step": 411710, "epoch": 2450} {"train_loss": -12.625090599060059, "global_step": 411711, "epoch": 2450} {"train_loss": -12.633930206298828, "global_step": 411712, "epoch": 2450} {"train_loss": -12.7788724899292, "global_step": 411713, "epoch": 2450} {"train_loss": -12.737569808959961, "global_step": 411714, "epoch": 2450} {"train_loss": -12.5107421875, "global_step": 411715, "epoch": 2450} {"train_loss": -12.522746086120605, "global_step": 411716, "epoch": 2450} {"train_loss": -12.54572582244873, "global_step": 411717, "epoch": 2450} {"train_loss": -12.661943435668945, "global_step": 411718, "epoch": 2450} {"train_loss": -12.481935501098633, "global_step": 411719, "epoch": 2450} {"train_loss": -12.43704605102539, "global_step": 411720, "epoch": 2450} {"train_loss": -12.683297157287598, "global_step": 411721, "epoch": 2450} {"train_loss": -12.353346824645996, "global_step": 411722, "epoch": 2450} {"train_loss": -12.353679656982422, "global_step": 411723, "epoch": 2450} {"train_loss": -12.651189804077148, "global_step": 411724, "epoch": 2450} {"train_loss": -12.751630783081055, "global_step": 411725, "epoch": 2450} {"train_loss": -12.615814208984375, "global_step": 411726, "epoch": 2450} {"train_loss": -12.58732795715332, "global_step": 411727, "epoch": 2450} {"train_loss": -12.547529220581055, "global_step": 411728, "epoch": 2450} {"train_loss": -12.731746673583984, "global_step": 411729, "epoch": 2450} {"train_loss": -12.690366744995117, "global_step": 411730, "epoch": 2450} {"train_loss": -12.454596519470215, "global_step": 411731, "epoch": 2450} {"train_loss": -12.432144165039062, "global_step": 411732, "epoch": 2450} {"train_loss": -12.535175323486328, "global_step": 411733, "epoch": 2450} {"train_loss": -12.340018272399902, "global_step": 411734, "epoch": 2450} {"train_loss": -12.178794860839844, "global_step": 411735, "epoch": 2450} {"train_loss": -12.484487533569336, "global_step": 411736, "epoch": 2450} {"train_loss": -12.124553680419922, "global_step": 411737, "epoch": 2450} {"train_loss": -11.651107788085938, "global_step": 411738, "epoch": 2450} {"train_loss": -12.325353622436523, "global_step": 411739, "epoch": 2450} {"train_loss": -11.694978713989258, "global_step": 411740, "epoch": 2450} {"train_loss": -12.270491600036621, "global_step": 411741, "epoch": 2450} {"train_loss": -11.440427780151367, "global_step": 411742, "epoch": 2450} {"train_loss": -12.232645988464355, "global_step": 411743, "epoch": 2450} {"train_loss": -11.270835876464844, "global_step": 411744, "epoch": 2450} {"train_loss": -12.241351127624512, "global_step": 411745, "epoch": 2450} {"train_loss": -11.626348495483398, "global_step": 411746, "epoch": 2450} {"train_loss": -12.43232536315918, "global_step": 411747, "epoch": 2450} {"train_loss": -10.869503021240234, "global_step": 411748, "epoch": 2450} {"train_loss": -12.33958625793457, "global_step": 411749, "epoch": 2450} {"train_loss": -11.05815601348877, "global_step": 411750, "epoch": 2450} {"train_loss": -11.811054229736328, "global_step": 411751, "epoch": 2450} {"train_loss": -12.209748268127441, "global_step": 411752, "epoch": 2450} {"train_loss": -10.8042573928833, "global_step": 411753, "epoch": 2450} {"train_loss": -12.1201171875, "global_step": 411754, "epoch": 2450} {"train_loss": -10.873010635375977, "global_step": 411755, "epoch": 2450} {"train_loss": -11.558021545410156, "global_step": 411756, "epoch": 2450} {"train_loss": -11.275712966918945, "global_step": 411757, "epoch": 2450} {"train_loss": -11.155176162719727, "global_step": 411758, "epoch": 2450} {"train_loss": -12.047503471374512, "global_step": 411759, "epoch": 2450} {"train_loss": -11.480208396911621, "global_step": 411760, "epoch": 2450} {"train_loss": -11.276595115661621, "global_step": 411761, "epoch": 2450} {"train_loss": -12.262664794921875, "global_step": 411762, "epoch": 2450} {"train_loss": -11.246522903442383, "global_step": 411763, "epoch": 2450} {"train_loss": -11.339635848999023, "global_step": 411764, "epoch": 2450} {"train_loss": -11.855646133422852, "global_step": 411765, "epoch": 2450} {"train_loss": -10.914318084716797, "global_step": 411766, "epoch": 2450} {"train_loss": -12.018692538851784, "global_step": 411767, "epoch": 2450, "train/sim_max_reward_0": 0.6521605507482454, "train/sim_max_reward_1": 0.9059616877994353, "train/sim_max_reward_2": 0.00015813048283176156, "train/sim_max_reward_3": 0.4485309135675642, "train/sim_max_reward_4": 0.9955973559547882, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.938177238686307, "test/sim_max_reward_4400002": 0.9296308154970675, "test/sim_max_reward_4400003": 0.4357591795874207, "test/sim_max_reward_4400004": 0.4150437230054585, "test/sim_max_reward_4400005": 0.9298727081004498, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.5645550125724847, "test/sim_max_reward_4400008": 0.6003999994488537, "test/sim_max_reward_4400009": 0.34690675667710624, "test/sim_max_reward_4400010": 0.4153054753196813, "test/sim_max_reward_4400011": 0.994074559767647, "test/sim_max_reward_4400012": 0.6575349958217023, "test/sim_max_reward_4400013": 0.9942260178612229, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 0.1286854514096604, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9961976676478779, "test/sim_max_reward_4400019": 0.18140992009933063, "test/sim_max_reward_4400020": 0.002534617308416769, "test/sim_max_reward_4400021": 0.689355435922514, "test/sim_max_reward_4400022": 0.9851621439132477, "test/sim_max_reward_4400023": 0.14258387005671122, "test/sim_max_reward_4400024": 0.17834392960191142, "test/sim_max_reward_4400025": 0.6291828557560275, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.16714866995500502, "test/sim_max_reward_4400028": 0.6836469316582636, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.963779482547582, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.6941704959475984, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.3673052903770062, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.2992604852659244, "test/sim_max_reward_4400039": 0.4117816013553648, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.061163853542357365, "test/sim_max_reward_4400042": 0.9798027418315081, "test/sim_max_reward_4400043": 0.19357440895696978, "test/sim_max_reward_4400044": 0.5195679398426024, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.3213241779460734, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6670681064254774, "test/mean_score": 0.5220358807531876, "val_loss": 305420.40625, "train_action_mse_error": 1.1072139739990234} {"train_loss": -11.422296524047852, "global_step": 411768, "epoch": 2451} {"train_loss": -8.988594055175781, "global_step": 411769, "epoch": 2451} {"train_loss": -9.144268989562988, "global_step": 411770, "epoch": 2451} {"train_loss": -9.738037109375, "global_step": 411771, "epoch": 2451} {"train_loss": -10.536090850830078, "global_step": 411772, "epoch": 2451} {"train_loss": -10.229812622070312, "global_step": 411773, "epoch": 2451} {"train_loss": -9.714278221130371, "global_step": 411774, "epoch": 2451} {"train_loss": -11.873104095458984, "global_step": 411775, "epoch": 2451} {"train_loss": -10.52066421508789, "global_step": 411776, "epoch": 2451} {"train_loss": -11.103008270263672, "global_step": 411777, "epoch": 2451} {"train_loss": -10.543659210205078, "global_step": 411778, "epoch": 2451} {"train_loss": -11.018875122070312, "global_step": 411779, "epoch": 2451} {"train_loss": -9.331707000732422, "global_step": 411780, "epoch": 2451} {"train_loss": -10.09695053100586, "global_step": 411781, "epoch": 2451} {"train_loss": -8.499038696289062, "global_step": 411782, "epoch": 2451} {"train_loss": -10.566732406616211, "global_step": 411783, "epoch": 2451} {"train_loss": -10.049241065979004, "global_step": 411784, "epoch": 2451} {"train_loss": -10.464717864990234, "global_step": 411785, "epoch": 2451} {"train_loss": -11.12116813659668, "global_step": 411786, "epoch": 2451} {"train_loss": -10.249444961547852, "global_step": 411787, "epoch": 2451} {"train_loss": -9.561431884765625, "global_step": 411788, "epoch": 2451} {"train_loss": -10.589485168457031, "global_step": 411789, "epoch": 2451} {"train_loss": -10.924762725830078, "global_step": 411790, "epoch": 2451} {"train_loss": -10.720539093017578, "global_step": 411791, "epoch": 2451} {"train_loss": -10.818206787109375, "global_step": 411792, "epoch": 2451} {"train_loss": -11.62063217163086, "global_step": 411793, "epoch": 2451} {"train_loss": -11.402443885803223, "global_step": 411794, "epoch": 2451} {"train_loss": -11.94489574432373, "global_step": 411795, "epoch": 2451} {"train_loss": -11.540288925170898, "global_step": 411796, "epoch": 2451} {"train_loss": -11.528754234313965, "global_step": 411797, "epoch": 2451} {"train_loss": -11.408472061157227, "global_step": 411798, "epoch": 2451} {"train_loss": -11.633066177368164, "global_step": 411799, "epoch": 2451} {"train_loss": -11.787473678588867, "global_step": 411800, "epoch": 2451} {"train_loss": -11.846503257751465, "global_step": 411801, "epoch": 2451} {"train_loss": -11.623600006103516, "global_step": 411802, "epoch": 2451} {"train_loss": -11.63920783996582, "global_step": 411803, "epoch": 2451} {"train_loss": -11.610342025756836, "global_step": 411804, "epoch": 2451} {"train_loss": -12.029704093933105, "global_step": 411805, "epoch": 2451} {"train_loss": -11.496376037597656, "global_step": 411806, "epoch": 2451} {"train_loss": -11.648996353149414, "global_step": 411807, "epoch": 2451} {"train_loss": -11.70705509185791, "global_step": 411808, "epoch": 2451} {"train_loss": -11.36158561706543, "global_step": 411809, "epoch": 2451} {"train_loss": -11.368926048278809, "global_step": 411810, "epoch": 2451} {"train_loss": -11.761297225952148, "global_step": 411811, "epoch": 2451} {"train_loss": -11.694116592407227, "global_step": 411812, "epoch": 2451} {"train_loss": -11.83821964263916, "global_step": 411813, "epoch": 2451} {"train_loss": -12.197019577026367, "global_step": 411814, "epoch": 2451} {"train_loss": -11.540023803710938, "global_step": 411815, "epoch": 2451} {"train_loss": -11.912593841552734, "global_step": 411816, "epoch": 2451} {"train_loss": -11.731077194213867, "global_step": 411817, "epoch": 2451} {"train_loss": -11.726431846618652, "global_step": 411818, "epoch": 2451} {"train_loss": -12.197738647460938, "global_step": 411819, "epoch": 2451} {"train_loss": -11.841005325317383, "global_step": 411820, "epoch": 2451} {"train_loss": -11.645723342895508, "global_step": 411821, "epoch": 2451} {"train_loss": -11.983180046081543, "global_step": 411822, "epoch": 2451} {"train_loss": -11.880592346191406, "global_step": 411823, "epoch": 2451} {"train_loss": -11.805437088012695, "global_step": 411824, "epoch": 2451} {"train_loss": -12.256930351257324, "global_step": 411825, "epoch": 2451} {"train_loss": -11.881890296936035, "global_step": 411826, "epoch": 2451} {"train_loss": -12.07736587524414, "global_step": 411827, "epoch": 2451} {"train_loss": -12.135335922241211, "global_step": 411828, "epoch": 2451} {"train_loss": -11.872973442077637, "global_step": 411829, "epoch": 2451} {"train_loss": -12.217082977294922, "global_step": 411830, "epoch": 2451} {"train_loss": -12.00832748413086, "global_step": 411831, "epoch": 2451} {"train_loss": -12.098047256469727, "global_step": 411832, "epoch": 2451} {"train_loss": -11.933609008789062, "global_step": 411833, "epoch": 2451} {"train_loss": -12.077165603637695, "global_step": 411834, "epoch": 2451} {"train_loss": -12.109169960021973, "global_step": 411835, "epoch": 2451} {"train_loss": -11.684378623962402, "global_step": 411836, "epoch": 2451} {"train_loss": -12.120870590209961, "global_step": 411837, "epoch": 2451} {"train_loss": -11.349222183227539, "global_step": 411838, "epoch": 2451} {"train_loss": -12.279516220092773, "global_step": 411839, "epoch": 2451} {"train_loss": -12.060523986816406, "global_step": 411840, "epoch": 2451} {"train_loss": -12.296932220458984, "global_step": 411841, "epoch": 2451} {"train_loss": -11.842947006225586, "global_step": 411842, "epoch": 2451} {"train_loss": -12.115443229675293, "global_step": 411843, "epoch": 2451} {"train_loss": -12.077091217041016, "global_step": 411844, "epoch": 2451} {"train_loss": -12.403446197509766, "global_step": 411845, "epoch": 2451} {"train_loss": -12.167370796203613, "global_step": 411846, "epoch": 2451} {"train_loss": -11.900050163269043, "global_step": 411847, "epoch": 2451} {"train_loss": -12.310518264770508, "global_step": 411848, "epoch": 2451} {"train_loss": -11.984508514404297, "global_step": 411849, "epoch": 2451} {"train_loss": -12.314546585083008, "global_step": 411850, "epoch": 2451} {"train_loss": -12.162105560302734, "global_step": 411851, "epoch": 2451} {"train_loss": -12.27492618560791, "global_step": 411852, "epoch": 2451} {"train_loss": -12.285606384277344, "global_step": 411853, "epoch": 2451} {"train_loss": -12.518686294555664, "global_step": 411854, "epoch": 2451} {"train_loss": -12.179769515991211, "global_step": 411855, "epoch": 2451} {"train_loss": -12.429483413696289, "global_step": 411856, "epoch": 2451} {"train_loss": -12.08047103881836, "global_step": 411857, "epoch": 2451} {"train_loss": -12.18899154663086, "global_step": 411858, "epoch": 2451} {"train_loss": -12.307629585266113, "global_step": 411859, "epoch": 2451} {"train_loss": -12.306812286376953, "global_step": 411860, "epoch": 2451} {"train_loss": -12.32308578491211, "global_step": 411861, "epoch": 2451} {"train_loss": -12.372751235961914, "global_step": 411862, "epoch": 2451} {"train_loss": -12.075008392333984, "global_step": 411863, "epoch": 2451} {"train_loss": -12.40818977355957, "global_step": 411864, "epoch": 2451} {"train_loss": -12.25232219696045, "global_step": 411865, "epoch": 2451} {"train_loss": -11.718639373779297, "global_step": 411866, "epoch": 2451} {"train_loss": -12.68154525756836, "global_step": 411867, "epoch": 2451} {"train_loss": -12.153474807739258, "global_step": 411868, "epoch": 2451} {"train_loss": -11.83276081085205, "global_step": 411869, "epoch": 2451} {"train_loss": -11.701309204101562, "global_step": 411870, "epoch": 2451} {"train_loss": -12.362054824829102, "global_step": 411871, "epoch": 2451} {"train_loss": -11.672411918640137, "global_step": 411872, "epoch": 2451} {"train_loss": -12.239551544189453, "global_step": 411873, "epoch": 2451} {"train_loss": -11.786123275756836, "global_step": 411874, "epoch": 2451} {"train_loss": -12.438154220581055, "global_step": 411875, "epoch": 2451} {"train_loss": -11.83720588684082, "global_step": 411876, "epoch": 2451} {"train_loss": -12.381155014038086, "global_step": 411877, "epoch": 2451} {"train_loss": -12.076376914978027, "global_step": 411878, "epoch": 2451} {"train_loss": -12.411271095275879, "global_step": 411879, "epoch": 2451} {"train_loss": -12.487648010253906, "global_step": 411880, "epoch": 2451} {"train_loss": -12.207075119018555, "global_step": 411881, "epoch": 2451} {"train_loss": -12.317340850830078, "global_step": 411882, "epoch": 2451} {"train_loss": -12.647138595581055, "global_step": 411883, "epoch": 2451} {"train_loss": -12.12491226196289, "global_step": 411884, "epoch": 2451} {"train_loss": -12.075653076171875, "global_step": 411885, "epoch": 2451} {"train_loss": -12.48676872253418, "global_step": 411886, "epoch": 2451} {"train_loss": -12.590780258178711, "global_step": 411887, "epoch": 2451} {"train_loss": -12.047185897827148, "global_step": 411888, "epoch": 2451} {"train_loss": -12.46353816986084, "global_step": 411889, "epoch": 2451} {"train_loss": -12.305789947509766, "global_step": 411890, "epoch": 2451} {"train_loss": -11.42385196685791, "global_step": 411891, "epoch": 2451} {"train_loss": -11.822612762451172, "global_step": 411892, "epoch": 2451} {"train_loss": -12.204631805419922, "global_step": 411893, "epoch": 2451} {"train_loss": -11.087778091430664, "global_step": 411894, "epoch": 2451} {"train_loss": -10.77096939086914, "global_step": 411895, "epoch": 2451} {"train_loss": -12.431656837463379, "global_step": 411896, "epoch": 2451} {"train_loss": -11.782831192016602, "global_step": 411897, "epoch": 2451} {"train_loss": -11.762823104858398, "global_step": 411898, "epoch": 2451} {"train_loss": -11.90689468383789, "global_step": 411899, "epoch": 2451} {"train_loss": -11.376367568969727, "global_step": 411900, "epoch": 2451} {"train_loss": -11.409563064575195, "global_step": 411901, "epoch": 2451} {"train_loss": -12.039271354675293, "global_step": 411902, "epoch": 2451} {"train_loss": -10.54798412322998, "global_step": 411903, "epoch": 2451} {"train_loss": -10.744773864746094, "global_step": 411904, "epoch": 2451} {"train_loss": -12.285675048828125, "global_step": 411905, "epoch": 2451} {"train_loss": -10.589818954467773, "global_step": 411906, "epoch": 2451} {"train_loss": -11.878093719482422, "global_step": 411907, "epoch": 2451} {"train_loss": -11.460693359375, "global_step": 411908, "epoch": 2451} {"train_loss": -11.417327880859375, "global_step": 411909, "epoch": 2451} {"train_loss": -11.722288131713867, "global_step": 411910, "epoch": 2451} {"train_loss": -10.563692092895508, "global_step": 411911, "epoch": 2451} {"train_loss": -11.99199104309082, "global_step": 411912, "epoch": 2451} {"train_loss": -11.654253005981445, "global_step": 411913, "epoch": 2451} {"train_loss": -10.6266450881958, "global_step": 411914, "epoch": 2451} {"train_loss": -11.571361541748047, "global_step": 411915, "epoch": 2451} {"train_loss": -10.950737953186035, "global_step": 411916, "epoch": 2451} {"train_loss": -11.177519798278809, "global_step": 411917, "epoch": 2451} {"train_loss": -12.120664596557617, "global_step": 411918, "epoch": 2451} {"train_loss": -10.259916305541992, "global_step": 411919, "epoch": 2451} {"train_loss": -12.050788879394531, "global_step": 411920, "epoch": 2451} {"train_loss": -11.064641952514648, "global_step": 411921, "epoch": 2451} {"train_loss": -11.9881010055542, "global_step": 411922, "epoch": 2451} {"train_loss": -11.281505584716797, "global_step": 411923, "epoch": 2451} {"train_loss": -11.938423156738281, "global_step": 411924, "epoch": 2451} {"train_loss": -11.707818984985352, "global_step": 411925, "epoch": 2451} {"train_loss": -11.899909973144531, "global_step": 411926, "epoch": 2451} {"train_loss": -12.002203941345215, "global_step": 411927, "epoch": 2451} {"train_loss": -11.684566497802734, "global_step": 411928, "epoch": 2451} {"train_loss": -12.218746185302734, "global_step": 411929, "epoch": 2451} {"train_loss": -12.391268730163574, "global_step": 411930, "epoch": 2451} {"train_loss": -11.706944465637207, "global_step": 411931, "epoch": 2451} {"train_loss": -11.514374732971191, "global_step": 411932, "epoch": 2451} {"train_loss": -12.04858112335205, "global_step": 411933, "epoch": 2451} {"train_loss": -11.667594909667969, "global_step": 411934, "epoch": 2451} {"train_loss": -11.644170397803897, "global_step": 411935, "epoch": 2451, "val_loss": 306574.96875} {"train_loss": -12.10576343536377, "global_step": 411936, "epoch": 2452} {"train_loss": -12.004852294921875, "global_step": 411937, "epoch": 2452} {"train_loss": -12.120059967041016, "global_step": 411938, "epoch": 2452} {"train_loss": -12.11020278930664, "global_step": 411939, "epoch": 2452} {"train_loss": -12.331014633178711, "global_step": 411940, "epoch": 2452} {"train_loss": -12.037225723266602, "global_step": 411941, "epoch": 2452} {"train_loss": -12.252461433410645, "global_step": 411942, "epoch": 2452} {"train_loss": -12.218414306640625, "global_step": 411943, "epoch": 2452} {"train_loss": -11.749263763427734, "global_step": 411944, "epoch": 2452} {"train_loss": -12.23217487335205, "global_step": 411945, "epoch": 2452} {"train_loss": -12.227838516235352, "global_step": 411946, "epoch": 2452} {"train_loss": -12.39549446105957, "global_step": 411947, "epoch": 2452} {"train_loss": -12.222911834716797, "global_step": 411948, "epoch": 2452} {"train_loss": -12.338943481445312, "global_step": 411949, "epoch": 2452} {"train_loss": -12.284004211425781, "global_step": 411950, "epoch": 2452} {"train_loss": -12.277130126953125, "global_step": 411951, "epoch": 2452} {"train_loss": -11.920600891113281, "global_step": 411952, "epoch": 2452} {"train_loss": -11.850382804870605, "global_step": 411953, "epoch": 2452} {"train_loss": -12.028175354003906, "global_step": 411954, "epoch": 2452} {"train_loss": -12.347792625427246, "global_step": 411955, "epoch": 2452} {"train_loss": -12.174169540405273, "global_step": 411956, "epoch": 2452} {"train_loss": -12.159533500671387, "global_step": 411957, "epoch": 2452} {"train_loss": -12.153603553771973, "global_step": 411958, "epoch": 2452} {"train_loss": -12.413865089416504, "global_step": 411959, "epoch": 2452} {"train_loss": -12.233282089233398, "global_step": 411960, "epoch": 2452} {"train_loss": -12.516365051269531, "global_step": 411961, "epoch": 2452} {"train_loss": -12.354263305664062, "global_step": 411962, "epoch": 2452} {"train_loss": -12.35446548461914, "global_step": 411963, "epoch": 2452} {"train_loss": -12.392302513122559, "global_step": 411964, "epoch": 2452} {"train_loss": -12.36594009399414, "global_step": 411965, "epoch": 2452} {"train_loss": -12.355822563171387, "global_step": 411966, "epoch": 2452} {"train_loss": -12.41097640991211, "global_step": 411967, "epoch": 2452} {"train_loss": -12.466131210327148, "global_step": 411968, "epoch": 2452} {"train_loss": -12.314210891723633, "global_step": 411969, "epoch": 2452} {"train_loss": -12.324085235595703, "global_step": 411970, "epoch": 2452} {"train_loss": -12.206685066223145, "global_step": 411971, "epoch": 2452} {"train_loss": -12.314981460571289, "global_step": 411972, "epoch": 2452} {"train_loss": -12.313886642456055, "global_step": 411973, "epoch": 2452} {"train_loss": -12.425872802734375, "global_step": 411974, "epoch": 2452} {"train_loss": -12.397281646728516, "global_step": 411975, "epoch": 2452} {"train_loss": -12.412096977233887, "global_step": 411976, "epoch": 2452} {"train_loss": -12.471063613891602, "global_step": 411977, "epoch": 2452} {"train_loss": -12.456952095031738, "global_step": 411978, "epoch": 2452} {"train_loss": -12.379908561706543, "global_step": 411979, "epoch": 2452} {"train_loss": -12.532750129699707, "global_step": 411980, "epoch": 2452} {"train_loss": -12.511945724487305, "global_step": 411981, "epoch": 2452} {"train_loss": -12.513083457946777, "global_step": 411982, "epoch": 2452} {"train_loss": -12.689214706420898, "global_step": 411983, "epoch": 2452} {"train_loss": -12.531814575195312, "global_step": 411984, "epoch": 2452} {"train_loss": -12.766819953918457, "global_step": 411985, "epoch": 2452} {"train_loss": -12.788147926330566, "global_step": 411986, "epoch": 2452} {"train_loss": -12.493246078491211, "global_step": 411987, "epoch": 2452} {"train_loss": -12.660508155822754, "global_step": 411988, "epoch": 2452} {"train_loss": -12.523744583129883, "global_step": 411989, "epoch": 2452} {"train_loss": -12.766389846801758, "global_step": 411990, "epoch": 2452} {"train_loss": -13.02354621887207, "global_step": 411991, "epoch": 2452} {"train_loss": -12.340251922607422, "global_step": 411992, "epoch": 2452} {"train_loss": -12.509042739868164, "global_step": 411993, "epoch": 2452} {"train_loss": -12.705108642578125, "global_step": 411994, "epoch": 2452} {"train_loss": -12.680614471435547, "global_step": 411995, "epoch": 2452} {"train_loss": -12.558303833007812, "global_step": 411996, "epoch": 2452} {"train_loss": -12.51017951965332, "global_step": 411997, "epoch": 2452} {"train_loss": -12.88963508605957, "global_step": 411998, "epoch": 2452} {"train_loss": -12.498624801635742, "global_step": 411999, "epoch": 2452} {"train_loss": -12.0799560546875, "global_step": 412000, "epoch": 2452} {"train_loss": -12.345648765563965, "global_step": 412001, "epoch": 2452} {"train_loss": -12.243696212768555, "global_step": 412002, "epoch": 2452} {"train_loss": -12.677361488342285, "global_step": 412003, "epoch": 2452} {"train_loss": -12.479024887084961, "global_step": 412004, "epoch": 2452} {"train_loss": -12.516648292541504, "global_step": 412005, "epoch": 2452} {"train_loss": -12.323524475097656, "global_step": 412006, "epoch": 2452} {"train_loss": -11.985302925109863, "global_step": 412007, "epoch": 2452} {"train_loss": -12.495341300964355, "global_step": 412008, "epoch": 2452} {"train_loss": -12.155614852905273, "global_step": 412009, "epoch": 2452} {"train_loss": -12.554964065551758, "global_step": 412010, "epoch": 2452} {"train_loss": -11.965071678161621, "global_step": 412011, "epoch": 2452} {"train_loss": -12.569313049316406, "global_step": 412012, "epoch": 2452} {"train_loss": -11.550212860107422, "global_step": 412013, "epoch": 2452} {"train_loss": -11.549060821533203, "global_step": 412014, "epoch": 2452} {"train_loss": -12.342147827148438, "global_step": 412015, "epoch": 2452} {"train_loss": -12.587312698364258, "global_step": 412016, "epoch": 2452} {"train_loss": -11.885619163513184, "global_step": 412017, "epoch": 2452} {"train_loss": -11.720993041992188, "global_step": 412018, "epoch": 2452} {"train_loss": -12.587078094482422, "global_step": 412019, "epoch": 2452} {"train_loss": -12.022551536560059, "global_step": 412020, "epoch": 2452} {"train_loss": -12.432272911071777, "global_step": 412021, "epoch": 2452} {"train_loss": -12.617560386657715, "global_step": 412022, "epoch": 2452} {"train_loss": -12.509270668029785, "global_step": 412023, "epoch": 2452} {"train_loss": -12.689573287963867, "global_step": 412024, "epoch": 2452} {"train_loss": -12.529314994812012, "global_step": 412025, "epoch": 2452} {"train_loss": -12.359232902526855, "global_step": 412026, "epoch": 2452} {"train_loss": -12.199969291687012, "global_step": 412027, "epoch": 2452} {"train_loss": -12.560941696166992, "global_step": 412028, "epoch": 2452} {"train_loss": -12.614042282104492, "global_step": 412029, "epoch": 2452} {"train_loss": -12.452284812927246, "global_step": 412030, "epoch": 2452} {"train_loss": -12.346778869628906, "global_step": 412031, "epoch": 2452} {"train_loss": -12.317925453186035, "global_step": 412032, "epoch": 2452} {"train_loss": -11.806977272033691, "global_step": 412033, "epoch": 2452} {"train_loss": -11.518977165222168, "global_step": 412034, "epoch": 2452} {"train_loss": -12.035818099975586, "global_step": 412035, "epoch": 2452} {"train_loss": -11.728958129882812, "global_step": 412036, "epoch": 2452} {"train_loss": -12.125603675842285, "global_step": 412037, "epoch": 2452} {"train_loss": -11.634472846984863, "global_step": 412038, "epoch": 2452} {"train_loss": -11.829143524169922, "global_step": 412039, "epoch": 2452} {"train_loss": -11.460992813110352, "global_step": 412040, "epoch": 2452} {"train_loss": -12.178305625915527, "global_step": 412041, "epoch": 2452} {"train_loss": -11.459175109863281, "global_step": 412042, "epoch": 2452} {"train_loss": -11.996265411376953, "global_step": 412043, "epoch": 2452} {"train_loss": -11.011972427368164, "global_step": 412044, "epoch": 2452} {"train_loss": -11.887166976928711, "global_step": 412045, "epoch": 2452} {"train_loss": -10.11161994934082, "global_step": 412046, "epoch": 2452} {"train_loss": -11.345596313476562, "global_step": 412047, "epoch": 2452} {"train_loss": -10.275997161865234, "global_step": 412048, "epoch": 2452} {"train_loss": -10.644552230834961, "global_step": 412049, "epoch": 2452} {"train_loss": -11.437917709350586, "global_step": 412050, "epoch": 2452} {"train_loss": -9.989558219909668, "global_step": 412051, "epoch": 2452} {"train_loss": -10.016966819763184, "global_step": 412052, "epoch": 2452} {"train_loss": -10.364131927490234, "global_step": 412053, "epoch": 2452} {"train_loss": -11.230889320373535, "global_step": 412054, "epoch": 2452} {"train_loss": -11.059942245483398, "global_step": 412055, "epoch": 2452} {"train_loss": -10.775243759155273, "global_step": 412056, "epoch": 2452} {"train_loss": -10.387866973876953, "global_step": 412057, "epoch": 2452} {"train_loss": -10.973196983337402, "global_step": 412058, "epoch": 2452} {"train_loss": -10.816391944885254, "global_step": 412059, "epoch": 2452} {"train_loss": -11.274872779846191, "global_step": 412060, "epoch": 2452} {"train_loss": -10.687644004821777, "global_step": 412061, "epoch": 2452} {"train_loss": -10.684600830078125, "global_step": 412062, "epoch": 2452} {"train_loss": -11.190061569213867, "global_step": 412063, "epoch": 2452} {"train_loss": -10.826972961425781, "global_step": 412064, "epoch": 2452} {"train_loss": -11.147220611572266, "global_step": 412065, "epoch": 2452} {"train_loss": -10.99264907836914, "global_step": 412066, "epoch": 2452} {"train_loss": -10.832252502441406, "global_step": 412067, "epoch": 2452} {"train_loss": -11.371086120605469, "global_step": 412068, "epoch": 2452} {"train_loss": -10.865644454956055, "global_step": 412069, "epoch": 2452} {"train_loss": -11.861913681030273, "global_step": 412070, "epoch": 2452} {"train_loss": -10.52767276763916, "global_step": 412071, "epoch": 2452} {"train_loss": -11.84500503540039, "global_step": 412072, "epoch": 2452} {"train_loss": -11.092687606811523, "global_step": 412073, "epoch": 2452} {"train_loss": -11.159287452697754, "global_step": 412074, "epoch": 2452} {"train_loss": -11.400625228881836, "global_step": 412075, "epoch": 2452} {"train_loss": -11.62312126159668, "global_step": 412076, "epoch": 2452} {"train_loss": -11.548084259033203, "global_step": 412077, "epoch": 2452} {"train_loss": -11.68848705291748, "global_step": 412078, "epoch": 2452} {"train_loss": -11.820405960083008, "global_step": 412079, "epoch": 2452} {"train_loss": -11.758034706115723, "global_step": 412080, "epoch": 2452} {"train_loss": -11.966663360595703, "global_step": 412081, "epoch": 2452} {"train_loss": -11.640666007995605, "global_step": 412082, "epoch": 2452} {"train_loss": -12.288579940795898, "global_step": 412083, "epoch": 2452} {"train_loss": -11.70417594909668, "global_step": 412084, "epoch": 2452} {"train_loss": -11.794239044189453, "global_step": 412085, "epoch": 2452} {"train_loss": -11.597063064575195, "global_step": 412086, "epoch": 2452} {"train_loss": -11.78731632232666, "global_step": 412087, "epoch": 2452} {"train_loss": -11.735505104064941, "global_step": 412088, "epoch": 2452} {"train_loss": -11.861806869506836, "global_step": 412089, "epoch": 2452} {"train_loss": -11.528275489807129, "global_step": 412090, "epoch": 2452} {"train_loss": -12.019237518310547, "global_step": 412091, "epoch": 2452} {"train_loss": -11.659260749816895, "global_step": 412092, "epoch": 2452} {"train_loss": -12.06019115447998, "global_step": 412093, "epoch": 2452} {"train_loss": -11.835355758666992, "global_step": 412094, "epoch": 2452} {"train_loss": -11.344267845153809, "global_step": 412095, "epoch": 2452} {"train_loss": -12.240836143493652, "global_step": 412096, "epoch": 2452} {"train_loss": -11.384292602539062, "global_step": 412097, "epoch": 2452} {"train_loss": -12.008898735046387, "global_step": 412098, "epoch": 2452} {"train_loss": -12.065448760986328, "global_step": 412099, "epoch": 2452} {"train_loss": -11.947782516479492, "global_step": 412100, "epoch": 2452} {"train_loss": -12.283048629760742, "global_step": 412101, "epoch": 2452} {"train_loss": -12.264911651611328, "global_step": 412102, "epoch": 2452} {"train_loss": -11.961776750428337, "global_step": 412103, "epoch": 2452, "val_loss": 305694.375} {"train_loss": -11.805134773254395, "global_step": 412104, "epoch": 2453} {"train_loss": -11.825876235961914, "global_step": 412105, "epoch": 2453} {"train_loss": -11.562599182128906, "global_step": 412106, "epoch": 2453} {"train_loss": -11.386222839355469, "global_step": 412107, "epoch": 2453} {"train_loss": -11.31950569152832, "global_step": 412108, "epoch": 2453} {"train_loss": -12.360389709472656, "global_step": 412109, "epoch": 2453} {"train_loss": -11.559579849243164, "global_step": 412110, "epoch": 2453} {"train_loss": -12.178722381591797, "global_step": 412111, "epoch": 2453} {"train_loss": -12.037430763244629, "global_step": 412112, "epoch": 2453} {"train_loss": -12.057695388793945, "global_step": 412113, "epoch": 2453} {"train_loss": -12.085389137268066, "global_step": 412114, "epoch": 2453} {"train_loss": -12.055667877197266, "global_step": 412115, "epoch": 2453} {"train_loss": -12.036391258239746, "global_step": 412116, "epoch": 2453} {"train_loss": -12.411060333251953, "global_step": 412117, "epoch": 2453} {"train_loss": -11.90340518951416, "global_step": 412118, "epoch": 2453} {"train_loss": -12.258768081665039, "global_step": 412119, "epoch": 2453} {"train_loss": -12.204265594482422, "global_step": 412120, "epoch": 2453} {"train_loss": -12.0974760055542, "global_step": 412121, "epoch": 2453} {"train_loss": -11.867918014526367, "global_step": 412122, "epoch": 2453} {"train_loss": -12.48836898803711, "global_step": 412123, "epoch": 2453} {"train_loss": -11.836775779724121, "global_step": 412124, "epoch": 2453} {"train_loss": -12.408149719238281, "global_step": 412125, "epoch": 2453} {"train_loss": -12.033137321472168, "global_step": 412126, "epoch": 2453} {"train_loss": -12.435338973999023, "global_step": 412127, "epoch": 2453} {"train_loss": -12.231097221374512, "global_step": 412128, "epoch": 2453} {"train_loss": -12.593358039855957, "global_step": 412129, "epoch": 2453} {"train_loss": -12.274002075195312, "global_step": 412130, "epoch": 2453} {"train_loss": -12.56834602355957, "global_step": 412131, "epoch": 2453} {"train_loss": -12.196019172668457, "global_step": 412132, "epoch": 2453} {"train_loss": -12.384857177734375, "global_step": 412133, "epoch": 2453} {"train_loss": -12.194880485534668, "global_step": 412134, "epoch": 2453} {"train_loss": -12.303955078125, "global_step": 412135, "epoch": 2453} {"train_loss": -12.284619331359863, "global_step": 412136, "epoch": 2453} {"train_loss": -12.316082000732422, "global_step": 412137, "epoch": 2453} {"train_loss": -12.393514633178711, "global_step": 412138, "epoch": 2453} {"train_loss": -12.485189437866211, "global_step": 412139, "epoch": 2453} {"train_loss": -12.102315902709961, "global_step": 412140, "epoch": 2453} {"train_loss": -12.476408958435059, "global_step": 412141, "epoch": 2453} {"train_loss": -12.455875396728516, "global_step": 412142, "epoch": 2453} {"train_loss": -12.486339569091797, "global_step": 412143, "epoch": 2453} {"train_loss": -12.394023895263672, "global_step": 412144, "epoch": 2453} {"train_loss": -12.382584571838379, "global_step": 412145, "epoch": 2453} {"train_loss": -12.61468505859375, "global_step": 412146, "epoch": 2453} {"train_loss": -12.055367469787598, "global_step": 412147, "epoch": 2453} {"train_loss": -12.316376686096191, "global_step": 412148, "epoch": 2453} {"train_loss": -12.354284286499023, "global_step": 412149, "epoch": 2453} {"train_loss": -12.493212699890137, "global_step": 412150, "epoch": 2453} {"train_loss": -12.651333808898926, "global_step": 412151, "epoch": 2453} {"train_loss": -12.267677307128906, "global_step": 412152, "epoch": 2453} {"train_loss": -12.392936706542969, "global_step": 412153, "epoch": 2453} {"train_loss": -12.556737899780273, "global_step": 412154, "epoch": 2453} {"train_loss": -12.424478530883789, "global_step": 412155, "epoch": 2453} {"train_loss": -12.637262344360352, "global_step": 412156, "epoch": 2453} {"train_loss": -12.317182540893555, "global_step": 412157, "epoch": 2453} {"train_loss": -12.310277938842773, "global_step": 412158, "epoch": 2453} {"train_loss": -12.585281372070312, "global_step": 412159, "epoch": 2453} {"train_loss": -12.586282730102539, "global_step": 412160, "epoch": 2453} {"train_loss": -12.692792892456055, "global_step": 412161, "epoch": 2453} {"train_loss": -12.542864799499512, "global_step": 412162, "epoch": 2453} {"train_loss": -12.667525291442871, "global_step": 412163, "epoch": 2453} {"train_loss": -12.50518798828125, "global_step": 412164, "epoch": 2453} {"train_loss": -12.698356628417969, "global_step": 412165, "epoch": 2453} {"train_loss": -12.689896583557129, "global_step": 412166, "epoch": 2453} {"train_loss": -12.686626434326172, "global_step": 412167, "epoch": 2453} {"train_loss": -12.487055778503418, "global_step": 412168, "epoch": 2453} {"train_loss": -12.575249671936035, "global_step": 412169, "epoch": 2453} {"train_loss": -12.75124454498291, "global_step": 412170, "epoch": 2453} {"train_loss": -12.454561233520508, "global_step": 412171, "epoch": 2453} {"train_loss": -12.785540580749512, "global_step": 412172, "epoch": 2453} {"train_loss": -12.575775146484375, "global_step": 412173, "epoch": 2453} {"train_loss": -12.788232803344727, "global_step": 412174, "epoch": 2453} {"train_loss": -12.664505004882812, "global_step": 412175, "epoch": 2453} {"train_loss": -12.832314491271973, "global_step": 412176, "epoch": 2453} {"train_loss": -12.772209167480469, "global_step": 412177, "epoch": 2453} {"train_loss": -12.409296035766602, "global_step": 412178, "epoch": 2453} {"train_loss": -12.15095329284668, "global_step": 412179, "epoch": 2453} {"train_loss": -12.435306549072266, "global_step": 412180, "epoch": 2453} {"train_loss": -12.76006031036377, "global_step": 412181, "epoch": 2453} {"train_loss": -12.53712272644043, "global_step": 412182, "epoch": 2453} {"train_loss": -12.115861892700195, "global_step": 412183, "epoch": 2453} {"train_loss": -12.557769775390625, "global_step": 412184, "epoch": 2453} {"train_loss": -12.53684139251709, "global_step": 412185, "epoch": 2453} {"train_loss": -12.06843090057373, "global_step": 412186, "epoch": 2453} {"train_loss": -12.012086868286133, "global_step": 412187, "epoch": 2453} {"train_loss": -12.129947662353516, "global_step": 412188, "epoch": 2453} {"train_loss": -12.046323776245117, "global_step": 412189, "epoch": 2453} {"train_loss": -10.90172004699707, "global_step": 412190, "epoch": 2453} {"train_loss": -12.352584838867188, "global_step": 412191, "epoch": 2453} {"train_loss": -11.812061309814453, "global_step": 412192, "epoch": 2453} {"train_loss": -12.013113975524902, "global_step": 412193, "epoch": 2453} {"train_loss": -11.86333179473877, "global_step": 412194, "epoch": 2453} {"train_loss": -12.156167984008789, "global_step": 412195, "epoch": 2453} {"train_loss": -11.935210227966309, "global_step": 412196, "epoch": 2453} {"train_loss": -12.4885835647583, "global_step": 412197, "epoch": 2453} {"train_loss": -12.192955017089844, "global_step": 412198, "epoch": 2453} {"train_loss": -11.520257949829102, "global_step": 412199, "epoch": 2453} {"train_loss": -12.144399642944336, "global_step": 412200, "epoch": 2453} {"train_loss": -12.084163665771484, "global_step": 412201, "epoch": 2453} {"train_loss": -12.335482597351074, "global_step": 412202, "epoch": 2453} {"train_loss": -11.990058898925781, "global_step": 412203, "epoch": 2453} {"train_loss": -11.868462562561035, "global_step": 412204, "epoch": 2453} {"train_loss": -11.04863166809082, "global_step": 412205, "epoch": 2453} {"train_loss": -12.238006591796875, "global_step": 412206, "epoch": 2453} {"train_loss": -11.438112258911133, "global_step": 412207, "epoch": 2453} {"train_loss": -12.463220596313477, "global_step": 412208, "epoch": 2453} {"train_loss": -11.938252449035645, "global_step": 412209, "epoch": 2453} {"train_loss": -12.348901748657227, "global_step": 412210, "epoch": 2453} {"train_loss": -12.246078491210938, "global_step": 412211, "epoch": 2453} {"train_loss": -12.135924339294434, "global_step": 412212, "epoch": 2453} {"train_loss": -12.648887634277344, "global_step": 412213, "epoch": 2453} {"train_loss": -12.704950332641602, "global_step": 412214, "epoch": 2453} {"train_loss": -12.433050155639648, "global_step": 412215, "epoch": 2453} {"train_loss": -12.538990020751953, "global_step": 412216, "epoch": 2453} {"train_loss": -12.7316255569458, "global_step": 412217, "epoch": 2453} {"train_loss": -12.410261154174805, "global_step": 412218, "epoch": 2453} {"train_loss": -12.610370635986328, "global_step": 412219, "epoch": 2453} {"train_loss": -12.730666160583496, "global_step": 412220, "epoch": 2453} {"train_loss": -12.842158317565918, "global_step": 412221, "epoch": 2453} {"train_loss": -12.711771965026855, "global_step": 412222, "epoch": 2453} {"train_loss": -12.534669876098633, "global_step": 412223, "epoch": 2453} {"train_loss": -12.814916610717773, "global_step": 412224, "epoch": 2453} {"train_loss": -12.398805618286133, "global_step": 412225, "epoch": 2453} {"train_loss": -12.334820747375488, "global_step": 412226, "epoch": 2453} {"train_loss": -12.772180557250977, "global_step": 412227, "epoch": 2453} {"train_loss": -12.910650253295898, "global_step": 412228, "epoch": 2453} {"train_loss": -12.467094421386719, "global_step": 412229, "epoch": 2453} {"train_loss": -12.534849166870117, "global_step": 412230, "epoch": 2453} {"train_loss": -12.631441116333008, "global_step": 412231, "epoch": 2453} {"train_loss": -12.518738746643066, "global_step": 412232, "epoch": 2453} {"train_loss": -12.941847801208496, "global_step": 412233, "epoch": 2453} {"train_loss": -12.528855323791504, "global_step": 412234, "epoch": 2453} {"train_loss": -12.701385498046875, "global_step": 412235, "epoch": 2453} {"train_loss": -12.569704055786133, "global_step": 412236, "epoch": 2453} {"train_loss": -12.662930488586426, "global_step": 412237, "epoch": 2453} {"train_loss": -12.477655410766602, "global_step": 412238, "epoch": 2453} {"train_loss": -12.832260131835938, "global_step": 412239, "epoch": 2453} {"train_loss": -12.64659309387207, "global_step": 412240, "epoch": 2453} {"train_loss": -12.486213684082031, "global_step": 412241, "epoch": 2453} {"train_loss": -12.385751724243164, "global_step": 412242, "epoch": 2453} {"train_loss": -12.811271667480469, "global_step": 412243, "epoch": 2453} {"train_loss": -12.577760696411133, "global_step": 412244, "epoch": 2453} {"train_loss": -12.511688232421875, "global_step": 412245, "epoch": 2453} {"train_loss": -12.111770629882812, "global_step": 412246, "epoch": 2453} {"train_loss": -12.23476791381836, "global_step": 412247, "epoch": 2453} {"train_loss": -12.308538436889648, "global_step": 412248, "epoch": 2453} {"train_loss": -12.919854164123535, "global_step": 412249, "epoch": 2453} {"train_loss": -12.676609992980957, "global_step": 412250, "epoch": 2453} {"train_loss": -12.133922576904297, "global_step": 412251, "epoch": 2453} {"train_loss": -12.193389892578125, "global_step": 412252, "epoch": 2453} {"train_loss": -12.647195816040039, "global_step": 412253, "epoch": 2453} {"train_loss": -12.400041580200195, "global_step": 412254, "epoch": 2453} {"train_loss": -12.508983612060547, "global_step": 412255, "epoch": 2453} {"train_loss": -12.53868293762207, "global_step": 412256, "epoch": 2453} {"train_loss": -12.450246810913086, "global_step": 412257, "epoch": 2453} {"train_loss": -12.550849914550781, "global_step": 412258, "epoch": 2453} {"train_loss": -12.275135040283203, "global_step": 412259, "epoch": 2453} {"train_loss": -12.478379249572754, "global_step": 412260, "epoch": 2453} {"train_loss": -12.207012176513672, "global_step": 412261, "epoch": 2453} {"train_loss": -12.518239974975586, "global_step": 412262, "epoch": 2453} {"train_loss": -12.352422714233398, "global_step": 412263, "epoch": 2453} {"train_loss": -10.95454216003418, "global_step": 412264, "epoch": 2453} {"train_loss": -10.847298622131348, "global_step": 412265, "epoch": 2453} {"train_loss": -10.476458549499512, "global_step": 412266, "epoch": 2453} {"train_loss": -9.327265739440918, "global_step": 412267, "epoch": 2453} {"train_loss": -10.893486976623535, "global_step": 412268, "epoch": 2453} {"train_loss": -10.419384956359863, "global_step": 412269, "epoch": 2453} {"train_loss": -11.464349746704102, "global_step": 412270, "epoch": 2453} {"train_loss": -12.260737600780669, "global_step": 412271, "epoch": 2453, "val_loss": 308924.6875} {"train_loss": -10.98166275024414, "global_step": 412272, "epoch": 2454} {"train_loss": -10.63565731048584, "global_step": 412273, "epoch": 2454} {"train_loss": -9.687631607055664, "global_step": 412274, "epoch": 2454} {"train_loss": -9.92401123046875, "global_step": 412275, "epoch": 2454} {"train_loss": -9.257884979248047, "global_step": 412276, "epoch": 2454} {"train_loss": -8.538491249084473, "global_step": 412277, "epoch": 2454} {"train_loss": -9.402566909790039, "global_step": 412278, "epoch": 2454} {"train_loss": -11.4287748336792, "global_step": 412279, "epoch": 2454} {"train_loss": -8.881393432617188, "global_step": 412280, "epoch": 2454} {"train_loss": -10.769759178161621, "global_step": 412281, "epoch": 2454} {"train_loss": -11.024616241455078, "global_step": 412282, "epoch": 2454} {"train_loss": -9.278663635253906, "global_step": 412283, "epoch": 2454} {"train_loss": -10.001262664794922, "global_step": 412284, "epoch": 2454} {"train_loss": -10.851919174194336, "global_step": 412285, "epoch": 2454} {"train_loss": -8.296202659606934, "global_step": 412286, "epoch": 2454} {"train_loss": -9.652799606323242, "global_step": 412287, "epoch": 2454} {"train_loss": -9.88404655456543, "global_step": 412288, "epoch": 2454} {"train_loss": -8.550985336303711, "global_step": 412289, "epoch": 2454} {"train_loss": -9.480707168579102, "global_step": 412290, "epoch": 2454} {"train_loss": -11.184959411621094, "global_step": 412291, "epoch": 2454} {"train_loss": -9.38780689239502, "global_step": 412292, "epoch": 2454} {"train_loss": -9.222509384155273, "global_step": 412293, "epoch": 2454} {"train_loss": -11.076330184936523, "global_step": 412294, "epoch": 2454} {"train_loss": -8.893714904785156, "global_step": 412295, "epoch": 2454} {"train_loss": -8.147722244262695, "global_step": 412296, "epoch": 2454} {"train_loss": -10.405845642089844, "global_step": 412297, "epoch": 2454} {"train_loss": -8.377264976501465, "global_step": 412298, "epoch": 2454} {"train_loss": -9.125889778137207, "global_step": 412299, "epoch": 2454} {"train_loss": -9.78831672668457, "global_step": 412300, "epoch": 2454} {"train_loss": -9.584606170654297, "global_step": 412301, "epoch": 2454} {"train_loss": -10.146078109741211, "global_step": 412302, "epoch": 2454} {"train_loss": -9.763004302978516, "global_step": 412303, "epoch": 2454} {"train_loss": -11.084627151489258, "global_step": 412304, "epoch": 2454} {"train_loss": -10.615081787109375, "global_step": 412305, "epoch": 2454} {"train_loss": -10.683670043945312, "global_step": 412306, "epoch": 2454} {"train_loss": -9.942791938781738, "global_step": 412307, "epoch": 2454} {"train_loss": -11.062191009521484, "global_step": 412308, "epoch": 2454} {"train_loss": -10.142154693603516, "global_step": 412309, "epoch": 2454} {"train_loss": -10.42341136932373, "global_step": 412310, "epoch": 2454} {"train_loss": -10.712515830993652, "global_step": 412311, "epoch": 2454} {"train_loss": -11.099594116210938, "global_step": 412312, "epoch": 2454} {"train_loss": -10.833480834960938, "global_step": 412313, "epoch": 2454} {"train_loss": -11.400388717651367, "global_step": 412314, "epoch": 2454} {"train_loss": -11.469268798828125, "global_step": 412315, "epoch": 2454} {"train_loss": -10.955144882202148, "global_step": 412316, "epoch": 2454} {"train_loss": -10.732696533203125, "global_step": 412317, "epoch": 2454} {"train_loss": -11.78763484954834, "global_step": 412318, "epoch": 2454} {"train_loss": -11.280284881591797, "global_step": 412319, "epoch": 2454} {"train_loss": -11.447853088378906, "global_step": 412320, "epoch": 2454} {"train_loss": -11.52210807800293, "global_step": 412321, "epoch": 2454} {"train_loss": -11.19743537902832, "global_step": 412322, "epoch": 2454} {"train_loss": -11.702520370483398, "global_step": 412323, "epoch": 2454} {"train_loss": -11.698397636413574, "global_step": 412324, "epoch": 2454} {"train_loss": -11.400899887084961, "global_step": 412325, "epoch": 2454} {"train_loss": -11.598785400390625, "global_step": 412326, "epoch": 2454} {"train_loss": -11.310359954833984, "global_step": 412327, "epoch": 2454} {"train_loss": -11.698430061340332, "global_step": 412328, "epoch": 2454} {"train_loss": -11.777259826660156, "global_step": 412329, "epoch": 2454} {"train_loss": -11.845890045166016, "global_step": 412330, "epoch": 2454} {"train_loss": -12.104852676391602, "global_step": 412331, "epoch": 2454} {"train_loss": -11.565065383911133, "global_step": 412332, "epoch": 2454} {"train_loss": -11.664329528808594, "global_step": 412333, "epoch": 2454} {"train_loss": -12.099424362182617, "global_step": 412334, "epoch": 2454} {"train_loss": -11.70292854309082, "global_step": 412335, "epoch": 2454} {"train_loss": -12.090315818786621, "global_step": 412336, "epoch": 2454} {"train_loss": -11.70659065246582, "global_step": 412337, "epoch": 2454} {"train_loss": -11.983302116394043, "global_step": 412338, "epoch": 2454} {"train_loss": -11.905292510986328, "global_step": 412339, "epoch": 2454} {"train_loss": -12.017590522766113, "global_step": 412340, "epoch": 2454} {"train_loss": -11.959047317504883, "global_step": 412341, "epoch": 2454} {"train_loss": -11.810644149780273, "global_step": 412342, "epoch": 2454} {"train_loss": -12.106378555297852, "global_step": 412343, "epoch": 2454} {"train_loss": -12.023521423339844, "global_step": 412344, "epoch": 2454} {"train_loss": -12.008073806762695, "global_step": 412345, "epoch": 2454} {"train_loss": -12.095236778259277, "global_step": 412346, "epoch": 2454} {"train_loss": -11.863183975219727, "global_step": 412347, "epoch": 2454} {"train_loss": -12.292088508605957, "global_step": 412348, "epoch": 2454} {"train_loss": -12.083052635192871, "global_step": 412349, "epoch": 2454} {"train_loss": -12.06324577331543, "global_step": 412350, "epoch": 2454} {"train_loss": -12.175830841064453, "global_step": 412351, "epoch": 2454} {"train_loss": -12.167105674743652, "global_step": 412352, "epoch": 2454} {"train_loss": -12.19106388092041, "global_step": 412353, "epoch": 2454} {"train_loss": -12.047100067138672, "global_step": 412354, "epoch": 2454} {"train_loss": -12.393428802490234, "global_step": 412355, "epoch": 2454} {"train_loss": -12.088251113891602, "global_step": 412356, "epoch": 2454} {"train_loss": -12.32485580444336, "global_step": 412357, "epoch": 2454} {"train_loss": -12.331398010253906, "global_step": 412358, "epoch": 2454} {"train_loss": -12.030694007873535, "global_step": 412359, "epoch": 2454} {"train_loss": -12.320432662963867, "global_step": 412360, "epoch": 2454} {"train_loss": -12.204813003540039, "global_step": 412361, "epoch": 2454} {"train_loss": -12.390119552612305, "global_step": 412362, "epoch": 2454} {"train_loss": -11.904179573059082, "global_step": 412363, "epoch": 2454} {"train_loss": -12.248140335083008, "global_step": 412364, "epoch": 2454} {"train_loss": -12.096282958984375, "global_step": 412365, "epoch": 2454} {"train_loss": -12.083043098449707, "global_step": 412366, "epoch": 2454} {"train_loss": -12.559462547302246, "global_step": 412367, "epoch": 2454} {"train_loss": -12.09343147277832, "global_step": 412368, "epoch": 2454} {"train_loss": -12.429096221923828, "global_step": 412369, "epoch": 2454} {"train_loss": -12.066145896911621, "global_step": 412370, "epoch": 2454} {"train_loss": -12.471700668334961, "global_step": 412371, "epoch": 2454} {"train_loss": -12.031524658203125, "global_step": 412372, "epoch": 2454} {"train_loss": -12.195673942565918, "global_step": 412373, "epoch": 2454} {"train_loss": -12.042274475097656, "global_step": 412374, "epoch": 2454} {"train_loss": -11.591529846191406, "global_step": 412375, "epoch": 2454} {"train_loss": -12.313264846801758, "global_step": 412376, "epoch": 2454} {"train_loss": -11.994640350341797, "global_step": 412377, "epoch": 2454} {"train_loss": -12.202192306518555, "global_step": 412378, "epoch": 2454} {"train_loss": -11.765113830566406, "global_step": 412379, "epoch": 2454} {"train_loss": -12.068435668945312, "global_step": 412380, "epoch": 2454} {"train_loss": -12.319756507873535, "global_step": 412381, "epoch": 2454} {"train_loss": -12.236669540405273, "global_step": 412382, "epoch": 2454} {"train_loss": -12.303906440734863, "global_step": 412383, "epoch": 2454} {"train_loss": -12.407007217407227, "global_step": 412384, "epoch": 2454} {"train_loss": -12.210697174072266, "global_step": 412385, "epoch": 2454} {"train_loss": -12.322696685791016, "global_step": 412386, "epoch": 2454} {"train_loss": -12.089019775390625, "global_step": 412387, "epoch": 2454} {"train_loss": -12.399811744689941, "global_step": 412388, "epoch": 2454} {"train_loss": -12.153887748718262, "global_step": 412389, "epoch": 2454} {"train_loss": -12.360268592834473, "global_step": 412390, "epoch": 2454} {"train_loss": -12.543346405029297, "global_step": 412391, "epoch": 2454} {"train_loss": -12.266414642333984, "global_step": 412392, "epoch": 2454} {"train_loss": -12.465789794921875, "global_step": 412393, "epoch": 2454} {"train_loss": -12.520137786865234, "global_step": 412394, "epoch": 2454} {"train_loss": -12.60660171508789, "global_step": 412395, "epoch": 2454} {"train_loss": -12.515111923217773, "global_step": 412396, "epoch": 2454} {"train_loss": -12.506963729858398, "global_step": 412397, "epoch": 2454} {"train_loss": -12.29549503326416, "global_step": 412398, "epoch": 2454} {"train_loss": -12.616496086120605, "global_step": 412399, "epoch": 2454} {"train_loss": -12.686837196350098, "global_step": 412400, "epoch": 2454} {"train_loss": -12.490814208984375, "global_step": 412401, "epoch": 2454} {"train_loss": -12.468480110168457, "global_step": 412402, "epoch": 2454} {"train_loss": -12.633834838867188, "global_step": 412403, "epoch": 2454} {"train_loss": -12.372515678405762, "global_step": 412404, "epoch": 2454} {"train_loss": -12.480238914489746, "global_step": 412405, "epoch": 2454} {"train_loss": -12.75198745727539, "global_step": 412406, "epoch": 2454} {"train_loss": -12.530914306640625, "global_step": 412407, "epoch": 2454} {"train_loss": -12.745122909545898, "global_step": 412408, "epoch": 2454} {"train_loss": -12.464946746826172, "global_step": 412409, "epoch": 2454} {"train_loss": -12.79880142211914, "global_step": 412410, "epoch": 2454} {"train_loss": -12.551982879638672, "global_step": 412411, "epoch": 2454} {"train_loss": -12.51253604888916, "global_step": 412412, "epoch": 2454} {"train_loss": -12.391600608825684, "global_step": 412413, "epoch": 2454} {"train_loss": -12.452340126037598, "global_step": 412414, "epoch": 2454} {"train_loss": -12.678240776062012, "global_step": 412415, "epoch": 2454} {"train_loss": -12.298128128051758, "global_step": 412416, "epoch": 2454} {"train_loss": -12.668476104736328, "global_step": 412417, "epoch": 2454} {"train_loss": -12.32076358795166, "global_step": 412418, "epoch": 2454} {"train_loss": -12.352119445800781, "global_step": 412419, "epoch": 2454} {"train_loss": -12.671834945678711, "global_step": 412420, "epoch": 2454} {"train_loss": -12.252307891845703, "global_step": 412421, "epoch": 2454} {"train_loss": -12.193185806274414, "global_step": 412422, "epoch": 2454} {"train_loss": -12.320416450500488, "global_step": 412423, "epoch": 2454} {"train_loss": -12.809433937072754, "global_step": 412424, "epoch": 2454} {"train_loss": -12.55204963684082, "global_step": 412425, "epoch": 2454} {"train_loss": -12.630229949951172, "global_step": 412426, "epoch": 2454} {"train_loss": -12.576936721801758, "global_step": 412427, "epoch": 2454} {"train_loss": -12.324048042297363, "global_step": 412428, "epoch": 2454} {"train_loss": -12.564349174499512, "global_step": 412429, "epoch": 2454} {"train_loss": -12.512650489807129, "global_step": 412430, "epoch": 2454} {"train_loss": -11.90943431854248, "global_step": 412431, "epoch": 2454} {"train_loss": -12.765859603881836, "global_step": 412432, "epoch": 2454} {"train_loss": -12.439034461975098, "global_step": 412433, "epoch": 2454} {"train_loss": -12.68020248413086, "global_step": 412434, "epoch": 2454} {"train_loss": -12.425639152526855, "global_step": 412435, "epoch": 2454} {"train_loss": -12.676398277282715, "global_step": 412436, "epoch": 2454} {"train_loss": -12.314019203186035, "global_step": 412437, "epoch": 2454} {"train_loss": -12.368370056152344, "global_step": 412438, "epoch": 2454} {"train_loss": -11.61924411569323, "global_step": 412439, "epoch": 2454, "val_loss": 299413.40625} {"train_loss": -12.732669830322266, "global_step": 412440, "epoch": 2455} {"train_loss": -12.7166109085083, "global_step": 412441, "epoch": 2455} {"train_loss": -12.510747909545898, "global_step": 412442, "epoch": 2455} {"train_loss": -12.272171020507812, "global_step": 412443, "epoch": 2455} {"train_loss": -12.195615768432617, "global_step": 412444, "epoch": 2455} {"train_loss": -12.386646270751953, "global_step": 412445, "epoch": 2455} {"train_loss": -12.391533851623535, "global_step": 412446, "epoch": 2455} {"train_loss": -12.481103897094727, "global_step": 412447, "epoch": 2455} {"train_loss": -12.604328155517578, "global_step": 412448, "epoch": 2455} {"train_loss": -11.510228157043457, "global_step": 412449, "epoch": 2455} {"train_loss": -12.295082092285156, "global_step": 412450, "epoch": 2455} {"train_loss": -12.395476341247559, "global_step": 412451, "epoch": 2455} {"train_loss": -12.144712448120117, "global_step": 412452, "epoch": 2455} {"train_loss": -12.454244613647461, "global_step": 412453, "epoch": 2455} {"train_loss": -11.353853225708008, "global_step": 412454, "epoch": 2455} {"train_loss": -11.284247398376465, "global_step": 412455, "epoch": 2455} {"train_loss": -11.601245880126953, "global_step": 412456, "epoch": 2455} {"train_loss": -12.504414558410645, "global_step": 412457, "epoch": 2455} {"train_loss": -11.479204177856445, "global_step": 412458, "epoch": 2455} {"train_loss": -10.307146072387695, "global_step": 412459, "epoch": 2455} {"train_loss": -10.940361022949219, "global_step": 412460, "epoch": 2455} {"train_loss": -11.814751625061035, "global_step": 412461, "epoch": 2455} {"train_loss": -9.08260726928711, "global_step": 412462, "epoch": 2455} {"train_loss": -11.397489547729492, "global_step": 412463, "epoch": 2455} {"train_loss": -7.907678604125977, "global_step": 412464, "epoch": 2455} {"train_loss": -6.90659236907959, "global_step": 412465, "epoch": 2455} {"train_loss": -7.631559371948242, "global_step": 412466, "epoch": 2455} {"train_loss": -7.346990585327148, "global_step": 412467, "epoch": 2455} {"train_loss": -6.748727798461914, "global_step": 412468, "epoch": 2455} {"train_loss": -7.064905166625977, "global_step": 412469, "epoch": 2455} {"train_loss": -6.963775157928467, "global_step": 412470, "epoch": 2455} {"train_loss": -7.068276882171631, "global_step": 412471, "epoch": 2455} {"train_loss": -7.435830116271973, "global_step": 412472, "epoch": 2455} {"train_loss": -7.274727821350098, "global_step": 412473, "epoch": 2455} {"train_loss": -7.450246810913086, "global_step": 412474, "epoch": 2455} {"train_loss": -7.735445022583008, "global_step": 412475, "epoch": 2455} {"train_loss": -7.754785537719727, "global_step": 412476, "epoch": 2455} {"train_loss": -7.5670671463012695, "global_step": 412477, "epoch": 2455} {"train_loss": -7.812160968780518, "global_step": 412478, "epoch": 2455} {"train_loss": -8.690664291381836, "global_step": 412479, "epoch": 2455} {"train_loss": -9.113407135009766, "global_step": 412480, "epoch": 2455} {"train_loss": -9.208123207092285, "global_step": 412481, "epoch": 2455} {"train_loss": -9.651053428649902, "global_step": 412482, "epoch": 2455} {"train_loss": -9.164359092712402, "global_step": 412483, "epoch": 2455} {"train_loss": -9.643733978271484, "global_step": 412484, "epoch": 2455} {"train_loss": -9.447731018066406, "global_step": 412485, "epoch": 2455} {"train_loss": -10.067852973937988, "global_step": 412486, "epoch": 2455} {"train_loss": -10.215208053588867, "global_step": 412487, "epoch": 2455} {"train_loss": -10.500526428222656, "global_step": 412488, "epoch": 2455} {"train_loss": -10.572613716125488, "global_step": 412489, "epoch": 2455} {"train_loss": -10.838523864746094, "global_step": 412490, "epoch": 2455} {"train_loss": -10.896431922912598, "global_step": 412491, "epoch": 2455} {"train_loss": -11.689840316772461, "global_step": 412492, "epoch": 2455} {"train_loss": -11.383440017700195, "global_step": 412493, "epoch": 2455} {"train_loss": -11.145285606384277, "global_step": 412494, "epoch": 2455} {"train_loss": -11.510496139526367, "global_step": 412495, "epoch": 2455} {"train_loss": -11.829019546508789, "global_step": 412496, "epoch": 2455} {"train_loss": -11.757791519165039, "global_step": 412497, "epoch": 2455} {"train_loss": -11.721990585327148, "global_step": 412498, "epoch": 2455} {"train_loss": -11.921152114868164, "global_step": 412499, "epoch": 2455} {"train_loss": -11.262114524841309, "global_step": 412500, "epoch": 2455} {"train_loss": -11.82070541381836, "global_step": 412501, "epoch": 2455} {"train_loss": -11.040570259094238, "global_step": 412502, "epoch": 2455} {"train_loss": -11.525867462158203, "global_step": 412503, "epoch": 2455} {"train_loss": -11.939204216003418, "global_step": 412504, "epoch": 2455} {"train_loss": -11.634370803833008, "global_step": 412505, "epoch": 2455} {"train_loss": -12.04452896118164, "global_step": 412506, "epoch": 2455} {"train_loss": -11.723592758178711, "global_step": 412507, "epoch": 2455} {"train_loss": -12.10391902923584, "global_step": 412508, "epoch": 2455} {"train_loss": -11.588793754577637, "global_step": 412509, "epoch": 2455} {"train_loss": -11.955113410949707, "global_step": 412510, "epoch": 2455} {"train_loss": -11.472818374633789, "global_step": 412511, "epoch": 2455} {"train_loss": -11.873823165893555, "global_step": 412512, "epoch": 2455} {"train_loss": -11.998014450073242, "global_step": 412513, "epoch": 2455} {"train_loss": -11.965744972229004, "global_step": 412514, "epoch": 2455} {"train_loss": -12.137260437011719, "global_step": 412515, "epoch": 2455} {"train_loss": -12.103668212890625, "global_step": 412516, "epoch": 2455} {"train_loss": -12.376709938049316, "global_step": 412517, "epoch": 2455} {"train_loss": -12.14560604095459, "global_step": 412518, "epoch": 2455} {"train_loss": -11.94951057434082, "global_step": 412519, "epoch": 2455} {"train_loss": -12.077579498291016, "global_step": 412520, "epoch": 2455} {"train_loss": -12.278633117675781, "global_step": 412521, "epoch": 2455} {"train_loss": -12.2176513671875, "global_step": 412522, "epoch": 2455} {"train_loss": -12.401897430419922, "global_step": 412523, "epoch": 2455} {"train_loss": -12.42222785949707, "global_step": 412524, "epoch": 2455} {"train_loss": -12.305761337280273, "global_step": 412525, "epoch": 2455} {"train_loss": -12.404072761535645, "global_step": 412526, "epoch": 2455} {"train_loss": -12.468133926391602, "global_step": 412527, "epoch": 2455} {"train_loss": -12.274948120117188, "global_step": 412528, "epoch": 2455} {"train_loss": -12.40144157409668, "global_step": 412529, "epoch": 2455} {"train_loss": -12.525928497314453, "global_step": 412530, "epoch": 2455} {"train_loss": -12.310547828674316, "global_step": 412531, "epoch": 2455} {"train_loss": -12.6090087890625, "global_step": 412532, "epoch": 2455} {"train_loss": -12.643717765808105, "global_step": 412533, "epoch": 2455} {"train_loss": -12.411798477172852, "global_step": 412534, "epoch": 2455} {"train_loss": -12.44145393371582, "global_step": 412535, "epoch": 2455} {"train_loss": -12.805519104003906, "global_step": 412536, "epoch": 2455} {"train_loss": -12.500710487365723, "global_step": 412537, "epoch": 2455} {"train_loss": -12.478736877441406, "global_step": 412538, "epoch": 2455} {"train_loss": -12.335124015808105, "global_step": 412539, "epoch": 2455} {"train_loss": -12.317291259765625, "global_step": 412540, "epoch": 2455} {"train_loss": -12.229708671569824, "global_step": 412541, "epoch": 2455} {"train_loss": -12.563617706298828, "global_step": 412542, "epoch": 2455} {"train_loss": -12.282129287719727, "global_step": 412543, "epoch": 2455} {"train_loss": -12.60665225982666, "global_step": 412544, "epoch": 2455} {"train_loss": -12.390308380126953, "global_step": 412545, "epoch": 2455} {"train_loss": -12.419304847717285, "global_step": 412546, "epoch": 2455} {"train_loss": -12.454034805297852, "global_step": 412547, "epoch": 2455} {"train_loss": -12.300141334533691, "global_step": 412548, "epoch": 2455} {"train_loss": -12.154544830322266, "global_step": 412549, "epoch": 2455} {"train_loss": -12.506479263305664, "global_step": 412550, "epoch": 2455} {"train_loss": -12.139508247375488, "global_step": 412551, "epoch": 2455} {"train_loss": -12.450983047485352, "global_step": 412552, "epoch": 2455} {"train_loss": -12.496505737304688, "global_step": 412553, "epoch": 2455} {"train_loss": -11.617534637451172, "global_step": 412554, "epoch": 2455} {"train_loss": -11.508621215820312, "global_step": 412555, "epoch": 2455} {"train_loss": -12.217716217041016, "global_step": 412556, "epoch": 2455} {"train_loss": -12.075216293334961, "global_step": 412557, "epoch": 2455} {"train_loss": -12.387982368469238, "global_step": 412558, "epoch": 2455} {"train_loss": -12.306891441345215, "global_step": 412559, "epoch": 2455} {"train_loss": -12.558208465576172, "global_step": 412560, "epoch": 2455} {"train_loss": -12.16451644897461, "global_step": 412561, "epoch": 2455} {"train_loss": -12.466221809387207, "global_step": 412562, "epoch": 2455} {"train_loss": -12.593914031982422, "global_step": 412563, "epoch": 2455} {"train_loss": -12.291955947875977, "global_step": 412564, "epoch": 2455} {"train_loss": -12.4708251953125, "global_step": 412565, "epoch": 2455} {"train_loss": -12.489646911621094, "global_step": 412566, "epoch": 2455} {"train_loss": -12.121910095214844, "global_step": 412567, "epoch": 2455} {"train_loss": -12.655084609985352, "global_step": 412568, "epoch": 2455} {"train_loss": -12.678256034851074, "global_step": 412569, "epoch": 2455} {"train_loss": -12.037004470825195, "global_step": 412570, "epoch": 2455} {"train_loss": -12.312690734863281, "global_step": 412571, "epoch": 2455} {"train_loss": -12.462187767028809, "global_step": 412572, "epoch": 2455} {"train_loss": -12.376378059387207, "global_step": 412573, "epoch": 2455} {"train_loss": -12.542556762695312, "global_step": 412574, "epoch": 2455} {"train_loss": -12.42910385131836, "global_step": 412575, "epoch": 2455} {"train_loss": -12.567357063293457, "global_step": 412576, "epoch": 2455} {"train_loss": -12.509977340698242, "global_step": 412577, "epoch": 2455} {"train_loss": -12.652144432067871, "global_step": 412578, "epoch": 2455} {"train_loss": -12.226988792419434, "global_step": 412579, "epoch": 2455} {"train_loss": -12.474004745483398, "global_step": 412580, "epoch": 2455} {"train_loss": -12.036663055419922, "global_step": 412581, "epoch": 2455} {"train_loss": -12.087841033935547, "global_step": 412582, "epoch": 2455} {"train_loss": -12.401077270507812, "global_step": 412583, "epoch": 2455} {"train_loss": -12.425643920898438, "global_step": 412584, "epoch": 2455} {"train_loss": -12.43148136138916, "global_step": 412585, "epoch": 2455} {"train_loss": -12.544656753540039, "global_step": 412586, "epoch": 2455} {"train_loss": -12.173458099365234, "global_step": 412587, "epoch": 2455} {"train_loss": -12.524454116821289, "global_step": 412588, "epoch": 2455} {"train_loss": -12.372346878051758, "global_step": 412589, "epoch": 2455} {"train_loss": -12.454729080200195, "global_step": 412590, "epoch": 2455} {"train_loss": -12.41093635559082, "global_step": 412591, "epoch": 2455} {"train_loss": -12.310806274414062, "global_step": 412592, "epoch": 2455} {"train_loss": -12.32742691040039, "global_step": 412593, "epoch": 2455} {"train_loss": -12.636223793029785, "global_step": 412594, "epoch": 2455} {"train_loss": -12.526199340820312, "global_step": 412595, "epoch": 2455} {"train_loss": -12.195089340209961, "global_step": 412596, "epoch": 2455} {"train_loss": -12.217029571533203, "global_step": 412597, "epoch": 2455} {"train_loss": -12.34416389465332, "global_step": 412598, "epoch": 2455} {"train_loss": -10.67724895477295, "global_step": 412599, "epoch": 2455} {"train_loss": -11.516846656799316, "global_step": 412600, "epoch": 2455} {"train_loss": -12.301673889160156, "global_step": 412601, "epoch": 2455} {"train_loss": -11.784782409667969, "global_step": 412602, "epoch": 2455} {"train_loss": -12.272223472595215, "global_step": 412603, "epoch": 2455} {"train_loss": -12.47821044921875, "global_step": 412604, "epoch": 2455} {"train_loss": -12.443836212158203, "global_step": 412605, "epoch": 2455} {"train_loss": -12.428553581237793, "global_step": 412606, "epoch": 2455} {"train_loss": -11.540377494834718, "global_step": 412607, "epoch": 2455, "val_loss": 305308.59375, "train_action_mse_error": 2.475191116333008} {"train_loss": -12.374870300292969, "global_step": 412608, "epoch": 2456} {"train_loss": -12.429641723632812, "global_step": 412609, "epoch": 2456} {"train_loss": -12.462845802307129, "global_step": 412610, "epoch": 2456} {"train_loss": -12.10100269317627, "global_step": 412611, "epoch": 2456} {"train_loss": -10.857410430908203, "global_step": 412612, "epoch": 2456} {"train_loss": -11.550172805786133, "global_step": 412613, "epoch": 2456} {"train_loss": -11.529394149780273, "global_step": 412614, "epoch": 2456} {"train_loss": -9.900125503540039, "global_step": 412615, "epoch": 2456} {"train_loss": -10.01767349243164, "global_step": 412616, "epoch": 2456} {"train_loss": -11.480949401855469, "global_step": 412617, "epoch": 2456} {"train_loss": -11.057968139648438, "global_step": 412618, "epoch": 2456} {"train_loss": -11.63811206817627, "global_step": 412619, "epoch": 2456} {"train_loss": -11.075538635253906, "global_step": 412620, "epoch": 2456} {"train_loss": -12.145454406738281, "global_step": 412621, "epoch": 2456} {"train_loss": -11.623103141784668, "global_step": 412622, "epoch": 2456} {"train_loss": -11.368915557861328, "global_step": 412623, "epoch": 2456} {"train_loss": -10.85862922668457, "global_step": 412624, "epoch": 2456} {"train_loss": -11.309476852416992, "global_step": 412625, "epoch": 2456} {"train_loss": -10.917802810668945, "global_step": 412626, "epoch": 2456} {"train_loss": -10.820594787597656, "global_step": 412627, "epoch": 2456} {"train_loss": -11.47171401977539, "global_step": 412628, "epoch": 2456} {"train_loss": -11.375675201416016, "global_step": 412629, "epoch": 2456} {"train_loss": -10.444581985473633, "global_step": 412630, "epoch": 2456} {"train_loss": -11.687398910522461, "global_step": 412631, "epoch": 2456} {"train_loss": -10.874914169311523, "global_step": 412632, "epoch": 2456} {"train_loss": -10.710691452026367, "global_step": 412633, "epoch": 2456} {"train_loss": -11.385456085205078, "global_step": 412634, "epoch": 2456} {"train_loss": -10.818904876708984, "global_step": 412635, "epoch": 2456} {"train_loss": -11.71082592010498, "global_step": 412636, "epoch": 2456} {"train_loss": -11.08598518371582, "global_step": 412637, "epoch": 2456} {"train_loss": -11.981959342956543, "global_step": 412638, "epoch": 2456} {"train_loss": -10.416723251342773, "global_step": 412639, "epoch": 2456} {"train_loss": -11.842750549316406, "global_step": 412640, "epoch": 2456} {"train_loss": -10.767187118530273, "global_step": 412641, "epoch": 2456} {"train_loss": -10.365400314331055, "global_step": 412642, "epoch": 2456} {"train_loss": -11.64177131652832, "global_step": 412643, "epoch": 2456} {"train_loss": -10.708967208862305, "global_step": 412644, "epoch": 2456} {"train_loss": -10.458511352539062, "global_step": 412645, "epoch": 2456} {"train_loss": -10.494573593139648, "global_step": 412646, "epoch": 2456} {"train_loss": -9.438241958618164, "global_step": 412647, "epoch": 2456} {"train_loss": -11.725698471069336, "global_step": 412648, "epoch": 2456} {"train_loss": -10.110735893249512, "global_step": 412649, "epoch": 2456} {"train_loss": -11.19922161102295, "global_step": 412650, "epoch": 2456} {"train_loss": -11.000299453735352, "global_step": 412651, "epoch": 2456} {"train_loss": -10.915618896484375, "global_step": 412652, "epoch": 2456} {"train_loss": -10.902405738830566, "global_step": 412653, "epoch": 2456} {"train_loss": -11.85025405883789, "global_step": 412654, "epoch": 2456} {"train_loss": -10.82851791381836, "global_step": 412655, "epoch": 2456} {"train_loss": -11.496907234191895, "global_step": 412656, "epoch": 2456} {"train_loss": -11.46174144744873, "global_step": 412657, "epoch": 2456} {"train_loss": -11.44775390625, "global_step": 412658, "epoch": 2456} {"train_loss": -11.64107894897461, "global_step": 412659, "epoch": 2456} {"train_loss": -11.962531089782715, "global_step": 412660, "epoch": 2456} {"train_loss": -11.543871879577637, "global_step": 412661, "epoch": 2456} {"train_loss": -11.831281661987305, "global_step": 412662, "epoch": 2456} {"train_loss": -11.819107055664062, "global_step": 412663, "epoch": 2456} {"train_loss": -11.976266860961914, "global_step": 412664, "epoch": 2456} {"train_loss": -12.214104652404785, "global_step": 412665, "epoch": 2456} {"train_loss": -12.230344772338867, "global_step": 412666, "epoch": 2456} {"train_loss": -12.020421028137207, "global_step": 412667, "epoch": 2456} {"train_loss": -12.186446189880371, "global_step": 412668, "epoch": 2456} {"train_loss": -12.02164077758789, "global_step": 412669, "epoch": 2456} {"train_loss": -12.411431312561035, "global_step": 412670, "epoch": 2456} {"train_loss": -12.51318359375, "global_step": 412671, "epoch": 2456} {"train_loss": -12.14393138885498, "global_step": 412672, "epoch": 2456} {"train_loss": -12.407376289367676, "global_step": 412673, "epoch": 2456} {"train_loss": -12.188766479492188, "global_step": 412674, "epoch": 2456} {"train_loss": -12.432727813720703, "global_step": 412675, "epoch": 2456} {"train_loss": -12.155479431152344, "global_step": 412676, "epoch": 2456} {"train_loss": -12.493335723876953, "global_step": 412677, "epoch": 2456} {"train_loss": -12.0990571975708, "global_step": 412678, "epoch": 2456} {"train_loss": -12.494770050048828, "global_step": 412679, "epoch": 2456} {"train_loss": -12.315482139587402, "global_step": 412680, "epoch": 2456} {"train_loss": -12.480317115783691, "global_step": 412681, "epoch": 2456} {"train_loss": -12.055889129638672, "global_step": 412682, "epoch": 2456} {"train_loss": -12.090728759765625, "global_step": 412683, "epoch": 2456} {"train_loss": -12.493953704833984, "global_step": 412684, "epoch": 2456} {"train_loss": -12.10359001159668, "global_step": 412685, "epoch": 2456} {"train_loss": -12.21674919128418, "global_step": 412686, "epoch": 2456} {"train_loss": -12.518396377563477, "global_step": 412687, "epoch": 2456} {"train_loss": -12.551294326782227, "global_step": 412688, "epoch": 2456} {"train_loss": -12.434743881225586, "global_step": 412689, "epoch": 2456} {"train_loss": -12.084701538085938, "global_step": 412690, "epoch": 2456} {"train_loss": -12.1248779296875, "global_step": 412691, "epoch": 2456} {"train_loss": -12.451108932495117, "global_step": 412692, "epoch": 2456} {"train_loss": -12.080421447753906, "global_step": 412693, "epoch": 2456} {"train_loss": -12.238542556762695, "global_step": 412694, "epoch": 2456} {"train_loss": -12.02199935913086, "global_step": 412695, "epoch": 2456} {"train_loss": -11.723957061767578, "global_step": 412696, "epoch": 2456} {"train_loss": -12.44906234741211, "global_step": 412697, "epoch": 2456} {"train_loss": -12.018977165222168, "global_step": 412698, "epoch": 2456} {"train_loss": -12.079298973083496, "global_step": 412699, "epoch": 2456} {"train_loss": -12.33488655090332, "global_step": 412700, "epoch": 2456} {"train_loss": -12.23908805847168, "global_step": 412701, "epoch": 2456} {"train_loss": -12.290000915527344, "global_step": 412702, "epoch": 2456} {"train_loss": -12.406564712524414, "global_step": 412703, "epoch": 2456} {"train_loss": -12.17514419555664, "global_step": 412704, "epoch": 2456} {"train_loss": -12.179475784301758, "global_step": 412705, "epoch": 2456} {"train_loss": -12.526910781860352, "global_step": 412706, "epoch": 2456} {"train_loss": -12.482479095458984, "global_step": 412707, "epoch": 2456} {"train_loss": -12.639913558959961, "global_step": 412708, "epoch": 2456} {"train_loss": -12.230681419372559, "global_step": 412709, "epoch": 2456} {"train_loss": -12.578160285949707, "global_step": 412710, "epoch": 2456} {"train_loss": -12.263261795043945, "global_step": 412711, "epoch": 2456} {"train_loss": -12.601400375366211, "global_step": 412712, "epoch": 2456} {"train_loss": -12.583364486694336, "global_step": 412713, "epoch": 2456} {"train_loss": -12.239583969116211, "global_step": 412714, "epoch": 2456} {"train_loss": -12.485936164855957, "global_step": 412715, "epoch": 2456} {"train_loss": -12.429655075073242, "global_step": 412716, "epoch": 2456} {"train_loss": -12.600339889526367, "global_step": 412717, "epoch": 2456} {"train_loss": -12.135797500610352, "global_step": 412718, "epoch": 2456} {"train_loss": -12.340676307678223, "global_step": 412719, "epoch": 2456} {"train_loss": -11.883440017700195, "global_step": 412720, "epoch": 2456} {"train_loss": -11.901734352111816, "global_step": 412721, "epoch": 2456} {"train_loss": -12.210699081420898, "global_step": 412722, "epoch": 2456} {"train_loss": -11.974584579467773, "global_step": 412723, "epoch": 2456} {"train_loss": -11.946224212646484, "global_step": 412724, "epoch": 2456} {"train_loss": -11.97559928894043, "global_step": 412725, "epoch": 2456} {"train_loss": -11.329263687133789, "global_step": 412726, "epoch": 2456} {"train_loss": -11.760552406311035, "global_step": 412727, "epoch": 2456} {"train_loss": -12.098426818847656, "global_step": 412728, "epoch": 2456} {"train_loss": -11.017452239990234, "global_step": 412729, "epoch": 2456} {"train_loss": -11.425675392150879, "global_step": 412730, "epoch": 2456} {"train_loss": -11.98931884765625, "global_step": 412731, "epoch": 2456} {"train_loss": -12.240235328674316, "global_step": 412732, "epoch": 2456} {"train_loss": -11.572978019714355, "global_step": 412733, "epoch": 2456} {"train_loss": -12.569509506225586, "global_step": 412734, "epoch": 2456} {"train_loss": -11.452630996704102, "global_step": 412735, "epoch": 2456} {"train_loss": -12.187470436096191, "global_step": 412736, "epoch": 2456} {"train_loss": -12.241497039794922, "global_step": 412737, "epoch": 2456} {"train_loss": -11.48181438446045, "global_step": 412738, "epoch": 2456} {"train_loss": -11.83051586151123, "global_step": 412739, "epoch": 2456} {"train_loss": -12.458253860473633, "global_step": 412740, "epoch": 2456} {"train_loss": -11.372299194335938, "global_step": 412741, "epoch": 2456} {"train_loss": -12.27329158782959, "global_step": 412742, "epoch": 2456} {"train_loss": -11.838361740112305, "global_step": 412743, "epoch": 2456} {"train_loss": -10.398537635803223, "global_step": 412744, "epoch": 2456} {"train_loss": -12.186481475830078, "global_step": 412745, "epoch": 2456} {"train_loss": -10.49392318725586, "global_step": 412746, "epoch": 2456} {"train_loss": -11.804986953735352, "global_step": 412747, "epoch": 2456} {"train_loss": -10.56456470489502, "global_step": 412748, "epoch": 2456} {"train_loss": -11.508903503417969, "global_step": 412749, "epoch": 2456} {"train_loss": -11.628418922424316, "global_step": 412750, "epoch": 2456} {"train_loss": -11.381233215332031, "global_step": 412751, "epoch": 2456} {"train_loss": -11.98574447631836, "global_step": 412752, "epoch": 2456} {"train_loss": -11.011988639831543, "global_step": 412753, "epoch": 2456} {"train_loss": -11.439483642578125, "global_step": 412754, "epoch": 2456} {"train_loss": -11.142230987548828, "global_step": 412755, "epoch": 2456} {"train_loss": -11.897029876708984, "global_step": 412756, "epoch": 2456} {"train_loss": -10.861770629882812, "global_step": 412757, "epoch": 2456} {"train_loss": -12.267961502075195, "global_step": 412758, "epoch": 2456} {"train_loss": -11.627861022949219, "global_step": 412759, "epoch": 2456} {"train_loss": -11.707405090332031, "global_step": 412760, "epoch": 2456} {"train_loss": -12.578530311584473, "global_step": 412761, "epoch": 2456} {"train_loss": -11.038970947265625, "global_step": 412762, "epoch": 2456} {"train_loss": -11.763843536376953, "global_step": 412763, "epoch": 2456} {"train_loss": -11.913497924804688, "global_step": 412764, "epoch": 2456} {"train_loss": -11.476301193237305, "global_step": 412765, "epoch": 2456} {"train_loss": -11.890884399414062, "global_step": 412766, "epoch": 2456} {"train_loss": -10.360922813415527, "global_step": 412767, "epoch": 2456} {"train_loss": -10.324554443359375, "global_step": 412768, "epoch": 2456} {"train_loss": -10.87343692779541, "global_step": 412769, "epoch": 2456} {"train_loss": -11.992449760437012, "global_step": 412770, "epoch": 2456} {"train_loss": -10.586755752563477, "global_step": 412771, "epoch": 2456} {"train_loss": -10.192940711975098, "global_step": 412772, "epoch": 2456} {"train_loss": -11.91134262084961, "global_step": 412773, "epoch": 2456} {"train_loss": -10.571523666381836, "global_step": 412774, "epoch": 2456} {"train_loss": -11.688198095276242, "global_step": 412775, "epoch": 2456, "val_loss": 305118.625} {"train_loss": -10.737419128417969, "global_step": 412776, "epoch": 2457} {"train_loss": -11.61099624633789, "global_step": 412777, "epoch": 2457} {"train_loss": -10.141258239746094, "global_step": 412778, "epoch": 2457} {"train_loss": -10.413057327270508, "global_step": 412779, "epoch": 2457} {"train_loss": -10.914957046508789, "global_step": 412780, "epoch": 2457} {"train_loss": -10.666947364807129, "global_step": 412781, "epoch": 2457} {"train_loss": -11.170500755310059, "global_step": 412782, "epoch": 2457} {"train_loss": -10.542433738708496, "global_step": 412783, "epoch": 2457} {"train_loss": -10.37033462524414, "global_step": 412784, "epoch": 2457} {"train_loss": -11.325343132019043, "global_step": 412785, "epoch": 2457} {"train_loss": -11.655704498291016, "global_step": 412786, "epoch": 2457} {"train_loss": -11.166826248168945, "global_step": 412787, "epoch": 2457} {"train_loss": -11.643436431884766, "global_step": 412788, "epoch": 2457} {"train_loss": -11.766569137573242, "global_step": 412789, "epoch": 2457} {"train_loss": -11.123921394348145, "global_step": 412790, "epoch": 2457} {"train_loss": -12.095464706420898, "global_step": 412791, "epoch": 2457} {"train_loss": -11.977862358093262, "global_step": 412792, "epoch": 2457} {"train_loss": -10.902583122253418, "global_step": 412793, "epoch": 2457} {"train_loss": -12.302356719970703, "global_step": 412794, "epoch": 2457} {"train_loss": -11.284278869628906, "global_step": 412795, "epoch": 2457} {"train_loss": -11.632217407226562, "global_step": 412796, "epoch": 2457} {"train_loss": -12.300363540649414, "global_step": 412797, "epoch": 2457} {"train_loss": -11.842558860778809, "global_step": 412798, "epoch": 2457} {"train_loss": -12.007930755615234, "global_step": 412799, "epoch": 2457} {"train_loss": -12.39399528503418, "global_step": 412800, "epoch": 2457} {"train_loss": -12.112704277038574, "global_step": 412801, "epoch": 2457} {"train_loss": -11.92917537689209, "global_step": 412802, "epoch": 2457} {"train_loss": -12.139406204223633, "global_step": 412803, "epoch": 2457} {"train_loss": -12.387969017028809, "global_step": 412804, "epoch": 2457} {"train_loss": -12.409271240234375, "global_step": 412805, "epoch": 2457} {"train_loss": -12.293729782104492, "global_step": 412806, "epoch": 2457} {"train_loss": -12.299165725708008, "global_step": 412807, "epoch": 2457} {"train_loss": -11.914098739624023, "global_step": 412808, "epoch": 2457} {"train_loss": -12.310198783874512, "global_step": 412809, "epoch": 2457} {"train_loss": -12.236248970031738, "global_step": 412810, "epoch": 2457} {"train_loss": -12.328986167907715, "global_step": 412811, "epoch": 2457} {"train_loss": -12.358820915222168, "global_step": 412812, "epoch": 2457} {"train_loss": -12.313506126403809, "global_step": 412813, "epoch": 2457} {"train_loss": -12.54564094543457, "global_step": 412814, "epoch": 2457} {"train_loss": -12.460668563842773, "global_step": 412815, "epoch": 2457} {"train_loss": -12.23409366607666, "global_step": 412816, "epoch": 2457} {"train_loss": -12.380891799926758, "global_step": 412817, "epoch": 2457} {"train_loss": -12.473068237304688, "global_step": 412818, "epoch": 2457} {"train_loss": -12.335429191589355, "global_step": 412819, "epoch": 2457} {"train_loss": -12.244155883789062, "global_step": 412820, "epoch": 2457} {"train_loss": -12.56180191040039, "global_step": 412821, "epoch": 2457} {"train_loss": -12.426412582397461, "global_step": 412822, "epoch": 2457} {"train_loss": -12.462239265441895, "global_step": 412823, "epoch": 2457} {"train_loss": -12.31979751586914, "global_step": 412824, "epoch": 2457} {"train_loss": -12.455683708190918, "global_step": 412825, "epoch": 2457} {"train_loss": -12.461648941040039, "global_step": 412826, "epoch": 2457} {"train_loss": -12.551419258117676, "global_step": 412827, "epoch": 2457} {"train_loss": -12.575563430786133, "global_step": 412828, "epoch": 2457} {"train_loss": -12.459331512451172, "global_step": 412829, "epoch": 2457} {"train_loss": -12.489238739013672, "global_step": 412830, "epoch": 2457} {"train_loss": -12.642782211303711, "global_step": 412831, "epoch": 2457} {"train_loss": -12.502801895141602, "global_step": 412832, "epoch": 2457} {"train_loss": -12.594841003417969, "global_step": 412833, "epoch": 2457} {"train_loss": -12.49285888671875, "global_step": 412834, "epoch": 2457} {"train_loss": -12.795015335083008, "global_step": 412835, "epoch": 2457} {"train_loss": -12.74754810333252, "global_step": 412836, "epoch": 2457} {"train_loss": -12.755884170532227, "global_step": 412837, "epoch": 2457} {"train_loss": -12.585429191589355, "global_step": 412838, "epoch": 2457} {"train_loss": -12.745054244995117, "global_step": 412839, "epoch": 2457} {"train_loss": -12.58067798614502, "global_step": 412840, "epoch": 2457} {"train_loss": -12.736454963684082, "global_step": 412841, "epoch": 2457} {"train_loss": -12.540952682495117, "global_step": 412842, "epoch": 2457} {"train_loss": -12.484790802001953, "global_step": 412843, "epoch": 2457} {"train_loss": -12.35038948059082, "global_step": 412844, "epoch": 2457} {"train_loss": -12.828189849853516, "global_step": 412845, "epoch": 2457} {"train_loss": -12.549169540405273, "global_step": 412846, "epoch": 2457} {"train_loss": -12.557404518127441, "global_step": 412847, "epoch": 2457} {"train_loss": -12.304344177246094, "global_step": 412848, "epoch": 2457} {"train_loss": -12.503591537475586, "global_step": 412849, "epoch": 2457} {"train_loss": -12.531235694885254, "global_step": 412850, "epoch": 2457} {"train_loss": -12.721488952636719, "global_step": 412851, "epoch": 2457} {"train_loss": -12.787120819091797, "global_step": 412852, "epoch": 2457} {"train_loss": -12.620268821716309, "global_step": 412853, "epoch": 2457} {"train_loss": -12.85434341430664, "global_step": 412854, "epoch": 2457} {"train_loss": -12.625506401062012, "global_step": 412855, "epoch": 2457} {"train_loss": -12.579423904418945, "global_step": 412856, "epoch": 2457} {"train_loss": -12.455121040344238, "global_step": 412857, "epoch": 2457} {"train_loss": -12.500913619995117, "global_step": 412858, "epoch": 2457} {"train_loss": -12.701089859008789, "global_step": 412859, "epoch": 2457} {"train_loss": -12.71843147277832, "global_step": 412860, "epoch": 2457} {"train_loss": -12.57569408416748, "global_step": 412861, "epoch": 2457} {"train_loss": -11.802717208862305, "global_step": 412862, "epoch": 2457} {"train_loss": -12.500569343566895, "global_step": 412863, "epoch": 2457} {"train_loss": -12.103984832763672, "global_step": 412864, "epoch": 2457} {"train_loss": -11.583970069885254, "global_step": 412865, "epoch": 2457} {"train_loss": -10.775873184204102, "global_step": 412866, "epoch": 2457} {"train_loss": -12.519359588623047, "global_step": 412867, "epoch": 2457} {"train_loss": -10.04439926147461, "global_step": 412868, "epoch": 2457} {"train_loss": -10.542202949523926, "global_step": 412869, "epoch": 2457} {"train_loss": -10.976472854614258, "global_step": 412870, "epoch": 2457} {"train_loss": -11.904099464416504, "global_step": 412871, "epoch": 2457} {"train_loss": -11.289468765258789, "global_step": 412872, "epoch": 2457} {"train_loss": -11.966121673583984, "global_step": 412873, "epoch": 2457} {"train_loss": -11.872676849365234, "global_step": 412874, "epoch": 2457} {"train_loss": -11.321060180664062, "global_step": 412875, "epoch": 2457} {"train_loss": -10.703935623168945, "global_step": 412876, "epoch": 2457} {"train_loss": -11.967340469360352, "global_step": 412877, "epoch": 2457} {"train_loss": -12.063727378845215, "global_step": 412878, "epoch": 2457} {"train_loss": -11.29227066040039, "global_step": 412879, "epoch": 2457} {"train_loss": -12.306828498840332, "global_step": 412880, "epoch": 2457} {"train_loss": -11.476001739501953, "global_step": 412881, "epoch": 2457} {"train_loss": -11.048912048339844, "global_step": 412882, "epoch": 2457} {"train_loss": -12.20060920715332, "global_step": 412883, "epoch": 2457} {"train_loss": -11.358057022094727, "global_step": 412884, "epoch": 2457} {"train_loss": -10.977163314819336, "global_step": 412885, "epoch": 2457} {"train_loss": -11.773360252380371, "global_step": 412886, "epoch": 2457} {"train_loss": -11.946840286254883, "global_step": 412887, "epoch": 2457} {"train_loss": -11.31844711303711, "global_step": 412888, "epoch": 2457} {"train_loss": -12.073143005371094, "global_step": 412889, "epoch": 2457} {"train_loss": -11.189200401306152, "global_step": 412890, "epoch": 2457} {"train_loss": -12.422086715698242, "global_step": 412891, "epoch": 2457} {"train_loss": -11.705107688903809, "global_step": 412892, "epoch": 2457} {"train_loss": -12.02181625366211, "global_step": 412893, "epoch": 2457} {"train_loss": -11.802190780639648, "global_step": 412894, "epoch": 2457} {"train_loss": -11.86201000213623, "global_step": 412895, "epoch": 2457} {"train_loss": -11.251324653625488, "global_step": 412896, "epoch": 2457} {"train_loss": -11.436773300170898, "global_step": 412897, "epoch": 2457} {"train_loss": -11.21474838256836, "global_step": 412898, "epoch": 2457} {"train_loss": -11.783376693725586, "global_step": 412899, "epoch": 2457} {"train_loss": -11.195785522460938, "global_step": 412900, "epoch": 2457} {"train_loss": -11.692605972290039, "global_step": 412901, "epoch": 2457} {"train_loss": -11.258506774902344, "global_step": 412902, "epoch": 2457} {"train_loss": -11.744314193725586, "global_step": 412903, "epoch": 2457} {"train_loss": -11.706279754638672, "global_step": 412904, "epoch": 2457} {"train_loss": -11.201009750366211, "global_step": 412905, "epoch": 2457} {"train_loss": -12.49618148803711, "global_step": 412906, "epoch": 2457} {"train_loss": -11.590579986572266, "global_step": 412907, "epoch": 2457} {"train_loss": -12.173710823059082, "global_step": 412908, "epoch": 2457} {"train_loss": -11.735538482666016, "global_step": 412909, "epoch": 2457} {"train_loss": -11.650861740112305, "global_step": 412910, "epoch": 2457} {"train_loss": -11.990625381469727, "global_step": 412911, "epoch": 2457} {"train_loss": -11.55355453491211, "global_step": 412912, "epoch": 2457} {"train_loss": -12.579387664794922, "global_step": 412913, "epoch": 2457} {"train_loss": -11.261027336120605, "global_step": 412914, "epoch": 2457} {"train_loss": -11.89280891418457, "global_step": 412915, "epoch": 2457} {"train_loss": -11.81816577911377, "global_step": 412916, "epoch": 2457} {"train_loss": -12.133795738220215, "global_step": 412917, "epoch": 2457} {"train_loss": -12.036319732666016, "global_step": 412918, "epoch": 2457} {"train_loss": -12.313813209533691, "global_step": 412919, "epoch": 2457} {"train_loss": -12.315003395080566, "global_step": 412920, "epoch": 2457} {"train_loss": -12.044671058654785, "global_step": 412921, "epoch": 2457} {"train_loss": -12.141441345214844, "global_step": 412922, "epoch": 2457} {"train_loss": -12.508331298828125, "global_step": 412923, "epoch": 2457} {"train_loss": -12.080577850341797, "global_step": 412924, "epoch": 2457} {"train_loss": -12.107063293457031, "global_step": 412925, "epoch": 2457} {"train_loss": -12.063376426696777, "global_step": 412926, "epoch": 2457} {"train_loss": -12.311017990112305, "global_step": 412927, "epoch": 2457} {"train_loss": -12.150547981262207, "global_step": 412928, "epoch": 2457} {"train_loss": -12.170392990112305, "global_step": 412929, "epoch": 2457} {"train_loss": -12.316507339477539, "global_step": 412930, "epoch": 2457} {"train_loss": -11.933778762817383, "global_step": 412931, "epoch": 2457} {"train_loss": -12.241987228393555, "global_step": 412932, "epoch": 2457} {"train_loss": -12.610860824584961, "global_step": 412933, "epoch": 2457} {"train_loss": -11.856582641601562, "global_step": 412934, "epoch": 2457} {"train_loss": -12.39358139038086, "global_step": 412935, "epoch": 2457} {"train_loss": -12.35593032836914, "global_step": 412936, "epoch": 2457} {"train_loss": -12.155311584472656, "global_step": 412937, "epoch": 2457} {"train_loss": -12.44900894165039, "global_step": 412938, "epoch": 2457} {"train_loss": -12.10684585571289, "global_step": 412939, "epoch": 2457} {"train_loss": -12.458351135253906, "global_step": 412940, "epoch": 2457} {"train_loss": -12.174715042114258, "global_step": 412941, "epoch": 2457} {"train_loss": -12.353870391845703, "global_step": 412942, "epoch": 2457} {"train_loss": -11.99767055397942, "global_step": 412943, "epoch": 2457, "val_loss": 305855.28125} {"train_loss": -12.382692337036133, "global_step": 412944, "epoch": 2458} {"train_loss": -12.295141220092773, "global_step": 412945, "epoch": 2458} {"train_loss": -12.495101928710938, "global_step": 412946, "epoch": 2458} {"train_loss": -12.217772483825684, "global_step": 412947, "epoch": 2458} {"train_loss": -12.049521446228027, "global_step": 412948, "epoch": 2458} {"train_loss": -12.140778541564941, "global_step": 412949, "epoch": 2458} {"train_loss": -11.974769592285156, "global_step": 412950, "epoch": 2458} {"train_loss": -11.895440101623535, "global_step": 412951, "epoch": 2458} {"train_loss": -12.502580642700195, "global_step": 412952, "epoch": 2458} {"train_loss": -11.657114028930664, "global_step": 412953, "epoch": 2458} {"train_loss": -12.043632507324219, "global_step": 412954, "epoch": 2458} {"train_loss": -12.250242233276367, "global_step": 412955, "epoch": 2458} {"train_loss": -12.208800315856934, "global_step": 412956, "epoch": 2458} {"train_loss": -12.454054832458496, "global_step": 412957, "epoch": 2458} {"train_loss": -12.175907135009766, "global_step": 412958, "epoch": 2458} {"train_loss": -12.141680717468262, "global_step": 412959, "epoch": 2458} {"train_loss": -12.137681007385254, "global_step": 412960, "epoch": 2458} {"train_loss": -12.467981338500977, "global_step": 412961, "epoch": 2458} {"train_loss": -12.233086585998535, "global_step": 412962, "epoch": 2458} {"train_loss": -12.603065490722656, "global_step": 412963, "epoch": 2458} {"train_loss": -12.472614288330078, "global_step": 412964, "epoch": 2458} {"train_loss": -12.496025085449219, "global_step": 412965, "epoch": 2458} {"train_loss": -12.346823692321777, "global_step": 412966, "epoch": 2458} {"train_loss": -12.528155326843262, "global_step": 412967, "epoch": 2458} {"train_loss": -12.493539810180664, "global_step": 412968, "epoch": 2458} {"train_loss": -12.361272811889648, "global_step": 412969, "epoch": 2458} {"train_loss": -12.454765319824219, "global_step": 412970, "epoch": 2458} {"train_loss": -12.513603210449219, "global_step": 412971, "epoch": 2458} {"train_loss": -12.35216999053955, "global_step": 412972, "epoch": 2458} {"train_loss": -12.355621337890625, "global_step": 412973, "epoch": 2458} {"train_loss": -12.273458480834961, "global_step": 412974, "epoch": 2458} {"train_loss": -12.660871505737305, "global_step": 412975, "epoch": 2458} {"train_loss": -12.557483673095703, "global_step": 412976, "epoch": 2458} {"train_loss": -12.132553100585938, "global_step": 412977, "epoch": 2458} {"train_loss": -12.222639083862305, "global_step": 412978, "epoch": 2458} {"train_loss": -12.374120712280273, "global_step": 412979, "epoch": 2458} {"train_loss": -12.087259292602539, "global_step": 412980, "epoch": 2458} {"train_loss": -12.065428733825684, "global_step": 412981, "epoch": 2458} {"train_loss": -12.830129623413086, "global_step": 412982, "epoch": 2458} {"train_loss": -12.343947410583496, "global_step": 412983, "epoch": 2458} {"train_loss": -12.440888404846191, "global_step": 412984, "epoch": 2458} {"train_loss": -12.370345115661621, "global_step": 412985, "epoch": 2458} {"train_loss": -12.748724937438965, "global_step": 412986, "epoch": 2458} {"train_loss": -11.940254211425781, "global_step": 412987, "epoch": 2458} {"train_loss": -12.348648071289062, "global_step": 412988, "epoch": 2458} {"train_loss": -12.651874542236328, "global_step": 412989, "epoch": 2458} {"train_loss": -12.831659317016602, "global_step": 412990, "epoch": 2458} {"train_loss": -12.567699432373047, "global_step": 412991, "epoch": 2458} {"train_loss": -12.447500228881836, "global_step": 412992, "epoch": 2458} {"train_loss": -12.734766006469727, "global_step": 412993, "epoch": 2458} {"train_loss": -12.631795883178711, "global_step": 412994, "epoch": 2458} {"train_loss": -12.35774040222168, "global_step": 412995, "epoch": 2458} {"train_loss": -12.110639572143555, "global_step": 412996, "epoch": 2458} {"train_loss": -12.773717880249023, "global_step": 412997, "epoch": 2458} {"train_loss": -12.619522094726562, "global_step": 412998, "epoch": 2458} {"train_loss": -12.756683349609375, "global_step": 412999, "epoch": 2458} {"train_loss": -12.600292205810547, "global_step": 413000, "epoch": 2458} {"train_loss": -12.592574119567871, "global_step": 413001, "epoch": 2458} {"train_loss": -12.598258972167969, "global_step": 413002, "epoch": 2458} {"train_loss": -12.807474136352539, "global_step": 413003, "epoch": 2458} {"train_loss": -12.706169128417969, "global_step": 413004, "epoch": 2458} {"train_loss": -12.775192260742188, "global_step": 413005, "epoch": 2458} {"train_loss": -12.662501335144043, "global_step": 413006, "epoch": 2458} {"train_loss": -12.50556755065918, "global_step": 413007, "epoch": 2458} {"train_loss": -12.73088550567627, "global_step": 413008, "epoch": 2458} {"train_loss": -12.683721542358398, "global_step": 413009, "epoch": 2458} {"train_loss": -12.67081069946289, "global_step": 413010, "epoch": 2458} {"train_loss": -12.639608383178711, "global_step": 413011, "epoch": 2458} {"train_loss": -12.857294082641602, "global_step": 413012, "epoch": 2458} {"train_loss": -12.83564281463623, "global_step": 413013, "epoch": 2458} {"train_loss": -12.111879348754883, "global_step": 413014, "epoch": 2458} {"train_loss": -11.943538665771484, "global_step": 413015, "epoch": 2458} {"train_loss": -11.899869918823242, "global_step": 413016, "epoch": 2458} {"train_loss": -12.069328308105469, "global_step": 413017, "epoch": 2458} {"train_loss": -12.235563278198242, "global_step": 413018, "epoch": 2458} {"train_loss": -11.896768569946289, "global_step": 413019, "epoch": 2458} {"train_loss": -11.286542892456055, "global_step": 413020, "epoch": 2458} {"train_loss": -11.962118148803711, "global_step": 413021, "epoch": 2458} {"train_loss": -11.846972465515137, "global_step": 413022, "epoch": 2458} {"train_loss": -11.034483909606934, "global_step": 413023, "epoch": 2458} {"train_loss": -10.913070678710938, "global_step": 413024, "epoch": 2458} {"train_loss": -10.017261505126953, "global_step": 413025, "epoch": 2458} {"train_loss": -10.1686429977417, "global_step": 413026, "epoch": 2458} {"train_loss": -8.948784828186035, "global_step": 413027, "epoch": 2458} {"train_loss": -10.246192932128906, "global_step": 413028, "epoch": 2458} {"train_loss": -11.014425277709961, "global_step": 413029, "epoch": 2458} {"train_loss": -10.085603713989258, "global_step": 413030, "epoch": 2458} {"train_loss": -9.71026611328125, "global_step": 413031, "epoch": 2458} {"train_loss": -11.759954452514648, "global_step": 413032, "epoch": 2458} {"train_loss": -10.670652389526367, "global_step": 413033, "epoch": 2458} {"train_loss": -10.374342918395996, "global_step": 413034, "epoch": 2458} {"train_loss": -9.8562650680542, "global_step": 413035, "epoch": 2458} {"train_loss": -11.686897277832031, "global_step": 413036, "epoch": 2458} {"train_loss": -10.536979675292969, "global_step": 413037, "epoch": 2458} {"train_loss": -10.476386070251465, "global_step": 413038, "epoch": 2458} {"train_loss": -10.748953819274902, "global_step": 413039, "epoch": 2458} {"train_loss": -11.441524505615234, "global_step": 413040, "epoch": 2458} {"train_loss": -9.807729721069336, "global_step": 413041, "epoch": 2458} {"train_loss": -11.362107276916504, "global_step": 413042, "epoch": 2458} {"train_loss": -10.492667198181152, "global_step": 413043, "epoch": 2458} {"train_loss": -9.865593910217285, "global_step": 413044, "epoch": 2458} {"train_loss": -11.418562889099121, "global_step": 413045, "epoch": 2458} {"train_loss": -10.47341537475586, "global_step": 413046, "epoch": 2458} {"train_loss": -10.138153076171875, "global_step": 413047, "epoch": 2458} {"train_loss": -10.280023574829102, "global_step": 413048, "epoch": 2458} {"train_loss": -10.981794357299805, "global_step": 413049, "epoch": 2458} {"train_loss": -10.992141723632812, "global_step": 413050, "epoch": 2458} {"train_loss": -11.012859344482422, "global_step": 413051, "epoch": 2458} {"train_loss": -11.177614212036133, "global_step": 413052, "epoch": 2458} {"train_loss": -10.918701171875, "global_step": 413053, "epoch": 2458} {"train_loss": -11.217059135437012, "global_step": 413054, "epoch": 2458} {"train_loss": -10.66305923461914, "global_step": 413055, "epoch": 2458} {"train_loss": -11.347293853759766, "global_step": 413056, "epoch": 2458} {"train_loss": -11.831557273864746, "global_step": 413057, "epoch": 2458} {"train_loss": -10.890146255493164, "global_step": 413058, "epoch": 2458} {"train_loss": -11.51287841796875, "global_step": 413059, "epoch": 2458} {"train_loss": -11.914216995239258, "global_step": 413060, "epoch": 2458} {"train_loss": -11.286170959472656, "global_step": 413061, "epoch": 2458} {"train_loss": -11.67322826385498, "global_step": 413062, "epoch": 2458} {"train_loss": -11.442239761352539, "global_step": 413063, "epoch": 2458} {"train_loss": -11.514283180236816, "global_step": 413064, "epoch": 2458} {"train_loss": -11.70650577545166, "global_step": 413065, "epoch": 2458} {"train_loss": -11.77729320526123, "global_step": 413066, "epoch": 2458} {"train_loss": -11.646530151367188, "global_step": 413067, "epoch": 2458} {"train_loss": -12.280370712280273, "global_step": 413068, "epoch": 2458} {"train_loss": -11.712518692016602, "global_step": 413069, "epoch": 2458} {"train_loss": -11.717280387878418, "global_step": 413070, "epoch": 2458} {"train_loss": -11.928215026855469, "global_step": 413071, "epoch": 2458} {"train_loss": -11.884538650512695, "global_step": 413072, "epoch": 2458} {"train_loss": -12.163623809814453, "global_step": 413073, "epoch": 2458} {"train_loss": -12.282427787780762, "global_step": 413074, "epoch": 2458} {"train_loss": -12.024310111999512, "global_step": 413075, "epoch": 2458} {"train_loss": -12.204242706298828, "global_step": 413076, "epoch": 2458} {"train_loss": -12.250205993652344, "global_step": 413077, "epoch": 2458} {"train_loss": -12.188090324401855, "global_step": 413078, "epoch": 2458} {"train_loss": -12.235847473144531, "global_step": 413079, "epoch": 2458} {"train_loss": -12.34807014465332, "global_step": 413080, "epoch": 2458} {"train_loss": -12.007763862609863, "global_step": 413081, "epoch": 2458} {"train_loss": -12.339544296264648, "global_step": 413082, "epoch": 2458} {"train_loss": -12.45286750793457, "global_step": 413083, "epoch": 2458} {"train_loss": -12.424592971801758, "global_step": 413084, "epoch": 2458} {"train_loss": -12.416296005249023, "global_step": 413085, "epoch": 2458} {"train_loss": -12.481829643249512, "global_step": 413086, "epoch": 2458} {"train_loss": -12.175705909729004, "global_step": 413087, "epoch": 2458} {"train_loss": -12.185277938842773, "global_step": 413088, "epoch": 2458} {"train_loss": -12.13190746307373, "global_step": 413089, "epoch": 2458} {"train_loss": -12.381758689880371, "global_step": 413090, "epoch": 2458} {"train_loss": -12.017267227172852, "global_step": 413091, "epoch": 2458} {"train_loss": -12.136981964111328, "global_step": 413092, "epoch": 2458} {"train_loss": -12.285856246948242, "global_step": 413093, "epoch": 2458} {"train_loss": -11.824312210083008, "global_step": 413094, "epoch": 2458} {"train_loss": -12.246908187866211, "global_step": 413095, "epoch": 2458} {"train_loss": -12.403575897216797, "global_step": 413096, "epoch": 2458} {"train_loss": -12.324617385864258, "global_step": 413097, "epoch": 2458} {"train_loss": -12.438004493713379, "global_step": 413098, "epoch": 2458} {"train_loss": -12.461593627929688, "global_step": 413099, "epoch": 2458} {"train_loss": -12.694209098815918, "global_step": 413100, "epoch": 2458} {"train_loss": -12.494880676269531, "global_step": 413101, "epoch": 2458} {"train_loss": -12.638012886047363, "global_step": 413102, "epoch": 2458} {"train_loss": -12.530759811401367, "global_step": 413103, "epoch": 2458} {"train_loss": -12.601531982421875, "global_step": 413104, "epoch": 2458} {"train_loss": -12.671012878417969, "global_step": 413105, "epoch": 2458} {"train_loss": -12.509197235107422, "global_step": 413106, "epoch": 2458} {"train_loss": -12.64741039276123, "global_step": 413107, "epoch": 2458} {"train_loss": -12.412521362304688, "global_step": 413108, "epoch": 2458} {"train_loss": -12.415030479431152, "global_step": 413109, "epoch": 2458} {"train_loss": -12.65279769897461, "global_step": 413110, "epoch": 2458} {"train_loss": -11.94762403056735, "global_step": 413111, "epoch": 2458, "val_loss": 300362.21875} {"train_loss": -12.625967025756836, "global_step": 413112, "epoch": 2459} {"train_loss": -12.502130508422852, "global_step": 413113, "epoch": 2459} {"train_loss": -12.477638244628906, "global_step": 413114, "epoch": 2459} {"train_loss": -12.864082336425781, "global_step": 413115, "epoch": 2459} {"train_loss": -12.642909049987793, "global_step": 413116, "epoch": 2459} {"train_loss": -12.579784393310547, "global_step": 413117, "epoch": 2459} {"train_loss": -12.657578468322754, "global_step": 413118, "epoch": 2459} {"train_loss": -12.7869234085083, "global_step": 413119, "epoch": 2459} {"train_loss": -12.663944244384766, "global_step": 413120, "epoch": 2459} {"train_loss": -12.313505172729492, "global_step": 413121, "epoch": 2459} {"train_loss": -12.576581954956055, "global_step": 413122, "epoch": 2459} {"train_loss": -12.416007995605469, "global_step": 413123, "epoch": 2459} {"train_loss": -12.625862121582031, "global_step": 413124, "epoch": 2459} {"train_loss": -12.278412818908691, "global_step": 413125, "epoch": 2459} {"train_loss": -12.588252067565918, "global_step": 413126, "epoch": 2459} {"train_loss": -12.497907638549805, "global_step": 413127, "epoch": 2459} {"train_loss": -12.548686027526855, "global_step": 413128, "epoch": 2459} {"train_loss": -12.339654922485352, "global_step": 413129, "epoch": 2459} {"train_loss": -12.610709190368652, "global_step": 413130, "epoch": 2459} {"train_loss": -12.905218124389648, "global_step": 413131, "epoch": 2459} {"train_loss": -12.44868278503418, "global_step": 413132, "epoch": 2459} {"train_loss": -12.757110595703125, "global_step": 413133, "epoch": 2459} {"train_loss": -12.677452087402344, "global_step": 413134, "epoch": 2459} {"train_loss": -12.814168930053711, "global_step": 413135, "epoch": 2459} {"train_loss": -12.51259708404541, "global_step": 413136, "epoch": 2459} {"train_loss": -12.246789932250977, "global_step": 413137, "epoch": 2459} {"train_loss": -12.372365951538086, "global_step": 413138, "epoch": 2459} {"train_loss": -12.563302993774414, "global_step": 413139, "epoch": 2459} {"train_loss": -12.183713912963867, "global_step": 413140, "epoch": 2459} {"train_loss": -12.614908218383789, "global_step": 413141, "epoch": 2459} {"train_loss": -12.296878814697266, "global_step": 413142, "epoch": 2459} {"train_loss": -12.148839950561523, "global_step": 413143, "epoch": 2459} {"train_loss": -12.196889877319336, "global_step": 413144, "epoch": 2459} {"train_loss": -12.683804512023926, "global_step": 413145, "epoch": 2459} {"train_loss": -12.031662940979004, "global_step": 413146, "epoch": 2459} {"train_loss": -12.287518501281738, "global_step": 413147, "epoch": 2459} {"train_loss": -12.884765625, "global_step": 413148, "epoch": 2459} {"train_loss": -12.59329891204834, "global_step": 413149, "epoch": 2459} {"train_loss": -12.609685897827148, "global_step": 413150, "epoch": 2459} {"train_loss": -12.727142333984375, "global_step": 413151, "epoch": 2459} {"train_loss": -12.21959400177002, "global_step": 413152, "epoch": 2459} {"train_loss": -12.336366653442383, "global_step": 413153, "epoch": 2459} {"train_loss": -12.647048950195312, "global_step": 413154, "epoch": 2459} {"train_loss": -12.473711013793945, "global_step": 413155, "epoch": 2459} {"train_loss": -12.30667495727539, "global_step": 413156, "epoch": 2459} {"train_loss": -12.29585075378418, "global_step": 413157, "epoch": 2459} {"train_loss": -12.76396369934082, "global_step": 413158, "epoch": 2459} {"train_loss": -12.535683631896973, "global_step": 413159, "epoch": 2459} {"train_loss": -11.88551139831543, "global_step": 413160, "epoch": 2459} {"train_loss": -12.125638961791992, "global_step": 413161, "epoch": 2459} {"train_loss": -12.385366439819336, "global_step": 413162, "epoch": 2459} {"train_loss": -12.068812370300293, "global_step": 413163, "epoch": 2459} {"train_loss": -12.405695915222168, "global_step": 413164, "epoch": 2459} {"train_loss": -12.196401596069336, "global_step": 413165, "epoch": 2459} {"train_loss": -12.49811840057373, "global_step": 413166, "epoch": 2459} {"train_loss": -11.779644012451172, "global_step": 413167, "epoch": 2459} {"train_loss": -12.105966567993164, "global_step": 413168, "epoch": 2459} {"train_loss": -12.119203567504883, "global_step": 413169, "epoch": 2459} {"train_loss": -11.903520584106445, "global_step": 413170, "epoch": 2459} {"train_loss": -11.584577560424805, "global_step": 413171, "epoch": 2459} {"train_loss": -11.871065139770508, "global_step": 413172, "epoch": 2459} {"train_loss": -11.944599151611328, "global_step": 413173, "epoch": 2459} {"train_loss": -11.975961685180664, "global_step": 413174, "epoch": 2459} {"train_loss": -11.224100112915039, "global_step": 413175, "epoch": 2459} {"train_loss": -10.657312393188477, "global_step": 413176, "epoch": 2459} {"train_loss": -11.768383026123047, "global_step": 413177, "epoch": 2459} {"train_loss": -10.901302337646484, "global_step": 413178, "epoch": 2459} {"train_loss": -11.814386367797852, "global_step": 413179, "epoch": 2459} {"train_loss": -10.854473114013672, "global_step": 413180, "epoch": 2459} {"train_loss": -11.568449020385742, "global_step": 413181, "epoch": 2459} {"train_loss": -10.851880073547363, "global_step": 413182, "epoch": 2459} {"train_loss": -11.768064498901367, "global_step": 413183, "epoch": 2459} {"train_loss": -9.54785442352295, "global_step": 413184, "epoch": 2459} {"train_loss": -10.998255729675293, "global_step": 413185, "epoch": 2459} {"train_loss": -10.67728042602539, "global_step": 413186, "epoch": 2459} {"train_loss": -10.640238761901855, "global_step": 413187, "epoch": 2459} {"train_loss": -11.895642280578613, "global_step": 413188, "epoch": 2459} {"train_loss": -10.098258972167969, "global_step": 413189, "epoch": 2459} {"train_loss": -10.573984146118164, "global_step": 413190, "epoch": 2459} {"train_loss": -10.781006813049316, "global_step": 413191, "epoch": 2459} {"train_loss": -11.832693099975586, "global_step": 413192, "epoch": 2459} {"train_loss": -11.160950660705566, "global_step": 413193, "epoch": 2459} {"train_loss": -10.553679466247559, "global_step": 413194, "epoch": 2459} {"train_loss": -10.634174346923828, "global_step": 413195, "epoch": 2459} {"train_loss": -11.372130393981934, "global_step": 413196, "epoch": 2459} {"train_loss": -10.451828956604004, "global_step": 413197, "epoch": 2459} {"train_loss": -10.555208206176758, "global_step": 413198, "epoch": 2459} {"train_loss": -10.324137687683105, "global_step": 413199, "epoch": 2459} {"train_loss": -11.279455184936523, "global_step": 413200, "epoch": 2459} {"train_loss": -10.130928039550781, "global_step": 413201, "epoch": 2459} {"train_loss": -10.73469352722168, "global_step": 413202, "epoch": 2459} {"train_loss": -10.796643257141113, "global_step": 413203, "epoch": 2459} {"train_loss": -11.337526321411133, "global_step": 413204, "epoch": 2459} {"train_loss": -11.514213562011719, "global_step": 413205, "epoch": 2459} {"train_loss": -12.019203186035156, "global_step": 413206, "epoch": 2459} {"train_loss": -11.477084159851074, "global_step": 413207, "epoch": 2459} {"train_loss": -11.375340461730957, "global_step": 413208, "epoch": 2459} {"train_loss": -10.539142608642578, "global_step": 413209, "epoch": 2459} {"train_loss": -11.319206237792969, "global_step": 413210, "epoch": 2459} {"train_loss": -11.384101867675781, "global_step": 413211, "epoch": 2459} {"train_loss": -11.80646800994873, "global_step": 413212, "epoch": 2459} {"train_loss": -10.926634788513184, "global_step": 413213, "epoch": 2459} {"train_loss": -11.296510696411133, "global_step": 413214, "epoch": 2459} {"train_loss": -10.691390991210938, "global_step": 413215, "epoch": 2459} {"train_loss": -10.937244415283203, "global_step": 413216, "epoch": 2459} {"train_loss": -11.83408260345459, "global_step": 413217, "epoch": 2459} {"train_loss": -11.125553131103516, "global_step": 413218, "epoch": 2459} {"train_loss": -11.606581687927246, "global_step": 413219, "epoch": 2459} {"train_loss": -11.714372634887695, "global_step": 413220, "epoch": 2459} {"train_loss": -11.444408416748047, "global_step": 413221, "epoch": 2459} {"train_loss": -11.968589782714844, "global_step": 413222, "epoch": 2459} {"train_loss": -12.250507354736328, "global_step": 413223, "epoch": 2459} {"train_loss": -11.181933403015137, "global_step": 413224, "epoch": 2459} {"train_loss": -11.69793701171875, "global_step": 413225, "epoch": 2459} {"train_loss": -12.176237106323242, "global_step": 413226, "epoch": 2459} {"train_loss": -11.747978210449219, "global_step": 413227, "epoch": 2459} {"train_loss": -12.134281158447266, "global_step": 413228, "epoch": 2459} {"train_loss": -12.226064682006836, "global_step": 413229, "epoch": 2459} {"train_loss": -11.83769416809082, "global_step": 413230, "epoch": 2459} {"train_loss": -12.316205978393555, "global_step": 413231, "epoch": 2459} {"train_loss": -12.115489959716797, "global_step": 413232, "epoch": 2459} {"train_loss": -12.275503158569336, "global_step": 413233, "epoch": 2459} {"train_loss": -12.375181198120117, "global_step": 413234, "epoch": 2459} {"train_loss": -12.257952690124512, "global_step": 413235, "epoch": 2459} {"train_loss": -12.105271339416504, "global_step": 413236, "epoch": 2459} {"train_loss": -12.527704238891602, "global_step": 413237, "epoch": 2459} {"train_loss": -12.371782302856445, "global_step": 413238, "epoch": 2459} {"train_loss": -12.204404830932617, "global_step": 413239, "epoch": 2459} {"train_loss": -12.230854034423828, "global_step": 413240, "epoch": 2459} {"train_loss": -12.424468994140625, "global_step": 413241, "epoch": 2459} {"train_loss": -12.539628982543945, "global_step": 413242, "epoch": 2459} {"train_loss": -12.188892364501953, "global_step": 413243, "epoch": 2459} {"train_loss": -12.332969665527344, "global_step": 413244, "epoch": 2459} {"train_loss": -12.428777694702148, "global_step": 413245, "epoch": 2459} {"train_loss": -12.376687049865723, "global_step": 413246, "epoch": 2459} {"train_loss": -12.463573455810547, "global_step": 413247, "epoch": 2459} {"train_loss": -12.452771186828613, "global_step": 413248, "epoch": 2459} {"train_loss": -12.37329387664795, "global_step": 413249, "epoch": 2459} {"train_loss": -12.514974594116211, "global_step": 413250, "epoch": 2459} {"train_loss": -12.705514907836914, "global_step": 413251, "epoch": 2459} {"train_loss": -12.42109489440918, "global_step": 413252, "epoch": 2459} {"train_loss": -12.597259521484375, "global_step": 413253, "epoch": 2459} {"train_loss": -12.390154838562012, "global_step": 413254, "epoch": 2459} {"train_loss": -12.334291458129883, "global_step": 413255, "epoch": 2459} {"train_loss": -12.623239517211914, "global_step": 413256, "epoch": 2459} {"train_loss": -12.582860946655273, "global_step": 413257, "epoch": 2459} {"train_loss": -12.482463836669922, "global_step": 413258, "epoch": 2459} {"train_loss": -12.582110404968262, "global_step": 413259, "epoch": 2459} {"train_loss": -12.708040237426758, "global_step": 413260, "epoch": 2459} {"train_loss": -12.634565353393555, "global_step": 413261, "epoch": 2459} {"train_loss": -12.559904098510742, "global_step": 413262, "epoch": 2459} {"train_loss": -12.719769477844238, "global_step": 413263, "epoch": 2459} {"train_loss": -12.645944595336914, "global_step": 413264, "epoch": 2459} {"train_loss": -12.79401683807373, "global_step": 413265, "epoch": 2459} {"train_loss": -12.732275009155273, "global_step": 413266, "epoch": 2459} {"train_loss": -12.745441436767578, "global_step": 413267, "epoch": 2459} {"train_loss": -12.756490707397461, "global_step": 413268, "epoch": 2459} {"train_loss": -12.524542808532715, "global_step": 413269, "epoch": 2459} {"train_loss": -12.599756240844727, "global_step": 413270, "epoch": 2459} {"train_loss": -12.791112899780273, "global_step": 413271, "epoch": 2459} {"train_loss": -12.514557838439941, "global_step": 413272, "epoch": 2459} {"train_loss": -12.797704696655273, "global_step": 413273, "epoch": 2459} {"train_loss": -12.733097076416016, "global_step": 413274, "epoch": 2459} {"train_loss": -12.694387435913086, "global_step": 413275, "epoch": 2459} {"train_loss": -12.712839126586914, "global_step": 413276, "epoch": 2459} {"train_loss": -12.71587085723877, "global_step": 413277, "epoch": 2459} {"train_loss": -12.627309799194336, "global_step": 413278, "epoch": 2459} {"train_loss": -12.041187683741251, "global_step": 413279, "epoch": 2459, "val_loss": 303245.75} {"train_loss": -12.704902648925781, "global_step": 413280, "epoch": 2460} {"train_loss": -12.642723083496094, "global_step": 413281, "epoch": 2460} {"train_loss": -12.910526275634766, "global_step": 413282, "epoch": 2460} {"train_loss": -12.881028175354004, "global_step": 413283, "epoch": 2460} {"train_loss": -12.896549224853516, "global_step": 413284, "epoch": 2460} {"train_loss": -12.857179641723633, "global_step": 413285, "epoch": 2460} {"train_loss": -12.853052139282227, "global_step": 413286, "epoch": 2460} {"train_loss": -12.858335494995117, "global_step": 413287, "epoch": 2460} {"train_loss": -12.957784652709961, "global_step": 413288, "epoch": 2460} {"train_loss": -12.695516586303711, "global_step": 413289, "epoch": 2460} {"train_loss": -12.48011302947998, "global_step": 413290, "epoch": 2460} {"train_loss": -13.081085205078125, "global_step": 413291, "epoch": 2460} {"train_loss": -12.876395225524902, "global_step": 413292, "epoch": 2460} {"train_loss": -12.84620475769043, "global_step": 413293, "epoch": 2460} {"train_loss": -12.905378341674805, "global_step": 413294, "epoch": 2460} {"train_loss": -12.780467987060547, "global_step": 413295, "epoch": 2460} {"train_loss": -12.858169555664062, "global_step": 413296, "epoch": 2460} {"train_loss": -12.84430980682373, "global_step": 413297, "epoch": 2460} {"train_loss": -12.544329643249512, "global_step": 413298, "epoch": 2460} {"train_loss": -12.465601921081543, "global_step": 413299, "epoch": 2460} {"train_loss": -12.636228561401367, "global_step": 413300, "epoch": 2460} {"train_loss": -12.905983924865723, "global_step": 413301, "epoch": 2460} {"train_loss": -12.586671829223633, "global_step": 413302, "epoch": 2460} {"train_loss": -12.111355781555176, "global_step": 413303, "epoch": 2460} {"train_loss": -12.03211498260498, "global_step": 413304, "epoch": 2460} {"train_loss": -12.557443618774414, "global_step": 413305, "epoch": 2460} {"train_loss": -12.513004302978516, "global_step": 413306, "epoch": 2460} {"train_loss": -12.545578002929688, "global_step": 413307, "epoch": 2460} {"train_loss": -11.375338554382324, "global_step": 413308, "epoch": 2460} {"train_loss": -12.042125701904297, "global_step": 413309, "epoch": 2460} {"train_loss": -12.113748550415039, "global_step": 413310, "epoch": 2460} {"train_loss": -12.95764446258545, "global_step": 413311, "epoch": 2460} {"train_loss": -11.92638874053955, "global_step": 413312, "epoch": 2460} {"train_loss": -12.541701316833496, "global_step": 413313, "epoch": 2460} {"train_loss": -11.497203826904297, "global_step": 413314, "epoch": 2460} {"train_loss": -12.28480052947998, "global_step": 413315, "epoch": 2460} {"train_loss": -12.133281707763672, "global_step": 413316, "epoch": 2460} {"train_loss": -12.585783004760742, "global_step": 413317, "epoch": 2460} {"train_loss": -12.291997909545898, "global_step": 413318, "epoch": 2460} {"train_loss": -11.509872436523438, "global_step": 413319, "epoch": 2460} {"train_loss": -9.770883560180664, "global_step": 413320, "epoch": 2460} {"train_loss": -11.685181617736816, "global_step": 413321, "epoch": 2460} {"train_loss": -10.177902221679688, "global_step": 413322, "epoch": 2460} {"train_loss": -11.725824356079102, "global_step": 413323, "epoch": 2460} {"train_loss": -9.091680526733398, "global_step": 413324, "epoch": 2460} {"train_loss": -9.425379753112793, "global_step": 413325, "epoch": 2460} {"train_loss": -10.374444007873535, "global_step": 413326, "epoch": 2460} {"train_loss": -11.090631484985352, "global_step": 413327, "epoch": 2460} {"train_loss": -10.656255722045898, "global_step": 413328, "epoch": 2460} {"train_loss": -10.834919929504395, "global_step": 413329, "epoch": 2460} {"train_loss": -12.22610855102539, "global_step": 413330, "epoch": 2460} {"train_loss": -11.049909591674805, "global_step": 413331, "epoch": 2460} {"train_loss": -11.445211410522461, "global_step": 413332, "epoch": 2460} {"train_loss": -11.482192993164062, "global_step": 413333, "epoch": 2460} {"train_loss": -10.540399551391602, "global_step": 413334, "epoch": 2460} {"train_loss": -11.211292266845703, "global_step": 413335, "epoch": 2460} {"train_loss": -11.259090423583984, "global_step": 413336, "epoch": 2460} {"train_loss": -10.5277099609375, "global_step": 413337, "epoch": 2460} {"train_loss": -11.582568168640137, "global_step": 413338, "epoch": 2460} {"train_loss": -10.971704483032227, "global_step": 413339, "epoch": 2460} {"train_loss": -11.575550079345703, "global_step": 413340, "epoch": 2460} {"train_loss": -11.268142700195312, "global_step": 413341, "epoch": 2460} {"train_loss": -11.040283203125, "global_step": 413342, "epoch": 2460} {"train_loss": -11.621908187866211, "global_step": 413343, "epoch": 2460} {"train_loss": -10.907529830932617, "global_step": 413344, "epoch": 2460} {"train_loss": -11.263673782348633, "global_step": 413345, "epoch": 2460} {"train_loss": -11.81570053100586, "global_step": 413346, "epoch": 2460} {"train_loss": -11.450394630432129, "global_step": 413347, "epoch": 2460} {"train_loss": -11.698046684265137, "global_step": 413348, "epoch": 2460} {"train_loss": -11.331086158752441, "global_step": 413349, "epoch": 2460} {"train_loss": -11.222677230834961, "global_step": 413350, "epoch": 2460} {"train_loss": -10.671335220336914, "global_step": 413351, "epoch": 2460} {"train_loss": -11.663738250732422, "global_step": 413352, "epoch": 2460} {"train_loss": -11.799040794372559, "global_step": 413353, "epoch": 2460} {"train_loss": -11.211271286010742, "global_step": 413354, "epoch": 2460} {"train_loss": -11.087410926818848, "global_step": 413355, "epoch": 2460} {"train_loss": -11.712787628173828, "global_step": 413356, "epoch": 2460} {"train_loss": -10.971454620361328, "global_step": 413357, "epoch": 2460} {"train_loss": -11.211115837097168, "global_step": 413358, "epoch": 2460} {"train_loss": -11.122093200683594, "global_step": 413359, "epoch": 2460} {"train_loss": -11.711440086364746, "global_step": 413360, "epoch": 2460} {"train_loss": -11.644946098327637, "global_step": 413361, "epoch": 2460} {"train_loss": -11.196556091308594, "global_step": 413362, "epoch": 2460} {"train_loss": -12.121137619018555, "global_step": 413363, "epoch": 2460} {"train_loss": -11.103609085083008, "global_step": 413364, "epoch": 2460} {"train_loss": -11.48725700378418, "global_step": 413365, "epoch": 2460} {"train_loss": -10.446157455444336, "global_step": 413366, "epoch": 2460} {"train_loss": -11.599045753479004, "global_step": 413367, "epoch": 2460} {"train_loss": -10.917746543884277, "global_step": 413368, "epoch": 2460} {"train_loss": -12.062870025634766, "global_step": 413369, "epoch": 2460} {"train_loss": -11.447854042053223, "global_step": 413370, "epoch": 2460} {"train_loss": -10.652996063232422, "global_step": 413371, "epoch": 2460} {"train_loss": -12.085550308227539, "global_step": 413372, "epoch": 2460} {"train_loss": -11.378347396850586, "global_step": 413373, "epoch": 2460} {"train_loss": -11.762678146362305, "global_step": 413374, "epoch": 2460} {"train_loss": -11.959312438964844, "global_step": 413375, "epoch": 2460} {"train_loss": -11.902023315429688, "global_step": 413376, "epoch": 2460} {"train_loss": -11.853044509887695, "global_step": 413377, "epoch": 2460} {"train_loss": -12.012758255004883, "global_step": 413378, "epoch": 2460} {"train_loss": -11.912891387939453, "global_step": 413379, "epoch": 2460} {"train_loss": -12.337549209594727, "global_step": 413380, "epoch": 2460} {"train_loss": -11.699403762817383, "global_step": 413381, "epoch": 2460} {"train_loss": -11.863253593444824, "global_step": 413382, "epoch": 2460} {"train_loss": -12.26677417755127, "global_step": 413383, "epoch": 2460} {"train_loss": -11.82391357421875, "global_step": 413384, "epoch": 2460} {"train_loss": -12.200286865234375, "global_step": 413385, "epoch": 2460} {"train_loss": -12.046062469482422, "global_step": 413386, "epoch": 2460} {"train_loss": -12.240676879882812, "global_step": 413387, "epoch": 2460} {"train_loss": -12.211381912231445, "global_step": 413388, "epoch": 2460} {"train_loss": -12.172708511352539, "global_step": 413389, "epoch": 2460} {"train_loss": -12.177299499511719, "global_step": 413390, "epoch": 2460} {"train_loss": -12.16439437866211, "global_step": 413391, "epoch": 2460} {"train_loss": -12.075003623962402, "global_step": 413392, "epoch": 2460} {"train_loss": -12.292947769165039, "global_step": 413393, "epoch": 2460} {"train_loss": -12.271158218383789, "global_step": 413394, "epoch": 2460} {"train_loss": -12.1390380859375, "global_step": 413395, "epoch": 2460} {"train_loss": -12.369668006896973, "global_step": 413396, "epoch": 2460} {"train_loss": -12.27195930480957, "global_step": 413397, "epoch": 2460} {"train_loss": -12.196868896484375, "global_step": 413398, "epoch": 2460} {"train_loss": -12.283405303955078, "global_step": 413399, "epoch": 2460} {"train_loss": -11.9514741897583, "global_step": 413400, "epoch": 2460} {"train_loss": -12.12822151184082, "global_step": 413401, "epoch": 2460} {"train_loss": -12.492143630981445, "global_step": 413402, "epoch": 2460} {"train_loss": -12.326753616333008, "global_step": 413403, "epoch": 2460} {"train_loss": -12.312848091125488, "global_step": 413404, "epoch": 2460} {"train_loss": -12.138875961303711, "global_step": 413405, "epoch": 2460} {"train_loss": -12.361989974975586, "global_step": 413406, "epoch": 2460} {"train_loss": -12.441858291625977, "global_step": 413407, "epoch": 2460} {"train_loss": -12.068205833435059, "global_step": 413408, "epoch": 2460} {"train_loss": -12.362531661987305, "global_step": 413409, "epoch": 2460} {"train_loss": -12.36180305480957, "global_step": 413410, "epoch": 2460} {"train_loss": -12.218683242797852, "global_step": 413411, "epoch": 2460} {"train_loss": -12.037847518920898, "global_step": 413412, "epoch": 2460} {"train_loss": -12.582221984863281, "global_step": 413413, "epoch": 2460} {"train_loss": -12.432461738586426, "global_step": 413414, "epoch": 2460} {"train_loss": -12.3098726272583, "global_step": 413415, "epoch": 2460} {"train_loss": -12.454448699951172, "global_step": 413416, "epoch": 2460} {"train_loss": -12.651762962341309, "global_step": 413417, "epoch": 2460} {"train_loss": -12.380420684814453, "global_step": 413418, "epoch": 2460} {"train_loss": -12.505407333374023, "global_step": 413419, "epoch": 2460} {"train_loss": -12.390863418579102, "global_step": 413420, "epoch": 2460} {"train_loss": -12.28643798828125, "global_step": 413421, "epoch": 2460} {"train_loss": -12.530109405517578, "global_step": 413422, "epoch": 2460} {"train_loss": -12.412915229797363, "global_step": 413423, "epoch": 2460} {"train_loss": -12.498148918151855, "global_step": 413424, "epoch": 2460} {"train_loss": -12.365621566772461, "global_step": 413425, "epoch": 2460} {"train_loss": -12.422595977783203, "global_step": 413426, "epoch": 2460} {"train_loss": -12.710973739624023, "global_step": 413427, "epoch": 2460} {"train_loss": -12.652423858642578, "global_step": 413428, "epoch": 2460} {"train_loss": -12.558012008666992, "global_step": 413429, "epoch": 2460} {"train_loss": -12.446756362915039, "global_step": 413430, "epoch": 2460} {"train_loss": -12.648151397705078, "global_step": 413431, "epoch": 2460} {"train_loss": -12.567899703979492, "global_step": 413432, "epoch": 2460} {"train_loss": -12.723247528076172, "global_step": 413433, "epoch": 2460} {"train_loss": -12.41417121887207, "global_step": 413434, "epoch": 2460} {"train_loss": -12.617910385131836, "global_step": 413435, "epoch": 2460} {"train_loss": -12.596959114074707, "global_step": 413436, "epoch": 2460} {"train_loss": -12.685155868530273, "global_step": 413437, "epoch": 2460} {"train_loss": -12.656150817871094, "global_step": 413438, "epoch": 2460} {"train_loss": -12.842657089233398, "global_step": 413439, "epoch": 2460} {"train_loss": -12.191495895385742, "global_step": 413440, "epoch": 2460} {"train_loss": -11.964290618896484, "global_step": 413441, "epoch": 2460} {"train_loss": -12.09156322479248, "global_step": 413442, "epoch": 2460} {"train_loss": -11.939785957336426, "global_step": 413443, "epoch": 2460} {"train_loss": -12.22438907623291, "global_step": 413444, "epoch": 2460} {"train_loss": -12.231996536254883, "global_step": 413445, "epoch": 2460} {"train_loss": -12.317460060119629, "global_step": 413446, "epoch": 2460} {"train_loss": -11.98877177351997, "global_step": 413447, "epoch": 2460, "val_loss": 303442.65625, "train_action_mse_error": 0.23966562747955322} {"train_loss": -11.80744457244873, "global_step": 413448, "epoch": 2461} {"train_loss": -12.279216766357422, "global_step": 413449, "epoch": 2461} {"train_loss": -11.95085620880127, "global_step": 413450, "epoch": 2461} {"train_loss": -12.470142364501953, "global_step": 413451, "epoch": 2461} {"train_loss": -11.687294960021973, "global_step": 413452, "epoch": 2461} {"train_loss": -12.26172161102295, "global_step": 413453, "epoch": 2461} {"train_loss": -12.029770851135254, "global_step": 413454, "epoch": 2461} {"train_loss": -12.079771995544434, "global_step": 413455, "epoch": 2461} {"train_loss": -12.352156639099121, "global_step": 413456, "epoch": 2461} {"train_loss": -12.050604820251465, "global_step": 413457, "epoch": 2461} {"train_loss": -12.107845306396484, "global_step": 413458, "epoch": 2461} {"train_loss": -11.173013687133789, "global_step": 413459, "epoch": 2461} {"train_loss": -12.329893112182617, "global_step": 413460, "epoch": 2461} {"train_loss": -11.358236312866211, "global_step": 413461, "epoch": 2461} {"train_loss": -11.416154861450195, "global_step": 413462, "epoch": 2461} {"train_loss": -12.230356216430664, "global_step": 413463, "epoch": 2461} {"train_loss": -10.347670555114746, "global_step": 413464, "epoch": 2461} {"train_loss": -11.253433227539062, "global_step": 413465, "epoch": 2461} {"train_loss": -10.89889144897461, "global_step": 413466, "epoch": 2461} {"train_loss": -9.80571174621582, "global_step": 413467, "epoch": 2461} {"train_loss": -9.501016616821289, "global_step": 413468, "epoch": 2461} {"train_loss": -10.1565523147583, "global_step": 413469, "epoch": 2461} {"train_loss": -11.124606132507324, "global_step": 413470, "epoch": 2461} {"train_loss": -10.53927993774414, "global_step": 413471, "epoch": 2461} {"train_loss": -11.296542167663574, "global_step": 413472, "epoch": 2461} {"train_loss": -11.323013305664062, "global_step": 413473, "epoch": 2461} {"train_loss": -10.434083938598633, "global_step": 413474, "epoch": 2461} {"train_loss": -11.080345153808594, "global_step": 413475, "epoch": 2461} {"train_loss": -11.09492301940918, "global_step": 413476, "epoch": 2461} {"train_loss": -11.476436614990234, "global_step": 413477, "epoch": 2461} {"train_loss": -11.702634811401367, "global_step": 413478, "epoch": 2461} {"train_loss": -11.098315238952637, "global_step": 413479, "epoch": 2461} {"train_loss": -10.6713228225708, "global_step": 413480, "epoch": 2461} {"train_loss": -10.968536376953125, "global_step": 413481, "epoch": 2461} {"train_loss": -9.562028884887695, "global_step": 413482, "epoch": 2461} {"train_loss": -10.652770042419434, "global_step": 413483, "epoch": 2461} {"train_loss": -11.061188697814941, "global_step": 413484, "epoch": 2461} {"train_loss": -9.187395095825195, "global_step": 413485, "epoch": 2461} {"train_loss": -10.785673141479492, "global_step": 413486, "epoch": 2461} {"train_loss": -10.653181076049805, "global_step": 413487, "epoch": 2461} {"train_loss": -11.665475845336914, "global_step": 413488, "epoch": 2461} {"train_loss": -10.320988655090332, "global_step": 413489, "epoch": 2461} {"train_loss": -11.366483688354492, "global_step": 413490, "epoch": 2461} {"train_loss": -11.402791976928711, "global_step": 413491, "epoch": 2461} {"train_loss": -11.348265647888184, "global_step": 413492, "epoch": 2461} {"train_loss": -11.496940612792969, "global_step": 413493, "epoch": 2461} {"train_loss": -11.029666900634766, "global_step": 413494, "epoch": 2461} {"train_loss": -11.178817749023438, "global_step": 413495, "epoch": 2461} {"train_loss": -11.671930313110352, "global_step": 413496, "epoch": 2461} {"train_loss": -11.28462028503418, "global_step": 413497, "epoch": 2461} {"train_loss": -11.56572151184082, "global_step": 413498, "epoch": 2461} {"train_loss": -11.588471412658691, "global_step": 413499, "epoch": 2461} {"train_loss": -11.204240798950195, "global_step": 413500, "epoch": 2461} {"train_loss": -11.759844779968262, "global_step": 413501, "epoch": 2461} {"train_loss": -11.370613098144531, "global_step": 413502, "epoch": 2461} {"train_loss": -12.29798698425293, "global_step": 413503, "epoch": 2461} {"train_loss": -11.938279151916504, "global_step": 413504, "epoch": 2461} {"train_loss": -11.467409133911133, "global_step": 413505, "epoch": 2461} {"train_loss": -11.795194625854492, "global_step": 413506, "epoch": 2461} {"train_loss": -11.98262882232666, "global_step": 413507, "epoch": 2461} {"train_loss": -11.843503952026367, "global_step": 413508, "epoch": 2461} {"train_loss": -12.1084566116333, "global_step": 413509, "epoch": 2461} {"train_loss": -11.960234642028809, "global_step": 413510, "epoch": 2461} {"train_loss": -12.016880989074707, "global_step": 413511, "epoch": 2461} {"train_loss": -12.342897415161133, "global_step": 413512, "epoch": 2461} {"train_loss": -12.148942947387695, "global_step": 413513, "epoch": 2461} {"train_loss": -12.362634658813477, "global_step": 413514, "epoch": 2461} {"train_loss": -12.17114543914795, "global_step": 413515, "epoch": 2461} {"train_loss": -12.185346603393555, "global_step": 413516, "epoch": 2461} {"train_loss": -12.15968132019043, "global_step": 413517, "epoch": 2461} {"train_loss": -12.317693710327148, "global_step": 413518, "epoch": 2461} {"train_loss": -12.170462608337402, "global_step": 413519, "epoch": 2461} {"train_loss": -12.284008026123047, "global_step": 413520, "epoch": 2461} {"train_loss": -12.410089492797852, "global_step": 413521, "epoch": 2461} {"train_loss": -12.188663482666016, "global_step": 413522, "epoch": 2461} {"train_loss": -12.3336181640625, "global_step": 413523, "epoch": 2461} {"train_loss": -12.165868759155273, "global_step": 413524, "epoch": 2461} {"train_loss": -12.495540618896484, "global_step": 413525, "epoch": 2461} {"train_loss": -12.023982048034668, "global_step": 413526, "epoch": 2461} {"train_loss": -12.446747779846191, "global_step": 413527, "epoch": 2461} {"train_loss": -12.08377456665039, "global_step": 413528, "epoch": 2461} {"train_loss": -12.447479248046875, "global_step": 413529, "epoch": 2461} {"train_loss": -12.478950500488281, "global_step": 413530, "epoch": 2461} {"train_loss": -12.480474472045898, "global_step": 413531, "epoch": 2461} {"train_loss": -12.516402244567871, "global_step": 413532, "epoch": 2461} {"train_loss": -12.422253608703613, "global_step": 413533, "epoch": 2461} {"train_loss": -12.401769638061523, "global_step": 413534, "epoch": 2461} {"train_loss": -12.620271682739258, "global_step": 413535, "epoch": 2461} {"train_loss": -12.516865730285645, "global_step": 413536, "epoch": 2461} {"train_loss": -12.603609085083008, "global_step": 413537, "epoch": 2461} {"train_loss": -12.504317283630371, "global_step": 413538, "epoch": 2461} {"train_loss": -12.576086044311523, "global_step": 413539, "epoch": 2461} {"train_loss": -12.452865600585938, "global_step": 413540, "epoch": 2461} {"train_loss": -12.617801666259766, "global_step": 413541, "epoch": 2461} {"train_loss": -12.663887977600098, "global_step": 413542, "epoch": 2461} {"train_loss": -12.606976509094238, "global_step": 413543, "epoch": 2461} {"train_loss": -12.511198043823242, "global_step": 413544, "epoch": 2461} {"train_loss": -12.599807739257812, "global_step": 413545, "epoch": 2461} {"train_loss": -12.600410461425781, "global_step": 413546, "epoch": 2461} {"train_loss": -12.734210968017578, "global_step": 413547, "epoch": 2461} {"train_loss": -12.51934814453125, "global_step": 413548, "epoch": 2461} {"train_loss": -12.784503936767578, "global_step": 413549, "epoch": 2461} {"train_loss": -12.789190292358398, "global_step": 413550, "epoch": 2461} {"train_loss": -12.615461349487305, "global_step": 413551, "epoch": 2461} {"train_loss": -12.764352798461914, "global_step": 413552, "epoch": 2461} {"train_loss": -12.5872220993042, "global_step": 413553, "epoch": 2461} {"train_loss": -12.705892562866211, "global_step": 413554, "epoch": 2461} {"train_loss": -12.72622013092041, "global_step": 413555, "epoch": 2461} {"train_loss": -12.535189628601074, "global_step": 413556, "epoch": 2461} {"train_loss": -12.658824920654297, "global_step": 413557, "epoch": 2461} {"train_loss": -12.301582336425781, "global_step": 413558, "epoch": 2461} {"train_loss": -12.585041046142578, "global_step": 413559, "epoch": 2461} {"train_loss": -12.682456970214844, "global_step": 413560, "epoch": 2461} {"train_loss": -12.639045715332031, "global_step": 413561, "epoch": 2461} {"train_loss": -12.692319869995117, "global_step": 413562, "epoch": 2461} {"train_loss": -12.63314437866211, "global_step": 413563, "epoch": 2461} {"train_loss": -12.688338279724121, "global_step": 413564, "epoch": 2461} {"train_loss": -12.638238906860352, "global_step": 413565, "epoch": 2461} {"train_loss": -12.773530006408691, "global_step": 413566, "epoch": 2461} {"train_loss": -12.604422569274902, "global_step": 413567, "epoch": 2461} {"train_loss": -12.806573867797852, "global_step": 413568, "epoch": 2461} {"train_loss": -12.675065994262695, "global_step": 413569, "epoch": 2461} {"train_loss": -12.446999549865723, "global_step": 413570, "epoch": 2461} {"train_loss": -12.526174545288086, "global_step": 413571, "epoch": 2461} {"train_loss": -12.91668701171875, "global_step": 413572, "epoch": 2461} {"train_loss": -12.969165802001953, "global_step": 413573, "epoch": 2461} {"train_loss": -12.359858512878418, "global_step": 413574, "epoch": 2461} {"train_loss": -12.69221305847168, "global_step": 413575, "epoch": 2461} {"train_loss": -12.486496925354004, "global_step": 413576, "epoch": 2461} {"train_loss": -12.542953491210938, "global_step": 413577, "epoch": 2461} {"train_loss": -12.488473892211914, "global_step": 413578, "epoch": 2461} {"train_loss": -12.41572380065918, "global_step": 413579, "epoch": 2461} {"train_loss": -11.90549087524414, "global_step": 413580, "epoch": 2461} {"train_loss": -12.117609024047852, "global_step": 413581, "epoch": 2461} {"train_loss": -12.57025146484375, "global_step": 413582, "epoch": 2461} {"train_loss": -11.683454513549805, "global_step": 413583, "epoch": 2461} {"train_loss": -10.018171310424805, "global_step": 413584, "epoch": 2461} {"train_loss": -8.972055435180664, "global_step": 413585, "epoch": 2461} {"train_loss": -8.540794372558594, "global_step": 413586, "epoch": 2461} {"train_loss": -8.795632362365723, "global_step": 413587, "epoch": 2461} {"train_loss": -9.349675178527832, "global_step": 413588, "epoch": 2461} {"train_loss": -9.82688045501709, "global_step": 413589, "epoch": 2461} {"train_loss": -8.668876647949219, "global_step": 413590, "epoch": 2461} {"train_loss": -9.642110824584961, "global_step": 413591, "epoch": 2461} {"train_loss": -8.853127479553223, "global_step": 413592, "epoch": 2461} {"train_loss": -9.731756210327148, "global_step": 413593, "epoch": 2461} {"train_loss": -7.539563179016113, "global_step": 413594, "epoch": 2461} {"train_loss": -10.749323844909668, "global_step": 413595, "epoch": 2461} {"train_loss": -8.441229820251465, "global_step": 413596, "epoch": 2461} {"train_loss": -10.61528491973877, "global_step": 413597, "epoch": 2461} {"train_loss": -9.094353675842285, "global_step": 413598, "epoch": 2461} {"train_loss": -10.362412452697754, "global_step": 413599, "epoch": 2461} {"train_loss": -8.982240676879883, "global_step": 413600, "epoch": 2461} {"train_loss": -9.813414573669434, "global_step": 413601, "epoch": 2461} {"train_loss": -9.97183609008789, "global_step": 413602, "epoch": 2461} {"train_loss": -10.0502347946167, "global_step": 413603, "epoch": 2461} {"train_loss": -9.800362586975098, "global_step": 413604, "epoch": 2461} {"train_loss": -10.325155258178711, "global_step": 413605, "epoch": 2461} {"train_loss": -10.987756729125977, "global_step": 413606, "epoch": 2461} {"train_loss": -10.447576522827148, "global_step": 413607, "epoch": 2461} {"train_loss": -10.841497421264648, "global_step": 413608, "epoch": 2461} {"train_loss": -10.418453216552734, "global_step": 413609, "epoch": 2461} {"train_loss": -11.4661283493042, "global_step": 413610, "epoch": 2461} {"train_loss": -10.9951171875, "global_step": 413611, "epoch": 2461} {"train_loss": -11.171546936035156, "global_step": 413612, "epoch": 2461} {"train_loss": -11.763096809387207, "global_step": 413613, "epoch": 2461} {"train_loss": -11.661112785339355, "global_step": 413614, "epoch": 2461} {"train_loss": -11.57254992212568, "global_step": 413615, "epoch": 2461, "val_loss": 301411.09375} {"train_loss": -10.391517639160156, "global_step": 413616, "epoch": 2462} {"train_loss": -11.561718940734863, "global_step": 413617, "epoch": 2462} {"train_loss": -10.277694702148438, "global_step": 413618, "epoch": 2462} {"train_loss": -10.804224014282227, "global_step": 413619, "epoch": 2462} {"train_loss": -11.306714057922363, "global_step": 413620, "epoch": 2462} {"train_loss": -10.864363670349121, "global_step": 413621, "epoch": 2462} {"train_loss": -11.317184448242188, "global_step": 413622, "epoch": 2462} {"train_loss": -11.606965065002441, "global_step": 413623, "epoch": 2462} {"train_loss": -10.942070960998535, "global_step": 413624, "epoch": 2462} {"train_loss": -11.722919464111328, "global_step": 413625, "epoch": 2462} {"train_loss": -11.261401176452637, "global_step": 413626, "epoch": 2462} {"train_loss": -11.430421829223633, "global_step": 413627, "epoch": 2462} {"train_loss": -11.924779891967773, "global_step": 413628, "epoch": 2462} {"train_loss": -11.5911865234375, "global_step": 413629, "epoch": 2462} {"train_loss": -12.017837524414062, "global_step": 413630, "epoch": 2462} {"train_loss": -11.564117431640625, "global_step": 413631, "epoch": 2462} {"train_loss": -11.566277503967285, "global_step": 413632, "epoch": 2462} {"train_loss": -11.927772521972656, "global_step": 413633, "epoch": 2462} {"train_loss": -11.627117156982422, "global_step": 413634, "epoch": 2462} {"train_loss": -12.333789825439453, "global_step": 413635, "epoch": 2462} {"train_loss": -12.231700897216797, "global_step": 413636, "epoch": 2462} {"train_loss": -12.061979293823242, "global_step": 413637, "epoch": 2462} {"train_loss": -12.015477180480957, "global_step": 413638, "epoch": 2462} {"train_loss": -12.277481079101562, "global_step": 413639, "epoch": 2462} {"train_loss": -11.46334457397461, "global_step": 413640, "epoch": 2462} {"train_loss": -12.191791534423828, "global_step": 413641, "epoch": 2462} {"train_loss": -11.686592102050781, "global_step": 413642, "epoch": 2462} {"train_loss": -12.080087661743164, "global_step": 413643, "epoch": 2462} {"train_loss": -11.88827896118164, "global_step": 413644, "epoch": 2462} {"train_loss": -11.983717918395996, "global_step": 413645, "epoch": 2462} {"train_loss": -11.966768264770508, "global_step": 413646, "epoch": 2462} {"train_loss": -12.230682373046875, "global_step": 413647, "epoch": 2462} {"train_loss": -11.946431159973145, "global_step": 413648, "epoch": 2462} {"train_loss": -12.038098335266113, "global_step": 413649, "epoch": 2462} {"train_loss": -11.868477821350098, "global_step": 413650, "epoch": 2462} {"train_loss": -11.915453910827637, "global_step": 413651, "epoch": 2462} {"train_loss": -11.760497093200684, "global_step": 413652, "epoch": 2462} {"train_loss": -12.288082122802734, "global_step": 413653, "epoch": 2462} {"train_loss": -12.112707138061523, "global_step": 413654, "epoch": 2462} {"train_loss": -12.205862045288086, "global_step": 413655, "epoch": 2462} {"train_loss": -12.191978454589844, "global_step": 413656, "epoch": 2462} {"train_loss": -12.29802131652832, "global_step": 413657, "epoch": 2462} {"train_loss": -11.969433784484863, "global_step": 413658, "epoch": 2462} {"train_loss": -12.259868621826172, "global_step": 413659, "epoch": 2462} {"train_loss": -11.98981761932373, "global_step": 413660, "epoch": 2462} {"train_loss": -11.69110107421875, "global_step": 413661, "epoch": 2462} {"train_loss": -12.06494140625, "global_step": 413662, "epoch": 2462} {"train_loss": -11.449762344360352, "global_step": 413663, "epoch": 2462} {"train_loss": -12.476158142089844, "global_step": 413664, "epoch": 2462} {"train_loss": -11.709802627563477, "global_step": 413665, "epoch": 2462} {"train_loss": -12.108743667602539, "global_step": 413666, "epoch": 2462} {"train_loss": -11.961055755615234, "global_step": 413667, "epoch": 2462} {"train_loss": -11.867753982543945, "global_step": 413668, "epoch": 2462} {"train_loss": -12.041935920715332, "global_step": 413669, "epoch": 2462} {"train_loss": -11.70407772064209, "global_step": 413670, "epoch": 2462} {"train_loss": -11.924593925476074, "global_step": 413671, "epoch": 2462} {"train_loss": -11.549980163574219, "global_step": 413672, "epoch": 2462} {"train_loss": -12.17657470703125, "global_step": 413673, "epoch": 2462} {"train_loss": -11.436624526977539, "global_step": 413674, "epoch": 2462} {"train_loss": -12.532255172729492, "global_step": 413675, "epoch": 2462} {"train_loss": -10.86589241027832, "global_step": 413676, "epoch": 2462} {"train_loss": -12.047359466552734, "global_step": 413677, "epoch": 2462} {"train_loss": -11.68407154083252, "global_step": 413678, "epoch": 2462} {"train_loss": -11.796066284179688, "global_step": 413679, "epoch": 2462} {"train_loss": -11.565547943115234, "global_step": 413680, "epoch": 2462} {"train_loss": -11.84020709991455, "global_step": 413681, "epoch": 2462} {"train_loss": -11.455740928649902, "global_step": 413682, "epoch": 2462} {"train_loss": -11.82165813446045, "global_step": 413683, "epoch": 2462} {"train_loss": -11.52897834777832, "global_step": 413684, "epoch": 2462} {"train_loss": -11.743915557861328, "global_step": 413685, "epoch": 2462} {"train_loss": -12.12338924407959, "global_step": 413686, "epoch": 2462} {"train_loss": -11.299762725830078, "global_step": 413687, "epoch": 2462} {"train_loss": -11.951313018798828, "global_step": 413688, "epoch": 2462} {"train_loss": -11.400263786315918, "global_step": 413689, "epoch": 2462} {"train_loss": -12.169126510620117, "global_step": 413690, "epoch": 2462} {"train_loss": -12.000753402709961, "global_step": 413691, "epoch": 2462} {"train_loss": -12.332796096801758, "global_step": 413692, "epoch": 2462} {"train_loss": -11.761282920837402, "global_step": 413693, "epoch": 2462} {"train_loss": -12.491279602050781, "global_step": 413694, "epoch": 2462} {"train_loss": -11.95353889465332, "global_step": 413695, "epoch": 2462} {"train_loss": -12.150994300842285, "global_step": 413696, "epoch": 2462} {"train_loss": -12.109345436096191, "global_step": 413697, "epoch": 2462} {"train_loss": -12.268648147583008, "global_step": 413698, "epoch": 2462} {"train_loss": -12.02686882019043, "global_step": 413699, "epoch": 2462} {"train_loss": -12.408266067504883, "global_step": 413700, "epoch": 2462} {"train_loss": -12.101847648620605, "global_step": 413701, "epoch": 2462} {"train_loss": -12.347253799438477, "global_step": 413702, "epoch": 2462} {"train_loss": -12.17737865447998, "global_step": 413703, "epoch": 2462} {"train_loss": -12.670225143432617, "global_step": 413704, "epoch": 2462} {"train_loss": -12.405258178710938, "global_step": 413705, "epoch": 2462} {"train_loss": -12.601465225219727, "global_step": 413706, "epoch": 2462} {"train_loss": -12.596949577331543, "global_step": 413707, "epoch": 2462} {"train_loss": -12.468893051147461, "global_step": 413708, "epoch": 2462} {"train_loss": -12.575630187988281, "global_step": 413709, "epoch": 2462} {"train_loss": -12.516767501831055, "global_step": 413710, "epoch": 2462} {"train_loss": -12.375575065612793, "global_step": 413711, "epoch": 2462} {"train_loss": -12.338272094726562, "global_step": 413712, "epoch": 2462} {"train_loss": -12.615467071533203, "global_step": 413713, "epoch": 2462} {"train_loss": -12.424748420715332, "global_step": 413714, "epoch": 2462} {"train_loss": -12.403970718383789, "global_step": 413715, "epoch": 2462} {"train_loss": -12.620800018310547, "global_step": 413716, "epoch": 2462} {"train_loss": -12.637371063232422, "global_step": 413717, "epoch": 2462} {"train_loss": -12.370469093322754, "global_step": 413718, "epoch": 2462} {"train_loss": -12.592490196228027, "global_step": 413719, "epoch": 2462} {"train_loss": -12.403326988220215, "global_step": 413720, "epoch": 2462} {"train_loss": -12.459680557250977, "global_step": 413721, "epoch": 2462} {"train_loss": -12.540842056274414, "global_step": 413722, "epoch": 2462} {"train_loss": -12.469812393188477, "global_step": 413723, "epoch": 2462} {"train_loss": -12.534866333007812, "global_step": 413724, "epoch": 2462} {"train_loss": -12.724270820617676, "global_step": 413725, "epoch": 2462} {"train_loss": -12.453239440917969, "global_step": 413726, "epoch": 2462} {"train_loss": -12.651798248291016, "global_step": 413727, "epoch": 2462} {"train_loss": -12.474952697753906, "global_step": 413728, "epoch": 2462} {"train_loss": -12.66086196899414, "global_step": 413729, "epoch": 2462} {"train_loss": -12.641952514648438, "global_step": 413730, "epoch": 2462} {"train_loss": -12.463438034057617, "global_step": 413731, "epoch": 2462} {"train_loss": -12.575326919555664, "global_step": 413732, "epoch": 2462} {"train_loss": -12.409584045410156, "global_step": 413733, "epoch": 2462} {"train_loss": -12.710302352905273, "global_step": 413734, "epoch": 2462} {"train_loss": -12.38528060913086, "global_step": 413735, "epoch": 2462} {"train_loss": -12.545170783996582, "global_step": 413736, "epoch": 2462} {"train_loss": -12.568161964416504, "global_step": 413737, "epoch": 2462} {"train_loss": -12.450462341308594, "global_step": 413738, "epoch": 2462} {"train_loss": -12.666605949401855, "global_step": 413739, "epoch": 2462} {"train_loss": -12.695640563964844, "global_step": 413740, "epoch": 2462} {"train_loss": -12.820440292358398, "global_step": 413741, "epoch": 2462} {"train_loss": -12.602396965026855, "global_step": 413742, "epoch": 2462} {"train_loss": -12.731090545654297, "global_step": 413743, "epoch": 2462} {"train_loss": -12.532341003417969, "global_step": 413744, "epoch": 2462} {"train_loss": -12.668206214904785, "global_step": 413745, "epoch": 2462} {"train_loss": -12.728979110717773, "global_step": 413746, "epoch": 2462} {"train_loss": -12.678661346435547, "global_step": 413747, "epoch": 2462} {"train_loss": -12.697105407714844, "global_step": 413748, "epoch": 2462} {"train_loss": -12.272130012512207, "global_step": 413749, "epoch": 2462} {"train_loss": -12.31002140045166, "global_step": 413750, "epoch": 2462} {"train_loss": -12.589821815490723, "global_step": 413751, "epoch": 2462} {"train_loss": -12.179725646972656, "global_step": 413752, "epoch": 2462} {"train_loss": -12.204296112060547, "global_step": 413753, "epoch": 2462} {"train_loss": -12.618640899658203, "global_step": 413754, "epoch": 2462} {"train_loss": -12.365702629089355, "global_step": 413755, "epoch": 2462} {"train_loss": -12.359125137329102, "global_step": 413756, "epoch": 2462} {"train_loss": -11.938138008117676, "global_step": 413757, "epoch": 2462} {"train_loss": -12.436637878417969, "global_step": 413758, "epoch": 2462} {"train_loss": -12.619308471679688, "global_step": 413759, "epoch": 2462} {"train_loss": -12.149782180786133, "global_step": 413760, "epoch": 2462} {"train_loss": -11.932266235351562, "global_step": 413761, "epoch": 2462} {"train_loss": -12.673297882080078, "global_step": 413762, "epoch": 2462} {"train_loss": -12.065248489379883, "global_step": 413763, "epoch": 2462} {"train_loss": -12.307245254516602, "global_step": 413764, "epoch": 2462} {"train_loss": -12.487236976623535, "global_step": 413765, "epoch": 2462} {"train_loss": -12.424842834472656, "global_step": 413766, "epoch": 2462} {"train_loss": -12.733028411865234, "global_step": 413767, "epoch": 2462} {"train_loss": -12.409384727478027, "global_step": 413768, "epoch": 2462} {"train_loss": -12.63176155090332, "global_step": 413769, "epoch": 2462} {"train_loss": -12.28364372253418, "global_step": 413770, "epoch": 2462} {"train_loss": -12.598063468933105, "global_step": 413771, "epoch": 2462} {"train_loss": -12.333696365356445, "global_step": 413772, "epoch": 2462} {"train_loss": -12.554810523986816, "global_step": 413773, "epoch": 2462} {"train_loss": -12.370577812194824, "global_step": 413774, "epoch": 2462} {"train_loss": -12.51520824432373, "global_step": 413775, "epoch": 2462} {"train_loss": -12.423751831054688, "global_step": 413776, "epoch": 2462} {"train_loss": -12.364225387573242, "global_step": 413777, "epoch": 2462} {"train_loss": -12.576099395751953, "global_step": 413778, "epoch": 2462} {"train_loss": -12.326250076293945, "global_step": 413779, "epoch": 2462} {"train_loss": -12.588298797607422, "global_step": 413780, "epoch": 2462} {"train_loss": -12.505874633789062, "global_step": 413781, "epoch": 2462} {"train_loss": -12.048500061035156, "global_step": 413782, "epoch": 2462} {"train_loss": -12.139436449323382, "global_step": 413783, "epoch": 2462, "val_loss": 303266.875} {"train_loss": -12.610013961791992, "global_step": 413784, "epoch": 2463} {"train_loss": -11.482951164245605, "global_step": 413785, "epoch": 2463} {"train_loss": -10.33881950378418, "global_step": 413786, "epoch": 2463} {"train_loss": -12.112213134765625, "global_step": 413787, "epoch": 2463} {"train_loss": -12.14531135559082, "global_step": 413788, "epoch": 2463} {"train_loss": -10.448834419250488, "global_step": 413789, "epoch": 2463} {"train_loss": -11.986652374267578, "global_step": 413790, "epoch": 2463} {"train_loss": -11.570011138916016, "global_step": 413791, "epoch": 2463} {"train_loss": -11.40285873413086, "global_step": 413792, "epoch": 2463} {"train_loss": -12.232423782348633, "global_step": 413793, "epoch": 2463} {"train_loss": -10.310693740844727, "global_step": 413794, "epoch": 2463} {"train_loss": -10.643966674804688, "global_step": 413795, "epoch": 2463} {"train_loss": -11.118012428283691, "global_step": 413796, "epoch": 2463} {"train_loss": -9.69766902923584, "global_step": 413797, "epoch": 2463} {"train_loss": -10.29475212097168, "global_step": 413798, "epoch": 2463} {"train_loss": -10.14410400390625, "global_step": 413799, "epoch": 2463} {"train_loss": -10.422479629516602, "global_step": 413800, "epoch": 2463} {"train_loss": -11.872136116027832, "global_step": 413801, "epoch": 2463} {"train_loss": -10.7063570022583, "global_step": 413802, "epoch": 2463} {"train_loss": -11.397027969360352, "global_step": 413803, "epoch": 2463} {"train_loss": -11.517414093017578, "global_step": 413804, "epoch": 2463} {"train_loss": -10.331544876098633, "global_step": 413805, "epoch": 2463} {"train_loss": -12.272907257080078, "global_step": 413806, "epoch": 2463} {"train_loss": -11.571744918823242, "global_step": 413807, "epoch": 2463} {"train_loss": -11.693583488464355, "global_step": 413808, "epoch": 2463} {"train_loss": -12.106976509094238, "global_step": 413809, "epoch": 2463} {"train_loss": -11.496293067932129, "global_step": 413810, "epoch": 2463} {"train_loss": -11.741148948669434, "global_step": 413811, "epoch": 2463} {"train_loss": -11.819682121276855, "global_step": 413812, "epoch": 2463} {"train_loss": -12.050317764282227, "global_step": 413813, "epoch": 2463} {"train_loss": -11.650583267211914, "global_step": 413814, "epoch": 2463} {"train_loss": -11.895889282226562, "global_step": 413815, "epoch": 2463} {"train_loss": -11.475235939025879, "global_step": 413816, "epoch": 2463} {"train_loss": -11.900325775146484, "global_step": 413817, "epoch": 2463} {"train_loss": -11.696635246276855, "global_step": 413818, "epoch": 2463} {"train_loss": -11.927453994750977, "global_step": 413819, "epoch": 2463} {"train_loss": -11.873786926269531, "global_step": 413820, "epoch": 2463} {"train_loss": -11.625158309936523, "global_step": 413821, "epoch": 2463} {"train_loss": -12.395753860473633, "global_step": 413822, "epoch": 2463} {"train_loss": -11.90394401550293, "global_step": 413823, "epoch": 2463} {"train_loss": -12.401252746582031, "global_step": 413824, "epoch": 2463} {"train_loss": -11.771119117736816, "global_step": 413825, "epoch": 2463} {"train_loss": -12.478104591369629, "global_step": 413826, "epoch": 2463} {"train_loss": -12.296263694763184, "global_step": 413827, "epoch": 2463} {"train_loss": -12.179908752441406, "global_step": 413828, "epoch": 2463} {"train_loss": -12.532976150512695, "global_step": 413829, "epoch": 2463} {"train_loss": -12.068756103515625, "global_step": 413830, "epoch": 2463} {"train_loss": -12.41683578491211, "global_step": 413831, "epoch": 2463} {"train_loss": -12.575003623962402, "global_step": 413832, "epoch": 2463} {"train_loss": -12.338594436645508, "global_step": 413833, "epoch": 2463} {"train_loss": -12.557184219360352, "global_step": 413834, "epoch": 2463} {"train_loss": -12.5166597366333, "global_step": 413835, "epoch": 2463} {"train_loss": -12.285294532775879, "global_step": 413836, "epoch": 2463} {"train_loss": -12.65545654296875, "global_step": 413837, "epoch": 2463} {"train_loss": -12.336023330688477, "global_step": 413838, "epoch": 2463} {"train_loss": -12.537303924560547, "global_step": 413839, "epoch": 2463} {"train_loss": -12.153787612915039, "global_step": 413840, "epoch": 2463} {"train_loss": -12.355956077575684, "global_step": 413841, "epoch": 2463} {"train_loss": -12.529549598693848, "global_step": 413842, "epoch": 2463} {"train_loss": -12.208415031433105, "global_step": 413843, "epoch": 2463} {"train_loss": -12.452130317687988, "global_step": 413844, "epoch": 2463} {"train_loss": -12.290197372436523, "global_step": 413845, "epoch": 2463} {"train_loss": -12.247180938720703, "global_step": 413846, "epoch": 2463} {"train_loss": -12.118988990783691, "global_step": 413847, "epoch": 2463} {"train_loss": -12.200141906738281, "global_step": 413848, "epoch": 2463} {"train_loss": -12.245658874511719, "global_step": 413849, "epoch": 2463} {"train_loss": -12.384891510009766, "global_step": 413850, "epoch": 2463} {"train_loss": -12.512371063232422, "global_step": 413851, "epoch": 2463} {"train_loss": -12.421918869018555, "global_step": 413852, "epoch": 2463} {"train_loss": -12.46938705444336, "global_step": 413853, "epoch": 2463} {"train_loss": -12.542691230773926, "global_step": 413854, "epoch": 2463} {"train_loss": -12.64093017578125, "global_step": 413855, "epoch": 2463} {"train_loss": -12.48850154876709, "global_step": 413856, "epoch": 2463} {"train_loss": -12.396349906921387, "global_step": 413857, "epoch": 2463} {"train_loss": -12.687883377075195, "global_step": 413858, "epoch": 2463} {"train_loss": -12.785221099853516, "global_step": 413859, "epoch": 2463} {"train_loss": -12.501910209655762, "global_step": 413860, "epoch": 2463} {"train_loss": -12.527953147888184, "global_step": 413861, "epoch": 2463} {"train_loss": -12.665225982666016, "global_step": 413862, "epoch": 2463} {"train_loss": -12.437378883361816, "global_step": 413863, "epoch": 2463} {"train_loss": -12.498191833496094, "global_step": 413864, "epoch": 2463} {"train_loss": -12.716960906982422, "global_step": 413865, "epoch": 2463} {"train_loss": -12.34689712524414, "global_step": 413866, "epoch": 2463} {"train_loss": -12.415578842163086, "global_step": 413867, "epoch": 2463} {"train_loss": -11.946334838867188, "global_step": 413868, "epoch": 2463} {"train_loss": -12.6862154006958, "global_step": 413869, "epoch": 2463} {"train_loss": -12.232484817504883, "global_step": 413870, "epoch": 2463} {"train_loss": -12.181100845336914, "global_step": 413871, "epoch": 2463} {"train_loss": -12.476648330688477, "global_step": 413872, "epoch": 2463} {"train_loss": -12.16041088104248, "global_step": 413873, "epoch": 2463} {"train_loss": -12.630565643310547, "global_step": 413874, "epoch": 2463} {"train_loss": -12.084829330444336, "global_step": 413875, "epoch": 2463} {"train_loss": -12.528427124023438, "global_step": 413876, "epoch": 2463} {"train_loss": -12.663835525512695, "global_step": 413877, "epoch": 2463} {"train_loss": -12.406126022338867, "global_step": 413878, "epoch": 2463} {"train_loss": -12.95121955871582, "global_step": 413879, "epoch": 2463} {"train_loss": -12.160284042358398, "global_step": 413880, "epoch": 2463} {"train_loss": -12.595193862915039, "global_step": 413881, "epoch": 2463} {"train_loss": -12.66464614868164, "global_step": 413882, "epoch": 2463} {"train_loss": -12.22989273071289, "global_step": 413883, "epoch": 2463} {"train_loss": -12.363107681274414, "global_step": 413884, "epoch": 2463} {"train_loss": -11.96922492980957, "global_step": 413885, "epoch": 2463} {"train_loss": -12.086071014404297, "global_step": 413886, "epoch": 2463} {"train_loss": -12.325858116149902, "global_step": 413887, "epoch": 2463} {"train_loss": -12.172718048095703, "global_step": 413888, "epoch": 2463} {"train_loss": -11.996459007263184, "global_step": 413889, "epoch": 2463} {"train_loss": -11.957939147949219, "global_step": 413890, "epoch": 2463} {"train_loss": -12.313703536987305, "global_step": 413891, "epoch": 2463} {"train_loss": -11.749670028686523, "global_step": 413892, "epoch": 2463} {"train_loss": -12.518797874450684, "global_step": 413893, "epoch": 2463} {"train_loss": -12.305398941040039, "global_step": 413894, "epoch": 2463} {"train_loss": -12.298993110656738, "global_step": 413895, "epoch": 2463} {"train_loss": -12.252437591552734, "global_step": 413896, "epoch": 2463} {"train_loss": -12.572261810302734, "global_step": 413897, "epoch": 2463} {"train_loss": -11.914363861083984, "global_step": 413898, "epoch": 2463} {"train_loss": -12.610054016113281, "global_step": 413899, "epoch": 2463} {"train_loss": -12.529720306396484, "global_step": 413900, "epoch": 2463} {"train_loss": -12.360350608825684, "global_step": 413901, "epoch": 2463} {"train_loss": -12.63525390625, "global_step": 413902, "epoch": 2463} {"train_loss": -12.249457359313965, "global_step": 413903, "epoch": 2463} {"train_loss": -12.252854347229004, "global_step": 413904, "epoch": 2463} {"train_loss": -12.578709602355957, "global_step": 413905, "epoch": 2463} {"train_loss": -11.63973331451416, "global_step": 413906, "epoch": 2463} {"train_loss": -12.138019561767578, "global_step": 413907, "epoch": 2463} {"train_loss": -12.12362003326416, "global_step": 413908, "epoch": 2463} {"train_loss": -11.920795440673828, "global_step": 413909, "epoch": 2463} {"train_loss": -11.781271934509277, "global_step": 413910, "epoch": 2463} {"train_loss": -12.540238380432129, "global_step": 413911, "epoch": 2463} {"train_loss": -11.54670524597168, "global_step": 413912, "epoch": 2463} {"train_loss": -11.878538131713867, "global_step": 413913, "epoch": 2463} {"train_loss": -11.467321395874023, "global_step": 413914, "epoch": 2463} {"train_loss": -9.65711784362793, "global_step": 413915, "epoch": 2463} {"train_loss": -11.82557201385498, "global_step": 413916, "epoch": 2463} {"train_loss": -9.220834732055664, "global_step": 413917, "epoch": 2463} {"train_loss": -11.597480773925781, "global_step": 413918, "epoch": 2463} {"train_loss": -10.749615669250488, "global_step": 413919, "epoch": 2463} {"train_loss": -9.797969818115234, "global_step": 413920, "epoch": 2463} {"train_loss": -10.858193397521973, "global_step": 413921, "epoch": 2463} {"train_loss": -11.016888618469238, "global_step": 413922, "epoch": 2463} {"train_loss": -11.19243049621582, "global_step": 413923, "epoch": 2463} {"train_loss": -10.66018295288086, "global_step": 413924, "epoch": 2463} {"train_loss": -11.985133171081543, "global_step": 413925, "epoch": 2463} {"train_loss": -9.58627986907959, "global_step": 413926, "epoch": 2463} {"train_loss": -11.660449981689453, "global_step": 413927, "epoch": 2463} {"train_loss": -10.893342971801758, "global_step": 413928, "epoch": 2463} {"train_loss": -11.202095031738281, "global_step": 413929, "epoch": 2463} {"train_loss": -11.974329948425293, "global_step": 413930, "epoch": 2463} {"train_loss": -11.270391464233398, "global_step": 413931, "epoch": 2463} {"train_loss": -11.648602485656738, "global_step": 413932, "epoch": 2463} {"train_loss": -11.49974250793457, "global_step": 413933, "epoch": 2463} {"train_loss": -11.825714111328125, "global_step": 413934, "epoch": 2463} {"train_loss": -11.551944732666016, "global_step": 413935, "epoch": 2463} {"train_loss": -11.767098426818848, "global_step": 413936, "epoch": 2463} {"train_loss": -11.62700080871582, "global_step": 413937, "epoch": 2463} {"train_loss": -12.069602966308594, "global_step": 413938, "epoch": 2463} {"train_loss": -11.638795852661133, "global_step": 413939, "epoch": 2463} {"train_loss": -12.01214599609375, "global_step": 413940, "epoch": 2463} {"train_loss": -11.985675811767578, "global_step": 413941, "epoch": 2463} {"train_loss": -11.736600875854492, "global_step": 413942, "epoch": 2463} {"train_loss": -12.047764778137207, "global_step": 413943, "epoch": 2463} {"train_loss": -11.390665054321289, "global_step": 413944, "epoch": 2463} {"train_loss": -12.428915023803711, "global_step": 413945, "epoch": 2463} {"train_loss": -11.24555778503418, "global_step": 413946, "epoch": 2463} {"train_loss": -12.1171875, "global_step": 413947, "epoch": 2463} {"train_loss": -11.597997665405273, "global_step": 413948, "epoch": 2463} {"train_loss": -11.995595932006836, "global_step": 413949, "epoch": 2463} {"train_loss": -12.008195877075195, "global_step": 413950, "epoch": 2463} {"train_loss": -11.909851920037042, "global_step": 413951, "epoch": 2463, "val_loss": 306158.9375} {"train_loss": -11.670143127441406, "global_step": 413952, "epoch": 2464} {"train_loss": -11.745939254760742, "global_step": 413953, "epoch": 2464} {"train_loss": -11.610246658325195, "global_step": 413954, "epoch": 2464} {"train_loss": -12.11648941040039, "global_step": 413955, "epoch": 2464} {"train_loss": -11.770668029785156, "global_step": 413956, "epoch": 2464} {"train_loss": -11.837823867797852, "global_step": 413957, "epoch": 2464} {"train_loss": -12.323379516601562, "global_step": 413958, "epoch": 2464} {"train_loss": -11.823686599731445, "global_step": 413959, "epoch": 2464} {"train_loss": -12.16114616394043, "global_step": 413960, "epoch": 2464} {"train_loss": -12.252339363098145, "global_step": 413961, "epoch": 2464} {"train_loss": -12.25341796875, "global_step": 413962, "epoch": 2464} {"train_loss": -11.855436325073242, "global_step": 413963, "epoch": 2464} {"train_loss": -11.705785751342773, "global_step": 413964, "epoch": 2464} {"train_loss": -12.302499771118164, "global_step": 413965, "epoch": 2464} {"train_loss": -12.19926643371582, "global_step": 413966, "epoch": 2464} {"train_loss": -11.901739120483398, "global_step": 413967, "epoch": 2464} {"train_loss": -12.558382034301758, "global_step": 413968, "epoch": 2464} {"train_loss": -11.892461776733398, "global_step": 413969, "epoch": 2464} {"train_loss": -12.571664810180664, "global_step": 413970, "epoch": 2464} {"train_loss": -12.274192810058594, "global_step": 413971, "epoch": 2464} {"train_loss": -12.058791160583496, "global_step": 413972, "epoch": 2464} {"train_loss": -12.296135902404785, "global_step": 413973, "epoch": 2464} {"train_loss": -12.213407516479492, "global_step": 413974, "epoch": 2464} {"train_loss": -12.513237953186035, "global_step": 413975, "epoch": 2464} {"train_loss": -12.337556838989258, "global_step": 413976, "epoch": 2464} {"train_loss": -12.326652526855469, "global_step": 413977, "epoch": 2464} {"train_loss": -12.289155006408691, "global_step": 413978, "epoch": 2464} {"train_loss": -12.28916072845459, "global_step": 413979, "epoch": 2464} {"train_loss": -12.276329040527344, "global_step": 413980, "epoch": 2464} {"train_loss": -12.209355354309082, "global_step": 413981, "epoch": 2464} {"train_loss": -12.328574180603027, "global_step": 413982, "epoch": 2464} {"train_loss": -12.235673904418945, "global_step": 413983, "epoch": 2464} {"train_loss": -12.238922119140625, "global_step": 413984, "epoch": 2464} {"train_loss": -12.656707763671875, "global_step": 413985, "epoch": 2464} {"train_loss": -12.066837310791016, "global_step": 413986, "epoch": 2464} {"train_loss": -12.055362701416016, "global_step": 413987, "epoch": 2464} {"train_loss": -12.378355026245117, "global_step": 413988, "epoch": 2464} {"train_loss": -11.994478225708008, "global_step": 413989, "epoch": 2464} {"train_loss": -12.29481315612793, "global_step": 413990, "epoch": 2464} {"train_loss": -11.675817489624023, "global_step": 413991, "epoch": 2464} {"train_loss": -12.148465156555176, "global_step": 413992, "epoch": 2464} {"train_loss": -12.251972198486328, "global_step": 413993, "epoch": 2464} {"train_loss": -11.418475151062012, "global_step": 413994, "epoch": 2464} {"train_loss": -12.462974548339844, "global_step": 413995, "epoch": 2464} {"train_loss": -10.99587631225586, "global_step": 413996, "epoch": 2464} {"train_loss": -11.7066068649292, "global_step": 413997, "epoch": 2464} {"train_loss": -12.077638626098633, "global_step": 413998, "epoch": 2464} {"train_loss": -10.517280578613281, "global_step": 413999, "epoch": 2464} {"train_loss": -12.498540878295898, "global_step": 414000, "epoch": 2464} {"train_loss": -10.736810684204102, "global_step": 414001, "epoch": 2464} {"train_loss": -12.107576370239258, "global_step": 414002, "epoch": 2464} {"train_loss": -11.094173431396484, "global_step": 414003, "epoch": 2464} {"train_loss": -11.822083473205566, "global_step": 414004, "epoch": 2464} {"train_loss": -11.898629188537598, "global_step": 414005, "epoch": 2464} {"train_loss": -11.153305053710938, "global_step": 414006, "epoch": 2464} {"train_loss": -12.595523834228516, "global_step": 414007, "epoch": 2464} {"train_loss": -11.190424919128418, "global_step": 414008, "epoch": 2464} {"train_loss": -11.858139038085938, "global_step": 414009, "epoch": 2464} {"train_loss": -11.17738151550293, "global_step": 414010, "epoch": 2464} {"train_loss": -11.691987991333008, "global_step": 414011, "epoch": 2464} {"train_loss": -12.08674430847168, "global_step": 414012, "epoch": 2464} {"train_loss": -11.311249732971191, "global_step": 414013, "epoch": 2464} {"train_loss": -12.080952644348145, "global_step": 414014, "epoch": 2464} {"train_loss": -10.825736999511719, "global_step": 414015, "epoch": 2464} {"train_loss": -12.372329711914062, "global_step": 414016, "epoch": 2464} {"train_loss": -11.384968757629395, "global_step": 414017, "epoch": 2464} {"train_loss": -12.051530838012695, "global_step": 414018, "epoch": 2464} {"train_loss": -11.118144989013672, "global_step": 414019, "epoch": 2464} {"train_loss": -11.771025657653809, "global_step": 414020, "epoch": 2464} {"train_loss": -12.043840408325195, "global_step": 414021, "epoch": 2464} {"train_loss": -11.659979820251465, "global_step": 414022, "epoch": 2464} {"train_loss": -12.575189590454102, "global_step": 414023, "epoch": 2464} {"train_loss": -12.105947494506836, "global_step": 414024, "epoch": 2464} {"train_loss": -12.321097373962402, "global_step": 414025, "epoch": 2464} {"train_loss": -12.166728019714355, "global_step": 414026, "epoch": 2464} {"train_loss": -12.235465049743652, "global_step": 414027, "epoch": 2464} {"train_loss": -12.338586807250977, "global_step": 414028, "epoch": 2464} {"train_loss": -12.239873886108398, "global_step": 414029, "epoch": 2464} {"train_loss": -12.249079704284668, "global_step": 414030, "epoch": 2464} {"train_loss": -12.405525207519531, "global_step": 414031, "epoch": 2464} {"train_loss": -12.18417739868164, "global_step": 414032, "epoch": 2464} {"train_loss": -12.393817901611328, "global_step": 414033, "epoch": 2464} {"train_loss": -12.415508270263672, "global_step": 414034, "epoch": 2464} {"train_loss": -12.39654541015625, "global_step": 414035, "epoch": 2464} {"train_loss": -12.221498489379883, "global_step": 414036, "epoch": 2464} {"train_loss": -12.583056449890137, "global_step": 414037, "epoch": 2464} {"train_loss": -12.430622100830078, "global_step": 414038, "epoch": 2464} {"train_loss": -12.548116683959961, "global_step": 414039, "epoch": 2464} {"train_loss": -12.447135925292969, "global_step": 414040, "epoch": 2464} {"train_loss": -12.327777862548828, "global_step": 414041, "epoch": 2464} {"train_loss": -12.66653060913086, "global_step": 414042, "epoch": 2464} {"train_loss": -12.471830368041992, "global_step": 414043, "epoch": 2464} {"train_loss": -12.666023254394531, "global_step": 414044, "epoch": 2464} {"train_loss": -12.62344741821289, "global_step": 414045, "epoch": 2464} {"train_loss": -12.664398193359375, "global_step": 414046, "epoch": 2464} {"train_loss": -12.421138763427734, "global_step": 414047, "epoch": 2464} {"train_loss": -12.449597358703613, "global_step": 414048, "epoch": 2464} {"train_loss": -12.452523231506348, "global_step": 414049, "epoch": 2464} {"train_loss": -12.561551094055176, "global_step": 414050, "epoch": 2464} {"train_loss": -12.930739402770996, "global_step": 414051, "epoch": 2464} {"train_loss": -12.665802001953125, "global_step": 414052, "epoch": 2464} {"train_loss": -12.600420951843262, "global_step": 414053, "epoch": 2464} {"train_loss": -12.631489753723145, "global_step": 414054, "epoch": 2464} {"train_loss": -12.480491638183594, "global_step": 414055, "epoch": 2464} {"train_loss": -12.710206985473633, "global_step": 414056, "epoch": 2464} {"train_loss": -12.332569122314453, "global_step": 414057, "epoch": 2464} {"train_loss": -12.750213623046875, "global_step": 414058, "epoch": 2464} {"train_loss": -12.743061065673828, "global_step": 414059, "epoch": 2464} {"train_loss": -12.744918823242188, "global_step": 414060, "epoch": 2464} {"train_loss": -12.801613807678223, "global_step": 414061, "epoch": 2464} {"train_loss": -12.709157943725586, "global_step": 414062, "epoch": 2464} {"train_loss": -12.920475006103516, "global_step": 414063, "epoch": 2464} {"train_loss": -12.620442390441895, "global_step": 414064, "epoch": 2464} {"train_loss": -12.573345184326172, "global_step": 414065, "epoch": 2464} {"train_loss": -12.482437133789062, "global_step": 414066, "epoch": 2464} {"train_loss": -12.39073371887207, "global_step": 414067, "epoch": 2464} {"train_loss": -12.382156372070312, "global_step": 414068, "epoch": 2464} {"train_loss": -12.711689949035645, "global_step": 414069, "epoch": 2464} {"train_loss": -12.566020965576172, "global_step": 414070, "epoch": 2464} {"train_loss": -12.215972900390625, "global_step": 414071, "epoch": 2464} {"train_loss": -12.910444259643555, "global_step": 414072, "epoch": 2464} {"train_loss": -12.442499160766602, "global_step": 414073, "epoch": 2464} {"train_loss": -12.228643417358398, "global_step": 414074, "epoch": 2464} {"train_loss": -12.539640426635742, "global_step": 414075, "epoch": 2464} {"train_loss": -12.70375919342041, "global_step": 414076, "epoch": 2464} {"train_loss": -12.712878227233887, "global_step": 414077, "epoch": 2464} {"train_loss": -12.55644702911377, "global_step": 414078, "epoch": 2464} {"train_loss": -12.617864608764648, "global_step": 414079, "epoch": 2464} {"train_loss": -12.655017852783203, "global_step": 414080, "epoch": 2464} {"train_loss": -12.853111267089844, "global_step": 414081, "epoch": 2464} {"train_loss": -12.78567123413086, "global_step": 414082, "epoch": 2464} {"train_loss": -12.850415229797363, "global_step": 414083, "epoch": 2464} {"train_loss": -12.715309143066406, "global_step": 414084, "epoch": 2464} {"train_loss": -12.772560119628906, "global_step": 414085, "epoch": 2464} {"train_loss": -12.624011039733887, "global_step": 414086, "epoch": 2464} {"train_loss": -12.618435859680176, "global_step": 414087, "epoch": 2464} {"train_loss": -12.66592788696289, "global_step": 414088, "epoch": 2464} {"train_loss": -12.700348854064941, "global_step": 414089, "epoch": 2464} {"train_loss": -12.673425674438477, "global_step": 414090, "epoch": 2464} {"train_loss": -12.530884742736816, "global_step": 414091, "epoch": 2464} {"train_loss": -12.719839096069336, "global_step": 414092, "epoch": 2464} {"train_loss": -12.791990280151367, "global_step": 414093, "epoch": 2464} {"train_loss": -12.808509826660156, "global_step": 414094, "epoch": 2464} {"train_loss": -12.609318733215332, "global_step": 414095, "epoch": 2464} {"train_loss": -12.573123931884766, "global_step": 414096, "epoch": 2464} {"train_loss": -12.827802658081055, "global_step": 414097, "epoch": 2464} {"train_loss": -12.953632354736328, "global_step": 414098, "epoch": 2464} {"train_loss": -12.91336441040039, "global_step": 414099, "epoch": 2464} {"train_loss": -12.898307800292969, "global_step": 414100, "epoch": 2464} {"train_loss": -12.737297058105469, "global_step": 414101, "epoch": 2464} {"train_loss": -12.771950721740723, "global_step": 414102, "epoch": 2464} {"train_loss": -12.624582290649414, "global_step": 414103, "epoch": 2464} {"train_loss": -12.86601734161377, "global_step": 414104, "epoch": 2464} {"train_loss": -12.590641021728516, "global_step": 414105, "epoch": 2464} {"train_loss": -12.747138977050781, "global_step": 414106, "epoch": 2464} {"train_loss": -12.924893379211426, "global_step": 414107, "epoch": 2464} {"train_loss": -12.708128929138184, "global_step": 414108, "epoch": 2464} {"train_loss": -12.131925582885742, "global_step": 414109, "epoch": 2464} {"train_loss": -11.775546073913574, "global_step": 414110, "epoch": 2464} {"train_loss": -11.217535018920898, "global_step": 414111, "epoch": 2464} {"train_loss": -12.110652923583984, "global_step": 414112, "epoch": 2464} {"train_loss": -12.32242202758789, "global_step": 414113, "epoch": 2464} {"train_loss": -11.7275972366333, "global_step": 414114, "epoch": 2464} {"train_loss": -12.085933685302734, "global_step": 414115, "epoch": 2464} {"train_loss": -12.270318984985352, "global_step": 414116, "epoch": 2464} {"train_loss": -12.293781280517578, "global_step": 414117, "epoch": 2464} {"train_loss": -10.641101837158203, "global_step": 414118, "epoch": 2464} {"train_loss": -12.257414692924137, "global_step": 414119, "epoch": 2464, "val_loss": 306155.3125} {"train_loss": -12.389165878295898, "global_step": 414120, "epoch": 2465} {"train_loss": -10.433687210083008, "global_step": 414121, "epoch": 2465} {"train_loss": -9.079191207885742, "global_step": 414122, "epoch": 2465} {"train_loss": -10.149273872375488, "global_step": 414123, "epoch": 2465} {"train_loss": -6.158346176147461, "global_step": 414124, "epoch": 2465} {"train_loss": -7.411942958831787, "global_step": 414125, "epoch": 2465} {"train_loss": -8.819831848144531, "global_step": 414126, "epoch": 2465} {"train_loss": -8.755136489868164, "global_step": 414127, "epoch": 2465} {"train_loss": -9.628841400146484, "global_step": 414128, "epoch": 2465} {"train_loss": -9.356321334838867, "global_step": 414129, "epoch": 2465} {"train_loss": -8.856481552124023, "global_step": 414130, "epoch": 2465} {"train_loss": -9.713907241821289, "global_step": 414131, "epoch": 2465} {"train_loss": -9.619089126586914, "global_step": 414132, "epoch": 2465} {"train_loss": -9.00980281829834, "global_step": 414133, "epoch": 2465} {"train_loss": -10.394492149353027, "global_step": 414134, "epoch": 2465} {"train_loss": -9.209575653076172, "global_step": 414135, "epoch": 2465} {"train_loss": -10.818556785583496, "global_step": 414136, "epoch": 2465} {"train_loss": -8.170357704162598, "global_step": 414137, "epoch": 2465} {"train_loss": -8.876507759094238, "global_step": 414138, "epoch": 2465} {"train_loss": -10.353273391723633, "global_step": 414139, "epoch": 2465} {"train_loss": -9.623115539550781, "global_step": 414140, "epoch": 2465} {"train_loss": -10.173301696777344, "global_step": 414141, "epoch": 2465} {"train_loss": -9.61745548248291, "global_step": 414142, "epoch": 2465} {"train_loss": -8.884425163269043, "global_step": 414143, "epoch": 2465} {"train_loss": -10.221036911010742, "global_step": 414144, "epoch": 2465} {"train_loss": -9.380624771118164, "global_step": 414145, "epoch": 2465} {"train_loss": -11.181623458862305, "global_step": 414146, "epoch": 2465} {"train_loss": -9.515314102172852, "global_step": 414147, "epoch": 2465} {"train_loss": -11.267770767211914, "global_step": 414148, "epoch": 2465} {"train_loss": -9.108837127685547, "global_step": 414149, "epoch": 2465} {"train_loss": -11.235126495361328, "global_step": 414150, "epoch": 2465} {"train_loss": -9.842422485351562, "global_step": 414151, "epoch": 2465} {"train_loss": -10.605051040649414, "global_step": 414152, "epoch": 2465} {"train_loss": -10.573196411132812, "global_step": 414153, "epoch": 2465} {"train_loss": -10.321310043334961, "global_step": 414154, "epoch": 2465} {"train_loss": -10.366045951843262, "global_step": 414155, "epoch": 2465} {"train_loss": -10.755992889404297, "global_step": 414156, "epoch": 2465} {"train_loss": -10.935037612915039, "global_step": 414157, "epoch": 2465} {"train_loss": -10.479776382446289, "global_step": 414158, "epoch": 2465} {"train_loss": -11.048327445983887, "global_step": 414159, "epoch": 2465} {"train_loss": -10.713525772094727, "global_step": 414160, "epoch": 2465} {"train_loss": -11.003868103027344, "global_step": 414161, "epoch": 2465} {"train_loss": -11.338640213012695, "global_step": 414162, "epoch": 2465} {"train_loss": -11.238520622253418, "global_step": 414163, "epoch": 2465} {"train_loss": -11.202018737792969, "global_step": 414164, "epoch": 2465} {"train_loss": -11.776145935058594, "global_step": 414165, "epoch": 2465} {"train_loss": -10.74948787689209, "global_step": 414166, "epoch": 2465} {"train_loss": -11.815009117126465, "global_step": 414167, "epoch": 2465} {"train_loss": -11.02891731262207, "global_step": 414168, "epoch": 2465} {"train_loss": -11.562784194946289, "global_step": 414169, "epoch": 2465} {"train_loss": -11.528279304504395, "global_step": 414170, "epoch": 2465} {"train_loss": -11.515236854553223, "global_step": 414171, "epoch": 2465} {"train_loss": -11.60053825378418, "global_step": 414172, "epoch": 2465} {"train_loss": -11.811368942260742, "global_step": 414173, "epoch": 2465} {"train_loss": -11.877087593078613, "global_step": 414174, "epoch": 2465} {"train_loss": -11.32246208190918, "global_step": 414175, "epoch": 2465} {"train_loss": -12.152043342590332, "global_step": 414176, "epoch": 2465} {"train_loss": -11.853987693786621, "global_step": 414177, "epoch": 2465} {"train_loss": -11.576776504516602, "global_step": 414178, "epoch": 2465} {"train_loss": -12.1219482421875, "global_step": 414179, "epoch": 2465} {"train_loss": -11.991872787475586, "global_step": 414180, "epoch": 2465} {"train_loss": -11.446847915649414, "global_step": 414181, "epoch": 2465} {"train_loss": -11.746658325195312, "global_step": 414182, "epoch": 2465} {"train_loss": -11.759990692138672, "global_step": 414183, "epoch": 2465} {"train_loss": -11.749288558959961, "global_step": 414184, "epoch": 2465} {"train_loss": -11.511520385742188, "global_step": 414185, "epoch": 2465} {"train_loss": -12.320928573608398, "global_step": 414186, "epoch": 2465} {"train_loss": -11.666637420654297, "global_step": 414187, "epoch": 2465} {"train_loss": -11.99311637878418, "global_step": 414188, "epoch": 2465} {"train_loss": -11.865863800048828, "global_step": 414189, "epoch": 2465} {"train_loss": -11.932250022888184, "global_step": 414190, "epoch": 2465} {"train_loss": -12.163272857666016, "global_step": 414191, "epoch": 2465} {"train_loss": -12.029667854309082, "global_step": 414192, "epoch": 2465} {"train_loss": -11.885034561157227, "global_step": 414193, "epoch": 2465} {"train_loss": -12.316987991333008, "global_step": 414194, "epoch": 2465} {"train_loss": -12.107585906982422, "global_step": 414195, "epoch": 2465} {"train_loss": -12.097038269042969, "global_step": 414196, "epoch": 2465} {"train_loss": -11.921728134155273, "global_step": 414197, "epoch": 2465} {"train_loss": -12.055273056030273, "global_step": 414198, "epoch": 2465} {"train_loss": -12.093402862548828, "global_step": 414199, "epoch": 2465} {"train_loss": -12.01522445678711, "global_step": 414200, "epoch": 2465} {"train_loss": -12.180459022521973, "global_step": 414201, "epoch": 2465} {"train_loss": -12.146867752075195, "global_step": 414202, "epoch": 2465} {"train_loss": -12.348464965820312, "global_step": 414203, "epoch": 2465} {"train_loss": -12.240690231323242, "global_step": 414204, "epoch": 2465} {"train_loss": -12.361550331115723, "global_step": 414205, "epoch": 2465} {"train_loss": -12.448193550109863, "global_step": 414206, "epoch": 2465} {"train_loss": -12.273653030395508, "global_step": 414207, "epoch": 2465} {"train_loss": -12.223651885986328, "global_step": 414208, "epoch": 2465} {"train_loss": -12.325362205505371, "global_step": 414209, "epoch": 2465} {"train_loss": -12.18990707397461, "global_step": 414210, "epoch": 2465} {"train_loss": -12.305859565734863, "global_step": 414211, "epoch": 2465} {"train_loss": -12.175192832946777, "global_step": 414212, "epoch": 2465} {"train_loss": -12.22886848449707, "global_step": 414213, "epoch": 2465} {"train_loss": -12.385187149047852, "global_step": 414214, "epoch": 2465} {"train_loss": -12.38398551940918, "global_step": 414215, "epoch": 2465} {"train_loss": -12.542448043823242, "global_step": 414216, "epoch": 2465} {"train_loss": -12.1743745803833, "global_step": 414217, "epoch": 2465} {"train_loss": -12.32573127746582, "global_step": 414218, "epoch": 2465} {"train_loss": -12.346084594726562, "global_step": 414219, "epoch": 2465} {"train_loss": -12.452336311340332, "global_step": 414220, "epoch": 2465} {"train_loss": -12.504222869873047, "global_step": 414221, "epoch": 2465} {"train_loss": -12.504504203796387, "global_step": 414222, "epoch": 2465} {"train_loss": -12.54612922668457, "global_step": 414223, "epoch": 2465} {"train_loss": -12.461206436157227, "global_step": 414224, "epoch": 2465} {"train_loss": -12.457133293151855, "global_step": 414225, "epoch": 2465} {"train_loss": -12.52584171295166, "global_step": 414226, "epoch": 2465} {"train_loss": -12.528892517089844, "global_step": 414227, "epoch": 2465} {"train_loss": -12.36253547668457, "global_step": 414228, "epoch": 2465} {"train_loss": -12.363275527954102, "global_step": 414229, "epoch": 2465} {"train_loss": -12.396446228027344, "global_step": 414230, "epoch": 2465} {"train_loss": -12.249639511108398, "global_step": 414231, "epoch": 2465} {"train_loss": -12.598047256469727, "global_step": 414232, "epoch": 2465} {"train_loss": -12.357412338256836, "global_step": 414233, "epoch": 2465} {"train_loss": -12.537248611450195, "global_step": 414234, "epoch": 2465} {"train_loss": -12.478281021118164, "global_step": 414235, "epoch": 2465} {"train_loss": -12.346114158630371, "global_step": 414236, "epoch": 2465} {"train_loss": -12.653124809265137, "global_step": 414237, "epoch": 2465} {"train_loss": -12.500749588012695, "global_step": 414238, "epoch": 2465} {"train_loss": -12.404702186584473, "global_step": 414239, "epoch": 2465} {"train_loss": -12.399412155151367, "global_step": 414240, "epoch": 2465} {"train_loss": -12.465646743774414, "global_step": 414241, "epoch": 2465} {"train_loss": -12.559928894042969, "global_step": 414242, "epoch": 2465} {"train_loss": -12.541062355041504, "global_step": 414243, "epoch": 2465} {"train_loss": -12.762497901916504, "global_step": 414244, "epoch": 2465} {"train_loss": -12.262696266174316, "global_step": 414245, "epoch": 2465} {"train_loss": -12.59405517578125, "global_step": 414246, "epoch": 2465} {"train_loss": -12.496953010559082, "global_step": 414247, "epoch": 2465} {"train_loss": -12.516561508178711, "global_step": 414248, "epoch": 2465} {"train_loss": -12.657752990722656, "global_step": 414249, "epoch": 2465} {"train_loss": -12.633477210998535, "global_step": 414250, "epoch": 2465} {"train_loss": -12.516373634338379, "global_step": 414251, "epoch": 2465} {"train_loss": -12.390241622924805, "global_step": 414252, "epoch": 2465} {"train_loss": -12.722518920898438, "global_step": 414253, "epoch": 2465} {"train_loss": -12.373472213745117, "global_step": 414254, "epoch": 2465} {"train_loss": -12.754718780517578, "global_step": 414255, "epoch": 2465} {"train_loss": -12.432243347167969, "global_step": 414256, "epoch": 2465} {"train_loss": -12.55681037902832, "global_step": 414257, "epoch": 2465} {"train_loss": -12.592455863952637, "global_step": 414258, "epoch": 2465} {"train_loss": -12.474807739257812, "global_step": 414259, "epoch": 2465} {"train_loss": -12.627382278442383, "global_step": 414260, "epoch": 2465} {"train_loss": -12.619585037231445, "global_step": 414261, "epoch": 2465} {"train_loss": -12.684881210327148, "global_step": 414262, "epoch": 2465} {"train_loss": -12.583019256591797, "global_step": 414263, "epoch": 2465} {"train_loss": -12.76078987121582, "global_step": 414264, "epoch": 2465} {"train_loss": -12.661914825439453, "global_step": 414265, "epoch": 2465} {"train_loss": -12.557404518127441, "global_step": 414266, "epoch": 2465} {"train_loss": -12.520186424255371, "global_step": 414267, "epoch": 2465} {"train_loss": -12.65948486328125, "global_step": 414268, "epoch": 2465} {"train_loss": -12.901254653930664, "global_step": 414269, "epoch": 2465} {"train_loss": -12.841537475585938, "global_step": 414270, "epoch": 2465} {"train_loss": -12.59414291381836, "global_step": 414271, "epoch": 2465} {"train_loss": -12.851874351501465, "global_step": 414272, "epoch": 2465} {"train_loss": -12.728643417358398, "global_step": 414273, "epoch": 2465} {"train_loss": -12.657207489013672, "global_step": 414274, "epoch": 2465} {"train_loss": -12.574477195739746, "global_step": 414275, "epoch": 2465} {"train_loss": -12.417502403259277, "global_step": 414276, "epoch": 2465} {"train_loss": -12.394021987915039, "global_step": 414277, "epoch": 2465} {"train_loss": -12.846186637878418, "global_step": 414278, "epoch": 2465} {"train_loss": -12.579610824584961, "global_step": 414279, "epoch": 2465} {"train_loss": -12.823827743530273, "global_step": 414280, "epoch": 2465} {"train_loss": -12.609098434448242, "global_step": 414281, "epoch": 2465} {"train_loss": -12.781488418579102, "global_step": 414282, "epoch": 2465} {"train_loss": -12.699041366577148, "global_step": 414283, "epoch": 2465} {"train_loss": -12.96629810333252, "global_step": 414284, "epoch": 2465} {"train_loss": -12.690933227539062, "global_step": 414285, "epoch": 2465} {"train_loss": -12.750604629516602, "global_step": 414286, "epoch": 2465} {"train_loss": -11.673621066978999, "global_step": 414287, "epoch": 2465, "val_loss": 300324.28125, "train_action_mse_error": 1.9632878303527832} {"train_loss": -12.796774864196777, "global_step": 414288, "epoch": 2466} {"train_loss": -12.711515426635742, "global_step": 414289, "epoch": 2466} {"train_loss": -12.342203140258789, "global_step": 414290, "epoch": 2466} {"train_loss": -12.651464462280273, "global_step": 414291, "epoch": 2466} {"train_loss": -12.621866226196289, "global_step": 414292, "epoch": 2466} {"train_loss": -12.658834457397461, "global_step": 414293, "epoch": 2466} {"train_loss": -12.703653335571289, "global_step": 414294, "epoch": 2466} {"train_loss": -12.556868553161621, "global_step": 414295, "epoch": 2466} {"train_loss": -12.618675231933594, "global_step": 414296, "epoch": 2466} {"train_loss": -12.726970672607422, "global_step": 414297, "epoch": 2466} {"train_loss": -12.58357048034668, "global_step": 414298, "epoch": 2466} {"train_loss": -12.490876197814941, "global_step": 414299, "epoch": 2466} {"train_loss": -12.796836853027344, "global_step": 414300, "epoch": 2466} {"train_loss": -12.830611228942871, "global_step": 414301, "epoch": 2466} {"train_loss": -12.750188827514648, "global_step": 414302, "epoch": 2466} {"train_loss": -12.860576629638672, "global_step": 414303, "epoch": 2466} {"train_loss": -12.885852813720703, "global_step": 414304, "epoch": 2466} {"train_loss": -12.447332382202148, "global_step": 414305, "epoch": 2466} {"train_loss": -13.001228332519531, "global_step": 414306, "epoch": 2466} {"train_loss": -12.862773895263672, "global_step": 414307, "epoch": 2466} {"train_loss": -12.276668548583984, "global_step": 414308, "epoch": 2466} {"train_loss": -12.282709121704102, "global_step": 414309, "epoch": 2466} {"train_loss": -12.407269477844238, "global_step": 414310, "epoch": 2466} {"train_loss": -12.595382690429688, "global_step": 414311, "epoch": 2466} {"train_loss": -12.072620391845703, "global_step": 414312, "epoch": 2466} {"train_loss": -11.546838760375977, "global_step": 414313, "epoch": 2466} {"train_loss": -10.738981246948242, "global_step": 414314, "epoch": 2466} {"train_loss": -12.823616981506348, "global_step": 414315, "epoch": 2466} {"train_loss": -9.737064361572266, "global_step": 414316, "epoch": 2466} {"train_loss": -11.251609802246094, "global_step": 414317, "epoch": 2466} {"train_loss": -11.501354217529297, "global_step": 414318, "epoch": 2466} {"train_loss": -11.039773941040039, "global_step": 414319, "epoch": 2466} {"train_loss": -9.91283893585205, "global_step": 414320, "epoch": 2466} {"train_loss": -8.930213928222656, "global_step": 414321, "epoch": 2466} {"train_loss": -8.96058464050293, "global_step": 414322, "epoch": 2466} {"train_loss": -9.252418518066406, "global_step": 414323, "epoch": 2466} {"train_loss": -9.323403358459473, "global_step": 414324, "epoch": 2466} {"train_loss": -10.31551456451416, "global_step": 414325, "epoch": 2466} {"train_loss": -10.479453086853027, "global_step": 414326, "epoch": 2466} {"train_loss": -9.589725494384766, "global_step": 414327, "epoch": 2466} {"train_loss": -10.024359703063965, "global_step": 414328, "epoch": 2466} {"train_loss": -9.847861289978027, "global_step": 414329, "epoch": 2466} {"train_loss": -10.709749221801758, "global_step": 414330, "epoch": 2466} {"train_loss": -11.256714820861816, "global_step": 414331, "epoch": 2466} {"train_loss": -11.277783393859863, "global_step": 414332, "epoch": 2466} {"train_loss": -11.745708465576172, "global_step": 414333, "epoch": 2466} {"train_loss": -10.699728965759277, "global_step": 414334, "epoch": 2466} {"train_loss": -11.437637329101562, "global_step": 414335, "epoch": 2466} {"train_loss": -11.090190887451172, "global_step": 414336, "epoch": 2466} {"train_loss": -11.500276565551758, "global_step": 414337, "epoch": 2466} {"train_loss": -11.403192520141602, "global_step": 414338, "epoch": 2466} {"train_loss": -11.13355827331543, "global_step": 414339, "epoch": 2466} {"train_loss": -11.322815895080566, "global_step": 414340, "epoch": 2466} {"train_loss": -11.166048049926758, "global_step": 414341, "epoch": 2466} {"train_loss": -11.015129089355469, "global_step": 414342, "epoch": 2466} {"train_loss": -10.646041870117188, "global_step": 414343, "epoch": 2466} {"train_loss": -11.271154403686523, "global_step": 414344, "epoch": 2466} {"train_loss": -11.497383117675781, "global_step": 414345, "epoch": 2466} {"train_loss": -9.978622436523438, "global_step": 414346, "epoch": 2466} {"train_loss": -11.556544303894043, "global_step": 414347, "epoch": 2466} {"train_loss": -10.449140548706055, "global_step": 414348, "epoch": 2466} {"train_loss": -11.107304573059082, "global_step": 414349, "epoch": 2466} {"train_loss": -11.070594787597656, "global_step": 414350, "epoch": 2466} {"train_loss": -10.579116821289062, "global_step": 414351, "epoch": 2466} {"train_loss": -10.812084197998047, "global_step": 414352, "epoch": 2466} {"train_loss": -11.353479385375977, "global_step": 414353, "epoch": 2466} {"train_loss": -10.661033630371094, "global_step": 414354, "epoch": 2466} {"train_loss": -11.715410232543945, "global_step": 414355, "epoch": 2466} {"train_loss": -10.858986854553223, "global_step": 414356, "epoch": 2466} {"train_loss": -11.766290664672852, "global_step": 414357, "epoch": 2466} {"train_loss": -11.624894142150879, "global_step": 414358, "epoch": 2466} {"train_loss": -11.827398300170898, "global_step": 414359, "epoch": 2466} {"train_loss": -10.935066223144531, "global_step": 414360, "epoch": 2466} {"train_loss": -10.944375991821289, "global_step": 414361, "epoch": 2466} {"train_loss": -11.007795333862305, "global_step": 414362, "epoch": 2466} {"train_loss": -11.878504753112793, "global_step": 414363, "epoch": 2466} {"train_loss": -10.925619125366211, "global_step": 414364, "epoch": 2466} {"train_loss": -11.504242897033691, "global_step": 414365, "epoch": 2466} {"train_loss": -11.237829208374023, "global_step": 414366, "epoch": 2466} {"train_loss": -11.3228759765625, "global_step": 414367, "epoch": 2466} {"train_loss": -11.768964767456055, "global_step": 414368, "epoch": 2466} {"train_loss": -11.746930122375488, "global_step": 414369, "epoch": 2466} {"train_loss": -11.152423858642578, "global_step": 414370, "epoch": 2466} {"train_loss": -11.954536437988281, "global_step": 414371, "epoch": 2466} {"train_loss": -11.106359481811523, "global_step": 414372, "epoch": 2466} {"train_loss": -11.431220054626465, "global_step": 414373, "epoch": 2466} {"train_loss": -11.612532615661621, "global_step": 414374, "epoch": 2466} {"train_loss": -11.788010597229004, "global_step": 414375, "epoch": 2466} {"train_loss": -11.70226001739502, "global_step": 414376, "epoch": 2466} {"train_loss": -11.649478912353516, "global_step": 414377, "epoch": 2466} {"train_loss": -12.143928527832031, "global_step": 414378, "epoch": 2466} {"train_loss": -11.844205856323242, "global_step": 414379, "epoch": 2466} {"train_loss": -11.952857971191406, "global_step": 414380, "epoch": 2466} {"train_loss": -11.846845626831055, "global_step": 414381, "epoch": 2466} {"train_loss": -11.714990615844727, "global_step": 414382, "epoch": 2466} {"train_loss": -11.99189567565918, "global_step": 414383, "epoch": 2466} {"train_loss": -12.207226753234863, "global_step": 414384, "epoch": 2466} {"train_loss": -12.063871383666992, "global_step": 414385, "epoch": 2466} {"train_loss": -12.011636734008789, "global_step": 414386, "epoch": 2466} {"train_loss": -11.951967239379883, "global_step": 414387, "epoch": 2466} {"train_loss": -12.215234756469727, "global_step": 414388, "epoch": 2466} {"train_loss": -11.957012176513672, "global_step": 414389, "epoch": 2466} {"train_loss": -12.235793113708496, "global_step": 414390, "epoch": 2466} {"train_loss": -12.192770004272461, "global_step": 414391, "epoch": 2466} {"train_loss": -12.028063774108887, "global_step": 414392, "epoch": 2466} {"train_loss": -12.395389556884766, "global_step": 414393, "epoch": 2466} {"train_loss": -12.404155731201172, "global_step": 414394, "epoch": 2466} {"train_loss": -12.423261642456055, "global_step": 414395, "epoch": 2466} {"train_loss": -12.19180679321289, "global_step": 414396, "epoch": 2466} {"train_loss": -12.46491813659668, "global_step": 414397, "epoch": 2466} {"train_loss": -12.2821683883667, "global_step": 414398, "epoch": 2466} {"train_loss": -12.413877487182617, "global_step": 414399, "epoch": 2466} {"train_loss": -12.108820915222168, "global_step": 414400, "epoch": 2466} {"train_loss": -12.242240905761719, "global_step": 414401, "epoch": 2466} {"train_loss": -12.386923789978027, "global_step": 414402, "epoch": 2466} {"train_loss": -12.276971817016602, "global_step": 414403, "epoch": 2466} {"train_loss": -12.37691593170166, "global_step": 414404, "epoch": 2466} {"train_loss": -12.112534523010254, "global_step": 414405, "epoch": 2466} {"train_loss": -12.642589569091797, "global_step": 414406, "epoch": 2466} {"train_loss": -12.176595687866211, "global_step": 414407, "epoch": 2466} {"train_loss": -12.443714141845703, "global_step": 414408, "epoch": 2466} {"train_loss": -12.361082077026367, "global_step": 414409, "epoch": 2466} {"train_loss": -12.28781509399414, "global_step": 414410, "epoch": 2466} {"train_loss": -12.308113098144531, "global_step": 414411, "epoch": 2466} {"train_loss": -12.618947982788086, "global_step": 414412, "epoch": 2466} {"train_loss": -12.43597412109375, "global_step": 414413, "epoch": 2466} {"train_loss": -12.324207305908203, "global_step": 414414, "epoch": 2466} {"train_loss": -12.434700012207031, "global_step": 414415, "epoch": 2466} {"train_loss": -12.515985488891602, "global_step": 414416, "epoch": 2466} {"train_loss": -12.375377655029297, "global_step": 414417, "epoch": 2466} {"train_loss": -12.537694931030273, "global_step": 414418, "epoch": 2466} {"train_loss": -12.724241256713867, "global_step": 414419, "epoch": 2466} {"train_loss": -12.6036376953125, "global_step": 414420, "epoch": 2466} {"train_loss": -12.536334991455078, "global_step": 414421, "epoch": 2466} {"train_loss": -12.526115417480469, "global_step": 414422, "epoch": 2466} {"train_loss": -12.590911865234375, "global_step": 414423, "epoch": 2466} {"train_loss": -12.518112182617188, "global_step": 414424, "epoch": 2466} {"train_loss": -12.612937927246094, "global_step": 414425, "epoch": 2466} {"train_loss": -12.41693115234375, "global_step": 414426, "epoch": 2466} {"train_loss": -12.69331169128418, "global_step": 414427, "epoch": 2466} {"train_loss": -12.583020210266113, "global_step": 414428, "epoch": 2466} {"train_loss": -12.438983917236328, "global_step": 414429, "epoch": 2466} {"train_loss": -12.555602073669434, "global_step": 414430, "epoch": 2466} {"train_loss": -12.441145896911621, "global_step": 414431, "epoch": 2466} {"train_loss": -12.667470932006836, "global_step": 414432, "epoch": 2466} {"train_loss": -12.462916374206543, "global_step": 414433, "epoch": 2466} {"train_loss": -12.573989868164062, "global_step": 414434, "epoch": 2466} {"train_loss": -12.48027229309082, "global_step": 414435, "epoch": 2466} {"train_loss": -12.621265411376953, "global_step": 414436, "epoch": 2466} {"train_loss": -12.24496841430664, "global_step": 414437, "epoch": 2466} {"train_loss": -12.578832626342773, "global_step": 414438, "epoch": 2466} {"train_loss": -12.510894775390625, "global_step": 414439, "epoch": 2466} {"train_loss": -12.659642219543457, "global_step": 414440, "epoch": 2466} {"train_loss": -12.240754127502441, "global_step": 414441, "epoch": 2466} {"train_loss": -12.364599227905273, "global_step": 414442, "epoch": 2466} {"train_loss": -12.09516716003418, "global_step": 414443, "epoch": 2466} {"train_loss": -12.469714164733887, "global_step": 414444, "epoch": 2466} {"train_loss": -12.119466781616211, "global_step": 414445, "epoch": 2466} {"train_loss": -11.653068542480469, "global_step": 414446, "epoch": 2466} {"train_loss": -12.030683517456055, "global_step": 414447, "epoch": 2466} {"train_loss": -11.8782958984375, "global_step": 414448, "epoch": 2466} {"train_loss": -12.509241104125977, "global_step": 414449, "epoch": 2466} {"train_loss": -11.841099739074707, "global_step": 414450, "epoch": 2466} {"train_loss": -12.660844802856445, "global_step": 414451, "epoch": 2466} {"train_loss": -12.218280792236328, "global_step": 414452, "epoch": 2466} {"train_loss": -12.203262329101562, "global_step": 414453, "epoch": 2466} {"train_loss": -12.398786544799805, "global_step": 414454, "epoch": 2466} {"train_loss": -11.857365653628396, "global_step": 414455, "epoch": 2466, "val_loss": 302772.21875} {"train_loss": -12.22901725769043, "global_step": 414456, "epoch": 2467} {"train_loss": -12.15196704864502, "global_step": 414457, "epoch": 2467} {"train_loss": -12.30847454071045, "global_step": 414458, "epoch": 2467} {"train_loss": -11.378805160522461, "global_step": 414459, "epoch": 2467} {"train_loss": -11.374049186706543, "global_step": 414460, "epoch": 2467} {"train_loss": -11.441411972045898, "global_step": 414461, "epoch": 2467} {"train_loss": -11.093856811523438, "global_step": 414462, "epoch": 2467} {"train_loss": -10.776029586791992, "global_step": 414463, "epoch": 2467} {"train_loss": -10.970967292785645, "global_step": 414464, "epoch": 2467} {"train_loss": -10.578238487243652, "global_step": 414465, "epoch": 2467} {"train_loss": -10.4631929397583, "global_step": 414466, "epoch": 2467} {"train_loss": -10.488676071166992, "global_step": 414467, "epoch": 2467} {"train_loss": -11.22319507598877, "global_step": 414468, "epoch": 2467} {"train_loss": -11.159294128417969, "global_step": 414469, "epoch": 2467} {"train_loss": -11.730218887329102, "global_step": 414470, "epoch": 2467} {"train_loss": -11.373734474182129, "global_step": 414471, "epoch": 2467} {"train_loss": -11.037019729614258, "global_step": 414472, "epoch": 2467} {"train_loss": -12.178078651428223, "global_step": 414473, "epoch": 2467} {"train_loss": -10.91061019897461, "global_step": 414474, "epoch": 2467} {"train_loss": -10.901511192321777, "global_step": 414475, "epoch": 2467} {"train_loss": -10.779552459716797, "global_step": 414476, "epoch": 2467} {"train_loss": -11.743810653686523, "global_step": 414477, "epoch": 2467} {"train_loss": -10.074365615844727, "global_step": 414478, "epoch": 2467} {"train_loss": -9.739922523498535, "global_step": 414479, "epoch": 2467} {"train_loss": -10.539861679077148, "global_step": 414480, "epoch": 2467} {"train_loss": -10.334787368774414, "global_step": 414481, "epoch": 2467} {"train_loss": -9.417171478271484, "global_step": 414482, "epoch": 2467} {"train_loss": -11.173625946044922, "global_step": 414483, "epoch": 2467} {"train_loss": -9.452888488769531, "global_step": 414484, "epoch": 2467} {"train_loss": -11.445987701416016, "global_step": 414485, "epoch": 2467} {"train_loss": -10.540914535522461, "global_step": 414486, "epoch": 2467} {"train_loss": -11.573493003845215, "global_step": 414487, "epoch": 2467} {"train_loss": -10.724161148071289, "global_step": 414488, "epoch": 2467} {"train_loss": -11.384273529052734, "global_step": 414489, "epoch": 2467} {"train_loss": -10.911918640136719, "global_step": 414490, "epoch": 2467} {"train_loss": -10.213533401489258, "global_step": 414491, "epoch": 2467} {"train_loss": -11.183904647827148, "global_step": 414492, "epoch": 2467} {"train_loss": -10.59800910949707, "global_step": 414493, "epoch": 2467} {"train_loss": -11.633689880371094, "global_step": 414494, "epoch": 2467} {"train_loss": -11.133474349975586, "global_step": 414495, "epoch": 2467} {"train_loss": -11.325749397277832, "global_step": 414496, "epoch": 2467} {"train_loss": -11.274006843566895, "global_step": 414497, "epoch": 2467} {"train_loss": -11.224742889404297, "global_step": 414498, "epoch": 2467} {"train_loss": -11.877699851989746, "global_step": 414499, "epoch": 2467} {"train_loss": -11.294300079345703, "global_step": 414500, "epoch": 2467} {"train_loss": -11.995037078857422, "global_step": 414501, "epoch": 2467} {"train_loss": -11.785895347595215, "global_step": 414502, "epoch": 2467} {"train_loss": -11.793500900268555, "global_step": 414503, "epoch": 2467} {"train_loss": -12.032096862792969, "global_step": 414504, "epoch": 2467} {"train_loss": -11.909975051879883, "global_step": 414505, "epoch": 2467} {"train_loss": -12.201895713806152, "global_step": 414506, "epoch": 2467} {"train_loss": -11.965007781982422, "global_step": 414507, "epoch": 2467} {"train_loss": -12.060182571411133, "global_step": 414508, "epoch": 2467} {"train_loss": -12.103840827941895, "global_step": 414509, "epoch": 2467} {"train_loss": -12.218642234802246, "global_step": 414510, "epoch": 2467} {"train_loss": -12.19438648223877, "global_step": 414511, "epoch": 2467} {"train_loss": -12.077436447143555, "global_step": 414512, "epoch": 2467} {"train_loss": -12.246967315673828, "global_step": 414513, "epoch": 2467} {"train_loss": -11.998926162719727, "global_step": 414514, "epoch": 2467} {"train_loss": -12.18336296081543, "global_step": 414515, "epoch": 2467} {"train_loss": -11.75006103515625, "global_step": 414516, "epoch": 2467} {"train_loss": -12.269242286682129, "global_step": 414517, "epoch": 2467} {"train_loss": -12.11864185333252, "global_step": 414518, "epoch": 2467} {"train_loss": -11.910601615905762, "global_step": 414519, "epoch": 2467} {"train_loss": -12.1529541015625, "global_step": 414520, "epoch": 2467} {"train_loss": -12.25341796875, "global_step": 414521, "epoch": 2467} {"train_loss": -12.281914710998535, "global_step": 414522, "epoch": 2467} {"train_loss": -11.9156494140625, "global_step": 414523, "epoch": 2467} {"train_loss": -12.037071228027344, "global_step": 414524, "epoch": 2467} {"train_loss": -12.15670108795166, "global_step": 414525, "epoch": 2467} {"train_loss": -12.212677955627441, "global_step": 414526, "epoch": 2467} {"train_loss": -12.274686813354492, "global_step": 414527, "epoch": 2467} {"train_loss": -11.764642715454102, "global_step": 414528, "epoch": 2467} {"train_loss": -12.423563003540039, "global_step": 414529, "epoch": 2467} {"train_loss": -11.836847305297852, "global_step": 414530, "epoch": 2467} {"train_loss": -12.174797058105469, "global_step": 414531, "epoch": 2467} {"train_loss": -11.876380920410156, "global_step": 414532, "epoch": 2467} {"train_loss": -12.042034149169922, "global_step": 414533, "epoch": 2467} {"train_loss": -12.165582656860352, "global_step": 414534, "epoch": 2467} {"train_loss": -11.64044189453125, "global_step": 414535, "epoch": 2467} {"train_loss": -12.304144859313965, "global_step": 414536, "epoch": 2467} {"train_loss": -11.700410842895508, "global_step": 414537, "epoch": 2467} {"train_loss": -11.877214431762695, "global_step": 414538, "epoch": 2467} {"train_loss": -11.769218444824219, "global_step": 414539, "epoch": 2467} {"train_loss": -12.074228286743164, "global_step": 414540, "epoch": 2467} {"train_loss": -12.073297500610352, "global_step": 414541, "epoch": 2467} {"train_loss": -11.99985122680664, "global_step": 414542, "epoch": 2467} {"train_loss": -11.975652694702148, "global_step": 414543, "epoch": 2467} {"train_loss": -12.111444473266602, "global_step": 414544, "epoch": 2467} {"train_loss": -12.14179801940918, "global_step": 414545, "epoch": 2467} {"train_loss": -12.105140686035156, "global_step": 414546, "epoch": 2467} {"train_loss": -11.737104415893555, "global_step": 414547, "epoch": 2467} {"train_loss": -12.425548553466797, "global_step": 414548, "epoch": 2467} {"train_loss": -11.8464937210083, "global_step": 414549, "epoch": 2467} {"train_loss": -12.228978157043457, "global_step": 414550, "epoch": 2467} {"train_loss": -12.030220985412598, "global_step": 414551, "epoch": 2467} {"train_loss": -12.284364700317383, "global_step": 414552, "epoch": 2467} {"train_loss": -12.015510559082031, "global_step": 414553, "epoch": 2467} {"train_loss": -12.31117057800293, "global_step": 414554, "epoch": 2467} {"train_loss": -12.255138397216797, "global_step": 414555, "epoch": 2467} {"train_loss": -12.395650863647461, "global_step": 414556, "epoch": 2467} {"train_loss": -12.112930297851562, "global_step": 414557, "epoch": 2467} {"train_loss": -12.55385971069336, "global_step": 414558, "epoch": 2467} {"train_loss": -12.225776672363281, "global_step": 414559, "epoch": 2467} {"train_loss": -12.459396362304688, "global_step": 414560, "epoch": 2467} {"train_loss": -12.363207817077637, "global_step": 414561, "epoch": 2467} {"train_loss": -12.104326248168945, "global_step": 414562, "epoch": 2467} {"train_loss": -12.393365859985352, "global_step": 414563, "epoch": 2467} {"train_loss": -12.119518280029297, "global_step": 414564, "epoch": 2467} {"train_loss": -12.472928047180176, "global_step": 414565, "epoch": 2467} {"train_loss": -12.302018165588379, "global_step": 414566, "epoch": 2467} {"train_loss": -12.298538208007812, "global_step": 414567, "epoch": 2467} {"train_loss": -12.416131019592285, "global_step": 414568, "epoch": 2467} {"train_loss": -12.639677047729492, "global_step": 414569, "epoch": 2467} {"train_loss": -12.335479736328125, "global_step": 414570, "epoch": 2467} {"train_loss": -12.215322494506836, "global_step": 414571, "epoch": 2467} {"train_loss": -12.477110862731934, "global_step": 414572, "epoch": 2467} {"train_loss": -12.396584510803223, "global_step": 414573, "epoch": 2467} {"train_loss": -12.597599029541016, "global_step": 414574, "epoch": 2467} {"train_loss": -12.311795234680176, "global_step": 414575, "epoch": 2467} {"train_loss": -12.466583251953125, "global_step": 414576, "epoch": 2467} {"train_loss": -12.5960111618042, "global_step": 414577, "epoch": 2467} {"train_loss": -11.9198579788208, "global_step": 414578, "epoch": 2467} {"train_loss": -12.662101745605469, "global_step": 414579, "epoch": 2467} {"train_loss": -12.167022705078125, "global_step": 414580, "epoch": 2467} {"train_loss": -11.8338623046875, "global_step": 414581, "epoch": 2467} {"train_loss": -12.405487060546875, "global_step": 414582, "epoch": 2467} {"train_loss": -11.794148445129395, "global_step": 414583, "epoch": 2467} {"train_loss": -11.309980392456055, "global_step": 414584, "epoch": 2467} {"train_loss": -12.209236145019531, "global_step": 414585, "epoch": 2467} {"train_loss": -10.868989944458008, "global_step": 414586, "epoch": 2467} {"train_loss": -11.928606033325195, "global_step": 414587, "epoch": 2467} {"train_loss": -11.864151954650879, "global_step": 414588, "epoch": 2467} {"train_loss": -11.42007064819336, "global_step": 414589, "epoch": 2467} {"train_loss": -11.42371940612793, "global_step": 414590, "epoch": 2467} {"train_loss": -11.776004791259766, "global_step": 414591, "epoch": 2467} {"train_loss": -11.557291030883789, "global_step": 414592, "epoch": 2467} {"train_loss": -11.750739097595215, "global_step": 414593, "epoch": 2467} {"train_loss": -12.187837600708008, "global_step": 414594, "epoch": 2467} {"train_loss": -11.632759094238281, "global_step": 414595, "epoch": 2467} {"train_loss": -11.931448936462402, "global_step": 414596, "epoch": 2467} {"train_loss": -11.47825813293457, "global_step": 414597, "epoch": 2467} {"train_loss": -12.29139518737793, "global_step": 414598, "epoch": 2467} {"train_loss": -12.228168487548828, "global_step": 414599, "epoch": 2467} {"train_loss": -12.346081733703613, "global_step": 414600, "epoch": 2467} {"train_loss": -12.395587921142578, "global_step": 414601, "epoch": 2467} {"train_loss": -12.593180656433105, "global_step": 414602, "epoch": 2467} {"train_loss": -12.364595413208008, "global_step": 414603, "epoch": 2467} {"train_loss": -12.468259811401367, "global_step": 414604, "epoch": 2467} {"train_loss": -12.128595352172852, "global_step": 414605, "epoch": 2467} {"train_loss": -12.64987850189209, "global_step": 414606, "epoch": 2467} {"train_loss": -12.583780288696289, "global_step": 414607, "epoch": 2467} {"train_loss": -12.268170356750488, "global_step": 414608, "epoch": 2467} {"train_loss": -12.590255737304688, "global_step": 414609, "epoch": 2467} {"train_loss": -12.371883392333984, "global_step": 414610, "epoch": 2467} {"train_loss": -12.462801933288574, "global_step": 414611, "epoch": 2467} {"train_loss": -12.69114875793457, "global_step": 414612, "epoch": 2467} {"train_loss": -12.40469741821289, "global_step": 414613, "epoch": 2467} {"train_loss": -12.374031066894531, "global_step": 414614, "epoch": 2467} {"train_loss": -12.517681121826172, "global_step": 414615, "epoch": 2467} {"train_loss": -12.391597747802734, "global_step": 414616, "epoch": 2467} {"train_loss": -12.506771087646484, "global_step": 414617, "epoch": 2467} {"train_loss": -12.503120422363281, "global_step": 414618, "epoch": 2467} {"train_loss": -12.395206451416016, "global_step": 414619, "epoch": 2467} {"train_loss": -12.227413177490234, "global_step": 414620, "epoch": 2467} {"train_loss": -12.702220916748047, "global_step": 414621, "epoch": 2467} {"train_loss": -12.351932525634766, "global_step": 414622, "epoch": 2467} {"train_loss": -11.857407564208621, "global_step": 414623, "epoch": 2467, "val_loss": 303506.4375} {"train_loss": -12.212714195251465, "global_step": 414624, "epoch": 2468} {"train_loss": -12.190031051635742, "global_step": 414625, "epoch": 2468} {"train_loss": -12.051464080810547, "global_step": 414626, "epoch": 2468} {"train_loss": -12.115796089172363, "global_step": 414627, "epoch": 2468} {"train_loss": -12.481258392333984, "global_step": 414628, "epoch": 2468} {"train_loss": -11.94082260131836, "global_step": 414629, "epoch": 2468} {"train_loss": -12.386430740356445, "global_step": 414630, "epoch": 2468} {"train_loss": -12.293874740600586, "global_step": 414631, "epoch": 2468} {"train_loss": -12.554434776306152, "global_step": 414632, "epoch": 2468} {"train_loss": -12.407264709472656, "global_step": 414633, "epoch": 2468} {"train_loss": -12.524210929870605, "global_step": 414634, "epoch": 2468} {"train_loss": -12.193807601928711, "global_step": 414635, "epoch": 2468} {"train_loss": -12.758079528808594, "global_step": 414636, "epoch": 2468} {"train_loss": -12.41008186340332, "global_step": 414637, "epoch": 2468} {"train_loss": -12.597146034240723, "global_step": 414638, "epoch": 2468} {"train_loss": -12.40542221069336, "global_step": 414639, "epoch": 2468} {"train_loss": -12.68958568572998, "global_step": 414640, "epoch": 2468} {"train_loss": -12.480451583862305, "global_step": 414641, "epoch": 2468} {"train_loss": -12.296710968017578, "global_step": 414642, "epoch": 2468} {"train_loss": -12.664981842041016, "global_step": 414643, "epoch": 2468} {"train_loss": -12.610020637512207, "global_step": 414644, "epoch": 2468} {"train_loss": -12.356935501098633, "global_step": 414645, "epoch": 2468} {"train_loss": -12.494206428527832, "global_step": 414646, "epoch": 2468} {"train_loss": -12.535799980163574, "global_step": 414647, "epoch": 2468} {"train_loss": -12.382755279541016, "global_step": 414648, "epoch": 2468} {"train_loss": -12.549585342407227, "global_step": 414649, "epoch": 2468} {"train_loss": -12.20025634765625, "global_step": 414650, "epoch": 2468} {"train_loss": -12.306295394897461, "global_step": 414651, "epoch": 2468} {"train_loss": -12.233840942382812, "global_step": 414652, "epoch": 2468} {"train_loss": -12.696304321289062, "global_step": 414653, "epoch": 2468} {"train_loss": -12.523755073547363, "global_step": 414654, "epoch": 2468} {"train_loss": -12.333240509033203, "global_step": 414655, "epoch": 2468} {"train_loss": -12.31661605834961, "global_step": 414656, "epoch": 2468} {"train_loss": -12.52961540222168, "global_step": 414657, "epoch": 2468} {"train_loss": -12.50606632232666, "global_step": 414658, "epoch": 2468} {"train_loss": -12.657207489013672, "global_step": 414659, "epoch": 2468} {"train_loss": -12.45925521850586, "global_step": 414660, "epoch": 2468} {"train_loss": -12.584253311157227, "global_step": 414661, "epoch": 2468} {"train_loss": -12.466318130493164, "global_step": 414662, "epoch": 2468} {"train_loss": -12.737366676330566, "global_step": 414663, "epoch": 2468} {"train_loss": -12.313628196716309, "global_step": 414664, "epoch": 2468} {"train_loss": -12.731819152832031, "global_step": 414665, "epoch": 2468} {"train_loss": -12.381603240966797, "global_step": 414666, "epoch": 2468} {"train_loss": -12.110429763793945, "global_step": 414667, "epoch": 2468} {"train_loss": -12.421751022338867, "global_step": 414668, "epoch": 2468} {"train_loss": -12.348639488220215, "global_step": 414669, "epoch": 2468} {"train_loss": -12.383787155151367, "global_step": 414670, "epoch": 2468} {"train_loss": -12.455288887023926, "global_step": 414671, "epoch": 2468} {"train_loss": -12.327866554260254, "global_step": 414672, "epoch": 2468} {"train_loss": -12.132427215576172, "global_step": 414673, "epoch": 2468} {"train_loss": -12.281192779541016, "global_step": 414674, "epoch": 2468} {"train_loss": -12.419035911560059, "global_step": 414675, "epoch": 2468} {"train_loss": -12.092281341552734, "global_step": 414676, "epoch": 2468} {"train_loss": -12.270910263061523, "global_step": 414677, "epoch": 2468} {"train_loss": -12.386817932128906, "global_step": 414678, "epoch": 2468} {"train_loss": -12.144149780273438, "global_step": 414679, "epoch": 2468} {"train_loss": -12.301788330078125, "global_step": 414680, "epoch": 2468} {"train_loss": -12.288374900817871, "global_step": 414681, "epoch": 2468} {"train_loss": -11.698687553405762, "global_step": 414682, "epoch": 2468} {"train_loss": -11.949044227600098, "global_step": 414683, "epoch": 2468} {"train_loss": -12.576011657714844, "global_step": 414684, "epoch": 2468} {"train_loss": -12.435513496398926, "global_step": 414685, "epoch": 2468} {"train_loss": -11.789738655090332, "global_step": 414686, "epoch": 2468} {"train_loss": -12.13576602935791, "global_step": 414687, "epoch": 2468} {"train_loss": -12.429182052612305, "global_step": 414688, "epoch": 2468} {"train_loss": -12.681467056274414, "global_step": 414689, "epoch": 2468} {"train_loss": -12.20140552520752, "global_step": 414690, "epoch": 2468} {"train_loss": -12.385475158691406, "global_step": 414691, "epoch": 2468} {"train_loss": -12.380389213562012, "global_step": 414692, "epoch": 2468} {"train_loss": -12.429153442382812, "global_step": 414693, "epoch": 2468} {"train_loss": -12.478862762451172, "global_step": 414694, "epoch": 2468} {"train_loss": -12.574458122253418, "global_step": 414695, "epoch": 2468} {"train_loss": -12.630199432373047, "global_step": 414696, "epoch": 2468} {"train_loss": -12.559006690979004, "global_step": 414697, "epoch": 2468} {"train_loss": -12.554768562316895, "global_step": 414698, "epoch": 2468} {"train_loss": -13.051994323730469, "global_step": 414699, "epoch": 2468} {"train_loss": -12.379341125488281, "global_step": 414700, "epoch": 2468} {"train_loss": -12.73574447631836, "global_step": 414701, "epoch": 2468} {"train_loss": -12.733024597167969, "global_step": 414702, "epoch": 2468} {"train_loss": -12.814777374267578, "global_step": 414703, "epoch": 2468} {"train_loss": -12.620841979980469, "global_step": 414704, "epoch": 2468} {"train_loss": -12.396583557128906, "global_step": 414705, "epoch": 2468} {"train_loss": -12.261917114257812, "global_step": 414706, "epoch": 2468} {"train_loss": -12.63575267791748, "global_step": 414707, "epoch": 2468} {"train_loss": -11.428874969482422, "global_step": 414708, "epoch": 2468} {"train_loss": -11.77845287322998, "global_step": 414709, "epoch": 2468} {"train_loss": -12.148009300231934, "global_step": 414710, "epoch": 2468} {"train_loss": -12.369829177856445, "global_step": 414711, "epoch": 2468} {"train_loss": -11.873788833618164, "global_step": 414712, "epoch": 2468} {"train_loss": -11.857614517211914, "global_step": 414713, "epoch": 2468} {"train_loss": -12.24343490600586, "global_step": 414714, "epoch": 2468} {"train_loss": -12.500555992126465, "global_step": 414715, "epoch": 2468} {"train_loss": -11.9579496383667, "global_step": 414716, "epoch": 2468} {"train_loss": -11.460739135742188, "global_step": 414717, "epoch": 2468} {"train_loss": -11.830137252807617, "global_step": 414718, "epoch": 2468} {"train_loss": -11.432600021362305, "global_step": 414719, "epoch": 2468} {"train_loss": -10.327041625976562, "global_step": 414720, "epoch": 2468} {"train_loss": -11.76942253112793, "global_step": 414721, "epoch": 2468} {"train_loss": -10.744600296020508, "global_step": 414722, "epoch": 2468} {"train_loss": -10.345014572143555, "global_step": 414723, "epoch": 2468} {"train_loss": -10.534849166870117, "global_step": 414724, "epoch": 2468} {"train_loss": -10.540925979614258, "global_step": 414725, "epoch": 2468} {"train_loss": -10.452116966247559, "global_step": 414726, "epoch": 2468} {"train_loss": -9.287240982055664, "global_step": 414727, "epoch": 2468} {"train_loss": -10.87352180480957, "global_step": 414728, "epoch": 2468} {"train_loss": -7.177481651306152, "global_step": 414729, "epoch": 2468} {"train_loss": -8.680368423461914, "global_step": 414730, "epoch": 2468} {"train_loss": -8.185827255249023, "global_step": 414731, "epoch": 2468} {"train_loss": -7.23126220703125, "global_step": 414732, "epoch": 2468} {"train_loss": -7.505147933959961, "global_step": 414733, "epoch": 2468} {"train_loss": -7.337777137756348, "global_step": 414734, "epoch": 2468} {"train_loss": -8.352306365966797, "global_step": 414735, "epoch": 2468} {"train_loss": -7.963868141174316, "global_step": 414736, "epoch": 2468} {"train_loss": -8.365640640258789, "global_step": 414737, "epoch": 2468} {"train_loss": -8.293919563293457, "global_step": 414738, "epoch": 2468} {"train_loss": -8.363801956176758, "global_step": 414739, "epoch": 2468} {"train_loss": -9.024367332458496, "global_step": 414740, "epoch": 2468} {"train_loss": -8.195938110351562, "global_step": 414741, "epoch": 2468} {"train_loss": -8.419381141662598, "global_step": 414742, "epoch": 2468} {"train_loss": -9.659894943237305, "global_step": 414743, "epoch": 2468} {"train_loss": -9.602853775024414, "global_step": 414744, "epoch": 2468} {"train_loss": -9.78076457977295, "global_step": 414745, "epoch": 2468} {"train_loss": -10.337678909301758, "global_step": 414746, "epoch": 2468} {"train_loss": -9.98261833190918, "global_step": 414747, "epoch": 2468} {"train_loss": -10.232256889343262, "global_step": 414748, "epoch": 2468} {"train_loss": -9.35771369934082, "global_step": 414749, "epoch": 2468} {"train_loss": -9.710289001464844, "global_step": 414750, "epoch": 2468} {"train_loss": -9.948202133178711, "global_step": 414751, "epoch": 2468} {"train_loss": -10.630250930786133, "global_step": 414752, "epoch": 2468} {"train_loss": -10.800655364990234, "global_step": 414753, "epoch": 2468} {"train_loss": -11.250616073608398, "global_step": 414754, "epoch": 2468} {"train_loss": -10.63925552368164, "global_step": 414755, "epoch": 2468} {"train_loss": -10.818849563598633, "global_step": 414756, "epoch": 2468} {"train_loss": -9.978351593017578, "global_step": 414757, "epoch": 2468} {"train_loss": -9.4795560836792, "global_step": 414758, "epoch": 2468} {"train_loss": -10.53266429901123, "global_step": 414759, "epoch": 2468} {"train_loss": -10.473989486694336, "global_step": 414760, "epoch": 2468} {"train_loss": -10.113774299621582, "global_step": 414761, "epoch": 2468} {"train_loss": -10.245505332946777, "global_step": 414762, "epoch": 2468} {"train_loss": -11.398296356201172, "global_step": 414763, "epoch": 2468} {"train_loss": -10.859111785888672, "global_step": 414764, "epoch": 2468} {"train_loss": -11.680944442749023, "global_step": 414765, "epoch": 2468} {"train_loss": -11.498360633850098, "global_step": 414766, "epoch": 2468} {"train_loss": -11.043832778930664, "global_step": 414767, "epoch": 2468} {"train_loss": -10.566034317016602, "global_step": 414768, "epoch": 2468} {"train_loss": -11.53314208984375, "global_step": 414769, "epoch": 2468} {"train_loss": -11.032140731811523, "global_step": 414770, "epoch": 2468} {"train_loss": -11.260107040405273, "global_step": 414771, "epoch": 2468} {"train_loss": -11.938240051269531, "global_step": 414772, "epoch": 2468} {"train_loss": -11.897860527038574, "global_step": 414773, "epoch": 2468} {"train_loss": -12.0565185546875, "global_step": 414774, "epoch": 2468} {"train_loss": -11.882375717163086, "global_step": 414775, "epoch": 2468} {"train_loss": -11.794927597045898, "global_step": 414776, "epoch": 2468} {"train_loss": -11.755544662475586, "global_step": 414777, "epoch": 2468} {"train_loss": -11.953184127807617, "global_step": 414778, "epoch": 2468} {"train_loss": -11.573641777038574, "global_step": 414779, "epoch": 2468} {"train_loss": -12.38260555267334, "global_step": 414780, "epoch": 2468} {"train_loss": -12.209589004516602, "global_step": 414781, "epoch": 2468} {"train_loss": -12.045815467834473, "global_step": 414782, "epoch": 2468} {"train_loss": -12.152204513549805, "global_step": 414783, "epoch": 2468} {"train_loss": -11.79957389831543, "global_step": 414784, "epoch": 2468} {"train_loss": -12.171825408935547, "global_step": 414785, "epoch": 2468} {"train_loss": -12.162942886352539, "global_step": 414786, "epoch": 2468} {"train_loss": -12.057528495788574, "global_step": 414787, "epoch": 2468} {"train_loss": -12.353239059448242, "global_step": 414788, "epoch": 2468} {"train_loss": -12.326680183410645, "global_step": 414789, "epoch": 2468} {"train_loss": -12.261966705322266, "global_step": 414790, "epoch": 2468} {"train_loss": -11.53948267868587, "global_step": 414791, "epoch": 2468, "val_loss": 305750.78125} {"train_loss": -12.341290473937988, "global_step": 414792, "epoch": 2469} {"train_loss": -12.273002624511719, "global_step": 414793, "epoch": 2469} {"train_loss": -12.118093490600586, "global_step": 414794, "epoch": 2469} {"train_loss": -12.237235069274902, "global_step": 414795, "epoch": 2469} {"train_loss": -12.429339408874512, "global_step": 414796, "epoch": 2469} {"train_loss": -12.231515884399414, "global_step": 414797, "epoch": 2469} {"train_loss": -12.502452850341797, "global_step": 414798, "epoch": 2469} {"train_loss": -12.360809326171875, "global_step": 414799, "epoch": 2469} {"train_loss": -12.338094711303711, "global_step": 414800, "epoch": 2469} {"train_loss": -12.191889762878418, "global_step": 414801, "epoch": 2469} {"train_loss": -12.181215286254883, "global_step": 414802, "epoch": 2469} {"train_loss": -12.446836471557617, "global_step": 414803, "epoch": 2469} {"train_loss": -12.509236335754395, "global_step": 414804, "epoch": 2469} {"train_loss": -12.535761833190918, "global_step": 414805, "epoch": 2469} {"train_loss": -12.507023811340332, "global_step": 414806, "epoch": 2469} {"train_loss": -12.302749633789062, "global_step": 414807, "epoch": 2469} {"train_loss": -12.28470230102539, "global_step": 414808, "epoch": 2469} {"train_loss": -12.458404541015625, "global_step": 414809, "epoch": 2469} {"train_loss": -12.275918960571289, "global_step": 414810, "epoch": 2469} {"train_loss": -12.381258010864258, "global_step": 414811, "epoch": 2469} {"train_loss": -12.444404602050781, "global_step": 414812, "epoch": 2469} {"train_loss": -12.382791519165039, "global_step": 414813, "epoch": 2469} {"train_loss": -12.376031875610352, "global_step": 414814, "epoch": 2469} {"train_loss": -12.368537902832031, "global_step": 414815, "epoch": 2469} {"train_loss": -12.577049255371094, "global_step": 414816, "epoch": 2469} {"train_loss": -12.625986099243164, "global_step": 414817, "epoch": 2469} {"train_loss": -12.551597595214844, "global_step": 414818, "epoch": 2469} {"train_loss": -12.48514175415039, "global_step": 414819, "epoch": 2469} {"train_loss": -12.581740379333496, "global_step": 414820, "epoch": 2469} {"train_loss": -12.6201171875, "global_step": 414821, "epoch": 2469} {"train_loss": -12.54550552368164, "global_step": 414822, "epoch": 2469} {"train_loss": -12.219608306884766, "global_step": 414823, "epoch": 2469} {"train_loss": -12.06955337524414, "global_step": 414824, "epoch": 2469} {"train_loss": -12.279016494750977, "global_step": 414825, "epoch": 2469} {"train_loss": -12.495744705200195, "global_step": 414826, "epoch": 2469} {"train_loss": -12.320034980773926, "global_step": 414827, "epoch": 2469} {"train_loss": -12.171260833740234, "global_step": 414828, "epoch": 2469} {"train_loss": -12.422399520874023, "global_step": 414829, "epoch": 2469} {"train_loss": -12.069673538208008, "global_step": 414830, "epoch": 2469} {"train_loss": -12.220492362976074, "global_step": 414831, "epoch": 2469} {"train_loss": -12.227683067321777, "global_step": 414832, "epoch": 2469} {"train_loss": -11.523151397705078, "global_step": 414833, "epoch": 2469} {"train_loss": -12.580157279968262, "global_step": 414834, "epoch": 2469} {"train_loss": -12.234501838684082, "global_step": 414835, "epoch": 2469} {"train_loss": -12.183465003967285, "global_step": 414836, "epoch": 2469} {"train_loss": -11.036945343017578, "global_step": 414837, "epoch": 2469} {"train_loss": -12.550251007080078, "global_step": 414838, "epoch": 2469} {"train_loss": -11.40159797668457, "global_step": 414839, "epoch": 2469} {"train_loss": -11.997676849365234, "global_step": 414840, "epoch": 2469} {"train_loss": -11.799901008605957, "global_step": 414841, "epoch": 2469} {"train_loss": -12.603193283081055, "global_step": 414842, "epoch": 2469} {"train_loss": -12.19870662689209, "global_step": 414843, "epoch": 2469} {"train_loss": -12.127246856689453, "global_step": 414844, "epoch": 2469} {"train_loss": -11.350323677062988, "global_step": 414845, "epoch": 2469} {"train_loss": -12.398789405822754, "global_step": 414846, "epoch": 2469} {"train_loss": -11.976672172546387, "global_step": 414847, "epoch": 2469} {"train_loss": -12.142894744873047, "global_step": 414848, "epoch": 2469} {"train_loss": -12.116085052490234, "global_step": 414849, "epoch": 2469} {"train_loss": -11.400533676147461, "global_step": 414850, "epoch": 2469} {"train_loss": -10.50505256652832, "global_step": 414851, "epoch": 2469} {"train_loss": -11.05843734741211, "global_step": 414852, "epoch": 2469} {"train_loss": -12.122182846069336, "global_step": 414853, "epoch": 2469} {"train_loss": -10.35997486114502, "global_step": 414854, "epoch": 2469} {"train_loss": -11.725729942321777, "global_step": 414855, "epoch": 2469} {"train_loss": -10.888333320617676, "global_step": 414856, "epoch": 2469} {"train_loss": -10.850229263305664, "global_step": 414857, "epoch": 2469} {"train_loss": -10.995335578918457, "global_step": 414858, "epoch": 2469} {"train_loss": -9.886591911315918, "global_step": 414859, "epoch": 2469} {"train_loss": -12.295360565185547, "global_step": 414860, "epoch": 2469} {"train_loss": -9.95393180847168, "global_step": 414861, "epoch": 2469} {"train_loss": -11.011760711669922, "global_step": 414862, "epoch": 2469} {"train_loss": -9.92026138305664, "global_step": 414863, "epoch": 2469} {"train_loss": -11.346052169799805, "global_step": 414864, "epoch": 2469} {"train_loss": -9.959882736206055, "global_step": 414865, "epoch": 2469} {"train_loss": -10.39930248260498, "global_step": 414866, "epoch": 2469} {"train_loss": -9.914510726928711, "global_step": 414867, "epoch": 2469} {"train_loss": -10.947986602783203, "global_step": 414868, "epoch": 2469} {"train_loss": -11.3604736328125, "global_step": 414869, "epoch": 2469} {"train_loss": -10.300926208496094, "global_step": 414870, "epoch": 2469} {"train_loss": -11.633353233337402, "global_step": 414871, "epoch": 2469} {"train_loss": -11.181547164916992, "global_step": 414872, "epoch": 2469} {"train_loss": -10.54551887512207, "global_step": 414873, "epoch": 2469} {"train_loss": -10.40414047241211, "global_step": 414874, "epoch": 2469} {"train_loss": -11.973260879516602, "global_step": 414875, "epoch": 2469} {"train_loss": -11.250333786010742, "global_step": 414876, "epoch": 2469} {"train_loss": -11.672896385192871, "global_step": 414877, "epoch": 2469} {"train_loss": -11.415380477905273, "global_step": 414878, "epoch": 2469} {"train_loss": -11.609732627868652, "global_step": 414879, "epoch": 2469} {"train_loss": -11.81976318359375, "global_step": 414880, "epoch": 2469} {"train_loss": -11.74582290649414, "global_step": 414881, "epoch": 2469} {"train_loss": -11.648536682128906, "global_step": 414882, "epoch": 2469} {"train_loss": -11.50421142578125, "global_step": 414883, "epoch": 2469} {"train_loss": -11.27976131439209, "global_step": 414884, "epoch": 2469} {"train_loss": -11.614826202392578, "global_step": 414885, "epoch": 2469} {"train_loss": -11.915029525756836, "global_step": 414886, "epoch": 2469} {"train_loss": -11.794770240783691, "global_step": 414887, "epoch": 2469} {"train_loss": -11.980268478393555, "global_step": 414888, "epoch": 2469} {"train_loss": -11.96954345703125, "global_step": 414889, "epoch": 2469} {"train_loss": -11.804527282714844, "global_step": 414890, "epoch": 2469} {"train_loss": -11.87458610534668, "global_step": 414891, "epoch": 2469} {"train_loss": -12.024859428405762, "global_step": 414892, "epoch": 2469} {"train_loss": -11.868196487426758, "global_step": 414893, "epoch": 2469} {"train_loss": -11.623724937438965, "global_step": 414894, "epoch": 2469} {"train_loss": -12.164258003234863, "global_step": 414895, "epoch": 2469} {"train_loss": -11.95588207244873, "global_step": 414896, "epoch": 2469} {"train_loss": -11.965627670288086, "global_step": 414897, "epoch": 2469} {"train_loss": -12.260370254516602, "global_step": 414898, "epoch": 2469} {"train_loss": -12.272428512573242, "global_step": 414899, "epoch": 2469} {"train_loss": -12.423914909362793, "global_step": 414900, "epoch": 2469} {"train_loss": -12.407672882080078, "global_step": 414901, "epoch": 2469} {"train_loss": -12.233139038085938, "global_step": 414902, "epoch": 2469} {"train_loss": -12.354694366455078, "global_step": 414903, "epoch": 2469} {"train_loss": -12.260612487792969, "global_step": 414904, "epoch": 2469} {"train_loss": -12.28798770904541, "global_step": 414905, "epoch": 2469} {"train_loss": -12.098058700561523, "global_step": 414906, "epoch": 2469} {"train_loss": -12.273624420166016, "global_step": 414907, "epoch": 2469} {"train_loss": -12.483312606811523, "global_step": 414908, "epoch": 2469} {"train_loss": -12.37080192565918, "global_step": 414909, "epoch": 2469} {"train_loss": -12.354652404785156, "global_step": 414910, "epoch": 2469} {"train_loss": -12.537782669067383, "global_step": 414911, "epoch": 2469} {"train_loss": -12.2877197265625, "global_step": 414912, "epoch": 2469} {"train_loss": -12.335946083068848, "global_step": 414913, "epoch": 2469} {"train_loss": -12.318361282348633, "global_step": 414914, "epoch": 2469} {"train_loss": -12.575910568237305, "global_step": 414915, "epoch": 2469} {"train_loss": -12.396361351013184, "global_step": 414916, "epoch": 2469} {"train_loss": -12.259563446044922, "global_step": 414917, "epoch": 2469} {"train_loss": -12.555158615112305, "global_step": 414918, "epoch": 2469} {"train_loss": -12.55888557434082, "global_step": 414919, "epoch": 2469} {"train_loss": -12.658714294433594, "global_step": 414920, "epoch": 2469} {"train_loss": -12.59907054901123, "global_step": 414921, "epoch": 2469} {"train_loss": -12.525421142578125, "global_step": 414922, "epoch": 2469} {"train_loss": -12.544991493225098, "global_step": 414923, "epoch": 2469} {"train_loss": -12.450668334960938, "global_step": 414924, "epoch": 2469} {"train_loss": -12.490438461303711, "global_step": 414925, "epoch": 2469} {"train_loss": -12.693841934204102, "global_step": 414926, "epoch": 2469} {"train_loss": -12.60279655456543, "global_step": 414927, "epoch": 2469} {"train_loss": -12.641485214233398, "global_step": 414928, "epoch": 2469} {"train_loss": -12.738356590270996, "global_step": 414929, "epoch": 2469} {"train_loss": -12.501134872436523, "global_step": 414930, "epoch": 2469} {"train_loss": -12.73660945892334, "global_step": 414931, "epoch": 2469} {"train_loss": -12.433917045593262, "global_step": 414932, "epoch": 2469} {"train_loss": -12.523396492004395, "global_step": 414933, "epoch": 2469} {"train_loss": -12.550260543823242, "global_step": 414934, "epoch": 2469} {"train_loss": -12.388343811035156, "global_step": 414935, "epoch": 2469} {"train_loss": -12.733685493469238, "global_step": 414936, "epoch": 2469} {"train_loss": -12.601733207702637, "global_step": 414937, "epoch": 2469} {"train_loss": -12.483689308166504, "global_step": 414938, "epoch": 2469} {"train_loss": -12.81686019897461, "global_step": 414939, "epoch": 2469} {"train_loss": -12.54746150970459, "global_step": 414940, "epoch": 2469} {"train_loss": -12.640157699584961, "global_step": 414941, "epoch": 2469} {"train_loss": -12.804954528808594, "global_step": 414942, "epoch": 2469} {"train_loss": -12.486396789550781, "global_step": 414943, "epoch": 2469} {"train_loss": -12.780550956726074, "global_step": 414944, "epoch": 2469} {"train_loss": -12.756338119506836, "global_step": 414945, "epoch": 2469} {"train_loss": -12.669099807739258, "global_step": 414946, "epoch": 2469} {"train_loss": -12.419504165649414, "global_step": 414947, "epoch": 2469} {"train_loss": -12.927413940429688, "global_step": 414948, "epoch": 2469} {"train_loss": -12.584949493408203, "global_step": 414949, "epoch": 2469} {"train_loss": -12.50362491607666, "global_step": 414950, "epoch": 2469} {"train_loss": -12.488606452941895, "global_step": 414951, "epoch": 2469} {"train_loss": -12.539910316467285, "global_step": 414952, "epoch": 2469} {"train_loss": -12.019808769226074, "global_step": 414953, "epoch": 2469} {"train_loss": -11.983120918273926, "global_step": 414954, "epoch": 2469} {"train_loss": -12.52501106262207, "global_step": 414955, "epoch": 2469} {"train_loss": -11.946383476257324, "global_step": 414956, "epoch": 2469} {"train_loss": -10.953383445739746, "global_step": 414957, "epoch": 2469} {"train_loss": -11.400815963745117, "global_step": 414958, "epoch": 2469} {"train_loss": -12.029890758650643, "global_step": 414959, "epoch": 2469, "val_loss": 305322.1875} {"train_loss": -12.067770004272461, "global_step": 414960, "epoch": 2470} {"train_loss": -10.247316360473633, "global_step": 414961, "epoch": 2470} {"train_loss": -11.153738021850586, "global_step": 414962, "epoch": 2470} {"train_loss": -10.215205192565918, "global_step": 414963, "epoch": 2470} {"train_loss": -11.170140266418457, "global_step": 414964, "epoch": 2470} {"train_loss": -10.274496078491211, "global_step": 414965, "epoch": 2470} {"train_loss": -10.91047191619873, "global_step": 414966, "epoch": 2470} {"train_loss": -10.175048828125, "global_step": 414967, "epoch": 2470} {"train_loss": -9.951749801635742, "global_step": 414968, "epoch": 2470} {"train_loss": -10.387744903564453, "global_step": 414969, "epoch": 2470} {"train_loss": -11.612184524536133, "global_step": 414970, "epoch": 2470} {"train_loss": -9.77444839477539, "global_step": 414971, "epoch": 2470} {"train_loss": -11.060699462890625, "global_step": 414972, "epoch": 2470} {"train_loss": -10.1607666015625, "global_step": 414973, "epoch": 2470} {"train_loss": -10.828088760375977, "global_step": 414974, "epoch": 2470} {"train_loss": -10.0397310256958, "global_step": 414975, "epoch": 2470} {"train_loss": -11.588191986083984, "global_step": 414976, "epoch": 2470} {"train_loss": -9.795374870300293, "global_step": 414977, "epoch": 2470} {"train_loss": -11.509515762329102, "global_step": 414978, "epoch": 2470} {"train_loss": -9.943694114685059, "global_step": 414979, "epoch": 2470} {"train_loss": -11.654566764831543, "global_step": 414980, "epoch": 2470} {"train_loss": -10.955873489379883, "global_step": 414981, "epoch": 2470} {"train_loss": -11.438177108764648, "global_step": 414982, "epoch": 2470} {"train_loss": -10.93610668182373, "global_step": 414983, "epoch": 2470} {"train_loss": -10.953682899475098, "global_step": 414984, "epoch": 2470} {"train_loss": -11.009464263916016, "global_step": 414985, "epoch": 2470} {"train_loss": -11.630064964294434, "global_step": 414986, "epoch": 2470} {"train_loss": -10.98211669921875, "global_step": 414987, "epoch": 2470} {"train_loss": -12.01480484008789, "global_step": 414988, "epoch": 2470} {"train_loss": -11.640386581420898, "global_step": 414989, "epoch": 2470} {"train_loss": -11.764484405517578, "global_step": 414990, "epoch": 2470} {"train_loss": -11.450581550598145, "global_step": 414991, "epoch": 2470} {"train_loss": -11.97694206237793, "global_step": 414992, "epoch": 2470} {"train_loss": -11.775561332702637, "global_step": 414993, "epoch": 2470} {"train_loss": -11.525677680969238, "global_step": 414994, "epoch": 2470} {"train_loss": -11.981118202209473, "global_step": 414995, "epoch": 2470} {"train_loss": -11.507180213928223, "global_step": 414996, "epoch": 2470} {"train_loss": -11.992302894592285, "global_step": 414997, "epoch": 2470} {"train_loss": -11.944499969482422, "global_step": 414998, "epoch": 2470} {"train_loss": -11.688642501831055, "global_step": 414999, "epoch": 2470} {"train_loss": -11.96945571899414, "global_step": 415000, "epoch": 2470} {"train_loss": -12.148719787597656, "global_step": 415001, "epoch": 2470} {"train_loss": -11.502420425415039, "global_step": 415002, "epoch": 2470} {"train_loss": -11.97507381439209, "global_step": 415003, "epoch": 2470} {"train_loss": -11.703872680664062, "global_step": 415004, "epoch": 2470} {"train_loss": -12.095132827758789, "global_step": 415005, "epoch": 2470} {"train_loss": -12.077369689941406, "global_step": 415006, "epoch": 2470} {"train_loss": -12.063638687133789, "global_step": 415007, "epoch": 2470} {"train_loss": -12.02043628692627, "global_step": 415008, "epoch": 2470} {"train_loss": -12.239500045776367, "global_step": 415009, "epoch": 2470} {"train_loss": -12.3806734085083, "global_step": 415010, "epoch": 2470} {"train_loss": -12.012812614440918, "global_step": 415011, "epoch": 2470} {"train_loss": -12.524020195007324, "global_step": 415012, "epoch": 2470} {"train_loss": -12.001729965209961, "global_step": 415013, "epoch": 2470} {"train_loss": -12.346902847290039, "global_step": 415014, "epoch": 2470} {"train_loss": -12.254579544067383, "global_step": 415015, "epoch": 2470} {"train_loss": -12.335779190063477, "global_step": 415016, "epoch": 2470} {"train_loss": -12.53147029876709, "global_step": 415017, "epoch": 2470} {"train_loss": -12.230703353881836, "global_step": 415018, "epoch": 2470} {"train_loss": -12.401432991027832, "global_step": 415019, "epoch": 2470} {"train_loss": -12.240239143371582, "global_step": 415020, "epoch": 2470} {"train_loss": -12.449312210083008, "global_step": 415021, "epoch": 2470} {"train_loss": -12.287043571472168, "global_step": 415022, "epoch": 2470} {"train_loss": -12.321988105773926, "global_step": 415023, "epoch": 2470} {"train_loss": -12.464263916015625, "global_step": 415024, "epoch": 2470} {"train_loss": -12.598845481872559, "global_step": 415025, "epoch": 2470} {"train_loss": -12.181936264038086, "global_step": 415026, "epoch": 2470} {"train_loss": -12.517465591430664, "global_step": 415027, "epoch": 2470} {"train_loss": -12.439284324645996, "global_step": 415028, "epoch": 2470} {"train_loss": -12.44468879699707, "global_step": 415029, "epoch": 2470} {"train_loss": -12.526167869567871, "global_step": 415030, "epoch": 2470} {"train_loss": -12.417606353759766, "global_step": 415031, "epoch": 2470} {"train_loss": -12.473359107971191, "global_step": 415032, "epoch": 2470} {"train_loss": -12.58598518371582, "global_step": 415033, "epoch": 2470} {"train_loss": -12.408341407775879, "global_step": 415034, "epoch": 2470} {"train_loss": -12.380123138427734, "global_step": 415035, "epoch": 2470} {"train_loss": -12.697693824768066, "global_step": 415036, "epoch": 2470} {"train_loss": -12.572515487670898, "global_step": 415037, "epoch": 2470} {"train_loss": -12.3013916015625, "global_step": 415038, "epoch": 2470} {"train_loss": -12.338424682617188, "global_step": 415039, "epoch": 2470} {"train_loss": -12.43919563293457, "global_step": 415040, "epoch": 2470} {"train_loss": -12.615797996520996, "global_step": 415041, "epoch": 2470} {"train_loss": -12.519481658935547, "global_step": 415042, "epoch": 2470} {"train_loss": -12.482220649719238, "global_step": 415043, "epoch": 2470} {"train_loss": -12.52717399597168, "global_step": 415044, "epoch": 2470} {"train_loss": -12.577996253967285, "global_step": 415045, "epoch": 2470} {"train_loss": -12.602170944213867, "global_step": 415046, "epoch": 2470} {"train_loss": -12.497937202453613, "global_step": 415047, "epoch": 2470} {"train_loss": -12.518043518066406, "global_step": 415048, "epoch": 2470} {"train_loss": -12.2763671875, "global_step": 415049, "epoch": 2470} {"train_loss": -12.43008041381836, "global_step": 415050, "epoch": 2470} {"train_loss": -12.483268737792969, "global_step": 415051, "epoch": 2470} {"train_loss": -12.39051628112793, "global_step": 415052, "epoch": 2470} {"train_loss": -12.994245529174805, "global_step": 415053, "epoch": 2470} {"train_loss": -12.513912200927734, "global_step": 415054, "epoch": 2470} {"train_loss": -12.813820838928223, "global_step": 415055, "epoch": 2470} {"train_loss": -12.724260330200195, "global_step": 415056, "epoch": 2470} {"train_loss": -12.641698837280273, "global_step": 415057, "epoch": 2470} {"train_loss": -12.681209564208984, "global_step": 415058, "epoch": 2470} {"train_loss": -12.754165649414062, "global_step": 415059, "epoch": 2470} {"train_loss": -12.626282691955566, "global_step": 415060, "epoch": 2470} {"train_loss": -12.423255920410156, "global_step": 415061, "epoch": 2470} {"train_loss": -12.621542930603027, "global_step": 415062, "epoch": 2470} {"train_loss": -12.680767059326172, "global_step": 415063, "epoch": 2470} {"train_loss": -12.583574295043945, "global_step": 415064, "epoch": 2470} {"train_loss": -12.554551124572754, "global_step": 415065, "epoch": 2470} {"train_loss": -12.645922660827637, "global_step": 415066, "epoch": 2470} {"train_loss": -12.474458694458008, "global_step": 415067, "epoch": 2470} {"train_loss": -12.560952186584473, "global_step": 415068, "epoch": 2470} {"train_loss": -11.925806045532227, "global_step": 415069, "epoch": 2470} {"train_loss": -11.434112548828125, "global_step": 415070, "epoch": 2470} {"train_loss": -11.88198471069336, "global_step": 415071, "epoch": 2470} {"train_loss": -11.836644172668457, "global_step": 415072, "epoch": 2470} {"train_loss": -10.50340461730957, "global_step": 415073, "epoch": 2470} {"train_loss": -12.494485855102539, "global_step": 415074, "epoch": 2470} {"train_loss": -10.969940185546875, "global_step": 415075, "epoch": 2470} {"train_loss": -10.845853805541992, "global_step": 415076, "epoch": 2470} {"train_loss": -12.086071968078613, "global_step": 415077, "epoch": 2470} {"train_loss": -11.722809791564941, "global_step": 415078, "epoch": 2470} {"train_loss": -12.311762809753418, "global_step": 415079, "epoch": 2470} {"train_loss": -11.75041389465332, "global_step": 415080, "epoch": 2470} {"train_loss": -11.771583557128906, "global_step": 415081, "epoch": 2470} {"train_loss": -12.418994903564453, "global_step": 415082, "epoch": 2470} {"train_loss": -11.212442398071289, "global_step": 415083, "epoch": 2470} {"train_loss": -12.448259353637695, "global_step": 415084, "epoch": 2470} {"train_loss": -12.117090225219727, "global_step": 415085, "epoch": 2470} {"train_loss": -11.829269409179688, "global_step": 415086, "epoch": 2470} {"train_loss": -12.442334175109863, "global_step": 415087, "epoch": 2470} {"train_loss": -12.180866241455078, "global_step": 415088, "epoch": 2470} {"train_loss": -11.900218963623047, "global_step": 415089, "epoch": 2470} {"train_loss": -11.997211456298828, "global_step": 415090, "epoch": 2470} {"train_loss": -12.196797370910645, "global_step": 415091, "epoch": 2470} {"train_loss": -11.515121459960938, "global_step": 415092, "epoch": 2470} {"train_loss": -12.499391555786133, "global_step": 415093, "epoch": 2470} {"train_loss": -11.747686386108398, "global_step": 415094, "epoch": 2470} {"train_loss": -12.108704566955566, "global_step": 415095, "epoch": 2470} {"train_loss": -11.919696807861328, "global_step": 415096, "epoch": 2470} {"train_loss": -12.422752380371094, "global_step": 415097, "epoch": 2470} {"train_loss": -12.163060188293457, "global_step": 415098, "epoch": 2470} {"train_loss": -12.078279495239258, "global_step": 415099, "epoch": 2470} {"train_loss": -12.441177368164062, "global_step": 415100, "epoch": 2470} {"train_loss": -11.54496955871582, "global_step": 415101, "epoch": 2470} {"train_loss": -12.112300872802734, "global_step": 415102, "epoch": 2470} {"train_loss": -11.888504981994629, "global_step": 415103, "epoch": 2470} {"train_loss": -10.67919921875, "global_step": 415104, "epoch": 2470} {"train_loss": -12.008191108703613, "global_step": 415105, "epoch": 2470} {"train_loss": -10.14594554901123, "global_step": 415106, "epoch": 2470} {"train_loss": -10.061841011047363, "global_step": 415107, "epoch": 2470} {"train_loss": -10.58985424041748, "global_step": 415108, "epoch": 2470} {"train_loss": -11.837713241577148, "global_step": 415109, "epoch": 2470} {"train_loss": -9.494935989379883, "global_step": 415110, "epoch": 2470} {"train_loss": -10.554944038391113, "global_step": 415111, "epoch": 2470} {"train_loss": -9.85402774810791, "global_step": 415112, "epoch": 2470} {"train_loss": -8.277667999267578, "global_step": 415113, "epoch": 2470} {"train_loss": -8.398818969726562, "global_step": 415114, "epoch": 2470} {"train_loss": -8.648946762084961, "global_step": 415115, "epoch": 2470} {"train_loss": -8.366399765014648, "global_step": 415116, "epoch": 2470} {"train_loss": -9.091249465942383, "global_step": 415117, "epoch": 2470} {"train_loss": -9.338600158691406, "global_step": 415118, "epoch": 2470} {"train_loss": -8.83269214630127, "global_step": 415119, "epoch": 2470} {"train_loss": -8.960031509399414, "global_step": 415120, "epoch": 2470} {"train_loss": -9.276378631591797, "global_step": 415121, "epoch": 2470} {"train_loss": -8.71969223022461, "global_step": 415122, "epoch": 2470} {"train_loss": -9.484289169311523, "global_step": 415123, "epoch": 2470} {"train_loss": -9.178817749023438, "global_step": 415124, "epoch": 2470} {"train_loss": -9.864775657653809, "global_step": 415125, "epoch": 2470} {"train_loss": -10.310995101928711, "global_step": 415126, "epoch": 2470} {"train_loss": -11.601276738303048, "global_step": 415127, "epoch": 2470, "val_loss": 305340.1875, "train_action_mse_error": 1.6409350633621216} {"train_loss": -10.366158485412598, "global_step": 415128, "epoch": 2471} {"train_loss": -10.74351978302002, "global_step": 415129, "epoch": 2471} {"train_loss": -11.123241424560547, "global_step": 415130, "epoch": 2471} {"train_loss": -11.547117233276367, "global_step": 415131, "epoch": 2471} {"train_loss": -11.345651626586914, "global_step": 415132, "epoch": 2471} {"train_loss": -11.391374588012695, "global_step": 415133, "epoch": 2471} {"train_loss": -11.191661834716797, "global_step": 415134, "epoch": 2471} {"train_loss": -11.103506088256836, "global_step": 415135, "epoch": 2471} {"train_loss": -11.019716262817383, "global_step": 415136, "epoch": 2471} {"train_loss": -11.26261043548584, "global_step": 415137, "epoch": 2471} {"train_loss": -11.545801162719727, "global_step": 415138, "epoch": 2471} {"train_loss": -11.465315818786621, "global_step": 415139, "epoch": 2471} {"train_loss": -11.7156343460083, "global_step": 415140, "epoch": 2471} {"train_loss": -11.551745414733887, "global_step": 415141, "epoch": 2471} {"train_loss": -11.076559066772461, "global_step": 415142, "epoch": 2471} {"train_loss": -11.298271179199219, "global_step": 415143, "epoch": 2471} {"train_loss": -11.311816215515137, "global_step": 415144, "epoch": 2471} {"train_loss": -11.751770973205566, "global_step": 415145, "epoch": 2471} {"train_loss": -11.784725189208984, "global_step": 415146, "epoch": 2471} {"train_loss": -11.46432876586914, "global_step": 415147, "epoch": 2471} {"train_loss": -11.914121627807617, "global_step": 415148, "epoch": 2471} {"train_loss": -11.822648048400879, "global_step": 415149, "epoch": 2471} {"train_loss": -11.664953231811523, "global_step": 415150, "epoch": 2471} {"train_loss": -11.778249740600586, "global_step": 415151, "epoch": 2471} {"train_loss": -11.928511619567871, "global_step": 415152, "epoch": 2471} {"train_loss": -11.901369094848633, "global_step": 415153, "epoch": 2471} {"train_loss": -11.852750778198242, "global_step": 415154, "epoch": 2471} {"train_loss": -11.988901138305664, "global_step": 415155, "epoch": 2471} {"train_loss": -11.718799591064453, "global_step": 415156, "epoch": 2471} {"train_loss": -11.943619728088379, "global_step": 415157, "epoch": 2471} {"train_loss": -11.778367042541504, "global_step": 415158, "epoch": 2471} {"train_loss": -12.112281799316406, "global_step": 415159, "epoch": 2471} {"train_loss": -11.896711349487305, "global_step": 415160, "epoch": 2471} {"train_loss": -11.650440216064453, "global_step": 415161, "epoch": 2471} {"train_loss": -11.851280212402344, "global_step": 415162, "epoch": 2471} {"train_loss": -11.419929504394531, "global_step": 415163, "epoch": 2471} {"train_loss": -11.949613571166992, "global_step": 415164, "epoch": 2471} {"train_loss": -11.527850151062012, "global_step": 415165, "epoch": 2471} {"train_loss": -11.948771476745605, "global_step": 415166, "epoch": 2471} {"train_loss": -11.587711334228516, "global_step": 415167, "epoch": 2471} {"train_loss": -11.535146713256836, "global_step": 415168, "epoch": 2471} {"train_loss": -11.829856872558594, "global_step": 415169, "epoch": 2471} {"train_loss": -11.417600631713867, "global_step": 415170, "epoch": 2471} {"train_loss": -12.09228801727295, "global_step": 415171, "epoch": 2471} {"train_loss": -11.509490013122559, "global_step": 415172, "epoch": 2471} {"train_loss": -11.972829818725586, "global_step": 415173, "epoch": 2471} {"train_loss": -11.051353454589844, "global_step": 415174, "epoch": 2471} {"train_loss": -12.146265029907227, "global_step": 415175, "epoch": 2471} {"train_loss": -11.511802673339844, "global_step": 415176, "epoch": 2471} {"train_loss": -12.016973495483398, "global_step": 415177, "epoch": 2471} {"train_loss": -11.424331665039062, "global_step": 415178, "epoch": 2471} {"train_loss": -11.49882984161377, "global_step": 415179, "epoch": 2471} {"train_loss": -11.838773727416992, "global_step": 415180, "epoch": 2471} {"train_loss": -11.31167221069336, "global_step": 415181, "epoch": 2471} {"train_loss": -11.89816951751709, "global_step": 415182, "epoch": 2471} {"train_loss": -11.777131080627441, "global_step": 415183, "epoch": 2471} {"train_loss": -11.725830078125, "global_step": 415184, "epoch": 2471} {"train_loss": -12.096620559692383, "global_step": 415185, "epoch": 2471} {"train_loss": -11.877216339111328, "global_step": 415186, "epoch": 2471} {"train_loss": -11.95781135559082, "global_step": 415187, "epoch": 2471} {"train_loss": -11.996152877807617, "global_step": 415188, "epoch": 2471} {"train_loss": -11.732989311218262, "global_step": 415189, "epoch": 2471} {"train_loss": -11.911959648132324, "global_step": 415190, "epoch": 2471} {"train_loss": -12.132061958312988, "global_step": 415191, "epoch": 2471} {"train_loss": -11.981918334960938, "global_step": 415192, "epoch": 2471} {"train_loss": -11.936713218688965, "global_step": 415193, "epoch": 2471} {"train_loss": -12.139366149902344, "global_step": 415194, "epoch": 2471} {"train_loss": -12.181572914123535, "global_step": 415195, "epoch": 2471} {"train_loss": -11.82908821105957, "global_step": 415196, "epoch": 2471} {"train_loss": -12.409055709838867, "global_step": 415197, "epoch": 2471} {"train_loss": -11.610410690307617, "global_step": 415198, "epoch": 2471} {"train_loss": -12.350812911987305, "global_step": 415199, "epoch": 2471} {"train_loss": -11.910234451293945, "global_step": 415200, "epoch": 2471} {"train_loss": -12.519124984741211, "global_step": 415201, "epoch": 2471} {"train_loss": -12.112028121948242, "global_step": 415202, "epoch": 2471} {"train_loss": -12.179038047790527, "global_step": 415203, "epoch": 2471} {"train_loss": -12.131165504455566, "global_step": 415204, "epoch": 2471} {"train_loss": -12.415441513061523, "global_step": 415205, "epoch": 2471} {"train_loss": -12.311676025390625, "global_step": 415206, "epoch": 2471} {"train_loss": -12.535932540893555, "global_step": 415207, "epoch": 2471} {"train_loss": -12.407614707946777, "global_step": 415208, "epoch": 2471} {"train_loss": -12.420299530029297, "global_step": 415209, "epoch": 2471} {"train_loss": -12.37332534790039, "global_step": 415210, "epoch": 2471} {"train_loss": -12.434211730957031, "global_step": 415211, "epoch": 2471} {"train_loss": -12.426703453063965, "global_step": 415212, "epoch": 2471} {"train_loss": -12.589689254760742, "global_step": 415213, "epoch": 2471} {"train_loss": -12.517333030700684, "global_step": 415214, "epoch": 2471} {"train_loss": -12.520286560058594, "global_step": 415215, "epoch": 2471} {"train_loss": -12.162962913513184, "global_step": 415216, "epoch": 2471} {"train_loss": -12.545269012451172, "global_step": 415217, "epoch": 2471} {"train_loss": -12.44935417175293, "global_step": 415218, "epoch": 2471} {"train_loss": -12.619257926940918, "global_step": 415219, "epoch": 2471} {"train_loss": -12.458866119384766, "global_step": 415220, "epoch": 2471} {"train_loss": -12.696004867553711, "global_step": 415221, "epoch": 2471} {"train_loss": -12.643980979919434, "global_step": 415222, "epoch": 2471} {"train_loss": -12.648553848266602, "global_step": 415223, "epoch": 2471} {"train_loss": -12.451665878295898, "global_step": 415224, "epoch": 2471} {"train_loss": -12.521300315856934, "global_step": 415225, "epoch": 2471} {"train_loss": -12.54111099243164, "global_step": 415226, "epoch": 2471} {"train_loss": -12.545380592346191, "global_step": 415227, "epoch": 2471} {"train_loss": -12.472780227661133, "global_step": 415228, "epoch": 2471} {"train_loss": -12.723289489746094, "global_step": 415229, "epoch": 2471} {"train_loss": -12.661188125610352, "global_step": 415230, "epoch": 2471} {"train_loss": -12.688074111938477, "global_step": 415231, "epoch": 2471} {"train_loss": -12.68784236907959, "global_step": 415232, "epoch": 2471} {"train_loss": -12.645890235900879, "global_step": 415233, "epoch": 2471} {"train_loss": -12.781961441040039, "global_step": 415234, "epoch": 2471} {"train_loss": -12.518564224243164, "global_step": 415235, "epoch": 2471} {"train_loss": -12.63808536529541, "global_step": 415236, "epoch": 2471} {"train_loss": -12.64291000366211, "global_step": 415237, "epoch": 2471} {"train_loss": -12.610937118530273, "global_step": 415238, "epoch": 2471} {"train_loss": -12.691428184509277, "global_step": 415239, "epoch": 2471} {"train_loss": -12.49958610534668, "global_step": 415240, "epoch": 2471} {"train_loss": -12.555331230163574, "global_step": 415241, "epoch": 2471} {"train_loss": -12.539467811584473, "global_step": 415242, "epoch": 2471} {"train_loss": -12.59972095489502, "global_step": 415243, "epoch": 2471} {"train_loss": -12.571203231811523, "global_step": 415244, "epoch": 2471} {"train_loss": -12.405216217041016, "global_step": 415245, "epoch": 2471} {"train_loss": -12.291529655456543, "global_step": 415246, "epoch": 2471} {"train_loss": -12.810558319091797, "global_step": 415247, "epoch": 2471} {"train_loss": -12.598862648010254, "global_step": 415248, "epoch": 2471} {"train_loss": -12.819478034973145, "global_step": 415249, "epoch": 2471} {"train_loss": -12.807145118713379, "global_step": 415250, "epoch": 2471} {"train_loss": -12.100484848022461, "global_step": 415251, "epoch": 2471} {"train_loss": -12.613329887390137, "global_step": 415252, "epoch": 2471} {"train_loss": -12.597281455993652, "global_step": 415253, "epoch": 2471} {"train_loss": -12.581108093261719, "global_step": 415254, "epoch": 2471} {"train_loss": -12.412370681762695, "global_step": 415255, "epoch": 2471} {"train_loss": -12.613594055175781, "global_step": 415256, "epoch": 2471} {"train_loss": -12.418241500854492, "global_step": 415257, "epoch": 2471} {"train_loss": -12.455378532409668, "global_step": 415258, "epoch": 2471} {"train_loss": -12.196697235107422, "global_step": 415259, "epoch": 2471} {"train_loss": -12.495794296264648, "global_step": 415260, "epoch": 2471} {"train_loss": -12.473644256591797, "global_step": 415261, "epoch": 2471} {"train_loss": -12.758331298828125, "global_step": 415262, "epoch": 2471} {"train_loss": -12.60238265991211, "global_step": 415263, "epoch": 2471} {"train_loss": -12.445723533630371, "global_step": 415264, "epoch": 2471} {"train_loss": -12.470518112182617, "global_step": 415265, "epoch": 2471} {"train_loss": -11.884784698486328, "global_step": 415266, "epoch": 2471} {"train_loss": -11.67806339263916, "global_step": 415267, "epoch": 2471} {"train_loss": -12.544593811035156, "global_step": 415268, "epoch": 2471} {"train_loss": -12.334959983825684, "global_step": 415269, "epoch": 2471} {"train_loss": -11.67848014831543, "global_step": 415270, "epoch": 2471} {"train_loss": -10.857229232788086, "global_step": 415271, "epoch": 2471} {"train_loss": -12.335644721984863, "global_step": 415272, "epoch": 2471} {"train_loss": -11.89527702331543, "global_step": 415273, "epoch": 2471} {"train_loss": -12.073894500732422, "global_step": 415274, "epoch": 2471} {"train_loss": -11.905380249023438, "global_step": 415275, "epoch": 2471} {"train_loss": -12.18070125579834, "global_step": 415276, "epoch": 2471} {"train_loss": -11.161102294921875, "global_step": 415277, "epoch": 2471} {"train_loss": -11.494945526123047, "global_step": 415278, "epoch": 2471} {"train_loss": -11.850849151611328, "global_step": 415279, "epoch": 2471} {"train_loss": -11.909515380859375, "global_step": 415280, "epoch": 2471} {"train_loss": -11.543631553649902, "global_step": 415281, "epoch": 2471} {"train_loss": -11.146515846252441, "global_step": 415282, "epoch": 2471} {"train_loss": -11.688072204589844, "global_step": 415283, "epoch": 2471} {"train_loss": -11.240533828735352, "global_step": 415284, "epoch": 2471} {"train_loss": -10.001976013183594, "global_step": 415285, "epoch": 2471} {"train_loss": -11.916814804077148, "global_step": 415286, "epoch": 2471} {"train_loss": -7.993679046630859, "global_step": 415287, "epoch": 2471} {"train_loss": -10.460905075073242, "global_step": 415288, "epoch": 2471} {"train_loss": -9.567850112915039, "global_step": 415289, "epoch": 2471} {"train_loss": -9.139244079589844, "global_step": 415290, "epoch": 2471} {"train_loss": -10.569242477416992, "global_step": 415291, "epoch": 2471} {"train_loss": -11.420806884765625, "global_step": 415292, "epoch": 2471} {"train_loss": -9.927556037902832, "global_step": 415293, "epoch": 2471} {"train_loss": -10.705127716064453, "global_step": 415294, "epoch": 2471} {"train_loss": -11.919012529509407, "global_step": 415295, "epoch": 2471, "val_loss": 301667.78125} {"train_loss": -10.859359741210938, "global_step": 415296, "epoch": 2472} {"train_loss": -10.99694538116455, "global_step": 415297, "epoch": 2472} {"train_loss": -10.800542831420898, "global_step": 415298, "epoch": 2472} {"train_loss": -10.813004493713379, "global_step": 415299, "epoch": 2472} {"train_loss": -11.434292793273926, "global_step": 415300, "epoch": 2472} {"train_loss": -10.705276489257812, "global_step": 415301, "epoch": 2472} {"train_loss": -11.008646965026855, "global_step": 415302, "epoch": 2472} {"train_loss": -11.185443878173828, "global_step": 415303, "epoch": 2472} {"train_loss": -11.553084373474121, "global_step": 415304, "epoch": 2472} {"train_loss": -11.387386322021484, "global_step": 415305, "epoch": 2472} {"train_loss": -12.03652572631836, "global_step": 415306, "epoch": 2472} {"train_loss": -12.020586013793945, "global_step": 415307, "epoch": 2472} {"train_loss": -11.905925750732422, "global_step": 415308, "epoch": 2472} {"train_loss": -11.306140899658203, "global_step": 415309, "epoch": 2472} {"train_loss": -12.040947914123535, "global_step": 415310, "epoch": 2472} {"train_loss": -11.765552520751953, "global_step": 415311, "epoch": 2472} {"train_loss": -12.059656143188477, "global_step": 415312, "epoch": 2472} {"train_loss": -12.030388832092285, "global_step": 415313, "epoch": 2472} {"train_loss": -11.392163276672363, "global_step": 415314, "epoch": 2472} {"train_loss": -12.230112075805664, "global_step": 415315, "epoch": 2472} {"train_loss": -11.642105102539062, "global_step": 415316, "epoch": 2472} {"train_loss": -11.730337142944336, "global_step": 415317, "epoch": 2472} {"train_loss": -12.054271697998047, "global_step": 415318, "epoch": 2472} {"train_loss": -11.769039154052734, "global_step": 415319, "epoch": 2472} {"train_loss": -12.213397026062012, "global_step": 415320, "epoch": 2472} {"train_loss": -12.043021202087402, "global_step": 415321, "epoch": 2472} {"train_loss": -12.126187324523926, "global_step": 415322, "epoch": 2472} {"train_loss": -12.045473098754883, "global_step": 415323, "epoch": 2472} {"train_loss": -11.83788013458252, "global_step": 415324, "epoch": 2472} {"train_loss": -11.90346908569336, "global_step": 415325, "epoch": 2472} {"train_loss": -11.900811195373535, "global_step": 415326, "epoch": 2472} {"train_loss": -11.792142868041992, "global_step": 415327, "epoch": 2472} {"train_loss": -11.690805435180664, "global_step": 415328, "epoch": 2472} {"train_loss": -11.814754486083984, "global_step": 415329, "epoch": 2472} {"train_loss": -12.444886207580566, "global_step": 415330, "epoch": 2472} {"train_loss": -12.156570434570312, "global_step": 415331, "epoch": 2472} {"train_loss": -12.147503852844238, "global_step": 415332, "epoch": 2472} {"train_loss": -11.999244689941406, "global_step": 415333, "epoch": 2472} {"train_loss": -12.545495986938477, "global_step": 415334, "epoch": 2472} {"train_loss": -12.081932067871094, "global_step": 415335, "epoch": 2472} {"train_loss": -12.383855819702148, "global_step": 415336, "epoch": 2472} {"train_loss": -12.190242767333984, "global_step": 415337, "epoch": 2472} {"train_loss": -12.152588844299316, "global_step": 415338, "epoch": 2472} {"train_loss": -12.237699508666992, "global_step": 415339, "epoch": 2472} {"train_loss": -11.972919464111328, "global_step": 415340, "epoch": 2472} {"train_loss": -11.436895370483398, "global_step": 415341, "epoch": 2472} {"train_loss": -11.490409851074219, "global_step": 415342, "epoch": 2472} {"train_loss": -11.421344757080078, "global_step": 415343, "epoch": 2472} {"train_loss": -11.876379013061523, "global_step": 415344, "epoch": 2472} {"train_loss": -11.786428451538086, "global_step": 415345, "epoch": 2472} {"train_loss": -11.163079261779785, "global_step": 415346, "epoch": 2472} {"train_loss": -12.179056167602539, "global_step": 415347, "epoch": 2472} {"train_loss": -11.764227867126465, "global_step": 415348, "epoch": 2472} {"train_loss": -11.554009437561035, "global_step": 415349, "epoch": 2472} {"train_loss": -12.16041374206543, "global_step": 415350, "epoch": 2472} {"train_loss": -10.925321578979492, "global_step": 415351, "epoch": 2472} {"train_loss": -12.004786491394043, "global_step": 415352, "epoch": 2472} {"train_loss": -11.798187255859375, "global_step": 415353, "epoch": 2472} {"train_loss": -11.990917205810547, "global_step": 415354, "epoch": 2472} {"train_loss": -12.450682640075684, "global_step": 415355, "epoch": 2472} {"train_loss": -12.002155303955078, "global_step": 415356, "epoch": 2472} {"train_loss": -12.47878646850586, "global_step": 415357, "epoch": 2472} {"train_loss": -12.104060173034668, "global_step": 415358, "epoch": 2472} {"train_loss": -12.49896240234375, "global_step": 415359, "epoch": 2472} {"train_loss": -12.173554420471191, "global_step": 415360, "epoch": 2472} {"train_loss": -12.12704086303711, "global_step": 415361, "epoch": 2472} {"train_loss": -12.198358535766602, "global_step": 415362, "epoch": 2472} {"train_loss": -12.351666450500488, "global_step": 415363, "epoch": 2472} {"train_loss": -12.48658561706543, "global_step": 415364, "epoch": 2472} {"train_loss": -12.076499938964844, "global_step": 415365, "epoch": 2472} {"train_loss": -12.485538482666016, "global_step": 415366, "epoch": 2472} {"train_loss": -12.20689868927002, "global_step": 415367, "epoch": 2472} {"train_loss": -12.448789596557617, "global_step": 415368, "epoch": 2472} {"train_loss": -12.00577163696289, "global_step": 415369, "epoch": 2472} {"train_loss": -12.145814895629883, "global_step": 415370, "epoch": 2472} {"train_loss": -12.113096237182617, "global_step": 415371, "epoch": 2472} {"train_loss": -11.594192504882812, "global_step": 415372, "epoch": 2472} {"train_loss": -12.361580848693848, "global_step": 415373, "epoch": 2472} {"train_loss": -11.933380126953125, "global_step": 415374, "epoch": 2472} {"train_loss": -12.41961669921875, "global_step": 415375, "epoch": 2472} {"train_loss": -12.256898880004883, "global_step": 415376, "epoch": 2472} {"train_loss": -11.94592571258545, "global_step": 415377, "epoch": 2472} {"train_loss": -12.277464866638184, "global_step": 415378, "epoch": 2472} {"train_loss": -11.620281219482422, "global_step": 415379, "epoch": 2472} {"train_loss": -12.556916236877441, "global_step": 415380, "epoch": 2472} {"train_loss": -11.915953636169434, "global_step": 415381, "epoch": 2472} {"train_loss": -12.103199005126953, "global_step": 415382, "epoch": 2472} {"train_loss": -11.960779190063477, "global_step": 415383, "epoch": 2472} {"train_loss": -12.101114273071289, "global_step": 415384, "epoch": 2472} {"train_loss": -12.295406341552734, "global_step": 415385, "epoch": 2472} {"train_loss": -11.405328750610352, "global_step": 415386, "epoch": 2472} {"train_loss": -10.978655815124512, "global_step": 415387, "epoch": 2472} {"train_loss": -10.152469635009766, "global_step": 415388, "epoch": 2472} {"train_loss": -11.218620300292969, "global_step": 415389, "epoch": 2472} {"train_loss": -10.809478759765625, "global_step": 415390, "epoch": 2472} {"train_loss": -11.936962127685547, "global_step": 415391, "epoch": 2472} {"train_loss": -10.943387985229492, "global_step": 415392, "epoch": 2472} {"train_loss": -12.306902885437012, "global_step": 415393, "epoch": 2472} {"train_loss": -11.490388870239258, "global_step": 415394, "epoch": 2472} {"train_loss": -12.308631896972656, "global_step": 415395, "epoch": 2472} {"train_loss": -11.867531776428223, "global_step": 415396, "epoch": 2472} {"train_loss": -11.741020202636719, "global_step": 415397, "epoch": 2472} {"train_loss": -12.29957389831543, "global_step": 415398, "epoch": 2472} {"train_loss": -11.738428115844727, "global_step": 415399, "epoch": 2472} {"train_loss": -12.48620319366455, "global_step": 415400, "epoch": 2472} {"train_loss": -12.013336181640625, "global_step": 415401, "epoch": 2472} {"train_loss": -12.013530731201172, "global_step": 415402, "epoch": 2472} {"train_loss": -12.28021240234375, "global_step": 415403, "epoch": 2472} {"train_loss": -12.51730728149414, "global_step": 415404, "epoch": 2472} {"train_loss": -12.484489440917969, "global_step": 415405, "epoch": 2472} {"train_loss": -12.23492431640625, "global_step": 415406, "epoch": 2472} {"train_loss": -12.47848892211914, "global_step": 415407, "epoch": 2472} {"train_loss": -12.520267486572266, "global_step": 415408, "epoch": 2472} {"train_loss": -12.491670608520508, "global_step": 415409, "epoch": 2472} {"train_loss": -12.41569709777832, "global_step": 415410, "epoch": 2472} {"train_loss": -12.360628128051758, "global_step": 415411, "epoch": 2472} {"train_loss": -12.617326736450195, "global_step": 415412, "epoch": 2472} {"train_loss": -12.354410171508789, "global_step": 415413, "epoch": 2472} {"train_loss": -12.389732360839844, "global_step": 415414, "epoch": 2472} {"train_loss": -12.670814514160156, "global_step": 415415, "epoch": 2472} {"train_loss": -12.237581253051758, "global_step": 415416, "epoch": 2472} {"train_loss": -12.600797653198242, "global_step": 415417, "epoch": 2472} {"train_loss": -12.723625183105469, "global_step": 415418, "epoch": 2472} {"train_loss": -12.502084732055664, "global_step": 415419, "epoch": 2472} {"train_loss": -12.525541305541992, "global_step": 415420, "epoch": 2472} {"train_loss": -12.361677169799805, "global_step": 415421, "epoch": 2472} {"train_loss": -12.47492790222168, "global_step": 415422, "epoch": 2472} {"train_loss": -12.538097381591797, "global_step": 415423, "epoch": 2472} {"train_loss": -12.556467056274414, "global_step": 415424, "epoch": 2472} {"train_loss": -12.340787887573242, "global_step": 415425, "epoch": 2472} {"train_loss": -12.546319961547852, "global_step": 415426, "epoch": 2472} {"train_loss": -12.609342575073242, "global_step": 415427, "epoch": 2472} {"train_loss": -12.4912748336792, "global_step": 415428, "epoch": 2472} {"train_loss": -12.525287628173828, "global_step": 415429, "epoch": 2472} {"train_loss": -12.762571334838867, "global_step": 415430, "epoch": 2472} {"train_loss": -12.669901847839355, "global_step": 415431, "epoch": 2472} {"train_loss": -12.496843338012695, "global_step": 415432, "epoch": 2472} {"train_loss": -12.615525245666504, "global_step": 415433, "epoch": 2472} {"train_loss": -12.628717422485352, "global_step": 415434, "epoch": 2472} {"train_loss": -12.500253677368164, "global_step": 415435, "epoch": 2472} {"train_loss": -12.325481414794922, "global_step": 415436, "epoch": 2472} {"train_loss": -12.57547378540039, "global_step": 415437, "epoch": 2472} {"train_loss": -12.466856002807617, "global_step": 415438, "epoch": 2472} {"train_loss": -12.626346588134766, "global_step": 415439, "epoch": 2472} {"train_loss": -12.620006561279297, "global_step": 415440, "epoch": 2472} {"train_loss": -12.444543838500977, "global_step": 415441, "epoch": 2472} {"train_loss": -12.491172790527344, "global_step": 415442, "epoch": 2472} {"train_loss": -12.582983016967773, "global_step": 415443, "epoch": 2472} {"train_loss": -12.21253776550293, "global_step": 415444, "epoch": 2472} {"train_loss": -11.952126502990723, "global_step": 415445, "epoch": 2472} {"train_loss": -12.283560752868652, "global_step": 415446, "epoch": 2472} {"train_loss": -12.21695327758789, "global_step": 415447, "epoch": 2472} {"train_loss": -12.565462112426758, "global_step": 415448, "epoch": 2472} {"train_loss": -12.023674011230469, "global_step": 415449, "epoch": 2472} {"train_loss": -12.215251922607422, "global_step": 415450, "epoch": 2472} {"train_loss": -12.761687278747559, "global_step": 415451, "epoch": 2472} {"train_loss": -12.409804344177246, "global_step": 415452, "epoch": 2472} {"train_loss": -12.44961929321289, "global_step": 415453, "epoch": 2472} {"train_loss": -12.450700759887695, "global_step": 415454, "epoch": 2472} {"train_loss": -12.646955490112305, "global_step": 415455, "epoch": 2472} {"train_loss": -12.453145980834961, "global_step": 415456, "epoch": 2472} {"train_loss": -12.520720481872559, "global_step": 415457, "epoch": 2472} {"train_loss": -12.520622253417969, "global_step": 415458, "epoch": 2472} {"train_loss": -12.567731857299805, "global_step": 415459, "epoch": 2472} {"train_loss": -12.55950927734375, "global_step": 415460, "epoch": 2472} {"train_loss": -12.638425827026367, "global_step": 415461, "epoch": 2472} {"train_loss": -12.383132934570312, "global_step": 415462, "epoch": 2472} {"train_loss": -12.082627392950512, "global_step": 415463, "epoch": 2472, "val_loss": 304316.375} {"train_loss": -12.008182525634766, "global_step": 415464, "epoch": 2473} {"train_loss": -11.941997528076172, "global_step": 415465, "epoch": 2473} {"train_loss": -11.892533302307129, "global_step": 415466, "epoch": 2473} {"train_loss": -11.537809371948242, "global_step": 415467, "epoch": 2473} {"train_loss": -11.80923080444336, "global_step": 415468, "epoch": 2473} {"train_loss": -12.076871871948242, "global_step": 415469, "epoch": 2473} {"train_loss": -11.674698829650879, "global_step": 415470, "epoch": 2473} {"train_loss": -11.228248596191406, "global_step": 415471, "epoch": 2473} {"train_loss": -12.64887809753418, "global_step": 415472, "epoch": 2473} {"train_loss": -11.994080543518066, "global_step": 415473, "epoch": 2473} {"train_loss": -11.96529769897461, "global_step": 415474, "epoch": 2473} {"train_loss": -11.828659057617188, "global_step": 415475, "epoch": 2473} {"train_loss": -12.230108261108398, "global_step": 415476, "epoch": 2473} {"train_loss": -11.254989624023438, "global_step": 415477, "epoch": 2473} {"train_loss": -12.188804626464844, "global_step": 415478, "epoch": 2473} {"train_loss": -11.799095153808594, "global_step": 415479, "epoch": 2473} {"train_loss": -12.241809844970703, "global_step": 415480, "epoch": 2473} {"train_loss": -11.82908821105957, "global_step": 415481, "epoch": 2473} {"train_loss": -12.034318923950195, "global_step": 415482, "epoch": 2473} {"train_loss": -12.232565879821777, "global_step": 415483, "epoch": 2473} {"train_loss": -11.540726661682129, "global_step": 415484, "epoch": 2473} {"train_loss": -11.145845413208008, "global_step": 415485, "epoch": 2473} {"train_loss": -12.394574165344238, "global_step": 415486, "epoch": 2473} {"train_loss": -12.108800888061523, "global_step": 415487, "epoch": 2473} {"train_loss": -11.377309799194336, "global_step": 415488, "epoch": 2473} {"train_loss": -12.346235275268555, "global_step": 415489, "epoch": 2473} {"train_loss": -12.058450698852539, "global_step": 415490, "epoch": 2473} {"train_loss": -12.308883666992188, "global_step": 415491, "epoch": 2473} {"train_loss": -12.155729293823242, "global_step": 415492, "epoch": 2473} {"train_loss": -12.181901931762695, "global_step": 415493, "epoch": 2473} {"train_loss": -11.82998275756836, "global_step": 415494, "epoch": 2473} {"train_loss": -12.087958335876465, "global_step": 415495, "epoch": 2473} {"train_loss": -11.69448471069336, "global_step": 415496, "epoch": 2473} {"train_loss": -11.989727020263672, "global_step": 415497, "epoch": 2473} {"train_loss": -11.932642936706543, "global_step": 415498, "epoch": 2473} {"train_loss": -12.11116886138916, "global_step": 415499, "epoch": 2473} {"train_loss": -12.416377067565918, "global_step": 415500, "epoch": 2473} {"train_loss": -11.96748161315918, "global_step": 415501, "epoch": 2473} {"train_loss": -11.902093887329102, "global_step": 415502, "epoch": 2473} {"train_loss": -12.542914390563965, "global_step": 415503, "epoch": 2473} {"train_loss": -12.394100189208984, "global_step": 415504, "epoch": 2473} {"train_loss": -12.180619239807129, "global_step": 415505, "epoch": 2473} {"train_loss": -12.197628021240234, "global_step": 415506, "epoch": 2473} {"train_loss": -11.701105117797852, "global_step": 415507, "epoch": 2473} {"train_loss": -12.421369552612305, "global_step": 415508, "epoch": 2473} {"train_loss": -12.06319808959961, "global_step": 415509, "epoch": 2473} {"train_loss": -12.399285316467285, "global_step": 415510, "epoch": 2473} {"train_loss": -12.19182014465332, "global_step": 415511, "epoch": 2473} {"train_loss": -11.775629043579102, "global_step": 415512, "epoch": 2473} {"train_loss": -12.113801956176758, "global_step": 415513, "epoch": 2473} {"train_loss": -12.134148597717285, "global_step": 415514, "epoch": 2473} {"train_loss": -12.427989959716797, "global_step": 415515, "epoch": 2473} {"train_loss": -12.449077606201172, "global_step": 415516, "epoch": 2473} {"train_loss": -12.38347053527832, "global_step": 415517, "epoch": 2473} {"train_loss": -12.542654037475586, "global_step": 415518, "epoch": 2473} {"train_loss": -12.193243026733398, "global_step": 415519, "epoch": 2473} {"train_loss": -12.457159042358398, "global_step": 415520, "epoch": 2473} {"train_loss": -12.392207145690918, "global_step": 415521, "epoch": 2473} {"train_loss": -12.586858749389648, "global_step": 415522, "epoch": 2473} {"train_loss": -12.12597370147705, "global_step": 415523, "epoch": 2473} {"train_loss": -12.69869613647461, "global_step": 415524, "epoch": 2473} {"train_loss": -12.493415832519531, "global_step": 415525, "epoch": 2473} {"train_loss": -12.110007286071777, "global_step": 415526, "epoch": 2473} {"train_loss": -12.506765365600586, "global_step": 415527, "epoch": 2473} {"train_loss": -12.260704040527344, "global_step": 415528, "epoch": 2473} {"train_loss": -12.33111572265625, "global_step": 415529, "epoch": 2473} {"train_loss": -12.893449783325195, "global_step": 415530, "epoch": 2473} {"train_loss": -12.497385025024414, "global_step": 415531, "epoch": 2473} {"train_loss": -12.400369644165039, "global_step": 415532, "epoch": 2473} {"train_loss": -12.373849868774414, "global_step": 415533, "epoch": 2473} {"train_loss": -11.921072006225586, "global_step": 415534, "epoch": 2473} {"train_loss": -12.517364501953125, "global_step": 415535, "epoch": 2473} {"train_loss": -12.390948295593262, "global_step": 415536, "epoch": 2473} {"train_loss": -12.123382568359375, "global_step": 415537, "epoch": 2473} {"train_loss": -12.207039833068848, "global_step": 415538, "epoch": 2473} {"train_loss": -12.37243938446045, "global_step": 415539, "epoch": 2473} {"train_loss": -10.888422012329102, "global_step": 415540, "epoch": 2473} {"train_loss": -10.510505676269531, "global_step": 415541, "epoch": 2473} {"train_loss": -12.539712905883789, "global_step": 415542, "epoch": 2473} {"train_loss": -10.534965515136719, "global_step": 415543, "epoch": 2473} {"train_loss": -10.975112915039062, "global_step": 415544, "epoch": 2473} {"train_loss": -11.434745788574219, "global_step": 415545, "epoch": 2473} {"train_loss": -10.326393127441406, "global_step": 415546, "epoch": 2473} {"train_loss": -10.280651092529297, "global_step": 415547, "epoch": 2473} {"train_loss": -9.996742248535156, "global_step": 415548, "epoch": 2473} {"train_loss": -11.241230964660645, "global_step": 415549, "epoch": 2473} {"train_loss": -10.56927490234375, "global_step": 415550, "epoch": 2473} {"train_loss": -10.471715927124023, "global_step": 415551, "epoch": 2473} {"train_loss": -11.336238861083984, "global_step": 415552, "epoch": 2473} {"train_loss": -10.380620956420898, "global_step": 415553, "epoch": 2473} {"train_loss": -10.50282096862793, "global_step": 415554, "epoch": 2473} {"train_loss": -11.229351043701172, "global_step": 415555, "epoch": 2473} {"train_loss": -10.490333557128906, "global_step": 415556, "epoch": 2473} {"train_loss": -10.317394256591797, "global_step": 415557, "epoch": 2473} {"train_loss": -10.321335792541504, "global_step": 415558, "epoch": 2473} {"train_loss": -10.819963455200195, "global_step": 415559, "epoch": 2473} {"train_loss": -11.18045711517334, "global_step": 415560, "epoch": 2473} {"train_loss": -10.494850158691406, "global_step": 415561, "epoch": 2473} {"train_loss": -10.435921669006348, "global_step": 415562, "epoch": 2473} {"train_loss": -10.015028953552246, "global_step": 415563, "epoch": 2473} {"train_loss": -11.185710906982422, "global_step": 415564, "epoch": 2473} {"train_loss": -11.184242248535156, "global_step": 415565, "epoch": 2473} {"train_loss": -11.110835075378418, "global_step": 415566, "epoch": 2473} {"train_loss": -11.469955444335938, "global_step": 415567, "epoch": 2473} {"train_loss": -11.856025695800781, "global_step": 415568, "epoch": 2473} {"train_loss": -10.745054244995117, "global_step": 415569, "epoch": 2473} {"train_loss": -11.780238151550293, "global_step": 415570, "epoch": 2473} {"train_loss": -11.687891006469727, "global_step": 415571, "epoch": 2473} {"train_loss": -11.368562698364258, "global_step": 415572, "epoch": 2473} {"train_loss": -11.721981048583984, "global_step": 415573, "epoch": 2473} {"train_loss": -11.272649765014648, "global_step": 415574, "epoch": 2473} {"train_loss": -11.88846206665039, "global_step": 415575, "epoch": 2473} {"train_loss": -11.476353645324707, "global_step": 415576, "epoch": 2473} {"train_loss": -11.918901443481445, "global_step": 415577, "epoch": 2473} {"train_loss": -11.601558685302734, "global_step": 415578, "epoch": 2473} {"train_loss": -11.671478271484375, "global_step": 415579, "epoch": 2473} {"train_loss": -11.176366806030273, "global_step": 415580, "epoch": 2473} {"train_loss": -11.721817970275879, "global_step": 415581, "epoch": 2473} {"train_loss": -11.674565315246582, "global_step": 415582, "epoch": 2473} {"train_loss": -11.927947998046875, "global_step": 415583, "epoch": 2473} {"train_loss": -11.751554489135742, "global_step": 415584, "epoch": 2473} {"train_loss": -11.425374984741211, "global_step": 415585, "epoch": 2473} {"train_loss": -12.153782844543457, "global_step": 415586, "epoch": 2473} {"train_loss": -11.549097061157227, "global_step": 415587, "epoch": 2473} {"train_loss": -12.176445007324219, "global_step": 415588, "epoch": 2473} {"train_loss": -11.604999542236328, "global_step": 415589, "epoch": 2473} {"train_loss": -12.516351699829102, "global_step": 415590, "epoch": 2473} {"train_loss": -11.907634735107422, "global_step": 415591, "epoch": 2473} {"train_loss": -12.40243911743164, "global_step": 415592, "epoch": 2473} {"train_loss": -12.204654693603516, "global_step": 415593, "epoch": 2473} {"train_loss": -11.99799919128418, "global_step": 415594, "epoch": 2473} {"train_loss": -12.12545394897461, "global_step": 415595, "epoch": 2473} {"train_loss": -11.956932067871094, "global_step": 415596, "epoch": 2473} {"train_loss": -11.807552337646484, "global_step": 415597, "epoch": 2473} {"train_loss": -12.015302658081055, "global_step": 415598, "epoch": 2473} {"train_loss": -12.175348281860352, "global_step": 415599, "epoch": 2473} {"train_loss": -12.179965019226074, "global_step": 415600, "epoch": 2473} {"train_loss": -12.00633716583252, "global_step": 415601, "epoch": 2473} {"train_loss": -11.355486869812012, "global_step": 415602, "epoch": 2473} {"train_loss": -12.102790832519531, "global_step": 415603, "epoch": 2473} {"train_loss": -10.504838943481445, "global_step": 415604, "epoch": 2473} {"train_loss": -11.879888534545898, "global_step": 415605, "epoch": 2473} {"train_loss": -11.278448104858398, "global_step": 415606, "epoch": 2473} {"train_loss": -12.05341911315918, "global_step": 415607, "epoch": 2473} {"train_loss": -11.348249435424805, "global_step": 415608, "epoch": 2473} {"train_loss": -12.223844528198242, "global_step": 415609, "epoch": 2473} {"train_loss": -11.359739303588867, "global_step": 415610, "epoch": 2473} {"train_loss": -12.181584358215332, "global_step": 415611, "epoch": 2473} {"train_loss": -11.806849479675293, "global_step": 415612, "epoch": 2473} {"train_loss": -12.020687103271484, "global_step": 415613, "epoch": 2473} {"train_loss": -12.101041793823242, "global_step": 415614, "epoch": 2473} {"train_loss": -12.073612213134766, "global_step": 415615, "epoch": 2473} {"train_loss": -11.848430633544922, "global_step": 415616, "epoch": 2473} {"train_loss": -12.3732328414917, "global_step": 415617, "epoch": 2473} {"train_loss": -11.856546401977539, "global_step": 415618, "epoch": 2473} {"train_loss": -12.349056243896484, "global_step": 415619, "epoch": 2473} {"train_loss": -11.603767395019531, "global_step": 415620, "epoch": 2473} {"train_loss": -12.01285457611084, "global_step": 415621, "epoch": 2473} {"train_loss": -11.646674156188965, "global_step": 415622, "epoch": 2473} {"train_loss": -12.416810035705566, "global_step": 415623, "epoch": 2473} {"train_loss": -11.899120330810547, "global_step": 415624, "epoch": 2473} {"train_loss": -12.295499801635742, "global_step": 415625, "epoch": 2473} {"train_loss": -12.095087051391602, "global_step": 415626, "epoch": 2473} {"train_loss": -12.214426040649414, "global_step": 415627, "epoch": 2473} {"train_loss": -11.874513626098633, "global_step": 415628, "epoch": 2473} {"train_loss": -12.241859436035156, "global_step": 415629, "epoch": 2473} {"train_loss": -11.861809730529785, "global_step": 415630, "epoch": 2473} {"train_loss": -11.800556415603275, "global_step": 415631, "epoch": 2473, "val_loss": 307455.28125} {"train_loss": -12.303255081176758, "global_step": 415632, "epoch": 2474} {"train_loss": -12.020355224609375, "global_step": 415633, "epoch": 2474} {"train_loss": -12.309385299682617, "global_step": 415634, "epoch": 2474} {"train_loss": -12.126641273498535, "global_step": 415635, "epoch": 2474} {"train_loss": -12.208566665649414, "global_step": 415636, "epoch": 2474} {"train_loss": -12.164270401000977, "global_step": 415637, "epoch": 2474} {"train_loss": -12.298742294311523, "global_step": 415638, "epoch": 2474} {"train_loss": -12.216623306274414, "global_step": 415639, "epoch": 2474} {"train_loss": -12.136344909667969, "global_step": 415640, "epoch": 2474} {"train_loss": -11.751103401184082, "global_step": 415641, "epoch": 2474} {"train_loss": -12.260650634765625, "global_step": 415642, "epoch": 2474} {"train_loss": -12.221601486206055, "global_step": 415643, "epoch": 2474} {"train_loss": -11.782840728759766, "global_step": 415644, "epoch": 2474} {"train_loss": -11.970597267150879, "global_step": 415645, "epoch": 2474} {"train_loss": -10.725845336914062, "global_step": 415646, "epoch": 2474} {"train_loss": -12.47266960144043, "global_step": 415647, "epoch": 2474} {"train_loss": -10.957817077636719, "global_step": 415648, "epoch": 2474} {"train_loss": -12.035301208496094, "global_step": 415649, "epoch": 2474} {"train_loss": -10.716384887695312, "global_step": 415650, "epoch": 2474} {"train_loss": -12.344104766845703, "global_step": 415651, "epoch": 2474} {"train_loss": -11.46106243133545, "global_step": 415652, "epoch": 2474} {"train_loss": -12.331731796264648, "global_step": 415653, "epoch": 2474} {"train_loss": -11.574268341064453, "global_step": 415654, "epoch": 2474} {"train_loss": -11.785850524902344, "global_step": 415655, "epoch": 2474} {"train_loss": -11.90174674987793, "global_step": 415656, "epoch": 2474} {"train_loss": -11.512469291687012, "global_step": 415657, "epoch": 2474} {"train_loss": -11.889930725097656, "global_step": 415658, "epoch": 2474} {"train_loss": -11.842947006225586, "global_step": 415659, "epoch": 2474} {"train_loss": -11.8229341506958, "global_step": 415660, "epoch": 2474} {"train_loss": -11.829864501953125, "global_step": 415661, "epoch": 2474} {"train_loss": -12.05078125, "global_step": 415662, "epoch": 2474} {"train_loss": -11.479854583740234, "global_step": 415663, "epoch": 2474} {"train_loss": -11.768655776977539, "global_step": 415664, "epoch": 2474} {"train_loss": -10.874669075012207, "global_step": 415665, "epoch": 2474} {"train_loss": -11.201062202453613, "global_step": 415666, "epoch": 2474} {"train_loss": -11.395306587219238, "global_step": 415667, "epoch": 2474} {"train_loss": -11.687644004821777, "global_step": 415668, "epoch": 2474} {"train_loss": -11.658031463623047, "global_step": 415669, "epoch": 2474} {"train_loss": -11.778064727783203, "global_step": 415670, "epoch": 2474} {"train_loss": -11.416330337524414, "global_step": 415671, "epoch": 2474} {"train_loss": -12.004024505615234, "global_step": 415672, "epoch": 2474} {"train_loss": -11.40749454498291, "global_step": 415673, "epoch": 2474} {"train_loss": -11.885801315307617, "global_step": 415674, "epoch": 2474} {"train_loss": -11.197478294372559, "global_step": 415675, "epoch": 2474} {"train_loss": -12.255621910095215, "global_step": 415676, "epoch": 2474} {"train_loss": -11.945642471313477, "global_step": 415677, "epoch": 2474} {"train_loss": -11.794763565063477, "global_step": 415678, "epoch": 2474} {"train_loss": -12.26113510131836, "global_step": 415679, "epoch": 2474} {"train_loss": -11.642799377441406, "global_step": 415680, "epoch": 2474} {"train_loss": -11.377887725830078, "global_step": 415681, "epoch": 2474} {"train_loss": -12.17037582397461, "global_step": 415682, "epoch": 2474} {"train_loss": -11.132539749145508, "global_step": 415683, "epoch": 2474} {"train_loss": -12.232717514038086, "global_step": 415684, "epoch": 2474} {"train_loss": -10.730513572692871, "global_step": 415685, "epoch": 2474} {"train_loss": -12.105924606323242, "global_step": 415686, "epoch": 2474} {"train_loss": -11.142332077026367, "global_step": 415687, "epoch": 2474} {"train_loss": -11.818336486816406, "global_step": 415688, "epoch": 2474} {"train_loss": -11.419478416442871, "global_step": 415689, "epoch": 2474} {"train_loss": -12.048076629638672, "global_step": 415690, "epoch": 2474} {"train_loss": -11.62093734741211, "global_step": 415691, "epoch": 2474} {"train_loss": -12.13715934753418, "global_step": 415692, "epoch": 2474} {"train_loss": -11.65066909790039, "global_step": 415693, "epoch": 2474} {"train_loss": -12.4292631149292, "global_step": 415694, "epoch": 2474} {"train_loss": -11.884669303894043, "global_step": 415695, "epoch": 2474} {"train_loss": -12.483600616455078, "global_step": 415696, "epoch": 2474} {"train_loss": -11.67646598815918, "global_step": 415697, "epoch": 2474} {"train_loss": -12.45225715637207, "global_step": 415698, "epoch": 2474} {"train_loss": -12.193464279174805, "global_step": 415699, "epoch": 2474} {"train_loss": -12.251947402954102, "global_step": 415700, "epoch": 2474} {"train_loss": -12.046567916870117, "global_step": 415701, "epoch": 2474} {"train_loss": -12.050901412963867, "global_step": 415702, "epoch": 2474} {"train_loss": -12.373546600341797, "global_step": 415703, "epoch": 2474} {"train_loss": -12.178400039672852, "global_step": 415704, "epoch": 2474} {"train_loss": -12.242156982421875, "global_step": 415705, "epoch": 2474} {"train_loss": -12.25710391998291, "global_step": 415706, "epoch": 2474} {"train_loss": -11.850172996520996, "global_step": 415707, "epoch": 2474} {"train_loss": -12.560826301574707, "global_step": 415708, "epoch": 2474} {"train_loss": -12.340103149414062, "global_step": 415709, "epoch": 2474} {"train_loss": -12.404540061950684, "global_step": 415710, "epoch": 2474} {"train_loss": -12.234031677246094, "global_step": 415711, "epoch": 2474} {"train_loss": -12.225223541259766, "global_step": 415712, "epoch": 2474} {"train_loss": -12.305354118347168, "global_step": 415713, "epoch": 2474} {"train_loss": -12.398014068603516, "global_step": 415714, "epoch": 2474} {"train_loss": -12.50938606262207, "global_step": 415715, "epoch": 2474} {"train_loss": -12.368393898010254, "global_step": 415716, "epoch": 2474} {"train_loss": -12.713460922241211, "global_step": 415717, "epoch": 2474} {"train_loss": -12.334714889526367, "global_step": 415718, "epoch": 2474} {"train_loss": -12.36988639831543, "global_step": 415719, "epoch": 2474} {"train_loss": -12.612871170043945, "global_step": 415720, "epoch": 2474} {"train_loss": -12.551409721374512, "global_step": 415721, "epoch": 2474} {"train_loss": -12.579645156860352, "global_step": 415722, "epoch": 2474} {"train_loss": -12.417815208435059, "global_step": 415723, "epoch": 2474} {"train_loss": -12.653057098388672, "global_step": 415724, "epoch": 2474} {"train_loss": -12.592388153076172, "global_step": 415725, "epoch": 2474} {"train_loss": -12.414563179016113, "global_step": 415726, "epoch": 2474} {"train_loss": -12.385262489318848, "global_step": 415727, "epoch": 2474} {"train_loss": -12.497648239135742, "global_step": 415728, "epoch": 2474} {"train_loss": -12.380062103271484, "global_step": 415729, "epoch": 2474} {"train_loss": -12.542423248291016, "global_step": 415730, "epoch": 2474} {"train_loss": -12.336738586425781, "global_step": 415731, "epoch": 2474} {"train_loss": -12.41054630279541, "global_step": 415732, "epoch": 2474} {"train_loss": -12.573927879333496, "global_step": 415733, "epoch": 2474} {"train_loss": -12.476444244384766, "global_step": 415734, "epoch": 2474} {"train_loss": -12.552249908447266, "global_step": 415735, "epoch": 2474} {"train_loss": -12.231477737426758, "global_step": 415736, "epoch": 2474} {"train_loss": -12.524859428405762, "global_step": 415737, "epoch": 2474} {"train_loss": -12.398374557495117, "global_step": 415738, "epoch": 2474} {"train_loss": -12.251834869384766, "global_step": 415739, "epoch": 2474} {"train_loss": -12.50185775756836, "global_step": 415740, "epoch": 2474} {"train_loss": -12.285038948059082, "global_step": 415741, "epoch": 2474} {"train_loss": -12.112438201904297, "global_step": 415742, "epoch": 2474} {"train_loss": -12.394903182983398, "global_step": 415743, "epoch": 2474} {"train_loss": -12.533073425292969, "global_step": 415744, "epoch": 2474} {"train_loss": -12.653539657592773, "global_step": 415745, "epoch": 2474} {"train_loss": -12.440305709838867, "global_step": 415746, "epoch": 2474} {"train_loss": -12.36117935180664, "global_step": 415747, "epoch": 2474} {"train_loss": -12.671698570251465, "global_step": 415748, "epoch": 2474} {"train_loss": -12.23603630065918, "global_step": 415749, "epoch": 2474} {"train_loss": -12.474590301513672, "global_step": 415750, "epoch": 2474} {"train_loss": -12.681310653686523, "global_step": 415751, "epoch": 2474} {"train_loss": -12.52265739440918, "global_step": 415752, "epoch": 2474} {"train_loss": -12.740814208984375, "global_step": 415753, "epoch": 2474} {"train_loss": -12.365703582763672, "global_step": 415754, "epoch": 2474} {"train_loss": -12.694307327270508, "global_step": 415755, "epoch": 2474} {"train_loss": -12.234870910644531, "global_step": 415756, "epoch": 2474} {"train_loss": -12.704816818237305, "global_step": 415757, "epoch": 2474} {"train_loss": -12.544915199279785, "global_step": 415758, "epoch": 2474} {"train_loss": -12.39872932434082, "global_step": 415759, "epoch": 2474} {"train_loss": -12.909088134765625, "global_step": 415760, "epoch": 2474} {"train_loss": -12.44749641418457, "global_step": 415761, "epoch": 2474} {"train_loss": -12.462133407592773, "global_step": 415762, "epoch": 2474} {"train_loss": -12.326610565185547, "global_step": 415763, "epoch": 2474} {"train_loss": -12.395393371582031, "global_step": 415764, "epoch": 2474} {"train_loss": -12.395051956176758, "global_step": 415765, "epoch": 2474} {"train_loss": -12.502174377441406, "global_step": 415766, "epoch": 2474} {"train_loss": -12.345483779907227, "global_step": 415767, "epoch": 2474} {"train_loss": -12.655628204345703, "global_step": 415768, "epoch": 2474} {"train_loss": -12.591598510742188, "global_step": 415769, "epoch": 2474} {"train_loss": -12.736795425415039, "global_step": 415770, "epoch": 2474} {"train_loss": -12.587116241455078, "global_step": 415771, "epoch": 2474} {"train_loss": -12.507396697998047, "global_step": 415772, "epoch": 2474} {"train_loss": -12.681635856628418, "global_step": 415773, "epoch": 2474} {"train_loss": -12.63589096069336, "global_step": 415774, "epoch": 2474} {"train_loss": -12.340627670288086, "global_step": 415775, "epoch": 2474} {"train_loss": -12.861698150634766, "global_step": 415776, "epoch": 2474} {"train_loss": -12.08203125, "global_step": 415777, "epoch": 2474} {"train_loss": -12.368115425109863, "global_step": 415778, "epoch": 2474} {"train_loss": -12.28502082824707, "global_step": 415779, "epoch": 2474} {"train_loss": -12.262679100036621, "global_step": 415780, "epoch": 2474} {"train_loss": -12.034058570861816, "global_step": 415781, "epoch": 2474} {"train_loss": -12.30698013305664, "global_step": 415782, "epoch": 2474} {"train_loss": -12.361127853393555, "global_step": 415783, "epoch": 2474} {"train_loss": -12.247310638427734, "global_step": 415784, "epoch": 2474} {"train_loss": -12.729551315307617, "global_step": 415785, "epoch": 2474} {"train_loss": -12.397241592407227, "global_step": 415786, "epoch": 2474} {"train_loss": -12.087915420532227, "global_step": 415787, "epoch": 2474} {"train_loss": -12.655742645263672, "global_step": 415788, "epoch": 2474} {"train_loss": -12.333669662475586, "global_step": 415789, "epoch": 2474} {"train_loss": -12.257184982299805, "global_step": 415790, "epoch": 2474} {"train_loss": -12.692035675048828, "global_step": 415791, "epoch": 2474} {"train_loss": -12.363718032836914, "global_step": 415792, "epoch": 2474} {"train_loss": -12.737462997436523, "global_step": 415793, "epoch": 2474} {"train_loss": -12.708120346069336, "global_step": 415794, "epoch": 2474} {"train_loss": -12.664118766784668, "global_step": 415795, "epoch": 2474} {"train_loss": -12.127131462097168, "global_step": 415796, "epoch": 2474} {"train_loss": -12.383111000061035, "global_step": 415797, "epoch": 2474} {"train_loss": -12.663753509521484, "global_step": 415798, "epoch": 2474} {"train_loss": -12.185596613656907, "global_step": 415799, "epoch": 2474, "val_loss": 306354.90625} {"train_loss": -12.586288452148438, "global_step": 415800, "epoch": 2475} {"train_loss": -12.399415969848633, "global_step": 415801, "epoch": 2475} {"train_loss": -12.608085632324219, "global_step": 415802, "epoch": 2475} {"train_loss": -12.33525276184082, "global_step": 415803, "epoch": 2475} {"train_loss": -12.477364540100098, "global_step": 415804, "epoch": 2475} {"train_loss": -12.242216110229492, "global_step": 415805, "epoch": 2475} {"train_loss": -12.166670799255371, "global_step": 415806, "epoch": 2475} {"train_loss": -12.246145248413086, "global_step": 415807, "epoch": 2475} {"train_loss": -12.231794357299805, "global_step": 415808, "epoch": 2475} {"train_loss": -12.027088165283203, "global_step": 415809, "epoch": 2475} {"train_loss": -11.395971298217773, "global_step": 415810, "epoch": 2475} {"train_loss": -11.31381607055664, "global_step": 415811, "epoch": 2475} {"train_loss": -11.361062049865723, "global_step": 415812, "epoch": 2475} {"train_loss": -12.314691543579102, "global_step": 415813, "epoch": 2475} {"train_loss": -11.709531784057617, "global_step": 415814, "epoch": 2475} {"train_loss": -12.217097282409668, "global_step": 415815, "epoch": 2475} {"train_loss": -12.354964256286621, "global_step": 415816, "epoch": 2475} {"train_loss": -11.436013221740723, "global_step": 415817, "epoch": 2475} {"train_loss": -12.532293319702148, "global_step": 415818, "epoch": 2475} {"train_loss": -12.493837356567383, "global_step": 415819, "epoch": 2475} {"train_loss": -12.004859924316406, "global_step": 415820, "epoch": 2475} {"train_loss": -11.293333053588867, "global_step": 415821, "epoch": 2475} {"train_loss": -12.532027244567871, "global_step": 415822, "epoch": 2475} {"train_loss": -11.462630271911621, "global_step": 415823, "epoch": 2475} {"train_loss": -10.54700756072998, "global_step": 415824, "epoch": 2475} {"train_loss": -12.067557334899902, "global_step": 415825, "epoch": 2475} {"train_loss": -10.905583381652832, "global_step": 415826, "epoch": 2475} {"train_loss": -11.914348602294922, "global_step": 415827, "epoch": 2475} {"train_loss": -12.040786743164062, "global_step": 415828, "epoch": 2475} {"train_loss": -9.656394958496094, "global_step": 415829, "epoch": 2475} {"train_loss": -11.712432861328125, "global_step": 415830, "epoch": 2475} {"train_loss": -9.67020034790039, "global_step": 415831, "epoch": 2475} {"train_loss": -11.217974662780762, "global_step": 415832, "epoch": 2475} {"train_loss": -10.971918106079102, "global_step": 415833, "epoch": 2475} {"train_loss": -10.47891616821289, "global_step": 415834, "epoch": 2475} {"train_loss": -11.343313217163086, "global_step": 415835, "epoch": 2475} {"train_loss": -10.340612411499023, "global_step": 415836, "epoch": 2475} {"train_loss": -11.462237358093262, "global_step": 415837, "epoch": 2475} {"train_loss": -11.182197570800781, "global_step": 415838, "epoch": 2475} {"train_loss": -11.482308387756348, "global_step": 415839, "epoch": 2475} {"train_loss": -11.048206329345703, "global_step": 415840, "epoch": 2475} {"train_loss": -11.493790626525879, "global_step": 415841, "epoch": 2475} {"train_loss": -10.738861083984375, "global_step": 415842, "epoch": 2475} {"train_loss": -11.792989730834961, "global_step": 415843, "epoch": 2475} {"train_loss": -11.070274353027344, "global_step": 415844, "epoch": 2475} {"train_loss": -10.633432388305664, "global_step": 415845, "epoch": 2475} {"train_loss": -11.499086380004883, "global_step": 415846, "epoch": 2475} {"train_loss": -11.635448455810547, "global_step": 415847, "epoch": 2475} {"train_loss": -11.704598426818848, "global_step": 415848, "epoch": 2475} {"train_loss": -11.678466796875, "global_step": 415849, "epoch": 2475} {"train_loss": -11.651196479797363, "global_step": 415850, "epoch": 2475} {"train_loss": -11.916727066040039, "global_step": 415851, "epoch": 2475} {"train_loss": -11.589021682739258, "global_step": 415852, "epoch": 2475} {"train_loss": -12.009350776672363, "global_step": 415853, "epoch": 2475} {"train_loss": -11.435972213745117, "global_step": 415854, "epoch": 2475} {"train_loss": -12.17127799987793, "global_step": 415855, "epoch": 2475} {"train_loss": -11.67841625213623, "global_step": 415856, "epoch": 2475} {"train_loss": -11.890220642089844, "global_step": 415857, "epoch": 2475} {"train_loss": -11.698498725891113, "global_step": 415858, "epoch": 2475} {"train_loss": -10.840188980102539, "global_step": 415859, "epoch": 2475} {"train_loss": -11.834821701049805, "global_step": 415860, "epoch": 2475} {"train_loss": -12.264627456665039, "global_step": 415861, "epoch": 2475} {"train_loss": -11.888182640075684, "global_step": 415862, "epoch": 2475} {"train_loss": -12.096317291259766, "global_step": 415863, "epoch": 2475} {"train_loss": -11.685245513916016, "global_step": 415864, "epoch": 2475} {"train_loss": -12.040069580078125, "global_step": 415865, "epoch": 2475} {"train_loss": -11.919021606445312, "global_step": 415866, "epoch": 2475} {"train_loss": -12.304666519165039, "global_step": 415867, "epoch": 2475} {"train_loss": -11.903633117675781, "global_step": 415868, "epoch": 2475} {"train_loss": -12.191513061523438, "global_step": 415869, "epoch": 2475} {"train_loss": -11.976268768310547, "global_step": 415870, "epoch": 2475} {"train_loss": -11.995864868164062, "global_step": 415871, "epoch": 2475} {"train_loss": -11.76169204711914, "global_step": 415872, "epoch": 2475} {"train_loss": -12.114468574523926, "global_step": 415873, "epoch": 2475} {"train_loss": -11.873332977294922, "global_step": 415874, "epoch": 2475} {"train_loss": -12.040064811706543, "global_step": 415875, "epoch": 2475} {"train_loss": -12.015730857849121, "global_step": 415876, "epoch": 2475} {"train_loss": -11.365745544433594, "global_step": 415877, "epoch": 2475} {"train_loss": -12.379690170288086, "global_step": 415878, "epoch": 2475} {"train_loss": -11.669417381286621, "global_step": 415879, "epoch": 2475} {"train_loss": -12.176794052124023, "global_step": 415880, "epoch": 2475} {"train_loss": -12.14218807220459, "global_step": 415881, "epoch": 2475} {"train_loss": -11.457466125488281, "global_step": 415882, "epoch": 2475} {"train_loss": -11.971839904785156, "global_step": 415883, "epoch": 2475} {"train_loss": -11.960636138916016, "global_step": 415884, "epoch": 2475} {"train_loss": -11.844086647033691, "global_step": 415885, "epoch": 2475} {"train_loss": -12.227781295776367, "global_step": 415886, "epoch": 2475} {"train_loss": -11.392980575561523, "global_step": 415887, "epoch": 2475} {"train_loss": -11.762246131896973, "global_step": 415888, "epoch": 2475} {"train_loss": -11.764032363891602, "global_step": 415889, "epoch": 2475} {"train_loss": -12.086587905883789, "global_step": 415890, "epoch": 2475} {"train_loss": -11.780045509338379, "global_step": 415891, "epoch": 2475} {"train_loss": -12.090807914733887, "global_step": 415892, "epoch": 2475} {"train_loss": -12.354236602783203, "global_step": 415893, "epoch": 2475} {"train_loss": -12.184008598327637, "global_step": 415894, "epoch": 2475} {"train_loss": -12.273835182189941, "global_step": 415895, "epoch": 2475} {"train_loss": -12.29826545715332, "global_step": 415896, "epoch": 2475} {"train_loss": -12.36328125, "global_step": 415897, "epoch": 2475} {"train_loss": -12.26424789428711, "global_step": 415898, "epoch": 2475} {"train_loss": -12.406842231750488, "global_step": 415899, "epoch": 2475} {"train_loss": -12.309221267700195, "global_step": 415900, "epoch": 2475} {"train_loss": -12.265726089477539, "global_step": 415901, "epoch": 2475} {"train_loss": -12.002202987670898, "global_step": 415902, "epoch": 2475} {"train_loss": -12.138813018798828, "global_step": 415903, "epoch": 2475} {"train_loss": -12.332998275756836, "global_step": 415904, "epoch": 2475} {"train_loss": -12.192023277282715, "global_step": 415905, "epoch": 2475} {"train_loss": -12.21596908569336, "global_step": 415906, "epoch": 2475} {"train_loss": -12.08485221862793, "global_step": 415907, "epoch": 2475} {"train_loss": -12.109842300415039, "global_step": 415908, "epoch": 2475} {"train_loss": -12.129573822021484, "global_step": 415909, "epoch": 2475} {"train_loss": -12.339470863342285, "global_step": 415910, "epoch": 2475} {"train_loss": -11.969417572021484, "global_step": 415911, "epoch": 2475} {"train_loss": -12.438311576843262, "global_step": 415912, "epoch": 2475} {"train_loss": -12.147024154663086, "global_step": 415913, "epoch": 2475} {"train_loss": -11.962279319763184, "global_step": 415914, "epoch": 2475} {"train_loss": -12.237436294555664, "global_step": 415915, "epoch": 2475} {"train_loss": -11.9852294921875, "global_step": 415916, "epoch": 2475} {"train_loss": -11.875181198120117, "global_step": 415917, "epoch": 2475} {"train_loss": -11.617767333984375, "global_step": 415918, "epoch": 2475} {"train_loss": -11.989442825317383, "global_step": 415919, "epoch": 2475} {"train_loss": -11.053071022033691, "global_step": 415920, "epoch": 2475} {"train_loss": -11.419561386108398, "global_step": 415921, "epoch": 2475} {"train_loss": -10.015121459960938, "global_step": 415922, "epoch": 2475} {"train_loss": -11.064691543579102, "global_step": 415923, "epoch": 2475} {"train_loss": -10.296579360961914, "global_step": 415924, "epoch": 2475} {"train_loss": -10.989957809448242, "global_step": 415925, "epoch": 2475} {"train_loss": -11.564416885375977, "global_step": 415926, "epoch": 2475} {"train_loss": -11.198530197143555, "global_step": 415927, "epoch": 2475} {"train_loss": -10.987465858459473, "global_step": 415928, "epoch": 2475} {"train_loss": -12.034102439880371, "global_step": 415929, "epoch": 2475} {"train_loss": -11.395801544189453, "global_step": 415930, "epoch": 2475} {"train_loss": -11.099464416503906, "global_step": 415931, "epoch": 2475} {"train_loss": -12.020800590515137, "global_step": 415932, "epoch": 2475} {"train_loss": -10.863444328308105, "global_step": 415933, "epoch": 2475} {"train_loss": -12.18046760559082, "global_step": 415934, "epoch": 2475} {"train_loss": -11.33193302154541, "global_step": 415935, "epoch": 2475} {"train_loss": -11.87667179107666, "global_step": 415936, "epoch": 2475} {"train_loss": -11.810771942138672, "global_step": 415937, "epoch": 2475} {"train_loss": -11.608542442321777, "global_step": 415938, "epoch": 2475} {"train_loss": -11.74402141571045, "global_step": 415939, "epoch": 2475} {"train_loss": -11.449807167053223, "global_step": 415940, "epoch": 2475} {"train_loss": -11.539291381835938, "global_step": 415941, "epoch": 2475} {"train_loss": -11.861089706420898, "global_step": 415942, "epoch": 2475} {"train_loss": -11.584672927856445, "global_step": 415943, "epoch": 2475} {"train_loss": -12.270559310913086, "global_step": 415944, "epoch": 2475} {"train_loss": -12.168789863586426, "global_step": 415945, "epoch": 2475} {"train_loss": -12.006464958190918, "global_step": 415946, "epoch": 2475} {"train_loss": -11.93325424194336, "global_step": 415947, "epoch": 2475} {"train_loss": -11.6343355178833, "global_step": 415948, "epoch": 2475} {"train_loss": -12.031106948852539, "global_step": 415949, "epoch": 2475} {"train_loss": -11.806512832641602, "global_step": 415950, "epoch": 2475} {"train_loss": -12.098241806030273, "global_step": 415951, "epoch": 2475} {"train_loss": -11.639212608337402, "global_step": 415952, "epoch": 2475} {"train_loss": -12.498000144958496, "global_step": 415953, "epoch": 2475} {"train_loss": -11.876558303833008, "global_step": 415954, "epoch": 2475} {"train_loss": -12.334436416625977, "global_step": 415955, "epoch": 2475} {"train_loss": -12.310789108276367, "global_step": 415956, "epoch": 2475} {"train_loss": -11.944538116455078, "global_step": 415957, "epoch": 2475} {"train_loss": -12.398235321044922, "global_step": 415958, "epoch": 2475} {"train_loss": -11.849737167358398, "global_step": 415959, "epoch": 2475} {"train_loss": -12.206415176391602, "global_step": 415960, "epoch": 2475} {"train_loss": -12.214009284973145, "global_step": 415961, "epoch": 2475} {"train_loss": -12.242231369018555, "global_step": 415962, "epoch": 2475} {"train_loss": -12.219606399536133, "global_step": 415963, "epoch": 2475} {"train_loss": -12.383316040039062, "global_step": 415964, "epoch": 2475} {"train_loss": -12.512962341308594, "global_step": 415965, "epoch": 2475} {"train_loss": -12.443948745727539, "global_step": 415966, "epoch": 2475} {"train_loss": -11.80785616238912, "global_step": 415967, "epoch": 2475, "val_loss": 306734.0625, "train_action_mse_error": 0.16643545031547546} {"train_loss": -12.140424728393555, "global_step": 415968, "epoch": 2476} {"train_loss": -12.26136589050293, "global_step": 415969, "epoch": 2476} {"train_loss": -11.825794219970703, "global_step": 415970, "epoch": 2476} {"train_loss": -12.408554077148438, "global_step": 415971, "epoch": 2476} {"train_loss": -12.140052795410156, "global_step": 415972, "epoch": 2476} {"train_loss": -12.289700508117676, "global_step": 415973, "epoch": 2476} {"train_loss": -12.383576393127441, "global_step": 415974, "epoch": 2476} {"train_loss": -12.380152702331543, "global_step": 415975, "epoch": 2476} {"train_loss": -12.348709106445312, "global_step": 415976, "epoch": 2476} {"train_loss": -12.355539321899414, "global_step": 415977, "epoch": 2476} {"train_loss": -12.42325210571289, "global_step": 415978, "epoch": 2476} {"train_loss": -12.393495559692383, "global_step": 415979, "epoch": 2476} {"train_loss": -12.119759559631348, "global_step": 415980, "epoch": 2476} {"train_loss": -12.51274299621582, "global_step": 415981, "epoch": 2476} {"train_loss": -12.55130386352539, "global_step": 415982, "epoch": 2476} {"train_loss": -12.318313598632812, "global_step": 415983, "epoch": 2476} {"train_loss": -12.559715270996094, "global_step": 415984, "epoch": 2476} {"train_loss": -12.205669403076172, "global_step": 415985, "epoch": 2476} {"train_loss": -12.539901733398438, "global_step": 415986, "epoch": 2476} {"train_loss": -12.390594482421875, "global_step": 415987, "epoch": 2476} {"train_loss": -12.374431610107422, "global_step": 415988, "epoch": 2476} {"train_loss": -12.528726577758789, "global_step": 415989, "epoch": 2476} {"train_loss": -12.518331527709961, "global_step": 415990, "epoch": 2476} {"train_loss": -12.300777435302734, "global_step": 415991, "epoch": 2476} {"train_loss": -12.51561164855957, "global_step": 415992, "epoch": 2476} {"train_loss": -12.350035667419434, "global_step": 415993, "epoch": 2476} {"train_loss": -12.753385543823242, "global_step": 415994, "epoch": 2476} {"train_loss": -12.267463684082031, "global_step": 415995, "epoch": 2476} {"train_loss": -12.659297943115234, "global_step": 415996, "epoch": 2476} {"train_loss": -12.536457061767578, "global_step": 415997, "epoch": 2476} {"train_loss": -12.5236234664917, "global_step": 415998, "epoch": 2476} {"train_loss": -12.590412139892578, "global_step": 415999, "epoch": 2476} {"train_loss": -12.58253002166748, "global_step": 416000, "epoch": 2476} {"train_loss": -12.78282642364502, "global_step": 416001, "epoch": 2476} {"train_loss": -12.490399360656738, "global_step": 416002, "epoch": 2476} {"train_loss": -12.81202220916748, "global_step": 416003, "epoch": 2476} {"train_loss": -12.77306079864502, "global_step": 416004, "epoch": 2476} {"train_loss": -12.435827255249023, "global_step": 416005, "epoch": 2476} {"train_loss": -12.71484375, "global_step": 416006, "epoch": 2476} {"train_loss": -12.363576889038086, "global_step": 416007, "epoch": 2476} {"train_loss": -12.750655174255371, "global_step": 416008, "epoch": 2476} {"train_loss": -12.605473518371582, "global_step": 416009, "epoch": 2476} {"train_loss": -12.444607734680176, "global_step": 416010, "epoch": 2476} {"train_loss": -12.51873779296875, "global_step": 416011, "epoch": 2476} {"train_loss": -12.47132396697998, "global_step": 416012, "epoch": 2476} {"train_loss": -12.76560115814209, "global_step": 416013, "epoch": 2476} {"train_loss": -12.459927558898926, "global_step": 416014, "epoch": 2476} {"train_loss": -12.828531265258789, "global_step": 416015, "epoch": 2476} {"train_loss": -12.72107982635498, "global_step": 416016, "epoch": 2476} {"train_loss": -12.711734771728516, "global_step": 416017, "epoch": 2476} {"train_loss": -12.534626960754395, "global_step": 416018, "epoch": 2476} {"train_loss": -12.795183181762695, "global_step": 416019, "epoch": 2476} {"train_loss": -12.624682426452637, "global_step": 416020, "epoch": 2476} {"train_loss": -12.61329460144043, "global_step": 416021, "epoch": 2476} {"train_loss": -12.505544662475586, "global_step": 416022, "epoch": 2476} {"train_loss": -12.779823303222656, "global_step": 416023, "epoch": 2476} {"train_loss": -12.712447166442871, "global_step": 416024, "epoch": 2476} {"train_loss": -12.599614143371582, "global_step": 416025, "epoch": 2476} {"train_loss": -12.651902198791504, "global_step": 416026, "epoch": 2476} {"train_loss": -12.745830535888672, "global_step": 416027, "epoch": 2476} {"train_loss": -12.803291320800781, "global_step": 416028, "epoch": 2476} {"train_loss": -12.674967765808105, "global_step": 416029, "epoch": 2476} {"train_loss": -12.438097953796387, "global_step": 416030, "epoch": 2476} {"train_loss": -12.869439125061035, "global_step": 416031, "epoch": 2476} {"train_loss": -12.1781005859375, "global_step": 416032, "epoch": 2476} {"train_loss": -12.886985778808594, "global_step": 416033, "epoch": 2476} {"train_loss": -12.728757858276367, "global_step": 416034, "epoch": 2476} {"train_loss": -12.826452255249023, "global_step": 416035, "epoch": 2476} {"train_loss": -12.537214279174805, "global_step": 416036, "epoch": 2476} {"train_loss": -12.585086822509766, "global_step": 416037, "epoch": 2476} {"train_loss": -12.750120162963867, "global_step": 416038, "epoch": 2476} {"train_loss": -12.758513450622559, "global_step": 416039, "epoch": 2476} {"train_loss": -12.548527717590332, "global_step": 416040, "epoch": 2476} {"train_loss": -12.71098804473877, "global_step": 416041, "epoch": 2476} {"train_loss": -12.544098854064941, "global_step": 416042, "epoch": 2476} {"train_loss": -12.38199234008789, "global_step": 416043, "epoch": 2476} {"train_loss": -12.20134162902832, "global_step": 416044, "epoch": 2476} {"train_loss": -12.575176239013672, "global_step": 416045, "epoch": 2476} {"train_loss": -12.684722900390625, "global_step": 416046, "epoch": 2476} {"train_loss": -12.714885711669922, "global_step": 416047, "epoch": 2476} {"train_loss": -11.010225296020508, "global_step": 416048, "epoch": 2476} {"train_loss": -12.216833114624023, "global_step": 416049, "epoch": 2476} {"train_loss": -12.337127685546875, "global_step": 416050, "epoch": 2476} {"train_loss": -12.593177795410156, "global_step": 416051, "epoch": 2476} {"train_loss": -11.252403259277344, "global_step": 416052, "epoch": 2476} {"train_loss": -11.379297256469727, "global_step": 416053, "epoch": 2476} {"train_loss": -11.32702350616455, "global_step": 416054, "epoch": 2476} {"train_loss": -11.164588928222656, "global_step": 416055, "epoch": 2476} {"train_loss": -12.392929077148438, "global_step": 416056, "epoch": 2476} {"train_loss": -11.65178108215332, "global_step": 416057, "epoch": 2476} {"train_loss": -11.406488418579102, "global_step": 416058, "epoch": 2476} {"train_loss": -11.987100601196289, "global_step": 416059, "epoch": 2476} {"train_loss": -11.921807289123535, "global_step": 416060, "epoch": 2476} {"train_loss": -10.15390682220459, "global_step": 416061, "epoch": 2476} {"train_loss": -11.875468254089355, "global_step": 416062, "epoch": 2476} {"train_loss": -11.801240921020508, "global_step": 416063, "epoch": 2476} {"train_loss": -10.619626998901367, "global_step": 416064, "epoch": 2476} {"train_loss": -11.890365600585938, "global_step": 416065, "epoch": 2476} {"train_loss": -11.293033599853516, "global_step": 416066, "epoch": 2476} {"train_loss": -10.676017761230469, "global_step": 416067, "epoch": 2476} {"train_loss": -11.442716598510742, "global_step": 416068, "epoch": 2476} {"train_loss": -9.31554126739502, "global_step": 416069, "epoch": 2476} {"train_loss": -9.92044448852539, "global_step": 416070, "epoch": 2476} {"train_loss": -10.337519645690918, "global_step": 416071, "epoch": 2476} {"train_loss": -10.946097373962402, "global_step": 416072, "epoch": 2476} {"train_loss": -8.769880294799805, "global_step": 416073, "epoch": 2476} {"train_loss": -10.38155746459961, "global_step": 416074, "epoch": 2476} {"train_loss": -10.95663070678711, "global_step": 416075, "epoch": 2476} {"train_loss": -10.189837455749512, "global_step": 416076, "epoch": 2476} {"train_loss": -9.552803039550781, "global_step": 416077, "epoch": 2476} {"train_loss": -10.370976448059082, "global_step": 416078, "epoch": 2476} {"train_loss": -10.498281478881836, "global_step": 416079, "epoch": 2476} {"train_loss": -9.432723045349121, "global_step": 416080, "epoch": 2476} {"train_loss": -10.522562026977539, "global_step": 416081, "epoch": 2476} {"train_loss": -10.219453811645508, "global_step": 416082, "epoch": 2476} {"train_loss": -8.446356773376465, "global_step": 416083, "epoch": 2476} {"train_loss": -9.017781257629395, "global_step": 416084, "epoch": 2476} {"train_loss": -11.58664608001709, "global_step": 416085, "epoch": 2476} {"train_loss": -8.307384490966797, "global_step": 416086, "epoch": 2476} {"train_loss": -10.860214233398438, "global_step": 416087, "epoch": 2476} {"train_loss": -10.811317443847656, "global_step": 416088, "epoch": 2476} {"train_loss": -10.734128952026367, "global_step": 416089, "epoch": 2476} {"train_loss": -11.185853004455566, "global_step": 416090, "epoch": 2476} {"train_loss": -10.464879989624023, "global_step": 416091, "epoch": 2476} {"train_loss": -10.270954132080078, "global_step": 416092, "epoch": 2476} {"train_loss": -10.860708236694336, "global_step": 416093, "epoch": 2476} {"train_loss": -11.022638320922852, "global_step": 416094, "epoch": 2476} {"train_loss": -10.45380973815918, "global_step": 416095, "epoch": 2476} {"train_loss": -11.648965835571289, "global_step": 416096, "epoch": 2476} {"train_loss": -10.613496780395508, "global_step": 416097, "epoch": 2476} {"train_loss": -11.615713119506836, "global_step": 416098, "epoch": 2476} {"train_loss": -10.441459655761719, "global_step": 416099, "epoch": 2476} {"train_loss": -10.748425483703613, "global_step": 416100, "epoch": 2476} {"train_loss": -10.998948097229004, "global_step": 416101, "epoch": 2476} {"train_loss": -11.58169174194336, "global_step": 416102, "epoch": 2476} {"train_loss": -10.937493324279785, "global_step": 416103, "epoch": 2476} {"train_loss": -11.637208938598633, "global_step": 416104, "epoch": 2476} {"train_loss": -10.366109848022461, "global_step": 416105, "epoch": 2476} {"train_loss": -12.054593086242676, "global_step": 416106, "epoch": 2476} {"train_loss": -11.324945449829102, "global_step": 416107, "epoch": 2476} {"train_loss": -11.462335586547852, "global_step": 416108, "epoch": 2476} {"train_loss": -11.193582534790039, "global_step": 416109, "epoch": 2476} {"train_loss": -11.478736877441406, "global_step": 416110, "epoch": 2476} {"train_loss": -11.64178466796875, "global_step": 416111, "epoch": 2476} {"train_loss": -11.855413436889648, "global_step": 416112, "epoch": 2476} {"train_loss": -11.907044410705566, "global_step": 416113, "epoch": 2476} {"train_loss": -11.401642799377441, "global_step": 416114, "epoch": 2476} {"train_loss": -11.521992683410645, "global_step": 416115, "epoch": 2476} {"train_loss": -11.103553771972656, "global_step": 416116, "epoch": 2476} {"train_loss": -10.605544090270996, "global_step": 416117, "epoch": 2476} {"train_loss": -12.157588958740234, "global_step": 416118, "epoch": 2476} {"train_loss": -10.138050079345703, "global_step": 416119, "epoch": 2476} {"train_loss": -10.325651168823242, "global_step": 416120, "epoch": 2476} {"train_loss": -11.269182205200195, "global_step": 416121, "epoch": 2476} {"train_loss": -11.717096328735352, "global_step": 416122, "epoch": 2476} {"train_loss": -10.841779708862305, "global_step": 416123, "epoch": 2476} {"train_loss": -11.203376770019531, "global_step": 416124, "epoch": 2476} {"train_loss": -11.639801025390625, "global_step": 416125, "epoch": 2476} {"train_loss": -10.811595916748047, "global_step": 416126, "epoch": 2476} {"train_loss": -11.385564804077148, "global_step": 416127, "epoch": 2476} {"train_loss": -11.455757141113281, "global_step": 416128, "epoch": 2476} {"train_loss": -11.123594284057617, "global_step": 416129, "epoch": 2476} {"train_loss": -11.102127075195312, "global_step": 416130, "epoch": 2476} {"train_loss": -11.61176872253418, "global_step": 416131, "epoch": 2476} {"train_loss": -11.160895347595215, "global_step": 416132, "epoch": 2476} {"train_loss": -11.538248062133789, "global_step": 416133, "epoch": 2476} {"train_loss": -11.942880630493164, "global_step": 416134, "epoch": 2476} {"train_loss": -11.73642783505576, "global_step": 416135, "epoch": 2476, "val_loss": 300093.125} {"train_loss": -11.725433349609375, "global_step": 416136, "epoch": 2477} {"train_loss": -11.640449523925781, "global_step": 416137, "epoch": 2477} {"train_loss": -11.665569305419922, "global_step": 416138, "epoch": 2477} {"train_loss": -11.660331726074219, "global_step": 416139, "epoch": 2477} {"train_loss": -11.565034866333008, "global_step": 416140, "epoch": 2477} {"train_loss": -11.978500366210938, "global_step": 416141, "epoch": 2477} {"train_loss": -11.629432678222656, "global_step": 416142, "epoch": 2477} {"train_loss": -12.143367767333984, "global_step": 416143, "epoch": 2477} {"train_loss": -12.22039794921875, "global_step": 416144, "epoch": 2477} {"train_loss": -11.817161560058594, "global_step": 416145, "epoch": 2477} {"train_loss": -11.949315071105957, "global_step": 416146, "epoch": 2477} {"train_loss": -12.078497886657715, "global_step": 416147, "epoch": 2477} {"train_loss": -11.772380828857422, "global_step": 416148, "epoch": 2477} {"train_loss": -11.726588249206543, "global_step": 416149, "epoch": 2477} {"train_loss": -11.6939058303833, "global_step": 416150, "epoch": 2477} {"train_loss": -12.069923400878906, "global_step": 416151, "epoch": 2477} {"train_loss": -12.077690124511719, "global_step": 416152, "epoch": 2477} {"train_loss": -12.075845718383789, "global_step": 416153, "epoch": 2477} {"train_loss": -11.873678207397461, "global_step": 416154, "epoch": 2477} {"train_loss": -12.144588470458984, "global_step": 416155, "epoch": 2477} {"train_loss": -12.080521583557129, "global_step": 416156, "epoch": 2477} {"train_loss": -12.216011047363281, "global_step": 416157, "epoch": 2477} {"train_loss": -12.232982635498047, "global_step": 416158, "epoch": 2477} {"train_loss": -12.190529823303223, "global_step": 416159, "epoch": 2477} {"train_loss": -12.29593276977539, "global_step": 416160, "epoch": 2477} {"train_loss": -12.223388671875, "global_step": 416161, "epoch": 2477} {"train_loss": -12.307655334472656, "global_step": 416162, "epoch": 2477} {"train_loss": -12.3635892868042, "global_step": 416163, "epoch": 2477} {"train_loss": -12.18704605102539, "global_step": 416164, "epoch": 2477} {"train_loss": -12.538299560546875, "global_step": 416165, "epoch": 2477} {"train_loss": -11.93227767944336, "global_step": 416166, "epoch": 2477} {"train_loss": -12.341087341308594, "global_step": 416167, "epoch": 2477} {"train_loss": -12.492044448852539, "global_step": 416168, "epoch": 2477} {"train_loss": -12.10568618774414, "global_step": 416169, "epoch": 2477} {"train_loss": -12.217962265014648, "global_step": 416170, "epoch": 2477} {"train_loss": -12.07363224029541, "global_step": 416171, "epoch": 2477} {"train_loss": -12.371073722839355, "global_step": 416172, "epoch": 2477} {"train_loss": -12.355323791503906, "global_step": 416173, "epoch": 2477} {"train_loss": -12.437196731567383, "global_step": 416174, "epoch": 2477} {"train_loss": -12.430760383605957, "global_step": 416175, "epoch": 2477} {"train_loss": -12.418289184570312, "global_step": 416176, "epoch": 2477} {"train_loss": -12.428336143493652, "global_step": 416177, "epoch": 2477} {"train_loss": -12.616554260253906, "global_step": 416178, "epoch": 2477} {"train_loss": -12.564634323120117, "global_step": 416179, "epoch": 2477} {"train_loss": -12.414872169494629, "global_step": 416180, "epoch": 2477} {"train_loss": -12.553983688354492, "global_step": 416181, "epoch": 2477} {"train_loss": -12.345978736877441, "global_step": 416182, "epoch": 2477} {"train_loss": -12.6386079788208, "global_step": 416183, "epoch": 2477} {"train_loss": -12.655126571655273, "global_step": 416184, "epoch": 2477} {"train_loss": -12.24339485168457, "global_step": 416185, "epoch": 2477} {"train_loss": -12.554505348205566, "global_step": 416186, "epoch": 2477} {"train_loss": -12.343832969665527, "global_step": 416187, "epoch": 2477} {"train_loss": -12.487874984741211, "global_step": 416188, "epoch": 2477} {"train_loss": -12.705853462219238, "global_step": 416189, "epoch": 2477} {"train_loss": -12.660967826843262, "global_step": 416190, "epoch": 2477} {"train_loss": -12.798439025878906, "global_step": 416191, "epoch": 2477} {"train_loss": -12.365875244140625, "global_step": 416192, "epoch": 2477} {"train_loss": -12.392372131347656, "global_step": 416193, "epoch": 2477} {"train_loss": -12.502960205078125, "global_step": 416194, "epoch": 2477} {"train_loss": -12.570975303649902, "global_step": 416195, "epoch": 2477} {"train_loss": -12.47536849975586, "global_step": 416196, "epoch": 2477} {"train_loss": -12.411924362182617, "global_step": 416197, "epoch": 2477} {"train_loss": -12.565595626831055, "global_step": 416198, "epoch": 2477} {"train_loss": -12.756293296813965, "global_step": 416199, "epoch": 2477} {"train_loss": -12.60216236114502, "global_step": 416200, "epoch": 2477} {"train_loss": -12.880533218383789, "global_step": 416201, "epoch": 2477} {"train_loss": -12.766876220703125, "global_step": 416202, "epoch": 2477} {"train_loss": -12.596257209777832, "global_step": 416203, "epoch": 2477} {"train_loss": -12.705275535583496, "global_step": 416204, "epoch": 2477} {"train_loss": -12.761307716369629, "global_step": 416205, "epoch": 2477} {"train_loss": -12.765701293945312, "global_step": 416206, "epoch": 2477} {"train_loss": -12.766549110412598, "global_step": 416207, "epoch": 2477} {"train_loss": -12.720388412475586, "global_step": 416208, "epoch": 2477} {"train_loss": -12.250276565551758, "global_step": 416209, "epoch": 2477} {"train_loss": -12.713980674743652, "global_step": 416210, "epoch": 2477} {"train_loss": -12.51064682006836, "global_step": 416211, "epoch": 2477} {"train_loss": -12.532803535461426, "global_step": 416212, "epoch": 2477} {"train_loss": -12.671874046325684, "global_step": 416213, "epoch": 2477} {"train_loss": -12.403034210205078, "global_step": 416214, "epoch": 2477} {"train_loss": -12.614389419555664, "global_step": 416215, "epoch": 2477} {"train_loss": -12.807598114013672, "global_step": 416216, "epoch": 2477} {"train_loss": -12.2757568359375, "global_step": 416217, "epoch": 2477} {"train_loss": -12.814923286437988, "global_step": 416218, "epoch": 2477} {"train_loss": -12.780176162719727, "global_step": 416219, "epoch": 2477} {"train_loss": -12.297514915466309, "global_step": 416220, "epoch": 2477} {"train_loss": -12.707481384277344, "global_step": 416221, "epoch": 2477} {"train_loss": -12.704462051391602, "global_step": 416222, "epoch": 2477} {"train_loss": -12.701860427856445, "global_step": 416223, "epoch": 2477} {"train_loss": -12.684891700744629, "global_step": 416224, "epoch": 2477} {"train_loss": -12.592424392700195, "global_step": 416225, "epoch": 2477} {"train_loss": -12.70321273803711, "global_step": 416226, "epoch": 2477} {"train_loss": -12.436426162719727, "global_step": 416227, "epoch": 2477} {"train_loss": -12.7095308303833, "global_step": 416228, "epoch": 2477} {"train_loss": -12.560661315917969, "global_step": 416229, "epoch": 2477} {"train_loss": -12.718818664550781, "global_step": 416230, "epoch": 2477} {"train_loss": -12.39821720123291, "global_step": 416231, "epoch": 2477} {"train_loss": -12.538599967956543, "global_step": 416232, "epoch": 2477} {"train_loss": -12.805032730102539, "global_step": 416233, "epoch": 2477} {"train_loss": -12.596040725708008, "global_step": 416234, "epoch": 2477} {"train_loss": -12.731040954589844, "global_step": 416235, "epoch": 2477} {"train_loss": -12.52335262298584, "global_step": 416236, "epoch": 2477} {"train_loss": -12.948942184448242, "global_step": 416237, "epoch": 2477} {"train_loss": -12.478131294250488, "global_step": 416238, "epoch": 2477} {"train_loss": -12.47559928894043, "global_step": 416239, "epoch": 2477} {"train_loss": -11.917583465576172, "global_step": 416240, "epoch": 2477} {"train_loss": -12.121106147766113, "global_step": 416241, "epoch": 2477} {"train_loss": -12.05320930480957, "global_step": 416242, "epoch": 2477} {"train_loss": -12.31993293762207, "global_step": 416243, "epoch": 2477} {"train_loss": -12.620967864990234, "global_step": 416244, "epoch": 2477} {"train_loss": -11.68720817565918, "global_step": 416245, "epoch": 2477} {"train_loss": -12.805135726928711, "global_step": 416246, "epoch": 2477} {"train_loss": -11.365485191345215, "global_step": 416247, "epoch": 2477} {"train_loss": -10.150871276855469, "global_step": 416248, "epoch": 2477} {"train_loss": -11.146536827087402, "global_step": 416249, "epoch": 2477} {"train_loss": -11.453760147094727, "global_step": 416250, "epoch": 2477} {"train_loss": -9.910079002380371, "global_step": 416251, "epoch": 2477} {"train_loss": -9.410255432128906, "global_step": 416252, "epoch": 2477} {"train_loss": -9.445959091186523, "global_step": 416253, "epoch": 2477} {"train_loss": -10.494911193847656, "global_step": 416254, "epoch": 2477} {"train_loss": -10.048032760620117, "global_step": 416255, "epoch": 2477} {"train_loss": -9.764785766601562, "global_step": 416256, "epoch": 2477} {"train_loss": -10.485321044921875, "global_step": 416257, "epoch": 2477} {"train_loss": -10.482588768005371, "global_step": 416258, "epoch": 2477} {"train_loss": -10.949807167053223, "global_step": 416259, "epoch": 2477} {"train_loss": -10.573477745056152, "global_step": 416260, "epoch": 2477} {"train_loss": -11.274338722229004, "global_step": 416261, "epoch": 2477} {"train_loss": -11.465848922729492, "global_step": 416262, "epoch": 2477} {"train_loss": -11.511917114257812, "global_step": 416263, "epoch": 2477} {"train_loss": -11.125439643859863, "global_step": 416264, "epoch": 2477} {"train_loss": -11.400840759277344, "global_step": 416265, "epoch": 2477} {"train_loss": -11.102885246276855, "global_step": 416266, "epoch": 2477} {"train_loss": -10.568343162536621, "global_step": 416267, "epoch": 2477} {"train_loss": -9.599372863769531, "global_step": 416268, "epoch": 2477} {"train_loss": -8.128213882446289, "global_step": 416269, "epoch": 2477} {"train_loss": -10.601699829101562, "global_step": 416270, "epoch": 2477} {"train_loss": -10.17895221710205, "global_step": 416271, "epoch": 2477} {"train_loss": -9.03823471069336, "global_step": 416272, "epoch": 2477} {"train_loss": -9.029632568359375, "global_step": 416273, "epoch": 2477} {"train_loss": -9.038764953613281, "global_step": 416274, "epoch": 2477} {"train_loss": -9.128917694091797, "global_step": 416275, "epoch": 2477} {"train_loss": -10.608506202697754, "global_step": 416276, "epoch": 2477} {"train_loss": -8.442115783691406, "global_step": 416277, "epoch": 2477} {"train_loss": -10.260734558105469, "global_step": 416278, "epoch": 2477} {"train_loss": -10.832064628601074, "global_step": 416279, "epoch": 2477} {"train_loss": -9.663117408752441, "global_step": 416280, "epoch": 2477} {"train_loss": -9.506647109985352, "global_step": 416281, "epoch": 2477} {"train_loss": -9.624190330505371, "global_step": 416282, "epoch": 2477} {"train_loss": -9.362184524536133, "global_step": 416283, "epoch": 2477} {"train_loss": -11.47451400756836, "global_step": 416284, "epoch": 2477} {"train_loss": -9.947305679321289, "global_step": 416285, "epoch": 2477} {"train_loss": -10.882951736450195, "global_step": 416286, "epoch": 2477} {"train_loss": -11.279488563537598, "global_step": 416287, "epoch": 2477} {"train_loss": -10.905745506286621, "global_step": 416288, "epoch": 2477} {"train_loss": -10.45468521118164, "global_step": 416289, "epoch": 2477} {"train_loss": -10.524735450744629, "global_step": 416290, "epoch": 2477} {"train_loss": -11.519721984863281, "global_step": 416291, "epoch": 2477} {"train_loss": -10.353891372680664, "global_step": 416292, "epoch": 2477} {"train_loss": -11.183890342712402, "global_step": 416293, "epoch": 2477} {"train_loss": -11.723514556884766, "global_step": 416294, "epoch": 2477} {"train_loss": -10.817142486572266, "global_step": 416295, "epoch": 2477} {"train_loss": -11.318197250366211, "global_step": 416296, "epoch": 2477} {"train_loss": -11.022884368896484, "global_step": 416297, "epoch": 2477} {"train_loss": -10.19131851196289, "global_step": 416298, "epoch": 2477} {"train_loss": -12.11638069152832, "global_step": 416299, "epoch": 2477} {"train_loss": -10.582809448242188, "global_step": 416300, "epoch": 2477} {"train_loss": -11.827476501464844, "global_step": 416301, "epoch": 2477} {"train_loss": -11.48861312866211, "global_step": 416302, "epoch": 2477} {"train_loss": -11.742097519692921, "global_step": 416303, "epoch": 2477, "val_loss": 302795.9375} {"train_loss": -11.988656997680664, "global_step": 416304, "epoch": 2478} {"train_loss": -11.807762145996094, "global_step": 416305, "epoch": 2478} {"train_loss": -11.674640655517578, "global_step": 416306, "epoch": 2478} {"train_loss": -12.216312408447266, "global_step": 416307, "epoch": 2478} {"train_loss": -11.985283851623535, "global_step": 416308, "epoch": 2478} {"train_loss": -11.845253944396973, "global_step": 416309, "epoch": 2478} {"train_loss": -12.10075569152832, "global_step": 416310, "epoch": 2478} {"train_loss": -11.939059257507324, "global_step": 416311, "epoch": 2478} {"train_loss": -11.951098442077637, "global_step": 416312, "epoch": 2478} {"train_loss": -12.409640312194824, "global_step": 416313, "epoch": 2478} {"train_loss": -12.025322914123535, "global_step": 416314, "epoch": 2478} {"train_loss": -12.164029121398926, "global_step": 416315, "epoch": 2478} {"train_loss": -12.105548858642578, "global_step": 416316, "epoch": 2478} {"train_loss": -11.97939395904541, "global_step": 416317, "epoch": 2478} {"train_loss": -12.154529571533203, "global_step": 416318, "epoch": 2478} {"train_loss": -12.321330070495605, "global_step": 416319, "epoch": 2478} {"train_loss": -12.020463943481445, "global_step": 416320, "epoch": 2478} {"train_loss": -11.901576042175293, "global_step": 416321, "epoch": 2478} {"train_loss": -12.216144561767578, "global_step": 416322, "epoch": 2478} {"train_loss": -11.864059448242188, "global_step": 416323, "epoch": 2478} {"train_loss": -12.421424865722656, "global_step": 416324, "epoch": 2478} {"train_loss": -12.064664840698242, "global_step": 416325, "epoch": 2478} {"train_loss": -12.273513793945312, "global_step": 416326, "epoch": 2478} {"train_loss": -12.330629348754883, "global_step": 416327, "epoch": 2478} {"train_loss": -12.095088005065918, "global_step": 416328, "epoch": 2478} {"train_loss": -12.309261322021484, "global_step": 416329, "epoch": 2478} {"train_loss": -12.323966979980469, "global_step": 416330, "epoch": 2478} {"train_loss": -12.447603225708008, "global_step": 416331, "epoch": 2478} {"train_loss": -12.251730918884277, "global_step": 416332, "epoch": 2478} {"train_loss": -12.356989860534668, "global_step": 416333, "epoch": 2478} {"train_loss": -12.137033462524414, "global_step": 416334, "epoch": 2478} {"train_loss": -12.552031517028809, "global_step": 416335, "epoch": 2478} {"train_loss": -12.319562911987305, "global_step": 416336, "epoch": 2478} {"train_loss": -12.530160903930664, "global_step": 416337, "epoch": 2478} {"train_loss": -12.39935302734375, "global_step": 416338, "epoch": 2478} {"train_loss": -12.398025512695312, "global_step": 416339, "epoch": 2478} {"train_loss": -12.526443481445312, "global_step": 416340, "epoch": 2478} {"train_loss": -12.51181411743164, "global_step": 416341, "epoch": 2478} {"train_loss": -12.455504417419434, "global_step": 416342, "epoch": 2478} {"train_loss": -12.514814376831055, "global_step": 416343, "epoch": 2478} {"train_loss": -12.26429557800293, "global_step": 416344, "epoch": 2478} {"train_loss": -12.515435218811035, "global_step": 416345, "epoch": 2478} {"train_loss": -12.392650604248047, "global_step": 416346, "epoch": 2478} {"train_loss": -12.561967849731445, "global_step": 416347, "epoch": 2478} {"train_loss": -12.568952560424805, "global_step": 416348, "epoch": 2478} {"train_loss": -12.277410507202148, "global_step": 416349, "epoch": 2478} {"train_loss": -12.548893928527832, "global_step": 416350, "epoch": 2478} {"train_loss": -12.640247344970703, "global_step": 416351, "epoch": 2478} {"train_loss": -12.412590026855469, "global_step": 416352, "epoch": 2478} {"train_loss": -12.352860450744629, "global_step": 416353, "epoch": 2478} {"train_loss": -12.410563468933105, "global_step": 416354, "epoch": 2478} {"train_loss": -12.452299118041992, "global_step": 416355, "epoch": 2478} {"train_loss": -12.70523452758789, "global_step": 416356, "epoch": 2478} {"train_loss": -12.60611629486084, "global_step": 416357, "epoch": 2478} {"train_loss": -12.543622970581055, "global_step": 416358, "epoch": 2478} {"train_loss": -12.62730598449707, "global_step": 416359, "epoch": 2478} {"train_loss": -12.815759658813477, "global_step": 416360, "epoch": 2478} {"train_loss": -12.58896255493164, "global_step": 416361, "epoch": 2478} {"train_loss": -12.607107162475586, "global_step": 416362, "epoch": 2478} {"train_loss": -12.574577331542969, "global_step": 416363, "epoch": 2478} {"train_loss": -12.72702693939209, "global_step": 416364, "epoch": 2478} {"train_loss": -12.540885925292969, "global_step": 416365, "epoch": 2478} {"train_loss": -12.673338890075684, "global_step": 416366, "epoch": 2478} {"train_loss": -12.673288345336914, "global_step": 416367, "epoch": 2478} {"train_loss": -12.735673904418945, "global_step": 416368, "epoch": 2478} {"train_loss": -12.728456497192383, "global_step": 416369, "epoch": 2478} {"train_loss": -12.787384033203125, "global_step": 416370, "epoch": 2478} {"train_loss": -12.610705375671387, "global_step": 416371, "epoch": 2478} {"train_loss": -12.663634300231934, "global_step": 416372, "epoch": 2478} {"train_loss": -12.684600830078125, "global_step": 416373, "epoch": 2478} {"train_loss": -12.696235656738281, "global_step": 416374, "epoch": 2478} {"train_loss": -12.627198219299316, "global_step": 416375, "epoch": 2478} {"train_loss": -12.510839462280273, "global_step": 416376, "epoch": 2478} {"train_loss": -12.766109466552734, "global_step": 416377, "epoch": 2478} {"train_loss": -12.679877281188965, "global_step": 416378, "epoch": 2478} {"train_loss": -12.685901641845703, "global_step": 416379, "epoch": 2478} {"train_loss": -12.647782325744629, "global_step": 416380, "epoch": 2478} {"train_loss": -12.472951889038086, "global_step": 416381, "epoch": 2478} {"train_loss": -12.687644958496094, "global_step": 416382, "epoch": 2478} {"train_loss": -12.70595645904541, "global_step": 416383, "epoch": 2478} {"train_loss": -12.768959045410156, "global_step": 416384, "epoch": 2478} {"train_loss": -12.731375694274902, "global_step": 416385, "epoch": 2478} {"train_loss": -12.74905014038086, "global_step": 416386, "epoch": 2478} {"train_loss": -12.654339790344238, "global_step": 416387, "epoch": 2478} {"train_loss": -12.833013534545898, "global_step": 416388, "epoch": 2478} {"train_loss": -12.673733711242676, "global_step": 416389, "epoch": 2478} {"train_loss": -12.946842193603516, "global_step": 416390, "epoch": 2478} {"train_loss": -12.755878448486328, "global_step": 416391, "epoch": 2478} {"train_loss": -12.614021301269531, "global_step": 416392, "epoch": 2478} {"train_loss": -12.603377342224121, "global_step": 416393, "epoch": 2478} {"train_loss": -12.57989501953125, "global_step": 416394, "epoch": 2478} {"train_loss": -12.654970169067383, "global_step": 416395, "epoch": 2478} {"train_loss": -12.792253494262695, "global_step": 416396, "epoch": 2478} {"train_loss": -12.654794692993164, "global_step": 416397, "epoch": 2478} {"train_loss": -12.673473358154297, "global_step": 416398, "epoch": 2478} {"train_loss": -12.773017883300781, "global_step": 416399, "epoch": 2478} {"train_loss": -12.717690467834473, "global_step": 416400, "epoch": 2478} {"train_loss": -12.775867462158203, "global_step": 416401, "epoch": 2478} {"train_loss": -12.677370071411133, "global_step": 416402, "epoch": 2478} {"train_loss": -12.565617561340332, "global_step": 416403, "epoch": 2478} {"train_loss": -12.673733711242676, "global_step": 416404, "epoch": 2478} {"train_loss": -12.81277084350586, "global_step": 416405, "epoch": 2478} {"train_loss": -12.771114349365234, "global_step": 416406, "epoch": 2478} {"train_loss": -12.759927749633789, "global_step": 416407, "epoch": 2478} {"train_loss": -12.762077331542969, "global_step": 416408, "epoch": 2478} {"train_loss": -12.67147445678711, "global_step": 416409, "epoch": 2478} {"train_loss": -12.55827808380127, "global_step": 416410, "epoch": 2478} {"train_loss": -12.386945724487305, "global_step": 416411, "epoch": 2478} {"train_loss": -12.674694061279297, "global_step": 416412, "epoch": 2478} {"train_loss": -12.594371795654297, "global_step": 416413, "epoch": 2478} {"train_loss": -12.1925048828125, "global_step": 416414, "epoch": 2478} {"train_loss": -12.479713439941406, "global_step": 416415, "epoch": 2478} {"train_loss": -12.521652221679688, "global_step": 416416, "epoch": 2478} {"train_loss": -12.284579277038574, "global_step": 416417, "epoch": 2478} {"train_loss": -12.379411697387695, "global_step": 416418, "epoch": 2478} {"train_loss": -12.017173767089844, "global_step": 416419, "epoch": 2478} {"train_loss": -11.507217407226562, "global_step": 416420, "epoch": 2478} {"train_loss": -11.837259292602539, "global_step": 416421, "epoch": 2478} {"train_loss": -12.269929885864258, "global_step": 416422, "epoch": 2478} {"train_loss": -12.15937328338623, "global_step": 416423, "epoch": 2478} {"train_loss": -11.816032409667969, "global_step": 416424, "epoch": 2478} {"train_loss": -12.588813781738281, "global_step": 416425, "epoch": 2478} {"train_loss": -12.360187530517578, "global_step": 416426, "epoch": 2478} {"train_loss": -11.73861312866211, "global_step": 416427, "epoch": 2478} {"train_loss": -11.34394645690918, "global_step": 416428, "epoch": 2478} {"train_loss": -11.104328155517578, "global_step": 416429, "epoch": 2478} {"train_loss": -11.69887638092041, "global_step": 416430, "epoch": 2478} {"train_loss": -9.026124954223633, "global_step": 416431, "epoch": 2478} {"train_loss": -9.083464622497559, "global_step": 416432, "epoch": 2478} {"train_loss": -8.339167594909668, "global_step": 416433, "epoch": 2478} {"train_loss": -9.859740257263184, "global_step": 416434, "epoch": 2478} {"train_loss": -8.762984275817871, "global_step": 416435, "epoch": 2478} {"train_loss": -9.69753646850586, "global_step": 416436, "epoch": 2478} {"train_loss": -11.17839241027832, "global_step": 416437, "epoch": 2478} {"train_loss": -10.917706489562988, "global_step": 416438, "epoch": 2478} {"train_loss": -11.068161010742188, "global_step": 416439, "epoch": 2478} {"train_loss": -11.043521881103516, "global_step": 416440, "epoch": 2478} {"train_loss": -11.113195419311523, "global_step": 416441, "epoch": 2478} {"train_loss": -10.765373229980469, "global_step": 416442, "epoch": 2478} {"train_loss": -10.617569923400879, "global_step": 416443, "epoch": 2478} {"train_loss": -11.005361557006836, "global_step": 416444, "epoch": 2478} {"train_loss": -10.550636291503906, "global_step": 416445, "epoch": 2478} {"train_loss": -11.247293472290039, "global_step": 416446, "epoch": 2478} {"train_loss": -11.619800567626953, "global_step": 416447, "epoch": 2478} {"train_loss": -11.030912399291992, "global_step": 416448, "epoch": 2478} {"train_loss": -11.256094932556152, "global_step": 416449, "epoch": 2478} {"train_loss": -11.433319091796875, "global_step": 416450, "epoch": 2478} {"train_loss": -11.893021583557129, "global_step": 416451, "epoch": 2478} {"train_loss": -10.703756332397461, "global_step": 416452, "epoch": 2478} {"train_loss": -11.625961303710938, "global_step": 416453, "epoch": 2478} {"train_loss": -11.656244277954102, "global_step": 416454, "epoch": 2478} {"train_loss": -11.595182418823242, "global_step": 416455, "epoch": 2478} {"train_loss": -11.775688171386719, "global_step": 416456, "epoch": 2478} {"train_loss": -11.805474281311035, "global_step": 416457, "epoch": 2478} {"train_loss": -12.111854553222656, "global_step": 416458, "epoch": 2478} {"train_loss": -11.887723922729492, "global_step": 416459, "epoch": 2478} {"train_loss": -11.628442764282227, "global_step": 416460, "epoch": 2478} {"train_loss": -11.217819213867188, "global_step": 416461, "epoch": 2478} {"train_loss": -11.850419998168945, "global_step": 416462, "epoch": 2478} {"train_loss": -11.56486701965332, "global_step": 416463, "epoch": 2478} {"train_loss": -12.182340621948242, "global_step": 416464, "epoch": 2478} {"train_loss": -11.57861328125, "global_step": 416465, "epoch": 2478} {"train_loss": -12.20022964477539, "global_step": 416466, "epoch": 2478} {"train_loss": -11.75108528137207, "global_step": 416467, "epoch": 2478} {"train_loss": -12.099347114562988, "global_step": 416468, "epoch": 2478} {"train_loss": -11.941619873046875, "global_step": 416469, "epoch": 2478} {"train_loss": -12.002659797668457, "global_step": 416470, "epoch": 2478} {"train_loss": -12.104809800783793, "global_step": 416471, "epoch": 2478, "val_loss": 302362.90625} {"train_loss": -11.914571762084961, "global_step": 416472, "epoch": 2479} {"train_loss": -12.299606323242188, "global_step": 416473, "epoch": 2479} {"train_loss": -12.281570434570312, "global_step": 416474, "epoch": 2479} {"train_loss": -12.109259605407715, "global_step": 416475, "epoch": 2479} {"train_loss": -12.159728050231934, "global_step": 416476, "epoch": 2479} {"train_loss": -12.33958625793457, "global_step": 416477, "epoch": 2479} {"train_loss": -12.00125503540039, "global_step": 416478, "epoch": 2479} {"train_loss": -12.417657852172852, "global_step": 416479, "epoch": 2479} {"train_loss": -12.481555938720703, "global_step": 416480, "epoch": 2479} {"train_loss": -12.132274627685547, "global_step": 416481, "epoch": 2479} {"train_loss": -12.307244300842285, "global_step": 416482, "epoch": 2479} {"train_loss": -12.304966926574707, "global_step": 416483, "epoch": 2479} {"train_loss": -12.345511436462402, "global_step": 416484, "epoch": 2479} {"train_loss": -12.194823265075684, "global_step": 416485, "epoch": 2479} {"train_loss": -12.296987533569336, "global_step": 416486, "epoch": 2479} {"train_loss": -12.3579740524292, "global_step": 416487, "epoch": 2479} {"train_loss": -12.22287368774414, "global_step": 416488, "epoch": 2479} {"train_loss": -12.351373672485352, "global_step": 416489, "epoch": 2479} {"train_loss": -12.140312194824219, "global_step": 416490, "epoch": 2479} {"train_loss": -12.519430160522461, "global_step": 416491, "epoch": 2479} {"train_loss": -12.173640251159668, "global_step": 416492, "epoch": 2479} {"train_loss": -12.220064163208008, "global_step": 416493, "epoch": 2479} {"train_loss": -11.784058570861816, "global_step": 416494, "epoch": 2479} {"train_loss": -12.226981163024902, "global_step": 416495, "epoch": 2479} {"train_loss": -12.287622451782227, "global_step": 416496, "epoch": 2479} {"train_loss": -12.017132759094238, "global_step": 416497, "epoch": 2479} {"train_loss": -12.228912353515625, "global_step": 416498, "epoch": 2479} {"train_loss": -12.311360359191895, "global_step": 416499, "epoch": 2479} {"train_loss": -12.782012939453125, "global_step": 416500, "epoch": 2479} {"train_loss": -12.507465362548828, "global_step": 416501, "epoch": 2479} {"train_loss": -12.575104713439941, "global_step": 416502, "epoch": 2479} {"train_loss": -12.62939453125, "global_step": 416503, "epoch": 2479} {"train_loss": -12.437490463256836, "global_step": 416504, "epoch": 2479} {"train_loss": -12.538246154785156, "global_step": 416505, "epoch": 2479} {"train_loss": -12.739250183105469, "global_step": 416506, "epoch": 2479} {"train_loss": -12.367030143737793, "global_step": 416507, "epoch": 2479} {"train_loss": -12.656795501708984, "global_step": 416508, "epoch": 2479} {"train_loss": -12.36240005493164, "global_step": 416509, "epoch": 2479} {"train_loss": -12.483392715454102, "global_step": 416510, "epoch": 2479} {"train_loss": -12.484752655029297, "global_step": 416511, "epoch": 2479} {"train_loss": -12.400873184204102, "global_step": 416512, "epoch": 2479} {"train_loss": -12.401040077209473, "global_step": 416513, "epoch": 2479} {"train_loss": -12.36227035522461, "global_step": 416514, "epoch": 2479} {"train_loss": -12.553520202636719, "global_step": 416515, "epoch": 2479} {"train_loss": -12.371089935302734, "global_step": 416516, "epoch": 2479} {"train_loss": -12.385815620422363, "global_step": 416517, "epoch": 2479} {"train_loss": -12.415243148803711, "global_step": 416518, "epoch": 2479} {"train_loss": -12.66309928894043, "global_step": 416519, "epoch": 2479} {"train_loss": -12.846529006958008, "global_step": 416520, "epoch": 2479} {"train_loss": -12.595033645629883, "global_step": 416521, "epoch": 2479} {"train_loss": -12.761303901672363, "global_step": 416522, "epoch": 2479} {"train_loss": -12.820123672485352, "global_step": 416523, "epoch": 2479} {"train_loss": -12.513988494873047, "global_step": 416524, "epoch": 2479} {"train_loss": -12.701969146728516, "global_step": 416525, "epoch": 2479} {"train_loss": -12.729894638061523, "global_step": 416526, "epoch": 2479} {"train_loss": -12.497424125671387, "global_step": 416527, "epoch": 2479} {"train_loss": -12.541792869567871, "global_step": 416528, "epoch": 2479} {"train_loss": -12.952431678771973, "global_step": 416529, "epoch": 2479} {"train_loss": -12.677030563354492, "global_step": 416530, "epoch": 2479} {"train_loss": -12.539175987243652, "global_step": 416531, "epoch": 2479} {"train_loss": -12.650794982910156, "global_step": 416532, "epoch": 2479} {"train_loss": -12.850448608398438, "global_step": 416533, "epoch": 2479} {"train_loss": -12.659473419189453, "global_step": 416534, "epoch": 2479} {"train_loss": -12.257200241088867, "global_step": 416535, "epoch": 2479} {"train_loss": -12.709794998168945, "global_step": 416536, "epoch": 2479} {"train_loss": -12.924713134765625, "global_step": 416537, "epoch": 2479} {"train_loss": -12.703857421875, "global_step": 416538, "epoch": 2479} {"train_loss": -12.70598030090332, "global_step": 416539, "epoch": 2479} {"train_loss": -12.917699813842773, "global_step": 416540, "epoch": 2479} {"train_loss": -12.941848754882812, "global_step": 416541, "epoch": 2479} {"train_loss": -12.589714050292969, "global_step": 416542, "epoch": 2479} {"train_loss": -12.98779010772705, "global_step": 416543, "epoch": 2479} {"train_loss": -12.807010650634766, "global_step": 416544, "epoch": 2479} {"train_loss": -12.697681427001953, "global_step": 416545, "epoch": 2479} {"train_loss": -12.683905601501465, "global_step": 416546, "epoch": 2479} {"train_loss": -12.879831314086914, "global_step": 416547, "epoch": 2479} {"train_loss": -12.98465347290039, "global_step": 416548, "epoch": 2479} {"train_loss": -12.56930923461914, "global_step": 416549, "epoch": 2479} {"train_loss": -12.40048599243164, "global_step": 416550, "epoch": 2479} {"train_loss": -12.457192420959473, "global_step": 416551, "epoch": 2479} {"train_loss": -12.491964340209961, "global_step": 416552, "epoch": 2479} {"train_loss": -12.730523109436035, "global_step": 416553, "epoch": 2479} {"train_loss": -12.894901275634766, "global_step": 416554, "epoch": 2479} {"train_loss": -12.887847900390625, "global_step": 416555, "epoch": 2479} {"train_loss": -12.718646049499512, "global_step": 416556, "epoch": 2479} {"train_loss": -12.946697235107422, "global_step": 416557, "epoch": 2479} {"train_loss": -12.52813720703125, "global_step": 416558, "epoch": 2479} {"train_loss": -12.44035816192627, "global_step": 416559, "epoch": 2479} {"train_loss": -12.602774620056152, "global_step": 416560, "epoch": 2479} {"train_loss": -12.40247917175293, "global_step": 416561, "epoch": 2479} {"train_loss": -12.432304382324219, "global_step": 416562, "epoch": 2479} {"train_loss": -12.269824981689453, "global_step": 416563, "epoch": 2479} {"train_loss": -12.7510404586792, "global_step": 416564, "epoch": 2479} {"train_loss": -12.341808319091797, "global_step": 416565, "epoch": 2479} {"train_loss": -11.691930770874023, "global_step": 416566, "epoch": 2479} {"train_loss": -12.331873893737793, "global_step": 416567, "epoch": 2479} {"train_loss": -12.041290283203125, "global_step": 416568, "epoch": 2479} {"train_loss": -12.143627166748047, "global_step": 416569, "epoch": 2479} {"train_loss": -12.347537994384766, "global_step": 416570, "epoch": 2479} {"train_loss": -11.86968994140625, "global_step": 416571, "epoch": 2479} {"train_loss": -12.469952583312988, "global_step": 416572, "epoch": 2479} {"train_loss": -11.440380096435547, "global_step": 416573, "epoch": 2479} {"train_loss": -10.478455543518066, "global_step": 416574, "epoch": 2479} {"train_loss": -11.493885040283203, "global_step": 416575, "epoch": 2479} {"train_loss": -12.045639991760254, "global_step": 416576, "epoch": 2479} {"train_loss": -11.44494915008545, "global_step": 416577, "epoch": 2479} {"train_loss": -12.427118301391602, "global_step": 416578, "epoch": 2479} {"train_loss": -11.471463203430176, "global_step": 416579, "epoch": 2479} {"train_loss": -11.969724655151367, "global_step": 416580, "epoch": 2479} {"train_loss": -10.971685409545898, "global_step": 416581, "epoch": 2479} {"train_loss": -9.969596862792969, "global_step": 416582, "epoch": 2479} {"train_loss": -11.254653930664062, "global_step": 416583, "epoch": 2479} {"train_loss": -9.331029891967773, "global_step": 416584, "epoch": 2479} {"train_loss": -8.9442138671875, "global_step": 416585, "epoch": 2479} {"train_loss": -11.675664901733398, "global_step": 416586, "epoch": 2479} {"train_loss": -9.887678146362305, "global_step": 416587, "epoch": 2479} {"train_loss": -8.70372486114502, "global_step": 416588, "epoch": 2479} {"train_loss": -9.14968490600586, "global_step": 416589, "epoch": 2479} {"train_loss": -9.850763320922852, "global_step": 416590, "epoch": 2479} {"train_loss": -10.514842987060547, "global_step": 416591, "epoch": 2479} {"train_loss": -9.309385299682617, "global_step": 416592, "epoch": 2479} {"train_loss": -10.822615623474121, "global_step": 416593, "epoch": 2479} {"train_loss": -10.892569541931152, "global_step": 416594, "epoch": 2479} {"train_loss": -11.420997619628906, "global_step": 416595, "epoch": 2479} {"train_loss": -9.98585319519043, "global_step": 416596, "epoch": 2479} {"train_loss": -9.617673873901367, "global_step": 416597, "epoch": 2479} {"train_loss": -10.895341873168945, "global_step": 416598, "epoch": 2479} {"train_loss": -10.426877975463867, "global_step": 416599, "epoch": 2479} {"train_loss": -10.10891342163086, "global_step": 416600, "epoch": 2479} {"train_loss": -10.855833053588867, "global_step": 416601, "epoch": 2479} {"train_loss": -11.033563613891602, "global_step": 416602, "epoch": 2479} {"train_loss": -11.275070190429688, "global_step": 416603, "epoch": 2479} {"train_loss": -11.362689971923828, "global_step": 416604, "epoch": 2479} {"train_loss": -10.98762035369873, "global_step": 416605, "epoch": 2479} {"train_loss": -11.456600189208984, "global_step": 416606, "epoch": 2479} {"train_loss": -10.904541015625, "global_step": 416607, "epoch": 2479} {"train_loss": -11.410316467285156, "global_step": 416608, "epoch": 2479} {"train_loss": -9.947429656982422, "global_step": 416609, "epoch": 2479} {"train_loss": -9.759699821472168, "global_step": 416610, "epoch": 2479} {"train_loss": -11.309679985046387, "global_step": 416611, "epoch": 2479} {"train_loss": -9.441815376281738, "global_step": 416612, "epoch": 2479} {"train_loss": -8.93115520477295, "global_step": 416613, "epoch": 2479} {"train_loss": -10.648702621459961, "global_step": 416614, "epoch": 2479} {"train_loss": -10.509499549865723, "global_step": 416615, "epoch": 2479} {"train_loss": -9.459268569946289, "global_step": 416616, "epoch": 2479} {"train_loss": -10.672201156616211, "global_step": 416617, "epoch": 2479} {"train_loss": -11.41598892211914, "global_step": 416618, "epoch": 2479} {"train_loss": -10.363079071044922, "global_step": 416619, "epoch": 2479} {"train_loss": -10.945382118225098, "global_step": 416620, "epoch": 2479} {"train_loss": -10.983585357666016, "global_step": 416621, "epoch": 2479} {"train_loss": -10.685314178466797, "global_step": 416622, "epoch": 2479} {"train_loss": -10.688940048217773, "global_step": 416623, "epoch": 2479} {"train_loss": -10.592779159545898, "global_step": 416624, "epoch": 2479} {"train_loss": -10.793864250183105, "global_step": 416625, "epoch": 2479} {"train_loss": -10.941305160522461, "global_step": 416626, "epoch": 2479} {"train_loss": -11.274991989135742, "global_step": 416627, "epoch": 2479} {"train_loss": -10.834716796875, "global_step": 416628, "epoch": 2479} {"train_loss": -11.919501304626465, "global_step": 416629, "epoch": 2479} {"train_loss": -11.460485458374023, "global_step": 416630, "epoch": 2479} {"train_loss": -11.375772476196289, "global_step": 416631, "epoch": 2479} {"train_loss": -11.640222549438477, "global_step": 416632, "epoch": 2479} {"train_loss": -10.984868049621582, "global_step": 416633, "epoch": 2479} {"train_loss": -11.128310203552246, "global_step": 416634, "epoch": 2479} {"train_loss": -11.75422477722168, "global_step": 416635, "epoch": 2479} {"train_loss": -10.750301361083984, "global_step": 416636, "epoch": 2479} {"train_loss": -11.722867965698242, "global_step": 416637, "epoch": 2479} {"train_loss": -11.800040245056152, "global_step": 416638, "epoch": 2479} {"train_loss": -11.798543197768074, "global_step": 416639, "epoch": 2479, "val_loss": 303078.25} {"train_loss": -11.445557594299316, "global_step": 416640, "epoch": 2480} {"train_loss": -11.726600646972656, "global_step": 416641, "epoch": 2480} {"train_loss": -11.453540802001953, "global_step": 416642, "epoch": 2480} {"train_loss": -11.97085952758789, "global_step": 416643, "epoch": 2480} {"train_loss": -11.817619323730469, "global_step": 416644, "epoch": 2480} {"train_loss": -11.803318977355957, "global_step": 416645, "epoch": 2480} {"train_loss": -12.335535049438477, "global_step": 416646, "epoch": 2480} {"train_loss": -11.764098167419434, "global_step": 416647, "epoch": 2480} {"train_loss": -11.815759658813477, "global_step": 416648, "epoch": 2480} {"train_loss": -12.054119110107422, "global_step": 416649, "epoch": 2480} {"train_loss": -11.60017204284668, "global_step": 416650, "epoch": 2480} {"train_loss": -12.063390731811523, "global_step": 416651, "epoch": 2480} {"train_loss": -12.054069519042969, "global_step": 416652, "epoch": 2480} {"train_loss": -11.782082557678223, "global_step": 416653, "epoch": 2480} {"train_loss": -12.108375549316406, "global_step": 416654, "epoch": 2480} {"train_loss": -11.772268295288086, "global_step": 416655, "epoch": 2480} {"train_loss": -12.29802131652832, "global_step": 416656, "epoch": 2480} {"train_loss": -12.129780769348145, "global_step": 416657, "epoch": 2480} {"train_loss": -12.042521476745605, "global_step": 416658, "epoch": 2480} {"train_loss": -12.2999267578125, "global_step": 416659, "epoch": 2480} {"train_loss": -12.243293762207031, "global_step": 416660, "epoch": 2480} {"train_loss": -12.136968612670898, "global_step": 416661, "epoch": 2480} {"train_loss": -12.166997909545898, "global_step": 416662, "epoch": 2480} {"train_loss": -12.307506561279297, "global_step": 416663, "epoch": 2480} {"train_loss": -12.329845428466797, "global_step": 416664, "epoch": 2480} {"train_loss": -12.424383163452148, "global_step": 416665, "epoch": 2480} {"train_loss": -12.239458084106445, "global_step": 416666, "epoch": 2480} {"train_loss": -12.653482437133789, "global_step": 416667, "epoch": 2480} {"train_loss": -12.484237670898438, "global_step": 416668, "epoch": 2480} {"train_loss": -12.228959083557129, "global_step": 416669, "epoch": 2480} {"train_loss": -12.429682731628418, "global_step": 416670, "epoch": 2480} {"train_loss": -12.401754379272461, "global_step": 416671, "epoch": 2480} {"train_loss": -12.457117080688477, "global_step": 416672, "epoch": 2480} {"train_loss": -12.399240493774414, "global_step": 416673, "epoch": 2480} {"train_loss": -12.37391471862793, "global_step": 416674, "epoch": 2480} {"train_loss": -12.456298828125, "global_step": 416675, "epoch": 2480} {"train_loss": -12.569372177124023, "global_step": 416676, "epoch": 2480} {"train_loss": -12.53768253326416, "global_step": 416677, "epoch": 2480} {"train_loss": -12.515162467956543, "global_step": 416678, "epoch": 2480} {"train_loss": -12.512104034423828, "global_step": 416679, "epoch": 2480} {"train_loss": -12.360517501831055, "global_step": 416680, "epoch": 2480} {"train_loss": -12.480993270874023, "global_step": 416681, "epoch": 2480} {"train_loss": -12.590019226074219, "global_step": 416682, "epoch": 2480} {"train_loss": -12.555755615234375, "global_step": 416683, "epoch": 2480} {"train_loss": -12.435612678527832, "global_step": 416684, "epoch": 2480} {"train_loss": -12.345746994018555, "global_step": 416685, "epoch": 2480} {"train_loss": -12.575799942016602, "global_step": 416686, "epoch": 2480} {"train_loss": -12.542266845703125, "global_step": 416687, "epoch": 2480} {"train_loss": -12.698932647705078, "global_step": 416688, "epoch": 2480} {"train_loss": -12.540480613708496, "global_step": 416689, "epoch": 2480} {"train_loss": -12.498250961303711, "global_step": 416690, "epoch": 2480} {"train_loss": -12.610944747924805, "global_step": 416691, "epoch": 2480} {"train_loss": -12.652944564819336, "global_step": 416692, "epoch": 2480} {"train_loss": -12.386723518371582, "global_step": 416693, "epoch": 2480} {"train_loss": -12.480062484741211, "global_step": 416694, "epoch": 2480} {"train_loss": -12.600200653076172, "global_step": 416695, "epoch": 2480} {"train_loss": -12.182608604431152, "global_step": 416696, "epoch": 2480} {"train_loss": -12.634214401245117, "global_step": 416697, "epoch": 2480} {"train_loss": -12.388989448547363, "global_step": 416698, "epoch": 2480} {"train_loss": -12.66097640991211, "global_step": 416699, "epoch": 2480} {"train_loss": -12.624755859375, "global_step": 416700, "epoch": 2480} {"train_loss": -12.681364059448242, "global_step": 416701, "epoch": 2480} {"train_loss": -12.776777267456055, "global_step": 416702, "epoch": 2480} {"train_loss": -12.603776931762695, "global_step": 416703, "epoch": 2480} {"train_loss": -12.593749046325684, "global_step": 416704, "epoch": 2480} {"train_loss": -12.634429931640625, "global_step": 416705, "epoch": 2480} {"train_loss": -12.531270980834961, "global_step": 416706, "epoch": 2480} {"train_loss": -12.623947143554688, "global_step": 416707, "epoch": 2480} {"train_loss": -12.712903022766113, "global_step": 416708, "epoch": 2480} {"train_loss": -12.638907432556152, "global_step": 416709, "epoch": 2480} {"train_loss": -12.785224914550781, "global_step": 416710, "epoch": 2480} {"train_loss": -12.666731834411621, "global_step": 416711, "epoch": 2480} {"train_loss": -12.82011890411377, "global_step": 416712, "epoch": 2480} {"train_loss": -12.553768157958984, "global_step": 416713, "epoch": 2480} {"train_loss": -12.48709487915039, "global_step": 416714, "epoch": 2480} {"train_loss": -12.56224250793457, "global_step": 416715, "epoch": 2480} {"train_loss": -12.528030395507812, "global_step": 416716, "epoch": 2480} {"train_loss": -12.612021446228027, "global_step": 416717, "epoch": 2480} {"train_loss": -12.154877662658691, "global_step": 416718, "epoch": 2480} {"train_loss": -11.99704360961914, "global_step": 416719, "epoch": 2480} {"train_loss": -12.878129005432129, "global_step": 416720, "epoch": 2480} {"train_loss": -12.298130989074707, "global_step": 416721, "epoch": 2480} {"train_loss": -12.509809494018555, "global_step": 416722, "epoch": 2480} {"train_loss": -12.347583770751953, "global_step": 416723, "epoch": 2480} {"train_loss": -12.434823036193848, "global_step": 416724, "epoch": 2480} {"train_loss": -12.380131721496582, "global_step": 416725, "epoch": 2480} {"train_loss": -12.647783279418945, "global_step": 416726, "epoch": 2480} {"train_loss": -12.41678237915039, "global_step": 416727, "epoch": 2480} {"train_loss": -12.74344253540039, "global_step": 416728, "epoch": 2480} {"train_loss": -12.679496765136719, "global_step": 416729, "epoch": 2480} {"train_loss": -12.596301078796387, "global_step": 416730, "epoch": 2480} {"train_loss": -12.464313507080078, "global_step": 416731, "epoch": 2480} {"train_loss": -12.580703735351562, "global_step": 416732, "epoch": 2480} {"train_loss": -12.597221374511719, "global_step": 416733, "epoch": 2480} {"train_loss": -12.768495559692383, "global_step": 416734, "epoch": 2480} {"train_loss": -12.544286727905273, "global_step": 416735, "epoch": 2480} {"train_loss": -12.486252784729004, "global_step": 416736, "epoch": 2480} {"train_loss": -12.40009880065918, "global_step": 416737, "epoch": 2480} {"train_loss": -12.110023498535156, "global_step": 416738, "epoch": 2480} {"train_loss": -12.532268524169922, "global_step": 416739, "epoch": 2480} {"train_loss": -12.67327880859375, "global_step": 416740, "epoch": 2480} {"train_loss": -12.587879180908203, "global_step": 416741, "epoch": 2480} {"train_loss": -12.530372619628906, "global_step": 416742, "epoch": 2480} {"train_loss": -12.296735763549805, "global_step": 416743, "epoch": 2480} {"train_loss": -12.479679107666016, "global_step": 416744, "epoch": 2480} {"train_loss": -12.517254829406738, "global_step": 416745, "epoch": 2480} {"train_loss": -12.199963569641113, "global_step": 416746, "epoch": 2480} {"train_loss": -12.619880676269531, "global_step": 416747, "epoch": 2480} {"train_loss": -12.597391128540039, "global_step": 416748, "epoch": 2480} {"train_loss": -12.770804405212402, "global_step": 416749, "epoch": 2480} {"train_loss": -12.41094970703125, "global_step": 416750, "epoch": 2480} {"train_loss": -12.871589660644531, "global_step": 416751, "epoch": 2480} {"train_loss": -12.419609069824219, "global_step": 416752, "epoch": 2480} {"train_loss": -12.628116607666016, "global_step": 416753, "epoch": 2480} {"train_loss": -12.232439041137695, "global_step": 416754, "epoch": 2480} {"train_loss": -12.668123245239258, "global_step": 416755, "epoch": 2480} {"train_loss": -12.479730606079102, "global_step": 416756, "epoch": 2480} {"train_loss": -12.443912506103516, "global_step": 416757, "epoch": 2480} {"train_loss": -12.309985160827637, "global_step": 416758, "epoch": 2480} {"train_loss": -12.170333862304688, "global_step": 416759, "epoch": 2480} {"train_loss": -12.105749130249023, "global_step": 416760, "epoch": 2480} {"train_loss": -12.245973587036133, "global_step": 416761, "epoch": 2480} {"train_loss": -10.797412872314453, "global_step": 416762, "epoch": 2480} {"train_loss": -11.859947204589844, "global_step": 416763, "epoch": 2480} {"train_loss": -12.632125854492188, "global_step": 416764, "epoch": 2480} {"train_loss": -12.501593589782715, "global_step": 416765, "epoch": 2480} {"train_loss": -11.757217407226562, "global_step": 416766, "epoch": 2480} {"train_loss": -12.621681213378906, "global_step": 416767, "epoch": 2480} {"train_loss": -10.937864303588867, "global_step": 416768, "epoch": 2480} {"train_loss": -11.719252586364746, "global_step": 416769, "epoch": 2480} {"train_loss": -11.279962539672852, "global_step": 416770, "epoch": 2480} {"train_loss": -10.80569839477539, "global_step": 416771, "epoch": 2480} {"train_loss": -9.383783340454102, "global_step": 416772, "epoch": 2480} {"train_loss": -7.293432235717773, "global_step": 416773, "epoch": 2480} {"train_loss": -7.243717670440674, "global_step": 416774, "epoch": 2480} {"train_loss": -10.018067359924316, "global_step": 416775, "epoch": 2480} {"train_loss": -9.859170913696289, "global_step": 416776, "epoch": 2480} {"train_loss": -9.312643051147461, "global_step": 416777, "epoch": 2480} {"train_loss": -10.135095596313477, "global_step": 416778, "epoch": 2480} {"train_loss": -8.753095626831055, "global_step": 416779, "epoch": 2480} {"train_loss": -10.962041854858398, "global_step": 416780, "epoch": 2480} {"train_loss": -8.219074249267578, "global_step": 416781, "epoch": 2480} {"train_loss": -9.260119438171387, "global_step": 416782, "epoch": 2480} {"train_loss": -10.010115623474121, "global_step": 416783, "epoch": 2480} {"train_loss": -9.703540802001953, "global_step": 416784, "epoch": 2480} {"train_loss": -10.124916076660156, "global_step": 416785, "epoch": 2480} {"train_loss": -9.114601135253906, "global_step": 416786, "epoch": 2480} {"train_loss": -10.762751579284668, "global_step": 416787, "epoch": 2480} {"train_loss": -9.911123275756836, "global_step": 416788, "epoch": 2480} {"train_loss": -9.926519393920898, "global_step": 416789, "epoch": 2480} {"train_loss": -8.851949691772461, "global_step": 416790, "epoch": 2480} {"train_loss": -8.750980377197266, "global_step": 416791, "epoch": 2480} {"train_loss": -10.316854476928711, "global_step": 416792, "epoch": 2480} {"train_loss": -9.887632369995117, "global_step": 416793, "epoch": 2480} {"train_loss": -9.97761344909668, "global_step": 416794, "epoch": 2480} {"train_loss": -9.953369140625, "global_step": 416795, "epoch": 2480} {"train_loss": -10.383399963378906, "global_step": 416796, "epoch": 2480} {"train_loss": -10.194459915161133, "global_step": 416797, "epoch": 2480} {"train_loss": -10.48488998413086, "global_step": 416798, "epoch": 2480} {"train_loss": -10.782489776611328, "global_step": 416799, "epoch": 2480} {"train_loss": -11.011515617370605, "global_step": 416800, "epoch": 2480} {"train_loss": -11.047561645507812, "global_step": 416801, "epoch": 2480} {"train_loss": -11.729386329650879, "global_step": 416802, "epoch": 2480} {"train_loss": -11.183061599731445, "global_step": 416803, "epoch": 2480} {"train_loss": -11.193962097167969, "global_step": 416804, "epoch": 2480} {"train_loss": -11.618895530700684, "global_step": 416805, "epoch": 2480} {"train_loss": -11.187894821166992, "global_step": 416806, "epoch": 2480} {"train_loss": -11.845108369986216, "global_step": 416807, "epoch": 2480, "val_loss": 303840.9375, "train_action_mse_error": 0.9800052642822266} {"train_loss": -11.22828483581543, "global_step": 416808, "epoch": 2481} {"train_loss": -12.026666641235352, "global_step": 416809, "epoch": 2481} {"train_loss": -11.914913177490234, "global_step": 416810, "epoch": 2481} {"train_loss": -11.75804328918457, "global_step": 416811, "epoch": 2481} {"train_loss": -11.661478996276855, "global_step": 416812, "epoch": 2481} {"train_loss": -11.799562454223633, "global_step": 416813, "epoch": 2481} {"train_loss": -11.466636657714844, "global_step": 416814, "epoch": 2481} {"train_loss": -12.047062873840332, "global_step": 416815, "epoch": 2481} {"train_loss": -11.334002494812012, "global_step": 416816, "epoch": 2481} {"train_loss": -12.096003532409668, "global_step": 416817, "epoch": 2481} {"train_loss": -11.737581253051758, "global_step": 416818, "epoch": 2481} {"train_loss": -11.804561614990234, "global_step": 416819, "epoch": 2481} {"train_loss": -12.004440307617188, "global_step": 416820, "epoch": 2481} {"train_loss": -12.083335876464844, "global_step": 416821, "epoch": 2481} {"train_loss": -12.055919647216797, "global_step": 416822, "epoch": 2481} {"train_loss": -12.340734481811523, "global_step": 416823, "epoch": 2481} {"train_loss": -11.84973430633545, "global_step": 416824, "epoch": 2481} {"train_loss": -11.737539291381836, "global_step": 416825, "epoch": 2481} {"train_loss": -11.686033248901367, "global_step": 416826, "epoch": 2481} {"train_loss": -11.813102722167969, "global_step": 416827, "epoch": 2481} {"train_loss": -12.088766098022461, "global_step": 416828, "epoch": 2481} {"train_loss": -11.396411895751953, "global_step": 416829, "epoch": 2481} {"train_loss": -12.212991714477539, "global_step": 416830, "epoch": 2481} {"train_loss": -11.649177551269531, "global_step": 416831, "epoch": 2481} {"train_loss": -12.009572982788086, "global_step": 416832, "epoch": 2481} {"train_loss": -11.567085266113281, "global_step": 416833, "epoch": 2481} {"train_loss": -11.986804008483887, "global_step": 416834, "epoch": 2481} {"train_loss": -11.587455749511719, "global_step": 416835, "epoch": 2481} {"train_loss": -12.010064125061035, "global_step": 416836, "epoch": 2481} {"train_loss": -11.471414566040039, "global_step": 416837, "epoch": 2481} {"train_loss": -11.763132095336914, "global_step": 416838, "epoch": 2481} {"train_loss": -11.566686630249023, "global_step": 416839, "epoch": 2481} {"train_loss": -11.862356185913086, "global_step": 416840, "epoch": 2481} {"train_loss": -11.840380668640137, "global_step": 416841, "epoch": 2481} {"train_loss": -11.594331741333008, "global_step": 416842, "epoch": 2481} {"train_loss": -12.252617835998535, "global_step": 416843, "epoch": 2481} {"train_loss": -11.870003700256348, "global_step": 416844, "epoch": 2481} {"train_loss": -12.143796920776367, "global_step": 416845, "epoch": 2481} {"train_loss": -11.800110816955566, "global_step": 416846, "epoch": 2481} {"train_loss": -12.265436172485352, "global_step": 416847, "epoch": 2481} {"train_loss": -12.022902488708496, "global_step": 416848, "epoch": 2481} {"train_loss": -12.201004981994629, "global_step": 416849, "epoch": 2481} {"train_loss": -12.109834671020508, "global_step": 416850, "epoch": 2481} {"train_loss": -12.127213478088379, "global_step": 416851, "epoch": 2481} {"train_loss": -12.106508255004883, "global_step": 416852, "epoch": 2481} {"train_loss": -12.309964179992676, "global_step": 416853, "epoch": 2481} {"train_loss": -12.247379302978516, "global_step": 416854, "epoch": 2481} {"train_loss": -12.316417694091797, "global_step": 416855, "epoch": 2481} {"train_loss": -12.342416763305664, "global_step": 416856, "epoch": 2481} {"train_loss": -12.21464729309082, "global_step": 416857, "epoch": 2481} {"train_loss": -12.108877182006836, "global_step": 416858, "epoch": 2481} {"train_loss": -12.126102447509766, "global_step": 416859, "epoch": 2481} {"train_loss": -12.382037162780762, "global_step": 416860, "epoch": 2481} {"train_loss": -12.36432933807373, "global_step": 416861, "epoch": 2481} {"train_loss": -12.3236722946167, "global_step": 416862, "epoch": 2481} {"train_loss": -12.169692993164062, "global_step": 416863, "epoch": 2481} {"train_loss": -12.359294891357422, "global_step": 416864, "epoch": 2481} {"train_loss": -12.253129005432129, "global_step": 416865, "epoch": 2481} {"train_loss": -12.446266174316406, "global_step": 416866, "epoch": 2481} {"train_loss": -12.21328353881836, "global_step": 416867, "epoch": 2481} {"train_loss": -12.445100784301758, "global_step": 416868, "epoch": 2481} {"train_loss": -12.407414436340332, "global_step": 416869, "epoch": 2481} {"train_loss": -12.337690353393555, "global_step": 416870, "epoch": 2481} {"train_loss": -12.548234939575195, "global_step": 416871, "epoch": 2481} {"train_loss": -12.364985466003418, "global_step": 416872, "epoch": 2481} {"train_loss": -12.461000442504883, "global_step": 416873, "epoch": 2481} {"train_loss": -12.61793327331543, "global_step": 416874, "epoch": 2481} {"train_loss": -12.424816131591797, "global_step": 416875, "epoch": 2481} {"train_loss": -12.451091766357422, "global_step": 416876, "epoch": 2481} {"train_loss": -12.569574356079102, "global_step": 416877, "epoch": 2481} {"train_loss": -12.282977104187012, "global_step": 416878, "epoch": 2481} {"train_loss": -12.505638122558594, "global_step": 416879, "epoch": 2481} {"train_loss": -12.497657775878906, "global_step": 416880, "epoch": 2481} {"train_loss": -12.394269943237305, "global_step": 416881, "epoch": 2481} {"train_loss": -12.627763748168945, "global_step": 416882, "epoch": 2481} {"train_loss": -12.531152725219727, "global_step": 416883, "epoch": 2481} {"train_loss": -12.570756912231445, "global_step": 416884, "epoch": 2481} {"train_loss": -12.358209609985352, "global_step": 416885, "epoch": 2481} {"train_loss": -12.673575401306152, "global_step": 416886, "epoch": 2481} {"train_loss": -12.587224960327148, "global_step": 416887, "epoch": 2481} {"train_loss": -12.593324661254883, "global_step": 416888, "epoch": 2481} {"train_loss": -12.508123397827148, "global_step": 416889, "epoch": 2481} {"train_loss": -12.489033699035645, "global_step": 416890, "epoch": 2481} {"train_loss": -12.456827163696289, "global_step": 416891, "epoch": 2481} {"train_loss": -12.626529693603516, "global_step": 416892, "epoch": 2481} {"train_loss": -12.463037490844727, "global_step": 416893, "epoch": 2481} {"train_loss": -12.856881141662598, "global_step": 416894, "epoch": 2481} {"train_loss": -12.368124008178711, "global_step": 416895, "epoch": 2481} {"train_loss": -12.736080169677734, "global_step": 416896, "epoch": 2481} {"train_loss": -12.632662773132324, "global_step": 416897, "epoch": 2481} {"train_loss": -12.526851654052734, "global_step": 416898, "epoch": 2481} {"train_loss": -12.734275817871094, "global_step": 416899, "epoch": 2481} {"train_loss": -12.562381744384766, "global_step": 416900, "epoch": 2481} {"train_loss": -12.486560821533203, "global_step": 416901, "epoch": 2481} {"train_loss": -12.698237419128418, "global_step": 416902, "epoch": 2481} {"train_loss": -12.4461088180542, "global_step": 416903, "epoch": 2481} {"train_loss": -12.357885360717773, "global_step": 416904, "epoch": 2481} {"train_loss": -12.682831764221191, "global_step": 416905, "epoch": 2481} {"train_loss": -12.489501953125, "global_step": 416906, "epoch": 2481} {"train_loss": -12.275461196899414, "global_step": 416907, "epoch": 2481} {"train_loss": -12.405399322509766, "global_step": 416908, "epoch": 2481} {"train_loss": -12.314023971557617, "global_step": 416909, "epoch": 2481} {"train_loss": -12.008526802062988, "global_step": 416910, "epoch": 2481} {"train_loss": -12.5164155960083, "global_step": 416911, "epoch": 2481} {"train_loss": -12.671500205993652, "global_step": 416912, "epoch": 2481} {"train_loss": -12.342479705810547, "global_step": 416913, "epoch": 2481} {"train_loss": -11.705894470214844, "global_step": 416914, "epoch": 2481} {"train_loss": -12.78627872467041, "global_step": 416915, "epoch": 2481} {"train_loss": -12.527539253234863, "global_step": 416916, "epoch": 2481} {"train_loss": -12.293722152709961, "global_step": 416917, "epoch": 2481} {"train_loss": -11.173463821411133, "global_step": 416918, "epoch": 2481} {"train_loss": -12.646041870117188, "global_step": 416919, "epoch": 2481} {"train_loss": -11.390650749206543, "global_step": 416920, "epoch": 2481} {"train_loss": -12.123117446899414, "global_step": 416921, "epoch": 2481} {"train_loss": -12.420492172241211, "global_step": 416922, "epoch": 2481} {"train_loss": -12.116708755493164, "global_step": 416923, "epoch": 2481} {"train_loss": -11.704080581665039, "global_step": 416924, "epoch": 2481} {"train_loss": -12.531477928161621, "global_step": 416925, "epoch": 2481} {"train_loss": -12.213872909545898, "global_step": 416926, "epoch": 2481} {"train_loss": -12.172666549682617, "global_step": 416927, "epoch": 2481} {"train_loss": -12.380395889282227, "global_step": 416928, "epoch": 2481} {"train_loss": -12.396599769592285, "global_step": 416929, "epoch": 2481} {"train_loss": -12.27859878540039, "global_step": 416930, "epoch": 2481} {"train_loss": -11.97744083404541, "global_step": 416931, "epoch": 2481} {"train_loss": -12.154123306274414, "global_step": 416932, "epoch": 2481} {"train_loss": -12.280637741088867, "global_step": 416933, "epoch": 2481} {"train_loss": -12.708158493041992, "global_step": 416934, "epoch": 2481} {"train_loss": -12.276721954345703, "global_step": 416935, "epoch": 2481} {"train_loss": -12.517095565795898, "global_step": 416936, "epoch": 2481} {"train_loss": -11.753210067749023, "global_step": 416937, "epoch": 2481} {"train_loss": -12.656017303466797, "global_step": 416938, "epoch": 2481} {"train_loss": -12.400177955627441, "global_step": 416939, "epoch": 2481} {"train_loss": -12.548087120056152, "global_step": 416940, "epoch": 2481} {"train_loss": -12.454781532287598, "global_step": 416941, "epoch": 2481} {"train_loss": -11.950550079345703, "global_step": 416942, "epoch": 2481} {"train_loss": -12.306489944458008, "global_step": 416943, "epoch": 2481} {"train_loss": -12.52173900604248, "global_step": 416944, "epoch": 2481} {"train_loss": -11.944137573242188, "global_step": 416945, "epoch": 2481} {"train_loss": -12.29604434967041, "global_step": 416946, "epoch": 2481} {"train_loss": -12.573970794677734, "global_step": 416947, "epoch": 2481} {"train_loss": -12.297121047973633, "global_step": 416948, "epoch": 2481} {"train_loss": -12.244290351867676, "global_step": 416949, "epoch": 2481} {"train_loss": -12.175405502319336, "global_step": 416950, "epoch": 2481} {"train_loss": -12.017914772033691, "global_step": 416951, "epoch": 2481} {"train_loss": -12.100988388061523, "global_step": 416952, "epoch": 2481} {"train_loss": -10.42963981628418, "global_step": 416953, "epoch": 2481} {"train_loss": -12.475324630737305, "global_step": 416954, "epoch": 2481} {"train_loss": -10.136993408203125, "global_step": 416955, "epoch": 2481} {"train_loss": -11.98982048034668, "global_step": 416956, "epoch": 2481} {"train_loss": -10.600544929504395, "global_step": 416957, "epoch": 2481} {"train_loss": -11.623113632202148, "global_step": 416958, "epoch": 2481} {"train_loss": -10.879093170166016, "global_step": 416959, "epoch": 2481} {"train_loss": -10.089031219482422, "global_step": 416960, "epoch": 2481} {"train_loss": -11.20814323425293, "global_step": 416961, "epoch": 2481} {"train_loss": -10.709968566894531, "global_step": 416962, "epoch": 2481} {"train_loss": -10.295709609985352, "global_step": 416963, "epoch": 2481} {"train_loss": -10.59415340423584, "global_step": 416964, "epoch": 2481} {"train_loss": -11.463111877441406, "global_step": 416965, "epoch": 2481} {"train_loss": -11.51192855834961, "global_step": 416966, "epoch": 2481} {"train_loss": -11.619461059570312, "global_step": 416967, "epoch": 2481} {"train_loss": -11.345815658569336, "global_step": 416968, "epoch": 2481} {"train_loss": -10.947826385498047, "global_step": 416969, "epoch": 2481} {"train_loss": -11.200769424438477, "global_step": 416970, "epoch": 2481} {"train_loss": -11.605728149414062, "global_step": 416971, "epoch": 2481} {"train_loss": -11.841404914855957, "global_step": 416972, "epoch": 2481} {"train_loss": -11.196535110473633, "global_step": 416973, "epoch": 2481} {"train_loss": -12.185623168945312, "global_step": 416974, "epoch": 2481} {"train_loss": -12.070892192068554, "global_step": 416975, "epoch": 2481, "val_loss": 304263.4375} {"train_loss": -11.643167495727539, "global_step": 416976, "epoch": 2482} {"train_loss": -11.198758125305176, "global_step": 416977, "epoch": 2482} {"train_loss": -11.790468215942383, "global_step": 416978, "epoch": 2482} {"train_loss": -11.536601066589355, "global_step": 416979, "epoch": 2482} {"train_loss": -10.817968368530273, "global_step": 416980, "epoch": 2482} {"train_loss": -12.24157428741455, "global_step": 416981, "epoch": 2482} {"train_loss": -10.879876136779785, "global_step": 416982, "epoch": 2482} {"train_loss": -11.605561256408691, "global_step": 416983, "epoch": 2482} {"train_loss": -11.755826950073242, "global_step": 416984, "epoch": 2482} {"train_loss": -11.285087585449219, "global_step": 416985, "epoch": 2482} {"train_loss": -11.960107803344727, "global_step": 416986, "epoch": 2482} {"train_loss": -11.233174324035645, "global_step": 416987, "epoch": 2482} {"train_loss": -12.233278274536133, "global_step": 416988, "epoch": 2482} {"train_loss": -11.24073314666748, "global_step": 416989, "epoch": 2482} {"train_loss": -11.948366165161133, "global_step": 416990, "epoch": 2482} {"train_loss": -11.644881248474121, "global_step": 416991, "epoch": 2482} {"train_loss": -11.967447280883789, "global_step": 416992, "epoch": 2482} {"train_loss": -11.925341606140137, "global_step": 416993, "epoch": 2482} {"train_loss": -11.936345100402832, "global_step": 416994, "epoch": 2482} {"train_loss": -11.927574157714844, "global_step": 416995, "epoch": 2482} {"train_loss": -11.900772094726562, "global_step": 416996, "epoch": 2482} {"train_loss": -12.1246919631958, "global_step": 416997, "epoch": 2482} {"train_loss": -11.922391891479492, "global_step": 416998, "epoch": 2482} {"train_loss": -12.277740478515625, "global_step": 416999, "epoch": 2482} {"train_loss": -11.531021118164062, "global_step": 417000, "epoch": 2482} {"train_loss": -12.252549171447754, "global_step": 417001, "epoch": 2482} {"train_loss": -11.42596435546875, "global_step": 417002, "epoch": 2482} {"train_loss": -12.180559158325195, "global_step": 417003, "epoch": 2482} {"train_loss": -11.933850288391113, "global_step": 417004, "epoch": 2482} {"train_loss": -11.751214027404785, "global_step": 417005, "epoch": 2482} {"train_loss": -11.762145042419434, "global_step": 417006, "epoch": 2482} {"train_loss": -11.629201889038086, "global_step": 417007, "epoch": 2482} {"train_loss": -12.15764045715332, "global_step": 417008, "epoch": 2482} {"train_loss": -11.852312088012695, "global_step": 417009, "epoch": 2482} {"train_loss": -12.347707748413086, "global_step": 417010, "epoch": 2482} {"train_loss": -12.048927307128906, "global_step": 417011, "epoch": 2482} {"train_loss": -12.123416900634766, "global_step": 417012, "epoch": 2482} {"train_loss": -11.460854530334473, "global_step": 417013, "epoch": 2482} {"train_loss": -12.173720359802246, "global_step": 417014, "epoch": 2482} {"train_loss": -12.252334594726562, "global_step": 417015, "epoch": 2482} {"train_loss": -11.840181350708008, "global_step": 417016, "epoch": 2482} {"train_loss": -12.236672401428223, "global_step": 417017, "epoch": 2482} {"train_loss": -12.027170181274414, "global_step": 417018, "epoch": 2482} {"train_loss": -12.314441680908203, "global_step": 417019, "epoch": 2482} {"train_loss": -11.981472969055176, "global_step": 417020, "epoch": 2482} {"train_loss": -12.230167388916016, "global_step": 417021, "epoch": 2482} {"train_loss": -11.803482055664062, "global_step": 417022, "epoch": 2482} {"train_loss": -12.188987731933594, "global_step": 417023, "epoch": 2482} {"train_loss": -12.156932830810547, "global_step": 417024, "epoch": 2482} {"train_loss": -12.088388442993164, "global_step": 417025, "epoch": 2482} {"train_loss": -12.10354232788086, "global_step": 417026, "epoch": 2482} {"train_loss": -12.212356567382812, "global_step": 417027, "epoch": 2482} {"train_loss": -12.050762176513672, "global_step": 417028, "epoch": 2482} {"train_loss": -11.759698867797852, "global_step": 417029, "epoch": 2482} {"train_loss": -12.389927864074707, "global_step": 417030, "epoch": 2482} {"train_loss": -11.980215072631836, "global_step": 417031, "epoch": 2482} {"train_loss": -11.815723419189453, "global_step": 417032, "epoch": 2482} {"train_loss": -12.36271858215332, "global_step": 417033, "epoch": 2482} {"train_loss": -10.9093017578125, "global_step": 417034, "epoch": 2482} {"train_loss": -12.159147262573242, "global_step": 417035, "epoch": 2482} {"train_loss": -11.95337200164795, "global_step": 417036, "epoch": 2482} {"train_loss": -12.098724365234375, "global_step": 417037, "epoch": 2482} {"train_loss": -12.124652862548828, "global_step": 417038, "epoch": 2482} {"train_loss": -12.051977157592773, "global_step": 417039, "epoch": 2482} {"train_loss": -12.231298446655273, "global_step": 417040, "epoch": 2482} {"train_loss": -12.274782180786133, "global_step": 417041, "epoch": 2482} {"train_loss": -12.064584732055664, "global_step": 417042, "epoch": 2482} {"train_loss": -12.070135116577148, "global_step": 417043, "epoch": 2482} {"train_loss": -12.582071304321289, "global_step": 417044, "epoch": 2482} {"train_loss": -12.290046691894531, "global_step": 417045, "epoch": 2482} {"train_loss": -12.459465026855469, "global_step": 417046, "epoch": 2482} {"train_loss": -12.442811965942383, "global_step": 417047, "epoch": 2482} {"train_loss": -12.631888389587402, "global_step": 417048, "epoch": 2482} {"train_loss": -12.282495498657227, "global_step": 417049, "epoch": 2482} {"train_loss": -12.484745025634766, "global_step": 417050, "epoch": 2482} {"train_loss": -12.591767311096191, "global_step": 417051, "epoch": 2482} {"train_loss": -12.614892959594727, "global_step": 417052, "epoch": 2482} {"train_loss": -12.46601676940918, "global_step": 417053, "epoch": 2482} {"train_loss": -12.623371124267578, "global_step": 417054, "epoch": 2482} {"train_loss": -12.52098274230957, "global_step": 417055, "epoch": 2482} {"train_loss": -12.336883544921875, "global_step": 417056, "epoch": 2482} {"train_loss": -12.371578216552734, "global_step": 417057, "epoch": 2482} {"train_loss": -12.626119613647461, "global_step": 417058, "epoch": 2482} {"train_loss": -12.595935821533203, "global_step": 417059, "epoch": 2482} {"train_loss": -12.263931274414062, "global_step": 417060, "epoch": 2482} {"train_loss": -12.502517700195312, "global_step": 417061, "epoch": 2482} {"train_loss": -12.88575267791748, "global_step": 417062, "epoch": 2482} {"train_loss": -12.337196350097656, "global_step": 417063, "epoch": 2482} {"train_loss": -12.611332893371582, "global_step": 417064, "epoch": 2482} {"train_loss": -12.441370010375977, "global_step": 417065, "epoch": 2482} {"train_loss": -12.683349609375, "global_step": 417066, "epoch": 2482} {"train_loss": -12.499876022338867, "global_step": 417067, "epoch": 2482} {"train_loss": -12.72386646270752, "global_step": 417068, "epoch": 2482} {"train_loss": -12.644754409790039, "global_step": 417069, "epoch": 2482} {"train_loss": -12.481775283813477, "global_step": 417070, "epoch": 2482} {"train_loss": -12.393385887145996, "global_step": 417071, "epoch": 2482} {"train_loss": -12.732879638671875, "global_step": 417072, "epoch": 2482} {"train_loss": -12.472875595092773, "global_step": 417073, "epoch": 2482} {"train_loss": -12.785475730895996, "global_step": 417074, "epoch": 2482} {"train_loss": -12.57223892211914, "global_step": 417075, "epoch": 2482} {"train_loss": -12.350696563720703, "global_step": 417076, "epoch": 2482} {"train_loss": -12.396957397460938, "global_step": 417077, "epoch": 2482} {"train_loss": -12.508774757385254, "global_step": 417078, "epoch": 2482} {"train_loss": -12.606627464294434, "global_step": 417079, "epoch": 2482} {"train_loss": -12.655967712402344, "global_step": 417080, "epoch": 2482} {"train_loss": -12.410480499267578, "global_step": 417081, "epoch": 2482} {"train_loss": -12.618751525878906, "global_step": 417082, "epoch": 2482} {"train_loss": -11.954488754272461, "global_step": 417083, "epoch": 2482} {"train_loss": -12.251710891723633, "global_step": 417084, "epoch": 2482} {"train_loss": -12.437570571899414, "global_step": 417085, "epoch": 2482} {"train_loss": -12.390761375427246, "global_step": 417086, "epoch": 2482} {"train_loss": -12.187887191772461, "global_step": 417087, "epoch": 2482} {"train_loss": -12.420823097229004, "global_step": 417088, "epoch": 2482} {"train_loss": -12.506464004516602, "global_step": 417089, "epoch": 2482} {"train_loss": -12.296085357666016, "global_step": 417090, "epoch": 2482} {"train_loss": -12.284421920776367, "global_step": 417091, "epoch": 2482} {"train_loss": -12.203246116638184, "global_step": 417092, "epoch": 2482} {"train_loss": -12.602487564086914, "global_step": 417093, "epoch": 2482} {"train_loss": -12.541089057922363, "global_step": 417094, "epoch": 2482} {"train_loss": -11.652144432067871, "global_step": 417095, "epoch": 2482} {"train_loss": -11.969459533691406, "global_step": 417096, "epoch": 2482} {"train_loss": -12.614927291870117, "global_step": 417097, "epoch": 2482} {"train_loss": -12.126269340515137, "global_step": 417098, "epoch": 2482} {"train_loss": -12.277946472167969, "global_step": 417099, "epoch": 2482} {"train_loss": -12.172021865844727, "global_step": 417100, "epoch": 2482} {"train_loss": -11.92245864868164, "global_step": 417101, "epoch": 2482} {"train_loss": -10.929080963134766, "global_step": 417102, "epoch": 2482} {"train_loss": -12.022767066955566, "global_step": 417103, "epoch": 2482} {"train_loss": -12.525896072387695, "global_step": 417104, "epoch": 2482} {"train_loss": -10.43181324005127, "global_step": 417105, "epoch": 2482} {"train_loss": -11.810855865478516, "global_step": 417106, "epoch": 2482} {"train_loss": -11.74317741394043, "global_step": 417107, "epoch": 2482} {"train_loss": -9.541343688964844, "global_step": 417108, "epoch": 2482} {"train_loss": -11.913612365722656, "global_step": 417109, "epoch": 2482} {"train_loss": -10.26164436340332, "global_step": 417110, "epoch": 2482} {"train_loss": -10.31356430053711, "global_step": 417111, "epoch": 2482} {"train_loss": -10.413299560546875, "global_step": 417112, "epoch": 2482} {"train_loss": -10.760796546936035, "global_step": 417113, "epoch": 2482} {"train_loss": -11.085487365722656, "global_step": 417114, "epoch": 2482} {"train_loss": -10.52017593383789, "global_step": 417115, "epoch": 2482} {"train_loss": -11.668889999389648, "global_step": 417116, "epoch": 2482} {"train_loss": -10.509967803955078, "global_step": 417117, "epoch": 2482} {"train_loss": -11.808798789978027, "global_step": 417118, "epoch": 2482} {"train_loss": -9.501222610473633, "global_step": 417119, "epoch": 2482} {"train_loss": -10.306968688964844, "global_step": 417120, "epoch": 2482} {"train_loss": -11.206742286682129, "global_step": 417121, "epoch": 2482} {"train_loss": -10.865875244140625, "global_step": 417122, "epoch": 2482} {"train_loss": -11.234954833984375, "global_step": 417123, "epoch": 2482} {"train_loss": -11.42318058013916, "global_step": 417124, "epoch": 2482} {"train_loss": -11.199514389038086, "global_step": 417125, "epoch": 2482} {"train_loss": -11.598336219787598, "global_step": 417126, "epoch": 2482} {"train_loss": -11.574236869812012, "global_step": 417127, "epoch": 2482} {"train_loss": -12.205438613891602, "global_step": 417128, "epoch": 2482} {"train_loss": -11.492709159851074, "global_step": 417129, "epoch": 2482} {"train_loss": -11.863840103149414, "global_step": 417130, "epoch": 2482} {"train_loss": -11.83933162689209, "global_step": 417131, "epoch": 2482} {"train_loss": -12.135181427001953, "global_step": 417132, "epoch": 2482} {"train_loss": -12.319391250610352, "global_step": 417133, "epoch": 2482} {"train_loss": -11.73434066772461, "global_step": 417134, "epoch": 2482} {"train_loss": -11.903833389282227, "global_step": 417135, "epoch": 2482} {"train_loss": -11.899171829223633, "global_step": 417136, "epoch": 2482} {"train_loss": -12.046741485595703, "global_step": 417137, "epoch": 2482} {"train_loss": -11.932110786437988, "global_step": 417138, "epoch": 2482} {"train_loss": -12.411123275756836, "global_step": 417139, "epoch": 2482} {"train_loss": -12.16197681427002, "global_step": 417140, "epoch": 2482} {"train_loss": -12.043684005737305, "global_step": 417141, "epoch": 2482} {"train_loss": -11.976598739624023, "global_step": 417142, "epoch": 2482} {"train_loss": -11.964032945178804, "global_step": 417143, "epoch": 2482, "val_loss": 308840.375} {"train_loss": -12.206575393676758, "global_step": 417144, "epoch": 2483} {"train_loss": -12.447195053100586, "global_step": 417145, "epoch": 2483} {"train_loss": -12.409759521484375, "global_step": 417146, "epoch": 2483} {"train_loss": -12.348892211914062, "global_step": 417147, "epoch": 2483} {"train_loss": -12.234280586242676, "global_step": 417148, "epoch": 2483} {"train_loss": -11.950599670410156, "global_step": 417149, "epoch": 2483} {"train_loss": -12.51770305633545, "global_step": 417150, "epoch": 2483} {"train_loss": -12.231565475463867, "global_step": 417151, "epoch": 2483} {"train_loss": -12.19105339050293, "global_step": 417152, "epoch": 2483} {"train_loss": -12.463216781616211, "global_step": 417153, "epoch": 2483} {"train_loss": -12.123802185058594, "global_step": 417154, "epoch": 2483} {"train_loss": -12.545404434204102, "global_step": 417155, "epoch": 2483} {"train_loss": -12.19272232055664, "global_step": 417156, "epoch": 2483} {"train_loss": -12.18234634399414, "global_step": 417157, "epoch": 2483} {"train_loss": -11.726388931274414, "global_step": 417158, "epoch": 2483} {"train_loss": -11.560976028442383, "global_step": 417159, "epoch": 2483} {"train_loss": -12.639915466308594, "global_step": 417160, "epoch": 2483} {"train_loss": -11.851232528686523, "global_step": 417161, "epoch": 2483} {"train_loss": -12.493424415588379, "global_step": 417162, "epoch": 2483} {"train_loss": -11.787245750427246, "global_step": 417163, "epoch": 2483} {"train_loss": -11.95798397064209, "global_step": 417164, "epoch": 2483} {"train_loss": -12.041316986083984, "global_step": 417165, "epoch": 2483} {"train_loss": -12.215174674987793, "global_step": 417166, "epoch": 2483} {"train_loss": -12.310550689697266, "global_step": 417167, "epoch": 2483} {"train_loss": -12.156007766723633, "global_step": 417168, "epoch": 2483} {"train_loss": -12.266363143920898, "global_step": 417169, "epoch": 2483} {"train_loss": -12.062923431396484, "global_step": 417170, "epoch": 2483} {"train_loss": -11.987785339355469, "global_step": 417171, "epoch": 2483} {"train_loss": -11.724557876586914, "global_step": 417172, "epoch": 2483} {"train_loss": -12.097661018371582, "global_step": 417173, "epoch": 2483} {"train_loss": -12.161689758300781, "global_step": 417174, "epoch": 2483} {"train_loss": -12.065354347229004, "global_step": 417175, "epoch": 2483} {"train_loss": -12.034414291381836, "global_step": 417176, "epoch": 2483} {"train_loss": -11.534496307373047, "global_step": 417177, "epoch": 2483} {"train_loss": -11.57084846496582, "global_step": 417178, "epoch": 2483} {"train_loss": -12.21240520477295, "global_step": 417179, "epoch": 2483} {"train_loss": -11.913464546203613, "global_step": 417180, "epoch": 2483} {"train_loss": -12.064605712890625, "global_step": 417181, "epoch": 2483} {"train_loss": -11.580862045288086, "global_step": 417182, "epoch": 2483} {"train_loss": -11.914193153381348, "global_step": 417183, "epoch": 2483} {"train_loss": -11.113941192626953, "global_step": 417184, "epoch": 2483} {"train_loss": -12.086132049560547, "global_step": 417185, "epoch": 2483} {"train_loss": -11.93411636352539, "global_step": 417186, "epoch": 2483} {"train_loss": -11.781036376953125, "global_step": 417187, "epoch": 2483} {"train_loss": -11.859016418457031, "global_step": 417188, "epoch": 2483} {"train_loss": -12.111212730407715, "global_step": 417189, "epoch": 2483} {"train_loss": -12.322710990905762, "global_step": 417190, "epoch": 2483} {"train_loss": -12.097774505615234, "global_step": 417191, "epoch": 2483} {"train_loss": -11.731189727783203, "global_step": 417192, "epoch": 2483} {"train_loss": -11.524421691894531, "global_step": 417193, "epoch": 2483} {"train_loss": -12.013443946838379, "global_step": 417194, "epoch": 2483} {"train_loss": -11.828367233276367, "global_step": 417195, "epoch": 2483} {"train_loss": -11.798749923706055, "global_step": 417196, "epoch": 2483} {"train_loss": -12.108236312866211, "global_step": 417197, "epoch": 2483} {"train_loss": -11.936175346374512, "global_step": 417198, "epoch": 2483} {"train_loss": -12.470261573791504, "global_step": 417199, "epoch": 2483} {"train_loss": -12.295611381530762, "global_step": 417200, "epoch": 2483} {"train_loss": -12.296401023864746, "global_step": 417201, "epoch": 2483} {"train_loss": -12.214409828186035, "global_step": 417202, "epoch": 2483} {"train_loss": -12.518367767333984, "global_step": 417203, "epoch": 2483} {"train_loss": -12.306883811950684, "global_step": 417204, "epoch": 2483} {"train_loss": -12.710908889770508, "global_step": 417205, "epoch": 2483} {"train_loss": -12.530254364013672, "global_step": 417206, "epoch": 2483} {"train_loss": -12.486912727355957, "global_step": 417207, "epoch": 2483} {"train_loss": -12.450482368469238, "global_step": 417208, "epoch": 2483} {"train_loss": -12.413321495056152, "global_step": 417209, "epoch": 2483} {"train_loss": -12.59328556060791, "global_step": 417210, "epoch": 2483} {"train_loss": -12.001991271972656, "global_step": 417211, "epoch": 2483} {"train_loss": -12.456155776977539, "global_step": 417212, "epoch": 2483} {"train_loss": -12.200752258300781, "global_step": 417213, "epoch": 2483} {"train_loss": -12.253459930419922, "global_step": 417214, "epoch": 2483} {"train_loss": -12.583929061889648, "global_step": 417215, "epoch": 2483} {"train_loss": -12.155828475952148, "global_step": 417216, "epoch": 2483} {"train_loss": -12.503437995910645, "global_step": 417217, "epoch": 2483} {"train_loss": -12.269920349121094, "global_step": 417218, "epoch": 2483} {"train_loss": -12.254182815551758, "global_step": 417219, "epoch": 2483} {"train_loss": -12.501580238342285, "global_step": 417220, "epoch": 2483} {"train_loss": -12.338029861450195, "global_step": 417221, "epoch": 2483} {"train_loss": -12.538326263427734, "global_step": 417222, "epoch": 2483} {"train_loss": -12.392800331115723, "global_step": 417223, "epoch": 2483} {"train_loss": -11.98337459564209, "global_step": 417224, "epoch": 2483} {"train_loss": -12.385272979736328, "global_step": 417225, "epoch": 2483} {"train_loss": -11.877998352050781, "global_step": 417226, "epoch": 2483} {"train_loss": -12.157405853271484, "global_step": 417227, "epoch": 2483} {"train_loss": -12.38090705871582, "global_step": 417228, "epoch": 2483} {"train_loss": -12.33206558227539, "global_step": 417229, "epoch": 2483} {"train_loss": -12.609573364257812, "global_step": 417230, "epoch": 2483} {"train_loss": -12.695646286010742, "global_step": 417231, "epoch": 2483} {"train_loss": -12.154999732971191, "global_step": 417232, "epoch": 2483} {"train_loss": -12.599258422851562, "global_step": 417233, "epoch": 2483} {"train_loss": -12.402556419372559, "global_step": 417234, "epoch": 2483} {"train_loss": -12.617013931274414, "global_step": 417235, "epoch": 2483} {"train_loss": -12.498695373535156, "global_step": 417236, "epoch": 2483} {"train_loss": -11.99620246887207, "global_step": 417237, "epoch": 2483} {"train_loss": -12.248323440551758, "global_step": 417238, "epoch": 2483} {"train_loss": -12.224477767944336, "global_step": 417239, "epoch": 2483} {"train_loss": -12.482717514038086, "global_step": 417240, "epoch": 2483} {"train_loss": -12.18342113494873, "global_step": 417241, "epoch": 2483} {"train_loss": -12.119807243347168, "global_step": 417242, "epoch": 2483} {"train_loss": -11.900491714477539, "global_step": 417243, "epoch": 2483} {"train_loss": -11.894366264343262, "global_step": 417244, "epoch": 2483} {"train_loss": -12.437437057495117, "global_step": 417245, "epoch": 2483} {"train_loss": -12.325485229492188, "global_step": 417246, "epoch": 2483} {"train_loss": -12.262456893920898, "global_step": 417247, "epoch": 2483} {"train_loss": -12.260507583618164, "global_step": 417248, "epoch": 2483} {"train_loss": -12.75874137878418, "global_step": 417249, "epoch": 2483} {"train_loss": -12.050029754638672, "global_step": 417250, "epoch": 2483} {"train_loss": -12.648871421813965, "global_step": 417251, "epoch": 2483} {"train_loss": -12.233610153198242, "global_step": 417252, "epoch": 2483} {"train_loss": -12.587635040283203, "global_step": 417253, "epoch": 2483} {"train_loss": -12.054931640625, "global_step": 417254, "epoch": 2483} {"train_loss": -12.641530990600586, "global_step": 417255, "epoch": 2483} {"train_loss": -12.128850936889648, "global_step": 417256, "epoch": 2483} {"train_loss": -12.64431095123291, "global_step": 417257, "epoch": 2483} {"train_loss": -12.186128616333008, "global_step": 417258, "epoch": 2483} {"train_loss": -11.916351318359375, "global_step": 417259, "epoch": 2483} {"train_loss": -12.231514930725098, "global_step": 417260, "epoch": 2483} {"train_loss": -12.310649871826172, "global_step": 417261, "epoch": 2483} {"train_loss": -12.273467063903809, "global_step": 417262, "epoch": 2483} {"train_loss": -12.38142204284668, "global_step": 417263, "epoch": 2483} {"train_loss": -12.378053665161133, "global_step": 417264, "epoch": 2483} {"train_loss": -12.762556076049805, "global_step": 417265, "epoch": 2483} {"train_loss": -12.562492370605469, "global_step": 417266, "epoch": 2483} {"train_loss": -12.684235572814941, "global_step": 417267, "epoch": 2483} {"train_loss": -12.589004516601562, "global_step": 417268, "epoch": 2483} {"train_loss": -12.696710586547852, "global_step": 417269, "epoch": 2483} {"train_loss": -12.579007148742676, "global_step": 417270, "epoch": 2483} {"train_loss": -12.584697723388672, "global_step": 417271, "epoch": 2483} {"train_loss": -12.617997169494629, "global_step": 417272, "epoch": 2483} {"train_loss": -12.305452346801758, "global_step": 417273, "epoch": 2483} {"train_loss": -12.547009468078613, "global_step": 417274, "epoch": 2483} {"train_loss": -12.684215545654297, "global_step": 417275, "epoch": 2483} {"train_loss": -12.54069709777832, "global_step": 417276, "epoch": 2483} {"train_loss": -12.413106918334961, "global_step": 417277, "epoch": 2483} {"train_loss": -12.450212478637695, "global_step": 417278, "epoch": 2483} {"train_loss": -12.521549224853516, "global_step": 417279, "epoch": 2483} {"train_loss": -12.57736587524414, "global_step": 417280, "epoch": 2483} {"train_loss": -12.277830123901367, "global_step": 417281, "epoch": 2483} {"train_loss": -12.746349334716797, "global_step": 417282, "epoch": 2483} {"train_loss": -12.814661026000977, "global_step": 417283, "epoch": 2483} {"train_loss": -12.742691040039062, "global_step": 417284, "epoch": 2483} {"train_loss": -12.667119979858398, "global_step": 417285, "epoch": 2483} {"train_loss": -12.51734733581543, "global_step": 417286, "epoch": 2483} {"train_loss": -12.78022575378418, "global_step": 417287, "epoch": 2483} {"train_loss": -12.711084365844727, "global_step": 417288, "epoch": 2483} {"train_loss": -12.814383506774902, "global_step": 417289, "epoch": 2483} {"train_loss": -12.756572723388672, "global_step": 417290, "epoch": 2483} {"train_loss": -12.616690635681152, "global_step": 417291, "epoch": 2483} {"train_loss": -12.564229965209961, "global_step": 417292, "epoch": 2483} {"train_loss": -12.682204246520996, "global_step": 417293, "epoch": 2483} {"train_loss": -12.468992233276367, "global_step": 417294, "epoch": 2483} {"train_loss": -12.538129806518555, "global_step": 417295, "epoch": 2483} {"train_loss": -12.48094367980957, "global_step": 417296, "epoch": 2483} {"train_loss": -11.603191375732422, "global_step": 417297, "epoch": 2483} {"train_loss": -12.30561637878418, "global_step": 417298, "epoch": 2483} {"train_loss": -12.537352561950684, "global_step": 417299, "epoch": 2483} {"train_loss": -11.617847442626953, "global_step": 417300, "epoch": 2483} {"train_loss": -11.076725006103516, "global_step": 417301, "epoch": 2483} {"train_loss": -12.550987243652344, "global_step": 417302, "epoch": 2483} {"train_loss": -11.698751449584961, "global_step": 417303, "epoch": 2483} {"train_loss": -11.218389511108398, "global_step": 417304, "epoch": 2483} {"train_loss": -11.28718090057373, "global_step": 417305, "epoch": 2483} {"train_loss": -12.021750450134277, "global_step": 417306, "epoch": 2483} {"train_loss": -10.990839004516602, "global_step": 417307, "epoch": 2483} {"train_loss": -11.82264518737793, "global_step": 417308, "epoch": 2483} {"train_loss": -11.945749282836914, "global_step": 417309, "epoch": 2483} {"train_loss": -10.893255233764648, "global_step": 417310, "epoch": 2483} {"train_loss": -12.229032868430728, "global_step": 417311, "epoch": 2483, "val_loss": 306951.09375} {"train_loss": -11.366724014282227, "global_step": 417312, "epoch": 2484} {"train_loss": -11.924524307250977, "global_step": 417313, "epoch": 2484} {"train_loss": -12.44081974029541, "global_step": 417314, "epoch": 2484} {"train_loss": -12.406637191772461, "global_step": 417315, "epoch": 2484} {"train_loss": -11.60828971862793, "global_step": 417316, "epoch": 2484} {"train_loss": -11.78700065612793, "global_step": 417317, "epoch": 2484} {"train_loss": -11.93009090423584, "global_step": 417318, "epoch": 2484} {"train_loss": -11.636475563049316, "global_step": 417319, "epoch": 2484} {"train_loss": -11.875356674194336, "global_step": 417320, "epoch": 2484} {"train_loss": -10.777566909790039, "global_step": 417321, "epoch": 2484} {"train_loss": -11.803276062011719, "global_step": 417322, "epoch": 2484} {"train_loss": -11.134796142578125, "global_step": 417323, "epoch": 2484} {"train_loss": -11.395020484924316, "global_step": 417324, "epoch": 2484} {"train_loss": -12.010000228881836, "global_step": 417325, "epoch": 2484} {"train_loss": -11.666747093200684, "global_step": 417326, "epoch": 2484} {"train_loss": -12.222618103027344, "global_step": 417327, "epoch": 2484} {"train_loss": -12.395288467407227, "global_step": 417328, "epoch": 2484} {"train_loss": -11.679746627807617, "global_step": 417329, "epoch": 2484} {"train_loss": -11.874855041503906, "global_step": 417330, "epoch": 2484} {"train_loss": -11.477367401123047, "global_step": 417331, "epoch": 2484} {"train_loss": -12.349206924438477, "global_step": 417332, "epoch": 2484} {"train_loss": -12.098024368286133, "global_step": 417333, "epoch": 2484} {"train_loss": -12.243067741394043, "global_step": 417334, "epoch": 2484} {"train_loss": -11.462016105651855, "global_step": 417335, "epoch": 2484} {"train_loss": -12.015874862670898, "global_step": 417336, "epoch": 2484} {"train_loss": -11.667488098144531, "global_step": 417337, "epoch": 2484} {"train_loss": -12.436567306518555, "global_step": 417338, "epoch": 2484} {"train_loss": -11.5035982131958, "global_step": 417339, "epoch": 2484} {"train_loss": -12.19234848022461, "global_step": 417340, "epoch": 2484} {"train_loss": -11.740385055541992, "global_step": 417341, "epoch": 2484} {"train_loss": -12.605302810668945, "global_step": 417342, "epoch": 2484} {"train_loss": -12.108688354492188, "global_step": 417343, "epoch": 2484} {"train_loss": -12.219579696655273, "global_step": 417344, "epoch": 2484} {"train_loss": -11.806461334228516, "global_step": 417345, "epoch": 2484} {"train_loss": -12.441923141479492, "global_step": 417346, "epoch": 2484} {"train_loss": -12.265731811523438, "global_step": 417347, "epoch": 2484} {"train_loss": -12.4647216796875, "global_step": 417348, "epoch": 2484} {"train_loss": -12.235466003417969, "global_step": 417349, "epoch": 2484} {"train_loss": -12.46785831451416, "global_step": 417350, "epoch": 2484} {"train_loss": -12.622332572937012, "global_step": 417351, "epoch": 2484} {"train_loss": -12.218515396118164, "global_step": 417352, "epoch": 2484} {"train_loss": -12.408280372619629, "global_step": 417353, "epoch": 2484} {"train_loss": -12.505011558532715, "global_step": 417354, "epoch": 2484} {"train_loss": -12.426443099975586, "global_step": 417355, "epoch": 2484} {"train_loss": -12.357754707336426, "global_step": 417356, "epoch": 2484} {"train_loss": -12.547903060913086, "global_step": 417357, "epoch": 2484} {"train_loss": -12.519367218017578, "global_step": 417358, "epoch": 2484} {"train_loss": -12.345501899719238, "global_step": 417359, "epoch": 2484} {"train_loss": -12.401360511779785, "global_step": 417360, "epoch": 2484} {"train_loss": -12.439901351928711, "global_step": 417361, "epoch": 2484} {"train_loss": -12.348260879516602, "global_step": 417362, "epoch": 2484} {"train_loss": -12.220438003540039, "global_step": 417363, "epoch": 2484} {"train_loss": -12.345369338989258, "global_step": 417364, "epoch": 2484} {"train_loss": -12.296932220458984, "global_step": 417365, "epoch": 2484} {"train_loss": -12.161693572998047, "global_step": 417366, "epoch": 2484} {"train_loss": -12.612213134765625, "global_step": 417367, "epoch": 2484} {"train_loss": -12.368704795837402, "global_step": 417368, "epoch": 2484} {"train_loss": -12.119003295898438, "global_step": 417369, "epoch": 2484} {"train_loss": -12.054924011230469, "global_step": 417370, "epoch": 2484} {"train_loss": -11.989076614379883, "global_step": 417371, "epoch": 2484} {"train_loss": -10.408927917480469, "global_step": 417372, "epoch": 2484} {"train_loss": -11.61496639251709, "global_step": 417373, "epoch": 2484} {"train_loss": -9.81259822845459, "global_step": 417374, "epoch": 2484} {"train_loss": -11.021331787109375, "global_step": 417375, "epoch": 2484} {"train_loss": -10.0714111328125, "global_step": 417376, "epoch": 2484} {"train_loss": -12.719475746154785, "global_step": 417377, "epoch": 2484} {"train_loss": -11.034454345703125, "global_step": 417378, "epoch": 2484} {"train_loss": -11.707574844360352, "global_step": 417379, "epoch": 2484} {"train_loss": -12.07094955444336, "global_step": 417380, "epoch": 2484} {"train_loss": -11.07186508178711, "global_step": 417381, "epoch": 2484} {"train_loss": -12.639081954956055, "global_step": 417382, "epoch": 2484} {"train_loss": -11.563262939453125, "global_step": 417383, "epoch": 2484} {"train_loss": -12.234804153442383, "global_step": 417384, "epoch": 2484} {"train_loss": -11.391151428222656, "global_step": 417385, "epoch": 2484} {"train_loss": -12.424747467041016, "global_step": 417386, "epoch": 2484} {"train_loss": -11.580911636352539, "global_step": 417387, "epoch": 2484} {"train_loss": -12.265801429748535, "global_step": 417388, "epoch": 2484} {"train_loss": -11.94507122039795, "global_step": 417389, "epoch": 2484} {"train_loss": -12.105683326721191, "global_step": 417390, "epoch": 2484} {"train_loss": -11.99093246459961, "global_step": 417391, "epoch": 2484} {"train_loss": -11.816688537597656, "global_step": 417392, "epoch": 2484} {"train_loss": -12.235580444335938, "global_step": 417393, "epoch": 2484} {"train_loss": -12.14529800415039, "global_step": 417394, "epoch": 2484} {"train_loss": -11.775872230529785, "global_step": 417395, "epoch": 2484} {"train_loss": -12.319704055786133, "global_step": 417396, "epoch": 2484} {"train_loss": -11.77455997467041, "global_step": 417397, "epoch": 2484} {"train_loss": -12.063521385192871, "global_step": 417398, "epoch": 2484} {"train_loss": -12.305289268493652, "global_step": 417399, "epoch": 2484} {"train_loss": -11.78506851196289, "global_step": 417400, "epoch": 2484} {"train_loss": -12.394001007080078, "global_step": 417401, "epoch": 2484} {"train_loss": -11.520158767700195, "global_step": 417402, "epoch": 2484} {"train_loss": -12.023683547973633, "global_step": 417403, "epoch": 2484} {"train_loss": -12.318571090698242, "global_step": 417404, "epoch": 2484} {"train_loss": -12.234057426452637, "global_step": 417405, "epoch": 2484} {"train_loss": -12.364668846130371, "global_step": 417406, "epoch": 2484} {"train_loss": -12.214824676513672, "global_step": 417407, "epoch": 2484} {"train_loss": -11.795278549194336, "global_step": 417408, "epoch": 2484} {"train_loss": -12.386059761047363, "global_step": 417409, "epoch": 2484} {"train_loss": -12.470462799072266, "global_step": 417410, "epoch": 2484} {"train_loss": -11.914076805114746, "global_step": 417411, "epoch": 2484} {"train_loss": -12.418983459472656, "global_step": 417412, "epoch": 2484} {"train_loss": -12.563201904296875, "global_step": 417413, "epoch": 2484} {"train_loss": -12.61342716217041, "global_step": 417414, "epoch": 2484} {"train_loss": -12.374519348144531, "global_step": 417415, "epoch": 2484} {"train_loss": -12.489810943603516, "global_step": 417416, "epoch": 2484} {"train_loss": -12.217082977294922, "global_step": 417417, "epoch": 2484} {"train_loss": -12.42645263671875, "global_step": 417418, "epoch": 2484} {"train_loss": -12.542119979858398, "global_step": 417419, "epoch": 2484} {"train_loss": -12.310291290283203, "global_step": 417420, "epoch": 2484} {"train_loss": -12.523565292358398, "global_step": 417421, "epoch": 2484} {"train_loss": -12.573930740356445, "global_step": 417422, "epoch": 2484} {"train_loss": -12.544797897338867, "global_step": 417423, "epoch": 2484} {"train_loss": -12.493947982788086, "global_step": 417424, "epoch": 2484} {"train_loss": -12.492557525634766, "global_step": 417425, "epoch": 2484} {"train_loss": -12.533712387084961, "global_step": 417426, "epoch": 2484} {"train_loss": -12.420150756835938, "global_step": 417427, "epoch": 2484} {"train_loss": -12.451774597167969, "global_step": 417428, "epoch": 2484} {"train_loss": -12.756569862365723, "global_step": 417429, "epoch": 2484} {"train_loss": -12.381208419799805, "global_step": 417430, "epoch": 2484} {"train_loss": -12.393975257873535, "global_step": 417431, "epoch": 2484} {"train_loss": -12.437204360961914, "global_step": 417432, "epoch": 2484} {"train_loss": -12.618996620178223, "global_step": 417433, "epoch": 2484} {"train_loss": -12.33475112915039, "global_step": 417434, "epoch": 2484} {"train_loss": -12.569031715393066, "global_step": 417435, "epoch": 2484} {"train_loss": -12.06594467163086, "global_step": 417436, "epoch": 2484} {"train_loss": -12.449235916137695, "global_step": 417437, "epoch": 2484} {"train_loss": -12.553359985351562, "global_step": 417438, "epoch": 2484} {"train_loss": -12.861154556274414, "global_step": 417439, "epoch": 2484} {"train_loss": -12.320186614990234, "global_step": 417440, "epoch": 2484} {"train_loss": -12.682504653930664, "global_step": 417441, "epoch": 2484} {"train_loss": -12.313610076904297, "global_step": 417442, "epoch": 2484} {"train_loss": -12.907821655273438, "global_step": 417443, "epoch": 2484} {"train_loss": -12.391717910766602, "global_step": 417444, "epoch": 2484} {"train_loss": -12.721622467041016, "global_step": 417445, "epoch": 2484} {"train_loss": -12.62171745300293, "global_step": 417446, "epoch": 2484} {"train_loss": -12.451334953308105, "global_step": 417447, "epoch": 2484} {"train_loss": -12.285430908203125, "global_step": 417448, "epoch": 2484} {"train_loss": -12.509977340698242, "global_step": 417449, "epoch": 2484} {"train_loss": -12.471260070800781, "global_step": 417450, "epoch": 2484} {"train_loss": -12.69506549835205, "global_step": 417451, "epoch": 2484} {"train_loss": -12.064606666564941, "global_step": 417452, "epoch": 2484} {"train_loss": -12.102533340454102, "global_step": 417453, "epoch": 2484} {"train_loss": -11.74267578125, "global_step": 417454, "epoch": 2484} {"train_loss": -12.760531425476074, "global_step": 417455, "epoch": 2484} {"train_loss": -11.858050346374512, "global_step": 417456, "epoch": 2484} {"train_loss": -12.514413833618164, "global_step": 417457, "epoch": 2484} {"train_loss": -12.027730941772461, "global_step": 417458, "epoch": 2484} {"train_loss": -11.670110702514648, "global_step": 417459, "epoch": 2484} {"train_loss": -11.724305152893066, "global_step": 417460, "epoch": 2484} {"train_loss": -11.840434074401855, "global_step": 417461, "epoch": 2484} {"train_loss": -11.321348190307617, "global_step": 417462, "epoch": 2484} {"train_loss": -11.702695846557617, "global_step": 417463, "epoch": 2484} {"train_loss": -11.525728225708008, "global_step": 417464, "epoch": 2484} {"train_loss": -11.54941177368164, "global_step": 417465, "epoch": 2484} {"train_loss": -11.722955703735352, "global_step": 417466, "epoch": 2484} {"train_loss": -11.565375328063965, "global_step": 417467, "epoch": 2484} {"train_loss": -12.023660659790039, "global_step": 417468, "epoch": 2484} {"train_loss": -10.929104804992676, "global_step": 417469, "epoch": 2484} {"train_loss": -10.88831901550293, "global_step": 417470, "epoch": 2484} {"train_loss": -11.466083526611328, "global_step": 417471, "epoch": 2484} {"train_loss": -9.620315551757812, "global_step": 417472, "epoch": 2484} {"train_loss": -10.366134643554688, "global_step": 417473, "epoch": 2484} {"train_loss": -11.330049514770508, "global_step": 417474, "epoch": 2484} {"train_loss": -9.75699234008789, "global_step": 417475, "epoch": 2484} {"train_loss": -10.643293380737305, "global_step": 417476, "epoch": 2484} {"train_loss": -9.616532325744629, "global_step": 417477, "epoch": 2484} {"train_loss": -9.569707870483398, "global_step": 417478, "epoch": 2484} {"train_loss": -11.983241762433734, "global_step": 417479, "epoch": 2484, "val_loss": 304766.09375} {"train_loss": -9.950504302978516, "global_step": 417480, "epoch": 2485} {"train_loss": -10.501874923706055, "global_step": 417481, "epoch": 2485} {"train_loss": -8.69672966003418, "global_step": 417482, "epoch": 2485} {"train_loss": -10.810470581054688, "global_step": 417483, "epoch": 2485} {"train_loss": -10.000993728637695, "global_step": 417484, "epoch": 2485} {"train_loss": -10.576340675354004, "global_step": 417485, "epoch": 2485} {"train_loss": -10.565225601196289, "global_step": 417486, "epoch": 2485} {"train_loss": -10.443925857543945, "global_step": 417487, "epoch": 2485} {"train_loss": -10.131206512451172, "global_step": 417488, "epoch": 2485} {"train_loss": -11.109516143798828, "global_step": 417489, "epoch": 2485} {"train_loss": -9.638421058654785, "global_step": 417490, "epoch": 2485} {"train_loss": -9.479637145996094, "global_step": 417491, "epoch": 2485} {"train_loss": -10.7516450881958, "global_step": 417492, "epoch": 2485} {"train_loss": -10.61444091796875, "global_step": 417493, "epoch": 2485} {"train_loss": -10.197671890258789, "global_step": 417494, "epoch": 2485} {"train_loss": -10.740478515625, "global_step": 417495, "epoch": 2485} {"train_loss": -11.222593307495117, "global_step": 417496, "epoch": 2485} {"train_loss": -10.514448165893555, "global_step": 417497, "epoch": 2485} {"train_loss": -11.729633331298828, "global_step": 417498, "epoch": 2485} {"train_loss": -10.850057601928711, "global_step": 417499, "epoch": 2485} {"train_loss": -11.859356880187988, "global_step": 417500, "epoch": 2485} {"train_loss": -10.980649948120117, "global_step": 417501, "epoch": 2485} {"train_loss": -11.256382942199707, "global_step": 417502, "epoch": 2485} {"train_loss": -11.630525588989258, "global_step": 417503, "epoch": 2485} {"train_loss": -11.327621459960938, "global_step": 417504, "epoch": 2485} {"train_loss": -11.342848777770996, "global_step": 417505, "epoch": 2485} {"train_loss": -11.963094711303711, "global_step": 417506, "epoch": 2485} {"train_loss": -11.195469856262207, "global_step": 417507, "epoch": 2485} {"train_loss": -11.952537536621094, "global_step": 417508, "epoch": 2485} {"train_loss": -11.352197647094727, "global_step": 417509, "epoch": 2485} {"train_loss": -11.714818954467773, "global_step": 417510, "epoch": 2485} {"train_loss": -11.688101768493652, "global_step": 417511, "epoch": 2485} {"train_loss": -10.999580383300781, "global_step": 417512, "epoch": 2485} {"train_loss": -11.679973602294922, "global_step": 417513, "epoch": 2485} {"train_loss": -11.702238082885742, "global_step": 417514, "epoch": 2485} {"train_loss": -11.348889350891113, "global_step": 417515, "epoch": 2485} {"train_loss": -11.803742408752441, "global_step": 417516, "epoch": 2485} {"train_loss": -11.859622955322266, "global_step": 417517, "epoch": 2485} {"train_loss": -11.083054542541504, "global_step": 417518, "epoch": 2485} {"train_loss": -11.993243217468262, "global_step": 417519, "epoch": 2485} {"train_loss": -11.993388175964355, "global_step": 417520, "epoch": 2485} {"train_loss": -11.412957191467285, "global_step": 417521, "epoch": 2485} {"train_loss": -12.22933292388916, "global_step": 417522, "epoch": 2485} {"train_loss": -11.97823429107666, "global_step": 417523, "epoch": 2485} {"train_loss": -12.061817169189453, "global_step": 417524, "epoch": 2485} {"train_loss": -11.79969596862793, "global_step": 417525, "epoch": 2485} {"train_loss": -12.215774536132812, "global_step": 417526, "epoch": 2485} {"train_loss": -11.559001922607422, "global_step": 417527, "epoch": 2485} {"train_loss": -12.354452133178711, "global_step": 417528, "epoch": 2485} {"train_loss": -11.710296630859375, "global_step": 417529, "epoch": 2485} {"train_loss": -12.05689811706543, "global_step": 417530, "epoch": 2485} {"train_loss": -11.817464828491211, "global_step": 417531, "epoch": 2485} {"train_loss": -12.011861801147461, "global_step": 417532, "epoch": 2485} {"train_loss": -12.077863693237305, "global_step": 417533, "epoch": 2485} {"train_loss": -11.629631996154785, "global_step": 417534, "epoch": 2485} {"train_loss": -12.10269546508789, "global_step": 417535, "epoch": 2485} {"train_loss": -11.888460159301758, "global_step": 417536, "epoch": 2485} {"train_loss": -11.824020385742188, "global_step": 417537, "epoch": 2485} {"train_loss": -11.958717346191406, "global_step": 417538, "epoch": 2485} {"train_loss": -11.805643081665039, "global_step": 417539, "epoch": 2485} {"train_loss": -11.148408889770508, "global_step": 417540, "epoch": 2485} {"train_loss": -12.10637092590332, "global_step": 417541, "epoch": 2485} {"train_loss": -11.06094741821289, "global_step": 417542, "epoch": 2485} {"train_loss": -11.943073272705078, "global_step": 417543, "epoch": 2485} {"train_loss": -11.299155235290527, "global_step": 417544, "epoch": 2485} {"train_loss": -12.052556991577148, "global_step": 417545, "epoch": 2485} {"train_loss": -12.005202293395996, "global_step": 417546, "epoch": 2485} {"train_loss": -11.922708511352539, "global_step": 417547, "epoch": 2485} {"train_loss": -11.810062408447266, "global_step": 417548, "epoch": 2485} {"train_loss": -12.07579231262207, "global_step": 417549, "epoch": 2485} {"train_loss": -12.061700820922852, "global_step": 417550, "epoch": 2485} {"train_loss": -12.219687461853027, "global_step": 417551, "epoch": 2485} {"train_loss": -12.311599731445312, "global_step": 417552, "epoch": 2485} {"train_loss": -12.353597640991211, "global_step": 417553, "epoch": 2485} {"train_loss": -12.417764663696289, "global_step": 417554, "epoch": 2485} {"train_loss": -12.34334945678711, "global_step": 417555, "epoch": 2485} {"train_loss": -12.310537338256836, "global_step": 417556, "epoch": 2485} {"train_loss": -12.466161727905273, "global_step": 417557, "epoch": 2485} {"train_loss": -12.290525436401367, "global_step": 417558, "epoch": 2485} {"train_loss": -12.48318862915039, "global_step": 417559, "epoch": 2485} {"train_loss": -12.551546096801758, "global_step": 417560, "epoch": 2485} {"train_loss": -12.52928352355957, "global_step": 417561, "epoch": 2485} {"train_loss": -12.220532417297363, "global_step": 417562, "epoch": 2485} {"train_loss": -12.476794242858887, "global_step": 417563, "epoch": 2485} {"train_loss": -12.425923347473145, "global_step": 417564, "epoch": 2485} {"train_loss": -12.589373588562012, "global_step": 417565, "epoch": 2485} {"train_loss": -12.34526252746582, "global_step": 417566, "epoch": 2485} {"train_loss": -12.623534202575684, "global_step": 417567, "epoch": 2485} {"train_loss": -12.66873836517334, "global_step": 417568, "epoch": 2485} {"train_loss": -12.582632064819336, "global_step": 417569, "epoch": 2485} {"train_loss": -12.657452583312988, "global_step": 417570, "epoch": 2485} {"train_loss": -12.660266876220703, "global_step": 417571, "epoch": 2485} {"train_loss": -12.486064910888672, "global_step": 417572, "epoch": 2485} {"train_loss": -12.703695297241211, "global_step": 417573, "epoch": 2485} {"train_loss": -12.609146118164062, "global_step": 417574, "epoch": 2485} {"train_loss": -12.475872993469238, "global_step": 417575, "epoch": 2485} {"train_loss": -12.593897819519043, "global_step": 417576, "epoch": 2485} {"train_loss": -12.525527954101562, "global_step": 417577, "epoch": 2485} {"train_loss": -12.766952514648438, "global_step": 417578, "epoch": 2485} {"train_loss": -12.587535858154297, "global_step": 417579, "epoch": 2485} {"train_loss": -12.819890975952148, "global_step": 417580, "epoch": 2485} {"train_loss": -12.671162605285645, "global_step": 417581, "epoch": 2485} {"train_loss": -12.82420825958252, "global_step": 417582, "epoch": 2485} {"train_loss": -12.671016693115234, "global_step": 417583, "epoch": 2485} {"train_loss": -12.78978157043457, "global_step": 417584, "epoch": 2485} {"train_loss": -12.643714904785156, "global_step": 417585, "epoch": 2485} {"train_loss": -12.744235038757324, "global_step": 417586, "epoch": 2485} {"train_loss": -12.734601974487305, "global_step": 417587, "epoch": 2485} {"train_loss": -12.723901748657227, "global_step": 417588, "epoch": 2485} {"train_loss": -12.594751358032227, "global_step": 417589, "epoch": 2485} {"train_loss": -12.414052963256836, "global_step": 417590, "epoch": 2485} {"train_loss": -12.495403289794922, "global_step": 417591, "epoch": 2485} {"train_loss": -12.449487686157227, "global_step": 417592, "epoch": 2485} {"train_loss": -12.40126895904541, "global_step": 417593, "epoch": 2485} {"train_loss": -12.622678756713867, "global_step": 417594, "epoch": 2485} {"train_loss": -12.603294372558594, "global_step": 417595, "epoch": 2485} {"train_loss": -12.72396469116211, "global_step": 417596, "epoch": 2485} {"train_loss": -12.331062316894531, "global_step": 417597, "epoch": 2485} {"train_loss": -12.39235782623291, "global_step": 417598, "epoch": 2485} {"train_loss": -12.753358840942383, "global_step": 417599, "epoch": 2485} {"train_loss": -12.586645126342773, "global_step": 417600, "epoch": 2485} {"train_loss": -12.366975784301758, "global_step": 417601, "epoch": 2485} {"train_loss": -12.482269287109375, "global_step": 417602, "epoch": 2485} {"train_loss": -12.605764389038086, "global_step": 417603, "epoch": 2485} {"train_loss": -11.861380577087402, "global_step": 417604, "epoch": 2485} {"train_loss": -12.332555770874023, "global_step": 417605, "epoch": 2485} {"train_loss": -12.550904273986816, "global_step": 417606, "epoch": 2485} {"train_loss": -12.450529098510742, "global_step": 417607, "epoch": 2485} {"train_loss": -12.192795753479004, "global_step": 417608, "epoch": 2485} {"train_loss": -12.582284927368164, "global_step": 417609, "epoch": 2485} {"train_loss": -12.019397735595703, "global_step": 417610, "epoch": 2485} {"train_loss": -12.071372985839844, "global_step": 417611, "epoch": 2485} {"train_loss": -12.608336448669434, "global_step": 417612, "epoch": 2485} {"train_loss": -12.38053035736084, "global_step": 417613, "epoch": 2485} {"train_loss": -11.996895790100098, "global_step": 417614, "epoch": 2485} {"train_loss": -12.523321151733398, "global_step": 417615, "epoch": 2485} {"train_loss": -11.713031768798828, "global_step": 417616, "epoch": 2485} {"train_loss": -12.345427513122559, "global_step": 417617, "epoch": 2485} {"train_loss": -12.15155029296875, "global_step": 417618, "epoch": 2485} {"train_loss": -11.496517181396484, "global_step": 417619, "epoch": 2485} {"train_loss": -12.287181854248047, "global_step": 417620, "epoch": 2485} {"train_loss": -11.878067016601562, "global_step": 417621, "epoch": 2485} {"train_loss": -11.959943771362305, "global_step": 417622, "epoch": 2485} {"train_loss": -11.890384674072266, "global_step": 417623, "epoch": 2485} {"train_loss": -12.581315040588379, "global_step": 417624, "epoch": 2485} {"train_loss": -11.189786911010742, "global_step": 417625, "epoch": 2485} {"train_loss": -12.397733688354492, "global_step": 417626, "epoch": 2485} {"train_loss": -11.675688743591309, "global_step": 417627, "epoch": 2485} {"train_loss": -12.192880630493164, "global_step": 417628, "epoch": 2485} {"train_loss": -11.262611389160156, "global_step": 417629, "epoch": 2485} {"train_loss": -12.183043479919434, "global_step": 417630, "epoch": 2485} {"train_loss": -11.600028038024902, "global_step": 417631, "epoch": 2485} {"train_loss": -12.253763198852539, "global_step": 417632, "epoch": 2485} {"train_loss": -11.391454696655273, "global_step": 417633, "epoch": 2485} {"train_loss": -12.024742126464844, "global_step": 417634, "epoch": 2485} {"train_loss": -11.5833740234375, "global_step": 417635, "epoch": 2485} {"train_loss": -11.064221382141113, "global_step": 417636, "epoch": 2485} {"train_loss": -12.023075103759766, "global_step": 417637, "epoch": 2485} {"train_loss": -11.645099639892578, "global_step": 417638, "epoch": 2485} {"train_loss": -11.808043479919434, "global_step": 417639, "epoch": 2485} {"train_loss": -11.011571884155273, "global_step": 417640, "epoch": 2485} {"train_loss": -12.146635055541992, "global_step": 417641, "epoch": 2485} {"train_loss": -10.864377975463867, "global_step": 417642, "epoch": 2485} {"train_loss": -11.6527099609375, "global_step": 417643, "epoch": 2485} {"train_loss": -11.293048858642578, "global_step": 417644, "epoch": 2485} {"train_loss": -11.11095905303955, "global_step": 417645, "epoch": 2485} {"train_loss": -11.402180671691895, "global_step": 417646, "epoch": 2485} {"train_loss": -11.871754737127395, "global_step": 417647, "epoch": 2485, "val_loss": 307092.25, "train_action_mse_error": 0.5527881979942322} {"train_loss": -12.135541915893555, "global_step": 417648, "epoch": 2486} {"train_loss": -11.76748275756836, "global_step": 417649, "epoch": 2486} {"train_loss": -11.8919677734375, "global_step": 417650, "epoch": 2486} {"train_loss": -12.204965591430664, "global_step": 417651, "epoch": 2486} {"train_loss": -11.577926635742188, "global_step": 417652, "epoch": 2486} {"train_loss": -11.795330047607422, "global_step": 417653, "epoch": 2486} {"train_loss": -11.776734352111816, "global_step": 417654, "epoch": 2486} {"train_loss": -12.310636520385742, "global_step": 417655, "epoch": 2486} {"train_loss": -11.488813400268555, "global_step": 417656, "epoch": 2486} {"train_loss": -12.35972785949707, "global_step": 417657, "epoch": 2486} {"train_loss": -12.157997131347656, "global_step": 417658, "epoch": 2486} {"train_loss": -11.9398193359375, "global_step": 417659, "epoch": 2486} {"train_loss": -11.897991180419922, "global_step": 417660, "epoch": 2486} {"train_loss": -12.045476913452148, "global_step": 417661, "epoch": 2486} {"train_loss": -12.039228439331055, "global_step": 417662, "epoch": 2486} {"train_loss": -12.042771339416504, "global_step": 417663, "epoch": 2486} {"train_loss": -11.860547065734863, "global_step": 417664, "epoch": 2486} {"train_loss": -12.207348823547363, "global_step": 417665, "epoch": 2486} {"train_loss": -12.06241226196289, "global_step": 417666, "epoch": 2486} {"train_loss": -12.1492919921875, "global_step": 417667, "epoch": 2486} {"train_loss": -12.021636009216309, "global_step": 417668, "epoch": 2486} {"train_loss": -11.869041442871094, "global_step": 417669, "epoch": 2486} {"train_loss": -12.043069839477539, "global_step": 417670, "epoch": 2486} {"train_loss": -11.509958267211914, "global_step": 417671, "epoch": 2486} {"train_loss": -11.546937942504883, "global_step": 417672, "epoch": 2486} {"train_loss": -12.056798934936523, "global_step": 417673, "epoch": 2486} {"train_loss": -12.095012664794922, "global_step": 417674, "epoch": 2486} {"train_loss": -12.249380111694336, "global_step": 417675, "epoch": 2486} {"train_loss": -12.185340881347656, "global_step": 417676, "epoch": 2486} {"train_loss": -12.297445297241211, "global_step": 417677, "epoch": 2486} {"train_loss": -11.990486145019531, "global_step": 417678, "epoch": 2486} {"train_loss": -12.162302017211914, "global_step": 417679, "epoch": 2486} {"train_loss": -12.47829532623291, "global_step": 417680, "epoch": 2486} {"train_loss": -12.089471817016602, "global_step": 417681, "epoch": 2486} {"train_loss": -12.121255874633789, "global_step": 417682, "epoch": 2486} {"train_loss": -12.118721961975098, "global_step": 417683, "epoch": 2486} {"train_loss": -12.421955108642578, "global_step": 417684, "epoch": 2486} {"train_loss": -12.248308181762695, "global_step": 417685, "epoch": 2486} {"train_loss": -12.595638275146484, "global_step": 417686, "epoch": 2486} {"train_loss": -12.140836715698242, "global_step": 417687, "epoch": 2486} {"train_loss": -12.442683219909668, "global_step": 417688, "epoch": 2486} {"train_loss": -12.222702980041504, "global_step": 417689, "epoch": 2486} {"train_loss": -12.208344459533691, "global_step": 417690, "epoch": 2486} {"train_loss": -12.441017150878906, "global_step": 417691, "epoch": 2486} {"train_loss": -12.062478065490723, "global_step": 417692, "epoch": 2486} {"train_loss": -12.452999114990234, "global_step": 417693, "epoch": 2486} {"train_loss": -12.272767066955566, "global_step": 417694, "epoch": 2486} {"train_loss": -12.141881942749023, "global_step": 417695, "epoch": 2486} {"train_loss": -12.237045288085938, "global_step": 417696, "epoch": 2486} {"train_loss": -12.318634033203125, "global_step": 417697, "epoch": 2486} {"train_loss": -12.16130542755127, "global_step": 417698, "epoch": 2486} {"train_loss": -12.302948951721191, "global_step": 417699, "epoch": 2486} {"train_loss": -12.350250244140625, "global_step": 417700, "epoch": 2486} {"train_loss": -12.522489547729492, "global_step": 417701, "epoch": 2486} {"train_loss": -12.38650131225586, "global_step": 417702, "epoch": 2486} {"train_loss": -12.398124694824219, "global_step": 417703, "epoch": 2486} {"train_loss": -12.560846328735352, "global_step": 417704, "epoch": 2486} {"train_loss": -12.409934997558594, "global_step": 417705, "epoch": 2486} {"train_loss": -12.700719833374023, "global_step": 417706, "epoch": 2486} {"train_loss": -12.655125617980957, "global_step": 417707, "epoch": 2486} {"train_loss": -12.416263580322266, "global_step": 417708, "epoch": 2486} {"train_loss": -12.705780982971191, "global_step": 417709, "epoch": 2486} {"train_loss": -12.742114067077637, "global_step": 417710, "epoch": 2486} {"train_loss": -12.64011001586914, "global_step": 417711, "epoch": 2486} {"train_loss": -12.63821792602539, "global_step": 417712, "epoch": 2486} {"train_loss": -12.384228706359863, "global_step": 417713, "epoch": 2486} {"train_loss": -12.47275161743164, "global_step": 417714, "epoch": 2486} {"train_loss": -12.375650405883789, "global_step": 417715, "epoch": 2486} {"train_loss": -12.664865493774414, "global_step": 417716, "epoch": 2486} {"train_loss": -12.854476928710938, "global_step": 417717, "epoch": 2486} {"train_loss": -12.353719711303711, "global_step": 417718, "epoch": 2486} {"train_loss": -12.531375885009766, "global_step": 417719, "epoch": 2486} {"train_loss": -12.407310485839844, "global_step": 417720, "epoch": 2486} {"train_loss": -12.391214370727539, "global_step": 417721, "epoch": 2486} {"train_loss": -12.401445388793945, "global_step": 417722, "epoch": 2486} {"train_loss": -12.203369140625, "global_step": 417723, "epoch": 2486} {"train_loss": -11.687044143676758, "global_step": 417724, "epoch": 2486} {"train_loss": -11.945378303527832, "global_step": 417725, "epoch": 2486} {"train_loss": -12.372041702270508, "global_step": 417726, "epoch": 2486} {"train_loss": -12.213436126708984, "global_step": 417727, "epoch": 2486} {"train_loss": -12.019424438476562, "global_step": 417728, "epoch": 2486} {"train_loss": -11.59322738647461, "global_step": 417729, "epoch": 2486} {"train_loss": -11.388489723205566, "global_step": 417730, "epoch": 2486} {"train_loss": -12.409507751464844, "global_step": 417731, "epoch": 2486} {"train_loss": -11.812755584716797, "global_step": 417732, "epoch": 2486} {"train_loss": -11.334806442260742, "global_step": 417733, "epoch": 2486} {"train_loss": -11.8785400390625, "global_step": 417734, "epoch": 2486} {"train_loss": -12.316097259521484, "global_step": 417735, "epoch": 2486} {"train_loss": -11.039385795593262, "global_step": 417736, "epoch": 2486} {"train_loss": -11.708272933959961, "global_step": 417737, "epoch": 2486} {"train_loss": -11.585982322692871, "global_step": 417738, "epoch": 2486} {"train_loss": -11.369264602661133, "global_step": 417739, "epoch": 2486} {"train_loss": -11.922616958618164, "global_step": 417740, "epoch": 2486} {"train_loss": -11.620061874389648, "global_step": 417741, "epoch": 2486} {"train_loss": -11.881729125976562, "global_step": 417742, "epoch": 2486} {"train_loss": -11.713483810424805, "global_step": 417743, "epoch": 2486} {"train_loss": -11.647628784179688, "global_step": 417744, "epoch": 2486} {"train_loss": -12.06549072265625, "global_step": 417745, "epoch": 2486} {"train_loss": -11.609380722045898, "global_step": 417746, "epoch": 2486} {"train_loss": -11.989511489868164, "global_step": 417747, "epoch": 2486} {"train_loss": -11.775880813598633, "global_step": 417748, "epoch": 2486} {"train_loss": -11.866508483886719, "global_step": 417749, "epoch": 2486} {"train_loss": -11.460872650146484, "global_step": 417750, "epoch": 2486} {"train_loss": -12.502543449401855, "global_step": 417751, "epoch": 2486} {"train_loss": -11.931072235107422, "global_step": 417752, "epoch": 2486} {"train_loss": -12.215004920959473, "global_step": 417753, "epoch": 2486} {"train_loss": -12.533287048339844, "global_step": 417754, "epoch": 2486} {"train_loss": -12.145463943481445, "global_step": 417755, "epoch": 2486} {"train_loss": -12.24062728881836, "global_step": 417756, "epoch": 2486} {"train_loss": -12.099985122680664, "global_step": 417757, "epoch": 2486} {"train_loss": -12.561321258544922, "global_step": 417758, "epoch": 2486} {"train_loss": -12.53109073638916, "global_step": 417759, "epoch": 2486} {"train_loss": -12.327338218688965, "global_step": 417760, "epoch": 2486} {"train_loss": -12.018634796142578, "global_step": 417761, "epoch": 2486} {"train_loss": -12.151834487915039, "global_step": 417762, "epoch": 2486} {"train_loss": -12.490774154663086, "global_step": 417763, "epoch": 2486} {"train_loss": -11.933809280395508, "global_step": 417764, "epoch": 2486} {"train_loss": -12.25932502746582, "global_step": 417765, "epoch": 2486} {"train_loss": -12.289632797241211, "global_step": 417766, "epoch": 2486} {"train_loss": -12.224020004272461, "global_step": 417767, "epoch": 2486} {"train_loss": -12.18224811553955, "global_step": 417768, "epoch": 2486} {"train_loss": -12.753997802734375, "global_step": 417769, "epoch": 2486} {"train_loss": -11.9870023727417, "global_step": 417770, "epoch": 2486} {"train_loss": -12.359404563903809, "global_step": 417771, "epoch": 2486} {"train_loss": -12.045988082885742, "global_step": 417772, "epoch": 2486} {"train_loss": -11.844466209411621, "global_step": 417773, "epoch": 2486} {"train_loss": -12.420350074768066, "global_step": 417774, "epoch": 2486} {"train_loss": -11.993842124938965, "global_step": 417775, "epoch": 2486} {"train_loss": -12.146333694458008, "global_step": 417776, "epoch": 2486} {"train_loss": -12.558022499084473, "global_step": 417777, "epoch": 2486} {"train_loss": -11.972188949584961, "global_step": 417778, "epoch": 2486} {"train_loss": -11.980951309204102, "global_step": 417779, "epoch": 2486} {"train_loss": -12.569451332092285, "global_step": 417780, "epoch": 2486} {"train_loss": -12.247366905212402, "global_step": 417781, "epoch": 2486} {"train_loss": -12.282821655273438, "global_step": 417782, "epoch": 2486} {"train_loss": -12.511796951293945, "global_step": 417783, "epoch": 2486} {"train_loss": -11.747169494628906, "global_step": 417784, "epoch": 2486} {"train_loss": -12.597458839416504, "global_step": 417785, "epoch": 2486} {"train_loss": -11.887849807739258, "global_step": 417786, "epoch": 2486} {"train_loss": -11.947410583496094, "global_step": 417787, "epoch": 2486} {"train_loss": -11.923868179321289, "global_step": 417788, "epoch": 2486} {"train_loss": -11.633955001831055, "global_step": 417789, "epoch": 2486} {"train_loss": -11.89484691619873, "global_step": 417790, "epoch": 2486} {"train_loss": -11.467879295349121, "global_step": 417791, "epoch": 2486} {"train_loss": -10.576878547668457, "global_step": 417792, "epoch": 2486} {"train_loss": -11.570321083068848, "global_step": 417793, "epoch": 2486} {"train_loss": -11.872146606445312, "global_step": 417794, "epoch": 2486} {"train_loss": -11.663657188415527, "global_step": 417795, "epoch": 2486} {"train_loss": -12.046087265014648, "global_step": 417796, "epoch": 2486} {"train_loss": -12.233316421508789, "global_step": 417797, "epoch": 2486} {"train_loss": -12.423545837402344, "global_step": 417798, "epoch": 2486} {"train_loss": -12.406343460083008, "global_step": 417799, "epoch": 2486} {"train_loss": -12.292387962341309, "global_step": 417800, "epoch": 2486} {"train_loss": -12.47629451751709, "global_step": 417801, "epoch": 2486} {"train_loss": -12.051451683044434, "global_step": 417802, "epoch": 2486} {"train_loss": -12.42082405090332, "global_step": 417803, "epoch": 2486} {"train_loss": -11.636438369750977, "global_step": 417804, "epoch": 2486} {"train_loss": -11.986316680908203, "global_step": 417805, "epoch": 2486} {"train_loss": -12.30261516571045, "global_step": 417806, "epoch": 2486} {"train_loss": -11.220540046691895, "global_step": 417807, "epoch": 2486} {"train_loss": -12.100057601928711, "global_step": 417808, "epoch": 2486} {"train_loss": -11.92094612121582, "global_step": 417809, "epoch": 2486} {"train_loss": -12.083159446716309, "global_step": 417810, "epoch": 2486} {"train_loss": -11.996073722839355, "global_step": 417811, "epoch": 2486} {"train_loss": -11.246620178222656, "global_step": 417812, "epoch": 2486} {"train_loss": -11.743046760559082, "global_step": 417813, "epoch": 2486} {"train_loss": -12.011537551879883, "global_step": 417814, "epoch": 2486} {"train_loss": -12.100971352486383, "global_step": 417815, "epoch": 2486, "val_loss": 304063.34375} {"train_loss": -11.596647262573242, "global_step": 417816, "epoch": 2487} {"train_loss": -10.323982238769531, "global_step": 417817, "epoch": 2487} {"train_loss": -11.442014694213867, "global_step": 417818, "epoch": 2487} {"train_loss": -10.272833824157715, "global_step": 417819, "epoch": 2487} {"train_loss": -11.482653617858887, "global_step": 417820, "epoch": 2487} {"train_loss": -11.020332336425781, "global_step": 417821, "epoch": 2487} {"train_loss": -11.43053150177002, "global_step": 417822, "epoch": 2487} {"train_loss": -11.195440292358398, "global_step": 417823, "epoch": 2487} {"train_loss": -10.693666458129883, "global_step": 417824, "epoch": 2487} {"train_loss": -11.67626667022705, "global_step": 417825, "epoch": 2487} {"train_loss": -9.734712600708008, "global_step": 417826, "epoch": 2487} {"train_loss": -11.307563781738281, "global_step": 417827, "epoch": 2487} {"train_loss": -10.993436813354492, "global_step": 417828, "epoch": 2487} {"train_loss": -11.301210403442383, "global_step": 417829, "epoch": 2487} {"train_loss": -11.063858032226562, "global_step": 417830, "epoch": 2487} {"train_loss": -11.676702499389648, "global_step": 417831, "epoch": 2487} {"train_loss": -10.813404083251953, "global_step": 417832, "epoch": 2487} {"train_loss": -11.381660461425781, "global_step": 417833, "epoch": 2487} {"train_loss": -10.90732479095459, "global_step": 417834, "epoch": 2487} {"train_loss": -11.98724365234375, "global_step": 417835, "epoch": 2487} {"train_loss": -11.610624313354492, "global_step": 417836, "epoch": 2487} {"train_loss": -12.082688331604004, "global_step": 417837, "epoch": 2487} {"train_loss": -11.620136260986328, "global_step": 417838, "epoch": 2487} {"train_loss": -12.086244583129883, "global_step": 417839, "epoch": 2487} {"train_loss": -11.229280471801758, "global_step": 417840, "epoch": 2487} {"train_loss": -11.87421989440918, "global_step": 417841, "epoch": 2487} {"train_loss": -11.896117210388184, "global_step": 417842, "epoch": 2487} {"train_loss": -11.9862060546875, "global_step": 417843, "epoch": 2487} {"train_loss": -12.019879341125488, "global_step": 417844, "epoch": 2487} {"train_loss": -11.84323501586914, "global_step": 417845, "epoch": 2487} {"train_loss": -11.637784957885742, "global_step": 417846, "epoch": 2487} {"train_loss": -12.069982528686523, "global_step": 417847, "epoch": 2487} {"train_loss": -11.696978569030762, "global_step": 417848, "epoch": 2487} {"train_loss": -12.02064323425293, "global_step": 417849, "epoch": 2487} {"train_loss": -11.266980171203613, "global_step": 417850, "epoch": 2487} {"train_loss": -11.200859069824219, "global_step": 417851, "epoch": 2487} {"train_loss": -12.057223320007324, "global_step": 417852, "epoch": 2487} {"train_loss": -11.626707077026367, "global_step": 417853, "epoch": 2487} {"train_loss": -11.886564254760742, "global_step": 417854, "epoch": 2487} {"train_loss": -11.952722549438477, "global_step": 417855, "epoch": 2487} {"train_loss": -11.46727180480957, "global_step": 417856, "epoch": 2487} {"train_loss": -11.648313522338867, "global_step": 417857, "epoch": 2487} {"train_loss": -11.566694259643555, "global_step": 417858, "epoch": 2487} {"train_loss": -10.443279266357422, "global_step": 417859, "epoch": 2487} {"train_loss": -12.300113677978516, "global_step": 417860, "epoch": 2487} {"train_loss": -10.79013442993164, "global_step": 417861, "epoch": 2487} {"train_loss": -11.750471115112305, "global_step": 417862, "epoch": 2487} {"train_loss": -11.570455551147461, "global_step": 417863, "epoch": 2487} {"train_loss": -11.866127014160156, "global_step": 417864, "epoch": 2487} {"train_loss": -11.751067161560059, "global_step": 417865, "epoch": 2487} {"train_loss": -11.867288589477539, "global_step": 417866, "epoch": 2487} {"train_loss": -11.921363830566406, "global_step": 417867, "epoch": 2487} {"train_loss": -12.506576538085938, "global_step": 417868, "epoch": 2487} {"train_loss": -12.04464340209961, "global_step": 417869, "epoch": 2487} {"train_loss": -12.223289489746094, "global_step": 417870, "epoch": 2487} {"train_loss": -12.406408309936523, "global_step": 417871, "epoch": 2487} {"train_loss": -12.439599990844727, "global_step": 417872, "epoch": 2487} {"train_loss": -12.521554946899414, "global_step": 417873, "epoch": 2487} {"train_loss": -12.470399856567383, "global_step": 417874, "epoch": 2487} {"train_loss": -12.286712646484375, "global_step": 417875, "epoch": 2487} {"train_loss": -12.484392166137695, "global_step": 417876, "epoch": 2487} {"train_loss": -12.476346015930176, "global_step": 417877, "epoch": 2487} {"train_loss": -12.325540542602539, "global_step": 417878, "epoch": 2487} {"train_loss": -12.489282608032227, "global_step": 417879, "epoch": 2487} {"train_loss": -12.395686149597168, "global_step": 417880, "epoch": 2487} {"train_loss": -12.406977653503418, "global_step": 417881, "epoch": 2487} {"train_loss": -12.490226745605469, "global_step": 417882, "epoch": 2487} {"train_loss": -12.323570251464844, "global_step": 417883, "epoch": 2487} {"train_loss": -12.556615829467773, "global_step": 417884, "epoch": 2487} {"train_loss": -12.360151290893555, "global_step": 417885, "epoch": 2487} {"train_loss": -12.718183517456055, "global_step": 417886, "epoch": 2487} {"train_loss": -12.608752250671387, "global_step": 417887, "epoch": 2487} {"train_loss": -12.617795944213867, "global_step": 417888, "epoch": 2487} {"train_loss": -12.53030014038086, "global_step": 417889, "epoch": 2487} {"train_loss": -12.45423698425293, "global_step": 417890, "epoch": 2487} {"train_loss": -12.49410629272461, "global_step": 417891, "epoch": 2487} {"train_loss": -12.499069213867188, "global_step": 417892, "epoch": 2487} {"train_loss": -12.493322372436523, "global_step": 417893, "epoch": 2487} {"train_loss": -12.358522415161133, "global_step": 417894, "epoch": 2487} {"train_loss": -12.335471153259277, "global_step": 417895, "epoch": 2487} {"train_loss": -12.599380493164062, "global_step": 417896, "epoch": 2487} {"train_loss": -12.348640441894531, "global_step": 417897, "epoch": 2487} {"train_loss": -12.492321968078613, "global_step": 417898, "epoch": 2487} {"train_loss": -12.519712448120117, "global_step": 417899, "epoch": 2487} {"train_loss": -12.36746597290039, "global_step": 417900, "epoch": 2487} {"train_loss": -12.554618835449219, "global_step": 417901, "epoch": 2487} {"train_loss": -12.696725845336914, "global_step": 417902, "epoch": 2487} {"train_loss": -12.664363861083984, "global_step": 417903, "epoch": 2487} {"train_loss": -12.587013244628906, "global_step": 417904, "epoch": 2487} {"train_loss": -12.562847137451172, "global_step": 417905, "epoch": 2487} {"train_loss": -12.485798835754395, "global_step": 417906, "epoch": 2487} {"train_loss": -12.822025299072266, "global_step": 417907, "epoch": 2487} {"train_loss": -12.651022911071777, "global_step": 417908, "epoch": 2487} {"train_loss": -12.644996643066406, "global_step": 417909, "epoch": 2487} {"train_loss": -12.497369766235352, "global_step": 417910, "epoch": 2487} {"train_loss": -12.705026626586914, "global_step": 417911, "epoch": 2487} {"train_loss": -12.561967849731445, "global_step": 417912, "epoch": 2487} {"train_loss": -12.910645484924316, "global_step": 417913, "epoch": 2487} {"train_loss": -12.737003326416016, "global_step": 417914, "epoch": 2487} {"train_loss": -12.417381286621094, "global_step": 417915, "epoch": 2487} {"train_loss": -12.612338066101074, "global_step": 417916, "epoch": 2487} {"train_loss": -12.708036422729492, "global_step": 417917, "epoch": 2487} {"train_loss": -12.596620559692383, "global_step": 417918, "epoch": 2487} {"train_loss": -12.3636474609375, "global_step": 417919, "epoch": 2487} {"train_loss": -12.565536499023438, "global_step": 417920, "epoch": 2487} {"train_loss": -12.564241409301758, "global_step": 417921, "epoch": 2487} {"train_loss": -12.662734985351562, "global_step": 417922, "epoch": 2487} {"train_loss": -12.539219856262207, "global_step": 417923, "epoch": 2487} {"train_loss": -12.796655654907227, "global_step": 417924, "epoch": 2487} {"train_loss": -12.43127727508545, "global_step": 417925, "epoch": 2487} {"train_loss": -12.461882591247559, "global_step": 417926, "epoch": 2487} {"train_loss": -12.624853134155273, "global_step": 417927, "epoch": 2487} {"train_loss": -12.25024700164795, "global_step": 417928, "epoch": 2487} {"train_loss": -12.726318359375, "global_step": 417929, "epoch": 2487} {"train_loss": -12.580543518066406, "global_step": 417930, "epoch": 2487} {"train_loss": -12.312877655029297, "global_step": 417931, "epoch": 2487} {"train_loss": -12.077716827392578, "global_step": 417932, "epoch": 2487} {"train_loss": -12.437026977539062, "global_step": 417933, "epoch": 2487} {"train_loss": -12.747612953186035, "global_step": 417934, "epoch": 2487} {"train_loss": -12.48845100402832, "global_step": 417935, "epoch": 2487} {"train_loss": -12.35081958770752, "global_step": 417936, "epoch": 2487} {"train_loss": -12.561025619506836, "global_step": 417937, "epoch": 2487} {"train_loss": -12.714258193969727, "global_step": 417938, "epoch": 2487} {"train_loss": -12.431449890136719, "global_step": 417939, "epoch": 2487} {"train_loss": -12.453948974609375, "global_step": 417940, "epoch": 2487} {"train_loss": -11.978099822998047, "global_step": 417941, "epoch": 2487} {"train_loss": -11.717653274536133, "global_step": 417942, "epoch": 2487} {"train_loss": -11.799236297607422, "global_step": 417943, "epoch": 2487} {"train_loss": -12.884553909301758, "global_step": 417944, "epoch": 2487} {"train_loss": -11.822286605834961, "global_step": 417945, "epoch": 2487} {"train_loss": -11.2340087890625, "global_step": 417946, "epoch": 2487} {"train_loss": -11.47819709777832, "global_step": 417947, "epoch": 2487} {"train_loss": -10.035799980163574, "global_step": 417948, "epoch": 2487} {"train_loss": -10.300947189331055, "global_step": 417949, "epoch": 2487} {"train_loss": -11.102941513061523, "global_step": 417950, "epoch": 2487} {"train_loss": -12.046009063720703, "global_step": 417951, "epoch": 2487} {"train_loss": -9.645294189453125, "global_step": 417952, "epoch": 2487} {"train_loss": -11.909185409545898, "global_step": 417953, "epoch": 2487} {"train_loss": -10.98906135559082, "global_step": 417954, "epoch": 2487} {"train_loss": -11.241496086120605, "global_step": 417955, "epoch": 2487} {"train_loss": -11.702467918395996, "global_step": 417956, "epoch": 2487} {"train_loss": -10.903800010681152, "global_step": 417957, "epoch": 2487} {"train_loss": -11.01350212097168, "global_step": 417958, "epoch": 2487} {"train_loss": -11.85906982421875, "global_step": 417959, "epoch": 2487} {"train_loss": -12.174057006835938, "global_step": 417960, "epoch": 2487} {"train_loss": -10.812850952148438, "global_step": 417961, "epoch": 2487} {"train_loss": -11.481935501098633, "global_step": 417962, "epoch": 2487} {"train_loss": -11.32165813446045, "global_step": 417963, "epoch": 2487} {"train_loss": -11.719799041748047, "global_step": 417964, "epoch": 2487} {"train_loss": -11.483053207397461, "global_step": 417965, "epoch": 2487} {"train_loss": -11.514878273010254, "global_step": 417966, "epoch": 2487} {"train_loss": -12.087224006652832, "global_step": 417967, "epoch": 2487} {"train_loss": -11.530653953552246, "global_step": 417968, "epoch": 2487} {"train_loss": -11.557760238647461, "global_step": 417969, "epoch": 2487} {"train_loss": -11.188017845153809, "global_step": 417970, "epoch": 2487} {"train_loss": -12.094463348388672, "global_step": 417971, "epoch": 2487} {"train_loss": -11.056541442871094, "global_step": 417972, "epoch": 2487} {"train_loss": -12.075491905212402, "global_step": 417973, "epoch": 2487} {"train_loss": -11.698781967163086, "global_step": 417974, "epoch": 2487} {"train_loss": -11.621034622192383, "global_step": 417975, "epoch": 2487} {"train_loss": -12.142742156982422, "global_step": 417976, "epoch": 2487} {"train_loss": -11.510333061218262, "global_step": 417977, "epoch": 2487} {"train_loss": -11.926643371582031, "global_step": 417978, "epoch": 2487} {"train_loss": -11.95681095123291, "global_step": 417979, "epoch": 2487} {"train_loss": -12.010387420654297, "global_step": 417980, "epoch": 2487} {"train_loss": -11.946226119995117, "global_step": 417981, "epoch": 2487} {"train_loss": -12.227848052978516, "global_step": 417982, "epoch": 2487} {"train_loss": -11.946836295581999, "global_step": 417983, "epoch": 2487, "val_loss": 303146.3125} {"train_loss": -12.398128509521484, "global_step": 417984, "epoch": 2488} {"train_loss": -11.890222549438477, "global_step": 417985, "epoch": 2488} {"train_loss": -11.974080085754395, "global_step": 417986, "epoch": 2488} {"train_loss": -12.270830154418945, "global_step": 417987, "epoch": 2488} {"train_loss": -12.287213325500488, "global_step": 417988, "epoch": 2488} {"train_loss": -11.88039779663086, "global_step": 417989, "epoch": 2488} {"train_loss": -12.035867691040039, "global_step": 417990, "epoch": 2488} {"train_loss": -11.83753776550293, "global_step": 417991, "epoch": 2488} {"train_loss": -11.710012435913086, "global_step": 417992, "epoch": 2488} {"train_loss": -12.251230239868164, "global_step": 417993, "epoch": 2488} {"train_loss": -11.890487670898438, "global_step": 417994, "epoch": 2488} {"train_loss": -12.151972770690918, "global_step": 417995, "epoch": 2488} {"train_loss": -11.583571434020996, "global_step": 417996, "epoch": 2488} {"train_loss": -11.957096099853516, "global_step": 417997, "epoch": 2488} {"train_loss": -11.469717025756836, "global_step": 417998, "epoch": 2488} {"train_loss": -12.272640228271484, "global_step": 417999, "epoch": 2488} {"train_loss": -10.819744110107422, "global_step": 418000, "epoch": 2488} {"train_loss": -12.06475830078125, "global_step": 418001, "epoch": 2488} {"train_loss": -10.680692672729492, "global_step": 418002, "epoch": 2488} {"train_loss": -12.129472732543945, "global_step": 418003, "epoch": 2488} {"train_loss": -11.140119552612305, "global_step": 418004, "epoch": 2488} {"train_loss": -11.369976043701172, "global_step": 418005, "epoch": 2488} {"train_loss": -12.129101753234863, "global_step": 418006, "epoch": 2488} {"train_loss": -11.736673355102539, "global_step": 418007, "epoch": 2488} {"train_loss": -12.336828231811523, "global_step": 418008, "epoch": 2488} {"train_loss": -11.589673042297363, "global_step": 418009, "epoch": 2488} {"train_loss": -11.737820625305176, "global_step": 418010, "epoch": 2488} {"train_loss": -12.223991394042969, "global_step": 418011, "epoch": 2488} {"train_loss": -11.639476776123047, "global_step": 418012, "epoch": 2488} {"train_loss": -12.496330261230469, "global_step": 418013, "epoch": 2488} {"train_loss": -11.279241561889648, "global_step": 418014, "epoch": 2488} {"train_loss": -12.267803192138672, "global_step": 418015, "epoch": 2488} {"train_loss": -11.450179100036621, "global_step": 418016, "epoch": 2488} {"train_loss": -11.679769515991211, "global_step": 418017, "epoch": 2488} {"train_loss": -11.896856307983398, "global_step": 418018, "epoch": 2488} {"train_loss": -11.439340591430664, "global_step": 418019, "epoch": 2488} {"train_loss": -12.251011848449707, "global_step": 418020, "epoch": 2488} {"train_loss": -11.821346282958984, "global_step": 418021, "epoch": 2488} {"train_loss": -12.025171279907227, "global_step": 418022, "epoch": 2488} {"train_loss": -12.365504264831543, "global_step": 418023, "epoch": 2488} {"train_loss": -12.010284423828125, "global_step": 418024, "epoch": 2488} {"train_loss": -12.373163223266602, "global_step": 418025, "epoch": 2488} {"train_loss": -11.955187797546387, "global_step": 418026, "epoch": 2488} {"train_loss": -12.467194557189941, "global_step": 418027, "epoch": 2488} {"train_loss": -12.346435546875, "global_step": 418028, "epoch": 2488} {"train_loss": -12.452286720275879, "global_step": 418029, "epoch": 2488} {"train_loss": -12.380857467651367, "global_step": 418030, "epoch": 2488} {"train_loss": -12.199593544006348, "global_step": 418031, "epoch": 2488} {"train_loss": -12.389022827148438, "global_step": 418032, "epoch": 2488} {"train_loss": -12.189250946044922, "global_step": 418033, "epoch": 2488} {"train_loss": -12.672603607177734, "global_step": 418034, "epoch": 2488} {"train_loss": -12.366355895996094, "global_step": 418035, "epoch": 2488} {"train_loss": -12.267370223999023, "global_step": 418036, "epoch": 2488} {"train_loss": -12.552313804626465, "global_step": 418037, "epoch": 2488} {"train_loss": -12.330409049987793, "global_step": 418038, "epoch": 2488} {"train_loss": -12.78468132019043, "global_step": 418039, "epoch": 2488} {"train_loss": -12.466300964355469, "global_step": 418040, "epoch": 2488} {"train_loss": -12.610759735107422, "global_step": 418041, "epoch": 2488} {"train_loss": -12.425796508789062, "global_step": 418042, "epoch": 2488} {"train_loss": -12.607064247131348, "global_step": 418043, "epoch": 2488} {"train_loss": -12.532538414001465, "global_step": 418044, "epoch": 2488} {"train_loss": -12.492935180664062, "global_step": 418045, "epoch": 2488} {"train_loss": -12.695699691772461, "global_step": 418046, "epoch": 2488} {"train_loss": -12.236730575561523, "global_step": 418047, "epoch": 2488} {"train_loss": -12.807044982910156, "global_step": 418048, "epoch": 2488} {"train_loss": -12.505607604980469, "global_step": 418049, "epoch": 2488} {"train_loss": -12.497355461120605, "global_step": 418050, "epoch": 2488} {"train_loss": -12.68538761138916, "global_step": 418051, "epoch": 2488} {"train_loss": -12.541616439819336, "global_step": 418052, "epoch": 2488} {"train_loss": -12.647812843322754, "global_step": 418053, "epoch": 2488} {"train_loss": -12.431417465209961, "global_step": 418054, "epoch": 2488} {"train_loss": -12.548126220703125, "global_step": 418055, "epoch": 2488} {"train_loss": -12.469708442687988, "global_step": 418056, "epoch": 2488} {"train_loss": -12.488956451416016, "global_step": 418057, "epoch": 2488} {"train_loss": -12.270149230957031, "global_step": 418058, "epoch": 2488} {"train_loss": -12.760618209838867, "global_step": 418059, "epoch": 2488} {"train_loss": -12.345630645751953, "global_step": 418060, "epoch": 2488} {"train_loss": -12.680678367614746, "global_step": 418061, "epoch": 2488} {"train_loss": -12.380126953125, "global_step": 418062, "epoch": 2488} {"train_loss": -12.463907241821289, "global_step": 418063, "epoch": 2488} {"train_loss": -12.631017684936523, "global_step": 418064, "epoch": 2488} {"train_loss": -12.124584197998047, "global_step": 418065, "epoch": 2488} {"train_loss": -12.63541030883789, "global_step": 418066, "epoch": 2488} {"train_loss": -12.042069435119629, "global_step": 418067, "epoch": 2488} {"train_loss": -12.236937522888184, "global_step": 418068, "epoch": 2488} {"train_loss": -12.468950271606445, "global_step": 418069, "epoch": 2488} {"train_loss": -11.829732894897461, "global_step": 418070, "epoch": 2488} {"train_loss": -11.86198616027832, "global_step": 418071, "epoch": 2488} {"train_loss": -12.488927841186523, "global_step": 418072, "epoch": 2488} {"train_loss": -11.531267166137695, "global_step": 418073, "epoch": 2488} {"train_loss": -12.198358535766602, "global_step": 418074, "epoch": 2488} {"train_loss": -12.521668434143066, "global_step": 418075, "epoch": 2488} {"train_loss": -11.74661636352539, "global_step": 418076, "epoch": 2488} {"train_loss": -11.950157165527344, "global_step": 418077, "epoch": 2488} {"train_loss": -11.296632766723633, "global_step": 418078, "epoch": 2488} {"train_loss": -12.377845764160156, "global_step": 418079, "epoch": 2488} {"train_loss": -11.471961975097656, "global_step": 418080, "epoch": 2488} {"train_loss": -11.157479286193848, "global_step": 418081, "epoch": 2488} {"train_loss": -11.433320045471191, "global_step": 418082, "epoch": 2488} {"train_loss": -12.567557334899902, "global_step": 418083, "epoch": 2488} {"train_loss": -12.34399127960205, "global_step": 418084, "epoch": 2488} {"train_loss": -12.293149948120117, "global_step": 418085, "epoch": 2488} {"train_loss": -11.869093894958496, "global_step": 418086, "epoch": 2488} {"train_loss": -12.08253288269043, "global_step": 418087, "epoch": 2488} {"train_loss": -12.08400821685791, "global_step": 418088, "epoch": 2488} {"train_loss": -12.135778427124023, "global_step": 418089, "epoch": 2488} {"train_loss": -12.093521118164062, "global_step": 418090, "epoch": 2488} {"train_loss": -11.54707145690918, "global_step": 418091, "epoch": 2488} {"train_loss": -12.47566032409668, "global_step": 418092, "epoch": 2488} {"train_loss": -11.819416999816895, "global_step": 418093, "epoch": 2488} {"train_loss": -12.271759033203125, "global_step": 418094, "epoch": 2488} {"train_loss": -11.884122848510742, "global_step": 418095, "epoch": 2488} {"train_loss": -12.149665832519531, "global_step": 418096, "epoch": 2488} {"train_loss": -12.329957962036133, "global_step": 418097, "epoch": 2488} {"train_loss": -11.385082244873047, "global_step": 418098, "epoch": 2488} {"train_loss": -12.288383483886719, "global_step": 418099, "epoch": 2488} {"train_loss": -11.870662689208984, "global_step": 418100, "epoch": 2488} {"train_loss": -12.1659574508667, "global_step": 418101, "epoch": 2488} {"train_loss": -12.081226348876953, "global_step": 418102, "epoch": 2488} {"train_loss": -11.888160705566406, "global_step": 418103, "epoch": 2488} {"train_loss": -12.189184188842773, "global_step": 418104, "epoch": 2488} {"train_loss": -12.223282814025879, "global_step": 418105, "epoch": 2488} {"train_loss": -10.805466651916504, "global_step": 418106, "epoch": 2488} {"train_loss": -12.26671028137207, "global_step": 418107, "epoch": 2488} {"train_loss": -10.879236221313477, "global_step": 418108, "epoch": 2488} {"train_loss": -11.602899551391602, "global_step": 418109, "epoch": 2488} {"train_loss": -12.18008804321289, "global_step": 418110, "epoch": 2488} {"train_loss": -11.230300903320312, "global_step": 418111, "epoch": 2488} {"train_loss": -11.904232025146484, "global_step": 418112, "epoch": 2488} {"train_loss": -11.364185333251953, "global_step": 418113, "epoch": 2488} {"train_loss": -11.823765754699707, "global_step": 418114, "epoch": 2488} {"train_loss": -12.140413284301758, "global_step": 418115, "epoch": 2488} {"train_loss": -12.056472778320312, "global_step": 418116, "epoch": 2488} {"train_loss": -12.203493118286133, "global_step": 418117, "epoch": 2488} {"train_loss": -11.677642822265625, "global_step": 418118, "epoch": 2488} {"train_loss": -11.999969482421875, "global_step": 418119, "epoch": 2488} {"train_loss": -11.955684661865234, "global_step": 418120, "epoch": 2488} {"train_loss": -12.56340503692627, "global_step": 418121, "epoch": 2488} {"train_loss": -12.181131362915039, "global_step": 418122, "epoch": 2488} {"train_loss": -12.0889892578125, "global_step": 418123, "epoch": 2488} {"train_loss": -12.076833724975586, "global_step": 418124, "epoch": 2488} {"train_loss": -12.55794620513916, "global_step": 418125, "epoch": 2488} {"train_loss": -12.348368644714355, "global_step": 418126, "epoch": 2488} {"train_loss": -12.08708381652832, "global_step": 418127, "epoch": 2488} {"train_loss": -12.056255340576172, "global_step": 418128, "epoch": 2488} {"train_loss": -12.260200500488281, "global_step": 418129, "epoch": 2488} {"train_loss": -12.23416519165039, "global_step": 418130, "epoch": 2488} {"train_loss": -12.084477424621582, "global_step": 418131, "epoch": 2488} {"train_loss": -12.469350814819336, "global_step": 418132, "epoch": 2488} {"train_loss": -11.784027099609375, "global_step": 418133, "epoch": 2488} {"train_loss": -12.363713264465332, "global_step": 418134, "epoch": 2488} {"train_loss": -12.280399322509766, "global_step": 418135, "epoch": 2488} {"train_loss": -12.308570861816406, "global_step": 418136, "epoch": 2488} {"train_loss": -12.37729549407959, "global_step": 418137, "epoch": 2488} {"train_loss": -12.447061538696289, "global_step": 418138, "epoch": 2488} {"train_loss": -12.024517059326172, "global_step": 418139, "epoch": 2488} {"train_loss": -12.417671203613281, "global_step": 418140, "epoch": 2488} {"train_loss": -12.663789749145508, "global_step": 418141, "epoch": 2488} {"train_loss": -12.2958984375, "global_step": 418142, "epoch": 2488} {"train_loss": -12.36077880859375, "global_step": 418143, "epoch": 2488} {"train_loss": -12.142004013061523, "global_step": 418144, "epoch": 2488} {"train_loss": -12.234495162963867, "global_step": 418145, "epoch": 2488} {"train_loss": -12.047595977783203, "global_step": 418146, "epoch": 2488} {"train_loss": -12.192203521728516, "global_step": 418147, "epoch": 2488} {"train_loss": -12.040014266967773, "global_step": 418148, "epoch": 2488} {"train_loss": -12.554080963134766, "global_step": 418149, "epoch": 2488} {"train_loss": -12.041421890258789, "global_step": 418150, "epoch": 2488} {"train_loss": -12.110999033564614, "global_step": 418151, "epoch": 2488, "val_loss": 307382.625} {"train_loss": -12.655492782592773, "global_step": 418152, "epoch": 2489} {"train_loss": -12.139137268066406, "global_step": 418153, "epoch": 2489} {"train_loss": -12.7612943649292, "global_step": 418154, "epoch": 2489} {"train_loss": -12.089693069458008, "global_step": 418155, "epoch": 2489} {"train_loss": -12.741450309753418, "global_step": 418156, "epoch": 2489} {"train_loss": -12.426229476928711, "global_step": 418157, "epoch": 2489} {"train_loss": -12.377684593200684, "global_step": 418158, "epoch": 2489} {"train_loss": -12.520231246948242, "global_step": 418159, "epoch": 2489} {"train_loss": -12.37270736694336, "global_step": 418160, "epoch": 2489} {"train_loss": -12.373026847839355, "global_step": 418161, "epoch": 2489} {"train_loss": -12.147801399230957, "global_step": 418162, "epoch": 2489} {"train_loss": -12.719919204711914, "global_step": 418163, "epoch": 2489} {"train_loss": -12.035662651062012, "global_step": 418164, "epoch": 2489} {"train_loss": -12.339345932006836, "global_step": 418165, "epoch": 2489} {"train_loss": -12.45125961303711, "global_step": 418166, "epoch": 2489} {"train_loss": -12.295146942138672, "global_step": 418167, "epoch": 2489} {"train_loss": -12.243552207946777, "global_step": 418168, "epoch": 2489} {"train_loss": -12.604266166687012, "global_step": 418169, "epoch": 2489} {"train_loss": -11.931243896484375, "global_step": 418170, "epoch": 2489} {"train_loss": -12.083229064941406, "global_step": 418171, "epoch": 2489} {"train_loss": -12.738075256347656, "global_step": 418172, "epoch": 2489} {"train_loss": -12.375032424926758, "global_step": 418173, "epoch": 2489} {"train_loss": -12.51124382019043, "global_step": 418174, "epoch": 2489} {"train_loss": -12.067450523376465, "global_step": 418175, "epoch": 2489} {"train_loss": -12.585981369018555, "global_step": 418176, "epoch": 2489} {"train_loss": -12.107114791870117, "global_step": 418177, "epoch": 2489} {"train_loss": -12.152059555053711, "global_step": 418178, "epoch": 2489} {"train_loss": -12.169744491577148, "global_step": 418179, "epoch": 2489} {"train_loss": -12.42757797241211, "global_step": 418180, "epoch": 2489} {"train_loss": -12.314840316772461, "global_step": 418181, "epoch": 2489} {"train_loss": -11.347488403320312, "global_step": 418182, "epoch": 2489} {"train_loss": -11.875177383422852, "global_step": 418183, "epoch": 2489} {"train_loss": -12.593612670898438, "global_step": 418184, "epoch": 2489} {"train_loss": -12.674285888671875, "global_step": 418185, "epoch": 2489} {"train_loss": -11.387838363647461, "global_step": 418186, "epoch": 2489} {"train_loss": -12.499700546264648, "global_step": 418187, "epoch": 2489} {"train_loss": -12.259631156921387, "global_step": 418188, "epoch": 2489} {"train_loss": -11.909018516540527, "global_step": 418189, "epoch": 2489} {"train_loss": -12.329748153686523, "global_step": 418190, "epoch": 2489} {"train_loss": -12.48720932006836, "global_step": 418191, "epoch": 2489} {"train_loss": -12.306211471557617, "global_step": 418192, "epoch": 2489} {"train_loss": -12.616508483886719, "global_step": 418193, "epoch": 2489} {"train_loss": -12.435648918151855, "global_step": 418194, "epoch": 2489} {"train_loss": -12.599740982055664, "global_step": 418195, "epoch": 2489} {"train_loss": -12.53895092010498, "global_step": 418196, "epoch": 2489} {"train_loss": -12.166540145874023, "global_step": 418197, "epoch": 2489} {"train_loss": -12.534049987792969, "global_step": 418198, "epoch": 2489} {"train_loss": -12.300785064697266, "global_step": 418199, "epoch": 2489} {"train_loss": -12.450541496276855, "global_step": 418200, "epoch": 2489} {"train_loss": -12.463111877441406, "global_step": 418201, "epoch": 2489} {"train_loss": -12.440267562866211, "global_step": 418202, "epoch": 2489} {"train_loss": -12.493539810180664, "global_step": 418203, "epoch": 2489} {"train_loss": -12.456225395202637, "global_step": 418204, "epoch": 2489} {"train_loss": -12.695323944091797, "global_step": 418205, "epoch": 2489} {"train_loss": -12.662300109863281, "global_step": 418206, "epoch": 2489} {"train_loss": -12.721681594848633, "global_step": 418207, "epoch": 2489} {"train_loss": -12.483477592468262, "global_step": 418208, "epoch": 2489} {"train_loss": -12.132161140441895, "global_step": 418209, "epoch": 2489} {"train_loss": -12.364358901977539, "global_step": 418210, "epoch": 2489} {"train_loss": -12.619558334350586, "global_step": 418211, "epoch": 2489} {"train_loss": -12.346593856811523, "global_step": 418212, "epoch": 2489} {"train_loss": -12.920310020446777, "global_step": 418213, "epoch": 2489} {"train_loss": -12.292215347290039, "global_step": 418214, "epoch": 2489} {"train_loss": -12.112844467163086, "global_step": 418215, "epoch": 2489} {"train_loss": -12.341991424560547, "global_step": 418216, "epoch": 2489} {"train_loss": -12.147832870483398, "global_step": 418217, "epoch": 2489} {"train_loss": -11.61688232421875, "global_step": 418218, "epoch": 2489} {"train_loss": -12.691587448120117, "global_step": 418219, "epoch": 2489} {"train_loss": -11.558753967285156, "global_step": 418220, "epoch": 2489} {"train_loss": -11.835224151611328, "global_step": 418221, "epoch": 2489} {"train_loss": -12.444475173950195, "global_step": 418222, "epoch": 2489} {"train_loss": -12.404680252075195, "global_step": 418223, "epoch": 2489} {"train_loss": -12.001615524291992, "global_step": 418224, "epoch": 2489} {"train_loss": -12.584892272949219, "global_step": 418225, "epoch": 2489} {"train_loss": -12.027804374694824, "global_step": 418226, "epoch": 2489} {"train_loss": -12.261504173278809, "global_step": 418227, "epoch": 2489} {"train_loss": -11.674715042114258, "global_step": 418228, "epoch": 2489} {"train_loss": -11.732405662536621, "global_step": 418229, "epoch": 2489} {"train_loss": -12.219429016113281, "global_step": 418230, "epoch": 2489} {"train_loss": -11.58587646484375, "global_step": 418231, "epoch": 2489} {"train_loss": -11.203933715820312, "global_step": 418232, "epoch": 2489} {"train_loss": -11.31671142578125, "global_step": 418233, "epoch": 2489} {"train_loss": -11.977752685546875, "global_step": 418234, "epoch": 2489} {"train_loss": -11.210040092468262, "global_step": 418235, "epoch": 2489} {"train_loss": -10.814580917358398, "global_step": 418236, "epoch": 2489} {"train_loss": -12.106908798217773, "global_step": 418237, "epoch": 2489} {"train_loss": -9.620389938354492, "global_step": 418238, "epoch": 2489} {"train_loss": -10.289545059204102, "global_step": 418239, "epoch": 2489} {"train_loss": -11.602250099182129, "global_step": 418240, "epoch": 2489} {"train_loss": -8.275014877319336, "global_step": 418241, "epoch": 2489} {"train_loss": -9.37159538269043, "global_step": 418242, "epoch": 2489} {"train_loss": -7.015295505523682, "global_step": 418243, "epoch": 2489} {"train_loss": -7.7106614112854, "global_step": 418244, "epoch": 2489} {"train_loss": -6.485079765319824, "global_step": 418245, "epoch": 2489} {"train_loss": -6.478823661804199, "global_step": 418246, "epoch": 2489} {"train_loss": -6.432720184326172, "global_step": 418247, "epoch": 2489} {"train_loss": -6.263372421264648, "global_step": 418248, "epoch": 2489} {"train_loss": -6.262740135192871, "global_step": 418249, "epoch": 2489} {"train_loss": -6.1535444259643555, "global_step": 418250, "epoch": 2489} {"train_loss": -6.405412673950195, "global_step": 418251, "epoch": 2489} {"train_loss": -7.497611999511719, "global_step": 418252, "epoch": 2489} {"train_loss": -6.679050445556641, "global_step": 418253, "epoch": 2489} {"train_loss": -6.541018486022949, "global_step": 418254, "epoch": 2489} {"train_loss": -6.990111827850342, "global_step": 418255, "epoch": 2489} {"train_loss": -6.644944190979004, "global_step": 418256, "epoch": 2489} {"train_loss": -6.960838317871094, "global_step": 418257, "epoch": 2489} {"train_loss": -7.239201545715332, "global_step": 418258, "epoch": 2489} {"train_loss": -6.710404872894287, "global_step": 418259, "epoch": 2489} {"train_loss": -6.984340667724609, "global_step": 418260, "epoch": 2489} {"train_loss": -7.591621398925781, "global_step": 418261, "epoch": 2489} {"train_loss": -7.092135906219482, "global_step": 418262, "epoch": 2489} {"train_loss": -7.5413360595703125, "global_step": 418263, "epoch": 2489} {"train_loss": -7.629439353942871, "global_step": 418264, "epoch": 2489} {"train_loss": -7.645931243896484, "global_step": 418265, "epoch": 2489} {"train_loss": -7.841370582580566, "global_step": 418266, "epoch": 2489} {"train_loss": -7.955854415893555, "global_step": 418267, "epoch": 2489} {"train_loss": -7.9001851081848145, "global_step": 418268, "epoch": 2489} {"train_loss": -7.798282623291016, "global_step": 418269, "epoch": 2489} {"train_loss": -8.018549919128418, "global_step": 418270, "epoch": 2489} {"train_loss": -8.521364212036133, "global_step": 418271, "epoch": 2489} {"train_loss": -8.005590438842773, "global_step": 418272, "epoch": 2489} {"train_loss": -8.344034194946289, "global_step": 418273, "epoch": 2489} {"train_loss": -8.374448776245117, "global_step": 418274, "epoch": 2489} {"train_loss": -8.459881782531738, "global_step": 418275, "epoch": 2489} {"train_loss": -8.414506912231445, "global_step": 418276, "epoch": 2489} {"train_loss": -8.684490203857422, "global_step": 418277, "epoch": 2489} {"train_loss": -8.54297161102295, "global_step": 418278, "epoch": 2489} {"train_loss": -8.562585830688477, "global_step": 418279, "epoch": 2489} {"train_loss": -8.956412315368652, "global_step": 418280, "epoch": 2489} {"train_loss": -8.839946746826172, "global_step": 418281, "epoch": 2489} {"train_loss": -9.005203247070312, "global_step": 418282, "epoch": 2489} {"train_loss": -9.098726272583008, "global_step": 418283, "epoch": 2489} {"train_loss": -9.272218704223633, "global_step": 418284, "epoch": 2489} {"train_loss": -9.15307331085205, "global_step": 418285, "epoch": 2489} {"train_loss": -9.376953125, "global_step": 418286, "epoch": 2489} {"train_loss": -9.402469635009766, "global_step": 418287, "epoch": 2489} {"train_loss": -9.24496078491211, "global_step": 418288, "epoch": 2489} {"train_loss": -9.61146068572998, "global_step": 418289, "epoch": 2489} {"train_loss": -9.563255310058594, "global_step": 418290, "epoch": 2489} {"train_loss": -9.486352920532227, "global_step": 418291, "epoch": 2489} {"train_loss": -9.688772201538086, "global_step": 418292, "epoch": 2489} {"train_loss": -9.811197280883789, "global_step": 418293, "epoch": 2489} {"train_loss": -9.700316429138184, "global_step": 418294, "epoch": 2489} {"train_loss": -10.02872085571289, "global_step": 418295, "epoch": 2489} {"train_loss": -9.945279121398926, "global_step": 418296, "epoch": 2489} {"train_loss": -9.722856521606445, "global_step": 418297, "epoch": 2489} {"train_loss": -9.86007308959961, "global_step": 418298, "epoch": 2489} {"train_loss": -9.773974418640137, "global_step": 418299, "epoch": 2489} {"train_loss": -9.936119079589844, "global_step": 418300, "epoch": 2489} {"train_loss": -9.967855453491211, "global_step": 418301, "epoch": 2489} {"train_loss": -10.194280624389648, "global_step": 418302, "epoch": 2489} {"train_loss": -10.034449577331543, "global_step": 418303, "epoch": 2489} {"train_loss": -10.037605285644531, "global_step": 418304, "epoch": 2489} {"train_loss": -10.323427200317383, "global_step": 418305, "epoch": 2489} {"train_loss": -10.566305160522461, "global_step": 418306, "epoch": 2489} {"train_loss": -10.27334976196289, "global_step": 418307, "epoch": 2489} {"train_loss": -10.710525512695312, "global_step": 418308, "epoch": 2489} {"train_loss": -10.248744010925293, "global_step": 418309, "epoch": 2489} {"train_loss": -10.899663925170898, "global_step": 418310, "epoch": 2489} {"train_loss": -10.615735054016113, "global_step": 418311, "epoch": 2489} {"train_loss": -10.67752742767334, "global_step": 418312, "epoch": 2489} {"train_loss": -10.492904663085938, "global_step": 418313, "epoch": 2489} {"train_loss": -10.486114501953125, "global_step": 418314, "epoch": 2489} {"train_loss": -10.502486228942871, "global_step": 418315, "epoch": 2489} {"train_loss": -10.32771110534668, "global_step": 418316, "epoch": 2489} {"train_loss": -10.254074096679688, "global_step": 418317, "epoch": 2489} {"train_loss": -10.247933387756348, "global_step": 418318, "epoch": 2489} {"train_loss": -10.552919966833931, "global_step": 418319, "epoch": 2489, "val_loss": 306269.90625} {"train_loss": -10.424185752868652, "global_step": 418320, "epoch": 2490} {"train_loss": -10.540613174438477, "global_step": 418321, "epoch": 2490} {"train_loss": -10.266603469848633, "global_step": 418322, "epoch": 2490} {"train_loss": -10.756505012512207, "global_step": 418323, "epoch": 2490} {"train_loss": -10.114614486694336, "global_step": 418324, "epoch": 2490} {"train_loss": -10.888416290283203, "global_step": 418325, "epoch": 2490} {"train_loss": -10.686030387878418, "global_step": 418326, "epoch": 2490} {"train_loss": -10.960293769836426, "global_step": 418327, "epoch": 2490} {"train_loss": -10.52740478515625, "global_step": 418328, "epoch": 2490} {"train_loss": -11.197187423706055, "global_step": 418329, "epoch": 2490} {"train_loss": -11.010894775390625, "global_step": 418330, "epoch": 2490} {"train_loss": -11.153366088867188, "global_step": 418331, "epoch": 2490} {"train_loss": -10.70406723022461, "global_step": 418332, "epoch": 2490} {"train_loss": -11.56654167175293, "global_step": 418333, "epoch": 2490} {"train_loss": -11.224349021911621, "global_step": 418334, "epoch": 2490} {"train_loss": -11.21707534790039, "global_step": 418335, "epoch": 2490} {"train_loss": -11.548149108886719, "global_step": 418336, "epoch": 2490} {"train_loss": -11.296653747558594, "global_step": 418337, "epoch": 2490} {"train_loss": -11.514852523803711, "global_step": 418338, "epoch": 2490} {"train_loss": -11.919464111328125, "global_step": 418339, "epoch": 2490} {"train_loss": -11.71764087677002, "global_step": 418340, "epoch": 2490} {"train_loss": -11.371768951416016, "global_step": 418341, "epoch": 2490} {"train_loss": -11.6600923538208, "global_step": 418342, "epoch": 2490} {"train_loss": -11.763566970825195, "global_step": 418343, "epoch": 2490} {"train_loss": -11.524531364440918, "global_step": 418344, "epoch": 2490} {"train_loss": -11.673831939697266, "global_step": 418345, "epoch": 2490} {"train_loss": -11.915091514587402, "global_step": 418346, "epoch": 2490} {"train_loss": -11.593454360961914, "global_step": 418347, "epoch": 2490} {"train_loss": -11.724048614501953, "global_step": 418348, "epoch": 2490} {"train_loss": -11.47258186340332, "global_step": 418349, "epoch": 2490} {"train_loss": -11.863171577453613, "global_step": 418350, "epoch": 2490} {"train_loss": -11.408994674682617, "global_step": 418351, "epoch": 2490} {"train_loss": -11.733479499816895, "global_step": 418352, "epoch": 2490} {"train_loss": -11.539732933044434, "global_step": 418353, "epoch": 2490} {"train_loss": -11.832444190979004, "global_step": 418354, "epoch": 2490} {"train_loss": -11.749784469604492, "global_step": 418355, "epoch": 2490} {"train_loss": -11.946512222290039, "global_step": 418356, "epoch": 2490} {"train_loss": -11.824090957641602, "global_step": 418357, "epoch": 2490} {"train_loss": -11.775924682617188, "global_step": 418358, "epoch": 2490} {"train_loss": -12.039997100830078, "global_step": 418359, "epoch": 2490} {"train_loss": -11.716999053955078, "global_step": 418360, "epoch": 2490} {"train_loss": -12.036252975463867, "global_step": 418361, "epoch": 2490} {"train_loss": -12.100830078125, "global_step": 418362, "epoch": 2490} {"train_loss": -11.9913969039917, "global_step": 418363, "epoch": 2490} {"train_loss": -12.036354064941406, "global_step": 418364, "epoch": 2490} {"train_loss": -11.956758499145508, "global_step": 418365, "epoch": 2490} {"train_loss": -12.057714462280273, "global_step": 418366, "epoch": 2490} {"train_loss": -12.083849906921387, "global_step": 418367, "epoch": 2490} {"train_loss": -11.457544326782227, "global_step": 418368, "epoch": 2490} {"train_loss": -11.816792488098145, "global_step": 418369, "epoch": 2490} {"train_loss": -12.038652420043945, "global_step": 418370, "epoch": 2490} {"train_loss": -12.216455459594727, "global_step": 418371, "epoch": 2490} {"train_loss": -11.956787109375, "global_step": 418372, "epoch": 2490} {"train_loss": -11.844260215759277, "global_step": 418373, "epoch": 2490} {"train_loss": -11.642163276672363, "global_step": 418374, "epoch": 2490} {"train_loss": -11.914409637451172, "global_step": 418375, "epoch": 2490} {"train_loss": -11.732425689697266, "global_step": 418376, "epoch": 2490} {"train_loss": -11.411477088928223, "global_step": 418377, "epoch": 2490} {"train_loss": -11.394856452941895, "global_step": 418378, "epoch": 2490} {"train_loss": -11.765020370483398, "global_step": 418379, "epoch": 2490} {"train_loss": -11.561912536621094, "global_step": 418380, "epoch": 2490} {"train_loss": -11.762904167175293, "global_step": 418381, "epoch": 2490} {"train_loss": -11.37874984741211, "global_step": 418382, "epoch": 2490} {"train_loss": -11.257783889770508, "global_step": 418383, "epoch": 2490} {"train_loss": -11.419170379638672, "global_step": 418384, "epoch": 2490} {"train_loss": -11.867709159851074, "global_step": 418385, "epoch": 2490} {"train_loss": -11.230178833007812, "global_step": 418386, "epoch": 2490} {"train_loss": -11.661293983459473, "global_step": 418387, "epoch": 2490} {"train_loss": -11.868122100830078, "global_step": 418388, "epoch": 2490} {"train_loss": -11.420011520385742, "global_step": 418389, "epoch": 2490} {"train_loss": -11.975421905517578, "global_step": 418390, "epoch": 2490} {"train_loss": -11.376241683959961, "global_step": 418391, "epoch": 2490} {"train_loss": -11.4298095703125, "global_step": 418392, "epoch": 2490} {"train_loss": -11.416348457336426, "global_step": 418393, "epoch": 2490} {"train_loss": -11.714405059814453, "global_step": 418394, "epoch": 2490} {"train_loss": -11.304361343383789, "global_step": 418395, "epoch": 2490} {"train_loss": -11.57142448425293, "global_step": 418396, "epoch": 2490} {"train_loss": -11.297845840454102, "global_step": 418397, "epoch": 2490} {"train_loss": -11.451459884643555, "global_step": 418398, "epoch": 2490} {"train_loss": -11.884695053100586, "global_step": 418399, "epoch": 2490} {"train_loss": -11.359577178955078, "global_step": 418400, "epoch": 2490} {"train_loss": -11.7369966506958, "global_step": 418401, "epoch": 2490} {"train_loss": -11.694192886352539, "global_step": 418402, "epoch": 2490} {"train_loss": -11.849416732788086, "global_step": 418403, "epoch": 2490} {"train_loss": -11.822484970092773, "global_step": 418404, "epoch": 2490} {"train_loss": -11.837646484375, "global_step": 418405, "epoch": 2490} {"train_loss": -12.00277042388916, "global_step": 418406, "epoch": 2490} {"train_loss": -11.971206665039062, "global_step": 418407, "epoch": 2490} {"train_loss": -11.896167755126953, "global_step": 418408, "epoch": 2490} {"train_loss": -11.859944343566895, "global_step": 418409, "epoch": 2490} {"train_loss": -11.925891876220703, "global_step": 418410, "epoch": 2490} {"train_loss": -11.879507064819336, "global_step": 418411, "epoch": 2490} {"train_loss": -11.758235931396484, "global_step": 418412, "epoch": 2490} {"train_loss": -12.100112915039062, "global_step": 418413, "epoch": 2490} {"train_loss": -11.845197677612305, "global_step": 418414, "epoch": 2490} {"train_loss": -12.055418014526367, "global_step": 418415, "epoch": 2490} {"train_loss": -12.06481647491455, "global_step": 418416, "epoch": 2490} {"train_loss": -12.209759712219238, "global_step": 418417, "epoch": 2490} {"train_loss": -12.275161743164062, "global_step": 418418, "epoch": 2490} {"train_loss": -12.180081367492676, "global_step": 418419, "epoch": 2490} {"train_loss": -12.00705337524414, "global_step": 418420, "epoch": 2490} {"train_loss": -11.559626579284668, "global_step": 418421, "epoch": 2490} {"train_loss": -12.284085273742676, "global_step": 418422, "epoch": 2490} {"train_loss": -12.104667663574219, "global_step": 418423, "epoch": 2490} {"train_loss": -12.339035034179688, "global_step": 418424, "epoch": 2490} {"train_loss": -11.86900806427002, "global_step": 418425, "epoch": 2490} {"train_loss": -12.235994338989258, "global_step": 418426, "epoch": 2490} {"train_loss": -11.6368408203125, "global_step": 418427, "epoch": 2490} {"train_loss": -12.213460922241211, "global_step": 418428, "epoch": 2490} {"train_loss": -12.130878448486328, "global_step": 418429, "epoch": 2490} {"train_loss": -11.474225997924805, "global_step": 418430, "epoch": 2490} {"train_loss": -11.936819076538086, "global_step": 418431, "epoch": 2490} {"train_loss": -12.099788665771484, "global_step": 418432, "epoch": 2490} {"train_loss": -11.577447891235352, "global_step": 418433, "epoch": 2490} {"train_loss": -11.982746124267578, "global_step": 418434, "epoch": 2490} {"train_loss": -11.84550666809082, "global_step": 418435, "epoch": 2490} {"train_loss": -12.1890869140625, "global_step": 418436, "epoch": 2490} {"train_loss": -12.150126457214355, "global_step": 418437, "epoch": 2490} {"train_loss": -11.80703353881836, "global_step": 418438, "epoch": 2490} {"train_loss": -12.28126335144043, "global_step": 418439, "epoch": 2490} {"train_loss": -12.228574752807617, "global_step": 418440, "epoch": 2490} {"train_loss": -12.149469375610352, "global_step": 418441, "epoch": 2490} {"train_loss": -12.569147109985352, "global_step": 418442, "epoch": 2490} {"train_loss": -12.456729888916016, "global_step": 418443, "epoch": 2490} {"train_loss": -12.18459701538086, "global_step": 418444, "epoch": 2490} {"train_loss": -12.40428352355957, "global_step": 418445, "epoch": 2490} {"train_loss": -12.128127098083496, "global_step": 418446, "epoch": 2490} {"train_loss": -12.022330284118652, "global_step": 418447, "epoch": 2490} {"train_loss": -12.158349990844727, "global_step": 418448, "epoch": 2490} {"train_loss": -12.00271987915039, "global_step": 418449, "epoch": 2490} {"train_loss": -12.516700744628906, "global_step": 418450, "epoch": 2490} {"train_loss": -12.259330749511719, "global_step": 418451, "epoch": 2490} {"train_loss": -12.394617080688477, "global_step": 418452, "epoch": 2490} {"train_loss": -12.293296813964844, "global_step": 418453, "epoch": 2490} {"train_loss": -12.407468795776367, "global_step": 418454, "epoch": 2490} {"train_loss": -12.466938018798828, "global_step": 418455, "epoch": 2490} {"train_loss": -12.523618698120117, "global_step": 418456, "epoch": 2490} {"train_loss": -12.365457534790039, "global_step": 418457, "epoch": 2490} {"train_loss": -12.376716613769531, "global_step": 418458, "epoch": 2490} {"train_loss": -12.128238677978516, "global_step": 418459, "epoch": 2490} {"train_loss": -12.41948413848877, "global_step": 418460, "epoch": 2490} {"train_loss": -12.203189849853516, "global_step": 418461, "epoch": 2490} {"train_loss": -11.976322174072266, "global_step": 418462, "epoch": 2490} {"train_loss": -12.143239974975586, "global_step": 418463, "epoch": 2490} {"train_loss": -11.82598876953125, "global_step": 418464, "epoch": 2490} {"train_loss": -12.336877822875977, "global_step": 418465, "epoch": 2490} {"train_loss": -11.944725036621094, "global_step": 418466, "epoch": 2490} {"train_loss": -12.025293350219727, "global_step": 418467, "epoch": 2490} {"train_loss": -11.212631225585938, "global_step": 418468, "epoch": 2490} {"train_loss": -11.905938148498535, "global_step": 418469, "epoch": 2490} {"train_loss": -12.370269775390625, "global_step": 418470, "epoch": 2490} {"train_loss": -12.134599685668945, "global_step": 418471, "epoch": 2490} {"train_loss": -12.55923080444336, "global_step": 418472, "epoch": 2490} {"train_loss": -12.419160842895508, "global_step": 418473, "epoch": 2490} {"train_loss": -11.803567886352539, "global_step": 418474, "epoch": 2490} {"train_loss": -11.60673999786377, "global_step": 418475, "epoch": 2490} {"train_loss": -11.969488143920898, "global_step": 418476, "epoch": 2490} {"train_loss": -11.794618606567383, "global_step": 418477, "epoch": 2490} {"train_loss": -11.610480308532715, "global_step": 418478, "epoch": 2490} {"train_loss": -12.34930419921875, "global_step": 418479, "epoch": 2490} {"train_loss": -11.97471809387207, "global_step": 418480, "epoch": 2490} {"train_loss": -11.821331024169922, "global_step": 418481, "epoch": 2490} {"train_loss": -12.132473945617676, "global_step": 418482, "epoch": 2490} {"train_loss": -12.470719337463379, "global_step": 418483, "epoch": 2490} {"train_loss": -11.694965362548828, "global_step": 418484, "epoch": 2490} {"train_loss": -12.631040573120117, "global_step": 418485, "epoch": 2490} {"train_loss": -12.388769149780273, "global_step": 418486, "epoch": 2490} {"train_loss": -11.809495210647583, "global_step": 418487, "epoch": 2490, "val_loss": 306511.53125, "train_action_mse_error": 2.7891592979431152} {"train_loss": -11.976813316345215, "global_step": 418488, "epoch": 2491} {"train_loss": -11.70571517944336, "global_step": 418489, "epoch": 2491} {"train_loss": -12.276837348937988, "global_step": 418490, "epoch": 2491} {"train_loss": -11.639835357666016, "global_step": 418491, "epoch": 2491} {"train_loss": -11.503704071044922, "global_step": 418492, "epoch": 2491} {"train_loss": -12.272882461547852, "global_step": 418493, "epoch": 2491} {"train_loss": -11.575605392456055, "global_step": 418494, "epoch": 2491} {"train_loss": -11.316875457763672, "global_step": 418495, "epoch": 2491} {"train_loss": -12.528240203857422, "global_step": 418496, "epoch": 2491} {"train_loss": -12.280065536499023, "global_step": 418497, "epoch": 2491} {"train_loss": -12.453042030334473, "global_step": 418498, "epoch": 2491} {"train_loss": -12.211568832397461, "global_step": 418499, "epoch": 2491} {"train_loss": -12.70285415649414, "global_step": 418500, "epoch": 2491} {"train_loss": -12.43929672241211, "global_step": 418501, "epoch": 2491} {"train_loss": -11.896976470947266, "global_step": 418502, "epoch": 2491} {"train_loss": -12.39629077911377, "global_step": 418503, "epoch": 2491} {"train_loss": -12.074675559997559, "global_step": 418504, "epoch": 2491} {"train_loss": -12.208009719848633, "global_step": 418505, "epoch": 2491} {"train_loss": -12.416351318359375, "global_step": 418506, "epoch": 2491} {"train_loss": -12.32872200012207, "global_step": 418507, "epoch": 2491} {"train_loss": -11.558673858642578, "global_step": 418508, "epoch": 2491} {"train_loss": -12.061962127685547, "global_step": 418509, "epoch": 2491} {"train_loss": -11.399520874023438, "global_step": 418510, "epoch": 2491} {"train_loss": -12.046829223632812, "global_step": 418511, "epoch": 2491} {"train_loss": -11.581771850585938, "global_step": 418512, "epoch": 2491} {"train_loss": -12.285456657409668, "global_step": 418513, "epoch": 2491} {"train_loss": -11.821664810180664, "global_step": 418514, "epoch": 2491} {"train_loss": -11.555233001708984, "global_step": 418515, "epoch": 2491} {"train_loss": -11.126689910888672, "global_step": 418516, "epoch": 2491} {"train_loss": -11.252065658569336, "global_step": 418517, "epoch": 2491} {"train_loss": -11.711090087890625, "global_step": 418518, "epoch": 2491} {"train_loss": -10.730276107788086, "global_step": 418519, "epoch": 2491} {"train_loss": -11.157554626464844, "global_step": 418520, "epoch": 2491} {"train_loss": -10.150117874145508, "global_step": 418521, "epoch": 2491} {"train_loss": -10.908923149108887, "global_step": 418522, "epoch": 2491} {"train_loss": -10.47012710571289, "global_step": 418523, "epoch": 2491} {"train_loss": -11.387296676635742, "global_step": 418524, "epoch": 2491} {"train_loss": -9.954381942749023, "global_step": 418525, "epoch": 2491} {"train_loss": -12.091291427612305, "global_step": 418526, "epoch": 2491} {"train_loss": -11.141578674316406, "global_step": 418527, "epoch": 2491} {"train_loss": -11.10581111907959, "global_step": 418528, "epoch": 2491} {"train_loss": -11.559623718261719, "global_step": 418529, "epoch": 2491} {"train_loss": -11.63355827331543, "global_step": 418530, "epoch": 2491} {"train_loss": -11.399530410766602, "global_step": 418531, "epoch": 2491} {"train_loss": -11.823793411254883, "global_step": 418532, "epoch": 2491} {"train_loss": -11.505910873413086, "global_step": 418533, "epoch": 2491} {"train_loss": -11.71301555633545, "global_step": 418534, "epoch": 2491} {"train_loss": -11.35226821899414, "global_step": 418535, "epoch": 2491} {"train_loss": -11.689674377441406, "global_step": 418536, "epoch": 2491} {"train_loss": -11.434924125671387, "global_step": 418537, "epoch": 2491} {"train_loss": -11.626176834106445, "global_step": 418538, "epoch": 2491} {"train_loss": -11.916793823242188, "global_step": 418539, "epoch": 2491} {"train_loss": -12.084619522094727, "global_step": 418540, "epoch": 2491} {"train_loss": -11.606106758117676, "global_step": 418541, "epoch": 2491} {"train_loss": -12.146678924560547, "global_step": 418542, "epoch": 2491} {"train_loss": -11.84316635131836, "global_step": 418543, "epoch": 2491} {"train_loss": -12.090856552124023, "global_step": 418544, "epoch": 2491} {"train_loss": -12.272276878356934, "global_step": 418545, "epoch": 2491} {"train_loss": -11.990962982177734, "global_step": 418546, "epoch": 2491} {"train_loss": -12.190286636352539, "global_step": 418547, "epoch": 2491} {"train_loss": -12.388644218444824, "global_step": 418548, "epoch": 2491} {"train_loss": -12.371810913085938, "global_step": 418549, "epoch": 2491} {"train_loss": -12.026022911071777, "global_step": 418550, "epoch": 2491} {"train_loss": -12.465812683105469, "global_step": 418551, "epoch": 2491} {"train_loss": -12.085628509521484, "global_step": 418552, "epoch": 2491} {"train_loss": -12.712526321411133, "global_step": 418553, "epoch": 2491} {"train_loss": -12.073301315307617, "global_step": 418554, "epoch": 2491} {"train_loss": -12.303908348083496, "global_step": 418555, "epoch": 2491} {"train_loss": -12.33515739440918, "global_step": 418556, "epoch": 2491} {"train_loss": -12.437905311584473, "global_step": 418557, "epoch": 2491} {"train_loss": -12.316015243530273, "global_step": 418558, "epoch": 2491} {"train_loss": -12.21735668182373, "global_step": 418559, "epoch": 2491} {"train_loss": -12.465269088745117, "global_step": 418560, "epoch": 2491} {"train_loss": -12.310214042663574, "global_step": 418561, "epoch": 2491} {"train_loss": -12.548084259033203, "global_step": 418562, "epoch": 2491} {"train_loss": -12.416738510131836, "global_step": 418563, "epoch": 2491} {"train_loss": -12.492843627929688, "global_step": 418564, "epoch": 2491} {"train_loss": -12.264629364013672, "global_step": 418565, "epoch": 2491} {"train_loss": -12.242855072021484, "global_step": 418566, "epoch": 2491} {"train_loss": -11.785164833068848, "global_step": 418567, "epoch": 2491} {"train_loss": -12.306161880493164, "global_step": 418568, "epoch": 2491} {"train_loss": -12.271727561950684, "global_step": 418569, "epoch": 2491} {"train_loss": -12.128425598144531, "global_step": 418570, "epoch": 2491} {"train_loss": -12.438518524169922, "global_step": 418571, "epoch": 2491} {"train_loss": -12.316577911376953, "global_step": 418572, "epoch": 2491} {"train_loss": -12.396303176879883, "global_step": 418573, "epoch": 2491} {"train_loss": -12.323467254638672, "global_step": 418574, "epoch": 2491} {"train_loss": -12.299468994140625, "global_step": 418575, "epoch": 2491} {"train_loss": -12.326655387878418, "global_step": 418576, "epoch": 2491} {"train_loss": -12.627906799316406, "global_step": 418577, "epoch": 2491} {"train_loss": -12.241510391235352, "global_step": 418578, "epoch": 2491} {"train_loss": -12.246140480041504, "global_step": 418579, "epoch": 2491} {"train_loss": -12.491600036621094, "global_step": 418580, "epoch": 2491} {"train_loss": -12.180440902709961, "global_step": 418581, "epoch": 2491} {"train_loss": -12.305712699890137, "global_step": 418582, "epoch": 2491} {"train_loss": -12.210126876831055, "global_step": 418583, "epoch": 2491} {"train_loss": -11.159795761108398, "global_step": 418584, "epoch": 2491} {"train_loss": -11.506133079528809, "global_step": 418585, "epoch": 2491} {"train_loss": -11.214014053344727, "global_step": 418586, "epoch": 2491} {"train_loss": -10.582671165466309, "global_step": 418587, "epoch": 2491} {"train_loss": -11.23128890991211, "global_step": 418588, "epoch": 2491} {"train_loss": -11.674385070800781, "global_step": 418589, "epoch": 2491} {"train_loss": -11.519457817077637, "global_step": 418590, "epoch": 2491} {"train_loss": -10.98049545288086, "global_step": 418591, "epoch": 2491} {"train_loss": -11.973514556884766, "global_step": 418592, "epoch": 2491} {"train_loss": -11.861665725708008, "global_step": 418593, "epoch": 2491} {"train_loss": -11.729769706726074, "global_step": 418594, "epoch": 2491} {"train_loss": -11.766690254211426, "global_step": 418595, "epoch": 2491} {"train_loss": -11.335890769958496, "global_step": 418596, "epoch": 2491} {"train_loss": -11.793420791625977, "global_step": 418597, "epoch": 2491} {"train_loss": -11.618227005004883, "global_step": 418598, "epoch": 2491} {"train_loss": -11.417616844177246, "global_step": 418599, "epoch": 2491} {"train_loss": -11.774868965148926, "global_step": 418600, "epoch": 2491} {"train_loss": -11.873331069946289, "global_step": 418601, "epoch": 2491} {"train_loss": -11.386934280395508, "global_step": 418602, "epoch": 2491} {"train_loss": -12.24478530883789, "global_step": 418603, "epoch": 2491} {"train_loss": -11.485294342041016, "global_step": 418604, "epoch": 2491} {"train_loss": -12.106748580932617, "global_step": 418605, "epoch": 2491} {"train_loss": -11.305557250976562, "global_step": 418606, "epoch": 2491} {"train_loss": -11.662269592285156, "global_step": 418607, "epoch": 2491} {"train_loss": -12.049471855163574, "global_step": 418608, "epoch": 2491} {"train_loss": -11.896928787231445, "global_step": 418609, "epoch": 2491} {"train_loss": -11.558090209960938, "global_step": 418610, "epoch": 2491} {"train_loss": -11.8093900680542, "global_step": 418611, "epoch": 2491} {"train_loss": -11.574482917785645, "global_step": 418612, "epoch": 2491} {"train_loss": -12.0702543258667, "global_step": 418613, "epoch": 2491} {"train_loss": -10.996757507324219, "global_step": 418614, "epoch": 2491} {"train_loss": -12.180370330810547, "global_step": 418615, "epoch": 2491} {"train_loss": -11.449545860290527, "global_step": 418616, "epoch": 2491} {"train_loss": -12.13713264465332, "global_step": 418617, "epoch": 2491} {"train_loss": -12.170949935913086, "global_step": 418618, "epoch": 2491} {"train_loss": -11.853128433227539, "global_step": 418619, "epoch": 2491} {"train_loss": -11.759252548217773, "global_step": 418620, "epoch": 2491} {"train_loss": -11.756418228149414, "global_step": 418621, "epoch": 2491} {"train_loss": -11.847657203674316, "global_step": 418622, "epoch": 2491} {"train_loss": -11.34277629852295, "global_step": 418623, "epoch": 2491} {"train_loss": -11.611043930053711, "global_step": 418624, "epoch": 2491} {"train_loss": -12.52532958984375, "global_step": 418625, "epoch": 2491} {"train_loss": -11.508062362670898, "global_step": 418626, "epoch": 2491} {"train_loss": -12.344053268432617, "global_step": 418627, "epoch": 2491} {"train_loss": -11.977890968322754, "global_step": 418628, "epoch": 2491} {"train_loss": -12.088830947875977, "global_step": 418629, "epoch": 2491} {"train_loss": -12.110292434692383, "global_step": 418630, "epoch": 2491} {"train_loss": -12.448761940002441, "global_step": 418631, "epoch": 2491} {"train_loss": -12.296781539916992, "global_step": 418632, "epoch": 2491} {"train_loss": -12.46171760559082, "global_step": 418633, "epoch": 2491} {"train_loss": -12.479388236999512, "global_step": 418634, "epoch": 2491} {"train_loss": -12.668591499328613, "global_step": 418635, "epoch": 2491} {"train_loss": -12.422621726989746, "global_step": 418636, "epoch": 2491} {"train_loss": -12.207849502563477, "global_step": 418637, "epoch": 2491} {"train_loss": -12.164775848388672, "global_step": 418638, "epoch": 2491} {"train_loss": -12.484811782836914, "global_step": 418639, "epoch": 2491} {"train_loss": -11.920417785644531, "global_step": 418640, "epoch": 2491} {"train_loss": -12.264538764953613, "global_step": 418641, "epoch": 2491} {"train_loss": -12.557696342468262, "global_step": 418642, "epoch": 2491} {"train_loss": -12.19334602355957, "global_step": 418643, "epoch": 2491} {"train_loss": -12.598749160766602, "global_step": 418644, "epoch": 2491} {"train_loss": -12.361339569091797, "global_step": 418645, "epoch": 2491} {"train_loss": -12.616079330444336, "global_step": 418646, "epoch": 2491} {"train_loss": -12.485433578491211, "global_step": 418647, "epoch": 2491} {"train_loss": -12.494022369384766, "global_step": 418648, "epoch": 2491} {"train_loss": -12.687444686889648, "global_step": 418649, "epoch": 2491} {"train_loss": -12.766462326049805, "global_step": 418650, "epoch": 2491} {"train_loss": -12.645828247070312, "global_step": 418651, "epoch": 2491} {"train_loss": -12.42428970336914, "global_step": 418652, "epoch": 2491} {"train_loss": -12.419744491577148, "global_step": 418653, "epoch": 2491} {"train_loss": -12.662999153137207, "global_step": 418654, "epoch": 2491} {"train_loss": -11.950681254977273, "global_step": 418655, "epoch": 2491, "val_loss": 307978.5} {"train_loss": -12.636767387390137, "global_step": 418656, "epoch": 2492} {"train_loss": -12.643909454345703, "global_step": 418657, "epoch": 2492} {"train_loss": -12.442947387695312, "global_step": 418658, "epoch": 2492} {"train_loss": -12.567109107971191, "global_step": 418659, "epoch": 2492} {"train_loss": -12.51451301574707, "global_step": 418660, "epoch": 2492} {"train_loss": -12.452231407165527, "global_step": 418661, "epoch": 2492} {"train_loss": -12.472471237182617, "global_step": 418662, "epoch": 2492} {"train_loss": -12.355146408081055, "global_step": 418663, "epoch": 2492} {"train_loss": -12.186934471130371, "global_step": 418664, "epoch": 2492} {"train_loss": -12.221097946166992, "global_step": 418665, "epoch": 2492} {"train_loss": -12.43525505065918, "global_step": 418666, "epoch": 2492} {"train_loss": -12.489153861999512, "global_step": 418667, "epoch": 2492} {"train_loss": -11.94294261932373, "global_step": 418668, "epoch": 2492} {"train_loss": -12.003491401672363, "global_step": 418669, "epoch": 2492} {"train_loss": -11.389942169189453, "global_step": 418670, "epoch": 2492} {"train_loss": -11.133584976196289, "global_step": 418671, "epoch": 2492} {"train_loss": -11.03636360168457, "global_step": 418672, "epoch": 2492} {"train_loss": -11.509431838989258, "global_step": 418673, "epoch": 2492} {"train_loss": -11.539359092712402, "global_step": 418674, "epoch": 2492} {"train_loss": -11.215721130371094, "global_step": 418675, "epoch": 2492} {"train_loss": -11.657903671264648, "global_step": 418676, "epoch": 2492} {"train_loss": -11.33364486694336, "global_step": 418677, "epoch": 2492} {"train_loss": -11.552665710449219, "global_step": 418678, "epoch": 2492} {"train_loss": -11.909503936767578, "global_step": 418679, "epoch": 2492} {"train_loss": -11.100499153137207, "global_step": 418680, "epoch": 2492} {"train_loss": -11.123200416564941, "global_step": 418681, "epoch": 2492} {"train_loss": -12.162878036499023, "global_step": 418682, "epoch": 2492} {"train_loss": -12.264001846313477, "global_step": 418683, "epoch": 2492} {"train_loss": -12.110664367675781, "global_step": 418684, "epoch": 2492} {"train_loss": -12.431767463684082, "global_step": 418685, "epoch": 2492} {"train_loss": -12.267496109008789, "global_step": 418686, "epoch": 2492} {"train_loss": -11.965286254882812, "global_step": 418687, "epoch": 2492} {"train_loss": -12.722338676452637, "global_step": 418688, "epoch": 2492} {"train_loss": -12.33212661743164, "global_step": 418689, "epoch": 2492} {"train_loss": -12.454631805419922, "global_step": 418690, "epoch": 2492} {"train_loss": -12.344908714294434, "global_step": 418691, "epoch": 2492} {"train_loss": -12.202547073364258, "global_step": 418692, "epoch": 2492} {"train_loss": -11.963668823242188, "global_step": 418693, "epoch": 2492} {"train_loss": -11.956990242004395, "global_step": 418694, "epoch": 2492} {"train_loss": -11.987370491027832, "global_step": 418695, "epoch": 2492} {"train_loss": -12.366044998168945, "global_step": 418696, "epoch": 2492} {"train_loss": -12.068005561828613, "global_step": 418697, "epoch": 2492} {"train_loss": -11.586647987365723, "global_step": 418698, "epoch": 2492} {"train_loss": -11.820001602172852, "global_step": 418699, "epoch": 2492} {"train_loss": -12.342033386230469, "global_step": 418700, "epoch": 2492} {"train_loss": -11.20622730255127, "global_step": 418701, "epoch": 2492} {"train_loss": -12.110259056091309, "global_step": 418702, "epoch": 2492} {"train_loss": -12.08251667022705, "global_step": 418703, "epoch": 2492} {"train_loss": -11.542804718017578, "global_step": 418704, "epoch": 2492} {"train_loss": -12.384471893310547, "global_step": 418705, "epoch": 2492} {"train_loss": -11.938982009887695, "global_step": 418706, "epoch": 2492} {"train_loss": -12.105064392089844, "global_step": 418707, "epoch": 2492} {"train_loss": -11.915169715881348, "global_step": 418708, "epoch": 2492} {"train_loss": -12.089546203613281, "global_step": 418709, "epoch": 2492} {"train_loss": -11.297271728515625, "global_step": 418710, "epoch": 2492} {"train_loss": -12.110933303833008, "global_step": 418711, "epoch": 2492} {"train_loss": -10.670293807983398, "global_step": 418712, "epoch": 2492} {"train_loss": -10.825260162353516, "global_step": 418713, "epoch": 2492} {"train_loss": -11.058265686035156, "global_step": 418714, "epoch": 2492} {"train_loss": -11.691106796264648, "global_step": 418715, "epoch": 2492} {"train_loss": -11.121475219726562, "global_step": 418716, "epoch": 2492} {"train_loss": -11.913219451904297, "global_step": 418717, "epoch": 2492} {"train_loss": -11.309873580932617, "global_step": 418718, "epoch": 2492} {"train_loss": -11.681314468383789, "global_step": 418719, "epoch": 2492} {"train_loss": -10.512357711791992, "global_step": 418720, "epoch": 2492} {"train_loss": -12.060270309448242, "global_step": 418721, "epoch": 2492} {"train_loss": -10.05262279510498, "global_step": 418722, "epoch": 2492} {"train_loss": -11.288212776184082, "global_step": 418723, "epoch": 2492} {"train_loss": -10.003662109375, "global_step": 418724, "epoch": 2492} {"train_loss": -11.243026733398438, "global_step": 418725, "epoch": 2492} {"train_loss": -11.29976749420166, "global_step": 418726, "epoch": 2492} {"train_loss": -10.376626968383789, "global_step": 418727, "epoch": 2492} {"train_loss": -10.785257339477539, "global_step": 418728, "epoch": 2492} {"train_loss": -10.308616638183594, "global_step": 418729, "epoch": 2492} {"train_loss": -10.461991310119629, "global_step": 418730, "epoch": 2492} {"train_loss": -10.282037734985352, "global_step": 418731, "epoch": 2492} {"train_loss": -11.630464553833008, "global_step": 418732, "epoch": 2492} {"train_loss": -10.720952987670898, "global_step": 418733, "epoch": 2492} {"train_loss": -10.169975280761719, "global_step": 418734, "epoch": 2492} {"train_loss": -11.084783554077148, "global_step": 418735, "epoch": 2492} {"train_loss": -8.544376373291016, "global_step": 418736, "epoch": 2492} {"train_loss": -9.59320068359375, "global_step": 418737, "epoch": 2492} {"train_loss": -10.108240127563477, "global_step": 418738, "epoch": 2492} {"train_loss": -10.154773712158203, "global_step": 418739, "epoch": 2492} {"train_loss": -9.915319442749023, "global_step": 418740, "epoch": 2492} {"train_loss": -11.197022438049316, "global_step": 418741, "epoch": 2492} {"train_loss": -11.077415466308594, "global_step": 418742, "epoch": 2492} {"train_loss": -10.18030834197998, "global_step": 418743, "epoch": 2492} {"train_loss": -11.313705444335938, "global_step": 418744, "epoch": 2492} {"train_loss": -11.112512588500977, "global_step": 418745, "epoch": 2492} {"train_loss": -10.478900909423828, "global_step": 418746, "epoch": 2492} {"train_loss": -10.363340377807617, "global_step": 418747, "epoch": 2492} {"train_loss": -11.012312889099121, "global_step": 418748, "epoch": 2492} {"train_loss": -10.582284927368164, "global_step": 418749, "epoch": 2492} {"train_loss": -11.032879829406738, "global_step": 418750, "epoch": 2492} {"train_loss": -11.115245819091797, "global_step": 418751, "epoch": 2492} {"train_loss": -10.212577819824219, "global_step": 418752, "epoch": 2492} {"train_loss": -10.606282234191895, "global_step": 418753, "epoch": 2492} {"train_loss": -11.416360855102539, "global_step": 418754, "epoch": 2492} {"train_loss": -11.01230525970459, "global_step": 418755, "epoch": 2492} {"train_loss": -11.078141212463379, "global_step": 418756, "epoch": 2492} {"train_loss": -10.785601615905762, "global_step": 418757, "epoch": 2492} {"train_loss": -11.399808883666992, "global_step": 418758, "epoch": 2492} {"train_loss": -10.422256469726562, "global_step": 418759, "epoch": 2492} {"train_loss": -11.500386238098145, "global_step": 418760, "epoch": 2492} {"train_loss": -11.669095039367676, "global_step": 418761, "epoch": 2492} {"train_loss": -10.782193183898926, "global_step": 418762, "epoch": 2492} {"train_loss": -10.765591621398926, "global_step": 418763, "epoch": 2492} {"train_loss": -11.315546035766602, "global_step": 418764, "epoch": 2492} {"train_loss": -11.21689224243164, "global_step": 418765, "epoch": 2492} {"train_loss": -11.161531448364258, "global_step": 418766, "epoch": 2492} {"train_loss": -10.4985933303833, "global_step": 418767, "epoch": 2492} {"train_loss": -11.531229019165039, "global_step": 418768, "epoch": 2492} {"train_loss": -11.278352737426758, "global_step": 418769, "epoch": 2492} {"train_loss": -10.756705284118652, "global_step": 418770, "epoch": 2492} {"train_loss": -11.928705215454102, "global_step": 418771, "epoch": 2492} {"train_loss": -11.446846008300781, "global_step": 418772, "epoch": 2492} {"train_loss": -10.82297420501709, "global_step": 418773, "epoch": 2492} {"train_loss": -11.343334197998047, "global_step": 418774, "epoch": 2492} {"train_loss": -11.204416275024414, "global_step": 418775, "epoch": 2492} {"train_loss": -11.30012321472168, "global_step": 418776, "epoch": 2492} {"train_loss": -10.794909477233887, "global_step": 418777, "epoch": 2492} {"train_loss": -11.697474479675293, "global_step": 418778, "epoch": 2492} {"train_loss": -11.284008026123047, "global_step": 418779, "epoch": 2492} {"train_loss": -10.626932144165039, "global_step": 418780, "epoch": 2492} {"train_loss": -10.852556228637695, "global_step": 418781, "epoch": 2492} {"train_loss": -11.922581672668457, "global_step": 418782, "epoch": 2492} {"train_loss": -11.146258354187012, "global_step": 418783, "epoch": 2492} {"train_loss": -11.374704360961914, "global_step": 418784, "epoch": 2492} {"train_loss": -11.342935562133789, "global_step": 418785, "epoch": 2492} {"train_loss": -11.369850158691406, "global_step": 418786, "epoch": 2492} {"train_loss": -11.238765716552734, "global_step": 418787, "epoch": 2492} {"train_loss": -11.365791320800781, "global_step": 418788, "epoch": 2492} {"train_loss": -11.583795547485352, "global_step": 418789, "epoch": 2492} {"train_loss": -11.677555084228516, "global_step": 418790, "epoch": 2492} {"train_loss": -12.11422348022461, "global_step": 418791, "epoch": 2492} {"train_loss": -11.827543258666992, "global_step": 418792, "epoch": 2492} {"train_loss": -11.811232566833496, "global_step": 418793, "epoch": 2492} {"train_loss": -12.22852897644043, "global_step": 418794, "epoch": 2492} {"train_loss": -11.914751052856445, "global_step": 418795, "epoch": 2492} {"train_loss": -11.982175827026367, "global_step": 418796, "epoch": 2492} {"train_loss": -11.999946594238281, "global_step": 418797, "epoch": 2492} {"train_loss": -12.273365020751953, "global_step": 418798, "epoch": 2492} {"train_loss": -11.947089195251465, "global_step": 418799, "epoch": 2492} {"train_loss": -12.196294784545898, "global_step": 418800, "epoch": 2492} {"train_loss": -12.015387535095215, "global_step": 418801, "epoch": 2492} {"train_loss": -12.243001937866211, "global_step": 418802, "epoch": 2492} {"train_loss": -12.333256721496582, "global_step": 418803, "epoch": 2492} {"train_loss": -12.175786972045898, "global_step": 418804, "epoch": 2492} {"train_loss": -12.030082702636719, "global_step": 418805, "epoch": 2492} {"train_loss": -12.474138259887695, "global_step": 418806, "epoch": 2492} {"train_loss": -12.091166496276855, "global_step": 418807, "epoch": 2492} {"train_loss": -12.309307098388672, "global_step": 418808, "epoch": 2492} {"train_loss": -12.385476112365723, "global_step": 418809, "epoch": 2492} {"train_loss": -12.360116958618164, "global_step": 418810, "epoch": 2492} {"train_loss": -12.29194450378418, "global_step": 418811, "epoch": 2492} {"train_loss": -12.445833206176758, "global_step": 418812, "epoch": 2492} {"train_loss": -12.193937301635742, "global_step": 418813, "epoch": 2492} {"train_loss": -12.349672317504883, "global_step": 418814, "epoch": 2492} {"train_loss": -12.422723770141602, "global_step": 418815, "epoch": 2492} {"train_loss": -12.228256225585938, "global_step": 418816, "epoch": 2492} {"train_loss": -12.451055526733398, "global_step": 418817, "epoch": 2492} {"train_loss": -12.357675552368164, "global_step": 418818, "epoch": 2492} {"train_loss": -12.643157005310059, "global_step": 418819, "epoch": 2492} {"train_loss": -12.459945678710938, "global_step": 418820, "epoch": 2492} {"train_loss": -12.202777862548828, "global_step": 418821, "epoch": 2492} {"train_loss": -12.48179817199707, "global_step": 418822, "epoch": 2492} {"train_loss": -11.555004063106718, "global_step": 418823, "epoch": 2492, "val_loss": 307048.375} {"train_loss": -12.604519844055176, "global_step": 418824, "epoch": 2493} {"train_loss": -12.578413963317871, "global_step": 418825, "epoch": 2493} {"train_loss": -12.49172592163086, "global_step": 418826, "epoch": 2493} {"train_loss": -12.616820335388184, "global_step": 418827, "epoch": 2493} {"train_loss": -12.412586212158203, "global_step": 418828, "epoch": 2493} {"train_loss": -12.619375228881836, "global_step": 418829, "epoch": 2493} {"train_loss": -12.556575775146484, "global_step": 418830, "epoch": 2493} {"train_loss": -12.518745422363281, "global_step": 418831, "epoch": 2493} {"train_loss": -12.532882690429688, "global_step": 418832, "epoch": 2493} {"train_loss": -12.632216453552246, "global_step": 418833, "epoch": 2493} {"train_loss": -12.452616691589355, "global_step": 418834, "epoch": 2493} {"train_loss": -12.409860610961914, "global_step": 418835, "epoch": 2493} {"train_loss": -12.576980590820312, "global_step": 418836, "epoch": 2493} {"train_loss": -12.680042266845703, "global_step": 418837, "epoch": 2493} {"train_loss": -12.43287181854248, "global_step": 418838, "epoch": 2493} {"train_loss": -12.531402587890625, "global_step": 418839, "epoch": 2493} {"train_loss": -12.419886589050293, "global_step": 418840, "epoch": 2493} {"train_loss": -12.499147415161133, "global_step": 418841, "epoch": 2493} {"train_loss": -12.521653175354004, "global_step": 418842, "epoch": 2493} {"train_loss": -12.683328628540039, "global_step": 418843, "epoch": 2493} {"train_loss": -12.706028938293457, "global_step": 418844, "epoch": 2493} {"train_loss": -12.685693740844727, "global_step": 418845, "epoch": 2493} {"train_loss": -12.695306777954102, "global_step": 418846, "epoch": 2493} {"train_loss": -12.687767028808594, "global_step": 418847, "epoch": 2493} {"train_loss": -12.707406997680664, "global_step": 418848, "epoch": 2493} {"train_loss": -12.728200912475586, "global_step": 418849, "epoch": 2493} {"train_loss": -12.58077335357666, "global_step": 418850, "epoch": 2493} {"train_loss": -12.618474960327148, "global_step": 418851, "epoch": 2493} {"train_loss": -12.628274917602539, "global_step": 418852, "epoch": 2493} {"train_loss": -12.522505760192871, "global_step": 418853, "epoch": 2493} {"train_loss": -12.574966430664062, "global_step": 418854, "epoch": 2493} {"train_loss": -12.370222091674805, "global_step": 418855, "epoch": 2493} {"train_loss": -12.382949829101562, "global_step": 418856, "epoch": 2493} {"train_loss": -12.513956069946289, "global_step": 418857, "epoch": 2493} {"train_loss": -12.496231079101562, "global_step": 418858, "epoch": 2493} {"train_loss": -12.649925231933594, "global_step": 418859, "epoch": 2493} {"train_loss": -12.250701904296875, "global_step": 418860, "epoch": 2493} {"train_loss": -12.435880661010742, "global_step": 418861, "epoch": 2493} {"train_loss": -12.324633598327637, "global_step": 418862, "epoch": 2493} {"train_loss": -12.569917678833008, "global_step": 418863, "epoch": 2493} {"train_loss": -12.452561378479004, "global_step": 418864, "epoch": 2493} {"train_loss": -12.319228172302246, "global_step": 418865, "epoch": 2493} {"train_loss": -12.250692367553711, "global_step": 418866, "epoch": 2493} {"train_loss": -11.769071578979492, "global_step": 418867, "epoch": 2493} {"train_loss": -11.099397659301758, "global_step": 418868, "epoch": 2493} {"train_loss": -11.421865463256836, "global_step": 418869, "epoch": 2493} {"train_loss": -12.152315139770508, "global_step": 418870, "epoch": 2493} {"train_loss": -10.917485237121582, "global_step": 418871, "epoch": 2493} {"train_loss": -11.211480140686035, "global_step": 418872, "epoch": 2493} {"train_loss": -11.489227294921875, "global_step": 418873, "epoch": 2493} {"train_loss": -11.100770950317383, "global_step": 418874, "epoch": 2493} {"train_loss": -12.14677619934082, "global_step": 418875, "epoch": 2493} {"train_loss": -10.718555450439453, "global_step": 418876, "epoch": 2493} {"train_loss": -12.372573852539062, "global_step": 418877, "epoch": 2493} {"train_loss": -10.961349487304688, "global_step": 418878, "epoch": 2493} {"train_loss": -11.26286506652832, "global_step": 418879, "epoch": 2493} {"train_loss": -11.196430206298828, "global_step": 418880, "epoch": 2493} {"train_loss": -11.086475372314453, "global_step": 418881, "epoch": 2493} {"train_loss": -11.641120910644531, "global_step": 418882, "epoch": 2493} {"train_loss": -10.948710441589355, "global_step": 418883, "epoch": 2493} {"train_loss": -11.768229484558105, "global_step": 418884, "epoch": 2493} {"train_loss": -11.893857955932617, "global_step": 418885, "epoch": 2493} {"train_loss": -11.728696823120117, "global_step": 418886, "epoch": 2493} {"train_loss": -11.167661666870117, "global_step": 418887, "epoch": 2493} {"train_loss": -12.266458511352539, "global_step": 418888, "epoch": 2493} {"train_loss": -10.513378143310547, "global_step": 418889, "epoch": 2493} {"train_loss": -12.13598346710205, "global_step": 418890, "epoch": 2493} {"train_loss": -10.89186954498291, "global_step": 418891, "epoch": 2493} {"train_loss": -11.566875457763672, "global_step": 418892, "epoch": 2493} {"train_loss": -11.960622787475586, "global_step": 418893, "epoch": 2493} {"train_loss": -11.696497917175293, "global_step": 418894, "epoch": 2493} {"train_loss": -12.244548797607422, "global_step": 418895, "epoch": 2493} {"train_loss": -11.54432487487793, "global_step": 418896, "epoch": 2493} {"train_loss": -11.327140808105469, "global_step": 418897, "epoch": 2493} {"train_loss": -12.172552108764648, "global_step": 418898, "epoch": 2493} {"train_loss": -12.182595252990723, "global_step": 418899, "epoch": 2493} {"train_loss": -12.318279266357422, "global_step": 418900, "epoch": 2493} {"train_loss": -11.901994705200195, "global_step": 418901, "epoch": 2493} {"train_loss": -12.338911056518555, "global_step": 418902, "epoch": 2493} {"train_loss": -11.855032920837402, "global_step": 418903, "epoch": 2493} {"train_loss": -12.406856536865234, "global_step": 418904, "epoch": 2493} {"train_loss": -11.95993709564209, "global_step": 418905, "epoch": 2493} {"train_loss": -12.176395416259766, "global_step": 418906, "epoch": 2493} {"train_loss": -12.280391693115234, "global_step": 418907, "epoch": 2493} {"train_loss": -12.16305160522461, "global_step": 418908, "epoch": 2493} {"train_loss": -12.335214614868164, "global_step": 418909, "epoch": 2493} {"train_loss": -12.261190414428711, "global_step": 418910, "epoch": 2493} {"train_loss": -12.477997779846191, "global_step": 418911, "epoch": 2493} {"train_loss": -12.46291732788086, "global_step": 418912, "epoch": 2493} {"train_loss": -12.322980880737305, "global_step": 418913, "epoch": 2493} {"train_loss": -12.608308792114258, "global_step": 418914, "epoch": 2493} {"train_loss": -12.248747825622559, "global_step": 418915, "epoch": 2493} {"train_loss": -11.934913635253906, "global_step": 418916, "epoch": 2493} {"train_loss": -12.517598152160645, "global_step": 418917, "epoch": 2493} {"train_loss": -12.378578186035156, "global_step": 418918, "epoch": 2493} {"train_loss": -12.234514236450195, "global_step": 418919, "epoch": 2493} {"train_loss": -12.40506362915039, "global_step": 418920, "epoch": 2493} {"train_loss": -12.291830062866211, "global_step": 418921, "epoch": 2493} {"train_loss": -12.349050521850586, "global_step": 418922, "epoch": 2493} {"train_loss": -12.427877426147461, "global_step": 418923, "epoch": 2493} {"train_loss": -12.377354621887207, "global_step": 418924, "epoch": 2493} {"train_loss": -12.534421920776367, "global_step": 418925, "epoch": 2493} {"train_loss": -12.36709213256836, "global_step": 418926, "epoch": 2493} {"train_loss": -12.533445358276367, "global_step": 418927, "epoch": 2493} {"train_loss": -12.469141960144043, "global_step": 418928, "epoch": 2493} {"train_loss": -12.446619033813477, "global_step": 418929, "epoch": 2493} {"train_loss": -12.506265640258789, "global_step": 418930, "epoch": 2493} {"train_loss": -12.575775146484375, "global_step": 418931, "epoch": 2493} {"train_loss": -12.529413223266602, "global_step": 418932, "epoch": 2493} {"train_loss": -12.507333755493164, "global_step": 418933, "epoch": 2493} {"train_loss": -12.48156452178955, "global_step": 418934, "epoch": 2493} {"train_loss": -12.686229705810547, "global_step": 418935, "epoch": 2493} {"train_loss": -12.271132469177246, "global_step": 418936, "epoch": 2493} {"train_loss": -12.603988647460938, "global_step": 418937, "epoch": 2493} {"train_loss": -12.648953437805176, "global_step": 418938, "epoch": 2493} {"train_loss": -11.7928466796875, "global_step": 418939, "epoch": 2493} {"train_loss": -12.57077407836914, "global_step": 418940, "epoch": 2493} {"train_loss": -12.223268508911133, "global_step": 418941, "epoch": 2493} {"train_loss": -12.219888687133789, "global_step": 418942, "epoch": 2493} {"train_loss": -12.556957244873047, "global_step": 418943, "epoch": 2493} {"train_loss": -12.2905912399292, "global_step": 418944, "epoch": 2493} {"train_loss": -12.533939361572266, "global_step": 418945, "epoch": 2493} {"train_loss": -12.48049545288086, "global_step": 418946, "epoch": 2493} {"train_loss": -12.406817436218262, "global_step": 418947, "epoch": 2493} {"train_loss": -12.663871765136719, "global_step": 418948, "epoch": 2493} {"train_loss": -12.599324226379395, "global_step": 418949, "epoch": 2493} {"train_loss": -12.18511962890625, "global_step": 418950, "epoch": 2493} {"train_loss": -12.421820640563965, "global_step": 418951, "epoch": 2493} {"train_loss": -12.4522066116333, "global_step": 418952, "epoch": 2493} {"train_loss": -12.12237548828125, "global_step": 418953, "epoch": 2493} {"train_loss": -12.444856643676758, "global_step": 418954, "epoch": 2493} {"train_loss": -12.528434753417969, "global_step": 418955, "epoch": 2493} {"train_loss": -12.13206672668457, "global_step": 418956, "epoch": 2493} {"train_loss": -12.158164978027344, "global_step": 418957, "epoch": 2493} {"train_loss": -12.069215774536133, "global_step": 418958, "epoch": 2493} {"train_loss": -12.409280776977539, "global_step": 418959, "epoch": 2493} {"train_loss": -12.499279022216797, "global_step": 418960, "epoch": 2493} {"train_loss": -12.468605041503906, "global_step": 418961, "epoch": 2493} {"train_loss": -12.700458526611328, "global_step": 418962, "epoch": 2493} {"train_loss": -12.406876564025879, "global_step": 418963, "epoch": 2493} {"train_loss": -12.601346015930176, "global_step": 418964, "epoch": 2493} {"train_loss": -12.747434616088867, "global_step": 418965, "epoch": 2493} {"train_loss": -12.747809410095215, "global_step": 418966, "epoch": 2493} {"train_loss": -12.484153747558594, "global_step": 418967, "epoch": 2493} {"train_loss": -12.65489387512207, "global_step": 418968, "epoch": 2493} {"train_loss": -12.725841522216797, "global_step": 418969, "epoch": 2493} {"train_loss": -12.804610252380371, "global_step": 418970, "epoch": 2493} {"train_loss": -12.952627182006836, "global_step": 418971, "epoch": 2493} {"train_loss": -12.508368492126465, "global_step": 418972, "epoch": 2493} {"train_loss": -12.734977722167969, "global_step": 418973, "epoch": 2493} {"train_loss": -12.714262008666992, "global_step": 418974, "epoch": 2493} {"train_loss": -12.649478912353516, "global_step": 418975, "epoch": 2493} {"train_loss": -11.902522087097168, "global_step": 418976, "epoch": 2493} {"train_loss": -12.291189193725586, "global_step": 418977, "epoch": 2493} {"train_loss": -12.346628189086914, "global_step": 418978, "epoch": 2493} {"train_loss": -12.488574981689453, "global_step": 418979, "epoch": 2493} {"train_loss": -12.142878532409668, "global_step": 418980, "epoch": 2493} {"train_loss": -11.998086929321289, "global_step": 418981, "epoch": 2493} {"train_loss": -11.558124542236328, "global_step": 418982, "epoch": 2493} {"train_loss": -12.154935836791992, "global_step": 418983, "epoch": 2493} {"train_loss": -11.982473373413086, "global_step": 418984, "epoch": 2493} {"train_loss": -12.21791934967041, "global_step": 418985, "epoch": 2493} {"train_loss": -12.06354808807373, "global_step": 418986, "epoch": 2493} {"train_loss": -12.115900993347168, "global_step": 418987, "epoch": 2493} {"train_loss": -11.432721138000488, "global_step": 418988, "epoch": 2493} {"train_loss": -11.770977020263672, "global_step": 418989, "epoch": 2493} {"train_loss": -12.346944808959961, "global_step": 418990, "epoch": 2493} {"train_loss": -12.232547022047497, "global_step": 418991, "epoch": 2493, "val_loss": 307153.3125} {"train_loss": -10.50787353515625, "global_step": 418992, "epoch": 2494} {"train_loss": -10.51784896850586, "global_step": 418993, "epoch": 2494} {"train_loss": -11.81001091003418, "global_step": 418994, "epoch": 2494} {"train_loss": -10.883511543273926, "global_step": 418995, "epoch": 2494} {"train_loss": -9.759462356567383, "global_step": 418996, "epoch": 2494} {"train_loss": -11.811203002929688, "global_step": 418997, "epoch": 2494} {"train_loss": -9.328442573547363, "global_step": 418998, "epoch": 2494} {"train_loss": -8.852863311767578, "global_step": 418999, "epoch": 2494} {"train_loss": -10.26328182220459, "global_step": 419000, "epoch": 2494} {"train_loss": -11.408323287963867, "global_step": 419001, "epoch": 2494} {"train_loss": -10.39737319946289, "global_step": 419002, "epoch": 2494} {"train_loss": -11.460794448852539, "global_step": 419003, "epoch": 2494} {"train_loss": -9.471769332885742, "global_step": 419004, "epoch": 2494} {"train_loss": -11.06718635559082, "global_step": 419005, "epoch": 2494} {"train_loss": -11.083250999450684, "global_step": 419006, "epoch": 2494} {"train_loss": -9.50877571105957, "global_step": 419007, "epoch": 2494} {"train_loss": -11.093318939208984, "global_step": 419008, "epoch": 2494} {"train_loss": -10.247974395751953, "global_step": 419009, "epoch": 2494} {"train_loss": -11.812695503234863, "global_step": 419010, "epoch": 2494} {"train_loss": -9.964519500732422, "global_step": 419011, "epoch": 2494} {"train_loss": -11.392141342163086, "global_step": 419012, "epoch": 2494} {"train_loss": -10.657963752746582, "global_step": 419013, "epoch": 2494} {"train_loss": -11.033482551574707, "global_step": 419014, "epoch": 2494} {"train_loss": -10.0200834274292, "global_step": 419015, "epoch": 2494} {"train_loss": -10.02650260925293, "global_step": 419016, "epoch": 2494} {"train_loss": -11.595611572265625, "global_step": 419017, "epoch": 2494} {"train_loss": -9.211448669433594, "global_step": 419018, "epoch": 2494} {"train_loss": -10.047906875610352, "global_step": 419019, "epoch": 2494} {"train_loss": -11.40599250793457, "global_step": 419020, "epoch": 2494} {"train_loss": -10.469497680664062, "global_step": 419021, "epoch": 2494} {"train_loss": -10.975815773010254, "global_step": 419022, "epoch": 2494} {"train_loss": -10.712815284729004, "global_step": 419023, "epoch": 2494} {"train_loss": -10.691879272460938, "global_step": 419024, "epoch": 2494} {"train_loss": -11.577438354492188, "global_step": 419025, "epoch": 2494} {"train_loss": -9.892155647277832, "global_step": 419026, "epoch": 2494} {"train_loss": -11.269067764282227, "global_step": 419027, "epoch": 2494} {"train_loss": -11.063188552856445, "global_step": 419028, "epoch": 2494} {"train_loss": -10.394794464111328, "global_step": 419029, "epoch": 2494} {"train_loss": -11.57242202758789, "global_step": 419030, "epoch": 2494} {"train_loss": -11.18705940246582, "global_step": 419031, "epoch": 2494} {"train_loss": -11.30853271484375, "global_step": 419032, "epoch": 2494} {"train_loss": -10.839980125427246, "global_step": 419033, "epoch": 2494} {"train_loss": -11.173654556274414, "global_step": 419034, "epoch": 2494} {"train_loss": -11.112344741821289, "global_step": 419035, "epoch": 2494} {"train_loss": -11.542576789855957, "global_step": 419036, "epoch": 2494} {"train_loss": -11.515308380126953, "global_step": 419037, "epoch": 2494} {"train_loss": -11.96922779083252, "global_step": 419038, "epoch": 2494} {"train_loss": -10.874977111816406, "global_step": 419039, "epoch": 2494} {"train_loss": -11.817571640014648, "global_step": 419040, "epoch": 2494} {"train_loss": -11.539813041687012, "global_step": 419041, "epoch": 2494} {"train_loss": -11.497011184692383, "global_step": 419042, "epoch": 2494} {"train_loss": -11.654722213745117, "global_step": 419043, "epoch": 2494} {"train_loss": -11.504384994506836, "global_step": 419044, "epoch": 2494} {"train_loss": -11.77946662902832, "global_step": 419045, "epoch": 2494} {"train_loss": -11.811880111694336, "global_step": 419046, "epoch": 2494} {"train_loss": -11.802166938781738, "global_step": 419047, "epoch": 2494} {"train_loss": -11.945947647094727, "global_step": 419048, "epoch": 2494} {"train_loss": -11.713102340698242, "global_step": 419049, "epoch": 2494} {"train_loss": -11.92683219909668, "global_step": 419050, "epoch": 2494} {"train_loss": -11.648366928100586, "global_step": 419051, "epoch": 2494} {"train_loss": -11.812429428100586, "global_step": 419052, "epoch": 2494} {"train_loss": -11.612715721130371, "global_step": 419053, "epoch": 2494} {"train_loss": -11.935110092163086, "global_step": 419054, "epoch": 2494} {"train_loss": -12.078238487243652, "global_step": 419055, "epoch": 2494} {"train_loss": -11.843927383422852, "global_step": 419056, "epoch": 2494} {"train_loss": -11.912240982055664, "global_step": 419057, "epoch": 2494} {"train_loss": -12.136226654052734, "global_step": 419058, "epoch": 2494} {"train_loss": -11.817752838134766, "global_step": 419059, "epoch": 2494} {"train_loss": -12.309295654296875, "global_step": 419060, "epoch": 2494} {"train_loss": -11.860883712768555, "global_step": 419061, "epoch": 2494} {"train_loss": -12.063791275024414, "global_step": 419062, "epoch": 2494} {"train_loss": -11.98426628112793, "global_step": 419063, "epoch": 2494} {"train_loss": -12.354352951049805, "global_step": 419064, "epoch": 2494} {"train_loss": -11.725946426391602, "global_step": 419065, "epoch": 2494} {"train_loss": -12.1415433883667, "global_step": 419066, "epoch": 2494} {"train_loss": -11.895292282104492, "global_step": 419067, "epoch": 2494} {"train_loss": -12.308412551879883, "global_step": 419068, "epoch": 2494} {"train_loss": -12.291833877563477, "global_step": 419069, "epoch": 2494} {"train_loss": -12.157451629638672, "global_step": 419070, "epoch": 2494} {"train_loss": -12.083300590515137, "global_step": 419071, "epoch": 2494} {"train_loss": -12.236998558044434, "global_step": 419072, "epoch": 2494} {"train_loss": -12.187671661376953, "global_step": 419073, "epoch": 2494} {"train_loss": -12.22604751586914, "global_step": 419074, "epoch": 2494} {"train_loss": -11.845760345458984, "global_step": 419075, "epoch": 2494} {"train_loss": -12.49873161315918, "global_step": 419076, "epoch": 2494} {"train_loss": -12.010034561157227, "global_step": 419077, "epoch": 2494} {"train_loss": -12.416723251342773, "global_step": 419078, "epoch": 2494} {"train_loss": -12.403810501098633, "global_step": 419079, "epoch": 2494} {"train_loss": -12.356399536132812, "global_step": 419080, "epoch": 2494} {"train_loss": -12.389538764953613, "global_step": 419081, "epoch": 2494} {"train_loss": -11.93458366394043, "global_step": 419082, "epoch": 2494} {"train_loss": -12.187593460083008, "global_step": 419083, "epoch": 2494} {"train_loss": -12.034865379333496, "global_step": 419084, "epoch": 2494} {"train_loss": -12.039685249328613, "global_step": 419085, "epoch": 2494} {"train_loss": -11.959541320800781, "global_step": 419086, "epoch": 2494} {"train_loss": -12.051031112670898, "global_step": 419087, "epoch": 2494} {"train_loss": -12.237293243408203, "global_step": 419088, "epoch": 2494} {"train_loss": -12.162939071655273, "global_step": 419089, "epoch": 2494} {"train_loss": -12.024795532226562, "global_step": 419090, "epoch": 2494} {"train_loss": -12.28433609008789, "global_step": 419091, "epoch": 2494} {"train_loss": -12.300209045410156, "global_step": 419092, "epoch": 2494} {"train_loss": -12.287364959716797, "global_step": 419093, "epoch": 2494} {"train_loss": -12.041873931884766, "global_step": 419094, "epoch": 2494} {"train_loss": -12.583051681518555, "global_step": 419095, "epoch": 2494} {"train_loss": -12.432687759399414, "global_step": 419096, "epoch": 2494} {"train_loss": -12.350393295288086, "global_step": 419097, "epoch": 2494} {"train_loss": -12.424089431762695, "global_step": 419098, "epoch": 2494} {"train_loss": -12.186311721801758, "global_step": 419099, "epoch": 2494} {"train_loss": -12.148164749145508, "global_step": 419100, "epoch": 2494} {"train_loss": -12.249356269836426, "global_step": 419101, "epoch": 2494} {"train_loss": -12.087272644042969, "global_step": 419102, "epoch": 2494} {"train_loss": -11.896007537841797, "global_step": 419103, "epoch": 2494} {"train_loss": -12.140174865722656, "global_step": 419104, "epoch": 2494} {"train_loss": -12.198347091674805, "global_step": 419105, "epoch": 2494} {"train_loss": -12.1191987991333, "global_step": 419106, "epoch": 2494} {"train_loss": -12.314830780029297, "global_step": 419107, "epoch": 2494} {"train_loss": -11.875431060791016, "global_step": 419108, "epoch": 2494} {"train_loss": -12.268777847290039, "global_step": 419109, "epoch": 2494} {"train_loss": -11.526823043823242, "global_step": 419110, "epoch": 2494} {"train_loss": -12.102516174316406, "global_step": 419111, "epoch": 2494} {"train_loss": -11.674424171447754, "global_step": 419112, "epoch": 2494} {"train_loss": -12.035979270935059, "global_step": 419113, "epoch": 2494} {"train_loss": -11.647723197937012, "global_step": 419114, "epoch": 2494} {"train_loss": -12.032064437866211, "global_step": 419115, "epoch": 2494} {"train_loss": -11.494056701660156, "global_step": 419116, "epoch": 2494} {"train_loss": -11.947906494140625, "global_step": 419117, "epoch": 2494} {"train_loss": -11.59508228302002, "global_step": 419118, "epoch": 2494} {"train_loss": -11.345751762390137, "global_step": 419119, "epoch": 2494} {"train_loss": -11.853250503540039, "global_step": 419120, "epoch": 2494} {"train_loss": -11.12602710723877, "global_step": 419121, "epoch": 2494} {"train_loss": -12.182772636413574, "global_step": 419122, "epoch": 2494} {"train_loss": -11.697197914123535, "global_step": 419123, "epoch": 2494} {"train_loss": -11.784719467163086, "global_step": 419124, "epoch": 2494} {"train_loss": -11.450298309326172, "global_step": 419125, "epoch": 2494} {"train_loss": -12.153873443603516, "global_step": 419126, "epoch": 2494} {"train_loss": -12.105904579162598, "global_step": 419127, "epoch": 2494} {"train_loss": -12.322981834411621, "global_step": 419128, "epoch": 2494} {"train_loss": -11.928401947021484, "global_step": 419129, "epoch": 2494} {"train_loss": -12.412976264953613, "global_step": 419130, "epoch": 2494} {"train_loss": -12.183348655700684, "global_step": 419131, "epoch": 2494} {"train_loss": -12.221500396728516, "global_step": 419132, "epoch": 2494} {"train_loss": -12.484399795532227, "global_step": 419133, "epoch": 2494} {"train_loss": -12.182029724121094, "global_step": 419134, "epoch": 2494} {"train_loss": -12.211641311645508, "global_step": 419135, "epoch": 2494} {"train_loss": -11.912627220153809, "global_step": 419136, "epoch": 2494} {"train_loss": -12.09621524810791, "global_step": 419137, "epoch": 2494} {"train_loss": -11.873830795288086, "global_step": 419138, "epoch": 2494} {"train_loss": -12.183509826660156, "global_step": 419139, "epoch": 2494} {"train_loss": -11.382291793823242, "global_step": 419140, "epoch": 2494} {"train_loss": -11.609170913696289, "global_step": 419141, "epoch": 2494} {"train_loss": -11.550819396972656, "global_step": 419142, "epoch": 2494} {"train_loss": -12.282369613647461, "global_step": 419143, "epoch": 2494} {"train_loss": -12.153877258300781, "global_step": 419144, "epoch": 2494} {"train_loss": -11.703855514526367, "global_step": 419145, "epoch": 2494} {"train_loss": -12.550304412841797, "global_step": 419146, "epoch": 2494} {"train_loss": -11.927925109863281, "global_step": 419147, "epoch": 2494} {"train_loss": -12.606229782104492, "global_step": 419148, "epoch": 2494} {"train_loss": -11.859825134277344, "global_step": 419149, "epoch": 2494} {"train_loss": -12.191965103149414, "global_step": 419150, "epoch": 2494} {"train_loss": -12.309403419494629, "global_step": 419151, "epoch": 2494} {"train_loss": -11.890661239624023, "global_step": 419152, "epoch": 2494} {"train_loss": -12.407325744628906, "global_step": 419153, "epoch": 2494} {"train_loss": -11.643697738647461, "global_step": 419154, "epoch": 2494} {"train_loss": -12.479888916015625, "global_step": 419155, "epoch": 2494} {"train_loss": -11.859593391418457, "global_step": 419156, "epoch": 2494} {"train_loss": -12.202217102050781, "global_step": 419157, "epoch": 2494} {"train_loss": -12.367742538452148, "global_step": 419158, "epoch": 2494} {"train_loss": -11.667732965378534, "global_step": 419159, "epoch": 2494, "val_loss": 310686.0} {"train_loss": -12.217557907104492, "global_step": 419160, "epoch": 2495} {"train_loss": -12.287559509277344, "global_step": 419161, "epoch": 2495} {"train_loss": -12.343921661376953, "global_step": 419162, "epoch": 2495} {"train_loss": -12.289251327514648, "global_step": 419163, "epoch": 2495} {"train_loss": -12.56403636932373, "global_step": 419164, "epoch": 2495} {"train_loss": -12.645217895507812, "global_step": 419165, "epoch": 2495} {"train_loss": -12.467198371887207, "global_step": 419166, "epoch": 2495} {"train_loss": -12.584606170654297, "global_step": 419167, "epoch": 2495} {"train_loss": -12.392736434936523, "global_step": 419168, "epoch": 2495} {"train_loss": -12.605186462402344, "global_step": 419169, "epoch": 2495} {"train_loss": -12.516656875610352, "global_step": 419170, "epoch": 2495} {"train_loss": -12.61495590209961, "global_step": 419171, "epoch": 2495} {"train_loss": -12.641950607299805, "global_step": 419172, "epoch": 2495} {"train_loss": -12.609170913696289, "global_step": 419173, "epoch": 2495} {"train_loss": -12.668549537658691, "global_step": 419174, "epoch": 2495} {"train_loss": -12.570406913757324, "global_step": 419175, "epoch": 2495} {"train_loss": -12.334165573120117, "global_step": 419176, "epoch": 2495} {"train_loss": -12.704219818115234, "global_step": 419177, "epoch": 2495} {"train_loss": -12.374700546264648, "global_step": 419178, "epoch": 2495} {"train_loss": -12.396100044250488, "global_step": 419179, "epoch": 2495} {"train_loss": -12.64518928527832, "global_step": 419180, "epoch": 2495} {"train_loss": -12.414398193359375, "global_step": 419181, "epoch": 2495} {"train_loss": -12.503047943115234, "global_step": 419182, "epoch": 2495} {"train_loss": -12.616032600402832, "global_step": 419183, "epoch": 2495} {"train_loss": -12.666598320007324, "global_step": 419184, "epoch": 2495} {"train_loss": -12.32931137084961, "global_step": 419185, "epoch": 2495} {"train_loss": -12.577208518981934, "global_step": 419186, "epoch": 2495} {"train_loss": -12.60509967803955, "global_step": 419187, "epoch": 2495} {"train_loss": -12.53342342376709, "global_step": 419188, "epoch": 2495} {"train_loss": -12.543265342712402, "global_step": 419189, "epoch": 2495} {"train_loss": -12.803281784057617, "global_step": 419190, "epoch": 2495} {"train_loss": -12.52423095703125, "global_step": 419191, "epoch": 2495} {"train_loss": -12.652660369873047, "global_step": 419192, "epoch": 2495} {"train_loss": -12.308035850524902, "global_step": 419193, "epoch": 2495} {"train_loss": -12.645587921142578, "global_step": 419194, "epoch": 2495} {"train_loss": -12.508769989013672, "global_step": 419195, "epoch": 2495} {"train_loss": -12.650970458984375, "global_step": 419196, "epoch": 2495} {"train_loss": -12.393917083740234, "global_step": 419197, "epoch": 2495} {"train_loss": -12.775370597839355, "global_step": 419198, "epoch": 2495} {"train_loss": -12.697391510009766, "global_step": 419199, "epoch": 2495} {"train_loss": -12.751392364501953, "global_step": 419200, "epoch": 2495} {"train_loss": -12.701242446899414, "global_step": 419201, "epoch": 2495} {"train_loss": -12.596001625061035, "global_step": 419202, "epoch": 2495} {"train_loss": -12.531704902648926, "global_step": 419203, "epoch": 2495} {"train_loss": -12.354754447937012, "global_step": 419204, "epoch": 2495} {"train_loss": -12.68100357055664, "global_step": 419205, "epoch": 2495} {"train_loss": -11.825698852539062, "global_step": 419206, "epoch": 2495} {"train_loss": -12.042360305786133, "global_step": 419207, "epoch": 2495} {"train_loss": -12.114603042602539, "global_step": 419208, "epoch": 2495} {"train_loss": -12.456153869628906, "global_step": 419209, "epoch": 2495} {"train_loss": -12.144889831542969, "global_step": 419210, "epoch": 2495} {"train_loss": -12.298503875732422, "global_step": 419211, "epoch": 2495} {"train_loss": -12.807120323181152, "global_step": 419212, "epoch": 2495} {"train_loss": -12.821821212768555, "global_step": 419213, "epoch": 2495} {"train_loss": -12.200533866882324, "global_step": 419214, "epoch": 2495} {"train_loss": -12.537862777709961, "global_step": 419215, "epoch": 2495} {"train_loss": -12.689142227172852, "global_step": 419216, "epoch": 2495} {"train_loss": -12.553773880004883, "global_step": 419217, "epoch": 2495} {"train_loss": -12.007037162780762, "global_step": 419218, "epoch": 2495} {"train_loss": -12.023567199707031, "global_step": 419219, "epoch": 2495} {"train_loss": -12.063667297363281, "global_step": 419220, "epoch": 2495} {"train_loss": -11.992776870727539, "global_step": 419221, "epoch": 2495} {"train_loss": -11.94408893585205, "global_step": 419222, "epoch": 2495} {"train_loss": -10.871097564697266, "global_step": 419223, "epoch": 2495} {"train_loss": -11.796716690063477, "global_step": 419224, "epoch": 2495} {"train_loss": -12.122106552124023, "global_step": 419225, "epoch": 2495} {"train_loss": -11.878192901611328, "global_step": 419226, "epoch": 2495} {"train_loss": -11.396761894226074, "global_step": 419227, "epoch": 2495} {"train_loss": -11.325529098510742, "global_step": 419228, "epoch": 2495} {"train_loss": -10.299478530883789, "global_step": 419229, "epoch": 2495} {"train_loss": -10.768442153930664, "global_step": 419230, "epoch": 2495} {"train_loss": -11.028242111206055, "global_step": 419231, "epoch": 2495} {"train_loss": -10.982979774475098, "global_step": 419232, "epoch": 2495} {"train_loss": -10.903936386108398, "global_step": 419233, "epoch": 2495} {"train_loss": -11.382428169250488, "global_step": 419234, "epoch": 2495} {"train_loss": -11.455753326416016, "global_step": 419235, "epoch": 2495} {"train_loss": -11.532620429992676, "global_step": 419236, "epoch": 2495} {"train_loss": -10.92498779296875, "global_step": 419237, "epoch": 2495} {"train_loss": -11.707484245300293, "global_step": 419238, "epoch": 2495} {"train_loss": -12.380879402160645, "global_step": 419239, "epoch": 2495} {"train_loss": -11.386751174926758, "global_step": 419240, "epoch": 2495} {"train_loss": -11.863006591796875, "global_step": 419241, "epoch": 2495} {"train_loss": -11.56277084350586, "global_step": 419242, "epoch": 2495} {"train_loss": -11.978710174560547, "global_step": 419243, "epoch": 2495} {"train_loss": -12.269742965698242, "global_step": 419244, "epoch": 2495} {"train_loss": -12.28497314453125, "global_step": 419245, "epoch": 2495} {"train_loss": -12.075546264648438, "global_step": 419246, "epoch": 2495} {"train_loss": -12.094243049621582, "global_step": 419247, "epoch": 2495} {"train_loss": -12.729008674621582, "global_step": 419248, "epoch": 2495} {"train_loss": -12.461679458618164, "global_step": 419249, "epoch": 2495} {"train_loss": -12.413640022277832, "global_step": 419250, "epoch": 2495} {"train_loss": -12.367767333984375, "global_step": 419251, "epoch": 2495} {"train_loss": -12.643959045410156, "global_step": 419252, "epoch": 2495} {"train_loss": -12.095069885253906, "global_step": 419253, "epoch": 2495} {"train_loss": -12.633817672729492, "global_step": 419254, "epoch": 2495} {"train_loss": -12.076354026794434, "global_step": 419255, "epoch": 2495} {"train_loss": -11.999689102172852, "global_step": 419256, "epoch": 2495} {"train_loss": -12.30784797668457, "global_step": 419257, "epoch": 2495} {"train_loss": -11.71538257598877, "global_step": 419258, "epoch": 2495} {"train_loss": -12.346780776977539, "global_step": 419259, "epoch": 2495} {"train_loss": -11.81637191772461, "global_step": 419260, "epoch": 2495} {"train_loss": -11.884527206420898, "global_step": 419261, "epoch": 2495} {"train_loss": -11.967426300048828, "global_step": 419262, "epoch": 2495} {"train_loss": -11.54294490814209, "global_step": 419263, "epoch": 2495} {"train_loss": -11.94322681427002, "global_step": 419264, "epoch": 2495} {"train_loss": -11.324071884155273, "global_step": 419265, "epoch": 2495} {"train_loss": -11.803167343139648, "global_step": 419266, "epoch": 2495} {"train_loss": -11.210094451904297, "global_step": 419267, "epoch": 2495} {"train_loss": -11.519126892089844, "global_step": 419268, "epoch": 2495} {"train_loss": -11.79084587097168, "global_step": 419269, "epoch": 2495} {"train_loss": -11.52916431427002, "global_step": 419270, "epoch": 2495} {"train_loss": -11.794877052307129, "global_step": 419271, "epoch": 2495} {"train_loss": -10.716958999633789, "global_step": 419272, "epoch": 2495} {"train_loss": -12.526325225830078, "global_step": 419273, "epoch": 2495} {"train_loss": -11.4528226852417, "global_step": 419274, "epoch": 2495} {"train_loss": -12.179584503173828, "global_step": 419275, "epoch": 2495} {"train_loss": -11.912221908569336, "global_step": 419276, "epoch": 2495} {"train_loss": -11.770805358886719, "global_step": 419277, "epoch": 2495} {"train_loss": -12.471762657165527, "global_step": 419278, "epoch": 2495} {"train_loss": -11.966144561767578, "global_step": 419279, "epoch": 2495} {"train_loss": -12.319718360900879, "global_step": 419280, "epoch": 2495} {"train_loss": -12.121002197265625, "global_step": 419281, "epoch": 2495} {"train_loss": -12.096761703491211, "global_step": 419282, "epoch": 2495} {"train_loss": -12.118465423583984, "global_step": 419283, "epoch": 2495} {"train_loss": -11.784433364868164, "global_step": 419284, "epoch": 2495} {"train_loss": -12.169506072998047, "global_step": 419285, "epoch": 2495} {"train_loss": -11.81758975982666, "global_step": 419286, "epoch": 2495} {"train_loss": -12.45633602142334, "global_step": 419287, "epoch": 2495} {"train_loss": -11.879152297973633, "global_step": 419288, "epoch": 2495} {"train_loss": -12.60888385772705, "global_step": 419289, "epoch": 2495} {"train_loss": -12.28660774230957, "global_step": 419290, "epoch": 2495} {"train_loss": -12.345976829528809, "global_step": 419291, "epoch": 2495} {"train_loss": -12.349178314208984, "global_step": 419292, "epoch": 2495} {"train_loss": -12.285966873168945, "global_step": 419293, "epoch": 2495} {"train_loss": -12.311717987060547, "global_step": 419294, "epoch": 2495} {"train_loss": -12.537891387939453, "global_step": 419295, "epoch": 2495} {"train_loss": -12.57986068725586, "global_step": 419296, "epoch": 2495} {"train_loss": -12.168211936950684, "global_step": 419297, "epoch": 2495} {"train_loss": -12.664772033691406, "global_step": 419298, "epoch": 2495} {"train_loss": -12.336791038513184, "global_step": 419299, "epoch": 2495} {"train_loss": -12.24941349029541, "global_step": 419300, "epoch": 2495} {"train_loss": -12.508594512939453, "global_step": 419301, "epoch": 2495} {"train_loss": -12.141653060913086, "global_step": 419302, "epoch": 2495} {"train_loss": -12.262889862060547, "global_step": 419303, "epoch": 2495} {"train_loss": -12.190738677978516, "global_step": 419304, "epoch": 2495} {"train_loss": -12.286077499389648, "global_step": 419305, "epoch": 2495} {"train_loss": -12.266549110412598, "global_step": 419306, "epoch": 2495} {"train_loss": -12.154258728027344, "global_step": 419307, "epoch": 2495} {"train_loss": -12.489864349365234, "global_step": 419308, "epoch": 2495} {"train_loss": -12.254436492919922, "global_step": 419309, "epoch": 2495} {"train_loss": -12.322563171386719, "global_step": 419310, "epoch": 2495} {"train_loss": -12.121550559997559, "global_step": 419311, "epoch": 2495} {"train_loss": -10.604022026062012, "global_step": 419312, "epoch": 2495} {"train_loss": -12.076692581176758, "global_step": 419313, "epoch": 2495} {"train_loss": -10.69853401184082, "global_step": 419314, "epoch": 2495} {"train_loss": -12.115900039672852, "global_step": 419315, "epoch": 2495} {"train_loss": -11.338523864746094, "global_step": 419316, "epoch": 2495} {"train_loss": -11.797006607055664, "global_step": 419317, "epoch": 2495} {"train_loss": -11.891190528869629, "global_step": 419318, "epoch": 2495} {"train_loss": -12.473861694335938, "global_step": 419319, "epoch": 2495} {"train_loss": -11.873403549194336, "global_step": 419320, "epoch": 2495} {"train_loss": -12.62506103515625, "global_step": 419321, "epoch": 2495} {"train_loss": -12.201460838317871, "global_step": 419322, "epoch": 2495} {"train_loss": -12.549619674682617, "global_step": 419323, "epoch": 2495} {"train_loss": -12.679996490478516, "global_step": 419324, "epoch": 2495} {"train_loss": -12.451372146606445, "global_step": 419325, "epoch": 2495} {"train_loss": -12.71778678894043, "global_step": 419326, "epoch": 2495} {"train_loss": -12.15258184501103, "global_step": 419327, "epoch": 2495, "val_loss": 308586.78125, "train_action_mse_error": 0.2076495885848999} {"train_loss": -12.754362106323242, "global_step": 419328, "epoch": 2496} {"train_loss": -12.478087425231934, "global_step": 419329, "epoch": 2496} {"train_loss": -12.734199523925781, "global_step": 419330, "epoch": 2496} {"train_loss": -12.61076831817627, "global_step": 419331, "epoch": 2496} {"train_loss": -12.447469711303711, "global_step": 419332, "epoch": 2496} {"train_loss": -12.774697303771973, "global_step": 419333, "epoch": 2496} {"train_loss": -12.688028335571289, "global_step": 419334, "epoch": 2496} {"train_loss": -12.699298858642578, "global_step": 419335, "epoch": 2496} {"train_loss": -12.613676071166992, "global_step": 419336, "epoch": 2496} {"train_loss": -12.306394577026367, "global_step": 419337, "epoch": 2496} {"train_loss": -12.534449577331543, "global_step": 419338, "epoch": 2496} {"train_loss": -12.509552001953125, "global_step": 419339, "epoch": 2496} {"train_loss": -12.636331558227539, "global_step": 419340, "epoch": 2496} {"train_loss": -12.697198867797852, "global_step": 419341, "epoch": 2496} {"train_loss": -12.682625770568848, "global_step": 419342, "epoch": 2496} {"train_loss": -12.649171829223633, "global_step": 419343, "epoch": 2496} {"train_loss": -12.482813835144043, "global_step": 419344, "epoch": 2496} {"train_loss": -12.469964981079102, "global_step": 419345, "epoch": 2496} {"train_loss": -12.63863754272461, "global_step": 419346, "epoch": 2496} {"train_loss": -12.476219177246094, "global_step": 419347, "epoch": 2496} {"train_loss": -12.586939811706543, "global_step": 419348, "epoch": 2496} {"train_loss": -12.584057807922363, "global_step": 419349, "epoch": 2496} {"train_loss": -12.644610404968262, "global_step": 419350, "epoch": 2496} {"train_loss": -12.386951446533203, "global_step": 419351, "epoch": 2496} {"train_loss": -12.736124992370605, "global_step": 419352, "epoch": 2496} {"train_loss": -12.63278579711914, "global_step": 419353, "epoch": 2496} {"train_loss": -12.840412139892578, "global_step": 419354, "epoch": 2496} {"train_loss": -12.844673156738281, "global_step": 419355, "epoch": 2496} {"train_loss": -12.433478355407715, "global_step": 419356, "epoch": 2496} {"train_loss": -12.026986122131348, "global_step": 419357, "epoch": 2496} {"train_loss": -12.531145095825195, "global_step": 419358, "epoch": 2496} {"train_loss": -12.66252326965332, "global_step": 419359, "epoch": 2496} {"train_loss": -12.180807113647461, "global_step": 419360, "epoch": 2496} {"train_loss": -11.804381370544434, "global_step": 419361, "epoch": 2496} {"train_loss": -12.406290054321289, "global_step": 419362, "epoch": 2496} {"train_loss": -11.533014297485352, "global_step": 419363, "epoch": 2496} {"train_loss": -12.380343437194824, "global_step": 419364, "epoch": 2496} {"train_loss": -12.128304481506348, "global_step": 419365, "epoch": 2496} {"train_loss": -11.414506912231445, "global_step": 419366, "epoch": 2496} {"train_loss": -12.361478805541992, "global_step": 419367, "epoch": 2496} {"train_loss": -11.082866668701172, "global_step": 419368, "epoch": 2496} {"train_loss": -11.731221199035645, "global_step": 419369, "epoch": 2496} {"train_loss": -11.60680103302002, "global_step": 419370, "epoch": 2496} {"train_loss": -11.095327377319336, "global_step": 419371, "epoch": 2496} {"train_loss": -12.306436538696289, "global_step": 419372, "epoch": 2496} {"train_loss": -11.03797435760498, "global_step": 419373, "epoch": 2496} {"train_loss": -12.13901138305664, "global_step": 419374, "epoch": 2496} {"train_loss": -12.185403823852539, "global_step": 419375, "epoch": 2496} {"train_loss": -11.754350662231445, "global_step": 419376, "epoch": 2496} {"train_loss": -12.243499755859375, "global_step": 419377, "epoch": 2496} {"train_loss": -12.030981063842773, "global_step": 419378, "epoch": 2496} {"train_loss": -12.447565078735352, "global_step": 419379, "epoch": 2496} {"train_loss": -12.460278511047363, "global_step": 419380, "epoch": 2496} {"train_loss": -12.392348289489746, "global_step": 419381, "epoch": 2496} {"train_loss": -12.346368789672852, "global_step": 419382, "epoch": 2496} {"train_loss": -11.940698623657227, "global_step": 419383, "epoch": 2496} {"train_loss": -11.773838996887207, "global_step": 419384, "epoch": 2496} {"train_loss": -11.963764190673828, "global_step": 419385, "epoch": 2496} {"train_loss": -11.998778343200684, "global_step": 419386, "epoch": 2496} {"train_loss": -11.91229248046875, "global_step": 419387, "epoch": 2496} {"train_loss": -12.177154541015625, "global_step": 419388, "epoch": 2496} {"train_loss": -12.117937088012695, "global_step": 419389, "epoch": 2496} {"train_loss": -12.374510765075684, "global_step": 419390, "epoch": 2496} {"train_loss": -11.78634262084961, "global_step": 419391, "epoch": 2496} {"train_loss": -12.181121826171875, "global_step": 419392, "epoch": 2496} {"train_loss": -11.719053268432617, "global_step": 419393, "epoch": 2496} {"train_loss": -11.590049743652344, "global_step": 419394, "epoch": 2496} {"train_loss": -12.186588287353516, "global_step": 419395, "epoch": 2496} {"train_loss": -12.229270935058594, "global_step": 419396, "epoch": 2496} {"train_loss": -12.089950561523438, "global_step": 419397, "epoch": 2496} {"train_loss": -12.118680000305176, "global_step": 419398, "epoch": 2496} {"train_loss": -12.089376449584961, "global_step": 419399, "epoch": 2496} {"train_loss": -12.123409271240234, "global_step": 419400, "epoch": 2496} {"train_loss": -12.296892166137695, "global_step": 419401, "epoch": 2496} {"train_loss": -12.43682861328125, "global_step": 419402, "epoch": 2496} {"train_loss": -11.924164772033691, "global_step": 419403, "epoch": 2496} {"train_loss": -11.979764938354492, "global_step": 419404, "epoch": 2496} {"train_loss": -12.066323280334473, "global_step": 419405, "epoch": 2496} {"train_loss": -12.32003402709961, "global_step": 419406, "epoch": 2496} {"train_loss": -11.487156867980957, "global_step": 419407, "epoch": 2496} {"train_loss": -11.823467254638672, "global_step": 419408, "epoch": 2496} {"train_loss": -10.940672874450684, "global_step": 419409, "epoch": 2496} {"train_loss": -10.736696243286133, "global_step": 419410, "epoch": 2496} {"train_loss": -10.739591598510742, "global_step": 419411, "epoch": 2496} {"train_loss": -11.168277740478516, "global_step": 419412, "epoch": 2496} {"train_loss": -8.284680366516113, "global_step": 419413, "epoch": 2496} {"train_loss": -9.408618927001953, "global_step": 419414, "epoch": 2496} {"train_loss": -9.446099281311035, "global_step": 419415, "epoch": 2496} {"train_loss": -9.683448791503906, "global_step": 419416, "epoch": 2496} {"train_loss": -10.368257522583008, "global_step": 419417, "epoch": 2496} {"train_loss": -10.451620101928711, "global_step": 419418, "epoch": 2496} {"train_loss": -11.489383697509766, "global_step": 419419, "epoch": 2496} {"train_loss": -9.1912260055542, "global_step": 419420, "epoch": 2496} {"train_loss": -11.524791717529297, "global_step": 419421, "epoch": 2496} {"train_loss": -10.01576042175293, "global_step": 419422, "epoch": 2496} {"train_loss": -9.341581344604492, "global_step": 419423, "epoch": 2496} {"train_loss": -9.813018798828125, "global_step": 419424, "epoch": 2496} {"train_loss": -9.521829605102539, "global_step": 419425, "epoch": 2496} {"train_loss": -8.627899169921875, "global_step": 419426, "epoch": 2496} {"train_loss": -9.548377990722656, "global_step": 419427, "epoch": 2496} {"train_loss": -9.638745307922363, "global_step": 419428, "epoch": 2496} {"train_loss": -9.356637001037598, "global_step": 419429, "epoch": 2496} {"train_loss": -10.379966735839844, "global_step": 419430, "epoch": 2496} {"train_loss": -10.14555549621582, "global_step": 419431, "epoch": 2496} {"train_loss": -10.069281578063965, "global_step": 419432, "epoch": 2496} {"train_loss": -10.478548049926758, "global_step": 419433, "epoch": 2496} {"train_loss": -10.258406639099121, "global_step": 419434, "epoch": 2496} {"train_loss": -10.29845905303955, "global_step": 419435, "epoch": 2496} {"train_loss": -10.40324592590332, "global_step": 419436, "epoch": 2496} {"train_loss": -10.642168045043945, "global_step": 419437, "epoch": 2496} {"train_loss": -11.175992012023926, "global_step": 419438, "epoch": 2496} {"train_loss": -11.821013450622559, "global_step": 419439, "epoch": 2496} {"train_loss": -10.817300796508789, "global_step": 419440, "epoch": 2496} {"train_loss": -11.73391342163086, "global_step": 419441, "epoch": 2496} {"train_loss": -11.15503978729248, "global_step": 419442, "epoch": 2496} {"train_loss": -11.374307632446289, "global_step": 419443, "epoch": 2496} {"train_loss": -11.961982727050781, "global_step": 419444, "epoch": 2496} {"train_loss": -11.827223777770996, "global_step": 419445, "epoch": 2496} {"train_loss": -11.926429748535156, "global_step": 419446, "epoch": 2496} {"train_loss": -11.66749382019043, "global_step": 419447, "epoch": 2496} {"train_loss": -11.701656341552734, "global_step": 419448, "epoch": 2496} {"train_loss": -11.51714038848877, "global_step": 419449, "epoch": 2496} {"train_loss": -11.968158721923828, "global_step": 419450, "epoch": 2496} {"train_loss": -11.632989883422852, "global_step": 419451, "epoch": 2496} {"train_loss": -12.125147819519043, "global_step": 419452, "epoch": 2496} {"train_loss": -12.307926177978516, "global_step": 419453, "epoch": 2496} {"train_loss": -12.163606643676758, "global_step": 419454, "epoch": 2496} {"train_loss": -12.291688919067383, "global_step": 419455, "epoch": 2496} {"train_loss": -12.116086959838867, "global_step": 419456, "epoch": 2496} {"train_loss": -12.09107780456543, "global_step": 419457, "epoch": 2496} {"train_loss": -12.086282730102539, "global_step": 419458, "epoch": 2496} {"train_loss": -12.294882774353027, "global_step": 419459, "epoch": 2496} {"train_loss": -12.306455612182617, "global_step": 419460, "epoch": 2496} {"train_loss": -11.98582935333252, "global_step": 419461, "epoch": 2496} {"train_loss": -12.210550308227539, "global_step": 419462, "epoch": 2496} {"train_loss": -12.310792922973633, "global_step": 419463, "epoch": 2496} {"train_loss": -12.041980743408203, "global_step": 419464, "epoch": 2496} {"train_loss": -12.36140251159668, "global_step": 419465, "epoch": 2496} {"train_loss": -12.095375061035156, "global_step": 419466, "epoch": 2496} {"train_loss": -12.192713737487793, "global_step": 419467, "epoch": 2496} {"train_loss": -12.311729431152344, "global_step": 419468, "epoch": 2496} {"train_loss": -12.372982025146484, "global_step": 419469, "epoch": 2496} {"train_loss": -12.109601020812988, "global_step": 419470, "epoch": 2496} {"train_loss": -12.192305564880371, "global_step": 419471, "epoch": 2496} {"train_loss": -12.343295097351074, "global_step": 419472, "epoch": 2496} {"train_loss": -12.10751724243164, "global_step": 419473, "epoch": 2496} {"train_loss": -12.184745788574219, "global_step": 419474, "epoch": 2496} {"train_loss": -12.256999969482422, "global_step": 419475, "epoch": 2496} {"train_loss": -12.062560081481934, "global_step": 419476, "epoch": 2496} {"train_loss": -12.390623092651367, "global_step": 419477, "epoch": 2496} {"train_loss": -12.238222122192383, "global_step": 419478, "epoch": 2496} {"train_loss": -12.412433624267578, "global_step": 419479, "epoch": 2496} {"train_loss": -12.123821258544922, "global_step": 419480, "epoch": 2496} {"train_loss": -12.406606674194336, "global_step": 419481, "epoch": 2496} {"train_loss": -12.466209411621094, "global_step": 419482, "epoch": 2496} {"train_loss": -12.341402053833008, "global_step": 419483, "epoch": 2496} {"train_loss": -12.434853553771973, "global_step": 419484, "epoch": 2496} {"train_loss": -12.393289566040039, "global_step": 419485, "epoch": 2496} {"train_loss": -12.58949089050293, "global_step": 419486, "epoch": 2496} {"train_loss": -12.525184631347656, "global_step": 419487, "epoch": 2496} {"train_loss": -12.401416778564453, "global_step": 419488, "epoch": 2496} {"train_loss": -12.52365779876709, "global_step": 419489, "epoch": 2496} {"train_loss": -12.18332290649414, "global_step": 419490, "epoch": 2496} {"train_loss": -12.722955703735352, "global_step": 419491, "epoch": 2496} {"train_loss": -12.230602264404297, "global_step": 419492, "epoch": 2496} {"train_loss": -12.58620548248291, "global_step": 419493, "epoch": 2496} {"train_loss": -12.211755752563477, "global_step": 419494, "epoch": 2496} {"train_loss": -11.815258548373269, "global_step": 419495, "epoch": 2496, "val_loss": 301311.3125} {"train_loss": -12.384989738464355, "global_step": 419496, "epoch": 2497} {"train_loss": -12.082324981689453, "global_step": 419497, "epoch": 2497} {"train_loss": -12.64957046508789, "global_step": 419498, "epoch": 2497} {"train_loss": -12.322036743164062, "global_step": 419499, "epoch": 2497} {"train_loss": -12.614970207214355, "global_step": 419500, "epoch": 2497} {"train_loss": -12.056361198425293, "global_step": 419501, "epoch": 2497} {"train_loss": -12.41744327545166, "global_step": 419502, "epoch": 2497} {"train_loss": -12.081893920898438, "global_step": 419503, "epoch": 2497} {"train_loss": -12.356902122497559, "global_step": 419504, "epoch": 2497} {"train_loss": -12.354884147644043, "global_step": 419505, "epoch": 2497} {"train_loss": -12.080951690673828, "global_step": 419506, "epoch": 2497} {"train_loss": -12.541492462158203, "global_step": 419507, "epoch": 2497} {"train_loss": -11.743568420410156, "global_step": 419508, "epoch": 2497} {"train_loss": -12.523153305053711, "global_step": 419509, "epoch": 2497} {"train_loss": -12.226104736328125, "global_step": 419510, "epoch": 2497} {"train_loss": -12.271692276000977, "global_step": 419511, "epoch": 2497} {"train_loss": -12.397651672363281, "global_step": 419512, "epoch": 2497} {"train_loss": -12.371017456054688, "global_step": 419513, "epoch": 2497} {"train_loss": -12.648551940917969, "global_step": 419514, "epoch": 2497} {"train_loss": -12.226643562316895, "global_step": 419515, "epoch": 2497} {"train_loss": -12.517571449279785, "global_step": 419516, "epoch": 2497} {"train_loss": -11.853322982788086, "global_step": 419517, "epoch": 2497} {"train_loss": -12.34384536743164, "global_step": 419518, "epoch": 2497} {"train_loss": -11.877399444580078, "global_step": 419519, "epoch": 2497} {"train_loss": -12.047346115112305, "global_step": 419520, "epoch": 2497} {"train_loss": -12.67367172241211, "global_step": 419521, "epoch": 2497} {"train_loss": -12.089591979980469, "global_step": 419522, "epoch": 2497} {"train_loss": -12.405743598937988, "global_step": 419523, "epoch": 2497} {"train_loss": -12.436461448669434, "global_step": 419524, "epoch": 2497} {"train_loss": -12.230694770812988, "global_step": 419525, "epoch": 2497} {"train_loss": -12.529253005981445, "global_step": 419526, "epoch": 2497} {"train_loss": -12.687145233154297, "global_step": 419527, "epoch": 2497} {"train_loss": -12.296807289123535, "global_step": 419528, "epoch": 2497} {"train_loss": -12.58633041381836, "global_step": 419529, "epoch": 2497} {"train_loss": -12.686284065246582, "global_step": 419530, "epoch": 2497} {"train_loss": -12.285146713256836, "global_step": 419531, "epoch": 2497} {"train_loss": -12.723119735717773, "global_step": 419532, "epoch": 2497} {"train_loss": -12.800743103027344, "global_step": 419533, "epoch": 2497} {"train_loss": -12.677976608276367, "global_step": 419534, "epoch": 2497} {"train_loss": -12.93868637084961, "global_step": 419535, "epoch": 2497} {"train_loss": -12.606094360351562, "global_step": 419536, "epoch": 2497} {"train_loss": -12.767279624938965, "global_step": 419537, "epoch": 2497} {"train_loss": -13.021496772766113, "global_step": 419538, "epoch": 2497} {"train_loss": -12.713155746459961, "global_step": 419539, "epoch": 2497} {"train_loss": -12.923027038574219, "global_step": 419540, "epoch": 2497} {"train_loss": -12.64915943145752, "global_step": 419541, "epoch": 2497} {"train_loss": -12.677558898925781, "global_step": 419542, "epoch": 2497} {"train_loss": -12.927967071533203, "global_step": 419543, "epoch": 2497} {"train_loss": -12.806736946105957, "global_step": 419544, "epoch": 2497} {"train_loss": -12.927984237670898, "global_step": 419545, "epoch": 2497} {"train_loss": -12.925344467163086, "global_step": 419546, "epoch": 2497} {"train_loss": -12.611184120178223, "global_step": 419547, "epoch": 2497} {"train_loss": -12.775625228881836, "global_step": 419548, "epoch": 2497} {"train_loss": -12.791311264038086, "global_step": 419549, "epoch": 2497} {"train_loss": -12.595776557922363, "global_step": 419550, "epoch": 2497} {"train_loss": -12.768203735351562, "global_step": 419551, "epoch": 2497} {"train_loss": -12.602749824523926, "global_step": 419552, "epoch": 2497} {"train_loss": -12.031761169433594, "global_step": 419553, "epoch": 2497} {"train_loss": -12.286351203918457, "global_step": 419554, "epoch": 2497} {"train_loss": -11.87164306640625, "global_step": 419555, "epoch": 2497} {"train_loss": -12.377375602722168, "global_step": 419556, "epoch": 2497} {"train_loss": -10.449906349182129, "global_step": 419557, "epoch": 2497} {"train_loss": -11.573223114013672, "global_step": 419558, "epoch": 2497} {"train_loss": -12.216443061828613, "global_step": 419559, "epoch": 2497} {"train_loss": -11.618024826049805, "global_step": 419560, "epoch": 2497} {"train_loss": -11.474272727966309, "global_step": 419561, "epoch": 2497} {"train_loss": -12.140710830688477, "global_step": 419562, "epoch": 2497} {"train_loss": -11.61514663696289, "global_step": 419563, "epoch": 2497} {"train_loss": -11.640588760375977, "global_step": 419564, "epoch": 2497} {"train_loss": -11.513389587402344, "global_step": 419565, "epoch": 2497} {"train_loss": -11.614432334899902, "global_step": 419566, "epoch": 2497} {"train_loss": -12.249992370605469, "global_step": 419567, "epoch": 2497} {"train_loss": -9.075596809387207, "global_step": 419568, "epoch": 2497} {"train_loss": -11.106489181518555, "global_step": 419569, "epoch": 2497} {"train_loss": -9.8737211227417, "global_step": 419570, "epoch": 2497} {"train_loss": -10.832341194152832, "global_step": 419571, "epoch": 2497} {"train_loss": -10.886438369750977, "global_step": 419572, "epoch": 2497} {"train_loss": -9.195404052734375, "global_step": 419573, "epoch": 2497} {"train_loss": -11.772929191589355, "global_step": 419574, "epoch": 2497} {"train_loss": -9.162694931030273, "global_step": 419575, "epoch": 2497} {"train_loss": -9.373886108398438, "global_step": 419576, "epoch": 2497} {"train_loss": -10.147211074829102, "global_step": 419577, "epoch": 2497} {"train_loss": -10.401228904724121, "global_step": 419578, "epoch": 2497} {"train_loss": -9.472850799560547, "global_step": 419579, "epoch": 2497} {"train_loss": -11.185111045837402, "global_step": 419580, "epoch": 2497} {"train_loss": -10.082897186279297, "global_step": 419581, "epoch": 2497} {"train_loss": -10.558393478393555, "global_step": 419582, "epoch": 2497} {"train_loss": -8.704147338867188, "global_step": 419583, "epoch": 2497} {"train_loss": -8.70164966583252, "global_step": 419584, "epoch": 2497} {"train_loss": -8.932361602783203, "global_step": 419585, "epoch": 2497} {"train_loss": -10.629297256469727, "global_step": 419586, "epoch": 2497} {"train_loss": -10.459805488586426, "global_step": 419587, "epoch": 2497} {"train_loss": -9.242963790893555, "global_step": 419588, "epoch": 2497} {"train_loss": -10.806293487548828, "global_step": 419589, "epoch": 2497} {"train_loss": -10.642842292785645, "global_step": 419590, "epoch": 2497} {"train_loss": -9.836784362792969, "global_step": 419591, "epoch": 2497} {"train_loss": -10.397607803344727, "global_step": 419592, "epoch": 2497} {"train_loss": -11.431535720825195, "global_step": 419593, "epoch": 2497} {"train_loss": -11.246540069580078, "global_step": 419594, "epoch": 2497} {"train_loss": -10.927070617675781, "global_step": 419595, "epoch": 2497} {"train_loss": -11.491418838500977, "global_step": 419596, "epoch": 2497} {"train_loss": -10.620429992675781, "global_step": 419597, "epoch": 2497} {"train_loss": -11.220983505249023, "global_step": 419598, "epoch": 2497} {"train_loss": -11.40893840789795, "global_step": 419599, "epoch": 2497} {"train_loss": -11.474929809570312, "global_step": 419600, "epoch": 2497} {"train_loss": -11.446205139160156, "global_step": 419601, "epoch": 2497} {"train_loss": -10.808256149291992, "global_step": 419602, "epoch": 2497} {"train_loss": -11.6768217086792, "global_step": 419603, "epoch": 2497} {"train_loss": -10.951053619384766, "global_step": 419604, "epoch": 2497} {"train_loss": -11.956897735595703, "global_step": 419605, "epoch": 2497} {"train_loss": -10.78868579864502, "global_step": 419606, "epoch": 2497} {"train_loss": -12.061616897583008, "global_step": 419607, "epoch": 2497} {"train_loss": -10.826902389526367, "global_step": 419608, "epoch": 2497} {"train_loss": -11.741203308105469, "global_step": 419609, "epoch": 2497} {"train_loss": -11.377610206604004, "global_step": 419610, "epoch": 2497} {"train_loss": -11.967487335205078, "global_step": 419611, "epoch": 2497} {"train_loss": -11.575820922851562, "global_step": 419612, "epoch": 2497} {"train_loss": -12.11397647857666, "global_step": 419613, "epoch": 2497} {"train_loss": -11.661640167236328, "global_step": 419614, "epoch": 2497} {"train_loss": -11.7896728515625, "global_step": 419615, "epoch": 2497} {"train_loss": -11.940345764160156, "global_step": 419616, "epoch": 2497} {"train_loss": -11.821098327636719, "global_step": 419617, "epoch": 2497} {"train_loss": -12.270940780639648, "global_step": 419618, "epoch": 2497} {"train_loss": -11.513410568237305, "global_step": 419619, "epoch": 2497} {"train_loss": -11.781280517578125, "global_step": 419620, "epoch": 2497} {"train_loss": -11.861576080322266, "global_step": 419621, "epoch": 2497} {"train_loss": -11.630802154541016, "global_step": 419622, "epoch": 2497} {"train_loss": -12.137876510620117, "global_step": 419623, "epoch": 2497} {"train_loss": -11.97856330871582, "global_step": 419624, "epoch": 2497} {"train_loss": -11.610995292663574, "global_step": 419625, "epoch": 2497} {"train_loss": -12.30842399597168, "global_step": 419626, "epoch": 2497} {"train_loss": -11.756010055541992, "global_step": 419627, "epoch": 2497} {"train_loss": -11.994924545288086, "global_step": 419628, "epoch": 2497} {"train_loss": -11.667181015014648, "global_step": 419629, "epoch": 2497} {"train_loss": -11.83957576751709, "global_step": 419630, "epoch": 2497} {"train_loss": -11.81876277923584, "global_step": 419631, "epoch": 2497} {"train_loss": -11.903079986572266, "global_step": 419632, "epoch": 2497} {"train_loss": -12.033039093017578, "global_step": 419633, "epoch": 2497} {"train_loss": -12.187067985534668, "global_step": 419634, "epoch": 2497} {"train_loss": -12.086945533752441, "global_step": 419635, "epoch": 2497} {"train_loss": -12.18353271484375, "global_step": 419636, "epoch": 2497} {"train_loss": -12.243520736694336, "global_step": 419637, "epoch": 2497} {"train_loss": -12.367685317993164, "global_step": 419638, "epoch": 2497} {"train_loss": -12.221240997314453, "global_step": 419639, "epoch": 2497} {"train_loss": -12.428787231445312, "global_step": 419640, "epoch": 2497} {"train_loss": -12.161747932434082, "global_step": 419641, "epoch": 2497} {"train_loss": -12.224165916442871, "global_step": 419642, "epoch": 2497} {"train_loss": -12.468585014343262, "global_step": 419643, "epoch": 2497} {"train_loss": -12.228589057922363, "global_step": 419644, "epoch": 2497} {"train_loss": -12.20368766784668, "global_step": 419645, "epoch": 2497} {"train_loss": -12.198429107666016, "global_step": 419646, "epoch": 2497} {"train_loss": -12.222923278808594, "global_step": 419647, "epoch": 2497} {"train_loss": -12.34679889678955, "global_step": 419648, "epoch": 2497} {"train_loss": -12.32331657409668, "global_step": 419649, "epoch": 2497} {"train_loss": -12.095741271972656, "global_step": 419650, "epoch": 2497} {"train_loss": -12.620643615722656, "global_step": 419651, "epoch": 2497} {"train_loss": -12.102838516235352, "global_step": 419652, "epoch": 2497} {"train_loss": -12.42492389678955, "global_step": 419653, "epoch": 2497} {"train_loss": -12.048582077026367, "global_step": 419654, "epoch": 2497} {"train_loss": -12.461737632751465, "global_step": 419655, "epoch": 2497} {"train_loss": -12.140605926513672, "global_step": 419656, "epoch": 2497} {"train_loss": -12.4739351272583, "global_step": 419657, "epoch": 2497} {"train_loss": -12.576053619384766, "global_step": 419658, "epoch": 2497} {"train_loss": -12.515970230102539, "global_step": 419659, "epoch": 2497} {"train_loss": -12.38449478149414, "global_step": 419660, "epoch": 2497} {"train_loss": -12.398475646972656, "global_step": 419661, "epoch": 2497} {"train_loss": -12.379426956176758, "global_step": 419662, "epoch": 2497} {"train_loss": -11.820317359197707, "global_step": 419663, "epoch": 2497, "val_loss": 303721.09375} {"train_loss": -12.318009376525879, "global_step": 419664, "epoch": 2498} {"train_loss": -12.576082229614258, "global_step": 419665, "epoch": 2498} {"train_loss": -12.247703552246094, "global_step": 419666, "epoch": 2498} {"train_loss": -12.391768455505371, "global_step": 419667, "epoch": 2498} {"train_loss": -12.502607345581055, "global_step": 419668, "epoch": 2498} {"train_loss": -12.383813858032227, "global_step": 419669, "epoch": 2498} {"train_loss": -12.59034538269043, "global_step": 419670, "epoch": 2498} {"train_loss": -12.280113220214844, "global_step": 419671, "epoch": 2498} {"train_loss": -12.655617713928223, "global_step": 419672, "epoch": 2498} {"train_loss": -12.509450912475586, "global_step": 419673, "epoch": 2498} {"train_loss": -12.50265884399414, "global_step": 419674, "epoch": 2498} {"train_loss": -12.662700653076172, "global_step": 419675, "epoch": 2498} {"train_loss": -12.339400291442871, "global_step": 419676, "epoch": 2498} {"train_loss": -12.628698348999023, "global_step": 419677, "epoch": 2498} {"train_loss": -12.641210556030273, "global_step": 419678, "epoch": 2498} {"train_loss": -12.499281883239746, "global_step": 419679, "epoch": 2498} {"train_loss": -12.391130447387695, "global_step": 419680, "epoch": 2498} {"train_loss": -12.698476791381836, "global_step": 419681, "epoch": 2498} {"train_loss": -12.41632080078125, "global_step": 419682, "epoch": 2498} {"train_loss": -12.616082191467285, "global_step": 419683, "epoch": 2498} {"train_loss": -12.489203453063965, "global_step": 419684, "epoch": 2498} {"train_loss": -12.850561141967773, "global_step": 419685, "epoch": 2498} {"train_loss": -12.491844177246094, "global_step": 419686, "epoch": 2498} {"train_loss": -12.671491622924805, "global_step": 419687, "epoch": 2498} {"train_loss": -12.638684272766113, "global_step": 419688, "epoch": 2498} {"train_loss": -12.91896915435791, "global_step": 419689, "epoch": 2498} {"train_loss": -12.702476501464844, "global_step": 419690, "epoch": 2498} {"train_loss": -12.716780662536621, "global_step": 419691, "epoch": 2498} {"train_loss": -12.786544799804688, "global_step": 419692, "epoch": 2498} {"train_loss": -12.748947143554688, "global_step": 419693, "epoch": 2498} {"train_loss": -12.761590003967285, "global_step": 419694, "epoch": 2498} {"train_loss": -12.826629638671875, "global_step": 419695, "epoch": 2498} {"train_loss": -12.810964584350586, "global_step": 419696, "epoch": 2498} {"train_loss": -12.837654113769531, "global_step": 419697, "epoch": 2498} {"train_loss": -12.667360305786133, "global_step": 419698, "epoch": 2498} {"train_loss": -12.53329086303711, "global_step": 419699, "epoch": 2498} {"train_loss": -12.929893493652344, "global_step": 419700, "epoch": 2498} {"train_loss": -12.655994415283203, "global_step": 419701, "epoch": 2498} {"train_loss": -12.846988677978516, "global_step": 419702, "epoch": 2498} {"train_loss": -12.797532081604004, "global_step": 419703, "epoch": 2498} {"train_loss": -12.815547943115234, "global_step": 419704, "epoch": 2498} {"train_loss": -12.70025634765625, "global_step": 419705, "epoch": 2498} {"train_loss": -12.795022964477539, "global_step": 419706, "epoch": 2498} {"train_loss": -12.671854019165039, "global_step": 419707, "epoch": 2498} {"train_loss": -12.825647354125977, "global_step": 419708, "epoch": 2498} {"train_loss": -12.711185455322266, "global_step": 419709, "epoch": 2498} {"train_loss": -12.746437072753906, "global_step": 419710, "epoch": 2498} {"train_loss": -12.102373123168945, "global_step": 419711, "epoch": 2498} {"train_loss": -11.888185501098633, "global_step": 419712, "epoch": 2498} {"train_loss": -11.319944381713867, "global_step": 419713, "epoch": 2498} {"train_loss": -12.481396675109863, "global_step": 419714, "epoch": 2498} {"train_loss": -12.486856460571289, "global_step": 419715, "epoch": 2498} {"train_loss": -12.34811782836914, "global_step": 419716, "epoch": 2498} {"train_loss": -12.704286575317383, "global_step": 419717, "epoch": 2498} {"train_loss": -12.52820873260498, "global_step": 419718, "epoch": 2498} {"train_loss": -12.380331039428711, "global_step": 419719, "epoch": 2498} {"train_loss": -12.530549049377441, "global_step": 419720, "epoch": 2498} {"train_loss": -12.597585678100586, "global_step": 419721, "epoch": 2498} {"train_loss": -12.689330101013184, "global_step": 419722, "epoch": 2498} {"train_loss": -12.495314598083496, "global_step": 419723, "epoch": 2498} {"train_loss": -12.404762268066406, "global_step": 419724, "epoch": 2498} {"train_loss": -12.396852493286133, "global_step": 419725, "epoch": 2498} {"train_loss": -12.438858032226562, "global_step": 419726, "epoch": 2498} {"train_loss": -12.375404357910156, "global_step": 419727, "epoch": 2498} {"train_loss": -12.635634422302246, "global_step": 419728, "epoch": 2498} {"train_loss": -12.232894897460938, "global_step": 419729, "epoch": 2498} {"train_loss": -11.23117446899414, "global_step": 419730, "epoch": 2498} {"train_loss": -12.00548267364502, "global_step": 419731, "epoch": 2498} {"train_loss": -12.178327560424805, "global_step": 419732, "epoch": 2498} {"train_loss": -11.944478988647461, "global_step": 419733, "epoch": 2498} {"train_loss": -11.5438232421875, "global_step": 419734, "epoch": 2498} {"train_loss": -12.068167686462402, "global_step": 419735, "epoch": 2498} {"train_loss": -11.819295883178711, "global_step": 419736, "epoch": 2498} {"train_loss": -11.328474998474121, "global_step": 419737, "epoch": 2498} {"train_loss": -11.928319931030273, "global_step": 419738, "epoch": 2498} {"train_loss": -9.067712783813477, "global_step": 419739, "epoch": 2498} {"train_loss": -12.364066123962402, "global_step": 419740, "epoch": 2498} {"train_loss": -11.340097427368164, "global_step": 419741, "epoch": 2498} {"train_loss": -11.976795196533203, "global_step": 419742, "epoch": 2498} {"train_loss": -12.161508560180664, "global_step": 419743, "epoch": 2498} {"train_loss": -11.151240348815918, "global_step": 419744, "epoch": 2498} {"train_loss": -10.935356140136719, "global_step": 419745, "epoch": 2498} {"train_loss": -11.317298889160156, "global_step": 419746, "epoch": 2498} {"train_loss": -12.084447860717773, "global_step": 419747, "epoch": 2498} {"train_loss": -11.505571365356445, "global_step": 419748, "epoch": 2498} {"train_loss": -12.405189514160156, "global_step": 419749, "epoch": 2498} {"train_loss": -11.959508895874023, "global_step": 419750, "epoch": 2498} {"train_loss": -11.638545989990234, "global_step": 419751, "epoch": 2498} {"train_loss": -10.301856994628906, "global_step": 419752, "epoch": 2498} {"train_loss": -11.828786849975586, "global_step": 419753, "epoch": 2498} {"train_loss": -11.566579818725586, "global_step": 419754, "epoch": 2498} {"train_loss": -10.386149406433105, "global_step": 419755, "epoch": 2498} {"train_loss": -11.993341445922852, "global_step": 419756, "epoch": 2498} {"train_loss": -11.277971267700195, "global_step": 419757, "epoch": 2498} {"train_loss": -10.697443008422852, "global_step": 419758, "epoch": 2498} {"train_loss": -12.119375228881836, "global_step": 419759, "epoch": 2498} {"train_loss": -11.398083686828613, "global_step": 419760, "epoch": 2498} {"train_loss": -12.206306457519531, "global_step": 419761, "epoch": 2498} {"train_loss": -11.220848083496094, "global_step": 419762, "epoch": 2498} {"train_loss": -11.981888771057129, "global_step": 419763, "epoch": 2498} {"train_loss": -12.012674331665039, "global_step": 419764, "epoch": 2498} {"train_loss": -12.002815246582031, "global_step": 419765, "epoch": 2498} {"train_loss": -12.296661376953125, "global_step": 419766, "epoch": 2498} {"train_loss": -11.822433471679688, "global_step": 419767, "epoch": 2498} {"train_loss": -12.202869415283203, "global_step": 419768, "epoch": 2498} {"train_loss": -12.088808059692383, "global_step": 419769, "epoch": 2498} {"train_loss": -11.60096549987793, "global_step": 419770, "epoch": 2498} {"train_loss": -12.388816833496094, "global_step": 419771, "epoch": 2498} {"train_loss": -12.281007766723633, "global_step": 419772, "epoch": 2498} {"train_loss": -12.338920593261719, "global_step": 419773, "epoch": 2498} {"train_loss": -12.279385566711426, "global_step": 419774, "epoch": 2498} {"train_loss": -12.250986099243164, "global_step": 419775, "epoch": 2498} {"train_loss": -12.561591148376465, "global_step": 419776, "epoch": 2498} {"train_loss": -12.276046752929688, "global_step": 419777, "epoch": 2498} {"train_loss": -12.439201354980469, "global_step": 419778, "epoch": 2498} {"train_loss": -12.571531295776367, "global_step": 419779, "epoch": 2498} {"train_loss": -12.484789848327637, "global_step": 419780, "epoch": 2498} {"train_loss": -12.495401382446289, "global_step": 419781, "epoch": 2498} {"train_loss": -12.156801223754883, "global_step": 419782, "epoch": 2498} {"train_loss": -12.69508171081543, "global_step": 419783, "epoch": 2498} {"train_loss": -12.52374267578125, "global_step": 419784, "epoch": 2498} {"train_loss": -12.253060340881348, "global_step": 419785, "epoch": 2498} {"train_loss": -12.666590690612793, "global_step": 419786, "epoch": 2498} {"train_loss": -12.111896514892578, "global_step": 419787, "epoch": 2498} {"train_loss": -12.649656295776367, "global_step": 419788, "epoch": 2498} {"train_loss": -12.275720596313477, "global_step": 419789, "epoch": 2498} {"train_loss": -12.535018920898438, "global_step": 419790, "epoch": 2498} {"train_loss": -12.257762908935547, "global_step": 419791, "epoch": 2498} {"train_loss": -12.612710952758789, "global_step": 419792, "epoch": 2498} {"train_loss": -11.767374038696289, "global_step": 419793, "epoch": 2498} {"train_loss": -12.543272018432617, "global_step": 419794, "epoch": 2498} {"train_loss": -12.153234481811523, "global_step": 419795, "epoch": 2498} {"train_loss": -12.061885833740234, "global_step": 419796, "epoch": 2498} {"train_loss": -12.191129684448242, "global_step": 419797, "epoch": 2498} {"train_loss": -12.20082950592041, "global_step": 419798, "epoch": 2498} {"train_loss": -12.173922538757324, "global_step": 419799, "epoch": 2498} {"train_loss": -12.132246017456055, "global_step": 419800, "epoch": 2498} {"train_loss": -11.576346397399902, "global_step": 419801, "epoch": 2498} {"train_loss": -12.046170234680176, "global_step": 419802, "epoch": 2498} {"train_loss": -11.380197525024414, "global_step": 419803, "epoch": 2498} {"train_loss": -11.362726211547852, "global_step": 419804, "epoch": 2498} {"train_loss": -12.23673152923584, "global_step": 419805, "epoch": 2498} {"train_loss": -11.356135368347168, "global_step": 419806, "epoch": 2498} {"train_loss": -11.681719779968262, "global_step": 419807, "epoch": 2498} {"train_loss": -11.592945098876953, "global_step": 419808, "epoch": 2498} {"train_loss": -12.282638549804688, "global_step": 419809, "epoch": 2498} {"train_loss": -11.819784164428711, "global_step": 419810, "epoch": 2498} {"train_loss": -12.072872161865234, "global_step": 419811, "epoch": 2498} {"train_loss": -11.303888320922852, "global_step": 419812, "epoch": 2498} {"train_loss": -11.084300994873047, "global_step": 419813, "epoch": 2498} {"train_loss": -11.766223907470703, "global_step": 419814, "epoch": 2498} {"train_loss": -10.03909969329834, "global_step": 419815, "epoch": 2498} {"train_loss": -10.854780197143555, "global_step": 419816, "epoch": 2498} {"train_loss": -10.702892303466797, "global_step": 419817, "epoch": 2498} {"train_loss": -10.330177307128906, "global_step": 419818, "epoch": 2498} {"train_loss": -10.423142433166504, "global_step": 419819, "epoch": 2498} {"train_loss": -11.467906951904297, "global_step": 419820, "epoch": 2498} {"train_loss": -10.523624420166016, "global_step": 419821, "epoch": 2498} {"train_loss": -10.877164840698242, "global_step": 419822, "epoch": 2498} {"train_loss": -11.491954803466797, "global_step": 419823, "epoch": 2498} {"train_loss": -10.849839210510254, "global_step": 419824, "epoch": 2498} {"train_loss": -10.453250885009766, "global_step": 419825, "epoch": 2498} {"train_loss": -12.13375473022461, "global_step": 419826, "epoch": 2498} {"train_loss": -10.04429817199707, "global_step": 419827, "epoch": 2498} {"train_loss": -11.613584518432617, "global_step": 419828, "epoch": 2498} {"train_loss": -10.965677261352539, "global_step": 419829, "epoch": 2498} {"train_loss": -11.425712585449219, "global_step": 419830, "epoch": 2498} {"train_loss": -12.053213216009594, "global_step": 419831, "epoch": 2498, "val_loss": 307510.25} {"train_loss": -12.126880645751953, "global_step": 419832, "epoch": 2499} {"train_loss": -11.819891929626465, "global_step": 419833, "epoch": 2499} {"train_loss": -12.219305038452148, "global_step": 419834, "epoch": 2499} {"train_loss": -11.166847229003906, "global_step": 419835, "epoch": 2499} {"train_loss": -12.051507949829102, "global_step": 419836, "epoch": 2499} {"train_loss": -11.815760612487793, "global_step": 419837, "epoch": 2499} {"train_loss": -11.781782150268555, "global_step": 419838, "epoch": 2499} {"train_loss": -11.892410278320312, "global_step": 419839, "epoch": 2499} {"train_loss": -12.067407608032227, "global_step": 419840, "epoch": 2499} {"train_loss": -11.522047996520996, "global_step": 419841, "epoch": 2499} {"train_loss": -12.26254940032959, "global_step": 419842, "epoch": 2499} {"train_loss": -11.365758895874023, "global_step": 419843, "epoch": 2499} {"train_loss": -11.793294906616211, "global_step": 419844, "epoch": 2499} {"train_loss": -11.281658172607422, "global_step": 419845, "epoch": 2499} {"train_loss": -11.557258605957031, "global_step": 419846, "epoch": 2499} {"train_loss": -11.282346725463867, "global_step": 419847, "epoch": 2499} {"train_loss": -11.762093544006348, "global_step": 419848, "epoch": 2499} {"train_loss": -11.229915618896484, "global_step": 419849, "epoch": 2499} {"train_loss": -12.008515357971191, "global_step": 419850, "epoch": 2499} {"train_loss": -11.874870300292969, "global_step": 419851, "epoch": 2499} {"train_loss": -11.598050117492676, "global_step": 419852, "epoch": 2499} {"train_loss": -11.62637710571289, "global_step": 419853, "epoch": 2499} {"train_loss": -11.450065612792969, "global_step": 419854, "epoch": 2499} {"train_loss": -11.634471893310547, "global_step": 419855, "epoch": 2499} {"train_loss": -11.180020332336426, "global_step": 419856, "epoch": 2499} {"train_loss": -11.89973258972168, "global_step": 419857, "epoch": 2499} {"train_loss": -11.415946006774902, "global_step": 419858, "epoch": 2499} {"train_loss": -12.076017379760742, "global_step": 419859, "epoch": 2499} {"train_loss": -11.71628189086914, "global_step": 419860, "epoch": 2499} {"train_loss": -12.00655746459961, "global_step": 419861, "epoch": 2499} {"train_loss": -11.55185604095459, "global_step": 419862, "epoch": 2499} {"train_loss": -12.051204681396484, "global_step": 419863, "epoch": 2499} {"train_loss": -11.813253402709961, "global_step": 419864, "epoch": 2499} {"train_loss": -12.158909797668457, "global_step": 419865, "epoch": 2499} {"train_loss": -11.709535598754883, "global_step": 419866, "epoch": 2499} {"train_loss": -12.125996589660645, "global_step": 419867, "epoch": 2499} {"train_loss": -11.854158401489258, "global_step": 419868, "epoch": 2499} {"train_loss": -12.2758207321167, "global_step": 419869, "epoch": 2499} {"train_loss": -12.220444679260254, "global_step": 419870, "epoch": 2499} {"train_loss": -12.458345413208008, "global_step": 419871, "epoch": 2499} {"train_loss": -12.282971382141113, "global_step": 419872, "epoch": 2499} {"train_loss": -12.557010650634766, "global_step": 419873, "epoch": 2499} {"train_loss": -12.233390808105469, "global_step": 419874, "epoch": 2499} {"train_loss": -12.167526245117188, "global_step": 419875, "epoch": 2499} {"train_loss": -12.330522537231445, "global_step": 419876, "epoch": 2499} {"train_loss": -12.147604942321777, "global_step": 419877, "epoch": 2499} {"train_loss": -12.514530181884766, "global_step": 419878, "epoch": 2499} {"train_loss": -12.296881675720215, "global_step": 419879, "epoch": 2499} {"train_loss": -12.261762619018555, "global_step": 419880, "epoch": 2499} {"train_loss": -12.553290367126465, "global_step": 419881, "epoch": 2499} {"train_loss": -12.487907409667969, "global_step": 419882, "epoch": 2499} {"train_loss": -12.456478118896484, "global_step": 419883, "epoch": 2499} {"train_loss": -12.536575317382812, "global_step": 419884, "epoch": 2499} {"train_loss": -12.558113098144531, "global_step": 419885, "epoch": 2499} {"train_loss": -12.607319831848145, "global_step": 419886, "epoch": 2499} {"train_loss": -12.800337791442871, "global_step": 419887, "epoch": 2499} {"train_loss": -12.586832046508789, "global_step": 419888, "epoch": 2499} {"train_loss": -12.622074127197266, "global_step": 419889, "epoch": 2499} {"train_loss": -12.440118789672852, "global_step": 419890, "epoch": 2499} {"train_loss": -12.675664901733398, "global_step": 419891, "epoch": 2499} {"train_loss": -12.634174346923828, "global_step": 419892, "epoch": 2499} {"train_loss": -12.750971794128418, "global_step": 419893, "epoch": 2499} {"train_loss": -12.715682983398438, "global_step": 419894, "epoch": 2499} {"train_loss": -12.511207580566406, "global_step": 419895, "epoch": 2499} {"train_loss": -12.731635093688965, "global_step": 419896, "epoch": 2499} {"train_loss": -12.636859893798828, "global_step": 419897, "epoch": 2499} {"train_loss": -12.887439727783203, "global_step": 419898, "epoch": 2499} {"train_loss": -12.508499145507812, "global_step": 419899, "epoch": 2499} {"train_loss": -12.409299850463867, "global_step": 419900, "epoch": 2499} {"train_loss": -12.511491775512695, "global_step": 419901, "epoch": 2499} {"train_loss": -12.487604141235352, "global_step": 419902, "epoch": 2499} {"train_loss": -12.466270446777344, "global_step": 419903, "epoch": 2499} {"train_loss": -11.844599723815918, "global_step": 419904, "epoch": 2499} {"train_loss": -12.543560028076172, "global_step": 419905, "epoch": 2499} {"train_loss": -12.457712173461914, "global_step": 419906, "epoch": 2499} {"train_loss": -11.439937591552734, "global_step": 419907, "epoch": 2499} {"train_loss": -11.909261703491211, "global_step": 419908, "epoch": 2499} {"train_loss": -12.372417449951172, "global_step": 419909, "epoch": 2499} {"train_loss": -11.172087669372559, "global_step": 419910, "epoch": 2499} {"train_loss": -11.187196731567383, "global_step": 419911, "epoch": 2499} {"train_loss": -12.2620210647583, "global_step": 419912, "epoch": 2499} {"train_loss": -10.214009284973145, "global_step": 419913, "epoch": 2499} {"train_loss": -9.777359962463379, "global_step": 419914, "epoch": 2499} {"train_loss": -10.113784790039062, "global_step": 419915, "epoch": 2499} {"train_loss": -8.827844619750977, "global_step": 419916, "epoch": 2499} {"train_loss": -9.438286781311035, "global_step": 419917, "epoch": 2499} {"train_loss": -9.533018112182617, "global_step": 419918, "epoch": 2499} {"train_loss": -9.616971015930176, "global_step": 419919, "epoch": 2499} {"train_loss": -11.509971618652344, "global_step": 419920, "epoch": 2499} {"train_loss": -9.573362350463867, "global_step": 419921, "epoch": 2499} {"train_loss": -11.173763275146484, "global_step": 419922, "epoch": 2499} {"train_loss": -9.330095291137695, "global_step": 419923, "epoch": 2499} {"train_loss": -10.495327949523926, "global_step": 419924, "epoch": 2499} {"train_loss": -11.25562858581543, "global_step": 419925, "epoch": 2499} {"train_loss": -9.047111511230469, "global_step": 419926, "epoch": 2499} {"train_loss": -11.8704833984375, "global_step": 419927, "epoch": 2499} {"train_loss": -9.848122596740723, "global_step": 419928, "epoch": 2499} {"train_loss": -10.455324172973633, "global_step": 419929, "epoch": 2499} {"train_loss": -11.182992935180664, "global_step": 419930, "epoch": 2499} {"train_loss": -10.223440170288086, "global_step": 419931, "epoch": 2499} {"train_loss": -11.228538513183594, "global_step": 419932, "epoch": 2499} {"train_loss": -11.046245574951172, "global_step": 419933, "epoch": 2499} {"train_loss": -11.65146255493164, "global_step": 419934, "epoch": 2499} {"train_loss": -11.668595314025879, "global_step": 419935, "epoch": 2499} {"train_loss": -10.895029067993164, "global_step": 419936, "epoch": 2499} {"train_loss": -12.00248908996582, "global_step": 419937, "epoch": 2499} {"train_loss": -11.341432571411133, "global_step": 419938, "epoch": 2499} {"train_loss": -10.848926544189453, "global_step": 419939, "epoch": 2499} {"train_loss": -11.932955741882324, "global_step": 419940, "epoch": 2499} {"train_loss": -11.147229194641113, "global_step": 419941, "epoch": 2499} {"train_loss": -11.942678451538086, "global_step": 419942, "epoch": 2499} {"train_loss": -11.491334915161133, "global_step": 419943, "epoch": 2499} {"train_loss": -11.325685501098633, "global_step": 419944, "epoch": 2499} {"train_loss": -11.993602752685547, "global_step": 419945, "epoch": 2499} {"train_loss": -11.6978759765625, "global_step": 419946, "epoch": 2499} {"train_loss": -12.197393417358398, "global_step": 419947, "epoch": 2499} {"train_loss": -11.925821304321289, "global_step": 419948, "epoch": 2499} {"train_loss": -11.912834167480469, "global_step": 419949, "epoch": 2499} {"train_loss": -12.146905899047852, "global_step": 419950, "epoch": 2499} {"train_loss": -11.680328369140625, "global_step": 419951, "epoch": 2499} {"train_loss": -12.141975402832031, "global_step": 419952, "epoch": 2499} {"train_loss": -12.140377044677734, "global_step": 419953, "epoch": 2499} {"train_loss": -12.30769157409668, "global_step": 419954, "epoch": 2499} {"train_loss": -12.152458190917969, "global_step": 419955, "epoch": 2499} {"train_loss": -12.026555061340332, "global_step": 419956, "epoch": 2499} {"train_loss": -12.164252281188965, "global_step": 419957, "epoch": 2499} {"train_loss": -12.237874984741211, "global_step": 419958, "epoch": 2499} {"train_loss": -12.285749435424805, "global_step": 419959, "epoch": 2499} {"train_loss": -12.365906715393066, "global_step": 419960, "epoch": 2499} {"train_loss": -12.203779220581055, "global_step": 419961, "epoch": 2499} {"train_loss": -12.181779861450195, "global_step": 419962, "epoch": 2499} {"train_loss": -12.080513000488281, "global_step": 419963, "epoch": 2499} {"train_loss": -12.50955867767334, "global_step": 419964, "epoch": 2499} {"train_loss": -12.182899475097656, "global_step": 419965, "epoch": 2499} {"train_loss": -12.118075370788574, "global_step": 419966, "epoch": 2499} {"train_loss": -12.355104446411133, "global_step": 419967, "epoch": 2499} {"train_loss": -12.45467758178711, "global_step": 419968, "epoch": 2499} {"train_loss": -12.295490264892578, "global_step": 419969, "epoch": 2499} {"train_loss": -12.012832641601562, "global_step": 419970, "epoch": 2499} {"train_loss": -12.284247398376465, "global_step": 419971, "epoch": 2499} {"train_loss": -12.061092376708984, "global_step": 419972, "epoch": 2499} {"train_loss": -12.407930374145508, "global_step": 419973, "epoch": 2499} {"train_loss": -12.046930313110352, "global_step": 419974, "epoch": 2499} {"train_loss": -12.402822494506836, "global_step": 419975, "epoch": 2499} {"train_loss": -12.253896713256836, "global_step": 419976, "epoch": 2499} {"train_loss": -12.179142951965332, "global_step": 419977, "epoch": 2499} {"train_loss": -12.426198959350586, "global_step": 419978, "epoch": 2499} {"train_loss": -12.045286178588867, "global_step": 419979, "epoch": 2499} {"train_loss": -12.49349594116211, "global_step": 419980, "epoch": 2499} {"train_loss": -12.306140899658203, "global_step": 419981, "epoch": 2499} {"train_loss": -12.195211410522461, "global_step": 419982, "epoch": 2499} {"train_loss": -12.430349349975586, "global_step": 419983, "epoch": 2499} {"train_loss": -12.065006256103516, "global_step": 419984, "epoch": 2499} {"train_loss": -12.37458610534668, "global_step": 419985, "epoch": 2499} {"train_loss": -12.407888412475586, "global_step": 419986, "epoch": 2499} {"train_loss": -12.39854907989502, "global_step": 419987, "epoch": 2499} {"train_loss": -12.587114334106445, "global_step": 419988, "epoch": 2499} {"train_loss": -12.406492233276367, "global_step": 419989, "epoch": 2499} {"train_loss": -12.647638320922852, "global_step": 419990, "epoch": 2499} {"train_loss": -12.510856628417969, "global_step": 419991, "epoch": 2499} {"train_loss": -12.238563537597656, "global_step": 419992, "epoch": 2499} {"train_loss": -12.50875473022461, "global_step": 419993, "epoch": 2499} {"train_loss": -12.125428199768066, "global_step": 419994, "epoch": 2499} {"train_loss": -12.527545928955078, "global_step": 419995, "epoch": 2499} {"train_loss": -12.353076934814453, "global_step": 419996, "epoch": 2499} {"train_loss": -12.356182098388672, "global_step": 419997, "epoch": 2499} {"train_loss": -12.421762466430664, "global_step": 419998, "epoch": 2499} {"train_loss": -11.873892273221697, "global_step": 419999, "epoch": 2499, "val_loss": 304382.375} {"train_loss": -12.414010047912598, "global_step": 420000, "epoch": 2500} {"train_loss": -12.27688217163086, "global_step": 420001, "epoch": 2500} {"train_loss": -12.646651268005371, "global_step": 420002, "epoch": 2500} {"train_loss": -12.28274154663086, "global_step": 420003, "epoch": 2500} {"train_loss": -12.401646614074707, "global_step": 420004, "epoch": 2500} {"train_loss": -12.437088966369629, "global_step": 420005, "epoch": 2500} {"train_loss": -12.651249885559082, "global_step": 420006, "epoch": 2500} {"train_loss": -12.514810562133789, "global_step": 420007, "epoch": 2500} {"train_loss": -12.588525772094727, "global_step": 420008, "epoch": 2500} {"train_loss": -12.562994003295898, "global_step": 420009, "epoch": 2500} {"train_loss": -12.68231201171875, "global_step": 420010, "epoch": 2500} {"train_loss": -12.589212417602539, "global_step": 420011, "epoch": 2500} {"train_loss": -12.527610778808594, "global_step": 420012, "epoch": 2500} {"train_loss": -12.472356796264648, "global_step": 420013, "epoch": 2500} {"train_loss": -12.591114044189453, "global_step": 420014, "epoch": 2500} {"train_loss": -12.36279296875, "global_step": 420015, "epoch": 2500} {"train_loss": -12.566767692565918, "global_step": 420016, "epoch": 2500} {"train_loss": -12.496694564819336, "global_step": 420017, "epoch": 2500} {"train_loss": -12.665313720703125, "global_step": 420018, "epoch": 2500} {"train_loss": -12.402978897094727, "global_step": 420019, "epoch": 2500} {"train_loss": -12.342496871948242, "global_step": 420020, "epoch": 2500} {"train_loss": -12.914985656738281, "global_step": 420021, "epoch": 2500} {"train_loss": -12.644023895263672, "global_step": 420022, "epoch": 2500} {"train_loss": -12.504880905151367, "global_step": 420023, "epoch": 2500} {"train_loss": -12.410430908203125, "global_step": 420024, "epoch": 2500} {"train_loss": -12.766511917114258, "global_step": 420025, "epoch": 2500} {"train_loss": -12.580984115600586, "global_step": 420026, "epoch": 2500} {"train_loss": -12.630674362182617, "global_step": 420027, "epoch": 2500} {"train_loss": -11.984874725341797, "global_step": 420028, "epoch": 2500} {"train_loss": -12.220608711242676, "global_step": 420029, "epoch": 2500} {"train_loss": -12.553291320800781, "global_step": 420030, "epoch": 2500} {"train_loss": -12.662158966064453, "global_step": 420031, "epoch": 2500} {"train_loss": -12.284456253051758, "global_step": 420032, "epoch": 2500} {"train_loss": -12.858000755310059, "global_step": 420033, "epoch": 2500} {"train_loss": -12.593799591064453, "global_step": 420034, "epoch": 2500} {"train_loss": -12.529441833496094, "global_step": 420035, "epoch": 2500} {"train_loss": -12.394432067871094, "global_step": 420036, "epoch": 2500} {"train_loss": -12.610605239868164, "global_step": 420037, "epoch": 2500} {"train_loss": -12.484848022460938, "global_step": 420038, "epoch": 2500} {"train_loss": -12.583219528198242, "global_step": 420039, "epoch": 2500} {"train_loss": -12.367880821228027, "global_step": 420040, "epoch": 2500} {"train_loss": -12.550640106201172, "global_step": 420041, "epoch": 2500} {"train_loss": -12.208902359008789, "global_step": 420042, "epoch": 2500} {"train_loss": -12.581280708312988, "global_step": 420043, "epoch": 2500} {"train_loss": -11.924102783203125, "global_step": 420044, "epoch": 2500} {"train_loss": -12.800643920898438, "global_step": 420045, "epoch": 2500} {"train_loss": -12.299295425415039, "global_step": 420046, "epoch": 2500} {"train_loss": -11.95185375213623, "global_step": 420047, "epoch": 2500} {"train_loss": -11.651716232299805, "global_step": 420048, "epoch": 2500} {"train_loss": -12.583175659179688, "global_step": 420049, "epoch": 2500} {"train_loss": -11.40626335144043, "global_step": 420050, "epoch": 2500} {"train_loss": -11.871955871582031, "global_step": 420051, "epoch": 2500} {"train_loss": -12.29257869720459, "global_step": 420052, "epoch": 2500} {"train_loss": -12.301996231079102, "global_step": 420053, "epoch": 2500} {"train_loss": -12.180563926696777, "global_step": 420054, "epoch": 2500} {"train_loss": -12.755857467651367, "global_step": 420055, "epoch": 2500} {"train_loss": -12.599945068359375, "global_step": 420056, "epoch": 2500} {"train_loss": -12.601513862609863, "global_step": 420057, "epoch": 2500} {"train_loss": -12.167174339294434, "global_step": 420058, "epoch": 2500} {"train_loss": -12.736400604248047, "global_step": 420059, "epoch": 2500} {"train_loss": -12.489951133728027, "global_step": 420060, "epoch": 2500} {"train_loss": -12.503670692443848, "global_step": 420061, "epoch": 2500} {"train_loss": -12.633869171142578, "global_step": 420062, "epoch": 2500} {"train_loss": -12.708906173706055, "global_step": 420063, "epoch": 2500} {"train_loss": -12.357159614562988, "global_step": 420064, "epoch": 2500} {"train_loss": -12.206664085388184, "global_step": 420065, "epoch": 2500} {"train_loss": -12.268253326416016, "global_step": 420066, "epoch": 2500} {"train_loss": -12.592832565307617, "global_step": 420067, "epoch": 2500} {"train_loss": -12.197830200195312, "global_step": 420068, "epoch": 2500} {"train_loss": -11.504497528076172, "global_step": 420069, "epoch": 2500} {"train_loss": -12.526479721069336, "global_step": 420070, "epoch": 2500} {"train_loss": -11.320117950439453, "global_step": 420071, "epoch": 2500} {"train_loss": -9.52015495300293, "global_step": 420072, "epoch": 2500} {"train_loss": -10.870992660522461, "global_step": 420073, "epoch": 2500} {"train_loss": -9.197813034057617, "global_step": 420074, "epoch": 2500} {"train_loss": -9.030458450317383, "global_step": 420075, "epoch": 2500} {"train_loss": -9.827556610107422, "global_step": 420076, "epoch": 2500} {"train_loss": -8.766641616821289, "global_step": 420077, "epoch": 2500} {"train_loss": -9.939319610595703, "global_step": 420078, "epoch": 2500} {"train_loss": -8.802840232849121, "global_step": 420079, "epoch": 2500} {"train_loss": -11.721596717834473, "global_step": 420080, "epoch": 2500} {"train_loss": -9.424262046813965, "global_step": 420081, "epoch": 2500} {"train_loss": -10.629292488098145, "global_step": 420082, "epoch": 2500} {"train_loss": -10.02391242980957, "global_step": 420083, "epoch": 2500} {"train_loss": -11.071840286254883, "global_step": 420084, "epoch": 2500} {"train_loss": -9.904570579528809, "global_step": 420085, "epoch": 2500} {"train_loss": -10.993712425231934, "global_step": 420086, "epoch": 2500} {"train_loss": -10.284576416015625, "global_step": 420087, "epoch": 2500} {"train_loss": -11.014060974121094, "global_step": 420088, "epoch": 2500} {"train_loss": -10.411453247070312, "global_step": 420089, "epoch": 2500} {"train_loss": -9.305011749267578, "global_step": 420090, "epoch": 2500} {"train_loss": -10.10446548461914, "global_step": 420091, "epoch": 2500} {"train_loss": -9.816669464111328, "global_step": 420092, "epoch": 2500} {"train_loss": -9.783834457397461, "global_step": 420093, "epoch": 2500} {"train_loss": -9.147644996643066, "global_step": 420094, "epoch": 2500} {"train_loss": -10.942913055419922, "global_step": 420095, "epoch": 2500} {"train_loss": -9.024415969848633, "global_step": 420096, "epoch": 2500} {"train_loss": -11.43083667755127, "global_step": 420097, "epoch": 2500} {"train_loss": -9.586456298828125, "global_step": 420098, "epoch": 2500} {"train_loss": -9.180217742919922, "global_step": 420099, "epoch": 2500} {"train_loss": -9.817964553833008, "global_step": 420100, "epoch": 2500} {"train_loss": -10.732770919799805, "global_step": 420101, "epoch": 2500} {"train_loss": -10.958966255187988, "global_step": 420102, "epoch": 2500} {"train_loss": -10.483686447143555, "global_step": 420103, "epoch": 2500} {"train_loss": -10.507728576660156, "global_step": 420104, "epoch": 2500} {"train_loss": -10.331634521484375, "global_step": 420105, "epoch": 2500} {"train_loss": -10.11984634399414, "global_step": 420106, "epoch": 2500} {"train_loss": -11.517373085021973, "global_step": 420107, "epoch": 2500} {"train_loss": -10.420587539672852, "global_step": 420108, "epoch": 2500} {"train_loss": -10.068445205688477, "global_step": 420109, "epoch": 2500} {"train_loss": -11.158308982849121, "global_step": 420110, "epoch": 2500} {"train_loss": -11.135198593139648, "global_step": 420111, "epoch": 2500} {"train_loss": -10.652791976928711, "global_step": 420112, "epoch": 2500} {"train_loss": -11.381572723388672, "global_step": 420113, "epoch": 2500} {"train_loss": -11.386146545410156, "global_step": 420114, "epoch": 2500} {"train_loss": -11.489315032958984, "global_step": 420115, "epoch": 2500} {"train_loss": -11.7731294631958, "global_step": 420116, "epoch": 2500} {"train_loss": -11.59493350982666, "global_step": 420117, "epoch": 2500} {"train_loss": -12.01283073425293, "global_step": 420118, "epoch": 2500} {"train_loss": -11.953855514526367, "global_step": 420119, "epoch": 2500} {"train_loss": -12.189560890197754, "global_step": 420120, "epoch": 2500} {"train_loss": -11.75039291381836, "global_step": 420121, "epoch": 2500} {"train_loss": -12.196800231933594, "global_step": 420122, "epoch": 2500} {"train_loss": -11.961252212524414, "global_step": 420123, "epoch": 2500} {"train_loss": -12.194064140319824, "global_step": 420124, "epoch": 2500} {"train_loss": -12.171236038208008, "global_step": 420125, "epoch": 2500} {"train_loss": -12.11723518371582, "global_step": 420126, "epoch": 2500} {"train_loss": -11.970841407775879, "global_step": 420127, "epoch": 2500} {"train_loss": -12.111103057861328, "global_step": 420128, "epoch": 2500} {"train_loss": -12.304743766784668, "global_step": 420129, "epoch": 2500} {"train_loss": -12.269430160522461, "global_step": 420130, "epoch": 2500} {"train_loss": -12.156220436096191, "global_step": 420131, "epoch": 2500} {"train_loss": -12.075368881225586, "global_step": 420132, "epoch": 2500} {"train_loss": -12.313323974609375, "global_step": 420133, "epoch": 2500} {"train_loss": -12.080253601074219, "global_step": 420134, "epoch": 2500} {"train_loss": -12.464344024658203, "global_step": 420135, "epoch": 2500} {"train_loss": -12.059050559997559, "global_step": 420136, "epoch": 2500} {"train_loss": -12.29716682434082, "global_step": 420137, "epoch": 2500} {"train_loss": -12.058541297912598, "global_step": 420138, "epoch": 2500} {"train_loss": -12.319154739379883, "global_step": 420139, "epoch": 2500} {"train_loss": -12.300504684448242, "global_step": 420140, "epoch": 2500} {"train_loss": -12.434974670410156, "global_step": 420141, "epoch": 2500} {"train_loss": -12.199509620666504, "global_step": 420142, "epoch": 2500} {"train_loss": -12.40189266204834, "global_step": 420143, "epoch": 2500} {"train_loss": -12.391749382019043, "global_step": 420144, "epoch": 2500} {"train_loss": -12.394163131713867, "global_step": 420145, "epoch": 2500} {"train_loss": -12.384416580200195, "global_step": 420146, "epoch": 2500} {"train_loss": -12.3839750289917, "global_step": 420147, "epoch": 2500} {"train_loss": -12.383161544799805, "global_step": 420148, "epoch": 2500} {"train_loss": -12.517106056213379, "global_step": 420149, "epoch": 2500} {"train_loss": -12.51388931274414, "global_step": 420150, "epoch": 2500} {"train_loss": -12.534687042236328, "global_step": 420151, "epoch": 2500} {"train_loss": -12.432689666748047, "global_step": 420152, "epoch": 2500} {"train_loss": -12.32557487487793, "global_step": 420153, "epoch": 2500} {"train_loss": -12.603104591369629, "global_step": 420154, "epoch": 2500} {"train_loss": -12.406509399414062, "global_step": 420155, "epoch": 2500} {"train_loss": -12.577796936035156, "global_step": 420156, "epoch": 2500} {"train_loss": -12.47022533416748, "global_step": 420157, "epoch": 2500} {"train_loss": -12.583639144897461, "global_step": 420158, "epoch": 2500} {"train_loss": -12.423690795898438, "global_step": 420159, "epoch": 2500} {"train_loss": -12.587308883666992, "global_step": 420160, "epoch": 2500} {"train_loss": -12.503986358642578, "global_step": 420161, "epoch": 2500} {"train_loss": -12.413009643554688, "global_step": 420162, "epoch": 2500} {"train_loss": -12.396896362304688, "global_step": 420163, "epoch": 2500} {"train_loss": -12.385847091674805, "global_step": 420164, "epoch": 2500} {"train_loss": -12.46316146850586, "global_step": 420165, "epoch": 2500} {"train_loss": -12.636884689331055, "global_step": 420166, "epoch": 2500} {"train_loss": -11.81118857292902, "global_step": 420167, "epoch": 2500, "train/sim_max_reward_0": 0.6765418581967065, "train/sim_max_reward_1": 0.9139951352688808, "train/sim_max_reward_2": 0.0008927746613597092, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.9852677982461095, "train/sim_max_reward_5": 0.999880501946658, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.3739125055592955, "test/sim_max_reward_4400002": 0.18645042112916185, "test/sim_max_reward_4400003": 7.662928014699957e-05, "test/sim_max_reward_4400004": 0.5383969380888354, "test/sim_max_reward_4400005": 0.9255564561649203, "test/sim_max_reward_4400006": 0.9932733184825046, "test/sim_max_reward_4400007": 0.5164125297573685, "test/sim_max_reward_4400008": 0.6071853498174022, "test/sim_max_reward_4400009": 0.34524360213526767, "test/sim_max_reward_4400010": 0.9878138970722764, "test/sim_max_reward_4400011": 0.28245826486324993, "test/sim_max_reward_4400012": 0.9917523152925791, "test/sim_max_reward_4400013": 0.9767626581300664, "test/sim_max_reward_4400014": 0.9901166775102418, "test/sim_max_reward_4400015": 0.9873380744554705, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 9.106881579913412e-06, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 0.39137883170729904, "test/sim_max_reward_4400020": 0.1295933406642839, "test/sim_max_reward_4400021": 0.7042052611324987, "test/sim_max_reward_4400022": 0.9822920135181744, "test/sim_max_reward_4400023": 0.11523391981608713, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.5523674644169226, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.17303270505478344, "test/sim_max_reward_4400028": 0.942027277008863, "test/sim_max_reward_4400029": 1.0, "test/sim_max_reward_4400030": 0.9489684454394504, "test/sim_max_reward_4400031": 0.9942349987774247, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.7182964284307075, "test/sim_max_reward_4400034": 0.5215406886075689, "test/sim_max_reward_4400035": 0.9844437712093818, "test/sim_max_reward_4400036": 0.5542934225842027, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.32339599924191603, "test/sim_max_reward_4400039": 0.9896358144296935, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.982204422614326, "test/sim_max_reward_4400042": 0.02149515508952813, "test/sim_max_reward_4400043": 0.022586009632537235, "test/sim_max_reward_4400044": 0.94259171484164, "test/sim_max_reward_4400045": 0.7093588865916195, "test/sim_max_reward_4400046": 0.33483485256197804, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.762763011386619, "test/mean_score": 0.5567815362962579, "val_loss": 304230.40625, "train_action_mse_error": 1.180510401725769} {"train_loss": -12.411087036132812, "global_step": 420168, "epoch": 2501} {"train_loss": -12.281129837036133, "global_step": 420169, "epoch": 2501} {"train_loss": -12.588144302368164, "global_step": 420170, "epoch": 2501} {"train_loss": -12.455707550048828, "global_step": 420171, "epoch": 2501} {"train_loss": -12.457326889038086, "global_step": 420172, "epoch": 2501} {"train_loss": -12.484233856201172, "global_step": 420173, "epoch": 2501} {"train_loss": -12.13767147064209, "global_step": 420174, "epoch": 2501} {"train_loss": -12.588766098022461, "global_step": 420175, "epoch": 2501} {"train_loss": -12.37923812866211, "global_step": 420176, "epoch": 2501} {"train_loss": -12.352970123291016, "global_step": 420177, "epoch": 2501} {"train_loss": -12.515941619873047, "global_step": 420178, "epoch": 2501} {"train_loss": -12.381234169006348, "global_step": 420179, "epoch": 2501} {"train_loss": -12.33131217956543, "global_step": 420180, "epoch": 2501} {"train_loss": -12.167396545410156, "global_step": 420181, "epoch": 2501} {"train_loss": -12.490933418273926, "global_step": 420182, "epoch": 2501} {"train_loss": -12.417570114135742, "global_step": 420183, "epoch": 2501} {"train_loss": -12.69969367980957, "global_step": 420184, "epoch": 2501} {"train_loss": -12.362178802490234, "global_step": 420185, "epoch": 2501} {"train_loss": -12.609067916870117, "global_step": 420186, "epoch": 2501} {"train_loss": -12.54677677154541, "global_step": 420187, "epoch": 2501} {"train_loss": -12.651365280151367, "global_step": 420188, "epoch": 2501} {"train_loss": -12.65188217163086, "global_step": 420189, "epoch": 2501} {"train_loss": -12.758190155029297, "global_step": 420190, "epoch": 2501} {"train_loss": -12.435396194458008, "global_step": 420191, "epoch": 2501} {"train_loss": -12.46027946472168, "global_step": 420192, "epoch": 2501} {"train_loss": -12.560077667236328, "global_step": 420193, "epoch": 2501} {"train_loss": -12.411718368530273, "global_step": 420194, "epoch": 2501} {"train_loss": -12.392062187194824, "global_step": 420195, "epoch": 2501} {"train_loss": -12.521469116210938, "global_step": 420196, "epoch": 2501} {"train_loss": -12.14819049835205, "global_step": 420197, "epoch": 2501} {"train_loss": -12.335663795471191, "global_step": 420198, "epoch": 2501} {"train_loss": -12.396869659423828, "global_step": 420199, "epoch": 2501} {"train_loss": -12.05912971496582, "global_step": 420200, "epoch": 2501} {"train_loss": -12.443073272705078, "global_step": 420201, "epoch": 2501} {"train_loss": -12.769338607788086, "global_step": 420202, "epoch": 2501} {"train_loss": -12.157660484313965, "global_step": 420203, "epoch": 2501} {"train_loss": -12.49490737915039, "global_step": 420204, "epoch": 2501} {"train_loss": -12.521677017211914, "global_step": 420205, "epoch": 2501} {"train_loss": -12.501617431640625, "global_step": 420206, "epoch": 2501} {"train_loss": -12.351534843444824, "global_step": 420207, "epoch": 2501} {"train_loss": -12.531805992126465, "global_step": 420208, "epoch": 2501} {"train_loss": -12.186344146728516, "global_step": 420209, "epoch": 2501} {"train_loss": -12.668766021728516, "global_step": 420210, "epoch": 2501} {"train_loss": -12.305731773376465, "global_step": 420211, "epoch": 2501} {"train_loss": -12.604777336120605, "global_step": 420212, "epoch": 2501} {"train_loss": -12.585304260253906, "global_step": 420213, "epoch": 2501} {"train_loss": -12.55096435546875, "global_step": 420214, "epoch": 2501} {"train_loss": -12.528144836425781, "global_step": 420215, "epoch": 2501} {"train_loss": -12.5204439163208, "global_step": 420216, "epoch": 2501} {"train_loss": -12.554550170898438, "global_step": 420217, "epoch": 2501} {"train_loss": -12.500475883483887, "global_step": 420218, "epoch": 2501} {"train_loss": -12.694173812866211, "global_step": 420219, "epoch": 2501} {"train_loss": -12.621601104736328, "global_step": 420220, "epoch": 2501} {"train_loss": -12.211074829101562, "global_step": 420221, "epoch": 2501} {"train_loss": -12.010854721069336, "global_step": 420222, "epoch": 2501} {"train_loss": -12.43863296508789, "global_step": 420223, "epoch": 2501} {"train_loss": -11.876591682434082, "global_step": 420224, "epoch": 2501} {"train_loss": -11.512939453125, "global_step": 420225, "epoch": 2501} {"train_loss": -12.051312446594238, "global_step": 420226, "epoch": 2501} {"train_loss": -12.13318157196045, "global_step": 420227, "epoch": 2501} {"train_loss": -10.913069725036621, "global_step": 420228, "epoch": 2501} {"train_loss": -12.428190231323242, "global_step": 420229, "epoch": 2501} {"train_loss": -12.105263710021973, "global_step": 420230, "epoch": 2501} {"train_loss": -12.077754974365234, "global_step": 420231, "epoch": 2501} {"train_loss": -12.538497924804688, "global_step": 420232, "epoch": 2501} {"train_loss": -12.35301399230957, "global_step": 420233, "epoch": 2501} {"train_loss": -12.259422302246094, "global_step": 420234, "epoch": 2501} {"train_loss": -12.651257514953613, "global_step": 420235, "epoch": 2501} {"train_loss": -12.399922370910645, "global_step": 420236, "epoch": 2501} {"train_loss": -12.265586853027344, "global_step": 420237, "epoch": 2501} {"train_loss": -12.783785820007324, "global_step": 420238, "epoch": 2501} {"train_loss": -12.338947296142578, "global_step": 420239, "epoch": 2501} {"train_loss": -12.787224769592285, "global_step": 420240, "epoch": 2501} {"train_loss": -12.147045135498047, "global_step": 420241, "epoch": 2501} {"train_loss": -12.594822883605957, "global_step": 420242, "epoch": 2501} {"train_loss": -12.502814292907715, "global_step": 420243, "epoch": 2501} {"train_loss": -12.52127456665039, "global_step": 420244, "epoch": 2501} {"train_loss": -12.437141418457031, "global_step": 420245, "epoch": 2501} {"train_loss": -12.671817779541016, "global_step": 420246, "epoch": 2501} {"train_loss": -12.582696914672852, "global_step": 420247, "epoch": 2501} {"train_loss": -12.841724395751953, "global_step": 420248, "epoch": 2501} {"train_loss": -12.615484237670898, "global_step": 420249, "epoch": 2501} {"train_loss": -12.68759822845459, "global_step": 420250, "epoch": 2501} {"train_loss": -12.56273078918457, "global_step": 420251, "epoch": 2501} {"train_loss": -12.649264335632324, "global_step": 420252, "epoch": 2501} {"train_loss": -12.474180221557617, "global_step": 420253, "epoch": 2501} {"train_loss": -12.735660552978516, "global_step": 420254, "epoch": 2501} {"train_loss": -12.510419845581055, "global_step": 420255, "epoch": 2501} {"train_loss": -13.04043197631836, "global_step": 420256, "epoch": 2501} {"train_loss": -12.849573135375977, "global_step": 420257, "epoch": 2501} {"train_loss": -12.833951950073242, "global_step": 420258, "epoch": 2501} {"train_loss": -12.882608413696289, "global_step": 420259, "epoch": 2501} {"train_loss": -12.653081893920898, "global_step": 420260, "epoch": 2501} {"train_loss": -12.888124465942383, "global_step": 420261, "epoch": 2501} {"train_loss": -12.672801971435547, "global_step": 420262, "epoch": 2501} {"train_loss": -12.847685813903809, "global_step": 420263, "epoch": 2501} {"train_loss": -12.404264450073242, "global_step": 420264, "epoch": 2501} {"train_loss": -12.752233505249023, "global_step": 420265, "epoch": 2501} {"train_loss": -12.795987129211426, "global_step": 420266, "epoch": 2501} {"train_loss": -12.812618255615234, "global_step": 420267, "epoch": 2501} {"train_loss": -12.668498992919922, "global_step": 420268, "epoch": 2501} {"train_loss": -12.83432674407959, "global_step": 420269, "epoch": 2501} {"train_loss": -12.769914627075195, "global_step": 420270, "epoch": 2501} {"train_loss": -12.026839256286621, "global_step": 420271, "epoch": 2501} {"train_loss": -12.14583969116211, "global_step": 420272, "epoch": 2501} {"train_loss": -12.205921173095703, "global_step": 420273, "epoch": 2501} {"train_loss": -12.591150283813477, "global_step": 420274, "epoch": 2501} {"train_loss": -12.56437873840332, "global_step": 420275, "epoch": 2501} {"train_loss": -12.792396545410156, "global_step": 420276, "epoch": 2501} {"train_loss": -12.404558181762695, "global_step": 420277, "epoch": 2501} {"train_loss": -12.575489044189453, "global_step": 420278, "epoch": 2501} {"train_loss": -12.416572570800781, "global_step": 420279, "epoch": 2501} {"train_loss": -12.522741317749023, "global_step": 420280, "epoch": 2501} {"train_loss": -12.745867729187012, "global_step": 420281, "epoch": 2501} {"train_loss": -12.565733909606934, "global_step": 420282, "epoch": 2501} {"train_loss": -11.994768142700195, "global_step": 420283, "epoch": 2501} {"train_loss": -11.810440063476562, "global_step": 420284, "epoch": 2501} {"train_loss": -12.05441951751709, "global_step": 420285, "epoch": 2501} {"train_loss": -12.069334030151367, "global_step": 420286, "epoch": 2501} {"train_loss": -9.530265808105469, "global_step": 420287, "epoch": 2501} {"train_loss": -10.63059139251709, "global_step": 420288, "epoch": 2501} {"train_loss": -10.975473403930664, "global_step": 420289, "epoch": 2501} {"train_loss": -9.33993148803711, "global_step": 420290, "epoch": 2501} {"train_loss": -10.57385540008545, "global_step": 420291, "epoch": 2501} {"train_loss": -9.060873031616211, "global_step": 420292, "epoch": 2501} {"train_loss": -9.903783798217773, "global_step": 420293, "epoch": 2501} {"train_loss": -10.097434043884277, "global_step": 420294, "epoch": 2501} {"train_loss": -9.851544380187988, "global_step": 420295, "epoch": 2501} {"train_loss": -10.680275917053223, "global_step": 420296, "epoch": 2501} {"train_loss": -11.638851165771484, "global_step": 420297, "epoch": 2501} {"train_loss": -11.393299102783203, "global_step": 420298, "epoch": 2501} {"train_loss": -11.838296890258789, "global_step": 420299, "epoch": 2501} {"train_loss": -10.927488327026367, "global_step": 420300, "epoch": 2501} {"train_loss": -11.072308540344238, "global_step": 420301, "epoch": 2501} {"train_loss": -10.938497543334961, "global_step": 420302, "epoch": 2501} {"train_loss": -9.821174621582031, "global_step": 420303, "epoch": 2501} {"train_loss": -10.357084274291992, "global_step": 420304, "epoch": 2501} {"train_loss": -10.430609703063965, "global_step": 420305, "epoch": 2501} {"train_loss": -10.57960033416748, "global_step": 420306, "epoch": 2501} {"train_loss": -9.793776512145996, "global_step": 420307, "epoch": 2501} {"train_loss": -10.8558931350708, "global_step": 420308, "epoch": 2501} {"train_loss": -10.435702323913574, "global_step": 420309, "epoch": 2501} {"train_loss": -11.301685333251953, "global_step": 420310, "epoch": 2501} {"train_loss": -11.637495040893555, "global_step": 420311, "epoch": 2501} {"train_loss": -9.239290237426758, "global_step": 420312, "epoch": 2501} {"train_loss": -11.073501586914062, "global_step": 420313, "epoch": 2501} {"train_loss": -11.347243309020996, "global_step": 420314, "epoch": 2501} {"train_loss": -10.815712928771973, "global_step": 420315, "epoch": 2501} {"train_loss": -10.331781387329102, "global_step": 420316, "epoch": 2501} {"train_loss": -10.241674423217773, "global_step": 420317, "epoch": 2501} {"train_loss": -10.660727500915527, "global_step": 420318, "epoch": 2501} {"train_loss": -10.781110763549805, "global_step": 420319, "epoch": 2501} {"train_loss": -10.106803894042969, "global_step": 420320, "epoch": 2501} {"train_loss": -10.37845230102539, "global_step": 420321, "epoch": 2501} {"train_loss": -10.75100326538086, "global_step": 420322, "epoch": 2501} {"train_loss": -10.775941848754883, "global_step": 420323, "epoch": 2501} {"train_loss": -10.775973320007324, "global_step": 420324, "epoch": 2501} {"train_loss": -11.024118423461914, "global_step": 420325, "epoch": 2501} {"train_loss": -11.075084686279297, "global_step": 420326, "epoch": 2501} {"train_loss": -10.975317001342773, "global_step": 420327, "epoch": 2501} {"train_loss": -11.83631706237793, "global_step": 420328, "epoch": 2501} {"train_loss": -11.335987091064453, "global_step": 420329, "epoch": 2501} {"train_loss": -11.418033599853516, "global_step": 420330, "epoch": 2501} {"train_loss": -11.322059631347656, "global_step": 420331, "epoch": 2501} {"train_loss": -11.237367630004883, "global_step": 420332, "epoch": 2501} {"train_loss": -11.842158317565918, "global_step": 420333, "epoch": 2501} {"train_loss": -11.083328247070312, "global_step": 420334, "epoch": 2501} {"train_loss": -11.951896798043023, "global_step": 420335, "epoch": 2501, "val_loss": 308489.625} {"train_loss": -11.005199432373047, "global_step": 420336, "epoch": 2502} {"train_loss": -11.902531623840332, "global_step": 420337, "epoch": 2502} {"train_loss": -10.581626892089844, "global_step": 420338, "epoch": 2502} {"train_loss": -11.822683334350586, "global_step": 420339, "epoch": 2502} {"train_loss": -11.613445281982422, "global_step": 420340, "epoch": 2502} {"train_loss": -11.03468132019043, "global_step": 420341, "epoch": 2502} {"train_loss": -11.642000198364258, "global_step": 420342, "epoch": 2502} {"train_loss": -10.87925910949707, "global_step": 420343, "epoch": 2502} {"train_loss": -11.489482879638672, "global_step": 420344, "epoch": 2502} {"train_loss": -11.560248374938965, "global_step": 420345, "epoch": 2502} {"train_loss": -11.127237319946289, "global_step": 420346, "epoch": 2502} {"train_loss": -11.866869926452637, "global_step": 420347, "epoch": 2502} {"train_loss": -11.26518440246582, "global_step": 420348, "epoch": 2502} {"train_loss": -11.871784210205078, "global_step": 420349, "epoch": 2502} {"train_loss": -11.322809219360352, "global_step": 420350, "epoch": 2502} {"train_loss": -12.066949844360352, "global_step": 420351, "epoch": 2502} {"train_loss": -11.880452156066895, "global_step": 420352, "epoch": 2502} {"train_loss": -11.83300495147705, "global_step": 420353, "epoch": 2502} {"train_loss": -12.330331802368164, "global_step": 420354, "epoch": 2502} {"train_loss": -11.969133377075195, "global_step": 420355, "epoch": 2502} {"train_loss": -11.98095703125, "global_step": 420356, "epoch": 2502} {"train_loss": -12.017148971557617, "global_step": 420357, "epoch": 2502} {"train_loss": -11.832966804504395, "global_step": 420358, "epoch": 2502} {"train_loss": -12.174005508422852, "global_step": 420359, "epoch": 2502} {"train_loss": -11.91423225402832, "global_step": 420360, "epoch": 2502} {"train_loss": -11.9797945022583, "global_step": 420361, "epoch": 2502} {"train_loss": -11.983177185058594, "global_step": 420362, "epoch": 2502} {"train_loss": -11.766035079956055, "global_step": 420363, "epoch": 2502} {"train_loss": -12.3620023727417, "global_step": 420364, "epoch": 2502} {"train_loss": -11.918232917785645, "global_step": 420365, "epoch": 2502} {"train_loss": -12.4420166015625, "global_step": 420366, "epoch": 2502} {"train_loss": -12.311819076538086, "global_step": 420367, "epoch": 2502} {"train_loss": -12.078710556030273, "global_step": 420368, "epoch": 2502} {"train_loss": -12.253413200378418, "global_step": 420369, "epoch": 2502} {"train_loss": -12.148372650146484, "global_step": 420370, "epoch": 2502} {"train_loss": -12.338752746582031, "global_step": 420371, "epoch": 2502} {"train_loss": -12.309860229492188, "global_step": 420372, "epoch": 2502} {"train_loss": -12.479280471801758, "global_step": 420373, "epoch": 2502} {"train_loss": -12.323522567749023, "global_step": 420374, "epoch": 2502} {"train_loss": -12.435835838317871, "global_step": 420375, "epoch": 2502} {"train_loss": -12.426194190979004, "global_step": 420376, "epoch": 2502} {"train_loss": -12.384941101074219, "global_step": 420377, "epoch": 2502} {"train_loss": -12.371049880981445, "global_step": 420378, "epoch": 2502} {"train_loss": -12.681795120239258, "global_step": 420379, "epoch": 2502} {"train_loss": -12.355486869812012, "global_step": 420380, "epoch": 2502} {"train_loss": -12.517101287841797, "global_step": 420381, "epoch": 2502} {"train_loss": -12.327735900878906, "global_step": 420382, "epoch": 2502} {"train_loss": -12.439867973327637, "global_step": 420383, "epoch": 2502} {"train_loss": -12.579612731933594, "global_step": 420384, "epoch": 2502} {"train_loss": -12.524085998535156, "global_step": 420385, "epoch": 2502} {"train_loss": -12.435280799865723, "global_step": 420386, "epoch": 2502} {"train_loss": -12.430349349975586, "global_step": 420387, "epoch": 2502} {"train_loss": -12.324471473693848, "global_step": 420388, "epoch": 2502} {"train_loss": -12.416425704956055, "global_step": 420389, "epoch": 2502} {"train_loss": -12.582798957824707, "global_step": 420390, "epoch": 2502} {"train_loss": -12.215314865112305, "global_step": 420391, "epoch": 2502} {"train_loss": -12.455537796020508, "global_step": 420392, "epoch": 2502} {"train_loss": -12.440433502197266, "global_step": 420393, "epoch": 2502} {"train_loss": -12.546396255493164, "global_step": 420394, "epoch": 2502} {"train_loss": -12.554752349853516, "global_step": 420395, "epoch": 2502} {"train_loss": -12.488024711608887, "global_step": 420396, "epoch": 2502} {"train_loss": -12.498391151428223, "global_step": 420397, "epoch": 2502} {"train_loss": -12.498831748962402, "global_step": 420398, "epoch": 2502} {"train_loss": -12.725318908691406, "global_step": 420399, "epoch": 2502} {"train_loss": -12.443670272827148, "global_step": 420400, "epoch": 2502} {"train_loss": -12.612249374389648, "global_step": 420401, "epoch": 2502} {"train_loss": -12.655162811279297, "global_step": 420402, "epoch": 2502} {"train_loss": -12.667768478393555, "global_step": 420403, "epoch": 2502} {"train_loss": -12.632837295532227, "global_step": 420404, "epoch": 2502} {"train_loss": -12.703760147094727, "global_step": 420405, "epoch": 2502} {"train_loss": -12.73348617553711, "global_step": 420406, "epoch": 2502} {"train_loss": -12.58221435546875, "global_step": 420407, "epoch": 2502} {"train_loss": -12.743742942810059, "global_step": 420408, "epoch": 2502} {"train_loss": -12.782343864440918, "global_step": 420409, "epoch": 2502} {"train_loss": -12.557489395141602, "global_step": 420410, "epoch": 2502} {"train_loss": -12.683881759643555, "global_step": 420411, "epoch": 2502} {"train_loss": -12.691667556762695, "global_step": 420412, "epoch": 2502} {"train_loss": -12.75647258758545, "global_step": 420413, "epoch": 2502} {"train_loss": -12.646987915039062, "global_step": 420414, "epoch": 2502} {"train_loss": -12.606752395629883, "global_step": 420415, "epoch": 2502} {"train_loss": -12.285663604736328, "global_step": 420416, "epoch": 2502} {"train_loss": -12.760772705078125, "global_step": 420417, "epoch": 2502} {"train_loss": -12.560810089111328, "global_step": 420418, "epoch": 2502} {"train_loss": -12.284660339355469, "global_step": 420419, "epoch": 2502} {"train_loss": -12.598426818847656, "global_step": 420420, "epoch": 2502} {"train_loss": -12.495153427124023, "global_step": 420421, "epoch": 2502} {"train_loss": -12.696298599243164, "global_step": 420422, "epoch": 2502} {"train_loss": -12.707448959350586, "global_step": 420423, "epoch": 2502} {"train_loss": -12.482609748840332, "global_step": 420424, "epoch": 2502} {"train_loss": -12.695637702941895, "global_step": 420425, "epoch": 2502} {"train_loss": -12.665452003479004, "global_step": 420426, "epoch": 2502} {"train_loss": -12.474227905273438, "global_step": 420427, "epoch": 2502} {"train_loss": -12.47395133972168, "global_step": 420428, "epoch": 2502} {"train_loss": -12.515949249267578, "global_step": 420429, "epoch": 2502} {"train_loss": -12.520973205566406, "global_step": 420430, "epoch": 2502} {"train_loss": -12.429126739501953, "global_step": 420431, "epoch": 2502} {"train_loss": -12.60049819946289, "global_step": 420432, "epoch": 2502} {"train_loss": -12.574140548706055, "global_step": 420433, "epoch": 2502} {"train_loss": -12.571569442749023, "global_step": 420434, "epoch": 2502} {"train_loss": -12.602569580078125, "global_step": 420435, "epoch": 2502} {"train_loss": -12.68497085571289, "global_step": 420436, "epoch": 2502} {"train_loss": -12.464273452758789, "global_step": 420437, "epoch": 2502} {"train_loss": -12.060609817504883, "global_step": 420438, "epoch": 2502} {"train_loss": -11.932183265686035, "global_step": 420439, "epoch": 2502} {"train_loss": -12.400968551635742, "global_step": 420440, "epoch": 2502} {"train_loss": -12.179498672485352, "global_step": 420441, "epoch": 2502} {"train_loss": -11.462369918823242, "global_step": 420442, "epoch": 2502} {"train_loss": -11.465713500976562, "global_step": 420443, "epoch": 2502} {"train_loss": -12.525575637817383, "global_step": 420444, "epoch": 2502} {"train_loss": -11.782325744628906, "global_step": 420445, "epoch": 2502} {"train_loss": -11.897799491882324, "global_step": 420446, "epoch": 2502} {"train_loss": -12.341355323791504, "global_step": 420447, "epoch": 2502} {"train_loss": -12.181594848632812, "global_step": 420448, "epoch": 2502} {"train_loss": -11.887483596801758, "global_step": 420449, "epoch": 2502} {"train_loss": -11.990184783935547, "global_step": 420450, "epoch": 2502} {"train_loss": -12.639265060424805, "global_step": 420451, "epoch": 2502} {"train_loss": -12.422144889831543, "global_step": 420452, "epoch": 2502} {"train_loss": -12.119230270385742, "global_step": 420453, "epoch": 2502} {"train_loss": -12.178865432739258, "global_step": 420454, "epoch": 2502} {"train_loss": -11.880086898803711, "global_step": 420455, "epoch": 2502} {"train_loss": -12.118566513061523, "global_step": 420456, "epoch": 2502} {"train_loss": -12.030574798583984, "global_step": 420457, "epoch": 2502} {"train_loss": -11.800768852233887, "global_step": 420458, "epoch": 2502} {"train_loss": -11.862943649291992, "global_step": 420459, "epoch": 2502} {"train_loss": -10.769685745239258, "global_step": 420460, "epoch": 2502} {"train_loss": -11.844110488891602, "global_step": 420461, "epoch": 2502} {"train_loss": -12.00777816772461, "global_step": 420462, "epoch": 2502} {"train_loss": -11.538603782653809, "global_step": 420463, "epoch": 2502} {"train_loss": -11.662485122680664, "global_step": 420464, "epoch": 2502} {"train_loss": -11.505743980407715, "global_step": 420465, "epoch": 2502} {"train_loss": -12.235137939453125, "global_step": 420466, "epoch": 2502} {"train_loss": -11.627427101135254, "global_step": 420467, "epoch": 2502} {"train_loss": -12.159696578979492, "global_step": 420468, "epoch": 2502} {"train_loss": -11.220746994018555, "global_step": 420469, "epoch": 2502} {"train_loss": -11.10597038269043, "global_step": 420470, "epoch": 2502} {"train_loss": -11.483391761779785, "global_step": 420471, "epoch": 2502} {"train_loss": -11.854545593261719, "global_step": 420472, "epoch": 2502} {"train_loss": -11.113245964050293, "global_step": 420473, "epoch": 2502} {"train_loss": -11.510353088378906, "global_step": 420474, "epoch": 2502} {"train_loss": -11.919751167297363, "global_step": 420475, "epoch": 2502} {"train_loss": -10.864607810974121, "global_step": 420476, "epoch": 2502} {"train_loss": -11.533812522888184, "global_step": 420477, "epoch": 2502} {"train_loss": -11.869760513305664, "global_step": 420478, "epoch": 2502} {"train_loss": -11.747417449951172, "global_step": 420479, "epoch": 2502} {"train_loss": -11.724113464355469, "global_step": 420480, "epoch": 2502} {"train_loss": -11.237188339233398, "global_step": 420481, "epoch": 2502} {"train_loss": -12.120492935180664, "global_step": 420482, "epoch": 2502} {"train_loss": -11.596502304077148, "global_step": 420483, "epoch": 2502} {"train_loss": -10.603382110595703, "global_step": 420484, "epoch": 2502} {"train_loss": -10.93172550201416, "global_step": 420485, "epoch": 2502} {"train_loss": -9.844625473022461, "global_step": 420486, "epoch": 2502} {"train_loss": -9.84358024597168, "global_step": 420487, "epoch": 2502} {"train_loss": -11.117752075195312, "global_step": 420488, "epoch": 2502} {"train_loss": -10.520098686218262, "global_step": 420489, "epoch": 2502} {"train_loss": -10.952193260192871, "global_step": 420490, "epoch": 2502} {"train_loss": -11.342365264892578, "global_step": 420491, "epoch": 2502} {"train_loss": -11.260625839233398, "global_step": 420492, "epoch": 2502} {"train_loss": -10.711418151855469, "global_step": 420493, "epoch": 2502} {"train_loss": -11.53786849975586, "global_step": 420494, "epoch": 2502} {"train_loss": -11.07528305053711, "global_step": 420495, "epoch": 2502} {"train_loss": -11.795964241027832, "global_step": 420496, "epoch": 2502} {"train_loss": -10.809743881225586, "global_step": 420497, "epoch": 2502} {"train_loss": -11.983898162841797, "global_step": 420498, "epoch": 2502} {"train_loss": -11.169824600219727, "global_step": 420499, "epoch": 2502} {"train_loss": -12.112173080444336, "global_step": 420500, "epoch": 2502} {"train_loss": -11.136003494262695, "global_step": 420501, "epoch": 2502} {"train_loss": -11.938621520996094, "global_step": 420502, "epoch": 2502} {"train_loss": -12.01017525650206, "global_step": 420503, "epoch": 2502, "val_loss": 306239.0625} {"train_loss": -11.662881851196289, "global_step": 420504, "epoch": 2503} {"train_loss": -11.888079643249512, "global_step": 420505, "epoch": 2503} {"train_loss": -11.948246002197266, "global_step": 420506, "epoch": 2503} {"train_loss": -11.90772533416748, "global_step": 420507, "epoch": 2503} {"train_loss": -11.669889450073242, "global_step": 420508, "epoch": 2503} {"train_loss": -11.984539031982422, "global_step": 420509, "epoch": 2503} {"train_loss": -12.112739562988281, "global_step": 420510, "epoch": 2503} {"train_loss": -12.207663536071777, "global_step": 420511, "epoch": 2503} {"train_loss": -12.047505378723145, "global_step": 420512, "epoch": 2503} {"train_loss": -12.346288681030273, "global_step": 420513, "epoch": 2503} {"train_loss": -11.931146621704102, "global_step": 420514, "epoch": 2503} {"train_loss": -11.70053482055664, "global_step": 420515, "epoch": 2503} {"train_loss": -12.268250465393066, "global_step": 420516, "epoch": 2503} {"train_loss": -11.851042747497559, "global_step": 420517, "epoch": 2503} {"train_loss": -11.809638977050781, "global_step": 420518, "epoch": 2503} {"train_loss": -12.36495304107666, "global_step": 420519, "epoch": 2503} {"train_loss": -11.890640258789062, "global_step": 420520, "epoch": 2503} {"train_loss": -11.807687759399414, "global_step": 420521, "epoch": 2503} {"train_loss": -12.37429141998291, "global_step": 420522, "epoch": 2503} {"train_loss": -11.784357070922852, "global_step": 420523, "epoch": 2503} {"train_loss": -12.349929809570312, "global_step": 420524, "epoch": 2503} {"train_loss": -11.779373168945312, "global_step": 420525, "epoch": 2503} {"train_loss": -11.706019401550293, "global_step": 420526, "epoch": 2503} {"train_loss": -12.200398445129395, "global_step": 420527, "epoch": 2503} {"train_loss": -12.042678833007812, "global_step": 420528, "epoch": 2503} {"train_loss": -12.360908508300781, "global_step": 420529, "epoch": 2503} {"train_loss": -12.353418350219727, "global_step": 420530, "epoch": 2503} {"train_loss": -12.484806060791016, "global_step": 420531, "epoch": 2503} {"train_loss": -12.4769868850708, "global_step": 420532, "epoch": 2503} {"train_loss": -12.212607383728027, "global_step": 420533, "epoch": 2503} {"train_loss": -11.98031997680664, "global_step": 420534, "epoch": 2503} {"train_loss": -12.457376480102539, "global_step": 420535, "epoch": 2503} {"train_loss": -12.146038055419922, "global_step": 420536, "epoch": 2503} {"train_loss": -12.727450370788574, "global_step": 420537, "epoch": 2503} {"train_loss": -12.447454452514648, "global_step": 420538, "epoch": 2503} {"train_loss": -12.593711853027344, "global_step": 420539, "epoch": 2503} {"train_loss": -12.72639274597168, "global_step": 420540, "epoch": 2503} {"train_loss": -12.716541290283203, "global_step": 420541, "epoch": 2503} {"train_loss": -12.546529769897461, "global_step": 420542, "epoch": 2503} {"train_loss": -12.727958679199219, "global_step": 420543, "epoch": 2503} {"train_loss": -12.617170333862305, "global_step": 420544, "epoch": 2503} {"train_loss": -12.789682388305664, "global_step": 420545, "epoch": 2503} {"train_loss": -12.43564224243164, "global_step": 420546, "epoch": 2503} {"train_loss": -12.601067543029785, "global_step": 420547, "epoch": 2503} {"train_loss": -12.88309383392334, "global_step": 420548, "epoch": 2503} {"train_loss": -12.419586181640625, "global_step": 420549, "epoch": 2503} {"train_loss": -12.534767150878906, "global_step": 420550, "epoch": 2503} {"train_loss": -12.715219497680664, "global_step": 420551, "epoch": 2503} {"train_loss": -12.645727157592773, "global_step": 420552, "epoch": 2503} {"train_loss": -12.407829284667969, "global_step": 420553, "epoch": 2503} {"train_loss": -12.699088096618652, "global_step": 420554, "epoch": 2503} {"train_loss": -12.765920639038086, "global_step": 420555, "epoch": 2503} {"train_loss": -12.67596435546875, "global_step": 420556, "epoch": 2503} {"train_loss": -12.766288757324219, "global_step": 420557, "epoch": 2503} {"train_loss": -12.533088684082031, "global_step": 420558, "epoch": 2503} {"train_loss": -12.762346267700195, "global_step": 420559, "epoch": 2503} {"train_loss": -12.575910568237305, "global_step": 420560, "epoch": 2503} {"train_loss": -12.440685272216797, "global_step": 420561, "epoch": 2503} {"train_loss": -12.593419075012207, "global_step": 420562, "epoch": 2503} {"train_loss": -12.482133865356445, "global_step": 420563, "epoch": 2503} {"train_loss": -12.204080581665039, "global_step": 420564, "epoch": 2503} {"train_loss": -12.78213119506836, "global_step": 420565, "epoch": 2503} {"train_loss": -12.355966567993164, "global_step": 420566, "epoch": 2503} {"train_loss": -12.734882354736328, "global_step": 420567, "epoch": 2503} {"train_loss": -12.491151809692383, "global_step": 420568, "epoch": 2503} {"train_loss": -12.507529258728027, "global_step": 420569, "epoch": 2503} {"train_loss": -12.728557586669922, "global_step": 420570, "epoch": 2503} {"train_loss": -12.532102584838867, "global_step": 420571, "epoch": 2503} {"train_loss": -12.50625991821289, "global_step": 420572, "epoch": 2503} {"train_loss": -12.753442764282227, "global_step": 420573, "epoch": 2503} {"train_loss": -12.777129173278809, "global_step": 420574, "epoch": 2503} {"train_loss": -12.49406909942627, "global_step": 420575, "epoch": 2503} {"train_loss": -12.596039772033691, "global_step": 420576, "epoch": 2503} {"train_loss": -12.583394050598145, "global_step": 420577, "epoch": 2503} {"train_loss": -12.378229141235352, "global_step": 420578, "epoch": 2503} {"train_loss": -12.060443878173828, "global_step": 420579, "epoch": 2503} {"train_loss": -12.653460502624512, "global_step": 420580, "epoch": 2503} {"train_loss": -12.612869262695312, "global_step": 420581, "epoch": 2503} {"train_loss": -12.425386428833008, "global_step": 420582, "epoch": 2503} {"train_loss": -12.707719802856445, "global_step": 420583, "epoch": 2503} {"train_loss": -12.90043830871582, "global_step": 420584, "epoch": 2503} {"train_loss": -12.26528549194336, "global_step": 420585, "epoch": 2503} {"train_loss": -12.19942855834961, "global_step": 420586, "epoch": 2503} {"train_loss": -12.512523651123047, "global_step": 420587, "epoch": 2503} {"train_loss": -12.765480041503906, "global_step": 420588, "epoch": 2503} {"train_loss": -12.143521308898926, "global_step": 420589, "epoch": 2503} {"train_loss": -12.423690795898438, "global_step": 420590, "epoch": 2503} {"train_loss": -12.563295364379883, "global_step": 420591, "epoch": 2503} {"train_loss": -12.205376625061035, "global_step": 420592, "epoch": 2503} {"train_loss": -12.470077514648438, "global_step": 420593, "epoch": 2503} {"train_loss": -12.886850357055664, "global_step": 420594, "epoch": 2503} {"train_loss": -12.759740829467773, "global_step": 420595, "epoch": 2503} {"train_loss": -12.782801628112793, "global_step": 420596, "epoch": 2503} {"train_loss": -11.872550964355469, "global_step": 420597, "epoch": 2503} {"train_loss": -12.026932716369629, "global_step": 420598, "epoch": 2503} {"train_loss": -12.611173629760742, "global_step": 420599, "epoch": 2503} {"train_loss": -12.45528793334961, "global_step": 420600, "epoch": 2503} {"train_loss": -11.986666679382324, "global_step": 420601, "epoch": 2503} {"train_loss": -11.833779335021973, "global_step": 420602, "epoch": 2503} {"train_loss": -12.340429306030273, "global_step": 420603, "epoch": 2503} {"train_loss": -11.372784614562988, "global_step": 420604, "epoch": 2503} {"train_loss": -11.586833953857422, "global_step": 420605, "epoch": 2503} {"train_loss": -11.841272354125977, "global_step": 420606, "epoch": 2503} {"train_loss": -11.98041820526123, "global_step": 420607, "epoch": 2503} {"train_loss": -11.932366371154785, "global_step": 420608, "epoch": 2503} {"train_loss": -12.689210891723633, "global_step": 420609, "epoch": 2503} {"train_loss": -12.2904634475708, "global_step": 420610, "epoch": 2503} {"train_loss": -12.645444869995117, "global_step": 420611, "epoch": 2503} {"train_loss": -12.266676902770996, "global_step": 420612, "epoch": 2503} {"train_loss": -12.540085792541504, "global_step": 420613, "epoch": 2503} {"train_loss": -12.475850105285645, "global_step": 420614, "epoch": 2503} {"train_loss": -12.80978775024414, "global_step": 420615, "epoch": 2503} {"train_loss": -11.964438438415527, "global_step": 420616, "epoch": 2503} {"train_loss": -12.740957260131836, "global_step": 420617, "epoch": 2503} {"train_loss": -12.13929271697998, "global_step": 420618, "epoch": 2503} {"train_loss": -11.699201583862305, "global_step": 420619, "epoch": 2503} {"train_loss": -11.633075714111328, "global_step": 420620, "epoch": 2503} {"train_loss": -12.46880054473877, "global_step": 420621, "epoch": 2503} {"train_loss": -11.358175277709961, "global_step": 420622, "epoch": 2503} {"train_loss": -12.244563102722168, "global_step": 420623, "epoch": 2503} {"train_loss": -11.8269681930542, "global_step": 420624, "epoch": 2503} {"train_loss": -11.689180374145508, "global_step": 420625, "epoch": 2503} {"train_loss": -12.032206535339355, "global_step": 420626, "epoch": 2503} {"train_loss": -11.394794464111328, "global_step": 420627, "epoch": 2503} {"train_loss": -11.87285041809082, "global_step": 420628, "epoch": 2503} {"train_loss": -10.918601036071777, "global_step": 420629, "epoch": 2503} {"train_loss": -11.563875198364258, "global_step": 420630, "epoch": 2503} {"train_loss": -10.665328979492188, "global_step": 420631, "epoch": 2503} {"train_loss": -11.957805633544922, "global_step": 420632, "epoch": 2503} {"train_loss": -12.044073104858398, "global_step": 420633, "epoch": 2503} {"train_loss": -11.618915557861328, "global_step": 420634, "epoch": 2503} {"train_loss": -12.168205261230469, "global_step": 420635, "epoch": 2503} {"train_loss": -12.27291488647461, "global_step": 420636, "epoch": 2503} {"train_loss": -12.3997802734375, "global_step": 420637, "epoch": 2503} {"train_loss": -12.44345474243164, "global_step": 420638, "epoch": 2503} {"train_loss": -12.224069595336914, "global_step": 420639, "epoch": 2503} {"train_loss": -12.243081092834473, "global_step": 420640, "epoch": 2503} {"train_loss": -12.401397705078125, "global_step": 420641, "epoch": 2503} {"train_loss": -12.239431381225586, "global_step": 420642, "epoch": 2503} {"train_loss": -12.595745086669922, "global_step": 420643, "epoch": 2503} {"train_loss": -12.46462345123291, "global_step": 420644, "epoch": 2503} {"train_loss": -12.70915412902832, "global_step": 420645, "epoch": 2503} {"train_loss": -12.452112197875977, "global_step": 420646, "epoch": 2503} {"train_loss": -12.488431930541992, "global_step": 420647, "epoch": 2503} {"train_loss": -12.390475273132324, "global_step": 420648, "epoch": 2503} {"train_loss": -12.101762771606445, "global_step": 420649, "epoch": 2503} {"train_loss": -12.285022735595703, "global_step": 420650, "epoch": 2503} {"train_loss": -12.587029457092285, "global_step": 420651, "epoch": 2503} {"train_loss": -12.239091873168945, "global_step": 420652, "epoch": 2503} {"train_loss": -12.310077667236328, "global_step": 420653, "epoch": 2503} {"train_loss": -12.473230361938477, "global_step": 420654, "epoch": 2503} {"train_loss": -11.912633895874023, "global_step": 420655, "epoch": 2503} {"train_loss": -12.086681365966797, "global_step": 420656, "epoch": 2503} {"train_loss": -11.77046012878418, "global_step": 420657, "epoch": 2503} {"train_loss": -12.400989532470703, "global_step": 420658, "epoch": 2503} {"train_loss": -12.056339263916016, "global_step": 420659, "epoch": 2503} {"train_loss": -12.410992622375488, "global_step": 420660, "epoch": 2503} {"train_loss": -12.320255279541016, "global_step": 420661, "epoch": 2503} {"train_loss": -12.205427169799805, "global_step": 420662, "epoch": 2503} {"train_loss": -12.030754089355469, "global_step": 420663, "epoch": 2503} {"train_loss": -12.363807678222656, "global_step": 420664, "epoch": 2503} {"train_loss": -12.249929428100586, "global_step": 420665, "epoch": 2503} {"train_loss": -11.823226928710938, "global_step": 420666, "epoch": 2503} {"train_loss": -11.53083610534668, "global_step": 420667, "epoch": 2503} {"train_loss": -12.514398574829102, "global_step": 420668, "epoch": 2503} {"train_loss": -12.042108535766602, "global_step": 420669, "epoch": 2503} {"train_loss": -12.54659366607666, "global_step": 420670, "epoch": 2503} {"train_loss": -12.274620606785728, "global_step": 420671, "epoch": 2503, "val_loss": 305311.09375} {"train_loss": -11.67137336730957, "global_step": 420672, "epoch": 2504} {"train_loss": -11.818047523498535, "global_step": 420673, "epoch": 2504} {"train_loss": -12.440702438354492, "global_step": 420674, "epoch": 2504} {"train_loss": -12.14786434173584, "global_step": 420675, "epoch": 2504} {"train_loss": -11.981209754943848, "global_step": 420676, "epoch": 2504} {"train_loss": -12.222557067871094, "global_step": 420677, "epoch": 2504} {"train_loss": -11.662124633789062, "global_step": 420678, "epoch": 2504} {"train_loss": -12.169509887695312, "global_step": 420679, "epoch": 2504} {"train_loss": -11.338788032531738, "global_step": 420680, "epoch": 2504} {"train_loss": -11.828391075134277, "global_step": 420681, "epoch": 2504} {"train_loss": -10.785970687866211, "global_step": 420682, "epoch": 2504} {"train_loss": -11.912196159362793, "global_step": 420683, "epoch": 2504} {"train_loss": -10.898479461669922, "global_step": 420684, "epoch": 2504} {"train_loss": -11.619938850402832, "global_step": 420685, "epoch": 2504} {"train_loss": -11.528157234191895, "global_step": 420686, "epoch": 2504} {"train_loss": -10.248430252075195, "global_step": 420687, "epoch": 2504} {"train_loss": -11.891402244567871, "global_step": 420688, "epoch": 2504} {"train_loss": -10.546455383300781, "global_step": 420689, "epoch": 2504} {"train_loss": -11.271760940551758, "global_step": 420690, "epoch": 2504} {"train_loss": -11.436519622802734, "global_step": 420691, "epoch": 2504} {"train_loss": -10.948917388916016, "global_step": 420692, "epoch": 2504} {"train_loss": -11.869333267211914, "global_step": 420693, "epoch": 2504} {"train_loss": -10.447525024414062, "global_step": 420694, "epoch": 2504} {"train_loss": -12.102434158325195, "global_step": 420695, "epoch": 2504} {"train_loss": -11.531620025634766, "global_step": 420696, "epoch": 2504} {"train_loss": -11.36172103881836, "global_step": 420697, "epoch": 2504} {"train_loss": -11.888174057006836, "global_step": 420698, "epoch": 2504} {"train_loss": -11.57581901550293, "global_step": 420699, "epoch": 2504} {"train_loss": -11.987866401672363, "global_step": 420700, "epoch": 2504} {"train_loss": -10.739359855651855, "global_step": 420701, "epoch": 2504} {"train_loss": -12.090063095092773, "global_step": 420702, "epoch": 2504} {"train_loss": -10.869647979736328, "global_step": 420703, "epoch": 2504} {"train_loss": -11.900041580200195, "global_step": 420704, "epoch": 2504} {"train_loss": -11.936882019042969, "global_step": 420705, "epoch": 2504} {"train_loss": -11.418363571166992, "global_step": 420706, "epoch": 2504} {"train_loss": -11.802026748657227, "global_step": 420707, "epoch": 2504} {"train_loss": -11.900753021240234, "global_step": 420708, "epoch": 2504} {"train_loss": -11.427201271057129, "global_step": 420709, "epoch": 2504} {"train_loss": -12.04810905456543, "global_step": 420710, "epoch": 2504} {"train_loss": -11.859451293945312, "global_step": 420711, "epoch": 2504} {"train_loss": -12.115589141845703, "global_step": 420712, "epoch": 2504} {"train_loss": -11.807350158691406, "global_step": 420713, "epoch": 2504} {"train_loss": -12.26462459564209, "global_step": 420714, "epoch": 2504} {"train_loss": -11.946718215942383, "global_step": 420715, "epoch": 2504} {"train_loss": -12.008441925048828, "global_step": 420716, "epoch": 2504} {"train_loss": -12.039949417114258, "global_step": 420717, "epoch": 2504} {"train_loss": -11.554254531860352, "global_step": 420718, "epoch": 2504} {"train_loss": -12.1360445022583, "global_step": 420719, "epoch": 2504} {"train_loss": -11.873313903808594, "global_step": 420720, "epoch": 2504} {"train_loss": -12.518033981323242, "global_step": 420721, "epoch": 2504} {"train_loss": -11.908821105957031, "global_step": 420722, "epoch": 2504} {"train_loss": -12.085590362548828, "global_step": 420723, "epoch": 2504} {"train_loss": -12.092578887939453, "global_step": 420724, "epoch": 2504} {"train_loss": -12.539506912231445, "global_step": 420725, "epoch": 2504} {"train_loss": -12.368364334106445, "global_step": 420726, "epoch": 2504} {"train_loss": -11.951536178588867, "global_step": 420727, "epoch": 2504} {"train_loss": -12.338701248168945, "global_step": 420728, "epoch": 2504} {"train_loss": -12.450944900512695, "global_step": 420729, "epoch": 2504} {"train_loss": -12.398386001586914, "global_step": 420730, "epoch": 2504} {"train_loss": -12.10584831237793, "global_step": 420731, "epoch": 2504} {"train_loss": -12.443974494934082, "global_step": 420732, "epoch": 2504} {"train_loss": -12.491296768188477, "global_step": 420733, "epoch": 2504} {"train_loss": -12.444774627685547, "global_step": 420734, "epoch": 2504} {"train_loss": -12.185196876525879, "global_step": 420735, "epoch": 2504} {"train_loss": -12.352274894714355, "global_step": 420736, "epoch": 2504} {"train_loss": -12.390528678894043, "global_step": 420737, "epoch": 2504} {"train_loss": -12.47279167175293, "global_step": 420738, "epoch": 2504} {"train_loss": -12.231668472290039, "global_step": 420739, "epoch": 2504} {"train_loss": -12.370031356811523, "global_step": 420740, "epoch": 2504} {"train_loss": -12.450839042663574, "global_step": 420741, "epoch": 2504} {"train_loss": -12.415096282958984, "global_step": 420742, "epoch": 2504} {"train_loss": -12.347871780395508, "global_step": 420743, "epoch": 2504} {"train_loss": -12.415788650512695, "global_step": 420744, "epoch": 2504} {"train_loss": -12.3164701461792, "global_step": 420745, "epoch": 2504} {"train_loss": -12.618295669555664, "global_step": 420746, "epoch": 2504} {"train_loss": -12.21407413482666, "global_step": 420747, "epoch": 2504} {"train_loss": -12.582725524902344, "global_step": 420748, "epoch": 2504} {"train_loss": -12.147863388061523, "global_step": 420749, "epoch": 2504} {"train_loss": -12.636404037475586, "global_step": 420750, "epoch": 2504} {"train_loss": -12.56384563446045, "global_step": 420751, "epoch": 2504} {"train_loss": -12.331676483154297, "global_step": 420752, "epoch": 2504} {"train_loss": -12.303556442260742, "global_step": 420753, "epoch": 2504} {"train_loss": -12.328760147094727, "global_step": 420754, "epoch": 2504} {"train_loss": -12.33277702331543, "global_step": 420755, "epoch": 2504} {"train_loss": -12.458656311035156, "global_step": 420756, "epoch": 2504} {"train_loss": -12.333789825439453, "global_step": 420757, "epoch": 2504} {"train_loss": -12.203523635864258, "global_step": 420758, "epoch": 2504} {"train_loss": -12.574991226196289, "global_step": 420759, "epoch": 2504} {"train_loss": -12.684593200683594, "global_step": 420760, "epoch": 2504} {"train_loss": -12.283903121948242, "global_step": 420761, "epoch": 2504} {"train_loss": -12.813821792602539, "global_step": 420762, "epoch": 2504} {"train_loss": -12.329729080200195, "global_step": 420763, "epoch": 2504} {"train_loss": -12.245457649230957, "global_step": 420764, "epoch": 2504} {"train_loss": -12.112199783325195, "global_step": 420765, "epoch": 2504} {"train_loss": -12.514760971069336, "global_step": 420766, "epoch": 2504} {"train_loss": -12.137053489685059, "global_step": 420767, "epoch": 2504} {"train_loss": -12.505451202392578, "global_step": 420768, "epoch": 2504} {"train_loss": -12.120874404907227, "global_step": 420769, "epoch": 2504} {"train_loss": -12.679637908935547, "global_step": 420770, "epoch": 2504} {"train_loss": -12.230856895446777, "global_step": 420771, "epoch": 2504} {"train_loss": -12.642956733703613, "global_step": 420772, "epoch": 2504} {"train_loss": -11.961631774902344, "global_step": 420773, "epoch": 2504} {"train_loss": -12.03113079071045, "global_step": 420774, "epoch": 2504} {"train_loss": -11.674423217773438, "global_step": 420775, "epoch": 2504} {"train_loss": -11.922065734863281, "global_step": 420776, "epoch": 2504} {"train_loss": -11.927802085876465, "global_step": 420777, "epoch": 2504} {"train_loss": -11.8292875289917, "global_step": 420778, "epoch": 2504} {"train_loss": -12.144287109375, "global_step": 420779, "epoch": 2504} {"train_loss": -11.826797485351562, "global_step": 420780, "epoch": 2504} {"train_loss": -12.185160636901855, "global_step": 420781, "epoch": 2504} {"train_loss": -11.712602615356445, "global_step": 420782, "epoch": 2504} {"train_loss": -12.300061225891113, "global_step": 420783, "epoch": 2504} {"train_loss": -12.221959114074707, "global_step": 420784, "epoch": 2504} {"train_loss": -12.460016250610352, "global_step": 420785, "epoch": 2504} {"train_loss": -12.198179244995117, "global_step": 420786, "epoch": 2504} {"train_loss": -12.047491073608398, "global_step": 420787, "epoch": 2504} {"train_loss": -11.744653701782227, "global_step": 420788, "epoch": 2504} {"train_loss": -12.27042007446289, "global_step": 420789, "epoch": 2504} {"train_loss": -12.102359771728516, "global_step": 420790, "epoch": 2504} {"train_loss": -12.097915649414062, "global_step": 420791, "epoch": 2504} {"train_loss": -12.373357772827148, "global_step": 420792, "epoch": 2504} {"train_loss": -12.371623992919922, "global_step": 420793, "epoch": 2504} {"train_loss": -11.539223670959473, "global_step": 420794, "epoch": 2504} {"train_loss": -11.984761238098145, "global_step": 420795, "epoch": 2504} {"train_loss": -11.946703910827637, "global_step": 420796, "epoch": 2504} {"train_loss": -11.325530052185059, "global_step": 420797, "epoch": 2504} {"train_loss": -11.824657440185547, "global_step": 420798, "epoch": 2504} {"train_loss": -12.131269454956055, "global_step": 420799, "epoch": 2504} {"train_loss": -11.814889907836914, "global_step": 420800, "epoch": 2504} {"train_loss": -11.668374061584473, "global_step": 420801, "epoch": 2504} {"train_loss": -11.523737907409668, "global_step": 420802, "epoch": 2504} {"train_loss": -12.252418518066406, "global_step": 420803, "epoch": 2504} {"train_loss": -11.11627197265625, "global_step": 420804, "epoch": 2504} {"train_loss": -11.5975341796875, "global_step": 420805, "epoch": 2504} {"train_loss": -10.823348999023438, "global_step": 420806, "epoch": 2504} {"train_loss": -10.80177116394043, "global_step": 420807, "epoch": 2504} {"train_loss": -11.094991683959961, "global_step": 420808, "epoch": 2504} {"train_loss": -10.606767654418945, "global_step": 420809, "epoch": 2504} {"train_loss": -11.070062637329102, "global_step": 420810, "epoch": 2504} {"train_loss": -11.550275802612305, "global_step": 420811, "epoch": 2504} {"train_loss": -9.878291130065918, "global_step": 420812, "epoch": 2504} {"train_loss": -11.188753128051758, "global_step": 420813, "epoch": 2504} {"train_loss": -10.574813842773438, "global_step": 420814, "epoch": 2504} {"train_loss": -10.354875564575195, "global_step": 420815, "epoch": 2504} {"train_loss": -11.108308792114258, "global_step": 420816, "epoch": 2504} {"train_loss": -10.972034454345703, "global_step": 420817, "epoch": 2504} {"train_loss": -11.30032730102539, "global_step": 420818, "epoch": 2504} {"train_loss": -12.01671028137207, "global_step": 420819, "epoch": 2504} {"train_loss": -10.954145431518555, "global_step": 420820, "epoch": 2504} {"train_loss": -11.470782279968262, "global_step": 420821, "epoch": 2504} {"train_loss": -11.555994033813477, "global_step": 420822, "epoch": 2504} {"train_loss": -11.716665267944336, "global_step": 420823, "epoch": 2504} {"train_loss": -11.892873764038086, "global_step": 420824, "epoch": 2504} {"train_loss": -11.587394714355469, "global_step": 420825, "epoch": 2504} {"train_loss": -11.675443649291992, "global_step": 420826, "epoch": 2504} {"train_loss": -11.542695045471191, "global_step": 420827, "epoch": 2504} {"train_loss": -12.012081146240234, "global_step": 420828, "epoch": 2504} {"train_loss": -11.658002853393555, "global_step": 420829, "epoch": 2504} {"train_loss": -11.780567169189453, "global_step": 420830, "epoch": 2504} {"train_loss": -12.27756118774414, "global_step": 420831, "epoch": 2504} {"train_loss": -12.272163391113281, "global_step": 420832, "epoch": 2504} {"train_loss": -11.890324592590332, "global_step": 420833, "epoch": 2504} {"train_loss": -12.365619659423828, "global_step": 420834, "epoch": 2504} {"train_loss": -12.238736152648926, "global_step": 420835, "epoch": 2504} {"train_loss": -12.16723346710205, "global_step": 420836, "epoch": 2504} {"train_loss": -12.334171295166016, "global_step": 420837, "epoch": 2504} {"train_loss": -12.46218204498291, "global_step": 420838, "epoch": 2504} {"train_loss": -11.902468669982184, "global_step": 420839, "epoch": 2504, "val_loss": 307663.6875} {"train_loss": -12.451129913330078, "global_step": 420840, "epoch": 2505} {"train_loss": -12.263995170593262, "global_step": 420841, "epoch": 2505} {"train_loss": -12.57584285736084, "global_step": 420842, "epoch": 2505} {"train_loss": -12.415037155151367, "global_step": 420843, "epoch": 2505} {"train_loss": -12.308221817016602, "global_step": 420844, "epoch": 2505} {"train_loss": -12.22574520111084, "global_step": 420845, "epoch": 2505} {"train_loss": -12.243685722351074, "global_step": 420846, "epoch": 2505} {"train_loss": -12.302427291870117, "global_step": 420847, "epoch": 2505} {"train_loss": -12.165163040161133, "global_step": 420848, "epoch": 2505} {"train_loss": -12.491358757019043, "global_step": 420849, "epoch": 2505} {"train_loss": -12.211091995239258, "global_step": 420850, "epoch": 2505} {"train_loss": -12.284636497497559, "global_step": 420851, "epoch": 2505} {"train_loss": -11.9395170211792, "global_step": 420852, "epoch": 2505} {"train_loss": -12.052070617675781, "global_step": 420853, "epoch": 2505} {"train_loss": -12.337718963623047, "global_step": 420854, "epoch": 2505} {"train_loss": -12.321142196655273, "global_step": 420855, "epoch": 2505} {"train_loss": -12.45085334777832, "global_step": 420856, "epoch": 2505} {"train_loss": -12.357101440429688, "global_step": 420857, "epoch": 2505} {"train_loss": -12.351515769958496, "global_step": 420858, "epoch": 2505} {"train_loss": -12.700506210327148, "global_step": 420859, "epoch": 2505} {"train_loss": -12.305669784545898, "global_step": 420860, "epoch": 2505} {"train_loss": -12.616331100463867, "global_step": 420861, "epoch": 2505} {"train_loss": -12.318427085876465, "global_step": 420862, "epoch": 2505} {"train_loss": -12.253440856933594, "global_step": 420863, "epoch": 2505} {"train_loss": -12.301395416259766, "global_step": 420864, "epoch": 2505} {"train_loss": -12.308256149291992, "global_step": 420865, "epoch": 2505} {"train_loss": -12.532939910888672, "global_step": 420866, "epoch": 2505} {"train_loss": -12.165143966674805, "global_step": 420867, "epoch": 2505} {"train_loss": -12.621337890625, "global_step": 420868, "epoch": 2505} {"train_loss": -12.510284423828125, "global_step": 420869, "epoch": 2505} {"train_loss": -12.785261154174805, "global_step": 420870, "epoch": 2505} {"train_loss": -12.542750358581543, "global_step": 420871, "epoch": 2505} {"train_loss": -12.34713363647461, "global_step": 420872, "epoch": 2505} {"train_loss": -12.649664878845215, "global_step": 420873, "epoch": 2505} {"train_loss": -12.20283031463623, "global_step": 420874, "epoch": 2505} {"train_loss": -12.739603042602539, "global_step": 420875, "epoch": 2505} {"train_loss": -12.448233604431152, "global_step": 420876, "epoch": 2505} {"train_loss": -12.81494140625, "global_step": 420877, "epoch": 2505} {"train_loss": -12.711795806884766, "global_step": 420878, "epoch": 2505} {"train_loss": -12.815838813781738, "global_step": 420879, "epoch": 2505} {"train_loss": -12.755794525146484, "global_step": 420880, "epoch": 2505} {"train_loss": -12.379358291625977, "global_step": 420881, "epoch": 2505} {"train_loss": -12.72269058227539, "global_step": 420882, "epoch": 2505} {"train_loss": -12.736082077026367, "global_step": 420883, "epoch": 2505} {"train_loss": -12.660955429077148, "global_step": 420884, "epoch": 2505} {"train_loss": -12.39577865600586, "global_step": 420885, "epoch": 2505} {"train_loss": -12.4261474609375, "global_step": 420886, "epoch": 2505} {"train_loss": -12.529767990112305, "global_step": 420887, "epoch": 2505} {"train_loss": -12.408737182617188, "global_step": 420888, "epoch": 2505} {"train_loss": -12.45170783996582, "global_step": 420889, "epoch": 2505} {"train_loss": -12.702001571655273, "global_step": 420890, "epoch": 2505} {"train_loss": -12.402546882629395, "global_step": 420891, "epoch": 2505} {"train_loss": -12.683372497558594, "global_step": 420892, "epoch": 2505} {"train_loss": -12.80428409576416, "global_step": 420893, "epoch": 2505} {"train_loss": -12.657449722290039, "global_step": 420894, "epoch": 2505} {"train_loss": -12.647239685058594, "global_step": 420895, "epoch": 2505} {"train_loss": -12.762788772583008, "global_step": 420896, "epoch": 2505} {"train_loss": -12.671276092529297, "global_step": 420897, "epoch": 2505} {"train_loss": -12.48252010345459, "global_step": 420898, "epoch": 2505} {"train_loss": -12.145350456237793, "global_step": 420899, "epoch": 2505} {"train_loss": -12.484437942504883, "global_step": 420900, "epoch": 2505} {"train_loss": -12.67265796661377, "global_step": 420901, "epoch": 2505} {"train_loss": -12.638835906982422, "global_step": 420902, "epoch": 2505} {"train_loss": -12.597728729248047, "global_step": 420903, "epoch": 2505} {"train_loss": -12.837526321411133, "global_step": 420904, "epoch": 2505} {"train_loss": -12.223003387451172, "global_step": 420905, "epoch": 2505} {"train_loss": -12.566513061523438, "global_step": 420906, "epoch": 2505} {"train_loss": -12.708195686340332, "global_step": 420907, "epoch": 2505} {"train_loss": -12.647331237792969, "global_step": 420908, "epoch": 2505} {"train_loss": -12.51502799987793, "global_step": 420909, "epoch": 2505} {"train_loss": -12.984346389770508, "global_step": 420910, "epoch": 2505} {"train_loss": -12.515212059020996, "global_step": 420911, "epoch": 2505} {"train_loss": -12.676202774047852, "global_step": 420912, "epoch": 2505} {"train_loss": -12.773863792419434, "global_step": 420913, "epoch": 2505} {"train_loss": -12.6177396774292, "global_step": 420914, "epoch": 2505} {"train_loss": -12.59740924835205, "global_step": 420915, "epoch": 2505} {"train_loss": -12.733015060424805, "global_step": 420916, "epoch": 2505} {"train_loss": -12.995935440063477, "global_step": 420917, "epoch": 2505} {"train_loss": -12.738178253173828, "global_step": 420918, "epoch": 2505} {"train_loss": -12.805074691772461, "global_step": 420919, "epoch": 2505} {"train_loss": -12.609001159667969, "global_step": 420920, "epoch": 2505} {"train_loss": -12.546907424926758, "global_step": 420921, "epoch": 2505} {"train_loss": -12.490971565246582, "global_step": 420922, "epoch": 2505} {"train_loss": -12.553963661193848, "global_step": 420923, "epoch": 2505} {"train_loss": -12.538899421691895, "global_step": 420924, "epoch": 2505} {"train_loss": -12.736912727355957, "global_step": 420925, "epoch": 2505} {"train_loss": -12.597492218017578, "global_step": 420926, "epoch": 2505} {"train_loss": -12.730722427368164, "global_step": 420927, "epoch": 2505} {"train_loss": -12.63615608215332, "global_step": 420928, "epoch": 2505} {"train_loss": -12.577020645141602, "global_step": 420929, "epoch": 2505} {"train_loss": -12.529440879821777, "global_step": 420930, "epoch": 2505} {"train_loss": -12.324195861816406, "global_step": 420931, "epoch": 2505} {"train_loss": -11.613138198852539, "global_step": 420932, "epoch": 2505} {"train_loss": -11.184918403625488, "global_step": 420933, "epoch": 2505} {"train_loss": -12.224677085876465, "global_step": 420934, "epoch": 2505} {"train_loss": -12.269037246704102, "global_step": 420935, "epoch": 2505} {"train_loss": -10.986465454101562, "global_step": 420936, "epoch": 2505} {"train_loss": -11.249322891235352, "global_step": 420937, "epoch": 2505} {"train_loss": -12.5566987991333, "global_step": 420938, "epoch": 2505} {"train_loss": -10.514127731323242, "global_step": 420939, "epoch": 2505} {"train_loss": -10.894681930541992, "global_step": 420940, "epoch": 2505} {"train_loss": -12.129674911499023, "global_step": 420941, "epoch": 2505} {"train_loss": -10.363609313964844, "global_step": 420942, "epoch": 2505} {"train_loss": -10.535272598266602, "global_step": 420943, "epoch": 2505} {"train_loss": -11.699045181274414, "global_step": 420944, "epoch": 2505} {"train_loss": -9.269436836242676, "global_step": 420945, "epoch": 2505} {"train_loss": -12.253446578979492, "global_step": 420946, "epoch": 2505} {"train_loss": -9.380786895751953, "global_step": 420947, "epoch": 2505} {"train_loss": -11.463125228881836, "global_step": 420948, "epoch": 2505} {"train_loss": -10.521387100219727, "global_step": 420949, "epoch": 2505} {"train_loss": -10.215761184692383, "global_step": 420950, "epoch": 2505} {"train_loss": -10.211105346679688, "global_step": 420951, "epoch": 2505} {"train_loss": -11.460034370422363, "global_step": 420952, "epoch": 2505} {"train_loss": -10.539348602294922, "global_step": 420953, "epoch": 2505} {"train_loss": -10.241544723510742, "global_step": 420954, "epoch": 2505} {"train_loss": -9.856121063232422, "global_step": 420955, "epoch": 2505} {"train_loss": -10.738398551940918, "global_step": 420956, "epoch": 2505} {"train_loss": -10.759307861328125, "global_step": 420957, "epoch": 2505} {"train_loss": -10.465736389160156, "global_step": 420958, "epoch": 2505} {"train_loss": -10.852375030517578, "global_step": 420959, "epoch": 2505} {"train_loss": -11.574532508850098, "global_step": 420960, "epoch": 2505} {"train_loss": -10.130500793457031, "global_step": 420961, "epoch": 2505} {"train_loss": -11.17989444732666, "global_step": 420962, "epoch": 2505} {"train_loss": -10.313558578491211, "global_step": 420963, "epoch": 2505} {"train_loss": -11.39635944366455, "global_step": 420964, "epoch": 2505} {"train_loss": -11.050665855407715, "global_step": 420965, "epoch": 2505} {"train_loss": -10.160863876342773, "global_step": 420966, "epoch": 2505} {"train_loss": -10.853790283203125, "global_step": 420967, "epoch": 2505} {"train_loss": -11.472238540649414, "global_step": 420968, "epoch": 2505} {"train_loss": -10.459026336669922, "global_step": 420969, "epoch": 2505} {"train_loss": -11.395536422729492, "global_step": 420970, "epoch": 2505} {"train_loss": -11.35100269317627, "global_step": 420971, "epoch": 2505} {"train_loss": -11.443225860595703, "global_step": 420972, "epoch": 2505} {"train_loss": -11.496877670288086, "global_step": 420973, "epoch": 2505} {"train_loss": -11.990493774414062, "global_step": 420974, "epoch": 2505} {"train_loss": -11.797647476196289, "global_step": 420975, "epoch": 2505} {"train_loss": -11.892207145690918, "global_step": 420976, "epoch": 2505} {"train_loss": -11.905088424682617, "global_step": 420977, "epoch": 2505} {"train_loss": -11.527868270874023, "global_step": 420978, "epoch": 2505} {"train_loss": -11.783825874328613, "global_step": 420979, "epoch": 2505} {"train_loss": -11.700152397155762, "global_step": 420980, "epoch": 2505} {"train_loss": -12.260133743286133, "global_step": 420981, "epoch": 2505} {"train_loss": -11.47183609008789, "global_step": 420982, "epoch": 2505} {"train_loss": -11.838614463806152, "global_step": 420983, "epoch": 2505} {"train_loss": -12.096559524536133, "global_step": 420984, "epoch": 2505} {"train_loss": -12.001466751098633, "global_step": 420985, "epoch": 2505} {"train_loss": -11.539532661437988, "global_step": 420986, "epoch": 2505} {"train_loss": -12.015911102294922, "global_step": 420987, "epoch": 2505} {"train_loss": -11.071900367736816, "global_step": 420988, "epoch": 2505} {"train_loss": -12.098686218261719, "global_step": 420989, "epoch": 2505} {"train_loss": -11.936328887939453, "global_step": 420990, "epoch": 2505} {"train_loss": -12.060422897338867, "global_step": 420991, "epoch": 2505} {"train_loss": -11.703605651855469, "global_step": 420992, "epoch": 2505} {"train_loss": -11.95175552368164, "global_step": 420993, "epoch": 2505} {"train_loss": -11.9325532913208, "global_step": 420994, "epoch": 2505} {"train_loss": -12.128900527954102, "global_step": 420995, "epoch": 2505} {"train_loss": -11.71109390258789, "global_step": 420996, "epoch": 2505} {"train_loss": -12.410006523132324, "global_step": 420997, "epoch": 2505} {"train_loss": -11.718379974365234, "global_step": 420998, "epoch": 2505} {"train_loss": -12.420943260192871, "global_step": 420999, "epoch": 2505} {"train_loss": -11.922013282775879, "global_step": 421000, "epoch": 2505} {"train_loss": -12.293859481811523, "global_step": 421001, "epoch": 2505} {"train_loss": -12.213422775268555, "global_step": 421002, "epoch": 2505} {"train_loss": -12.405965805053711, "global_step": 421003, "epoch": 2505} {"train_loss": -11.747686386108398, "global_step": 421004, "epoch": 2505} {"train_loss": -12.225872993469238, "global_step": 421005, "epoch": 2505} {"train_loss": -11.972609519958496, "global_step": 421006, "epoch": 2505} {"train_loss": -12.016952435175577, "global_step": 421007, "epoch": 2505, "val_loss": 306999.78125, "train_action_mse_error": 2.6897315979003906} {"train_loss": -11.86777114868164, "global_step": 421008, "epoch": 2506} {"train_loss": -12.285038948059082, "global_step": 421009, "epoch": 2506} {"train_loss": -12.195990562438965, "global_step": 421010, "epoch": 2506} {"train_loss": -12.401317596435547, "global_step": 421011, "epoch": 2506} {"train_loss": -12.054641723632812, "global_step": 421012, "epoch": 2506} {"train_loss": -12.356539726257324, "global_step": 421013, "epoch": 2506} {"train_loss": -12.30672550201416, "global_step": 421014, "epoch": 2506} {"train_loss": -12.339191436767578, "global_step": 421015, "epoch": 2506} {"train_loss": -11.984404563903809, "global_step": 421016, "epoch": 2506} {"train_loss": -12.59342098236084, "global_step": 421017, "epoch": 2506} {"train_loss": -12.335063934326172, "global_step": 421018, "epoch": 2506} {"train_loss": -12.486082077026367, "global_step": 421019, "epoch": 2506} {"train_loss": -12.265740394592285, "global_step": 421020, "epoch": 2506} {"train_loss": -12.52097225189209, "global_step": 421021, "epoch": 2506} {"train_loss": -12.536758422851562, "global_step": 421022, "epoch": 2506} {"train_loss": -12.434961318969727, "global_step": 421023, "epoch": 2506} {"train_loss": -12.53476333618164, "global_step": 421024, "epoch": 2506} {"train_loss": -12.590463638305664, "global_step": 421025, "epoch": 2506} {"train_loss": -12.284517288208008, "global_step": 421026, "epoch": 2506} {"train_loss": -12.652767181396484, "global_step": 421027, "epoch": 2506} {"train_loss": -12.384929656982422, "global_step": 421028, "epoch": 2506} {"train_loss": -12.645197868347168, "global_step": 421029, "epoch": 2506} {"train_loss": -12.158496856689453, "global_step": 421030, "epoch": 2506} {"train_loss": -12.667228698730469, "global_step": 421031, "epoch": 2506} {"train_loss": -12.641626358032227, "global_step": 421032, "epoch": 2506} {"train_loss": -12.396432876586914, "global_step": 421033, "epoch": 2506} {"train_loss": -12.278286933898926, "global_step": 421034, "epoch": 2506} {"train_loss": -12.661956787109375, "global_step": 421035, "epoch": 2506} {"train_loss": -12.680063247680664, "global_step": 421036, "epoch": 2506} {"train_loss": -12.645923614501953, "global_step": 421037, "epoch": 2506} {"train_loss": -12.553725242614746, "global_step": 421038, "epoch": 2506} {"train_loss": -12.795940399169922, "global_step": 421039, "epoch": 2506} {"train_loss": -12.636630058288574, "global_step": 421040, "epoch": 2506} {"train_loss": -12.774121284484863, "global_step": 421041, "epoch": 2506} {"train_loss": -12.694498062133789, "global_step": 421042, "epoch": 2506} {"train_loss": -12.664863586425781, "global_step": 421043, "epoch": 2506} {"train_loss": -12.715802192687988, "global_step": 421044, "epoch": 2506} {"train_loss": -12.790117263793945, "global_step": 421045, "epoch": 2506} {"train_loss": -12.616913795471191, "global_step": 421046, "epoch": 2506} {"train_loss": -12.462223052978516, "global_step": 421047, "epoch": 2506} {"train_loss": -12.53992748260498, "global_step": 421048, "epoch": 2506} {"train_loss": -12.571871757507324, "global_step": 421049, "epoch": 2506} {"train_loss": -12.562528610229492, "global_step": 421050, "epoch": 2506} {"train_loss": -12.167769432067871, "global_step": 421051, "epoch": 2506} {"train_loss": -12.876276016235352, "global_step": 421052, "epoch": 2506} {"train_loss": -12.58774471282959, "global_step": 421053, "epoch": 2506} {"train_loss": -12.486724853515625, "global_step": 421054, "epoch": 2506} {"train_loss": -12.776253700256348, "global_step": 421055, "epoch": 2506} {"train_loss": -12.784913063049316, "global_step": 421056, "epoch": 2506} {"train_loss": -12.512687683105469, "global_step": 421057, "epoch": 2506} {"train_loss": -12.753814697265625, "global_step": 421058, "epoch": 2506} {"train_loss": -12.668829917907715, "global_step": 421059, "epoch": 2506} {"train_loss": -12.846136093139648, "global_step": 421060, "epoch": 2506} {"train_loss": -12.705299377441406, "global_step": 421061, "epoch": 2506} {"train_loss": -12.824396133422852, "global_step": 421062, "epoch": 2506} {"train_loss": -12.3975830078125, "global_step": 421063, "epoch": 2506} {"train_loss": -12.682668685913086, "global_step": 421064, "epoch": 2506} {"train_loss": -12.405235290527344, "global_step": 421065, "epoch": 2506} {"train_loss": -12.70360279083252, "global_step": 421066, "epoch": 2506} {"train_loss": -12.251720428466797, "global_step": 421067, "epoch": 2506} {"train_loss": -12.26727294921875, "global_step": 421068, "epoch": 2506} {"train_loss": -12.612327575683594, "global_step": 421069, "epoch": 2506} {"train_loss": -12.438495635986328, "global_step": 421070, "epoch": 2506} {"train_loss": -11.670181274414062, "global_step": 421071, "epoch": 2506} {"train_loss": -12.590225219726562, "global_step": 421072, "epoch": 2506} {"train_loss": -12.679919242858887, "global_step": 421073, "epoch": 2506} {"train_loss": -12.343965530395508, "global_step": 421074, "epoch": 2506} {"train_loss": -11.995295524597168, "global_step": 421075, "epoch": 2506} {"train_loss": -12.450847625732422, "global_step": 421076, "epoch": 2506} {"train_loss": -12.104236602783203, "global_step": 421077, "epoch": 2506} {"train_loss": -12.419608116149902, "global_step": 421078, "epoch": 2506} {"train_loss": -12.239006996154785, "global_step": 421079, "epoch": 2506} {"train_loss": -12.475848197937012, "global_step": 421080, "epoch": 2506} {"train_loss": -11.989789962768555, "global_step": 421081, "epoch": 2506} {"train_loss": -12.459272384643555, "global_step": 421082, "epoch": 2506} {"train_loss": -12.586817741394043, "global_step": 421083, "epoch": 2506} {"train_loss": -12.215276718139648, "global_step": 421084, "epoch": 2506} {"train_loss": -12.637421607971191, "global_step": 421085, "epoch": 2506} {"train_loss": -12.040138244628906, "global_step": 421086, "epoch": 2506} {"train_loss": -12.837919235229492, "global_step": 421087, "epoch": 2506} {"train_loss": -12.063161849975586, "global_step": 421088, "epoch": 2506} {"train_loss": -12.172813415527344, "global_step": 421089, "epoch": 2506} {"train_loss": -10.875608444213867, "global_step": 421090, "epoch": 2506} {"train_loss": -11.503999710083008, "global_step": 421091, "epoch": 2506} {"train_loss": -11.634665489196777, "global_step": 421092, "epoch": 2506} {"train_loss": -12.046335220336914, "global_step": 421093, "epoch": 2506} {"train_loss": -12.45787239074707, "global_step": 421094, "epoch": 2506} {"train_loss": -12.270317077636719, "global_step": 421095, "epoch": 2506} {"train_loss": -12.01402473449707, "global_step": 421096, "epoch": 2506} {"train_loss": -12.327154159545898, "global_step": 421097, "epoch": 2506} {"train_loss": -11.49258804321289, "global_step": 421098, "epoch": 2506} {"train_loss": -12.395569801330566, "global_step": 421099, "epoch": 2506} {"train_loss": -11.833163261413574, "global_step": 421100, "epoch": 2506} {"train_loss": -11.98223876953125, "global_step": 421101, "epoch": 2506} {"train_loss": -11.905632972717285, "global_step": 421102, "epoch": 2506} {"train_loss": -12.552112579345703, "global_step": 421103, "epoch": 2506} {"train_loss": -11.972204208374023, "global_step": 421104, "epoch": 2506} {"train_loss": -11.867956161499023, "global_step": 421105, "epoch": 2506} {"train_loss": -11.288196563720703, "global_step": 421106, "epoch": 2506} {"train_loss": -12.284563064575195, "global_step": 421107, "epoch": 2506} {"train_loss": -10.562662124633789, "global_step": 421108, "epoch": 2506} {"train_loss": -10.45853328704834, "global_step": 421109, "epoch": 2506} {"train_loss": -11.893144607543945, "global_step": 421110, "epoch": 2506} {"train_loss": -10.396991729736328, "global_step": 421111, "epoch": 2506} {"train_loss": -9.711928367614746, "global_step": 421112, "epoch": 2506} {"train_loss": -9.84426498413086, "global_step": 421113, "epoch": 2506} {"train_loss": -8.941225051879883, "global_step": 421114, "epoch": 2506} {"train_loss": -10.28438949584961, "global_step": 421115, "epoch": 2506} {"train_loss": -10.666852951049805, "global_step": 421116, "epoch": 2506} {"train_loss": -9.720707893371582, "global_step": 421117, "epoch": 2506} {"train_loss": -10.908819198608398, "global_step": 421118, "epoch": 2506} {"train_loss": -11.050884246826172, "global_step": 421119, "epoch": 2506} {"train_loss": -10.549449920654297, "global_step": 421120, "epoch": 2506} {"train_loss": -11.236637115478516, "global_step": 421121, "epoch": 2506} {"train_loss": -10.964372634887695, "global_step": 421122, "epoch": 2506} {"train_loss": -10.642289161682129, "global_step": 421123, "epoch": 2506} {"train_loss": -12.190771102905273, "global_step": 421124, "epoch": 2506} {"train_loss": -9.315004348754883, "global_step": 421125, "epoch": 2506} {"train_loss": -12.0927734375, "global_step": 421126, "epoch": 2506} {"train_loss": -8.123554229736328, "global_step": 421127, "epoch": 2506} {"train_loss": -11.325712203979492, "global_step": 421128, "epoch": 2506} {"train_loss": -8.810193061828613, "global_step": 421129, "epoch": 2506} {"train_loss": -9.438291549682617, "global_step": 421130, "epoch": 2506} {"train_loss": -10.38673210144043, "global_step": 421131, "epoch": 2506} {"train_loss": -9.227052688598633, "global_step": 421132, "epoch": 2506} {"train_loss": -10.362520217895508, "global_step": 421133, "epoch": 2506} {"train_loss": -9.78715705871582, "global_step": 421134, "epoch": 2506} {"train_loss": -9.48278522491455, "global_step": 421135, "epoch": 2506} {"train_loss": -11.301307678222656, "global_step": 421136, "epoch": 2506} {"train_loss": -10.48869514465332, "global_step": 421137, "epoch": 2506} {"train_loss": -10.384117126464844, "global_step": 421138, "epoch": 2506} {"train_loss": -10.397786140441895, "global_step": 421139, "epoch": 2506} {"train_loss": -9.235279083251953, "global_step": 421140, "epoch": 2506} {"train_loss": -8.867225646972656, "global_step": 421141, "epoch": 2506} {"train_loss": -9.297658920288086, "global_step": 421142, "epoch": 2506} {"train_loss": -10.669000625610352, "global_step": 421143, "epoch": 2506} {"train_loss": -10.737470626831055, "global_step": 421144, "epoch": 2506} {"train_loss": -10.364608764648438, "global_step": 421145, "epoch": 2506} {"train_loss": -10.273916244506836, "global_step": 421146, "epoch": 2506} {"train_loss": -10.63802719116211, "global_step": 421147, "epoch": 2506} {"train_loss": -11.144609451293945, "global_step": 421148, "epoch": 2506} {"train_loss": -11.589656829833984, "global_step": 421149, "epoch": 2506} {"train_loss": -11.626617431640625, "global_step": 421150, "epoch": 2506} {"train_loss": -11.8153076171875, "global_step": 421151, "epoch": 2506} {"train_loss": -11.38093376159668, "global_step": 421152, "epoch": 2506} {"train_loss": -11.29411792755127, "global_step": 421153, "epoch": 2506} {"train_loss": -11.732263565063477, "global_step": 421154, "epoch": 2506} {"train_loss": -11.058749198913574, "global_step": 421155, "epoch": 2506} {"train_loss": -11.193843841552734, "global_step": 421156, "epoch": 2506} {"train_loss": -11.502815246582031, "global_step": 421157, "epoch": 2506} {"train_loss": -11.399848937988281, "global_step": 421158, "epoch": 2506} {"train_loss": -11.605306625366211, "global_step": 421159, "epoch": 2506} {"train_loss": -11.5958251953125, "global_step": 421160, "epoch": 2506} {"train_loss": -11.95769214630127, "global_step": 421161, "epoch": 2506} {"train_loss": -10.99152946472168, "global_step": 421162, "epoch": 2506} {"train_loss": -11.346477508544922, "global_step": 421163, "epoch": 2506} {"train_loss": -11.561840057373047, "global_step": 421164, "epoch": 2506} {"train_loss": -11.474868774414062, "global_step": 421165, "epoch": 2506} {"train_loss": -11.76774787902832, "global_step": 421166, "epoch": 2506} {"train_loss": -11.844430923461914, "global_step": 421167, "epoch": 2506} {"train_loss": -12.063335418701172, "global_step": 421168, "epoch": 2506} {"train_loss": -12.16468334197998, "global_step": 421169, "epoch": 2506} {"train_loss": -11.806585311889648, "global_step": 421170, "epoch": 2506} {"train_loss": -11.911738395690918, "global_step": 421171, "epoch": 2506} {"train_loss": -11.513219833374023, "global_step": 421172, "epoch": 2506} {"train_loss": -11.885854721069336, "global_step": 421173, "epoch": 2506} {"train_loss": -12.06109619140625, "global_step": 421174, "epoch": 2506} {"train_loss": -11.746759312493461, "global_step": 421175, "epoch": 2506, "val_loss": 305385.09375} {"train_loss": -11.978361129760742, "global_step": 421176, "epoch": 2507} {"train_loss": -11.477457046508789, "global_step": 421177, "epoch": 2507} {"train_loss": -12.122057914733887, "global_step": 421178, "epoch": 2507} {"train_loss": -11.717082023620605, "global_step": 421179, "epoch": 2507} {"train_loss": -11.819086074829102, "global_step": 421180, "epoch": 2507} {"train_loss": -11.642305374145508, "global_step": 421181, "epoch": 2507} {"train_loss": -12.28188419342041, "global_step": 421182, "epoch": 2507} {"train_loss": -10.961760520935059, "global_step": 421183, "epoch": 2507} {"train_loss": -12.33169937133789, "global_step": 421184, "epoch": 2507} {"train_loss": -11.862066268920898, "global_step": 421185, "epoch": 2507} {"train_loss": -12.019977569580078, "global_step": 421186, "epoch": 2507} {"train_loss": -11.670211791992188, "global_step": 421187, "epoch": 2507} {"train_loss": -11.71858024597168, "global_step": 421188, "epoch": 2507} {"train_loss": -11.884498596191406, "global_step": 421189, "epoch": 2507} {"train_loss": -11.888359069824219, "global_step": 421190, "epoch": 2507} {"train_loss": -12.11624526977539, "global_step": 421191, "epoch": 2507} {"train_loss": -11.776826858520508, "global_step": 421192, "epoch": 2507} {"train_loss": -12.123185157775879, "global_step": 421193, "epoch": 2507} {"train_loss": -12.051380157470703, "global_step": 421194, "epoch": 2507} {"train_loss": -12.098043441772461, "global_step": 421195, "epoch": 2507} {"train_loss": -12.079349517822266, "global_step": 421196, "epoch": 2507} {"train_loss": -12.069320678710938, "global_step": 421197, "epoch": 2507} {"train_loss": -12.099203109741211, "global_step": 421198, "epoch": 2507} {"train_loss": -12.260388374328613, "global_step": 421199, "epoch": 2507} {"train_loss": -12.421236038208008, "global_step": 421200, "epoch": 2507} {"train_loss": -11.993467330932617, "global_step": 421201, "epoch": 2507} {"train_loss": -12.270257949829102, "global_step": 421202, "epoch": 2507} {"train_loss": -12.250062942504883, "global_step": 421203, "epoch": 2507} {"train_loss": -12.408687591552734, "global_step": 421204, "epoch": 2507} {"train_loss": -12.463050842285156, "global_step": 421205, "epoch": 2507} {"train_loss": -12.216188430786133, "global_step": 421206, "epoch": 2507} {"train_loss": -12.398236274719238, "global_step": 421207, "epoch": 2507} {"train_loss": -12.622917175292969, "global_step": 421208, "epoch": 2507} {"train_loss": -12.416000366210938, "global_step": 421209, "epoch": 2507} {"train_loss": -12.311433792114258, "global_step": 421210, "epoch": 2507} {"train_loss": -12.476816177368164, "global_step": 421211, "epoch": 2507} {"train_loss": -12.20526123046875, "global_step": 421212, "epoch": 2507} {"train_loss": -12.604976654052734, "global_step": 421213, "epoch": 2507} {"train_loss": -12.362325668334961, "global_step": 421214, "epoch": 2507} {"train_loss": -12.463839530944824, "global_step": 421215, "epoch": 2507} {"train_loss": -12.186522483825684, "global_step": 421216, "epoch": 2507} {"train_loss": -12.557594299316406, "global_step": 421217, "epoch": 2507} {"train_loss": -12.232855796813965, "global_step": 421218, "epoch": 2507} {"train_loss": -12.399009704589844, "global_step": 421219, "epoch": 2507} {"train_loss": -12.444986343383789, "global_step": 421220, "epoch": 2507} {"train_loss": -12.492826461791992, "global_step": 421221, "epoch": 2507} {"train_loss": -12.538430213928223, "global_step": 421222, "epoch": 2507} {"train_loss": -12.447874069213867, "global_step": 421223, "epoch": 2507} {"train_loss": -12.425169944763184, "global_step": 421224, "epoch": 2507} {"train_loss": -12.352036476135254, "global_step": 421225, "epoch": 2507} {"train_loss": -12.543750762939453, "global_step": 421226, "epoch": 2507} {"train_loss": -12.569875717163086, "global_step": 421227, "epoch": 2507} {"train_loss": -12.693060874938965, "global_step": 421228, "epoch": 2507} {"train_loss": -12.540096282958984, "global_step": 421229, "epoch": 2507} {"train_loss": -12.478879928588867, "global_step": 421230, "epoch": 2507} {"train_loss": -12.494333267211914, "global_step": 421231, "epoch": 2507} {"train_loss": -12.768754959106445, "global_step": 421232, "epoch": 2507} {"train_loss": -12.255982398986816, "global_step": 421233, "epoch": 2507} {"train_loss": -12.327176094055176, "global_step": 421234, "epoch": 2507} {"train_loss": -12.487010955810547, "global_step": 421235, "epoch": 2507} {"train_loss": -12.32167911529541, "global_step": 421236, "epoch": 2507} {"train_loss": -11.904067993164062, "global_step": 421237, "epoch": 2507} {"train_loss": -12.442405700683594, "global_step": 421238, "epoch": 2507} {"train_loss": -12.428074836730957, "global_step": 421239, "epoch": 2507} {"train_loss": -12.18364429473877, "global_step": 421240, "epoch": 2507} {"train_loss": -12.03817081451416, "global_step": 421241, "epoch": 2507} {"train_loss": -12.619552612304688, "global_step": 421242, "epoch": 2507} {"train_loss": -11.986153602600098, "global_step": 421243, "epoch": 2507} {"train_loss": -12.016626358032227, "global_step": 421244, "epoch": 2507} {"train_loss": -12.41975212097168, "global_step": 421245, "epoch": 2507} {"train_loss": -12.339210510253906, "global_step": 421246, "epoch": 2507} {"train_loss": -12.0139741897583, "global_step": 421247, "epoch": 2507} {"train_loss": -12.149295806884766, "global_step": 421248, "epoch": 2507} {"train_loss": -12.553909301757812, "global_step": 421249, "epoch": 2507} {"train_loss": -12.278773307800293, "global_step": 421250, "epoch": 2507} {"train_loss": -11.92325496673584, "global_step": 421251, "epoch": 2507} {"train_loss": -12.600383758544922, "global_step": 421252, "epoch": 2507} {"train_loss": -11.51302433013916, "global_step": 421253, "epoch": 2507} {"train_loss": -12.32689094543457, "global_step": 421254, "epoch": 2507} {"train_loss": -11.983809471130371, "global_step": 421255, "epoch": 2507} {"train_loss": -11.550590515136719, "global_step": 421256, "epoch": 2507} {"train_loss": -12.196144104003906, "global_step": 421257, "epoch": 2507} {"train_loss": -11.627511978149414, "global_step": 421258, "epoch": 2507} {"train_loss": -11.649940490722656, "global_step": 421259, "epoch": 2507} {"train_loss": -12.303607940673828, "global_step": 421260, "epoch": 2507} {"train_loss": -12.033395767211914, "global_step": 421261, "epoch": 2507} {"train_loss": -11.21122932434082, "global_step": 421262, "epoch": 2507} {"train_loss": -12.54949951171875, "global_step": 421263, "epoch": 2507} {"train_loss": -11.939168930053711, "global_step": 421264, "epoch": 2507} {"train_loss": -11.615415573120117, "global_step": 421265, "epoch": 2507} {"train_loss": -12.184976577758789, "global_step": 421266, "epoch": 2507} {"train_loss": -11.938956260681152, "global_step": 421267, "epoch": 2507} {"train_loss": -12.118916511535645, "global_step": 421268, "epoch": 2507} {"train_loss": -12.242866516113281, "global_step": 421269, "epoch": 2507} {"train_loss": -12.122133255004883, "global_step": 421270, "epoch": 2507} {"train_loss": -12.31862735748291, "global_step": 421271, "epoch": 2507} {"train_loss": -11.88640022277832, "global_step": 421272, "epoch": 2507} {"train_loss": -12.315000534057617, "global_step": 421273, "epoch": 2507} {"train_loss": -12.563886642456055, "global_step": 421274, "epoch": 2507} {"train_loss": -12.084933280944824, "global_step": 421275, "epoch": 2507} {"train_loss": -11.927549362182617, "global_step": 421276, "epoch": 2507} {"train_loss": -11.529409408569336, "global_step": 421277, "epoch": 2507} {"train_loss": -11.826301574707031, "global_step": 421278, "epoch": 2507} {"train_loss": -12.526844024658203, "global_step": 421279, "epoch": 2507} {"train_loss": -12.385285377502441, "global_step": 421280, "epoch": 2507} {"train_loss": -11.993958473205566, "global_step": 421281, "epoch": 2507} {"train_loss": -12.28445053100586, "global_step": 421282, "epoch": 2507} {"train_loss": -12.372751235961914, "global_step": 421283, "epoch": 2507} {"train_loss": -12.133489608764648, "global_step": 421284, "epoch": 2507} {"train_loss": -12.40109920501709, "global_step": 421285, "epoch": 2507} {"train_loss": -12.118124008178711, "global_step": 421286, "epoch": 2507} {"train_loss": -12.675760269165039, "global_step": 421287, "epoch": 2507} {"train_loss": -12.151203155517578, "global_step": 421288, "epoch": 2507} {"train_loss": -12.175135612487793, "global_step": 421289, "epoch": 2507} {"train_loss": -12.474388122558594, "global_step": 421290, "epoch": 2507} {"train_loss": -12.04958724975586, "global_step": 421291, "epoch": 2507} {"train_loss": -12.555727005004883, "global_step": 421292, "epoch": 2507} {"train_loss": -12.595012664794922, "global_step": 421293, "epoch": 2507} {"train_loss": -12.434247970581055, "global_step": 421294, "epoch": 2507} {"train_loss": -12.792755126953125, "global_step": 421295, "epoch": 2507} {"train_loss": -12.264446258544922, "global_step": 421296, "epoch": 2507} {"train_loss": -12.586651802062988, "global_step": 421297, "epoch": 2507} {"train_loss": -12.576030731201172, "global_step": 421298, "epoch": 2507} {"train_loss": -12.594807624816895, "global_step": 421299, "epoch": 2507} {"train_loss": -12.587072372436523, "global_step": 421300, "epoch": 2507} {"train_loss": -12.834503173828125, "global_step": 421301, "epoch": 2507} {"train_loss": -12.573148727416992, "global_step": 421302, "epoch": 2507} {"train_loss": -12.478548049926758, "global_step": 421303, "epoch": 2507} {"train_loss": -12.53521728515625, "global_step": 421304, "epoch": 2507} {"train_loss": -12.663411140441895, "global_step": 421305, "epoch": 2507} {"train_loss": -12.597005844116211, "global_step": 421306, "epoch": 2507} {"train_loss": -12.620525360107422, "global_step": 421307, "epoch": 2507} {"train_loss": -12.617952346801758, "global_step": 421308, "epoch": 2507} {"train_loss": -12.588813781738281, "global_step": 421309, "epoch": 2507} {"train_loss": -12.755880355834961, "global_step": 421310, "epoch": 2507} {"train_loss": -12.560922622680664, "global_step": 421311, "epoch": 2507} {"train_loss": -12.43235969543457, "global_step": 421312, "epoch": 2507} {"train_loss": -12.375329971313477, "global_step": 421313, "epoch": 2507} {"train_loss": -12.880672454833984, "global_step": 421314, "epoch": 2507} {"train_loss": -12.070051193237305, "global_step": 421315, "epoch": 2507} {"train_loss": -12.538370132446289, "global_step": 421316, "epoch": 2507} {"train_loss": -12.555964469909668, "global_step": 421317, "epoch": 2507} {"train_loss": -12.315937042236328, "global_step": 421318, "epoch": 2507} {"train_loss": -12.088476181030273, "global_step": 421319, "epoch": 2507} {"train_loss": -12.132405281066895, "global_step": 421320, "epoch": 2507} {"train_loss": -12.298376083374023, "global_step": 421321, "epoch": 2507} {"train_loss": -12.306124687194824, "global_step": 421322, "epoch": 2507} {"train_loss": -12.32961368560791, "global_step": 421323, "epoch": 2507} {"train_loss": -12.077972412109375, "global_step": 421324, "epoch": 2507} {"train_loss": -12.272969245910645, "global_step": 421325, "epoch": 2507} {"train_loss": -12.531352996826172, "global_step": 421326, "epoch": 2507} {"train_loss": -12.316648483276367, "global_step": 421327, "epoch": 2507} {"train_loss": -12.65782642364502, "global_step": 421328, "epoch": 2507} {"train_loss": -12.462636947631836, "global_step": 421329, "epoch": 2507} {"train_loss": -12.747967720031738, "global_step": 421330, "epoch": 2507} {"train_loss": -12.76816177368164, "global_step": 421331, "epoch": 2507} {"train_loss": -12.643170356750488, "global_step": 421332, "epoch": 2507} {"train_loss": -12.687173843383789, "global_step": 421333, "epoch": 2507} {"train_loss": -12.378070831298828, "global_step": 421334, "epoch": 2507} {"train_loss": -12.798386573791504, "global_step": 421335, "epoch": 2507} {"train_loss": -12.729706764221191, "global_step": 421336, "epoch": 2507} {"train_loss": -12.719115257263184, "global_step": 421337, "epoch": 2507} {"train_loss": -12.506208419799805, "global_step": 421338, "epoch": 2507} {"train_loss": -12.389676094055176, "global_step": 421339, "epoch": 2507} {"train_loss": -12.363271713256836, "global_step": 421340, "epoch": 2507} {"train_loss": -12.561264038085938, "global_step": 421341, "epoch": 2507} {"train_loss": -12.323650360107422, "global_step": 421342, "epoch": 2507} {"train_loss": -12.281430017380487, "global_step": 421343, "epoch": 2507, "val_loss": 307827.46875} {"train_loss": -12.512245178222656, "global_step": 421344, "epoch": 2508} {"train_loss": -11.874870300292969, "global_step": 421345, "epoch": 2508} {"train_loss": -12.089303970336914, "global_step": 421346, "epoch": 2508} {"train_loss": -11.543633460998535, "global_step": 421347, "epoch": 2508} {"train_loss": -12.339045524597168, "global_step": 421348, "epoch": 2508} {"train_loss": -11.32201862335205, "global_step": 421349, "epoch": 2508} {"train_loss": -12.02232837677002, "global_step": 421350, "epoch": 2508} {"train_loss": -11.800670623779297, "global_step": 421351, "epoch": 2508} {"train_loss": -11.648983001708984, "global_step": 421352, "epoch": 2508} {"train_loss": -11.669121742248535, "global_step": 421353, "epoch": 2508} {"train_loss": -10.645563125610352, "global_step": 421354, "epoch": 2508} {"train_loss": -12.19624137878418, "global_step": 421355, "epoch": 2508} {"train_loss": -10.836397171020508, "global_step": 421356, "epoch": 2508} {"train_loss": -11.963708877563477, "global_step": 421357, "epoch": 2508} {"train_loss": -11.912561416625977, "global_step": 421358, "epoch": 2508} {"train_loss": -11.158748626708984, "global_step": 421359, "epoch": 2508} {"train_loss": -11.509821891784668, "global_step": 421360, "epoch": 2508} {"train_loss": -11.158015251159668, "global_step": 421361, "epoch": 2508} {"train_loss": -11.699164390563965, "global_step": 421362, "epoch": 2508} {"train_loss": -11.867124557495117, "global_step": 421363, "epoch": 2508} {"train_loss": -11.09366512298584, "global_step": 421364, "epoch": 2508} {"train_loss": -10.522272109985352, "global_step": 421365, "epoch": 2508} {"train_loss": -11.277956008911133, "global_step": 421366, "epoch": 2508} {"train_loss": -11.270601272583008, "global_step": 421367, "epoch": 2508} {"train_loss": -11.448692321777344, "global_step": 421368, "epoch": 2508} {"train_loss": -11.404013633728027, "global_step": 421369, "epoch": 2508} {"train_loss": -11.823307037353516, "global_step": 421370, "epoch": 2508} {"train_loss": -11.294507026672363, "global_step": 421371, "epoch": 2508} {"train_loss": -11.623373031616211, "global_step": 421372, "epoch": 2508} {"train_loss": -11.379600524902344, "global_step": 421373, "epoch": 2508} {"train_loss": -11.484888076782227, "global_step": 421374, "epoch": 2508} {"train_loss": -12.311455726623535, "global_step": 421375, "epoch": 2508} {"train_loss": -11.461681365966797, "global_step": 421376, "epoch": 2508} {"train_loss": -11.455572128295898, "global_step": 421377, "epoch": 2508} {"train_loss": -12.325716018676758, "global_step": 421378, "epoch": 2508} {"train_loss": -10.932356834411621, "global_step": 421379, "epoch": 2508} {"train_loss": -12.517822265625, "global_step": 421380, "epoch": 2508} {"train_loss": -11.37925910949707, "global_step": 421381, "epoch": 2508} {"train_loss": -12.108550071716309, "global_step": 421382, "epoch": 2508} {"train_loss": -12.12162971496582, "global_step": 421383, "epoch": 2508} {"train_loss": -12.009443283081055, "global_step": 421384, "epoch": 2508} {"train_loss": -11.974471092224121, "global_step": 421385, "epoch": 2508} {"train_loss": -11.946138381958008, "global_step": 421386, "epoch": 2508} {"train_loss": -11.137189865112305, "global_step": 421387, "epoch": 2508} {"train_loss": -11.786235809326172, "global_step": 421388, "epoch": 2508} {"train_loss": -11.652780532836914, "global_step": 421389, "epoch": 2508} {"train_loss": -11.463570594787598, "global_step": 421390, "epoch": 2508} {"train_loss": -11.79442024230957, "global_step": 421391, "epoch": 2508} {"train_loss": -10.768087387084961, "global_step": 421392, "epoch": 2508} {"train_loss": -12.025238037109375, "global_step": 421393, "epoch": 2508} {"train_loss": -11.36929702758789, "global_step": 421394, "epoch": 2508} {"train_loss": -11.72283935546875, "global_step": 421395, "epoch": 2508} {"train_loss": -11.704266548156738, "global_step": 421396, "epoch": 2508} {"train_loss": -11.467894554138184, "global_step": 421397, "epoch": 2508} {"train_loss": -11.466432571411133, "global_step": 421398, "epoch": 2508} {"train_loss": -12.128289222717285, "global_step": 421399, "epoch": 2508} {"train_loss": -11.714083671569824, "global_step": 421400, "epoch": 2508} {"train_loss": -11.930532455444336, "global_step": 421401, "epoch": 2508} {"train_loss": -12.077914237976074, "global_step": 421402, "epoch": 2508} {"train_loss": -11.972000122070312, "global_step": 421403, "epoch": 2508} {"train_loss": -12.27685260772705, "global_step": 421404, "epoch": 2508} {"train_loss": -12.24180793762207, "global_step": 421405, "epoch": 2508} {"train_loss": -12.309174537658691, "global_step": 421406, "epoch": 2508} {"train_loss": -12.040070533752441, "global_step": 421407, "epoch": 2508} {"train_loss": -12.345714569091797, "global_step": 421408, "epoch": 2508} {"train_loss": -12.255542755126953, "global_step": 421409, "epoch": 2508} {"train_loss": -12.475364685058594, "global_step": 421410, "epoch": 2508} {"train_loss": -12.249357223510742, "global_step": 421411, "epoch": 2508} {"train_loss": -12.320369720458984, "global_step": 421412, "epoch": 2508} {"train_loss": -12.374532699584961, "global_step": 421413, "epoch": 2508} {"train_loss": -12.069961547851562, "global_step": 421414, "epoch": 2508} {"train_loss": -12.47850227355957, "global_step": 421415, "epoch": 2508} {"train_loss": -12.145256042480469, "global_step": 421416, "epoch": 2508} {"train_loss": -12.348920822143555, "global_step": 421417, "epoch": 2508} {"train_loss": -12.096405982971191, "global_step": 421418, "epoch": 2508} {"train_loss": -12.08868408203125, "global_step": 421419, "epoch": 2508} {"train_loss": -12.130598068237305, "global_step": 421420, "epoch": 2508} {"train_loss": -12.327255249023438, "global_step": 421421, "epoch": 2508} {"train_loss": -12.18027114868164, "global_step": 421422, "epoch": 2508} {"train_loss": -12.154001235961914, "global_step": 421423, "epoch": 2508} {"train_loss": -12.137563705444336, "global_step": 421424, "epoch": 2508} {"train_loss": -12.283482551574707, "global_step": 421425, "epoch": 2508} {"train_loss": -11.843098640441895, "global_step": 421426, "epoch": 2508} {"train_loss": -12.423337936401367, "global_step": 421427, "epoch": 2508} {"train_loss": -12.025056838989258, "global_step": 421428, "epoch": 2508} {"train_loss": -12.20917797088623, "global_step": 421429, "epoch": 2508} {"train_loss": -12.179463386535645, "global_step": 421430, "epoch": 2508} {"train_loss": -12.166248321533203, "global_step": 421431, "epoch": 2508} {"train_loss": -12.265955924987793, "global_step": 421432, "epoch": 2508} {"train_loss": -11.976685523986816, "global_step": 421433, "epoch": 2508} {"train_loss": -12.063047409057617, "global_step": 421434, "epoch": 2508} {"train_loss": -12.041704177856445, "global_step": 421435, "epoch": 2508} {"train_loss": -12.242364883422852, "global_step": 421436, "epoch": 2508} {"train_loss": -12.105485916137695, "global_step": 421437, "epoch": 2508} {"train_loss": -11.747665405273438, "global_step": 421438, "epoch": 2508} {"train_loss": -12.294836044311523, "global_step": 421439, "epoch": 2508} {"train_loss": -12.572193145751953, "global_step": 421440, "epoch": 2508} {"train_loss": -11.930020332336426, "global_step": 421441, "epoch": 2508} {"train_loss": -12.162513732910156, "global_step": 421442, "epoch": 2508} {"train_loss": -11.944368362426758, "global_step": 421443, "epoch": 2508} {"train_loss": -12.358591079711914, "global_step": 421444, "epoch": 2508} {"train_loss": -12.039481163024902, "global_step": 421445, "epoch": 2508} {"train_loss": -12.471138000488281, "global_step": 421446, "epoch": 2508} {"train_loss": -12.200058937072754, "global_step": 421447, "epoch": 2508} {"train_loss": -12.368539810180664, "global_step": 421448, "epoch": 2508} {"train_loss": -12.497777938842773, "global_step": 421449, "epoch": 2508} {"train_loss": -12.160049438476562, "global_step": 421450, "epoch": 2508} {"train_loss": -12.505518913269043, "global_step": 421451, "epoch": 2508} {"train_loss": -12.258341789245605, "global_step": 421452, "epoch": 2508} {"train_loss": -12.644760131835938, "global_step": 421453, "epoch": 2508} {"train_loss": -11.940896987915039, "global_step": 421454, "epoch": 2508} {"train_loss": -12.694725036621094, "global_step": 421455, "epoch": 2508} {"train_loss": -12.209007263183594, "global_step": 421456, "epoch": 2508} {"train_loss": -12.271007537841797, "global_step": 421457, "epoch": 2508} {"train_loss": -12.426178932189941, "global_step": 421458, "epoch": 2508} {"train_loss": -12.484139442443848, "global_step": 421459, "epoch": 2508} {"train_loss": -12.495620727539062, "global_step": 421460, "epoch": 2508} {"train_loss": -12.621728897094727, "global_step": 421461, "epoch": 2508} {"train_loss": -12.201177597045898, "global_step": 421462, "epoch": 2508} {"train_loss": -12.59458065032959, "global_step": 421463, "epoch": 2508} {"train_loss": -12.486473083496094, "global_step": 421464, "epoch": 2508} {"train_loss": -12.423080444335938, "global_step": 421465, "epoch": 2508} {"train_loss": -12.634944915771484, "global_step": 421466, "epoch": 2508} {"train_loss": -12.704924583435059, "global_step": 421467, "epoch": 2508} {"train_loss": -12.21334457397461, "global_step": 421468, "epoch": 2508} {"train_loss": -12.52231502532959, "global_step": 421469, "epoch": 2508} {"train_loss": -12.413909912109375, "global_step": 421470, "epoch": 2508} {"train_loss": -12.671976089477539, "global_step": 421471, "epoch": 2508} {"train_loss": -12.837896347045898, "global_step": 421472, "epoch": 2508} {"train_loss": -12.383622169494629, "global_step": 421473, "epoch": 2508} {"train_loss": -12.345351219177246, "global_step": 421474, "epoch": 2508} {"train_loss": -12.658672332763672, "global_step": 421475, "epoch": 2508} {"train_loss": -12.386466979980469, "global_step": 421476, "epoch": 2508} {"train_loss": -12.342092514038086, "global_step": 421477, "epoch": 2508} {"train_loss": -12.599453926086426, "global_step": 421478, "epoch": 2508} {"train_loss": -11.937944412231445, "global_step": 421479, "epoch": 2508} {"train_loss": -12.460004806518555, "global_step": 421480, "epoch": 2508} {"train_loss": -12.59033489227295, "global_step": 421481, "epoch": 2508} {"train_loss": -12.35127067565918, "global_step": 421482, "epoch": 2508} {"train_loss": -12.680510520935059, "global_step": 421483, "epoch": 2508} {"train_loss": -12.058727264404297, "global_step": 421484, "epoch": 2508} {"train_loss": -11.7958984375, "global_step": 421485, "epoch": 2508} {"train_loss": -12.136762619018555, "global_step": 421486, "epoch": 2508} {"train_loss": -11.965375900268555, "global_step": 421487, "epoch": 2508} {"train_loss": -12.271190643310547, "global_step": 421488, "epoch": 2508} {"train_loss": -12.045909881591797, "global_step": 421489, "epoch": 2508} {"train_loss": -11.934891700744629, "global_step": 421490, "epoch": 2508} {"train_loss": -11.993066787719727, "global_step": 421491, "epoch": 2508} {"train_loss": -11.741437911987305, "global_step": 421492, "epoch": 2508} {"train_loss": -11.862920761108398, "global_step": 421493, "epoch": 2508} {"train_loss": -11.983224868774414, "global_step": 421494, "epoch": 2508} {"train_loss": -12.156303405761719, "global_step": 421495, "epoch": 2508} {"train_loss": -11.783514022827148, "global_step": 421496, "epoch": 2508} {"train_loss": -12.000799179077148, "global_step": 421497, "epoch": 2508} {"train_loss": -11.946746826171875, "global_step": 421498, "epoch": 2508} {"train_loss": -11.96996021270752, "global_step": 421499, "epoch": 2508} {"train_loss": -12.515369415283203, "global_step": 421500, "epoch": 2508} {"train_loss": -12.279838562011719, "global_step": 421501, "epoch": 2508} {"train_loss": -12.56045150756836, "global_step": 421502, "epoch": 2508} {"train_loss": -12.13611125946045, "global_step": 421503, "epoch": 2508} {"train_loss": -12.613141059875488, "global_step": 421504, "epoch": 2508} {"train_loss": -12.538858413696289, "global_step": 421505, "epoch": 2508} {"train_loss": -12.522186279296875, "global_step": 421506, "epoch": 2508} {"train_loss": -11.686561584472656, "global_step": 421507, "epoch": 2508} {"train_loss": -12.47797679901123, "global_step": 421508, "epoch": 2508} {"train_loss": -12.550893783569336, "global_step": 421509, "epoch": 2508} {"train_loss": -12.140933990478516, "global_step": 421510, "epoch": 2508} {"train_loss": -12.047633290290833, "global_step": 421511, "epoch": 2508, "val_loss": 310797.8125} {"train_loss": -11.909214973449707, "global_step": 421512, "epoch": 2509} {"train_loss": -12.553171157836914, "global_step": 421513, "epoch": 2509} {"train_loss": -12.472335815429688, "global_step": 421514, "epoch": 2509} {"train_loss": -12.574577331542969, "global_step": 421515, "epoch": 2509} {"train_loss": -12.344573020935059, "global_step": 421516, "epoch": 2509} {"train_loss": -12.650646209716797, "global_step": 421517, "epoch": 2509} {"train_loss": -12.655694961547852, "global_step": 421518, "epoch": 2509} {"train_loss": -12.30672550201416, "global_step": 421519, "epoch": 2509} {"train_loss": -12.405200958251953, "global_step": 421520, "epoch": 2509} {"train_loss": -12.317317962646484, "global_step": 421521, "epoch": 2509} {"train_loss": -12.546257972717285, "global_step": 421522, "epoch": 2509} {"train_loss": -12.660493850708008, "global_step": 421523, "epoch": 2509} {"train_loss": -12.662055969238281, "global_step": 421524, "epoch": 2509} {"train_loss": -12.492246627807617, "global_step": 421525, "epoch": 2509} {"train_loss": -12.603696823120117, "global_step": 421526, "epoch": 2509} {"train_loss": -12.428182601928711, "global_step": 421527, "epoch": 2509} {"train_loss": -12.485925674438477, "global_step": 421528, "epoch": 2509} {"train_loss": -12.673188209533691, "global_step": 421529, "epoch": 2509} {"train_loss": -12.526183128356934, "global_step": 421530, "epoch": 2509} {"train_loss": -12.154850006103516, "global_step": 421531, "epoch": 2509} {"train_loss": -12.74344253540039, "global_step": 421532, "epoch": 2509} {"train_loss": -12.249314308166504, "global_step": 421533, "epoch": 2509} {"train_loss": -12.585066795349121, "global_step": 421534, "epoch": 2509} {"train_loss": -12.660989761352539, "global_step": 421535, "epoch": 2509} {"train_loss": -12.217409133911133, "global_step": 421536, "epoch": 2509} {"train_loss": -12.670392990112305, "global_step": 421537, "epoch": 2509} {"train_loss": -12.588135719299316, "global_step": 421538, "epoch": 2509} {"train_loss": -12.703773498535156, "global_step": 421539, "epoch": 2509} {"train_loss": -12.403321266174316, "global_step": 421540, "epoch": 2509} {"train_loss": -12.289937973022461, "global_step": 421541, "epoch": 2509} {"train_loss": -12.486733436584473, "global_step": 421542, "epoch": 2509} {"train_loss": -12.550314903259277, "global_step": 421543, "epoch": 2509} {"train_loss": -12.552831649780273, "global_step": 421544, "epoch": 2509} {"train_loss": -11.89404582977295, "global_step": 421545, "epoch": 2509} {"train_loss": -12.333839416503906, "global_step": 421546, "epoch": 2509} {"train_loss": -12.789413452148438, "global_step": 421547, "epoch": 2509} {"train_loss": -12.210341453552246, "global_step": 421548, "epoch": 2509} {"train_loss": -11.643783569335938, "global_step": 421549, "epoch": 2509} {"train_loss": -12.612384796142578, "global_step": 421550, "epoch": 2509} {"train_loss": -12.239806175231934, "global_step": 421551, "epoch": 2509} {"train_loss": -12.347190856933594, "global_step": 421552, "epoch": 2509} {"train_loss": -12.430397033691406, "global_step": 421553, "epoch": 2509} {"train_loss": -12.364405632019043, "global_step": 421554, "epoch": 2509} {"train_loss": -12.33376693725586, "global_step": 421555, "epoch": 2509} {"train_loss": -11.869901657104492, "global_step": 421556, "epoch": 2509} {"train_loss": -12.06125259399414, "global_step": 421557, "epoch": 2509} {"train_loss": -12.769753456115723, "global_step": 421558, "epoch": 2509} {"train_loss": -12.33963394165039, "global_step": 421559, "epoch": 2509} {"train_loss": -11.311858177185059, "global_step": 421560, "epoch": 2509} {"train_loss": -12.465415954589844, "global_step": 421561, "epoch": 2509} {"train_loss": -12.311426162719727, "global_step": 421562, "epoch": 2509} {"train_loss": -11.232599258422852, "global_step": 421563, "epoch": 2509} {"train_loss": -11.48757553100586, "global_step": 421564, "epoch": 2509} {"train_loss": -12.314970970153809, "global_step": 421565, "epoch": 2509} {"train_loss": -11.842425346374512, "global_step": 421566, "epoch": 2509} {"train_loss": -11.290922164916992, "global_step": 421567, "epoch": 2509} {"train_loss": -11.935608863830566, "global_step": 421568, "epoch": 2509} {"train_loss": -11.494186401367188, "global_step": 421569, "epoch": 2509} {"train_loss": -10.630847930908203, "global_step": 421570, "epoch": 2509} {"train_loss": -11.095752716064453, "global_step": 421571, "epoch": 2509} {"train_loss": -12.38333797454834, "global_step": 421572, "epoch": 2509} {"train_loss": -11.2474946975708, "global_step": 421573, "epoch": 2509} {"train_loss": -11.873666763305664, "global_step": 421574, "epoch": 2509} {"train_loss": -11.324188232421875, "global_step": 421575, "epoch": 2509} {"train_loss": -10.551578521728516, "global_step": 421576, "epoch": 2509} {"train_loss": -11.783284187316895, "global_step": 421577, "epoch": 2509} {"train_loss": -10.929848670959473, "global_step": 421578, "epoch": 2509} {"train_loss": -10.531224250793457, "global_step": 421579, "epoch": 2509} {"train_loss": -10.157913208007812, "global_step": 421580, "epoch": 2509} {"train_loss": -10.843748092651367, "global_step": 421581, "epoch": 2509} {"train_loss": -9.994338989257812, "global_step": 421582, "epoch": 2509} {"train_loss": -11.49618148803711, "global_step": 421583, "epoch": 2509} {"train_loss": -10.0939302444458, "global_step": 421584, "epoch": 2509} {"train_loss": -10.526771545410156, "global_step": 421585, "epoch": 2509} {"train_loss": -11.579984664916992, "global_step": 421586, "epoch": 2509} {"train_loss": -9.506265640258789, "global_step": 421587, "epoch": 2509} {"train_loss": -11.728927612304688, "global_step": 421588, "epoch": 2509} {"train_loss": -10.63535213470459, "global_step": 421589, "epoch": 2509} {"train_loss": -9.54531192779541, "global_step": 421590, "epoch": 2509} {"train_loss": -10.01534652709961, "global_step": 421591, "epoch": 2509} {"train_loss": -10.781572341918945, "global_step": 421592, "epoch": 2509} {"train_loss": -10.121066093444824, "global_step": 421593, "epoch": 2509} {"train_loss": -10.942359924316406, "global_step": 421594, "epoch": 2509} {"train_loss": -11.207513809204102, "global_step": 421595, "epoch": 2509} {"train_loss": -10.63966178894043, "global_step": 421596, "epoch": 2509} {"train_loss": -11.796754837036133, "global_step": 421597, "epoch": 2509} {"train_loss": -10.914134979248047, "global_step": 421598, "epoch": 2509} {"train_loss": -11.38970947265625, "global_step": 421599, "epoch": 2509} {"train_loss": -11.39293098449707, "global_step": 421600, "epoch": 2509} {"train_loss": -11.141897201538086, "global_step": 421601, "epoch": 2509} {"train_loss": -11.301923751831055, "global_step": 421602, "epoch": 2509} {"train_loss": -12.068439483642578, "global_step": 421603, "epoch": 2509} {"train_loss": -11.911890983581543, "global_step": 421604, "epoch": 2509} {"train_loss": -11.977262496948242, "global_step": 421605, "epoch": 2509} {"train_loss": -12.013757705688477, "global_step": 421606, "epoch": 2509} {"train_loss": -11.808239936828613, "global_step": 421607, "epoch": 2509} {"train_loss": -12.145112991333008, "global_step": 421608, "epoch": 2509} {"train_loss": -12.043052673339844, "global_step": 421609, "epoch": 2509} {"train_loss": -12.116792678833008, "global_step": 421610, "epoch": 2509} {"train_loss": -12.235851287841797, "global_step": 421611, "epoch": 2509} {"train_loss": -11.728723526000977, "global_step": 421612, "epoch": 2509} {"train_loss": -12.252620697021484, "global_step": 421613, "epoch": 2509} {"train_loss": -12.206594467163086, "global_step": 421614, "epoch": 2509} {"train_loss": -11.95936107635498, "global_step": 421615, "epoch": 2509} {"train_loss": -12.107486724853516, "global_step": 421616, "epoch": 2509} {"train_loss": -12.256368637084961, "global_step": 421617, "epoch": 2509} {"train_loss": -11.917864799499512, "global_step": 421618, "epoch": 2509} {"train_loss": -12.408702850341797, "global_step": 421619, "epoch": 2509} {"train_loss": -11.996002197265625, "global_step": 421620, "epoch": 2509} {"train_loss": -11.834096908569336, "global_step": 421621, "epoch": 2509} {"train_loss": -12.34440803527832, "global_step": 421622, "epoch": 2509} {"train_loss": -11.915247917175293, "global_step": 421623, "epoch": 2509} {"train_loss": -11.896190643310547, "global_step": 421624, "epoch": 2509} {"train_loss": -12.331811904907227, "global_step": 421625, "epoch": 2509} {"train_loss": -12.261697769165039, "global_step": 421626, "epoch": 2509} {"train_loss": -11.910629272460938, "global_step": 421627, "epoch": 2509} {"train_loss": -12.205577850341797, "global_step": 421628, "epoch": 2509} {"train_loss": -11.972433090209961, "global_step": 421629, "epoch": 2509} {"train_loss": -12.33930778503418, "global_step": 421630, "epoch": 2509} {"train_loss": -12.30445384979248, "global_step": 421631, "epoch": 2509} {"train_loss": -12.205175399780273, "global_step": 421632, "epoch": 2509} {"train_loss": -12.262174606323242, "global_step": 421633, "epoch": 2509} {"train_loss": -12.056559562683105, "global_step": 421634, "epoch": 2509} {"train_loss": -12.160067558288574, "global_step": 421635, "epoch": 2509} {"train_loss": -12.144914627075195, "global_step": 421636, "epoch": 2509} {"train_loss": -12.295524597167969, "global_step": 421637, "epoch": 2509} {"train_loss": -12.14168930053711, "global_step": 421638, "epoch": 2509} {"train_loss": -12.36822509765625, "global_step": 421639, "epoch": 2509} {"train_loss": -12.390816688537598, "global_step": 421640, "epoch": 2509} {"train_loss": -12.426631927490234, "global_step": 421641, "epoch": 2509} {"train_loss": -12.342672348022461, "global_step": 421642, "epoch": 2509} {"train_loss": -12.306452751159668, "global_step": 421643, "epoch": 2509} {"train_loss": -12.219602584838867, "global_step": 421644, "epoch": 2509} {"train_loss": -12.497091293334961, "global_step": 421645, "epoch": 2509} {"train_loss": -12.194238662719727, "global_step": 421646, "epoch": 2509} {"train_loss": -12.584144592285156, "global_step": 421647, "epoch": 2509} {"train_loss": -11.98785400390625, "global_step": 421648, "epoch": 2509} {"train_loss": -12.606021881103516, "global_step": 421649, "epoch": 2509} {"train_loss": -12.118630409240723, "global_step": 421650, "epoch": 2509} {"train_loss": -12.608949661254883, "global_step": 421651, "epoch": 2509} {"train_loss": -12.432140350341797, "global_step": 421652, "epoch": 2509} {"train_loss": -12.249326705932617, "global_step": 421653, "epoch": 2509} {"train_loss": -12.500868797302246, "global_step": 421654, "epoch": 2509} {"train_loss": -12.565727233886719, "global_step": 421655, "epoch": 2509} {"train_loss": -12.634468078613281, "global_step": 421656, "epoch": 2509} {"train_loss": -12.269989013671875, "global_step": 421657, "epoch": 2509} {"train_loss": -12.636516571044922, "global_step": 421658, "epoch": 2509} {"train_loss": -12.660507202148438, "global_step": 421659, "epoch": 2509} {"train_loss": -12.68707275390625, "global_step": 421660, "epoch": 2509} {"train_loss": -12.540742874145508, "global_step": 421661, "epoch": 2509} {"train_loss": -12.577072143554688, "global_step": 421662, "epoch": 2509} {"train_loss": -12.607451438903809, "global_step": 421663, "epoch": 2509} {"train_loss": -12.441567420959473, "global_step": 421664, "epoch": 2509} {"train_loss": -12.57137680053711, "global_step": 421665, "epoch": 2509} {"train_loss": -12.545074462890625, "global_step": 421666, "epoch": 2509} {"train_loss": -12.475353240966797, "global_step": 421667, "epoch": 2509} {"train_loss": -12.689676284790039, "global_step": 421668, "epoch": 2509} {"train_loss": -12.494399070739746, "global_step": 421669, "epoch": 2509} {"train_loss": -12.662751197814941, "global_step": 421670, "epoch": 2509} {"train_loss": -12.283796310424805, "global_step": 421671, "epoch": 2509} {"train_loss": -12.171222686767578, "global_step": 421672, "epoch": 2509} {"train_loss": -12.028768539428711, "global_step": 421673, "epoch": 2509} {"train_loss": -12.64526653289795, "global_step": 421674, "epoch": 2509} {"train_loss": -12.32209587097168, "global_step": 421675, "epoch": 2509} {"train_loss": -12.328326225280762, "global_step": 421676, "epoch": 2509} {"train_loss": -11.9321870803833, "global_step": 421677, "epoch": 2509} {"train_loss": -12.398983001708984, "global_step": 421678, "epoch": 2509} {"train_loss": -12.018344390959967, "global_step": 421679, "epoch": 2509, "val_loss": 312311.9375} {"train_loss": -12.133623123168945, "global_step": 421680, "epoch": 2510} {"train_loss": -12.320904731750488, "global_step": 421681, "epoch": 2510} {"train_loss": -12.320192337036133, "global_step": 421682, "epoch": 2510} {"train_loss": -12.244470596313477, "global_step": 421683, "epoch": 2510} {"train_loss": -12.310789108276367, "global_step": 421684, "epoch": 2510} {"train_loss": -12.071574211120605, "global_step": 421685, "epoch": 2510} {"train_loss": -11.915538787841797, "global_step": 421686, "epoch": 2510} {"train_loss": -11.665252685546875, "global_step": 421687, "epoch": 2510} {"train_loss": -12.034858703613281, "global_step": 421688, "epoch": 2510} {"train_loss": -12.490286827087402, "global_step": 421689, "epoch": 2510} {"train_loss": -12.507806777954102, "global_step": 421690, "epoch": 2510} {"train_loss": -12.132264137268066, "global_step": 421691, "epoch": 2510} {"train_loss": -12.421545028686523, "global_step": 421692, "epoch": 2510} {"train_loss": -12.417428970336914, "global_step": 421693, "epoch": 2510} {"train_loss": -11.92786693572998, "global_step": 421694, "epoch": 2510} {"train_loss": -12.159475326538086, "global_step": 421695, "epoch": 2510} {"train_loss": -12.368162155151367, "global_step": 421696, "epoch": 2510} {"train_loss": -12.475115776062012, "global_step": 421697, "epoch": 2510} {"train_loss": -11.799646377563477, "global_step": 421698, "epoch": 2510} {"train_loss": -12.345001220703125, "global_step": 421699, "epoch": 2510} {"train_loss": -11.623710632324219, "global_step": 421700, "epoch": 2510} {"train_loss": -12.092263221740723, "global_step": 421701, "epoch": 2510} {"train_loss": -11.05007553100586, "global_step": 421702, "epoch": 2510} {"train_loss": -12.01601791381836, "global_step": 421703, "epoch": 2510} {"train_loss": -12.428984642028809, "global_step": 421704, "epoch": 2510} {"train_loss": -11.533744812011719, "global_step": 421705, "epoch": 2510} {"train_loss": -12.562347412109375, "global_step": 421706, "epoch": 2510} {"train_loss": -11.510127067565918, "global_step": 421707, "epoch": 2510} {"train_loss": -11.850141525268555, "global_step": 421708, "epoch": 2510} {"train_loss": -11.865903854370117, "global_step": 421709, "epoch": 2510} {"train_loss": -11.233120918273926, "global_step": 421710, "epoch": 2510} {"train_loss": -11.32156753540039, "global_step": 421711, "epoch": 2510} {"train_loss": -11.988143920898438, "global_step": 421712, "epoch": 2510} {"train_loss": -11.374176025390625, "global_step": 421713, "epoch": 2510} {"train_loss": -11.923969268798828, "global_step": 421714, "epoch": 2510} {"train_loss": -11.534588813781738, "global_step": 421715, "epoch": 2510} {"train_loss": -10.984123229980469, "global_step": 421716, "epoch": 2510} {"train_loss": -11.502191543579102, "global_step": 421717, "epoch": 2510} {"train_loss": -10.072071075439453, "global_step": 421718, "epoch": 2510} {"train_loss": -10.44278335571289, "global_step": 421719, "epoch": 2510} {"train_loss": -12.250398635864258, "global_step": 421720, "epoch": 2510} {"train_loss": -9.519293785095215, "global_step": 421721, "epoch": 2510} {"train_loss": -11.551298141479492, "global_step": 421722, "epoch": 2510} {"train_loss": -10.377296447753906, "global_step": 421723, "epoch": 2510} {"train_loss": -11.337967872619629, "global_step": 421724, "epoch": 2510} {"train_loss": -11.351554870605469, "global_step": 421725, "epoch": 2510} {"train_loss": -11.531874656677246, "global_step": 421726, "epoch": 2510} {"train_loss": -10.977506637573242, "global_step": 421727, "epoch": 2510} {"train_loss": -11.768959999084473, "global_step": 421728, "epoch": 2510} {"train_loss": -11.883968353271484, "global_step": 421729, "epoch": 2510} {"train_loss": -11.170851707458496, "global_step": 421730, "epoch": 2510} {"train_loss": -12.172893524169922, "global_step": 421731, "epoch": 2510} {"train_loss": -10.959159851074219, "global_step": 421732, "epoch": 2510} {"train_loss": -11.86500358581543, "global_step": 421733, "epoch": 2510} {"train_loss": -10.474538803100586, "global_step": 421734, "epoch": 2510} {"train_loss": -11.791090965270996, "global_step": 421735, "epoch": 2510} {"train_loss": -10.103216171264648, "global_step": 421736, "epoch": 2510} {"train_loss": -11.595844268798828, "global_step": 421737, "epoch": 2510} {"train_loss": -9.7714204788208, "global_step": 421738, "epoch": 2510} {"train_loss": -10.1597900390625, "global_step": 421739, "epoch": 2510} {"train_loss": -11.088579177856445, "global_step": 421740, "epoch": 2510} {"train_loss": -10.465221405029297, "global_step": 421741, "epoch": 2510} {"train_loss": -10.992382049560547, "global_step": 421742, "epoch": 2510} {"train_loss": -10.912165641784668, "global_step": 421743, "epoch": 2510} {"train_loss": -11.138559341430664, "global_step": 421744, "epoch": 2510} {"train_loss": -10.44909954071045, "global_step": 421745, "epoch": 2510} {"train_loss": -11.592132568359375, "global_step": 421746, "epoch": 2510} {"train_loss": -10.805174827575684, "global_step": 421747, "epoch": 2510} {"train_loss": -11.838759422302246, "global_step": 421748, "epoch": 2510} {"train_loss": -11.43625545501709, "global_step": 421749, "epoch": 2510} {"train_loss": -12.002443313598633, "global_step": 421750, "epoch": 2510} {"train_loss": -11.593812942504883, "global_step": 421751, "epoch": 2510} {"train_loss": -11.717547416687012, "global_step": 421752, "epoch": 2510} {"train_loss": -11.464323043823242, "global_step": 421753, "epoch": 2510} {"train_loss": -11.915594100952148, "global_step": 421754, "epoch": 2510} {"train_loss": -11.968802452087402, "global_step": 421755, "epoch": 2510} {"train_loss": -11.41291618347168, "global_step": 421756, "epoch": 2510} {"train_loss": -12.149761199951172, "global_step": 421757, "epoch": 2510} {"train_loss": -11.726062774658203, "global_step": 421758, "epoch": 2510} {"train_loss": -12.053140640258789, "global_step": 421759, "epoch": 2510} {"train_loss": -11.965537071228027, "global_step": 421760, "epoch": 2510} {"train_loss": -12.151198387145996, "global_step": 421761, "epoch": 2510} {"train_loss": -11.977556228637695, "global_step": 421762, "epoch": 2510} {"train_loss": -12.229114532470703, "global_step": 421763, "epoch": 2510} {"train_loss": -12.149588584899902, "global_step": 421764, "epoch": 2510} {"train_loss": -12.109968185424805, "global_step": 421765, "epoch": 2510} {"train_loss": -12.32269287109375, "global_step": 421766, "epoch": 2510} {"train_loss": -12.3115234375, "global_step": 421767, "epoch": 2510} {"train_loss": -12.102108001708984, "global_step": 421768, "epoch": 2510} {"train_loss": -12.282687187194824, "global_step": 421769, "epoch": 2510} {"train_loss": -12.142576217651367, "global_step": 421770, "epoch": 2510} {"train_loss": -12.196290969848633, "global_step": 421771, "epoch": 2510} {"train_loss": -12.166145324707031, "global_step": 421772, "epoch": 2510} {"train_loss": -11.977832794189453, "global_step": 421773, "epoch": 2510} {"train_loss": -12.152185440063477, "global_step": 421774, "epoch": 2510} {"train_loss": -12.302903175354004, "global_step": 421775, "epoch": 2510} {"train_loss": -11.92678451538086, "global_step": 421776, "epoch": 2510} {"train_loss": -12.313403129577637, "global_step": 421777, "epoch": 2510} {"train_loss": -12.169668197631836, "global_step": 421778, "epoch": 2510} {"train_loss": -12.08001708984375, "global_step": 421779, "epoch": 2510} {"train_loss": -11.984053611755371, "global_step": 421780, "epoch": 2510} {"train_loss": -12.001993179321289, "global_step": 421781, "epoch": 2510} {"train_loss": -12.205280303955078, "global_step": 421782, "epoch": 2510} {"train_loss": -11.962972640991211, "global_step": 421783, "epoch": 2510} {"train_loss": -11.798175811767578, "global_step": 421784, "epoch": 2510} {"train_loss": -12.109428405761719, "global_step": 421785, "epoch": 2510} {"train_loss": -11.739086151123047, "global_step": 421786, "epoch": 2510} {"train_loss": -12.324554443359375, "global_step": 421787, "epoch": 2510} {"train_loss": -11.857810020446777, "global_step": 421788, "epoch": 2510} {"train_loss": -12.058443069458008, "global_step": 421789, "epoch": 2510} {"train_loss": -12.198051452636719, "global_step": 421790, "epoch": 2510} {"train_loss": -11.955350875854492, "global_step": 421791, "epoch": 2510} {"train_loss": -12.17758846282959, "global_step": 421792, "epoch": 2510} {"train_loss": -12.247062683105469, "global_step": 421793, "epoch": 2510} {"train_loss": -12.466489791870117, "global_step": 421794, "epoch": 2510} {"train_loss": -12.10940933227539, "global_step": 421795, "epoch": 2510} {"train_loss": -12.242843627929688, "global_step": 421796, "epoch": 2510} {"train_loss": -12.127549171447754, "global_step": 421797, "epoch": 2510} {"train_loss": -12.22127628326416, "global_step": 421798, "epoch": 2510} {"train_loss": -12.228052139282227, "global_step": 421799, "epoch": 2510} {"train_loss": -12.212059020996094, "global_step": 421800, "epoch": 2510} {"train_loss": -12.287370681762695, "global_step": 421801, "epoch": 2510} {"train_loss": -12.490751266479492, "global_step": 421802, "epoch": 2510} {"train_loss": -12.390536308288574, "global_step": 421803, "epoch": 2510} {"train_loss": -12.488702774047852, "global_step": 421804, "epoch": 2510} {"train_loss": -12.647632598876953, "global_step": 421805, "epoch": 2510} {"train_loss": -12.393056869506836, "global_step": 421806, "epoch": 2510} {"train_loss": -12.433172225952148, "global_step": 421807, "epoch": 2510} {"train_loss": -12.198923110961914, "global_step": 421808, "epoch": 2510} {"train_loss": -12.644960403442383, "global_step": 421809, "epoch": 2510} {"train_loss": -12.55461311340332, "global_step": 421810, "epoch": 2510} {"train_loss": -12.496981620788574, "global_step": 421811, "epoch": 2510} {"train_loss": -12.791975021362305, "global_step": 421812, "epoch": 2510} {"train_loss": -12.663078308105469, "global_step": 421813, "epoch": 2510} {"train_loss": -12.642755508422852, "global_step": 421814, "epoch": 2510} {"train_loss": -12.668865203857422, "global_step": 421815, "epoch": 2510} {"train_loss": -12.724653244018555, "global_step": 421816, "epoch": 2510} {"train_loss": -12.456621170043945, "global_step": 421817, "epoch": 2510} {"train_loss": -12.614750862121582, "global_step": 421818, "epoch": 2510} {"train_loss": -12.79036808013916, "global_step": 421819, "epoch": 2510} {"train_loss": -12.7672700881958, "global_step": 421820, "epoch": 2510} {"train_loss": -12.494316101074219, "global_step": 421821, "epoch": 2510} {"train_loss": -12.73430061340332, "global_step": 421822, "epoch": 2510} {"train_loss": -12.614089965820312, "global_step": 421823, "epoch": 2510} {"train_loss": -12.75274658203125, "global_step": 421824, "epoch": 2510} {"train_loss": -12.663068771362305, "global_step": 421825, "epoch": 2510} {"train_loss": -12.566269874572754, "global_step": 421826, "epoch": 2510} {"train_loss": -12.758291244506836, "global_step": 421827, "epoch": 2510} {"train_loss": -12.510409355163574, "global_step": 421828, "epoch": 2510} {"train_loss": -12.695558547973633, "global_step": 421829, "epoch": 2510} {"train_loss": -12.515897750854492, "global_step": 421830, "epoch": 2510} {"train_loss": -12.797262191772461, "global_step": 421831, "epoch": 2510} {"train_loss": -12.335451126098633, "global_step": 421832, "epoch": 2510} {"train_loss": -12.57912540435791, "global_step": 421833, "epoch": 2510} {"train_loss": -11.858924865722656, "global_step": 421834, "epoch": 2510} {"train_loss": -12.137495994567871, "global_step": 421835, "epoch": 2510} {"train_loss": -12.062295913696289, "global_step": 421836, "epoch": 2510} {"train_loss": -12.269414901733398, "global_step": 421837, "epoch": 2510} {"train_loss": -12.292684555053711, "global_step": 421838, "epoch": 2510} {"train_loss": -12.128678321838379, "global_step": 421839, "epoch": 2510} {"train_loss": -12.056727409362793, "global_step": 421840, "epoch": 2510} {"train_loss": -11.982419967651367, "global_step": 421841, "epoch": 2510} {"train_loss": -12.290987014770508, "global_step": 421842, "epoch": 2510} {"train_loss": -12.295113563537598, "global_step": 421843, "epoch": 2510} {"train_loss": -12.605119705200195, "global_step": 421844, "epoch": 2510} {"train_loss": -12.315187454223633, "global_step": 421845, "epoch": 2510} {"train_loss": -12.419300079345703, "global_step": 421846, "epoch": 2510} {"train_loss": -11.964117146673656, "global_step": 421847, "epoch": 2510, "val_loss": 308635.34375, "train_action_mse_error": 1.1006672382354736} {"train_loss": -12.325952529907227, "global_step": 421848, "epoch": 2511} {"train_loss": -12.29721450805664, "global_step": 421849, "epoch": 2511} {"train_loss": -12.26431655883789, "global_step": 421850, "epoch": 2511} {"train_loss": -12.377403259277344, "global_step": 421851, "epoch": 2511} {"train_loss": -12.580643653869629, "global_step": 421852, "epoch": 2511} {"train_loss": -12.509114265441895, "global_step": 421853, "epoch": 2511} {"train_loss": -12.652715682983398, "global_step": 421854, "epoch": 2511} {"train_loss": -12.644813537597656, "global_step": 421855, "epoch": 2511} {"train_loss": -12.683509826660156, "global_step": 421856, "epoch": 2511} {"train_loss": -12.66790771484375, "global_step": 421857, "epoch": 2511} {"train_loss": -12.484151840209961, "global_step": 421858, "epoch": 2511} {"train_loss": -12.483795166015625, "global_step": 421859, "epoch": 2511} {"train_loss": -12.605892181396484, "global_step": 421860, "epoch": 2511} {"train_loss": -12.690958023071289, "global_step": 421861, "epoch": 2511} {"train_loss": -12.388875961303711, "global_step": 421862, "epoch": 2511} {"train_loss": -12.169963836669922, "global_step": 421863, "epoch": 2511} {"train_loss": -12.487556457519531, "global_step": 421864, "epoch": 2511} {"train_loss": -12.539612770080566, "global_step": 421865, "epoch": 2511} {"train_loss": -12.949914932250977, "global_step": 421866, "epoch": 2511} {"train_loss": -12.444391250610352, "global_step": 421867, "epoch": 2511} {"train_loss": -12.129496574401855, "global_step": 421868, "epoch": 2511} {"train_loss": -12.58682918548584, "global_step": 421869, "epoch": 2511} {"train_loss": -12.44185733795166, "global_step": 421870, "epoch": 2511} {"train_loss": -12.234723091125488, "global_step": 421871, "epoch": 2511} {"train_loss": -12.616363525390625, "global_step": 421872, "epoch": 2511} {"train_loss": -12.50857925415039, "global_step": 421873, "epoch": 2511} {"train_loss": -11.988304138183594, "global_step": 421874, "epoch": 2511} {"train_loss": -11.70254135131836, "global_step": 421875, "epoch": 2511} {"train_loss": -12.051323890686035, "global_step": 421876, "epoch": 2511} {"train_loss": -12.38939094543457, "global_step": 421877, "epoch": 2511} {"train_loss": -11.418669700622559, "global_step": 421878, "epoch": 2511} {"train_loss": -12.018932342529297, "global_step": 421879, "epoch": 2511} {"train_loss": -12.279986381530762, "global_step": 421880, "epoch": 2511} {"train_loss": -11.82266616821289, "global_step": 421881, "epoch": 2511} {"train_loss": -11.799967765808105, "global_step": 421882, "epoch": 2511} {"train_loss": -12.13880729675293, "global_step": 421883, "epoch": 2511} {"train_loss": -12.35406494140625, "global_step": 421884, "epoch": 2511} {"train_loss": -11.942163467407227, "global_step": 421885, "epoch": 2511} {"train_loss": -11.48744010925293, "global_step": 421886, "epoch": 2511} {"train_loss": -11.802830696105957, "global_step": 421887, "epoch": 2511} {"train_loss": -12.091787338256836, "global_step": 421888, "epoch": 2511} {"train_loss": -11.793825149536133, "global_step": 421889, "epoch": 2511} {"train_loss": -11.706253051757812, "global_step": 421890, "epoch": 2511} {"train_loss": -12.397283554077148, "global_step": 421891, "epoch": 2511} {"train_loss": -11.260568618774414, "global_step": 421892, "epoch": 2511} {"train_loss": -10.979339599609375, "global_step": 421893, "epoch": 2511} {"train_loss": -11.325258255004883, "global_step": 421894, "epoch": 2511} {"train_loss": -12.299822807312012, "global_step": 421895, "epoch": 2511} {"train_loss": -11.495577812194824, "global_step": 421896, "epoch": 2511} {"train_loss": -12.033379554748535, "global_step": 421897, "epoch": 2511} {"train_loss": -11.849645614624023, "global_step": 421898, "epoch": 2511} {"train_loss": -11.67816162109375, "global_step": 421899, "epoch": 2511} {"train_loss": -11.957853317260742, "global_step": 421900, "epoch": 2511} {"train_loss": -11.382455825805664, "global_step": 421901, "epoch": 2511} {"train_loss": -11.86433219909668, "global_step": 421902, "epoch": 2511} {"train_loss": -11.98169994354248, "global_step": 421903, "epoch": 2511} {"train_loss": -11.861838340759277, "global_step": 421904, "epoch": 2511} {"train_loss": -11.669219970703125, "global_step": 421905, "epoch": 2511} {"train_loss": -12.111007690429688, "global_step": 421906, "epoch": 2511} {"train_loss": -11.629646301269531, "global_step": 421907, "epoch": 2511} {"train_loss": -12.199066162109375, "global_step": 421908, "epoch": 2511} {"train_loss": -11.088098526000977, "global_step": 421909, "epoch": 2511} {"train_loss": -11.977192878723145, "global_step": 421910, "epoch": 2511} {"train_loss": -11.72012996673584, "global_step": 421911, "epoch": 2511} {"train_loss": -11.645456314086914, "global_step": 421912, "epoch": 2511} {"train_loss": -11.980165481567383, "global_step": 421913, "epoch": 2511} {"train_loss": -12.172979354858398, "global_step": 421914, "epoch": 2511} {"train_loss": -11.301483154296875, "global_step": 421915, "epoch": 2511} {"train_loss": -12.125151634216309, "global_step": 421916, "epoch": 2511} {"train_loss": -11.407195091247559, "global_step": 421917, "epoch": 2511} {"train_loss": -11.730233192443848, "global_step": 421918, "epoch": 2511} {"train_loss": -11.779154777526855, "global_step": 421919, "epoch": 2511} {"train_loss": -11.483414649963379, "global_step": 421920, "epoch": 2511} {"train_loss": -12.193744659423828, "global_step": 421921, "epoch": 2511} {"train_loss": -11.774202346801758, "global_step": 421922, "epoch": 2511} {"train_loss": -12.397167205810547, "global_step": 421923, "epoch": 2511} {"train_loss": -11.814474105834961, "global_step": 421924, "epoch": 2511} {"train_loss": -12.132380485534668, "global_step": 421925, "epoch": 2511} {"train_loss": -11.959943771362305, "global_step": 421926, "epoch": 2511} {"train_loss": -12.303598403930664, "global_step": 421927, "epoch": 2511} {"train_loss": -12.091085433959961, "global_step": 421928, "epoch": 2511} {"train_loss": -11.967732429504395, "global_step": 421929, "epoch": 2511} {"train_loss": -12.071200370788574, "global_step": 421930, "epoch": 2511} {"train_loss": -11.812145233154297, "global_step": 421931, "epoch": 2511} {"train_loss": -12.267250061035156, "global_step": 421932, "epoch": 2511} {"train_loss": -12.222892761230469, "global_step": 421933, "epoch": 2511} {"train_loss": -11.778905868530273, "global_step": 421934, "epoch": 2511} {"train_loss": -12.209744453430176, "global_step": 421935, "epoch": 2511} {"train_loss": -11.990766525268555, "global_step": 421936, "epoch": 2511} {"train_loss": -12.327285766601562, "global_step": 421937, "epoch": 2511} {"train_loss": -12.077193260192871, "global_step": 421938, "epoch": 2511} {"train_loss": -12.011506080627441, "global_step": 421939, "epoch": 2511} {"train_loss": -12.195148468017578, "global_step": 421940, "epoch": 2511} {"train_loss": -12.057744026184082, "global_step": 421941, "epoch": 2511} {"train_loss": -12.085732460021973, "global_step": 421942, "epoch": 2511} {"train_loss": -12.258275985717773, "global_step": 421943, "epoch": 2511} {"train_loss": -12.19845962524414, "global_step": 421944, "epoch": 2511} {"train_loss": -12.340838432312012, "global_step": 421945, "epoch": 2511} {"train_loss": -11.999391555786133, "global_step": 421946, "epoch": 2511} {"train_loss": -12.2650785446167, "global_step": 421947, "epoch": 2511} {"train_loss": -12.134061813354492, "global_step": 421948, "epoch": 2511} {"train_loss": -12.371109008789062, "global_step": 421949, "epoch": 2511} {"train_loss": -12.387338638305664, "global_step": 421950, "epoch": 2511} {"train_loss": -12.292683601379395, "global_step": 421951, "epoch": 2511} {"train_loss": -12.238810539245605, "global_step": 421952, "epoch": 2511} {"train_loss": -12.421414375305176, "global_step": 421953, "epoch": 2511} {"train_loss": -12.320684432983398, "global_step": 421954, "epoch": 2511} {"train_loss": -12.37968635559082, "global_step": 421955, "epoch": 2511} {"train_loss": -12.54608154296875, "global_step": 421956, "epoch": 2511} {"train_loss": -12.472171783447266, "global_step": 421957, "epoch": 2511} {"train_loss": -12.758211135864258, "global_step": 421958, "epoch": 2511} {"train_loss": -12.430929183959961, "global_step": 421959, "epoch": 2511} {"train_loss": -12.542061805725098, "global_step": 421960, "epoch": 2511} {"train_loss": -12.594700813293457, "global_step": 421961, "epoch": 2511} {"train_loss": -12.25446891784668, "global_step": 421962, "epoch": 2511} {"train_loss": -12.350994110107422, "global_step": 421963, "epoch": 2511} {"train_loss": -12.780981063842773, "global_step": 421964, "epoch": 2511} {"train_loss": -12.35495376586914, "global_step": 421965, "epoch": 2511} {"train_loss": -12.171142578125, "global_step": 421966, "epoch": 2511} {"train_loss": -12.301718711853027, "global_step": 421967, "epoch": 2511} {"train_loss": -12.034385681152344, "global_step": 421968, "epoch": 2511} {"train_loss": -12.398981094360352, "global_step": 421969, "epoch": 2511} {"train_loss": -12.185340881347656, "global_step": 421970, "epoch": 2511} {"train_loss": -12.10226058959961, "global_step": 421971, "epoch": 2511} {"train_loss": -12.740528106689453, "global_step": 421972, "epoch": 2511} {"train_loss": -11.864717483520508, "global_step": 421973, "epoch": 2511} {"train_loss": -12.535711288452148, "global_step": 421974, "epoch": 2511} {"train_loss": -12.296363830566406, "global_step": 421975, "epoch": 2511} {"train_loss": -12.299152374267578, "global_step": 421976, "epoch": 2511} {"train_loss": -12.437507629394531, "global_step": 421977, "epoch": 2511} {"train_loss": -11.936568260192871, "global_step": 421978, "epoch": 2511} {"train_loss": -12.644756317138672, "global_step": 421979, "epoch": 2511} {"train_loss": -12.397875785827637, "global_step": 421980, "epoch": 2511} {"train_loss": -12.563629150390625, "global_step": 421981, "epoch": 2511} {"train_loss": -12.5264892578125, "global_step": 421982, "epoch": 2511} {"train_loss": -12.704203605651855, "global_step": 421983, "epoch": 2511} {"train_loss": -12.622749328613281, "global_step": 421984, "epoch": 2511} {"train_loss": -12.638479232788086, "global_step": 421985, "epoch": 2511} {"train_loss": -12.565895080566406, "global_step": 421986, "epoch": 2511} {"train_loss": -12.623021125793457, "global_step": 421987, "epoch": 2511} {"train_loss": -12.432908058166504, "global_step": 421988, "epoch": 2511} {"train_loss": -12.459121704101562, "global_step": 421989, "epoch": 2511} {"train_loss": -12.078485488891602, "global_step": 421990, "epoch": 2511} {"train_loss": -12.297046661376953, "global_step": 421991, "epoch": 2511} {"train_loss": -11.797078132629395, "global_step": 421992, "epoch": 2511} {"train_loss": -12.506500244140625, "global_step": 421993, "epoch": 2511} {"train_loss": -12.20643424987793, "global_step": 421994, "epoch": 2511} {"train_loss": -12.2029390335083, "global_step": 421995, "epoch": 2511} {"train_loss": -12.156204223632812, "global_step": 421996, "epoch": 2511} {"train_loss": -11.706637382507324, "global_step": 421997, "epoch": 2511} {"train_loss": -12.280431747436523, "global_step": 421998, "epoch": 2511} {"train_loss": -12.044044494628906, "global_step": 421999, "epoch": 2511} {"train_loss": -12.132197380065918, "global_step": 422000, "epoch": 2511} {"train_loss": -12.650689125061035, "global_step": 422001, "epoch": 2511} {"train_loss": -12.28188705444336, "global_step": 422002, "epoch": 2511} {"train_loss": -12.50032901763916, "global_step": 422003, "epoch": 2511} {"train_loss": -11.92444896697998, "global_step": 422004, "epoch": 2511} {"train_loss": -11.855476379394531, "global_step": 422005, "epoch": 2511} {"train_loss": -12.273504257202148, "global_step": 422006, "epoch": 2511} {"train_loss": -12.217409133911133, "global_step": 422007, "epoch": 2511} {"train_loss": -12.580150604248047, "global_step": 422008, "epoch": 2511} {"train_loss": -12.378379821777344, "global_step": 422009, "epoch": 2511} {"train_loss": -12.487139701843262, "global_step": 422010, "epoch": 2511} {"train_loss": -12.577327728271484, "global_step": 422011, "epoch": 2511} {"train_loss": -11.926794052124023, "global_step": 422012, "epoch": 2511} {"train_loss": -12.263063430786133, "global_step": 422013, "epoch": 2511} {"train_loss": -12.30984878540039, "global_step": 422014, "epoch": 2511} {"train_loss": -12.177853459403629, "global_step": 422015, "epoch": 2511, "val_loss": 308621.9375} {"train_loss": -12.196329116821289, "global_step": 422016, "epoch": 2512} {"train_loss": -12.344989776611328, "global_step": 422017, "epoch": 2512} {"train_loss": -12.210271835327148, "global_step": 422018, "epoch": 2512} {"train_loss": -12.583172798156738, "global_step": 422019, "epoch": 2512} {"train_loss": -12.763360977172852, "global_step": 422020, "epoch": 2512} {"train_loss": -12.567359924316406, "global_step": 422021, "epoch": 2512} {"train_loss": -12.576736450195312, "global_step": 422022, "epoch": 2512} {"train_loss": -12.397781372070312, "global_step": 422023, "epoch": 2512} {"train_loss": -12.563896179199219, "global_step": 422024, "epoch": 2512} {"train_loss": -12.359702110290527, "global_step": 422025, "epoch": 2512} {"train_loss": -12.518216133117676, "global_step": 422026, "epoch": 2512} {"train_loss": -12.197498321533203, "global_step": 422027, "epoch": 2512} {"train_loss": -12.524791717529297, "global_step": 422028, "epoch": 2512} {"train_loss": -12.169439315795898, "global_step": 422029, "epoch": 2512} {"train_loss": -12.367015838623047, "global_step": 422030, "epoch": 2512} {"train_loss": -12.361791610717773, "global_step": 422031, "epoch": 2512} {"train_loss": -12.423375129699707, "global_step": 422032, "epoch": 2512} {"train_loss": -12.680490493774414, "global_step": 422033, "epoch": 2512} {"train_loss": -12.600931167602539, "global_step": 422034, "epoch": 2512} {"train_loss": -12.611234664916992, "global_step": 422035, "epoch": 2512} {"train_loss": -12.591235160827637, "global_step": 422036, "epoch": 2512} {"train_loss": -12.734859466552734, "global_step": 422037, "epoch": 2512} {"train_loss": -12.624101638793945, "global_step": 422038, "epoch": 2512} {"train_loss": -12.646638870239258, "global_step": 422039, "epoch": 2512} {"train_loss": -12.382349014282227, "global_step": 422040, "epoch": 2512} {"train_loss": -12.458111763000488, "global_step": 422041, "epoch": 2512} {"train_loss": -11.566792488098145, "global_step": 422042, "epoch": 2512} {"train_loss": -12.602851867675781, "global_step": 422043, "epoch": 2512} {"train_loss": -11.994424819946289, "global_step": 422044, "epoch": 2512} {"train_loss": -11.350300788879395, "global_step": 422045, "epoch": 2512} {"train_loss": -11.48554515838623, "global_step": 422046, "epoch": 2512} {"train_loss": -11.58984661102295, "global_step": 422047, "epoch": 2512} {"train_loss": -11.15878677368164, "global_step": 422048, "epoch": 2512} {"train_loss": -12.122557640075684, "global_step": 422049, "epoch": 2512} {"train_loss": -11.299142837524414, "global_step": 422050, "epoch": 2512} {"train_loss": -11.666730880737305, "global_step": 422051, "epoch": 2512} {"train_loss": -10.110284805297852, "global_step": 422052, "epoch": 2512} {"train_loss": -12.00152587890625, "global_step": 422053, "epoch": 2512} {"train_loss": -10.590198516845703, "global_step": 422054, "epoch": 2512} {"train_loss": -11.357500076293945, "global_step": 422055, "epoch": 2512} {"train_loss": -11.40927791595459, "global_step": 422056, "epoch": 2512} {"train_loss": -10.442564964294434, "global_step": 422057, "epoch": 2512} {"train_loss": -11.470608711242676, "global_step": 422058, "epoch": 2512} {"train_loss": -9.888829231262207, "global_step": 422059, "epoch": 2512} {"train_loss": -10.928948402404785, "global_step": 422060, "epoch": 2512} {"train_loss": -11.675739288330078, "global_step": 422061, "epoch": 2512} {"train_loss": -10.817100524902344, "global_step": 422062, "epoch": 2512} {"train_loss": -12.137407302856445, "global_step": 422063, "epoch": 2512} {"train_loss": -10.85661506652832, "global_step": 422064, "epoch": 2512} {"train_loss": -11.821929931640625, "global_step": 422065, "epoch": 2512} {"train_loss": -11.851144790649414, "global_step": 422066, "epoch": 2512} {"train_loss": -11.98510456085205, "global_step": 422067, "epoch": 2512} {"train_loss": -11.668704986572266, "global_step": 422068, "epoch": 2512} {"train_loss": -11.767593383789062, "global_step": 422069, "epoch": 2512} {"train_loss": -11.862924575805664, "global_step": 422070, "epoch": 2512} {"train_loss": -11.675482749938965, "global_step": 422071, "epoch": 2512} {"train_loss": -12.01231575012207, "global_step": 422072, "epoch": 2512} {"train_loss": -11.96961784362793, "global_step": 422073, "epoch": 2512} {"train_loss": -11.668207168579102, "global_step": 422074, "epoch": 2512} {"train_loss": -12.192859649658203, "global_step": 422075, "epoch": 2512} {"train_loss": -12.164501190185547, "global_step": 422076, "epoch": 2512} {"train_loss": -12.27374267578125, "global_step": 422077, "epoch": 2512} {"train_loss": -12.253250122070312, "global_step": 422078, "epoch": 2512} {"train_loss": -12.45389175415039, "global_step": 422079, "epoch": 2512} {"train_loss": -12.469488143920898, "global_step": 422080, "epoch": 2512} {"train_loss": -12.50396728515625, "global_step": 422081, "epoch": 2512} {"train_loss": -12.31892204284668, "global_step": 422082, "epoch": 2512} {"train_loss": -12.483369827270508, "global_step": 422083, "epoch": 2512} {"train_loss": -12.385377883911133, "global_step": 422084, "epoch": 2512} {"train_loss": -12.347569465637207, "global_step": 422085, "epoch": 2512} {"train_loss": -12.411524772644043, "global_step": 422086, "epoch": 2512} {"train_loss": -12.348859786987305, "global_step": 422087, "epoch": 2512} {"train_loss": -12.580839157104492, "global_step": 422088, "epoch": 2512} {"train_loss": -12.266895294189453, "global_step": 422089, "epoch": 2512} {"train_loss": -12.480611801147461, "global_step": 422090, "epoch": 2512} {"train_loss": -12.449206352233887, "global_step": 422091, "epoch": 2512} {"train_loss": -12.21776008605957, "global_step": 422092, "epoch": 2512} {"train_loss": -12.497719764709473, "global_step": 422093, "epoch": 2512} {"train_loss": -12.23196029663086, "global_step": 422094, "epoch": 2512} {"train_loss": -12.219980239868164, "global_step": 422095, "epoch": 2512} {"train_loss": -12.705196380615234, "global_step": 422096, "epoch": 2512} {"train_loss": -12.41887092590332, "global_step": 422097, "epoch": 2512} {"train_loss": -12.534323692321777, "global_step": 422098, "epoch": 2512} {"train_loss": -12.240767478942871, "global_step": 422099, "epoch": 2512} {"train_loss": -12.384361267089844, "global_step": 422100, "epoch": 2512} {"train_loss": -12.341856002807617, "global_step": 422101, "epoch": 2512} {"train_loss": -11.980782508850098, "global_step": 422102, "epoch": 2512} {"train_loss": -12.164438247680664, "global_step": 422103, "epoch": 2512} {"train_loss": -12.178024291992188, "global_step": 422104, "epoch": 2512} {"train_loss": -11.339250564575195, "global_step": 422105, "epoch": 2512} {"train_loss": -12.569584846496582, "global_step": 422106, "epoch": 2512} {"train_loss": -11.498058319091797, "global_step": 422107, "epoch": 2512} {"train_loss": -11.74195671081543, "global_step": 422108, "epoch": 2512} {"train_loss": -12.567192077636719, "global_step": 422109, "epoch": 2512} {"train_loss": -11.241230964660645, "global_step": 422110, "epoch": 2512} {"train_loss": -11.449020385742188, "global_step": 422111, "epoch": 2512} {"train_loss": -12.425994873046875, "global_step": 422112, "epoch": 2512} {"train_loss": -10.888273239135742, "global_step": 422113, "epoch": 2512} {"train_loss": -11.611692428588867, "global_step": 422114, "epoch": 2512} {"train_loss": -11.951018333435059, "global_step": 422115, "epoch": 2512} {"train_loss": -11.354190826416016, "global_step": 422116, "epoch": 2512} {"train_loss": -10.903603553771973, "global_step": 422117, "epoch": 2512} {"train_loss": -12.016716003417969, "global_step": 422118, "epoch": 2512} {"train_loss": -9.209193229675293, "global_step": 422119, "epoch": 2512} {"train_loss": -12.035955429077148, "global_step": 422120, "epoch": 2512} {"train_loss": -10.600980758666992, "global_step": 422121, "epoch": 2512} {"train_loss": -11.389984130859375, "global_step": 422122, "epoch": 2512} {"train_loss": -10.153861045837402, "global_step": 422123, "epoch": 2512} {"train_loss": -10.784280776977539, "global_step": 422124, "epoch": 2512} {"train_loss": -9.051774978637695, "global_step": 422125, "epoch": 2512} {"train_loss": -11.667083740234375, "global_step": 422126, "epoch": 2512} {"train_loss": -10.141355514526367, "global_step": 422127, "epoch": 2512} {"train_loss": -10.222332000732422, "global_step": 422128, "epoch": 2512} {"train_loss": -10.817258834838867, "global_step": 422129, "epoch": 2512} {"train_loss": -11.47508430480957, "global_step": 422130, "epoch": 2512} {"train_loss": -11.58405876159668, "global_step": 422131, "epoch": 2512} {"train_loss": -11.241432189941406, "global_step": 422132, "epoch": 2512} {"train_loss": -10.992902755737305, "global_step": 422133, "epoch": 2512} {"train_loss": -11.541730880737305, "global_step": 422134, "epoch": 2512} {"train_loss": -11.532849311828613, "global_step": 422135, "epoch": 2512} {"train_loss": -11.67110824584961, "global_step": 422136, "epoch": 2512} {"train_loss": -11.497818946838379, "global_step": 422137, "epoch": 2512} {"train_loss": -10.82841968536377, "global_step": 422138, "epoch": 2512} {"train_loss": -11.816333770751953, "global_step": 422139, "epoch": 2512} {"train_loss": -11.56450080871582, "global_step": 422140, "epoch": 2512} {"train_loss": -12.00654411315918, "global_step": 422141, "epoch": 2512} {"train_loss": -10.942048072814941, "global_step": 422142, "epoch": 2512} {"train_loss": -12.064617156982422, "global_step": 422143, "epoch": 2512} {"train_loss": -10.86130142211914, "global_step": 422144, "epoch": 2512} {"train_loss": -12.365192413330078, "global_step": 422145, "epoch": 2512} {"train_loss": -10.655938148498535, "global_step": 422146, "epoch": 2512} {"train_loss": -12.153059959411621, "global_step": 422147, "epoch": 2512} {"train_loss": -11.158048629760742, "global_step": 422148, "epoch": 2512} {"train_loss": -12.061588287353516, "global_step": 422149, "epoch": 2512} {"train_loss": -11.762717247009277, "global_step": 422150, "epoch": 2512} {"train_loss": -12.21932315826416, "global_step": 422151, "epoch": 2512} {"train_loss": -11.770028114318848, "global_step": 422152, "epoch": 2512} {"train_loss": -12.377166748046875, "global_step": 422153, "epoch": 2512} {"train_loss": -12.165082931518555, "global_step": 422154, "epoch": 2512} {"train_loss": -12.36277961730957, "global_step": 422155, "epoch": 2512} {"train_loss": -12.083757400512695, "global_step": 422156, "epoch": 2512} {"train_loss": -12.33255386352539, "global_step": 422157, "epoch": 2512} {"train_loss": -12.3548002243042, "global_step": 422158, "epoch": 2512} {"train_loss": -12.319428443908691, "global_step": 422159, "epoch": 2512} {"train_loss": -12.224385261535645, "global_step": 422160, "epoch": 2512} {"train_loss": -12.481090545654297, "global_step": 422161, "epoch": 2512} {"train_loss": -12.2327880859375, "global_step": 422162, "epoch": 2512} {"train_loss": -12.256973266601562, "global_step": 422163, "epoch": 2512} {"train_loss": -12.350166320800781, "global_step": 422164, "epoch": 2512} {"train_loss": -12.392478942871094, "global_step": 422165, "epoch": 2512} {"train_loss": -12.572467803955078, "global_step": 422166, "epoch": 2512} {"train_loss": -12.59611701965332, "global_step": 422167, "epoch": 2512} {"train_loss": -12.254634857177734, "global_step": 422168, "epoch": 2512} {"train_loss": -12.462175369262695, "global_step": 422169, "epoch": 2512} {"train_loss": -12.541421890258789, "global_step": 422170, "epoch": 2512} {"train_loss": -12.439099311828613, "global_step": 422171, "epoch": 2512} {"train_loss": -12.367981910705566, "global_step": 422172, "epoch": 2512} {"train_loss": -12.581327438354492, "global_step": 422173, "epoch": 2512} {"train_loss": -12.339009284973145, "global_step": 422174, "epoch": 2512} {"train_loss": -12.414487838745117, "global_step": 422175, "epoch": 2512} {"train_loss": -12.495662689208984, "global_step": 422176, "epoch": 2512} {"train_loss": -12.463041305541992, "global_step": 422177, "epoch": 2512} {"train_loss": -12.449894905090332, "global_step": 422178, "epoch": 2512} {"train_loss": -12.582778930664062, "global_step": 422179, "epoch": 2512} {"train_loss": -12.503730773925781, "global_step": 422180, "epoch": 2512} {"train_loss": -12.545381546020508, "global_step": 422181, "epoch": 2512} {"train_loss": -12.427936553955078, "global_step": 422182, "epoch": 2512} {"train_loss": -11.925909661111378, "global_step": 422183, "epoch": 2512, "val_loss": 305770.8125} {"train_loss": -12.53647232055664, "global_step": 422184, "epoch": 2513} {"train_loss": -12.0869140625, "global_step": 422185, "epoch": 2513} {"train_loss": -12.579841613769531, "global_step": 422186, "epoch": 2513} {"train_loss": -11.745838165283203, "global_step": 422187, "epoch": 2513} {"train_loss": -12.479133605957031, "global_step": 422188, "epoch": 2513} {"train_loss": -12.221755981445312, "global_step": 422189, "epoch": 2513} {"train_loss": -12.466065406799316, "global_step": 422190, "epoch": 2513} {"train_loss": -12.210817337036133, "global_step": 422191, "epoch": 2513} {"train_loss": -11.70895767211914, "global_step": 422192, "epoch": 2513} {"train_loss": -12.33806037902832, "global_step": 422193, "epoch": 2513} {"train_loss": -12.32914924621582, "global_step": 422194, "epoch": 2513} {"train_loss": -11.903464317321777, "global_step": 422195, "epoch": 2513} {"train_loss": -12.466419219970703, "global_step": 422196, "epoch": 2513} {"train_loss": -12.452577590942383, "global_step": 422197, "epoch": 2513} {"train_loss": -12.486283302307129, "global_step": 422198, "epoch": 2513} {"train_loss": -12.57215690612793, "global_step": 422199, "epoch": 2513} {"train_loss": -12.165817260742188, "global_step": 422200, "epoch": 2513} {"train_loss": -12.19116497039795, "global_step": 422201, "epoch": 2513} {"train_loss": -12.806859970092773, "global_step": 422202, "epoch": 2513} {"train_loss": -12.18326187133789, "global_step": 422203, "epoch": 2513} {"train_loss": -12.370805740356445, "global_step": 422204, "epoch": 2513} {"train_loss": -12.492219924926758, "global_step": 422205, "epoch": 2513} {"train_loss": -12.156604766845703, "global_step": 422206, "epoch": 2513} {"train_loss": -12.579498291015625, "global_step": 422207, "epoch": 2513} {"train_loss": -12.431358337402344, "global_step": 422208, "epoch": 2513} {"train_loss": -12.084871292114258, "global_step": 422209, "epoch": 2513} {"train_loss": -12.685007095336914, "global_step": 422210, "epoch": 2513} {"train_loss": -12.34273910522461, "global_step": 422211, "epoch": 2513} {"train_loss": -12.370177268981934, "global_step": 422212, "epoch": 2513} {"train_loss": -12.439956665039062, "global_step": 422213, "epoch": 2513} {"train_loss": -12.373601913452148, "global_step": 422214, "epoch": 2513} {"train_loss": -12.405162811279297, "global_step": 422215, "epoch": 2513} {"train_loss": -12.62641429901123, "global_step": 422216, "epoch": 2513} {"train_loss": -12.618712425231934, "global_step": 422217, "epoch": 2513} {"train_loss": -12.16057014465332, "global_step": 422218, "epoch": 2513} {"train_loss": -12.346090316772461, "global_step": 422219, "epoch": 2513} {"train_loss": -12.375144958496094, "global_step": 422220, "epoch": 2513} {"train_loss": -12.567955017089844, "global_step": 422221, "epoch": 2513} {"train_loss": -12.551530838012695, "global_step": 422222, "epoch": 2513} {"train_loss": -12.493151664733887, "global_step": 422223, "epoch": 2513} {"train_loss": -12.388948440551758, "global_step": 422224, "epoch": 2513} {"train_loss": -12.193671226501465, "global_step": 422225, "epoch": 2513} {"train_loss": -12.572769165039062, "global_step": 422226, "epoch": 2513} {"train_loss": -12.25418472290039, "global_step": 422227, "epoch": 2513} {"train_loss": -12.625919342041016, "global_step": 422228, "epoch": 2513} {"train_loss": -12.16881275177002, "global_step": 422229, "epoch": 2513} {"train_loss": -12.46539306640625, "global_step": 422230, "epoch": 2513} {"train_loss": -12.144123077392578, "global_step": 422231, "epoch": 2513} {"train_loss": -12.373106956481934, "global_step": 422232, "epoch": 2513} {"train_loss": -12.225430488586426, "global_step": 422233, "epoch": 2513} {"train_loss": -12.517993927001953, "global_step": 422234, "epoch": 2513} {"train_loss": -12.15024185180664, "global_step": 422235, "epoch": 2513} {"train_loss": -12.099760055541992, "global_step": 422236, "epoch": 2513} {"train_loss": -12.56907844543457, "global_step": 422237, "epoch": 2513} {"train_loss": -12.677061080932617, "global_step": 422238, "epoch": 2513} {"train_loss": -12.659749031066895, "global_step": 422239, "epoch": 2513} {"train_loss": -12.620292663574219, "global_step": 422240, "epoch": 2513} {"train_loss": -12.607131004333496, "global_step": 422241, "epoch": 2513} {"train_loss": -12.580812454223633, "global_step": 422242, "epoch": 2513} {"train_loss": -12.713991165161133, "global_step": 422243, "epoch": 2513} {"train_loss": -12.230267524719238, "global_step": 422244, "epoch": 2513} {"train_loss": -12.744430541992188, "global_step": 422245, "epoch": 2513} {"train_loss": -12.44336986541748, "global_step": 422246, "epoch": 2513} {"train_loss": -12.108842849731445, "global_step": 422247, "epoch": 2513} {"train_loss": -12.70537281036377, "global_step": 422248, "epoch": 2513} {"train_loss": -12.567560195922852, "global_step": 422249, "epoch": 2513} {"train_loss": -11.645345687866211, "global_step": 422250, "epoch": 2513} {"train_loss": -12.328588485717773, "global_step": 422251, "epoch": 2513} {"train_loss": -12.29311752319336, "global_step": 422252, "epoch": 2513} {"train_loss": -11.786615371704102, "global_step": 422253, "epoch": 2513} {"train_loss": -12.26502799987793, "global_step": 422254, "epoch": 2513} {"train_loss": -12.010414123535156, "global_step": 422255, "epoch": 2513} {"train_loss": -11.999067306518555, "global_step": 422256, "epoch": 2513} {"train_loss": -12.118429183959961, "global_step": 422257, "epoch": 2513} {"train_loss": -11.69217586517334, "global_step": 422258, "epoch": 2513} {"train_loss": -12.6211576461792, "global_step": 422259, "epoch": 2513} {"train_loss": -11.74354076385498, "global_step": 422260, "epoch": 2513} {"train_loss": -12.137458801269531, "global_step": 422261, "epoch": 2513} {"train_loss": -12.450407028198242, "global_step": 422262, "epoch": 2513} {"train_loss": -11.678960800170898, "global_step": 422263, "epoch": 2513} {"train_loss": -12.31894588470459, "global_step": 422264, "epoch": 2513} {"train_loss": -12.183719635009766, "global_step": 422265, "epoch": 2513} {"train_loss": -11.935260772705078, "global_step": 422266, "epoch": 2513} {"train_loss": -12.4887113571167, "global_step": 422267, "epoch": 2513} {"train_loss": -12.179420471191406, "global_step": 422268, "epoch": 2513} {"train_loss": -12.342580795288086, "global_step": 422269, "epoch": 2513} {"train_loss": -12.408419609069824, "global_step": 422270, "epoch": 2513} {"train_loss": -12.523168563842773, "global_step": 422271, "epoch": 2513} {"train_loss": -12.128524780273438, "global_step": 422272, "epoch": 2513} {"train_loss": -11.5997953414917, "global_step": 422273, "epoch": 2513} {"train_loss": -12.091259002685547, "global_step": 422274, "epoch": 2513} {"train_loss": -11.304607391357422, "global_step": 422275, "epoch": 2513} {"train_loss": -11.648611068725586, "global_step": 422276, "epoch": 2513} {"train_loss": -12.209348678588867, "global_step": 422277, "epoch": 2513} {"train_loss": -11.477624893188477, "global_step": 422278, "epoch": 2513} {"train_loss": -12.094810485839844, "global_step": 422279, "epoch": 2513} {"train_loss": -12.347105026245117, "global_step": 422280, "epoch": 2513} {"train_loss": -11.706945419311523, "global_step": 422281, "epoch": 2513} {"train_loss": -12.306110382080078, "global_step": 422282, "epoch": 2513} {"train_loss": -12.054058074951172, "global_step": 422283, "epoch": 2513} {"train_loss": -11.737706184387207, "global_step": 422284, "epoch": 2513} {"train_loss": -12.631855010986328, "global_step": 422285, "epoch": 2513} {"train_loss": -11.909238815307617, "global_step": 422286, "epoch": 2513} {"train_loss": -12.12703800201416, "global_step": 422287, "epoch": 2513} {"train_loss": -12.163551330566406, "global_step": 422288, "epoch": 2513} {"train_loss": -12.147428512573242, "global_step": 422289, "epoch": 2513} {"train_loss": -11.724273681640625, "global_step": 422290, "epoch": 2513} {"train_loss": -12.372674942016602, "global_step": 422291, "epoch": 2513} {"train_loss": -11.613458633422852, "global_step": 422292, "epoch": 2513} {"train_loss": -11.901408195495605, "global_step": 422293, "epoch": 2513} {"train_loss": -12.265989303588867, "global_step": 422294, "epoch": 2513} {"train_loss": -12.11861801147461, "global_step": 422295, "epoch": 2513} {"train_loss": -12.321067810058594, "global_step": 422296, "epoch": 2513} {"train_loss": -12.69839859008789, "global_step": 422297, "epoch": 2513} {"train_loss": -12.169353485107422, "global_step": 422298, "epoch": 2513} {"train_loss": -12.508415222167969, "global_step": 422299, "epoch": 2513} {"train_loss": -12.187494277954102, "global_step": 422300, "epoch": 2513} {"train_loss": -12.49285888671875, "global_step": 422301, "epoch": 2513} {"train_loss": -12.352272033691406, "global_step": 422302, "epoch": 2513} {"train_loss": -12.584574699401855, "global_step": 422303, "epoch": 2513} {"train_loss": -12.206022262573242, "global_step": 422304, "epoch": 2513} {"train_loss": -12.256706237792969, "global_step": 422305, "epoch": 2513} {"train_loss": -12.11566162109375, "global_step": 422306, "epoch": 2513} {"train_loss": -12.351357460021973, "global_step": 422307, "epoch": 2513} {"train_loss": -12.227115631103516, "global_step": 422308, "epoch": 2513} {"train_loss": -12.650787353515625, "global_step": 422309, "epoch": 2513} {"train_loss": -12.36148452758789, "global_step": 422310, "epoch": 2513} {"train_loss": -12.275446891784668, "global_step": 422311, "epoch": 2513} {"train_loss": -12.691028594970703, "global_step": 422312, "epoch": 2513} {"train_loss": -12.119392395019531, "global_step": 422313, "epoch": 2513} {"train_loss": -12.414915084838867, "global_step": 422314, "epoch": 2513} {"train_loss": -12.146726608276367, "global_step": 422315, "epoch": 2513} {"train_loss": -11.5297269821167, "global_step": 422316, "epoch": 2513} {"train_loss": -12.287471771240234, "global_step": 422317, "epoch": 2513} {"train_loss": -11.97268009185791, "global_step": 422318, "epoch": 2513} {"train_loss": -11.637935638427734, "global_step": 422319, "epoch": 2513} {"train_loss": -11.821002960205078, "global_step": 422320, "epoch": 2513} {"train_loss": -12.317096710205078, "global_step": 422321, "epoch": 2513} {"train_loss": -11.748907089233398, "global_step": 422322, "epoch": 2513} {"train_loss": -12.12908935546875, "global_step": 422323, "epoch": 2513} {"train_loss": -12.414990425109863, "global_step": 422324, "epoch": 2513} {"train_loss": -11.358877182006836, "global_step": 422325, "epoch": 2513} {"train_loss": -11.807783126831055, "global_step": 422326, "epoch": 2513} {"train_loss": -11.53246021270752, "global_step": 422327, "epoch": 2513} {"train_loss": -10.637707710266113, "global_step": 422328, "epoch": 2513} {"train_loss": -11.42491626739502, "global_step": 422329, "epoch": 2513} {"train_loss": -10.36767292022705, "global_step": 422330, "epoch": 2513} {"train_loss": -9.733686447143555, "global_step": 422331, "epoch": 2513} {"train_loss": -8.02652645111084, "global_step": 422332, "epoch": 2513} {"train_loss": -8.622236251831055, "global_step": 422333, "epoch": 2513} {"train_loss": -8.208751678466797, "global_step": 422334, "epoch": 2513} {"train_loss": -8.369232177734375, "global_step": 422335, "epoch": 2513} {"train_loss": -8.566527366638184, "global_step": 422336, "epoch": 2513} {"train_loss": -8.897665023803711, "global_step": 422337, "epoch": 2513} {"train_loss": -8.582670211791992, "global_step": 422338, "epoch": 2513} {"train_loss": -8.77100944519043, "global_step": 422339, "epoch": 2513} {"train_loss": -9.168426513671875, "global_step": 422340, "epoch": 2513} {"train_loss": -8.775909423828125, "global_step": 422341, "epoch": 2513} {"train_loss": -9.065147399902344, "global_step": 422342, "epoch": 2513} {"train_loss": -9.541709899902344, "global_step": 422343, "epoch": 2513} {"train_loss": -9.304974555969238, "global_step": 422344, "epoch": 2513} {"train_loss": -9.551368713378906, "global_step": 422345, "epoch": 2513} {"train_loss": -10.25086784362793, "global_step": 422346, "epoch": 2513} {"train_loss": -10.085869789123535, "global_step": 422347, "epoch": 2513} {"train_loss": -10.567848205566406, "global_step": 422348, "epoch": 2513} {"train_loss": -10.755880355834961, "global_step": 422349, "epoch": 2513} {"train_loss": -10.985383987426758, "global_step": 422350, "epoch": 2513} {"train_loss": -11.856483141581217, "global_step": 422351, "epoch": 2513, "val_loss": 303069.53125} {"train_loss": -11.366371154785156, "global_step": 422352, "epoch": 2514} {"train_loss": -10.618050575256348, "global_step": 422353, "epoch": 2514} {"train_loss": -11.492673873901367, "global_step": 422354, "epoch": 2514} {"train_loss": -11.49531364440918, "global_step": 422355, "epoch": 2514} {"train_loss": -11.442309379577637, "global_step": 422356, "epoch": 2514} {"train_loss": -11.670759201049805, "global_step": 422357, "epoch": 2514} {"train_loss": -10.586922645568848, "global_step": 422358, "epoch": 2514} {"train_loss": -11.551410675048828, "global_step": 422359, "epoch": 2514} {"train_loss": -11.968992233276367, "global_step": 422360, "epoch": 2514} {"train_loss": -11.809501647949219, "global_step": 422361, "epoch": 2514} {"train_loss": -11.744109153747559, "global_step": 422362, "epoch": 2514} {"train_loss": -11.978076934814453, "global_step": 422363, "epoch": 2514} {"train_loss": -12.188014030456543, "global_step": 422364, "epoch": 2514} {"train_loss": -11.980207443237305, "global_step": 422365, "epoch": 2514} {"train_loss": -12.169927597045898, "global_step": 422366, "epoch": 2514} {"train_loss": -12.137563705444336, "global_step": 422367, "epoch": 2514} {"train_loss": -12.31097412109375, "global_step": 422368, "epoch": 2514} {"train_loss": -11.848379135131836, "global_step": 422369, "epoch": 2514} {"train_loss": -12.060771942138672, "global_step": 422370, "epoch": 2514} {"train_loss": -11.927648544311523, "global_step": 422371, "epoch": 2514} {"train_loss": -11.800902366638184, "global_step": 422372, "epoch": 2514} {"train_loss": -12.148051261901855, "global_step": 422373, "epoch": 2514} {"train_loss": -11.993936538696289, "global_step": 422374, "epoch": 2514} {"train_loss": -11.992034912109375, "global_step": 422375, "epoch": 2514} {"train_loss": -12.013138771057129, "global_step": 422376, "epoch": 2514} {"train_loss": -12.057441711425781, "global_step": 422377, "epoch": 2514} {"train_loss": -12.222408294677734, "global_step": 422378, "epoch": 2514} {"train_loss": -12.223846435546875, "global_step": 422379, "epoch": 2514} {"train_loss": -11.658668518066406, "global_step": 422380, "epoch": 2514} {"train_loss": -12.308143615722656, "global_step": 422381, "epoch": 2514} {"train_loss": -12.385683059692383, "global_step": 422382, "epoch": 2514} {"train_loss": -12.096705436706543, "global_step": 422383, "epoch": 2514} {"train_loss": -12.42884635925293, "global_step": 422384, "epoch": 2514} {"train_loss": -12.295328140258789, "global_step": 422385, "epoch": 2514} {"train_loss": -11.883861541748047, "global_step": 422386, "epoch": 2514} {"train_loss": -12.073338508605957, "global_step": 422387, "epoch": 2514} {"train_loss": -12.00301456451416, "global_step": 422388, "epoch": 2514} {"train_loss": -12.125025749206543, "global_step": 422389, "epoch": 2514} {"train_loss": -12.123417854309082, "global_step": 422390, "epoch": 2514} {"train_loss": -11.930793762207031, "global_step": 422391, "epoch": 2514} {"train_loss": -12.246698379516602, "global_step": 422392, "epoch": 2514} {"train_loss": -12.295257568359375, "global_step": 422393, "epoch": 2514} {"train_loss": -12.35055160522461, "global_step": 422394, "epoch": 2514} {"train_loss": -12.399272918701172, "global_step": 422395, "epoch": 2514} {"train_loss": -12.451866149902344, "global_step": 422396, "epoch": 2514} {"train_loss": -12.560181617736816, "global_step": 422397, "epoch": 2514} {"train_loss": -12.153583526611328, "global_step": 422398, "epoch": 2514} {"train_loss": -12.699812889099121, "global_step": 422399, "epoch": 2514} {"train_loss": -12.184186935424805, "global_step": 422400, "epoch": 2514} {"train_loss": -12.2333402633667, "global_step": 422401, "epoch": 2514} {"train_loss": -12.100353240966797, "global_step": 422402, "epoch": 2514} {"train_loss": -11.917692184448242, "global_step": 422403, "epoch": 2514} {"train_loss": -12.209976196289062, "global_step": 422404, "epoch": 2514} {"train_loss": -12.311883926391602, "global_step": 422405, "epoch": 2514} {"train_loss": -12.232303619384766, "global_step": 422406, "epoch": 2514} {"train_loss": -11.673341751098633, "global_step": 422407, "epoch": 2514} {"train_loss": -12.389962196350098, "global_step": 422408, "epoch": 2514} {"train_loss": -11.543754577636719, "global_step": 422409, "epoch": 2514} {"train_loss": -12.360404968261719, "global_step": 422410, "epoch": 2514} {"train_loss": -11.321882247924805, "global_step": 422411, "epoch": 2514} {"train_loss": -12.117501258850098, "global_step": 422412, "epoch": 2514} {"train_loss": -11.205137252807617, "global_step": 422413, "epoch": 2514} {"train_loss": -12.016130447387695, "global_step": 422414, "epoch": 2514} {"train_loss": -11.319574356079102, "global_step": 422415, "epoch": 2514} {"train_loss": -12.225362777709961, "global_step": 422416, "epoch": 2514} {"train_loss": -11.414426803588867, "global_step": 422417, "epoch": 2514} {"train_loss": -11.863903045654297, "global_step": 422418, "epoch": 2514} {"train_loss": -11.477267265319824, "global_step": 422419, "epoch": 2514} {"train_loss": -11.767353057861328, "global_step": 422420, "epoch": 2514} {"train_loss": -10.977944374084473, "global_step": 422421, "epoch": 2514} {"train_loss": -11.506412506103516, "global_step": 422422, "epoch": 2514} {"train_loss": -12.311483383178711, "global_step": 422423, "epoch": 2514} {"train_loss": -10.72160816192627, "global_step": 422424, "epoch": 2514} {"train_loss": -12.480358123779297, "global_step": 422425, "epoch": 2514} {"train_loss": -10.375455856323242, "global_step": 422426, "epoch": 2514} {"train_loss": -12.196859359741211, "global_step": 422427, "epoch": 2514} {"train_loss": -12.006378173828125, "global_step": 422428, "epoch": 2514} {"train_loss": -11.493205070495605, "global_step": 422429, "epoch": 2514} {"train_loss": -11.915752410888672, "global_step": 422430, "epoch": 2514} {"train_loss": -11.431201934814453, "global_step": 422431, "epoch": 2514} {"train_loss": -11.555095672607422, "global_step": 422432, "epoch": 2514} {"train_loss": -12.447286605834961, "global_step": 422433, "epoch": 2514} {"train_loss": -11.729743957519531, "global_step": 422434, "epoch": 2514} {"train_loss": -12.187390327453613, "global_step": 422435, "epoch": 2514} {"train_loss": -12.285953521728516, "global_step": 422436, "epoch": 2514} {"train_loss": -12.150196075439453, "global_step": 422437, "epoch": 2514} {"train_loss": -12.319514274597168, "global_step": 422438, "epoch": 2514} {"train_loss": -12.19978141784668, "global_step": 422439, "epoch": 2514} {"train_loss": -12.091503143310547, "global_step": 422440, "epoch": 2514} {"train_loss": -12.248285293579102, "global_step": 422441, "epoch": 2514} {"train_loss": -12.127323150634766, "global_step": 422442, "epoch": 2514} {"train_loss": -12.21629524230957, "global_step": 422443, "epoch": 2514} {"train_loss": -12.053749084472656, "global_step": 422444, "epoch": 2514} {"train_loss": -11.974940299987793, "global_step": 422445, "epoch": 2514} {"train_loss": -12.084257125854492, "global_step": 422446, "epoch": 2514} {"train_loss": -12.272550582885742, "global_step": 422447, "epoch": 2514} {"train_loss": -12.126232147216797, "global_step": 422448, "epoch": 2514} {"train_loss": -12.07177734375, "global_step": 422449, "epoch": 2514} {"train_loss": -12.420883178710938, "global_step": 422450, "epoch": 2514} {"train_loss": -12.065237045288086, "global_step": 422451, "epoch": 2514} {"train_loss": -12.335976600646973, "global_step": 422452, "epoch": 2514} {"train_loss": -12.419950485229492, "global_step": 422453, "epoch": 2514} {"train_loss": -12.238618850708008, "global_step": 422454, "epoch": 2514} {"train_loss": -12.471948623657227, "global_step": 422455, "epoch": 2514} {"train_loss": -12.272928237915039, "global_step": 422456, "epoch": 2514} {"train_loss": -12.2485933303833, "global_step": 422457, "epoch": 2514} {"train_loss": -12.269153594970703, "global_step": 422458, "epoch": 2514} {"train_loss": -11.990530014038086, "global_step": 422459, "epoch": 2514} {"train_loss": -12.428595542907715, "global_step": 422460, "epoch": 2514} {"train_loss": -12.35349178314209, "global_step": 422461, "epoch": 2514} {"train_loss": -12.338706970214844, "global_step": 422462, "epoch": 2514} {"train_loss": -12.50358772277832, "global_step": 422463, "epoch": 2514} {"train_loss": -12.451092720031738, "global_step": 422464, "epoch": 2514} {"train_loss": -12.510257720947266, "global_step": 422465, "epoch": 2514} {"train_loss": -12.679264068603516, "global_step": 422466, "epoch": 2514} {"train_loss": -12.527957916259766, "global_step": 422467, "epoch": 2514} {"train_loss": -12.46711540222168, "global_step": 422468, "epoch": 2514} {"train_loss": -12.653739929199219, "global_step": 422469, "epoch": 2514} {"train_loss": -12.166927337646484, "global_step": 422470, "epoch": 2514} {"train_loss": -12.554566383361816, "global_step": 422471, "epoch": 2514} {"train_loss": -12.436832427978516, "global_step": 422472, "epoch": 2514} {"train_loss": -11.926600456237793, "global_step": 422473, "epoch": 2514} {"train_loss": -12.545915603637695, "global_step": 422474, "epoch": 2514} {"train_loss": -12.101245880126953, "global_step": 422475, "epoch": 2514} {"train_loss": -12.523460388183594, "global_step": 422476, "epoch": 2514} {"train_loss": -12.16754150390625, "global_step": 422477, "epoch": 2514} {"train_loss": -11.830774307250977, "global_step": 422478, "epoch": 2514} {"train_loss": -12.148941993713379, "global_step": 422479, "epoch": 2514} {"train_loss": -12.654901504516602, "global_step": 422480, "epoch": 2514} {"train_loss": -12.470024108886719, "global_step": 422481, "epoch": 2514} {"train_loss": -12.638052940368652, "global_step": 422482, "epoch": 2514} {"train_loss": -12.603759765625, "global_step": 422483, "epoch": 2514} {"train_loss": -12.477659225463867, "global_step": 422484, "epoch": 2514} {"train_loss": -12.556646347045898, "global_step": 422485, "epoch": 2514} {"train_loss": -12.194899559020996, "global_step": 422486, "epoch": 2514} {"train_loss": -12.34514331817627, "global_step": 422487, "epoch": 2514} {"train_loss": -12.62824821472168, "global_step": 422488, "epoch": 2514} {"train_loss": -12.14061164855957, "global_step": 422489, "epoch": 2514} {"train_loss": -12.403515815734863, "global_step": 422490, "epoch": 2514} {"train_loss": -12.701992988586426, "global_step": 422491, "epoch": 2514} {"train_loss": -12.411907196044922, "global_step": 422492, "epoch": 2514} {"train_loss": -12.53788948059082, "global_step": 422493, "epoch": 2514} {"train_loss": -12.646589279174805, "global_step": 422494, "epoch": 2514} {"train_loss": -12.447978973388672, "global_step": 422495, "epoch": 2514} {"train_loss": -12.001127243041992, "global_step": 422496, "epoch": 2514} {"train_loss": -12.765077590942383, "global_step": 422497, "epoch": 2514} {"train_loss": -12.394441604614258, "global_step": 422498, "epoch": 2514} {"train_loss": -12.500556945800781, "global_step": 422499, "epoch": 2514} {"train_loss": -12.396329879760742, "global_step": 422500, "epoch": 2514} {"train_loss": -11.947738647460938, "global_step": 422501, "epoch": 2514} {"train_loss": -11.746780395507812, "global_step": 422502, "epoch": 2514} {"train_loss": -12.549072265625, "global_step": 422503, "epoch": 2514} {"train_loss": -11.841492652893066, "global_step": 422504, "epoch": 2514} {"train_loss": -11.964771270751953, "global_step": 422505, "epoch": 2514} {"train_loss": -12.690679550170898, "global_step": 422506, "epoch": 2514} {"train_loss": -12.341984748840332, "global_step": 422507, "epoch": 2514} {"train_loss": -12.359042167663574, "global_step": 422508, "epoch": 2514} {"train_loss": -12.849742889404297, "global_step": 422509, "epoch": 2514} {"train_loss": -12.52987289428711, "global_step": 422510, "epoch": 2514} {"train_loss": -12.576192855834961, "global_step": 422511, "epoch": 2514} {"train_loss": -12.514104843139648, "global_step": 422512, "epoch": 2514} {"train_loss": -12.33273983001709, "global_step": 422513, "epoch": 2514} {"train_loss": -12.302369117736816, "global_step": 422514, "epoch": 2514} {"train_loss": -11.98875904083252, "global_step": 422515, "epoch": 2514} {"train_loss": -12.526082992553711, "global_step": 422516, "epoch": 2514} {"train_loss": -12.248151779174805, "global_step": 422517, "epoch": 2514} {"train_loss": -12.001097679138184, "global_step": 422518, "epoch": 2514} {"train_loss": -12.121262045133681, "global_step": 422519, "epoch": 2514, "val_loss": 305623.34375} {"train_loss": -11.423401832580566, "global_step": 422520, "epoch": 2515} {"train_loss": -12.317551612854004, "global_step": 422521, "epoch": 2515} {"train_loss": -11.561891555786133, "global_step": 422522, "epoch": 2515} {"train_loss": -12.031633377075195, "global_step": 422523, "epoch": 2515} {"train_loss": -11.463029861450195, "global_step": 422524, "epoch": 2515} {"train_loss": -12.31977653503418, "global_step": 422525, "epoch": 2515} {"train_loss": -12.311603546142578, "global_step": 422526, "epoch": 2515} {"train_loss": -12.385457992553711, "global_step": 422527, "epoch": 2515} {"train_loss": -12.444351196289062, "global_step": 422528, "epoch": 2515} {"train_loss": -11.998496055603027, "global_step": 422529, "epoch": 2515} {"train_loss": -12.052250862121582, "global_step": 422530, "epoch": 2515} {"train_loss": -12.559751510620117, "global_step": 422531, "epoch": 2515} {"train_loss": -11.541055679321289, "global_step": 422532, "epoch": 2515} {"train_loss": -12.58533763885498, "global_step": 422533, "epoch": 2515} {"train_loss": -11.729750633239746, "global_step": 422534, "epoch": 2515} {"train_loss": -12.319390296936035, "global_step": 422535, "epoch": 2515} {"train_loss": -12.072345733642578, "global_step": 422536, "epoch": 2515} {"train_loss": -12.50040054321289, "global_step": 422537, "epoch": 2515} {"train_loss": -12.293745040893555, "global_step": 422538, "epoch": 2515} {"train_loss": -12.549447059631348, "global_step": 422539, "epoch": 2515} {"train_loss": -12.147876739501953, "global_step": 422540, "epoch": 2515} {"train_loss": -12.314004898071289, "global_step": 422541, "epoch": 2515} {"train_loss": -12.137829780578613, "global_step": 422542, "epoch": 2515} {"train_loss": -11.911884307861328, "global_step": 422543, "epoch": 2515} {"train_loss": -12.393202781677246, "global_step": 422544, "epoch": 2515} {"train_loss": -12.08898639678955, "global_step": 422545, "epoch": 2515} {"train_loss": -12.137836456298828, "global_step": 422546, "epoch": 2515} {"train_loss": -12.195638656616211, "global_step": 422547, "epoch": 2515} {"train_loss": -12.383017539978027, "global_step": 422548, "epoch": 2515} {"train_loss": -11.276662826538086, "global_step": 422549, "epoch": 2515} {"train_loss": -12.528556823730469, "global_step": 422550, "epoch": 2515} {"train_loss": -11.814802169799805, "global_step": 422551, "epoch": 2515} {"train_loss": -12.774642944335938, "global_step": 422552, "epoch": 2515} {"train_loss": -12.273097038269043, "global_step": 422553, "epoch": 2515} {"train_loss": -12.297237396240234, "global_step": 422554, "epoch": 2515} {"train_loss": -12.117900848388672, "global_step": 422555, "epoch": 2515} {"train_loss": -12.696992874145508, "global_step": 422556, "epoch": 2515} {"train_loss": -12.286396026611328, "global_step": 422557, "epoch": 2515} {"train_loss": -12.282315254211426, "global_step": 422558, "epoch": 2515} {"train_loss": -12.612306594848633, "global_step": 422559, "epoch": 2515} {"train_loss": -12.538212776184082, "global_step": 422560, "epoch": 2515} {"train_loss": -12.56947135925293, "global_step": 422561, "epoch": 2515} {"train_loss": -12.471222877502441, "global_step": 422562, "epoch": 2515} {"train_loss": -12.470235824584961, "global_step": 422563, "epoch": 2515} {"train_loss": -12.642911911010742, "global_step": 422564, "epoch": 2515} {"train_loss": -12.507033348083496, "global_step": 422565, "epoch": 2515} {"train_loss": -12.630346298217773, "global_step": 422566, "epoch": 2515} {"train_loss": -12.516744613647461, "global_step": 422567, "epoch": 2515} {"train_loss": -12.579050064086914, "global_step": 422568, "epoch": 2515} {"train_loss": -12.300941467285156, "global_step": 422569, "epoch": 2515} {"train_loss": -12.305521011352539, "global_step": 422570, "epoch": 2515} {"train_loss": -12.375306129455566, "global_step": 422571, "epoch": 2515} {"train_loss": -12.809813499450684, "global_step": 422572, "epoch": 2515} {"train_loss": -12.367081642150879, "global_step": 422573, "epoch": 2515} {"train_loss": -12.570028305053711, "global_step": 422574, "epoch": 2515} {"train_loss": -12.562189102172852, "global_step": 422575, "epoch": 2515} {"train_loss": -12.847699165344238, "global_step": 422576, "epoch": 2515} {"train_loss": -12.577508926391602, "global_step": 422577, "epoch": 2515} {"train_loss": -12.435626983642578, "global_step": 422578, "epoch": 2515} {"train_loss": -12.542847633361816, "global_step": 422579, "epoch": 2515} {"train_loss": -12.56236457824707, "global_step": 422580, "epoch": 2515} {"train_loss": -11.934289932250977, "global_step": 422581, "epoch": 2515} {"train_loss": -12.242441177368164, "global_step": 422582, "epoch": 2515} {"train_loss": -12.628366470336914, "global_step": 422583, "epoch": 2515} {"train_loss": -12.435625076293945, "global_step": 422584, "epoch": 2515} {"train_loss": -12.182188034057617, "global_step": 422585, "epoch": 2515} {"train_loss": -12.87759780883789, "global_step": 422586, "epoch": 2515} {"train_loss": -12.115240097045898, "global_step": 422587, "epoch": 2515} {"train_loss": -12.298420906066895, "global_step": 422588, "epoch": 2515} {"train_loss": -12.007577896118164, "global_step": 422589, "epoch": 2515} {"train_loss": -12.785809516906738, "global_step": 422590, "epoch": 2515} {"train_loss": -12.556976318359375, "global_step": 422591, "epoch": 2515} {"train_loss": -11.880365371704102, "global_step": 422592, "epoch": 2515} {"train_loss": -11.737449645996094, "global_step": 422593, "epoch": 2515} {"train_loss": -12.66847038269043, "global_step": 422594, "epoch": 2515} {"train_loss": -11.884490966796875, "global_step": 422595, "epoch": 2515} {"train_loss": -12.377185821533203, "global_step": 422596, "epoch": 2515} {"train_loss": -12.438825607299805, "global_step": 422597, "epoch": 2515} {"train_loss": -12.414787292480469, "global_step": 422598, "epoch": 2515} {"train_loss": -12.020818710327148, "global_step": 422599, "epoch": 2515} {"train_loss": -12.524393081665039, "global_step": 422600, "epoch": 2515} {"train_loss": -12.392997741699219, "global_step": 422601, "epoch": 2515} {"train_loss": -11.872512817382812, "global_step": 422602, "epoch": 2515} {"train_loss": -12.19808578491211, "global_step": 422603, "epoch": 2515} {"train_loss": -12.479074478149414, "global_step": 422604, "epoch": 2515} {"train_loss": -12.341592788696289, "global_step": 422605, "epoch": 2515} {"train_loss": -12.293289184570312, "global_step": 422606, "epoch": 2515} {"train_loss": -12.573980331420898, "global_step": 422607, "epoch": 2515} {"train_loss": -12.607622146606445, "global_step": 422608, "epoch": 2515} {"train_loss": -12.591395378112793, "global_step": 422609, "epoch": 2515} {"train_loss": -12.342327117919922, "global_step": 422610, "epoch": 2515} {"train_loss": -12.520796775817871, "global_step": 422611, "epoch": 2515} {"train_loss": -12.29831314086914, "global_step": 422612, "epoch": 2515} {"train_loss": -11.811226844787598, "global_step": 422613, "epoch": 2515} {"train_loss": -12.410573959350586, "global_step": 422614, "epoch": 2515} {"train_loss": -12.69212532043457, "global_step": 422615, "epoch": 2515} {"train_loss": -12.644052505493164, "global_step": 422616, "epoch": 2515} {"train_loss": -12.601846694946289, "global_step": 422617, "epoch": 2515} {"train_loss": -12.606672286987305, "global_step": 422618, "epoch": 2515} {"train_loss": -12.454968452453613, "global_step": 422619, "epoch": 2515} {"train_loss": -12.371862411499023, "global_step": 422620, "epoch": 2515} {"train_loss": -12.249091148376465, "global_step": 422621, "epoch": 2515} {"train_loss": -12.544787406921387, "global_step": 422622, "epoch": 2515} {"train_loss": -12.541206359863281, "global_step": 422623, "epoch": 2515} {"train_loss": -12.372369766235352, "global_step": 422624, "epoch": 2515} {"train_loss": -12.646477699279785, "global_step": 422625, "epoch": 2515} {"train_loss": -12.341967582702637, "global_step": 422626, "epoch": 2515} {"train_loss": -12.395124435424805, "global_step": 422627, "epoch": 2515} {"train_loss": -12.38886833190918, "global_step": 422628, "epoch": 2515} {"train_loss": -12.44786262512207, "global_step": 422629, "epoch": 2515} {"train_loss": -11.558032989501953, "global_step": 422630, "epoch": 2515} {"train_loss": -11.920902252197266, "global_step": 422631, "epoch": 2515} {"train_loss": -11.990257263183594, "global_step": 422632, "epoch": 2515} {"train_loss": -11.320809364318848, "global_step": 422633, "epoch": 2515} {"train_loss": -10.923501968383789, "global_step": 422634, "epoch": 2515} {"train_loss": -12.268584251403809, "global_step": 422635, "epoch": 2515} {"train_loss": -9.054405212402344, "global_step": 422636, "epoch": 2515} {"train_loss": -10.158315658569336, "global_step": 422637, "epoch": 2515} {"train_loss": -9.160258293151855, "global_step": 422638, "epoch": 2515} {"train_loss": -11.39886474609375, "global_step": 422639, "epoch": 2515} {"train_loss": -9.332086563110352, "global_step": 422640, "epoch": 2515} {"train_loss": -10.671188354492188, "global_step": 422641, "epoch": 2515} {"train_loss": -10.262721061706543, "global_step": 422642, "epoch": 2515} {"train_loss": -8.608500480651855, "global_step": 422643, "epoch": 2515} {"train_loss": -8.056371688842773, "global_step": 422644, "epoch": 2515} {"train_loss": -9.577899932861328, "global_step": 422645, "epoch": 2515} {"train_loss": -10.779571533203125, "global_step": 422646, "epoch": 2515} {"train_loss": -9.966461181640625, "global_step": 422647, "epoch": 2515} {"train_loss": -8.961544036865234, "global_step": 422648, "epoch": 2515} {"train_loss": -9.451761245727539, "global_step": 422649, "epoch": 2515} {"train_loss": -11.071877479553223, "global_step": 422650, "epoch": 2515} {"train_loss": -10.330886840820312, "global_step": 422651, "epoch": 2515} {"train_loss": -10.558069229125977, "global_step": 422652, "epoch": 2515} {"train_loss": -11.174272537231445, "global_step": 422653, "epoch": 2515} {"train_loss": -11.722923278808594, "global_step": 422654, "epoch": 2515} {"train_loss": -10.863662719726562, "global_step": 422655, "epoch": 2515} {"train_loss": -11.234428405761719, "global_step": 422656, "epoch": 2515} {"train_loss": -10.846033096313477, "global_step": 422657, "epoch": 2515} {"train_loss": -11.554055213928223, "global_step": 422658, "epoch": 2515} {"train_loss": -11.65629768371582, "global_step": 422659, "epoch": 2515} {"train_loss": -11.724143981933594, "global_step": 422660, "epoch": 2515} {"train_loss": -11.876789093017578, "global_step": 422661, "epoch": 2515} {"train_loss": -11.350201606750488, "global_step": 422662, "epoch": 2515} {"train_loss": -11.64412784576416, "global_step": 422663, "epoch": 2515} {"train_loss": -11.415081024169922, "global_step": 422664, "epoch": 2515} {"train_loss": -11.15296459197998, "global_step": 422665, "epoch": 2515} {"train_loss": -11.886835098266602, "global_step": 422666, "epoch": 2515} {"train_loss": -11.119439125061035, "global_step": 422667, "epoch": 2515} {"train_loss": -12.093839645385742, "global_step": 422668, "epoch": 2515} {"train_loss": -11.029716491699219, "global_step": 422669, "epoch": 2515} {"train_loss": -12.279443740844727, "global_step": 422670, "epoch": 2515} {"train_loss": -11.352957725524902, "global_step": 422671, "epoch": 2515} {"train_loss": -11.579126358032227, "global_step": 422672, "epoch": 2515} {"train_loss": -11.472383499145508, "global_step": 422673, "epoch": 2515} {"train_loss": -11.291742324829102, "global_step": 422674, "epoch": 2515} {"train_loss": -12.044929504394531, "global_step": 422675, "epoch": 2515} {"train_loss": -11.251049041748047, "global_step": 422676, "epoch": 2515} {"train_loss": -12.362510681152344, "global_step": 422677, "epoch": 2515} {"train_loss": -11.358909606933594, "global_step": 422678, "epoch": 2515} {"train_loss": -11.108480453491211, "global_step": 422679, "epoch": 2515} {"train_loss": -11.983251571655273, "global_step": 422680, "epoch": 2515} {"train_loss": -11.456242561340332, "global_step": 422681, "epoch": 2515} {"train_loss": -11.752969741821289, "global_step": 422682, "epoch": 2515} {"train_loss": -11.68356704711914, "global_step": 422683, "epoch": 2515} {"train_loss": -11.822750091552734, "global_step": 422684, "epoch": 2515} {"train_loss": -12.150367736816406, "global_step": 422685, "epoch": 2515} {"train_loss": -11.675046920776367, "global_step": 422686, "epoch": 2515} {"train_loss": -11.895908230826969, "global_step": 422687, "epoch": 2515, "val_loss": 306158.625, "train_action_mse_error": 0.7094807624816895} {"train_loss": -12.065200805664062, "global_step": 422688, "epoch": 2516} {"train_loss": -11.654024124145508, "global_step": 422689, "epoch": 2516} {"train_loss": -12.347799301147461, "global_step": 422690, "epoch": 2516} {"train_loss": -12.310995101928711, "global_step": 422691, "epoch": 2516} {"train_loss": -11.913811683654785, "global_step": 422692, "epoch": 2516} {"train_loss": -12.105347633361816, "global_step": 422693, "epoch": 2516} {"train_loss": -12.400192260742188, "global_step": 422694, "epoch": 2516} {"train_loss": -12.143575668334961, "global_step": 422695, "epoch": 2516} {"train_loss": -12.250831604003906, "global_step": 422696, "epoch": 2516} {"train_loss": -12.218271255493164, "global_step": 422697, "epoch": 2516} {"train_loss": -12.154611587524414, "global_step": 422698, "epoch": 2516} {"train_loss": -12.146531105041504, "global_step": 422699, "epoch": 2516} {"train_loss": -12.24267578125, "global_step": 422700, "epoch": 2516} {"train_loss": -12.398289680480957, "global_step": 422701, "epoch": 2516} {"train_loss": -12.496896743774414, "global_step": 422702, "epoch": 2516} {"train_loss": -12.281110763549805, "global_step": 422703, "epoch": 2516} {"train_loss": -12.37270450592041, "global_step": 422704, "epoch": 2516} {"train_loss": -12.475852966308594, "global_step": 422705, "epoch": 2516} {"train_loss": -12.399654388427734, "global_step": 422706, "epoch": 2516} {"train_loss": -12.491161346435547, "global_step": 422707, "epoch": 2516} {"train_loss": -12.378255844116211, "global_step": 422708, "epoch": 2516} {"train_loss": -12.282081604003906, "global_step": 422709, "epoch": 2516} {"train_loss": -12.577248573303223, "global_step": 422710, "epoch": 2516} {"train_loss": -12.387516975402832, "global_step": 422711, "epoch": 2516} {"train_loss": -12.52305793762207, "global_step": 422712, "epoch": 2516} {"train_loss": -12.383426666259766, "global_step": 422713, "epoch": 2516} {"train_loss": -12.606769561767578, "global_step": 422714, "epoch": 2516} {"train_loss": -12.723377227783203, "global_step": 422715, "epoch": 2516} {"train_loss": -12.543912887573242, "global_step": 422716, "epoch": 2516} {"train_loss": -12.531196594238281, "global_step": 422717, "epoch": 2516} {"train_loss": -12.245227813720703, "global_step": 422718, "epoch": 2516} {"train_loss": -12.54066276550293, "global_step": 422719, "epoch": 2516} {"train_loss": -12.401566505432129, "global_step": 422720, "epoch": 2516} {"train_loss": -12.54270076751709, "global_step": 422721, "epoch": 2516} {"train_loss": -12.522933959960938, "global_step": 422722, "epoch": 2516} {"train_loss": -12.495128631591797, "global_step": 422723, "epoch": 2516} {"train_loss": -12.767091751098633, "global_step": 422724, "epoch": 2516} {"train_loss": -12.441400527954102, "global_step": 422725, "epoch": 2516} {"train_loss": -12.66121768951416, "global_step": 422726, "epoch": 2516} {"train_loss": -12.292916297912598, "global_step": 422727, "epoch": 2516} {"train_loss": -12.576812744140625, "global_step": 422728, "epoch": 2516} {"train_loss": -12.55937385559082, "global_step": 422729, "epoch": 2516} {"train_loss": -12.431184768676758, "global_step": 422730, "epoch": 2516} {"train_loss": -12.534117698669434, "global_step": 422731, "epoch": 2516} {"train_loss": -12.389029502868652, "global_step": 422732, "epoch": 2516} {"train_loss": -12.634391784667969, "global_step": 422733, "epoch": 2516} {"train_loss": -12.066023826599121, "global_step": 422734, "epoch": 2516} {"train_loss": -12.625001907348633, "global_step": 422735, "epoch": 2516} {"train_loss": -12.481077194213867, "global_step": 422736, "epoch": 2516} {"train_loss": -12.580443382263184, "global_step": 422737, "epoch": 2516} {"train_loss": -12.468536376953125, "global_step": 422738, "epoch": 2516} {"train_loss": -12.77536678314209, "global_step": 422739, "epoch": 2516} {"train_loss": -12.645892143249512, "global_step": 422740, "epoch": 2516} {"train_loss": -12.901992797851562, "global_step": 422741, "epoch": 2516} {"train_loss": -12.64944076538086, "global_step": 422742, "epoch": 2516} {"train_loss": -12.339500427246094, "global_step": 422743, "epoch": 2516} {"train_loss": -12.598151206970215, "global_step": 422744, "epoch": 2516} {"train_loss": -12.664993286132812, "global_step": 422745, "epoch": 2516} {"train_loss": -12.841536521911621, "global_step": 422746, "epoch": 2516} {"train_loss": -12.617866516113281, "global_step": 422747, "epoch": 2516} {"train_loss": -12.62260913848877, "global_step": 422748, "epoch": 2516} {"train_loss": -12.619077682495117, "global_step": 422749, "epoch": 2516} {"train_loss": -12.915656089782715, "global_step": 422750, "epoch": 2516} {"train_loss": -12.774051666259766, "global_step": 422751, "epoch": 2516} {"train_loss": -12.67213249206543, "global_step": 422752, "epoch": 2516} {"train_loss": -12.600083351135254, "global_step": 422753, "epoch": 2516} {"train_loss": -12.5797119140625, "global_step": 422754, "epoch": 2516} {"train_loss": -12.747089385986328, "global_step": 422755, "epoch": 2516} {"train_loss": -12.635053634643555, "global_step": 422756, "epoch": 2516} {"train_loss": -12.930312156677246, "global_step": 422757, "epoch": 2516} {"train_loss": -12.721317291259766, "global_step": 422758, "epoch": 2516} {"train_loss": -12.86876106262207, "global_step": 422759, "epoch": 2516} {"train_loss": -12.348875999450684, "global_step": 422760, "epoch": 2516} {"train_loss": -12.690694808959961, "global_step": 422761, "epoch": 2516} {"train_loss": -12.42080307006836, "global_step": 422762, "epoch": 2516} {"train_loss": -12.30079174041748, "global_step": 422763, "epoch": 2516} {"train_loss": -12.54596996307373, "global_step": 422764, "epoch": 2516} {"train_loss": -12.361072540283203, "global_step": 422765, "epoch": 2516} {"train_loss": -12.589046478271484, "global_step": 422766, "epoch": 2516} {"train_loss": -12.543685913085938, "global_step": 422767, "epoch": 2516} {"train_loss": -12.789169311523438, "global_step": 422768, "epoch": 2516} {"train_loss": -12.359156608581543, "global_step": 422769, "epoch": 2516} {"train_loss": -12.896553039550781, "global_step": 422770, "epoch": 2516} {"train_loss": -12.648191452026367, "global_step": 422771, "epoch": 2516} {"train_loss": -12.709388732910156, "global_step": 422772, "epoch": 2516} {"train_loss": -12.746302604675293, "global_step": 422773, "epoch": 2516} {"train_loss": -12.01052474975586, "global_step": 422774, "epoch": 2516} {"train_loss": -11.751916885375977, "global_step": 422775, "epoch": 2516} {"train_loss": -10.897029876708984, "global_step": 422776, "epoch": 2516} {"train_loss": -12.555052757263184, "global_step": 422777, "epoch": 2516} {"train_loss": -11.908928871154785, "global_step": 422778, "epoch": 2516} {"train_loss": -11.844825744628906, "global_step": 422779, "epoch": 2516} {"train_loss": -12.342764854431152, "global_step": 422780, "epoch": 2516} {"train_loss": -11.744305610656738, "global_step": 422781, "epoch": 2516} {"train_loss": -11.985313415527344, "global_step": 422782, "epoch": 2516} {"train_loss": -10.888567924499512, "global_step": 422783, "epoch": 2516} {"train_loss": -12.650413513183594, "global_step": 422784, "epoch": 2516} {"train_loss": -11.486227035522461, "global_step": 422785, "epoch": 2516} {"train_loss": -10.838866233825684, "global_step": 422786, "epoch": 2516} {"train_loss": -10.66380500793457, "global_step": 422787, "epoch": 2516} {"train_loss": -10.130043029785156, "global_step": 422788, "epoch": 2516} {"train_loss": -8.897960662841797, "global_step": 422789, "epoch": 2516} {"train_loss": -11.026324272155762, "global_step": 422790, "epoch": 2516} {"train_loss": -9.58202075958252, "global_step": 422791, "epoch": 2516} {"train_loss": -11.753538131713867, "global_step": 422792, "epoch": 2516} {"train_loss": -10.88612174987793, "global_step": 422793, "epoch": 2516} {"train_loss": -10.7241849899292, "global_step": 422794, "epoch": 2516} {"train_loss": -11.884298324584961, "global_step": 422795, "epoch": 2516} {"train_loss": -9.515922546386719, "global_step": 422796, "epoch": 2516} {"train_loss": -11.83730697631836, "global_step": 422797, "epoch": 2516} {"train_loss": -9.537965774536133, "global_step": 422798, "epoch": 2516} {"train_loss": -11.791182518005371, "global_step": 422799, "epoch": 2516} {"train_loss": -10.26393985748291, "global_step": 422800, "epoch": 2516} {"train_loss": -10.91273021697998, "global_step": 422801, "epoch": 2516} {"train_loss": -10.851829528808594, "global_step": 422802, "epoch": 2516} {"train_loss": -10.592601776123047, "global_step": 422803, "epoch": 2516} {"train_loss": -9.329208374023438, "global_step": 422804, "epoch": 2516} {"train_loss": -10.84434986114502, "global_step": 422805, "epoch": 2516} {"train_loss": -10.42928695678711, "global_step": 422806, "epoch": 2516} {"train_loss": -9.495523452758789, "global_step": 422807, "epoch": 2516} {"train_loss": -9.853777885437012, "global_step": 422808, "epoch": 2516} {"train_loss": -11.192890167236328, "global_step": 422809, "epoch": 2516} {"train_loss": -11.146303176879883, "global_step": 422810, "epoch": 2516} {"train_loss": -11.3408784866333, "global_step": 422811, "epoch": 2516} {"train_loss": -11.452281951904297, "global_step": 422812, "epoch": 2516} {"train_loss": -11.08223819732666, "global_step": 422813, "epoch": 2516} {"train_loss": -11.943479537963867, "global_step": 422814, "epoch": 2516} {"train_loss": -11.317497253417969, "global_step": 422815, "epoch": 2516} {"train_loss": -11.833256721496582, "global_step": 422816, "epoch": 2516} {"train_loss": -11.140192985534668, "global_step": 422817, "epoch": 2516} {"train_loss": -11.298080444335938, "global_step": 422818, "epoch": 2516} {"train_loss": -11.044227600097656, "global_step": 422819, "epoch": 2516} {"train_loss": -12.092848777770996, "global_step": 422820, "epoch": 2516} {"train_loss": -11.077341079711914, "global_step": 422821, "epoch": 2516} {"train_loss": -11.26430892944336, "global_step": 422822, "epoch": 2516} {"train_loss": -11.306844711303711, "global_step": 422823, "epoch": 2516} {"train_loss": -11.663023948669434, "global_step": 422824, "epoch": 2516} {"train_loss": -11.665407180786133, "global_step": 422825, "epoch": 2516} {"train_loss": -11.173877716064453, "global_step": 422826, "epoch": 2516} {"train_loss": -11.505916595458984, "global_step": 422827, "epoch": 2516} {"train_loss": -11.274749755859375, "global_step": 422828, "epoch": 2516} {"train_loss": -11.431808471679688, "global_step": 422829, "epoch": 2516} {"train_loss": -11.411331176757812, "global_step": 422830, "epoch": 2516} {"train_loss": -10.986757278442383, "global_step": 422831, "epoch": 2516} {"train_loss": -11.76427936553955, "global_step": 422832, "epoch": 2516} {"train_loss": -11.947059631347656, "global_step": 422833, "epoch": 2516} {"train_loss": -11.124775886535645, "global_step": 422834, "epoch": 2516} {"train_loss": -11.524747848510742, "global_step": 422835, "epoch": 2516} {"train_loss": -11.63208293914795, "global_step": 422836, "epoch": 2516} {"train_loss": -11.635229110717773, "global_step": 422837, "epoch": 2516} {"train_loss": -12.029382705688477, "global_step": 422838, "epoch": 2516} {"train_loss": -11.796951293945312, "global_step": 422839, "epoch": 2516} {"train_loss": -12.105752944946289, "global_step": 422840, "epoch": 2516} {"train_loss": -11.88254165649414, "global_step": 422841, "epoch": 2516} {"train_loss": -12.21547794342041, "global_step": 422842, "epoch": 2516} {"train_loss": -11.955856323242188, "global_step": 422843, "epoch": 2516} {"train_loss": -11.943120956420898, "global_step": 422844, "epoch": 2516} {"train_loss": -12.188629150390625, "global_step": 422845, "epoch": 2516} {"train_loss": -12.041950225830078, "global_step": 422846, "epoch": 2516} {"train_loss": -12.306900024414062, "global_step": 422847, "epoch": 2516} {"train_loss": -12.344457626342773, "global_step": 422848, "epoch": 2516} {"train_loss": -12.211597442626953, "global_step": 422849, "epoch": 2516} {"train_loss": -12.386951446533203, "global_step": 422850, "epoch": 2516} {"train_loss": -12.203529357910156, "global_step": 422851, "epoch": 2516} {"train_loss": -12.381267547607422, "global_step": 422852, "epoch": 2516} {"train_loss": -12.320608139038086, "global_step": 422853, "epoch": 2516} {"train_loss": -12.470170021057129, "global_step": 422854, "epoch": 2516} {"train_loss": -11.95783843880608, "global_step": 422855, "epoch": 2516, "val_loss": 303610.71875} {"train_loss": -12.253029823303223, "global_step": 422856, "epoch": 2517} {"train_loss": -12.231603622436523, "global_step": 422857, "epoch": 2517} {"train_loss": -12.52386474609375, "global_step": 422858, "epoch": 2517} {"train_loss": -12.346672058105469, "global_step": 422859, "epoch": 2517} {"train_loss": -12.58603286743164, "global_step": 422860, "epoch": 2517} {"train_loss": -12.38653564453125, "global_step": 422861, "epoch": 2517} {"train_loss": -12.388022422790527, "global_step": 422862, "epoch": 2517} {"train_loss": -12.581439018249512, "global_step": 422863, "epoch": 2517} {"train_loss": -12.639530181884766, "global_step": 422864, "epoch": 2517} {"train_loss": -12.645074844360352, "global_step": 422865, "epoch": 2517} {"train_loss": -12.455545425415039, "global_step": 422866, "epoch": 2517} {"train_loss": -12.457799911499023, "global_step": 422867, "epoch": 2517} {"train_loss": -12.528783798217773, "global_step": 422868, "epoch": 2517} {"train_loss": -12.632407188415527, "global_step": 422869, "epoch": 2517} {"train_loss": -12.35264778137207, "global_step": 422870, "epoch": 2517} {"train_loss": -12.651330947875977, "global_step": 422871, "epoch": 2517} {"train_loss": -12.484199523925781, "global_step": 422872, "epoch": 2517} {"train_loss": -12.55707836151123, "global_step": 422873, "epoch": 2517} {"train_loss": -12.49220085144043, "global_step": 422874, "epoch": 2517} {"train_loss": -12.733055114746094, "global_step": 422875, "epoch": 2517} {"train_loss": -12.643850326538086, "global_step": 422876, "epoch": 2517} {"train_loss": -12.73269271850586, "global_step": 422877, "epoch": 2517} {"train_loss": -12.653281211853027, "global_step": 422878, "epoch": 2517} {"train_loss": -12.8720703125, "global_step": 422879, "epoch": 2517} {"train_loss": -12.554717063903809, "global_step": 422880, "epoch": 2517} {"train_loss": -12.655326843261719, "global_step": 422881, "epoch": 2517} {"train_loss": -12.770822525024414, "global_step": 422882, "epoch": 2517} {"train_loss": -12.632463455200195, "global_step": 422883, "epoch": 2517} {"train_loss": -12.414575576782227, "global_step": 422884, "epoch": 2517} {"train_loss": -12.517810821533203, "global_step": 422885, "epoch": 2517} {"train_loss": -12.727087020874023, "global_step": 422886, "epoch": 2517} {"train_loss": -12.394876480102539, "global_step": 422887, "epoch": 2517} {"train_loss": -12.698460578918457, "global_step": 422888, "epoch": 2517} {"train_loss": -12.51705551147461, "global_step": 422889, "epoch": 2517} {"train_loss": -12.39071273803711, "global_step": 422890, "epoch": 2517} {"train_loss": -12.510819435119629, "global_step": 422891, "epoch": 2517} {"train_loss": -12.684541702270508, "global_step": 422892, "epoch": 2517} {"train_loss": -12.84804630279541, "global_step": 422893, "epoch": 2517} {"train_loss": -12.895654678344727, "global_step": 422894, "epoch": 2517} {"train_loss": -12.698901176452637, "global_step": 422895, "epoch": 2517} {"train_loss": -12.518701553344727, "global_step": 422896, "epoch": 2517} {"train_loss": -12.707029342651367, "global_step": 422897, "epoch": 2517} {"train_loss": -12.708619117736816, "global_step": 422898, "epoch": 2517} {"train_loss": -12.698211669921875, "global_step": 422899, "epoch": 2517} {"train_loss": -12.785890579223633, "global_step": 422900, "epoch": 2517} {"train_loss": -12.855134963989258, "global_step": 422901, "epoch": 2517} {"train_loss": -12.669074058532715, "global_step": 422902, "epoch": 2517} {"train_loss": -12.339487075805664, "global_step": 422903, "epoch": 2517} {"train_loss": -12.78476333618164, "global_step": 422904, "epoch": 2517} {"train_loss": -12.665024757385254, "global_step": 422905, "epoch": 2517} {"train_loss": -12.469988822937012, "global_step": 422906, "epoch": 2517} {"train_loss": -12.261669158935547, "global_step": 422907, "epoch": 2517} {"train_loss": -12.142004013061523, "global_step": 422908, "epoch": 2517} {"train_loss": -12.813729286193848, "global_step": 422909, "epoch": 2517} {"train_loss": -12.756686210632324, "global_step": 422910, "epoch": 2517} {"train_loss": -12.071391105651855, "global_step": 422911, "epoch": 2517} {"train_loss": -11.956363677978516, "global_step": 422912, "epoch": 2517} {"train_loss": -12.778509140014648, "global_step": 422913, "epoch": 2517} {"train_loss": -12.67820930480957, "global_step": 422914, "epoch": 2517} {"train_loss": -12.35926628112793, "global_step": 422915, "epoch": 2517} {"train_loss": -12.488302230834961, "global_step": 422916, "epoch": 2517} {"train_loss": -12.544692039489746, "global_step": 422917, "epoch": 2517} {"train_loss": -12.536609649658203, "global_step": 422918, "epoch": 2517} {"train_loss": -12.001432418823242, "global_step": 422919, "epoch": 2517} {"train_loss": -9.896586418151855, "global_step": 422920, "epoch": 2517} {"train_loss": -11.667638778686523, "global_step": 422921, "epoch": 2517} {"train_loss": -11.023433685302734, "global_step": 422922, "epoch": 2517} {"train_loss": -8.772180557250977, "global_step": 422923, "epoch": 2517} {"train_loss": -8.65799331665039, "global_step": 422924, "epoch": 2517} {"train_loss": -9.161338806152344, "global_step": 422925, "epoch": 2517} {"train_loss": -9.131610870361328, "global_step": 422926, "epoch": 2517} {"train_loss": -9.694478988647461, "global_step": 422927, "epoch": 2517} {"train_loss": -9.567283630371094, "global_step": 422928, "epoch": 2517} {"train_loss": -10.480840682983398, "global_step": 422929, "epoch": 2517} {"train_loss": -9.347631454467773, "global_step": 422930, "epoch": 2517} {"train_loss": -10.136909484863281, "global_step": 422931, "epoch": 2517} {"train_loss": -10.082221984863281, "global_step": 422932, "epoch": 2517} {"train_loss": -10.281930923461914, "global_step": 422933, "epoch": 2517} {"train_loss": -9.846840858459473, "global_step": 422934, "epoch": 2517} {"train_loss": -10.197916984558105, "global_step": 422935, "epoch": 2517} {"train_loss": -10.610006332397461, "global_step": 422936, "epoch": 2517} {"train_loss": -10.341039657592773, "global_step": 422937, "epoch": 2517} {"train_loss": -10.965048789978027, "global_step": 422938, "epoch": 2517} {"train_loss": -10.498581886291504, "global_step": 422939, "epoch": 2517} {"train_loss": -11.61338996887207, "global_step": 422940, "epoch": 2517} {"train_loss": -10.600645065307617, "global_step": 422941, "epoch": 2517} {"train_loss": -12.01164436340332, "global_step": 422942, "epoch": 2517} {"train_loss": -9.951338768005371, "global_step": 422943, "epoch": 2517} {"train_loss": -11.837248802185059, "global_step": 422944, "epoch": 2517} {"train_loss": -10.64836311340332, "global_step": 422945, "epoch": 2517} {"train_loss": -11.093280792236328, "global_step": 422946, "epoch": 2517} {"train_loss": -11.821413040161133, "global_step": 422947, "epoch": 2517} {"train_loss": -10.798137664794922, "global_step": 422948, "epoch": 2517} {"train_loss": -11.25174331665039, "global_step": 422949, "epoch": 2517} {"train_loss": -11.489500999450684, "global_step": 422950, "epoch": 2517} {"train_loss": -10.44943618774414, "global_step": 422951, "epoch": 2517} {"train_loss": -11.439912796020508, "global_step": 422952, "epoch": 2517} {"train_loss": -10.159431457519531, "global_step": 422953, "epoch": 2517} {"train_loss": -10.076886177062988, "global_step": 422954, "epoch": 2517} {"train_loss": -11.463467597961426, "global_step": 422955, "epoch": 2517} {"train_loss": -10.48104476928711, "global_step": 422956, "epoch": 2517} {"train_loss": -10.690959930419922, "global_step": 422957, "epoch": 2517} {"train_loss": -11.347671508789062, "global_step": 422958, "epoch": 2517} {"train_loss": -10.679407119750977, "global_step": 422959, "epoch": 2517} {"train_loss": -10.836138725280762, "global_step": 422960, "epoch": 2517} {"train_loss": -10.801822662353516, "global_step": 422961, "epoch": 2517} {"train_loss": -11.078545570373535, "global_step": 422962, "epoch": 2517} {"train_loss": -10.902824401855469, "global_step": 422963, "epoch": 2517} {"train_loss": -11.608400344848633, "global_step": 422964, "epoch": 2517} {"train_loss": -10.673042297363281, "global_step": 422965, "epoch": 2517} {"train_loss": -11.111709594726562, "global_step": 422966, "epoch": 2517} {"train_loss": -11.750368118286133, "global_step": 422967, "epoch": 2517} {"train_loss": -11.646125793457031, "global_step": 422968, "epoch": 2517} {"train_loss": -11.312644958496094, "global_step": 422969, "epoch": 2517} {"train_loss": -11.92856216430664, "global_step": 422970, "epoch": 2517} {"train_loss": -11.795970916748047, "global_step": 422971, "epoch": 2517} {"train_loss": -11.378097534179688, "global_step": 422972, "epoch": 2517} {"train_loss": -12.086341857910156, "global_step": 422973, "epoch": 2517} {"train_loss": -11.788361549377441, "global_step": 422974, "epoch": 2517} {"train_loss": -11.832453727722168, "global_step": 422975, "epoch": 2517} {"train_loss": -12.169769287109375, "global_step": 422976, "epoch": 2517} {"train_loss": -12.117630004882812, "global_step": 422977, "epoch": 2517} {"train_loss": -11.680564880371094, "global_step": 422978, "epoch": 2517} {"train_loss": -12.138893127441406, "global_step": 422979, "epoch": 2517} {"train_loss": -11.96261978149414, "global_step": 422980, "epoch": 2517} {"train_loss": -11.805286407470703, "global_step": 422981, "epoch": 2517} {"train_loss": -12.259174346923828, "global_step": 422982, "epoch": 2517} {"train_loss": -12.131638526916504, "global_step": 422983, "epoch": 2517} {"train_loss": -11.894469261169434, "global_step": 422984, "epoch": 2517} {"train_loss": -12.238655090332031, "global_step": 422985, "epoch": 2517} {"train_loss": -12.282649040222168, "global_step": 422986, "epoch": 2517} {"train_loss": -12.186655044555664, "global_step": 422987, "epoch": 2517} {"train_loss": -12.459381103515625, "global_step": 422988, "epoch": 2517} {"train_loss": -12.231395721435547, "global_step": 422989, "epoch": 2517} {"train_loss": -12.319795608520508, "global_step": 422990, "epoch": 2517} {"train_loss": -12.363383293151855, "global_step": 422991, "epoch": 2517} {"train_loss": -12.198936462402344, "global_step": 422992, "epoch": 2517} {"train_loss": -12.448619842529297, "global_step": 422993, "epoch": 2517} {"train_loss": -12.209938049316406, "global_step": 422994, "epoch": 2517} {"train_loss": -12.524478912353516, "global_step": 422995, "epoch": 2517} {"train_loss": -12.110908508300781, "global_step": 422996, "epoch": 2517} {"train_loss": -12.487382888793945, "global_step": 422997, "epoch": 2517} {"train_loss": -12.168582916259766, "global_step": 422998, "epoch": 2517} {"train_loss": -12.423444747924805, "global_step": 422999, "epoch": 2517} {"train_loss": -12.39146614074707, "global_step": 423000, "epoch": 2517} {"train_loss": -12.421869277954102, "global_step": 423001, "epoch": 2517} {"train_loss": -12.350164413452148, "global_step": 423002, "epoch": 2517} {"train_loss": -12.204898834228516, "global_step": 423003, "epoch": 2517} {"train_loss": -12.108372688293457, "global_step": 423004, "epoch": 2517} {"train_loss": -12.42128849029541, "global_step": 423005, "epoch": 2517} {"train_loss": -12.107728004455566, "global_step": 423006, "epoch": 2517} {"train_loss": -12.283331871032715, "global_step": 423007, "epoch": 2517} {"train_loss": -12.510110855102539, "global_step": 423008, "epoch": 2517} {"train_loss": -12.390081405639648, "global_step": 423009, "epoch": 2517} {"train_loss": -12.365026473999023, "global_step": 423010, "epoch": 2517} {"train_loss": -12.368221282958984, "global_step": 423011, "epoch": 2517} {"train_loss": -12.424774169921875, "global_step": 423012, "epoch": 2517} {"train_loss": -12.505623817443848, "global_step": 423013, "epoch": 2517} {"train_loss": -12.59146499633789, "global_step": 423014, "epoch": 2517} {"train_loss": -12.616918563842773, "global_step": 423015, "epoch": 2517} {"train_loss": -12.32522964477539, "global_step": 423016, "epoch": 2517} {"train_loss": -12.59205436706543, "global_step": 423017, "epoch": 2517} {"train_loss": -12.285611152648926, "global_step": 423018, "epoch": 2517} {"train_loss": -12.650190353393555, "global_step": 423019, "epoch": 2517} {"train_loss": -12.671857833862305, "global_step": 423020, "epoch": 2517} {"train_loss": -12.440223693847656, "global_step": 423021, "epoch": 2517} {"train_loss": -12.46407699584961, "global_step": 423022, "epoch": 2517} {"train_loss": -11.887239092872257, "global_step": 423023, "epoch": 2517, "val_loss": 309004.3125} {"train_loss": -12.810717582702637, "global_step": 423024, "epoch": 2518} {"train_loss": -12.681108474731445, "global_step": 423025, "epoch": 2518} {"train_loss": -12.631709098815918, "global_step": 423026, "epoch": 2518} {"train_loss": -12.644350051879883, "global_step": 423027, "epoch": 2518} {"train_loss": -12.750946998596191, "global_step": 423028, "epoch": 2518} {"train_loss": -12.66353988647461, "global_step": 423029, "epoch": 2518} {"train_loss": -12.74867057800293, "global_step": 423030, "epoch": 2518} {"train_loss": -12.55322551727295, "global_step": 423031, "epoch": 2518} {"train_loss": -12.382366180419922, "global_step": 423032, "epoch": 2518} {"train_loss": -12.651751518249512, "global_step": 423033, "epoch": 2518} {"train_loss": -12.90457534790039, "global_step": 423034, "epoch": 2518} {"train_loss": -12.530974388122559, "global_step": 423035, "epoch": 2518} {"train_loss": -12.826264381408691, "global_step": 423036, "epoch": 2518} {"train_loss": -12.754058837890625, "global_step": 423037, "epoch": 2518} {"train_loss": -12.7213134765625, "global_step": 423038, "epoch": 2518} {"train_loss": -12.245105743408203, "global_step": 423039, "epoch": 2518} {"train_loss": -11.438053131103516, "global_step": 423040, "epoch": 2518} {"train_loss": -11.72055435180664, "global_step": 423041, "epoch": 2518} {"train_loss": -12.555639266967773, "global_step": 423042, "epoch": 2518} {"train_loss": -12.187037467956543, "global_step": 423043, "epoch": 2518} {"train_loss": -11.020763397216797, "global_step": 423044, "epoch": 2518} {"train_loss": -10.207630157470703, "global_step": 423045, "epoch": 2518} {"train_loss": -11.891387939453125, "global_step": 423046, "epoch": 2518} {"train_loss": -11.981403350830078, "global_step": 423047, "epoch": 2518} {"train_loss": -10.6764554977417, "global_step": 423048, "epoch": 2518} {"train_loss": -11.735689163208008, "global_step": 423049, "epoch": 2518} {"train_loss": -12.167787551879883, "global_step": 423050, "epoch": 2518} {"train_loss": -12.015409469604492, "global_step": 423051, "epoch": 2518} {"train_loss": -12.245190620422363, "global_step": 423052, "epoch": 2518} {"train_loss": -12.25899887084961, "global_step": 423053, "epoch": 2518} {"train_loss": -12.31344223022461, "global_step": 423054, "epoch": 2518} {"train_loss": -11.87287712097168, "global_step": 423055, "epoch": 2518} {"train_loss": -12.492197036743164, "global_step": 423056, "epoch": 2518} {"train_loss": -11.708817481994629, "global_step": 423057, "epoch": 2518} {"train_loss": -12.404809951782227, "global_step": 423058, "epoch": 2518} {"train_loss": -11.414960861206055, "global_step": 423059, "epoch": 2518} {"train_loss": -12.220658302307129, "global_step": 423060, "epoch": 2518} {"train_loss": -11.088796615600586, "global_step": 423061, "epoch": 2518} {"train_loss": -12.328832626342773, "global_step": 423062, "epoch": 2518} {"train_loss": -11.641876220703125, "global_step": 423063, "epoch": 2518} {"train_loss": -11.43844985961914, "global_step": 423064, "epoch": 2518} {"train_loss": -12.13960075378418, "global_step": 423065, "epoch": 2518} {"train_loss": -11.120685577392578, "global_step": 423066, "epoch": 2518} {"train_loss": -11.734426498413086, "global_step": 423067, "epoch": 2518} {"train_loss": -11.914081573486328, "global_step": 423068, "epoch": 2518} {"train_loss": -11.773368835449219, "global_step": 423069, "epoch": 2518} {"train_loss": -11.786346435546875, "global_step": 423070, "epoch": 2518} {"train_loss": -12.62814998626709, "global_step": 423071, "epoch": 2518} {"train_loss": -11.468300819396973, "global_step": 423072, "epoch": 2518} {"train_loss": -11.755729675292969, "global_step": 423073, "epoch": 2518} {"train_loss": -11.446043014526367, "global_step": 423074, "epoch": 2518} {"train_loss": -11.907617568969727, "global_step": 423075, "epoch": 2518} {"train_loss": -11.631467819213867, "global_step": 423076, "epoch": 2518} {"train_loss": -11.945760726928711, "global_step": 423077, "epoch": 2518} {"train_loss": -12.023459434509277, "global_step": 423078, "epoch": 2518} {"train_loss": -12.094629287719727, "global_step": 423079, "epoch": 2518} {"train_loss": -12.008922576904297, "global_step": 423080, "epoch": 2518} {"train_loss": -11.76499080657959, "global_step": 423081, "epoch": 2518} {"train_loss": -12.423518180847168, "global_step": 423082, "epoch": 2518} {"train_loss": -11.224876403808594, "global_step": 423083, "epoch": 2518} {"train_loss": -12.118029594421387, "global_step": 423084, "epoch": 2518} {"train_loss": -11.54470443725586, "global_step": 423085, "epoch": 2518} {"train_loss": -11.475377082824707, "global_step": 423086, "epoch": 2518} {"train_loss": -12.348394393920898, "global_step": 423087, "epoch": 2518} {"train_loss": -11.658363342285156, "global_step": 423088, "epoch": 2518} {"train_loss": -12.373401641845703, "global_step": 423089, "epoch": 2518} {"train_loss": -12.173361778259277, "global_step": 423090, "epoch": 2518} {"train_loss": -12.4666166305542, "global_step": 423091, "epoch": 2518} {"train_loss": -12.424901008605957, "global_step": 423092, "epoch": 2518} {"train_loss": -12.094600677490234, "global_step": 423093, "epoch": 2518} {"train_loss": -12.3903226852417, "global_step": 423094, "epoch": 2518} {"train_loss": -12.587373733520508, "global_step": 423095, "epoch": 2518} {"train_loss": -12.322668075561523, "global_step": 423096, "epoch": 2518} {"train_loss": -12.502935409545898, "global_step": 423097, "epoch": 2518} {"train_loss": -12.314061164855957, "global_step": 423098, "epoch": 2518} {"train_loss": -12.471559524536133, "global_step": 423099, "epoch": 2518} {"train_loss": -12.403114318847656, "global_step": 423100, "epoch": 2518} {"train_loss": -12.661458969116211, "global_step": 423101, "epoch": 2518} {"train_loss": -12.447208404541016, "global_step": 423102, "epoch": 2518} {"train_loss": -12.644001007080078, "global_step": 423103, "epoch": 2518} {"train_loss": -12.414506912231445, "global_step": 423104, "epoch": 2518} {"train_loss": -12.272551536560059, "global_step": 423105, "epoch": 2518} {"train_loss": -12.3963623046875, "global_step": 423106, "epoch": 2518} {"train_loss": -12.545064926147461, "global_step": 423107, "epoch": 2518} {"train_loss": -12.532051086425781, "global_step": 423108, "epoch": 2518} {"train_loss": -12.497513771057129, "global_step": 423109, "epoch": 2518} {"train_loss": -12.378650665283203, "global_step": 423110, "epoch": 2518} {"train_loss": -12.306455612182617, "global_step": 423111, "epoch": 2518} {"train_loss": -11.977510452270508, "global_step": 423112, "epoch": 2518} {"train_loss": -12.437653541564941, "global_step": 423113, "epoch": 2518} {"train_loss": -12.0280122756958, "global_step": 423114, "epoch": 2518} {"train_loss": -12.43812370300293, "global_step": 423115, "epoch": 2518} {"train_loss": -12.301286697387695, "global_step": 423116, "epoch": 2518} {"train_loss": -12.43408489227295, "global_step": 423117, "epoch": 2518} {"train_loss": -12.333837509155273, "global_step": 423118, "epoch": 2518} {"train_loss": -12.160555839538574, "global_step": 423119, "epoch": 2518} {"train_loss": -11.549625396728516, "global_step": 423120, "epoch": 2518} {"train_loss": -12.380788803100586, "global_step": 423121, "epoch": 2518} {"train_loss": -11.895650863647461, "global_step": 423122, "epoch": 2518} {"train_loss": -11.491151809692383, "global_step": 423123, "epoch": 2518} {"train_loss": -12.567777633666992, "global_step": 423124, "epoch": 2518} {"train_loss": -11.62314224243164, "global_step": 423125, "epoch": 2518} {"train_loss": -10.877742767333984, "global_step": 423126, "epoch": 2518} {"train_loss": -12.600078582763672, "global_step": 423127, "epoch": 2518} {"train_loss": -11.63154411315918, "global_step": 423128, "epoch": 2518} {"train_loss": -12.28027629852295, "global_step": 423129, "epoch": 2518} {"train_loss": -11.802387237548828, "global_step": 423130, "epoch": 2518} {"train_loss": -12.02060604095459, "global_step": 423131, "epoch": 2518} {"train_loss": -12.288684844970703, "global_step": 423132, "epoch": 2518} {"train_loss": -12.085311889648438, "global_step": 423133, "epoch": 2518} {"train_loss": -12.453649520874023, "global_step": 423134, "epoch": 2518} {"train_loss": -12.070028305053711, "global_step": 423135, "epoch": 2518} {"train_loss": -12.359903335571289, "global_step": 423136, "epoch": 2518} {"train_loss": -12.31790542602539, "global_step": 423137, "epoch": 2518} {"train_loss": -11.86548900604248, "global_step": 423138, "epoch": 2518} {"train_loss": -12.416214942932129, "global_step": 423139, "epoch": 2518} {"train_loss": -12.258278846740723, "global_step": 423140, "epoch": 2518} {"train_loss": -12.430946350097656, "global_step": 423141, "epoch": 2518} {"train_loss": -12.183940887451172, "global_step": 423142, "epoch": 2518} {"train_loss": -12.440576553344727, "global_step": 423143, "epoch": 2518} {"train_loss": -12.579630851745605, "global_step": 423144, "epoch": 2518} {"train_loss": -12.136247634887695, "global_step": 423145, "epoch": 2518} {"train_loss": -12.192437171936035, "global_step": 423146, "epoch": 2518} {"train_loss": -12.023494720458984, "global_step": 423147, "epoch": 2518} {"train_loss": -12.187365531921387, "global_step": 423148, "epoch": 2518} {"train_loss": -12.220420837402344, "global_step": 423149, "epoch": 2518} {"train_loss": -12.198152542114258, "global_step": 423150, "epoch": 2518} {"train_loss": -12.03654670715332, "global_step": 423151, "epoch": 2518} {"train_loss": -11.91494083404541, "global_step": 423152, "epoch": 2518} {"train_loss": -12.499725341796875, "global_step": 423153, "epoch": 2518} {"train_loss": -12.584430694580078, "global_step": 423154, "epoch": 2518} {"train_loss": -11.570755004882812, "global_step": 423155, "epoch": 2518} {"train_loss": -12.211130142211914, "global_step": 423156, "epoch": 2518} {"train_loss": -11.844331741333008, "global_step": 423157, "epoch": 2518} {"train_loss": -11.862561225891113, "global_step": 423158, "epoch": 2518} {"train_loss": -11.550214767456055, "global_step": 423159, "epoch": 2518} {"train_loss": -12.608968734741211, "global_step": 423160, "epoch": 2518} {"train_loss": -11.925747871398926, "global_step": 423161, "epoch": 2518} {"train_loss": -12.465964317321777, "global_step": 423162, "epoch": 2518} {"train_loss": -12.348907470703125, "global_step": 423163, "epoch": 2518} {"train_loss": -12.60809326171875, "global_step": 423164, "epoch": 2518} {"train_loss": -12.295909881591797, "global_step": 423165, "epoch": 2518} {"train_loss": -12.525060653686523, "global_step": 423166, "epoch": 2518} {"train_loss": -12.628273010253906, "global_step": 423167, "epoch": 2518} {"train_loss": -12.564897537231445, "global_step": 423168, "epoch": 2518} {"train_loss": -12.793510437011719, "global_step": 423169, "epoch": 2518} {"train_loss": -12.331031799316406, "global_step": 423170, "epoch": 2518} {"train_loss": -12.633237838745117, "global_step": 423171, "epoch": 2518} {"train_loss": -12.61551284790039, "global_step": 423172, "epoch": 2518} {"train_loss": -12.012307167053223, "global_step": 423173, "epoch": 2518} {"train_loss": -12.516693115234375, "global_step": 423174, "epoch": 2518} {"train_loss": -12.496587753295898, "global_step": 423175, "epoch": 2518} {"train_loss": -12.476767539978027, "global_step": 423176, "epoch": 2518} {"train_loss": -12.517660140991211, "global_step": 423177, "epoch": 2518} {"train_loss": -12.299369812011719, "global_step": 423178, "epoch": 2518} {"train_loss": -12.566496849060059, "global_step": 423179, "epoch": 2518} {"train_loss": -12.459400177001953, "global_step": 423180, "epoch": 2518} {"train_loss": -12.271018981933594, "global_step": 423181, "epoch": 2518} {"train_loss": -12.143813133239746, "global_step": 423182, "epoch": 2518} {"train_loss": -12.611875534057617, "global_step": 423183, "epoch": 2518} {"train_loss": -12.006510734558105, "global_step": 423184, "epoch": 2518} {"train_loss": -12.417405128479004, "global_step": 423185, "epoch": 2518} {"train_loss": -11.471000671386719, "global_step": 423186, "epoch": 2518} {"train_loss": -12.36404037475586, "global_step": 423187, "epoch": 2518} {"train_loss": -12.021377563476562, "global_step": 423188, "epoch": 2518} {"train_loss": -12.681163787841797, "global_step": 423189, "epoch": 2518} {"train_loss": -11.828516006469727, "global_step": 423190, "epoch": 2518} {"train_loss": -12.170983791351318, "global_step": 423191, "epoch": 2518, "val_loss": 310707.59375} {"train_loss": -11.933061599731445, "global_step": 423192, "epoch": 2519} {"train_loss": -12.435270309448242, "global_step": 423193, "epoch": 2519} {"train_loss": -12.047612190246582, "global_step": 423194, "epoch": 2519} {"train_loss": -12.260149002075195, "global_step": 423195, "epoch": 2519} {"train_loss": -11.885826110839844, "global_step": 423196, "epoch": 2519} {"train_loss": -12.249921798706055, "global_step": 423197, "epoch": 2519} {"train_loss": -12.345254898071289, "global_step": 423198, "epoch": 2519} {"train_loss": -12.015289306640625, "global_step": 423199, "epoch": 2519} {"train_loss": -12.364001274108887, "global_step": 423200, "epoch": 2519} {"train_loss": -12.494267463684082, "global_step": 423201, "epoch": 2519} {"train_loss": -12.025594711303711, "global_step": 423202, "epoch": 2519} {"train_loss": -12.374061584472656, "global_step": 423203, "epoch": 2519} {"train_loss": -12.695305824279785, "global_step": 423204, "epoch": 2519} {"train_loss": -12.528830528259277, "global_step": 423205, "epoch": 2519} {"train_loss": -12.609260559082031, "global_step": 423206, "epoch": 2519} {"train_loss": -12.520842552185059, "global_step": 423207, "epoch": 2519} {"train_loss": -12.660724639892578, "global_step": 423208, "epoch": 2519} {"train_loss": -12.527395248413086, "global_step": 423209, "epoch": 2519} {"train_loss": -12.643495559692383, "global_step": 423210, "epoch": 2519} {"train_loss": -12.477767944335938, "global_step": 423211, "epoch": 2519} {"train_loss": -12.600493431091309, "global_step": 423212, "epoch": 2519} {"train_loss": -12.325847625732422, "global_step": 423213, "epoch": 2519} {"train_loss": -12.302864074707031, "global_step": 423214, "epoch": 2519} {"train_loss": -12.658153533935547, "global_step": 423215, "epoch": 2519} {"train_loss": -12.189250946044922, "global_step": 423216, "epoch": 2519} {"train_loss": -11.914472579956055, "global_step": 423217, "epoch": 2519} {"train_loss": -12.231547355651855, "global_step": 423218, "epoch": 2519} {"train_loss": -12.379218101501465, "global_step": 423219, "epoch": 2519} {"train_loss": -12.021230697631836, "global_step": 423220, "epoch": 2519} {"train_loss": -12.399261474609375, "global_step": 423221, "epoch": 2519} {"train_loss": -12.121578216552734, "global_step": 423222, "epoch": 2519} {"train_loss": -12.13170051574707, "global_step": 423223, "epoch": 2519} {"train_loss": -12.592819213867188, "global_step": 423224, "epoch": 2519} {"train_loss": -12.15247917175293, "global_step": 423225, "epoch": 2519} {"train_loss": -12.056219100952148, "global_step": 423226, "epoch": 2519} {"train_loss": -12.403863906860352, "global_step": 423227, "epoch": 2519} {"train_loss": -12.274490356445312, "global_step": 423228, "epoch": 2519} {"train_loss": -11.532537460327148, "global_step": 423229, "epoch": 2519} {"train_loss": -12.772587776184082, "global_step": 423230, "epoch": 2519} {"train_loss": -12.08962631225586, "global_step": 423231, "epoch": 2519} {"train_loss": -11.887420654296875, "global_step": 423232, "epoch": 2519} {"train_loss": -12.473468780517578, "global_step": 423233, "epoch": 2519} {"train_loss": -12.260852813720703, "global_step": 423234, "epoch": 2519} {"train_loss": -10.953093528747559, "global_step": 423235, "epoch": 2519} {"train_loss": -12.215136528015137, "global_step": 423236, "epoch": 2519} {"train_loss": -11.774571418762207, "global_step": 423237, "epoch": 2519} {"train_loss": -11.964008331298828, "global_step": 423238, "epoch": 2519} {"train_loss": -12.230209350585938, "global_step": 423239, "epoch": 2519} {"train_loss": -11.764715194702148, "global_step": 423240, "epoch": 2519} {"train_loss": -11.82913589477539, "global_step": 423241, "epoch": 2519} {"train_loss": -12.00741958618164, "global_step": 423242, "epoch": 2519} {"train_loss": -10.836278915405273, "global_step": 423243, "epoch": 2519} {"train_loss": -11.610885620117188, "global_step": 423244, "epoch": 2519} {"train_loss": -11.705108642578125, "global_step": 423245, "epoch": 2519} {"train_loss": -11.482236862182617, "global_step": 423246, "epoch": 2519} {"train_loss": -11.349517822265625, "global_step": 423247, "epoch": 2519} {"train_loss": -9.980416297912598, "global_step": 423248, "epoch": 2519} {"train_loss": -10.7305908203125, "global_step": 423249, "epoch": 2519} {"train_loss": -9.960237503051758, "global_step": 423250, "epoch": 2519} {"train_loss": -11.96284294128418, "global_step": 423251, "epoch": 2519} {"train_loss": -10.521860122680664, "global_step": 423252, "epoch": 2519} {"train_loss": -11.09625244140625, "global_step": 423253, "epoch": 2519} {"train_loss": -10.623617172241211, "global_step": 423254, "epoch": 2519} {"train_loss": -11.808676719665527, "global_step": 423255, "epoch": 2519} {"train_loss": -11.433720588684082, "global_step": 423256, "epoch": 2519} {"train_loss": -11.804362297058105, "global_step": 423257, "epoch": 2519} {"train_loss": -11.527299880981445, "global_step": 423258, "epoch": 2519} {"train_loss": -10.662259101867676, "global_step": 423259, "epoch": 2519} {"train_loss": -12.208624839782715, "global_step": 423260, "epoch": 2519} {"train_loss": -11.706345558166504, "global_step": 423261, "epoch": 2519} {"train_loss": -12.350818634033203, "global_step": 423262, "epoch": 2519} {"train_loss": -12.042012214660645, "global_step": 423263, "epoch": 2519} {"train_loss": -11.711544036865234, "global_step": 423264, "epoch": 2519} {"train_loss": -12.544631958007812, "global_step": 423265, "epoch": 2519} {"train_loss": -11.77558708190918, "global_step": 423266, "epoch": 2519} {"train_loss": -12.490514755249023, "global_step": 423267, "epoch": 2519} {"train_loss": -11.868680953979492, "global_step": 423268, "epoch": 2519} {"train_loss": -12.276291847229004, "global_step": 423269, "epoch": 2519} {"train_loss": -12.023938179016113, "global_step": 423270, "epoch": 2519} {"train_loss": -11.740474700927734, "global_step": 423271, "epoch": 2519} {"train_loss": -12.337520599365234, "global_step": 423272, "epoch": 2519} {"train_loss": -11.944658279418945, "global_step": 423273, "epoch": 2519} {"train_loss": -12.333837509155273, "global_step": 423274, "epoch": 2519} {"train_loss": -12.236074447631836, "global_step": 423275, "epoch": 2519} {"train_loss": -12.421587944030762, "global_step": 423276, "epoch": 2519} {"train_loss": -12.308976173400879, "global_step": 423277, "epoch": 2519} {"train_loss": -12.121942520141602, "global_step": 423278, "epoch": 2519} {"train_loss": -12.379684448242188, "global_step": 423279, "epoch": 2519} {"train_loss": -12.385492324829102, "global_step": 423280, "epoch": 2519} {"train_loss": -12.485817909240723, "global_step": 423281, "epoch": 2519} {"train_loss": -12.374945640563965, "global_step": 423282, "epoch": 2519} {"train_loss": -12.563922882080078, "global_step": 423283, "epoch": 2519} {"train_loss": -12.29107666015625, "global_step": 423284, "epoch": 2519} {"train_loss": -12.405519485473633, "global_step": 423285, "epoch": 2519} {"train_loss": -12.168073654174805, "global_step": 423286, "epoch": 2519} {"train_loss": -12.758440017700195, "global_step": 423287, "epoch": 2519} {"train_loss": -12.319031715393066, "global_step": 423288, "epoch": 2519} {"train_loss": -12.43341064453125, "global_step": 423289, "epoch": 2519} {"train_loss": -12.669750213623047, "global_step": 423290, "epoch": 2519} {"train_loss": -12.354969024658203, "global_step": 423291, "epoch": 2519} {"train_loss": -12.634760856628418, "global_step": 423292, "epoch": 2519} {"train_loss": -12.357620239257812, "global_step": 423293, "epoch": 2519} {"train_loss": -12.462285041809082, "global_step": 423294, "epoch": 2519} {"train_loss": -12.181746482849121, "global_step": 423295, "epoch": 2519} {"train_loss": -12.461289405822754, "global_step": 423296, "epoch": 2519} {"train_loss": -12.495138168334961, "global_step": 423297, "epoch": 2519} {"train_loss": -11.955342292785645, "global_step": 423298, "epoch": 2519} {"train_loss": -12.018150329589844, "global_step": 423299, "epoch": 2519} {"train_loss": -12.270748138427734, "global_step": 423300, "epoch": 2519} {"train_loss": -11.99498176574707, "global_step": 423301, "epoch": 2519} {"train_loss": -12.545080184936523, "global_step": 423302, "epoch": 2519} {"train_loss": -11.768284797668457, "global_step": 423303, "epoch": 2519} {"train_loss": -12.401466369628906, "global_step": 423304, "epoch": 2519} {"train_loss": -12.368870735168457, "global_step": 423305, "epoch": 2519} {"train_loss": -12.554847717285156, "global_step": 423306, "epoch": 2519} {"train_loss": -12.41130542755127, "global_step": 423307, "epoch": 2519} {"train_loss": -12.482746124267578, "global_step": 423308, "epoch": 2519} {"train_loss": -12.148502349853516, "global_step": 423309, "epoch": 2519} {"train_loss": -12.596782684326172, "global_step": 423310, "epoch": 2519} {"train_loss": -12.535652160644531, "global_step": 423311, "epoch": 2519} {"train_loss": -12.781915664672852, "global_step": 423312, "epoch": 2519} {"train_loss": -12.656890869140625, "global_step": 423313, "epoch": 2519} {"train_loss": -12.70545482635498, "global_step": 423314, "epoch": 2519} {"train_loss": -12.680379867553711, "global_step": 423315, "epoch": 2519} {"train_loss": -12.697608947753906, "global_step": 423316, "epoch": 2519} {"train_loss": -12.761127471923828, "global_step": 423317, "epoch": 2519} {"train_loss": -12.381745338439941, "global_step": 423318, "epoch": 2519} {"train_loss": -12.718616485595703, "global_step": 423319, "epoch": 2519} {"train_loss": -12.573089599609375, "global_step": 423320, "epoch": 2519} {"train_loss": -12.510650634765625, "global_step": 423321, "epoch": 2519} {"train_loss": -12.719629287719727, "global_step": 423322, "epoch": 2519} {"train_loss": -12.70943832397461, "global_step": 423323, "epoch": 2519} {"train_loss": -12.739143371582031, "global_step": 423324, "epoch": 2519} {"train_loss": -12.947169303894043, "global_step": 423325, "epoch": 2519} {"train_loss": -12.423721313476562, "global_step": 423326, "epoch": 2519} {"train_loss": -12.586530685424805, "global_step": 423327, "epoch": 2519} {"train_loss": -12.894521713256836, "global_step": 423328, "epoch": 2519} {"train_loss": -12.669052124023438, "global_step": 423329, "epoch": 2519} {"train_loss": -12.745603561401367, "global_step": 423330, "epoch": 2519} {"train_loss": -12.748268127441406, "global_step": 423331, "epoch": 2519} {"train_loss": -12.34854507446289, "global_step": 423332, "epoch": 2519} {"train_loss": -12.665855407714844, "global_step": 423333, "epoch": 2519} {"train_loss": -12.315888404846191, "global_step": 423334, "epoch": 2519} {"train_loss": -12.742032051086426, "global_step": 423335, "epoch": 2519} {"train_loss": -12.652008056640625, "global_step": 423336, "epoch": 2519} {"train_loss": -12.245246887207031, "global_step": 423337, "epoch": 2519} {"train_loss": -11.890949249267578, "global_step": 423338, "epoch": 2519} {"train_loss": -11.409707069396973, "global_step": 423339, "epoch": 2519} {"train_loss": -10.713171005249023, "global_step": 423340, "epoch": 2519} {"train_loss": -10.99303913116455, "global_step": 423341, "epoch": 2519} {"train_loss": -12.181246757507324, "global_step": 423342, "epoch": 2519} {"train_loss": -11.612152099609375, "global_step": 423343, "epoch": 2519} {"train_loss": -9.005047798156738, "global_step": 423344, "epoch": 2519} {"train_loss": -10.23300552368164, "global_step": 423345, "epoch": 2519} {"train_loss": -10.219574928283691, "global_step": 423346, "epoch": 2519} {"train_loss": -10.827936172485352, "global_step": 423347, "epoch": 2519} {"train_loss": -9.933505058288574, "global_step": 423348, "epoch": 2519} {"train_loss": -11.230173110961914, "global_step": 423349, "epoch": 2519} {"train_loss": -10.002325057983398, "global_step": 423350, "epoch": 2519} {"train_loss": -11.64809513092041, "global_step": 423351, "epoch": 2519} {"train_loss": -10.395163536071777, "global_step": 423352, "epoch": 2519} {"train_loss": -12.17143440246582, "global_step": 423353, "epoch": 2519} {"train_loss": -11.22172737121582, "global_step": 423354, "epoch": 2519} {"train_loss": -10.900866508483887, "global_step": 423355, "epoch": 2519} {"train_loss": -11.086898803710938, "global_step": 423356, "epoch": 2519} {"train_loss": -11.526119232177734, "global_step": 423357, "epoch": 2519} {"train_loss": -11.26313591003418, "global_step": 423358, "epoch": 2519} {"train_loss": -12.034247580028715, "global_step": 423359, "epoch": 2519, "val_loss": 307896.59375} {"train_loss": -11.091365814208984, "global_step": 423360, "epoch": 2520} {"train_loss": -11.827475547790527, "global_step": 423361, "epoch": 2520} {"train_loss": -10.494343757629395, "global_step": 423362, "epoch": 2520} {"train_loss": -11.894721031188965, "global_step": 423363, "epoch": 2520} {"train_loss": -11.125659942626953, "global_step": 423364, "epoch": 2520} {"train_loss": -11.522934913635254, "global_step": 423365, "epoch": 2520} {"train_loss": -11.823369979858398, "global_step": 423366, "epoch": 2520} {"train_loss": -11.645917892456055, "global_step": 423367, "epoch": 2520} {"train_loss": -11.835737228393555, "global_step": 423368, "epoch": 2520} {"train_loss": -11.727965354919434, "global_step": 423369, "epoch": 2520} {"train_loss": -11.80124282836914, "global_step": 423370, "epoch": 2520} {"train_loss": -12.22374439239502, "global_step": 423371, "epoch": 2520} {"train_loss": -12.065576553344727, "global_step": 423372, "epoch": 2520} {"train_loss": -12.448776245117188, "global_step": 423373, "epoch": 2520} {"train_loss": -12.137808799743652, "global_step": 423374, "epoch": 2520} {"train_loss": -11.650588989257812, "global_step": 423375, "epoch": 2520} {"train_loss": -12.243534088134766, "global_step": 423376, "epoch": 2520} {"train_loss": -12.197019577026367, "global_step": 423377, "epoch": 2520} {"train_loss": -12.201654434204102, "global_step": 423378, "epoch": 2520} {"train_loss": -12.364164352416992, "global_step": 423379, "epoch": 2520} {"train_loss": -12.044639587402344, "global_step": 423380, "epoch": 2520} {"train_loss": -12.16181468963623, "global_step": 423381, "epoch": 2520} {"train_loss": -12.075698852539062, "global_step": 423382, "epoch": 2520} {"train_loss": -12.450557708740234, "global_step": 423383, "epoch": 2520} {"train_loss": -11.93923568725586, "global_step": 423384, "epoch": 2520} {"train_loss": -12.461633682250977, "global_step": 423385, "epoch": 2520} {"train_loss": -12.280515670776367, "global_step": 423386, "epoch": 2520} {"train_loss": -12.488570213317871, "global_step": 423387, "epoch": 2520} {"train_loss": -12.4481840133667, "global_step": 423388, "epoch": 2520} {"train_loss": -12.170846939086914, "global_step": 423389, "epoch": 2520} {"train_loss": -12.19162368774414, "global_step": 423390, "epoch": 2520} {"train_loss": -12.156579971313477, "global_step": 423391, "epoch": 2520} {"train_loss": -12.556809425354004, "global_step": 423392, "epoch": 2520} {"train_loss": -12.298591613769531, "global_step": 423393, "epoch": 2520} {"train_loss": -12.458353042602539, "global_step": 423394, "epoch": 2520} {"train_loss": -12.622329711914062, "global_step": 423395, "epoch": 2520} {"train_loss": -12.368224143981934, "global_step": 423396, "epoch": 2520} {"train_loss": -12.532401084899902, "global_step": 423397, "epoch": 2520} {"train_loss": -12.411397933959961, "global_step": 423398, "epoch": 2520} {"train_loss": -12.586492538452148, "global_step": 423399, "epoch": 2520} {"train_loss": -12.267438888549805, "global_step": 423400, "epoch": 2520} {"train_loss": -12.406686782836914, "global_step": 423401, "epoch": 2520} {"train_loss": -12.577216148376465, "global_step": 423402, "epoch": 2520} {"train_loss": -12.562572479248047, "global_step": 423403, "epoch": 2520} {"train_loss": -12.572948455810547, "global_step": 423404, "epoch": 2520} {"train_loss": -12.542269706726074, "global_step": 423405, "epoch": 2520} {"train_loss": -12.793225288391113, "global_step": 423406, "epoch": 2520} {"train_loss": -12.568482398986816, "global_step": 423407, "epoch": 2520} {"train_loss": -12.37961483001709, "global_step": 423408, "epoch": 2520} {"train_loss": -12.626411437988281, "global_step": 423409, "epoch": 2520} {"train_loss": -12.668867111206055, "global_step": 423410, "epoch": 2520} {"train_loss": -12.620429039001465, "global_step": 423411, "epoch": 2520} {"train_loss": -12.72153091430664, "global_step": 423412, "epoch": 2520} {"train_loss": -12.566567420959473, "global_step": 423413, "epoch": 2520} {"train_loss": -12.703702926635742, "global_step": 423414, "epoch": 2520} {"train_loss": -12.506427764892578, "global_step": 423415, "epoch": 2520} {"train_loss": -12.665452003479004, "global_step": 423416, "epoch": 2520} {"train_loss": -12.4817476272583, "global_step": 423417, "epoch": 2520} {"train_loss": -12.745309829711914, "global_step": 423418, "epoch": 2520} {"train_loss": -12.614712715148926, "global_step": 423419, "epoch": 2520} {"train_loss": -12.731858253479004, "global_step": 423420, "epoch": 2520} {"train_loss": -12.48552131652832, "global_step": 423421, "epoch": 2520} {"train_loss": -12.613619804382324, "global_step": 423422, "epoch": 2520} {"train_loss": -12.57951545715332, "global_step": 423423, "epoch": 2520} {"train_loss": -12.66707706451416, "global_step": 423424, "epoch": 2520} {"train_loss": -12.570684432983398, "global_step": 423425, "epoch": 2520} {"train_loss": -12.61616325378418, "global_step": 423426, "epoch": 2520} {"train_loss": -12.235799789428711, "global_step": 423427, "epoch": 2520} {"train_loss": -12.643922805786133, "global_step": 423428, "epoch": 2520} {"train_loss": -13.001077651977539, "global_step": 423429, "epoch": 2520} {"train_loss": -12.563034057617188, "global_step": 423430, "epoch": 2520} {"train_loss": -12.503805160522461, "global_step": 423431, "epoch": 2520} {"train_loss": -12.81624984741211, "global_step": 423432, "epoch": 2520} {"train_loss": -12.805573463439941, "global_step": 423433, "epoch": 2520} {"train_loss": -12.609701156616211, "global_step": 423434, "epoch": 2520} {"train_loss": -12.732536315917969, "global_step": 423435, "epoch": 2520} {"train_loss": -12.622753143310547, "global_step": 423436, "epoch": 2520} {"train_loss": -12.61577033996582, "global_step": 423437, "epoch": 2520} {"train_loss": -12.545941352844238, "global_step": 423438, "epoch": 2520} {"train_loss": -12.664530754089355, "global_step": 423439, "epoch": 2520} {"train_loss": -12.531145095825195, "global_step": 423440, "epoch": 2520} {"train_loss": -12.407866477966309, "global_step": 423441, "epoch": 2520} {"train_loss": -12.577159881591797, "global_step": 423442, "epoch": 2520} {"train_loss": -12.535345077514648, "global_step": 423443, "epoch": 2520} {"train_loss": -12.705991744995117, "global_step": 423444, "epoch": 2520} {"train_loss": -12.205684661865234, "global_step": 423445, "epoch": 2520} {"train_loss": -12.532793045043945, "global_step": 423446, "epoch": 2520} {"train_loss": -12.0673828125, "global_step": 423447, "epoch": 2520} {"train_loss": -12.319000244140625, "global_step": 423448, "epoch": 2520} {"train_loss": -11.876679420471191, "global_step": 423449, "epoch": 2520} {"train_loss": -12.114794731140137, "global_step": 423450, "epoch": 2520} {"train_loss": -11.263681411743164, "global_step": 423451, "epoch": 2520} {"train_loss": -11.396142959594727, "global_step": 423452, "epoch": 2520} {"train_loss": -10.001649856567383, "global_step": 423453, "epoch": 2520} {"train_loss": -10.96010684967041, "global_step": 423454, "epoch": 2520} {"train_loss": -10.467090606689453, "global_step": 423455, "epoch": 2520} {"train_loss": -9.90333366394043, "global_step": 423456, "epoch": 2520} {"train_loss": -10.007782936096191, "global_step": 423457, "epoch": 2520} {"train_loss": -11.518795013427734, "global_step": 423458, "epoch": 2520} {"train_loss": -11.071150779724121, "global_step": 423459, "epoch": 2520} {"train_loss": -11.184040069580078, "global_step": 423460, "epoch": 2520} {"train_loss": -11.601365089416504, "global_step": 423461, "epoch": 2520} {"train_loss": -11.343090057373047, "global_step": 423462, "epoch": 2520} {"train_loss": -10.82381534576416, "global_step": 423463, "epoch": 2520} {"train_loss": -10.624507904052734, "global_step": 423464, "epoch": 2520} {"train_loss": -11.524818420410156, "global_step": 423465, "epoch": 2520} {"train_loss": -12.041744232177734, "global_step": 423466, "epoch": 2520} {"train_loss": -10.58139419555664, "global_step": 423467, "epoch": 2520} {"train_loss": -10.192145347595215, "global_step": 423468, "epoch": 2520} {"train_loss": -11.012664794921875, "global_step": 423469, "epoch": 2520} {"train_loss": -11.599939346313477, "global_step": 423470, "epoch": 2520} {"train_loss": -11.243823051452637, "global_step": 423471, "epoch": 2520} {"train_loss": -12.267045974731445, "global_step": 423472, "epoch": 2520} {"train_loss": -11.15088939666748, "global_step": 423473, "epoch": 2520} {"train_loss": -11.585054397583008, "global_step": 423474, "epoch": 2520} {"train_loss": -11.422350883483887, "global_step": 423475, "epoch": 2520} {"train_loss": -11.028838157653809, "global_step": 423476, "epoch": 2520} {"train_loss": -11.459346771240234, "global_step": 423477, "epoch": 2520} {"train_loss": -11.590320587158203, "global_step": 423478, "epoch": 2520} {"train_loss": -11.101271629333496, "global_step": 423479, "epoch": 2520} {"train_loss": -11.616921424865723, "global_step": 423480, "epoch": 2520} {"train_loss": -11.540264129638672, "global_step": 423481, "epoch": 2520} {"train_loss": -11.30179214477539, "global_step": 423482, "epoch": 2520} {"train_loss": -11.267247200012207, "global_step": 423483, "epoch": 2520} {"train_loss": -11.631624221801758, "global_step": 423484, "epoch": 2520} {"train_loss": -10.879813194274902, "global_step": 423485, "epoch": 2520} {"train_loss": -11.125716209411621, "global_step": 423486, "epoch": 2520} {"train_loss": -12.120779037475586, "global_step": 423487, "epoch": 2520} {"train_loss": -11.7706298828125, "global_step": 423488, "epoch": 2520} {"train_loss": -11.834117889404297, "global_step": 423489, "epoch": 2520} {"train_loss": -11.923728942871094, "global_step": 423490, "epoch": 2520} {"train_loss": -11.670957565307617, "global_step": 423491, "epoch": 2520} {"train_loss": -11.692378997802734, "global_step": 423492, "epoch": 2520} {"train_loss": -12.208786010742188, "global_step": 423493, "epoch": 2520} {"train_loss": -11.901531219482422, "global_step": 423494, "epoch": 2520} {"train_loss": -12.073290824890137, "global_step": 423495, "epoch": 2520} {"train_loss": -11.76036262512207, "global_step": 423496, "epoch": 2520} {"train_loss": -11.491832733154297, "global_step": 423497, "epoch": 2520} {"train_loss": -11.872766494750977, "global_step": 423498, "epoch": 2520} {"train_loss": -11.627496719360352, "global_step": 423499, "epoch": 2520} {"train_loss": -12.249029159545898, "global_step": 423500, "epoch": 2520} {"train_loss": -11.722497940063477, "global_step": 423501, "epoch": 2520} {"train_loss": -12.197866439819336, "global_step": 423502, "epoch": 2520} {"train_loss": -12.03419303894043, "global_step": 423503, "epoch": 2520} {"train_loss": -12.410755157470703, "global_step": 423504, "epoch": 2520} {"train_loss": -12.362079620361328, "global_step": 423505, "epoch": 2520} {"train_loss": -12.176979064941406, "global_step": 423506, "epoch": 2520} {"train_loss": -12.536452293395996, "global_step": 423507, "epoch": 2520} {"train_loss": -12.361464500427246, "global_step": 423508, "epoch": 2520} {"train_loss": -12.485530853271484, "global_step": 423509, "epoch": 2520} {"train_loss": -12.514361381530762, "global_step": 423510, "epoch": 2520} {"train_loss": -12.126737594604492, "global_step": 423511, "epoch": 2520} {"train_loss": -12.528924942016602, "global_step": 423512, "epoch": 2520} {"train_loss": -12.386842727661133, "global_step": 423513, "epoch": 2520} {"train_loss": -12.457340240478516, "global_step": 423514, "epoch": 2520} {"train_loss": -12.467192649841309, "global_step": 423515, "epoch": 2520} {"train_loss": -12.659443855285645, "global_step": 423516, "epoch": 2520} {"train_loss": -12.633197784423828, "global_step": 423517, "epoch": 2520} {"train_loss": -12.281511306762695, "global_step": 423518, "epoch": 2520} {"train_loss": -12.56743049621582, "global_step": 423519, "epoch": 2520} {"train_loss": -12.579326629638672, "global_step": 423520, "epoch": 2520} {"train_loss": -12.226101875305176, "global_step": 423521, "epoch": 2520} {"train_loss": -12.455971717834473, "global_step": 423522, "epoch": 2520} {"train_loss": -12.39741325378418, "global_step": 423523, "epoch": 2520} {"train_loss": -12.498319625854492, "global_step": 423524, "epoch": 2520} {"train_loss": -12.52059555053711, "global_step": 423525, "epoch": 2520} {"train_loss": -12.392080307006836, "global_step": 423526, "epoch": 2520} {"train_loss": -12.054528026353745, "global_step": 423527, "epoch": 2520, "val_loss": 308864.25, "train_action_mse_error": 2.2529296875} {"train_loss": -12.13027572631836, "global_step": 423528, "epoch": 2521} {"train_loss": -12.273822784423828, "global_step": 423529, "epoch": 2521} {"train_loss": -12.008613586425781, "global_step": 423530, "epoch": 2521} {"train_loss": -12.235881805419922, "global_step": 423531, "epoch": 2521} {"train_loss": -11.948047637939453, "global_step": 423532, "epoch": 2521} {"train_loss": -12.007955551147461, "global_step": 423533, "epoch": 2521} {"train_loss": -10.939825057983398, "global_step": 423534, "epoch": 2521} {"train_loss": -12.513055801391602, "global_step": 423535, "epoch": 2521} {"train_loss": -11.696348190307617, "global_step": 423536, "epoch": 2521} {"train_loss": -11.94869613647461, "global_step": 423537, "epoch": 2521} {"train_loss": -11.878150939941406, "global_step": 423538, "epoch": 2521} {"train_loss": -12.026893615722656, "global_step": 423539, "epoch": 2521} {"train_loss": -12.047679901123047, "global_step": 423540, "epoch": 2521} {"train_loss": -12.028999328613281, "global_step": 423541, "epoch": 2521} {"train_loss": -11.901042938232422, "global_step": 423542, "epoch": 2521} {"train_loss": -12.28019905090332, "global_step": 423543, "epoch": 2521} {"train_loss": -11.426126480102539, "global_step": 423544, "epoch": 2521} {"train_loss": -11.516660690307617, "global_step": 423545, "epoch": 2521} {"train_loss": -11.316740036010742, "global_step": 423546, "epoch": 2521} {"train_loss": -11.544022560119629, "global_step": 423547, "epoch": 2521} {"train_loss": -12.182219505310059, "global_step": 423548, "epoch": 2521} {"train_loss": -10.80255126953125, "global_step": 423549, "epoch": 2521} {"train_loss": -12.358965873718262, "global_step": 423550, "epoch": 2521} {"train_loss": -10.545522689819336, "global_step": 423551, "epoch": 2521} {"train_loss": -11.896973609924316, "global_step": 423552, "epoch": 2521} {"train_loss": -11.336559295654297, "global_step": 423553, "epoch": 2521} {"train_loss": -11.828883171081543, "global_step": 423554, "epoch": 2521} {"train_loss": -12.099983215332031, "global_step": 423555, "epoch": 2521} {"train_loss": -11.690818786621094, "global_step": 423556, "epoch": 2521} {"train_loss": -12.363276481628418, "global_step": 423557, "epoch": 2521} {"train_loss": -11.76553726196289, "global_step": 423558, "epoch": 2521} {"train_loss": -12.141504287719727, "global_step": 423559, "epoch": 2521} {"train_loss": -12.412690162658691, "global_step": 423560, "epoch": 2521} {"train_loss": -12.433609962463379, "global_step": 423561, "epoch": 2521} {"train_loss": -12.480596542358398, "global_step": 423562, "epoch": 2521} {"train_loss": -12.238068580627441, "global_step": 423563, "epoch": 2521} {"train_loss": -12.247369766235352, "global_step": 423564, "epoch": 2521} {"train_loss": -12.24834156036377, "global_step": 423565, "epoch": 2521} {"train_loss": -12.228606224060059, "global_step": 423566, "epoch": 2521} {"train_loss": -12.24421501159668, "global_step": 423567, "epoch": 2521} {"train_loss": -12.27168083190918, "global_step": 423568, "epoch": 2521} {"train_loss": -11.78715705871582, "global_step": 423569, "epoch": 2521} {"train_loss": -12.281296730041504, "global_step": 423570, "epoch": 2521} {"train_loss": -11.996807098388672, "global_step": 423571, "epoch": 2521} {"train_loss": -12.119508743286133, "global_step": 423572, "epoch": 2521} {"train_loss": -12.135208129882812, "global_step": 423573, "epoch": 2521} {"train_loss": -12.413829803466797, "global_step": 423574, "epoch": 2521} {"train_loss": -11.784261703491211, "global_step": 423575, "epoch": 2521} {"train_loss": -12.399263381958008, "global_step": 423576, "epoch": 2521} {"train_loss": -11.97311782836914, "global_step": 423577, "epoch": 2521} {"train_loss": -12.416460990905762, "global_step": 423578, "epoch": 2521} {"train_loss": -12.361515045166016, "global_step": 423579, "epoch": 2521} {"train_loss": -12.261627197265625, "global_step": 423580, "epoch": 2521} {"train_loss": -12.406417846679688, "global_step": 423581, "epoch": 2521} {"train_loss": -12.453344345092773, "global_step": 423582, "epoch": 2521} {"train_loss": -12.60193157196045, "global_step": 423583, "epoch": 2521} {"train_loss": -12.688966751098633, "global_step": 423584, "epoch": 2521} {"train_loss": -12.524274826049805, "global_step": 423585, "epoch": 2521} {"train_loss": -12.492410659790039, "global_step": 423586, "epoch": 2521} {"train_loss": -12.370325088500977, "global_step": 423587, "epoch": 2521} {"train_loss": -12.772501945495605, "global_step": 423588, "epoch": 2521} {"train_loss": -12.401494026184082, "global_step": 423589, "epoch": 2521} {"train_loss": -12.60987663269043, "global_step": 423590, "epoch": 2521} {"train_loss": -12.378637313842773, "global_step": 423591, "epoch": 2521} {"train_loss": -12.63267993927002, "global_step": 423592, "epoch": 2521} {"train_loss": -12.767467498779297, "global_step": 423593, "epoch": 2521} {"train_loss": -12.645238876342773, "global_step": 423594, "epoch": 2521} {"train_loss": -12.787336349487305, "global_step": 423595, "epoch": 2521} {"train_loss": -12.705915451049805, "global_step": 423596, "epoch": 2521} {"train_loss": -12.374260902404785, "global_step": 423597, "epoch": 2521} {"train_loss": -12.80671501159668, "global_step": 423598, "epoch": 2521} {"train_loss": -12.282432556152344, "global_step": 423599, "epoch": 2521} {"train_loss": -12.363351821899414, "global_step": 423600, "epoch": 2521} {"train_loss": -12.548040390014648, "global_step": 423601, "epoch": 2521} {"train_loss": -12.21153450012207, "global_step": 423602, "epoch": 2521} {"train_loss": -12.556009292602539, "global_step": 423603, "epoch": 2521} {"train_loss": -12.39756965637207, "global_step": 423604, "epoch": 2521} {"train_loss": -12.293325424194336, "global_step": 423605, "epoch": 2521} {"train_loss": -12.571264266967773, "global_step": 423606, "epoch": 2521} {"train_loss": -12.401369094848633, "global_step": 423607, "epoch": 2521} {"train_loss": -11.73866081237793, "global_step": 423608, "epoch": 2521} {"train_loss": -11.954578399658203, "global_step": 423609, "epoch": 2521} {"train_loss": -12.446621894836426, "global_step": 423610, "epoch": 2521} {"train_loss": -12.271462440490723, "global_step": 423611, "epoch": 2521} {"train_loss": -11.81207275390625, "global_step": 423612, "epoch": 2521} {"train_loss": -12.605627059936523, "global_step": 423613, "epoch": 2521} {"train_loss": -12.450159072875977, "global_step": 423614, "epoch": 2521} {"train_loss": -12.853461265563965, "global_step": 423615, "epoch": 2521} {"train_loss": -12.516914367675781, "global_step": 423616, "epoch": 2521} {"train_loss": -12.358254432678223, "global_step": 423617, "epoch": 2521} {"train_loss": -12.832215309143066, "global_step": 423618, "epoch": 2521} {"train_loss": -12.486030578613281, "global_step": 423619, "epoch": 2521} {"train_loss": -13.088480949401855, "global_step": 423620, "epoch": 2521} {"train_loss": -12.669301986694336, "global_step": 423621, "epoch": 2521} {"train_loss": -12.6795072555542, "global_step": 423622, "epoch": 2521} {"train_loss": -12.782115936279297, "global_step": 423623, "epoch": 2521} {"train_loss": -12.450733184814453, "global_step": 423624, "epoch": 2521} {"train_loss": -12.730846405029297, "global_step": 423625, "epoch": 2521} {"train_loss": -12.501882553100586, "global_step": 423626, "epoch": 2521} {"train_loss": -12.706792831420898, "global_step": 423627, "epoch": 2521} {"train_loss": -12.671751976013184, "global_step": 423628, "epoch": 2521} {"train_loss": -12.364227294921875, "global_step": 423629, "epoch": 2521} {"train_loss": -11.869054794311523, "global_step": 423630, "epoch": 2521} {"train_loss": -12.510185241699219, "global_step": 423631, "epoch": 2521} {"train_loss": -10.493480682373047, "global_step": 423632, "epoch": 2521} {"train_loss": -12.509828567504883, "global_step": 423633, "epoch": 2521} {"train_loss": -11.06921100616455, "global_step": 423634, "epoch": 2521} {"train_loss": -9.966699600219727, "global_step": 423635, "epoch": 2521} {"train_loss": -10.38468074798584, "global_step": 423636, "epoch": 2521} {"train_loss": -10.500823974609375, "global_step": 423637, "epoch": 2521} {"train_loss": -12.1391019821167, "global_step": 423638, "epoch": 2521} {"train_loss": -11.018110275268555, "global_step": 423639, "epoch": 2521} {"train_loss": -10.830577850341797, "global_step": 423640, "epoch": 2521} {"train_loss": -11.281721115112305, "global_step": 423641, "epoch": 2521} {"train_loss": -11.758281707763672, "global_step": 423642, "epoch": 2521} {"train_loss": -11.171300888061523, "global_step": 423643, "epoch": 2521} {"train_loss": -12.026325225830078, "global_step": 423644, "epoch": 2521} {"train_loss": -11.645179748535156, "global_step": 423645, "epoch": 2521} {"train_loss": -11.476824760437012, "global_step": 423646, "epoch": 2521} {"train_loss": -11.484481811523438, "global_step": 423647, "epoch": 2521} {"train_loss": -11.009368896484375, "global_step": 423648, "epoch": 2521} {"train_loss": -11.199739456176758, "global_step": 423649, "epoch": 2521} {"train_loss": -11.92357349395752, "global_step": 423650, "epoch": 2521} {"train_loss": -11.820228576660156, "global_step": 423651, "epoch": 2521} {"train_loss": -11.721145629882812, "global_step": 423652, "epoch": 2521} {"train_loss": -11.124670028686523, "global_step": 423653, "epoch": 2521} {"train_loss": -11.418359756469727, "global_step": 423654, "epoch": 2521} {"train_loss": -10.64837646484375, "global_step": 423655, "epoch": 2521} {"train_loss": -10.593174934387207, "global_step": 423656, "epoch": 2521} {"train_loss": -10.645395278930664, "global_step": 423657, "epoch": 2521} {"train_loss": -11.751470565795898, "global_step": 423658, "epoch": 2521} {"train_loss": -10.716484069824219, "global_step": 423659, "epoch": 2521} {"train_loss": -11.393865585327148, "global_step": 423660, "epoch": 2521} {"train_loss": -10.555076599121094, "global_step": 423661, "epoch": 2521} {"train_loss": -11.304351806640625, "global_step": 423662, "epoch": 2521} {"train_loss": -11.687748908996582, "global_step": 423663, "epoch": 2521} {"train_loss": -10.35776138305664, "global_step": 423664, "epoch": 2521} {"train_loss": -11.48244571685791, "global_step": 423665, "epoch": 2521} {"train_loss": -10.002753257751465, "global_step": 423666, "epoch": 2521} {"train_loss": -11.635340690612793, "global_step": 423667, "epoch": 2521} {"train_loss": -11.452787399291992, "global_step": 423668, "epoch": 2521} {"train_loss": -10.944663047790527, "global_step": 423669, "epoch": 2521} {"train_loss": -11.763551712036133, "global_step": 423670, "epoch": 2521} {"train_loss": -11.625893592834473, "global_step": 423671, "epoch": 2521} {"train_loss": -11.33957290649414, "global_step": 423672, "epoch": 2521} {"train_loss": -11.98093032836914, "global_step": 423673, "epoch": 2521} {"train_loss": -11.522965431213379, "global_step": 423674, "epoch": 2521} {"train_loss": -12.09835147857666, "global_step": 423675, "epoch": 2521} {"train_loss": -11.822460174560547, "global_step": 423676, "epoch": 2521} {"train_loss": -12.116796493530273, "global_step": 423677, "epoch": 2521} {"train_loss": -12.133442878723145, "global_step": 423678, "epoch": 2521} {"train_loss": -12.079654693603516, "global_step": 423679, "epoch": 2521} {"train_loss": -11.917264938354492, "global_step": 423680, "epoch": 2521} {"train_loss": -12.068496704101562, "global_step": 423681, "epoch": 2521} {"train_loss": -12.059261322021484, "global_step": 423682, "epoch": 2521} {"train_loss": -11.961601257324219, "global_step": 423683, "epoch": 2521} {"train_loss": -12.07497787475586, "global_step": 423684, "epoch": 2521} {"train_loss": -11.863847732543945, "global_step": 423685, "epoch": 2521} {"train_loss": -12.306205749511719, "global_step": 423686, "epoch": 2521} {"train_loss": -12.039756774902344, "global_step": 423687, "epoch": 2521} {"train_loss": -11.915950775146484, "global_step": 423688, "epoch": 2521} {"train_loss": -12.411144256591797, "global_step": 423689, "epoch": 2521} {"train_loss": -11.98332405090332, "global_step": 423690, "epoch": 2521} {"train_loss": -12.056821823120117, "global_step": 423691, "epoch": 2521} {"train_loss": -12.351310729980469, "global_step": 423692, "epoch": 2521} {"train_loss": -12.261898040771484, "global_step": 423693, "epoch": 2521} {"train_loss": -12.54046630859375, "global_step": 423694, "epoch": 2521} {"train_loss": -11.967612198420934, "global_step": 423695, "epoch": 2521, "val_loss": 310629.125} {"train_loss": -12.390438079833984, "global_step": 423696, "epoch": 2522} {"train_loss": -12.599580764770508, "global_step": 423697, "epoch": 2522} {"train_loss": -12.219776153564453, "global_step": 423698, "epoch": 2522} {"train_loss": -12.632665634155273, "global_step": 423699, "epoch": 2522} {"train_loss": -12.171550750732422, "global_step": 423700, "epoch": 2522} {"train_loss": -12.506647109985352, "global_step": 423701, "epoch": 2522} {"train_loss": -12.267629623413086, "global_step": 423702, "epoch": 2522} {"train_loss": -12.55461311340332, "global_step": 423703, "epoch": 2522} {"train_loss": -12.319801330566406, "global_step": 423704, "epoch": 2522} {"train_loss": -12.570976257324219, "global_step": 423705, "epoch": 2522} {"train_loss": -12.453065872192383, "global_step": 423706, "epoch": 2522} {"train_loss": -12.167648315429688, "global_step": 423707, "epoch": 2522} {"train_loss": -12.426311492919922, "global_step": 423708, "epoch": 2522} {"train_loss": -11.634735107421875, "global_step": 423709, "epoch": 2522} {"train_loss": -12.431377410888672, "global_step": 423710, "epoch": 2522} {"train_loss": -12.29704475402832, "global_step": 423711, "epoch": 2522} {"train_loss": -10.849361419677734, "global_step": 423712, "epoch": 2522} {"train_loss": -11.957500457763672, "global_step": 423713, "epoch": 2522} {"train_loss": -11.541372299194336, "global_step": 423714, "epoch": 2522} {"train_loss": -11.214441299438477, "global_step": 423715, "epoch": 2522} {"train_loss": -11.379992485046387, "global_step": 423716, "epoch": 2522} {"train_loss": -12.416332244873047, "global_step": 423717, "epoch": 2522} {"train_loss": -11.609342575073242, "global_step": 423718, "epoch": 2522} {"train_loss": -12.321650505065918, "global_step": 423719, "epoch": 2522} {"train_loss": -12.027398109436035, "global_step": 423720, "epoch": 2522} {"train_loss": -11.233787536621094, "global_step": 423721, "epoch": 2522} {"train_loss": -11.669118881225586, "global_step": 423722, "epoch": 2522} {"train_loss": -10.991691589355469, "global_step": 423723, "epoch": 2522} {"train_loss": -12.439743041992188, "global_step": 423724, "epoch": 2522} {"train_loss": -11.515670776367188, "global_step": 423725, "epoch": 2522} {"train_loss": -11.63656234741211, "global_step": 423726, "epoch": 2522} {"train_loss": -12.693442344665527, "global_step": 423727, "epoch": 2522} {"train_loss": -11.207204818725586, "global_step": 423728, "epoch": 2522} {"train_loss": -12.15311336517334, "global_step": 423729, "epoch": 2522} {"train_loss": -11.874113082885742, "global_step": 423730, "epoch": 2522} {"train_loss": -11.412496566772461, "global_step": 423731, "epoch": 2522} {"train_loss": -12.559761047363281, "global_step": 423732, "epoch": 2522} {"train_loss": -11.584833145141602, "global_step": 423733, "epoch": 2522} {"train_loss": -12.350893020629883, "global_step": 423734, "epoch": 2522} {"train_loss": -12.260660171508789, "global_step": 423735, "epoch": 2522} {"train_loss": -12.213062286376953, "global_step": 423736, "epoch": 2522} {"train_loss": -12.58787727355957, "global_step": 423737, "epoch": 2522} {"train_loss": -12.21630859375, "global_step": 423738, "epoch": 2522} {"train_loss": -12.274287223815918, "global_step": 423739, "epoch": 2522} {"train_loss": -12.082795143127441, "global_step": 423740, "epoch": 2522} {"train_loss": -11.94560432434082, "global_step": 423741, "epoch": 2522} {"train_loss": -12.021188735961914, "global_step": 423742, "epoch": 2522} {"train_loss": -11.584989547729492, "global_step": 423743, "epoch": 2522} {"train_loss": -11.183162689208984, "global_step": 423744, "epoch": 2522} {"train_loss": -11.023847579956055, "global_step": 423745, "epoch": 2522} {"train_loss": -12.313802719116211, "global_step": 423746, "epoch": 2522} {"train_loss": -10.983153343200684, "global_step": 423747, "epoch": 2522} {"train_loss": -11.351835250854492, "global_step": 423748, "epoch": 2522} {"train_loss": -11.693737030029297, "global_step": 423749, "epoch": 2522} {"train_loss": -11.66457462310791, "global_step": 423750, "epoch": 2522} {"train_loss": -12.038808822631836, "global_step": 423751, "epoch": 2522} {"train_loss": -11.708009719848633, "global_step": 423752, "epoch": 2522} {"train_loss": -12.156455993652344, "global_step": 423753, "epoch": 2522} {"train_loss": -12.122371673583984, "global_step": 423754, "epoch": 2522} {"train_loss": -12.450432777404785, "global_step": 423755, "epoch": 2522} {"train_loss": -11.688156127929688, "global_step": 423756, "epoch": 2522} {"train_loss": -11.857601165771484, "global_step": 423757, "epoch": 2522} {"train_loss": -12.476593017578125, "global_step": 423758, "epoch": 2522} {"train_loss": -11.609611511230469, "global_step": 423759, "epoch": 2522} {"train_loss": -12.349038124084473, "global_step": 423760, "epoch": 2522} {"train_loss": -12.30579948425293, "global_step": 423761, "epoch": 2522} {"train_loss": -12.135553359985352, "global_step": 423762, "epoch": 2522} {"train_loss": -12.48538589477539, "global_step": 423763, "epoch": 2522} {"train_loss": -12.279762268066406, "global_step": 423764, "epoch": 2522} {"train_loss": -12.27328872680664, "global_step": 423765, "epoch": 2522} {"train_loss": -12.237001419067383, "global_step": 423766, "epoch": 2522} {"train_loss": -12.301608085632324, "global_step": 423767, "epoch": 2522} {"train_loss": -12.405516624450684, "global_step": 423768, "epoch": 2522} {"train_loss": -12.58721923828125, "global_step": 423769, "epoch": 2522} {"train_loss": -12.345598220825195, "global_step": 423770, "epoch": 2522} {"train_loss": -12.475584983825684, "global_step": 423771, "epoch": 2522} {"train_loss": -12.136679649353027, "global_step": 423772, "epoch": 2522} {"train_loss": -12.50219440460205, "global_step": 423773, "epoch": 2522} {"train_loss": -12.535198211669922, "global_step": 423774, "epoch": 2522} {"train_loss": -12.24328327178955, "global_step": 423775, "epoch": 2522} {"train_loss": -12.61307430267334, "global_step": 423776, "epoch": 2522} {"train_loss": -12.662760734558105, "global_step": 423777, "epoch": 2522} {"train_loss": -12.641824722290039, "global_step": 423778, "epoch": 2522} {"train_loss": -12.52383041381836, "global_step": 423779, "epoch": 2522} {"train_loss": -12.538071632385254, "global_step": 423780, "epoch": 2522} {"train_loss": -12.7117919921875, "global_step": 423781, "epoch": 2522} {"train_loss": -12.714625358581543, "global_step": 423782, "epoch": 2522} {"train_loss": -12.855062484741211, "global_step": 423783, "epoch": 2522} {"train_loss": -12.364969253540039, "global_step": 423784, "epoch": 2522} {"train_loss": -12.522281646728516, "global_step": 423785, "epoch": 2522} {"train_loss": -12.58134651184082, "global_step": 423786, "epoch": 2522} {"train_loss": -12.69377326965332, "global_step": 423787, "epoch": 2522} {"train_loss": -12.42682933807373, "global_step": 423788, "epoch": 2522} {"train_loss": -12.657135963439941, "global_step": 423789, "epoch": 2522} {"train_loss": -12.592947006225586, "global_step": 423790, "epoch": 2522} {"train_loss": -12.655595779418945, "global_step": 423791, "epoch": 2522} {"train_loss": -12.733983993530273, "global_step": 423792, "epoch": 2522} {"train_loss": -12.803669929504395, "global_step": 423793, "epoch": 2522} {"train_loss": -12.541522979736328, "global_step": 423794, "epoch": 2522} {"train_loss": -12.283977508544922, "global_step": 423795, "epoch": 2522} {"train_loss": -12.744556427001953, "global_step": 423796, "epoch": 2522} {"train_loss": -12.62936019897461, "global_step": 423797, "epoch": 2522} {"train_loss": -12.52896499633789, "global_step": 423798, "epoch": 2522} {"train_loss": -12.50219440460205, "global_step": 423799, "epoch": 2522} {"train_loss": -12.744229316711426, "global_step": 423800, "epoch": 2522} {"train_loss": -12.619056701660156, "global_step": 423801, "epoch": 2522} {"train_loss": -12.93519401550293, "global_step": 423802, "epoch": 2522} {"train_loss": -12.522256851196289, "global_step": 423803, "epoch": 2522} {"train_loss": -12.644063949584961, "global_step": 423804, "epoch": 2522} {"train_loss": -12.718974113464355, "global_step": 423805, "epoch": 2522} {"train_loss": -12.57400131225586, "global_step": 423806, "epoch": 2522} {"train_loss": -12.775028228759766, "global_step": 423807, "epoch": 2522} {"train_loss": -12.744295120239258, "global_step": 423808, "epoch": 2522} {"train_loss": -12.63510513305664, "global_step": 423809, "epoch": 2522} {"train_loss": -12.4203519821167, "global_step": 423810, "epoch": 2522} {"train_loss": -12.733101844787598, "global_step": 423811, "epoch": 2522} {"train_loss": -12.691983222961426, "global_step": 423812, "epoch": 2522} {"train_loss": -12.296274185180664, "global_step": 423813, "epoch": 2522} {"train_loss": -12.449579238891602, "global_step": 423814, "epoch": 2522} {"train_loss": -12.433629989624023, "global_step": 423815, "epoch": 2522} {"train_loss": -12.386991500854492, "global_step": 423816, "epoch": 2522} {"train_loss": -11.902128219604492, "global_step": 423817, "epoch": 2522} {"train_loss": -12.54986572265625, "global_step": 423818, "epoch": 2522} {"train_loss": -12.490596771240234, "global_step": 423819, "epoch": 2522} {"train_loss": -12.425077438354492, "global_step": 423820, "epoch": 2522} {"train_loss": -12.9183988571167, "global_step": 423821, "epoch": 2522} {"train_loss": -12.387547492980957, "global_step": 423822, "epoch": 2522} {"train_loss": -12.103517532348633, "global_step": 423823, "epoch": 2522} {"train_loss": -12.317587852478027, "global_step": 423824, "epoch": 2522} {"train_loss": -12.98527717590332, "global_step": 423825, "epoch": 2522} {"train_loss": -12.698264122009277, "global_step": 423826, "epoch": 2522} {"train_loss": -12.153791427612305, "global_step": 423827, "epoch": 2522} {"train_loss": -12.635557174682617, "global_step": 423828, "epoch": 2522} {"train_loss": -12.550844192504883, "global_step": 423829, "epoch": 2522} {"train_loss": -12.419095993041992, "global_step": 423830, "epoch": 2522} {"train_loss": -12.626372337341309, "global_step": 423831, "epoch": 2522} {"train_loss": -12.796998977661133, "global_step": 423832, "epoch": 2522} {"train_loss": -12.110824584960938, "global_step": 423833, "epoch": 2522} {"train_loss": -11.624672889709473, "global_step": 423834, "epoch": 2522} {"train_loss": -12.592382431030273, "global_step": 423835, "epoch": 2522} {"train_loss": -12.359823226928711, "global_step": 423836, "epoch": 2522} {"train_loss": -11.833023071289062, "global_step": 423837, "epoch": 2522} {"train_loss": -12.59644889831543, "global_step": 423838, "epoch": 2522} {"train_loss": -12.432600021362305, "global_step": 423839, "epoch": 2522} {"train_loss": -12.535123825073242, "global_step": 423840, "epoch": 2522} {"train_loss": -12.309980392456055, "global_step": 423841, "epoch": 2522} {"train_loss": -12.564273834228516, "global_step": 423842, "epoch": 2522} {"train_loss": -12.797762870788574, "global_step": 423843, "epoch": 2522} {"train_loss": -12.309871673583984, "global_step": 423844, "epoch": 2522} {"train_loss": -12.545661926269531, "global_step": 423845, "epoch": 2522} {"train_loss": -12.68674373626709, "global_step": 423846, "epoch": 2522} {"train_loss": -12.060416221618652, "global_step": 423847, "epoch": 2522} {"train_loss": -12.388769149780273, "global_step": 423848, "epoch": 2522} {"train_loss": -12.54796028137207, "global_step": 423849, "epoch": 2522} {"train_loss": -12.633318901062012, "global_step": 423850, "epoch": 2522} {"train_loss": -12.786323547363281, "global_step": 423851, "epoch": 2522} {"train_loss": -12.299423217773438, "global_step": 423852, "epoch": 2522} {"train_loss": -12.53455924987793, "global_step": 423853, "epoch": 2522} {"train_loss": -12.429950714111328, "global_step": 423854, "epoch": 2522} {"train_loss": -12.803961753845215, "global_step": 423855, "epoch": 2522} {"train_loss": -12.66343879699707, "global_step": 423856, "epoch": 2522} {"train_loss": -11.66530704498291, "global_step": 423857, "epoch": 2522} {"train_loss": -12.67471981048584, "global_step": 423858, "epoch": 2522} {"train_loss": -12.838485717773438, "global_step": 423859, "epoch": 2522} {"train_loss": -12.294652938842773, "global_step": 423860, "epoch": 2522} {"train_loss": -11.641756057739258, "global_step": 423861, "epoch": 2522} {"train_loss": -12.32590389251709, "global_step": 423862, "epoch": 2522} {"train_loss": -12.288428380375816, "global_step": 423863, "epoch": 2522, "val_loss": 307573.21875} {"train_loss": -11.81960678100586, "global_step": 423864, "epoch": 2523} {"train_loss": -11.21926498413086, "global_step": 423865, "epoch": 2523} {"train_loss": -11.591836929321289, "global_step": 423866, "epoch": 2523} {"train_loss": -11.891268730163574, "global_step": 423867, "epoch": 2523} {"train_loss": -11.966604232788086, "global_step": 423868, "epoch": 2523} {"train_loss": -12.087017059326172, "global_step": 423869, "epoch": 2523} {"train_loss": -11.184621810913086, "global_step": 423870, "epoch": 2523} {"train_loss": -11.816132545471191, "global_step": 423871, "epoch": 2523} {"train_loss": -11.08734130859375, "global_step": 423872, "epoch": 2523} {"train_loss": -9.78160285949707, "global_step": 423873, "epoch": 2523} {"train_loss": -10.58161735534668, "global_step": 423874, "epoch": 2523} {"train_loss": -10.407655715942383, "global_step": 423875, "epoch": 2523} {"train_loss": -10.016645431518555, "global_step": 423876, "epoch": 2523} {"train_loss": -9.965595245361328, "global_step": 423877, "epoch": 2523} {"train_loss": -11.459325790405273, "global_step": 423878, "epoch": 2523} {"train_loss": -10.682378768920898, "global_step": 423879, "epoch": 2523} {"train_loss": -11.908537864685059, "global_step": 423880, "epoch": 2523} {"train_loss": -10.434795379638672, "global_step": 423881, "epoch": 2523} {"train_loss": -9.831328392028809, "global_step": 423882, "epoch": 2523} {"train_loss": -11.607498168945312, "global_step": 423883, "epoch": 2523} {"train_loss": -9.838272094726562, "global_step": 423884, "epoch": 2523} {"train_loss": -10.222678184509277, "global_step": 423885, "epoch": 2523} {"train_loss": -11.562500953674316, "global_step": 423886, "epoch": 2523} {"train_loss": -10.865890502929688, "global_step": 423887, "epoch": 2523} {"train_loss": -10.78326416015625, "global_step": 423888, "epoch": 2523} {"train_loss": -11.524009704589844, "global_step": 423889, "epoch": 2523} {"train_loss": -11.058256149291992, "global_step": 423890, "epoch": 2523} {"train_loss": -10.656858444213867, "global_step": 423891, "epoch": 2523} {"train_loss": -11.840075492858887, "global_step": 423892, "epoch": 2523} {"train_loss": -10.494217872619629, "global_step": 423893, "epoch": 2523} {"train_loss": -11.18731689453125, "global_step": 423894, "epoch": 2523} {"train_loss": -10.017407417297363, "global_step": 423895, "epoch": 2523} {"train_loss": -10.981927871704102, "global_step": 423896, "epoch": 2523} {"train_loss": -9.404340744018555, "global_step": 423897, "epoch": 2523} {"train_loss": -10.977540969848633, "global_step": 423898, "epoch": 2523} {"train_loss": -10.240281105041504, "global_step": 423899, "epoch": 2523} {"train_loss": -10.747758865356445, "global_step": 423900, "epoch": 2523} {"train_loss": -10.65090560913086, "global_step": 423901, "epoch": 2523} {"train_loss": -11.778345108032227, "global_step": 423902, "epoch": 2523} {"train_loss": -10.273171424865723, "global_step": 423903, "epoch": 2523} {"train_loss": -11.88649845123291, "global_step": 423904, "epoch": 2523} {"train_loss": -11.076899528503418, "global_step": 423905, "epoch": 2523} {"train_loss": -11.496484756469727, "global_step": 423906, "epoch": 2523} {"train_loss": -11.719650268554688, "global_step": 423907, "epoch": 2523} {"train_loss": -11.631790161132812, "global_step": 423908, "epoch": 2523} {"train_loss": -11.189952850341797, "global_step": 423909, "epoch": 2523} {"train_loss": -11.834855079650879, "global_step": 423910, "epoch": 2523} {"train_loss": -11.362958908081055, "global_step": 423911, "epoch": 2523} {"train_loss": -11.531598091125488, "global_step": 423912, "epoch": 2523} {"train_loss": -11.66619873046875, "global_step": 423913, "epoch": 2523} {"train_loss": -11.445585250854492, "global_step": 423914, "epoch": 2523} {"train_loss": -11.969426155090332, "global_step": 423915, "epoch": 2523} {"train_loss": -11.91378402709961, "global_step": 423916, "epoch": 2523} {"train_loss": -11.714067459106445, "global_step": 423917, "epoch": 2523} {"train_loss": -11.563342094421387, "global_step": 423918, "epoch": 2523} {"train_loss": -11.86147689819336, "global_step": 423919, "epoch": 2523} {"train_loss": -12.022150039672852, "global_step": 423920, "epoch": 2523} {"train_loss": -12.149808883666992, "global_step": 423921, "epoch": 2523} {"train_loss": -11.712156295776367, "global_step": 423922, "epoch": 2523} {"train_loss": -12.136316299438477, "global_step": 423923, "epoch": 2523} {"train_loss": -11.551582336425781, "global_step": 423924, "epoch": 2523} {"train_loss": -11.650863647460938, "global_step": 423925, "epoch": 2523} {"train_loss": -12.24837589263916, "global_step": 423926, "epoch": 2523} {"train_loss": -10.93576431274414, "global_step": 423927, "epoch": 2523} {"train_loss": -11.853032112121582, "global_step": 423928, "epoch": 2523} {"train_loss": -10.728675842285156, "global_step": 423929, "epoch": 2523} {"train_loss": -11.747360229492188, "global_step": 423930, "epoch": 2523} {"train_loss": -11.441516876220703, "global_step": 423931, "epoch": 2523} {"train_loss": -11.476615905761719, "global_step": 423932, "epoch": 2523} {"train_loss": -11.104574203491211, "global_step": 423933, "epoch": 2523} {"train_loss": -12.159334182739258, "global_step": 423934, "epoch": 2523} {"train_loss": -11.588495254516602, "global_step": 423935, "epoch": 2523} {"train_loss": -11.998237609863281, "global_step": 423936, "epoch": 2523} {"train_loss": -12.060515403747559, "global_step": 423937, "epoch": 2523} {"train_loss": -12.024993896484375, "global_step": 423938, "epoch": 2523} {"train_loss": -12.013822555541992, "global_step": 423939, "epoch": 2523} {"train_loss": -12.056652069091797, "global_step": 423940, "epoch": 2523} {"train_loss": -12.094989776611328, "global_step": 423941, "epoch": 2523} {"train_loss": -11.934829711914062, "global_step": 423942, "epoch": 2523} {"train_loss": -12.174139022827148, "global_step": 423943, "epoch": 2523} {"train_loss": -12.415916442871094, "global_step": 423944, "epoch": 2523} {"train_loss": -12.342584609985352, "global_step": 423945, "epoch": 2523} {"train_loss": -12.351423263549805, "global_step": 423946, "epoch": 2523} {"train_loss": -12.269569396972656, "global_step": 423947, "epoch": 2523} {"train_loss": -12.447904586791992, "global_step": 423948, "epoch": 2523} {"train_loss": -12.486783027648926, "global_step": 423949, "epoch": 2523} {"train_loss": -12.567195892333984, "global_step": 423950, "epoch": 2523} {"train_loss": -12.265846252441406, "global_step": 423951, "epoch": 2523} {"train_loss": -12.498211860656738, "global_step": 423952, "epoch": 2523} {"train_loss": -12.592849731445312, "global_step": 423953, "epoch": 2523} {"train_loss": -12.424101829528809, "global_step": 423954, "epoch": 2523} {"train_loss": -12.534101486206055, "global_step": 423955, "epoch": 2523} {"train_loss": -12.450889587402344, "global_step": 423956, "epoch": 2523} {"train_loss": -12.561580657958984, "global_step": 423957, "epoch": 2523} {"train_loss": -12.430242538452148, "global_step": 423958, "epoch": 2523} {"train_loss": -12.737594604492188, "global_step": 423959, "epoch": 2523} {"train_loss": -12.448746681213379, "global_step": 423960, "epoch": 2523} {"train_loss": -12.585975646972656, "global_step": 423961, "epoch": 2523} {"train_loss": -12.2860746383667, "global_step": 423962, "epoch": 2523} {"train_loss": -12.531158447265625, "global_step": 423963, "epoch": 2523} {"train_loss": -12.558852195739746, "global_step": 423964, "epoch": 2523} {"train_loss": -12.564436912536621, "global_step": 423965, "epoch": 2523} {"train_loss": -12.835161209106445, "global_step": 423966, "epoch": 2523} {"train_loss": -12.720864295959473, "global_step": 423967, "epoch": 2523} {"train_loss": -12.26972770690918, "global_step": 423968, "epoch": 2523} {"train_loss": -12.702569961547852, "global_step": 423969, "epoch": 2523} {"train_loss": -12.514755249023438, "global_step": 423970, "epoch": 2523} {"train_loss": -12.542167663574219, "global_step": 423971, "epoch": 2523} {"train_loss": -12.726602554321289, "global_step": 423972, "epoch": 2523} {"train_loss": -12.585460662841797, "global_step": 423973, "epoch": 2523} {"train_loss": -12.712345123291016, "global_step": 423974, "epoch": 2523} {"train_loss": -12.403841018676758, "global_step": 423975, "epoch": 2523} {"train_loss": -12.70866584777832, "global_step": 423976, "epoch": 2523} {"train_loss": -12.542328834533691, "global_step": 423977, "epoch": 2523} {"train_loss": -12.521590232849121, "global_step": 423978, "epoch": 2523} {"train_loss": -12.587656021118164, "global_step": 423979, "epoch": 2523} {"train_loss": -12.737096786499023, "global_step": 423980, "epoch": 2523} {"train_loss": -12.581586837768555, "global_step": 423981, "epoch": 2523} {"train_loss": -12.794927597045898, "global_step": 423982, "epoch": 2523} {"train_loss": -12.596992492675781, "global_step": 423983, "epoch": 2523} {"train_loss": -12.450030326843262, "global_step": 423984, "epoch": 2523} {"train_loss": -12.551175117492676, "global_step": 423985, "epoch": 2523} {"train_loss": -12.641779899597168, "global_step": 423986, "epoch": 2523} {"train_loss": -12.623286247253418, "global_step": 423987, "epoch": 2523} {"train_loss": -12.552064895629883, "global_step": 423988, "epoch": 2523} {"train_loss": -12.548978805541992, "global_step": 423989, "epoch": 2523} {"train_loss": -12.714421272277832, "global_step": 423990, "epoch": 2523} {"train_loss": -12.705793380737305, "global_step": 423991, "epoch": 2523} {"train_loss": -12.395809173583984, "global_step": 423992, "epoch": 2523} {"train_loss": -12.840560913085938, "global_step": 423993, "epoch": 2523} {"train_loss": -12.611717224121094, "global_step": 423994, "epoch": 2523} {"train_loss": -12.777069091796875, "global_step": 423995, "epoch": 2523} {"train_loss": -12.41541576385498, "global_step": 423996, "epoch": 2523} {"train_loss": -12.86146354675293, "global_step": 423997, "epoch": 2523} {"train_loss": -12.614319801330566, "global_step": 423998, "epoch": 2523} {"train_loss": -12.673210144042969, "global_step": 423999, "epoch": 2523} {"train_loss": -12.546097755432129, "global_step": 424000, "epoch": 2523} {"train_loss": -12.393695831298828, "global_step": 424001, "epoch": 2523} {"train_loss": -12.694043159484863, "global_step": 424002, "epoch": 2523} {"train_loss": -12.05097770690918, "global_step": 424003, "epoch": 2523} {"train_loss": -12.145033836364746, "global_step": 424004, "epoch": 2523} {"train_loss": -11.962194442749023, "global_step": 424005, "epoch": 2523} {"train_loss": -11.647834777832031, "global_step": 424006, "epoch": 2523} {"train_loss": -10.876482963562012, "global_step": 424007, "epoch": 2523} {"train_loss": -12.66534423828125, "global_step": 424008, "epoch": 2523} {"train_loss": -10.69198226928711, "global_step": 424009, "epoch": 2523} {"train_loss": -11.079526901245117, "global_step": 424010, "epoch": 2523} {"train_loss": -11.472485542297363, "global_step": 424011, "epoch": 2523} {"train_loss": -11.385347366333008, "global_step": 424012, "epoch": 2523} {"train_loss": -12.342439651489258, "global_step": 424013, "epoch": 2523} {"train_loss": -11.858501434326172, "global_step": 424014, "epoch": 2523} {"train_loss": -12.199817657470703, "global_step": 424015, "epoch": 2523} {"train_loss": -12.029613494873047, "global_step": 424016, "epoch": 2523} {"train_loss": -12.500011444091797, "global_step": 424017, "epoch": 2523} {"train_loss": -11.642379760742188, "global_step": 424018, "epoch": 2523} {"train_loss": -12.211055755615234, "global_step": 424019, "epoch": 2523} {"train_loss": -12.212760925292969, "global_step": 424020, "epoch": 2523} {"train_loss": -11.228988647460938, "global_step": 424021, "epoch": 2523} {"train_loss": -11.893582344055176, "global_step": 424022, "epoch": 2523} {"train_loss": -12.579429626464844, "global_step": 424023, "epoch": 2523} {"train_loss": -12.152960777282715, "global_step": 424024, "epoch": 2523} {"train_loss": -12.623605728149414, "global_step": 424025, "epoch": 2523} {"train_loss": -12.541423797607422, "global_step": 424026, "epoch": 2523} {"train_loss": -12.17662239074707, "global_step": 424027, "epoch": 2523} {"train_loss": -12.443211555480957, "global_step": 424028, "epoch": 2523} {"train_loss": -12.379261016845703, "global_step": 424029, "epoch": 2523} {"train_loss": -11.594301223754883, "global_step": 424030, "epoch": 2523} {"train_loss": -11.863424494152977, "global_step": 424031, "epoch": 2523, "val_loss": 310133.3125} {"train_loss": -11.453988075256348, "global_step": 424032, "epoch": 2524} {"train_loss": -11.771347999572754, "global_step": 424033, "epoch": 2524} {"train_loss": -12.60955810546875, "global_step": 424034, "epoch": 2524} {"train_loss": -12.00367546081543, "global_step": 424035, "epoch": 2524} {"train_loss": -11.67335319519043, "global_step": 424036, "epoch": 2524} {"train_loss": -12.583858489990234, "global_step": 424037, "epoch": 2524} {"train_loss": -12.211145401000977, "global_step": 424038, "epoch": 2524} {"train_loss": -12.111756324768066, "global_step": 424039, "epoch": 2524} {"train_loss": -12.309446334838867, "global_step": 424040, "epoch": 2524} {"train_loss": -12.26458740234375, "global_step": 424041, "epoch": 2524} {"train_loss": -12.388956069946289, "global_step": 424042, "epoch": 2524} {"train_loss": -12.594104766845703, "global_step": 424043, "epoch": 2524} {"train_loss": -12.508074760437012, "global_step": 424044, "epoch": 2524} {"train_loss": -12.291372299194336, "global_step": 424045, "epoch": 2524} {"train_loss": -12.209549903869629, "global_step": 424046, "epoch": 2524} {"train_loss": -12.454656600952148, "global_step": 424047, "epoch": 2524} {"train_loss": -11.883441925048828, "global_step": 424048, "epoch": 2524} {"train_loss": -12.277633666992188, "global_step": 424049, "epoch": 2524} {"train_loss": -11.722681999206543, "global_step": 424050, "epoch": 2524} {"train_loss": -12.168615341186523, "global_step": 424051, "epoch": 2524} {"train_loss": -11.744220733642578, "global_step": 424052, "epoch": 2524} {"train_loss": -12.492488861083984, "global_step": 424053, "epoch": 2524} {"train_loss": -12.47799015045166, "global_step": 424054, "epoch": 2524} {"train_loss": -12.430913925170898, "global_step": 424055, "epoch": 2524} {"train_loss": -12.156328201293945, "global_step": 424056, "epoch": 2524} {"train_loss": -12.375168800354004, "global_step": 424057, "epoch": 2524} {"train_loss": -12.301810264587402, "global_step": 424058, "epoch": 2524} {"train_loss": -12.364892959594727, "global_step": 424059, "epoch": 2524} {"train_loss": -12.512001037597656, "global_step": 424060, "epoch": 2524} {"train_loss": -12.292484283447266, "global_step": 424061, "epoch": 2524} {"train_loss": -12.275344848632812, "global_step": 424062, "epoch": 2524} {"train_loss": -12.475205421447754, "global_step": 424063, "epoch": 2524} {"train_loss": -12.394899368286133, "global_step": 424064, "epoch": 2524} {"train_loss": -11.204513549804688, "global_step": 424065, "epoch": 2524} {"train_loss": -12.3667631149292, "global_step": 424066, "epoch": 2524} {"train_loss": -12.190386772155762, "global_step": 424067, "epoch": 2524} {"train_loss": -12.221540451049805, "global_step": 424068, "epoch": 2524} {"train_loss": -12.409805297851562, "global_step": 424069, "epoch": 2524} {"train_loss": -12.262056350708008, "global_step": 424070, "epoch": 2524} {"train_loss": -11.485739707946777, "global_step": 424071, "epoch": 2524} {"train_loss": -12.528484344482422, "global_step": 424072, "epoch": 2524} {"train_loss": -11.917632102966309, "global_step": 424073, "epoch": 2524} {"train_loss": -12.017986297607422, "global_step": 424074, "epoch": 2524} {"train_loss": -11.482837677001953, "global_step": 424075, "epoch": 2524} {"train_loss": -12.043686866760254, "global_step": 424076, "epoch": 2524} {"train_loss": -11.718297958374023, "global_step": 424077, "epoch": 2524} {"train_loss": -12.451520919799805, "global_step": 424078, "epoch": 2524} {"train_loss": -12.197588920593262, "global_step": 424079, "epoch": 2524} {"train_loss": -12.143630981445312, "global_step": 424080, "epoch": 2524} {"train_loss": -11.645654678344727, "global_step": 424081, "epoch": 2524} {"train_loss": -11.947030067443848, "global_step": 424082, "epoch": 2524} {"train_loss": -12.15802001953125, "global_step": 424083, "epoch": 2524} {"train_loss": -11.557516098022461, "global_step": 424084, "epoch": 2524} {"train_loss": -11.795799255371094, "global_step": 424085, "epoch": 2524} {"train_loss": -11.434484481811523, "global_step": 424086, "epoch": 2524} {"train_loss": -11.421993255615234, "global_step": 424087, "epoch": 2524} {"train_loss": -11.736310958862305, "global_step": 424088, "epoch": 2524} {"train_loss": -12.188969612121582, "global_step": 424089, "epoch": 2524} {"train_loss": -11.553385734558105, "global_step": 424090, "epoch": 2524} {"train_loss": -12.315231323242188, "global_step": 424091, "epoch": 2524} {"train_loss": -11.666511535644531, "global_step": 424092, "epoch": 2524} {"train_loss": -12.172751426696777, "global_step": 424093, "epoch": 2524} {"train_loss": -12.338637351989746, "global_step": 424094, "epoch": 2524} {"train_loss": -12.143453598022461, "global_step": 424095, "epoch": 2524} {"train_loss": -12.022693634033203, "global_step": 424096, "epoch": 2524} {"train_loss": -12.225990295410156, "global_step": 424097, "epoch": 2524} {"train_loss": -11.617378234863281, "global_step": 424098, "epoch": 2524} {"train_loss": -12.390872955322266, "global_step": 424099, "epoch": 2524} {"train_loss": -12.178406715393066, "global_step": 424100, "epoch": 2524} {"train_loss": -12.28924560546875, "global_step": 424101, "epoch": 2524} {"train_loss": -12.268050193786621, "global_step": 424102, "epoch": 2524} {"train_loss": -12.185312271118164, "global_step": 424103, "epoch": 2524} {"train_loss": -12.051799774169922, "global_step": 424104, "epoch": 2524} {"train_loss": -12.125777244567871, "global_step": 424105, "epoch": 2524} {"train_loss": -11.745626449584961, "global_step": 424106, "epoch": 2524} {"train_loss": -11.629968643188477, "global_step": 424107, "epoch": 2524} {"train_loss": -12.188643455505371, "global_step": 424108, "epoch": 2524} {"train_loss": -10.87757396697998, "global_step": 424109, "epoch": 2524} {"train_loss": -12.319604873657227, "global_step": 424110, "epoch": 2524} {"train_loss": -11.13890266418457, "global_step": 424111, "epoch": 2524} {"train_loss": -11.669110298156738, "global_step": 424112, "epoch": 2524} {"train_loss": -11.785409927368164, "global_step": 424113, "epoch": 2524} {"train_loss": -10.69723892211914, "global_step": 424114, "epoch": 2524} {"train_loss": -11.373555183410645, "global_step": 424115, "epoch": 2524} {"train_loss": -11.370780944824219, "global_step": 424116, "epoch": 2524} {"train_loss": -10.872430801391602, "global_step": 424117, "epoch": 2524} {"train_loss": -11.990608215332031, "global_step": 424118, "epoch": 2524} {"train_loss": -11.644033432006836, "global_step": 424119, "epoch": 2524} {"train_loss": -11.746904373168945, "global_step": 424120, "epoch": 2524} {"train_loss": -11.839235305786133, "global_step": 424121, "epoch": 2524} {"train_loss": -11.601543426513672, "global_step": 424122, "epoch": 2524} {"train_loss": -11.976238250732422, "global_step": 424123, "epoch": 2524} {"train_loss": -11.747289657592773, "global_step": 424124, "epoch": 2524} {"train_loss": -12.105429649353027, "global_step": 424125, "epoch": 2524} {"train_loss": -11.637420654296875, "global_step": 424126, "epoch": 2524} {"train_loss": -11.672343254089355, "global_step": 424127, "epoch": 2524} {"train_loss": -12.142674446105957, "global_step": 424128, "epoch": 2524} {"train_loss": -11.470797538757324, "global_step": 424129, "epoch": 2524} {"train_loss": -12.30431079864502, "global_step": 424130, "epoch": 2524} {"train_loss": -11.681011199951172, "global_step": 424131, "epoch": 2524} {"train_loss": -11.924524307250977, "global_step": 424132, "epoch": 2524} {"train_loss": -11.917648315429688, "global_step": 424133, "epoch": 2524} {"train_loss": -11.846015930175781, "global_step": 424134, "epoch": 2524} {"train_loss": -11.812880516052246, "global_step": 424135, "epoch": 2524} {"train_loss": -12.01639461517334, "global_step": 424136, "epoch": 2524} {"train_loss": -12.03652572631836, "global_step": 424137, "epoch": 2524} {"train_loss": -12.391594886779785, "global_step": 424138, "epoch": 2524} {"train_loss": -11.842188835144043, "global_step": 424139, "epoch": 2524} {"train_loss": -12.350387573242188, "global_step": 424140, "epoch": 2524} {"train_loss": -11.882487297058105, "global_step": 424141, "epoch": 2524} {"train_loss": -12.309244155883789, "global_step": 424142, "epoch": 2524} {"train_loss": -12.014509201049805, "global_step": 424143, "epoch": 2524} {"train_loss": -11.776958465576172, "global_step": 424144, "epoch": 2524} {"train_loss": -11.624418258666992, "global_step": 424145, "epoch": 2524} {"train_loss": -11.127294540405273, "global_step": 424146, "epoch": 2524} {"train_loss": -11.969459533691406, "global_step": 424147, "epoch": 2524} {"train_loss": -10.880170822143555, "global_step": 424148, "epoch": 2524} {"train_loss": -11.871606826782227, "global_step": 424149, "epoch": 2524} {"train_loss": -11.233192443847656, "global_step": 424150, "epoch": 2524} {"train_loss": -11.720970153808594, "global_step": 424151, "epoch": 2524} {"train_loss": -11.554069519042969, "global_step": 424152, "epoch": 2524} {"train_loss": -11.899410247802734, "global_step": 424153, "epoch": 2524} {"train_loss": -11.822887420654297, "global_step": 424154, "epoch": 2524} {"train_loss": -11.820839881896973, "global_step": 424155, "epoch": 2524} {"train_loss": -12.123153686523438, "global_step": 424156, "epoch": 2524} {"train_loss": -12.094700813293457, "global_step": 424157, "epoch": 2524} {"train_loss": -12.24307918548584, "global_step": 424158, "epoch": 2524} {"train_loss": -11.997726440429688, "global_step": 424159, "epoch": 2524} {"train_loss": -12.334623336791992, "global_step": 424160, "epoch": 2524} {"train_loss": -12.226728439331055, "global_step": 424161, "epoch": 2524} {"train_loss": -12.288888931274414, "global_step": 424162, "epoch": 2524} {"train_loss": -12.290839195251465, "global_step": 424163, "epoch": 2524} {"train_loss": -12.390107154846191, "global_step": 424164, "epoch": 2524} {"train_loss": -12.327493667602539, "global_step": 424165, "epoch": 2524} {"train_loss": -12.4306640625, "global_step": 424166, "epoch": 2524} {"train_loss": -12.506954193115234, "global_step": 424167, "epoch": 2524} {"train_loss": -12.448392868041992, "global_step": 424168, "epoch": 2524} {"train_loss": -12.508367538452148, "global_step": 424169, "epoch": 2524} {"train_loss": -12.36530590057373, "global_step": 424170, "epoch": 2524} {"train_loss": -12.60209846496582, "global_step": 424171, "epoch": 2524} {"train_loss": -12.474020957946777, "global_step": 424172, "epoch": 2524} {"train_loss": -12.183303833007812, "global_step": 424173, "epoch": 2524} {"train_loss": -12.672954559326172, "global_step": 424174, "epoch": 2524} {"train_loss": -12.474296569824219, "global_step": 424175, "epoch": 2524} {"train_loss": -12.687458992004395, "global_step": 424176, "epoch": 2524} {"train_loss": -12.44430160522461, "global_step": 424177, "epoch": 2524} {"train_loss": -12.55911636352539, "global_step": 424178, "epoch": 2524} {"train_loss": -12.56097412109375, "global_step": 424179, "epoch": 2524} {"train_loss": -12.510241508483887, "global_step": 424180, "epoch": 2524} {"train_loss": -12.779483795166016, "global_step": 424181, "epoch": 2524} {"train_loss": -12.261474609375, "global_step": 424182, "epoch": 2524} {"train_loss": -12.543407440185547, "global_step": 424183, "epoch": 2524} {"train_loss": -12.38115119934082, "global_step": 424184, "epoch": 2524} {"train_loss": -12.505352020263672, "global_step": 424185, "epoch": 2524} {"train_loss": -12.661874771118164, "global_step": 424186, "epoch": 2524} {"train_loss": -12.054941177368164, "global_step": 424187, "epoch": 2524} {"train_loss": -12.607475280761719, "global_step": 424188, "epoch": 2524} {"train_loss": -12.438127517700195, "global_step": 424189, "epoch": 2524} {"train_loss": -12.556809425354004, "global_step": 424190, "epoch": 2524} {"train_loss": -12.578344345092773, "global_step": 424191, "epoch": 2524} {"train_loss": -12.328299522399902, "global_step": 424192, "epoch": 2524} {"train_loss": -12.598146438598633, "global_step": 424193, "epoch": 2524} {"train_loss": -12.390838623046875, "global_step": 424194, "epoch": 2524} {"train_loss": -12.373037338256836, "global_step": 424195, "epoch": 2524} {"train_loss": -12.396900177001953, "global_step": 424196, "epoch": 2524} {"train_loss": -12.533939361572266, "global_step": 424197, "epoch": 2524} {"train_loss": -12.673417091369629, "global_step": 424198, "epoch": 2524} {"train_loss": -12.081471954073224, "global_step": 424199, "epoch": 2524, "val_loss": 311186.71875} {"train_loss": -12.549470901489258, "global_step": 424200, "epoch": 2525} {"train_loss": -12.274174690246582, "global_step": 424201, "epoch": 2525} {"train_loss": -12.097352981567383, "global_step": 424202, "epoch": 2525} {"train_loss": -12.624075889587402, "global_step": 424203, "epoch": 2525} {"train_loss": -12.026681900024414, "global_step": 424204, "epoch": 2525} {"train_loss": -12.623741149902344, "global_step": 424205, "epoch": 2525} {"train_loss": -12.172866821289062, "global_step": 424206, "epoch": 2525} {"train_loss": -12.227449417114258, "global_step": 424207, "epoch": 2525} {"train_loss": -12.471495628356934, "global_step": 424208, "epoch": 2525} {"train_loss": -11.398462295532227, "global_step": 424209, "epoch": 2525} {"train_loss": -12.274234771728516, "global_step": 424210, "epoch": 2525} {"train_loss": -12.567605018615723, "global_step": 424211, "epoch": 2525} {"train_loss": -11.287145614624023, "global_step": 424212, "epoch": 2525} {"train_loss": -12.215530395507812, "global_step": 424213, "epoch": 2525} {"train_loss": -12.163544654846191, "global_step": 424214, "epoch": 2525} {"train_loss": -12.499938011169434, "global_step": 424215, "epoch": 2525} {"train_loss": -12.15190315246582, "global_step": 424216, "epoch": 2525} {"train_loss": -12.363099098205566, "global_step": 424217, "epoch": 2525} {"train_loss": -12.312919616699219, "global_step": 424218, "epoch": 2525} {"train_loss": -12.359193801879883, "global_step": 424219, "epoch": 2525} {"train_loss": -12.505685806274414, "global_step": 424220, "epoch": 2525} {"train_loss": -12.297992706298828, "global_step": 424221, "epoch": 2525} {"train_loss": -12.813153266906738, "global_step": 424222, "epoch": 2525} {"train_loss": -12.558963775634766, "global_step": 424223, "epoch": 2525} {"train_loss": -12.661800384521484, "global_step": 424224, "epoch": 2525} {"train_loss": -12.815828323364258, "global_step": 424225, "epoch": 2525} {"train_loss": -12.274813652038574, "global_step": 424226, "epoch": 2525} {"train_loss": -12.415504455566406, "global_step": 424227, "epoch": 2525} {"train_loss": -12.794390678405762, "global_step": 424228, "epoch": 2525} {"train_loss": -12.561304092407227, "global_step": 424229, "epoch": 2525} {"train_loss": -12.840977668762207, "global_step": 424230, "epoch": 2525} {"train_loss": -12.671037673950195, "global_step": 424231, "epoch": 2525} {"train_loss": -12.782547950744629, "global_step": 424232, "epoch": 2525} {"train_loss": -12.626522064208984, "global_step": 424233, "epoch": 2525} {"train_loss": -12.81660270690918, "global_step": 424234, "epoch": 2525} {"train_loss": -12.536359786987305, "global_step": 424235, "epoch": 2525} {"train_loss": -12.777144432067871, "global_step": 424236, "epoch": 2525} {"train_loss": -12.329462051391602, "global_step": 424237, "epoch": 2525} {"train_loss": -12.432622909545898, "global_step": 424238, "epoch": 2525} {"train_loss": -12.915386199951172, "global_step": 424239, "epoch": 2525} {"train_loss": -12.448089599609375, "global_step": 424240, "epoch": 2525} {"train_loss": -12.787801742553711, "global_step": 424241, "epoch": 2525} {"train_loss": -12.805231094360352, "global_step": 424242, "epoch": 2525} {"train_loss": -12.740803718566895, "global_step": 424243, "epoch": 2525} {"train_loss": -12.767675399780273, "global_step": 424244, "epoch": 2525} {"train_loss": -12.947604179382324, "global_step": 424245, "epoch": 2525} {"train_loss": -12.815893173217773, "global_step": 424246, "epoch": 2525} {"train_loss": -12.640909194946289, "global_step": 424247, "epoch": 2525} {"train_loss": -12.50219440460205, "global_step": 424248, "epoch": 2525} {"train_loss": -12.460203170776367, "global_step": 424249, "epoch": 2525} {"train_loss": -12.562524795532227, "global_step": 424250, "epoch": 2525} {"train_loss": -11.968829154968262, "global_step": 424251, "epoch": 2525} {"train_loss": -12.1557035446167, "global_step": 424252, "epoch": 2525} {"train_loss": -12.11557388305664, "global_step": 424253, "epoch": 2525} {"train_loss": -12.43101978302002, "global_step": 424254, "epoch": 2525} {"train_loss": -12.184350967407227, "global_step": 424255, "epoch": 2525} {"train_loss": -11.514551162719727, "global_step": 424256, "epoch": 2525} {"train_loss": -12.804793357849121, "global_step": 424257, "epoch": 2525} {"train_loss": -12.079645156860352, "global_step": 424258, "epoch": 2525} {"train_loss": -12.247400283813477, "global_step": 424259, "epoch": 2525} {"train_loss": -12.646038055419922, "global_step": 424260, "epoch": 2525} {"train_loss": -12.577203750610352, "global_step": 424261, "epoch": 2525} {"train_loss": -12.186439514160156, "global_step": 424262, "epoch": 2525} {"train_loss": -12.649761199951172, "global_step": 424263, "epoch": 2525} {"train_loss": -12.441519737243652, "global_step": 424264, "epoch": 2525} {"train_loss": -12.76211166381836, "global_step": 424265, "epoch": 2525} {"train_loss": -12.037160873413086, "global_step": 424266, "epoch": 2525} {"train_loss": -12.004914283752441, "global_step": 424267, "epoch": 2525} {"train_loss": -11.846641540527344, "global_step": 424268, "epoch": 2525} {"train_loss": -10.086158752441406, "global_step": 424269, "epoch": 2525} {"train_loss": -11.052538871765137, "global_step": 424270, "epoch": 2525} {"train_loss": -11.986040115356445, "global_step": 424271, "epoch": 2525} {"train_loss": -9.827892303466797, "global_step": 424272, "epoch": 2525} {"train_loss": -11.462403297424316, "global_step": 424273, "epoch": 2525} {"train_loss": -9.192651748657227, "global_step": 424274, "epoch": 2525} {"train_loss": -10.68212890625, "global_step": 424275, "epoch": 2525} {"train_loss": -10.026605606079102, "global_step": 424276, "epoch": 2525} {"train_loss": -10.282308578491211, "global_step": 424277, "epoch": 2525} {"train_loss": -10.63723087310791, "global_step": 424278, "epoch": 2525} {"train_loss": -10.216702461242676, "global_step": 424279, "epoch": 2525} {"train_loss": -10.11307430267334, "global_step": 424280, "epoch": 2525} {"train_loss": -11.089339256286621, "global_step": 424281, "epoch": 2525} {"train_loss": -11.065496444702148, "global_step": 424282, "epoch": 2525} {"train_loss": -9.247087478637695, "global_step": 424283, "epoch": 2525} {"train_loss": -11.211637496948242, "global_step": 424284, "epoch": 2525} {"train_loss": -10.400615692138672, "global_step": 424285, "epoch": 2525} {"train_loss": -11.229647636413574, "global_step": 424286, "epoch": 2525} {"train_loss": -8.940975189208984, "global_step": 424287, "epoch": 2525} {"train_loss": -9.92220687866211, "global_step": 424288, "epoch": 2525} {"train_loss": -11.214494705200195, "global_step": 424289, "epoch": 2525} {"train_loss": -7.706301212310791, "global_step": 424290, "epoch": 2525} {"train_loss": -9.629098892211914, "global_step": 424291, "epoch": 2525} {"train_loss": -9.751031875610352, "global_step": 424292, "epoch": 2525} {"train_loss": -8.690361022949219, "global_step": 424293, "epoch": 2525} {"train_loss": -8.589207649230957, "global_step": 424294, "epoch": 2525} {"train_loss": -7.619649887084961, "global_step": 424295, "epoch": 2525} {"train_loss": -8.266887664794922, "global_step": 424296, "epoch": 2525} {"train_loss": -8.870399475097656, "global_step": 424297, "epoch": 2525} {"train_loss": -9.846269607543945, "global_step": 424298, "epoch": 2525} {"train_loss": -9.457178115844727, "global_step": 424299, "epoch": 2525} {"train_loss": -9.414237976074219, "global_step": 424300, "epoch": 2525} {"train_loss": -10.10159683227539, "global_step": 424301, "epoch": 2525} {"train_loss": -10.522656440734863, "global_step": 424302, "epoch": 2525} {"train_loss": -10.596473693847656, "global_step": 424303, "epoch": 2525} {"train_loss": -10.820886611938477, "global_step": 424304, "epoch": 2525} {"train_loss": -10.95212173461914, "global_step": 424305, "epoch": 2525} {"train_loss": -10.911405563354492, "global_step": 424306, "epoch": 2525} {"train_loss": -11.142923355102539, "global_step": 424307, "epoch": 2525} {"train_loss": -11.420781135559082, "global_step": 424308, "epoch": 2525} {"train_loss": -11.269872665405273, "global_step": 424309, "epoch": 2525} {"train_loss": -11.38824462890625, "global_step": 424310, "epoch": 2525} {"train_loss": -11.738805770874023, "global_step": 424311, "epoch": 2525} {"train_loss": -11.874433517456055, "global_step": 424312, "epoch": 2525} {"train_loss": -11.875850677490234, "global_step": 424313, "epoch": 2525} {"train_loss": -12.00547981262207, "global_step": 424314, "epoch": 2525} {"train_loss": -11.545623779296875, "global_step": 424315, "epoch": 2525} {"train_loss": -11.730514526367188, "global_step": 424316, "epoch": 2525} {"train_loss": -11.791598320007324, "global_step": 424317, "epoch": 2525} {"train_loss": -11.842784881591797, "global_step": 424318, "epoch": 2525} {"train_loss": -11.881307601928711, "global_step": 424319, "epoch": 2525} {"train_loss": -11.968633651733398, "global_step": 424320, "epoch": 2525} {"train_loss": -12.070526123046875, "global_step": 424321, "epoch": 2525} {"train_loss": -12.178434371948242, "global_step": 424322, "epoch": 2525} {"train_loss": -12.150656700134277, "global_step": 424323, "epoch": 2525} {"train_loss": -12.123380661010742, "global_step": 424324, "epoch": 2525} {"train_loss": -12.209333419799805, "global_step": 424325, "epoch": 2525} {"train_loss": -12.222187042236328, "global_step": 424326, "epoch": 2525} {"train_loss": -12.322806358337402, "global_step": 424327, "epoch": 2525} {"train_loss": -12.113353729248047, "global_step": 424328, "epoch": 2525} {"train_loss": -12.473897933959961, "global_step": 424329, "epoch": 2525} {"train_loss": -12.365547180175781, "global_step": 424330, "epoch": 2525} {"train_loss": -11.887929916381836, "global_step": 424331, "epoch": 2525} {"train_loss": -12.29195499420166, "global_step": 424332, "epoch": 2525} {"train_loss": -12.520071029663086, "global_step": 424333, "epoch": 2525} {"train_loss": -12.108316421508789, "global_step": 424334, "epoch": 2525} {"train_loss": -12.267454147338867, "global_step": 424335, "epoch": 2525} {"train_loss": -12.236682891845703, "global_step": 424336, "epoch": 2525} {"train_loss": -12.362625122070312, "global_step": 424337, "epoch": 2525} {"train_loss": -12.392605781555176, "global_step": 424338, "epoch": 2525} {"train_loss": -12.222740173339844, "global_step": 424339, "epoch": 2525} {"train_loss": -12.41832160949707, "global_step": 424340, "epoch": 2525} {"train_loss": -12.38528060913086, "global_step": 424341, "epoch": 2525} {"train_loss": -12.39501667022705, "global_step": 424342, "epoch": 2525} {"train_loss": -12.451669692993164, "global_step": 424343, "epoch": 2525} {"train_loss": -12.269598960876465, "global_step": 424344, "epoch": 2525} {"train_loss": -12.439123153686523, "global_step": 424345, "epoch": 2525} {"train_loss": -12.446019172668457, "global_step": 424346, "epoch": 2525} {"train_loss": -12.355522155761719, "global_step": 424347, "epoch": 2525} {"train_loss": -12.450738906860352, "global_step": 424348, "epoch": 2525} {"train_loss": -12.589696884155273, "global_step": 424349, "epoch": 2525} {"train_loss": -12.438238143920898, "global_step": 424350, "epoch": 2525} {"train_loss": -12.516120910644531, "global_step": 424351, "epoch": 2525} {"train_loss": -12.544571876525879, "global_step": 424352, "epoch": 2525} {"train_loss": -12.543302536010742, "global_step": 424353, "epoch": 2525} {"train_loss": -12.433375358581543, "global_step": 424354, "epoch": 2525} {"train_loss": -12.534605026245117, "global_step": 424355, "epoch": 2525} {"train_loss": -12.679885864257812, "global_step": 424356, "epoch": 2525} {"train_loss": -12.55167007446289, "global_step": 424357, "epoch": 2525} {"train_loss": -12.486740112304688, "global_step": 424358, "epoch": 2525} {"train_loss": -12.760112762451172, "global_step": 424359, "epoch": 2525} {"train_loss": -12.503475189208984, "global_step": 424360, "epoch": 2525} {"train_loss": -12.311271667480469, "global_step": 424361, "epoch": 2525} {"train_loss": -12.667129516601562, "global_step": 424362, "epoch": 2525} {"train_loss": -12.62136173248291, "global_step": 424363, "epoch": 2525} {"train_loss": -12.353775024414062, "global_step": 424364, "epoch": 2525} {"train_loss": -12.41588020324707, "global_step": 424365, "epoch": 2525} {"train_loss": -12.357953071594238, "global_step": 424366, "epoch": 2525} {"train_loss": -11.812471687793732, "global_step": 424367, "epoch": 2525, "val_loss": 309527.46875, "train_action_mse_error": 0.2761406898498535} {"train_loss": -12.444605827331543, "global_step": 424368, "epoch": 2526} {"train_loss": -12.875833511352539, "global_step": 424369, "epoch": 2526} {"train_loss": -12.347890853881836, "global_step": 424370, "epoch": 2526} {"train_loss": -12.394309043884277, "global_step": 424371, "epoch": 2526} {"train_loss": -12.536529541015625, "global_step": 424372, "epoch": 2526} {"train_loss": -12.650151252746582, "global_step": 424373, "epoch": 2526} {"train_loss": -12.685779571533203, "global_step": 424374, "epoch": 2526} {"train_loss": -12.388729095458984, "global_step": 424375, "epoch": 2526} {"train_loss": -12.750307083129883, "global_step": 424376, "epoch": 2526} {"train_loss": -12.278362274169922, "global_step": 424377, "epoch": 2526} {"train_loss": -12.473831176757812, "global_step": 424378, "epoch": 2526} {"train_loss": -12.72446346282959, "global_step": 424379, "epoch": 2526} {"train_loss": -12.453747749328613, "global_step": 424380, "epoch": 2526} {"train_loss": -12.517032623291016, "global_step": 424381, "epoch": 2526} {"train_loss": -12.543094635009766, "global_step": 424382, "epoch": 2526} {"train_loss": -12.59086799621582, "global_step": 424383, "epoch": 2526} {"train_loss": -12.672734260559082, "global_step": 424384, "epoch": 2526} {"train_loss": -12.726001739501953, "global_step": 424385, "epoch": 2526} {"train_loss": -12.70755386352539, "global_step": 424386, "epoch": 2526} {"train_loss": -12.716049194335938, "global_step": 424387, "epoch": 2526} {"train_loss": -12.891475677490234, "global_step": 424388, "epoch": 2526} {"train_loss": -12.67190170288086, "global_step": 424389, "epoch": 2526} {"train_loss": -12.457326889038086, "global_step": 424390, "epoch": 2526} {"train_loss": -12.772971153259277, "global_step": 424391, "epoch": 2526} {"train_loss": -12.511092185974121, "global_step": 424392, "epoch": 2526} {"train_loss": -12.590399742126465, "global_step": 424393, "epoch": 2526} {"train_loss": -12.551319122314453, "global_step": 424394, "epoch": 2526} {"train_loss": -12.589925765991211, "global_step": 424395, "epoch": 2526} {"train_loss": -13.018241882324219, "global_step": 424396, "epoch": 2526} {"train_loss": -12.76250171661377, "global_step": 424397, "epoch": 2526} {"train_loss": -12.662528991699219, "global_step": 424398, "epoch": 2526} {"train_loss": -12.716554641723633, "global_step": 424399, "epoch": 2526} {"train_loss": -12.659114837646484, "global_step": 424400, "epoch": 2526} {"train_loss": -12.595627784729004, "global_step": 424401, "epoch": 2526} {"train_loss": -12.043862342834473, "global_step": 424402, "epoch": 2526} {"train_loss": -12.08859920501709, "global_step": 424403, "epoch": 2526} {"train_loss": -12.49490737915039, "global_step": 424404, "epoch": 2526} {"train_loss": -12.062566757202148, "global_step": 424405, "epoch": 2526} {"train_loss": -12.675537109375, "global_step": 424406, "epoch": 2526} {"train_loss": -12.11509895324707, "global_step": 424407, "epoch": 2526} {"train_loss": -12.559671401977539, "global_step": 424408, "epoch": 2526} {"train_loss": -11.96790885925293, "global_step": 424409, "epoch": 2526} {"train_loss": -12.72663688659668, "global_step": 424410, "epoch": 2526} {"train_loss": -12.07484245300293, "global_step": 424411, "epoch": 2526} {"train_loss": -12.338099479675293, "global_step": 424412, "epoch": 2526} {"train_loss": -12.52737808227539, "global_step": 424413, "epoch": 2526} {"train_loss": -12.432146072387695, "global_step": 424414, "epoch": 2526} {"train_loss": -12.458651542663574, "global_step": 424415, "epoch": 2526} {"train_loss": -12.184883117675781, "global_step": 424416, "epoch": 2526} {"train_loss": -11.752130508422852, "global_step": 424417, "epoch": 2526} {"train_loss": -11.637943267822266, "global_step": 424418, "epoch": 2526} {"train_loss": -12.446168899536133, "global_step": 424419, "epoch": 2526} {"train_loss": -12.416969299316406, "global_step": 424420, "epoch": 2526} {"train_loss": -11.23160171508789, "global_step": 424421, "epoch": 2526} {"train_loss": -12.261666297912598, "global_step": 424422, "epoch": 2526} {"train_loss": -11.834808349609375, "global_step": 424423, "epoch": 2526} {"train_loss": -11.72062873840332, "global_step": 424424, "epoch": 2526} {"train_loss": -11.008529663085938, "global_step": 424425, "epoch": 2526} {"train_loss": -12.02177619934082, "global_step": 424426, "epoch": 2526} {"train_loss": -11.666657447814941, "global_step": 424427, "epoch": 2526} {"train_loss": -11.521673202514648, "global_step": 424428, "epoch": 2526} {"train_loss": -11.186528205871582, "global_step": 424429, "epoch": 2526} {"train_loss": -12.146434783935547, "global_step": 424430, "epoch": 2526} {"train_loss": -11.065789222717285, "global_step": 424431, "epoch": 2526} {"train_loss": -10.392181396484375, "global_step": 424432, "epoch": 2526} {"train_loss": -12.213846206665039, "global_step": 424433, "epoch": 2526} {"train_loss": -11.062702178955078, "global_step": 424434, "epoch": 2526} {"train_loss": -11.616353988647461, "global_step": 424435, "epoch": 2526} {"train_loss": -11.435293197631836, "global_step": 424436, "epoch": 2526} {"train_loss": -12.044108390808105, "global_step": 424437, "epoch": 2526} {"train_loss": -10.94546890258789, "global_step": 424438, "epoch": 2526} {"train_loss": -12.405994415283203, "global_step": 424439, "epoch": 2526} {"train_loss": -10.837116241455078, "global_step": 424440, "epoch": 2526} {"train_loss": -11.724803924560547, "global_step": 424441, "epoch": 2526} {"train_loss": -11.002331733703613, "global_step": 424442, "epoch": 2526} {"train_loss": -11.16132926940918, "global_step": 424443, "epoch": 2526} {"train_loss": -10.852009773254395, "global_step": 424444, "epoch": 2526} {"train_loss": -10.06968879699707, "global_step": 424445, "epoch": 2526} {"train_loss": -10.182502746582031, "global_step": 424446, "epoch": 2526} {"train_loss": -10.708194732666016, "global_step": 424447, "epoch": 2526} {"train_loss": -11.791444778442383, "global_step": 424448, "epoch": 2526} {"train_loss": -10.794315338134766, "global_step": 424449, "epoch": 2526} {"train_loss": -10.992009162902832, "global_step": 424450, "epoch": 2526} {"train_loss": -11.770177841186523, "global_step": 424451, "epoch": 2526} {"train_loss": -11.436097145080566, "global_step": 424452, "epoch": 2526} {"train_loss": -11.748519897460938, "global_step": 424453, "epoch": 2526} {"train_loss": -11.843791961669922, "global_step": 424454, "epoch": 2526} {"train_loss": -11.26226806640625, "global_step": 424455, "epoch": 2526} {"train_loss": -11.832040786743164, "global_step": 424456, "epoch": 2526} {"train_loss": -11.139036178588867, "global_step": 424457, "epoch": 2526} {"train_loss": -11.940970420837402, "global_step": 424458, "epoch": 2526} {"train_loss": -11.390450477600098, "global_step": 424459, "epoch": 2526} {"train_loss": -11.57859992980957, "global_step": 424460, "epoch": 2526} {"train_loss": -12.083514213562012, "global_step": 424461, "epoch": 2526} {"train_loss": -11.042381286621094, "global_step": 424462, "epoch": 2526} {"train_loss": -11.975728988647461, "global_step": 424463, "epoch": 2526} {"train_loss": -11.826802253723145, "global_step": 424464, "epoch": 2526} {"train_loss": -11.983027458190918, "global_step": 424465, "epoch": 2526} {"train_loss": -12.07104206085205, "global_step": 424466, "epoch": 2526} {"train_loss": -11.791419982910156, "global_step": 424467, "epoch": 2526} {"train_loss": -12.530204772949219, "global_step": 424468, "epoch": 2526} {"train_loss": -12.073071479797363, "global_step": 424469, "epoch": 2526} {"train_loss": -12.230386734008789, "global_step": 424470, "epoch": 2526} {"train_loss": -12.177019119262695, "global_step": 424471, "epoch": 2526} {"train_loss": -12.17466926574707, "global_step": 424472, "epoch": 2526} {"train_loss": -12.102926254272461, "global_step": 424473, "epoch": 2526} {"train_loss": -11.987168312072754, "global_step": 424474, "epoch": 2526} {"train_loss": -12.166759490966797, "global_step": 424475, "epoch": 2526} {"train_loss": -12.169439315795898, "global_step": 424476, "epoch": 2526} {"train_loss": -12.253459930419922, "global_step": 424477, "epoch": 2526} {"train_loss": -12.430070877075195, "global_step": 424478, "epoch": 2526} {"train_loss": -12.442546844482422, "global_step": 424479, "epoch": 2526} {"train_loss": -12.091567993164062, "global_step": 424480, "epoch": 2526} {"train_loss": -12.51198673248291, "global_step": 424481, "epoch": 2526} {"train_loss": -12.046432495117188, "global_step": 424482, "epoch": 2526} {"train_loss": -12.497730255126953, "global_step": 424483, "epoch": 2526} {"train_loss": -12.51132583618164, "global_step": 424484, "epoch": 2526} {"train_loss": -12.183063507080078, "global_step": 424485, "epoch": 2526} {"train_loss": -12.470701217651367, "global_step": 424486, "epoch": 2526} {"train_loss": -12.178112983703613, "global_step": 424487, "epoch": 2526} {"train_loss": -12.63886833190918, "global_step": 424488, "epoch": 2526} {"train_loss": -12.589669227600098, "global_step": 424489, "epoch": 2526} {"train_loss": -12.264883995056152, "global_step": 424490, "epoch": 2526} {"train_loss": -12.572476387023926, "global_step": 424491, "epoch": 2526} {"train_loss": -12.500211715698242, "global_step": 424492, "epoch": 2526} {"train_loss": -12.420736312866211, "global_step": 424493, "epoch": 2526} {"train_loss": -12.651543617248535, "global_step": 424494, "epoch": 2526} {"train_loss": -12.8260498046875, "global_step": 424495, "epoch": 2526} {"train_loss": -12.379274368286133, "global_step": 424496, "epoch": 2526} {"train_loss": -12.436640739440918, "global_step": 424497, "epoch": 2526} {"train_loss": -12.333220481872559, "global_step": 424498, "epoch": 2526} {"train_loss": -12.349534034729004, "global_step": 424499, "epoch": 2526} {"train_loss": -11.841753005981445, "global_step": 424500, "epoch": 2526} {"train_loss": -12.305093765258789, "global_step": 424501, "epoch": 2526} {"train_loss": -12.091443061828613, "global_step": 424502, "epoch": 2526} {"train_loss": -11.86327838897705, "global_step": 424503, "epoch": 2526} {"train_loss": -12.183428764343262, "global_step": 424504, "epoch": 2526} {"train_loss": -11.445770263671875, "global_step": 424505, "epoch": 2526} {"train_loss": -12.267705917358398, "global_step": 424506, "epoch": 2526} {"train_loss": -11.943260192871094, "global_step": 424507, "epoch": 2526} {"train_loss": -11.287298202514648, "global_step": 424508, "epoch": 2526} {"train_loss": -12.471671104431152, "global_step": 424509, "epoch": 2526} {"train_loss": -11.918838500976562, "global_step": 424510, "epoch": 2526} {"train_loss": -11.94583511352539, "global_step": 424511, "epoch": 2526} {"train_loss": -12.376507759094238, "global_step": 424512, "epoch": 2526} {"train_loss": -12.073668479919434, "global_step": 424513, "epoch": 2526} {"train_loss": -11.931024551391602, "global_step": 424514, "epoch": 2526} {"train_loss": -11.535806655883789, "global_step": 424515, "epoch": 2526} {"train_loss": -11.521578788757324, "global_step": 424516, "epoch": 2526} {"train_loss": -11.599579811096191, "global_step": 424517, "epoch": 2526} {"train_loss": -10.676409721374512, "global_step": 424518, "epoch": 2526} {"train_loss": -11.266252517700195, "global_step": 424519, "epoch": 2526} {"train_loss": -10.768487930297852, "global_step": 424520, "epoch": 2526} {"train_loss": -10.004944801330566, "global_step": 424521, "epoch": 2526} {"train_loss": -8.648219108581543, "global_step": 424522, "epoch": 2526} {"train_loss": -9.634698867797852, "global_step": 424523, "epoch": 2526} {"train_loss": -9.167205810546875, "global_step": 424524, "epoch": 2526} {"train_loss": -9.168258666992188, "global_step": 424525, "epoch": 2526} {"train_loss": -9.759521484375, "global_step": 424526, "epoch": 2526} {"train_loss": -10.89599609375, "global_step": 424527, "epoch": 2526} {"train_loss": -8.445387840270996, "global_step": 424528, "epoch": 2526} {"train_loss": -10.997520446777344, "global_step": 424529, "epoch": 2526} {"train_loss": -9.688817024230957, "global_step": 424530, "epoch": 2526} {"train_loss": -11.123981475830078, "global_step": 424531, "epoch": 2526} {"train_loss": -10.095358848571777, "global_step": 424532, "epoch": 2526} {"train_loss": -10.448577880859375, "global_step": 424533, "epoch": 2526} {"train_loss": -10.401545524597168, "global_step": 424534, "epoch": 2526} {"train_loss": -11.853508529208955, "global_step": 424535, "epoch": 2526, "val_loss": 303225.65625} {"train_loss": -10.278541564941406, "global_step": 424536, "epoch": 2527} {"train_loss": -10.874238014221191, "global_step": 424537, "epoch": 2527} {"train_loss": -10.047764778137207, "global_step": 424538, "epoch": 2527} {"train_loss": -10.273641586303711, "global_step": 424539, "epoch": 2527} {"train_loss": -10.855669021606445, "global_step": 424540, "epoch": 2527} {"train_loss": -11.505170822143555, "global_step": 424541, "epoch": 2527} {"train_loss": -11.125762939453125, "global_step": 424542, "epoch": 2527} {"train_loss": -11.877043724060059, "global_step": 424543, "epoch": 2527} {"train_loss": -11.439867973327637, "global_step": 424544, "epoch": 2527} {"train_loss": -11.879609107971191, "global_step": 424545, "epoch": 2527} {"train_loss": -10.885710716247559, "global_step": 424546, "epoch": 2527} {"train_loss": -11.768587112426758, "global_step": 424547, "epoch": 2527} {"train_loss": -11.888101577758789, "global_step": 424548, "epoch": 2527} {"train_loss": -11.55950927734375, "global_step": 424549, "epoch": 2527} {"train_loss": -12.066566467285156, "global_step": 424550, "epoch": 2527} {"train_loss": -11.64565658569336, "global_step": 424551, "epoch": 2527} {"train_loss": -11.65733528137207, "global_step": 424552, "epoch": 2527} {"train_loss": -11.968109130859375, "global_step": 424553, "epoch": 2527} {"train_loss": -12.000651359558105, "global_step": 424554, "epoch": 2527} {"train_loss": -11.976991653442383, "global_step": 424555, "epoch": 2527} {"train_loss": -12.066499710083008, "global_step": 424556, "epoch": 2527} {"train_loss": -11.652450561523438, "global_step": 424557, "epoch": 2527} {"train_loss": -11.879384994506836, "global_step": 424558, "epoch": 2527} {"train_loss": -11.989986419677734, "global_step": 424559, "epoch": 2527} {"train_loss": -12.060127258300781, "global_step": 424560, "epoch": 2527} {"train_loss": -11.879207611083984, "global_step": 424561, "epoch": 2527} {"train_loss": -12.380941390991211, "global_step": 424562, "epoch": 2527} {"train_loss": -11.74981689453125, "global_step": 424563, "epoch": 2527} {"train_loss": -12.310464859008789, "global_step": 424564, "epoch": 2527} {"train_loss": -12.1184720993042, "global_step": 424565, "epoch": 2527} {"train_loss": -12.301387786865234, "global_step": 424566, "epoch": 2527} {"train_loss": -12.417540550231934, "global_step": 424567, "epoch": 2527} {"train_loss": -12.2772216796875, "global_step": 424568, "epoch": 2527} {"train_loss": -12.3137788772583, "global_step": 424569, "epoch": 2527} {"train_loss": -12.140721321105957, "global_step": 424570, "epoch": 2527} {"train_loss": -12.119199752807617, "global_step": 424571, "epoch": 2527} {"train_loss": -12.18130874633789, "global_step": 424572, "epoch": 2527} {"train_loss": -12.199308395385742, "global_step": 424573, "epoch": 2527} {"train_loss": -12.424295425415039, "global_step": 424574, "epoch": 2527} {"train_loss": -12.204118728637695, "global_step": 424575, "epoch": 2527} {"train_loss": -12.628153800964355, "global_step": 424576, "epoch": 2527} {"train_loss": -12.379013061523438, "global_step": 424577, "epoch": 2527} {"train_loss": -12.40848159790039, "global_step": 424578, "epoch": 2527} {"train_loss": -12.482794761657715, "global_step": 424579, "epoch": 2527} {"train_loss": -12.27968978881836, "global_step": 424580, "epoch": 2527} {"train_loss": -12.45698356628418, "global_step": 424581, "epoch": 2527} {"train_loss": -12.432079315185547, "global_step": 424582, "epoch": 2527} {"train_loss": -12.42680549621582, "global_step": 424583, "epoch": 2527} {"train_loss": -12.21229362487793, "global_step": 424584, "epoch": 2527} {"train_loss": -12.496925354003906, "global_step": 424585, "epoch": 2527} {"train_loss": -12.498422622680664, "global_step": 424586, "epoch": 2527} {"train_loss": -12.532075881958008, "global_step": 424587, "epoch": 2527} {"train_loss": -12.53706169128418, "global_step": 424588, "epoch": 2527} {"train_loss": -12.642346382141113, "global_step": 424589, "epoch": 2527} {"train_loss": -12.706032752990723, "global_step": 424590, "epoch": 2527} {"train_loss": -12.586320877075195, "global_step": 424591, "epoch": 2527} {"train_loss": -12.634998321533203, "global_step": 424592, "epoch": 2527} {"train_loss": -12.770136833190918, "global_step": 424593, "epoch": 2527} {"train_loss": -12.494537353515625, "global_step": 424594, "epoch": 2527} {"train_loss": -12.70205307006836, "global_step": 424595, "epoch": 2527} {"train_loss": -12.62222671508789, "global_step": 424596, "epoch": 2527} {"train_loss": -12.535974502563477, "global_step": 424597, "epoch": 2527} {"train_loss": -12.469871520996094, "global_step": 424598, "epoch": 2527} {"train_loss": -12.722892761230469, "global_step": 424599, "epoch": 2527} {"train_loss": -12.803430557250977, "global_step": 424600, "epoch": 2527} {"train_loss": -12.404817581176758, "global_step": 424601, "epoch": 2527} {"train_loss": -12.67657470703125, "global_step": 424602, "epoch": 2527} {"train_loss": -12.588467597961426, "global_step": 424603, "epoch": 2527} {"train_loss": -12.735540390014648, "global_step": 424604, "epoch": 2527} {"train_loss": -12.611320495605469, "global_step": 424605, "epoch": 2527} {"train_loss": -12.607589721679688, "global_step": 424606, "epoch": 2527} {"train_loss": -12.721878051757812, "global_step": 424607, "epoch": 2527} {"train_loss": -12.832704544067383, "global_step": 424608, "epoch": 2527} {"train_loss": -12.719061851501465, "global_step": 424609, "epoch": 2527} {"train_loss": -12.683137893676758, "global_step": 424610, "epoch": 2527} {"train_loss": -12.747160911560059, "global_step": 424611, "epoch": 2527} {"train_loss": -12.695198059082031, "global_step": 424612, "epoch": 2527} {"train_loss": -12.831087112426758, "global_step": 424613, "epoch": 2527} {"train_loss": -12.64614486694336, "global_step": 424614, "epoch": 2527} {"train_loss": -12.655941009521484, "global_step": 424615, "epoch": 2527} {"train_loss": -12.645986557006836, "global_step": 424616, "epoch": 2527} {"train_loss": -12.800483703613281, "global_step": 424617, "epoch": 2527} {"train_loss": -12.912242889404297, "global_step": 424618, "epoch": 2527} {"train_loss": -12.731514930725098, "global_step": 424619, "epoch": 2527} {"train_loss": -12.668539047241211, "global_step": 424620, "epoch": 2527} {"train_loss": -12.368562698364258, "global_step": 424621, "epoch": 2527} {"train_loss": -12.842096328735352, "global_step": 424622, "epoch": 2527} {"train_loss": -12.383130073547363, "global_step": 424623, "epoch": 2527} {"train_loss": -12.534658432006836, "global_step": 424624, "epoch": 2527} {"train_loss": -12.846707344055176, "global_step": 424625, "epoch": 2527} {"train_loss": -12.822047233581543, "global_step": 424626, "epoch": 2527} {"train_loss": -12.858595848083496, "global_step": 424627, "epoch": 2527} {"train_loss": -12.570398330688477, "global_step": 424628, "epoch": 2527} {"train_loss": -12.730180740356445, "global_step": 424629, "epoch": 2527} {"train_loss": -12.46943473815918, "global_step": 424630, "epoch": 2527} {"train_loss": -12.561173439025879, "global_step": 424631, "epoch": 2527} {"train_loss": -12.773433685302734, "global_step": 424632, "epoch": 2527} {"train_loss": -12.887066841125488, "global_step": 424633, "epoch": 2527} {"train_loss": -12.645135879516602, "global_step": 424634, "epoch": 2527} {"train_loss": -12.659364700317383, "global_step": 424635, "epoch": 2527} {"train_loss": -12.37581729888916, "global_step": 424636, "epoch": 2527} {"train_loss": -11.339303970336914, "global_step": 424637, "epoch": 2527} {"train_loss": -12.372212409973145, "global_step": 424638, "epoch": 2527} {"train_loss": -12.118193626403809, "global_step": 424639, "epoch": 2527} {"train_loss": -12.376598358154297, "global_step": 424640, "epoch": 2527} {"train_loss": -11.6712007522583, "global_step": 424641, "epoch": 2527} {"train_loss": -12.102360725402832, "global_step": 424642, "epoch": 2527} {"train_loss": -12.268879890441895, "global_step": 424643, "epoch": 2527} {"train_loss": -12.156034469604492, "global_step": 424644, "epoch": 2527} {"train_loss": -12.798763275146484, "global_step": 424645, "epoch": 2527} {"train_loss": -12.00107192993164, "global_step": 424646, "epoch": 2527} {"train_loss": -12.320160865783691, "global_step": 424647, "epoch": 2527} {"train_loss": -11.219894409179688, "global_step": 424648, "epoch": 2527} {"train_loss": -11.907426834106445, "global_step": 424649, "epoch": 2527} {"train_loss": -11.816659927368164, "global_step": 424650, "epoch": 2527} {"train_loss": -12.668560028076172, "global_step": 424651, "epoch": 2527} {"train_loss": -11.921661376953125, "global_step": 424652, "epoch": 2527} {"train_loss": -11.749809265136719, "global_step": 424653, "epoch": 2527} {"train_loss": -11.530048370361328, "global_step": 424654, "epoch": 2527} {"train_loss": -11.238482475280762, "global_step": 424655, "epoch": 2527} {"train_loss": -10.195732116699219, "global_step": 424656, "epoch": 2527} {"train_loss": -12.106449127197266, "global_step": 424657, "epoch": 2527} {"train_loss": -12.183910369873047, "global_step": 424658, "epoch": 2527} {"train_loss": -10.663183212280273, "global_step": 424659, "epoch": 2527} {"train_loss": -10.988984107971191, "global_step": 424660, "epoch": 2527} {"train_loss": -11.633824348449707, "global_step": 424661, "epoch": 2527} {"train_loss": -10.911029815673828, "global_step": 424662, "epoch": 2527} {"train_loss": -11.864770889282227, "global_step": 424663, "epoch": 2527} {"train_loss": -10.727926254272461, "global_step": 424664, "epoch": 2527} {"train_loss": -11.768390655517578, "global_step": 424665, "epoch": 2527} {"train_loss": -11.864002227783203, "global_step": 424666, "epoch": 2527} {"train_loss": -11.769670486450195, "global_step": 424667, "epoch": 2527} {"train_loss": -11.313806533813477, "global_step": 424668, "epoch": 2527} {"train_loss": -11.735498428344727, "global_step": 424669, "epoch": 2527} {"train_loss": -12.043252944946289, "global_step": 424670, "epoch": 2527} {"train_loss": -11.868230819702148, "global_step": 424671, "epoch": 2527} {"train_loss": -12.177580833435059, "global_step": 424672, "epoch": 2527} {"train_loss": -11.897836685180664, "global_step": 424673, "epoch": 2527} {"train_loss": -12.297639846801758, "global_step": 424674, "epoch": 2527} {"train_loss": -11.627737045288086, "global_step": 424675, "epoch": 2527} {"train_loss": -11.775701522827148, "global_step": 424676, "epoch": 2527} {"train_loss": -12.144170761108398, "global_step": 424677, "epoch": 2527} {"train_loss": -11.471315383911133, "global_step": 424678, "epoch": 2527} {"train_loss": -12.40323543548584, "global_step": 424679, "epoch": 2527} {"train_loss": -11.462164878845215, "global_step": 424680, "epoch": 2527} {"train_loss": -11.117532730102539, "global_step": 424681, "epoch": 2527} {"train_loss": -12.093877792358398, "global_step": 424682, "epoch": 2527} {"train_loss": -11.272727012634277, "global_step": 424683, "epoch": 2527} {"train_loss": -12.044397354125977, "global_step": 424684, "epoch": 2527} {"train_loss": -11.959991455078125, "global_step": 424685, "epoch": 2527} {"train_loss": -11.821033477783203, "global_step": 424686, "epoch": 2527} {"train_loss": -12.381004333496094, "global_step": 424687, "epoch": 2527} {"train_loss": -10.99570369720459, "global_step": 424688, "epoch": 2527} {"train_loss": -11.342949867248535, "global_step": 424689, "epoch": 2527} {"train_loss": -11.429666519165039, "global_step": 424690, "epoch": 2527} {"train_loss": -11.06965446472168, "global_step": 424691, "epoch": 2527} {"train_loss": -10.90027904510498, "global_step": 424692, "epoch": 2527} {"train_loss": -10.614635467529297, "global_step": 424693, "epoch": 2527} {"train_loss": -11.895654678344727, "global_step": 424694, "epoch": 2527} {"train_loss": -11.154647827148438, "global_step": 424695, "epoch": 2527} {"train_loss": -12.39259147644043, "global_step": 424696, "epoch": 2527} {"train_loss": -11.740232467651367, "global_step": 424697, "epoch": 2527} {"train_loss": -12.312643051147461, "global_step": 424698, "epoch": 2527} {"train_loss": -11.740364074707031, "global_step": 424699, "epoch": 2527} {"train_loss": -12.081424713134766, "global_step": 424700, "epoch": 2527} {"train_loss": -11.851696014404297, "global_step": 424701, "epoch": 2527} {"train_loss": -11.87515640258789, "global_step": 424702, "epoch": 2527} {"train_loss": -12.062338170551119, "global_step": 424703, "epoch": 2527, "val_loss": 307842.1875} {"train_loss": -12.16256332397461, "global_step": 424704, "epoch": 2528} {"train_loss": -11.979934692382812, "global_step": 424705, "epoch": 2528} {"train_loss": -12.07739543914795, "global_step": 424706, "epoch": 2528} {"train_loss": -12.068032264709473, "global_step": 424707, "epoch": 2528} {"train_loss": -11.767146110534668, "global_step": 424708, "epoch": 2528} {"train_loss": -12.179206848144531, "global_step": 424709, "epoch": 2528} {"train_loss": -12.040950775146484, "global_step": 424710, "epoch": 2528} {"train_loss": -12.246500015258789, "global_step": 424711, "epoch": 2528} {"train_loss": -12.378198623657227, "global_step": 424712, "epoch": 2528} {"train_loss": -12.41378402709961, "global_step": 424713, "epoch": 2528} {"train_loss": -12.307708740234375, "global_step": 424714, "epoch": 2528} {"train_loss": -12.169086456298828, "global_step": 424715, "epoch": 2528} {"train_loss": -11.95801067352295, "global_step": 424716, "epoch": 2528} {"train_loss": -12.28550910949707, "global_step": 424717, "epoch": 2528} {"train_loss": -12.269865989685059, "global_step": 424718, "epoch": 2528} {"train_loss": -12.346841812133789, "global_step": 424719, "epoch": 2528} {"train_loss": -12.610422134399414, "global_step": 424720, "epoch": 2528} {"train_loss": -12.412341117858887, "global_step": 424721, "epoch": 2528} {"train_loss": -12.70725154876709, "global_step": 424722, "epoch": 2528} {"train_loss": -12.450654983520508, "global_step": 424723, "epoch": 2528} {"train_loss": -12.594396591186523, "global_step": 424724, "epoch": 2528} {"train_loss": -12.496391296386719, "global_step": 424725, "epoch": 2528} {"train_loss": -12.572236061096191, "global_step": 424726, "epoch": 2528} {"train_loss": -12.572456359863281, "global_step": 424727, "epoch": 2528} {"train_loss": -12.339773178100586, "global_step": 424728, "epoch": 2528} {"train_loss": -12.561488151550293, "global_step": 424729, "epoch": 2528} {"train_loss": -12.641712188720703, "global_step": 424730, "epoch": 2528} {"train_loss": -12.389897346496582, "global_step": 424731, "epoch": 2528} {"train_loss": -12.663206100463867, "global_step": 424732, "epoch": 2528} {"train_loss": -12.670245170593262, "global_step": 424733, "epoch": 2528} {"train_loss": -12.741127014160156, "global_step": 424734, "epoch": 2528} {"train_loss": -12.76998519897461, "global_step": 424735, "epoch": 2528} {"train_loss": -12.648555755615234, "global_step": 424736, "epoch": 2528} {"train_loss": -12.761299133300781, "global_step": 424737, "epoch": 2528} {"train_loss": -12.689335823059082, "global_step": 424738, "epoch": 2528} {"train_loss": -12.722837448120117, "global_step": 424739, "epoch": 2528} {"train_loss": -12.71754264831543, "global_step": 424740, "epoch": 2528} {"train_loss": -12.648025512695312, "global_step": 424741, "epoch": 2528} {"train_loss": -12.388750076293945, "global_step": 424742, "epoch": 2528} {"train_loss": -12.338525772094727, "global_step": 424743, "epoch": 2528} {"train_loss": -12.68270492553711, "global_step": 424744, "epoch": 2528} {"train_loss": -12.544168472290039, "global_step": 424745, "epoch": 2528} {"train_loss": -12.407795906066895, "global_step": 424746, "epoch": 2528} {"train_loss": -12.622882843017578, "global_step": 424747, "epoch": 2528} {"train_loss": -12.721054077148438, "global_step": 424748, "epoch": 2528} {"train_loss": -12.589195251464844, "global_step": 424749, "epoch": 2528} {"train_loss": -12.76260757446289, "global_step": 424750, "epoch": 2528} {"train_loss": -12.27452278137207, "global_step": 424751, "epoch": 2528} {"train_loss": -12.624303817749023, "global_step": 424752, "epoch": 2528} {"train_loss": -12.632583618164062, "global_step": 424753, "epoch": 2528} {"train_loss": -12.541244506835938, "global_step": 424754, "epoch": 2528} {"train_loss": -12.551902770996094, "global_step": 424755, "epoch": 2528} {"train_loss": -12.730093002319336, "global_step": 424756, "epoch": 2528} {"train_loss": -12.756038665771484, "global_step": 424757, "epoch": 2528} {"train_loss": -12.625234603881836, "global_step": 424758, "epoch": 2528} {"train_loss": -12.585122108459473, "global_step": 424759, "epoch": 2528} {"train_loss": -12.614795684814453, "global_step": 424760, "epoch": 2528} {"train_loss": -12.145400047302246, "global_step": 424761, "epoch": 2528} {"train_loss": -12.14480209350586, "global_step": 424762, "epoch": 2528} {"train_loss": -12.798105239868164, "global_step": 424763, "epoch": 2528} {"train_loss": -12.356159210205078, "global_step": 424764, "epoch": 2528} {"train_loss": -12.071462631225586, "global_step": 424765, "epoch": 2528} {"train_loss": -12.23853874206543, "global_step": 424766, "epoch": 2528} {"train_loss": -12.913961410522461, "global_step": 424767, "epoch": 2528} {"train_loss": -12.460278511047363, "global_step": 424768, "epoch": 2528} {"train_loss": -12.592426300048828, "global_step": 424769, "epoch": 2528} {"train_loss": -12.71574592590332, "global_step": 424770, "epoch": 2528} {"train_loss": -12.622262001037598, "global_step": 424771, "epoch": 2528} {"train_loss": -12.653118133544922, "global_step": 424772, "epoch": 2528} {"train_loss": -12.596622467041016, "global_step": 424773, "epoch": 2528} {"train_loss": -12.687447547912598, "global_step": 424774, "epoch": 2528} {"train_loss": -12.883792877197266, "global_step": 424775, "epoch": 2528} {"train_loss": -12.68848991394043, "global_step": 424776, "epoch": 2528} {"train_loss": -13.087379455566406, "global_step": 424777, "epoch": 2528} {"train_loss": -12.554267883300781, "global_step": 424778, "epoch": 2528} {"train_loss": -12.904077529907227, "global_step": 424779, "epoch": 2528} {"train_loss": -12.677804946899414, "global_step": 424780, "epoch": 2528} {"train_loss": -12.713165283203125, "global_step": 424781, "epoch": 2528} {"train_loss": -12.602407455444336, "global_step": 424782, "epoch": 2528} {"train_loss": -12.61296272277832, "global_step": 424783, "epoch": 2528} {"train_loss": -12.676609992980957, "global_step": 424784, "epoch": 2528} {"train_loss": -12.729212760925293, "global_step": 424785, "epoch": 2528} {"train_loss": -12.736770629882812, "global_step": 424786, "epoch": 2528} {"train_loss": -12.567420959472656, "global_step": 424787, "epoch": 2528} {"train_loss": -12.72538948059082, "global_step": 424788, "epoch": 2528} {"train_loss": -12.648944854736328, "global_step": 424789, "epoch": 2528} {"train_loss": -12.25141429901123, "global_step": 424790, "epoch": 2528} {"train_loss": -12.306244850158691, "global_step": 424791, "epoch": 2528} {"train_loss": -12.708942413330078, "global_step": 424792, "epoch": 2528} {"train_loss": -12.445470809936523, "global_step": 424793, "epoch": 2528} {"train_loss": -12.950444221496582, "global_step": 424794, "epoch": 2528} {"train_loss": -13.023113250732422, "global_step": 424795, "epoch": 2528} {"train_loss": -12.901895523071289, "global_step": 424796, "epoch": 2528} {"train_loss": -12.656539916992188, "global_step": 424797, "epoch": 2528} {"train_loss": -12.967090606689453, "global_step": 424798, "epoch": 2528} {"train_loss": -12.874161720275879, "global_step": 424799, "epoch": 2528} {"train_loss": -12.745137214660645, "global_step": 424800, "epoch": 2528} {"train_loss": -12.860551834106445, "global_step": 424801, "epoch": 2528} {"train_loss": -12.331547737121582, "global_step": 424802, "epoch": 2528} {"train_loss": -12.005510330200195, "global_step": 424803, "epoch": 2528} {"train_loss": -12.072425842285156, "global_step": 424804, "epoch": 2528} {"train_loss": -12.130311012268066, "global_step": 424805, "epoch": 2528} {"train_loss": -11.848286628723145, "global_step": 424806, "epoch": 2528} {"train_loss": -10.751161575317383, "global_step": 424807, "epoch": 2528} {"train_loss": -11.54961109161377, "global_step": 424808, "epoch": 2528} {"train_loss": -11.223834991455078, "global_step": 424809, "epoch": 2528} {"train_loss": -10.308475494384766, "global_step": 424810, "epoch": 2528} {"train_loss": -12.118440628051758, "global_step": 424811, "epoch": 2528} {"train_loss": -11.846670150756836, "global_step": 424812, "epoch": 2528} {"train_loss": -10.72188949584961, "global_step": 424813, "epoch": 2528} {"train_loss": -11.95192813873291, "global_step": 424814, "epoch": 2528} {"train_loss": -11.231367111206055, "global_step": 424815, "epoch": 2528} {"train_loss": -11.64185905456543, "global_step": 424816, "epoch": 2528} {"train_loss": -11.654135704040527, "global_step": 424817, "epoch": 2528} {"train_loss": -12.10986328125, "global_step": 424818, "epoch": 2528} {"train_loss": -11.254154205322266, "global_step": 424819, "epoch": 2528} {"train_loss": -12.420644760131836, "global_step": 424820, "epoch": 2528} {"train_loss": -12.105632781982422, "global_step": 424821, "epoch": 2528} {"train_loss": -11.99805736541748, "global_step": 424822, "epoch": 2528} {"train_loss": -11.97783088684082, "global_step": 424823, "epoch": 2528} {"train_loss": -12.66552734375, "global_step": 424824, "epoch": 2528} {"train_loss": -12.509916305541992, "global_step": 424825, "epoch": 2528} {"train_loss": -12.811378479003906, "global_step": 424826, "epoch": 2528} {"train_loss": -12.53504753112793, "global_step": 424827, "epoch": 2528} {"train_loss": -12.56641960144043, "global_step": 424828, "epoch": 2528} {"train_loss": -12.726821899414062, "global_step": 424829, "epoch": 2528} {"train_loss": -12.34635066986084, "global_step": 424830, "epoch": 2528} {"train_loss": -12.474557876586914, "global_step": 424831, "epoch": 2528} {"train_loss": -12.647238731384277, "global_step": 424832, "epoch": 2528} {"train_loss": -12.701772689819336, "global_step": 424833, "epoch": 2528} {"train_loss": -12.588523864746094, "global_step": 424834, "epoch": 2528} {"train_loss": -12.550703048706055, "global_step": 424835, "epoch": 2528} {"train_loss": -12.733510971069336, "global_step": 424836, "epoch": 2528} {"train_loss": -12.57398509979248, "global_step": 424837, "epoch": 2528} {"train_loss": -12.584131240844727, "global_step": 424838, "epoch": 2528} {"train_loss": -12.569664001464844, "global_step": 424839, "epoch": 2528} {"train_loss": -12.547595977783203, "global_step": 424840, "epoch": 2528} {"train_loss": -12.644720077514648, "global_step": 424841, "epoch": 2528} {"train_loss": -12.434539794921875, "global_step": 424842, "epoch": 2528} {"train_loss": -12.611173629760742, "global_step": 424843, "epoch": 2528} {"train_loss": -12.39431095123291, "global_step": 424844, "epoch": 2528} {"train_loss": -12.51279067993164, "global_step": 424845, "epoch": 2528} {"train_loss": -12.777885437011719, "global_step": 424846, "epoch": 2528} {"train_loss": -12.720332145690918, "global_step": 424847, "epoch": 2528} {"train_loss": -12.703371047973633, "global_step": 424848, "epoch": 2528} {"train_loss": -12.584807395935059, "global_step": 424849, "epoch": 2528} {"train_loss": -12.47134017944336, "global_step": 424850, "epoch": 2528} {"train_loss": -12.394021987915039, "global_step": 424851, "epoch": 2528} {"train_loss": -12.457395553588867, "global_step": 424852, "epoch": 2528} {"train_loss": -12.284185409545898, "global_step": 424853, "epoch": 2528} {"train_loss": -12.051204681396484, "global_step": 424854, "epoch": 2528} {"train_loss": -11.808837890625, "global_step": 424855, "epoch": 2528} {"train_loss": -11.5857515335083, "global_step": 424856, "epoch": 2528} {"train_loss": -12.301166534423828, "global_step": 424857, "epoch": 2528} {"train_loss": -12.394481658935547, "global_step": 424858, "epoch": 2528} {"train_loss": -12.523561477661133, "global_step": 424859, "epoch": 2528} {"train_loss": -12.383726119995117, "global_step": 424860, "epoch": 2528} {"train_loss": -12.393911361694336, "global_step": 424861, "epoch": 2528} {"train_loss": -12.136405944824219, "global_step": 424862, "epoch": 2528} {"train_loss": -12.421764373779297, "global_step": 424863, "epoch": 2528} {"train_loss": -12.07748794555664, "global_step": 424864, "epoch": 2528} {"train_loss": -12.465930938720703, "global_step": 424865, "epoch": 2528} {"train_loss": -11.734112739562988, "global_step": 424866, "epoch": 2528} {"train_loss": -12.33416748046875, "global_step": 424867, "epoch": 2528} {"train_loss": -12.147319793701172, "global_step": 424868, "epoch": 2528} {"train_loss": -12.567874908447266, "global_step": 424869, "epoch": 2528} {"train_loss": -12.016377449035645, "global_step": 424870, "epoch": 2528} {"train_loss": -12.39963564418611, "global_step": 424871, "epoch": 2528, "val_loss": 309085.53125} {"train_loss": -11.499342918395996, "global_step": 424872, "epoch": 2529} {"train_loss": -11.999444007873535, "global_step": 424873, "epoch": 2529} {"train_loss": -10.491464614868164, "global_step": 424874, "epoch": 2529} {"train_loss": -11.708755493164062, "global_step": 424875, "epoch": 2529} {"train_loss": -9.208158493041992, "global_step": 424876, "epoch": 2529} {"train_loss": -11.184745788574219, "global_step": 424877, "epoch": 2529} {"train_loss": -10.654558181762695, "global_step": 424878, "epoch": 2529} {"train_loss": -10.654202461242676, "global_step": 424879, "epoch": 2529} {"train_loss": -11.843481063842773, "global_step": 424880, "epoch": 2529} {"train_loss": -11.02988052368164, "global_step": 424881, "epoch": 2529} {"train_loss": -10.961516380310059, "global_step": 424882, "epoch": 2529} {"train_loss": -10.912070274353027, "global_step": 424883, "epoch": 2529} {"train_loss": -10.408632278442383, "global_step": 424884, "epoch": 2529} {"train_loss": -10.447711944580078, "global_step": 424885, "epoch": 2529} {"train_loss": -11.20942497253418, "global_step": 424886, "epoch": 2529} {"train_loss": -10.150635719299316, "global_step": 424887, "epoch": 2529} {"train_loss": -11.045917510986328, "global_step": 424888, "epoch": 2529} {"train_loss": -11.040611267089844, "global_step": 424889, "epoch": 2529} {"train_loss": -9.817581176757812, "global_step": 424890, "epoch": 2529} {"train_loss": -12.235883712768555, "global_step": 424891, "epoch": 2529} {"train_loss": -10.228250503540039, "global_step": 424892, "epoch": 2529} {"train_loss": -11.22861099243164, "global_step": 424893, "epoch": 2529} {"train_loss": -11.476765632629395, "global_step": 424894, "epoch": 2529} {"train_loss": -10.880504608154297, "global_step": 424895, "epoch": 2529} {"train_loss": -11.111968994140625, "global_step": 424896, "epoch": 2529} {"train_loss": -11.313079833984375, "global_step": 424897, "epoch": 2529} {"train_loss": -9.930926322937012, "global_step": 424898, "epoch": 2529} {"train_loss": -11.394086837768555, "global_step": 424899, "epoch": 2529} {"train_loss": -9.795389175415039, "global_step": 424900, "epoch": 2529} {"train_loss": -11.091440200805664, "global_step": 424901, "epoch": 2529} {"train_loss": -8.708361625671387, "global_step": 424902, "epoch": 2529} {"train_loss": -9.764497756958008, "global_step": 424903, "epoch": 2529} {"train_loss": -11.09541130065918, "global_step": 424904, "epoch": 2529} {"train_loss": -10.348529815673828, "global_step": 424905, "epoch": 2529} {"train_loss": -11.20406436920166, "global_step": 424906, "epoch": 2529} {"train_loss": -11.127519607543945, "global_step": 424907, "epoch": 2529} {"train_loss": -11.662452697753906, "global_step": 424908, "epoch": 2529} {"train_loss": -10.664247512817383, "global_step": 424909, "epoch": 2529} {"train_loss": -11.643722534179688, "global_step": 424910, "epoch": 2529} {"train_loss": -11.417305946350098, "global_step": 424911, "epoch": 2529} {"train_loss": -11.862617492675781, "global_step": 424912, "epoch": 2529} {"train_loss": -11.57127571105957, "global_step": 424913, "epoch": 2529} {"train_loss": -11.517234802246094, "global_step": 424914, "epoch": 2529} {"train_loss": -11.040151596069336, "global_step": 424915, "epoch": 2529} {"train_loss": -11.328739166259766, "global_step": 424916, "epoch": 2529} {"train_loss": -11.91982650756836, "global_step": 424917, "epoch": 2529} {"train_loss": -11.974164962768555, "global_step": 424918, "epoch": 2529} {"train_loss": -11.880197525024414, "global_step": 424919, "epoch": 2529} {"train_loss": -11.775239944458008, "global_step": 424920, "epoch": 2529} {"train_loss": -11.472291946411133, "global_step": 424921, "epoch": 2529} {"train_loss": -11.837244987487793, "global_step": 424922, "epoch": 2529} {"train_loss": -12.140302658081055, "global_step": 424923, "epoch": 2529} {"train_loss": -11.919445037841797, "global_step": 424924, "epoch": 2529} {"train_loss": -11.848453521728516, "global_step": 424925, "epoch": 2529} {"train_loss": -12.3182954788208, "global_step": 424926, "epoch": 2529} {"train_loss": -11.9222412109375, "global_step": 424927, "epoch": 2529} {"train_loss": -12.192975997924805, "global_step": 424928, "epoch": 2529} {"train_loss": -12.000733375549316, "global_step": 424929, "epoch": 2529} {"train_loss": -12.299615859985352, "global_step": 424930, "epoch": 2529} {"train_loss": -12.324258804321289, "global_step": 424931, "epoch": 2529} {"train_loss": -12.148569107055664, "global_step": 424932, "epoch": 2529} {"train_loss": -12.50288200378418, "global_step": 424933, "epoch": 2529} {"train_loss": -11.873038291931152, "global_step": 424934, "epoch": 2529} {"train_loss": -12.172643661499023, "global_step": 424935, "epoch": 2529} {"train_loss": -12.121920585632324, "global_step": 424936, "epoch": 2529} {"train_loss": -12.28088092803955, "global_step": 424937, "epoch": 2529} {"train_loss": -12.402719497680664, "global_step": 424938, "epoch": 2529} {"train_loss": -12.199801445007324, "global_step": 424939, "epoch": 2529} {"train_loss": -12.534820556640625, "global_step": 424940, "epoch": 2529} {"train_loss": -12.268950462341309, "global_step": 424941, "epoch": 2529} {"train_loss": -12.476507186889648, "global_step": 424942, "epoch": 2529} {"train_loss": -12.298967361450195, "global_step": 424943, "epoch": 2529} {"train_loss": -12.404214859008789, "global_step": 424944, "epoch": 2529} {"train_loss": -12.451416969299316, "global_step": 424945, "epoch": 2529} {"train_loss": -12.418992042541504, "global_step": 424946, "epoch": 2529} {"train_loss": -12.566041946411133, "global_step": 424947, "epoch": 2529} {"train_loss": -12.32619857788086, "global_step": 424948, "epoch": 2529} {"train_loss": -12.591289520263672, "global_step": 424949, "epoch": 2529} {"train_loss": -12.500865936279297, "global_step": 424950, "epoch": 2529} {"train_loss": -12.437346458435059, "global_step": 424951, "epoch": 2529} {"train_loss": -12.403779983520508, "global_step": 424952, "epoch": 2529} {"train_loss": -12.564023971557617, "global_step": 424953, "epoch": 2529} {"train_loss": -12.632950782775879, "global_step": 424954, "epoch": 2529} {"train_loss": -12.733892440795898, "global_step": 424955, "epoch": 2529} {"train_loss": -12.745321273803711, "global_step": 424956, "epoch": 2529} {"train_loss": -12.601035118103027, "global_step": 424957, "epoch": 2529} {"train_loss": -12.690494537353516, "global_step": 424958, "epoch": 2529} {"train_loss": -12.57358169555664, "global_step": 424959, "epoch": 2529} {"train_loss": -12.648033142089844, "global_step": 424960, "epoch": 2529} {"train_loss": -12.66839599609375, "global_step": 424961, "epoch": 2529} {"train_loss": -12.704619407653809, "global_step": 424962, "epoch": 2529} {"train_loss": -12.849265098571777, "global_step": 424963, "epoch": 2529} {"train_loss": -12.73779582977295, "global_step": 424964, "epoch": 2529} {"train_loss": -12.638010025024414, "global_step": 424965, "epoch": 2529} {"train_loss": -12.649431228637695, "global_step": 424966, "epoch": 2529} {"train_loss": -12.748956680297852, "global_step": 424967, "epoch": 2529} {"train_loss": -12.4527587890625, "global_step": 424968, "epoch": 2529} {"train_loss": -12.656460762023926, "global_step": 424969, "epoch": 2529} {"train_loss": -12.789758682250977, "global_step": 424970, "epoch": 2529} {"train_loss": -12.683622360229492, "global_step": 424971, "epoch": 2529} {"train_loss": -12.671606063842773, "global_step": 424972, "epoch": 2529} {"train_loss": -12.575582504272461, "global_step": 424973, "epoch": 2529} {"train_loss": -12.532740592956543, "global_step": 424974, "epoch": 2529} {"train_loss": -12.65843391418457, "global_step": 424975, "epoch": 2529} {"train_loss": -12.661455154418945, "global_step": 424976, "epoch": 2529} {"train_loss": -12.692390441894531, "global_step": 424977, "epoch": 2529} {"train_loss": -12.781349182128906, "global_step": 424978, "epoch": 2529} {"train_loss": -12.680617332458496, "global_step": 424979, "epoch": 2529} {"train_loss": -12.687331199645996, "global_step": 424980, "epoch": 2529} {"train_loss": -12.619464874267578, "global_step": 424981, "epoch": 2529} {"train_loss": -12.769353866577148, "global_step": 424982, "epoch": 2529} {"train_loss": -12.630245208740234, "global_step": 424983, "epoch": 2529} {"train_loss": -12.376935005187988, "global_step": 424984, "epoch": 2529} {"train_loss": -12.782537460327148, "global_step": 424985, "epoch": 2529} {"train_loss": -12.495166778564453, "global_step": 424986, "epoch": 2529} {"train_loss": -12.517143249511719, "global_step": 424987, "epoch": 2529} {"train_loss": -12.835184097290039, "global_step": 424988, "epoch": 2529} {"train_loss": -12.534378051757812, "global_step": 424989, "epoch": 2529} {"train_loss": -12.286534309387207, "global_step": 424990, "epoch": 2529} {"train_loss": -12.81143569946289, "global_step": 424991, "epoch": 2529} {"train_loss": -11.985528945922852, "global_step": 424992, "epoch": 2529} {"train_loss": -12.781206130981445, "global_step": 424993, "epoch": 2529} {"train_loss": -12.534773826599121, "global_step": 424994, "epoch": 2529} {"train_loss": -12.223016738891602, "global_step": 424995, "epoch": 2529} {"train_loss": -12.314643859863281, "global_step": 424996, "epoch": 2529} {"train_loss": -11.889838218688965, "global_step": 424997, "epoch": 2529} {"train_loss": -10.806827545166016, "global_step": 424998, "epoch": 2529} {"train_loss": -11.85526180267334, "global_step": 424999, "epoch": 2529} {"train_loss": -11.877874374389648, "global_step": 425000, "epoch": 2529} {"train_loss": -10.775870323181152, "global_step": 425001, "epoch": 2529} {"train_loss": -12.488631248474121, "global_step": 425002, "epoch": 2529} {"train_loss": -11.433308601379395, "global_step": 425003, "epoch": 2529} {"train_loss": -11.662580490112305, "global_step": 425004, "epoch": 2529} {"train_loss": -12.52863883972168, "global_step": 425005, "epoch": 2529} {"train_loss": -11.582324981689453, "global_step": 425006, "epoch": 2529} {"train_loss": -11.87042236328125, "global_step": 425007, "epoch": 2529} {"train_loss": -11.677350997924805, "global_step": 425008, "epoch": 2529} {"train_loss": -11.497660636901855, "global_step": 425009, "epoch": 2529} {"train_loss": -12.549288749694824, "global_step": 425010, "epoch": 2529} {"train_loss": -11.79658031463623, "global_step": 425011, "epoch": 2529} {"train_loss": -12.304141998291016, "global_step": 425012, "epoch": 2529} {"train_loss": -12.366033554077148, "global_step": 425013, "epoch": 2529} {"train_loss": -12.45490837097168, "global_step": 425014, "epoch": 2529} {"train_loss": -12.249213218688965, "global_step": 425015, "epoch": 2529} {"train_loss": -12.286149978637695, "global_step": 425016, "epoch": 2529} {"train_loss": -12.72903823852539, "global_step": 425017, "epoch": 2529} {"train_loss": -12.367757797241211, "global_step": 425018, "epoch": 2529} {"train_loss": -12.305804252624512, "global_step": 425019, "epoch": 2529} {"train_loss": -12.267285346984863, "global_step": 425020, "epoch": 2529} {"train_loss": -12.445703506469727, "global_step": 425021, "epoch": 2529} {"train_loss": -12.530008316040039, "global_step": 425022, "epoch": 2529} {"train_loss": -12.589997291564941, "global_step": 425023, "epoch": 2529} {"train_loss": -12.595210075378418, "global_step": 425024, "epoch": 2529} {"train_loss": -12.526346206665039, "global_step": 425025, "epoch": 2529} {"train_loss": -12.593165397644043, "global_step": 425026, "epoch": 2529} {"train_loss": -12.479740142822266, "global_step": 425027, "epoch": 2529} {"train_loss": -12.501688957214355, "global_step": 425028, "epoch": 2529} {"train_loss": -12.6954927444458, "global_step": 425029, "epoch": 2529} {"train_loss": -12.66015338897705, "global_step": 425030, "epoch": 2529} {"train_loss": -12.48244857788086, "global_step": 425031, "epoch": 2529} {"train_loss": -12.551081657409668, "global_step": 425032, "epoch": 2529} {"train_loss": -12.648666381835938, "global_step": 425033, "epoch": 2529} {"train_loss": -12.594478607177734, "global_step": 425034, "epoch": 2529} {"train_loss": -12.8604736328125, "global_step": 425035, "epoch": 2529} {"train_loss": -12.558122634887695, "global_step": 425036, "epoch": 2529} {"train_loss": -12.642066955566406, "global_step": 425037, "epoch": 2529} {"train_loss": -12.407026290893555, "global_step": 425038, "epoch": 2529} {"train_loss": -11.98256326289404, "global_step": 425039, "epoch": 2529, "val_loss": 309178.0} {"train_loss": -12.529755592346191, "global_step": 425040, "epoch": 2530} {"train_loss": -12.346101760864258, "global_step": 425041, "epoch": 2530} {"train_loss": -12.53493881225586, "global_step": 425042, "epoch": 2530} {"train_loss": -12.246807098388672, "global_step": 425043, "epoch": 2530} {"train_loss": -12.286920547485352, "global_step": 425044, "epoch": 2530} {"train_loss": -12.843921661376953, "global_step": 425045, "epoch": 2530} {"train_loss": -12.290914535522461, "global_step": 425046, "epoch": 2530} {"train_loss": -12.566435813903809, "global_step": 425047, "epoch": 2530} {"train_loss": -12.52037239074707, "global_step": 425048, "epoch": 2530} {"train_loss": -12.514068603515625, "global_step": 425049, "epoch": 2530} {"train_loss": -12.654848098754883, "global_step": 425050, "epoch": 2530} {"train_loss": -12.531499862670898, "global_step": 425051, "epoch": 2530} {"train_loss": -12.396688461303711, "global_step": 425052, "epoch": 2530} {"train_loss": -12.673402786254883, "global_step": 425053, "epoch": 2530} {"train_loss": -12.369392395019531, "global_step": 425054, "epoch": 2530} {"train_loss": -12.598849296569824, "global_step": 425055, "epoch": 2530} {"train_loss": -12.320042610168457, "global_step": 425056, "epoch": 2530} {"train_loss": -12.219030380249023, "global_step": 425057, "epoch": 2530} {"train_loss": -12.952848434448242, "global_step": 425058, "epoch": 2530} {"train_loss": -12.518256187438965, "global_step": 425059, "epoch": 2530} {"train_loss": -11.789835929870605, "global_step": 425060, "epoch": 2530} {"train_loss": -12.3552885055542, "global_step": 425061, "epoch": 2530} {"train_loss": -12.642351150512695, "global_step": 425062, "epoch": 2530} {"train_loss": -12.040644645690918, "global_step": 425063, "epoch": 2530} {"train_loss": -12.199338912963867, "global_step": 425064, "epoch": 2530} {"train_loss": -12.617610931396484, "global_step": 425065, "epoch": 2530} {"train_loss": -12.26637077331543, "global_step": 425066, "epoch": 2530} {"train_loss": -12.641423225402832, "global_step": 425067, "epoch": 2530} {"train_loss": -12.4910249710083, "global_step": 425068, "epoch": 2530} {"train_loss": -12.65831470489502, "global_step": 425069, "epoch": 2530} {"train_loss": -12.356246948242188, "global_step": 425070, "epoch": 2530} {"train_loss": -12.493997573852539, "global_step": 425071, "epoch": 2530} {"train_loss": -12.608650207519531, "global_step": 425072, "epoch": 2530} {"train_loss": -12.39315414428711, "global_step": 425073, "epoch": 2530} {"train_loss": -12.279581069946289, "global_step": 425074, "epoch": 2530} {"train_loss": -11.454578399658203, "global_step": 425075, "epoch": 2530} {"train_loss": -11.119030952453613, "global_step": 425076, "epoch": 2530} {"train_loss": -12.656867027282715, "global_step": 425077, "epoch": 2530} {"train_loss": -9.58584213256836, "global_step": 425078, "epoch": 2530} {"train_loss": -11.977367401123047, "global_step": 425079, "epoch": 2530} {"train_loss": -10.147436141967773, "global_step": 425080, "epoch": 2530} {"train_loss": -10.444520950317383, "global_step": 425081, "epoch": 2530} {"train_loss": -11.652271270751953, "global_step": 425082, "epoch": 2530} {"train_loss": -9.827043533325195, "global_step": 425083, "epoch": 2530} {"train_loss": -12.067063331604004, "global_step": 425084, "epoch": 2530} {"train_loss": -10.754159927368164, "global_step": 425085, "epoch": 2530} {"train_loss": -10.736949920654297, "global_step": 425086, "epoch": 2530} {"train_loss": -11.836359024047852, "global_step": 425087, "epoch": 2530} {"train_loss": -11.222416877746582, "global_step": 425088, "epoch": 2530} {"train_loss": -10.821039199829102, "global_step": 425089, "epoch": 2530} {"train_loss": -11.598773956298828, "global_step": 425090, "epoch": 2530} {"train_loss": -11.950197219848633, "global_step": 425091, "epoch": 2530} {"train_loss": -11.540199279785156, "global_step": 425092, "epoch": 2530} {"train_loss": -12.21054458618164, "global_step": 425093, "epoch": 2530} {"train_loss": -11.80526351928711, "global_step": 425094, "epoch": 2530} {"train_loss": -12.023880958557129, "global_step": 425095, "epoch": 2530} {"train_loss": -12.084396362304688, "global_step": 425096, "epoch": 2530} {"train_loss": -11.826119422912598, "global_step": 425097, "epoch": 2530} {"train_loss": -11.703864097595215, "global_step": 425098, "epoch": 2530} {"train_loss": -11.998127937316895, "global_step": 425099, "epoch": 2530} {"train_loss": -11.634142875671387, "global_step": 425100, "epoch": 2530} {"train_loss": -11.86088752746582, "global_step": 425101, "epoch": 2530} {"train_loss": -12.070769309997559, "global_step": 425102, "epoch": 2530} {"train_loss": -11.842840194702148, "global_step": 425103, "epoch": 2530} {"train_loss": -12.024051666259766, "global_step": 425104, "epoch": 2530} {"train_loss": -12.376630783081055, "global_step": 425105, "epoch": 2530} {"train_loss": -11.757713317871094, "global_step": 425106, "epoch": 2530} {"train_loss": -12.080549240112305, "global_step": 425107, "epoch": 2530} {"train_loss": -11.887227058410645, "global_step": 425108, "epoch": 2530} {"train_loss": -11.715950012207031, "global_step": 425109, "epoch": 2530} {"train_loss": -11.48765754699707, "global_step": 425110, "epoch": 2530} {"train_loss": -12.412185668945312, "global_step": 425111, "epoch": 2530} {"train_loss": -11.880934715270996, "global_step": 425112, "epoch": 2530} {"train_loss": -11.835294723510742, "global_step": 425113, "epoch": 2530} {"train_loss": -12.04820442199707, "global_step": 425114, "epoch": 2530} {"train_loss": -11.681198120117188, "global_step": 425115, "epoch": 2530} {"train_loss": -12.354188919067383, "global_step": 425116, "epoch": 2530} {"train_loss": -11.266375541687012, "global_step": 425117, "epoch": 2530} {"train_loss": -12.203563690185547, "global_step": 425118, "epoch": 2530} {"train_loss": -12.063727378845215, "global_step": 425119, "epoch": 2530} {"train_loss": -12.471817970275879, "global_step": 425120, "epoch": 2530} {"train_loss": -12.236283302307129, "global_step": 425121, "epoch": 2530} {"train_loss": -12.347475051879883, "global_step": 425122, "epoch": 2530} {"train_loss": -11.599935531616211, "global_step": 425123, "epoch": 2530} {"train_loss": -12.476981163024902, "global_step": 425124, "epoch": 2530} {"train_loss": -12.046859741210938, "global_step": 425125, "epoch": 2530} {"train_loss": -12.474710464477539, "global_step": 425126, "epoch": 2530} {"train_loss": -12.671138763427734, "global_step": 425127, "epoch": 2530} {"train_loss": -12.20407485961914, "global_step": 425128, "epoch": 2530} {"train_loss": -12.670097351074219, "global_step": 425129, "epoch": 2530} {"train_loss": -12.305749893188477, "global_step": 425130, "epoch": 2530} {"train_loss": -12.579399108886719, "global_step": 425131, "epoch": 2530} {"train_loss": -12.417048454284668, "global_step": 425132, "epoch": 2530} {"train_loss": -12.365313529968262, "global_step": 425133, "epoch": 2530} {"train_loss": -12.505376815795898, "global_step": 425134, "epoch": 2530} {"train_loss": -12.423135757446289, "global_step": 425135, "epoch": 2530} {"train_loss": -12.700876235961914, "global_step": 425136, "epoch": 2530} {"train_loss": -12.383245468139648, "global_step": 425137, "epoch": 2530} {"train_loss": -12.625938415527344, "global_step": 425138, "epoch": 2530} {"train_loss": -12.443532943725586, "global_step": 425139, "epoch": 2530} {"train_loss": -12.569948196411133, "global_step": 425140, "epoch": 2530} {"train_loss": -12.506342887878418, "global_step": 425141, "epoch": 2530} {"train_loss": -12.5075101852417, "global_step": 425142, "epoch": 2530} {"train_loss": -12.717144012451172, "global_step": 425143, "epoch": 2530} {"train_loss": -12.658048629760742, "global_step": 425144, "epoch": 2530} {"train_loss": -12.456709861755371, "global_step": 425145, "epoch": 2530} {"train_loss": -12.261341094970703, "global_step": 425146, "epoch": 2530} {"train_loss": -11.776851654052734, "global_step": 425147, "epoch": 2530} {"train_loss": -12.031325340270996, "global_step": 425148, "epoch": 2530} {"train_loss": -11.397525787353516, "global_step": 425149, "epoch": 2530} {"train_loss": -11.328874588012695, "global_step": 425150, "epoch": 2530} {"train_loss": -10.853141784667969, "global_step": 425151, "epoch": 2530} {"train_loss": -11.216691017150879, "global_step": 425152, "epoch": 2530} {"train_loss": -11.345771789550781, "global_step": 425153, "epoch": 2530} {"train_loss": -11.727546691894531, "global_step": 425154, "epoch": 2530} {"train_loss": -10.756750106811523, "global_step": 425155, "epoch": 2530} {"train_loss": -12.014348983764648, "global_step": 425156, "epoch": 2530} {"train_loss": -10.985918998718262, "global_step": 425157, "epoch": 2530} {"train_loss": -11.79385757446289, "global_step": 425158, "epoch": 2530} {"train_loss": -11.575763702392578, "global_step": 425159, "epoch": 2530} {"train_loss": -10.704768180847168, "global_step": 425160, "epoch": 2530} {"train_loss": -12.14193344116211, "global_step": 425161, "epoch": 2530} {"train_loss": -10.94848918914795, "global_step": 425162, "epoch": 2530} {"train_loss": -11.968114852905273, "global_step": 425163, "epoch": 2530} {"train_loss": -11.24350357055664, "global_step": 425164, "epoch": 2530} {"train_loss": -11.666219711303711, "global_step": 425165, "epoch": 2530} {"train_loss": -11.36413288116455, "global_step": 425166, "epoch": 2530} {"train_loss": -12.248190879821777, "global_step": 425167, "epoch": 2530} {"train_loss": -11.217501640319824, "global_step": 425168, "epoch": 2530} {"train_loss": -11.923258781433105, "global_step": 425169, "epoch": 2530} {"train_loss": -11.533138275146484, "global_step": 425170, "epoch": 2530} {"train_loss": -11.329238891601562, "global_step": 425171, "epoch": 2530} {"train_loss": -11.938199996948242, "global_step": 425172, "epoch": 2530} {"train_loss": -11.177399635314941, "global_step": 425173, "epoch": 2530} {"train_loss": -11.695253372192383, "global_step": 425174, "epoch": 2530} {"train_loss": -10.842755317687988, "global_step": 425175, "epoch": 2530} {"train_loss": -11.78175163269043, "global_step": 425176, "epoch": 2530} {"train_loss": -11.821313858032227, "global_step": 425177, "epoch": 2530} {"train_loss": -11.348634719848633, "global_step": 425178, "epoch": 2530} {"train_loss": -11.859755516052246, "global_step": 425179, "epoch": 2530} {"train_loss": -11.673624038696289, "global_step": 425180, "epoch": 2530} {"train_loss": -11.599163055419922, "global_step": 425181, "epoch": 2530} {"train_loss": -12.209410667419434, "global_step": 425182, "epoch": 2530} {"train_loss": -10.998495101928711, "global_step": 425183, "epoch": 2530} {"train_loss": -12.204727172851562, "global_step": 425184, "epoch": 2530} {"train_loss": -11.242927551269531, "global_step": 425185, "epoch": 2530} {"train_loss": -12.00490665435791, "global_step": 425186, "epoch": 2530} {"train_loss": -11.702527046203613, "global_step": 425187, "epoch": 2530} {"train_loss": -11.69767951965332, "global_step": 425188, "epoch": 2530} {"train_loss": -10.606053352355957, "global_step": 425189, "epoch": 2530} {"train_loss": -10.966115951538086, "global_step": 425190, "epoch": 2530} {"train_loss": -11.16696834564209, "global_step": 425191, "epoch": 2530} {"train_loss": -10.989692687988281, "global_step": 425192, "epoch": 2530} {"train_loss": -10.485038757324219, "global_step": 425193, "epoch": 2530} {"train_loss": -10.951798439025879, "global_step": 425194, "epoch": 2530} {"train_loss": -9.958535194396973, "global_step": 425195, "epoch": 2530} {"train_loss": -10.640800476074219, "global_step": 425196, "epoch": 2530} {"train_loss": -11.543649673461914, "global_step": 425197, "epoch": 2530} {"train_loss": -10.71479606628418, "global_step": 425198, "epoch": 2530} {"train_loss": -12.005369186401367, "global_step": 425199, "epoch": 2530} {"train_loss": -10.8609037399292, "global_step": 425200, "epoch": 2530} {"train_loss": -12.374250411987305, "global_step": 425201, "epoch": 2530} {"train_loss": -11.385488510131836, "global_step": 425202, "epoch": 2530} {"train_loss": -11.853281021118164, "global_step": 425203, "epoch": 2530} {"train_loss": -11.214497566223145, "global_step": 425204, "epoch": 2530} {"train_loss": -11.520748138427734, "global_step": 425205, "epoch": 2530} {"train_loss": -11.199371337890625, "global_step": 425206, "epoch": 2530} {"train_loss": -11.856538403601874, "global_step": 425207, "epoch": 2530, "val_loss": 307024.75, "train_action_mse_error": 1.7700371742248535} {"train_loss": -11.350411415100098, "global_step": 425208, "epoch": 2531} {"train_loss": -11.198814392089844, "global_step": 425209, "epoch": 2531} {"train_loss": -10.635477066040039, "global_step": 425210, "epoch": 2531} {"train_loss": -10.452457427978516, "global_step": 425211, "epoch": 2531} {"train_loss": -10.599740028381348, "global_step": 425212, "epoch": 2531} {"train_loss": -12.212081909179688, "global_step": 425213, "epoch": 2531} {"train_loss": -10.399548530578613, "global_step": 425214, "epoch": 2531} {"train_loss": -11.350126266479492, "global_step": 425215, "epoch": 2531} {"train_loss": -10.570243835449219, "global_step": 425216, "epoch": 2531} {"train_loss": -11.370230674743652, "global_step": 425217, "epoch": 2531} {"train_loss": -10.675933837890625, "global_step": 425218, "epoch": 2531} {"train_loss": -11.568258285522461, "global_step": 425219, "epoch": 2531} {"train_loss": -9.781766891479492, "global_step": 425220, "epoch": 2531} {"train_loss": -11.081923484802246, "global_step": 425221, "epoch": 2531} {"train_loss": -11.379684448242188, "global_step": 425222, "epoch": 2531} {"train_loss": -10.742393493652344, "global_step": 425223, "epoch": 2531} {"train_loss": -11.68875503540039, "global_step": 425224, "epoch": 2531} {"train_loss": -10.8657865524292, "global_step": 425225, "epoch": 2531} {"train_loss": -11.394765853881836, "global_step": 425226, "epoch": 2531} {"train_loss": -10.669015884399414, "global_step": 425227, "epoch": 2531} {"train_loss": -11.391925811767578, "global_step": 425228, "epoch": 2531} {"train_loss": -10.689209938049316, "global_step": 425229, "epoch": 2531} {"train_loss": -12.075723648071289, "global_step": 425230, "epoch": 2531} {"train_loss": -10.997137069702148, "global_step": 425231, "epoch": 2531} {"train_loss": -11.282272338867188, "global_step": 425232, "epoch": 2531} {"train_loss": -11.548751831054688, "global_step": 425233, "epoch": 2531} {"train_loss": -11.530529022216797, "global_step": 425234, "epoch": 2531} {"train_loss": -10.983856201171875, "global_step": 425235, "epoch": 2531} {"train_loss": -11.359073638916016, "global_step": 425236, "epoch": 2531} {"train_loss": -11.827386856079102, "global_step": 425237, "epoch": 2531} {"train_loss": -10.940174102783203, "global_step": 425238, "epoch": 2531} {"train_loss": -11.676389694213867, "global_step": 425239, "epoch": 2531} {"train_loss": -11.158499717712402, "global_step": 425240, "epoch": 2531} {"train_loss": -11.407505989074707, "global_step": 425241, "epoch": 2531} {"train_loss": -12.108963966369629, "global_step": 425242, "epoch": 2531} {"train_loss": -11.393863677978516, "global_step": 425243, "epoch": 2531} {"train_loss": -11.950603485107422, "global_step": 425244, "epoch": 2531} {"train_loss": -11.435869216918945, "global_step": 425245, "epoch": 2531} {"train_loss": -12.211288452148438, "global_step": 425246, "epoch": 2531} {"train_loss": -11.174839973449707, "global_step": 425247, "epoch": 2531} {"train_loss": -12.342180252075195, "global_step": 425248, "epoch": 2531} {"train_loss": -11.569524765014648, "global_step": 425249, "epoch": 2531} {"train_loss": -11.507431030273438, "global_step": 425250, "epoch": 2531} {"train_loss": -12.035700798034668, "global_step": 425251, "epoch": 2531} {"train_loss": -11.653209686279297, "global_step": 425252, "epoch": 2531} {"train_loss": -12.223505020141602, "global_step": 425253, "epoch": 2531} {"train_loss": -11.618210792541504, "global_step": 425254, "epoch": 2531} {"train_loss": -12.460000991821289, "global_step": 425255, "epoch": 2531} {"train_loss": -11.891741752624512, "global_step": 425256, "epoch": 2531} {"train_loss": -12.213720321655273, "global_step": 425257, "epoch": 2531} {"train_loss": -12.173728942871094, "global_step": 425258, "epoch": 2531} {"train_loss": -12.139827728271484, "global_step": 425259, "epoch": 2531} {"train_loss": -12.262007713317871, "global_step": 425260, "epoch": 2531} {"train_loss": -12.114686965942383, "global_step": 425261, "epoch": 2531} {"train_loss": -12.377584457397461, "global_step": 425262, "epoch": 2531} {"train_loss": -12.028995513916016, "global_step": 425263, "epoch": 2531} {"train_loss": -12.264337539672852, "global_step": 425264, "epoch": 2531} {"train_loss": -12.361412048339844, "global_step": 425265, "epoch": 2531} {"train_loss": -12.186540603637695, "global_step": 425266, "epoch": 2531} {"train_loss": -12.253549575805664, "global_step": 425267, "epoch": 2531} {"train_loss": -12.160572052001953, "global_step": 425268, "epoch": 2531} {"train_loss": -12.44056510925293, "global_step": 425269, "epoch": 2531} {"train_loss": -12.564918518066406, "global_step": 425270, "epoch": 2531} {"train_loss": -12.24799919128418, "global_step": 425271, "epoch": 2531} {"train_loss": -12.431814193725586, "global_step": 425272, "epoch": 2531} {"train_loss": -12.446210861206055, "global_step": 425273, "epoch": 2531} {"train_loss": -12.359031677246094, "global_step": 425274, "epoch": 2531} {"train_loss": -12.305349349975586, "global_step": 425275, "epoch": 2531} {"train_loss": -12.58038330078125, "global_step": 425276, "epoch": 2531} {"train_loss": -12.59524154663086, "global_step": 425277, "epoch": 2531} {"train_loss": -12.378064155578613, "global_step": 425278, "epoch": 2531} {"train_loss": -12.484959602355957, "global_step": 425279, "epoch": 2531} {"train_loss": -12.516660690307617, "global_step": 425280, "epoch": 2531} {"train_loss": -12.333463668823242, "global_step": 425281, "epoch": 2531} {"train_loss": -12.533947944641113, "global_step": 425282, "epoch": 2531} {"train_loss": -12.706575393676758, "global_step": 425283, "epoch": 2531} {"train_loss": -12.568633079528809, "global_step": 425284, "epoch": 2531} {"train_loss": -12.489508628845215, "global_step": 425285, "epoch": 2531} {"train_loss": -12.634060859680176, "global_step": 425286, "epoch": 2531} {"train_loss": -12.549266815185547, "global_step": 425287, "epoch": 2531} {"train_loss": -12.581120491027832, "global_step": 425288, "epoch": 2531} {"train_loss": -12.7662935256958, "global_step": 425289, "epoch": 2531} {"train_loss": -12.711845397949219, "global_step": 425290, "epoch": 2531} {"train_loss": -12.71902847290039, "global_step": 425291, "epoch": 2531} {"train_loss": -12.386653900146484, "global_step": 425292, "epoch": 2531} {"train_loss": -12.674301147460938, "global_step": 425293, "epoch": 2531} {"train_loss": -12.260520935058594, "global_step": 425294, "epoch": 2531} {"train_loss": -12.391060829162598, "global_step": 425295, "epoch": 2531} {"train_loss": -12.47309684753418, "global_step": 425296, "epoch": 2531} {"train_loss": -12.370867729187012, "global_step": 425297, "epoch": 2531} {"train_loss": -12.354330062866211, "global_step": 425298, "epoch": 2531} {"train_loss": -12.455207824707031, "global_step": 425299, "epoch": 2531} {"train_loss": -12.353120803833008, "global_step": 425300, "epoch": 2531} {"train_loss": -12.664800643920898, "global_step": 425301, "epoch": 2531} {"train_loss": -12.518706321716309, "global_step": 425302, "epoch": 2531} {"train_loss": -12.483453750610352, "global_step": 425303, "epoch": 2531} {"train_loss": -12.416728973388672, "global_step": 425304, "epoch": 2531} {"train_loss": -12.73737907409668, "global_step": 425305, "epoch": 2531} {"train_loss": -12.260334014892578, "global_step": 425306, "epoch": 2531} {"train_loss": -12.663163185119629, "global_step": 425307, "epoch": 2531} {"train_loss": -12.543054580688477, "global_step": 425308, "epoch": 2531} {"train_loss": -12.585626602172852, "global_step": 425309, "epoch": 2531} {"train_loss": -12.626432418823242, "global_step": 425310, "epoch": 2531} {"train_loss": -12.739883422851562, "global_step": 425311, "epoch": 2531} {"train_loss": -12.579219818115234, "global_step": 425312, "epoch": 2531} {"train_loss": -12.724113464355469, "global_step": 425313, "epoch": 2531} {"train_loss": -12.517881393432617, "global_step": 425314, "epoch": 2531} {"train_loss": -12.722931861877441, "global_step": 425315, "epoch": 2531} {"train_loss": -12.738611221313477, "global_step": 425316, "epoch": 2531} {"train_loss": -12.738840103149414, "global_step": 425317, "epoch": 2531} {"train_loss": -12.953947067260742, "global_step": 425318, "epoch": 2531} {"train_loss": -12.674398422241211, "global_step": 425319, "epoch": 2531} {"train_loss": -12.66174602508545, "global_step": 425320, "epoch": 2531} {"train_loss": -12.503618240356445, "global_step": 425321, "epoch": 2531} {"train_loss": -12.504352569580078, "global_step": 425322, "epoch": 2531} {"train_loss": -12.834182739257812, "global_step": 425323, "epoch": 2531} {"train_loss": -12.655311584472656, "global_step": 425324, "epoch": 2531} {"train_loss": -12.835748672485352, "global_step": 425325, "epoch": 2531} {"train_loss": -12.696293830871582, "global_step": 425326, "epoch": 2531} {"train_loss": -12.854789733886719, "global_step": 425327, "epoch": 2531} {"train_loss": -12.683919906616211, "global_step": 425328, "epoch": 2531} {"train_loss": -12.86196517944336, "global_step": 425329, "epoch": 2531} {"train_loss": -12.80250072479248, "global_step": 425330, "epoch": 2531} {"train_loss": -12.869649887084961, "global_step": 425331, "epoch": 2531} {"train_loss": -12.739779472351074, "global_step": 425332, "epoch": 2531} {"train_loss": -12.731351852416992, "global_step": 425333, "epoch": 2531} {"train_loss": -12.705498695373535, "global_step": 425334, "epoch": 2531} {"train_loss": -12.59967041015625, "global_step": 425335, "epoch": 2531} {"train_loss": -12.704309463500977, "global_step": 425336, "epoch": 2531} {"train_loss": -12.706795692443848, "global_step": 425337, "epoch": 2531} {"train_loss": -12.424480438232422, "global_step": 425338, "epoch": 2531} {"train_loss": -12.81627082824707, "global_step": 425339, "epoch": 2531} {"train_loss": -12.685327529907227, "global_step": 425340, "epoch": 2531} {"train_loss": -12.749882698059082, "global_step": 425341, "epoch": 2531} {"train_loss": -12.292149543762207, "global_step": 425342, "epoch": 2531} {"train_loss": -11.970481872558594, "global_step": 425343, "epoch": 2531} {"train_loss": -12.63821792602539, "global_step": 425344, "epoch": 2531} {"train_loss": -12.565479278564453, "global_step": 425345, "epoch": 2531} {"train_loss": -12.369327545166016, "global_step": 425346, "epoch": 2531} {"train_loss": -12.714110374450684, "global_step": 425347, "epoch": 2531} {"train_loss": -12.414138793945312, "global_step": 425348, "epoch": 2531} {"train_loss": -11.955394744873047, "global_step": 425349, "epoch": 2531} {"train_loss": -12.648665428161621, "global_step": 425350, "epoch": 2531} {"train_loss": -12.694713592529297, "global_step": 425351, "epoch": 2531} {"train_loss": -12.626871109008789, "global_step": 425352, "epoch": 2531} {"train_loss": -12.700469017028809, "global_step": 425353, "epoch": 2531} {"train_loss": -12.692682266235352, "global_step": 425354, "epoch": 2531} {"train_loss": -12.55979061126709, "global_step": 425355, "epoch": 2531} {"train_loss": -12.752158164978027, "global_step": 425356, "epoch": 2531} {"train_loss": -12.524155616760254, "global_step": 425357, "epoch": 2531} {"train_loss": -12.339946746826172, "global_step": 425358, "epoch": 2531} {"train_loss": -12.71320915222168, "global_step": 425359, "epoch": 2531} {"train_loss": -12.156143188476562, "global_step": 425360, "epoch": 2531} {"train_loss": -12.175207138061523, "global_step": 425361, "epoch": 2531} {"train_loss": -12.380973815917969, "global_step": 425362, "epoch": 2531} {"train_loss": -11.817340850830078, "global_step": 425363, "epoch": 2531} {"train_loss": -12.01893424987793, "global_step": 425364, "epoch": 2531} {"train_loss": -12.071219444274902, "global_step": 425365, "epoch": 2531} {"train_loss": -12.630484580993652, "global_step": 425366, "epoch": 2531} {"train_loss": -12.193681716918945, "global_step": 425367, "epoch": 2531} {"train_loss": -12.414387702941895, "global_step": 425368, "epoch": 2531} {"train_loss": -12.48618221282959, "global_step": 425369, "epoch": 2531} {"train_loss": -12.415359497070312, "global_step": 425370, "epoch": 2531} {"train_loss": -12.43032455444336, "global_step": 425371, "epoch": 2531} {"train_loss": -12.338051795959473, "global_step": 425372, "epoch": 2531} {"train_loss": -12.140934944152832, "global_step": 425373, "epoch": 2531} {"train_loss": -12.18471908569336, "global_step": 425374, "epoch": 2531} {"train_loss": -12.167356184550695, "global_step": 425375, "epoch": 2531, "val_loss": 307730.625} {"train_loss": -12.073975563049316, "global_step": 425376, "epoch": 2532} {"train_loss": -12.358572006225586, "global_step": 425377, "epoch": 2532} {"train_loss": -12.476935386657715, "global_step": 425378, "epoch": 2532} {"train_loss": -12.307599067687988, "global_step": 425379, "epoch": 2532} {"train_loss": -12.15870189666748, "global_step": 425380, "epoch": 2532} {"train_loss": -11.902827262878418, "global_step": 425381, "epoch": 2532} {"train_loss": -12.177356719970703, "global_step": 425382, "epoch": 2532} {"train_loss": -11.873836517333984, "global_step": 425383, "epoch": 2532} {"train_loss": -11.136625289916992, "global_step": 425384, "epoch": 2532} {"train_loss": -10.779840469360352, "global_step": 425385, "epoch": 2532} {"train_loss": -12.086006164550781, "global_step": 425386, "epoch": 2532} {"train_loss": -9.286215782165527, "global_step": 425387, "epoch": 2532} {"train_loss": -9.853503227233887, "global_step": 425388, "epoch": 2532} {"train_loss": -9.095081329345703, "global_step": 425389, "epoch": 2532} {"train_loss": -10.230135917663574, "global_step": 425390, "epoch": 2532} {"train_loss": -10.075475692749023, "global_step": 425391, "epoch": 2532} {"train_loss": -10.879447937011719, "global_step": 425392, "epoch": 2532} {"train_loss": -9.348426818847656, "global_step": 425393, "epoch": 2532} {"train_loss": -10.617542266845703, "global_step": 425394, "epoch": 2532} {"train_loss": -9.18492317199707, "global_step": 425395, "epoch": 2532} {"train_loss": -10.448559761047363, "global_step": 425396, "epoch": 2532} {"train_loss": -8.291682243347168, "global_step": 425397, "epoch": 2532} {"train_loss": -8.445087432861328, "global_step": 425398, "epoch": 2532} {"train_loss": -8.679243087768555, "global_step": 425399, "epoch": 2532} {"train_loss": -10.911478996276855, "global_step": 425400, "epoch": 2532} {"train_loss": -10.148614883422852, "global_step": 425401, "epoch": 2532} {"train_loss": -9.504446029663086, "global_step": 425402, "epoch": 2532} {"train_loss": -10.515307426452637, "global_step": 425403, "epoch": 2532} {"train_loss": -10.186567306518555, "global_step": 425404, "epoch": 2532} {"train_loss": -10.63907527923584, "global_step": 425405, "epoch": 2532} {"train_loss": -10.785717964172363, "global_step": 425406, "epoch": 2532} {"train_loss": -9.221569061279297, "global_step": 425407, "epoch": 2532} {"train_loss": -11.706914901733398, "global_step": 425408, "epoch": 2532} {"train_loss": -9.892066955566406, "global_step": 425409, "epoch": 2532} {"train_loss": -10.91087532043457, "global_step": 425410, "epoch": 2532} {"train_loss": -11.14987564086914, "global_step": 425411, "epoch": 2532} {"train_loss": -10.56250286102295, "global_step": 425412, "epoch": 2532} {"train_loss": -11.88410758972168, "global_step": 425413, "epoch": 2532} {"train_loss": -11.048661231994629, "global_step": 425414, "epoch": 2532} {"train_loss": -10.768791198730469, "global_step": 425415, "epoch": 2532} {"train_loss": -11.968439102172852, "global_step": 425416, "epoch": 2532} {"train_loss": -10.667362213134766, "global_step": 425417, "epoch": 2532} {"train_loss": -11.648517608642578, "global_step": 425418, "epoch": 2532} {"train_loss": -11.855912208557129, "global_step": 425419, "epoch": 2532} {"train_loss": -11.473832130432129, "global_step": 425420, "epoch": 2532} {"train_loss": -11.923308372497559, "global_step": 425421, "epoch": 2532} {"train_loss": -11.82520866394043, "global_step": 425422, "epoch": 2532} {"train_loss": -11.919474601745605, "global_step": 425423, "epoch": 2532} {"train_loss": -12.135147094726562, "global_step": 425424, "epoch": 2532} {"train_loss": -11.478874206542969, "global_step": 425425, "epoch": 2532} {"train_loss": -11.994009017944336, "global_step": 425426, "epoch": 2532} {"train_loss": -11.571685791015625, "global_step": 425427, "epoch": 2532} {"train_loss": -11.904308319091797, "global_step": 425428, "epoch": 2532} {"train_loss": -11.752860069274902, "global_step": 425429, "epoch": 2532} {"train_loss": -11.878473281860352, "global_step": 425430, "epoch": 2532} {"train_loss": -11.854016304016113, "global_step": 425431, "epoch": 2532} {"train_loss": -12.304669380187988, "global_step": 425432, "epoch": 2532} {"train_loss": -11.988977432250977, "global_step": 425433, "epoch": 2532} {"train_loss": -12.295761108398438, "global_step": 425434, "epoch": 2532} {"train_loss": -12.066057205200195, "global_step": 425435, "epoch": 2532} {"train_loss": -12.371563911437988, "global_step": 425436, "epoch": 2532} {"train_loss": -12.072218894958496, "global_step": 425437, "epoch": 2532} {"train_loss": -12.218546867370605, "global_step": 425438, "epoch": 2532} {"train_loss": -12.27400016784668, "global_step": 425439, "epoch": 2532} {"train_loss": -12.382081985473633, "global_step": 425440, "epoch": 2532} {"train_loss": -12.16790771484375, "global_step": 425441, "epoch": 2532} {"train_loss": -12.426101684570312, "global_step": 425442, "epoch": 2532} {"train_loss": -12.191690444946289, "global_step": 425443, "epoch": 2532} {"train_loss": -12.372941970825195, "global_step": 425444, "epoch": 2532} {"train_loss": -12.109451293945312, "global_step": 425445, "epoch": 2532} {"train_loss": -12.405593872070312, "global_step": 425446, "epoch": 2532} {"train_loss": -12.041780471801758, "global_step": 425447, "epoch": 2532} {"train_loss": -12.48870849609375, "global_step": 425448, "epoch": 2532} {"train_loss": -12.254358291625977, "global_step": 425449, "epoch": 2532} {"train_loss": -12.584568977355957, "global_step": 425450, "epoch": 2532} {"train_loss": -12.27873706817627, "global_step": 425451, "epoch": 2532} {"train_loss": -12.448580741882324, "global_step": 425452, "epoch": 2532} {"train_loss": -12.339207649230957, "global_step": 425453, "epoch": 2532} {"train_loss": -12.530343055725098, "global_step": 425454, "epoch": 2532} {"train_loss": -12.492944717407227, "global_step": 425455, "epoch": 2532} {"train_loss": -12.324565887451172, "global_step": 425456, "epoch": 2532} {"train_loss": -12.487130165100098, "global_step": 425457, "epoch": 2532} {"train_loss": -12.32375431060791, "global_step": 425458, "epoch": 2532} {"train_loss": -12.641497611999512, "global_step": 425459, "epoch": 2532} {"train_loss": -12.351795196533203, "global_step": 425460, "epoch": 2532} {"train_loss": -12.638370513916016, "global_step": 425461, "epoch": 2532} {"train_loss": -12.573229789733887, "global_step": 425462, "epoch": 2532} {"train_loss": -12.617449760437012, "global_step": 425463, "epoch": 2532} {"train_loss": -12.632144927978516, "global_step": 425464, "epoch": 2532} {"train_loss": -12.706245422363281, "global_step": 425465, "epoch": 2532} {"train_loss": -12.252372741699219, "global_step": 425466, "epoch": 2532} {"train_loss": -12.699047088623047, "global_step": 425467, "epoch": 2532} {"train_loss": -12.392000198364258, "global_step": 425468, "epoch": 2532} {"train_loss": -12.692020416259766, "global_step": 425469, "epoch": 2532} {"train_loss": -12.660355567932129, "global_step": 425470, "epoch": 2532} {"train_loss": -12.577461242675781, "global_step": 425471, "epoch": 2532} {"train_loss": -12.577003479003906, "global_step": 425472, "epoch": 2532} {"train_loss": -12.723254203796387, "global_step": 425473, "epoch": 2532} {"train_loss": -12.419424057006836, "global_step": 425474, "epoch": 2532} {"train_loss": -12.558708190917969, "global_step": 425475, "epoch": 2532} {"train_loss": -12.648839950561523, "global_step": 425476, "epoch": 2532} {"train_loss": -12.668899536132812, "global_step": 425477, "epoch": 2532} {"train_loss": -12.674173355102539, "global_step": 425478, "epoch": 2532} {"train_loss": -12.551013946533203, "global_step": 425479, "epoch": 2532} {"train_loss": -12.734702110290527, "global_step": 425480, "epoch": 2532} {"train_loss": -12.753169059753418, "global_step": 425481, "epoch": 2532} {"train_loss": -12.588335990905762, "global_step": 425482, "epoch": 2532} {"train_loss": -12.777387619018555, "global_step": 425483, "epoch": 2532} {"train_loss": -12.824943542480469, "global_step": 425484, "epoch": 2532} {"train_loss": -12.740063667297363, "global_step": 425485, "epoch": 2532} {"train_loss": -12.684989929199219, "global_step": 425486, "epoch": 2532} {"train_loss": -12.721914291381836, "global_step": 425487, "epoch": 2532} {"train_loss": -12.633983612060547, "global_step": 425488, "epoch": 2532} {"train_loss": -12.757278442382812, "global_step": 425489, "epoch": 2532} {"train_loss": -12.728809356689453, "global_step": 425490, "epoch": 2532} {"train_loss": -12.852041244506836, "global_step": 425491, "epoch": 2532} {"train_loss": -12.64382553100586, "global_step": 425492, "epoch": 2532} {"train_loss": -12.600793838500977, "global_step": 425493, "epoch": 2532} {"train_loss": -12.703271865844727, "global_step": 425494, "epoch": 2532} {"train_loss": -12.629051208496094, "global_step": 425495, "epoch": 2532} {"train_loss": -12.813976287841797, "global_step": 425496, "epoch": 2532} {"train_loss": -12.704623222351074, "global_step": 425497, "epoch": 2532} {"train_loss": -12.982288360595703, "global_step": 425498, "epoch": 2532} {"train_loss": -12.605812072753906, "global_step": 425499, "epoch": 2532} {"train_loss": -12.882542610168457, "global_step": 425500, "epoch": 2532} {"train_loss": -12.776789665222168, "global_step": 425501, "epoch": 2532} {"train_loss": -12.602916717529297, "global_step": 425502, "epoch": 2532} {"train_loss": -12.75296688079834, "global_step": 425503, "epoch": 2532} {"train_loss": -12.789121627807617, "global_step": 425504, "epoch": 2532} {"train_loss": -12.817009925842285, "global_step": 425505, "epoch": 2532} {"train_loss": -12.78136920928955, "global_step": 425506, "epoch": 2532} {"train_loss": -12.760873794555664, "global_step": 425507, "epoch": 2532} {"train_loss": -12.403793334960938, "global_step": 425508, "epoch": 2532} {"train_loss": -12.92378044128418, "global_step": 425509, "epoch": 2532} {"train_loss": -12.502561569213867, "global_step": 425510, "epoch": 2532} {"train_loss": -12.785212516784668, "global_step": 425511, "epoch": 2532} {"train_loss": -12.678568840026855, "global_step": 425512, "epoch": 2532} {"train_loss": -12.188440322875977, "global_step": 425513, "epoch": 2532} {"train_loss": -12.724982261657715, "global_step": 425514, "epoch": 2532} {"train_loss": -12.908557891845703, "global_step": 425515, "epoch": 2532} {"train_loss": -12.450109481811523, "global_step": 425516, "epoch": 2532} {"train_loss": -12.563274383544922, "global_step": 425517, "epoch": 2532} {"train_loss": -12.592643737792969, "global_step": 425518, "epoch": 2532} {"train_loss": -12.648858070373535, "global_step": 425519, "epoch": 2532} {"train_loss": -12.786725997924805, "global_step": 425520, "epoch": 2532} {"train_loss": -12.718842506408691, "global_step": 425521, "epoch": 2532} {"train_loss": -12.811786651611328, "global_step": 425522, "epoch": 2532} {"train_loss": -12.847912788391113, "global_step": 425523, "epoch": 2532} {"train_loss": -12.66606330871582, "global_step": 425524, "epoch": 2532} {"train_loss": -12.70844841003418, "global_step": 425525, "epoch": 2532} {"train_loss": -12.63623046875, "global_step": 425526, "epoch": 2532} {"train_loss": -12.733612060546875, "global_step": 425527, "epoch": 2532} {"train_loss": -12.408594131469727, "global_step": 425528, "epoch": 2532} {"train_loss": -12.737367630004883, "global_step": 425529, "epoch": 2532} {"train_loss": -12.657072067260742, "global_step": 425530, "epoch": 2532} {"train_loss": -12.138885498046875, "global_step": 425531, "epoch": 2532} {"train_loss": -12.374258041381836, "global_step": 425532, "epoch": 2532} {"train_loss": -12.798559188842773, "global_step": 425533, "epoch": 2532} {"train_loss": -11.806503295898438, "global_step": 425534, "epoch": 2532} {"train_loss": -10.905621528625488, "global_step": 425535, "epoch": 2532} {"train_loss": -12.280888557434082, "global_step": 425536, "epoch": 2532} {"train_loss": -10.35684585571289, "global_step": 425537, "epoch": 2532} {"train_loss": -11.008766174316406, "global_step": 425538, "epoch": 2532} {"train_loss": -11.932259559631348, "global_step": 425539, "epoch": 2532} {"train_loss": -11.225232124328613, "global_step": 425540, "epoch": 2532} {"train_loss": -11.478944778442383, "global_step": 425541, "epoch": 2532} {"train_loss": -10.890632629394531, "global_step": 425542, "epoch": 2532} {"train_loss": -11.950309770447868, "global_step": 425543, "epoch": 2532, "val_loss": 304227.53125} {"train_loss": -11.288593292236328, "global_step": 425544, "epoch": 2533} {"train_loss": -10.354936599731445, "global_step": 425545, "epoch": 2533} {"train_loss": -10.31387710571289, "global_step": 425546, "epoch": 2533} {"train_loss": -11.233736991882324, "global_step": 425547, "epoch": 2533} {"train_loss": -10.427779197692871, "global_step": 425548, "epoch": 2533} {"train_loss": -10.819156646728516, "global_step": 425549, "epoch": 2533} {"train_loss": -11.97549057006836, "global_step": 425550, "epoch": 2533} {"train_loss": -9.291366577148438, "global_step": 425551, "epoch": 2533} {"train_loss": -11.548150062561035, "global_step": 425552, "epoch": 2533} {"train_loss": -10.943456649780273, "global_step": 425553, "epoch": 2533} {"train_loss": -11.68414306640625, "global_step": 425554, "epoch": 2533} {"train_loss": -11.294000625610352, "global_step": 425555, "epoch": 2533} {"train_loss": -11.326796531677246, "global_step": 425556, "epoch": 2533} {"train_loss": -11.342639923095703, "global_step": 425557, "epoch": 2533} {"train_loss": -11.0739164352417, "global_step": 425558, "epoch": 2533} {"train_loss": -11.570173263549805, "global_step": 425559, "epoch": 2533} {"train_loss": -11.172325134277344, "global_step": 425560, "epoch": 2533} {"train_loss": -11.418876647949219, "global_step": 425561, "epoch": 2533} {"train_loss": -11.696367263793945, "global_step": 425562, "epoch": 2533} {"train_loss": -11.323837280273438, "global_step": 425563, "epoch": 2533} {"train_loss": -11.832757949829102, "global_step": 425564, "epoch": 2533} {"train_loss": -11.634026527404785, "global_step": 425565, "epoch": 2533} {"train_loss": -11.54856014251709, "global_step": 425566, "epoch": 2533} {"train_loss": -12.047089576721191, "global_step": 425567, "epoch": 2533} {"train_loss": -11.209080696105957, "global_step": 425568, "epoch": 2533} {"train_loss": -11.464715957641602, "global_step": 425569, "epoch": 2533} {"train_loss": -12.101277351379395, "global_step": 425570, "epoch": 2533} {"train_loss": -11.823648452758789, "global_step": 425571, "epoch": 2533} {"train_loss": -11.633245468139648, "global_step": 425572, "epoch": 2533} {"train_loss": -11.6624755859375, "global_step": 425573, "epoch": 2533} {"train_loss": -11.206668853759766, "global_step": 425574, "epoch": 2533} {"train_loss": -11.379400253295898, "global_step": 425575, "epoch": 2533} {"train_loss": -12.16884994506836, "global_step": 425576, "epoch": 2533} {"train_loss": -11.138944625854492, "global_step": 425577, "epoch": 2533} {"train_loss": -12.153400421142578, "global_step": 425578, "epoch": 2533} {"train_loss": -11.073385238647461, "global_step": 425579, "epoch": 2533} {"train_loss": -12.405725479125977, "global_step": 425580, "epoch": 2533} {"train_loss": -11.301231384277344, "global_step": 425581, "epoch": 2533} {"train_loss": -11.813841819763184, "global_step": 425582, "epoch": 2533} {"train_loss": -12.447284698486328, "global_step": 425583, "epoch": 2533} {"train_loss": -11.589641571044922, "global_step": 425584, "epoch": 2533} {"train_loss": -12.347457885742188, "global_step": 425585, "epoch": 2533} {"train_loss": -11.971687316894531, "global_step": 425586, "epoch": 2533} {"train_loss": -12.310813903808594, "global_step": 425587, "epoch": 2533} {"train_loss": -11.70484733581543, "global_step": 425588, "epoch": 2533} {"train_loss": -11.97657299041748, "global_step": 425589, "epoch": 2533} {"train_loss": -11.644959449768066, "global_step": 425590, "epoch": 2533} {"train_loss": -11.463305473327637, "global_step": 425591, "epoch": 2533} {"train_loss": -12.292135238647461, "global_step": 425592, "epoch": 2533} {"train_loss": -12.110572814941406, "global_step": 425593, "epoch": 2533} {"train_loss": -12.317270278930664, "global_step": 425594, "epoch": 2533} {"train_loss": -12.367987632751465, "global_step": 425595, "epoch": 2533} {"train_loss": -12.515970230102539, "global_step": 425596, "epoch": 2533} {"train_loss": -12.187376022338867, "global_step": 425597, "epoch": 2533} {"train_loss": -12.28317928314209, "global_step": 425598, "epoch": 2533} {"train_loss": -12.370468139648438, "global_step": 425599, "epoch": 2533} {"train_loss": -12.528036117553711, "global_step": 425600, "epoch": 2533} {"train_loss": -12.260713577270508, "global_step": 425601, "epoch": 2533} {"train_loss": -12.641733169555664, "global_step": 425602, "epoch": 2533} {"train_loss": -12.390913009643555, "global_step": 425603, "epoch": 2533} {"train_loss": -12.322378158569336, "global_step": 425604, "epoch": 2533} {"train_loss": -12.497223854064941, "global_step": 425605, "epoch": 2533} {"train_loss": -12.233732223510742, "global_step": 425606, "epoch": 2533} {"train_loss": -12.467230796813965, "global_step": 425607, "epoch": 2533} {"train_loss": -12.591803550720215, "global_step": 425608, "epoch": 2533} {"train_loss": -12.621269226074219, "global_step": 425609, "epoch": 2533} {"train_loss": -12.398527145385742, "global_step": 425610, "epoch": 2533} {"train_loss": -12.423626899719238, "global_step": 425611, "epoch": 2533} {"train_loss": -12.385259628295898, "global_step": 425612, "epoch": 2533} {"train_loss": -12.572572708129883, "global_step": 425613, "epoch": 2533} {"train_loss": -12.719481468200684, "global_step": 425614, "epoch": 2533} {"train_loss": -12.683965682983398, "global_step": 425615, "epoch": 2533} {"train_loss": -12.482795715332031, "global_step": 425616, "epoch": 2533} {"train_loss": -12.855237007141113, "global_step": 425617, "epoch": 2533} {"train_loss": -12.64468765258789, "global_step": 425618, "epoch": 2533} {"train_loss": -12.688068389892578, "global_step": 425619, "epoch": 2533} {"train_loss": -12.780743598937988, "global_step": 425620, "epoch": 2533} {"train_loss": -12.674456596374512, "global_step": 425621, "epoch": 2533} {"train_loss": -12.77659797668457, "global_step": 425622, "epoch": 2533} {"train_loss": -12.69070053100586, "global_step": 425623, "epoch": 2533} {"train_loss": -12.808073997497559, "global_step": 425624, "epoch": 2533} {"train_loss": -12.657675743103027, "global_step": 425625, "epoch": 2533} {"train_loss": -12.835896492004395, "global_step": 425626, "epoch": 2533} {"train_loss": -12.710041046142578, "global_step": 425627, "epoch": 2533} {"train_loss": -12.38371467590332, "global_step": 425628, "epoch": 2533} {"train_loss": -12.911996841430664, "global_step": 425629, "epoch": 2533} {"train_loss": -12.534427642822266, "global_step": 425630, "epoch": 2533} {"train_loss": -12.657855033874512, "global_step": 425631, "epoch": 2533} {"train_loss": -12.681302070617676, "global_step": 425632, "epoch": 2533} {"train_loss": -12.385337829589844, "global_step": 425633, "epoch": 2533} {"train_loss": -13.04589557647705, "global_step": 425634, "epoch": 2533} {"train_loss": -12.640302658081055, "global_step": 425635, "epoch": 2533} {"train_loss": -12.618022918701172, "global_step": 425636, "epoch": 2533} {"train_loss": -12.803749084472656, "global_step": 425637, "epoch": 2533} {"train_loss": -12.751985549926758, "global_step": 425638, "epoch": 2533} {"train_loss": -12.382913589477539, "global_step": 425639, "epoch": 2533} {"train_loss": -12.742740631103516, "global_step": 425640, "epoch": 2533} {"train_loss": -12.620857238769531, "global_step": 425641, "epoch": 2533} {"train_loss": -12.585958480834961, "global_step": 425642, "epoch": 2533} {"train_loss": -12.30246353149414, "global_step": 425643, "epoch": 2533} {"train_loss": -12.717784881591797, "global_step": 425644, "epoch": 2533} {"train_loss": -12.43940258026123, "global_step": 425645, "epoch": 2533} {"train_loss": -12.704303741455078, "global_step": 425646, "epoch": 2533} {"train_loss": -12.582448959350586, "global_step": 425647, "epoch": 2533} {"train_loss": -12.399555206298828, "global_step": 425648, "epoch": 2533} {"train_loss": -12.65809154510498, "global_step": 425649, "epoch": 2533} {"train_loss": -12.43592643737793, "global_step": 425650, "epoch": 2533} {"train_loss": -12.567928314208984, "global_step": 425651, "epoch": 2533} {"train_loss": -12.82992172241211, "global_step": 425652, "epoch": 2533} {"train_loss": -12.759729385375977, "global_step": 425653, "epoch": 2533} {"train_loss": -12.616159439086914, "global_step": 425654, "epoch": 2533} {"train_loss": -12.30219841003418, "global_step": 425655, "epoch": 2533} {"train_loss": -11.891406059265137, "global_step": 425656, "epoch": 2533} {"train_loss": -12.424509048461914, "global_step": 425657, "epoch": 2533} {"train_loss": -12.450374603271484, "global_step": 425658, "epoch": 2533} {"train_loss": -12.478079795837402, "global_step": 425659, "epoch": 2533} {"train_loss": -12.357641220092773, "global_step": 425660, "epoch": 2533} {"train_loss": -12.311214447021484, "global_step": 425661, "epoch": 2533} {"train_loss": -12.06418514251709, "global_step": 425662, "epoch": 2533} {"train_loss": -12.594623565673828, "global_step": 425663, "epoch": 2533} {"train_loss": -11.77013874053955, "global_step": 425664, "epoch": 2533} {"train_loss": -11.934932708740234, "global_step": 425665, "epoch": 2533} {"train_loss": -12.247882843017578, "global_step": 425666, "epoch": 2533} {"train_loss": -12.535456657409668, "global_step": 425667, "epoch": 2533} {"train_loss": -11.136966705322266, "global_step": 425668, "epoch": 2533} {"train_loss": -11.830825805664062, "global_step": 425669, "epoch": 2533} {"train_loss": -12.546006202697754, "global_step": 425670, "epoch": 2533} {"train_loss": -12.043954849243164, "global_step": 425671, "epoch": 2533} {"train_loss": -12.402048110961914, "global_step": 425672, "epoch": 2533} {"train_loss": -11.378253936767578, "global_step": 425673, "epoch": 2533} {"train_loss": -11.852654457092285, "global_step": 425674, "epoch": 2533} {"train_loss": -12.179553985595703, "global_step": 425675, "epoch": 2533} {"train_loss": -11.242546081542969, "global_step": 425676, "epoch": 2533} {"train_loss": -11.266195297241211, "global_step": 425677, "epoch": 2533} {"train_loss": -11.704819679260254, "global_step": 425678, "epoch": 2533} {"train_loss": -11.602522850036621, "global_step": 425679, "epoch": 2533} {"train_loss": -11.49795913696289, "global_step": 425680, "epoch": 2533} {"train_loss": -12.048006057739258, "global_step": 425681, "epoch": 2533} {"train_loss": -11.543943405151367, "global_step": 425682, "epoch": 2533} {"train_loss": -12.100915908813477, "global_step": 425683, "epoch": 2533} {"train_loss": -11.388727188110352, "global_step": 425684, "epoch": 2533} {"train_loss": -12.034438133239746, "global_step": 425685, "epoch": 2533} {"train_loss": -12.103740692138672, "global_step": 425686, "epoch": 2533} {"train_loss": -12.187797546386719, "global_step": 425687, "epoch": 2533} {"train_loss": -11.946205139160156, "global_step": 425688, "epoch": 2533} {"train_loss": -12.094058990478516, "global_step": 425689, "epoch": 2533} {"train_loss": -12.489140510559082, "global_step": 425690, "epoch": 2533} {"train_loss": -12.107587814331055, "global_step": 425691, "epoch": 2533} {"train_loss": -12.615901947021484, "global_step": 425692, "epoch": 2533} {"train_loss": -12.184779167175293, "global_step": 425693, "epoch": 2533} {"train_loss": -12.09389591217041, "global_step": 425694, "epoch": 2533} {"train_loss": -12.214210510253906, "global_step": 425695, "epoch": 2533} {"train_loss": -12.469889640808105, "global_step": 425696, "epoch": 2533} {"train_loss": -11.88601303100586, "global_step": 425697, "epoch": 2533} {"train_loss": -12.651578903198242, "global_step": 425698, "epoch": 2533} {"train_loss": -12.019827842712402, "global_step": 425699, "epoch": 2533} {"train_loss": -12.307577133178711, "global_step": 425700, "epoch": 2533} {"train_loss": -12.510852813720703, "global_step": 425701, "epoch": 2533} {"train_loss": -12.194402694702148, "global_step": 425702, "epoch": 2533} {"train_loss": -12.542900085449219, "global_step": 425703, "epoch": 2533} {"train_loss": -12.181753158569336, "global_step": 425704, "epoch": 2533} {"train_loss": -11.780961990356445, "global_step": 425705, "epoch": 2533} {"train_loss": -12.298357009887695, "global_step": 425706, "epoch": 2533} {"train_loss": -11.616012573242188, "global_step": 425707, "epoch": 2533} {"train_loss": -12.407249450683594, "global_step": 425708, "epoch": 2533} {"train_loss": -11.68378734588623, "global_step": 425709, "epoch": 2533} {"train_loss": -12.0053071975708, "global_step": 425710, "epoch": 2533} {"train_loss": -12.087129893757048, "global_step": 425711, "epoch": 2533, "val_loss": 307780.6875} {"train_loss": -11.631355285644531, "global_step": 425712, "epoch": 2534} {"train_loss": -12.233933448791504, "global_step": 425713, "epoch": 2534} {"train_loss": -11.928852081298828, "global_step": 425714, "epoch": 2534} {"train_loss": -11.896331787109375, "global_step": 425715, "epoch": 2534} {"train_loss": -12.240762710571289, "global_step": 425716, "epoch": 2534} {"train_loss": -12.238739013671875, "global_step": 425717, "epoch": 2534} {"train_loss": -12.174543380737305, "global_step": 425718, "epoch": 2534} {"train_loss": -12.561851501464844, "global_step": 425719, "epoch": 2534} {"train_loss": -12.293503761291504, "global_step": 425720, "epoch": 2534} {"train_loss": -12.360411643981934, "global_step": 425721, "epoch": 2534} {"train_loss": -12.16769790649414, "global_step": 425722, "epoch": 2534} {"train_loss": -12.63467025756836, "global_step": 425723, "epoch": 2534} {"train_loss": -12.451567649841309, "global_step": 425724, "epoch": 2534} {"train_loss": -12.486738204956055, "global_step": 425725, "epoch": 2534} {"train_loss": -12.48222827911377, "global_step": 425726, "epoch": 2534} {"train_loss": -12.363628387451172, "global_step": 425727, "epoch": 2534} {"train_loss": -12.638151168823242, "global_step": 425728, "epoch": 2534} {"train_loss": -12.595622062683105, "global_step": 425729, "epoch": 2534} {"train_loss": -12.446168899536133, "global_step": 425730, "epoch": 2534} {"train_loss": -12.611724853515625, "global_step": 425731, "epoch": 2534} {"train_loss": -12.681013107299805, "global_step": 425732, "epoch": 2534} {"train_loss": -12.637173652648926, "global_step": 425733, "epoch": 2534} {"train_loss": -12.538185119628906, "global_step": 425734, "epoch": 2534} {"train_loss": -12.589319229125977, "global_step": 425735, "epoch": 2534} {"train_loss": -11.894601821899414, "global_step": 425736, "epoch": 2534} {"train_loss": -12.668652534484863, "global_step": 425737, "epoch": 2534} {"train_loss": -12.795782089233398, "global_step": 425738, "epoch": 2534} {"train_loss": -12.566215515136719, "global_step": 425739, "epoch": 2534} {"train_loss": -12.365182876586914, "global_step": 425740, "epoch": 2534} {"train_loss": -12.506128311157227, "global_step": 425741, "epoch": 2534} {"train_loss": -12.520612716674805, "global_step": 425742, "epoch": 2534} {"train_loss": -12.867208480834961, "global_step": 425743, "epoch": 2534} {"train_loss": -12.380424499511719, "global_step": 425744, "epoch": 2534} {"train_loss": -12.96977424621582, "global_step": 425745, "epoch": 2534} {"train_loss": -12.767515182495117, "global_step": 425746, "epoch": 2534} {"train_loss": -12.473716735839844, "global_step": 425747, "epoch": 2534} {"train_loss": -12.444303512573242, "global_step": 425748, "epoch": 2534} {"train_loss": -12.846611976623535, "global_step": 425749, "epoch": 2534} {"train_loss": -12.631024360656738, "global_step": 425750, "epoch": 2534} {"train_loss": -12.622457504272461, "global_step": 425751, "epoch": 2534} {"train_loss": -12.354548454284668, "global_step": 425752, "epoch": 2534} {"train_loss": -12.749425888061523, "global_step": 425753, "epoch": 2534} {"train_loss": -12.78213119506836, "global_step": 425754, "epoch": 2534} {"train_loss": -12.65490436553955, "global_step": 425755, "epoch": 2534} {"train_loss": -12.731210708618164, "global_step": 425756, "epoch": 2534} {"train_loss": -12.589805603027344, "global_step": 425757, "epoch": 2534} {"train_loss": -12.580961227416992, "global_step": 425758, "epoch": 2534} {"train_loss": -12.66595458984375, "global_step": 425759, "epoch": 2534} {"train_loss": -12.574895858764648, "global_step": 425760, "epoch": 2534} {"train_loss": -12.620010375976562, "global_step": 425761, "epoch": 2534} {"train_loss": -12.831805229187012, "global_step": 425762, "epoch": 2534} {"train_loss": -12.667329788208008, "global_step": 425763, "epoch": 2534} {"train_loss": -12.808914184570312, "global_step": 425764, "epoch": 2534} {"train_loss": -12.574732780456543, "global_step": 425765, "epoch": 2534} {"train_loss": -12.65829849243164, "global_step": 425766, "epoch": 2534} {"train_loss": -12.557967185974121, "global_step": 425767, "epoch": 2534} {"train_loss": -12.231772422790527, "global_step": 425768, "epoch": 2534} {"train_loss": -11.722636222839355, "global_step": 425769, "epoch": 2534} {"train_loss": -11.529240608215332, "global_step": 425770, "epoch": 2534} {"train_loss": -10.938554763793945, "global_step": 425771, "epoch": 2534} {"train_loss": -9.009431838989258, "global_step": 425772, "epoch": 2534} {"train_loss": -9.248649597167969, "global_step": 425773, "epoch": 2534} {"train_loss": -11.619342803955078, "global_step": 425774, "epoch": 2534} {"train_loss": -8.759857177734375, "global_step": 425775, "epoch": 2534} {"train_loss": -9.648008346557617, "global_step": 425776, "epoch": 2534} {"train_loss": -9.636137008666992, "global_step": 425777, "epoch": 2534} {"train_loss": -9.058357238769531, "global_step": 425778, "epoch": 2534} {"train_loss": -8.361448287963867, "global_step": 425779, "epoch": 2534} {"train_loss": -11.286484718322754, "global_step": 425780, "epoch": 2534} {"train_loss": -11.411595344543457, "global_step": 425781, "epoch": 2534} {"train_loss": -10.529598236083984, "global_step": 425782, "epoch": 2534} {"train_loss": -10.692413330078125, "global_step": 425783, "epoch": 2534} {"train_loss": -10.917495727539062, "global_step": 425784, "epoch": 2534} {"train_loss": -10.235158920288086, "global_step": 425785, "epoch": 2534} {"train_loss": -11.31973648071289, "global_step": 425786, "epoch": 2534} {"train_loss": -10.48670768737793, "global_step": 425787, "epoch": 2534} {"train_loss": -11.771174430847168, "global_step": 425788, "epoch": 2534} {"train_loss": -10.644979476928711, "global_step": 425789, "epoch": 2534} {"train_loss": -11.705201148986816, "global_step": 425790, "epoch": 2534} {"train_loss": -11.55214786529541, "global_step": 425791, "epoch": 2534} {"train_loss": -11.115218162536621, "global_step": 425792, "epoch": 2534} {"train_loss": -11.857404708862305, "global_step": 425793, "epoch": 2534} {"train_loss": -11.148202896118164, "global_step": 425794, "epoch": 2534} {"train_loss": -11.77105712890625, "global_step": 425795, "epoch": 2534} {"train_loss": -11.409610748291016, "global_step": 425796, "epoch": 2534} {"train_loss": -11.799459457397461, "global_step": 425797, "epoch": 2534} {"train_loss": -11.583822250366211, "global_step": 425798, "epoch": 2534} {"train_loss": -11.868072509765625, "global_step": 425799, "epoch": 2534} {"train_loss": -11.478377342224121, "global_step": 425800, "epoch": 2534} {"train_loss": -11.841605186462402, "global_step": 425801, "epoch": 2534} {"train_loss": -11.720458984375, "global_step": 425802, "epoch": 2534} {"train_loss": -11.77004623413086, "global_step": 425803, "epoch": 2534} {"train_loss": -12.184261322021484, "global_step": 425804, "epoch": 2534} {"train_loss": -12.161723136901855, "global_step": 425805, "epoch": 2534} {"train_loss": -12.040456771850586, "global_step": 425806, "epoch": 2534} {"train_loss": -11.966520309448242, "global_step": 425807, "epoch": 2534} {"train_loss": -11.98859977722168, "global_step": 425808, "epoch": 2534} {"train_loss": -11.63618278503418, "global_step": 425809, "epoch": 2534} {"train_loss": -12.328533172607422, "global_step": 425810, "epoch": 2534} {"train_loss": -11.8670654296875, "global_step": 425811, "epoch": 2534} {"train_loss": -12.401229858398438, "global_step": 425812, "epoch": 2534} {"train_loss": -11.8421630859375, "global_step": 425813, "epoch": 2534} {"train_loss": -12.403907775878906, "global_step": 425814, "epoch": 2534} {"train_loss": -12.164461135864258, "global_step": 425815, "epoch": 2534} {"train_loss": -12.167059898376465, "global_step": 425816, "epoch": 2534} {"train_loss": -12.065034866333008, "global_step": 425817, "epoch": 2534} {"train_loss": -12.407905578613281, "global_step": 425818, "epoch": 2534} {"train_loss": -12.265986442565918, "global_step": 425819, "epoch": 2534} {"train_loss": -12.180194854736328, "global_step": 425820, "epoch": 2534} {"train_loss": -12.21644115447998, "global_step": 425821, "epoch": 2534} {"train_loss": -12.253096580505371, "global_step": 425822, "epoch": 2534} {"train_loss": -12.240833282470703, "global_step": 425823, "epoch": 2534} {"train_loss": -12.349274635314941, "global_step": 425824, "epoch": 2534} {"train_loss": -12.17612361907959, "global_step": 425825, "epoch": 2534} {"train_loss": -12.476069450378418, "global_step": 425826, "epoch": 2534} {"train_loss": -12.2236328125, "global_step": 425827, "epoch": 2534} {"train_loss": -12.391273498535156, "global_step": 425828, "epoch": 2534} {"train_loss": -12.300436973571777, "global_step": 425829, "epoch": 2534} {"train_loss": -12.189565658569336, "global_step": 425830, "epoch": 2534} {"train_loss": -12.088894844055176, "global_step": 425831, "epoch": 2534} {"train_loss": -12.50951862335205, "global_step": 425832, "epoch": 2534} {"train_loss": -11.955897331237793, "global_step": 425833, "epoch": 2534} {"train_loss": -12.234128952026367, "global_step": 425834, "epoch": 2534} {"train_loss": -12.047441482543945, "global_step": 425835, "epoch": 2534} {"train_loss": -11.77070426940918, "global_step": 425836, "epoch": 2534} {"train_loss": -12.567436218261719, "global_step": 425837, "epoch": 2534} {"train_loss": -12.16787338256836, "global_step": 425838, "epoch": 2534} {"train_loss": -12.0548677444458, "global_step": 425839, "epoch": 2534} {"train_loss": -12.557104110717773, "global_step": 425840, "epoch": 2534} {"train_loss": -12.006875991821289, "global_step": 425841, "epoch": 2534} {"train_loss": -12.395400047302246, "global_step": 425842, "epoch": 2534} {"train_loss": -12.414117813110352, "global_step": 425843, "epoch": 2534} {"train_loss": -12.294870376586914, "global_step": 425844, "epoch": 2534} {"train_loss": -12.255868911743164, "global_step": 425845, "epoch": 2534} {"train_loss": -12.597336769104004, "global_step": 425846, "epoch": 2534} {"train_loss": -12.537067413330078, "global_step": 425847, "epoch": 2534} {"train_loss": -12.060770034790039, "global_step": 425848, "epoch": 2534} {"train_loss": -12.79454231262207, "global_step": 425849, "epoch": 2534} {"train_loss": -12.371118545532227, "global_step": 425850, "epoch": 2534} {"train_loss": -12.745210647583008, "global_step": 425851, "epoch": 2534} {"train_loss": -12.191812515258789, "global_step": 425852, "epoch": 2534} {"train_loss": -12.677759170532227, "global_step": 425853, "epoch": 2534} {"train_loss": -12.444601058959961, "global_step": 425854, "epoch": 2534} {"train_loss": -12.513526916503906, "global_step": 425855, "epoch": 2534} {"train_loss": -12.341341972351074, "global_step": 425856, "epoch": 2534} {"train_loss": -12.331533432006836, "global_step": 425857, "epoch": 2534} {"train_loss": -12.521281242370605, "global_step": 425858, "epoch": 2534} {"train_loss": -12.344844818115234, "global_step": 425859, "epoch": 2534} {"train_loss": -11.833995819091797, "global_step": 425860, "epoch": 2534} {"train_loss": -12.527511596679688, "global_step": 425861, "epoch": 2534} {"train_loss": -12.278883934020996, "global_step": 425862, "epoch": 2534} {"train_loss": -12.520357131958008, "global_step": 425863, "epoch": 2534} {"train_loss": -12.486701965332031, "global_step": 425864, "epoch": 2534} {"train_loss": -12.721546173095703, "global_step": 425865, "epoch": 2534} {"train_loss": -12.639900207519531, "global_step": 425866, "epoch": 2534} {"train_loss": -12.219566345214844, "global_step": 425867, "epoch": 2534} {"train_loss": -12.626029968261719, "global_step": 425868, "epoch": 2534} {"train_loss": -12.471639633178711, "global_step": 425869, "epoch": 2534} {"train_loss": -12.668498992919922, "global_step": 425870, "epoch": 2534} {"train_loss": -12.281509399414062, "global_step": 425871, "epoch": 2534} {"train_loss": -12.39944076538086, "global_step": 425872, "epoch": 2534} {"train_loss": -12.533021926879883, "global_step": 425873, "epoch": 2534} {"train_loss": -12.382939338684082, "global_step": 425874, "epoch": 2534} {"train_loss": -11.987749099731445, "global_step": 425875, "epoch": 2534} {"train_loss": -12.580148696899414, "global_step": 425876, "epoch": 2534} {"train_loss": -12.24191951751709, "global_step": 425877, "epoch": 2534} {"train_loss": -12.288811683654785, "global_step": 425878, "epoch": 2534} {"train_loss": -12.074398182687306, "global_step": 425879, "epoch": 2534, "val_loss": 301077.375} {"train_loss": -12.299205780029297, "global_step": 425880, "epoch": 2535} {"train_loss": -11.790217399597168, "global_step": 425881, "epoch": 2535} {"train_loss": -12.222556114196777, "global_step": 425882, "epoch": 2535} {"train_loss": -12.226460456848145, "global_step": 425883, "epoch": 2535} {"train_loss": -12.147697448730469, "global_step": 425884, "epoch": 2535} {"train_loss": -11.780088424682617, "global_step": 425885, "epoch": 2535} {"train_loss": -12.309200286865234, "global_step": 425886, "epoch": 2535} {"train_loss": -12.47414493560791, "global_step": 425887, "epoch": 2535} {"train_loss": -12.4439058303833, "global_step": 425888, "epoch": 2535} {"train_loss": -12.285057067871094, "global_step": 425889, "epoch": 2535} {"train_loss": -12.662062644958496, "global_step": 425890, "epoch": 2535} {"train_loss": -12.428365707397461, "global_step": 425891, "epoch": 2535} {"train_loss": -12.415913581848145, "global_step": 425892, "epoch": 2535} {"train_loss": -12.6588134765625, "global_step": 425893, "epoch": 2535} {"train_loss": -12.57435131072998, "global_step": 425894, "epoch": 2535} {"train_loss": -12.574862480163574, "global_step": 425895, "epoch": 2535} {"train_loss": -12.474672317504883, "global_step": 425896, "epoch": 2535} {"train_loss": -12.60143756866455, "global_step": 425897, "epoch": 2535} {"train_loss": -12.056119918823242, "global_step": 425898, "epoch": 2535} {"train_loss": -12.787954330444336, "global_step": 425899, "epoch": 2535} {"train_loss": -12.159124374389648, "global_step": 425900, "epoch": 2535} {"train_loss": -12.377127647399902, "global_step": 425901, "epoch": 2535} {"train_loss": -12.086472511291504, "global_step": 425902, "epoch": 2535} {"train_loss": -12.589153289794922, "global_step": 425903, "epoch": 2535} {"train_loss": -12.109200477600098, "global_step": 425904, "epoch": 2535} {"train_loss": -12.065706253051758, "global_step": 425905, "epoch": 2535} {"train_loss": -12.284955024719238, "global_step": 425906, "epoch": 2535} {"train_loss": -11.320695877075195, "global_step": 425907, "epoch": 2535} {"train_loss": -12.145561218261719, "global_step": 425908, "epoch": 2535} {"train_loss": -11.562501907348633, "global_step": 425909, "epoch": 2535} {"train_loss": -11.368877410888672, "global_step": 425910, "epoch": 2535} {"train_loss": -11.793306350708008, "global_step": 425911, "epoch": 2535} {"train_loss": -12.19017219543457, "global_step": 425912, "epoch": 2535} {"train_loss": -11.915481567382812, "global_step": 425913, "epoch": 2535} {"train_loss": -11.396738052368164, "global_step": 425914, "epoch": 2535} {"train_loss": -12.212440490722656, "global_step": 425915, "epoch": 2535} {"train_loss": -11.104397773742676, "global_step": 425916, "epoch": 2535} {"train_loss": -12.049217224121094, "global_step": 425917, "epoch": 2535} {"train_loss": -11.560029983520508, "global_step": 425918, "epoch": 2535} {"train_loss": -12.218486785888672, "global_step": 425919, "epoch": 2535} {"train_loss": -12.581388473510742, "global_step": 425920, "epoch": 2535} {"train_loss": -12.031339645385742, "global_step": 425921, "epoch": 2535} {"train_loss": -12.318354606628418, "global_step": 425922, "epoch": 2535} {"train_loss": -11.903512001037598, "global_step": 425923, "epoch": 2535} {"train_loss": -12.148736953735352, "global_step": 425924, "epoch": 2535} {"train_loss": -11.95162582397461, "global_step": 425925, "epoch": 2535} {"train_loss": -12.000419616699219, "global_step": 425926, "epoch": 2535} {"train_loss": -12.669380187988281, "global_step": 425927, "epoch": 2535} {"train_loss": -12.251840591430664, "global_step": 425928, "epoch": 2535} {"train_loss": -12.237211227416992, "global_step": 425929, "epoch": 2535} {"train_loss": -11.751264572143555, "global_step": 425930, "epoch": 2535} {"train_loss": -12.444602966308594, "global_step": 425931, "epoch": 2535} {"train_loss": -12.276668548583984, "global_step": 425932, "epoch": 2535} {"train_loss": -12.38549518585205, "global_step": 425933, "epoch": 2535} {"train_loss": -12.530715942382812, "global_step": 425934, "epoch": 2535} {"train_loss": -12.151409149169922, "global_step": 425935, "epoch": 2535} {"train_loss": -12.147842407226562, "global_step": 425936, "epoch": 2535} {"train_loss": -12.104517936706543, "global_step": 425937, "epoch": 2535} {"train_loss": -12.765826225280762, "global_step": 425938, "epoch": 2535} {"train_loss": -12.252093315124512, "global_step": 425939, "epoch": 2535} {"train_loss": -11.97520637512207, "global_step": 425940, "epoch": 2535} {"train_loss": -12.560751914978027, "global_step": 425941, "epoch": 2535} {"train_loss": -12.204752922058105, "global_step": 425942, "epoch": 2535} {"train_loss": -12.47221565246582, "global_step": 425943, "epoch": 2535} {"train_loss": -12.174043655395508, "global_step": 425944, "epoch": 2535} {"train_loss": -11.820829391479492, "global_step": 425945, "epoch": 2535} {"train_loss": -12.259441375732422, "global_step": 425946, "epoch": 2535} {"train_loss": -11.838876724243164, "global_step": 425947, "epoch": 2535} {"train_loss": -11.529450416564941, "global_step": 425948, "epoch": 2535} {"train_loss": -10.320575714111328, "global_step": 425949, "epoch": 2535} {"train_loss": -10.688589096069336, "global_step": 425950, "epoch": 2535} {"train_loss": -11.461041450500488, "global_step": 425951, "epoch": 2535} {"train_loss": -11.17530632019043, "global_step": 425952, "epoch": 2535} {"train_loss": -10.735011100769043, "global_step": 425953, "epoch": 2535} {"train_loss": -10.885381698608398, "global_step": 425954, "epoch": 2535} {"train_loss": -10.331870079040527, "global_step": 425955, "epoch": 2535} {"train_loss": -10.098575592041016, "global_step": 425956, "epoch": 2535} {"train_loss": -9.441648483276367, "global_step": 425957, "epoch": 2535} {"train_loss": -11.220148086547852, "global_step": 425958, "epoch": 2535} {"train_loss": -9.76137924194336, "global_step": 425959, "epoch": 2535} {"train_loss": -11.795989990234375, "global_step": 425960, "epoch": 2535} {"train_loss": -11.087625503540039, "global_step": 425961, "epoch": 2535} {"train_loss": -11.483996391296387, "global_step": 425962, "epoch": 2535} {"train_loss": -11.677373886108398, "global_step": 425963, "epoch": 2535} {"train_loss": -10.467690467834473, "global_step": 425964, "epoch": 2535} {"train_loss": -10.762208938598633, "global_step": 425965, "epoch": 2535} {"train_loss": -9.881645202636719, "global_step": 425966, "epoch": 2535} {"train_loss": -11.706084251403809, "global_step": 425967, "epoch": 2535} {"train_loss": -10.77749252319336, "global_step": 425968, "epoch": 2535} {"train_loss": -11.61185073852539, "global_step": 425969, "epoch": 2535} {"train_loss": -10.858180046081543, "global_step": 425970, "epoch": 2535} {"train_loss": -12.1260404586792, "global_step": 425971, "epoch": 2535} {"train_loss": -11.408485412597656, "global_step": 425972, "epoch": 2535} {"train_loss": -11.91340446472168, "global_step": 425973, "epoch": 2535} {"train_loss": -11.431293487548828, "global_step": 425974, "epoch": 2535} {"train_loss": -12.391877174377441, "global_step": 425975, "epoch": 2535} {"train_loss": -11.539619445800781, "global_step": 425976, "epoch": 2535} {"train_loss": -12.385308265686035, "global_step": 425977, "epoch": 2535} {"train_loss": -11.575971603393555, "global_step": 425978, "epoch": 2535} {"train_loss": -12.454344749450684, "global_step": 425979, "epoch": 2535} {"train_loss": -11.793510437011719, "global_step": 425980, "epoch": 2535} {"train_loss": -12.259758949279785, "global_step": 425981, "epoch": 2535} {"train_loss": -12.114553451538086, "global_step": 425982, "epoch": 2535} {"train_loss": -12.439557075500488, "global_step": 425983, "epoch": 2535} {"train_loss": -12.061126708984375, "global_step": 425984, "epoch": 2535} {"train_loss": -12.463897705078125, "global_step": 425985, "epoch": 2535} {"train_loss": -12.342499732971191, "global_step": 425986, "epoch": 2535} {"train_loss": -12.496456146240234, "global_step": 425987, "epoch": 2535} {"train_loss": -12.189220428466797, "global_step": 425988, "epoch": 2535} {"train_loss": -12.231454849243164, "global_step": 425989, "epoch": 2535} {"train_loss": -11.991388320922852, "global_step": 425990, "epoch": 2535} {"train_loss": -12.462064743041992, "global_step": 425991, "epoch": 2535} {"train_loss": -12.210526466369629, "global_step": 425992, "epoch": 2535} {"train_loss": -12.37051010131836, "global_step": 425993, "epoch": 2535} {"train_loss": -11.927297592163086, "global_step": 425994, "epoch": 2535} {"train_loss": -11.789794921875, "global_step": 425995, "epoch": 2535} {"train_loss": -11.981521606445312, "global_step": 425996, "epoch": 2535} {"train_loss": -12.029500961303711, "global_step": 425997, "epoch": 2535} {"train_loss": -11.768068313598633, "global_step": 425998, "epoch": 2535} {"train_loss": -12.13215446472168, "global_step": 425999, "epoch": 2535} {"train_loss": -11.608631134033203, "global_step": 426000, "epoch": 2535} {"train_loss": -11.737899780273438, "global_step": 426001, "epoch": 2535} {"train_loss": -12.021139144897461, "global_step": 426002, "epoch": 2535} {"train_loss": -11.456866264343262, "global_step": 426003, "epoch": 2535} {"train_loss": -12.076955795288086, "global_step": 426004, "epoch": 2535} {"train_loss": -11.315229415893555, "global_step": 426005, "epoch": 2535} {"train_loss": -12.370088577270508, "global_step": 426006, "epoch": 2535} {"train_loss": -11.669301986694336, "global_step": 426007, "epoch": 2535} {"train_loss": -11.854557991027832, "global_step": 426008, "epoch": 2535} {"train_loss": -12.187559127807617, "global_step": 426009, "epoch": 2535} {"train_loss": -11.89309310913086, "global_step": 426010, "epoch": 2535} {"train_loss": -12.41204833984375, "global_step": 426011, "epoch": 2535} {"train_loss": -12.088403701782227, "global_step": 426012, "epoch": 2535} {"train_loss": -12.33218765258789, "global_step": 426013, "epoch": 2535} {"train_loss": -11.702680587768555, "global_step": 426014, "epoch": 2535} {"train_loss": -12.435043334960938, "global_step": 426015, "epoch": 2535} {"train_loss": -12.04236125946045, "global_step": 426016, "epoch": 2535} {"train_loss": -12.420069694519043, "global_step": 426017, "epoch": 2535} {"train_loss": -12.170848846435547, "global_step": 426018, "epoch": 2535} {"train_loss": -12.272071838378906, "global_step": 426019, "epoch": 2535} {"train_loss": -12.330456733703613, "global_step": 426020, "epoch": 2535} {"train_loss": -12.595935821533203, "global_step": 426021, "epoch": 2535} {"train_loss": -12.204063415527344, "global_step": 426022, "epoch": 2535} {"train_loss": -12.437021255493164, "global_step": 426023, "epoch": 2535} {"train_loss": -12.58867073059082, "global_step": 426024, "epoch": 2535} {"train_loss": -12.39973258972168, "global_step": 426025, "epoch": 2535} {"train_loss": -12.592523574829102, "global_step": 426026, "epoch": 2535} {"train_loss": -12.301015853881836, "global_step": 426027, "epoch": 2535} {"train_loss": -12.364118576049805, "global_step": 426028, "epoch": 2535} {"train_loss": -12.240839004516602, "global_step": 426029, "epoch": 2535} {"train_loss": -12.353455543518066, "global_step": 426030, "epoch": 2535} {"train_loss": -12.514322280883789, "global_step": 426031, "epoch": 2535} {"train_loss": -12.460179328918457, "global_step": 426032, "epoch": 2535} {"train_loss": -12.652091979980469, "global_step": 426033, "epoch": 2535} {"train_loss": -12.580212593078613, "global_step": 426034, "epoch": 2535} {"train_loss": -12.663402557373047, "global_step": 426035, "epoch": 2535} {"train_loss": -12.428407669067383, "global_step": 426036, "epoch": 2535} {"train_loss": -12.523405075073242, "global_step": 426037, "epoch": 2535} {"train_loss": -12.53116226196289, "global_step": 426038, "epoch": 2535} {"train_loss": -12.66539478302002, "global_step": 426039, "epoch": 2535} {"train_loss": -12.618009567260742, "global_step": 426040, "epoch": 2535} {"train_loss": -12.636575698852539, "global_step": 426041, "epoch": 2535} {"train_loss": -12.677541732788086, "global_step": 426042, "epoch": 2535} {"train_loss": -12.553915023803711, "global_step": 426043, "epoch": 2535} {"train_loss": -12.645729064941406, "global_step": 426044, "epoch": 2535} {"train_loss": -12.569934844970703, "global_step": 426045, "epoch": 2535} {"train_loss": -12.634705543518066, "global_step": 426046, "epoch": 2535} {"train_loss": -12.013348868915013, "global_step": 426047, "epoch": 2535, "val_loss": 307736.65625, "train_action_mse_error": 1.379742980003357} {"train_loss": -12.800498962402344, "global_step": 426048, "epoch": 2536} {"train_loss": -12.681900024414062, "global_step": 426049, "epoch": 2536} {"train_loss": -12.702764511108398, "global_step": 426050, "epoch": 2536} {"train_loss": -12.777237892150879, "global_step": 426051, "epoch": 2536} {"train_loss": -12.664430618286133, "global_step": 426052, "epoch": 2536} {"train_loss": -12.591329574584961, "global_step": 426053, "epoch": 2536} {"train_loss": -12.72944450378418, "global_step": 426054, "epoch": 2536} {"train_loss": -12.354174613952637, "global_step": 426055, "epoch": 2536} {"train_loss": -12.48580551147461, "global_step": 426056, "epoch": 2536} {"train_loss": -12.430956840515137, "global_step": 426057, "epoch": 2536} {"train_loss": -12.124670028686523, "global_step": 426058, "epoch": 2536} {"train_loss": -12.548866271972656, "global_step": 426059, "epoch": 2536} {"train_loss": -12.198492050170898, "global_step": 426060, "epoch": 2536} {"train_loss": -12.66042709350586, "global_step": 426061, "epoch": 2536} {"train_loss": -12.356067657470703, "global_step": 426062, "epoch": 2536} {"train_loss": -12.627618789672852, "global_step": 426063, "epoch": 2536} {"train_loss": -12.492914199829102, "global_step": 426064, "epoch": 2536} {"train_loss": -12.377455711364746, "global_step": 426065, "epoch": 2536} {"train_loss": -12.524209976196289, "global_step": 426066, "epoch": 2536} {"train_loss": -12.477235794067383, "global_step": 426067, "epoch": 2536} {"train_loss": -12.537321090698242, "global_step": 426068, "epoch": 2536} {"train_loss": -12.261068344116211, "global_step": 426069, "epoch": 2536} {"train_loss": -12.387527465820312, "global_step": 426070, "epoch": 2536} {"train_loss": -12.02812385559082, "global_step": 426071, "epoch": 2536} {"train_loss": -12.441123962402344, "global_step": 426072, "epoch": 2536} {"train_loss": -11.854921340942383, "global_step": 426073, "epoch": 2536} {"train_loss": -12.078248023986816, "global_step": 426074, "epoch": 2536} {"train_loss": -11.566865921020508, "global_step": 426075, "epoch": 2536} {"train_loss": -12.511419296264648, "global_step": 426076, "epoch": 2536} {"train_loss": -11.085023880004883, "global_step": 426077, "epoch": 2536} {"train_loss": -12.075870513916016, "global_step": 426078, "epoch": 2536} {"train_loss": -11.767681121826172, "global_step": 426079, "epoch": 2536} {"train_loss": -11.512407302856445, "global_step": 426080, "epoch": 2536} {"train_loss": -12.214503288269043, "global_step": 426081, "epoch": 2536} {"train_loss": -11.12670612335205, "global_step": 426082, "epoch": 2536} {"train_loss": -11.097843170166016, "global_step": 426083, "epoch": 2536} {"train_loss": -12.371691703796387, "global_step": 426084, "epoch": 2536} {"train_loss": -10.128395080566406, "global_step": 426085, "epoch": 2536} {"train_loss": -11.315327644348145, "global_step": 426086, "epoch": 2536} {"train_loss": -11.488525390625, "global_step": 426087, "epoch": 2536} {"train_loss": -10.906595230102539, "global_step": 426088, "epoch": 2536} {"train_loss": -11.79316520690918, "global_step": 426089, "epoch": 2536} {"train_loss": -11.011480331420898, "global_step": 426090, "epoch": 2536} {"train_loss": -10.806146621704102, "global_step": 426091, "epoch": 2536} {"train_loss": -11.1048583984375, "global_step": 426092, "epoch": 2536} {"train_loss": -10.191883087158203, "global_step": 426093, "epoch": 2536} {"train_loss": -11.150054931640625, "global_step": 426094, "epoch": 2536} {"train_loss": -10.753131866455078, "global_step": 426095, "epoch": 2536} {"train_loss": -10.361358642578125, "global_step": 426096, "epoch": 2536} {"train_loss": -10.436372756958008, "global_step": 426097, "epoch": 2536} {"train_loss": -11.18493366241455, "global_step": 426098, "epoch": 2536} {"train_loss": -9.709026336669922, "global_step": 426099, "epoch": 2536} {"train_loss": -10.290447235107422, "global_step": 426100, "epoch": 2536} {"train_loss": -11.332530975341797, "global_step": 426101, "epoch": 2536} {"train_loss": -10.568815231323242, "global_step": 426102, "epoch": 2536} {"train_loss": -11.070932388305664, "global_step": 426103, "epoch": 2536} {"train_loss": -11.131568908691406, "global_step": 426104, "epoch": 2536} {"train_loss": -10.277414321899414, "global_step": 426105, "epoch": 2536} {"train_loss": -10.863237380981445, "global_step": 426106, "epoch": 2536} {"train_loss": -11.337064743041992, "global_step": 426107, "epoch": 2536} {"train_loss": -11.258994102478027, "global_step": 426108, "epoch": 2536} {"train_loss": -11.801494598388672, "global_step": 426109, "epoch": 2536} {"train_loss": -11.989510536193848, "global_step": 426110, "epoch": 2536} {"train_loss": -11.313297271728516, "global_step": 426111, "epoch": 2536} {"train_loss": -11.606341361999512, "global_step": 426112, "epoch": 2536} {"train_loss": -11.72613525390625, "global_step": 426113, "epoch": 2536} {"train_loss": -10.47310733795166, "global_step": 426114, "epoch": 2536} {"train_loss": -11.558431625366211, "global_step": 426115, "epoch": 2536} {"train_loss": -10.633980751037598, "global_step": 426116, "epoch": 2536} {"train_loss": -10.555948257446289, "global_step": 426117, "epoch": 2536} {"train_loss": -11.369159698486328, "global_step": 426118, "epoch": 2536} {"train_loss": -11.691465377807617, "global_step": 426119, "epoch": 2536} {"train_loss": -10.632351875305176, "global_step": 426120, "epoch": 2536} {"train_loss": -11.568422317504883, "global_step": 426121, "epoch": 2536} {"train_loss": -10.889768600463867, "global_step": 426122, "epoch": 2536} {"train_loss": -11.205177307128906, "global_step": 426123, "epoch": 2536} {"train_loss": -11.620412826538086, "global_step": 426124, "epoch": 2536} {"train_loss": -11.721735000610352, "global_step": 426125, "epoch": 2536} {"train_loss": -10.899526596069336, "global_step": 426126, "epoch": 2536} {"train_loss": -12.153504371643066, "global_step": 426127, "epoch": 2536} {"train_loss": -11.434876441955566, "global_step": 426128, "epoch": 2536} {"train_loss": -12.11678695678711, "global_step": 426129, "epoch": 2536} {"train_loss": -11.194982528686523, "global_step": 426130, "epoch": 2536} {"train_loss": -11.878254890441895, "global_step": 426131, "epoch": 2536} {"train_loss": -11.378543853759766, "global_step": 426132, "epoch": 2536} {"train_loss": -11.884910583496094, "global_step": 426133, "epoch": 2536} {"train_loss": -11.574213027954102, "global_step": 426134, "epoch": 2536} {"train_loss": -11.818586349487305, "global_step": 426135, "epoch": 2536} {"train_loss": -11.586946487426758, "global_step": 426136, "epoch": 2536} {"train_loss": -11.690038681030273, "global_step": 426137, "epoch": 2536} {"train_loss": -11.92236042022705, "global_step": 426138, "epoch": 2536} {"train_loss": -11.547113418579102, "global_step": 426139, "epoch": 2536} {"train_loss": -12.405603408813477, "global_step": 426140, "epoch": 2536} {"train_loss": -11.763632774353027, "global_step": 426141, "epoch": 2536} {"train_loss": -12.025627136230469, "global_step": 426142, "epoch": 2536} {"train_loss": -11.360442161560059, "global_step": 426143, "epoch": 2536} {"train_loss": -12.329172134399414, "global_step": 426144, "epoch": 2536} {"train_loss": -11.16977310180664, "global_step": 426145, "epoch": 2536} {"train_loss": -12.450550079345703, "global_step": 426146, "epoch": 2536} {"train_loss": -11.885479927062988, "global_step": 426147, "epoch": 2536} {"train_loss": -12.04882526397705, "global_step": 426148, "epoch": 2536} {"train_loss": -12.124095916748047, "global_step": 426149, "epoch": 2536} {"train_loss": -12.090588569641113, "global_step": 426150, "epoch": 2536} {"train_loss": -11.910293579101562, "global_step": 426151, "epoch": 2536} {"train_loss": -12.332775115966797, "global_step": 426152, "epoch": 2536} {"train_loss": -12.277034759521484, "global_step": 426153, "epoch": 2536} {"train_loss": -12.0377197265625, "global_step": 426154, "epoch": 2536} {"train_loss": -12.394603729248047, "global_step": 426155, "epoch": 2536} {"train_loss": -12.295275688171387, "global_step": 426156, "epoch": 2536} {"train_loss": -12.347969055175781, "global_step": 426157, "epoch": 2536} {"train_loss": -12.195293426513672, "global_step": 426158, "epoch": 2536} {"train_loss": -12.354288101196289, "global_step": 426159, "epoch": 2536} {"train_loss": -12.183349609375, "global_step": 426160, "epoch": 2536} {"train_loss": -12.396312713623047, "global_step": 426161, "epoch": 2536} {"train_loss": -12.199331283569336, "global_step": 426162, "epoch": 2536} {"train_loss": -12.28384780883789, "global_step": 426163, "epoch": 2536} {"train_loss": -12.393190383911133, "global_step": 426164, "epoch": 2536} {"train_loss": -12.457576751708984, "global_step": 426165, "epoch": 2536} {"train_loss": -12.581509590148926, "global_step": 426166, "epoch": 2536} {"train_loss": -12.329693794250488, "global_step": 426167, "epoch": 2536} {"train_loss": -12.519784927368164, "global_step": 426168, "epoch": 2536} {"train_loss": -12.439599990844727, "global_step": 426169, "epoch": 2536} {"train_loss": -12.6583251953125, "global_step": 426170, "epoch": 2536} {"train_loss": -12.621829986572266, "global_step": 426171, "epoch": 2536} {"train_loss": -12.713896751403809, "global_step": 426172, "epoch": 2536} {"train_loss": -12.619549751281738, "global_step": 426173, "epoch": 2536} {"train_loss": -12.604246139526367, "global_step": 426174, "epoch": 2536} {"train_loss": -12.579394340515137, "global_step": 426175, "epoch": 2536} {"train_loss": -12.502689361572266, "global_step": 426176, "epoch": 2536} {"train_loss": -12.393376350402832, "global_step": 426177, "epoch": 2536} {"train_loss": -12.627531051635742, "global_step": 426178, "epoch": 2536} {"train_loss": -12.607332229614258, "global_step": 426179, "epoch": 2536} {"train_loss": -12.481475830078125, "global_step": 426180, "epoch": 2536} {"train_loss": -12.645227432250977, "global_step": 426181, "epoch": 2536} {"train_loss": -12.516387939453125, "global_step": 426182, "epoch": 2536} {"train_loss": -12.553808212280273, "global_step": 426183, "epoch": 2536} {"train_loss": -12.802253723144531, "global_step": 426184, "epoch": 2536} {"train_loss": -12.739177703857422, "global_step": 426185, "epoch": 2536} {"train_loss": -12.508458137512207, "global_step": 426186, "epoch": 2536} {"train_loss": -12.5794677734375, "global_step": 426187, "epoch": 2536} {"train_loss": -12.807584762573242, "global_step": 426188, "epoch": 2536} {"train_loss": -12.701438903808594, "global_step": 426189, "epoch": 2536} {"train_loss": -12.801097869873047, "global_step": 426190, "epoch": 2536} {"train_loss": -12.739741325378418, "global_step": 426191, "epoch": 2536} {"train_loss": -12.647939682006836, "global_step": 426192, "epoch": 2536} {"train_loss": -12.769903182983398, "global_step": 426193, "epoch": 2536} {"train_loss": -12.705728530883789, "global_step": 426194, "epoch": 2536} {"train_loss": -12.665796279907227, "global_step": 426195, "epoch": 2536} {"train_loss": -12.870433807373047, "global_step": 426196, "epoch": 2536} {"train_loss": -12.903810501098633, "global_step": 426197, "epoch": 2536} {"train_loss": -12.707328796386719, "global_step": 426198, "epoch": 2536} {"train_loss": -12.799212455749512, "global_step": 426199, "epoch": 2536} {"train_loss": -12.677505493164062, "global_step": 426200, "epoch": 2536} {"train_loss": -12.707637786865234, "global_step": 426201, "epoch": 2536} {"train_loss": -12.580169677734375, "global_step": 426202, "epoch": 2536} {"train_loss": -12.618093490600586, "global_step": 426203, "epoch": 2536} {"train_loss": -12.62040901184082, "global_step": 426204, "epoch": 2536} {"train_loss": -12.683565139770508, "global_step": 426205, "epoch": 2536} {"train_loss": -12.667154312133789, "global_step": 426206, "epoch": 2536} {"train_loss": -12.714006423950195, "global_step": 426207, "epoch": 2536} {"train_loss": -12.623823165893555, "global_step": 426208, "epoch": 2536} {"train_loss": -12.875502586364746, "global_step": 426209, "epoch": 2536} {"train_loss": -12.708390235900879, "global_step": 426210, "epoch": 2536} {"train_loss": -12.68442440032959, "global_step": 426211, "epoch": 2536} {"train_loss": -12.640204429626465, "global_step": 426212, "epoch": 2536} {"train_loss": -12.669914245605469, "global_step": 426213, "epoch": 2536} {"train_loss": -12.712701797485352, "global_step": 426214, "epoch": 2536} {"train_loss": -12.011846962429228, "global_step": 426215, "epoch": 2536, "val_loss": 308052.65625} {"train_loss": -12.684887886047363, "global_step": 426216, "epoch": 2537} {"train_loss": -12.783592224121094, "global_step": 426217, "epoch": 2537} {"train_loss": -12.740184783935547, "global_step": 426218, "epoch": 2537} {"train_loss": -12.62106704711914, "global_step": 426219, "epoch": 2537} {"train_loss": -12.797419548034668, "global_step": 426220, "epoch": 2537} {"train_loss": -12.860898971557617, "global_step": 426221, "epoch": 2537} {"train_loss": -12.837604522705078, "global_step": 426222, "epoch": 2537} {"train_loss": -12.466974258422852, "global_step": 426223, "epoch": 2537} {"train_loss": -12.627384185791016, "global_step": 426224, "epoch": 2537} {"train_loss": -12.329931259155273, "global_step": 426225, "epoch": 2537} {"train_loss": -12.78901195526123, "global_step": 426226, "epoch": 2537} {"train_loss": -12.37457275390625, "global_step": 426227, "epoch": 2537} {"train_loss": -12.42721176147461, "global_step": 426228, "epoch": 2537} {"train_loss": -11.936115264892578, "global_step": 426229, "epoch": 2537} {"train_loss": -11.898102760314941, "global_step": 426230, "epoch": 2537} {"train_loss": -12.209894180297852, "global_step": 426231, "epoch": 2537} {"train_loss": -11.665916442871094, "global_step": 426232, "epoch": 2537} {"train_loss": -12.04518985748291, "global_step": 426233, "epoch": 2537} {"train_loss": -10.266229629516602, "global_step": 426234, "epoch": 2537} {"train_loss": -10.713813781738281, "global_step": 426235, "epoch": 2537} {"train_loss": -11.116503715515137, "global_step": 426236, "epoch": 2537} {"train_loss": -9.159815788269043, "global_step": 426237, "epoch": 2537} {"train_loss": -8.940164566040039, "global_step": 426238, "epoch": 2537} {"train_loss": -8.207581520080566, "global_step": 426239, "epoch": 2537} {"train_loss": -8.509015083312988, "global_step": 426240, "epoch": 2537} {"train_loss": -8.530752182006836, "global_step": 426241, "epoch": 2537} {"train_loss": -9.025337219238281, "global_step": 426242, "epoch": 2537} {"train_loss": -8.750049591064453, "global_step": 426243, "epoch": 2537} {"train_loss": -8.936351776123047, "global_step": 426244, "epoch": 2537} {"train_loss": -9.090200424194336, "global_step": 426245, "epoch": 2537} {"train_loss": -8.558982849121094, "global_step": 426246, "epoch": 2537} {"train_loss": -8.676324844360352, "global_step": 426247, "epoch": 2537} {"train_loss": -8.661685943603516, "global_step": 426248, "epoch": 2537} {"train_loss": -8.643696784973145, "global_step": 426249, "epoch": 2537} {"train_loss": -9.318431854248047, "global_step": 426250, "epoch": 2537} {"train_loss": -9.801655769348145, "global_step": 426251, "epoch": 2537} {"train_loss": -10.184290885925293, "global_step": 426252, "epoch": 2537} {"train_loss": -9.865243911743164, "global_step": 426253, "epoch": 2537} {"train_loss": -10.575520515441895, "global_step": 426254, "epoch": 2537} {"train_loss": -11.213851928710938, "global_step": 426255, "epoch": 2537} {"train_loss": -11.080839157104492, "global_step": 426256, "epoch": 2537} {"train_loss": -11.30417251586914, "global_step": 426257, "epoch": 2537} {"train_loss": -11.278030395507812, "global_step": 426258, "epoch": 2537} {"train_loss": -10.772500038146973, "global_step": 426259, "epoch": 2537} {"train_loss": -11.295000076293945, "global_step": 426260, "epoch": 2537} {"train_loss": -10.84494400024414, "global_step": 426261, "epoch": 2537} {"train_loss": -11.426944732666016, "global_step": 426262, "epoch": 2537} {"train_loss": -11.68474006652832, "global_step": 426263, "epoch": 2537} {"train_loss": -11.802461624145508, "global_step": 426264, "epoch": 2537} {"train_loss": -12.078349113464355, "global_step": 426265, "epoch": 2537} {"train_loss": -12.032633781433105, "global_step": 426266, "epoch": 2537} {"train_loss": -11.773539543151855, "global_step": 426267, "epoch": 2537} {"train_loss": -12.037633895874023, "global_step": 426268, "epoch": 2537} {"train_loss": -12.071267127990723, "global_step": 426269, "epoch": 2537} {"train_loss": -11.93728256225586, "global_step": 426270, "epoch": 2537} {"train_loss": -11.963111877441406, "global_step": 426271, "epoch": 2537} {"train_loss": -11.972769737243652, "global_step": 426272, "epoch": 2537} {"train_loss": -11.989112854003906, "global_step": 426273, "epoch": 2537} {"train_loss": -12.085329055786133, "global_step": 426274, "epoch": 2537} {"train_loss": -11.95048713684082, "global_step": 426275, "epoch": 2537} {"train_loss": -12.171603202819824, "global_step": 426276, "epoch": 2537} {"train_loss": -12.357475280761719, "global_step": 426277, "epoch": 2537} {"train_loss": -12.347530364990234, "global_step": 426278, "epoch": 2537} {"train_loss": -12.012615203857422, "global_step": 426279, "epoch": 2537} {"train_loss": -12.174331665039062, "global_step": 426280, "epoch": 2537} {"train_loss": -12.18673324584961, "global_step": 426281, "epoch": 2537} {"train_loss": -12.265151977539062, "global_step": 426282, "epoch": 2537} {"train_loss": -12.319957733154297, "global_step": 426283, "epoch": 2537} {"train_loss": -11.907997131347656, "global_step": 426284, "epoch": 2537} {"train_loss": -11.859922409057617, "global_step": 426285, "epoch": 2537} {"train_loss": -12.201387405395508, "global_step": 426286, "epoch": 2537} {"train_loss": -11.571949005126953, "global_step": 426287, "epoch": 2537} {"train_loss": -12.228534698486328, "global_step": 426288, "epoch": 2537} {"train_loss": -11.507112503051758, "global_step": 426289, "epoch": 2537} {"train_loss": -12.40001106262207, "global_step": 426290, "epoch": 2537} {"train_loss": -11.585512161254883, "global_step": 426291, "epoch": 2537} {"train_loss": -12.422070503234863, "global_step": 426292, "epoch": 2537} {"train_loss": -12.458158493041992, "global_step": 426293, "epoch": 2537} {"train_loss": -12.11920166015625, "global_step": 426294, "epoch": 2537} {"train_loss": -12.403860092163086, "global_step": 426295, "epoch": 2537} {"train_loss": -12.332182884216309, "global_step": 426296, "epoch": 2537} {"train_loss": -12.486237525939941, "global_step": 426297, "epoch": 2537} {"train_loss": -12.376657485961914, "global_step": 426298, "epoch": 2537} {"train_loss": -12.725953102111816, "global_step": 426299, "epoch": 2537} {"train_loss": -12.39328670501709, "global_step": 426300, "epoch": 2537} {"train_loss": -12.57614517211914, "global_step": 426301, "epoch": 2537} {"train_loss": -12.48007583618164, "global_step": 426302, "epoch": 2537} {"train_loss": -12.345285415649414, "global_step": 426303, "epoch": 2537} {"train_loss": -12.477819442749023, "global_step": 426304, "epoch": 2537} {"train_loss": -12.206356048583984, "global_step": 426305, "epoch": 2537} {"train_loss": -12.38215446472168, "global_step": 426306, "epoch": 2537} {"train_loss": -12.386301040649414, "global_step": 426307, "epoch": 2537} {"train_loss": -12.318456649780273, "global_step": 426308, "epoch": 2537} {"train_loss": -12.472258567810059, "global_step": 426309, "epoch": 2537} {"train_loss": -12.43065071105957, "global_step": 426310, "epoch": 2537} {"train_loss": -12.523983001708984, "global_step": 426311, "epoch": 2537} {"train_loss": -12.438060760498047, "global_step": 426312, "epoch": 2537} {"train_loss": -12.476670265197754, "global_step": 426313, "epoch": 2537} {"train_loss": -12.423043251037598, "global_step": 426314, "epoch": 2537} {"train_loss": -12.633031845092773, "global_step": 426315, "epoch": 2537} {"train_loss": -12.673823356628418, "global_step": 426316, "epoch": 2537} {"train_loss": -12.460466384887695, "global_step": 426317, "epoch": 2537} {"train_loss": -12.74897575378418, "global_step": 426318, "epoch": 2537} {"train_loss": -12.56601619720459, "global_step": 426319, "epoch": 2537} {"train_loss": -12.63973331451416, "global_step": 426320, "epoch": 2537} {"train_loss": -12.327540397644043, "global_step": 426321, "epoch": 2537} {"train_loss": -12.486050605773926, "global_step": 426322, "epoch": 2537} {"train_loss": -12.388821601867676, "global_step": 426323, "epoch": 2537} {"train_loss": -12.316861152648926, "global_step": 426324, "epoch": 2537} {"train_loss": -12.560233116149902, "global_step": 426325, "epoch": 2537} {"train_loss": -12.730533599853516, "global_step": 426326, "epoch": 2537} {"train_loss": -12.535654067993164, "global_step": 426327, "epoch": 2537} {"train_loss": -12.611326217651367, "global_step": 426328, "epoch": 2537} {"train_loss": -12.15414047241211, "global_step": 426329, "epoch": 2537} {"train_loss": -12.341864585876465, "global_step": 426330, "epoch": 2537} {"train_loss": -12.43421745300293, "global_step": 426331, "epoch": 2537} {"train_loss": -12.827339172363281, "global_step": 426332, "epoch": 2537} {"train_loss": -12.55708122253418, "global_step": 426333, "epoch": 2537} {"train_loss": -12.470487594604492, "global_step": 426334, "epoch": 2537} {"train_loss": -12.857885360717773, "global_step": 426335, "epoch": 2537} {"train_loss": -12.457712173461914, "global_step": 426336, "epoch": 2537} {"train_loss": -12.122906684875488, "global_step": 426337, "epoch": 2537} {"train_loss": -12.928342819213867, "global_step": 426338, "epoch": 2537} {"train_loss": -12.283326148986816, "global_step": 426339, "epoch": 2537} {"train_loss": -12.089681625366211, "global_step": 426340, "epoch": 2537} {"train_loss": -12.474855422973633, "global_step": 426341, "epoch": 2537} {"train_loss": -12.589839935302734, "global_step": 426342, "epoch": 2537} {"train_loss": -12.01699447631836, "global_step": 426343, "epoch": 2537} {"train_loss": -12.836305618286133, "global_step": 426344, "epoch": 2537} {"train_loss": -12.542171478271484, "global_step": 426345, "epoch": 2537} {"train_loss": -12.643665313720703, "global_step": 426346, "epoch": 2537} {"train_loss": -12.483901977539062, "global_step": 426347, "epoch": 2537} {"train_loss": -12.574132919311523, "global_step": 426348, "epoch": 2537} {"train_loss": -12.634429931640625, "global_step": 426349, "epoch": 2537} {"train_loss": -12.353985786437988, "global_step": 426350, "epoch": 2537} {"train_loss": -12.443314552307129, "global_step": 426351, "epoch": 2537} {"train_loss": -12.619429588317871, "global_step": 426352, "epoch": 2537} {"train_loss": -12.275314331054688, "global_step": 426353, "epoch": 2537} {"train_loss": -11.76305866241455, "global_step": 426354, "epoch": 2537} {"train_loss": -12.37709903717041, "global_step": 426355, "epoch": 2537} {"train_loss": -12.518150329589844, "global_step": 426356, "epoch": 2537} {"train_loss": -12.47535514831543, "global_step": 426357, "epoch": 2537} {"train_loss": -12.501174926757812, "global_step": 426358, "epoch": 2537} {"train_loss": -12.42903995513916, "global_step": 426359, "epoch": 2537} {"train_loss": -12.492250442504883, "global_step": 426360, "epoch": 2537} {"train_loss": -12.633769989013672, "global_step": 426361, "epoch": 2537} {"train_loss": -12.229259490966797, "global_step": 426362, "epoch": 2537} {"train_loss": -12.59304141998291, "global_step": 426363, "epoch": 2537} {"train_loss": -12.267980575561523, "global_step": 426364, "epoch": 2537} {"train_loss": -11.955384254455566, "global_step": 426365, "epoch": 2537} {"train_loss": -11.987245559692383, "global_step": 426366, "epoch": 2537} {"train_loss": -12.646585464477539, "global_step": 426367, "epoch": 2537} {"train_loss": -12.11915397644043, "global_step": 426368, "epoch": 2537} {"train_loss": -11.65631103515625, "global_step": 426369, "epoch": 2537} {"train_loss": -11.957283973693848, "global_step": 426370, "epoch": 2537} {"train_loss": -12.299028396606445, "global_step": 426371, "epoch": 2537} {"train_loss": -12.286222457885742, "global_step": 426372, "epoch": 2537} {"train_loss": -12.355548858642578, "global_step": 426373, "epoch": 2537} {"train_loss": -12.368083953857422, "global_step": 426374, "epoch": 2537} {"train_loss": -12.330333709716797, "global_step": 426375, "epoch": 2537} {"train_loss": -12.043689727783203, "global_step": 426376, "epoch": 2537} {"train_loss": -12.674507141113281, "global_step": 426377, "epoch": 2537} {"train_loss": -12.673057556152344, "global_step": 426378, "epoch": 2537} {"train_loss": -12.748433113098145, "global_step": 426379, "epoch": 2537} {"train_loss": -11.972975730895996, "global_step": 426380, "epoch": 2537} {"train_loss": -12.534910202026367, "global_step": 426381, "epoch": 2537} {"train_loss": -11.776849746704102, "global_step": 426382, "epoch": 2537} {"train_loss": -11.902041384152003, "global_step": 426383, "epoch": 2537, "val_loss": 299518.4375} {"train_loss": -10.226367950439453, "global_step": 426384, "epoch": 2538} {"train_loss": -12.264280319213867, "global_step": 426385, "epoch": 2538} {"train_loss": -11.902994155883789, "global_step": 426386, "epoch": 2538} {"train_loss": -11.588754653930664, "global_step": 426387, "epoch": 2538} {"train_loss": -11.401971817016602, "global_step": 426388, "epoch": 2538} {"train_loss": -12.475674629211426, "global_step": 426389, "epoch": 2538} {"train_loss": -11.356621742248535, "global_step": 426390, "epoch": 2538} {"train_loss": -11.944347381591797, "global_step": 426391, "epoch": 2538} {"train_loss": -11.588045120239258, "global_step": 426392, "epoch": 2538} {"train_loss": -11.221675872802734, "global_step": 426393, "epoch": 2538} {"train_loss": -12.058591842651367, "global_step": 426394, "epoch": 2538} {"train_loss": -11.413432121276855, "global_step": 426395, "epoch": 2538} {"train_loss": -11.247867584228516, "global_step": 426396, "epoch": 2538} {"train_loss": -10.882423400878906, "global_step": 426397, "epoch": 2538} {"train_loss": -11.83607292175293, "global_step": 426398, "epoch": 2538} {"train_loss": -11.608073234558105, "global_step": 426399, "epoch": 2538} {"train_loss": -11.819851875305176, "global_step": 426400, "epoch": 2538} {"train_loss": -11.564292907714844, "global_step": 426401, "epoch": 2538} {"train_loss": -11.65512466430664, "global_step": 426402, "epoch": 2538} {"train_loss": -12.08686351776123, "global_step": 426403, "epoch": 2538} {"train_loss": -12.294286727905273, "global_step": 426404, "epoch": 2538} {"train_loss": -11.639028549194336, "global_step": 426405, "epoch": 2538} {"train_loss": -11.914529800415039, "global_step": 426406, "epoch": 2538} {"train_loss": -12.048437118530273, "global_step": 426407, "epoch": 2538} {"train_loss": -11.289957046508789, "global_step": 426408, "epoch": 2538} {"train_loss": -11.95388412475586, "global_step": 426409, "epoch": 2538} {"train_loss": -10.549198150634766, "global_step": 426410, "epoch": 2538} {"train_loss": -11.989960670471191, "global_step": 426411, "epoch": 2538} {"train_loss": -10.782258987426758, "global_step": 426412, "epoch": 2538} {"train_loss": -11.986597061157227, "global_step": 426413, "epoch": 2538} {"train_loss": -11.326343536376953, "global_step": 426414, "epoch": 2538} {"train_loss": -12.02692985534668, "global_step": 426415, "epoch": 2538} {"train_loss": -11.709466934204102, "global_step": 426416, "epoch": 2538} {"train_loss": -11.632198333740234, "global_step": 426417, "epoch": 2538} {"train_loss": -12.046561241149902, "global_step": 426418, "epoch": 2538} {"train_loss": -12.068903923034668, "global_step": 426419, "epoch": 2538} {"train_loss": -12.357383728027344, "global_step": 426420, "epoch": 2538} {"train_loss": -11.391508102416992, "global_step": 426421, "epoch": 2538} {"train_loss": -12.120891571044922, "global_step": 426422, "epoch": 2538} {"train_loss": -11.631382942199707, "global_step": 426423, "epoch": 2538} {"train_loss": -11.826940536499023, "global_step": 426424, "epoch": 2538} {"train_loss": -11.51784896850586, "global_step": 426425, "epoch": 2538} {"train_loss": -11.91174602508545, "global_step": 426426, "epoch": 2538} {"train_loss": -11.492443084716797, "global_step": 426427, "epoch": 2538} {"train_loss": -12.54236125946045, "global_step": 426428, "epoch": 2538} {"train_loss": -11.490796089172363, "global_step": 426429, "epoch": 2538} {"train_loss": -11.835990905761719, "global_step": 426430, "epoch": 2538} {"train_loss": -11.256139755249023, "global_step": 426431, "epoch": 2538} {"train_loss": -11.59652042388916, "global_step": 426432, "epoch": 2538} {"train_loss": -10.681159973144531, "global_step": 426433, "epoch": 2538} {"train_loss": -12.162933349609375, "global_step": 426434, "epoch": 2538} {"train_loss": -10.697308540344238, "global_step": 426435, "epoch": 2538} {"train_loss": -11.171562194824219, "global_step": 426436, "epoch": 2538} {"train_loss": -11.304100036621094, "global_step": 426437, "epoch": 2538} {"train_loss": -10.449551582336426, "global_step": 426438, "epoch": 2538} {"train_loss": -11.929634094238281, "global_step": 426439, "epoch": 2538} {"train_loss": -9.92190170288086, "global_step": 426440, "epoch": 2538} {"train_loss": -10.606364250183105, "global_step": 426441, "epoch": 2538} {"train_loss": -10.299026489257812, "global_step": 426442, "epoch": 2538} {"train_loss": -11.73050308227539, "global_step": 426443, "epoch": 2538} {"train_loss": -10.271461486816406, "global_step": 426444, "epoch": 2538} {"train_loss": -11.79825496673584, "global_step": 426445, "epoch": 2538} {"train_loss": -10.791231155395508, "global_step": 426446, "epoch": 2538} {"train_loss": -11.708213806152344, "global_step": 426447, "epoch": 2538} {"train_loss": -11.154767990112305, "global_step": 426448, "epoch": 2538} {"train_loss": -11.293584823608398, "global_step": 426449, "epoch": 2538} {"train_loss": -11.077072143554688, "global_step": 426450, "epoch": 2538} {"train_loss": -11.623401641845703, "global_step": 426451, "epoch": 2538} {"train_loss": -11.144948959350586, "global_step": 426452, "epoch": 2538} {"train_loss": -11.641073226928711, "global_step": 426453, "epoch": 2538} {"train_loss": -11.211429595947266, "global_step": 426454, "epoch": 2538} {"train_loss": -11.894754409790039, "global_step": 426455, "epoch": 2538} {"train_loss": -11.117202758789062, "global_step": 426456, "epoch": 2538} {"train_loss": -11.51034927368164, "global_step": 426457, "epoch": 2538} {"train_loss": -11.978185653686523, "global_step": 426458, "epoch": 2538} {"train_loss": -11.999985694885254, "global_step": 426459, "epoch": 2538} {"train_loss": -12.077373504638672, "global_step": 426460, "epoch": 2538} {"train_loss": -11.928060531616211, "global_step": 426461, "epoch": 2538} {"train_loss": -12.116758346557617, "global_step": 426462, "epoch": 2538} {"train_loss": -11.903956413269043, "global_step": 426463, "epoch": 2538} {"train_loss": -12.302881240844727, "global_step": 426464, "epoch": 2538} {"train_loss": -11.756391525268555, "global_step": 426465, "epoch": 2538} {"train_loss": -12.325801849365234, "global_step": 426466, "epoch": 2538} {"train_loss": -11.996369361877441, "global_step": 426467, "epoch": 2538} {"train_loss": -12.141884803771973, "global_step": 426468, "epoch": 2538} {"train_loss": -11.753663063049316, "global_step": 426469, "epoch": 2538} {"train_loss": -12.097171783447266, "global_step": 426470, "epoch": 2538} {"train_loss": -11.931723594665527, "global_step": 426471, "epoch": 2538} {"train_loss": -12.167975425720215, "global_step": 426472, "epoch": 2538} {"train_loss": -11.555620193481445, "global_step": 426473, "epoch": 2538} {"train_loss": -12.090747833251953, "global_step": 426474, "epoch": 2538} {"train_loss": -11.898569107055664, "global_step": 426475, "epoch": 2538} {"train_loss": -12.121136665344238, "global_step": 426476, "epoch": 2538} {"train_loss": -12.226097106933594, "global_step": 426477, "epoch": 2538} {"train_loss": -12.343570709228516, "global_step": 426478, "epoch": 2538} {"train_loss": -12.570001602172852, "global_step": 426479, "epoch": 2538} {"train_loss": -12.214309692382812, "global_step": 426480, "epoch": 2538} {"train_loss": -12.472832679748535, "global_step": 426481, "epoch": 2538} {"train_loss": -12.37669563293457, "global_step": 426482, "epoch": 2538} {"train_loss": -12.50310230255127, "global_step": 426483, "epoch": 2538} {"train_loss": -12.400068283081055, "global_step": 426484, "epoch": 2538} {"train_loss": -12.501070022583008, "global_step": 426485, "epoch": 2538} {"train_loss": -12.251635551452637, "global_step": 426486, "epoch": 2538} {"train_loss": -12.101724624633789, "global_step": 426487, "epoch": 2538} {"train_loss": -12.52467155456543, "global_step": 426488, "epoch": 2538} {"train_loss": -12.003994941711426, "global_step": 426489, "epoch": 2538} {"train_loss": -12.458345413208008, "global_step": 426490, "epoch": 2538} {"train_loss": -12.204477310180664, "global_step": 426491, "epoch": 2538} {"train_loss": -12.466623306274414, "global_step": 426492, "epoch": 2538} {"train_loss": -12.413934707641602, "global_step": 426493, "epoch": 2538} {"train_loss": -12.47436237335205, "global_step": 426494, "epoch": 2538} {"train_loss": -12.677088737487793, "global_step": 426495, "epoch": 2538} {"train_loss": -12.407463073730469, "global_step": 426496, "epoch": 2538} {"train_loss": -12.607316970825195, "global_step": 426497, "epoch": 2538} {"train_loss": -12.512557029724121, "global_step": 426498, "epoch": 2538} {"train_loss": -12.509834289550781, "global_step": 426499, "epoch": 2538} {"train_loss": -12.344433784484863, "global_step": 426500, "epoch": 2538} {"train_loss": -11.915894508361816, "global_step": 426501, "epoch": 2538} {"train_loss": -12.15164852142334, "global_step": 426502, "epoch": 2538} {"train_loss": -12.247628211975098, "global_step": 426503, "epoch": 2538} {"train_loss": -12.028619766235352, "global_step": 426504, "epoch": 2538} {"train_loss": -12.351608276367188, "global_step": 426505, "epoch": 2538} {"train_loss": -12.254203796386719, "global_step": 426506, "epoch": 2538} {"train_loss": -12.343643188476562, "global_step": 426507, "epoch": 2538} {"train_loss": -12.125425338745117, "global_step": 426508, "epoch": 2538} {"train_loss": -12.268217086791992, "global_step": 426509, "epoch": 2538} {"train_loss": -12.418752670288086, "global_step": 426510, "epoch": 2538} {"train_loss": -11.426607131958008, "global_step": 426511, "epoch": 2538} {"train_loss": -11.984088897705078, "global_step": 426512, "epoch": 2538} {"train_loss": -12.327423095703125, "global_step": 426513, "epoch": 2538} {"train_loss": -11.971792221069336, "global_step": 426514, "epoch": 2538} {"train_loss": -12.449021339416504, "global_step": 426515, "epoch": 2538} {"train_loss": -12.119392395019531, "global_step": 426516, "epoch": 2538} {"train_loss": -12.345624923706055, "global_step": 426517, "epoch": 2538} {"train_loss": -12.064432144165039, "global_step": 426518, "epoch": 2538} {"train_loss": -12.086339950561523, "global_step": 426519, "epoch": 2538} {"train_loss": -12.544424057006836, "global_step": 426520, "epoch": 2538} {"train_loss": -12.324858665466309, "global_step": 426521, "epoch": 2538} {"train_loss": -12.382022857666016, "global_step": 426522, "epoch": 2538} {"train_loss": -12.271197319030762, "global_step": 426523, "epoch": 2538} {"train_loss": -12.404277801513672, "global_step": 426524, "epoch": 2538} {"train_loss": -12.082720756530762, "global_step": 426525, "epoch": 2538} {"train_loss": -12.389205932617188, "global_step": 426526, "epoch": 2538} {"train_loss": -12.515768051147461, "global_step": 426527, "epoch": 2538} {"train_loss": -12.558420181274414, "global_step": 426528, "epoch": 2538} {"train_loss": -12.553741455078125, "global_step": 426529, "epoch": 2538} {"train_loss": -12.447473526000977, "global_step": 426530, "epoch": 2538} {"train_loss": -12.525638580322266, "global_step": 426531, "epoch": 2538} {"train_loss": -12.63155460357666, "global_step": 426532, "epoch": 2538} {"train_loss": -12.542526245117188, "global_step": 426533, "epoch": 2538} {"train_loss": -12.540739059448242, "global_step": 426534, "epoch": 2538} {"train_loss": -12.676593780517578, "global_step": 426535, "epoch": 2538} {"train_loss": -12.537555694580078, "global_step": 426536, "epoch": 2538} {"train_loss": -12.619516372680664, "global_step": 426537, "epoch": 2538} {"train_loss": -12.56728458404541, "global_step": 426538, "epoch": 2538} {"train_loss": -12.766502380371094, "global_step": 426539, "epoch": 2538} {"train_loss": -12.563470840454102, "global_step": 426540, "epoch": 2538} {"train_loss": -12.581605911254883, "global_step": 426541, "epoch": 2538} {"train_loss": -12.630012512207031, "global_step": 426542, "epoch": 2538} {"train_loss": -12.706059455871582, "global_step": 426543, "epoch": 2538} {"train_loss": -12.823246955871582, "global_step": 426544, "epoch": 2538} {"train_loss": -12.721890449523926, "global_step": 426545, "epoch": 2538} {"train_loss": -12.782508850097656, "global_step": 426546, "epoch": 2538} {"train_loss": -12.794386863708496, "global_step": 426547, "epoch": 2538} {"train_loss": -12.594096183776855, "global_step": 426548, "epoch": 2538} {"train_loss": -12.647871971130371, "global_step": 426549, "epoch": 2538} {"train_loss": -12.52148151397705, "global_step": 426550, "epoch": 2538} {"train_loss": -11.963575834319705, "global_step": 426551, "epoch": 2538, "val_loss": 305122.46875} {"train_loss": -12.810628890991211, "global_step": 426552, "epoch": 2539} {"train_loss": -12.585521697998047, "global_step": 426553, "epoch": 2539} {"train_loss": -12.752046585083008, "global_step": 426554, "epoch": 2539} {"train_loss": -12.53525447845459, "global_step": 426555, "epoch": 2539} {"train_loss": -12.688106536865234, "global_step": 426556, "epoch": 2539} {"train_loss": -12.767131805419922, "global_step": 426557, "epoch": 2539} {"train_loss": -12.69288444519043, "global_step": 426558, "epoch": 2539} {"train_loss": -12.44162368774414, "global_step": 426559, "epoch": 2539} {"train_loss": -12.681159973144531, "global_step": 426560, "epoch": 2539} {"train_loss": -12.201181411743164, "global_step": 426561, "epoch": 2539} {"train_loss": -12.29380989074707, "global_step": 426562, "epoch": 2539} {"train_loss": -11.648122787475586, "global_step": 426563, "epoch": 2539} {"train_loss": -12.402585983276367, "global_step": 426564, "epoch": 2539} {"train_loss": -12.120333671569824, "global_step": 426565, "epoch": 2539} {"train_loss": -12.191911697387695, "global_step": 426566, "epoch": 2539} {"train_loss": -12.372537612915039, "global_step": 426567, "epoch": 2539} {"train_loss": -12.318574905395508, "global_step": 426568, "epoch": 2539} {"train_loss": -12.400081634521484, "global_step": 426569, "epoch": 2539} {"train_loss": -12.61172103881836, "global_step": 426570, "epoch": 2539} {"train_loss": -12.365103721618652, "global_step": 426571, "epoch": 2539} {"train_loss": -12.177131652832031, "global_step": 426572, "epoch": 2539} {"train_loss": -12.681295394897461, "global_step": 426573, "epoch": 2539} {"train_loss": -12.050045013427734, "global_step": 426574, "epoch": 2539} {"train_loss": -12.54393196105957, "global_step": 426575, "epoch": 2539} {"train_loss": -12.11578369140625, "global_step": 426576, "epoch": 2539} {"train_loss": -12.149595260620117, "global_step": 426577, "epoch": 2539} {"train_loss": -12.191423416137695, "global_step": 426578, "epoch": 2539} {"train_loss": -12.623712539672852, "global_step": 426579, "epoch": 2539} {"train_loss": -12.043096542358398, "global_step": 426580, "epoch": 2539} {"train_loss": -12.436811447143555, "global_step": 426581, "epoch": 2539} {"train_loss": -12.382206916809082, "global_step": 426582, "epoch": 2539} {"train_loss": -12.735267639160156, "global_step": 426583, "epoch": 2539} {"train_loss": -12.387508392333984, "global_step": 426584, "epoch": 2539} {"train_loss": -12.029415130615234, "global_step": 426585, "epoch": 2539} {"train_loss": -12.397520065307617, "global_step": 426586, "epoch": 2539} {"train_loss": -12.843433380126953, "global_step": 426587, "epoch": 2539} {"train_loss": -12.075639724731445, "global_step": 426588, "epoch": 2539} {"train_loss": -12.338764190673828, "global_step": 426589, "epoch": 2539} {"train_loss": -11.694267272949219, "global_step": 426590, "epoch": 2539} {"train_loss": -12.359003067016602, "global_step": 426591, "epoch": 2539} {"train_loss": -11.760854721069336, "global_step": 426592, "epoch": 2539} {"train_loss": -12.357762336730957, "global_step": 426593, "epoch": 2539} {"train_loss": -12.141450881958008, "global_step": 426594, "epoch": 2539} {"train_loss": -12.266178131103516, "global_step": 426595, "epoch": 2539} {"train_loss": -11.967103958129883, "global_step": 426596, "epoch": 2539} {"train_loss": -12.50917911529541, "global_step": 426597, "epoch": 2539} {"train_loss": -11.933486938476562, "global_step": 426598, "epoch": 2539} {"train_loss": -12.315650939941406, "global_step": 426599, "epoch": 2539} {"train_loss": -11.752998352050781, "global_step": 426600, "epoch": 2539} {"train_loss": -12.244460105895996, "global_step": 426601, "epoch": 2539} {"train_loss": -11.754542350769043, "global_step": 426602, "epoch": 2539} {"train_loss": -12.157820701599121, "global_step": 426603, "epoch": 2539} {"train_loss": -12.398439407348633, "global_step": 426604, "epoch": 2539} {"train_loss": -12.356183052062988, "global_step": 426605, "epoch": 2539} {"train_loss": -11.452803611755371, "global_step": 426606, "epoch": 2539} {"train_loss": -11.336925506591797, "global_step": 426607, "epoch": 2539} {"train_loss": -9.677669525146484, "global_step": 426608, "epoch": 2539} {"train_loss": -10.32229232788086, "global_step": 426609, "epoch": 2539} {"train_loss": -11.80422592163086, "global_step": 426610, "epoch": 2539} {"train_loss": -10.927867889404297, "global_step": 426611, "epoch": 2539} {"train_loss": -10.77325439453125, "global_step": 426612, "epoch": 2539} {"train_loss": -11.12251091003418, "global_step": 426613, "epoch": 2539} {"train_loss": -10.858692169189453, "global_step": 426614, "epoch": 2539} {"train_loss": -10.960884094238281, "global_step": 426615, "epoch": 2539} {"train_loss": -11.675198554992676, "global_step": 426616, "epoch": 2539} {"train_loss": -11.160884857177734, "global_step": 426617, "epoch": 2539} {"train_loss": -10.91427993774414, "global_step": 426618, "epoch": 2539} {"train_loss": -10.812335968017578, "global_step": 426619, "epoch": 2539} {"train_loss": -11.442743301391602, "global_step": 426620, "epoch": 2539} {"train_loss": -10.541492462158203, "global_step": 426621, "epoch": 2539} {"train_loss": -11.57994556427002, "global_step": 426622, "epoch": 2539} {"train_loss": -10.510169982910156, "global_step": 426623, "epoch": 2539} {"train_loss": -11.103515625, "global_step": 426624, "epoch": 2539} {"train_loss": -10.56002426147461, "global_step": 426625, "epoch": 2539} {"train_loss": -11.16435432434082, "global_step": 426626, "epoch": 2539} {"train_loss": -11.478178024291992, "global_step": 426627, "epoch": 2539} {"train_loss": -10.840540885925293, "global_step": 426628, "epoch": 2539} {"train_loss": -11.840621948242188, "global_step": 426629, "epoch": 2539} {"train_loss": -10.803333282470703, "global_step": 426630, "epoch": 2539} {"train_loss": -10.573739051818848, "global_step": 426631, "epoch": 2539} {"train_loss": -11.600977897644043, "global_step": 426632, "epoch": 2539} {"train_loss": -10.460590362548828, "global_step": 426633, "epoch": 2539} {"train_loss": -11.90112018585205, "global_step": 426634, "epoch": 2539} {"train_loss": -11.115720748901367, "global_step": 426635, "epoch": 2539} {"train_loss": -11.391222953796387, "global_step": 426636, "epoch": 2539} {"train_loss": -11.584449768066406, "global_step": 426637, "epoch": 2539} {"train_loss": -11.716009140014648, "global_step": 426638, "epoch": 2539} {"train_loss": -12.027624130249023, "global_step": 426639, "epoch": 2539} {"train_loss": -11.733713150024414, "global_step": 426640, "epoch": 2539} {"train_loss": -12.27515983581543, "global_step": 426641, "epoch": 2539} {"train_loss": -11.517230987548828, "global_step": 426642, "epoch": 2539} {"train_loss": -12.247392654418945, "global_step": 426643, "epoch": 2539} {"train_loss": -11.767690658569336, "global_step": 426644, "epoch": 2539} {"train_loss": -12.398893356323242, "global_step": 426645, "epoch": 2539} {"train_loss": -12.207351684570312, "global_step": 426646, "epoch": 2539} {"train_loss": -12.048364639282227, "global_step": 426647, "epoch": 2539} {"train_loss": -12.43179702758789, "global_step": 426648, "epoch": 2539} {"train_loss": -12.18001937866211, "global_step": 426649, "epoch": 2539} {"train_loss": -12.287130355834961, "global_step": 426650, "epoch": 2539} {"train_loss": -12.331981658935547, "global_step": 426651, "epoch": 2539} {"train_loss": -12.167339324951172, "global_step": 426652, "epoch": 2539} {"train_loss": -12.437501907348633, "global_step": 426653, "epoch": 2539} {"train_loss": -12.001974105834961, "global_step": 426654, "epoch": 2539} {"train_loss": -12.438499450683594, "global_step": 426655, "epoch": 2539} {"train_loss": -11.806513786315918, "global_step": 426656, "epoch": 2539} {"train_loss": -11.93325138092041, "global_step": 426657, "epoch": 2539} {"train_loss": -12.382930755615234, "global_step": 426658, "epoch": 2539} {"train_loss": -12.195155143737793, "global_step": 426659, "epoch": 2539} {"train_loss": -12.365131378173828, "global_step": 426660, "epoch": 2539} {"train_loss": -11.963044166564941, "global_step": 426661, "epoch": 2539} {"train_loss": -12.347134590148926, "global_step": 426662, "epoch": 2539} {"train_loss": -11.882339477539062, "global_step": 426663, "epoch": 2539} {"train_loss": -12.240459442138672, "global_step": 426664, "epoch": 2539} {"train_loss": -12.145503997802734, "global_step": 426665, "epoch": 2539} {"train_loss": -12.429024696350098, "global_step": 426666, "epoch": 2539} {"train_loss": -12.310529708862305, "global_step": 426667, "epoch": 2539} {"train_loss": -11.961446762084961, "global_step": 426668, "epoch": 2539} {"train_loss": -12.186053276062012, "global_step": 426669, "epoch": 2539} {"train_loss": -11.9210786819458, "global_step": 426670, "epoch": 2539} {"train_loss": -12.273953437805176, "global_step": 426671, "epoch": 2539} {"train_loss": -12.26623249053955, "global_step": 426672, "epoch": 2539} {"train_loss": -12.377836227416992, "global_step": 426673, "epoch": 2539} {"train_loss": -12.36685848236084, "global_step": 426674, "epoch": 2539} {"train_loss": -12.437522888183594, "global_step": 426675, "epoch": 2539} {"train_loss": -12.261862754821777, "global_step": 426676, "epoch": 2539} {"train_loss": -12.4251708984375, "global_step": 426677, "epoch": 2539} {"train_loss": -11.805912971496582, "global_step": 426678, "epoch": 2539} {"train_loss": -12.716384887695312, "global_step": 426679, "epoch": 2539} {"train_loss": -12.226637840270996, "global_step": 426680, "epoch": 2539} {"train_loss": -12.53152084350586, "global_step": 426681, "epoch": 2539} {"train_loss": -12.517498970031738, "global_step": 426682, "epoch": 2539} {"train_loss": -11.8963623046875, "global_step": 426683, "epoch": 2539} {"train_loss": -12.346696853637695, "global_step": 426684, "epoch": 2539} {"train_loss": -12.207740783691406, "global_step": 426685, "epoch": 2539} {"train_loss": -12.312681198120117, "global_step": 426686, "epoch": 2539} {"train_loss": -12.244272232055664, "global_step": 426687, "epoch": 2539} {"train_loss": -12.090839385986328, "global_step": 426688, "epoch": 2539} {"train_loss": -12.409704208374023, "global_step": 426689, "epoch": 2539} {"train_loss": -12.233272552490234, "global_step": 426690, "epoch": 2539} {"train_loss": -12.390039443969727, "global_step": 426691, "epoch": 2539} {"train_loss": -12.454865455627441, "global_step": 426692, "epoch": 2539} {"train_loss": -12.372771263122559, "global_step": 426693, "epoch": 2539} {"train_loss": -12.558050155639648, "global_step": 426694, "epoch": 2539} {"train_loss": -12.243560791015625, "global_step": 426695, "epoch": 2539} {"train_loss": -12.481057167053223, "global_step": 426696, "epoch": 2539} {"train_loss": -12.20089054107666, "global_step": 426697, "epoch": 2539} {"train_loss": -12.345479965209961, "global_step": 426698, "epoch": 2539} {"train_loss": -12.442606925964355, "global_step": 426699, "epoch": 2539} {"train_loss": -12.343033790588379, "global_step": 426700, "epoch": 2539} {"train_loss": -12.202641487121582, "global_step": 426701, "epoch": 2539} {"train_loss": -12.244331359863281, "global_step": 426702, "epoch": 2539} {"train_loss": -12.425848007202148, "global_step": 426703, "epoch": 2539} {"train_loss": -11.95450210571289, "global_step": 426704, "epoch": 2539} {"train_loss": -12.373757362365723, "global_step": 426705, "epoch": 2539} {"train_loss": -12.133119583129883, "global_step": 426706, "epoch": 2539} {"train_loss": -12.6617431640625, "global_step": 426707, "epoch": 2539} {"train_loss": -11.57653522491455, "global_step": 426708, "epoch": 2539} {"train_loss": -12.67591381072998, "global_step": 426709, "epoch": 2539} {"train_loss": -11.583999633789062, "global_step": 426710, "epoch": 2539} {"train_loss": -12.542433738708496, "global_step": 426711, "epoch": 2539} {"train_loss": -11.350603103637695, "global_step": 426712, "epoch": 2539} {"train_loss": -12.77180290222168, "global_step": 426713, "epoch": 2539} {"train_loss": -11.520452499389648, "global_step": 426714, "epoch": 2539} {"train_loss": -12.070068359375, "global_step": 426715, "epoch": 2539} {"train_loss": -11.584224700927734, "global_step": 426716, "epoch": 2539} {"train_loss": -11.359918594360352, "global_step": 426717, "epoch": 2539} {"train_loss": -12.221646308898926, "global_step": 426718, "epoch": 2539} {"train_loss": -12.014961168879555, "global_step": 426719, "epoch": 2539, "val_loss": 306834.375} {"train_loss": -11.742039680480957, "global_step": 426720, "epoch": 2540} {"train_loss": -12.24832534790039, "global_step": 426721, "epoch": 2540} {"train_loss": -11.768465995788574, "global_step": 426722, "epoch": 2540} {"train_loss": -11.575486183166504, "global_step": 426723, "epoch": 2540} {"train_loss": -11.773560523986816, "global_step": 426724, "epoch": 2540} {"train_loss": -11.699542045593262, "global_step": 426725, "epoch": 2540} {"train_loss": -11.877351760864258, "global_step": 426726, "epoch": 2540} {"train_loss": -12.13344669342041, "global_step": 426727, "epoch": 2540} {"train_loss": -11.128318786621094, "global_step": 426728, "epoch": 2540} {"train_loss": -10.889127731323242, "global_step": 426729, "epoch": 2540} {"train_loss": -10.912423133850098, "global_step": 426730, "epoch": 2540} {"train_loss": -12.053879737854004, "global_step": 426731, "epoch": 2540} {"train_loss": -12.194060325622559, "global_step": 426732, "epoch": 2540} {"train_loss": -11.784071922302246, "global_step": 426733, "epoch": 2540} {"train_loss": -12.17784595489502, "global_step": 426734, "epoch": 2540} {"train_loss": -11.433403015136719, "global_step": 426735, "epoch": 2540} {"train_loss": -12.307595252990723, "global_step": 426736, "epoch": 2540} {"train_loss": -12.024764060974121, "global_step": 426737, "epoch": 2540} {"train_loss": -12.377059936523438, "global_step": 426738, "epoch": 2540} {"train_loss": -12.336867332458496, "global_step": 426739, "epoch": 2540} {"train_loss": -12.481622695922852, "global_step": 426740, "epoch": 2540} {"train_loss": -12.243234634399414, "global_step": 426741, "epoch": 2540} {"train_loss": -11.930717468261719, "global_step": 426742, "epoch": 2540} {"train_loss": -11.970422744750977, "global_step": 426743, "epoch": 2540} {"train_loss": -12.252702713012695, "global_step": 426744, "epoch": 2540} {"train_loss": -12.361083984375, "global_step": 426745, "epoch": 2540} {"train_loss": -12.046029090881348, "global_step": 426746, "epoch": 2540} {"train_loss": -12.372111320495605, "global_step": 426747, "epoch": 2540} {"train_loss": -12.105009078979492, "global_step": 426748, "epoch": 2540} {"train_loss": -12.530168533325195, "global_step": 426749, "epoch": 2540} {"train_loss": -11.836006164550781, "global_step": 426750, "epoch": 2540} {"train_loss": -11.754966735839844, "global_step": 426751, "epoch": 2540} {"train_loss": -11.223771095275879, "global_step": 426752, "epoch": 2540} {"train_loss": -11.779375076293945, "global_step": 426753, "epoch": 2540} {"train_loss": -12.037040710449219, "global_step": 426754, "epoch": 2540} {"train_loss": -11.957036972045898, "global_step": 426755, "epoch": 2540} {"train_loss": -12.059608459472656, "global_step": 426756, "epoch": 2540} {"train_loss": -12.258134841918945, "global_step": 426757, "epoch": 2540} {"train_loss": -12.146364212036133, "global_step": 426758, "epoch": 2540} {"train_loss": -12.002546310424805, "global_step": 426759, "epoch": 2540} {"train_loss": -11.595796585083008, "global_step": 426760, "epoch": 2540} {"train_loss": -12.35318660736084, "global_step": 426761, "epoch": 2540} {"train_loss": -12.172343254089355, "global_step": 426762, "epoch": 2540} {"train_loss": -12.59049129486084, "global_step": 426763, "epoch": 2540} {"train_loss": -12.480962753295898, "global_step": 426764, "epoch": 2540} {"train_loss": -12.531570434570312, "global_step": 426765, "epoch": 2540} {"train_loss": -12.365212440490723, "global_step": 426766, "epoch": 2540} {"train_loss": -12.739054679870605, "global_step": 426767, "epoch": 2540} {"train_loss": -12.516782760620117, "global_step": 426768, "epoch": 2540} {"train_loss": -12.417652130126953, "global_step": 426769, "epoch": 2540} {"train_loss": -12.554570198059082, "global_step": 426770, "epoch": 2540} {"train_loss": -12.607893943786621, "global_step": 426771, "epoch": 2540} {"train_loss": -12.814451217651367, "global_step": 426772, "epoch": 2540} {"train_loss": -12.586573600769043, "global_step": 426773, "epoch": 2540} {"train_loss": -12.64590072631836, "global_step": 426774, "epoch": 2540} {"train_loss": -12.42641830444336, "global_step": 426775, "epoch": 2540} {"train_loss": -12.577336311340332, "global_step": 426776, "epoch": 2540} {"train_loss": -12.596883773803711, "global_step": 426777, "epoch": 2540} {"train_loss": -12.510162353515625, "global_step": 426778, "epoch": 2540} {"train_loss": -12.56562614440918, "global_step": 426779, "epoch": 2540} {"train_loss": -12.692231178283691, "global_step": 426780, "epoch": 2540} {"train_loss": -12.804537773132324, "global_step": 426781, "epoch": 2540} {"train_loss": -12.430891990661621, "global_step": 426782, "epoch": 2540} {"train_loss": -12.667247772216797, "global_step": 426783, "epoch": 2540} {"train_loss": -12.448720932006836, "global_step": 426784, "epoch": 2540} {"train_loss": -12.502622604370117, "global_step": 426785, "epoch": 2540} {"train_loss": -12.782607078552246, "global_step": 426786, "epoch": 2540} {"train_loss": -12.72933578491211, "global_step": 426787, "epoch": 2540} {"train_loss": -12.597188949584961, "global_step": 426788, "epoch": 2540} {"train_loss": -12.637735366821289, "global_step": 426789, "epoch": 2540} {"train_loss": -12.640508651733398, "global_step": 426790, "epoch": 2540} {"train_loss": -12.787086486816406, "global_step": 426791, "epoch": 2540} {"train_loss": -12.854963302612305, "global_step": 426792, "epoch": 2540} {"train_loss": -12.770930290222168, "global_step": 426793, "epoch": 2540} {"train_loss": -12.59196662902832, "global_step": 426794, "epoch": 2540} {"train_loss": -12.453454971313477, "global_step": 426795, "epoch": 2540} {"train_loss": -12.585780143737793, "global_step": 426796, "epoch": 2540} {"train_loss": -12.497797012329102, "global_step": 426797, "epoch": 2540} {"train_loss": -12.293240547180176, "global_step": 426798, "epoch": 2540} {"train_loss": -12.777896881103516, "global_step": 426799, "epoch": 2540} {"train_loss": -11.892285346984863, "global_step": 426800, "epoch": 2540} {"train_loss": -11.38284969329834, "global_step": 426801, "epoch": 2540} {"train_loss": -11.803703308105469, "global_step": 426802, "epoch": 2540} {"train_loss": -12.112176895141602, "global_step": 426803, "epoch": 2540} {"train_loss": -12.429800033569336, "global_step": 426804, "epoch": 2540} {"train_loss": -12.478294372558594, "global_step": 426805, "epoch": 2540} {"train_loss": -12.542922973632812, "global_step": 426806, "epoch": 2540} {"train_loss": -12.639455795288086, "global_step": 426807, "epoch": 2540} {"train_loss": -12.557772636413574, "global_step": 426808, "epoch": 2540} {"train_loss": -12.779840469360352, "global_step": 426809, "epoch": 2540} {"train_loss": -12.059776306152344, "global_step": 426810, "epoch": 2540} {"train_loss": -11.723207473754883, "global_step": 426811, "epoch": 2540} {"train_loss": -12.670638084411621, "global_step": 426812, "epoch": 2540} {"train_loss": -11.678536415100098, "global_step": 426813, "epoch": 2540} {"train_loss": -11.719306945800781, "global_step": 426814, "epoch": 2540} {"train_loss": -12.638238906860352, "global_step": 426815, "epoch": 2540} {"train_loss": -11.444032669067383, "global_step": 426816, "epoch": 2540} {"train_loss": -11.659635543823242, "global_step": 426817, "epoch": 2540} {"train_loss": -11.683626174926758, "global_step": 426818, "epoch": 2540} {"train_loss": -11.831836700439453, "global_step": 426819, "epoch": 2540} {"train_loss": -12.309213638305664, "global_step": 426820, "epoch": 2540} {"train_loss": -11.680496215820312, "global_step": 426821, "epoch": 2540} {"train_loss": -11.803773880004883, "global_step": 426822, "epoch": 2540} {"train_loss": -12.11602783203125, "global_step": 426823, "epoch": 2540} {"train_loss": -12.201961517333984, "global_step": 426824, "epoch": 2540} {"train_loss": -11.861641883850098, "global_step": 426825, "epoch": 2540} {"train_loss": -12.319844245910645, "global_step": 426826, "epoch": 2540} {"train_loss": -12.31666374206543, "global_step": 426827, "epoch": 2540} {"train_loss": -12.303524017333984, "global_step": 426828, "epoch": 2540} {"train_loss": -12.242685317993164, "global_step": 426829, "epoch": 2540} {"train_loss": -11.933341979980469, "global_step": 426830, "epoch": 2540} {"train_loss": -11.016524314880371, "global_step": 426831, "epoch": 2540} {"train_loss": -12.087721824645996, "global_step": 426832, "epoch": 2540} {"train_loss": -11.68878173828125, "global_step": 426833, "epoch": 2540} {"train_loss": -11.872045516967773, "global_step": 426834, "epoch": 2540} {"train_loss": -12.027755737304688, "global_step": 426835, "epoch": 2540} {"train_loss": -11.898792266845703, "global_step": 426836, "epoch": 2540} {"train_loss": -12.449933052062988, "global_step": 426837, "epoch": 2540} {"train_loss": -11.374153137207031, "global_step": 426838, "epoch": 2540} {"train_loss": -11.57751750946045, "global_step": 426839, "epoch": 2540} {"train_loss": -11.345620155334473, "global_step": 426840, "epoch": 2540} {"train_loss": -11.744386672973633, "global_step": 426841, "epoch": 2540} {"train_loss": -11.302986145019531, "global_step": 426842, "epoch": 2540} {"train_loss": -11.663960456848145, "global_step": 426843, "epoch": 2540} {"train_loss": -11.29524040222168, "global_step": 426844, "epoch": 2540} {"train_loss": -11.895890235900879, "global_step": 426845, "epoch": 2540} {"train_loss": -10.3613920211792, "global_step": 426846, "epoch": 2540} {"train_loss": -11.876701354980469, "global_step": 426847, "epoch": 2540} {"train_loss": -11.126745223999023, "global_step": 426848, "epoch": 2540} {"train_loss": -10.994027137756348, "global_step": 426849, "epoch": 2540} {"train_loss": -12.325639724731445, "global_step": 426850, "epoch": 2540} {"train_loss": -10.792288780212402, "global_step": 426851, "epoch": 2540} {"train_loss": -12.282674789428711, "global_step": 426852, "epoch": 2540} {"train_loss": -10.893115997314453, "global_step": 426853, "epoch": 2540} {"train_loss": -10.608479499816895, "global_step": 426854, "epoch": 2540} {"train_loss": -10.82297134399414, "global_step": 426855, "epoch": 2540} {"train_loss": -11.332599639892578, "global_step": 426856, "epoch": 2540} {"train_loss": -10.848508834838867, "global_step": 426857, "epoch": 2540} {"train_loss": -11.413125991821289, "global_step": 426858, "epoch": 2540} {"train_loss": -11.148935317993164, "global_step": 426859, "epoch": 2540} {"train_loss": -10.98861312866211, "global_step": 426860, "epoch": 2540} {"train_loss": -11.771408081054688, "global_step": 426861, "epoch": 2540} {"train_loss": -11.328424453735352, "global_step": 426862, "epoch": 2540} {"train_loss": -11.862044334411621, "global_step": 426863, "epoch": 2540} {"train_loss": -11.302988052368164, "global_step": 426864, "epoch": 2540} {"train_loss": -12.208925247192383, "global_step": 426865, "epoch": 2540} {"train_loss": -10.41758918762207, "global_step": 426866, "epoch": 2540} {"train_loss": -12.247000694274902, "global_step": 426867, "epoch": 2540} {"train_loss": -10.11968994140625, "global_step": 426868, "epoch": 2540} {"train_loss": -12.16836166381836, "global_step": 426869, "epoch": 2540} {"train_loss": -10.675562858581543, "global_step": 426870, "epoch": 2540} {"train_loss": -11.505234718322754, "global_step": 426871, "epoch": 2540} {"train_loss": -9.993375778198242, "global_step": 426872, "epoch": 2540} {"train_loss": -11.654068946838379, "global_step": 426873, "epoch": 2540} {"train_loss": -10.455411911010742, "global_step": 426874, "epoch": 2540} {"train_loss": -12.291339874267578, "global_step": 426875, "epoch": 2540} {"train_loss": -10.491552352905273, "global_step": 426876, "epoch": 2540} {"train_loss": -11.728882789611816, "global_step": 426877, "epoch": 2540} {"train_loss": -11.106739044189453, "global_step": 426878, "epoch": 2540} {"train_loss": -11.976484298706055, "global_step": 426879, "epoch": 2540} {"train_loss": -10.882196426391602, "global_step": 426880, "epoch": 2540} {"train_loss": -12.116613388061523, "global_step": 426881, "epoch": 2540} {"train_loss": -11.517128944396973, "global_step": 426882, "epoch": 2540} {"train_loss": -11.887388229370117, "global_step": 426883, "epoch": 2540} {"train_loss": -11.917287826538086, "global_step": 426884, "epoch": 2540} {"train_loss": -12.24105453491211, "global_step": 426885, "epoch": 2540} {"train_loss": -11.980585098266602, "global_step": 426886, "epoch": 2540} {"train_loss": -11.950835721833366, "global_step": 426887, "epoch": 2540, "val_loss": 307783.21875, "train_action_mse_error": 1.2599436044692993} {"train_loss": -11.972116470336914, "global_step": 426888, "epoch": 2541} {"train_loss": -12.37724494934082, "global_step": 426889, "epoch": 2541} {"train_loss": -12.168351173400879, "global_step": 426890, "epoch": 2541} {"train_loss": -12.342469215393066, "global_step": 426891, "epoch": 2541} {"train_loss": -12.18795108795166, "global_step": 426892, "epoch": 2541} {"train_loss": -12.103736877441406, "global_step": 426893, "epoch": 2541} {"train_loss": -11.8967924118042, "global_step": 426894, "epoch": 2541} {"train_loss": -12.129556655883789, "global_step": 426895, "epoch": 2541} {"train_loss": -12.15157699584961, "global_step": 426896, "epoch": 2541} {"train_loss": -12.509258270263672, "global_step": 426897, "epoch": 2541} {"train_loss": -12.22618293762207, "global_step": 426898, "epoch": 2541} {"train_loss": -12.200027465820312, "global_step": 426899, "epoch": 2541} {"train_loss": -12.27053451538086, "global_step": 426900, "epoch": 2541} {"train_loss": -12.24050521850586, "global_step": 426901, "epoch": 2541} {"train_loss": -12.2887601852417, "global_step": 426902, "epoch": 2541} {"train_loss": -12.323352813720703, "global_step": 426903, "epoch": 2541} {"train_loss": -12.184099197387695, "global_step": 426904, "epoch": 2541} {"train_loss": -12.50741195678711, "global_step": 426905, "epoch": 2541} {"train_loss": -12.023078918457031, "global_step": 426906, "epoch": 2541} {"train_loss": -12.6161470413208, "global_step": 426907, "epoch": 2541} {"train_loss": -12.252538681030273, "global_step": 426908, "epoch": 2541} {"train_loss": -12.456704139709473, "global_step": 426909, "epoch": 2541} {"train_loss": -12.067634582519531, "global_step": 426910, "epoch": 2541} {"train_loss": -12.411376953125, "global_step": 426911, "epoch": 2541} {"train_loss": -12.465750694274902, "global_step": 426912, "epoch": 2541} {"train_loss": -12.528717041015625, "global_step": 426913, "epoch": 2541} {"train_loss": -12.51664924621582, "global_step": 426914, "epoch": 2541} {"train_loss": -12.44758129119873, "global_step": 426915, "epoch": 2541} {"train_loss": -12.49278450012207, "global_step": 426916, "epoch": 2541} {"train_loss": -12.291094779968262, "global_step": 426917, "epoch": 2541} {"train_loss": -12.532861709594727, "global_step": 426918, "epoch": 2541} {"train_loss": -12.442590713500977, "global_step": 426919, "epoch": 2541} {"train_loss": -12.862527847290039, "global_step": 426920, "epoch": 2541} {"train_loss": -12.658590316772461, "global_step": 426921, "epoch": 2541} {"train_loss": -12.584311485290527, "global_step": 426922, "epoch": 2541} {"train_loss": -12.845972061157227, "global_step": 426923, "epoch": 2541} {"train_loss": -12.472038269042969, "global_step": 426924, "epoch": 2541} {"train_loss": -12.75527572631836, "global_step": 426925, "epoch": 2541} {"train_loss": -12.484796524047852, "global_step": 426926, "epoch": 2541} {"train_loss": -12.664579391479492, "global_step": 426927, "epoch": 2541} {"train_loss": -12.697154998779297, "global_step": 426928, "epoch": 2541} {"train_loss": -12.68134880065918, "global_step": 426929, "epoch": 2541} {"train_loss": -12.607958793640137, "global_step": 426930, "epoch": 2541} {"train_loss": -12.659222602844238, "global_step": 426931, "epoch": 2541} {"train_loss": -12.755388259887695, "global_step": 426932, "epoch": 2541} {"train_loss": -12.462911605834961, "global_step": 426933, "epoch": 2541} {"train_loss": -12.665236473083496, "global_step": 426934, "epoch": 2541} {"train_loss": -12.815585136413574, "global_step": 426935, "epoch": 2541} {"train_loss": -12.49409008026123, "global_step": 426936, "epoch": 2541} {"train_loss": -12.967926025390625, "global_step": 426937, "epoch": 2541} {"train_loss": -12.31673526763916, "global_step": 426938, "epoch": 2541} {"train_loss": -12.353874206542969, "global_step": 426939, "epoch": 2541} {"train_loss": -12.618672370910645, "global_step": 426940, "epoch": 2541} {"train_loss": -12.115328788757324, "global_step": 426941, "epoch": 2541} {"train_loss": -12.45393180847168, "global_step": 426942, "epoch": 2541} {"train_loss": -12.365825653076172, "global_step": 426943, "epoch": 2541} {"train_loss": -12.276189804077148, "global_step": 426944, "epoch": 2541} {"train_loss": -12.68018627166748, "global_step": 426945, "epoch": 2541} {"train_loss": -11.855316162109375, "global_step": 426946, "epoch": 2541} {"train_loss": -12.693609237670898, "global_step": 426947, "epoch": 2541} {"train_loss": -12.246671676635742, "global_step": 426948, "epoch": 2541} {"train_loss": -12.654233932495117, "global_step": 426949, "epoch": 2541} {"train_loss": -12.326530456542969, "global_step": 426950, "epoch": 2541} {"train_loss": -12.419340133666992, "global_step": 426951, "epoch": 2541} {"train_loss": -12.649374008178711, "global_step": 426952, "epoch": 2541} {"train_loss": -12.579730987548828, "global_step": 426953, "epoch": 2541} {"train_loss": -12.192479133605957, "global_step": 426954, "epoch": 2541} {"train_loss": -12.229423522949219, "global_step": 426955, "epoch": 2541} {"train_loss": -12.487750053405762, "global_step": 426956, "epoch": 2541} {"train_loss": -12.367948532104492, "global_step": 426957, "epoch": 2541} {"train_loss": -12.51451587677002, "global_step": 426958, "epoch": 2541} {"train_loss": -12.793598175048828, "global_step": 426959, "epoch": 2541} {"train_loss": -12.70461654663086, "global_step": 426960, "epoch": 2541} {"train_loss": -12.561004638671875, "global_step": 426961, "epoch": 2541} {"train_loss": -12.666187286376953, "global_step": 426962, "epoch": 2541} {"train_loss": -12.577099800109863, "global_step": 426963, "epoch": 2541} {"train_loss": -12.441271781921387, "global_step": 426964, "epoch": 2541} {"train_loss": -12.670777320861816, "global_step": 426965, "epoch": 2541} {"train_loss": -12.368766784667969, "global_step": 426966, "epoch": 2541} {"train_loss": -12.163619995117188, "global_step": 426967, "epoch": 2541} {"train_loss": -12.676172256469727, "global_step": 426968, "epoch": 2541} {"train_loss": -12.25225830078125, "global_step": 426969, "epoch": 2541} {"train_loss": -12.367232322692871, "global_step": 426970, "epoch": 2541} {"train_loss": -12.306364059448242, "global_step": 426971, "epoch": 2541} {"train_loss": -12.392375946044922, "global_step": 426972, "epoch": 2541} {"train_loss": -11.841190338134766, "global_step": 426973, "epoch": 2541} {"train_loss": -12.279947280883789, "global_step": 426974, "epoch": 2541} {"train_loss": -11.72443962097168, "global_step": 426975, "epoch": 2541} {"train_loss": -11.725139617919922, "global_step": 426976, "epoch": 2541} {"train_loss": -11.791902542114258, "global_step": 426977, "epoch": 2541} {"train_loss": -12.525117874145508, "global_step": 426978, "epoch": 2541} {"train_loss": -11.852170944213867, "global_step": 426979, "epoch": 2541} {"train_loss": -12.279460906982422, "global_step": 426980, "epoch": 2541} {"train_loss": -12.4764986038208, "global_step": 426981, "epoch": 2541} {"train_loss": -11.819426536560059, "global_step": 426982, "epoch": 2541} {"train_loss": -12.70788860321045, "global_step": 426983, "epoch": 2541} {"train_loss": -12.30037784576416, "global_step": 426984, "epoch": 2541} {"train_loss": -12.318771362304688, "global_step": 426985, "epoch": 2541} {"train_loss": -12.148168563842773, "global_step": 426986, "epoch": 2541} {"train_loss": -12.612802505493164, "global_step": 426987, "epoch": 2541} {"train_loss": -12.004131317138672, "global_step": 426988, "epoch": 2541} {"train_loss": -11.147228240966797, "global_step": 426989, "epoch": 2541} {"train_loss": -10.241293907165527, "global_step": 426990, "epoch": 2541} {"train_loss": -10.259225845336914, "global_step": 426991, "epoch": 2541} {"train_loss": -11.100720405578613, "global_step": 426992, "epoch": 2541} {"train_loss": -10.215057373046875, "global_step": 426993, "epoch": 2541} {"train_loss": -10.925338745117188, "global_step": 426994, "epoch": 2541} {"train_loss": -10.037641525268555, "global_step": 426995, "epoch": 2541} {"train_loss": -10.988177299499512, "global_step": 426996, "epoch": 2541} {"train_loss": -10.420719146728516, "global_step": 426997, "epoch": 2541} {"train_loss": -11.549938201904297, "global_step": 426998, "epoch": 2541} {"train_loss": -11.882861137390137, "global_step": 426999, "epoch": 2541} {"train_loss": -11.444355964660645, "global_step": 427000, "epoch": 2541} {"train_loss": -11.816692352294922, "global_step": 427001, "epoch": 2541} {"train_loss": -11.201736450195312, "global_step": 427002, "epoch": 2541} {"train_loss": -11.480730056762695, "global_step": 427003, "epoch": 2541} {"train_loss": -11.646607398986816, "global_step": 427004, "epoch": 2541} {"train_loss": -11.892127990722656, "global_step": 427005, "epoch": 2541} {"train_loss": -11.74963665008545, "global_step": 427006, "epoch": 2541} {"train_loss": -11.162967681884766, "global_step": 427007, "epoch": 2541} {"train_loss": -11.86239242553711, "global_step": 427008, "epoch": 2541} {"train_loss": -10.727882385253906, "global_step": 427009, "epoch": 2541} {"train_loss": -11.296601295471191, "global_step": 427010, "epoch": 2541} {"train_loss": -11.33682918548584, "global_step": 427011, "epoch": 2541} {"train_loss": -10.918046951293945, "global_step": 427012, "epoch": 2541} {"train_loss": -11.40793228149414, "global_step": 427013, "epoch": 2541} {"train_loss": -11.376296043395996, "global_step": 427014, "epoch": 2541} {"train_loss": -11.183841705322266, "global_step": 427015, "epoch": 2541} {"train_loss": -11.370223045349121, "global_step": 427016, "epoch": 2541} {"train_loss": -11.177640914916992, "global_step": 427017, "epoch": 2541} {"train_loss": -11.458367347717285, "global_step": 427018, "epoch": 2541} {"train_loss": -11.232244491577148, "global_step": 427019, "epoch": 2541} {"train_loss": -11.138940811157227, "global_step": 427020, "epoch": 2541} {"train_loss": -10.972827911376953, "global_step": 427021, "epoch": 2541} {"train_loss": -11.565067291259766, "global_step": 427022, "epoch": 2541} {"train_loss": -11.791526794433594, "global_step": 427023, "epoch": 2541} {"train_loss": -10.786922454833984, "global_step": 427024, "epoch": 2541} {"train_loss": -12.212430953979492, "global_step": 427025, "epoch": 2541} {"train_loss": -11.238115310668945, "global_step": 427026, "epoch": 2541} {"train_loss": -11.422104835510254, "global_step": 427027, "epoch": 2541} {"train_loss": -11.856218338012695, "global_step": 427028, "epoch": 2541} {"train_loss": -11.345537185668945, "global_step": 427029, "epoch": 2541} {"train_loss": -12.066347122192383, "global_step": 427030, "epoch": 2541} {"train_loss": -12.127552032470703, "global_step": 427031, "epoch": 2541} {"train_loss": -11.895293235778809, "global_step": 427032, "epoch": 2541} {"train_loss": -12.064430236816406, "global_step": 427033, "epoch": 2541} {"train_loss": -11.897361755371094, "global_step": 427034, "epoch": 2541} {"train_loss": -12.204557418823242, "global_step": 427035, "epoch": 2541} {"train_loss": -12.184024810791016, "global_step": 427036, "epoch": 2541} {"train_loss": -12.283353805541992, "global_step": 427037, "epoch": 2541} {"train_loss": -12.18630599975586, "global_step": 427038, "epoch": 2541} {"train_loss": -12.342920303344727, "global_step": 427039, "epoch": 2541} {"train_loss": -12.287583351135254, "global_step": 427040, "epoch": 2541} {"train_loss": -12.284652709960938, "global_step": 427041, "epoch": 2541} {"train_loss": -11.998947143554688, "global_step": 427042, "epoch": 2541} {"train_loss": -11.840133666992188, "global_step": 427043, "epoch": 2541} {"train_loss": -12.440650939941406, "global_step": 427044, "epoch": 2541} {"train_loss": -11.53985595703125, "global_step": 427045, "epoch": 2541} {"train_loss": -12.380422592163086, "global_step": 427046, "epoch": 2541} {"train_loss": -11.935630798339844, "global_step": 427047, "epoch": 2541} {"train_loss": -12.4139404296875, "global_step": 427048, "epoch": 2541} {"train_loss": -11.881597518920898, "global_step": 427049, "epoch": 2541} {"train_loss": -12.530962944030762, "global_step": 427050, "epoch": 2541} {"train_loss": -12.276779174804688, "global_step": 427051, "epoch": 2541} {"train_loss": -12.210649490356445, "global_step": 427052, "epoch": 2541} {"train_loss": -12.382316589355469, "global_step": 427053, "epoch": 2541} {"train_loss": -12.42497444152832, "global_step": 427054, "epoch": 2541} {"train_loss": -12.07584768249875, "global_step": 427055, "epoch": 2541, "val_loss": 306305.53125} {"train_loss": -12.680000305175781, "global_step": 427056, "epoch": 2542} {"train_loss": -12.41610336303711, "global_step": 427057, "epoch": 2542} {"train_loss": -12.329591751098633, "global_step": 427058, "epoch": 2542} {"train_loss": -12.377799034118652, "global_step": 427059, "epoch": 2542} {"train_loss": -12.4478759765625, "global_step": 427060, "epoch": 2542} {"train_loss": -12.333978652954102, "global_step": 427061, "epoch": 2542} {"train_loss": -12.654878616333008, "global_step": 427062, "epoch": 2542} {"train_loss": -12.543275833129883, "global_step": 427063, "epoch": 2542} {"train_loss": -12.54787540435791, "global_step": 427064, "epoch": 2542} {"train_loss": -12.705536842346191, "global_step": 427065, "epoch": 2542} {"train_loss": -12.291629791259766, "global_step": 427066, "epoch": 2542} {"train_loss": -12.709692001342773, "global_step": 427067, "epoch": 2542} {"train_loss": -12.580473899841309, "global_step": 427068, "epoch": 2542} {"train_loss": -12.558815956115723, "global_step": 427069, "epoch": 2542} {"train_loss": -12.687454223632812, "global_step": 427070, "epoch": 2542} {"train_loss": -12.548660278320312, "global_step": 427071, "epoch": 2542} {"train_loss": -12.399136543273926, "global_step": 427072, "epoch": 2542} {"train_loss": -12.599614143371582, "global_step": 427073, "epoch": 2542} {"train_loss": -12.549161911010742, "global_step": 427074, "epoch": 2542} {"train_loss": -12.776798248291016, "global_step": 427075, "epoch": 2542} {"train_loss": -12.743427276611328, "global_step": 427076, "epoch": 2542} {"train_loss": -12.721111297607422, "global_step": 427077, "epoch": 2542} {"train_loss": -12.640325546264648, "global_step": 427078, "epoch": 2542} {"train_loss": -12.505868911743164, "global_step": 427079, "epoch": 2542} {"train_loss": -12.563632011413574, "global_step": 427080, "epoch": 2542} {"train_loss": -12.581305503845215, "global_step": 427081, "epoch": 2542} {"train_loss": -12.614049911499023, "global_step": 427082, "epoch": 2542} {"train_loss": -12.533957481384277, "global_step": 427083, "epoch": 2542} {"train_loss": -12.458353042602539, "global_step": 427084, "epoch": 2542} {"train_loss": -12.708806991577148, "global_step": 427085, "epoch": 2542} {"train_loss": -12.724474906921387, "global_step": 427086, "epoch": 2542} {"train_loss": -12.597415924072266, "global_step": 427087, "epoch": 2542} {"train_loss": -12.694433212280273, "global_step": 427088, "epoch": 2542} {"train_loss": -12.637372016906738, "global_step": 427089, "epoch": 2542} {"train_loss": -12.2386474609375, "global_step": 427090, "epoch": 2542} {"train_loss": -12.835992813110352, "global_step": 427091, "epoch": 2542} {"train_loss": -12.694992065429688, "global_step": 427092, "epoch": 2542} {"train_loss": -12.612363815307617, "global_step": 427093, "epoch": 2542} {"train_loss": -12.816656112670898, "global_step": 427094, "epoch": 2542} {"train_loss": -12.772549629211426, "global_step": 427095, "epoch": 2542} {"train_loss": -12.780611038208008, "global_step": 427096, "epoch": 2542} {"train_loss": -12.926998138427734, "global_step": 427097, "epoch": 2542} {"train_loss": -12.721982955932617, "global_step": 427098, "epoch": 2542} {"train_loss": -12.743626594543457, "global_step": 427099, "epoch": 2542} {"train_loss": -12.889577865600586, "global_step": 427100, "epoch": 2542} {"train_loss": -12.665916442871094, "global_step": 427101, "epoch": 2542} {"train_loss": -12.423948287963867, "global_step": 427102, "epoch": 2542} {"train_loss": -12.937017440795898, "global_step": 427103, "epoch": 2542} {"train_loss": -12.885419845581055, "global_step": 427104, "epoch": 2542} {"train_loss": -12.775419235229492, "global_step": 427105, "epoch": 2542} {"train_loss": -12.693562507629395, "global_step": 427106, "epoch": 2542} {"train_loss": -12.531859397888184, "global_step": 427107, "epoch": 2542} {"train_loss": -13.099288940429688, "global_step": 427108, "epoch": 2542} {"train_loss": -12.52911376953125, "global_step": 427109, "epoch": 2542} {"train_loss": -12.509891510009766, "global_step": 427110, "epoch": 2542} {"train_loss": -12.609793663024902, "global_step": 427111, "epoch": 2542} {"train_loss": -12.953378677368164, "global_step": 427112, "epoch": 2542} {"train_loss": -12.622071266174316, "global_step": 427113, "epoch": 2542} {"train_loss": -12.542884826660156, "global_step": 427114, "epoch": 2542} {"train_loss": -12.638504981994629, "global_step": 427115, "epoch": 2542} {"train_loss": -12.427572250366211, "global_step": 427116, "epoch": 2542} {"train_loss": -12.691208839416504, "global_step": 427117, "epoch": 2542} {"train_loss": -12.794687271118164, "global_step": 427118, "epoch": 2542} {"train_loss": -12.900825500488281, "global_step": 427119, "epoch": 2542} {"train_loss": -11.91529655456543, "global_step": 427120, "epoch": 2542} {"train_loss": -11.973299980163574, "global_step": 427121, "epoch": 2542} {"train_loss": -11.93757152557373, "global_step": 427122, "epoch": 2542} {"train_loss": -12.764554977416992, "global_step": 427123, "epoch": 2542} {"train_loss": -11.465240478515625, "global_step": 427124, "epoch": 2542} {"train_loss": -10.589422225952148, "global_step": 427125, "epoch": 2542} {"train_loss": -12.528090476989746, "global_step": 427126, "epoch": 2542} {"train_loss": -9.123018264770508, "global_step": 427127, "epoch": 2542} {"train_loss": -8.396095275878906, "global_step": 427128, "epoch": 2542} {"train_loss": -9.207035064697266, "global_step": 427129, "epoch": 2542} {"train_loss": -9.583675384521484, "global_step": 427130, "epoch": 2542} {"train_loss": -9.374242782592773, "global_step": 427131, "epoch": 2542} {"train_loss": -9.919549942016602, "global_step": 427132, "epoch": 2542} {"train_loss": -9.102163314819336, "global_step": 427133, "epoch": 2542} {"train_loss": -9.963886260986328, "global_step": 427134, "epoch": 2542} {"train_loss": -11.00148868560791, "global_step": 427135, "epoch": 2542} {"train_loss": -9.914398193359375, "global_step": 427136, "epoch": 2542} {"train_loss": -11.011898040771484, "global_step": 427137, "epoch": 2542} {"train_loss": -11.141900062561035, "global_step": 427138, "epoch": 2542} {"train_loss": -11.424527168273926, "global_step": 427139, "epoch": 2542} {"train_loss": -11.91099739074707, "global_step": 427140, "epoch": 2542} {"train_loss": -9.930295944213867, "global_step": 427141, "epoch": 2542} {"train_loss": -10.798870086669922, "global_step": 427142, "epoch": 2542} {"train_loss": -11.178126335144043, "global_step": 427143, "epoch": 2542} {"train_loss": -10.255163192749023, "global_step": 427144, "epoch": 2542} {"train_loss": -10.84277629852295, "global_step": 427145, "epoch": 2542} {"train_loss": -11.632091522216797, "global_step": 427146, "epoch": 2542} {"train_loss": -10.977216720581055, "global_step": 427147, "epoch": 2542} {"train_loss": -11.604187965393066, "global_step": 427148, "epoch": 2542} {"train_loss": -11.831598281860352, "global_step": 427149, "epoch": 2542} {"train_loss": -11.798334121704102, "global_step": 427150, "epoch": 2542} {"train_loss": -11.817644119262695, "global_step": 427151, "epoch": 2542} {"train_loss": -11.540851593017578, "global_step": 427152, "epoch": 2542} {"train_loss": -11.869817733764648, "global_step": 427153, "epoch": 2542} {"train_loss": -11.045724868774414, "global_step": 427154, "epoch": 2542} {"train_loss": -11.673770904541016, "global_step": 427155, "epoch": 2542} {"train_loss": -11.296300888061523, "global_step": 427156, "epoch": 2542} {"train_loss": -11.037009239196777, "global_step": 427157, "epoch": 2542} {"train_loss": -10.838788986206055, "global_step": 427158, "epoch": 2542} {"train_loss": -10.685315132141113, "global_step": 427159, "epoch": 2542} {"train_loss": -11.157681465148926, "global_step": 427160, "epoch": 2542} {"train_loss": -11.510374069213867, "global_step": 427161, "epoch": 2542} {"train_loss": -11.801332473754883, "global_step": 427162, "epoch": 2542} {"train_loss": -11.75070571899414, "global_step": 427163, "epoch": 2542} {"train_loss": -12.275853157043457, "global_step": 427164, "epoch": 2542} {"train_loss": -11.926486015319824, "global_step": 427165, "epoch": 2542} {"train_loss": -12.304281234741211, "global_step": 427166, "epoch": 2542} {"train_loss": -12.039243698120117, "global_step": 427167, "epoch": 2542} {"train_loss": -12.396164894104004, "global_step": 427168, "epoch": 2542} {"train_loss": -12.328140258789062, "global_step": 427169, "epoch": 2542} {"train_loss": -12.542255401611328, "global_step": 427170, "epoch": 2542} {"train_loss": -12.34753131866455, "global_step": 427171, "epoch": 2542} {"train_loss": -12.552459716796875, "global_step": 427172, "epoch": 2542} {"train_loss": -12.256505012512207, "global_step": 427173, "epoch": 2542} {"train_loss": -12.378134727478027, "global_step": 427174, "epoch": 2542} {"train_loss": -12.24654769897461, "global_step": 427175, "epoch": 2542} {"train_loss": -12.466869354248047, "global_step": 427176, "epoch": 2542} {"train_loss": -12.100953102111816, "global_step": 427177, "epoch": 2542} {"train_loss": -12.250431060791016, "global_step": 427178, "epoch": 2542} {"train_loss": -12.166316986083984, "global_step": 427179, "epoch": 2542} {"train_loss": -12.258646965026855, "global_step": 427180, "epoch": 2542} {"train_loss": -12.35438346862793, "global_step": 427181, "epoch": 2542} {"train_loss": -12.382485389709473, "global_step": 427182, "epoch": 2542} {"train_loss": -12.03884506225586, "global_step": 427183, "epoch": 2542} {"train_loss": -12.126462936401367, "global_step": 427184, "epoch": 2542} {"train_loss": -12.25023078918457, "global_step": 427185, "epoch": 2542} {"train_loss": -12.29059886932373, "global_step": 427186, "epoch": 2542} {"train_loss": -11.905351638793945, "global_step": 427187, "epoch": 2542} {"train_loss": -12.177608489990234, "global_step": 427188, "epoch": 2542} {"train_loss": -12.252117156982422, "global_step": 427189, "epoch": 2542} {"train_loss": -12.26455307006836, "global_step": 427190, "epoch": 2542} {"train_loss": -12.545348167419434, "global_step": 427191, "epoch": 2542} {"train_loss": -12.227804183959961, "global_step": 427192, "epoch": 2542} {"train_loss": -12.627996444702148, "global_step": 427193, "epoch": 2542} {"train_loss": -12.385262489318848, "global_step": 427194, "epoch": 2542} {"train_loss": -12.472646713256836, "global_step": 427195, "epoch": 2542} {"train_loss": -12.423018455505371, "global_step": 427196, "epoch": 2542} {"train_loss": -12.441904067993164, "global_step": 427197, "epoch": 2542} {"train_loss": -12.026243209838867, "global_step": 427198, "epoch": 2542} {"train_loss": -12.16172981262207, "global_step": 427199, "epoch": 2542} {"train_loss": -12.242425918579102, "global_step": 427200, "epoch": 2542} {"train_loss": -12.221037864685059, "global_step": 427201, "epoch": 2542} {"train_loss": -12.158584594726562, "global_step": 427202, "epoch": 2542} {"train_loss": -12.43695068359375, "global_step": 427203, "epoch": 2542} {"train_loss": -11.976066589355469, "global_step": 427204, "epoch": 2542} {"train_loss": -12.259525299072266, "global_step": 427205, "epoch": 2542} {"train_loss": -12.047703742980957, "global_step": 427206, "epoch": 2542} {"train_loss": -12.613685607910156, "global_step": 427207, "epoch": 2542} {"train_loss": -12.518665313720703, "global_step": 427208, "epoch": 2542} {"train_loss": -12.427534103393555, "global_step": 427209, "epoch": 2542} {"train_loss": -12.330427169799805, "global_step": 427210, "epoch": 2542} {"train_loss": -12.426422119140625, "global_step": 427211, "epoch": 2542} {"train_loss": -12.45408821105957, "global_step": 427212, "epoch": 2542} {"train_loss": -12.513066291809082, "global_step": 427213, "epoch": 2542} {"train_loss": -12.305448532104492, "global_step": 427214, "epoch": 2542} {"train_loss": -12.591085433959961, "global_step": 427215, "epoch": 2542} {"train_loss": -12.530511856079102, "global_step": 427216, "epoch": 2542} {"train_loss": -12.52580451965332, "global_step": 427217, "epoch": 2542} {"train_loss": -12.043672561645508, "global_step": 427218, "epoch": 2542} {"train_loss": -12.559706687927246, "global_step": 427219, "epoch": 2542} {"train_loss": -12.623918533325195, "global_step": 427220, "epoch": 2542} {"train_loss": -12.338996887207031, "global_step": 427221, "epoch": 2542} {"train_loss": -12.46475601196289, "global_step": 427222, "epoch": 2542} {"train_loss": -12.08944845199585, "global_step": 427223, "epoch": 2542, "val_loss": 304936.59375} {"train_loss": -12.224066734313965, "global_step": 427224, "epoch": 2543} {"train_loss": -12.615596771240234, "global_step": 427225, "epoch": 2543} {"train_loss": -12.183448791503906, "global_step": 427226, "epoch": 2543} {"train_loss": -12.231873512268066, "global_step": 427227, "epoch": 2543} {"train_loss": -12.092230796813965, "global_step": 427228, "epoch": 2543} {"train_loss": -12.417776107788086, "global_step": 427229, "epoch": 2543} {"train_loss": -12.143585205078125, "global_step": 427230, "epoch": 2543} {"train_loss": -12.085884094238281, "global_step": 427231, "epoch": 2543} {"train_loss": -12.110496520996094, "global_step": 427232, "epoch": 2543} {"train_loss": -12.011956214904785, "global_step": 427233, "epoch": 2543} {"train_loss": -12.2530517578125, "global_step": 427234, "epoch": 2543} {"train_loss": -12.578352928161621, "global_step": 427235, "epoch": 2543} {"train_loss": -12.650402069091797, "global_step": 427236, "epoch": 2543} {"train_loss": -12.311327934265137, "global_step": 427237, "epoch": 2543} {"train_loss": -12.405444145202637, "global_step": 427238, "epoch": 2543} {"train_loss": -12.369644165039062, "global_step": 427239, "epoch": 2543} {"train_loss": -12.837336540222168, "global_step": 427240, "epoch": 2543} {"train_loss": -12.183958053588867, "global_step": 427241, "epoch": 2543} {"train_loss": -12.639411926269531, "global_step": 427242, "epoch": 2543} {"train_loss": -12.25741195678711, "global_step": 427243, "epoch": 2543} {"train_loss": -12.666120529174805, "global_step": 427244, "epoch": 2543} {"train_loss": -12.393073081970215, "global_step": 427245, "epoch": 2543} {"train_loss": -12.755329132080078, "global_step": 427246, "epoch": 2543} {"train_loss": -12.578768730163574, "global_step": 427247, "epoch": 2543} {"train_loss": -12.433277130126953, "global_step": 427248, "epoch": 2543} {"train_loss": -12.696649551391602, "global_step": 427249, "epoch": 2543} {"train_loss": -12.446907043457031, "global_step": 427250, "epoch": 2543} {"train_loss": -12.440461158752441, "global_step": 427251, "epoch": 2543} {"train_loss": -12.656274795532227, "global_step": 427252, "epoch": 2543} {"train_loss": -12.476229667663574, "global_step": 427253, "epoch": 2543} {"train_loss": -12.009140014648438, "global_step": 427254, "epoch": 2543} {"train_loss": -12.521045684814453, "global_step": 427255, "epoch": 2543} {"train_loss": -12.536130905151367, "global_step": 427256, "epoch": 2543} {"train_loss": -12.356195449829102, "global_step": 427257, "epoch": 2543} {"train_loss": -12.507810592651367, "global_step": 427258, "epoch": 2543} {"train_loss": -12.267135620117188, "global_step": 427259, "epoch": 2543} {"train_loss": -12.492111206054688, "global_step": 427260, "epoch": 2543} {"train_loss": -12.500265121459961, "global_step": 427261, "epoch": 2543} {"train_loss": -12.51761531829834, "global_step": 427262, "epoch": 2543} {"train_loss": -12.602615356445312, "global_step": 427263, "epoch": 2543} {"train_loss": -12.544952392578125, "global_step": 427264, "epoch": 2543} {"train_loss": -12.388051986694336, "global_step": 427265, "epoch": 2543} {"train_loss": -12.54269027709961, "global_step": 427266, "epoch": 2543} {"train_loss": -12.101689338684082, "global_step": 427267, "epoch": 2543} {"train_loss": -12.342876434326172, "global_step": 427268, "epoch": 2543} {"train_loss": -12.491598129272461, "global_step": 427269, "epoch": 2543} {"train_loss": -12.583210945129395, "global_step": 427270, "epoch": 2543} {"train_loss": -12.5962495803833, "global_step": 427271, "epoch": 2543} {"train_loss": -12.353504180908203, "global_step": 427272, "epoch": 2543} {"train_loss": -12.232817649841309, "global_step": 427273, "epoch": 2543} {"train_loss": -12.776036262512207, "global_step": 427274, "epoch": 2543} {"train_loss": -12.03193187713623, "global_step": 427275, "epoch": 2543} {"train_loss": -11.540140151977539, "global_step": 427276, "epoch": 2543} {"train_loss": -10.5809965133667, "global_step": 427277, "epoch": 2543} {"train_loss": -10.712292671203613, "global_step": 427278, "epoch": 2543} {"train_loss": -11.38375186920166, "global_step": 427279, "epoch": 2543} {"train_loss": -10.823808670043945, "global_step": 427280, "epoch": 2543} {"train_loss": -12.158727645874023, "global_step": 427281, "epoch": 2543} {"train_loss": -11.100028991699219, "global_step": 427282, "epoch": 2543} {"train_loss": -12.366971969604492, "global_step": 427283, "epoch": 2543} {"train_loss": -10.83306884765625, "global_step": 427284, "epoch": 2543} {"train_loss": -11.456852912902832, "global_step": 427285, "epoch": 2543} {"train_loss": -11.880864143371582, "global_step": 427286, "epoch": 2543} {"train_loss": -10.54052734375, "global_step": 427287, "epoch": 2543} {"train_loss": -11.279670715332031, "global_step": 427288, "epoch": 2543} {"train_loss": -10.320544242858887, "global_step": 427289, "epoch": 2543} {"train_loss": -11.636222839355469, "global_step": 427290, "epoch": 2543} {"train_loss": -9.969358444213867, "global_step": 427291, "epoch": 2543} {"train_loss": -10.19520378112793, "global_step": 427292, "epoch": 2543} {"train_loss": -11.779691696166992, "global_step": 427293, "epoch": 2543} {"train_loss": -10.200155258178711, "global_step": 427294, "epoch": 2543} {"train_loss": -11.147544860839844, "global_step": 427295, "epoch": 2543} {"train_loss": -11.235550880432129, "global_step": 427296, "epoch": 2543} {"train_loss": -10.571619033813477, "global_step": 427297, "epoch": 2543} {"train_loss": -10.667768478393555, "global_step": 427298, "epoch": 2543} {"train_loss": -11.686050415039062, "global_step": 427299, "epoch": 2543} {"train_loss": -11.306872367858887, "global_step": 427300, "epoch": 2543} {"train_loss": -11.482213973999023, "global_step": 427301, "epoch": 2543} {"train_loss": -10.11380386352539, "global_step": 427302, "epoch": 2543} {"train_loss": -11.430124282836914, "global_step": 427303, "epoch": 2543} {"train_loss": -11.424009323120117, "global_step": 427304, "epoch": 2543} {"train_loss": -11.329813003540039, "global_step": 427305, "epoch": 2543} {"train_loss": -10.688777923583984, "global_step": 427306, "epoch": 2543} {"train_loss": -10.734467506408691, "global_step": 427307, "epoch": 2543} {"train_loss": -11.844764709472656, "global_step": 427308, "epoch": 2543} {"train_loss": -11.624016761779785, "global_step": 427309, "epoch": 2543} {"train_loss": -11.275466918945312, "global_step": 427310, "epoch": 2543} {"train_loss": -12.297011375427246, "global_step": 427311, "epoch": 2543} {"train_loss": -11.759995460510254, "global_step": 427312, "epoch": 2543} {"train_loss": -11.539670944213867, "global_step": 427313, "epoch": 2543} {"train_loss": -11.738750457763672, "global_step": 427314, "epoch": 2543} {"train_loss": -11.291000366210938, "global_step": 427315, "epoch": 2543} {"train_loss": -11.926769256591797, "global_step": 427316, "epoch": 2543} {"train_loss": -11.236797332763672, "global_step": 427317, "epoch": 2543} {"train_loss": -11.998859405517578, "global_step": 427318, "epoch": 2543} {"train_loss": -11.919867515563965, "global_step": 427319, "epoch": 2543} {"train_loss": -11.970024108886719, "global_step": 427320, "epoch": 2543} {"train_loss": -11.993114471435547, "global_step": 427321, "epoch": 2543} {"train_loss": -12.063705444335938, "global_step": 427322, "epoch": 2543} {"train_loss": -11.883064270019531, "global_step": 427323, "epoch": 2543} {"train_loss": -12.157752990722656, "global_step": 427324, "epoch": 2543} {"train_loss": -12.104020118713379, "global_step": 427325, "epoch": 2543} {"train_loss": -12.071139335632324, "global_step": 427326, "epoch": 2543} {"train_loss": -11.96352767944336, "global_step": 427327, "epoch": 2543} {"train_loss": -11.84461784362793, "global_step": 427328, "epoch": 2543} {"train_loss": -12.013570785522461, "global_step": 427329, "epoch": 2543} {"train_loss": -11.87430191040039, "global_step": 427330, "epoch": 2543} {"train_loss": -12.153502464294434, "global_step": 427331, "epoch": 2543} {"train_loss": -11.812984466552734, "global_step": 427332, "epoch": 2543} {"train_loss": -12.134258270263672, "global_step": 427333, "epoch": 2543} {"train_loss": -11.986910820007324, "global_step": 427334, "epoch": 2543} {"train_loss": -11.913633346557617, "global_step": 427335, "epoch": 2543} {"train_loss": -12.023507118225098, "global_step": 427336, "epoch": 2543} {"train_loss": -11.84322738647461, "global_step": 427337, "epoch": 2543} {"train_loss": -11.546955108642578, "global_step": 427338, "epoch": 2543} {"train_loss": -12.07699203491211, "global_step": 427339, "epoch": 2543} {"train_loss": -12.02978515625, "global_step": 427340, "epoch": 2543} {"train_loss": -11.880024909973145, "global_step": 427341, "epoch": 2543} {"train_loss": -12.248010635375977, "global_step": 427342, "epoch": 2543} {"train_loss": -11.732172966003418, "global_step": 427343, "epoch": 2543} {"train_loss": -12.363032341003418, "global_step": 427344, "epoch": 2543} {"train_loss": -11.812847137451172, "global_step": 427345, "epoch": 2543} {"train_loss": -11.855681419372559, "global_step": 427346, "epoch": 2543} {"train_loss": -12.376070022583008, "global_step": 427347, "epoch": 2543} {"train_loss": -11.17807388305664, "global_step": 427348, "epoch": 2543} {"train_loss": -12.415029525756836, "global_step": 427349, "epoch": 2543} {"train_loss": -12.101829528808594, "global_step": 427350, "epoch": 2543} {"train_loss": -11.728185653686523, "global_step": 427351, "epoch": 2543} {"train_loss": -12.551511764526367, "global_step": 427352, "epoch": 2543} {"train_loss": -12.120267868041992, "global_step": 427353, "epoch": 2543} {"train_loss": -12.493030548095703, "global_step": 427354, "epoch": 2543} {"train_loss": -12.199178695678711, "global_step": 427355, "epoch": 2543} {"train_loss": -11.86138916015625, "global_step": 427356, "epoch": 2543} {"train_loss": -12.073497772216797, "global_step": 427357, "epoch": 2543} {"train_loss": -11.629660606384277, "global_step": 427358, "epoch": 2543} {"train_loss": -12.267294883728027, "global_step": 427359, "epoch": 2543} {"train_loss": -11.735357284545898, "global_step": 427360, "epoch": 2543} {"train_loss": -12.11419677734375, "global_step": 427361, "epoch": 2543} {"train_loss": -12.21731948852539, "global_step": 427362, "epoch": 2543} {"train_loss": -11.875377655029297, "global_step": 427363, "epoch": 2543} {"train_loss": -12.333422660827637, "global_step": 427364, "epoch": 2543} {"train_loss": -11.743694305419922, "global_step": 427365, "epoch": 2543} {"train_loss": -12.447284698486328, "global_step": 427366, "epoch": 2543} {"train_loss": -12.101005554199219, "global_step": 427367, "epoch": 2543} {"train_loss": -12.602731704711914, "global_step": 427368, "epoch": 2543} {"train_loss": -12.254762649536133, "global_step": 427369, "epoch": 2543} {"train_loss": -12.266552925109863, "global_step": 427370, "epoch": 2543} {"train_loss": -12.413424491882324, "global_step": 427371, "epoch": 2543} {"train_loss": -12.283833503723145, "global_step": 427372, "epoch": 2543} {"train_loss": -12.410484313964844, "global_step": 427373, "epoch": 2543} {"train_loss": -12.586236000061035, "global_step": 427374, "epoch": 2543} {"train_loss": -12.306241989135742, "global_step": 427375, "epoch": 2543} {"train_loss": -12.498308181762695, "global_step": 427376, "epoch": 2543} {"train_loss": -12.376805305480957, "global_step": 427377, "epoch": 2543} {"train_loss": -12.448044776916504, "global_step": 427378, "epoch": 2543} {"train_loss": -12.622981071472168, "global_step": 427379, "epoch": 2543} {"train_loss": -12.422208786010742, "global_step": 427380, "epoch": 2543} {"train_loss": -12.450325012207031, "global_step": 427381, "epoch": 2543} {"train_loss": -12.398441314697266, "global_step": 427382, "epoch": 2543} {"train_loss": -11.86526107788086, "global_step": 427383, "epoch": 2543} {"train_loss": -12.461483001708984, "global_step": 427384, "epoch": 2543} {"train_loss": -12.070457458496094, "global_step": 427385, "epoch": 2543} {"train_loss": -12.147512435913086, "global_step": 427386, "epoch": 2543} {"train_loss": -12.517135620117188, "global_step": 427387, "epoch": 2543} {"train_loss": -12.253832817077637, "global_step": 427388, "epoch": 2543} {"train_loss": -12.586097717285156, "global_step": 427389, "epoch": 2543} {"train_loss": -12.490001678466797, "global_step": 427390, "epoch": 2543} {"train_loss": -11.990592808950515, "global_step": 427391, "epoch": 2543, "val_loss": 309515.15625} {"train_loss": -12.611248970031738, "global_step": 427392, "epoch": 2544} {"train_loss": -12.597307205200195, "global_step": 427393, "epoch": 2544} {"train_loss": -12.754220962524414, "global_step": 427394, "epoch": 2544} {"train_loss": -12.40098762512207, "global_step": 427395, "epoch": 2544} {"train_loss": -12.301305770874023, "global_step": 427396, "epoch": 2544} {"train_loss": -12.54771614074707, "global_step": 427397, "epoch": 2544} {"train_loss": -12.509539604187012, "global_step": 427398, "epoch": 2544} {"train_loss": -12.526102066040039, "global_step": 427399, "epoch": 2544} {"train_loss": -12.746630668640137, "global_step": 427400, "epoch": 2544} {"train_loss": -12.402099609375, "global_step": 427401, "epoch": 2544} {"train_loss": -12.657310485839844, "global_step": 427402, "epoch": 2544} {"train_loss": -12.61223316192627, "global_step": 427403, "epoch": 2544} {"train_loss": -12.38747787475586, "global_step": 427404, "epoch": 2544} {"train_loss": -12.718172073364258, "global_step": 427405, "epoch": 2544} {"train_loss": -12.72718334197998, "global_step": 427406, "epoch": 2544} {"train_loss": -12.391857147216797, "global_step": 427407, "epoch": 2544} {"train_loss": -12.324905395507812, "global_step": 427408, "epoch": 2544} {"train_loss": -12.00326919555664, "global_step": 427409, "epoch": 2544} {"train_loss": -11.428773880004883, "global_step": 427410, "epoch": 2544} {"train_loss": -12.825315475463867, "global_step": 427411, "epoch": 2544} {"train_loss": -11.723936080932617, "global_step": 427412, "epoch": 2544} {"train_loss": -11.873135566711426, "global_step": 427413, "epoch": 2544} {"train_loss": -12.731277465820312, "global_step": 427414, "epoch": 2544} {"train_loss": -11.752360343933105, "global_step": 427415, "epoch": 2544} {"train_loss": -12.344501495361328, "global_step": 427416, "epoch": 2544} {"train_loss": -12.51519775390625, "global_step": 427417, "epoch": 2544} {"train_loss": -12.562572479248047, "global_step": 427418, "epoch": 2544} {"train_loss": -12.543750762939453, "global_step": 427419, "epoch": 2544} {"train_loss": -12.13841724395752, "global_step": 427420, "epoch": 2544} {"train_loss": -12.376076698303223, "global_step": 427421, "epoch": 2544} {"train_loss": -12.508894920349121, "global_step": 427422, "epoch": 2544} {"train_loss": -12.309741973876953, "global_step": 427423, "epoch": 2544} {"train_loss": -11.496644973754883, "global_step": 427424, "epoch": 2544} {"train_loss": -11.95981216430664, "global_step": 427425, "epoch": 2544} {"train_loss": -11.93172550201416, "global_step": 427426, "epoch": 2544} {"train_loss": -10.498655319213867, "global_step": 427427, "epoch": 2544} {"train_loss": -12.754977226257324, "global_step": 427428, "epoch": 2544} {"train_loss": -11.095754623413086, "global_step": 427429, "epoch": 2544} {"train_loss": -12.041463851928711, "global_step": 427430, "epoch": 2544} {"train_loss": -11.836538314819336, "global_step": 427431, "epoch": 2544} {"train_loss": -11.140848159790039, "global_step": 427432, "epoch": 2544} {"train_loss": -11.737510681152344, "global_step": 427433, "epoch": 2544} {"train_loss": -10.713054656982422, "global_step": 427434, "epoch": 2544} {"train_loss": -11.652092933654785, "global_step": 427435, "epoch": 2544} {"train_loss": -10.670400619506836, "global_step": 427436, "epoch": 2544} {"train_loss": -11.739583015441895, "global_step": 427437, "epoch": 2544} {"train_loss": -11.279094696044922, "global_step": 427438, "epoch": 2544} {"train_loss": -11.333260536193848, "global_step": 427439, "epoch": 2544} {"train_loss": -11.382308959960938, "global_step": 427440, "epoch": 2544} {"train_loss": -11.841968536376953, "global_step": 427441, "epoch": 2544} {"train_loss": -11.74909782409668, "global_step": 427442, "epoch": 2544} {"train_loss": -11.793086051940918, "global_step": 427443, "epoch": 2544} {"train_loss": -12.222485542297363, "global_step": 427444, "epoch": 2544} {"train_loss": -12.238635063171387, "global_step": 427445, "epoch": 2544} {"train_loss": -12.083391189575195, "global_step": 427446, "epoch": 2544} {"train_loss": -12.676448822021484, "global_step": 427447, "epoch": 2544} {"train_loss": -12.057568550109863, "global_step": 427448, "epoch": 2544} {"train_loss": -12.33322525024414, "global_step": 427449, "epoch": 2544} {"train_loss": -12.63924789428711, "global_step": 427450, "epoch": 2544} {"train_loss": -12.003178596496582, "global_step": 427451, "epoch": 2544} {"train_loss": -12.33434009552002, "global_step": 427452, "epoch": 2544} {"train_loss": -12.04802131652832, "global_step": 427453, "epoch": 2544} {"train_loss": -12.302523612976074, "global_step": 427454, "epoch": 2544} {"train_loss": -12.284355163574219, "global_step": 427455, "epoch": 2544} {"train_loss": -12.264820098876953, "global_step": 427456, "epoch": 2544} {"train_loss": -12.515384674072266, "global_step": 427457, "epoch": 2544} {"train_loss": -11.979570388793945, "global_step": 427458, "epoch": 2544} {"train_loss": -12.429189682006836, "global_step": 427459, "epoch": 2544} {"train_loss": -12.443739891052246, "global_step": 427460, "epoch": 2544} {"train_loss": -12.427988052368164, "global_step": 427461, "epoch": 2544} {"train_loss": -12.492599487304688, "global_step": 427462, "epoch": 2544} {"train_loss": -12.44896125793457, "global_step": 427463, "epoch": 2544} {"train_loss": -12.653170585632324, "global_step": 427464, "epoch": 2544} {"train_loss": -12.322484970092773, "global_step": 427465, "epoch": 2544} {"train_loss": -12.710121154785156, "global_step": 427466, "epoch": 2544} {"train_loss": -12.379182815551758, "global_step": 427467, "epoch": 2544} {"train_loss": -12.732991218566895, "global_step": 427468, "epoch": 2544} {"train_loss": -12.63636302947998, "global_step": 427469, "epoch": 2544} {"train_loss": -12.644779205322266, "global_step": 427470, "epoch": 2544} {"train_loss": -12.492518424987793, "global_step": 427471, "epoch": 2544} {"train_loss": -12.338744163513184, "global_step": 427472, "epoch": 2544} {"train_loss": -12.617591857910156, "global_step": 427473, "epoch": 2544} {"train_loss": -12.58154296875, "global_step": 427474, "epoch": 2544} {"train_loss": -12.486221313476562, "global_step": 427475, "epoch": 2544} {"train_loss": -12.235097885131836, "global_step": 427476, "epoch": 2544} {"train_loss": -12.428049087524414, "global_step": 427477, "epoch": 2544} {"train_loss": -12.474678039550781, "global_step": 427478, "epoch": 2544} {"train_loss": -12.529122352600098, "global_step": 427479, "epoch": 2544} {"train_loss": -12.493339538574219, "global_step": 427480, "epoch": 2544} {"train_loss": -12.060964584350586, "global_step": 427481, "epoch": 2544} {"train_loss": -12.36016845703125, "global_step": 427482, "epoch": 2544} {"train_loss": -12.45206069946289, "global_step": 427483, "epoch": 2544} {"train_loss": -12.775274276733398, "global_step": 427484, "epoch": 2544} {"train_loss": -12.529619216918945, "global_step": 427485, "epoch": 2544} {"train_loss": -12.626182556152344, "global_step": 427486, "epoch": 2544} {"train_loss": -12.394325256347656, "global_step": 427487, "epoch": 2544} {"train_loss": -12.501920700073242, "global_step": 427488, "epoch": 2544} {"train_loss": -12.620615005493164, "global_step": 427489, "epoch": 2544} {"train_loss": -12.545635223388672, "global_step": 427490, "epoch": 2544} {"train_loss": -12.411069869995117, "global_step": 427491, "epoch": 2544} {"train_loss": -12.224359512329102, "global_step": 427492, "epoch": 2544} {"train_loss": -12.690021514892578, "global_step": 427493, "epoch": 2544} {"train_loss": -12.545669555664062, "global_step": 427494, "epoch": 2544} {"train_loss": -12.298896789550781, "global_step": 427495, "epoch": 2544} {"train_loss": -12.564312934875488, "global_step": 427496, "epoch": 2544} {"train_loss": -11.878951072692871, "global_step": 427497, "epoch": 2544} {"train_loss": -12.264350891113281, "global_step": 427498, "epoch": 2544} {"train_loss": -12.181307792663574, "global_step": 427499, "epoch": 2544} {"train_loss": -11.755399703979492, "global_step": 427500, "epoch": 2544} {"train_loss": -12.664596557617188, "global_step": 427501, "epoch": 2544} {"train_loss": -12.256032943725586, "global_step": 427502, "epoch": 2544} {"train_loss": -12.547916412353516, "global_step": 427503, "epoch": 2544} {"train_loss": -12.41986083984375, "global_step": 427504, "epoch": 2544} {"train_loss": -12.498762130737305, "global_step": 427505, "epoch": 2544} {"train_loss": -12.511857032775879, "global_step": 427506, "epoch": 2544} {"train_loss": -12.360359191894531, "global_step": 427507, "epoch": 2544} {"train_loss": -11.934598922729492, "global_step": 427508, "epoch": 2544} {"train_loss": -11.45464038848877, "global_step": 427509, "epoch": 2544} {"train_loss": -11.715778350830078, "global_step": 427510, "epoch": 2544} {"train_loss": -12.627029418945312, "global_step": 427511, "epoch": 2544} {"train_loss": -12.158445358276367, "global_step": 427512, "epoch": 2544} {"train_loss": -11.22874641418457, "global_step": 427513, "epoch": 2544} {"train_loss": -11.730887413024902, "global_step": 427514, "epoch": 2544} {"train_loss": -12.286593437194824, "global_step": 427515, "epoch": 2544} {"train_loss": -11.659271240234375, "global_step": 427516, "epoch": 2544} {"train_loss": -11.522537231445312, "global_step": 427517, "epoch": 2544} {"train_loss": -12.637296676635742, "global_step": 427518, "epoch": 2544} {"train_loss": -11.904555320739746, "global_step": 427519, "epoch": 2544} {"train_loss": -12.339229583740234, "global_step": 427520, "epoch": 2544} {"train_loss": -12.524250030517578, "global_step": 427521, "epoch": 2544} {"train_loss": -12.10041618347168, "global_step": 427522, "epoch": 2544} {"train_loss": -12.434999465942383, "global_step": 427523, "epoch": 2544} {"train_loss": -12.378904342651367, "global_step": 427524, "epoch": 2544} {"train_loss": -12.349990844726562, "global_step": 427525, "epoch": 2544} {"train_loss": -12.198674201965332, "global_step": 427526, "epoch": 2544} {"train_loss": -12.635208129882812, "global_step": 427527, "epoch": 2544} {"train_loss": -12.158734321594238, "global_step": 427528, "epoch": 2544} {"train_loss": -12.367680549621582, "global_step": 427529, "epoch": 2544} {"train_loss": -12.203084945678711, "global_step": 427530, "epoch": 2544} {"train_loss": -12.394948959350586, "global_step": 427531, "epoch": 2544} {"train_loss": -12.380926132202148, "global_step": 427532, "epoch": 2544} {"train_loss": -11.981884002685547, "global_step": 427533, "epoch": 2544} {"train_loss": -12.440511703491211, "global_step": 427534, "epoch": 2544} {"train_loss": -12.377817153930664, "global_step": 427535, "epoch": 2544} {"train_loss": -12.345680236816406, "global_step": 427536, "epoch": 2544} {"train_loss": -12.349251747131348, "global_step": 427537, "epoch": 2544} {"train_loss": -12.441425323486328, "global_step": 427538, "epoch": 2544} {"train_loss": -12.277421951293945, "global_step": 427539, "epoch": 2544} {"train_loss": -12.497998237609863, "global_step": 427540, "epoch": 2544} {"train_loss": -12.279340744018555, "global_step": 427541, "epoch": 2544} {"train_loss": -12.424514770507812, "global_step": 427542, "epoch": 2544} {"train_loss": -12.308457374572754, "global_step": 427543, "epoch": 2544} {"train_loss": -12.078027725219727, "global_step": 427544, "epoch": 2544} {"train_loss": -12.40989875793457, "global_step": 427545, "epoch": 2544} {"train_loss": -11.28993034362793, "global_step": 427546, "epoch": 2544} {"train_loss": -12.011140823364258, "global_step": 427547, "epoch": 2544} {"train_loss": -12.085664749145508, "global_step": 427548, "epoch": 2544} {"train_loss": -11.541894912719727, "global_step": 427549, "epoch": 2544} {"train_loss": -12.141019821166992, "global_step": 427550, "epoch": 2544} {"train_loss": -12.396190643310547, "global_step": 427551, "epoch": 2544} {"train_loss": -11.766838073730469, "global_step": 427552, "epoch": 2544} {"train_loss": -12.53110408782959, "global_step": 427553, "epoch": 2544} {"train_loss": -12.15447998046875, "global_step": 427554, "epoch": 2544} {"train_loss": -12.426412582397461, "global_step": 427555, "epoch": 2544} {"train_loss": -11.969515800476074, "global_step": 427556, "epoch": 2544} {"train_loss": -10.051542282104492, "global_step": 427557, "epoch": 2544} {"train_loss": -10.804670333862305, "global_step": 427558, "epoch": 2544} {"train_loss": -12.20159065155756, "global_step": 427559, "epoch": 2544, "val_loss": 305681.75} {"train_loss": -11.338949203491211, "global_step": 427560, "epoch": 2545} {"train_loss": -12.636326789855957, "global_step": 427561, "epoch": 2545} {"train_loss": -11.912862777709961, "global_step": 427562, "epoch": 2545} {"train_loss": -12.077441215515137, "global_step": 427563, "epoch": 2545} {"train_loss": -11.240486145019531, "global_step": 427564, "epoch": 2545} {"train_loss": -12.171010971069336, "global_step": 427565, "epoch": 2545} {"train_loss": -12.157254219055176, "global_step": 427566, "epoch": 2545} {"train_loss": -11.452099800109863, "global_step": 427567, "epoch": 2545} {"train_loss": -11.607885360717773, "global_step": 427568, "epoch": 2545} {"train_loss": -11.953224182128906, "global_step": 427569, "epoch": 2545} {"train_loss": -11.076040267944336, "global_step": 427570, "epoch": 2545} {"train_loss": -12.149430274963379, "global_step": 427571, "epoch": 2545} {"train_loss": -11.769973754882812, "global_step": 427572, "epoch": 2545} {"train_loss": -11.519025802612305, "global_step": 427573, "epoch": 2545} {"train_loss": -12.237141609191895, "global_step": 427574, "epoch": 2545} {"train_loss": -11.46065616607666, "global_step": 427575, "epoch": 2545} {"train_loss": -12.356182098388672, "global_step": 427576, "epoch": 2545} {"train_loss": -12.133610725402832, "global_step": 427577, "epoch": 2545} {"train_loss": -11.756746292114258, "global_step": 427578, "epoch": 2545} {"train_loss": -12.349428176879883, "global_step": 427579, "epoch": 2545} {"train_loss": -11.580526351928711, "global_step": 427580, "epoch": 2545} {"train_loss": -11.316749572753906, "global_step": 427581, "epoch": 2545} {"train_loss": -11.491552352905273, "global_step": 427582, "epoch": 2545} {"train_loss": -11.69290828704834, "global_step": 427583, "epoch": 2545} {"train_loss": -10.006464004516602, "global_step": 427584, "epoch": 2545} {"train_loss": -11.702423095703125, "global_step": 427585, "epoch": 2545} {"train_loss": -11.65800666809082, "global_step": 427586, "epoch": 2545} {"train_loss": -11.875859260559082, "global_step": 427587, "epoch": 2545} {"train_loss": -12.004605293273926, "global_step": 427588, "epoch": 2545} {"train_loss": -11.930561065673828, "global_step": 427589, "epoch": 2545} {"train_loss": -12.2510986328125, "global_step": 427590, "epoch": 2545} {"train_loss": -11.893495559692383, "global_step": 427591, "epoch": 2545} {"train_loss": -12.275179862976074, "global_step": 427592, "epoch": 2545} {"train_loss": -11.953704833984375, "global_step": 427593, "epoch": 2545} {"train_loss": -11.862720489501953, "global_step": 427594, "epoch": 2545} {"train_loss": -12.269869804382324, "global_step": 427595, "epoch": 2545} {"train_loss": -11.62781810760498, "global_step": 427596, "epoch": 2545} {"train_loss": -12.343470573425293, "global_step": 427597, "epoch": 2545} {"train_loss": -12.254462242126465, "global_step": 427598, "epoch": 2545} {"train_loss": -12.173372268676758, "global_step": 427599, "epoch": 2545} {"train_loss": -12.321486473083496, "global_step": 427600, "epoch": 2545} {"train_loss": -12.19086742401123, "global_step": 427601, "epoch": 2545} {"train_loss": -12.583318710327148, "global_step": 427602, "epoch": 2545} {"train_loss": -12.485099792480469, "global_step": 427603, "epoch": 2545} {"train_loss": -12.503227233886719, "global_step": 427604, "epoch": 2545} {"train_loss": -12.504915237426758, "global_step": 427605, "epoch": 2545} {"train_loss": -12.188746452331543, "global_step": 427606, "epoch": 2545} {"train_loss": -12.555530548095703, "global_step": 427607, "epoch": 2545} {"train_loss": -12.034782409667969, "global_step": 427608, "epoch": 2545} {"train_loss": -12.484772682189941, "global_step": 427609, "epoch": 2545} {"train_loss": -12.298006057739258, "global_step": 427610, "epoch": 2545} {"train_loss": -12.377025604248047, "global_step": 427611, "epoch": 2545} {"train_loss": -12.369118690490723, "global_step": 427612, "epoch": 2545} {"train_loss": -12.168819427490234, "global_step": 427613, "epoch": 2545} {"train_loss": -12.180364608764648, "global_step": 427614, "epoch": 2545} {"train_loss": -12.350141525268555, "global_step": 427615, "epoch": 2545} {"train_loss": -12.135751724243164, "global_step": 427616, "epoch": 2545} {"train_loss": -12.306078910827637, "global_step": 427617, "epoch": 2545} {"train_loss": -12.496147155761719, "global_step": 427618, "epoch": 2545} {"train_loss": -12.554377555847168, "global_step": 427619, "epoch": 2545} {"train_loss": -12.5094633102417, "global_step": 427620, "epoch": 2545} {"train_loss": -12.629454612731934, "global_step": 427621, "epoch": 2545} {"train_loss": -12.634037017822266, "global_step": 427622, "epoch": 2545} {"train_loss": -12.548383712768555, "global_step": 427623, "epoch": 2545} {"train_loss": -12.680826187133789, "global_step": 427624, "epoch": 2545} {"train_loss": -12.38588809967041, "global_step": 427625, "epoch": 2545} {"train_loss": -12.63917350769043, "global_step": 427626, "epoch": 2545} {"train_loss": -12.017366409301758, "global_step": 427627, "epoch": 2545} {"train_loss": -12.540445327758789, "global_step": 427628, "epoch": 2545} {"train_loss": -12.201168060302734, "global_step": 427629, "epoch": 2545} {"train_loss": -12.769529342651367, "global_step": 427630, "epoch": 2545} {"train_loss": -12.325645446777344, "global_step": 427631, "epoch": 2545} {"train_loss": -12.607351303100586, "global_step": 427632, "epoch": 2545} {"train_loss": -12.184961318969727, "global_step": 427633, "epoch": 2545} {"train_loss": -12.309932708740234, "global_step": 427634, "epoch": 2545} {"train_loss": -12.497079849243164, "global_step": 427635, "epoch": 2545} {"train_loss": -12.376110076904297, "global_step": 427636, "epoch": 2545} {"train_loss": -12.33582878112793, "global_step": 427637, "epoch": 2545} {"train_loss": -12.588558197021484, "global_step": 427638, "epoch": 2545} {"train_loss": -12.51587200164795, "global_step": 427639, "epoch": 2545} {"train_loss": -12.518009185791016, "global_step": 427640, "epoch": 2545} {"train_loss": -12.766528129577637, "global_step": 427641, "epoch": 2545} {"train_loss": -12.584329605102539, "global_step": 427642, "epoch": 2545} {"train_loss": -12.838294982910156, "global_step": 427643, "epoch": 2545} {"train_loss": -12.679852485656738, "global_step": 427644, "epoch": 2545} {"train_loss": -12.675859451293945, "global_step": 427645, "epoch": 2545} {"train_loss": -12.623924255371094, "global_step": 427646, "epoch": 2545} {"train_loss": -12.645158767700195, "global_step": 427647, "epoch": 2545} {"train_loss": -12.772212982177734, "global_step": 427648, "epoch": 2545} {"train_loss": -12.563716888427734, "global_step": 427649, "epoch": 2545} {"train_loss": -12.591066360473633, "global_step": 427650, "epoch": 2545} {"train_loss": -12.737691879272461, "global_step": 427651, "epoch": 2545} {"train_loss": -12.350399017333984, "global_step": 427652, "epoch": 2545} {"train_loss": -12.767757415771484, "global_step": 427653, "epoch": 2545} {"train_loss": -12.518624305725098, "global_step": 427654, "epoch": 2545} {"train_loss": -12.102215766906738, "global_step": 427655, "epoch": 2545} {"train_loss": -12.705632209777832, "global_step": 427656, "epoch": 2545} {"train_loss": -12.52230453491211, "global_step": 427657, "epoch": 2545} {"train_loss": -12.477252960205078, "global_step": 427658, "epoch": 2545} {"train_loss": -12.626944541931152, "global_step": 427659, "epoch": 2545} {"train_loss": -12.350757598876953, "global_step": 427660, "epoch": 2545} {"train_loss": -12.812976837158203, "global_step": 427661, "epoch": 2545} {"train_loss": -12.01167106628418, "global_step": 427662, "epoch": 2545} {"train_loss": -11.710870742797852, "global_step": 427663, "epoch": 2545} {"train_loss": -12.478175163269043, "global_step": 427664, "epoch": 2545} {"train_loss": -12.299236297607422, "global_step": 427665, "epoch": 2545} {"train_loss": -12.265064239501953, "global_step": 427666, "epoch": 2545} {"train_loss": -12.532224655151367, "global_step": 427667, "epoch": 2545} {"train_loss": -12.111794471740723, "global_step": 427668, "epoch": 2545} {"train_loss": -11.840620040893555, "global_step": 427669, "epoch": 2545} {"train_loss": -12.389331817626953, "global_step": 427670, "epoch": 2545} {"train_loss": -12.779745101928711, "global_step": 427671, "epoch": 2545} {"train_loss": -12.155843734741211, "global_step": 427672, "epoch": 2545} {"train_loss": -11.826031684875488, "global_step": 427673, "epoch": 2545} {"train_loss": -12.536687850952148, "global_step": 427674, "epoch": 2545} {"train_loss": -11.54405403137207, "global_step": 427675, "epoch": 2545} {"train_loss": -12.0786771774292, "global_step": 427676, "epoch": 2545} {"train_loss": -12.198015213012695, "global_step": 427677, "epoch": 2545} {"train_loss": -12.374250411987305, "global_step": 427678, "epoch": 2545} {"train_loss": -12.223470687866211, "global_step": 427679, "epoch": 2545} {"train_loss": -12.581833839416504, "global_step": 427680, "epoch": 2545} {"train_loss": -12.402320861816406, "global_step": 427681, "epoch": 2545} {"train_loss": -12.36141586303711, "global_step": 427682, "epoch": 2545} {"train_loss": -12.364542007446289, "global_step": 427683, "epoch": 2545} {"train_loss": -12.616132736206055, "global_step": 427684, "epoch": 2545} {"train_loss": -12.664949417114258, "global_step": 427685, "epoch": 2545} {"train_loss": -12.28626823425293, "global_step": 427686, "epoch": 2545} {"train_loss": -12.384744644165039, "global_step": 427687, "epoch": 2545} {"train_loss": -12.558283805847168, "global_step": 427688, "epoch": 2545} {"train_loss": -12.611486434936523, "global_step": 427689, "epoch": 2545} {"train_loss": -12.637948989868164, "global_step": 427690, "epoch": 2545} {"train_loss": -12.712371826171875, "global_step": 427691, "epoch": 2545} {"train_loss": -12.645513534545898, "global_step": 427692, "epoch": 2545} {"train_loss": -12.152790069580078, "global_step": 427693, "epoch": 2545} {"train_loss": -12.441560745239258, "global_step": 427694, "epoch": 2545} {"train_loss": -12.825682640075684, "global_step": 427695, "epoch": 2545} {"train_loss": -12.062715530395508, "global_step": 427696, "epoch": 2545} {"train_loss": -11.984560012817383, "global_step": 427697, "epoch": 2545} {"train_loss": -12.548055648803711, "global_step": 427698, "epoch": 2545} {"train_loss": -12.614358901977539, "global_step": 427699, "epoch": 2545} {"train_loss": -12.472776412963867, "global_step": 427700, "epoch": 2545} {"train_loss": -12.088006019592285, "global_step": 427701, "epoch": 2545} {"train_loss": -12.389249801635742, "global_step": 427702, "epoch": 2545} {"train_loss": -11.959465980529785, "global_step": 427703, "epoch": 2545} {"train_loss": -12.695379257202148, "global_step": 427704, "epoch": 2545} {"train_loss": -12.145245552062988, "global_step": 427705, "epoch": 2545} {"train_loss": -12.406597137451172, "global_step": 427706, "epoch": 2545} {"train_loss": -12.172845840454102, "global_step": 427707, "epoch": 2545} {"train_loss": -12.022321701049805, "global_step": 427708, "epoch": 2545} {"train_loss": -12.634371757507324, "global_step": 427709, "epoch": 2545} {"train_loss": -12.358959197998047, "global_step": 427710, "epoch": 2545} {"train_loss": -12.153173446655273, "global_step": 427711, "epoch": 2545} {"train_loss": -12.535969734191895, "global_step": 427712, "epoch": 2545} {"train_loss": -12.644693374633789, "global_step": 427713, "epoch": 2545} {"train_loss": -12.006237030029297, "global_step": 427714, "epoch": 2545} {"train_loss": -12.280130386352539, "global_step": 427715, "epoch": 2545} {"train_loss": -12.731985092163086, "global_step": 427716, "epoch": 2545} {"train_loss": -12.537175178527832, "global_step": 427717, "epoch": 2545} {"train_loss": -12.665163040161133, "global_step": 427718, "epoch": 2545} {"train_loss": -12.760751724243164, "global_step": 427719, "epoch": 2545} {"train_loss": -12.799089431762695, "global_step": 427720, "epoch": 2545} {"train_loss": -12.504236221313477, "global_step": 427721, "epoch": 2545} {"train_loss": -12.872028350830078, "global_step": 427722, "epoch": 2545} {"train_loss": -12.873442649841309, "global_step": 427723, "epoch": 2545} {"train_loss": -12.995684623718262, "global_step": 427724, "epoch": 2545} {"train_loss": -12.71757984161377, "global_step": 427725, "epoch": 2545} {"train_loss": -12.452688217163086, "global_step": 427726, "epoch": 2545} {"train_loss": -12.28966736793518, "global_step": 427727, "epoch": 2545, "val_loss": 306516.03125, "train_action_mse_error": 1.3296340703964233} {"train_loss": -12.220709800720215, "global_step": 427728, "epoch": 2546} {"train_loss": -12.726236343383789, "global_step": 427729, "epoch": 2546} {"train_loss": -12.093505859375, "global_step": 427730, "epoch": 2546} {"train_loss": -12.374520301818848, "global_step": 427731, "epoch": 2546} {"train_loss": -12.544168472290039, "global_step": 427732, "epoch": 2546} {"train_loss": -12.439689636230469, "global_step": 427733, "epoch": 2546} {"train_loss": -12.203597068786621, "global_step": 427734, "epoch": 2546} {"train_loss": -12.330151557922363, "global_step": 427735, "epoch": 2546} {"train_loss": -12.561357498168945, "global_step": 427736, "epoch": 2546} {"train_loss": -12.662370681762695, "global_step": 427737, "epoch": 2546} {"train_loss": -12.189865112304688, "global_step": 427738, "epoch": 2546} {"train_loss": -12.281038284301758, "global_step": 427739, "epoch": 2546} {"train_loss": -12.887310981750488, "global_step": 427740, "epoch": 2546} {"train_loss": -12.772477149963379, "global_step": 427741, "epoch": 2546} {"train_loss": -12.539207458496094, "global_step": 427742, "epoch": 2546} {"train_loss": -12.552550315856934, "global_step": 427743, "epoch": 2546} {"train_loss": -12.96895980834961, "global_step": 427744, "epoch": 2546} {"train_loss": -12.651634216308594, "global_step": 427745, "epoch": 2546} {"train_loss": -12.619030952453613, "global_step": 427746, "epoch": 2546} {"train_loss": -12.477574348449707, "global_step": 427747, "epoch": 2546} {"train_loss": -12.762481689453125, "global_step": 427748, "epoch": 2546} {"train_loss": -12.183632850646973, "global_step": 427749, "epoch": 2546} {"train_loss": -12.385225296020508, "global_step": 427750, "epoch": 2546} {"train_loss": -12.503228187561035, "global_step": 427751, "epoch": 2546} {"train_loss": -11.593206405639648, "global_step": 427752, "epoch": 2546} {"train_loss": -11.857452392578125, "global_step": 427753, "epoch": 2546} {"train_loss": -12.379030227661133, "global_step": 427754, "epoch": 2546} {"train_loss": -12.489089965820312, "global_step": 427755, "epoch": 2546} {"train_loss": -12.555803298950195, "global_step": 427756, "epoch": 2546} {"train_loss": -12.555604934692383, "global_step": 427757, "epoch": 2546} {"train_loss": -12.540237426757812, "global_step": 427758, "epoch": 2546} {"train_loss": -12.143980979919434, "global_step": 427759, "epoch": 2546} {"train_loss": -12.73967170715332, "global_step": 427760, "epoch": 2546} {"train_loss": -12.208858489990234, "global_step": 427761, "epoch": 2546} {"train_loss": -12.514900207519531, "global_step": 427762, "epoch": 2546} {"train_loss": -12.112229347229004, "global_step": 427763, "epoch": 2546} {"train_loss": -12.116931915283203, "global_step": 427764, "epoch": 2546} {"train_loss": -12.422876358032227, "global_step": 427765, "epoch": 2546} {"train_loss": -12.09222412109375, "global_step": 427766, "epoch": 2546} {"train_loss": -11.800300598144531, "global_step": 427767, "epoch": 2546} {"train_loss": -11.5903959274292, "global_step": 427768, "epoch": 2546} {"train_loss": -11.890775680541992, "global_step": 427769, "epoch": 2546} {"train_loss": -11.656009674072266, "global_step": 427770, "epoch": 2546} {"train_loss": -10.711427688598633, "global_step": 427771, "epoch": 2546} {"train_loss": -10.745402336120605, "global_step": 427772, "epoch": 2546} {"train_loss": -12.388696670532227, "global_step": 427773, "epoch": 2546} {"train_loss": -11.67517375946045, "global_step": 427774, "epoch": 2546} {"train_loss": -11.270919799804688, "global_step": 427775, "epoch": 2546} {"train_loss": -12.059062957763672, "global_step": 427776, "epoch": 2546} {"train_loss": -12.235832214355469, "global_step": 427777, "epoch": 2546} {"train_loss": -11.657737731933594, "global_step": 427778, "epoch": 2546} {"train_loss": -12.121160507202148, "global_step": 427779, "epoch": 2546} {"train_loss": -11.951438903808594, "global_step": 427780, "epoch": 2546} {"train_loss": -11.234121322631836, "global_step": 427781, "epoch": 2546} {"train_loss": -12.026244163513184, "global_step": 427782, "epoch": 2546} {"train_loss": -10.519598960876465, "global_step": 427783, "epoch": 2546} {"train_loss": -12.362135887145996, "global_step": 427784, "epoch": 2546} {"train_loss": -10.500839233398438, "global_step": 427785, "epoch": 2546} {"train_loss": -11.772651672363281, "global_step": 427786, "epoch": 2546} {"train_loss": -10.718657493591309, "global_step": 427787, "epoch": 2546} {"train_loss": -11.330766677856445, "global_step": 427788, "epoch": 2546} {"train_loss": -11.438898086547852, "global_step": 427789, "epoch": 2546} {"train_loss": -10.518638610839844, "global_step": 427790, "epoch": 2546} {"train_loss": -12.115172386169434, "global_step": 427791, "epoch": 2546} {"train_loss": -10.382587432861328, "global_step": 427792, "epoch": 2546} {"train_loss": -11.463046073913574, "global_step": 427793, "epoch": 2546} {"train_loss": -11.118949890136719, "global_step": 427794, "epoch": 2546} {"train_loss": -11.285627365112305, "global_step": 427795, "epoch": 2546} {"train_loss": -11.269194602966309, "global_step": 427796, "epoch": 2546} {"train_loss": -10.317401885986328, "global_step": 427797, "epoch": 2546} {"train_loss": -12.327123641967773, "global_step": 427798, "epoch": 2546} {"train_loss": -10.391892433166504, "global_step": 427799, "epoch": 2546} {"train_loss": -11.603217124938965, "global_step": 427800, "epoch": 2546} {"train_loss": -9.981714248657227, "global_step": 427801, "epoch": 2546} {"train_loss": -11.754063606262207, "global_step": 427802, "epoch": 2546} {"train_loss": -11.039339065551758, "global_step": 427803, "epoch": 2546} {"train_loss": -11.615765571594238, "global_step": 427804, "epoch": 2546} {"train_loss": -11.266788482666016, "global_step": 427805, "epoch": 2546} {"train_loss": -11.08791446685791, "global_step": 427806, "epoch": 2546} {"train_loss": -11.867846488952637, "global_step": 427807, "epoch": 2546} {"train_loss": -11.490152359008789, "global_step": 427808, "epoch": 2546} {"train_loss": -11.88056755065918, "global_step": 427809, "epoch": 2546} {"train_loss": -11.719378471374512, "global_step": 427810, "epoch": 2546} {"train_loss": -11.935226440429688, "global_step": 427811, "epoch": 2546} {"train_loss": -11.55203628540039, "global_step": 427812, "epoch": 2546} {"train_loss": -11.87083625793457, "global_step": 427813, "epoch": 2546} {"train_loss": -11.111934661865234, "global_step": 427814, "epoch": 2546} {"train_loss": -11.310823440551758, "global_step": 427815, "epoch": 2546} {"train_loss": -11.667003631591797, "global_step": 427816, "epoch": 2546} {"train_loss": -11.570115089416504, "global_step": 427817, "epoch": 2546} {"train_loss": -11.864654541015625, "global_step": 427818, "epoch": 2546} {"train_loss": -11.435075759887695, "global_step": 427819, "epoch": 2546} {"train_loss": -11.852051734924316, "global_step": 427820, "epoch": 2546} {"train_loss": -11.99887466430664, "global_step": 427821, "epoch": 2546} {"train_loss": -12.012450218200684, "global_step": 427822, "epoch": 2546} {"train_loss": -11.772964477539062, "global_step": 427823, "epoch": 2546} {"train_loss": -12.438663482666016, "global_step": 427824, "epoch": 2546} {"train_loss": -12.065345764160156, "global_step": 427825, "epoch": 2546} {"train_loss": -12.370030403137207, "global_step": 427826, "epoch": 2546} {"train_loss": -12.246044158935547, "global_step": 427827, "epoch": 2546} {"train_loss": -11.981512069702148, "global_step": 427828, "epoch": 2546} {"train_loss": -12.387812614440918, "global_step": 427829, "epoch": 2546} {"train_loss": -11.984479904174805, "global_step": 427830, "epoch": 2546} {"train_loss": -12.094659805297852, "global_step": 427831, "epoch": 2546} {"train_loss": -12.007692337036133, "global_step": 427832, "epoch": 2546} {"train_loss": -12.145496368408203, "global_step": 427833, "epoch": 2546} {"train_loss": -12.247636795043945, "global_step": 427834, "epoch": 2546} {"train_loss": -12.153593063354492, "global_step": 427835, "epoch": 2546} {"train_loss": -12.42534065246582, "global_step": 427836, "epoch": 2546} {"train_loss": -12.20400619506836, "global_step": 427837, "epoch": 2546} {"train_loss": -12.019183158874512, "global_step": 427838, "epoch": 2546} {"train_loss": -12.05829906463623, "global_step": 427839, "epoch": 2546} {"train_loss": -12.380691528320312, "global_step": 427840, "epoch": 2546} {"train_loss": -12.535554885864258, "global_step": 427841, "epoch": 2546} {"train_loss": -12.56800365447998, "global_step": 427842, "epoch": 2546} {"train_loss": -12.456687927246094, "global_step": 427843, "epoch": 2546} {"train_loss": -12.517370223999023, "global_step": 427844, "epoch": 2546} {"train_loss": -12.354366302490234, "global_step": 427845, "epoch": 2546} {"train_loss": -12.570564270019531, "global_step": 427846, "epoch": 2546} {"train_loss": -12.442205429077148, "global_step": 427847, "epoch": 2546} {"train_loss": -12.614705085754395, "global_step": 427848, "epoch": 2546} {"train_loss": -12.66489028930664, "global_step": 427849, "epoch": 2546} {"train_loss": -12.480386734008789, "global_step": 427850, "epoch": 2546} {"train_loss": -12.55077075958252, "global_step": 427851, "epoch": 2546} {"train_loss": -12.646018981933594, "global_step": 427852, "epoch": 2546} {"train_loss": -12.472282409667969, "global_step": 427853, "epoch": 2546} {"train_loss": -12.538891792297363, "global_step": 427854, "epoch": 2546} {"train_loss": -12.606647491455078, "global_step": 427855, "epoch": 2546} {"train_loss": -12.46566104888916, "global_step": 427856, "epoch": 2546} {"train_loss": -12.571651458740234, "global_step": 427857, "epoch": 2546} {"train_loss": -12.224270820617676, "global_step": 427858, "epoch": 2546} {"train_loss": -12.552032470703125, "global_step": 427859, "epoch": 2546} {"train_loss": -12.177728652954102, "global_step": 427860, "epoch": 2546} {"train_loss": -12.647425651550293, "global_step": 427861, "epoch": 2546} {"train_loss": -12.42668342590332, "global_step": 427862, "epoch": 2546} {"train_loss": -12.390628814697266, "global_step": 427863, "epoch": 2546} {"train_loss": -12.774085998535156, "global_step": 427864, "epoch": 2546} {"train_loss": -12.303306579589844, "global_step": 427865, "epoch": 2546} {"train_loss": -12.687275886535645, "global_step": 427866, "epoch": 2546} {"train_loss": -12.36077880859375, "global_step": 427867, "epoch": 2546} {"train_loss": -12.726612091064453, "global_step": 427868, "epoch": 2546} {"train_loss": -12.264326095581055, "global_step": 427869, "epoch": 2546} {"train_loss": -12.698671340942383, "global_step": 427870, "epoch": 2546} {"train_loss": -12.415724754333496, "global_step": 427871, "epoch": 2546} {"train_loss": -12.46897029876709, "global_step": 427872, "epoch": 2546} {"train_loss": -12.156265258789062, "global_step": 427873, "epoch": 2546} {"train_loss": -12.515641212463379, "global_step": 427874, "epoch": 2546} {"train_loss": -12.277971267700195, "global_step": 427875, "epoch": 2546} {"train_loss": -12.566034317016602, "global_step": 427876, "epoch": 2546} {"train_loss": -12.423736572265625, "global_step": 427877, "epoch": 2546} {"train_loss": -12.545825004577637, "global_step": 427878, "epoch": 2546} {"train_loss": -12.583436012268066, "global_step": 427879, "epoch": 2546} {"train_loss": -12.549952507019043, "global_step": 427880, "epoch": 2546} {"train_loss": -12.778877258300781, "global_step": 427881, "epoch": 2546} {"train_loss": -12.613822937011719, "global_step": 427882, "epoch": 2546} {"train_loss": -12.59184455871582, "global_step": 427883, "epoch": 2546} {"train_loss": -12.359858512878418, "global_step": 427884, "epoch": 2546} {"train_loss": -12.652721405029297, "global_step": 427885, "epoch": 2546} {"train_loss": -12.616937637329102, "global_step": 427886, "epoch": 2546} {"train_loss": -12.824529647827148, "global_step": 427887, "epoch": 2546} {"train_loss": -12.89371109008789, "global_step": 427888, "epoch": 2546} {"train_loss": -12.34449577331543, "global_step": 427889, "epoch": 2546} {"train_loss": -12.63387393951416, "global_step": 427890, "epoch": 2546} {"train_loss": -12.520216941833496, "global_step": 427891, "epoch": 2546} {"train_loss": -12.687522888183594, "global_step": 427892, "epoch": 2546} {"train_loss": -12.441883087158203, "global_step": 427893, "epoch": 2546} {"train_loss": -12.634053230285645, "global_step": 427894, "epoch": 2546} {"train_loss": -12.11218077795846, "global_step": 427895, "epoch": 2546, "val_loss": 307521.9375} {"train_loss": -12.552806854248047, "global_step": 427896, "epoch": 2547} {"train_loss": -12.753034591674805, "global_step": 427897, "epoch": 2547} {"train_loss": -12.89194107055664, "global_step": 427898, "epoch": 2547} {"train_loss": -12.56449031829834, "global_step": 427899, "epoch": 2547} {"train_loss": -11.9974946975708, "global_step": 427900, "epoch": 2547} {"train_loss": -12.407674789428711, "global_step": 427901, "epoch": 2547} {"train_loss": -12.377340316772461, "global_step": 427902, "epoch": 2547} {"train_loss": -12.33096981048584, "global_step": 427903, "epoch": 2547} {"train_loss": -12.363929748535156, "global_step": 427904, "epoch": 2547} {"train_loss": -12.261116981506348, "global_step": 427905, "epoch": 2547} {"train_loss": -12.519207000732422, "global_step": 427906, "epoch": 2547} {"train_loss": -12.423471450805664, "global_step": 427907, "epoch": 2547} {"train_loss": -12.260560035705566, "global_step": 427908, "epoch": 2547} {"train_loss": -12.578866958618164, "global_step": 427909, "epoch": 2547} {"train_loss": -12.844917297363281, "global_step": 427910, "epoch": 2547} {"train_loss": -12.526012420654297, "global_step": 427911, "epoch": 2547} {"train_loss": -13.036954879760742, "global_step": 427912, "epoch": 2547} {"train_loss": -12.830867767333984, "global_step": 427913, "epoch": 2547} {"train_loss": -12.88564395904541, "global_step": 427914, "epoch": 2547} {"train_loss": -12.654510498046875, "global_step": 427915, "epoch": 2547} {"train_loss": -12.579730033874512, "global_step": 427916, "epoch": 2547} {"train_loss": -12.899001121520996, "global_step": 427917, "epoch": 2547} {"train_loss": -12.53111457824707, "global_step": 427918, "epoch": 2547} {"train_loss": -12.652884483337402, "global_step": 427919, "epoch": 2547} {"train_loss": -12.754749298095703, "global_step": 427920, "epoch": 2547} {"train_loss": -12.52161979675293, "global_step": 427921, "epoch": 2547} {"train_loss": -11.633885383605957, "global_step": 427922, "epoch": 2547} {"train_loss": -11.438365936279297, "global_step": 427923, "epoch": 2547} {"train_loss": -11.898452758789062, "global_step": 427924, "epoch": 2547} {"train_loss": -11.243215560913086, "global_step": 427925, "epoch": 2547} {"train_loss": -10.73127269744873, "global_step": 427926, "epoch": 2547} {"train_loss": -12.11823558807373, "global_step": 427927, "epoch": 2547} {"train_loss": -11.670804023742676, "global_step": 427928, "epoch": 2547} {"train_loss": -9.962939262390137, "global_step": 427929, "epoch": 2547} {"train_loss": -11.875516891479492, "global_step": 427930, "epoch": 2547} {"train_loss": -9.480378150939941, "global_step": 427931, "epoch": 2547} {"train_loss": -9.605701446533203, "global_step": 427932, "epoch": 2547} {"train_loss": -9.903229713439941, "global_step": 427933, "epoch": 2547} {"train_loss": -10.352855682373047, "global_step": 427934, "epoch": 2547} {"train_loss": -10.541783332824707, "global_step": 427935, "epoch": 2547} {"train_loss": -10.627985954284668, "global_step": 427936, "epoch": 2547} {"train_loss": -9.035541534423828, "global_step": 427937, "epoch": 2547} {"train_loss": -10.116161346435547, "global_step": 427938, "epoch": 2547} {"train_loss": -11.05601692199707, "global_step": 427939, "epoch": 2547} {"train_loss": -10.07482624053955, "global_step": 427940, "epoch": 2547} {"train_loss": -10.14356803894043, "global_step": 427941, "epoch": 2547} {"train_loss": -10.624724388122559, "global_step": 427942, "epoch": 2547} {"train_loss": -10.853925704956055, "global_step": 427943, "epoch": 2547} {"train_loss": -10.809409141540527, "global_step": 427944, "epoch": 2547} {"train_loss": -9.609977722167969, "global_step": 427945, "epoch": 2547} {"train_loss": -11.795467376708984, "global_step": 427946, "epoch": 2547} {"train_loss": -10.628350257873535, "global_step": 427947, "epoch": 2547} {"train_loss": -11.453607559204102, "global_step": 427948, "epoch": 2547} {"train_loss": -10.482378959655762, "global_step": 427949, "epoch": 2547} {"train_loss": -11.779600143432617, "global_step": 427950, "epoch": 2547} {"train_loss": -10.506675720214844, "global_step": 427951, "epoch": 2547} {"train_loss": -11.791633605957031, "global_step": 427952, "epoch": 2547} {"train_loss": -11.596139907836914, "global_step": 427953, "epoch": 2547} {"train_loss": -10.971564292907715, "global_step": 427954, "epoch": 2547} {"train_loss": -11.817403793334961, "global_step": 427955, "epoch": 2547} {"train_loss": -11.475741386413574, "global_step": 427956, "epoch": 2547} {"train_loss": -11.002706527709961, "global_step": 427957, "epoch": 2547} {"train_loss": -11.981289863586426, "global_step": 427958, "epoch": 2547} {"train_loss": -10.732352256774902, "global_step": 427959, "epoch": 2547} {"train_loss": -11.170063018798828, "global_step": 427960, "epoch": 2547} {"train_loss": -11.605474472045898, "global_step": 427961, "epoch": 2547} {"train_loss": -11.22584056854248, "global_step": 427962, "epoch": 2547} {"train_loss": -11.450899124145508, "global_step": 427963, "epoch": 2547} {"train_loss": -10.97797966003418, "global_step": 427964, "epoch": 2547} {"train_loss": -11.453473091125488, "global_step": 427965, "epoch": 2547} {"train_loss": -11.637449264526367, "global_step": 427966, "epoch": 2547} {"train_loss": -11.773163795471191, "global_step": 427967, "epoch": 2547} {"train_loss": -11.510994911193848, "global_step": 427968, "epoch": 2547} {"train_loss": -11.212336540222168, "global_step": 427969, "epoch": 2547} {"train_loss": -11.426332473754883, "global_step": 427970, "epoch": 2547} {"train_loss": -10.639202117919922, "global_step": 427971, "epoch": 2547} {"train_loss": -12.00985336303711, "global_step": 427972, "epoch": 2547} {"train_loss": -10.797548294067383, "global_step": 427973, "epoch": 2547} {"train_loss": -11.99441146850586, "global_step": 427974, "epoch": 2547} {"train_loss": -11.339832305908203, "global_step": 427975, "epoch": 2547} {"train_loss": -11.359634399414062, "global_step": 427976, "epoch": 2547} {"train_loss": -11.888049125671387, "global_step": 427977, "epoch": 2547} {"train_loss": -11.426334381103516, "global_step": 427978, "epoch": 2547} {"train_loss": -11.377893447875977, "global_step": 427979, "epoch": 2547} {"train_loss": -12.008188247680664, "global_step": 427980, "epoch": 2547} {"train_loss": -11.703455924987793, "global_step": 427981, "epoch": 2547} {"train_loss": -11.195801734924316, "global_step": 427982, "epoch": 2547} {"train_loss": -12.11229133605957, "global_step": 427983, "epoch": 2547} {"train_loss": -10.946372032165527, "global_step": 427984, "epoch": 2547} {"train_loss": -11.886625289916992, "global_step": 427985, "epoch": 2547} {"train_loss": -11.720855712890625, "global_step": 427986, "epoch": 2547} {"train_loss": -11.661428451538086, "global_step": 427987, "epoch": 2547} {"train_loss": -11.85986042022705, "global_step": 427988, "epoch": 2547} {"train_loss": -11.605072975158691, "global_step": 427989, "epoch": 2547} {"train_loss": -11.739198684692383, "global_step": 427990, "epoch": 2547} {"train_loss": -11.826074600219727, "global_step": 427991, "epoch": 2547} {"train_loss": -11.702812194824219, "global_step": 427992, "epoch": 2547} {"train_loss": -11.677507400512695, "global_step": 427993, "epoch": 2547} {"train_loss": -12.10649299621582, "global_step": 427994, "epoch": 2547} {"train_loss": -11.36142635345459, "global_step": 427995, "epoch": 2547} {"train_loss": -12.1950101852417, "global_step": 427996, "epoch": 2547} {"train_loss": -11.769393920898438, "global_step": 427997, "epoch": 2547} {"train_loss": -11.75428581237793, "global_step": 427998, "epoch": 2547} {"train_loss": -12.308113098144531, "global_step": 427999, "epoch": 2547} {"train_loss": -11.816417694091797, "global_step": 428000, "epoch": 2547} {"train_loss": -12.276822090148926, "global_step": 428001, "epoch": 2547} {"train_loss": -11.892599105834961, "global_step": 428002, "epoch": 2547} {"train_loss": -12.304767608642578, "global_step": 428003, "epoch": 2547} {"train_loss": -12.092802047729492, "global_step": 428004, "epoch": 2547} {"train_loss": -12.247604370117188, "global_step": 428005, "epoch": 2547} {"train_loss": -12.170980453491211, "global_step": 428006, "epoch": 2547} {"train_loss": -12.143375396728516, "global_step": 428007, "epoch": 2547} {"train_loss": -12.23538589477539, "global_step": 428008, "epoch": 2547} {"train_loss": -12.275016784667969, "global_step": 428009, "epoch": 2547} {"train_loss": -12.261225700378418, "global_step": 428010, "epoch": 2547} {"train_loss": -12.482745170593262, "global_step": 428011, "epoch": 2547} {"train_loss": -11.944404602050781, "global_step": 428012, "epoch": 2547} {"train_loss": -12.263772964477539, "global_step": 428013, "epoch": 2547} {"train_loss": -12.249994277954102, "global_step": 428014, "epoch": 2547} {"train_loss": -12.418987274169922, "global_step": 428015, "epoch": 2547} {"train_loss": -12.324457168579102, "global_step": 428016, "epoch": 2547} {"train_loss": -12.232416152954102, "global_step": 428017, "epoch": 2547} {"train_loss": -12.017023086547852, "global_step": 428018, "epoch": 2547} {"train_loss": -12.143241882324219, "global_step": 428019, "epoch": 2547} {"train_loss": -12.326668739318848, "global_step": 428020, "epoch": 2547} {"train_loss": -12.316776275634766, "global_step": 428021, "epoch": 2547} {"train_loss": -12.048494338989258, "global_step": 428022, "epoch": 2547} {"train_loss": -12.550233840942383, "global_step": 428023, "epoch": 2547} {"train_loss": -12.069755554199219, "global_step": 428024, "epoch": 2547} {"train_loss": -12.24990463256836, "global_step": 428025, "epoch": 2547} {"train_loss": -12.404500961303711, "global_step": 428026, "epoch": 2547} {"train_loss": -12.254390716552734, "global_step": 428027, "epoch": 2547} {"train_loss": -12.478485107421875, "global_step": 428028, "epoch": 2547} {"train_loss": -12.270331382751465, "global_step": 428029, "epoch": 2547} {"train_loss": -12.030587196350098, "global_step": 428030, "epoch": 2547} {"train_loss": -11.984596252441406, "global_step": 428031, "epoch": 2547} {"train_loss": -11.998069763183594, "global_step": 428032, "epoch": 2547} {"train_loss": -12.289848327636719, "global_step": 428033, "epoch": 2547} {"train_loss": -12.156383514404297, "global_step": 428034, "epoch": 2547} {"train_loss": -12.395523071289062, "global_step": 428035, "epoch": 2547} {"train_loss": -12.070880889892578, "global_step": 428036, "epoch": 2547} {"train_loss": -11.92753791809082, "global_step": 428037, "epoch": 2547} {"train_loss": -12.091773986816406, "global_step": 428038, "epoch": 2547} {"train_loss": -11.958096504211426, "global_step": 428039, "epoch": 2547} {"train_loss": -12.507596015930176, "global_step": 428040, "epoch": 2547} {"train_loss": -11.628059387207031, "global_step": 428041, "epoch": 2547} {"train_loss": -12.215973854064941, "global_step": 428042, "epoch": 2547} {"train_loss": -12.374550819396973, "global_step": 428043, "epoch": 2547} {"train_loss": -12.580926895141602, "global_step": 428044, "epoch": 2547} {"train_loss": -12.369797706604004, "global_step": 428045, "epoch": 2547} {"train_loss": -12.064842224121094, "global_step": 428046, "epoch": 2547} {"train_loss": -12.456656455993652, "global_step": 428047, "epoch": 2547} {"train_loss": -12.307097434997559, "global_step": 428048, "epoch": 2547} {"train_loss": -12.33706283569336, "global_step": 428049, "epoch": 2547} {"train_loss": -12.56308650970459, "global_step": 428050, "epoch": 2547} {"train_loss": -12.1664400100708, "global_step": 428051, "epoch": 2547} {"train_loss": -12.645878791809082, "global_step": 428052, "epoch": 2547} {"train_loss": -12.193132400512695, "global_step": 428053, "epoch": 2547} {"train_loss": -12.354324340820312, "global_step": 428054, "epoch": 2547} {"train_loss": -12.30866813659668, "global_step": 428055, "epoch": 2547} {"train_loss": -12.204965591430664, "global_step": 428056, "epoch": 2547} {"train_loss": -12.501023292541504, "global_step": 428057, "epoch": 2547} {"train_loss": -12.37144947052002, "global_step": 428058, "epoch": 2547} {"train_loss": -12.101953506469727, "global_step": 428059, "epoch": 2547} {"train_loss": -12.500293731689453, "global_step": 428060, "epoch": 2547} {"train_loss": -11.853080749511719, "global_step": 428061, "epoch": 2547} {"train_loss": -12.136762619018555, "global_step": 428062, "epoch": 2547} {"train_loss": -11.822163842973255, "global_step": 428063, "epoch": 2547, "val_loss": 307339.375} {"train_loss": -11.527580261230469, "global_step": 428064, "epoch": 2548} {"train_loss": -11.739595413208008, "global_step": 428065, "epoch": 2548} {"train_loss": -11.11683177947998, "global_step": 428066, "epoch": 2548} {"train_loss": -11.365837097167969, "global_step": 428067, "epoch": 2548} {"train_loss": -12.085653305053711, "global_step": 428068, "epoch": 2548} {"train_loss": -10.295979499816895, "global_step": 428069, "epoch": 2548} {"train_loss": -12.37569808959961, "global_step": 428070, "epoch": 2548} {"train_loss": -11.487743377685547, "global_step": 428071, "epoch": 2548} {"train_loss": -12.305195808410645, "global_step": 428072, "epoch": 2548} {"train_loss": -12.001788139343262, "global_step": 428073, "epoch": 2548} {"train_loss": -11.637125015258789, "global_step": 428074, "epoch": 2548} {"train_loss": -12.264877319335938, "global_step": 428075, "epoch": 2548} {"train_loss": -11.874223709106445, "global_step": 428076, "epoch": 2548} {"train_loss": -12.027177810668945, "global_step": 428077, "epoch": 2548} {"train_loss": -12.147125244140625, "global_step": 428078, "epoch": 2548} {"train_loss": -11.826935768127441, "global_step": 428079, "epoch": 2548} {"train_loss": -12.283125877380371, "global_step": 428080, "epoch": 2548} {"train_loss": -12.350956916809082, "global_step": 428081, "epoch": 2548} {"train_loss": -12.24170970916748, "global_step": 428082, "epoch": 2548} {"train_loss": -11.93110466003418, "global_step": 428083, "epoch": 2548} {"train_loss": -12.058904647827148, "global_step": 428084, "epoch": 2548} {"train_loss": -12.223875045776367, "global_step": 428085, "epoch": 2548} {"train_loss": -11.644932746887207, "global_step": 428086, "epoch": 2548} {"train_loss": -12.542275428771973, "global_step": 428087, "epoch": 2548} {"train_loss": -12.02944564819336, "global_step": 428088, "epoch": 2548} {"train_loss": -12.712991714477539, "global_step": 428089, "epoch": 2548} {"train_loss": -12.343249320983887, "global_step": 428090, "epoch": 2548} {"train_loss": -12.463401794433594, "global_step": 428091, "epoch": 2548} {"train_loss": -12.31258487701416, "global_step": 428092, "epoch": 2548} {"train_loss": -12.387110710144043, "global_step": 428093, "epoch": 2548} {"train_loss": -12.503517150878906, "global_step": 428094, "epoch": 2548} {"train_loss": -12.084537506103516, "global_step": 428095, "epoch": 2548} {"train_loss": -12.395461082458496, "global_step": 428096, "epoch": 2548} {"train_loss": -12.463224411010742, "global_step": 428097, "epoch": 2548} {"train_loss": -12.562238693237305, "global_step": 428098, "epoch": 2548} {"train_loss": -12.376006126403809, "global_step": 428099, "epoch": 2548} {"train_loss": -12.640874862670898, "global_step": 428100, "epoch": 2548} {"train_loss": -12.49984359741211, "global_step": 428101, "epoch": 2548} {"train_loss": -12.515963554382324, "global_step": 428102, "epoch": 2548} {"train_loss": -12.6058349609375, "global_step": 428103, "epoch": 2548} {"train_loss": -12.653742790222168, "global_step": 428104, "epoch": 2548} {"train_loss": -12.8206787109375, "global_step": 428105, "epoch": 2548} {"train_loss": -12.751506805419922, "global_step": 428106, "epoch": 2548} {"train_loss": -12.643790245056152, "global_step": 428107, "epoch": 2548} {"train_loss": -12.636177062988281, "global_step": 428108, "epoch": 2548} {"train_loss": -12.737210273742676, "global_step": 428109, "epoch": 2548} {"train_loss": -12.494997024536133, "global_step": 428110, "epoch": 2548} {"train_loss": -12.830117225646973, "global_step": 428111, "epoch": 2548} {"train_loss": -12.787117004394531, "global_step": 428112, "epoch": 2548} {"train_loss": -12.685317039489746, "global_step": 428113, "epoch": 2548} {"train_loss": -12.757316589355469, "global_step": 428114, "epoch": 2548} {"train_loss": -12.655160903930664, "global_step": 428115, "epoch": 2548} {"train_loss": -12.814376831054688, "global_step": 428116, "epoch": 2548} {"train_loss": -12.7681884765625, "global_step": 428117, "epoch": 2548} {"train_loss": -12.725574493408203, "global_step": 428118, "epoch": 2548} {"train_loss": -12.691703796386719, "global_step": 428119, "epoch": 2548} {"train_loss": -12.649120330810547, "global_step": 428120, "epoch": 2548} {"train_loss": -12.614511489868164, "global_step": 428121, "epoch": 2548} {"train_loss": -12.698392868041992, "global_step": 428122, "epoch": 2548} {"train_loss": -12.6341552734375, "global_step": 428123, "epoch": 2548} {"train_loss": -12.727347373962402, "global_step": 428124, "epoch": 2548} {"train_loss": -12.720514297485352, "global_step": 428125, "epoch": 2548} {"train_loss": -12.572879791259766, "global_step": 428126, "epoch": 2548} {"train_loss": -12.680839538574219, "global_step": 428127, "epoch": 2548} {"train_loss": -12.492033004760742, "global_step": 428128, "epoch": 2548} {"train_loss": -12.444198608398438, "global_step": 428129, "epoch": 2548} {"train_loss": -12.683062553405762, "global_step": 428130, "epoch": 2548} {"train_loss": -12.472993850708008, "global_step": 428131, "epoch": 2548} {"train_loss": -12.350545883178711, "global_step": 428132, "epoch": 2548} {"train_loss": -11.746360778808594, "global_step": 428133, "epoch": 2548} {"train_loss": -12.537909507751465, "global_step": 428134, "epoch": 2548} {"train_loss": -11.638321876525879, "global_step": 428135, "epoch": 2548} {"train_loss": -12.51186466217041, "global_step": 428136, "epoch": 2548} {"train_loss": -12.218340873718262, "global_step": 428137, "epoch": 2548} {"train_loss": -12.490130424499512, "global_step": 428138, "epoch": 2548} {"train_loss": -12.5071382522583, "global_step": 428139, "epoch": 2548} {"train_loss": -12.198465347290039, "global_step": 428140, "epoch": 2548} {"train_loss": -12.48513412475586, "global_step": 428141, "epoch": 2548} {"train_loss": -12.242778778076172, "global_step": 428142, "epoch": 2548} {"train_loss": -12.10195541381836, "global_step": 428143, "epoch": 2548} {"train_loss": -12.235495567321777, "global_step": 428144, "epoch": 2548} {"train_loss": -12.170931816101074, "global_step": 428145, "epoch": 2548} {"train_loss": -12.064794540405273, "global_step": 428146, "epoch": 2548} {"train_loss": -11.301166534423828, "global_step": 428147, "epoch": 2548} {"train_loss": -11.453680038452148, "global_step": 428148, "epoch": 2548} {"train_loss": -12.076040267944336, "global_step": 428149, "epoch": 2548} {"train_loss": -10.847882270812988, "global_step": 428150, "epoch": 2548} {"train_loss": -11.536087989807129, "global_step": 428151, "epoch": 2548} {"train_loss": -11.774710655212402, "global_step": 428152, "epoch": 2548} {"train_loss": -12.130704879760742, "global_step": 428153, "epoch": 2548} {"train_loss": -11.391775131225586, "global_step": 428154, "epoch": 2548} {"train_loss": -12.556329727172852, "global_step": 428155, "epoch": 2548} {"train_loss": -10.746026992797852, "global_step": 428156, "epoch": 2548} {"train_loss": -11.725627899169922, "global_step": 428157, "epoch": 2548} {"train_loss": -11.79733943939209, "global_step": 428158, "epoch": 2548} {"train_loss": -11.527615547180176, "global_step": 428159, "epoch": 2548} {"train_loss": -12.001684188842773, "global_step": 428160, "epoch": 2548} {"train_loss": -11.389613151550293, "global_step": 428161, "epoch": 2548} {"train_loss": -12.391080856323242, "global_step": 428162, "epoch": 2548} {"train_loss": -11.995403289794922, "global_step": 428163, "epoch": 2548} {"train_loss": -12.519787788391113, "global_step": 428164, "epoch": 2548} {"train_loss": -11.905932426452637, "global_step": 428165, "epoch": 2548} {"train_loss": -12.19696044921875, "global_step": 428166, "epoch": 2548} {"train_loss": -12.233148574829102, "global_step": 428167, "epoch": 2548} {"train_loss": -12.227506637573242, "global_step": 428168, "epoch": 2548} {"train_loss": -12.23591423034668, "global_step": 428169, "epoch": 2548} {"train_loss": -12.405813217163086, "global_step": 428170, "epoch": 2548} {"train_loss": -12.273927688598633, "global_step": 428171, "epoch": 2548} {"train_loss": -12.10946273803711, "global_step": 428172, "epoch": 2548} {"train_loss": -12.489492416381836, "global_step": 428173, "epoch": 2548} {"train_loss": -12.539061546325684, "global_step": 428174, "epoch": 2548} {"train_loss": -12.49401569366455, "global_step": 428175, "epoch": 2548} {"train_loss": -12.518901824951172, "global_step": 428176, "epoch": 2548} {"train_loss": -12.237028121948242, "global_step": 428177, "epoch": 2548} {"train_loss": -12.615224838256836, "global_step": 428178, "epoch": 2548} {"train_loss": -12.160711288452148, "global_step": 428179, "epoch": 2548} {"train_loss": -12.285600662231445, "global_step": 428180, "epoch": 2548} {"train_loss": -12.305944442749023, "global_step": 428181, "epoch": 2548} {"train_loss": -12.233196258544922, "global_step": 428182, "epoch": 2548} {"train_loss": -11.75104808807373, "global_step": 428183, "epoch": 2548} {"train_loss": -12.580296516418457, "global_step": 428184, "epoch": 2548} {"train_loss": -12.345834732055664, "global_step": 428185, "epoch": 2548} {"train_loss": -12.64476490020752, "global_step": 428186, "epoch": 2548} {"train_loss": -12.29358959197998, "global_step": 428187, "epoch": 2548} {"train_loss": -12.554543495178223, "global_step": 428188, "epoch": 2548} {"train_loss": -12.385107040405273, "global_step": 428189, "epoch": 2548} {"train_loss": -12.678665161132812, "global_step": 428190, "epoch": 2548} {"train_loss": -11.942420959472656, "global_step": 428191, "epoch": 2548} {"train_loss": -12.57798957824707, "global_step": 428192, "epoch": 2548} {"train_loss": -11.85019302368164, "global_step": 428193, "epoch": 2548} {"train_loss": -12.419814109802246, "global_step": 428194, "epoch": 2548} {"train_loss": -11.686698913574219, "global_step": 428195, "epoch": 2548} {"train_loss": -11.846968650817871, "global_step": 428196, "epoch": 2548} {"train_loss": -11.598912239074707, "global_step": 428197, "epoch": 2548} {"train_loss": -11.828034400939941, "global_step": 428198, "epoch": 2548} {"train_loss": -12.165080070495605, "global_step": 428199, "epoch": 2548} {"train_loss": -10.626752853393555, "global_step": 428200, "epoch": 2548} {"train_loss": -11.972969055175781, "global_step": 428201, "epoch": 2548} {"train_loss": -12.033839225769043, "global_step": 428202, "epoch": 2548} {"train_loss": -11.145015716552734, "global_step": 428203, "epoch": 2548} {"train_loss": -12.110188484191895, "global_step": 428204, "epoch": 2548} {"train_loss": -11.335721969604492, "global_step": 428205, "epoch": 2548} {"train_loss": -12.395086288452148, "global_step": 428206, "epoch": 2548} {"train_loss": -11.834098815917969, "global_step": 428207, "epoch": 2548} {"train_loss": -11.838240623474121, "global_step": 428208, "epoch": 2548} {"train_loss": -11.40240478515625, "global_step": 428209, "epoch": 2548} {"train_loss": -12.140766143798828, "global_step": 428210, "epoch": 2548} {"train_loss": -11.905096054077148, "global_step": 428211, "epoch": 2548} {"train_loss": -12.180112838745117, "global_step": 428212, "epoch": 2548} {"train_loss": -12.124128341674805, "global_step": 428213, "epoch": 2548} {"train_loss": -11.741378784179688, "global_step": 428214, "epoch": 2548} {"train_loss": -12.159732818603516, "global_step": 428215, "epoch": 2548} {"train_loss": -11.622488975524902, "global_step": 428216, "epoch": 2548} {"train_loss": -11.893421173095703, "global_step": 428217, "epoch": 2548} {"train_loss": -12.364643096923828, "global_step": 428218, "epoch": 2548} {"train_loss": -11.480149269104004, "global_step": 428219, "epoch": 2548} {"train_loss": -12.050048828125, "global_step": 428220, "epoch": 2548} {"train_loss": -11.754138946533203, "global_step": 428221, "epoch": 2548} {"train_loss": -12.080341339111328, "global_step": 428222, "epoch": 2548} {"train_loss": -12.177992820739746, "global_step": 428223, "epoch": 2548} {"train_loss": -11.866281509399414, "global_step": 428224, "epoch": 2548} {"train_loss": -12.343655586242676, "global_step": 428225, "epoch": 2548} {"train_loss": -12.270090103149414, "global_step": 428226, "epoch": 2548} {"train_loss": -12.352587699890137, "global_step": 428227, "epoch": 2548} {"train_loss": -12.449029922485352, "global_step": 428228, "epoch": 2548} {"train_loss": -12.329303741455078, "global_step": 428229, "epoch": 2548} {"train_loss": -12.602567672729492, "global_step": 428230, "epoch": 2548} {"train_loss": -12.174819094794136, "global_step": 428231, "epoch": 2548, "val_loss": 308768.65625} {"train_loss": -12.801725387573242, "global_step": 428232, "epoch": 2549} {"train_loss": -12.459671974182129, "global_step": 428233, "epoch": 2549} {"train_loss": -12.546712875366211, "global_step": 428234, "epoch": 2549} {"train_loss": -12.52541732788086, "global_step": 428235, "epoch": 2549} {"train_loss": -12.62684440612793, "global_step": 428236, "epoch": 2549} {"train_loss": -12.811317443847656, "global_step": 428237, "epoch": 2549} {"train_loss": -12.50796890258789, "global_step": 428238, "epoch": 2549} {"train_loss": -12.552225112915039, "global_step": 428239, "epoch": 2549} {"train_loss": -12.674901962280273, "global_step": 428240, "epoch": 2549} {"train_loss": -12.768852233886719, "global_step": 428241, "epoch": 2549} {"train_loss": -12.569465637207031, "global_step": 428242, "epoch": 2549} {"train_loss": -12.67055892944336, "global_step": 428243, "epoch": 2549} {"train_loss": -12.807799339294434, "global_step": 428244, "epoch": 2549} {"train_loss": -12.58934211730957, "global_step": 428245, "epoch": 2549} {"train_loss": -12.743376731872559, "global_step": 428246, "epoch": 2549} {"train_loss": -12.513479232788086, "global_step": 428247, "epoch": 2549} {"train_loss": -12.738014221191406, "global_step": 428248, "epoch": 2549} {"train_loss": -12.811590194702148, "global_step": 428249, "epoch": 2549} {"train_loss": -12.603755950927734, "global_step": 428250, "epoch": 2549} {"train_loss": -12.978137969970703, "global_step": 428251, "epoch": 2549} {"train_loss": -12.6953706741333, "global_step": 428252, "epoch": 2549} {"train_loss": -12.848139762878418, "global_step": 428253, "epoch": 2549} {"train_loss": -12.594667434692383, "global_step": 428254, "epoch": 2549} {"train_loss": -12.692952156066895, "global_step": 428255, "epoch": 2549} {"train_loss": -12.596693992614746, "global_step": 428256, "epoch": 2549} {"train_loss": -12.674783706665039, "global_step": 428257, "epoch": 2549} {"train_loss": -12.384502410888672, "global_step": 428258, "epoch": 2549} {"train_loss": -12.797931671142578, "global_step": 428259, "epoch": 2549} {"train_loss": -12.39698600769043, "global_step": 428260, "epoch": 2549} {"train_loss": -12.615785598754883, "global_step": 428261, "epoch": 2549} {"train_loss": -12.892778396606445, "global_step": 428262, "epoch": 2549} {"train_loss": -12.890975952148438, "global_step": 428263, "epoch": 2549} {"train_loss": -12.916189193725586, "global_step": 428264, "epoch": 2549} {"train_loss": -12.803848266601562, "global_step": 428265, "epoch": 2549} {"train_loss": -12.777793884277344, "global_step": 428266, "epoch": 2549} {"train_loss": -12.81684684753418, "global_step": 428267, "epoch": 2549} {"train_loss": -12.939669609069824, "global_step": 428268, "epoch": 2549} {"train_loss": -12.68671989440918, "global_step": 428269, "epoch": 2549} {"train_loss": -12.98388671875, "global_step": 428270, "epoch": 2549} {"train_loss": -12.607198715209961, "global_step": 428271, "epoch": 2549} {"train_loss": -12.703886032104492, "global_step": 428272, "epoch": 2549} {"train_loss": -12.726327896118164, "global_step": 428273, "epoch": 2549} {"train_loss": -12.805553436279297, "global_step": 428274, "epoch": 2549} {"train_loss": -12.752538681030273, "global_step": 428275, "epoch": 2549} {"train_loss": -12.780516624450684, "global_step": 428276, "epoch": 2549} {"train_loss": -13.023757934570312, "global_step": 428277, "epoch": 2549} {"train_loss": -12.819099426269531, "global_step": 428278, "epoch": 2549} {"train_loss": -12.95629596710205, "global_step": 428279, "epoch": 2549} {"train_loss": -12.86337661743164, "global_step": 428280, "epoch": 2549} {"train_loss": -12.860909461975098, "global_step": 428281, "epoch": 2549} {"train_loss": -12.480124473571777, "global_step": 428282, "epoch": 2549} {"train_loss": -12.651174545288086, "global_step": 428283, "epoch": 2549} {"train_loss": -12.758493423461914, "global_step": 428284, "epoch": 2549} {"train_loss": -12.84738540649414, "global_step": 428285, "epoch": 2549} {"train_loss": -12.761232376098633, "global_step": 428286, "epoch": 2549} {"train_loss": -12.549541473388672, "global_step": 428287, "epoch": 2549} {"train_loss": -12.822370529174805, "global_step": 428288, "epoch": 2549} {"train_loss": -11.864027976989746, "global_step": 428289, "epoch": 2549} {"train_loss": -11.027857780456543, "global_step": 428290, "epoch": 2549} {"train_loss": -8.542874336242676, "global_step": 428291, "epoch": 2549} {"train_loss": -9.703822135925293, "global_step": 428292, "epoch": 2549} {"train_loss": -8.233230590820312, "global_step": 428293, "epoch": 2549} {"train_loss": -10.02579116821289, "global_step": 428294, "epoch": 2549} {"train_loss": -7.611489295959473, "global_step": 428295, "epoch": 2549} {"train_loss": -7.457448959350586, "global_step": 428296, "epoch": 2549} {"train_loss": -6.448174953460693, "global_step": 428297, "epoch": 2549} {"train_loss": -6.344490051269531, "global_step": 428298, "epoch": 2549} {"train_loss": -6.363077163696289, "global_step": 428299, "epoch": 2549} {"train_loss": -5.72139310836792, "global_step": 428300, "epoch": 2549} {"train_loss": -6.117693901062012, "global_step": 428301, "epoch": 2549} {"train_loss": -5.558256149291992, "global_step": 428302, "epoch": 2549} {"train_loss": -6.126713275909424, "global_step": 428303, "epoch": 2549} {"train_loss": -5.930756568908691, "global_step": 428304, "epoch": 2549} {"train_loss": -6.055002212524414, "global_step": 428305, "epoch": 2549} {"train_loss": -7.052251815795898, "global_step": 428306, "epoch": 2549} {"train_loss": -8.0134916305542, "global_step": 428307, "epoch": 2549} {"train_loss": -7.652166366577148, "global_step": 428308, "epoch": 2549} {"train_loss": -7.15628719329834, "global_step": 428309, "epoch": 2549} {"train_loss": -8.353385925292969, "global_step": 428310, "epoch": 2549} {"train_loss": -7.815704345703125, "global_step": 428311, "epoch": 2549} {"train_loss": -8.110084533691406, "global_step": 428312, "epoch": 2549} {"train_loss": -9.346851348876953, "global_step": 428313, "epoch": 2549} {"train_loss": -9.144124984741211, "global_step": 428314, "epoch": 2549} {"train_loss": -10.24903392791748, "global_step": 428315, "epoch": 2549} {"train_loss": -9.603780746459961, "global_step": 428316, "epoch": 2549} {"train_loss": -9.002666473388672, "global_step": 428317, "epoch": 2549} {"train_loss": -9.926101684570312, "global_step": 428318, "epoch": 2549} {"train_loss": -10.957194328308105, "global_step": 428319, "epoch": 2549} {"train_loss": -10.98760986328125, "global_step": 428320, "epoch": 2549} {"train_loss": -10.18244457244873, "global_step": 428321, "epoch": 2549} {"train_loss": -10.637575149536133, "global_step": 428322, "epoch": 2549} {"train_loss": -11.41741943359375, "global_step": 428323, "epoch": 2549} {"train_loss": -10.307891845703125, "global_step": 428324, "epoch": 2549} {"train_loss": -11.83393383026123, "global_step": 428325, "epoch": 2549} {"train_loss": -10.429520606994629, "global_step": 428326, "epoch": 2549} {"train_loss": -11.376632690429688, "global_step": 428327, "epoch": 2549} {"train_loss": -11.478654861450195, "global_step": 428328, "epoch": 2549} {"train_loss": -10.800168991088867, "global_step": 428329, "epoch": 2549} {"train_loss": -11.95556354522705, "global_step": 428330, "epoch": 2549} {"train_loss": -10.915021896362305, "global_step": 428331, "epoch": 2549} {"train_loss": -11.564178466796875, "global_step": 428332, "epoch": 2549} {"train_loss": -11.009781837463379, "global_step": 428333, "epoch": 2549} {"train_loss": -11.81132698059082, "global_step": 428334, "epoch": 2549} {"train_loss": -11.86260986328125, "global_step": 428335, "epoch": 2549} {"train_loss": -11.600162506103516, "global_step": 428336, "epoch": 2549} {"train_loss": -11.337789535522461, "global_step": 428337, "epoch": 2549} {"train_loss": -11.461588859558105, "global_step": 428338, "epoch": 2549} {"train_loss": -10.384653091430664, "global_step": 428339, "epoch": 2549} {"train_loss": -11.096588134765625, "global_step": 428340, "epoch": 2549} {"train_loss": -11.218578338623047, "global_step": 428341, "epoch": 2549} {"train_loss": -10.107198715209961, "global_step": 428342, "epoch": 2549} {"train_loss": -11.916665077209473, "global_step": 428343, "epoch": 2549} {"train_loss": -10.773441314697266, "global_step": 428344, "epoch": 2549} {"train_loss": -11.040882110595703, "global_step": 428345, "epoch": 2549} {"train_loss": -11.883597373962402, "global_step": 428346, "epoch": 2549} {"train_loss": -10.781712532043457, "global_step": 428347, "epoch": 2549} {"train_loss": -11.769718170166016, "global_step": 428348, "epoch": 2549} {"train_loss": -11.514240264892578, "global_step": 428349, "epoch": 2549} {"train_loss": -10.914355278015137, "global_step": 428350, "epoch": 2549} {"train_loss": -11.778450012207031, "global_step": 428351, "epoch": 2549} {"train_loss": -11.808643341064453, "global_step": 428352, "epoch": 2549} {"train_loss": -11.376350402832031, "global_step": 428353, "epoch": 2549} {"train_loss": -11.869893074035645, "global_step": 428354, "epoch": 2549} {"train_loss": -11.403066635131836, "global_step": 428355, "epoch": 2549} {"train_loss": -11.809829711914062, "global_step": 428356, "epoch": 2549} {"train_loss": -11.767369270324707, "global_step": 428357, "epoch": 2549} {"train_loss": -11.703804016113281, "global_step": 428358, "epoch": 2549} {"train_loss": -12.077367782592773, "global_step": 428359, "epoch": 2549} {"train_loss": -11.807981491088867, "global_step": 428360, "epoch": 2549} {"train_loss": -12.116043090820312, "global_step": 428361, "epoch": 2549} {"train_loss": -11.451780319213867, "global_step": 428362, "epoch": 2549} {"train_loss": -11.958211898803711, "global_step": 428363, "epoch": 2549} {"train_loss": -12.075467109680176, "global_step": 428364, "epoch": 2549} {"train_loss": -11.896842956542969, "global_step": 428365, "epoch": 2549} {"train_loss": -11.915838241577148, "global_step": 428366, "epoch": 2549} {"train_loss": -11.795413970947266, "global_step": 428367, "epoch": 2549} {"train_loss": -12.139599800109863, "global_step": 428368, "epoch": 2549} {"train_loss": -12.094730377197266, "global_step": 428369, "epoch": 2549} {"train_loss": -11.96739387512207, "global_step": 428370, "epoch": 2549} {"train_loss": -11.721717834472656, "global_step": 428371, "epoch": 2549} {"train_loss": -11.890039443969727, "global_step": 428372, "epoch": 2549} {"train_loss": -11.778928756713867, "global_step": 428373, "epoch": 2549} {"train_loss": -12.472738265991211, "global_step": 428374, "epoch": 2549} {"train_loss": -12.049467086791992, "global_step": 428375, "epoch": 2549} {"train_loss": -12.230289459228516, "global_step": 428376, "epoch": 2549} {"train_loss": -12.055328369140625, "global_step": 428377, "epoch": 2549} {"train_loss": -12.119890213012695, "global_step": 428378, "epoch": 2549} {"train_loss": -12.02328872680664, "global_step": 428379, "epoch": 2549} {"train_loss": -12.44561767578125, "global_step": 428380, "epoch": 2549} {"train_loss": -12.226578712463379, "global_step": 428381, "epoch": 2549} {"train_loss": -12.247745513916016, "global_step": 428382, "epoch": 2549} {"train_loss": -12.25650405883789, "global_step": 428383, "epoch": 2549} {"train_loss": -12.550260543823242, "global_step": 428384, "epoch": 2549} {"train_loss": -12.178239822387695, "global_step": 428385, "epoch": 2549} {"train_loss": -12.434006690979004, "global_step": 428386, "epoch": 2549} {"train_loss": -12.357563018798828, "global_step": 428387, "epoch": 2549} {"train_loss": -12.284382820129395, "global_step": 428388, "epoch": 2549} {"train_loss": -12.575788497924805, "global_step": 428389, "epoch": 2549} {"train_loss": -12.303764343261719, "global_step": 428390, "epoch": 2549} {"train_loss": -12.5841646194458, "global_step": 428391, "epoch": 2549} {"train_loss": -12.46086311340332, "global_step": 428392, "epoch": 2549} {"train_loss": -12.619162559509277, "global_step": 428393, "epoch": 2549} {"train_loss": -12.52688980102539, "global_step": 428394, "epoch": 2549} {"train_loss": -12.533130645751953, "global_step": 428395, "epoch": 2549} {"train_loss": -12.425859451293945, "global_step": 428396, "epoch": 2549} {"train_loss": -12.5632963180542, "global_step": 428397, "epoch": 2549} {"train_loss": -12.419708251953125, "global_step": 428398, "epoch": 2549} {"train_loss": -11.408235677650996, "global_step": 428399, "epoch": 2549, "val_loss": 306171.875} {"train_loss": -12.486702919006348, "global_step": 428400, "epoch": 2550} {"train_loss": -12.487195014953613, "global_step": 428401, "epoch": 2550} {"train_loss": -12.560760498046875, "global_step": 428402, "epoch": 2550} {"train_loss": -12.805734634399414, "global_step": 428403, "epoch": 2550} {"train_loss": -12.503750801086426, "global_step": 428404, "epoch": 2550} {"train_loss": -12.597832679748535, "global_step": 428405, "epoch": 2550} {"train_loss": -12.75979995727539, "global_step": 428406, "epoch": 2550} {"train_loss": -12.5067777633667, "global_step": 428407, "epoch": 2550} {"train_loss": -12.507402420043945, "global_step": 428408, "epoch": 2550} {"train_loss": -12.696773529052734, "global_step": 428409, "epoch": 2550} {"train_loss": -12.620012283325195, "global_step": 428410, "epoch": 2550} {"train_loss": -12.728174209594727, "global_step": 428411, "epoch": 2550} {"train_loss": -12.691058158874512, "global_step": 428412, "epoch": 2550} {"train_loss": -12.550867080688477, "global_step": 428413, "epoch": 2550} {"train_loss": -12.645844459533691, "global_step": 428414, "epoch": 2550} {"train_loss": -12.699095726013184, "global_step": 428415, "epoch": 2550} {"train_loss": -12.832143783569336, "global_step": 428416, "epoch": 2550} {"train_loss": -12.689704895019531, "global_step": 428417, "epoch": 2550} {"train_loss": -12.708791732788086, "global_step": 428418, "epoch": 2550} {"train_loss": -12.65965461730957, "global_step": 428419, "epoch": 2550} {"train_loss": -12.56808090209961, "global_step": 428420, "epoch": 2550} {"train_loss": -12.909690856933594, "global_step": 428421, "epoch": 2550} {"train_loss": -12.732913970947266, "global_step": 428422, "epoch": 2550} {"train_loss": -12.448124885559082, "global_step": 428423, "epoch": 2550} {"train_loss": -12.892071723937988, "global_step": 428424, "epoch": 2550} {"train_loss": -12.699586868286133, "global_step": 428425, "epoch": 2550} {"train_loss": -12.882678985595703, "global_step": 428426, "epoch": 2550} {"train_loss": -12.60628890991211, "global_step": 428427, "epoch": 2550} {"train_loss": -12.836404800415039, "global_step": 428428, "epoch": 2550} {"train_loss": -12.950784683227539, "global_step": 428429, "epoch": 2550} {"train_loss": -12.756502151489258, "global_step": 428430, "epoch": 2550} {"train_loss": -12.496257781982422, "global_step": 428431, "epoch": 2550} {"train_loss": -12.855600357055664, "global_step": 428432, "epoch": 2550} {"train_loss": -12.605608940124512, "global_step": 428433, "epoch": 2550} {"train_loss": -12.651788711547852, "global_step": 428434, "epoch": 2550} {"train_loss": -12.672673225402832, "global_step": 428435, "epoch": 2550} {"train_loss": -12.563220024108887, "global_step": 428436, "epoch": 2550} {"train_loss": -12.799211502075195, "global_step": 428437, "epoch": 2550} {"train_loss": -12.65893268585205, "global_step": 428438, "epoch": 2550} {"train_loss": -12.445451736450195, "global_step": 428439, "epoch": 2550} {"train_loss": -12.577122688293457, "global_step": 428440, "epoch": 2550} {"train_loss": -12.502678871154785, "global_step": 428441, "epoch": 2550} {"train_loss": -12.74539566040039, "global_step": 428442, "epoch": 2550} {"train_loss": -12.514963150024414, "global_step": 428443, "epoch": 2550} {"train_loss": -12.946523666381836, "global_step": 428444, "epoch": 2550} {"train_loss": -12.52485466003418, "global_step": 428445, "epoch": 2550} {"train_loss": -12.62148666381836, "global_step": 428446, "epoch": 2550} {"train_loss": -12.76762866973877, "global_step": 428447, "epoch": 2550} {"train_loss": -12.393089294433594, "global_step": 428448, "epoch": 2550} {"train_loss": -12.658529281616211, "global_step": 428449, "epoch": 2550} {"train_loss": -12.843772888183594, "global_step": 428450, "epoch": 2550} {"train_loss": -12.4194917678833, "global_step": 428451, "epoch": 2550} {"train_loss": -12.206435203552246, "global_step": 428452, "epoch": 2550} {"train_loss": -10.900520324707031, "global_step": 428453, "epoch": 2550} {"train_loss": -12.669722557067871, "global_step": 428454, "epoch": 2550} {"train_loss": -11.261503219604492, "global_step": 428455, "epoch": 2550} {"train_loss": -12.284872055053711, "global_step": 428456, "epoch": 2550} {"train_loss": -11.996464729309082, "global_step": 428457, "epoch": 2550} {"train_loss": -11.454116821289062, "global_step": 428458, "epoch": 2550} {"train_loss": -11.738588333129883, "global_step": 428459, "epoch": 2550} {"train_loss": -12.192819595336914, "global_step": 428460, "epoch": 2550} {"train_loss": -11.472533226013184, "global_step": 428461, "epoch": 2550} {"train_loss": -12.820926666259766, "global_step": 428462, "epoch": 2550} {"train_loss": -11.589638710021973, "global_step": 428463, "epoch": 2550} {"train_loss": -12.444768905639648, "global_step": 428464, "epoch": 2550} {"train_loss": -11.738177299499512, "global_step": 428465, "epoch": 2550} {"train_loss": -12.485239028930664, "global_step": 428466, "epoch": 2550} {"train_loss": -11.885015487670898, "global_step": 428467, "epoch": 2550} {"train_loss": -12.388456344604492, "global_step": 428468, "epoch": 2550} {"train_loss": -11.020009994506836, "global_step": 428469, "epoch": 2550} {"train_loss": -12.548919677734375, "global_step": 428470, "epoch": 2550} {"train_loss": -12.612458229064941, "global_step": 428471, "epoch": 2550} {"train_loss": -12.450684547424316, "global_step": 428472, "epoch": 2550} {"train_loss": -12.474749565124512, "global_step": 428473, "epoch": 2550} {"train_loss": -12.534337997436523, "global_step": 428474, "epoch": 2550} {"train_loss": -12.269535064697266, "global_step": 428475, "epoch": 2550} {"train_loss": -12.615368843078613, "global_step": 428476, "epoch": 2550} {"train_loss": -12.329588890075684, "global_step": 428477, "epoch": 2550} {"train_loss": -12.193594932556152, "global_step": 428478, "epoch": 2550} {"train_loss": -12.005960464477539, "global_step": 428479, "epoch": 2550} {"train_loss": -12.121728897094727, "global_step": 428480, "epoch": 2550} {"train_loss": -12.625436782836914, "global_step": 428481, "epoch": 2550} {"train_loss": -12.17872428894043, "global_step": 428482, "epoch": 2550} {"train_loss": -12.568198204040527, "global_step": 428483, "epoch": 2550} {"train_loss": -11.864209175109863, "global_step": 428484, "epoch": 2550} {"train_loss": -12.097078323364258, "global_step": 428485, "epoch": 2550} {"train_loss": -12.453291893005371, "global_step": 428486, "epoch": 2550} {"train_loss": -11.65188217163086, "global_step": 428487, "epoch": 2550} {"train_loss": -12.409191131591797, "global_step": 428488, "epoch": 2550} {"train_loss": -10.878149032592773, "global_step": 428489, "epoch": 2550} {"train_loss": -12.605964660644531, "global_step": 428490, "epoch": 2550} {"train_loss": -11.914932250976562, "global_step": 428491, "epoch": 2550} {"train_loss": -12.209735870361328, "global_step": 428492, "epoch": 2550} {"train_loss": -12.162656784057617, "global_step": 428493, "epoch": 2550} {"train_loss": -12.067829132080078, "global_step": 428494, "epoch": 2550} {"train_loss": -12.406207084655762, "global_step": 428495, "epoch": 2550} {"train_loss": -11.750088691711426, "global_step": 428496, "epoch": 2550} {"train_loss": -11.797599792480469, "global_step": 428497, "epoch": 2550} {"train_loss": -12.133722305297852, "global_step": 428498, "epoch": 2550} {"train_loss": -11.907218933105469, "global_step": 428499, "epoch": 2550} {"train_loss": -11.565594673156738, "global_step": 428500, "epoch": 2550} {"train_loss": -12.151077270507812, "global_step": 428501, "epoch": 2550} {"train_loss": -12.13494873046875, "global_step": 428502, "epoch": 2550} {"train_loss": -12.125860214233398, "global_step": 428503, "epoch": 2550} {"train_loss": -11.360475540161133, "global_step": 428504, "epoch": 2550} {"train_loss": -11.634729385375977, "global_step": 428505, "epoch": 2550} {"train_loss": -12.506658554077148, "global_step": 428506, "epoch": 2550} {"train_loss": -11.878252029418945, "global_step": 428507, "epoch": 2550} {"train_loss": -12.146940231323242, "global_step": 428508, "epoch": 2550} {"train_loss": -12.204328536987305, "global_step": 428509, "epoch": 2550} {"train_loss": -12.107070922851562, "global_step": 428510, "epoch": 2550} {"train_loss": -11.911458969116211, "global_step": 428511, "epoch": 2550} {"train_loss": -12.093606948852539, "global_step": 428512, "epoch": 2550} {"train_loss": -12.209250450134277, "global_step": 428513, "epoch": 2550} {"train_loss": -12.211517333984375, "global_step": 428514, "epoch": 2550} {"train_loss": -12.131650924682617, "global_step": 428515, "epoch": 2550} {"train_loss": -12.399441719055176, "global_step": 428516, "epoch": 2550} {"train_loss": -12.288312911987305, "global_step": 428517, "epoch": 2550} {"train_loss": -12.475363731384277, "global_step": 428518, "epoch": 2550} {"train_loss": -12.677624702453613, "global_step": 428519, "epoch": 2550} {"train_loss": -12.47797966003418, "global_step": 428520, "epoch": 2550} {"train_loss": -11.990816116333008, "global_step": 428521, "epoch": 2550} {"train_loss": -12.014131546020508, "global_step": 428522, "epoch": 2550} {"train_loss": -12.52540397644043, "global_step": 428523, "epoch": 2550} {"train_loss": -11.95557975769043, "global_step": 428524, "epoch": 2550} {"train_loss": -11.819549560546875, "global_step": 428525, "epoch": 2550} {"train_loss": -12.13782024383545, "global_step": 428526, "epoch": 2550} {"train_loss": -12.691481590270996, "global_step": 428527, "epoch": 2550} {"train_loss": -11.722813606262207, "global_step": 428528, "epoch": 2550} {"train_loss": -12.281986236572266, "global_step": 428529, "epoch": 2550} {"train_loss": -12.591320037841797, "global_step": 428530, "epoch": 2550} {"train_loss": -12.311145782470703, "global_step": 428531, "epoch": 2550} {"train_loss": -12.069626808166504, "global_step": 428532, "epoch": 2550} {"train_loss": -12.254546165466309, "global_step": 428533, "epoch": 2550} {"train_loss": -12.298782348632812, "global_step": 428534, "epoch": 2550} {"train_loss": -12.174338340759277, "global_step": 428535, "epoch": 2550} {"train_loss": -12.09058666229248, "global_step": 428536, "epoch": 2550} {"train_loss": -12.729483604431152, "global_step": 428537, "epoch": 2550} {"train_loss": -12.391861915588379, "global_step": 428538, "epoch": 2550} {"train_loss": -12.418710708618164, "global_step": 428539, "epoch": 2550} {"train_loss": -12.327659606933594, "global_step": 428540, "epoch": 2550} {"train_loss": -12.38129997253418, "global_step": 428541, "epoch": 2550} {"train_loss": -12.573766708374023, "global_step": 428542, "epoch": 2550} {"train_loss": -12.296259880065918, "global_step": 428543, "epoch": 2550} {"train_loss": -12.162638664245605, "global_step": 428544, "epoch": 2550} {"train_loss": -12.445816040039062, "global_step": 428545, "epoch": 2550} {"train_loss": -12.656673431396484, "global_step": 428546, "epoch": 2550} {"train_loss": -12.583538055419922, "global_step": 428547, "epoch": 2550} {"train_loss": -12.583623886108398, "global_step": 428548, "epoch": 2550} {"train_loss": -12.709634780883789, "global_step": 428549, "epoch": 2550} {"train_loss": -12.698084831237793, "global_step": 428550, "epoch": 2550} {"train_loss": -12.623268127441406, "global_step": 428551, "epoch": 2550} {"train_loss": -12.759571075439453, "global_step": 428552, "epoch": 2550} {"train_loss": -12.650659561157227, "global_step": 428553, "epoch": 2550} {"train_loss": -12.634461402893066, "global_step": 428554, "epoch": 2550} {"train_loss": -12.745563507080078, "global_step": 428555, "epoch": 2550} {"train_loss": -12.55069637298584, "global_step": 428556, "epoch": 2550} {"train_loss": -12.079898834228516, "global_step": 428557, "epoch": 2550} {"train_loss": -12.677396774291992, "global_step": 428558, "epoch": 2550} {"train_loss": -12.535856246948242, "global_step": 428559, "epoch": 2550} {"train_loss": -11.39502239227295, "global_step": 428560, "epoch": 2550} {"train_loss": -11.066059112548828, "global_step": 428561, "epoch": 2550} {"train_loss": -11.613214492797852, "global_step": 428562, "epoch": 2550} {"train_loss": -7.838430881500244, "global_step": 428563, "epoch": 2550} {"train_loss": -7.881821155548096, "global_step": 428564, "epoch": 2550} {"train_loss": -7.908592700958252, "global_step": 428565, "epoch": 2550} {"train_loss": -7.723334789276123, "global_step": 428566, "epoch": 2550} {"train_loss": -12.203494594210671, "global_step": 428567, "epoch": 2550, "train/sim_max_reward_0": 0.4776927208726461, "train/sim_max_reward_1": 0.8933596405366241, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.8931776387274297, "train/sim_max_reward_4": 0.9497516795093317, "train/sim_max_reward_5": 0.6074198889267547, "test/sim_max_reward_4400000": 0.9745744816467674, "test/sim_max_reward_4400001": 0.36860699021542875, "test/sim_max_reward_4400002": 0.5702047212251611, "test/sim_max_reward_4400003": 0.1830349468249435, "test/sim_max_reward_4400004": 0.21327279615382388, "test/sim_max_reward_4400005": 0.9879400342210632, "test/sim_max_reward_4400006": 0.30576851583271675, "test/sim_max_reward_4400007": 0.4860922935202522, "test/sim_max_reward_4400008": 0.6029560232668759, "test/sim_max_reward_4400009": 0.5416443848333412, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.8727117700294588, "test/sim_max_reward_4400012": 0.9820017221627879, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.36828460324848356, "test/sim_max_reward_4400015": 0.04471650257143209, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.05473323355091742, "test/sim_max_reward_4400018": 0.9818536323409514, "test/sim_max_reward_4400019": 0.22929738978930195, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.688334124003951, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.15037950855797708, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.5148883797816586, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.34138106712274674, "test/sim_max_reward_4400028": 0.9621447840517995, "test/sim_max_reward_4400029": 1.0, "test/sim_max_reward_4400030": 0.9284731285046783, "test/sim_max_reward_4400031": 1.0, "test/sim_max_reward_4400032": 0.09163126883354059, "test/sim_max_reward_4400033": 0.42253214552572393, "test/sim_max_reward_4400034": 0.9429706320860441, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.3381370221156382, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.7300229073488606, "test/sim_max_reward_4400042": 0.0, "test/sim_max_reward_4400043": 0.8999969752438505, "test/sim_max_reward_4400044": 0.4941670333511407, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 0.9966542259044885, "test/sim_max_reward_4400047": 0.9719160683959587, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.00804848058560959, "train/mean_score": 0.6369002614287976, "test/mean_score": 0.5030636599863108, "val_loss": 308273.8125, "train_action_mse_error": 1.3143610954284668} {"train_loss": -8.20290756225586, "global_step": 428568, "epoch": 2551} {"train_loss": -8.220863342285156, "global_step": 428569, "epoch": 2551} {"train_loss": -8.901330947875977, "global_step": 428570, "epoch": 2551} {"train_loss": -8.904141426086426, "global_step": 428571, "epoch": 2551} {"train_loss": -8.298818588256836, "global_step": 428572, "epoch": 2551} {"train_loss": -8.971363067626953, "global_step": 428573, "epoch": 2551} {"train_loss": -9.272024154663086, "global_step": 428574, "epoch": 2551} {"train_loss": -8.701774597167969, "global_step": 428575, "epoch": 2551} {"train_loss": -9.503734588623047, "global_step": 428576, "epoch": 2551} {"train_loss": -9.511194229125977, "global_step": 428577, "epoch": 2551} {"train_loss": -9.095856666564941, "global_step": 428578, "epoch": 2551} {"train_loss": -9.735430717468262, "global_step": 428579, "epoch": 2551} {"train_loss": -8.871851921081543, "global_step": 428580, "epoch": 2551} {"train_loss": -9.226234436035156, "global_step": 428581, "epoch": 2551} {"train_loss": -10.068044662475586, "global_step": 428582, "epoch": 2551} {"train_loss": -10.07331657409668, "global_step": 428583, "epoch": 2551} {"train_loss": -10.738475799560547, "global_step": 428584, "epoch": 2551} {"train_loss": -10.870372772216797, "global_step": 428585, "epoch": 2551} {"train_loss": -11.020109176635742, "global_step": 428586, "epoch": 2551} {"train_loss": -11.23176383972168, "global_step": 428587, "epoch": 2551} {"train_loss": -11.593194007873535, "global_step": 428588, "epoch": 2551} {"train_loss": -11.011238098144531, "global_step": 428589, "epoch": 2551} {"train_loss": -11.079561233520508, "global_step": 428590, "epoch": 2551} {"train_loss": -10.942644119262695, "global_step": 428591, "epoch": 2551} {"train_loss": -9.671772003173828, "global_step": 428592, "epoch": 2551} {"train_loss": -10.469029426574707, "global_step": 428593, "epoch": 2551} {"train_loss": -11.400226593017578, "global_step": 428594, "epoch": 2551} {"train_loss": -10.370813369750977, "global_step": 428595, "epoch": 2551} {"train_loss": -11.338638305664062, "global_step": 428596, "epoch": 2551} {"train_loss": -11.106067657470703, "global_step": 428597, "epoch": 2551} {"train_loss": -11.546796798706055, "global_step": 428598, "epoch": 2551} {"train_loss": -10.997802734375, "global_step": 428599, "epoch": 2551} {"train_loss": -11.44630241394043, "global_step": 428600, "epoch": 2551} {"train_loss": -11.635884284973145, "global_step": 428601, "epoch": 2551} {"train_loss": -10.484175682067871, "global_step": 428602, "epoch": 2551} {"train_loss": -12.310545921325684, "global_step": 428603, "epoch": 2551} {"train_loss": -10.919506072998047, "global_step": 428604, "epoch": 2551} {"train_loss": -11.680344581604004, "global_step": 428605, "epoch": 2551} {"train_loss": -12.150835990905762, "global_step": 428606, "epoch": 2551} {"train_loss": -11.462774276733398, "global_step": 428607, "epoch": 2551} {"train_loss": -12.044240951538086, "global_step": 428608, "epoch": 2551} {"train_loss": -11.826568603515625, "global_step": 428609, "epoch": 2551} {"train_loss": -12.142480850219727, "global_step": 428610, "epoch": 2551} {"train_loss": -12.315118789672852, "global_step": 428611, "epoch": 2551} {"train_loss": -11.836359024047852, "global_step": 428612, "epoch": 2551} {"train_loss": -12.212512016296387, "global_step": 428613, "epoch": 2551} {"train_loss": -12.055242538452148, "global_step": 428614, "epoch": 2551} {"train_loss": -12.403614044189453, "global_step": 428615, "epoch": 2551} {"train_loss": -12.095413208007812, "global_step": 428616, "epoch": 2551} {"train_loss": -12.112545013427734, "global_step": 428617, "epoch": 2551} {"train_loss": -12.316858291625977, "global_step": 428618, "epoch": 2551} {"train_loss": -12.438050270080566, "global_step": 428619, "epoch": 2551} {"train_loss": -12.138628005981445, "global_step": 428620, "epoch": 2551} {"train_loss": -12.25338363647461, "global_step": 428621, "epoch": 2551} {"train_loss": -12.299640655517578, "global_step": 428622, "epoch": 2551} {"train_loss": -12.39919376373291, "global_step": 428623, "epoch": 2551} {"train_loss": -12.602904319763184, "global_step": 428624, "epoch": 2551} {"train_loss": -12.323823928833008, "global_step": 428625, "epoch": 2551} {"train_loss": -12.56698989868164, "global_step": 428626, "epoch": 2551} {"train_loss": -12.379389762878418, "global_step": 428627, "epoch": 2551} {"train_loss": -12.511151313781738, "global_step": 428628, "epoch": 2551} {"train_loss": -12.665852546691895, "global_step": 428629, "epoch": 2551} {"train_loss": -12.512406349182129, "global_step": 428630, "epoch": 2551} {"train_loss": -12.309959411621094, "global_step": 428631, "epoch": 2551} {"train_loss": -12.444849014282227, "global_step": 428632, "epoch": 2551} {"train_loss": -12.504083633422852, "global_step": 428633, "epoch": 2551} {"train_loss": -12.353767395019531, "global_step": 428634, "epoch": 2551} {"train_loss": -12.28506088256836, "global_step": 428635, "epoch": 2551} {"train_loss": -12.778385162353516, "global_step": 428636, "epoch": 2551} {"train_loss": -12.518277168273926, "global_step": 428637, "epoch": 2551} {"train_loss": -12.75727653503418, "global_step": 428638, "epoch": 2551} {"train_loss": -12.522332191467285, "global_step": 428639, "epoch": 2551} {"train_loss": -12.693802833557129, "global_step": 428640, "epoch": 2551} {"train_loss": -12.671961784362793, "global_step": 428641, "epoch": 2551} {"train_loss": -12.677017211914062, "global_step": 428642, "epoch": 2551} {"train_loss": -12.732112884521484, "global_step": 428643, "epoch": 2551} {"train_loss": -12.749011039733887, "global_step": 428644, "epoch": 2551} {"train_loss": -12.773469924926758, "global_step": 428645, "epoch": 2551} {"train_loss": -12.57071304321289, "global_step": 428646, "epoch": 2551} {"train_loss": -12.62429428100586, "global_step": 428647, "epoch": 2551} {"train_loss": -12.868139266967773, "global_step": 428648, "epoch": 2551} {"train_loss": -12.507694244384766, "global_step": 428649, "epoch": 2551} {"train_loss": -12.729369163513184, "global_step": 428650, "epoch": 2551} {"train_loss": -12.648004531860352, "global_step": 428651, "epoch": 2551} {"train_loss": -12.446968078613281, "global_step": 428652, "epoch": 2551} {"train_loss": -12.58065128326416, "global_step": 428653, "epoch": 2551} {"train_loss": -12.563511848449707, "global_step": 428654, "epoch": 2551} {"train_loss": -12.443893432617188, "global_step": 428655, "epoch": 2551} {"train_loss": -12.665489196777344, "global_step": 428656, "epoch": 2551} {"train_loss": -12.672197341918945, "global_step": 428657, "epoch": 2551} {"train_loss": -12.601789474487305, "global_step": 428658, "epoch": 2551} {"train_loss": -12.677617073059082, "global_step": 428659, "epoch": 2551} {"train_loss": -12.67772388458252, "global_step": 428660, "epoch": 2551} {"train_loss": -12.550833702087402, "global_step": 428661, "epoch": 2551} {"train_loss": -12.639817237854004, "global_step": 428662, "epoch": 2551} {"train_loss": -12.619890213012695, "global_step": 428663, "epoch": 2551} {"train_loss": -11.747455596923828, "global_step": 428664, "epoch": 2551} {"train_loss": -12.400079727172852, "global_step": 428665, "epoch": 2551} {"train_loss": -12.144848823547363, "global_step": 428666, "epoch": 2551} {"train_loss": -11.308568954467773, "global_step": 428667, "epoch": 2551} {"train_loss": -11.999391555786133, "global_step": 428668, "epoch": 2551} {"train_loss": -12.378454208374023, "global_step": 428669, "epoch": 2551} {"train_loss": -12.313737869262695, "global_step": 428670, "epoch": 2551} {"train_loss": -11.474620819091797, "global_step": 428671, "epoch": 2551} {"train_loss": -11.143232345581055, "global_step": 428672, "epoch": 2551} {"train_loss": -11.258625030517578, "global_step": 428673, "epoch": 2551} {"train_loss": -12.47175121307373, "global_step": 428674, "epoch": 2551} {"train_loss": -11.314933776855469, "global_step": 428675, "epoch": 2551} {"train_loss": -10.58591079711914, "global_step": 428676, "epoch": 2551} {"train_loss": -11.419672966003418, "global_step": 428677, "epoch": 2551} {"train_loss": -8.664409637451172, "global_step": 428678, "epoch": 2551} {"train_loss": -11.90715217590332, "global_step": 428679, "epoch": 2551} {"train_loss": -10.906230926513672, "global_step": 428680, "epoch": 2551} {"train_loss": -10.86718463897705, "global_step": 428681, "epoch": 2551} {"train_loss": -11.834258079528809, "global_step": 428682, "epoch": 2551} {"train_loss": -10.366119384765625, "global_step": 428683, "epoch": 2551} {"train_loss": -11.630054473876953, "global_step": 428684, "epoch": 2551} {"train_loss": -10.961112976074219, "global_step": 428685, "epoch": 2551} {"train_loss": -11.054643630981445, "global_step": 428686, "epoch": 2551} {"train_loss": -10.71152400970459, "global_step": 428687, "epoch": 2551} {"train_loss": -10.05251693725586, "global_step": 428688, "epoch": 2551} {"train_loss": -11.015235900878906, "global_step": 428689, "epoch": 2551} {"train_loss": -9.405471801757812, "global_step": 428690, "epoch": 2551} {"train_loss": -9.77707576751709, "global_step": 428691, "epoch": 2551} {"train_loss": -10.355806350708008, "global_step": 428692, "epoch": 2551} {"train_loss": -11.456310272216797, "global_step": 428693, "epoch": 2551} {"train_loss": -10.289861679077148, "global_step": 428694, "epoch": 2551} {"train_loss": -10.138726234436035, "global_step": 428695, "epoch": 2551} {"train_loss": -11.431305885314941, "global_step": 428696, "epoch": 2551} {"train_loss": -11.247932434082031, "global_step": 428697, "epoch": 2551} {"train_loss": -10.084020614624023, "global_step": 428698, "epoch": 2551} {"train_loss": -11.091063499450684, "global_step": 428699, "epoch": 2551} {"train_loss": -10.666336059570312, "global_step": 428700, "epoch": 2551} {"train_loss": -10.898216247558594, "global_step": 428701, "epoch": 2551} {"train_loss": -10.368940353393555, "global_step": 428702, "epoch": 2551} {"train_loss": -11.669492721557617, "global_step": 428703, "epoch": 2551} {"train_loss": -10.879015922546387, "global_step": 428704, "epoch": 2551} {"train_loss": -11.166322708129883, "global_step": 428705, "epoch": 2551} {"train_loss": -10.664349555969238, "global_step": 428706, "epoch": 2551} {"train_loss": -11.418378829956055, "global_step": 428707, "epoch": 2551} {"train_loss": -11.514740943908691, "global_step": 428708, "epoch": 2551} {"train_loss": -11.269573211669922, "global_step": 428709, "epoch": 2551} {"train_loss": -11.592161178588867, "global_step": 428710, "epoch": 2551} {"train_loss": -11.261539459228516, "global_step": 428711, "epoch": 2551} {"train_loss": -11.182260513305664, "global_step": 428712, "epoch": 2551} {"train_loss": -11.238932609558105, "global_step": 428713, "epoch": 2551} {"train_loss": -11.16502571105957, "global_step": 428714, "epoch": 2551} {"train_loss": -11.424081802368164, "global_step": 428715, "epoch": 2551} {"train_loss": -11.579740524291992, "global_step": 428716, "epoch": 2551} {"train_loss": -11.156478881835938, "global_step": 428717, "epoch": 2551} {"train_loss": -11.511214256286621, "global_step": 428718, "epoch": 2551} {"train_loss": -11.61132526397705, "global_step": 428719, "epoch": 2551} {"train_loss": -11.8092041015625, "global_step": 428720, "epoch": 2551} {"train_loss": -11.788161277770996, "global_step": 428721, "epoch": 2551} {"train_loss": -11.5990571975708, "global_step": 428722, "epoch": 2551} {"train_loss": -11.913093566894531, "global_step": 428723, "epoch": 2551} {"train_loss": -11.771364212036133, "global_step": 428724, "epoch": 2551} {"train_loss": -11.724440574645996, "global_step": 428725, "epoch": 2551} {"train_loss": -11.981283187866211, "global_step": 428726, "epoch": 2551} {"train_loss": -11.864925384521484, "global_step": 428727, "epoch": 2551} {"train_loss": -11.92280387878418, "global_step": 428728, "epoch": 2551} {"train_loss": -11.994028091430664, "global_step": 428729, "epoch": 2551} {"train_loss": -12.18212890625, "global_step": 428730, "epoch": 2551} {"train_loss": -12.235859870910645, "global_step": 428731, "epoch": 2551} {"train_loss": -12.288276672363281, "global_step": 428732, "epoch": 2551} {"train_loss": -12.101699829101562, "global_step": 428733, "epoch": 2551} {"train_loss": -12.125265121459961, "global_step": 428734, "epoch": 2551} {"train_loss": -11.463710796265374, "global_step": 428735, "epoch": 2551, "val_loss": 309969.0625} {"train_loss": -12.51616382598877, "global_step": 428736, "epoch": 2552} {"train_loss": -12.096159934997559, "global_step": 428737, "epoch": 2552} {"train_loss": -12.352686882019043, "global_step": 428738, "epoch": 2552} {"train_loss": -12.186517715454102, "global_step": 428739, "epoch": 2552} {"train_loss": -12.408943176269531, "global_step": 428740, "epoch": 2552} {"train_loss": -12.328640937805176, "global_step": 428741, "epoch": 2552} {"train_loss": -12.256382942199707, "global_step": 428742, "epoch": 2552} {"train_loss": -12.231786727905273, "global_step": 428743, "epoch": 2552} {"train_loss": -12.167333602905273, "global_step": 428744, "epoch": 2552} {"train_loss": -12.342350006103516, "global_step": 428745, "epoch": 2552} {"train_loss": -12.266695022583008, "global_step": 428746, "epoch": 2552} {"train_loss": -12.410989761352539, "global_step": 428747, "epoch": 2552} {"train_loss": -12.230392456054688, "global_step": 428748, "epoch": 2552} {"train_loss": -12.38885498046875, "global_step": 428749, "epoch": 2552} {"train_loss": -12.549169540405273, "global_step": 428750, "epoch": 2552} {"train_loss": -12.288166046142578, "global_step": 428751, "epoch": 2552} {"train_loss": -12.496247291564941, "global_step": 428752, "epoch": 2552} {"train_loss": -12.329643249511719, "global_step": 428753, "epoch": 2552} {"train_loss": -12.29547119140625, "global_step": 428754, "epoch": 2552} {"train_loss": -12.537273406982422, "global_step": 428755, "epoch": 2552} {"train_loss": -12.534676551818848, "global_step": 428756, "epoch": 2552} {"train_loss": -12.564420700073242, "global_step": 428757, "epoch": 2552} {"train_loss": -12.489130020141602, "global_step": 428758, "epoch": 2552} {"train_loss": -12.347196578979492, "global_step": 428759, "epoch": 2552} {"train_loss": -12.598933219909668, "global_step": 428760, "epoch": 2552} {"train_loss": -12.356250762939453, "global_step": 428761, "epoch": 2552} {"train_loss": -12.551263809204102, "global_step": 428762, "epoch": 2552} {"train_loss": -12.76792049407959, "global_step": 428763, "epoch": 2552} {"train_loss": -12.537528991699219, "global_step": 428764, "epoch": 2552} {"train_loss": -12.676386833190918, "global_step": 428765, "epoch": 2552} {"train_loss": -12.502376556396484, "global_step": 428766, "epoch": 2552} {"train_loss": -12.48979663848877, "global_step": 428767, "epoch": 2552} {"train_loss": -12.627339363098145, "global_step": 428768, "epoch": 2552} {"train_loss": -12.715337753295898, "global_step": 428769, "epoch": 2552} {"train_loss": -12.45547866821289, "global_step": 428770, "epoch": 2552} {"train_loss": -12.763689041137695, "global_step": 428771, "epoch": 2552} {"train_loss": -12.667182922363281, "global_step": 428772, "epoch": 2552} {"train_loss": -12.524787902832031, "global_step": 428773, "epoch": 2552} {"train_loss": -12.865415573120117, "global_step": 428774, "epoch": 2552} {"train_loss": -12.43594741821289, "global_step": 428775, "epoch": 2552} {"train_loss": -12.675411224365234, "global_step": 428776, "epoch": 2552} {"train_loss": -12.512993812561035, "global_step": 428777, "epoch": 2552} {"train_loss": -12.684097290039062, "global_step": 428778, "epoch": 2552} {"train_loss": -12.392131805419922, "global_step": 428779, "epoch": 2552} {"train_loss": -12.587579727172852, "global_step": 428780, "epoch": 2552} {"train_loss": -12.708148956298828, "global_step": 428781, "epoch": 2552} {"train_loss": -12.363993644714355, "global_step": 428782, "epoch": 2552} {"train_loss": -12.54155445098877, "global_step": 428783, "epoch": 2552} {"train_loss": -12.43714714050293, "global_step": 428784, "epoch": 2552} {"train_loss": -12.564226150512695, "global_step": 428785, "epoch": 2552} {"train_loss": -12.62716293334961, "global_step": 428786, "epoch": 2552} {"train_loss": -11.718865394592285, "global_step": 428787, "epoch": 2552} {"train_loss": -12.112666130065918, "global_step": 428788, "epoch": 2552} {"train_loss": -11.663934707641602, "global_step": 428789, "epoch": 2552} {"train_loss": -12.033936500549316, "global_step": 428790, "epoch": 2552} {"train_loss": -10.999263763427734, "global_step": 428791, "epoch": 2552} {"train_loss": -11.368534088134766, "global_step": 428792, "epoch": 2552} {"train_loss": -10.808488845825195, "global_step": 428793, "epoch": 2552} {"train_loss": -11.584005355834961, "global_step": 428794, "epoch": 2552} {"train_loss": -10.42177677154541, "global_step": 428795, "epoch": 2552} {"train_loss": -12.131765365600586, "global_step": 428796, "epoch": 2552} {"train_loss": -11.361713409423828, "global_step": 428797, "epoch": 2552} {"train_loss": -11.582538604736328, "global_step": 428798, "epoch": 2552} {"train_loss": -12.157244682312012, "global_step": 428799, "epoch": 2552} {"train_loss": -11.277389526367188, "global_step": 428800, "epoch": 2552} {"train_loss": -12.206890106201172, "global_step": 428801, "epoch": 2552} {"train_loss": -11.141708374023438, "global_step": 428802, "epoch": 2552} {"train_loss": -12.20773696899414, "global_step": 428803, "epoch": 2552} {"train_loss": -11.951628684997559, "global_step": 428804, "epoch": 2552} {"train_loss": -12.089972496032715, "global_step": 428805, "epoch": 2552} {"train_loss": -12.066356658935547, "global_step": 428806, "epoch": 2552} {"train_loss": -12.034685134887695, "global_step": 428807, "epoch": 2552} {"train_loss": -12.505061149597168, "global_step": 428808, "epoch": 2552} {"train_loss": -12.234580039978027, "global_step": 428809, "epoch": 2552} {"train_loss": -12.572820663452148, "global_step": 428810, "epoch": 2552} {"train_loss": -12.016756057739258, "global_step": 428811, "epoch": 2552} {"train_loss": -12.52243423461914, "global_step": 428812, "epoch": 2552} {"train_loss": -12.183731079101562, "global_step": 428813, "epoch": 2552} {"train_loss": -12.42292594909668, "global_step": 428814, "epoch": 2552} {"train_loss": -12.363250732421875, "global_step": 428815, "epoch": 2552} {"train_loss": -12.147521018981934, "global_step": 428816, "epoch": 2552} {"train_loss": -12.124238967895508, "global_step": 428817, "epoch": 2552} {"train_loss": -12.561134338378906, "global_step": 428818, "epoch": 2552} {"train_loss": -12.315654754638672, "global_step": 428819, "epoch": 2552} {"train_loss": -12.474227905273438, "global_step": 428820, "epoch": 2552} {"train_loss": -12.256607055664062, "global_step": 428821, "epoch": 2552} {"train_loss": -12.824777603149414, "global_step": 428822, "epoch": 2552} {"train_loss": -12.572981834411621, "global_step": 428823, "epoch": 2552} {"train_loss": -12.525701522827148, "global_step": 428824, "epoch": 2552} {"train_loss": -12.467424392700195, "global_step": 428825, "epoch": 2552} {"train_loss": -12.192116737365723, "global_step": 428826, "epoch": 2552} {"train_loss": -12.610296249389648, "global_step": 428827, "epoch": 2552} {"train_loss": -12.497230529785156, "global_step": 428828, "epoch": 2552} {"train_loss": -12.476213455200195, "global_step": 428829, "epoch": 2552} {"train_loss": -12.544188499450684, "global_step": 428830, "epoch": 2552} {"train_loss": -12.46009635925293, "global_step": 428831, "epoch": 2552} {"train_loss": -12.427921295166016, "global_step": 428832, "epoch": 2552} {"train_loss": -12.25509262084961, "global_step": 428833, "epoch": 2552} {"train_loss": -12.64759349822998, "global_step": 428834, "epoch": 2552} {"train_loss": -12.389413833618164, "global_step": 428835, "epoch": 2552} {"train_loss": -12.671672821044922, "global_step": 428836, "epoch": 2552} {"train_loss": -12.322019577026367, "global_step": 428837, "epoch": 2552} {"train_loss": -12.441937446594238, "global_step": 428838, "epoch": 2552} {"train_loss": -12.08053207397461, "global_step": 428839, "epoch": 2552} {"train_loss": -12.466819763183594, "global_step": 428840, "epoch": 2552} {"train_loss": -12.503337860107422, "global_step": 428841, "epoch": 2552} {"train_loss": -12.51701545715332, "global_step": 428842, "epoch": 2552} {"train_loss": -12.889284133911133, "global_step": 428843, "epoch": 2552} {"train_loss": -12.556255340576172, "global_step": 428844, "epoch": 2552} {"train_loss": -11.760704040527344, "global_step": 428845, "epoch": 2552} {"train_loss": -12.27946662902832, "global_step": 428846, "epoch": 2552} {"train_loss": -12.337715148925781, "global_step": 428847, "epoch": 2552} {"train_loss": -11.985437393188477, "global_step": 428848, "epoch": 2552} {"train_loss": -12.742244720458984, "global_step": 428849, "epoch": 2552} {"train_loss": -11.97231388092041, "global_step": 428850, "epoch": 2552} {"train_loss": -12.428184509277344, "global_step": 428851, "epoch": 2552} {"train_loss": -12.035317420959473, "global_step": 428852, "epoch": 2552} {"train_loss": -12.804412841796875, "global_step": 428853, "epoch": 2552} {"train_loss": -12.126962661743164, "global_step": 428854, "epoch": 2552} {"train_loss": -12.598398208618164, "global_step": 428855, "epoch": 2552} {"train_loss": -12.484936714172363, "global_step": 428856, "epoch": 2552} {"train_loss": -12.493036270141602, "global_step": 428857, "epoch": 2552} {"train_loss": -12.487749099731445, "global_step": 428858, "epoch": 2552} {"train_loss": -12.518220901489258, "global_step": 428859, "epoch": 2552} {"train_loss": -11.989906311035156, "global_step": 428860, "epoch": 2552} {"train_loss": -12.214544296264648, "global_step": 428861, "epoch": 2552} {"train_loss": -12.152481079101562, "global_step": 428862, "epoch": 2552} {"train_loss": -11.934020042419434, "global_step": 428863, "epoch": 2552} {"train_loss": -12.174001693725586, "global_step": 428864, "epoch": 2552} {"train_loss": -12.065359115600586, "global_step": 428865, "epoch": 2552} {"train_loss": -11.964237213134766, "global_step": 428866, "epoch": 2552} {"train_loss": -12.083677291870117, "global_step": 428867, "epoch": 2552} {"train_loss": -11.780986785888672, "global_step": 428868, "epoch": 2552} {"train_loss": -12.358074188232422, "global_step": 428869, "epoch": 2552} {"train_loss": -11.975839614868164, "global_step": 428870, "epoch": 2552} {"train_loss": -12.057100296020508, "global_step": 428871, "epoch": 2552} {"train_loss": -12.089883804321289, "global_step": 428872, "epoch": 2552} {"train_loss": -12.172704696655273, "global_step": 428873, "epoch": 2552} {"train_loss": -12.634521484375, "global_step": 428874, "epoch": 2552} {"train_loss": -12.13671875, "global_step": 428875, "epoch": 2552} {"train_loss": -12.098859786987305, "global_step": 428876, "epoch": 2552} {"train_loss": -12.310966491699219, "global_step": 428877, "epoch": 2552} {"train_loss": -12.474176406860352, "global_step": 428878, "epoch": 2552} {"train_loss": -12.379419326782227, "global_step": 428879, "epoch": 2552} {"train_loss": -12.654239654541016, "global_step": 428880, "epoch": 2552} {"train_loss": -12.47958755493164, "global_step": 428881, "epoch": 2552} {"train_loss": -12.833227157592773, "global_step": 428882, "epoch": 2552} {"train_loss": -12.474841117858887, "global_step": 428883, "epoch": 2552} {"train_loss": -12.85395336151123, "global_step": 428884, "epoch": 2552} {"train_loss": -12.512327194213867, "global_step": 428885, "epoch": 2552} {"train_loss": -12.524133682250977, "global_step": 428886, "epoch": 2552} {"train_loss": -12.558938026428223, "global_step": 428887, "epoch": 2552} {"train_loss": -12.71411418914795, "global_step": 428888, "epoch": 2552} {"train_loss": -12.463305473327637, "global_step": 428889, "epoch": 2552} {"train_loss": -12.677835464477539, "global_step": 428890, "epoch": 2552} {"train_loss": -12.275373458862305, "global_step": 428891, "epoch": 2552} {"train_loss": -12.582612991333008, "global_step": 428892, "epoch": 2552} {"train_loss": -12.469300270080566, "global_step": 428893, "epoch": 2552} {"train_loss": -12.876784324645996, "global_step": 428894, "epoch": 2552} {"train_loss": -12.680398941040039, "global_step": 428895, "epoch": 2552} {"train_loss": -12.863836288452148, "global_step": 428896, "epoch": 2552} {"train_loss": -12.505672454833984, "global_step": 428897, "epoch": 2552} {"train_loss": -12.560222625732422, "global_step": 428898, "epoch": 2552} {"train_loss": -12.553885459899902, "global_step": 428899, "epoch": 2552} {"train_loss": -12.758931159973145, "global_step": 428900, "epoch": 2552} {"train_loss": -12.65603256225586, "global_step": 428901, "epoch": 2552} {"train_loss": -12.589003562927246, "global_step": 428902, "epoch": 2552} {"train_loss": -12.334853149595714, "global_step": 428903, "epoch": 2552, "val_loss": 310827.46875} {"train_loss": -12.32293701171875, "global_step": 428904, "epoch": 2553} {"train_loss": -12.082258224487305, "global_step": 428905, "epoch": 2553} {"train_loss": -12.016483306884766, "global_step": 428906, "epoch": 2553} {"train_loss": -12.287070274353027, "global_step": 428907, "epoch": 2553} {"train_loss": -12.499407768249512, "global_step": 428908, "epoch": 2553} {"train_loss": -12.565729141235352, "global_step": 428909, "epoch": 2553} {"train_loss": -11.926680564880371, "global_step": 428910, "epoch": 2553} {"train_loss": -12.830976486206055, "global_step": 428911, "epoch": 2553} {"train_loss": -12.326801300048828, "global_step": 428912, "epoch": 2553} {"train_loss": -12.334115982055664, "global_step": 428913, "epoch": 2553} {"train_loss": -12.554817199707031, "global_step": 428914, "epoch": 2553} {"train_loss": -12.406219482421875, "global_step": 428915, "epoch": 2553} {"train_loss": -11.693825721740723, "global_step": 428916, "epoch": 2553} {"train_loss": -11.975010871887207, "global_step": 428917, "epoch": 2553} {"train_loss": -12.224780082702637, "global_step": 428918, "epoch": 2553} {"train_loss": -11.867420196533203, "global_step": 428919, "epoch": 2553} {"train_loss": -12.189719200134277, "global_step": 428920, "epoch": 2553} {"train_loss": -11.839300155639648, "global_step": 428921, "epoch": 2553} {"train_loss": -12.103548049926758, "global_step": 428922, "epoch": 2553} {"train_loss": -12.675100326538086, "global_step": 428923, "epoch": 2553} {"train_loss": -11.966882705688477, "global_step": 428924, "epoch": 2553} {"train_loss": -12.160860061645508, "global_step": 428925, "epoch": 2553} {"train_loss": -12.606797218322754, "global_step": 428926, "epoch": 2553} {"train_loss": -12.10527229309082, "global_step": 428927, "epoch": 2553} {"train_loss": -11.777491569519043, "global_step": 428928, "epoch": 2553} {"train_loss": -11.788341522216797, "global_step": 428929, "epoch": 2553} {"train_loss": -12.543642044067383, "global_step": 428930, "epoch": 2553} {"train_loss": -10.799125671386719, "global_step": 428931, "epoch": 2553} {"train_loss": -11.845726013183594, "global_step": 428932, "epoch": 2553} {"train_loss": -12.583392143249512, "global_step": 428933, "epoch": 2553} {"train_loss": -11.622525215148926, "global_step": 428934, "epoch": 2553} {"train_loss": -11.987075805664062, "global_step": 428935, "epoch": 2553} {"train_loss": -12.156579971313477, "global_step": 428936, "epoch": 2553} {"train_loss": -10.74658489227295, "global_step": 428937, "epoch": 2553} {"train_loss": -11.788286209106445, "global_step": 428938, "epoch": 2553} {"train_loss": -12.228273391723633, "global_step": 428939, "epoch": 2553} {"train_loss": -10.100066184997559, "global_step": 428940, "epoch": 2553} {"train_loss": -12.254096984863281, "global_step": 428941, "epoch": 2553} {"train_loss": -10.456026077270508, "global_step": 428942, "epoch": 2553} {"train_loss": -10.508001327514648, "global_step": 428943, "epoch": 2553} {"train_loss": -11.038215637207031, "global_step": 428944, "epoch": 2553} {"train_loss": -10.540324211120605, "global_step": 428945, "epoch": 2553} {"train_loss": -11.710775375366211, "global_step": 428946, "epoch": 2553} {"train_loss": -10.759867668151855, "global_step": 428947, "epoch": 2553} {"train_loss": -11.801267623901367, "global_step": 428948, "epoch": 2553} {"train_loss": -10.230511665344238, "global_step": 428949, "epoch": 2553} {"train_loss": -12.00727653503418, "global_step": 428950, "epoch": 2553} {"train_loss": -10.842101097106934, "global_step": 428951, "epoch": 2553} {"train_loss": -12.193374633789062, "global_step": 428952, "epoch": 2553} {"train_loss": -10.658454895019531, "global_step": 428953, "epoch": 2553} {"train_loss": -12.071633338928223, "global_step": 428954, "epoch": 2553} {"train_loss": -11.315377235412598, "global_step": 428955, "epoch": 2553} {"train_loss": -11.081859588623047, "global_step": 428956, "epoch": 2553} {"train_loss": -10.895471572875977, "global_step": 428957, "epoch": 2553} {"train_loss": -10.812124252319336, "global_step": 428958, "epoch": 2553} {"train_loss": -11.649364471435547, "global_step": 428959, "epoch": 2553} {"train_loss": -9.806074142456055, "global_step": 428960, "epoch": 2553} {"train_loss": -11.702434539794922, "global_step": 428961, "epoch": 2553} {"train_loss": -10.251153945922852, "global_step": 428962, "epoch": 2553} {"train_loss": -10.831336975097656, "global_step": 428963, "epoch": 2553} {"train_loss": -9.64920425415039, "global_step": 428964, "epoch": 2553} {"train_loss": -10.274066925048828, "global_step": 428965, "epoch": 2553} {"train_loss": -9.890792846679688, "global_step": 428966, "epoch": 2553} {"train_loss": -10.165800094604492, "global_step": 428967, "epoch": 2553} {"train_loss": -11.232316970825195, "global_step": 428968, "epoch": 2553} {"train_loss": -10.080253601074219, "global_step": 428969, "epoch": 2553} {"train_loss": -9.412537574768066, "global_step": 428970, "epoch": 2553} {"train_loss": -9.881145477294922, "global_step": 428971, "epoch": 2553} {"train_loss": -10.601186752319336, "global_step": 428972, "epoch": 2553} {"train_loss": -10.838847160339355, "global_step": 428973, "epoch": 2553} {"train_loss": -9.423944473266602, "global_step": 428974, "epoch": 2553} {"train_loss": -10.585027694702148, "global_step": 428975, "epoch": 2553} {"train_loss": -11.429422378540039, "global_step": 428976, "epoch": 2553} {"train_loss": -9.324578285217285, "global_step": 428977, "epoch": 2553} {"train_loss": -10.088235855102539, "global_step": 428978, "epoch": 2553} {"train_loss": -11.694597244262695, "global_step": 428979, "epoch": 2553} {"train_loss": -10.103902816772461, "global_step": 428980, "epoch": 2553} {"train_loss": -10.604761123657227, "global_step": 428981, "epoch": 2553} {"train_loss": -11.34986686706543, "global_step": 428982, "epoch": 2553} {"train_loss": -10.124945640563965, "global_step": 428983, "epoch": 2553} {"train_loss": -10.541011810302734, "global_step": 428984, "epoch": 2553} {"train_loss": -11.58690357208252, "global_step": 428985, "epoch": 2553} {"train_loss": -10.634563446044922, "global_step": 428986, "epoch": 2553} {"train_loss": -10.97385025024414, "global_step": 428987, "epoch": 2553} {"train_loss": -11.823614120483398, "global_step": 428988, "epoch": 2553} {"train_loss": -11.536215782165527, "global_step": 428989, "epoch": 2553} {"train_loss": -11.323945045471191, "global_step": 428990, "epoch": 2553} {"train_loss": -12.018138885498047, "global_step": 428991, "epoch": 2553} {"train_loss": -11.46377944946289, "global_step": 428992, "epoch": 2553} {"train_loss": -11.944486618041992, "global_step": 428993, "epoch": 2553} {"train_loss": -11.97542953491211, "global_step": 428994, "epoch": 2553} {"train_loss": -12.015885353088379, "global_step": 428995, "epoch": 2553} {"train_loss": -11.436155319213867, "global_step": 428996, "epoch": 2553} {"train_loss": -11.90866470336914, "global_step": 428997, "epoch": 2553} {"train_loss": -11.42264461517334, "global_step": 428998, "epoch": 2553} {"train_loss": -11.688475608825684, "global_step": 428999, "epoch": 2553} {"train_loss": -11.894290924072266, "global_step": 429000, "epoch": 2553} {"train_loss": -11.517561912536621, "global_step": 429001, "epoch": 2553} {"train_loss": -12.100817680358887, "global_step": 429002, "epoch": 2553} {"train_loss": -11.840700149536133, "global_step": 429003, "epoch": 2553} {"train_loss": -11.770194053649902, "global_step": 429004, "epoch": 2553} {"train_loss": -12.144660949707031, "global_step": 429005, "epoch": 2553} {"train_loss": -12.083646774291992, "global_step": 429006, "epoch": 2553} {"train_loss": -12.185038566589355, "global_step": 429007, "epoch": 2553} {"train_loss": -12.034676551818848, "global_step": 429008, "epoch": 2553} {"train_loss": -11.990933418273926, "global_step": 429009, "epoch": 2553} {"train_loss": -12.131589889526367, "global_step": 429010, "epoch": 2553} {"train_loss": -12.237726211547852, "global_step": 429011, "epoch": 2553} {"train_loss": -12.13786792755127, "global_step": 429012, "epoch": 2553} {"train_loss": -11.926902770996094, "global_step": 429013, "epoch": 2553} {"train_loss": -12.057511329650879, "global_step": 429014, "epoch": 2553} {"train_loss": -12.288633346557617, "global_step": 429015, "epoch": 2553} {"train_loss": -11.991508483886719, "global_step": 429016, "epoch": 2553} {"train_loss": -12.151801109313965, "global_step": 429017, "epoch": 2553} {"train_loss": -11.906404495239258, "global_step": 429018, "epoch": 2553} {"train_loss": -12.01675796508789, "global_step": 429019, "epoch": 2553} {"train_loss": -11.649456977844238, "global_step": 429020, "epoch": 2553} {"train_loss": -12.045937538146973, "global_step": 429021, "epoch": 2553} {"train_loss": -11.938186645507812, "global_step": 429022, "epoch": 2553} {"train_loss": -12.241083145141602, "global_step": 429023, "epoch": 2553} {"train_loss": -12.0988187789917, "global_step": 429024, "epoch": 2553} {"train_loss": -12.215230941772461, "global_step": 429025, "epoch": 2553} {"train_loss": -12.394710540771484, "global_step": 429026, "epoch": 2553} {"train_loss": -11.542303085327148, "global_step": 429027, "epoch": 2553} {"train_loss": -12.366849899291992, "global_step": 429028, "epoch": 2553} {"train_loss": -11.65221881866455, "global_step": 429029, "epoch": 2553} {"train_loss": -12.357723236083984, "global_step": 429030, "epoch": 2553} {"train_loss": -12.10192584991455, "global_step": 429031, "epoch": 2553} {"train_loss": -12.046623229980469, "global_step": 429032, "epoch": 2553} {"train_loss": -12.112829208374023, "global_step": 429033, "epoch": 2553} {"train_loss": -12.133377075195312, "global_step": 429034, "epoch": 2553} {"train_loss": -12.208444595336914, "global_step": 429035, "epoch": 2553} {"train_loss": -12.108203887939453, "global_step": 429036, "epoch": 2553} {"train_loss": -12.301834106445312, "global_step": 429037, "epoch": 2553} {"train_loss": -12.325624465942383, "global_step": 429038, "epoch": 2553} {"train_loss": -12.365351676940918, "global_step": 429039, "epoch": 2553} {"train_loss": -12.313393592834473, "global_step": 429040, "epoch": 2553} {"train_loss": -12.451208114624023, "global_step": 429041, "epoch": 2553} {"train_loss": -12.513826370239258, "global_step": 429042, "epoch": 2553} {"train_loss": -12.25285816192627, "global_step": 429043, "epoch": 2553} {"train_loss": -12.20040225982666, "global_step": 429044, "epoch": 2553} {"train_loss": -12.352025032043457, "global_step": 429045, "epoch": 2553} {"train_loss": -12.415410995483398, "global_step": 429046, "epoch": 2553} {"train_loss": -12.447265625, "global_step": 429047, "epoch": 2553} {"train_loss": -12.423542976379395, "global_step": 429048, "epoch": 2553} {"train_loss": -12.29047679901123, "global_step": 429049, "epoch": 2553} {"train_loss": -12.35500717163086, "global_step": 429050, "epoch": 2553} {"train_loss": -12.469025611877441, "global_step": 429051, "epoch": 2553} {"train_loss": -12.303717613220215, "global_step": 429052, "epoch": 2553} {"train_loss": -12.461749076843262, "global_step": 429053, "epoch": 2553} {"train_loss": -12.381839752197266, "global_step": 429054, "epoch": 2553} {"train_loss": -12.58875846862793, "global_step": 429055, "epoch": 2553} {"train_loss": -12.509212493896484, "global_step": 429056, "epoch": 2553} {"train_loss": -12.458040237426758, "global_step": 429057, "epoch": 2553} {"train_loss": -12.495328903198242, "global_step": 429058, "epoch": 2553} {"train_loss": -12.484221458435059, "global_step": 429059, "epoch": 2553} {"train_loss": -12.342161178588867, "global_step": 429060, "epoch": 2553} {"train_loss": -12.522104263305664, "global_step": 429061, "epoch": 2553} {"train_loss": -12.58791732788086, "global_step": 429062, "epoch": 2553} {"train_loss": -12.730603218078613, "global_step": 429063, "epoch": 2553} {"train_loss": -12.519989013671875, "global_step": 429064, "epoch": 2553} {"train_loss": -12.635726928710938, "global_step": 429065, "epoch": 2553} {"train_loss": -12.540168762207031, "global_step": 429066, "epoch": 2553} {"train_loss": -12.623106002807617, "global_step": 429067, "epoch": 2553} {"train_loss": -12.457643508911133, "global_step": 429068, "epoch": 2553} {"train_loss": -12.344491958618164, "global_step": 429069, "epoch": 2553} {"train_loss": -12.948914527893066, "global_step": 429070, "epoch": 2553} {"train_loss": -11.747184225491115, "global_step": 429071, "epoch": 2553, "val_loss": 309846.34375} {"train_loss": -11.901578903198242, "global_step": 429072, "epoch": 2554} {"train_loss": -12.405133247375488, "global_step": 429073, "epoch": 2554} {"train_loss": -12.423995018005371, "global_step": 429074, "epoch": 2554} {"train_loss": -11.886381149291992, "global_step": 429075, "epoch": 2554} {"train_loss": -12.023626327514648, "global_step": 429076, "epoch": 2554} {"train_loss": -12.453834533691406, "global_step": 429077, "epoch": 2554} {"train_loss": -11.493611335754395, "global_step": 429078, "epoch": 2554} {"train_loss": -11.810728073120117, "global_step": 429079, "epoch": 2554} {"train_loss": -12.486288070678711, "global_step": 429080, "epoch": 2554} {"train_loss": -11.34134578704834, "global_step": 429081, "epoch": 2554} {"train_loss": -11.281919479370117, "global_step": 429082, "epoch": 2554} {"train_loss": -12.567126274108887, "global_step": 429083, "epoch": 2554} {"train_loss": -12.070236206054688, "global_step": 429084, "epoch": 2554} {"train_loss": -12.645431518554688, "global_step": 429085, "epoch": 2554} {"train_loss": -12.163122177124023, "global_step": 429086, "epoch": 2554} {"train_loss": -12.518306732177734, "global_step": 429087, "epoch": 2554} {"train_loss": -12.337287902832031, "global_step": 429088, "epoch": 2554} {"train_loss": -12.645917892456055, "global_step": 429089, "epoch": 2554} {"train_loss": -12.538125038146973, "global_step": 429090, "epoch": 2554} {"train_loss": -12.5294189453125, "global_step": 429091, "epoch": 2554} {"train_loss": -12.385322570800781, "global_step": 429092, "epoch": 2554} {"train_loss": -12.537405014038086, "global_step": 429093, "epoch": 2554} {"train_loss": -12.335978507995605, "global_step": 429094, "epoch": 2554} {"train_loss": -12.613718032836914, "global_step": 429095, "epoch": 2554} {"train_loss": -12.705151557922363, "global_step": 429096, "epoch": 2554} {"train_loss": -12.544191360473633, "global_step": 429097, "epoch": 2554} {"train_loss": -12.739980697631836, "global_step": 429098, "epoch": 2554} {"train_loss": -12.74616813659668, "global_step": 429099, "epoch": 2554} {"train_loss": -12.595125198364258, "global_step": 429100, "epoch": 2554} {"train_loss": -12.642221450805664, "global_step": 429101, "epoch": 2554} {"train_loss": -12.572135925292969, "global_step": 429102, "epoch": 2554} {"train_loss": -12.57234001159668, "global_step": 429103, "epoch": 2554} {"train_loss": -12.794958114624023, "global_step": 429104, "epoch": 2554} {"train_loss": -12.698768615722656, "global_step": 429105, "epoch": 2554} {"train_loss": -12.680713653564453, "global_step": 429106, "epoch": 2554} {"train_loss": -12.598600387573242, "global_step": 429107, "epoch": 2554} {"train_loss": -12.610296249389648, "global_step": 429108, "epoch": 2554} {"train_loss": -12.707792282104492, "global_step": 429109, "epoch": 2554} {"train_loss": -12.714889526367188, "global_step": 429110, "epoch": 2554} {"train_loss": -12.624979019165039, "global_step": 429111, "epoch": 2554} {"train_loss": -12.668100357055664, "global_step": 429112, "epoch": 2554} {"train_loss": -12.607879638671875, "global_step": 429113, "epoch": 2554} {"train_loss": -12.628591537475586, "global_step": 429114, "epoch": 2554} {"train_loss": -12.683612823486328, "global_step": 429115, "epoch": 2554} {"train_loss": -12.49519157409668, "global_step": 429116, "epoch": 2554} {"train_loss": -12.580409049987793, "global_step": 429117, "epoch": 2554} {"train_loss": -12.749074935913086, "global_step": 429118, "epoch": 2554} {"train_loss": -12.489845275878906, "global_step": 429119, "epoch": 2554} {"train_loss": -12.58548355102539, "global_step": 429120, "epoch": 2554} {"train_loss": -12.762809753417969, "global_step": 429121, "epoch": 2554} {"train_loss": -12.922961235046387, "global_step": 429122, "epoch": 2554} {"train_loss": -12.592174530029297, "global_step": 429123, "epoch": 2554} {"train_loss": -12.524826049804688, "global_step": 429124, "epoch": 2554} {"train_loss": -12.720049858093262, "global_step": 429125, "epoch": 2554} {"train_loss": -12.35245132446289, "global_step": 429126, "epoch": 2554} {"train_loss": -12.698305130004883, "global_step": 429127, "epoch": 2554} {"train_loss": -12.369775772094727, "global_step": 429128, "epoch": 2554} {"train_loss": -12.167932510375977, "global_step": 429129, "epoch": 2554} {"train_loss": -11.996318817138672, "global_step": 429130, "epoch": 2554} {"train_loss": -12.105525970458984, "global_step": 429131, "epoch": 2554} {"train_loss": -12.40143871307373, "global_step": 429132, "epoch": 2554} {"train_loss": -12.420129776000977, "global_step": 429133, "epoch": 2554} {"train_loss": -12.495075225830078, "global_step": 429134, "epoch": 2554} {"train_loss": -12.650550842285156, "global_step": 429135, "epoch": 2554} {"train_loss": -11.794103622436523, "global_step": 429136, "epoch": 2554} {"train_loss": -11.313404083251953, "global_step": 429137, "epoch": 2554} {"train_loss": -11.045303344726562, "global_step": 429138, "epoch": 2554} {"train_loss": -11.110815048217773, "global_step": 429139, "epoch": 2554} {"train_loss": -11.476408004760742, "global_step": 429140, "epoch": 2554} {"train_loss": -12.130226135253906, "global_step": 429141, "epoch": 2554} {"train_loss": -10.687223434448242, "global_step": 429142, "epoch": 2554} {"train_loss": -12.227298736572266, "global_step": 429143, "epoch": 2554} {"train_loss": -10.76118278503418, "global_step": 429144, "epoch": 2554} {"train_loss": -11.751461029052734, "global_step": 429145, "epoch": 2554} {"train_loss": -11.892662048339844, "global_step": 429146, "epoch": 2554} {"train_loss": -11.591941833496094, "global_step": 429147, "epoch": 2554} {"train_loss": -11.93684196472168, "global_step": 429148, "epoch": 2554} {"train_loss": -11.80474853515625, "global_step": 429149, "epoch": 2554} {"train_loss": -11.422473907470703, "global_step": 429150, "epoch": 2554} {"train_loss": -11.516834259033203, "global_step": 429151, "epoch": 2554} {"train_loss": -11.746861457824707, "global_step": 429152, "epoch": 2554} {"train_loss": -11.998336791992188, "global_step": 429153, "epoch": 2554} {"train_loss": -12.441995620727539, "global_step": 429154, "epoch": 2554} {"train_loss": -11.89133071899414, "global_step": 429155, "epoch": 2554} {"train_loss": -12.326089859008789, "global_step": 429156, "epoch": 2554} {"train_loss": -12.141013145446777, "global_step": 429157, "epoch": 2554} {"train_loss": -12.183208465576172, "global_step": 429158, "epoch": 2554} {"train_loss": -12.334563255310059, "global_step": 429159, "epoch": 2554} {"train_loss": -12.427424430847168, "global_step": 429160, "epoch": 2554} {"train_loss": -12.504104614257812, "global_step": 429161, "epoch": 2554} {"train_loss": -12.297900199890137, "global_step": 429162, "epoch": 2554} {"train_loss": -12.229280471801758, "global_step": 429163, "epoch": 2554} {"train_loss": -12.232813835144043, "global_step": 429164, "epoch": 2554} {"train_loss": -12.690414428710938, "global_step": 429165, "epoch": 2554} {"train_loss": -12.224884033203125, "global_step": 429166, "epoch": 2554} {"train_loss": -12.398818969726562, "global_step": 429167, "epoch": 2554} {"train_loss": -11.996339797973633, "global_step": 429168, "epoch": 2554} {"train_loss": -12.500605583190918, "global_step": 429169, "epoch": 2554} {"train_loss": -11.877992630004883, "global_step": 429170, "epoch": 2554} {"train_loss": -12.516419410705566, "global_step": 429171, "epoch": 2554} {"train_loss": -12.046279907226562, "global_step": 429172, "epoch": 2554} {"train_loss": -12.3251953125, "global_step": 429173, "epoch": 2554} {"train_loss": -12.566682815551758, "global_step": 429174, "epoch": 2554} {"train_loss": -12.392036437988281, "global_step": 429175, "epoch": 2554} {"train_loss": -12.400676727294922, "global_step": 429176, "epoch": 2554} {"train_loss": -12.367204666137695, "global_step": 429177, "epoch": 2554} {"train_loss": -12.423848152160645, "global_step": 429178, "epoch": 2554} {"train_loss": -12.349020004272461, "global_step": 429179, "epoch": 2554} {"train_loss": -12.62436294555664, "global_step": 429180, "epoch": 2554} {"train_loss": -12.51829719543457, "global_step": 429181, "epoch": 2554} {"train_loss": -12.212520599365234, "global_step": 429182, "epoch": 2554} {"train_loss": -12.674971580505371, "global_step": 429183, "epoch": 2554} {"train_loss": -12.57335090637207, "global_step": 429184, "epoch": 2554} {"train_loss": -12.063533782958984, "global_step": 429185, "epoch": 2554} {"train_loss": -12.834222793579102, "global_step": 429186, "epoch": 2554} {"train_loss": -12.353191375732422, "global_step": 429187, "epoch": 2554} {"train_loss": -12.239112854003906, "global_step": 429188, "epoch": 2554} {"train_loss": -12.334493637084961, "global_step": 429189, "epoch": 2554} {"train_loss": -12.153030395507812, "global_step": 429190, "epoch": 2554} {"train_loss": -12.407617568969727, "global_step": 429191, "epoch": 2554} {"train_loss": -12.351439476013184, "global_step": 429192, "epoch": 2554} {"train_loss": -12.305778503417969, "global_step": 429193, "epoch": 2554} {"train_loss": -12.024192810058594, "global_step": 429194, "epoch": 2554} {"train_loss": -12.48542308807373, "global_step": 429195, "epoch": 2554} {"train_loss": -12.239113807678223, "global_step": 429196, "epoch": 2554} {"train_loss": -12.650086402893066, "global_step": 429197, "epoch": 2554} {"train_loss": -12.393230438232422, "global_step": 429198, "epoch": 2554} {"train_loss": -12.243589401245117, "global_step": 429199, "epoch": 2554} {"train_loss": -12.437023162841797, "global_step": 429200, "epoch": 2554} {"train_loss": -12.672961235046387, "global_step": 429201, "epoch": 2554} {"train_loss": -12.44636344909668, "global_step": 429202, "epoch": 2554} {"train_loss": -12.660709381103516, "global_step": 429203, "epoch": 2554} {"train_loss": -12.52022933959961, "global_step": 429204, "epoch": 2554} {"train_loss": -12.788522720336914, "global_step": 429205, "epoch": 2554} {"train_loss": -12.527305603027344, "global_step": 429206, "epoch": 2554} {"train_loss": -12.307825088500977, "global_step": 429207, "epoch": 2554} {"train_loss": -12.578550338745117, "global_step": 429208, "epoch": 2554} {"train_loss": -12.73898696899414, "global_step": 429209, "epoch": 2554} {"train_loss": -12.344813346862793, "global_step": 429210, "epoch": 2554} {"train_loss": -12.02519416809082, "global_step": 429211, "epoch": 2554} {"train_loss": -12.391971588134766, "global_step": 429212, "epoch": 2554} {"train_loss": -11.605718612670898, "global_step": 429213, "epoch": 2554} {"train_loss": -12.367359161376953, "global_step": 429214, "epoch": 2554} {"train_loss": -12.158851623535156, "global_step": 429215, "epoch": 2554} {"train_loss": -11.55745792388916, "global_step": 429216, "epoch": 2554} {"train_loss": -12.733893394470215, "global_step": 429217, "epoch": 2554} {"train_loss": -11.804740905761719, "global_step": 429218, "epoch": 2554} {"train_loss": -12.568897247314453, "global_step": 429219, "epoch": 2554} {"train_loss": -12.27033805847168, "global_step": 429220, "epoch": 2554} {"train_loss": -11.77403450012207, "global_step": 429221, "epoch": 2554} {"train_loss": -12.07247257232666, "global_step": 429222, "epoch": 2554} {"train_loss": -11.469961166381836, "global_step": 429223, "epoch": 2554} {"train_loss": -11.685859680175781, "global_step": 429224, "epoch": 2554} {"train_loss": -11.341438293457031, "global_step": 429225, "epoch": 2554} {"train_loss": -11.703784942626953, "global_step": 429226, "epoch": 2554} {"train_loss": -11.89395523071289, "global_step": 429227, "epoch": 2554} {"train_loss": -11.494028091430664, "global_step": 429228, "epoch": 2554} {"train_loss": -11.998987197875977, "global_step": 429229, "epoch": 2554} {"train_loss": -11.667906761169434, "global_step": 429230, "epoch": 2554} {"train_loss": -12.208824157714844, "global_step": 429231, "epoch": 2554} {"train_loss": -12.101511001586914, "global_step": 429232, "epoch": 2554} {"train_loss": -11.46358871459961, "global_step": 429233, "epoch": 2554} {"train_loss": -11.454988479614258, "global_step": 429234, "epoch": 2554} {"train_loss": -12.426246643066406, "global_step": 429235, "epoch": 2554} {"train_loss": -11.435750007629395, "global_step": 429236, "epoch": 2554} {"train_loss": -11.86745834350586, "global_step": 429237, "epoch": 2554} {"train_loss": -11.52571964263916, "global_step": 429238, "epoch": 2554} {"train_loss": -12.233585976418995, "global_step": 429239, "epoch": 2554, "val_loss": 312846.375} {"train_loss": -12.150300979614258, "global_step": 429240, "epoch": 2555} {"train_loss": -10.957404136657715, "global_step": 429241, "epoch": 2555} {"train_loss": -12.278997421264648, "global_step": 429242, "epoch": 2555} {"train_loss": -11.212653160095215, "global_step": 429243, "epoch": 2555} {"train_loss": -11.13821029663086, "global_step": 429244, "epoch": 2555} {"train_loss": -11.880671501159668, "global_step": 429245, "epoch": 2555} {"train_loss": -10.743579864501953, "global_step": 429246, "epoch": 2555} {"train_loss": -11.829615592956543, "global_step": 429247, "epoch": 2555} {"train_loss": -11.256765365600586, "global_step": 429248, "epoch": 2555} {"train_loss": -12.080842971801758, "global_step": 429249, "epoch": 2555} {"train_loss": -11.127500534057617, "global_step": 429250, "epoch": 2555} {"train_loss": -12.455953598022461, "global_step": 429251, "epoch": 2555} {"train_loss": -11.27912425994873, "global_step": 429252, "epoch": 2555} {"train_loss": -11.897183418273926, "global_step": 429253, "epoch": 2555} {"train_loss": -11.454628944396973, "global_step": 429254, "epoch": 2555} {"train_loss": -12.128259658813477, "global_step": 429255, "epoch": 2555} {"train_loss": -12.040745735168457, "global_step": 429256, "epoch": 2555} {"train_loss": -11.483163833618164, "global_step": 429257, "epoch": 2555} {"train_loss": -12.072654724121094, "global_step": 429258, "epoch": 2555} {"train_loss": -12.033794403076172, "global_step": 429259, "epoch": 2555} {"train_loss": -11.88470458984375, "global_step": 429260, "epoch": 2555} {"train_loss": -12.245676040649414, "global_step": 429261, "epoch": 2555} {"train_loss": -12.14745807647705, "global_step": 429262, "epoch": 2555} {"train_loss": -12.346698760986328, "global_step": 429263, "epoch": 2555} {"train_loss": -11.739847183227539, "global_step": 429264, "epoch": 2555} {"train_loss": -12.311727523803711, "global_step": 429265, "epoch": 2555} {"train_loss": -11.928740501403809, "global_step": 429266, "epoch": 2555} {"train_loss": -12.226204872131348, "global_step": 429267, "epoch": 2555} {"train_loss": -12.02685546875, "global_step": 429268, "epoch": 2555} {"train_loss": -12.347637176513672, "global_step": 429269, "epoch": 2555} {"train_loss": -12.09920883178711, "global_step": 429270, "epoch": 2555} {"train_loss": -12.333532333374023, "global_step": 429271, "epoch": 2555} {"train_loss": -12.105758666992188, "global_step": 429272, "epoch": 2555} {"train_loss": -12.319971084594727, "global_step": 429273, "epoch": 2555} {"train_loss": -12.340292930603027, "global_step": 429274, "epoch": 2555} {"train_loss": -12.035115242004395, "global_step": 429275, "epoch": 2555} {"train_loss": -12.215498924255371, "global_step": 429276, "epoch": 2555} {"train_loss": -12.373823165893555, "global_step": 429277, "epoch": 2555} {"train_loss": -11.676619529724121, "global_step": 429278, "epoch": 2555} {"train_loss": -12.59400749206543, "global_step": 429279, "epoch": 2555} {"train_loss": -11.939240455627441, "global_step": 429280, "epoch": 2555} {"train_loss": -12.14006519317627, "global_step": 429281, "epoch": 2555} {"train_loss": -11.910324096679688, "global_step": 429282, "epoch": 2555} {"train_loss": -12.318323135375977, "global_step": 429283, "epoch": 2555} {"train_loss": -12.039857864379883, "global_step": 429284, "epoch": 2555} {"train_loss": -12.158079147338867, "global_step": 429285, "epoch": 2555} {"train_loss": -11.940397262573242, "global_step": 429286, "epoch": 2555} {"train_loss": -12.428525924682617, "global_step": 429287, "epoch": 2555} {"train_loss": -12.107314109802246, "global_step": 429288, "epoch": 2555} {"train_loss": -12.597402572631836, "global_step": 429289, "epoch": 2555} {"train_loss": -12.011667251586914, "global_step": 429290, "epoch": 2555} {"train_loss": -12.328815460205078, "global_step": 429291, "epoch": 2555} {"train_loss": -12.14123821258545, "global_step": 429292, "epoch": 2555} {"train_loss": -12.304927825927734, "global_step": 429293, "epoch": 2555} {"train_loss": -12.255229949951172, "global_step": 429294, "epoch": 2555} {"train_loss": -12.209526062011719, "global_step": 429295, "epoch": 2555} {"train_loss": -12.068766593933105, "global_step": 429296, "epoch": 2555} {"train_loss": -11.791848182678223, "global_step": 429297, "epoch": 2555} {"train_loss": -12.168868064880371, "global_step": 429298, "epoch": 2555} {"train_loss": -11.548503875732422, "global_step": 429299, "epoch": 2555} {"train_loss": -12.119983673095703, "global_step": 429300, "epoch": 2555} {"train_loss": -11.835304260253906, "global_step": 429301, "epoch": 2555} {"train_loss": -11.017380714416504, "global_step": 429302, "epoch": 2555} {"train_loss": -11.484145164489746, "global_step": 429303, "epoch": 2555} {"train_loss": -10.044309616088867, "global_step": 429304, "epoch": 2555} {"train_loss": -10.431785583496094, "global_step": 429305, "epoch": 2555} {"train_loss": -11.743489265441895, "global_step": 429306, "epoch": 2555} {"train_loss": -10.894010543823242, "global_step": 429307, "epoch": 2555} {"train_loss": -12.014726638793945, "global_step": 429308, "epoch": 2555} {"train_loss": -11.49476432800293, "global_step": 429309, "epoch": 2555} {"train_loss": -11.708040237426758, "global_step": 429310, "epoch": 2555} {"train_loss": -11.379002571105957, "global_step": 429311, "epoch": 2555} {"train_loss": -11.182825088500977, "global_step": 429312, "epoch": 2555} {"train_loss": -11.521088600158691, "global_step": 429313, "epoch": 2555} {"train_loss": -11.063392639160156, "global_step": 429314, "epoch": 2555} {"train_loss": -10.900091171264648, "global_step": 429315, "epoch": 2555} {"train_loss": -11.299083709716797, "global_step": 429316, "epoch": 2555} {"train_loss": -12.090686798095703, "global_step": 429317, "epoch": 2555} {"train_loss": -12.233553886413574, "global_step": 429318, "epoch": 2555} {"train_loss": -12.11577033996582, "global_step": 429319, "epoch": 2555} {"train_loss": -12.112103462219238, "global_step": 429320, "epoch": 2555} {"train_loss": -12.040458679199219, "global_step": 429321, "epoch": 2555} {"train_loss": -11.793529510498047, "global_step": 429322, "epoch": 2555} {"train_loss": -11.917631149291992, "global_step": 429323, "epoch": 2555} {"train_loss": -12.37338924407959, "global_step": 429324, "epoch": 2555} {"train_loss": -12.049267768859863, "global_step": 429325, "epoch": 2555} {"train_loss": -12.354374885559082, "global_step": 429326, "epoch": 2555} {"train_loss": -11.974363327026367, "global_step": 429327, "epoch": 2555} {"train_loss": -12.354774475097656, "global_step": 429328, "epoch": 2555} {"train_loss": -12.082447052001953, "global_step": 429329, "epoch": 2555} {"train_loss": -12.280630111694336, "global_step": 429330, "epoch": 2555} {"train_loss": -12.49569320678711, "global_step": 429331, "epoch": 2555} {"train_loss": -12.270442962646484, "global_step": 429332, "epoch": 2555} {"train_loss": -12.225406646728516, "global_step": 429333, "epoch": 2555} {"train_loss": -12.379148483276367, "global_step": 429334, "epoch": 2555} {"train_loss": -12.310590744018555, "global_step": 429335, "epoch": 2555} {"train_loss": -12.13199520111084, "global_step": 429336, "epoch": 2555} {"train_loss": -12.518943786621094, "global_step": 429337, "epoch": 2555} {"train_loss": -12.22586727142334, "global_step": 429338, "epoch": 2555} {"train_loss": -12.565513610839844, "global_step": 429339, "epoch": 2555} {"train_loss": -12.677512168884277, "global_step": 429340, "epoch": 2555} {"train_loss": -12.764982223510742, "global_step": 429341, "epoch": 2555} {"train_loss": -12.639113426208496, "global_step": 429342, "epoch": 2555} {"train_loss": -12.452098846435547, "global_step": 429343, "epoch": 2555} {"train_loss": -12.729101181030273, "global_step": 429344, "epoch": 2555} {"train_loss": -12.4273099899292, "global_step": 429345, "epoch": 2555} {"train_loss": -12.505549430847168, "global_step": 429346, "epoch": 2555} {"train_loss": -12.575796127319336, "global_step": 429347, "epoch": 2555} {"train_loss": -12.45434284210205, "global_step": 429348, "epoch": 2555} {"train_loss": -12.268577575683594, "global_step": 429349, "epoch": 2555} {"train_loss": -12.244522094726562, "global_step": 429350, "epoch": 2555} {"train_loss": -12.027711868286133, "global_step": 429351, "epoch": 2555} {"train_loss": -12.705486297607422, "global_step": 429352, "epoch": 2555} {"train_loss": -12.241803169250488, "global_step": 429353, "epoch": 2555} {"train_loss": -12.560663223266602, "global_step": 429354, "epoch": 2555} {"train_loss": -12.164615631103516, "global_step": 429355, "epoch": 2555} {"train_loss": -12.676170349121094, "global_step": 429356, "epoch": 2555} {"train_loss": -12.551152229309082, "global_step": 429357, "epoch": 2555} {"train_loss": -12.557886123657227, "global_step": 429358, "epoch": 2555} {"train_loss": -12.595266342163086, "global_step": 429359, "epoch": 2555} {"train_loss": -12.515837669372559, "global_step": 429360, "epoch": 2555} {"train_loss": -12.771306037902832, "global_step": 429361, "epoch": 2555} {"train_loss": -12.77098274230957, "global_step": 429362, "epoch": 2555} {"train_loss": -12.726119995117188, "global_step": 429363, "epoch": 2555} {"train_loss": -12.327427864074707, "global_step": 429364, "epoch": 2555} {"train_loss": -12.661262512207031, "global_step": 429365, "epoch": 2555} {"train_loss": -12.586617469787598, "global_step": 429366, "epoch": 2555} {"train_loss": -12.660538673400879, "global_step": 429367, "epoch": 2555} {"train_loss": -12.762849807739258, "global_step": 429368, "epoch": 2555} {"train_loss": -12.524524688720703, "global_step": 429369, "epoch": 2555} {"train_loss": -12.537538528442383, "global_step": 429370, "epoch": 2555} {"train_loss": -12.855987548828125, "global_step": 429371, "epoch": 2555} {"train_loss": -12.472578048706055, "global_step": 429372, "epoch": 2555} {"train_loss": -12.530973434448242, "global_step": 429373, "epoch": 2555} {"train_loss": -12.625925064086914, "global_step": 429374, "epoch": 2555} {"train_loss": -12.538312911987305, "global_step": 429375, "epoch": 2555} {"train_loss": -12.68738842010498, "global_step": 429376, "epoch": 2555} {"train_loss": -12.85038948059082, "global_step": 429377, "epoch": 2555} {"train_loss": -12.652498245239258, "global_step": 429378, "epoch": 2555} {"train_loss": -12.479747772216797, "global_step": 429379, "epoch": 2555} {"train_loss": -12.712116241455078, "global_step": 429380, "epoch": 2555} {"train_loss": -12.739420890808105, "global_step": 429381, "epoch": 2555} {"train_loss": -12.764453887939453, "global_step": 429382, "epoch": 2555} {"train_loss": -12.486540794372559, "global_step": 429383, "epoch": 2555} {"train_loss": -12.570280075073242, "global_step": 429384, "epoch": 2555} {"train_loss": -12.546831130981445, "global_step": 429385, "epoch": 2555} {"train_loss": -11.849756240844727, "global_step": 429386, "epoch": 2555} {"train_loss": -11.742423057556152, "global_step": 429387, "epoch": 2555} {"train_loss": -12.39456558227539, "global_step": 429388, "epoch": 2555} {"train_loss": -11.880526542663574, "global_step": 429389, "epoch": 2555} {"train_loss": -12.107213020324707, "global_step": 429390, "epoch": 2555} {"train_loss": -12.376264572143555, "global_step": 429391, "epoch": 2555} {"train_loss": -11.48673152923584, "global_step": 429392, "epoch": 2555} {"train_loss": -11.590253829956055, "global_step": 429393, "epoch": 2555} {"train_loss": -12.316082954406738, "global_step": 429394, "epoch": 2555} {"train_loss": -11.664661407470703, "global_step": 429395, "epoch": 2555} {"train_loss": -11.729728698730469, "global_step": 429396, "epoch": 2555} {"train_loss": -12.458362579345703, "global_step": 429397, "epoch": 2555} {"train_loss": -11.77774429321289, "global_step": 429398, "epoch": 2555} {"train_loss": -11.401390075683594, "global_step": 429399, "epoch": 2555} {"train_loss": -12.36502456665039, "global_step": 429400, "epoch": 2555} {"train_loss": -10.621267318725586, "global_step": 429401, "epoch": 2555} {"train_loss": -12.21696662902832, "global_step": 429402, "epoch": 2555} {"train_loss": -11.645998001098633, "global_step": 429403, "epoch": 2555} {"train_loss": -11.5278902053833, "global_step": 429404, "epoch": 2555} {"train_loss": -12.53541374206543, "global_step": 429405, "epoch": 2555} {"train_loss": -11.76969051361084, "global_step": 429406, "epoch": 2555} {"train_loss": -12.094942109925407, "global_step": 429407, "epoch": 2555, "val_loss": 310045.71875, "train_action_mse_error": 1.6296573877334595} {"train_loss": -12.183491706848145, "global_step": 429408, "epoch": 2556} {"train_loss": -11.369430541992188, "global_step": 429409, "epoch": 2556} {"train_loss": -11.986553192138672, "global_step": 429410, "epoch": 2556} {"train_loss": -11.335790634155273, "global_step": 429411, "epoch": 2556} {"train_loss": -11.709195137023926, "global_step": 429412, "epoch": 2556} {"train_loss": -11.443903923034668, "global_step": 429413, "epoch": 2556} {"train_loss": -10.333681106567383, "global_step": 429414, "epoch": 2556} {"train_loss": -11.797934532165527, "global_step": 429415, "epoch": 2556} {"train_loss": -10.782755851745605, "global_step": 429416, "epoch": 2556} {"train_loss": -10.461578369140625, "global_step": 429417, "epoch": 2556} {"train_loss": -10.599170684814453, "global_step": 429418, "epoch": 2556} {"train_loss": -11.717581748962402, "global_step": 429419, "epoch": 2556} {"train_loss": -10.420302391052246, "global_step": 429420, "epoch": 2556} {"train_loss": -10.63290023803711, "global_step": 429421, "epoch": 2556} {"train_loss": -10.252447128295898, "global_step": 429422, "epoch": 2556} {"train_loss": -10.922072410583496, "global_step": 429423, "epoch": 2556} {"train_loss": -10.977459907531738, "global_step": 429424, "epoch": 2556} {"train_loss": -11.92837142944336, "global_step": 429425, "epoch": 2556} {"train_loss": -11.99264907836914, "global_step": 429426, "epoch": 2556} {"train_loss": -12.062304496765137, "global_step": 429427, "epoch": 2556} {"train_loss": -12.076961517333984, "global_step": 429428, "epoch": 2556} {"train_loss": -12.061656951904297, "global_step": 429429, "epoch": 2556} {"train_loss": -11.592057228088379, "global_step": 429430, "epoch": 2556} {"train_loss": -11.55899715423584, "global_step": 429431, "epoch": 2556} {"train_loss": -11.85302448272705, "global_step": 429432, "epoch": 2556} {"train_loss": -10.410524368286133, "global_step": 429433, "epoch": 2556} {"train_loss": -12.454635620117188, "global_step": 429434, "epoch": 2556} {"train_loss": -11.511300086975098, "global_step": 429435, "epoch": 2556} {"train_loss": -11.530884742736816, "global_step": 429436, "epoch": 2556} {"train_loss": -11.856609344482422, "global_step": 429437, "epoch": 2556} {"train_loss": -11.157252311706543, "global_step": 429438, "epoch": 2556} {"train_loss": -11.914863586425781, "global_step": 429439, "epoch": 2556} {"train_loss": -11.950139999389648, "global_step": 429440, "epoch": 2556} {"train_loss": -12.209383010864258, "global_step": 429441, "epoch": 2556} {"train_loss": -11.842424392700195, "global_step": 429442, "epoch": 2556} {"train_loss": -12.01310920715332, "global_step": 429443, "epoch": 2556} {"train_loss": -11.934944152832031, "global_step": 429444, "epoch": 2556} {"train_loss": -12.33541488647461, "global_step": 429445, "epoch": 2556} {"train_loss": -12.014321327209473, "global_step": 429446, "epoch": 2556} {"train_loss": -11.81267261505127, "global_step": 429447, "epoch": 2556} {"train_loss": -11.7108154296875, "global_step": 429448, "epoch": 2556} {"train_loss": -11.868843078613281, "global_step": 429449, "epoch": 2556} {"train_loss": -12.18026351928711, "global_step": 429450, "epoch": 2556} {"train_loss": -10.909147262573242, "global_step": 429451, "epoch": 2556} {"train_loss": -12.102716445922852, "global_step": 429452, "epoch": 2556} {"train_loss": -11.618281364440918, "global_step": 429453, "epoch": 2556} {"train_loss": -12.37826156616211, "global_step": 429454, "epoch": 2556} {"train_loss": -12.284263610839844, "global_step": 429455, "epoch": 2556} {"train_loss": -12.118656158447266, "global_step": 429456, "epoch": 2556} {"train_loss": -12.203691482543945, "global_step": 429457, "epoch": 2556} {"train_loss": -12.033222198486328, "global_step": 429458, "epoch": 2556} {"train_loss": -12.057990074157715, "global_step": 429459, "epoch": 2556} {"train_loss": -12.37836742401123, "global_step": 429460, "epoch": 2556} {"train_loss": -12.199040412902832, "global_step": 429461, "epoch": 2556} {"train_loss": -12.48883056640625, "global_step": 429462, "epoch": 2556} {"train_loss": -12.072738647460938, "global_step": 429463, "epoch": 2556} {"train_loss": -12.642281532287598, "global_step": 429464, "epoch": 2556} {"train_loss": -12.450738906860352, "global_step": 429465, "epoch": 2556} {"train_loss": -12.275339126586914, "global_step": 429466, "epoch": 2556} {"train_loss": -12.407082557678223, "global_step": 429467, "epoch": 2556} {"train_loss": -12.529572486877441, "global_step": 429468, "epoch": 2556} {"train_loss": -12.499914169311523, "global_step": 429469, "epoch": 2556} {"train_loss": -12.551334381103516, "global_step": 429470, "epoch": 2556} {"train_loss": -12.5299711227417, "global_step": 429471, "epoch": 2556} {"train_loss": -12.42835807800293, "global_step": 429472, "epoch": 2556} {"train_loss": -12.382667541503906, "global_step": 429473, "epoch": 2556} {"train_loss": -12.344612121582031, "global_step": 429474, "epoch": 2556} {"train_loss": -12.269039154052734, "global_step": 429475, "epoch": 2556} {"train_loss": -12.308082580566406, "global_step": 429476, "epoch": 2556} {"train_loss": -12.327587127685547, "global_step": 429477, "epoch": 2556} {"train_loss": -11.935027122497559, "global_step": 429478, "epoch": 2556} {"train_loss": -12.40027141571045, "global_step": 429479, "epoch": 2556} {"train_loss": -12.539419174194336, "global_step": 429480, "epoch": 2556} {"train_loss": -12.388753890991211, "global_step": 429481, "epoch": 2556} {"train_loss": -12.568918228149414, "global_step": 429482, "epoch": 2556} {"train_loss": -12.55465030670166, "global_step": 429483, "epoch": 2556} {"train_loss": -12.363081932067871, "global_step": 429484, "epoch": 2556} {"train_loss": -12.382757186889648, "global_step": 429485, "epoch": 2556} {"train_loss": -12.436527252197266, "global_step": 429486, "epoch": 2556} {"train_loss": -12.683113098144531, "global_step": 429487, "epoch": 2556} {"train_loss": -12.65902042388916, "global_step": 429488, "epoch": 2556} {"train_loss": -12.65774917602539, "global_step": 429489, "epoch": 2556} {"train_loss": -12.419608116149902, "global_step": 429490, "epoch": 2556} {"train_loss": -12.297374725341797, "global_step": 429491, "epoch": 2556} {"train_loss": -12.833518981933594, "global_step": 429492, "epoch": 2556} {"train_loss": -12.287559509277344, "global_step": 429493, "epoch": 2556} {"train_loss": -12.072511672973633, "global_step": 429494, "epoch": 2556} {"train_loss": -12.174836158752441, "global_step": 429495, "epoch": 2556} {"train_loss": -12.52684211730957, "global_step": 429496, "epoch": 2556} {"train_loss": -12.175475120544434, "global_step": 429497, "epoch": 2556} {"train_loss": -12.142349243164062, "global_step": 429498, "epoch": 2556} {"train_loss": -12.256826400756836, "global_step": 429499, "epoch": 2556} {"train_loss": -12.676036834716797, "global_step": 429500, "epoch": 2556} {"train_loss": -12.254119873046875, "global_step": 429501, "epoch": 2556} {"train_loss": -12.356969833374023, "global_step": 429502, "epoch": 2556} {"train_loss": -12.593381881713867, "global_step": 429503, "epoch": 2556} {"train_loss": -12.229087829589844, "global_step": 429504, "epoch": 2556} {"train_loss": -11.297750473022461, "global_step": 429505, "epoch": 2556} {"train_loss": -12.02334976196289, "global_step": 429506, "epoch": 2556} {"train_loss": -12.521345138549805, "global_step": 429507, "epoch": 2556} {"train_loss": -11.753912925720215, "global_step": 429508, "epoch": 2556} {"train_loss": -11.068207740783691, "global_step": 429509, "epoch": 2556} {"train_loss": -10.738941192626953, "global_step": 429510, "epoch": 2556} {"train_loss": -12.143529891967773, "global_step": 429511, "epoch": 2556} {"train_loss": -11.612852096557617, "global_step": 429512, "epoch": 2556} {"train_loss": -11.533958435058594, "global_step": 429513, "epoch": 2556} {"train_loss": -11.569128036499023, "global_step": 429514, "epoch": 2556} {"train_loss": -11.858072280883789, "global_step": 429515, "epoch": 2556} {"train_loss": -10.800546646118164, "global_step": 429516, "epoch": 2556} {"train_loss": -12.64259147644043, "global_step": 429517, "epoch": 2556} {"train_loss": -10.981536865234375, "global_step": 429518, "epoch": 2556} {"train_loss": -11.837808609008789, "global_step": 429519, "epoch": 2556} {"train_loss": -11.945262908935547, "global_step": 429520, "epoch": 2556} {"train_loss": -10.772478103637695, "global_step": 429521, "epoch": 2556} {"train_loss": -12.14143180847168, "global_step": 429522, "epoch": 2556} {"train_loss": -11.092560768127441, "global_step": 429523, "epoch": 2556} {"train_loss": -12.034163475036621, "global_step": 429524, "epoch": 2556} {"train_loss": -11.322946548461914, "global_step": 429525, "epoch": 2556} {"train_loss": -12.27918815612793, "global_step": 429526, "epoch": 2556} {"train_loss": -11.614386558532715, "global_step": 429527, "epoch": 2556} {"train_loss": -11.386848449707031, "global_step": 429528, "epoch": 2556} {"train_loss": -12.00723648071289, "global_step": 429529, "epoch": 2556} {"train_loss": -12.152615547180176, "global_step": 429530, "epoch": 2556} {"train_loss": -11.820240020751953, "global_step": 429531, "epoch": 2556} {"train_loss": -12.195730209350586, "global_step": 429532, "epoch": 2556} {"train_loss": -12.140400886535645, "global_step": 429533, "epoch": 2556} {"train_loss": -12.359838485717773, "global_step": 429534, "epoch": 2556} {"train_loss": -11.968839645385742, "global_step": 429535, "epoch": 2556} {"train_loss": -12.274796485900879, "global_step": 429536, "epoch": 2556} {"train_loss": -12.32791519165039, "global_step": 429537, "epoch": 2556} {"train_loss": -12.207298278808594, "global_step": 429538, "epoch": 2556} {"train_loss": -12.221789360046387, "global_step": 429539, "epoch": 2556} {"train_loss": -12.219825744628906, "global_step": 429540, "epoch": 2556} {"train_loss": -11.469244003295898, "global_step": 429541, "epoch": 2556} {"train_loss": -12.008800506591797, "global_step": 429542, "epoch": 2556} {"train_loss": -11.893720626831055, "global_step": 429543, "epoch": 2556} {"train_loss": -11.779688835144043, "global_step": 429544, "epoch": 2556} {"train_loss": -12.247530937194824, "global_step": 429545, "epoch": 2556} {"train_loss": -11.784062385559082, "global_step": 429546, "epoch": 2556} {"train_loss": -12.5396146774292, "global_step": 429547, "epoch": 2556} {"train_loss": -11.517352104187012, "global_step": 429548, "epoch": 2556} {"train_loss": -12.091060638427734, "global_step": 429549, "epoch": 2556} {"train_loss": -11.585065841674805, "global_step": 429550, "epoch": 2556} {"train_loss": -12.235004425048828, "global_step": 429551, "epoch": 2556} {"train_loss": -12.211177825927734, "global_step": 429552, "epoch": 2556} {"train_loss": -12.250381469726562, "global_step": 429553, "epoch": 2556} {"train_loss": -12.045236587524414, "global_step": 429554, "epoch": 2556} {"train_loss": -12.05871868133545, "global_step": 429555, "epoch": 2556} {"train_loss": -12.408679962158203, "global_step": 429556, "epoch": 2556} {"train_loss": -12.003329277038574, "global_step": 429557, "epoch": 2556} {"train_loss": -12.558780670166016, "global_step": 429558, "epoch": 2556} {"train_loss": -12.050714492797852, "global_step": 429559, "epoch": 2556} {"train_loss": -12.65312385559082, "global_step": 429560, "epoch": 2556} {"train_loss": -12.367332458496094, "global_step": 429561, "epoch": 2556} {"train_loss": -12.49635124206543, "global_step": 429562, "epoch": 2556} {"train_loss": -12.686356544494629, "global_step": 429563, "epoch": 2556} {"train_loss": -12.59107780456543, "global_step": 429564, "epoch": 2556} {"train_loss": -12.516016960144043, "global_step": 429565, "epoch": 2556} {"train_loss": -12.085050582885742, "global_step": 429566, "epoch": 2556} {"train_loss": -12.698856353759766, "global_step": 429567, "epoch": 2556} {"train_loss": -12.31181526184082, "global_step": 429568, "epoch": 2556} {"train_loss": -12.640743255615234, "global_step": 429569, "epoch": 2556} {"train_loss": -12.329167366027832, "global_step": 429570, "epoch": 2556} {"train_loss": -12.490264892578125, "global_step": 429571, "epoch": 2556} {"train_loss": -12.456555366516113, "global_step": 429572, "epoch": 2556} {"train_loss": -12.451322555541992, "global_step": 429573, "epoch": 2556} {"train_loss": -12.44183349609375, "global_step": 429574, "epoch": 2556} {"train_loss": -11.998538942564101, "global_step": 429575, "epoch": 2556, "val_loss": 306177.1875} {"train_loss": -12.45119857788086, "global_step": 429576, "epoch": 2557} {"train_loss": -12.31803035736084, "global_step": 429577, "epoch": 2557} {"train_loss": -12.650985717773438, "global_step": 429578, "epoch": 2557} {"train_loss": -12.428325653076172, "global_step": 429579, "epoch": 2557} {"train_loss": -12.645622253417969, "global_step": 429580, "epoch": 2557} {"train_loss": -12.8360595703125, "global_step": 429581, "epoch": 2557} {"train_loss": -12.576141357421875, "global_step": 429582, "epoch": 2557} {"train_loss": -12.727503776550293, "global_step": 429583, "epoch": 2557} {"train_loss": -12.654646873474121, "global_step": 429584, "epoch": 2557} {"train_loss": -12.787105560302734, "global_step": 429585, "epoch": 2557} {"train_loss": -12.705910682678223, "global_step": 429586, "epoch": 2557} {"train_loss": -12.845874786376953, "global_step": 429587, "epoch": 2557} {"train_loss": -12.920367240905762, "global_step": 429588, "epoch": 2557} {"train_loss": -12.52192497253418, "global_step": 429589, "epoch": 2557} {"train_loss": -12.686164855957031, "global_step": 429590, "epoch": 2557} {"train_loss": -12.622390747070312, "global_step": 429591, "epoch": 2557} {"train_loss": -12.768075942993164, "global_step": 429592, "epoch": 2557} {"train_loss": -12.491792678833008, "global_step": 429593, "epoch": 2557} {"train_loss": -12.542486190795898, "global_step": 429594, "epoch": 2557} {"train_loss": -12.650205612182617, "global_step": 429595, "epoch": 2557} {"train_loss": -12.531350135803223, "global_step": 429596, "epoch": 2557} {"train_loss": -12.77522087097168, "global_step": 429597, "epoch": 2557} {"train_loss": -12.708065032958984, "global_step": 429598, "epoch": 2557} {"train_loss": -12.536620140075684, "global_step": 429599, "epoch": 2557} {"train_loss": -12.79898452758789, "global_step": 429600, "epoch": 2557} {"train_loss": -12.526922225952148, "global_step": 429601, "epoch": 2557} {"train_loss": -12.718505859375, "global_step": 429602, "epoch": 2557} {"train_loss": -12.668453216552734, "global_step": 429603, "epoch": 2557} {"train_loss": -12.650876998901367, "global_step": 429604, "epoch": 2557} {"train_loss": -12.6370849609375, "global_step": 429605, "epoch": 2557} {"train_loss": -12.831212997436523, "global_step": 429606, "epoch": 2557} {"train_loss": -12.930438995361328, "global_step": 429607, "epoch": 2557} {"train_loss": -12.639385223388672, "global_step": 429608, "epoch": 2557} {"train_loss": -12.379676818847656, "global_step": 429609, "epoch": 2557} {"train_loss": -12.695873260498047, "global_step": 429610, "epoch": 2557} {"train_loss": -12.497493743896484, "global_step": 429611, "epoch": 2557} {"train_loss": -12.850031852722168, "global_step": 429612, "epoch": 2557} {"train_loss": -12.797479629516602, "global_step": 429613, "epoch": 2557} {"train_loss": -12.941588401794434, "global_step": 429614, "epoch": 2557} {"train_loss": -12.940650939941406, "global_step": 429615, "epoch": 2557} {"train_loss": -12.741693496704102, "global_step": 429616, "epoch": 2557} {"train_loss": -12.701062202453613, "global_step": 429617, "epoch": 2557} {"train_loss": -12.642457008361816, "global_step": 429618, "epoch": 2557} {"train_loss": -12.667276382446289, "global_step": 429619, "epoch": 2557} {"train_loss": -12.175782203674316, "global_step": 429620, "epoch": 2557} {"train_loss": -12.702252388000488, "global_step": 429621, "epoch": 2557} {"train_loss": -12.938661575317383, "global_step": 429622, "epoch": 2557} {"train_loss": -12.592011451721191, "global_step": 429623, "epoch": 2557} {"train_loss": -13.059274673461914, "global_step": 429624, "epoch": 2557} {"train_loss": -12.81941032409668, "global_step": 429625, "epoch": 2557} {"train_loss": -13.14333724975586, "global_step": 429626, "epoch": 2557} {"train_loss": -12.53062915802002, "global_step": 429627, "epoch": 2557} {"train_loss": -12.771450996398926, "global_step": 429628, "epoch": 2557} {"train_loss": -13.088648796081543, "global_step": 429629, "epoch": 2557} {"train_loss": -12.951656341552734, "global_step": 429630, "epoch": 2557} {"train_loss": -12.596654891967773, "global_step": 429631, "epoch": 2557} {"train_loss": -12.267899513244629, "global_step": 429632, "epoch": 2557} {"train_loss": -12.585456848144531, "global_step": 429633, "epoch": 2557} {"train_loss": -12.715372085571289, "global_step": 429634, "epoch": 2557} {"train_loss": -12.896268844604492, "global_step": 429635, "epoch": 2557} {"train_loss": -12.254724502563477, "global_step": 429636, "epoch": 2557} {"train_loss": -12.714925765991211, "global_step": 429637, "epoch": 2557} {"train_loss": -12.422731399536133, "global_step": 429638, "epoch": 2557} {"train_loss": -12.236804962158203, "global_step": 429639, "epoch": 2557} {"train_loss": -12.816692352294922, "global_step": 429640, "epoch": 2557} {"train_loss": -12.167709350585938, "global_step": 429641, "epoch": 2557} {"train_loss": -11.777143478393555, "global_step": 429642, "epoch": 2557} {"train_loss": -12.408153533935547, "global_step": 429643, "epoch": 2557} {"train_loss": -12.591841697692871, "global_step": 429644, "epoch": 2557} {"train_loss": -12.535662651062012, "global_step": 429645, "epoch": 2557} {"train_loss": -12.332259178161621, "global_step": 429646, "epoch": 2557} {"train_loss": -12.250555038452148, "global_step": 429647, "epoch": 2557} {"train_loss": -11.694242477416992, "global_step": 429648, "epoch": 2557} {"train_loss": -11.903569221496582, "global_step": 429649, "epoch": 2557} {"train_loss": -12.221879959106445, "global_step": 429650, "epoch": 2557} {"train_loss": -10.177833557128906, "global_step": 429651, "epoch": 2557} {"train_loss": -11.193406105041504, "global_step": 429652, "epoch": 2557} {"train_loss": -9.92904281616211, "global_step": 429653, "epoch": 2557} {"train_loss": -12.225252151489258, "global_step": 429654, "epoch": 2557} {"train_loss": -9.580430030822754, "global_step": 429655, "epoch": 2557} {"train_loss": -11.104887962341309, "global_step": 429656, "epoch": 2557} {"train_loss": -10.122026443481445, "global_step": 429657, "epoch": 2557} {"train_loss": -9.883273124694824, "global_step": 429658, "epoch": 2557} {"train_loss": -11.526412963867188, "global_step": 429659, "epoch": 2557} {"train_loss": -10.321943283081055, "global_step": 429660, "epoch": 2557} {"train_loss": -9.160676956176758, "global_step": 429661, "epoch": 2557} {"train_loss": -10.508862495422363, "global_step": 429662, "epoch": 2557} {"train_loss": -10.618288040161133, "global_step": 429663, "epoch": 2557} {"train_loss": -9.239152908325195, "global_step": 429664, "epoch": 2557} {"train_loss": -9.062664031982422, "global_step": 429665, "epoch": 2557} {"train_loss": -10.909817695617676, "global_step": 429666, "epoch": 2557} {"train_loss": -9.493852615356445, "global_step": 429667, "epoch": 2557} {"train_loss": -10.439921379089355, "global_step": 429668, "epoch": 2557} {"train_loss": -10.666071891784668, "global_step": 429669, "epoch": 2557} {"train_loss": -9.69221019744873, "global_step": 429670, "epoch": 2557} {"train_loss": -9.17228889465332, "global_step": 429671, "epoch": 2557} {"train_loss": -11.904184341430664, "global_step": 429672, "epoch": 2557} {"train_loss": -9.059494018554688, "global_step": 429673, "epoch": 2557} {"train_loss": -10.164478302001953, "global_step": 429674, "epoch": 2557} {"train_loss": -8.762771606445312, "global_step": 429675, "epoch": 2557} {"train_loss": -9.51983642578125, "global_step": 429676, "epoch": 2557} {"train_loss": -9.283008575439453, "global_step": 429677, "epoch": 2557} {"train_loss": -10.274120330810547, "global_step": 429678, "epoch": 2557} {"train_loss": -10.788615226745605, "global_step": 429679, "epoch": 2557} {"train_loss": -8.994030952453613, "global_step": 429680, "epoch": 2557} {"train_loss": -9.09254264831543, "global_step": 429681, "epoch": 2557} {"train_loss": -11.109186172485352, "global_step": 429682, "epoch": 2557} {"train_loss": -9.158523559570312, "global_step": 429683, "epoch": 2557} {"train_loss": -8.920541763305664, "global_step": 429684, "epoch": 2557} {"train_loss": -9.42567253112793, "global_step": 429685, "epoch": 2557} {"train_loss": -10.467069625854492, "global_step": 429686, "epoch": 2557} {"train_loss": -9.341522216796875, "global_step": 429687, "epoch": 2557} {"train_loss": -9.485054969787598, "global_step": 429688, "epoch": 2557} {"train_loss": -8.998221397399902, "global_step": 429689, "epoch": 2557} {"train_loss": -8.181816101074219, "global_step": 429690, "epoch": 2557} {"train_loss": -9.745658874511719, "global_step": 429691, "epoch": 2557} {"train_loss": -9.731002807617188, "global_step": 429692, "epoch": 2557} {"train_loss": -9.240921020507812, "global_step": 429693, "epoch": 2557} {"train_loss": -11.210175514221191, "global_step": 429694, "epoch": 2557} {"train_loss": -10.361108779907227, "global_step": 429695, "epoch": 2557} {"train_loss": -11.420448303222656, "global_step": 429696, "epoch": 2557} {"train_loss": -10.556440353393555, "global_step": 429697, "epoch": 2557} {"train_loss": -10.910860061645508, "global_step": 429698, "epoch": 2557} {"train_loss": -10.714472770690918, "global_step": 429699, "epoch": 2557} {"train_loss": -11.410819053649902, "global_step": 429700, "epoch": 2557} {"train_loss": -11.375568389892578, "global_step": 429701, "epoch": 2557} {"train_loss": -10.827556610107422, "global_step": 429702, "epoch": 2557} {"train_loss": -11.713891983032227, "global_step": 429703, "epoch": 2557} {"train_loss": -11.051055908203125, "global_step": 429704, "epoch": 2557} {"train_loss": -10.951459884643555, "global_step": 429705, "epoch": 2557} {"train_loss": -11.673331260681152, "global_step": 429706, "epoch": 2557} {"train_loss": -11.029861450195312, "global_step": 429707, "epoch": 2557} {"train_loss": -11.572898864746094, "global_step": 429708, "epoch": 2557} {"train_loss": -11.370782852172852, "global_step": 429709, "epoch": 2557} {"train_loss": -11.61978530883789, "global_step": 429710, "epoch": 2557} {"train_loss": -11.403000831604004, "global_step": 429711, "epoch": 2557} {"train_loss": -11.853435516357422, "global_step": 429712, "epoch": 2557} {"train_loss": -11.743465423583984, "global_step": 429713, "epoch": 2557} {"train_loss": -11.348365783691406, "global_step": 429714, "epoch": 2557} {"train_loss": -12.00519847869873, "global_step": 429715, "epoch": 2557} {"train_loss": -11.622973442077637, "global_step": 429716, "epoch": 2557} {"train_loss": -11.703094482421875, "global_step": 429717, "epoch": 2557} {"train_loss": -11.85568904876709, "global_step": 429718, "epoch": 2557} {"train_loss": -11.682035446166992, "global_step": 429719, "epoch": 2557} {"train_loss": -11.58769416809082, "global_step": 429720, "epoch": 2557} {"train_loss": -11.784076690673828, "global_step": 429721, "epoch": 2557} {"train_loss": -12.08954906463623, "global_step": 429722, "epoch": 2557} {"train_loss": -11.755941390991211, "global_step": 429723, "epoch": 2557} {"train_loss": -11.669224739074707, "global_step": 429724, "epoch": 2557} {"train_loss": -12.137466430664062, "global_step": 429725, "epoch": 2557} {"train_loss": -11.769782066345215, "global_step": 429726, "epoch": 2557} {"train_loss": -12.31067943572998, "global_step": 429727, "epoch": 2557} {"train_loss": -12.198934555053711, "global_step": 429728, "epoch": 2557} {"train_loss": -12.09328842163086, "global_step": 429729, "epoch": 2557} {"train_loss": -12.347848892211914, "global_step": 429730, "epoch": 2557} {"train_loss": -12.388997077941895, "global_step": 429731, "epoch": 2557} {"train_loss": -12.23275089263916, "global_step": 429732, "epoch": 2557} {"train_loss": -12.326745986938477, "global_step": 429733, "epoch": 2557} {"train_loss": -11.892004013061523, "global_step": 429734, "epoch": 2557} {"train_loss": -12.332380294799805, "global_step": 429735, "epoch": 2557} {"train_loss": -12.317069053649902, "global_step": 429736, "epoch": 2557} {"train_loss": -12.337507247924805, "global_step": 429737, "epoch": 2557} {"train_loss": -12.21689510345459, "global_step": 429738, "epoch": 2557} {"train_loss": -12.41092586517334, "global_step": 429739, "epoch": 2557} {"train_loss": -12.363273620605469, "global_step": 429740, "epoch": 2557} {"train_loss": -12.312546730041504, "global_step": 429741, "epoch": 2557} {"train_loss": -12.31740951538086, "global_step": 429742, "epoch": 2557} {"train_loss": -11.659550008319673, "global_step": 429743, "epoch": 2557, "val_loss": 309216.46875} {"train_loss": -12.270378112792969, "global_step": 429744, "epoch": 2558} {"train_loss": -12.362218856811523, "global_step": 429745, "epoch": 2558} {"train_loss": -12.341437339782715, "global_step": 429746, "epoch": 2558} {"train_loss": -12.576210021972656, "global_step": 429747, "epoch": 2558} {"train_loss": -12.57408332824707, "global_step": 429748, "epoch": 2558} {"train_loss": -12.381143569946289, "global_step": 429749, "epoch": 2558} {"train_loss": -12.494256973266602, "global_step": 429750, "epoch": 2558} {"train_loss": -12.617042541503906, "global_step": 429751, "epoch": 2558} {"train_loss": -12.5838623046875, "global_step": 429752, "epoch": 2558} {"train_loss": -12.636401176452637, "global_step": 429753, "epoch": 2558} {"train_loss": -12.418377876281738, "global_step": 429754, "epoch": 2558} {"train_loss": -12.436493873596191, "global_step": 429755, "epoch": 2558} {"train_loss": -12.623931884765625, "global_step": 429756, "epoch": 2558} {"train_loss": -12.43940544128418, "global_step": 429757, "epoch": 2558} {"train_loss": -12.454822540283203, "global_step": 429758, "epoch": 2558} {"train_loss": -12.549701690673828, "global_step": 429759, "epoch": 2558} {"train_loss": -12.72575569152832, "global_step": 429760, "epoch": 2558} {"train_loss": -12.7876615524292, "global_step": 429761, "epoch": 2558} {"train_loss": -12.605566024780273, "global_step": 429762, "epoch": 2558} {"train_loss": -12.720386505126953, "global_step": 429763, "epoch": 2558} {"train_loss": -12.67078971862793, "global_step": 429764, "epoch": 2558} {"train_loss": -12.754322052001953, "global_step": 429765, "epoch": 2558} {"train_loss": -12.510147094726562, "global_step": 429766, "epoch": 2558} {"train_loss": -12.638933181762695, "global_step": 429767, "epoch": 2558} {"train_loss": -12.679402351379395, "global_step": 429768, "epoch": 2558} {"train_loss": -12.624558448791504, "global_step": 429769, "epoch": 2558} {"train_loss": -12.736635208129883, "global_step": 429770, "epoch": 2558} {"train_loss": -12.662860870361328, "global_step": 429771, "epoch": 2558} {"train_loss": -12.709548950195312, "global_step": 429772, "epoch": 2558} {"train_loss": -12.896419525146484, "global_step": 429773, "epoch": 2558} {"train_loss": -12.727746963500977, "global_step": 429774, "epoch": 2558} {"train_loss": -12.560388565063477, "global_step": 429775, "epoch": 2558} {"train_loss": -12.511478424072266, "global_step": 429776, "epoch": 2558} {"train_loss": -12.688035011291504, "global_step": 429777, "epoch": 2558} {"train_loss": -12.786163330078125, "global_step": 429778, "epoch": 2558} {"train_loss": -12.920012474060059, "global_step": 429779, "epoch": 2558} {"train_loss": -12.701696395874023, "global_step": 429780, "epoch": 2558} {"train_loss": -12.709781646728516, "global_step": 429781, "epoch": 2558} {"train_loss": -12.38096809387207, "global_step": 429782, "epoch": 2558} {"train_loss": -12.503423690795898, "global_step": 429783, "epoch": 2558} {"train_loss": -12.660693168640137, "global_step": 429784, "epoch": 2558} {"train_loss": -12.763427734375, "global_step": 429785, "epoch": 2558} {"train_loss": -12.833311080932617, "global_step": 429786, "epoch": 2558} {"train_loss": -12.6942777633667, "global_step": 429787, "epoch": 2558} {"train_loss": -12.755293846130371, "global_step": 429788, "epoch": 2558} {"train_loss": -12.747245788574219, "global_step": 429789, "epoch": 2558} {"train_loss": -12.41578483581543, "global_step": 429790, "epoch": 2558} {"train_loss": -12.760391235351562, "global_step": 429791, "epoch": 2558} {"train_loss": -12.911478042602539, "global_step": 429792, "epoch": 2558} {"train_loss": -12.737225532531738, "global_step": 429793, "epoch": 2558} {"train_loss": -12.991242408752441, "global_step": 429794, "epoch": 2558} {"train_loss": -12.855820655822754, "global_step": 429795, "epoch": 2558} {"train_loss": -12.893421173095703, "global_step": 429796, "epoch": 2558} {"train_loss": -12.739971160888672, "global_step": 429797, "epoch": 2558} {"train_loss": -12.590742111206055, "global_step": 429798, "epoch": 2558} {"train_loss": -12.51729965209961, "global_step": 429799, "epoch": 2558} {"train_loss": -12.672704696655273, "global_step": 429800, "epoch": 2558} {"train_loss": -12.781217575073242, "global_step": 429801, "epoch": 2558} {"train_loss": -11.834306716918945, "global_step": 429802, "epoch": 2558} {"train_loss": -11.352465629577637, "global_step": 429803, "epoch": 2558} {"train_loss": -12.288158416748047, "global_step": 429804, "epoch": 2558} {"train_loss": -11.471834182739258, "global_step": 429805, "epoch": 2558} {"train_loss": -9.793102264404297, "global_step": 429806, "epoch": 2558} {"train_loss": -10.270458221435547, "global_step": 429807, "epoch": 2558} {"train_loss": -10.686941146850586, "global_step": 429808, "epoch": 2558} {"train_loss": -10.334112167358398, "global_step": 429809, "epoch": 2558} {"train_loss": -11.708293914794922, "global_step": 429810, "epoch": 2558} {"train_loss": -11.511661529541016, "global_step": 429811, "epoch": 2558} {"train_loss": -11.700002670288086, "global_step": 429812, "epoch": 2558} {"train_loss": -11.861326217651367, "global_step": 429813, "epoch": 2558} {"train_loss": -11.87386417388916, "global_step": 429814, "epoch": 2558} {"train_loss": -12.259468078613281, "global_step": 429815, "epoch": 2558} {"train_loss": -11.469282150268555, "global_step": 429816, "epoch": 2558} {"train_loss": -10.996485710144043, "global_step": 429817, "epoch": 2558} {"train_loss": -11.157401084899902, "global_step": 429818, "epoch": 2558} {"train_loss": -10.89077091217041, "global_step": 429819, "epoch": 2558} {"train_loss": -11.253657341003418, "global_step": 429820, "epoch": 2558} {"train_loss": -10.799412727355957, "global_step": 429821, "epoch": 2558} {"train_loss": -11.923497200012207, "global_step": 429822, "epoch": 2558} {"train_loss": -11.280736923217773, "global_step": 429823, "epoch": 2558} {"train_loss": -12.556245803833008, "global_step": 429824, "epoch": 2558} {"train_loss": -11.151618003845215, "global_step": 429825, "epoch": 2558} {"train_loss": -12.27013111114502, "global_step": 429826, "epoch": 2558} {"train_loss": -11.624608039855957, "global_step": 429827, "epoch": 2558} {"train_loss": -12.212488174438477, "global_step": 429828, "epoch": 2558} {"train_loss": -11.880180358886719, "global_step": 429829, "epoch": 2558} {"train_loss": -12.145466804504395, "global_step": 429830, "epoch": 2558} {"train_loss": -12.237838745117188, "global_step": 429831, "epoch": 2558} {"train_loss": -11.836976051330566, "global_step": 429832, "epoch": 2558} {"train_loss": -12.484183311462402, "global_step": 429833, "epoch": 2558} {"train_loss": -11.993191719055176, "global_step": 429834, "epoch": 2558} {"train_loss": -12.026603698730469, "global_step": 429835, "epoch": 2558} {"train_loss": -11.899505615234375, "global_step": 429836, "epoch": 2558} {"train_loss": -11.749662399291992, "global_step": 429837, "epoch": 2558} {"train_loss": -11.521419525146484, "global_step": 429838, "epoch": 2558} {"train_loss": -10.488794326782227, "global_step": 429839, "epoch": 2558} {"train_loss": -11.858152389526367, "global_step": 429840, "epoch": 2558} {"train_loss": -10.920862197875977, "global_step": 429841, "epoch": 2558} {"train_loss": -11.711268424987793, "global_step": 429842, "epoch": 2558} {"train_loss": -11.528029441833496, "global_step": 429843, "epoch": 2558} {"train_loss": -11.095878601074219, "global_step": 429844, "epoch": 2558} {"train_loss": -11.727851867675781, "global_step": 429845, "epoch": 2558} {"train_loss": -10.608261108398438, "global_step": 429846, "epoch": 2558} {"train_loss": -10.235529899597168, "global_step": 429847, "epoch": 2558} {"train_loss": -11.964600563049316, "global_step": 429848, "epoch": 2558} {"train_loss": -11.597084045410156, "global_step": 429849, "epoch": 2558} {"train_loss": -11.665628433227539, "global_step": 429850, "epoch": 2558} {"train_loss": -11.540803909301758, "global_step": 429851, "epoch": 2558} {"train_loss": -11.92119312286377, "global_step": 429852, "epoch": 2558} {"train_loss": -11.32298469543457, "global_step": 429853, "epoch": 2558} {"train_loss": -11.452327728271484, "global_step": 429854, "epoch": 2558} {"train_loss": -10.961297035217285, "global_step": 429855, "epoch": 2558} {"train_loss": -11.098184585571289, "global_step": 429856, "epoch": 2558} {"train_loss": -11.411428451538086, "global_step": 429857, "epoch": 2558} {"train_loss": -11.422247886657715, "global_step": 429858, "epoch": 2558} {"train_loss": -11.944917678833008, "global_step": 429859, "epoch": 2558} {"train_loss": -11.56856632232666, "global_step": 429860, "epoch": 2558} {"train_loss": -11.904728889465332, "global_step": 429861, "epoch": 2558} {"train_loss": -11.139683723449707, "global_step": 429862, "epoch": 2558} {"train_loss": -10.714017868041992, "global_step": 429863, "epoch": 2558} {"train_loss": -11.647295951843262, "global_step": 429864, "epoch": 2558} {"train_loss": -11.117761611938477, "global_step": 429865, "epoch": 2558} {"train_loss": -11.718338012695312, "global_step": 429866, "epoch": 2558} {"train_loss": -11.590843200683594, "global_step": 429867, "epoch": 2558} {"train_loss": -11.819295883178711, "global_step": 429868, "epoch": 2558} {"train_loss": -12.22115707397461, "global_step": 429869, "epoch": 2558} {"train_loss": -11.609813690185547, "global_step": 429870, "epoch": 2558} {"train_loss": -12.151540756225586, "global_step": 429871, "epoch": 2558} {"train_loss": -11.409283638000488, "global_step": 429872, "epoch": 2558} {"train_loss": -11.99045181274414, "global_step": 429873, "epoch": 2558} {"train_loss": -11.862109184265137, "global_step": 429874, "epoch": 2558} {"train_loss": -11.947860717773438, "global_step": 429875, "epoch": 2558} {"train_loss": -12.140209197998047, "global_step": 429876, "epoch": 2558} {"train_loss": -11.871953964233398, "global_step": 429877, "epoch": 2558} {"train_loss": -11.616815567016602, "global_step": 429878, "epoch": 2558} {"train_loss": -11.449235916137695, "global_step": 429879, "epoch": 2558} {"train_loss": -11.775199890136719, "global_step": 429880, "epoch": 2558} {"train_loss": -11.107046127319336, "global_step": 429881, "epoch": 2558} {"train_loss": -11.668781280517578, "global_step": 429882, "epoch": 2558} {"train_loss": -11.352471351623535, "global_step": 429883, "epoch": 2558} {"train_loss": -12.289932250976562, "global_step": 429884, "epoch": 2558} {"train_loss": -11.291154861450195, "global_step": 429885, "epoch": 2558} {"train_loss": -11.977399826049805, "global_step": 429886, "epoch": 2558} {"train_loss": -12.01715087890625, "global_step": 429887, "epoch": 2558} {"train_loss": -11.65068531036377, "global_step": 429888, "epoch": 2558} {"train_loss": -12.260151863098145, "global_step": 429889, "epoch": 2558} {"train_loss": -11.192270278930664, "global_step": 429890, "epoch": 2558} {"train_loss": -11.808857917785645, "global_step": 429891, "epoch": 2558} {"train_loss": -11.900809288024902, "global_step": 429892, "epoch": 2558} {"train_loss": -11.464475631713867, "global_step": 429893, "epoch": 2558} {"train_loss": -12.375086784362793, "global_step": 429894, "epoch": 2558} {"train_loss": -11.985127449035645, "global_step": 429895, "epoch": 2558} {"train_loss": -12.348335266113281, "global_step": 429896, "epoch": 2558} {"train_loss": -12.112308502197266, "global_step": 429897, "epoch": 2558} {"train_loss": -11.982444763183594, "global_step": 429898, "epoch": 2558} {"train_loss": -12.505098342895508, "global_step": 429899, "epoch": 2558} {"train_loss": -12.261751174926758, "global_step": 429900, "epoch": 2558} {"train_loss": -12.161108016967773, "global_step": 429901, "epoch": 2558} {"train_loss": -12.538854598999023, "global_step": 429902, "epoch": 2558} {"train_loss": -12.261419296264648, "global_step": 429903, "epoch": 2558} {"train_loss": -12.358360290527344, "global_step": 429904, "epoch": 2558} {"train_loss": -12.445686340332031, "global_step": 429905, "epoch": 2558} {"train_loss": -12.399420738220215, "global_step": 429906, "epoch": 2558} {"train_loss": -12.480823516845703, "global_step": 429907, "epoch": 2558} {"train_loss": -12.278257369995117, "global_step": 429908, "epoch": 2558} {"train_loss": -12.47548770904541, "global_step": 429909, "epoch": 2558} {"train_loss": -12.192465782165527, "global_step": 429910, "epoch": 2558} {"train_loss": -12.018592034067426, "global_step": 429911, "epoch": 2558, "val_loss": 308114.125} {"train_loss": -12.09150505065918, "global_step": 429912, "epoch": 2559} {"train_loss": -12.678733825683594, "global_step": 429913, "epoch": 2559} {"train_loss": -12.454935073852539, "global_step": 429914, "epoch": 2559} {"train_loss": -12.409513473510742, "global_step": 429915, "epoch": 2559} {"train_loss": -12.517749786376953, "global_step": 429916, "epoch": 2559} {"train_loss": -12.284268379211426, "global_step": 429917, "epoch": 2559} {"train_loss": -12.684879302978516, "global_step": 429918, "epoch": 2559} {"train_loss": -12.528535842895508, "global_step": 429919, "epoch": 2559} {"train_loss": -12.762500762939453, "global_step": 429920, "epoch": 2559} {"train_loss": -12.612406730651855, "global_step": 429921, "epoch": 2559} {"train_loss": -12.719554901123047, "global_step": 429922, "epoch": 2559} {"train_loss": -12.662186622619629, "global_step": 429923, "epoch": 2559} {"train_loss": -12.57382869720459, "global_step": 429924, "epoch": 2559} {"train_loss": -12.601619720458984, "global_step": 429925, "epoch": 2559} {"train_loss": -12.618579864501953, "global_step": 429926, "epoch": 2559} {"train_loss": -12.606492042541504, "global_step": 429927, "epoch": 2559} {"train_loss": -12.828044891357422, "global_step": 429928, "epoch": 2559} {"train_loss": -12.766681671142578, "global_step": 429929, "epoch": 2559} {"train_loss": -12.739380836486816, "global_step": 429930, "epoch": 2559} {"train_loss": -12.618621826171875, "global_step": 429931, "epoch": 2559} {"train_loss": -12.652316093444824, "global_step": 429932, "epoch": 2559} {"train_loss": -12.696626663208008, "global_step": 429933, "epoch": 2559} {"train_loss": -12.421560287475586, "global_step": 429934, "epoch": 2559} {"train_loss": -12.720787048339844, "global_step": 429935, "epoch": 2559} {"train_loss": -12.55440902709961, "global_step": 429936, "epoch": 2559} {"train_loss": -12.719930648803711, "global_step": 429937, "epoch": 2559} {"train_loss": -12.781523704528809, "global_step": 429938, "epoch": 2559} {"train_loss": -12.672653198242188, "global_step": 429939, "epoch": 2559} {"train_loss": -12.874561309814453, "global_step": 429940, "epoch": 2559} {"train_loss": -12.747602462768555, "global_step": 429941, "epoch": 2559} {"train_loss": -12.72518539428711, "global_step": 429942, "epoch": 2559} {"train_loss": -12.707695007324219, "global_step": 429943, "epoch": 2559} {"train_loss": -12.65941047668457, "global_step": 429944, "epoch": 2559} {"train_loss": -12.786858558654785, "global_step": 429945, "epoch": 2559} {"train_loss": -12.786407470703125, "global_step": 429946, "epoch": 2559} {"train_loss": -12.593271255493164, "global_step": 429947, "epoch": 2559} {"train_loss": -12.71696949005127, "global_step": 429948, "epoch": 2559} {"train_loss": -12.850849151611328, "global_step": 429949, "epoch": 2559} {"train_loss": -12.434589385986328, "global_step": 429950, "epoch": 2559} {"train_loss": -12.826701164245605, "global_step": 429951, "epoch": 2559} {"train_loss": -12.800653457641602, "global_step": 429952, "epoch": 2559} {"train_loss": -12.540122985839844, "global_step": 429953, "epoch": 2559} {"train_loss": -12.667040824890137, "global_step": 429954, "epoch": 2559} {"train_loss": -12.859637260437012, "global_step": 429955, "epoch": 2559} {"train_loss": -12.683425903320312, "global_step": 429956, "epoch": 2559} {"train_loss": -12.723187446594238, "global_step": 429957, "epoch": 2559} {"train_loss": -12.922880172729492, "global_step": 429958, "epoch": 2559} {"train_loss": -12.519895553588867, "global_step": 429959, "epoch": 2559} {"train_loss": -12.647232055664062, "global_step": 429960, "epoch": 2559} {"train_loss": -12.842708587646484, "global_step": 429961, "epoch": 2559} {"train_loss": -12.73456859588623, "global_step": 429962, "epoch": 2559} {"train_loss": -12.569236755371094, "global_step": 429963, "epoch": 2559} {"train_loss": -12.731941223144531, "global_step": 429964, "epoch": 2559} {"train_loss": -12.943283081054688, "global_step": 429965, "epoch": 2559} {"train_loss": -12.497737884521484, "global_step": 429966, "epoch": 2559} {"train_loss": -12.435205459594727, "global_step": 429967, "epoch": 2559} {"train_loss": -12.754793167114258, "global_step": 429968, "epoch": 2559} {"train_loss": -12.694378852844238, "global_step": 429969, "epoch": 2559} {"train_loss": -12.261517524719238, "global_step": 429970, "epoch": 2559} {"train_loss": -12.62818717956543, "global_step": 429971, "epoch": 2559} {"train_loss": -12.624040603637695, "global_step": 429972, "epoch": 2559} {"train_loss": -12.587870597839355, "global_step": 429973, "epoch": 2559} {"train_loss": -12.658441543579102, "global_step": 429974, "epoch": 2559} {"train_loss": -12.708335876464844, "global_step": 429975, "epoch": 2559} {"train_loss": -12.869729995727539, "global_step": 429976, "epoch": 2559} {"train_loss": -12.745887756347656, "global_step": 429977, "epoch": 2559} {"train_loss": -12.588541030883789, "global_step": 429978, "epoch": 2559} {"train_loss": -11.949226379394531, "global_step": 429979, "epoch": 2559} {"train_loss": -12.593376159667969, "global_step": 429980, "epoch": 2559} {"train_loss": -12.224763870239258, "global_step": 429981, "epoch": 2559} {"train_loss": -12.23672103881836, "global_step": 429982, "epoch": 2559} {"train_loss": -11.227970123291016, "global_step": 429983, "epoch": 2559} {"train_loss": -12.490372657775879, "global_step": 429984, "epoch": 2559} {"train_loss": -11.831071853637695, "global_step": 429985, "epoch": 2559} {"train_loss": -11.925241470336914, "global_step": 429986, "epoch": 2559} {"train_loss": -11.988349914550781, "global_step": 429987, "epoch": 2559} {"train_loss": -11.886697769165039, "global_step": 429988, "epoch": 2559} {"train_loss": -12.025022506713867, "global_step": 429989, "epoch": 2559} {"train_loss": -11.835260391235352, "global_step": 429990, "epoch": 2559} {"train_loss": -12.121353149414062, "global_step": 429991, "epoch": 2559} {"train_loss": -12.20292854309082, "global_step": 429992, "epoch": 2559} {"train_loss": -12.532205581665039, "global_step": 429993, "epoch": 2559} {"train_loss": -12.398092269897461, "global_step": 429994, "epoch": 2559} {"train_loss": -12.798110008239746, "global_step": 429995, "epoch": 2559} {"train_loss": -12.31281852722168, "global_step": 429996, "epoch": 2559} {"train_loss": -12.09086799621582, "global_step": 429997, "epoch": 2559} {"train_loss": -11.985337257385254, "global_step": 429998, "epoch": 2559} {"train_loss": -12.390189170837402, "global_step": 429999, "epoch": 2559} {"train_loss": -12.351593971252441, "global_step": 430000, "epoch": 2559} {"train_loss": -12.262508392333984, "global_step": 430001, "epoch": 2559} {"train_loss": -11.708490371704102, "global_step": 430002, "epoch": 2559} {"train_loss": -11.688145637512207, "global_step": 430003, "epoch": 2559} {"train_loss": -12.113426208496094, "global_step": 430004, "epoch": 2559} {"train_loss": -12.140414237976074, "global_step": 430005, "epoch": 2559} {"train_loss": -12.000097274780273, "global_step": 430006, "epoch": 2559} {"train_loss": -11.378463745117188, "global_step": 430007, "epoch": 2559} {"train_loss": -12.3079252243042, "global_step": 430008, "epoch": 2559} {"train_loss": -11.201920509338379, "global_step": 430009, "epoch": 2559} {"train_loss": -10.265838623046875, "global_step": 430010, "epoch": 2559} {"train_loss": -11.979705810546875, "global_step": 430011, "epoch": 2559} {"train_loss": -11.477531433105469, "global_step": 430012, "epoch": 2559} {"train_loss": -10.06700325012207, "global_step": 430013, "epoch": 2559} {"train_loss": -11.44377326965332, "global_step": 430014, "epoch": 2559} {"train_loss": -10.92335319519043, "global_step": 430015, "epoch": 2559} {"train_loss": -9.865196228027344, "global_step": 430016, "epoch": 2559} {"train_loss": -9.56437873840332, "global_step": 430017, "epoch": 2559} {"train_loss": -10.054084777832031, "global_step": 430018, "epoch": 2559} {"train_loss": -10.018352508544922, "global_step": 430019, "epoch": 2559} {"train_loss": -9.57773494720459, "global_step": 430020, "epoch": 2559} {"train_loss": -10.137375831604004, "global_step": 430021, "epoch": 2559} {"train_loss": -10.058839797973633, "global_step": 430022, "epoch": 2559} {"train_loss": -9.167418479919434, "global_step": 430023, "epoch": 2559} {"train_loss": -10.391611099243164, "global_step": 430024, "epoch": 2559} {"train_loss": -10.953550338745117, "global_step": 430025, "epoch": 2559} {"train_loss": -10.83814811706543, "global_step": 430026, "epoch": 2559} {"train_loss": -11.169862747192383, "global_step": 430027, "epoch": 2559} {"train_loss": -11.366903305053711, "global_step": 430028, "epoch": 2559} {"train_loss": -11.595758438110352, "global_step": 430029, "epoch": 2559} {"train_loss": -11.774635314941406, "global_step": 430030, "epoch": 2559} {"train_loss": -11.550146102905273, "global_step": 430031, "epoch": 2559} {"train_loss": -11.296852111816406, "global_step": 430032, "epoch": 2559} {"train_loss": -12.091580390930176, "global_step": 430033, "epoch": 2559} {"train_loss": -11.324256896972656, "global_step": 430034, "epoch": 2559} {"train_loss": -11.853338241577148, "global_step": 430035, "epoch": 2559} {"train_loss": -11.189047813415527, "global_step": 430036, "epoch": 2559} {"train_loss": -11.98955249786377, "global_step": 430037, "epoch": 2559} {"train_loss": -11.777032852172852, "global_step": 430038, "epoch": 2559} {"train_loss": -11.623984336853027, "global_step": 430039, "epoch": 2559} {"train_loss": -11.910801887512207, "global_step": 430040, "epoch": 2559} {"train_loss": -11.289522171020508, "global_step": 430041, "epoch": 2559} {"train_loss": -11.95518684387207, "global_step": 430042, "epoch": 2559} {"train_loss": -11.87832260131836, "global_step": 430043, "epoch": 2559} {"train_loss": -11.778648376464844, "global_step": 430044, "epoch": 2559} {"train_loss": -11.721466064453125, "global_step": 430045, "epoch": 2559} {"train_loss": -11.97157096862793, "global_step": 430046, "epoch": 2559} {"train_loss": -12.34619140625, "global_step": 430047, "epoch": 2559} {"train_loss": -11.841262817382812, "global_step": 430048, "epoch": 2559} {"train_loss": -11.969574928283691, "global_step": 430049, "epoch": 2559} {"train_loss": -11.741434097290039, "global_step": 430050, "epoch": 2559} {"train_loss": -12.317829132080078, "global_step": 430051, "epoch": 2559} {"train_loss": -12.070127487182617, "global_step": 430052, "epoch": 2559} {"train_loss": -12.109575271606445, "global_step": 430053, "epoch": 2559} {"train_loss": -11.945536613464355, "global_step": 430054, "epoch": 2559} {"train_loss": -12.046829223632812, "global_step": 430055, "epoch": 2559} {"train_loss": -12.326059341430664, "global_step": 430056, "epoch": 2559} {"train_loss": -12.39654541015625, "global_step": 430057, "epoch": 2559} {"train_loss": -12.291890144348145, "global_step": 430058, "epoch": 2559} {"train_loss": -12.267751693725586, "global_step": 430059, "epoch": 2559} {"train_loss": -12.175567626953125, "global_step": 430060, "epoch": 2559} {"train_loss": -12.391342163085938, "global_step": 430061, "epoch": 2559} {"train_loss": -12.53995418548584, "global_step": 430062, "epoch": 2559} {"train_loss": -12.281980514526367, "global_step": 430063, "epoch": 2559} {"train_loss": -12.257699012756348, "global_step": 430064, "epoch": 2559} {"train_loss": -12.479772567749023, "global_step": 430065, "epoch": 2559} {"train_loss": -12.54606819152832, "global_step": 430066, "epoch": 2559} {"train_loss": -12.042840957641602, "global_step": 430067, "epoch": 2559} {"train_loss": -12.310832023620605, "global_step": 430068, "epoch": 2559} {"train_loss": -12.281174659729004, "global_step": 430069, "epoch": 2559} {"train_loss": -12.138676643371582, "global_step": 430070, "epoch": 2559} {"train_loss": -12.444068908691406, "global_step": 430071, "epoch": 2559} {"train_loss": -11.651747703552246, "global_step": 430072, "epoch": 2559} {"train_loss": -12.341248512268066, "global_step": 430073, "epoch": 2559} {"train_loss": -12.52960205078125, "global_step": 430074, "epoch": 2559} {"train_loss": -12.15462589263916, "global_step": 430075, "epoch": 2559} {"train_loss": -12.230463027954102, "global_step": 430076, "epoch": 2559} {"train_loss": -12.8363037109375, "global_step": 430077, "epoch": 2559} {"train_loss": -12.410469055175781, "global_step": 430078, "epoch": 2559} {"train_loss": -12.12083716051919, "global_step": 430079, "epoch": 2559, "val_loss": 309860.84375} {"train_loss": -12.429632186889648, "global_step": 430080, "epoch": 2560} {"train_loss": -12.403247833251953, "global_step": 430081, "epoch": 2560} {"train_loss": -12.509099006652832, "global_step": 430082, "epoch": 2560} {"train_loss": -12.321884155273438, "global_step": 430083, "epoch": 2560} {"train_loss": -12.375368118286133, "global_step": 430084, "epoch": 2560} {"train_loss": -12.083039283752441, "global_step": 430085, "epoch": 2560} {"train_loss": -12.190471649169922, "global_step": 430086, "epoch": 2560} {"train_loss": -12.238109588623047, "global_step": 430087, "epoch": 2560} {"train_loss": -11.886106491088867, "global_step": 430088, "epoch": 2560} {"train_loss": -12.53657054901123, "global_step": 430089, "epoch": 2560} {"train_loss": -11.845998764038086, "global_step": 430090, "epoch": 2560} {"train_loss": -12.258537292480469, "global_step": 430091, "epoch": 2560} {"train_loss": -12.235291481018066, "global_step": 430092, "epoch": 2560} {"train_loss": -12.122884750366211, "global_step": 430093, "epoch": 2560} {"train_loss": -12.207879066467285, "global_step": 430094, "epoch": 2560} {"train_loss": -12.226034164428711, "global_step": 430095, "epoch": 2560} {"train_loss": -12.19060230255127, "global_step": 430096, "epoch": 2560} {"train_loss": -12.460195541381836, "global_step": 430097, "epoch": 2560} {"train_loss": -11.827659606933594, "global_step": 430098, "epoch": 2560} {"train_loss": -11.630722045898438, "global_step": 430099, "epoch": 2560} {"train_loss": -11.711637496948242, "global_step": 430100, "epoch": 2560} {"train_loss": -10.904237747192383, "global_step": 430101, "epoch": 2560} {"train_loss": -11.774085998535156, "global_step": 430102, "epoch": 2560} {"train_loss": -11.11170768737793, "global_step": 430103, "epoch": 2560} {"train_loss": -10.49129867553711, "global_step": 430104, "epoch": 2560} {"train_loss": -11.247379302978516, "global_step": 430105, "epoch": 2560} {"train_loss": -10.86398696899414, "global_step": 430106, "epoch": 2560} {"train_loss": -11.852316856384277, "global_step": 430107, "epoch": 2560} {"train_loss": -11.123562812805176, "global_step": 430108, "epoch": 2560} {"train_loss": -11.69222354888916, "global_step": 430109, "epoch": 2560} {"train_loss": -11.411947250366211, "global_step": 430110, "epoch": 2560} {"train_loss": -11.177125930786133, "global_step": 430111, "epoch": 2560} {"train_loss": -11.38960075378418, "global_step": 430112, "epoch": 2560} {"train_loss": -11.473149299621582, "global_step": 430113, "epoch": 2560} {"train_loss": -11.363494873046875, "global_step": 430114, "epoch": 2560} {"train_loss": -12.263919830322266, "global_step": 430115, "epoch": 2560} {"train_loss": -10.718327522277832, "global_step": 430116, "epoch": 2560} {"train_loss": -11.796624183654785, "global_step": 430117, "epoch": 2560} {"train_loss": -10.977178573608398, "global_step": 430118, "epoch": 2560} {"train_loss": -11.988157272338867, "global_step": 430119, "epoch": 2560} {"train_loss": -11.602933883666992, "global_step": 430120, "epoch": 2560} {"train_loss": -11.715377807617188, "global_step": 430121, "epoch": 2560} {"train_loss": -12.089553833007812, "global_step": 430122, "epoch": 2560} {"train_loss": -11.463933944702148, "global_step": 430123, "epoch": 2560} {"train_loss": -12.416919708251953, "global_step": 430124, "epoch": 2560} {"train_loss": -11.682376861572266, "global_step": 430125, "epoch": 2560} {"train_loss": -12.605168342590332, "global_step": 430126, "epoch": 2560} {"train_loss": -11.711708068847656, "global_step": 430127, "epoch": 2560} {"train_loss": -12.560762405395508, "global_step": 430128, "epoch": 2560} {"train_loss": -11.981803894042969, "global_step": 430129, "epoch": 2560} {"train_loss": -12.228130340576172, "global_step": 430130, "epoch": 2560} {"train_loss": -12.301409721374512, "global_step": 430131, "epoch": 2560} {"train_loss": -12.10342025756836, "global_step": 430132, "epoch": 2560} {"train_loss": -12.46634292602539, "global_step": 430133, "epoch": 2560} {"train_loss": -12.18128776550293, "global_step": 430134, "epoch": 2560} {"train_loss": -12.438563346862793, "global_step": 430135, "epoch": 2560} {"train_loss": -12.258309364318848, "global_step": 430136, "epoch": 2560} {"train_loss": -12.362322807312012, "global_step": 430137, "epoch": 2560} {"train_loss": -12.313058853149414, "global_step": 430138, "epoch": 2560} {"train_loss": -12.544540405273438, "global_step": 430139, "epoch": 2560} {"train_loss": -12.221616744995117, "global_step": 430140, "epoch": 2560} {"train_loss": -12.552412033081055, "global_step": 430141, "epoch": 2560} {"train_loss": -12.338239669799805, "global_step": 430142, "epoch": 2560} {"train_loss": -12.335355758666992, "global_step": 430143, "epoch": 2560} {"train_loss": -12.488748550415039, "global_step": 430144, "epoch": 2560} {"train_loss": -12.147916793823242, "global_step": 430145, "epoch": 2560} {"train_loss": -12.299793243408203, "global_step": 430146, "epoch": 2560} {"train_loss": -11.906124114990234, "global_step": 430147, "epoch": 2560} {"train_loss": -12.27989673614502, "global_step": 430148, "epoch": 2560} {"train_loss": -12.224161148071289, "global_step": 430149, "epoch": 2560} {"train_loss": -12.481836318969727, "global_step": 430150, "epoch": 2560} {"train_loss": -12.08633804321289, "global_step": 430151, "epoch": 2560} {"train_loss": -12.565082550048828, "global_step": 430152, "epoch": 2560} {"train_loss": -12.18274211883545, "global_step": 430153, "epoch": 2560} {"train_loss": -11.93959903717041, "global_step": 430154, "epoch": 2560} {"train_loss": -12.317008972167969, "global_step": 430155, "epoch": 2560} {"train_loss": -12.212251663208008, "global_step": 430156, "epoch": 2560} {"train_loss": -12.748889923095703, "global_step": 430157, "epoch": 2560} {"train_loss": -12.4627685546875, "global_step": 430158, "epoch": 2560} {"train_loss": -12.585367202758789, "global_step": 430159, "epoch": 2560} {"train_loss": -12.421619415283203, "global_step": 430160, "epoch": 2560} {"train_loss": -12.363404273986816, "global_step": 430161, "epoch": 2560} {"train_loss": -12.727825164794922, "global_step": 430162, "epoch": 2560} {"train_loss": -12.32535457611084, "global_step": 430163, "epoch": 2560} {"train_loss": -12.444549560546875, "global_step": 430164, "epoch": 2560} {"train_loss": -12.445887565612793, "global_step": 430165, "epoch": 2560} {"train_loss": -12.6595458984375, "global_step": 430166, "epoch": 2560} {"train_loss": -12.428014755249023, "global_step": 430167, "epoch": 2560} {"train_loss": -12.462321281433105, "global_step": 430168, "epoch": 2560} {"train_loss": -12.490572929382324, "global_step": 430169, "epoch": 2560} {"train_loss": -12.51236629486084, "global_step": 430170, "epoch": 2560} {"train_loss": -12.29961109161377, "global_step": 430171, "epoch": 2560} {"train_loss": -12.474913597106934, "global_step": 430172, "epoch": 2560} {"train_loss": -12.46088981628418, "global_step": 430173, "epoch": 2560} {"train_loss": -12.622114181518555, "global_step": 430174, "epoch": 2560} {"train_loss": -12.2859525680542, "global_step": 430175, "epoch": 2560} {"train_loss": -12.744726181030273, "global_step": 430176, "epoch": 2560} {"train_loss": -11.892451286315918, "global_step": 430177, "epoch": 2560} {"train_loss": -11.848201751708984, "global_step": 430178, "epoch": 2560} {"train_loss": -12.166604042053223, "global_step": 430179, "epoch": 2560} {"train_loss": -11.25956916809082, "global_step": 430180, "epoch": 2560} {"train_loss": -11.724037170410156, "global_step": 430181, "epoch": 2560} {"train_loss": -11.23996353149414, "global_step": 430182, "epoch": 2560} {"train_loss": -12.561402320861816, "global_step": 430183, "epoch": 2560} {"train_loss": -11.803247451782227, "global_step": 430184, "epoch": 2560} {"train_loss": -11.229702949523926, "global_step": 430185, "epoch": 2560} {"train_loss": -12.78769302368164, "global_step": 430186, "epoch": 2560} {"train_loss": -11.77440071105957, "global_step": 430187, "epoch": 2560} {"train_loss": -12.060930252075195, "global_step": 430188, "epoch": 2560} {"train_loss": -12.370262145996094, "global_step": 430189, "epoch": 2560} {"train_loss": -11.878217697143555, "global_step": 430190, "epoch": 2560} {"train_loss": -11.920783996582031, "global_step": 430191, "epoch": 2560} {"train_loss": -11.589921951293945, "global_step": 430192, "epoch": 2560} {"train_loss": -12.148672103881836, "global_step": 430193, "epoch": 2560} {"train_loss": -11.63210678100586, "global_step": 430194, "epoch": 2560} {"train_loss": -11.829818725585938, "global_step": 430195, "epoch": 2560} {"train_loss": -11.782569885253906, "global_step": 430196, "epoch": 2560} {"train_loss": -11.76611328125, "global_step": 430197, "epoch": 2560} {"train_loss": -11.66955852508545, "global_step": 430198, "epoch": 2560} {"train_loss": -12.085807800292969, "global_step": 430199, "epoch": 2560} {"train_loss": -12.231766700744629, "global_step": 430200, "epoch": 2560} {"train_loss": -12.260734558105469, "global_step": 430201, "epoch": 2560} {"train_loss": -12.042963981628418, "global_step": 430202, "epoch": 2560} {"train_loss": -11.800361633300781, "global_step": 430203, "epoch": 2560} {"train_loss": -12.22874641418457, "global_step": 430204, "epoch": 2560} {"train_loss": -12.420499801635742, "global_step": 430205, "epoch": 2560} {"train_loss": -12.461383819580078, "global_step": 430206, "epoch": 2560} {"train_loss": -12.212631225585938, "global_step": 430207, "epoch": 2560} {"train_loss": -12.419450759887695, "global_step": 430208, "epoch": 2560} {"train_loss": -12.035740852355957, "global_step": 430209, "epoch": 2560} {"train_loss": -12.487466812133789, "global_step": 430210, "epoch": 2560} {"train_loss": -12.168170928955078, "global_step": 430211, "epoch": 2560} {"train_loss": -12.283546447753906, "global_step": 430212, "epoch": 2560} {"train_loss": -12.184268951416016, "global_step": 430213, "epoch": 2560} {"train_loss": -11.845708847045898, "global_step": 430214, "epoch": 2560} {"train_loss": -12.435434341430664, "global_step": 430215, "epoch": 2560} {"train_loss": -12.088888168334961, "global_step": 430216, "epoch": 2560} {"train_loss": -12.712158203125, "global_step": 430217, "epoch": 2560} {"train_loss": -11.842901229858398, "global_step": 430218, "epoch": 2560} {"train_loss": -12.395450592041016, "global_step": 430219, "epoch": 2560} {"train_loss": -12.2760648727417, "global_step": 430220, "epoch": 2560} {"train_loss": -12.452692031860352, "global_step": 430221, "epoch": 2560} {"train_loss": -12.531899452209473, "global_step": 430222, "epoch": 2560} {"train_loss": -12.418608665466309, "global_step": 430223, "epoch": 2560} {"train_loss": -12.537772178649902, "global_step": 430224, "epoch": 2560} {"train_loss": -12.06916618347168, "global_step": 430225, "epoch": 2560} {"train_loss": -12.511251449584961, "global_step": 430226, "epoch": 2560} {"train_loss": -12.099287986755371, "global_step": 430227, "epoch": 2560} {"train_loss": -11.285574913024902, "global_step": 430228, "epoch": 2560} {"train_loss": -11.42498779296875, "global_step": 430229, "epoch": 2560} {"train_loss": -12.025385856628418, "global_step": 430230, "epoch": 2560} {"train_loss": -11.44373893737793, "global_step": 430231, "epoch": 2560} {"train_loss": -11.695816993713379, "global_step": 430232, "epoch": 2560} {"train_loss": -11.978777885437012, "global_step": 430233, "epoch": 2560} {"train_loss": -11.780311584472656, "global_step": 430234, "epoch": 2560} {"train_loss": -11.351751327514648, "global_step": 430235, "epoch": 2560} {"train_loss": -11.231525421142578, "global_step": 430236, "epoch": 2560} {"train_loss": -11.556900024414062, "global_step": 430237, "epoch": 2560} {"train_loss": -10.701335906982422, "global_step": 430238, "epoch": 2560} {"train_loss": -11.788139343261719, "global_step": 430239, "epoch": 2560} {"train_loss": -10.44814682006836, "global_step": 430240, "epoch": 2560} {"train_loss": -11.83425521850586, "global_step": 430241, "epoch": 2560} {"train_loss": -10.604827880859375, "global_step": 430242, "epoch": 2560} {"train_loss": -11.982748031616211, "global_step": 430243, "epoch": 2560} {"train_loss": -10.362922668457031, "global_step": 430244, "epoch": 2560} {"train_loss": -11.383397102355957, "global_step": 430245, "epoch": 2560} {"train_loss": -10.53323745727539, "global_step": 430246, "epoch": 2560} {"train_loss": -11.997931548527308, "global_step": 430247, "epoch": 2560, "val_loss": 310908.40625, "train_action_mse_error": 2.252681255340576} {"train_loss": -11.312801361083984, "global_step": 430248, "epoch": 2561} {"train_loss": -11.648994445800781, "global_step": 430249, "epoch": 2561} {"train_loss": -11.519612312316895, "global_step": 430250, "epoch": 2561} {"train_loss": -11.506162643432617, "global_step": 430251, "epoch": 2561} {"train_loss": -11.559200286865234, "global_step": 430252, "epoch": 2561} {"train_loss": -11.105274200439453, "global_step": 430253, "epoch": 2561} {"train_loss": -11.300912857055664, "global_step": 430254, "epoch": 2561} {"train_loss": -11.451680183410645, "global_step": 430255, "epoch": 2561} {"train_loss": -11.152667999267578, "global_step": 430256, "epoch": 2561} {"train_loss": -11.831785202026367, "global_step": 430257, "epoch": 2561} {"train_loss": -11.634048461914062, "global_step": 430258, "epoch": 2561} {"train_loss": -11.413208961486816, "global_step": 430259, "epoch": 2561} {"train_loss": -11.500961303710938, "global_step": 430260, "epoch": 2561} {"train_loss": -11.671974182128906, "global_step": 430261, "epoch": 2561} {"train_loss": -11.556122779846191, "global_step": 430262, "epoch": 2561} {"train_loss": -11.958754539489746, "global_step": 430263, "epoch": 2561} {"train_loss": -11.988565444946289, "global_step": 430264, "epoch": 2561} {"train_loss": -12.456255912780762, "global_step": 430265, "epoch": 2561} {"train_loss": -11.834030151367188, "global_step": 430266, "epoch": 2561} {"train_loss": -12.321449279785156, "global_step": 430267, "epoch": 2561} {"train_loss": -11.988045692443848, "global_step": 430268, "epoch": 2561} {"train_loss": -12.332263946533203, "global_step": 430269, "epoch": 2561} {"train_loss": -11.617273330688477, "global_step": 430270, "epoch": 2561} {"train_loss": -12.248682022094727, "global_step": 430271, "epoch": 2561} {"train_loss": -12.107775688171387, "global_step": 430272, "epoch": 2561} {"train_loss": -12.095470428466797, "global_step": 430273, "epoch": 2561} {"train_loss": -12.402265548706055, "global_step": 430274, "epoch": 2561} {"train_loss": -11.911277770996094, "global_step": 430275, "epoch": 2561} {"train_loss": -12.287306785583496, "global_step": 430276, "epoch": 2561} {"train_loss": -12.116097450256348, "global_step": 430277, "epoch": 2561} {"train_loss": -12.133491516113281, "global_step": 430278, "epoch": 2561} {"train_loss": -12.284085273742676, "global_step": 430279, "epoch": 2561} {"train_loss": -12.333651542663574, "global_step": 430280, "epoch": 2561} {"train_loss": -12.306352615356445, "global_step": 430281, "epoch": 2561} {"train_loss": -12.442214965820312, "global_step": 430282, "epoch": 2561} {"train_loss": -12.635271072387695, "global_step": 430283, "epoch": 2561} {"train_loss": -12.316709518432617, "global_step": 430284, "epoch": 2561} {"train_loss": -12.453475952148438, "global_step": 430285, "epoch": 2561} {"train_loss": -12.620792388916016, "global_step": 430286, "epoch": 2561} {"train_loss": -12.508244514465332, "global_step": 430287, "epoch": 2561} {"train_loss": -12.529017448425293, "global_step": 430288, "epoch": 2561} {"train_loss": -12.571959495544434, "global_step": 430289, "epoch": 2561} {"train_loss": -12.478586196899414, "global_step": 430290, "epoch": 2561} {"train_loss": -12.454607009887695, "global_step": 430291, "epoch": 2561} {"train_loss": -12.528417587280273, "global_step": 430292, "epoch": 2561} {"train_loss": -12.601211547851562, "global_step": 430293, "epoch": 2561} {"train_loss": -12.638764381408691, "global_step": 430294, "epoch": 2561} {"train_loss": -12.500045776367188, "global_step": 430295, "epoch": 2561} {"train_loss": -12.656030654907227, "global_step": 430296, "epoch": 2561} {"train_loss": -12.423423767089844, "global_step": 430297, "epoch": 2561} {"train_loss": -12.617366790771484, "global_step": 430298, "epoch": 2561} {"train_loss": -12.53860092163086, "global_step": 430299, "epoch": 2561} {"train_loss": -12.434774398803711, "global_step": 430300, "epoch": 2561} {"train_loss": -12.51072883605957, "global_step": 430301, "epoch": 2561} {"train_loss": -12.031194686889648, "global_step": 430302, "epoch": 2561} {"train_loss": -12.083420753479004, "global_step": 430303, "epoch": 2561} {"train_loss": -12.321083068847656, "global_step": 430304, "epoch": 2561} {"train_loss": -12.067176818847656, "global_step": 430305, "epoch": 2561} {"train_loss": -12.285102844238281, "global_step": 430306, "epoch": 2561} {"train_loss": -12.125533103942871, "global_step": 430307, "epoch": 2561} {"train_loss": -11.966562271118164, "global_step": 430308, "epoch": 2561} {"train_loss": -12.265157699584961, "global_step": 430309, "epoch": 2561} {"train_loss": -12.24201774597168, "global_step": 430310, "epoch": 2561} {"train_loss": -12.582399368286133, "global_step": 430311, "epoch": 2561} {"train_loss": -12.647250175476074, "global_step": 430312, "epoch": 2561} {"train_loss": -12.608573913574219, "global_step": 430313, "epoch": 2561} {"train_loss": -12.582611083984375, "global_step": 430314, "epoch": 2561} {"train_loss": -12.259236335754395, "global_step": 430315, "epoch": 2561} {"train_loss": -12.756677627563477, "global_step": 430316, "epoch": 2561} {"train_loss": -12.32510757446289, "global_step": 430317, "epoch": 2561} {"train_loss": -12.282965660095215, "global_step": 430318, "epoch": 2561} {"train_loss": -12.579761505126953, "global_step": 430319, "epoch": 2561} {"train_loss": -12.182442665100098, "global_step": 430320, "epoch": 2561} {"train_loss": -12.328887939453125, "global_step": 430321, "epoch": 2561} {"train_loss": -12.436305046081543, "global_step": 430322, "epoch": 2561} {"train_loss": -12.358380317687988, "global_step": 430323, "epoch": 2561} {"train_loss": -12.562856674194336, "global_step": 430324, "epoch": 2561} {"train_loss": -11.985611915588379, "global_step": 430325, "epoch": 2561} {"train_loss": -12.522612571716309, "global_step": 430326, "epoch": 2561} {"train_loss": -12.632013320922852, "global_step": 430327, "epoch": 2561} {"train_loss": -12.681422233581543, "global_step": 430328, "epoch": 2561} {"train_loss": -12.624924659729004, "global_step": 430329, "epoch": 2561} {"train_loss": -12.664640426635742, "global_step": 430330, "epoch": 2561} {"train_loss": -12.616328239440918, "global_step": 430331, "epoch": 2561} {"train_loss": -12.735968589782715, "global_step": 430332, "epoch": 2561} {"train_loss": -12.406342506408691, "global_step": 430333, "epoch": 2561} {"train_loss": -12.523906707763672, "global_step": 430334, "epoch": 2561} {"train_loss": -12.515298843383789, "global_step": 430335, "epoch": 2561} {"train_loss": -11.92593765258789, "global_step": 430336, "epoch": 2561} {"train_loss": -12.2528715133667, "global_step": 430337, "epoch": 2561} {"train_loss": -12.397216796875, "global_step": 430338, "epoch": 2561} {"train_loss": -11.907857894897461, "global_step": 430339, "epoch": 2561} {"train_loss": -12.500226020812988, "global_step": 430340, "epoch": 2561} {"train_loss": -11.907788276672363, "global_step": 430341, "epoch": 2561} {"train_loss": -9.898685455322266, "global_step": 430342, "epoch": 2561} {"train_loss": -12.407642364501953, "global_step": 430343, "epoch": 2561} {"train_loss": -8.117894172668457, "global_step": 430344, "epoch": 2561} {"train_loss": -11.329854011535645, "global_step": 430345, "epoch": 2561} {"train_loss": -9.537038803100586, "global_step": 430346, "epoch": 2561} {"train_loss": -10.123395919799805, "global_step": 430347, "epoch": 2561} {"train_loss": -9.602191925048828, "global_step": 430348, "epoch": 2561} {"train_loss": -10.037461280822754, "global_step": 430349, "epoch": 2561} {"train_loss": -10.53640365600586, "global_step": 430350, "epoch": 2561} {"train_loss": -10.36520004272461, "global_step": 430351, "epoch": 2561} {"train_loss": -10.674755096435547, "global_step": 430352, "epoch": 2561} {"train_loss": -9.734058380126953, "global_step": 430353, "epoch": 2561} {"train_loss": -9.40739631652832, "global_step": 430354, "epoch": 2561} {"train_loss": -9.796874046325684, "global_step": 430355, "epoch": 2561} {"train_loss": -11.363232612609863, "global_step": 430356, "epoch": 2561} {"train_loss": -10.140644073486328, "global_step": 430357, "epoch": 2561} {"train_loss": -9.176607131958008, "global_step": 430358, "epoch": 2561} {"train_loss": -9.556219100952148, "global_step": 430359, "epoch": 2561} {"train_loss": -11.014130592346191, "global_step": 430360, "epoch": 2561} {"train_loss": -10.048503875732422, "global_step": 430361, "epoch": 2561} {"train_loss": -11.086677551269531, "global_step": 430362, "epoch": 2561} {"train_loss": -10.57535171508789, "global_step": 430363, "epoch": 2561} {"train_loss": -11.052135467529297, "global_step": 430364, "epoch": 2561} {"train_loss": -10.857715606689453, "global_step": 430365, "epoch": 2561} {"train_loss": -11.729513168334961, "global_step": 430366, "epoch": 2561} {"train_loss": -11.48940658569336, "global_step": 430367, "epoch": 2561} {"train_loss": -11.598816871643066, "global_step": 430368, "epoch": 2561} {"train_loss": -11.857742309570312, "global_step": 430369, "epoch": 2561} {"train_loss": -12.12293815612793, "global_step": 430370, "epoch": 2561} {"train_loss": -12.159883499145508, "global_step": 430371, "epoch": 2561} {"train_loss": -11.867517471313477, "global_step": 430372, "epoch": 2561} {"train_loss": -12.150213241577148, "global_step": 430373, "epoch": 2561} {"train_loss": -12.08885669708252, "global_step": 430374, "epoch": 2561} {"train_loss": -11.918726921081543, "global_step": 430375, "epoch": 2561} {"train_loss": -12.086777687072754, "global_step": 430376, "epoch": 2561} {"train_loss": -11.931434631347656, "global_step": 430377, "epoch": 2561} {"train_loss": -11.951618194580078, "global_step": 430378, "epoch": 2561} {"train_loss": -11.987640380859375, "global_step": 430379, "epoch": 2561} {"train_loss": -11.916563034057617, "global_step": 430380, "epoch": 2561} {"train_loss": -11.679543495178223, "global_step": 430381, "epoch": 2561} {"train_loss": -12.413039207458496, "global_step": 430382, "epoch": 2561} {"train_loss": -11.827957153320312, "global_step": 430383, "epoch": 2561} {"train_loss": -12.24576187133789, "global_step": 430384, "epoch": 2561} {"train_loss": -12.184820175170898, "global_step": 430385, "epoch": 2561} {"train_loss": -11.900395393371582, "global_step": 430386, "epoch": 2561} {"train_loss": -12.345242500305176, "global_step": 430387, "epoch": 2561} {"train_loss": -12.109610557556152, "global_step": 430388, "epoch": 2561} {"train_loss": -12.089479446411133, "global_step": 430389, "epoch": 2561} {"train_loss": -12.255345344543457, "global_step": 430390, "epoch": 2561} {"train_loss": -12.508079528808594, "global_step": 430391, "epoch": 2561} {"train_loss": -12.128751754760742, "global_step": 430392, "epoch": 2561} {"train_loss": -12.392416954040527, "global_step": 430393, "epoch": 2561} {"train_loss": -11.921815872192383, "global_step": 430394, "epoch": 2561} {"train_loss": -12.478687286376953, "global_step": 430395, "epoch": 2561} {"train_loss": -12.205865859985352, "global_step": 430396, "epoch": 2561} {"train_loss": -12.588178634643555, "global_step": 430397, "epoch": 2561} {"train_loss": -11.996718406677246, "global_step": 430398, "epoch": 2561} {"train_loss": -12.412955284118652, "global_step": 430399, "epoch": 2561} {"train_loss": -12.085358619689941, "global_step": 430400, "epoch": 2561} {"train_loss": -12.499796867370605, "global_step": 430401, "epoch": 2561} {"train_loss": -12.117288589477539, "global_step": 430402, "epoch": 2561} {"train_loss": -12.294803619384766, "global_step": 430403, "epoch": 2561} {"train_loss": -12.426950454711914, "global_step": 430404, "epoch": 2561} {"train_loss": -12.097587585449219, "global_step": 430405, "epoch": 2561} {"train_loss": -12.344595909118652, "global_step": 430406, "epoch": 2561} {"train_loss": -12.224393844604492, "global_step": 430407, "epoch": 2561} {"train_loss": -12.154701232910156, "global_step": 430408, "epoch": 2561} {"train_loss": -12.366375923156738, "global_step": 430409, "epoch": 2561} {"train_loss": -12.505244255065918, "global_step": 430410, "epoch": 2561} {"train_loss": -12.070940017700195, "global_step": 430411, "epoch": 2561} {"train_loss": -12.245601654052734, "global_step": 430412, "epoch": 2561} {"train_loss": -12.30606746673584, "global_step": 430413, "epoch": 2561} {"train_loss": -12.073583602905273, "global_step": 430414, "epoch": 2561} {"train_loss": -11.911512000220162, "global_step": 430415, "epoch": 2561, "val_loss": 309183.6875} {"train_loss": -12.343891143798828, "global_step": 430416, "epoch": 2562} {"train_loss": -12.484752655029297, "global_step": 430417, "epoch": 2562} {"train_loss": -12.45620346069336, "global_step": 430418, "epoch": 2562} {"train_loss": -12.408103942871094, "global_step": 430419, "epoch": 2562} {"train_loss": -12.351247787475586, "global_step": 430420, "epoch": 2562} {"train_loss": -12.427022933959961, "global_step": 430421, "epoch": 2562} {"train_loss": -12.615915298461914, "global_step": 430422, "epoch": 2562} {"train_loss": -12.304699897766113, "global_step": 430423, "epoch": 2562} {"train_loss": -12.593250274658203, "global_step": 430424, "epoch": 2562} {"train_loss": -12.45181655883789, "global_step": 430425, "epoch": 2562} {"train_loss": -12.612350463867188, "global_step": 430426, "epoch": 2562} {"train_loss": -12.546052932739258, "global_step": 430427, "epoch": 2562} {"train_loss": -12.588118553161621, "global_step": 430428, "epoch": 2562} {"train_loss": -12.618040084838867, "global_step": 430429, "epoch": 2562} {"train_loss": -12.639925003051758, "global_step": 430430, "epoch": 2562} {"train_loss": -12.598664283752441, "global_step": 430431, "epoch": 2562} {"train_loss": -12.634952545166016, "global_step": 430432, "epoch": 2562} {"train_loss": -12.688328742980957, "global_step": 430433, "epoch": 2562} {"train_loss": -12.68515396118164, "global_step": 430434, "epoch": 2562} {"train_loss": -12.520173072814941, "global_step": 430435, "epoch": 2562} {"train_loss": -12.659326553344727, "global_step": 430436, "epoch": 2562} {"train_loss": -12.643621444702148, "global_step": 430437, "epoch": 2562} {"train_loss": -12.837815284729004, "global_step": 430438, "epoch": 2562} {"train_loss": -12.696080207824707, "global_step": 430439, "epoch": 2562} {"train_loss": -12.652791976928711, "global_step": 430440, "epoch": 2562} {"train_loss": -12.712422370910645, "global_step": 430441, "epoch": 2562} {"train_loss": -12.563199996948242, "global_step": 430442, "epoch": 2562} {"train_loss": -12.622572898864746, "global_step": 430443, "epoch": 2562} {"train_loss": -12.556375503540039, "global_step": 430444, "epoch": 2562} {"train_loss": -12.72763442993164, "global_step": 430445, "epoch": 2562} {"train_loss": -12.619049072265625, "global_step": 430446, "epoch": 2562} {"train_loss": -12.429214477539062, "global_step": 430447, "epoch": 2562} {"train_loss": -12.617276191711426, "global_step": 430448, "epoch": 2562} {"train_loss": -12.485291481018066, "global_step": 430449, "epoch": 2562} {"train_loss": -12.459232330322266, "global_step": 430450, "epoch": 2562} {"train_loss": -12.518214225769043, "global_step": 430451, "epoch": 2562} {"train_loss": -12.836585998535156, "global_step": 430452, "epoch": 2562} {"train_loss": -12.886682510375977, "global_step": 430453, "epoch": 2562} {"train_loss": -12.647665023803711, "global_step": 430454, "epoch": 2562} {"train_loss": -12.607500076293945, "global_step": 430455, "epoch": 2562} {"train_loss": -12.861837387084961, "global_step": 430456, "epoch": 2562} {"train_loss": -12.6593017578125, "global_step": 430457, "epoch": 2562} {"train_loss": -12.616630554199219, "global_step": 430458, "epoch": 2562} {"train_loss": -11.969095230102539, "global_step": 430459, "epoch": 2562} {"train_loss": -12.128911018371582, "global_step": 430460, "epoch": 2562} {"train_loss": -12.782148361206055, "global_step": 430461, "epoch": 2562} {"train_loss": -12.512856483459473, "global_step": 430462, "epoch": 2562} {"train_loss": -11.573978424072266, "global_step": 430463, "epoch": 2562} {"train_loss": -10.180870056152344, "global_step": 430464, "epoch": 2562} {"train_loss": -12.237762451171875, "global_step": 430465, "epoch": 2562} {"train_loss": -12.221117973327637, "global_step": 430466, "epoch": 2562} {"train_loss": -12.258659362792969, "global_step": 430467, "epoch": 2562} {"train_loss": -11.707929611206055, "global_step": 430468, "epoch": 2562} {"train_loss": -12.143665313720703, "global_step": 430469, "epoch": 2562} {"train_loss": -11.488231658935547, "global_step": 430470, "epoch": 2562} {"train_loss": -9.49169921875, "global_step": 430471, "epoch": 2562} {"train_loss": -9.704269409179688, "global_step": 430472, "epoch": 2562} {"train_loss": -11.13107967376709, "global_step": 430473, "epoch": 2562} {"train_loss": -9.502073287963867, "global_step": 430474, "epoch": 2562} {"train_loss": -9.128301620483398, "global_step": 430475, "epoch": 2562} {"train_loss": -9.157137870788574, "global_step": 430476, "epoch": 2562} {"train_loss": -11.436330795288086, "global_step": 430477, "epoch": 2562} {"train_loss": -8.78196907043457, "global_step": 430478, "epoch": 2562} {"train_loss": -12.027587890625, "global_step": 430479, "epoch": 2562} {"train_loss": -10.575555801391602, "global_step": 430480, "epoch": 2562} {"train_loss": -10.684529304504395, "global_step": 430481, "epoch": 2562} {"train_loss": -12.022577285766602, "global_step": 430482, "epoch": 2562} {"train_loss": -10.825277328491211, "global_step": 430483, "epoch": 2562} {"train_loss": -11.834654808044434, "global_step": 430484, "epoch": 2562} {"train_loss": -11.692039489746094, "global_step": 430485, "epoch": 2562} {"train_loss": -12.279559135437012, "global_step": 430486, "epoch": 2562} {"train_loss": -11.523036003112793, "global_step": 430487, "epoch": 2562} {"train_loss": -12.00124740600586, "global_step": 430488, "epoch": 2562} {"train_loss": -11.123549461364746, "global_step": 430489, "epoch": 2562} {"train_loss": -11.905351638793945, "global_step": 430490, "epoch": 2562} {"train_loss": -11.925386428833008, "global_step": 430491, "epoch": 2562} {"train_loss": -11.905540466308594, "global_step": 430492, "epoch": 2562} {"train_loss": -12.140331268310547, "global_step": 430493, "epoch": 2562} {"train_loss": -11.483028411865234, "global_step": 430494, "epoch": 2562} {"train_loss": -12.368452072143555, "global_step": 430495, "epoch": 2562} {"train_loss": -11.914496421813965, "global_step": 430496, "epoch": 2562} {"train_loss": -12.253558158874512, "global_step": 430497, "epoch": 2562} {"train_loss": -12.313300132751465, "global_step": 430498, "epoch": 2562} {"train_loss": -11.955120086669922, "global_step": 430499, "epoch": 2562} {"train_loss": -12.253422737121582, "global_step": 430500, "epoch": 2562} {"train_loss": -11.78507137298584, "global_step": 430501, "epoch": 2562} {"train_loss": -12.387775421142578, "global_step": 430502, "epoch": 2562} {"train_loss": -12.0745210647583, "global_step": 430503, "epoch": 2562} {"train_loss": -12.473318099975586, "global_step": 430504, "epoch": 2562} {"train_loss": -12.276652336120605, "global_step": 430505, "epoch": 2562} {"train_loss": -12.041110038757324, "global_step": 430506, "epoch": 2562} {"train_loss": -12.493165969848633, "global_step": 430507, "epoch": 2562} {"train_loss": -12.193063735961914, "global_step": 430508, "epoch": 2562} {"train_loss": -12.447711944580078, "global_step": 430509, "epoch": 2562} {"train_loss": -12.35784912109375, "global_step": 430510, "epoch": 2562} {"train_loss": -12.549060821533203, "global_step": 430511, "epoch": 2562} {"train_loss": -12.669729232788086, "global_step": 430512, "epoch": 2562} {"train_loss": -12.605087280273438, "global_step": 430513, "epoch": 2562} {"train_loss": -12.593997955322266, "global_step": 430514, "epoch": 2562} {"train_loss": -12.671465873718262, "global_step": 430515, "epoch": 2562} {"train_loss": -12.379743576049805, "global_step": 430516, "epoch": 2562} {"train_loss": -12.740121841430664, "global_step": 430517, "epoch": 2562} {"train_loss": -12.209732055664062, "global_step": 430518, "epoch": 2562} {"train_loss": -12.76850414276123, "global_step": 430519, "epoch": 2562} {"train_loss": -12.297906875610352, "global_step": 430520, "epoch": 2562} {"train_loss": -12.575206756591797, "global_step": 430521, "epoch": 2562} {"train_loss": -12.584527015686035, "global_step": 430522, "epoch": 2562} {"train_loss": -12.229583740234375, "global_step": 430523, "epoch": 2562} {"train_loss": -12.692831039428711, "global_step": 430524, "epoch": 2562} {"train_loss": -12.268728256225586, "global_step": 430525, "epoch": 2562} {"train_loss": -12.288414001464844, "global_step": 430526, "epoch": 2562} {"train_loss": -12.600058555603027, "global_step": 430527, "epoch": 2562} {"train_loss": -12.309282302856445, "global_step": 430528, "epoch": 2562} {"train_loss": -12.30386734008789, "global_step": 430529, "epoch": 2562} {"train_loss": -12.512845993041992, "global_step": 430530, "epoch": 2562} {"train_loss": -12.498590469360352, "global_step": 430531, "epoch": 2562} {"train_loss": -12.174215316772461, "global_step": 430532, "epoch": 2562} {"train_loss": -12.496174812316895, "global_step": 430533, "epoch": 2562} {"train_loss": -12.23951244354248, "global_step": 430534, "epoch": 2562} {"train_loss": -12.323856353759766, "global_step": 430535, "epoch": 2562} {"train_loss": -12.29287052154541, "global_step": 430536, "epoch": 2562} {"train_loss": -12.245840072631836, "global_step": 430537, "epoch": 2562} {"train_loss": -12.60333251953125, "global_step": 430538, "epoch": 2562} {"train_loss": -11.943987846374512, "global_step": 430539, "epoch": 2562} {"train_loss": -12.737017631530762, "global_step": 430540, "epoch": 2562} {"train_loss": -12.351755142211914, "global_step": 430541, "epoch": 2562} {"train_loss": -11.511463165283203, "global_step": 430542, "epoch": 2562} {"train_loss": -12.477149963378906, "global_step": 430543, "epoch": 2562} {"train_loss": -12.18669319152832, "global_step": 430544, "epoch": 2562} {"train_loss": -11.719343185424805, "global_step": 430545, "epoch": 2562} {"train_loss": -12.591153144836426, "global_step": 430546, "epoch": 2562} {"train_loss": -11.766436576843262, "global_step": 430547, "epoch": 2562} {"train_loss": -12.484305381774902, "global_step": 430548, "epoch": 2562} {"train_loss": -12.3268461227417, "global_step": 430549, "epoch": 2562} {"train_loss": -12.30569076538086, "global_step": 430550, "epoch": 2562} {"train_loss": -12.658135414123535, "global_step": 430551, "epoch": 2562} {"train_loss": -12.324170112609863, "global_step": 430552, "epoch": 2562} {"train_loss": -12.5174560546875, "global_step": 430553, "epoch": 2562} {"train_loss": -12.69853687286377, "global_step": 430554, "epoch": 2562} {"train_loss": -12.355916976928711, "global_step": 430555, "epoch": 2562} {"train_loss": -12.660198211669922, "global_step": 430556, "epoch": 2562} {"train_loss": -12.468550682067871, "global_step": 430557, "epoch": 2562} {"train_loss": -12.319986343383789, "global_step": 430558, "epoch": 2562} {"train_loss": -12.375243186950684, "global_step": 430559, "epoch": 2562} {"train_loss": -12.206512451171875, "global_step": 430560, "epoch": 2562} {"train_loss": -12.45876407623291, "global_step": 430561, "epoch": 2562} {"train_loss": -12.531256675720215, "global_step": 430562, "epoch": 2562} {"train_loss": -12.542556762695312, "global_step": 430563, "epoch": 2562} {"train_loss": -12.470884323120117, "global_step": 430564, "epoch": 2562} {"train_loss": -12.557218551635742, "global_step": 430565, "epoch": 2562} {"train_loss": -12.300352096557617, "global_step": 430566, "epoch": 2562} {"train_loss": -12.698028564453125, "global_step": 430567, "epoch": 2562} {"train_loss": -12.01008415222168, "global_step": 430568, "epoch": 2562} {"train_loss": -12.241495132446289, "global_step": 430569, "epoch": 2562} {"train_loss": -11.968286514282227, "global_step": 430570, "epoch": 2562} {"train_loss": -11.987998962402344, "global_step": 430571, "epoch": 2562} {"train_loss": -11.774490356445312, "global_step": 430572, "epoch": 2562} {"train_loss": -12.323633193969727, "global_step": 430573, "epoch": 2562} {"train_loss": -11.060620307922363, "global_step": 430574, "epoch": 2562} {"train_loss": -12.505102157592773, "global_step": 430575, "epoch": 2562} {"train_loss": -9.398303031921387, "global_step": 430576, "epoch": 2562} {"train_loss": -11.490434646606445, "global_step": 430577, "epoch": 2562} {"train_loss": -11.551773071289062, "global_step": 430578, "epoch": 2562} {"train_loss": -10.7808256149292, "global_step": 430579, "epoch": 2562} {"train_loss": -12.381964683532715, "global_step": 430580, "epoch": 2562} {"train_loss": -11.347339630126953, "global_step": 430581, "epoch": 2562} {"train_loss": -12.15445327758789, "global_step": 430582, "epoch": 2562} {"train_loss": -12.133108320690337, "global_step": 430583, "epoch": 2562, "val_loss": 309816.25} {"train_loss": -11.62884521484375, "global_step": 430584, "epoch": 2563} {"train_loss": -12.519060134887695, "global_step": 430585, "epoch": 2563} {"train_loss": -11.896764755249023, "global_step": 430586, "epoch": 2563} {"train_loss": -12.110166549682617, "global_step": 430587, "epoch": 2563} {"train_loss": -10.471787452697754, "global_step": 430588, "epoch": 2563} {"train_loss": -12.391472816467285, "global_step": 430589, "epoch": 2563} {"train_loss": -10.591411590576172, "global_step": 430590, "epoch": 2563} {"train_loss": -12.030624389648438, "global_step": 430591, "epoch": 2563} {"train_loss": -11.56531810760498, "global_step": 430592, "epoch": 2563} {"train_loss": -11.162189483642578, "global_step": 430593, "epoch": 2563} {"train_loss": -11.142509460449219, "global_step": 430594, "epoch": 2563} {"train_loss": -12.039838790893555, "global_step": 430595, "epoch": 2563} {"train_loss": -11.535204887390137, "global_step": 430596, "epoch": 2563} {"train_loss": -11.40614128112793, "global_step": 430597, "epoch": 2563} {"train_loss": -10.645258903503418, "global_step": 430598, "epoch": 2563} {"train_loss": -11.55968952178955, "global_step": 430599, "epoch": 2563} {"train_loss": -11.00007438659668, "global_step": 430600, "epoch": 2563} {"train_loss": -11.671609878540039, "global_step": 430601, "epoch": 2563} {"train_loss": -11.787209510803223, "global_step": 430602, "epoch": 2563} {"train_loss": -11.484940528869629, "global_step": 430603, "epoch": 2563} {"train_loss": -12.185321807861328, "global_step": 430604, "epoch": 2563} {"train_loss": -11.18901538848877, "global_step": 430605, "epoch": 2563} {"train_loss": -12.612142562866211, "global_step": 430606, "epoch": 2563} {"train_loss": -11.783379554748535, "global_step": 430607, "epoch": 2563} {"train_loss": -11.745429992675781, "global_step": 430608, "epoch": 2563} {"train_loss": -11.875104904174805, "global_step": 430609, "epoch": 2563} {"train_loss": -10.440065383911133, "global_step": 430610, "epoch": 2563} {"train_loss": -12.349081039428711, "global_step": 430611, "epoch": 2563} {"train_loss": -11.226665496826172, "global_step": 430612, "epoch": 2563} {"train_loss": -12.189491271972656, "global_step": 430613, "epoch": 2563} {"train_loss": -11.711917877197266, "global_step": 430614, "epoch": 2563} {"train_loss": -12.303777694702148, "global_step": 430615, "epoch": 2563} {"train_loss": -11.985795021057129, "global_step": 430616, "epoch": 2563} {"train_loss": -11.977569580078125, "global_step": 430617, "epoch": 2563} {"train_loss": -12.17910385131836, "global_step": 430618, "epoch": 2563} {"train_loss": -12.266609191894531, "global_step": 430619, "epoch": 2563} {"train_loss": -12.441598892211914, "global_step": 430620, "epoch": 2563} {"train_loss": -12.392292976379395, "global_step": 430621, "epoch": 2563} {"train_loss": -12.316210746765137, "global_step": 430622, "epoch": 2563} {"train_loss": -12.504644393920898, "global_step": 430623, "epoch": 2563} {"train_loss": -12.544891357421875, "global_step": 430624, "epoch": 2563} {"train_loss": -11.873590469360352, "global_step": 430625, "epoch": 2563} {"train_loss": -12.365144729614258, "global_step": 430626, "epoch": 2563} {"train_loss": -12.255912780761719, "global_step": 430627, "epoch": 2563} {"train_loss": -12.533724784851074, "global_step": 430628, "epoch": 2563} {"train_loss": -12.440675735473633, "global_step": 430629, "epoch": 2563} {"train_loss": -12.547500610351562, "global_step": 430630, "epoch": 2563} {"train_loss": -12.58125114440918, "global_step": 430631, "epoch": 2563} {"train_loss": -12.446798324584961, "global_step": 430632, "epoch": 2563} {"train_loss": -12.345305442810059, "global_step": 430633, "epoch": 2563} {"train_loss": -12.219755172729492, "global_step": 430634, "epoch": 2563} {"train_loss": -12.688157081604004, "global_step": 430635, "epoch": 2563} {"train_loss": -12.674643516540527, "global_step": 430636, "epoch": 2563} {"train_loss": -12.562179565429688, "global_step": 430637, "epoch": 2563} {"train_loss": -12.387086868286133, "global_step": 430638, "epoch": 2563} {"train_loss": -12.70046615600586, "global_step": 430639, "epoch": 2563} {"train_loss": -12.386107444763184, "global_step": 430640, "epoch": 2563} {"train_loss": -12.330707550048828, "global_step": 430641, "epoch": 2563} {"train_loss": -12.640257835388184, "global_step": 430642, "epoch": 2563} {"train_loss": -12.608691215515137, "global_step": 430643, "epoch": 2563} {"train_loss": -12.272253036499023, "global_step": 430644, "epoch": 2563} {"train_loss": -12.822021484375, "global_step": 430645, "epoch": 2563} {"train_loss": -12.491833686828613, "global_step": 430646, "epoch": 2563} {"train_loss": -12.786026000976562, "global_step": 430647, "epoch": 2563} {"train_loss": -12.695802688598633, "global_step": 430648, "epoch": 2563} {"train_loss": -12.631444931030273, "global_step": 430649, "epoch": 2563} {"train_loss": -12.536792755126953, "global_step": 430650, "epoch": 2563} {"train_loss": -12.4754056930542, "global_step": 430651, "epoch": 2563} {"train_loss": -12.563804626464844, "global_step": 430652, "epoch": 2563} {"train_loss": -12.49077320098877, "global_step": 430653, "epoch": 2563} {"train_loss": -12.576738357543945, "global_step": 430654, "epoch": 2563} {"train_loss": -12.438758850097656, "global_step": 430655, "epoch": 2563} {"train_loss": -12.50166130065918, "global_step": 430656, "epoch": 2563} {"train_loss": -12.293204307556152, "global_step": 430657, "epoch": 2563} {"train_loss": -12.7256441116333, "global_step": 430658, "epoch": 2563} {"train_loss": -12.41180419921875, "global_step": 430659, "epoch": 2563} {"train_loss": -12.433318138122559, "global_step": 430660, "epoch": 2563} {"train_loss": -12.601404190063477, "global_step": 430661, "epoch": 2563} {"train_loss": -12.425985336303711, "global_step": 430662, "epoch": 2563} {"train_loss": -12.638167381286621, "global_step": 430663, "epoch": 2563} {"train_loss": -12.524405479431152, "global_step": 430664, "epoch": 2563} {"train_loss": -12.640873908996582, "global_step": 430665, "epoch": 2563} {"train_loss": -12.784310340881348, "global_step": 430666, "epoch": 2563} {"train_loss": -12.580059051513672, "global_step": 430667, "epoch": 2563} {"train_loss": -12.920156478881836, "global_step": 430668, "epoch": 2563} {"train_loss": -12.783623695373535, "global_step": 430669, "epoch": 2563} {"train_loss": -12.719741821289062, "global_step": 430670, "epoch": 2563} {"train_loss": -12.701766967773438, "global_step": 430671, "epoch": 2563} {"train_loss": -12.896987915039062, "global_step": 430672, "epoch": 2563} {"train_loss": -12.886398315429688, "global_step": 430673, "epoch": 2563} {"train_loss": -12.93018627166748, "global_step": 430674, "epoch": 2563} {"train_loss": -12.723075866699219, "global_step": 430675, "epoch": 2563} {"train_loss": -12.935973167419434, "global_step": 430676, "epoch": 2563} {"train_loss": -12.893003463745117, "global_step": 430677, "epoch": 2563} {"train_loss": -12.787315368652344, "global_step": 430678, "epoch": 2563} {"train_loss": -12.800872802734375, "global_step": 430679, "epoch": 2563} {"train_loss": -12.732694625854492, "global_step": 430680, "epoch": 2563} {"train_loss": -12.215620040893555, "global_step": 430681, "epoch": 2563} {"train_loss": -12.805627822875977, "global_step": 430682, "epoch": 2563} {"train_loss": -12.628308296203613, "global_step": 430683, "epoch": 2563} {"train_loss": -12.862086296081543, "global_step": 430684, "epoch": 2563} {"train_loss": -12.834999084472656, "global_step": 430685, "epoch": 2563} {"train_loss": -12.996795654296875, "global_step": 430686, "epoch": 2563} {"train_loss": -12.997905731201172, "global_step": 430687, "epoch": 2563} {"train_loss": -12.93503475189209, "global_step": 430688, "epoch": 2563} {"train_loss": -12.96676254272461, "global_step": 430689, "epoch": 2563} {"train_loss": -12.965681076049805, "global_step": 430690, "epoch": 2563} {"train_loss": -12.961475372314453, "global_step": 430691, "epoch": 2563} {"train_loss": -12.951601028442383, "global_step": 430692, "epoch": 2563} {"train_loss": -13.09214973449707, "global_step": 430693, "epoch": 2563} {"train_loss": -12.910026550292969, "global_step": 430694, "epoch": 2563} {"train_loss": -12.916788101196289, "global_step": 430695, "epoch": 2563} {"train_loss": -12.932186126708984, "global_step": 430696, "epoch": 2563} {"train_loss": -12.71222972869873, "global_step": 430697, "epoch": 2563} {"train_loss": -12.905821800231934, "global_step": 430698, "epoch": 2563} {"train_loss": -12.739410400390625, "global_step": 430699, "epoch": 2563} {"train_loss": -12.521490097045898, "global_step": 430700, "epoch": 2563} {"train_loss": -12.756913185119629, "global_step": 430701, "epoch": 2563} {"train_loss": -12.846335411071777, "global_step": 430702, "epoch": 2563} {"train_loss": -12.795439720153809, "global_step": 430703, "epoch": 2563} {"train_loss": -12.74903678894043, "global_step": 430704, "epoch": 2563} {"train_loss": -12.576032638549805, "global_step": 430705, "epoch": 2563} {"train_loss": -12.888216018676758, "global_step": 430706, "epoch": 2563} {"train_loss": -12.58247184753418, "global_step": 430707, "epoch": 2563} {"train_loss": -12.518866539001465, "global_step": 430708, "epoch": 2563} {"train_loss": -12.610224723815918, "global_step": 430709, "epoch": 2563} {"train_loss": -12.782588005065918, "global_step": 430710, "epoch": 2563} {"train_loss": -12.757160186767578, "global_step": 430711, "epoch": 2563} {"train_loss": -12.479116439819336, "global_step": 430712, "epoch": 2563} {"train_loss": -12.298391342163086, "global_step": 430713, "epoch": 2563} {"train_loss": -12.68274974822998, "global_step": 430714, "epoch": 2563} {"train_loss": -12.173337936401367, "global_step": 430715, "epoch": 2563} {"train_loss": -12.641273498535156, "global_step": 430716, "epoch": 2563} {"train_loss": -11.972973823547363, "global_step": 430717, "epoch": 2563} {"train_loss": -11.090744018554688, "global_step": 430718, "epoch": 2563} {"train_loss": -11.543187141418457, "global_step": 430719, "epoch": 2563} {"train_loss": -12.560893058776855, "global_step": 430720, "epoch": 2563} {"train_loss": -10.180150032043457, "global_step": 430721, "epoch": 2563} {"train_loss": -11.28801441192627, "global_step": 430722, "epoch": 2563} {"train_loss": -12.126657485961914, "global_step": 430723, "epoch": 2563} {"train_loss": -10.68780517578125, "global_step": 430724, "epoch": 2563} {"train_loss": -9.910934448242188, "global_step": 430725, "epoch": 2563} {"train_loss": -11.87989330291748, "global_step": 430726, "epoch": 2563} {"train_loss": -9.170858383178711, "global_step": 430727, "epoch": 2563} {"train_loss": -8.50887680053711, "global_step": 430728, "epoch": 2563} {"train_loss": -7.916964530944824, "global_step": 430729, "epoch": 2563} {"train_loss": -8.835563659667969, "global_step": 430730, "epoch": 2563} {"train_loss": -8.245595932006836, "global_step": 430731, "epoch": 2563} {"train_loss": -7.232020378112793, "global_step": 430732, "epoch": 2563} {"train_loss": -8.724994659423828, "global_step": 430733, "epoch": 2563} {"train_loss": -9.510236740112305, "global_step": 430734, "epoch": 2563} {"train_loss": -9.22997760772705, "global_step": 430735, "epoch": 2563} {"train_loss": -8.833039283752441, "global_step": 430736, "epoch": 2563} {"train_loss": -9.461393356323242, "global_step": 430737, "epoch": 2563} {"train_loss": -8.189159393310547, "global_step": 430738, "epoch": 2563} {"train_loss": -7.111233711242676, "global_step": 430739, "epoch": 2563} {"train_loss": -7.685407638549805, "global_step": 430740, "epoch": 2563} {"train_loss": -7.409025192260742, "global_step": 430741, "epoch": 2563} {"train_loss": -8.78280258178711, "global_step": 430742, "epoch": 2563} {"train_loss": -8.669733047485352, "global_step": 430743, "epoch": 2563} {"train_loss": -9.61931037902832, "global_step": 430744, "epoch": 2563} {"train_loss": -9.212665557861328, "global_step": 430745, "epoch": 2563} {"train_loss": -9.380495071411133, "global_step": 430746, "epoch": 2563} {"train_loss": -9.039502143859863, "global_step": 430747, "epoch": 2563} {"train_loss": -8.42922306060791, "global_step": 430748, "epoch": 2563} {"train_loss": -10.301676750183105, "global_step": 430749, "epoch": 2563} {"train_loss": -9.288280487060547, "global_step": 430750, "epoch": 2563} {"train_loss": -11.773729892004104, "global_step": 430751, "epoch": 2563, "val_loss": 308767.125} {"train_loss": -8.916112899780273, "global_step": 430752, "epoch": 2564} {"train_loss": -10.39247989654541, "global_step": 430753, "epoch": 2564} {"train_loss": -10.316304206848145, "global_step": 430754, "epoch": 2564} {"train_loss": -9.45765495300293, "global_step": 430755, "epoch": 2564} {"train_loss": -11.519292831420898, "global_step": 430756, "epoch": 2564} {"train_loss": -10.713518142700195, "global_step": 430757, "epoch": 2564} {"train_loss": -10.239625930786133, "global_step": 430758, "epoch": 2564} {"train_loss": -11.128412246704102, "global_step": 430759, "epoch": 2564} {"train_loss": -10.171142578125, "global_step": 430760, "epoch": 2564} {"train_loss": -10.971002578735352, "global_step": 430761, "epoch": 2564} {"train_loss": -11.468283653259277, "global_step": 430762, "epoch": 2564} {"train_loss": -11.442010879516602, "global_step": 430763, "epoch": 2564} {"train_loss": -11.524934768676758, "global_step": 430764, "epoch": 2564} {"train_loss": -11.639032363891602, "global_step": 430765, "epoch": 2564} {"train_loss": -11.356947898864746, "global_step": 430766, "epoch": 2564} {"train_loss": -11.597553253173828, "global_step": 430767, "epoch": 2564} {"train_loss": -11.857020378112793, "global_step": 430768, "epoch": 2564} {"train_loss": -11.794528007507324, "global_step": 430769, "epoch": 2564} {"train_loss": -11.710161209106445, "global_step": 430770, "epoch": 2564} {"train_loss": -11.704172134399414, "global_step": 430771, "epoch": 2564} {"train_loss": -12.117711067199707, "global_step": 430772, "epoch": 2564} {"train_loss": -11.7849702835083, "global_step": 430773, "epoch": 2564} {"train_loss": -11.910550117492676, "global_step": 430774, "epoch": 2564} {"train_loss": -11.79388427734375, "global_step": 430775, "epoch": 2564} {"train_loss": -11.446666717529297, "global_step": 430776, "epoch": 2564} {"train_loss": -11.964775085449219, "global_step": 430777, "epoch": 2564} {"train_loss": -11.767963409423828, "global_step": 430778, "epoch": 2564} {"train_loss": -11.765822410583496, "global_step": 430779, "epoch": 2564} {"train_loss": -12.26234245300293, "global_step": 430780, "epoch": 2564} {"train_loss": -11.645885467529297, "global_step": 430781, "epoch": 2564} {"train_loss": -12.014544486999512, "global_step": 430782, "epoch": 2564} {"train_loss": -12.283134460449219, "global_step": 430783, "epoch": 2564} {"train_loss": -12.029244422912598, "global_step": 430784, "epoch": 2564} {"train_loss": -12.008073806762695, "global_step": 430785, "epoch": 2564} {"train_loss": -12.07507038116455, "global_step": 430786, "epoch": 2564} {"train_loss": -11.981783866882324, "global_step": 430787, "epoch": 2564} {"train_loss": -12.013697624206543, "global_step": 430788, "epoch": 2564} {"train_loss": -11.93812370300293, "global_step": 430789, "epoch": 2564} {"train_loss": -12.184694290161133, "global_step": 430790, "epoch": 2564} {"train_loss": -12.223773956298828, "global_step": 430791, "epoch": 2564} {"train_loss": -12.063556671142578, "global_step": 430792, "epoch": 2564} {"train_loss": -11.901427268981934, "global_step": 430793, "epoch": 2564} {"train_loss": -12.22414779663086, "global_step": 430794, "epoch": 2564} {"train_loss": -11.787111282348633, "global_step": 430795, "epoch": 2564} {"train_loss": -11.817346572875977, "global_step": 430796, "epoch": 2564} {"train_loss": -11.962234497070312, "global_step": 430797, "epoch": 2564} {"train_loss": -11.793099403381348, "global_step": 430798, "epoch": 2564} {"train_loss": -12.288333892822266, "global_step": 430799, "epoch": 2564} {"train_loss": -11.832642555236816, "global_step": 430800, "epoch": 2564} {"train_loss": -11.763725280761719, "global_step": 430801, "epoch": 2564} {"train_loss": -12.14879035949707, "global_step": 430802, "epoch": 2564} {"train_loss": -11.962875366210938, "global_step": 430803, "epoch": 2564} {"train_loss": -12.409490585327148, "global_step": 430804, "epoch": 2564} {"train_loss": -12.291790008544922, "global_step": 430805, "epoch": 2564} {"train_loss": -12.287662506103516, "global_step": 430806, "epoch": 2564} {"train_loss": -12.47647476196289, "global_step": 430807, "epoch": 2564} {"train_loss": -12.27142333984375, "global_step": 430808, "epoch": 2564} {"train_loss": -12.490036010742188, "global_step": 430809, "epoch": 2564} {"train_loss": -12.461477279663086, "global_step": 430810, "epoch": 2564} {"train_loss": -12.417308807373047, "global_step": 430811, "epoch": 2564} {"train_loss": -12.59018325805664, "global_step": 430812, "epoch": 2564} {"train_loss": -12.457420349121094, "global_step": 430813, "epoch": 2564} {"train_loss": -12.477701187133789, "global_step": 430814, "epoch": 2564} {"train_loss": -12.425106048583984, "global_step": 430815, "epoch": 2564} {"train_loss": -12.605086326599121, "global_step": 430816, "epoch": 2564} {"train_loss": -12.527867317199707, "global_step": 430817, "epoch": 2564} {"train_loss": -12.638575553894043, "global_step": 430818, "epoch": 2564} {"train_loss": -12.537555694580078, "global_step": 430819, "epoch": 2564} {"train_loss": -12.678987503051758, "global_step": 430820, "epoch": 2564} {"train_loss": -12.554128646850586, "global_step": 430821, "epoch": 2564} {"train_loss": -12.588403701782227, "global_step": 430822, "epoch": 2564} {"train_loss": -12.308223724365234, "global_step": 430823, "epoch": 2564} {"train_loss": -12.562250137329102, "global_step": 430824, "epoch": 2564} {"train_loss": -12.445686340332031, "global_step": 430825, "epoch": 2564} {"train_loss": -12.585289001464844, "global_step": 430826, "epoch": 2564} {"train_loss": -12.530828475952148, "global_step": 430827, "epoch": 2564} {"train_loss": -12.406513214111328, "global_step": 430828, "epoch": 2564} {"train_loss": -12.660726547241211, "global_step": 430829, "epoch": 2564} {"train_loss": -12.387765884399414, "global_step": 430830, "epoch": 2564} {"train_loss": -12.384933471679688, "global_step": 430831, "epoch": 2564} {"train_loss": -12.522749900817871, "global_step": 430832, "epoch": 2564} {"train_loss": -12.768863677978516, "global_step": 430833, "epoch": 2564} {"train_loss": -12.350639343261719, "global_step": 430834, "epoch": 2564} {"train_loss": -12.359732627868652, "global_step": 430835, "epoch": 2564} {"train_loss": -12.751693725585938, "global_step": 430836, "epoch": 2564} {"train_loss": -12.537839889526367, "global_step": 430837, "epoch": 2564} {"train_loss": -12.456443786621094, "global_step": 430838, "epoch": 2564} {"train_loss": -12.466228485107422, "global_step": 430839, "epoch": 2564} {"train_loss": -12.39998722076416, "global_step": 430840, "epoch": 2564} {"train_loss": -12.65754222869873, "global_step": 430841, "epoch": 2564} {"train_loss": -12.703176498413086, "global_step": 430842, "epoch": 2564} {"train_loss": -12.633950233459473, "global_step": 430843, "epoch": 2564} {"train_loss": -12.599396705627441, "global_step": 430844, "epoch": 2564} {"train_loss": -12.471746444702148, "global_step": 430845, "epoch": 2564} {"train_loss": -12.402644157409668, "global_step": 430846, "epoch": 2564} {"train_loss": -12.770612716674805, "global_step": 430847, "epoch": 2564} {"train_loss": -12.130041122436523, "global_step": 430848, "epoch": 2564} {"train_loss": -11.765535354614258, "global_step": 430849, "epoch": 2564} {"train_loss": -11.929790496826172, "global_step": 430850, "epoch": 2564} {"train_loss": -11.621028900146484, "global_step": 430851, "epoch": 2564} {"train_loss": -11.989728927612305, "global_step": 430852, "epoch": 2564} {"train_loss": -11.939369201660156, "global_step": 430853, "epoch": 2564} {"train_loss": -11.112724304199219, "global_step": 430854, "epoch": 2564} {"train_loss": -11.549993515014648, "global_step": 430855, "epoch": 2564} {"train_loss": -12.186614036560059, "global_step": 430856, "epoch": 2564} {"train_loss": -10.814780235290527, "global_step": 430857, "epoch": 2564} {"train_loss": -12.470245361328125, "global_step": 430858, "epoch": 2564} {"train_loss": -9.658966064453125, "global_step": 430859, "epoch": 2564} {"train_loss": -12.027012825012207, "global_step": 430860, "epoch": 2564} {"train_loss": -11.359251976013184, "global_step": 430861, "epoch": 2564} {"train_loss": -11.545267105102539, "global_step": 430862, "epoch": 2564} {"train_loss": -11.385040283203125, "global_step": 430863, "epoch": 2564} {"train_loss": -11.558805465698242, "global_step": 430864, "epoch": 2564} {"train_loss": -12.024053573608398, "global_step": 430865, "epoch": 2564} {"train_loss": -11.992369651794434, "global_step": 430866, "epoch": 2564} {"train_loss": -12.420389175415039, "global_step": 430867, "epoch": 2564} {"train_loss": -12.168014526367188, "global_step": 430868, "epoch": 2564} {"train_loss": -12.478856086730957, "global_step": 430869, "epoch": 2564} {"train_loss": -12.096625328063965, "global_step": 430870, "epoch": 2564} {"train_loss": -12.366416931152344, "global_step": 430871, "epoch": 2564} {"train_loss": -12.232559204101562, "global_step": 430872, "epoch": 2564} {"train_loss": -12.23388385772705, "global_step": 430873, "epoch": 2564} {"train_loss": -12.432690620422363, "global_step": 430874, "epoch": 2564} {"train_loss": -12.450695991516113, "global_step": 430875, "epoch": 2564} {"train_loss": -12.4121732711792, "global_step": 430876, "epoch": 2564} {"train_loss": -12.103822708129883, "global_step": 430877, "epoch": 2564} {"train_loss": -12.639142990112305, "global_step": 430878, "epoch": 2564} {"train_loss": -12.472511291503906, "global_step": 430879, "epoch": 2564} {"train_loss": -12.261398315429688, "global_step": 430880, "epoch": 2564} {"train_loss": -12.270853042602539, "global_step": 430881, "epoch": 2564} {"train_loss": -12.527847290039062, "global_step": 430882, "epoch": 2564} {"train_loss": -11.726210594177246, "global_step": 430883, "epoch": 2564} {"train_loss": -12.349382400512695, "global_step": 430884, "epoch": 2564} {"train_loss": -11.908803939819336, "global_step": 430885, "epoch": 2564} {"train_loss": -12.56702995300293, "global_step": 430886, "epoch": 2564} {"train_loss": -11.927724838256836, "global_step": 430887, "epoch": 2564} {"train_loss": -12.771737098693848, "global_step": 430888, "epoch": 2564} {"train_loss": -12.195877075195312, "global_step": 430889, "epoch": 2564} {"train_loss": -12.623430252075195, "global_step": 430890, "epoch": 2564} {"train_loss": -12.697300910949707, "global_step": 430891, "epoch": 2564} {"train_loss": -12.388503074645996, "global_step": 430892, "epoch": 2564} {"train_loss": -12.294110298156738, "global_step": 430893, "epoch": 2564} {"train_loss": -12.189061164855957, "global_step": 430894, "epoch": 2564} {"train_loss": -12.458314895629883, "global_step": 430895, "epoch": 2564} {"train_loss": -12.106998443603516, "global_step": 430896, "epoch": 2564} {"train_loss": -12.466978073120117, "global_step": 430897, "epoch": 2564} {"train_loss": -12.699126243591309, "global_step": 430898, "epoch": 2564} {"train_loss": -11.445480346679688, "global_step": 430899, "epoch": 2564} {"train_loss": -12.268306732177734, "global_step": 430900, "epoch": 2564} {"train_loss": -12.1238431930542, "global_step": 430901, "epoch": 2564} {"train_loss": -11.915933609008789, "global_step": 430902, "epoch": 2564} {"train_loss": -12.337533950805664, "global_step": 430903, "epoch": 2564} {"train_loss": -12.658039093017578, "global_step": 430904, "epoch": 2564} {"train_loss": -12.039841651916504, "global_step": 430905, "epoch": 2564} {"train_loss": -12.596238136291504, "global_step": 430906, "epoch": 2564} {"train_loss": -12.13089370727539, "global_step": 430907, "epoch": 2564} {"train_loss": -12.387239456176758, "global_step": 430908, "epoch": 2564} {"train_loss": -12.387946128845215, "global_step": 430909, "epoch": 2564} {"train_loss": -11.830912590026855, "global_step": 430910, "epoch": 2564} {"train_loss": -12.11499309539795, "global_step": 430911, "epoch": 2564} {"train_loss": -12.367107391357422, "global_step": 430912, "epoch": 2564} {"train_loss": -12.134140014648438, "global_step": 430913, "epoch": 2564} {"train_loss": -11.884998321533203, "global_step": 430914, "epoch": 2564} {"train_loss": -12.380722045898438, "global_step": 430915, "epoch": 2564} {"train_loss": -11.856462478637695, "global_step": 430916, "epoch": 2564} {"train_loss": -12.149027824401855, "global_step": 430917, "epoch": 2564} {"train_loss": -12.211105346679688, "global_step": 430918, "epoch": 2564} {"train_loss": -12.050928848130363, "global_step": 430919, "epoch": 2564, "val_loss": 311877.40625} {"train_loss": -12.624273300170898, "global_step": 430920, "epoch": 2565} {"train_loss": -11.006444931030273, "global_step": 430921, "epoch": 2565} {"train_loss": -11.878181457519531, "global_step": 430922, "epoch": 2565} {"train_loss": -11.963957786560059, "global_step": 430923, "epoch": 2565} {"train_loss": -11.71645736694336, "global_step": 430924, "epoch": 2565} {"train_loss": -11.86229419708252, "global_step": 430925, "epoch": 2565} {"train_loss": -11.790456771850586, "global_step": 430926, "epoch": 2565} {"train_loss": -11.75428581237793, "global_step": 430927, "epoch": 2565} {"train_loss": -10.967784881591797, "global_step": 430928, "epoch": 2565} {"train_loss": -11.070507049560547, "global_step": 430929, "epoch": 2565} {"train_loss": -10.376405715942383, "global_step": 430930, "epoch": 2565} {"train_loss": -11.157115936279297, "global_step": 430931, "epoch": 2565} {"train_loss": -11.052031517028809, "global_step": 430932, "epoch": 2565} {"train_loss": -9.548494338989258, "global_step": 430933, "epoch": 2565} {"train_loss": -11.026294708251953, "global_step": 430934, "epoch": 2565} {"train_loss": -10.590269088745117, "global_step": 430935, "epoch": 2565} {"train_loss": -10.637828826904297, "global_step": 430936, "epoch": 2565} {"train_loss": -11.92380428314209, "global_step": 430937, "epoch": 2565} {"train_loss": -10.768959045410156, "global_step": 430938, "epoch": 2565} {"train_loss": -12.05827522277832, "global_step": 430939, "epoch": 2565} {"train_loss": -11.76198959350586, "global_step": 430940, "epoch": 2565} {"train_loss": -11.736051559448242, "global_step": 430941, "epoch": 2565} {"train_loss": -11.934123039245605, "global_step": 430942, "epoch": 2565} {"train_loss": -12.118338584899902, "global_step": 430943, "epoch": 2565} {"train_loss": -12.256460189819336, "global_step": 430944, "epoch": 2565} {"train_loss": -12.447395324707031, "global_step": 430945, "epoch": 2565} {"train_loss": -12.33055305480957, "global_step": 430946, "epoch": 2565} {"train_loss": -12.26284408569336, "global_step": 430947, "epoch": 2565} {"train_loss": -12.569830894470215, "global_step": 430948, "epoch": 2565} {"train_loss": -12.427129745483398, "global_step": 430949, "epoch": 2565} {"train_loss": -12.443646430969238, "global_step": 430950, "epoch": 2565} {"train_loss": -12.391861915588379, "global_step": 430951, "epoch": 2565} {"train_loss": -12.329535484313965, "global_step": 430952, "epoch": 2565} {"train_loss": -12.583585739135742, "global_step": 430953, "epoch": 2565} {"train_loss": -12.557840347290039, "global_step": 430954, "epoch": 2565} {"train_loss": -12.250807762145996, "global_step": 430955, "epoch": 2565} {"train_loss": -12.464245796203613, "global_step": 430956, "epoch": 2565} {"train_loss": -12.478374481201172, "global_step": 430957, "epoch": 2565} {"train_loss": -12.279088973999023, "global_step": 430958, "epoch": 2565} {"train_loss": -12.611045837402344, "global_step": 430959, "epoch": 2565} {"train_loss": -12.352807998657227, "global_step": 430960, "epoch": 2565} {"train_loss": -12.177925109863281, "global_step": 430961, "epoch": 2565} {"train_loss": -12.568723678588867, "global_step": 430962, "epoch": 2565} {"train_loss": -12.698315620422363, "global_step": 430963, "epoch": 2565} {"train_loss": -12.683122634887695, "global_step": 430964, "epoch": 2565} {"train_loss": -12.607898712158203, "global_step": 430965, "epoch": 2565} {"train_loss": -12.630797386169434, "global_step": 430966, "epoch": 2565} {"train_loss": -12.484611511230469, "global_step": 430967, "epoch": 2565} {"train_loss": -12.693007469177246, "global_step": 430968, "epoch": 2565} {"train_loss": -12.617341041564941, "global_step": 430969, "epoch": 2565} {"train_loss": -12.599960327148438, "global_step": 430970, "epoch": 2565} {"train_loss": -12.699074745178223, "global_step": 430971, "epoch": 2565} {"train_loss": -12.5172758102417, "global_step": 430972, "epoch": 2565} {"train_loss": -12.346893310546875, "global_step": 430973, "epoch": 2565} {"train_loss": -12.472057342529297, "global_step": 430974, "epoch": 2565} {"train_loss": -12.853570938110352, "global_step": 430975, "epoch": 2565} {"train_loss": -12.346349716186523, "global_step": 430976, "epoch": 2565} {"train_loss": -12.719768524169922, "global_step": 430977, "epoch": 2565} {"train_loss": -12.533548355102539, "global_step": 430978, "epoch": 2565} {"train_loss": -12.286148071289062, "global_step": 430979, "epoch": 2565} {"train_loss": -12.282974243164062, "global_step": 430980, "epoch": 2565} {"train_loss": -12.6590576171875, "global_step": 430981, "epoch": 2565} {"train_loss": -12.550809860229492, "global_step": 430982, "epoch": 2565} {"train_loss": -12.613811492919922, "global_step": 430983, "epoch": 2565} {"train_loss": -12.717015266418457, "global_step": 430984, "epoch": 2565} {"train_loss": -12.732194900512695, "global_step": 430985, "epoch": 2565} {"train_loss": -12.59937572479248, "global_step": 430986, "epoch": 2565} {"train_loss": -12.424202919006348, "global_step": 430987, "epoch": 2565} {"train_loss": -12.583303451538086, "global_step": 430988, "epoch": 2565} {"train_loss": -12.606390953063965, "global_step": 430989, "epoch": 2565} {"train_loss": -12.700061798095703, "global_step": 430990, "epoch": 2565} {"train_loss": -12.323833465576172, "global_step": 430991, "epoch": 2565} {"train_loss": -11.980456352233887, "global_step": 430992, "epoch": 2565} {"train_loss": -12.246606826782227, "global_step": 430993, "epoch": 2565} {"train_loss": -11.861433029174805, "global_step": 430994, "epoch": 2565} {"train_loss": -10.547196388244629, "global_step": 430995, "epoch": 2565} {"train_loss": -12.19384765625, "global_step": 430996, "epoch": 2565} {"train_loss": -11.144140243530273, "global_step": 430997, "epoch": 2565} {"train_loss": -10.724764823913574, "global_step": 430998, "epoch": 2565} {"train_loss": -11.780723571777344, "global_step": 430999, "epoch": 2565} {"train_loss": -11.03497314453125, "global_step": 431000, "epoch": 2565} {"train_loss": -11.558128356933594, "global_step": 431001, "epoch": 2565} {"train_loss": -12.20596981048584, "global_step": 431002, "epoch": 2565} {"train_loss": -12.076204299926758, "global_step": 431003, "epoch": 2565} {"train_loss": -12.132271766662598, "global_step": 431004, "epoch": 2565} {"train_loss": -11.89264965057373, "global_step": 431005, "epoch": 2565} {"train_loss": -12.220379829406738, "global_step": 431006, "epoch": 2565} {"train_loss": -12.191850662231445, "global_step": 431007, "epoch": 2565} {"train_loss": -12.18703556060791, "global_step": 431008, "epoch": 2565} {"train_loss": -12.046819686889648, "global_step": 431009, "epoch": 2565} {"train_loss": -12.257333755493164, "global_step": 431010, "epoch": 2565} {"train_loss": -12.096087455749512, "global_step": 431011, "epoch": 2565} {"train_loss": -11.500246047973633, "global_step": 431012, "epoch": 2565} {"train_loss": -12.139772415161133, "global_step": 431013, "epoch": 2565} {"train_loss": -11.42593765258789, "global_step": 431014, "epoch": 2565} {"train_loss": -11.43886661529541, "global_step": 431015, "epoch": 2565} {"train_loss": -10.988008499145508, "global_step": 431016, "epoch": 2565} {"train_loss": -11.675237655639648, "global_step": 431017, "epoch": 2565} {"train_loss": -11.220136642456055, "global_step": 431018, "epoch": 2565} {"train_loss": -10.940143585205078, "global_step": 431019, "epoch": 2565} {"train_loss": -11.896032333374023, "global_step": 431020, "epoch": 2565} {"train_loss": -11.129104614257812, "global_step": 431021, "epoch": 2565} {"train_loss": -11.610595703125, "global_step": 431022, "epoch": 2565} {"train_loss": -11.065266609191895, "global_step": 431023, "epoch": 2565} {"train_loss": -11.566339492797852, "global_step": 431024, "epoch": 2565} {"train_loss": -11.557065963745117, "global_step": 431025, "epoch": 2565} {"train_loss": -11.102548599243164, "global_step": 431026, "epoch": 2565} {"train_loss": -11.616159439086914, "global_step": 431027, "epoch": 2565} {"train_loss": -11.269290924072266, "global_step": 431028, "epoch": 2565} {"train_loss": -10.820697784423828, "global_step": 431029, "epoch": 2565} {"train_loss": -10.72939682006836, "global_step": 431030, "epoch": 2565} {"train_loss": -10.423465728759766, "global_step": 431031, "epoch": 2565} {"train_loss": -11.112462997436523, "global_step": 431032, "epoch": 2565} {"train_loss": -10.6195707321167, "global_step": 431033, "epoch": 2565} {"train_loss": -10.615324020385742, "global_step": 431034, "epoch": 2565} {"train_loss": -11.598499298095703, "global_step": 431035, "epoch": 2565} {"train_loss": -11.262832641601562, "global_step": 431036, "epoch": 2565} {"train_loss": -11.17849349975586, "global_step": 431037, "epoch": 2565} {"train_loss": -11.770139694213867, "global_step": 431038, "epoch": 2565} {"train_loss": -11.053750038146973, "global_step": 431039, "epoch": 2565} {"train_loss": -11.028575897216797, "global_step": 431040, "epoch": 2565} {"train_loss": -10.960067749023438, "global_step": 431041, "epoch": 2565} {"train_loss": -11.935571670532227, "global_step": 431042, "epoch": 2565} {"train_loss": -11.388704299926758, "global_step": 431043, "epoch": 2565} {"train_loss": -12.126855850219727, "global_step": 431044, "epoch": 2565} {"train_loss": -11.759513854980469, "global_step": 431045, "epoch": 2565} {"train_loss": -11.432109832763672, "global_step": 431046, "epoch": 2565} {"train_loss": -11.299151420593262, "global_step": 431047, "epoch": 2565} {"train_loss": -10.744253158569336, "global_step": 431048, "epoch": 2565} {"train_loss": -11.800300598144531, "global_step": 431049, "epoch": 2565} {"train_loss": -11.050139427185059, "global_step": 431050, "epoch": 2565} {"train_loss": -12.050970077514648, "global_step": 431051, "epoch": 2565} {"train_loss": -11.250515937805176, "global_step": 431052, "epoch": 2565} {"train_loss": -12.118000030517578, "global_step": 431053, "epoch": 2565} {"train_loss": -11.551078796386719, "global_step": 431054, "epoch": 2565} {"train_loss": -12.230411529541016, "global_step": 431055, "epoch": 2565} {"train_loss": -11.568166732788086, "global_step": 431056, "epoch": 2565} {"train_loss": -12.525465965270996, "global_step": 431057, "epoch": 2565} {"train_loss": -10.848686218261719, "global_step": 431058, "epoch": 2565} {"train_loss": -12.287927627563477, "global_step": 431059, "epoch": 2565} {"train_loss": -11.424361228942871, "global_step": 431060, "epoch": 2565} {"train_loss": -12.22695541381836, "global_step": 431061, "epoch": 2565} {"train_loss": -11.47237777709961, "global_step": 431062, "epoch": 2565} {"train_loss": -11.603946685791016, "global_step": 431063, "epoch": 2565} {"train_loss": -10.897255897521973, "global_step": 431064, "epoch": 2565} {"train_loss": -12.11056900024414, "global_step": 431065, "epoch": 2565} {"train_loss": -11.632387161254883, "global_step": 431066, "epoch": 2565} {"train_loss": -11.612138748168945, "global_step": 431067, "epoch": 2565} {"train_loss": -12.165465354919434, "global_step": 431068, "epoch": 2565} {"train_loss": -11.958467483520508, "global_step": 431069, "epoch": 2565} {"train_loss": -12.331403732299805, "global_step": 431070, "epoch": 2565} {"train_loss": -12.306417465209961, "global_step": 431071, "epoch": 2565} {"train_loss": -12.249521255493164, "global_step": 431072, "epoch": 2565} {"train_loss": -12.555871963500977, "global_step": 431073, "epoch": 2565} {"train_loss": -12.321772575378418, "global_step": 431074, "epoch": 2565} {"train_loss": -12.271293640136719, "global_step": 431075, "epoch": 2565} {"train_loss": -12.557180404663086, "global_step": 431076, "epoch": 2565} {"train_loss": -12.251131057739258, "global_step": 431077, "epoch": 2565} {"train_loss": -12.362804412841797, "global_step": 431078, "epoch": 2565} {"train_loss": -12.532386779785156, "global_step": 431079, "epoch": 2565} {"train_loss": -12.296677589416504, "global_step": 431080, "epoch": 2565} {"train_loss": -12.424520492553711, "global_step": 431081, "epoch": 2565} {"train_loss": -12.467351913452148, "global_step": 431082, "epoch": 2565} {"train_loss": -12.496883392333984, "global_step": 431083, "epoch": 2565} {"train_loss": -11.990716934204102, "global_step": 431084, "epoch": 2565} {"train_loss": -12.524127960205078, "global_step": 431085, "epoch": 2565} {"train_loss": -12.261539459228516, "global_step": 431086, "epoch": 2565} {"train_loss": -11.887752311570305, "global_step": 431087, "epoch": 2565, "val_loss": 309301.96875, "train_action_mse_error": 1.9147038459777832} {"train_loss": -12.444040298461914, "global_step": 431088, "epoch": 2566} {"train_loss": -12.192450523376465, "global_step": 431089, "epoch": 2566} {"train_loss": -12.749436378479004, "global_step": 431090, "epoch": 2566} {"train_loss": -12.38436222076416, "global_step": 431091, "epoch": 2566} {"train_loss": -12.403294563293457, "global_step": 431092, "epoch": 2566} {"train_loss": -12.55108642578125, "global_step": 431093, "epoch": 2566} {"train_loss": -12.488588333129883, "global_step": 431094, "epoch": 2566} {"train_loss": -12.553069114685059, "global_step": 431095, "epoch": 2566} {"train_loss": -12.492069244384766, "global_step": 431096, "epoch": 2566} {"train_loss": -12.417081832885742, "global_step": 431097, "epoch": 2566} {"train_loss": -12.306394577026367, "global_step": 431098, "epoch": 2566} {"train_loss": -12.813705444335938, "global_step": 431099, "epoch": 2566} {"train_loss": -12.6198148727417, "global_step": 431100, "epoch": 2566} {"train_loss": -12.698152542114258, "global_step": 431101, "epoch": 2566} {"train_loss": -12.41879653930664, "global_step": 431102, "epoch": 2566} {"train_loss": -12.676826477050781, "global_step": 431103, "epoch": 2566} {"train_loss": -12.61900806427002, "global_step": 431104, "epoch": 2566} {"train_loss": -12.649224281311035, "global_step": 431105, "epoch": 2566} {"train_loss": -12.547693252563477, "global_step": 431106, "epoch": 2566} {"train_loss": -12.695825576782227, "global_step": 431107, "epoch": 2566} {"train_loss": -12.301704406738281, "global_step": 431108, "epoch": 2566} {"train_loss": -12.708450317382812, "global_step": 431109, "epoch": 2566} {"train_loss": -12.619010925292969, "global_step": 431110, "epoch": 2566} {"train_loss": -12.385149955749512, "global_step": 431111, "epoch": 2566} {"train_loss": -12.521798133850098, "global_step": 431112, "epoch": 2566} {"train_loss": -12.60260009765625, "global_step": 431113, "epoch": 2566} {"train_loss": -12.790825843811035, "global_step": 431114, "epoch": 2566} {"train_loss": -12.880918502807617, "global_step": 431115, "epoch": 2566} {"train_loss": -12.497871398925781, "global_step": 431116, "epoch": 2566} {"train_loss": -12.324374198913574, "global_step": 431117, "epoch": 2566} {"train_loss": -12.640647888183594, "global_step": 431118, "epoch": 2566} {"train_loss": -11.973390579223633, "global_step": 431119, "epoch": 2566} {"train_loss": -12.526908874511719, "global_step": 431120, "epoch": 2566} {"train_loss": -12.385923385620117, "global_step": 431121, "epoch": 2566} {"train_loss": -12.46556568145752, "global_step": 431122, "epoch": 2566} {"train_loss": -12.149290084838867, "global_step": 431123, "epoch": 2566} {"train_loss": -11.931090354919434, "global_step": 431124, "epoch": 2566} {"train_loss": -12.636670112609863, "global_step": 431125, "epoch": 2566} {"train_loss": -12.184243202209473, "global_step": 431126, "epoch": 2566} {"train_loss": -11.401626586914062, "global_step": 431127, "epoch": 2566} {"train_loss": -11.389156341552734, "global_step": 431128, "epoch": 2566} {"train_loss": -11.970803260803223, "global_step": 431129, "epoch": 2566} {"train_loss": -12.34487247467041, "global_step": 431130, "epoch": 2566} {"train_loss": -12.496467590332031, "global_step": 431131, "epoch": 2566} {"train_loss": -12.21754264831543, "global_step": 431132, "epoch": 2566} {"train_loss": -12.657544136047363, "global_step": 431133, "epoch": 2566} {"train_loss": -12.266214370727539, "global_step": 431134, "epoch": 2566} {"train_loss": -12.679875373840332, "global_step": 431135, "epoch": 2566} {"train_loss": -11.772618293762207, "global_step": 431136, "epoch": 2566} {"train_loss": -11.841341972351074, "global_step": 431137, "epoch": 2566} {"train_loss": -11.091190338134766, "global_step": 431138, "epoch": 2566} {"train_loss": -11.367877960205078, "global_step": 431139, "epoch": 2566} {"train_loss": -10.681567192077637, "global_step": 431140, "epoch": 2566} {"train_loss": -9.853063583374023, "global_step": 431141, "epoch": 2566} {"train_loss": -11.278688430786133, "global_step": 431142, "epoch": 2566} {"train_loss": -10.264171600341797, "global_step": 431143, "epoch": 2566} {"train_loss": -11.465373039245605, "global_step": 431144, "epoch": 2566} {"train_loss": -11.710454940795898, "global_step": 431145, "epoch": 2566} {"train_loss": -11.821123123168945, "global_step": 431146, "epoch": 2566} {"train_loss": -11.387896537780762, "global_step": 431147, "epoch": 2566} {"train_loss": -11.266883850097656, "global_step": 431148, "epoch": 2566} {"train_loss": -11.591047286987305, "global_step": 431149, "epoch": 2566} {"train_loss": -12.155116081237793, "global_step": 431150, "epoch": 2566} {"train_loss": -11.82236385345459, "global_step": 431151, "epoch": 2566} {"train_loss": -11.9192533493042, "global_step": 431152, "epoch": 2566} {"train_loss": -12.103656768798828, "global_step": 431153, "epoch": 2566} {"train_loss": -12.062225341796875, "global_step": 431154, "epoch": 2566} {"train_loss": -12.313305854797363, "global_step": 431155, "epoch": 2566} {"train_loss": -12.026603698730469, "global_step": 431156, "epoch": 2566} {"train_loss": -12.16751480102539, "global_step": 431157, "epoch": 2566} {"train_loss": -11.929591178894043, "global_step": 431158, "epoch": 2566} {"train_loss": -11.854828834533691, "global_step": 431159, "epoch": 2566} {"train_loss": -12.64634895324707, "global_step": 431160, "epoch": 2566} {"train_loss": -12.031551361083984, "global_step": 431161, "epoch": 2566} {"train_loss": -12.650397300720215, "global_step": 431162, "epoch": 2566} {"train_loss": -12.295287132263184, "global_step": 431163, "epoch": 2566} {"train_loss": -12.347223281860352, "global_step": 431164, "epoch": 2566} {"train_loss": -11.718910217285156, "global_step": 431165, "epoch": 2566} {"train_loss": -12.018112182617188, "global_step": 431166, "epoch": 2566} {"train_loss": -12.50091552734375, "global_step": 431167, "epoch": 2566} {"train_loss": -12.406396865844727, "global_step": 431168, "epoch": 2566} {"train_loss": -12.361980438232422, "global_step": 431169, "epoch": 2566} {"train_loss": -11.986604690551758, "global_step": 431170, "epoch": 2566} {"train_loss": -11.925015449523926, "global_step": 431171, "epoch": 2566} {"train_loss": -12.325276374816895, "global_step": 431172, "epoch": 2566} {"train_loss": -11.927497863769531, "global_step": 431173, "epoch": 2566} {"train_loss": -12.403353691101074, "global_step": 431174, "epoch": 2566} {"train_loss": -12.232510566711426, "global_step": 431175, "epoch": 2566} {"train_loss": -12.422380447387695, "global_step": 431176, "epoch": 2566} {"train_loss": -12.527974128723145, "global_step": 431177, "epoch": 2566} {"train_loss": -12.282224655151367, "global_step": 431178, "epoch": 2566} {"train_loss": -12.57164192199707, "global_step": 431179, "epoch": 2566} {"train_loss": -12.288450241088867, "global_step": 431180, "epoch": 2566} {"train_loss": -12.510568618774414, "global_step": 431181, "epoch": 2566} {"train_loss": -12.21049690246582, "global_step": 431182, "epoch": 2566} {"train_loss": -12.4744234085083, "global_step": 431183, "epoch": 2566} {"train_loss": -12.611786842346191, "global_step": 431184, "epoch": 2566} {"train_loss": -12.317747116088867, "global_step": 431185, "epoch": 2566} {"train_loss": -12.65427017211914, "global_step": 431186, "epoch": 2566} {"train_loss": -12.52331256866455, "global_step": 431187, "epoch": 2566} {"train_loss": -12.542369842529297, "global_step": 431188, "epoch": 2566} {"train_loss": -12.282793045043945, "global_step": 431189, "epoch": 2566} {"train_loss": -12.680560111999512, "global_step": 431190, "epoch": 2566} {"train_loss": -12.57646369934082, "global_step": 431191, "epoch": 2566} {"train_loss": -12.69916820526123, "global_step": 431192, "epoch": 2566} {"train_loss": -12.587492942810059, "global_step": 431193, "epoch": 2566} {"train_loss": -12.788420677185059, "global_step": 431194, "epoch": 2566} {"train_loss": -12.724530220031738, "global_step": 431195, "epoch": 2566} {"train_loss": -12.49577522277832, "global_step": 431196, "epoch": 2566} {"train_loss": -12.534774780273438, "global_step": 431197, "epoch": 2566} {"train_loss": -12.411308288574219, "global_step": 431198, "epoch": 2566} {"train_loss": -12.669267654418945, "global_step": 431199, "epoch": 2566} {"train_loss": -12.459209442138672, "global_step": 431200, "epoch": 2566} {"train_loss": -12.421424865722656, "global_step": 431201, "epoch": 2566} {"train_loss": -12.50733757019043, "global_step": 431202, "epoch": 2566} {"train_loss": -12.746891021728516, "global_step": 431203, "epoch": 2566} {"train_loss": -12.178657531738281, "global_step": 431204, "epoch": 2566} {"train_loss": -12.690452575683594, "global_step": 431205, "epoch": 2566} {"train_loss": -12.568735122680664, "global_step": 431206, "epoch": 2566} {"train_loss": -12.589814186096191, "global_step": 431207, "epoch": 2566} {"train_loss": -12.498323440551758, "global_step": 431208, "epoch": 2566} {"train_loss": -12.26400375366211, "global_step": 431209, "epoch": 2566} {"train_loss": -12.5430908203125, "global_step": 431210, "epoch": 2566} {"train_loss": -12.423221588134766, "global_step": 431211, "epoch": 2566} {"train_loss": -11.72947883605957, "global_step": 431212, "epoch": 2566} {"train_loss": -10.878467559814453, "global_step": 431213, "epoch": 2566} {"train_loss": -12.298112869262695, "global_step": 431214, "epoch": 2566} {"train_loss": -12.265965461730957, "global_step": 431215, "epoch": 2566} {"train_loss": -10.97549057006836, "global_step": 431216, "epoch": 2566} {"train_loss": -11.081317901611328, "global_step": 431217, "epoch": 2566} {"train_loss": -12.011102676391602, "global_step": 431218, "epoch": 2566} {"train_loss": -11.931976318359375, "global_step": 431219, "epoch": 2566} {"train_loss": -10.383012771606445, "global_step": 431220, "epoch": 2566} {"train_loss": -9.912446022033691, "global_step": 431221, "epoch": 2566} {"train_loss": -11.999223709106445, "global_step": 431222, "epoch": 2566} {"train_loss": -10.621253967285156, "global_step": 431223, "epoch": 2566} {"train_loss": -11.737038612365723, "global_step": 431224, "epoch": 2566} {"train_loss": -11.106077194213867, "global_step": 431225, "epoch": 2566} {"train_loss": -9.266193389892578, "global_step": 431226, "epoch": 2566} {"train_loss": -10.369248390197754, "global_step": 431227, "epoch": 2566} {"train_loss": -9.45638370513916, "global_step": 431228, "epoch": 2566} {"train_loss": -10.32568359375, "global_step": 431229, "epoch": 2566} {"train_loss": -9.629295349121094, "global_step": 431230, "epoch": 2566} {"train_loss": -10.545501708984375, "global_step": 431231, "epoch": 2566} {"train_loss": -9.421947479248047, "global_step": 431232, "epoch": 2566} {"train_loss": -11.427362442016602, "global_step": 431233, "epoch": 2566} {"train_loss": -9.10607624053955, "global_step": 431234, "epoch": 2566} {"train_loss": -9.76975154876709, "global_step": 431235, "epoch": 2566} {"train_loss": -8.82421875, "global_step": 431236, "epoch": 2566} {"train_loss": -9.248205184936523, "global_step": 431237, "epoch": 2566} {"train_loss": -9.224016189575195, "global_step": 431238, "epoch": 2566} {"train_loss": -10.668879508972168, "global_step": 431239, "epoch": 2566} {"train_loss": -9.680015563964844, "global_step": 431240, "epoch": 2566} {"train_loss": -9.408456802368164, "global_step": 431241, "epoch": 2566} {"train_loss": -9.87607192993164, "global_step": 431242, "epoch": 2566} {"train_loss": -11.20059585571289, "global_step": 431243, "epoch": 2566} {"train_loss": -10.202354431152344, "global_step": 431244, "epoch": 2566} {"train_loss": -10.043779373168945, "global_step": 431245, "epoch": 2566} {"train_loss": -10.298210144042969, "global_step": 431246, "epoch": 2566} {"train_loss": -10.545145988464355, "global_step": 431247, "epoch": 2566} {"train_loss": -9.8564453125, "global_step": 431248, "epoch": 2566} {"train_loss": -10.474931716918945, "global_step": 431249, "epoch": 2566} {"train_loss": -10.638862609863281, "global_step": 431250, "epoch": 2566} {"train_loss": -10.793680191040039, "global_step": 431251, "epoch": 2566} {"train_loss": -11.563173294067383, "global_step": 431252, "epoch": 2566} {"train_loss": -11.290945053100586, "global_step": 431253, "epoch": 2566} {"train_loss": -10.711334228515625, "global_step": 431254, "epoch": 2566} {"train_loss": -11.814739732515244, "global_step": 431255, "epoch": 2566, "val_loss": 308415.6875} {"train_loss": -11.839357376098633, "global_step": 431256, "epoch": 2567} {"train_loss": -11.29898452758789, "global_step": 431257, "epoch": 2567} {"train_loss": -11.649392127990723, "global_step": 431258, "epoch": 2567} {"train_loss": -11.513299942016602, "global_step": 431259, "epoch": 2567} {"train_loss": -11.952936172485352, "global_step": 431260, "epoch": 2567} {"train_loss": -11.504521369934082, "global_step": 431261, "epoch": 2567} {"train_loss": -11.79316234588623, "global_step": 431262, "epoch": 2567} {"train_loss": -11.874857902526855, "global_step": 431263, "epoch": 2567} {"train_loss": -11.586376190185547, "global_step": 431264, "epoch": 2567} {"train_loss": -12.100818634033203, "global_step": 431265, "epoch": 2567} {"train_loss": -11.984683990478516, "global_step": 431266, "epoch": 2567} {"train_loss": -12.214645385742188, "global_step": 431267, "epoch": 2567} {"train_loss": -11.861652374267578, "global_step": 431268, "epoch": 2567} {"train_loss": -12.15280532836914, "global_step": 431269, "epoch": 2567} {"train_loss": -11.813261985778809, "global_step": 431270, "epoch": 2567} {"train_loss": -11.888603210449219, "global_step": 431271, "epoch": 2567} {"train_loss": -11.948431015014648, "global_step": 431272, "epoch": 2567} {"train_loss": -11.97374153137207, "global_step": 431273, "epoch": 2567} {"train_loss": -11.91135025024414, "global_step": 431274, "epoch": 2567} {"train_loss": -11.858407974243164, "global_step": 431275, "epoch": 2567} {"train_loss": -11.966718673706055, "global_step": 431276, "epoch": 2567} {"train_loss": -11.94207763671875, "global_step": 431277, "epoch": 2567} {"train_loss": -12.384305000305176, "global_step": 431278, "epoch": 2567} {"train_loss": -11.966485977172852, "global_step": 431279, "epoch": 2567} {"train_loss": -12.20850944519043, "global_step": 431280, "epoch": 2567} {"train_loss": -12.000144004821777, "global_step": 431281, "epoch": 2567} {"train_loss": -11.977555274963379, "global_step": 431282, "epoch": 2567} {"train_loss": -12.350414276123047, "global_step": 431283, "epoch": 2567} {"train_loss": -12.337481498718262, "global_step": 431284, "epoch": 2567} {"train_loss": -12.090182304382324, "global_step": 431285, "epoch": 2567} {"train_loss": -12.27095890045166, "global_step": 431286, "epoch": 2567} {"train_loss": -12.060060501098633, "global_step": 431287, "epoch": 2567} {"train_loss": -12.347098350524902, "global_step": 431288, "epoch": 2567} {"train_loss": -12.312118530273438, "global_step": 431289, "epoch": 2567} {"train_loss": -12.305536270141602, "global_step": 431290, "epoch": 2567} {"train_loss": -12.324914932250977, "global_step": 431291, "epoch": 2567} {"train_loss": -12.202896118164062, "global_step": 431292, "epoch": 2567} {"train_loss": -12.233349800109863, "global_step": 431293, "epoch": 2567} {"train_loss": -12.435140609741211, "global_step": 431294, "epoch": 2567} {"train_loss": -12.405672073364258, "global_step": 431295, "epoch": 2567} {"train_loss": -12.651483535766602, "global_step": 431296, "epoch": 2567} {"train_loss": -12.548993110656738, "global_step": 431297, "epoch": 2567} {"train_loss": -12.583864212036133, "global_step": 431298, "epoch": 2567} {"train_loss": -12.586447715759277, "global_step": 431299, "epoch": 2567} {"train_loss": -12.395971298217773, "global_step": 431300, "epoch": 2567} {"train_loss": -12.546424865722656, "global_step": 431301, "epoch": 2567} {"train_loss": -12.432098388671875, "global_step": 431302, "epoch": 2567} {"train_loss": -12.571050643920898, "global_step": 431303, "epoch": 2567} {"train_loss": -12.462469100952148, "global_step": 431304, "epoch": 2567} {"train_loss": -12.514815330505371, "global_step": 431305, "epoch": 2567} {"train_loss": -12.426912307739258, "global_step": 431306, "epoch": 2567} {"train_loss": -12.594669342041016, "global_step": 431307, "epoch": 2567} {"train_loss": -12.49252700805664, "global_step": 431308, "epoch": 2567} {"train_loss": -12.689632415771484, "global_step": 431309, "epoch": 2567} {"train_loss": -12.630548477172852, "global_step": 431310, "epoch": 2567} {"train_loss": -12.444635391235352, "global_step": 431311, "epoch": 2567} {"train_loss": -12.679458618164062, "global_step": 431312, "epoch": 2567} {"train_loss": -12.730074882507324, "global_step": 431313, "epoch": 2567} {"train_loss": -12.485336303710938, "global_step": 431314, "epoch": 2567} {"train_loss": -12.587230682373047, "global_step": 431315, "epoch": 2567} {"train_loss": -12.663228988647461, "global_step": 431316, "epoch": 2567} {"train_loss": -12.542581558227539, "global_step": 431317, "epoch": 2567} {"train_loss": -12.95466136932373, "global_step": 431318, "epoch": 2567} {"train_loss": -12.52613639831543, "global_step": 431319, "epoch": 2567} {"train_loss": -12.745997428894043, "global_step": 431320, "epoch": 2567} {"train_loss": -12.59226131439209, "global_step": 431321, "epoch": 2567} {"train_loss": -12.556243896484375, "global_step": 431322, "epoch": 2567} {"train_loss": -12.879051208496094, "global_step": 431323, "epoch": 2567} {"train_loss": -12.619670867919922, "global_step": 431324, "epoch": 2567} {"train_loss": -12.843040466308594, "global_step": 431325, "epoch": 2567} {"train_loss": -12.717245101928711, "global_step": 431326, "epoch": 2567} {"train_loss": -12.724944114685059, "global_step": 431327, "epoch": 2567} {"train_loss": -12.804584503173828, "global_step": 431328, "epoch": 2567} {"train_loss": -12.82217788696289, "global_step": 431329, "epoch": 2567} {"train_loss": -12.64521598815918, "global_step": 431330, "epoch": 2567} {"train_loss": -12.86009407043457, "global_step": 431331, "epoch": 2567} {"train_loss": -12.84971809387207, "global_step": 431332, "epoch": 2567} {"train_loss": -12.808248519897461, "global_step": 431333, "epoch": 2567} {"train_loss": -12.698531150817871, "global_step": 431334, "epoch": 2567} {"train_loss": -12.596712112426758, "global_step": 431335, "epoch": 2567} {"train_loss": -12.860088348388672, "global_step": 431336, "epoch": 2567} {"train_loss": -12.76747989654541, "global_step": 431337, "epoch": 2567} {"train_loss": -12.725133895874023, "global_step": 431338, "epoch": 2567} {"train_loss": -12.770177841186523, "global_step": 431339, "epoch": 2567} {"train_loss": -12.548233032226562, "global_step": 431340, "epoch": 2567} {"train_loss": -12.71302318572998, "global_step": 431341, "epoch": 2567} {"train_loss": -12.797672271728516, "global_step": 431342, "epoch": 2567} {"train_loss": -12.549627304077148, "global_step": 431343, "epoch": 2567} {"train_loss": -12.199108123779297, "global_step": 431344, "epoch": 2567} {"train_loss": -12.032231330871582, "global_step": 431345, "epoch": 2567} {"train_loss": -12.441837310791016, "global_step": 431346, "epoch": 2567} {"train_loss": -11.584300994873047, "global_step": 431347, "epoch": 2567} {"train_loss": -12.227502822875977, "global_step": 431348, "epoch": 2567} {"train_loss": -12.456779479980469, "global_step": 431349, "epoch": 2567} {"train_loss": -11.478885650634766, "global_step": 431350, "epoch": 2567} {"train_loss": -12.451683044433594, "global_step": 431351, "epoch": 2567} {"train_loss": -11.900370597839355, "global_step": 431352, "epoch": 2567} {"train_loss": -11.579482078552246, "global_step": 431353, "epoch": 2567} {"train_loss": -12.357281684875488, "global_step": 431354, "epoch": 2567} {"train_loss": -12.235021591186523, "global_step": 431355, "epoch": 2567} {"train_loss": -11.558879852294922, "global_step": 431356, "epoch": 2567} {"train_loss": -12.44669246673584, "global_step": 431357, "epoch": 2567} {"train_loss": -11.623857498168945, "global_step": 431358, "epoch": 2567} {"train_loss": -12.299562454223633, "global_step": 431359, "epoch": 2567} {"train_loss": -11.874188423156738, "global_step": 431360, "epoch": 2567} {"train_loss": -10.433972358703613, "global_step": 431361, "epoch": 2567} {"train_loss": -11.867919921875, "global_step": 431362, "epoch": 2567} {"train_loss": -11.123062133789062, "global_step": 431363, "epoch": 2567} {"train_loss": -12.25826644897461, "global_step": 431364, "epoch": 2567} {"train_loss": -10.906081199645996, "global_step": 431365, "epoch": 2567} {"train_loss": -11.17553997039795, "global_step": 431366, "epoch": 2567} {"train_loss": -10.759479522705078, "global_step": 431367, "epoch": 2567} {"train_loss": -10.637666702270508, "global_step": 431368, "epoch": 2567} {"train_loss": -11.608963966369629, "global_step": 431369, "epoch": 2567} {"train_loss": -11.503643035888672, "global_step": 431370, "epoch": 2567} {"train_loss": -12.401411056518555, "global_step": 431371, "epoch": 2567} {"train_loss": -11.666311264038086, "global_step": 431372, "epoch": 2567} {"train_loss": -11.382455825805664, "global_step": 431373, "epoch": 2567} {"train_loss": -12.203903198242188, "global_step": 431374, "epoch": 2567} {"train_loss": -11.750640869140625, "global_step": 431375, "epoch": 2567} {"train_loss": -11.131341934204102, "global_step": 431376, "epoch": 2567} {"train_loss": -12.323341369628906, "global_step": 431377, "epoch": 2567} {"train_loss": -11.471870422363281, "global_step": 431378, "epoch": 2567} {"train_loss": -12.485018730163574, "global_step": 431379, "epoch": 2567} {"train_loss": -11.749290466308594, "global_step": 431380, "epoch": 2567} {"train_loss": -11.765606880187988, "global_step": 431381, "epoch": 2567} {"train_loss": -12.071101188659668, "global_step": 431382, "epoch": 2567} {"train_loss": -11.710567474365234, "global_step": 431383, "epoch": 2567} {"train_loss": -12.15376091003418, "global_step": 431384, "epoch": 2567} {"train_loss": -12.17078685760498, "global_step": 431385, "epoch": 2567} {"train_loss": -11.135010719299316, "global_step": 431386, "epoch": 2567} {"train_loss": -12.302791595458984, "global_step": 431387, "epoch": 2567} {"train_loss": -11.438933372497559, "global_step": 431388, "epoch": 2567} {"train_loss": -11.999692916870117, "global_step": 431389, "epoch": 2567} {"train_loss": -11.670700073242188, "global_step": 431390, "epoch": 2567} {"train_loss": -11.254006385803223, "global_step": 431391, "epoch": 2567} {"train_loss": -12.364791870117188, "global_step": 431392, "epoch": 2567} {"train_loss": -11.532876968383789, "global_step": 431393, "epoch": 2567} {"train_loss": -11.773117065429688, "global_step": 431394, "epoch": 2567} {"train_loss": -11.914658546447754, "global_step": 431395, "epoch": 2567} {"train_loss": -11.241351127624512, "global_step": 431396, "epoch": 2567} {"train_loss": -11.57363224029541, "global_step": 431397, "epoch": 2567} {"train_loss": -11.940715789794922, "global_step": 431398, "epoch": 2567} {"train_loss": -11.717266082763672, "global_step": 431399, "epoch": 2567} {"train_loss": -11.822307586669922, "global_step": 431400, "epoch": 2567} {"train_loss": -11.69992446899414, "global_step": 431401, "epoch": 2567} {"train_loss": -11.487592697143555, "global_step": 431402, "epoch": 2567} {"train_loss": -12.250325202941895, "global_step": 431403, "epoch": 2567} {"train_loss": -11.09721851348877, "global_step": 431404, "epoch": 2567} {"train_loss": -12.41047477722168, "global_step": 431405, "epoch": 2567} {"train_loss": -11.91557502746582, "global_step": 431406, "epoch": 2567} {"train_loss": -11.51831340789795, "global_step": 431407, "epoch": 2567} {"train_loss": -12.626171112060547, "global_step": 431408, "epoch": 2567} {"train_loss": -11.55649185180664, "global_step": 431409, "epoch": 2567} {"train_loss": -12.218525886535645, "global_step": 431410, "epoch": 2567} {"train_loss": -12.089061737060547, "global_step": 431411, "epoch": 2567} {"train_loss": -12.300566673278809, "global_step": 431412, "epoch": 2567} {"train_loss": -12.245917320251465, "global_step": 431413, "epoch": 2567} {"train_loss": -12.201839447021484, "global_step": 431414, "epoch": 2567} {"train_loss": -11.776095390319824, "global_step": 431415, "epoch": 2567} {"train_loss": -11.869156837463379, "global_step": 431416, "epoch": 2567} {"train_loss": -12.107513427734375, "global_step": 431417, "epoch": 2567} {"train_loss": -12.165254592895508, "global_step": 431418, "epoch": 2567} {"train_loss": -12.208974838256836, "global_step": 431419, "epoch": 2567} {"train_loss": -12.114068984985352, "global_step": 431420, "epoch": 2567} {"train_loss": -12.261442184448242, "global_step": 431421, "epoch": 2567} {"train_loss": -12.078431129455566, "global_step": 431422, "epoch": 2567} {"train_loss": -12.115666219166346, "global_step": 431423, "epoch": 2567, "val_loss": 312010.71875} {"train_loss": -12.207406997680664, "global_step": 431424, "epoch": 2568} {"train_loss": -12.111434936523438, "global_step": 431425, "epoch": 2568} {"train_loss": -11.202654838562012, "global_step": 431426, "epoch": 2568} {"train_loss": -11.917150497436523, "global_step": 431427, "epoch": 2568} {"train_loss": -11.75985050201416, "global_step": 431428, "epoch": 2568} {"train_loss": -11.327579498291016, "global_step": 431429, "epoch": 2568} {"train_loss": -12.40456771850586, "global_step": 431430, "epoch": 2568} {"train_loss": -11.17788314819336, "global_step": 431431, "epoch": 2568} {"train_loss": -12.227479934692383, "global_step": 431432, "epoch": 2568} {"train_loss": -11.06905746459961, "global_step": 431433, "epoch": 2568} {"train_loss": -12.188030242919922, "global_step": 431434, "epoch": 2568} {"train_loss": -10.893537521362305, "global_step": 431435, "epoch": 2568} {"train_loss": -11.836769104003906, "global_step": 431436, "epoch": 2568} {"train_loss": -11.758323669433594, "global_step": 431437, "epoch": 2568} {"train_loss": -11.791220664978027, "global_step": 431438, "epoch": 2568} {"train_loss": -12.184503555297852, "global_step": 431439, "epoch": 2568} {"train_loss": -11.548059463500977, "global_step": 431440, "epoch": 2568} {"train_loss": -12.198603630065918, "global_step": 431441, "epoch": 2568} {"train_loss": -11.755010604858398, "global_step": 431442, "epoch": 2568} {"train_loss": -11.952062606811523, "global_step": 431443, "epoch": 2568} {"train_loss": -11.231510162353516, "global_step": 431444, "epoch": 2568} {"train_loss": -11.900164604187012, "global_step": 431445, "epoch": 2568} {"train_loss": -11.018763542175293, "global_step": 431446, "epoch": 2568} {"train_loss": -12.332260131835938, "global_step": 431447, "epoch": 2568} {"train_loss": -10.808990478515625, "global_step": 431448, "epoch": 2568} {"train_loss": -12.182392120361328, "global_step": 431449, "epoch": 2568} {"train_loss": -11.337152481079102, "global_step": 431450, "epoch": 2568} {"train_loss": -11.920635223388672, "global_step": 431451, "epoch": 2568} {"train_loss": -11.304008483886719, "global_step": 431452, "epoch": 2568} {"train_loss": -11.497211456298828, "global_step": 431453, "epoch": 2568} {"train_loss": -10.98666763305664, "global_step": 431454, "epoch": 2568} {"train_loss": -11.512198448181152, "global_step": 431455, "epoch": 2568} {"train_loss": -10.798282623291016, "global_step": 431456, "epoch": 2568} {"train_loss": -11.367696762084961, "global_step": 431457, "epoch": 2568} {"train_loss": -10.175060272216797, "global_step": 431458, "epoch": 2568} {"train_loss": -11.863410949707031, "global_step": 431459, "epoch": 2568} {"train_loss": -10.28992748260498, "global_step": 431460, "epoch": 2568} {"train_loss": -11.243399620056152, "global_step": 431461, "epoch": 2568} {"train_loss": -8.577316284179688, "global_step": 431462, "epoch": 2568} {"train_loss": -10.373579978942871, "global_step": 431463, "epoch": 2568} {"train_loss": -9.9745454788208, "global_step": 431464, "epoch": 2568} {"train_loss": -9.906246185302734, "global_step": 431465, "epoch": 2568} {"train_loss": -11.421721458435059, "global_step": 431466, "epoch": 2568} {"train_loss": -10.177469253540039, "global_step": 431467, "epoch": 2568} {"train_loss": -11.57331657409668, "global_step": 431468, "epoch": 2568} {"train_loss": -11.093656539916992, "global_step": 431469, "epoch": 2568} {"train_loss": -11.260393142700195, "global_step": 431470, "epoch": 2568} {"train_loss": -11.11896800994873, "global_step": 431471, "epoch": 2568} {"train_loss": -11.670108795166016, "global_step": 431472, "epoch": 2568} {"train_loss": -11.060288429260254, "global_step": 431473, "epoch": 2568} {"train_loss": -11.141042709350586, "global_step": 431474, "epoch": 2568} {"train_loss": -11.217853546142578, "global_step": 431475, "epoch": 2568} {"train_loss": -11.171284675598145, "global_step": 431476, "epoch": 2568} {"train_loss": -11.745561599731445, "global_step": 431477, "epoch": 2568} {"train_loss": -11.34537410736084, "global_step": 431478, "epoch": 2568} {"train_loss": -11.972519874572754, "global_step": 431479, "epoch": 2568} {"train_loss": -11.581024169921875, "global_step": 431480, "epoch": 2568} {"train_loss": -11.768452644348145, "global_step": 431481, "epoch": 2568} {"train_loss": -11.627263069152832, "global_step": 431482, "epoch": 2568} {"train_loss": -11.90467643737793, "global_step": 431483, "epoch": 2568} {"train_loss": -11.877318382263184, "global_step": 431484, "epoch": 2568} {"train_loss": -11.544955253601074, "global_step": 431485, "epoch": 2568} {"train_loss": -12.110957145690918, "global_step": 431486, "epoch": 2568} {"train_loss": -11.819439888000488, "global_step": 431487, "epoch": 2568} {"train_loss": -12.2117919921875, "global_step": 431488, "epoch": 2568} {"train_loss": -11.944315910339355, "global_step": 431489, "epoch": 2568} {"train_loss": -12.357952117919922, "global_step": 431490, "epoch": 2568} {"train_loss": -11.930010795593262, "global_step": 431491, "epoch": 2568} {"train_loss": -12.203617095947266, "global_step": 431492, "epoch": 2568} {"train_loss": -12.287302017211914, "global_step": 431493, "epoch": 2568} {"train_loss": -12.17728328704834, "global_step": 431494, "epoch": 2568} {"train_loss": -11.832207679748535, "global_step": 431495, "epoch": 2568} {"train_loss": -12.241743087768555, "global_step": 431496, "epoch": 2568} {"train_loss": -11.828847885131836, "global_step": 431497, "epoch": 2568} {"train_loss": -12.413389205932617, "global_step": 431498, "epoch": 2568} {"train_loss": -12.14542293548584, "global_step": 431499, "epoch": 2568} {"train_loss": -12.25855541229248, "global_step": 431500, "epoch": 2568} {"train_loss": -12.142881393432617, "global_step": 431501, "epoch": 2568} {"train_loss": -12.477927207946777, "global_step": 431502, "epoch": 2568} {"train_loss": -12.141582489013672, "global_step": 431503, "epoch": 2568} {"train_loss": -12.365851402282715, "global_step": 431504, "epoch": 2568} {"train_loss": -12.08331298828125, "global_step": 431505, "epoch": 2568} {"train_loss": -12.384185791015625, "global_step": 431506, "epoch": 2568} {"train_loss": -12.313480377197266, "global_step": 431507, "epoch": 2568} {"train_loss": -12.462501525878906, "global_step": 431508, "epoch": 2568} {"train_loss": -12.705778121948242, "global_step": 431509, "epoch": 2568} {"train_loss": -12.341531753540039, "global_step": 431510, "epoch": 2568} {"train_loss": -12.543642044067383, "global_step": 431511, "epoch": 2568} {"train_loss": -12.266899108886719, "global_step": 431512, "epoch": 2568} {"train_loss": -12.470603942871094, "global_step": 431513, "epoch": 2568} {"train_loss": -12.544820785522461, "global_step": 431514, "epoch": 2568} {"train_loss": -12.43865966796875, "global_step": 431515, "epoch": 2568} {"train_loss": -12.602313995361328, "global_step": 431516, "epoch": 2568} {"train_loss": -12.498974800109863, "global_step": 431517, "epoch": 2568} {"train_loss": -12.464184761047363, "global_step": 431518, "epoch": 2568} {"train_loss": -12.492966651916504, "global_step": 431519, "epoch": 2568} {"train_loss": -12.497685432434082, "global_step": 431520, "epoch": 2568} {"train_loss": -12.504697799682617, "global_step": 431521, "epoch": 2568} {"train_loss": -12.628786087036133, "global_step": 431522, "epoch": 2568} {"train_loss": -12.392500877380371, "global_step": 431523, "epoch": 2568} {"train_loss": -12.718170166015625, "global_step": 431524, "epoch": 2568} {"train_loss": -12.55385971069336, "global_step": 431525, "epoch": 2568} {"train_loss": -12.472421646118164, "global_step": 431526, "epoch": 2568} {"train_loss": -12.615606307983398, "global_step": 431527, "epoch": 2568} {"train_loss": -12.621406555175781, "global_step": 431528, "epoch": 2568} {"train_loss": -12.728087425231934, "global_step": 431529, "epoch": 2568} {"train_loss": -12.649805068969727, "global_step": 431530, "epoch": 2568} {"train_loss": -12.584796905517578, "global_step": 431531, "epoch": 2568} {"train_loss": -12.662689208984375, "global_step": 431532, "epoch": 2568} {"train_loss": -12.875205993652344, "global_step": 431533, "epoch": 2568} {"train_loss": -12.719847679138184, "global_step": 431534, "epoch": 2568} {"train_loss": -12.66202163696289, "global_step": 431535, "epoch": 2568} {"train_loss": -12.653587341308594, "global_step": 431536, "epoch": 2568} {"train_loss": -12.698614120483398, "global_step": 431537, "epoch": 2568} {"train_loss": -12.610864639282227, "global_step": 431538, "epoch": 2568} {"train_loss": -12.585143089294434, "global_step": 431539, "epoch": 2568} {"train_loss": -12.633647918701172, "global_step": 431540, "epoch": 2568} {"train_loss": -12.637142181396484, "global_step": 431541, "epoch": 2568} {"train_loss": -12.752745628356934, "global_step": 431542, "epoch": 2568} {"train_loss": -12.738025665283203, "global_step": 431543, "epoch": 2568} {"train_loss": -12.74007797241211, "global_step": 431544, "epoch": 2568} {"train_loss": -12.641337394714355, "global_step": 431545, "epoch": 2568} {"train_loss": -12.725776672363281, "global_step": 431546, "epoch": 2568} {"train_loss": -12.821294784545898, "global_step": 431547, "epoch": 2568} {"train_loss": -12.809146881103516, "global_step": 431548, "epoch": 2568} {"train_loss": -12.886634826660156, "global_step": 431549, "epoch": 2568} {"train_loss": -12.667305946350098, "global_step": 431550, "epoch": 2568} {"train_loss": -12.584525108337402, "global_step": 431551, "epoch": 2568} {"train_loss": -12.685009002685547, "global_step": 431552, "epoch": 2568} {"train_loss": -12.723331451416016, "global_step": 431553, "epoch": 2568} {"train_loss": -12.686805725097656, "global_step": 431554, "epoch": 2568} {"train_loss": -12.532058715820312, "global_step": 431555, "epoch": 2568} {"train_loss": -12.828681945800781, "global_step": 431556, "epoch": 2568} {"train_loss": -12.346071243286133, "global_step": 431557, "epoch": 2568} {"train_loss": -12.28944206237793, "global_step": 431558, "epoch": 2568} {"train_loss": -12.459970474243164, "global_step": 431559, "epoch": 2568} {"train_loss": -12.275010108947754, "global_step": 431560, "epoch": 2568} {"train_loss": -12.208666801452637, "global_step": 431561, "epoch": 2568} {"train_loss": -12.74875259399414, "global_step": 431562, "epoch": 2568} {"train_loss": -12.669097900390625, "global_step": 431563, "epoch": 2568} {"train_loss": -12.840843200683594, "global_step": 431564, "epoch": 2568} {"train_loss": -12.639715194702148, "global_step": 431565, "epoch": 2568} {"train_loss": -12.718910217285156, "global_step": 431566, "epoch": 2568} {"train_loss": -12.644984245300293, "global_step": 431567, "epoch": 2568} {"train_loss": -12.372554779052734, "global_step": 431568, "epoch": 2568} {"train_loss": -12.241218566894531, "global_step": 431569, "epoch": 2568} {"train_loss": -12.764524459838867, "global_step": 431570, "epoch": 2568} {"train_loss": -12.433069229125977, "global_step": 431571, "epoch": 2568} {"train_loss": -12.443538665771484, "global_step": 431572, "epoch": 2568} {"train_loss": -12.799705505371094, "global_step": 431573, "epoch": 2568} {"train_loss": -12.52785873413086, "global_step": 431574, "epoch": 2568} {"train_loss": -12.500165939331055, "global_step": 431575, "epoch": 2568} {"train_loss": -12.456964492797852, "global_step": 431576, "epoch": 2568} {"train_loss": -12.694260597229004, "global_step": 431577, "epoch": 2568} {"train_loss": -12.531137466430664, "global_step": 431578, "epoch": 2568} {"train_loss": -12.699394226074219, "global_step": 431579, "epoch": 2568} {"train_loss": -12.365541458129883, "global_step": 431580, "epoch": 2568} {"train_loss": -12.735593795776367, "global_step": 431581, "epoch": 2568} {"train_loss": -12.355539321899414, "global_step": 431582, "epoch": 2568} {"train_loss": -12.443831443786621, "global_step": 431583, "epoch": 2568} {"train_loss": -12.3421630859375, "global_step": 431584, "epoch": 2568} {"train_loss": -12.764932632446289, "global_step": 431585, "epoch": 2568} {"train_loss": -12.747089385986328, "global_step": 431586, "epoch": 2568} {"train_loss": -12.950874328613281, "global_step": 431587, "epoch": 2568} {"train_loss": -12.775165557861328, "global_step": 431588, "epoch": 2568} {"train_loss": -12.78365421295166, "global_step": 431589, "epoch": 2568} {"train_loss": -12.458412170410156, "global_step": 431590, "epoch": 2568} {"train_loss": -12.094875630878267, "global_step": 431591, "epoch": 2568, "val_loss": 311590.375} {"train_loss": -12.450909614562988, "global_step": 431592, "epoch": 2569} {"train_loss": -12.007406234741211, "global_step": 431593, "epoch": 2569} {"train_loss": -12.017200469970703, "global_step": 431594, "epoch": 2569} {"train_loss": -12.282747268676758, "global_step": 431595, "epoch": 2569} {"train_loss": -12.440839767456055, "global_step": 431596, "epoch": 2569} {"train_loss": -12.37728500366211, "global_step": 431597, "epoch": 2569} {"train_loss": -12.176156997680664, "global_step": 431598, "epoch": 2569} {"train_loss": -12.475353240966797, "global_step": 431599, "epoch": 2569} {"train_loss": -12.113604545593262, "global_step": 431600, "epoch": 2569} {"train_loss": -12.480965614318848, "global_step": 431601, "epoch": 2569} {"train_loss": -12.191712379455566, "global_step": 431602, "epoch": 2569} {"train_loss": -12.738788604736328, "global_step": 431603, "epoch": 2569} {"train_loss": -11.846953392028809, "global_step": 431604, "epoch": 2569} {"train_loss": -10.807914733886719, "global_step": 431605, "epoch": 2569} {"train_loss": -11.744771957397461, "global_step": 431606, "epoch": 2569} {"train_loss": -11.543207168579102, "global_step": 431607, "epoch": 2569} {"train_loss": -10.99588394165039, "global_step": 431608, "epoch": 2569} {"train_loss": -9.898602485656738, "global_step": 431609, "epoch": 2569} {"train_loss": -11.499429702758789, "global_step": 431610, "epoch": 2569} {"train_loss": -10.540108680725098, "global_step": 431611, "epoch": 2569} {"train_loss": -10.393243789672852, "global_step": 431612, "epoch": 2569} {"train_loss": -11.065829277038574, "global_step": 431613, "epoch": 2569} {"train_loss": -10.34272575378418, "global_step": 431614, "epoch": 2569} {"train_loss": -12.090967178344727, "global_step": 431615, "epoch": 2569} {"train_loss": -11.163372039794922, "global_step": 431616, "epoch": 2569} {"train_loss": -11.437816619873047, "global_step": 431617, "epoch": 2569} {"train_loss": -10.551677703857422, "global_step": 431618, "epoch": 2569} {"train_loss": -11.946101188659668, "global_step": 431619, "epoch": 2569} {"train_loss": -10.752141952514648, "global_step": 431620, "epoch": 2569} {"train_loss": -10.34889030456543, "global_step": 431621, "epoch": 2569} {"train_loss": -11.166122436523438, "global_step": 431622, "epoch": 2569} {"train_loss": -10.029956817626953, "global_step": 431623, "epoch": 2569} {"train_loss": -9.831119537353516, "global_step": 431624, "epoch": 2569} {"train_loss": -11.371635437011719, "global_step": 431625, "epoch": 2569} {"train_loss": -9.394122123718262, "global_step": 431626, "epoch": 2569} {"train_loss": -10.26797103881836, "global_step": 431627, "epoch": 2569} {"train_loss": -10.913930892944336, "global_step": 431628, "epoch": 2569} {"train_loss": -10.245098114013672, "global_step": 431629, "epoch": 2569} {"train_loss": -11.31700325012207, "global_step": 431630, "epoch": 2569} {"train_loss": -11.002779960632324, "global_step": 431631, "epoch": 2569} {"train_loss": -11.268747329711914, "global_step": 431632, "epoch": 2569} {"train_loss": -11.357789993286133, "global_step": 431633, "epoch": 2569} {"train_loss": -11.775716781616211, "global_step": 431634, "epoch": 2569} {"train_loss": -11.28629207611084, "global_step": 431635, "epoch": 2569} {"train_loss": -11.672479629516602, "global_step": 431636, "epoch": 2569} {"train_loss": -11.62485122680664, "global_step": 431637, "epoch": 2569} {"train_loss": -11.815149307250977, "global_step": 431638, "epoch": 2569} {"train_loss": -11.892805099487305, "global_step": 431639, "epoch": 2569} {"train_loss": -12.325818061828613, "global_step": 431640, "epoch": 2569} {"train_loss": -11.337409973144531, "global_step": 431641, "epoch": 2569} {"train_loss": -12.33059024810791, "global_step": 431642, "epoch": 2569} {"train_loss": -11.801534652709961, "global_step": 431643, "epoch": 2569} {"train_loss": -11.598400115966797, "global_step": 431644, "epoch": 2569} {"train_loss": -11.628448486328125, "global_step": 431645, "epoch": 2569} {"train_loss": -11.800796508789062, "global_step": 431646, "epoch": 2569} {"train_loss": -12.159549713134766, "global_step": 431647, "epoch": 2569} {"train_loss": -11.753189086914062, "global_step": 431648, "epoch": 2569} {"train_loss": -12.111074447631836, "global_step": 431649, "epoch": 2569} {"train_loss": -11.791448593139648, "global_step": 431650, "epoch": 2569} {"train_loss": -12.277767181396484, "global_step": 431651, "epoch": 2569} {"train_loss": -12.134979248046875, "global_step": 431652, "epoch": 2569} {"train_loss": -12.540282249450684, "global_step": 431653, "epoch": 2569} {"train_loss": -12.431472778320312, "global_step": 431654, "epoch": 2569} {"train_loss": -12.181290626525879, "global_step": 431655, "epoch": 2569} {"train_loss": -12.391397476196289, "global_step": 431656, "epoch": 2569} {"train_loss": -12.192230224609375, "global_step": 431657, "epoch": 2569} {"train_loss": -12.326339721679688, "global_step": 431658, "epoch": 2569} {"train_loss": -12.434805870056152, "global_step": 431659, "epoch": 2569} {"train_loss": -12.475335121154785, "global_step": 431660, "epoch": 2569} {"train_loss": -12.21102237701416, "global_step": 431661, "epoch": 2569} {"train_loss": -12.362335205078125, "global_step": 431662, "epoch": 2569} {"train_loss": -12.420154571533203, "global_step": 431663, "epoch": 2569} {"train_loss": -12.650944709777832, "global_step": 431664, "epoch": 2569} {"train_loss": -12.236003875732422, "global_step": 431665, "epoch": 2569} {"train_loss": -12.440132141113281, "global_step": 431666, "epoch": 2569} {"train_loss": -12.461711883544922, "global_step": 431667, "epoch": 2569} {"train_loss": -12.472728729248047, "global_step": 431668, "epoch": 2569} {"train_loss": -12.352280616760254, "global_step": 431669, "epoch": 2569} {"train_loss": -12.420886039733887, "global_step": 431670, "epoch": 2569} {"train_loss": -12.711824417114258, "global_step": 431671, "epoch": 2569} {"train_loss": -12.630616188049316, "global_step": 431672, "epoch": 2569} {"train_loss": -12.419088363647461, "global_step": 431673, "epoch": 2569} {"train_loss": -12.221571922302246, "global_step": 431674, "epoch": 2569} {"train_loss": -12.595561981201172, "global_step": 431675, "epoch": 2569} {"train_loss": -12.654218673706055, "global_step": 431676, "epoch": 2569} {"train_loss": -12.479616165161133, "global_step": 431677, "epoch": 2569} {"train_loss": -12.466094970703125, "global_step": 431678, "epoch": 2569} {"train_loss": -12.64848804473877, "global_step": 431679, "epoch": 2569} {"train_loss": -12.426950454711914, "global_step": 431680, "epoch": 2569} {"train_loss": -12.46774673461914, "global_step": 431681, "epoch": 2569} {"train_loss": -12.65762710571289, "global_step": 431682, "epoch": 2569} {"train_loss": -12.497411727905273, "global_step": 431683, "epoch": 2569} {"train_loss": -12.705133438110352, "global_step": 431684, "epoch": 2569} {"train_loss": -12.541788101196289, "global_step": 431685, "epoch": 2569} {"train_loss": -12.680416107177734, "global_step": 431686, "epoch": 2569} {"train_loss": -12.789167404174805, "global_step": 431687, "epoch": 2569} {"train_loss": -12.568531036376953, "global_step": 431688, "epoch": 2569} {"train_loss": -12.72035026550293, "global_step": 431689, "epoch": 2569} {"train_loss": -12.563576698303223, "global_step": 431690, "epoch": 2569} {"train_loss": -12.450878143310547, "global_step": 431691, "epoch": 2569} {"train_loss": -12.609397888183594, "global_step": 431692, "epoch": 2569} {"train_loss": -12.582294464111328, "global_step": 431693, "epoch": 2569} {"train_loss": -12.816764831542969, "global_step": 431694, "epoch": 2569} {"train_loss": -12.817636489868164, "global_step": 431695, "epoch": 2569} {"train_loss": -12.530563354492188, "global_step": 431696, "epoch": 2569} {"train_loss": -12.720870971679688, "global_step": 431697, "epoch": 2569} {"train_loss": -12.88888931274414, "global_step": 431698, "epoch": 2569} {"train_loss": -12.792609214782715, "global_step": 431699, "epoch": 2569} {"train_loss": -12.855863571166992, "global_step": 431700, "epoch": 2569} {"train_loss": -12.85820198059082, "global_step": 431701, "epoch": 2569} {"train_loss": -12.775209426879883, "global_step": 431702, "epoch": 2569} {"train_loss": -12.747089385986328, "global_step": 431703, "epoch": 2569} {"train_loss": -12.922865867614746, "global_step": 431704, "epoch": 2569} {"train_loss": -13.10489273071289, "global_step": 431705, "epoch": 2569} {"train_loss": -12.971498489379883, "global_step": 431706, "epoch": 2569} {"train_loss": -12.778722763061523, "global_step": 431707, "epoch": 2569} {"train_loss": -12.917088508605957, "global_step": 431708, "epoch": 2569} {"train_loss": -12.694925308227539, "global_step": 431709, "epoch": 2569} {"train_loss": -12.712425231933594, "global_step": 431710, "epoch": 2569} {"train_loss": -12.541711807250977, "global_step": 431711, "epoch": 2569} {"train_loss": -12.773999214172363, "global_step": 431712, "epoch": 2569} {"train_loss": -12.861324310302734, "global_step": 431713, "epoch": 2569} {"train_loss": -12.867218017578125, "global_step": 431714, "epoch": 2569} {"train_loss": -12.89204216003418, "global_step": 431715, "epoch": 2569} {"train_loss": -13.120828628540039, "global_step": 431716, "epoch": 2569} {"train_loss": -13.024601936340332, "global_step": 431717, "epoch": 2569} {"train_loss": -12.786176681518555, "global_step": 431718, "epoch": 2569} {"train_loss": -12.981430053710938, "global_step": 431719, "epoch": 2569} {"train_loss": -12.926267623901367, "global_step": 431720, "epoch": 2569} {"train_loss": -12.819345474243164, "global_step": 431721, "epoch": 2569} {"train_loss": -12.821401596069336, "global_step": 431722, "epoch": 2569} {"train_loss": -12.85075569152832, "global_step": 431723, "epoch": 2569} {"train_loss": -12.795543670654297, "global_step": 431724, "epoch": 2569} {"train_loss": -12.800970077514648, "global_step": 431725, "epoch": 2569} {"train_loss": -12.874896049499512, "global_step": 431726, "epoch": 2569} {"train_loss": -12.996844291687012, "global_step": 431727, "epoch": 2569} {"train_loss": -12.709074020385742, "global_step": 431728, "epoch": 2569} {"train_loss": -12.562509536743164, "global_step": 431729, "epoch": 2569} {"train_loss": -12.96180534362793, "global_step": 431730, "epoch": 2569} {"train_loss": -12.400035858154297, "global_step": 431731, "epoch": 2569} {"train_loss": -12.202560424804688, "global_step": 431732, "epoch": 2569} {"train_loss": -12.552431106567383, "global_step": 431733, "epoch": 2569} {"train_loss": -12.78843879699707, "global_step": 431734, "epoch": 2569} {"train_loss": -12.514997482299805, "global_step": 431735, "epoch": 2569} {"train_loss": -12.228296279907227, "global_step": 431736, "epoch": 2569} {"train_loss": -12.697935104370117, "global_step": 431737, "epoch": 2569} {"train_loss": -12.662659645080566, "global_step": 431738, "epoch": 2569} {"train_loss": -12.733575820922852, "global_step": 431739, "epoch": 2569} {"train_loss": -12.778634071350098, "global_step": 431740, "epoch": 2569} {"train_loss": -12.651153564453125, "global_step": 431741, "epoch": 2569} {"train_loss": -12.538068771362305, "global_step": 431742, "epoch": 2569} {"train_loss": -10.707741737365723, "global_step": 431743, "epoch": 2569} {"train_loss": -10.474655151367188, "global_step": 431744, "epoch": 2569} {"train_loss": -10.674103736877441, "global_step": 431745, "epoch": 2569} {"train_loss": -10.91598892211914, "global_step": 431746, "epoch": 2569} {"train_loss": -11.274866104125977, "global_step": 431747, "epoch": 2569} {"train_loss": -11.105287551879883, "global_step": 431748, "epoch": 2569} {"train_loss": -9.42845344543457, "global_step": 431749, "epoch": 2569} {"train_loss": -9.801054000854492, "global_step": 431750, "epoch": 2569} {"train_loss": -9.024518966674805, "global_step": 431751, "epoch": 2569} {"train_loss": -8.811342239379883, "global_step": 431752, "epoch": 2569} {"train_loss": -9.536192893981934, "global_step": 431753, "epoch": 2569} {"train_loss": -10.336380958557129, "global_step": 431754, "epoch": 2569} {"train_loss": -9.251346588134766, "global_step": 431755, "epoch": 2569} {"train_loss": -8.906837463378906, "global_step": 431756, "epoch": 2569} {"train_loss": -8.13957691192627, "global_step": 431757, "epoch": 2569} {"train_loss": -9.66273307800293, "global_step": 431758, "epoch": 2569} {"train_loss": -11.936412447974796, "global_step": 431759, "epoch": 2569, "val_loss": 310017.5625} {"train_loss": -9.713891983032227, "global_step": 431760, "epoch": 2570} {"train_loss": -10.151206970214844, "global_step": 431761, "epoch": 2570} {"train_loss": -10.250165939331055, "global_step": 431762, "epoch": 2570} {"train_loss": -11.085405349731445, "global_step": 431763, "epoch": 2570} {"train_loss": -10.442848205566406, "global_step": 431764, "epoch": 2570} {"train_loss": -11.512693405151367, "global_step": 431765, "epoch": 2570} {"train_loss": -11.545785903930664, "global_step": 431766, "epoch": 2570} {"train_loss": -10.633480072021484, "global_step": 431767, "epoch": 2570} {"train_loss": -10.606707572937012, "global_step": 431768, "epoch": 2570} {"train_loss": -11.381936073303223, "global_step": 431769, "epoch": 2570} {"train_loss": -11.954425811767578, "global_step": 431770, "epoch": 2570} {"train_loss": -11.413213729858398, "global_step": 431771, "epoch": 2570} {"train_loss": -11.728962898254395, "global_step": 431772, "epoch": 2570} {"train_loss": -11.463932037353516, "global_step": 431773, "epoch": 2570} {"train_loss": -11.834132194519043, "global_step": 431774, "epoch": 2570} {"train_loss": -11.389558792114258, "global_step": 431775, "epoch": 2570} {"train_loss": -12.158407211303711, "global_step": 431776, "epoch": 2570} {"train_loss": -11.829842567443848, "global_step": 431777, "epoch": 2570} {"train_loss": -11.623432159423828, "global_step": 431778, "epoch": 2570} {"train_loss": -11.72881031036377, "global_step": 431779, "epoch": 2570} {"train_loss": -11.65666389465332, "global_step": 431780, "epoch": 2570} {"train_loss": -12.232869148254395, "global_step": 431781, "epoch": 2570} {"train_loss": -11.968033790588379, "global_step": 431782, "epoch": 2570} {"train_loss": -12.23362922668457, "global_step": 431783, "epoch": 2570} {"train_loss": -12.114806175231934, "global_step": 431784, "epoch": 2570} {"train_loss": -12.195629119873047, "global_step": 431785, "epoch": 2570} {"train_loss": -12.226629257202148, "global_step": 431786, "epoch": 2570} {"train_loss": -12.372901916503906, "global_step": 431787, "epoch": 2570} {"train_loss": -12.074079513549805, "global_step": 431788, "epoch": 2570} {"train_loss": -12.52065658569336, "global_step": 431789, "epoch": 2570} {"train_loss": -12.339607238769531, "global_step": 431790, "epoch": 2570} {"train_loss": -12.222004890441895, "global_step": 431791, "epoch": 2570} {"train_loss": -12.491019248962402, "global_step": 431792, "epoch": 2570} {"train_loss": -12.387945175170898, "global_step": 431793, "epoch": 2570} {"train_loss": -12.269670486450195, "global_step": 431794, "epoch": 2570} {"train_loss": -12.367391586303711, "global_step": 431795, "epoch": 2570} {"train_loss": -12.333361625671387, "global_step": 431796, "epoch": 2570} {"train_loss": -12.366780281066895, "global_step": 431797, "epoch": 2570} {"train_loss": -12.364873886108398, "global_step": 431798, "epoch": 2570} {"train_loss": -12.52727222442627, "global_step": 431799, "epoch": 2570} {"train_loss": -12.536169052124023, "global_step": 431800, "epoch": 2570} {"train_loss": -12.635579109191895, "global_step": 431801, "epoch": 2570} {"train_loss": -12.621429443359375, "global_step": 431802, "epoch": 2570} {"train_loss": -12.413334846496582, "global_step": 431803, "epoch": 2570} {"train_loss": -12.476781845092773, "global_step": 431804, "epoch": 2570} {"train_loss": -12.373603820800781, "global_step": 431805, "epoch": 2570} {"train_loss": -12.56646728515625, "global_step": 431806, "epoch": 2570} {"train_loss": -12.168821334838867, "global_step": 431807, "epoch": 2570} {"train_loss": -12.6199369430542, "global_step": 431808, "epoch": 2570} {"train_loss": -12.547922134399414, "global_step": 431809, "epoch": 2570} {"train_loss": -12.40328598022461, "global_step": 431810, "epoch": 2570} {"train_loss": -12.34695816040039, "global_step": 431811, "epoch": 2570} {"train_loss": -12.501794815063477, "global_step": 431812, "epoch": 2570} {"train_loss": -12.104701042175293, "global_step": 431813, "epoch": 2570} {"train_loss": -12.440299987792969, "global_step": 431814, "epoch": 2570} {"train_loss": -11.894624710083008, "global_step": 431815, "epoch": 2570} {"train_loss": -11.575958251953125, "global_step": 431816, "epoch": 2570} {"train_loss": -12.330326080322266, "global_step": 431817, "epoch": 2570} {"train_loss": -12.284154891967773, "global_step": 431818, "epoch": 2570} {"train_loss": -12.25672721862793, "global_step": 431819, "epoch": 2570} {"train_loss": -12.405174255371094, "global_step": 431820, "epoch": 2570} {"train_loss": -12.340446472167969, "global_step": 431821, "epoch": 2570} {"train_loss": -12.207698822021484, "global_step": 431822, "epoch": 2570} {"train_loss": -12.504812240600586, "global_step": 431823, "epoch": 2570} {"train_loss": -12.146707534790039, "global_step": 431824, "epoch": 2570} {"train_loss": -12.39293098449707, "global_step": 431825, "epoch": 2570} {"train_loss": -12.711065292358398, "global_step": 431826, "epoch": 2570} {"train_loss": -12.317256927490234, "global_step": 431827, "epoch": 2570} {"train_loss": -12.534366607666016, "global_step": 431828, "epoch": 2570} {"train_loss": -12.433091163635254, "global_step": 431829, "epoch": 2570} {"train_loss": -12.389392852783203, "global_step": 431830, "epoch": 2570} {"train_loss": -12.03171157836914, "global_step": 431831, "epoch": 2570} {"train_loss": -12.08445930480957, "global_step": 431832, "epoch": 2570} {"train_loss": -12.465080261230469, "global_step": 431833, "epoch": 2570} {"train_loss": -11.54692268371582, "global_step": 431834, "epoch": 2570} {"train_loss": -12.186362266540527, "global_step": 431835, "epoch": 2570} {"train_loss": -11.410444259643555, "global_step": 431836, "epoch": 2570} {"train_loss": -11.506246566772461, "global_step": 431837, "epoch": 2570} {"train_loss": -12.105432510375977, "global_step": 431838, "epoch": 2570} {"train_loss": -11.807842254638672, "global_step": 431839, "epoch": 2570} {"train_loss": -12.355331420898438, "global_step": 431840, "epoch": 2570} {"train_loss": -11.606761932373047, "global_step": 431841, "epoch": 2570} {"train_loss": -12.305925369262695, "global_step": 431842, "epoch": 2570} {"train_loss": -11.994439125061035, "global_step": 431843, "epoch": 2570} {"train_loss": -11.841400146484375, "global_step": 431844, "epoch": 2570} {"train_loss": -12.146145820617676, "global_step": 431845, "epoch": 2570} {"train_loss": -12.32856559753418, "global_step": 431846, "epoch": 2570} {"train_loss": -12.480127334594727, "global_step": 431847, "epoch": 2570} {"train_loss": -11.922185897827148, "global_step": 431848, "epoch": 2570} {"train_loss": -12.513420104980469, "global_step": 431849, "epoch": 2570} {"train_loss": -11.641033172607422, "global_step": 431850, "epoch": 2570} {"train_loss": -11.258808135986328, "global_step": 431851, "epoch": 2570} {"train_loss": -11.543011665344238, "global_step": 431852, "epoch": 2570} {"train_loss": -10.840049743652344, "global_step": 431853, "epoch": 2570} {"train_loss": -11.181666374206543, "global_step": 431854, "epoch": 2570} {"train_loss": -11.598114013671875, "global_step": 431855, "epoch": 2570} {"train_loss": -11.77806282043457, "global_step": 431856, "epoch": 2570} {"train_loss": -11.936403274536133, "global_step": 431857, "epoch": 2570} {"train_loss": -11.63833236694336, "global_step": 431858, "epoch": 2570} {"train_loss": -12.253194808959961, "global_step": 431859, "epoch": 2570} {"train_loss": -12.094950675964355, "global_step": 431860, "epoch": 2570} {"train_loss": -11.734094619750977, "global_step": 431861, "epoch": 2570} {"train_loss": -11.486133575439453, "global_step": 431862, "epoch": 2570} {"train_loss": -12.592296600341797, "global_step": 431863, "epoch": 2570} {"train_loss": -11.649757385253906, "global_step": 431864, "epoch": 2570} {"train_loss": -12.08666706085205, "global_step": 431865, "epoch": 2570} {"train_loss": -11.584676742553711, "global_step": 431866, "epoch": 2570} {"train_loss": -11.530008316040039, "global_step": 431867, "epoch": 2570} {"train_loss": -11.250189781188965, "global_step": 431868, "epoch": 2570} {"train_loss": -10.985616683959961, "global_step": 431869, "epoch": 2570} {"train_loss": -11.022052764892578, "global_step": 431870, "epoch": 2570} {"train_loss": -11.515653610229492, "global_step": 431871, "epoch": 2570} {"train_loss": -10.994709014892578, "global_step": 431872, "epoch": 2570} {"train_loss": -11.49447250366211, "global_step": 431873, "epoch": 2570} {"train_loss": -11.754009246826172, "global_step": 431874, "epoch": 2570} {"train_loss": -11.867671012878418, "global_step": 431875, "epoch": 2570} {"train_loss": -11.77849006652832, "global_step": 431876, "epoch": 2570} {"train_loss": -12.209973335266113, "global_step": 431877, "epoch": 2570} {"train_loss": -11.733963966369629, "global_step": 431878, "epoch": 2570} {"train_loss": -12.157517433166504, "global_step": 431879, "epoch": 2570} {"train_loss": -12.004526138305664, "global_step": 431880, "epoch": 2570} {"train_loss": -11.971670150756836, "global_step": 431881, "epoch": 2570} {"train_loss": -11.81259536743164, "global_step": 431882, "epoch": 2570} {"train_loss": -12.034460067749023, "global_step": 431883, "epoch": 2570} {"train_loss": -12.272154808044434, "global_step": 431884, "epoch": 2570} {"train_loss": -12.500617980957031, "global_step": 431885, "epoch": 2570} {"train_loss": -12.208334922790527, "global_step": 431886, "epoch": 2570} {"train_loss": -12.021976470947266, "global_step": 431887, "epoch": 2570} {"train_loss": -12.613983154296875, "global_step": 431888, "epoch": 2570} {"train_loss": -12.318500518798828, "global_step": 431889, "epoch": 2570} {"train_loss": -12.41368293762207, "global_step": 431890, "epoch": 2570} {"train_loss": -12.32931900024414, "global_step": 431891, "epoch": 2570} {"train_loss": -12.214120864868164, "global_step": 431892, "epoch": 2570} {"train_loss": -12.610356330871582, "global_step": 431893, "epoch": 2570} {"train_loss": -11.744852066040039, "global_step": 431894, "epoch": 2570} {"train_loss": -12.604630470275879, "global_step": 431895, "epoch": 2570} {"train_loss": -12.422538757324219, "global_step": 431896, "epoch": 2570} {"train_loss": -12.45875358581543, "global_step": 431897, "epoch": 2570} {"train_loss": -12.686046600341797, "global_step": 431898, "epoch": 2570} {"train_loss": -12.445822715759277, "global_step": 431899, "epoch": 2570} {"train_loss": -12.257771492004395, "global_step": 431900, "epoch": 2570} {"train_loss": -12.42497444152832, "global_step": 431901, "epoch": 2570} {"train_loss": -12.52714729309082, "global_step": 431902, "epoch": 2570} {"train_loss": -12.65505599975586, "global_step": 431903, "epoch": 2570} {"train_loss": -12.5388822555542, "global_step": 431904, "epoch": 2570} {"train_loss": -12.437705993652344, "global_step": 431905, "epoch": 2570} {"train_loss": -12.725317001342773, "global_step": 431906, "epoch": 2570} {"train_loss": -12.258312225341797, "global_step": 431907, "epoch": 2570} {"train_loss": -12.518699645996094, "global_step": 431908, "epoch": 2570} {"train_loss": -12.788313865661621, "global_step": 431909, "epoch": 2570} {"train_loss": -12.645550727844238, "global_step": 431910, "epoch": 2570} {"train_loss": -12.641881942749023, "global_step": 431911, "epoch": 2570} {"train_loss": -12.583380699157715, "global_step": 431912, "epoch": 2570} {"train_loss": -12.646892547607422, "global_step": 431913, "epoch": 2570} {"train_loss": -12.566226959228516, "global_step": 431914, "epoch": 2570} {"train_loss": -12.869104385375977, "global_step": 431915, "epoch": 2570} {"train_loss": -12.76986312866211, "global_step": 431916, "epoch": 2570} {"train_loss": -12.487207412719727, "global_step": 431917, "epoch": 2570} {"train_loss": -12.705463409423828, "global_step": 431918, "epoch": 2570} {"train_loss": -12.63604736328125, "global_step": 431919, "epoch": 2570} {"train_loss": -12.405723571777344, "global_step": 431920, "epoch": 2570} {"train_loss": -12.615238189697266, "global_step": 431921, "epoch": 2570} {"train_loss": -12.593836784362793, "global_step": 431922, "epoch": 2570} {"train_loss": -12.789466857910156, "global_step": 431923, "epoch": 2570} {"train_loss": -12.589892387390137, "global_step": 431924, "epoch": 2570} {"train_loss": -12.537810325622559, "global_step": 431925, "epoch": 2570} {"train_loss": -12.254374504089355, "global_step": 431926, "epoch": 2570} {"train_loss": -12.07604840255919, "global_step": 431927, "epoch": 2570, "val_loss": 312571.84375, "train_action_mse_error": 0.25192001461982727} {"train_loss": -12.066137313842773, "global_step": 431928, "epoch": 2571} {"train_loss": -11.658008575439453, "global_step": 431929, "epoch": 2571} {"train_loss": -11.988414764404297, "global_step": 431930, "epoch": 2571} {"train_loss": -11.683576583862305, "global_step": 431931, "epoch": 2571} {"train_loss": -10.090317726135254, "global_step": 431932, "epoch": 2571} {"train_loss": -12.548521041870117, "global_step": 431933, "epoch": 2571} {"train_loss": -10.856668472290039, "global_step": 431934, "epoch": 2571} {"train_loss": -11.466924667358398, "global_step": 431935, "epoch": 2571} {"train_loss": -12.208076477050781, "global_step": 431936, "epoch": 2571} {"train_loss": -10.907249450683594, "global_step": 431937, "epoch": 2571} {"train_loss": -9.49628734588623, "global_step": 431938, "epoch": 2571} {"train_loss": -11.139629364013672, "global_step": 431939, "epoch": 2571} {"train_loss": -9.069025039672852, "global_step": 431940, "epoch": 2571} {"train_loss": -9.646125793457031, "global_step": 431941, "epoch": 2571} {"train_loss": -9.945438385009766, "global_step": 431942, "epoch": 2571} {"train_loss": -9.168558120727539, "global_step": 431943, "epoch": 2571} {"train_loss": -9.339933395385742, "global_step": 431944, "epoch": 2571} {"train_loss": -8.971480369567871, "global_step": 431945, "epoch": 2571} {"train_loss": -9.391892433166504, "global_step": 431946, "epoch": 2571} {"train_loss": -10.07165813446045, "global_step": 431947, "epoch": 2571} {"train_loss": -10.833215713500977, "global_step": 431948, "epoch": 2571} {"train_loss": -9.36350154876709, "global_step": 431949, "epoch": 2571} {"train_loss": -10.020513534545898, "global_step": 431950, "epoch": 2571} {"train_loss": -10.437616348266602, "global_step": 431951, "epoch": 2571} {"train_loss": -10.642187118530273, "global_step": 431952, "epoch": 2571} {"train_loss": -10.312826156616211, "global_step": 431953, "epoch": 2571} {"train_loss": -10.699941635131836, "global_step": 431954, "epoch": 2571} {"train_loss": -11.19814395904541, "global_step": 431955, "epoch": 2571} {"train_loss": -10.755086898803711, "global_step": 431956, "epoch": 2571} {"train_loss": -11.073362350463867, "global_step": 431957, "epoch": 2571} {"train_loss": -12.057060241699219, "global_step": 431958, "epoch": 2571} {"train_loss": -11.188817977905273, "global_step": 431959, "epoch": 2571} {"train_loss": -11.694371223449707, "global_step": 431960, "epoch": 2571} {"train_loss": -11.586113929748535, "global_step": 431961, "epoch": 2571} {"train_loss": -11.60713005065918, "global_step": 431962, "epoch": 2571} {"train_loss": -11.634469985961914, "global_step": 431963, "epoch": 2571} {"train_loss": -11.672532081604004, "global_step": 431964, "epoch": 2571} {"train_loss": -11.715349197387695, "global_step": 431965, "epoch": 2571} {"train_loss": -11.733955383300781, "global_step": 431966, "epoch": 2571} {"train_loss": -11.605025291442871, "global_step": 431967, "epoch": 2571} {"train_loss": -11.737556457519531, "global_step": 431968, "epoch": 2571} {"train_loss": -11.798662185668945, "global_step": 431969, "epoch": 2571} {"train_loss": -11.455677032470703, "global_step": 431970, "epoch": 2571} {"train_loss": -12.095880508422852, "global_step": 431971, "epoch": 2571} {"train_loss": -11.512554168701172, "global_step": 431972, "epoch": 2571} {"train_loss": -12.266766548156738, "global_step": 431973, "epoch": 2571} {"train_loss": -12.085930824279785, "global_step": 431974, "epoch": 2571} {"train_loss": -11.893531799316406, "global_step": 431975, "epoch": 2571} {"train_loss": -12.310014724731445, "global_step": 431976, "epoch": 2571} {"train_loss": -11.884124755859375, "global_step": 431977, "epoch": 2571} {"train_loss": -12.562252044677734, "global_step": 431978, "epoch": 2571} {"train_loss": -11.764348030090332, "global_step": 431979, "epoch": 2571} {"train_loss": -12.566329002380371, "global_step": 431980, "epoch": 2571} {"train_loss": -12.404926300048828, "global_step": 431981, "epoch": 2571} {"train_loss": -12.405437469482422, "global_step": 431982, "epoch": 2571} {"train_loss": -12.347173690795898, "global_step": 431983, "epoch": 2571} {"train_loss": -12.315595626831055, "global_step": 431984, "epoch": 2571} {"train_loss": -12.520105361938477, "global_step": 431985, "epoch": 2571} {"train_loss": -12.563909530639648, "global_step": 431986, "epoch": 2571} {"train_loss": -12.50263500213623, "global_step": 431987, "epoch": 2571} {"train_loss": -12.379083633422852, "global_step": 431988, "epoch": 2571} {"train_loss": -12.507402420043945, "global_step": 431989, "epoch": 2571} {"train_loss": -12.613422393798828, "global_step": 431990, "epoch": 2571} {"train_loss": -12.66195297241211, "global_step": 431991, "epoch": 2571} {"train_loss": -12.533093452453613, "global_step": 431992, "epoch": 2571} {"train_loss": -12.474569320678711, "global_step": 431993, "epoch": 2571} {"train_loss": -12.81069278717041, "global_step": 431994, "epoch": 2571} {"train_loss": -12.501279830932617, "global_step": 431995, "epoch": 2571} {"train_loss": -12.794666290283203, "global_step": 431996, "epoch": 2571} {"train_loss": -12.664609909057617, "global_step": 431997, "epoch": 2571} {"train_loss": -12.561505317687988, "global_step": 431998, "epoch": 2571} {"train_loss": -12.497036933898926, "global_step": 431999, "epoch": 2571} {"train_loss": -12.45287799835205, "global_step": 432000, "epoch": 2571} {"train_loss": -12.480624198913574, "global_step": 432001, "epoch": 2571} {"train_loss": -12.664571762084961, "global_step": 432002, "epoch": 2571} {"train_loss": -12.793063163757324, "global_step": 432003, "epoch": 2571} {"train_loss": -12.638136863708496, "global_step": 432004, "epoch": 2571} {"train_loss": -12.78908920288086, "global_step": 432005, "epoch": 2571} {"train_loss": -12.724727630615234, "global_step": 432006, "epoch": 2571} {"train_loss": -12.731103897094727, "global_step": 432007, "epoch": 2571} {"train_loss": -12.849335670471191, "global_step": 432008, "epoch": 2571} {"train_loss": -12.59255599975586, "global_step": 432009, "epoch": 2571} {"train_loss": -12.703634262084961, "global_step": 432010, "epoch": 2571} {"train_loss": -12.663351058959961, "global_step": 432011, "epoch": 2571} {"train_loss": -12.713968276977539, "global_step": 432012, "epoch": 2571} {"train_loss": -12.56224250793457, "global_step": 432013, "epoch": 2571} {"train_loss": -12.619874954223633, "global_step": 432014, "epoch": 2571} {"train_loss": -12.668375015258789, "global_step": 432015, "epoch": 2571} {"train_loss": -12.780447006225586, "global_step": 432016, "epoch": 2571} {"train_loss": -12.399618148803711, "global_step": 432017, "epoch": 2571} {"train_loss": -12.507381439208984, "global_step": 432018, "epoch": 2571} {"train_loss": -12.630105018615723, "global_step": 432019, "epoch": 2571} {"train_loss": -12.42607307434082, "global_step": 432020, "epoch": 2571} {"train_loss": -12.685722351074219, "global_step": 432021, "epoch": 2571} {"train_loss": -12.421857833862305, "global_step": 432022, "epoch": 2571} {"train_loss": -12.074814796447754, "global_step": 432023, "epoch": 2571} {"train_loss": -12.60886001586914, "global_step": 432024, "epoch": 2571} {"train_loss": -12.128435134887695, "global_step": 432025, "epoch": 2571} {"train_loss": -12.397529602050781, "global_step": 432026, "epoch": 2571} {"train_loss": -12.560794830322266, "global_step": 432027, "epoch": 2571} {"train_loss": -12.338787078857422, "global_step": 432028, "epoch": 2571} {"train_loss": -12.339042663574219, "global_step": 432029, "epoch": 2571} {"train_loss": -12.343324661254883, "global_step": 432030, "epoch": 2571} {"train_loss": -11.91152286529541, "global_step": 432031, "epoch": 2571} {"train_loss": -11.920611381530762, "global_step": 432032, "epoch": 2571} {"train_loss": -11.621339797973633, "global_step": 432033, "epoch": 2571} {"train_loss": -12.313005447387695, "global_step": 432034, "epoch": 2571} {"train_loss": -12.021738052368164, "global_step": 432035, "epoch": 2571} {"train_loss": -11.891550064086914, "global_step": 432036, "epoch": 2571} {"train_loss": -12.108190536499023, "global_step": 432037, "epoch": 2571} {"train_loss": -11.73076343536377, "global_step": 432038, "epoch": 2571} {"train_loss": -12.170595169067383, "global_step": 432039, "epoch": 2571} {"train_loss": -12.454463958740234, "global_step": 432040, "epoch": 2571} {"train_loss": -11.989383697509766, "global_step": 432041, "epoch": 2571} {"train_loss": -12.297382354736328, "global_step": 432042, "epoch": 2571} {"train_loss": -12.3672513961792, "global_step": 432043, "epoch": 2571} {"train_loss": -11.786625862121582, "global_step": 432044, "epoch": 2571} {"train_loss": -12.012137413024902, "global_step": 432045, "epoch": 2571} {"train_loss": -12.311147689819336, "global_step": 432046, "epoch": 2571} {"train_loss": -11.646121978759766, "global_step": 432047, "epoch": 2571} {"train_loss": -12.479549407958984, "global_step": 432048, "epoch": 2571} {"train_loss": -12.232309341430664, "global_step": 432049, "epoch": 2571} {"train_loss": -11.864555358886719, "global_step": 432050, "epoch": 2571} {"train_loss": -12.409826278686523, "global_step": 432051, "epoch": 2571} {"train_loss": -12.432388305664062, "global_step": 432052, "epoch": 2571} {"train_loss": -11.812271118164062, "global_step": 432053, "epoch": 2571} {"train_loss": -12.405895233154297, "global_step": 432054, "epoch": 2571} {"train_loss": -12.662306785583496, "global_step": 432055, "epoch": 2571} {"train_loss": -12.121973037719727, "global_step": 432056, "epoch": 2571} {"train_loss": -12.294562339782715, "global_step": 432057, "epoch": 2571} {"train_loss": -12.306529998779297, "global_step": 432058, "epoch": 2571} {"train_loss": -12.281944274902344, "global_step": 432059, "epoch": 2571} {"train_loss": -12.385393142700195, "global_step": 432060, "epoch": 2571} {"train_loss": -11.754124641418457, "global_step": 432061, "epoch": 2571} {"train_loss": -12.414549827575684, "global_step": 432062, "epoch": 2571} {"train_loss": -11.731992721557617, "global_step": 432063, "epoch": 2571} {"train_loss": -12.024420738220215, "global_step": 432064, "epoch": 2571} {"train_loss": -12.149759292602539, "global_step": 432065, "epoch": 2571} {"train_loss": -12.115732192993164, "global_step": 432066, "epoch": 2571} {"train_loss": -12.55467700958252, "global_step": 432067, "epoch": 2571} {"train_loss": -11.982359886169434, "global_step": 432068, "epoch": 2571} {"train_loss": -12.17056941986084, "global_step": 432069, "epoch": 2571} {"train_loss": -12.263557434082031, "global_step": 432070, "epoch": 2571} {"train_loss": -11.758443832397461, "global_step": 432071, "epoch": 2571} {"train_loss": -11.770652770996094, "global_step": 432072, "epoch": 2571} {"train_loss": -11.710258483886719, "global_step": 432073, "epoch": 2571} {"train_loss": -10.661855697631836, "global_step": 432074, "epoch": 2571} {"train_loss": -12.200902938842773, "global_step": 432075, "epoch": 2571} {"train_loss": -10.219799041748047, "global_step": 432076, "epoch": 2571} {"train_loss": -12.146105766296387, "global_step": 432077, "epoch": 2571} {"train_loss": -10.795918464660645, "global_step": 432078, "epoch": 2571} {"train_loss": -10.674395561218262, "global_step": 432079, "epoch": 2571} {"train_loss": -11.53888988494873, "global_step": 432080, "epoch": 2571} {"train_loss": -10.30820083618164, "global_step": 432081, "epoch": 2571} {"train_loss": -10.273674011230469, "global_step": 432082, "epoch": 2571} {"train_loss": -10.308306694030762, "global_step": 432083, "epoch": 2571} {"train_loss": -10.020477294921875, "global_step": 432084, "epoch": 2571} {"train_loss": -10.855751037597656, "global_step": 432085, "epoch": 2571} {"train_loss": -11.24593734741211, "global_step": 432086, "epoch": 2571} {"train_loss": -11.68947982788086, "global_step": 432087, "epoch": 2571} {"train_loss": -10.905204772949219, "global_step": 432088, "epoch": 2571} {"train_loss": -11.861525535583496, "global_step": 432089, "epoch": 2571} {"train_loss": -11.424205780029297, "global_step": 432090, "epoch": 2571} {"train_loss": -11.984969139099121, "global_step": 432091, "epoch": 2571} {"train_loss": -11.729499816894531, "global_step": 432092, "epoch": 2571} {"train_loss": -12.027496337890625, "global_step": 432093, "epoch": 2571} {"train_loss": -12.061820983886719, "global_step": 432094, "epoch": 2571} {"train_loss": -11.810853203137716, "global_step": 432095, "epoch": 2571, "val_loss": 309919.5} {"train_loss": -11.770469665527344, "global_step": 432096, "epoch": 2572} {"train_loss": -11.696592330932617, "global_step": 432097, "epoch": 2572} {"train_loss": -11.972354888916016, "global_step": 432098, "epoch": 2572} {"train_loss": -12.117298126220703, "global_step": 432099, "epoch": 2572} {"train_loss": -12.047407150268555, "global_step": 432100, "epoch": 2572} {"train_loss": -11.568148612976074, "global_step": 432101, "epoch": 2572} {"train_loss": -11.428726196289062, "global_step": 432102, "epoch": 2572} {"train_loss": -11.898502349853516, "global_step": 432103, "epoch": 2572} {"train_loss": -11.353738784790039, "global_step": 432104, "epoch": 2572} {"train_loss": -12.449868202209473, "global_step": 432105, "epoch": 2572} {"train_loss": -10.999139785766602, "global_step": 432106, "epoch": 2572} {"train_loss": -11.770484924316406, "global_step": 432107, "epoch": 2572} {"train_loss": -11.708322525024414, "global_step": 432108, "epoch": 2572} {"train_loss": -12.232908248901367, "global_step": 432109, "epoch": 2572} {"train_loss": -11.674728393554688, "global_step": 432110, "epoch": 2572} {"train_loss": -12.207889556884766, "global_step": 432111, "epoch": 2572} {"train_loss": -11.622488975524902, "global_step": 432112, "epoch": 2572} {"train_loss": -12.33903694152832, "global_step": 432113, "epoch": 2572} {"train_loss": -12.003277778625488, "global_step": 432114, "epoch": 2572} {"train_loss": -12.034076690673828, "global_step": 432115, "epoch": 2572} {"train_loss": -11.899778366088867, "global_step": 432116, "epoch": 2572} {"train_loss": -11.742140769958496, "global_step": 432117, "epoch": 2572} {"train_loss": -12.241462707519531, "global_step": 432118, "epoch": 2572} {"train_loss": -12.056268692016602, "global_step": 432119, "epoch": 2572} {"train_loss": -12.19951057434082, "global_step": 432120, "epoch": 2572} {"train_loss": -12.03842830657959, "global_step": 432121, "epoch": 2572} {"train_loss": -11.996007919311523, "global_step": 432122, "epoch": 2572} {"train_loss": -11.835304260253906, "global_step": 432123, "epoch": 2572} {"train_loss": -11.951152801513672, "global_step": 432124, "epoch": 2572} {"train_loss": -12.388385772705078, "global_step": 432125, "epoch": 2572} {"train_loss": -11.90790843963623, "global_step": 432126, "epoch": 2572} {"train_loss": -12.442607879638672, "global_step": 432127, "epoch": 2572} {"train_loss": -11.754816055297852, "global_step": 432128, "epoch": 2572} {"train_loss": -12.092844009399414, "global_step": 432129, "epoch": 2572} {"train_loss": -12.255304336547852, "global_step": 432130, "epoch": 2572} {"train_loss": -12.385144233703613, "global_step": 432131, "epoch": 2572} {"train_loss": -12.564714431762695, "global_step": 432132, "epoch": 2572} {"train_loss": -12.203546524047852, "global_step": 432133, "epoch": 2572} {"train_loss": -12.580638885498047, "global_step": 432134, "epoch": 2572} {"train_loss": -12.30263900756836, "global_step": 432135, "epoch": 2572} {"train_loss": -12.36168098449707, "global_step": 432136, "epoch": 2572} {"train_loss": -12.471220016479492, "global_step": 432137, "epoch": 2572} {"train_loss": -12.216008186340332, "global_step": 432138, "epoch": 2572} {"train_loss": -12.633811950683594, "global_step": 432139, "epoch": 2572} {"train_loss": -12.292379379272461, "global_step": 432140, "epoch": 2572} {"train_loss": -12.345985412597656, "global_step": 432141, "epoch": 2572} {"train_loss": -12.366336822509766, "global_step": 432142, "epoch": 2572} {"train_loss": -12.654434204101562, "global_step": 432143, "epoch": 2572} {"train_loss": -12.471113204956055, "global_step": 432144, "epoch": 2572} {"train_loss": -12.580233573913574, "global_step": 432145, "epoch": 2572} {"train_loss": -12.499417304992676, "global_step": 432146, "epoch": 2572} {"train_loss": -12.351810455322266, "global_step": 432147, "epoch": 2572} {"train_loss": -12.636174201965332, "global_step": 432148, "epoch": 2572} {"train_loss": -12.360105514526367, "global_step": 432149, "epoch": 2572} {"train_loss": -12.5037841796875, "global_step": 432150, "epoch": 2572} {"train_loss": -12.11543083190918, "global_step": 432151, "epoch": 2572} {"train_loss": -12.481758117675781, "global_step": 432152, "epoch": 2572} {"train_loss": -12.365762710571289, "global_step": 432153, "epoch": 2572} {"train_loss": -12.699702262878418, "global_step": 432154, "epoch": 2572} {"train_loss": -12.356806755065918, "global_step": 432155, "epoch": 2572} {"train_loss": -12.706137657165527, "global_step": 432156, "epoch": 2572} {"train_loss": -12.701688766479492, "global_step": 432157, "epoch": 2572} {"train_loss": -12.520326614379883, "global_step": 432158, "epoch": 2572} {"train_loss": -12.6988525390625, "global_step": 432159, "epoch": 2572} {"train_loss": -12.573927879333496, "global_step": 432160, "epoch": 2572} {"train_loss": -12.539619445800781, "global_step": 432161, "epoch": 2572} {"train_loss": -12.387594223022461, "global_step": 432162, "epoch": 2572} {"train_loss": -12.609325408935547, "global_step": 432163, "epoch": 2572} {"train_loss": -12.727001190185547, "global_step": 432164, "epoch": 2572} {"train_loss": -12.565046310424805, "global_step": 432165, "epoch": 2572} {"train_loss": -12.673346519470215, "global_step": 432166, "epoch": 2572} {"train_loss": -12.604028701782227, "global_step": 432167, "epoch": 2572} {"train_loss": -12.595044136047363, "global_step": 432168, "epoch": 2572} {"train_loss": -12.739047050476074, "global_step": 432169, "epoch": 2572} {"train_loss": -12.663320541381836, "global_step": 432170, "epoch": 2572} {"train_loss": -12.614813804626465, "global_step": 432171, "epoch": 2572} {"train_loss": -12.348943710327148, "global_step": 432172, "epoch": 2572} {"train_loss": -12.894458770751953, "global_step": 432173, "epoch": 2572} {"train_loss": -12.908522605895996, "global_step": 432174, "epoch": 2572} {"train_loss": -12.676309585571289, "global_step": 432175, "epoch": 2572} {"train_loss": -12.908182144165039, "global_step": 432176, "epoch": 2572} {"train_loss": -12.750391006469727, "global_step": 432177, "epoch": 2572} {"train_loss": -12.783252716064453, "global_step": 432178, "epoch": 2572} {"train_loss": -12.927754402160645, "global_step": 432179, "epoch": 2572} {"train_loss": -12.700541496276855, "global_step": 432180, "epoch": 2572} {"train_loss": -12.760050773620605, "global_step": 432181, "epoch": 2572} {"train_loss": -12.791921615600586, "global_step": 432182, "epoch": 2572} {"train_loss": -12.687808990478516, "global_step": 432183, "epoch": 2572} {"train_loss": -12.5284423828125, "global_step": 432184, "epoch": 2572} {"train_loss": -12.754098892211914, "global_step": 432185, "epoch": 2572} {"train_loss": -12.776529312133789, "global_step": 432186, "epoch": 2572} {"train_loss": -12.59860897064209, "global_step": 432187, "epoch": 2572} {"train_loss": -12.206250190734863, "global_step": 432188, "epoch": 2572} {"train_loss": -12.293510437011719, "global_step": 432189, "epoch": 2572} {"train_loss": -12.565147399902344, "global_step": 432190, "epoch": 2572} {"train_loss": -12.247640609741211, "global_step": 432191, "epoch": 2572} {"train_loss": -11.926048278808594, "global_step": 432192, "epoch": 2572} {"train_loss": -12.771442413330078, "global_step": 432193, "epoch": 2572} {"train_loss": -11.98415470123291, "global_step": 432194, "epoch": 2572} {"train_loss": -11.634767532348633, "global_step": 432195, "epoch": 2572} {"train_loss": -12.301982879638672, "global_step": 432196, "epoch": 2572} {"train_loss": -12.47119426727295, "global_step": 432197, "epoch": 2572} {"train_loss": -12.130464553833008, "global_step": 432198, "epoch": 2572} {"train_loss": -12.307807922363281, "global_step": 432199, "epoch": 2572} {"train_loss": -12.097681045532227, "global_step": 432200, "epoch": 2572} {"train_loss": -11.753395080566406, "global_step": 432201, "epoch": 2572} {"train_loss": -12.304779052734375, "global_step": 432202, "epoch": 2572} {"train_loss": -12.267868041992188, "global_step": 432203, "epoch": 2572} {"train_loss": -12.337181091308594, "global_step": 432204, "epoch": 2572} {"train_loss": -12.173398971557617, "global_step": 432205, "epoch": 2572} {"train_loss": -12.03277587890625, "global_step": 432206, "epoch": 2572} {"train_loss": -12.461709022521973, "global_step": 432207, "epoch": 2572} {"train_loss": -12.067035675048828, "global_step": 432208, "epoch": 2572} {"train_loss": -12.19131851196289, "global_step": 432209, "epoch": 2572} {"train_loss": -11.741893768310547, "global_step": 432210, "epoch": 2572} {"train_loss": -12.248161315917969, "global_step": 432211, "epoch": 2572} {"train_loss": -12.038856506347656, "global_step": 432212, "epoch": 2572} {"train_loss": -12.131853103637695, "global_step": 432213, "epoch": 2572} {"train_loss": -12.785503387451172, "global_step": 432214, "epoch": 2572} {"train_loss": -12.038412094116211, "global_step": 432215, "epoch": 2572} {"train_loss": -12.703767776489258, "global_step": 432216, "epoch": 2572} {"train_loss": -12.086322784423828, "global_step": 432217, "epoch": 2572} {"train_loss": -12.17679214477539, "global_step": 432218, "epoch": 2572} {"train_loss": -12.300869941711426, "global_step": 432219, "epoch": 2572} {"train_loss": -12.540424346923828, "global_step": 432220, "epoch": 2572} {"train_loss": -12.669078826904297, "global_step": 432221, "epoch": 2572} {"train_loss": -12.073901176452637, "global_step": 432222, "epoch": 2572} {"train_loss": -12.328058242797852, "global_step": 432223, "epoch": 2572} {"train_loss": -12.041008949279785, "global_step": 432224, "epoch": 2572} {"train_loss": -12.508395195007324, "global_step": 432225, "epoch": 2572} {"train_loss": -10.714417457580566, "global_step": 432226, "epoch": 2572} {"train_loss": -12.13542366027832, "global_step": 432227, "epoch": 2572} {"train_loss": -11.262561798095703, "global_step": 432228, "epoch": 2572} {"train_loss": -10.19377613067627, "global_step": 432229, "epoch": 2572} {"train_loss": -11.217180252075195, "global_step": 432230, "epoch": 2572} {"train_loss": -11.104053497314453, "global_step": 432231, "epoch": 2572} {"train_loss": -11.818275451660156, "global_step": 432232, "epoch": 2572} {"train_loss": -11.188724517822266, "global_step": 432233, "epoch": 2572} {"train_loss": -9.640583038330078, "global_step": 432234, "epoch": 2572} {"train_loss": -11.888473510742188, "global_step": 432235, "epoch": 2572} {"train_loss": -9.450727462768555, "global_step": 432236, "epoch": 2572} {"train_loss": -11.47176456451416, "global_step": 432237, "epoch": 2572} {"train_loss": -9.482196807861328, "global_step": 432238, "epoch": 2572} {"train_loss": -10.871262550354004, "global_step": 432239, "epoch": 2572} {"train_loss": -10.511314392089844, "global_step": 432240, "epoch": 2572} {"train_loss": -10.7021484375, "global_step": 432241, "epoch": 2572} {"train_loss": -10.975811958312988, "global_step": 432242, "epoch": 2572} {"train_loss": -10.993267059326172, "global_step": 432243, "epoch": 2572} {"train_loss": -9.484029769897461, "global_step": 432244, "epoch": 2572} {"train_loss": -10.986766815185547, "global_step": 432245, "epoch": 2572} {"train_loss": -10.469806671142578, "global_step": 432246, "epoch": 2572} {"train_loss": -9.724435806274414, "global_step": 432247, "epoch": 2572} {"train_loss": -11.176475524902344, "global_step": 432248, "epoch": 2572} {"train_loss": -10.769576072692871, "global_step": 432249, "epoch": 2572} {"train_loss": -11.783031463623047, "global_step": 432250, "epoch": 2572} {"train_loss": -11.925889015197754, "global_step": 432251, "epoch": 2572} {"train_loss": -11.390029907226562, "global_step": 432252, "epoch": 2572} {"train_loss": -11.011449813842773, "global_step": 432253, "epoch": 2572} {"train_loss": -11.734477996826172, "global_step": 432254, "epoch": 2572} {"train_loss": -11.419929504394531, "global_step": 432255, "epoch": 2572} {"train_loss": -12.034834861755371, "global_step": 432256, "epoch": 2572} {"train_loss": -10.888925552368164, "global_step": 432257, "epoch": 2572} {"train_loss": -11.593605041503906, "global_step": 432258, "epoch": 2572} {"train_loss": -11.651411056518555, "global_step": 432259, "epoch": 2572} {"train_loss": -11.893656730651855, "global_step": 432260, "epoch": 2572} {"train_loss": -11.903234481811523, "global_step": 432261, "epoch": 2572} {"train_loss": -12.030054092407227, "global_step": 432262, "epoch": 2572} {"train_loss": -12.026267023313613, "global_step": 432263, "epoch": 2572, "val_loss": 311459.0625} {"train_loss": -11.970701217651367, "global_step": 432264, "epoch": 2573} {"train_loss": -11.855413436889648, "global_step": 432265, "epoch": 2573} {"train_loss": -11.946880340576172, "global_step": 432266, "epoch": 2573} {"train_loss": -11.855146408081055, "global_step": 432267, "epoch": 2573} {"train_loss": -11.553096771240234, "global_step": 432268, "epoch": 2573} {"train_loss": -11.896984100341797, "global_step": 432269, "epoch": 2573} {"train_loss": -11.877511978149414, "global_step": 432270, "epoch": 2573} {"train_loss": -11.791731834411621, "global_step": 432271, "epoch": 2573} {"train_loss": -12.176300048828125, "global_step": 432272, "epoch": 2573} {"train_loss": -11.59739875793457, "global_step": 432273, "epoch": 2573} {"train_loss": -12.286439895629883, "global_step": 432274, "epoch": 2573} {"train_loss": -11.634432792663574, "global_step": 432275, "epoch": 2573} {"train_loss": -12.045600891113281, "global_step": 432276, "epoch": 2573} {"train_loss": -11.671306610107422, "global_step": 432277, "epoch": 2573} {"train_loss": -12.005659103393555, "global_step": 432278, "epoch": 2573} {"train_loss": -12.115988731384277, "global_step": 432279, "epoch": 2573} {"train_loss": -12.062873840332031, "global_step": 432280, "epoch": 2573} {"train_loss": -12.160633087158203, "global_step": 432281, "epoch": 2573} {"train_loss": -12.35378646850586, "global_step": 432282, "epoch": 2573} {"train_loss": -11.948934555053711, "global_step": 432283, "epoch": 2573} {"train_loss": -12.068531036376953, "global_step": 432284, "epoch": 2573} {"train_loss": -12.266088485717773, "global_step": 432285, "epoch": 2573} {"train_loss": -11.616226196289062, "global_step": 432286, "epoch": 2573} {"train_loss": -12.212800025939941, "global_step": 432287, "epoch": 2573} {"train_loss": -11.618748664855957, "global_step": 432288, "epoch": 2573} {"train_loss": -12.355596542358398, "global_step": 432289, "epoch": 2573} {"train_loss": -11.831298828125, "global_step": 432290, "epoch": 2573} {"train_loss": -12.093644142150879, "global_step": 432291, "epoch": 2573} {"train_loss": -11.968029975891113, "global_step": 432292, "epoch": 2573} {"train_loss": -12.326862335205078, "global_step": 432293, "epoch": 2573} {"train_loss": -12.16690444946289, "global_step": 432294, "epoch": 2573} {"train_loss": -12.27275276184082, "global_step": 432295, "epoch": 2573} {"train_loss": -12.349748611450195, "global_step": 432296, "epoch": 2573} {"train_loss": -12.302956581115723, "global_step": 432297, "epoch": 2573} {"train_loss": -12.468101501464844, "global_step": 432298, "epoch": 2573} {"train_loss": -12.299919128417969, "global_step": 432299, "epoch": 2573} {"train_loss": -12.51636791229248, "global_step": 432300, "epoch": 2573} {"train_loss": -12.045063018798828, "global_step": 432301, "epoch": 2573} {"train_loss": -12.3880615234375, "global_step": 432302, "epoch": 2573} {"train_loss": -12.363574981689453, "global_step": 432303, "epoch": 2573} {"train_loss": -12.388439178466797, "global_step": 432304, "epoch": 2573} {"train_loss": -12.34036922454834, "global_step": 432305, "epoch": 2573} {"train_loss": -12.300836563110352, "global_step": 432306, "epoch": 2573} {"train_loss": -12.452051162719727, "global_step": 432307, "epoch": 2573} {"train_loss": -12.553253173828125, "global_step": 432308, "epoch": 2573} {"train_loss": -12.444231033325195, "global_step": 432309, "epoch": 2573} {"train_loss": -12.598308563232422, "global_step": 432310, "epoch": 2573} {"train_loss": -12.265931129455566, "global_step": 432311, "epoch": 2573} {"train_loss": -12.527579307556152, "global_step": 432312, "epoch": 2573} {"train_loss": -12.416573524475098, "global_step": 432313, "epoch": 2573} {"train_loss": -12.512552261352539, "global_step": 432314, "epoch": 2573} {"train_loss": -12.692934036254883, "global_step": 432315, "epoch": 2573} {"train_loss": -12.5262451171875, "global_step": 432316, "epoch": 2573} {"train_loss": -12.721506118774414, "global_step": 432317, "epoch": 2573} {"train_loss": -12.233104705810547, "global_step": 432318, "epoch": 2573} {"train_loss": -12.746776580810547, "global_step": 432319, "epoch": 2573} {"train_loss": -12.447057723999023, "global_step": 432320, "epoch": 2573} {"train_loss": -12.614828109741211, "global_step": 432321, "epoch": 2573} {"train_loss": -12.438945770263672, "global_step": 432322, "epoch": 2573} {"train_loss": -12.536624908447266, "global_step": 432323, "epoch": 2573} {"train_loss": -12.731929779052734, "global_step": 432324, "epoch": 2573} {"train_loss": -12.857830047607422, "global_step": 432325, "epoch": 2573} {"train_loss": -12.713961601257324, "global_step": 432326, "epoch": 2573} {"train_loss": -12.452272415161133, "global_step": 432327, "epoch": 2573} {"train_loss": -12.493341445922852, "global_step": 432328, "epoch": 2573} {"train_loss": -12.898605346679688, "global_step": 432329, "epoch": 2573} {"train_loss": -12.70529556274414, "global_step": 432330, "epoch": 2573} {"train_loss": -12.929838180541992, "global_step": 432331, "epoch": 2573} {"train_loss": -12.771841049194336, "global_step": 432332, "epoch": 2573} {"train_loss": -12.803561210632324, "global_step": 432333, "epoch": 2573} {"train_loss": -12.713846206665039, "global_step": 432334, "epoch": 2573} {"train_loss": -12.525634765625, "global_step": 432335, "epoch": 2573} {"train_loss": -12.639467239379883, "global_step": 432336, "epoch": 2573} {"train_loss": -12.439787864685059, "global_step": 432337, "epoch": 2573} {"train_loss": -12.643328666687012, "global_step": 432338, "epoch": 2573} {"train_loss": -12.59875202178955, "global_step": 432339, "epoch": 2573} {"train_loss": -12.625402450561523, "global_step": 432340, "epoch": 2573} {"train_loss": -12.795120239257812, "global_step": 432341, "epoch": 2573} {"train_loss": -12.526912689208984, "global_step": 432342, "epoch": 2573} {"train_loss": -12.412410736083984, "global_step": 432343, "epoch": 2573} {"train_loss": -12.911815643310547, "global_step": 432344, "epoch": 2573} {"train_loss": -12.259147644042969, "global_step": 432345, "epoch": 2573} {"train_loss": -12.446565628051758, "global_step": 432346, "epoch": 2573} {"train_loss": -12.551252365112305, "global_step": 432347, "epoch": 2573} {"train_loss": -12.126274108886719, "global_step": 432348, "epoch": 2573} {"train_loss": -12.177972793579102, "global_step": 432349, "epoch": 2573} {"train_loss": -12.588541030883789, "global_step": 432350, "epoch": 2573} {"train_loss": -12.216768264770508, "global_step": 432351, "epoch": 2573} {"train_loss": -12.349021911621094, "global_step": 432352, "epoch": 2573} {"train_loss": -12.56364631652832, "global_step": 432353, "epoch": 2573} {"train_loss": -12.567678451538086, "global_step": 432354, "epoch": 2573} {"train_loss": -12.677114486694336, "global_step": 432355, "epoch": 2573} {"train_loss": -12.789473533630371, "global_step": 432356, "epoch": 2573} {"train_loss": -12.628074645996094, "global_step": 432357, "epoch": 2573} {"train_loss": -12.658613204956055, "global_step": 432358, "epoch": 2573} {"train_loss": -12.70046615600586, "global_step": 432359, "epoch": 2573} {"train_loss": -12.658743858337402, "global_step": 432360, "epoch": 2573} {"train_loss": -12.625641822814941, "global_step": 432361, "epoch": 2573} {"train_loss": -12.825926780700684, "global_step": 432362, "epoch": 2573} {"train_loss": -12.589193344116211, "global_step": 432363, "epoch": 2573} {"train_loss": -12.707382202148438, "global_step": 432364, "epoch": 2573} {"train_loss": -12.465721130371094, "global_step": 432365, "epoch": 2573} {"train_loss": -12.627264022827148, "global_step": 432366, "epoch": 2573} {"train_loss": -12.551483154296875, "global_step": 432367, "epoch": 2573} {"train_loss": -12.773212432861328, "global_step": 432368, "epoch": 2573} {"train_loss": -12.856584548950195, "global_step": 432369, "epoch": 2573} {"train_loss": -12.911283493041992, "global_step": 432370, "epoch": 2573} {"train_loss": -12.470495223999023, "global_step": 432371, "epoch": 2573} {"train_loss": -12.9586820602417, "global_step": 432372, "epoch": 2573} {"train_loss": -12.767662048339844, "global_step": 432373, "epoch": 2573} {"train_loss": -12.791452407836914, "global_step": 432374, "epoch": 2573} {"train_loss": -12.753246307373047, "global_step": 432375, "epoch": 2573} {"train_loss": -12.86518669128418, "global_step": 432376, "epoch": 2573} {"train_loss": -12.746621131896973, "global_step": 432377, "epoch": 2573} {"train_loss": -12.495574951171875, "global_step": 432378, "epoch": 2573} {"train_loss": -12.243642807006836, "global_step": 432379, "epoch": 2573} {"train_loss": -12.159822463989258, "global_step": 432380, "epoch": 2573} {"train_loss": -12.78887939453125, "global_step": 432381, "epoch": 2573} {"train_loss": -11.997861862182617, "global_step": 432382, "epoch": 2573} {"train_loss": -12.303106307983398, "global_step": 432383, "epoch": 2573} {"train_loss": -12.213217735290527, "global_step": 432384, "epoch": 2573} {"train_loss": -11.970733642578125, "global_step": 432385, "epoch": 2573} {"train_loss": -12.420406341552734, "global_step": 432386, "epoch": 2573} {"train_loss": -12.806514739990234, "global_step": 432387, "epoch": 2573} {"train_loss": -11.929779052734375, "global_step": 432388, "epoch": 2573} {"train_loss": -11.716684341430664, "global_step": 432389, "epoch": 2573} {"train_loss": -12.603151321411133, "global_step": 432390, "epoch": 2573} {"train_loss": -12.139875411987305, "global_step": 432391, "epoch": 2573} {"train_loss": -11.22170352935791, "global_step": 432392, "epoch": 2573} {"train_loss": -11.826377868652344, "global_step": 432393, "epoch": 2573} {"train_loss": -12.698516845703125, "global_step": 432394, "epoch": 2573} {"train_loss": -11.02448844909668, "global_step": 432395, "epoch": 2573} {"train_loss": -12.454574584960938, "global_step": 432396, "epoch": 2573} {"train_loss": -12.45018196105957, "global_step": 432397, "epoch": 2573} {"train_loss": -12.36555290222168, "global_step": 432398, "epoch": 2573} {"train_loss": -12.192405700683594, "global_step": 432399, "epoch": 2573} {"train_loss": -12.342731475830078, "global_step": 432400, "epoch": 2573} {"train_loss": -12.448990821838379, "global_step": 432401, "epoch": 2573} {"train_loss": -12.15736198425293, "global_step": 432402, "epoch": 2573} {"train_loss": -12.271388053894043, "global_step": 432403, "epoch": 2573} {"train_loss": -12.411558151245117, "global_step": 432404, "epoch": 2573} {"train_loss": -12.253662109375, "global_step": 432405, "epoch": 2573} {"train_loss": -12.515390396118164, "global_step": 432406, "epoch": 2573} {"train_loss": -12.338260650634766, "global_step": 432407, "epoch": 2573} {"train_loss": -12.511685371398926, "global_step": 432408, "epoch": 2573} {"train_loss": -11.836207389831543, "global_step": 432409, "epoch": 2573} {"train_loss": -11.739523887634277, "global_step": 432410, "epoch": 2573} {"train_loss": -12.586006164550781, "global_step": 432411, "epoch": 2573} {"train_loss": -11.822883605957031, "global_step": 432412, "epoch": 2573} {"train_loss": -12.330974578857422, "global_step": 432413, "epoch": 2573} {"train_loss": -12.331339836120605, "global_step": 432414, "epoch": 2573} {"train_loss": -12.550689697265625, "global_step": 432415, "epoch": 2573} {"train_loss": -12.127740859985352, "global_step": 432416, "epoch": 2573} {"train_loss": -12.42001724243164, "global_step": 432417, "epoch": 2573} {"train_loss": -11.588329315185547, "global_step": 432418, "epoch": 2573} {"train_loss": -12.02727222442627, "global_step": 432419, "epoch": 2573} {"train_loss": -12.342594146728516, "global_step": 432420, "epoch": 2573} {"train_loss": -12.165094375610352, "global_step": 432421, "epoch": 2573} {"train_loss": -10.854055404663086, "global_step": 432422, "epoch": 2573} {"train_loss": -11.375741958618164, "global_step": 432423, "epoch": 2573} {"train_loss": -12.011475563049316, "global_step": 432424, "epoch": 2573} {"train_loss": -11.097966194152832, "global_step": 432425, "epoch": 2573} {"train_loss": -10.461723327636719, "global_step": 432426, "epoch": 2573} {"train_loss": -10.25147819519043, "global_step": 432427, "epoch": 2573} {"train_loss": -11.323944091796875, "global_step": 432428, "epoch": 2573} {"train_loss": -9.849162101745605, "global_step": 432429, "epoch": 2573} {"train_loss": -9.195243835449219, "global_step": 432430, "epoch": 2573} {"train_loss": -12.246252116702852, "global_step": 432431, "epoch": 2573, "val_loss": 310834.9375} {"train_loss": -11.002395629882812, "global_step": 432432, "epoch": 2574} {"train_loss": -10.626628875732422, "global_step": 432433, "epoch": 2574} {"train_loss": -9.559219360351562, "global_step": 432434, "epoch": 2574} {"train_loss": -10.095192909240723, "global_step": 432435, "epoch": 2574} {"train_loss": -10.127822875976562, "global_step": 432436, "epoch": 2574} {"train_loss": -10.806960105895996, "global_step": 432437, "epoch": 2574} {"train_loss": -9.940300941467285, "global_step": 432438, "epoch": 2574} {"train_loss": -10.263328552246094, "global_step": 432439, "epoch": 2574} {"train_loss": -11.448171615600586, "global_step": 432440, "epoch": 2574} {"train_loss": -10.854301452636719, "global_step": 432441, "epoch": 2574} {"train_loss": -10.675291061401367, "global_step": 432442, "epoch": 2574} {"train_loss": -11.137618064880371, "global_step": 432443, "epoch": 2574} {"train_loss": -11.430946350097656, "global_step": 432444, "epoch": 2574} {"train_loss": -11.3493013381958, "global_step": 432445, "epoch": 2574} {"train_loss": -11.593920707702637, "global_step": 432446, "epoch": 2574} {"train_loss": -11.904918670654297, "global_step": 432447, "epoch": 2574} {"train_loss": -11.955873489379883, "global_step": 432448, "epoch": 2574} {"train_loss": -11.777365684509277, "global_step": 432449, "epoch": 2574} {"train_loss": -11.93583869934082, "global_step": 432450, "epoch": 2574} {"train_loss": -12.184906005859375, "global_step": 432451, "epoch": 2574} {"train_loss": -12.01405143737793, "global_step": 432452, "epoch": 2574} {"train_loss": -11.704889297485352, "global_step": 432453, "epoch": 2574} {"train_loss": -12.040862083435059, "global_step": 432454, "epoch": 2574} {"train_loss": -11.71548843383789, "global_step": 432455, "epoch": 2574} {"train_loss": -11.822526931762695, "global_step": 432456, "epoch": 2574} {"train_loss": -12.10666275024414, "global_step": 432457, "epoch": 2574} {"train_loss": -12.068016052246094, "global_step": 432458, "epoch": 2574} {"train_loss": -12.189263343811035, "global_step": 432459, "epoch": 2574} {"train_loss": -12.278220176696777, "global_step": 432460, "epoch": 2574} {"train_loss": -12.123190879821777, "global_step": 432461, "epoch": 2574} {"train_loss": -12.072149276733398, "global_step": 432462, "epoch": 2574} {"train_loss": -12.15224838256836, "global_step": 432463, "epoch": 2574} {"train_loss": -12.377625465393066, "global_step": 432464, "epoch": 2574} {"train_loss": -12.461599349975586, "global_step": 432465, "epoch": 2574} {"train_loss": -12.168634414672852, "global_step": 432466, "epoch": 2574} {"train_loss": -12.147666931152344, "global_step": 432467, "epoch": 2574} {"train_loss": -12.160884857177734, "global_step": 432468, "epoch": 2574} {"train_loss": -12.511462211608887, "global_step": 432469, "epoch": 2574} {"train_loss": -12.276472091674805, "global_step": 432470, "epoch": 2574} {"train_loss": -12.285765647888184, "global_step": 432471, "epoch": 2574} {"train_loss": -12.381425857543945, "global_step": 432472, "epoch": 2574} {"train_loss": -12.041658401489258, "global_step": 432473, "epoch": 2574} {"train_loss": -12.481056213378906, "global_step": 432474, "epoch": 2574} {"train_loss": -12.391027450561523, "global_step": 432475, "epoch": 2574} {"train_loss": -12.628921508789062, "global_step": 432476, "epoch": 2574} {"train_loss": -12.342846870422363, "global_step": 432477, "epoch": 2574} {"train_loss": -12.53405475616455, "global_step": 432478, "epoch": 2574} {"train_loss": -12.25308609008789, "global_step": 432479, "epoch": 2574} {"train_loss": -12.508240699768066, "global_step": 432480, "epoch": 2574} {"train_loss": -12.398844718933105, "global_step": 432481, "epoch": 2574} {"train_loss": -12.431854248046875, "global_step": 432482, "epoch": 2574} {"train_loss": -12.489651679992676, "global_step": 432483, "epoch": 2574} {"train_loss": -12.54316234588623, "global_step": 432484, "epoch": 2574} {"train_loss": -12.736837387084961, "global_step": 432485, "epoch": 2574} {"train_loss": -12.118780136108398, "global_step": 432486, "epoch": 2574} {"train_loss": -12.421923637390137, "global_step": 432487, "epoch": 2574} {"train_loss": -12.72385311126709, "global_step": 432488, "epoch": 2574} {"train_loss": -12.616411209106445, "global_step": 432489, "epoch": 2574} {"train_loss": -12.474007606506348, "global_step": 432490, "epoch": 2574} {"train_loss": -12.55893325805664, "global_step": 432491, "epoch": 2574} {"train_loss": -12.772865295410156, "global_step": 432492, "epoch": 2574} {"train_loss": -12.764482498168945, "global_step": 432493, "epoch": 2574} {"train_loss": -12.485438346862793, "global_step": 432494, "epoch": 2574} {"train_loss": -12.475081443786621, "global_step": 432495, "epoch": 2574} {"train_loss": -12.334609985351562, "global_step": 432496, "epoch": 2574} {"train_loss": -12.362091064453125, "global_step": 432497, "epoch": 2574} {"train_loss": -12.424840927124023, "global_step": 432498, "epoch": 2574} {"train_loss": -12.670232772827148, "global_step": 432499, "epoch": 2574} {"train_loss": -12.34598159790039, "global_step": 432500, "epoch": 2574} {"train_loss": -12.561683654785156, "global_step": 432501, "epoch": 2574} {"train_loss": -12.59218978881836, "global_step": 432502, "epoch": 2574} {"train_loss": -12.617477416992188, "global_step": 432503, "epoch": 2574} {"train_loss": -12.86323356628418, "global_step": 432504, "epoch": 2574} {"train_loss": -12.470915794372559, "global_step": 432505, "epoch": 2574} {"train_loss": -12.689460754394531, "global_step": 432506, "epoch": 2574} {"train_loss": -12.603347778320312, "global_step": 432507, "epoch": 2574} {"train_loss": -12.061100006103516, "global_step": 432508, "epoch": 2574} {"train_loss": -12.428732872009277, "global_step": 432509, "epoch": 2574} {"train_loss": -12.152999877929688, "global_step": 432510, "epoch": 2574} {"train_loss": -12.632658958435059, "global_step": 432511, "epoch": 2574} {"train_loss": -12.250482559204102, "global_step": 432512, "epoch": 2574} {"train_loss": -11.810567855834961, "global_step": 432513, "epoch": 2574} {"train_loss": -12.123773574829102, "global_step": 432514, "epoch": 2574} {"train_loss": -12.355700492858887, "global_step": 432515, "epoch": 2574} {"train_loss": -12.227028846740723, "global_step": 432516, "epoch": 2574} {"train_loss": -12.403702735900879, "global_step": 432517, "epoch": 2574} {"train_loss": -11.985321044921875, "global_step": 432518, "epoch": 2574} {"train_loss": -12.299912452697754, "global_step": 432519, "epoch": 2574} {"train_loss": -12.231675148010254, "global_step": 432520, "epoch": 2574} {"train_loss": -12.035669326782227, "global_step": 432521, "epoch": 2574} {"train_loss": -12.428741455078125, "global_step": 432522, "epoch": 2574} {"train_loss": -11.960101127624512, "global_step": 432523, "epoch": 2574} {"train_loss": -12.245857238769531, "global_step": 432524, "epoch": 2574} {"train_loss": -12.215559005737305, "global_step": 432525, "epoch": 2574} {"train_loss": -12.054890632629395, "global_step": 432526, "epoch": 2574} {"train_loss": -11.44137954711914, "global_step": 432527, "epoch": 2574} {"train_loss": -12.301315307617188, "global_step": 432528, "epoch": 2574} {"train_loss": -11.69214916229248, "global_step": 432529, "epoch": 2574} {"train_loss": -11.129172325134277, "global_step": 432530, "epoch": 2574} {"train_loss": -11.99517822265625, "global_step": 432531, "epoch": 2574} {"train_loss": -11.974605560302734, "global_step": 432532, "epoch": 2574} {"train_loss": -10.531268119812012, "global_step": 432533, "epoch": 2574} {"train_loss": -11.22846794128418, "global_step": 432534, "epoch": 2574} {"train_loss": -12.039899826049805, "global_step": 432535, "epoch": 2574} {"train_loss": -11.195416450500488, "global_step": 432536, "epoch": 2574} {"train_loss": -11.236776351928711, "global_step": 432537, "epoch": 2574} {"train_loss": -11.18403148651123, "global_step": 432538, "epoch": 2574} {"train_loss": -10.091879844665527, "global_step": 432539, "epoch": 2574} {"train_loss": -10.358016967773438, "global_step": 432540, "epoch": 2574} {"train_loss": -9.896531105041504, "global_step": 432541, "epoch": 2574} {"train_loss": -11.095699310302734, "global_step": 432542, "epoch": 2574} {"train_loss": -9.220107078552246, "global_step": 432543, "epoch": 2574} {"train_loss": -9.819952011108398, "global_step": 432544, "epoch": 2574} {"train_loss": -8.943686485290527, "global_step": 432545, "epoch": 2574} {"train_loss": -9.671571731567383, "global_step": 432546, "epoch": 2574} {"train_loss": -10.436445236206055, "global_step": 432547, "epoch": 2574} {"train_loss": -9.778754234313965, "global_step": 432548, "epoch": 2574} {"train_loss": -9.550338745117188, "global_step": 432549, "epoch": 2574} {"train_loss": -10.206404685974121, "global_step": 432550, "epoch": 2574} {"train_loss": -10.483100891113281, "global_step": 432551, "epoch": 2574} {"train_loss": -11.785648345947266, "global_step": 432552, "epoch": 2574} {"train_loss": -10.919403076171875, "global_step": 432553, "epoch": 2574} {"train_loss": -10.906859397888184, "global_step": 432554, "epoch": 2574} {"train_loss": -11.146528244018555, "global_step": 432555, "epoch": 2574} {"train_loss": -10.787513732910156, "global_step": 432556, "epoch": 2574} {"train_loss": -10.75973892211914, "global_step": 432557, "epoch": 2574} {"train_loss": -10.080657958984375, "global_step": 432558, "epoch": 2574} {"train_loss": -10.722728729248047, "global_step": 432559, "epoch": 2574} {"train_loss": -9.892239570617676, "global_step": 432560, "epoch": 2574} {"train_loss": -10.759974479675293, "global_step": 432561, "epoch": 2574} {"train_loss": -10.859609603881836, "global_step": 432562, "epoch": 2574} {"train_loss": -11.127643585205078, "global_step": 432563, "epoch": 2574} {"train_loss": -11.091360092163086, "global_step": 432564, "epoch": 2574} {"train_loss": -10.28515625, "global_step": 432565, "epoch": 2574} {"train_loss": -11.378576278686523, "global_step": 432566, "epoch": 2574} {"train_loss": -10.672883987426758, "global_step": 432567, "epoch": 2574} {"train_loss": -9.639325141906738, "global_step": 432568, "epoch": 2574} {"train_loss": -11.05178451538086, "global_step": 432569, "epoch": 2574} {"train_loss": -11.193094253540039, "global_step": 432570, "epoch": 2574} {"train_loss": -10.608539581298828, "global_step": 432571, "epoch": 2574} {"train_loss": -11.160518646240234, "global_step": 432572, "epoch": 2574} {"train_loss": -10.39225959777832, "global_step": 432573, "epoch": 2574} {"train_loss": -10.82268238067627, "global_step": 432574, "epoch": 2574} {"train_loss": -11.486211776733398, "global_step": 432575, "epoch": 2574} {"train_loss": -10.906341552734375, "global_step": 432576, "epoch": 2574} {"train_loss": -11.596216201782227, "global_step": 432577, "epoch": 2574} {"train_loss": -11.453238487243652, "global_step": 432578, "epoch": 2574} {"train_loss": -10.878148078918457, "global_step": 432579, "epoch": 2574} {"train_loss": -10.81037425994873, "global_step": 432580, "epoch": 2574} {"train_loss": -11.343006134033203, "global_step": 432581, "epoch": 2574} {"train_loss": -11.405166625976562, "global_step": 432582, "epoch": 2574} {"train_loss": -11.683938026428223, "global_step": 432583, "epoch": 2574} {"train_loss": -11.700749397277832, "global_step": 432584, "epoch": 2574} {"train_loss": -11.627472877502441, "global_step": 432585, "epoch": 2574} {"train_loss": -11.32717227935791, "global_step": 432586, "epoch": 2574} {"train_loss": -11.860252380371094, "global_step": 432587, "epoch": 2574} {"train_loss": -11.414438247680664, "global_step": 432588, "epoch": 2574} {"train_loss": -11.798158645629883, "global_step": 432589, "epoch": 2574} {"train_loss": -11.594620704650879, "global_step": 432590, "epoch": 2574} {"train_loss": -11.301095962524414, "global_step": 432591, "epoch": 2574} {"train_loss": -11.899609565734863, "global_step": 432592, "epoch": 2574} {"train_loss": -11.797114372253418, "global_step": 432593, "epoch": 2574} {"train_loss": -11.522823333740234, "global_step": 432594, "epoch": 2574} {"train_loss": -11.879761695861816, "global_step": 432595, "epoch": 2574} {"train_loss": -11.661970138549805, "global_step": 432596, "epoch": 2574} {"train_loss": -11.689630508422852, "global_step": 432597, "epoch": 2574} {"train_loss": -12.225440979003906, "global_step": 432598, "epoch": 2574} {"train_loss": -11.60648573012579, "global_step": 432599, "epoch": 2574, "val_loss": 310829.03125} {"train_loss": -11.941994667053223, "global_step": 432600, "epoch": 2575} {"train_loss": -12.195265769958496, "global_step": 432601, "epoch": 2575} {"train_loss": -11.750550270080566, "global_step": 432602, "epoch": 2575} {"train_loss": -11.819503784179688, "global_step": 432603, "epoch": 2575} {"train_loss": -12.041476249694824, "global_step": 432604, "epoch": 2575} {"train_loss": -11.99856948852539, "global_step": 432605, "epoch": 2575} {"train_loss": -11.783132553100586, "global_step": 432606, "epoch": 2575} {"train_loss": -12.116796493530273, "global_step": 432607, "epoch": 2575} {"train_loss": -11.888548851013184, "global_step": 432608, "epoch": 2575} {"train_loss": -11.923871040344238, "global_step": 432609, "epoch": 2575} {"train_loss": -12.144654273986816, "global_step": 432610, "epoch": 2575} {"train_loss": -12.02156925201416, "global_step": 432611, "epoch": 2575} {"train_loss": -11.975196838378906, "global_step": 432612, "epoch": 2575} {"train_loss": -12.003119468688965, "global_step": 432613, "epoch": 2575} {"train_loss": -11.847972869873047, "global_step": 432614, "epoch": 2575} {"train_loss": -11.44312572479248, "global_step": 432615, "epoch": 2575} {"train_loss": -12.181680679321289, "global_step": 432616, "epoch": 2575} {"train_loss": -12.140830039978027, "global_step": 432617, "epoch": 2575} {"train_loss": -11.985065460205078, "global_step": 432618, "epoch": 2575} {"train_loss": -11.883318901062012, "global_step": 432619, "epoch": 2575} {"train_loss": -12.130102157592773, "global_step": 432620, "epoch": 2575} {"train_loss": -12.235007286071777, "global_step": 432621, "epoch": 2575} {"train_loss": -12.278621673583984, "global_step": 432622, "epoch": 2575} {"train_loss": -12.312203407287598, "global_step": 432623, "epoch": 2575} {"train_loss": -12.080206871032715, "global_step": 432624, "epoch": 2575} {"train_loss": -12.081008911132812, "global_step": 432625, "epoch": 2575} {"train_loss": -12.21229362487793, "global_step": 432626, "epoch": 2575} {"train_loss": -12.418220520019531, "global_step": 432627, "epoch": 2575} {"train_loss": -12.30212688446045, "global_step": 432628, "epoch": 2575} {"train_loss": -12.360382080078125, "global_step": 432629, "epoch": 2575} {"train_loss": -12.339590072631836, "global_step": 432630, "epoch": 2575} {"train_loss": -12.334053039550781, "global_step": 432631, "epoch": 2575} {"train_loss": -12.299541473388672, "global_step": 432632, "epoch": 2575} {"train_loss": -12.491068840026855, "global_step": 432633, "epoch": 2575} {"train_loss": -12.284814834594727, "global_step": 432634, "epoch": 2575} {"train_loss": -12.485163688659668, "global_step": 432635, "epoch": 2575} {"train_loss": -12.291187286376953, "global_step": 432636, "epoch": 2575} {"train_loss": -12.5020112991333, "global_step": 432637, "epoch": 2575} {"train_loss": -12.398113250732422, "global_step": 432638, "epoch": 2575} {"train_loss": -12.357097625732422, "global_step": 432639, "epoch": 2575} {"train_loss": -12.35439682006836, "global_step": 432640, "epoch": 2575} {"train_loss": -12.54935073852539, "global_step": 432641, "epoch": 2575} {"train_loss": -12.455610275268555, "global_step": 432642, "epoch": 2575} {"train_loss": -12.36482048034668, "global_step": 432643, "epoch": 2575} {"train_loss": -12.58363151550293, "global_step": 432644, "epoch": 2575} {"train_loss": -12.659629821777344, "global_step": 432645, "epoch": 2575} {"train_loss": -12.424976348876953, "global_step": 432646, "epoch": 2575} {"train_loss": -12.685437202453613, "global_step": 432647, "epoch": 2575} {"train_loss": -12.615848541259766, "global_step": 432648, "epoch": 2575} {"train_loss": -12.530588150024414, "global_step": 432649, "epoch": 2575} {"train_loss": -12.49237060546875, "global_step": 432650, "epoch": 2575} {"train_loss": -12.7510986328125, "global_step": 432651, "epoch": 2575} {"train_loss": -12.613484382629395, "global_step": 432652, "epoch": 2575} {"train_loss": -12.434171676635742, "global_step": 432653, "epoch": 2575} {"train_loss": -12.42002010345459, "global_step": 432654, "epoch": 2575} {"train_loss": -12.573793411254883, "global_step": 432655, "epoch": 2575} {"train_loss": -12.596883773803711, "global_step": 432656, "epoch": 2575} {"train_loss": -12.593507766723633, "global_step": 432657, "epoch": 2575} {"train_loss": -12.668825149536133, "global_step": 432658, "epoch": 2575} {"train_loss": -12.738617897033691, "global_step": 432659, "epoch": 2575} {"train_loss": -12.39093017578125, "global_step": 432660, "epoch": 2575} {"train_loss": -12.332662582397461, "global_step": 432661, "epoch": 2575} {"train_loss": -12.68916130065918, "global_step": 432662, "epoch": 2575} {"train_loss": -12.563055038452148, "global_step": 432663, "epoch": 2575} {"train_loss": -12.5057954788208, "global_step": 432664, "epoch": 2575} {"train_loss": -12.45156478881836, "global_step": 432665, "epoch": 2575} {"train_loss": -12.621204376220703, "global_step": 432666, "epoch": 2575} {"train_loss": -12.522892951965332, "global_step": 432667, "epoch": 2575} {"train_loss": -12.651388168334961, "global_step": 432668, "epoch": 2575} {"train_loss": -12.672460556030273, "global_step": 432669, "epoch": 2575} {"train_loss": -12.433686256408691, "global_step": 432670, "epoch": 2575} {"train_loss": -12.737289428710938, "global_step": 432671, "epoch": 2575} {"train_loss": -12.781747817993164, "global_step": 432672, "epoch": 2575} {"train_loss": -12.828662872314453, "global_step": 432673, "epoch": 2575} {"train_loss": -12.741029739379883, "global_step": 432674, "epoch": 2575} {"train_loss": -12.83637523651123, "global_step": 432675, "epoch": 2575} {"train_loss": -12.546209335327148, "global_step": 432676, "epoch": 2575} {"train_loss": -12.502163887023926, "global_step": 432677, "epoch": 2575} {"train_loss": -12.731952667236328, "global_step": 432678, "epoch": 2575} {"train_loss": -13.0284423828125, "global_step": 432679, "epoch": 2575} {"train_loss": -12.705436706542969, "global_step": 432680, "epoch": 2575} {"train_loss": -12.646191596984863, "global_step": 432681, "epoch": 2575} {"train_loss": -12.81770133972168, "global_step": 432682, "epoch": 2575} {"train_loss": -12.677129745483398, "global_step": 432683, "epoch": 2575} {"train_loss": -12.836278915405273, "global_step": 432684, "epoch": 2575} {"train_loss": -12.851667404174805, "global_step": 432685, "epoch": 2575} {"train_loss": -12.93867301940918, "global_step": 432686, "epoch": 2575} {"train_loss": -12.9000825881958, "global_step": 432687, "epoch": 2575} {"train_loss": -12.92336368560791, "global_step": 432688, "epoch": 2575} {"train_loss": -12.928333282470703, "global_step": 432689, "epoch": 2575} {"train_loss": -12.706931114196777, "global_step": 432690, "epoch": 2575} {"train_loss": -12.993782043457031, "global_step": 432691, "epoch": 2575} {"train_loss": -12.777183532714844, "global_step": 432692, "epoch": 2575} {"train_loss": -12.810622215270996, "global_step": 432693, "epoch": 2575} {"train_loss": -12.634101867675781, "global_step": 432694, "epoch": 2575} {"train_loss": -12.73281478881836, "global_step": 432695, "epoch": 2575} {"train_loss": -12.741490364074707, "global_step": 432696, "epoch": 2575} {"train_loss": -12.733558654785156, "global_step": 432697, "epoch": 2575} {"train_loss": -12.68199348449707, "global_step": 432698, "epoch": 2575} {"train_loss": -12.630084991455078, "global_step": 432699, "epoch": 2575} {"train_loss": -12.656770706176758, "global_step": 432700, "epoch": 2575} {"train_loss": -12.682469367980957, "global_step": 432701, "epoch": 2575} {"train_loss": -12.607421875, "global_step": 432702, "epoch": 2575} {"train_loss": -12.043558120727539, "global_step": 432703, "epoch": 2575} {"train_loss": -12.540231704711914, "global_step": 432704, "epoch": 2575} {"train_loss": -12.468548774719238, "global_step": 432705, "epoch": 2575} {"train_loss": -12.051273345947266, "global_step": 432706, "epoch": 2575} {"train_loss": -12.256092071533203, "global_step": 432707, "epoch": 2575} {"train_loss": -12.77325439453125, "global_step": 432708, "epoch": 2575} {"train_loss": -12.363349914550781, "global_step": 432709, "epoch": 2575} {"train_loss": -12.554373741149902, "global_step": 432710, "epoch": 2575} {"train_loss": -12.364684104919434, "global_step": 432711, "epoch": 2575} {"train_loss": -12.591360092163086, "global_step": 432712, "epoch": 2575} {"train_loss": -12.054576873779297, "global_step": 432713, "epoch": 2575} {"train_loss": -12.39792537689209, "global_step": 432714, "epoch": 2575} {"train_loss": -12.138238906860352, "global_step": 432715, "epoch": 2575} {"train_loss": -12.301795959472656, "global_step": 432716, "epoch": 2575} {"train_loss": -12.233856201171875, "global_step": 432717, "epoch": 2575} {"train_loss": -12.216775894165039, "global_step": 432718, "epoch": 2575} {"train_loss": -11.861114501953125, "global_step": 432719, "epoch": 2575} {"train_loss": -12.512811660766602, "global_step": 432720, "epoch": 2575} {"train_loss": -12.044132232666016, "global_step": 432721, "epoch": 2575} {"train_loss": -12.413873672485352, "global_step": 432722, "epoch": 2575} {"train_loss": -12.38834285736084, "global_step": 432723, "epoch": 2575} {"train_loss": -12.394672393798828, "global_step": 432724, "epoch": 2575} {"train_loss": -12.237030982971191, "global_step": 432725, "epoch": 2575} {"train_loss": -12.344327926635742, "global_step": 432726, "epoch": 2575} {"train_loss": -12.544941902160645, "global_step": 432727, "epoch": 2575} {"train_loss": -12.405669212341309, "global_step": 432728, "epoch": 2575} {"train_loss": -12.203075408935547, "global_step": 432729, "epoch": 2575} {"train_loss": -12.618891716003418, "global_step": 432730, "epoch": 2575} {"train_loss": -12.23965835571289, "global_step": 432731, "epoch": 2575} {"train_loss": -11.581412315368652, "global_step": 432732, "epoch": 2575} {"train_loss": -11.088808059692383, "global_step": 432733, "epoch": 2575} {"train_loss": -12.32426643371582, "global_step": 432734, "epoch": 2575} {"train_loss": -11.182989120483398, "global_step": 432735, "epoch": 2575} {"train_loss": -11.631446838378906, "global_step": 432736, "epoch": 2575} {"train_loss": -11.185609817504883, "global_step": 432737, "epoch": 2575} {"train_loss": -10.570415496826172, "global_step": 432738, "epoch": 2575} {"train_loss": -12.310075759887695, "global_step": 432739, "epoch": 2575} {"train_loss": -11.269098281860352, "global_step": 432740, "epoch": 2575} {"train_loss": -10.6207275390625, "global_step": 432741, "epoch": 2575} {"train_loss": -12.12691879272461, "global_step": 432742, "epoch": 2575} {"train_loss": -9.69653606414795, "global_step": 432743, "epoch": 2575} {"train_loss": -11.147592544555664, "global_step": 432744, "epoch": 2575} {"train_loss": -11.371160507202148, "global_step": 432745, "epoch": 2575} {"train_loss": -10.514507293701172, "global_step": 432746, "epoch": 2575} {"train_loss": -10.706944465637207, "global_step": 432747, "epoch": 2575} {"train_loss": -11.967511177062988, "global_step": 432748, "epoch": 2575} {"train_loss": -9.548843383789062, "global_step": 432749, "epoch": 2575} {"train_loss": -11.544008255004883, "global_step": 432750, "epoch": 2575} {"train_loss": -10.99195671081543, "global_step": 432751, "epoch": 2575} {"train_loss": -11.793547630310059, "global_step": 432752, "epoch": 2575} {"train_loss": -11.301172256469727, "global_step": 432753, "epoch": 2575} {"train_loss": -11.721342086791992, "global_step": 432754, "epoch": 2575} {"train_loss": -12.203654289245605, "global_step": 432755, "epoch": 2575} {"train_loss": -11.098562240600586, "global_step": 432756, "epoch": 2575} {"train_loss": -11.686086654663086, "global_step": 432757, "epoch": 2575} {"train_loss": -11.376527786254883, "global_step": 432758, "epoch": 2575} {"train_loss": -11.22362995147705, "global_step": 432759, "epoch": 2575} {"train_loss": -11.59675407409668, "global_step": 432760, "epoch": 2575} {"train_loss": -10.805692672729492, "global_step": 432761, "epoch": 2575} {"train_loss": -11.136858940124512, "global_step": 432762, "epoch": 2575} {"train_loss": -11.042909622192383, "global_step": 432763, "epoch": 2575} {"train_loss": -9.502532005310059, "global_step": 432764, "epoch": 2575} {"train_loss": -11.813590049743652, "global_step": 432765, "epoch": 2575} {"train_loss": -9.491544723510742, "global_step": 432766, "epoch": 2575} {"train_loss": -12.152449187778291, "global_step": 432767, "epoch": 2575, "val_loss": 312029.53125, "train_action_mse_error": 2.2483694553375244} {"train_loss": -10.79987907409668, "global_step": 432768, "epoch": 2576} {"train_loss": -10.339706420898438, "global_step": 432769, "epoch": 2576} {"train_loss": -10.550457000732422, "global_step": 432770, "epoch": 2576} {"train_loss": -9.670921325683594, "global_step": 432771, "epoch": 2576} {"train_loss": -10.842182159423828, "global_step": 432772, "epoch": 2576} {"train_loss": -10.174249649047852, "global_step": 432773, "epoch": 2576} {"train_loss": -11.272528648376465, "global_step": 432774, "epoch": 2576} {"train_loss": -10.199129104614258, "global_step": 432775, "epoch": 2576} {"train_loss": -11.282400131225586, "global_step": 432776, "epoch": 2576} {"train_loss": -11.525151252746582, "global_step": 432777, "epoch": 2576} {"train_loss": -11.106597900390625, "global_step": 432778, "epoch": 2576} {"train_loss": -11.292201042175293, "global_step": 432779, "epoch": 2576} {"train_loss": -11.067144393920898, "global_step": 432780, "epoch": 2576} {"train_loss": -11.59683609008789, "global_step": 432781, "epoch": 2576} {"train_loss": -11.98748779296875, "global_step": 432782, "epoch": 2576} {"train_loss": -11.629606246948242, "global_step": 432783, "epoch": 2576} {"train_loss": -11.668233871459961, "global_step": 432784, "epoch": 2576} {"train_loss": -11.71214485168457, "global_step": 432785, "epoch": 2576} {"train_loss": -12.225025177001953, "global_step": 432786, "epoch": 2576} {"train_loss": -12.096719741821289, "global_step": 432787, "epoch": 2576} {"train_loss": -11.83360481262207, "global_step": 432788, "epoch": 2576} {"train_loss": -11.9000883102417, "global_step": 432789, "epoch": 2576} {"train_loss": -11.431315422058105, "global_step": 432790, "epoch": 2576} {"train_loss": -12.164981842041016, "global_step": 432791, "epoch": 2576} {"train_loss": -11.809358596801758, "global_step": 432792, "epoch": 2576} {"train_loss": -12.077607154846191, "global_step": 432793, "epoch": 2576} {"train_loss": -12.3716459274292, "global_step": 432794, "epoch": 2576} {"train_loss": -12.120806694030762, "global_step": 432795, "epoch": 2576} {"train_loss": -12.207234382629395, "global_step": 432796, "epoch": 2576} {"train_loss": -12.049416542053223, "global_step": 432797, "epoch": 2576} {"train_loss": -12.047889709472656, "global_step": 432798, "epoch": 2576} {"train_loss": -12.19778823852539, "global_step": 432799, "epoch": 2576} {"train_loss": -12.180549621582031, "global_step": 432800, "epoch": 2576} {"train_loss": -11.964160919189453, "global_step": 432801, "epoch": 2576} {"train_loss": -12.374198913574219, "global_step": 432802, "epoch": 2576} {"train_loss": -12.029729843139648, "global_step": 432803, "epoch": 2576} {"train_loss": -12.242162704467773, "global_step": 432804, "epoch": 2576} {"train_loss": -12.331730842590332, "global_step": 432805, "epoch": 2576} {"train_loss": -12.259927749633789, "global_step": 432806, "epoch": 2576} {"train_loss": -12.397173881530762, "global_step": 432807, "epoch": 2576} {"train_loss": -12.556528091430664, "global_step": 432808, "epoch": 2576} {"train_loss": -12.28239631652832, "global_step": 432809, "epoch": 2576} {"train_loss": -12.507877349853516, "global_step": 432810, "epoch": 2576} {"train_loss": -12.3885498046875, "global_step": 432811, "epoch": 2576} {"train_loss": -12.475332260131836, "global_step": 432812, "epoch": 2576} {"train_loss": -12.265302658081055, "global_step": 432813, "epoch": 2576} {"train_loss": -12.494647979736328, "global_step": 432814, "epoch": 2576} {"train_loss": -12.583502769470215, "global_step": 432815, "epoch": 2576} {"train_loss": -12.250690460205078, "global_step": 432816, "epoch": 2576} {"train_loss": -12.354209899902344, "global_step": 432817, "epoch": 2576} {"train_loss": -12.558834075927734, "global_step": 432818, "epoch": 2576} {"train_loss": -12.203470230102539, "global_step": 432819, "epoch": 2576} {"train_loss": -12.348100662231445, "global_step": 432820, "epoch": 2576} {"train_loss": -12.396574974060059, "global_step": 432821, "epoch": 2576} {"train_loss": -12.432485580444336, "global_step": 432822, "epoch": 2576} {"train_loss": -12.295140266418457, "global_step": 432823, "epoch": 2576} {"train_loss": -12.381235122680664, "global_step": 432824, "epoch": 2576} {"train_loss": -12.231019973754883, "global_step": 432825, "epoch": 2576} {"train_loss": -12.320544242858887, "global_step": 432826, "epoch": 2576} {"train_loss": -12.454137802124023, "global_step": 432827, "epoch": 2576} {"train_loss": -12.38884162902832, "global_step": 432828, "epoch": 2576} {"train_loss": -12.493439674377441, "global_step": 432829, "epoch": 2576} {"train_loss": -12.016366004943848, "global_step": 432830, "epoch": 2576} {"train_loss": -12.457361221313477, "global_step": 432831, "epoch": 2576} {"train_loss": -12.276561737060547, "global_step": 432832, "epoch": 2576} {"train_loss": -12.491058349609375, "global_step": 432833, "epoch": 2576} {"train_loss": -12.167405128479004, "global_step": 432834, "epoch": 2576} {"train_loss": -12.483469009399414, "global_step": 432835, "epoch": 2576} {"train_loss": -12.295788764953613, "global_step": 432836, "epoch": 2576} {"train_loss": -12.580706596374512, "global_step": 432837, "epoch": 2576} {"train_loss": -12.368406295776367, "global_step": 432838, "epoch": 2576} {"train_loss": -12.603782653808594, "global_step": 432839, "epoch": 2576} {"train_loss": -12.715116500854492, "global_step": 432840, "epoch": 2576} {"train_loss": -12.413801193237305, "global_step": 432841, "epoch": 2576} {"train_loss": -12.790576934814453, "global_step": 432842, "epoch": 2576} {"train_loss": -12.37258529663086, "global_step": 432843, "epoch": 2576} {"train_loss": -12.704582214355469, "global_step": 432844, "epoch": 2576} {"train_loss": -12.632806777954102, "global_step": 432845, "epoch": 2576} {"train_loss": -12.851886749267578, "global_step": 432846, "epoch": 2576} {"train_loss": -12.56234359741211, "global_step": 432847, "epoch": 2576} {"train_loss": -12.687509536743164, "global_step": 432848, "epoch": 2576} {"train_loss": -12.941888809204102, "global_step": 432849, "epoch": 2576} {"train_loss": -12.469005584716797, "global_step": 432850, "epoch": 2576} {"train_loss": -12.57109260559082, "global_step": 432851, "epoch": 2576} {"train_loss": -12.706156730651855, "global_step": 432852, "epoch": 2576} {"train_loss": -12.447305679321289, "global_step": 432853, "epoch": 2576} {"train_loss": -12.452305793762207, "global_step": 432854, "epoch": 2576} {"train_loss": -12.648024559020996, "global_step": 432855, "epoch": 2576} {"train_loss": -12.640836715698242, "global_step": 432856, "epoch": 2576} {"train_loss": -12.652587890625, "global_step": 432857, "epoch": 2576} {"train_loss": -12.558005332946777, "global_step": 432858, "epoch": 2576} {"train_loss": -12.331829071044922, "global_step": 432859, "epoch": 2576} {"train_loss": -12.696128845214844, "global_step": 432860, "epoch": 2576} {"train_loss": -12.718331336975098, "global_step": 432861, "epoch": 2576} {"train_loss": -12.4568510055542, "global_step": 432862, "epoch": 2576} {"train_loss": -12.735336303710938, "global_step": 432863, "epoch": 2576} {"train_loss": -12.635273933410645, "global_step": 432864, "epoch": 2576} {"train_loss": -12.65068244934082, "global_step": 432865, "epoch": 2576} {"train_loss": -12.456758499145508, "global_step": 432866, "epoch": 2576} {"train_loss": -12.604347229003906, "global_step": 432867, "epoch": 2576} {"train_loss": -12.62138843536377, "global_step": 432868, "epoch": 2576} {"train_loss": -12.718544006347656, "global_step": 432869, "epoch": 2576} {"train_loss": -12.692171096801758, "global_step": 432870, "epoch": 2576} {"train_loss": -12.514408111572266, "global_step": 432871, "epoch": 2576} {"train_loss": -12.333638191223145, "global_step": 432872, "epoch": 2576} {"train_loss": -12.87618350982666, "global_step": 432873, "epoch": 2576} {"train_loss": -12.705209732055664, "global_step": 432874, "epoch": 2576} {"train_loss": -12.796775817871094, "global_step": 432875, "epoch": 2576} {"train_loss": -12.5465726852417, "global_step": 432876, "epoch": 2576} {"train_loss": -12.4942626953125, "global_step": 432877, "epoch": 2576} {"train_loss": -12.471189498901367, "global_step": 432878, "epoch": 2576} {"train_loss": -12.630779266357422, "global_step": 432879, "epoch": 2576} {"train_loss": -12.176506042480469, "global_step": 432880, "epoch": 2576} {"train_loss": -12.462620735168457, "global_step": 432881, "epoch": 2576} {"train_loss": -12.617630958557129, "global_step": 432882, "epoch": 2576} {"train_loss": -12.443791389465332, "global_step": 432883, "epoch": 2576} {"train_loss": -12.157429695129395, "global_step": 432884, "epoch": 2576} {"train_loss": -12.428777694702148, "global_step": 432885, "epoch": 2576} {"train_loss": -12.547663688659668, "global_step": 432886, "epoch": 2576} {"train_loss": -12.068355560302734, "global_step": 432887, "epoch": 2576} {"train_loss": -12.565908432006836, "global_step": 432888, "epoch": 2576} {"train_loss": -12.234999656677246, "global_step": 432889, "epoch": 2576} {"train_loss": -12.401873588562012, "global_step": 432890, "epoch": 2576} {"train_loss": -12.277283668518066, "global_step": 432891, "epoch": 2576} {"train_loss": -12.520581245422363, "global_step": 432892, "epoch": 2576} {"train_loss": -11.974958419799805, "global_step": 432893, "epoch": 2576} {"train_loss": -12.371977806091309, "global_step": 432894, "epoch": 2576} {"train_loss": -12.252240180969238, "global_step": 432895, "epoch": 2576} {"train_loss": -12.382469177246094, "global_step": 432896, "epoch": 2576} {"train_loss": -12.713982582092285, "global_step": 432897, "epoch": 2576} {"train_loss": -12.723848342895508, "global_step": 432898, "epoch": 2576} {"train_loss": -12.441946983337402, "global_step": 432899, "epoch": 2576} {"train_loss": -12.44826889038086, "global_step": 432900, "epoch": 2576} {"train_loss": -11.852276802062988, "global_step": 432901, "epoch": 2576} {"train_loss": -11.274871826171875, "global_step": 432902, "epoch": 2576} {"train_loss": -11.830862045288086, "global_step": 432903, "epoch": 2576} {"train_loss": -12.689016342163086, "global_step": 432904, "epoch": 2576} {"train_loss": -12.386665344238281, "global_step": 432905, "epoch": 2576} {"train_loss": -11.685667037963867, "global_step": 432906, "epoch": 2576} {"train_loss": -11.966405868530273, "global_step": 432907, "epoch": 2576} {"train_loss": -12.19125747680664, "global_step": 432908, "epoch": 2576} {"train_loss": -10.612815856933594, "global_step": 432909, "epoch": 2576} {"train_loss": -11.069393157958984, "global_step": 432910, "epoch": 2576} {"train_loss": -12.118350982666016, "global_step": 432911, "epoch": 2576} {"train_loss": -12.124166488647461, "global_step": 432912, "epoch": 2576} {"train_loss": -12.30820083618164, "global_step": 432913, "epoch": 2576} {"train_loss": -10.995776176452637, "global_step": 432914, "epoch": 2576} {"train_loss": -10.966408729553223, "global_step": 432915, "epoch": 2576} {"train_loss": -9.718893051147461, "global_step": 432916, "epoch": 2576} {"train_loss": -9.877996444702148, "global_step": 432917, "epoch": 2576} {"train_loss": -8.852926254272461, "global_step": 432918, "epoch": 2576} {"train_loss": -11.53408432006836, "global_step": 432919, "epoch": 2576} {"train_loss": -8.812909126281738, "global_step": 432920, "epoch": 2576} {"train_loss": -8.205778121948242, "global_step": 432921, "epoch": 2576} {"train_loss": -9.652071952819824, "global_step": 432922, "epoch": 2576} {"train_loss": -8.051064491271973, "global_step": 432923, "epoch": 2576} {"train_loss": -8.097280502319336, "global_step": 432924, "epoch": 2576} {"train_loss": -8.034341812133789, "global_step": 432925, "epoch": 2576} {"train_loss": -7.809178829193115, "global_step": 432926, "epoch": 2576} {"train_loss": -9.178828239440918, "global_step": 432927, "epoch": 2576} {"train_loss": -10.101003646850586, "global_step": 432928, "epoch": 2576} {"train_loss": -9.46088981628418, "global_step": 432929, "epoch": 2576} {"train_loss": -9.125163078308105, "global_step": 432930, "epoch": 2576} {"train_loss": -11.092753410339355, "global_step": 432931, "epoch": 2576} {"train_loss": -9.811727523803711, "global_step": 432932, "epoch": 2576} {"train_loss": -11.523966789245605, "global_step": 432933, "epoch": 2576} {"train_loss": -10.482065200805664, "global_step": 432934, "epoch": 2576} {"train_loss": -11.860557303542183, "global_step": 432935, "epoch": 2576, "val_loss": 302838.28125} {"train_loss": -11.372157096862793, "global_step": 432936, "epoch": 2577} {"train_loss": -10.550895690917969, "global_step": 432937, "epoch": 2577} {"train_loss": -10.18934440612793, "global_step": 432938, "epoch": 2577} {"train_loss": -11.433904647827148, "global_step": 432939, "epoch": 2577} {"train_loss": -10.93719482421875, "global_step": 432940, "epoch": 2577} {"train_loss": -10.901151657104492, "global_step": 432941, "epoch": 2577} {"train_loss": -11.86898422241211, "global_step": 432942, "epoch": 2577} {"train_loss": -10.734453201293945, "global_step": 432943, "epoch": 2577} {"train_loss": -11.410701751708984, "global_step": 432944, "epoch": 2577} {"train_loss": -11.47418212890625, "global_step": 432945, "epoch": 2577} {"train_loss": -10.944124221801758, "global_step": 432946, "epoch": 2577} {"train_loss": -12.02138900756836, "global_step": 432947, "epoch": 2577} {"train_loss": -11.292961120605469, "global_step": 432948, "epoch": 2577} {"train_loss": -11.687101364135742, "global_step": 432949, "epoch": 2577} {"train_loss": -11.583620071411133, "global_step": 432950, "epoch": 2577} {"train_loss": -10.989459037780762, "global_step": 432951, "epoch": 2577} {"train_loss": -11.932332038879395, "global_step": 432952, "epoch": 2577} {"train_loss": -11.52776050567627, "global_step": 432953, "epoch": 2577} {"train_loss": -11.001594543457031, "global_step": 432954, "epoch": 2577} {"train_loss": -11.657453536987305, "global_step": 432955, "epoch": 2577} {"train_loss": -11.32794189453125, "global_step": 432956, "epoch": 2577} {"train_loss": -11.247673034667969, "global_step": 432957, "epoch": 2577} {"train_loss": -11.770074844360352, "global_step": 432958, "epoch": 2577} {"train_loss": -10.825121879577637, "global_step": 432959, "epoch": 2577} {"train_loss": -12.102952003479004, "global_step": 432960, "epoch": 2577} {"train_loss": -11.535011291503906, "global_step": 432961, "epoch": 2577} {"train_loss": -11.743938446044922, "global_step": 432962, "epoch": 2577} {"train_loss": -12.089062690734863, "global_step": 432963, "epoch": 2577} {"train_loss": -11.790681838989258, "global_step": 432964, "epoch": 2577} {"train_loss": -12.073568344116211, "global_step": 432965, "epoch": 2577} {"train_loss": -12.159622192382812, "global_step": 432966, "epoch": 2577} {"train_loss": -11.994720458984375, "global_step": 432967, "epoch": 2577} {"train_loss": -12.075302124023438, "global_step": 432968, "epoch": 2577} {"train_loss": -12.421083450317383, "global_step": 432969, "epoch": 2577} {"train_loss": -12.090765953063965, "global_step": 432970, "epoch": 2577} {"train_loss": -12.369443893432617, "global_step": 432971, "epoch": 2577} {"train_loss": -12.184846878051758, "global_step": 432972, "epoch": 2577} {"train_loss": -12.076729774475098, "global_step": 432973, "epoch": 2577} {"train_loss": -12.548471450805664, "global_step": 432974, "epoch": 2577} {"train_loss": -12.283177375793457, "global_step": 432975, "epoch": 2577} {"train_loss": -12.289289474487305, "global_step": 432976, "epoch": 2577} {"train_loss": -12.47193717956543, "global_step": 432977, "epoch": 2577} {"train_loss": -12.23953628540039, "global_step": 432978, "epoch": 2577} {"train_loss": -12.404876708984375, "global_step": 432979, "epoch": 2577} {"train_loss": -12.314509391784668, "global_step": 432980, "epoch": 2577} {"train_loss": -12.275272369384766, "global_step": 432981, "epoch": 2577} {"train_loss": -12.453882217407227, "global_step": 432982, "epoch": 2577} {"train_loss": -12.562217712402344, "global_step": 432983, "epoch": 2577} {"train_loss": -12.522370338439941, "global_step": 432984, "epoch": 2577} {"train_loss": -12.444820404052734, "global_step": 432985, "epoch": 2577} {"train_loss": -12.639404296875, "global_step": 432986, "epoch": 2577} {"train_loss": -12.573161125183105, "global_step": 432987, "epoch": 2577} {"train_loss": -12.52475357055664, "global_step": 432988, "epoch": 2577} {"train_loss": -12.324963569641113, "global_step": 432989, "epoch": 2577} {"train_loss": -12.503240585327148, "global_step": 432990, "epoch": 2577} {"train_loss": -12.402162551879883, "global_step": 432991, "epoch": 2577} {"train_loss": -12.53502082824707, "global_step": 432992, "epoch": 2577} {"train_loss": -12.518216133117676, "global_step": 432993, "epoch": 2577} {"train_loss": -12.553913116455078, "global_step": 432994, "epoch": 2577} {"train_loss": -12.532382011413574, "global_step": 432995, "epoch": 2577} {"train_loss": -12.482895851135254, "global_step": 432996, "epoch": 2577} {"train_loss": -12.814872741699219, "global_step": 432997, "epoch": 2577} {"train_loss": -12.52653694152832, "global_step": 432998, "epoch": 2577} {"train_loss": -12.694826126098633, "global_step": 432999, "epoch": 2577} {"train_loss": -12.703436851501465, "global_step": 433000, "epoch": 2577} {"train_loss": -12.657686233520508, "global_step": 433001, "epoch": 2577} {"train_loss": -12.759830474853516, "global_step": 433002, "epoch": 2577} {"train_loss": -12.656534194946289, "global_step": 433003, "epoch": 2577} {"train_loss": -12.754327774047852, "global_step": 433004, "epoch": 2577} {"train_loss": -12.53756332397461, "global_step": 433005, "epoch": 2577} {"train_loss": -12.527167320251465, "global_step": 433006, "epoch": 2577} {"train_loss": -12.57205581665039, "global_step": 433007, "epoch": 2577} {"train_loss": -12.730693817138672, "global_step": 433008, "epoch": 2577} {"train_loss": -12.544639587402344, "global_step": 433009, "epoch": 2577} {"train_loss": -12.50577449798584, "global_step": 433010, "epoch": 2577} {"train_loss": -12.681118965148926, "global_step": 433011, "epoch": 2577} {"train_loss": -12.405108451843262, "global_step": 433012, "epoch": 2577} {"train_loss": -12.487116813659668, "global_step": 433013, "epoch": 2577} {"train_loss": -12.693782806396484, "global_step": 433014, "epoch": 2577} {"train_loss": -12.582720756530762, "global_step": 433015, "epoch": 2577} {"train_loss": -12.473175048828125, "global_step": 433016, "epoch": 2577} {"train_loss": -12.336191177368164, "global_step": 433017, "epoch": 2577} {"train_loss": -12.419910430908203, "global_step": 433018, "epoch": 2577} {"train_loss": -12.637386322021484, "global_step": 433019, "epoch": 2577} {"train_loss": -12.458568572998047, "global_step": 433020, "epoch": 2577} {"train_loss": -12.775873184204102, "global_step": 433021, "epoch": 2577} {"train_loss": -12.458511352539062, "global_step": 433022, "epoch": 2577} {"train_loss": -12.728312492370605, "global_step": 433023, "epoch": 2577} {"train_loss": -12.48133659362793, "global_step": 433024, "epoch": 2577} {"train_loss": -12.721571922302246, "global_step": 433025, "epoch": 2577} {"train_loss": -12.633100509643555, "global_step": 433026, "epoch": 2577} {"train_loss": -12.820039749145508, "global_step": 433027, "epoch": 2577} {"train_loss": -12.717610359191895, "global_step": 433028, "epoch": 2577} {"train_loss": -12.739704132080078, "global_step": 433029, "epoch": 2577} {"train_loss": -12.675907135009766, "global_step": 433030, "epoch": 2577} {"train_loss": -12.37481689453125, "global_step": 433031, "epoch": 2577} {"train_loss": -12.651483535766602, "global_step": 433032, "epoch": 2577} {"train_loss": -12.772003173828125, "global_step": 433033, "epoch": 2577} {"train_loss": -12.613128662109375, "global_step": 433034, "epoch": 2577} {"train_loss": -12.601856231689453, "global_step": 433035, "epoch": 2577} {"train_loss": -12.930042266845703, "global_step": 433036, "epoch": 2577} {"train_loss": -12.682392120361328, "global_step": 433037, "epoch": 2577} {"train_loss": -12.741426467895508, "global_step": 433038, "epoch": 2577} {"train_loss": -12.85280704498291, "global_step": 433039, "epoch": 2577} {"train_loss": -12.909603118896484, "global_step": 433040, "epoch": 2577} {"train_loss": -12.887843132019043, "global_step": 433041, "epoch": 2577} {"train_loss": -12.889761924743652, "global_step": 433042, "epoch": 2577} {"train_loss": -12.919075012207031, "global_step": 433043, "epoch": 2577} {"train_loss": -12.90321159362793, "global_step": 433044, "epoch": 2577} {"train_loss": -12.645553588867188, "global_step": 433045, "epoch": 2577} {"train_loss": -12.722199440002441, "global_step": 433046, "epoch": 2577} {"train_loss": -12.709473609924316, "global_step": 433047, "epoch": 2577} {"train_loss": -12.525270462036133, "global_step": 433048, "epoch": 2577} {"train_loss": -12.707953453063965, "global_step": 433049, "epoch": 2577} {"train_loss": -12.274815559387207, "global_step": 433050, "epoch": 2577} {"train_loss": -12.781987190246582, "global_step": 433051, "epoch": 2577} {"train_loss": -12.212676048278809, "global_step": 433052, "epoch": 2577} {"train_loss": -12.519287109375, "global_step": 433053, "epoch": 2577} {"train_loss": -12.058340072631836, "global_step": 433054, "epoch": 2577} {"train_loss": -12.450899124145508, "global_step": 433055, "epoch": 2577} {"train_loss": -11.657291412353516, "global_step": 433056, "epoch": 2577} {"train_loss": -11.961485862731934, "global_step": 433057, "epoch": 2577} {"train_loss": -12.262612342834473, "global_step": 433058, "epoch": 2577} {"train_loss": -12.155325889587402, "global_step": 433059, "epoch": 2577} {"train_loss": -11.531729698181152, "global_step": 433060, "epoch": 2577} {"train_loss": -11.926977157592773, "global_step": 433061, "epoch": 2577} {"train_loss": -11.85881519317627, "global_step": 433062, "epoch": 2577} {"train_loss": -11.548212051391602, "global_step": 433063, "epoch": 2577} {"train_loss": -10.775390625, "global_step": 433064, "epoch": 2577} {"train_loss": -11.212167739868164, "global_step": 433065, "epoch": 2577} {"train_loss": -11.164190292358398, "global_step": 433066, "epoch": 2577} {"train_loss": -11.380376815795898, "global_step": 433067, "epoch": 2577} {"train_loss": -10.146208763122559, "global_step": 433068, "epoch": 2577} {"train_loss": -11.655485153198242, "global_step": 433069, "epoch": 2577} {"train_loss": -11.394950866699219, "global_step": 433070, "epoch": 2577} {"train_loss": -10.354575157165527, "global_step": 433071, "epoch": 2577} {"train_loss": -10.747069358825684, "global_step": 433072, "epoch": 2577} {"train_loss": -10.948486328125, "global_step": 433073, "epoch": 2577} {"train_loss": -10.955419540405273, "global_step": 433074, "epoch": 2577} {"train_loss": -10.882415771484375, "global_step": 433075, "epoch": 2577} {"train_loss": -8.953926086425781, "global_step": 433076, "epoch": 2577} {"train_loss": -9.209331512451172, "global_step": 433077, "epoch": 2577} {"train_loss": -10.473139762878418, "global_step": 433078, "epoch": 2577} {"train_loss": -10.856084823608398, "global_step": 433079, "epoch": 2577} {"train_loss": -9.867517471313477, "global_step": 433080, "epoch": 2577} {"train_loss": -11.386667251586914, "global_step": 433081, "epoch": 2577} {"train_loss": -11.141826629638672, "global_step": 433082, "epoch": 2577} {"train_loss": -9.69102668762207, "global_step": 433083, "epoch": 2577} {"train_loss": -11.594011306762695, "global_step": 433084, "epoch": 2577} {"train_loss": -10.67725944519043, "global_step": 433085, "epoch": 2577} {"train_loss": -9.145675659179688, "global_step": 433086, "epoch": 2577} {"train_loss": -11.41651725769043, "global_step": 433087, "epoch": 2577} {"train_loss": -9.673196792602539, "global_step": 433088, "epoch": 2577} {"train_loss": -11.66977310180664, "global_step": 433089, "epoch": 2577} {"train_loss": -10.707677841186523, "global_step": 433090, "epoch": 2577} {"train_loss": -11.341114044189453, "global_step": 433091, "epoch": 2577} {"train_loss": -11.82583999633789, "global_step": 433092, "epoch": 2577} {"train_loss": -11.231999397277832, "global_step": 433093, "epoch": 2577} {"train_loss": -12.10886001586914, "global_step": 433094, "epoch": 2577} {"train_loss": -10.921407699584961, "global_step": 433095, "epoch": 2577} {"train_loss": -11.939603805541992, "global_step": 433096, "epoch": 2577} {"train_loss": -11.746667861938477, "global_step": 433097, "epoch": 2577} {"train_loss": -12.106637954711914, "global_step": 433098, "epoch": 2577} {"train_loss": -11.838274002075195, "global_step": 433099, "epoch": 2577} {"train_loss": -11.990303039550781, "global_step": 433100, "epoch": 2577} {"train_loss": -12.168635368347168, "global_step": 433101, "epoch": 2577} {"train_loss": -12.197731971740723, "global_step": 433102, "epoch": 2577} {"train_loss": -11.949276997929527, "global_step": 433103, "epoch": 2577, "val_loss": 306486.59375} {"train_loss": -12.03054428100586, "global_step": 433104, "epoch": 2578} {"train_loss": -12.015840530395508, "global_step": 433105, "epoch": 2578} {"train_loss": -12.092968940734863, "global_step": 433106, "epoch": 2578} {"train_loss": -11.90265941619873, "global_step": 433107, "epoch": 2578} {"train_loss": -12.054886817932129, "global_step": 433108, "epoch": 2578} {"train_loss": -12.134449005126953, "global_step": 433109, "epoch": 2578} {"train_loss": -12.237260818481445, "global_step": 433110, "epoch": 2578} {"train_loss": -12.112713813781738, "global_step": 433111, "epoch": 2578} {"train_loss": -11.885787963867188, "global_step": 433112, "epoch": 2578} {"train_loss": -11.937644958496094, "global_step": 433113, "epoch": 2578} {"train_loss": -12.178394317626953, "global_step": 433114, "epoch": 2578} {"train_loss": -12.193224906921387, "global_step": 433115, "epoch": 2578} {"train_loss": -12.150577545166016, "global_step": 433116, "epoch": 2578} {"train_loss": -11.990867614746094, "global_step": 433117, "epoch": 2578} {"train_loss": -12.523653984069824, "global_step": 433118, "epoch": 2578} {"train_loss": -12.174325942993164, "global_step": 433119, "epoch": 2578} {"train_loss": -12.357820510864258, "global_step": 433120, "epoch": 2578} {"train_loss": -11.874005317687988, "global_step": 433121, "epoch": 2578} {"train_loss": -12.25295639038086, "global_step": 433122, "epoch": 2578} {"train_loss": -12.299293518066406, "global_step": 433123, "epoch": 2578} {"train_loss": -12.05085563659668, "global_step": 433124, "epoch": 2578} {"train_loss": -12.486098289489746, "global_step": 433125, "epoch": 2578} {"train_loss": -11.864480972290039, "global_step": 433126, "epoch": 2578} {"train_loss": -12.269335746765137, "global_step": 433127, "epoch": 2578} {"train_loss": -11.778077125549316, "global_step": 433128, "epoch": 2578} {"train_loss": -12.554793357849121, "global_step": 433129, "epoch": 2578} {"train_loss": -11.924949645996094, "global_step": 433130, "epoch": 2578} {"train_loss": -12.165031433105469, "global_step": 433131, "epoch": 2578} {"train_loss": -11.74224853515625, "global_step": 433132, "epoch": 2578} {"train_loss": -12.154630661010742, "global_step": 433133, "epoch": 2578} {"train_loss": -11.828557968139648, "global_step": 433134, "epoch": 2578} {"train_loss": -12.088744163513184, "global_step": 433135, "epoch": 2578} {"train_loss": -12.108161926269531, "global_step": 433136, "epoch": 2578} {"train_loss": -12.328649520874023, "global_step": 433137, "epoch": 2578} {"train_loss": -11.877842903137207, "global_step": 433138, "epoch": 2578} {"train_loss": -12.07149600982666, "global_step": 433139, "epoch": 2578} {"train_loss": -11.715417861938477, "global_step": 433140, "epoch": 2578} {"train_loss": -12.335308074951172, "global_step": 433141, "epoch": 2578} {"train_loss": -12.206491470336914, "global_step": 433142, "epoch": 2578} {"train_loss": -12.28849983215332, "global_step": 433143, "epoch": 2578} {"train_loss": -12.319145202636719, "global_step": 433144, "epoch": 2578} {"train_loss": -12.13034439086914, "global_step": 433145, "epoch": 2578} {"train_loss": -12.547675132751465, "global_step": 433146, "epoch": 2578} {"train_loss": -12.053385734558105, "global_step": 433147, "epoch": 2578} {"train_loss": -12.416953086853027, "global_step": 433148, "epoch": 2578} {"train_loss": -12.137907981872559, "global_step": 433149, "epoch": 2578} {"train_loss": -12.142269134521484, "global_step": 433150, "epoch": 2578} {"train_loss": -12.207460403442383, "global_step": 433151, "epoch": 2578} {"train_loss": -12.24699592590332, "global_step": 433152, "epoch": 2578} {"train_loss": -12.550024032592773, "global_step": 433153, "epoch": 2578} {"train_loss": -12.56648063659668, "global_step": 433154, "epoch": 2578} {"train_loss": -12.1866455078125, "global_step": 433155, "epoch": 2578} {"train_loss": -12.475679397583008, "global_step": 433156, "epoch": 2578} {"train_loss": -12.376370429992676, "global_step": 433157, "epoch": 2578} {"train_loss": -12.655776023864746, "global_step": 433158, "epoch": 2578} {"train_loss": -12.580820083618164, "global_step": 433159, "epoch": 2578} {"train_loss": -12.623147964477539, "global_step": 433160, "epoch": 2578} {"train_loss": -12.556540489196777, "global_step": 433161, "epoch": 2578} {"train_loss": -12.492390632629395, "global_step": 433162, "epoch": 2578} {"train_loss": -12.369503021240234, "global_step": 433163, "epoch": 2578} {"train_loss": -12.545509338378906, "global_step": 433164, "epoch": 2578} {"train_loss": -12.46701431274414, "global_step": 433165, "epoch": 2578} {"train_loss": -12.56582260131836, "global_step": 433166, "epoch": 2578} {"train_loss": -12.485468864440918, "global_step": 433167, "epoch": 2578} {"train_loss": -12.702960014343262, "global_step": 433168, "epoch": 2578} {"train_loss": -12.40516471862793, "global_step": 433169, "epoch": 2578} {"train_loss": -12.70246696472168, "global_step": 433170, "epoch": 2578} {"train_loss": -12.585844039916992, "global_step": 433171, "epoch": 2578} {"train_loss": -12.688408851623535, "global_step": 433172, "epoch": 2578} {"train_loss": -12.750203132629395, "global_step": 433173, "epoch": 2578} {"train_loss": -12.525693893432617, "global_step": 433174, "epoch": 2578} {"train_loss": -12.782523155212402, "global_step": 433175, "epoch": 2578} {"train_loss": -12.740015029907227, "global_step": 433176, "epoch": 2578} {"train_loss": -12.615915298461914, "global_step": 433177, "epoch": 2578} {"train_loss": -12.62809944152832, "global_step": 433178, "epoch": 2578} {"train_loss": -12.38782024383545, "global_step": 433179, "epoch": 2578} {"train_loss": -12.713375091552734, "global_step": 433180, "epoch": 2578} {"train_loss": -12.6135892868042, "global_step": 433181, "epoch": 2578} {"train_loss": -12.732793807983398, "global_step": 433182, "epoch": 2578} {"train_loss": -12.757189750671387, "global_step": 433183, "epoch": 2578} {"train_loss": -12.833967208862305, "global_step": 433184, "epoch": 2578} {"train_loss": -12.7290678024292, "global_step": 433185, "epoch": 2578} {"train_loss": -12.955850601196289, "global_step": 433186, "epoch": 2578} {"train_loss": -12.893278121948242, "global_step": 433187, "epoch": 2578} {"train_loss": -12.906898498535156, "global_step": 433188, "epoch": 2578} {"train_loss": -12.660839080810547, "global_step": 433189, "epoch": 2578} {"train_loss": -12.670166015625, "global_step": 433190, "epoch": 2578} {"train_loss": -12.548196792602539, "global_step": 433191, "epoch": 2578} {"train_loss": -12.689998626708984, "global_step": 433192, "epoch": 2578} {"train_loss": -12.707319259643555, "global_step": 433193, "epoch": 2578} {"train_loss": -12.427061080932617, "global_step": 433194, "epoch": 2578} {"train_loss": -12.517423629760742, "global_step": 433195, "epoch": 2578} {"train_loss": -12.7225341796875, "global_step": 433196, "epoch": 2578} {"train_loss": -12.351430892944336, "global_step": 433197, "epoch": 2578} {"train_loss": -12.772432327270508, "global_step": 433198, "epoch": 2578} {"train_loss": -12.26767635345459, "global_step": 433199, "epoch": 2578} {"train_loss": -13.026115417480469, "global_step": 433200, "epoch": 2578} {"train_loss": -12.501748085021973, "global_step": 433201, "epoch": 2578} {"train_loss": -12.894756317138672, "global_step": 433202, "epoch": 2578} {"train_loss": -12.13321304321289, "global_step": 433203, "epoch": 2578} {"train_loss": -12.631258010864258, "global_step": 433204, "epoch": 2578} {"train_loss": -12.173821449279785, "global_step": 433205, "epoch": 2578} {"train_loss": -11.837236404418945, "global_step": 433206, "epoch": 2578} {"train_loss": -12.185897827148438, "global_step": 433207, "epoch": 2578} {"train_loss": -12.299748420715332, "global_step": 433208, "epoch": 2578} {"train_loss": -12.507339477539062, "global_step": 433209, "epoch": 2578} {"train_loss": -12.171256065368652, "global_step": 433210, "epoch": 2578} {"train_loss": -12.843401908874512, "global_step": 433211, "epoch": 2578} {"train_loss": -12.561538696289062, "global_step": 433212, "epoch": 2578} {"train_loss": -12.77943229675293, "global_step": 433213, "epoch": 2578} {"train_loss": -12.560603141784668, "global_step": 433214, "epoch": 2578} {"train_loss": -12.838323593139648, "global_step": 433215, "epoch": 2578} {"train_loss": -12.547727584838867, "global_step": 433216, "epoch": 2578} {"train_loss": -12.693554878234863, "global_step": 433217, "epoch": 2578} {"train_loss": -12.46513557434082, "global_step": 433218, "epoch": 2578} {"train_loss": -11.861148834228516, "global_step": 433219, "epoch": 2578} {"train_loss": -11.68764877319336, "global_step": 433220, "epoch": 2578} {"train_loss": -12.184896469116211, "global_step": 433221, "epoch": 2578} {"train_loss": -12.472713470458984, "global_step": 433222, "epoch": 2578} {"train_loss": -11.506595611572266, "global_step": 433223, "epoch": 2578} {"train_loss": -11.662403106689453, "global_step": 433224, "epoch": 2578} {"train_loss": -12.17155933380127, "global_step": 433225, "epoch": 2578} {"train_loss": -11.630602836608887, "global_step": 433226, "epoch": 2578} {"train_loss": -11.047744750976562, "global_step": 433227, "epoch": 2578} {"train_loss": -10.614608764648438, "global_step": 433228, "epoch": 2578} {"train_loss": -11.679039001464844, "global_step": 433229, "epoch": 2578} {"train_loss": -12.445085525512695, "global_step": 433230, "epoch": 2578} {"train_loss": -12.710063934326172, "global_step": 433231, "epoch": 2578} {"train_loss": -12.133359909057617, "global_step": 433232, "epoch": 2578} {"train_loss": -12.384095191955566, "global_step": 433233, "epoch": 2578} {"train_loss": -11.527381896972656, "global_step": 433234, "epoch": 2578} {"train_loss": -12.340822219848633, "global_step": 433235, "epoch": 2578} {"train_loss": -12.151859283447266, "global_step": 433236, "epoch": 2578} {"train_loss": -11.988910675048828, "global_step": 433237, "epoch": 2578} {"train_loss": -12.10809326171875, "global_step": 433238, "epoch": 2578} {"train_loss": -12.567462921142578, "global_step": 433239, "epoch": 2578} {"train_loss": -12.130542755126953, "global_step": 433240, "epoch": 2578} {"train_loss": -12.481231689453125, "global_step": 433241, "epoch": 2578} {"train_loss": -12.467397689819336, "global_step": 433242, "epoch": 2578} {"train_loss": -12.340805053710938, "global_step": 433243, "epoch": 2578} {"train_loss": -12.22457504272461, "global_step": 433244, "epoch": 2578} {"train_loss": -12.786429405212402, "global_step": 433245, "epoch": 2578} {"train_loss": -12.163606643676758, "global_step": 433246, "epoch": 2578} {"train_loss": -12.638046264648438, "global_step": 433247, "epoch": 2578} {"train_loss": -12.407327651977539, "global_step": 433248, "epoch": 2578} {"train_loss": -12.495527267456055, "global_step": 433249, "epoch": 2578} {"train_loss": -12.048393249511719, "global_step": 433250, "epoch": 2578} {"train_loss": -12.36468505859375, "global_step": 433251, "epoch": 2578} {"train_loss": -11.816228866577148, "global_step": 433252, "epoch": 2578} {"train_loss": -12.343063354492188, "global_step": 433253, "epoch": 2578} {"train_loss": -12.284974098205566, "global_step": 433254, "epoch": 2578} {"train_loss": -11.500731468200684, "global_step": 433255, "epoch": 2578} {"train_loss": -12.200793266296387, "global_step": 433256, "epoch": 2578} {"train_loss": -12.168973922729492, "global_step": 433257, "epoch": 2578} {"train_loss": -11.346482276916504, "global_step": 433258, "epoch": 2578} {"train_loss": -12.313011169433594, "global_step": 433259, "epoch": 2578} {"train_loss": -11.445624351501465, "global_step": 433260, "epoch": 2578} {"train_loss": -11.864336013793945, "global_step": 433261, "epoch": 2578} {"train_loss": -12.42891788482666, "global_step": 433262, "epoch": 2578} {"train_loss": -11.773165702819824, "global_step": 433263, "epoch": 2578} {"train_loss": -11.16986083984375, "global_step": 433264, "epoch": 2578} {"train_loss": -11.4555025100708, "global_step": 433265, "epoch": 2578} {"train_loss": -12.149703979492188, "global_step": 433266, "epoch": 2578} {"train_loss": -10.773773193359375, "global_step": 433267, "epoch": 2578} {"train_loss": -10.939846992492676, "global_step": 433268, "epoch": 2578} {"train_loss": -11.61507797241211, "global_step": 433269, "epoch": 2578} {"train_loss": -8.822641372680664, "global_step": 433270, "epoch": 2578} {"train_loss": -12.231421873683022, "global_step": 433271, "epoch": 2578, "val_loss": 311393.71875} {"train_loss": -9.004864692687988, "global_step": 433272, "epoch": 2579} {"train_loss": -7.971158504486084, "global_step": 433273, "epoch": 2579} {"train_loss": -9.786264419555664, "global_step": 433274, "epoch": 2579} {"train_loss": -9.581193923950195, "global_step": 433275, "epoch": 2579} {"train_loss": -10.374235153198242, "global_step": 433276, "epoch": 2579} {"train_loss": -10.078826904296875, "global_step": 433277, "epoch": 2579} {"train_loss": -10.797121047973633, "global_step": 433278, "epoch": 2579} {"train_loss": -11.02257251739502, "global_step": 433279, "epoch": 2579} {"train_loss": -10.117998123168945, "global_step": 433280, "epoch": 2579} {"train_loss": -9.443693161010742, "global_step": 433281, "epoch": 2579} {"train_loss": -10.18526554107666, "global_step": 433282, "epoch": 2579} {"train_loss": -10.7288179397583, "global_step": 433283, "epoch": 2579} {"train_loss": -9.810977935791016, "global_step": 433284, "epoch": 2579} {"train_loss": -11.395849227905273, "global_step": 433285, "epoch": 2579} {"train_loss": -9.722162246704102, "global_step": 433286, "epoch": 2579} {"train_loss": -11.01357650756836, "global_step": 433287, "epoch": 2579} {"train_loss": -10.409341812133789, "global_step": 433288, "epoch": 2579} {"train_loss": -11.451936721801758, "global_step": 433289, "epoch": 2579} {"train_loss": -11.252098083496094, "global_step": 433290, "epoch": 2579} {"train_loss": -10.908010482788086, "global_step": 433291, "epoch": 2579} {"train_loss": -11.51749038696289, "global_step": 433292, "epoch": 2579} {"train_loss": -10.683052062988281, "global_step": 433293, "epoch": 2579} {"train_loss": -11.639184951782227, "global_step": 433294, "epoch": 2579} {"train_loss": -10.645225524902344, "global_step": 433295, "epoch": 2579} {"train_loss": -11.55413818359375, "global_step": 433296, "epoch": 2579} {"train_loss": -11.363816261291504, "global_step": 433297, "epoch": 2579} {"train_loss": -11.651816368103027, "global_step": 433298, "epoch": 2579} {"train_loss": -11.770761489868164, "global_step": 433299, "epoch": 2579} {"train_loss": -11.489784240722656, "global_step": 433300, "epoch": 2579} {"train_loss": -12.099668502807617, "global_step": 433301, "epoch": 2579} {"train_loss": -11.677102088928223, "global_step": 433302, "epoch": 2579} {"train_loss": -11.892040252685547, "global_step": 433303, "epoch": 2579} {"train_loss": -11.80750846862793, "global_step": 433304, "epoch": 2579} {"train_loss": -11.757791519165039, "global_step": 433305, "epoch": 2579} {"train_loss": -11.563309669494629, "global_step": 433306, "epoch": 2579} {"train_loss": -12.079544067382812, "global_step": 433307, "epoch": 2579} {"train_loss": -11.97507381439209, "global_step": 433308, "epoch": 2579} {"train_loss": -11.488311767578125, "global_step": 433309, "epoch": 2579} {"train_loss": -11.827594757080078, "global_step": 433310, "epoch": 2579} {"train_loss": -11.73476791381836, "global_step": 433311, "epoch": 2579} {"train_loss": -11.823387145996094, "global_step": 433312, "epoch": 2579} {"train_loss": -11.796101570129395, "global_step": 433313, "epoch": 2579} {"train_loss": -11.520641326904297, "global_step": 433314, "epoch": 2579} {"train_loss": -11.936565399169922, "global_step": 433315, "epoch": 2579} {"train_loss": -11.82776165008545, "global_step": 433316, "epoch": 2579} {"train_loss": -12.015392303466797, "global_step": 433317, "epoch": 2579} {"train_loss": -12.028088569641113, "global_step": 433318, "epoch": 2579} {"train_loss": -11.68563175201416, "global_step": 433319, "epoch": 2579} {"train_loss": -12.012750625610352, "global_step": 433320, "epoch": 2579} {"train_loss": -11.832242012023926, "global_step": 433321, "epoch": 2579} {"train_loss": -12.105205535888672, "global_step": 433322, "epoch": 2579} {"train_loss": -11.680797576904297, "global_step": 433323, "epoch": 2579} {"train_loss": -11.894237518310547, "global_step": 433324, "epoch": 2579} {"train_loss": -12.099181175231934, "global_step": 433325, "epoch": 2579} {"train_loss": -12.33061408996582, "global_step": 433326, "epoch": 2579} {"train_loss": -12.226272583007812, "global_step": 433327, "epoch": 2579} {"train_loss": -12.259576797485352, "global_step": 433328, "epoch": 2579} {"train_loss": -12.411020278930664, "global_step": 433329, "epoch": 2579} {"train_loss": -12.154255867004395, "global_step": 433330, "epoch": 2579} {"train_loss": -12.207233428955078, "global_step": 433331, "epoch": 2579} {"train_loss": -12.357601165771484, "global_step": 433332, "epoch": 2579} {"train_loss": -12.333066940307617, "global_step": 433333, "epoch": 2579} {"train_loss": -12.319973945617676, "global_step": 433334, "epoch": 2579} {"train_loss": -12.476627349853516, "global_step": 433335, "epoch": 2579} {"train_loss": -12.270424842834473, "global_step": 433336, "epoch": 2579} {"train_loss": -12.492884635925293, "global_step": 433337, "epoch": 2579} {"train_loss": -12.134132385253906, "global_step": 433338, "epoch": 2579} {"train_loss": -12.334781646728516, "global_step": 433339, "epoch": 2579} {"train_loss": -12.378864288330078, "global_step": 433340, "epoch": 2579} {"train_loss": -12.539310455322266, "global_step": 433341, "epoch": 2579} {"train_loss": -12.594223976135254, "global_step": 433342, "epoch": 2579} {"train_loss": -12.648027420043945, "global_step": 433343, "epoch": 2579} {"train_loss": -12.593826293945312, "global_step": 433344, "epoch": 2579} {"train_loss": -12.583415985107422, "global_step": 433345, "epoch": 2579} {"train_loss": -12.44422721862793, "global_step": 433346, "epoch": 2579} {"train_loss": -12.62640380859375, "global_step": 433347, "epoch": 2579} {"train_loss": -12.41426944732666, "global_step": 433348, "epoch": 2579} {"train_loss": -12.541610717773438, "global_step": 433349, "epoch": 2579} {"train_loss": -12.782841682434082, "global_step": 433350, "epoch": 2579} {"train_loss": -12.607192993164062, "global_step": 433351, "epoch": 2579} {"train_loss": -12.605611801147461, "global_step": 433352, "epoch": 2579} {"train_loss": -12.572587966918945, "global_step": 433353, "epoch": 2579} {"train_loss": -12.672225952148438, "global_step": 433354, "epoch": 2579} {"train_loss": -12.769787788391113, "global_step": 433355, "epoch": 2579} {"train_loss": -12.686742782592773, "global_step": 433356, "epoch": 2579} {"train_loss": -12.708576202392578, "global_step": 433357, "epoch": 2579} {"train_loss": -12.46078109741211, "global_step": 433358, "epoch": 2579} {"train_loss": -12.873555183410645, "global_step": 433359, "epoch": 2579} {"train_loss": -12.558393478393555, "global_step": 433360, "epoch": 2579} {"train_loss": -12.851259231567383, "global_step": 433361, "epoch": 2579} {"train_loss": -12.650396347045898, "global_step": 433362, "epoch": 2579} {"train_loss": -12.655214309692383, "global_step": 433363, "epoch": 2579} {"train_loss": -12.582063674926758, "global_step": 433364, "epoch": 2579} {"train_loss": -12.697342872619629, "global_step": 433365, "epoch": 2579} {"train_loss": -12.482004165649414, "global_step": 433366, "epoch": 2579} {"train_loss": -12.659647941589355, "global_step": 433367, "epoch": 2579} {"train_loss": -12.674030303955078, "global_step": 433368, "epoch": 2579} {"train_loss": -12.814861297607422, "global_step": 433369, "epoch": 2579} {"train_loss": -12.51304817199707, "global_step": 433370, "epoch": 2579} {"train_loss": -12.617328643798828, "global_step": 433371, "epoch": 2579} {"train_loss": -12.844955444335938, "global_step": 433372, "epoch": 2579} {"train_loss": -12.693231582641602, "global_step": 433373, "epoch": 2579} {"train_loss": -12.433780670166016, "global_step": 433374, "epoch": 2579} {"train_loss": -12.842300415039062, "global_step": 433375, "epoch": 2579} {"train_loss": -12.701695442199707, "global_step": 433376, "epoch": 2579} {"train_loss": -12.704052925109863, "global_step": 433377, "epoch": 2579} {"train_loss": -12.655498504638672, "global_step": 433378, "epoch": 2579} {"train_loss": -12.88034439086914, "global_step": 433379, "epoch": 2579} {"train_loss": -12.798635482788086, "global_step": 433380, "epoch": 2579} {"train_loss": -12.631074905395508, "global_step": 433381, "epoch": 2579} {"train_loss": -12.897539138793945, "global_step": 433382, "epoch": 2579} {"train_loss": -12.630043029785156, "global_step": 433383, "epoch": 2579} {"train_loss": -12.704458236694336, "global_step": 433384, "epoch": 2579} {"train_loss": -12.833913803100586, "global_step": 433385, "epoch": 2579} {"train_loss": -12.792903900146484, "global_step": 433386, "epoch": 2579} {"train_loss": -12.345380783081055, "global_step": 433387, "epoch": 2579} {"train_loss": -12.377767562866211, "global_step": 433388, "epoch": 2579} {"train_loss": -12.487713813781738, "global_step": 433389, "epoch": 2579} {"train_loss": -12.001644134521484, "global_step": 433390, "epoch": 2579} {"train_loss": -11.978872299194336, "global_step": 433391, "epoch": 2579} {"train_loss": -12.205696105957031, "global_step": 433392, "epoch": 2579} {"train_loss": -12.315132141113281, "global_step": 433393, "epoch": 2579} {"train_loss": -12.507560729980469, "global_step": 433394, "epoch": 2579} {"train_loss": -12.421032905578613, "global_step": 433395, "epoch": 2579} {"train_loss": -12.755414962768555, "global_step": 433396, "epoch": 2579} {"train_loss": -12.380982398986816, "global_step": 433397, "epoch": 2579} {"train_loss": -12.563949584960938, "global_step": 433398, "epoch": 2579} {"train_loss": -12.54156494140625, "global_step": 433399, "epoch": 2579} {"train_loss": -12.875320434570312, "global_step": 433400, "epoch": 2579} {"train_loss": -12.583561897277832, "global_step": 433401, "epoch": 2579} {"train_loss": -12.388137817382812, "global_step": 433402, "epoch": 2579} {"train_loss": -12.136828422546387, "global_step": 433403, "epoch": 2579} {"train_loss": -12.594718933105469, "global_step": 433404, "epoch": 2579} {"train_loss": -12.182684898376465, "global_step": 433405, "epoch": 2579} {"train_loss": -11.832026481628418, "global_step": 433406, "epoch": 2579} {"train_loss": -12.012626647949219, "global_step": 433407, "epoch": 2579} {"train_loss": -12.64090347290039, "global_step": 433408, "epoch": 2579} {"train_loss": -11.869558334350586, "global_step": 433409, "epoch": 2579} {"train_loss": -11.54106330871582, "global_step": 433410, "epoch": 2579} {"train_loss": -12.069828033447266, "global_step": 433411, "epoch": 2579} {"train_loss": -11.682893753051758, "global_step": 433412, "epoch": 2579} {"train_loss": -11.905739784240723, "global_step": 433413, "epoch": 2579} {"train_loss": -11.623241424560547, "global_step": 433414, "epoch": 2579} {"train_loss": -12.446358680725098, "global_step": 433415, "epoch": 2579} {"train_loss": -11.735382080078125, "global_step": 433416, "epoch": 2579} {"train_loss": -10.713996887207031, "global_step": 433417, "epoch": 2579} {"train_loss": -11.94521427154541, "global_step": 433418, "epoch": 2579} {"train_loss": -12.068814277648926, "global_step": 433419, "epoch": 2579} {"train_loss": -10.864442825317383, "global_step": 433420, "epoch": 2579} {"train_loss": -12.337831497192383, "global_step": 433421, "epoch": 2579} {"train_loss": -12.139046669006348, "global_step": 433422, "epoch": 2579} {"train_loss": -11.182026863098145, "global_step": 433423, "epoch": 2579} {"train_loss": -10.979789733886719, "global_step": 433424, "epoch": 2579} {"train_loss": -11.46765422821045, "global_step": 433425, "epoch": 2579} {"train_loss": -9.923484802246094, "global_step": 433426, "epoch": 2579} {"train_loss": -10.991098403930664, "global_step": 433427, "epoch": 2579} {"train_loss": -10.508301734924316, "global_step": 433428, "epoch": 2579} {"train_loss": -11.23890495300293, "global_step": 433429, "epoch": 2579} {"train_loss": -9.964737892150879, "global_step": 433430, "epoch": 2579} {"train_loss": -9.790212631225586, "global_step": 433431, "epoch": 2579} {"train_loss": -11.248014450073242, "global_step": 433432, "epoch": 2579} {"train_loss": -10.720176696777344, "global_step": 433433, "epoch": 2579} {"train_loss": -10.706188201904297, "global_step": 433434, "epoch": 2579} {"train_loss": -11.527623176574707, "global_step": 433435, "epoch": 2579} {"train_loss": -11.249103546142578, "global_step": 433436, "epoch": 2579} {"train_loss": -11.558967590332031, "global_step": 433437, "epoch": 2579} {"train_loss": -11.800882339477539, "global_step": 433438, "epoch": 2579} {"train_loss": -11.867259743667784, "global_step": 433439, "epoch": 2579, "val_loss": 306827.78125} {"train_loss": -12.038515090942383, "global_step": 433440, "epoch": 2580} {"train_loss": -11.331172943115234, "global_step": 433441, "epoch": 2580} {"train_loss": -11.773954391479492, "global_step": 433442, "epoch": 2580} {"train_loss": -11.945234298706055, "global_step": 433443, "epoch": 2580} {"train_loss": -11.661527633666992, "global_step": 433444, "epoch": 2580} {"train_loss": -11.854645729064941, "global_step": 433445, "epoch": 2580} {"train_loss": -11.613966941833496, "global_step": 433446, "epoch": 2580} {"train_loss": -11.677669525146484, "global_step": 433447, "epoch": 2580} {"train_loss": -11.578222274780273, "global_step": 433448, "epoch": 2580} {"train_loss": -11.812653541564941, "global_step": 433449, "epoch": 2580} {"train_loss": -11.650016784667969, "global_step": 433450, "epoch": 2580} {"train_loss": -11.67318344116211, "global_step": 433451, "epoch": 2580} {"train_loss": -11.966530799865723, "global_step": 433452, "epoch": 2580} {"train_loss": -11.381632804870605, "global_step": 433453, "epoch": 2580} {"train_loss": -12.260029792785645, "global_step": 433454, "epoch": 2580} {"train_loss": -10.984477996826172, "global_step": 433455, "epoch": 2580} {"train_loss": -11.721986770629883, "global_step": 433456, "epoch": 2580} {"train_loss": -11.76173210144043, "global_step": 433457, "epoch": 2580} {"train_loss": -12.112180709838867, "global_step": 433458, "epoch": 2580} {"train_loss": -11.474325180053711, "global_step": 433459, "epoch": 2580} {"train_loss": -12.183109283447266, "global_step": 433460, "epoch": 2580} {"train_loss": -11.596277236938477, "global_step": 433461, "epoch": 2580} {"train_loss": -12.023338317871094, "global_step": 433462, "epoch": 2580} {"train_loss": -11.985794067382812, "global_step": 433463, "epoch": 2580} {"train_loss": -12.068649291992188, "global_step": 433464, "epoch": 2580} {"train_loss": -12.304804801940918, "global_step": 433465, "epoch": 2580} {"train_loss": -12.027976036071777, "global_step": 433466, "epoch": 2580} {"train_loss": -11.924413681030273, "global_step": 433467, "epoch": 2580} {"train_loss": -12.290267944335938, "global_step": 433468, "epoch": 2580} {"train_loss": -12.259562492370605, "global_step": 433469, "epoch": 2580} {"train_loss": -12.012872695922852, "global_step": 433470, "epoch": 2580} {"train_loss": -12.23785400390625, "global_step": 433471, "epoch": 2580} {"train_loss": -12.356878280639648, "global_step": 433472, "epoch": 2580} {"train_loss": -12.206342697143555, "global_step": 433473, "epoch": 2580} {"train_loss": -11.843603134155273, "global_step": 433474, "epoch": 2580} {"train_loss": -11.913728713989258, "global_step": 433475, "epoch": 2580} {"train_loss": -12.269559860229492, "global_step": 433476, "epoch": 2580} {"train_loss": -12.118650436401367, "global_step": 433477, "epoch": 2580} {"train_loss": -12.376508712768555, "global_step": 433478, "epoch": 2580} {"train_loss": -12.205093383789062, "global_step": 433479, "epoch": 2580} {"train_loss": -12.270820617675781, "global_step": 433480, "epoch": 2580} {"train_loss": -12.101181030273438, "global_step": 433481, "epoch": 2580} {"train_loss": -12.220390319824219, "global_step": 433482, "epoch": 2580} {"train_loss": -12.149567604064941, "global_step": 433483, "epoch": 2580} {"train_loss": -12.064765930175781, "global_step": 433484, "epoch": 2580} {"train_loss": -12.120932579040527, "global_step": 433485, "epoch": 2580} {"train_loss": -11.982934951782227, "global_step": 433486, "epoch": 2580} {"train_loss": -12.080037117004395, "global_step": 433487, "epoch": 2580} {"train_loss": -12.354727745056152, "global_step": 433488, "epoch": 2580} {"train_loss": -12.35727310180664, "global_step": 433489, "epoch": 2580} {"train_loss": -12.160419464111328, "global_step": 433490, "epoch": 2580} {"train_loss": -12.2950439453125, "global_step": 433491, "epoch": 2580} {"train_loss": -12.009571075439453, "global_step": 433492, "epoch": 2580} {"train_loss": -12.35370922088623, "global_step": 433493, "epoch": 2580} {"train_loss": -12.153369903564453, "global_step": 433494, "epoch": 2580} {"train_loss": -12.28190803527832, "global_step": 433495, "epoch": 2580} {"train_loss": -12.553482055664062, "global_step": 433496, "epoch": 2580} {"train_loss": -12.269527435302734, "global_step": 433497, "epoch": 2580} {"train_loss": -12.197233200073242, "global_step": 433498, "epoch": 2580} {"train_loss": -12.607873916625977, "global_step": 433499, "epoch": 2580} {"train_loss": -12.284259796142578, "global_step": 433500, "epoch": 2580} {"train_loss": -12.477689743041992, "global_step": 433501, "epoch": 2580} {"train_loss": -12.377741813659668, "global_step": 433502, "epoch": 2580} {"train_loss": -12.554723739624023, "global_step": 433503, "epoch": 2580} {"train_loss": -11.908740043640137, "global_step": 433504, "epoch": 2580} {"train_loss": -12.492585182189941, "global_step": 433505, "epoch": 2580} {"train_loss": -12.044279098510742, "global_step": 433506, "epoch": 2580} {"train_loss": -12.292238235473633, "global_step": 433507, "epoch": 2580} {"train_loss": -11.879742622375488, "global_step": 433508, "epoch": 2580} {"train_loss": -12.293449401855469, "global_step": 433509, "epoch": 2580} {"train_loss": -12.000057220458984, "global_step": 433510, "epoch": 2580} {"train_loss": -12.432880401611328, "global_step": 433511, "epoch": 2580} {"train_loss": -12.011929512023926, "global_step": 433512, "epoch": 2580} {"train_loss": -12.319961547851562, "global_step": 433513, "epoch": 2580} {"train_loss": -12.26411247253418, "global_step": 433514, "epoch": 2580} {"train_loss": -12.165913581848145, "global_step": 433515, "epoch": 2580} {"train_loss": -12.337507247924805, "global_step": 433516, "epoch": 2580} {"train_loss": -12.285594940185547, "global_step": 433517, "epoch": 2580} {"train_loss": -12.477548599243164, "global_step": 433518, "epoch": 2580} {"train_loss": -12.45217514038086, "global_step": 433519, "epoch": 2580} {"train_loss": -12.131593704223633, "global_step": 433520, "epoch": 2580} {"train_loss": -12.334067344665527, "global_step": 433521, "epoch": 2580} {"train_loss": -12.643715858459473, "global_step": 433522, "epoch": 2580} {"train_loss": -12.248226165771484, "global_step": 433523, "epoch": 2580} {"train_loss": -12.545537948608398, "global_step": 433524, "epoch": 2580} {"train_loss": -12.567455291748047, "global_step": 433525, "epoch": 2580} {"train_loss": -12.391852378845215, "global_step": 433526, "epoch": 2580} {"train_loss": -12.430389404296875, "global_step": 433527, "epoch": 2580} {"train_loss": -12.265315055847168, "global_step": 433528, "epoch": 2580} {"train_loss": -12.665682792663574, "global_step": 433529, "epoch": 2580} {"train_loss": -12.628520965576172, "global_step": 433530, "epoch": 2580} {"train_loss": -12.265132904052734, "global_step": 433531, "epoch": 2580} {"train_loss": -12.445597648620605, "global_step": 433532, "epoch": 2580} {"train_loss": -12.499022483825684, "global_step": 433533, "epoch": 2580} {"train_loss": -12.399446487426758, "global_step": 433534, "epoch": 2580} {"train_loss": -12.283660888671875, "global_step": 433535, "epoch": 2580} {"train_loss": -12.401538848876953, "global_step": 433536, "epoch": 2580} {"train_loss": -12.321001052856445, "global_step": 433537, "epoch": 2580} {"train_loss": -12.103657722473145, "global_step": 433538, "epoch": 2580} {"train_loss": -12.11385440826416, "global_step": 433539, "epoch": 2580} {"train_loss": -11.7969970703125, "global_step": 433540, "epoch": 2580} {"train_loss": -12.63452434539795, "global_step": 433541, "epoch": 2580} {"train_loss": -11.841577529907227, "global_step": 433542, "epoch": 2580} {"train_loss": -12.385592460632324, "global_step": 433543, "epoch": 2580} {"train_loss": -11.798101425170898, "global_step": 433544, "epoch": 2580} {"train_loss": -12.376516342163086, "global_step": 433545, "epoch": 2580} {"train_loss": -11.722284317016602, "global_step": 433546, "epoch": 2580} {"train_loss": -12.40536117553711, "global_step": 433547, "epoch": 2580} {"train_loss": -12.063840866088867, "global_step": 433548, "epoch": 2580} {"train_loss": -12.360734939575195, "global_step": 433549, "epoch": 2580} {"train_loss": -11.526325225830078, "global_step": 433550, "epoch": 2580} {"train_loss": -12.432672500610352, "global_step": 433551, "epoch": 2580} {"train_loss": -12.116316795349121, "global_step": 433552, "epoch": 2580} {"train_loss": -12.15959358215332, "global_step": 433553, "epoch": 2580} {"train_loss": -12.190069198608398, "global_step": 433554, "epoch": 2580} {"train_loss": -12.181317329406738, "global_step": 433555, "epoch": 2580} {"train_loss": -12.293716430664062, "global_step": 433556, "epoch": 2580} {"train_loss": -12.413818359375, "global_step": 433557, "epoch": 2580} {"train_loss": -12.200262069702148, "global_step": 433558, "epoch": 2580} {"train_loss": -12.503055572509766, "global_step": 433559, "epoch": 2580} {"train_loss": -12.664022445678711, "global_step": 433560, "epoch": 2580} {"train_loss": -12.117607116699219, "global_step": 433561, "epoch": 2580} {"train_loss": -11.925725936889648, "global_step": 433562, "epoch": 2580} {"train_loss": -12.526482582092285, "global_step": 433563, "epoch": 2580} {"train_loss": -12.447059631347656, "global_step": 433564, "epoch": 2580} {"train_loss": -11.729328155517578, "global_step": 433565, "epoch": 2580} {"train_loss": -12.071676254272461, "global_step": 433566, "epoch": 2580} {"train_loss": -12.744714736938477, "global_step": 433567, "epoch": 2580} {"train_loss": -12.088497161865234, "global_step": 433568, "epoch": 2580} {"train_loss": -11.802352905273438, "global_step": 433569, "epoch": 2580} {"train_loss": -12.199701309204102, "global_step": 433570, "epoch": 2580} {"train_loss": -11.914888381958008, "global_step": 433571, "epoch": 2580} {"train_loss": -12.730640411376953, "global_step": 433572, "epoch": 2580} {"train_loss": -11.936458587646484, "global_step": 433573, "epoch": 2580} {"train_loss": -12.30664348602295, "global_step": 433574, "epoch": 2580} {"train_loss": -11.982906341552734, "global_step": 433575, "epoch": 2580} {"train_loss": -12.026232719421387, "global_step": 433576, "epoch": 2580} {"train_loss": -11.685792922973633, "global_step": 433577, "epoch": 2580} {"train_loss": -12.787919998168945, "global_step": 433578, "epoch": 2580} {"train_loss": -11.331066131591797, "global_step": 433579, "epoch": 2580} {"train_loss": -12.329495429992676, "global_step": 433580, "epoch": 2580} {"train_loss": -12.306791305541992, "global_step": 433581, "epoch": 2580} {"train_loss": -11.805212020874023, "global_step": 433582, "epoch": 2580} {"train_loss": -12.204872131347656, "global_step": 433583, "epoch": 2580} {"train_loss": -12.562360763549805, "global_step": 433584, "epoch": 2580} {"train_loss": -12.663652420043945, "global_step": 433585, "epoch": 2580} {"train_loss": -12.478757858276367, "global_step": 433586, "epoch": 2580} {"train_loss": -12.344317436218262, "global_step": 433587, "epoch": 2580} {"train_loss": -12.015562057495117, "global_step": 433588, "epoch": 2580} {"train_loss": -12.282883644104004, "global_step": 433589, "epoch": 2580} {"train_loss": -11.874679565429688, "global_step": 433590, "epoch": 2580} {"train_loss": -11.045275688171387, "global_step": 433591, "epoch": 2580} {"train_loss": -11.579998016357422, "global_step": 433592, "epoch": 2580} {"train_loss": -10.502561569213867, "global_step": 433593, "epoch": 2580} {"train_loss": -12.349359512329102, "global_step": 433594, "epoch": 2580} {"train_loss": -10.131187438964844, "global_step": 433595, "epoch": 2580} {"train_loss": -11.263822555541992, "global_step": 433596, "epoch": 2580} {"train_loss": -11.23640251159668, "global_step": 433597, "epoch": 2580} {"train_loss": -10.759393692016602, "global_step": 433598, "epoch": 2580} {"train_loss": -11.399911880493164, "global_step": 433599, "epoch": 2580} {"train_loss": -12.032255172729492, "global_step": 433600, "epoch": 2580} {"train_loss": -11.07016372680664, "global_step": 433601, "epoch": 2580} {"train_loss": -11.83802604675293, "global_step": 433602, "epoch": 2580} {"train_loss": -11.259180068969727, "global_step": 433603, "epoch": 2580} {"train_loss": -10.427019119262695, "global_step": 433604, "epoch": 2580} {"train_loss": -12.272773742675781, "global_step": 433605, "epoch": 2580} {"train_loss": -11.256678581237793, "global_step": 433606, "epoch": 2580} {"train_loss": -12.07047404561724, "global_step": 433607, "epoch": 2580, "val_loss": 310311.5, "train_action_mse_error": 1.5356849431991577} {"train_loss": -11.029435157775879, "global_step": 433608, "epoch": 2581} {"train_loss": -11.214967727661133, "global_step": 433609, "epoch": 2581} {"train_loss": -11.311087608337402, "global_step": 433610, "epoch": 2581} {"train_loss": -11.452905654907227, "global_step": 433611, "epoch": 2581} {"train_loss": -12.166505813598633, "global_step": 433612, "epoch": 2581} {"train_loss": -11.774885177612305, "global_step": 433613, "epoch": 2581} {"train_loss": -11.789106369018555, "global_step": 433614, "epoch": 2581} {"train_loss": -11.629422187805176, "global_step": 433615, "epoch": 2581} {"train_loss": -11.154619216918945, "global_step": 433616, "epoch": 2581} {"train_loss": -10.962865829467773, "global_step": 433617, "epoch": 2581} {"train_loss": -11.832721710205078, "global_step": 433618, "epoch": 2581} {"train_loss": -11.44018268585205, "global_step": 433619, "epoch": 2581} {"train_loss": -12.024425506591797, "global_step": 433620, "epoch": 2581} {"train_loss": -12.225099563598633, "global_step": 433621, "epoch": 2581} {"train_loss": -12.035051345825195, "global_step": 433622, "epoch": 2581} {"train_loss": -12.010318756103516, "global_step": 433623, "epoch": 2581} {"train_loss": -12.164777755737305, "global_step": 433624, "epoch": 2581} {"train_loss": -11.849571228027344, "global_step": 433625, "epoch": 2581} {"train_loss": -12.201753616333008, "global_step": 433626, "epoch": 2581} {"train_loss": -12.249463081359863, "global_step": 433627, "epoch": 2581} {"train_loss": -12.05152416229248, "global_step": 433628, "epoch": 2581} {"train_loss": -12.51741886138916, "global_step": 433629, "epoch": 2581} {"train_loss": -12.488571166992188, "global_step": 433630, "epoch": 2581} {"train_loss": -12.345813751220703, "global_step": 433631, "epoch": 2581} {"train_loss": -12.375295639038086, "global_step": 433632, "epoch": 2581} {"train_loss": -12.60568904876709, "global_step": 433633, "epoch": 2581} {"train_loss": -12.307472229003906, "global_step": 433634, "epoch": 2581} {"train_loss": -12.296546936035156, "global_step": 433635, "epoch": 2581} {"train_loss": -12.395153999328613, "global_step": 433636, "epoch": 2581} {"train_loss": -12.680126190185547, "global_step": 433637, "epoch": 2581} {"train_loss": -12.477519989013672, "global_step": 433638, "epoch": 2581} {"train_loss": -12.341350555419922, "global_step": 433639, "epoch": 2581} {"train_loss": -12.40280818939209, "global_step": 433640, "epoch": 2581} {"train_loss": -12.401266098022461, "global_step": 433641, "epoch": 2581} {"train_loss": -12.63703441619873, "global_step": 433642, "epoch": 2581} {"train_loss": -12.482337951660156, "global_step": 433643, "epoch": 2581} {"train_loss": -12.52696418762207, "global_step": 433644, "epoch": 2581} {"train_loss": -12.437992095947266, "global_step": 433645, "epoch": 2581} {"train_loss": -12.594012260437012, "global_step": 433646, "epoch": 2581} {"train_loss": -12.479013442993164, "global_step": 433647, "epoch": 2581} {"train_loss": -12.449199676513672, "global_step": 433648, "epoch": 2581} {"train_loss": -12.449758529663086, "global_step": 433649, "epoch": 2581} {"train_loss": -12.238430976867676, "global_step": 433650, "epoch": 2581} {"train_loss": -12.626448631286621, "global_step": 433651, "epoch": 2581} {"train_loss": -12.385551452636719, "global_step": 433652, "epoch": 2581} {"train_loss": -12.607342720031738, "global_step": 433653, "epoch": 2581} {"train_loss": -12.323588371276855, "global_step": 433654, "epoch": 2581} {"train_loss": -12.548149108886719, "global_step": 433655, "epoch": 2581} {"train_loss": -12.121933937072754, "global_step": 433656, "epoch": 2581} {"train_loss": -12.42992877960205, "global_step": 433657, "epoch": 2581} {"train_loss": -12.79675579071045, "global_step": 433658, "epoch": 2581} {"train_loss": -12.294204711914062, "global_step": 433659, "epoch": 2581} {"train_loss": -12.132803916931152, "global_step": 433660, "epoch": 2581} {"train_loss": -12.615375518798828, "global_step": 433661, "epoch": 2581} {"train_loss": -12.66453742980957, "global_step": 433662, "epoch": 2581} {"train_loss": -12.528768539428711, "global_step": 433663, "epoch": 2581} {"train_loss": -12.50507640838623, "global_step": 433664, "epoch": 2581} {"train_loss": -12.43545150756836, "global_step": 433665, "epoch": 2581} {"train_loss": -12.617986679077148, "global_step": 433666, "epoch": 2581} {"train_loss": -12.609901428222656, "global_step": 433667, "epoch": 2581} {"train_loss": -12.5684814453125, "global_step": 433668, "epoch": 2581} {"train_loss": -12.317819595336914, "global_step": 433669, "epoch": 2581} {"train_loss": -12.674039840698242, "global_step": 433670, "epoch": 2581} {"train_loss": -12.61803150177002, "global_step": 433671, "epoch": 2581} {"train_loss": -12.405233383178711, "global_step": 433672, "epoch": 2581} {"train_loss": -12.439385414123535, "global_step": 433673, "epoch": 2581} {"train_loss": -12.64881706237793, "global_step": 433674, "epoch": 2581} {"train_loss": -12.828246116638184, "global_step": 433675, "epoch": 2581} {"train_loss": -12.70876693725586, "global_step": 433676, "epoch": 2581} {"train_loss": -12.624603271484375, "global_step": 433677, "epoch": 2581} {"train_loss": -12.586051940917969, "global_step": 433678, "epoch": 2581} {"train_loss": -12.884088516235352, "global_step": 433679, "epoch": 2581} {"train_loss": -12.795597076416016, "global_step": 433680, "epoch": 2581} {"train_loss": -12.709589004516602, "global_step": 433681, "epoch": 2581} {"train_loss": -12.600711822509766, "global_step": 433682, "epoch": 2581} {"train_loss": -12.663385391235352, "global_step": 433683, "epoch": 2581} {"train_loss": -12.724384307861328, "global_step": 433684, "epoch": 2581} {"train_loss": -12.435784339904785, "global_step": 433685, "epoch": 2581} {"train_loss": -12.682979583740234, "global_step": 433686, "epoch": 2581} {"train_loss": -12.040596008300781, "global_step": 433687, "epoch": 2581} {"train_loss": -12.128151893615723, "global_step": 433688, "epoch": 2581} {"train_loss": -12.706878662109375, "global_step": 433689, "epoch": 2581} {"train_loss": -12.575709342956543, "global_step": 433690, "epoch": 2581} {"train_loss": -12.574186325073242, "global_step": 433691, "epoch": 2581} {"train_loss": -12.494608879089355, "global_step": 433692, "epoch": 2581} {"train_loss": -12.040639877319336, "global_step": 433693, "epoch": 2581} {"train_loss": -12.48475170135498, "global_step": 433694, "epoch": 2581} {"train_loss": -11.828084945678711, "global_step": 433695, "epoch": 2581} {"train_loss": -10.897830963134766, "global_step": 433696, "epoch": 2581} {"train_loss": -11.243413925170898, "global_step": 433697, "epoch": 2581} {"train_loss": -12.398597717285156, "global_step": 433698, "epoch": 2581} {"train_loss": -10.228706359863281, "global_step": 433699, "epoch": 2581} {"train_loss": -12.245458602905273, "global_step": 433700, "epoch": 2581} {"train_loss": -10.332674026489258, "global_step": 433701, "epoch": 2581} {"train_loss": -10.813426971435547, "global_step": 433702, "epoch": 2581} {"train_loss": -11.95089054107666, "global_step": 433703, "epoch": 2581} {"train_loss": -11.176968574523926, "global_step": 433704, "epoch": 2581} {"train_loss": -12.16348934173584, "global_step": 433705, "epoch": 2581} {"train_loss": -10.866826057434082, "global_step": 433706, "epoch": 2581} {"train_loss": -12.713247299194336, "global_step": 433707, "epoch": 2581} {"train_loss": -10.847347259521484, "global_step": 433708, "epoch": 2581} {"train_loss": -12.702066421508789, "global_step": 433709, "epoch": 2581} {"train_loss": -11.471335411071777, "global_step": 433710, "epoch": 2581} {"train_loss": -11.810020446777344, "global_step": 433711, "epoch": 2581} {"train_loss": -11.603739738464355, "global_step": 433712, "epoch": 2581} {"train_loss": -12.348176002502441, "global_step": 433713, "epoch": 2581} {"train_loss": -12.107534408569336, "global_step": 433714, "epoch": 2581} {"train_loss": -11.594465255737305, "global_step": 433715, "epoch": 2581} {"train_loss": -11.816213607788086, "global_step": 433716, "epoch": 2581} {"train_loss": -10.621048927307129, "global_step": 433717, "epoch": 2581} {"train_loss": -11.586711883544922, "global_step": 433718, "epoch": 2581} {"train_loss": -11.012313842773438, "global_step": 433719, "epoch": 2581} {"train_loss": -10.63332462310791, "global_step": 433720, "epoch": 2581} {"train_loss": -10.213499069213867, "global_step": 433721, "epoch": 2581} {"train_loss": -10.338432312011719, "global_step": 433722, "epoch": 2581} {"train_loss": -11.881373405456543, "global_step": 433723, "epoch": 2581} {"train_loss": -10.725984573364258, "global_step": 433724, "epoch": 2581} {"train_loss": -12.255308151245117, "global_step": 433725, "epoch": 2581} {"train_loss": -10.372221946716309, "global_step": 433726, "epoch": 2581} {"train_loss": -11.812996864318848, "global_step": 433727, "epoch": 2581} {"train_loss": -10.732650756835938, "global_step": 433728, "epoch": 2581} {"train_loss": -12.215346336364746, "global_step": 433729, "epoch": 2581} {"train_loss": -10.57471752166748, "global_step": 433730, "epoch": 2581} {"train_loss": -12.120100021362305, "global_step": 433731, "epoch": 2581} {"train_loss": -11.471208572387695, "global_step": 433732, "epoch": 2581} {"train_loss": -11.653125762939453, "global_step": 433733, "epoch": 2581} {"train_loss": -12.058034896850586, "global_step": 433734, "epoch": 2581} {"train_loss": -11.482616424560547, "global_step": 433735, "epoch": 2581} {"train_loss": -12.136920928955078, "global_step": 433736, "epoch": 2581} {"train_loss": -11.316082000732422, "global_step": 433737, "epoch": 2581} {"train_loss": -11.984631538391113, "global_step": 433738, "epoch": 2581} {"train_loss": -11.556467056274414, "global_step": 433739, "epoch": 2581} {"train_loss": -11.553279876708984, "global_step": 433740, "epoch": 2581} {"train_loss": -11.819437026977539, "global_step": 433741, "epoch": 2581} {"train_loss": -11.518815994262695, "global_step": 433742, "epoch": 2581} {"train_loss": -12.311866760253906, "global_step": 433743, "epoch": 2581} {"train_loss": -11.535199165344238, "global_step": 433744, "epoch": 2581} {"train_loss": -11.702301025390625, "global_step": 433745, "epoch": 2581} {"train_loss": -11.779827117919922, "global_step": 433746, "epoch": 2581} {"train_loss": -11.931633949279785, "global_step": 433747, "epoch": 2581} {"train_loss": -12.12043571472168, "global_step": 433748, "epoch": 2581} {"train_loss": -12.271121978759766, "global_step": 433749, "epoch": 2581} {"train_loss": -11.895503044128418, "global_step": 433750, "epoch": 2581} {"train_loss": -11.894623756408691, "global_step": 433751, "epoch": 2581} {"train_loss": -11.895671844482422, "global_step": 433752, "epoch": 2581} {"train_loss": -12.112936973571777, "global_step": 433753, "epoch": 2581} {"train_loss": -11.459041595458984, "global_step": 433754, "epoch": 2581} {"train_loss": -12.129715919494629, "global_step": 433755, "epoch": 2581} {"train_loss": -11.839576721191406, "global_step": 433756, "epoch": 2581} {"train_loss": -11.723567962646484, "global_step": 433757, "epoch": 2581} {"train_loss": -12.113306999206543, "global_step": 433758, "epoch": 2581} {"train_loss": -11.773530960083008, "global_step": 433759, "epoch": 2581} {"train_loss": -11.921530723571777, "global_step": 433760, "epoch": 2581} {"train_loss": -12.243181228637695, "global_step": 433761, "epoch": 2581} {"train_loss": -11.749530792236328, "global_step": 433762, "epoch": 2581} {"train_loss": -12.169881820678711, "global_step": 433763, "epoch": 2581} {"train_loss": -12.103586196899414, "global_step": 433764, "epoch": 2581} {"train_loss": -11.733514785766602, "global_step": 433765, "epoch": 2581} {"train_loss": -12.085672378540039, "global_step": 433766, "epoch": 2581} {"train_loss": -11.998037338256836, "global_step": 433767, "epoch": 2581} {"train_loss": -12.186883926391602, "global_step": 433768, "epoch": 2581} {"train_loss": -11.684697151184082, "global_step": 433769, "epoch": 2581} {"train_loss": -12.118378639221191, "global_step": 433770, "epoch": 2581} {"train_loss": -11.718629837036133, "global_step": 433771, "epoch": 2581} {"train_loss": -12.381528854370117, "global_step": 433772, "epoch": 2581} {"train_loss": -12.290191650390625, "global_step": 433773, "epoch": 2581} {"train_loss": -11.844636917114258, "global_step": 433774, "epoch": 2581} {"train_loss": -12.010186240786599, "global_step": 433775, "epoch": 2581, "val_loss": 310986.8125} {"train_loss": -11.649579048156738, "global_step": 433776, "epoch": 2582} {"train_loss": -12.14548397064209, "global_step": 433777, "epoch": 2582} {"train_loss": -11.880741119384766, "global_step": 433778, "epoch": 2582} {"train_loss": -12.150016784667969, "global_step": 433779, "epoch": 2582} {"train_loss": -12.063943862915039, "global_step": 433780, "epoch": 2582} {"train_loss": -11.85924243927002, "global_step": 433781, "epoch": 2582} {"train_loss": -12.055074691772461, "global_step": 433782, "epoch": 2582} {"train_loss": -11.93728256225586, "global_step": 433783, "epoch": 2582} {"train_loss": -11.836020469665527, "global_step": 433784, "epoch": 2582} {"train_loss": -11.954418182373047, "global_step": 433785, "epoch": 2582} {"train_loss": -11.09854507446289, "global_step": 433786, "epoch": 2582} {"train_loss": -12.406734466552734, "global_step": 433787, "epoch": 2582} {"train_loss": -11.090719223022461, "global_step": 433788, "epoch": 2582} {"train_loss": -12.163159370422363, "global_step": 433789, "epoch": 2582} {"train_loss": -11.582857131958008, "global_step": 433790, "epoch": 2582} {"train_loss": -12.04974365234375, "global_step": 433791, "epoch": 2582} {"train_loss": -11.542586326599121, "global_step": 433792, "epoch": 2582} {"train_loss": -12.325767517089844, "global_step": 433793, "epoch": 2582} {"train_loss": -11.412519454956055, "global_step": 433794, "epoch": 2582} {"train_loss": -12.544692993164062, "global_step": 433795, "epoch": 2582} {"train_loss": -11.502894401550293, "global_step": 433796, "epoch": 2582} {"train_loss": -12.217379570007324, "global_step": 433797, "epoch": 2582} {"train_loss": -12.084417343139648, "global_step": 433798, "epoch": 2582} {"train_loss": -12.374430656433105, "global_step": 433799, "epoch": 2582} {"train_loss": -12.279773712158203, "global_step": 433800, "epoch": 2582} {"train_loss": -12.116039276123047, "global_step": 433801, "epoch": 2582} {"train_loss": -12.158924102783203, "global_step": 433802, "epoch": 2582} {"train_loss": -12.488595962524414, "global_step": 433803, "epoch": 2582} {"train_loss": -12.263711929321289, "global_step": 433804, "epoch": 2582} {"train_loss": -12.583257675170898, "global_step": 433805, "epoch": 2582} {"train_loss": -12.311702728271484, "global_step": 433806, "epoch": 2582} {"train_loss": -12.525585174560547, "global_step": 433807, "epoch": 2582} {"train_loss": -12.217214584350586, "global_step": 433808, "epoch": 2582} {"train_loss": -12.490772247314453, "global_step": 433809, "epoch": 2582} {"train_loss": -12.4570894241333, "global_step": 433810, "epoch": 2582} {"train_loss": -12.578869819641113, "global_step": 433811, "epoch": 2582} {"train_loss": -12.540459632873535, "global_step": 433812, "epoch": 2582} {"train_loss": -12.470797538757324, "global_step": 433813, "epoch": 2582} {"train_loss": -12.49075984954834, "global_step": 433814, "epoch": 2582} {"train_loss": -12.58597183227539, "global_step": 433815, "epoch": 2582} {"train_loss": -12.308160781860352, "global_step": 433816, "epoch": 2582} {"train_loss": -12.420907974243164, "global_step": 433817, "epoch": 2582} {"train_loss": -12.47213363647461, "global_step": 433818, "epoch": 2582} {"train_loss": -12.523962020874023, "global_step": 433819, "epoch": 2582} {"train_loss": -12.692427635192871, "global_step": 433820, "epoch": 2582} {"train_loss": -12.470014572143555, "global_step": 433821, "epoch": 2582} {"train_loss": -12.58067512512207, "global_step": 433822, "epoch": 2582} {"train_loss": -12.563091278076172, "global_step": 433823, "epoch": 2582} {"train_loss": -12.629409790039062, "global_step": 433824, "epoch": 2582} {"train_loss": -12.387931823730469, "global_step": 433825, "epoch": 2582} {"train_loss": -12.75346565246582, "global_step": 433826, "epoch": 2582} {"train_loss": -12.496835708618164, "global_step": 433827, "epoch": 2582} {"train_loss": -12.778191566467285, "global_step": 433828, "epoch": 2582} {"train_loss": -12.950441360473633, "global_step": 433829, "epoch": 2582} {"train_loss": -12.790628433227539, "global_step": 433830, "epoch": 2582} {"train_loss": -12.652103424072266, "global_step": 433831, "epoch": 2582} {"train_loss": -12.640275955200195, "global_step": 433832, "epoch": 2582} {"train_loss": -12.892040252685547, "global_step": 433833, "epoch": 2582} {"train_loss": -12.420916557312012, "global_step": 433834, "epoch": 2582} {"train_loss": -12.732324600219727, "global_step": 433835, "epoch": 2582} {"train_loss": -12.512130737304688, "global_step": 433836, "epoch": 2582} {"train_loss": -12.635220527648926, "global_step": 433837, "epoch": 2582} {"train_loss": -12.600997924804688, "global_step": 433838, "epoch": 2582} {"train_loss": -12.578642845153809, "global_step": 433839, "epoch": 2582} {"train_loss": -12.605886459350586, "global_step": 433840, "epoch": 2582} {"train_loss": -12.591437339782715, "global_step": 433841, "epoch": 2582} {"train_loss": -12.687216758728027, "global_step": 433842, "epoch": 2582} {"train_loss": -12.180959701538086, "global_step": 433843, "epoch": 2582} {"train_loss": -12.019794464111328, "global_step": 433844, "epoch": 2582} {"train_loss": -11.941713333129883, "global_step": 433845, "epoch": 2582} {"train_loss": -11.920591354370117, "global_step": 433846, "epoch": 2582} {"train_loss": -11.268404006958008, "global_step": 433847, "epoch": 2582} {"train_loss": -12.180164337158203, "global_step": 433848, "epoch": 2582} {"train_loss": -12.041111946105957, "global_step": 433849, "epoch": 2582} {"train_loss": -11.840621948242188, "global_step": 433850, "epoch": 2582} {"train_loss": -12.3177490234375, "global_step": 433851, "epoch": 2582} {"train_loss": -11.725648880004883, "global_step": 433852, "epoch": 2582} {"train_loss": -12.420587539672852, "global_step": 433853, "epoch": 2582} {"train_loss": -11.938419342041016, "global_step": 433854, "epoch": 2582} {"train_loss": -11.58078384399414, "global_step": 433855, "epoch": 2582} {"train_loss": -11.425646781921387, "global_step": 433856, "epoch": 2582} {"train_loss": -11.371124267578125, "global_step": 433857, "epoch": 2582} {"train_loss": -11.283242225646973, "global_step": 433858, "epoch": 2582} {"train_loss": -10.680405616760254, "global_step": 433859, "epoch": 2582} {"train_loss": -11.519519805908203, "global_step": 433860, "epoch": 2582} {"train_loss": -10.717966079711914, "global_step": 433861, "epoch": 2582} {"train_loss": -9.778450965881348, "global_step": 433862, "epoch": 2582} {"train_loss": -11.378963470458984, "global_step": 433863, "epoch": 2582} {"train_loss": -9.882251739501953, "global_step": 433864, "epoch": 2582} {"train_loss": -11.26723861694336, "global_step": 433865, "epoch": 2582} {"train_loss": -11.520770072937012, "global_step": 433866, "epoch": 2582} {"train_loss": -11.309954643249512, "global_step": 433867, "epoch": 2582} {"train_loss": -11.98398208618164, "global_step": 433868, "epoch": 2582} {"train_loss": -10.707225799560547, "global_step": 433869, "epoch": 2582} {"train_loss": -11.695718765258789, "global_step": 433870, "epoch": 2582} {"train_loss": -11.488605499267578, "global_step": 433871, "epoch": 2582} {"train_loss": -11.857786178588867, "global_step": 433872, "epoch": 2582} {"train_loss": -11.314980506896973, "global_step": 433873, "epoch": 2582} {"train_loss": -11.815760612487793, "global_step": 433874, "epoch": 2582} {"train_loss": -12.080609321594238, "global_step": 433875, "epoch": 2582} {"train_loss": -11.532127380371094, "global_step": 433876, "epoch": 2582} {"train_loss": -12.29269027709961, "global_step": 433877, "epoch": 2582} {"train_loss": -12.035177230834961, "global_step": 433878, "epoch": 2582} {"train_loss": -12.356048583984375, "global_step": 433879, "epoch": 2582} {"train_loss": -12.240983963012695, "global_step": 433880, "epoch": 2582} {"train_loss": -12.272998809814453, "global_step": 433881, "epoch": 2582} {"train_loss": -12.228492736816406, "global_step": 433882, "epoch": 2582} {"train_loss": -12.08951187133789, "global_step": 433883, "epoch": 2582} {"train_loss": -11.550352096557617, "global_step": 433884, "epoch": 2582} {"train_loss": -12.238445281982422, "global_step": 433885, "epoch": 2582} {"train_loss": -11.608552932739258, "global_step": 433886, "epoch": 2582} {"train_loss": -11.892793655395508, "global_step": 433887, "epoch": 2582} {"train_loss": -12.119430541992188, "global_step": 433888, "epoch": 2582} {"train_loss": -12.130599975585938, "global_step": 433889, "epoch": 2582} {"train_loss": -12.343457221984863, "global_step": 433890, "epoch": 2582} {"train_loss": -12.233742713928223, "global_step": 433891, "epoch": 2582} {"train_loss": -12.221651077270508, "global_step": 433892, "epoch": 2582} {"train_loss": -11.946249961853027, "global_step": 433893, "epoch": 2582} {"train_loss": -12.214497566223145, "global_step": 433894, "epoch": 2582} {"train_loss": -11.970866203308105, "global_step": 433895, "epoch": 2582} {"train_loss": -12.093950271606445, "global_step": 433896, "epoch": 2582} {"train_loss": -12.140213012695312, "global_step": 433897, "epoch": 2582} {"train_loss": -11.921512603759766, "global_step": 433898, "epoch": 2582} {"train_loss": -12.090007781982422, "global_step": 433899, "epoch": 2582} {"train_loss": -12.10207748413086, "global_step": 433900, "epoch": 2582} {"train_loss": -12.259117126464844, "global_step": 433901, "epoch": 2582} {"train_loss": -12.237813949584961, "global_step": 433902, "epoch": 2582} {"train_loss": -11.706332206726074, "global_step": 433903, "epoch": 2582} {"train_loss": -12.037981033325195, "global_step": 433904, "epoch": 2582} {"train_loss": -12.39171314239502, "global_step": 433905, "epoch": 2582} {"train_loss": -12.363906860351562, "global_step": 433906, "epoch": 2582} {"train_loss": -12.012534141540527, "global_step": 433907, "epoch": 2582} {"train_loss": -12.605684280395508, "global_step": 433908, "epoch": 2582} {"train_loss": -12.189841270446777, "global_step": 433909, "epoch": 2582} {"train_loss": -12.551929473876953, "global_step": 433910, "epoch": 2582} {"train_loss": -12.400487899780273, "global_step": 433911, "epoch": 2582} {"train_loss": -12.181432723999023, "global_step": 433912, "epoch": 2582} {"train_loss": -12.227588653564453, "global_step": 433913, "epoch": 2582} {"train_loss": -12.164737701416016, "global_step": 433914, "epoch": 2582} {"train_loss": -12.315377235412598, "global_step": 433915, "epoch": 2582} {"train_loss": -12.444437026977539, "global_step": 433916, "epoch": 2582} {"train_loss": -12.418322563171387, "global_step": 433917, "epoch": 2582} {"train_loss": -12.341448783874512, "global_step": 433918, "epoch": 2582} {"train_loss": -12.689403533935547, "global_step": 433919, "epoch": 2582} {"train_loss": -12.393634796142578, "global_step": 433920, "epoch": 2582} {"train_loss": -12.35209846496582, "global_step": 433921, "epoch": 2582} {"train_loss": -12.35805606842041, "global_step": 433922, "epoch": 2582} {"train_loss": -12.593977928161621, "global_step": 433923, "epoch": 2582} {"train_loss": -12.559829711914062, "global_step": 433924, "epoch": 2582} {"train_loss": -12.762228012084961, "global_step": 433925, "epoch": 2582} {"train_loss": -12.404290199279785, "global_step": 433926, "epoch": 2582} {"train_loss": -12.480567932128906, "global_step": 433927, "epoch": 2582} {"train_loss": -12.690840721130371, "global_step": 433928, "epoch": 2582} {"train_loss": -12.488384246826172, "global_step": 433929, "epoch": 2582} {"train_loss": -12.569454193115234, "global_step": 433930, "epoch": 2582} {"train_loss": -12.765889167785645, "global_step": 433931, "epoch": 2582} {"train_loss": -12.44687271118164, "global_step": 433932, "epoch": 2582} {"train_loss": -12.716019630432129, "global_step": 433933, "epoch": 2582} {"train_loss": -12.594111442565918, "global_step": 433934, "epoch": 2582} {"train_loss": -12.587447166442871, "global_step": 433935, "epoch": 2582} {"train_loss": -12.46044921875, "global_step": 433936, "epoch": 2582} {"train_loss": -12.653658866882324, "global_step": 433937, "epoch": 2582} {"train_loss": -12.497041702270508, "global_step": 433938, "epoch": 2582} {"train_loss": -12.620752334594727, "global_step": 433939, "epoch": 2582} {"train_loss": -12.720699310302734, "global_step": 433940, "epoch": 2582} {"train_loss": -12.324819564819336, "global_step": 433941, "epoch": 2582} {"train_loss": -12.458429336547852, "global_step": 433942, "epoch": 2582} {"train_loss": -12.153563766252427, "global_step": 433943, "epoch": 2582, "val_loss": 309766.25} {"train_loss": -12.03239917755127, "global_step": 433944, "epoch": 2583} {"train_loss": -12.300073623657227, "global_step": 433945, "epoch": 2583} {"train_loss": -12.540121078491211, "global_step": 433946, "epoch": 2583} {"train_loss": -12.011561393737793, "global_step": 433947, "epoch": 2583} {"train_loss": -11.746281623840332, "global_step": 433948, "epoch": 2583} {"train_loss": -11.93351936340332, "global_step": 433949, "epoch": 2583} {"train_loss": -12.24628734588623, "global_step": 433950, "epoch": 2583} {"train_loss": -10.624839782714844, "global_step": 433951, "epoch": 2583} {"train_loss": -12.386430740356445, "global_step": 433952, "epoch": 2583} {"train_loss": -11.752613067626953, "global_step": 433953, "epoch": 2583} {"train_loss": -11.997173309326172, "global_step": 433954, "epoch": 2583} {"train_loss": -12.333322525024414, "global_step": 433955, "epoch": 2583} {"train_loss": -11.32754898071289, "global_step": 433956, "epoch": 2583} {"train_loss": -11.571249008178711, "global_step": 433957, "epoch": 2583} {"train_loss": -12.27293872833252, "global_step": 433958, "epoch": 2583} {"train_loss": -11.51479721069336, "global_step": 433959, "epoch": 2583} {"train_loss": -11.030848503112793, "global_step": 433960, "epoch": 2583} {"train_loss": -12.356010437011719, "global_step": 433961, "epoch": 2583} {"train_loss": -10.299623489379883, "global_step": 433962, "epoch": 2583} {"train_loss": -12.385858535766602, "global_step": 433963, "epoch": 2583} {"train_loss": -11.644842147827148, "global_step": 433964, "epoch": 2583} {"train_loss": -11.236717224121094, "global_step": 433965, "epoch": 2583} {"train_loss": -11.312359809875488, "global_step": 433966, "epoch": 2583} {"train_loss": -10.290136337280273, "global_step": 433967, "epoch": 2583} {"train_loss": -12.425383567810059, "global_step": 433968, "epoch": 2583} {"train_loss": -10.401205062866211, "global_step": 433969, "epoch": 2583} {"train_loss": -11.034878730773926, "global_step": 433970, "epoch": 2583} {"train_loss": -10.442564010620117, "global_step": 433971, "epoch": 2583} {"train_loss": -11.706689834594727, "global_step": 433972, "epoch": 2583} {"train_loss": -10.781469345092773, "global_step": 433973, "epoch": 2583} {"train_loss": -10.434978485107422, "global_step": 433974, "epoch": 2583} {"train_loss": -11.604716300964355, "global_step": 433975, "epoch": 2583} {"train_loss": -10.709096908569336, "global_step": 433976, "epoch": 2583} {"train_loss": -10.937124252319336, "global_step": 433977, "epoch": 2583} {"train_loss": -10.339797973632812, "global_step": 433978, "epoch": 2583} {"train_loss": -12.034177780151367, "global_step": 433979, "epoch": 2583} {"train_loss": -10.771200180053711, "global_step": 433980, "epoch": 2583} {"train_loss": -11.46689224243164, "global_step": 433981, "epoch": 2583} {"train_loss": -12.193666458129883, "global_step": 433982, "epoch": 2583} {"train_loss": -11.638654708862305, "global_step": 433983, "epoch": 2583} {"train_loss": -12.179277420043945, "global_step": 433984, "epoch": 2583} {"train_loss": -11.661789894104004, "global_step": 433985, "epoch": 2583} {"train_loss": -11.806909561157227, "global_step": 433986, "epoch": 2583} {"train_loss": -11.543231964111328, "global_step": 433987, "epoch": 2583} {"train_loss": -12.222773551940918, "global_step": 433988, "epoch": 2583} {"train_loss": -11.726812362670898, "global_step": 433989, "epoch": 2583} {"train_loss": -11.675420761108398, "global_step": 433990, "epoch": 2583} {"train_loss": -11.974043846130371, "global_step": 433991, "epoch": 2583} {"train_loss": -11.756608009338379, "global_step": 433992, "epoch": 2583} {"train_loss": -11.822806358337402, "global_step": 433993, "epoch": 2583} {"train_loss": -11.480713844299316, "global_step": 433994, "epoch": 2583} {"train_loss": -12.268308639526367, "global_step": 433995, "epoch": 2583} {"train_loss": -11.659112930297852, "global_step": 433996, "epoch": 2583} {"train_loss": -12.290047645568848, "global_step": 433997, "epoch": 2583} {"train_loss": -11.953025817871094, "global_step": 433998, "epoch": 2583} {"train_loss": -12.119754791259766, "global_step": 433999, "epoch": 2583} {"train_loss": -11.984397888183594, "global_step": 434000, "epoch": 2583} {"train_loss": -11.911087036132812, "global_step": 434001, "epoch": 2583} {"train_loss": -12.410558700561523, "global_step": 434002, "epoch": 2583} {"train_loss": -11.78236198425293, "global_step": 434003, "epoch": 2583} {"train_loss": -12.301786422729492, "global_step": 434004, "epoch": 2583} {"train_loss": -11.920089721679688, "global_step": 434005, "epoch": 2583} {"train_loss": -12.064238548278809, "global_step": 434006, "epoch": 2583} {"train_loss": -12.139456748962402, "global_step": 434007, "epoch": 2583} {"train_loss": -12.01722526550293, "global_step": 434008, "epoch": 2583} {"train_loss": -12.423064231872559, "global_step": 434009, "epoch": 2583} {"train_loss": -12.132665634155273, "global_step": 434010, "epoch": 2583} {"train_loss": -12.421834945678711, "global_step": 434011, "epoch": 2583} {"train_loss": -12.21251106262207, "global_step": 434012, "epoch": 2583} {"train_loss": -12.193639755249023, "global_step": 434013, "epoch": 2583} {"train_loss": -12.281747817993164, "global_step": 434014, "epoch": 2583} {"train_loss": -12.101938247680664, "global_step": 434015, "epoch": 2583} {"train_loss": -12.41749095916748, "global_step": 434016, "epoch": 2583} {"train_loss": -12.336368560791016, "global_step": 434017, "epoch": 2583} {"train_loss": -12.07242488861084, "global_step": 434018, "epoch": 2583} {"train_loss": -12.212421417236328, "global_step": 434019, "epoch": 2583} {"train_loss": -12.359516143798828, "global_step": 434020, "epoch": 2583} {"train_loss": -12.353073120117188, "global_step": 434021, "epoch": 2583} {"train_loss": -12.384788513183594, "global_step": 434022, "epoch": 2583} {"train_loss": -12.143771171569824, "global_step": 434023, "epoch": 2583} {"train_loss": -12.020548820495605, "global_step": 434024, "epoch": 2583} {"train_loss": -12.12216567993164, "global_step": 434025, "epoch": 2583} {"train_loss": -12.26762866973877, "global_step": 434026, "epoch": 2583} {"train_loss": -12.170570373535156, "global_step": 434027, "epoch": 2583} {"train_loss": -12.496788024902344, "global_step": 434028, "epoch": 2583} {"train_loss": -12.404726028442383, "global_step": 434029, "epoch": 2583} {"train_loss": -12.455230712890625, "global_step": 434030, "epoch": 2583} {"train_loss": -12.306554794311523, "global_step": 434031, "epoch": 2583} {"train_loss": -12.358444213867188, "global_step": 434032, "epoch": 2583} {"train_loss": -12.469572067260742, "global_step": 434033, "epoch": 2583} {"train_loss": -12.470727920532227, "global_step": 434034, "epoch": 2583} {"train_loss": -12.607702255249023, "global_step": 434035, "epoch": 2583} {"train_loss": -12.326972007751465, "global_step": 434036, "epoch": 2583} {"train_loss": -12.297229766845703, "global_step": 434037, "epoch": 2583} {"train_loss": -12.454240798950195, "global_step": 434038, "epoch": 2583} {"train_loss": -12.456840515136719, "global_step": 434039, "epoch": 2583} {"train_loss": -12.325435638427734, "global_step": 434040, "epoch": 2583} {"train_loss": -12.534538269042969, "global_step": 434041, "epoch": 2583} {"train_loss": -12.487852096557617, "global_step": 434042, "epoch": 2583} {"train_loss": -12.619537353515625, "global_step": 434043, "epoch": 2583} {"train_loss": -12.631338119506836, "global_step": 434044, "epoch": 2583} {"train_loss": -12.459855079650879, "global_step": 434045, "epoch": 2583} {"train_loss": -12.658487319946289, "global_step": 434046, "epoch": 2583} {"train_loss": -12.611800193786621, "global_step": 434047, "epoch": 2583} {"train_loss": -12.545930862426758, "global_step": 434048, "epoch": 2583} {"train_loss": -12.792407989501953, "global_step": 434049, "epoch": 2583} {"train_loss": -12.563033103942871, "global_step": 434050, "epoch": 2583} {"train_loss": -12.515810012817383, "global_step": 434051, "epoch": 2583} {"train_loss": -12.560583114624023, "global_step": 434052, "epoch": 2583} {"train_loss": -12.580728530883789, "global_step": 434053, "epoch": 2583} {"train_loss": -12.110566139221191, "global_step": 434054, "epoch": 2583} {"train_loss": -12.815925598144531, "global_step": 434055, "epoch": 2583} {"train_loss": -12.40896224975586, "global_step": 434056, "epoch": 2583} {"train_loss": -12.742595672607422, "global_step": 434057, "epoch": 2583} {"train_loss": -12.73520565032959, "global_step": 434058, "epoch": 2583} {"train_loss": -12.375597953796387, "global_step": 434059, "epoch": 2583} {"train_loss": -12.69581413269043, "global_step": 434060, "epoch": 2583} {"train_loss": -12.276579856872559, "global_step": 434061, "epoch": 2583} {"train_loss": -12.801708221435547, "global_step": 434062, "epoch": 2583} {"train_loss": -12.258671760559082, "global_step": 434063, "epoch": 2583} {"train_loss": -12.202693939208984, "global_step": 434064, "epoch": 2583} {"train_loss": -12.572385787963867, "global_step": 434065, "epoch": 2583} {"train_loss": -12.411380767822266, "global_step": 434066, "epoch": 2583} {"train_loss": -12.684078216552734, "global_step": 434067, "epoch": 2583} {"train_loss": -12.566516876220703, "global_step": 434068, "epoch": 2583} {"train_loss": -12.324514389038086, "global_step": 434069, "epoch": 2583} {"train_loss": -12.767696380615234, "global_step": 434070, "epoch": 2583} {"train_loss": -12.416135787963867, "global_step": 434071, "epoch": 2583} {"train_loss": -11.776715278625488, "global_step": 434072, "epoch": 2583} {"train_loss": -12.705305099487305, "global_step": 434073, "epoch": 2583} {"train_loss": -12.389516830444336, "global_step": 434074, "epoch": 2583} {"train_loss": -12.185100555419922, "global_step": 434075, "epoch": 2583} {"train_loss": -12.609161376953125, "global_step": 434076, "epoch": 2583} {"train_loss": -12.688810348510742, "global_step": 434077, "epoch": 2583} {"train_loss": -12.424674987792969, "global_step": 434078, "epoch": 2583} {"train_loss": -12.288244247436523, "global_step": 434079, "epoch": 2583} {"train_loss": -12.428132057189941, "global_step": 434080, "epoch": 2583} {"train_loss": -12.631948471069336, "global_step": 434081, "epoch": 2583} {"train_loss": -12.498523712158203, "global_step": 434082, "epoch": 2583} {"train_loss": -12.337419509887695, "global_step": 434083, "epoch": 2583} {"train_loss": -12.673236846923828, "global_step": 434084, "epoch": 2583} {"train_loss": -12.062419891357422, "global_step": 434085, "epoch": 2583} {"train_loss": -12.548651695251465, "global_step": 434086, "epoch": 2583} {"train_loss": -12.648017883300781, "global_step": 434087, "epoch": 2583} {"train_loss": -12.492405891418457, "global_step": 434088, "epoch": 2583} {"train_loss": -12.798558235168457, "global_step": 434089, "epoch": 2583} {"train_loss": -12.411681175231934, "global_step": 434090, "epoch": 2583} {"train_loss": -12.065286636352539, "global_step": 434091, "epoch": 2583} {"train_loss": -12.660497665405273, "global_step": 434092, "epoch": 2583} {"train_loss": -12.290111541748047, "global_step": 434093, "epoch": 2583} {"train_loss": -11.693607330322266, "global_step": 434094, "epoch": 2583} {"train_loss": -12.118254661560059, "global_step": 434095, "epoch": 2583} {"train_loss": -12.54925537109375, "global_step": 434096, "epoch": 2583} {"train_loss": -12.424135208129883, "global_step": 434097, "epoch": 2583} {"train_loss": -12.002243995666504, "global_step": 434098, "epoch": 2583} {"train_loss": -12.674783706665039, "global_step": 434099, "epoch": 2583} {"train_loss": -12.427227020263672, "global_step": 434100, "epoch": 2583} {"train_loss": -12.172037124633789, "global_step": 434101, "epoch": 2583} {"train_loss": -12.692193984985352, "global_step": 434102, "epoch": 2583} {"train_loss": -11.754741668701172, "global_step": 434103, "epoch": 2583} {"train_loss": -11.694864273071289, "global_step": 434104, "epoch": 2583} {"train_loss": -12.860532760620117, "global_step": 434105, "epoch": 2583} {"train_loss": -12.109371185302734, "global_step": 434106, "epoch": 2583} {"train_loss": -11.763303756713867, "global_step": 434107, "epoch": 2583} {"train_loss": -11.711816787719727, "global_step": 434108, "epoch": 2583} {"train_loss": -12.47474479675293, "global_step": 434109, "epoch": 2583} {"train_loss": -11.737354278564453, "global_step": 434110, "epoch": 2583} {"train_loss": -12.108702387128558, "global_step": 434111, "epoch": 2583, "val_loss": 309120.1875} {"train_loss": -12.05226993560791, "global_step": 434112, "epoch": 2584} {"train_loss": -11.464648246765137, "global_step": 434113, "epoch": 2584} {"train_loss": -11.372125625610352, "global_step": 434114, "epoch": 2584} {"train_loss": -12.651775360107422, "global_step": 434115, "epoch": 2584} {"train_loss": -11.724187850952148, "global_step": 434116, "epoch": 2584} {"train_loss": -12.184735298156738, "global_step": 434117, "epoch": 2584} {"train_loss": -11.805021286010742, "global_step": 434118, "epoch": 2584} {"train_loss": -12.532583236694336, "global_step": 434119, "epoch": 2584} {"train_loss": -11.639190673828125, "global_step": 434120, "epoch": 2584} {"train_loss": -11.818096160888672, "global_step": 434121, "epoch": 2584} {"train_loss": -11.10482120513916, "global_step": 434122, "epoch": 2584} {"train_loss": -12.293148040771484, "global_step": 434123, "epoch": 2584} {"train_loss": -11.60903549194336, "global_step": 434124, "epoch": 2584} {"train_loss": -12.114969253540039, "global_step": 434125, "epoch": 2584} {"train_loss": -12.200302124023438, "global_step": 434126, "epoch": 2584} {"train_loss": -11.486213684082031, "global_step": 434127, "epoch": 2584} {"train_loss": -11.936054229736328, "global_step": 434128, "epoch": 2584} {"train_loss": -12.260616302490234, "global_step": 434129, "epoch": 2584} {"train_loss": -11.315896987915039, "global_step": 434130, "epoch": 2584} {"train_loss": -11.083986282348633, "global_step": 434131, "epoch": 2584} {"train_loss": -11.756378173828125, "global_step": 434132, "epoch": 2584} {"train_loss": -11.733118057250977, "global_step": 434133, "epoch": 2584} {"train_loss": -11.646524429321289, "global_step": 434134, "epoch": 2584} {"train_loss": -11.494544982910156, "global_step": 434135, "epoch": 2584} {"train_loss": -12.398468971252441, "global_step": 434136, "epoch": 2584} {"train_loss": -11.162154197692871, "global_step": 434137, "epoch": 2584} {"train_loss": -11.929269790649414, "global_step": 434138, "epoch": 2584} {"train_loss": -11.887163162231445, "global_step": 434139, "epoch": 2584} {"train_loss": -11.920780181884766, "global_step": 434140, "epoch": 2584} {"train_loss": -11.677908897399902, "global_step": 434141, "epoch": 2584} {"train_loss": -11.805824279785156, "global_step": 434142, "epoch": 2584} {"train_loss": -12.735648155212402, "global_step": 434143, "epoch": 2584} {"train_loss": -11.823348999023438, "global_step": 434144, "epoch": 2584} {"train_loss": -12.494367599487305, "global_step": 434145, "epoch": 2584} {"train_loss": -11.943806648254395, "global_step": 434146, "epoch": 2584} {"train_loss": -12.162421226501465, "global_step": 434147, "epoch": 2584} {"train_loss": -12.495455741882324, "global_step": 434148, "epoch": 2584} {"train_loss": -11.790834426879883, "global_step": 434149, "epoch": 2584} {"train_loss": -12.178125381469727, "global_step": 434150, "epoch": 2584} {"train_loss": -12.448976516723633, "global_step": 434151, "epoch": 2584} {"train_loss": -11.63027572631836, "global_step": 434152, "epoch": 2584} {"train_loss": -12.112285614013672, "global_step": 434153, "epoch": 2584} {"train_loss": -12.208970069885254, "global_step": 434154, "epoch": 2584} {"train_loss": -11.876173973083496, "global_step": 434155, "epoch": 2584} {"train_loss": -11.773937225341797, "global_step": 434156, "epoch": 2584} {"train_loss": -11.826741218566895, "global_step": 434157, "epoch": 2584} {"train_loss": -12.277027130126953, "global_step": 434158, "epoch": 2584} {"train_loss": -11.257917404174805, "global_step": 434159, "epoch": 2584} {"train_loss": -12.314111709594727, "global_step": 434160, "epoch": 2584} {"train_loss": -11.550268173217773, "global_step": 434161, "epoch": 2584} {"train_loss": -11.32585334777832, "global_step": 434162, "epoch": 2584} {"train_loss": -12.423349380493164, "global_step": 434163, "epoch": 2584} {"train_loss": -11.267396926879883, "global_step": 434164, "epoch": 2584} {"train_loss": -12.152420043945312, "global_step": 434165, "epoch": 2584} {"train_loss": -11.85873794555664, "global_step": 434166, "epoch": 2584} {"train_loss": -11.96915054321289, "global_step": 434167, "epoch": 2584} {"train_loss": -11.781853675842285, "global_step": 434168, "epoch": 2584} {"train_loss": -12.256685256958008, "global_step": 434169, "epoch": 2584} {"train_loss": -11.587169647216797, "global_step": 434170, "epoch": 2584} {"train_loss": -12.194280624389648, "global_step": 434171, "epoch": 2584} {"train_loss": -12.23082160949707, "global_step": 434172, "epoch": 2584} {"train_loss": -12.008197784423828, "global_step": 434173, "epoch": 2584} {"train_loss": -12.213589668273926, "global_step": 434174, "epoch": 2584} {"train_loss": -12.482368469238281, "global_step": 434175, "epoch": 2584} {"train_loss": -11.880057334899902, "global_step": 434176, "epoch": 2584} {"train_loss": -12.738834381103516, "global_step": 434177, "epoch": 2584} {"train_loss": -11.710421562194824, "global_step": 434178, "epoch": 2584} {"train_loss": -12.35515022277832, "global_step": 434179, "epoch": 2584} {"train_loss": -12.022699356079102, "global_step": 434180, "epoch": 2584} {"train_loss": -11.692583084106445, "global_step": 434181, "epoch": 2584} {"train_loss": -12.205875396728516, "global_step": 434182, "epoch": 2584} {"train_loss": -11.807518005371094, "global_step": 434183, "epoch": 2584} {"train_loss": -12.22219467163086, "global_step": 434184, "epoch": 2584} {"train_loss": -12.477861404418945, "global_step": 434185, "epoch": 2584} {"train_loss": -12.30229377746582, "global_step": 434186, "epoch": 2584} {"train_loss": -12.617639541625977, "global_step": 434187, "epoch": 2584} {"train_loss": -11.826525688171387, "global_step": 434188, "epoch": 2584} {"train_loss": -12.010883331298828, "global_step": 434189, "epoch": 2584} {"train_loss": -12.002519607543945, "global_step": 434190, "epoch": 2584} {"train_loss": -11.027896881103516, "global_step": 434191, "epoch": 2584} {"train_loss": -12.26541519165039, "global_step": 434192, "epoch": 2584} {"train_loss": -10.926405906677246, "global_step": 434193, "epoch": 2584} {"train_loss": -11.83462142944336, "global_step": 434194, "epoch": 2584} {"train_loss": -12.18116569519043, "global_step": 434195, "epoch": 2584} {"train_loss": -11.17917251586914, "global_step": 434196, "epoch": 2584} {"train_loss": -12.648910522460938, "global_step": 434197, "epoch": 2584} {"train_loss": -11.670058250427246, "global_step": 434198, "epoch": 2584} {"train_loss": -12.493759155273438, "global_step": 434199, "epoch": 2584} {"train_loss": -12.075094223022461, "global_step": 434200, "epoch": 2584} {"train_loss": -12.39021110534668, "global_step": 434201, "epoch": 2584} {"train_loss": -12.171565055847168, "global_step": 434202, "epoch": 2584} {"train_loss": -12.031123161315918, "global_step": 434203, "epoch": 2584} {"train_loss": -12.351118087768555, "global_step": 434204, "epoch": 2584} {"train_loss": -12.225458145141602, "global_step": 434205, "epoch": 2584} {"train_loss": -12.51452922821045, "global_step": 434206, "epoch": 2584} {"train_loss": -12.307332992553711, "global_step": 434207, "epoch": 2584} {"train_loss": -12.253318786621094, "global_step": 434208, "epoch": 2584} {"train_loss": -12.557463645935059, "global_step": 434209, "epoch": 2584} {"train_loss": -12.384239196777344, "global_step": 434210, "epoch": 2584} {"train_loss": -12.516712188720703, "global_step": 434211, "epoch": 2584} {"train_loss": -12.344486236572266, "global_step": 434212, "epoch": 2584} {"train_loss": -12.173908233642578, "global_step": 434213, "epoch": 2584} {"train_loss": -12.273651123046875, "global_step": 434214, "epoch": 2584} {"train_loss": -12.337149620056152, "global_step": 434215, "epoch": 2584} {"train_loss": -12.556966781616211, "global_step": 434216, "epoch": 2584} {"train_loss": -12.237503051757812, "global_step": 434217, "epoch": 2584} {"train_loss": -11.888574600219727, "global_step": 434218, "epoch": 2584} {"train_loss": -12.290901184082031, "global_step": 434219, "epoch": 2584} {"train_loss": -12.751179695129395, "global_step": 434220, "epoch": 2584} {"train_loss": -12.33230972290039, "global_step": 434221, "epoch": 2584} {"train_loss": -12.569133758544922, "global_step": 434222, "epoch": 2584} {"train_loss": -12.279106140136719, "global_step": 434223, "epoch": 2584} {"train_loss": -11.910890579223633, "global_step": 434224, "epoch": 2584} {"train_loss": -12.433577537536621, "global_step": 434225, "epoch": 2584} {"train_loss": -11.875306129455566, "global_step": 434226, "epoch": 2584} {"train_loss": -12.289932250976562, "global_step": 434227, "epoch": 2584} {"train_loss": -12.409611701965332, "global_step": 434228, "epoch": 2584} {"train_loss": -11.50261116027832, "global_step": 434229, "epoch": 2584} {"train_loss": -11.746164321899414, "global_step": 434230, "epoch": 2584} {"train_loss": -11.705631256103516, "global_step": 434231, "epoch": 2584} {"train_loss": -12.094568252563477, "global_step": 434232, "epoch": 2584} {"train_loss": -11.832935333251953, "global_step": 434233, "epoch": 2584} {"train_loss": -10.55305290222168, "global_step": 434234, "epoch": 2584} {"train_loss": -12.055482864379883, "global_step": 434235, "epoch": 2584} {"train_loss": -9.772727966308594, "global_step": 434236, "epoch": 2584} {"train_loss": -11.741960525512695, "global_step": 434237, "epoch": 2584} {"train_loss": -12.180479049682617, "global_step": 434238, "epoch": 2584} {"train_loss": -11.04230785369873, "global_step": 434239, "epoch": 2584} {"train_loss": -11.631048202514648, "global_step": 434240, "epoch": 2584} {"train_loss": -9.573976516723633, "global_step": 434241, "epoch": 2584} {"train_loss": -9.289434432983398, "global_step": 434242, "epoch": 2584} {"train_loss": -11.523521423339844, "global_step": 434243, "epoch": 2584} {"train_loss": -11.197796821594238, "global_step": 434244, "epoch": 2584} {"train_loss": -10.84231948852539, "global_step": 434245, "epoch": 2584} {"train_loss": -10.948989868164062, "global_step": 434246, "epoch": 2584} {"train_loss": -11.53341007232666, "global_step": 434247, "epoch": 2584} {"train_loss": -11.417247772216797, "global_step": 434248, "epoch": 2584} {"train_loss": -10.806175231933594, "global_step": 434249, "epoch": 2584} {"train_loss": -11.091533660888672, "global_step": 434250, "epoch": 2584} {"train_loss": -12.144850730895996, "global_step": 434251, "epoch": 2584} {"train_loss": -11.359496116638184, "global_step": 434252, "epoch": 2584} {"train_loss": -12.068950653076172, "global_step": 434253, "epoch": 2584} {"train_loss": -11.77599048614502, "global_step": 434254, "epoch": 2584} {"train_loss": -12.049172401428223, "global_step": 434255, "epoch": 2584} {"train_loss": -12.171586036682129, "global_step": 434256, "epoch": 2584} {"train_loss": -12.35138988494873, "global_step": 434257, "epoch": 2584} {"train_loss": -12.231935501098633, "global_step": 434258, "epoch": 2584} {"train_loss": -12.31630802154541, "global_step": 434259, "epoch": 2584} {"train_loss": -12.209280967712402, "global_step": 434260, "epoch": 2584} {"train_loss": -12.227790832519531, "global_step": 434261, "epoch": 2584} {"train_loss": -12.613143920898438, "global_step": 434262, "epoch": 2584} {"train_loss": -12.213835716247559, "global_step": 434263, "epoch": 2584} {"train_loss": -12.25890064239502, "global_step": 434264, "epoch": 2584} {"train_loss": -12.30190658569336, "global_step": 434265, "epoch": 2584} {"train_loss": -12.1517333984375, "global_step": 434266, "epoch": 2584} {"train_loss": -12.415228843688965, "global_step": 434267, "epoch": 2584} {"train_loss": -12.641546249389648, "global_step": 434268, "epoch": 2584} {"train_loss": -12.336708068847656, "global_step": 434269, "epoch": 2584} {"train_loss": -12.487858772277832, "global_step": 434270, "epoch": 2584} {"train_loss": -12.520936965942383, "global_step": 434271, "epoch": 2584} {"train_loss": -12.424371719360352, "global_step": 434272, "epoch": 2584} {"train_loss": -12.332605361938477, "global_step": 434273, "epoch": 2584} {"train_loss": -12.277469635009766, "global_step": 434274, "epoch": 2584} {"train_loss": -12.239843368530273, "global_step": 434275, "epoch": 2584} {"train_loss": -12.69692611694336, "global_step": 434276, "epoch": 2584} {"train_loss": -12.326091766357422, "global_step": 434277, "epoch": 2584} {"train_loss": -12.601653099060059, "global_step": 434278, "epoch": 2584} {"train_loss": -11.964344467435565, "global_step": 434279, "epoch": 2584, "val_loss": 308523.5625} {"train_loss": -12.072064399719238, "global_step": 434280, "epoch": 2585} {"train_loss": -12.559304237365723, "global_step": 434281, "epoch": 2585} {"train_loss": -12.247640609741211, "global_step": 434282, "epoch": 2585} {"train_loss": -12.550542831420898, "global_step": 434283, "epoch": 2585} {"train_loss": -11.983491897583008, "global_step": 434284, "epoch": 2585} {"train_loss": -12.6629638671875, "global_step": 434285, "epoch": 2585} {"train_loss": -12.154728889465332, "global_step": 434286, "epoch": 2585} {"train_loss": -12.614533424377441, "global_step": 434287, "epoch": 2585} {"train_loss": -12.394815444946289, "global_step": 434288, "epoch": 2585} {"train_loss": -12.503055572509766, "global_step": 434289, "epoch": 2585} {"train_loss": -12.546663284301758, "global_step": 434290, "epoch": 2585} {"train_loss": -12.42568588256836, "global_step": 434291, "epoch": 2585} {"train_loss": -12.45891284942627, "global_step": 434292, "epoch": 2585} {"train_loss": -12.737680435180664, "global_step": 434293, "epoch": 2585} {"train_loss": -12.738037109375, "global_step": 434294, "epoch": 2585} {"train_loss": -12.58660888671875, "global_step": 434295, "epoch": 2585} {"train_loss": -12.554057121276855, "global_step": 434296, "epoch": 2585} {"train_loss": -12.400103569030762, "global_step": 434297, "epoch": 2585} {"train_loss": -12.235941886901855, "global_step": 434298, "epoch": 2585} {"train_loss": -12.618461608886719, "global_step": 434299, "epoch": 2585} {"train_loss": -12.647468566894531, "global_step": 434300, "epoch": 2585} {"train_loss": -12.643423080444336, "global_step": 434301, "epoch": 2585} {"train_loss": -12.687896728515625, "global_step": 434302, "epoch": 2585} {"train_loss": -12.339408874511719, "global_step": 434303, "epoch": 2585} {"train_loss": -12.633500099182129, "global_step": 434304, "epoch": 2585} {"train_loss": -12.726920127868652, "global_step": 434305, "epoch": 2585} {"train_loss": -12.508846282958984, "global_step": 434306, "epoch": 2585} {"train_loss": -12.639368057250977, "global_step": 434307, "epoch": 2585} {"train_loss": -12.626923561096191, "global_step": 434308, "epoch": 2585} {"train_loss": -12.397561073303223, "global_step": 434309, "epoch": 2585} {"train_loss": -12.77256965637207, "global_step": 434310, "epoch": 2585} {"train_loss": -12.78913688659668, "global_step": 434311, "epoch": 2585} {"train_loss": -12.434864044189453, "global_step": 434312, "epoch": 2585} {"train_loss": -12.391824722290039, "global_step": 434313, "epoch": 2585} {"train_loss": -12.486705780029297, "global_step": 434314, "epoch": 2585} {"train_loss": -12.624410629272461, "global_step": 434315, "epoch": 2585} {"train_loss": -12.67782211303711, "global_step": 434316, "epoch": 2585} {"train_loss": -12.690404891967773, "global_step": 434317, "epoch": 2585} {"train_loss": -12.48924446105957, "global_step": 434318, "epoch": 2585} {"train_loss": -12.423263549804688, "global_step": 434319, "epoch": 2585} {"train_loss": -12.182676315307617, "global_step": 434320, "epoch": 2585} {"train_loss": -12.516229629516602, "global_step": 434321, "epoch": 2585} {"train_loss": -12.496124267578125, "global_step": 434322, "epoch": 2585} {"train_loss": -12.537408828735352, "global_step": 434323, "epoch": 2585} {"train_loss": -12.395164489746094, "global_step": 434324, "epoch": 2585} {"train_loss": -12.571857452392578, "global_step": 434325, "epoch": 2585} {"train_loss": -12.846311569213867, "global_step": 434326, "epoch": 2585} {"train_loss": -12.369529724121094, "global_step": 434327, "epoch": 2585} {"train_loss": -12.60281753540039, "global_step": 434328, "epoch": 2585} {"train_loss": -12.667113304138184, "global_step": 434329, "epoch": 2585} {"train_loss": -12.343761444091797, "global_step": 434330, "epoch": 2585} {"train_loss": -12.59611701965332, "global_step": 434331, "epoch": 2585} {"train_loss": -12.499493598937988, "global_step": 434332, "epoch": 2585} {"train_loss": -12.315474510192871, "global_step": 434333, "epoch": 2585} {"train_loss": -12.482589721679688, "global_step": 434334, "epoch": 2585} {"train_loss": -12.763580322265625, "global_step": 434335, "epoch": 2585} {"train_loss": -12.326650619506836, "global_step": 434336, "epoch": 2585} {"train_loss": -12.739673614501953, "global_step": 434337, "epoch": 2585} {"train_loss": -12.386849403381348, "global_step": 434338, "epoch": 2585} {"train_loss": -12.777976989746094, "global_step": 434339, "epoch": 2585} {"train_loss": -12.56214427947998, "global_step": 434340, "epoch": 2585} {"train_loss": -12.594571113586426, "global_step": 434341, "epoch": 2585} {"train_loss": -12.757560729980469, "global_step": 434342, "epoch": 2585} {"train_loss": -12.488399505615234, "global_step": 434343, "epoch": 2585} {"train_loss": -12.189784049987793, "global_step": 434344, "epoch": 2585} {"train_loss": -12.669713020324707, "global_step": 434345, "epoch": 2585} {"train_loss": -11.80961799621582, "global_step": 434346, "epoch": 2585} {"train_loss": -12.024901390075684, "global_step": 434347, "epoch": 2585} {"train_loss": -12.545345306396484, "global_step": 434348, "epoch": 2585} {"train_loss": -12.026668548583984, "global_step": 434349, "epoch": 2585} {"train_loss": -12.189322471618652, "global_step": 434350, "epoch": 2585} {"train_loss": -11.453683853149414, "global_step": 434351, "epoch": 2585} {"train_loss": -12.160333633422852, "global_step": 434352, "epoch": 2585} {"train_loss": -11.73288345336914, "global_step": 434353, "epoch": 2585} {"train_loss": -12.42580795288086, "global_step": 434354, "epoch": 2585} {"train_loss": -12.168882369995117, "global_step": 434355, "epoch": 2585} {"train_loss": -12.152438163757324, "global_step": 434356, "epoch": 2585} {"train_loss": -12.043094635009766, "global_step": 434357, "epoch": 2585} {"train_loss": -12.565132141113281, "global_step": 434358, "epoch": 2585} {"train_loss": -12.263479232788086, "global_step": 434359, "epoch": 2585} {"train_loss": -12.531964302062988, "global_step": 434360, "epoch": 2585} {"train_loss": -11.912923812866211, "global_step": 434361, "epoch": 2585} {"train_loss": -11.96234130859375, "global_step": 434362, "epoch": 2585} {"train_loss": -12.089559555053711, "global_step": 434363, "epoch": 2585} {"train_loss": -11.908909797668457, "global_step": 434364, "epoch": 2585} {"train_loss": -10.686474800109863, "global_step": 434365, "epoch": 2585} {"train_loss": -11.468503952026367, "global_step": 434366, "epoch": 2585} {"train_loss": -11.390632629394531, "global_step": 434367, "epoch": 2585} {"train_loss": -11.409845352172852, "global_step": 434368, "epoch": 2585} {"train_loss": -11.758810043334961, "global_step": 434369, "epoch": 2585} {"train_loss": -11.21994686126709, "global_step": 434370, "epoch": 2585} {"train_loss": -12.646951675415039, "global_step": 434371, "epoch": 2585} {"train_loss": -9.890069961547852, "global_step": 434372, "epoch": 2585} {"train_loss": -12.414237976074219, "global_step": 434373, "epoch": 2585} {"train_loss": -11.436686515808105, "global_step": 434374, "epoch": 2585} {"train_loss": -11.395709991455078, "global_step": 434375, "epoch": 2585} {"train_loss": -11.914724349975586, "global_step": 434376, "epoch": 2585} {"train_loss": -11.940677642822266, "global_step": 434377, "epoch": 2585} {"train_loss": -11.76580810546875, "global_step": 434378, "epoch": 2585} {"train_loss": -11.604045867919922, "global_step": 434379, "epoch": 2585} {"train_loss": -12.114984512329102, "global_step": 434380, "epoch": 2585} {"train_loss": -11.536901473999023, "global_step": 434381, "epoch": 2585} {"train_loss": -12.153075218200684, "global_step": 434382, "epoch": 2585} {"train_loss": -12.0081148147583, "global_step": 434383, "epoch": 2585} {"train_loss": -11.2949800491333, "global_step": 434384, "epoch": 2585} {"train_loss": -12.27733325958252, "global_step": 434385, "epoch": 2585} {"train_loss": -11.535562515258789, "global_step": 434386, "epoch": 2585} {"train_loss": -12.018669128417969, "global_step": 434387, "epoch": 2585} {"train_loss": -11.609436988830566, "global_step": 434388, "epoch": 2585} {"train_loss": -11.952184677124023, "global_step": 434389, "epoch": 2585} {"train_loss": -12.169748306274414, "global_step": 434390, "epoch": 2585} {"train_loss": -11.323678970336914, "global_step": 434391, "epoch": 2585} {"train_loss": -11.976350784301758, "global_step": 434392, "epoch": 2585} {"train_loss": -11.06238079071045, "global_step": 434393, "epoch": 2585} {"train_loss": -11.904491424560547, "global_step": 434394, "epoch": 2585} {"train_loss": -11.159589767456055, "global_step": 434395, "epoch": 2585} {"train_loss": -11.656907081604004, "global_step": 434396, "epoch": 2585} {"train_loss": -11.782415390014648, "global_step": 434397, "epoch": 2585} {"train_loss": -12.0516357421875, "global_step": 434398, "epoch": 2585} {"train_loss": -11.529438018798828, "global_step": 434399, "epoch": 2585} {"train_loss": -11.833213806152344, "global_step": 434400, "epoch": 2585} {"train_loss": -11.96005630493164, "global_step": 434401, "epoch": 2585} {"train_loss": -11.978479385375977, "global_step": 434402, "epoch": 2585} {"train_loss": -11.996173858642578, "global_step": 434403, "epoch": 2585} {"train_loss": -12.392865180969238, "global_step": 434404, "epoch": 2585} {"train_loss": -11.839134216308594, "global_step": 434405, "epoch": 2585} {"train_loss": -11.906851768493652, "global_step": 434406, "epoch": 2585} {"train_loss": -12.056432723999023, "global_step": 434407, "epoch": 2585} {"train_loss": -12.04454517364502, "global_step": 434408, "epoch": 2585} {"train_loss": -11.837451934814453, "global_step": 434409, "epoch": 2585} {"train_loss": -12.527918815612793, "global_step": 434410, "epoch": 2585} {"train_loss": -11.60608959197998, "global_step": 434411, "epoch": 2585} {"train_loss": -11.126113891601562, "global_step": 434412, "epoch": 2585} {"train_loss": -11.972768783569336, "global_step": 434413, "epoch": 2585} {"train_loss": -10.656896591186523, "global_step": 434414, "epoch": 2585} {"train_loss": -12.393348693847656, "global_step": 434415, "epoch": 2585} {"train_loss": -11.451204299926758, "global_step": 434416, "epoch": 2585} {"train_loss": -12.007246017456055, "global_step": 434417, "epoch": 2585} {"train_loss": -11.531702995300293, "global_step": 434418, "epoch": 2585} {"train_loss": -11.671329498291016, "global_step": 434419, "epoch": 2585} {"train_loss": -12.222397804260254, "global_step": 434420, "epoch": 2585} {"train_loss": -11.161967277526855, "global_step": 434421, "epoch": 2585} {"train_loss": -12.393026351928711, "global_step": 434422, "epoch": 2585} {"train_loss": -11.421737670898438, "global_step": 434423, "epoch": 2585} {"train_loss": -11.933122634887695, "global_step": 434424, "epoch": 2585} {"train_loss": -11.94365119934082, "global_step": 434425, "epoch": 2585} {"train_loss": -11.555656433105469, "global_step": 434426, "epoch": 2585} {"train_loss": -12.20837116241455, "global_step": 434427, "epoch": 2585} {"train_loss": -11.57461166381836, "global_step": 434428, "epoch": 2585} {"train_loss": -12.40353012084961, "global_step": 434429, "epoch": 2585} {"train_loss": -12.016996383666992, "global_step": 434430, "epoch": 2585} {"train_loss": -12.075382232666016, "global_step": 434431, "epoch": 2585} {"train_loss": -12.312307357788086, "global_step": 434432, "epoch": 2585} {"train_loss": -11.893497467041016, "global_step": 434433, "epoch": 2585} {"train_loss": -12.45303726196289, "global_step": 434434, "epoch": 2585} {"train_loss": -12.310346603393555, "global_step": 434435, "epoch": 2585} {"train_loss": -12.178671836853027, "global_step": 434436, "epoch": 2585} {"train_loss": -12.452741622924805, "global_step": 434437, "epoch": 2585} {"train_loss": -12.221994400024414, "global_step": 434438, "epoch": 2585} {"train_loss": -12.528038024902344, "global_step": 434439, "epoch": 2585} {"train_loss": -12.464644432067871, "global_step": 434440, "epoch": 2585} {"train_loss": -12.728116989135742, "global_step": 434441, "epoch": 2585} {"train_loss": -12.365050315856934, "global_step": 434442, "epoch": 2585} {"train_loss": -12.542097091674805, "global_step": 434443, "epoch": 2585} {"train_loss": -12.341753005981445, "global_step": 434444, "epoch": 2585} {"train_loss": -12.45763874053955, "global_step": 434445, "epoch": 2585} {"train_loss": -12.404280662536621, "global_step": 434446, "epoch": 2585} {"train_loss": -12.155662099520365, "global_step": 434447, "epoch": 2585, "val_loss": 313192.34375, "train_action_mse_error": 3.166343927383423} {"train_loss": -11.98989200592041, "global_step": 434448, "epoch": 2586} {"train_loss": -12.492742538452148, "global_step": 434449, "epoch": 2586} {"train_loss": -12.205934524536133, "global_step": 434450, "epoch": 2586} {"train_loss": -12.33750057220459, "global_step": 434451, "epoch": 2586} {"train_loss": -12.42497730255127, "global_step": 434452, "epoch": 2586} {"train_loss": -12.484326362609863, "global_step": 434453, "epoch": 2586} {"train_loss": -12.640096664428711, "global_step": 434454, "epoch": 2586} {"train_loss": -12.563690185546875, "global_step": 434455, "epoch": 2586} {"train_loss": -12.826866149902344, "global_step": 434456, "epoch": 2586} {"train_loss": -12.443410873413086, "global_step": 434457, "epoch": 2586} {"train_loss": -12.56637954711914, "global_step": 434458, "epoch": 2586} {"train_loss": -12.657479286193848, "global_step": 434459, "epoch": 2586} {"train_loss": -12.357128143310547, "global_step": 434460, "epoch": 2586} {"train_loss": -12.732486724853516, "global_step": 434461, "epoch": 2586} {"train_loss": -12.337868690490723, "global_step": 434462, "epoch": 2586} {"train_loss": -12.594008445739746, "global_step": 434463, "epoch": 2586} {"train_loss": -12.792656898498535, "global_step": 434464, "epoch": 2586} {"train_loss": -12.446883201599121, "global_step": 434465, "epoch": 2586} {"train_loss": -12.791462898254395, "global_step": 434466, "epoch": 2586} {"train_loss": -12.637744903564453, "global_step": 434467, "epoch": 2586} {"train_loss": -12.742740631103516, "global_step": 434468, "epoch": 2586} {"train_loss": -12.809122085571289, "global_step": 434469, "epoch": 2586} {"train_loss": -12.58107852935791, "global_step": 434470, "epoch": 2586} {"train_loss": -12.870742797851562, "global_step": 434471, "epoch": 2586} {"train_loss": -12.291935920715332, "global_step": 434472, "epoch": 2586} {"train_loss": -12.79482650756836, "global_step": 434473, "epoch": 2586} {"train_loss": -12.266759872436523, "global_step": 434474, "epoch": 2586} {"train_loss": -12.503532409667969, "global_step": 434475, "epoch": 2586} {"train_loss": -12.314952850341797, "global_step": 434476, "epoch": 2586} {"train_loss": -12.373619079589844, "global_step": 434477, "epoch": 2586} {"train_loss": -12.661248207092285, "global_step": 434478, "epoch": 2586} {"train_loss": -12.222856521606445, "global_step": 434479, "epoch": 2586} {"train_loss": -12.11685848236084, "global_step": 434480, "epoch": 2586} {"train_loss": -12.17505168914795, "global_step": 434481, "epoch": 2586} {"train_loss": -12.324064254760742, "global_step": 434482, "epoch": 2586} {"train_loss": -12.643906593322754, "global_step": 434483, "epoch": 2586} {"train_loss": -12.891321182250977, "global_step": 434484, "epoch": 2586} {"train_loss": -12.452861785888672, "global_step": 434485, "epoch": 2586} {"train_loss": -12.919485092163086, "global_step": 434486, "epoch": 2586} {"train_loss": -12.300918579101562, "global_step": 434487, "epoch": 2586} {"train_loss": -12.047096252441406, "global_step": 434488, "epoch": 2586} {"train_loss": -12.532285690307617, "global_step": 434489, "epoch": 2586} {"train_loss": -12.598201751708984, "global_step": 434490, "epoch": 2586} {"train_loss": -12.511146545410156, "global_step": 434491, "epoch": 2586} {"train_loss": -12.713356018066406, "global_step": 434492, "epoch": 2586} {"train_loss": -12.605707168579102, "global_step": 434493, "epoch": 2586} {"train_loss": -11.804901123046875, "global_step": 434494, "epoch": 2586} {"train_loss": -11.795581817626953, "global_step": 434495, "epoch": 2586} {"train_loss": -12.580495834350586, "global_step": 434496, "epoch": 2586} {"train_loss": -12.309788703918457, "global_step": 434497, "epoch": 2586} {"train_loss": -11.791252136230469, "global_step": 434498, "epoch": 2586} {"train_loss": -12.616706848144531, "global_step": 434499, "epoch": 2586} {"train_loss": -12.381636619567871, "global_step": 434500, "epoch": 2586} {"train_loss": -12.576401710510254, "global_step": 434501, "epoch": 2586} {"train_loss": -12.547731399536133, "global_step": 434502, "epoch": 2586} {"train_loss": -12.534114837646484, "global_step": 434503, "epoch": 2586} {"train_loss": -12.502482414245605, "global_step": 434504, "epoch": 2586} {"train_loss": -12.809736251831055, "global_step": 434505, "epoch": 2586} {"train_loss": -12.678884506225586, "global_step": 434506, "epoch": 2586} {"train_loss": -12.719369888305664, "global_step": 434507, "epoch": 2586} {"train_loss": -12.833623886108398, "global_step": 434508, "epoch": 2586} {"train_loss": -12.423177719116211, "global_step": 434509, "epoch": 2586} {"train_loss": -12.588927268981934, "global_step": 434510, "epoch": 2586} {"train_loss": -12.572820663452148, "global_step": 434511, "epoch": 2586} {"train_loss": -12.439359664916992, "global_step": 434512, "epoch": 2586} {"train_loss": -12.598121643066406, "global_step": 434513, "epoch": 2586} {"train_loss": -12.495765686035156, "global_step": 434514, "epoch": 2586} {"train_loss": -12.736001968383789, "global_step": 434515, "epoch": 2586} {"train_loss": -11.72253704071045, "global_step": 434516, "epoch": 2586} {"train_loss": -11.91637134552002, "global_step": 434517, "epoch": 2586} {"train_loss": -11.604106903076172, "global_step": 434518, "epoch": 2586} {"train_loss": -12.254878044128418, "global_step": 434519, "epoch": 2586} {"train_loss": -10.918371200561523, "global_step": 434520, "epoch": 2586} {"train_loss": -12.422046661376953, "global_step": 434521, "epoch": 2586} {"train_loss": -11.430609703063965, "global_step": 434522, "epoch": 2586} {"train_loss": -12.33924674987793, "global_step": 434523, "epoch": 2586} {"train_loss": -11.927087783813477, "global_step": 434524, "epoch": 2586} {"train_loss": -12.338895797729492, "global_step": 434525, "epoch": 2586} {"train_loss": -11.564165115356445, "global_step": 434526, "epoch": 2586} {"train_loss": -12.329551696777344, "global_step": 434527, "epoch": 2586} {"train_loss": -11.967811584472656, "global_step": 434528, "epoch": 2586} {"train_loss": -12.471673965454102, "global_step": 434529, "epoch": 2586} {"train_loss": -12.36470890045166, "global_step": 434530, "epoch": 2586} {"train_loss": -12.145755767822266, "global_step": 434531, "epoch": 2586} {"train_loss": -11.466133117675781, "global_step": 434532, "epoch": 2586} {"train_loss": -12.410120964050293, "global_step": 434533, "epoch": 2586} {"train_loss": -11.210641860961914, "global_step": 434534, "epoch": 2586} {"train_loss": -11.715261459350586, "global_step": 434535, "epoch": 2586} {"train_loss": -12.071374893188477, "global_step": 434536, "epoch": 2586} {"train_loss": -9.71562385559082, "global_step": 434537, "epoch": 2586} {"train_loss": -12.24604320526123, "global_step": 434538, "epoch": 2586} {"train_loss": -10.977827072143555, "global_step": 434539, "epoch": 2586} {"train_loss": -10.599992752075195, "global_step": 434540, "epoch": 2586} {"train_loss": -10.94515609741211, "global_step": 434541, "epoch": 2586} {"train_loss": -11.682586669921875, "global_step": 434542, "epoch": 2586} {"train_loss": -10.055609703063965, "global_step": 434543, "epoch": 2586} {"train_loss": -11.874902725219727, "global_step": 434544, "epoch": 2586} {"train_loss": -11.226825714111328, "global_step": 434545, "epoch": 2586} {"train_loss": -11.151252746582031, "global_step": 434546, "epoch": 2586} {"train_loss": -12.345695495605469, "global_step": 434547, "epoch": 2586} {"train_loss": -11.444744110107422, "global_step": 434548, "epoch": 2586} {"train_loss": -12.301065444946289, "global_step": 434549, "epoch": 2586} {"train_loss": -12.021108627319336, "global_step": 434550, "epoch": 2586} {"train_loss": -11.73758316040039, "global_step": 434551, "epoch": 2586} {"train_loss": -12.022773742675781, "global_step": 434552, "epoch": 2586} {"train_loss": -11.196187019348145, "global_step": 434553, "epoch": 2586} {"train_loss": -11.798074722290039, "global_step": 434554, "epoch": 2586} {"train_loss": -12.219606399536133, "global_step": 434555, "epoch": 2586} {"train_loss": -11.319232940673828, "global_step": 434556, "epoch": 2586} {"train_loss": -11.775301933288574, "global_step": 434557, "epoch": 2586} {"train_loss": -12.315780639648438, "global_step": 434558, "epoch": 2586} {"train_loss": -12.264837265014648, "global_step": 434559, "epoch": 2586} {"train_loss": -11.908538818359375, "global_step": 434560, "epoch": 2586} {"train_loss": -12.639409065246582, "global_step": 434561, "epoch": 2586} {"train_loss": -12.077861785888672, "global_step": 434562, "epoch": 2586} {"train_loss": -11.964536666870117, "global_step": 434563, "epoch": 2586} {"train_loss": -12.103748321533203, "global_step": 434564, "epoch": 2586} {"train_loss": -11.82247543334961, "global_step": 434565, "epoch": 2586} {"train_loss": -12.183052062988281, "global_step": 434566, "epoch": 2586} {"train_loss": -12.157146453857422, "global_step": 434567, "epoch": 2586} {"train_loss": -11.758142471313477, "global_step": 434568, "epoch": 2586} {"train_loss": -12.484916687011719, "global_step": 434569, "epoch": 2586} {"train_loss": -12.001493453979492, "global_step": 434570, "epoch": 2586} {"train_loss": -12.486518859863281, "global_step": 434571, "epoch": 2586} {"train_loss": -12.295880317687988, "global_step": 434572, "epoch": 2586} {"train_loss": -11.829498291015625, "global_step": 434573, "epoch": 2586} {"train_loss": -11.87917709350586, "global_step": 434574, "epoch": 2586} {"train_loss": -11.423311233520508, "global_step": 434575, "epoch": 2586} {"train_loss": -11.103994369506836, "global_step": 434576, "epoch": 2586} {"train_loss": -12.286050796508789, "global_step": 434577, "epoch": 2586} {"train_loss": -11.920555114746094, "global_step": 434578, "epoch": 2586} {"train_loss": -11.937654495239258, "global_step": 434579, "epoch": 2586} {"train_loss": -11.799822807312012, "global_step": 434580, "epoch": 2586} {"train_loss": -12.501163482666016, "global_step": 434581, "epoch": 2586} {"train_loss": -11.783398628234863, "global_step": 434582, "epoch": 2586} {"train_loss": -12.316225051879883, "global_step": 434583, "epoch": 2586} {"train_loss": -12.067564010620117, "global_step": 434584, "epoch": 2586} {"train_loss": -11.997490882873535, "global_step": 434585, "epoch": 2586} {"train_loss": -12.279382705688477, "global_step": 434586, "epoch": 2586} {"train_loss": -12.107704162597656, "global_step": 434587, "epoch": 2586} {"train_loss": -12.521169662475586, "global_step": 434588, "epoch": 2586} {"train_loss": -12.309680938720703, "global_step": 434589, "epoch": 2586} {"train_loss": -12.409407615661621, "global_step": 434590, "epoch": 2586} {"train_loss": -12.30093002319336, "global_step": 434591, "epoch": 2586} {"train_loss": -12.444644927978516, "global_step": 434592, "epoch": 2586} {"train_loss": -12.343521118164062, "global_step": 434593, "epoch": 2586} {"train_loss": -12.309415817260742, "global_step": 434594, "epoch": 2586} {"train_loss": -12.612344741821289, "global_step": 434595, "epoch": 2586} {"train_loss": -12.475790023803711, "global_step": 434596, "epoch": 2586} {"train_loss": -12.45441722869873, "global_step": 434597, "epoch": 2586} {"train_loss": -12.390310287475586, "global_step": 434598, "epoch": 2586} {"train_loss": -12.467318534851074, "global_step": 434599, "epoch": 2586} {"train_loss": -12.346193313598633, "global_step": 434600, "epoch": 2586} {"train_loss": -12.593999862670898, "global_step": 434601, "epoch": 2586} {"train_loss": -12.310230255126953, "global_step": 434602, "epoch": 2586} {"train_loss": -12.439295768737793, "global_step": 434603, "epoch": 2586} {"train_loss": -12.524086952209473, "global_step": 434604, "epoch": 2586} {"train_loss": -12.571524620056152, "global_step": 434605, "epoch": 2586} {"train_loss": -12.636728286743164, "global_step": 434606, "epoch": 2586} {"train_loss": -12.311952590942383, "global_step": 434607, "epoch": 2586} {"train_loss": -12.695245742797852, "global_step": 434608, "epoch": 2586} {"train_loss": -12.464118003845215, "global_step": 434609, "epoch": 2586} {"train_loss": -12.110862731933594, "global_step": 434610, "epoch": 2586} {"train_loss": -12.463043212890625, "global_step": 434611, "epoch": 2586} {"train_loss": -12.723733901977539, "global_step": 434612, "epoch": 2586} {"train_loss": -12.176473617553711, "global_step": 434613, "epoch": 2586} {"train_loss": -12.494426727294922, "global_step": 434614, "epoch": 2586} {"train_loss": -12.208526089077903, "global_step": 434615, "epoch": 2586, "val_loss": 312027.0625} {"train_loss": -12.608869552612305, "global_step": 434616, "epoch": 2587} {"train_loss": -12.524125099182129, "global_step": 434617, "epoch": 2587} {"train_loss": -12.332880020141602, "global_step": 434618, "epoch": 2587} {"train_loss": -12.732037544250488, "global_step": 434619, "epoch": 2587} {"train_loss": -12.475322723388672, "global_step": 434620, "epoch": 2587} {"train_loss": -12.497629165649414, "global_step": 434621, "epoch": 2587} {"train_loss": -12.399871826171875, "global_step": 434622, "epoch": 2587} {"train_loss": -11.872640609741211, "global_step": 434623, "epoch": 2587} {"train_loss": -12.317293167114258, "global_step": 434624, "epoch": 2587} {"train_loss": -12.130149841308594, "global_step": 434625, "epoch": 2587} {"train_loss": -11.054311752319336, "global_step": 434626, "epoch": 2587} {"train_loss": -11.84980583190918, "global_step": 434627, "epoch": 2587} {"train_loss": -11.728343963623047, "global_step": 434628, "epoch": 2587} {"train_loss": -11.662294387817383, "global_step": 434629, "epoch": 2587} {"train_loss": -11.02403450012207, "global_step": 434630, "epoch": 2587} {"train_loss": -10.340827941894531, "global_step": 434631, "epoch": 2587} {"train_loss": -10.223926544189453, "global_step": 434632, "epoch": 2587} {"train_loss": -10.919587135314941, "global_step": 434633, "epoch": 2587} {"train_loss": -12.220748901367188, "global_step": 434634, "epoch": 2587} {"train_loss": -10.765279769897461, "global_step": 434635, "epoch": 2587} {"train_loss": -10.956382751464844, "global_step": 434636, "epoch": 2587} {"train_loss": -12.139457702636719, "global_step": 434637, "epoch": 2587} {"train_loss": -11.916475296020508, "global_step": 434638, "epoch": 2587} {"train_loss": -12.13992977142334, "global_step": 434639, "epoch": 2587} {"train_loss": -12.066944122314453, "global_step": 434640, "epoch": 2587} {"train_loss": -12.266790390014648, "global_step": 434641, "epoch": 2587} {"train_loss": -11.899469375610352, "global_step": 434642, "epoch": 2587} {"train_loss": -11.43917179107666, "global_step": 434643, "epoch": 2587} {"train_loss": -11.748878479003906, "global_step": 434644, "epoch": 2587} {"train_loss": -12.118772506713867, "global_step": 434645, "epoch": 2587} {"train_loss": -11.42813491821289, "global_step": 434646, "epoch": 2587} {"train_loss": -12.426004409790039, "global_step": 434647, "epoch": 2587} {"train_loss": -11.303900718688965, "global_step": 434648, "epoch": 2587} {"train_loss": -12.083927154541016, "global_step": 434649, "epoch": 2587} {"train_loss": -12.368408203125, "global_step": 434650, "epoch": 2587} {"train_loss": -11.72082233428955, "global_step": 434651, "epoch": 2587} {"train_loss": -12.426874160766602, "global_step": 434652, "epoch": 2587} {"train_loss": -11.825201988220215, "global_step": 434653, "epoch": 2587} {"train_loss": -12.448625564575195, "global_step": 434654, "epoch": 2587} {"train_loss": -11.889368057250977, "global_step": 434655, "epoch": 2587} {"train_loss": -11.745125770568848, "global_step": 434656, "epoch": 2587} {"train_loss": -12.145000457763672, "global_step": 434657, "epoch": 2587} {"train_loss": -11.916664123535156, "global_step": 434658, "epoch": 2587} {"train_loss": -12.032073974609375, "global_step": 434659, "epoch": 2587} {"train_loss": -12.139015197753906, "global_step": 434660, "epoch": 2587} {"train_loss": -12.076425552368164, "global_step": 434661, "epoch": 2587} {"train_loss": -11.99332046508789, "global_step": 434662, "epoch": 2587} {"train_loss": -12.266042709350586, "global_step": 434663, "epoch": 2587} {"train_loss": -11.977888107299805, "global_step": 434664, "epoch": 2587} {"train_loss": -12.408031463623047, "global_step": 434665, "epoch": 2587} {"train_loss": -12.03276252746582, "global_step": 434666, "epoch": 2587} {"train_loss": -12.12503433227539, "global_step": 434667, "epoch": 2587} {"train_loss": -12.577129364013672, "global_step": 434668, "epoch": 2587} {"train_loss": -11.807513236999512, "global_step": 434669, "epoch": 2587} {"train_loss": -12.392330169677734, "global_step": 434670, "epoch": 2587} {"train_loss": -11.592803001403809, "global_step": 434671, "epoch": 2587} {"train_loss": -11.969070434570312, "global_step": 434672, "epoch": 2587} {"train_loss": -12.079916000366211, "global_step": 434673, "epoch": 2587} {"train_loss": -11.373123168945312, "global_step": 434674, "epoch": 2587} {"train_loss": -11.401930809020996, "global_step": 434675, "epoch": 2587} {"train_loss": -12.051593780517578, "global_step": 434676, "epoch": 2587} {"train_loss": -10.853317260742188, "global_step": 434677, "epoch": 2587} {"train_loss": -12.223159790039062, "global_step": 434678, "epoch": 2587} {"train_loss": -9.635862350463867, "global_step": 434679, "epoch": 2587} {"train_loss": -12.248905181884766, "global_step": 434680, "epoch": 2587} {"train_loss": -10.47134017944336, "global_step": 434681, "epoch": 2587} {"train_loss": -10.640820503234863, "global_step": 434682, "epoch": 2587} {"train_loss": -11.621061325073242, "global_step": 434683, "epoch": 2587} {"train_loss": -10.758735656738281, "global_step": 434684, "epoch": 2587} {"train_loss": -11.778286933898926, "global_step": 434685, "epoch": 2587} {"train_loss": -11.652273178100586, "global_step": 434686, "epoch": 2587} {"train_loss": -12.127359390258789, "global_step": 434687, "epoch": 2587} {"train_loss": -11.856842994689941, "global_step": 434688, "epoch": 2587} {"train_loss": -11.931307792663574, "global_step": 434689, "epoch": 2587} {"train_loss": -11.696290016174316, "global_step": 434690, "epoch": 2587} {"train_loss": -11.88551139831543, "global_step": 434691, "epoch": 2587} {"train_loss": -11.52871036529541, "global_step": 434692, "epoch": 2587} {"train_loss": -11.961363792419434, "global_step": 434693, "epoch": 2587} {"train_loss": -12.151630401611328, "global_step": 434694, "epoch": 2587} {"train_loss": -11.99842643737793, "global_step": 434695, "epoch": 2587} {"train_loss": -11.967599868774414, "global_step": 434696, "epoch": 2587} {"train_loss": -12.062580108642578, "global_step": 434697, "epoch": 2587} {"train_loss": -12.107942581176758, "global_step": 434698, "epoch": 2587} {"train_loss": -12.376311302185059, "global_step": 434699, "epoch": 2587} {"train_loss": -12.395271301269531, "global_step": 434700, "epoch": 2587} {"train_loss": -12.284969329833984, "global_step": 434701, "epoch": 2587} {"train_loss": -12.156211853027344, "global_step": 434702, "epoch": 2587} {"train_loss": -12.575983047485352, "global_step": 434703, "epoch": 2587} {"train_loss": -12.40749740600586, "global_step": 434704, "epoch": 2587} {"train_loss": -12.326902389526367, "global_step": 434705, "epoch": 2587} {"train_loss": -12.48698616027832, "global_step": 434706, "epoch": 2587} {"train_loss": -12.246330261230469, "global_step": 434707, "epoch": 2587} {"train_loss": -12.385555267333984, "global_step": 434708, "epoch": 2587} {"train_loss": -12.306510925292969, "global_step": 434709, "epoch": 2587} {"train_loss": -12.262325286865234, "global_step": 434710, "epoch": 2587} {"train_loss": -12.570716857910156, "global_step": 434711, "epoch": 2587} {"train_loss": -12.478450775146484, "global_step": 434712, "epoch": 2587} {"train_loss": -12.73862075805664, "global_step": 434713, "epoch": 2587} {"train_loss": -12.273725509643555, "global_step": 434714, "epoch": 2587} {"train_loss": -12.62722396850586, "global_step": 434715, "epoch": 2587} {"train_loss": -12.523775100708008, "global_step": 434716, "epoch": 2587} {"train_loss": -12.516220092773438, "global_step": 434717, "epoch": 2587} {"train_loss": -12.569685935974121, "global_step": 434718, "epoch": 2587} {"train_loss": -12.868046760559082, "global_step": 434719, "epoch": 2587} {"train_loss": -12.532299995422363, "global_step": 434720, "epoch": 2587} {"train_loss": -12.492901802062988, "global_step": 434721, "epoch": 2587} {"train_loss": -12.72201156616211, "global_step": 434722, "epoch": 2587} {"train_loss": -12.447162628173828, "global_step": 434723, "epoch": 2587} {"train_loss": -12.438631057739258, "global_step": 434724, "epoch": 2587} {"train_loss": -12.534759521484375, "global_step": 434725, "epoch": 2587} {"train_loss": -12.729144096374512, "global_step": 434726, "epoch": 2587} {"train_loss": -12.554208755493164, "global_step": 434727, "epoch": 2587} {"train_loss": -12.584957122802734, "global_step": 434728, "epoch": 2587} {"train_loss": -12.68942928314209, "global_step": 434729, "epoch": 2587} {"train_loss": -12.42039680480957, "global_step": 434730, "epoch": 2587} {"train_loss": -12.720259666442871, "global_step": 434731, "epoch": 2587} {"train_loss": -12.756675720214844, "global_step": 434732, "epoch": 2587} {"train_loss": -12.6624174118042, "global_step": 434733, "epoch": 2587} {"train_loss": -12.61927604675293, "global_step": 434734, "epoch": 2587} {"train_loss": -12.744559288024902, "global_step": 434735, "epoch": 2587} {"train_loss": -12.589677810668945, "global_step": 434736, "epoch": 2587} {"train_loss": -12.392894744873047, "global_step": 434737, "epoch": 2587} {"train_loss": -12.728889465332031, "global_step": 434738, "epoch": 2587} {"train_loss": -12.435418128967285, "global_step": 434739, "epoch": 2587} {"train_loss": -12.535675048828125, "global_step": 434740, "epoch": 2587} {"train_loss": -12.6070556640625, "global_step": 434741, "epoch": 2587} {"train_loss": -12.623527526855469, "global_step": 434742, "epoch": 2587} {"train_loss": -12.725784301757812, "global_step": 434743, "epoch": 2587} {"train_loss": -12.600870132446289, "global_step": 434744, "epoch": 2587} {"train_loss": -12.632063865661621, "global_step": 434745, "epoch": 2587} {"train_loss": -12.856414794921875, "global_step": 434746, "epoch": 2587} {"train_loss": -12.65047836303711, "global_step": 434747, "epoch": 2587} {"train_loss": -12.648119926452637, "global_step": 434748, "epoch": 2587} {"train_loss": -12.513525009155273, "global_step": 434749, "epoch": 2587} {"train_loss": -12.739435195922852, "global_step": 434750, "epoch": 2587} {"train_loss": -12.684198379516602, "global_step": 434751, "epoch": 2587} {"train_loss": -12.532906532287598, "global_step": 434752, "epoch": 2587} {"train_loss": -12.69898796081543, "global_step": 434753, "epoch": 2587} {"train_loss": -12.456491470336914, "global_step": 434754, "epoch": 2587} {"train_loss": -12.707159996032715, "global_step": 434755, "epoch": 2587} {"train_loss": -12.79116439819336, "global_step": 434756, "epoch": 2587} {"train_loss": -12.648259162902832, "global_step": 434757, "epoch": 2587} {"train_loss": -12.828548431396484, "global_step": 434758, "epoch": 2587} {"train_loss": -12.445878982543945, "global_step": 434759, "epoch": 2587} {"train_loss": -12.694070816040039, "global_step": 434760, "epoch": 2587} {"train_loss": -12.638508796691895, "global_step": 434761, "epoch": 2587} {"train_loss": -12.368244171142578, "global_step": 434762, "epoch": 2587} {"train_loss": -12.445751190185547, "global_step": 434763, "epoch": 2587} {"train_loss": -13.000066757202148, "global_step": 434764, "epoch": 2587} {"train_loss": -12.556299209594727, "global_step": 434765, "epoch": 2587} {"train_loss": -12.535589218139648, "global_step": 434766, "epoch": 2587} {"train_loss": -12.302436828613281, "global_step": 434767, "epoch": 2587} {"train_loss": -12.452219009399414, "global_step": 434768, "epoch": 2587} {"train_loss": -12.164648056030273, "global_step": 434769, "epoch": 2587} {"train_loss": -11.417847633361816, "global_step": 434770, "epoch": 2587} {"train_loss": -12.593225479125977, "global_step": 434771, "epoch": 2587} {"train_loss": -12.238760948181152, "global_step": 434772, "epoch": 2587} {"train_loss": -12.33781623840332, "global_step": 434773, "epoch": 2587} {"train_loss": -12.168386459350586, "global_step": 434774, "epoch": 2587} {"train_loss": -11.861391067504883, "global_step": 434775, "epoch": 2587} {"train_loss": -12.408899307250977, "global_step": 434776, "epoch": 2587} {"train_loss": -12.275917053222656, "global_step": 434777, "epoch": 2587} {"train_loss": -11.92698860168457, "global_step": 434778, "epoch": 2587} {"train_loss": -12.508813858032227, "global_step": 434779, "epoch": 2587} {"train_loss": -12.07221794128418, "global_step": 434780, "epoch": 2587} {"train_loss": -11.117377281188965, "global_step": 434781, "epoch": 2587} {"train_loss": -12.12277603149414, "global_step": 434782, "epoch": 2587} {"train_loss": -12.14647730759212, "global_step": 434783, "epoch": 2587, "val_loss": 313070.875} {"train_loss": -10.24422836303711, "global_step": 434784, "epoch": 2588} {"train_loss": -11.956798553466797, "global_step": 434785, "epoch": 2588} {"train_loss": -10.400485038757324, "global_step": 434786, "epoch": 2588} {"train_loss": -9.55134391784668, "global_step": 434787, "epoch": 2588} {"train_loss": -10.774007797241211, "global_step": 434788, "epoch": 2588} {"train_loss": -9.492324829101562, "global_step": 434789, "epoch": 2588} {"train_loss": -7.619637489318848, "global_step": 434790, "epoch": 2588} {"train_loss": -8.088269233703613, "global_step": 434791, "epoch": 2588} {"train_loss": -9.563196182250977, "global_step": 434792, "epoch": 2588} {"train_loss": -9.155202865600586, "global_step": 434793, "epoch": 2588} {"train_loss": -9.48272705078125, "global_step": 434794, "epoch": 2588} {"train_loss": -9.63257122039795, "global_step": 434795, "epoch": 2588} {"train_loss": -8.576534271240234, "global_step": 434796, "epoch": 2588} {"train_loss": -8.404756546020508, "global_step": 434797, "epoch": 2588} {"train_loss": -8.549592018127441, "global_step": 434798, "epoch": 2588} {"train_loss": -8.851266860961914, "global_step": 434799, "epoch": 2588} {"train_loss": -9.980834007263184, "global_step": 434800, "epoch": 2588} {"train_loss": -9.204286575317383, "global_step": 434801, "epoch": 2588} {"train_loss": -9.569765090942383, "global_step": 434802, "epoch": 2588} {"train_loss": -9.182973861694336, "global_step": 434803, "epoch": 2588} {"train_loss": -9.927992820739746, "global_step": 434804, "epoch": 2588} {"train_loss": -9.473002433776855, "global_step": 434805, "epoch": 2588} {"train_loss": -9.988724708557129, "global_step": 434806, "epoch": 2588} {"train_loss": -9.930463790893555, "global_step": 434807, "epoch": 2588} {"train_loss": -10.048429489135742, "global_step": 434808, "epoch": 2588} {"train_loss": -10.268667221069336, "global_step": 434809, "epoch": 2588} {"train_loss": -11.076337814331055, "global_step": 434810, "epoch": 2588} {"train_loss": -10.323003768920898, "global_step": 434811, "epoch": 2588} {"train_loss": -10.918313980102539, "global_step": 434812, "epoch": 2588} {"train_loss": -11.103069305419922, "global_step": 434813, "epoch": 2588} {"train_loss": -11.259235382080078, "global_step": 434814, "epoch": 2588} {"train_loss": -10.686875343322754, "global_step": 434815, "epoch": 2588} {"train_loss": -11.666459083557129, "global_step": 434816, "epoch": 2588} {"train_loss": -11.729942321777344, "global_step": 434817, "epoch": 2588} {"train_loss": -12.313161849975586, "global_step": 434818, "epoch": 2588} {"train_loss": -11.633638381958008, "global_step": 434819, "epoch": 2588} {"train_loss": -11.730280876159668, "global_step": 434820, "epoch": 2588} {"train_loss": -11.483579635620117, "global_step": 434821, "epoch": 2588} {"train_loss": -11.538418769836426, "global_step": 434822, "epoch": 2588} {"train_loss": -11.533103942871094, "global_step": 434823, "epoch": 2588} {"train_loss": -11.603559494018555, "global_step": 434824, "epoch": 2588} {"train_loss": -12.073820114135742, "global_step": 434825, "epoch": 2588} {"train_loss": -11.646398544311523, "global_step": 434826, "epoch": 2588} {"train_loss": -11.759628295898438, "global_step": 434827, "epoch": 2588} {"train_loss": -11.484704971313477, "global_step": 434828, "epoch": 2588} {"train_loss": -11.94610595703125, "global_step": 434829, "epoch": 2588} {"train_loss": -12.005430221557617, "global_step": 434830, "epoch": 2588} {"train_loss": -12.180679321289062, "global_step": 434831, "epoch": 2588} {"train_loss": -11.752315521240234, "global_step": 434832, "epoch": 2588} {"train_loss": -12.263428688049316, "global_step": 434833, "epoch": 2588} {"train_loss": -11.776732444763184, "global_step": 434834, "epoch": 2588} {"train_loss": -11.808382987976074, "global_step": 434835, "epoch": 2588} {"train_loss": -11.972160339355469, "global_step": 434836, "epoch": 2588} {"train_loss": -12.175403594970703, "global_step": 434837, "epoch": 2588} {"train_loss": -12.021551132202148, "global_step": 434838, "epoch": 2588} {"train_loss": -12.40166187286377, "global_step": 434839, "epoch": 2588} {"train_loss": -11.822259902954102, "global_step": 434840, "epoch": 2588} {"train_loss": -12.0274076461792, "global_step": 434841, "epoch": 2588} {"train_loss": -12.226707458496094, "global_step": 434842, "epoch": 2588} {"train_loss": -11.94681167602539, "global_step": 434843, "epoch": 2588} {"train_loss": -12.312522888183594, "global_step": 434844, "epoch": 2588} {"train_loss": -11.972265243530273, "global_step": 434845, "epoch": 2588} {"train_loss": -12.443977355957031, "global_step": 434846, "epoch": 2588} {"train_loss": -12.327226638793945, "global_step": 434847, "epoch": 2588} {"train_loss": -12.26679801940918, "global_step": 434848, "epoch": 2588} {"train_loss": -12.292037963867188, "global_step": 434849, "epoch": 2588} {"train_loss": -12.091947555541992, "global_step": 434850, "epoch": 2588} {"train_loss": -12.43051528930664, "global_step": 434851, "epoch": 2588} {"train_loss": -12.199356079101562, "global_step": 434852, "epoch": 2588} {"train_loss": -12.239014625549316, "global_step": 434853, "epoch": 2588} {"train_loss": -12.110767364501953, "global_step": 434854, "epoch": 2588} {"train_loss": -12.384265899658203, "global_step": 434855, "epoch": 2588} {"train_loss": -12.405806541442871, "global_step": 434856, "epoch": 2588} {"train_loss": -12.4121675491333, "global_step": 434857, "epoch": 2588} {"train_loss": -12.490854263305664, "global_step": 434858, "epoch": 2588} {"train_loss": -12.483147621154785, "global_step": 434859, "epoch": 2588} {"train_loss": -12.56987190246582, "global_step": 434860, "epoch": 2588} {"train_loss": -12.662882804870605, "global_step": 434861, "epoch": 2588} {"train_loss": -12.32741928100586, "global_step": 434862, "epoch": 2588} {"train_loss": -12.602787017822266, "global_step": 434863, "epoch": 2588} {"train_loss": -12.343886375427246, "global_step": 434864, "epoch": 2588} {"train_loss": -12.74782943725586, "global_step": 434865, "epoch": 2588} {"train_loss": -12.630924224853516, "global_step": 434866, "epoch": 2588} {"train_loss": -12.519737243652344, "global_step": 434867, "epoch": 2588} {"train_loss": -12.646553993225098, "global_step": 434868, "epoch": 2588} {"train_loss": -12.364365577697754, "global_step": 434869, "epoch": 2588} {"train_loss": -12.903846740722656, "global_step": 434870, "epoch": 2588} {"train_loss": -12.168407440185547, "global_step": 434871, "epoch": 2588} {"train_loss": -12.602899551391602, "global_step": 434872, "epoch": 2588} {"train_loss": -12.322673797607422, "global_step": 434873, "epoch": 2588} {"train_loss": -12.648910522460938, "global_step": 434874, "epoch": 2588} {"train_loss": -12.566522598266602, "global_step": 434875, "epoch": 2588} {"train_loss": -12.507660865783691, "global_step": 434876, "epoch": 2588} {"train_loss": -12.710176467895508, "global_step": 434877, "epoch": 2588} {"train_loss": -11.982105255126953, "global_step": 434878, "epoch": 2588} {"train_loss": -12.626331329345703, "global_step": 434879, "epoch": 2588} {"train_loss": -12.367313385009766, "global_step": 434880, "epoch": 2588} {"train_loss": -12.454662322998047, "global_step": 434881, "epoch": 2588} {"train_loss": -12.263246536254883, "global_step": 434882, "epoch": 2588} {"train_loss": -12.104351043701172, "global_step": 434883, "epoch": 2588} {"train_loss": -12.447389602661133, "global_step": 434884, "epoch": 2588} {"train_loss": -12.006629943847656, "global_step": 434885, "epoch": 2588} {"train_loss": -12.101234436035156, "global_step": 434886, "epoch": 2588} {"train_loss": -12.182964324951172, "global_step": 434887, "epoch": 2588} {"train_loss": -12.003009796142578, "global_step": 434888, "epoch": 2588} {"train_loss": -12.607556343078613, "global_step": 434889, "epoch": 2588} {"train_loss": -11.461416244506836, "global_step": 434890, "epoch": 2588} {"train_loss": -12.194737434387207, "global_step": 434891, "epoch": 2588} {"train_loss": -11.765838623046875, "global_step": 434892, "epoch": 2588} {"train_loss": -12.654878616333008, "global_step": 434893, "epoch": 2588} {"train_loss": -12.184446334838867, "global_step": 434894, "epoch": 2588} {"train_loss": -12.290414810180664, "global_step": 434895, "epoch": 2588} {"train_loss": -12.401211738586426, "global_step": 434896, "epoch": 2588} {"train_loss": -12.292596817016602, "global_step": 434897, "epoch": 2588} {"train_loss": -12.340249061584473, "global_step": 434898, "epoch": 2588} {"train_loss": -12.291885375976562, "global_step": 434899, "epoch": 2588} {"train_loss": -12.44466781616211, "global_step": 434900, "epoch": 2588} {"train_loss": -12.244195938110352, "global_step": 434901, "epoch": 2588} {"train_loss": -12.227685928344727, "global_step": 434902, "epoch": 2588} {"train_loss": -11.943028450012207, "global_step": 434903, "epoch": 2588} {"train_loss": -12.17574691772461, "global_step": 434904, "epoch": 2588} {"train_loss": -12.578271865844727, "global_step": 434905, "epoch": 2588} {"train_loss": -12.378946304321289, "global_step": 434906, "epoch": 2588} {"train_loss": -12.66363525390625, "global_step": 434907, "epoch": 2588} {"train_loss": -12.698477745056152, "global_step": 434908, "epoch": 2588} {"train_loss": -12.771337509155273, "global_step": 434909, "epoch": 2588} {"train_loss": -12.450679779052734, "global_step": 434910, "epoch": 2588} {"train_loss": -12.677984237670898, "global_step": 434911, "epoch": 2588} {"train_loss": -12.79145336151123, "global_step": 434912, "epoch": 2588} {"train_loss": -12.609781265258789, "global_step": 434913, "epoch": 2588} {"train_loss": -12.718856811523438, "global_step": 434914, "epoch": 2588} {"train_loss": -12.702274322509766, "global_step": 434915, "epoch": 2588} {"train_loss": -12.853164672851562, "global_step": 434916, "epoch": 2588} {"train_loss": -12.68360710144043, "global_step": 434917, "epoch": 2588} {"train_loss": -12.754745483398438, "global_step": 434918, "epoch": 2588} {"train_loss": -12.767265319824219, "global_step": 434919, "epoch": 2588} {"train_loss": -12.891695022583008, "global_step": 434920, "epoch": 2588} {"train_loss": -12.69879150390625, "global_step": 434921, "epoch": 2588} {"train_loss": -12.61532974243164, "global_step": 434922, "epoch": 2588} {"train_loss": -12.87479305267334, "global_step": 434923, "epoch": 2588} {"train_loss": -12.655261993408203, "global_step": 434924, "epoch": 2588} {"train_loss": -11.630326271057129, "global_step": 434925, "epoch": 2588} {"train_loss": -12.00511646270752, "global_step": 434926, "epoch": 2588} {"train_loss": -12.435623168945312, "global_step": 434927, "epoch": 2588} {"train_loss": -12.865081787109375, "global_step": 434928, "epoch": 2588} {"train_loss": -12.599305152893066, "global_step": 434929, "epoch": 2588} {"train_loss": -12.648545265197754, "global_step": 434930, "epoch": 2588} {"train_loss": -12.813749313354492, "global_step": 434931, "epoch": 2588} {"train_loss": -12.891873359680176, "global_step": 434932, "epoch": 2588} {"train_loss": -12.68676471710205, "global_step": 434933, "epoch": 2588} {"train_loss": -12.63545036315918, "global_step": 434934, "epoch": 2588} {"train_loss": -12.610353469848633, "global_step": 434935, "epoch": 2588} {"train_loss": -12.649383544921875, "global_step": 434936, "epoch": 2588} {"train_loss": -12.470026016235352, "global_step": 434937, "epoch": 2588} {"train_loss": -12.70129108428955, "global_step": 434938, "epoch": 2588} {"train_loss": -12.648117065429688, "global_step": 434939, "epoch": 2588} {"train_loss": -12.779139518737793, "global_step": 434940, "epoch": 2588} {"train_loss": -12.637429237365723, "global_step": 434941, "epoch": 2588} {"train_loss": -12.558704376220703, "global_step": 434942, "epoch": 2588} {"train_loss": -12.09187126159668, "global_step": 434943, "epoch": 2588} {"train_loss": -12.734140396118164, "global_step": 434944, "epoch": 2588} {"train_loss": -12.672426223754883, "global_step": 434945, "epoch": 2588} {"train_loss": -11.989459991455078, "global_step": 434946, "epoch": 2588} {"train_loss": -12.783635139465332, "global_step": 434947, "epoch": 2588} {"train_loss": -12.466571807861328, "global_step": 434948, "epoch": 2588} {"train_loss": -12.911567687988281, "global_step": 434949, "epoch": 2588} {"train_loss": -12.276708602905273, "global_step": 434950, "epoch": 2588} {"train_loss": -11.85213009516398, "global_step": 434951, "epoch": 2588, "val_loss": 310655.875} {"train_loss": -12.47719955444336, "global_step": 434952, "epoch": 2589} {"train_loss": -12.92121696472168, "global_step": 434953, "epoch": 2589} {"train_loss": -12.349082946777344, "global_step": 434954, "epoch": 2589} {"train_loss": -12.779239654541016, "global_step": 434955, "epoch": 2589} {"train_loss": -12.391550064086914, "global_step": 434956, "epoch": 2589} {"train_loss": -12.095065116882324, "global_step": 434957, "epoch": 2589} {"train_loss": -11.924042701721191, "global_step": 434958, "epoch": 2589} {"train_loss": -11.166629791259766, "global_step": 434959, "epoch": 2589} {"train_loss": -11.675046920776367, "global_step": 434960, "epoch": 2589} {"train_loss": -12.630498886108398, "global_step": 434961, "epoch": 2589} {"train_loss": -10.96870231628418, "global_step": 434962, "epoch": 2589} {"train_loss": -12.125368118286133, "global_step": 434963, "epoch": 2589} {"train_loss": -12.09065055847168, "global_step": 434964, "epoch": 2589} {"train_loss": -11.494739532470703, "global_step": 434965, "epoch": 2589} {"train_loss": -11.928812026977539, "global_step": 434966, "epoch": 2589} {"train_loss": -12.407012939453125, "global_step": 434967, "epoch": 2589} {"train_loss": -10.7957763671875, "global_step": 434968, "epoch": 2589} {"train_loss": -11.231443405151367, "global_step": 434969, "epoch": 2589} {"train_loss": -11.945561408996582, "global_step": 434970, "epoch": 2589} {"train_loss": -10.752372741699219, "global_step": 434971, "epoch": 2589} {"train_loss": -11.6055908203125, "global_step": 434972, "epoch": 2589} {"train_loss": -11.531492233276367, "global_step": 434973, "epoch": 2589} {"train_loss": -12.445951461791992, "global_step": 434974, "epoch": 2589} {"train_loss": -11.909555435180664, "global_step": 434975, "epoch": 2589} {"train_loss": -12.228874206542969, "global_step": 434976, "epoch": 2589} {"train_loss": -12.0423583984375, "global_step": 434977, "epoch": 2589} {"train_loss": -12.451665878295898, "global_step": 434978, "epoch": 2589} {"train_loss": -12.394346237182617, "global_step": 434979, "epoch": 2589} {"train_loss": -12.392526626586914, "global_step": 434980, "epoch": 2589} {"train_loss": -12.550256729125977, "global_step": 434981, "epoch": 2589} {"train_loss": -12.315911293029785, "global_step": 434982, "epoch": 2589} {"train_loss": -12.445598602294922, "global_step": 434983, "epoch": 2589} {"train_loss": -12.071259498596191, "global_step": 434984, "epoch": 2589} {"train_loss": -12.259459495544434, "global_step": 434985, "epoch": 2589} {"train_loss": -12.575881004333496, "global_step": 434986, "epoch": 2589} {"train_loss": -11.833667755126953, "global_step": 434987, "epoch": 2589} {"train_loss": -11.992155075073242, "global_step": 434988, "epoch": 2589} {"train_loss": -12.457782745361328, "global_step": 434989, "epoch": 2589} {"train_loss": -11.341582298278809, "global_step": 434990, "epoch": 2589} {"train_loss": -12.162349700927734, "global_step": 434991, "epoch": 2589} {"train_loss": -12.365952491760254, "global_step": 434992, "epoch": 2589} {"train_loss": -12.358009338378906, "global_step": 434993, "epoch": 2589} {"train_loss": -11.908571243286133, "global_step": 434994, "epoch": 2589} {"train_loss": -12.43591022491455, "global_step": 434995, "epoch": 2589} {"train_loss": -12.422978401184082, "global_step": 434996, "epoch": 2589} {"train_loss": -12.541532516479492, "global_step": 434997, "epoch": 2589} {"train_loss": -12.240913391113281, "global_step": 434998, "epoch": 2589} {"train_loss": -11.716588973999023, "global_step": 434999, "epoch": 2589} {"train_loss": -12.150250434875488, "global_step": 435000, "epoch": 2589} {"train_loss": -12.344287872314453, "global_step": 435001, "epoch": 2589} {"train_loss": -12.212265014648438, "global_step": 435002, "epoch": 2589} {"train_loss": -12.387771606445312, "global_step": 435003, "epoch": 2589} {"train_loss": -12.025975227355957, "global_step": 435004, "epoch": 2589} {"train_loss": -12.442179679870605, "global_step": 435005, "epoch": 2589} {"train_loss": -12.107101440429688, "global_step": 435006, "epoch": 2589} {"train_loss": -12.142171859741211, "global_step": 435007, "epoch": 2589} {"train_loss": -12.051610946655273, "global_step": 435008, "epoch": 2589} {"train_loss": -12.688833236694336, "global_step": 435009, "epoch": 2589} {"train_loss": -12.014073371887207, "global_step": 435010, "epoch": 2589} {"train_loss": -12.349411010742188, "global_step": 435011, "epoch": 2589} {"train_loss": -12.007675170898438, "global_step": 435012, "epoch": 2589} {"train_loss": -12.370594024658203, "global_step": 435013, "epoch": 2589} {"train_loss": -12.086278915405273, "global_step": 435014, "epoch": 2589} {"train_loss": -12.259109497070312, "global_step": 435015, "epoch": 2589} {"train_loss": -12.527100563049316, "global_step": 435016, "epoch": 2589} {"train_loss": -12.572317123413086, "global_step": 435017, "epoch": 2589} {"train_loss": -12.457971572875977, "global_step": 435018, "epoch": 2589} {"train_loss": -12.092694282531738, "global_step": 435019, "epoch": 2589} {"train_loss": -12.67837905883789, "global_step": 435020, "epoch": 2589} {"train_loss": -12.438989639282227, "global_step": 435021, "epoch": 2589} {"train_loss": -12.310091018676758, "global_step": 435022, "epoch": 2589} {"train_loss": -12.035306930541992, "global_step": 435023, "epoch": 2589} {"train_loss": -12.62979507446289, "global_step": 435024, "epoch": 2589} {"train_loss": -12.236163139343262, "global_step": 435025, "epoch": 2589} {"train_loss": -11.835413932800293, "global_step": 435026, "epoch": 2589} {"train_loss": -12.633172988891602, "global_step": 435027, "epoch": 2589} {"train_loss": -12.06964111328125, "global_step": 435028, "epoch": 2589} {"train_loss": -11.94585132598877, "global_step": 435029, "epoch": 2589} {"train_loss": -12.443828582763672, "global_step": 435030, "epoch": 2589} {"train_loss": -11.891948699951172, "global_step": 435031, "epoch": 2589} {"train_loss": -11.80902099609375, "global_step": 435032, "epoch": 2589} {"train_loss": -12.386100769042969, "global_step": 435033, "epoch": 2589} {"train_loss": -11.392358779907227, "global_step": 435034, "epoch": 2589} {"train_loss": -11.79210090637207, "global_step": 435035, "epoch": 2589} {"train_loss": -12.173717498779297, "global_step": 435036, "epoch": 2589} {"train_loss": -11.84974479675293, "global_step": 435037, "epoch": 2589} {"train_loss": -10.906296730041504, "global_step": 435038, "epoch": 2589} {"train_loss": -12.10519790649414, "global_step": 435039, "epoch": 2589} {"train_loss": -11.612890243530273, "global_step": 435040, "epoch": 2589} {"train_loss": -12.142349243164062, "global_step": 435041, "epoch": 2589} {"train_loss": -10.953019142150879, "global_step": 435042, "epoch": 2589} {"train_loss": -12.272563934326172, "global_step": 435043, "epoch": 2589} {"train_loss": -11.7537841796875, "global_step": 435044, "epoch": 2589} {"train_loss": -12.526525497436523, "global_step": 435045, "epoch": 2589} {"train_loss": -11.596521377563477, "global_step": 435046, "epoch": 2589} {"train_loss": -12.582371711730957, "global_step": 435047, "epoch": 2589} {"train_loss": -12.019648551940918, "global_step": 435048, "epoch": 2589} {"train_loss": -12.303844451904297, "global_step": 435049, "epoch": 2589} {"train_loss": -12.149800300598145, "global_step": 435050, "epoch": 2589} {"train_loss": -11.960721015930176, "global_step": 435051, "epoch": 2589} {"train_loss": -11.796875953674316, "global_step": 435052, "epoch": 2589} {"train_loss": -11.688179969787598, "global_step": 435053, "epoch": 2589} {"train_loss": -11.794150352478027, "global_step": 435054, "epoch": 2589} {"train_loss": -10.887317657470703, "global_step": 435055, "epoch": 2589} {"train_loss": -11.801743507385254, "global_step": 435056, "epoch": 2589} {"train_loss": -11.892313003540039, "global_step": 435057, "epoch": 2589} {"train_loss": -11.57960319519043, "global_step": 435058, "epoch": 2589} {"train_loss": -12.195244789123535, "global_step": 435059, "epoch": 2589} {"train_loss": -11.156028747558594, "global_step": 435060, "epoch": 2589} {"train_loss": -11.151535987854004, "global_step": 435061, "epoch": 2589} {"train_loss": -11.78018569946289, "global_step": 435062, "epoch": 2589} {"train_loss": -11.270339965820312, "global_step": 435063, "epoch": 2589} {"train_loss": -11.35057258605957, "global_step": 435064, "epoch": 2589} {"train_loss": -11.928794860839844, "global_step": 435065, "epoch": 2589} {"train_loss": -11.759695053100586, "global_step": 435066, "epoch": 2589} {"train_loss": -11.862693786621094, "global_step": 435067, "epoch": 2589} {"train_loss": -11.20236587524414, "global_step": 435068, "epoch": 2589} {"train_loss": -11.995233535766602, "global_step": 435069, "epoch": 2589} {"train_loss": -11.362527847290039, "global_step": 435070, "epoch": 2589} {"train_loss": -12.391796112060547, "global_step": 435071, "epoch": 2589} {"train_loss": -11.820927619934082, "global_step": 435072, "epoch": 2589} {"train_loss": -11.992269515991211, "global_step": 435073, "epoch": 2589} {"train_loss": -11.961898803710938, "global_step": 435074, "epoch": 2589} {"train_loss": -12.005545616149902, "global_step": 435075, "epoch": 2589} {"train_loss": -12.263236999511719, "global_step": 435076, "epoch": 2589} {"train_loss": -11.920753479003906, "global_step": 435077, "epoch": 2589} {"train_loss": -12.617818832397461, "global_step": 435078, "epoch": 2589} {"train_loss": -11.933239936828613, "global_step": 435079, "epoch": 2589} {"train_loss": -12.316652297973633, "global_step": 435080, "epoch": 2589} {"train_loss": -12.20405101776123, "global_step": 435081, "epoch": 2589} {"train_loss": -12.365198135375977, "global_step": 435082, "epoch": 2589} {"train_loss": -12.207998275756836, "global_step": 435083, "epoch": 2589} {"train_loss": -12.014440536499023, "global_step": 435084, "epoch": 2589} {"train_loss": -11.891984939575195, "global_step": 435085, "epoch": 2589} {"train_loss": -12.124597549438477, "global_step": 435086, "epoch": 2589} {"train_loss": -11.643667221069336, "global_step": 435087, "epoch": 2589} {"train_loss": -12.10574722290039, "global_step": 435088, "epoch": 2589} {"train_loss": -11.602838516235352, "global_step": 435089, "epoch": 2589} {"train_loss": -12.128366470336914, "global_step": 435090, "epoch": 2589} {"train_loss": -11.715723037719727, "global_step": 435091, "epoch": 2589} {"train_loss": -11.295136451721191, "global_step": 435092, "epoch": 2589} {"train_loss": -11.656996726989746, "global_step": 435093, "epoch": 2589} {"train_loss": -11.823699951171875, "global_step": 435094, "epoch": 2589} {"train_loss": -11.724964141845703, "global_step": 435095, "epoch": 2589} {"train_loss": -11.526362419128418, "global_step": 435096, "epoch": 2589} {"train_loss": -12.124181747436523, "global_step": 435097, "epoch": 2589} {"train_loss": -11.806255340576172, "global_step": 435098, "epoch": 2589} {"train_loss": -12.364879608154297, "global_step": 435099, "epoch": 2589} {"train_loss": -11.331016540527344, "global_step": 435100, "epoch": 2589} {"train_loss": -11.645074844360352, "global_step": 435101, "epoch": 2589} {"train_loss": -12.05494499206543, "global_step": 435102, "epoch": 2589} {"train_loss": -11.280193328857422, "global_step": 435103, "epoch": 2589} {"train_loss": -12.588663101196289, "global_step": 435104, "epoch": 2589} {"train_loss": -11.36039924621582, "global_step": 435105, "epoch": 2589} {"train_loss": -12.207796096801758, "global_step": 435106, "epoch": 2589} {"train_loss": -11.802780151367188, "global_step": 435107, "epoch": 2589} {"train_loss": -12.217379570007324, "global_step": 435108, "epoch": 2589} {"train_loss": -11.970572471618652, "global_step": 435109, "epoch": 2589} {"train_loss": -11.854857444763184, "global_step": 435110, "epoch": 2589} {"train_loss": -12.275040626525879, "global_step": 435111, "epoch": 2589} {"train_loss": -11.683349609375, "global_step": 435112, "epoch": 2589} {"train_loss": -12.377500534057617, "global_step": 435113, "epoch": 2589} {"train_loss": -12.354342460632324, "global_step": 435114, "epoch": 2589} {"train_loss": -12.172076225280762, "global_step": 435115, "epoch": 2589} {"train_loss": -12.526487350463867, "global_step": 435116, "epoch": 2589} {"train_loss": -12.392901420593262, "global_step": 435117, "epoch": 2589} {"train_loss": -12.361076354980469, "global_step": 435118, "epoch": 2589} {"train_loss": -12.018125454584757, "global_step": 435119, "epoch": 2589, "val_loss": 309881.5625} {"train_loss": -12.394355773925781, "global_step": 435120, "epoch": 2590} {"train_loss": -12.547231674194336, "global_step": 435121, "epoch": 2590} {"train_loss": -12.473810195922852, "global_step": 435122, "epoch": 2590} {"train_loss": -12.611040115356445, "global_step": 435123, "epoch": 2590} {"train_loss": -12.484169006347656, "global_step": 435124, "epoch": 2590} {"train_loss": -12.459875106811523, "global_step": 435125, "epoch": 2590} {"train_loss": -12.642168045043945, "global_step": 435126, "epoch": 2590} {"train_loss": -12.239201545715332, "global_step": 435127, "epoch": 2590} {"train_loss": -12.596833229064941, "global_step": 435128, "epoch": 2590} {"train_loss": -12.538339614868164, "global_step": 435129, "epoch": 2590} {"train_loss": -12.515218734741211, "global_step": 435130, "epoch": 2590} {"train_loss": -12.623086929321289, "global_step": 435131, "epoch": 2590} {"train_loss": -12.51059341430664, "global_step": 435132, "epoch": 2590} {"train_loss": -12.692022323608398, "global_step": 435133, "epoch": 2590} {"train_loss": -12.452062606811523, "global_step": 435134, "epoch": 2590} {"train_loss": -12.775074005126953, "global_step": 435135, "epoch": 2590} {"train_loss": -12.610666275024414, "global_step": 435136, "epoch": 2590} {"train_loss": -12.603841781616211, "global_step": 435137, "epoch": 2590} {"train_loss": -12.853898048400879, "global_step": 435138, "epoch": 2590} {"train_loss": -12.278105735778809, "global_step": 435139, "epoch": 2590} {"train_loss": -12.656654357910156, "global_step": 435140, "epoch": 2590} {"train_loss": -12.56995964050293, "global_step": 435141, "epoch": 2590} {"train_loss": -12.361183166503906, "global_step": 435142, "epoch": 2590} {"train_loss": -12.503290176391602, "global_step": 435143, "epoch": 2590} {"train_loss": -12.787819862365723, "global_step": 435144, "epoch": 2590} {"train_loss": -12.704944610595703, "global_step": 435145, "epoch": 2590} {"train_loss": -12.356412887573242, "global_step": 435146, "epoch": 2590} {"train_loss": -12.448516845703125, "global_step": 435147, "epoch": 2590} {"train_loss": -12.325913429260254, "global_step": 435148, "epoch": 2590} {"train_loss": -12.483552932739258, "global_step": 435149, "epoch": 2590} {"train_loss": -12.463335037231445, "global_step": 435150, "epoch": 2590} {"train_loss": -11.898560523986816, "global_step": 435151, "epoch": 2590} {"train_loss": -12.58237361907959, "global_step": 435152, "epoch": 2590} {"train_loss": -12.278766632080078, "global_step": 435153, "epoch": 2590} {"train_loss": -12.267735481262207, "global_step": 435154, "epoch": 2590} {"train_loss": -12.26961898803711, "global_step": 435155, "epoch": 2590} {"train_loss": -10.745222091674805, "global_step": 435156, "epoch": 2590} {"train_loss": -12.43124008178711, "global_step": 435157, "epoch": 2590} {"train_loss": -12.185945510864258, "global_step": 435158, "epoch": 2590} {"train_loss": -11.752248764038086, "global_step": 435159, "epoch": 2590} {"train_loss": -11.637619972229004, "global_step": 435160, "epoch": 2590} {"train_loss": -11.086669921875, "global_step": 435161, "epoch": 2590} {"train_loss": -11.790587425231934, "global_step": 435162, "epoch": 2590} {"train_loss": -12.157268524169922, "global_step": 435163, "epoch": 2590} {"train_loss": -11.224552154541016, "global_step": 435164, "epoch": 2590} {"train_loss": -12.261577606201172, "global_step": 435165, "epoch": 2590} {"train_loss": -12.34113597869873, "global_step": 435166, "epoch": 2590} {"train_loss": -12.576078414916992, "global_step": 435167, "epoch": 2590} {"train_loss": -12.448711395263672, "global_step": 435168, "epoch": 2590} {"train_loss": -12.352773666381836, "global_step": 435169, "epoch": 2590} {"train_loss": -12.493364334106445, "global_step": 435170, "epoch": 2590} {"train_loss": -12.269320487976074, "global_step": 435171, "epoch": 2590} {"train_loss": -12.4879732131958, "global_step": 435172, "epoch": 2590} {"train_loss": -12.60408878326416, "global_step": 435173, "epoch": 2590} {"train_loss": -12.518522262573242, "global_step": 435174, "epoch": 2590} {"train_loss": -12.344303131103516, "global_step": 435175, "epoch": 2590} {"train_loss": -12.588621139526367, "global_step": 435176, "epoch": 2590} {"train_loss": -12.50058364868164, "global_step": 435177, "epoch": 2590} {"train_loss": -12.339961051940918, "global_step": 435178, "epoch": 2590} {"train_loss": -12.545703887939453, "global_step": 435179, "epoch": 2590} {"train_loss": -12.356502532958984, "global_step": 435180, "epoch": 2590} {"train_loss": -12.53727912902832, "global_step": 435181, "epoch": 2590} {"train_loss": -12.195161819458008, "global_step": 435182, "epoch": 2590} {"train_loss": -12.571338653564453, "global_step": 435183, "epoch": 2590} {"train_loss": -12.124229431152344, "global_step": 435184, "epoch": 2590} {"train_loss": -12.451126098632812, "global_step": 435185, "epoch": 2590} {"train_loss": -12.131799697875977, "global_step": 435186, "epoch": 2590} {"train_loss": -12.601753234863281, "global_step": 435187, "epoch": 2590} {"train_loss": -12.279608726501465, "global_step": 435188, "epoch": 2590} {"train_loss": -12.501782417297363, "global_step": 435189, "epoch": 2590} {"train_loss": -12.198429107666016, "global_step": 435190, "epoch": 2590} {"train_loss": -12.419367790222168, "global_step": 435191, "epoch": 2590} {"train_loss": -12.711029052734375, "global_step": 435192, "epoch": 2590} {"train_loss": -12.382437705993652, "global_step": 435193, "epoch": 2590} {"train_loss": -12.702667236328125, "global_step": 435194, "epoch": 2590} {"train_loss": -12.353269577026367, "global_step": 435195, "epoch": 2590} {"train_loss": -12.77538013458252, "global_step": 435196, "epoch": 2590} {"train_loss": -12.568488121032715, "global_step": 435197, "epoch": 2590} {"train_loss": -12.66387939453125, "global_step": 435198, "epoch": 2590} {"train_loss": -12.732149124145508, "global_step": 435199, "epoch": 2590} {"train_loss": -12.439854621887207, "global_step": 435200, "epoch": 2590} {"train_loss": -12.596275329589844, "global_step": 435201, "epoch": 2590} {"train_loss": -12.542795181274414, "global_step": 435202, "epoch": 2590} {"train_loss": -12.412734985351562, "global_step": 435203, "epoch": 2590} {"train_loss": -12.516987800598145, "global_step": 435204, "epoch": 2590} {"train_loss": -12.594245910644531, "global_step": 435205, "epoch": 2590} {"train_loss": -12.49956226348877, "global_step": 435206, "epoch": 2590} {"train_loss": -12.555154800415039, "global_step": 435207, "epoch": 2590} {"train_loss": -12.455875396728516, "global_step": 435208, "epoch": 2590} {"train_loss": -12.198668479919434, "global_step": 435209, "epoch": 2590} {"train_loss": -12.833353996276855, "global_step": 435210, "epoch": 2590} {"train_loss": -12.108552932739258, "global_step": 435211, "epoch": 2590} {"train_loss": -12.38763427734375, "global_step": 435212, "epoch": 2590} {"train_loss": -12.269721031188965, "global_step": 435213, "epoch": 2590} {"train_loss": -12.482992172241211, "global_step": 435214, "epoch": 2590} {"train_loss": -12.664048194885254, "global_step": 435215, "epoch": 2590} {"train_loss": -12.280317306518555, "global_step": 435216, "epoch": 2590} {"train_loss": -12.39753532409668, "global_step": 435217, "epoch": 2590} {"train_loss": -12.333477020263672, "global_step": 435218, "epoch": 2590} {"train_loss": -12.336585998535156, "global_step": 435219, "epoch": 2590} {"train_loss": -11.86985969543457, "global_step": 435220, "epoch": 2590} {"train_loss": -12.70094108581543, "global_step": 435221, "epoch": 2590} {"train_loss": -11.043954849243164, "global_step": 435222, "epoch": 2590} {"train_loss": -12.599319458007812, "global_step": 435223, "epoch": 2590} {"train_loss": -11.743368148803711, "global_step": 435224, "epoch": 2590} {"train_loss": -12.352944374084473, "global_step": 435225, "epoch": 2590} {"train_loss": -12.67054557800293, "global_step": 435226, "epoch": 2590} {"train_loss": -12.296218872070312, "global_step": 435227, "epoch": 2590} {"train_loss": -12.419027328491211, "global_step": 435228, "epoch": 2590} {"train_loss": -11.891322135925293, "global_step": 435229, "epoch": 2590} {"train_loss": -12.805692672729492, "global_step": 435230, "epoch": 2590} {"train_loss": -11.76662826538086, "global_step": 435231, "epoch": 2590} {"train_loss": -11.157529830932617, "global_step": 435232, "epoch": 2590} {"train_loss": -12.480368614196777, "global_step": 435233, "epoch": 2590} {"train_loss": -11.45654296875, "global_step": 435234, "epoch": 2590} {"train_loss": -10.121431350708008, "global_step": 435235, "epoch": 2590} {"train_loss": -11.272687911987305, "global_step": 435236, "epoch": 2590} {"train_loss": -10.631448745727539, "global_step": 435237, "epoch": 2590} {"train_loss": -11.753219604492188, "global_step": 435238, "epoch": 2590} {"train_loss": -10.022644996643066, "global_step": 435239, "epoch": 2590} {"train_loss": -11.555266380310059, "global_step": 435240, "epoch": 2590} {"train_loss": -11.679512023925781, "global_step": 435241, "epoch": 2590} {"train_loss": -11.52680492401123, "global_step": 435242, "epoch": 2590} {"train_loss": -11.599447250366211, "global_step": 435243, "epoch": 2590} {"train_loss": -11.433850288391113, "global_step": 435244, "epoch": 2590} {"train_loss": -12.109615325927734, "global_step": 435245, "epoch": 2590} {"train_loss": -12.16235637664795, "global_step": 435246, "epoch": 2590} {"train_loss": -11.44338607788086, "global_step": 435247, "epoch": 2590} {"train_loss": -12.217735290527344, "global_step": 435248, "epoch": 2590} {"train_loss": -11.909419059753418, "global_step": 435249, "epoch": 2590} {"train_loss": -11.646303176879883, "global_step": 435250, "epoch": 2590} {"train_loss": -12.105463027954102, "global_step": 435251, "epoch": 2590} {"train_loss": -11.830198287963867, "global_step": 435252, "epoch": 2590} {"train_loss": -10.268491744995117, "global_step": 435253, "epoch": 2590} {"train_loss": -11.76784896850586, "global_step": 435254, "epoch": 2590} {"train_loss": -9.805425643920898, "global_step": 435255, "epoch": 2590} {"train_loss": -10.608148574829102, "global_step": 435256, "epoch": 2590} {"train_loss": -11.667627334594727, "global_step": 435257, "epoch": 2590} {"train_loss": -10.43315315246582, "global_step": 435258, "epoch": 2590} {"train_loss": -10.910518646240234, "global_step": 435259, "epoch": 2590} {"train_loss": -11.331933975219727, "global_step": 435260, "epoch": 2590} {"train_loss": -10.544857025146484, "global_step": 435261, "epoch": 2590} {"train_loss": -9.906461715698242, "global_step": 435262, "epoch": 2590} {"train_loss": -10.82852554321289, "global_step": 435263, "epoch": 2590} {"train_loss": -10.474502563476562, "global_step": 435264, "epoch": 2590} {"train_loss": -10.214105606079102, "global_step": 435265, "epoch": 2590} {"train_loss": -9.731943130493164, "global_step": 435266, "epoch": 2590} {"train_loss": -10.700141906738281, "global_step": 435267, "epoch": 2590} {"train_loss": -11.32308578491211, "global_step": 435268, "epoch": 2590} {"train_loss": -11.161556243896484, "global_step": 435269, "epoch": 2590} {"train_loss": -11.788904190063477, "global_step": 435270, "epoch": 2590} {"train_loss": -11.250459671020508, "global_step": 435271, "epoch": 2590} {"train_loss": -11.765769958496094, "global_step": 435272, "epoch": 2590} {"train_loss": -11.468149185180664, "global_step": 435273, "epoch": 2590} {"train_loss": -11.369239807128906, "global_step": 435274, "epoch": 2590} {"train_loss": -10.949185371398926, "global_step": 435275, "epoch": 2590} {"train_loss": -11.77625560760498, "global_step": 435276, "epoch": 2590} {"train_loss": -11.800155639648438, "global_step": 435277, "epoch": 2590} {"train_loss": -11.174225807189941, "global_step": 435278, "epoch": 2590} {"train_loss": -12.03493595123291, "global_step": 435279, "epoch": 2590} {"train_loss": -10.910255432128906, "global_step": 435280, "epoch": 2590} {"train_loss": -11.955591201782227, "global_step": 435281, "epoch": 2590} {"train_loss": -11.855209350585938, "global_step": 435282, "epoch": 2590} {"train_loss": -11.724499702453613, "global_step": 435283, "epoch": 2590} {"train_loss": -12.461872100830078, "global_step": 435284, "epoch": 2590} {"train_loss": -11.68149185180664, "global_step": 435285, "epoch": 2590} {"train_loss": -12.06899642944336, "global_step": 435286, "epoch": 2590} {"train_loss": -12.020710201490493, "global_step": 435287, "epoch": 2590, "val_loss": 302885.5625, "train_action_mse_error": 2.3648428916931152} {"train_loss": -12.159832000732422, "global_step": 435288, "epoch": 2591} {"train_loss": -11.984167098999023, "global_step": 435289, "epoch": 2591} {"train_loss": -12.108531951904297, "global_step": 435290, "epoch": 2591} {"train_loss": -11.83252239227295, "global_step": 435291, "epoch": 2591} {"train_loss": -12.156892776489258, "global_step": 435292, "epoch": 2591} {"train_loss": -12.111434936523438, "global_step": 435293, "epoch": 2591} {"train_loss": -11.953500747680664, "global_step": 435294, "epoch": 2591} {"train_loss": -12.550976753234863, "global_step": 435295, "epoch": 2591} {"train_loss": -12.2512788772583, "global_step": 435296, "epoch": 2591} {"train_loss": -12.36459732055664, "global_step": 435297, "epoch": 2591} {"train_loss": -12.596662521362305, "global_step": 435298, "epoch": 2591} {"train_loss": -12.486824989318848, "global_step": 435299, "epoch": 2591} {"train_loss": -12.593253135681152, "global_step": 435300, "epoch": 2591} {"train_loss": -12.437872886657715, "global_step": 435301, "epoch": 2591} {"train_loss": -12.425968170166016, "global_step": 435302, "epoch": 2591} {"train_loss": -12.483821868896484, "global_step": 435303, "epoch": 2591} {"train_loss": -12.608267784118652, "global_step": 435304, "epoch": 2591} {"train_loss": -12.646444320678711, "global_step": 435305, "epoch": 2591} {"train_loss": -12.518985748291016, "global_step": 435306, "epoch": 2591} {"train_loss": -12.409610748291016, "global_step": 435307, "epoch": 2591} {"train_loss": -12.550394058227539, "global_step": 435308, "epoch": 2591} {"train_loss": -12.516864776611328, "global_step": 435309, "epoch": 2591} {"train_loss": -12.500600814819336, "global_step": 435310, "epoch": 2591} {"train_loss": -12.541117668151855, "global_step": 435311, "epoch": 2591} {"train_loss": -12.706235885620117, "global_step": 435312, "epoch": 2591} {"train_loss": -12.683648109436035, "global_step": 435313, "epoch": 2591} {"train_loss": -12.666587829589844, "global_step": 435314, "epoch": 2591} {"train_loss": -12.659502029418945, "global_step": 435315, "epoch": 2591} {"train_loss": -12.560453414916992, "global_step": 435316, "epoch": 2591} {"train_loss": -12.694723129272461, "global_step": 435317, "epoch": 2591} {"train_loss": -12.719097137451172, "global_step": 435318, "epoch": 2591} {"train_loss": -12.821857452392578, "global_step": 435319, "epoch": 2591} {"train_loss": -12.833969116210938, "global_step": 435320, "epoch": 2591} {"train_loss": -12.739053726196289, "global_step": 435321, "epoch": 2591} {"train_loss": -12.801872253417969, "global_step": 435322, "epoch": 2591} {"train_loss": -12.759246826171875, "global_step": 435323, "epoch": 2591} {"train_loss": -12.786865234375, "global_step": 435324, "epoch": 2591} {"train_loss": -12.970590591430664, "global_step": 435325, "epoch": 2591} {"train_loss": -12.857824325561523, "global_step": 435326, "epoch": 2591} {"train_loss": -12.925750732421875, "global_step": 435327, "epoch": 2591} {"train_loss": -12.956260681152344, "global_step": 435328, "epoch": 2591} {"train_loss": -12.877237319946289, "global_step": 435329, "epoch": 2591} {"train_loss": -12.929304122924805, "global_step": 435330, "epoch": 2591} {"train_loss": -12.784327507019043, "global_step": 435331, "epoch": 2591} {"train_loss": -12.88235855102539, "global_step": 435332, "epoch": 2591} {"train_loss": -12.684797286987305, "global_step": 435333, "epoch": 2591} {"train_loss": -12.90109634399414, "global_step": 435334, "epoch": 2591} {"train_loss": -12.925193786621094, "global_step": 435335, "epoch": 2591} {"train_loss": -12.677419662475586, "global_step": 435336, "epoch": 2591} {"train_loss": -12.815380096435547, "global_step": 435337, "epoch": 2591} {"train_loss": -12.885369300842285, "global_step": 435338, "epoch": 2591} {"train_loss": -12.839422225952148, "global_step": 435339, "epoch": 2591} {"train_loss": -12.966644287109375, "global_step": 435340, "epoch": 2591} {"train_loss": -12.913127899169922, "global_step": 435341, "epoch": 2591} {"train_loss": -12.993656158447266, "global_step": 435342, "epoch": 2591} {"train_loss": -13.035188674926758, "global_step": 435343, "epoch": 2591} {"train_loss": -12.918161392211914, "global_step": 435344, "epoch": 2591} {"train_loss": -12.937185287475586, "global_step": 435345, "epoch": 2591} {"train_loss": -12.95980453491211, "global_step": 435346, "epoch": 2591} {"train_loss": -12.962095260620117, "global_step": 435347, "epoch": 2591} {"train_loss": -12.992147445678711, "global_step": 435348, "epoch": 2591} {"train_loss": -12.860551834106445, "global_step": 435349, "epoch": 2591} {"train_loss": -12.979082107543945, "global_step": 435350, "epoch": 2591} {"train_loss": -13.046929359436035, "global_step": 435351, "epoch": 2591} {"train_loss": -12.869918823242188, "global_step": 435352, "epoch": 2591} {"train_loss": -13.02660846710205, "global_step": 435353, "epoch": 2591} {"train_loss": -13.084403991699219, "global_step": 435354, "epoch": 2591} {"train_loss": -13.049440383911133, "global_step": 435355, "epoch": 2591} {"train_loss": -12.985895156860352, "global_step": 435356, "epoch": 2591} {"train_loss": -12.815115928649902, "global_step": 435357, "epoch": 2591} {"train_loss": -12.797746658325195, "global_step": 435358, "epoch": 2591} {"train_loss": -12.988615989685059, "global_step": 435359, "epoch": 2591} {"train_loss": -13.099578857421875, "global_step": 435360, "epoch": 2591} {"train_loss": -12.891006469726562, "global_step": 435361, "epoch": 2591} {"train_loss": -12.618728637695312, "global_step": 435362, "epoch": 2591} {"train_loss": -11.227060317993164, "global_step": 435363, "epoch": 2591} {"train_loss": -11.323514938354492, "global_step": 435364, "epoch": 2591} {"train_loss": -11.451059341430664, "global_step": 435365, "epoch": 2591} {"train_loss": -12.836015701293945, "global_step": 435366, "epoch": 2591} {"train_loss": -12.222342491149902, "global_step": 435367, "epoch": 2591} {"train_loss": -11.406866073608398, "global_step": 435368, "epoch": 2591} {"train_loss": -10.604753494262695, "global_step": 435369, "epoch": 2591} {"train_loss": -11.736034393310547, "global_step": 435370, "epoch": 2591} {"train_loss": -11.5418701171875, "global_step": 435371, "epoch": 2591} {"train_loss": -11.248390197753906, "global_step": 435372, "epoch": 2591} {"train_loss": -10.751181602478027, "global_step": 435373, "epoch": 2591} {"train_loss": -11.75959300994873, "global_step": 435374, "epoch": 2591} {"train_loss": -11.757108688354492, "global_step": 435375, "epoch": 2591} {"train_loss": -11.288783073425293, "global_step": 435376, "epoch": 2591} {"train_loss": -11.61812973022461, "global_step": 435377, "epoch": 2591} {"train_loss": -12.777718544006348, "global_step": 435378, "epoch": 2591} {"train_loss": -12.09661865234375, "global_step": 435379, "epoch": 2591} {"train_loss": -12.596506118774414, "global_step": 435380, "epoch": 2591} {"train_loss": -12.363088607788086, "global_step": 435381, "epoch": 2591} {"train_loss": -12.335156440734863, "global_step": 435382, "epoch": 2591} {"train_loss": -12.176019668579102, "global_step": 435383, "epoch": 2591} {"train_loss": -12.397804260253906, "global_step": 435384, "epoch": 2591} {"train_loss": -11.517931938171387, "global_step": 435385, "epoch": 2591} {"train_loss": -11.625886917114258, "global_step": 435386, "epoch": 2591} {"train_loss": -11.850847244262695, "global_step": 435387, "epoch": 2591} {"train_loss": -12.309000015258789, "global_step": 435388, "epoch": 2591} {"train_loss": -12.11240005493164, "global_step": 435389, "epoch": 2591} {"train_loss": -12.477608680725098, "global_step": 435390, "epoch": 2591} {"train_loss": -12.393196105957031, "global_step": 435391, "epoch": 2591} {"train_loss": -12.45121955871582, "global_step": 435392, "epoch": 2591} {"train_loss": -12.78161907196045, "global_step": 435393, "epoch": 2591} {"train_loss": -12.654645919799805, "global_step": 435394, "epoch": 2591} {"train_loss": -12.633463859558105, "global_step": 435395, "epoch": 2591} {"train_loss": -12.662290573120117, "global_step": 435396, "epoch": 2591} {"train_loss": -12.866939544677734, "global_step": 435397, "epoch": 2591} {"train_loss": -12.237662315368652, "global_step": 435398, "epoch": 2591} {"train_loss": -12.636051177978516, "global_step": 435399, "epoch": 2591} {"train_loss": -12.743324279785156, "global_step": 435400, "epoch": 2591} {"train_loss": -12.622827529907227, "global_step": 435401, "epoch": 2591} {"train_loss": -12.82160758972168, "global_step": 435402, "epoch": 2591} {"train_loss": -12.773752212524414, "global_step": 435403, "epoch": 2591} {"train_loss": -12.85346508026123, "global_step": 435404, "epoch": 2591} {"train_loss": -12.773067474365234, "global_step": 435405, "epoch": 2591} {"train_loss": -12.299493789672852, "global_step": 435406, "epoch": 2591} {"train_loss": -12.697577476501465, "global_step": 435407, "epoch": 2591} {"train_loss": -12.766448974609375, "global_step": 435408, "epoch": 2591} {"train_loss": -12.295873641967773, "global_step": 435409, "epoch": 2591} {"train_loss": -12.665070533752441, "global_step": 435410, "epoch": 2591} {"train_loss": -12.585590362548828, "global_step": 435411, "epoch": 2591} {"train_loss": -12.643149375915527, "global_step": 435412, "epoch": 2591} {"train_loss": -12.675287246704102, "global_step": 435413, "epoch": 2591} {"train_loss": -12.191275596618652, "global_step": 435414, "epoch": 2591} {"train_loss": -12.45643138885498, "global_step": 435415, "epoch": 2591} {"train_loss": -12.679628372192383, "global_step": 435416, "epoch": 2591} {"train_loss": -12.307583808898926, "global_step": 435417, "epoch": 2591} {"train_loss": -12.216087341308594, "global_step": 435418, "epoch": 2591} {"train_loss": -12.611373901367188, "global_step": 435419, "epoch": 2591} {"train_loss": -12.683540344238281, "global_step": 435420, "epoch": 2591} {"train_loss": -12.645040512084961, "global_step": 435421, "epoch": 2591} {"train_loss": -12.501993179321289, "global_step": 435422, "epoch": 2591} {"train_loss": -12.747482299804688, "global_step": 435423, "epoch": 2591} {"train_loss": -12.188039779663086, "global_step": 435424, "epoch": 2591} {"train_loss": -12.050132751464844, "global_step": 435425, "epoch": 2591} {"train_loss": -12.639457702636719, "global_step": 435426, "epoch": 2591} {"train_loss": -12.155704498291016, "global_step": 435427, "epoch": 2591} {"train_loss": -12.689327239990234, "global_step": 435428, "epoch": 2591} {"train_loss": -12.259066581726074, "global_step": 435429, "epoch": 2591} {"train_loss": -12.02996826171875, "global_step": 435430, "epoch": 2591} {"train_loss": -11.745992660522461, "global_step": 435431, "epoch": 2591} {"train_loss": -12.531110763549805, "global_step": 435432, "epoch": 2591} {"train_loss": -12.251197814941406, "global_step": 435433, "epoch": 2591} {"train_loss": -11.060296058654785, "global_step": 435434, "epoch": 2591} {"train_loss": -11.614469528198242, "global_step": 435435, "epoch": 2591} {"train_loss": -12.483316421508789, "global_step": 435436, "epoch": 2591} {"train_loss": -12.006258964538574, "global_step": 435437, "epoch": 2591} {"train_loss": -11.668745994567871, "global_step": 435438, "epoch": 2591} {"train_loss": -12.066925048828125, "global_step": 435439, "epoch": 2591} {"train_loss": -12.49878215789795, "global_step": 435440, "epoch": 2591} {"train_loss": -11.815156936645508, "global_step": 435441, "epoch": 2591} {"train_loss": -12.348392486572266, "global_step": 435442, "epoch": 2591} {"train_loss": -11.812114715576172, "global_step": 435443, "epoch": 2591} {"train_loss": -11.900471687316895, "global_step": 435444, "epoch": 2591} {"train_loss": -12.234423637390137, "global_step": 435445, "epoch": 2591} {"train_loss": -12.602227210998535, "global_step": 435446, "epoch": 2591} {"train_loss": -11.296180725097656, "global_step": 435447, "epoch": 2591} {"train_loss": -10.968923568725586, "global_step": 435448, "epoch": 2591} {"train_loss": -11.950435638427734, "global_step": 435449, "epoch": 2591} {"train_loss": -10.665239334106445, "global_step": 435450, "epoch": 2591} {"train_loss": -12.018092155456543, "global_step": 435451, "epoch": 2591} {"train_loss": -11.944759368896484, "global_step": 435452, "epoch": 2591} {"train_loss": -12.036270141601562, "global_step": 435453, "epoch": 2591} {"train_loss": -12.169219017028809, "global_step": 435454, "epoch": 2591} {"train_loss": -12.40155665647416, "global_step": 435455, "epoch": 2591, "val_loss": 309367.6875} {"train_loss": -12.645988464355469, "global_step": 435456, "epoch": 2592} {"train_loss": -11.587039947509766, "global_step": 435457, "epoch": 2592} {"train_loss": -12.378276824951172, "global_step": 435458, "epoch": 2592} {"train_loss": -11.281270980834961, "global_step": 435459, "epoch": 2592} {"train_loss": -11.747116088867188, "global_step": 435460, "epoch": 2592} {"train_loss": -11.644559860229492, "global_step": 435461, "epoch": 2592} {"train_loss": -11.631792068481445, "global_step": 435462, "epoch": 2592} {"train_loss": -11.650882720947266, "global_step": 435463, "epoch": 2592} {"train_loss": -11.565591812133789, "global_step": 435464, "epoch": 2592} {"train_loss": -11.908309936523438, "global_step": 435465, "epoch": 2592} {"train_loss": -11.45441722869873, "global_step": 435466, "epoch": 2592} {"train_loss": -11.767339706420898, "global_step": 435467, "epoch": 2592} {"train_loss": -11.642132759094238, "global_step": 435468, "epoch": 2592} {"train_loss": -12.103376388549805, "global_step": 435469, "epoch": 2592} {"train_loss": -11.656999588012695, "global_step": 435470, "epoch": 2592} {"train_loss": -11.847301483154297, "global_step": 435471, "epoch": 2592} {"train_loss": -11.87010669708252, "global_step": 435472, "epoch": 2592} {"train_loss": -11.85598373413086, "global_step": 435473, "epoch": 2592} {"train_loss": -11.186307907104492, "global_step": 435474, "epoch": 2592} {"train_loss": -11.214643478393555, "global_step": 435475, "epoch": 2592} {"train_loss": -12.152973175048828, "global_step": 435476, "epoch": 2592} {"train_loss": -11.498964309692383, "global_step": 435477, "epoch": 2592} {"train_loss": -12.038299560546875, "global_step": 435478, "epoch": 2592} {"train_loss": -11.076321601867676, "global_step": 435479, "epoch": 2592} {"train_loss": -12.410127639770508, "global_step": 435480, "epoch": 2592} {"train_loss": -11.387948989868164, "global_step": 435481, "epoch": 2592} {"train_loss": -12.409159660339355, "global_step": 435482, "epoch": 2592} {"train_loss": -11.81964111328125, "global_step": 435483, "epoch": 2592} {"train_loss": -12.164085388183594, "global_step": 435484, "epoch": 2592} {"train_loss": -12.073976516723633, "global_step": 435485, "epoch": 2592} {"train_loss": -12.11309814453125, "global_step": 435486, "epoch": 2592} {"train_loss": -11.912130355834961, "global_step": 435487, "epoch": 2592} {"train_loss": -12.067134857177734, "global_step": 435488, "epoch": 2592} {"train_loss": -11.768823623657227, "global_step": 435489, "epoch": 2592} {"train_loss": -11.705992698669434, "global_step": 435490, "epoch": 2592} {"train_loss": -12.359223365783691, "global_step": 435491, "epoch": 2592} {"train_loss": -12.382097244262695, "global_step": 435492, "epoch": 2592} {"train_loss": -11.964178085327148, "global_step": 435493, "epoch": 2592} {"train_loss": -12.073046684265137, "global_step": 435494, "epoch": 2592} {"train_loss": -11.8822603225708, "global_step": 435495, "epoch": 2592} {"train_loss": -12.264972686767578, "global_step": 435496, "epoch": 2592} {"train_loss": -12.0084228515625, "global_step": 435497, "epoch": 2592} {"train_loss": -12.430075645446777, "global_step": 435498, "epoch": 2592} {"train_loss": -12.39963150024414, "global_step": 435499, "epoch": 2592} {"train_loss": -12.61023998260498, "global_step": 435500, "epoch": 2592} {"train_loss": -12.300400733947754, "global_step": 435501, "epoch": 2592} {"train_loss": -12.587757110595703, "global_step": 435502, "epoch": 2592} {"train_loss": -12.285384178161621, "global_step": 435503, "epoch": 2592} {"train_loss": -12.267698287963867, "global_step": 435504, "epoch": 2592} {"train_loss": -12.597478866577148, "global_step": 435505, "epoch": 2592} {"train_loss": -11.948572158813477, "global_step": 435506, "epoch": 2592} {"train_loss": -12.661778450012207, "global_step": 435507, "epoch": 2592} {"train_loss": -12.072810173034668, "global_step": 435508, "epoch": 2592} {"train_loss": -12.667521476745605, "global_step": 435509, "epoch": 2592} {"train_loss": -12.36625862121582, "global_step": 435510, "epoch": 2592} {"train_loss": -12.551350593566895, "global_step": 435511, "epoch": 2592} {"train_loss": -12.612276077270508, "global_step": 435512, "epoch": 2592} {"train_loss": -12.346086502075195, "global_step": 435513, "epoch": 2592} {"train_loss": -12.483682632446289, "global_step": 435514, "epoch": 2592} {"train_loss": -12.653189659118652, "global_step": 435515, "epoch": 2592} {"train_loss": -12.336149215698242, "global_step": 435516, "epoch": 2592} {"train_loss": -12.725127220153809, "global_step": 435517, "epoch": 2592} {"train_loss": -11.968328475952148, "global_step": 435518, "epoch": 2592} {"train_loss": -12.780494689941406, "global_step": 435519, "epoch": 2592} {"train_loss": -12.248453140258789, "global_step": 435520, "epoch": 2592} {"train_loss": -12.244149208068848, "global_step": 435521, "epoch": 2592} {"train_loss": -12.370141983032227, "global_step": 435522, "epoch": 2592} {"train_loss": -12.15861701965332, "global_step": 435523, "epoch": 2592} {"train_loss": -11.794615745544434, "global_step": 435524, "epoch": 2592} {"train_loss": -11.849132537841797, "global_step": 435525, "epoch": 2592} {"train_loss": -12.307573318481445, "global_step": 435526, "epoch": 2592} {"train_loss": -11.950942039489746, "global_step": 435527, "epoch": 2592} {"train_loss": -12.535168647766113, "global_step": 435528, "epoch": 2592} {"train_loss": -12.015276908874512, "global_step": 435529, "epoch": 2592} {"train_loss": -12.492396354675293, "global_step": 435530, "epoch": 2592} {"train_loss": -12.000661849975586, "global_step": 435531, "epoch": 2592} {"train_loss": -12.266674995422363, "global_step": 435532, "epoch": 2592} {"train_loss": -12.591426849365234, "global_step": 435533, "epoch": 2592} {"train_loss": -11.71159839630127, "global_step": 435534, "epoch": 2592} {"train_loss": -12.167983055114746, "global_step": 435535, "epoch": 2592} {"train_loss": -12.245218276977539, "global_step": 435536, "epoch": 2592} {"train_loss": -12.484850883483887, "global_step": 435537, "epoch": 2592} {"train_loss": -12.143386840820312, "global_step": 435538, "epoch": 2592} {"train_loss": -12.558149337768555, "global_step": 435539, "epoch": 2592} {"train_loss": -12.347267150878906, "global_step": 435540, "epoch": 2592} {"train_loss": -12.291324615478516, "global_step": 435541, "epoch": 2592} {"train_loss": -11.843585968017578, "global_step": 435542, "epoch": 2592} {"train_loss": -11.943151473999023, "global_step": 435543, "epoch": 2592} {"train_loss": -12.592564582824707, "global_step": 435544, "epoch": 2592} {"train_loss": -12.24983024597168, "global_step": 435545, "epoch": 2592} {"train_loss": -12.567246437072754, "global_step": 435546, "epoch": 2592} {"train_loss": -12.679792404174805, "global_step": 435547, "epoch": 2592} {"train_loss": -12.2618408203125, "global_step": 435548, "epoch": 2592} {"train_loss": -12.309432983398438, "global_step": 435549, "epoch": 2592} {"train_loss": -12.64804744720459, "global_step": 435550, "epoch": 2592} {"train_loss": -12.312911987304688, "global_step": 435551, "epoch": 2592} {"train_loss": -12.74842357635498, "global_step": 435552, "epoch": 2592} {"train_loss": -12.748323440551758, "global_step": 435553, "epoch": 2592} {"train_loss": -12.744865417480469, "global_step": 435554, "epoch": 2592} {"train_loss": -12.61861801147461, "global_step": 435555, "epoch": 2592} {"train_loss": -12.608718872070312, "global_step": 435556, "epoch": 2592} {"train_loss": -12.81756591796875, "global_step": 435557, "epoch": 2592} {"train_loss": -12.47432804107666, "global_step": 435558, "epoch": 2592} {"train_loss": -12.573989868164062, "global_step": 435559, "epoch": 2592} {"train_loss": -12.872960090637207, "global_step": 435560, "epoch": 2592} {"train_loss": -12.500826835632324, "global_step": 435561, "epoch": 2592} {"train_loss": -12.493666648864746, "global_step": 435562, "epoch": 2592} {"train_loss": -12.612653732299805, "global_step": 435563, "epoch": 2592} {"train_loss": -12.753032684326172, "global_step": 435564, "epoch": 2592} {"train_loss": -12.744352340698242, "global_step": 435565, "epoch": 2592} {"train_loss": -12.605224609375, "global_step": 435566, "epoch": 2592} {"train_loss": -12.795318603515625, "global_step": 435567, "epoch": 2592} {"train_loss": -12.913854598999023, "global_step": 435568, "epoch": 2592} {"train_loss": -12.529751777648926, "global_step": 435569, "epoch": 2592} {"train_loss": -12.790197372436523, "global_step": 435570, "epoch": 2592} {"train_loss": -12.357172012329102, "global_step": 435571, "epoch": 2592} {"train_loss": -12.618202209472656, "global_step": 435572, "epoch": 2592} {"train_loss": -12.885077476501465, "global_step": 435573, "epoch": 2592} {"train_loss": -12.674631118774414, "global_step": 435574, "epoch": 2592} {"train_loss": -12.014019012451172, "global_step": 435575, "epoch": 2592} {"train_loss": -12.492595672607422, "global_step": 435576, "epoch": 2592} {"train_loss": -12.545836448669434, "global_step": 435577, "epoch": 2592} {"train_loss": -12.648962020874023, "global_step": 435578, "epoch": 2592} {"train_loss": -12.597808837890625, "global_step": 435579, "epoch": 2592} {"train_loss": -12.316823959350586, "global_step": 435580, "epoch": 2592} {"train_loss": -12.218171119689941, "global_step": 435581, "epoch": 2592} {"train_loss": -12.2875337600708, "global_step": 435582, "epoch": 2592} {"train_loss": -12.108558654785156, "global_step": 435583, "epoch": 2592} {"train_loss": -11.909769058227539, "global_step": 435584, "epoch": 2592} {"train_loss": -12.788902282714844, "global_step": 435585, "epoch": 2592} {"train_loss": -12.0562744140625, "global_step": 435586, "epoch": 2592} {"train_loss": -11.836751937866211, "global_step": 435587, "epoch": 2592} {"train_loss": -12.32383918762207, "global_step": 435588, "epoch": 2592} {"train_loss": -12.434610366821289, "global_step": 435589, "epoch": 2592} {"train_loss": -11.715645790100098, "global_step": 435590, "epoch": 2592} {"train_loss": -11.4595308303833, "global_step": 435591, "epoch": 2592} {"train_loss": -11.92788314819336, "global_step": 435592, "epoch": 2592} {"train_loss": -12.188848495483398, "global_step": 435593, "epoch": 2592} {"train_loss": -11.495267868041992, "global_step": 435594, "epoch": 2592} {"train_loss": -11.7135009765625, "global_step": 435595, "epoch": 2592} {"train_loss": -12.234395980834961, "global_step": 435596, "epoch": 2592} {"train_loss": -12.4227294921875, "global_step": 435597, "epoch": 2592} {"train_loss": -12.150946617126465, "global_step": 435598, "epoch": 2592} {"train_loss": -12.283061981201172, "global_step": 435599, "epoch": 2592} {"train_loss": -12.060098648071289, "global_step": 435600, "epoch": 2592} {"train_loss": -12.466683387756348, "global_step": 435601, "epoch": 2592} {"train_loss": -12.321813583374023, "global_step": 435602, "epoch": 2592} {"train_loss": -11.93920612335205, "global_step": 435603, "epoch": 2592} {"train_loss": -11.95165729522705, "global_step": 435604, "epoch": 2592} {"train_loss": -11.743415832519531, "global_step": 435605, "epoch": 2592} {"train_loss": -12.206121444702148, "global_step": 435606, "epoch": 2592} {"train_loss": -11.569722175598145, "global_step": 435607, "epoch": 2592} {"train_loss": -11.93887710571289, "global_step": 435608, "epoch": 2592} {"train_loss": -11.763080596923828, "global_step": 435609, "epoch": 2592} {"train_loss": -11.325447082519531, "global_step": 435610, "epoch": 2592} {"train_loss": -12.330329895019531, "global_step": 435611, "epoch": 2592} {"train_loss": -11.350692749023438, "global_step": 435612, "epoch": 2592} {"train_loss": -12.6727294921875, "global_step": 435613, "epoch": 2592} {"train_loss": -11.45654296875, "global_step": 435614, "epoch": 2592} {"train_loss": -11.417261123657227, "global_step": 435615, "epoch": 2592} {"train_loss": -11.519935607910156, "global_step": 435616, "epoch": 2592} {"train_loss": -11.184309005737305, "global_step": 435617, "epoch": 2592} {"train_loss": -11.847715377807617, "global_step": 435618, "epoch": 2592} {"train_loss": -10.86627197265625, "global_step": 435619, "epoch": 2592} {"train_loss": -11.732757568359375, "global_step": 435620, "epoch": 2592} {"train_loss": -10.165241241455078, "global_step": 435621, "epoch": 2592} {"train_loss": -9.325922966003418, "global_step": 435622, "epoch": 2592} {"train_loss": -12.130430874370393, "global_step": 435623, "epoch": 2592, "val_loss": 308776.40625} {"train_loss": -8.828508377075195, "global_step": 435624, "epoch": 2593} {"train_loss": -10.755640983581543, "global_step": 435625, "epoch": 2593} {"train_loss": -9.827587127685547, "global_step": 435626, "epoch": 2593} {"train_loss": -10.458744049072266, "global_step": 435627, "epoch": 2593} {"train_loss": -10.067850112915039, "global_step": 435628, "epoch": 2593} {"train_loss": -10.728233337402344, "global_step": 435629, "epoch": 2593} {"train_loss": -9.413222312927246, "global_step": 435630, "epoch": 2593} {"train_loss": -11.541386604309082, "global_step": 435631, "epoch": 2593} {"train_loss": -10.682558059692383, "global_step": 435632, "epoch": 2593} {"train_loss": -10.997093200683594, "global_step": 435633, "epoch": 2593} {"train_loss": -11.52978229522705, "global_step": 435634, "epoch": 2593} {"train_loss": -10.813077926635742, "global_step": 435635, "epoch": 2593} {"train_loss": -11.88936996459961, "global_step": 435636, "epoch": 2593} {"train_loss": -11.211109161376953, "global_step": 435637, "epoch": 2593} {"train_loss": -10.942055702209473, "global_step": 435638, "epoch": 2593} {"train_loss": -11.716894149780273, "global_step": 435639, "epoch": 2593} {"train_loss": -11.421092987060547, "global_step": 435640, "epoch": 2593} {"train_loss": -11.901235580444336, "global_step": 435641, "epoch": 2593} {"train_loss": -11.72884464263916, "global_step": 435642, "epoch": 2593} {"train_loss": -12.008367538452148, "global_step": 435643, "epoch": 2593} {"train_loss": -12.029472351074219, "global_step": 435644, "epoch": 2593} {"train_loss": -12.16927433013916, "global_step": 435645, "epoch": 2593} {"train_loss": -12.017496109008789, "global_step": 435646, "epoch": 2593} {"train_loss": -12.178934097290039, "global_step": 435647, "epoch": 2593} {"train_loss": -12.122076988220215, "global_step": 435648, "epoch": 2593} {"train_loss": -12.220353126525879, "global_step": 435649, "epoch": 2593} {"train_loss": -12.611064910888672, "global_step": 435650, "epoch": 2593} {"train_loss": -11.884744644165039, "global_step": 435651, "epoch": 2593} {"train_loss": -12.316296577453613, "global_step": 435652, "epoch": 2593} {"train_loss": -12.472151756286621, "global_step": 435653, "epoch": 2593} {"train_loss": -12.410280227661133, "global_step": 435654, "epoch": 2593} {"train_loss": -12.395581245422363, "global_step": 435655, "epoch": 2593} {"train_loss": -12.259844779968262, "global_step": 435656, "epoch": 2593} {"train_loss": -12.404519081115723, "global_step": 435657, "epoch": 2593} {"train_loss": -12.43503189086914, "global_step": 435658, "epoch": 2593} {"train_loss": -12.257625579833984, "global_step": 435659, "epoch": 2593} {"train_loss": -12.568012237548828, "global_step": 435660, "epoch": 2593} {"train_loss": -12.360946655273438, "global_step": 435661, "epoch": 2593} {"train_loss": -12.428253173828125, "global_step": 435662, "epoch": 2593} {"train_loss": -12.569442749023438, "global_step": 435663, "epoch": 2593} {"train_loss": -12.427719116210938, "global_step": 435664, "epoch": 2593} {"train_loss": -12.626235961914062, "global_step": 435665, "epoch": 2593} {"train_loss": -12.347427368164062, "global_step": 435666, "epoch": 2593} {"train_loss": -12.578742980957031, "global_step": 435667, "epoch": 2593} {"train_loss": -12.544516563415527, "global_step": 435668, "epoch": 2593} {"train_loss": -12.615848541259766, "global_step": 435669, "epoch": 2593} {"train_loss": -12.500284194946289, "global_step": 435670, "epoch": 2593} {"train_loss": -12.496955871582031, "global_step": 435671, "epoch": 2593} {"train_loss": -12.563472747802734, "global_step": 435672, "epoch": 2593} {"train_loss": -12.231514930725098, "global_step": 435673, "epoch": 2593} {"train_loss": -12.555017471313477, "global_step": 435674, "epoch": 2593} {"train_loss": -12.185050010681152, "global_step": 435675, "epoch": 2593} {"train_loss": -12.51856803894043, "global_step": 435676, "epoch": 2593} {"train_loss": -12.617574691772461, "global_step": 435677, "epoch": 2593} {"train_loss": -12.316640853881836, "global_step": 435678, "epoch": 2593} {"train_loss": -12.557853698730469, "global_step": 435679, "epoch": 2593} {"train_loss": -12.326681137084961, "global_step": 435680, "epoch": 2593} {"train_loss": -12.592473983764648, "global_step": 435681, "epoch": 2593} {"train_loss": -12.095340728759766, "global_step": 435682, "epoch": 2593} {"train_loss": -12.521068572998047, "global_step": 435683, "epoch": 2593} {"train_loss": -12.16789436340332, "global_step": 435684, "epoch": 2593} {"train_loss": -12.522984504699707, "global_step": 435685, "epoch": 2593} {"train_loss": -12.158527374267578, "global_step": 435686, "epoch": 2593} {"train_loss": -12.538960456848145, "global_step": 435687, "epoch": 2593} {"train_loss": -12.36530876159668, "global_step": 435688, "epoch": 2593} {"train_loss": -12.473564147949219, "global_step": 435689, "epoch": 2593} {"train_loss": -12.162211418151855, "global_step": 435690, "epoch": 2593} {"train_loss": -12.593330383300781, "global_step": 435691, "epoch": 2593} {"train_loss": -12.499040603637695, "global_step": 435692, "epoch": 2593} {"train_loss": -12.587034225463867, "global_step": 435693, "epoch": 2593} {"train_loss": -12.424457550048828, "global_step": 435694, "epoch": 2593} {"train_loss": -12.551141738891602, "global_step": 435695, "epoch": 2593} {"train_loss": -12.602852821350098, "global_step": 435696, "epoch": 2593} {"train_loss": -12.358381271362305, "global_step": 435697, "epoch": 2593} {"train_loss": -12.331135749816895, "global_step": 435698, "epoch": 2593} {"train_loss": -12.572420120239258, "global_step": 435699, "epoch": 2593} {"train_loss": -12.64090347290039, "global_step": 435700, "epoch": 2593} {"train_loss": -12.50273323059082, "global_step": 435701, "epoch": 2593} {"train_loss": -12.74833869934082, "global_step": 435702, "epoch": 2593} {"train_loss": -12.450803756713867, "global_step": 435703, "epoch": 2593} {"train_loss": -12.540534973144531, "global_step": 435704, "epoch": 2593} {"train_loss": -12.438447952270508, "global_step": 435705, "epoch": 2593} {"train_loss": -12.43239974975586, "global_step": 435706, "epoch": 2593} {"train_loss": -12.278766632080078, "global_step": 435707, "epoch": 2593} {"train_loss": -12.540753364562988, "global_step": 435708, "epoch": 2593} {"train_loss": -12.508467674255371, "global_step": 435709, "epoch": 2593} {"train_loss": -12.432161331176758, "global_step": 435710, "epoch": 2593} {"train_loss": -12.91673469543457, "global_step": 435711, "epoch": 2593} {"train_loss": -12.773504257202148, "global_step": 435712, "epoch": 2593} {"train_loss": -12.658455848693848, "global_step": 435713, "epoch": 2593} {"train_loss": -12.850359916687012, "global_step": 435714, "epoch": 2593} {"train_loss": -12.725099563598633, "global_step": 435715, "epoch": 2593} {"train_loss": -12.848546981811523, "global_step": 435716, "epoch": 2593} {"train_loss": -12.89280891418457, "global_step": 435717, "epoch": 2593} {"train_loss": -12.685274124145508, "global_step": 435718, "epoch": 2593} {"train_loss": -12.776752471923828, "global_step": 435719, "epoch": 2593} {"train_loss": -12.833307266235352, "global_step": 435720, "epoch": 2593} {"train_loss": -12.662931442260742, "global_step": 435721, "epoch": 2593} {"train_loss": -13.001359939575195, "global_step": 435722, "epoch": 2593} {"train_loss": -12.800735473632812, "global_step": 435723, "epoch": 2593} {"train_loss": -12.821752548217773, "global_step": 435724, "epoch": 2593} {"train_loss": -12.96194076538086, "global_step": 435725, "epoch": 2593} {"train_loss": -12.827047348022461, "global_step": 435726, "epoch": 2593} {"train_loss": -12.780977249145508, "global_step": 435727, "epoch": 2593} {"train_loss": -12.735451698303223, "global_step": 435728, "epoch": 2593} {"train_loss": -12.759642601013184, "global_step": 435729, "epoch": 2593} {"train_loss": -12.45363712310791, "global_step": 435730, "epoch": 2593} {"train_loss": -12.788093566894531, "global_step": 435731, "epoch": 2593} {"train_loss": -12.463873863220215, "global_step": 435732, "epoch": 2593} {"train_loss": -12.9708890914917, "global_step": 435733, "epoch": 2593} {"train_loss": -12.497274398803711, "global_step": 435734, "epoch": 2593} {"train_loss": -12.808487892150879, "global_step": 435735, "epoch": 2593} {"train_loss": -12.662519454956055, "global_step": 435736, "epoch": 2593} {"train_loss": -12.709157943725586, "global_step": 435737, "epoch": 2593} {"train_loss": -12.678139686584473, "global_step": 435738, "epoch": 2593} {"train_loss": -12.513723373413086, "global_step": 435739, "epoch": 2593} {"train_loss": -12.564477920532227, "global_step": 435740, "epoch": 2593} {"train_loss": -12.60135269165039, "global_step": 435741, "epoch": 2593} {"train_loss": -12.917829513549805, "global_step": 435742, "epoch": 2593} {"train_loss": -12.842992782592773, "global_step": 435743, "epoch": 2593} {"train_loss": -12.744304656982422, "global_step": 435744, "epoch": 2593} {"train_loss": -12.42985725402832, "global_step": 435745, "epoch": 2593} {"train_loss": -12.484933853149414, "global_step": 435746, "epoch": 2593} {"train_loss": -12.260910034179688, "global_step": 435747, "epoch": 2593} {"train_loss": -12.224727630615234, "global_step": 435748, "epoch": 2593} {"train_loss": -12.17671012878418, "global_step": 435749, "epoch": 2593} {"train_loss": -12.532234191894531, "global_step": 435750, "epoch": 2593} {"train_loss": -12.523965835571289, "global_step": 435751, "epoch": 2593} {"train_loss": -11.80909252166748, "global_step": 435752, "epoch": 2593} {"train_loss": -12.30333137512207, "global_step": 435753, "epoch": 2593} {"train_loss": -12.07578182220459, "global_step": 435754, "epoch": 2593} {"train_loss": -11.702961921691895, "global_step": 435755, "epoch": 2593} {"train_loss": -12.341141700744629, "global_step": 435756, "epoch": 2593} {"train_loss": -12.315122604370117, "global_step": 435757, "epoch": 2593} {"train_loss": -12.19133472442627, "global_step": 435758, "epoch": 2593} {"train_loss": -11.875776290893555, "global_step": 435759, "epoch": 2593} {"train_loss": -11.944448471069336, "global_step": 435760, "epoch": 2593} {"train_loss": -11.583793640136719, "global_step": 435761, "epoch": 2593} {"train_loss": -12.68729305267334, "global_step": 435762, "epoch": 2593} {"train_loss": -11.713207244873047, "global_step": 435763, "epoch": 2593} {"train_loss": -11.720443725585938, "global_step": 435764, "epoch": 2593} {"train_loss": -11.998886108398438, "global_step": 435765, "epoch": 2593} {"train_loss": -12.212154388427734, "global_step": 435766, "epoch": 2593} {"train_loss": -11.873679161071777, "global_step": 435767, "epoch": 2593} {"train_loss": -12.425529479980469, "global_step": 435768, "epoch": 2593} {"train_loss": -11.712891578674316, "global_step": 435769, "epoch": 2593} {"train_loss": -12.040996551513672, "global_step": 435770, "epoch": 2593} {"train_loss": -11.819652557373047, "global_step": 435771, "epoch": 2593} {"train_loss": -12.713711738586426, "global_step": 435772, "epoch": 2593} {"train_loss": -11.847987174987793, "global_step": 435773, "epoch": 2593} {"train_loss": -12.85361385345459, "global_step": 435774, "epoch": 2593} {"train_loss": -11.80746841430664, "global_step": 435775, "epoch": 2593} {"train_loss": -12.168811798095703, "global_step": 435776, "epoch": 2593} {"train_loss": -12.005903244018555, "global_step": 435777, "epoch": 2593} {"train_loss": -12.391340255737305, "global_step": 435778, "epoch": 2593} {"train_loss": -11.533428192138672, "global_step": 435779, "epoch": 2593} {"train_loss": -11.610383987426758, "global_step": 435780, "epoch": 2593} {"train_loss": -11.917470932006836, "global_step": 435781, "epoch": 2593} {"train_loss": -11.880840301513672, "global_step": 435782, "epoch": 2593} {"train_loss": -11.140324592590332, "global_step": 435783, "epoch": 2593} {"train_loss": -11.045753479003906, "global_step": 435784, "epoch": 2593} {"train_loss": -12.295228004455566, "global_step": 435785, "epoch": 2593} {"train_loss": -11.76679801940918, "global_step": 435786, "epoch": 2593} {"train_loss": -11.357213973999023, "global_step": 435787, "epoch": 2593} {"train_loss": -10.778240203857422, "global_step": 435788, "epoch": 2593} {"train_loss": -12.164546966552734, "global_step": 435789, "epoch": 2593} {"train_loss": -11.635072708129883, "global_step": 435790, "epoch": 2593} {"train_loss": -12.189885338147482, "global_step": 435791, "epoch": 2593, "val_loss": 307523.53125} {"train_loss": -11.803388595581055, "global_step": 435792, "epoch": 2594} {"train_loss": -12.012616157531738, "global_step": 435793, "epoch": 2594} {"train_loss": -11.800819396972656, "global_step": 435794, "epoch": 2594} {"train_loss": -12.159860610961914, "global_step": 435795, "epoch": 2594} {"train_loss": -12.218297958374023, "global_step": 435796, "epoch": 2594} {"train_loss": -12.612273216247559, "global_step": 435797, "epoch": 2594} {"train_loss": -12.01498794555664, "global_step": 435798, "epoch": 2594} {"train_loss": -12.077098846435547, "global_step": 435799, "epoch": 2594} {"train_loss": -12.1351318359375, "global_step": 435800, "epoch": 2594} {"train_loss": -12.092483520507812, "global_step": 435801, "epoch": 2594} {"train_loss": -12.364829063415527, "global_step": 435802, "epoch": 2594} {"train_loss": -12.398126602172852, "global_step": 435803, "epoch": 2594} {"train_loss": -12.490373611450195, "global_step": 435804, "epoch": 2594} {"train_loss": -12.374954223632812, "global_step": 435805, "epoch": 2594} {"train_loss": -12.538745880126953, "global_step": 435806, "epoch": 2594} {"train_loss": -12.247361183166504, "global_step": 435807, "epoch": 2594} {"train_loss": -12.225839614868164, "global_step": 435808, "epoch": 2594} {"train_loss": -12.158904075622559, "global_step": 435809, "epoch": 2594} {"train_loss": -12.35544204711914, "global_step": 435810, "epoch": 2594} {"train_loss": -11.941875457763672, "global_step": 435811, "epoch": 2594} {"train_loss": -12.069967269897461, "global_step": 435812, "epoch": 2594} {"train_loss": -12.147420883178711, "global_step": 435813, "epoch": 2594} {"train_loss": -12.180595397949219, "global_step": 435814, "epoch": 2594} {"train_loss": -12.543198585510254, "global_step": 435815, "epoch": 2594} {"train_loss": -12.283679962158203, "global_step": 435816, "epoch": 2594} {"train_loss": -12.390303611755371, "global_step": 435817, "epoch": 2594} {"train_loss": -12.770026206970215, "global_step": 435818, "epoch": 2594} {"train_loss": -12.382587432861328, "global_step": 435819, "epoch": 2594} {"train_loss": -12.359443664550781, "global_step": 435820, "epoch": 2594} {"train_loss": -12.446548461914062, "global_step": 435821, "epoch": 2594} {"train_loss": -12.491401672363281, "global_step": 435822, "epoch": 2594} {"train_loss": -12.210283279418945, "global_step": 435823, "epoch": 2594} {"train_loss": -12.57890510559082, "global_step": 435824, "epoch": 2594} {"train_loss": -12.104338645935059, "global_step": 435825, "epoch": 2594} {"train_loss": -12.506209373474121, "global_step": 435826, "epoch": 2594} {"train_loss": -12.278350830078125, "global_step": 435827, "epoch": 2594} {"train_loss": -12.616353988647461, "global_step": 435828, "epoch": 2594} {"train_loss": -12.016336441040039, "global_step": 435829, "epoch": 2594} {"train_loss": -12.493876457214355, "global_step": 435830, "epoch": 2594} {"train_loss": -12.057840347290039, "global_step": 435831, "epoch": 2594} {"train_loss": -11.731294631958008, "global_step": 435832, "epoch": 2594} {"train_loss": -12.140193939208984, "global_step": 435833, "epoch": 2594} {"train_loss": -12.035494804382324, "global_step": 435834, "epoch": 2594} {"train_loss": -12.104584693908691, "global_step": 435835, "epoch": 2594} {"train_loss": -11.66025447845459, "global_step": 435836, "epoch": 2594} {"train_loss": -12.079532623291016, "global_step": 435837, "epoch": 2594} {"train_loss": -11.548749923706055, "global_step": 435838, "epoch": 2594} {"train_loss": -12.350112915039062, "global_step": 435839, "epoch": 2594} {"train_loss": -12.475950241088867, "global_step": 435840, "epoch": 2594} {"train_loss": -11.375570297241211, "global_step": 435841, "epoch": 2594} {"train_loss": -12.721273422241211, "global_step": 435842, "epoch": 2594} {"train_loss": -11.94189167022705, "global_step": 435843, "epoch": 2594} {"train_loss": -11.851736068725586, "global_step": 435844, "epoch": 2594} {"train_loss": -11.914820671081543, "global_step": 435845, "epoch": 2594} {"train_loss": -12.368192672729492, "global_step": 435846, "epoch": 2594} {"train_loss": -12.576229095458984, "global_step": 435847, "epoch": 2594} {"train_loss": -11.874637603759766, "global_step": 435848, "epoch": 2594} {"train_loss": -12.602886199951172, "global_step": 435849, "epoch": 2594} {"train_loss": -12.293827056884766, "global_step": 435850, "epoch": 2594} {"train_loss": -12.350470542907715, "global_step": 435851, "epoch": 2594} {"train_loss": -12.592469215393066, "global_step": 435852, "epoch": 2594} {"train_loss": -12.230436325073242, "global_step": 435853, "epoch": 2594} {"train_loss": -12.296541213989258, "global_step": 435854, "epoch": 2594} {"train_loss": -11.591381072998047, "global_step": 435855, "epoch": 2594} {"train_loss": -12.213558197021484, "global_step": 435856, "epoch": 2594} {"train_loss": -11.964139938354492, "global_step": 435857, "epoch": 2594} {"train_loss": -11.532308578491211, "global_step": 435858, "epoch": 2594} {"train_loss": -11.926162719726562, "global_step": 435859, "epoch": 2594} {"train_loss": -12.213712692260742, "global_step": 435860, "epoch": 2594} {"train_loss": -11.353269577026367, "global_step": 435861, "epoch": 2594} {"train_loss": -12.464641571044922, "global_step": 435862, "epoch": 2594} {"train_loss": -11.365762710571289, "global_step": 435863, "epoch": 2594} {"train_loss": -11.685466766357422, "global_step": 435864, "epoch": 2594} {"train_loss": -12.183429718017578, "global_step": 435865, "epoch": 2594} {"train_loss": -11.68356704711914, "global_step": 435866, "epoch": 2594} {"train_loss": -12.190725326538086, "global_step": 435867, "epoch": 2594} {"train_loss": -12.304805755615234, "global_step": 435868, "epoch": 2594} {"train_loss": -12.096487998962402, "global_step": 435869, "epoch": 2594} {"train_loss": -12.700613021850586, "global_step": 435870, "epoch": 2594} {"train_loss": -12.473348617553711, "global_step": 435871, "epoch": 2594} {"train_loss": -12.114919662475586, "global_step": 435872, "epoch": 2594} {"train_loss": -12.564269065856934, "global_step": 435873, "epoch": 2594} {"train_loss": -12.164889335632324, "global_step": 435874, "epoch": 2594} {"train_loss": -12.513466835021973, "global_step": 435875, "epoch": 2594} {"train_loss": -12.279759407043457, "global_step": 435876, "epoch": 2594} {"train_loss": -12.49135971069336, "global_step": 435877, "epoch": 2594} {"train_loss": -12.672855377197266, "global_step": 435878, "epoch": 2594} {"train_loss": -12.553171157836914, "global_step": 435879, "epoch": 2594} {"train_loss": -12.663751602172852, "global_step": 435880, "epoch": 2594} {"train_loss": -12.6802978515625, "global_step": 435881, "epoch": 2594} {"train_loss": -12.488540649414062, "global_step": 435882, "epoch": 2594} {"train_loss": -12.614811897277832, "global_step": 435883, "epoch": 2594} {"train_loss": -12.621397972106934, "global_step": 435884, "epoch": 2594} {"train_loss": -12.373222351074219, "global_step": 435885, "epoch": 2594} {"train_loss": -12.358236312866211, "global_step": 435886, "epoch": 2594} {"train_loss": -12.464550018310547, "global_step": 435887, "epoch": 2594} {"train_loss": -12.279829978942871, "global_step": 435888, "epoch": 2594} {"train_loss": -12.389519691467285, "global_step": 435889, "epoch": 2594} {"train_loss": -12.470346450805664, "global_step": 435890, "epoch": 2594} {"train_loss": -12.233085632324219, "global_step": 435891, "epoch": 2594} {"train_loss": -12.3525390625, "global_step": 435892, "epoch": 2594} {"train_loss": -12.613447189331055, "global_step": 435893, "epoch": 2594} {"train_loss": -12.52198600769043, "global_step": 435894, "epoch": 2594} {"train_loss": -12.195452690124512, "global_step": 435895, "epoch": 2594} {"train_loss": -12.386953353881836, "global_step": 435896, "epoch": 2594} {"train_loss": -12.678716659545898, "global_step": 435897, "epoch": 2594} {"train_loss": -12.14240837097168, "global_step": 435898, "epoch": 2594} {"train_loss": -11.873300552368164, "global_step": 435899, "epoch": 2594} {"train_loss": -12.460079193115234, "global_step": 435900, "epoch": 2594} {"train_loss": -12.212892532348633, "global_step": 435901, "epoch": 2594} {"train_loss": -11.821008682250977, "global_step": 435902, "epoch": 2594} {"train_loss": -11.945212364196777, "global_step": 435903, "epoch": 2594} {"train_loss": -12.082298278808594, "global_step": 435904, "epoch": 2594} {"train_loss": -11.980155944824219, "global_step": 435905, "epoch": 2594} {"train_loss": -11.929302215576172, "global_step": 435906, "epoch": 2594} {"train_loss": -12.612950325012207, "global_step": 435907, "epoch": 2594} {"train_loss": -11.306333541870117, "global_step": 435908, "epoch": 2594} {"train_loss": -12.257867813110352, "global_step": 435909, "epoch": 2594} {"train_loss": -12.164962768554688, "global_step": 435910, "epoch": 2594} {"train_loss": -12.869783401489258, "global_step": 435911, "epoch": 2594} {"train_loss": -11.995160102844238, "global_step": 435912, "epoch": 2594} {"train_loss": -12.450801849365234, "global_step": 435913, "epoch": 2594} {"train_loss": -12.607902526855469, "global_step": 435914, "epoch": 2594} {"train_loss": -12.256317138671875, "global_step": 435915, "epoch": 2594} {"train_loss": -12.185150146484375, "global_step": 435916, "epoch": 2594} {"train_loss": -12.64968490600586, "global_step": 435917, "epoch": 2594} {"train_loss": -12.177614212036133, "global_step": 435918, "epoch": 2594} {"train_loss": -12.670670509338379, "global_step": 435919, "epoch": 2594} {"train_loss": -12.436789512634277, "global_step": 435920, "epoch": 2594} {"train_loss": -11.797534942626953, "global_step": 435921, "epoch": 2594} {"train_loss": -12.497920989990234, "global_step": 435922, "epoch": 2594} {"train_loss": -12.421357154846191, "global_step": 435923, "epoch": 2594} {"train_loss": -11.733031272888184, "global_step": 435924, "epoch": 2594} {"train_loss": -12.419029235839844, "global_step": 435925, "epoch": 2594} {"train_loss": -11.83934497833252, "global_step": 435926, "epoch": 2594} {"train_loss": -11.539909362792969, "global_step": 435927, "epoch": 2594} {"train_loss": -12.65212345123291, "global_step": 435928, "epoch": 2594} {"train_loss": -12.546126365661621, "global_step": 435929, "epoch": 2594} {"train_loss": -12.265769004821777, "global_step": 435930, "epoch": 2594} {"train_loss": -12.626873016357422, "global_step": 435931, "epoch": 2594} {"train_loss": -12.35107135772705, "global_step": 435932, "epoch": 2594} {"train_loss": -12.2896089553833, "global_step": 435933, "epoch": 2594} {"train_loss": -12.416797637939453, "global_step": 435934, "epoch": 2594} {"train_loss": -12.582643508911133, "global_step": 435935, "epoch": 2594} {"train_loss": -12.522054672241211, "global_step": 435936, "epoch": 2594} {"train_loss": -12.703603744506836, "global_step": 435937, "epoch": 2594} {"train_loss": -12.437454223632812, "global_step": 435938, "epoch": 2594} {"train_loss": -12.327851295471191, "global_step": 435939, "epoch": 2594} {"train_loss": -12.463324546813965, "global_step": 435940, "epoch": 2594} {"train_loss": -12.155452728271484, "global_step": 435941, "epoch": 2594} {"train_loss": -12.199939727783203, "global_step": 435942, "epoch": 2594} {"train_loss": -12.715846061706543, "global_step": 435943, "epoch": 2594} {"train_loss": -12.233039855957031, "global_step": 435944, "epoch": 2594} {"train_loss": -12.751895904541016, "global_step": 435945, "epoch": 2594} {"train_loss": -12.471231460571289, "global_step": 435946, "epoch": 2594} {"train_loss": -12.445226669311523, "global_step": 435947, "epoch": 2594} {"train_loss": -12.561092376708984, "global_step": 435948, "epoch": 2594} {"train_loss": -12.551441192626953, "global_step": 435949, "epoch": 2594} {"train_loss": -11.928537368774414, "global_step": 435950, "epoch": 2594} {"train_loss": -12.733743667602539, "global_step": 435951, "epoch": 2594} {"train_loss": -12.06072998046875, "global_step": 435952, "epoch": 2594} {"train_loss": -11.823661804199219, "global_step": 435953, "epoch": 2594} {"train_loss": -12.370821952819824, "global_step": 435954, "epoch": 2594} {"train_loss": -12.519859313964844, "global_step": 435955, "epoch": 2594} {"train_loss": -12.598609924316406, "global_step": 435956, "epoch": 2594} {"train_loss": -12.24921989440918, "global_step": 435957, "epoch": 2594} {"train_loss": -11.933822631835938, "global_step": 435958, "epoch": 2594} {"train_loss": -12.264601213591439, "global_step": 435959, "epoch": 2594, "val_loss": 311380.21875} {"train_loss": -12.180173873901367, "global_step": 435960, "epoch": 2595} {"train_loss": -12.557150840759277, "global_step": 435961, "epoch": 2595} {"train_loss": -12.334999084472656, "global_step": 435962, "epoch": 2595} {"train_loss": -12.893121719360352, "global_step": 435963, "epoch": 2595} {"train_loss": -12.6910400390625, "global_step": 435964, "epoch": 2595} {"train_loss": -12.788542747497559, "global_step": 435965, "epoch": 2595} {"train_loss": -12.728719711303711, "global_step": 435966, "epoch": 2595} {"train_loss": -12.817096710205078, "global_step": 435967, "epoch": 2595} {"train_loss": -12.632588386535645, "global_step": 435968, "epoch": 2595} {"train_loss": -12.905166625976562, "global_step": 435969, "epoch": 2595} {"train_loss": -12.81075382232666, "global_step": 435970, "epoch": 2595} {"train_loss": -12.743463516235352, "global_step": 435971, "epoch": 2595} {"train_loss": -12.793761253356934, "global_step": 435972, "epoch": 2595} {"train_loss": -12.728845596313477, "global_step": 435973, "epoch": 2595} {"train_loss": -12.86350154876709, "global_step": 435974, "epoch": 2595} {"train_loss": -12.72863483428955, "global_step": 435975, "epoch": 2595} {"train_loss": -12.75107479095459, "global_step": 435976, "epoch": 2595} {"train_loss": -12.594935417175293, "global_step": 435977, "epoch": 2595} {"train_loss": -12.20159912109375, "global_step": 435978, "epoch": 2595} {"train_loss": -12.712726593017578, "global_step": 435979, "epoch": 2595} {"train_loss": -12.488471031188965, "global_step": 435980, "epoch": 2595} {"train_loss": -12.618576049804688, "global_step": 435981, "epoch": 2595} {"train_loss": -12.391619682312012, "global_step": 435982, "epoch": 2595} {"train_loss": -11.073745727539062, "global_step": 435983, "epoch": 2595} {"train_loss": -12.24417495727539, "global_step": 435984, "epoch": 2595} {"train_loss": -12.028998374938965, "global_step": 435985, "epoch": 2595} {"train_loss": -10.200263023376465, "global_step": 435986, "epoch": 2595} {"train_loss": -11.615425109863281, "global_step": 435987, "epoch": 2595} {"train_loss": -11.770101547241211, "global_step": 435988, "epoch": 2595} {"train_loss": -10.521270751953125, "global_step": 435989, "epoch": 2595} {"train_loss": -12.469764709472656, "global_step": 435990, "epoch": 2595} {"train_loss": -10.100093841552734, "global_step": 435991, "epoch": 2595} {"train_loss": -9.761923789978027, "global_step": 435992, "epoch": 2595} {"train_loss": -9.353355407714844, "global_step": 435993, "epoch": 2595} {"train_loss": -10.549275398254395, "global_step": 435994, "epoch": 2595} {"train_loss": -10.172849655151367, "global_step": 435995, "epoch": 2595} {"train_loss": -9.376815795898438, "global_step": 435996, "epoch": 2595} {"train_loss": -10.776485443115234, "global_step": 435997, "epoch": 2595} {"train_loss": -11.183853149414062, "global_step": 435998, "epoch": 2595} {"train_loss": -9.458662033081055, "global_step": 435999, "epoch": 2595} {"train_loss": -10.604888916015625, "global_step": 436000, "epoch": 2595} {"train_loss": -10.951042175292969, "global_step": 436001, "epoch": 2595} {"train_loss": -11.416801452636719, "global_step": 436002, "epoch": 2595} {"train_loss": -10.444029808044434, "global_step": 436003, "epoch": 2595} {"train_loss": -11.476028442382812, "global_step": 436004, "epoch": 2595} {"train_loss": -11.236934661865234, "global_step": 436005, "epoch": 2595} {"train_loss": -11.555456161499023, "global_step": 436006, "epoch": 2595} {"train_loss": -10.940521240234375, "global_step": 436007, "epoch": 2595} {"train_loss": -11.428803443908691, "global_step": 436008, "epoch": 2595} {"train_loss": -11.337635040283203, "global_step": 436009, "epoch": 2595} {"train_loss": -11.21374225616455, "global_step": 436010, "epoch": 2595} {"train_loss": -11.688682556152344, "global_step": 436011, "epoch": 2595} {"train_loss": -11.737175941467285, "global_step": 436012, "epoch": 2595} {"train_loss": -11.889352798461914, "global_step": 436013, "epoch": 2595} {"train_loss": -11.619318008422852, "global_step": 436014, "epoch": 2595} {"train_loss": -12.238286972045898, "global_step": 436015, "epoch": 2595} {"train_loss": -11.7611665725708, "global_step": 436016, "epoch": 2595} {"train_loss": -12.168174743652344, "global_step": 436017, "epoch": 2595} {"train_loss": -11.912577629089355, "global_step": 436018, "epoch": 2595} {"train_loss": -11.893692016601562, "global_step": 436019, "epoch": 2595} {"train_loss": -12.050287246704102, "global_step": 436020, "epoch": 2595} {"train_loss": -11.83541488647461, "global_step": 436021, "epoch": 2595} {"train_loss": -12.284428596496582, "global_step": 436022, "epoch": 2595} {"train_loss": -11.945840835571289, "global_step": 436023, "epoch": 2595} {"train_loss": -12.257914543151855, "global_step": 436024, "epoch": 2595} {"train_loss": -11.921575546264648, "global_step": 436025, "epoch": 2595} {"train_loss": -11.784071922302246, "global_step": 436026, "epoch": 2595} {"train_loss": -12.171770095825195, "global_step": 436027, "epoch": 2595} {"train_loss": -11.821885108947754, "global_step": 436028, "epoch": 2595} {"train_loss": -11.768648147583008, "global_step": 436029, "epoch": 2595} {"train_loss": -12.365592956542969, "global_step": 436030, "epoch": 2595} {"train_loss": -11.779705047607422, "global_step": 436031, "epoch": 2595} {"train_loss": -12.1121244430542, "global_step": 436032, "epoch": 2595} {"train_loss": -11.860212326049805, "global_step": 436033, "epoch": 2595} {"train_loss": -12.147310256958008, "global_step": 436034, "epoch": 2595} {"train_loss": -11.881897926330566, "global_step": 436035, "epoch": 2595} {"train_loss": -11.903524398803711, "global_step": 436036, "epoch": 2595} {"train_loss": -12.185262680053711, "global_step": 436037, "epoch": 2595} {"train_loss": -11.735344886779785, "global_step": 436038, "epoch": 2595} {"train_loss": -12.339078903198242, "global_step": 436039, "epoch": 2595} {"train_loss": -11.56459903717041, "global_step": 436040, "epoch": 2595} {"train_loss": -11.996504783630371, "global_step": 436041, "epoch": 2595} {"train_loss": -11.699557304382324, "global_step": 436042, "epoch": 2595} {"train_loss": -12.124027252197266, "global_step": 436043, "epoch": 2595} {"train_loss": -11.58668041229248, "global_step": 436044, "epoch": 2595} {"train_loss": -12.193451881408691, "global_step": 436045, "epoch": 2595} {"train_loss": -11.188352584838867, "global_step": 436046, "epoch": 2595} {"train_loss": -11.746114730834961, "global_step": 436047, "epoch": 2595} {"train_loss": -11.084028244018555, "global_step": 436048, "epoch": 2595} {"train_loss": -10.553473472595215, "global_step": 436049, "epoch": 2595} {"train_loss": -11.62063980102539, "global_step": 436050, "epoch": 2595} {"train_loss": -11.069169998168945, "global_step": 436051, "epoch": 2595} {"train_loss": -11.020597457885742, "global_step": 436052, "epoch": 2595} {"train_loss": -11.347158432006836, "global_step": 436053, "epoch": 2595} {"train_loss": -11.661590576171875, "global_step": 436054, "epoch": 2595} {"train_loss": -11.86832046508789, "global_step": 436055, "epoch": 2595} {"train_loss": -10.754737854003906, "global_step": 436056, "epoch": 2595} {"train_loss": -12.132319450378418, "global_step": 436057, "epoch": 2595} {"train_loss": -11.467025756835938, "global_step": 436058, "epoch": 2595} {"train_loss": -11.883859634399414, "global_step": 436059, "epoch": 2595} {"train_loss": -11.224143028259277, "global_step": 436060, "epoch": 2595} {"train_loss": -12.15717887878418, "global_step": 436061, "epoch": 2595} {"train_loss": -11.828990936279297, "global_step": 436062, "epoch": 2595} {"train_loss": -12.188580513000488, "global_step": 436063, "epoch": 2595} {"train_loss": -12.154523849487305, "global_step": 436064, "epoch": 2595} {"train_loss": -11.586301803588867, "global_step": 436065, "epoch": 2595} {"train_loss": -12.136049270629883, "global_step": 436066, "epoch": 2595} {"train_loss": -12.100110054016113, "global_step": 436067, "epoch": 2595} {"train_loss": -12.021818161010742, "global_step": 436068, "epoch": 2595} {"train_loss": -12.06060791015625, "global_step": 436069, "epoch": 2595} {"train_loss": -12.484041213989258, "global_step": 436070, "epoch": 2595} {"train_loss": -12.245349884033203, "global_step": 436071, "epoch": 2595} {"train_loss": -12.098228454589844, "global_step": 436072, "epoch": 2595} {"train_loss": -12.333735466003418, "global_step": 436073, "epoch": 2595} {"train_loss": -12.412447929382324, "global_step": 436074, "epoch": 2595} {"train_loss": -12.218772888183594, "global_step": 436075, "epoch": 2595} {"train_loss": -12.428268432617188, "global_step": 436076, "epoch": 2595} {"train_loss": -12.521150588989258, "global_step": 436077, "epoch": 2595} {"train_loss": -12.309738159179688, "global_step": 436078, "epoch": 2595} {"train_loss": -12.700081825256348, "global_step": 436079, "epoch": 2595} {"train_loss": -12.479560852050781, "global_step": 436080, "epoch": 2595} {"train_loss": -12.454001426696777, "global_step": 436081, "epoch": 2595} {"train_loss": -12.58591365814209, "global_step": 436082, "epoch": 2595} {"train_loss": -12.292055130004883, "global_step": 436083, "epoch": 2595} {"train_loss": -12.149861335754395, "global_step": 436084, "epoch": 2595} {"train_loss": -12.66067123413086, "global_step": 436085, "epoch": 2595} {"train_loss": -12.115228652954102, "global_step": 436086, "epoch": 2595} {"train_loss": -12.553380012512207, "global_step": 436087, "epoch": 2595} {"train_loss": -12.581502914428711, "global_step": 436088, "epoch": 2595} {"train_loss": -12.361041069030762, "global_step": 436089, "epoch": 2595} {"train_loss": -12.705787658691406, "global_step": 436090, "epoch": 2595} {"train_loss": -12.64883804321289, "global_step": 436091, "epoch": 2595} {"train_loss": -12.825939178466797, "global_step": 436092, "epoch": 2595} {"train_loss": -12.552810668945312, "global_step": 436093, "epoch": 2595} {"train_loss": -12.734238624572754, "global_step": 436094, "epoch": 2595} {"train_loss": -12.643747329711914, "global_step": 436095, "epoch": 2595} {"train_loss": -12.891855239868164, "global_step": 436096, "epoch": 2595} {"train_loss": -12.616655349731445, "global_step": 436097, "epoch": 2595} {"train_loss": -12.7197904586792, "global_step": 436098, "epoch": 2595} {"train_loss": -12.69343376159668, "global_step": 436099, "epoch": 2595} {"train_loss": -12.584443092346191, "global_step": 436100, "epoch": 2595} {"train_loss": -12.76988410949707, "global_step": 436101, "epoch": 2595} {"train_loss": -12.677120208740234, "global_step": 436102, "epoch": 2595} {"train_loss": -12.720575332641602, "global_step": 436103, "epoch": 2595} {"train_loss": -12.596991539001465, "global_step": 436104, "epoch": 2595} {"train_loss": -12.704971313476562, "global_step": 436105, "epoch": 2595} {"train_loss": -12.687824249267578, "global_step": 436106, "epoch": 2595} {"train_loss": -12.80599308013916, "global_step": 436107, "epoch": 2595} {"train_loss": -12.781925201416016, "global_step": 436108, "epoch": 2595} {"train_loss": -12.672810554504395, "global_step": 436109, "epoch": 2595} {"train_loss": -12.692535400390625, "global_step": 436110, "epoch": 2595} {"train_loss": -12.636152267456055, "global_step": 436111, "epoch": 2595} {"train_loss": -12.618162155151367, "global_step": 436112, "epoch": 2595} {"train_loss": -12.795825004577637, "global_step": 436113, "epoch": 2595} {"train_loss": -12.817626953125, "global_step": 436114, "epoch": 2595} {"train_loss": -12.765767097473145, "global_step": 436115, "epoch": 2595} {"train_loss": -12.624120712280273, "global_step": 436116, "epoch": 2595} {"train_loss": -12.887083053588867, "global_step": 436117, "epoch": 2595} {"train_loss": -12.97613525390625, "global_step": 436118, "epoch": 2595} {"train_loss": -12.741726875305176, "global_step": 436119, "epoch": 2595} {"train_loss": -12.83074951171875, "global_step": 436120, "epoch": 2595} {"train_loss": -12.843135833740234, "global_step": 436121, "epoch": 2595} {"train_loss": -12.896782875061035, "global_step": 436122, "epoch": 2595} {"train_loss": -12.892925262451172, "global_step": 436123, "epoch": 2595} {"train_loss": -12.853976249694824, "global_step": 436124, "epoch": 2595} {"train_loss": -12.947300910949707, "global_step": 436125, "epoch": 2595} {"train_loss": -12.68198013305664, "global_step": 436126, "epoch": 2595} {"train_loss": -12.05845450219654, "global_step": 436127, "epoch": 2595, "val_loss": 310193.25, "train_action_mse_error": 2.036050319671631} {"train_loss": -12.72268295288086, "global_step": 436128, "epoch": 2596} {"train_loss": -12.871529579162598, "global_step": 436129, "epoch": 2596} {"train_loss": -12.859146118164062, "global_step": 436130, "epoch": 2596} {"train_loss": -12.748432159423828, "global_step": 436131, "epoch": 2596} {"train_loss": -12.771308898925781, "global_step": 436132, "epoch": 2596} {"train_loss": -12.887203216552734, "global_step": 436133, "epoch": 2596} {"train_loss": -12.820944786071777, "global_step": 436134, "epoch": 2596} {"train_loss": -12.850048065185547, "global_step": 436135, "epoch": 2596} {"train_loss": -12.747292518615723, "global_step": 436136, "epoch": 2596} {"train_loss": -12.81831169128418, "global_step": 436137, "epoch": 2596} {"train_loss": -12.752056121826172, "global_step": 436138, "epoch": 2596} {"train_loss": -12.78486156463623, "global_step": 436139, "epoch": 2596} {"train_loss": -12.744460105895996, "global_step": 436140, "epoch": 2596} {"train_loss": -11.741988182067871, "global_step": 436141, "epoch": 2596} {"train_loss": -11.338836669921875, "global_step": 436142, "epoch": 2596} {"train_loss": -12.174651145935059, "global_step": 436143, "epoch": 2596} {"train_loss": -12.615357398986816, "global_step": 436144, "epoch": 2596} {"train_loss": -11.172417640686035, "global_step": 436145, "epoch": 2596} {"train_loss": -11.280367851257324, "global_step": 436146, "epoch": 2596} {"train_loss": -12.92276382446289, "global_step": 436147, "epoch": 2596} {"train_loss": -11.371248245239258, "global_step": 436148, "epoch": 2596} {"train_loss": -11.351836204528809, "global_step": 436149, "epoch": 2596} {"train_loss": -11.78036880493164, "global_step": 436150, "epoch": 2596} {"train_loss": -11.798919677734375, "global_step": 436151, "epoch": 2596} {"train_loss": -11.04667854309082, "global_step": 436152, "epoch": 2596} {"train_loss": -12.611279487609863, "global_step": 436153, "epoch": 2596} {"train_loss": -11.10351276397705, "global_step": 436154, "epoch": 2596} {"train_loss": -11.108305931091309, "global_step": 436155, "epoch": 2596} {"train_loss": -11.894448280334473, "global_step": 436156, "epoch": 2596} {"train_loss": -10.383216857910156, "global_step": 436157, "epoch": 2596} {"train_loss": -11.265335083007812, "global_step": 436158, "epoch": 2596} {"train_loss": -10.443573951721191, "global_step": 436159, "epoch": 2596} {"train_loss": -10.986947059631348, "global_step": 436160, "epoch": 2596} {"train_loss": -11.248149871826172, "global_step": 436161, "epoch": 2596} {"train_loss": -11.66832160949707, "global_step": 436162, "epoch": 2596} {"train_loss": -12.626579284667969, "global_step": 436163, "epoch": 2596} {"train_loss": -11.561779022216797, "global_step": 436164, "epoch": 2596} {"train_loss": -12.314353942871094, "global_step": 436165, "epoch": 2596} {"train_loss": -12.368583679199219, "global_step": 436166, "epoch": 2596} {"train_loss": -12.07537841796875, "global_step": 436167, "epoch": 2596} {"train_loss": -12.38656997680664, "global_step": 436168, "epoch": 2596} {"train_loss": -11.553295135498047, "global_step": 436169, "epoch": 2596} {"train_loss": -12.366482734680176, "global_step": 436170, "epoch": 2596} {"train_loss": -12.553098678588867, "global_step": 436171, "epoch": 2596} {"train_loss": -12.219432830810547, "global_step": 436172, "epoch": 2596} {"train_loss": -12.512292861938477, "global_step": 436173, "epoch": 2596} {"train_loss": -12.308034896850586, "global_step": 436174, "epoch": 2596} {"train_loss": -12.438562393188477, "global_step": 436175, "epoch": 2596} {"train_loss": -12.480502128601074, "global_step": 436176, "epoch": 2596} {"train_loss": -12.340436935424805, "global_step": 436177, "epoch": 2596} {"train_loss": -12.794426918029785, "global_step": 436178, "epoch": 2596} {"train_loss": -12.401660919189453, "global_step": 436179, "epoch": 2596} {"train_loss": -12.698780059814453, "global_step": 436180, "epoch": 2596} {"train_loss": -12.810018539428711, "global_step": 436181, "epoch": 2596} {"train_loss": -12.79244613647461, "global_step": 436182, "epoch": 2596} {"train_loss": -12.722658157348633, "global_step": 436183, "epoch": 2596} {"train_loss": -12.542837142944336, "global_step": 436184, "epoch": 2596} {"train_loss": -12.449613571166992, "global_step": 436185, "epoch": 2596} {"train_loss": -12.245376586914062, "global_step": 436186, "epoch": 2596} {"train_loss": -12.206504821777344, "global_step": 436187, "epoch": 2596} {"train_loss": -12.609877586364746, "global_step": 436188, "epoch": 2596} {"train_loss": -12.244954109191895, "global_step": 436189, "epoch": 2596} {"train_loss": -11.789875030517578, "global_step": 436190, "epoch": 2596} {"train_loss": -12.443399429321289, "global_step": 436191, "epoch": 2596} {"train_loss": -12.107381820678711, "global_step": 436192, "epoch": 2596} {"train_loss": -12.305877685546875, "global_step": 436193, "epoch": 2596} {"train_loss": -12.396796226501465, "global_step": 436194, "epoch": 2596} {"train_loss": -11.779468536376953, "global_step": 436195, "epoch": 2596} {"train_loss": -12.216314315795898, "global_step": 436196, "epoch": 2596} {"train_loss": -12.266359329223633, "global_step": 436197, "epoch": 2596} {"train_loss": -12.294466018676758, "global_step": 436198, "epoch": 2596} {"train_loss": -12.37580680847168, "global_step": 436199, "epoch": 2596} {"train_loss": -12.573299407958984, "global_step": 436200, "epoch": 2596} {"train_loss": -12.295557022094727, "global_step": 436201, "epoch": 2596} {"train_loss": -12.443451881408691, "global_step": 436202, "epoch": 2596} {"train_loss": -12.47669506072998, "global_step": 436203, "epoch": 2596} {"train_loss": -12.057390213012695, "global_step": 436204, "epoch": 2596} {"train_loss": -12.65266227722168, "global_step": 436205, "epoch": 2596} {"train_loss": -12.274011611938477, "global_step": 436206, "epoch": 2596} {"train_loss": -11.45157241821289, "global_step": 436207, "epoch": 2596} {"train_loss": -12.646160125732422, "global_step": 436208, "epoch": 2596} {"train_loss": -11.536531448364258, "global_step": 436209, "epoch": 2596} {"train_loss": -11.318634986877441, "global_step": 436210, "epoch": 2596} {"train_loss": -12.32101821899414, "global_step": 436211, "epoch": 2596} {"train_loss": -11.414421081542969, "global_step": 436212, "epoch": 2596} {"train_loss": -11.334953308105469, "global_step": 436213, "epoch": 2596} {"train_loss": -11.657381057739258, "global_step": 436214, "epoch": 2596} {"train_loss": -11.176396369934082, "global_step": 436215, "epoch": 2596} {"train_loss": -9.944266319274902, "global_step": 436216, "epoch": 2596} {"train_loss": -10.808906555175781, "global_step": 436217, "epoch": 2596} {"train_loss": -11.543502807617188, "global_step": 436218, "epoch": 2596} {"train_loss": -11.631950378417969, "global_step": 436219, "epoch": 2596} {"train_loss": -10.957067489624023, "global_step": 436220, "epoch": 2596} {"train_loss": -12.364411354064941, "global_step": 436221, "epoch": 2596} {"train_loss": -10.901451110839844, "global_step": 436222, "epoch": 2596} {"train_loss": -10.704197883605957, "global_step": 436223, "epoch": 2596} {"train_loss": -11.91168212890625, "global_step": 436224, "epoch": 2596} {"train_loss": -11.630990982055664, "global_step": 436225, "epoch": 2596} {"train_loss": -12.207099914550781, "global_step": 436226, "epoch": 2596} {"train_loss": -11.299092292785645, "global_step": 436227, "epoch": 2596} {"train_loss": -11.331962585449219, "global_step": 436228, "epoch": 2596} {"train_loss": -12.267559051513672, "global_step": 436229, "epoch": 2596} {"train_loss": -11.353659629821777, "global_step": 436230, "epoch": 2596} {"train_loss": -12.377252578735352, "global_step": 436231, "epoch": 2596} {"train_loss": -12.03724479675293, "global_step": 436232, "epoch": 2596} {"train_loss": -11.925830841064453, "global_step": 436233, "epoch": 2596} {"train_loss": -12.123394966125488, "global_step": 436234, "epoch": 2596} {"train_loss": -10.982337951660156, "global_step": 436235, "epoch": 2596} {"train_loss": -12.268095016479492, "global_step": 436236, "epoch": 2596} {"train_loss": -11.651323318481445, "global_step": 436237, "epoch": 2596} {"train_loss": -12.25503921508789, "global_step": 436238, "epoch": 2596} {"train_loss": -11.734283447265625, "global_step": 436239, "epoch": 2596} {"train_loss": -12.449193954467773, "global_step": 436240, "epoch": 2596} {"train_loss": -12.400569915771484, "global_step": 436241, "epoch": 2596} {"train_loss": -11.960206985473633, "global_step": 436242, "epoch": 2596} {"train_loss": -11.753540992736816, "global_step": 436243, "epoch": 2596} {"train_loss": -12.479610443115234, "global_step": 436244, "epoch": 2596} {"train_loss": -12.116928100585938, "global_step": 436245, "epoch": 2596} {"train_loss": -12.556577682495117, "global_step": 436246, "epoch": 2596} {"train_loss": -12.300178527832031, "global_step": 436247, "epoch": 2596} {"train_loss": -12.104026794433594, "global_step": 436248, "epoch": 2596} {"train_loss": -12.5072021484375, "global_step": 436249, "epoch": 2596} {"train_loss": -12.620532989501953, "global_step": 436250, "epoch": 2596} {"train_loss": -12.355670928955078, "global_step": 436251, "epoch": 2596} {"train_loss": -12.451011657714844, "global_step": 436252, "epoch": 2596} {"train_loss": -12.323408126831055, "global_step": 436253, "epoch": 2596} {"train_loss": -12.463150024414062, "global_step": 436254, "epoch": 2596} {"train_loss": -12.450433731079102, "global_step": 436255, "epoch": 2596} {"train_loss": -12.63652515411377, "global_step": 436256, "epoch": 2596} {"train_loss": -12.563539505004883, "global_step": 436257, "epoch": 2596} {"train_loss": -12.322040557861328, "global_step": 436258, "epoch": 2596} {"train_loss": -12.55461311340332, "global_step": 436259, "epoch": 2596} {"train_loss": -12.448363304138184, "global_step": 436260, "epoch": 2596} {"train_loss": -12.381875991821289, "global_step": 436261, "epoch": 2596} {"train_loss": -12.52199935913086, "global_step": 436262, "epoch": 2596} {"train_loss": -12.566560745239258, "global_step": 436263, "epoch": 2596} {"train_loss": -12.583595275878906, "global_step": 436264, "epoch": 2596} {"train_loss": -12.508920669555664, "global_step": 436265, "epoch": 2596} {"train_loss": -12.477272033691406, "global_step": 436266, "epoch": 2596} {"train_loss": -12.502157211303711, "global_step": 436267, "epoch": 2596} {"train_loss": -12.465912818908691, "global_step": 436268, "epoch": 2596} {"train_loss": -12.515024185180664, "global_step": 436269, "epoch": 2596} {"train_loss": -12.026721954345703, "global_step": 436270, "epoch": 2596} {"train_loss": -12.52106761932373, "global_step": 436271, "epoch": 2596} {"train_loss": -12.073986053466797, "global_step": 436272, "epoch": 2596} {"train_loss": -12.434558868408203, "global_step": 436273, "epoch": 2596} {"train_loss": -11.685151100158691, "global_step": 436274, "epoch": 2596} {"train_loss": -12.51082992553711, "global_step": 436275, "epoch": 2596} {"train_loss": -12.280603408813477, "global_step": 436276, "epoch": 2596} {"train_loss": -12.298911094665527, "global_step": 436277, "epoch": 2596} {"train_loss": -12.077142715454102, "global_step": 436278, "epoch": 2596} {"train_loss": -11.9515380859375, "global_step": 436279, "epoch": 2596} {"train_loss": -12.564815521240234, "global_step": 436280, "epoch": 2596} {"train_loss": -11.875213623046875, "global_step": 436281, "epoch": 2596} {"train_loss": -11.76279067993164, "global_step": 436282, "epoch": 2596} {"train_loss": -12.440250396728516, "global_step": 436283, "epoch": 2596} {"train_loss": -11.784448623657227, "global_step": 436284, "epoch": 2596} {"train_loss": -12.282081604003906, "global_step": 436285, "epoch": 2596} {"train_loss": -12.27772331237793, "global_step": 436286, "epoch": 2596} {"train_loss": -11.804600715637207, "global_step": 436287, "epoch": 2596} {"train_loss": -12.205327987670898, "global_step": 436288, "epoch": 2596} {"train_loss": -11.85228157043457, "global_step": 436289, "epoch": 2596} {"train_loss": -12.294477462768555, "global_step": 436290, "epoch": 2596} {"train_loss": -12.712747573852539, "global_step": 436291, "epoch": 2596} {"train_loss": -12.299570083618164, "global_step": 436292, "epoch": 2596} {"train_loss": -12.55052661895752, "global_step": 436293, "epoch": 2596} {"train_loss": -12.397491455078125, "global_step": 436294, "epoch": 2596} {"train_loss": -12.117216558683486, "global_step": 436295, "epoch": 2596, "val_loss": 311276.8125} {"train_loss": -12.759556770324707, "global_step": 436296, "epoch": 2597} {"train_loss": -12.341141700744629, "global_step": 436297, "epoch": 2597} {"train_loss": -11.69777774810791, "global_step": 436298, "epoch": 2597} {"train_loss": -12.34562873840332, "global_step": 436299, "epoch": 2597} {"train_loss": -12.608367919921875, "global_step": 436300, "epoch": 2597} {"train_loss": -12.029134750366211, "global_step": 436301, "epoch": 2597} {"train_loss": -12.009571075439453, "global_step": 436302, "epoch": 2597} {"train_loss": -12.422362327575684, "global_step": 436303, "epoch": 2597} {"train_loss": -12.674718856811523, "global_step": 436304, "epoch": 2597} {"train_loss": -12.281190872192383, "global_step": 436305, "epoch": 2597} {"train_loss": -12.611177444458008, "global_step": 436306, "epoch": 2597} {"train_loss": -12.342737197875977, "global_step": 436307, "epoch": 2597} {"train_loss": -12.557933807373047, "global_step": 436308, "epoch": 2597} {"train_loss": -12.560218811035156, "global_step": 436309, "epoch": 2597} {"train_loss": -12.693309783935547, "global_step": 436310, "epoch": 2597} {"train_loss": -12.590868949890137, "global_step": 436311, "epoch": 2597} {"train_loss": -12.563946723937988, "global_step": 436312, "epoch": 2597} {"train_loss": -12.905359268188477, "global_step": 436313, "epoch": 2597} {"train_loss": -12.45628547668457, "global_step": 436314, "epoch": 2597} {"train_loss": -12.764013290405273, "global_step": 436315, "epoch": 2597} {"train_loss": -12.459847450256348, "global_step": 436316, "epoch": 2597} {"train_loss": -12.798871040344238, "global_step": 436317, "epoch": 2597} {"train_loss": -12.604070663452148, "global_step": 436318, "epoch": 2597} {"train_loss": -12.389888763427734, "global_step": 436319, "epoch": 2597} {"train_loss": -12.485507011413574, "global_step": 436320, "epoch": 2597} {"train_loss": -12.822225570678711, "global_step": 436321, "epoch": 2597} {"train_loss": -12.731609344482422, "global_step": 436322, "epoch": 2597} {"train_loss": -12.824528694152832, "global_step": 436323, "epoch": 2597} {"train_loss": -12.746905326843262, "global_step": 436324, "epoch": 2597} {"train_loss": -12.673044204711914, "global_step": 436325, "epoch": 2597} {"train_loss": -12.957613945007324, "global_step": 436326, "epoch": 2597} {"train_loss": -12.76943588256836, "global_step": 436327, "epoch": 2597} {"train_loss": -12.746354103088379, "global_step": 436328, "epoch": 2597} {"train_loss": -12.861151695251465, "global_step": 436329, "epoch": 2597} {"train_loss": -12.864368438720703, "global_step": 436330, "epoch": 2597} {"train_loss": -12.866912841796875, "global_step": 436331, "epoch": 2597} {"train_loss": -12.829748153686523, "global_step": 436332, "epoch": 2597} {"train_loss": -13.10605239868164, "global_step": 436333, "epoch": 2597} {"train_loss": -13.08768367767334, "global_step": 436334, "epoch": 2597} {"train_loss": -12.930920600891113, "global_step": 436335, "epoch": 2597} {"train_loss": -12.899826049804688, "global_step": 436336, "epoch": 2597} {"train_loss": -12.830876350402832, "global_step": 436337, "epoch": 2597} {"train_loss": -12.699115753173828, "global_step": 436338, "epoch": 2597} {"train_loss": -13.039341926574707, "global_step": 436339, "epoch": 2597} {"train_loss": -12.824954986572266, "global_step": 436340, "epoch": 2597} {"train_loss": -13.044134140014648, "global_step": 436341, "epoch": 2597} {"train_loss": -12.983760833740234, "global_step": 436342, "epoch": 2597} {"train_loss": -12.96861457824707, "global_step": 436343, "epoch": 2597} {"train_loss": -12.83563232421875, "global_step": 436344, "epoch": 2597} {"train_loss": -12.794267654418945, "global_step": 436345, "epoch": 2597} {"train_loss": -12.82642650604248, "global_step": 436346, "epoch": 2597} {"train_loss": -12.688753128051758, "global_step": 436347, "epoch": 2597} {"train_loss": -12.220916748046875, "global_step": 436348, "epoch": 2597} {"train_loss": -12.362637519836426, "global_step": 436349, "epoch": 2597} {"train_loss": -12.124245643615723, "global_step": 436350, "epoch": 2597} {"train_loss": -12.541703224182129, "global_step": 436351, "epoch": 2597} {"train_loss": -12.886037826538086, "global_step": 436352, "epoch": 2597} {"train_loss": -12.715381622314453, "global_step": 436353, "epoch": 2597} {"train_loss": -12.834372520446777, "global_step": 436354, "epoch": 2597} {"train_loss": -12.552587509155273, "global_step": 436355, "epoch": 2597} {"train_loss": -12.76068115234375, "global_step": 436356, "epoch": 2597} {"train_loss": -12.53805160522461, "global_step": 436357, "epoch": 2597} {"train_loss": -12.705970764160156, "global_step": 436358, "epoch": 2597} {"train_loss": -12.510412216186523, "global_step": 436359, "epoch": 2597} {"train_loss": -12.635950088500977, "global_step": 436360, "epoch": 2597} {"train_loss": -12.675106048583984, "global_step": 436361, "epoch": 2597} {"train_loss": -12.465401649475098, "global_step": 436362, "epoch": 2597} {"train_loss": -12.485761642456055, "global_step": 436363, "epoch": 2597} {"train_loss": -10.827997207641602, "global_step": 436364, "epoch": 2597} {"train_loss": -11.896984100341797, "global_step": 436365, "epoch": 2597} {"train_loss": -12.210796356201172, "global_step": 436366, "epoch": 2597} {"train_loss": -9.556949615478516, "global_step": 436367, "epoch": 2597} {"train_loss": -10.86398696899414, "global_step": 436368, "epoch": 2597} {"train_loss": -7.207293510437012, "global_step": 436369, "epoch": 2597} {"train_loss": -9.473108291625977, "global_step": 436370, "epoch": 2597} {"train_loss": -7.517667770385742, "global_step": 436371, "epoch": 2597} {"train_loss": -8.466986656188965, "global_step": 436372, "epoch": 2597} {"train_loss": -7.021040916442871, "global_step": 436373, "epoch": 2597} {"train_loss": -9.16201400756836, "global_step": 436374, "epoch": 2597} {"train_loss": -8.368110656738281, "global_step": 436375, "epoch": 2597} {"train_loss": -9.442681312561035, "global_step": 436376, "epoch": 2597} {"train_loss": -7.912661075592041, "global_step": 436377, "epoch": 2597} {"train_loss": -9.455283164978027, "global_step": 436378, "epoch": 2597} {"train_loss": -8.011528968811035, "global_step": 436379, "epoch": 2597} {"train_loss": -9.367147445678711, "global_step": 436380, "epoch": 2597} {"train_loss": -8.970149040222168, "global_step": 436381, "epoch": 2597} {"train_loss": -8.730792999267578, "global_step": 436382, "epoch": 2597} {"train_loss": -9.439888000488281, "global_step": 436383, "epoch": 2597} {"train_loss": -8.966084480285645, "global_step": 436384, "epoch": 2597} {"train_loss": -10.600961685180664, "global_step": 436385, "epoch": 2597} {"train_loss": -11.027071952819824, "global_step": 436386, "epoch": 2597} {"train_loss": -10.288527488708496, "global_step": 436387, "epoch": 2597} {"train_loss": -10.993343353271484, "global_step": 436388, "epoch": 2597} {"train_loss": -10.884037971496582, "global_step": 436389, "epoch": 2597} {"train_loss": -11.28812313079834, "global_step": 436390, "epoch": 2597} {"train_loss": -10.874592781066895, "global_step": 436391, "epoch": 2597} {"train_loss": -11.31827449798584, "global_step": 436392, "epoch": 2597} {"train_loss": -10.259978294372559, "global_step": 436393, "epoch": 2597} {"train_loss": -10.782678604125977, "global_step": 436394, "epoch": 2597} {"train_loss": -11.453728675842285, "global_step": 436395, "epoch": 2597} {"train_loss": -11.216934204101562, "global_step": 436396, "epoch": 2597} {"train_loss": -11.393416404724121, "global_step": 436397, "epoch": 2597} {"train_loss": -10.368876457214355, "global_step": 436398, "epoch": 2597} {"train_loss": -11.418777465820312, "global_step": 436399, "epoch": 2597} {"train_loss": -11.236456871032715, "global_step": 436400, "epoch": 2597} {"train_loss": -10.977327346801758, "global_step": 436401, "epoch": 2597} {"train_loss": -12.045791625976562, "global_step": 436402, "epoch": 2597} {"train_loss": -11.280632019042969, "global_step": 436403, "epoch": 2597} {"train_loss": -11.458488464355469, "global_step": 436404, "epoch": 2597} {"train_loss": -11.154136657714844, "global_step": 436405, "epoch": 2597} {"train_loss": -11.893730163574219, "global_step": 436406, "epoch": 2597} {"train_loss": -11.781810760498047, "global_step": 436407, "epoch": 2597} {"train_loss": -11.852407455444336, "global_step": 436408, "epoch": 2597} {"train_loss": -11.574915885925293, "global_step": 436409, "epoch": 2597} {"train_loss": -11.7659912109375, "global_step": 436410, "epoch": 2597} {"train_loss": -12.043798446655273, "global_step": 436411, "epoch": 2597} {"train_loss": -11.510488510131836, "global_step": 436412, "epoch": 2597} {"train_loss": -11.953081130981445, "global_step": 436413, "epoch": 2597} {"train_loss": -11.90909481048584, "global_step": 436414, "epoch": 2597} {"train_loss": -12.040425300598145, "global_step": 436415, "epoch": 2597} {"train_loss": -11.948598861694336, "global_step": 436416, "epoch": 2597} {"train_loss": -12.097909927368164, "global_step": 436417, "epoch": 2597} {"train_loss": -11.835244178771973, "global_step": 436418, "epoch": 2597} {"train_loss": -12.207197189331055, "global_step": 436419, "epoch": 2597} {"train_loss": -12.11387825012207, "global_step": 436420, "epoch": 2597} {"train_loss": -12.313321113586426, "global_step": 436421, "epoch": 2597} {"train_loss": -12.208317756652832, "global_step": 436422, "epoch": 2597} {"train_loss": -12.386136054992676, "global_step": 436423, "epoch": 2597} {"train_loss": -12.313661575317383, "global_step": 436424, "epoch": 2597} {"train_loss": -12.299474716186523, "global_step": 436425, "epoch": 2597} {"train_loss": -12.517260551452637, "global_step": 436426, "epoch": 2597} {"train_loss": -12.228455543518066, "global_step": 436427, "epoch": 2597} {"train_loss": -12.411905288696289, "global_step": 436428, "epoch": 2597} {"train_loss": -12.49814224243164, "global_step": 436429, "epoch": 2597} {"train_loss": -12.341350555419922, "global_step": 436430, "epoch": 2597} {"train_loss": -12.522640228271484, "global_step": 436431, "epoch": 2597} {"train_loss": -12.428606033325195, "global_step": 436432, "epoch": 2597} {"train_loss": -12.635515213012695, "global_step": 436433, "epoch": 2597} {"train_loss": -12.267473220825195, "global_step": 436434, "epoch": 2597} {"train_loss": -12.475773811340332, "global_step": 436435, "epoch": 2597} {"train_loss": -12.687910079956055, "global_step": 436436, "epoch": 2597} {"train_loss": -12.371463775634766, "global_step": 436437, "epoch": 2597} {"train_loss": -12.614605903625488, "global_step": 436438, "epoch": 2597} {"train_loss": -12.287094116210938, "global_step": 436439, "epoch": 2597} {"train_loss": -12.67849063873291, "global_step": 436440, "epoch": 2597} {"train_loss": -12.506280899047852, "global_step": 436441, "epoch": 2597} {"train_loss": -12.532821655273438, "global_step": 436442, "epoch": 2597} {"train_loss": -12.520224571228027, "global_step": 436443, "epoch": 2597} {"train_loss": -12.568475723266602, "global_step": 436444, "epoch": 2597} {"train_loss": -12.564574241638184, "global_step": 436445, "epoch": 2597} {"train_loss": -12.515026092529297, "global_step": 436446, "epoch": 2597} {"train_loss": -12.556285858154297, "global_step": 436447, "epoch": 2597} {"train_loss": -12.528614044189453, "global_step": 436448, "epoch": 2597} {"train_loss": -12.61678695678711, "global_step": 436449, "epoch": 2597} {"train_loss": -12.620739936828613, "global_step": 436450, "epoch": 2597} {"train_loss": -12.745388984680176, "global_step": 436451, "epoch": 2597} {"train_loss": -12.656984329223633, "global_step": 436452, "epoch": 2597} {"train_loss": -12.73939037322998, "global_step": 436453, "epoch": 2597} {"train_loss": -12.675434112548828, "global_step": 436454, "epoch": 2597} {"train_loss": -12.63051986694336, "global_step": 436455, "epoch": 2597} {"train_loss": -12.699978828430176, "global_step": 436456, "epoch": 2597} {"train_loss": -12.720841407775879, "global_step": 436457, "epoch": 2597} {"train_loss": -12.764379501342773, "global_step": 436458, "epoch": 2597} {"train_loss": -12.93459415435791, "global_step": 436459, "epoch": 2597} {"train_loss": -12.826303482055664, "global_step": 436460, "epoch": 2597} {"train_loss": -12.654525756835938, "global_step": 436461, "epoch": 2597} {"train_loss": -12.772462844848633, "global_step": 436462, "epoch": 2597} {"train_loss": -11.925440541335515, "global_step": 436463, "epoch": 2597, "val_loss": 309133.46875} {"train_loss": -12.928890228271484, "global_step": 436464, "epoch": 2598} {"train_loss": -12.566024780273438, "global_step": 436465, "epoch": 2598} {"train_loss": -12.591978073120117, "global_step": 436466, "epoch": 2598} {"train_loss": -12.822771072387695, "global_step": 436467, "epoch": 2598} {"train_loss": -12.605042457580566, "global_step": 436468, "epoch": 2598} {"train_loss": -12.959634780883789, "global_step": 436469, "epoch": 2598} {"train_loss": -12.794050216674805, "global_step": 436470, "epoch": 2598} {"train_loss": -12.79322338104248, "global_step": 436471, "epoch": 2598} {"train_loss": -12.954018592834473, "global_step": 436472, "epoch": 2598} {"train_loss": -12.668126106262207, "global_step": 436473, "epoch": 2598} {"train_loss": -12.864395141601562, "global_step": 436474, "epoch": 2598} {"train_loss": -12.905128479003906, "global_step": 436475, "epoch": 2598} {"train_loss": -13.012964248657227, "global_step": 436476, "epoch": 2598} {"train_loss": -12.781791687011719, "global_step": 436477, "epoch": 2598} {"train_loss": -12.839426040649414, "global_step": 436478, "epoch": 2598} {"train_loss": -12.815113067626953, "global_step": 436479, "epoch": 2598} {"train_loss": -12.680754661560059, "global_step": 436480, "epoch": 2598} {"train_loss": -12.74866771697998, "global_step": 436481, "epoch": 2598} {"train_loss": -12.768913269042969, "global_step": 436482, "epoch": 2598} {"train_loss": -12.47684383392334, "global_step": 436483, "epoch": 2598} {"train_loss": -11.896828651428223, "global_step": 436484, "epoch": 2598} {"train_loss": -12.87288761138916, "global_step": 436485, "epoch": 2598} {"train_loss": -11.367422103881836, "global_step": 436486, "epoch": 2598} {"train_loss": -12.342367172241211, "global_step": 436487, "epoch": 2598} {"train_loss": -12.197559356689453, "global_step": 436488, "epoch": 2598} {"train_loss": -12.650569915771484, "global_step": 436489, "epoch": 2598} {"train_loss": -12.026750564575195, "global_step": 436490, "epoch": 2598} {"train_loss": -13.001808166503906, "global_step": 436491, "epoch": 2598} {"train_loss": -11.574213027954102, "global_step": 436492, "epoch": 2598} {"train_loss": -11.672953605651855, "global_step": 436493, "epoch": 2598} {"train_loss": -12.224342346191406, "global_step": 436494, "epoch": 2598} {"train_loss": -12.746356964111328, "global_step": 436495, "epoch": 2598} {"train_loss": -11.649093627929688, "global_step": 436496, "epoch": 2598} {"train_loss": -11.139976501464844, "global_step": 436497, "epoch": 2598} {"train_loss": -11.350067138671875, "global_step": 436498, "epoch": 2598} {"train_loss": -8.942136764526367, "global_step": 436499, "epoch": 2598} {"train_loss": -7.670053482055664, "global_step": 436500, "epoch": 2598} {"train_loss": -8.997648239135742, "global_step": 436501, "epoch": 2598} {"train_loss": -9.485435485839844, "global_step": 436502, "epoch": 2598} {"train_loss": -10.13735580444336, "global_step": 436503, "epoch": 2598} {"train_loss": -9.815679550170898, "global_step": 436504, "epoch": 2598} {"train_loss": -8.720765113830566, "global_step": 436505, "epoch": 2598} {"train_loss": -9.534205436706543, "global_step": 436506, "epoch": 2598} {"train_loss": -9.80502986907959, "global_step": 436507, "epoch": 2598} {"train_loss": -9.996489524841309, "global_step": 436508, "epoch": 2598} {"train_loss": -9.303375244140625, "global_step": 436509, "epoch": 2598} {"train_loss": -10.560876846313477, "global_step": 436510, "epoch": 2598} {"train_loss": -10.045625686645508, "global_step": 436511, "epoch": 2598} {"train_loss": -10.43105697631836, "global_step": 436512, "epoch": 2598} {"train_loss": -10.524140357971191, "global_step": 436513, "epoch": 2598} {"train_loss": -10.11434555053711, "global_step": 436514, "epoch": 2598} {"train_loss": -10.516901016235352, "global_step": 436515, "epoch": 2598} {"train_loss": -9.674427032470703, "global_step": 436516, "epoch": 2598} {"train_loss": -10.223750114440918, "global_step": 436517, "epoch": 2598} {"train_loss": -10.617450714111328, "global_step": 436518, "epoch": 2598} {"train_loss": -10.844858169555664, "global_step": 436519, "epoch": 2598} {"train_loss": -11.345844268798828, "global_step": 436520, "epoch": 2598} {"train_loss": -11.808719635009766, "global_step": 436521, "epoch": 2598} {"train_loss": -10.951824188232422, "global_step": 436522, "epoch": 2598} {"train_loss": -11.624946594238281, "global_step": 436523, "epoch": 2598} {"train_loss": -10.10127067565918, "global_step": 436524, "epoch": 2598} {"train_loss": -11.357415199279785, "global_step": 436525, "epoch": 2598} {"train_loss": -11.116886138916016, "global_step": 436526, "epoch": 2598} {"train_loss": -10.6846284866333, "global_step": 436527, "epoch": 2598} {"train_loss": -11.463359832763672, "global_step": 436528, "epoch": 2598} {"train_loss": -11.697395324707031, "global_step": 436529, "epoch": 2598} {"train_loss": -11.813667297363281, "global_step": 436530, "epoch": 2598} {"train_loss": -11.564977645874023, "global_step": 436531, "epoch": 2598} {"train_loss": -11.345985412597656, "global_step": 436532, "epoch": 2598} {"train_loss": -11.593957901000977, "global_step": 436533, "epoch": 2598} {"train_loss": -11.250984191894531, "global_step": 436534, "epoch": 2598} {"train_loss": -11.90198040008545, "global_step": 436535, "epoch": 2598} {"train_loss": -11.231334686279297, "global_step": 436536, "epoch": 2598} {"train_loss": -12.015349388122559, "global_step": 436537, "epoch": 2598} {"train_loss": -11.354925155639648, "global_step": 436538, "epoch": 2598} {"train_loss": -11.876081466674805, "global_step": 436539, "epoch": 2598} {"train_loss": -11.75760269165039, "global_step": 436540, "epoch": 2598} {"train_loss": -11.974924087524414, "global_step": 436541, "epoch": 2598} {"train_loss": -11.462651252746582, "global_step": 436542, "epoch": 2598} {"train_loss": -12.293388366699219, "global_step": 436543, "epoch": 2598} {"train_loss": -11.902398109436035, "global_step": 436544, "epoch": 2598} {"train_loss": -12.162038803100586, "global_step": 436545, "epoch": 2598} {"train_loss": -12.375092506408691, "global_step": 436546, "epoch": 2598} {"train_loss": -12.435708999633789, "global_step": 436547, "epoch": 2598} {"train_loss": -12.28065299987793, "global_step": 436548, "epoch": 2598} {"train_loss": -12.295278549194336, "global_step": 436549, "epoch": 2598} {"train_loss": -12.495221138000488, "global_step": 436550, "epoch": 2598} {"train_loss": -12.184080123901367, "global_step": 436551, "epoch": 2598} {"train_loss": -12.291934967041016, "global_step": 436552, "epoch": 2598} {"train_loss": -12.315167427062988, "global_step": 436553, "epoch": 2598} {"train_loss": -12.046908378601074, "global_step": 436554, "epoch": 2598} {"train_loss": -12.589739799499512, "global_step": 436555, "epoch": 2598} {"train_loss": -12.399446487426758, "global_step": 436556, "epoch": 2598} {"train_loss": -12.239056587219238, "global_step": 436557, "epoch": 2598} {"train_loss": -12.329021453857422, "global_step": 436558, "epoch": 2598} {"train_loss": -12.289925575256348, "global_step": 436559, "epoch": 2598} {"train_loss": -12.499469757080078, "global_step": 436560, "epoch": 2598} {"train_loss": -12.387904167175293, "global_step": 436561, "epoch": 2598} {"train_loss": -12.490449905395508, "global_step": 436562, "epoch": 2598} {"train_loss": -12.531020164489746, "global_step": 436563, "epoch": 2598} {"train_loss": -12.379963874816895, "global_step": 436564, "epoch": 2598} {"train_loss": -12.456649780273438, "global_step": 436565, "epoch": 2598} {"train_loss": -12.483683586120605, "global_step": 436566, "epoch": 2598} {"train_loss": -12.599296569824219, "global_step": 436567, "epoch": 2598} {"train_loss": -12.578411102294922, "global_step": 436568, "epoch": 2598} {"train_loss": -12.566089630126953, "global_step": 436569, "epoch": 2598} {"train_loss": -12.788885116577148, "global_step": 436570, "epoch": 2598} {"train_loss": -12.596403121948242, "global_step": 436571, "epoch": 2598} {"train_loss": -12.580907821655273, "global_step": 436572, "epoch": 2598} {"train_loss": -12.649965286254883, "global_step": 436573, "epoch": 2598} {"train_loss": -12.483878135681152, "global_step": 436574, "epoch": 2598} {"train_loss": -12.531755447387695, "global_step": 436575, "epoch": 2598} {"train_loss": -12.611703872680664, "global_step": 436576, "epoch": 2598} {"train_loss": -12.662527084350586, "global_step": 436577, "epoch": 2598} {"train_loss": -12.94162368774414, "global_step": 436578, "epoch": 2598} {"train_loss": -12.547927856445312, "global_step": 436579, "epoch": 2598} {"train_loss": -12.65772819519043, "global_step": 436580, "epoch": 2598} {"train_loss": -12.834342002868652, "global_step": 436581, "epoch": 2598} {"train_loss": -12.644168853759766, "global_step": 436582, "epoch": 2598} {"train_loss": -12.785621643066406, "global_step": 436583, "epoch": 2598} {"train_loss": -12.449053764343262, "global_step": 436584, "epoch": 2598} {"train_loss": -12.522128105163574, "global_step": 436585, "epoch": 2598} {"train_loss": -12.834809303283691, "global_step": 436586, "epoch": 2598} {"train_loss": -12.74108600616455, "global_step": 436587, "epoch": 2598} {"train_loss": -12.696088790893555, "global_step": 436588, "epoch": 2598} {"train_loss": -12.46045970916748, "global_step": 436589, "epoch": 2598} {"train_loss": -12.78861141204834, "global_step": 436590, "epoch": 2598} {"train_loss": -12.941659927368164, "global_step": 436591, "epoch": 2598} {"train_loss": -12.930301666259766, "global_step": 436592, "epoch": 2598} {"train_loss": -12.891870498657227, "global_step": 436593, "epoch": 2598} {"train_loss": -12.597336769104004, "global_step": 436594, "epoch": 2598} {"train_loss": -12.800975799560547, "global_step": 436595, "epoch": 2598} {"train_loss": -12.594293594360352, "global_step": 436596, "epoch": 2598} {"train_loss": -12.878512382507324, "global_step": 436597, "epoch": 2598} {"train_loss": -12.771636009216309, "global_step": 436598, "epoch": 2598} {"train_loss": -12.954729080200195, "global_step": 436599, "epoch": 2598} {"train_loss": -12.674972534179688, "global_step": 436600, "epoch": 2598} {"train_loss": -13.046123504638672, "global_step": 436601, "epoch": 2598} {"train_loss": -12.944189071655273, "global_step": 436602, "epoch": 2598} {"train_loss": -12.908306121826172, "global_step": 436603, "epoch": 2598} {"train_loss": -12.840734481811523, "global_step": 436604, "epoch": 2598} {"train_loss": -12.76090145111084, "global_step": 436605, "epoch": 2598} {"train_loss": -12.806350708007812, "global_step": 436606, "epoch": 2598} {"train_loss": -12.755415916442871, "global_step": 436607, "epoch": 2598} {"train_loss": -12.598796844482422, "global_step": 436608, "epoch": 2598} {"train_loss": -12.827384948730469, "global_step": 436609, "epoch": 2598} {"train_loss": -12.915969848632812, "global_step": 436610, "epoch": 2598} {"train_loss": -12.909021377563477, "global_step": 436611, "epoch": 2598} {"train_loss": -12.920974731445312, "global_step": 436612, "epoch": 2598} {"train_loss": -12.656002044677734, "global_step": 436613, "epoch": 2598} {"train_loss": -12.824993133544922, "global_step": 436614, "epoch": 2598} {"train_loss": -12.681070327758789, "global_step": 436615, "epoch": 2598} {"train_loss": -12.892799377441406, "global_step": 436616, "epoch": 2598} {"train_loss": -12.961260795593262, "global_step": 436617, "epoch": 2598} {"train_loss": -12.72287368774414, "global_step": 436618, "epoch": 2598} {"train_loss": -13.11638069152832, "global_step": 436619, "epoch": 2598} {"train_loss": -12.869401931762695, "global_step": 436620, "epoch": 2598} {"train_loss": -12.785329818725586, "global_step": 436621, "epoch": 2598} {"train_loss": -12.827452659606934, "global_step": 436622, "epoch": 2598} {"train_loss": -12.978692054748535, "global_step": 436623, "epoch": 2598} {"train_loss": -13.158034324645996, "global_step": 436624, "epoch": 2598} {"train_loss": -12.893787384033203, "global_step": 436625, "epoch": 2598} {"train_loss": -12.852405548095703, "global_step": 436626, "epoch": 2598} {"train_loss": -13.167522430419922, "global_step": 436627, "epoch": 2598} {"train_loss": -12.620789527893066, "global_step": 436628, "epoch": 2598} {"train_loss": -11.734437942504883, "global_step": 436629, "epoch": 2598} {"train_loss": -11.257861137390137, "global_step": 436630, "epoch": 2598} {"train_loss": -12.078320940335592, "global_step": 436631, "epoch": 2598, "val_loss": 310427.25} {"train_loss": -12.752248764038086, "global_step": 436632, "epoch": 2599} {"train_loss": -12.645228385925293, "global_step": 436633, "epoch": 2599} {"train_loss": -12.249334335327148, "global_step": 436634, "epoch": 2599} {"train_loss": -10.875968933105469, "global_step": 436635, "epoch": 2599} {"train_loss": -12.673698425292969, "global_step": 436636, "epoch": 2599} {"train_loss": -12.170513153076172, "global_step": 436637, "epoch": 2599} {"train_loss": -11.607958793640137, "global_step": 436638, "epoch": 2599} {"train_loss": -11.565042495727539, "global_step": 436639, "epoch": 2599} {"train_loss": -11.983072280883789, "global_step": 436640, "epoch": 2599} {"train_loss": -11.610746383666992, "global_step": 436641, "epoch": 2599} {"train_loss": -11.066278457641602, "global_step": 436642, "epoch": 2599} {"train_loss": -10.862951278686523, "global_step": 436643, "epoch": 2599} {"train_loss": -10.677824020385742, "global_step": 436644, "epoch": 2599} {"train_loss": -11.7216215133667, "global_step": 436645, "epoch": 2599} {"train_loss": -10.979118347167969, "global_step": 436646, "epoch": 2599} {"train_loss": -11.167612075805664, "global_step": 436647, "epoch": 2599} {"train_loss": -11.899704933166504, "global_step": 436648, "epoch": 2599} {"train_loss": -10.984090805053711, "global_step": 436649, "epoch": 2599} {"train_loss": -10.601091384887695, "global_step": 436650, "epoch": 2599} {"train_loss": -9.414647102355957, "global_step": 436651, "epoch": 2599} {"train_loss": -9.508956909179688, "global_step": 436652, "epoch": 2599} {"train_loss": -9.382295608520508, "global_step": 436653, "epoch": 2599} {"train_loss": -11.15716552734375, "global_step": 436654, "epoch": 2599} {"train_loss": -9.682710647583008, "global_step": 436655, "epoch": 2599} {"train_loss": -10.748098373413086, "global_step": 436656, "epoch": 2599} {"train_loss": -10.377554893493652, "global_step": 436657, "epoch": 2599} {"train_loss": -11.130820274353027, "global_step": 436658, "epoch": 2599} {"train_loss": -10.527040481567383, "global_step": 436659, "epoch": 2599} {"train_loss": -10.626256942749023, "global_step": 436660, "epoch": 2599} {"train_loss": -11.351661682128906, "global_step": 436661, "epoch": 2599} {"train_loss": -10.306005477905273, "global_step": 436662, "epoch": 2599} {"train_loss": -10.804510116577148, "global_step": 436663, "epoch": 2599} {"train_loss": -10.96145248413086, "global_step": 436664, "epoch": 2599} {"train_loss": -10.872339248657227, "global_step": 436665, "epoch": 2599} {"train_loss": -11.677582740783691, "global_step": 436666, "epoch": 2599} {"train_loss": -10.746179580688477, "global_step": 436667, "epoch": 2599} {"train_loss": -11.52444839477539, "global_step": 436668, "epoch": 2599} {"train_loss": -10.895362854003906, "global_step": 436669, "epoch": 2599} {"train_loss": -11.400544166564941, "global_step": 436670, "epoch": 2599} {"train_loss": -11.681955337524414, "global_step": 436671, "epoch": 2599} {"train_loss": -10.809128761291504, "global_step": 436672, "epoch": 2599} {"train_loss": -11.97145938873291, "global_step": 436673, "epoch": 2599} {"train_loss": -11.77110767364502, "global_step": 436674, "epoch": 2599} {"train_loss": -12.046388626098633, "global_step": 436675, "epoch": 2599} {"train_loss": -11.893754959106445, "global_step": 436676, "epoch": 2599} {"train_loss": -11.878207206726074, "global_step": 436677, "epoch": 2599} {"train_loss": -12.26937198638916, "global_step": 436678, "epoch": 2599} {"train_loss": -11.99140739440918, "global_step": 436679, "epoch": 2599} {"train_loss": -12.34548568725586, "global_step": 436680, "epoch": 2599} {"train_loss": -12.261798858642578, "global_step": 436681, "epoch": 2599} {"train_loss": -11.780874252319336, "global_step": 436682, "epoch": 2599} {"train_loss": -12.000350952148438, "global_step": 436683, "epoch": 2599} {"train_loss": -12.355203628540039, "global_step": 436684, "epoch": 2599} {"train_loss": -12.00041675567627, "global_step": 436685, "epoch": 2599} {"train_loss": -12.06907844543457, "global_step": 436686, "epoch": 2599} {"train_loss": -12.327581405639648, "global_step": 436687, "epoch": 2599} {"train_loss": -11.82617473602295, "global_step": 436688, "epoch": 2599} {"train_loss": -12.192264556884766, "global_step": 436689, "epoch": 2599} {"train_loss": -12.316605567932129, "global_step": 436690, "epoch": 2599} {"train_loss": -12.133977890014648, "global_step": 436691, "epoch": 2599} {"train_loss": -11.38614273071289, "global_step": 436692, "epoch": 2599} {"train_loss": -10.87428092956543, "global_step": 436693, "epoch": 2599} {"train_loss": -11.90676498413086, "global_step": 436694, "epoch": 2599} {"train_loss": -11.101428985595703, "global_step": 436695, "epoch": 2599} {"train_loss": -11.624409675598145, "global_step": 436696, "epoch": 2599} {"train_loss": -11.854832649230957, "global_step": 436697, "epoch": 2599} {"train_loss": -12.155356407165527, "global_step": 436698, "epoch": 2599} {"train_loss": -11.456080436706543, "global_step": 436699, "epoch": 2599} {"train_loss": -12.050972938537598, "global_step": 436700, "epoch": 2599} {"train_loss": -11.748785972595215, "global_step": 436701, "epoch": 2599} {"train_loss": -12.343782424926758, "global_step": 436702, "epoch": 2599} {"train_loss": -11.964231491088867, "global_step": 436703, "epoch": 2599} {"train_loss": -12.019098281860352, "global_step": 436704, "epoch": 2599} {"train_loss": -11.803518295288086, "global_step": 436705, "epoch": 2599} {"train_loss": -11.561574935913086, "global_step": 436706, "epoch": 2599} {"train_loss": -12.108152389526367, "global_step": 436707, "epoch": 2599} {"train_loss": -11.67521858215332, "global_step": 436708, "epoch": 2599} {"train_loss": -12.385807037353516, "global_step": 436709, "epoch": 2599} {"train_loss": -11.846607208251953, "global_step": 436710, "epoch": 2599} {"train_loss": -12.209449768066406, "global_step": 436711, "epoch": 2599} {"train_loss": -12.219114303588867, "global_step": 436712, "epoch": 2599} {"train_loss": -12.024702072143555, "global_step": 436713, "epoch": 2599} {"train_loss": -12.403512954711914, "global_step": 436714, "epoch": 2599} {"train_loss": -12.253908157348633, "global_step": 436715, "epoch": 2599} {"train_loss": -12.529216766357422, "global_step": 436716, "epoch": 2599} {"train_loss": -12.46315860748291, "global_step": 436717, "epoch": 2599} {"train_loss": -12.208707809448242, "global_step": 436718, "epoch": 2599} {"train_loss": -12.258697509765625, "global_step": 436719, "epoch": 2599} {"train_loss": -12.31797981262207, "global_step": 436720, "epoch": 2599} {"train_loss": -12.414737701416016, "global_step": 436721, "epoch": 2599} {"train_loss": -12.424179077148438, "global_step": 436722, "epoch": 2599} {"train_loss": -12.505071640014648, "global_step": 436723, "epoch": 2599} {"train_loss": -12.387182235717773, "global_step": 436724, "epoch": 2599} {"train_loss": -12.711469650268555, "global_step": 436725, "epoch": 2599} {"train_loss": -12.465093612670898, "global_step": 436726, "epoch": 2599} {"train_loss": -12.183124542236328, "global_step": 436727, "epoch": 2599} {"train_loss": -12.579143524169922, "global_step": 436728, "epoch": 2599} {"train_loss": -12.47005844116211, "global_step": 436729, "epoch": 2599} {"train_loss": -12.563861846923828, "global_step": 436730, "epoch": 2599} {"train_loss": -12.617690086364746, "global_step": 436731, "epoch": 2599} {"train_loss": -12.449174880981445, "global_step": 436732, "epoch": 2599} {"train_loss": -12.761652946472168, "global_step": 436733, "epoch": 2599} {"train_loss": -12.520185470581055, "global_step": 436734, "epoch": 2599} {"train_loss": -12.667742729187012, "global_step": 436735, "epoch": 2599} {"train_loss": -12.761159896850586, "global_step": 436736, "epoch": 2599} {"train_loss": -12.411288261413574, "global_step": 436737, "epoch": 2599} {"train_loss": -12.746152877807617, "global_step": 436738, "epoch": 2599} {"train_loss": -12.38701057434082, "global_step": 436739, "epoch": 2599} {"train_loss": -12.837118148803711, "global_step": 436740, "epoch": 2599} {"train_loss": -12.632286071777344, "global_step": 436741, "epoch": 2599} {"train_loss": -12.498594284057617, "global_step": 436742, "epoch": 2599} {"train_loss": -12.680481910705566, "global_step": 436743, "epoch": 2599} {"train_loss": -12.492815017700195, "global_step": 436744, "epoch": 2599} {"train_loss": -12.657689094543457, "global_step": 436745, "epoch": 2599} {"train_loss": -12.800548553466797, "global_step": 436746, "epoch": 2599} {"train_loss": -12.677968978881836, "global_step": 436747, "epoch": 2599} {"train_loss": -12.809774398803711, "global_step": 436748, "epoch": 2599} {"train_loss": -12.637981414794922, "global_step": 436749, "epoch": 2599} {"train_loss": -12.567358016967773, "global_step": 436750, "epoch": 2599} {"train_loss": -12.716487884521484, "global_step": 436751, "epoch": 2599} {"train_loss": -12.867607116699219, "global_step": 436752, "epoch": 2599} {"train_loss": -12.837711334228516, "global_step": 436753, "epoch": 2599} {"train_loss": -12.515804290771484, "global_step": 436754, "epoch": 2599} {"train_loss": -12.82740592956543, "global_step": 436755, "epoch": 2599} {"train_loss": -12.57174015045166, "global_step": 436756, "epoch": 2599} {"train_loss": -12.750015258789062, "global_step": 436757, "epoch": 2599} {"train_loss": -12.851978302001953, "global_step": 436758, "epoch": 2599} {"train_loss": -12.820574760437012, "global_step": 436759, "epoch": 2599} {"train_loss": -12.722847938537598, "global_step": 436760, "epoch": 2599} {"train_loss": -12.637195587158203, "global_step": 436761, "epoch": 2599} {"train_loss": -12.491718292236328, "global_step": 436762, "epoch": 2599} {"train_loss": -12.620107650756836, "global_step": 436763, "epoch": 2599} {"train_loss": -12.544017791748047, "global_step": 436764, "epoch": 2599} {"train_loss": -12.076762199401855, "global_step": 436765, "epoch": 2599} {"train_loss": -11.819502830505371, "global_step": 436766, "epoch": 2599} {"train_loss": -11.070676803588867, "global_step": 436767, "epoch": 2599} {"train_loss": -12.232275009155273, "global_step": 436768, "epoch": 2599} {"train_loss": -11.795376777648926, "global_step": 436769, "epoch": 2599} {"train_loss": -10.591442108154297, "global_step": 436770, "epoch": 2599} {"train_loss": -11.056448936462402, "global_step": 436771, "epoch": 2599} {"train_loss": -12.290857315063477, "global_step": 436772, "epoch": 2599} {"train_loss": -11.020163536071777, "global_step": 436773, "epoch": 2599} {"train_loss": -10.651899337768555, "global_step": 436774, "epoch": 2599} {"train_loss": -11.825689315795898, "global_step": 436775, "epoch": 2599} {"train_loss": -12.253498077392578, "global_step": 436776, "epoch": 2599} {"train_loss": -10.793320655822754, "global_step": 436777, "epoch": 2599} {"train_loss": -12.365312576293945, "global_step": 436778, "epoch": 2599} {"train_loss": -12.049165725708008, "global_step": 436779, "epoch": 2599} {"train_loss": -11.572790145874023, "global_step": 436780, "epoch": 2599} {"train_loss": -11.716670989990234, "global_step": 436781, "epoch": 2599} {"train_loss": -12.633298873901367, "global_step": 436782, "epoch": 2599} {"train_loss": -12.104347229003906, "global_step": 436783, "epoch": 2599} {"train_loss": -12.032461166381836, "global_step": 436784, "epoch": 2599} {"train_loss": -12.616796493530273, "global_step": 436785, "epoch": 2599} {"train_loss": -12.001791000366211, "global_step": 436786, "epoch": 2599} {"train_loss": -12.353166580200195, "global_step": 436787, "epoch": 2599} {"train_loss": -12.295184135437012, "global_step": 436788, "epoch": 2599} {"train_loss": -12.293089866638184, "global_step": 436789, "epoch": 2599} {"train_loss": -12.547698020935059, "global_step": 436790, "epoch": 2599} {"train_loss": -12.562731742858887, "global_step": 436791, "epoch": 2599} {"train_loss": -12.140792846679688, "global_step": 436792, "epoch": 2599} {"train_loss": -12.42912483215332, "global_step": 436793, "epoch": 2599} {"train_loss": -12.665637969970703, "global_step": 436794, "epoch": 2599} {"train_loss": -11.864988327026367, "global_step": 436795, "epoch": 2599} {"train_loss": -12.611610412597656, "global_step": 436796, "epoch": 2599} {"train_loss": -12.3494291305542, "global_step": 436797, "epoch": 2599} {"train_loss": -12.353596687316895, "global_step": 436798, "epoch": 2599} {"train_loss": -11.941457742736453, "global_step": 436799, "epoch": 2599, "val_loss": 310142.875} {"train_loss": -12.32560920715332, "global_step": 436800, "epoch": 2600} {"train_loss": -12.272989273071289, "global_step": 436801, "epoch": 2600} {"train_loss": -12.494424819946289, "global_step": 436802, "epoch": 2600} {"train_loss": -12.600786209106445, "global_step": 436803, "epoch": 2600} {"train_loss": -12.349732398986816, "global_step": 436804, "epoch": 2600} {"train_loss": -11.870813369750977, "global_step": 436805, "epoch": 2600} {"train_loss": -12.403459548950195, "global_step": 436806, "epoch": 2600} {"train_loss": -12.30160903930664, "global_step": 436807, "epoch": 2600} {"train_loss": -12.570816040039062, "global_step": 436808, "epoch": 2600} {"train_loss": -12.570627212524414, "global_step": 436809, "epoch": 2600} {"train_loss": -12.746710777282715, "global_step": 436810, "epoch": 2600} {"train_loss": -12.518190383911133, "global_step": 436811, "epoch": 2600} {"train_loss": -12.709381103515625, "global_step": 436812, "epoch": 2600} {"train_loss": -12.833525657653809, "global_step": 436813, "epoch": 2600} {"train_loss": -12.754691123962402, "global_step": 436814, "epoch": 2600} {"train_loss": -12.362356185913086, "global_step": 436815, "epoch": 2600} {"train_loss": -12.828826904296875, "global_step": 436816, "epoch": 2600} {"train_loss": -12.587471961975098, "global_step": 436817, "epoch": 2600} {"train_loss": -12.423660278320312, "global_step": 436818, "epoch": 2600} {"train_loss": -12.87492561340332, "global_step": 436819, "epoch": 2600} {"train_loss": -12.493732452392578, "global_step": 436820, "epoch": 2600} {"train_loss": -12.622918128967285, "global_step": 436821, "epoch": 2600} {"train_loss": -12.496702194213867, "global_step": 436822, "epoch": 2600} {"train_loss": -12.601057052612305, "global_step": 436823, "epoch": 2600} {"train_loss": -11.825382232666016, "global_step": 436824, "epoch": 2600} {"train_loss": -12.506267547607422, "global_step": 436825, "epoch": 2600} {"train_loss": -12.600931167602539, "global_step": 436826, "epoch": 2600} {"train_loss": -12.09006404876709, "global_step": 436827, "epoch": 2600} {"train_loss": -11.91032600402832, "global_step": 436828, "epoch": 2600} {"train_loss": -12.154027938842773, "global_step": 436829, "epoch": 2600} {"train_loss": -12.15462875366211, "global_step": 436830, "epoch": 2600} {"train_loss": -12.311903953552246, "global_step": 436831, "epoch": 2600} {"train_loss": -11.545465469360352, "global_step": 436832, "epoch": 2600} {"train_loss": -12.353110313415527, "global_step": 436833, "epoch": 2600} {"train_loss": -12.494184494018555, "global_step": 436834, "epoch": 2600} {"train_loss": -12.165824890136719, "global_step": 436835, "epoch": 2600} {"train_loss": -12.747273445129395, "global_step": 436836, "epoch": 2600} {"train_loss": -12.349983215332031, "global_step": 436837, "epoch": 2600} {"train_loss": -11.852231979370117, "global_step": 436838, "epoch": 2600} {"train_loss": -12.542444229125977, "global_step": 436839, "epoch": 2600} {"train_loss": -12.403672218322754, "global_step": 436840, "epoch": 2600} {"train_loss": -12.49410629272461, "global_step": 436841, "epoch": 2600} {"train_loss": -12.452032089233398, "global_step": 436842, "epoch": 2600} {"train_loss": -12.538969993591309, "global_step": 436843, "epoch": 2600} {"train_loss": -12.414653778076172, "global_step": 436844, "epoch": 2600} {"train_loss": -11.96425724029541, "global_step": 436845, "epoch": 2600} {"train_loss": -11.872695922851562, "global_step": 436846, "epoch": 2600} {"train_loss": -12.541251182556152, "global_step": 436847, "epoch": 2600} {"train_loss": -11.964361190795898, "global_step": 436848, "epoch": 2600} {"train_loss": -11.881009101867676, "global_step": 436849, "epoch": 2600} {"train_loss": -12.542829513549805, "global_step": 436850, "epoch": 2600} {"train_loss": -11.999601364135742, "global_step": 436851, "epoch": 2600} {"train_loss": -11.853925704956055, "global_step": 436852, "epoch": 2600} {"train_loss": -12.600531578063965, "global_step": 436853, "epoch": 2600} {"train_loss": -11.99757194519043, "global_step": 436854, "epoch": 2600} {"train_loss": -11.938934326171875, "global_step": 436855, "epoch": 2600} {"train_loss": -12.620234489440918, "global_step": 436856, "epoch": 2600} {"train_loss": -12.136033058166504, "global_step": 436857, "epoch": 2600} {"train_loss": -12.270678520202637, "global_step": 436858, "epoch": 2600} {"train_loss": -12.498037338256836, "global_step": 436859, "epoch": 2600} {"train_loss": -12.254096984863281, "global_step": 436860, "epoch": 2600} {"train_loss": -12.742252349853516, "global_step": 436861, "epoch": 2600} {"train_loss": -12.200777053833008, "global_step": 436862, "epoch": 2600} {"train_loss": -12.321168899536133, "global_step": 436863, "epoch": 2600} {"train_loss": -11.714654922485352, "global_step": 436864, "epoch": 2600} {"train_loss": -11.662992477416992, "global_step": 436865, "epoch": 2600} {"train_loss": -12.01283073425293, "global_step": 436866, "epoch": 2600} {"train_loss": -12.403053283691406, "global_step": 436867, "epoch": 2600} {"train_loss": -11.75466251373291, "global_step": 436868, "epoch": 2600} {"train_loss": -11.839099884033203, "global_step": 436869, "epoch": 2600} {"train_loss": -11.830512046813965, "global_step": 436870, "epoch": 2600} {"train_loss": -11.955181121826172, "global_step": 436871, "epoch": 2600} {"train_loss": -12.200531005859375, "global_step": 436872, "epoch": 2600} {"train_loss": -12.38725471496582, "global_step": 436873, "epoch": 2600} {"train_loss": -12.46060562133789, "global_step": 436874, "epoch": 2600} {"train_loss": -12.177827835083008, "global_step": 436875, "epoch": 2600} {"train_loss": -12.387006759643555, "global_step": 436876, "epoch": 2600} {"train_loss": -12.165206909179688, "global_step": 436877, "epoch": 2600} {"train_loss": -12.638495445251465, "global_step": 436878, "epoch": 2600} {"train_loss": -12.167984008789062, "global_step": 436879, "epoch": 2600} {"train_loss": -12.244844436645508, "global_step": 436880, "epoch": 2600} {"train_loss": -12.10946273803711, "global_step": 436881, "epoch": 2600} {"train_loss": -11.664421081542969, "global_step": 436882, "epoch": 2600} {"train_loss": -12.661888122558594, "global_step": 436883, "epoch": 2600} {"train_loss": -11.571188926696777, "global_step": 436884, "epoch": 2600} {"train_loss": -12.065146446228027, "global_step": 436885, "epoch": 2600} {"train_loss": -12.490009307861328, "global_step": 436886, "epoch": 2600} {"train_loss": -11.99287223815918, "global_step": 436887, "epoch": 2600} {"train_loss": -12.323619842529297, "global_step": 436888, "epoch": 2600} {"train_loss": -11.846078872680664, "global_step": 436889, "epoch": 2600} {"train_loss": -11.489758491516113, "global_step": 436890, "epoch": 2600} {"train_loss": -12.45126724243164, "global_step": 436891, "epoch": 2600} {"train_loss": -12.02861213684082, "global_step": 436892, "epoch": 2600} {"train_loss": -12.073073387145996, "global_step": 436893, "epoch": 2600} {"train_loss": -11.443428993225098, "global_step": 436894, "epoch": 2600} {"train_loss": -12.391962051391602, "global_step": 436895, "epoch": 2600} {"train_loss": -12.076465606689453, "global_step": 436896, "epoch": 2600} {"train_loss": -11.163330078125, "global_step": 436897, "epoch": 2600} {"train_loss": -11.826412200927734, "global_step": 436898, "epoch": 2600} {"train_loss": -9.305438995361328, "global_step": 436899, "epoch": 2600} {"train_loss": -10.408608436584473, "global_step": 436900, "epoch": 2600} {"train_loss": -10.971771240234375, "global_step": 436901, "epoch": 2600} {"train_loss": -10.918314933776855, "global_step": 436902, "epoch": 2600} {"train_loss": -10.695669174194336, "global_step": 436903, "epoch": 2600} {"train_loss": -11.033411026000977, "global_step": 436904, "epoch": 2600} {"train_loss": -11.04449462890625, "global_step": 436905, "epoch": 2600} {"train_loss": -10.957261085510254, "global_step": 436906, "epoch": 2600} {"train_loss": -10.550397872924805, "global_step": 436907, "epoch": 2600} {"train_loss": -9.989097595214844, "global_step": 436908, "epoch": 2600} {"train_loss": -10.873220443725586, "global_step": 436909, "epoch": 2600} {"train_loss": -11.34495735168457, "global_step": 436910, "epoch": 2600} {"train_loss": -11.116682052612305, "global_step": 436911, "epoch": 2600} {"train_loss": -10.723241806030273, "global_step": 436912, "epoch": 2600} {"train_loss": -10.258201599121094, "global_step": 436913, "epoch": 2600} {"train_loss": -11.784241676330566, "global_step": 436914, "epoch": 2600} {"train_loss": -8.57399845123291, "global_step": 436915, "epoch": 2600} {"train_loss": -11.548331260681152, "global_step": 436916, "epoch": 2600} {"train_loss": -10.155899047851562, "global_step": 436917, "epoch": 2600} {"train_loss": -10.375936508178711, "global_step": 436918, "epoch": 2600} {"train_loss": -11.283143997192383, "global_step": 436919, "epoch": 2600} {"train_loss": -10.951403617858887, "global_step": 436920, "epoch": 2600} {"train_loss": -10.833662033081055, "global_step": 436921, "epoch": 2600} {"train_loss": -12.102191925048828, "global_step": 436922, "epoch": 2600} {"train_loss": -11.078510284423828, "global_step": 436923, "epoch": 2600} {"train_loss": -11.76414680480957, "global_step": 436924, "epoch": 2600} {"train_loss": -11.340965270996094, "global_step": 436925, "epoch": 2600} {"train_loss": -11.957530975341797, "global_step": 436926, "epoch": 2600} {"train_loss": -11.650557518005371, "global_step": 436927, "epoch": 2600} {"train_loss": -11.858715057373047, "global_step": 436928, "epoch": 2600} {"train_loss": -11.848444938659668, "global_step": 436929, "epoch": 2600} {"train_loss": -12.051074028015137, "global_step": 436930, "epoch": 2600} {"train_loss": -11.979659080505371, "global_step": 436931, "epoch": 2600} {"train_loss": -11.8955717086792, "global_step": 436932, "epoch": 2600} {"train_loss": -12.438352584838867, "global_step": 436933, "epoch": 2600} {"train_loss": -12.201103210449219, "global_step": 436934, "epoch": 2600} {"train_loss": -12.226984024047852, "global_step": 436935, "epoch": 2600} {"train_loss": -11.758488655090332, "global_step": 436936, "epoch": 2600} {"train_loss": -12.25399398803711, "global_step": 436937, "epoch": 2600} {"train_loss": -11.918302536010742, "global_step": 436938, "epoch": 2600} {"train_loss": -12.214563369750977, "global_step": 436939, "epoch": 2600} {"train_loss": -11.944623947143555, "global_step": 436940, "epoch": 2600} {"train_loss": -12.321606636047363, "global_step": 436941, "epoch": 2600} {"train_loss": -12.025629043579102, "global_step": 436942, "epoch": 2600} {"train_loss": -12.330546379089355, "global_step": 436943, "epoch": 2600} {"train_loss": -12.31982421875, "global_step": 436944, "epoch": 2600} {"train_loss": -12.498185157775879, "global_step": 436945, "epoch": 2600} {"train_loss": -12.523794174194336, "global_step": 436946, "epoch": 2600} {"train_loss": -12.41659164428711, "global_step": 436947, "epoch": 2600} {"train_loss": -12.548393249511719, "global_step": 436948, "epoch": 2600} {"train_loss": -12.452991485595703, "global_step": 436949, "epoch": 2600} {"train_loss": -12.414409637451172, "global_step": 436950, "epoch": 2600} {"train_loss": -12.497689247131348, "global_step": 436951, "epoch": 2600} {"train_loss": -12.40684700012207, "global_step": 436952, "epoch": 2600} {"train_loss": -12.530433654785156, "global_step": 436953, "epoch": 2600} {"train_loss": -12.686689376831055, "global_step": 436954, "epoch": 2600} {"train_loss": -12.228429794311523, "global_step": 436955, "epoch": 2600} {"train_loss": -12.502554893493652, "global_step": 436956, "epoch": 2600} {"train_loss": -12.247896194458008, "global_step": 436957, "epoch": 2600} {"train_loss": -12.669662475585938, "global_step": 436958, "epoch": 2600} {"train_loss": -12.344930648803711, "global_step": 436959, "epoch": 2600} {"train_loss": -12.593711853027344, "global_step": 436960, "epoch": 2600} {"train_loss": -12.484922409057617, "global_step": 436961, "epoch": 2600} {"train_loss": -12.7161226272583, "global_step": 436962, "epoch": 2600} {"train_loss": -12.440507888793945, "global_step": 436963, "epoch": 2600} {"train_loss": -12.420585632324219, "global_step": 436964, "epoch": 2600} {"train_loss": -12.424304962158203, "global_step": 436965, "epoch": 2600} {"train_loss": -12.69854736328125, "global_step": 436966, "epoch": 2600} {"train_loss": -12.029996764092218, "global_step": 436967, "epoch": 2600, "train/sim_max_reward_0": 0.6573402083952082, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.0008368713314036051, "train/sim_max_reward_3": 0.9932414722959454, "train/sim_max_reward_4": 0.5078785555964374, "train/sim_max_reward_5": 0.48545122027221305, "test/sim_max_reward_4400000": 0.9118427796429063, "test/sim_max_reward_4400001": 0.5166965212121263, "test/sim_max_reward_4400002": 0.06098237626791881, "test/sim_max_reward_4400003": 0.04259125932569781, "test/sim_max_reward_4400004": 0.9338298468805585, "test/sim_max_reward_4400005": 0.9353585781587016, "test/sim_max_reward_4400006": 0.5602884023601216, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.6246032363794075, "test/sim_max_reward_4400009": 0.3839501665149206, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 0.9567426807269755, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.8885044079176104, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.6931489930212157, "test/sim_max_reward_4400022": 0.9189098327035852, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.6252129640937735, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.17081512237449448, "test/sim_max_reward_4400028": 0.9785686726194086, "test/sim_max_reward_4400029": 0.8981442167648328, "test/sim_max_reward_4400030": 0.9926740157602798, "test/sim_max_reward_4400031": 0.9887501151520934, "test/sim_max_reward_4400032": 0.17402414255881288, "test/sim_max_reward_4400033": 0.9918791716002398, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.9641474815578382, "test/sim_max_reward_4400036": 0.3514598260141307, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.3064513782266675, "test/sim_max_reward_4400039": 0.9460014090338236, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.9016252845337105, "test/sim_max_reward_4400042": 0.09037855683109404, "test/sim_max_reward_4400043": 0.022320352865519363, "test/sim_max_reward_4400044": 1.0, "test/sim_max_reward_4400045": 0.0, "test/sim_max_reward_4400046": 0.3132662752089699, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6074580546485345, "test/mean_score": 0.5070179804909903, "val_loss": 310516.34375, "train_action_mse_error": 2.050616979598999} {"train_loss": -12.452800750732422, "global_step": 436968, "epoch": 2601} {"train_loss": -12.619977951049805, "global_step": 436969, "epoch": 2601} {"train_loss": -12.721402168273926, "global_step": 436970, "epoch": 2601} {"train_loss": -12.687328338623047, "global_step": 436971, "epoch": 2601} {"train_loss": -12.709174156188965, "global_step": 436972, "epoch": 2601} {"train_loss": -12.572443008422852, "global_step": 436973, "epoch": 2601} {"train_loss": -12.391420364379883, "global_step": 436974, "epoch": 2601} {"train_loss": -12.7472505569458, "global_step": 436975, "epoch": 2601} {"train_loss": -12.592973709106445, "global_step": 436976, "epoch": 2601} {"train_loss": -12.520877838134766, "global_step": 436977, "epoch": 2601} {"train_loss": -12.471569061279297, "global_step": 436978, "epoch": 2601} {"train_loss": -12.70086669921875, "global_step": 436979, "epoch": 2601} {"train_loss": -12.685657501220703, "global_step": 436980, "epoch": 2601} {"train_loss": -12.614571571350098, "global_step": 436981, "epoch": 2601} {"train_loss": -12.594168663024902, "global_step": 436982, "epoch": 2601} {"train_loss": -12.66556453704834, "global_step": 436983, "epoch": 2601} {"train_loss": -12.720880508422852, "global_step": 436984, "epoch": 2601} {"train_loss": -12.5343599319458, "global_step": 436985, "epoch": 2601} {"train_loss": -12.425426483154297, "global_step": 436986, "epoch": 2601} {"train_loss": -12.62255859375, "global_step": 436987, "epoch": 2601} {"train_loss": -12.39142894744873, "global_step": 436988, "epoch": 2601} {"train_loss": -12.594819068908691, "global_step": 436989, "epoch": 2601} {"train_loss": -12.546456336975098, "global_step": 436990, "epoch": 2601} {"train_loss": -12.638130187988281, "global_step": 436991, "epoch": 2601} {"train_loss": -12.424360275268555, "global_step": 436992, "epoch": 2601} {"train_loss": -12.565701484680176, "global_step": 436993, "epoch": 2601} {"train_loss": -12.789423942565918, "global_step": 436994, "epoch": 2601} {"train_loss": -12.885848999023438, "global_step": 436995, "epoch": 2601} {"train_loss": -12.52532958984375, "global_step": 436996, "epoch": 2601} {"train_loss": -12.814569473266602, "global_step": 436997, "epoch": 2601} {"train_loss": -12.649148941040039, "global_step": 436998, "epoch": 2601} {"train_loss": -12.520630836486816, "global_step": 436999, "epoch": 2601} {"train_loss": -12.743260383605957, "global_step": 437000, "epoch": 2601} {"train_loss": -12.871360778808594, "global_step": 437001, "epoch": 2601} {"train_loss": -12.69083309173584, "global_step": 437002, "epoch": 2601} {"train_loss": -12.629034042358398, "global_step": 437003, "epoch": 2601} {"train_loss": -12.685504913330078, "global_step": 437004, "epoch": 2601} {"train_loss": -12.743204116821289, "global_step": 437005, "epoch": 2601} {"train_loss": -12.527617454528809, "global_step": 437006, "epoch": 2601} {"train_loss": -12.372102737426758, "global_step": 437007, "epoch": 2601} {"train_loss": -12.484350204467773, "global_step": 437008, "epoch": 2601} {"train_loss": -12.443269729614258, "global_step": 437009, "epoch": 2601} {"train_loss": -12.504173278808594, "global_step": 437010, "epoch": 2601} {"train_loss": -12.828338623046875, "global_step": 437011, "epoch": 2601} {"train_loss": -12.389383316040039, "global_step": 437012, "epoch": 2601} {"train_loss": -12.25197696685791, "global_step": 437013, "epoch": 2601} {"train_loss": -12.747517585754395, "global_step": 437014, "epoch": 2601} {"train_loss": -12.923203468322754, "global_step": 437015, "epoch": 2601} {"train_loss": -12.55510425567627, "global_step": 437016, "epoch": 2601} {"train_loss": -12.802297592163086, "global_step": 437017, "epoch": 2601} {"train_loss": -12.684839248657227, "global_step": 437018, "epoch": 2601} {"train_loss": -12.168218612670898, "global_step": 437019, "epoch": 2601} {"train_loss": -12.883064270019531, "global_step": 437020, "epoch": 2601} {"train_loss": -12.72304630279541, "global_step": 437021, "epoch": 2601} {"train_loss": -12.68438720703125, "global_step": 437022, "epoch": 2601} {"train_loss": -12.775402069091797, "global_step": 437023, "epoch": 2601} {"train_loss": -12.867916107177734, "global_step": 437024, "epoch": 2601} {"train_loss": -12.781951904296875, "global_step": 437025, "epoch": 2601} {"train_loss": -12.877252578735352, "global_step": 437026, "epoch": 2601} {"train_loss": -12.790362358093262, "global_step": 437027, "epoch": 2601} {"train_loss": -12.644103050231934, "global_step": 437028, "epoch": 2601} {"train_loss": -12.521824836730957, "global_step": 437029, "epoch": 2601} {"train_loss": -12.852848052978516, "global_step": 437030, "epoch": 2601} {"train_loss": -12.641643524169922, "global_step": 437031, "epoch": 2601} {"train_loss": -12.116080284118652, "global_step": 437032, "epoch": 2601} {"train_loss": -11.375934600830078, "global_step": 437033, "epoch": 2601} {"train_loss": -12.7486572265625, "global_step": 437034, "epoch": 2601} {"train_loss": -11.951099395751953, "global_step": 437035, "epoch": 2601} {"train_loss": -9.105459213256836, "global_step": 437036, "epoch": 2601} {"train_loss": -9.167299270629883, "global_step": 437037, "epoch": 2601} {"train_loss": -10.964433670043945, "global_step": 437038, "epoch": 2601} {"train_loss": -11.164656639099121, "global_step": 437039, "epoch": 2601} {"train_loss": -8.735832214355469, "global_step": 437040, "epoch": 2601} {"train_loss": -10.66098403930664, "global_step": 437041, "epoch": 2601} {"train_loss": -9.517483711242676, "global_step": 437042, "epoch": 2601} {"train_loss": -11.397584915161133, "global_step": 437043, "epoch": 2601} {"train_loss": -10.197192192077637, "global_step": 437044, "epoch": 2601} {"train_loss": -8.964601516723633, "global_step": 437045, "epoch": 2601} {"train_loss": -10.337406158447266, "global_step": 437046, "epoch": 2601} {"train_loss": -6.280435562133789, "global_step": 437047, "epoch": 2601} {"train_loss": -7.6747145652771, "global_step": 437048, "epoch": 2601} {"train_loss": -7.001042366027832, "global_step": 437049, "epoch": 2601} {"train_loss": -6.528829574584961, "global_step": 437050, "epoch": 2601} {"train_loss": -7.581004619598389, "global_step": 437051, "epoch": 2601} {"train_loss": -8.336238861083984, "global_step": 437052, "epoch": 2601} {"train_loss": -7.796685695648193, "global_step": 437053, "epoch": 2601} {"train_loss": -6.909167289733887, "global_step": 437054, "epoch": 2601} {"train_loss": -8.250600814819336, "global_step": 437055, "epoch": 2601} {"train_loss": -8.126791000366211, "global_step": 437056, "epoch": 2601} {"train_loss": -7.504474639892578, "global_step": 437057, "epoch": 2601} {"train_loss": -7.61376953125, "global_step": 437058, "epoch": 2601} {"train_loss": -7.778488636016846, "global_step": 437059, "epoch": 2601} {"train_loss": -7.997453212738037, "global_step": 437060, "epoch": 2601} {"train_loss": -7.894495487213135, "global_step": 437061, "epoch": 2601} {"train_loss": -8.555980682373047, "global_step": 437062, "epoch": 2601} {"train_loss": -9.087690353393555, "global_step": 437063, "epoch": 2601} {"train_loss": -8.053350448608398, "global_step": 437064, "epoch": 2601} {"train_loss": -9.1393461227417, "global_step": 437065, "epoch": 2601} {"train_loss": -9.483177185058594, "global_step": 437066, "epoch": 2601} {"train_loss": -9.66771125793457, "global_step": 437067, "epoch": 2601} {"train_loss": -8.683794021606445, "global_step": 437068, "epoch": 2601} {"train_loss": -9.353565216064453, "global_step": 437069, "epoch": 2601} {"train_loss": -9.919188499450684, "global_step": 437070, "epoch": 2601} {"train_loss": -10.53676986694336, "global_step": 437071, "epoch": 2601} {"train_loss": -9.902776718139648, "global_step": 437072, "epoch": 2601} {"train_loss": -9.784414291381836, "global_step": 437073, "epoch": 2601} {"train_loss": -9.656303405761719, "global_step": 437074, "epoch": 2601} {"train_loss": -10.421533584594727, "global_step": 437075, "epoch": 2601} {"train_loss": -10.649091720581055, "global_step": 437076, "epoch": 2601} {"train_loss": -10.532510757446289, "global_step": 437077, "epoch": 2601} {"train_loss": -10.482608795166016, "global_step": 437078, "epoch": 2601} {"train_loss": -11.007654190063477, "global_step": 437079, "epoch": 2601} {"train_loss": -11.01327133178711, "global_step": 437080, "epoch": 2601} {"train_loss": -11.663619995117188, "global_step": 437081, "epoch": 2601} {"train_loss": -11.098262786865234, "global_step": 437082, "epoch": 2601} {"train_loss": -11.559538841247559, "global_step": 437083, "epoch": 2601} {"train_loss": -11.14100456237793, "global_step": 437084, "epoch": 2601} {"train_loss": -11.420242309570312, "global_step": 437085, "epoch": 2601} {"train_loss": -11.638288497924805, "global_step": 437086, "epoch": 2601} {"train_loss": -11.652477264404297, "global_step": 437087, "epoch": 2601} {"train_loss": -11.787521362304688, "global_step": 437088, "epoch": 2601} {"train_loss": -12.022966384887695, "global_step": 437089, "epoch": 2601} {"train_loss": -11.661184310913086, "global_step": 437090, "epoch": 2601} {"train_loss": -11.660993576049805, "global_step": 437091, "epoch": 2601} {"train_loss": -11.490744590759277, "global_step": 437092, "epoch": 2601} {"train_loss": -11.689018249511719, "global_step": 437093, "epoch": 2601} {"train_loss": -11.944053649902344, "global_step": 437094, "epoch": 2601} {"train_loss": -11.76270866394043, "global_step": 437095, "epoch": 2601} {"train_loss": -11.956416130065918, "global_step": 437096, "epoch": 2601} {"train_loss": -11.901965141296387, "global_step": 437097, "epoch": 2601} {"train_loss": -11.88947868347168, "global_step": 437098, "epoch": 2601} {"train_loss": -12.047294616699219, "global_step": 437099, "epoch": 2601} {"train_loss": -11.8544282913208, "global_step": 437100, "epoch": 2601} {"train_loss": -12.042369842529297, "global_step": 437101, "epoch": 2601} {"train_loss": -12.61903190612793, "global_step": 437102, "epoch": 2601} {"train_loss": -11.94095230102539, "global_step": 437103, "epoch": 2601} {"train_loss": -12.107942581176758, "global_step": 437104, "epoch": 2601} {"train_loss": -12.083155632019043, "global_step": 437105, "epoch": 2601} {"train_loss": -12.156012535095215, "global_step": 437106, "epoch": 2601} {"train_loss": -11.843754768371582, "global_step": 437107, "epoch": 2601} {"train_loss": -12.364949226379395, "global_step": 437108, "epoch": 2601} {"train_loss": -12.089048385620117, "global_step": 437109, "epoch": 2601} {"train_loss": -12.213687896728516, "global_step": 437110, "epoch": 2601} {"train_loss": -11.871353149414062, "global_step": 437111, "epoch": 2601} {"train_loss": -12.355945587158203, "global_step": 437112, "epoch": 2601} {"train_loss": -12.222099304199219, "global_step": 437113, "epoch": 2601} {"train_loss": -12.035100936889648, "global_step": 437114, "epoch": 2601} {"train_loss": -12.151870727539062, "global_step": 437115, "epoch": 2601} {"train_loss": -11.940408706665039, "global_step": 437116, "epoch": 2601} {"train_loss": -12.328845024108887, "global_step": 437117, "epoch": 2601} {"train_loss": -12.184041976928711, "global_step": 437118, "epoch": 2601} {"train_loss": -12.4066743850708, "global_step": 437119, "epoch": 2601} {"train_loss": -12.376077651977539, "global_step": 437120, "epoch": 2601} {"train_loss": -11.807347297668457, "global_step": 437121, "epoch": 2601} {"train_loss": -12.277105331420898, "global_step": 437122, "epoch": 2601} {"train_loss": -12.163341522216797, "global_step": 437123, "epoch": 2601} {"train_loss": -12.241154670715332, "global_step": 437124, "epoch": 2601} {"train_loss": -12.21048355102539, "global_step": 437125, "epoch": 2601} {"train_loss": -12.259971618652344, "global_step": 437126, "epoch": 2601} {"train_loss": -12.216341972351074, "global_step": 437127, "epoch": 2601} {"train_loss": -12.223791122436523, "global_step": 437128, "epoch": 2601} {"train_loss": -12.368972778320312, "global_step": 437129, "epoch": 2601} {"train_loss": -12.037799835205078, "global_step": 437130, "epoch": 2601} {"train_loss": -12.257795333862305, "global_step": 437131, "epoch": 2601} {"train_loss": -12.43590259552002, "global_step": 437132, "epoch": 2601} {"train_loss": -12.162778854370117, "global_step": 437133, "epoch": 2601} {"train_loss": -12.311634063720703, "global_step": 437134, "epoch": 2601} {"train_loss": -11.467397712525868, "global_step": 437135, "epoch": 2601, "val_loss": 317216.84375} {"train_loss": -12.392242431640625, "global_step": 437136, "epoch": 2602} {"train_loss": -12.435046195983887, "global_step": 437137, "epoch": 2602} {"train_loss": -12.605212211608887, "global_step": 437138, "epoch": 2602} {"train_loss": -12.545232772827148, "global_step": 437139, "epoch": 2602} {"train_loss": -12.499883651733398, "global_step": 437140, "epoch": 2602} {"train_loss": -12.41745662689209, "global_step": 437141, "epoch": 2602} {"train_loss": -12.574995994567871, "global_step": 437142, "epoch": 2602} {"train_loss": -12.579069137573242, "global_step": 437143, "epoch": 2602} {"train_loss": -12.567509651184082, "global_step": 437144, "epoch": 2602} {"train_loss": -12.439227104187012, "global_step": 437145, "epoch": 2602} {"train_loss": -12.464570999145508, "global_step": 437146, "epoch": 2602} {"train_loss": -12.494892120361328, "global_step": 437147, "epoch": 2602} {"train_loss": -12.560738563537598, "global_step": 437148, "epoch": 2602} {"train_loss": -12.581775665283203, "global_step": 437149, "epoch": 2602} {"train_loss": -12.491296768188477, "global_step": 437150, "epoch": 2602} {"train_loss": -12.534801483154297, "global_step": 437151, "epoch": 2602} {"train_loss": -12.488638877868652, "global_step": 437152, "epoch": 2602} {"train_loss": -12.089550018310547, "global_step": 437153, "epoch": 2602} {"train_loss": -12.392410278320312, "global_step": 437154, "epoch": 2602} {"train_loss": -12.138152122497559, "global_step": 437155, "epoch": 2602} {"train_loss": -12.359612464904785, "global_step": 437156, "epoch": 2602} {"train_loss": -12.34847640991211, "global_step": 437157, "epoch": 2602} {"train_loss": -12.386180877685547, "global_step": 437158, "epoch": 2602} {"train_loss": -12.660154342651367, "global_step": 437159, "epoch": 2602} {"train_loss": -12.415557861328125, "global_step": 437160, "epoch": 2602} {"train_loss": -12.607736587524414, "global_step": 437161, "epoch": 2602} {"train_loss": -12.626001358032227, "global_step": 437162, "epoch": 2602} {"train_loss": -12.570409774780273, "global_step": 437163, "epoch": 2602} {"train_loss": -12.612150192260742, "global_step": 437164, "epoch": 2602} {"train_loss": -12.424277305603027, "global_step": 437165, "epoch": 2602} {"train_loss": -12.506780624389648, "global_step": 437166, "epoch": 2602} {"train_loss": -12.796870231628418, "global_step": 437167, "epoch": 2602} {"train_loss": -12.76307487487793, "global_step": 437168, "epoch": 2602} {"train_loss": -12.652705192565918, "global_step": 437169, "epoch": 2602} {"train_loss": -12.83700180053711, "global_step": 437170, "epoch": 2602} {"train_loss": -12.52277660369873, "global_step": 437171, "epoch": 2602} {"train_loss": -13.012246131896973, "global_step": 437172, "epoch": 2602} {"train_loss": -12.467611312866211, "global_step": 437173, "epoch": 2602} {"train_loss": -12.900070190429688, "global_step": 437174, "epoch": 2602} {"train_loss": -12.532631874084473, "global_step": 437175, "epoch": 2602} {"train_loss": -12.759512901306152, "global_step": 437176, "epoch": 2602} {"train_loss": -12.504552841186523, "global_step": 437177, "epoch": 2602} {"train_loss": -12.696834564208984, "global_step": 437178, "epoch": 2602} {"train_loss": -12.637798309326172, "global_step": 437179, "epoch": 2602} {"train_loss": -12.629499435424805, "global_step": 437180, "epoch": 2602} {"train_loss": -12.766271591186523, "global_step": 437181, "epoch": 2602} {"train_loss": -12.937668800354004, "global_step": 437182, "epoch": 2602} {"train_loss": -12.831320762634277, "global_step": 437183, "epoch": 2602} {"train_loss": -12.746883392333984, "global_step": 437184, "epoch": 2602} {"train_loss": -12.842303276062012, "global_step": 437185, "epoch": 2602} {"train_loss": -12.734634399414062, "global_step": 437186, "epoch": 2602} {"train_loss": -12.662393569946289, "global_step": 437187, "epoch": 2602} {"train_loss": -12.964302062988281, "global_step": 437188, "epoch": 2602} {"train_loss": -12.366634368896484, "global_step": 437189, "epoch": 2602} {"train_loss": -12.495735168457031, "global_step": 437190, "epoch": 2602} {"train_loss": -12.65822982788086, "global_step": 437191, "epoch": 2602} {"train_loss": -12.31505012512207, "global_step": 437192, "epoch": 2602} {"train_loss": -12.725467681884766, "global_step": 437193, "epoch": 2602} {"train_loss": -12.628342628479004, "global_step": 437194, "epoch": 2602} {"train_loss": -12.304317474365234, "global_step": 437195, "epoch": 2602} {"train_loss": -12.75039291381836, "global_step": 437196, "epoch": 2602} {"train_loss": -12.648272514343262, "global_step": 437197, "epoch": 2602} {"train_loss": -12.51594066619873, "global_step": 437198, "epoch": 2602} {"train_loss": -12.498527526855469, "global_step": 437199, "epoch": 2602} {"train_loss": -12.532751083374023, "global_step": 437200, "epoch": 2602} {"train_loss": -12.808846473693848, "global_step": 437201, "epoch": 2602} {"train_loss": -12.299542427062988, "global_step": 437202, "epoch": 2602} {"train_loss": -11.850412368774414, "global_step": 437203, "epoch": 2602} {"train_loss": -12.615790367126465, "global_step": 437204, "epoch": 2602} {"train_loss": -12.482465744018555, "global_step": 437205, "epoch": 2602} {"train_loss": -12.578765869140625, "global_step": 437206, "epoch": 2602} {"train_loss": -12.296815872192383, "global_step": 437207, "epoch": 2602} {"train_loss": -12.41281509399414, "global_step": 437208, "epoch": 2602} {"train_loss": -12.538966178894043, "global_step": 437209, "epoch": 2602} {"train_loss": -12.63082504272461, "global_step": 437210, "epoch": 2602} {"train_loss": -12.535265922546387, "global_step": 437211, "epoch": 2602} {"train_loss": -12.512422561645508, "global_step": 437212, "epoch": 2602} {"train_loss": -12.846780776977539, "global_step": 437213, "epoch": 2602} {"train_loss": -12.757412910461426, "global_step": 437214, "epoch": 2602} {"train_loss": -12.759082794189453, "global_step": 437215, "epoch": 2602} {"train_loss": -12.668222427368164, "global_step": 437216, "epoch": 2602} {"train_loss": -12.645569801330566, "global_step": 437217, "epoch": 2602} {"train_loss": -12.786935806274414, "global_step": 437218, "epoch": 2602} {"train_loss": -12.211057662963867, "global_step": 437219, "epoch": 2602} {"train_loss": -11.844513893127441, "global_step": 437220, "epoch": 2602} {"train_loss": -11.922632217407227, "global_step": 437221, "epoch": 2602} {"train_loss": -12.552833557128906, "global_step": 437222, "epoch": 2602} {"train_loss": -12.102804183959961, "global_step": 437223, "epoch": 2602} {"train_loss": -11.20910930633545, "global_step": 437224, "epoch": 2602} {"train_loss": -12.208292961120605, "global_step": 437225, "epoch": 2602} {"train_loss": -12.438129425048828, "global_step": 437226, "epoch": 2602} {"train_loss": -11.708438873291016, "global_step": 437227, "epoch": 2602} {"train_loss": -11.014982223510742, "global_step": 437228, "epoch": 2602} {"train_loss": -10.98560905456543, "global_step": 437229, "epoch": 2602} {"train_loss": -11.508966445922852, "global_step": 437230, "epoch": 2602} {"train_loss": -12.245399475097656, "global_step": 437231, "epoch": 2602} {"train_loss": -10.627691268920898, "global_step": 437232, "epoch": 2602} {"train_loss": -11.864006042480469, "global_step": 437233, "epoch": 2602} {"train_loss": -11.700316429138184, "global_step": 437234, "epoch": 2602} {"train_loss": -11.624000549316406, "global_step": 437235, "epoch": 2602} {"train_loss": -11.185901641845703, "global_step": 437236, "epoch": 2602} {"train_loss": -11.569918632507324, "global_step": 437237, "epoch": 2602} {"train_loss": -11.686732292175293, "global_step": 437238, "epoch": 2602} {"train_loss": -12.192342758178711, "global_step": 437239, "epoch": 2602} {"train_loss": -12.14225959777832, "global_step": 437240, "epoch": 2602} {"train_loss": -11.202827453613281, "global_step": 437241, "epoch": 2602} {"train_loss": -12.462265968322754, "global_step": 437242, "epoch": 2602} {"train_loss": -10.793025016784668, "global_step": 437243, "epoch": 2602} {"train_loss": -11.544685363769531, "global_step": 437244, "epoch": 2602} {"train_loss": -10.756522178649902, "global_step": 437245, "epoch": 2602} {"train_loss": -12.127119064331055, "global_step": 437246, "epoch": 2602} {"train_loss": -10.37163257598877, "global_step": 437247, "epoch": 2602} {"train_loss": -11.632794380187988, "global_step": 437248, "epoch": 2602} {"train_loss": -11.355022430419922, "global_step": 437249, "epoch": 2602} {"train_loss": -10.75603199005127, "global_step": 437250, "epoch": 2602} {"train_loss": -11.734964370727539, "global_step": 437251, "epoch": 2602} {"train_loss": -10.604487419128418, "global_step": 437252, "epoch": 2602} {"train_loss": -11.125537872314453, "global_step": 437253, "epoch": 2602} {"train_loss": -11.657381057739258, "global_step": 437254, "epoch": 2602} {"train_loss": -11.722511291503906, "global_step": 437255, "epoch": 2602} {"train_loss": -11.239973068237305, "global_step": 437256, "epoch": 2602} {"train_loss": -11.57523250579834, "global_step": 437257, "epoch": 2602} {"train_loss": -11.105751991271973, "global_step": 437258, "epoch": 2602} {"train_loss": -11.845489501953125, "global_step": 437259, "epoch": 2602} {"train_loss": -11.22047233581543, "global_step": 437260, "epoch": 2602} {"train_loss": -11.875236511230469, "global_step": 437261, "epoch": 2602} {"train_loss": -12.056242942810059, "global_step": 437262, "epoch": 2602} {"train_loss": -11.280903816223145, "global_step": 437263, "epoch": 2602} {"train_loss": -12.30164909362793, "global_step": 437264, "epoch": 2602} {"train_loss": -11.62421989440918, "global_step": 437265, "epoch": 2602} {"train_loss": -11.831886291503906, "global_step": 437266, "epoch": 2602} {"train_loss": -12.178987503051758, "global_step": 437267, "epoch": 2602} {"train_loss": -11.54864501953125, "global_step": 437268, "epoch": 2602} {"train_loss": -12.31093978881836, "global_step": 437269, "epoch": 2602} {"train_loss": -12.154298782348633, "global_step": 437270, "epoch": 2602} {"train_loss": -12.384101867675781, "global_step": 437271, "epoch": 2602} {"train_loss": -12.418725967407227, "global_step": 437272, "epoch": 2602} {"train_loss": -12.109291076660156, "global_step": 437273, "epoch": 2602} {"train_loss": -12.382644653320312, "global_step": 437274, "epoch": 2602} {"train_loss": -12.060198783874512, "global_step": 437275, "epoch": 2602} {"train_loss": -12.259748458862305, "global_step": 437276, "epoch": 2602} {"train_loss": -12.25881290435791, "global_step": 437277, "epoch": 2602} {"train_loss": -12.031293869018555, "global_step": 437278, "epoch": 2602} {"train_loss": -12.378335952758789, "global_step": 437279, "epoch": 2602} {"train_loss": -12.358236312866211, "global_step": 437280, "epoch": 2602} {"train_loss": -12.501964569091797, "global_step": 437281, "epoch": 2602} {"train_loss": -12.526180267333984, "global_step": 437282, "epoch": 2602} {"train_loss": -12.437483787536621, "global_step": 437283, "epoch": 2602} {"train_loss": -12.365994453430176, "global_step": 437284, "epoch": 2602} {"train_loss": -12.523597717285156, "global_step": 437285, "epoch": 2602} {"train_loss": -12.165323257446289, "global_step": 437286, "epoch": 2602} {"train_loss": -12.362081527709961, "global_step": 437287, "epoch": 2602} {"train_loss": -12.411137580871582, "global_step": 437288, "epoch": 2602} {"train_loss": -12.374406814575195, "global_step": 437289, "epoch": 2602} {"train_loss": -12.270893096923828, "global_step": 437290, "epoch": 2602} {"train_loss": -12.589300155639648, "global_step": 437291, "epoch": 2602} {"train_loss": -12.399690628051758, "global_step": 437292, "epoch": 2602} {"train_loss": -12.551986694335938, "global_step": 437293, "epoch": 2602} {"train_loss": -12.666818618774414, "global_step": 437294, "epoch": 2602} {"train_loss": -12.657448768615723, "global_step": 437295, "epoch": 2602} {"train_loss": -12.535431861877441, "global_step": 437296, "epoch": 2602} {"train_loss": -12.339518547058105, "global_step": 437297, "epoch": 2602} {"train_loss": -12.60972785949707, "global_step": 437298, "epoch": 2602} {"train_loss": -12.477469444274902, "global_step": 437299, "epoch": 2602} {"train_loss": -12.264019966125488, "global_step": 437300, "epoch": 2602} {"train_loss": -12.39625358581543, "global_step": 437301, "epoch": 2602} {"train_loss": -12.409209251403809, "global_step": 437302, "epoch": 2602} {"train_loss": -12.243871098472958, "global_step": 437303, "epoch": 2602, "val_loss": 313167.0625} {"train_loss": -12.019693374633789, "global_step": 437304, "epoch": 2603} {"train_loss": -12.573530197143555, "global_step": 437305, "epoch": 2603} {"train_loss": -12.059009552001953, "global_step": 437306, "epoch": 2603} {"train_loss": -12.611967086791992, "global_step": 437307, "epoch": 2603} {"train_loss": -11.976093292236328, "global_step": 437308, "epoch": 2603} {"train_loss": -12.165044784545898, "global_step": 437309, "epoch": 2603} {"train_loss": -12.599908828735352, "global_step": 437310, "epoch": 2603} {"train_loss": -12.15670394897461, "global_step": 437311, "epoch": 2603} {"train_loss": -12.461610794067383, "global_step": 437312, "epoch": 2603} {"train_loss": -12.379910469055176, "global_step": 437313, "epoch": 2603} {"train_loss": -12.667134284973145, "global_step": 437314, "epoch": 2603} {"train_loss": -12.281167984008789, "global_step": 437315, "epoch": 2603} {"train_loss": -12.616947174072266, "global_step": 437316, "epoch": 2603} {"train_loss": -12.379863739013672, "global_step": 437317, "epoch": 2603} {"train_loss": -12.400188446044922, "global_step": 437318, "epoch": 2603} {"train_loss": -12.155601501464844, "global_step": 437319, "epoch": 2603} {"train_loss": -12.490989685058594, "global_step": 437320, "epoch": 2603} {"train_loss": -12.38896369934082, "global_step": 437321, "epoch": 2603} {"train_loss": -11.9453706741333, "global_step": 437322, "epoch": 2603} {"train_loss": -12.399758338928223, "global_step": 437323, "epoch": 2603} {"train_loss": -12.378955841064453, "global_step": 437324, "epoch": 2603} {"train_loss": -12.258197784423828, "global_step": 437325, "epoch": 2603} {"train_loss": -12.314767837524414, "global_step": 437326, "epoch": 2603} {"train_loss": -12.409843444824219, "global_step": 437327, "epoch": 2603} {"train_loss": -12.678400039672852, "global_step": 437328, "epoch": 2603} {"train_loss": -12.213436126708984, "global_step": 437329, "epoch": 2603} {"train_loss": -11.723477363586426, "global_step": 437330, "epoch": 2603} {"train_loss": -12.640119552612305, "global_step": 437331, "epoch": 2603} {"train_loss": -11.654730796813965, "global_step": 437332, "epoch": 2603} {"train_loss": -11.886537551879883, "global_step": 437333, "epoch": 2603} {"train_loss": -12.139958381652832, "global_step": 437334, "epoch": 2603} {"train_loss": -12.521783828735352, "global_step": 437335, "epoch": 2603} {"train_loss": -11.98748779296875, "global_step": 437336, "epoch": 2603} {"train_loss": -11.416125297546387, "global_step": 437337, "epoch": 2603} {"train_loss": -11.80827522277832, "global_step": 437338, "epoch": 2603} {"train_loss": -11.590841293334961, "global_step": 437339, "epoch": 2603} {"train_loss": -11.850837707519531, "global_step": 437340, "epoch": 2603} {"train_loss": -11.829305648803711, "global_step": 437341, "epoch": 2603} {"train_loss": -12.206647872924805, "global_step": 437342, "epoch": 2603} {"train_loss": -11.604325294494629, "global_step": 437343, "epoch": 2603} {"train_loss": -12.25322151184082, "global_step": 437344, "epoch": 2603} {"train_loss": -12.007843971252441, "global_step": 437345, "epoch": 2603} {"train_loss": -12.03923225402832, "global_step": 437346, "epoch": 2603} {"train_loss": -11.89300537109375, "global_step": 437347, "epoch": 2603} {"train_loss": -10.9153413772583, "global_step": 437348, "epoch": 2603} {"train_loss": -11.998408317565918, "global_step": 437349, "epoch": 2603} {"train_loss": -12.461973190307617, "global_step": 437350, "epoch": 2603} {"train_loss": -11.773536682128906, "global_step": 437351, "epoch": 2603} {"train_loss": -12.571598052978516, "global_step": 437352, "epoch": 2603} {"train_loss": -11.551253318786621, "global_step": 437353, "epoch": 2603} {"train_loss": -12.158581733703613, "global_step": 437354, "epoch": 2603} {"train_loss": -12.202215194702148, "global_step": 437355, "epoch": 2603} {"train_loss": -11.879898071289062, "global_step": 437356, "epoch": 2603} {"train_loss": -12.4332914352417, "global_step": 437357, "epoch": 2603} {"train_loss": -12.4410982131958, "global_step": 437358, "epoch": 2603} {"train_loss": -12.572563171386719, "global_step": 437359, "epoch": 2603} {"train_loss": -12.007230758666992, "global_step": 437360, "epoch": 2603} {"train_loss": -12.489154815673828, "global_step": 437361, "epoch": 2603} {"train_loss": -12.303567886352539, "global_step": 437362, "epoch": 2603} {"train_loss": -12.65060806274414, "global_step": 437363, "epoch": 2603} {"train_loss": -12.588964462280273, "global_step": 437364, "epoch": 2603} {"train_loss": -12.501032829284668, "global_step": 437365, "epoch": 2603} {"train_loss": -12.591409683227539, "global_step": 437366, "epoch": 2603} {"train_loss": -12.419305801391602, "global_step": 437367, "epoch": 2603} {"train_loss": -12.869680404663086, "global_step": 437368, "epoch": 2603} {"train_loss": -12.5943603515625, "global_step": 437369, "epoch": 2603} {"train_loss": -12.751849174499512, "global_step": 437370, "epoch": 2603} {"train_loss": -12.571231842041016, "global_step": 437371, "epoch": 2603} {"train_loss": -12.816473007202148, "global_step": 437372, "epoch": 2603} {"train_loss": -12.522565841674805, "global_step": 437373, "epoch": 2603} {"train_loss": -12.610759735107422, "global_step": 437374, "epoch": 2603} {"train_loss": -12.747812271118164, "global_step": 437375, "epoch": 2603} {"train_loss": -12.694872856140137, "global_step": 437376, "epoch": 2603} {"train_loss": -12.639374732971191, "global_step": 437377, "epoch": 2603} {"train_loss": -12.526844024658203, "global_step": 437378, "epoch": 2603} {"train_loss": -12.263076782226562, "global_step": 437379, "epoch": 2603} {"train_loss": -12.497579574584961, "global_step": 437380, "epoch": 2603} {"train_loss": -11.975675582885742, "global_step": 437381, "epoch": 2603} {"train_loss": -12.572919845581055, "global_step": 437382, "epoch": 2603} {"train_loss": -12.614084243774414, "global_step": 437383, "epoch": 2603} {"train_loss": -11.884450912475586, "global_step": 437384, "epoch": 2603} {"train_loss": -11.04804515838623, "global_step": 437385, "epoch": 2603} {"train_loss": -11.9185209274292, "global_step": 437386, "epoch": 2603} {"train_loss": -10.988676071166992, "global_step": 437387, "epoch": 2603} {"train_loss": -10.683236122131348, "global_step": 437388, "epoch": 2603} {"train_loss": -10.487764358520508, "global_step": 437389, "epoch": 2603} {"train_loss": -10.144716262817383, "global_step": 437390, "epoch": 2603} {"train_loss": -10.555469512939453, "global_step": 437391, "epoch": 2603} {"train_loss": -8.380645751953125, "global_step": 437392, "epoch": 2603} {"train_loss": -7.740257263183594, "global_step": 437393, "epoch": 2603} {"train_loss": -8.135738372802734, "global_step": 437394, "epoch": 2603} {"train_loss": -8.427831649780273, "global_step": 437395, "epoch": 2603} {"train_loss": -8.55953598022461, "global_step": 437396, "epoch": 2603} {"train_loss": -8.921102523803711, "global_step": 437397, "epoch": 2603} {"train_loss": -8.290172576904297, "global_step": 437398, "epoch": 2603} {"train_loss": -9.397039413452148, "global_step": 437399, "epoch": 2603} {"train_loss": -9.019601821899414, "global_step": 437400, "epoch": 2603} {"train_loss": -8.71011734008789, "global_step": 437401, "epoch": 2603} {"train_loss": -10.009078979492188, "global_step": 437402, "epoch": 2603} {"train_loss": -9.754068374633789, "global_step": 437403, "epoch": 2603} {"train_loss": -11.046079635620117, "global_step": 437404, "epoch": 2603} {"train_loss": -10.87041187286377, "global_step": 437405, "epoch": 2603} {"train_loss": -11.344182014465332, "global_step": 437406, "epoch": 2603} {"train_loss": -11.245452880859375, "global_step": 437407, "epoch": 2603} {"train_loss": -10.981074333190918, "global_step": 437408, "epoch": 2603} {"train_loss": -11.768206596374512, "global_step": 437409, "epoch": 2603} {"train_loss": -11.222694396972656, "global_step": 437410, "epoch": 2603} {"train_loss": -11.25360107421875, "global_step": 437411, "epoch": 2603} {"train_loss": -11.249393463134766, "global_step": 437412, "epoch": 2603} {"train_loss": -11.27684211730957, "global_step": 437413, "epoch": 2603} {"train_loss": -11.931777000427246, "global_step": 437414, "epoch": 2603} {"train_loss": -11.687938690185547, "global_step": 437415, "epoch": 2603} {"train_loss": -12.077333450317383, "global_step": 437416, "epoch": 2603} {"train_loss": -11.309812545776367, "global_step": 437417, "epoch": 2603} {"train_loss": -11.574481964111328, "global_step": 437418, "epoch": 2603} {"train_loss": -12.139168739318848, "global_step": 437419, "epoch": 2603} {"train_loss": -12.006002426147461, "global_step": 437420, "epoch": 2603} {"train_loss": -12.044864654541016, "global_step": 437421, "epoch": 2603} {"train_loss": -12.248881340026855, "global_step": 437422, "epoch": 2603} {"train_loss": -11.885380744934082, "global_step": 437423, "epoch": 2603} {"train_loss": -12.025390625, "global_step": 437424, "epoch": 2603} {"train_loss": -12.292025566101074, "global_step": 437425, "epoch": 2603} {"train_loss": -12.34180736541748, "global_step": 437426, "epoch": 2603} {"train_loss": -12.370790481567383, "global_step": 437427, "epoch": 2603} {"train_loss": -12.09339714050293, "global_step": 437428, "epoch": 2603} {"train_loss": -12.305831909179688, "global_step": 437429, "epoch": 2603} {"train_loss": -12.437877655029297, "global_step": 437430, "epoch": 2603} {"train_loss": -12.2540864944458, "global_step": 437431, "epoch": 2603} {"train_loss": -12.183769226074219, "global_step": 437432, "epoch": 2603} {"train_loss": -12.309368133544922, "global_step": 437433, "epoch": 2603} {"train_loss": -12.392549514770508, "global_step": 437434, "epoch": 2603} {"train_loss": -12.187317848205566, "global_step": 437435, "epoch": 2603} {"train_loss": -12.365058898925781, "global_step": 437436, "epoch": 2603} {"train_loss": -12.166499137878418, "global_step": 437437, "epoch": 2603} {"train_loss": -12.662221908569336, "global_step": 437438, "epoch": 2603} {"train_loss": -12.1840181350708, "global_step": 437439, "epoch": 2603} {"train_loss": -12.483182907104492, "global_step": 437440, "epoch": 2603} {"train_loss": -12.49468994140625, "global_step": 437441, "epoch": 2603} {"train_loss": -12.43918228149414, "global_step": 437442, "epoch": 2603} {"train_loss": -12.201150894165039, "global_step": 437443, "epoch": 2603} {"train_loss": -12.527969360351562, "global_step": 437444, "epoch": 2603} {"train_loss": -11.987482070922852, "global_step": 437445, "epoch": 2603} {"train_loss": -12.216245651245117, "global_step": 437446, "epoch": 2603} {"train_loss": -12.147568702697754, "global_step": 437447, "epoch": 2603} {"train_loss": -12.291141510009766, "global_step": 437448, "epoch": 2603} {"train_loss": -12.473040580749512, "global_step": 437449, "epoch": 2603} {"train_loss": -12.375240325927734, "global_step": 437450, "epoch": 2603} {"train_loss": -11.500248908996582, "global_step": 437451, "epoch": 2603} {"train_loss": -12.564369201660156, "global_step": 437452, "epoch": 2603} {"train_loss": -12.368574142456055, "global_step": 437453, "epoch": 2603} {"train_loss": -9.452853202819824, "global_step": 437454, "epoch": 2603} {"train_loss": -12.659887313842773, "global_step": 437455, "epoch": 2603} {"train_loss": -12.131071090698242, "global_step": 437456, "epoch": 2603} {"train_loss": -12.125754356384277, "global_step": 437457, "epoch": 2603} {"train_loss": -12.154510498046875, "global_step": 437458, "epoch": 2603} {"train_loss": -11.985847473144531, "global_step": 437459, "epoch": 2603} {"train_loss": -11.921892166137695, "global_step": 437460, "epoch": 2603} {"train_loss": -12.244641304016113, "global_step": 437461, "epoch": 2603} {"train_loss": -12.063430786132812, "global_step": 437462, "epoch": 2603} {"train_loss": -12.172050476074219, "global_step": 437463, "epoch": 2603} {"train_loss": -12.580021858215332, "global_step": 437464, "epoch": 2603} {"train_loss": -12.24019718170166, "global_step": 437465, "epoch": 2603} {"train_loss": -12.221567153930664, "global_step": 437466, "epoch": 2603} {"train_loss": -12.28924560546875, "global_step": 437467, "epoch": 2603} {"train_loss": -12.115985870361328, "global_step": 437468, "epoch": 2603} {"train_loss": -12.4075927734375, "global_step": 437469, "epoch": 2603} {"train_loss": -12.272262573242188, "global_step": 437470, "epoch": 2603} {"train_loss": -11.856872484797524, "global_step": 437471, "epoch": 2603, "val_loss": 310197.78125} {"train_loss": -12.286103248596191, "global_step": 437472, "epoch": 2604} {"train_loss": -12.34700870513916, "global_step": 437473, "epoch": 2604} {"train_loss": -11.515581130981445, "global_step": 437474, "epoch": 2604} {"train_loss": -12.214607238769531, "global_step": 437475, "epoch": 2604} {"train_loss": -12.371895790100098, "global_step": 437476, "epoch": 2604} {"train_loss": -12.494972229003906, "global_step": 437477, "epoch": 2604} {"train_loss": -12.414911270141602, "global_step": 437478, "epoch": 2604} {"train_loss": -12.429800987243652, "global_step": 437479, "epoch": 2604} {"train_loss": -12.36900520324707, "global_step": 437480, "epoch": 2604} {"train_loss": -12.301008224487305, "global_step": 437481, "epoch": 2604} {"train_loss": -12.001632690429688, "global_step": 437482, "epoch": 2604} {"train_loss": -12.689994812011719, "global_step": 437483, "epoch": 2604} {"train_loss": -12.020391464233398, "global_step": 437484, "epoch": 2604} {"train_loss": -12.70045280456543, "global_step": 437485, "epoch": 2604} {"train_loss": -12.35038948059082, "global_step": 437486, "epoch": 2604} {"train_loss": -12.496688842773438, "global_step": 437487, "epoch": 2604} {"train_loss": -12.368389129638672, "global_step": 437488, "epoch": 2604} {"train_loss": -12.588040351867676, "global_step": 437489, "epoch": 2604} {"train_loss": -12.488204956054688, "global_step": 437490, "epoch": 2604} {"train_loss": -12.214519500732422, "global_step": 437491, "epoch": 2604} {"train_loss": -12.557796478271484, "global_step": 437492, "epoch": 2604} {"train_loss": -12.70162582397461, "global_step": 437493, "epoch": 2604} {"train_loss": -12.572081565856934, "global_step": 437494, "epoch": 2604} {"train_loss": -12.224483489990234, "global_step": 437495, "epoch": 2604} {"train_loss": -12.810720443725586, "global_step": 437496, "epoch": 2604} {"train_loss": -12.800590515136719, "global_step": 437497, "epoch": 2604} {"train_loss": -12.816879272460938, "global_step": 437498, "epoch": 2604} {"train_loss": -12.66995620727539, "global_step": 437499, "epoch": 2604} {"train_loss": -12.633756637573242, "global_step": 437500, "epoch": 2604} {"train_loss": -12.40296745300293, "global_step": 437501, "epoch": 2604} {"train_loss": -12.556785583496094, "global_step": 437502, "epoch": 2604} {"train_loss": -12.622504234313965, "global_step": 437503, "epoch": 2604} {"train_loss": -12.734663009643555, "global_step": 437504, "epoch": 2604} {"train_loss": -12.641777038574219, "global_step": 437505, "epoch": 2604} {"train_loss": -12.517873764038086, "global_step": 437506, "epoch": 2604} {"train_loss": -12.405614852905273, "global_step": 437507, "epoch": 2604} {"train_loss": -12.508218765258789, "global_step": 437508, "epoch": 2604} {"train_loss": -12.414653778076172, "global_step": 437509, "epoch": 2604} {"train_loss": -12.496088981628418, "global_step": 437510, "epoch": 2604} {"train_loss": -12.385701179504395, "global_step": 437511, "epoch": 2604} {"train_loss": -12.318411827087402, "global_step": 437512, "epoch": 2604} {"train_loss": -12.3361177444458, "global_step": 437513, "epoch": 2604} {"train_loss": -12.386536598205566, "global_step": 437514, "epoch": 2604} {"train_loss": -12.705689430236816, "global_step": 437515, "epoch": 2604} {"train_loss": -12.723037719726562, "global_step": 437516, "epoch": 2604} {"train_loss": -12.456478118896484, "global_step": 437517, "epoch": 2604} {"train_loss": -12.589612007141113, "global_step": 437518, "epoch": 2604} {"train_loss": -12.779106140136719, "global_step": 437519, "epoch": 2604} {"train_loss": -12.035642623901367, "global_step": 437520, "epoch": 2604} {"train_loss": -12.451944351196289, "global_step": 437521, "epoch": 2604} {"train_loss": -12.483807563781738, "global_step": 437522, "epoch": 2604} {"train_loss": -12.112285614013672, "global_step": 437523, "epoch": 2604} {"train_loss": -12.24203109741211, "global_step": 437524, "epoch": 2604} {"train_loss": -12.459232330322266, "global_step": 437525, "epoch": 2604} {"train_loss": -12.262337684631348, "global_step": 437526, "epoch": 2604} {"train_loss": -11.72739315032959, "global_step": 437527, "epoch": 2604} {"train_loss": -12.468920707702637, "global_step": 437528, "epoch": 2604} {"train_loss": -12.178215980529785, "global_step": 437529, "epoch": 2604} {"train_loss": -12.48762321472168, "global_step": 437530, "epoch": 2604} {"train_loss": -12.341157913208008, "global_step": 437531, "epoch": 2604} {"train_loss": -12.494709968566895, "global_step": 437532, "epoch": 2604} {"train_loss": -11.54690170288086, "global_step": 437533, "epoch": 2604} {"train_loss": -10.500402450561523, "global_step": 437534, "epoch": 2604} {"train_loss": -12.349678039550781, "global_step": 437535, "epoch": 2604} {"train_loss": -11.691760063171387, "global_step": 437536, "epoch": 2604} {"train_loss": -11.718931198120117, "global_step": 437537, "epoch": 2604} {"train_loss": -11.136055946350098, "global_step": 437538, "epoch": 2604} {"train_loss": -10.98751449584961, "global_step": 437539, "epoch": 2604} {"train_loss": -10.798382759094238, "global_step": 437540, "epoch": 2604} {"train_loss": -11.40268325805664, "global_step": 437541, "epoch": 2604} {"train_loss": -11.08369255065918, "global_step": 437542, "epoch": 2604} {"train_loss": -9.549964904785156, "global_step": 437543, "epoch": 2604} {"train_loss": -10.146577835083008, "global_step": 437544, "epoch": 2604} {"train_loss": -10.621788024902344, "global_step": 437545, "epoch": 2604} {"train_loss": -9.706868171691895, "global_step": 437546, "epoch": 2604} {"train_loss": -8.698469161987305, "global_step": 437547, "epoch": 2604} {"train_loss": -9.249093055725098, "global_step": 437548, "epoch": 2604} {"train_loss": -10.394920349121094, "global_step": 437549, "epoch": 2604} {"train_loss": -9.656789779663086, "global_step": 437550, "epoch": 2604} {"train_loss": -9.60285472869873, "global_step": 437551, "epoch": 2604} {"train_loss": -8.79547119140625, "global_step": 437552, "epoch": 2604} {"train_loss": -9.395596504211426, "global_step": 437553, "epoch": 2604} {"train_loss": -10.187399864196777, "global_step": 437554, "epoch": 2604} {"train_loss": -9.224870681762695, "global_step": 437555, "epoch": 2604} {"train_loss": -10.260970115661621, "global_step": 437556, "epoch": 2604} {"train_loss": -10.957592010498047, "global_step": 437557, "epoch": 2604} {"train_loss": -10.905780792236328, "global_step": 437558, "epoch": 2604} {"train_loss": -10.819615364074707, "global_step": 437559, "epoch": 2604} {"train_loss": -11.214052200317383, "global_step": 437560, "epoch": 2604} {"train_loss": -10.496732711791992, "global_step": 437561, "epoch": 2604} {"train_loss": -10.969627380371094, "global_step": 437562, "epoch": 2604} {"train_loss": -11.053558349609375, "global_step": 437563, "epoch": 2604} {"train_loss": -10.125411033630371, "global_step": 437564, "epoch": 2604} {"train_loss": -11.433961868286133, "global_step": 437565, "epoch": 2604} {"train_loss": -11.298112869262695, "global_step": 437566, "epoch": 2604} {"train_loss": -11.471632957458496, "global_step": 437567, "epoch": 2604} {"train_loss": -11.183876037597656, "global_step": 437568, "epoch": 2604} {"train_loss": -11.286930084228516, "global_step": 437569, "epoch": 2604} {"train_loss": -11.510156631469727, "global_step": 437570, "epoch": 2604} {"train_loss": -11.317037582397461, "global_step": 437571, "epoch": 2604} {"train_loss": -11.638158798217773, "global_step": 437572, "epoch": 2604} {"train_loss": -11.48785400390625, "global_step": 437573, "epoch": 2604} {"train_loss": -11.35437297821045, "global_step": 437574, "epoch": 2604} {"train_loss": -11.590197563171387, "global_step": 437575, "epoch": 2604} {"train_loss": -11.597622871398926, "global_step": 437576, "epoch": 2604} {"train_loss": -11.203184127807617, "global_step": 437577, "epoch": 2604} {"train_loss": -11.551691055297852, "global_step": 437578, "epoch": 2604} {"train_loss": -11.709952354431152, "global_step": 437579, "epoch": 2604} {"train_loss": -11.611774444580078, "global_step": 437580, "epoch": 2604} {"train_loss": -11.758831977844238, "global_step": 437581, "epoch": 2604} {"train_loss": -11.413385391235352, "global_step": 437582, "epoch": 2604} {"train_loss": -12.036542892456055, "global_step": 437583, "epoch": 2604} {"train_loss": -11.74547290802002, "global_step": 437584, "epoch": 2604} {"train_loss": -11.966596603393555, "global_step": 437585, "epoch": 2604} {"train_loss": -11.853572845458984, "global_step": 437586, "epoch": 2604} {"train_loss": -12.275005340576172, "global_step": 437587, "epoch": 2604} {"train_loss": -12.127262115478516, "global_step": 437588, "epoch": 2604} {"train_loss": -12.042850494384766, "global_step": 437589, "epoch": 2604} {"train_loss": -12.04983139038086, "global_step": 437590, "epoch": 2604} {"train_loss": -11.612503051757812, "global_step": 437591, "epoch": 2604} {"train_loss": -12.26923942565918, "global_step": 437592, "epoch": 2604} {"train_loss": -11.142786026000977, "global_step": 437593, "epoch": 2604} {"train_loss": -12.330729484558105, "global_step": 437594, "epoch": 2604} {"train_loss": -12.116636276245117, "global_step": 437595, "epoch": 2604} {"train_loss": -12.162092208862305, "global_step": 437596, "epoch": 2604} {"train_loss": -11.888548851013184, "global_step": 437597, "epoch": 2604} {"train_loss": -12.325578689575195, "global_step": 437598, "epoch": 2604} {"train_loss": -11.67706298828125, "global_step": 437599, "epoch": 2604} {"train_loss": -12.083257675170898, "global_step": 437600, "epoch": 2604} {"train_loss": -12.016204833984375, "global_step": 437601, "epoch": 2604} {"train_loss": -12.113924026489258, "global_step": 437602, "epoch": 2604} {"train_loss": -12.47559928894043, "global_step": 437603, "epoch": 2604} {"train_loss": -11.90652084350586, "global_step": 437604, "epoch": 2604} {"train_loss": -12.625748634338379, "global_step": 437605, "epoch": 2604} {"train_loss": -12.266547203063965, "global_step": 437606, "epoch": 2604} {"train_loss": -12.160968780517578, "global_step": 437607, "epoch": 2604} {"train_loss": -12.091533660888672, "global_step": 437608, "epoch": 2604} {"train_loss": -12.231888771057129, "global_step": 437609, "epoch": 2604} {"train_loss": -12.188232421875, "global_step": 437610, "epoch": 2604} {"train_loss": -12.414327621459961, "global_step": 437611, "epoch": 2604} {"train_loss": -12.536109924316406, "global_step": 437612, "epoch": 2604} {"train_loss": -12.329649925231934, "global_step": 437613, "epoch": 2604} {"train_loss": -12.243192672729492, "global_step": 437614, "epoch": 2604} {"train_loss": -12.430381774902344, "global_step": 437615, "epoch": 2604} {"train_loss": -12.168962478637695, "global_step": 437616, "epoch": 2604} {"train_loss": -12.257698059082031, "global_step": 437617, "epoch": 2604} {"train_loss": -12.193808555603027, "global_step": 437618, "epoch": 2604} {"train_loss": -12.215572357177734, "global_step": 437619, "epoch": 2604} {"train_loss": -12.620874404907227, "global_step": 437620, "epoch": 2604} {"train_loss": -12.295184135437012, "global_step": 437621, "epoch": 2604} {"train_loss": -12.340158462524414, "global_step": 437622, "epoch": 2604} {"train_loss": -12.32464599609375, "global_step": 437623, "epoch": 2604} {"train_loss": -12.647614479064941, "global_step": 437624, "epoch": 2604} {"train_loss": -12.7637939453125, "global_step": 437625, "epoch": 2604} {"train_loss": -12.503170013427734, "global_step": 437626, "epoch": 2604} {"train_loss": -12.720573425292969, "global_step": 437627, "epoch": 2604} {"train_loss": -12.440536499023438, "global_step": 437628, "epoch": 2604} {"train_loss": -12.497596740722656, "global_step": 437629, "epoch": 2604} {"train_loss": -12.568120956420898, "global_step": 437630, "epoch": 2604} {"train_loss": -12.414908409118652, "global_step": 437631, "epoch": 2604} {"train_loss": -12.584896087646484, "global_step": 437632, "epoch": 2604} {"train_loss": -12.732976913452148, "global_step": 437633, "epoch": 2604} {"train_loss": -12.568702697753906, "global_step": 437634, "epoch": 2604} {"train_loss": -12.591435432434082, "global_step": 437635, "epoch": 2604} {"train_loss": -12.744279861450195, "global_step": 437636, "epoch": 2604} {"train_loss": -12.745437622070312, "global_step": 437637, "epoch": 2604} {"train_loss": -12.731067657470703, "global_step": 437638, "epoch": 2604} {"train_loss": -11.903297492436, "global_step": 437639, "epoch": 2604, "val_loss": 309297.78125} {"train_loss": -12.734583854675293, "global_step": 437640, "epoch": 2605} {"train_loss": -12.686389923095703, "global_step": 437641, "epoch": 2605} {"train_loss": -12.643312454223633, "global_step": 437642, "epoch": 2605} {"train_loss": -12.465730667114258, "global_step": 437643, "epoch": 2605} {"train_loss": -12.731922149658203, "global_step": 437644, "epoch": 2605} {"train_loss": -12.75204849243164, "global_step": 437645, "epoch": 2605} {"train_loss": -12.476400375366211, "global_step": 437646, "epoch": 2605} {"train_loss": -12.878841400146484, "global_step": 437647, "epoch": 2605} {"train_loss": -12.64525032043457, "global_step": 437648, "epoch": 2605} {"train_loss": -12.813777923583984, "global_step": 437649, "epoch": 2605} {"train_loss": -12.80111312866211, "global_step": 437650, "epoch": 2605} {"train_loss": -13.070938110351562, "global_step": 437651, "epoch": 2605} {"train_loss": -12.475915908813477, "global_step": 437652, "epoch": 2605} {"train_loss": -12.64537239074707, "global_step": 437653, "epoch": 2605} {"train_loss": -12.834080696105957, "global_step": 437654, "epoch": 2605} {"train_loss": -12.725470542907715, "global_step": 437655, "epoch": 2605} {"train_loss": -12.780056953430176, "global_step": 437656, "epoch": 2605} {"train_loss": -12.021693229675293, "global_step": 437657, "epoch": 2605} {"train_loss": -11.440661430358887, "global_step": 437658, "epoch": 2605} {"train_loss": -12.608860969543457, "global_step": 437659, "epoch": 2605} {"train_loss": -11.005516052246094, "global_step": 437660, "epoch": 2605} {"train_loss": -10.219524383544922, "global_step": 437661, "epoch": 2605} {"train_loss": -11.268362045288086, "global_step": 437662, "epoch": 2605} {"train_loss": -10.380105018615723, "global_step": 437663, "epoch": 2605} {"train_loss": -9.9066162109375, "global_step": 437664, "epoch": 2605} {"train_loss": -8.932398796081543, "global_step": 437665, "epoch": 2605} {"train_loss": -8.650663375854492, "global_step": 437666, "epoch": 2605} {"train_loss": -8.746140480041504, "global_step": 437667, "epoch": 2605} {"train_loss": -8.831188201904297, "global_step": 437668, "epoch": 2605} {"train_loss": -9.287687301635742, "global_step": 437669, "epoch": 2605} {"train_loss": -8.828254699707031, "global_step": 437670, "epoch": 2605} {"train_loss": -9.64584732055664, "global_step": 437671, "epoch": 2605} {"train_loss": -9.448369979858398, "global_step": 437672, "epoch": 2605} {"train_loss": -9.099239349365234, "global_step": 437673, "epoch": 2605} {"train_loss": -10.040567398071289, "global_step": 437674, "epoch": 2605} {"train_loss": -9.452095985412598, "global_step": 437675, "epoch": 2605} {"train_loss": -9.794092178344727, "global_step": 437676, "epoch": 2605} {"train_loss": -9.920295715332031, "global_step": 437677, "epoch": 2605} {"train_loss": -10.216200828552246, "global_step": 437678, "epoch": 2605} {"train_loss": -10.786569595336914, "global_step": 437679, "epoch": 2605} {"train_loss": -10.350762367248535, "global_step": 437680, "epoch": 2605} {"train_loss": -10.937910079956055, "global_step": 437681, "epoch": 2605} {"train_loss": -10.863699913024902, "global_step": 437682, "epoch": 2605} {"train_loss": -11.315862655639648, "global_step": 437683, "epoch": 2605} {"train_loss": -11.167808532714844, "global_step": 437684, "epoch": 2605} {"train_loss": -11.413293838500977, "global_step": 437685, "epoch": 2605} {"train_loss": -11.661197662353516, "global_step": 437686, "epoch": 2605} {"train_loss": -11.69352912902832, "global_step": 437687, "epoch": 2605} {"train_loss": -11.655061721801758, "global_step": 437688, "epoch": 2605} {"train_loss": -11.336530685424805, "global_step": 437689, "epoch": 2605} {"train_loss": -11.796037673950195, "global_step": 437690, "epoch": 2605} {"train_loss": -11.68853759765625, "global_step": 437691, "epoch": 2605} {"train_loss": -12.030891418457031, "global_step": 437692, "epoch": 2605} {"train_loss": -11.887640953063965, "global_step": 437693, "epoch": 2605} {"train_loss": -11.623674392700195, "global_step": 437694, "epoch": 2605} {"train_loss": -11.792377471923828, "global_step": 437695, "epoch": 2605} {"train_loss": -11.978653907775879, "global_step": 437696, "epoch": 2605} {"train_loss": -11.586770057678223, "global_step": 437697, "epoch": 2605} {"train_loss": -11.856425285339355, "global_step": 437698, "epoch": 2605} {"train_loss": -11.696602821350098, "global_step": 437699, "epoch": 2605} {"train_loss": -11.99510383605957, "global_step": 437700, "epoch": 2605} {"train_loss": -11.830660820007324, "global_step": 437701, "epoch": 2605} {"train_loss": -12.556343078613281, "global_step": 437702, "epoch": 2605} {"train_loss": -12.27375602722168, "global_step": 437703, "epoch": 2605} {"train_loss": -11.809417724609375, "global_step": 437704, "epoch": 2605} {"train_loss": -12.402639389038086, "global_step": 437705, "epoch": 2605} {"train_loss": -11.945737838745117, "global_step": 437706, "epoch": 2605} {"train_loss": -11.993844985961914, "global_step": 437707, "epoch": 2605} {"train_loss": -12.06091022491455, "global_step": 437708, "epoch": 2605} {"train_loss": -12.18744945526123, "global_step": 437709, "epoch": 2605} {"train_loss": -12.108930587768555, "global_step": 437710, "epoch": 2605} {"train_loss": -12.289072036743164, "global_step": 437711, "epoch": 2605} {"train_loss": -12.040870666503906, "global_step": 437712, "epoch": 2605} {"train_loss": -12.234657287597656, "global_step": 437713, "epoch": 2605} {"train_loss": -12.247909545898438, "global_step": 437714, "epoch": 2605} {"train_loss": -12.61529541015625, "global_step": 437715, "epoch": 2605} {"train_loss": -12.060813903808594, "global_step": 437716, "epoch": 2605} {"train_loss": -12.367465019226074, "global_step": 437717, "epoch": 2605} {"train_loss": -11.525042533874512, "global_step": 437718, "epoch": 2605} {"train_loss": -12.468177795410156, "global_step": 437719, "epoch": 2605} {"train_loss": -11.934146881103516, "global_step": 437720, "epoch": 2605} {"train_loss": -11.7860689163208, "global_step": 437721, "epoch": 2605} {"train_loss": -12.33209228515625, "global_step": 437722, "epoch": 2605} {"train_loss": -11.538992881774902, "global_step": 437723, "epoch": 2605} {"train_loss": -12.56360912322998, "global_step": 437724, "epoch": 2605} {"train_loss": -12.186990737915039, "global_step": 437725, "epoch": 2605} {"train_loss": -12.011249542236328, "global_step": 437726, "epoch": 2605} {"train_loss": -12.080179214477539, "global_step": 437727, "epoch": 2605} {"train_loss": -11.852210998535156, "global_step": 437728, "epoch": 2605} {"train_loss": -11.756050109863281, "global_step": 437729, "epoch": 2605} {"train_loss": -11.818790435791016, "global_step": 437730, "epoch": 2605} {"train_loss": -11.577327728271484, "global_step": 437731, "epoch": 2605} {"train_loss": -11.673680305480957, "global_step": 437732, "epoch": 2605} {"train_loss": -11.21419906616211, "global_step": 437733, "epoch": 2605} {"train_loss": -11.484037399291992, "global_step": 437734, "epoch": 2605} {"train_loss": -11.862604141235352, "global_step": 437735, "epoch": 2605} {"train_loss": -11.376642227172852, "global_step": 437736, "epoch": 2605} {"train_loss": -12.105493545532227, "global_step": 437737, "epoch": 2605} {"train_loss": -11.310257911682129, "global_step": 437738, "epoch": 2605} {"train_loss": -12.329626083374023, "global_step": 437739, "epoch": 2605} {"train_loss": -11.500106811523438, "global_step": 437740, "epoch": 2605} {"train_loss": -11.972087860107422, "global_step": 437741, "epoch": 2605} {"train_loss": -12.210166931152344, "global_step": 437742, "epoch": 2605} {"train_loss": -11.270317077636719, "global_step": 437743, "epoch": 2605} {"train_loss": -12.288166046142578, "global_step": 437744, "epoch": 2605} {"train_loss": -11.851179122924805, "global_step": 437745, "epoch": 2605} {"train_loss": -12.296995162963867, "global_step": 437746, "epoch": 2605} {"train_loss": -11.384182929992676, "global_step": 437747, "epoch": 2605} {"train_loss": -12.344917297363281, "global_step": 437748, "epoch": 2605} {"train_loss": -11.848791122436523, "global_step": 437749, "epoch": 2605} {"train_loss": -12.24104118347168, "global_step": 437750, "epoch": 2605} {"train_loss": -12.060355186462402, "global_step": 437751, "epoch": 2605} {"train_loss": -12.093057632446289, "global_step": 437752, "epoch": 2605} {"train_loss": -12.284870147705078, "global_step": 437753, "epoch": 2605} {"train_loss": -11.981731414794922, "global_step": 437754, "epoch": 2605} {"train_loss": -12.364832878112793, "global_step": 437755, "epoch": 2605} {"train_loss": -12.155728340148926, "global_step": 437756, "epoch": 2605} {"train_loss": -12.49870777130127, "global_step": 437757, "epoch": 2605} {"train_loss": -12.211222648620605, "global_step": 437758, "epoch": 2605} {"train_loss": -12.127087593078613, "global_step": 437759, "epoch": 2605} {"train_loss": -12.062969207763672, "global_step": 437760, "epoch": 2605} {"train_loss": -12.16190242767334, "global_step": 437761, "epoch": 2605} {"train_loss": -12.302559852600098, "global_step": 437762, "epoch": 2605} {"train_loss": -12.604582786560059, "global_step": 437763, "epoch": 2605} {"train_loss": -12.420503616333008, "global_step": 437764, "epoch": 2605} {"train_loss": -12.643096923828125, "global_step": 437765, "epoch": 2605} {"train_loss": -12.338977813720703, "global_step": 437766, "epoch": 2605} {"train_loss": -12.271905899047852, "global_step": 437767, "epoch": 2605} {"train_loss": -12.611255645751953, "global_step": 437768, "epoch": 2605} {"train_loss": -12.458534240722656, "global_step": 437769, "epoch": 2605} {"train_loss": -12.568401336669922, "global_step": 437770, "epoch": 2605} {"train_loss": -12.444082260131836, "global_step": 437771, "epoch": 2605} {"train_loss": -12.541805267333984, "global_step": 437772, "epoch": 2605} {"train_loss": -12.208475112915039, "global_step": 437773, "epoch": 2605} {"train_loss": -12.734109878540039, "global_step": 437774, "epoch": 2605} {"train_loss": -12.51700210571289, "global_step": 437775, "epoch": 2605} {"train_loss": -12.553291320800781, "global_step": 437776, "epoch": 2605} {"train_loss": -12.799871444702148, "global_step": 437777, "epoch": 2605} {"train_loss": -12.733200073242188, "global_step": 437778, "epoch": 2605} {"train_loss": -12.814591407775879, "global_step": 437779, "epoch": 2605} {"train_loss": -12.828559875488281, "global_step": 437780, "epoch": 2605} {"train_loss": -12.69570541381836, "global_step": 437781, "epoch": 2605} {"train_loss": -12.76346206665039, "global_step": 437782, "epoch": 2605} {"train_loss": -12.722572326660156, "global_step": 437783, "epoch": 2605} {"train_loss": -12.825429916381836, "global_step": 437784, "epoch": 2605} {"train_loss": -12.62470817565918, "global_step": 437785, "epoch": 2605} {"train_loss": -12.70035171508789, "global_step": 437786, "epoch": 2605} {"train_loss": -12.533077239990234, "global_step": 437787, "epoch": 2605} {"train_loss": -12.611438751220703, "global_step": 437788, "epoch": 2605} {"train_loss": -12.54098892211914, "global_step": 437789, "epoch": 2605} {"train_loss": -12.800122261047363, "global_step": 437790, "epoch": 2605} {"train_loss": -12.380613327026367, "global_step": 437791, "epoch": 2605} {"train_loss": -12.777825355529785, "global_step": 437792, "epoch": 2605} {"train_loss": -12.559852600097656, "global_step": 437793, "epoch": 2605} {"train_loss": -12.822874069213867, "global_step": 437794, "epoch": 2605} {"train_loss": -12.5908842086792, "global_step": 437795, "epoch": 2605} {"train_loss": -12.72153377532959, "global_step": 437796, "epoch": 2605} {"train_loss": -12.44051742553711, "global_step": 437797, "epoch": 2605} {"train_loss": -12.749649047851562, "global_step": 437798, "epoch": 2605} {"train_loss": -12.444160461425781, "global_step": 437799, "epoch": 2605} {"train_loss": -12.556215286254883, "global_step": 437800, "epoch": 2605} {"train_loss": -12.539551734924316, "global_step": 437801, "epoch": 2605} {"train_loss": -12.746036529541016, "global_step": 437802, "epoch": 2605} {"train_loss": -12.961366653442383, "global_step": 437803, "epoch": 2605} {"train_loss": -12.620467185974121, "global_step": 437804, "epoch": 2605} {"train_loss": -12.806325912475586, "global_step": 437805, "epoch": 2605} {"train_loss": -12.4765043258667, "global_step": 437806, "epoch": 2605} {"train_loss": -11.918910656656537, "global_step": 437807, "epoch": 2605, "val_loss": 310554.53125, "train_action_mse_error": 1.3902548551559448} {"train_loss": -12.735419273376465, "global_step": 437808, "epoch": 2606} {"train_loss": -12.889452934265137, "global_step": 437809, "epoch": 2606} {"train_loss": -12.741863250732422, "global_step": 437810, "epoch": 2606} {"train_loss": -12.914163589477539, "global_step": 437811, "epoch": 2606} {"train_loss": -12.310637474060059, "global_step": 437812, "epoch": 2606} {"train_loss": -12.983026504516602, "global_step": 437813, "epoch": 2606} {"train_loss": -12.448297500610352, "global_step": 437814, "epoch": 2606} {"train_loss": -13.068743705749512, "global_step": 437815, "epoch": 2606} {"train_loss": -12.510761260986328, "global_step": 437816, "epoch": 2606} {"train_loss": -12.681108474731445, "global_step": 437817, "epoch": 2606} {"train_loss": -12.730447769165039, "global_step": 437818, "epoch": 2606} {"train_loss": -12.737035751342773, "global_step": 437819, "epoch": 2606} {"train_loss": -12.580306053161621, "global_step": 437820, "epoch": 2606} {"train_loss": -12.60328483581543, "global_step": 437821, "epoch": 2606} {"train_loss": -12.655773162841797, "global_step": 437822, "epoch": 2606} {"train_loss": -12.724845886230469, "global_step": 437823, "epoch": 2606} {"train_loss": -12.936379432678223, "global_step": 437824, "epoch": 2606} {"train_loss": -12.95046615600586, "global_step": 437825, "epoch": 2606} {"train_loss": -12.627378463745117, "global_step": 437826, "epoch": 2606} {"train_loss": -12.44013786315918, "global_step": 437827, "epoch": 2606} {"train_loss": -11.148792266845703, "global_step": 437828, "epoch": 2606} {"train_loss": -12.440752029418945, "global_step": 437829, "epoch": 2606} {"train_loss": -12.003037452697754, "global_step": 437830, "epoch": 2606} {"train_loss": -12.760648727416992, "global_step": 437831, "epoch": 2606} {"train_loss": -11.428312301635742, "global_step": 437832, "epoch": 2606} {"train_loss": -12.709041595458984, "global_step": 437833, "epoch": 2606} {"train_loss": -10.98072624206543, "global_step": 437834, "epoch": 2606} {"train_loss": -12.36661148071289, "global_step": 437835, "epoch": 2606} {"train_loss": -11.372357368469238, "global_step": 437836, "epoch": 2606} {"train_loss": -12.458988189697266, "global_step": 437837, "epoch": 2606} {"train_loss": -11.773224830627441, "global_step": 437838, "epoch": 2606} {"train_loss": -11.502737998962402, "global_step": 437839, "epoch": 2606} {"train_loss": -10.859201431274414, "global_step": 437840, "epoch": 2606} {"train_loss": -11.065055847167969, "global_step": 437841, "epoch": 2606} {"train_loss": -10.744410514831543, "global_step": 437842, "epoch": 2606} {"train_loss": -11.282808303833008, "global_step": 437843, "epoch": 2606} {"train_loss": -10.819968223571777, "global_step": 437844, "epoch": 2606} {"train_loss": -12.150976181030273, "global_step": 437845, "epoch": 2606} {"train_loss": -12.15031623840332, "global_step": 437846, "epoch": 2606} {"train_loss": -11.82636833190918, "global_step": 437847, "epoch": 2606} {"train_loss": -11.666801452636719, "global_step": 437848, "epoch": 2606} {"train_loss": -11.753233909606934, "global_step": 437849, "epoch": 2606} {"train_loss": -11.433069229125977, "global_step": 437850, "epoch": 2606} {"train_loss": -11.84200668334961, "global_step": 437851, "epoch": 2606} {"train_loss": -10.724407196044922, "global_step": 437852, "epoch": 2606} {"train_loss": -11.296728134155273, "global_step": 437853, "epoch": 2606} {"train_loss": -11.446313858032227, "global_step": 437854, "epoch": 2606} {"train_loss": -10.275777816772461, "global_step": 437855, "epoch": 2606} {"train_loss": -11.032106399536133, "global_step": 437856, "epoch": 2606} {"train_loss": -10.381813049316406, "global_step": 437857, "epoch": 2606} {"train_loss": -10.038480758666992, "global_step": 437858, "epoch": 2606} {"train_loss": -11.408602714538574, "global_step": 437859, "epoch": 2606} {"train_loss": -9.576181411743164, "global_step": 437860, "epoch": 2606} {"train_loss": -9.442928314208984, "global_step": 437861, "epoch": 2606} {"train_loss": -11.400087356567383, "global_step": 437862, "epoch": 2606} {"train_loss": -10.414311408996582, "global_step": 437863, "epoch": 2606} {"train_loss": -10.13002872467041, "global_step": 437864, "epoch": 2606} {"train_loss": -11.611265182495117, "global_step": 437865, "epoch": 2606} {"train_loss": -10.612382888793945, "global_step": 437866, "epoch": 2606} {"train_loss": -11.38673210144043, "global_step": 437867, "epoch": 2606} {"train_loss": -11.604942321777344, "global_step": 437868, "epoch": 2606} {"train_loss": -11.974782943725586, "global_step": 437869, "epoch": 2606} {"train_loss": -11.016607284545898, "global_step": 437870, "epoch": 2606} {"train_loss": -11.719897270202637, "global_step": 437871, "epoch": 2606} {"train_loss": -11.848428726196289, "global_step": 437872, "epoch": 2606} {"train_loss": -11.294126510620117, "global_step": 437873, "epoch": 2606} {"train_loss": -12.476302146911621, "global_step": 437874, "epoch": 2606} {"train_loss": -11.417510986328125, "global_step": 437875, "epoch": 2606} {"train_loss": -11.501745223999023, "global_step": 437876, "epoch": 2606} {"train_loss": -11.539102554321289, "global_step": 437877, "epoch": 2606} {"train_loss": -11.528647422790527, "global_step": 437878, "epoch": 2606} {"train_loss": -11.77933120727539, "global_step": 437879, "epoch": 2606} {"train_loss": -11.842432975769043, "global_step": 437880, "epoch": 2606} {"train_loss": -11.38189697265625, "global_step": 437881, "epoch": 2606} {"train_loss": -11.806557655334473, "global_step": 437882, "epoch": 2606} {"train_loss": -11.671442985534668, "global_step": 437883, "epoch": 2606} {"train_loss": -11.169702529907227, "global_step": 437884, "epoch": 2606} {"train_loss": -11.86094856262207, "global_step": 437885, "epoch": 2606} {"train_loss": -11.823531150817871, "global_step": 437886, "epoch": 2606} {"train_loss": -11.727543830871582, "global_step": 437887, "epoch": 2606} {"train_loss": -12.281648635864258, "global_step": 437888, "epoch": 2606} {"train_loss": -12.314628601074219, "global_step": 437889, "epoch": 2606} {"train_loss": -12.256734848022461, "global_step": 437890, "epoch": 2606} {"train_loss": -12.299703598022461, "global_step": 437891, "epoch": 2606} {"train_loss": -12.334928512573242, "global_step": 437892, "epoch": 2606} {"train_loss": -12.150714874267578, "global_step": 437893, "epoch": 2606} {"train_loss": -12.387237548828125, "global_step": 437894, "epoch": 2606} {"train_loss": -12.085369110107422, "global_step": 437895, "epoch": 2606} {"train_loss": -12.254194259643555, "global_step": 437896, "epoch": 2606} {"train_loss": -11.916364669799805, "global_step": 437897, "epoch": 2606} {"train_loss": -12.476016998291016, "global_step": 437898, "epoch": 2606} {"train_loss": -11.938119888305664, "global_step": 437899, "epoch": 2606} {"train_loss": -12.25748062133789, "global_step": 437900, "epoch": 2606} {"train_loss": -12.417675018310547, "global_step": 437901, "epoch": 2606} {"train_loss": -12.519641876220703, "global_step": 437902, "epoch": 2606} {"train_loss": -12.094562530517578, "global_step": 437903, "epoch": 2606} {"train_loss": -12.70393180847168, "global_step": 437904, "epoch": 2606} {"train_loss": -11.905564308166504, "global_step": 437905, "epoch": 2606} {"train_loss": -12.174131393432617, "global_step": 437906, "epoch": 2606} {"train_loss": -12.420143127441406, "global_step": 437907, "epoch": 2606} {"train_loss": -11.726778030395508, "global_step": 437908, "epoch": 2606} {"train_loss": -12.446828842163086, "global_step": 437909, "epoch": 2606} {"train_loss": -12.560003280639648, "global_step": 437910, "epoch": 2606} {"train_loss": -12.554182052612305, "global_step": 437911, "epoch": 2606} {"train_loss": -12.52267837524414, "global_step": 437912, "epoch": 2606} {"train_loss": -12.41666030883789, "global_step": 437913, "epoch": 2606} {"train_loss": -12.411131858825684, "global_step": 437914, "epoch": 2606} {"train_loss": -12.398833274841309, "global_step": 437915, "epoch": 2606} {"train_loss": -12.607891082763672, "global_step": 437916, "epoch": 2606} {"train_loss": -12.336763381958008, "global_step": 437917, "epoch": 2606} {"train_loss": -12.389309883117676, "global_step": 437918, "epoch": 2606} {"train_loss": -12.527557373046875, "global_step": 437919, "epoch": 2606} {"train_loss": -12.624263763427734, "global_step": 437920, "epoch": 2606} {"train_loss": -12.764381408691406, "global_step": 437921, "epoch": 2606} {"train_loss": -12.530567169189453, "global_step": 437922, "epoch": 2606} {"train_loss": -12.803645133972168, "global_step": 437923, "epoch": 2606} {"train_loss": -12.477668762207031, "global_step": 437924, "epoch": 2606} {"train_loss": -12.775514602661133, "global_step": 437925, "epoch": 2606} {"train_loss": -12.254754066467285, "global_step": 437926, "epoch": 2606} {"train_loss": -12.799930572509766, "global_step": 437927, "epoch": 2606} {"train_loss": -12.705528259277344, "global_step": 437928, "epoch": 2606} {"train_loss": -12.827281951904297, "global_step": 437929, "epoch": 2606} {"train_loss": -12.703045845031738, "global_step": 437930, "epoch": 2606} {"train_loss": -12.619906425476074, "global_step": 437931, "epoch": 2606} {"train_loss": -12.529755592346191, "global_step": 437932, "epoch": 2606} {"train_loss": -12.675955772399902, "global_step": 437933, "epoch": 2606} {"train_loss": -12.83367919921875, "global_step": 437934, "epoch": 2606} {"train_loss": -12.380367279052734, "global_step": 437935, "epoch": 2606} {"train_loss": -12.504234313964844, "global_step": 437936, "epoch": 2606} {"train_loss": -11.907493591308594, "global_step": 437937, "epoch": 2606} {"train_loss": -12.574888229370117, "global_step": 437938, "epoch": 2606} {"train_loss": -12.637324333190918, "global_step": 437939, "epoch": 2606} {"train_loss": -12.887062072753906, "global_step": 437940, "epoch": 2606} {"train_loss": -12.462202072143555, "global_step": 437941, "epoch": 2606} {"train_loss": -12.865459442138672, "global_step": 437942, "epoch": 2606} {"train_loss": -12.745023727416992, "global_step": 437943, "epoch": 2606} {"train_loss": -12.704564094543457, "global_step": 437944, "epoch": 2606} {"train_loss": -12.831560134887695, "global_step": 437945, "epoch": 2606} {"train_loss": -12.725441932678223, "global_step": 437946, "epoch": 2606} {"train_loss": -12.80637264251709, "global_step": 437947, "epoch": 2606} {"train_loss": -12.822175025939941, "global_step": 437948, "epoch": 2606} {"train_loss": -12.726081848144531, "global_step": 437949, "epoch": 2606} {"train_loss": -12.974398612976074, "global_step": 437950, "epoch": 2606} {"train_loss": -12.713197708129883, "global_step": 437951, "epoch": 2606} {"train_loss": -12.910106658935547, "global_step": 437952, "epoch": 2606} {"train_loss": -12.968947410583496, "global_step": 437953, "epoch": 2606} {"train_loss": -12.843916893005371, "global_step": 437954, "epoch": 2606} {"train_loss": -12.917793273925781, "global_step": 437955, "epoch": 2606} {"train_loss": -12.572735786437988, "global_step": 437956, "epoch": 2606} {"train_loss": -12.25943374633789, "global_step": 437957, "epoch": 2606} {"train_loss": -11.929512023925781, "global_step": 437958, "epoch": 2606} {"train_loss": -12.172591209411621, "global_step": 437959, "epoch": 2606} {"train_loss": -11.955790519714355, "global_step": 437960, "epoch": 2606} {"train_loss": -11.090337753295898, "global_step": 437961, "epoch": 2606} {"train_loss": -12.14210319519043, "global_step": 437962, "epoch": 2606} {"train_loss": -11.972251892089844, "global_step": 437963, "epoch": 2606} {"train_loss": -12.503829956054688, "global_step": 437964, "epoch": 2606} {"train_loss": -11.351951599121094, "global_step": 437965, "epoch": 2606} {"train_loss": -12.291694641113281, "global_step": 437966, "epoch": 2606} {"train_loss": -11.883843421936035, "global_step": 437967, "epoch": 2606} {"train_loss": -12.467552185058594, "global_step": 437968, "epoch": 2606} {"train_loss": -11.525535583496094, "global_step": 437969, "epoch": 2606} {"train_loss": -12.482988357543945, "global_step": 437970, "epoch": 2606} {"train_loss": -11.32563304901123, "global_step": 437971, "epoch": 2606} {"train_loss": -12.43575668334961, "global_step": 437972, "epoch": 2606} {"train_loss": -11.781519889831543, "global_step": 437973, "epoch": 2606} {"train_loss": -12.143211364746094, "global_step": 437974, "epoch": 2606} {"train_loss": -12.08354177361443, "global_step": 437975, "epoch": 2606, "val_loss": 312928.5625} {"train_loss": -12.397168159484863, "global_step": 437976, "epoch": 2607} {"train_loss": -12.16006088256836, "global_step": 437977, "epoch": 2607} {"train_loss": -11.285390853881836, "global_step": 437978, "epoch": 2607} {"train_loss": -10.436702728271484, "global_step": 437979, "epoch": 2607} {"train_loss": -12.172500610351562, "global_step": 437980, "epoch": 2607} {"train_loss": -9.879968643188477, "global_step": 437981, "epoch": 2607} {"train_loss": -10.224822998046875, "global_step": 437982, "epoch": 2607} {"train_loss": -10.039360046386719, "global_step": 437983, "epoch": 2607} {"train_loss": -9.177033424377441, "global_step": 437984, "epoch": 2607} {"train_loss": -8.207329750061035, "global_step": 437985, "epoch": 2607} {"train_loss": -8.3394193649292, "global_step": 437986, "epoch": 2607} {"train_loss": -7.768718719482422, "global_step": 437987, "epoch": 2607} {"train_loss": -8.754045486450195, "global_step": 437988, "epoch": 2607} {"train_loss": -7.941477298736572, "global_step": 437989, "epoch": 2607} {"train_loss": -8.62485122680664, "global_step": 437990, "epoch": 2607} {"train_loss": -8.875287055969238, "global_step": 437991, "epoch": 2607} {"train_loss": -8.295247077941895, "global_step": 437992, "epoch": 2607} {"train_loss": -8.537864685058594, "global_step": 437993, "epoch": 2607} {"train_loss": -8.418457984924316, "global_step": 437994, "epoch": 2607} {"train_loss": -9.158180236816406, "global_step": 437995, "epoch": 2607} {"train_loss": -9.005322456359863, "global_step": 437996, "epoch": 2607} {"train_loss": -8.96473217010498, "global_step": 437997, "epoch": 2607} {"train_loss": -9.147366523742676, "global_step": 437998, "epoch": 2607} {"train_loss": -10.16224479675293, "global_step": 437999, "epoch": 2607} {"train_loss": -10.91113567352295, "global_step": 438000, "epoch": 2607} {"train_loss": -10.181957244873047, "global_step": 438001, "epoch": 2607} {"train_loss": -10.444365501403809, "global_step": 438002, "epoch": 2607} {"train_loss": -8.993905067443848, "global_step": 438003, "epoch": 2607} {"train_loss": -9.61463451385498, "global_step": 438004, "epoch": 2607} {"train_loss": -10.511383056640625, "global_step": 438005, "epoch": 2607} {"train_loss": -9.690181732177734, "global_step": 438006, "epoch": 2607} {"train_loss": -9.792091369628906, "global_step": 438007, "epoch": 2607} {"train_loss": -10.157827377319336, "global_step": 438008, "epoch": 2607} {"train_loss": -9.363340377807617, "global_step": 438009, "epoch": 2607} {"train_loss": -10.631294250488281, "global_step": 438010, "epoch": 2607} {"train_loss": -9.417679786682129, "global_step": 438011, "epoch": 2607} {"train_loss": -9.172693252563477, "global_step": 438012, "epoch": 2607} {"train_loss": -10.44038200378418, "global_step": 438013, "epoch": 2607} {"train_loss": -9.897176742553711, "global_step": 438014, "epoch": 2607} {"train_loss": -11.32772159576416, "global_step": 438015, "epoch": 2607} {"train_loss": -9.90548324584961, "global_step": 438016, "epoch": 2607} {"train_loss": -10.063878059387207, "global_step": 438017, "epoch": 2607} {"train_loss": -11.589795112609863, "global_step": 438018, "epoch": 2607} {"train_loss": -10.378395080566406, "global_step": 438019, "epoch": 2607} {"train_loss": -10.788386344909668, "global_step": 438020, "epoch": 2607} {"train_loss": -10.229754447937012, "global_step": 438021, "epoch": 2607} {"train_loss": -11.437616348266602, "global_step": 438022, "epoch": 2607} {"train_loss": -10.242606163024902, "global_step": 438023, "epoch": 2607} {"train_loss": -11.895896911621094, "global_step": 438024, "epoch": 2607} {"train_loss": -10.874410629272461, "global_step": 438025, "epoch": 2607} {"train_loss": -11.661425590515137, "global_step": 438026, "epoch": 2607} {"train_loss": -11.74302864074707, "global_step": 438027, "epoch": 2607} {"train_loss": -11.790220260620117, "global_step": 438028, "epoch": 2607} {"train_loss": -11.100573539733887, "global_step": 438029, "epoch": 2607} {"train_loss": -11.465995788574219, "global_step": 438030, "epoch": 2607} {"train_loss": -11.388387680053711, "global_step": 438031, "epoch": 2607} {"train_loss": -11.20764446258545, "global_step": 438032, "epoch": 2607} {"train_loss": -11.929606437683105, "global_step": 438033, "epoch": 2607} {"train_loss": -11.359057426452637, "global_step": 438034, "epoch": 2607} {"train_loss": -11.944204330444336, "global_step": 438035, "epoch": 2607} {"train_loss": -11.705388069152832, "global_step": 438036, "epoch": 2607} {"train_loss": -12.216300964355469, "global_step": 438037, "epoch": 2607} {"train_loss": -11.322271347045898, "global_step": 438038, "epoch": 2607} {"train_loss": -12.277983665466309, "global_step": 438039, "epoch": 2607} {"train_loss": -11.864542007446289, "global_step": 438040, "epoch": 2607} {"train_loss": -11.874014854431152, "global_step": 438041, "epoch": 2607} {"train_loss": -12.176741600036621, "global_step": 438042, "epoch": 2607} {"train_loss": -12.041055679321289, "global_step": 438043, "epoch": 2607} {"train_loss": -11.955867767333984, "global_step": 438044, "epoch": 2607} {"train_loss": -12.109374046325684, "global_step": 438045, "epoch": 2607} {"train_loss": -12.024652481079102, "global_step": 438046, "epoch": 2607} {"train_loss": -12.05546760559082, "global_step": 438047, "epoch": 2607} {"train_loss": -12.245230674743652, "global_step": 438048, "epoch": 2607} {"train_loss": -12.014886856079102, "global_step": 438049, "epoch": 2607} {"train_loss": -12.200931549072266, "global_step": 438050, "epoch": 2607} {"train_loss": -12.358851432800293, "global_step": 438051, "epoch": 2607} {"train_loss": -12.285626411437988, "global_step": 438052, "epoch": 2607} {"train_loss": -12.499076843261719, "global_step": 438053, "epoch": 2607} {"train_loss": -12.515300750732422, "global_step": 438054, "epoch": 2607} {"train_loss": -12.268111228942871, "global_step": 438055, "epoch": 2607} {"train_loss": -12.494670867919922, "global_step": 438056, "epoch": 2607} {"train_loss": -12.497697830200195, "global_step": 438057, "epoch": 2607} {"train_loss": -12.515569686889648, "global_step": 438058, "epoch": 2607} {"train_loss": -12.196342468261719, "global_step": 438059, "epoch": 2607} {"train_loss": -12.459156036376953, "global_step": 438060, "epoch": 2607} {"train_loss": -12.50100326538086, "global_step": 438061, "epoch": 2607} {"train_loss": -12.401273727416992, "global_step": 438062, "epoch": 2607} {"train_loss": -12.36404037475586, "global_step": 438063, "epoch": 2607} {"train_loss": -12.468481063842773, "global_step": 438064, "epoch": 2607} {"train_loss": -12.497923851013184, "global_step": 438065, "epoch": 2607} {"train_loss": -12.659463882446289, "global_step": 438066, "epoch": 2607} {"train_loss": -12.53133773803711, "global_step": 438067, "epoch": 2607} {"train_loss": -12.381864547729492, "global_step": 438068, "epoch": 2607} {"train_loss": -12.338369369506836, "global_step": 438069, "epoch": 2607} {"train_loss": -12.532320022583008, "global_step": 438070, "epoch": 2607} {"train_loss": -12.410472869873047, "global_step": 438071, "epoch": 2607} {"train_loss": -12.5348482131958, "global_step": 438072, "epoch": 2607} {"train_loss": -12.539393424987793, "global_step": 438073, "epoch": 2607} {"train_loss": -12.301519393920898, "global_step": 438074, "epoch": 2607} {"train_loss": -12.698671340942383, "global_step": 438075, "epoch": 2607} {"train_loss": -12.421892166137695, "global_step": 438076, "epoch": 2607} {"train_loss": -12.596820831298828, "global_step": 438077, "epoch": 2607} {"train_loss": -12.819722175598145, "global_step": 438078, "epoch": 2607} {"train_loss": -12.609746932983398, "global_step": 438079, "epoch": 2607} {"train_loss": -12.545614242553711, "global_step": 438080, "epoch": 2607} {"train_loss": -12.664863586425781, "global_step": 438081, "epoch": 2607} {"train_loss": -12.441689491271973, "global_step": 438082, "epoch": 2607} {"train_loss": -12.614587783813477, "global_step": 438083, "epoch": 2607} {"train_loss": -12.492021560668945, "global_step": 438084, "epoch": 2607} {"train_loss": -12.639730453491211, "global_step": 438085, "epoch": 2607} {"train_loss": -12.730525970458984, "global_step": 438086, "epoch": 2607} {"train_loss": -12.692895889282227, "global_step": 438087, "epoch": 2607} {"train_loss": -12.830623626708984, "global_step": 438088, "epoch": 2607} {"train_loss": -12.457586288452148, "global_step": 438089, "epoch": 2607} {"train_loss": -12.789896011352539, "global_step": 438090, "epoch": 2607} {"train_loss": -12.791986465454102, "global_step": 438091, "epoch": 2607} {"train_loss": -12.817225456237793, "global_step": 438092, "epoch": 2607} {"train_loss": -12.683843612670898, "global_step": 438093, "epoch": 2607} {"train_loss": -12.533751487731934, "global_step": 438094, "epoch": 2607} {"train_loss": -12.661199569702148, "global_step": 438095, "epoch": 2607} {"train_loss": -12.585836410522461, "global_step": 438096, "epoch": 2607} {"train_loss": -12.511140823364258, "global_step": 438097, "epoch": 2607} {"train_loss": -12.979856491088867, "global_step": 438098, "epoch": 2607} {"train_loss": -12.696304321289062, "global_step": 438099, "epoch": 2607} {"train_loss": -12.48358154296875, "global_step": 438100, "epoch": 2607} {"train_loss": -12.738849639892578, "global_step": 438101, "epoch": 2607} {"train_loss": -12.791338920593262, "global_step": 438102, "epoch": 2607} {"train_loss": -12.709314346313477, "global_step": 438103, "epoch": 2607} {"train_loss": -12.69037914276123, "global_step": 438104, "epoch": 2607} {"train_loss": -12.571805953979492, "global_step": 438105, "epoch": 2607} {"train_loss": -12.805112838745117, "global_step": 438106, "epoch": 2607} {"train_loss": -12.653457641601562, "global_step": 438107, "epoch": 2607} {"train_loss": -12.612972259521484, "global_step": 438108, "epoch": 2607} {"train_loss": -12.687324523925781, "global_step": 438109, "epoch": 2607} {"train_loss": -12.843549728393555, "global_step": 438110, "epoch": 2607} {"train_loss": -12.383365631103516, "global_step": 438111, "epoch": 2607} {"train_loss": -12.28437328338623, "global_step": 438112, "epoch": 2607} {"train_loss": -12.621585845947266, "global_step": 438113, "epoch": 2607} {"train_loss": -12.394815444946289, "global_step": 438114, "epoch": 2607} {"train_loss": -11.945758819580078, "global_step": 438115, "epoch": 2607} {"train_loss": -12.343720436096191, "global_step": 438116, "epoch": 2607} {"train_loss": -12.689085006713867, "global_step": 438117, "epoch": 2607} {"train_loss": -12.000003814697266, "global_step": 438118, "epoch": 2607} {"train_loss": -12.596733093261719, "global_step": 438119, "epoch": 2607} {"train_loss": -12.202163696289062, "global_step": 438120, "epoch": 2607} {"train_loss": -12.350271224975586, "global_step": 438121, "epoch": 2607} {"train_loss": -12.196517944335938, "global_step": 438122, "epoch": 2607} {"train_loss": -12.450394630432129, "global_step": 438123, "epoch": 2607} {"train_loss": -12.497919082641602, "global_step": 438124, "epoch": 2607} {"train_loss": -12.309760093688965, "global_step": 438125, "epoch": 2607} {"train_loss": -12.720861434936523, "global_step": 438126, "epoch": 2607} {"train_loss": -12.528704643249512, "global_step": 438127, "epoch": 2607} {"train_loss": -11.607351303100586, "global_step": 438128, "epoch": 2607} {"train_loss": -11.377809524536133, "global_step": 438129, "epoch": 2607} {"train_loss": -12.578975677490234, "global_step": 438130, "epoch": 2607} {"train_loss": -10.340352058410645, "global_step": 438131, "epoch": 2607} {"train_loss": -11.466214179992676, "global_step": 438132, "epoch": 2607} {"train_loss": -11.752055168151855, "global_step": 438133, "epoch": 2607} {"train_loss": -12.397276878356934, "global_step": 438134, "epoch": 2607} {"train_loss": -11.965877532958984, "global_step": 438135, "epoch": 2607} {"train_loss": -11.961557388305664, "global_step": 438136, "epoch": 2607} {"train_loss": -11.508424758911133, "global_step": 438137, "epoch": 2607} {"train_loss": -11.19666862487793, "global_step": 438138, "epoch": 2607} {"train_loss": -11.864564895629883, "global_step": 438139, "epoch": 2607} {"train_loss": -11.00602912902832, "global_step": 438140, "epoch": 2607} {"train_loss": -11.629260063171387, "global_step": 438141, "epoch": 2607} {"train_loss": -11.60928726196289, "global_step": 438142, "epoch": 2607} {"train_loss": -11.557059018384843, "global_step": 438143, "epoch": 2607, "val_loss": 310389.53125} {"train_loss": -11.737863540649414, "global_step": 438144, "epoch": 2608} {"train_loss": -9.704309463500977, "global_step": 438145, "epoch": 2608} {"train_loss": -10.181297302246094, "global_step": 438146, "epoch": 2608} {"train_loss": -10.488395690917969, "global_step": 438147, "epoch": 2608} {"train_loss": -11.18520736694336, "global_step": 438148, "epoch": 2608} {"train_loss": -10.61037826538086, "global_step": 438149, "epoch": 2608} {"train_loss": -12.503799438476562, "global_step": 438150, "epoch": 2608} {"train_loss": -10.020930290222168, "global_step": 438151, "epoch": 2608} {"train_loss": -11.214601516723633, "global_step": 438152, "epoch": 2608} {"train_loss": -11.024635314941406, "global_step": 438153, "epoch": 2608} {"train_loss": -12.243389129638672, "global_step": 438154, "epoch": 2608} {"train_loss": -10.972891807556152, "global_step": 438155, "epoch": 2608} {"train_loss": -11.89345932006836, "global_step": 438156, "epoch": 2608} {"train_loss": -11.124755859375, "global_step": 438157, "epoch": 2608} {"train_loss": -12.012628555297852, "global_step": 438158, "epoch": 2608} {"train_loss": -11.290159225463867, "global_step": 438159, "epoch": 2608} {"train_loss": -11.758237838745117, "global_step": 438160, "epoch": 2608} {"train_loss": -12.024675369262695, "global_step": 438161, "epoch": 2608} {"train_loss": -11.59823226928711, "global_step": 438162, "epoch": 2608} {"train_loss": -11.889595031738281, "global_step": 438163, "epoch": 2608} {"train_loss": -11.80587387084961, "global_step": 438164, "epoch": 2608} {"train_loss": -12.270512580871582, "global_step": 438165, "epoch": 2608} {"train_loss": -12.205138206481934, "global_step": 438166, "epoch": 2608} {"train_loss": -11.762073516845703, "global_step": 438167, "epoch": 2608} {"train_loss": -12.108104705810547, "global_step": 438168, "epoch": 2608} {"train_loss": -11.889486312866211, "global_step": 438169, "epoch": 2608} {"train_loss": -11.895723342895508, "global_step": 438170, "epoch": 2608} {"train_loss": -11.880377769470215, "global_step": 438171, "epoch": 2608} {"train_loss": -11.964433670043945, "global_step": 438172, "epoch": 2608} {"train_loss": -12.537065505981445, "global_step": 438173, "epoch": 2608} {"train_loss": -12.456321716308594, "global_step": 438174, "epoch": 2608} {"train_loss": -12.361207962036133, "global_step": 438175, "epoch": 2608} {"train_loss": -12.387956619262695, "global_step": 438176, "epoch": 2608} {"train_loss": -12.199652671813965, "global_step": 438177, "epoch": 2608} {"train_loss": -12.488618850708008, "global_step": 438178, "epoch": 2608} {"train_loss": -11.863449096679688, "global_step": 438179, "epoch": 2608} {"train_loss": -12.593827247619629, "global_step": 438180, "epoch": 2608} {"train_loss": -12.250750541687012, "global_step": 438181, "epoch": 2608} {"train_loss": -12.516496658325195, "global_step": 438182, "epoch": 2608} {"train_loss": -12.274181365966797, "global_step": 438183, "epoch": 2608} {"train_loss": -12.45956039428711, "global_step": 438184, "epoch": 2608} {"train_loss": -12.023914337158203, "global_step": 438185, "epoch": 2608} {"train_loss": -12.481295585632324, "global_step": 438186, "epoch": 2608} {"train_loss": -12.45662784576416, "global_step": 438187, "epoch": 2608} {"train_loss": -12.16313362121582, "global_step": 438188, "epoch": 2608} {"train_loss": -11.991758346557617, "global_step": 438189, "epoch": 2608} {"train_loss": -12.440885543823242, "global_step": 438190, "epoch": 2608} {"train_loss": -12.141082763671875, "global_step": 438191, "epoch": 2608} {"train_loss": -12.574451446533203, "global_step": 438192, "epoch": 2608} {"train_loss": -12.572412490844727, "global_step": 438193, "epoch": 2608} {"train_loss": -12.433067321777344, "global_step": 438194, "epoch": 2608} {"train_loss": -12.330462455749512, "global_step": 438195, "epoch": 2608} {"train_loss": -12.524328231811523, "global_step": 438196, "epoch": 2608} {"train_loss": -12.515175819396973, "global_step": 438197, "epoch": 2608} {"train_loss": -12.1515531539917, "global_step": 438198, "epoch": 2608} {"train_loss": -12.73996353149414, "global_step": 438199, "epoch": 2608} {"train_loss": -12.44191837310791, "global_step": 438200, "epoch": 2608} {"train_loss": -12.037699699401855, "global_step": 438201, "epoch": 2608} {"train_loss": -12.42740249633789, "global_step": 438202, "epoch": 2608} {"train_loss": -11.922487258911133, "global_step": 438203, "epoch": 2608} {"train_loss": -12.368266105651855, "global_step": 438204, "epoch": 2608} {"train_loss": -12.45583724975586, "global_step": 438205, "epoch": 2608} {"train_loss": -11.721672058105469, "global_step": 438206, "epoch": 2608} {"train_loss": -12.38093376159668, "global_step": 438207, "epoch": 2608} {"train_loss": -12.325347900390625, "global_step": 438208, "epoch": 2608} {"train_loss": -11.857711791992188, "global_step": 438209, "epoch": 2608} {"train_loss": -12.676980972290039, "global_step": 438210, "epoch": 2608} {"train_loss": -11.676633834838867, "global_step": 438211, "epoch": 2608} {"train_loss": -12.637457847595215, "global_step": 438212, "epoch": 2608} {"train_loss": -12.585966110229492, "global_step": 438213, "epoch": 2608} {"train_loss": -12.529208183288574, "global_step": 438214, "epoch": 2608} {"train_loss": -12.302234649658203, "global_step": 438215, "epoch": 2608} {"train_loss": -11.962282180786133, "global_step": 438216, "epoch": 2608} {"train_loss": -12.195730209350586, "global_step": 438217, "epoch": 2608} {"train_loss": -12.325775146484375, "global_step": 438218, "epoch": 2608} {"train_loss": -11.874918937683105, "global_step": 438219, "epoch": 2608} {"train_loss": -12.783552169799805, "global_step": 438220, "epoch": 2608} {"train_loss": -12.276939392089844, "global_step": 438221, "epoch": 2608} {"train_loss": -12.58816909790039, "global_step": 438222, "epoch": 2608} {"train_loss": -12.352156639099121, "global_step": 438223, "epoch": 2608} {"train_loss": -12.232145309448242, "global_step": 438224, "epoch": 2608} {"train_loss": -12.210040092468262, "global_step": 438225, "epoch": 2608} {"train_loss": -11.727503776550293, "global_step": 438226, "epoch": 2608} {"train_loss": -12.135744094848633, "global_step": 438227, "epoch": 2608} {"train_loss": -11.968001365661621, "global_step": 438228, "epoch": 2608} {"train_loss": -11.849069595336914, "global_step": 438229, "epoch": 2608} {"train_loss": -10.747406005859375, "global_step": 438230, "epoch": 2608} {"train_loss": -12.022375106811523, "global_step": 438231, "epoch": 2608} {"train_loss": -10.567159652709961, "global_step": 438232, "epoch": 2608} {"train_loss": -11.913797378540039, "global_step": 438233, "epoch": 2608} {"train_loss": -11.406328201293945, "global_step": 438234, "epoch": 2608} {"train_loss": -11.78834056854248, "global_step": 438235, "epoch": 2608} {"train_loss": -11.5300874710083, "global_step": 438236, "epoch": 2608} {"train_loss": -10.897955894470215, "global_step": 438237, "epoch": 2608} {"train_loss": -11.86788272857666, "global_step": 438238, "epoch": 2608} {"train_loss": -10.180137634277344, "global_step": 438239, "epoch": 2608} {"train_loss": -11.579703330993652, "global_step": 438240, "epoch": 2608} {"train_loss": -10.818548202514648, "global_step": 438241, "epoch": 2608} {"train_loss": -11.38566780090332, "global_step": 438242, "epoch": 2608} {"train_loss": -11.575784683227539, "global_step": 438243, "epoch": 2608} {"train_loss": -11.389838218688965, "global_step": 438244, "epoch": 2608} {"train_loss": -10.900224685668945, "global_step": 438245, "epoch": 2608} {"train_loss": -11.991036415100098, "global_step": 438246, "epoch": 2608} {"train_loss": -10.900787353515625, "global_step": 438247, "epoch": 2608} {"train_loss": -11.955039978027344, "global_step": 438248, "epoch": 2608} {"train_loss": -11.59321403503418, "global_step": 438249, "epoch": 2608} {"train_loss": -11.223188400268555, "global_step": 438250, "epoch": 2608} {"train_loss": -11.288622856140137, "global_step": 438251, "epoch": 2608} {"train_loss": -11.254618644714355, "global_step": 438252, "epoch": 2608} {"train_loss": -11.85520076751709, "global_step": 438253, "epoch": 2608} {"train_loss": -11.680551528930664, "global_step": 438254, "epoch": 2608} {"train_loss": -12.035170555114746, "global_step": 438255, "epoch": 2608} {"train_loss": -12.254745483398438, "global_step": 438256, "epoch": 2608} {"train_loss": -12.327980041503906, "global_step": 438257, "epoch": 2608} {"train_loss": -11.966569900512695, "global_step": 438258, "epoch": 2608} {"train_loss": -12.437667846679688, "global_step": 438259, "epoch": 2608} {"train_loss": -11.98029899597168, "global_step": 438260, "epoch": 2608} {"train_loss": -11.891118049621582, "global_step": 438261, "epoch": 2608} {"train_loss": -12.141256332397461, "global_step": 438262, "epoch": 2608} {"train_loss": -11.856956481933594, "global_step": 438263, "epoch": 2608} {"train_loss": -11.968483924865723, "global_step": 438264, "epoch": 2608} {"train_loss": -11.754697799682617, "global_step": 438265, "epoch": 2608} {"train_loss": -11.667940139770508, "global_step": 438266, "epoch": 2608} {"train_loss": -11.7744722366333, "global_step": 438267, "epoch": 2608} {"train_loss": -11.961141586303711, "global_step": 438268, "epoch": 2608} {"train_loss": -11.624614715576172, "global_step": 438269, "epoch": 2608} {"train_loss": -11.849136352539062, "global_step": 438270, "epoch": 2608} {"train_loss": -11.619186401367188, "global_step": 438271, "epoch": 2608} {"train_loss": -11.111162185668945, "global_step": 438272, "epoch": 2608} {"train_loss": -11.540822982788086, "global_step": 438273, "epoch": 2608} {"train_loss": -12.266056060791016, "global_step": 438274, "epoch": 2608} {"train_loss": -11.45215129852295, "global_step": 438275, "epoch": 2608} {"train_loss": -11.541942596435547, "global_step": 438276, "epoch": 2608} {"train_loss": -11.296634674072266, "global_step": 438277, "epoch": 2608} {"train_loss": -11.287761688232422, "global_step": 438278, "epoch": 2608} {"train_loss": -11.72652816772461, "global_step": 438279, "epoch": 2608} {"train_loss": -11.622587203979492, "global_step": 438280, "epoch": 2608} {"train_loss": -12.380768775939941, "global_step": 438281, "epoch": 2608} {"train_loss": -12.100274085998535, "global_step": 438282, "epoch": 2608} {"train_loss": -12.118226051330566, "global_step": 438283, "epoch": 2608} {"train_loss": -12.110513687133789, "global_step": 438284, "epoch": 2608} {"train_loss": -11.740571022033691, "global_step": 438285, "epoch": 2608} {"train_loss": -11.942317962646484, "global_step": 438286, "epoch": 2608} {"train_loss": -11.783529281616211, "global_step": 438287, "epoch": 2608} {"train_loss": -11.721580505371094, "global_step": 438288, "epoch": 2608} {"train_loss": -12.206785202026367, "global_step": 438289, "epoch": 2608} {"train_loss": -11.769981384277344, "global_step": 438290, "epoch": 2608} {"train_loss": -12.040016174316406, "global_step": 438291, "epoch": 2608} {"train_loss": -12.26280689239502, "global_step": 438292, "epoch": 2608} {"train_loss": -11.938183784484863, "global_step": 438293, "epoch": 2608} {"train_loss": -12.268447875976562, "global_step": 438294, "epoch": 2608} {"train_loss": -12.225807189941406, "global_step": 438295, "epoch": 2608} {"train_loss": -12.324468612670898, "global_step": 438296, "epoch": 2608} {"train_loss": -12.113615036010742, "global_step": 438297, "epoch": 2608} {"train_loss": -12.268791198730469, "global_step": 438298, "epoch": 2608} {"train_loss": -12.111932754516602, "global_step": 438299, "epoch": 2608} {"train_loss": -12.33014965057373, "global_step": 438300, "epoch": 2608} {"train_loss": -12.36239242553711, "global_step": 438301, "epoch": 2608} {"train_loss": -12.186767578125, "global_step": 438302, "epoch": 2608} {"train_loss": -12.588176727294922, "global_step": 438303, "epoch": 2608} {"train_loss": -12.124405860900879, "global_step": 438304, "epoch": 2608} {"train_loss": -12.569259643554688, "global_step": 438305, "epoch": 2608} {"train_loss": -12.248930931091309, "global_step": 438306, "epoch": 2608} {"train_loss": -12.314836502075195, "global_step": 438307, "epoch": 2608} {"train_loss": -12.338717460632324, "global_step": 438308, "epoch": 2608} {"train_loss": -12.25319766998291, "global_step": 438309, "epoch": 2608} {"train_loss": -12.646296501159668, "global_step": 438310, "epoch": 2608} {"train_loss": -11.919555612972804, "global_step": 438311, "epoch": 2608, "val_loss": 312416.4375} {"train_loss": -12.361303329467773, "global_step": 438312, "epoch": 2609} {"train_loss": -12.065887451171875, "global_step": 438313, "epoch": 2609} {"train_loss": -12.199087142944336, "global_step": 438314, "epoch": 2609} {"train_loss": -12.627487182617188, "global_step": 438315, "epoch": 2609} {"train_loss": -12.315643310546875, "global_step": 438316, "epoch": 2609} {"train_loss": -12.757431983947754, "global_step": 438317, "epoch": 2609} {"train_loss": -12.583724975585938, "global_step": 438318, "epoch": 2609} {"train_loss": -12.541004180908203, "global_step": 438319, "epoch": 2609} {"train_loss": -12.126045227050781, "global_step": 438320, "epoch": 2609} {"train_loss": -12.442310333251953, "global_step": 438321, "epoch": 2609} {"train_loss": -12.331502914428711, "global_step": 438322, "epoch": 2609} {"train_loss": -12.503501892089844, "global_step": 438323, "epoch": 2609} {"train_loss": -12.824629783630371, "global_step": 438324, "epoch": 2609} {"train_loss": -12.439889907836914, "global_step": 438325, "epoch": 2609} {"train_loss": -12.458337783813477, "global_step": 438326, "epoch": 2609} {"train_loss": -12.507509231567383, "global_step": 438327, "epoch": 2609} {"train_loss": -12.272972106933594, "global_step": 438328, "epoch": 2609} {"train_loss": -12.495083808898926, "global_step": 438329, "epoch": 2609} {"train_loss": -12.383157730102539, "global_step": 438330, "epoch": 2609} {"train_loss": -12.675081253051758, "global_step": 438331, "epoch": 2609} {"train_loss": -12.83275032043457, "global_step": 438332, "epoch": 2609} {"train_loss": -12.82652473449707, "global_step": 438333, "epoch": 2609} {"train_loss": -12.551328659057617, "global_step": 438334, "epoch": 2609} {"train_loss": -12.647604942321777, "global_step": 438335, "epoch": 2609} {"train_loss": -12.830587387084961, "global_step": 438336, "epoch": 2609} {"train_loss": -12.72732162475586, "global_step": 438337, "epoch": 2609} {"train_loss": -12.736709594726562, "global_step": 438338, "epoch": 2609} {"train_loss": -12.918071746826172, "global_step": 438339, "epoch": 2609} {"train_loss": -12.69601821899414, "global_step": 438340, "epoch": 2609} {"train_loss": -12.700689315795898, "global_step": 438341, "epoch": 2609} {"train_loss": -12.778149604797363, "global_step": 438342, "epoch": 2609} {"train_loss": -12.55548095703125, "global_step": 438343, "epoch": 2609} {"train_loss": -12.228782653808594, "global_step": 438344, "epoch": 2609} {"train_loss": -12.573081016540527, "global_step": 438345, "epoch": 2609} {"train_loss": -12.727842330932617, "global_step": 438346, "epoch": 2609} {"train_loss": -12.649373054504395, "global_step": 438347, "epoch": 2609} {"train_loss": -12.843732833862305, "global_step": 438348, "epoch": 2609} {"train_loss": -12.77591323852539, "global_step": 438349, "epoch": 2609} {"train_loss": -12.447507858276367, "global_step": 438350, "epoch": 2609} {"train_loss": -12.739838600158691, "global_step": 438351, "epoch": 2609} {"train_loss": -12.678596496582031, "global_step": 438352, "epoch": 2609} {"train_loss": -12.60531997680664, "global_step": 438353, "epoch": 2609} {"train_loss": -12.54092025756836, "global_step": 438354, "epoch": 2609} {"train_loss": -12.074581146240234, "global_step": 438355, "epoch": 2609} {"train_loss": -12.495256423950195, "global_step": 438356, "epoch": 2609} {"train_loss": -12.92576789855957, "global_step": 438357, "epoch": 2609} {"train_loss": -12.326740264892578, "global_step": 438358, "epoch": 2609} {"train_loss": -12.634737014770508, "global_step": 438359, "epoch": 2609} {"train_loss": -12.675830841064453, "global_step": 438360, "epoch": 2609} {"train_loss": -12.66000747680664, "global_step": 438361, "epoch": 2609} {"train_loss": -12.36206340789795, "global_step": 438362, "epoch": 2609} {"train_loss": -12.509449005126953, "global_step": 438363, "epoch": 2609} {"train_loss": -11.940963745117188, "global_step": 438364, "epoch": 2609} {"train_loss": -12.406251907348633, "global_step": 438365, "epoch": 2609} {"train_loss": -12.418096542358398, "global_step": 438366, "epoch": 2609} {"train_loss": -12.032305717468262, "global_step": 438367, "epoch": 2609} {"train_loss": -11.395484924316406, "global_step": 438368, "epoch": 2609} {"train_loss": -11.852331161499023, "global_step": 438369, "epoch": 2609} {"train_loss": -11.513214111328125, "global_step": 438370, "epoch": 2609} {"train_loss": -11.371097564697266, "global_step": 438371, "epoch": 2609} {"train_loss": -12.56535530090332, "global_step": 438372, "epoch": 2609} {"train_loss": -11.691591262817383, "global_step": 438373, "epoch": 2609} {"train_loss": -11.591592788696289, "global_step": 438374, "epoch": 2609} {"train_loss": -11.383094787597656, "global_step": 438375, "epoch": 2609} {"train_loss": -11.737537384033203, "global_step": 438376, "epoch": 2609} {"train_loss": -10.881245613098145, "global_step": 438377, "epoch": 2609} {"train_loss": -12.236722946166992, "global_step": 438378, "epoch": 2609} {"train_loss": -11.004870414733887, "global_step": 438379, "epoch": 2609} {"train_loss": -12.185077667236328, "global_step": 438380, "epoch": 2609} {"train_loss": -11.404966354370117, "global_step": 438381, "epoch": 2609} {"train_loss": -12.333740234375, "global_step": 438382, "epoch": 2609} {"train_loss": -11.770099639892578, "global_step": 438383, "epoch": 2609} {"train_loss": -12.121068954467773, "global_step": 438384, "epoch": 2609} {"train_loss": -11.834949493408203, "global_step": 438385, "epoch": 2609} {"train_loss": -12.36497688293457, "global_step": 438386, "epoch": 2609} {"train_loss": -12.193979263305664, "global_step": 438387, "epoch": 2609} {"train_loss": -11.85750961303711, "global_step": 438388, "epoch": 2609} {"train_loss": -11.410253524780273, "global_step": 438389, "epoch": 2609} {"train_loss": -11.855298042297363, "global_step": 438390, "epoch": 2609} {"train_loss": -11.50721263885498, "global_step": 438391, "epoch": 2609} {"train_loss": -12.46815299987793, "global_step": 438392, "epoch": 2609} {"train_loss": -11.687308311462402, "global_step": 438393, "epoch": 2609} {"train_loss": -12.378854751586914, "global_step": 438394, "epoch": 2609} {"train_loss": -12.378220558166504, "global_step": 438395, "epoch": 2609} {"train_loss": -12.386106491088867, "global_step": 438396, "epoch": 2609} {"train_loss": -12.29434585571289, "global_step": 438397, "epoch": 2609} {"train_loss": -12.18173599243164, "global_step": 438398, "epoch": 2609} {"train_loss": -12.08206558227539, "global_step": 438399, "epoch": 2609} {"train_loss": -10.58895492553711, "global_step": 438400, "epoch": 2609} {"train_loss": -12.060372352600098, "global_step": 438401, "epoch": 2609} {"train_loss": -11.021406173706055, "global_step": 438402, "epoch": 2609} {"train_loss": -11.382396697998047, "global_step": 438403, "epoch": 2609} {"train_loss": -11.831814765930176, "global_step": 438404, "epoch": 2609} {"train_loss": -11.822120666503906, "global_step": 438405, "epoch": 2609} {"train_loss": -11.833036422729492, "global_step": 438406, "epoch": 2609} {"train_loss": -11.465690612792969, "global_step": 438407, "epoch": 2609} {"train_loss": -12.398820877075195, "global_step": 438408, "epoch": 2609} {"train_loss": -10.796791076660156, "global_step": 438409, "epoch": 2609} {"train_loss": -11.788538932800293, "global_step": 438410, "epoch": 2609} {"train_loss": -12.093088150024414, "global_step": 438411, "epoch": 2609} {"train_loss": -11.031583786010742, "global_step": 438412, "epoch": 2609} {"train_loss": -11.842157363891602, "global_step": 438413, "epoch": 2609} {"train_loss": -12.351365089416504, "global_step": 438414, "epoch": 2609} {"train_loss": -11.191608428955078, "global_step": 438415, "epoch": 2609} {"train_loss": -12.074766159057617, "global_step": 438416, "epoch": 2609} {"train_loss": -10.634769439697266, "global_step": 438417, "epoch": 2609} {"train_loss": -11.558297157287598, "global_step": 438418, "epoch": 2609} {"train_loss": -12.011007308959961, "global_step": 438419, "epoch": 2609} {"train_loss": -11.12010669708252, "global_step": 438420, "epoch": 2609} {"train_loss": -12.268302917480469, "global_step": 438421, "epoch": 2609} {"train_loss": -11.215250968933105, "global_step": 438422, "epoch": 2609} {"train_loss": -11.969474792480469, "global_step": 438423, "epoch": 2609} {"train_loss": -12.036449432373047, "global_step": 438424, "epoch": 2609} {"train_loss": -11.231016159057617, "global_step": 438425, "epoch": 2609} {"train_loss": -12.27444076538086, "global_step": 438426, "epoch": 2609} {"train_loss": -11.487934112548828, "global_step": 438427, "epoch": 2609} {"train_loss": -12.55819320678711, "global_step": 438428, "epoch": 2609} {"train_loss": -11.419252395629883, "global_step": 438429, "epoch": 2609} {"train_loss": -12.178479194641113, "global_step": 438430, "epoch": 2609} {"train_loss": -11.168566703796387, "global_step": 438431, "epoch": 2609} {"train_loss": -12.124778747558594, "global_step": 438432, "epoch": 2609} {"train_loss": -12.447652816772461, "global_step": 438433, "epoch": 2609} {"train_loss": -12.048518180847168, "global_step": 438434, "epoch": 2609} {"train_loss": -12.538012504577637, "global_step": 438435, "epoch": 2609} {"train_loss": -11.496871948242188, "global_step": 438436, "epoch": 2609} {"train_loss": -12.417128562927246, "global_step": 438437, "epoch": 2609} {"train_loss": -11.954849243164062, "global_step": 438438, "epoch": 2609} {"train_loss": -12.093273162841797, "global_step": 438439, "epoch": 2609} {"train_loss": -12.161076545715332, "global_step": 438440, "epoch": 2609} {"train_loss": -11.709177017211914, "global_step": 438441, "epoch": 2609} {"train_loss": -12.409036636352539, "global_step": 438442, "epoch": 2609} {"train_loss": -11.857261657714844, "global_step": 438443, "epoch": 2609} {"train_loss": -12.171209335327148, "global_step": 438444, "epoch": 2609} {"train_loss": -12.288455963134766, "global_step": 438445, "epoch": 2609} {"train_loss": -12.175981521606445, "global_step": 438446, "epoch": 2609} {"train_loss": -12.236181259155273, "global_step": 438447, "epoch": 2609} {"train_loss": -12.307530403137207, "global_step": 438448, "epoch": 2609} {"train_loss": -12.390944480895996, "global_step": 438449, "epoch": 2609} {"train_loss": -12.169708251953125, "global_step": 438450, "epoch": 2609} {"train_loss": -12.397688865661621, "global_step": 438451, "epoch": 2609} {"train_loss": -12.683382034301758, "global_step": 438452, "epoch": 2609} {"train_loss": -12.606871604919434, "global_step": 438453, "epoch": 2609} {"train_loss": -12.293100357055664, "global_step": 438454, "epoch": 2609} {"train_loss": -12.029121398925781, "global_step": 438455, "epoch": 2609} {"train_loss": -12.470195770263672, "global_step": 438456, "epoch": 2609} {"train_loss": -12.400604248046875, "global_step": 438457, "epoch": 2609} {"train_loss": -12.525248527526855, "global_step": 438458, "epoch": 2609} {"train_loss": -12.085517883300781, "global_step": 438459, "epoch": 2609} {"train_loss": -12.183286666870117, "global_step": 438460, "epoch": 2609} {"train_loss": -12.015070915222168, "global_step": 438461, "epoch": 2609} {"train_loss": -11.733053207397461, "global_step": 438462, "epoch": 2609} {"train_loss": -12.171283721923828, "global_step": 438463, "epoch": 2609} {"train_loss": -11.271356582641602, "global_step": 438464, "epoch": 2609} {"train_loss": -12.44173526763916, "global_step": 438465, "epoch": 2609} {"train_loss": -11.654505729675293, "global_step": 438466, "epoch": 2609} {"train_loss": -11.533332824707031, "global_step": 438467, "epoch": 2609} {"train_loss": -12.252822875976562, "global_step": 438468, "epoch": 2609} {"train_loss": -11.887632369995117, "global_step": 438469, "epoch": 2609} {"train_loss": -12.744197845458984, "global_step": 438470, "epoch": 2609} {"train_loss": -11.800243377685547, "global_step": 438471, "epoch": 2609} {"train_loss": -12.172897338867188, "global_step": 438472, "epoch": 2609} {"train_loss": -12.406265258789062, "global_step": 438473, "epoch": 2609} {"train_loss": -12.548555374145508, "global_step": 438474, "epoch": 2609} {"train_loss": -12.681779861450195, "global_step": 438475, "epoch": 2609} {"train_loss": -12.410751342773438, "global_step": 438476, "epoch": 2609} {"train_loss": -12.424184799194336, "global_step": 438477, "epoch": 2609} {"train_loss": -12.6283597946167, "global_step": 438478, "epoch": 2609} {"train_loss": -12.144142809368315, "global_step": 438479, "epoch": 2609, "val_loss": 311462.6875} {"train_loss": -12.421326637268066, "global_step": 438480, "epoch": 2610} {"train_loss": -12.258295059204102, "global_step": 438481, "epoch": 2610} {"train_loss": -12.593936920166016, "global_step": 438482, "epoch": 2610} {"train_loss": -12.088217735290527, "global_step": 438483, "epoch": 2610} {"train_loss": -12.3525972366333, "global_step": 438484, "epoch": 2610} {"train_loss": -12.20724868774414, "global_step": 438485, "epoch": 2610} {"train_loss": -12.057549476623535, "global_step": 438486, "epoch": 2610} {"train_loss": -12.042263984680176, "global_step": 438487, "epoch": 2610} {"train_loss": -12.414069175720215, "global_step": 438488, "epoch": 2610} {"train_loss": -12.433042526245117, "global_step": 438489, "epoch": 2610} {"train_loss": -12.601320266723633, "global_step": 438490, "epoch": 2610} {"train_loss": -12.403390884399414, "global_step": 438491, "epoch": 2610} {"train_loss": -12.518206596374512, "global_step": 438492, "epoch": 2610} {"train_loss": -12.799768447875977, "global_step": 438493, "epoch": 2610} {"train_loss": -12.278285026550293, "global_step": 438494, "epoch": 2610} {"train_loss": -12.89337158203125, "global_step": 438495, "epoch": 2610} {"train_loss": -12.515130996704102, "global_step": 438496, "epoch": 2610} {"train_loss": -12.667373657226562, "global_step": 438497, "epoch": 2610} {"train_loss": -12.530872344970703, "global_step": 438498, "epoch": 2610} {"train_loss": -12.71202278137207, "global_step": 438499, "epoch": 2610} {"train_loss": -12.810537338256836, "global_step": 438500, "epoch": 2610} {"train_loss": -12.746028900146484, "global_step": 438501, "epoch": 2610} {"train_loss": -12.681486129760742, "global_step": 438502, "epoch": 2610} {"train_loss": -12.679570198059082, "global_step": 438503, "epoch": 2610} {"train_loss": -12.806351661682129, "global_step": 438504, "epoch": 2610} {"train_loss": -12.551130294799805, "global_step": 438505, "epoch": 2610} {"train_loss": -12.611257553100586, "global_step": 438506, "epoch": 2610} {"train_loss": -12.515874862670898, "global_step": 438507, "epoch": 2610} {"train_loss": -12.829858779907227, "global_step": 438508, "epoch": 2610} {"train_loss": -12.493139266967773, "global_step": 438509, "epoch": 2610} {"train_loss": -12.260936737060547, "global_step": 438510, "epoch": 2610} {"train_loss": -12.753800392150879, "global_step": 438511, "epoch": 2610} {"train_loss": -12.299123764038086, "global_step": 438512, "epoch": 2610} {"train_loss": -12.531702041625977, "global_step": 438513, "epoch": 2610} {"train_loss": -12.210861206054688, "global_step": 438514, "epoch": 2610} {"train_loss": -12.689990997314453, "global_step": 438515, "epoch": 2610} {"train_loss": -12.475765228271484, "global_step": 438516, "epoch": 2610} {"train_loss": -12.792619705200195, "global_step": 438517, "epoch": 2610} {"train_loss": -12.235280990600586, "global_step": 438518, "epoch": 2610} {"train_loss": -12.805426597595215, "global_step": 438519, "epoch": 2610} {"train_loss": -12.410432815551758, "global_step": 438520, "epoch": 2610} {"train_loss": -12.425408363342285, "global_step": 438521, "epoch": 2610} {"train_loss": -11.929584503173828, "global_step": 438522, "epoch": 2610} {"train_loss": -12.627817153930664, "global_step": 438523, "epoch": 2610} {"train_loss": -12.507209777832031, "global_step": 438524, "epoch": 2610} {"train_loss": -12.68064022064209, "global_step": 438525, "epoch": 2610} {"train_loss": -12.22298812866211, "global_step": 438526, "epoch": 2610} {"train_loss": -12.88317584991455, "global_step": 438527, "epoch": 2610} {"train_loss": -12.47718620300293, "global_step": 438528, "epoch": 2610} {"train_loss": -12.81558609008789, "global_step": 438529, "epoch": 2610} {"train_loss": -12.217531204223633, "global_step": 438530, "epoch": 2610} {"train_loss": -12.536437034606934, "global_step": 438531, "epoch": 2610} {"train_loss": -12.406786918640137, "global_step": 438532, "epoch": 2610} {"train_loss": -12.620779037475586, "global_step": 438533, "epoch": 2610} {"train_loss": -12.21211051940918, "global_step": 438534, "epoch": 2610} {"train_loss": -11.842710494995117, "global_step": 438535, "epoch": 2610} {"train_loss": -11.702884674072266, "global_step": 438536, "epoch": 2610} {"train_loss": -12.282835006713867, "global_step": 438537, "epoch": 2610} {"train_loss": -11.953596115112305, "global_step": 438538, "epoch": 2610} {"train_loss": -12.4531831741333, "global_step": 438539, "epoch": 2610} {"train_loss": -11.743144035339355, "global_step": 438540, "epoch": 2610} {"train_loss": -12.705135345458984, "global_step": 438541, "epoch": 2610} {"train_loss": -11.916566848754883, "global_step": 438542, "epoch": 2610} {"train_loss": -12.568805694580078, "global_step": 438543, "epoch": 2610} {"train_loss": -12.03018569946289, "global_step": 438544, "epoch": 2610} {"train_loss": -12.786428451538086, "global_step": 438545, "epoch": 2610} {"train_loss": -12.423101425170898, "global_step": 438546, "epoch": 2610} {"train_loss": -12.590270042419434, "global_step": 438547, "epoch": 2610} {"train_loss": -11.7540922164917, "global_step": 438548, "epoch": 2610} {"train_loss": -12.884119033813477, "global_step": 438549, "epoch": 2610} {"train_loss": -12.219846725463867, "global_step": 438550, "epoch": 2610} {"train_loss": -12.082030296325684, "global_step": 438551, "epoch": 2610} {"train_loss": -12.456062316894531, "global_step": 438552, "epoch": 2610} {"train_loss": -12.509431838989258, "global_step": 438553, "epoch": 2610} {"train_loss": -12.324471473693848, "global_step": 438554, "epoch": 2610} {"train_loss": -12.103395462036133, "global_step": 438555, "epoch": 2610} {"train_loss": -12.676006317138672, "global_step": 438556, "epoch": 2610} {"train_loss": -12.407088279724121, "global_step": 438557, "epoch": 2610} {"train_loss": -12.393393516540527, "global_step": 438558, "epoch": 2610} {"train_loss": -12.158038139343262, "global_step": 438559, "epoch": 2610} {"train_loss": -12.632011413574219, "global_step": 438560, "epoch": 2610} {"train_loss": -11.125114440917969, "global_step": 438561, "epoch": 2610} {"train_loss": -11.740459442138672, "global_step": 438562, "epoch": 2610} {"train_loss": -11.895830154418945, "global_step": 438563, "epoch": 2610} {"train_loss": -11.551721572875977, "global_step": 438564, "epoch": 2610} {"train_loss": -10.802690505981445, "global_step": 438565, "epoch": 2610} {"train_loss": -11.774190902709961, "global_step": 438566, "epoch": 2610} {"train_loss": -11.091673851013184, "global_step": 438567, "epoch": 2610} {"train_loss": -11.020687103271484, "global_step": 438568, "epoch": 2610} {"train_loss": -11.697264671325684, "global_step": 438569, "epoch": 2610} {"train_loss": -10.880606651306152, "global_step": 438570, "epoch": 2610} {"train_loss": -10.411510467529297, "global_step": 438571, "epoch": 2610} {"train_loss": -11.596487998962402, "global_step": 438572, "epoch": 2610} {"train_loss": -11.214446067810059, "global_step": 438573, "epoch": 2610} {"train_loss": -11.328567504882812, "global_step": 438574, "epoch": 2610} {"train_loss": -10.697771072387695, "global_step": 438575, "epoch": 2610} {"train_loss": -11.941427230834961, "global_step": 438576, "epoch": 2610} {"train_loss": -11.439265251159668, "global_step": 438577, "epoch": 2610} {"train_loss": -11.298830032348633, "global_step": 438578, "epoch": 2610} {"train_loss": -10.873741149902344, "global_step": 438579, "epoch": 2610} {"train_loss": -10.066486358642578, "global_step": 438580, "epoch": 2610} {"train_loss": -11.154332160949707, "global_step": 438581, "epoch": 2610} {"train_loss": -11.599737167358398, "global_step": 438582, "epoch": 2610} {"train_loss": -10.312254905700684, "global_step": 438583, "epoch": 2610} {"train_loss": -11.38516902923584, "global_step": 438584, "epoch": 2610} {"train_loss": -11.003551483154297, "global_step": 438585, "epoch": 2610} {"train_loss": -11.358159065246582, "global_step": 438586, "epoch": 2610} {"train_loss": -11.76835823059082, "global_step": 438587, "epoch": 2610} {"train_loss": -11.375362396240234, "global_step": 438588, "epoch": 2610} {"train_loss": -11.372945785522461, "global_step": 438589, "epoch": 2610} {"train_loss": -11.495567321777344, "global_step": 438590, "epoch": 2610} {"train_loss": -12.060236930847168, "global_step": 438591, "epoch": 2610} {"train_loss": -11.49313735961914, "global_step": 438592, "epoch": 2610} {"train_loss": -12.053703308105469, "global_step": 438593, "epoch": 2610} {"train_loss": -11.969346046447754, "global_step": 438594, "epoch": 2610} {"train_loss": -12.100159645080566, "global_step": 438595, "epoch": 2610} {"train_loss": -11.970118522644043, "global_step": 438596, "epoch": 2610} {"train_loss": -11.794654846191406, "global_step": 438597, "epoch": 2610} {"train_loss": -11.814969062805176, "global_step": 438598, "epoch": 2610} {"train_loss": -12.285317420959473, "global_step": 438599, "epoch": 2610} {"train_loss": -12.220542907714844, "global_step": 438600, "epoch": 2610} {"train_loss": -12.285179138183594, "global_step": 438601, "epoch": 2610} {"train_loss": -11.728179931640625, "global_step": 438602, "epoch": 2610} {"train_loss": -12.240527153015137, "global_step": 438603, "epoch": 2610} {"train_loss": -12.24307918548584, "global_step": 438604, "epoch": 2610} {"train_loss": -12.200464248657227, "global_step": 438605, "epoch": 2610} {"train_loss": -12.046628952026367, "global_step": 438606, "epoch": 2610} {"train_loss": -12.037360191345215, "global_step": 438607, "epoch": 2610} {"train_loss": -12.212974548339844, "global_step": 438608, "epoch": 2610} {"train_loss": -12.334053993225098, "global_step": 438609, "epoch": 2610} {"train_loss": -12.272366523742676, "global_step": 438610, "epoch": 2610} {"train_loss": -12.545862197875977, "global_step": 438611, "epoch": 2610} {"train_loss": -12.290203094482422, "global_step": 438612, "epoch": 2610} {"train_loss": -12.474032402038574, "global_step": 438613, "epoch": 2610} {"train_loss": -12.273967742919922, "global_step": 438614, "epoch": 2610} {"train_loss": -12.318713188171387, "global_step": 438615, "epoch": 2610} {"train_loss": -11.959019660949707, "global_step": 438616, "epoch": 2610} {"train_loss": -12.309494018554688, "global_step": 438617, "epoch": 2610} {"train_loss": -12.287089347839355, "global_step": 438618, "epoch": 2610} {"train_loss": -12.313782691955566, "global_step": 438619, "epoch": 2610} {"train_loss": -12.232535362243652, "global_step": 438620, "epoch": 2610} {"train_loss": -12.118124961853027, "global_step": 438621, "epoch": 2610} {"train_loss": -12.31973648071289, "global_step": 438622, "epoch": 2610} {"train_loss": -12.082708358764648, "global_step": 438623, "epoch": 2610} {"train_loss": -12.279449462890625, "global_step": 438624, "epoch": 2610} {"train_loss": -12.365560531616211, "global_step": 438625, "epoch": 2610} {"train_loss": -12.38283634185791, "global_step": 438626, "epoch": 2610} {"train_loss": -12.422847747802734, "global_step": 438627, "epoch": 2610} {"train_loss": -12.472068786621094, "global_step": 438628, "epoch": 2610} {"train_loss": -12.096525192260742, "global_step": 438629, "epoch": 2610} {"train_loss": -12.299751281738281, "global_step": 438630, "epoch": 2610} {"train_loss": -12.15501594543457, "global_step": 438631, "epoch": 2610} {"train_loss": -12.580924987792969, "global_step": 438632, "epoch": 2610} {"train_loss": -12.246932983398438, "global_step": 438633, "epoch": 2610} {"train_loss": -12.09677505493164, "global_step": 438634, "epoch": 2610} {"train_loss": -11.7049560546875, "global_step": 438635, "epoch": 2610} {"train_loss": -12.48892593383789, "global_step": 438636, "epoch": 2610} {"train_loss": -11.613875389099121, "global_step": 438637, "epoch": 2610} {"train_loss": -12.137182235717773, "global_step": 438638, "epoch": 2610} {"train_loss": -12.573013305664062, "global_step": 438639, "epoch": 2610} {"train_loss": -11.835742950439453, "global_step": 438640, "epoch": 2610} {"train_loss": -11.933107376098633, "global_step": 438641, "epoch": 2610} {"train_loss": -12.273764610290527, "global_step": 438642, "epoch": 2610} {"train_loss": -12.287984848022461, "global_step": 438643, "epoch": 2610} {"train_loss": -12.602334022521973, "global_step": 438644, "epoch": 2610} {"train_loss": -12.246186256408691, "global_step": 438645, "epoch": 2610} {"train_loss": -12.323070526123047, "global_step": 438646, "epoch": 2610} {"train_loss": -12.136885535149347, "global_step": 438647, "epoch": 2610, "val_loss": 310656.90625, "train_action_mse_error": 1.66713285446167} {"train_loss": -12.274606704711914, "global_step": 438648, "epoch": 2611} {"train_loss": -11.747730255126953, "global_step": 438649, "epoch": 2611} {"train_loss": -12.3587646484375, "global_step": 438650, "epoch": 2611} {"train_loss": -11.966218948364258, "global_step": 438651, "epoch": 2611} {"train_loss": -12.385271072387695, "global_step": 438652, "epoch": 2611} {"train_loss": -12.327857971191406, "global_step": 438653, "epoch": 2611} {"train_loss": -12.332026481628418, "global_step": 438654, "epoch": 2611} {"train_loss": -11.800679206848145, "global_step": 438655, "epoch": 2611} {"train_loss": -11.647272109985352, "global_step": 438656, "epoch": 2611} {"train_loss": -12.345529556274414, "global_step": 438657, "epoch": 2611} {"train_loss": -11.171783447265625, "global_step": 438658, "epoch": 2611} {"train_loss": -10.478652000427246, "global_step": 438659, "epoch": 2611} {"train_loss": -11.683893203735352, "global_step": 438660, "epoch": 2611} {"train_loss": -11.742546081542969, "global_step": 438661, "epoch": 2611} {"train_loss": -11.442389488220215, "global_step": 438662, "epoch": 2611} {"train_loss": -11.960047721862793, "global_step": 438663, "epoch": 2611} {"train_loss": -11.522005081176758, "global_step": 438664, "epoch": 2611} {"train_loss": -12.11014461517334, "global_step": 438665, "epoch": 2611} {"train_loss": -11.935644149780273, "global_step": 438666, "epoch": 2611} {"train_loss": -11.601688385009766, "global_step": 438667, "epoch": 2611} {"train_loss": -12.41970157623291, "global_step": 438668, "epoch": 2611} {"train_loss": -12.02406120300293, "global_step": 438669, "epoch": 2611} {"train_loss": -11.91702938079834, "global_step": 438670, "epoch": 2611} {"train_loss": -12.382567405700684, "global_step": 438671, "epoch": 2611} {"train_loss": -12.254727363586426, "global_step": 438672, "epoch": 2611} {"train_loss": -12.417673110961914, "global_step": 438673, "epoch": 2611} {"train_loss": -12.58605670928955, "global_step": 438674, "epoch": 2611} {"train_loss": -12.41384220123291, "global_step": 438675, "epoch": 2611} {"train_loss": -12.340124130249023, "global_step": 438676, "epoch": 2611} {"train_loss": -12.512730598449707, "global_step": 438677, "epoch": 2611} {"train_loss": -12.26215934753418, "global_step": 438678, "epoch": 2611} {"train_loss": -12.517024993896484, "global_step": 438679, "epoch": 2611} {"train_loss": -12.353813171386719, "global_step": 438680, "epoch": 2611} {"train_loss": -12.603351593017578, "global_step": 438681, "epoch": 2611} {"train_loss": -12.332246780395508, "global_step": 438682, "epoch": 2611} {"train_loss": -12.658402442932129, "global_step": 438683, "epoch": 2611} {"train_loss": -12.238797187805176, "global_step": 438684, "epoch": 2611} {"train_loss": -12.810686111450195, "global_step": 438685, "epoch": 2611} {"train_loss": -12.573604583740234, "global_step": 438686, "epoch": 2611} {"train_loss": -12.675704956054688, "global_step": 438687, "epoch": 2611} {"train_loss": -12.766804695129395, "global_step": 438688, "epoch": 2611} {"train_loss": -12.455021858215332, "global_step": 438689, "epoch": 2611} {"train_loss": -12.425989151000977, "global_step": 438690, "epoch": 2611} {"train_loss": -12.350634574890137, "global_step": 438691, "epoch": 2611} {"train_loss": -12.453130722045898, "global_step": 438692, "epoch": 2611} {"train_loss": -12.461599349975586, "global_step": 438693, "epoch": 2611} {"train_loss": -12.827228546142578, "global_step": 438694, "epoch": 2611} {"train_loss": -12.203503608703613, "global_step": 438695, "epoch": 2611} {"train_loss": -12.716974258422852, "global_step": 438696, "epoch": 2611} {"train_loss": -12.750096321105957, "global_step": 438697, "epoch": 2611} {"train_loss": -12.620260238647461, "global_step": 438698, "epoch": 2611} {"train_loss": -12.568632125854492, "global_step": 438699, "epoch": 2611} {"train_loss": -12.474325180053711, "global_step": 438700, "epoch": 2611} {"train_loss": -12.571284294128418, "global_step": 438701, "epoch": 2611} {"train_loss": -12.266495704650879, "global_step": 438702, "epoch": 2611} {"train_loss": -12.585193634033203, "global_step": 438703, "epoch": 2611} {"train_loss": -12.45169734954834, "global_step": 438704, "epoch": 2611} {"train_loss": -12.112312316894531, "global_step": 438705, "epoch": 2611} {"train_loss": -12.739297866821289, "global_step": 438706, "epoch": 2611} {"train_loss": -12.00948715209961, "global_step": 438707, "epoch": 2611} {"train_loss": -12.562352180480957, "global_step": 438708, "epoch": 2611} {"train_loss": -12.049564361572266, "global_step": 438709, "epoch": 2611} {"train_loss": -11.854601860046387, "global_step": 438710, "epoch": 2611} {"train_loss": -12.239875793457031, "global_step": 438711, "epoch": 2611} {"train_loss": -12.250465393066406, "global_step": 438712, "epoch": 2611} {"train_loss": -12.431516647338867, "global_step": 438713, "epoch": 2611} {"train_loss": -12.694257736206055, "global_step": 438714, "epoch": 2611} {"train_loss": -12.246811866760254, "global_step": 438715, "epoch": 2611} {"train_loss": -12.627044677734375, "global_step": 438716, "epoch": 2611} {"train_loss": -11.863160133361816, "global_step": 438717, "epoch": 2611} {"train_loss": -11.718011856079102, "global_step": 438718, "epoch": 2611} {"train_loss": -12.689040184020996, "global_step": 438719, "epoch": 2611} {"train_loss": -11.961580276489258, "global_step": 438720, "epoch": 2611} {"train_loss": -12.068611145019531, "global_step": 438721, "epoch": 2611} {"train_loss": -11.963142395019531, "global_step": 438722, "epoch": 2611} {"train_loss": -12.35525131225586, "global_step": 438723, "epoch": 2611} {"train_loss": -12.381772994995117, "global_step": 438724, "epoch": 2611} {"train_loss": -11.757678985595703, "global_step": 438725, "epoch": 2611} {"train_loss": -11.687092781066895, "global_step": 438726, "epoch": 2611} {"train_loss": -12.714828491210938, "global_step": 438727, "epoch": 2611} {"train_loss": -11.675424575805664, "global_step": 438728, "epoch": 2611} {"train_loss": -11.897788047790527, "global_step": 438729, "epoch": 2611} {"train_loss": -12.23676872253418, "global_step": 438730, "epoch": 2611} {"train_loss": -12.18834114074707, "global_step": 438731, "epoch": 2611} {"train_loss": -11.099706649780273, "global_step": 438732, "epoch": 2611} {"train_loss": -11.523880004882812, "global_step": 438733, "epoch": 2611} {"train_loss": -12.00787353515625, "global_step": 438734, "epoch": 2611} {"train_loss": -10.604251861572266, "global_step": 438735, "epoch": 2611} {"train_loss": -11.677206039428711, "global_step": 438736, "epoch": 2611} {"train_loss": -11.806951522827148, "global_step": 438737, "epoch": 2611} {"train_loss": -11.553106307983398, "global_step": 438738, "epoch": 2611} {"train_loss": -12.064821243286133, "global_step": 438739, "epoch": 2611} {"train_loss": -11.651226043701172, "global_step": 438740, "epoch": 2611} {"train_loss": -12.151044845581055, "global_step": 438741, "epoch": 2611} {"train_loss": -11.637378692626953, "global_step": 438742, "epoch": 2611} {"train_loss": -11.42237663269043, "global_step": 438743, "epoch": 2611} {"train_loss": -11.306391716003418, "global_step": 438744, "epoch": 2611} {"train_loss": -12.189323425292969, "global_step": 438745, "epoch": 2611} {"train_loss": -12.030044555664062, "global_step": 438746, "epoch": 2611} {"train_loss": -11.844411849975586, "global_step": 438747, "epoch": 2611} {"train_loss": -11.699445724487305, "global_step": 438748, "epoch": 2611} {"train_loss": -11.066417694091797, "global_step": 438749, "epoch": 2611} {"train_loss": -11.792957305908203, "global_step": 438750, "epoch": 2611} {"train_loss": -11.823266983032227, "global_step": 438751, "epoch": 2611} {"train_loss": -10.961860656738281, "global_step": 438752, "epoch": 2611} {"train_loss": -11.823797225952148, "global_step": 438753, "epoch": 2611} {"train_loss": -11.561556816101074, "global_step": 438754, "epoch": 2611} {"train_loss": -11.762097358703613, "global_step": 438755, "epoch": 2611} {"train_loss": -11.787210464477539, "global_step": 438756, "epoch": 2611} {"train_loss": -11.823919296264648, "global_step": 438757, "epoch": 2611} {"train_loss": -12.124269485473633, "global_step": 438758, "epoch": 2611} {"train_loss": -11.458602905273438, "global_step": 438759, "epoch": 2611} {"train_loss": -12.003796577453613, "global_step": 438760, "epoch": 2611} {"train_loss": -11.582191467285156, "global_step": 438761, "epoch": 2611} {"train_loss": -12.540851593017578, "global_step": 438762, "epoch": 2611} {"train_loss": -11.54287338256836, "global_step": 438763, "epoch": 2611} {"train_loss": -11.91704273223877, "global_step": 438764, "epoch": 2611} {"train_loss": -11.880725860595703, "global_step": 438765, "epoch": 2611} {"train_loss": -12.309762001037598, "global_step": 438766, "epoch": 2611} {"train_loss": -12.004310607910156, "global_step": 438767, "epoch": 2611} {"train_loss": -12.160858154296875, "global_step": 438768, "epoch": 2611} {"train_loss": -11.975650787353516, "global_step": 438769, "epoch": 2611} {"train_loss": -12.412132263183594, "global_step": 438770, "epoch": 2611} {"train_loss": -11.929193496704102, "global_step": 438771, "epoch": 2611} {"train_loss": -12.669252395629883, "global_step": 438772, "epoch": 2611} {"train_loss": -12.222497940063477, "global_step": 438773, "epoch": 2611} {"train_loss": -12.387919425964355, "global_step": 438774, "epoch": 2611} {"train_loss": -12.654651641845703, "global_step": 438775, "epoch": 2611} {"train_loss": -12.320585250854492, "global_step": 438776, "epoch": 2611} {"train_loss": -12.399784088134766, "global_step": 438777, "epoch": 2611} {"train_loss": -12.546960830688477, "global_step": 438778, "epoch": 2611} {"train_loss": -12.578413963317871, "global_step": 438779, "epoch": 2611} {"train_loss": -12.502778053283691, "global_step": 438780, "epoch": 2611} {"train_loss": -12.505838394165039, "global_step": 438781, "epoch": 2611} {"train_loss": -12.371063232421875, "global_step": 438782, "epoch": 2611} {"train_loss": -12.696514129638672, "global_step": 438783, "epoch": 2611} {"train_loss": -12.620037078857422, "global_step": 438784, "epoch": 2611} {"train_loss": -12.624017715454102, "global_step": 438785, "epoch": 2611} {"train_loss": -12.405498504638672, "global_step": 438786, "epoch": 2611} {"train_loss": -12.715458869934082, "global_step": 438787, "epoch": 2611} {"train_loss": -12.592721939086914, "global_step": 438788, "epoch": 2611} {"train_loss": -12.57506275177002, "global_step": 438789, "epoch": 2611} {"train_loss": -12.669889450073242, "global_step": 438790, "epoch": 2611} {"train_loss": -12.474074363708496, "global_step": 438791, "epoch": 2611} {"train_loss": -12.332403182983398, "global_step": 438792, "epoch": 2611} {"train_loss": -12.668128967285156, "global_step": 438793, "epoch": 2611} {"train_loss": -12.472015380859375, "global_step": 438794, "epoch": 2611} {"train_loss": -12.72899055480957, "global_step": 438795, "epoch": 2611} {"train_loss": -12.498069763183594, "global_step": 438796, "epoch": 2611} {"train_loss": -12.514394760131836, "global_step": 438797, "epoch": 2611} {"train_loss": -12.386218070983887, "global_step": 438798, "epoch": 2611} {"train_loss": -12.787277221679688, "global_step": 438799, "epoch": 2611} {"train_loss": -12.648273468017578, "global_step": 438800, "epoch": 2611} {"train_loss": -12.628761291503906, "global_step": 438801, "epoch": 2611} {"train_loss": -12.870626449584961, "global_step": 438802, "epoch": 2611} {"train_loss": -12.439545631408691, "global_step": 438803, "epoch": 2611} {"train_loss": -12.806638717651367, "global_step": 438804, "epoch": 2611} {"train_loss": -12.550252914428711, "global_step": 438805, "epoch": 2611} {"train_loss": -12.448078155517578, "global_step": 438806, "epoch": 2611} {"train_loss": -12.65172290802002, "global_step": 438807, "epoch": 2611} {"train_loss": -12.13158893585205, "global_step": 438808, "epoch": 2611} {"train_loss": -12.704665184020996, "global_step": 438809, "epoch": 2611} {"train_loss": -12.498708724975586, "global_step": 438810, "epoch": 2611} {"train_loss": -12.605056762695312, "global_step": 438811, "epoch": 2611} {"train_loss": -12.424238204956055, "global_step": 438812, "epoch": 2611} {"train_loss": -12.049330711364746, "global_step": 438813, "epoch": 2611} {"train_loss": -12.622062683105469, "global_step": 438814, "epoch": 2611} {"train_loss": -12.194303064119248, "global_step": 438815, "epoch": 2611, "val_loss": 312483.96875} {"train_loss": -11.904899597167969, "global_step": 438816, "epoch": 2612} {"train_loss": -12.276761054992676, "global_step": 438817, "epoch": 2612} {"train_loss": -12.168902397155762, "global_step": 438818, "epoch": 2612} {"train_loss": -12.221525192260742, "global_step": 438819, "epoch": 2612} {"train_loss": -12.363231658935547, "global_step": 438820, "epoch": 2612} {"train_loss": -11.576223373413086, "global_step": 438821, "epoch": 2612} {"train_loss": -12.594703674316406, "global_step": 438822, "epoch": 2612} {"train_loss": -11.397658348083496, "global_step": 438823, "epoch": 2612} {"train_loss": -12.309455871582031, "global_step": 438824, "epoch": 2612} {"train_loss": -11.70695686340332, "global_step": 438825, "epoch": 2612} {"train_loss": -11.866144180297852, "global_step": 438826, "epoch": 2612} {"train_loss": -11.358777046203613, "global_step": 438827, "epoch": 2612} {"train_loss": -12.175272941589355, "global_step": 438828, "epoch": 2612} {"train_loss": -11.386040687561035, "global_step": 438829, "epoch": 2612} {"train_loss": -12.276469230651855, "global_step": 438830, "epoch": 2612} {"train_loss": -12.221522331237793, "global_step": 438831, "epoch": 2612} {"train_loss": -11.558661460876465, "global_step": 438832, "epoch": 2612} {"train_loss": -11.92931079864502, "global_step": 438833, "epoch": 2612} {"train_loss": -11.351186752319336, "global_step": 438834, "epoch": 2612} {"train_loss": -10.141416549682617, "global_step": 438835, "epoch": 2612} {"train_loss": -11.5018892288208, "global_step": 438836, "epoch": 2612} {"train_loss": -10.744110107421875, "global_step": 438837, "epoch": 2612} {"train_loss": -9.107687950134277, "global_step": 438838, "epoch": 2612} {"train_loss": -9.461591720581055, "global_step": 438839, "epoch": 2612} {"train_loss": -9.133382797241211, "global_step": 438840, "epoch": 2612} {"train_loss": -10.830413818359375, "global_step": 438841, "epoch": 2612} {"train_loss": -9.020818710327148, "global_step": 438842, "epoch": 2612} {"train_loss": -10.602483749389648, "global_step": 438843, "epoch": 2612} {"train_loss": -8.942728042602539, "global_step": 438844, "epoch": 2612} {"train_loss": -8.381620407104492, "global_step": 438845, "epoch": 2612} {"train_loss": -8.994062423706055, "global_step": 438846, "epoch": 2612} {"train_loss": -9.940444946289062, "global_step": 438847, "epoch": 2612} {"train_loss": -8.438596725463867, "global_step": 438848, "epoch": 2612} {"train_loss": -10.112180709838867, "global_step": 438849, "epoch": 2612} {"train_loss": -10.369481086730957, "global_step": 438850, "epoch": 2612} {"train_loss": -9.752190589904785, "global_step": 438851, "epoch": 2612} {"train_loss": -8.839204788208008, "global_step": 438852, "epoch": 2612} {"train_loss": -9.851062774658203, "global_step": 438853, "epoch": 2612} {"train_loss": -11.336912155151367, "global_step": 438854, "epoch": 2612} {"train_loss": -9.791200637817383, "global_step": 438855, "epoch": 2612} {"train_loss": -11.427538871765137, "global_step": 438856, "epoch": 2612} {"train_loss": -10.378050804138184, "global_step": 438857, "epoch": 2612} {"train_loss": -11.64138412475586, "global_step": 438858, "epoch": 2612} {"train_loss": -10.451337814331055, "global_step": 438859, "epoch": 2612} {"train_loss": -11.794729232788086, "global_step": 438860, "epoch": 2612} {"train_loss": -11.06856918334961, "global_step": 438861, "epoch": 2612} {"train_loss": -11.919158935546875, "global_step": 438862, "epoch": 2612} {"train_loss": -11.033586502075195, "global_step": 438863, "epoch": 2612} {"train_loss": -12.048551559448242, "global_step": 438864, "epoch": 2612} {"train_loss": -11.190631866455078, "global_step": 438865, "epoch": 2612} {"train_loss": -12.123950958251953, "global_step": 438866, "epoch": 2612} {"train_loss": -11.36768913269043, "global_step": 438867, "epoch": 2612} {"train_loss": -11.97227668762207, "global_step": 438868, "epoch": 2612} {"train_loss": -11.795759201049805, "global_step": 438869, "epoch": 2612} {"train_loss": -12.025874137878418, "global_step": 438870, "epoch": 2612} {"train_loss": -11.459199905395508, "global_step": 438871, "epoch": 2612} {"train_loss": -11.93597412109375, "global_step": 438872, "epoch": 2612} {"train_loss": -11.44974136352539, "global_step": 438873, "epoch": 2612} {"train_loss": -12.033893585205078, "global_step": 438874, "epoch": 2612} {"train_loss": -12.07534408569336, "global_step": 438875, "epoch": 2612} {"train_loss": -12.21461009979248, "global_step": 438876, "epoch": 2612} {"train_loss": -11.734643936157227, "global_step": 438877, "epoch": 2612} {"train_loss": -12.126320838928223, "global_step": 438878, "epoch": 2612} {"train_loss": -12.051177978515625, "global_step": 438879, "epoch": 2612} {"train_loss": -12.358894348144531, "global_step": 438880, "epoch": 2612} {"train_loss": -12.297531127929688, "global_step": 438881, "epoch": 2612} {"train_loss": -12.120063781738281, "global_step": 438882, "epoch": 2612} {"train_loss": -11.937917709350586, "global_step": 438883, "epoch": 2612} {"train_loss": -12.358562469482422, "global_step": 438884, "epoch": 2612} {"train_loss": -11.754847526550293, "global_step": 438885, "epoch": 2612} {"train_loss": -12.228693008422852, "global_step": 438886, "epoch": 2612} {"train_loss": -11.868124961853027, "global_step": 438887, "epoch": 2612} {"train_loss": -12.380412101745605, "global_step": 438888, "epoch": 2612} {"train_loss": -12.433883666992188, "global_step": 438889, "epoch": 2612} {"train_loss": -12.282403945922852, "global_step": 438890, "epoch": 2612} {"train_loss": -12.594493865966797, "global_step": 438891, "epoch": 2612} {"train_loss": -12.410048484802246, "global_step": 438892, "epoch": 2612} {"train_loss": -12.538114547729492, "global_step": 438893, "epoch": 2612} {"train_loss": -12.34522819519043, "global_step": 438894, "epoch": 2612} {"train_loss": -12.464487075805664, "global_step": 438895, "epoch": 2612} {"train_loss": -12.407100677490234, "global_step": 438896, "epoch": 2612} {"train_loss": -12.526159286499023, "global_step": 438897, "epoch": 2612} {"train_loss": -12.463008880615234, "global_step": 438898, "epoch": 2612} {"train_loss": -12.552000045776367, "global_step": 438899, "epoch": 2612} {"train_loss": -12.29658317565918, "global_step": 438900, "epoch": 2612} {"train_loss": -12.430121421813965, "global_step": 438901, "epoch": 2612} {"train_loss": -12.640503883361816, "global_step": 438902, "epoch": 2612} {"train_loss": -12.661370277404785, "global_step": 438903, "epoch": 2612} {"train_loss": -12.510530471801758, "global_step": 438904, "epoch": 2612} {"train_loss": -12.662338256835938, "global_step": 438905, "epoch": 2612} {"train_loss": -12.648375511169434, "global_step": 438906, "epoch": 2612} {"train_loss": -12.416614532470703, "global_step": 438907, "epoch": 2612} {"train_loss": -12.695770263671875, "global_step": 438908, "epoch": 2612} {"train_loss": -12.599136352539062, "global_step": 438909, "epoch": 2612} {"train_loss": -12.738142013549805, "global_step": 438910, "epoch": 2612} {"train_loss": -12.709733963012695, "global_step": 438911, "epoch": 2612} {"train_loss": -12.789451599121094, "global_step": 438912, "epoch": 2612} {"train_loss": -12.824557304382324, "global_step": 438913, "epoch": 2612} {"train_loss": -12.584217071533203, "global_step": 438914, "epoch": 2612} {"train_loss": -12.50212287902832, "global_step": 438915, "epoch": 2612} {"train_loss": -12.816398620605469, "global_step": 438916, "epoch": 2612} {"train_loss": -12.552334785461426, "global_step": 438917, "epoch": 2612} {"train_loss": -12.648880958557129, "global_step": 438918, "epoch": 2612} {"train_loss": -12.761175155639648, "global_step": 438919, "epoch": 2612} {"train_loss": -12.579347610473633, "global_step": 438920, "epoch": 2612} {"train_loss": -12.808243751525879, "global_step": 438921, "epoch": 2612} {"train_loss": -12.535377502441406, "global_step": 438922, "epoch": 2612} {"train_loss": -12.661888122558594, "global_step": 438923, "epoch": 2612} {"train_loss": -12.65302562713623, "global_step": 438924, "epoch": 2612} {"train_loss": -12.86093521118164, "global_step": 438925, "epoch": 2612} {"train_loss": -12.76632308959961, "global_step": 438926, "epoch": 2612} {"train_loss": -12.485919952392578, "global_step": 438927, "epoch": 2612} {"train_loss": -12.355792999267578, "global_step": 438928, "epoch": 2612} {"train_loss": -12.693845748901367, "global_step": 438929, "epoch": 2612} {"train_loss": -12.380146980285645, "global_step": 438930, "epoch": 2612} {"train_loss": -12.376108169555664, "global_step": 438931, "epoch": 2612} {"train_loss": -12.12672233581543, "global_step": 438932, "epoch": 2612} {"train_loss": -12.406234741210938, "global_step": 438933, "epoch": 2612} {"train_loss": -12.019986152648926, "global_step": 438934, "epoch": 2612} {"train_loss": -12.22260856628418, "global_step": 438935, "epoch": 2612} {"train_loss": -12.388406753540039, "global_step": 438936, "epoch": 2612} {"train_loss": -12.518714904785156, "global_step": 438937, "epoch": 2612} {"train_loss": -12.037367820739746, "global_step": 438938, "epoch": 2612} {"train_loss": -12.45418643951416, "global_step": 438939, "epoch": 2612} {"train_loss": -12.39228630065918, "global_step": 438940, "epoch": 2612} {"train_loss": -11.962260246276855, "global_step": 438941, "epoch": 2612} {"train_loss": -12.307744979858398, "global_step": 438942, "epoch": 2612} {"train_loss": -12.538313865661621, "global_step": 438943, "epoch": 2612} {"train_loss": -12.172043800354004, "global_step": 438944, "epoch": 2612} {"train_loss": -11.315032958984375, "global_step": 438945, "epoch": 2612} {"train_loss": -12.329102516174316, "global_step": 438946, "epoch": 2612} {"train_loss": -12.353126525878906, "global_step": 438947, "epoch": 2612} {"train_loss": -12.1151762008667, "global_step": 438948, "epoch": 2612} {"train_loss": -11.723751068115234, "global_step": 438949, "epoch": 2612} {"train_loss": -12.214312553405762, "global_step": 438950, "epoch": 2612} {"train_loss": -11.281503677368164, "global_step": 438951, "epoch": 2612} {"train_loss": -12.182619094848633, "global_step": 438952, "epoch": 2612} {"train_loss": -11.774789810180664, "global_step": 438953, "epoch": 2612} {"train_loss": -11.21145248413086, "global_step": 438954, "epoch": 2612} {"train_loss": -11.158563613891602, "global_step": 438955, "epoch": 2612} {"train_loss": -11.919477462768555, "global_step": 438956, "epoch": 2612} {"train_loss": -9.405464172363281, "global_step": 438957, "epoch": 2612} {"train_loss": -10.491456985473633, "global_step": 438958, "epoch": 2612} {"train_loss": -10.032207489013672, "global_step": 438959, "epoch": 2612} {"train_loss": -11.673873901367188, "global_step": 438960, "epoch": 2612} {"train_loss": -10.929738998413086, "global_step": 438961, "epoch": 2612} {"train_loss": -10.5835599899292, "global_step": 438962, "epoch": 2612} {"train_loss": -11.311633110046387, "global_step": 438963, "epoch": 2612} {"train_loss": -11.568799018859863, "global_step": 438964, "epoch": 2612} {"train_loss": -11.332307815551758, "global_step": 438965, "epoch": 2612} {"train_loss": -11.199514389038086, "global_step": 438966, "epoch": 2612} {"train_loss": -11.966240882873535, "global_step": 438967, "epoch": 2612} {"train_loss": -11.070918083190918, "global_step": 438968, "epoch": 2612} {"train_loss": -12.219552993774414, "global_step": 438969, "epoch": 2612} {"train_loss": -11.42235279083252, "global_step": 438970, "epoch": 2612} {"train_loss": -11.17605209350586, "global_step": 438971, "epoch": 2612} {"train_loss": -11.323193550109863, "global_step": 438972, "epoch": 2612} {"train_loss": -11.744396209716797, "global_step": 438973, "epoch": 2612} {"train_loss": -11.258523941040039, "global_step": 438974, "epoch": 2612} {"train_loss": -11.280705451965332, "global_step": 438975, "epoch": 2612} {"train_loss": -11.765883445739746, "global_step": 438976, "epoch": 2612} {"train_loss": -11.151592254638672, "global_step": 438977, "epoch": 2612} {"train_loss": -11.077861785888672, "global_step": 438978, "epoch": 2612} {"train_loss": -12.07311725616455, "global_step": 438979, "epoch": 2612} {"train_loss": -11.150489807128906, "global_step": 438980, "epoch": 2612} {"train_loss": -11.176458358764648, "global_step": 438981, "epoch": 2612} {"train_loss": -12.100709915161133, "global_step": 438982, "epoch": 2612} {"train_loss": -11.704642903237115, "global_step": 438983, "epoch": 2612, "val_loss": 306817.3125} {"train_loss": -12.26122760772705, "global_step": 438984, "epoch": 2613} {"train_loss": -11.444730758666992, "global_step": 438985, "epoch": 2613} {"train_loss": -12.39028549194336, "global_step": 438986, "epoch": 2613} {"train_loss": -12.230997085571289, "global_step": 438987, "epoch": 2613} {"train_loss": -12.22504997253418, "global_step": 438988, "epoch": 2613} {"train_loss": -12.267562866210938, "global_step": 438989, "epoch": 2613} {"train_loss": -12.314017295837402, "global_step": 438990, "epoch": 2613} {"train_loss": -12.004474639892578, "global_step": 438991, "epoch": 2613} {"train_loss": -12.294649124145508, "global_step": 438992, "epoch": 2613} {"train_loss": -12.037647247314453, "global_step": 438993, "epoch": 2613} {"train_loss": -12.361929893493652, "global_step": 438994, "epoch": 2613} {"train_loss": -12.146761894226074, "global_step": 438995, "epoch": 2613} {"train_loss": -12.255352973937988, "global_step": 438996, "epoch": 2613} {"train_loss": -11.778529167175293, "global_step": 438997, "epoch": 2613} {"train_loss": -12.129990577697754, "global_step": 438998, "epoch": 2613} {"train_loss": -12.592453002929688, "global_step": 438999, "epoch": 2613} {"train_loss": -12.070638656616211, "global_step": 439000, "epoch": 2613} {"train_loss": -12.603336334228516, "global_step": 439001, "epoch": 2613} {"train_loss": -11.981573104858398, "global_step": 439002, "epoch": 2613} {"train_loss": -12.609201431274414, "global_step": 439003, "epoch": 2613} {"train_loss": -12.369928359985352, "global_step": 439004, "epoch": 2613} {"train_loss": -12.28060531616211, "global_step": 439005, "epoch": 2613} {"train_loss": -12.227283477783203, "global_step": 439006, "epoch": 2613} {"train_loss": -12.394645690917969, "global_step": 439007, "epoch": 2613} {"train_loss": -12.24199390411377, "global_step": 439008, "epoch": 2613} {"train_loss": -12.645750045776367, "global_step": 439009, "epoch": 2613} {"train_loss": -12.487112045288086, "global_step": 439010, "epoch": 2613} {"train_loss": -12.418524742126465, "global_step": 439011, "epoch": 2613} {"train_loss": -12.616692543029785, "global_step": 439012, "epoch": 2613} {"train_loss": -12.472909927368164, "global_step": 439013, "epoch": 2613} {"train_loss": -12.610502243041992, "global_step": 439014, "epoch": 2613} {"train_loss": -12.582696914672852, "global_step": 439015, "epoch": 2613} {"train_loss": -12.63723373413086, "global_step": 439016, "epoch": 2613} {"train_loss": -12.692301750183105, "global_step": 439017, "epoch": 2613} {"train_loss": -12.534954071044922, "global_step": 439018, "epoch": 2613} {"train_loss": -12.4157133102417, "global_step": 439019, "epoch": 2613} {"train_loss": -12.72055435180664, "global_step": 439020, "epoch": 2613} {"train_loss": -12.596982955932617, "global_step": 439021, "epoch": 2613} {"train_loss": -12.55647087097168, "global_step": 439022, "epoch": 2613} {"train_loss": -12.489717483520508, "global_step": 439023, "epoch": 2613} {"train_loss": -12.794967651367188, "global_step": 439024, "epoch": 2613} {"train_loss": -12.78359317779541, "global_step": 439025, "epoch": 2613} {"train_loss": -12.819737434387207, "global_step": 439026, "epoch": 2613} {"train_loss": -12.784111976623535, "global_step": 439027, "epoch": 2613} {"train_loss": -12.704362869262695, "global_step": 439028, "epoch": 2613} {"train_loss": -12.691963195800781, "global_step": 439029, "epoch": 2613} {"train_loss": -12.885602951049805, "global_step": 439030, "epoch": 2613} {"train_loss": -12.850242614746094, "global_step": 439031, "epoch": 2613} {"train_loss": -12.872638702392578, "global_step": 439032, "epoch": 2613} {"train_loss": -12.402034759521484, "global_step": 439033, "epoch": 2613} {"train_loss": -12.6077880859375, "global_step": 439034, "epoch": 2613} {"train_loss": -12.505825996398926, "global_step": 439035, "epoch": 2613} {"train_loss": -12.840317726135254, "global_step": 439036, "epoch": 2613} {"train_loss": -12.73740005493164, "global_step": 439037, "epoch": 2613} {"train_loss": -12.893742561340332, "global_step": 439038, "epoch": 2613} {"train_loss": -12.681327819824219, "global_step": 439039, "epoch": 2613} {"train_loss": -12.732011795043945, "global_step": 439040, "epoch": 2613} {"train_loss": -12.755789756774902, "global_step": 439041, "epoch": 2613} {"train_loss": -12.675034523010254, "global_step": 439042, "epoch": 2613} {"train_loss": -12.485700607299805, "global_step": 439043, "epoch": 2613} {"train_loss": -12.372387886047363, "global_step": 439044, "epoch": 2613} {"train_loss": -12.229240417480469, "global_step": 439045, "epoch": 2613} {"train_loss": -12.817907333374023, "global_step": 439046, "epoch": 2613} {"train_loss": -12.664531707763672, "global_step": 439047, "epoch": 2613} {"train_loss": -12.8623046875, "global_step": 439048, "epoch": 2613} {"train_loss": -12.401153564453125, "global_step": 439049, "epoch": 2613} {"train_loss": -11.736908912658691, "global_step": 439050, "epoch": 2613} {"train_loss": -12.01400375366211, "global_step": 439051, "epoch": 2613} {"train_loss": -12.490751266479492, "global_step": 439052, "epoch": 2613} {"train_loss": -11.909906387329102, "global_step": 439053, "epoch": 2613} {"train_loss": -11.631621360778809, "global_step": 439054, "epoch": 2613} {"train_loss": -12.679765701293945, "global_step": 439055, "epoch": 2613} {"train_loss": -11.61280345916748, "global_step": 439056, "epoch": 2613} {"train_loss": -11.206735610961914, "global_step": 439057, "epoch": 2613} {"train_loss": -11.35911750793457, "global_step": 439058, "epoch": 2613} {"train_loss": -12.432244300842285, "global_step": 439059, "epoch": 2613} {"train_loss": -11.142841339111328, "global_step": 439060, "epoch": 2613} {"train_loss": -10.934409141540527, "global_step": 439061, "epoch": 2613} {"train_loss": -11.260725975036621, "global_step": 439062, "epoch": 2613} {"train_loss": -9.119413375854492, "global_step": 439063, "epoch": 2613} {"train_loss": -10.745166778564453, "global_step": 439064, "epoch": 2613} {"train_loss": -10.019571304321289, "global_step": 439065, "epoch": 2613} {"train_loss": -10.827159881591797, "global_step": 439066, "epoch": 2613} {"train_loss": -10.256633758544922, "global_step": 439067, "epoch": 2613} {"train_loss": -11.321258544921875, "global_step": 439068, "epoch": 2613} {"train_loss": -10.409168243408203, "global_step": 439069, "epoch": 2613} {"train_loss": -9.588061332702637, "global_step": 439070, "epoch": 2613} {"train_loss": -11.826851844787598, "global_step": 439071, "epoch": 2613} {"train_loss": -10.705322265625, "global_step": 439072, "epoch": 2613} {"train_loss": -10.596246719360352, "global_step": 439073, "epoch": 2613} {"train_loss": -12.130653381347656, "global_step": 439074, "epoch": 2613} {"train_loss": -10.472064971923828, "global_step": 439075, "epoch": 2613} {"train_loss": -11.942639350891113, "global_step": 439076, "epoch": 2613} {"train_loss": -10.291820526123047, "global_step": 439077, "epoch": 2613} {"train_loss": -11.50933837890625, "global_step": 439078, "epoch": 2613} {"train_loss": -11.04896354675293, "global_step": 439079, "epoch": 2613} {"train_loss": -10.830591201782227, "global_step": 439080, "epoch": 2613} {"train_loss": -12.07847785949707, "global_step": 439081, "epoch": 2613} {"train_loss": -10.49370002746582, "global_step": 439082, "epoch": 2613} {"train_loss": -12.188081741333008, "global_step": 439083, "epoch": 2613} {"train_loss": -10.994888305664062, "global_step": 439084, "epoch": 2613} {"train_loss": -11.46030330657959, "global_step": 439085, "epoch": 2613} {"train_loss": -11.796138763427734, "global_step": 439086, "epoch": 2613} {"train_loss": -11.236698150634766, "global_step": 439087, "epoch": 2613} {"train_loss": -11.903764724731445, "global_step": 439088, "epoch": 2613} {"train_loss": -11.731040954589844, "global_step": 439089, "epoch": 2613} {"train_loss": -11.068371772766113, "global_step": 439090, "epoch": 2613} {"train_loss": -11.440924644470215, "global_step": 439091, "epoch": 2613} {"train_loss": -11.061939239501953, "global_step": 439092, "epoch": 2613} {"train_loss": -11.948500633239746, "global_step": 439093, "epoch": 2613} {"train_loss": -11.322784423828125, "global_step": 439094, "epoch": 2613} {"train_loss": -10.849424362182617, "global_step": 439095, "epoch": 2613} {"train_loss": -11.161285400390625, "global_step": 439096, "epoch": 2613} {"train_loss": -11.062154769897461, "global_step": 439097, "epoch": 2613} {"train_loss": -11.183235168457031, "global_step": 439098, "epoch": 2613} {"train_loss": -11.945956230163574, "global_step": 439099, "epoch": 2613} {"train_loss": -10.810007095336914, "global_step": 439100, "epoch": 2613} {"train_loss": -11.43172836303711, "global_step": 439101, "epoch": 2613} {"train_loss": -10.863155364990234, "global_step": 439102, "epoch": 2613} {"train_loss": -10.821388244628906, "global_step": 439103, "epoch": 2613} {"train_loss": -10.722620010375977, "global_step": 439104, "epoch": 2613} {"train_loss": -11.268807411193848, "global_step": 439105, "epoch": 2613} {"train_loss": -11.035941123962402, "global_step": 439106, "epoch": 2613} {"train_loss": -11.302891731262207, "global_step": 439107, "epoch": 2613} {"train_loss": -11.902910232543945, "global_step": 439108, "epoch": 2613} {"train_loss": -11.793998718261719, "global_step": 439109, "epoch": 2613} {"train_loss": -11.785628318786621, "global_step": 439110, "epoch": 2613} {"train_loss": -12.046319007873535, "global_step": 439111, "epoch": 2613} {"train_loss": -11.777791976928711, "global_step": 439112, "epoch": 2613} {"train_loss": -11.984720230102539, "global_step": 439113, "epoch": 2613} {"train_loss": -12.168474197387695, "global_step": 439114, "epoch": 2613} {"train_loss": -12.03474235534668, "global_step": 439115, "epoch": 2613} {"train_loss": -11.962355613708496, "global_step": 439116, "epoch": 2613} {"train_loss": -11.932518005371094, "global_step": 439117, "epoch": 2613} {"train_loss": -12.254953384399414, "global_step": 439118, "epoch": 2613} {"train_loss": -11.985074043273926, "global_step": 439119, "epoch": 2613} {"train_loss": -12.181204795837402, "global_step": 439120, "epoch": 2613} {"train_loss": -12.095008850097656, "global_step": 439121, "epoch": 2613} {"train_loss": -12.361490249633789, "global_step": 439122, "epoch": 2613} {"train_loss": -12.123492240905762, "global_step": 439123, "epoch": 2613} {"train_loss": -12.288228988647461, "global_step": 439124, "epoch": 2613} {"train_loss": -12.22317123413086, "global_step": 439125, "epoch": 2613} {"train_loss": -12.057531356811523, "global_step": 439126, "epoch": 2613} {"train_loss": -12.554729461669922, "global_step": 439127, "epoch": 2613} {"train_loss": -12.456551551818848, "global_step": 439128, "epoch": 2613} {"train_loss": -12.37559700012207, "global_step": 439129, "epoch": 2613} {"train_loss": -12.388311386108398, "global_step": 439130, "epoch": 2613} {"train_loss": -12.079322814941406, "global_step": 439131, "epoch": 2613} {"train_loss": -12.4970703125, "global_step": 439132, "epoch": 2613} {"train_loss": -12.140998840332031, "global_step": 439133, "epoch": 2613} {"train_loss": -12.34697151184082, "global_step": 439134, "epoch": 2613} {"train_loss": -12.217029571533203, "global_step": 439135, "epoch": 2613} {"train_loss": -12.477091789245605, "global_step": 439136, "epoch": 2613} {"train_loss": -12.438240051269531, "global_step": 439137, "epoch": 2613} {"train_loss": -12.444601058959961, "global_step": 439138, "epoch": 2613} {"train_loss": -12.644218444824219, "global_step": 439139, "epoch": 2613} {"train_loss": -12.458160400390625, "global_step": 439140, "epoch": 2613} {"train_loss": -12.463005065917969, "global_step": 439141, "epoch": 2613} {"train_loss": -12.550930976867676, "global_step": 439142, "epoch": 2613} {"train_loss": -12.60698127746582, "global_step": 439143, "epoch": 2613} {"train_loss": -12.71451187133789, "global_step": 439144, "epoch": 2613} {"train_loss": -12.552751541137695, "global_step": 439145, "epoch": 2613} {"train_loss": -12.691712379455566, "global_step": 439146, "epoch": 2613} {"train_loss": -12.472466468811035, "global_step": 439147, "epoch": 2613} {"train_loss": -12.764957427978516, "global_step": 439148, "epoch": 2613} {"train_loss": -12.533979415893555, "global_step": 439149, "epoch": 2613} {"train_loss": -12.315166473388672, "global_step": 439150, "epoch": 2613} {"train_loss": -11.99673240525382, "global_step": 439151, "epoch": 2613, "val_loss": 312308.28125} {"train_loss": -12.701763153076172, "global_step": 439152, "epoch": 2614} {"train_loss": -12.564248085021973, "global_step": 439153, "epoch": 2614} {"train_loss": -12.584228515625, "global_step": 439154, "epoch": 2614} {"train_loss": -12.70359992980957, "global_step": 439155, "epoch": 2614} {"train_loss": -12.731287002563477, "global_step": 439156, "epoch": 2614} {"train_loss": -12.744527816772461, "global_step": 439157, "epoch": 2614} {"train_loss": -12.656243324279785, "global_step": 439158, "epoch": 2614} {"train_loss": -12.890432357788086, "global_step": 439159, "epoch": 2614} {"train_loss": -12.531903266906738, "global_step": 439160, "epoch": 2614} {"train_loss": -12.834747314453125, "global_step": 439161, "epoch": 2614} {"train_loss": -12.676311492919922, "global_step": 439162, "epoch": 2614} {"train_loss": -12.837970733642578, "global_step": 439163, "epoch": 2614} {"train_loss": -12.774701118469238, "global_step": 439164, "epoch": 2614} {"train_loss": -12.71386432647705, "global_step": 439165, "epoch": 2614} {"train_loss": -12.835350036621094, "global_step": 439166, "epoch": 2614} {"train_loss": -12.571159362792969, "global_step": 439167, "epoch": 2614} {"train_loss": -12.489614486694336, "global_step": 439168, "epoch": 2614} {"train_loss": -12.748420715332031, "global_step": 439169, "epoch": 2614} {"train_loss": -12.832595825195312, "global_step": 439170, "epoch": 2614} {"train_loss": -12.63652229309082, "global_step": 439171, "epoch": 2614} {"train_loss": -12.811844825744629, "global_step": 439172, "epoch": 2614} {"train_loss": -12.762914657592773, "global_step": 439173, "epoch": 2614} {"train_loss": -12.72553825378418, "global_step": 439174, "epoch": 2614} {"train_loss": -12.98995590209961, "global_step": 439175, "epoch": 2614} {"train_loss": -12.673314094543457, "global_step": 439176, "epoch": 2614} {"train_loss": -12.898212432861328, "global_step": 439177, "epoch": 2614} {"train_loss": -12.85632610321045, "global_step": 439178, "epoch": 2614} {"train_loss": -12.916604995727539, "global_step": 439179, "epoch": 2614} {"train_loss": -12.525981903076172, "global_step": 439180, "epoch": 2614} {"train_loss": -12.88638687133789, "global_step": 439181, "epoch": 2614} {"train_loss": -12.444742202758789, "global_step": 439182, "epoch": 2614} {"train_loss": -12.661334991455078, "global_step": 439183, "epoch": 2614} {"train_loss": -12.56319808959961, "global_step": 439184, "epoch": 2614} {"train_loss": -12.693065643310547, "global_step": 439185, "epoch": 2614} {"train_loss": -12.419485092163086, "global_step": 439186, "epoch": 2614} {"train_loss": -12.466207504272461, "global_step": 439187, "epoch": 2614} {"train_loss": -12.827659606933594, "global_step": 439188, "epoch": 2614} {"train_loss": -12.741292953491211, "global_step": 439189, "epoch": 2614} {"train_loss": -12.672569274902344, "global_step": 439190, "epoch": 2614} {"train_loss": -12.883702278137207, "global_step": 439191, "epoch": 2614} {"train_loss": -12.88817024230957, "global_step": 439192, "epoch": 2614} {"train_loss": -12.983465194702148, "global_step": 439193, "epoch": 2614} {"train_loss": -13.081934928894043, "global_step": 439194, "epoch": 2614} {"train_loss": -12.764667510986328, "global_step": 439195, "epoch": 2614} {"train_loss": -12.413437843322754, "global_step": 439196, "epoch": 2614} {"train_loss": -13.04410171508789, "global_step": 439197, "epoch": 2614} {"train_loss": -12.335189819335938, "global_step": 439198, "epoch": 2614} {"train_loss": -11.062750816345215, "global_step": 439199, "epoch": 2614} {"train_loss": -12.412878036499023, "global_step": 439200, "epoch": 2614} {"train_loss": -12.203691482543945, "global_step": 439201, "epoch": 2614} {"train_loss": -11.449591636657715, "global_step": 439202, "epoch": 2614} {"train_loss": -10.483111381530762, "global_step": 439203, "epoch": 2614} {"train_loss": -12.254276275634766, "global_step": 439204, "epoch": 2614} {"train_loss": -10.632699012756348, "global_step": 439205, "epoch": 2614} {"train_loss": -10.162124633789062, "global_step": 439206, "epoch": 2614} {"train_loss": -9.983991622924805, "global_step": 439207, "epoch": 2614} {"train_loss": -10.245760917663574, "global_step": 439208, "epoch": 2614} {"train_loss": -10.994525909423828, "global_step": 439209, "epoch": 2614} {"train_loss": -11.318893432617188, "global_step": 439210, "epoch": 2614} {"train_loss": -9.660797119140625, "global_step": 439211, "epoch": 2614} {"train_loss": -9.884881973266602, "global_step": 439212, "epoch": 2614} {"train_loss": -11.372751235961914, "global_step": 439213, "epoch": 2614} {"train_loss": -9.966262817382812, "global_step": 439214, "epoch": 2614} {"train_loss": -10.36336898803711, "global_step": 439215, "epoch": 2614} {"train_loss": -11.33594036102295, "global_step": 439216, "epoch": 2614} {"train_loss": -9.985391616821289, "global_step": 439217, "epoch": 2614} {"train_loss": -11.733986854553223, "global_step": 439218, "epoch": 2614} {"train_loss": -9.847942352294922, "global_step": 439219, "epoch": 2614} {"train_loss": -11.266834259033203, "global_step": 439220, "epoch": 2614} {"train_loss": -10.697416305541992, "global_step": 439221, "epoch": 2614} {"train_loss": -10.928840637207031, "global_step": 439222, "epoch": 2614} {"train_loss": -10.56767749786377, "global_step": 439223, "epoch": 2614} {"train_loss": -10.203049659729004, "global_step": 439224, "epoch": 2614} {"train_loss": -9.929357528686523, "global_step": 439225, "epoch": 2614} {"train_loss": -11.532541275024414, "global_step": 439226, "epoch": 2614} {"train_loss": -9.256284713745117, "global_step": 439227, "epoch": 2614} {"train_loss": -9.921751022338867, "global_step": 439228, "epoch": 2614} {"train_loss": -8.996675491333008, "global_step": 439229, "epoch": 2614} {"train_loss": -10.860452651977539, "global_step": 439230, "epoch": 2614} {"train_loss": -9.458574295043945, "global_step": 439231, "epoch": 2614} {"train_loss": -11.631355285644531, "global_step": 439232, "epoch": 2614} {"train_loss": -9.656209945678711, "global_step": 439233, "epoch": 2614} {"train_loss": -11.01326847076416, "global_step": 439234, "epoch": 2614} {"train_loss": -10.403599739074707, "global_step": 439235, "epoch": 2614} {"train_loss": -10.334342956542969, "global_step": 439236, "epoch": 2614} {"train_loss": -11.234109878540039, "global_step": 439237, "epoch": 2614} {"train_loss": -10.794349670410156, "global_step": 439238, "epoch": 2614} {"train_loss": -11.281901359558105, "global_step": 439239, "epoch": 2614} {"train_loss": -10.894388198852539, "global_step": 439240, "epoch": 2614} {"train_loss": -11.528242111206055, "global_step": 439241, "epoch": 2614} {"train_loss": -11.913299560546875, "global_step": 439242, "epoch": 2614} {"train_loss": -11.453757286071777, "global_step": 439243, "epoch": 2614} {"train_loss": -11.031493186950684, "global_step": 439244, "epoch": 2614} {"train_loss": -11.587111473083496, "global_step": 439245, "epoch": 2614} {"train_loss": -11.131526947021484, "global_step": 439246, "epoch": 2614} {"train_loss": -11.94605827331543, "global_step": 439247, "epoch": 2614} {"train_loss": -11.900845527648926, "global_step": 439248, "epoch": 2614} {"train_loss": -11.313591003417969, "global_step": 439249, "epoch": 2614} {"train_loss": -11.67078971862793, "global_step": 439250, "epoch": 2614} {"train_loss": -11.792693138122559, "global_step": 439251, "epoch": 2614} {"train_loss": -11.777412414550781, "global_step": 439252, "epoch": 2614} {"train_loss": -11.989654541015625, "global_step": 439253, "epoch": 2614} {"train_loss": -11.958892822265625, "global_step": 439254, "epoch": 2614} {"train_loss": -12.04965591430664, "global_step": 439255, "epoch": 2614} {"train_loss": -12.225723266601562, "global_step": 439256, "epoch": 2614} {"train_loss": -11.807490348815918, "global_step": 439257, "epoch": 2614} {"train_loss": -11.959538459777832, "global_step": 439258, "epoch": 2614} {"train_loss": -12.009012222290039, "global_step": 439259, "epoch": 2614} {"train_loss": -11.915191650390625, "global_step": 439260, "epoch": 2614} {"train_loss": -12.2932767868042, "global_step": 439261, "epoch": 2614} {"train_loss": -12.181791305541992, "global_step": 439262, "epoch": 2614} {"train_loss": -12.173739433288574, "global_step": 439263, "epoch": 2614} {"train_loss": -11.96884822845459, "global_step": 439264, "epoch": 2614} {"train_loss": -12.316730499267578, "global_step": 439265, "epoch": 2614} {"train_loss": -11.910726547241211, "global_step": 439266, "epoch": 2614} {"train_loss": -12.336567878723145, "global_step": 439267, "epoch": 2614} {"train_loss": -12.204794883728027, "global_step": 439268, "epoch": 2614} {"train_loss": -12.268983840942383, "global_step": 439269, "epoch": 2614} {"train_loss": -12.324786186218262, "global_step": 439270, "epoch": 2614} {"train_loss": -12.605413436889648, "global_step": 439271, "epoch": 2614} {"train_loss": -12.147344589233398, "global_step": 439272, "epoch": 2614} {"train_loss": -12.42581558227539, "global_step": 439273, "epoch": 2614} {"train_loss": -12.500569343566895, "global_step": 439274, "epoch": 2614} {"train_loss": -12.181175231933594, "global_step": 439275, "epoch": 2614} {"train_loss": -12.375957489013672, "global_step": 439276, "epoch": 2614} {"train_loss": -12.423490524291992, "global_step": 439277, "epoch": 2614} {"train_loss": -12.193680763244629, "global_step": 439278, "epoch": 2614} {"train_loss": -12.173733711242676, "global_step": 439279, "epoch": 2614} {"train_loss": -12.362876892089844, "global_step": 439280, "epoch": 2614} {"train_loss": -12.118812561035156, "global_step": 439281, "epoch": 2614} {"train_loss": -12.012374877929688, "global_step": 439282, "epoch": 2614} {"train_loss": -12.274127006530762, "global_step": 439283, "epoch": 2614} {"train_loss": -12.15093994140625, "global_step": 439284, "epoch": 2614} {"train_loss": -12.288764953613281, "global_step": 439285, "epoch": 2614} {"train_loss": -12.374573707580566, "global_step": 439286, "epoch": 2614} {"train_loss": -12.4051513671875, "global_step": 439287, "epoch": 2614} {"train_loss": -12.381025314331055, "global_step": 439288, "epoch": 2614} {"train_loss": -12.446073532104492, "global_step": 439289, "epoch": 2614} {"train_loss": -12.336044311523438, "global_step": 439290, "epoch": 2614} {"train_loss": -12.471864700317383, "global_step": 439291, "epoch": 2614} {"train_loss": -12.623088836669922, "global_step": 439292, "epoch": 2614} {"train_loss": -12.301273345947266, "global_step": 439293, "epoch": 2614} {"train_loss": -12.458935737609863, "global_step": 439294, "epoch": 2614} {"train_loss": -12.47170639038086, "global_step": 439295, "epoch": 2614} {"train_loss": -12.197690963745117, "global_step": 439296, "epoch": 2614} {"train_loss": -12.227648735046387, "global_step": 439297, "epoch": 2614} {"train_loss": -12.44770622253418, "global_step": 439298, "epoch": 2614} {"train_loss": -12.464506149291992, "global_step": 439299, "epoch": 2614} {"train_loss": -12.630136489868164, "global_step": 439300, "epoch": 2614} {"train_loss": -12.420408248901367, "global_step": 439301, "epoch": 2614} {"train_loss": -12.623749732971191, "global_step": 439302, "epoch": 2614} {"train_loss": -12.622291564941406, "global_step": 439303, "epoch": 2614} {"train_loss": -12.302401542663574, "global_step": 439304, "epoch": 2614} {"train_loss": -12.499157905578613, "global_step": 439305, "epoch": 2614} {"train_loss": -12.590782165527344, "global_step": 439306, "epoch": 2614} {"train_loss": -12.418208122253418, "global_step": 439307, "epoch": 2614} {"train_loss": -12.738968849182129, "global_step": 439308, "epoch": 2614} {"train_loss": -12.785070419311523, "global_step": 439309, "epoch": 2614} {"train_loss": -12.742781639099121, "global_step": 439310, "epoch": 2614} {"train_loss": -12.603271484375, "global_step": 439311, "epoch": 2614} {"train_loss": -12.732678413391113, "global_step": 439312, "epoch": 2614} {"train_loss": -12.59365177154541, "global_step": 439313, "epoch": 2614} {"train_loss": -12.60612678527832, "global_step": 439314, "epoch": 2614} {"train_loss": -12.651206970214844, "global_step": 439315, "epoch": 2614} {"train_loss": -12.647974967956543, "global_step": 439316, "epoch": 2614} {"train_loss": -12.793922424316406, "global_step": 439317, "epoch": 2614} {"train_loss": -12.85175609588623, "global_step": 439318, "epoch": 2614} {"train_loss": -11.985383533296131, "global_step": 439319, "epoch": 2614, "val_loss": 308768.5625} {"train_loss": -12.625971794128418, "global_step": 439320, "epoch": 2615} {"train_loss": -12.854743957519531, "global_step": 439321, "epoch": 2615} {"train_loss": -12.762659072875977, "global_step": 439322, "epoch": 2615} {"train_loss": -12.780341148376465, "global_step": 439323, "epoch": 2615} {"train_loss": -12.634353637695312, "global_step": 439324, "epoch": 2615} {"train_loss": -12.582632064819336, "global_step": 439325, "epoch": 2615} {"train_loss": -13.05921459197998, "global_step": 439326, "epoch": 2615} {"train_loss": -12.641088485717773, "global_step": 439327, "epoch": 2615} {"train_loss": -12.70527458190918, "global_step": 439328, "epoch": 2615} {"train_loss": -12.788131713867188, "global_step": 439329, "epoch": 2615} {"train_loss": -12.736551284790039, "global_step": 439330, "epoch": 2615} {"train_loss": -12.83675479888916, "global_step": 439331, "epoch": 2615} {"train_loss": -12.8843994140625, "global_step": 439332, "epoch": 2615} {"train_loss": -12.625408172607422, "global_step": 439333, "epoch": 2615} {"train_loss": -12.60545539855957, "global_step": 439334, "epoch": 2615} {"train_loss": -12.717729568481445, "global_step": 439335, "epoch": 2615} {"train_loss": -12.683494567871094, "global_step": 439336, "epoch": 2615} {"train_loss": -12.708261489868164, "global_step": 439337, "epoch": 2615} {"train_loss": -12.649377822875977, "global_step": 439338, "epoch": 2615} {"train_loss": -12.506303787231445, "global_step": 439339, "epoch": 2615} {"train_loss": -12.442155838012695, "global_step": 439340, "epoch": 2615} {"train_loss": -12.356728553771973, "global_step": 439341, "epoch": 2615} {"train_loss": -13.070167541503906, "global_step": 439342, "epoch": 2615} {"train_loss": -12.360745429992676, "global_step": 439343, "epoch": 2615} {"train_loss": -12.127662658691406, "global_step": 439344, "epoch": 2615} {"train_loss": -12.045467376708984, "global_step": 439345, "epoch": 2615} {"train_loss": -11.108137130737305, "global_step": 439346, "epoch": 2615} {"train_loss": -12.377930641174316, "global_step": 439347, "epoch": 2615} {"train_loss": -11.892528533935547, "global_step": 439348, "epoch": 2615} {"train_loss": -11.938377380371094, "global_step": 439349, "epoch": 2615} {"train_loss": -11.441022872924805, "global_step": 439350, "epoch": 2615} {"train_loss": -12.332008361816406, "global_step": 439351, "epoch": 2615} {"train_loss": -11.824960708618164, "global_step": 439352, "epoch": 2615} {"train_loss": -12.797178268432617, "global_step": 439353, "epoch": 2615} {"train_loss": -12.316547393798828, "global_step": 439354, "epoch": 2615} {"train_loss": -12.806127548217773, "global_step": 439355, "epoch": 2615} {"train_loss": -12.133480072021484, "global_step": 439356, "epoch": 2615} {"train_loss": -12.283571243286133, "global_step": 439357, "epoch": 2615} {"train_loss": -12.233244895935059, "global_step": 439358, "epoch": 2615} {"train_loss": -12.646063804626465, "global_step": 439359, "epoch": 2615} {"train_loss": -12.090675354003906, "global_step": 439360, "epoch": 2615} {"train_loss": -12.728961944580078, "global_step": 439361, "epoch": 2615} {"train_loss": -12.243882179260254, "global_step": 439362, "epoch": 2615} {"train_loss": -12.598758697509766, "global_step": 439363, "epoch": 2615} {"train_loss": -12.577430725097656, "global_step": 439364, "epoch": 2615} {"train_loss": -12.441835403442383, "global_step": 439365, "epoch": 2615} {"train_loss": -12.163658142089844, "global_step": 439366, "epoch": 2615} {"train_loss": -12.740419387817383, "global_step": 439367, "epoch": 2615} {"train_loss": -11.866459846496582, "global_step": 439368, "epoch": 2615} {"train_loss": -12.53329086303711, "global_step": 439369, "epoch": 2615} {"train_loss": -12.172149658203125, "global_step": 439370, "epoch": 2615} {"train_loss": -12.069404602050781, "global_step": 439371, "epoch": 2615} {"train_loss": -11.942121505737305, "global_step": 439372, "epoch": 2615} {"train_loss": -12.06594467163086, "global_step": 439373, "epoch": 2615} {"train_loss": -12.10365104675293, "global_step": 439374, "epoch": 2615} {"train_loss": -12.605131149291992, "global_step": 439375, "epoch": 2615} {"train_loss": -12.421882629394531, "global_step": 439376, "epoch": 2615} {"train_loss": -11.75296401977539, "global_step": 439377, "epoch": 2615} {"train_loss": -12.044149398803711, "global_step": 439378, "epoch": 2615} {"train_loss": -10.807573318481445, "global_step": 439379, "epoch": 2615} {"train_loss": -11.864263534545898, "global_step": 439380, "epoch": 2615} {"train_loss": -10.431121826171875, "global_step": 439381, "epoch": 2615} {"train_loss": -9.940272331237793, "global_step": 439382, "epoch": 2615} {"train_loss": -11.706949234008789, "global_step": 439383, "epoch": 2615} {"train_loss": -10.238834381103516, "global_step": 439384, "epoch": 2615} {"train_loss": -11.649380683898926, "global_step": 439385, "epoch": 2615} {"train_loss": -11.92510986328125, "global_step": 439386, "epoch": 2615} {"train_loss": -10.508698463439941, "global_step": 439387, "epoch": 2615} {"train_loss": -11.874714851379395, "global_step": 439388, "epoch": 2615} {"train_loss": -10.599123001098633, "global_step": 439389, "epoch": 2615} {"train_loss": -12.583995819091797, "global_step": 439390, "epoch": 2615} {"train_loss": -10.489136695861816, "global_step": 439391, "epoch": 2615} {"train_loss": -11.590925216674805, "global_step": 439392, "epoch": 2615} {"train_loss": -12.097042083740234, "global_step": 439393, "epoch": 2615} {"train_loss": -11.600421905517578, "global_step": 439394, "epoch": 2615} {"train_loss": -11.612226486206055, "global_step": 439395, "epoch": 2615} {"train_loss": -12.213357925415039, "global_step": 439396, "epoch": 2615} {"train_loss": -11.968046188354492, "global_step": 439397, "epoch": 2615} {"train_loss": -11.562628746032715, "global_step": 439398, "epoch": 2615} {"train_loss": -12.717395782470703, "global_step": 439399, "epoch": 2615} {"train_loss": -11.203542709350586, "global_step": 439400, "epoch": 2615} {"train_loss": -12.321097373962402, "global_step": 439401, "epoch": 2615} {"train_loss": -11.86863899230957, "global_step": 439402, "epoch": 2615} {"train_loss": -12.08719253540039, "global_step": 439403, "epoch": 2615} {"train_loss": -12.42011833190918, "global_step": 439404, "epoch": 2615} {"train_loss": -12.16346549987793, "global_step": 439405, "epoch": 2615} {"train_loss": -12.498374938964844, "global_step": 439406, "epoch": 2615} {"train_loss": -12.311763763427734, "global_step": 439407, "epoch": 2615} {"train_loss": -12.175345420837402, "global_step": 439408, "epoch": 2615} {"train_loss": -12.618863105773926, "global_step": 439409, "epoch": 2615} {"train_loss": -12.410531997680664, "global_step": 439410, "epoch": 2615} {"train_loss": -12.770675659179688, "global_step": 439411, "epoch": 2615} {"train_loss": -12.500652313232422, "global_step": 439412, "epoch": 2615} {"train_loss": -12.686272621154785, "global_step": 439413, "epoch": 2615} {"train_loss": -12.203923225402832, "global_step": 439414, "epoch": 2615} {"train_loss": -12.586176872253418, "global_step": 439415, "epoch": 2615} {"train_loss": -12.317022323608398, "global_step": 439416, "epoch": 2615} {"train_loss": -12.379050254821777, "global_step": 439417, "epoch": 2615} {"train_loss": -12.347278594970703, "global_step": 439418, "epoch": 2615} {"train_loss": -12.443353652954102, "global_step": 439419, "epoch": 2615} {"train_loss": -12.423543930053711, "global_step": 439420, "epoch": 2615} {"train_loss": -12.587921142578125, "global_step": 439421, "epoch": 2615} {"train_loss": -12.253198623657227, "global_step": 439422, "epoch": 2615} {"train_loss": -12.425758361816406, "global_step": 439423, "epoch": 2615} {"train_loss": -12.331725120544434, "global_step": 439424, "epoch": 2615} {"train_loss": -12.409120559692383, "global_step": 439425, "epoch": 2615} {"train_loss": -12.659273147583008, "global_step": 439426, "epoch": 2615} {"train_loss": -12.09770393371582, "global_step": 439427, "epoch": 2615} {"train_loss": -12.420061111450195, "global_step": 439428, "epoch": 2615} {"train_loss": -12.507818222045898, "global_step": 439429, "epoch": 2615} {"train_loss": -12.279739379882812, "global_step": 439430, "epoch": 2615} {"train_loss": -12.337228775024414, "global_step": 439431, "epoch": 2615} {"train_loss": -12.740421295166016, "global_step": 439432, "epoch": 2615} {"train_loss": -12.331829071044922, "global_step": 439433, "epoch": 2615} {"train_loss": -12.242741584777832, "global_step": 439434, "epoch": 2615} {"train_loss": -12.252723693847656, "global_step": 439435, "epoch": 2615} {"train_loss": -12.674701690673828, "global_step": 439436, "epoch": 2615} {"train_loss": -12.560291290283203, "global_step": 439437, "epoch": 2615} {"train_loss": -12.308660507202148, "global_step": 439438, "epoch": 2615} {"train_loss": -12.53896713256836, "global_step": 439439, "epoch": 2615} {"train_loss": -12.36723518371582, "global_step": 439440, "epoch": 2615} {"train_loss": -12.671204566955566, "global_step": 439441, "epoch": 2615} {"train_loss": -12.30846881866455, "global_step": 439442, "epoch": 2615} {"train_loss": -12.29554557800293, "global_step": 439443, "epoch": 2615} {"train_loss": -12.411821365356445, "global_step": 439444, "epoch": 2615} {"train_loss": -12.585774421691895, "global_step": 439445, "epoch": 2615} {"train_loss": -12.503593444824219, "global_step": 439446, "epoch": 2615} {"train_loss": -12.624013900756836, "global_step": 439447, "epoch": 2615} {"train_loss": -12.610639572143555, "global_step": 439448, "epoch": 2615} {"train_loss": -12.656877517700195, "global_step": 439449, "epoch": 2615} {"train_loss": -12.68235969543457, "global_step": 439450, "epoch": 2615} {"train_loss": -12.797142028808594, "global_step": 439451, "epoch": 2615} {"train_loss": -12.815948486328125, "global_step": 439452, "epoch": 2615} {"train_loss": -12.759674072265625, "global_step": 439453, "epoch": 2615} {"train_loss": -12.381591796875, "global_step": 439454, "epoch": 2615} {"train_loss": -12.97374439239502, "global_step": 439455, "epoch": 2615} {"train_loss": -12.951141357421875, "global_step": 439456, "epoch": 2615} {"train_loss": -12.958444595336914, "global_step": 439457, "epoch": 2615} {"train_loss": -12.713764190673828, "global_step": 439458, "epoch": 2615} {"train_loss": -12.699250221252441, "global_step": 439459, "epoch": 2615} {"train_loss": -12.866073608398438, "global_step": 439460, "epoch": 2615} {"train_loss": -12.584877967834473, "global_step": 439461, "epoch": 2615} {"train_loss": -12.651531219482422, "global_step": 439462, "epoch": 2615} {"train_loss": -12.507328033447266, "global_step": 439463, "epoch": 2615} {"train_loss": -12.673657417297363, "global_step": 439464, "epoch": 2615} {"train_loss": -12.748244285583496, "global_step": 439465, "epoch": 2615} {"train_loss": -12.28619384765625, "global_step": 439466, "epoch": 2615} {"train_loss": -11.411022186279297, "global_step": 439467, "epoch": 2615} {"train_loss": -12.608922958374023, "global_step": 439468, "epoch": 2615} {"train_loss": -12.337709426879883, "global_step": 439469, "epoch": 2615} {"train_loss": -11.11644172668457, "global_step": 439470, "epoch": 2615} {"train_loss": -12.37823486328125, "global_step": 439471, "epoch": 2615} {"train_loss": -12.028205871582031, "global_step": 439472, "epoch": 2615} {"train_loss": -11.610057830810547, "global_step": 439473, "epoch": 2615} {"train_loss": -10.56513786315918, "global_step": 439474, "epoch": 2615} {"train_loss": -12.505489349365234, "global_step": 439475, "epoch": 2615} {"train_loss": -11.957721710205078, "global_step": 439476, "epoch": 2615} {"train_loss": -11.326520919799805, "global_step": 439477, "epoch": 2615} {"train_loss": -11.144054412841797, "global_step": 439478, "epoch": 2615} {"train_loss": -11.73540210723877, "global_step": 439479, "epoch": 2615} {"train_loss": -11.90687370300293, "global_step": 439480, "epoch": 2615} {"train_loss": -11.548057556152344, "global_step": 439481, "epoch": 2615} {"train_loss": -11.569689750671387, "global_step": 439482, "epoch": 2615} {"train_loss": -10.37881851196289, "global_step": 439483, "epoch": 2615} {"train_loss": -11.980774879455566, "global_step": 439484, "epoch": 2615} {"train_loss": -10.840682029724121, "global_step": 439485, "epoch": 2615} {"train_loss": -10.160606384277344, "global_step": 439486, "epoch": 2615} {"train_loss": -12.197654065631685, "global_step": 439487, "epoch": 2615, "val_loss": 309477.03125, "train_action_mse_error": 2.3679161071777344} {"train_loss": -11.682024002075195, "global_step": 439488, "epoch": 2616} {"train_loss": -11.085906982421875, "global_step": 439489, "epoch": 2616} {"train_loss": -11.224390983581543, "global_step": 439490, "epoch": 2616} {"train_loss": -12.2857027053833, "global_step": 439491, "epoch": 2616} {"train_loss": -10.807003021240234, "global_step": 439492, "epoch": 2616} {"train_loss": -11.891341209411621, "global_step": 439493, "epoch": 2616} {"train_loss": -11.872323036193848, "global_step": 439494, "epoch": 2616} {"train_loss": -11.059036254882812, "global_step": 439495, "epoch": 2616} {"train_loss": -12.059837341308594, "global_step": 439496, "epoch": 2616} {"train_loss": -11.593622207641602, "global_step": 439497, "epoch": 2616} {"train_loss": -12.304971694946289, "global_step": 439498, "epoch": 2616} {"train_loss": -11.759265899658203, "global_step": 439499, "epoch": 2616} {"train_loss": -12.33244514465332, "global_step": 439500, "epoch": 2616} {"train_loss": -11.324320793151855, "global_step": 439501, "epoch": 2616} {"train_loss": -12.375444412231445, "global_step": 439502, "epoch": 2616} {"train_loss": -11.526901245117188, "global_step": 439503, "epoch": 2616} {"train_loss": -12.1984281539917, "global_step": 439504, "epoch": 2616} {"train_loss": -11.625843048095703, "global_step": 439505, "epoch": 2616} {"train_loss": -11.890751838684082, "global_step": 439506, "epoch": 2616} {"train_loss": -11.98720645904541, "global_step": 439507, "epoch": 2616} {"train_loss": -11.766600608825684, "global_step": 439508, "epoch": 2616} {"train_loss": -11.893966674804688, "global_step": 439509, "epoch": 2616} {"train_loss": -12.195455551147461, "global_step": 439510, "epoch": 2616} {"train_loss": -11.873716354370117, "global_step": 439511, "epoch": 2616} {"train_loss": -12.371296882629395, "global_step": 439512, "epoch": 2616} {"train_loss": -12.198312759399414, "global_step": 439513, "epoch": 2616} {"train_loss": -11.878482818603516, "global_step": 439514, "epoch": 2616} {"train_loss": -12.293678283691406, "global_step": 439515, "epoch": 2616} {"train_loss": -11.727985382080078, "global_step": 439516, "epoch": 2616} {"train_loss": -11.903974533081055, "global_step": 439517, "epoch": 2616} {"train_loss": -11.081657409667969, "global_step": 439518, "epoch": 2616} {"train_loss": -12.044776916503906, "global_step": 439519, "epoch": 2616} {"train_loss": -10.850894927978516, "global_step": 439520, "epoch": 2616} {"train_loss": -12.42282772064209, "global_step": 439521, "epoch": 2616} {"train_loss": -11.025863647460938, "global_step": 439522, "epoch": 2616} {"train_loss": -11.941463470458984, "global_step": 439523, "epoch": 2616} {"train_loss": -11.979735374450684, "global_step": 439524, "epoch": 2616} {"train_loss": -12.03007698059082, "global_step": 439525, "epoch": 2616} {"train_loss": -11.794586181640625, "global_step": 439526, "epoch": 2616} {"train_loss": -11.559188842773438, "global_step": 439527, "epoch": 2616} {"train_loss": -11.674903869628906, "global_step": 439528, "epoch": 2616} {"train_loss": -12.036259651184082, "global_step": 439529, "epoch": 2616} {"train_loss": -11.64691162109375, "global_step": 439530, "epoch": 2616} {"train_loss": -11.983470916748047, "global_step": 439531, "epoch": 2616} {"train_loss": -12.173095703125, "global_step": 439532, "epoch": 2616} {"train_loss": -11.856966018676758, "global_step": 439533, "epoch": 2616} {"train_loss": -12.002321243286133, "global_step": 439534, "epoch": 2616} {"train_loss": -12.000731468200684, "global_step": 439535, "epoch": 2616} {"train_loss": -12.041433334350586, "global_step": 439536, "epoch": 2616} {"train_loss": -12.721735000610352, "global_step": 439537, "epoch": 2616} {"train_loss": -11.9042329788208, "global_step": 439538, "epoch": 2616} {"train_loss": -12.180627822875977, "global_step": 439539, "epoch": 2616} {"train_loss": -12.183510780334473, "global_step": 439540, "epoch": 2616} {"train_loss": -12.328681945800781, "global_step": 439541, "epoch": 2616} {"train_loss": -12.386757850646973, "global_step": 439542, "epoch": 2616} {"train_loss": -12.471394538879395, "global_step": 439543, "epoch": 2616} {"train_loss": -12.083410263061523, "global_step": 439544, "epoch": 2616} {"train_loss": -12.501358985900879, "global_step": 439545, "epoch": 2616} {"train_loss": -12.427250862121582, "global_step": 439546, "epoch": 2616} {"train_loss": -12.388436317443848, "global_step": 439547, "epoch": 2616} {"train_loss": -12.73965072631836, "global_step": 439548, "epoch": 2616} {"train_loss": -12.604374885559082, "global_step": 439549, "epoch": 2616} {"train_loss": -12.67931079864502, "global_step": 439550, "epoch": 2616} {"train_loss": -12.49652099609375, "global_step": 439551, "epoch": 2616} {"train_loss": -12.514959335327148, "global_step": 439552, "epoch": 2616} {"train_loss": -12.768144607543945, "global_step": 439553, "epoch": 2616} {"train_loss": -12.606451034545898, "global_step": 439554, "epoch": 2616} {"train_loss": -12.661164283752441, "global_step": 439555, "epoch": 2616} {"train_loss": -12.799829483032227, "global_step": 439556, "epoch": 2616} {"train_loss": -12.551908493041992, "global_step": 439557, "epoch": 2616} {"train_loss": -12.673328399658203, "global_step": 439558, "epoch": 2616} {"train_loss": -12.590499877929688, "global_step": 439559, "epoch": 2616} {"train_loss": -12.833795547485352, "global_step": 439560, "epoch": 2616} {"train_loss": -12.659994125366211, "global_step": 439561, "epoch": 2616} {"train_loss": -12.717682838439941, "global_step": 439562, "epoch": 2616} {"train_loss": -12.954460144042969, "global_step": 439563, "epoch": 2616} {"train_loss": -12.658916473388672, "global_step": 439564, "epoch": 2616} {"train_loss": -12.730777740478516, "global_step": 439565, "epoch": 2616} {"train_loss": -12.724859237670898, "global_step": 439566, "epoch": 2616} {"train_loss": -12.881271362304688, "global_step": 439567, "epoch": 2616} {"train_loss": -12.657083511352539, "global_step": 439568, "epoch": 2616} {"train_loss": -12.509033203125, "global_step": 439569, "epoch": 2616} {"train_loss": -12.754865646362305, "global_step": 439570, "epoch": 2616} {"train_loss": -12.571669578552246, "global_step": 439571, "epoch": 2616} {"train_loss": -12.37704086303711, "global_step": 439572, "epoch": 2616} {"train_loss": -12.253798484802246, "global_step": 439573, "epoch": 2616} {"train_loss": -12.168106079101562, "global_step": 439574, "epoch": 2616} {"train_loss": -12.191141128540039, "global_step": 439575, "epoch": 2616} {"train_loss": -12.71809196472168, "global_step": 439576, "epoch": 2616} {"train_loss": -11.924259185791016, "global_step": 439577, "epoch": 2616} {"train_loss": -12.686275482177734, "global_step": 439578, "epoch": 2616} {"train_loss": -12.595247268676758, "global_step": 439579, "epoch": 2616} {"train_loss": -12.239797592163086, "global_step": 439580, "epoch": 2616} {"train_loss": -12.240049362182617, "global_step": 439581, "epoch": 2616} {"train_loss": -12.637117385864258, "global_step": 439582, "epoch": 2616} {"train_loss": -12.797558784484863, "global_step": 439583, "epoch": 2616} {"train_loss": -12.679805755615234, "global_step": 439584, "epoch": 2616} {"train_loss": -12.598235130310059, "global_step": 439585, "epoch": 2616} {"train_loss": -12.43724536895752, "global_step": 439586, "epoch": 2616} {"train_loss": -12.700566291809082, "global_step": 439587, "epoch": 2616} {"train_loss": -12.646734237670898, "global_step": 439588, "epoch": 2616} {"train_loss": -12.783431053161621, "global_step": 439589, "epoch": 2616} {"train_loss": -12.676963806152344, "global_step": 439590, "epoch": 2616} {"train_loss": -12.78022289276123, "global_step": 439591, "epoch": 2616} {"train_loss": -12.763151168823242, "global_step": 439592, "epoch": 2616} {"train_loss": -12.829891204833984, "global_step": 439593, "epoch": 2616} {"train_loss": -12.91922378540039, "global_step": 439594, "epoch": 2616} {"train_loss": -12.700879096984863, "global_step": 439595, "epoch": 2616} {"train_loss": -12.925016403198242, "global_step": 439596, "epoch": 2616} {"train_loss": -12.335939407348633, "global_step": 439597, "epoch": 2616} {"train_loss": -12.474617958068848, "global_step": 439598, "epoch": 2616} {"train_loss": -12.744954109191895, "global_step": 439599, "epoch": 2616} {"train_loss": -12.063211441040039, "global_step": 439600, "epoch": 2616} {"train_loss": -12.088587760925293, "global_step": 439601, "epoch": 2616} {"train_loss": -12.517044067382812, "global_step": 439602, "epoch": 2616} {"train_loss": -11.978416442871094, "global_step": 439603, "epoch": 2616} {"train_loss": -11.296063423156738, "global_step": 439604, "epoch": 2616} {"train_loss": -11.922983169555664, "global_step": 439605, "epoch": 2616} {"train_loss": -12.110774040222168, "global_step": 439606, "epoch": 2616} {"train_loss": -10.602567672729492, "global_step": 439607, "epoch": 2616} {"train_loss": -12.630584716796875, "global_step": 439608, "epoch": 2616} {"train_loss": -10.668636322021484, "global_step": 439609, "epoch": 2616} {"train_loss": -11.605515480041504, "global_step": 439610, "epoch": 2616} {"train_loss": -11.919859886169434, "global_step": 439611, "epoch": 2616} {"train_loss": -11.294204711914062, "global_step": 439612, "epoch": 2616} {"train_loss": -12.079889297485352, "global_step": 439613, "epoch": 2616} {"train_loss": -11.180238723754883, "global_step": 439614, "epoch": 2616} {"train_loss": -11.184537887573242, "global_step": 439615, "epoch": 2616} {"train_loss": -11.777042388916016, "global_step": 439616, "epoch": 2616} {"train_loss": -12.387740135192871, "global_step": 439617, "epoch": 2616} {"train_loss": -11.516661643981934, "global_step": 439618, "epoch": 2616} {"train_loss": -12.122133255004883, "global_step": 439619, "epoch": 2616} {"train_loss": -11.422074317932129, "global_step": 439620, "epoch": 2616} {"train_loss": -11.285146713256836, "global_step": 439621, "epoch": 2616} {"train_loss": -11.84135913848877, "global_step": 439622, "epoch": 2616} {"train_loss": -12.352693557739258, "global_step": 439623, "epoch": 2616} {"train_loss": -11.564620018005371, "global_step": 439624, "epoch": 2616} {"train_loss": -11.894668579101562, "global_step": 439625, "epoch": 2616} {"train_loss": -11.217422485351562, "global_step": 439626, "epoch": 2616} {"train_loss": -11.717218399047852, "global_step": 439627, "epoch": 2616} {"train_loss": -9.66061782836914, "global_step": 439628, "epoch": 2616} {"train_loss": -10.639265060424805, "global_step": 439629, "epoch": 2616} {"train_loss": -11.038604736328125, "global_step": 439630, "epoch": 2616} {"train_loss": -10.061383247375488, "global_step": 439631, "epoch": 2616} {"train_loss": -10.079788208007812, "global_step": 439632, "epoch": 2616} {"train_loss": -10.767586708068848, "global_step": 439633, "epoch": 2616} {"train_loss": -11.061317443847656, "global_step": 439634, "epoch": 2616} {"train_loss": -9.058671951293945, "global_step": 439635, "epoch": 2616} {"train_loss": -9.531208038330078, "global_step": 439636, "epoch": 2616} {"train_loss": -8.35338020324707, "global_step": 439637, "epoch": 2616} {"train_loss": -9.165351867675781, "global_step": 439638, "epoch": 2616} {"train_loss": -8.20114517211914, "global_step": 439639, "epoch": 2616} {"train_loss": -10.534366607666016, "global_step": 439640, "epoch": 2616} {"train_loss": -10.182645797729492, "global_step": 439641, "epoch": 2616} {"train_loss": -10.037636756896973, "global_step": 439642, "epoch": 2616} {"train_loss": -10.601999282836914, "global_step": 439643, "epoch": 2616} {"train_loss": -10.718841552734375, "global_step": 439644, "epoch": 2616} {"train_loss": -11.164769172668457, "global_step": 439645, "epoch": 2616} {"train_loss": -10.537525177001953, "global_step": 439646, "epoch": 2616} {"train_loss": -10.944574356079102, "global_step": 439647, "epoch": 2616} {"train_loss": -10.644819259643555, "global_step": 439648, "epoch": 2616} {"train_loss": -11.409025192260742, "global_step": 439649, "epoch": 2616} {"train_loss": -11.799072265625, "global_step": 439650, "epoch": 2616} {"train_loss": -11.606071472167969, "global_step": 439651, "epoch": 2616} {"train_loss": -12.08008098602295, "global_step": 439652, "epoch": 2616} {"train_loss": -11.697000503540039, "global_step": 439653, "epoch": 2616} {"train_loss": -11.896839141845703, "global_step": 439654, "epoch": 2616} {"train_loss": -11.870920482135954, "global_step": 439655, "epoch": 2616, "val_loss": 304544.40625} {"train_loss": -11.766645431518555, "global_step": 439656, "epoch": 2617} {"train_loss": -11.841115951538086, "global_step": 439657, "epoch": 2617} {"train_loss": -11.912211418151855, "global_step": 439658, "epoch": 2617} {"train_loss": -11.855703353881836, "global_step": 439659, "epoch": 2617} {"train_loss": -11.639830589294434, "global_step": 439660, "epoch": 2617} {"train_loss": -12.043978691101074, "global_step": 439661, "epoch": 2617} {"train_loss": -11.969108581542969, "global_step": 439662, "epoch": 2617} {"train_loss": -11.537317276000977, "global_step": 439663, "epoch": 2617} {"train_loss": -12.34500789642334, "global_step": 439664, "epoch": 2617} {"train_loss": -11.308241844177246, "global_step": 439665, "epoch": 2617} {"train_loss": -12.337102890014648, "global_step": 439666, "epoch": 2617} {"train_loss": -11.702963829040527, "global_step": 439667, "epoch": 2617} {"train_loss": -11.718612670898438, "global_step": 439668, "epoch": 2617} {"train_loss": -12.052985191345215, "global_step": 439669, "epoch": 2617} {"train_loss": -11.742019653320312, "global_step": 439670, "epoch": 2617} {"train_loss": -12.492278099060059, "global_step": 439671, "epoch": 2617} {"train_loss": -12.159429550170898, "global_step": 439672, "epoch": 2617} {"train_loss": -12.244848251342773, "global_step": 439673, "epoch": 2617} {"train_loss": -12.398651123046875, "global_step": 439674, "epoch": 2617} {"train_loss": -12.359395980834961, "global_step": 439675, "epoch": 2617} {"train_loss": -12.42116641998291, "global_step": 439676, "epoch": 2617} {"train_loss": -12.19863510131836, "global_step": 439677, "epoch": 2617} {"train_loss": -12.185340881347656, "global_step": 439678, "epoch": 2617} {"train_loss": -12.305330276489258, "global_step": 439679, "epoch": 2617} {"train_loss": -12.111160278320312, "global_step": 439680, "epoch": 2617} {"train_loss": -12.455154418945312, "global_step": 439681, "epoch": 2617} {"train_loss": -12.383968353271484, "global_step": 439682, "epoch": 2617} {"train_loss": -12.606401443481445, "global_step": 439683, "epoch": 2617} {"train_loss": -12.406061172485352, "global_step": 439684, "epoch": 2617} {"train_loss": -12.349528312683105, "global_step": 439685, "epoch": 2617} {"train_loss": -12.272855758666992, "global_step": 439686, "epoch": 2617} {"train_loss": -12.409673690795898, "global_step": 439687, "epoch": 2617} {"train_loss": -12.272072792053223, "global_step": 439688, "epoch": 2617} {"train_loss": -12.423054695129395, "global_step": 439689, "epoch": 2617} {"train_loss": -12.095060348510742, "global_step": 439690, "epoch": 2617} {"train_loss": -12.539095878601074, "global_step": 439691, "epoch": 2617} {"train_loss": -12.293426513671875, "global_step": 439692, "epoch": 2617} {"train_loss": -12.5716552734375, "global_step": 439693, "epoch": 2617} {"train_loss": -12.402323722839355, "global_step": 439694, "epoch": 2617} {"train_loss": -12.424193382263184, "global_step": 439695, "epoch": 2617} {"train_loss": -12.6929931640625, "global_step": 439696, "epoch": 2617} {"train_loss": -12.591957092285156, "global_step": 439697, "epoch": 2617} {"train_loss": -12.58697509765625, "global_step": 439698, "epoch": 2617} {"train_loss": -12.47593879699707, "global_step": 439699, "epoch": 2617} {"train_loss": -12.53650951385498, "global_step": 439700, "epoch": 2617} {"train_loss": -12.46699333190918, "global_step": 439701, "epoch": 2617} {"train_loss": -12.501310348510742, "global_step": 439702, "epoch": 2617} {"train_loss": -12.572221755981445, "global_step": 439703, "epoch": 2617} {"train_loss": -12.443150520324707, "global_step": 439704, "epoch": 2617} {"train_loss": -12.590763092041016, "global_step": 439705, "epoch": 2617} {"train_loss": -12.548649787902832, "global_step": 439706, "epoch": 2617} {"train_loss": -12.681694030761719, "global_step": 439707, "epoch": 2617} {"train_loss": -12.521408081054688, "global_step": 439708, "epoch": 2617} {"train_loss": -12.709966659545898, "global_step": 439709, "epoch": 2617} {"train_loss": -12.777509689331055, "global_step": 439710, "epoch": 2617} {"train_loss": -12.654680252075195, "global_step": 439711, "epoch": 2617} {"train_loss": -12.36839485168457, "global_step": 439712, "epoch": 2617} {"train_loss": -12.816703796386719, "global_step": 439713, "epoch": 2617} {"train_loss": -12.632705688476562, "global_step": 439714, "epoch": 2617} {"train_loss": -12.599996566772461, "global_step": 439715, "epoch": 2617} {"train_loss": -12.788366317749023, "global_step": 439716, "epoch": 2617} {"train_loss": -12.366521835327148, "global_step": 439717, "epoch": 2617} {"train_loss": -12.703788757324219, "global_step": 439718, "epoch": 2617} {"train_loss": -12.665422439575195, "global_step": 439719, "epoch": 2617} {"train_loss": -12.547664642333984, "global_step": 439720, "epoch": 2617} {"train_loss": -12.545352935791016, "global_step": 439721, "epoch": 2617} {"train_loss": -12.466442108154297, "global_step": 439722, "epoch": 2617} {"train_loss": -12.629060745239258, "global_step": 439723, "epoch": 2617} {"train_loss": -12.611494064331055, "global_step": 439724, "epoch": 2617} {"train_loss": -12.446807861328125, "global_step": 439725, "epoch": 2617} {"train_loss": -12.60874080657959, "global_step": 439726, "epoch": 2617} {"train_loss": -12.48426628112793, "global_step": 439727, "epoch": 2617} {"train_loss": -12.455314636230469, "global_step": 439728, "epoch": 2617} {"train_loss": -12.52159309387207, "global_step": 439729, "epoch": 2617} {"train_loss": -12.798222541809082, "global_step": 439730, "epoch": 2617} {"train_loss": -12.618688583374023, "global_step": 439731, "epoch": 2617} {"train_loss": -12.751785278320312, "global_step": 439732, "epoch": 2617} {"train_loss": -12.834976196289062, "global_step": 439733, "epoch": 2617} {"train_loss": -12.652298927307129, "global_step": 439734, "epoch": 2617} {"train_loss": -12.80972671508789, "global_step": 439735, "epoch": 2617} {"train_loss": -12.732405662536621, "global_step": 439736, "epoch": 2617} {"train_loss": -12.686966896057129, "global_step": 439737, "epoch": 2617} {"train_loss": -12.91584587097168, "global_step": 439738, "epoch": 2617} {"train_loss": -12.881185531616211, "global_step": 439739, "epoch": 2617} {"train_loss": -12.620833396911621, "global_step": 439740, "epoch": 2617} {"train_loss": -12.818001747131348, "global_step": 439741, "epoch": 2617} {"train_loss": -12.43517780303955, "global_step": 439742, "epoch": 2617} {"train_loss": -12.51664924621582, "global_step": 439743, "epoch": 2617} {"train_loss": -11.869356155395508, "global_step": 439744, "epoch": 2617} {"train_loss": -11.808103561401367, "global_step": 439745, "epoch": 2617} {"train_loss": -12.657720565795898, "global_step": 439746, "epoch": 2617} {"train_loss": -12.197847366333008, "global_step": 439747, "epoch": 2617} {"train_loss": -12.162012100219727, "global_step": 439748, "epoch": 2617} {"train_loss": -12.234583854675293, "global_step": 439749, "epoch": 2617} {"train_loss": -13.031696319580078, "global_step": 439750, "epoch": 2617} {"train_loss": -12.13510799407959, "global_step": 439751, "epoch": 2617} {"train_loss": -12.596112251281738, "global_step": 439752, "epoch": 2617} {"train_loss": -12.75240421295166, "global_step": 439753, "epoch": 2617} {"train_loss": -11.920852661132812, "global_step": 439754, "epoch": 2617} {"train_loss": -10.81343936920166, "global_step": 439755, "epoch": 2617} {"train_loss": -12.802020072937012, "global_step": 439756, "epoch": 2617} {"train_loss": -11.534161567687988, "global_step": 439757, "epoch": 2617} {"train_loss": -11.60356330871582, "global_step": 439758, "epoch": 2617} {"train_loss": -11.926506996154785, "global_step": 439759, "epoch": 2617} {"train_loss": -12.467382431030273, "global_step": 439760, "epoch": 2617} {"train_loss": -12.554052352905273, "global_step": 439761, "epoch": 2617} {"train_loss": -12.397592544555664, "global_step": 439762, "epoch": 2617} {"train_loss": -12.279043197631836, "global_step": 439763, "epoch": 2617} {"train_loss": -12.042393684387207, "global_step": 439764, "epoch": 2617} {"train_loss": -12.243985176086426, "global_step": 439765, "epoch": 2617} {"train_loss": -11.68659496307373, "global_step": 439766, "epoch": 2617} {"train_loss": -12.567513465881348, "global_step": 439767, "epoch": 2617} {"train_loss": -11.900571823120117, "global_step": 439768, "epoch": 2617} {"train_loss": -12.656155586242676, "global_step": 439769, "epoch": 2617} {"train_loss": -11.57406997680664, "global_step": 439770, "epoch": 2617} {"train_loss": -11.911787033081055, "global_step": 439771, "epoch": 2617} {"train_loss": -12.85602855682373, "global_step": 439772, "epoch": 2617} {"train_loss": -12.349889755249023, "global_step": 439773, "epoch": 2617} {"train_loss": -12.033134460449219, "global_step": 439774, "epoch": 2617} {"train_loss": -12.547371864318848, "global_step": 439775, "epoch": 2617} {"train_loss": -12.002197265625, "global_step": 439776, "epoch": 2617} {"train_loss": -12.241174697875977, "global_step": 439777, "epoch": 2617} {"train_loss": -12.61271858215332, "global_step": 439778, "epoch": 2617} {"train_loss": -11.738116264343262, "global_step": 439779, "epoch": 2617} {"train_loss": -12.036523818969727, "global_step": 439780, "epoch": 2617} {"train_loss": -11.54154109954834, "global_step": 439781, "epoch": 2617} {"train_loss": -11.249692916870117, "global_step": 439782, "epoch": 2617} {"train_loss": -11.64098834991455, "global_step": 439783, "epoch": 2617} {"train_loss": -11.838593482971191, "global_step": 439784, "epoch": 2617} {"train_loss": -11.279924392700195, "global_step": 439785, "epoch": 2617} {"train_loss": -11.8508939743042, "global_step": 439786, "epoch": 2617} {"train_loss": -11.128399848937988, "global_step": 439787, "epoch": 2617} {"train_loss": -11.847529411315918, "global_step": 439788, "epoch": 2617} {"train_loss": -11.979742050170898, "global_step": 439789, "epoch": 2617} {"train_loss": -11.104029655456543, "global_step": 439790, "epoch": 2617} {"train_loss": -12.078420639038086, "global_step": 439791, "epoch": 2617} {"train_loss": -11.786531448364258, "global_step": 439792, "epoch": 2617} {"train_loss": -11.731398582458496, "global_step": 439793, "epoch": 2617} {"train_loss": -12.1730318069458, "global_step": 439794, "epoch": 2617} {"train_loss": -11.62429428100586, "global_step": 439795, "epoch": 2617} {"train_loss": -12.159460067749023, "global_step": 439796, "epoch": 2617} {"train_loss": -11.576238632202148, "global_step": 439797, "epoch": 2617} {"train_loss": -11.613327026367188, "global_step": 439798, "epoch": 2617} {"train_loss": -11.912288665771484, "global_step": 439799, "epoch": 2617} {"train_loss": -10.990190505981445, "global_step": 439800, "epoch": 2617} {"train_loss": -11.419840812683105, "global_step": 439801, "epoch": 2617} {"train_loss": -9.571374893188477, "global_step": 439802, "epoch": 2617} {"train_loss": -10.750866889953613, "global_step": 439803, "epoch": 2617} {"train_loss": -11.151981353759766, "global_step": 439804, "epoch": 2617} {"train_loss": -11.523937225341797, "global_step": 439805, "epoch": 2617} {"train_loss": -11.181259155273438, "global_step": 439806, "epoch": 2617} {"train_loss": -11.047937393188477, "global_step": 439807, "epoch": 2617} {"train_loss": -11.299367904663086, "global_step": 439808, "epoch": 2617} {"train_loss": -11.568110466003418, "global_step": 439809, "epoch": 2617} {"train_loss": -11.05899429321289, "global_step": 439810, "epoch": 2617} {"train_loss": -11.31570816040039, "global_step": 439811, "epoch": 2617} {"train_loss": -10.293414115905762, "global_step": 439812, "epoch": 2617} {"train_loss": -12.069799423217773, "global_step": 439813, "epoch": 2617} {"train_loss": -10.569421768188477, "global_step": 439814, "epoch": 2617} {"train_loss": -11.773454666137695, "global_step": 439815, "epoch": 2617} {"train_loss": -11.467704772949219, "global_step": 439816, "epoch": 2617} {"train_loss": -11.87356185913086, "global_step": 439817, "epoch": 2617} {"train_loss": -11.565777778625488, "global_step": 439818, "epoch": 2617} {"train_loss": -11.426595687866211, "global_step": 439819, "epoch": 2617} {"train_loss": -12.001283645629883, "global_step": 439820, "epoch": 2617} {"train_loss": -12.335077285766602, "global_step": 439821, "epoch": 2617} {"train_loss": -12.063255310058594, "global_step": 439822, "epoch": 2617} {"train_loss": -12.126476611409869, "global_step": 439823, "epoch": 2617, "val_loss": 307667.71875} {"train_loss": -12.396100044250488, "global_step": 439824, "epoch": 2618} {"train_loss": -12.08574104309082, "global_step": 439825, "epoch": 2618} {"train_loss": -12.321443557739258, "global_step": 439826, "epoch": 2618} {"train_loss": -11.966654777526855, "global_step": 439827, "epoch": 2618} {"train_loss": -12.0267972946167, "global_step": 439828, "epoch": 2618} {"train_loss": -12.100507736206055, "global_step": 439829, "epoch": 2618} {"train_loss": -12.166669845581055, "global_step": 439830, "epoch": 2618} {"train_loss": -12.031440734863281, "global_step": 439831, "epoch": 2618} {"train_loss": -12.285799980163574, "global_step": 439832, "epoch": 2618} {"train_loss": -12.470354080200195, "global_step": 439833, "epoch": 2618} {"train_loss": -12.537704467773438, "global_step": 439834, "epoch": 2618} {"train_loss": -12.30012035369873, "global_step": 439835, "epoch": 2618} {"train_loss": -12.496623992919922, "global_step": 439836, "epoch": 2618} {"train_loss": -12.362005233764648, "global_step": 439837, "epoch": 2618} {"train_loss": -12.453633308410645, "global_step": 439838, "epoch": 2618} {"train_loss": -12.24635124206543, "global_step": 439839, "epoch": 2618} {"train_loss": -12.506973266601562, "global_step": 439840, "epoch": 2618} {"train_loss": -12.301490783691406, "global_step": 439841, "epoch": 2618} {"train_loss": -12.623998641967773, "global_step": 439842, "epoch": 2618} {"train_loss": -12.507932662963867, "global_step": 439843, "epoch": 2618} {"train_loss": -12.351688385009766, "global_step": 439844, "epoch": 2618} {"train_loss": -12.624187469482422, "global_step": 439845, "epoch": 2618} {"train_loss": -12.490861892700195, "global_step": 439846, "epoch": 2618} {"train_loss": -12.536407470703125, "global_step": 439847, "epoch": 2618} {"train_loss": -12.72072982788086, "global_step": 439848, "epoch": 2618} {"train_loss": -12.466470718383789, "global_step": 439849, "epoch": 2618} {"train_loss": -12.46380615234375, "global_step": 439850, "epoch": 2618} {"train_loss": -12.385581970214844, "global_step": 439851, "epoch": 2618} {"train_loss": -12.319305419921875, "global_step": 439852, "epoch": 2618} {"train_loss": -12.479593276977539, "global_step": 439853, "epoch": 2618} {"train_loss": -12.610304832458496, "global_step": 439854, "epoch": 2618} {"train_loss": -12.285900115966797, "global_step": 439855, "epoch": 2618} {"train_loss": -12.273345947265625, "global_step": 439856, "epoch": 2618} {"train_loss": -12.44887924194336, "global_step": 439857, "epoch": 2618} {"train_loss": -12.32868480682373, "global_step": 439858, "epoch": 2618} {"train_loss": -12.504585266113281, "global_step": 439859, "epoch": 2618} {"train_loss": -12.35250186920166, "global_step": 439860, "epoch": 2618} {"train_loss": -12.23996353149414, "global_step": 439861, "epoch": 2618} {"train_loss": -12.639458656311035, "global_step": 439862, "epoch": 2618} {"train_loss": -12.44780445098877, "global_step": 439863, "epoch": 2618} {"train_loss": -12.413488388061523, "global_step": 439864, "epoch": 2618} {"train_loss": -12.70424747467041, "global_step": 439865, "epoch": 2618} {"train_loss": -12.665205955505371, "global_step": 439866, "epoch": 2618} {"train_loss": -12.49425983428955, "global_step": 439867, "epoch": 2618} {"train_loss": -12.632072448730469, "global_step": 439868, "epoch": 2618} {"train_loss": -12.327869415283203, "global_step": 439869, "epoch": 2618} {"train_loss": -12.907438278198242, "global_step": 439870, "epoch": 2618} {"train_loss": -12.301505088806152, "global_step": 439871, "epoch": 2618} {"train_loss": -12.739692687988281, "global_step": 439872, "epoch": 2618} {"train_loss": -12.447990417480469, "global_step": 439873, "epoch": 2618} {"train_loss": -12.473937034606934, "global_step": 439874, "epoch": 2618} {"train_loss": -12.20669174194336, "global_step": 439875, "epoch": 2618} {"train_loss": -12.52544116973877, "global_step": 439876, "epoch": 2618} {"train_loss": -12.283910751342773, "global_step": 439877, "epoch": 2618} {"train_loss": -12.03274154663086, "global_step": 439878, "epoch": 2618} {"train_loss": -11.552556037902832, "global_step": 439879, "epoch": 2618} {"train_loss": -12.451409339904785, "global_step": 439880, "epoch": 2618} {"train_loss": -11.880817413330078, "global_step": 439881, "epoch": 2618} {"train_loss": -11.957052230834961, "global_step": 439882, "epoch": 2618} {"train_loss": -12.436281204223633, "global_step": 439883, "epoch": 2618} {"train_loss": -12.182504653930664, "global_step": 439884, "epoch": 2618} {"train_loss": -12.154194831848145, "global_step": 439885, "epoch": 2618} {"train_loss": -12.753742218017578, "global_step": 439886, "epoch": 2618} {"train_loss": -12.113844871520996, "global_step": 439887, "epoch": 2618} {"train_loss": -12.073020935058594, "global_step": 439888, "epoch": 2618} {"train_loss": -12.33358097076416, "global_step": 439889, "epoch": 2618} {"train_loss": -12.005906105041504, "global_step": 439890, "epoch": 2618} {"train_loss": -11.186123847961426, "global_step": 439891, "epoch": 2618} {"train_loss": -12.652046203613281, "global_step": 439892, "epoch": 2618} {"train_loss": -11.894368171691895, "global_step": 439893, "epoch": 2618} {"train_loss": -11.987648010253906, "global_step": 439894, "epoch": 2618} {"train_loss": -11.933186531066895, "global_step": 439895, "epoch": 2618} {"train_loss": -11.367435455322266, "global_step": 439896, "epoch": 2618} {"train_loss": -12.344778060913086, "global_step": 439897, "epoch": 2618} {"train_loss": -12.09512710571289, "global_step": 439898, "epoch": 2618} {"train_loss": -11.039600372314453, "global_step": 439899, "epoch": 2618} {"train_loss": -12.12849235534668, "global_step": 439900, "epoch": 2618} {"train_loss": -12.33717155456543, "global_step": 439901, "epoch": 2618} {"train_loss": -12.312347412109375, "global_step": 439902, "epoch": 2618} {"train_loss": -12.213540077209473, "global_step": 439903, "epoch": 2618} {"train_loss": -12.172119140625, "global_step": 439904, "epoch": 2618} {"train_loss": -11.58467960357666, "global_step": 439905, "epoch": 2618} {"train_loss": -11.789033889770508, "global_step": 439906, "epoch": 2618} {"train_loss": -11.966188430786133, "global_step": 439907, "epoch": 2618} {"train_loss": -12.36351203918457, "global_step": 439908, "epoch": 2618} {"train_loss": -11.953351974487305, "global_step": 439909, "epoch": 2618} {"train_loss": -12.112548828125, "global_step": 439910, "epoch": 2618} {"train_loss": -12.427694320678711, "global_step": 439911, "epoch": 2618} {"train_loss": -12.542405128479004, "global_step": 439912, "epoch": 2618} {"train_loss": -12.605607032775879, "global_step": 439913, "epoch": 2618} {"train_loss": -12.339738845825195, "global_step": 439914, "epoch": 2618} {"train_loss": -12.614375114440918, "global_step": 439915, "epoch": 2618} {"train_loss": -12.500566482543945, "global_step": 439916, "epoch": 2618} {"train_loss": -12.759780883789062, "global_step": 439917, "epoch": 2618} {"train_loss": -12.747442245483398, "global_step": 439918, "epoch": 2618} {"train_loss": -12.66733455657959, "global_step": 439919, "epoch": 2618} {"train_loss": -12.226127624511719, "global_step": 439920, "epoch": 2618} {"train_loss": -12.59703254699707, "global_step": 439921, "epoch": 2618} {"train_loss": -12.309029579162598, "global_step": 439922, "epoch": 2618} {"train_loss": -12.621391296386719, "global_step": 439923, "epoch": 2618} {"train_loss": -12.414843559265137, "global_step": 439924, "epoch": 2618} {"train_loss": -12.51384162902832, "global_step": 439925, "epoch": 2618} {"train_loss": -12.457558631896973, "global_step": 439926, "epoch": 2618} {"train_loss": -12.390178680419922, "global_step": 439927, "epoch": 2618} {"train_loss": -12.327168464660645, "global_step": 439928, "epoch": 2618} {"train_loss": -12.352813720703125, "global_step": 439929, "epoch": 2618} {"train_loss": -12.840871810913086, "global_step": 439930, "epoch": 2618} {"train_loss": -12.34276008605957, "global_step": 439931, "epoch": 2618} {"train_loss": -12.163226127624512, "global_step": 439932, "epoch": 2618} {"train_loss": -12.133443832397461, "global_step": 439933, "epoch": 2618} {"train_loss": -12.689292907714844, "global_step": 439934, "epoch": 2618} {"train_loss": -11.636274337768555, "global_step": 439935, "epoch": 2618} {"train_loss": -12.25045394897461, "global_step": 439936, "epoch": 2618} {"train_loss": -12.74084186553955, "global_step": 439937, "epoch": 2618} {"train_loss": -12.598650932312012, "global_step": 439938, "epoch": 2618} {"train_loss": -12.352272987365723, "global_step": 439939, "epoch": 2618} {"train_loss": -12.574373245239258, "global_step": 439940, "epoch": 2618} {"train_loss": -12.684297561645508, "global_step": 439941, "epoch": 2618} {"train_loss": -12.72036361694336, "global_step": 439942, "epoch": 2618} {"train_loss": -12.50527572631836, "global_step": 439943, "epoch": 2618} {"train_loss": -13.000176429748535, "global_step": 439944, "epoch": 2618} {"train_loss": -12.36600112915039, "global_step": 439945, "epoch": 2618} {"train_loss": -12.536856651306152, "global_step": 439946, "epoch": 2618} {"train_loss": -12.647994995117188, "global_step": 439947, "epoch": 2618} {"train_loss": -12.485931396484375, "global_step": 439948, "epoch": 2618} {"train_loss": -12.35234260559082, "global_step": 439949, "epoch": 2618} {"train_loss": -12.747018814086914, "global_step": 439950, "epoch": 2618} {"train_loss": -12.185455322265625, "global_step": 439951, "epoch": 2618} {"train_loss": -12.581306457519531, "global_step": 439952, "epoch": 2618} {"train_loss": -12.571229934692383, "global_step": 439953, "epoch": 2618} {"train_loss": -12.354204177856445, "global_step": 439954, "epoch": 2618} {"train_loss": -12.668657302856445, "global_step": 439955, "epoch": 2618} {"train_loss": -12.585813522338867, "global_step": 439956, "epoch": 2618} {"train_loss": -12.517924308776855, "global_step": 439957, "epoch": 2618} {"train_loss": -12.770437240600586, "global_step": 439958, "epoch": 2618} {"train_loss": -12.29238510131836, "global_step": 439959, "epoch": 2618} {"train_loss": -12.549373626708984, "global_step": 439960, "epoch": 2618} {"train_loss": -12.70449447631836, "global_step": 439961, "epoch": 2618} {"train_loss": -12.360301971435547, "global_step": 439962, "epoch": 2618} {"train_loss": -12.391512870788574, "global_step": 439963, "epoch": 2618} {"train_loss": -12.908685684204102, "global_step": 439964, "epoch": 2618} {"train_loss": -11.410259246826172, "global_step": 439965, "epoch": 2618} {"train_loss": -12.088521957397461, "global_step": 439966, "epoch": 2618} {"train_loss": -12.085927963256836, "global_step": 439967, "epoch": 2618} {"train_loss": -11.264924049377441, "global_step": 439968, "epoch": 2618} {"train_loss": -11.799358367919922, "global_step": 439969, "epoch": 2618} {"train_loss": -12.787910461425781, "global_step": 439970, "epoch": 2618} {"train_loss": -11.057404518127441, "global_step": 439971, "epoch": 2618} {"train_loss": -12.255374908447266, "global_step": 439972, "epoch": 2618} {"train_loss": -12.544097900390625, "global_step": 439973, "epoch": 2618} {"train_loss": -12.060548782348633, "global_step": 439974, "epoch": 2618} {"train_loss": -12.049825668334961, "global_step": 439975, "epoch": 2618} {"train_loss": -12.737052917480469, "global_step": 439976, "epoch": 2618} {"train_loss": -12.325468063354492, "global_step": 439977, "epoch": 2618} {"train_loss": -11.63764476776123, "global_step": 439978, "epoch": 2618} {"train_loss": -12.200312614440918, "global_step": 439979, "epoch": 2618} {"train_loss": -11.6959810256958, "global_step": 439980, "epoch": 2618} {"train_loss": -11.15093994140625, "global_step": 439981, "epoch": 2618} {"train_loss": -10.653669357299805, "global_step": 439982, "epoch": 2618} {"train_loss": -11.960224151611328, "global_step": 439983, "epoch": 2618} {"train_loss": -12.330820083618164, "global_step": 439984, "epoch": 2618} {"train_loss": -11.627710342407227, "global_step": 439985, "epoch": 2618} {"train_loss": -12.706698417663574, "global_step": 439986, "epoch": 2618} {"train_loss": -11.716470718383789, "global_step": 439987, "epoch": 2618} {"train_loss": -11.52008056640625, "global_step": 439988, "epoch": 2618} {"train_loss": -11.981328964233398, "global_step": 439989, "epoch": 2618} {"train_loss": -12.05268669128418, "global_step": 439990, "epoch": 2618} {"train_loss": -12.29126170703343, "global_step": 439991, "epoch": 2618, "val_loss": 311405.625} {"train_loss": -12.328170776367188, "global_step": 439992, "epoch": 2619} {"train_loss": -11.888900756835938, "global_step": 439993, "epoch": 2619} {"train_loss": -12.188333511352539, "global_step": 439994, "epoch": 2619} {"train_loss": -11.774710655212402, "global_step": 439995, "epoch": 2619} {"train_loss": -11.477593421936035, "global_step": 439996, "epoch": 2619} {"train_loss": -11.677852630615234, "global_step": 439997, "epoch": 2619} {"train_loss": -11.53522777557373, "global_step": 439998, "epoch": 2619} {"train_loss": -11.908117294311523, "global_step": 439999, "epoch": 2619} {"train_loss": -11.27407455444336, "global_step": 440000, "epoch": 2619} {"train_loss": -11.445100784301758, "global_step": 440001, "epoch": 2619} {"train_loss": -12.25868034362793, "global_step": 440002, "epoch": 2619} {"train_loss": -11.589987754821777, "global_step": 440003, "epoch": 2619} {"train_loss": -11.71488094329834, "global_step": 440004, "epoch": 2619} {"train_loss": -12.034543991088867, "global_step": 440005, "epoch": 2619} {"train_loss": -11.843025207519531, "global_step": 440006, "epoch": 2619} {"train_loss": -12.338607788085938, "global_step": 440007, "epoch": 2619} {"train_loss": -11.596034049987793, "global_step": 440008, "epoch": 2619} {"train_loss": -12.412487030029297, "global_step": 440009, "epoch": 2619} {"train_loss": -12.178796768188477, "global_step": 440010, "epoch": 2619} {"train_loss": -12.483905792236328, "global_step": 440011, "epoch": 2619} {"train_loss": -12.28288459777832, "global_step": 440012, "epoch": 2619} {"train_loss": -12.220498085021973, "global_step": 440013, "epoch": 2619} {"train_loss": -11.923202514648438, "global_step": 440014, "epoch": 2619} {"train_loss": -12.345257759094238, "global_step": 440015, "epoch": 2619} {"train_loss": -11.962226867675781, "global_step": 440016, "epoch": 2619} {"train_loss": -12.31477165222168, "global_step": 440017, "epoch": 2619} {"train_loss": -12.235658645629883, "global_step": 440018, "epoch": 2619} {"train_loss": -12.067291259765625, "global_step": 440019, "epoch": 2619} {"train_loss": -12.28322982788086, "global_step": 440020, "epoch": 2619} {"train_loss": -11.474658966064453, "global_step": 440021, "epoch": 2619} {"train_loss": -12.328413009643555, "global_step": 440022, "epoch": 2619} {"train_loss": -12.439756393432617, "global_step": 440023, "epoch": 2619} {"train_loss": -12.332727432250977, "global_step": 440024, "epoch": 2619} {"train_loss": -12.434417724609375, "global_step": 440025, "epoch": 2619} {"train_loss": -12.367137908935547, "global_step": 440026, "epoch": 2619} {"train_loss": -12.107587814331055, "global_step": 440027, "epoch": 2619} {"train_loss": -12.572896957397461, "global_step": 440028, "epoch": 2619} {"train_loss": -12.146903991699219, "global_step": 440029, "epoch": 2619} {"train_loss": -12.602529525756836, "global_step": 440030, "epoch": 2619} {"train_loss": -12.404266357421875, "global_step": 440031, "epoch": 2619} {"train_loss": -12.350495338439941, "global_step": 440032, "epoch": 2619} {"train_loss": -12.653348922729492, "global_step": 440033, "epoch": 2619} {"train_loss": -12.40488338470459, "global_step": 440034, "epoch": 2619} {"train_loss": -12.501546859741211, "global_step": 440035, "epoch": 2619} {"train_loss": -12.49795150756836, "global_step": 440036, "epoch": 2619} {"train_loss": -12.61345386505127, "global_step": 440037, "epoch": 2619} {"train_loss": -12.718244552612305, "global_step": 440038, "epoch": 2619} {"train_loss": -12.350576400756836, "global_step": 440039, "epoch": 2619} {"train_loss": -12.61720085144043, "global_step": 440040, "epoch": 2619} {"train_loss": -12.511420249938965, "global_step": 440041, "epoch": 2619} {"train_loss": -11.95530891418457, "global_step": 440042, "epoch": 2619} {"train_loss": -12.596802711486816, "global_step": 440043, "epoch": 2619} {"train_loss": -12.488566398620605, "global_step": 440044, "epoch": 2619} {"train_loss": -12.286507606506348, "global_step": 440045, "epoch": 2619} {"train_loss": -12.80473518371582, "global_step": 440046, "epoch": 2619} {"train_loss": -12.313721656799316, "global_step": 440047, "epoch": 2619} {"train_loss": -12.358004570007324, "global_step": 440048, "epoch": 2619} {"train_loss": -12.649627685546875, "global_step": 440049, "epoch": 2619} {"train_loss": -12.347850799560547, "global_step": 440050, "epoch": 2619} {"train_loss": -12.390663146972656, "global_step": 440051, "epoch": 2619} {"train_loss": -12.602298736572266, "global_step": 440052, "epoch": 2619} {"train_loss": -12.325013160705566, "global_step": 440053, "epoch": 2619} {"train_loss": -12.167251586914062, "global_step": 440054, "epoch": 2619} {"train_loss": -12.675862312316895, "global_step": 440055, "epoch": 2619} {"train_loss": -12.694275856018066, "global_step": 440056, "epoch": 2619} {"train_loss": -12.319816589355469, "global_step": 440057, "epoch": 2619} {"train_loss": -12.65977954864502, "global_step": 440058, "epoch": 2619} {"train_loss": -12.290144920349121, "global_step": 440059, "epoch": 2619} {"train_loss": -12.48940372467041, "global_step": 440060, "epoch": 2619} {"train_loss": -12.433987617492676, "global_step": 440061, "epoch": 2619} {"train_loss": -12.106698036193848, "global_step": 440062, "epoch": 2619} {"train_loss": -12.166633605957031, "global_step": 440063, "epoch": 2619} {"train_loss": -12.57925033569336, "global_step": 440064, "epoch": 2619} {"train_loss": -12.447128295898438, "global_step": 440065, "epoch": 2619} {"train_loss": -12.047821044921875, "global_step": 440066, "epoch": 2619} {"train_loss": -12.698274612426758, "global_step": 440067, "epoch": 2619} {"train_loss": -12.179923057556152, "global_step": 440068, "epoch": 2619} {"train_loss": -11.979238510131836, "global_step": 440069, "epoch": 2619} {"train_loss": -12.21458911895752, "global_step": 440070, "epoch": 2619} {"train_loss": -12.268157005310059, "global_step": 440071, "epoch": 2619} {"train_loss": -11.091934204101562, "global_step": 440072, "epoch": 2619} {"train_loss": -12.712263107299805, "global_step": 440073, "epoch": 2619} {"train_loss": -12.095365524291992, "global_step": 440074, "epoch": 2619} {"train_loss": -12.513769149780273, "global_step": 440075, "epoch": 2619} {"train_loss": -11.11944580078125, "global_step": 440076, "epoch": 2619} {"train_loss": -12.339488983154297, "global_step": 440077, "epoch": 2619} {"train_loss": -10.859107971191406, "global_step": 440078, "epoch": 2619} {"train_loss": -11.91400146484375, "global_step": 440079, "epoch": 2619} {"train_loss": -12.41925048828125, "global_step": 440080, "epoch": 2619} {"train_loss": -11.940320014953613, "global_step": 440081, "epoch": 2619} {"train_loss": -12.091964721679688, "global_step": 440082, "epoch": 2619} {"train_loss": -12.449478149414062, "global_step": 440083, "epoch": 2619} {"train_loss": -11.982215881347656, "global_step": 440084, "epoch": 2619} {"train_loss": -12.50621223449707, "global_step": 440085, "epoch": 2619} {"train_loss": -12.280099868774414, "global_step": 440086, "epoch": 2619} {"train_loss": -12.41623592376709, "global_step": 440087, "epoch": 2619} {"train_loss": -12.29653549194336, "global_step": 440088, "epoch": 2619} {"train_loss": -12.555299758911133, "global_step": 440089, "epoch": 2619} {"train_loss": -12.328695297241211, "global_step": 440090, "epoch": 2619} {"train_loss": -12.519755363464355, "global_step": 440091, "epoch": 2619} {"train_loss": -12.081053733825684, "global_step": 440092, "epoch": 2619} {"train_loss": -11.879934310913086, "global_step": 440093, "epoch": 2619} {"train_loss": -12.311295509338379, "global_step": 440094, "epoch": 2619} {"train_loss": -11.700523376464844, "global_step": 440095, "epoch": 2619} {"train_loss": -11.886129379272461, "global_step": 440096, "epoch": 2619} {"train_loss": -12.400894165039062, "global_step": 440097, "epoch": 2619} {"train_loss": -12.360316276550293, "global_step": 440098, "epoch": 2619} {"train_loss": -12.508003234863281, "global_step": 440099, "epoch": 2619} {"train_loss": -12.41975212097168, "global_step": 440100, "epoch": 2619} {"train_loss": -11.968573570251465, "global_step": 440101, "epoch": 2619} {"train_loss": -12.336715698242188, "global_step": 440102, "epoch": 2619} {"train_loss": -12.765851020812988, "global_step": 440103, "epoch": 2619} {"train_loss": -12.255962371826172, "global_step": 440104, "epoch": 2619} {"train_loss": -12.056554794311523, "global_step": 440105, "epoch": 2619} {"train_loss": -12.67606258392334, "global_step": 440106, "epoch": 2619} {"train_loss": -12.419821739196777, "global_step": 440107, "epoch": 2619} {"train_loss": -12.223974227905273, "global_step": 440108, "epoch": 2619} {"train_loss": -12.40945053100586, "global_step": 440109, "epoch": 2619} {"train_loss": -11.606069564819336, "global_step": 440110, "epoch": 2619} {"train_loss": -12.569089889526367, "global_step": 440111, "epoch": 2619} {"train_loss": -12.165826797485352, "global_step": 440112, "epoch": 2619} {"train_loss": -12.653955459594727, "global_step": 440113, "epoch": 2619} {"train_loss": -12.495124816894531, "global_step": 440114, "epoch": 2619} {"train_loss": -12.408438682556152, "global_step": 440115, "epoch": 2619} {"train_loss": -12.573775291442871, "global_step": 440116, "epoch": 2619} {"train_loss": -12.43072509765625, "global_step": 440117, "epoch": 2619} {"train_loss": -12.465685844421387, "global_step": 440118, "epoch": 2619} {"train_loss": -12.63073444366455, "global_step": 440119, "epoch": 2619} {"train_loss": -12.66048812866211, "global_step": 440120, "epoch": 2619} {"train_loss": -12.6612548828125, "global_step": 440121, "epoch": 2619} {"train_loss": -12.590499877929688, "global_step": 440122, "epoch": 2619} {"train_loss": -12.804622650146484, "global_step": 440123, "epoch": 2619} {"train_loss": -12.577808380126953, "global_step": 440124, "epoch": 2619} {"train_loss": -12.65376091003418, "global_step": 440125, "epoch": 2619} {"train_loss": -12.407554626464844, "global_step": 440126, "epoch": 2619} {"train_loss": -12.707952499389648, "global_step": 440127, "epoch": 2619} {"train_loss": -12.675312042236328, "global_step": 440128, "epoch": 2619} {"train_loss": -12.695791244506836, "global_step": 440129, "epoch": 2619} {"train_loss": -12.684859275817871, "global_step": 440130, "epoch": 2619} {"train_loss": -12.518022537231445, "global_step": 440131, "epoch": 2619} {"train_loss": -11.879764556884766, "global_step": 440132, "epoch": 2619} {"train_loss": -12.574883460998535, "global_step": 440133, "epoch": 2619} {"train_loss": -12.188112258911133, "global_step": 440134, "epoch": 2619} {"train_loss": -11.492242813110352, "global_step": 440135, "epoch": 2619} {"train_loss": -12.715442657470703, "global_step": 440136, "epoch": 2619} {"train_loss": -11.469240188598633, "global_step": 440137, "epoch": 2619} {"train_loss": -11.33881664276123, "global_step": 440138, "epoch": 2619} {"train_loss": -11.850046157836914, "global_step": 440139, "epoch": 2619} {"train_loss": -11.404022216796875, "global_step": 440140, "epoch": 2619} {"train_loss": -11.250171661376953, "global_step": 440141, "epoch": 2619} {"train_loss": -10.882442474365234, "global_step": 440142, "epoch": 2619} {"train_loss": -10.600934982299805, "global_step": 440143, "epoch": 2619} {"train_loss": -9.220563888549805, "global_step": 440144, "epoch": 2619} {"train_loss": -10.774008750915527, "global_step": 440145, "epoch": 2619} {"train_loss": -8.172174453735352, "global_step": 440146, "epoch": 2619} {"train_loss": -11.899432182312012, "global_step": 440147, "epoch": 2619} {"train_loss": -9.120655059814453, "global_step": 440148, "epoch": 2619} {"train_loss": -10.944263458251953, "global_step": 440149, "epoch": 2619} {"train_loss": -11.092723846435547, "global_step": 440150, "epoch": 2619} {"train_loss": -11.975812911987305, "global_step": 440151, "epoch": 2619} {"train_loss": -10.712886810302734, "global_step": 440152, "epoch": 2619} {"train_loss": -11.084015846252441, "global_step": 440153, "epoch": 2619} {"train_loss": -11.85221004486084, "global_step": 440154, "epoch": 2619} {"train_loss": -12.03628921508789, "global_step": 440155, "epoch": 2619} {"train_loss": -11.640485763549805, "global_step": 440156, "epoch": 2619} {"train_loss": -11.254420280456543, "global_step": 440157, "epoch": 2619} {"train_loss": -12.169958114624023, "global_step": 440158, "epoch": 2619} {"train_loss": -12.104353285971142, "global_step": 440159, "epoch": 2619, "val_loss": 305401.625} {"train_loss": -12.217559814453125, "global_step": 440160, "epoch": 2620} {"train_loss": -11.770442008972168, "global_step": 440161, "epoch": 2620} {"train_loss": -11.42470645904541, "global_step": 440162, "epoch": 2620} {"train_loss": -10.915539741516113, "global_step": 440163, "epoch": 2620} {"train_loss": -11.548040390014648, "global_step": 440164, "epoch": 2620} {"train_loss": -11.819601058959961, "global_step": 440165, "epoch": 2620} {"train_loss": -11.554374694824219, "global_step": 440166, "epoch": 2620} {"train_loss": -11.961772918701172, "global_step": 440167, "epoch": 2620} {"train_loss": -11.113971710205078, "global_step": 440168, "epoch": 2620} {"train_loss": -11.573831558227539, "global_step": 440169, "epoch": 2620} {"train_loss": -12.230158805847168, "global_step": 440170, "epoch": 2620} {"train_loss": -11.636847496032715, "global_step": 440171, "epoch": 2620} {"train_loss": -11.91533374786377, "global_step": 440172, "epoch": 2620} {"train_loss": -12.283552169799805, "global_step": 440173, "epoch": 2620} {"train_loss": -12.022838592529297, "global_step": 440174, "epoch": 2620} {"train_loss": -12.608609199523926, "global_step": 440175, "epoch": 2620} {"train_loss": -12.110359191894531, "global_step": 440176, "epoch": 2620} {"train_loss": -12.349888801574707, "global_step": 440177, "epoch": 2620} {"train_loss": -11.991714477539062, "global_step": 440178, "epoch": 2620} {"train_loss": -12.310739517211914, "global_step": 440179, "epoch": 2620} {"train_loss": -12.211784362792969, "global_step": 440180, "epoch": 2620} {"train_loss": -12.284261703491211, "global_step": 440181, "epoch": 2620} {"train_loss": -12.187355995178223, "global_step": 440182, "epoch": 2620} {"train_loss": -12.653901100158691, "global_step": 440183, "epoch": 2620} {"train_loss": -11.997841835021973, "global_step": 440184, "epoch": 2620} {"train_loss": -12.479491233825684, "global_step": 440185, "epoch": 2620} {"train_loss": -12.132654190063477, "global_step": 440186, "epoch": 2620} {"train_loss": -12.086601257324219, "global_step": 440187, "epoch": 2620} {"train_loss": -12.147903442382812, "global_step": 440188, "epoch": 2620} {"train_loss": -12.569051742553711, "global_step": 440189, "epoch": 2620} {"train_loss": -12.259550094604492, "global_step": 440190, "epoch": 2620} {"train_loss": -12.73395824432373, "global_step": 440191, "epoch": 2620} {"train_loss": -12.549428939819336, "global_step": 440192, "epoch": 2620} {"train_loss": -12.39554214477539, "global_step": 440193, "epoch": 2620} {"train_loss": -12.605095863342285, "global_step": 440194, "epoch": 2620} {"train_loss": -12.415155410766602, "global_step": 440195, "epoch": 2620} {"train_loss": -12.574491500854492, "global_step": 440196, "epoch": 2620} {"train_loss": -12.362241744995117, "global_step": 440197, "epoch": 2620} {"train_loss": -12.623188972473145, "global_step": 440198, "epoch": 2620} {"train_loss": -12.736494064331055, "global_step": 440199, "epoch": 2620} {"train_loss": -12.5819091796875, "global_step": 440200, "epoch": 2620} {"train_loss": -12.604381561279297, "global_step": 440201, "epoch": 2620} {"train_loss": -12.504796028137207, "global_step": 440202, "epoch": 2620} {"train_loss": -12.491737365722656, "global_step": 440203, "epoch": 2620} {"train_loss": -12.475582122802734, "global_step": 440204, "epoch": 2620} {"train_loss": -12.57406997680664, "global_step": 440205, "epoch": 2620} {"train_loss": -12.437780380249023, "global_step": 440206, "epoch": 2620} {"train_loss": -12.256135940551758, "global_step": 440207, "epoch": 2620} {"train_loss": -12.501066207885742, "global_step": 440208, "epoch": 2620} {"train_loss": -12.586487770080566, "global_step": 440209, "epoch": 2620} {"train_loss": -12.691018104553223, "global_step": 440210, "epoch": 2620} {"train_loss": -12.546277046203613, "global_step": 440211, "epoch": 2620} {"train_loss": -12.732396125793457, "global_step": 440212, "epoch": 2620} {"train_loss": -12.506790161132812, "global_step": 440213, "epoch": 2620} {"train_loss": -12.493504524230957, "global_step": 440214, "epoch": 2620} {"train_loss": -12.59976577758789, "global_step": 440215, "epoch": 2620} {"train_loss": -12.463425636291504, "global_step": 440216, "epoch": 2620} {"train_loss": -12.669065475463867, "global_step": 440217, "epoch": 2620} {"train_loss": -12.745104789733887, "global_step": 440218, "epoch": 2620} {"train_loss": -12.817776679992676, "global_step": 440219, "epoch": 2620} {"train_loss": -12.692112922668457, "global_step": 440220, "epoch": 2620} {"train_loss": -12.807524681091309, "global_step": 440221, "epoch": 2620} {"train_loss": -12.499013900756836, "global_step": 440222, "epoch": 2620} {"train_loss": -12.673822402954102, "global_step": 440223, "epoch": 2620} {"train_loss": -12.517833709716797, "global_step": 440224, "epoch": 2620} {"train_loss": -12.698413848876953, "global_step": 440225, "epoch": 2620} {"train_loss": -12.701457977294922, "global_step": 440226, "epoch": 2620} {"train_loss": -12.845956802368164, "global_step": 440227, "epoch": 2620} {"train_loss": -12.042572021484375, "global_step": 440228, "epoch": 2620} {"train_loss": -12.389888763427734, "global_step": 440229, "epoch": 2620} {"train_loss": -12.565851211547852, "global_step": 440230, "epoch": 2620} {"train_loss": -12.607278823852539, "global_step": 440231, "epoch": 2620} {"train_loss": -12.569618225097656, "global_step": 440232, "epoch": 2620} {"train_loss": -12.030908584594727, "global_step": 440233, "epoch": 2620} {"train_loss": -12.251893043518066, "global_step": 440234, "epoch": 2620} {"train_loss": -12.815288543701172, "global_step": 440235, "epoch": 2620} {"train_loss": -12.698010444641113, "global_step": 440236, "epoch": 2620} {"train_loss": -12.4669771194458, "global_step": 440237, "epoch": 2620} {"train_loss": -12.243350982666016, "global_step": 440238, "epoch": 2620} {"train_loss": -12.304973602294922, "global_step": 440239, "epoch": 2620} {"train_loss": -12.783631324768066, "global_step": 440240, "epoch": 2620} {"train_loss": -12.343259811401367, "global_step": 440241, "epoch": 2620} {"train_loss": -12.238651275634766, "global_step": 440242, "epoch": 2620} {"train_loss": -12.434303283691406, "global_step": 440243, "epoch": 2620} {"train_loss": -12.884096145629883, "global_step": 440244, "epoch": 2620} {"train_loss": -12.486251831054688, "global_step": 440245, "epoch": 2620} {"train_loss": -12.589500427246094, "global_step": 440246, "epoch": 2620} {"train_loss": -12.584747314453125, "global_step": 440247, "epoch": 2620} {"train_loss": -12.633293151855469, "global_step": 440248, "epoch": 2620} {"train_loss": -12.548728942871094, "global_step": 440249, "epoch": 2620} {"train_loss": -12.681438446044922, "global_step": 440250, "epoch": 2620} {"train_loss": -12.634404182434082, "global_step": 440251, "epoch": 2620} {"train_loss": -13.05426025390625, "global_step": 440252, "epoch": 2620} {"train_loss": -12.655158996582031, "global_step": 440253, "epoch": 2620} {"train_loss": -12.811189651489258, "global_step": 440254, "epoch": 2620} {"train_loss": -12.800833702087402, "global_step": 440255, "epoch": 2620} {"train_loss": -12.971613883972168, "global_step": 440256, "epoch": 2620} {"train_loss": -12.555421829223633, "global_step": 440257, "epoch": 2620} {"train_loss": -12.505415916442871, "global_step": 440258, "epoch": 2620} {"train_loss": -12.524187088012695, "global_step": 440259, "epoch": 2620} {"train_loss": -12.305349349975586, "global_step": 440260, "epoch": 2620} {"train_loss": -12.652402877807617, "global_step": 440261, "epoch": 2620} {"train_loss": -12.573200225830078, "global_step": 440262, "epoch": 2620} {"train_loss": -12.837818145751953, "global_step": 440263, "epoch": 2620} {"train_loss": -12.388826370239258, "global_step": 440264, "epoch": 2620} {"train_loss": -12.54983139038086, "global_step": 440265, "epoch": 2620} {"train_loss": -12.870798110961914, "global_step": 440266, "epoch": 2620} {"train_loss": -12.653549194335938, "global_step": 440267, "epoch": 2620} {"train_loss": -12.412837982177734, "global_step": 440268, "epoch": 2620} {"train_loss": -12.393693923950195, "global_step": 440269, "epoch": 2620} {"train_loss": -12.555196762084961, "global_step": 440270, "epoch": 2620} {"train_loss": -12.466785430908203, "global_step": 440271, "epoch": 2620} {"train_loss": -12.113308906555176, "global_step": 440272, "epoch": 2620} {"train_loss": -10.909276962280273, "global_step": 440273, "epoch": 2620} {"train_loss": -12.085260391235352, "global_step": 440274, "epoch": 2620} {"train_loss": -10.78407096862793, "global_step": 440275, "epoch": 2620} {"train_loss": -11.547089576721191, "global_step": 440276, "epoch": 2620} {"train_loss": -11.554750442504883, "global_step": 440277, "epoch": 2620} {"train_loss": -11.760412216186523, "global_step": 440278, "epoch": 2620} {"train_loss": -12.417007446289062, "global_step": 440279, "epoch": 2620} {"train_loss": -10.718584060668945, "global_step": 440280, "epoch": 2620} {"train_loss": -11.155311584472656, "global_step": 440281, "epoch": 2620} {"train_loss": -12.12442398071289, "global_step": 440282, "epoch": 2620} {"train_loss": -12.728946685791016, "global_step": 440283, "epoch": 2620} {"train_loss": -12.356597900390625, "global_step": 440284, "epoch": 2620} {"train_loss": -11.991086959838867, "global_step": 440285, "epoch": 2620} {"train_loss": -12.6734619140625, "global_step": 440286, "epoch": 2620} {"train_loss": -12.310250282287598, "global_step": 440287, "epoch": 2620} {"train_loss": -11.905302047729492, "global_step": 440288, "epoch": 2620} {"train_loss": -11.681293487548828, "global_step": 440289, "epoch": 2620} {"train_loss": -11.882210731506348, "global_step": 440290, "epoch": 2620} {"train_loss": -11.953201293945312, "global_step": 440291, "epoch": 2620} {"train_loss": -12.39962387084961, "global_step": 440292, "epoch": 2620} {"train_loss": -12.108699798583984, "global_step": 440293, "epoch": 2620} {"train_loss": -11.12030029296875, "global_step": 440294, "epoch": 2620} {"train_loss": -11.388721466064453, "global_step": 440295, "epoch": 2620} {"train_loss": -12.581751823425293, "global_step": 440296, "epoch": 2620} {"train_loss": -11.239816665649414, "global_step": 440297, "epoch": 2620} {"train_loss": -11.961996078491211, "global_step": 440298, "epoch": 2620} {"train_loss": -12.327058792114258, "global_step": 440299, "epoch": 2620} {"train_loss": -11.232237815856934, "global_step": 440300, "epoch": 2620} {"train_loss": -12.028234481811523, "global_step": 440301, "epoch": 2620} {"train_loss": -11.986104965209961, "global_step": 440302, "epoch": 2620} {"train_loss": -11.441370010375977, "global_step": 440303, "epoch": 2620} {"train_loss": -12.619600296020508, "global_step": 440304, "epoch": 2620} {"train_loss": -12.06506061553955, "global_step": 440305, "epoch": 2620} {"train_loss": -12.14207649230957, "global_step": 440306, "epoch": 2620} {"train_loss": -12.429449081420898, "global_step": 440307, "epoch": 2620} {"train_loss": -12.494482040405273, "global_step": 440308, "epoch": 2620} {"train_loss": -11.757964134216309, "global_step": 440309, "epoch": 2620} {"train_loss": -11.770757675170898, "global_step": 440310, "epoch": 2620} {"train_loss": -11.90188217163086, "global_step": 440311, "epoch": 2620} {"train_loss": -11.37186050415039, "global_step": 440312, "epoch": 2620} {"train_loss": -11.847996711730957, "global_step": 440313, "epoch": 2620} {"train_loss": -12.004011154174805, "global_step": 440314, "epoch": 2620} {"train_loss": -11.798982620239258, "global_step": 440315, "epoch": 2620} {"train_loss": -12.289617538452148, "global_step": 440316, "epoch": 2620} {"train_loss": -12.526094436645508, "global_step": 440317, "epoch": 2620} {"train_loss": -11.887922286987305, "global_step": 440318, "epoch": 2620} {"train_loss": -11.610380172729492, "global_step": 440319, "epoch": 2620} {"train_loss": -12.336177825927734, "global_step": 440320, "epoch": 2620} {"train_loss": -12.255067825317383, "global_step": 440321, "epoch": 2620} {"train_loss": -12.260103225708008, "global_step": 440322, "epoch": 2620} {"train_loss": -12.098165512084961, "global_step": 440323, "epoch": 2620} {"train_loss": -12.348247528076172, "global_step": 440324, "epoch": 2620} {"train_loss": -11.928412437438965, "global_step": 440325, "epoch": 2620} {"train_loss": -12.126972198486328, "global_step": 440326, "epoch": 2620} {"train_loss": -12.255375095776149, "global_step": 440327, "epoch": 2620, "val_loss": 311190.34375, "train_action_mse_error": 1.1209856271743774} {"train_loss": -12.142410278320312, "global_step": 440328, "epoch": 2621} {"train_loss": -12.300403594970703, "global_step": 440329, "epoch": 2621} {"train_loss": -12.097107887268066, "global_step": 440330, "epoch": 2621} {"train_loss": -12.288232803344727, "global_step": 440331, "epoch": 2621} {"train_loss": -12.618946075439453, "global_step": 440332, "epoch": 2621} {"train_loss": -11.856886863708496, "global_step": 440333, "epoch": 2621} {"train_loss": -12.5684175491333, "global_step": 440334, "epoch": 2621} {"train_loss": -12.202075958251953, "global_step": 440335, "epoch": 2621} {"train_loss": -11.931413650512695, "global_step": 440336, "epoch": 2621} {"train_loss": -12.651606559753418, "global_step": 440337, "epoch": 2621} {"train_loss": -12.064409255981445, "global_step": 440338, "epoch": 2621} {"train_loss": -12.425573348999023, "global_step": 440339, "epoch": 2621} {"train_loss": -12.451885223388672, "global_step": 440340, "epoch": 2621} {"train_loss": -12.198562622070312, "global_step": 440341, "epoch": 2621} {"train_loss": -12.451581954956055, "global_step": 440342, "epoch": 2621} {"train_loss": -11.920975685119629, "global_step": 440343, "epoch": 2621} {"train_loss": -12.43163013458252, "global_step": 440344, "epoch": 2621} {"train_loss": -11.429697036743164, "global_step": 440345, "epoch": 2621} {"train_loss": -12.170419692993164, "global_step": 440346, "epoch": 2621} {"train_loss": -12.34627628326416, "global_step": 440347, "epoch": 2621} {"train_loss": -11.805095672607422, "global_step": 440348, "epoch": 2621} {"train_loss": -12.266815185546875, "global_step": 440349, "epoch": 2621} {"train_loss": -12.116884231567383, "global_step": 440350, "epoch": 2621} {"train_loss": -12.074760437011719, "global_step": 440351, "epoch": 2621} {"train_loss": -12.67192268371582, "global_step": 440352, "epoch": 2621} {"train_loss": -12.274604797363281, "global_step": 440353, "epoch": 2621} {"train_loss": -12.202898025512695, "global_step": 440354, "epoch": 2621} {"train_loss": -12.465875625610352, "global_step": 440355, "epoch": 2621} {"train_loss": -11.779374122619629, "global_step": 440356, "epoch": 2621} {"train_loss": -12.43681812286377, "global_step": 440357, "epoch": 2621} {"train_loss": -11.393004417419434, "global_step": 440358, "epoch": 2621} {"train_loss": -12.147708892822266, "global_step": 440359, "epoch": 2621} {"train_loss": -12.247841835021973, "global_step": 440360, "epoch": 2621} {"train_loss": -12.418594360351562, "global_step": 440361, "epoch": 2621} {"train_loss": -12.125418663024902, "global_step": 440362, "epoch": 2621} {"train_loss": -12.490103721618652, "global_step": 440363, "epoch": 2621} {"train_loss": -12.226154327392578, "global_step": 440364, "epoch": 2621} {"train_loss": -12.299555778503418, "global_step": 440365, "epoch": 2621} {"train_loss": -11.877355575561523, "global_step": 440366, "epoch": 2621} {"train_loss": -12.362407684326172, "global_step": 440367, "epoch": 2621} {"train_loss": -12.173849105834961, "global_step": 440368, "epoch": 2621} {"train_loss": -12.433778762817383, "global_step": 440369, "epoch": 2621} {"train_loss": -12.419994354248047, "global_step": 440370, "epoch": 2621} {"train_loss": -12.263453483581543, "global_step": 440371, "epoch": 2621} {"train_loss": -12.423334121704102, "global_step": 440372, "epoch": 2621} {"train_loss": -12.21721076965332, "global_step": 440373, "epoch": 2621} {"train_loss": -12.184547424316406, "global_step": 440374, "epoch": 2621} {"train_loss": -12.28939151763916, "global_step": 440375, "epoch": 2621} {"train_loss": -12.232919692993164, "global_step": 440376, "epoch": 2621} {"train_loss": -12.433277130126953, "global_step": 440377, "epoch": 2621} {"train_loss": -12.125017166137695, "global_step": 440378, "epoch": 2621} {"train_loss": -12.28013801574707, "global_step": 440379, "epoch": 2621} {"train_loss": -12.145841598510742, "global_step": 440380, "epoch": 2621} {"train_loss": -12.03718376159668, "global_step": 440381, "epoch": 2621} {"train_loss": -12.523336410522461, "global_step": 440382, "epoch": 2621} {"train_loss": -11.99095344543457, "global_step": 440383, "epoch": 2621} {"train_loss": -11.67257022857666, "global_step": 440384, "epoch": 2621} {"train_loss": -12.498045921325684, "global_step": 440385, "epoch": 2621} {"train_loss": -12.21397590637207, "global_step": 440386, "epoch": 2621} {"train_loss": -10.872749328613281, "global_step": 440387, "epoch": 2621} {"train_loss": -12.255558013916016, "global_step": 440388, "epoch": 2621} {"train_loss": -11.65661334991455, "global_step": 440389, "epoch": 2621} {"train_loss": -12.194868087768555, "global_step": 440390, "epoch": 2621} {"train_loss": -11.981913566589355, "global_step": 440391, "epoch": 2621} {"train_loss": -11.483907699584961, "global_step": 440392, "epoch": 2621} {"train_loss": -12.344842910766602, "global_step": 440393, "epoch": 2621} {"train_loss": -12.083166122436523, "global_step": 440394, "epoch": 2621} {"train_loss": -11.898441314697266, "global_step": 440395, "epoch": 2621} {"train_loss": -11.984211921691895, "global_step": 440396, "epoch": 2621} {"train_loss": -11.968477249145508, "global_step": 440397, "epoch": 2621} {"train_loss": -11.467063903808594, "global_step": 440398, "epoch": 2621} {"train_loss": -12.006589889526367, "global_step": 440399, "epoch": 2621} {"train_loss": -9.964990615844727, "global_step": 440400, "epoch": 2621} {"train_loss": -10.756274223327637, "global_step": 440401, "epoch": 2621} {"train_loss": -11.935107231140137, "global_step": 440402, "epoch": 2621} {"train_loss": -11.300539016723633, "global_step": 440403, "epoch": 2621} {"train_loss": -11.752370834350586, "global_step": 440404, "epoch": 2621} {"train_loss": -10.867132186889648, "global_step": 440405, "epoch": 2621} {"train_loss": -11.511783599853516, "global_step": 440406, "epoch": 2621} {"train_loss": -11.60087776184082, "global_step": 440407, "epoch": 2621} {"train_loss": -11.981786727905273, "global_step": 440408, "epoch": 2621} {"train_loss": -12.05484676361084, "global_step": 440409, "epoch": 2621} {"train_loss": -11.811787605285645, "global_step": 440410, "epoch": 2621} {"train_loss": -11.741083145141602, "global_step": 440411, "epoch": 2621} {"train_loss": -11.879042625427246, "global_step": 440412, "epoch": 2621} {"train_loss": -11.77983283996582, "global_step": 440413, "epoch": 2621} {"train_loss": -12.076532363891602, "global_step": 440414, "epoch": 2621} {"train_loss": -12.400691986083984, "global_step": 440415, "epoch": 2621} {"train_loss": -12.262243270874023, "global_step": 440416, "epoch": 2621} {"train_loss": -12.436483383178711, "global_step": 440417, "epoch": 2621} {"train_loss": -12.081587791442871, "global_step": 440418, "epoch": 2621} {"train_loss": -12.321450233459473, "global_step": 440419, "epoch": 2621} {"train_loss": -12.312085151672363, "global_step": 440420, "epoch": 2621} {"train_loss": -12.46343994140625, "global_step": 440421, "epoch": 2621} {"train_loss": -12.468135833740234, "global_step": 440422, "epoch": 2621} {"train_loss": -12.42182731628418, "global_step": 440423, "epoch": 2621} {"train_loss": -12.594144821166992, "global_step": 440424, "epoch": 2621} {"train_loss": -12.428577423095703, "global_step": 440425, "epoch": 2621} {"train_loss": -12.47085952758789, "global_step": 440426, "epoch": 2621} {"train_loss": -12.5346040725708, "global_step": 440427, "epoch": 2621} {"train_loss": -12.562301635742188, "global_step": 440428, "epoch": 2621} {"train_loss": -12.458078384399414, "global_step": 440429, "epoch": 2621} {"train_loss": -12.60153865814209, "global_step": 440430, "epoch": 2621} {"train_loss": -12.489864349365234, "global_step": 440431, "epoch": 2621} {"train_loss": -12.38174057006836, "global_step": 440432, "epoch": 2621} {"train_loss": -12.64915943145752, "global_step": 440433, "epoch": 2621} {"train_loss": -12.083515167236328, "global_step": 440434, "epoch": 2621} {"train_loss": -12.321423530578613, "global_step": 440435, "epoch": 2621} {"train_loss": -12.527185440063477, "global_step": 440436, "epoch": 2621} {"train_loss": -12.22054386138916, "global_step": 440437, "epoch": 2621} {"train_loss": -12.197952270507812, "global_step": 440438, "epoch": 2621} {"train_loss": -12.486523628234863, "global_step": 440439, "epoch": 2621} {"train_loss": -12.336498260498047, "global_step": 440440, "epoch": 2621} {"train_loss": -12.406200408935547, "global_step": 440441, "epoch": 2621} {"train_loss": -12.302440643310547, "global_step": 440442, "epoch": 2621} {"train_loss": -12.534988403320312, "global_step": 440443, "epoch": 2621} {"train_loss": -12.52193832397461, "global_step": 440444, "epoch": 2621} {"train_loss": -12.068951606750488, "global_step": 440445, "epoch": 2621} {"train_loss": -12.791725158691406, "global_step": 440446, "epoch": 2621} {"train_loss": -12.430207252502441, "global_step": 440447, "epoch": 2621} {"train_loss": -12.531177520751953, "global_step": 440448, "epoch": 2621} {"train_loss": -12.647369384765625, "global_step": 440449, "epoch": 2621} {"train_loss": -12.689186096191406, "global_step": 440450, "epoch": 2621} {"train_loss": -12.679567337036133, "global_step": 440451, "epoch": 2621} {"train_loss": -12.578988075256348, "global_step": 440452, "epoch": 2621} {"train_loss": -12.551056861877441, "global_step": 440453, "epoch": 2621} {"train_loss": -12.644744873046875, "global_step": 440454, "epoch": 2621} {"train_loss": -12.795684814453125, "global_step": 440455, "epoch": 2621} {"train_loss": -12.410415649414062, "global_step": 440456, "epoch": 2621} {"train_loss": -12.596292495727539, "global_step": 440457, "epoch": 2621} {"train_loss": -12.612737655639648, "global_step": 440458, "epoch": 2621} {"train_loss": -12.628547668457031, "global_step": 440459, "epoch": 2621} {"train_loss": -12.630880355834961, "global_step": 440460, "epoch": 2621} {"train_loss": -12.391454696655273, "global_step": 440461, "epoch": 2621} {"train_loss": -12.501493453979492, "global_step": 440462, "epoch": 2621} {"train_loss": -12.548433303833008, "global_step": 440463, "epoch": 2621} {"train_loss": -12.840288162231445, "global_step": 440464, "epoch": 2621} {"train_loss": -12.805320739746094, "global_step": 440465, "epoch": 2621} {"train_loss": -12.673807144165039, "global_step": 440466, "epoch": 2621} {"train_loss": -12.680500030517578, "global_step": 440467, "epoch": 2621} {"train_loss": -12.585002899169922, "global_step": 440468, "epoch": 2621} {"train_loss": -12.631624221801758, "global_step": 440469, "epoch": 2621} {"train_loss": -12.499911308288574, "global_step": 440470, "epoch": 2621} {"train_loss": -12.335467338562012, "global_step": 440471, "epoch": 2621} {"train_loss": -12.438919067382812, "global_step": 440472, "epoch": 2621} {"train_loss": -12.310609817504883, "global_step": 440473, "epoch": 2621} {"train_loss": -12.37101936340332, "global_step": 440474, "epoch": 2621} {"train_loss": -11.985466003417969, "global_step": 440475, "epoch": 2621} {"train_loss": -10.744565963745117, "global_step": 440476, "epoch": 2621} {"train_loss": -12.068290710449219, "global_step": 440477, "epoch": 2621} {"train_loss": -10.995490074157715, "global_step": 440478, "epoch": 2621} {"train_loss": -9.885830879211426, "global_step": 440479, "epoch": 2621} {"train_loss": -10.640905380249023, "global_step": 440480, "epoch": 2621} {"train_loss": -9.774248123168945, "global_step": 440481, "epoch": 2621} {"train_loss": -10.494913101196289, "global_step": 440482, "epoch": 2621} {"train_loss": -9.796140670776367, "global_step": 440483, "epoch": 2621} {"train_loss": -11.057958602905273, "global_step": 440484, "epoch": 2621} {"train_loss": -10.831684112548828, "global_step": 440485, "epoch": 2621} {"train_loss": -9.912887573242188, "global_step": 440486, "epoch": 2621} {"train_loss": -11.53066635131836, "global_step": 440487, "epoch": 2621} {"train_loss": -9.55575180053711, "global_step": 440488, "epoch": 2621} {"train_loss": -11.202646255493164, "global_step": 440489, "epoch": 2621} {"train_loss": -10.49046516418457, "global_step": 440490, "epoch": 2621} {"train_loss": -10.962042808532715, "global_step": 440491, "epoch": 2621} {"train_loss": -11.08978271484375, "global_step": 440492, "epoch": 2621} {"train_loss": -10.324904441833496, "global_step": 440493, "epoch": 2621} {"train_loss": -11.730767250061035, "global_step": 440494, "epoch": 2621} {"train_loss": -12.041571912311372, "global_step": 440495, "epoch": 2621, "val_loss": 311477.0} {"train_loss": -10.806978225708008, "global_step": 440496, "epoch": 2622} {"train_loss": -11.820435523986816, "global_step": 440497, "epoch": 2622} {"train_loss": -10.992215156555176, "global_step": 440498, "epoch": 2622} {"train_loss": -11.656415939331055, "global_step": 440499, "epoch": 2622} {"train_loss": -11.16872787475586, "global_step": 440500, "epoch": 2622} {"train_loss": -11.325016021728516, "global_step": 440501, "epoch": 2622} {"train_loss": -12.254892349243164, "global_step": 440502, "epoch": 2622} {"train_loss": -10.437211990356445, "global_step": 440503, "epoch": 2622} {"train_loss": -12.316949844360352, "global_step": 440504, "epoch": 2622} {"train_loss": -10.837332725524902, "global_step": 440505, "epoch": 2622} {"train_loss": -11.933965682983398, "global_step": 440506, "epoch": 2622} {"train_loss": -11.443548202514648, "global_step": 440507, "epoch": 2622} {"train_loss": -11.385808944702148, "global_step": 440508, "epoch": 2622} {"train_loss": -11.673044204711914, "global_step": 440509, "epoch": 2622} {"train_loss": -11.111579895019531, "global_step": 440510, "epoch": 2622} {"train_loss": -12.037247657775879, "global_step": 440511, "epoch": 2622} {"train_loss": -11.331047058105469, "global_step": 440512, "epoch": 2622} {"train_loss": -11.828629493713379, "global_step": 440513, "epoch": 2622} {"train_loss": -11.558853149414062, "global_step": 440514, "epoch": 2622} {"train_loss": -12.07707405090332, "global_step": 440515, "epoch": 2622} {"train_loss": -11.725074768066406, "global_step": 440516, "epoch": 2622} {"train_loss": -11.875423431396484, "global_step": 440517, "epoch": 2622} {"train_loss": -11.809906959533691, "global_step": 440518, "epoch": 2622} {"train_loss": -12.265583992004395, "global_step": 440519, "epoch": 2622} {"train_loss": -11.74662971496582, "global_step": 440520, "epoch": 2622} {"train_loss": -12.350675582885742, "global_step": 440521, "epoch": 2622} {"train_loss": -11.733001708984375, "global_step": 440522, "epoch": 2622} {"train_loss": -11.933359146118164, "global_step": 440523, "epoch": 2622} {"train_loss": -12.044519424438477, "global_step": 440524, "epoch": 2622} {"train_loss": -11.858051300048828, "global_step": 440525, "epoch": 2622} {"train_loss": -11.916696548461914, "global_step": 440526, "epoch": 2622} {"train_loss": -12.127189636230469, "global_step": 440527, "epoch": 2622} {"train_loss": -11.330717086791992, "global_step": 440528, "epoch": 2622} {"train_loss": -12.628872871398926, "global_step": 440529, "epoch": 2622} {"train_loss": -12.134779930114746, "global_step": 440530, "epoch": 2622} {"train_loss": -12.28271198272705, "global_step": 440531, "epoch": 2622} {"train_loss": -12.095422744750977, "global_step": 440532, "epoch": 2622} {"train_loss": -12.12208366394043, "global_step": 440533, "epoch": 2622} {"train_loss": -12.5224609375, "global_step": 440534, "epoch": 2622} {"train_loss": -12.06479263305664, "global_step": 440535, "epoch": 2622} {"train_loss": -12.269186973571777, "global_step": 440536, "epoch": 2622} {"train_loss": -12.236725807189941, "global_step": 440537, "epoch": 2622} {"train_loss": -12.347626686096191, "global_step": 440538, "epoch": 2622} {"train_loss": -12.26272201538086, "global_step": 440539, "epoch": 2622} {"train_loss": -12.355602264404297, "global_step": 440540, "epoch": 2622} {"train_loss": -12.358028411865234, "global_step": 440541, "epoch": 2622} {"train_loss": -12.482611656188965, "global_step": 440542, "epoch": 2622} {"train_loss": -12.436726570129395, "global_step": 440543, "epoch": 2622} {"train_loss": -12.696548461914062, "global_step": 440544, "epoch": 2622} {"train_loss": -12.614053726196289, "global_step": 440545, "epoch": 2622} {"train_loss": -12.618274688720703, "global_step": 440546, "epoch": 2622} {"train_loss": -12.688655853271484, "global_step": 440547, "epoch": 2622} {"train_loss": -12.593564987182617, "global_step": 440548, "epoch": 2622} {"train_loss": -12.691225051879883, "global_step": 440549, "epoch": 2622} {"train_loss": -12.536279678344727, "global_step": 440550, "epoch": 2622} {"train_loss": -12.659982681274414, "global_step": 440551, "epoch": 2622} {"train_loss": -12.621309280395508, "global_step": 440552, "epoch": 2622} {"train_loss": -12.611669540405273, "global_step": 440553, "epoch": 2622} {"train_loss": -12.611422538757324, "global_step": 440554, "epoch": 2622} {"train_loss": -12.582412719726562, "global_step": 440555, "epoch": 2622} {"train_loss": -12.528088569641113, "global_step": 440556, "epoch": 2622} {"train_loss": -12.628353118896484, "global_step": 440557, "epoch": 2622} {"train_loss": -12.391737937927246, "global_step": 440558, "epoch": 2622} {"train_loss": -12.524410247802734, "global_step": 440559, "epoch": 2622} {"train_loss": -12.494421005249023, "global_step": 440560, "epoch": 2622} {"train_loss": -12.927820205688477, "global_step": 440561, "epoch": 2622} {"train_loss": -12.561025619506836, "global_step": 440562, "epoch": 2622} {"train_loss": -12.608161926269531, "global_step": 440563, "epoch": 2622} {"train_loss": -12.685897827148438, "global_step": 440564, "epoch": 2622} {"train_loss": -12.664648056030273, "global_step": 440565, "epoch": 2622} {"train_loss": -12.676795959472656, "global_step": 440566, "epoch": 2622} {"train_loss": -12.66754150390625, "global_step": 440567, "epoch": 2622} {"train_loss": -12.789851188659668, "global_step": 440568, "epoch": 2622} {"train_loss": -12.487789154052734, "global_step": 440569, "epoch": 2622} {"train_loss": -12.714590072631836, "global_step": 440570, "epoch": 2622} {"train_loss": -12.623831748962402, "global_step": 440571, "epoch": 2622} {"train_loss": -12.654783248901367, "global_step": 440572, "epoch": 2622} {"train_loss": -12.494976043701172, "global_step": 440573, "epoch": 2622} {"train_loss": -12.685359954833984, "global_step": 440574, "epoch": 2622} {"train_loss": -12.669668197631836, "global_step": 440575, "epoch": 2622} {"train_loss": -12.813782691955566, "global_step": 440576, "epoch": 2622} {"train_loss": -12.829071044921875, "global_step": 440577, "epoch": 2622} {"train_loss": -12.523748397827148, "global_step": 440578, "epoch": 2622} {"train_loss": -12.535211563110352, "global_step": 440579, "epoch": 2622} {"train_loss": -12.47091293334961, "global_step": 440580, "epoch": 2622} {"train_loss": -12.675061225891113, "global_step": 440581, "epoch": 2622} {"train_loss": -12.618965148925781, "global_step": 440582, "epoch": 2622} {"train_loss": -12.582745552062988, "global_step": 440583, "epoch": 2622} {"train_loss": -12.754302978515625, "global_step": 440584, "epoch": 2622} {"train_loss": -12.734169006347656, "global_step": 440585, "epoch": 2622} {"train_loss": -12.962108612060547, "global_step": 440586, "epoch": 2622} {"train_loss": -12.652364730834961, "global_step": 440587, "epoch": 2622} {"train_loss": -12.754753112792969, "global_step": 440588, "epoch": 2622} {"train_loss": -12.564844131469727, "global_step": 440589, "epoch": 2622} {"train_loss": -12.631301879882812, "global_step": 440590, "epoch": 2622} {"train_loss": -12.055194854736328, "global_step": 440591, "epoch": 2622} {"train_loss": -12.848465919494629, "global_step": 440592, "epoch": 2622} {"train_loss": -12.404364585876465, "global_step": 440593, "epoch": 2622} {"train_loss": -12.748001098632812, "global_step": 440594, "epoch": 2622} {"train_loss": -12.346607208251953, "global_step": 440595, "epoch": 2622} {"train_loss": -12.54210376739502, "global_step": 440596, "epoch": 2622} {"train_loss": -12.514986038208008, "global_step": 440597, "epoch": 2622} {"train_loss": -12.714326858520508, "global_step": 440598, "epoch": 2622} {"train_loss": -12.345094680786133, "global_step": 440599, "epoch": 2622} {"train_loss": -12.379205703735352, "global_step": 440600, "epoch": 2622} {"train_loss": -12.688276290893555, "global_step": 440601, "epoch": 2622} {"train_loss": -12.154857635498047, "global_step": 440602, "epoch": 2622} {"train_loss": -12.17121410369873, "global_step": 440603, "epoch": 2622} {"train_loss": -12.368450164794922, "global_step": 440604, "epoch": 2622} {"train_loss": -12.512088775634766, "global_step": 440605, "epoch": 2622} {"train_loss": -12.362297058105469, "global_step": 440606, "epoch": 2622} {"train_loss": -12.359518051147461, "global_step": 440607, "epoch": 2622} {"train_loss": -12.46568489074707, "global_step": 440608, "epoch": 2622} {"train_loss": -12.10992431640625, "global_step": 440609, "epoch": 2622} {"train_loss": -12.420625686645508, "global_step": 440610, "epoch": 2622} {"train_loss": -12.279369354248047, "global_step": 440611, "epoch": 2622} {"train_loss": -12.001328468322754, "global_step": 440612, "epoch": 2622} {"train_loss": -12.622504234313965, "global_step": 440613, "epoch": 2622} {"train_loss": -12.124363899230957, "global_step": 440614, "epoch": 2622} {"train_loss": -12.593047142028809, "global_step": 440615, "epoch": 2622} {"train_loss": -12.87031364440918, "global_step": 440616, "epoch": 2622} {"train_loss": -12.669296264648438, "global_step": 440617, "epoch": 2622} {"train_loss": -12.391246795654297, "global_step": 440618, "epoch": 2622} {"train_loss": -12.820428848266602, "global_step": 440619, "epoch": 2622} {"train_loss": -12.554235458374023, "global_step": 440620, "epoch": 2622} {"train_loss": -12.486248016357422, "global_step": 440621, "epoch": 2622} {"train_loss": -12.842655181884766, "global_step": 440622, "epoch": 2622} {"train_loss": -12.694330215454102, "global_step": 440623, "epoch": 2622} {"train_loss": -12.576547622680664, "global_step": 440624, "epoch": 2622} {"train_loss": -12.71379280090332, "global_step": 440625, "epoch": 2622} {"train_loss": -12.862302780151367, "global_step": 440626, "epoch": 2622} {"train_loss": -12.28077507019043, "global_step": 440627, "epoch": 2622} {"train_loss": -12.78692626953125, "global_step": 440628, "epoch": 2622} {"train_loss": -12.57708740234375, "global_step": 440629, "epoch": 2622} {"train_loss": -12.089221954345703, "global_step": 440630, "epoch": 2622} {"train_loss": -12.635683059692383, "global_step": 440631, "epoch": 2622} {"train_loss": -12.489288330078125, "global_step": 440632, "epoch": 2622} {"train_loss": -11.792152404785156, "global_step": 440633, "epoch": 2622} {"train_loss": -12.484099388122559, "global_step": 440634, "epoch": 2622} {"train_loss": -12.531176567077637, "global_step": 440635, "epoch": 2622} {"train_loss": -12.471902847290039, "global_step": 440636, "epoch": 2622} {"train_loss": -12.482413291931152, "global_step": 440637, "epoch": 2622} {"train_loss": -12.968664169311523, "global_step": 440638, "epoch": 2622} {"train_loss": -12.301719665527344, "global_step": 440639, "epoch": 2622} {"train_loss": -12.45561408996582, "global_step": 440640, "epoch": 2622} {"train_loss": -12.82429313659668, "global_step": 440641, "epoch": 2622} {"train_loss": -12.245853424072266, "global_step": 440642, "epoch": 2622} {"train_loss": -11.914895057678223, "global_step": 440643, "epoch": 2622} {"train_loss": -12.145048141479492, "global_step": 440644, "epoch": 2622} {"train_loss": -12.406261444091797, "global_step": 440645, "epoch": 2622} {"train_loss": -12.414541244506836, "global_step": 440646, "epoch": 2622} {"train_loss": -12.767165184020996, "global_step": 440647, "epoch": 2622} {"train_loss": -12.656840324401855, "global_step": 440648, "epoch": 2622} {"train_loss": -12.277816772460938, "global_step": 440649, "epoch": 2622} {"train_loss": -11.951348304748535, "global_step": 440650, "epoch": 2622} {"train_loss": -12.37849235534668, "global_step": 440651, "epoch": 2622} {"train_loss": -12.292318344116211, "global_step": 440652, "epoch": 2622} {"train_loss": -12.142133712768555, "global_step": 440653, "epoch": 2622} {"train_loss": -11.803557395935059, "global_step": 440654, "epoch": 2622} {"train_loss": -12.704317092895508, "global_step": 440655, "epoch": 2622} {"train_loss": -12.1922607421875, "global_step": 440656, "epoch": 2622} {"train_loss": -12.398401260375977, "global_step": 440657, "epoch": 2622} {"train_loss": -11.788740158081055, "global_step": 440658, "epoch": 2622} {"train_loss": -12.111227989196777, "global_step": 440659, "epoch": 2622} {"train_loss": -11.448756217956543, "global_step": 440660, "epoch": 2622} {"train_loss": -11.063884735107422, "global_step": 440661, "epoch": 2622} {"train_loss": -11.011037826538086, "global_step": 440662, "epoch": 2622} {"train_loss": -12.285227202233814, "global_step": 440663, "epoch": 2622, "val_loss": 312648.40625} {"train_loss": -9.323168754577637, "global_step": 440664, "epoch": 2623} {"train_loss": -9.45680046081543, "global_step": 440665, "epoch": 2623} {"train_loss": -10.413758277893066, "global_step": 440666, "epoch": 2623} {"train_loss": -10.43362808227539, "global_step": 440667, "epoch": 2623} {"train_loss": -10.395362854003906, "global_step": 440668, "epoch": 2623} {"train_loss": -9.68492317199707, "global_step": 440669, "epoch": 2623} {"train_loss": -10.745786666870117, "global_step": 440670, "epoch": 2623} {"train_loss": -11.12149429321289, "global_step": 440671, "epoch": 2623} {"train_loss": -9.778590202331543, "global_step": 440672, "epoch": 2623} {"train_loss": -9.980823516845703, "global_step": 440673, "epoch": 2623} {"train_loss": -9.36630630493164, "global_step": 440674, "epoch": 2623} {"train_loss": -8.931083679199219, "global_step": 440675, "epoch": 2623} {"train_loss": -10.394631385803223, "global_step": 440676, "epoch": 2623} {"train_loss": -10.294822692871094, "global_step": 440677, "epoch": 2623} {"train_loss": -11.491329193115234, "global_step": 440678, "epoch": 2623} {"train_loss": -10.564891815185547, "global_step": 440679, "epoch": 2623} {"train_loss": -10.621987342834473, "global_step": 440680, "epoch": 2623} {"train_loss": -10.223811149597168, "global_step": 440681, "epoch": 2623} {"train_loss": -10.344757080078125, "global_step": 440682, "epoch": 2623} {"train_loss": -10.482283592224121, "global_step": 440683, "epoch": 2623} {"train_loss": -11.003730773925781, "global_step": 440684, "epoch": 2623} {"train_loss": -11.537074089050293, "global_step": 440685, "epoch": 2623} {"train_loss": -10.422966003417969, "global_step": 440686, "epoch": 2623} {"train_loss": -11.288261413574219, "global_step": 440687, "epoch": 2623} {"train_loss": -10.841086387634277, "global_step": 440688, "epoch": 2623} {"train_loss": -12.216058731079102, "global_step": 440689, "epoch": 2623} {"train_loss": -11.192924499511719, "global_step": 440690, "epoch": 2623} {"train_loss": -11.97553825378418, "global_step": 440691, "epoch": 2623} {"train_loss": -11.367301940917969, "global_step": 440692, "epoch": 2623} {"train_loss": -11.82758903503418, "global_step": 440693, "epoch": 2623} {"train_loss": -11.995555877685547, "global_step": 440694, "epoch": 2623} {"train_loss": -11.81734848022461, "global_step": 440695, "epoch": 2623} {"train_loss": -11.732709884643555, "global_step": 440696, "epoch": 2623} {"train_loss": -11.996337890625, "global_step": 440697, "epoch": 2623} {"train_loss": -12.044849395751953, "global_step": 440698, "epoch": 2623} {"train_loss": -12.388229370117188, "global_step": 440699, "epoch": 2623} {"train_loss": -12.579488754272461, "global_step": 440700, "epoch": 2623} {"train_loss": -11.990363121032715, "global_step": 440701, "epoch": 2623} {"train_loss": -12.36495590209961, "global_step": 440702, "epoch": 2623} {"train_loss": -12.33303451538086, "global_step": 440703, "epoch": 2623} {"train_loss": -12.340644836425781, "global_step": 440704, "epoch": 2623} {"train_loss": -12.317377090454102, "global_step": 440705, "epoch": 2623} {"train_loss": -12.444624900817871, "global_step": 440706, "epoch": 2623} {"train_loss": -12.260507583618164, "global_step": 440707, "epoch": 2623} {"train_loss": -12.30084228515625, "global_step": 440708, "epoch": 2623} {"train_loss": -12.450824737548828, "global_step": 440709, "epoch": 2623} {"train_loss": -11.855550765991211, "global_step": 440710, "epoch": 2623} {"train_loss": -12.632492065429688, "global_step": 440711, "epoch": 2623} {"train_loss": -12.451465606689453, "global_step": 440712, "epoch": 2623} {"train_loss": -12.293859481811523, "global_step": 440713, "epoch": 2623} {"train_loss": -12.41793441772461, "global_step": 440714, "epoch": 2623} {"train_loss": -12.042889595031738, "global_step": 440715, "epoch": 2623} {"train_loss": -12.45905876159668, "global_step": 440716, "epoch": 2623} {"train_loss": -12.34477424621582, "global_step": 440717, "epoch": 2623} {"train_loss": -12.383269309997559, "global_step": 440718, "epoch": 2623} {"train_loss": -12.517045974731445, "global_step": 440719, "epoch": 2623} {"train_loss": -12.526897430419922, "global_step": 440720, "epoch": 2623} {"train_loss": -12.706329345703125, "global_step": 440721, "epoch": 2623} {"train_loss": -12.443424224853516, "global_step": 440722, "epoch": 2623} {"train_loss": -12.554460525512695, "global_step": 440723, "epoch": 2623} {"train_loss": -12.833510398864746, "global_step": 440724, "epoch": 2623} {"train_loss": -12.512445449829102, "global_step": 440725, "epoch": 2623} {"train_loss": -12.6682710647583, "global_step": 440726, "epoch": 2623} {"train_loss": -12.611701011657715, "global_step": 440727, "epoch": 2623} {"train_loss": -12.500974655151367, "global_step": 440728, "epoch": 2623} {"train_loss": -12.775087356567383, "global_step": 440729, "epoch": 2623} {"train_loss": -12.311256408691406, "global_step": 440730, "epoch": 2623} {"train_loss": -12.73796558380127, "global_step": 440731, "epoch": 2623} {"train_loss": -12.30099868774414, "global_step": 440732, "epoch": 2623} {"train_loss": -12.559066772460938, "global_step": 440733, "epoch": 2623} {"train_loss": -12.565239906311035, "global_step": 440734, "epoch": 2623} {"train_loss": -12.414172172546387, "global_step": 440735, "epoch": 2623} {"train_loss": -12.541997909545898, "global_step": 440736, "epoch": 2623} {"train_loss": -12.660400390625, "global_step": 440737, "epoch": 2623} {"train_loss": -12.716829299926758, "global_step": 440738, "epoch": 2623} {"train_loss": -12.85743522644043, "global_step": 440739, "epoch": 2623} {"train_loss": -12.383727073669434, "global_step": 440740, "epoch": 2623} {"train_loss": -12.487467765808105, "global_step": 440741, "epoch": 2623} {"train_loss": -11.887001991271973, "global_step": 440742, "epoch": 2623} {"train_loss": -12.348621368408203, "global_step": 440743, "epoch": 2623} {"train_loss": -12.619731903076172, "global_step": 440744, "epoch": 2623} {"train_loss": -12.182367324829102, "global_step": 440745, "epoch": 2623} {"train_loss": -12.476739883422852, "global_step": 440746, "epoch": 2623} {"train_loss": -12.159523010253906, "global_step": 440747, "epoch": 2623} {"train_loss": -11.673795700073242, "global_step": 440748, "epoch": 2623} {"train_loss": -12.119638442993164, "global_step": 440749, "epoch": 2623} {"train_loss": -12.32713508605957, "global_step": 440750, "epoch": 2623} {"train_loss": -12.477416038513184, "global_step": 440751, "epoch": 2623} {"train_loss": -12.488090515136719, "global_step": 440752, "epoch": 2623} {"train_loss": -12.330486297607422, "global_step": 440753, "epoch": 2623} {"train_loss": -12.462318420410156, "global_step": 440754, "epoch": 2623} {"train_loss": -12.416074752807617, "global_step": 440755, "epoch": 2623} {"train_loss": -12.684808731079102, "global_step": 440756, "epoch": 2623} {"train_loss": -12.39889144897461, "global_step": 440757, "epoch": 2623} {"train_loss": -12.626728057861328, "global_step": 440758, "epoch": 2623} {"train_loss": -12.798179626464844, "global_step": 440759, "epoch": 2623} {"train_loss": -12.306467056274414, "global_step": 440760, "epoch": 2623} {"train_loss": -12.707561492919922, "global_step": 440761, "epoch": 2623} {"train_loss": -12.50526237487793, "global_step": 440762, "epoch": 2623} {"train_loss": -12.601278305053711, "global_step": 440763, "epoch": 2623} {"train_loss": -12.621232032775879, "global_step": 440764, "epoch": 2623} {"train_loss": -12.694475173950195, "global_step": 440765, "epoch": 2623} {"train_loss": -12.59721565246582, "global_step": 440766, "epoch": 2623} {"train_loss": -12.699191093444824, "global_step": 440767, "epoch": 2623} {"train_loss": -12.793771743774414, "global_step": 440768, "epoch": 2623} {"train_loss": -12.629372596740723, "global_step": 440769, "epoch": 2623} {"train_loss": -12.779402732849121, "global_step": 440770, "epoch": 2623} {"train_loss": -12.613937377929688, "global_step": 440771, "epoch": 2623} {"train_loss": -12.925254821777344, "global_step": 440772, "epoch": 2623} {"train_loss": -12.680087089538574, "global_step": 440773, "epoch": 2623} {"train_loss": -13.01609992980957, "global_step": 440774, "epoch": 2623} {"train_loss": -12.541354179382324, "global_step": 440775, "epoch": 2623} {"train_loss": -12.538546562194824, "global_step": 440776, "epoch": 2623} {"train_loss": -12.5812349319458, "global_step": 440777, "epoch": 2623} {"train_loss": -12.578660011291504, "global_step": 440778, "epoch": 2623} {"train_loss": -12.616629600524902, "global_step": 440779, "epoch": 2623} {"train_loss": -12.309738159179688, "global_step": 440780, "epoch": 2623} {"train_loss": -12.76522445678711, "global_step": 440781, "epoch": 2623} {"train_loss": -12.485485076904297, "global_step": 440782, "epoch": 2623} {"train_loss": -13.02081298828125, "global_step": 440783, "epoch": 2623} {"train_loss": -12.225787162780762, "global_step": 440784, "epoch": 2623} {"train_loss": -12.32246208190918, "global_step": 440785, "epoch": 2623} {"train_loss": -12.83144760131836, "global_step": 440786, "epoch": 2623} {"train_loss": -12.285619735717773, "global_step": 440787, "epoch": 2623} {"train_loss": -12.384469032287598, "global_step": 440788, "epoch": 2623} {"train_loss": -12.429563522338867, "global_step": 440789, "epoch": 2623} {"train_loss": -12.171735763549805, "global_step": 440790, "epoch": 2623} {"train_loss": -12.280555725097656, "global_step": 440791, "epoch": 2623} {"train_loss": -12.494550704956055, "global_step": 440792, "epoch": 2623} {"train_loss": -12.354219436645508, "global_step": 440793, "epoch": 2623} {"train_loss": -11.536409378051758, "global_step": 440794, "epoch": 2623} {"train_loss": -12.364486694335938, "global_step": 440795, "epoch": 2623} {"train_loss": -12.417581558227539, "global_step": 440796, "epoch": 2623} {"train_loss": -12.127567291259766, "global_step": 440797, "epoch": 2623} {"train_loss": -12.25674057006836, "global_step": 440798, "epoch": 2623} {"train_loss": -12.306083679199219, "global_step": 440799, "epoch": 2623} {"train_loss": -12.10666561126709, "global_step": 440800, "epoch": 2623} {"train_loss": -12.343378067016602, "global_step": 440801, "epoch": 2623} {"train_loss": -11.901509284973145, "global_step": 440802, "epoch": 2623} {"train_loss": -12.39551067352295, "global_step": 440803, "epoch": 2623} {"train_loss": -11.80716609954834, "global_step": 440804, "epoch": 2623} {"train_loss": -12.259225845336914, "global_step": 440805, "epoch": 2623} {"train_loss": -12.135917663574219, "global_step": 440806, "epoch": 2623} {"train_loss": -12.444283485412598, "global_step": 440807, "epoch": 2623} {"train_loss": -12.298064231872559, "global_step": 440808, "epoch": 2623} {"train_loss": -12.352093696594238, "global_step": 440809, "epoch": 2623} {"train_loss": -12.242929458618164, "global_step": 440810, "epoch": 2623} {"train_loss": -12.41749095916748, "global_step": 440811, "epoch": 2623} {"train_loss": -11.942290306091309, "global_step": 440812, "epoch": 2623} {"train_loss": -11.898687362670898, "global_step": 440813, "epoch": 2623} {"train_loss": -12.327638626098633, "global_step": 440814, "epoch": 2623} {"train_loss": -11.851852416992188, "global_step": 440815, "epoch": 2623} {"train_loss": -12.649604797363281, "global_step": 440816, "epoch": 2623} {"train_loss": -11.898022651672363, "global_step": 440817, "epoch": 2623} {"train_loss": -11.907072067260742, "global_step": 440818, "epoch": 2623} {"train_loss": -11.700773239135742, "global_step": 440819, "epoch": 2623} {"train_loss": -11.494473457336426, "global_step": 440820, "epoch": 2623} {"train_loss": -12.352962493896484, "global_step": 440821, "epoch": 2623} {"train_loss": -11.586288452148438, "global_step": 440822, "epoch": 2623} {"train_loss": -11.419955253601074, "global_step": 440823, "epoch": 2623} {"train_loss": -12.34768295288086, "global_step": 440824, "epoch": 2623} {"train_loss": -11.114370346069336, "global_step": 440825, "epoch": 2623} {"train_loss": -11.612157821655273, "global_step": 440826, "epoch": 2623} {"train_loss": -11.685461044311523, "global_step": 440827, "epoch": 2623} {"train_loss": -11.472577095031738, "global_step": 440828, "epoch": 2623} {"train_loss": -10.752969741821289, "global_step": 440829, "epoch": 2623} {"train_loss": -11.583991050720215, "global_step": 440830, "epoch": 2623} {"train_loss": -12.013747550192333, "global_step": 440831, "epoch": 2623, "val_loss": 312550.59375} {"train_loss": -11.468587875366211, "global_step": 440832, "epoch": 2624} {"train_loss": -12.086084365844727, "global_step": 440833, "epoch": 2624} {"train_loss": -11.853241920471191, "global_step": 440834, "epoch": 2624} {"train_loss": -11.258821487426758, "global_step": 440835, "epoch": 2624} {"train_loss": -11.94296646118164, "global_step": 440836, "epoch": 2624} {"train_loss": -12.229110717773438, "global_step": 440837, "epoch": 2624} {"train_loss": -11.68255615234375, "global_step": 440838, "epoch": 2624} {"train_loss": -12.103743553161621, "global_step": 440839, "epoch": 2624} {"train_loss": -12.030878067016602, "global_step": 440840, "epoch": 2624} {"train_loss": -12.124004364013672, "global_step": 440841, "epoch": 2624} {"train_loss": -11.991098403930664, "global_step": 440842, "epoch": 2624} {"train_loss": -11.768040657043457, "global_step": 440843, "epoch": 2624} {"train_loss": -12.066545486450195, "global_step": 440844, "epoch": 2624} {"train_loss": -12.079331398010254, "global_step": 440845, "epoch": 2624} {"train_loss": -12.198572158813477, "global_step": 440846, "epoch": 2624} {"train_loss": -12.409050941467285, "global_step": 440847, "epoch": 2624} {"train_loss": -12.319631576538086, "global_step": 440848, "epoch": 2624} {"train_loss": -12.16604232788086, "global_step": 440849, "epoch": 2624} {"train_loss": -12.127466201782227, "global_step": 440850, "epoch": 2624} {"train_loss": -11.995030403137207, "global_step": 440851, "epoch": 2624} {"train_loss": -12.053801536560059, "global_step": 440852, "epoch": 2624} {"train_loss": -11.949277877807617, "global_step": 440853, "epoch": 2624} {"train_loss": -11.974055290222168, "global_step": 440854, "epoch": 2624} {"train_loss": -12.322053909301758, "global_step": 440855, "epoch": 2624} {"train_loss": -12.12841796875, "global_step": 440856, "epoch": 2624} {"train_loss": -12.62955379486084, "global_step": 440857, "epoch": 2624} {"train_loss": -11.935049057006836, "global_step": 440858, "epoch": 2624} {"train_loss": -12.442407608032227, "global_step": 440859, "epoch": 2624} {"train_loss": -12.180447578430176, "global_step": 440860, "epoch": 2624} {"train_loss": -12.06325912475586, "global_step": 440861, "epoch": 2624} {"train_loss": -12.090083122253418, "global_step": 440862, "epoch": 2624} {"train_loss": -12.385704040527344, "global_step": 440863, "epoch": 2624} {"train_loss": -12.356019020080566, "global_step": 440864, "epoch": 2624} {"train_loss": -12.114262580871582, "global_step": 440865, "epoch": 2624} {"train_loss": -12.092025756835938, "global_step": 440866, "epoch": 2624} {"train_loss": -12.348291397094727, "global_step": 440867, "epoch": 2624} {"train_loss": -12.197881698608398, "global_step": 440868, "epoch": 2624} {"train_loss": -12.143045425415039, "global_step": 440869, "epoch": 2624} {"train_loss": -12.320442199707031, "global_step": 440870, "epoch": 2624} {"train_loss": -12.673110961914062, "global_step": 440871, "epoch": 2624} {"train_loss": -12.267471313476562, "global_step": 440872, "epoch": 2624} {"train_loss": -12.19952392578125, "global_step": 440873, "epoch": 2624} {"train_loss": -12.472272872924805, "global_step": 440874, "epoch": 2624} {"train_loss": -12.851184844970703, "global_step": 440875, "epoch": 2624} {"train_loss": -12.346866607666016, "global_step": 440876, "epoch": 2624} {"train_loss": -12.473127365112305, "global_step": 440877, "epoch": 2624} {"train_loss": -12.168172836303711, "global_step": 440878, "epoch": 2624} {"train_loss": -12.119855880737305, "global_step": 440879, "epoch": 2624} {"train_loss": -12.393095970153809, "global_step": 440880, "epoch": 2624} {"train_loss": -12.053543090820312, "global_step": 440881, "epoch": 2624} {"train_loss": -11.986242294311523, "global_step": 440882, "epoch": 2624} {"train_loss": -12.132713317871094, "global_step": 440883, "epoch": 2624} {"train_loss": -12.418512344360352, "global_step": 440884, "epoch": 2624} {"train_loss": -11.360662460327148, "global_step": 440885, "epoch": 2624} {"train_loss": -11.997783660888672, "global_step": 440886, "epoch": 2624} {"train_loss": -12.53879165649414, "global_step": 440887, "epoch": 2624} {"train_loss": -12.200990676879883, "global_step": 440888, "epoch": 2624} {"train_loss": -12.839258193969727, "global_step": 440889, "epoch": 2624} {"train_loss": -12.174560546875, "global_step": 440890, "epoch": 2624} {"train_loss": -12.479730606079102, "global_step": 440891, "epoch": 2624} {"train_loss": -12.052234649658203, "global_step": 440892, "epoch": 2624} {"train_loss": -12.359504699707031, "global_step": 440893, "epoch": 2624} {"train_loss": -12.356657028198242, "global_step": 440894, "epoch": 2624} {"train_loss": -12.62590217590332, "global_step": 440895, "epoch": 2624} {"train_loss": -12.48043441772461, "global_step": 440896, "epoch": 2624} {"train_loss": -12.620580673217773, "global_step": 440897, "epoch": 2624} {"train_loss": -12.801774978637695, "global_step": 440898, "epoch": 2624} {"train_loss": -12.697393417358398, "global_step": 440899, "epoch": 2624} {"train_loss": -12.695152282714844, "global_step": 440900, "epoch": 2624} {"train_loss": -12.743088722229004, "global_step": 440901, "epoch": 2624} {"train_loss": -12.336784362792969, "global_step": 440902, "epoch": 2624} {"train_loss": -12.49753189086914, "global_step": 440903, "epoch": 2624} {"train_loss": -12.542728424072266, "global_step": 440904, "epoch": 2624} {"train_loss": -12.6627779006958, "global_step": 440905, "epoch": 2624} {"train_loss": -12.854754447937012, "global_step": 440906, "epoch": 2624} {"train_loss": -12.668521881103516, "global_step": 440907, "epoch": 2624} {"train_loss": -12.685379981994629, "global_step": 440908, "epoch": 2624} {"train_loss": -12.67300796508789, "global_step": 440909, "epoch": 2624} {"train_loss": -12.828393936157227, "global_step": 440910, "epoch": 2624} {"train_loss": -12.835342407226562, "global_step": 440911, "epoch": 2624} {"train_loss": -12.628622055053711, "global_step": 440912, "epoch": 2624} {"train_loss": -12.726577758789062, "global_step": 440913, "epoch": 2624} {"train_loss": -12.584775924682617, "global_step": 440914, "epoch": 2624} {"train_loss": -12.930028915405273, "global_step": 440915, "epoch": 2624} {"train_loss": -12.520999908447266, "global_step": 440916, "epoch": 2624} {"train_loss": -12.822115898132324, "global_step": 440917, "epoch": 2624} {"train_loss": -12.636853218078613, "global_step": 440918, "epoch": 2624} {"train_loss": -12.44678783416748, "global_step": 440919, "epoch": 2624} {"train_loss": -12.748771667480469, "global_step": 440920, "epoch": 2624} {"train_loss": -12.79197883605957, "global_step": 440921, "epoch": 2624} {"train_loss": -12.841961860656738, "global_step": 440922, "epoch": 2624} {"train_loss": -12.572309494018555, "global_step": 440923, "epoch": 2624} {"train_loss": -12.706130981445312, "global_step": 440924, "epoch": 2624} {"train_loss": -12.78846263885498, "global_step": 440925, "epoch": 2624} {"train_loss": -12.752217292785645, "global_step": 440926, "epoch": 2624} {"train_loss": -12.556648254394531, "global_step": 440927, "epoch": 2624} {"train_loss": -12.642864227294922, "global_step": 440928, "epoch": 2624} {"train_loss": -12.576559066772461, "global_step": 440929, "epoch": 2624} {"train_loss": -12.549768447875977, "global_step": 440930, "epoch": 2624} {"train_loss": -12.12614917755127, "global_step": 440931, "epoch": 2624} {"train_loss": -12.295466423034668, "global_step": 440932, "epoch": 2624} {"train_loss": -12.402978897094727, "global_step": 440933, "epoch": 2624} {"train_loss": -12.786233901977539, "global_step": 440934, "epoch": 2624} {"train_loss": -12.487796783447266, "global_step": 440935, "epoch": 2624} {"train_loss": -12.207645416259766, "global_step": 440936, "epoch": 2624} {"train_loss": -11.741211891174316, "global_step": 440937, "epoch": 2624} {"train_loss": -12.554153442382812, "global_step": 440938, "epoch": 2624} {"train_loss": -12.092924118041992, "global_step": 440939, "epoch": 2624} {"train_loss": -11.139238357543945, "global_step": 440940, "epoch": 2624} {"train_loss": -11.573799133300781, "global_step": 440941, "epoch": 2624} {"train_loss": -12.51303482055664, "global_step": 440942, "epoch": 2624} {"train_loss": -12.128774642944336, "global_step": 440943, "epoch": 2624} {"train_loss": -11.65781021118164, "global_step": 440944, "epoch": 2624} {"train_loss": -11.860147476196289, "global_step": 440945, "epoch": 2624} {"train_loss": -12.044118881225586, "global_step": 440946, "epoch": 2624} {"train_loss": -10.885704040527344, "global_step": 440947, "epoch": 2624} {"train_loss": -11.718823432922363, "global_step": 440948, "epoch": 2624} {"train_loss": -11.956087112426758, "global_step": 440949, "epoch": 2624} {"train_loss": -12.335174560546875, "global_step": 440950, "epoch": 2624} {"train_loss": -11.959110260009766, "global_step": 440951, "epoch": 2624} {"train_loss": -12.145486831665039, "global_step": 440952, "epoch": 2624} {"train_loss": -12.136863708496094, "global_step": 440953, "epoch": 2624} {"train_loss": -12.238954544067383, "global_step": 440954, "epoch": 2624} {"train_loss": -12.377355575561523, "global_step": 440955, "epoch": 2624} {"train_loss": -11.719179153442383, "global_step": 440956, "epoch": 2624} {"train_loss": -11.975893020629883, "global_step": 440957, "epoch": 2624} {"train_loss": -11.619424819946289, "global_step": 440958, "epoch": 2624} {"train_loss": -12.235355377197266, "global_step": 440959, "epoch": 2624} {"train_loss": -11.861572265625, "global_step": 440960, "epoch": 2624} {"train_loss": -11.970407485961914, "global_step": 440961, "epoch": 2624} {"train_loss": -12.028337478637695, "global_step": 440962, "epoch": 2624} {"train_loss": -12.110126495361328, "global_step": 440963, "epoch": 2624} {"train_loss": -12.245824813842773, "global_step": 440964, "epoch": 2624} {"train_loss": -12.229131698608398, "global_step": 440965, "epoch": 2624} {"train_loss": -12.117330551147461, "global_step": 440966, "epoch": 2624} {"train_loss": -11.681390762329102, "global_step": 440967, "epoch": 2624} {"train_loss": -12.282855987548828, "global_step": 440968, "epoch": 2624} {"train_loss": -12.347537994384766, "global_step": 440969, "epoch": 2624} {"train_loss": -11.829814910888672, "global_step": 440970, "epoch": 2624} {"train_loss": -12.503131866455078, "global_step": 440971, "epoch": 2624} {"train_loss": -11.88615608215332, "global_step": 440972, "epoch": 2624} {"train_loss": -11.76401138305664, "global_step": 440973, "epoch": 2624} {"train_loss": -12.044204711914062, "global_step": 440974, "epoch": 2624} {"train_loss": -12.329526901245117, "global_step": 440975, "epoch": 2624} {"train_loss": -11.982198715209961, "global_step": 440976, "epoch": 2624} {"train_loss": -12.591506958007812, "global_step": 440977, "epoch": 2624} {"train_loss": -12.30586051940918, "global_step": 440978, "epoch": 2624} {"train_loss": -12.075678825378418, "global_step": 440979, "epoch": 2624} {"train_loss": -11.947566986083984, "global_step": 440980, "epoch": 2624} {"train_loss": -12.32848072052002, "global_step": 440981, "epoch": 2624} {"train_loss": -11.696733474731445, "global_step": 440982, "epoch": 2624} {"train_loss": -11.468655586242676, "global_step": 440983, "epoch": 2624} {"train_loss": -11.887784957885742, "global_step": 440984, "epoch": 2624} {"train_loss": -10.650933265686035, "global_step": 440985, "epoch": 2624} {"train_loss": -10.92399787902832, "global_step": 440986, "epoch": 2624} {"train_loss": -11.959419250488281, "global_step": 440987, "epoch": 2624} {"train_loss": -10.720318794250488, "global_step": 440988, "epoch": 2624} {"train_loss": -10.289560317993164, "global_step": 440989, "epoch": 2624} {"train_loss": -11.179328918457031, "global_step": 440990, "epoch": 2624} {"train_loss": -10.438661575317383, "global_step": 440991, "epoch": 2624} {"train_loss": -9.697583198547363, "global_step": 440992, "epoch": 2624} {"train_loss": -11.441986083984375, "global_step": 440993, "epoch": 2624} {"train_loss": -8.709879875183105, "global_step": 440994, "epoch": 2624} {"train_loss": -10.1058349609375, "global_step": 440995, "epoch": 2624} {"train_loss": -9.635034561157227, "global_step": 440996, "epoch": 2624} {"train_loss": -10.133641242980957, "global_step": 440997, "epoch": 2624} {"train_loss": -10.46681022644043, "global_step": 440998, "epoch": 2624} {"train_loss": -12.084980431057158, "global_step": 440999, "epoch": 2624, "val_loss": 313084.15625} {"train_loss": -10.840015411376953, "global_step": 441000, "epoch": 2625} {"train_loss": -11.041406631469727, "global_step": 441001, "epoch": 2625} {"train_loss": -10.812392234802246, "global_step": 441002, "epoch": 2625} {"train_loss": -11.650357246398926, "global_step": 441003, "epoch": 2625} {"train_loss": -11.998544692993164, "global_step": 441004, "epoch": 2625} {"train_loss": -11.04483699798584, "global_step": 441005, "epoch": 2625} {"train_loss": -11.630941390991211, "global_step": 441006, "epoch": 2625} {"train_loss": -11.275177001953125, "global_step": 441007, "epoch": 2625} {"train_loss": -11.744016647338867, "global_step": 441008, "epoch": 2625} {"train_loss": -11.90457820892334, "global_step": 441009, "epoch": 2625} {"train_loss": -12.043241500854492, "global_step": 441010, "epoch": 2625} {"train_loss": -11.155996322631836, "global_step": 441011, "epoch": 2625} {"train_loss": -11.81035041809082, "global_step": 441012, "epoch": 2625} {"train_loss": -11.899930953979492, "global_step": 441013, "epoch": 2625} {"train_loss": -12.069313049316406, "global_step": 441014, "epoch": 2625} {"train_loss": -11.581695556640625, "global_step": 441015, "epoch": 2625} {"train_loss": -11.896437644958496, "global_step": 441016, "epoch": 2625} {"train_loss": -11.653861045837402, "global_step": 441017, "epoch": 2625} {"train_loss": -12.096217155456543, "global_step": 441018, "epoch": 2625} {"train_loss": -11.331937789916992, "global_step": 441019, "epoch": 2625} {"train_loss": -12.077677726745605, "global_step": 441020, "epoch": 2625} {"train_loss": -11.746492385864258, "global_step": 441021, "epoch": 2625} {"train_loss": -12.077547073364258, "global_step": 441022, "epoch": 2625} {"train_loss": -12.42426586151123, "global_step": 441023, "epoch": 2625} {"train_loss": -11.866161346435547, "global_step": 441024, "epoch": 2625} {"train_loss": -12.092070579528809, "global_step": 441025, "epoch": 2625} {"train_loss": -11.719558715820312, "global_step": 441026, "epoch": 2625} {"train_loss": -12.236896514892578, "global_step": 441027, "epoch": 2625} {"train_loss": -11.494636535644531, "global_step": 441028, "epoch": 2625} {"train_loss": -12.359990119934082, "global_step": 441029, "epoch": 2625} {"train_loss": -11.341901779174805, "global_step": 441030, "epoch": 2625} {"train_loss": -12.18471622467041, "global_step": 441031, "epoch": 2625} {"train_loss": -11.584819793701172, "global_step": 441032, "epoch": 2625} {"train_loss": -12.4074068069458, "global_step": 441033, "epoch": 2625} {"train_loss": -12.165351867675781, "global_step": 441034, "epoch": 2625} {"train_loss": -12.197153091430664, "global_step": 441035, "epoch": 2625} {"train_loss": -12.327942848205566, "global_step": 441036, "epoch": 2625} {"train_loss": -12.461938858032227, "global_step": 441037, "epoch": 2625} {"train_loss": -12.290544509887695, "global_step": 441038, "epoch": 2625} {"train_loss": -12.308300018310547, "global_step": 441039, "epoch": 2625} {"train_loss": -12.097209930419922, "global_step": 441040, "epoch": 2625} {"train_loss": -11.992612838745117, "global_step": 441041, "epoch": 2625} {"train_loss": -12.185498237609863, "global_step": 441042, "epoch": 2625} {"train_loss": -12.256193161010742, "global_step": 441043, "epoch": 2625} {"train_loss": -12.411722183227539, "global_step": 441044, "epoch": 2625} {"train_loss": -12.31085205078125, "global_step": 441045, "epoch": 2625} {"train_loss": -12.628233909606934, "global_step": 441046, "epoch": 2625} {"train_loss": -12.340299606323242, "global_step": 441047, "epoch": 2625} {"train_loss": -12.31292724609375, "global_step": 441048, "epoch": 2625} {"train_loss": -12.35881519317627, "global_step": 441049, "epoch": 2625} {"train_loss": -12.520429611206055, "global_step": 441050, "epoch": 2625} {"train_loss": -12.610339164733887, "global_step": 441051, "epoch": 2625} {"train_loss": -12.57369327545166, "global_step": 441052, "epoch": 2625} {"train_loss": -12.432287216186523, "global_step": 441053, "epoch": 2625} {"train_loss": -12.597058296203613, "global_step": 441054, "epoch": 2625} {"train_loss": -12.27155876159668, "global_step": 441055, "epoch": 2625} {"train_loss": -12.456033706665039, "global_step": 441056, "epoch": 2625} {"train_loss": -12.271739959716797, "global_step": 441057, "epoch": 2625} {"train_loss": -12.46017837524414, "global_step": 441058, "epoch": 2625} {"train_loss": -12.383325576782227, "global_step": 441059, "epoch": 2625} {"train_loss": -12.523887634277344, "global_step": 441060, "epoch": 2625} {"train_loss": -12.364019393920898, "global_step": 441061, "epoch": 2625} {"train_loss": -12.456113815307617, "global_step": 441062, "epoch": 2625} {"train_loss": -12.494752883911133, "global_step": 441063, "epoch": 2625} {"train_loss": -12.306659698486328, "global_step": 441064, "epoch": 2625} {"train_loss": -12.663570404052734, "global_step": 441065, "epoch": 2625} {"train_loss": -12.539756774902344, "global_step": 441066, "epoch": 2625} {"train_loss": -12.54408073425293, "global_step": 441067, "epoch": 2625} {"train_loss": -12.442817687988281, "global_step": 441068, "epoch": 2625} {"train_loss": -12.58212661743164, "global_step": 441069, "epoch": 2625} {"train_loss": -12.412168502807617, "global_step": 441070, "epoch": 2625} {"train_loss": -12.662091255187988, "global_step": 441071, "epoch": 2625} {"train_loss": -12.35683822631836, "global_step": 441072, "epoch": 2625} {"train_loss": -12.419482231140137, "global_step": 441073, "epoch": 2625} {"train_loss": -12.253472328186035, "global_step": 441074, "epoch": 2625} {"train_loss": -12.82418441772461, "global_step": 441075, "epoch": 2625} {"train_loss": -12.3873291015625, "global_step": 441076, "epoch": 2625} {"train_loss": -12.525224685668945, "global_step": 441077, "epoch": 2625} {"train_loss": -12.587589263916016, "global_step": 441078, "epoch": 2625} {"train_loss": -12.479408264160156, "global_step": 441079, "epoch": 2625} {"train_loss": -12.517260551452637, "global_step": 441080, "epoch": 2625} {"train_loss": -12.597905158996582, "global_step": 441081, "epoch": 2625} {"train_loss": -12.575321197509766, "global_step": 441082, "epoch": 2625} {"train_loss": -12.486151695251465, "global_step": 441083, "epoch": 2625} {"train_loss": -12.688482284545898, "global_step": 441084, "epoch": 2625} {"train_loss": -12.51163101196289, "global_step": 441085, "epoch": 2625} {"train_loss": -12.561355590820312, "global_step": 441086, "epoch": 2625} {"train_loss": -12.92569351196289, "global_step": 441087, "epoch": 2625} {"train_loss": -12.620305061340332, "global_step": 441088, "epoch": 2625} {"train_loss": -12.718145370483398, "global_step": 441089, "epoch": 2625} {"train_loss": -12.634946823120117, "global_step": 441090, "epoch": 2625} {"train_loss": -12.681547164916992, "global_step": 441091, "epoch": 2625} {"train_loss": -12.802228927612305, "global_step": 441092, "epoch": 2625} {"train_loss": -12.781978607177734, "global_step": 441093, "epoch": 2625} {"train_loss": -12.477295875549316, "global_step": 441094, "epoch": 2625} {"train_loss": -12.919145584106445, "global_step": 441095, "epoch": 2625} {"train_loss": -12.586544036865234, "global_step": 441096, "epoch": 2625} {"train_loss": -12.807920455932617, "global_step": 441097, "epoch": 2625} {"train_loss": -12.837160110473633, "global_step": 441098, "epoch": 2625} {"train_loss": -12.791546821594238, "global_step": 441099, "epoch": 2625} {"train_loss": -12.887333869934082, "global_step": 441100, "epoch": 2625} {"train_loss": -12.783856391906738, "global_step": 441101, "epoch": 2625} {"train_loss": -12.922867774963379, "global_step": 441102, "epoch": 2625} {"train_loss": -12.799338340759277, "global_step": 441103, "epoch": 2625} {"train_loss": -12.767426490783691, "global_step": 441104, "epoch": 2625} {"train_loss": -12.83619213104248, "global_step": 441105, "epoch": 2625} {"train_loss": -12.552324295043945, "global_step": 441106, "epoch": 2625} {"train_loss": -12.673582077026367, "global_step": 441107, "epoch": 2625} {"train_loss": -12.819965362548828, "global_step": 441108, "epoch": 2625} {"train_loss": -12.72586441040039, "global_step": 441109, "epoch": 2625} {"train_loss": -12.474733352661133, "global_step": 441110, "epoch": 2625} {"train_loss": -12.825252532958984, "global_step": 441111, "epoch": 2625} {"train_loss": -12.589973449707031, "global_step": 441112, "epoch": 2625} {"train_loss": -12.396072387695312, "global_step": 441113, "epoch": 2625} {"train_loss": -12.524711608886719, "global_step": 441114, "epoch": 2625} {"train_loss": -12.776455879211426, "global_step": 441115, "epoch": 2625} {"train_loss": -12.549488067626953, "global_step": 441116, "epoch": 2625} {"train_loss": -12.209585189819336, "global_step": 441117, "epoch": 2625} {"train_loss": -12.435043334960938, "global_step": 441118, "epoch": 2625} {"train_loss": -13.04684829711914, "global_step": 441119, "epoch": 2625} {"train_loss": -12.39604377746582, "global_step": 441120, "epoch": 2625} {"train_loss": -10.825485229492188, "global_step": 441121, "epoch": 2625} {"train_loss": -10.82049560546875, "global_step": 441122, "epoch": 2625} {"train_loss": -12.077394485473633, "global_step": 441123, "epoch": 2625} {"train_loss": -11.940919876098633, "global_step": 441124, "epoch": 2625} {"train_loss": -11.065054893493652, "global_step": 441125, "epoch": 2625} {"train_loss": -11.801916122436523, "global_step": 441126, "epoch": 2625} {"train_loss": -11.448439598083496, "global_step": 441127, "epoch": 2625} {"train_loss": -11.055708885192871, "global_step": 441128, "epoch": 2625} {"train_loss": -10.911331176757812, "global_step": 441129, "epoch": 2625} {"train_loss": -10.65477180480957, "global_step": 441130, "epoch": 2625} {"train_loss": -10.858561515808105, "global_step": 441131, "epoch": 2625} {"train_loss": -11.339969635009766, "global_step": 441132, "epoch": 2625} {"train_loss": -10.643938064575195, "global_step": 441133, "epoch": 2625} {"train_loss": -10.772440910339355, "global_step": 441134, "epoch": 2625} {"train_loss": -11.644475936889648, "global_step": 441135, "epoch": 2625} {"train_loss": -10.328862190246582, "global_step": 441136, "epoch": 2625} {"train_loss": -10.14360237121582, "global_step": 441137, "epoch": 2625} {"train_loss": -11.50874137878418, "global_step": 441138, "epoch": 2625} {"train_loss": -9.974872589111328, "global_step": 441139, "epoch": 2625} {"train_loss": -11.068225860595703, "global_step": 441140, "epoch": 2625} {"train_loss": -10.535787582397461, "global_step": 441141, "epoch": 2625} {"train_loss": -10.839221954345703, "global_step": 441142, "epoch": 2625} {"train_loss": -11.45903205871582, "global_step": 441143, "epoch": 2625} {"train_loss": -10.984869956970215, "global_step": 441144, "epoch": 2625} {"train_loss": -11.500046730041504, "global_step": 441145, "epoch": 2625} {"train_loss": -11.379810333251953, "global_step": 441146, "epoch": 2625} {"train_loss": -11.644489288330078, "global_step": 441147, "epoch": 2625} {"train_loss": -9.848053932189941, "global_step": 441148, "epoch": 2625} {"train_loss": -11.864503860473633, "global_step": 441149, "epoch": 2625} {"train_loss": -11.086097717285156, "global_step": 441150, "epoch": 2625} {"train_loss": -11.213865280151367, "global_step": 441151, "epoch": 2625} {"train_loss": -11.303178787231445, "global_step": 441152, "epoch": 2625} {"train_loss": -10.569395065307617, "global_step": 441153, "epoch": 2625} {"train_loss": -11.782442092895508, "global_step": 441154, "epoch": 2625} {"train_loss": -11.120601654052734, "global_step": 441155, "epoch": 2625} {"train_loss": -10.85419750213623, "global_step": 441156, "epoch": 2625} {"train_loss": -10.551490783691406, "global_step": 441157, "epoch": 2625} {"train_loss": -11.080534934997559, "global_step": 441158, "epoch": 2625} {"train_loss": -11.469348907470703, "global_step": 441159, "epoch": 2625} {"train_loss": -11.675586700439453, "global_step": 441160, "epoch": 2625} {"train_loss": -11.04144287109375, "global_step": 441161, "epoch": 2625} {"train_loss": -12.2837553024292, "global_step": 441162, "epoch": 2625} {"train_loss": -11.745662689208984, "global_step": 441163, "epoch": 2625} {"train_loss": -11.750394821166992, "global_step": 441164, "epoch": 2625} {"train_loss": -11.966707229614258, "global_step": 441165, "epoch": 2625} {"train_loss": -11.650775909423828, "global_step": 441166, "epoch": 2625} {"train_loss": -11.997360507647196, "global_step": 441167, "epoch": 2625, "val_loss": 308346.15625, "train_action_mse_error": 0.7019627094268799} {"train_loss": -11.714016914367676, "global_step": 441168, "epoch": 2626} {"train_loss": -11.929214477539062, "global_step": 441169, "epoch": 2626} {"train_loss": -11.943143844604492, "global_step": 441170, "epoch": 2626} {"train_loss": -12.047845840454102, "global_step": 441171, "epoch": 2626} {"train_loss": -11.911447525024414, "global_step": 441172, "epoch": 2626} {"train_loss": -12.20107650756836, "global_step": 441173, "epoch": 2626} {"train_loss": -12.150741577148438, "global_step": 441174, "epoch": 2626} {"train_loss": -11.981809616088867, "global_step": 441175, "epoch": 2626} {"train_loss": -12.168556213378906, "global_step": 441176, "epoch": 2626} {"train_loss": -12.190784454345703, "global_step": 441177, "epoch": 2626} {"train_loss": -12.345726013183594, "global_step": 441178, "epoch": 2626} {"train_loss": -11.917108535766602, "global_step": 441179, "epoch": 2626} {"train_loss": -12.550132751464844, "global_step": 441180, "epoch": 2626} {"train_loss": -12.304363250732422, "global_step": 441181, "epoch": 2626} {"train_loss": -12.322102546691895, "global_step": 441182, "epoch": 2626} {"train_loss": -12.245019912719727, "global_step": 441183, "epoch": 2626} {"train_loss": -12.13327407836914, "global_step": 441184, "epoch": 2626} {"train_loss": -12.436229705810547, "global_step": 441185, "epoch": 2626} {"train_loss": -12.321329116821289, "global_step": 441186, "epoch": 2626} {"train_loss": -12.275545120239258, "global_step": 441187, "epoch": 2626} {"train_loss": -12.513598442077637, "global_step": 441188, "epoch": 2626} {"train_loss": -12.315949440002441, "global_step": 441189, "epoch": 2626} {"train_loss": -12.524405479431152, "global_step": 441190, "epoch": 2626} {"train_loss": -12.609100341796875, "global_step": 441191, "epoch": 2626} {"train_loss": -12.370025634765625, "global_step": 441192, "epoch": 2626} {"train_loss": -12.473751068115234, "global_step": 441193, "epoch": 2626} {"train_loss": -12.540349960327148, "global_step": 441194, "epoch": 2626} {"train_loss": -12.383279800415039, "global_step": 441195, "epoch": 2626} {"train_loss": -12.450660705566406, "global_step": 441196, "epoch": 2626} {"train_loss": -12.460384368896484, "global_step": 441197, "epoch": 2626} {"train_loss": -12.321144104003906, "global_step": 441198, "epoch": 2626} {"train_loss": -12.612312316894531, "global_step": 441199, "epoch": 2626} {"train_loss": -12.3404541015625, "global_step": 441200, "epoch": 2626} {"train_loss": -12.476251602172852, "global_step": 441201, "epoch": 2626} {"train_loss": -12.388148307800293, "global_step": 441202, "epoch": 2626} {"train_loss": -12.497027397155762, "global_step": 441203, "epoch": 2626} {"train_loss": -12.270777702331543, "global_step": 441204, "epoch": 2626} {"train_loss": -12.089820861816406, "global_step": 441205, "epoch": 2626} {"train_loss": -12.256832122802734, "global_step": 441206, "epoch": 2626} {"train_loss": -12.446311950683594, "global_step": 441207, "epoch": 2626} {"train_loss": -12.631671905517578, "global_step": 441208, "epoch": 2626} {"train_loss": -12.33102035522461, "global_step": 441209, "epoch": 2626} {"train_loss": -12.64476203918457, "global_step": 441210, "epoch": 2626} {"train_loss": -12.68966293334961, "global_step": 441211, "epoch": 2626} {"train_loss": -12.467880249023438, "global_step": 441212, "epoch": 2626} {"train_loss": -12.670053482055664, "global_step": 441213, "epoch": 2626} {"train_loss": -12.467876434326172, "global_step": 441214, "epoch": 2626} {"train_loss": -12.869773864746094, "global_step": 441215, "epoch": 2626} {"train_loss": -12.472234725952148, "global_step": 441216, "epoch": 2626} {"train_loss": -12.404640197753906, "global_step": 441217, "epoch": 2626} {"train_loss": -12.751296997070312, "global_step": 441218, "epoch": 2626} {"train_loss": -12.294134140014648, "global_step": 441219, "epoch": 2626} {"train_loss": -12.671918869018555, "global_step": 441220, "epoch": 2626} {"train_loss": -12.76447868347168, "global_step": 441221, "epoch": 2626} {"train_loss": -12.77768325805664, "global_step": 441222, "epoch": 2626} {"train_loss": -12.851520538330078, "global_step": 441223, "epoch": 2626} {"train_loss": -12.756889343261719, "global_step": 441224, "epoch": 2626} {"train_loss": -12.744586944580078, "global_step": 441225, "epoch": 2626} {"train_loss": -12.750686645507812, "global_step": 441226, "epoch": 2626} {"train_loss": -12.481851577758789, "global_step": 441227, "epoch": 2626} {"train_loss": -12.687250137329102, "global_step": 441228, "epoch": 2626} {"train_loss": -12.680377960205078, "global_step": 441229, "epoch": 2626} {"train_loss": -12.624220848083496, "global_step": 441230, "epoch": 2626} {"train_loss": -12.336811065673828, "global_step": 441231, "epoch": 2626} {"train_loss": -12.888129234313965, "global_step": 441232, "epoch": 2626} {"train_loss": -11.931435585021973, "global_step": 441233, "epoch": 2626} {"train_loss": -12.108007431030273, "global_step": 441234, "epoch": 2626} {"train_loss": -11.257270812988281, "global_step": 441235, "epoch": 2626} {"train_loss": -12.091133117675781, "global_step": 441236, "epoch": 2626} {"train_loss": -11.929777145385742, "global_step": 441237, "epoch": 2626} {"train_loss": -12.33151626586914, "global_step": 441238, "epoch": 2626} {"train_loss": -11.597553253173828, "global_step": 441239, "epoch": 2626} {"train_loss": -12.070253372192383, "global_step": 441240, "epoch": 2626} {"train_loss": -12.153844833374023, "global_step": 441241, "epoch": 2626} {"train_loss": -11.577038764953613, "global_step": 441242, "epoch": 2626} {"train_loss": -12.44410228729248, "global_step": 441243, "epoch": 2626} {"train_loss": -11.737625122070312, "global_step": 441244, "epoch": 2626} {"train_loss": -12.087310791015625, "global_step": 441245, "epoch": 2626} {"train_loss": -12.106060028076172, "global_step": 441246, "epoch": 2626} {"train_loss": -12.034421920776367, "global_step": 441247, "epoch": 2626} {"train_loss": -11.071006774902344, "global_step": 441248, "epoch": 2626} {"train_loss": -12.11496353149414, "global_step": 441249, "epoch": 2626} {"train_loss": -10.309101104736328, "global_step": 441250, "epoch": 2626} {"train_loss": -11.757587432861328, "global_step": 441251, "epoch": 2626} {"train_loss": -11.935163497924805, "global_step": 441252, "epoch": 2626} {"train_loss": -10.883936882019043, "global_step": 441253, "epoch": 2626} {"train_loss": -11.856714248657227, "global_step": 441254, "epoch": 2626} {"train_loss": -11.10024642944336, "global_step": 441255, "epoch": 2626} {"train_loss": -11.963335037231445, "global_step": 441256, "epoch": 2626} {"train_loss": -11.36250114440918, "global_step": 441257, "epoch": 2626} {"train_loss": -11.573308944702148, "global_step": 441258, "epoch": 2626} {"train_loss": -12.204610824584961, "global_step": 441259, "epoch": 2626} {"train_loss": -10.758878707885742, "global_step": 441260, "epoch": 2626} {"train_loss": -11.70451831817627, "global_step": 441261, "epoch": 2626} {"train_loss": -11.791831970214844, "global_step": 441262, "epoch": 2626} {"train_loss": -11.651556015014648, "global_step": 441263, "epoch": 2626} {"train_loss": -11.9442138671875, "global_step": 441264, "epoch": 2626} {"train_loss": -11.465097427368164, "global_step": 441265, "epoch": 2626} {"train_loss": -12.039283752441406, "global_step": 441266, "epoch": 2626} {"train_loss": -12.15302848815918, "global_step": 441267, "epoch": 2626} {"train_loss": -11.618812561035156, "global_step": 441268, "epoch": 2626} {"train_loss": -12.325573921203613, "global_step": 441269, "epoch": 2626} {"train_loss": -11.638181686401367, "global_step": 441270, "epoch": 2626} {"train_loss": -11.928717613220215, "global_step": 441271, "epoch": 2626} {"train_loss": -11.756366729736328, "global_step": 441272, "epoch": 2626} {"train_loss": -12.289636611938477, "global_step": 441273, "epoch": 2626} {"train_loss": -12.217205047607422, "global_step": 441274, "epoch": 2626} {"train_loss": -12.142308235168457, "global_step": 441275, "epoch": 2626} {"train_loss": -12.15156364440918, "global_step": 441276, "epoch": 2626} {"train_loss": -12.224836349487305, "global_step": 441277, "epoch": 2626} {"train_loss": -12.020317077636719, "global_step": 441278, "epoch": 2626} {"train_loss": -12.195663452148438, "global_step": 441279, "epoch": 2626} {"train_loss": -11.707386016845703, "global_step": 441280, "epoch": 2626} {"train_loss": -12.311454772949219, "global_step": 441281, "epoch": 2626} {"train_loss": -12.239215850830078, "global_step": 441282, "epoch": 2626} {"train_loss": -12.347655296325684, "global_step": 441283, "epoch": 2626} {"train_loss": -12.117552757263184, "global_step": 441284, "epoch": 2626} {"train_loss": -11.672656059265137, "global_step": 441285, "epoch": 2626} {"train_loss": -12.506306648254395, "global_step": 441286, "epoch": 2626} {"train_loss": -11.496345520019531, "global_step": 441287, "epoch": 2626} {"train_loss": -12.412969589233398, "global_step": 441288, "epoch": 2626} {"train_loss": -12.263340950012207, "global_step": 441289, "epoch": 2626} {"train_loss": -12.520261764526367, "global_step": 441290, "epoch": 2626} {"train_loss": -12.497577667236328, "global_step": 441291, "epoch": 2626} {"train_loss": -12.45554256439209, "global_step": 441292, "epoch": 2626} {"train_loss": -12.584537506103516, "global_step": 441293, "epoch": 2626} {"train_loss": -12.44349479675293, "global_step": 441294, "epoch": 2626} {"train_loss": -12.79955005645752, "global_step": 441295, "epoch": 2626} {"train_loss": -12.316655158996582, "global_step": 441296, "epoch": 2626} {"train_loss": -12.63525390625, "global_step": 441297, "epoch": 2626} {"train_loss": -12.367850303649902, "global_step": 441298, "epoch": 2626} {"train_loss": -12.2908935546875, "global_step": 441299, "epoch": 2626} {"train_loss": -12.681536674499512, "global_step": 441300, "epoch": 2626} {"train_loss": -12.312275886535645, "global_step": 441301, "epoch": 2626} {"train_loss": -12.656630516052246, "global_step": 441302, "epoch": 2626} {"train_loss": -12.440566062927246, "global_step": 441303, "epoch": 2626} {"train_loss": -12.58884048461914, "global_step": 441304, "epoch": 2626} {"train_loss": -12.54555892944336, "global_step": 441305, "epoch": 2626} {"train_loss": -12.399860382080078, "global_step": 441306, "epoch": 2626} {"train_loss": -12.403366088867188, "global_step": 441307, "epoch": 2626} {"train_loss": -12.530545234680176, "global_step": 441308, "epoch": 2626} {"train_loss": -12.502201080322266, "global_step": 441309, "epoch": 2626} {"train_loss": -12.27791976928711, "global_step": 441310, "epoch": 2626} {"train_loss": -12.621771812438965, "global_step": 441311, "epoch": 2626} {"train_loss": -12.378119468688965, "global_step": 441312, "epoch": 2626} {"train_loss": -12.587191581726074, "global_step": 441313, "epoch": 2626} {"train_loss": -12.455790519714355, "global_step": 441314, "epoch": 2626} {"train_loss": -12.354183197021484, "global_step": 441315, "epoch": 2626} {"train_loss": -12.649358749389648, "global_step": 441316, "epoch": 2626} {"train_loss": -12.518129348754883, "global_step": 441317, "epoch": 2626} {"train_loss": -12.787002563476562, "global_step": 441318, "epoch": 2626} {"train_loss": -12.61832046508789, "global_step": 441319, "epoch": 2626} {"train_loss": -12.763779640197754, "global_step": 441320, "epoch": 2626} {"train_loss": -12.469865798950195, "global_step": 441321, "epoch": 2626} {"train_loss": -12.572141647338867, "global_step": 441322, "epoch": 2626} {"train_loss": -12.587016105651855, "global_step": 441323, "epoch": 2626} {"train_loss": -12.715799331665039, "global_step": 441324, "epoch": 2626} {"train_loss": -12.777639389038086, "global_step": 441325, "epoch": 2626} {"train_loss": -12.91861343383789, "global_step": 441326, "epoch": 2626} {"train_loss": -12.288095474243164, "global_step": 441327, "epoch": 2626} {"train_loss": -12.843137741088867, "global_step": 441328, "epoch": 2626} {"train_loss": -12.790027618408203, "global_step": 441329, "epoch": 2626} {"train_loss": -12.933847427368164, "global_step": 441330, "epoch": 2626} {"train_loss": -12.776716232299805, "global_step": 441331, "epoch": 2626} {"train_loss": -12.758474349975586, "global_step": 441332, "epoch": 2626} {"train_loss": -12.634708404541016, "global_step": 441333, "epoch": 2626} {"train_loss": -12.907252311706543, "global_step": 441334, "epoch": 2626} {"train_loss": -12.27853645029522, "global_step": 441335, "epoch": 2626, "val_loss": 311501.09375} {"train_loss": -12.643256187438965, "global_step": 441336, "epoch": 2627} {"train_loss": -12.954599380493164, "global_step": 441337, "epoch": 2627} {"train_loss": -12.64727783203125, "global_step": 441338, "epoch": 2627} {"train_loss": -12.785005569458008, "global_step": 441339, "epoch": 2627} {"train_loss": -12.900055885314941, "global_step": 441340, "epoch": 2627} {"train_loss": -12.823556900024414, "global_step": 441341, "epoch": 2627} {"train_loss": -12.577066421508789, "global_step": 441342, "epoch": 2627} {"train_loss": -12.680075645446777, "global_step": 441343, "epoch": 2627} {"train_loss": -12.865703582763672, "global_step": 441344, "epoch": 2627} {"train_loss": -12.60728645324707, "global_step": 441345, "epoch": 2627} {"train_loss": -12.739948272705078, "global_step": 441346, "epoch": 2627} {"train_loss": -12.637710571289062, "global_step": 441347, "epoch": 2627} {"train_loss": -12.574788093566895, "global_step": 441348, "epoch": 2627} {"train_loss": -12.604915618896484, "global_step": 441349, "epoch": 2627} {"train_loss": -12.77720832824707, "global_step": 441350, "epoch": 2627} {"train_loss": -12.294239044189453, "global_step": 441351, "epoch": 2627} {"train_loss": -12.498920440673828, "global_step": 441352, "epoch": 2627} {"train_loss": -12.813493728637695, "global_step": 441353, "epoch": 2627} {"train_loss": -12.523727416992188, "global_step": 441354, "epoch": 2627} {"train_loss": -12.360788345336914, "global_step": 441355, "epoch": 2627} {"train_loss": -12.563033103942871, "global_step": 441356, "epoch": 2627} {"train_loss": -12.763494491577148, "global_step": 441357, "epoch": 2627} {"train_loss": -11.729297637939453, "global_step": 441358, "epoch": 2627} {"train_loss": -12.64069938659668, "global_step": 441359, "epoch": 2627} {"train_loss": -12.491765975952148, "global_step": 441360, "epoch": 2627} {"train_loss": -12.489046096801758, "global_step": 441361, "epoch": 2627} {"train_loss": -12.496760368347168, "global_step": 441362, "epoch": 2627} {"train_loss": -12.255441665649414, "global_step": 441363, "epoch": 2627} {"train_loss": -12.162809371948242, "global_step": 441364, "epoch": 2627} {"train_loss": -12.5555419921875, "global_step": 441365, "epoch": 2627} {"train_loss": -10.817972183227539, "global_step": 441366, "epoch": 2627} {"train_loss": -11.889556884765625, "global_step": 441367, "epoch": 2627} {"train_loss": -12.414710998535156, "global_step": 441368, "epoch": 2627} {"train_loss": -10.98106575012207, "global_step": 441369, "epoch": 2627} {"train_loss": -10.575605392456055, "global_step": 441370, "epoch": 2627} {"train_loss": -11.831483840942383, "global_step": 441371, "epoch": 2627} {"train_loss": -11.190047264099121, "global_step": 441372, "epoch": 2627} {"train_loss": -12.267667770385742, "global_step": 441373, "epoch": 2627} {"train_loss": -11.600207328796387, "global_step": 441374, "epoch": 2627} {"train_loss": -11.454455375671387, "global_step": 441375, "epoch": 2627} {"train_loss": -12.040332794189453, "global_step": 441376, "epoch": 2627} {"train_loss": -12.128113746643066, "global_step": 441377, "epoch": 2627} {"train_loss": -11.948715209960938, "global_step": 441378, "epoch": 2627} {"train_loss": -12.376138687133789, "global_step": 441379, "epoch": 2627} {"train_loss": -11.446017265319824, "global_step": 441380, "epoch": 2627} {"train_loss": -12.003522872924805, "global_step": 441381, "epoch": 2627} {"train_loss": -11.33043098449707, "global_step": 441382, "epoch": 2627} {"train_loss": -12.125252723693848, "global_step": 441383, "epoch": 2627} {"train_loss": -11.365438461303711, "global_step": 441384, "epoch": 2627} {"train_loss": -10.651296615600586, "global_step": 441385, "epoch": 2627} {"train_loss": -12.509295463562012, "global_step": 441386, "epoch": 2627} {"train_loss": -11.529851913452148, "global_step": 441387, "epoch": 2627} {"train_loss": -11.202255249023438, "global_step": 441388, "epoch": 2627} {"train_loss": -12.449935913085938, "global_step": 441389, "epoch": 2627} {"train_loss": -11.51894760131836, "global_step": 441390, "epoch": 2627} {"train_loss": -11.386634826660156, "global_step": 441391, "epoch": 2627} {"train_loss": -11.952917098999023, "global_step": 441392, "epoch": 2627} {"train_loss": -12.301860809326172, "global_step": 441393, "epoch": 2627} {"train_loss": -12.60659122467041, "global_step": 441394, "epoch": 2627} {"train_loss": -11.91150188446045, "global_step": 441395, "epoch": 2627} {"train_loss": -12.267183303833008, "global_step": 441396, "epoch": 2627} {"train_loss": -12.093299865722656, "global_step": 441397, "epoch": 2627} {"train_loss": -12.247451782226562, "global_step": 441398, "epoch": 2627} {"train_loss": -11.925264358520508, "global_step": 441399, "epoch": 2627} {"train_loss": -11.751487731933594, "global_step": 441400, "epoch": 2627} {"train_loss": -12.166375160217285, "global_step": 441401, "epoch": 2627} {"train_loss": -11.343597412109375, "global_step": 441402, "epoch": 2627} {"train_loss": -11.845226287841797, "global_step": 441403, "epoch": 2627} {"train_loss": -11.760817527770996, "global_step": 441404, "epoch": 2627} {"train_loss": -11.414192199707031, "global_step": 441405, "epoch": 2627} {"train_loss": -11.972715377807617, "global_step": 441406, "epoch": 2627} {"train_loss": -10.895926475524902, "global_step": 441407, "epoch": 2627} {"train_loss": -11.278759956359863, "global_step": 441408, "epoch": 2627} {"train_loss": -11.269454956054688, "global_step": 441409, "epoch": 2627} {"train_loss": -10.675626754760742, "global_step": 441410, "epoch": 2627} {"train_loss": -10.93194580078125, "global_step": 441411, "epoch": 2627} {"train_loss": -9.745513916015625, "global_step": 441412, "epoch": 2627} {"train_loss": -9.851322174072266, "global_step": 441413, "epoch": 2627} {"train_loss": -11.105788230895996, "global_step": 441414, "epoch": 2627} {"train_loss": -10.735692977905273, "global_step": 441415, "epoch": 2627} {"train_loss": -10.480247497558594, "global_step": 441416, "epoch": 2627} {"train_loss": -11.31760025024414, "global_step": 441417, "epoch": 2627} {"train_loss": -10.558830261230469, "global_step": 441418, "epoch": 2627} {"train_loss": -11.19128704071045, "global_step": 441419, "epoch": 2627} {"train_loss": -11.783145904541016, "global_step": 441420, "epoch": 2627} {"train_loss": -11.419414520263672, "global_step": 441421, "epoch": 2627} {"train_loss": -12.157391548156738, "global_step": 441422, "epoch": 2627} {"train_loss": -11.76814079284668, "global_step": 441423, "epoch": 2627} {"train_loss": -10.807644844055176, "global_step": 441424, "epoch": 2627} {"train_loss": -11.904233932495117, "global_step": 441425, "epoch": 2627} {"train_loss": -12.130226135253906, "global_step": 441426, "epoch": 2627} {"train_loss": -12.147235870361328, "global_step": 441427, "epoch": 2627} {"train_loss": -12.12314224243164, "global_step": 441428, "epoch": 2627} {"train_loss": -12.16047191619873, "global_step": 441429, "epoch": 2627} {"train_loss": -11.931468963623047, "global_step": 441430, "epoch": 2627} {"train_loss": -12.095858573913574, "global_step": 441431, "epoch": 2627} {"train_loss": -11.535608291625977, "global_step": 441432, "epoch": 2627} {"train_loss": -12.372743606567383, "global_step": 441433, "epoch": 2627} {"train_loss": -11.915861129760742, "global_step": 441434, "epoch": 2627} {"train_loss": -12.106515884399414, "global_step": 441435, "epoch": 2627} {"train_loss": -12.162840843200684, "global_step": 441436, "epoch": 2627} {"train_loss": -12.253966331481934, "global_step": 441437, "epoch": 2627} {"train_loss": -12.232173919677734, "global_step": 441438, "epoch": 2627} {"train_loss": -12.16317081451416, "global_step": 441439, "epoch": 2627} {"train_loss": -12.077629089355469, "global_step": 441440, "epoch": 2627} {"train_loss": -12.53412914276123, "global_step": 441441, "epoch": 2627} {"train_loss": -12.268638610839844, "global_step": 441442, "epoch": 2627} {"train_loss": -12.132549285888672, "global_step": 441443, "epoch": 2627} {"train_loss": -12.40583610534668, "global_step": 441444, "epoch": 2627} {"train_loss": -12.267633438110352, "global_step": 441445, "epoch": 2627} {"train_loss": -12.432783126831055, "global_step": 441446, "epoch": 2627} {"train_loss": -11.88223648071289, "global_step": 441447, "epoch": 2627} {"train_loss": -12.562538146972656, "global_step": 441448, "epoch": 2627} {"train_loss": -11.969868659973145, "global_step": 441449, "epoch": 2627} {"train_loss": -12.616151809692383, "global_step": 441450, "epoch": 2627} {"train_loss": -12.621938705444336, "global_step": 441451, "epoch": 2627} {"train_loss": -12.510454177856445, "global_step": 441452, "epoch": 2627} {"train_loss": -12.524177551269531, "global_step": 441453, "epoch": 2627} {"train_loss": -12.159021377563477, "global_step": 441454, "epoch": 2627} {"train_loss": -12.546148300170898, "global_step": 441455, "epoch": 2627} {"train_loss": -12.444181442260742, "global_step": 441456, "epoch": 2627} {"train_loss": -12.455415725708008, "global_step": 441457, "epoch": 2627} {"train_loss": -12.582208633422852, "global_step": 441458, "epoch": 2627} {"train_loss": -12.347105026245117, "global_step": 441459, "epoch": 2627} {"train_loss": -12.464905738830566, "global_step": 441460, "epoch": 2627} {"train_loss": -12.564346313476562, "global_step": 441461, "epoch": 2627} {"train_loss": -12.731122970581055, "global_step": 441462, "epoch": 2627} {"train_loss": -12.812301635742188, "global_step": 441463, "epoch": 2627} {"train_loss": -12.579994201660156, "global_step": 441464, "epoch": 2627} {"train_loss": -12.54537296295166, "global_step": 441465, "epoch": 2627} {"train_loss": -12.65737533569336, "global_step": 441466, "epoch": 2627} {"train_loss": -12.67049503326416, "global_step": 441467, "epoch": 2627} {"train_loss": -12.509485244750977, "global_step": 441468, "epoch": 2627} {"train_loss": -12.806955337524414, "global_step": 441469, "epoch": 2627} {"train_loss": -12.580390930175781, "global_step": 441470, "epoch": 2627} {"train_loss": -12.562335968017578, "global_step": 441471, "epoch": 2627} {"train_loss": -12.832012176513672, "global_step": 441472, "epoch": 2627} {"train_loss": -12.567499160766602, "global_step": 441473, "epoch": 2627} {"train_loss": -12.398402214050293, "global_step": 441474, "epoch": 2627} {"train_loss": -12.707825660705566, "global_step": 441475, "epoch": 2627} {"train_loss": -12.959627151489258, "global_step": 441476, "epoch": 2627} {"train_loss": -12.543458938598633, "global_step": 441477, "epoch": 2627} {"train_loss": -12.65939712524414, "global_step": 441478, "epoch": 2627} {"train_loss": -12.698485374450684, "global_step": 441479, "epoch": 2627} {"train_loss": -12.405922889709473, "global_step": 441480, "epoch": 2627} {"train_loss": -12.612739562988281, "global_step": 441481, "epoch": 2627} {"train_loss": -12.519281387329102, "global_step": 441482, "epoch": 2627} {"train_loss": -12.43012809753418, "global_step": 441483, "epoch": 2627} {"train_loss": -12.72169303894043, "global_step": 441484, "epoch": 2627} {"train_loss": -12.332500457763672, "global_step": 441485, "epoch": 2627} {"train_loss": -12.135857582092285, "global_step": 441486, "epoch": 2627} {"train_loss": -12.815679550170898, "global_step": 441487, "epoch": 2627} {"train_loss": -12.591202735900879, "global_step": 441488, "epoch": 2627} {"train_loss": -12.500197410583496, "global_step": 441489, "epoch": 2627} {"train_loss": -12.447187423706055, "global_step": 441490, "epoch": 2627} {"train_loss": -12.475687026977539, "global_step": 441491, "epoch": 2627} {"train_loss": -12.3145751953125, "global_step": 441492, "epoch": 2627} {"train_loss": -12.835179328918457, "global_step": 441493, "epoch": 2627} {"train_loss": -11.965444564819336, "global_step": 441494, "epoch": 2627} {"train_loss": -12.880647659301758, "global_step": 441495, "epoch": 2627} {"train_loss": -11.57661247253418, "global_step": 441496, "epoch": 2627} {"train_loss": -12.585907936096191, "global_step": 441497, "epoch": 2627} {"train_loss": -12.37887191772461, "global_step": 441498, "epoch": 2627} {"train_loss": -12.602351188659668, "global_step": 441499, "epoch": 2627} {"train_loss": -12.434712409973145, "global_step": 441500, "epoch": 2627} {"train_loss": -12.023050308227539, "global_step": 441501, "epoch": 2627} {"train_loss": -12.23956298828125, "global_step": 441502, "epoch": 2627} {"train_loss": -12.121701314335777, "global_step": 441503, "epoch": 2627, "val_loss": 307999.4375} {"train_loss": -11.98183822631836, "global_step": 441504, "epoch": 2628} {"train_loss": -11.896060943603516, "global_step": 441505, "epoch": 2628} {"train_loss": -12.128134727478027, "global_step": 441506, "epoch": 2628} {"train_loss": -9.777994155883789, "global_step": 441507, "epoch": 2628} {"train_loss": -10.599197387695312, "global_step": 441508, "epoch": 2628} {"train_loss": -9.24559211730957, "global_step": 441509, "epoch": 2628} {"train_loss": -10.411641120910645, "global_step": 441510, "epoch": 2628} {"train_loss": -11.44124984741211, "global_step": 441511, "epoch": 2628} {"train_loss": -11.084708213806152, "global_step": 441512, "epoch": 2628} {"train_loss": -11.674824714660645, "global_step": 441513, "epoch": 2628} {"train_loss": -10.524080276489258, "global_step": 441514, "epoch": 2628} {"train_loss": -11.048885345458984, "global_step": 441515, "epoch": 2628} {"train_loss": -10.49647331237793, "global_step": 441516, "epoch": 2628} {"train_loss": -12.133929252624512, "global_step": 441517, "epoch": 2628} {"train_loss": -10.778855323791504, "global_step": 441518, "epoch": 2628} {"train_loss": -11.779760360717773, "global_step": 441519, "epoch": 2628} {"train_loss": -10.400871276855469, "global_step": 441520, "epoch": 2628} {"train_loss": -11.305122375488281, "global_step": 441521, "epoch": 2628} {"train_loss": -11.337417602539062, "global_step": 441522, "epoch": 2628} {"train_loss": -10.404693603515625, "global_step": 441523, "epoch": 2628} {"train_loss": -11.637365341186523, "global_step": 441524, "epoch": 2628} {"train_loss": -10.460350036621094, "global_step": 441525, "epoch": 2628} {"train_loss": -10.479196548461914, "global_step": 441526, "epoch": 2628} {"train_loss": -10.58497428894043, "global_step": 441527, "epoch": 2628} {"train_loss": -11.605266571044922, "global_step": 441528, "epoch": 2628} {"train_loss": -10.37872314453125, "global_step": 441529, "epoch": 2628} {"train_loss": -11.715566635131836, "global_step": 441530, "epoch": 2628} {"train_loss": -11.410123825073242, "global_step": 441531, "epoch": 2628} {"train_loss": -11.365099906921387, "global_step": 441532, "epoch": 2628} {"train_loss": -11.143060684204102, "global_step": 441533, "epoch": 2628} {"train_loss": -11.149700164794922, "global_step": 441534, "epoch": 2628} {"train_loss": -11.4124755859375, "global_step": 441535, "epoch": 2628} {"train_loss": -10.9619140625, "global_step": 441536, "epoch": 2628} {"train_loss": -11.870233535766602, "global_step": 441537, "epoch": 2628} {"train_loss": -11.009897232055664, "global_step": 441538, "epoch": 2628} {"train_loss": -11.322084426879883, "global_step": 441539, "epoch": 2628} {"train_loss": -11.894227981567383, "global_step": 441540, "epoch": 2628} {"train_loss": -11.663654327392578, "global_step": 441541, "epoch": 2628} {"train_loss": -12.1382474899292, "global_step": 441542, "epoch": 2628} {"train_loss": -10.768425941467285, "global_step": 441543, "epoch": 2628} {"train_loss": -11.96815299987793, "global_step": 441544, "epoch": 2628} {"train_loss": -11.549527168273926, "global_step": 441545, "epoch": 2628} {"train_loss": -11.471101760864258, "global_step": 441546, "epoch": 2628} {"train_loss": -11.723546981811523, "global_step": 441547, "epoch": 2628} {"train_loss": -11.31004810333252, "global_step": 441548, "epoch": 2628} {"train_loss": -11.922568321228027, "global_step": 441549, "epoch": 2628} {"train_loss": -11.8439302444458, "global_step": 441550, "epoch": 2628} {"train_loss": -11.919122695922852, "global_step": 441551, "epoch": 2628} {"train_loss": -11.976821899414062, "global_step": 441552, "epoch": 2628} {"train_loss": -11.817605018615723, "global_step": 441553, "epoch": 2628} {"train_loss": -11.96950912475586, "global_step": 441554, "epoch": 2628} {"train_loss": -11.919376373291016, "global_step": 441555, "epoch": 2628} {"train_loss": -12.399852752685547, "global_step": 441556, "epoch": 2628} {"train_loss": -12.085537910461426, "global_step": 441557, "epoch": 2628} {"train_loss": -12.253997802734375, "global_step": 441558, "epoch": 2628} {"train_loss": -12.468116760253906, "global_step": 441559, "epoch": 2628} {"train_loss": -12.297245979309082, "global_step": 441560, "epoch": 2628} {"train_loss": -12.326114654541016, "global_step": 441561, "epoch": 2628} {"train_loss": -12.366199493408203, "global_step": 441562, "epoch": 2628} {"train_loss": -12.270149230957031, "global_step": 441563, "epoch": 2628} {"train_loss": -12.362215042114258, "global_step": 441564, "epoch": 2628} {"train_loss": -12.49819564819336, "global_step": 441565, "epoch": 2628} {"train_loss": -12.57182788848877, "global_step": 441566, "epoch": 2628} {"train_loss": -12.380270004272461, "global_step": 441567, "epoch": 2628} {"train_loss": -12.350343704223633, "global_step": 441568, "epoch": 2628} {"train_loss": -12.53245735168457, "global_step": 441569, "epoch": 2628} {"train_loss": -12.159337997436523, "global_step": 441570, "epoch": 2628} {"train_loss": -12.26909065246582, "global_step": 441571, "epoch": 2628} {"train_loss": -12.222824096679688, "global_step": 441572, "epoch": 2628} {"train_loss": -12.411295890808105, "global_step": 441573, "epoch": 2628} {"train_loss": -12.365535736083984, "global_step": 441574, "epoch": 2628} {"train_loss": -12.437943458557129, "global_step": 441575, "epoch": 2628} {"train_loss": -12.674060821533203, "global_step": 441576, "epoch": 2628} {"train_loss": -12.358190536499023, "global_step": 441577, "epoch": 2628} {"train_loss": -12.599132537841797, "global_step": 441578, "epoch": 2628} {"train_loss": -12.607122421264648, "global_step": 441579, "epoch": 2628} {"train_loss": -12.669095993041992, "global_step": 441580, "epoch": 2628} {"train_loss": -12.582636833190918, "global_step": 441581, "epoch": 2628} {"train_loss": -12.524181365966797, "global_step": 441582, "epoch": 2628} {"train_loss": -12.64790153503418, "global_step": 441583, "epoch": 2628} {"train_loss": -12.510396957397461, "global_step": 441584, "epoch": 2628} {"train_loss": -12.432644844055176, "global_step": 441585, "epoch": 2628} {"train_loss": -12.545069694519043, "global_step": 441586, "epoch": 2628} {"train_loss": -12.594598770141602, "global_step": 441587, "epoch": 2628} {"train_loss": -12.52944564819336, "global_step": 441588, "epoch": 2628} {"train_loss": -12.820758819580078, "global_step": 441589, "epoch": 2628} {"train_loss": -12.664295196533203, "global_step": 441590, "epoch": 2628} {"train_loss": -12.87994384765625, "global_step": 441591, "epoch": 2628} {"train_loss": -12.847709655761719, "global_step": 441592, "epoch": 2628} {"train_loss": -12.751749038696289, "global_step": 441593, "epoch": 2628} {"train_loss": -12.779923439025879, "global_step": 441594, "epoch": 2628} {"train_loss": -12.857089042663574, "global_step": 441595, "epoch": 2628} {"train_loss": -12.854974746704102, "global_step": 441596, "epoch": 2628} {"train_loss": -12.774663925170898, "global_step": 441597, "epoch": 2628} {"train_loss": -12.612768173217773, "global_step": 441598, "epoch": 2628} {"train_loss": -12.935365676879883, "global_step": 441599, "epoch": 2628} {"train_loss": -12.858072280883789, "global_step": 441600, "epoch": 2628} {"train_loss": -12.841930389404297, "global_step": 441601, "epoch": 2628} {"train_loss": -12.905472755432129, "global_step": 441602, "epoch": 2628} {"train_loss": -12.82882022857666, "global_step": 441603, "epoch": 2628} {"train_loss": -12.823396682739258, "global_step": 441604, "epoch": 2628} {"train_loss": -12.711286544799805, "global_step": 441605, "epoch": 2628} {"train_loss": -12.795411109924316, "global_step": 441606, "epoch": 2628} {"train_loss": -12.808073997497559, "global_step": 441607, "epoch": 2628} {"train_loss": -12.567728042602539, "global_step": 441608, "epoch": 2628} {"train_loss": -12.92220687866211, "global_step": 441609, "epoch": 2628} {"train_loss": -12.654281616210938, "global_step": 441610, "epoch": 2628} {"train_loss": -12.60188102722168, "global_step": 441611, "epoch": 2628} {"train_loss": -12.990804672241211, "global_step": 441612, "epoch": 2628} {"train_loss": -12.87153434753418, "global_step": 441613, "epoch": 2628} {"train_loss": -12.937820434570312, "global_step": 441614, "epoch": 2628} {"train_loss": -12.904023170471191, "global_step": 441615, "epoch": 2628} {"train_loss": -12.830738067626953, "global_step": 441616, "epoch": 2628} {"train_loss": -12.940767288208008, "global_step": 441617, "epoch": 2628} {"train_loss": -12.820358276367188, "global_step": 441618, "epoch": 2628} {"train_loss": -12.946731567382812, "global_step": 441619, "epoch": 2628} {"train_loss": -12.797971725463867, "global_step": 441620, "epoch": 2628} {"train_loss": -12.807247161865234, "global_step": 441621, "epoch": 2628} {"train_loss": -12.43771743774414, "global_step": 441622, "epoch": 2628} {"train_loss": -12.837907791137695, "global_step": 441623, "epoch": 2628} {"train_loss": -12.587942123413086, "global_step": 441624, "epoch": 2628} {"train_loss": -12.784457206726074, "global_step": 441625, "epoch": 2628} {"train_loss": -12.750133514404297, "global_step": 441626, "epoch": 2628} {"train_loss": -12.711381912231445, "global_step": 441627, "epoch": 2628} {"train_loss": -12.578580856323242, "global_step": 441628, "epoch": 2628} {"train_loss": -12.355697631835938, "global_step": 441629, "epoch": 2628} {"train_loss": -12.628999710083008, "global_step": 441630, "epoch": 2628} {"train_loss": -13.030296325683594, "global_step": 441631, "epoch": 2628} {"train_loss": -12.538557052612305, "global_step": 441632, "epoch": 2628} {"train_loss": -12.545862197875977, "global_step": 441633, "epoch": 2628} {"train_loss": -12.539040565490723, "global_step": 441634, "epoch": 2628} {"train_loss": -12.815108299255371, "global_step": 441635, "epoch": 2628} {"train_loss": -13.036474227905273, "global_step": 441636, "epoch": 2628} {"train_loss": -12.494863510131836, "global_step": 441637, "epoch": 2628} {"train_loss": -12.360166549682617, "global_step": 441638, "epoch": 2628} {"train_loss": -12.384237289428711, "global_step": 441639, "epoch": 2628} {"train_loss": -12.722225189208984, "global_step": 441640, "epoch": 2628} {"train_loss": -11.668342590332031, "global_step": 441641, "epoch": 2628} {"train_loss": -10.603089332580566, "global_step": 441642, "epoch": 2628} {"train_loss": -11.35129165649414, "global_step": 441643, "epoch": 2628} {"train_loss": -12.199348449707031, "global_step": 441644, "epoch": 2628} {"train_loss": -12.241774559020996, "global_step": 441645, "epoch": 2628} {"train_loss": -12.261795997619629, "global_step": 441646, "epoch": 2628} {"train_loss": -12.050837516784668, "global_step": 441647, "epoch": 2628} {"train_loss": -10.931995391845703, "global_step": 441648, "epoch": 2628} {"train_loss": -12.280893325805664, "global_step": 441649, "epoch": 2628} {"train_loss": -11.626745223999023, "global_step": 441650, "epoch": 2628} {"train_loss": -10.539069175720215, "global_step": 441651, "epoch": 2628} {"train_loss": -12.105478286743164, "global_step": 441652, "epoch": 2628} {"train_loss": -12.198661804199219, "global_step": 441653, "epoch": 2628} {"train_loss": -11.1187744140625, "global_step": 441654, "epoch": 2628} {"train_loss": -11.178999900817871, "global_step": 441655, "epoch": 2628} {"train_loss": -12.000045776367188, "global_step": 441656, "epoch": 2628} {"train_loss": -12.192072868347168, "global_step": 441657, "epoch": 2628} {"train_loss": -11.455458641052246, "global_step": 441658, "epoch": 2628} {"train_loss": -11.457286834716797, "global_step": 441659, "epoch": 2628} {"train_loss": -12.201635360717773, "global_step": 441660, "epoch": 2628} {"train_loss": -11.288655281066895, "global_step": 441661, "epoch": 2628} {"train_loss": -11.791736602783203, "global_step": 441662, "epoch": 2628} {"train_loss": -11.669511795043945, "global_step": 441663, "epoch": 2628} {"train_loss": -11.211780548095703, "global_step": 441664, "epoch": 2628} {"train_loss": -11.632250785827637, "global_step": 441665, "epoch": 2628} {"train_loss": -12.016048431396484, "global_step": 441666, "epoch": 2628} {"train_loss": -12.303105354309082, "global_step": 441667, "epoch": 2628} {"train_loss": -12.323537826538086, "global_step": 441668, "epoch": 2628} {"train_loss": -11.655879974365234, "global_step": 441669, "epoch": 2628} {"train_loss": -12.432126998901367, "global_step": 441670, "epoch": 2628} {"train_loss": -12.04730224609375, "global_step": 441671, "epoch": 2628, "val_loss": 313686.8125} {"train_loss": -11.724822044372559, "global_step": 441672, "epoch": 2629} {"train_loss": -10.663163185119629, "global_step": 441673, "epoch": 2629} {"train_loss": -11.209365844726562, "global_step": 441674, "epoch": 2629} {"train_loss": -10.533726692199707, "global_step": 441675, "epoch": 2629} {"train_loss": -11.263372421264648, "global_step": 441676, "epoch": 2629} {"train_loss": -9.380850791931152, "global_step": 441677, "epoch": 2629} {"train_loss": -9.558456420898438, "global_step": 441678, "epoch": 2629} {"train_loss": -9.797683715820312, "global_step": 441679, "epoch": 2629} {"train_loss": -9.271322250366211, "global_step": 441680, "epoch": 2629} {"train_loss": -11.229007720947266, "global_step": 441681, "epoch": 2629} {"train_loss": -10.947566986083984, "global_step": 441682, "epoch": 2629} {"train_loss": -11.57386589050293, "global_step": 441683, "epoch": 2629} {"train_loss": -11.070384979248047, "global_step": 441684, "epoch": 2629} {"train_loss": -11.495973587036133, "global_step": 441685, "epoch": 2629} {"train_loss": -11.372512817382812, "global_step": 441686, "epoch": 2629} {"train_loss": -10.905802726745605, "global_step": 441687, "epoch": 2629} {"train_loss": -11.44758129119873, "global_step": 441688, "epoch": 2629} {"train_loss": -10.791465759277344, "global_step": 441689, "epoch": 2629} {"train_loss": -12.051773071289062, "global_step": 441690, "epoch": 2629} {"train_loss": -11.110694885253906, "global_step": 441691, "epoch": 2629} {"train_loss": -11.567761421203613, "global_step": 441692, "epoch": 2629} {"train_loss": -11.601469039916992, "global_step": 441693, "epoch": 2629} {"train_loss": -10.831789016723633, "global_step": 441694, "epoch": 2629} {"train_loss": -11.17560863494873, "global_step": 441695, "epoch": 2629} {"train_loss": -10.657052993774414, "global_step": 441696, "epoch": 2629} {"train_loss": -10.954069137573242, "global_step": 441697, "epoch": 2629} {"train_loss": -11.325892448425293, "global_step": 441698, "epoch": 2629} {"train_loss": -11.374494552612305, "global_step": 441699, "epoch": 2629} {"train_loss": -10.606025695800781, "global_step": 441700, "epoch": 2629} {"train_loss": -12.207351684570312, "global_step": 441701, "epoch": 2629} {"train_loss": -10.93585205078125, "global_step": 441702, "epoch": 2629} {"train_loss": -11.50221061706543, "global_step": 441703, "epoch": 2629} {"train_loss": -11.504297256469727, "global_step": 441704, "epoch": 2629} {"train_loss": -10.940765380859375, "global_step": 441705, "epoch": 2629} {"train_loss": -12.05634880065918, "global_step": 441706, "epoch": 2629} {"train_loss": -11.040555000305176, "global_step": 441707, "epoch": 2629} {"train_loss": -12.017809867858887, "global_step": 441708, "epoch": 2629} {"train_loss": -11.488692283630371, "global_step": 441709, "epoch": 2629} {"train_loss": -11.934000015258789, "global_step": 441710, "epoch": 2629} {"train_loss": -11.376565933227539, "global_step": 441711, "epoch": 2629} {"train_loss": -12.020404815673828, "global_step": 441712, "epoch": 2629} {"train_loss": -11.315057754516602, "global_step": 441713, "epoch": 2629} {"train_loss": -11.247413635253906, "global_step": 441714, "epoch": 2629} {"train_loss": -11.644673347473145, "global_step": 441715, "epoch": 2629} {"train_loss": -11.628564834594727, "global_step": 441716, "epoch": 2629} {"train_loss": -11.764191627502441, "global_step": 441717, "epoch": 2629} {"train_loss": -12.062515258789062, "global_step": 441718, "epoch": 2629} {"train_loss": -12.042569160461426, "global_step": 441719, "epoch": 2629} {"train_loss": -12.050941467285156, "global_step": 441720, "epoch": 2629} {"train_loss": -11.978765487670898, "global_step": 441721, "epoch": 2629} {"train_loss": -11.839128494262695, "global_step": 441722, "epoch": 2629} {"train_loss": -11.668684005737305, "global_step": 441723, "epoch": 2629} {"train_loss": -12.177274703979492, "global_step": 441724, "epoch": 2629} {"train_loss": -11.811147689819336, "global_step": 441725, "epoch": 2629} {"train_loss": -12.109314918518066, "global_step": 441726, "epoch": 2629} {"train_loss": -12.068948745727539, "global_step": 441727, "epoch": 2629} {"train_loss": -12.149394989013672, "global_step": 441728, "epoch": 2629} {"train_loss": -11.887779235839844, "global_step": 441729, "epoch": 2629} {"train_loss": -12.45052719116211, "global_step": 441730, "epoch": 2629} {"train_loss": -12.068216323852539, "global_step": 441731, "epoch": 2629} {"train_loss": -12.355448722839355, "global_step": 441732, "epoch": 2629} {"train_loss": -12.2471923828125, "global_step": 441733, "epoch": 2629} {"train_loss": -11.944430351257324, "global_step": 441734, "epoch": 2629} {"train_loss": -12.023852348327637, "global_step": 441735, "epoch": 2629} {"train_loss": -12.531600952148438, "global_step": 441736, "epoch": 2629} {"train_loss": -11.855093002319336, "global_step": 441737, "epoch": 2629} {"train_loss": -12.321049690246582, "global_step": 441738, "epoch": 2629} {"train_loss": -12.313854217529297, "global_step": 441739, "epoch": 2629} {"train_loss": -12.108255386352539, "global_step": 441740, "epoch": 2629} {"train_loss": -12.088883399963379, "global_step": 441741, "epoch": 2629} {"train_loss": -11.876758575439453, "global_step": 441742, "epoch": 2629} {"train_loss": -11.841300964355469, "global_step": 441743, "epoch": 2629} {"train_loss": -12.241257667541504, "global_step": 441744, "epoch": 2629} {"train_loss": -11.977109909057617, "global_step": 441745, "epoch": 2629} {"train_loss": -11.8956937789917, "global_step": 441746, "epoch": 2629} {"train_loss": -12.445026397705078, "global_step": 441747, "epoch": 2629} {"train_loss": -12.116779327392578, "global_step": 441748, "epoch": 2629} {"train_loss": -12.229103088378906, "global_step": 441749, "epoch": 2629} {"train_loss": -12.217308044433594, "global_step": 441750, "epoch": 2629} {"train_loss": -12.092118263244629, "global_step": 441751, "epoch": 2629} {"train_loss": -12.561359405517578, "global_step": 441752, "epoch": 2629} {"train_loss": -12.438474655151367, "global_step": 441753, "epoch": 2629} {"train_loss": -11.956206321716309, "global_step": 441754, "epoch": 2629} {"train_loss": -12.211402893066406, "global_step": 441755, "epoch": 2629} {"train_loss": -12.119626998901367, "global_step": 441756, "epoch": 2629} {"train_loss": -12.588151931762695, "global_step": 441757, "epoch": 2629} {"train_loss": -12.415648460388184, "global_step": 441758, "epoch": 2629} {"train_loss": -12.242265701293945, "global_step": 441759, "epoch": 2629} {"train_loss": -12.162643432617188, "global_step": 441760, "epoch": 2629} {"train_loss": -12.309285163879395, "global_step": 441761, "epoch": 2629} {"train_loss": -12.432245254516602, "global_step": 441762, "epoch": 2629} {"train_loss": -12.415424346923828, "global_step": 441763, "epoch": 2629} {"train_loss": -12.055680274963379, "global_step": 441764, "epoch": 2629} {"train_loss": -12.680850982666016, "global_step": 441765, "epoch": 2629} {"train_loss": -12.245015144348145, "global_step": 441766, "epoch": 2629} {"train_loss": -12.305027961730957, "global_step": 441767, "epoch": 2629} {"train_loss": -12.414724349975586, "global_step": 441768, "epoch": 2629} {"train_loss": -12.412477493286133, "global_step": 441769, "epoch": 2629} {"train_loss": -12.388227462768555, "global_step": 441770, "epoch": 2629} {"train_loss": -12.502703666687012, "global_step": 441771, "epoch": 2629} {"train_loss": -12.522455215454102, "global_step": 441772, "epoch": 2629} {"train_loss": -12.527700424194336, "global_step": 441773, "epoch": 2629} {"train_loss": -12.532005310058594, "global_step": 441774, "epoch": 2629} {"train_loss": -12.722162246704102, "global_step": 441775, "epoch": 2629} {"train_loss": -12.708610534667969, "global_step": 441776, "epoch": 2629} {"train_loss": -12.64527702331543, "global_step": 441777, "epoch": 2629} {"train_loss": -12.534586906433105, "global_step": 441778, "epoch": 2629} {"train_loss": -12.574816703796387, "global_step": 441779, "epoch": 2629} {"train_loss": -12.72269058227539, "global_step": 441780, "epoch": 2629} {"train_loss": -12.380680084228516, "global_step": 441781, "epoch": 2629} {"train_loss": -12.478128433227539, "global_step": 441782, "epoch": 2629} {"train_loss": -12.88937759399414, "global_step": 441783, "epoch": 2629} {"train_loss": -12.723608016967773, "global_step": 441784, "epoch": 2629} {"train_loss": -12.813764572143555, "global_step": 441785, "epoch": 2629} {"train_loss": -12.510377883911133, "global_step": 441786, "epoch": 2629} {"train_loss": -12.879301071166992, "global_step": 441787, "epoch": 2629} {"train_loss": -12.552444458007812, "global_step": 441788, "epoch": 2629} {"train_loss": -12.709539413452148, "global_step": 441789, "epoch": 2629} {"train_loss": -12.546627044677734, "global_step": 441790, "epoch": 2629} {"train_loss": -12.366653442382812, "global_step": 441791, "epoch": 2629} {"train_loss": -12.728658676147461, "global_step": 441792, "epoch": 2629} {"train_loss": -12.47435188293457, "global_step": 441793, "epoch": 2629} {"train_loss": -12.197093963623047, "global_step": 441794, "epoch": 2629} {"train_loss": -12.702783584594727, "global_step": 441795, "epoch": 2629} {"train_loss": -12.316863059997559, "global_step": 441796, "epoch": 2629} {"train_loss": -12.94297981262207, "global_step": 441797, "epoch": 2629} {"train_loss": -12.434884071350098, "global_step": 441798, "epoch": 2629} {"train_loss": -12.499135971069336, "global_step": 441799, "epoch": 2629} {"train_loss": -12.696609497070312, "global_step": 441800, "epoch": 2629} {"train_loss": -12.484128952026367, "global_step": 441801, "epoch": 2629} {"train_loss": -12.494138717651367, "global_step": 441802, "epoch": 2629} {"train_loss": -12.703611373901367, "global_step": 441803, "epoch": 2629} {"train_loss": -12.41102409362793, "global_step": 441804, "epoch": 2629} {"train_loss": -12.574934005737305, "global_step": 441805, "epoch": 2629} {"train_loss": -12.283108711242676, "global_step": 441806, "epoch": 2629} {"train_loss": -12.826723098754883, "global_step": 441807, "epoch": 2629} {"train_loss": -12.723898887634277, "global_step": 441808, "epoch": 2629} {"train_loss": -12.606298446655273, "global_step": 441809, "epoch": 2629} {"train_loss": -12.520875930786133, "global_step": 441810, "epoch": 2629} {"train_loss": -12.665675163269043, "global_step": 441811, "epoch": 2629} {"train_loss": -12.84961223602295, "global_step": 441812, "epoch": 2629} {"train_loss": -12.562789916992188, "global_step": 441813, "epoch": 2629} {"train_loss": -12.559174537658691, "global_step": 441814, "epoch": 2629} {"train_loss": -12.674330711364746, "global_step": 441815, "epoch": 2629} {"train_loss": -12.753119468688965, "global_step": 441816, "epoch": 2629} {"train_loss": -12.814529418945312, "global_step": 441817, "epoch": 2629} {"train_loss": -12.486104965209961, "global_step": 441818, "epoch": 2629} {"train_loss": -12.810429573059082, "global_step": 441819, "epoch": 2629} {"train_loss": -12.87819766998291, "global_step": 441820, "epoch": 2629} {"train_loss": -12.02316665649414, "global_step": 441821, "epoch": 2629} {"train_loss": -12.130071640014648, "global_step": 441822, "epoch": 2629} {"train_loss": -12.306995391845703, "global_step": 441823, "epoch": 2629} {"train_loss": -11.374784469604492, "global_step": 441824, "epoch": 2629} {"train_loss": -12.546345710754395, "global_step": 441825, "epoch": 2629} {"train_loss": -11.108848571777344, "global_step": 441826, "epoch": 2629} {"train_loss": -10.925695419311523, "global_step": 441827, "epoch": 2629} {"train_loss": -12.324493408203125, "global_step": 441828, "epoch": 2629} {"train_loss": -11.890838623046875, "global_step": 441829, "epoch": 2629} {"train_loss": -12.158559799194336, "global_step": 441830, "epoch": 2629} {"train_loss": -12.24943733215332, "global_step": 441831, "epoch": 2629} {"train_loss": -11.694198608398438, "global_step": 441832, "epoch": 2629} {"train_loss": -12.040250778198242, "global_step": 441833, "epoch": 2629} {"train_loss": -11.73038101196289, "global_step": 441834, "epoch": 2629} {"train_loss": -12.232460021972656, "global_step": 441835, "epoch": 2629} {"train_loss": -12.202744483947754, "global_step": 441836, "epoch": 2629} {"train_loss": -11.828512191772461, "global_step": 441837, "epoch": 2629} {"train_loss": -12.256322860717773, "global_step": 441838, "epoch": 2629} {"train_loss": -12.002794691494532, "global_step": 441839, "epoch": 2629, "val_loss": 308734.375} {"train_loss": -11.572769165039062, "global_step": 441840, "epoch": 2630} {"train_loss": -12.471708297729492, "global_step": 441841, "epoch": 2630} {"train_loss": -11.505611419677734, "global_step": 441842, "epoch": 2630} {"train_loss": -12.222000122070312, "global_step": 441843, "epoch": 2630} {"train_loss": -12.210987091064453, "global_step": 441844, "epoch": 2630} {"train_loss": -12.054855346679688, "global_step": 441845, "epoch": 2630} {"train_loss": -12.331440925598145, "global_step": 441846, "epoch": 2630} {"train_loss": -12.466202735900879, "global_step": 441847, "epoch": 2630} {"train_loss": -12.440183639526367, "global_step": 441848, "epoch": 2630} {"train_loss": -12.294672966003418, "global_step": 441849, "epoch": 2630} {"train_loss": -12.292333602905273, "global_step": 441850, "epoch": 2630} {"train_loss": -12.535226821899414, "global_step": 441851, "epoch": 2630} {"train_loss": -12.76015853881836, "global_step": 441852, "epoch": 2630} {"train_loss": -12.545488357543945, "global_step": 441853, "epoch": 2630} {"train_loss": -12.082332611083984, "global_step": 441854, "epoch": 2630} {"train_loss": -12.246500015258789, "global_step": 441855, "epoch": 2630} {"train_loss": -11.920913696289062, "global_step": 441856, "epoch": 2630} {"train_loss": -11.811734199523926, "global_step": 441857, "epoch": 2630} {"train_loss": -12.076028823852539, "global_step": 441858, "epoch": 2630} {"train_loss": -11.052667617797852, "global_step": 441859, "epoch": 2630} {"train_loss": -11.24276351928711, "global_step": 441860, "epoch": 2630} {"train_loss": -12.139372825622559, "global_step": 441861, "epoch": 2630} {"train_loss": -11.835208892822266, "global_step": 441862, "epoch": 2630} {"train_loss": -12.092533111572266, "global_step": 441863, "epoch": 2630} {"train_loss": -12.434369087219238, "global_step": 441864, "epoch": 2630} {"train_loss": -11.851200103759766, "global_step": 441865, "epoch": 2630} {"train_loss": -11.427330017089844, "global_step": 441866, "epoch": 2630} {"train_loss": -12.059736251831055, "global_step": 441867, "epoch": 2630} {"train_loss": -11.784046173095703, "global_step": 441868, "epoch": 2630} {"train_loss": -11.927324295043945, "global_step": 441869, "epoch": 2630} {"train_loss": -12.121770858764648, "global_step": 441870, "epoch": 2630} {"train_loss": -11.835762023925781, "global_step": 441871, "epoch": 2630} {"train_loss": -11.887972831726074, "global_step": 441872, "epoch": 2630} {"train_loss": -12.209085464477539, "global_step": 441873, "epoch": 2630} {"train_loss": -11.782861709594727, "global_step": 441874, "epoch": 2630} {"train_loss": -11.675603866577148, "global_step": 441875, "epoch": 2630} {"train_loss": -12.063030242919922, "global_step": 441876, "epoch": 2630} {"train_loss": -11.361618995666504, "global_step": 441877, "epoch": 2630} {"train_loss": -11.758014678955078, "global_step": 441878, "epoch": 2630} {"train_loss": -11.296031951904297, "global_step": 441879, "epoch": 2630} {"train_loss": -11.839102745056152, "global_step": 441880, "epoch": 2630} {"train_loss": -11.643539428710938, "global_step": 441881, "epoch": 2630} {"train_loss": -11.906982421875, "global_step": 441882, "epoch": 2630} {"train_loss": -11.845874786376953, "global_step": 441883, "epoch": 2630} {"train_loss": -12.400819778442383, "global_step": 441884, "epoch": 2630} {"train_loss": -11.688539505004883, "global_step": 441885, "epoch": 2630} {"train_loss": -12.301128387451172, "global_step": 441886, "epoch": 2630} {"train_loss": -12.378735542297363, "global_step": 441887, "epoch": 2630} {"train_loss": -12.07509994506836, "global_step": 441888, "epoch": 2630} {"train_loss": -12.053749084472656, "global_step": 441889, "epoch": 2630} {"train_loss": -11.772928237915039, "global_step": 441890, "epoch": 2630} {"train_loss": -12.2171630859375, "global_step": 441891, "epoch": 2630} {"train_loss": -11.646868705749512, "global_step": 441892, "epoch": 2630} {"train_loss": -11.923343658447266, "global_step": 441893, "epoch": 2630} {"train_loss": -12.296429634094238, "global_step": 441894, "epoch": 2630} {"train_loss": -11.80703353881836, "global_step": 441895, "epoch": 2630} {"train_loss": -12.363710403442383, "global_step": 441896, "epoch": 2630} {"train_loss": -12.18046760559082, "global_step": 441897, "epoch": 2630} {"train_loss": -12.224029541015625, "global_step": 441898, "epoch": 2630} {"train_loss": -11.888803482055664, "global_step": 441899, "epoch": 2630} {"train_loss": -11.79726791381836, "global_step": 441900, "epoch": 2630} {"train_loss": -12.222658157348633, "global_step": 441901, "epoch": 2630} {"train_loss": -12.450296401977539, "global_step": 441902, "epoch": 2630} {"train_loss": -11.976030349731445, "global_step": 441903, "epoch": 2630} {"train_loss": -12.509084701538086, "global_step": 441904, "epoch": 2630} {"train_loss": -12.456365585327148, "global_step": 441905, "epoch": 2630} {"train_loss": -12.750185012817383, "global_step": 441906, "epoch": 2630} {"train_loss": -12.094114303588867, "global_step": 441907, "epoch": 2630} {"train_loss": -12.370513916015625, "global_step": 441908, "epoch": 2630} {"train_loss": -12.645984649658203, "global_step": 441909, "epoch": 2630} {"train_loss": -12.345521926879883, "global_step": 441910, "epoch": 2630} {"train_loss": -12.690168380737305, "global_step": 441911, "epoch": 2630} {"train_loss": -12.456584930419922, "global_step": 441912, "epoch": 2630} {"train_loss": -12.44559097290039, "global_step": 441913, "epoch": 2630} {"train_loss": -12.57892894744873, "global_step": 441914, "epoch": 2630} {"train_loss": -12.309041023254395, "global_step": 441915, "epoch": 2630} {"train_loss": -12.390958786010742, "global_step": 441916, "epoch": 2630} {"train_loss": -12.819417953491211, "global_step": 441917, "epoch": 2630} {"train_loss": -12.627135276794434, "global_step": 441918, "epoch": 2630} {"train_loss": -12.710987091064453, "global_step": 441919, "epoch": 2630} {"train_loss": -12.548303604125977, "global_step": 441920, "epoch": 2630} {"train_loss": -12.641889572143555, "global_step": 441921, "epoch": 2630} {"train_loss": -12.640392303466797, "global_step": 441922, "epoch": 2630} {"train_loss": -12.31678581237793, "global_step": 441923, "epoch": 2630} {"train_loss": -12.687533378601074, "global_step": 441924, "epoch": 2630} {"train_loss": -12.378549575805664, "global_step": 441925, "epoch": 2630} {"train_loss": -12.662834167480469, "global_step": 441926, "epoch": 2630} {"train_loss": -12.726444244384766, "global_step": 441927, "epoch": 2630} {"train_loss": -12.21230697631836, "global_step": 441928, "epoch": 2630} {"train_loss": -12.567712783813477, "global_step": 441929, "epoch": 2630} {"train_loss": -12.50992202758789, "global_step": 441930, "epoch": 2630} {"train_loss": -12.127660751342773, "global_step": 441931, "epoch": 2630} {"train_loss": -12.753971099853516, "global_step": 441932, "epoch": 2630} {"train_loss": -12.636865615844727, "global_step": 441933, "epoch": 2630} {"train_loss": -12.133700370788574, "global_step": 441934, "epoch": 2630} {"train_loss": -12.643674850463867, "global_step": 441935, "epoch": 2630} {"train_loss": -12.608766555786133, "global_step": 441936, "epoch": 2630} {"train_loss": -12.232693672180176, "global_step": 441937, "epoch": 2630} {"train_loss": -12.754647254943848, "global_step": 441938, "epoch": 2630} {"train_loss": -12.240067481994629, "global_step": 441939, "epoch": 2630} {"train_loss": -12.329607009887695, "global_step": 441940, "epoch": 2630} {"train_loss": -12.13249397277832, "global_step": 441941, "epoch": 2630} {"train_loss": -12.284013748168945, "global_step": 441942, "epoch": 2630} {"train_loss": -12.039458274841309, "global_step": 441943, "epoch": 2630} {"train_loss": -12.75205135345459, "global_step": 441944, "epoch": 2630} {"train_loss": -11.943914413452148, "global_step": 441945, "epoch": 2630} {"train_loss": -12.768402099609375, "global_step": 441946, "epoch": 2630} {"train_loss": -11.59904670715332, "global_step": 441947, "epoch": 2630} {"train_loss": -12.502555847167969, "global_step": 441948, "epoch": 2630} {"train_loss": -12.078241348266602, "global_step": 441949, "epoch": 2630} {"train_loss": -11.676593780517578, "global_step": 441950, "epoch": 2630} {"train_loss": -12.04369831085205, "global_step": 441951, "epoch": 2630} {"train_loss": -12.185680389404297, "global_step": 441952, "epoch": 2630} {"train_loss": -12.648621559143066, "global_step": 441953, "epoch": 2630} {"train_loss": -12.225675582885742, "global_step": 441954, "epoch": 2630} {"train_loss": -12.617013931274414, "global_step": 441955, "epoch": 2630} {"train_loss": -12.407561302185059, "global_step": 441956, "epoch": 2630} {"train_loss": -12.570810317993164, "global_step": 441957, "epoch": 2630} {"train_loss": -12.41081428527832, "global_step": 441958, "epoch": 2630} {"train_loss": -12.377199172973633, "global_step": 441959, "epoch": 2630} {"train_loss": -12.517755508422852, "global_step": 441960, "epoch": 2630} {"train_loss": -12.319976806640625, "global_step": 441961, "epoch": 2630} {"train_loss": -12.599956512451172, "global_step": 441962, "epoch": 2630} {"train_loss": -12.811702728271484, "global_step": 441963, "epoch": 2630} {"train_loss": -12.391803741455078, "global_step": 441964, "epoch": 2630} {"train_loss": -12.68708610534668, "global_step": 441965, "epoch": 2630} {"train_loss": -12.539504051208496, "global_step": 441966, "epoch": 2630} {"train_loss": -12.506404876708984, "global_step": 441967, "epoch": 2630} {"train_loss": -12.512836456298828, "global_step": 441968, "epoch": 2630} {"train_loss": -12.480864524841309, "global_step": 441969, "epoch": 2630} {"train_loss": -12.821674346923828, "global_step": 441970, "epoch": 2630} {"train_loss": -12.709287643432617, "global_step": 441971, "epoch": 2630} {"train_loss": -12.657474517822266, "global_step": 441972, "epoch": 2630} {"train_loss": -12.746687889099121, "global_step": 441973, "epoch": 2630} {"train_loss": -12.721960067749023, "global_step": 441974, "epoch": 2630} {"train_loss": -12.643675804138184, "global_step": 441975, "epoch": 2630} {"train_loss": -12.7893648147583, "global_step": 441976, "epoch": 2630} {"train_loss": -12.795618057250977, "global_step": 441977, "epoch": 2630} {"train_loss": -12.918184280395508, "global_step": 441978, "epoch": 2630} {"train_loss": -12.759214401245117, "global_step": 441979, "epoch": 2630} {"train_loss": -12.64423942565918, "global_step": 441980, "epoch": 2630} {"train_loss": -12.563810348510742, "global_step": 441981, "epoch": 2630} {"train_loss": -12.79946517944336, "global_step": 441982, "epoch": 2630} {"train_loss": -12.647507667541504, "global_step": 441983, "epoch": 2630} {"train_loss": -12.662384986877441, "global_step": 441984, "epoch": 2630} {"train_loss": -12.883041381835938, "global_step": 441985, "epoch": 2630} {"train_loss": -12.818737030029297, "global_step": 441986, "epoch": 2630} {"train_loss": -12.846552848815918, "global_step": 441987, "epoch": 2630} {"train_loss": -12.811016082763672, "global_step": 441988, "epoch": 2630} {"train_loss": -12.527894020080566, "global_step": 441989, "epoch": 2630} {"train_loss": -12.849494934082031, "global_step": 441990, "epoch": 2630} {"train_loss": -12.441329002380371, "global_step": 441991, "epoch": 2630} {"train_loss": -12.82292366027832, "global_step": 441992, "epoch": 2630} {"train_loss": -12.626506805419922, "global_step": 441993, "epoch": 2630} {"train_loss": -12.487302780151367, "global_step": 441994, "epoch": 2630} {"train_loss": -12.464473724365234, "global_step": 441995, "epoch": 2630} {"train_loss": -13.062294006347656, "global_step": 441996, "epoch": 2630} {"train_loss": -11.989143371582031, "global_step": 441997, "epoch": 2630} {"train_loss": -12.177677154541016, "global_step": 441998, "epoch": 2630} {"train_loss": -12.396432876586914, "global_step": 441999, "epoch": 2630} {"train_loss": -10.150688171386719, "global_step": 442000, "epoch": 2630} {"train_loss": -10.735071182250977, "global_step": 442001, "epoch": 2630} {"train_loss": -11.541936874389648, "global_step": 442002, "epoch": 2630} {"train_loss": -11.5444917678833, "global_step": 442003, "epoch": 2630} {"train_loss": -10.773704528808594, "global_step": 442004, "epoch": 2630} {"train_loss": -12.14400577545166, "global_step": 442005, "epoch": 2630} {"train_loss": -9.783212661743164, "global_step": 442006, "epoch": 2630} {"train_loss": -12.236302006812323, "global_step": 442007, "epoch": 2630, "val_loss": 310370.78125, "train_action_mse_error": 1.3609063625335693} {"train_loss": -11.659636497497559, "global_step": 442008, "epoch": 2631} {"train_loss": -10.295819282531738, "global_step": 442009, "epoch": 2631} {"train_loss": -10.1552152633667, "global_step": 442010, "epoch": 2631} {"train_loss": -12.006260871887207, "global_step": 442011, "epoch": 2631} {"train_loss": -11.364330291748047, "global_step": 442012, "epoch": 2631} {"train_loss": -11.082929611206055, "global_step": 442013, "epoch": 2631} {"train_loss": -11.457658767700195, "global_step": 442014, "epoch": 2631} {"train_loss": -11.825664520263672, "global_step": 442015, "epoch": 2631} {"train_loss": -11.629388809204102, "global_step": 442016, "epoch": 2631} {"train_loss": -11.751479148864746, "global_step": 442017, "epoch": 2631} {"train_loss": -11.809104919433594, "global_step": 442018, "epoch": 2631} {"train_loss": -11.711786270141602, "global_step": 442019, "epoch": 2631} {"train_loss": -11.579694747924805, "global_step": 442020, "epoch": 2631} {"train_loss": -11.799843788146973, "global_step": 442021, "epoch": 2631} {"train_loss": -12.162215232849121, "global_step": 442022, "epoch": 2631} {"train_loss": -11.258478164672852, "global_step": 442023, "epoch": 2631} {"train_loss": -12.148908615112305, "global_step": 442024, "epoch": 2631} {"train_loss": -11.869338035583496, "global_step": 442025, "epoch": 2631} {"train_loss": -12.128395080566406, "global_step": 442026, "epoch": 2631} {"train_loss": -12.12503719329834, "global_step": 442027, "epoch": 2631} {"train_loss": -12.176597595214844, "global_step": 442028, "epoch": 2631} {"train_loss": -11.936984062194824, "global_step": 442029, "epoch": 2631} {"train_loss": -12.311847686767578, "global_step": 442030, "epoch": 2631} {"train_loss": -12.509328842163086, "global_step": 442031, "epoch": 2631} {"train_loss": -12.175664901733398, "global_step": 442032, "epoch": 2631} {"train_loss": -12.240621566772461, "global_step": 442033, "epoch": 2631} {"train_loss": -12.17898941040039, "global_step": 442034, "epoch": 2631} {"train_loss": -12.521383285522461, "global_step": 442035, "epoch": 2631} {"train_loss": -12.096830368041992, "global_step": 442036, "epoch": 2631} {"train_loss": -12.278707504272461, "global_step": 442037, "epoch": 2631} {"train_loss": -12.374910354614258, "global_step": 442038, "epoch": 2631} {"train_loss": -12.279077529907227, "global_step": 442039, "epoch": 2631} {"train_loss": -12.303722381591797, "global_step": 442040, "epoch": 2631} {"train_loss": -12.107208251953125, "global_step": 442041, "epoch": 2631} {"train_loss": -12.377689361572266, "global_step": 442042, "epoch": 2631} {"train_loss": -11.938040733337402, "global_step": 442043, "epoch": 2631} {"train_loss": -11.937214851379395, "global_step": 442044, "epoch": 2631} {"train_loss": -12.312496185302734, "global_step": 442045, "epoch": 2631} {"train_loss": -12.130478858947754, "global_step": 442046, "epoch": 2631} {"train_loss": -12.363866806030273, "global_step": 442047, "epoch": 2631} {"train_loss": -12.181554794311523, "global_step": 442048, "epoch": 2631} {"train_loss": -12.348738670349121, "global_step": 442049, "epoch": 2631} {"train_loss": -12.326421737670898, "global_step": 442050, "epoch": 2631} {"train_loss": -12.296168327331543, "global_step": 442051, "epoch": 2631} {"train_loss": -12.566141128540039, "global_step": 442052, "epoch": 2631} {"train_loss": -12.033374786376953, "global_step": 442053, "epoch": 2631} {"train_loss": -12.802560806274414, "global_step": 442054, "epoch": 2631} {"train_loss": -12.039088249206543, "global_step": 442055, "epoch": 2631} {"train_loss": -12.446024894714355, "global_step": 442056, "epoch": 2631} {"train_loss": -12.403409004211426, "global_step": 442057, "epoch": 2631} {"train_loss": -12.384721755981445, "global_step": 442058, "epoch": 2631} {"train_loss": -12.462812423706055, "global_step": 442059, "epoch": 2631} {"train_loss": -12.484227180480957, "global_step": 442060, "epoch": 2631} {"train_loss": -12.33937931060791, "global_step": 442061, "epoch": 2631} {"train_loss": -12.59929084777832, "global_step": 442062, "epoch": 2631} {"train_loss": -12.261409759521484, "global_step": 442063, "epoch": 2631} {"train_loss": -12.10505485534668, "global_step": 442064, "epoch": 2631} {"train_loss": -12.815788269042969, "global_step": 442065, "epoch": 2631} {"train_loss": -12.123254776000977, "global_step": 442066, "epoch": 2631} {"train_loss": -12.295699119567871, "global_step": 442067, "epoch": 2631} {"train_loss": -12.189414024353027, "global_step": 442068, "epoch": 2631} {"train_loss": -12.043033599853516, "global_step": 442069, "epoch": 2631} {"train_loss": -11.759322166442871, "global_step": 442070, "epoch": 2631} {"train_loss": -12.295156478881836, "global_step": 442071, "epoch": 2631} {"train_loss": -12.291603088378906, "global_step": 442072, "epoch": 2631} {"train_loss": -11.748865127563477, "global_step": 442073, "epoch": 2631} {"train_loss": -12.542752265930176, "global_step": 442074, "epoch": 2631} {"train_loss": -12.124074935913086, "global_step": 442075, "epoch": 2631} {"train_loss": -12.40914535522461, "global_step": 442076, "epoch": 2631} {"train_loss": -12.20574951171875, "global_step": 442077, "epoch": 2631} {"train_loss": -12.579095840454102, "global_step": 442078, "epoch": 2631} {"train_loss": -12.192825317382812, "global_step": 442079, "epoch": 2631} {"train_loss": -12.627467155456543, "global_step": 442080, "epoch": 2631} {"train_loss": -11.995698928833008, "global_step": 442081, "epoch": 2631} {"train_loss": -12.51417064666748, "global_step": 442082, "epoch": 2631} {"train_loss": -11.826887130737305, "global_step": 442083, "epoch": 2631} {"train_loss": -12.518760681152344, "global_step": 442084, "epoch": 2631} {"train_loss": -12.242168426513672, "global_step": 442085, "epoch": 2631} {"train_loss": -12.289225578308105, "global_step": 442086, "epoch": 2631} {"train_loss": -12.04153823852539, "global_step": 442087, "epoch": 2631} {"train_loss": -12.550691604614258, "global_step": 442088, "epoch": 2631} {"train_loss": -12.154376983642578, "global_step": 442089, "epoch": 2631} {"train_loss": -12.16232681274414, "global_step": 442090, "epoch": 2631} {"train_loss": -12.63396167755127, "global_step": 442091, "epoch": 2631} {"train_loss": -12.43880844116211, "global_step": 442092, "epoch": 2631} {"train_loss": -12.525630950927734, "global_step": 442093, "epoch": 2631} {"train_loss": -12.369245529174805, "global_step": 442094, "epoch": 2631} {"train_loss": -12.721457481384277, "global_step": 442095, "epoch": 2631} {"train_loss": -12.719602584838867, "global_step": 442096, "epoch": 2631} {"train_loss": -12.453605651855469, "global_step": 442097, "epoch": 2631} {"train_loss": -12.664669036865234, "global_step": 442098, "epoch": 2631} {"train_loss": -12.653938293457031, "global_step": 442099, "epoch": 2631} {"train_loss": -12.492775917053223, "global_step": 442100, "epoch": 2631} {"train_loss": -12.641488075256348, "global_step": 442101, "epoch": 2631} {"train_loss": -12.747800827026367, "global_step": 442102, "epoch": 2631} {"train_loss": -12.75649642944336, "global_step": 442103, "epoch": 2631} {"train_loss": -12.657382011413574, "global_step": 442104, "epoch": 2631} {"train_loss": -12.512639999389648, "global_step": 442105, "epoch": 2631} {"train_loss": -12.498260498046875, "global_step": 442106, "epoch": 2631} {"train_loss": -12.634014129638672, "global_step": 442107, "epoch": 2631} {"train_loss": -12.733176231384277, "global_step": 442108, "epoch": 2631} {"train_loss": -12.85399055480957, "global_step": 442109, "epoch": 2631} {"train_loss": -12.484471321105957, "global_step": 442110, "epoch": 2631} {"train_loss": -12.908735275268555, "global_step": 442111, "epoch": 2631} {"train_loss": -12.00271987915039, "global_step": 442112, "epoch": 2631} {"train_loss": -12.852523803710938, "global_step": 442113, "epoch": 2631} {"train_loss": -12.367507934570312, "global_step": 442114, "epoch": 2631} {"train_loss": -12.041437149047852, "global_step": 442115, "epoch": 2631} {"train_loss": -12.580327987670898, "global_step": 442116, "epoch": 2631} {"train_loss": -12.649572372436523, "global_step": 442117, "epoch": 2631} {"train_loss": -12.556205749511719, "global_step": 442118, "epoch": 2631} {"train_loss": -12.202116012573242, "global_step": 442119, "epoch": 2631} {"train_loss": -12.373894691467285, "global_step": 442120, "epoch": 2631} {"train_loss": -12.65096664428711, "global_step": 442121, "epoch": 2631} {"train_loss": -12.518789291381836, "global_step": 442122, "epoch": 2631} {"train_loss": -12.503360748291016, "global_step": 442123, "epoch": 2631} {"train_loss": -12.174993515014648, "global_step": 442124, "epoch": 2631} {"train_loss": -12.756771087646484, "global_step": 442125, "epoch": 2631} {"train_loss": -12.259358406066895, "global_step": 442126, "epoch": 2631} {"train_loss": -12.214627265930176, "global_step": 442127, "epoch": 2631} {"train_loss": -12.212870597839355, "global_step": 442128, "epoch": 2631} {"train_loss": -12.412939071655273, "global_step": 442129, "epoch": 2631} {"train_loss": -11.873991012573242, "global_step": 442130, "epoch": 2631} {"train_loss": -11.69551944732666, "global_step": 442131, "epoch": 2631} {"train_loss": -12.029255867004395, "global_step": 442132, "epoch": 2631} {"train_loss": -12.626230239868164, "global_step": 442133, "epoch": 2631} {"train_loss": -11.833592414855957, "global_step": 442134, "epoch": 2631} {"train_loss": -10.838048934936523, "global_step": 442135, "epoch": 2631} {"train_loss": -11.990121841430664, "global_step": 442136, "epoch": 2631} {"train_loss": -12.243278503417969, "global_step": 442137, "epoch": 2631} {"train_loss": -12.417560577392578, "global_step": 442138, "epoch": 2631} {"train_loss": -12.390039443969727, "global_step": 442139, "epoch": 2631} {"train_loss": -12.280830383300781, "global_step": 442140, "epoch": 2631} {"train_loss": -12.702856063842773, "global_step": 442141, "epoch": 2631} {"train_loss": -12.660443305969238, "global_step": 442142, "epoch": 2631} {"train_loss": -12.415437698364258, "global_step": 442143, "epoch": 2631} {"train_loss": -12.468186378479004, "global_step": 442144, "epoch": 2631} {"train_loss": -11.980740547180176, "global_step": 442145, "epoch": 2631} {"train_loss": -12.42393684387207, "global_step": 442146, "epoch": 2631} {"train_loss": -10.946577072143555, "global_step": 442147, "epoch": 2631} {"train_loss": -12.647878646850586, "global_step": 442148, "epoch": 2631} {"train_loss": -12.08479118347168, "global_step": 442149, "epoch": 2631} {"train_loss": -11.523954391479492, "global_step": 442150, "epoch": 2631} {"train_loss": -11.9403076171875, "global_step": 442151, "epoch": 2631} {"train_loss": -12.079972267150879, "global_step": 442152, "epoch": 2631} {"train_loss": -10.611024856567383, "global_step": 442153, "epoch": 2631} {"train_loss": -12.09614372253418, "global_step": 442154, "epoch": 2631} {"train_loss": -12.019309997558594, "global_step": 442155, "epoch": 2631} {"train_loss": -11.150663375854492, "global_step": 442156, "epoch": 2631} {"train_loss": -12.272494316101074, "global_step": 442157, "epoch": 2631} {"train_loss": -11.376572608947754, "global_step": 442158, "epoch": 2631} {"train_loss": -11.278877258300781, "global_step": 442159, "epoch": 2631} {"train_loss": -12.516149520874023, "global_step": 442160, "epoch": 2631} {"train_loss": -11.846589088439941, "global_step": 442161, "epoch": 2631} {"train_loss": -11.71689224243164, "global_step": 442162, "epoch": 2631} {"train_loss": -11.678163528442383, "global_step": 442163, "epoch": 2631} {"train_loss": -12.674195289611816, "global_step": 442164, "epoch": 2631} {"train_loss": -11.675115585327148, "global_step": 442165, "epoch": 2631} {"train_loss": -12.892866134643555, "global_step": 442166, "epoch": 2631} {"train_loss": -11.880000114440918, "global_step": 442167, "epoch": 2631} {"train_loss": -12.222114562988281, "global_step": 442168, "epoch": 2631} {"train_loss": -12.227496147155762, "global_step": 442169, "epoch": 2631} {"train_loss": -12.467672348022461, "global_step": 442170, "epoch": 2631} {"train_loss": -12.009197235107422, "global_step": 442171, "epoch": 2631} {"train_loss": -12.469982147216797, "global_step": 442172, "epoch": 2631} {"train_loss": -11.671697616577148, "global_step": 442173, "epoch": 2631} {"train_loss": -12.561378479003906, "global_step": 442174, "epoch": 2631} {"train_loss": -12.183401607331776, "global_step": 442175, "epoch": 2631, "val_loss": 309939.34375} {"train_loss": -12.533215522766113, "global_step": 442176, "epoch": 2632} {"train_loss": -12.015046119689941, "global_step": 442177, "epoch": 2632} {"train_loss": -11.954132080078125, "global_step": 442178, "epoch": 2632} {"train_loss": -11.54987907409668, "global_step": 442179, "epoch": 2632} {"train_loss": -12.360797882080078, "global_step": 442180, "epoch": 2632} {"train_loss": -11.248741149902344, "global_step": 442181, "epoch": 2632} {"train_loss": -12.355682373046875, "global_step": 442182, "epoch": 2632} {"train_loss": -11.819575309753418, "global_step": 442183, "epoch": 2632} {"train_loss": -11.437150955200195, "global_step": 442184, "epoch": 2632} {"train_loss": -12.105579376220703, "global_step": 442185, "epoch": 2632} {"train_loss": -11.019357681274414, "global_step": 442186, "epoch": 2632} {"train_loss": -11.599410057067871, "global_step": 442187, "epoch": 2632} {"train_loss": -11.834911346435547, "global_step": 442188, "epoch": 2632} {"train_loss": -10.696978569030762, "global_step": 442189, "epoch": 2632} {"train_loss": -11.982292175292969, "global_step": 442190, "epoch": 2632} {"train_loss": -11.38539981842041, "global_step": 442191, "epoch": 2632} {"train_loss": -12.281242370605469, "global_step": 442192, "epoch": 2632} {"train_loss": -12.038764953613281, "global_step": 442193, "epoch": 2632} {"train_loss": -11.671762466430664, "global_step": 442194, "epoch": 2632} {"train_loss": -12.28966236114502, "global_step": 442195, "epoch": 2632} {"train_loss": -11.709728240966797, "global_step": 442196, "epoch": 2632} {"train_loss": -11.209647178649902, "global_step": 442197, "epoch": 2632} {"train_loss": -12.274396896362305, "global_step": 442198, "epoch": 2632} {"train_loss": -11.88370132446289, "global_step": 442199, "epoch": 2632} {"train_loss": -11.79808235168457, "global_step": 442200, "epoch": 2632} {"train_loss": -11.806680679321289, "global_step": 442201, "epoch": 2632} {"train_loss": -11.898744583129883, "global_step": 442202, "epoch": 2632} {"train_loss": -10.994159698486328, "global_step": 442203, "epoch": 2632} {"train_loss": -11.602027893066406, "global_step": 442204, "epoch": 2632} {"train_loss": -12.221563339233398, "global_step": 442205, "epoch": 2632} {"train_loss": -11.363635063171387, "global_step": 442206, "epoch": 2632} {"train_loss": -12.193578720092773, "global_step": 442207, "epoch": 2632} {"train_loss": -11.659021377563477, "global_step": 442208, "epoch": 2632} {"train_loss": -12.246504783630371, "global_step": 442209, "epoch": 2632} {"train_loss": -11.836572647094727, "global_step": 442210, "epoch": 2632} {"train_loss": -11.92752742767334, "global_step": 442211, "epoch": 2632} {"train_loss": -12.11385440826416, "global_step": 442212, "epoch": 2632} {"train_loss": -11.773263931274414, "global_step": 442213, "epoch": 2632} {"train_loss": -11.72055435180664, "global_step": 442214, "epoch": 2632} {"train_loss": -11.935006141662598, "global_step": 442215, "epoch": 2632} {"train_loss": -12.01951789855957, "global_step": 442216, "epoch": 2632} {"train_loss": -11.370412826538086, "global_step": 442217, "epoch": 2632} {"train_loss": -12.316168785095215, "global_step": 442218, "epoch": 2632} {"train_loss": -11.571940422058105, "global_step": 442219, "epoch": 2632} {"train_loss": -11.658387184143066, "global_step": 442220, "epoch": 2632} {"train_loss": -11.188713073730469, "global_step": 442221, "epoch": 2632} {"train_loss": -11.465065002441406, "global_step": 442222, "epoch": 2632} {"train_loss": -11.826555252075195, "global_step": 442223, "epoch": 2632} {"train_loss": -11.568648338317871, "global_step": 442224, "epoch": 2632} {"train_loss": -12.253105163574219, "global_step": 442225, "epoch": 2632} {"train_loss": -11.803594589233398, "global_step": 442226, "epoch": 2632} {"train_loss": -12.006854057312012, "global_step": 442227, "epoch": 2632} {"train_loss": -12.214803695678711, "global_step": 442228, "epoch": 2632} {"train_loss": -12.079292297363281, "global_step": 442229, "epoch": 2632} {"train_loss": -11.715822219848633, "global_step": 442230, "epoch": 2632} {"train_loss": -12.033161163330078, "global_step": 442231, "epoch": 2632} {"train_loss": -11.75501823425293, "global_step": 442232, "epoch": 2632} {"train_loss": -11.684329986572266, "global_step": 442233, "epoch": 2632} {"train_loss": -12.275015830993652, "global_step": 442234, "epoch": 2632} {"train_loss": -11.103828430175781, "global_step": 442235, "epoch": 2632} {"train_loss": -11.459473609924316, "global_step": 442236, "epoch": 2632} {"train_loss": -12.089946746826172, "global_step": 442237, "epoch": 2632} {"train_loss": -11.469322204589844, "global_step": 442238, "epoch": 2632} {"train_loss": -12.337739944458008, "global_step": 442239, "epoch": 2632} {"train_loss": -11.51850700378418, "global_step": 442240, "epoch": 2632} {"train_loss": -12.054762840270996, "global_step": 442241, "epoch": 2632} {"train_loss": -12.176347732543945, "global_step": 442242, "epoch": 2632} {"train_loss": -11.793872833251953, "global_step": 442243, "epoch": 2632} {"train_loss": -12.260502815246582, "global_step": 442244, "epoch": 2632} {"train_loss": -12.17109203338623, "global_step": 442245, "epoch": 2632} {"train_loss": -12.507136344909668, "global_step": 442246, "epoch": 2632} {"train_loss": -12.134748458862305, "global_step": 442247, "epoch": 2632} {"train_loss": -12.622152328491211, "global_step": 442248, "epoch": 2632} {"train_loss": -12.264284133911133, "global_step": 442249, "epoch": 2632} {"train_loss": -12.379801750183105, "global_step": 442250, "epoch": 2632} {"train_loss": -12.29452133178711, "global_step": 442251, "epoch": 2632} {"train_loss": -12.058012008666992, "global_step": 442252, "epoch": 2632} {"train_loss": -12.688972473144531, "global_step": 442253, "epoch": 2632} {"train_loss": -12.18870735168457, "global_step": 442254, "epoch": 2632} {"train_loss": -12.684486389160156, "global_step": 442255, "epoch": 2632} {"train_loss": -12.333688735961914, "global_step": 442256, "epoch": 2632} {"train_loss": -12.532864570617676, "global_step": 442257, "epoch": 2632} {"train_loss": -12.225257873535156, "global_step": 442258, "epoch": 2632} {"train_loss": -12.384847640991211, "global_step": 442259, "epoch": 2632} {"train_loss": -12.42422866821289, "global_step": 442260, "epoch": 2632} {"train_loss": -12.49275016784668, "global_step": 442261, "epoch": 2632} {"train_loss": -12.726770401000977, "global_step": 442262, "epoch": 2632} {"train_loss": -12.00725269317627, "global_step": 442263, "epoch": 2632} {"train_loss": -12.71481704711914, "global_step": 442264, "epoch": 2632} {"train_loss": -11.926878929138184, "global_step": 442265, "epoch": 2632} {"train_loss": -12.36941909790039, "global_step": 442266, "epoch": 2632} {"train_loss": -12.288554191589355, "global_step": 442267, "epoch": 2632} {"train_loss": -12.536943435668945, "global_step": 442268, "epoch": 2632} {"train_loss": -12.581523895263672, "global_step": 442269, "epoch": 2632} {"train_loss": -12.11406135559082, "global_step": 442270, "epoch": 2632} {"train_loss": -12.763496398925781, "global_step": 442271, "epoch": 2632} {"train_loss": -12.342998504638672, "global_step": 442272, "epoch": 2632} {"train_loss": -12.119175910949707, "global_step": 442273, "epoch": 2632} {"train_loss": -11.74394416809082, "global_step": 442274, "epoch": 2632} {"train_loss": -12.10171127319336, "global_step": 442275, "epoch": 2632} {"train_loss": -11.928421974182129, "global_step": 442276, "epoch": 2632} {"train_loss": -12.170743942260742, "global_step": 442277, "epoch": 2632} {"train_loss": -12.65113639831543, "global_step": 442278, "epoch": 2632} {"train_loss": -11.408117294311523, "global_step": 442279, "epoch": 2632} {"train_loss": -12.252790451049805, "global_step": 442280, "epoch": 2632} {"train_loss": -10.69352912902832, "global_step": 442281, "epoch": 2632} {"train_loss": -12.595281600952148, "global_step": 442282, "epoch": 2632} {"train_loss": -11.55125904083252, "global_step": 442283, "epoch": 2632} {"train_loss": -12.340080261230469, "global_step": 442284, "epoch": 2632} {"train_loss": -12.195367813110352, "global_step": 442285, "epoch": 2632} {"train_loss": -11.8118896484375, "global_step": 442286, "epoch": 2632} {"train_loss": -12.195621490478516, "global_step": 442287, "epoch": 2632} {"train_loss": -11.228629112243652, "global_step": 442288, "epoch": 2632} {"train_loss": -12.09975528717041, "global_step": 442289, "epoch": 2632} {"train_loss": -12.053353309631348, "global_step": 442290, "epoch": 2632} {"train_loss": -11.780280113220215, "global_step": 442291, "epoch": 2632} {"train_loss": -11.857240676879883, "global_step": 442292, "epoch": 2632} {"train_loss": -11.953695297241211, "global_step": 442293, "epoch": 2632} {"train_loss": -11.86623764038086, "global_step": 442294, "epoch": 2632} {"train_loss": -12.058769226074219, "global_step": 442295, "epoch": 2632} {"train_loss": -11.132261276245117, "global_step": 442296, "epoch": 2632} {"train_loss": -11.867395401000977, "global_step": 442297, "epoch": 2632} {"train_loss": -10.893807411193848, "global_step": 442298, "epoch": 2632} {"train_loss": -10.998056411743164, "global_step": 442299, "epoch": 2632} {"train_loss": -12.011035919189453, "global_step": 442300, "epoch": 2632} {"train_loss": -10.795068740844727, "global_step": 442301, "epoch": 2632} {"train_loss": -11.41445255279541, "global_step": 442302, "epoch": 2632} {"train_loss": -11.494470596313477, "global_step": 442303, "epoch": 2632} {"train_loss": -11.815942764282227, "global_step": 442304, "epoch": 2632} {"train_loss": -11.751640319824219, "global_step": 442305, "epoch": 2632} {"train_loss": -11.933817863464355, "global_step": 442306, "epoch": 2632} {"train_loss": -11.97755241394043, "global_step": 442307, "epoch": 2632} {"train_loss": -11.675345420837402, "global_step": 442308, "epoch": 2632} {"train_loss": -12.330326080322266, "global_step": 442309, "epoch": 2632} {"train_loss": -11.787176132202148, "global_step": 442310, "epoch": 2632} {"train_loss": -11.992822647094727, "global_step": 442311, "epoch": 2632} {"train_loss": -12.055604934692383, "global_step": 442312, "epoch": 2632} {"train_loss": -11.896039962768555, "global_step": 442313, "epoch": 2632} {"train_loss": -12.738268852233887, "global_step": 442314, "epoch": 2632} {"train_loss": -11.870538711547852, "global_step": 442315, "epoch": 2632} {"train_loss": -12.531744003295898, "global_step": 442316, "epoch": 2632} {"train_loss": -12.389017105102539, "global_step": 442317, "epoch": 2632} {"train_loss": -12.332277297973633, "global_step": 442318, "epoch": 2632} {"train_loss": -12.42308521270752, "global_step": 442319, "epoch": 2632} {"train_loss": -12.377614974975586, "global_step": 442320, "epoch": 2632} {"train_loss": -12.526168823242188, "global_step": 442321, "epoch": 2632} {"train_loss": -12.476561546325684, "global_step": 442322, "epoch": 2632} {"train_loss": -12.462799072265625, "global_step": 442323, "epoch": 2632} {"train_loss": -12.445585250854492, "global_step": 442324, "epoch": 2632} {"train_loss": -12.511868476867676, "global_step": 442325, "epoch": 2632} {"train_loss": -12.707254409790039, "global_step": 442326, "epoch": 2632} {"train_loss": -12.582681655883789, "global_step": 442327, "epoch": 2632} {"train_loss": -12.637752532958984, "global_step": 442328, "epoch": 2632} {"train_loss": -12.694941520690918, "global_step": 442329, "epoch": 2632} {"train_loss": -12.41786003112793, "global_step": 442330, "epoch": 2632} {"train_loss": -12.739531517028809, "global_step": 442331, "epoch": 2632} {"train_loss": -12.424018859863281, "global_step": 442332, "epoch": 2632} {"train_loss": -12.690317153930664, "global_step": 442333, "epoch": 2632} {"train_loss": -12.236934661865234, "global_step": 442334, "epoch": 2632} {"train_loss": -12.640460968017578, "global_step": 442335, "epoch": 2632} {"train_loss": -12.704273223876953, "global_step": 442336, "epoch": 2632} {"train_loss": -12.473058700561523, "global_step": 442337, "epoch": 2632} {"train_loss": -12.595882415771484, "global_step": 442338, "epoch": 2632} {"train_loss": -12.585346221923828, "global_step": 442339, "epoch": 2632} {"train_loss": -12.480830192565918, "global_step": 442340, "epoch": 2632} {"train_loss": -12.612227439880371, "global_step": 442341, "epoch": 2632} {"train_loss": -12.675558090209961, "global_step": 442342, "epoch": 2632} {"train_loss": -12.039101441701254, "global_step": 442343, "epoch": 2632, "val_loss": 310164.03125} {"train_loss": -12.69835090637207, "global_step": 442344, "epoch": 2633} {"train_loss": -12.808606147766113, "global_step": 442345, "epoch": 2633} {"train_loss": -12.837139129638672, "global_step": 442346, "epoch": 2633} {"train_loss": -12.806304931640625, "global_step": 442347, "epoch": 2633} {"train_loss": -12.674295425415039, "global_step": 442348, "epoch": 2633} {"train_loss": -12.442359924316406, "global_step": 442349, "epoch": 2633} {"train_loss": -12.724886894226074, "global_step": 442350, "epoch": 2633} {"train_loss": -12.648025512695312, "global_step": 442351, "epoch": 2633} {"train_loss": -12.739496231079102, "global_step": 442352, "epoch": 2633} {"train_loss": -12.359220504760742, "global_step": 442353, "epoch": 2633} {"train_loss": -12.693845748901367, "global_step": 442354, "epoch": 2633} {"train_loss": -12.71828842163086, "global_step": 442355, "epoch": 2633} {"train_loss": -12.594854354858398, "global_step": 442356, "epoch": 2633} {"train_loss": -12.691198348999023, "global_step": 442357, "epoch": 2633} {"train_loss": -12.666590690612793, "global_step": 442358, "epoch": 2633} {"train_loss": -12.827678680419922, "global_step": 442359, "epoch": 2633} {"train_loss": -12.858274459838867, "global_step": 442360, "epoch": 2633} {"train_loss": -12.735755920410156, "global_step": 442361, "epoch": 2633} {"train_loss": -12.722633361816406, "global_step": 442362, "epoch": 2633} {"train_loss": -12.591182708740234, "global_step": 442363, "epoch": 2633} {"train_loss": -12.651681900024414, "global_step": 442364, "epoch": 2633} {"train_loss": -12.56088638305664, "global_step": 442365, "epoch": 2633} {"train_loss": -12.844184875488281, "global_step": 442366, "epoch": 2633} {"train_loss": -12.930749893188477, "global_step": 442367, "epoch": 2633} {"train_loss": -12.535268783569336, "global_step": 442368, "epoch": 2633} {"train_loss": -12.874397277832031, "global_step": 442369, "epoch": 2633} {"train_loss": -12.296411514282227, "global_step": 442370, "epoch": 2633} {"train_loss": -12.835073471069336, "global_step": 442371, "epoch": 2633} {"train_loss": -12.62011432647705, "global_step": 442372, "epoch": 2633} {"train_loss": -12.671281814575195, "global_step": 442373, "epoch": 2633} {"train_loss": -12.769039154052734, "global_step": 442374, "epoch": 2633} {"train_loss": -12.729082107543945, "global_step": 442375, "epoch": 2633} {"train_loss": -12.640737533569336, "global_step": 442376, "epoch": 2633} {"train_loss": -12.701278686523438, "global_step": 442377, "epoch": 2633} {"train_loss": -12.902101516723633, "global_step": 442378, "epoch": 2633} {"train_loss": -12.402212142944336, "global_step": 442379, "epoch": 2633} {"train_loss": -12.649348258972168, "global_step": 442380, "epoch": 2633} {"train_loss": -12.42981243133545, "global_step": 442381, "epoch": 2633} {"train_loss": -12.219539642333984, "global_step": 442382, "epoch": 2633} {"train_loss": -12.592634201049805, "global_step": 442383, "epoch": 2633} {"train_loss": -12.620086669921875, "global_step": 442384, "epoch": 2633} {"train_loss": -11.881962776184082, "global_step": 442385, "epoch": 2633} {"train_loss": -12.437158584594727, "global_step": 442386, "epoch": 2633} {"train_loss": -12.267524719238281, "global_step": 442387, "epoch": 2633} {"train_loss": -12.511491775512695, "global_step": 442388, "epoch": 2633} {"train_loss": -12.4886474609375, "global_step": 442389, "epoch": 2633} {"train_loss": -12.853038787841797, "global_step": 442390, "epoch": 2633} {"train_loss": -12.725835800170898, "global_step": 442391, "epoch": 2633} {"train_loss": -12.403568267822266, "global_step": 442392, "epoch": 2633} {"train_loss": -12.739788055419922, "global_step": 442393, "epoch": 2633} {"train_loss": -12.552223205566406, "global_step": 442394, "epoch": 2633} {"train_loss": -12.4740629196167, "global_step": 442395, "epoch": 2633} {"train_loss": -12.207202911376953, "global_step": 442396, "epoch": 2633} {"train_loss": -12.09074878692627, "global_step": 442397, "epoch": 2633} {"train_loss": -12.465312957763672, "global_step": 442398, "epoch": 2633} {"train_loss": -12.185009002685547, "global_step": 442399, "epoch": 2633} {"train_loss": -12.048192977905273, "global_step": 442400, "epoch": 2633} {"train_loss": -12.359309196472168, "global_step": 442401, "epoch": 2633} {"train_loss": -12.072585105895996, "global_step": 442402, "epoch": 2633} {"train_loss": -12.316917419433594, "global_step": 442403, "epoch": 2633} {"train_loss": -12.571146011352539, "global_step": 442404, "epoch": 2633} {"train_loss": -12.036699295043945, "global_step": 442405, "epoch": 2633} {"train_loss": -11.428110122680664, "global_step": 442406, "epoch": 2633} {"train_loss": -12.0562744140625, "global_step": 442407, "epoch": 2633} {"train_loss": -12.31403636932373, "global_step": 442408, "epoch": 2633} {"train_loss": -10.652081489562988, "global_step": 442409, "epoch": 2633} {"train_loss": -9.81869888305664, "global_step": 442410, "epoch": 2633} {"train_loss": -10.795990943908691, "global_step": 442411, "epoch": 2633} {"train_loss": -11.458025932312012, "global_step": 442412, "epoch": 2633} {"train_loss": -10.257668495178223, "global_step": 442413, "epoch": 2633} {"train_loss": -10.890538215637207, "global_step": 442414, "epoch": 2633} {"train_loss": -11.36689281463623, "global_step": 442415, "epoch": 2633} {"train_loss": -10.92062759399414, "global_step": 442416, "epoch": 2633} {"train_loss": -9.704608917236328, "global_step": 442417, "epoch": 2633} {"train_loss": -11.885894775390625, "global_step": 442418, "epoch": 2633} {"train_loss": -11.580606460571289, "global_step": 442419, "epoch": 2633} {"train_loss": -10.202064514160156, "global_step": 442420, "epoch": 2633} {"train_loss": -10.483428001403809, "global_step": 442421, "epoch": 2633} {"train_loss": -10.67135238647461, "global_step": 442422, "epoch": 2633} {"train_loss": -11.398360252380371, "global_step": 442423, "epoch": 2633} {"train_loss": -11.347278594970703, "global_step": 442424, "epoch": 2633} {"train_loss": -11.544511795043945, "global_step": 442425, "epoch": 2633} {"train_loss": -11.866122245788574, "global_step": 442426, "epoch": 2633} {"train_loss": -10.638772010803223, "global_step": 442427, "epoch": 2633} {"train_loss": -12.607687950134277, "global_step": 442428, "epoch": 2633} {"train_loss": -11.523504257202148, "global_step": 442429, "epoch": 2633} {"train_loss": -12.344077110290527, "global_step": 442430, "epoch": 2633} {"train_loss": -11.503791809082031, "global_step": 442431, "epoch": 2633} {"train_loss": -12.085062026977539, "global_step": 442432, "epoch": 2633} {"train_loss": -11.467333793640137, "global_step": 442433, "epoch": 2633} {"train_loss": -11.675131797790527, "global_step": 442434, "epoch": 2633} {"train_loss": -11.214376449584961, "global_step": 442435, "epoch": 2633} {"train_loss": -12.011765480041504, "global_step": 442436, "epoch": 2633} {"train_loss": -9.986167907714844, "global_step": 442437, "epoch": 2633} {"train_loss": -11.541930198669434, "global_step": 442438, "epoch": 2633} {"train_loss": -11.076714515686035, "global_step": 442439, "epoch": 2633} {"train_loss": -11.806411743164062, "global_step": 442440, "epoch": 2633} {"train_loss": -11.701534271240234, "global_step": 442441, "epoch": 2633} {"train_loss": -11.398883819580078, "global_step": 442442, "epoch": 2633} {"train_loss": -12.441234588623047, "global_step": 442443, "epoch": 2633} {"train_loss": -11.556526184082031, "global_step": 442444, "epoch": 2633} {"train_loss": -12.246162414550781, "global_step": 442445, "epoch": 2633} {"train_loss": -11.903566360473633, "global_step": 442446, "epoch": 2633} {"train_loss": -12.090936660766602, "global_step": 442447, "epoch": 2633} {"train_loss": -11.820531845092773, "global_step": 442448, "epoch": 2633} {"train_loss": -12.296424865722656, "global_step": 442449, "epoch": 2633} {"train_loss": -12.035721778869629, "global_step": 442450, "epoch": 2633} {"train_loss": -12.390436172485352, "global_step": 442451, "epoch": 2633} {"train_loss": -12.118597030639648, "global_step": 442452, "epoch": 2633} {"train_loss": -12.391448974609375, "global_step": 442453, "epoch": 2633} {"train_loss": -12.38062858581543, "global_step": 442454, "epoch": 2633} {"train_loss": -11.94840145111084, "global_step": 442455, "epoch": 2633} {"train_loss": -12.192209243774414, "global_step": 442456, "epoch": 2633} {"train_loss": -11.867082595825195, "global_step": 442457, "epoch": 2633} {"train_loss": -11.414048194885254, "global_step": 442458, "epoch": 2633} {"train_loss": -12.057780265808105, "global_step": 442459, "epoch": 2633} {"train_loss": -10.990647315979004, "global_step": 442460, "epoch": 2633} {"train_loss": -11.505345344543457, "global_step": 442461, "epoch": 2633} {"train_loss": -10.745811462402344, "global_step": 442462, "epoch": 2633} {"train_loss": -11.08028793334961, "global_step": 442463, "epoch": 2633} {"train_loss": -11.69749927520752, "global_step": 442464, "epoch": 2633} {"train_loss": -10.903714179992676, "global_step": 442465, "epoch": 2633} {"train_loss": -12.23432445526123, "global_step": 442466, "epoch": 2633} {"train_loss": -10.748395919799805, "global_step": 442467, "epoch": 2633} {"train_loss": -12.296539306640625, "global_step": 442468, "epoch": 2633} {"train_loss": -11.180416107177734, "global_step": 442469, "epoch": 2633} {"train_loss": -12.082466125488281, "global_step": 442470, "epoch": 2633} {"train_loss": -11.660301208496094, "global_step": 442471, "epoch": 2633} {"train_loss": -12.031753540039062, "global_step": 442472, "epoch": 2633} {"train_loss": -12.000768661499023, "global_step": 442473, "epoch": 2633} {"train_loss": -12.043458938598633, "global_step": 442474, "epoch": 2633} {"train_loss": -12.152421951293945, "global_step": 442475, "epoch": 2633} {"train_loss": -11.959312438964844, "global_step": 442476, "epoch": 2633} {"train_loss": -12.040874481201172, "global_step": 442477, "epoch": 2633} {"train_loss": -12.327991485595703, "global_step": 442478, "epoch": 2633} {"train_loss": -11.822388648986816, "global_step": 442479, "epoch": 2633} {"train_loss": -12.325089454650879, "global_step": 442480, "epoch": 2633} {"train_loss": -11.906533241271973, "global_step": 442481, "epoch": 2633} {"train_loss": -12.370744705200195, "global_step": 442482, "epoch": 2633} {"train_loss": -11.861058235168457, "global_step": 442483, "epoch": 2633} {"train_loss": -12.451004028320312, "global_step": 442484, "epoch": 2633} {"train_loss": -12.145256996154785, "global_step": 442485, "epoch": 2633} {"train_loss": -12.538146018981934, "global_step": 442486, "epoch": 2633} {"train_loss": -12.490671157836914, "global_step": 442487, "epoch": 2633} {"train_loss": -12.465278625488281, "global_step": 442488, "epoch": 2633} {"train_loss": -12.209296226501465, "global_step": 442489, "epoch": 2633} {"train_loss": -12.215006828308105, "global_step": 442490, "epoch": 2633} {"train_loss": -12.362995147705078, "global_step": 442491, "epoch": 2633} {"train_loss": -12.327402114868164, "global_step": 442492, "epoch": 2633} {"train_loss": -12.065668106079102, "global_step": 442493, "epoch": 2633} {"train_loss": -12.18902587890625, "global_step": 442494, "epoch": 2633} {"train_loss": -12.294666290283203, "global_step": 442495, "epoch": 2633} {"train_loss": -12.110445022583008, "global_step": 442496, "epoch": 2633} {"train_loss": -12.378785133361816, "global_step": 442497, "epoch": 2633} {"train_loss": -12.225208282470703, "global_step": 442498, "epoch": 2633} {"train_loss": -11.806184768676758, "global_step": 442499, "epoch": 2633} {"train_loss": -12.361780166625977, "global_step": 442500, "epoch": 2633} {"train_loss": -12.118741035461426, "global_step": 442501, "epoch": 2633} {"train_loss": -12.387435913085938, "global_step": 442502, "epoch": 2633} {"train_loss": -12.122676849365234, "global_step": 442503, "epoch": 2633} {"train_loss": -12.545955657958984, "global_step": 442504, "epoch": 2633} {"train_loss": -12.179157257080078, "global_step": 442505, "epoch": 2633} {"train_loss": -12.355467796325684, "global_step": 442506, "epoch": 2633} {"train_loss": -12.267742156982422, "global_step": 442507, "epoch": 2633} {"train_loss": -12.501195907592773, "global_step": 442508, "epoch": 2633} {"train_loss": -12.329761505126953, "global_step": 442509, "epoch": 2633} {"train_loss": -12.258434295654297, "global_step": 442510, "epoch": 2633} {"train_loss": -12.066215674082438, "global_step": 442511, "epoch": 2633, "val_loss": 304444.34375} {"train_loss": -12.44393539428711, "global_step": 442512, "epoch": 2634} {"train_loss": -12.399441719055176, "global_step": 442513, "epoch": 2634} {"train_loss": -12.50184440612793, "global_step": 442514, "epoch": 2634} {"train_loss": -12.592229843139648, "global_step": 442515, "epoch": 2634} {"train_loss": -12.38425064086914, "global_step": 442516, "epoch": 2634} {"train_loss": -12.370233535766602, "global_step": 442517, "epoch": 2634} {"train_loss": -12.45126724243164, "global_step": 442518, "epoch": 2634} {"train_loss": -12.321939468383789, "global_step": 442519, "epoch": 2634} {"train_loss": -12.552453994750977, "global_step": 442520, "epoch": 2634} {"train_loss": -12.516029357910156, "global_step": 442521, "epoch": 2634} {"train_loss": -12.701857566833496, "global_step": 442522, "epoch": 2634} {"train_loss": -12.27782154083252, "global_step": 442523, "epoch": 2634} {"train_loss": -12.277911186218262, "global_step": 442524, "epoch": 2634} {"train_loss": -12.349287033081055, "global_step": 442525, "epoch": 2634} {"train_loss": -12.361777305603027, "global_step": 442526, "epoch": 2634} {"train_loss": -12.540776252746582, "global_step": 442527, "epoch": 2634} {"train_loss": -12.89860725402832, "global_step": 442528, "epoch": 2634} {"train_loss": -12.398927688598633, "global_step": 442529, "epoch": 2634} {"train_loss": -12.688313484191895, "global_step": 442530, "epoch": 2634} {"train_loss": -12.324335098266602, "global_step": 442531, "epoch": 2634} {"train_loss": -12.233294486999512, "global_step": 442532, "epoch": 2634} {"train_loss": -12.534004211425781, "global_step": 442533, "epoch": 2634} {"train_loss": -12.470054626464844, "global_step": 442534, "epoch": 2634} {"train_loss": -12.237934112548828, "global_step": 442535, "epoch": 2634} {"train_loss": -12.75234317779541, "global_step": 442536, "epoch": 2634} {"train_loss": -12.521965026855469, "global_step": 442537, "epoch": 2634} {"train_loss": -12.276144027709961, "global_step": 442538, "epoch": 2634} {"train_loss": -12.666130065917969, "global_step": 442539, "epoch": 2634} {"train_loss": -12.4766845703125, "global_step": 442540, "epoch": 2634} {"train_loss": -12.394969940185547, "global_step": 442541, "epoch": 2634} {"train_loss": -12.56938362121582, "global_step": 442542, "epoch": 2634} {"train_loss": -12.547164916992188, "global_step": 442543, "epoch": 2634} {"train_loss": -12.610729217529297, "global_step": 442544, "epoch": 2634} {"train_loss": -12.6863374710083, "global_step": 442545, "epoch": 2634} {"train_loss": -12.719027519226074, "global_step": 442546, "epoch": 2634} {"train_loss": -12.791067123413086, "global_step": 442547, "epoch": 2634} {"train_loss": -12.672983169555664, "global_step": 442548, "epoch": 2634} {"train_loss": -12.635982513427734, "global_step": 442549, "epoch": 2634} {"train_loss": -12.582218170166016, "global_step": 442550, "epoch": 2634} {"train_loss": -12.72615909576416, "global_step": 442551, "epoch": 2634} {"train_loss": -12.571996688842773, "global_step": 442552, "epoch": 2634} {"train_loss": -12.890218734741211, "global_step": 442553, "epoch": 2634} {"train_loss": -12.734781265258789, "global_step": 442554, "epoch": 2634} {"train_loss": -12.786420822143555, "global_step": 442555, "epoch": 2634} {"train_loss": -12.869626998901367, "global_step": 442556, "epoch": 2634} {"train_loss": -12.925039291381836, "global_step": 442557, "epoch": 2634} {"train_loss": -12.73861312866211, "global_step": 442558, "epoch": 2634} {"train_loss": -12.99135684967041, "global_step": 442559, "epoch": 2634} {"train_loss": -13.002213478088379, "global_step": 442560, "epoch": 2634} {"train_loss": -12.811552047729492, "global_step": 442561, "epoch": 2634} {"train_loss": -12.78227710723877, "global_step": 442562, "epoch": 2634} {"train_loss": -12.988348007202148, "global_step": 442563, "epoch": 2634} {"train_loss": -12.750534057617188, "global_step": 442564, "epoch": 2634} {"train_loss": -12.74069595336914, "global_step": 442565, "epoch": 2634} {"train_loss": -12.74345874786377, "global_step": 442566, "epoch": 2634} {"train_loss": -12.649299621582031, "global_step": 442567, "epoch": 2634} {"train_loss": -12.516687393188477, "global_step": 442568, "epoch": 2634} {"train_loss": -12.619025230407715, "global_step": 442569, "epoch": 2634} {"train_loss": -12.422273635864258, "global_step": 442570, "epoch": 2634} {"train_loss": -12.763413429260254, "global_step": 442571, "epoch": 2634} {"train_loss": -12.513753890991211, "global_step": 442572, "epoch": 2634} {"train_loss": -12.397710800170898, "global_step": 442573, "epoch": 2634} {"train_loss": -12.70551872253418, "global_step": 442574, "epoch": 2634} {"train_loss": -12.310905456542969, "global_step": 442575, "epoch": 2634} {"train_loss": -11.888282775878906, "global_step": 442576, "epoch": 2634} {"train_loss": -12.39017105102539, "global_step": 442577, "epoch": 2634} {"train_loss": -11.450274467468262, "global_step": 442578, "epoch": 2634} {"train_loss": -11.00459098815918, "global_step": 442579, "epoch": 2634} {"train_loss": -11.85112190246582, "global_step": 442580, "epoch": 2634} {"train_loss": -11.782995223999023, "global_step": 442581, "epoch": 2634} {"train_loss": -11.000590324401855, "global_step": 442582, "epoch": 2634} {"train_loss": -11.584938049316406, "global_step": 442583, "epoch": 2634} {"train_loss": -11.727745056152344, "global_step": 442584, "epoch": 2634} {"train_loss": -10.98065185546875, "global_step": 442585, "epoch": 2634} {"train_loss": -11.047721862792969, "global_step": 442586, "epoch": 2634} {"train_loss": -12.32221794128418, "global_step": 442587, "epoch": 2634} {"train_loss": -11.776203155517578, "global_step": 442588, "epoch": 2634} {"train_loss": -12.439956665039062, "global_step": 442589, "epoch": 2634} {"train_loss": -11.85745620727539, "global_step": 442590, "epoch": 2634} {"train_loss": -12.207958221435547, "global_step": 442591, "epoch": 2634} {"train_loss": -11.726497650146484, "global_step": 442592, "epoch": 2634} {"train_loss": -12.175702095031738, "global_step": 442593, "epoch": 2634} {"train_loss": -11.978291511535645, "global_step": 442594, "epoch": 2634} {"train_loss": -10.51244831085205, "global_step": 442595, "epoch": 2634} {"train_loss": -12.063475608825684, "global_step": 442596, "epoch": 2634} {"train_loss": -11.044387817382812, "global_step": 442597, "epoch": 2634} {"train_loss": -10.823015213012695, "global_step": 442598, "epoch": 2634} {"train_loss": -11.964930534362793, "global_step": 442599, "epoch": 2634} {"train_loss": -11.56981372833252, "global_step": 442600, "epoch": 2634} {"train_loss": -11.73111343383789, "global_step": 442601, "epoch": 2634} {"train_loss": -11.963814735412598, "global_step": 442602, "epoch": 2634} {"train_loss": -12.449690818786621, "global_step": 442603, "epoch": 2634} {"train_loss": -12.24712085723877, "global_step": 442604, "epoch": 2634} {"train_loss": -12.215629577636719, "global_step": 442605, "epoch": 2634} {"train_loss": -12.424395561218262, "global_step": 442606, "epoch": 2634} {"train_loss": -11.917572021484375, "global_step": 442607, "epoch": 2634} {"train_loss": -12.566463470458984, "global_step": 442608, "epoch": 2634} {"train_loss": -12.095222473144531, "global_step": 442609, "epoch": 2634} {"train_loss": -12.65017318725586, "global_step": 442610, "epoch": 2634} {"train_loss": -12.671842575073242, "global_step": 442611, "epoch": 2634} {"train_loss": -12.389408111572266, "global_step": 442612, "epoch": 2634} {"train_loss": -12.375563621520996, "global_step": 442613, "epoch": 2634} {"train_loss": -12.564491271972656, "global_step": 442614, "epoch": 2634} {"train_loss": -12.533451080322266, "global_step": 442615, "epoch": 2634} {"train_loss": -12.313220977783203, "global_step": 442616, "epoch": 2634} {"train_loss": -12.42399787902832, "global_step": 442617, "epoch": 2634} {"train_loss": -12.121479034423828, "global_step": 442618, "epoch": 2634} {"train_loss": -12.387619018554688, "global_step": 442619, "epoch": 2634} {"train_loss": -12.263803482055664, "global_step": 442620, "epoch": 2634} {"train_loss": -12.109358787536621, "global_step": 442621, "epoch": 2634} {"train_loss": -12.338048934936523, "global_step": 442622, "epoch": 2634} {"train_loss": -12.206766128540039, "global_step": 442623, "epoch": 2634} {"train_loss": -11.657127380371094, "global_step": 442624, "epoch": 2634} {"train_loss": -12.386641502380371, "global_step": 442625, "epoch": 2634} {"train_loss": -11.435422897338867, "global_step": 442626, "epoch": 2634} {"train_loss": -12.413644790649414, "global_step": 442627, "epoch": 2634} {"train_loss": -11.681879997253418, "global_step": 442628, "epoch": 2634} {"train_loss": -11.406755447387695, "global_step": 442629, "epoch": 2634} {"train_loss": -12.33796501159668, "global_step": 442630, "epoch": 2634} {"train_loss": -11.715949058532715, "global_step": 442631, "epoch": 2634} {"train_loss": -11.908295631408691, "global_step": 442632, "epoch": 2634} {"train_loss": -11.620405197143555, "global_step": 442633, "epoch": 2634} {"train_loss": -11.768489837646484, "global_step": 442634, "epoch": 2634} {"train_loss": -12.367515563964844, "global_step": 442635, "epoch": 2634} {"train_loss": -11.523569107055664, "global_step": 442636, "epoch": 2634} {"train_loss": -12.051511764526367, "global_step": 442637, "epoch": 2634} {"train_loss": -11.740548133850098, "global_step": 442638, "epoch": 2634} {"train_loss": -11.26038932800293, "global_step": 442639, "epoch": 2634} {"train_loss": -11.845458984375, "global_step": 442640, "epoch": 2634} {"train_loss": -11.744050025939941, "global_step": 442641, "epoch": 2634} {"train_loss": -11.684423446655273, "global_step": 442642, "epoch": 2634} {"train_loss": -10.451184272766113, "global_step": 442643, "epoch": 2634} {"train_loss": -10.902620315551758, "global_step": 442644, "epoch": 2634} {"train_loss": -11.192521095275879, "global_step": 442645, "epoch": 2634} {"train_loss": -10.832401275634766, "global_step": 442646, "epoch": 2634} {"train_loss": -10.638782501220703, "global_step": 442647, "epoch": 2634} {"train_loss": -12.23489761352539, "global_step": 442648, "epoch": 2634} {"train_loss": -9.866416931152344, "global_step": 442649, "epoch": 2634} {"train_loss": -11.941350936889648, "global_step": 442650, "epoch": 2634} {"train_loss": -11.789665222167969, "global_step": 442651, "epoch": 2634} {"train_loss": -11.383305549621582, "global_step": 442652, "epoch": 2634} {"train_loss": -11.807069778442383, "global_step": 442653, "epoch": 2634} {"train_loss": -11.917112350463867, "global_step": 442654, "epoch": 2634} {"train_loss": -11.432157516479492, "global_step": 442655, "epoch": 2634} {"train_loss": -12.549814224243164, "global_step": 442656, "epoch": 2634} {"train_loss": -11.271894454956055, "global_step": 442657, "epoch": 2634} {"train_loss": -12.154555320739746, "global_step": 442658, "epoch": 2634} {"train_loss": -11.755332946777344, "global_step": 442659, "epoch": 2634} {"train_loss": -11.784957885742188, "global_step": 442660, "epoch": 2634} {"train_loss": -12.358319282531738, "global_step": 442661, "epoch": 2634} {"train_loss": -11.624265670776367, "global_step": 442662, "epoch": 2634} {"train_loss": -12.530086517333984, "global_step": 442663, "epoch": 2634} {"train_loss": -12.065376281738281, "global_step": 442664, "epoch": 2634} {"train_loss": -12.598455429077148, "global_step": 442665, "epoch": 2634} {"train_loss": -12.281420707702637, "global_step": 442666, "epoch": 2634} {"train_loss": -12.311840057373047, "global_step": 442667, "epoch": 2634} {"train_loss": -12.161455154418945, "global_step": 442668, "epoch": 2634} {"train_loss": -12.199350357055664, "global_step": 442669, "epoch": 2634} {"train_loss": -11.987374305725098, "global_step": 442670, "epoch": 2634} {"train_loss": -12.624252319335938, "global_step": 442671, "epoch": 2634} {"train_loss": -12.046632766723633, "global_step": 442672, "epoch": 2634} {"train_loss": -12.121078491210938, "global_step": 442673, "epoch": 2634} {"train_loss": -12.557937622070312, "global_step": 442674, "epoch": 2634} {"train_loss": -12.29824447631836, "global_step": 442675, "epoch": 2634} {"train_loss": -12.68808650970459, "global_step": 442676, "epoch": 2634} {"train_loss": -12.341806411743164, "global_step": 442677, "epoch": 2634} {"train_loss": -12.541866302490234, "global_step": 442678, "epoch": 2634} {"train_loss": -12.166120784623283, "global_step": 442679, "epoch": 2634, "val_loss": 313080.6875} {"train_loss": -12.460084915161133, "global_step": 442680, "epoch": 2635} {"train_loss": -12.622696876525879, "global_step": 442681, "epoch": 2635} {"train_loss": -12.586660385131836, "global_step": 442682, "epoch": 2635} {"train_loss": -12.421567916870117, "global_step": 442683, "epoch": 2635} {"train_loss": -12.646936416625977, "global_step": 442684, "epoch": 2635} {"train_loss": -12.610420227050781, "global_step": 442685, "epoch": 2635} {"train_loss": -12.485157012939453, "global_step": 442686, "epoch": 2635} {"train_loss": -12.597925186157227, "global_step": 442687, "epoch": 2635} {"train_loss": -12.710271835327148, "global_step": 442688, "epoch": 2635} {"train_loss": -12.44534683227539, "global_step": 442689, "epoch": 2635} {"train_loss": -12.50171184539795, "global_step": 442690, "epoch": 2635} {"train_loss": -12.798507690429688, "global_step": 442691, "epoch": 2635} {"train_loss": -12.775633811950684, "global_step": 442692, "epoch": 2635} {"train_loss": -12.770532608032227, "global_step": 442693, "epoch": 2635} {"train_loss": -12.769765853881836, "global_step": 442694, "epoch": 2635} {"train_loss": -12.724385261535645, "global_step": 442695, "epoch": 2635} {"train_loss": -12.816028594970703, "global_step": 442696, "epoch": 2635} {"train_loss": -12.618086814880371, "global_step": 442697, "epoch": 2635} {"train_loss": -12.70085620880127, "global_step": 442698, "epoch": 2635} {"train_loss": -12.767282485961914, "global_step": 442699, "epoch": 2635} {"train_loss": -12.882713317871094, "global_step": 442700, "epoch": 2635} {"train_loss": -12.677779197692871, "global_step": 442701, "epoch": 2635} {"train_loss": -12.523519515991211, "global_step": 442702, "epoch": 2635} {"train_loss": -12.793740272521973, "global_step": 442703, "epoch": 2635} {"train_loss": -12.972007751464844, "global_step": 442704, "epoch": 2635} {"train_loss": -12.663747787475586, "global_step": 442705, "epoch": 2635} {"train_loss": -12.966775894165039, "global_step": 442706, "epoch": 2635} {"train_loss": -12.749391555786133, "global_step": 442707, "epoch": 2635} {"train_loss": -12.636455535888672, "global_step": 442708, "epoch": 2635} {"train_loss": -12.46445369720459, "global_step": 442709, "epoch": 2635} {"train_loss": -12.759065628051758, "global_step": 442710, "epoch": 2635} {"train_loss": -12.439628601074219, "global_step": 442711, "epoch": 2635} {"train_loss": -12.937092781066895, "global_step": 442712, "epoch": 2635} {"train_loss": -12.725683212280273, "global_step": 442713, "epoch": 2635} {"train_loss": -12.791168212890625, "global_step": 442714, "epoch": 2635} {"train_loss": -12.764608383178711, "global_step": 442715, "epoch": 2635} {"train_loss": -12.934024810791016, "global_step": 442716, "epoch": 2635} {"train_loss": -12.62605094909668, "global_step": 442717, "epoch": 2635} {"train_loss": -12.881244659423828, "global_step": 442718, "epoch": 2635} {"train_loss": -12.777456283569336, "global_step": 442719, "epoch": 2635} {"train_loss": -12.69778823852539, "global_step": 442720, "epoch": 2635} {"train_loss": -12.40169906616211, "global_step": 442721, "epoch": 2635} {"train_loss": -12.77854061126709, "global_step": 442722, "epoch": 2635} {"train_loss": -12.098052978515625, "global_step": 442723, "epoch": 2635} {"train_loss": -12.258697509765625, "global_step": 442724, "epoch": 2635} {"train_loss": -12.642548561096191, "global_step": 442725, "epoch": 2635} {"train_loss": -12.007942199707031, "global_step": 442726, "epoch": 2635} {"train_loss": -12.678190231323242, "global_step": 442727, "epoch": 2635} {"train_loss": -12.19749641418457, "global_step": 442728, "epoch": 2635} {"train_loss": -12.117398262023926, "global_step": 442729, "epoch": 2635} {"train_loss": -12.839956283569336, "global_step": 442730, "epoch": 2635} {"train_loss": -12.314666748046875, "global_step": 442731, "epoch": 2635} {"train_loss": -12.275896072387695, "global_step": 442732, "epoch": 2635} {"train_loss": -12.544422149658203, "global_step": 442733, "epoch": 2635} {"train_loss": -12.384653091430664, "global_step": 442734, "epoch": 2635} {"train_loss": -12.520206451416016, "global_step": 442735, "epoch": 2635} {"train_loss": -12.640586853027344, "global_step": 442736, "epoch": 2635} {"train_loss": -12.405900955200195, "global_step": 442737, "epoch": 2635} {"train_loss": -12.689898490905762, "global_step": 442738, "epoch": 2635} {"train_loss": -12.582462310791016, "global_step": 442739, "epoch": 2635} {"train_loss": -12.266777038574219, "global_step": 442740, "epoch": 2635} {"train_loss": -12.33821964263916, "global_step": 442741, "epoch": 2635} {"train_loss": -12.294181823730469, "global_step": 442742, "epoch": 2635} {"train_loss": -12.236224174499512, "global_step": 442743, "epoch": 2635} {"train_loss": -12.779390335083008, "global_step": 442744, "epoch": 2635} {"train_loss": -12.320510864257812, "global_step": 442745, "epoch": 2635} {"train_loss": -12.749917984008789, "global_step": 442746, "epoch": 2635} {"train_loss": -12.579063415527344, "global_step": 442747, "epoch": 2635} {"train_loss": -12.203655242919922, "global_step": 442748, "epoch": 2635} {"train_loss": -12.572249412536621, "global_step": 442749, "epoch": 2635} {"train_loss": -12.415056228637695, "global_step": 442750, "epoch": 2635} {"train_loss": -12.314065933227539, "global_step": 442751, "epoch": 2635} {"train_loss": -12.6845703125, "global_step": 442752, "epoch": 2635} {"train_loss": -12.834135055541992, "global_step": 442753, "epoch": 2635} {"train_loss": -12.695956230163574, "global_step": 442754, "epoch": 2635} {"train_loss": -12.65527057647705, "global_step": 442755, "epoch": 2635} {"train_loss": -12.206350326538086, "global_step": 442756, "epoch": 2635} {"train_loss": -12.487555503845215, "global_step": 442757, "epoch": 2635} {"train_loss": -12.894912719726562, "global_step": 442758, "epoch": 2635} {"train_loss": -12.491042137145996, "global_step": 442759, "epoch": 2635} {"train_loss": -12.254240036010742, "global_step": 442760, "epoch": 2635} {"train_loss": -12.708820343017578, "global_step": 442761, "epoch": 2635} {"train_loss": -12.615303039550781, "global_step": 442762, "epoch": 2635} {"train_loss": -12.338533401489258, "global_step": 442763, "epoch": 2635} {"train_loss": -12.287120819091797, "global_step": 442764, "epoch": 2635} {"train_loss": -12.747520446777344, "global_step": 442765, "epoch": 2635} {"train_loss": -12.430814743041992, "global_step": 442766, "epoch": 2635} {"train_loss": -12.296634674072266, "global_step": 442767, "epoch": 2635} {"train_loss": -11.21551513671875, "global_step": 442768, "epoch": 2635} {"train_loss": -12.215496063232422, "global_step": 442769, "epoch": 2635} {"train_loss": -12.630050659179688, "global_step": 442770, "epoch": 2635} {"train_loss": -12.40020751953125, "global_step": 442771, "epoch": 2635} {"train_loss": -12.2489013671875, "global_step": 442772, "epoch": 2635} {"train_loss": -12.0314302444458, "global_step": 442773, "epoch": 2635} {"train_loss": -11.138776779174805, "global_step": 442774, "epoch": 2635} {"train_loss": -11.458256721496582, "global_step": 442775, "epoch": 2635} {"train_loss": -10.935993194580078, "global_step": 442776, "epoch": 2635} {"train_loss": -9.160623550415039, "global_step": 442777, "epoch": 2635} {"train_loss": -9.06287956237793, "global_step": 442778, "epoch": 2635} {"train_loss": -9.950868606567383, "global_step": 442779, "epoch": 2635} {"train_loss": -9.806431770324707, "global_step": 442780, "epoch": 2635} {"train_loss": -10.721267700195312, "global_step": 442781, "epoch": 2635} {"train_loss": -9.680733680725098, "global_step": 442782, "epoch": 2635} {"train_loss": -11.086362838745117, "global_step": 442783, "epoch": 2635} {"train_loss": -10.252593994140625, "global_step": 442784, "epoch": 2635} {"train_loss": -9.710601806640625, "global_step": 442785, "epoch": 2635} {"train_loss": -10.476344108581543, "global_step": 442786, "epoch": 2635} {"train_loss": -10.996294021606445, "global_step": 442787, "epoch": 2635} {"train_loss": -10.4381685256958, "global_step": 442788, "epoch": 2635} {"train_loss": -11.09266185760498, "global_step": 442789, "epoch": 2635} {"train_loss": -11.030458450317383, "global_step": 442790, "epoch": 2635} {"train_loss": -11.470166206359863, "global_step": 442791, "epoch": 2635} {"train_loss": -11.260719299316406, "global_step": 442792, "epoch": 2635} {"train_loss": -11.118338584899902, "global_step": 442793, "epoch": 2635} {"train_loss": -11.246550559997559, "global_step": 442794, "epoch": 2635} {"train_loss": -11.133190155029297, "global_step": 442795, "epoch": 2635} {"train_loss": -10.23613166809082, "global_step": 442796, "epoch": 2635} {"train_loss": -11.110490798950195, "global_step": 442797, "epoch": 2635} {"train_loss": -11.257606506347656, "global_step": 442798, "epoch": 2635} {"train_loss": -11.379597663879395, "global_step": 442799, "epoch": 2635} {"train_loss": -11.409765243530273, "global_step": 442800, "epoch": 2635} {"train_loss": -11.613014221191406, "global_step": 442801, "epoch": 2635} {"train_loss": -11.514711380004883, "global_step": 442802, "epoch": 2635} {"train_loss": -11.485738754272461, "global_step": 442803, "epoch": 2635} {"train_loss": -10.822093963623047, "global_step": 442804, "epoch": 2635} {"train_loss": -10.136802673339844, "global_step": 442805, "epoch": 2635} {"train_loss": -10.818700790405273, "global_step": 442806, "epoch": 2635} {"train_loss": -10.629537582397461, "global_step": 442807, "epoch": 2635} {"train_loss": -10.993430137634277, "global_step": 442808, "epoch": 2635} {"train_loss": -11.008413314819336, "global_step": 442809, "epoch": 2635} {"train_loss": -10.801108360290527, "global_step": 442810, "epoch": 2635} {"train_loss": -11.456249237060547, "global_step": 442811, "epoch": 2635} {"train_loss": -10.870332717895508, "global_step": 442812, "epoch": 2635} {"train_loss": -10.648189544677734, "global_step": 442813, "epoch": 2635} {"train_loss": -11.594139099121094, "global_step": 442814, "epoch": 2635} {"train_loss": -11.170028686523438, "global_step": 442815, "epoch": 2635} {"train_loss": -11.794610023498535, "global_step": 442816, "epoch": 2635} {"train_loss": -11.717540740966797, "global_step": 442817, "epoch": 2635} {"train_loss": -11.1615571975708, "global_step": 442818, "epoch": 2635} {"train_loss": -10.986446380615234, "global_step": 442819, "epoch": 2635} {"train_loss": -11.619423866271973, "global_step": 442820, "epoch": 2635} {"train_loss": -11.89714241027832, "global_step": 442821, "epoch": 2635} {"train_loss": -11.954374313354492, "global_step": 442822, "epoch": 2635} {"train_loss": -11.12915325164795, "global_step": 442823, "epoch": 2635} {"train_loss": -11.970869064331055, "global_step": 442824, "epoch": 2635} {"train_loss": -11.802946090698242, "global_step": 442825, "epoch": 2635} {"train_loss": -12.214679718017578, "global_step": 442826, "epoch": 2635} {"train_loss": -12.139589309692383, "global_step": 442827, "epoch": 2635} {"train_loss": -11.856063842773438, "global_step": 442828, "epoch": 2635} {"train_loss": -12.265617370605469, "global_step": 442829, "epoch": 2635} {"train_loss": -12.102458000183105, "global_step": 442830, "epoch": 2635} {"train_loss": -12.192209243774414, "global_step": 442831, "epoch": 2635} {"train_loss": -11.946087837219238, "global_step": 442832, "epoch": 2635} {"train_loss": -12.160114288330078, "global_step": 442833, "epoch": 2635} {"train_loss": -12.112203598022461, "global_step": 442834, "epoch": 2635} {"train_loss": -12.117046356201172, "global_step": 442835, "epoch": 2635} {"train_loss": -12.027042388916016, "global_step": 442836, "epoch": 2635} {"train_loss": -12.299346923828125, "global_step": 442837, "epoch": 2635} {"train_loss": -12.081143379211426, "global_step": 442838, "epoch": 2635} {"train_loss": -12.065095901489258, "global_step": 442839, "epoch": 2635} {"train_loss": -12.32621955871582, "global_step": 442840, "epoch": 2635} {"train_loss": -12.253198623657227, "global_step": 442841, "epoch": 2635} {"train_loss": -12.26537799835205, "global_step": 442842, "epoch": 2635} {"train_loss": -12.285651206970215, "global_step": 442843, "epoch": 2635} {"train_loss": -12.460365295410156, "global_step": 442844, "epoch": 2635} {"train_loss": -12.393745422363281, "global_step": 442845, "epoch": 2635} {"train_loss": -12.360392570495605, "global_step": 442846, "epoch": 2635} {"train_loss": -12.009998639424643, "global_step": 442847, "epoch": 2635, "val_loss": 304988.90625, "train_action_mse_error": 0.9860081076622009} {"train_loss": -12.34730339050293, "global_step": 442848, "epoch": 2636} {"train_loss": -12.315048217773438, "global_step": 442849, "epoch": 2636} {"train_loss": -12.33804702758789, "global_step": 442850, "epoch": 2636} {"train_loss": -12.317464828491211, "global_step": 442851, "epoch": 2636} {"train_loss": -12.519259452819824, "global_step": 442852, "epoch": 2636} {"train_loss": -12.498966217041016, "global_step": 442853, "epoch": 2636} {"train_loss": -12.51486587524414, "global_step": 442854, "epoch": 2636} {"train_loss": -12.462150573730469, "global_step": 442855, "epoch": 2636} {"train_loss": -12.428672790527344, "global_step": 442856, "epoch": 2636} {"train_loss": -12.595519065856934, "global_step": 442857, "epoch": 2636} {"train_loss": -12.409244537353516, "global_step": 442858, "epoch": 2636} {"train_loss": -12.69148063659668, "global_step": 442859, "epoch": 2636} {"train_loss": -12.350606918334961, "global_step": 442860, "epoch": 2636} {"train_loss": -12.559572219848633, "global_step": 442861, "epoch": 2636} {"train_loss": -12.509251594543457, "global_step": 442862, "epoch": 2636} {"train_loss": -12.623836517333984, "global_step": 442863, "epoch": 2636} {"train_loss": -12.52401065826416, "global_step": 442864, "epoch": 2636} {"train_loss": -12.552638053894043, "global_step": 442865, "epoch": 2636} {"train_loss": -12.632120132446289, "global_step": 442866, "epoch": 2636} {"train_loss": -12.733383178710938, "global_step": 442867, "epoch": 2636} {"train_loss": -12.870872497558594, "global_step": 442868, "epoch": 2636} {"train_loss": -12.654370307922363, "global_step": 442869, "epoch": 2636} {"train_loss": -12.781774520874023, "global_step": 442870, "epoch": 2636} {"train_loss": -12.730499267578125, "global_step": 442871, "epoch": 2636} {"train_loss": -12.821772575378418, "global_step": 442872, "epoch": 2636} {"train_loss": -12.655706405639648, "global_step": 442873, "epoch": 2636} {"train_loss": -12.656543731689453, "global_step": 442874, "epoch": 2636} {"train_loss": -12.66649055480957, "global_step": 442875, "epoch": 2636} {"train_loss": -12.789085388183594, "global_step": 442876, "epoch": 2636} {"train_loss": -12.864751815795898, "global_step": 442877, "epoch": 2636} {"train_loss": -12.690980911254883, "global_step": 442878, "epoch": 2636} {"train_loss": -12.885431289672852, "global_step": 442879, "epoch": 2636} {"train_loss": -12.823915481567383, "global_step": 442880, "epoch": 2636} {"train_loss": -12.700201034545898, "global_step": 442881, "epoch": 2636} {"train_loss": -12.700981140136719, "global_step": 442882, "epoch": 2636} {"train_loss": -12.945463180541992, "global_step": 442883, "epoch": 2636} {"train_loss": -12.84030532836914, "global_step": 442884, "epoch": 2636} {"train_loss": -12.991562843322754, "global_step": 442885, "epoch": 2636} {"train_loss": -12.818778038024902, "global_step": 442886, "epoch": 2636} {"train_loss": -12.960237503051758, "global_step": 442887, "epoch": 2636} {"train_loss": -12.925350189208984, "global_step": 442888, "epoch": 2636} {"train_loss": -12.891231536865234, "global_step": 442889, "epoch": 2636} {"train_loss": -12.572364807128906, "global_step": 442890, "epoch": 2636} {"train_loss": -12.813100814819336, "global_step": 442891, "epoch": 2636} {"train_loss": -12.872419357299805, "global_step": 442892, "epoch": 2636} {"train_loss": -12.37394905090332, "global_step": 442893, "epoch": 2636} {"train_loss": -12.829766273498535, "global_step": 442894, "epoch": 2636} {"train_loss": -12.827993392944336, "global_step": 442895, "epoch": 2636} {"train_loss": -12.726707458496094, "global_step": 442896, "epoch": 2636} {"train_loss": -12.926443099975586, "global_step": 442897, "epoch": 2636} {"train_loss": -12.65064525604248, "global_step": 442898, "epoch": 2636} {"train_loss": -12.644462585449219, "global_step": 442899, "epoch": 2636} {"train_loss": -12.877822875976562, "global_step": 442900, "epoch": 2636} {"train_loss": -12.46522331237793, "global_step": 442901, "epoch": 2636} {"train_loss": -12.559930801391602, "global_step": 442902, "epoch": 2636} {"train_loss": -12.596056938171387, "global_step": 442903, "epoch": 2636} {"train_loss": -12.65693187713623, "global_step": 442904, "epoch": 2636} {"train_loss": -12.974761009216309, "global_step": 442905, "epoch": 2636} {"train_loss": -12.631816864013672, "global_step": 442906, "epoch": 2636} {"train_loss": -12.8468017578125, "global_step": 442907, "epoch": 2636} {"train_loss": -12.791715621948242, "global_step": 442908, "epoch": 2636} {"train_loss": -12.697484970092773, "global_step": 442909, "epoch": 2636} {"train_loss": -12.766263961791992, "global_step": 442910, "epoch": 2636} {"train_loss": -12.822090148925781, "global_step": 442911, "epoch": 2636} {"train_loss": -12.509820938110352, "global_step": 442912, "epoch": 2636} {"train_loss": -12.287177085876465, "global_step": 442913, "epoch": 2636} {"train_loss": -12.503864288330078, "global_step": 442914, "epoch": 2636} {"train_loss": -11.93635368347168, "global_step": 442915, "epoch": 2636} {"train_loss": -11.448867797851562, "global_step": 442916, "epoch": 2636} {"train_loss": -10.082231521606445, "global_step": 442917, "epoch": 2636} {"train_loss": -12.50754165649414, "global_step": 442918, "epoch": 2636} {"train_loss": -10.882150650024414, "global_step": 442919, "epoch": 2636} {"train_loss": -12.186092376708984, "global_step": 442920, "epoch": 2636} {"train_loss": -11.935027122497559, "global_step": 442921, "epoch": 2636} {"train_loss": -12.138124465942383, "global_step": 442922, "epoch": 2636} {"train_loss": -11.162256240844727, "global_step": 442923, "epoch": 2636} {"train_loss": -11.474853515625, "global_step": 442924, "epoch": 2636} {"train_loss": -11.60120964050293, "global_step": 442925, "epoch": 2636} {"train_loss": -12.174269676208496, "global_step": 442926, "epoch": 2636} {"train_loss": -11.341264724731445, "global_step": 442927, "epoch": 2636} {"train_loss": -11.758974075317383, "global_step": 442928, "epoch": 2636} {"train_loss": -11.005277633666992, "global_step": 442929, "epoch": 2636} {"train_loss": -11.166011810302734, "global_step": 442930, "epoch": 2636} {"train_loss": -11.379302978515625, "global_step": 442931, "epoch": 2636} {"train_loss": -9.258602142333984, "global_step": 442932, "epoch": 2636} {"train_loss": -11.24947452545166, "global_step": 442933, "epoch": 2636} {"train_loss": -12.10658073425293, "global_step": 442934, "epoch": 2636} {"train_loss": -10.558233261108398, "global_step": 442935, "epoch": 2636} {"train_loss": -11.05154037475586, "global_step": 442936, "epoch": 2636} {"train_loss": -10.728819847106934, "global_step": 442937, "epoch": 2636} {"train_loss": -11.038141250610352, "global_step": 442938, "epoch": 2636} {"train_loss": -10.893570899963379, "global_step": 442939, "epoch": 2636} {"train_loss": -10.124258041381836, "global_step": 442940, "epoch": 2636} {"train_loss": -10.348428726196289, "global_step": 442941, "epoch": 2636} {"train_loss": -10.266105651855469, "global_step": 442942, "epoch": 2636} {"train_loss": -9.16421890258789, "global_step": 442943, "epoch": 2636} {"train_loss": -10.771035194396973, "global_step": 442944, "epoch": 2636} {"train_loss": -10.58387565612793, "global_step": 442945, "epoch": 2636} {"train_loss": -9.456111907958984, "global_step": 442946, "epoch": 2636} {"train_loss": -10.73715877532959, "global_step": 442947, "epoch": 2636} {"train_loss": -10.322077751159668, "global_step": 442948, "epoch": 2636} {"train_loss": -9.256685256958008, "global_step": 442949, "epoch": 2636} {"train_loss": -10.22237491607666, "global_step": 442950, "epoch": 2636} {"train_loss": -10.363336563110352, "global_step": 442951, "epoch": 2636} {"train_loss": -10.983636856079102, "global_step": 442952, "epoch": 2636} {"train_loss": -10.101515769958496, "global_step": 442953, "epoch": 2636} {"train_loss": -9.856287002563477, "global_step": 442954, "epoch": 2636} {"train_loss": -11.037878036499023, "global_step": 442955, "epoch": 2636} {"train_loss": -9.908187866210938, "global_step": 442956, "epoch": 2636} {"train_loss": -9.049932479858398, "global_step": 442957, "epoch": 2636} {"train_loss": -10.972552299499512, "global_step": 442958, "epoch": 2636} {"train_loss": -10.389350891113281, "global_step": 442959, "epoch": 2636} {"train_loss": -9.42515754699707, "global_step": 442960, "epoch": 2636} {"train_loss": -11.65527629852295, "global_step": 442961, "epoch": 2636} {"train_loss": -10.839414596557617, "global_step": 442962, "epoch": 2636} {"train_loss": -9.70571517944336, "global_step": 442963, "epoch": 2636} {"train_loss": -11.190759658813477, "global_step": 442964, "epoch": 2636} {"train_loss": -11.061310768127441, "global_step": 442965, "epoch": 2636} {"train_loss": -9.917070388793945, "global_step": 442966, "epoch": 2636} {"train_loss": -11.22624397277832, "global_step": 442967, "epoch": 2636} {"train_loss": -11.70602035522461, "global_step": 442968, "epoch": 2636} {"train_loss": -11.510297775268555, "global_step": 442969, "epoch": 2636} {"train_loss": -11.318511962890625, "global_step": 442970, "epoch": 2636} {"train_loss": -11.839790344238281, "global_step": 442971, "epoch": 2636} {"train_loss": -11.428586959838867, "global_step": 442972, "epoch": 2636} {"train_loss": -11.734071731567383, "global_step": 442973, "epoch": 2636} {"train_loss": -11.81583023071289, "global_step": 442974, "epoch": 2636} {"train_loss": -11.256473541259766, "global_step": 442975, "epoch": 2636} {"train_loss": -11.734676361083984, "global_step": 442976, "epoch": 2636} {"train_loss": -11.41676139831543, "global_step": 442977, "epoch": 2636} {"train_loss": -11.454293251037598, "global_step": 442978, "epoch": 2636} {"train_loss": -11.731029510498047, "global_step": 442979, "epoch": 2636} {"train_loss": -11.88432502746582, "global_step": 442980, "epoch": 2636} {"train_loss": -11.92399787902832, "global_step": 442981, "epoch": 2636} {"train_loss": -11.968307495117188, "global_step": 442982, "epoch": 2636} {"train_loss": -12.170877456665039, "global_step": 442983, "epoch": 2636} {"train_loss": -11.925344467163086, "global_step": 442984, "epoch": 2636} {"train_loss": -11.861223220825195, "global_step": 442985, "epoch": 2636} {"train_loss": -12.076760292053223, "global_step": 442986, "epoch": 2636} {"train_loss": -11.933452606201172, "global_step": 442987, "epoch": 2636} {"train_loss": -12.040592193603516, "global_step": 442988, "epoch": 2636} {"train_loss": -12.113922119140625, "global_step": 442989, "epoch": 2636} {"train_loss": -12.160490036010742, "global_step": 442990, "epoch": 2636} {"train_loss": -12.316776275634766, "global_step": 442991, "epoch": 2636} {"train_loss": -12.198122024536133, "global_step": 442992, "epoch": 2636} {"train_loss": -12.144824028015137, "global_step": 442993, "epoch": 2636} {"train_loss": -12.287769317626953, "global_step": 442994, "epoch": 2636} {"train_loss": -12.205135345458984, "global_step": 442995, "epoch": 2636} {"train_loss": -12.191396713256836, "global_step": 442996, "epoch": 2636} {"train_loss": -12.083641052246094, "global_step": 442997, "epoch": 2636} {"train_loss": -12.215690612792969, "global_step": 442998, "epoch": 2636} {"train_loss": -11.911336898803711, "global_step": 442999, "epoch": 2636} {"train_loss": -12.45583724975586, "global_step": 443000, "epoch": 2636} {"train_loss": -12.077661514282227, "global_step": 443001, "epoch": 2636} {"train_loss": -12.218109130859375, "global_step": 443002, "epoch": 2636} {"train_loss": -12.243406295776367, "global_step": 443003, "epoch": 2636} {"train_loss": -12.118972778320312, "global_step": 443004, "epoch": 2636} {"train_loss": -12.313146591186523, "global_step": 443005, "epoch": 2636} {"train_loss": -12.083919525146484, "global_step": 443006, "epoch": 2636} {"train_loss": -12.298881530761719, "global_step": 443007, "epoch": 2636} {"train_loss": -12.468289375305176, "global_step": 443008, "epoch": 2636} {"train_loss": -12.378966331481934, "global_step": 443009, "epoch": 2636} {"train_loss": -12.514861106872559, "global_step": 443010, "epoch": 2636} {"train_loss": -12.276102066040039, "global_step": 443011, "epoch": 2636} {"train_loss": -12.485040664672852, "global_step": 443012, "epoch": 2636} {"train_loss": -12.436511993408203, "global_step": 443013, "epoch": 2636} {"train_loss": -12.555547714233398, "global_step": 443014, "epoch": 2636} {"train_loss": -11.898049252373832, "global_step": 443015, "epoch": 2636, "val_loss": 308352.25} {"train_loss": -12.580388069152832, "global_step": 443016, "epoch": 2637} {"train_loss": -12.25906753540039, "global_step": 443017, "epoch": 2637} {"train_loss": -12.449832916259766, "global_step": 443018, "epoch": 2637} {"train_loss": -12.680686950683594, "global_step": 443019, "epoch": 2637} {"train_loss": -12.45865249633789, "global_step": 443020, "epoch": 2637} {"train_loss": -12.521869659423828, "global_step": 443021, "epoch": 2637} {"train_loss": -12.708391189575195, "global_step": 443022, "epoch": 2637} {"train_loss": -12.645465850830078, "global_step": 443023, "epoch": 2637} {"train_loss": -12.742435455322266, "global_step": 443024, "epoch": 2637} {"train_loss": -12.78281021118164, "global_step": 443025, "epoch": 2637} {"train_loss": -12.523412704467773, "global_step": 443026, "epoch": 2637} {"train_loss": -12.63521671295166, "global_step": 443027, "epoch": 2637} {"train_loss": -12.640701293945312, "global_step": 443028, "epoch": 2637} {"train_loss": -12.867400169372559, "global_step": 443029, "epoch": 2637} {"train_loss": -12.648377418518066, "global_step": 443030, "epoch": 2637} {"train_loss": -12.639636993408203, "global_step": 443031, "epoch": 2637} {"train_loss": -12.826922416687012, "global_step": 443032, "epoch": 2637} {"train_loss": -12.731954574584961, "global_step": 443033, "epoch": 2637} {"train_loss": -12.77572250366211, "global_step": 443034, "epoch": 2637} {"train_loss": -12.959705352783203, "global_step": 443035, "epoch": 2637} {"train_loss": -12.866912841796875, "global_step": 443036, "epoch": 2637} {"train_loss": -12.763921737670898, "global_step": 443037, "epoch": 2637} {"train_loss": -12.773128509521484, "global_step": 443038, "epoch": 2637} {"train_loss": -12.897415161132812, "global_step": 443039, "epoch": 2637} {"train_loss": -12.731486320495605, "global_step": 443040, "epoch": 2637} {"train_loss": -12.930527687072754, "global_step": 443041, "epoch": 2637} {"train_loss": -12.68094253540039, "global_step": 443042, "epoch": 2637} {"train_loss": -12.728099822998047, "global_step": 443043, "epoch": 2637} {"train_loss": -12.76767349243164, "global_step": 443044, "epoch": 2637} {"train_loss": -12.8246431350708, "global_step": 443045, "epoch": 2637} {"train_loss": -12.83046817779541, "global_step": 443046, "epoch": 2637} {"train_loss": -12.874076843261719, "global_step": 443047, "epoch": 2637} {"train_loss": -12.805180549621582, "global_step": 443048, "epoch": 2637} {"train_loss": -12.813959121704102, "global_step": 443049, "epoch": 2637} {"train_loss": -12.793828010559082, "global_step": 443050, "epoch": 2637} {"train_loss": -12.818324089050293, "global_step": 443051, "epoch": 2637} {"train_loss": -13.068029403686523, "global_step": 443052, "epoch": 2637} {"train_loss": -12.912210464477539, "global_step": 443053, "epoch": 2637} {"train_loss": -12.88286018371582, "global_step": 443054, "epoch": 2637} {"train_loss": -12.88679027557373, "global_step": 443055, "epoch": 2637} {"train_loss": -12.792915344238281, "global_step": 443056, "epoch": 2637} {"train_loss": -12.784042358398438, "global_step": 443057, "epoch": 2637} {"train_loss": -12.853816032409668, "global_step": 443058, "epoch": 2637} {"train_loss": -12.978738784790039, "global_step": 443059, "epoch": 2637} {"train_loss": -12.812625885009766, "global_step": 443060, "epoch": 2637} {"train_loss": -12.89674186706543, "global_step": 443061, "epoch": 2637} {"train_loss": -12.661779403686523, "global_step": 443062, "epoch": 2637} {"train_loss": -12.993906021118164, "global_step": 443063, "epoch": 2637} {"train_loss": -12.987421035766602, "global_step": 443064, "epoch": 2637} {"train_loss": -12.987959861755371, "global_step": 443065, "epoch": 2637} {"train_loss": -12.87668514251709, "global_step": 443066, "epoch": 2637} {"train_loss": -12.737449645996094, "global_step": 443067, "epoch": 2637} {"train_loss": -12.88882064819336, "global_step": 443068, "epoch": 2637} {"train_loss": -12.906818389892578, "global_step": 443069, "epoch": 2637} {"train_loss": -13.11522102355957, "global_step": 443070, "epoch": 2637} {"train_loss": -12.907785415649414, "global_step": 443071, "epoch": 2637} {"train_loss": -12.809983253479004, "global_step": 443072, "epoch": 2637} {"train_loss": -12.718070983886719, "global_step": 443073, "epoch": 2637} {"train_loss": -12.946517944335938, "global_step": 443074, "epoch": 2637} {"train_loss": -12.986675262451172, "global_step": 443075, "epoch": 2637} {"train_loss": -12.786632537841797, "global_step": 443076, "epoch": 2637} {"train_loss": -13.002507209777832, "global_step": 443077, "epoch": 2637} {"train_loss": -13.116918563842773, "global_step": 443078, "epoch": 2637} {"train_loss": -12.85258674621582, "global_step": 443079, "epoch": 2637} {"train_loss": -12.454937934875488, "global_step": 443080, "epoch": 2637} {"train_loss": -12.451622009277344, "global_step": 443081, "epoch": 2637} {"train_loss": -12.731663703918457, "global_step": 443082, "epoch": 2637} {"train_loss": -12.711849212646484, "global_step": 443083, "epoch": 2637} {"train_loss": -12.01591682434082, "global_step": 443084, "epoch": 2637} {"train_loss": -11.821891784667969, "global_step": 443085, "epoch": 2637} {"train_loss": -12.539667129516602, "global_step": 443086, "epoch": 2637} {"train_loss": -12.77412223815918, "global_step": 443087, "epoch": 2637} {"train_loss": -11.161860466003418, "global_step": 443088, "epoch": 2637} {"train_loss": -10.343864440917969, "global_step": 443089, "epoch": 2637} {"train_loss": -12.289849281311035, "global_step": 443090, "epoch": 2637} {"train_loss": -12.166357040405273, "global_step": 443091, "epoch": 2637} {"train_loss": -10.015766143798828, "global_step": 443092, "epoch": 2637} {"train_loss": -10.17840576171875, "global_step": 443093, "epoch": 2637} {"train_loss": -11.117509841918945, "global_step": 443094, "epoch": 2637} {"train_loss": -11.72679328918457, "global_step": 443095, "epoch": 2637} {"train_loss": -11.536365509033203, "global_step": 443096, "epoch": 2637} {"train_loss": -10.443995475769043, "global_step": 443097, "epoch": 2637} {"train_loss": -12.14732551574707, "global_step": 443098, "epoch": 2637} {"train_loss": -10.014215469360352, "global_step": 443099, "epoch": 2637} {"train_loss": -11.134605407714844, "global_step": 443100, "epoch": 2637} {"train_loss": -9.069371223449707, "global_step": 443101, "epoch": 2637} {"train_loss": -8.585944175720215, "global_step": 443102, "epoch": 2637} {"train_loss": -8.367908477783203, "global_step": 443103, "epoch": 2637} {"train_loss": -7.870267391204834, "global_step": 443104, "epoch": 2637} {"train_loss": -8.437141418457031, "global_step": 443105, "epoch": 2637} {"train_loss": -9.45650863647461, "global_step": 443106, "epoch": 2637} {"train_loss": -10.50009536743164, "global_step": 443107, "epoch": 2637} {"train_loss": -8.88525390625, "global_step": 443108, "epoch": 2637} {"train_loss": -9.328218460083008, "global_step": 443109, "epoch": 2637} {"train_loss": -9.070579528808594, "global_step": 443110, "epoch": 2637} {"train_loss": -9.736774444580078, "global_step": 443111, "epoch": 2637} {"train_loss": -9.406172752380371, "global_step": 443112, "epoch": 2637} {"train_loss": -10.574047088623047, "global_step": 443113, "epoch": 2637} {"train_loss": -10.86133861541748, "global_step": 443114, "epoch": 2637} {"train_loss": -9.165887832641602, "global_step": 443115, "epoch": 2637} {"train_loss": -11.374317169189453, "global_step": 443116, "epoch": 2637} {"train_loss": -9.332792282104492, "global_step": 443117, "epoch": 2637} {"train_loss": -10.832086563110352, "global_step": 443118, "epoch": 2637} {"train_loss": -10.573467254638672, "global_step": 443119, "epoch": 2637} {"train_loss": -10.516707420349121, "global_step": 443120, "epoch": 2637} {"train_loss": -10.128623962402344, "global_step": 443121, "epoch": 2637} {"train_loss": -11.519140243530273, "global_step": 443122, "epoch": 2637} {"train_loss": -10.471620559692383, "global_step": 443123, "epoch": 2637} {"train_loss": -11.608991622924805, "global_step": 443124, "epoch": 2637} {"train_loss": -11.24063491821289, "global_step": 443125, "epoch": 2637} {"train_loss": -11.683775901794434, "global_step": 443126, "epoch": 2637} {"train_loss": -11.53431224822998, "global_step": 443127, "epoch": 2637} {"train_loss": -12.162337303161621, "global_step": 443128, "epoch": 2637} {"train_loss": -11.804340362548828, "global_step": 443129, "epoch": 2637} {"train_loss": -12.074434280395508, "global_step": 443130, "epoch": 2637} {"train_loss": -11.67680549621582, "global_step": 443131, "epoch": 2637} {"train_loss": -12.017671585083008, "global_step": 443132, "epoch": 2637} {"train_loss": -11.961418151855469, "global_step": 443133, "epoch": 2637} {"train_loss": -11.944631576538086, "global_step": 443134, "epoch": 2637} {"train_loss": -12.28419303894043, "global_step": 443135, "epoch": 2637} {"train_loss": -11.880692481994629, "global_step": 443136, "epoch": 2637} {"train_loss": -11.819008827209473, "global_step": 443137, "epoch": 2637} {"train_loss": -12.183408737182617, "global_step": 443138, "epoch": 2637} {"train_loss": -11.680776596069336, "global_step": 443139, "epoch": 2637} {"train_loss": -12.533622741699219, "global_step": 443140, "epoch": 2637} {"train_loss": -11.557037353515625, "global_step": 443141, "epoch": 2637} {"train_loss": -12.301990509033203, "global_step": 443142, "epoch": 2637} {"train_loss": -12.071479797363281, "global_step": 443143, "epoch": 2637} {"train_loss": -11.983161926269531, "global_step": 443144, "epoch": 2637} {"train_loss": -12.497029304504395, "global_step": 443145, "epoch": 2637} {"train_loss": -12.197463989257812, "global_step": 443146, "epoch": 2637} {"train_loss": -12.113225936889648, "global_step": 443147, "epoch": 2637} {"train_loss": -12.349431037902832, "global_step": 443148, "epoch": 2637} {"train_loss": -12.252096176147461, "global_step": 443149, "epoch": 2637} {"train_loss": -12.23710823059082, "global_step": 443150, "epoch": 2637} {"train_loss": -12.364307403564453, "global_step": 443151, "epoch": 2637} {"train_loss": -12.357879638671875, "global_step": 443152, "epoch": 2637} {"train_loss": -12.179391860961914, "global_step": 443153, "epoch": 2637} {"train_loss": -12.17728328704834, "global_step": 443154, "epoch": 2637} {"train_loss": -12.008049011230469, "global_step": 443155, "epoch": 2637} {"train_loss": -12.345544815063477, "global_step": 443156, "epoch": 2637} {"train_loss": -12.373558044433594, "global_step": 443157, "epoch": 2637} {"train_loss": -12.074655532836914, "global_step": 443158, "epoch": 2637} {"train_loss": -12.28758716583252, "global_step": 443159, "epoch": 2637} {"train_loss": -12.23520565032959, "global_step": 443160, "epoch": 2637} {"train_loss": -12.36315631866455, "global_step": 443161, "epoch": 2637} {"train_loss": -12.182222366333008, "global_step": 443162, "epoch": 2637} {"train_loss": -11.9993896484375, "global_step": 443163, "epoch": 2637} {"train_loss": -12.490056037902832, "global_step": 443164, "epoch": 2637} {"train_loss": -12.410865783691406, "global_step": 443165, "epoch": 2637} {"train_loss": -12.471323013305664, "global_step": 443166, "epoch": 2637} {"train_loss": -12.435527801513672, "global_step": 443167, "epoch": 2637} {"train_loss": -12.377786636352539, "global_step": 443168, "epoch": 2637} {"train_loss": -12.21766185760498, "global_step": 443169, "epoch": 2637} {"train_loss": -12.268149375915527, "global_step": 443170, "epoch": 2637} {"train_loss": -12.386852264404297, "global_step": 443171, "epoch": 2637} {"train_loss": -12.404192924499512, "global_step": 443172, "epoch": 2637} {"train_loss": -12.765585899353027, "global_step": 443173, "epoch": 2637} {"train_loss": -12.4445219039917, "global_step": 443174, "epoch": 2637} {"train_loss": -12.294817924499512, "global_step": 443175, "epoch": 2637} {"train_loss": -12.625378608703613, "global_step": 443176, "epoch": 2637} {"train_loss": -12.45840072631836, "global_step": 443177, "epoch": 2637} {"train_loss": -12.538050651550293, "global_step": 443178, "epoch": 2637} {"train_loss": -12.394383430480957, "global_step": 443179, "epoch": 2637} {"train_loss": -12.357778549194336, "global_step": 443180, "epoch": 2637} {"train_loss": -12.862096786499023, "global_step": 443181, "epoch": 2637} {"train_loss": -12.510702133178711, "global_step": 443182, "epoch": 2637} {"train_loss": -12.017357091108957, "global_step": 443183, "epoch": 2637, "val_loss": 308870.4375} {"train_loss": -12.75136947631836, "global_step": 443184, "epoch": 2638} {"train_loss": -12.767838478088379, "global_step": 443185, "epoch": 2638} {"train_loss": -12.869473457336426, "global_step": 443186, "epoch": 2638} {"train_loss": -12.616241455078125, "global_step": 443187, "epoch": 2638} {"train_loss": -12.643209457397461, "global_step": 443188, "epoch": 2638} {"train_loss": -12.53939151763916, "global_step": 443189, "epoch": 2638} {"train_loss": -12.750670433044434, "global_step": 443190, "epoch": 2638} {"train_loss": -12.712392807006836, "global_step": 443191, "epoch": 2638} {"train_loss": -12.676469802856445, "global_step": 443192, "epoch": 2638} {"train_loss": -12.762022018432617, "global_step": 443193, "epoch": 2638} {"train_loss": -12.70022964477539, "global_step": 443194, "epoch": 2638} {"train_loss": -12.709264755249023, "global_step": 443195, "epoch": 2638} {"train_loss": -12.950215339660645, "global_step": 443196, "epoch": 2638} {"train_loss": -12.961936950683594, "global_step": 443197, "epoch": 2638} {"train_loss": -12.696212768554688, "global_step": 443198, "epoch": 2638} {"train_loss": -12.784326553344727, "global_step": 443199, "epoch": 2638} {"train_loss": -12.943364143371582, "global_step": 443200, "epoch": 2638} {"train_loss": -13.040044784545898, "global_step": 443201, "epoch": 2638} {"train_loss": -12.953767776489258, "global_step": 443202, "epoch": 2638} {"train_loss": -12.730714797973633, "global_step": 443203, "epoch": 2638} {"train_loss": -12.954928398132324, "global_step": 443204, "epoch": 2638} {"train_loss": -13.043359756469727, "global_step": 443205, "epoch": 2638} {"train_loss": -12.640708923339844, "global_step": 443206, "epoch": 2638} {"train_loss": -12.85548210144043, "global_step": 443207, "epoch": 2638} {"train_loss": -12.829168319702148, "global_step": 443208, "epoch": 2638} {"train_loss": -12.690374374389648, "global_step": 443209, "epoch": 2638} {"train_loss": -12.91057014465332, "global_step": 443210, "epoch": 2638} {"train_loss": -12.808521270751953, "global_step": 443211, "epoch": 2638} {"train_loss": -12.839807510375977, "global_step": 443212, "epoch": 2638} {"train_loss": -12.79974365234375, "global_step": 443213, "epoch": 2638} {"train_loss": -12.619573593139648, "global_step": 443214, "epoch": 2638} {"train_loss": -13.115501403808594, "global_step": 443215, "epoch": 2638} {"train_loss": -12.832603454589844, "global_step": 443216, "epoch": 2638} {"train_loss": -13.091018676757812, "global_step": 443217, "epoch": 2638} {"train_loss": -12.985941886901855, "global_step": 443218, "epoch": 2638} {"train_loss": -12.584894180297852, "global_step": 443219, "epoch": 2638} {"train_loss": -12.198546409606934, "global_step": 443220, "epoch": 2638} {"train_loss": -12.668832778930664, "global_step": 443221, "epoch": 2638} {"train_loss": -12.723471641540527, "global_step": 443222, "epoch": 2638} {"train_loss": -12.439752578735352, "global_step": 443223, "epoch": 2638} {"train_loss": -12.325689315795898, "global_step": 443224, "epoch": 2638} {"train_loss": -12.216323852539062, "global_step": 443225, "epoch": 2638} {"train_loss": -12.65770149230957, "global_step": 443226, "epoch": 2638} {"train_loss": -12.58617877960205, "global_step": 443227, "epoch": 2638} {"train_loss": -12.161230087280273, "global_step": 443228, "epoch": 2638} {"train_loss": -11.540842056274414, "global_step": 443229, "epoch": 2638} {"train_loss": -12.097810745239258, "global_step": 443230, "epoch": 2638} {"train_loss": -12.330330848693848, "global_step": 443231, "epoch": 2638} {"train_loss": -12.273786544799805, "global_step": 443232, "epoch": 2638} {"train_loss": -12.719589233398438, "global_step": 443233, "epoch": 2638} {"train_loss": -12.094686508178711, "global_step": 443234, "epoch": 2638} {"train_loss": -12.62489128112793, "global_step": 443235, "epoch": 2638} {"train_loss": -11.565204620361328, "global_step": 443236, "epoch": 2638} {"train_loss": -12.347722053527832, "global_step": 443237, "epoch": 2638} {"train_loss": -11.316823959350586, "global_step": 443238, "epoch": 2638} {"train_loss": -9.03676986694336, "global_step": 443239, "epoch": 2638} {"train_loss": -11.261137962341309, "global_step": 443240, "epoch": 2638} {"train_loss": -10.031332969665527, "global_step": 443241, "epoch": 2638} {"train_loss": -10.016841888427734, "global_step": 443242, "epoch": 2638} {"train_loss": -9.18789005279541, "global_step": 443243, "epoch": 2638} {"train_loss": -10.600666046142578, "global_step": 443244, "epoch": 2638} {"train_loss": -9.649236679077148, "global_step": 443245, "epoch": 2638} {"train_loss": -9.926316261291504, "global_step": 443246, "epoch": 2638} {"train_loss": -10.30047607421875, "global_step": 443247, "epoch": 2638} {"train_loss": -8.597980499267578, "global_step": 443248, "epoch": 2638} {"train_loss": -8.604747772216797, "global_step": 443249, "epoch": 2638} {"train_loss": -9.208039283752441, "global_step": 443250, "epoch": 2638} {"train_loss": -8.575274467468262, "global_step": 443251, "epoch": 2638} {"train_loss": -10.744604110717773, "global_step": 443252, "epoch": 2638} {"train_loss": -9.823362350463867, "global_step": 443253, "epoch": 2638} {"train_loss": -9.981290817260742, "global_step": 443254, "epoch": 2638} {"train_loss": -11.405867576599121, "global_step": 443255, "epoch": 2638} {"train_loss": -9.57249641418457, "global_step": 443256, "epoch": 2638} {"train_loss": -10.470480918884277, "global_step": 443257, "epoch": 2638} {"train_loss": -10.82081413269043, "global_step": 443258, "epoch": 2638} {"train_loss": -10.725019454956055, "global_step": 443259, "epoch": 2638} {"train_loss": -11.314202308654785, "global_step": 443260, "epoch": 2638} {"train_loss": -11.200565338134766, "global_step": 443261, "epoch": 2638} {"train_loss": -11.949808120727539, "global_step": 443262, "epoch": 2638} {"train_loss": -11.561543464660645, "global_step": 443263, "epoch": 2638} {"train_loss": -11.97284984588623, "global_step": 443264, "epoch": 2638} {"train_loss": -11.871129989624023, "global_step": 443265, "epoch": 2638} {"train_loss": -11.658243179321289, "global_step": 443266, "epoch": 2638} {"train_loss": -11.947944641113281, "global_step": 443267, "epoch": 2638} {"train_loss": -11.644550323486328, "global_step": 443268, "epoch": 2638} {"train_loss": -11.924907684326172, "global_step": 443269, "epoch": 2638} {"train_loss": -12.17616081237793, "global_step": 443270, "epoch": 2638} {"train_loss": -11.991898536682129, "global_step": 443271, "epoch": 2638} {"train_loss": -11.684672355651855, "global_step": 443272, "epoch": 2638} {"train_loss": -12.125221252441406, "global_step": 443273, "epoch": 2638} {"train_loss": -12.199432373046875, "global_step": 443274, "epoch": 2638} {"train_loss": -11.875563621520996, "global_step": 443275, "epoch": 2638} {"train_loss": -12.180906295776367, "global_step": 443276, "epoch": 2638} {"train_loss": -12.51400375366211, "global_step": 443277, "epoch": 2638} {"train_loss": -12.130884170532227, "global_step": 443278, "epoch": 2638} {"train_loss": -12.168426513671875, "global_step": 443279, "epoch": 2638} {"train_loss": -12.439698219299316, "global_step": 443280, "epoch": 2638} {"train_loss": -12.192756652832031, "global_step": 443281, "epoch": 2638} {"train_loss": -12.468367576599121, "global_step": 443282, "epoch": 2638} {"train_loss": -12.043037414550781, "global_step": 443283, "epoch": 2638} {"train_loss": -12.398825645446777, "global_step": 443284, "epoch": 2638} {"train_loss": -12.220873832702637, "global_step": 443285, "epoch": 2638} {"train_loss": -12.480112075805664, "global_step": 443286, "epoch": 2638} {"train_loss": -12.289698600769043, "global_step": 443287, "epoch": 2638} {"train_loss": -12.480512619018555, "global_step": 443288, "epoch": 2638} {"train_loss": -12.308876037597656, "global_step": 443289, "epoch": 2638} {"train_loss": -12.421300888061523, "global_step": 443290, "epoch": 2638} {"train_loss": -12.120658874511719, "global_step": 443291, "epoch": 2638} {"train_loss": -12.48150634765625, "global_step": 443292, "epoch": 2638} {"train_loss": -12.387566566467285, "global_step": 443293, "epoch": 2638} {"train_loss": -12.237443923950195, "global_step": 443294, "epoch": 2638} {"train_loss": -12.36927604675293, "global_step": 443295, "epoch": 2638} {"train_loss": -12.017635345458984, "global_step": 443296, "epoch": 2638} {"train_loss": -12.434164047241211, "global_step": 443297, "epoch": 2638} {"train_loss": -12.104827880859375, "global_step": 443298, "epoch": 2638} {"train_loss": -12.636953353881836, "global_step": 443299, "epoch": 2638} {"train_loss": -12.455322265625, "global_step": 443300, "epoch": 2638} {"train_loss": -12.420433044433594, "global_step": 443301, "epoch": 2638} {"train_loss": -12.520540237426758, "global_step": 443302, "epoch": 2638} {"train_loss": -12.559403419494629, "global_step": 443303, "epoch": 2638} {"train_loss": -12.623702049255371, "global_step": 443304, "epoch": 2638} {"train_loss": -12.459601402282715, "global_step": 443305, "epoch": 2638} {"train_loss": -12.415725708007812, "global_step": 443306, "epoch": 2638} {"train_loss": -12.88274097442627, "global_step": 443307, "epoch": 2638} {"train_loss": -12.481463432312012, "global_step": 443308, "epoch": 2638} {"train_loss": -12.71855354309082, "global_step": 443309, "epoch": 2638} {"train_loss": -12.623862266540527, "global_step": 443310, "epoch": 2638} {"train_loss": -12.52116584777832, "global_step": 443311, "epoch": 2638} {"train_loss": -12.422508239746094, "global_step": 443312, "epoch": 2638} {"train_loss": -12.562268257141113, "global_step": 443313, "epoch": 2638} {"train_loss": -12.730709075927734, "global_step": 443314, "epoch": 2638} {"train_loss": -12.355125427246094, "global_step": 443315, "epoch": 2638} {"train_loss": -12.440030097961426, "global_step": 443316, "epoch": 2638} {"train_loss": -12.677729606628418, "global_step": 443317, "epoch": 2638} {"train_loss": -12.585123062133789, "global_step": 443318, "epoch": 2638} {"train_loss": -12.757143020629883, "global_step": 443319, "epoch": 2638} {"train_loss": -12.425789833068848, "global_step": 443320, "epoch": 2638} {"train_loss": -12.571211814880371, "global_step": 443321, "epoch": 2638} {"train_loss": -12.771408081054688, "global_step": 443322, "epoch": 2638} {"train_loss": -12.120378494262695, "global_step": 443323, "epoch": 2638} {"train_loss": -12.716044425964355, "global_step": 443324, "epoch": 2638} {"train_loss": -11.9017915725708, "global_step": 443325, "epoch": 2638} {"train_loss": -12.604107856750488, "global_step": 443326, "epoch": 2638} {"train_loss": -12.486615180969238, "global_step": 443327, "epoch": 2638} {"train_loss": -12.454204559326172, "global_step": 443328, "epoch": 2638} {"train_loss": -12.406417846679688, "global_step": 443329, "epoch": 2638} {"train_loss": -12.429161071777344, "global_step": 443330, "epoch": 2638} {"train_loss": -12.512807846069336, "global_step": 443331, "epoch": 2638} {"train_loss": -12.173914909362793, "global_step": 443332, "epoch": 2638} {"train_loss": -12.494182586669922, "global_step": 443333, "epoch": 2638} {"train_loss": -11.505769729614258, "global_step": 443334, "epoch": 2638} {"train_loss": -10.914831161499023, "global_step": 443335, "epoch": 2638} {"train_loss": -12.452371597290039, "global_step": 443336, "epoch": 2638} {"train_loss": -11.649133682250977, "global_step": 443337, "epoch": 2638} {"train_loss": -11.238153457641602, "global_step": 443338, "epoch": 2638} {"train_loss": -12.206536293029785, "global_step": 443339, "epoch": 2638} {"train_loss": -12.015426635742188, "global_step": 443340, "epoch": 2638} {"train_loss": -12.23779010772705, "global_step": 443341, "epoch": 2638} {"train_loss": -11.250801086425781, "global_step": 443342, "epoch": 2638} {"train_loss": -12.129121780395508, "global_step": 443343, "epoch": 2638} {"train_loss": -12.434734344482422, "global_step": 443344, "epoch": 2638} {"train_loss": -11.706588745117188, "global_step": 443345, "epoch": 2638} {"train_loss": -11.951910972595215, "global_step": 443346, "epoch": 2638} {"train_loss": -11.419649124145508, "global_step": 443347, "epoch": 2638} {"train_loss": -11.889081954956055, "global_step": 443348, "epoch": 2638} {"train_loss": -11.646011352539062, "global_step": 443349, "epoch": 2638} {"train_loss": -12.144426345825195, "global_step": 443350, "epoch": 2638} {"train_loss": -12.053401481537591, "global_step": 443351, "epoch": 2638, "val_loss": 303953.28125} {"train_loss": -11.310432434082031, "global_step": 443352, "epoch": 2639} {"train_loss": -11.787226676940918, "global_step": 443353, "epoch": 2639} {"train_loss": -11.069804191589355, "global_step": 443354, "epoch": 2639} {"train_loss": -11.89809513092041, "global_step": 443355, "epoch": 2639} {"train_loss": -11.353218078613281, "global_step": 443356, "epoch": 2639} {"train_loss": -12.112464904785156, "global_step": 443357, "epoch": 2639} {"train_loss": -12.021865844726562, "global_step": 443358, "epoch": 2639} {"train_loss": -11.70969009399414, "global_step": 443359, "epoch": 2639} {"train_loss": -11.870208740234375, "global_step": 443360, "epoch": 2639} {"train_loss": -11.688467025756836, "global_step": 443361, "epoch": 2639} {"train_loss": -12.389364242553711, "global_step": 443362, "epoch": 2639} {"train_loss": -11.850654602050781, "global_step": 443363, "epoch": 2639} {"train_loss": -12.407441139221191, "global_step": 443364, "epoch": 2639} {"train_loss": -11.923276901245117, "global_step": 443365, "epoch": 2639} {"train_loss": -11.866021156311035, "global_step": 443366, "epoch": 2639} {"train_loss": -12.038402557373047, "global_step": 443367, "epoch": 2639} {"train_loss": -11.670400619506836, "global_step": 443368, "epoch": 2639} {"train_loss": -12.013635635375977, "global_step": 443369, "epoch": 2639} {"train_loss": -11.971700668334961, "global_step": 443370, "epoch": 2639} {"train_loss": -12.16982650756836, "global_step": 443371, "epoch": 2639} {"train_loss": -12.407508850097656, "global_step": 443372, "epoch": 2639} {"train_loss": -12.063973426818848, "global_step": 443373, "epoch": 2639} {"train_loss": -12.339232444763184, "global_step": 443374, "epoch": 2639} {"train_loss": -11.988729476928711, "global_step": 443375, "epoch": 2639} {"train_loss": -12.533066749572754, "global_step": 443376, "epoch": 2639} {"train_loss": -11.907692909240723, "global_step": 443377, "epoch": 2639} {"train_loss": -12.078935623168945, "global_step": 443378, "epoch": 2639} {"train_loss": -12.283123970031738, "global_step": 443379, "epoch": 2639} {"train_loss": -12.285478591918945, "global_step": 443380, "epoch": 2639} {"train_loss": -12.349224090576172, "global_step": 443381, "epoch": 2639} {"train_loss": -12.127174377441406, "global_step": 443382, "epoch": 2639} {"train_loss": -12.418319702148438, "global_step": 443383, "epoch": 2639} {"train_loss": -12.586250305175781, "global_step": 443384, "epoch": 2639} {"train_loss": -12.42659854888916, "global_step": 443385, "epoch": 2639} {"train_loss": -12.446860313415527, "global_step": 443386, "epoch": 2639} {"train_loss": -12.755796432495117, "global_step": 443387, "epoch": 2639} {"train_loss": -12.599563598632812, "global_step": 443388, "epoch": 2639} {"train_loss": -12.56042766571045, "global_step": 443389, "epoch": 2639} {"train_loss": -12.367359161376953, "global_step": 443390, "epoch": 2639} {"train_loss": -12.771162033081055, "global_step": 443391, "epoch": 2639} {"train_loss": -12.510507583618164, "global_step": 443392, "epoch": 2639} {"train_loss": -12.395751953125, "global_step": 443393, "epoch": 2639} {"train_loss": -12.187260627746582, "global_step": 443394, "epoch": 2639} {"train_loss": -12.450919151306152, "global_step": 443395, "epoch": 2639} {"train_loss": -12.380383491516113, "global_step": 443396, "epoch": 2639} {"train_loss": -11.881027221679688, "global_step": 443397, "epoch": 2639} {"train_loss": -12.350652694702148, "global_step": 443398, "epoch": 2639} {"train_loss": -12.390190124511719, "global_step": 443399, "epoch": 2639} {"train_loss": -11.939550399780273, "global_step": 443400, "epoch": 2639} {"train_loss": -12.496986389160156, "global_step": 443401, "epoch": 2639} {"train_loss": -11.534379959106445, "global_step": 443402, "epoch": 2639} {"train_loss": -11.306684494018555, "global_step": 443403, "epoch": 2639} {"train_loss": -12.005071640014648, "global_step": 443404, "epoch": 2639} {"train_loss": -11.67843246459961, "global_step": 443405, "epoch": 2639} {"train_loss": -11.11300277709961, "global_step": 443406, "epoch": 2639} {"train_loss": -12.04636001586914, "global_step": 443407, "epoch": 2639} {"train_loss": -11.40765380859375, "global_step": 443408, "epoch": 2639} {"train_loss": -11.916306495666504, "global_step": 443409, "epoch": 2639} {"train_loss": -11.85892105102539, "global_step": 443410, "epoch": 2639} {"train_loss": -11.55694580078125, "global_step": 443411, "epoch": 2639} {"train_loss": -12.385818481445312, "global_step": 443412, "epoch": 2639} {"train_loss": -12.574126243591309, "global_step": 443413, "epoch": 2639} {"train_loss": -12.11249828338623, "global_step": 443414, "epoch": 2639} {"train_loss": -12.630521774291992, "global_step": 443415, "epoch": 2639} {"train_loss": -12.112504959106445, "global_step": 443416, "epoch": 2639} {"train_loss": -12.741439819335938, "global_step": 443417, "epoch": 2639} {"train_loss": -12.179206848144531, "global_step": 443418, "epoch": 2639} {"train_loss": -12.524044036865234, "global_step": 443419, "epoch": 2639} {"train_loss": -12.432394027709961, "global_step": 443420, "epoch": 2639} {"train_loss": -12.487788200378418, "global_step": 443421, "epoch": 2639} {"train_loss": -12.649286270141602, "global_step": 443422, "epoch": 2639} {"train_loss": -12.265218734741211, "global_step": 443423, "epoch": 2639} {"train_loss": -12.426712036132812, "global_step": 443424, "epoch": 2639} {"train_loss": -12.041109085083008, "global_step": 443425, "epoch": 2639} {"train_loss": -11.239213943481445, "global_step": 443426, "epoch": 2639} {"train_loss": -12.167594909667969, "global_step": 443427, "epoch": 2639} {"train_loss": -12.382835388183594, "global_step": 443428, "epoch": 2639} {"train_loss": -11.542978286743164, "global_step": 443429, "epoch": 2639} {"train_loss": -12.54869270324707, "global_step": 443430, "epoch": 2639} {"train_loss": -12.340349197387695, "global_step": 443431, "epoch": 2639} {"train_loss": -11.966634750366211, "global_step": 443432, "epoch": 2639} {"train_loss": -12.29153823852539, "global_step": 443433, "epoch": 2639} {"train_loss": -11.644548416137695, "global_step": 443434, "epoch": 2639} {"train_loss": -12.52375602722168, "global_step": 443435, "epoch": 2639} {"train_loss": -12.413336753845215, "global_step": 443436, "epoch": 2639} {"train_loss": -12.44418716430664, "global_step": 443437, "epoch": 2639} {"train_loss": -12.802358627319336, "global_step": 443438, "epoch": 2639} {"train_loss": -12.743629455566406, "global_step": 443439, "epoch": 2639} {"train_loss": -12.314319610595703, "global_step": 443440, "epoch": 2639} {"train_loss": -12.803451538085938, "global_step": 443441, "epoch": 2639} {"train_loss": -12.57475757598877, "global_step": 443442, "epoch": 2639} {"train_loss": -12.768041610717773, "global_step": 443443, "epoch": 2639} {"train_loss": -12.694592475891113, "global_step": 443444, "epoch": 2639} {"train_loss": -12.607434272766113, "global_step": 443445, "epoch": 2639} {"train_loss": -12.762876510620117, "global_step": 443446, "epoch": 2639} {"train_loss": -12.41296672821045, "global_step": 443447, "epoch": 2639} {"train_loss": -12.986747741699219, "global_step": 443448, "epoch": 2639} {"train_loss": -12.546361923217773, "global_step": 443449, "epoch": 2639} {"train_loss": -12.764902114868164, "global_step": 443450, "epoch": 2639} {"train_loss": -12.448932647705078, "global_step": 443451, "epoch": 2639} {"train_loss": -12.52334213256836, "global_step": 443452, "epoch": 2639} {"train_loss": -12.62486743927002, "global_step": 443453, "epoch": 2639} {"train_loss": -12.782356262207031, "global_step": 443454, "epoch": 2639} {"train_loss": -12.517998695373535, "global_step": 443455, "epoch": 2639} {"train_loss": -12.431177139282227, "global_step": 443456, "epoch": 2639} {"train_loss": -12.423118591308594, "global_step": 443457, "epoch": 2639} {"train_loss": -12.170604705810547, "global_step": 443458, "epoch": 2639} {"train_loss": -12.620735168457031, "global_step": 443459, "epoch": 2639} {"train_loss": -11.844961166381836, "global_step": 443460, "epoch": 2639} {"train_loss": -12.287250518798828, "global_step": 443461, "epoch": 2639} {"train_loss": -11.934252738952637, "global_step": 443462, "epoch": 2639} {"train_loss": -12.135374069213867, "global_step": 443463, "epoch": 2639} {"train_loss": -12.39168643951416, "global_step": 443464, "epoch": 2639} {"train_loss": -11.814002990722656, "global_step": 443465, "epoch": 2639} {"train_loss": -12.085830688476562, "global_step": 443466, "epoch": 2639} {"train_loss": -11.954229354858398, "global_step": 443467, "epoch": 2639} {"train_loss": -11.997234344482422, "global_step": 443468, "epoch": 2639} {"train_loss": -11.935859680175781, "global_step": 443469, "epoch": 2639} {"train_loss": -11.542952537536621, "global_step": 443470, "epoch": 2639} {"train_loss": -11.039640426635742, "global_step": 443471, "epoch": 2639} {"train_loss": -11.884358406066895, "global_step": 443472, "epoch": 2639} {"train_loss": -11.186352729797363, "global_step": 443473, "epoch": 2639} {"train_loss": -11.317599296569824, "global_step": 443474, "epoch": 2639} {"train_loss": -12.179889678955078, "global_step": 443475, "epoch": 2639} {"train_loss": -11.722736358642578, "global_step": 443476, "epoch": 2639} {"train_loss": -12.06271743774414, "global_step": 443477, "epoch": 2639} {"train_loss": -12.424270629882812, "global_step": 443478, "epoch": 2639} {"train_loss": -11.76611042022705, "global_step": 443479, "epoch": 2639} {"train_loss": -12.341440200805664, "global_step": 443480, "epoch": 2639} {"train_loss": -12.01289176940918, "global_step": 443481, "epoch": 2639} {"train_loss": -11.955392837524414, "global_step": 443482, "epoch": 2639} {"train_loss": -12.701229095458984, "global_step": 443483, "epoch": 2639} {"train_loss": -12.182796478271484, "global_step": 443484, "epoch": 2639} {"train_loss": -12.046371459960938, "global_step": 443485, "epoch": 2639} {"train_loss": -12.373880386352539, "global_step": 443486, "epoch": 2639} {"train_loss": -12.342089653015137, "global_step": 443487, "epoch": 2639} {"train_loss": -11.764158248901367, "global_step": 443488, "epoch": 2639} {"train_loss": -12.41915512084961, "global_step": 443489, "epoch": 2639} {"train_loss": -11.530221939086914, "global_step": 443490, "epoch": 2639} {"train_loss": -12.576408386230469, "global_step": 443491, "epoch": 2639} {"train_loss": -12.070417404174805, "global_step": 443492, "epoch": 2639} {"train_loss": -12.078601837158203, "global_step": 443493, "epoch": 2639} {"train_loss": -12.642826080322266, "global_step": 443494, "epoch": 2639} {"train_loss": -12.091680526733398, "global_step": 443495, "epoch": 2639} {"train_loss": -11.725675582885742, "global_step": 443496, "epoch": 2639} {"train_loss": -12.463470458984375, "global_step": 443497, "epoch": 2639} {"train_loss": -12.55870532989502, "global_step": 443498, "epoch": 2639} {"train_loss": -12.23274040222168, "global_step": 443499, "epoch": 2639} {"train_loss": -12.48581314086914, "global_step": 443500, "epoch": 2639} {"train_loss": -12.580060958862305, "global_step": 443501, "epoch": 2639} {"train_loss": -12.329975128173828, "global_step": 443502, "epoch": 2639} {"train_loss": -12.741127014160156, "global_step": 443503, "epoch": 2639} {"train_loss": -12.697615623474121, "global_step": 443504, "epoch": 2639} {"train_loss": -12.589512825012207, "global_step": 443505, "epoch": 2639} {"train_loss": -12.329407691955566, "global_step": 443506, "epoch": 2639} {"train_loss": -12.434778213500977, "global_step": 443507, "epoch": 2639} {"train_loss": -12.830451011657715, "global_step": 443508, "epoch": 2639} {"train_loss": -12.572063446044922, "global_step": 443509, "epoch": 2639} {"train_loss": -12.519967079162598, "global_step": 443510, "epoch": 2639} {"train_loss": -12.43886947631836, "global_step": 443511, "epoch": 2639} {"train_loss": -12.591728210449219, "global_step": 443512, "epoch": 2639} {"train_loss": -12.535651206970215, "global_step": 443513, "epoch": 2639} {"train_loss": -12.51899528503418, "global_step": 443514, "epoch": 2639} {"train_loss": -12.616019248962402, "global_step": 443515, "epoch": 2639} {"train_loss": -12.489906311035156, "global_step": 443516, "epoch": 2639} {"train_loss": -12.552424430847168, "global_step": 443517, "epoch": 2639} {"train_loss": -12.410636901855469, "global_step": 443518, "epoch": 2639} {"train_loss": -12.217940131823221, "global_step": 443519, "epoch": 2639, "val_loss": 310053.84375} {"train_loss": -12.576549530029297, "global_step": 443520, "epoch": 2640} {"train_loss": -12.506355285644531, "global_step": 443521, "epoch": 2640} {"train_loss": -12.428871154785156, "global_step": 443522, "epoch": 2640} {"train_loss": -12.706113815307617, "global_step": 443523, "epoch": 2640} {"train_loss": -12.488845825195312, "global_step": 443524, "epoch": 2640} {"train_loss": -12.70809555053711, "global_step": 443525, "epoch": 2640} {"train_loss": -12.557713508605957, "global_step": 443526, "epoch": 2640} {"train_loss": -12.538246154785156, "global_step": 443527, "epoch": 2640} {"train_loss": -12.586416244506836, "global_step": 443528, "epoch": 2640} {"train_loss": -12.338153839111328, "global_step": 443529, "epoch": 2640} {"train_loss": -12.417743682861328, "global_step": 443530, "epoch": 2640} {"train_loss": -12.696342468261719, "global_step": 443531, "epoch": 2640} {"train_loss": -12.078367233276367, "global_step": 443532, "epoch": 2640} {"train_loss": -12.25281047821045, "global_step": 443533, "epoch": 2640} {"train_loss": -12.881024360656738, "global_step": 443534, "epoch": 2640} {"train_loss": -12.101214408874512, "global_step": 443535, "epoch": 2640} {"train_loss": -12.332876205444336, "global_step": 443536, "epoch": 2640} {"train_loss": -12.745952606201172, "global_step": 443537, "epoch": 2640} {"train_loss": -11.996808052062988, "global_step": 443538, "epoch": 2640} {"train_loss": -12.525287628173828, "global_step": 443539, "epoch": 2640} {"train_loss": -12.397528648376465, "global_step": 443540, "epoch": 2640} {"train_loss": -12.346075057983398, "global_step": 443541, "epoch": 2640} {"train_loss": -12.52977180480957, "global_step": 443542, "epoch": 2640} {"train_loss": -12.549051284790039, "global_step": 443543, "epoch": 2640} {"train_loss": -12.536897659301758, "global_step": 443544, "epoch": 2640} {"train_loss": -12.686604499816895, "global_step": 443545, "epoch": 2640} {"train_loss": -12.748588562011719, "global_step": 443546, "epoch": 2640} {"train_loss": -12.622814178466797, "global_step": 443547, "epoch": 2640} {"train_loss": -12.69251823425293, "global_step": 443548, "epoch": 2640} {"train_loss": -12.789234161376953, "global_step": 443549, "epoch": 2640} {"train_loss": -12.792337417602539, "global_step": 443550, "epoch": 2640} {"train_loss": -12.847844123840332, "global_step": 443551, "epoch": 2640} {"train_loss": -12.741300582885742, "global_step": 443552, "epoch": 2640} {"train_loss": -12.804975509643555, "global_step": 443553, "epoch": 2640} {"train_loss": -12.572986602783203, "global_step": 443554, "epoch": 2640} {"train_loss": -12.640865325927734, "global_step": 443555, "epoch": 2640} {"train_loss": -12.739452362060547, "global_step": 443556, "epoch": 2640} {"train_loss": -12.751180648803711, "global_step": 443557, "epoch": 2640} {"train_loss": -12.446677207946777, "global_step": 443558, "epoch": 2640} {"train_loss": -12.855833053588867, "global_step": 443559, "epoch": 2640} {"train_loss": -12.533865928649902, "global_step": 443560, "epoch": 2640} {"train_loss": -12.443172454833984, "global_step": 443561, "epoch": 2640} {"train_loss": -12.762542724609375, "global_step": 443562, "epoch": 2640} {"train_loss": -12.732545852661133, "global_step": 443563, "epoch": 2640} {"train_loss": -12.81902027130127, "global_step": 443564, "epoch": 2640} {"train_loss": -12.796114921569824, "global_step": 443565, "epoch": 2640} {"train_loss": -12.647407531738281, "global_step": 443566, "epoch": 2640} {"train_loss": -12.880962371826172, "global_step": 443567, "epoch": 2640} {"train_loss": -12.639995574951172, "global_step": 443568, "epoch": 2640} {"train_loss": -11.919683456420898, "global_step": 443569, "epoch": 2640} {"train_loss": -12.005027770996094, "global_step": 443570, "epoch": 2640} {"train_loss": -12.401719093322754, "global_step": 443571, "epoch": 2640} {"train_loss": -12.612858772277832, "global_step": 443572, "epoch": 2640} {"train_loss": -11.293006896972656, "global_step": 443573, "epoch": 2640} {"train_loss": -11.201849937438965, "global_step": 443574, "epoch": 2640} {"train_loss": -11.728097915649414, "global_step": 443575, "epoch": 2640} {"train_loss": -11.369532585144043, "global_step": 443576, "epoch": 2640} {"train_loss": -12.29069995880127, "global_step": 443577, "epoch": 2640} {"train_loss": -11.669195175170898, "global_step": 443578, "epoch": 2640} {"train_loss": -12.14520263671875, "global_step": 443579, "epoch": 2640} {"train_loss": -12.353859901428223, "global_step": 443580, "epoch": 2640} {"train_loss": -12.262470245361328, "global_step": 443581, "epoch": 2640} {"train_loss": -11.10932731628418, "global_step": 443582, "epoch": 2640} {"train_loss": -11.686851501464844, "global_step": 443583, "epoch": 2640} {"train_loss": -12.177468299865723, "global_step": 443584, "epoch": 2640} {"train_loss": -12.290810585021973, "global_step": 443585, "epoch": 2640} {"train_loss": -11.605788230895996, "global_step": 443586, "epoch": 2640} {"train_loss": -11.755836486816406, "global_step": 443587, "epoch": 2640} {"train_loss": -12.515599250793457, "global_step": 443588, "epoch": 2640} {"train_loss": -11.9493408203125, "global_step": 443589, "epoch": 2640} {"train_loss": -11.59813117980957, "global_step": 443590, "epoch": 2640} {"train_loss": -11.056436538696289, "global_step": 443591, "epoch": 2640} {"train_loss": -12.119178771972656, "global_step": 443592, "epoch": 2640} {"train_loss": -10.78780746459961, "global_step": 443593, "epoch": 2640} {"train_loss": -11.076566696166992, "global_step": 443594, "epoch": 2640} {"train_loss": -10.75640869140625, "global_step": 443595, "epoch": 2640} {"train_loss": -10.616342544555664, "global_step": 443596, "epoch": 2640} {"train_loss": -11.805281639099121, "global_step": 443597, "epoch": 2640} {"train_loss": -9.830459594726562, "global_step": 443598, "epoch": 2640} {"train_loss": -10.667047500610352, "global_step": 443599, "epoch": 2640} {"train_loss": -12.472640991210938, "global_step": 443600, "epoch": 2640} {"train_loss": -10.54776382446289, "global_step": 443601, "epoch": 2640} {"train_loss": -11.83243465423584, "global_step": 443602, "epoch": 2640} {"train_loss": -10.527116775512695, "global_step": 443603, "epoch": 2640} {"train_loss": -11.60069751739502, "global_step": 443604, "epoch": 2640} {"train_loss": -11.827215194702148, "global_step": 443605, "epoch": 2640} {"train_loss": -11.470376968383789, "global_step": 443606, "epoch": 2640} {"train_loss": -12.297770500183105, "global_step": 443607, "epoch": 2640} {"train_loss": -11.241357803344727, "global_step": 443608, "epoch": 2640} {"train_loss": -12.426730155944824, "global_step": 443609, "epoch": 2640} {"train_loss": -11.875120162963867, "global_step": 443610, "epoch": 2640} {"train_loss": -12.467142105102539, "global_step": 443611, "epoch": 2640} {"train_loss": -11.663785934448242, "global_step": 443612, "epoch": 2640} {"train_loss": -12.480777740478516, "global_step": 443613, "epoch": 2640} {"train_loss": -11.827369689941406, "global_step": 443614, "epoch": 2640} {"train_loss": -12.413777351379395, "global_step": 443615, "epoch": 2640} {"train_loss": -12.249853134155273, "global_step": 443616, "epoch": 2640} {"train_loss": -12.315431594848633, "global_step": 443617, "epoch": 2640} {"train_loss": -12.27513313293457, "global_step": 443618, "epoch": 2640} {"train_loss": -12.318235397338867, "global_step": 443619, "epoch": 2640} {"train_loss": -12.154353141784668, "global_step": 443620, "epoch": 2640} {"train_loss": -11.516833305358887, "global_step": 443621, "epoch": 2640} {"train_loss": -12.397733688354492, "global_step": 443622, "epoch": 2640} {"train_loss": -11.93687915802002, "global_step": 443623, "epoch": 2640} {"train_loss": -11.509634971618652, "global_step": 443624, "epoch": 2640} {"train_loss": -12.133590698242188, "global_step": 443625, "epoch": 2640} {"train_loss": -11.201948165893555, "global_step": 443626, "epoch": 2640} {"train_loss": -11.008001327514648, "global_step": 443627, "epoch": 2640} {"train_loss": -12.05868911743164, "global_step": 443628, "epoch": 2640} {"train_loss": -10.614862442016602, "global_step": 443629, "epoch": 2640} {"train_loss": -12.371188163757324, "global_step": 443630, "epoch": 2640} {"train_loss": -11.253425598144531, "global_step": 443631, "epoch": 2640} {"train_loss": -11.813546180725098, "global_step": 443632, "epoch": 2640} {"train_loss": -12.068119049072266, "global_step": 443633, "epoch": 2640} {"train_loss": -11.897441864013672, "global_step": 443634, "epoch": 2640} {"train_loss": -12.502649307250977, "global_step": 443635, "epoch": 2640} {"train_loss": -11.877176284790039, "global_step": 443636, "epoch": 2640} {"train_loss": -12.187212944030762, "global_step": 443637, "epoch": 2640} {"train_loss": -12.039831161499023, "global_step": 443638, "epoch": 2640} {"train_loss": -12.028647422790527, "global_step": 443639, "epoch": 2640} {"train_loss": -12.336997032165527, "global_step": 443640, "epoch": 2640} {"train_loss": -12.21799373626709, "global_step": 443641, "epoch": 2640} {"train_loss": -12.45492172241211, "global_step": 443642, "epoch": 2640} {"train_loss": -11.781984329223633, "global_step": 443643, "epoch": 2640} {"train_loss": -12.414811134338379, "global_step": 443644, "epoch": 2640} {"train_loss": -12.083853721618652, "global_step": 443645, "epoch": 2640} {"train_loss": -11.735438346862793, "global_step": 443646, "epoch": 2640} {"train_loss": -12.430832862854004, "global_step": 443647, "epoch": 2640} {"train_loss": -12.162727355957031, "global_step": 443648, "epoch": 2640} {"train_loss": -12.503595352172852, "global_step": 443649, "epoch": 2640} {"train_loss": -12.362093925476074, "global_step": 443650, "epoch": 2640} {"train_loss": -12.425701141357422, "global_step": 443651, "epoch": 2640} {"train_loss": -12.23551082611084, "global_step": 443652, "epoch": 2640} {"train_loss": -12.306082725524902, "global_step": 443653, "epoch": 2640} {"train_loss": -12.213645935058594, "global_step": 443654, "epoch": 2640} {"train_loss": -12.156988143920898, "global_step": 443655, "epoch": 2640} {"train_loss": -12.048469543457031, "global_step": 443656, "epoch": 2640} {"train_loss": -12.392101287841797, "global_step": 443657, "epoch": 2640} {"train_loss": -12.043416023254395, "global_step": 443658, "epoch": 2640} {"train_loss": -12.551576614379883, "global_step": 443659, "epoch": 2640} {"train_loss": -12.435006141662598, "global_step": 443660, "epoch": 2640} {"train_loss": -12.04814338684082, "global_step": 443661, "epoch": 2640} {"train_loss": -12.383523941040039, "global_step": 443662, "epoch": 2640} {"train_loss": -12.023770332336426, "global_step": 443663, "epoch": 2640} {"train_loss": -12.20688247680664, "global_step": 443664, "epoch": 2640} {"train_loss": -12.441499710083008, "global_step": 443665, "epoch": 2640} {"train_loss": -12.372340202331543, "global_step": 443666, "epoch": 2640} {"train_loss": -12.280800819396973, "global_step": 443667, "epoch": 2640} {"train_loss": -12.364845275878906, "global_step": 443668, "epoch": 2640} {"train_loss": -12.4022855758667, "global_step": 443669, "epoch": 2640} {"train_loss": -12.357338905334473, "global_step": 443670, "epoch": 2640} {"train_loss": -11.49176025390625, "global_step": 443671, "epoch": 2640} {"train_loss": -12.00814437866211, "global_step": 443672, "epoch": 2640} {"train_loss": -12.058320045471191, "global_step": 443673, "epoch": 2640} {"train_loss": -11.582521438598633, "global_step": 443674, "epoch": 2640} {"train_loss": -11.808748245239258, "global_step": 443675, "epoch": 2640} {"train_loss": -11.111806869506836, "global_step": 443676, "epoch": 2640} {"train_loss": -12.382123947143555, "global_step": 443677, "epoch": 2640} {"train_loss": -11.213354110717773, "global_step": 443678, "epoch": 2640} {"train_loss": -12.36919116973877, "global_step": 443679, "epoch": 2640} {"train_loss": -11.70244312286377, "global_step": 443680, "epoch": 2640} {"train_loss": -11.645868301391602, "global_step": 443681, "epoch": 2640} {"train_loss": -12.288658142089844, "global_step": 443682, "epoch": 2640} {"train_loss": -11.12968635559082, "global_step": 443683, "epoch": 2640} {"train_loss": -12.150740623474121, "global_step": 443684, "epoch": 2640} {"train_loss": -10.927037239074707, "global_step": 443685, "epoch": 2640} {"train_loss": -12.174745559692383, "global_step": 443686, "epoch": 2640} {"train_loss": -12.093809071041289, "global_step": 443687, "epoch": 2640, "val_loss": 312155.75, "train_action_mse_error": 1.9007071256637573} {"train_loss": -12.465651512145996, "global_step": 443688, "epoch": 2641} {"train_loss": -11.93055534362793, "global_step": 443689, "epoch": 2641} {"train_loss": -11.993069648742676, "global_step": 443690, "epoch": 2641} {"train_loss": -12.084359169006348, "global_step": 443691, "epoch": 2641} {"train_loss": -11.929327011108398, "global_step": 443692, "epoch": 2641} {"train_loss": -12.691242218017578, "global_step": 443693, "epoch": 2641} {"train_loss": -11.677824974060059, "global_step": 443694, "epoch": 2641} {"train_loss": -12.728660583496094, "global_step": 443695, "epoch": 2641} {"train_loss": -11.83482551574707, "global_step": 443696, "epoch": 2641} {"train_loss": -12.312284469604492, "global_step": 443697, "epoch": 2641} {"train_loss": -12.478340148925781, "global_step": 443698, "epoch": 2641} {"train_loss": -12.073871612548828, "global_step": 443699, "epoch": 2641} {"train_loss": -12.243961334228516, "global_step": 443700, "epoch": 2641} {"train_loss": -12.134950637817383, "global_step": 443701, "epoch": 2641} {"train_loss": -12.493841171264648, "global_step": 443702, "epoch": 2641} {"train_loss": -12.033467292785645, "global_step": 443703, "epoch": 2641} {"train_loss": -12.001653671264648, "global_step": 443704, "epoch": 2641} {"train_loss": -12.279739379882812, "global_step": 443705, "epoch": 2641} {"train_loss": -12.183021545410156, "global_step": 443706, "epoch": 2641} {"train_loss": -11.506990432739258, "global_step": 443707, "epoch": 2641} {"train_loss": -12.604072570800781, "global_step": 443708, "epoch": 2641} {"train_loss": -11.367137908935547, "global_step": 443709, "epoch": 2641} {"train_loss": -12.46055793762207, "global_step": 443710, "epoch": 2641} {"train_loss": -11.42751693725586, "global_step": 443711, "epoch": 2641} {"train_loss": -12.04865550994873, "global_step": 443712, "epoch": 2641} {"train_loss": -12.153949737548828, "global_step": 443713, "epoch": 2641} {"train_loss": -12.063809394836426, "global_step": 443714, "epoch": 2641} {"train_loss": -11.93677806854248, "global_step": 443715, "epoch": 2641} {"train_loss": -12.18991470336914, "global_step": 443716, "epoch": 2641} {"train_loss": -11.603218078613281, "global_step": 443717, "epoch": 2641} {"train_loss": -11.140531539916992, "global_step": 443718, "epoch": 2641} {"train_loss": -11.604750633239746, "global_step": 443719, "epoch": 2641} {"train_loss": -11.403510093688965, "global_step": 443720, "epoch": 2641} {"train_loss": -12.197975158691406, "global_step": 443721, "epoch": 2641} {"train_loss": -11.44859504699707, "global_step": 443722, "epoch": 2641} {"train_loss": -12.281452178955078, "global_step": 443723, "epoch": 2641} {"train_loss": -11.498619079589844, "global_step": 443724, "epoch": 2641} {"train_loss": -12.328516006469727, "global_step": 443725, "epoch": 2641} {"train_loss": -11.697861671447754, "global_step": 443726, "epoch": 2641} {"train_loss": -12.343873023986816, "global_step": 443727, "epoch": 2641} {"train_loss": -11.988304138183594, "global_step": 443728, "epoch": 2641} {"train_loss": -12.543867111206055, "global_step": 443729, "epoch": 2641} {"train_loss": -11.859935760498047, "global_step": 443730, "epoch": 2641} {"train_loss": -12.552966117858887, "global_step": 443731, "epoch": 2641} {"train_loss": -12.171847343444824, "global_step": 443732, "epoch": 2641} {"train_loss": -12.39133071899414, "global_step": 443733, "epoch": 2641} {"train_loss": -12.588825225830078, "global_step": 443734, "epoch": 2641} {"train_loss": -12.478382110595703, "global_step": 443735, "epoch": 2641} {"train_loss": -12.393584251403809, "global_step": 443736, "epoch": 2641} {"train_loss": -12.514495849609375, "global_step": 443737, "epoch": 2641} {"train_loss": -12.639791488647461, "global_step": 443738, "epoch": 2641} {"train_loss": -12.534992218017578, "global_step": 443739, "epoch": 2641} {"train_loss": -12.338424682617188, "global_step": 443740, "epoch": 2641} {"train_loss": -12.436861038208008, "global_step": 443741, "epoch": 2641} {"train_loss": -12.570699691772461, "global_step": 443742, "epoch": 2641} {"train_loss": -12.403417587280273, "global_step": 443743, "epoch": 2641} {"train_loss": -12.709829330444336, "global_step": 443744, "epoch": 2641} {"train_loss": -12.622872352600098, "global_step": 443745, "epoch": 2641} {"train_loss": -12.17430305480957, "global_step": 443746, "epoch": 2641} {"train_loss": -12.54594612121582, "global_step": 443747, "epoch": 2641} {"train_loss": -12.384897232055664, "global_step": 443748, "epoch": 2641} {"train_loss": -12.490226745605469, "global_step": 443749, "epoch": 2641} {"train_loss": -12.455345153808594, "global_step": 443750, "epoch": 2641} {"train_loss": -12.252388000488281, "global_step": 443751, "epoch": 2641} {"train_loss": -12.606222152709961, "global_step": 443752, "epoch": 2641} {"train_loss": -12.272708892822266, "global_step": 443753, "epoch": 2641} {"train_loss": -12.380331039428711, "global_step": 443754, "epoch": 2641} {"train_loss": -12.54362678527832, "global_step": 443755, "epoch": 2641} {"train_loss": -12.429712295532227, "global_step": 443756, "epoch": 2641} {"train_loss": -12.586885452270508, "global_step": 443757, "epoch": 2641} {"train_loss": -12.478811264038086, "global_step": 443758, "epoch": 2641} {"train_loss": -12.420167922973633, "global_step": 443759, "epoch": 2641} {"train_loss": -12.211936950683594, "global_step": 443760, "epoch": 2641} {"train_loss": -12.624622344970703, "global_step": 443761, "epoch": 2641} {"train_loss": -12.219686508178711, "global_step": 443762, "epoch": 2641} {"train_loss": -12.631708145141602, "global_step": 443763, "epoch": 2641} {"train_loss": -11.964465141296387, "global_step": 443764, "epoch": 2641} {"train_loss": -12.107708930969238, "global_step": 443765, "epoch": 2641} {"train_loss": -12.407633781433105, "global_step": 443766, "epoch": 2641} {"train_loss": -12.238113403320312, "global_step": 443767, "epoch": 2641} {"train_loss": -11.29981517791748, "global_step": 443768, "epoch": 2641} {"train_loss": -12.115078926086426, "global_step": 443769, "epoch": 2641} {"train_loss": -11.387517929077148, "global_step": 443770, "epoch": 2641} {"train_loss": -12.265474319458008, "global_step": 443771, "epoch": 2641} {"train_loss": -11.339591979980469, "global_step": 443772, "epoch": 2641} {"train_loss": -11.64857292175293, "global_step": 443773, "epoch": 2641} {"train_loss": -12.471717834472656, "global_step": 443774, "epoch": 2641} {"train_loss": -12.051380157470703, "global_step": 443775, "epoch": 2641} {"train_loss": -11.968414306640625, "global_step": 443776, "epoch": 2641} {"train_loss": -12.412940979003906, "global_step": 443777, "epoch": 2641} {"train_loss": -12.475088119506836, "global_step": 443778, "epoch": 2641} {"train_loss": -12.240148544311523, "global_step": 443779, "epoch": 2641} {"train_loss": -12.710796356201172, "global_step": 443780, "epoch": 2641} {"train_loss": -12.286069869995117, "global_step": 443781, "epoch": 2641} {"train_loss": -12.767538070678711, "global_step": 443782, "epoch": 2641} {"train_loss": -12.521236419677734, "global_step": 443783, "epoch": 2641} {"train_loss": -12.906388282775879, "global_step": 443784, "epoch": 2641} {"train_loss": -12.544364929199219, "global_step": 443785, "epoch": 2641} {"train_loss": -12.538017272949219, "global_step": 443786, "epoch": 2641} {"train_loss": -12.483953475952148, "global_step": 443787, "epoch": 2641} {"train_loss": -12.720314025878906, "global_step": 443788, "epoch": 2641} {"train_loss": -12.663989067077637, "global_step": 443789, "epoch": 2641} {"train_loss": -12.464482307434082, "global_step": 443790, "epoch": 2641} {"train_loss": -12.628968238830566, "global_step": 443791, "epoch": 2641} {"train_loss": -12.352999687194824, "global_step": 443792, "epoch": 2641} {"train_loss": -12.466972351074219, "global_step": 443793, "epoch": 2641} {"train_loss": -12.315810203552246, "global_step": 443794, "epoch": 2641} {"train_loss": -12.38238525390625, "global_step": 443795, "epoch": 2641} {"train_loss": -12.122281074523926, "global_step": 443796, "epoch": 2641} {"train_loss": -12.470718383789062, "global_step": 443797, "epoch": 2641} {"train_loss": -12.223979949951172, "global_step": 443798, "epoch": 2641} {"train_loss": -11.743428230285645, "global_step": 443799, "epoch": 2641} {"train_loss": -12.31265640258789, "global_step": 443800, "epoch": 2641} {"train_loss": -11.882248878479004, "global_step": 443801, "epoch": 2641} {"train_loss": -12.253273963928223, "global_step": 443802, "epoch": 2641} {"train_loss": -12.256202697753906, "global_step": 443803, "epoch": 2641} {"train_loss": -11.983951568603516, "global_step": 443804, "epoch": 2641} {"train_loss": -12.480676651000977, "global_step": 443805, "epoch": 2641} {"train_loss": -12.336723327636719, "global_step": 443806, "epoch": 2641} {"train_loss": -12.464384078979492, "global_step": 443807, "epoch": 2641} {"train_loss": -12.73063850402832, "global_step": 443808, "epoch": 2641} {"train_loss": -12.623536109924316, "global_step": 443809, "epoch": 2641} {"train_loss": -12.721200942993164, "global_step": 443810, "epoch": 2641} {"train_loss": -12.522764205932617, "global_step": 443811, "epoch": 2641} {"train_loss": -12.728109359741211, "global_step": 443812, "epoch": 2641} {"train_loss": -12.80514907836914, "global_step": 443813, "epoch": 2641} {"train_loss": -12.982145309448242, "global_step": 443814, "epoch": 2641} {"train_loss": -12.652408599853516, "global_step": 443815, "epoch": 2641} {"train_loss": -12.674863815307617, "global_step": 443816, "epoch": 2641} {"train_loss": -12.59724235534668, "global_step": 443817, "epoch": 2641} {"train_loss": -12.68228530883789, "global_step": 443818, "epoch": 2641} {"train_loss": -12.59492015838623, "global_step": 443819, "epoch": 2641} {"train_loss": -12.836223602294922, "global_step": 443820, "epoch": 2641} {"train_loss": -12.607840538024902, "global_step": 443821, "epoch": 2641} {"train_loss": -12.819204330444336, "global_step": 443822, "epoch": 2641} {"train_loss": -12.983396530151367, "global_step": 443823, "epoch": 2641} {"train_loss": -12.812402725219727, "global_step": 443824, "epoch": 2641} {"train_loss": -12.901727676391602, "global_step": 443825, "epoch": 2641} {"train_loss": -12.721994400024414, "global_step": 443826, "epoch": 2641} {"train_loss": -12.890419960021973, "global_step": 443827, "epoch": 2641} {"train_loss": -12.520069122314453, "global_step": 443828, "epoch": 2641} {"train_loss": -12.364362716674805, "global_step": 443829, "epoch": 2641} {"train_loss": -12.567033767700195, "global_step": 443830, "epoch": 2641} {"train_loss": -12.498154640197754, "global_step": 443831, "epoch": 2641} {"train_loss": -12.87684154510498, "global_step": 443832, "epoch": 2641} {"train_loss": -12.564920425415039, "global_step": 443833, "epoch": 2641} {"train_loss": -11.942583084106445, "global_step": 443834, "epoch": 2641} {"train_loss": -11.23254108428955, "global_step": 443835, "epoch": 2641} {"train_loss": -12.512100219726562, "global_step": 443836, "epoch": 2641} {"train_loss": -10.614124298095703, "global_step": 443837, "epoch": 2641} {"train_loss": -11.860844612121582, "global_step": 443838, "epoch": 2641} {"train_loss": -11.259206771850586, "global_step": 443839, "epoch": 2641} {"train_loss": -12.580963134765625, "global_step": 443840, "epoch": 2641} {"train_loss": -11.286746978759766, "global_step": 443841, "epoch": 2641} {"train_loss": -12.322080612182617, "global_step": 443842, "epoch": 2641} {"train_loss": -12.127883911132812, "global_step": 443843, "epoch": 2641} {"train_loss": -11.978514671325684, "global_step": 443844, "epoch": 2641} {"train_loss": -10.733475685119629, "global_step": 443845, "epoch": 2641} {"train_loss": -11.104267120361328, "global_step": 443846, "epoch": 2641} {"train_loss": -11.175209045410156, "global_step": 443847, "epoch": 2641} {"train_loss": -11.32780647277832, "global_step": 443848, "epoch": 2641} {"train_loss": -11.293331146240234, "global_step": 443849, "epoch": 2641} {"train_loss": -11.87843132019043, "global_step": 443850, "epoch": 2641} {"train_loss": -12.145099639892578, "global_step": 443851, "epoch": 2641} {"train_loss": -11.525225639343262, "global_step": 443852, "epoch": 2641} {"train_loss": -12.073043823242188, "global_step": 443853, "epoch": 2641} {"train_loss": -12.351057052612305, "global_step": 443854, "epoch": 2641} {"train_loss": -12.228950574284507, "global_step": 443855, "epoch": 2641, "val_loss": 311147.75} {"train_loss": -10.152640342712402, "global_step": 443856, "epoch": 2642} {"train_loss": -12.253942489624023, "global_step": 443857, "epoch": 2642} {"train_loss": -11.221364974975586, "global_step": 443858, "epoch": 2642} {"train_loss": -11.060056686401367, "global_step": 443859, "epoch": 2642} {"train_loss": -12.17656135559082, "global_step": 443860, "epoch": 2642} {"train_loss": -11.002335548400879, "global_step": 443861, "epoch": 2642} {"train_loss": -10.902482986450195, "global_step": 443862, "epoch": 2642} {"train_loss": -11.968600273132324, "global_step": 443863, "epoch": 2642} {"train_loss": -11.557007789611816, "global_step": 443864, "epoch": 2642} {"train_loss": -12.240579605102539, "global_step": 443865, "epoch": 2642} {"train_loss": -11.107521057128906, "global_step": 443866, "epoch": 2642} {"train_loss": -12.087249755859375, "global_step": 443867, "epoch": 2642} {"train_loss": -11.356027603149414, "global_step": 443868, "epoch": 2642} {"train_loss": -11.415953636169434, "global_step": 443869, "epoch": 2642} {"train_loss": -11.786396026611328, "global_step": 443870, "epoch": 2642} {"train_loss": -11.58366584777832, "global_step": 443871, "epoch": 2642} {"train_loss": -12.374256134033203, "global_step": 443872, "epoch": 2642} {"train_loss": -12.163257598876953, "global_step": 443873, "epoch": 2642} {"train_loss": -12.182292938232422, "global_step": 443874, "epoch": 2642} {"train_loss": -12.065018653869629, "global_step": 443875, "epoch": 2642} {"train_loss": -12.193975448608398, "global_step": 443876, "epoch": 2642} {"train_loss": -12.741925239562988, "global_step": 443877, "epoch": 2642} {"train_loss": -12.427492141723633, "global_step": 443878, "epoch": 2642} {"train_loss": -12.670025825500488, "global_step": 443879, "epoch": 2642} {"train_loss": -12.763326644897461, "global_step": 443880, "epoch": 2642} {"train_loss": -12.555181503295898, "global_step": 443881, "epoch": 2642} {"train_loss": -12.494245529174805, "global_step": 443882, "epoch": 2642} {"train_loss": -12.542047500610352, "global_step": 443883, "epoch": 2642} {"train_loss": -12.578968048095703, "global_step": 443884, "epoch": 2642} {"train_loss": -12.761225700378418, "global_step": 443885, "epoch": 2642} {"train_loss": -12.797143936157227, "global_step": 443886, "epoch": 2642} {"train_loss": -12.542623519897461, "global_step": 443887, "epoch": 2642} {"train_loss": -12.627481460571289, "global_step": 443888, "epoch": 2642} {"train_loss": -12.534468650817871, "global_step": 443889, "epoch": 2642} {"train_loss": -12.453239440917969, "global_step": 443890, "epoch": 2642} {"train_loss": -12.435403823852539, "global_step": 443891, "epoch": 2642} {"train_loss": -12.590152740478516, "global_step": 443892, "epoch": 2642} {"train_loss": -12.851932525634766, "global_step": 443893, "epoch": 2642} {"train_loss": -12.608171463012695, "global_step": 443894, "epoch": 2642} {"train_loss": -12.769193649291992, "global_step": 443895, "epoch": 2642} {"train_loss": -12.591694831848145, "global_step": 443896, "epoch": 2642} {"train_loss": -12.662412643432617, "global_step": 443897, "epoch": 2642} {"train_loss": -12.578977584838867, "global_step": 443898, "epoch": 2642} {"train_loss": -12.773151397705078, "global_step": 443899, "epoch": 2642} {"train_loss": -12.834733963012695, "global_step": 443900, "epoch": 2642} {"train_loss": -12.673851013183594, "global_step": 443901, "epoch": 2642} {"train_loss": -12.69971752166748, "global_step": 443902, "epoch": 2642} {"train_loss": -12.929969787597656, "global_step": 443903, "epoch": 2642} {"train_loss": -12.752341270446777, "global_step": 443904, "epoch": 2642} {"train_loss": -12.922998428344727, "global_step": 443905, "epoch": 2642} {"train_loss": -12.531795501708984, "global_step": 443906, "epoch": 2642} {"train_loss": -12.372064590454102, "global_step": 443907, "epoch": 2642} {"train_loss": -12.947222709655762, "global_step": 443908, "epoch": 2642} {"train_loss": -12.980340957641602, "global_step": 443909, "epoch": 2642} {"train_loss": -12.54043960571289, "global_step": 443910, "epoch": 2642} {"train_loss": -12.744548797607422, "global_step": 443911, "epoch": 2642} {"train_loss": -12.671310424804688, "global_step": 443912, "epoch": 2642} {"train_loss": -12.520905494689941, "global_step": 443913, "epoch": 2642} {"train_loss": -13.030409812927246, "global_step": 443914, "epoch": 2642} {"train_loss": -12.681934356689453, "global_step": 443915, "epoch": 2642} {"train_loss": -12.624022483825684, "global_step": 443916, "epoch": 2642} {"train_loss": -12.634916305541992, "global_step": 443917, "epoch": 2642} {"train_loss": -12.591428756713867, "global_step": 443918, "epoch": 2642} {"train_loss": -12.812605857849121, "global_step": 443919, "epoch": 2642} {"train_loss": -12.929449081420898, "global_step": 443920, "epoch": 2642} {"train_loss": -12.692730903625488, "global_step": 443921, "epoch": 2642} {"train_loss": -12.876504898071289, "global_step": 443922, "epoch": 2642} {"train_loss": -12.76852035522461, "global_step": 443923, "epoch": 2642} {"train_loss": -12.615873336791992, "global_step": 443924, "epoch": 2642} {"train_loss": -12.412654876708984, "global_step": 443925, "epoch": 2642} {"train_loss": -12.391286849975586, "global_step": 443926, "epoch": 2642} {"train_loss": -12.216142654418945, "global_step": 443927, "epoch": 2642} {"train_loss": -12.454242706298828, "global_step": 443928, "epoch": 2642} {"train_loss": -12.890296936035156, "global_step": 443929, "epoch": 2642} {"train_loss": -12.260647773742676, "global_step": 443930, "epoch": 2642} {"train_loss": -12.276577949523926, "global_step": 443931, "epoch": 2642} {"train_loss": -12.287849426269531, "global_step": 443932, "epoch": 2642} {"train_loss": -12.707839965820312, "global_step": 443933, "epoch": 2642} {"train_loss": -12.283587455749512, "global_step": 443934, "epoch": 2642} {"train_loss": -11.828012466430664, "global_step": 443935, "epoch": 2642} {"train_loss": -12.646516799926758, "global_step": 443936, "epoch": 2642} {"train_loss": -12.896238327026367, "global_step": 443937, "epoch": 2642} {"train_loss": -12.330808639526367, "global_step": 443938, "epoch": 2642} {"train_loss": -12.467411041259766, "global_step": 443939, "epoch": 2642} {"train_loss": -12.560449600219727, "global_step": 443940, "epoch": 2642} {"train_loss": -12.27509593963623, "global_step": 443941, "epoch": 2642} {"train_loss": -11.783754348754883, "global_step": 443942, "epoch": 2642} {"train_loss": -12.622396469116211, "global_step": 443943, "epoch": 2642} {"train_loss": -12.612401962280273, "global_step": 443944, "epoch": 2642} {"train_loss": -10.631839752197266, "global_step": 443945, "epoch": 2642} {"train_loss": -11.820428848266602, "global_step": 443946, "epoch": 2642} {"train_loss": -12.476366996765137, "global_step": 443947, "epoch": 2642} {"train_loss": -11.422881126403809, "global_step": 443948, "epoch": 2642} {"train_loss": -11.410941123962402, "global_step": 443949, "epoch": 2642} {"train_loss": -12.574197769165039, "global_step": 443950, "epoch": 2642} {"train_loss": -11.226985931396484, "global_step": 443951, "epoch": 2642} {"train_loss": -11.14896297454834, "global_step": 443952, "epoch": 2642} {"train_loss": -13.017465591430664, "global_step": 443953, "epoch": 2642} {"train_loss": -10.999669075012207, "global_step": 443954, "epoch": 2642} {"train_loss": -11.413214683532715, "global_step": 443955, "epoch": 2642} {"train_loss": -12.298934936523438, "global_step": 443956, "epoch": 2642} {"train_loss": -9.530693054199219, "global_step": 443957, "epoch": 2642} {"train_loss": -10.78732681274414, "global_step": 443958, "epoch": 2642} {"train_loss": -9.307647705078125, "global_step": 443959, "epoch": 2642} {"train_loss": -10.461095809936523, "global_step": 443960, "epoch": 2642} {"train_loss": -7.7797346115112305, "global_step": 443961, "epoch": 2642} {"train_loss": -7.907063007354736, "global_step": 443962, "epoch": 2642} {"train_loss": -9.289026260375977, "global_step": 443963, "epoch": 2642} {"train_loss": -8.163137435913086, "global_step": 443964, "epoch": 2642} {"train_loss": -8.78098201751709, "global_step": 443965, "epoch": 2642} {"train_loss": -9.689115524291992, "global_step": 443966, "epoch": 2642} {"train_loss": -10.015872955322266, "global_step": 443967, "epoch": 2642} {"train_loss": -8.364011764526367, "global_step": 443968, "epoch": 2642} {"train_loss": -9.398832321166992, "global_step": 443969, "epoch": 2642} {"train_loss": -9.962646484375, "global_step": 443970, "epoch": 2642} {"train_loss": -10.007394790649414, "global_step": 443971, "epoch": 2642} {"train_loss": -9.328781127929688, "global_step": 443972, "epoch": 2642} {"train_loss": -11.282251358032227, "global_step": 443973, "epoch": 2642} {"train_loss": -9.510477066040039, "global_step": 443974, "epoch": 2642} {"train_loss": -8.21395206451416, "global_step": 443975, "epoch": 2642} {"train_loss": -10.59519100189209, "global_step": 443976, "epoch": 2642} {"train_loss": -9.397336959838867, "global_step": 443977, "epoch": 2642} {"train_loss": -9.275535583496094, "global_step": 443978, "epoch": 2642} {"train_loss": -11.288570404052734, "global_step": 443979, "epoch": 2642} {"train_loss": -10.634511947631836, "global_step": 443980, "epoch": 2642} {"train_loss": -10.51683235168457, "global_step": 443981, "epoch": 2642} {"train_loss": -11.401108741760254, "global_step": 443982, "epoch": 2642} {"train_loss": -10.083528518676758, "global_step": 443983, "epoch": 2642} {"train_loss": -10.179716110229492, "global_step": 443984, "epoch": 2642} {"train_loss": -10.990899085998535, "global_step": 443985, "epoch": 2642} {"train_loss": -11.700451850891113, "global_step": 443986, "epoch": 2642} {"train_loss": -10.3539400100708, "global_step": 443987, "epoch": 2642} {"train_loss": -11.923676490783691, "global_step": 443988, "epoch": 2642} {"train_loss": -11.000810623168945, "global_step": 443989, "epoch": 2642} {"train_loss": -11.67123794555664, "global_step": 443990, "epoch": 2642} {"train_loss": -11.00456428527832, "global_step": 443991, "epoch": 2642} {"train_loss": -11.225580215454102, "global_step": 443992, "epoch": 2642} {"train_loss": -11.038541793823242, "global_step": 443993, "epoch": 2642} {"train_loss": -11.86004638671875, "global_step": 443994, "epoch": 2642} {"train_loss": -11.32604694366455, "global_step": 443995, "epoch": 2642} {"train_loss": -11.780908584594727, "global_step": 443996, "epoch": 2642} {"train_loss": -11.525518417358398, "global_step": 443997, "epoch": 2642} {"train_loss": -11.667566299438477, "global_step": 443998, "epoch": 2642} {"train_loss": -11.51743221282959, "global_step": 443999, "epoch": 2642} {"train_loss": -11.559640884399414, "global_step": 444000, "epoch": 2642} {"train_loss": -11.797307968139648, "global_step": 444001, "epoch": 2642} {"train_loss": -12.241357803344727, "global_step": 444002, "epoch": 2642} {"train_loss": -12.049201965332031, "global_step": 444003, "epoch": 2642} {"train_loss": -12.037344932556152, "global_step": 444004, "epoch": 2642} {"train_loss": -12.20779800415039, "global_step": 444005, "epoch": 2642} {"train_loss": -12.022336959838867, "global_step": 444006, "epoch": 2642} {"train_loss": -12.048606872558594, "global_step": 444007, "epoch": 2642} {"train_loss": -12.145855903625488, "global_step": 444008, "epoch": 2642} {"train_loss": -11.968295097351074, "global_step": 444009, "epoch": 2642} {"train_loss": -12.144140243530273, "global_step": 444010, "epoch": 2642} {"train_loss": -11.717690467834473, "global_step": 444011, "epoch": 2642} {"train_loss": -12.213809967041016, "global_step": 444012, "epoch": 2642} {"train_loss": -11.915807723999023, "global_step": 444013, "epoch": 2642} {"train_loss": -12.065640449523926, "global_step": 444014, "epoch": 2642} {"train_loss": -12.360519409179688, "global_step": 444015, "epoch": 2642} {"train_loss": -12.035487174987793, "global_step": 444016, "epoch": 2642} {"train_loss": -12.625977516174316, "global_step": 444017, "epoch": 2642} {"train_loss": -12.410364151000977, "global_step": 444018, "epoch": 2642} {"train_loss": -12.128908157348633, "global_step": 444019, "epoch": 2642} {"train_loss": -12.294644355773926, "global_step": 444020, "epoch": 2642} {"train_loss": -12.445959091186523, "global_step": 444021, "epoch": 2642} {"train_loss": -12.515615463256836, "global_step": 444022, "epoch": 2642} {"train_loss": -11.755762023585183, "global_step": 444023, "epoch": 2642, "val_loss": 312425.9375} {"train_loss": -12.524760246276855, "global_step": 444024, "epoch": 2643} {"train_loss": -12.40233039855957, "global_step": 444025, "epoch": 2643} {"train_loss": -12.535587310791016, "global_step": 444026, "epoch": 2643} {"train_loss": -12.388618469238281, "global_step": 444027, "epoch": 2643} {"train_loss": -12.224830627441406, "global_step": 444028, "epoch": 2643} {"train_loss": -12.703407287597656, "global_step": 444029, "epoch": 2643} {"train_loss": -12.20751667022705, "global_step": 444030, "epoch": 2643} {"train_loss": -12.407149314880371, "global_step": 444031, "epoch": 2643} {"train_loss": -12.0282621383667, "global_step": 444032, "epoch": 2643} {"train_loss": -12.368280410766602, "global_step": 444033, "epoch": 2643} {"train_loss": -12.360788345336914, "global_step": 444034, "epoch": 2643} {"train_loss": -12.259723663330078, "global_step": 444035, "epoch": 2643} {"train_loss": -12.237154960632324, "global_step": 444036, "epoch": 2643} {"train_loss": -12.4817533493042, "global_step": 444037, "epoch": 2643} {"train_loss": -12.366903305053711, "global_step": 444038, "epoch": 2643} {"train_loss": -12.581701278686523, "global_step": 444039, "epoch": 2643} {"train_loss": -12.325214385986328, "global_step": 444040, "epoch": 2643} {"train_loss": -12.747217178344727, "global_step": 444041, "epoch": 2643} {"train_loss": -12.35869026184082, "global_step": 444042, "epoch": 2643} {"train_loss": -12.84659481048584, "global_step": 444043, "epoch": 2643} {"train_loss": -12.553953170776367, "global_step": 444044, "epoch": 2643} {"train_loss": -12.514331817626953, "global_step": 444045, "epoch": 2643} {"train_loss": -12.63990592956543, "global_step": 444046, "epoch": 2643} {"train_loss": -12.660505294799805, "global_step": 444047, "epoch": 2643} {"train_loss": -12.640127182006836, "global_step": 444048, "epoch": 2643} {"train_loss": -12.285266876220703, "global_step": 444049, "epoch": 2643} {"train_loss": -12.717117309570312, "global_step": 444050, "epoch": 2643} {"train_loss": -12.459016799926758, "global_step": 444051, "epoch": 2643} {"train_loss": -12.578556060791016, "global_step": 444052, "epoch": 2643} {"train_loss": -12.590291023254395, "global_step": 444053, "epoch": 2643} {"train_loss": -12.625102996826172, "global_step": 444054, "epoch": 2643} {"train_loss": -12.702510833740234, "global_step": 444055, "epoch": 2643} {"train_loss": -12.656339645385742, "global_step": 444056, "epoch": 2643} {"train_loss": -12.705682754516602, "global_step": 444057, "epoch": 2643} {"train_loss": -12.750919342041016, "global_step": 444058, "epoch": 2643} {"train_loss": -12.658330917358398, "global_step": 444059, "epoch": 2643} {"train_loss": -12.783987045288086, "global_step": 444060, "epoch": 2643} {"train_loss": -12.740720748901367, "global_step": 444061, "epoch": 2643} {"train_loss": -12.85401725769043, "global_step": 444062, "epoch": 2643} {"train_loss": -12.787945747375488, "global_step": 444063, "epoch": 2643} {"train_loss": -12.57406234741211, "global_step": 444064, "epoch": 2643} {"train_loss": -12.794124603271484, "global_step": 444065, "epoch": 2643} {"train_loss": -12.819307327270508, "global_step": 444066, "epoch": 2643} {"train_loss": -12.725275039672852, "global_step": 444067, "epoch": 2643} {"train_loss": -12.600666046142578, "global_step": 444068, "epoch": 2643} {"train_loss": -12.754678726196289, "global_step": 444069, "epoch": 2643} {"train_loss": -12.75335693359375, "global_step": 444070, "epoch": 2643} {"train_loss": -12.777029037475586, "global_step": 444071, "epoch": 2643} {"train_loss": -12.820819854736328, "global_step": 444072, "epoch": 2643} {"train_loss": -13.000553131103516, "global_step": 444073, "epoch": 2643} {"train_loss": -12.712981224060059, "global_step": 444074, "epoch": 2643} {"train_loss": -12.83842658996582, "global_step": 444075, "epoch": 2643} {"train_loss": -12.844554901123047, "global_step": 444076, "epoch": 2643} {"train_loss": -12.473541259765625, "global_step": 444077, "epoch": 2643} {"train_loss": -12.718091011047363, "global_step": 444078, "epoch": 2643} {"train_loss": -12.489267349243164, "global_step": 444079, "epoch": 2643} {"train_loss": -12.424077987670898, "global_step": 444080, "epoch": 2643} {"train_loss": -12.637850761413574, "global_step": 444081, "epoch": 2643} {"train_loss": -12.283807754516602, "global_step": 444082, "epoch": 2643} {"train_loss": -12.786090850830078, "global_step": 444083, "epoch": 2643} {"train_loss": -12.385038375854492, "global_step": 444084, "epoch": 2643} {"train_loss": -12.632498741149902, "global_step": 444085, "epoch": 2643} {"train_loss": -12.78934383392334, "global_step": 444086, "epoch": 2643} {"train_loss": -12.588529586791992, "global_step": 444087, "epoch": 2643} {"train_loss": -12.689104080200195, "global_step": 444088, "epoch": 2643} {"train_loss": -12.752822875976562, "global_step": 444089, "epoch": 2643} {"train_loss": -12.786726951599121, "global_step": 444090, "epoch": 2643} {"train_loss": -12.668233871459961, "global_step": 444091, "epoch": 2643} {"train_loss": -12.688447952270508, "global_step": 444092, "epoch": 2643} {"train_loss": -12.857635498046875, "global_step": 444093, "epoch": 2643} {"train_loss": -12.711337089538574, "global_step": 444094, "epoch": 2643} {"train_loss": -12.768874168395996, "global_step": 444095, "epoch": 2643} {"train_loss": -12.514656066894531, "global_step": 444096, "epoch": 2643} {"train_loss": -12.831249237060547, "global_step": 444097, "epoch": 2643} {"train_loss": -12.887897491455078, "global_step": 444098, "epoch": 2643} {"train_loss": -12.294511795043945, "global_step": 444099, "epoch": 2643} {"train_loss": -12.607133865356445, "global_step": 444100, "epoch": 2643} {"train_loss": -12.719327926635742, "global_step": 444101, "epoch": 2643} {"train_loss": -12.782779693603516, "global_step": 444102, "epoch": 2643} {"train_loss": -12.386056900024414, "global_step": 444103, "epoch": 2643} {"train_loss": -12.790688514709473, "global_step": 444104, "epoch": 2643} {"train_loss": -12.622076988220215, "global_step": 444105, "epoch": 2643} {"train_loss": -12.936261177062988, "global_step": 444106, "epoch": 2643} {"train_loss": -12.683297157287598, "global_step": 444107, "epoch": 2643} {"train_loss": -12.85042667388916, "global_step": 444108, "epoch": 2643} {"train_loss": -12.84910774230957, "global_step": 444109, "epoch": 2643} {"train_loss": -12.336795806884766, "global_step": 444110, "epoch": 2643} {"train_loss": -12.732208251953125, "global_step": 444111, "epoch": 2643} {"train_loss": -12.4623384475708, "global_step": 444112, "epoch": 2643} {"train_loss": -12.624506950378418, "global_step": 444113, "epoch": 2643} {"train_loss": -12.184602737426758, "global_step": 444114, "epoch": 2643} {"train_loss": -12.516599655151367, "global_step": 444115, "epoch": 2643} {"train_loss": -12.764083862304688, "global_step": 444116, "epoch": 2643} {"train_loss": -12.468950271606445, "global_step": 444117, "epoch": 2643} {"train_loss": -12.62745475769043, "global_step": 444118, "epoch": 2643} {"train_loss": -12.717592239379883, "global_step": 444119, "epoch": 2643} {"train_loss": -12.316068649291992, "global_step": 444120, "epoch": 2643} {"train_loss": -12.409536361694336, "global_step": 444121, "epoch": 2643} {"train_loss": -12.499380111694336, "global_step": 444122, "epoch": 2643} {"train_loss": -12.442749977111816, "global_step": 444123, "epoch": 2643} {"train_loss": -12.51272964477539, "global_step": 444124, "epoch": 2643} {"train_loss": -12.770439147949219, "global_step": 444125, "epoch": 2643} {"train_loss": -12.148776054382324, "global_step": 444126, "epoch": 2643} {"train_loss": -11.885873794555664, "global_step": 444127, "epoch": 2643} {"train_loss": -12.155540466308594, "global_step": 444128, "epoch": 2643} {"train_loss": -12.570296287536621, "global_step": 444129, "epoch": 2643} {"train_loss": -11.408487319946289, "global_step": 444130, "epoch": 2643} {"train_loss": -11.767318725585938, "global_step": 444131, "epoch": 2643} {"train_loss": -12.273200035095215, "global_step": 444132, "epoch": 2643} {"train_loss": -11.795036315917969, "global_step": 444133, "epoch": 2643} {"train_loss": -11.101750373840332, "global_step": 444134, "epoch": 2643} {"train_loss": -11.883054733276367, "global_step": 444135, "epoch": 2643} {"train_loss": -12.302939414978027, "global_step": 444136, "epoch": 2643} {"train_loss": -12.568264961242676, "global_step": 444137, "epoch": 2643} {"train_loss": -11.380743980407715, "global_step": 444138, "epoch": 2643} {"train_loss": -12.47632122039795, "global_step": 444139, "epoch": 2643} {"train_loss": -12.304798126220703, "global_step": 444140, "epoch": 2643} {"train_loss": -12.211662292480469, "global_step": 444141, "epoch": 2643} {"train_loss": -11.42965030670166, "global_step": 444142, "epoch": 2643} {"train_loss": -12.291523933410645, "global_step": 444143, "epoch": 2643} {"train_loss": -10.678529739379883, "global_step": 444144, "epoch": 2643} {"train_loss": -12.074012756347656, "global_step": 444145, "epoch": 2643} {"train_loss": -12.23072624206543, "global_step": 444146, "epoch": 2643} {"train_loss": -11.515146255493164, "global_step": 444147, "epoch": 2643} {"train_loss": -12.014425277709961, "global_step": 444148, "epoch": 2643} {"train_loss": -11.439013481140137, "global_step": 444149, "epoch": 2643} {"train_loss": -11.670011520385742, "global_step": 444150, "epoch": 2643} {"train_loss": -11.863306045532227, "global_step": 444151, "epoch": 2643} {"train_loss": -11.325030326843262, "global_step": 444152, "epoch": 2643} {"train_loss": -11.576461791992188, "global_step": 444153, "epoch": 2643} {"train_loss": -11.090668678283691, "global_step": 444154, "epoch": 2643} {"train_loss": -11.863364219665527, "global_step": 444155, "epoch": 2643} {"train_loss": -9.564826965332031, "global_step": 444156, "epoch": 2643} {"train_loss": -8.845640182495117, "global_step": 444157, "epoch": 2643} {"train_loss": -8.899925231933594, "global_step": 444158, "epoch": 2643} {"train_loss": -9.367687225341797, "global_step": 444159, "epoch": 2643} {"train_loss": -9.939181327819824, "global_step": 444160, "epoch": 2643} {"train_loss": -10.608596801757812, "global_step": 444161, "epoch": 2643} {"train_loss": -9.981826782226562, "global_step": 444162, "epoch": 2643} {"train_loss": -10.164690017700195, "global_step": 444163, "epoch": 2643} {"train_loss": -9.997125625610352, "global_step": 444164, "epoch": 2643} {"train_loss": -11.482087135314941, "global_step": 444165, "epoch": 2643} {"train_loss": -10.929986000061035, "global_step": 444166, "epoch": 2643} {"train_loss": -10.595065116882324, "global_step": 444167, "epoch": 2643} {"train_loss": -11.613256454467773, "global_step": 444168, "epoch": 2643} {"train_loss": -11.296194076538086, "global_step": 444169, "epoch": 2643} {"train_loss": -11.837906837463379, "global_step": 444170, "epoch": 2643} {"train_loss": -11.00271224975586, "global_step": 444171, "epoch": 2643} {"train_loss": -11.2157564163208, "global_step": 444172, "epoch": 2643} {"train_loss": -11.93688678741455, "global_step": 444173, "epoch": 2643} {"train_loss": -11.109639167785645, "global_step": 444174, "epoch": 2643} {"train_loss": -11.763450622558594, "global_step": 444175, "epoch": 2643} {"train_loss": -11.388880729675293, "global_step": 444176, "epoch": 2643} {"train_loss": -11.663446426391602, "global_step": 444177, "epoch": 2643} {"train_loss": -11.774764060974121, "global_step": 444178, "epoch": 2643} {"train_loss": -11.26365852355957, "global_step": 444179, "epoch": 2643} {"train_loss": -11.839707374572754, "global_step": 444180, "epoch": 2643} {"train_loss": -10.715539932250977, "global_step": 444181, "epoch": 2643} {"train_loss": -12.143890380859375, "global_step": 444182, "epoch": 2643} {"train_loss": -11.044848442077637, "global_step": 444183, "epoch": 2643} {"train_loss": -11.68853759765625, "global_step": 444184, "epoch": 2643} {"train_loss": -11.236852645874023, "global_step": 444185, "epoch": 2643} {"train_loss": -11.748733520507812, "global_step": 444186, "epoch": 2643} {"train_loss": -11.645645141601562, "global_step": 444187, "epoch": 2643} {"train_loss": -11.880440711975098, "global_step": 444188, "epoch": 2643} {"train_loss": -11.950849533081055, "global_step": 444189, "epoch": 2643} {"train_loss": -11.438621520996094, "global_step": 444190, "epoch": 2643} {"train_loss": -12.135811005319868, "global_step": 444191, "epoch": 2643, "val_loss": 310325.96875} {"train_loss": -10.311635971069336, "global_step": 444192, "epoch": 2644} {"train_loss": -11.564087867736816, "global_step": 444193, "epoch": 2644} {"train_loss": -11.189918518066406, "global_step": 444194, "epoch": 2644} {"train_loss": -11.642521858215332, "global_step": 444195, "epoch": 2644} {"train_loss": -12.10226821899414, "global_step": 444196, "epoch": 2644} {"train_loss": -11.692063331604004, "global_step": 444197, "epoch": 2644} {"train_loss": -12.034420013427734, "global_step": 444198, "epoch": 2644} {"train_loss": -11.975090026855469, "global_step": 444199, "epoch": 2644} {"train_loss": -12.140710830688477, "global_step": 444200, "epoch": 2644} {"train_loss": -12.194063186645508, "global_step": 444201, "epoch": 2644} {"train_loss": -12.244918823242188, "global_step": 444202, "epoch": 2644} {"train_loss": -12.482192993164062, "global_step": 444203, "epoch": 2644} {"train_loss": -12.118782043457031, "global_step": 444204, "epoch": 2644} {"train_loss": -12.180721282958984, "global_step": 444205, "epoch": 2644} {"train_loss": -11.725898742675781, "global_step": 444206, "epoch": 2644} {"train_loss": -12.396316528320312, "global_step": 444207, "epoch": 2644} {"train_loss": -12.076544761657715, "global_step": 444208, "epoch": 2644} {"train_loss": -12.58118724822998, "global_step": 444209, "epoch": 2644} {"train_loss": -12.207674026489258, "global_step": 444210, "epoch": 2644} {"train_loss": -12.297514915466309, "global_step": 444211, "epoch": 2644} {"train_loss": -12.419814109802246, "global_step": 444212, "epoch": 2644} {"train_loss": -12.201543807983398, "global_step": 444213, "epoch": 2644} {"train_loss": -12.443584442138672, "global_step": 444214, "epoch": 2644} {"train_loss": -12.283956527709961, "global_step": 444215, "epoch": 2644} {"train_loss": -12.490148544311523, "global_step": 444216, "epoch": 2644} {"train_loss": -12.410148620605469, "global_step": 444217, "epoch": 2644} {"train_loss": -12.272109985351562, "global_step": 444218, "epoch": 2644} {"train_loss": -12.49496078491211, "global_step": 444219, "epoch": 2644} {"train_loss": -12.611331939697266, "global_step": 444220, "epoch": 2644} {"train_loss": -12.493938446044922, "global_step": 444221, "epoch": 2644} {"train_loss": -12.523847579956055, "global_step": 444222, "epoch": 2644} {"train_loss": -12.577766418457031, "global_step": 444223, "epoch": 2644} {"train_loss": -12.779598236083984, "global_step": 444224, "epoch": 2644} {"train_loss": -12.319241523742676, "global_step": 444225, "epoch": 2644} {"train_loss": -12.481836318969727, "global_step": 444226, "epoch": 2644} {"train_loss": -12.429887771606445, "global_step": 444227, "epoch": 2644} {"train_loss": -12.499876022338867, "global_step": 444228, "epoch": 2644} {"train_loss": -12.736425399780273, "global_step": 444229, "epoch": 2644} {"train_loss": -12.63758659362793, "global_step": 444230, "epoch": 2644} {"train_loss": -12.880834579467773, "global_step": 444231, "epoch": 2644} {"train_loss": -12.76776123046875, "global_step": 444232, "epoch": 2644} {"train_loss": -12.716808319091797, "global_step": 444233, "epoch": 2644} {"train_loss": -12.634801864624023, "global_step": 444234, "epoch": 2644} {"train_loss": -12.6990966796875, "global_step": 444235, "epoch": 2644} {"train_loss": -12.871438026428223, "global_step": 444236, "epoch": 2644} {"train_loss": -12.55836009979248, "global_step": 444237, "epoch": 2644} {"train_loss": -12.880473136901855, "global_step": 444238, "epoch": 2644} {"train_loss": -12.769472122192383, "global_step": 444239, "epoch": 2644} {"train_loss": -12.345112800598145, "global_step": 444240, "epoch": 2644} {"train_loss": -12.792951583862305, "global_step": 444241, "epoch": 2644} {"train_loss": -12.486040115356445, "global_step": 444242, "epoch": 2644} {"train_loss": -12.652311325073242, "global_step": 444243, "epoch": 2644} {"train_loss": -12.59487533569336, "global_step": 444244, "epoch": 2644} {"train_loss": -12.915997505187988, "global_step": 444245, "epoch": 2644} {"train_loss": -12.603372573852539, "global_step": 444246, "epoch": 2644} {"train_loss": -12.626513481140137, "global_step": 444247, "epoch": 2644} {"train_loss": -12.847433090209961, "global_step": 444248, "epoch": 2644} {"train_loss": -12.500931739807129, "global_step": 444249, "epoch": 2644} {"train_loss": -12.787606239318848, "global_step": 444250, "epoch": 2644} {"train_loss": -12.662466049194336, "global_step": 444251, "epoch": 2644} {"train_loss": -12.63099479675293, "global_step": 444252, "epoch": 2644} {"train_loss": -12.859132766723633, "global_step": 444253, "epoch": 2644} {"train_loss": -12.6373872756958, "global_step": 444254, "epoch": 2644} {"train_loss": -12.481800079345703, "global_step": 444255, "epoch": 2644} {"train_loss": -12.68978500366211, "global_step": 444256, "epoch": 2644} {"train_loss": -12.80104923248291, "global_step": 444257, "epoch": 2644} {"train_loss": -12.504501342773438, "global_step": 444258, "epoch": 2644} {"train_loss": -12.843789100646973, "global_step": 444259, "epoch": 2644} {"train_loss": -12.496131896972656, "global_step": 444260, "epoch": 2644} {"train_loss": -12.65165901184082, "global_step": 444261, "epoch": 2644} {"train_loss": -12.850576400756836, "global_step": 444262, "epoch": 2644} {"train_loss": -12.820722579956055, "global_step": 444263, "epoch": 2644} {"train_loss": -12.616836547851562, "global_step": 444264, "epoch": 2644} {"train_loss": -12.253201484680176, "global_step": 444265, "epoch": 2644} {"train_loss": -12.46418285369873, "global_step": 444266, "epoch": 2644} {"train_loss": -12.653305053710938, "global_step": 444267, "epoch": 2644} {"train_loss": -12.738664627075195, "global_step": 444268, "epoch": 2644} {"train_loss": -12.723445892333984, "global_step": 444269, "epoch": 2644} {"train_loss": -12.863252639770508, "global_step": 444270, "epoch": 2644} {"train_loss": -12.743602752685547, "global_step": 444271, "epoch": 2644} {"train_loss": -12.494214057922363, "global_step": 444272, "epoch": 2644} {"train_loss": -12.805455207824707, "global_step": 444273, "epoch": 2644} {"train_loss": -12.702945709228516, "global_step": 444274, "epoch": 2644} {"train_loss": -12.758983612060547, "global_step": 444275, "epoch": 2644} {"train_loss": -12.42848014831543, "global_step": 444276, "epoch": 2644} {"train_loss": -12.407831192016602, "global_step": 444277, "epoch": 2644} {"train_loss": -12.361550331115723, "global_step": 444278, "epoch": 2644} {"train_loss": -12.74856185913086, "global_step": 444279, "epoch": 2644} {"train_loss": -12.520370483398438, "global_step": 444280, "epoch": 2644} {"train_loss": -12.427129745483398, "global_step": 444281, "epoch": 2644} {"train_loss": -12.263883590698242, "global_step": 444282, "epoch": 2644} {"train_loss": -12.749688148498535, "global_step": 444283, "epoch": 2644} {"train_loss": -12.474241256713867, "global_step": 444284, "epoch": 2644} {"train_loss": -12.398452758789062, "global_step": 444285, "epoch": 2644} {"train_loss": -11.772087097167969, "global_step": 444286, "epoch": 2644} {"train_loss": -12.226208686828613, "global_step": 444287, "epoch": 2644} {"train_loss": -12.58318042755127, "global_step": 444288, "epoch": 2644} {"train_loss": -12.155525207519531, "global_step": 444289, "epoch": 2644} {"train_loss": -12.678092956542969, "global_step": 444290, "epoch": 2644} {"train_loss": -12.694999694824219, "global_step": 444291, "epoch": 2644} {"train_loss": -12.29698371887207, "global_step": 444292, "epoch": 2644} {"train_loss": -12.825164794921875, "global_step": 444293, "epoch": 2644} {"train_loss": -12.1043119430542, "global_step": 444294, "epoch": 2644} {"train_loss": -12.697649002075195, "global_step": 444295, "epoch": 2644} {"train_loss": -11.888063430786133, "global_step": 444296, "epoch": 2644} {"train_loss": -12.114810943603516, "global_step": 444297, "epoch": 2644} {"train_loss": -11.460301399230957, "global_step": 444298, "epoch": 2644} {"train_loss": -12.287179946899414, "global_step": 444299, "epoch": 2644} {"train_loss": -11.53198528289795, "global_step": 444300, "epoch": 2644} {"train_loss": -11.992973327636719, "global_step": 444301, "epoch": 2644} {"train_loss": -11.723993301391602, "global_step": 444302, "epoch": 2644} {"train_loss": -11.327788352966309, "global_step": 444303, "epoch": 2644} {"train_loss": -11.26875114440918, "global_step": 444304, "epoch": 2644} {"train_loss": -11.85574722290039, "global_step": 444305, "epoch": 2644} {"train_loss": -11.415257453918457, "global_step": 444306, "epoch": 2644} {"train_loss": -11.611322402954102, "global_step": 444307, "epoch": 2644} {"train_loss": -11.92845344543457, "global_step": 444308, "epoch": 2644} {"train_loss": -11.452986717224121, "global_step": 444309, "epoch": 2644} {"train_loss": -11.588726043701172, "global_step": 444310, "epoch": 2644} {"train_loss": -11.288297653198242, "global_step": 444311, "epoch": 2644} {"train_loss": -11.804862976074219, "global_step": 444312, "epoch": 2644} {"train_loss": -11.210712432861328, "global_step": 444313, "epoch": 2644} {"train_loss": -10.584274291992188, "global_step": 444314, "epoch": 2644} {"train_loss": -10.931163787841797, "global_step": 444315, "epoch": 2644} {"train_loss": -11.526326179504395, "global_step": 444316, "epoch": 2644} {"train_loss": -11.541146278381348, "global_step": 444317, "epoch": 2644} {"train_loss": -11.271510124206543, "global_step": 444318, "epoch": 2644} {"train_loss": -11.396902084350586, "global_step": 444319, "epoch": 2644} {"train_loss": -11.267513275146484, "global_step": 444320, "epoch": 2644} {"train_loss": -10.826651573181152, "global_step": 444321, "epoch": 2644} {"train_loss": -10.39819622039795, "global_step": 444322, "epoch": 2644} {"train_loss": -11.4390287399292, "global_step": 444323, "epoch": 2644} {"train_loss": -11.629127502441406, "global_step": 444324, "epoch": 2644} {"train_loss": -11.273004531860352, "global_step": 444325, "epoch": 2644} {"train_loss": -11.586036682128906, "global_step": 444326, "epoch": 2644} {"train_loss": -11.53760051727295, "global_step": 444327, "epoch": 2644} {"train_loss": -11.46400260925293, "global_step": 444328, "epoch": 2644} {"train_loss": -12.043612480163574, "global_step": 444329, "epoch": 2644} {"train_loss": -11.554326057434082, "global_step": 444330, "epoch": 2644} {"train_loss": -11.874881744384766, "global_step": 444331, "epoch": 2644} {"train_loss": -11.855717658996582, "global_step": 444332, "epoch": 2644} {"train_loss": -12.116650581359863, "global_step": 444333, "epoch": 2644} {"train_loss": -11.856815338134766, "global_step": 444334, "epoch": 2644} {"train_loss": -12.080926895141602, "global_step": 444335, "epoch": 2644} {"train_loss": -11.954622268676758, "global_step": 444336, "epoch": 2644} {"train_loss": -12.099960327148438, "global_step": 444337, "epoch": 2644} {"train_loss": -12.343250274658203, "global_step": 444338, "epoch": 2644} {"train_loss": -11.961105346679688, "global_step": 444339, "epoch": 2644} {"train_loss": -12.332132339477539, "global_step": 444340, "epoch": 2644} {"train_loss": -11.909039497375488, "global_step": 444341, "epoch": 2644} {"train_loss": -12.064301490783691, "global_step": 444342, "epoch": 2644} {"train_loss": -12.240816116333008, "global_step": 444343, "epoch": 2644} {"train_loss": -11.57708740234375, "global_step": 444344, "epoch": 2644} {"train_loss": -12.713251113891602, "global_step": 444345, "epoch": 2644} {"train_loss": -11.8077974319458, "global_step": 444346, "epoch": 2644} {"train_loss": -12.260741233825684, "global_step": 444347, "epoch": 2644} {"train_loss": -11.999979019165039, "global_step": 444348, "epoch": 2644} {"train_loss": -12.153519630432129, "global_step": 444349, "epoch": 2644} {"train_loss": -12.644527435302734, "global_step": 444350, "epoch": 2644} {"train_loss": -12.060142517089844, "global_step": 444351, "epoch": 2644} {"train_loss": -12.300762176513672, "global_step": 444352, "epoch": 2644} {"train_loss": -12.117231369018555, "global_step": 444353, "epoch": 2644} {"train_loss": -12.183167457580566, "global_step": 444354, "epoch": 2644} {"train_loss": -12.395435333251953, "global_step": 444355, "epoch": 2644} {"train_loss": -12.409685134887695, "global_step": 444356, "epoch": 2644} {"train_loss": -12.505620956420898, "global_step": 444357, "epoch": 2644} {"train_loss": -12.416790008544922, "global_step": 444358, "epoch": 2644} {"train_loss": -12.20382779552823, "global_step": 444359, "epoch": 2644, "val_loss": 312996.125} {"train_loss": -12.495092391967773, "global_step": 444360, "epoch": 2645} {"train_loss": -12.11898136138916, "global_step": 444361, "epoch": 2645} {"train_loss": -12.449041366577148, "global_step": 444362, "epoch": 2645} {"train_loss": -12.517372131347656, "global_step": 444363, "epoch": 2645} {"train_loss": -12.47455883026123, "global_step": 444364, "epoch": 2645} {"train_loss": -12.538593292236328, "global_step": 444365, "epoch": 2645} {"train_loss": -12.438518524169922, "global_step": 444366, "epoch": 2645} {"train_loss": -12.696589469909668, "global_step": 444367, "epoch": 2645} {"train_loss": -12.432940483093262, "global_step": 444368, "epoch": 2645} {"train_loss": -12.490416526794434, "global_step": 444369, "epoch": 2645} {"train_loss": -12.115530014038086, "global_step": 444370, "epoch": 2645} {"train_loss": -12.471549034118652, "global_step": 444371, "epoch": 2645} {"train_loss": -12.684213638305664, "global_step": 444372, "epoch": 2645} {"train_loss": -12.478853225708008, "global_step": 444373, "epoch": 2645} {"train_loss": -12.401937484741211, "global_step": 444374, "epoch": 2645} {"train_loss": -12.587736129760742, "global_step": 444375, "epoch": 2645} {"train_loss": -12.437742233276367, "global_step": 444376, "epoch": 2645} {"train_loss": -12.767206192016602, "global_step": 444377, "epoch": 2645} {"train_loss": -12.32422924041748, "global_step": 444378, "epoch": 2645} {"train_loss": -12.593055725097656, "global_step": 444379, "epoch": 2645} {"train_loss": -12.302970886230469, "global_step": 444380, "epoch": 2645} {"train_loss": -12.816553115844727, "global_step": 444381, "epoch": 2645} {"train_loss": -12.550094604492188, "global_step": 444382, "epoch": 2645} {"train_loss": -12.724174499511719, "global_step": 444383, "epoch": 2645} {"train_loss": -12.427419662475586, "global_step": 444384, "epoch": 2645} {"train_loss": -12.779899597167969, "global_step": 444385, "epoch": 2645} {"train_loss": -12.744979858398438, "global_step": 444386, "epoch": 2645} {"train_loss": -12.730192184448242, "global_step": 444387, "epoch": 2645} {"train_loss": -12.783975601196289, "global_step": 444388, "epoch": 2645} {"train_loss": -12.64034652709961, "global_step": 444389, "epoch": 2645} {"train_loss": -12.75644302368164, "global_step": 444390, "epoch": 2645} {"train_loss": -12.673663139343262, "global_step": 444391, "epoch": 2645} {"train_loss": -12.312326431274414, "global_step": 444392, "epoch": 2645} {"train_loss": -12.848103523254395, "global_step": 444393, "epoch": 2645} {"train_loss": -12.391975402832031, "global_step": 444394, "epoch": 2645} {"train_loss": -12.619041442871094, "global_step": 444395, "epoch": 2645} {"train_loss": -12.532922744750977, "global_step": 444396, "epoch": 2645} {"train_loss": -12.833234786987305, "global_step": 444397, "epoch": 2645} {"train_loss": -12.566267013549805, "global_step": 444398, "epoch": 2645} {"train_loss": -12.912344932556152, "global_step": 444399, "epoch": 2645} {"train_loss": -12.640475273132324, "global_step": 444400, "epoch": 2645} {"train_loss": -12.887813568115234, "global_step": 444401, "epoch": 2645} {"train_loss": -12.39710521697998, "global_step": 444402, "epoch": 2645} {"train_loss": -12.680957794189453, "global_step": 444403, "epoch": 2645} {"train_loss": -12.462263107299805, "global_step": 444404, "epoch": 2645} {"train_loss": -12.878560066223145, "global_step": 444405, "epoch": 2645} {"train_loss": -12.766189575195312, "global_step": 444406, "epoch": 2645} {"train_loss": -12.560094833374023, "global_step": 444407, "epoch": 2645} {"train_loss": -11.948333740234375, "global_step": 444408, "epoch": 2645} {"train_loss": -11.64161491394043, "global_step": 444409, "epoch": 2645} {"train_loss": -12.450902938842773, "global_step": 444410, "epoch": 2645} {"train_loss": -11.512941360473633, "global_step": 444411, "epoch": 2645} {"train_loss": -10.553573608398438, "global_step": 444412, "epoch": 2645} {"train_loss": -10.012351036071777, "global_step": 444413, "epoch": 2645} {"train_loss": -11.433350563049316, "global_step": 444414, "epoch": 2645} {"train_loss": -9.10976505279541, "global_step": 444415, "epoch": 2645} {"train_loss": -8.99704360961914, "global_step": 444416, "epoch": 2645} {"train_loss": -10.78689193725586, "global_step": 444417, "epoch": 2645} {"train_loss": -11.086893081665039, "global_step": 444418, "epoch": 2645} {"train_loss": -9.25942611694336, "global_step": 444419, "epoch": 2645} {"train_loss": -10.654289245605469, "global_step": 444420, "epoch": 2645} {"train_loss": -10.475554466247559, "global_step": 444421, "epoch": 2645} {"train_loss": -10.937206268310547, "global_step": 444422, "epoch": 2645} {"train_loss": -11.68514633178711, "global_step": 444423, "epoch": 2645} {"train_loss": -12.103187561035156, "global_step": 444424, "epoch": 2645} {"train_loss": -11.80112361907959, "global_step": 444425, "epoch": 2645} {"train_loss": -12.004803657531738, "global_step": 444426, "epoch": 2645} {"train_loss": -12.243143081665039, "global_step": 444427, "epoch": 2645} {"train_loss": -12.067279815673828, "global_step": 444428, "epoch": 2645} {"train_loss": -11.973756790161133, "global_step": 444429, "epoch": 2645} {"train_loss": -12.343830108642578, "global_step": 444430, "epoch": 2645} {"train_loss": -12.074317932128906, "global_step": 444431, "epoch": 2645} {"train_loss": -11.943987846374512, "global_step": 444432, "epoch": 2645} {"train_loss": -12.030906677246094, "global_step": 444433, "epoch": 2645} {"train_loss": -12.028225898742676, "global_step": 444434, "epoch": 2645} {"train_loss": -11.753582000732422, "global_step": 444435, "epoch": 2645} {"train_loss": -11.78702163696289, "global_step": 444436, "epoch": 2645} {"train_loss": -11.750922203063965, "global_step": 444437, "epoch": 2645} {"train_loss": -11.792730331420898, "global_step": 444438, "epoch": 2645} {"train_loss": -11.70173454284668, "global_step": 444439, "epoch": 2645} {"train_loss": -11.565003395080566, "global_step": 444440, "epoch": 2645} {"train_loss": -11.984434127807617, "global_step": 444441, "epoch": 2645} {"train_loss": -10.981685638427734, "global_step": 444442, "epoch": 2645} {"train_loss": -12.297919273376465, "global_step": 444443, "epoch": 2645} {"train_loss": -11.046914100646973, "global_step": 444444, "epoch": 2645} {"train_loss": -11.793302536010742, "global_step": 444445, "epoch": 2645} {"train_loss": -11.487098693847656, "global_step": 444446, "epoch": 2645} {"train_loss": -11.319757461547852, "global_step": 444447, "epoch": 2645} {"train_loss": -12.426578521728516, "global_step": 444448, "epoch": 2645} {"train_loss": -11.095632553100586, "global_step": 444449, "epoch": 2645} {"train_loss": -12.081465721130371, "global_step": 444450, "epoch": 2645} {"train_loss": -11.59959888458252, "global_step": 444451, "epoch": 2645} {"train_loss": -11.898448944091797, "global_step": 444452, "epoch": 2645} {"train_loss": -12.21457290649414, "global_step": 444453, "epoch": 2645} {"train_loss": -11.95849609375, "global_step": 444454, "epoch": 2645} {"train_loss": -12.163078308105469, "global_step": 444455, "epoch": 2645} {"train_loss": -11.75338363647461, "global_step": 444456, "epoch": 2645} {"train_loss": -11.382471084594727, "global_step": 444457, "epoch": 2645} {"train_loss": -12.014034271240234, "global_step": 444458, "epoch": 2645} {"train_loss": -11.597094535827637, "global_step": 444459, "epoch": 2645} {"train_loss": -12.086709976196289, "global_step": 444460, "epoch": 2645} {"train_loss": -11.650871276855469, "global_step": 444461, "epoch": 2645} {"train_loss": -12.183115005493164, "global_step": 444462, "epoch": 2645} {"train_loss": -12.114468574523926, "global_step": 444463, "epoch": 2645} {"train_loss": -11.899869918823242, "global_step": 444464, "epoch": 2645} {"train_loss": -12.589083671569824, "global_step": 444465, "epoch": 2645} {"train_loss": -12.030723571777344, "global_step": 444466, "epoch": 2645} {"train_loss": -12.472902297973633, "global_step": 444467, "epoch": 2645} {"train_loss": -11.814130783081055, "global_step": 444468, "epoch": 2645} {"train_loss": -12.319765090942383, "global_step": 444469, "epoch": 2645} {"train_loss": -12.199773788452148, "global_step": 444470, "epoch": 2645} {"train_loss": -12.385988235473633, "global_step": 444471, "epoch": 2645} {"train_loss": -12.302289009094238, "global_step": 444472, "epoch": 2645} {"train_loss": -12.240852355957031, "global_step": 444473, "epoch": 2645} {"train_loss": -12.437776565551758, "global_step": 444474, "epoch": 2645} {"train_loss": -12.652437210083008, "global_step": 444475, "epoch": 2645} {"train_loss": -12.473569869995117, "global_step": 444476, "epoch": 2645} {"train_loss": -12.457225799560547, "global_step": 444477, "epoch": 2645} {"train_loss": -12.399750709533691, "global_step": 444478, "epoch": 2645} {"train_loss": -12.345709800720215, "global_step": 444479, "epoch": 2645} {"train_loss": -12.286031723022461, "global_step": 444480, "epoch": 2645} {"train_loss": -12.608829498291016, "global_step": 444481, "epoch": 2645} {"train_loss": -12.454927444458008, "global_step": 444482, "epoch": 2645} {"train_loss": -12.59078311920166, "global_step": 444483, "epoch": 2645} {"train_loss": -12.501687049865723, "global_step": 444484, "epoch": 2645} {"train_loss": -12.29292106628418, "global_step": 444485, "epoch": 2645} {"train_loss": -12.5625, "global_step": 444486, "epoch": 2645} {"train_loss": -12.230470657348633, "global_step": 444487, "epoch": 2645} {"train_loss": -12.714591979980469, "global_step": 444488, "epoch": 2645} {"train_loss": -12.75008487701416, "global_step": 444489, "epoch": 2645} {"train_loss": -12.58706283569336, "global_step": 444490, "epoch": 2645} {"train_loss": -12.62890338897705, "global_step": 444491, "epoch": 2645} {"train_loss": -12.259380340576172, "global_step": 444492, "epoch": 2645} {"train_loss": -12.65777587890625, "global_step": 444493, "epoch": 2645} {"train_loss": -12.79653549194336, "global_step": 444494, "epoch": 2645} {"train_loss": -12.668424606323242, "global_step": 444495, "epoch": 2645} {"train_loss": -12.682964324951172, "global_step": 444496, "epoch": 2645} {"train_loss": -12.47484016418457, "global_step": 444497, "epoch": 2645} {"train_loss": -12.205129623413086, "global_step": 444498, "epoch": 2645} {"train_loss": -12.746743202209473, "global_step": 444499, "epoch": 2645} {"train_loss": -12.82044792175293, "global_step": 444500, "epoch": 2645} {"train_loss": -12.460479736328125, "global_step": 444501, "epoch": 2645} {"train_loss": -12.305774688720703, "global_step": 444502, "epoch": 2645} {"train_loss": -12.150774002075195, "global_step": 444503, "epoch": 2645} {"train_loss": -12.129698753356934, "global_step": 444504, "epoch": 2645} {"train_loss": -11.927818298339844, "global_step": 444505, "epoch": 2645} {"train_loss": -12.531394958496094, "global_step": 444506, "epoch": 2645} {"train_loss": -11.28070068359375, "global_step": 444507, "epoch": 2645} {"train_loss": -12.354372024536133, "global_step": 444508, "epoch": 2645} {"train_loss": -12.131280899047852, "global_step": 444509, "epoch": 2645} {"train_loss": -11.741912841796875, "global_step": 444510, "epoch": 2645} {"train_loss": -12.967758178710938, "global_step": 444511, "epoch": 2645} {"train_loss": -12.289633750915527, "global_step": 444512, "epoch": 2645} {"train_loss": -12.09212875366211, "global_step": 444513, "epoch": 2645} {"train_loss": -12.576638221740723, "global_step": 444514, "epoch": 2645} {"train_loss": -11.89612102508545, "global_step": 444515, "epoch": 2645} {"train_loss": -12.596978187561035, "global_step": 444516, "epoch": 2645} {"train_loss": -12.026534080505371, "global_step": 444517, "epoch": 2645} {"train_loss": -11.919065475463867, "global_step": 444518, "epoch": 2645} {"train_loss": -12.2823486328125, "global_step": 444519, "epoch": 2645} {"train_loss": -11.10972785949707, "global_step": 444520, "epoch": 2645} {"train_loss": -12.30250358581543, "global_step": 444521, "epoch": 2645} {"train_loss": -12.390399932861328, "global_step": 444522, "epoch": 2645} {"train_loss": -11.420719146728516, "global_step": 444523, "epoch": 2645} {"train_loss": -12.610940933227539, "global_step": 444524, "epoch": 2645} {"train_loss": -11.451521873474121, "global_step": 444525, "epoch": 2645} {"train_loss": -10.213139533996582, "global_step": 444526, "epoch": 2645} {"train_loss": -12.116293634687151, "global_step": 444527, "epoch": 2645, "val_loss": 306648.34375, "train_action_mse_error": 1.3226085901260376} {"train_loss": -10.46125602722168, "global_step": 444528, "epoch": 2646} {"train_loss": -11.754228591918945, "global_step": 444529, "epoch": 2646} {"train_loss": -11.698328018188477, "global_step": 444530, "epoch": 2646} {"train_loss": -11.332332611083984, "global_step": 444531, "epoch": 2646} {"train_loss": -12.178502082824707, "global_step": 444532, "epoch": 2646} {"train_loss": -11.873859405517578, "global_step": 444533, "epoch": 2646} {"train_loss": -11.71580696105957, "global_step": 444534, "epoch": 2646} {"train_loss": -11.45396614074707, "global_step": 444535, "epoch": 2646} {"train_loss": -12.003328323364258, "global_step": 444536, "epoch": 2646} {"train_loss": -11.665576934814453, "global_step": 444537, "epoch": 2646} {"train_loss": -11.793435096740723, "global_step": 444538, "epoch": 2646} {"train_loss": -11.810559272766113, "global_step": 444539, "epoch": 2646} {"train_loss": -12.035028457641602, "global_step": 444540, "epoch": 2646} {"train_loss": -12.294260025024414, "global_step": 444541, "epoch": 2646} {"train_loss": -12.07229995727539, "global_step": 444542, "epoch": 2646} {"train_loss": -12.193292617797852, "global_step": 444543, "epoch": 2646} {"train_loss": -11.985260009765625, "global_step": 444544, "epoch": 2646} {"train_loss": -12.286593437194824, "global_step": 444545, "epoch": 2646} {"train_loss": -12.318202018737793, "global_step": 444546, "epoch": 2646} {"train_loss": -12.543872833251953, "global_step": 444547, "epoch": 2646} {"train_loss": -12.303592681884766, "global_step": 444548, "epoch": 2646} {"train_loss": -12.43484115600586, "global_step": 444549, "epoch": 2646} {"train_loss": -12.210365295410156, "global_step": 444550, "epoch": 2646} {"train_loss": -11.979286193847656, "global_step": 444551, "epoch": 2646} {"train_loss": -12.379680633544922, "global_step": 444552, "epoch": 2646} {"train_loss": -12.120986938476562, "global_step": 444553, "epoch": 2646} {"train_loss": -12.169950485229492, "global_step": 444554, "epoch": 2646} {"train_loss": -12.530498504638672, "global_step": 444555, "epoch": 2646} {"train_loss": -12.13292407989502, "global_step": 444556, "epoch": 2646} {"train_loss": -12.812646865844727, "global_step": 444557, "epoch": 2646} {"train_loss": -12.387435913085938, "global_step": 444558, "epoch": 2646} {"train_loss": -12.423123359680176, "global_step": 444559, "epoch": 2646} {"train_loss": -12.832762718200684, "global_step": 444560, "epoch": 2646} {"train_loss": -12.164522171020508, "global_step": 444561, "epoch": 2646} {"train_loss": -12.781608581542969, "global_step": 444562, "epoch": 2646} {"train_loss": -12.298711776733398, "global_step": 444563, "epoch": 2646} {"train_loss": -12.80543327331543, "global_step": 444564, "epoch": 2646} {"train_loss": -12.508001327514648, "global_step": 444565, "epoch": 2646} {"train_loss": -12.629016876220703, "global_step": 444566, "epoch": 2646} {"train_loss": -12.636129379272461, "global_step": 444567, "epoch": 2646} {"train_loss": -12.581937789916992, "global_step": 444568, "epoch": 2646} {"train_loss": -12.549235343933105, "global_step": 444569, "epoch": 2646} {"train_loss": -12.644598007202148, "global_step": 444570, "epoch": 2646} {"train_loss": -12.660244941711426, "global_step": 444571, "epoch": 2646} {"train_loss": -12.68189811706543, "global_step": 444572, "epoch": 2646} {"train_loss": -12.739702224731445, "global_step": 444573, "epoch": 2646} {"train_loss": -12.794584274291992, "global_step": 444574, "epoch": 2646} {"train_loss": -12.555333137512207, "global_step": 444575, "epoch": 2646} {"train_loss": -12.687475204467773, "global_step": 444576, "epoch": 2646} {"train_loss": -12.755281448364258, "global_step": 444577, "epoch": 2646} {"train_loss": -12.747323989868164, "global_step": 444578, "epoch": 2646} {"train_loss": -12.886221885681152, "global_step": 444579, "epoch": 2646} {"train_loss": -12.666927337646484, "global_step": 444580, "epoch": 2646} {"train_loss": -12.799348831176758, "global_step": 444581, "epoch": 2646} {"train_loss": -12.409900665283203, "global_step": 444582, "epoch": 2646} {"train_loss": -12.675337791442871, "global_step": 444583, "epoch": 2646} {"train_loss": -12.692403793334961, "global_step": 444584, "epoch": 2646} {"train_loss": -12.449779510498047, "global_step": 444585, "epoch": 2646} {"train_loss": -12.823224067687988, "global_step": 444586, "epoch": 2646} {"train_loss": -12.755149841308594, "global_step": 444587, "epoch": 2646} {"train_loss": -12.322307586669922, "global_step": 444588, "epoch": 2646} {"train_loss": -12.619414329528809, "global_step": 444589, "epoch": 2646} {"train_loss": -13.025653839111328, "global_step": 444590, "epoch": 2646} {"train_loss": -12.250875473022461, "global_step": 444591, "epoch": 2646} {"train_loss": -12.766530990600586, "global_step": 444592, "epoch": 2646} {"train_loss": -12.712635040283203, "global_step": 444593, "epoch": 2646} {"train_loss": -12.724503517150879, "global_step": 444594, "epoch": 2646} {"train_loss": -12.921895980834961, "global_step": 444595, "epoch": 2646} {"train_loss": -12.671941757202148, "global_step": 444596, "epoch": 2646} {"train_loss": -12.514967918395996, "global_step": 444597, "epoch": 2646} {"train_loss": -12.235797882080078, "global_step": 444598, "epoch": 2646} {"train_loss": -12.723701477050781, "global_step": 444599, "epoch": 2646} {"train_loss": -12.229392051696777, "global_step": 444600, "epoch": 2646} {"train_loss": -12.119524002075195, "global_step": 444601, "epoch": 2646} {"train_loss": -12.735879898071289, "global_step": 444602, "epoch": 2646} {"train_loss": -11.574811935424805, "global_step": 444603, "epoch": 2646} {"train_loss": -11.932414054870605, "global_step": 444604, "epoch": 2646} {"train_loss": -12.325454711914062, "global_step": 444605, "epoch": 2646} {"train_loss": -12.303701400756836, "global_step": 444606, "epoch": 2646} {"train_loss": -12.371050834655762, "global_step": 444607, "epoch": 2646} {"train_loss": -12.524980545043945, "global_step": 444608, "epoch": 2646} {"train_loss": -12.541023254394531, "global_step": 444609, "epoch": 2646} {"train_loss": -12.393630027770996, "global_step": 444610, "epoch": 2646} {"train_loss": -12.699743270874023, "global_step": 444611, "epoch": 2646} {"train_loss": -12.459664344787598, "global_step": 444612, "epoch": 2646} {"train_loss": -12.159351348876953, "global_step": 444613, "epoch": 2646} {"train_loss": -12.54776382446289, "global_step": 444614, "epoch": 2646} {"train_loss": -12.338706970214844, "global_step": 444615, "epoch": 2646} {"train_loss": -12.248849868774414, "global_step": 444616, "epoch": 2646} {"train_loss": -12.861438751220703, "global_step": 444617, "epoch": 2646} {"train_loss": -12.306135177612305, "global_step": 444618, "epoch": 2646} {"train_loss": -12.550079345703125, "global_step": 444619, "epoch": 2646} {"train_loss": -12.203178405761719, "global_step": 444620, "epoch": 2646} {"train_loss": -12.635223388671875, "global_step": 444621, "epoch": 2646} {"train_loss": -12.34135627746582, "global_step": 444622, "epoch": 2646} {"train_loss": -12.645742416381836, "global_step": 444623, "epoch": 2646} {"train_loss": -12.561613082885742, "global_step": 444624, "epoch": 2646} {"train_loss": -12.584819793701172, "global_step": 444625, "epoch": 2646} {"train_loss": -12.42989730834961, "global_step": 444626, "epoch": 2646} {"train_loss": -12.394068717956543, "global_step": 444627, "epoch": 2646} {"train_loss": -11.706024169921875, "global_step": 444628, "epoch": 2646} {"train_loss": -12.019744873046875, "global_step": 444629, "epoch": 2646} {"train_loss": -11.507757186889648, "global_step": 444630, "epoch": 2646} {"train_loss": -11.787005424499512, "global_step": 444631, "epoch": 2646} {"train_loss": -12.253679275512695, "global_step": 444632, "epoch": 2646} {"train_loss": -10.218803405761719, "global_step": 444633, "epoch": 2646} {"train_loss": -11.871268272399902, "global_step": 444634, "epoch": 2646} {"train_loss": -11.595640182495117, "global_step": 444635, "epoch": 2646} {"train_loss": -12.27076530456543, "global_step": 444636, "epoch": 2646} {"train_loss": -12.21529483795166, "global_step": 444637, "epoch": 2646} {"train_loss": -12.059318542480469, "global_step": 444638, "epoch": 2646} {"train_loss": -11.764854431152344, "global_step": 444639, "epoch": 2646} {"train_loss": -12.574468612670898, "global_step": 444640, "epoch": 2646} {"train_loss": -12.208934783935547, "global_step": 444641, "epoch": 2646} {"train_loss": -12.692365646362305, "global_step": 444642, "epoch": 2646} {"train_loss": -12.119123458862305, "global_step": 444643, "epoch": 2646} {"train_loss": -12.385442733764648, "global_step": 444644, "epoch": 2646} {"train_loss": -11.95965576171875, "global_step": 444645, "epoch": 2646} {"train_loss": -12.000711441040039, "global_step": 444646, "epoch": 2646} {"train_loss": -12.068758010864258, "global_step": 444647, "epoch": 2646} {"train_loss": -11.900981903076172, "global_step": 444648, "epoch": 2646} {"train_loss": -12.105387687683105, "global_step": 444649, "epoch": 2646} {"train_loss": -12.359081268310547, "global_step": 444650, "epoch": 2646} {"train_loss": -11.925551414489746, "global_step": 444651, "epoch": 2646} {"train_loss": -12.107871055603027, "global_step": 444652, "epoch": 2646} {"train_loss": -12.142383575439453, "global_step": 444653, "epoch": 2646} {"train_loss": -12.091611862182617, "global_step": 444654, "epoch": 2646} {"train_loss": -11.34875774383545, "global_step": 444655, "epoch": 2646} {"train_loss": -10.661402702331543, "global_step": 444656, "epoch": 2646} {"train_loss": -12.124454498291016, "global_step": 444657, "epoch": 2646} {"train_loss": -12.021045684814453, "global_step": 444658, "epoch": 2646} {"train_loss": -11.697057723999023, "global_step": 444659, "epoch": 2646} {"train_loss": -12.137760162353516, "global_step": 444660, "epoch": 2646} {"train_loss": -12.19096565246582, "global_step": 444661, "epoch": 2646} {"train_loss": -12.073870658874512, "global_step": 444662, "epoch": 2646} {"train_loss": -12.297259330749512, "global_step": 444663, "epoch": 2646} {"train_loss": -11.507770538330078, "global_step": 444664, "epoch": 2646} {"train_loss": -10.599831581115723, "global_step": 444665, "epoch": 2646} {"train_loss": -12.498334884643555, "global_step": 444666, "epoch": 2646} {"train_loss": -11.006632804870605, "global_step": 444667, "epoch": 2646} {"train_loss": -12.160064697265625, "global_step": 444668, "epoch": 2646} {"train_loss": -12.204214096069336, "global_step": 444669, "epoch": 2646} {"train_loss": -11.861307144165039, "global_step": 444670, "epoch": 2646} {"train_loss": -12.449514389038086, "global_step": 444671, "epoch": 2646} {"train_loss": -11.239751815795898, "global_step": 444672, "epoch": 2646} {"train_loss": -12.203767776489258, "global_step": 444673, "epoch": 2646} {"train_loss": -11.84131908416748, "global_step": 444674, "epoch": 2646} {"train_loss": -11.17310905456543, "global_step": 444675, "epoch": 2646} {"train_loss": -12.306991577148438, "global_step": 444676, "epoch": 2646} {"train_loss": -11.036125183105469, "global_step": 444677, "epoch": 2646} {"train_loss": -11.806144714355469, "global_step": 444678, "epoch": 2646} {"train_loss": -11.921120643615723, "global_step": 444679, "epoch": 2646} {"train_loss": -10.186430931091309, "global_step": 444680, "epoch": 2646} {"train_loss": -11.213136672973633, "global_step": 444681, "epoch": 2646} {"train_loss": -11.940747261047363, "global_step": 444682, "epoch": 2646} {"train_loss": -11.33508586883545, "global_step": 444683, "epoch": 2646} {"train_loss": -11.827205657958984, "global_step": 444684, "epoch": 2646} {"train_loss": -10.69865894317627, "global_step": 444685, "epoch": 2646} {"train_loss": -11.37924575805664, "global_step": 444686, "epoch": 2646} {"train_loss": -11.658378601074219, "global_step": 444687, "epoch": 2646} {"train_loss": -11.92111587524414, "global_step": 444688, "epoch": 2646} {"train_loss": -11.033296585083008, "global_step": 444689, "epoch": 2646} {"train_loss": -12.281761169433594, "global_step": 444690, "epoch": 2646} {"train_loss": -10.536691665649414, "global_step": 444691, "epoch": 2646} {"train_loss": -11.177837371826172, "global_step": 444692, "epoch": 2646} {"train_loss": -12.180852890014648, "global_step": 444693, "epoch": 2646} {"train_loss": -11.251065254211426, "global_step": 444694, "epoch": 2646} {"train_loss": -12.136938044003077, "global_step": 444695, "epoch": 2646, "val_loss": 311527.53125} {"train_loss": -10.839753150939941, "global_step": 444696, "epoch": 2647} {"train_loss": -11.786508560180664, "global_step": 444697, "epoch": 2647} {"train_loss": -11.72907543182373, "global_step": 444698, "epoch": 2647} {"train_loss": -11.486028671264648, "global_step": 444699, "epoch": 2647} {"train_loss": -12.311063766479492, "global_step": 444700, "epoch": 2647} {"train_loss": -11.355284690856934, "global_step": 444701, "epoch": 2647} {"train_loss": -11.796932220458984, "global_step": 444702, "epoch": 2647} {"train_loss": -11.950899124145508, "global_step": 444703, "epoch": 2647} {"train_loss": -11.35772705078125, "global_step": 444704, "epoch": 2647} {"train_loss": -12.127601623535156, "global_step": 444705, "epoch": 2647} {"train_loss": -11.913087844848633, "global_step": 444706, "epoch": 2647} {"train_loss": -11.736061096191406, "global_step": 444707, "epoch": 2647} {"train_loss": -12.22153091430664, "global_step": 444708, "epoch": 2647} {"train_loss": -12.080703735351562, "global_step": 444709, "epoch": 2647} {"train_loss": -12.142316818237305, "global_step": 444710, "epoch": 2647} {"train_loss": -12.029346466064453, "global_step": 444711, "epoch": 2647} {"train_loss": -12.066703796386719, "global_step": 444712, "epoch": 2647} {"train_loss": -12.423689842224121, "global_step": 444713, "epoch": 2647} {"train_loss": -11.291044235229492, "global_step": 444714, "epoch": 2647} {"train_loss": -12.280417442321777, "global_step": 444715, "epoch": 2647} {"train_loss": -11.747039794921875, "global_step": 444716, "epoch": 2647} {"train_loss": -12.475329399108887, "global_step": 444717, "epoch": 2647} {"train_loss": -12.15117359161377, "global_step": 444718, "epoch": 2647} {"train_loss": -12.232002258300781, "global_step": 444719, "epoch": 2647} {"train_loss": -12.492452621459961, "global_step": 444720, "epoch": 2647} {"train_loss": -12.219144821166992, "global_step": 444721, "epoch": 2647} {"train_loss": -12.453271865844727, "global_step": 444722, "epoch": 2647} {"train_loss": -12.402022361755371, "global_step": 444723, "epoch": 2647} {"train_loss": -12.415273666381836, "global_step": 444724, "epoch": 2647} {"train_loss": -12.597284317016602, "global_step": 444725, "epoch": 2647} {"train_loss": -12.715476989746094, "global_step": 444726, "epoch": 2647} {"train_loss": -12.694772720336914, "global_step": 444727, "epoch": 2647} {"train_loss": -12.590961456298828, "global_step": 444728, "epoch": 2647} {"train_loss": -12.650749206542969, "global_step": 444729, "epoch": 2647} {"train_loss": -12.600059509277344, "global_step": 444730, "epoch": 2647} {"train_loss": -12.606109619140625, "global_step": 444731, "epoch": 2647} {"train_loss": -12.65931510925293, "global_step": 444732, "epoch": 2647} {"train_loss": -12.52437686920166, "global_step": 444733, "epoch": 2647} {"train_loss": -12.742782592773438, "global_step": 444734, "epoch": 2647} {"train_loss": -12.683229446411133, "global_step": 444735, "epoch": 2647} {"train_loss": -12.811054229736328, "global_step": 444736, "epoch": 2647} {"train_loss": -12.611207008361816, "global_step": 444737, "epoch": 2647} {"train_loss": -12.69612979888916, "global_step": 444738, "epoch": 2647} {"train_loss": -12.71837043762207, "global_step": 444739, "epoch": 2647} {"train_loss": -12.579845428466797, "global_step": 444740, "epoch": 2647} {"train_loss": -12.913302421569824, "global_step": 444741, "epoch": 2647} {"train_loss": -12.65221881866455, "global_step": 444742, "epoch": 2647} {"train_loss": -12.716773986816406, "global_step": 444743, "epoch": 2647} {"train_loss": -12.679426193237305, "global_step": 444744, "epoch": 2647} {"train_loss": -12.575047492980957, "global_step": 444745, "epoch": 2647} {"train_loss": -12.752044677734375, "global_step": 444746, "epoch": 2647} {"train_loss": -12.592931747436523, "global_step": 444747, "epoch": 2647} {"train_loss": -12.82366943359375, "global_step": 444748, "epoch": 2647} {"train_loss": -12.997440338134766, "global_step": 444749, "epoch": 2647} {"train_loss": -12.825992584228516, "global_step": 444750, "epoch": 2647} {"train_loss": -12.743860244750977, "global_step": 444751, "epoch": 2647} {"train_loss": -12.670970916748047, "global_step": 444752, "epoch": 2647} {"train_loss": -12.749030113220215, "global_step": 444753, "epoch": 2647} {"train_loss": -12.611270904541016, "global_step": 444754, "epoch": 2647} {"train_loss": -12.906216621398926, "global_step": 444755, "epoch": 2647} {"train_loss": -12.864227294921875, "global_step": 444756, "epoch": 2647} {"train_loss": -12.911798477172852, "global_step": 444757, "epoch": 2647} {"train_loss": -12.688440322875977, "global_step": 444758, "epoch": 2647} {"train_loss": -12.619762420654297, "global_step": 444759, "epoch": 2647} {"train_loss": -12.783658981323242, "global_step": 444760, "epoch": 2647} {"train_loss": -12.694507598876953, "global_step": 444761, "epoch": 2647} {"train_loss": -12.668269157409668, "global_step": 444762, "epoch": 2647} {"train_loss": -12.687088012695312, "global_step": 444763, "epoch": 2647} {"train_loss": -12.814180374145508, "global_step": 444764, "epoch": 2647} {"train_loss": -12.798175811767578, "global_step": 444765, "epoch": 2647} {"train_loss": -12.592409133911133, "global_step": 444766, "epoch": 2647} {"train_loss": -12.79384994506836, "global_step": 444767, "epoch": 2647} {"train_loss": -12.866144180297852, "global_step": 444768, "epoch": 2647} {"train_loss": -12.502903938293457, "global_step": 444769, "epoch": 2647} {"train_loss": -13.016990661621094, "global_step": 444770, "epoch": 2647} {"train_loss": -12.37316608428955, "global_step": 444771, "epoch": 2647} {"train_loss": -12.223556518554688, "global_step": 444772, "epoch": 2647} {"train_loss": -12.586484909057617, "global_step": 444773, "epoch": 2647} {"train_loss": -12.355066299438477, "global_step": 444774, "epoch": 2647} {"train_loss": -12.580804824829102, "global_step": 444775, "epoch": 2647} {"train_loss": -12.563377380371094, "global_step": 444776, "epoch": 2647} {"train_loss": -12.705864906311035, "global_step": 444777, "epoch": 2647} {"train_loss": -12.016155242919922, "global_step": 444778, "epoch": 2647} {"train_loss": -12.041556358337402, "global_step": 444779, "epoch": 2647} {"train_loss": -12.52032470703125, "global_step": 444780, "epoch": 2647} {"train_loss": -12.415510177612305, "global_step": 444781, "epoch": 2647} {"train_loss": -12.365289688110352, "global_step": 444782, "epoch": 2647} {"train_loss": -12.025593757629395, "global_step": 444783, "epoch": 2647} {"train_loss": -12.572823524475098, "global_step": 444784, "epoch": 2647} {"train_loss": -12.292984008789062, "global_step": 444785, "epoch": 2647} {"train_loss": -12.458867073059082, "global_step": 444786, "epoch": 2647} {"train_loss": -12.18429946899414, "global_step": 444787, "epoch": 2647} {"train_loss": -12.395931243896484, "global_step": 444788, "epoch": 2647} {"train_loss": -12.588972091674805, "global_step": 444789, "epoch": 2647} {"train_loss": -12.739469528198242, "global_step": 444790, "epoch": 2647} {"train_loss": -12.304632186889648, "global_step": 444791, "epoch": 2647} {"train_loss": -11.625566482543945, "global_step": 444792, "epoch": 2647} {"train_loss": -11.272972106933594, "global_step": 444793, "epoch": 2647} {"train_loss": -11.817110061645508, "global_step": 444794, "epoch": 2647} {"train_loss": -9.71064281463623, "global_step": 444795, "epoch": 2647} {"train_loss": -12.266595840454102, "global_step": 444796, "epoch": 2647} {"train_loss": -11.886850357055664, "global_step": 444797, "epoch": 2647} {"train_loss": -12.259775161743164, "global_step": 444798, "epoch": 2647} {"train_loss": -11.18992805480957, "global_step": 444799, "epoch": 2647} {"train_loss": -11.760392189025879, "global_step": 444800, "epoch": 2647} {"train_loss": -10.460800170898438, "global_step": 444801, "epoch": 2647} {"train_loss": -10.892318725585938, "global_step": 444802, "epoch": 2647} {"train_loss": -10.245895385742188, "global_step": 444803, "epoch": 2647} {"train_loss": -9.70218563079834, "global_step": 444804, "epoch": 2647} {"train_loss": -9.518224716186523, "global_step": 444805, "epoch": 2647} {"train_loss": -9.741790771484375, "global_step": 444806, "epoch": 2647} {"train_loss": -10.504631042480469, "global_step": 444807, "epoch": 2647} {"train_loss": -10.994991302490234, "global_step": 444808, "epoch": 2647} {"train_loss": -9.885002136230469, "global_step": 444809, "epoch": 2647} {"train_loss": -10.21937084197998, "global_step": 444810, "epoch": 2647} {"train_loss": -11.364876747131348, "global_step": 444811, "epoch": 2647} {"train_loss": -10.522554397583008, "global_step": 444812, "epoch": 2647} {"train_loss": -9.493757247924805, "global_step": 444813, "epoch": 2647} {"train_loss": -9.68077278137207, "global_step": 444814, "epoch": 2647} {"train_loss": -11.143518447875977, "global_step": 444815, "epoch": 2647} {"train_loss": -9.573034286499023, "global_step": 444816, "epoch": 2647} {"train_loss": -11.601556777954102, "global_step": 444817, "epoch": 2647} {"train_loss": -11.124279022216797, "global_step": 444818, "epoch": 2647} {"train_loss": -11.414389610290527, "global_step": 444819, "epoch": 2647} {"train_loss": -11.71634578704834, "global_step": 444820, "epoch": 2647} {"train_loss": -11.39220905303955, "global_step": 444821, "epoch": 2647} {"train_loss": -11.743314743041992, "global_step": 444822, "epoch": 2647} {"train_loss": -11.086010932922363, "global_step": 444823, "epoch": 2647} {"train_loss": -12.017614364624023, "global_step": 444824, "epoch": 2647} {"train_loss": -11.558843612670898, "global_step": 444825, "epoch": 2647} {"train_loss": -11.438087463378906, "global_step": 444826, "epoch": 2647} {"train_loss": -12.109829902648926, "global_step": 444827, "epoch": 2647} {"train_loss": -11.972225189208984, "global_step": 444828, "epoch": 2647} {"train_loss": -11.895795822143555, "global_step": 444829, "epoch": 2647} {"train_loss": -11.303428649902344, "global_step": 444830, "epoch": 2647} {"train_loss": -12.030499458312988, "global_step": 444831, "epoch": 2647} {"train_loss": -11.418766021728516, "global_step": 444832, "epoch": 2647} {"train_loss": -11.723718643188477, "global_step": 444833, "epoch": 2647} {"train_loss": -11.972431182861328, "global_step": 444834, "epoch": 2647} {"train_loss": -11.910524368286133, "global_step": 444835, "epoch": 2647} {"train_loss": -11.974483489990234, "global_step": 444836, "epoch": 2647} {"train_loss": -12.18230152130127, "global_step": 444837, "epoch": 2647} {"train_loss": -11.579744338989258, "global_step": 444838, "epoch": 2647} {"train_loss": -11.761932373046875, "global_step": 444839, "epoch": 2647} {"train_loss": -11.912939071655273, "global_step": 444840, "epoch": 2647} {"train_loss": -11.965232849121094, "global_step": 444841, "epoch": 2647} {"train_loss": -12.0828218460083, "global_step": 444842, "epoch": 2647} {"train_loss": -11.96261978149414, "global_step": 444843, "epoch": 2647} {"train_loss": -12.539551734924316, "global_step": 444844, "epoch": 2647} {"train_loss": -11.893974304199219, "global_step": 444845, "epoch": 2647} {"train_loss": -12.47926139831543, "global_step": 444846, "epoch": 2647} {"train_loss": -12.31173324584961, "global_step": 444847, "epoch": 2647} {"train_loss": -12.334288597106934, "global_step": 444848, "epoch": 2647} {"train_loss": -12.300809860229492, "global_step": 444849, "epoch": 2647} {"train_loss": -12.249698638916016, "global_step": 444850, "epoch": 2647} {"train_loss": -12.322044372558594, "global_step": 444851, "epoch": 2647} {"train_loss": -12.327247619628906, "global_step": 444852, "epoch": 2647} {"train_loss": -12.130393981933594, "global_step": 444853, "epoch": 2647} {"train_loss": -12.380615234375, "global_step": 444854, "epoch": 2647} {"train_loss": -11.915096282958984, "global_step": 444855, "epoch": 2647} {"train_loss": -12.68635368347168, "global_step": 444856, "epoch": 2647} {"train_loss": -12.12460708618164, "global_step": 444857, "epoch": 2647} {"train_loss": -12.454500198364258, "global_step": 444858, "epoch": 2647} {"train_loss": -12.246387481689453, "global_step": 444859, "epoch": 2647} {"train_loss": -12.702168464660645, "global_step": 444860, "epoch": 2647} {"train_loss": -12.006363868713379, "global_step": 444861, "epoch": 2647} {"train_loss": -12.34294319152832, "global_step": 444862, "epoch": 2647} {"train_loss": -12.04331320240384, "global_step": 444863, "epoch": 2647, "val_loss": 313372.96875} {"train_loss": -12.514106750488281, "global_step": 444864, "epoch": 2648} {"train_loss": -12.249102592468262, "global_step": 444865, "epoch": 2648} {"train_loss": -12.517660140991211, "global_step": 444866, "epoch": 2648} {"train_loss": -12.366158485412598, "global_step": 444867, "epoch": 2648} {"train_loss": -12.784223556518555, "global_step": 444868, "epoch": 2648} {"train_loss": -12.224855422973633, "global_step": 444869, "epoch": 2648} {"train_loss": -12.724376678466797, "global_step": 444870, "epoch": 2648} {"train_loss": -12.362829208374023, "global_step": 444871, "epoch": 2648} {"train_loss": -12.56445598602295, "global_step": 444872, "epoch": 2648} {"train_loss": -12.660388946533203, "global_step": 444873, "epoch": 2648} {"train_loss": -12.533266067504883, "global_step": 444874, "epoch": 2648} {"train_loss": -12.780694961547852, "global_step": 444875, "epoch": 2648} {"train_loss": -12.641616821289062, "global_step": 444876, "epoch": 2648} {"train_loss": -12.819268226623535, "global_step": 444877, "epoch": 2648} {"train_loss": -12.713892936706543, "global_step": 444878, "epoch": 2648} {"train_loss": -12.769571304321289, "global_step": 444879, "epoch": 2648} {"train_loss": -12.684276580810547, "global_step": 444880, "epoch": 2648} {"train_loss": -12.795068740844727, "global_step": 444881, "epoch": 2648} {"train_loss": -12.731612205505371, "global_step": 444882, "epoch": 2648} {"train_loss": -12.800823211669922, "global_step": 444883, "epoch": 2648} {"train_loss": -12.804058074951172, "global_step": 444884, "epoch": 2648} {"train_loss": -12.721502304077148, "global_step": 444885, "epoch": 2648} {"train_loss": -12.818750381469727, "global_step": 444886, "epoch": 2648} {"train_loss": -12.774430274963379, "global_step": 444887, "epoch": 2648} {"train_loss": -12.805398941040039, "global_step": 444888, "epoch": 2648} {"train_loss": -12.747425079345703, "global_step": 444889, "epoch": 2648} {"train_loss": -12.646772384643555, "global_step": 444890, "epoch": 2648} {"train_loss": -12.741572380065918, "global_step": 444891, "epoch": 2648} {"train_loss": -12.749598503112793, "global_step": 444892, "epoch": 2648} {"train_loss": -12.971658706665039, "global_step": 444893, "epoch": 2648} {"train_loss": -12.840446472167969, "global_step": 444894, "epoch": 2648} {"train_loss": -12.912217140197754, "global_step": 444895, "epoch": 2648} {"train_loss": -12.90740966796875, "global_step": 444896, "epoch": 2648} {"train_loss": -12.63714599609375, "global_step": 444897, "epoch": 2648} {"train_loss": -12.903420448303223, "global_step": 444898, "epoch": 2648} {"train_loss": -12.75022029876709, "global_step": 444899, "epoch": 2648} {"train_loss": -12.717490196228027, "global_step": 444900, "epoch": 2648} {"train_loss": -12.818981170654297, "global_step": 444901, "epoch": 2648} {"train_loss": -12.931488037109375, "global_step": 444902, "epoch": 2648} {"train_loss": -12.822200775146484, "global_step": 444903, "epoch": 2648} {"train_loss": -12.570037841796875, "global_step": 444904, "epoch": 2648} {"train_loss": -11.872818946838379, "global_step": 444905, "epoch": 2648} {"train_loss": -12.402911186218262, "global_step": 444906, "epoch": 2648} {"train_loss": -12.493420600891113, "global_step": 444907, "epoch": 2648} {"train_loss": -11.918643951416016, "global_step": 444908, "epoch": 2648} {"train_loss": -11.177197456359863, "global_step": 444909, "epoch": 2648} {"train_loss": -12.351757049560547, "global_step": 444910, "epoch": 2648} {"train_loss": -12.18603515625, "global_step": 444911, "epoch": 2648} {"train_loss": -12.146923065185547, "global_step": 444912, "epoch": 2648} {"train_loss": -12.618553161621094, "global_step": 444913, "epoch": 2648} {"train_loss": -12.281411170959473, "global_step": 444914, "epoch": 2648} {"train_loss": -12.222768783569336, "global_step": 444915, "epoch": 2648} {"train_loss": -12.36097526550293, "global_step": 444916, "epoch": 2648} {"train_loss": -12.109770774841309, "global_step": 444917, "epoch": 2648} {"train_loss": -11.964662551879883, "global_step": 444918, "epoch": 2648} {"train_loss": -12.246417999267578, "global_step": 444919, "epoch": 2648} {"train_loss": -12.568819046020508, "global_step": 444920, "epoch": 2648} {"train_loss": -12.401177406311035, "global_step": 444921, "epoch": 2648} {"train_loss": -11.910122871398926, "global_step": 444922, "epoch": 2648} {"train_loss": -12.285039901733398, "global_step": 444923, "epoch": 2648} {"train_loss": -12.628758430480957, "global_step": 444924, "epoch": 2648} {"train_loss": -12.213364601135254, "global_step": 444925, "epoch": 2648} {"train_loss": -11.662384033203125, "global_step": 444926, "epoch": 2648} {"train_loss": -12.767362594604492, "global_step": 444927, "epoch": 2648} {"train_loss": -12.155119895935059, "global_step": 444928, "epoch": 2648} {"train_loss": -12.090381622314453, "global_step": 444929, "epoch": 2648} {"train_loss": -11.990427017211914, "global_step": 444930, "epoch": 2648} {"train_loss": -12.263375282287598, "global_step": 444931, "epoch": 2648} {"train_loss": -11.800919532775879, "global_step": 444932, "epoch": 2648} {"train_loss": -12.161226272583008, "global_step": 444933, "epoch": 2648} {"train_loss": -12.69572639465332, "global_step": 444934, "epoch": 2648} {"train_loss": -12.690807342529297, "global_step": 444935, "epoch": 2648} {"train_loss": -12.508081436157227, "global_step": 444936, "epoch": 2648} {"train_loss": -12.549491882324219, "global_step": 444937, "epoch": 2648} {"train_loss": -12.65831184387207, "global_step": 444938, "epoch": 2648} {"train_loss": -12.237916946411133, "global_step": 444939, "epoch": 2648} {"train_loss": -12.582267761230469, "global_step": 444940, "epoch": 2648} {"train_loss": -12.575035095214844, "global_step": 444941, "epoch": 2648} {"train_loss": -12.224018096923828, "global_step": 444942, "epoch": 2648} {"train_loss": -12.477344512939453, "global_step": 444943, "epoch": 2648} {"train_loss": -12.496835708618164, "global_step": 444944, "epoch": 2648} {"train_loss": -12.268257141113281, "global_step": 444945, "epoch": 2648} {"train_loss": -12.949173927307129, "global_step": 444946, "epoch": 2648} {"train_loss": -12.40967845916748, "global_step": 444947, "epoch": 2648} {"train_loss": -12.33731460571289, "global_step": 444948, "epoch": 2648} {"train_loss": -12.37759780883789, "global_step": 444949, "epoch": 2648} {"train_loss": -12.472929954528809, "global_step": 444950, "epoch": 2648} {"train_loss": -12.254870414733887, "global_step": 444951, "epoch": 2648} {"train_loss": -12.178874969482422, "global_step": 444952, "epoch": 2648} {"train_loss": -12.290447235107422, "global_step": 444953, "epoch": 2648} {"train_loss": -12.273321151733398, "global_step": 444954, "epoch": 2648} {"train_loss": -12.018529891967773, "global_step": 444955, "epoch": 2648} {"train_loss": -11.503519058227539, "global_step": 444956, "epoch": 2648} {"train_loss": -11.978362083435059, "global_step": 444957, "epoch": 2648} {"train_loss": -12.466226577758789, "global_step": 444958, "epoch": 2648} {"train_loss": -11.41404914855957, "global_step": 444959, "epoch": 2648} {"train_loss": -12.149065017700195, "global_step": 444960, "epoch": 2648} {"train_loss": -12.222108840942383, "global_step": 444961, "epoch": 2648} {"train_loss": -12.081735610961914, "global_step": 444962, "epoch": 2648} {"train_loss": -12.431341171264648, "global_step": 444963, "epoch": 2648} {"train_loss": -12.27296257019043, "global_step": 444964, "epoch": 2648} {"train_loss": -12.563323020935059, "global_step": 444965, "epoch": 2648} {"train_loss": -12.608759880065918, "global_step": 444966, "epoch": 2648} {"train_loss": -12.297557830810547, "global_step": 444967, "epoch": 2648} {"train_loss": -12.248748779296875, "global_step": 444968, "epoch": 2648} {"train_loss": -12.604192733764648, "global_step": 444969, "epoch": 2648} {"train_loss": -11.966909408569336, "global_step": 444970, "epoch": 2648} {"train_loss": -12.532036781311035, "global_step": 444971, "epoch": 2648} {"train_loss": -12.17396354675293, "global_step": 444972, "epoch": 2648} {"train_loss": -12.666183471679688, "global_step": 444973, "epoch": 2648} {"train_loss": -12.342681884765625, "global_step": 444974, "epoch": 2648} {"train_loss": -12.410486221313477, "global_step": 444975, "epoch": 2648} {"train_loss": -12.382204055786133, "global_step": 444976, "epoch": 2648} {"train_loss": -12.233760833740234, "global_step": 444977, "epoch": 2648} {"train_loss": -12.538104057312012, "global_step": 444978, "epoch": 2648} {"train_loss": -12.73865795135498, "global_step": 444979, "epoch": 2648} {"train_loss": -12.382946014404297, "global_step": 444980, "epoch": 2648} {"train_loss": -12.942153930664062, "global_step": 444981, "epoch": 2648} {"train_loss": -12.649033546447754, "global_step": 444982, "epoch": 2648} {"train_loss": -12.618006706237793, "global_step": 444983, "epoch": 2648} {"train_loss": -12.70851993560791, "global_step": 444984, "epoch": 2648} {"train_loss": -12.799430847167969, "global_step": 444985, "epoch": 2648} {"train_loss": -12.730972290039062, "global_step": 444986, "epoch": 2648} {"train_loss": -12.725488662719727, "global_step": 444987, "epoch": 2648} {"train_loss": -12.537899017333984, "global_step": 444988, "epoch": 2648} {"train_loss": -12.579492568969727, "global_step": 444989, "epoch": 2648} {"train_loss": -12.657278060913086, "global_step": 444990, "epoch": 2648} {"train_loss": -12.57687759399414, "global_step": 444991, "epoch": 2648} {"train_loss": -12.977890014648438, "global_step": 444992, "epoch": 2648} {"train_loss": -12.629341125488281, "global_step": 444993, "epoch": 2648} {"train_loss": -12.726632118225098, "global_step": 444994, "epoch": 2648} {"train_loss": -12.79486083984375, "global_step": 444995, "epoch": 2648} {"train_loss": -12.723419189453125, "global_step": 444996, "epoch": 2648} {"train_loss": -12.672663688659668, "global_step": 444997, "epoch": 2648} {"train_loss": -12.782365798950195, "global_step": 444998, "epoch": 2648} {"train_loss": -12.57282829284668, "global_step": 444999, "epoch": 2648} {"train_loss": -12.63472843170166, "global_step": 445000, "epoch": 2648} {"train_loss": -12.64442253112793, "global_step": 445001, "epoch": 2648} {"train_loss": -12.943235397338867, "global_step": 445002, "epoch": 2648} {"train_loss": -12.581619262695312, "global_step": 445003, "epoch": 2648} {"train_loss": -12.412712097167969, "global_step": 445004, "epoch": 2648} {"train_loss": -12.759147644042969, "global_step": 445005, "epoch": 2648} {"train_loss": -12.694984436035156, "global_step": 445006, "epoch": 2648} {"train_loss": -11.313346862792969, "global_step": 445007, "epoch": 2648} {"train_loss": -9.768783569335938, "global_step": 445008, "epoch": 2648} {"train_loss": -12.241905212402344, "global_step": 445009, "epoch": 2648} {"train_loss": -11.612407684326172, "global_step": 445010, "epoch": 2648} {"train_loss": -10.65748405456543, "global_step": 445011, "epoch": 2648} {"train_loss": -12.22508430480957, "global_step": 445012, "epoch": 2648} {"train_loss": -10.451915740966797, "global_step": 445013, "epoch": 2648} {"train_loss": -11.945690155029297, "global_step": 445014, "epoch": 2648} {"train_loss": -10.429786682128906, "global_step": 445015, "epoch": 2648} {"train_loss": -11.466440200805664, "global_step": 445016, "epoch": 2648} {"train_loss": -11.035924911499023, "global_step": 445017, "epoch": 2648} {"train_loss": -11.497823715209961, "global_step": 445018, "epoch": 2648} {"train_loss": -9.191715240478516, "global_step": 445019, "epoch": 2648} {"train_loss": -11.610589981079102, "global_step": 445020, "epoch": 2648} {"train_loss": -11.916231155395508, "global_step": 445021, "epoch": 2648} {"train_loss": -9.422924041748047, "global_step": 445022, "epoch": 2648} {"train_loss": -11.69394302368164, "global_step": 445023, "epoch": 2648} {"train_loss": -8.498289108276367, "global_step": 445024, "epoch": 2648} {"train_loss": -9.45361328125, "global_step": 445025, "epoch": 2648} {"train_loss": -10.067171096801758, "global_step": 445026, "epoch": 2648} {"train_loss": -10.375293731689453, "global_step": 445027, "epoch": 2648} {"train_loss": -9.543039321899414, "global_step": 445028, "epoch": 2648} {"train_loss": -9.748835563659668, "global_step": 445029, "epoch": 2648} {"train_loss": -11.584291458129883, "global_step": 445030, "epoch": 2648} {"train_loss": -12.221123746463231, "global_step": 445031, "epoch": 2648, "val_loss": 308672.6875} {"train_loss": -11.085916519165039, "global_step": 445032, "epoch": 2649} {"train_loss": -11.66827392578125, "global_step": 445033, "epoch": 2649} {"train_loss": -9.406350135803223, "global_step": 445034, "epoch": 2649} {"train_loss": -12.125947952270508, "global_step": 445035, "epoch": 2649} {"train_loss": -10.667526245117188, "global_step": 445036, "epoch": 2649} {"train_loss": -10.620993614196777, "global_step": 445037, "epoch": 2649} {"train_loss": -10.915782928466797, "global_step": 445038, "epoch": 2649} {"train_loss": -10.502910614013672, "global_step": 445039, "epoch": 2649} {"train_loss": -11.794291496276855, "global_step": 445040, "epoch": 2649} {"train_loss": -11.323888778686523, "global_step": 445041, "epoch": 2649} {"train_loss": -11.979830741882324, "global_step": 445042, "epoch": 2649} {"train_loss": -12.050345420837402, "global_step": 445043, "epoch": 2649} {"train_loss": -11.759493827819824, "global_step": 445044, "epoch": 2649} {"train_loss": -12.04343032836914, "global_step": 445045, "epoch": 2649} {"train_loss": -11.972536087036133, "global_step": 445046, "epoch": 2649} {"train_loss": -12.014010429382324, "global_step": 445047, "epoch": 2649} {"train_loss": -12.33537769317627, "global_step": 445048, "epoch": 2649} {"train_loss": -11.68690299987793, "global_step": 445049, "epoch": 2649} {"train_loss": -12.18950080871582, "global_step": 445050, "epoch": 2649} {"train_loss": -11.64330768585205, "global_step": 445051, "epoch": 2649} {"train_loss": -12.439855575561523, "global_step": 445052, "epoch": 2649} {"train_loss": -11.901131629943848, "global_step": 445053, "epoch": 2649} {"train_loss": -11.654870986938477, "global_step": 445054, "epoch": 2649} {"train_loss": -11.910357475280762, "global_step": 445055, "epoch": 2649} {"train_loss": -12.16314697265625, "global_step": 445056, "epoch": 2649} {"train_loss": -11.597053527832031, "global_step": 445057, "epoch": 2649} {"train_loss": -12.265107154846191, "global_step": 445058, "epoch": 2649} {"train_loss": -11.995363235473633, "global_step": 445059, "epoch": 2649} {"train_loss": -12.319409370422363, "global_step": 445060, "epoch": 2649} {"train_loss": -12.235824584960938, "global_step": 445061, "epoch": 2649} {"train_loss": -12.45810604095459, "global_step": 445062, "epoch": 2649} {"train_loss": -12.27360725402832, "global_step": 445063, "epoch": 2649} {"train_loss": -12.3612060546875, "global_step": 445064, "epoch": 2649} {"train_loss": -12.18492317199707, "global_step": 445065, "epoch": 2649} {"train_loss": -12.241990089416504, "global_step": 445066, "epoch": 2649} {"train_loss": -12.267478942871094, "global_step": 445067, "epoch": 2649} {"train_loss": -12.244836807250977, "global_step": 445068, "epoch": 2649} {"train_loss": -12.238365173339844, "global_step": 445069, "epoch": 2649} {"train_loss": -12.21087646484375, "global_step": 445070, "epoch": 2649} {"train_loss": -12.375755310058594, "global_step": 445071, "epoch": 2649} {"train_loss": -12.439729690551758, "global_step": 445072, "epoch": 2649} {"train_loss": -12.537505149841309, "global_step": 445073, "epoch": 2649} {"train_loss": -12.603958129882812, "global_step": 445074, "epoch": 2649} {"train_loss": -12.541934967041016, "global_step": 445075, "epoch": 2649} {"train_loss": -12.504951477050781, "global_step": 445076, "epoch": 2649} {"train_loss": -12.359461784362793, "global_step": 445077, "epoch": 2649} {"train_loss": -12.536050796508789, "global_step": 445078, "epoch": 2649} {"train_loss": -12.631074905395508, "global_step": 445079, "epoch": 2649} {"train_loss": -12.680500030517578, "global_step": 445080, "epoch": 2649} {"train_loss": -12.412480354309082, "global_step": 445081, "epoch": 2649} {"train_loss": -12.685582160949707, "global_step": 445082, "epoch": 2649} {"train_loss": -12.37087345123291, "global_step": 445083, "epoch": 2649} {"train_loss": -12.783832550048828, "global_step": 445084, "epoch": 2649} {"train_loss": -12.453612327575684, "global_step": 445085, "epoch": 2649} {"train_loss": -12.656563758850098, "global_step": 445086, "epoch": 2649} {"train_loss": -12.402042388916016, "global_step": 445087, "epoch": 2649} {"train_loss": -12.451085090637207, "global_step": 445088, "epoch": 2649} {"train_loss": -12.712776184082031, "global_step": 445089, "epoch": 2649} {"train_loss": -12.357887268066406, "global_step": 445090, "epoch": 2649} {"train_loss": -12.771591186523438, "global_step": 445091, "epoch": 2649} {"train_loss": -12.721879959106445, "global_step": 445092, "epoch": 2649} {"train_loss": -12.835124969482422, "global_step": 445093, "epoch": 2649} {"train_loss": -12.617318153381348, "global_step": 445094, "epoch": 2649} {"train_loss": -12.865743637084961, "global_step": 445095, "epoch": 2649} {"train_loss": -12.807899475097656, "global_step": 445096, "epoch": 2649} {"train_loss": -12.806023597717285, "global_step": 445097, "epoch": 2649} {"train_loss": -12.901666641235352, "global_step": 445098, "epoch": 2649} {"train_loss": -12.918888092041016, "global_step": 445099, "epoch": 2649} {"train_loss": -12.83548355102539, "global_step": 445100, "epoch": 2649} {"train_loss": -12.568507194519043, "global_step": 445101, "epoch": 2649} {"train_loss": -12.631492614746094, "global_step": 445102, "epoch": 2649} {"train_loss": -12.97488784790039, "global_step": 445103, "epoch": 2649} {"train_loss": -12.849167823791504, "global_step": 445104, "epoch": 2649} {"train_loss": -12.898662567138672, "global_step": 445105, "epoch": 2649} {"train_loss": -13.031242370605469, "global_step": 445106, "epoch": 2649} {"train_loss": -12.996535301208496, "global_step": 445107, "epoch": 2649} {"train_loss": -12.765106201171875, "global_step": 445108, "epoch": 2649} {"train_loss": -12.87393569946289, "global_step": 445109, "epoch": 2649} {"train_loss": -12.77190113067627, "global_step": 445110, "epoch": 2649} {"train_loss": -12.75436782836914, "global_step": 445111, "epoch": 2649} {"train_loss": -12.87450885772705, "global_step": 445112, "epoch": 2649} {"train_loss": -12.89047622680664, "global_step": 445113, "epoch": 2649} {"train_loss": -12.46357250213623, "global_step": 445114, "epoch": 2649} {"train_loss": -12.733001708984375, "global_step": 445115, "epoch": 2649} {"train_loss": -12.486461639404297, "global_step": 445116, "epoch": 2649} {"train_loss": -12.689554214477539, "global_step": 445117, "epoch": 2649} {"train_loss": -12.742514610290527, "global_step": 445118, "epoch": 2649} {"train_loss": -12.533214569091797, "global_step": 445119, "epoch": 2649} {"train_loss": -12.163219451904297, "global_step": 445120, "epoch": 2649} {"train_loss": -12.572324752807617, "global_step": 445121, "epoch": 2649} {"train_loss": -12.39674186706543, "global_step": 445122, "epoch": 2649} {"train_loss": -12.833672523498535, "global_step": 445123, "epoch": 2649} {"train_loss": -12.60717487335205, "global_step": 445124, "epoch": 2649} {"train_loss": -12.364745140075684, "global_step": 445125, "epoch": 2649} {"train_loss": -12.53879165649414, "global_step": 445126, "epoch": 2649} {"train_loss": -12.704085350036621, "global_step": 445127, "epoch": 2649} {"train_loss": -12.79971694946289, "global_step": 445128, "epoch": 2649} {"train_loss": -12.554756164550781, "global_step": 445129, "epoch": 2649} {"train_loss": -12.616634368896484, "global_step": 445130, "epoch": 2649} {"train_loss": -12.581592559814453, "global_step": 445131, "epoch": 2649} {"train_loss": -12.846113204956055, "global_step": 445132, "epoch": 2649} {"train_loss": -12.651742935180664, "global_step": 445133, "epoch": 2649} {"train_loss": -12.434999465942383, "global_step": 445134, "epoch": 2649} {"train_loss": -12.554790496826172, "global_step": 445135, "epoch": 2649} {"train_loss": -12.808069229125977, "global_step": 445136, "epoch": 2649} {"train_loss": -12.698690414428711, "global_step": 445137, "epoch": 2649} {"train_loss": -12.242898941040039, "global_step": 445138, "epoch": 2649} {"train_loss": -12.478939056396484, "global_step": 445139, "epoch": 2649} {"train_loss": -12.669281005859375, "global_step": 445140, "epoch": 2649} {"train_loss": -12.707338333129883, "global_step": 445141, "epoch": 2649} {"train_loss": -11.729512214660645, "global_step": 445142, "epoch": 2649} {"train_loss": -12.354317665100098, "global_step": 445143, "epoch": 2649} {"train_loss": -12.508216857910156, "global_step": 445144, "epoch": 2649} {"train_loss": -12.33871841430664, "global_step": 445145, "epoch": 2649} {"train_loss": -11.276908874511719, "global_step": 445146, "epoch": 2649} {"train_loss": -11.146421432495117, "global_step": 445147, "epoch": 2649} {"train_loss": -12.41805648803711, "global_step": 445148, "epoch": 2649} {"train_loss": -12.30129337310791, "global_step": 445149, "epoch": 2649} {"train_loss": -10.576852798461914, "global_step": 445150, "epoch": 2649} {"train_loss": -10.323999404907227, "global_step": 445151, "epoch": 2649} {"train_loss": -12.336645126342773, "global_step": 445152, "epoch": 2649} {"train_loss": -10.249561309814453, "global_step": 445153, "epoch": 2649} {"train_loss": -12.815589904785156, "global_step": 445154, "epoch": 2649} {"train_loss": -10.161272048950195, "global_step": 445155, "epoch": 2649} {"train_loss": -10.250160217285156, "global_step": 445156, "epoch": 2649} {"train_loss": -8.675148010253906, "global_step": 445157, "epoch": 2649} {"train_loss": -10.397281646728516, "global_step": 445158, "epoch": 2649} {"train_loss": -9.33298397064209, "global_step": 445159, "epoch": 2649} {"train_loss": -9.046499252319336, "global_step": 445160, "epoch": 2649} {"train_loss": -10.149823188781738, "global_step": 445161, "epoch": 2649} {"train_loss": -10.078757286071777, "global_step": 445162, "epoch": 2649} {"train_loss": -10.415395736694336, "global_step": 445163, "epoch": 2649} {"train_loss": -10.064720153808594, "global_step": 445164, "epoch": 2649} {"train_loss": -10.863985061645508, "global_step": 445165, "epoch": 2649} {"train_loss": -10.447521209716797, "global_step": 445166, "epoch": 2649} {"train_loss": -10.846733093261719, "global_step": 445167, "epoch": 2649} {"train_loss": -10.99538803100586, "global_step": 445168, "epoch": 2649} {"train_loss": -10.35921573638916, "global_step": 445169, "epoch": 2649} {"train_loss": -11.325167655944824, "global_step": 445170, "epoch": 2649} {"train_loss": -10.838395118713379, "global_step": 445171, "epoch": 2649} {"train_loss": -10.879928588867188, "global_step": 445172, "epoch": 2649} {"train_loss": -10.894728660583496, "global_step": 445173, "epoch": 2649} {"train_loss": -11.05433464050293, "global_step": 445174, "epoch": 2649} {"train_loss": -11.56385612487793, "global_step": 445175, "epoch": 2649} {"train_loss": -10.71126937866211, "global_step": 445176, "epoch": 2649} {"train_loss": -11.66758918762207, "global_step": 445177, "epoch": 2649} {"train_loss": -10.67989730834961, "global_step": 445178, "epoch": 2649} {"train_loss": -12.16518783569336, "global_step": 445179, "epoch": 2649} {"train_loss": -10.496543884277344, "global_step": 445180, "epoch": 2649} {"train_loss": -11.512699127197266, "global_step": 445181, "epoch": 2649} {"train_loss": -11.170936584472656, "global_step": 445182, "epoch": 2649} {"train_loss": -11.792673110961914, "global_step": 445183, "epoch": 2649} {"train_loss": -11.951484680175781, "global_step": 445184, "epoch": 2649} {"train_loss": -11.916624069213867, "global_step": 445185, "epoch": 2649} {"train_loss": -11.230402946472168, "global_step": 445186, "epoch": 2649} {"train_loss": -11.504063606262207, "global_step": 445187, "epoch": 2649} {"train_loss": -10.860953330993652, "global_step": 445188, "epoch": 2649} {"train_loss": -11.543631553649902, "global_step": 445189, "epoch": 2649} {"train_loss": -11.884195327758789, "global_step": 445190, "epoch": 2649} {"train_loss": -11.259613037109375, "global_step": 445191, "epoch": 2649} {"train_loss": -11.9296875, "global_step": 445192, "epoch": 2649} {"train_loss": -11.138382911682129, "global_step": 445193, "epoch": 2649} {"train_loss": -11.614568710327148, "global_step": 445194, "epoch": 2649} {"train_loss": -10.994673728942871, "global_step": 445195, "epoch": 2649} {"train_loss": -12.05562973022461, "global_step": 445196, "epoch": 2649} {"train_loss": -11.4959716796875, "global_step": 445197, "epoch": 2649} {"train_loss": -11.486276626586914, "global_step": 445198, "epoch": 2649} {"train_loss": -11.928995807965597, "global_step": 445199, "epoch": 2649, "val_loss": 316620.53125} {"train_loss": -12.19285774230957, "global_step": 445200, "epoch": 2650} {"train_loss": -11.303512573242188, "global_step": 445201, "epoch": 2650} {"train_loss": -12.073881149291992, "global_step": 445202, "epoch": 2650} {"train_loss": -11.840972900390625, "global_step": 445203, "epoch": 2650} {"train_loss": -11.525418281555176, "global_step": 445204, "epoch": 2650} {"train_loss": -11.845178604125977, "global_step": 445205, "epoch": 2650} {"train_loss": -12.072440147399902, "global_step": 445206, "epoch": 2650} {"train_loss": -11.898650169372559, "global_step": 445207, "epoch": 2650} {"train_loss": -12.100255966186523, "global_step": 445208, "epoch": 2650} {"train_loss": -12.24893569946289, "global_step": 445209, "epoch": 2650} {"train_loss": -12.229568481445312, "global_step": 445210, "epoch": 2650} {"train_loss": -12.172188758850098, "global_step": 445211, "epoch": 2650} {"train_loss": -12.291516304016113, "global_step": 445212, "epoch": 2650} {"train_loss": -12.203839302062988, "global_step": 445213, "epoch": 2650} {"train_loss": -12.474544525146484, "global_step": 445214, "epoch": 2650} {"train_loss": -12.328843116760254, "global_step": 445215, "epoch": 2650} {"train_loss": -12.314020156860352, "global_step": 445216, "epoch": 2650} {"train_loss": -12.281445503234863, "global_step": 445217, "epoch": 2650} {"train_loss": -12.101168632507324, "global_step": 445218, "epoch": 2650} {"train_loss": -12.470402717590332, "global_step": 445219, "epoch": 2650} {"train_loss": -12.36181354522705, "global_step": 445220, "epoch": 2650} {"train_loss": -12.403264999389648, "global_step": 445221, "epoch": 2650} {"train_loss": -12.469111442565918, "global_step": 445222, "epoch": 2650} {"train_loss": -12.46771240234375, "global_step": 445223, "epoch": 2650} {"train_loss": -12.426986694335938, "global_step": 445224, "epoch": 2650} {"train_loss": -12.182819366455078, "global_step": 445225, "epoch": 2650} {"train_loss": -12.137594223022461, "global_step": 445226, "epoch": 2650} {"train_loss": -12.522455215454102, "global_step": 445227, "epoch": 2650} {"train_loss": -12.209835052490234, "global_step": 445228, "epoch": 2650} {"train_loss": -12.662742614746094, "global_step": 445229, "epoch": 2650} {"train_loss": -12.207009315490723, "global_step": 445230, "epoch": 2650} {"train_loss": -12.416791915893555, "global_step": 445231, "epoch": 2650} {"train_loss": -12.63594913482666, "global_step": 445232, "epoch": 2650} {"train_loss": -12.418851852416992, "global_step": 445233, "epoch": 2650} {"train_loss": -12.543328285217285, "global_step": 445234, "epoch": 2650} {"train_loss": -12.544855117797852, "global_step": 445235, "epoch": 2650} {"train_loss": -12.432533264160156, "global_step": 445236, "epoch": 2650} {"train_loss": -12.332045555114746, "global_step": 445237, "epoch": 2650} {"train_loss": -12.332911491394043, "global_step": 445238, "epoch": 2650} {"train_loss": -12.42437744140625, "global_step": 445239, "epoch": 2650} {"train_loss": -12.721691131591797, "global_step": 445240, "epoch": 2650} {"train_loss": -12.305614471435547, "global_step": 445241, "epoch": 2650} {"train_loss": -12.660140991210938, "global_step": 445242, "epoch": 2650} {"train_loss": -12.664297103881836, "global_step": 445243, "epoch": 2650} {"train_loss": -12.51760196685791, "global_step": 445244, "epoch": 2650} {"train_loss": -12.704557418823242, "global_step": 445245, "epoch": 2650} {"train_loss": -12.827698707580566, "global_step": 445246, "epoch": 2650} {"train_loss": -12.493220329284668, "global_step": 445247, "epoch": 2650} {"train_loss": -12.601940155029297, "global_step": 445248, "epoch": 2650} {"train_loss": -12.765532493591309, "global_step": 445249, "epoch": 2650} {"train_loss": -12.50149154663086, "global_step": 445250, "epoch": 2650} {"train_loss": -12.601276397705078, "global_step": 445251, "epoch": 2650} {"train_loss": -12.371074676513672, "global_step": 445252, "epoch": 2650} {"train_loss": -12.37144660949707, "global_step": 445253, "epoch": 2650} {"train_loss": -12.498620986938477, "global_step": 445254, "epoch": 2650} {"train_loss": -11.980775833129883, "global_step": 445255, "epoch": 2650} {"train_loss": -12.35303020477295, "global_step": 445256, "epoch": 2650} {"train_loss": -12.293853759765625, "global_step": 445257, "epoch": 2650} {"train_loss": -12.292808532714844, "global_step": 445258, "epoch": 2650} {"train_loss": -12.329858779907227, "global_step": 445259, "epoch": 2650} {"train_loss": -12.398383140563965, "global_step": 445260, "epoch": 2650} {"train_loss": -12.620946884155273, "global_step": 445261, "epoch": 2650} {"train_loss": -12.286226272583008, "global_step": 445262, "epoch": 2650} {"train_loss": -12.32835578918457, "global_step": 445263, "epoch": 2650} {"train_loss": -12.591421127319336, "global_step": 445264, "epoch": 2650} {"train_loss": -11.795764923095703, "global_step": 445265, "epoch": 2650} {"train_loss": -12.19255542755127, "global_step": 445266, "epoch": 2650} {"train_loss": -12.532356262207031, "global_step": 445267, "epoch": 2650} {"train_loss": -12.368919372558594, "global_step": 445268, "epoch": 2650} {"train_loss": -12.644340515136719, "global_step": 445269, "epoch": 2650} {"train_loss": -12.090770721435547, "global_step": 445270, "epoch": 2650} {"train_loss": -12.814072608947754, "global_step": 445271, "epoch": 2650} {"train_loss": -12.196826934814453, "global_step": 445272, "epoch": 2650} {"train_loss": -12.484504699707031, "global_step": 445273, "epoch": 2650} {"train_loss": -12.475886344909668, "global_step": 445274, "epoch": 2650} {"train_loss": -12.322808265686035, "global_step": 445275, "epoch": 2650} {"train_loss": -12.76522445678711, "global_step": 445276, "epoch": 2650} {"train_loss": -12.4631929397583, "global_step": 445277, "epoch": 2650} {"train_loss": -12.465532302856445, "global_step": 445278, "epoch": 2650} {"train_loss": -12.51368236541748, "global_step": 445279, "epoch": 2650} {"train_loss": -12.600539207458496, "global_step": 445280, "epoch": 2650} {"train_loss": -12.808820724487305, "global_step": 445281, "epoch": 2650} {"train_loss": -12.478168487548828, "global_step": 445282, "epoch": 2650} {"train_loss": -12.667350769042969, "global_step": 445283, "epoch": 2650} {"train_loss": -12.2581787109375, "global_step": 445284, "epoch": 2650} {"train_loss": -12.58777904510498, "global_step": 445285, "epoch": 2650} {"train_loss": -12.527722358703613, "global_step": 445286, "epoch": 2650} {"train_loss": -12.635992050170898, "global_step": 445287, "epoch": 2650} {"train_loss": -12.359323501586914, "global_step": 445288, "epoch": 2650} {"train_loss": -12.739827156066895, "global_step": 445289, "epoch": 2650} {"train_loss": -12.29604721069336, "global_step": 445290, "epoch": 2650} {"train_loss": -12.20287799835205, "global_step": 445291, "epoch": 2650} {"train_loss": -13.001123428344727, "global_step": 445292, "epoch": 2650} {"train_loss": -12.154674530029297, "global_step": 445293, "epoch": 2650} {"train_loss": -12.173982620239258, "global_step": 445294, "epoch": 2650} {"train_loss": -12.969328880310059, "global_step": 445295, "epoch": 2650} {"train_loss": -12.218178749084473, "global_step": 445296, "epoch": 2650} {"train_loss": -12.01417350769043, "global_step": 445297, "epoch": 2650} {"train_loss": -12.558699607849121, "global_step": 445298, "epoch": 2650} {"train_loss": -12.186962127685547, "global_step": 445299, "epoch": 2650} {"train_loss": -11.582947731018066, "global_step": 445300, "epoch": 2650} {"train_loss": -12.591687202453613, "global_step": 445301, "epoch": 2650} {"train_loss": -11.79764461517334, "global_step": 445302, "epoch": 2650} {"train_loss": -12.607789993286133, "global_step": 445303, "epoch": 2650} {"train_loss": -12.355941772460938, "global_step": 445304, "epoch": 2650} {"train_loss": -12.251931190490723, "global_step": 445305, "epoch": 2650} {"train_loss": -12.751660346984863, "global_step": 445306, "epoch": 2650} {"train_loss": -11.954050064086914, "global_step": 445307, "epoch": 2650} {"train_loss": -12.324946403503418, "global_step": 445308, "epoch": 2650} {"train_loss": -12.445999145507812, "global_step": 445309, "epoch": 2650} {"train_loss": -12.071940422058105, "global_step": 445310, "epoch": 2650} {"train_loss": -12.667384147644043, "global_step": 445311, "epoch": 2650} {"train_loss": -12.340968132019043, "global_step": 445312, "epoch": 2650} {"train_loss": -12.53273868560791, "global_step": 445313, "epoch": 2650} {"train_loss": -12.244840621948242, "global_step": 445314, "epoch": 2650} {"train_loss": -12.691169738769531, "global_step": 445315, "epoch": 2650} {"train_loss": -12.335930824279785, "global_step": 445316, "epoch": 2650} {"train_loss": -12.642701148986816, "global_step": 445317, "epoch": 2650} {"train_loss": -12.672040939331055, "global_step": 445318, "epoch": 2650} {"train_loss": -12.650774002075195, "global_step": 445319, "epoch": 2650} {"train_loss": -12.803512573242188, "global_step": 445320, "epoch": 2650} {"train_loss": -12.782203674316406, "global_step": 445321, "epoch": 2650} {"train_loss": -12.522075653076172, "global_step": 445322, "epoch": 2650} {"train_loss": -12.57335376739502, "global_step": 445323, "epoch": 2650} {"train_loss": -12.420896530151367, "global_step": 445324, "epoch": 2650} {"train_loss": -12.790407180786133, "global_step": 445325, "epoch": 2650} {"train_loss": -12.191646575927734, "global_step": 445326, "epoch": 2650} {"train_loss": -12.688605308532715, "global_step": 445327, "epoch": 2650} {"train_loss": -12.17822551727295, "global_step": 445328, "epoch": 2650} {"train_loss": -11.935188293457031, "global_step": 445329, "epoch": 2650} {"train_loss": -12.122432708740234, "global_step": 445330, "epoch": 2650} {"train_loss": -12.38278579711914, "global_step": 445331, "epoch": 2650} {"train_loss": -12.553695678710938, "global_step": 445332, "epoch": 2650} {"train_loss": -12.332290649414062, "global_step": 445333, "epoch": 2650} {"train_loss": -11.83288288116455, "global_step": 445334, "epoch": 2650} {"train_loss": -12.830353736877441, "global_step": 445335, "epoch": 2650} {"train_loss": -12.187532424926758, "global_step": 445336, "epoch": 2650} {"train_loss": -12.308736801147461, "global_step": 445337, "epoch": 2650} {"train_loss": -12.523874282836914, "global_step": 445338, "epoch": 2650} {"train_loss": -12.230055809020996, "global_step": 445339, "epoch": 2650} {"train_loss": -11.724687576293945, "global_step": 445340, "epoch": 2650} {"train_loss": -12.230598449707031, "global_step": 445341, "epoch": 2650} {"train_loss": -11.71185302734375, "global_step": 445342, "epoch": 2650} {"train_loss": -11.475225448608398, "global_step": 445343, "epoch": 2650} {"train_loss": -12.503999710083008, "global_step": 445344, "epoch": 2650} {"train_loss": -12.394941329956055, "global_step": 445345, "epoch": 2650} {"train_loss": -11.172240257263184, "global_step": 445346, "epoch": 2650} {"train_loss": -12.3599271774292, "global_step": 445347, "epoch": 2650} {"train_loss": -10.919792175292969, "global_step": 445348, "epoch": 2650} {"train_loss": -10.637594223022461, "global_step": 445349, "epoch": 2650} {"train_loss": -12.41821575164795, "global_step": 445350, "epoch": 2650} {"train_loss": -11.500110626220703, "global_step": 445351, "epoch": 2650} {"train_loss": -11.61703109741211, "global_step": 445352, "epoch": 2650} {"train_loss": -12.296619415283203, "global_step": 445353, "epoch": 2650} {"train_loss": -11.895951271057129, "global_step": 445354, "epoch": 2650} {"train_loss": -11.683320999145508, "global_step": 445355, "epoch": 2650} {"train_loss": -10.542630195617676, "global_step": 445356, "epoch": 2650} {"train_loss": -12.166376113891602, "global_step": 445357, "epoch": 2650} {"train_loss": -11.801605224609375, "global_step": 445358, "epoch": 2650} {"train_loss": -11.553378105163574, "global_step": 445359, "epoch": 2650} {"train_loss": -12.681143760681152, "global_step": 445360, "epoch": 2650} {"train_loss": -12.097593307495117, "global_step": 445361, "epoch": 2650} {"train_loss": -11.88907241821289, "global_step": 445362, "epoch": 2650} {"train_loss": -12.52810287475586, "global_step": 445363, "epoch": 2650} {"train_loss": -12.335359573364258, "global_step": 445364, "epoch": 2650} {"train_loss": -12.031037330627441, "global_step": 445365, "epoch": 2650} {"train_loss": -12.136896133422852, "global_step": 445366, "epoch": 2650} {"train_loss": -12.296249980018253, "global_step": 445367, "epoch": 2650, "train/sim_max_reward_0": 0.677970568470611, "train/sim_max_reward_1": 0.9712715005360866, "train/sim_max_reward_2": 0.0021132379135489483, "train/sim_max_reward_3": 0.43014619764431244, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.5341327270952592, "test/sim_max_reward_4400000": 0.9930281095026862, "test/sim_max_reward_4400001": 0.34443609331815783, "test/sim_max_reward_4400002": 0.9916155328019637, "test/sim_max_reward_4400003": 0.9051798442641055, "test/sim_max_reward_4400004": 0.4077665111247232, "test/sim_max_reward_4400005": 0.5490056889630048, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.9683111189220411, "test/sim_max_reward_4400008": 0.611334808048501, "test/sim_max_reward_4400009": 0.38652780546614374, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.2586657740887651, "test/sim_max_reward_4400012": 0.14110722128947978, "test/sim_max_reward_4400013": 0.9995858024289409, "test/sim_max_reward_4400014": 0.9986604539344006, "test/sim_max_reward_4400015": 0.44980708757319776, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.8475669576737537, "test/sim_max_reward_4400019": 0.3843439472897075, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.9047541856838786, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.3518540875803431, "test/sim_max_reward_4400025": 0.5190853848178105, "test/sim_max_reward_4400026": 0.07684640752236192, "test/sim_max_reward_4400027": 0.31357038002967075, "test/sim_max_reward_4400028": 0.7188224623092653, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9455886512053805, "test/sim_max_reward_4400031": 0.9815691737837237, "test/sim_max_reward_4400032": 0.172395354537494, "test/sim_max_reward_4400033": 0.3668105953834192, "test/sim_max_reward_4400034": 0.4495518976842609, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.363718004248909, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.281545972483768, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.17229656548764277, "test/sim_max_reward_4400042": 0.5207351758278069, "test/sim_max_reward_4400043": 0.26514760473020876, "test/sim_max_reward_4400044": 0.09003919033464856, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.9757387682880695, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.3092185290520184, "train/mean_score": 0.6026057052766364, "test/mean_score": 0.49643471414653534, "val_loss": 313771.21875, "train_action_mse_error": 1.4790985584259033} {"train_loss": -11.962414741516113, "global_step": 445368, "epoch": 2651} {"train_loss": -12.606117248535156, "global_step": 445369, "epoch": 2651} {"train_loss": -12.106939315795898, "global_step": 445370, "epoch": 2651} {"train_loss": -12.252161979675293, "global_step": 445371, "epoch": 2651} {"train_loss": -12.303661346435547, "global_step": 445372, "epoch": 2651} {"train_loss": -11.981979370117188, "global_step": 445373, "epoch": 2651} {"train_loss": -12.368656158447266, "global_step": 445374, "epoch": 2651} {"train_loss": -11.913009643554688, "global_step": 445375, "epoch": 2651} {"train_loss": -12.362337112426758, "global_step": 445376, "epoch": 2651} {"train_loss": -12.616373062133789, "global_step": 445377, "epoch": 2651} {"train_loss": -12.509081840515137, "global_step": 445378, "epoch": 2651} {"train_loss": -12.4248628616333, "global_step": 445379, "epoch": 2651} {"train_loss": -12.53043270111084, "global_step": 445380, "epoch": 2651} {"train_loss": -12.179370880126953, "global_step": 445381, "epoch": 2651} {"train_loss": -12.640949249267578, "global_step": 445382, "epoch": 2651} {"train_loss": -12.403215408325195, "global_step": 445383, "epoch": 2651} {"train_loss": -12.522007942199707, "global_step": 445384, "epoch": 2651} {"train_loss": -12.160143852233887, "global_step": 445385, "epoch": 2651} {"train_loss": -12.37697982788086, "global_step": 445386, "epoch": 2651} {"train_loss": -12.647153854370117, "global_step": 445387, "epoch": 2651} {"train_loss": -12.442359924316406, "global_step": 445388, "epoch": 2651} {"train_loss": -12.613996505737305, "global_step": 445389, "epoch": 2651} {"train_loss": -12.07401180267334, "global_step": 445390, "epoch": 2651} {"train_loss": -11.639314651489258, "global_step": 445391, "epoch": 2651} {"train_loss": -12.684154510498047, "global_step": 445392, "epoch": 2651} {"train_loss": -12.08473014831543, "global_step": 445393, "epoch": 2651} {"train_loss": -12.566337585449219, "global_step": 445394, "epoch": 2651} {"train_loss": -12.62458610534668, "global_step": 445395, "epoch": 2651} {"train_loss": -12.578319549560547, "global_step": 445396, "epoch": 2651} {"train_loss": -11.909183502197266, "global_step": 445397, "epoch": 2651} {"train_loss": -12.275308609008789, "global_step": 445398, "epoch": 2651} {"train_loss": -12.02995777130127, "global_step": 445399, "epoch": 2651} {"train_loss": -12.664056777954102, "global_step": 445400, "epoch": 2651} {"train_loss": -11.439559936523438, "global_step": 445401, "epoch": 2651} {"train_loss": -12.04966926574707, "global_step": 445402, "epoch": 2651} {"train_loss": -12.307638168334961, "global_step": 445403, "epoch": 2651} {"train_loss": -12.74281120300293, "global_step": 445404, "epoch": 2651} {"train_loss": -12.317852020263672, "global_step": 445405, "epoch": 2651} {"train_loss": -12.598400115966797, "global_step": 445406, "epoch": 2651} {"train_loss": -12.528487205505371, "global_step": 445407, "epoch": 2651} {"train_loss": -12.558021545410156, "global_step": 445408, "epoch": 2651} {"train_loss": -12.425048828125, "global_step": 445409, "epoch": 2651} {"train_loss": -12.568300247192383, "global_step": 445410, "epoch": 2651} {"train_loss": -12.295875549316406, "global_step": 445411, "epoch": 2651} {"train_loss": -12.655391693115234, "global_step": 445412, "epoch": 2651} {"train_loss": -12.224377632141113, "global_step": 445413, "epoch": 2651} {"train_loss": -11.997276306152344, "global_step": 445414, "epoch": 2651} {"train_loss": -12.543740272521973, "global_step": 445415, "epoch": 2651} {"train_loss": -11.12787914276123, "global_step": 445416, "epoch": 2651} {"train_loss": -12.308923721313477, "global_step": 445417, "epoch": 2651} {"train_loss": -12.188434600830078, "global_step": 445418, "epoch": 2651} {"train_loss": -11.858345031738281, "global_step": 445419, "epoch": 2651} {"train_loss": -12.584571838378906, "global_step": 445420, "epoch": 2651} {"train_loss": -12.564432144165039, "global_step": 445421, "epoch": 2651} {"train_loss": -12.103100776672363, "global_step": 445422, "epoch": 2651} {"train_loss": -12.717475891113281, "global_step": 445423, "epoch": 2651} {"train_loss": -12.266987800598145, "global_step": 445424, "epoch": 2651} {"train_loss": -12.48165225982666, "global_step": 445425, "epoch": 2651} {"train_loss": -12.58890151977539, "global_step": 445426, "epoch": 2651} {"train_loss": -11.856706619262695, "global_step": 445427, "epoch": 2651} {"train_loss": -12.342931747436523, "global_step": 445428, "epoch": 2651} {"train_loss": -12.750144958496094, "global_step": 445429, "epoch": 2651} {"train_loss": -12.206804275512695, "global_step": 445430, "epoch": 2651} {"train_loss": -12.36101245880127, "global_step": 445431, "epoch": 2651} {"train_loss": -12.728265762329102, "global_step": 445432, "epoch": 2651} {"train_loss": -12.455083847045898, "global_step": 445433, "epoch": 2651} {"train_loss": -12.036903381347656, "global_step": 445434, "epoch": 2651} {"train_loss": -12.18408203125, "global_step": 445435, "epoch": 2651} {"train_loss": -12.25370979309082, "global_step": 445436, "epoch": 2651} {"train_loss": -11.76608657836914, "global_step": 445437, "epoch": 2651} {"train_loss": -12.536108016967773, "global_step": 445438, "epoch": 2651} {"train_loss": -11.777556419372559, "global_step": 445439, "epoch": 2651} {"train_loss": -12.560111045837402, "global_step": 445440, "epoch": 2651} {"train_loss": -12.10714054107666, "global_step": 445441, "epoch": 2651} {"train_loss": -12.716011047363281, "global_step": 445442, "epoch": 2651} {"train_loss": -12.479358673095703, "global_step": 445443, "epoch": 2651} {"train_loss": -12.831626892089844, "global_step": 445444, "epoch": 2651} {"train_loss": -12.414594650268555, "global_step": 445445, "epoch": 2651} {"train_loss": -12.950286865234375, "global_step": 445446, "epoch": 2651} {"train_loss": -12.49545669555664, "global_step": 445447, "epoch": 2651} {"train_loss": -12.681164741516113, "global_step": 445448, "epoch": 2651} {"train_loss": -12.43467903137207, "global_step": 445449, "epoch": 2651} {"train_loss": -12.66865062713623, "global_step": 445450, "epoch": 2651} {"train_loss": -12.989818572998047, "global_step": 445451, "epoch": 2651} {"train_loss": -12.533971786499023, "global_step": 445452, "epoch": 2651} {"train_loss": -12.807207107543945, "global_step": 445453, "epoch": 2651} {"train_loss": -12.943349838256836, "global_step": 445454, "epoch": 2651} {"train_loss": -12.75693130493164, "global_step": 445455, "epoch": 2651} {"train_loss": -12.68765926361084, "global_step": 445456, "epoch": 2651} {"train_loss": -12.792367935180664, "global_step": 445457, "epoch": 2651} {"train_loss": -12.472654342651367, "global_step": 445458, "epoch": 2651} {"train_loss": -12.796022415161133, "global_step": 445459, "epoch": 2651} {"train_loss": -12.55521011352539, "global_step": 445460, "epoch": 2651} {"train_loss": -12.005668640136719, "global_step": 445461, "epoch": 2651} {"train_loss": -12.423559188842773, "global_step": 445462, "epoch": 2651} {"train_loss": -12.74754524230957, "global_step": 445463, "epoch": 2651} {"train_loss": -12.067962646484375, "global_step": 445464, "epoch": 2651} {"train_loss": -12.052604675292969, "global_step": 445465, "epoch": 2651} {"train_loss": -12.416278839111328, "global_step": 445466, "epoch": 2651} {"train_loss": -12.225671768188477, "global_step": 445467, "epoch": 2651} {"train_loss": -11.965627670288086, "global_step": 445468, "epoch": 2651} {"train_loss": -12.334646224975586, "global_step": 445469, "epoch": 2651} {"train_loss": -12.296015739440918, "global_step": 445470, "epoch": 2651} {"train_loss": -12.597840309143066, "global_step": 445471, "epoch": 2651} {"train_loss": -12.6135835647583, "global_step": 445472, "epoch": 2651} {"train_loss": -12.642921447753906, "global_step": 445473, "epoch": 2651} {"train_loss": -12.734636306762695, "global_step": 445474, "epoch": 2651} {"train_loss": -12.368169784545898, "global_step": 445475, "epoch": 2651} {"train_loss": -12.485761642456055, "global_step": 445476, "epoch": 2651} {"train_loss": -12.747604370117188, "global_step": 445477, "epoch": 2651} {"train_loss": -12.538825988769531, "global_step": 445478, "epoch": 2651} {"train_loss": -12.893341064453125, "global_step": 445479, "epoch": 2651} {"train_loss": -12.753825187683105, "global_step": 445480, "epoch": 2651} {"train_loss": -12.408523559570312, "global_step": 445481, "epoch": 2651} {"train_loss": -12.64681625366211, "global_step": 445482, "epoch": 2651} {"train_loss": -12.630589485168457, "global_step": 445483, "epoch": 2651} {"train_loss": -12.57433032989502, "global_step": 445484, "epoch": 2651} {"train_loss": -12.84981632232666, "global_step": 445485, "epoch": 2651} {"train_loss": -12.650632858276367, "global_step": 445486, "epoch": 2651} {"train_loss": -11.763139724731445, "global_step": 445487, "epoch": 2651} {"train_loss": -12.569988250732422, "global_step": 445488, "epoch": 2651} {"train_loss": -12.506341934204102, "global_step": 445489, "epoch": 2651} {"train_loss": -12.135961532592773, "global_step": 445490, "epoch": 2651} {"train_loss": -12.169570922851562, "global_step": 445491, "epoch": 2651} {"train_loss": -12.890739440917969, "global_step": 445492, "epoch": 2651} {"train_loss": -12.07095718383789, "global_step": 445493, "epoch": 2651} {"train_loss": -11.89222526550293, "global_step": 445494, "epoch": 2651} {"train_loss": -12.408287048339844, "global_step": 445495, "epoch": 2651} {"train_loss": -12.736296653747559, "global_step": 445496, "epoch": 2651} {"train_loss": -11.991134643554688, "global_step": 445497, "epoch": 2651} {"train_loss": -11.968748092651367, "global_step": 445498, "epoch": 2651} {"train_loss": -12.622591972351074, "global_step": 445499, "epoch": 2651} {"train_loss": -12.300548553466797, "global_step": 445500, "epoch": 2651} {"train_loss": -12.423025131225586, "global_step": 445501, "epoch": 2651} {"train_loss": -12.232305526733398, "global_step": 445502, "epoch": 2651} {"train_loss": -12.042886734008789, "global_step": 445503, "epoch": 2651} {"train_loss": -12.341381072998047, "global_step": 445504, "epoch": 2651} {"train_loss": -12.343375205993652, "global_step": 445505, "epoch": 2651} {"train_loss": -12.096803665161133, "global_step": 445506, "epoch": 2651} {"train_loss": -11.423458099365234, "global_step": 445507, "epoch": 2651} {"train_loss": -12.583980560302734, "global_step": 445508, "epoch": 2651} {"train_loss": -12.305231094360352, "global_step": 445509, "epoch": 2651} {"train_loss": -12.281816482543945, "global_step": 445510, "epoch": 2651} {"train_loss": -12.596309661865234, "global_step": 445511, "epoch": 2651} {"train_loss": -12.356388092041016, "global_step": 445512, "epoch": 2651} {"train_loss": -12.345947265625, "global_step": 445513, "epoch": 2651} {"train_loss": -12.214889526367188, "global_step": 445514, "epoch": 2651} {"train_loss": -12.38336181640625, "global_step": 445515, "epoch": 2651} {"train_loss": -11.572816848754883, "global_step": 445516, "epoch": 2651} {"train_loss": -11.772733688354492, "global_step": 445517, "epoch": 2651} {"train_loss": -12.093645095825195, "global_step": 445518, "epoch": 2651} {"train_loss": -11.82746696472168, "global_step": 445519, "epoch": 2651} {"train_loss": -12.381725311279297, "global_step": 445520, "epoch": 2651} {"train_loss": -11.836162567138672, "global_step": 445521, "epoch": 2651} {"train_loss": -11.3887939453125, "global_step": 445522, "epoch": 2651} {"train_loss": -12.579771041870117, "global_step": 445523, "epoch": 2651} {"train_loss": -11.829446792602539, "global_step": 445524, "epoch": 2651} {"train_loss": -12.202775955200195, "global_step": 445525, "epoch": 2651} {"train_loss": -12.286306381225586, "global_step": 445526, "epoch": 2651} {"train_loss": -12.063358306884766, "global_step": 445527, "epoch": 2651} {"train_loss": -12.275129318237305, "global_step": 445528, "epoch": 2651} {"train_loss": -12.501888275146484, "global_step": 445529, "epoch": 2651} {"train_loss": -12.630112648010254, "global_step": 445530, "epoch": 2651} {"train_loss": -12.521896362304688, "global_step": 445531, "epoch": 2651} {"train_loss": -12.461548805236816, "global_step": 445532, "epoch": 2651} {"train_loss": -12.343914031982422, "global_step": 445533, "epoch": 2651} {"train_loss": -12.479734420776367, "global_step": 445534, "epoch": 2651} {"train_loss": -12.35729417914436, "global_step": 445535, "epoch": 2651, "val_loss": 312826.40625} {"train_loss": -12.533721923828125, "global_step": 445536, "epoch": 2652} {"train_loss": -12.448095321655273, "global_step": 445537, "epoch": 2652} {"train_loss": -12.46948528289795, "global_step": 445538, "epoch": 2652} {"train_loss": -12.505467414855957, "global_step": 445539, "epoch": 2652} {"train_loss": -12.79538345336914, "global_step": 445540, "epoch": 2652} {"train_loss": -12.12602424621582, "global_step": 445541, "epoch": 2652} {"train_loss": -12.46227741241455, "global_step": 445542, "epoch": 2652} {"train_loss": -12.253491401672363, "global_step": 445543, "epoch": 2652} {"train_loss": -12.377325057983398, "global_step": 445544, "epoch": 2652} {"train_loss": -12.136323928833008, "global_step": 445545, "epoch": 2652} {"train_loss": -12.527600288391113, "global_step": 445546, "epoch": 2652} {"train_loss": -12.5234956741333, "global_step": 445547, "epoch": 2652} {"train_loss": -12.418410301208496, "global_step": 445548, "epoch": 2652} {"train_loss": -12.340466499328613, "global_step": 445549, "epoch": 2652} {"train_loss": -12.111851692199707, "global_step": 445550, "epoch": 2652} {"train_loss": -10.95522689819336, "global_step": 445551, "epoch": 2652} {"train_loss": -10.681160926818848, "global_step": 445552, "epoch": 2652} {"train_loss": -12.154125213623047, "global_step": 445553, "epoch": 2652} {"train_loss": -10.6810941696167, "global_step": 445554, "epoch": 2652} {"train_loss": -11.155315399169922, "global_step": 445555, "epoch": 2652} {"train_loss": -11.358407020568848, "global_step": 445556, "epoch": 2652} {"train_loss": -10.430205345153809, "global_step": 445557, "epoch": 2652} {"train_loss": -12.331575393676758, "global_step": 445558, "epoch": 2652} {"train_loss": -10.057395935058594, "global_step": 445559, "epoch": 2652} {"train_loss": -10.715742111206055, "global_step": 445560, "epoch": 2652} {"train_loss": -11.55868911743164, "global_step": 445561, "epoch": 2652} {"train_loss": -10.598840713500977, "global_step": 445562, "epoch": 2652} {"train_loss": -11.857349395751953, "global_step": 445563, "epoch": 2652} {"train_loss": -11.068140029907227, "global_step": 445564, "epoch": 2652} {"train_loss": -11.837300300598145, "global_step": 445565, "epoch": 2652} {"train_loss": -10.715030670166016, "global_step": 445566, "epoch": 2652} {"train_loss": -12.446024894714355, "global_step": 445567, "epoch": 2652} {"train_loss": -11.168793678283691, "global_step": 445568, "epoch": 2652} {"train_loss": -11.100505828857422, "global_step": 445569, "epoch": 2652} {"train_loss": -11.603668212890625, "global_step": 445570, "epoch": 2652} {"train_loss": -12.13315200805664, "global_step": 445571, "epoch": 2652} {"train_loss": -10.876435279846191, "global_step": 445572, "epoch": 2652} {"train_loss": -10.743498802185059, "global_step": 445573, "epoch": 2652} {"train_loss": -11.585212707519531, "global_step": 445574, "epoch": 2652} {"train_loss": -11.173235893249512, "global_step": 445575, "epoch": 2652} {"train_loss": -11.286161422729492, "global_step": 445576, "epoch": 2652} {"train_loss": -10.403496742248535, "global_step": 445577, "epoch": 2652} {"train_loss": -12.00651741027832, "global_step": 445578, "epoch": 2652} {"train_loss": -10.37218952178955, "global_step": 445579, "epoch": 2652} {"train_loss": -11.374951362609863, "global_step": 445580, "epoch": 2652} {"train_loss": -11.224297523498535, "global_step": 445581, "epoch": 2652} {"train_loss": -10.716644287109375, "global_step": 445582, "epoch": 2652} {"train_loss": -12.178951263427734, "global_step": 445583, "epoch": 2652} {"train_loss": -10.375470161437988, "global_step": 445584, "epoch": 2652} {"train_loss": -11.951507568359375, "global_step": 445585, "epoch": 2652} {"train_loss": -11.191917419433594, "global_step": 445586, "epoch": 2652} {"train_loss": -11.745773315429688, "global_step": 445587, "epoch": 2652} {"train_loss": -11.352380752563477, "global_step": 445588, "epoch": 2652} {"train_loss": -11.28089714050293, "global_step": 445589, "epoch": 2652} {"train_loss": -11.740885734558105, "global_step": 445590, "epoch": 2652} {"train_loss": -11.600141525268555, "global_step": 445591, "epoch": 2652} {"train_loss": -11.965398788452148, "global_step": 445592, "epoch": 2652} {"train_loss": -11.793292999267578, "global_step": 445593, "epoch": 2652} {"train_loss": -11.897294998168945, "global_step": 445594, "epoch": 2652} {"train_loss": -11.760723114013672, "global_step": 445595, "epoch": 2652} {"train_loss": -12.119020462036133, "global_step": 445596, "epoch": 2652} {"train_loss": -11.923805236816406, "global_step": 445597, "epoch": 2652} {"train_loss": -11.929637908935547, "global_step": 445598, "epoch": 2652} {"train_loss": -11.789709091186523, "global_step": 445599, "epoch": 2652} {"train_loss": -12.263053894042969, "global_step": 445600, "epoch": 2652} {"train_loss": -11.943168640136719, "global_step": 445601, "epoch": 2652} {"train_loss": -12.20887565612793, "global_step": 445602, "epoch": 2652} {"train_loss": -11.875213623046875, "global_step": 445603, "epoch": 2652} {"train_loss": -12.145508766174316, "global_step": 445604, "epoch": 2652} {"train_loss": -12.091837882995605, "global_step": 445605, "epoch": 2652} {"train_loss": -11.776622772216797, "global_step": 445606, "epoch": 2652} {"train_loss": -12.30586051940918, "global_step": 445607, "epoch": 2652} {"train_loss": -12.18246841430664, "global_step": 445608, "epoch": 2652} {"train_loss": -12.32804012298584, "global_step": 445609, "epoch": 2652} {"train_loss": -12.030305862426758, "global_step": 445610, "epoch": 2652} {"train_loss": -12.502458572387695, "global_step": 445611, "epoch": 2652} {"train_loss": -12.257895469665527, "global_step": 445612, "epoch": 2652} {"train_loss": -12.543841361999512, "global_step": 445613, "epoch": 2652} {"train_loss": -12.203451156616211, "global_step": 445614, "epoch": 2652} {"train_loss": -12.522729873657227, "global_step": 445615, "epoch": 2652} {"train_loss": -12.214930534362793, "global_step": 445616, "epoch": 2652} {"train_loss": -12.490038871765137, "global_step": 445617, "epoch": 2652} {"train_loss": -12.16912841796875, "global_step": 445618, "epoch": 2652} {"train_loss": -12.203652381896973, "global_step": 445619, "epoch": 2652} {"train_loss": -12.289621353149414, "global_step": 445620, "epoch": 2652} {"train_loss": -12.237648963928223, "global_step": 445621, "epoch": 2652} {"train_loss": -12.632630348205566, "global_step": 445622, "epoch": 2652} {"train_loss": -12.16380500793457, "global_step": 445623, "epoch": 2652} {"train_loss": -12.520125389099121, "global_step": 445624, "epoch": 2652} {"train_loss": -12.564840316772461, "global_step": 445625, "epoch": 2652} {"train_loss": -12.714845657348633, "global_step": 445626, "epoch": 2652} {"train_loss": -12.41523265838623, "global_step": 445627, "epoch": 2652} {"train_loss": -12.609867095947266, "global_step": 445628, "epoch": 2652} {"train_loss": -12.500021934509277, "global_step": 445629, "epoch": 2652} {"train_loss": -12.717443466186523, "global_step": 445630, "epoch": 2652} {"train_loss": -12.445255279541016, "global_step": 445631, "epoch": 2652} {"train_loss": -12.896219253540039, "global_step": 445632, "epoch": 2652} {"train_loss": -12.614883422851562, "global_step": 445633, "epoch": 2652} {"train_loss": -12.9111328125, "global_step": 445634, "epoch": 2652} {"train_loss": -12.81196403503418, "global_step": 445635, "epoch": 2652} {"train_loss": -12.427887916564941, "global_step": 445636, "epoch": 2652} {"train_loss": -12.734477996826172, "global_step": 445637, "epoch": 2652} {"train_loss": -12.571474075317383, "global_step": 445638, "epoch": 2652} {"train_loss": -12.80211067199707, "global_step": 445639, "epoch": 2652} {"train_loss": -12.709084510803223, "global_step": 445640, "epoch": 2652} {"train_loss": -12.701597213745117, "global_step": 445641, "epoch": 2652} {"train_loss": -12.736227989196777, "global_step": 445642, "epoch": 2652} {"train_loss": -12.650371551513672, "global_step": 445643, "epoch": 2652} {"train_loss": -12.754323959350586, "global_step": 445644, "epoch": 2652} {"train_loss": -12.790102005004883, "global_step": 445645, "epoch": 2652} {"train_loss": -12.958976745605469, "global_step": 445646, "epoch": 2652} {"train_loss": -12.687399864196777, "global_step": 445647, "epoch": 2652} {"train_loss": -13.019533157348633, "global_step": 445648, "epoch": 2652} {"train_loss": -12.823406219482422, "global_step": 445649, "epoch": 2652} {"train_loss": -12.671707153320312, "global_step": 445650, "epoch": 2652} {"train_loss": -12.647143363952637, "global_step": 445651, "epoch": 2652} {"train_loss": -12.833642959594727, "global_step": 445652, "epoch": 2652} {"train_loss": -12.769333839416504, "global_step": 445653, "epoch": 2652} {"train_loss": -12.906768798828125, "global_step": 445654, "epoch": 2652} {"train_loss": -12.5867919921875, "global_step": 445655, "epoch": 2652} {"train_loss": -12.768850326538086, "global_step": 445656, "epoch": 2652} {"train_loss": -12.950918197631836, "global_step": 445657, "epoch": 2652} {"train_loss": -12.681493759155273, "global_step": 445658, "epoch": 2652} {"train_loss": -12.776942253112793, "global_step": 445659, "epoch": 2652} {"train_loss": -13.008091926574707, "global_step": 445660, "epoch": 2652} {"train_loss": -12.740718841552734, "global_step": 445661, "epoch": 2652} {"train_loss": -12.676005363464355, "global_step": 445662, "epoch": 2652} {"train_loss": -12.745231628417969, "global_step": 445663, "epoch": 2652} {"train_loss": -12.621725082397461, "global_step": 445664, "epoch": 2652} {"train_loss": -12.618121147155762, "global_step": 445665, "epoch": 2652} {"train_loss": -12.47912883758545, "global_step": 445666, "epoch": 2652} {"train_loss": -12.81226921081543, "global_step": 445667, "epoch": 2652} {"train_loss": -12.89177131652832, "global_step": 445668, "epoch": 2652} {"train_loss": -12.64072036743164, "global_step": 445669, "epoch": 2652} {"train_loss": -12.658287048339844, "global_step": 445670, "epoch": 2652} {"train_loss": -12.737577438354492, "global_step": 445671, "epoch": 2652} {"train_loss": -12.551860809326172, "global_step": 445672, "epoch": 2652} {"train_loss": -12.087236404418945, "global_step": 445673, "epoch": 2652} {"train_loss": -12.842756271362305, "global_step": 445674, "epoch": 2652} {"train_loss": -12.232122421264648, "global_step": 445675, "epoch": 2652} {"train_loss": -12.0404634475708, "global_step": 445676, "epoch": 2652} {"train_loss": -12.741762161254883, "global_step": 445677, "epoch": 2652} {"train_loss": -12.817972183227539, "global_step": 445678, "epoch": 2652} {"train_loss": -12.523048400878906, "global_step": 445679, "epoch": 2652} {"train_loss": -12.957036972045898, "global_step": 445680, "epoch": 2652} {"train_loss": -12.254732131958008, "global_step": 445681, "epoch": 2652} {"train_loss": -12.509552001953125, "global_step": 445682, "epoch": 2652} {"train_loss": -12.354803085327148, "global_step": 445683, "epoch": 2652} {"train_loss": -12.362031936645508, "global_step": 445684, "epoch": 2652} {"train_loss": -11.557158470153809, "global_step": 445685, "epoch": 2652} {"train_loss": -12.677396774291992, "global_step": 445686, "epoch": 2652} {"train_loss": -11.735235214233398, "global_step": 445687, "epoch": 2652} {"train_loss": -12.354390144348145, "global_step": 445688, "epoch": 2652} {"train_loss": -12.364274978637695, "global_step": 445689, "epoch": 2652} {"train_loss": -12.091388702392578, "global_step": 445690, "epoch": 2652} {"train_loss": -12.448205947875977, "global_step": 445691, "epoch": 2652} {"train_loss": -12.374364852905273, "global_step": 445692, "epoch": 2652} {"train_loss": -12.163955688476562, "global_step": 445693, "epoch": 2652} {"train_loss": -11.960369110107422, "global_step": 445694, "epoch": 2652} {"train_loss": -12.225255966186523, "global_step": 445695, "epoch": 2652} {"train_loss": -11.787796020507812, "global_step": 445696, "epoch": 2652} {"train_loss": -12.132584571838379, "global_step": 445697, "epoch": 2652} {"train_loss": -11.51918888092041, "global_step": 445698, "epoch": 2652} {"train_loss": -12.263427734375, "global_step": 445699, "epoch": 2652} {"train_loss": -10.578676223754883, "global_step": 445700, "epoch": 2652} {"train_loss": -10.623058319091797, "global_step": 445701, "epoch": 2652} {"train_loss": -12.420276641845703, "global_step": 445702, "epoch": 2652} {"train_loss": -12.117300271987915, "global_step": 445703, "epoch": 2652, "val_loss": 313759.34375} {"train_loss": -10.665942192077637, "global_step": 445704, "epoch": 2653} {"train_loss": -10.85595703125, "global_step": 445705, "epoch": 2653} {"train_loss": -10.478509902954102, "global_step": 445706, "epoch": 2653} {"train_loss": -11.127469062805176, "global_step": 445707, "epoch": 2653} {"train_loss": -10.094280242919922, "global_step": 445708, "epoch": 2653} {"train_loss": -11.255346298217773, "global_step": 445709, "epoch": 2653} {"train_loss": -11.63650131225586, "global_step": 445710, "epoch": 2653} {"train_loss": -11.780797958374023, "global_step": 445711, "epoch": 2653} {"train_loss": -10.822369575500488, "global_step": 445712, "epoch": 2653} {"train_loss": -11.51589298248291, "global_step": 445713, "epoch": 2653} {"train_loss": -11.923571586608887, "global_step": 445714, "epoch": 2653} {"train_loss": -11.941883087158203, "global_step": 445715, "epoch": 2653} {"train_loss": -11.674468040466309, "global_step": 445716, "epoch": 2653} {"train_loss": -12.145379066467285, "global_step": 445717, "epoch": 2653} {"train_loss": -12.06281566619873, "global_step": 445718, "epoch": 2653} {"train_loss": -11.82936954498291, "global_step": 445719, "epoch": 2653} {"train_loss": -12.352657318115234, "global_step": 445720, "epoch": 2653} {"train_loss": -11.856147766113281, "global_step": 445721, "epoch": 2653} {"train_loss": -11.434659004211426, "global_step": 445722, "epoch": 2653} {"train_loss": -11.917597770690918, "global_step": 445723, "epoch": 2653} {"train_loss": -11.628194808959961, "global_step": 445724, "epoch": 2653} {"train_loss": -11.939321517944336, "global_step": 445725, "epoch": 2653} {"train_loss": -11.535118103027344, "global_step": 445726, "epoch": 2653} {"train_loss": -11.850488662719727, "global_step": 445727, "epoch": 2653} {"train_loss": -12.295507431030273, "global_step": 445728, "epoch": 2653} {"train_loss": -11.9712495803833, "global_step": 445729, "epoch": 2653} {"train_loss": -12.187174797058105, "global_step": 445730, "epoch": 2653} {"train_loss": -11.634264945983887, "global_step": 445731, "epoch": 2653} {"train_loss": -12.551837921142578, "global_step": 445732, "epoch": 2653} {"train_loss": -11.579553604125977, "global_step": 445733, "epoch": 2653} {"train_loss": -11.932199478149414, "global_step": 445734, "epoch": 2653} {"train_loss": -11.527626037597656, "global_step": 445735, "epoch": 2653} {"train_loss": -11.936147689819336, "global_step": 445736, "epoch": 2653} {"train_loss": -11.763252258300781, "global_step": 445737, "epoch": 2653} {"train_loss": -12.201873779296875, "global_step": 445738, "epoch": 2653} {"train_loss": -12.055746078491211, "global_step": 445739, "epoch": 2653} {"train_loss": -12.09499740600586, "global_step": 445740, "epoch": 2653} {"train_loss": -12.340587615966797, "global_step": 445741, "epoch": 2653} {"train_loss": -11.993209838867188, "global_step": 445742, "epoch": 2653} {"train_loss": -12.561464309692383, "global_step": 445743, "epoch": 2653} {"train_loss": -11.816059112548828, "global_step": 445744, "epoch": 2653} {"train_loss": -12.440701484680176, "global_step": 445745, "epoch": 2653} {"train_loss": -11.90937614440918, "global_step": 445746, "epoch": 2653} {"train_loss": -12.131645202636719, "global_step": 445747, "epoch": 2653} {"train_loss": -12.27841567993164, "global_step": 445748, "epoch": 2653} {"train_loss": -11.63687801361084, "global_step": 445749, "epoch": 2653} {"train_loss": -12.331136703491211, "global_step": 445750, "epoch": 2653} {"train_loss": -11.943548202514648, "global_step": 445751, "epoch": 2653} {"train_loss": -12.238998413085938, "global_step": 445752, "epoch": 2653} {"train_loss": -12.138891220092773, "global_step": 445753, "epoch": 2653} {"train_loss": -12.37794017791748, "global_step": 445754, "epoch": 2653} {"train_loss": -12.387123107910156, "global_step": 445755, "epoch": 2653} {"train_loss": -12.53384017944336, "global_step": 445756, "epoch": 2653} {"train_loss": -12.40719223022461, "global_step": 445757, "epoch": 2653} {"train_loss": -12.739304542541504, "global_step": 445758, "epoch": 2653} {"train_loss": -12.505495071411133, "global_step": 445759, "epoch": 2653} {"train_loss": -12.719963073730469, "global_step": 445760, "epoch": 2653} {"train_loss": -12.609277725219727, "global_step": 445761, "epoch": 2653} {"train_loss": -12.698945999145508, "global_step": 445762, "epoch": 2653} {"train_loss": -12.362333297729492, "global_step": 445763, "epoch": 2653} {"train_loss": -12.707408905029297, "global_step": 445764, "epoch": 2653} {"train_loss": -12.561704635620117, "global_step": 445765, "epoch": 2653} {"train_loss": -12.65158748626709, "global_step": 445766, "epoch": 2653} {"train_loss": -12.622901916503906, "global_step": 445767, "epoch": 2653} {"train_loss": -12.537771224975586, "global_step": 445768, "epoch": 2653} {"train_loss": -12.690084457397461, "global_step": 445769, "epoch": 2653} {"train_loss": -12.548206329345703, "global_step": 445770, "epoch": 2653} {"train_loss": -12.610601425170898, "global_step": 445771, "epoch": 2653} {"train_loss": -12.505248069763184, "global_step": 445772, "epoch": 2653} {"train_loss": -12.440285682678223, "global_step": 445773, "epoch": 2653} {"train_loss": -12.568436622619629, "global_step": 445774, "epoch": 2653} {"train_loss": -12.730796813964844, "global_step": 445775, "epoch": 2653} {"train_loss": -12.353964805603027, "global_step": 445776, "epoch": 2653} {"train_loss": -12.75732135772705, "global_step": 445777, "epoch": 2653} {"train_loss": -12.655033111572266, "global_step": 445778, "epoch": 2653} {"train_loss": -12.51688003540039, "global_step": 445779, "epoch": 2653} {"train_loss": -12.670339584350586, "global_step": 445780, "epoch": 2653} {"train_loss": -12.847578048706055, "global_step": 445781, "epoch": 2653} {"train_loss": -12.763291358947754, "global_step": 445782, "epoch": 2653} {"train_loss": -12.591967582702637, "global_step": 445783, "epoch": 2653} {"train_loss": -12.980066299438477, "global_step": 445784, "epoch": 2653} {"train_loss": -12.631797790527344, "global_step": 445785, "epoch": 2653} {"train_loss": -12.8928804397583, "global_step": 445786, "epoch": 2653} {"train_loss": -12.539698600769043, "global_step": 445787, "epoch": 2653} {"train_loss": -12.764350891113281, "global_step": 445788, "epoch": 2653} {"train_loss": -12.902800559997559, "global_step": 445789, "epoch": 2653} {"train_loss": -12.828832626342773, "global_step": 445790, "epoch": 2653} {"train_loss": -12.915767669677734, "global_step": 445791, "epoch": 2653} {"train_loss": -12.830410957336426, "global_step": 445792, "epoch": 2653} {"train_loss": -12.75059700012207, "global_step": 445793, "epoch": 2653} {"train_loss": -12.653355598449707, "global_step": 445794, "epoch": 2653} {"train_loss": -12.884591102600098, "global_step": 445795, "epoch": 2653} {"train_loss": -12.758091926574707, "global_step": 445796, "epoch": 2653} {"train_loss": -12.799614906311035, "global_step": 445797, "epoch": 2653} {"train_loss": -12.689081192016602, "global_step": 445798, "epoch": 2653} {"train_loss": -12.976222038269043, "global_step": 445799, "epoch": 2653} {"train_loss": -12.531333923339844, "global_step": 445800, "epoch": 2653} {"train_loss": -12.762734413146973, "global_step": 445801, "epoch": 2653} {"train_loss": -12.54288101196289, "global_step": 445802, "epoch": 2653} {"train_loss": -12.328842163085938, "global_step": 445803, "epoch": 2653} {"train_loss": -12.659025192260742, "global_step": 445804, "epoch": 2653} {"train_loss": -12.9954833984375, "global_step": 445805, "epoch": 2653} {"train_loss": -12.627117156982422, "global_step": 445806, "epoch": 2653} {"train_loss": -12.78352165222168, "global_step": 445807, "epoch": 2653} {"train_loss": -12.838848114013672, "global_step": 445808, "epoch": 2653} {"train_loss": -12.562517166137695, "global_step": 445809, "epoch": 2653} {"train_loss": -12.611831665039062, "global_step": 445810, "epoch": 2653} {"train_loss": -12.987025260925293, "global_step": 445811, "epoch": 2653} {"train_loss": -12.502466201782227, "global_step": 445812, "epoch": 2653} {"train_loss": -12.99659538269043, "global_step": 445813, "epoch": 2653} {"train_loss": -12.500839233398438, "global_step": 445814, "epoch": 2653} {"train_loss": -12.831684112548828, "global_step": 445815, "epoch": 2653} {"train_loss": -12.351840019226074, "global_step": 445816, "epoch": 2653} {"train_loss": -12.910590171813965, "global_step": 445817, "epoch": 2653} {"train_loss": -12.532977104187012, "global_step": 445818, "epoch": 2653} {"train_loss": -12.79190444946289, "global_step": 445819, "epoch": 2653} {"train_loss": -12.740589141845703, "global_step": 445820, "epoch": 2653} {"train_loss": -12.451773643493652, "global_step": 445821, "epoch": 2653} {"train_loss": -12.861900329589844, "global_step": 445822, "epoch": 2653} {"train_loss": -12.902689933776855, "global_step": 445823, "epoch": 2653} {"train_loss": -12.656673431396484, "global_step": 445824, "epoch": 2653} {"train_loss": -12.429067611694336, "global_step": 445825, "epoch": 2653} {"train_loss": -12.094456672668457, "global_step": 445826, "epoch": 2653} {"train_loss": -12.128571510314941, "global_step": 445827, "epoch": 2653} {"train_loss": -11.96334457397461, "global_step": 445828, "epoch": 2653} {"train_loss": -12.09926700592041, "global_step": 445829, "epoch": 2653} {"train_loss": -12.107748031616211, "global_step": 445830, "epoch": 2653} {"train_loss": -12.350950241088867, "global_step": 445831, "epoch": 2653} {"train_loss": -11.012260437011719, "global_step": 445832, "epoch": 2653} {"train_loss": -11.796721458435059, "global_step": 445833, "epoch": 2653} {"train_loss": -11.94483757019043, "global_step": 445834, "epoch": 2653} {"train_loss": -11.131948471069336, "global_step": 445835, "epoch": 2653} {"train_loss": -11.785993576049805, "global_step": 445836, "epoch": 2653} {"train_loss": -11.767496109008789, "global_step": 445837, "epoch": 2653} {"train_loss": -11.981792449951172, "global_step": 445838, "epoch": 2653} {"train_loss": -11.876699447631836, "global_step": 445839, "epoch": 2653} {"train_loss": -11.894096374511719, "global_step": 445840, "epoch": 2653} {"train_loss": -10.909344673156738, "global_step": 445841, "epoch": 2653} {"train_loss": -11.737399101257324, "global_step": 445842, "epoch": 2653} {"train_loss": -11.48068618774414, "global_step": 445843, "epoch": 2653} {"train_loss": -10.232950210571289, "global_step": 445844, "epoch": 2653} {"train_loss": -11.432437896728516, "global_step": 445845, "epoch": 2653} {"train_loss": -9.570026397705078, "global_step": 445846, "epoch": 2653} {"train_loss": -10.727762222290039, "global_step": 445847, "epoch": 2653} {"train_loss": -10.488431930541992, "global_step": 445848, "epoch": 2653} {"train_loss": -11.294837951660156, "global_step": 445849, "epoch": 2653} {"train_loss": -11.379388809204102, "global_step": 445850, "epoch": 2653} {"train_loss": -9.55329418182373, "global_step": 445851, "epoch": 2653} {"train_loss": -11.82335090637207, "global_step": 445852, "epoch": 2653} {"train_loss": -8.646852493286133, "global_step": 445853, "epoch": 2653} {"train_loss": -11.560235977172852, "global_step": 445854, "epoch": 2653} {"train_loss": -10.088184356689453, "global_step": 445855, "epoch": 2653} {"train_loss": -10.586507797241211, "global_step": 445856, "epoch": 2653} {"train_loss": -11.781303405761719, "global_step": 445857, "epoch": 2653} {"train_loss": -11.102554321289062, "global_step": 445858, "epoch": 2653} {"train_loss": -11.123872756958008, "global_step": 445859, "epoch": 2653} {"train_loss": -11.462366104125977, "global_step": 445860, "epoch": 2653} {"train_loss": -11.083566665649414, "global_step": 445861, "epoch": 2653} {"train_loss": -10.336822509765625, "global_step": 445862, "epoch": 2653} {"train_loss": -12.065071105957031, "global_step": 445863, "epoch": 2653} {"train_loss": -10.926445007324219, "global_step": 445864, "epoch": 2653} {"train_loss": -11.961165428161621, "global_step": 445865, "epoch": 2653} {"train_loss": -11.826651573181152, "global_step": 445866, "epoch": 2653} {"train_loss": -10.930866241455078, "global_step": 445867, "epoch": 2653} {"train_loss": -11.627445220947266, "global_step": 445868, "epoch": 2653} {"train_loss": -10.980110168457031, "global_step": 445869, "epoch": 2653} {"train_loss": -11.491462707519531, "global_step": 445870, "epoch": 2653} {"train_loss": -12.03263707388015, "global_step": 445871, "epoch": 2653, "val_loss": 313675.84375} {"train_loss": -11.292367935180664, "global_step": 445872, "epoch": 2654} {"train_loss": -11.50953197479248, "global_step": 445873, "epoch": 2654} {"train_loss": -11.276744842529297, "global_step": 445874, "epoch": 2654} {"train_loss": -11.184860229492188, "global_step": 445875, "epoch": 2654} {"train_loss": -11.552448272705078, "global_step": 445876, "epoch": 2654} {"train_loss": -11.782712936401367, "global_step": 445877, "epoch": 2654} {"train_loss": -10.943094253540039, "global_step": 445878, "epoch": 2654} {"train_loss": -12.106568336486816, "global_step": 445879, "epoch": 2654} {"train_loss": -11.560955047607422, "global_step": 445880, "epoch": 2654} {"train_loss": -11.970453262329102, "global_step": 445881, "epoch": 2654} {"train_loss": -11.70705509185791, "global_step": 445882, "epoch": 2654} {"train_loss": -11.698022842407227, "global_step": 445883, "epoch": 2654} {"train_loss": -11.685541152954102, "global_step": 445884, "epoch": 2654} {"train_loss": -11.177072525024414, "global_step": 445885, "epoch": 2654} {"train_loss": -11.817037582397461, "global_step": 445886, "epoch": 2654} {"train_loss": -11.668603897094727, "global_step": 445887, "epoch": 2654} {"train_loss": -12.130512237548828, "global_step": 445888, "epoch": 2654} {"train_loss": -11.462862014770508, "global_step": 445889, "epoch": 2654} {"train_loss": -12.14062786102295, "global_step": 445890, "epoch": 2654} {"train_loss": -11.769601821899414, "global_step": 445891, "epoch": 2654} {"train_loss": -11.716991424560547, "global_step": 445892, "epoch": 2654} {"train_loss": -12.088171005249023, "global_step": 445893, "epoch": 2654} {"train_loss": -11.754127502441406, "global_step": 445894, "epoch": 2654} {"train_loss": -12.114838600158691, "global_step": 445895, "epoch": 2654} {"train_loss": -12.022214889526367, "global_step": 445896, "epoch": 2654} {"train_loss": -11.956643104553223, "global_step": 445897, "epoch": 2654} {"train_loss": -12.265729904174805, "global_step": 445898, "epoch": 2654} {"train_loss": -12.099651336669922, "global_step": 445899, "epoch": 2654} {"train_loss": -12.191699981689453, "global_step": 445900, "epoch": 2654} {"train_loss": -12.093088150024414, "global_step": 445901, "epoch": 2654} {"train_loss": -12.116652488708496, "global_step": 445902, "epoch": 2654} {"train_loss": -12.370674133300781, "global_step": 445903, "epoch": 2654} {"train_loss": -12.244449615478516, "global_step": 445904, "epoch": 2654} {"train_loss": -12.446917533874512, "global_step": 445905, "epoch": 2654} {"train_loss": -12.386543273925781, "global_step": 445906, "epoch": 2654} {"train_loss": -12.44250202178955, "global_step": 445907, "epoch": 2654} {"train_loss": -12.123571395874023, "global_step": 445908, "epoch": 2654} {"train_loss": -12.292570114135742, "global_step": 445909, "epoch": 2654} {"train_loss": -12.397262573242188, "global_step": 445910, "epoch": 2654} {"train_loss": -12.641412734985352, "global_step": 445911, "epoch": 2654} {"train_loss": -12.425148010253906, "global_step": 445912, "epoch": 2654} {"train_loss": -12.63286018371582, "global_step": 445913, "epoch": 2654} {"train_loss": -12.41932487487793, "global_step": 445914, "epoch": 2654} {"train_loss": -12.404450416564941, "global_step": 445915, "epoch": 2654} {"train_loss": -12.334488868713379, "global_step": 445916, "epoch": 2654} {"train_loss": -12.608640670776367, "global_step": 445917, "epoch": 2654} {"train_loss": -12.312386512756348, "global_step": 445918, "epoch": 2654} {"train_loss": -12.58156967163086, "global_step": 445919, "epoch": 2654} {"train_loss": -12.507039070129395, "global_step": 445920, "epoch": 2654} {"train_loss": -12.486958503723145, "global_step": 445921, "epoch": 2654} {"train_loss": -12.37868595123291, "global_step": 445922, "epoch": 2654} {"train_loss": -12.701976776123047, "global_step": 445923, "epoch": 2654} {"train_loss": -12.615697860717773, "global_step": 445924, "epoch": 2654} {"train_loss": -12.810569763183594, "global_step": 445925, "epoch": 2654} {"train_loss": -12.436864852905273, "global_step": 445926, "epoch": 2654} {"train_loss": -12.454044342041016, "global_step": 445927, "epoch": 2654} {"train_loss": -12.658124923706055, "global_step": 445928, "epoch": 2654} {"train_loss": -12.492670059204102, "global_step": 445929, "epoch": 2654} {"train_loss": -12.581768035888672, "global_step": 445930, "epoch": 2654} {"train_loss": -12.216569900512695, "global_step": 445931, "epoch": 2654} {"train_loss": -12.500591278076172, "global_step": 445932, "epoch": 2654} {"train_loss": -12.547109603881836, "global_step": 445933, "epoch": 2654} {"train_loss": -12.22708797454834, "global_step": 445934, "epoch": 2654} {"train_loss": -12.552003860473633, "global_step": 445935, "epoch": 2654} {"train_loss": -12.577255249023438, "global_step": 445936, "epoch": 2654} {"train_loss": -12.651931762695312, "global_step": 445937, "epoch": 2654} {"train_loss": -12.768353462219238, "global_step": 445938, "epoch": 2654} {"train_loss": -12.660954475402832, "global_step": 445939, "epoch": 2654} {"train_loss": -12.527376174926758, "global_step": 445940, "epoch": 2654} {"train_loss": -12.694541931152344, "global_step": 445941, "epoch": 2654} {"train_loss": -12.510196685791016, "global_step": 445942, "epoch": 2654} {"train_loss": -12.720233917236328, "global_step": 445943, "epoch": 2654} {"train_loss": -12.768915176391602, "global_step": 445944, "epoch": 2654} {"train_loss": -12.63294506072998, "global_step": 445945, "epoch": 2654} {"train_loss": -12.668774604797363, "global_step": 445946, "epoch": 2654} {"train_loss": -12.333191871643066, "global_step": 445947, "epoch": 2654} {"train_loss": -12.7059907913208, "global_step": 445948, "epoch": 2654} {"train_loss": -12.359895706176758, "global_step": 445949, "epoch": 2654} {"train_loss": -12.6602783203125, "global_step": 445950, "epoch": 2654} {"train_loss": -12.48663330078125, "global_step": 445951, "epoch": 2654} {"train_loss": -12.480607986450195, "global_step": 445952, "epoch": 2654} {"train_loss": -12.528691291809082, "global_step": 445953, "epoch": 2654} {"train_loss": -12.519794464111328, "global_step": 445954, "epoch": 2654} {"train_loss": -12.57746410369873, "global_step": 445955, "epoch": 2654} {"train_loss": -12.75634765625, "global_step": 445956, "epoch": 2654} {"train_loss": -12.671100616455078, "global_step": 445957, "epoch": 2654} {"train_loss": -12.822802543640137, "global_step": 445958, "epoch": 2654} {"train_loss": -12.763416290283203, "global_step": 445959, "epoch": 2654} {"train_loss": -12.867914199829102, "global_step": 445960, "epoch": 2654} {"train_loss": -12.892643928527832, "global_step": 445961, "epoch": 2654} {"train_loss": -12.843851089477539, "global_step": 445962, "epoch": 2654} {"train_loss": -12.945856094360352, "global_step": 445963, "epoch": 2654} {"train_loss": -12.58044147491455, "global_step": 445964, "epoch": 2654} {"train_loss": -12.787078857421875, "global_step": 445965, "epoch": 2654} {"train_loss": -12.663881301879883, "global_step": 445966, "epoch": 2654} {"train_loss": -13.085936546325684, "global_step": 445967, "epoch": 2654} {"train_loss": -12.656070709228516, "global_step": 445968, "epoch": 2654} {"train_loss": -12.756752014160156, "global_step": 445969, "epoch": 2654} {"train_loss": -12.763456344604492, "global_step": 445970, "epoch": 2654} {"train_loss": -12.583703994750977, "global_step": 445971, "epoch": 2654} {"train_loss": -12.71960735321045, "global_step": 445972, "epoch": 2654} {"train_loss": -12.855924606323242, "global_step": 445973, "epoch": 2654} {"train_loss": -12.728059768676758, "global_step": 445974, "epoch": 2654} {"train_loss": -12.556412696838379, "global_step": 445975, "epoch": 2654} {"train_loss": -12.705723762512207, "global_step": 445976, "epoch": 2654} {"train_loss": -12.901481628417969, "global_step": 445977, "epoch": 2654} {"train_loss": -12.752191543579102, "global_step": 445978, "epoch": 2654} {"train_loss": -12.778951644897461, "global_step": 445979, "epoch": 2654} {"train_loss": -12.820656776428223, "global_step": 445980, "epoch": 2654} {"train_loss": -12.987091064453125, "global_step": 445981, "epoch": 2654} {"train_loss": -12.771150588989258, "global_step": 445982, "epoch": 2654} {"train_loss": -12.678731918334961, "global_step": 445983, "epoch": 2654} {"train_loss": -12.495140075683594, "global_step": 445984, "epoch": 2654} {"train_loss": -12.455789566040039, "global_step": 445985, "epoch": 2654} {"train_loss": -12.658126831054688, "global_step": 445986, "epoch": 2654} {"train_loss": -12.783267974853516, "global_step": 445987, "epoch": 2654} {"train_loss": -12.253532409667969, "global_step": 445988, "epoch": 2654} {"train_loss": -12.679540634155273, "global_step": 445989, "epoch": 2654} {"train_loss": -12.630868911743164, "global_step": 445990, "epoch": 2654} {"train_loss": -12.276307106018066, "global_step": 445991, "epoch": 2654} {"train_loss": -12.745397567749023, "global_step": 445992, "epoch": 2654} {"train_loss": -12.545950889587402, "global_step": 445993, "epoch": 2654} {"train_loss": -12.168771743774414, "global_step": 445994, "epoch": 2654} {"train_loss": -12.486088752746582, "global_step": 445995, "epoch": 2654} {"train_loss": -12.712061882019043, "global_step": 445996, "epoch": 2654} {"train_loss": -12.372871398925781, "global_step": 445997, "epoch": 2654} {"train_loss": -11.462154388427734, "global_step": 445998, "epoch": 2654} {"train_loss": -11.90201187133789, "global_step": 445999, "epoch": 2654} {"train_loss": -11.182267189025879, "global_step": 446000, "epoch": 2654} {"train_loss": -8.951522827148438, "global_step": 446001, "epoch": 2654} {"train_loss": -10.878890991210938, "global_step": 446002, "epoch": 2654} {"train_loss": -9.116972923278809, "global_step": 446003, "epoch": 2654} {"train_loss": -10.610048294067383, "global_step": 446004, "epoch": 2654} {"train_loss": -10.253470420837402, "global_step": 446005, "epoch": 2654} {"train_loss": -10.048052787780762, "global_step": 446006, "epoch": 2654} {"train_loss": -10.079374313354492, "global_step": 446007, "epoch": 2654} {"train_loss": -11.02905559539795, "global_step": 446008, "epoch": 2654} {"train_loss": -11.26541519165039, "global_step": 446009, "epoch": 2654} {"train_loss": -11.068659782409668, "global_step": 446010, "epoch": 2654} {"train_loss": -11.45566177368164, "global_step": 446011, "epoch": 2654} {"train_loss": -10.430039405822754, "global_step": 446012, "epoch": 2654} {"train_loss": -11.04478931427002, "global_step": 446013, "epoch": 2654} {"train_loss": -11.344507217407227, "global_step": 446014, "epoch": 2654} {"train_loss": -11.549821853637695, "global_step": 446015, "epoch": 2654} {"train_loss": -11.87707233428955, "global_step": 446016, "epoch": 2654} {"train_loss": -11.755629539489746, "global_step": 446017, "epoch": 2654} {"train_loss": -12.231800079345703, "global_step": 446018, "epoch": 2654} {"train_loss": -11.748682975769043, "global_step": 446019, "epoch": 2654} {"train_loss": -11.684328079223633, "global_step": 446020, "epoch": 2654} {"train_loss": -11.945032119750977, "global_step": 446021, "epoch": 2654} {"train_loss": -11.703390121459961, "global_step": 446022, "epoch": 2654} {"train_loss": -12.011518478393555, "global_step": 446023, "epoch": 2654} {"train_loss": -12.182504653930664, "global_step": 446024, "epoch": 2654} {"train_loss": -11.710506439208984, "global_step": 446025, "epoch": 2654} {"train_loss": -11.882753372192383, "global_step": 446026, "epoch": 2654} {"train_loss": -12.401823043823242, "global_step": 446027, "epoch": 2654} {"train_loss": -12.23255443572998, "global_step": 446028, "epoch": 2654} {"train_loss": -11.933780670166016, "global_step": 446029, "epoch": 2654} {"train_loss": -12.49116325378418, "global_step": 446030, "epoch": 2654} {"train_loss": -12.03659439086914, "global_step": 446031, "epoch": 2654} {"train_loss": -12.278400421142578, "global_step": 446032, "epoch": 2654} {"train_loss": -12.126476287841797, "global_step": 446033, "epoch": 2654} {"train_loss": -12.266611099243164, "global_step": 446034, "epoch": 2654} {"train_loss": -12.290874481201172, "global_step": 446035, "epoch": 2654} {"train_loss": -11.908060073852539, "global_step": 446036, "epoch": 2654} {"train_loss": -12.103790283203125, "global_step": 446037, "epoch": 2654} {"train_loss": -11.922539710998535, "global_step": 446038, "epoch": 2654} {"train_loss": -12.165611687160673, "global_step": 446039, "epoch": 2654, "val_loss": 307371.4375} {"train_loss": -12.176801681518555, "global_step": 446040, "epoch": 2655} {"train_loss": -12.21986198425293, "global_step": 446041, "epoch": 2655} {"train_loss": -12.360434532165527, "global_step": 446042, "epoch": 2655} {"train_loss": -12.13300895690918, "global_step": 446043, "epoch": 2655} {"train_loss": -12.158777236938477, "global_step": 446044, "epoch": 2655} {"train_loss": -12.266462326049805, "global_step": 446045, "epoch": 2655} {"train_loss": -12.363981246948242, "global_step": 446046, "epoch": 2655} {"train_loss": -12.201042175292969, "global_step": 446047, "epoch": 2655} {"train_loss": -12.588042259216309, "global_step": 446048, "epoch": 2655} {"train_loss": -12.042169570922852, "global_step": 446049, "epoch": 2655} {"train_loss": -12.664840698242188, "global_step": 446050, "epoch": 2655} {"train_loss": -12.203371047973633, "global_step": 446051, "epoch": 2655} {"train_loss": -11.946406364440918, "global_step": 446052, "epoch": 2655} {"train_loss": -12.455209732055664, "global_step": 446053, "epoch": 2655} {"train_loss": -12.224651336669922, "global_step": 446054, "epoch": 2655} {"train_loss": -12.716534614562988, "global_step": 446055, "epoch": 2655} {"train_loss": -12.304573059082031, "global_step": 446056, "epoch": 2655} {"train_loss": -12.589493751525879, "global_step": 446057, "epoch": 2655} {"train_loss": -12.479137420654297, "global_step": 446058, "epoch": 2655} {"train_loss": -12.402618408203125, "global_step": 446059, "epoch": 2655} {"train_loss": -12.687271118164062, "global_step": 446060, "epoch": 2655} {"train_loss": -12.115250587463379, "global_step": 446061, "epoch": 2655} {"train_loss": -12.695634841918945, "global_step": 446062, "epoch": 2655} {"train_loss": -12.45622444152832, "global_step": 446063, "epoch": 2655} {"train_loss": -12.547833442687988, "global_step": 446064, "epoch": 2655} {"train_loss": -12.82579231262207, "global_step": 446065, "epoch": 2655} {"train_loss": -12.457123756408691, "global_step": 446066, "epoch": 2655} {"train_loss": -12.7069730758667, "global_step": 446067, "epoch": 2655} {"train_loss": -12.851072311401367, "global_step": 446068, "epoch": 2655} {"train_loss": -12.616996765136719, "global_step": 446069, "epoch": 2655} {"train_loss": -12.545875549316406, "global_step": 446070, "epoch": 2655} {"train_loss": -12.600698471069336, "global_step": 446071, "epoch": 2655} {"train_loss": -12.789406776428223, "global_step": 446072, "epoch": 2655} {"train_loss": -12.327552795410156, "global_step": 446073, "epoch": 2655} {"train_loss": -12.794981002807617, "global_step": 446074, "epoch": 2655} {"train_loss": -12.796615600585938, "global_step": 446075, "epoch": 2655} {"train_loss": -12.715306282043457, "global_step": 446076, "epoch": 2655} {"train_loss": -12.528839111328125, "global_step": 446077, "epoch": 2655} {"train_loss": -12.822105407714844, "global_step": 446078, "epoch": 2655} {"train_loss": -12.614388465881348, "global_step": 446079, "epoch": 2655} {"train_loss": -12.479883193969727, "global_step": 446080, "epoch": 2655} {"train_loss": -12.445633888244629, "global_step": 446081, "epoch": 2655} {"train_loss": -12.704421997070312, "global_step": 446082, "epoch": 2655} {"train_loss": -12.547025680541992, "global_step": 446083, "epoch": 2655} {"train_loss": -12.52559757232666, "global_step": 446084, "epoch": 2655} {"train_loss": -12.67213249206543, "global_step": 446085, "epoch": 2655} {"train_loss": -12.549066543579102, "global_step": 446086, "epoch": 2655} {"train_loss": -12.656244277954102, "global_step": 446087, "epoch": 2655} {"train_loss": -12.867511749267578, "global_step": 446088, "epoch": 2655} {"train_loss": -12.200562477111816, "global_step": 446089, "epoch": 2655} {"train_loss": -12.165246963500977, "global_step": 446090, "epoch": 2655} {"train_loss": -12.474328994750977, "global_step": 446091, "epoch": 2655} {"train_loss": -12.705486297607422, "global_step": 446092, "epoch": 2655} {"train_loss": -11.785186767578125, "global_step": 446093, "epoch": 2655} {"train_loss": -12.181822776794434, "global_step": 446094, "epoch": 2655} {"train_loss": -12.656158447265625, "global_step": 446095, "epoch": 2655} {"train_loss": -11.954596519470215, "global_step": 446096, "epoch": 2655} {"train_loss": -12.37013053894043, "global_step": 446097, "epoch": 2655} {"train_loss": -12.012378692626953, "global_step": 446098, "epoch": 2655} {"train_loss": -12.22131633758545, "global_step": 446099, "epoch": 2655} {"train_loss": -12.26003646850586, "global_step": 446100, "epoch": 2655} {"train_loss": -12.890151023864746, "global_step": 446101, "epoch": 2655} {"train_loss": -11.981334686279297, "global_step": 446102, "epoch": 2655} {"train_loss": -12.115575790405273, "global_step": 446103, "epoch": 2655} {"train_loss": -12.450315475463867, "global_step": 446104, "epoch": 2655} {"train_loss": -12.10404109954834, "global_step": 446105, "epoch": 2655} {"train_loss": -12.951642036437988, "global_step": 446106, "epoch": 2655} {"train_loss": -12.590636253356934, "global_step": 446107, "epoch": 2655} {"train_loss": -12.374189376831055, "global_step": 446108, "epoch": 2655} {"train_loss": -12.565972328186035, "global_step": 446109, "epoch": 2655} {"train_loss": -12.42943000793457, "global_step": 446110, "epoch": 2655} {"train_loss": -11.97348690032959, "global_step": 446111, "epoch": 2655} {"train_loss": -12.759429931640625, "global_step": 446112, "epoch": 2655} {"train_loss": -12.286901473999023, "global_step": 446113, "epoch": 2655} {"train_loss": -11.912580490112305, "global_step": 446114, "epoch": 2655} {"train_loss": -12.480937957763672, "global_step": 446115, "epoch": 2655} {"train_loss": -12.296368598937988, "global_step": 446116, "epoch": 2655} {"train_loss": -11.961776733398438, "global_step": 446117, "epoch": 2655} {"train_loss": -12.272462844848633, "global_step": 446118, "epoch": 2655} {"train_loss": -12.557293891906738, "global_step": 446119, "epoch": 2655} {"train_loss": -12.639793395996094, "global_step": 446120, "epoch": 2655} {"train_loss": -12.592039108276367, "global_step": 446121, "epoch": 2655} {"train_loss": -12.198646545410156, "global_step": 446122, "epoch": 2655} {"train_loss": -12.72686767578125, "global_step": 446123, "epoch": 2655} {"train_loss": -12.45798397064209, "global_step": 446124, "epoch": 2655} {"train_loss": -12.31123161315918, "global_step": 446125, "epoch": 2655} {"train_loss": -12.580102920532227, "global_step": 446126, "epoch": 2655} {"train_loss": -12.432748794555664, "global_step": 446127, "epoch": 2655} {"train_loss": -12.62155532836914, "global_step": 446128, "epoch": 2655} {"train_loss": -12.663403511047363, "global_step": 446129, "epoch": 2655} {"train_loss": -11.965801239013672, "global_step": 446130, "epoch": 2655} {"train_loss": -12.531881332397461, "global_step": 446131, "epoch": 2655} {"train_loss": -12.500862121582031, "global_step": 446132, "epoch": 2655} {"train_loss": -12.154911041259766, "global_step": 446133, "epoch": 2655} {"train_loss": -12.470117568969727, "global_step": 446134, "epoch": 2655} {"train_loss": -12.341798782348633, "global_step": 446135, "epoch": 2655} {"train_loss": -12.317662239074707, "global_step": 446136, "epoch": 2655} {"train_loss": -12.581947326660156, "global_step": 446137, "epoch": 2655} {"train_loss": -12.430672645568848, "global_step": 446138, "epoch": 2655} {"train_loss": -12.208721160888672, "global_step": 446139, "epoch": 2655} {"train_loss": -12.499841690063477, "global_step": 446140, "epoch": 2655} {"train_loss": -12.199213027954102, "global_step": 446141, "epoch": 2655} {"train_loss": -11.954115867614746, "global_step": 446142, "epoch": 2655} {"train_loss": -12.70590591430664, "global_step": 446143, "epoch": 2655} {"train_loss": -11.891911506652832, "global_step": 446144, "epoch": 2655} {"train_loss": -11.651369094848633, "global_step": 446145, "epoch": 2655} {"train_loss": -12.629226684570312, "global_step": 446146, "epoch": 2655} {"train_loss": -11.563451766967773, "global_step": 446147, "epoch": 2655} {"train_loss": -12.397266387939453, "global_step": 446148, "epoch": 2655} {"train_loss": -12.60047721862793, "global_step": 446149, "epoch": 2655} {"train_loss": -12.53497314453125, "global_step": 446150, "epoch": 2655} {"train_loss": -12.567355155944824, "global_step": 446151, "epoch": 2655} {"train_loss": -12.718547821044922, "global_step": 446152, "epoch": 2655} {"train_loss": -12.484999656677246, "global_step": 446153, "epoch": 2655} {"train_loss": -12.863693237304688, "global_step": 446154, "epoch": 2655} {"train_loss": -12.569829940795898, "global_step": 446155, "epoch": 2655} {"train_loss": -12.806358337402344, "global_step": 446156, "epoch": 2655} {"train_loss": -12.145769119262695, "global_step": 446157, "epoch": 2655} {"train_loss": -12.513467788696289, "global_step": 446158, "epoch": 2655} {"train_loss": -12.40670108795166, "global_step": 446159, "epoch": 2655} {"train_loss": -12.570648193359375, "global_step": 446160, "epoch": 2655} {"train_loss": -12.165961265563965, "global_step": 446161, "epoch": 2655} {"train_loss": -12.557065963745117, "global_step": 446162, "epoch": 2655} {"train_loss": -12.333356857299805, "global_step": 446163, "epoch": 2655} {"train_loss": -12.250238418579102, "global_step": 446164, "epoch": 2655} {"train_loss": -12.032623291015625, "global_step": 446165, "epoch": 2655} {"train_loss": -11.912002563476562, "global_step": 446166, "epoch": 2655} {"train_loss": -12.395256996154785, "global_step": 446167, "epoch": 2655} {"train_loss": -11.970966339111328, "global_step": 446168, "epoch": 2655} {"train_loss": -12.692377090454102, "global_step": 446169, "epoch": 2655} {"train_loss": -11.605351448059082, "global_step": 446170, "epoch": 2655} {"train_loss": -12.009364128112793, "global_step": 446171, "epoch": 2655} {"train_loss": -11.740823745727539, "global_step": 446172, "epoch": 2655} {"train_loss": -12.341412544250488, "global_step": 446173, "epoch": 2655} {"train_loss": -11.982396125793457, "global_step": 446174, "epoch": 2655} {"train_loss": -12.64246940612793, "global_step": 446175, "epoch": 2655} {"train_loss": -12.333539962768555, "global_step": 446176, "epoch": 2655} {"train_loss": -12.420928955078125, "global_step": 446177, "epoch": 2655} {"train_loss": -12.094219207763672, "global_step": 446178, "epoch": 2655} {"train_loss": -12.456364631652832, "global_step": 446179, "epoch": 2655} {"train_loss": -12.191377639770508, "global_step": 446180, "epoch": 2655} {"train_loss": -11.529151916503906, "global_step": 446181, "epoch": 2655} {"train_loss": -12.028970718383789, "global_step": 446182, "epoch": 2655} {"train_loss": -12.507051467895508, "global_step": 446183, "epoch": 2655} {"train_loss": -11.594280242919922, "global_step": 446184, "epoch": 2655} {"train_loss": -11.801102638244629, "global_step": 446185, "epoch": 2655} {"train_loss": -12.171396255493164, "global_step": 446186, "epoch": 2655} {"train_loss": -9.88931941986084, "global_step": 446187, "epoch": 2655} {"train_loss": -12.263214111328125, "global_step": 446188, "epoch": 2655} {"train_loss": -11.620318412780762, "global_step": 446189, "epoch": 2655} {"train_loss": -11.27989387512207, "global_step": 446190, "epoch": 2655} {"train_loss": -12.071834564208984, "global_step": 446191, "epoch": 2655} {"train_loss": -11.42662239074707, "global_step": 446192, "epoch": 2655} {"train_loss": -11.242673873901367, "global_step": 446193, "epoch": 2655} {"train_loss": -11.50523567199707, "global_step": 446194, "epoch": 2655} {"train_loss": -11.500078201293945, "global_step": 446195, "epoch": 2655} {"train_loss": -11.582008361816406, "global_step": 446196, "epoch": 2655} {"train_loss": -11.483392715454102, "global_step": 446197, "epoch": 2655} {"train_loss": -9.510515213012695, "global_step": 446198, "epoch": 2655} {"train_loss": -10.96956729888916, "global_step": 446199, "epoch": 2655} {"train_loss": -10.273921966552734, "global_step": 446200, "epoch": 2655} {"train_loss": -10.326935768127441, "global_step": 446201, "epoch": 2655} {"train_loss": -8.982000350952148, "global_step": 446202, "epoch": 2655} {"train_loss": -8.354740142822266, "global_step": 446203, "epoch": 2655} {"train_loss": -10.053250312805176, "global_step": 446204, "epoch": 2655} {"train_loss": -10.590646743774414, "global_step": 446205, "epoch": 2655} {"train_loss": -11.50654411315918, "global_step": 446206, "epoch": 2655} {"train_loss": -12.179851066498529, "global_step": 446207, "epoch": 2655, "val_loss": 305970.96875, "train_action_mse_error": 0.3206615447998047} {"train_loss": -11.256386756896973, "global_step": 446208, "epoch": 2656} {"train_loss": -11.082379341125488, "global_step": 446209, "epoch": 2656} {"train_loss": -10.972550392150879, "global_step": 446210, "epoch": 2656} {"train_loss": -11.465417861938477, "global_step": 446211, "epoch": 2656} {"train_loss": -11.193628311157227, "global_step": 446212, "epoch": 2656} {"train_loss": -11.365013122558594, "global_step": 446213, "epoch": 2656} {"train_loss": -10.786569595336914, "global_step": 446214, "epoch": 2656} {"train_loss": -10.75997257232666, "global_step": 446215, "epoch": 2656} {"train_loss": -10.297623634338379, "global_step": 446216, "epoch": 2656} {"train_loss": -10.668941497802734, "global_step": 446217, "epoch": 2656} {"train_loss": -10.722440719604492, "global_step": 446218, "epoch": 2656} {"train_loss": -9.818509101867676, "global_step": 446219, "epoch": 2656} {"train_loss": -11.60400390625, "global_step": 446220, "epoch": 2656} {"train_loss": -11.266192436218262, "global_step": 446221, "epoch": 2656} {"train_loss": -11.915610313415527, "global_step": 446222, "epoch": 2656} {"train_loss": -10.894161224365234, "global_step": 446223, "epoch": 2656} {"train_loss": -11.6487455368042, "global_step": 446224, "epoch": 2656} {"train_loss": -11.21008014678955, "global_step": 446225, "epoch": 2656} {"train_loss": -12.287460327148438, "global_step": 446226, "epoch": 2656} {"train_loss": -11.366910934448242, "global_step": 446227, "epoch": 2656} {"train_loss": -12.024823188781738, "global_step": 446228, "epoch": 2656} {"train_loss": -11.580951690673828, "global_step": 446229, "epoch": 2656} {"train_loss": -12.172557830810547, "global_step": 446230, "epoch": 2656} {"train_loss": -11.237384796142578, "global_step": 446231, "epoch": 2656} {"train_loss": -12.166149139404297, "global_step": 446232, "epoch": 2656} {"train_loss": -11.785270690917969, "global_step": 446233, "epoch": 2656} {"train_loss": -12.272672653198242, "global_step": 446234, "epoch": 2656} {"train_loss": -11.86390209197998, "global_step": 446235, "epoch": 2656} {"train_loss": -12.045522689819336, "global_step": 446236, "epoch": 2656} {"train_loss": -12.029287338256836, "global_step": 446237, "epoch": 2656} {"train_loss": -11.922012329101562, "global_step": 446238, "epoch": 2656} {"train_loss": -12.000324249267578, "global_step": 446239, "epoch": 2656} {"train_loss": -12.334595680236816, "global_step": 446240, "epoch": 2656} {"train_loss": -12.210440635681152, "global_step": 446241, "epoch": 2656} {"train_loss": -12.14976692199707, "global_step": 446242, "epoch": 2656} {"train_loss": -12.07347583770752, "global_step": 446243, "epoch": 2656} {"train_loss": -12.134915351867676, "global_step": 446244, "epoch": 2656} {"train_loss": -12.455398559570312, "global_step": 446245, "epoch": 2656} {"train_loss": -12.154680252075195, "global_step": 446246, "epoch": 2656} {"train_loss": -12.093035697937012, "global_step": 446247, "epoch": 2656} {"train_loss": -12.220113754272461, "global_step": 446248, "epoch": 2656} {"train_loss": -12.306655883789062, "global_step": 446249, "epoch": 2656} {"train_loss": -12.4847412109375, "global_step": 446250, "epoch": 2656} {"train_loss": -12.185988426208496, "global_step": 446251, "epoch": 2656} {"train_loss": -12.189254760742188, "global_step": 446252, "epoch": 2656} {"train_loss": -12.239381790161133, "global_step": 446253, "epoch": 2656} {"train_loss": -12.383596420288086, "global_step": 446254, "epoch": 2656} {"train_loss": -12.255945205688477, "global_step": 446255, "epoch": 2656} {"train_loss": -12.494434356689453, "global_step": 446256, "epoch": 2656} {"train_loss": -12.50529670715332, "global_step": 446257, "epoch": 2656} {"train_loss": -12.560669898986816, "global_step": 446258, "epoch": 2656} {"train_loss": -12.341476440429688, "global_step": 446259, "epoch": 2656} {"train_loss": -12.366222381591797, "global_step": 446260, "epoch": 2656} {"train_loss": -12.547165870666504, "global_step": 446261, "epoch": 2656} {"train_loss": -12.326196670532227, "global_step": 446262, "epoch": 2656} {"train_loss": -12.245855331420898, "global_step": 446263, "epoch": 2656} {"train_loss": -12.488753318786621, "global_step": 446264, "epoch": 2656} {"train_loss": -12.504704475402832, "global_step": 446265, "epoch": 2656} {"train_loss": -12.555505752563477, "global_step": 446266, "epoch": 2656} {"train_loss": -12.569917678833008, "global_step": 446267, "epoch": 2656} {"train_loss": -12.406620979309082, "global_step": 446268, "epoch": 2656} {"train_loss": -12.461639404296875, "global_step": 446269, "epoch": 2656} {"train_loss": -12.385173797607422, "global_step": 446270, "epoch": 2656} {"train_loss": -12.398979187011719, "global_step": 446271, "epoch": 2656} {"train_loss": -12.314474105834961, "global_step": 446272, "epoch": 2656} {"train_loss": -12.571924209594727, "global_step": 446273, "epoch": 2656} {"train_loss": -12.263672828674316, "global_step": 446274, "epoch": 2656} {"train_loss": -12.570999145507812, "global_step": 446275, "epoch": 2656} {"train_loss": -12.246204376220703, "global_step": 446276, "epoch": 2656} {"train_loss": -12.350260734558105, "global_step": 446277, "epoch": 2656} {"train_loss": -12.510892868041992, "global_step": 446278, "epoch": 2656} {"train_loss": -12.471431732177734, "global_step": 446279, "epoch": 2656} {"train_loss": -12.40108871459961, "global_step": 446280, "epoch": 2656} {"train_loss": -12.520174980163574, "global_step": 446281, "epoch": 2656} {"train_loss": -12.537217140197754, "global_step": 446282, "epoch": 2656} {"train_loss": -12.666851043701172, "global_step": 446283, "epoch": 2656} {"train_loss": -12.65418815612793, "global_step": 446284, "epoch": 2656} {"train_loss": -12.324092864990234, "global_step": 446285, "epoch": 2656} {"train_loss": -12.566938400268555, "global_step": 446286, "epoch": 2656} {"train_loss": -12.480293273925781, "global_step": 446287, "epoch": 2656} {"train_loss": -12.486300468444824, "global_step": 446288, "epoch": 2656} {"train_loss": -12.436727523803711, "global_step": 446289, "epoch": 2656} {"train_loss": -12.730020523071289, "global_step": 446290, "epoch": 2656} {"train_loss": -12.25672435760498, "global_step": 446291, "epoch": 2656} {"train_loss": -12.740099906921387, "global_step": 446292, "epoch": 2656} {"train_loss": -12.298501014709473, "global_step": 446293, "epoch": 2656} {"train_loss": -12.850996017456055, "global_step": 446294, "epoch": 2656} {"train_loss": -12.516851425170898, "global_step": 446295, "epoch": 2656} {"train_loss": -12.784049987792969, "global_step": 446296, "epoch": 2656} {"train_loss": -12.372920989990234, "global_step": 446297, "epoch": 2656} {"train_loss": -12.439544677734375, "global_step": 446298, "epoch": 2656} {"train_loss": -12.787928581237793, "global_step": 446299, "epoch": 2656} {"train_loss": -12.838058471679688, "global_step": 446300, "epoch": 2656} {"train_loss": -12.667943954467773, "global_step": 446301, "epoch": 2656} {"train_loss": -12.726163864135742, "global_step": 446302, "epoch": 2656} {"train_loss": -12.486791610717773, "global_step": 446303, "epoch": 2656} {"train_loss": -12.641145706176758, "global_step": 446304, "epoch": 2656} {"train_loss": -12.591398239135742, "global_step": 446305, "epoch": 2656} {"train_loss": -12.684623718261719, "global_step": 446306, "epoch": 2656} {"train_loss": -12.696908950805664, "global_step": 446307, "epoch": 2656} {"train_loss": -12.353291511535645, "global_step": 446308, "epoch": 2656} {"train_loss": -12.74056339263916, "global_step": 446309, "epoch": 2656} {"train_loss": -12.70524787902832, "global_step": 446310, "epoch": 2656} {"train_loss": -12.439102172851562, "global_step": 446311, "epoch": 2656} {"train_loss": -12.524116516113281, "global_step": 446312, "epoch": 2656} {"train_loss": -12.45857048034668, "global_step": 446313, "epoch": 2656} {"train_loss": -12.202438354492188, "global_step": 446314, "epoch": 2656} {"train_loss": -12.700794219970703, "global_step": 446315, "epoch": 2656} {"train_loss": -12.263664245605469, "global_step": 446316, "epoch": 2656} {"train_loss": -12.500415802001953, "global_step": 446317, "epoch": 2656} {"train_loss": -12.692712783813477, "global_step": 446318, "epoch": 2656} {"train_loss": -12.488555908203125, "global_step": 446319, "epoch": 2656} {"train_loss": -12.69676399230957, "global_step": 446320, "epoch": 2656} {"train_loss": -12.710809707641602, "global_step": 446321, "epoch": 2656} {"train_loss": -12.526592254638672, "global_step": 446322, "epoch": 2656} {"train_loss": -12.7551851272583, "global_step": 446323, "epoch": 2656} {"train_loss": -12.885810852050781, "global_step": 446324, "epoch": 2656} {"train_loss": -12.794411659240723, "global_step": 446325, "epoch": 2656} {"train_loss": -12.859288215637207, "global_step": 446326, "epoch": 2656} {"train_loss": -12.966065406799316, "global_step": 446327, "epoch": 2656} {"train_loss": -12.75280475616455, "global_step": 446328, "epoch": 2656} {"train_loss": -12.942757606506348, "global_step": 446329, "epoch": 2656} {"train_loss": -12.755975723266602, "global_step": 446330, "epoch": 2656} {"train_loss": -12.969095230102539, "global_step": 446331, "epoch": 2656} {"train_loss": -12.840557098388672, "global_step": 446332, "epoch": 2656} {"train_loss": -12.499940872192383, "global_step": 446333, "epoch": 2656} {"train_loss": -12.766865730285645, "global_step": 446334, "epoch": 2656} {"train_loss": -12.331518173217773, "global_step": 446335, "epoch": 2656} {"train_loss": -12.826008796691895, "global_step": 446336, "epoch": 2656} {"train_loss": -13.034103393554688, "global_step": 446337, "epoch": 2656} {"train_loss": -12.362746238708496, "global_step": 446338, "epoch": 2656} {"train_loss": -12.21723747253418, "global_step": 446339, "epoch": 2656} {"train_loss": -12.817838668823242, "global_step": 446340, "epoch": 2656} {"train_loss": -12.993648529052734, "global_step": 446341, "epoch": 2656} {"train_loss": -12.785160064697266, "global_step": 446342, "epoch": 2656} {"train_loss": -12.493871688842773, "global_step": 446343, "epoch": 2656} {"train_loss": -12.651388168334961, "global_step": 446344, "epoch": 2656} {"train_loss": -12.353984832763672, "global_step": 446345, "epoch": 2656} {"train_loss": -12.458806991577148, "global_step": 446346, "epoch": 2656} {"train_loss": -12.746675491333008, "global_step": 446347, "epoch": 2656} {"train_loss": -12.495085716247559, "global_step": 446348, "epoch": 2656} {"train_loss": -13.154995918273926, "global_step": 446349, "epoch": 2656} {"train_loss": -12.852209091186523, "global_step": 446350, "epoch": 2656} {"train_loss": -12.823687553405762, "global_step": 446351, "epoch": 2656} {"train_loss": -12.596662521362305, "global_step": 446352, "epoch": 2656} {"train_loss": -12.88089370727539, "global_step": 446353, "epoch": 2656} {"train_loss": -12.866413116455078, "global_step": 446354, "epoch": 2656} {"train_loss": -12.889894485473633, "global_step": 446355, "epoch": 2656} {"train_loss": -12.758161544799805, "global_step": 446356, "epoch": 2656} {"train_loss": -12.644457817077637, "global_step": 446357, "epoch": 2656} {"train_loss": -12.586569786071777, "global_step": 446358, "epoch": 2656} {"train_loss": -12.304142951965332, "global_step": 446359, "epoch": 2656} {"train_loss": -12.541412353515625, "global_step": 446360, "epoch": 2656} {"train_loss": -12.523992538452148, "global_step": 446361, "epoch": 2656} {"train_loss": -12.601954460144043, "global_step": 446362, "epoch": 2656} {"train_loss": -12.48745346069336, "global_step": 446363, "epoch": 2656} {"train_loss": -12.555695533752441, "global_step": 446364, "epoch": 2656} {"train_loss": -12.963763236999512, "global_step": 446365, "epoch": 2656} {"train_loss": -12.52393913269043, "global_step": 446366, "epoch": 2656} {"train_loss": -12.495314598083496, "global_step": 446367, "epoch": 2656} {"train_loss": -12.809599876403809, "global_step": 446368, "epoch": 2656} {"train_loss": -12.579195022583008, "global_step": 446369, "epoch": 2656} {"train_loss": -12.142748832702637, "global_step": 446370, "epoch": 2656} {"train_loss": -12.028938293457031, "global_step": 446371, "epoch": 2656} {"train_loss": -12.814412117004395, "global_step": 446372, "epoch": 2656} {"train_loss": -11.723421096801758, "global_step": 446373, "epoch": 2656} {"train_loss": -11.436400413513184, "global_step": 446374, "epoch": 2656} {"train_loss": -12.312233686447144, "global_step": 446375, "epoch": 2656, "val_loss": 309383.75} {"train_loss": -12.177927017211914, "global_step": 446376, "epoch": 2657} {"train_loss": -12.170114517211914, "global_step": 446377, "epoch": 2657} {"train_loss": -12.298676490783691, "global_step": 446378, "epoch": 2657} {"train_loss": -12.707317352294922, "global_step": 446379, "epoch": 2657} {"train_loss": -12.552793502807617, "global_step": 446380, "epoch": 2657} {"train_loss": -12.723108291625977, "global_step": 446381, "epoch": 2657} {"train_loss": -12.322639465332031, "global_step": 446382, "epoch": 2657} {"train_loss": -12.658111572265625, "global_step": 446383, "epoch": 2657} {"train_loss": -12.297820091247559, "global_step": 446384, "epoch": 2657} {"train_loss": -12.474510192871094, "global_step": 446385, "epoch": 2657} {"train_loss": -12.586017608642578, "global_step": 446386, "epoch": 2657} {"train_loss": -12.146688461303711, "global_step": 446387, "epoch": 2657} {"train_loss": -12.07547664642334, "global_step": 446388, "epoch": 2657} {"train_loss": -12.545400619506836, "global_step": 446389, "epoch": 2657} {"train_loss": -11.98875617980957, "global_step": 446390, "epoch": 2657} {"train_loss": -12.567243576049805, "global_step": 446391, "epoch": 2657} {"train_loss": -11.844242095947266, "global_step": 446392, "epoch": 2657} {"train_loss": -11.745376586914062, "global_step": 446393, "epoch": 2657} {"train_loss": -11.851839065551758, "global_step": 446394, "epoch": 2657} {"train_loss": -12.179936408996582, "global_step": 446395, "epoch": 2657} {"train_loss": -8.908363342285156, "global_step": 446396, "epoch": 2657} {"train_loss": -12.33999252319336, "global_step": 446397, "epoch": 2657} {"train_loss": -11.292049407958984, "global_step": 446398, "epoch": 2657} {"train_loss": -9.530908584594727, "global_step": 446399, "epoch": 2657} {"train_loss": -9.273200035095215, "global_step": 446400, "epoch": 2657} {"train_loss": -11.314422607421875, "global_step": 446401, "epoch": 2657} {"train_loss": -9.218902587890625, "global_step": 446402, "epoch": 2657} {"train_loss": -10.807975769042969, "global_step": 446403, "epoch": 2657} {"train_loss": -10.082376480102539, "global_step": 446404, "epoch": 2657} {"train_loss": -9.666932106018066, "global_step": 446405, "epoch": 2657} {"train_loss": -10.014932632446289, "global_step": 446406, "epoch": 2657} {"train_loss": -11.096500396728516, "global_step": 446407, "epoch": 2657} {"train_loss": -11.121269226074219, "global_step": 446408, "epoch": 2657} {"train_loss": -11.803086280822754, "global_step": 446409, "epoch": 2657} {"train_loss": -10.734779357910156, "global_step": 446410, "epoch": 2657} {"train_loss": -10.629091262817383, "global_step": 446411, "epoch": 2657} {"train_loss": -11.748744010925293, "global_step": 446412, "epoch": 2657} {"train_loss": -10.713081359863281, "global_step": 446413, "epoch": 2657} {"train_loss": -12.025382995605469, "global_step": 446414, "epoch": 2657} {"train_loss": -11.608397483825684, "global_step": 446415, "epoch": 2657} {"train_loss": -12.209687232971191, "global_step": 446416, "epoch": 2657} {"train_loss": -11.97212028503418, "global_step": 446417, "epoch": 2657} {"train_loss": -12.113523483276367, "global_step": 446418, "epoch": 2657} {"train_loss": -12.085089683532715, "global_step": 446419, "epoch": 2657} {"train_loss": -12.330820083618164, "global_step": 446420, "epoch": 2657} {"train_loss": -11.947694778442383, "global_step": 446421, "epoch": 2657} {"train_loss": -11.887153625488281, "global_step": 446422, "epoch": 2657} {"train_loss": -12.111136436462402, "global_step": 446423, "epoch": 2657} {"train_loss": -12.201671600341797, "global_step": 446424, "epoch": 2657} {"train_loss": -12.491016387939453, "global_step": 446425, "epoch": 2657} {"train_loss": -11.963582992553711, "global_step": 446426, "epoch": 2657} {"train_loss": -12.202657699584961, "global_step": 446427, "epoch": 2657} {"train_loss": -12.445415496826172, "global_step": 446428, "epoch": 2657} {"train_loss": -12.254337310791016, "global_step": 446429, "epoch": 2657} {"train_loss": -12.13736629486084, "global_step": 446430, "epoch": 2657} {"train_loss": -12.25181770324707, "global_step": 446431, "epoch": 2657} {"train_loss": -11.874266624450684, "global_step": 446432, "epoch": 2657} {"train_loss": -12.285116195678711, "global_step": 446433, "epoch": 2657} {"train_loss": -12.466429710388184, "global_step": 446434, "epoch": 2657} {"train_loss": -12.148187637329102, "global_step": 446435, "epoch": 2657} {"train_loss": -12.245600700378418, "global_step": 446436, "epoch": 2657} {"train_loss": -12.426815032958984, "global_step": 446437, "epoch": 2657} {"train_loss": -12.117589950561523, "global_step": 446438, "epoch": 2657} {"train_loss": -12.278724670410156, "global_step": 446439, "epoch": 2657} {"train_loss": -12.31089973449707, "global_step": 446440, "epoch": 2657} {"train_loss": -12.094961166381836, "global_step": 446441, "epoch": 2657} {"train_loss": -12.613374710083008, "global_step": 446442, "epoch": 2657} {"train_loss": -12.207257270812988, "global_step": 446443, "epoch": 2657} {"train_loss": -12.354351043701172, "global_step": 446444, "epoch": 2657} {"train_loss": -12.50377082824707, "global_step": 446445, "epoch": 2657} {"train_loss": -12.399861335754395, "global_step": 446446, "epoch": 2657} {"train_loss": -12.394607543945312, "global_step": 446447, "epoch": 2657} {"train_loss": -12.393718719482422, "global_step": 446448, "epoch": 2657} {"train_loss": -11.870704650878906, "global_step": 446449, "epoch": 2657} {"train_loss": -12.74215316772461, "global_step": 446450, "epoch": 2657} {"train_loss": -12.160184860229492, "global_step": 446451, "epoch": 2657} {"train_loss": -12.68603229522705, "global_step": 446452, "epoch": 2657} {"train_loss": -12.071495056152344, "global_step": 446453, "epoch": 2657} {"train_loss": -11.984212875366211, "global_step": 446454, "epoch": 2657} {"train_loss": -12.297262191772461, "global_step": 446455, "epoch": 2657} {"train_loss": -11.400802612304688, "global_step": 446456, "epoch": 2657} {"train_loss": -12.229410171508789, "global_step": 446457, "epoch": 2657} {"train_loss": -11.62879753112793, "global_step": 446458, "epoch": 2657} {"train_loss": -10.857807159423828, "global_step": 446459, "epoch": 2657} {"train_loss": -12.53272819519043, "global_step": 446460, "epoch": 2657} {"train_loss": -10.939054489135742, "global_step": 446461, "epoch": 2657} {"train_loss": -12.488243103027344, "global_step": 446462, "epoch": 2657} {"train_loss": -11.963706970214844, "global_step": 446463, "epoch": 2657} {"train_loss": -11.59931755065918, "global_step": 446464, "epoch": 2657} {"train_loss": -11.80600643157959, "global_step": 446465, "epoch": 2657} {"train_loss": -12.205901145935059, "global_step": 446466, "epoch": 2657} {"train_loss": -11.431242942810059, "global_step": 446467, "epoch": 2657} {"train_loss": -12.257335662841797, "global_step": 446468, "epoch": 2657} {"train_loss": -11.319725036621094, "global_step": 446469, "epoch": 2657} {"train_loss": -10.715424537658691, "global_step": 446470, "epoch": 2657} {"train_loss": -12.603355407714844, "global_step": 446471, "epoch": 2657} {"train_loss": -11.28742504119873, "global_step": 446472, "epoch": 2657} {"train_loss": -12.092103958129883, "global_step": 446473, "epoch": 2657} {"train_loss": -11.814569473266602, "global_step": 446474, "epoch": 2657} {"train_loss": -12.167439460754395, "global_step": 446475, "epoch": 2657} {"train_loss": -12.508988380432129, "global_step": 446476, "epoch": 2657} {"train_loss": -11.733941078186035, "global_step": 446477, "epoch": 2657} {"train_loss": -12.27768611907959, "global_step": 446478, "epoch": 2657} {"train_loss": -11.95694351196289, "global_step": 446479, "epoch": 2657} {"train_loss": -12.460558891296387, "global_step": 446480, "epoch": 2657} {"train_loss": -12.217906951904297, "global_step": 446481, "epoch": 2657} {"train_loss": -12.461525917053223, "global_step": 446482, "epoch": 2657} {"train_loss": -12.53055477142334, "global_step": 446483, "epoch": 2657} {"train_loss": -12.495336532592773, "global_step": 446484, "epoch": 2657} {"train_loss": -12.54221248626709, "global_step": 446485, "epoch": 2657} {"train_loss": -12.579290390014648, "global_step": 446486, "epoch": 2657} {"train_loss": -12.476309776306152, "global_step": 446487, "epoch": 2657} {"train_loss": -12.619120597839355, "global_step": 446488, "epoch": 2657} {"train_loss": -12.55758285522461, "global_step": 446489, "epoch": 2657} {"train_loss": -12.683358192443848, "global_step": 446490, "epoch": 2657} {"train_loss": -12.693717002868652, "global_step": 446491, "epoch": 2657} {"train_loss": -12.714076042175293, "global_step": 446492, "epoch": 2657} {"train_loss": -12.675567626953125, "global_step": 446493, "epoch": 2657} {"train_loss": -12.62607479095459, "global_step": 446494, "epoch": 2657} {"train_loss": -12.690194129943848, "global_step": 446495, "epoch": 2657} {"train_loss": -12.585336685180664, "global_step": 446496, "epoch": 2657} {"train_loss": -12.837505340576172, "global_step": 446497, "epoch": 2657} {"train_loss": -12.633272171020508, "global_step": 446498, "epoch": 2657} {"train_loss": -12.667633056640625, "global_step": 446499, "epoch": 2657} {"train_loss": -12.737335205078125, "global_step": 446500, "epoch": 2657} {"train_loss": -12.72684097290039, "global_step": 446501, "epoch": 2657} {"train_loss": -12.575040817260742, "global_step": 446502, "epoch": 2657} {"train_loss": -12.54360580444336, "global_step": 446503, "epoch": 2657} {"train_loss": -12.619242668151855, "global_step": 446504, "epoch": 2657} {"train_loss": -12.723093032836914, "global_step": 446505, "epoch": 2657} {"train_loss": -12.774303436279297, "global_step": 446506, "epoch": 2657} {"train_loss": -12.697643280029297, "global_step": 446507, "epoch": 2657} {"train_loss": -12.51816177368164, "global_step": 446508, "epoch": 2657} {"train_loss": -12.775277137756348, "global_step": 446509, "epoch": 2657} {"train_loss": -12.63234806060791, "global_step": 446510, "epoch": 2657} {"train_loss": -12.733177185058594, "global_step": 446511, "epoch": 2657} {"train_loss": -12.876913070678711, "global_step": 446512, "epoch": 2657} {"train_loss": -12.5589599609375, "global_step": 446513, "epoch": 2657} {"train_loss": -12.514324188232422, "global_step": 446514, "epoch": 2657} {"train_loss": -12.627368927001953, "global_step": 446515, "epoch": 2657} {"train_loss": -12.424549102783203, "global_step": 446516, "epoch": 2657} {"train_loss": -12.63111686706543, "global_step": 446517, "epoch": 2657} {"train_loss": -12.453668594360352, "global_step": 446518, "epoch": 2657} {"train_loss": -12.620298385620117, "global_step": 446519, "epoch": 2657} {"train_loss": -12.754596710205078, "global_step": 446520, "epoch": 2657} {"train_loss": -12.256959915161133, "global_step": 446521, "epoch": 2657} {"train_loss": -12.632400512695312, "global_step": 446522, "epoch": 2657} {"train_loss": -12.486124038696289, "global_step": 446523, "epoch": 2657} {"train_loss": -12.460685729980469, "global_step": 446524, "epoch": 2657} {"train_loss": -12.424577713012695, "global_step": 446525, "epoch": 2657} {"train_loss": -12.768341064453125, "global_step": 446526, "epoch": 2657} {"train_loss": -12.511926651000977, "global_step": 446527, "epoch": 2657} {"train_loss": -12.849837303161621, "global_step": 446528, "epoch": 2657} {"train_loss": -12.46159839630127, "global_step": 446529, "epoch": 2657} {"train_loss": -12.862401008605957, "global_step": 446530, "epoch": 2657} {"train_loss": -12.536301612854004, "global_step": 446531, "epoch": 2657} {"train_loss": -12.826057434082031, "global_step": 446532, "epoch": 2657} {"train_loss": -12.23819351196289, "global_step": 446533, "epoch": 2657} {"train_loss": -12.430533409118652, "global_step": 446534, "epoch": 2657} {"train_loss": -12.697342872619629, "global_step": 446535, "epoch": 2657} {"train_loss": -12.322916984558105, "global_step": 446536, "epoch": 2657} {"train_loss": -12.525202751159668, "global_step": 446537, "epoch": 2657} {"train_loss": -12.028358459472656, "global_step": 446538, "epoch": 2657} {"train_loss": -12.424442291259766, "global_step": 446539, "epoch": 2657} {"train_loss": -12.092570304870605, "global_step": 446540, "epoch": 2657} {"train_loss": -12.3880033493042, "global_step": 446541, "epoch": 2657} {"train_loss": -11.964376449584961, "global_step": 446542, "epoch": 2657} {"train_loss": -12.126808399245853, "global_step": 446543, "epoch": 2657, "val_loss": 313750.75} {"train_loss": -11.479177474975586, "global_step": 446544, "epoch": 2658} {"train_loss": -11.81948471069336, "global_step": 446545, "epoch": 2658} {"train_loss": -11.876646995544434, "global_step": 446546, "epoch": 2658} {"train_loss": -11.167651176452637, "global_step": 446547, "epoch": 2658} {"train_loss": -11.168703079223633, "global_step": 446548, "epoch": 2658} {"train_loss": -12.340846061706543, "global_step": 446549, "epoch": 2658} {"train_loss": -10.874710083007812, "global_step": 446550, "epoch": 2658} {"train_loss": -12.395954132080078, "global_step": 446551, "epoch": 2658} {"train_loss": -10.476444244384766, "global_step": 446552, "epoch": 2658} {"train_loss": -10.119765281677246, "global_step": 446553, "epoch": 2658} {"train_loss": -10.407173156738281, "global_step": 446554, "epoch": 2658} {"train_loss": -11.06531810760498, "global_step": 446555, "epoch": 2658} {"train_loss": -10.69575309753418, "global_step": 446556, "epoch": 2658} {"train_loss": -10.363086700439453, "global_step": 446557, "epoch": 2658} {"train_loss": -11.571874618530273, "global_step": 446558, "epoch": 2658} {"train_loss": -10.52033519744873, "global_step": 446559, "epoch": 2658} {"train_loss": -11.5323486328125, "global_step": 446560, "epoch": 2658} {"train_loss": -10.470708847045898, "global_step": 446561, "epoch": 2658} {"train_loss": -10.117940902709961, "global_step": 446562, "epoch": 2658} {"train_loss": -10.532295227050781, "global_step": 446563, "epoch": 2658} {"train_loss": -10.373880386352539, "global_step": 446564, "epoch": 2658} {"train_loss": -10.35709285736084, "global_step": 446565, "epoch": 2658} {"train_loss": -10.733078002929688, "global_step": 446566, "epoch": 2658} {"train_loss": -11.588123321533203, "global_step": 446567, "epoch": 2658} {"train_loss": -11.670125007629395, "global_step": 446568, "epoch": 2658} {"train_loss": -11.584433555603027, "global_step": 446569, "epoch": 2658} {"train_loss": -12.215648651123047, "global_step": 446570, "epoch": 2658} {"train_loss": -11.955079078674316, "global_step": 446571, "epoch": 2658} {"train_loss": -11.57858657836914, "global_step": 446572, "epoch": 2658} {"train_loss": -11.83800983428955, "global_step": 446573, "epoch": 2658} {"train_loss": -11.516379356384277, "global_step": 446574, "epoch": 2658} {"train_loss": -12.105419158935547, "global_step": 446575, "epoch": 2658} {"train_loss": -11.816608428955078, "global_step": 446576, "epoch": 2658} {"train_loss": -12.024944305419922, "global_step": 446577, "epoch": 2658} {"train_loss": -11.368043899536133, "global_step": 446578, "epoch": 2658} {"train_loss": -11.239388465881348, "global_step": 446579, "epoch": 2658} {"train_loss": -11.692047119140625, "global_step": 446580, "epoch": 2658} {"train_loss": -10.803242683410645, "global_step": 446581, "epoch": 2658} {"train_loss": -11.43405532836914, "global_step": 446582, "epoch": 2658} {"train_loss": -11.316307067871094, "global_step": 446583, "epoch": 2658} {"train_loss": -11.334125518798828, "global_step": 446584, "epoch": 2658} {"train_loss": -10.520888328552246, "global_step": 446585, "epoch": 2658} {"train_loss": -11.716557502746582, "global_step": 446586, "epoch": 2658} {"train_loss": -10.73141098022461, "global_step": 446587, "epoch": 2658} {"train_loss": -11.876791000366211, "global_step": 446588, "epoch": 2658} {"train_loss": -10.524765014648438, "global_step": 446589, "epoch": 2658} {"train_loss": -12.052620887756348, "global_step": 446590, "epoch": 2658} {"train_loss": -11.20603084564209, "global_step": 446591, "epoch": 2658} {"train_loss": -11.794532775878906, "global_step": 446592, "epoch": 2658} {"train_loss": -11.995296478271484, "global_step": 446593, "epoch": 2658} {"train_loss": -11.395837783813477, "global_step": 446594, "epoch": 2658} {"train_loss": -11.973163604736328, "global_step": 446595, "epoch": 2658} {"train_loss": -11.486943244934082, "global_step": 446596, "epoch": 2658} {"train_loss": -12.114609718322754, "global_step": 446597, "epoch": 2658} {"train_loss": -11.707475662231445, "global_step": 446598, "epoch": 2658} {"train_loss": -12.176619529724121, "global_step": 446599, "epoch": 2658} {"train_loss": -11.834579467773438, "global_step": 446600, "epoch": 2658} {"train_loss": -12.058673858642578, "global_step": 446601, "epoch": 2658} {"train_loss": -12.243416786193848, "global_step": 446602, "epoch": 2658} {"train_loss": -12.497236251831055, "global_step": 446603, "epoch": 2658} {"train_loss": -12.085943222045898, "global_step": 446604, "epoch": 2658} {"train_loss": -12.38751220703125, "global_step": 446605, "epoch": 2658} {"train_loss": -11.892897605895996, "global_step": 446606, "epoch": 2658} {"train_loss": -12.42254638671875, "global_step": 446607, "epoch": 2658} {"train_loss": -12.34938907623291, "global_step": 446608, "epoch": 2658} {"train_loss": -12.245340347290039, "global_step": 446609, "epoch": 2658} {"train_loss": -12.396381378173828, "global_step": 446610, "epoch": 2658} {"train_loss": -12.376609802246094, "global_step": 446611, "epoch": 2658} {"train_loss": -12.346152305603027, "global_step": 446612, "epoch": 2658} {"train_loss": -12.542498588562012, "global_step": 446613, "epoch": 2658} {"train_loss": -12.250638961791992, "global_step": 446614, "epoch": 2658} {"train_loss": -12.649506568908691, "global_step": 446615, "epoch": 2658} {"train_loss": -12.336359024047852, "global_step": 446616, "epoch": 2658} {"train_loss": -12.523069381713867, "global_step": 446617, "epoch": 2658} {"train_loss": -12.423458099365234, "global_step": 446618, "epoch": 2658} {"train_loss": -12.536145210266113, "global_step": 446619, "epoch": 2658} {"train_loss": -12.610128402709961, "global_step": 446620, "epoch": 2658} {"train_loss": -12.55044937133789, "global_step": 446621, "epoch": 2658} {"train_loss": -12.565319061279297, "global_step": 446622, "epoch": 2658} {"train_loss": -12.629072189331055, "global_step": 446623, "epoch": 2658} {"train_loss": -12.707216262817383, "global_step": 446624, "epoch": 2658} {"train_loss": -12.482664108276367, "global_step": 446625, "epoch": 2658} {"train_loss": -12.482757568359375, "global_step": 446626, "epoch": 2658} {"train_loss": -12.67866325378418, "global_step": 446627, "epoch": 2658} {"train_loss": -12.782299041748047, "global_step": 446628, "epoch": 2658} {"train_loss": -12.686380386352539, "global_step": 446629, "epoch": 2658} {"train_loss": -12.617682456970215, "global_step": 446630, "epoch": 2658} {"train_loss": -12.737021446228027, "global_step": 446631, "epoch": 2658} {"train_loss": -12.613319396972656, "global_step": 446632, "epoch": 2658} {"train_loss": -12.516727447509766, "global_step": 446633, "epoch": 2658} {"train_loss": -12.652212142944336, "global_step": 446634, "epoch": 2658} {"train_loss": -12.797368049621582, "global_step": 446635, "epoch": 2658} {"train_loss": -12.691965103149414, "global_step": 446636, "epoch": 2658} {"train_loss": -12.896995544433594, "global_step": 446637, "epoch": 2658} {"train_loss": -12.456350326538086, "global_step": 446638, "epoch": 2658} {"train_loss": -12.95132827758789, "global_step": 446639, "epoch": 2658} {"train_loss": -12.751897811889648, "global_step": 446640, "epoch": 2658} {"train_loss": -12.490930557250977, "global_step": 446641, "epoch": 2658} {"train_loss": -12.791402816772461, "global_step": 446642, "epoch": 2658} {"train_loss": -12.559253692626953, "global_step": 446643, "epoch": 2658} {"train_loss": -12.877236366271973, "global_step": 446644, "epoch": 2658} {"train_loss": -12.711936950683594, "global_step": 446645, "epoch": 2658} {"train_loss": -12.73664379119873, "global_step": 446646, "epoch": 2658} {"train_loss": -12.695115089416504, "global_step": 446647, "epoch": 2658} {"train_loss": -12.767864227294922, "global_step": 446648, "epoch": 2658} {"train_loss": -12.665014266967773, "global_step": 446649, "epoch": 2658} {"train_loss": -12.939236640930176, "global_step": 446650, "epoch": 2658} {"train_loss": -12.879193305969238, "global_step": 446651, "epoch": 2658} {"train_loss": -12.560478210449219, "global_step": 446652, "epoch": 2658} {"train_loss": -12.984550476074219, "global_step": 446653, "epoch": 2658} {"train_loss": -12.661256790161133, "global_step": 446654, "epoch": 2658} {"train_loss": -12.961902618408203, "global_step": 446655, "epoch": 2658} {"train_loss": -12.692686080932617, "global_step": 446656, "epoch": 2658} {"train_loss": -12.844850540161133, "global_step": 446657, "epoch": 2658} {"train_loss": -12.488412857055664, "global_step": 446658, "epoch": 2658} {"train_loss": -12.415289878845215, "global_step": 446659, "epoch": 2658} {"train_loss": -12.717849731445312, "global_step": 446660, "epoch": 2658} {"train_loss": -12.505218505859375, "global_step": 446661, "epoch": 2658} {"train_loss": -12.61377239227295, "global_step": 446662, "epoch": 2658} {"train_loss": -12.458184242248535, "global_step": 446663, "epoch": 2658} {"train_loss": -12.830183029174805, "global_step": 446664, "epoch": 2658} {"train_loss": -12.06330394744873, "global_step": 446665, "epoch": 2658} {"train_loss": -12.153570175170898, "global_step": 446666, "epoch": 2658} {"train_loss": -12.206474304199219, "global_step": 446667, "epoch": 2658} {"train_loss": -12.411521911621094, "global_step": 446668, "epoch": 2658} {"train_loss": -12.550482749938965, "global_step": 446669, "epoch": 2658} {"train_loss": -12.699283599853516, "global_step": 446670, "epoch": 2658} {"train_loss": -12.540708541870117, "global_step": 446671, "epoch": 2658} {"train_loss": -12.755897521972656, "global_step": 446672, "epoch": 2658} {"train_loss": -12.48044490814209, "global_step": 446673, "epoch": 2658} {"train_loss": -12.915870666503906, "global_step": 446674, "epoch": 2658} {"train_loss": -12.470682144165039, "global_step": 446675, "epoch": 2658} {"train_loss": -12.553709983825684, "global_step": 446676, "epoch": 2658} {"train_loss": -12.34556770324707, "global_step": 446677, "epoch": 2658} {"train_loss": -12.870176315307617, "global_step": 446678, "epoch": 2658} {"train_loss": -12.627625465393066, "global_step": 446679, "epoch": 2658} {"train_loss": -12.10528564453125, "global_step": 446680, "epoch": 2658} {"train_loss": -12.447413444519043, "global_step": 446681, "epoch": 2658} {"train_loss": -12.52374267578125, "global_step": 446682, "epoch": 2658} {"train_loss": -12.438043594360352, "global_step": 446683, "epoch": 2658} {"train_loss": -12.262237548828125, "global_step": 446684, "epoch": 2658} {"train_loss": -12.556979179382324, "global_step": 446685, "epoch": 2658} {"train_loss": -11.32686710357666, "global_step": 446686, "epoch": 2658} {"train_loss": -11.420476913452148, "global_step": 446687, "epoch": 2658} {"train_loss": -12.72127628326416, "global_step": 446688, "epoch": 2658} {"train_loss": -11.811527252197266, "global_step": 446689, "epoch": 2658} {"train_loss": -11.80279541015625, "global_step": 446690, "epoch": 2658} {"train_loss": -12.413308143615723, "global_step": 446691, "epoch": 2658} {"train_loss": -12.835271835327148, "global_step": 446692, "epoch": 2658} {"train_loss": -11.843192100524902, "global_step": 446693, "epoch": 2658} {"train_loss": -12.441892623901367, "global_step": 446694, "epoch": 2658} {"train_loss": -12.68548583984375, "global_step": 446695, "epoch": 2658} {"train_loss": -12.57090950012207, "global_step": 446696, "epoch": 2658} {"train_loss": -12.64596176147461, "global_step": 446697, "epoch": 2658} {"train_loss": -12.896438598632812, "global_step": 446698, "epoch": 2658} {"train_loss": -12.406534194946289, "global_step": 446699, "epoch": 2658} {"train_loss": -12.487831115722656, "global_step": 446700, "epoch": 2658} {"train_loss": -12.652801513671875, "global_step": 446701, "epoch": 2658} {"train_loss": -12.248802185058594, "global_step": 446702, "epoch": 2658} {"train_loss": -12.023083686828613, "global_step": 446703, "epoch": 2658} {"train_loss": -12.730785369873047, "global_step": 446704, "epoch": 2658} {"train_loss": -12.23962116241455, "global_step": 446705, "epoch": 2658} {"train_loss": -11.85921859741211, "global_step": 446706, "epoch": 2658} {"train_loss": -11.882855415344238, "global_step": 446707, "epoch": 2658} {"train_loss": -12.355657577514648, "global_step": 446708, "epoch": 2658} {"train_loss": -11.262811660766602, "global_step": 446709, "epoch": 2658} {"train_loss": -12.357576370239258, "global_step": 446710, "epoch": 2658} {"train_loss": -12.087932098479499, "global_step": 446711, "epoch": 2658, "val_loss": 311686.8125} {"train_loss": -11.590248107910156, "global_step": 446712, "epoch": 2659} {"train_loss": -8.481647491455078, "global_step": 446713, "epoch": 2659} {"train_loss": -7.8862528800964355, "global_step": 446714, "epoch": 2659} {"train_loss": -7.799899101257324, "global_step": 446715, "epoch": 2659} {"train_loss": -7.829329013824463, "global_step": 446716, "epoch": 2659} {"train_loss": -8.050727844238281, "global_step": 446717, "epoch": 2659} {"train_loss": -7.884652137756348, "global_step": 446718, "epoch": 2659} {"train_loss": -8.529594421386719, "global_step": 446719, "epoch": 2659} {"train_loss": -8.761375427246094, "global_step": 446720, "epoch": 2659} {"train_loss": -8.53898811340332, "global_step": 446721, "epoch": 2659} {"train_loss": -8.794869422912598, "global_step": 446722, "epoch": 2659} {"train_loss": -9.44727897644043, "global_step": 446723, "epoch": 2659} {"train_loss": -9.232759475708008, "global_step": 446724, "epoch": 2659} {"train_loss": -8.60352611541748, "global_step": 446725, "epoch": 2659} {"train_loss": -9.452381134033203, "global_step": 446726, "epoch": 2659} {"train_loss": -9.306418418884277, "global_step": 446727, "epoch": 2659} {"train_loss": -9.942636489868164, "global_step": 446728, "epoch": 2659} {"train_loss": -11.028621673583984, "global_step": 446729, "epoch": 2659} {"train_loss": -10.647890090942383, "global_step": 446730, "epoch": 2659} {"train_loss": -10.836212158203125, "global_step": 446731, "epoch": 2659} {"train_loss": -10.940686225891113, "global_step": 446732, "epoch": 2659} {"train_loss": -10.83536148071289, "global_step": 446733, "epoch": 2659} {"train_loss": -11.059494972229004, "global_step": 446734, "epoch": 2659} {"train_loss": -11.052507400512695, "global_step": 446735, "epoch": 2659} {"train_loss": -11.040239334106445, "global_step": 446736, "epoch": 2659} {"train_loss": -10.866853713989258, "global_step": 446737, "epoch": 2659} {"train_loss": -11.425862312316895, "global_step": 446738, "epoch": 2659} {"train_loss": -11.679817199707031, "global_step": 446739, "epoch": 2659} {"train_loss": -11.253928184509277, "global_step": 446740, "epoch": 2659} {"train_loss": -11.58575439453125, "global_step": 446741, "epoch": 2659} {"train_loss": -11.663920402526855, "global_step": 446742, "epoch": 2659} {"train_loss": -11.89556884765625, "global_step": 446743, "epoch": 2659} {"train_loss": -12.301593780517578, "global_step": 446744, "epoch": 2659} {"train_loss": -11.594865798950195, "global_step": 446745, "epoch": 2659} {"train_loss": -11.701797485351562, "global_step": 446746, "epoch": 2659} {"train_loss": -11.68416976928711, "global_step": 446747, "epoch": 2659} {"train_loss": -11.572440147399902, "global_step": 446748, "epoch": 2659} {"train_loss": -11.679377555847168, "global_step": 446749, "epoch": 2659} {"train_loss": -11.417598724365234, "global_step": 446750, "epoch": 2659} {"train_loss": -10.985984802246094, "global_step": 446751, "epoch": 2659} {"train_loss": -11.257823944091797, "global_step": 446752, "epoch": 2659} {"train_loss": -10.913408279418945, "global_step": 446753, "epoch": 2659} {"train_loss": -11.537960052490234, "global_step": 446754, "epoch": 2659} {"train_loss": -11.493013381958008, "global_step": 446755, "epoch": 2659} {"train_loss": -12.020381927490234, "global_step": 446756, "epoch": 2659} {"train_loss": -12.069385528564453, "global_step": 446757, "epoch": 2659} {"train_loss": -11.584970474243164, "global_step": 446758, "epoch": 2659} {"train_loss": -12.022298812866211, "global_step": 446759, "epoch": 2659} {"train_loss": -11.74456787109375, "global_step": 446760, "epoch": 2659} {"train_loss": -12.150127410888672, "global_step": 446761, "epoch": 2659} {"train_loss": -11.727079391479492, "global_step": 446762, "epoch": 2659} {"train_loss": -11.995488166809082, "global_step": 446763, "epoch": 2659} {"train_loss": -11.611343383789062, "global_step": 446764, "epoch": 2659} {"train_loss": -11.458220481872559, "global_step": 446765, "epoch": 2659} {"train_loss": -11.733513832092285, "global_step": 446766, "epoch": 2659} {"train_loss": -11.592218399047852, "global_step": 446767, "epoch": 2659} {"train_loss": -11.60495376586914, "global_step": 446768, "epoch": 2659} {"train_loss": -11.412975311279297, "global_step": 446769, "epoch": 2659} {"train_loss": -11.539908409118652, "global_step": 446770, "epoch": 2659} {"train_loss": -11.936908721923828, "global_step": 446771, "epoch": 2659} {"train_loss": -12.275504112243652, "global_step": 446772, "epoch": 2659} {"train_loss": -12.061200141906738, "global_step": 446773, "epoch": 2659} {"train_loss": -11.971384048461914, "global_step": 446774, "epoch": 2659} {"train_loss": -12.294112205505371, "global_step": 446775, "epoch": 2659} {"train_loss": -12.435721397399902, "global_step": 446776, "epoch": 2659} {"train_loss": -12.316452026367188, "global_step": 446777, "epoch": 2659} {"train_loss": -11.973215103149414, "global_step": 446778, "epoch": 2659} {"train_loss": -12.421419143676758, "global_step": 446779, "epoch": 2659} {"train_loss": -12.446722030639648, "global_step": 446780, "epoch": 2659} {"train_loss": -12.3924560546875, "global_step": 446781, "epoch": 2659} {"train_loss": -12.279993057250977, "global_step": 446782, "epoch": 2659} {"train_loss": -12.43974781036377, "global_step": 446783, "epoch": 2659} {"train_loss": -12.335325241088867, "global_step": 446784, "epoch": 2659} {"train_loss": -12.34377670288086, "global_step": 446785, "epoch": 2659} {"train_loss": -12.631010055541992, "global_step": 446786, "epoch": 2659} {"train_loss": -12.485130310058594, "global_step": 446787, "epoch": 2659} {"train_loss": -12.577003479003906, "global_step": 446788, "epoch": 2659} {"train_loss": -12.56938648223877, "global_step": 446789, "epoch": 2659} {"train_loss": -12.675642967224121, "global_step": 446790, "epoch": 2659} {"train_loss": -12.555635452270508, "global_step": 446791, "epoch": 2659} {"train_loss": -12.652599334716797, "global_step": 446792, "epoch": 2659} {"train_loss": -12.589622497558594, "global_step": 446793, "epoch": 2659} {"train_loss": -12.791828155517578, "global_step": 446794, "epoch": 2659} {"train_loss": -12.784737586975098, "global_step": 446795, "epoch": 2659} {"train_loss": -12.645502090454102, "global_step": 446796, "epoch": 2659} {"train_loss": -12.63638687133789, "global_step": 446797, "epoch": 2659} {"train_loss": -12.846916198730469, "global_step": 446798, "epoch": 2659} {"train_loss": -12.824247360229492, "global_step": 446799, "epoch": 2659} {"train_loss": -12.787779808044434, "global_step": 446800, "epoch": 2659} {"train_loss": -12.887044906616211, "global_step": 446801, "epoch": 2659} {"train_loss": -12.802803039550781, "global_step": 446802, "epoch": 2659} {"train_loss": -12.704025268554688, "global_step": 446803, "epoch": 2659} {"train_loss": -12.761740684509277, "global_step": 446804, "epoch": 2659} {"train_loss": -12.680699348449707, "global_step": 446805, "epoch": 2659} {"train_loss": -12.574397087097168, "global_step": 446806, "epoch": 2659} {"train_loss": -12.765462875366211, "global_step": 446807, "epoch": 2659} {"train_loss": -12.649017333984375, "global_step": 446808, "epoch": 2659} {"train_loss": -12.87401008605957, "global_step": 446809, "epoch": 2659} {"train_loss": -12.867643356323242, "global_step": 446810, "epoch": 2659} {"train_loss": -12.65825366973877, "global_step": 446811, "epoch": 2659} {"train_loss": -12.864737510681152, "global_step": 446812, "epoch": 2659} {"train_loss": -12.82491683959961, "global_step": 446813, "epoch": 2659} {"train_loss": -12.526853561401367, "global_step": 446814, "epoch": 2659} {"train_loss": -12.786856651306152, "global_step": 446815, "epoch": 2659} {"train_loss": -12.736124992370605, "global_step": 446816, "epoch": 2659} {"train_loss": -12.880073547363281, "global_step": 446817, "epoch": 2659} {"train_loss": -12.910236358642578, "global_step": 446818, "epoch": 2659} {"train_loss": -12.875236511230469, "global_step": 446819, "epoch": 2659} {"train_loss": -12.394587516784668, "global_step": 446820, "epoch": 2659} {"train_loss": -12.924419403076172, "global_step": 446821, "epoch": 2659} {"train_loss": -12.639028549194336, "global_step": 446822, "epoch": 2659} {"train_loss": -12.713499069213867, "global_step": 446823, "epoch": 2659} {"train_loss": -12.721586227416992, "global_step": 446824, "epoch": 2659} {"train_loss": -13.008729934692383, "global_step": 446825, "epoch": 2659} {"train_loss": -12.508430480957031, "global_step": 446826, "epoch": 2659} {"train_loss": -12.79791259765625, "global_step": 446827, "epoch": 2659} {"train_loss": -12.699460983276367, "global_step": 446828, "epoch": 2659} {"train_loss": -13.067358016967773, "global_step": 446829, "epoch": 2659} {"train_loss": -12.780080795288086, "global_step": 446830, "epoch": 2659} {"train_loss": -13.023774147033691, "global_step": 446831, "epoch": 2659} {"train_loss": -12.811639785766602, "global_step": 446832, "epoch": 2659} {"train_loss": -12.823841094970703, "global_step": 446833, "epoch": 2659} {"train_loss": -12.707108497619629, "global_step": 446834, "epoch": 2659} {"train_loss": -12.755233764648438, "global_step": 446835, "epoch": 2659} {"train_loss": -12.616294860839844, "global_step": 446836, "epoch": 2659} {"train_loss": -12.902107238769531, "global_step": 446837, "epoch": 2659} {"train_loss": -12.892356872558594, "global_step": 446838, "epoch": 2659} {"train_loss": -12.562315940856934, "global_step": 446839, "epoch": 2659} {"train_loss": -12.903314590454102, "global_step": 446840, "epoch": 2659} {"train_loss": -12.766242980957031, "global_step": 446841, "epoch": 2659} {"train_loss": -12.706280708312988, "global_step": 446842, "epoch": 2659} {"train_loss": -12.586990356445312, "global_step": 446843, "epoch": 2659} {"train_loss": -12.78608512878418, "global_step": 446844, "epoch": 2659} {"train_loss": -12.71822738647461, "global_step": 446845, "epoch": 2659} {"train_loss": -12.871086120605469, "global_step": 446846, "epoch": 2659} {"train_loss": -12.905436515808105, "global_step": 446847, "epoch": 2659} {"train_loss": -12.851762771606445, "global_step": 446848, "epoch": 2659} {"train_loss": -12.910888671875, "global_step": 446849, "epoch": 2659} {"train_loss": -12.978321075439453, "global_step": 446850, "epoch": 2659} {"train_loss": -12.835086822509766, "global_step": 446851, "epoch": 2659} {"train_loss": -12.288726806640625, "global_step": 446852, "epoch": 2659} {"train_loss": -12.750082015991211, "global_step": 446853, "epoch": 2659} {"train_loss": -12.431524276733398, "global_step": 446854, "epoch": 2659} {"train_loss": -12.303756713867188, "global_step": 446855, "epoch": 2659} {"train_loss": -11.285041809082031, "global_step": 446856, "epoch": 2659} {"train_loss": -11.224663734436035, "global_step": 446857, "epoch": 2659} {"train_loss": -12.59141731262207, "global_step": 446858, "epoch": 2659} {"train_loss": -11.553047180175781, "global_step": 446859, "epoch": 2659} {"train_loss": -11.576114654541016, "global_step": 446860, "epoch": 2659} {"train_loss": -12.057125091552734, "global_step": 446861, "epoch": 2659} {"train_loss": -11.903438568115234, "global_step": 446862, "epoch": 2659} {"train_loss": -11.144426345825195, "global_step": 446863, "epoch": 2659} {"train_loss": -11.1239013671875, "global_step": 446864, "epoch": 2659} {"train_loss": -12.19035530090332, "global_step": 446865, "epoch": 2659} {"train_loss": -11.849834442138672, "global_step": 446866, "epoch": 2659} {"train_loss": -12.074884414672852, "global_step": 446867, "epoch": 2659} {"train_loss": -10.801762580871582, "global_step": 446868, "epoch": 2659} {"train_loss": -10.494834899902344, "global_step": 446869, "epoch": 2659} {"train_loss": -11.985006332397461, "global_step": 446870, "epoch": 2659} {"train_loss": -9.251970291137695, "global_step": 446871, "epoch": 2659} {"train_loss": -9.322216987609863, "global_step": 446872, "epoch": 2659} {"train_loss": -11.07362174987793, "global_step": 446873, "epoch": 2659} {"train_loss": -10.03878402709961, "global_step": 446874, "epoch": 2659} {"train_loss": -9.381278991699219, "global_step": 446875, "epoch": 2659} {"train_loss": -10.029308319091797, "global_step": 446876, "epoch": 2659} {"train_loss": -10.138727188110352, "global_step": 446877, "epoch": 2659} {"train_loss": -9.444478988647461, "global_step": 446878, "epoch": 2659} {"train_loss": -11.733888796397618, "global_step": 446879, "epoch": 2659, "val_loss": 308554.34375} {"train_loss": -10.368999481201172, "global_step": 446880, "epoch": 2660} {"train_loss": -10.716327667236328, "global_step": 446881, "epoch": 2660} {"train_loss": -10.366247177124023, "global_step": 446882, "epoch": 2660} {"train_loss": -9.960359573364258, "global_step": 446883, "epoch": 2660} {"train_loss": -11.50922679901123, "global_step": 446884, "epoch": 2660} {"train_loss": -10.19560432434082, "global_step": 446885, "epoch": 2660} {"train_loss": -9.841739654541016, "global_step": 446886, "epoch": 2660} {"train_loss": -11.797852516174316, "global_step": 446887, "epoch": 2660} {"train_loss": -10.192667007446289, "global_step": 446888, "epoch": 2660} {"train_loss": -11.375873565673828, "global_step": 446889, "epoch": 2660} {"train_loss": -10.642630577087402, "global_step": 446890, "epoch": 2660} {"train_loss": -11.187004089355469, "global_step": 446891, "epoch": 2660} {"train_loss": -10.319731712341309, "global_step": 446892, "epoch": 2660} {"train_loss": -11.33432388305664, "global_step": 446893, "epoch": 2660} {"train_loss": -11.2197265625, "global_step": 446894, "epoch": 2660} {"train_loss": -11.734811782836914, "global_step": 446895, "epoch": 2660} {"train_loss": -11.083536148071289, "global_step": 446896, "epoch": 2660} {"train_loss": -11.365833282470703, "global_step": 446897, "epoch": 2660} {"train_loss": -11.389816284179688, "global_step": 446898, "epoch": 2660} {"train_loss": -11.69863510131836, "global_step": 446899, "epoch": 2660} {"train_loss": -11.999273300170898, "global_step": 446900, "epoch": 2660} {"train_loss": -11.766780853271484, "global_step": 446901, "epoch": 2660} {"train_loss": -11.528680801391602, "global_step": 446902, "epoch": 2660} {"train_loss": -11.77894401550293, "global_step": 446903, "epoch": 2660} {"train_loss": -11.957868576049805, "global_step": 446904, "epoch": 2660} {"train_loss": -11.253301620483398, "global_step": 446905, "epoch": 2660} {"train_loss": -11.804841995239258, "global_step": 446906, "epoch": 2660} {"train_loss": -11.713508605957031, "global_step": 446907, "epoch": 2660} {"train_loss": -12.022745132446289, "global_step": 446908, "epoch": 2660} {"train_loss": -11.517450332641602, "global_step": 446909, "epoch": 2660} {"train_loss": -12.040904998779297, "global_step": 446910, "epoch": 2660} {"train_loss": -11.946685791015625, "global_step": 446911, "epoch": 2660} {"train_loss": -11.857006072998047, "global_step": 446912, "epoch": 2660} {"train_loss": -11.948759078979492, "global_step": 446913, "epoch": 2660} {"train_loss": -12.154464721679688, "global_step": 446914, "epoch": 2660} {"train_loss": -12.006961822509766, "global_step": 446915, "epoch": 2660} {"train_loss": -12.074979782104492, "global_step": 446916, "epoch": 2660} {"train_loss": -12.0731201171875, "global_step": 446917, "epoch": 2660} {"train_loss": -12.070908546447754, "global_step": 446918, "epoch": 2660} {"train_loss": -12.131736755371094, "global_step": 446919, "epoch": 2660} {"train_loss": -12.414285659790039, "global_step": 446920, "epoch": 2660} {"train_loss": -12.333768844604492, "global_step": 446921, "epoch": 2660} {"train_loss": -11.882640838623047, "global_step": 446922, "epoch": 2660} {"train_loss": -12.293424606323242, "global_step": 446923, "epoch": 2660} {"train_loss": -12.134714126586914, "global_step": 446924, "epoch": 2660} {"train_loss": -12.044900894165039, "global_step": 446925, "epoch": 2660} {"train_loss": -12.151348114013672, "global_step": 446926, "epoch": 2660} {"train_loss": -12.067869186401367, "global_step": 446927, "epoch": 2660} {"train_loss": -11.977140426635742, "global_step": 446928, "epoch": 2660} {"train_loss": -12.27902603149414, "global_step": 446929, "epoch": 2660} {"train_loss": -12.562932014465332, "global_step": 446930, "epoch": 2660} {"train_loss": -12.045104026794434, "global_step": 446931, "epoch": 2660} {"train_loss": -12.446775436401367, "global_step": 446932, "epoch": 2660} {"train_loss": -12.051602363586426, "global_step": 446933, "epoch": 2660} {"train_loss": -12.42373275756836, "global_step": 446934, "epoch": 2660} {"train_loss": -12.3944091796875, "global_step": 446935, "epoch": 2660} {"train_loss": -12.19317626953125, "global_step": 446936, "epoch": 2660} {"train_loss": -12.624296188354492, "global_step": 446937, "epoch": 2660} {"train_loss": -12.10638427734375, "global_step": 446938, "epoch": 2660} {"train_loss": -12.526017189025879, "global_step": 446939, "epoch": 2660} {"train_loss": -12.237959861755371, "global_step": 446940, "epoch": 2660} {"train_loss": -12.368188858032227, "global_step": 446941, "epoch": 2660} {"train_loss": -12.56390380859375, "global_step": 446942, "epoch": 2660} {"train_loss": -12.286834716796875, "global_step": 446943, "epoch": 2660} {"train_loss": -12.695931434631348, "global_step": 446944, "epoch": 2660} {"train_loss": -12.166629791259766, "global_step": 446945, "epoch": 2660} {"train_loss": -12.515721321105957, "global_step": 446946, "epoch": 2660} {"train_loss": -12.57715892791748, "global_step": 446947, "epoch": 2660} {"train_loss": -12.30497932434082, "global_step": 446948, "epoch": 2660} {"train_loss": -12.302057266235352, "global_step": 446949, "epoch": 2660} {"train_loss": -12.523624420166016, "global_step": 446950, "epoch": 2660} {"train_loss": -12.36322021484375, "global_step": 446951, "epoch": 2660} {"train_loss": -12.611593246459961, "global_step": 446952, "epoch": 2660} {"train_loss": -12.584320068359375, "global_step": 446953, "epoch": 2660} {"train_loss": -12.57560920715332, "global_step": 446954, "epoch": 2660} {"train_loss": -12.340058326721191, "global_step": 446955, "epoch": 2660} {"train_loss": -12.430988311767578, "global_step": 446956, "epoch": 2660} {"train_loss": -12.271476745605469, "global_step": 446957, "epoch": 2660} {"train_loss": -12.342988014221191, "global_step": 446958, "epoch": 2660} {"train_loss": -12.313690185546875, "global_step": 446959, "epoch": 2660} {"train_loss": -12.698667526245117, "global_step": 446960, "epoch": 2660} {"train_loss": -12.272466659545898, "global_step": 446961, "epoch": 2660} {"train_loss": -12.596332550048828, "global_step": 446962, "epoch": 2660} {"train_loss": -12.383749008178711, "global_step": 446963, "epoch": 2660} {"train_loss": -12.645965576171875, "global_step": 446964, "epoch": 2660} {"train_loss": -12.424273490905762, "global_step": 446965, "epoch": 2660} {"train_loss": -12.628612518310547, "global_step": 446966, "epoch": 2660} {"train_loss": -12.72843074798584, "global_step": 446967, "epoch": 2660} {"train_loss": -12.83092975616455, "global_step": 446968, "epoch": 2660} {"train_loss": -12.578428268432617, "global_step": 446969, "epoch": 2660} {"train_loss": -12.705917358398438, "global_step": 446970, "epoch": 2660} {"train_loss": -12.733856201171875, "global_step": 446971, "epoch": 2660} {"train_loss": -12.6212739944458, "global_step": 446972, "epoch": 2660} {"train_loss": -12.804179191589355, "global_step": 446973, "epoch": 2660} {"train_loss": -12.648590087890625, "global_step": 446974, "epoch": 2660} {"train_loss": -12.736698150634766, "global_step": 446975, "epoch": 2660} {"train_loss": -12.706880569458008, "global_step": 446976, "epoch": 2660} {"train_loss": -12.820777893066406, "global_step": 446977, "epoch": 2660} {"train_loss": -12.769330978393555, "global_step": 446978, "epoch": 2660} {"train_loss": -12.757477760314941, "global_step": 446979, "epoch": 2660} {"train_loss": -12.464180946350098, "global_step": 446980, "epoch": 2660} {"train_loss": -12.830827713012695, "global_step": 446981, "epoch": 2660} {"train_loss": -12.775613784790039, "global_step": 446982, "epoch": 2660} {"train_loss": -12.490814208984375, "global_step": 446983, "epoch": 2660} {"train_loss": -13.004504203796387, "global_step": 446984, "epoch": 2660} {"train_loss": -12.587224006652832, "global_step": 446985, "epoch": 2660} {"train_loss": -12.852499008178711, "global_step": 446986, "epoch": 2660} {"train_loss": -12.692716598510742, "global_step": 446987, "epoch": 2660} {"train_loss": -12.246841430664062, "global_step": 446988, "epoch": 2660} {"train_loss": -12.605146408081055, "global_step": 446989, "epoch": 2660} {"train_loss": -12.715466499328613, "global_step": 446990, "epoch": 2660} {"train_loss": -12.79542350769043, "global_step": 446991, "epoch": 2660} {"train_loss": -13.106337547302246, "global_step": 446992, "epoch": 2660} {"train_loss": -12.812442779541016, "global_step": 446993, "epoch": 2660} {"train_loss": -12.668567657470703, "global_step": 446994, "epoch": 2660} {"train_loss": -12.578643798828125, "global_step": 446995, "epoch": 2660} {"train_loss": -12.89109992980957, "global_step": 446996, "epoch": 2660} {"train_loss": -12.895605087280273, "global_step": 446997, "epoch": 2660} {"train_loss": -12.800735473632812, "global_step": 446998, "epoch": 2660} {"train_loss": -12.861669540405273, "global_step": 446999, "epoch": 2660} {"train_loss": -12.880611419677734, "global_step": 447000, "epoch": 2660} {"train_loss": -12.808235168457031, "global_step": 447001, "epoch": 2660} {"train_loss": -12.989360809326172, "global_step": 447002, "epoch": 2660} {"train_loss": -12.960124015808105, "global_step": 447003, "epoch": 2660} {"train_loss": -12.737444877624512, "global_step": 447004, "epoch": 2660} {"train_loss": -12.925710678100586, "global_step": 447005, "epoch": 2660} {"train_loss": -12.873847961425781, "global_step": 447006, "epoch": 2660} {"train_loss": -12.310749053955078, "global_step": 447007, "epoch": 2660} {"train_loss": -12.408124923706055, "global_step": 447008, "epoch": 2660} {"train_loss": -12.28390121459961, "global_step": 447009, "epoch": 2660} {"train_loss": -12.735334396362305, "global_step": 447010, "epoch": 2660} {"train_loss": -12.885476112365723, "global_step": 447011, "epoch": 2660} {"train_loss": -12.66741943359375, "global_step": 447012, "epoch": 2660} {"train_loss": -11.965499877929688, "global_step": 447013, "epoch": 2660} {"train_loss": -12.014902114868164, "global_step": 447014, "epoch": 2660} {"train_loss": -12.652231216430664, "global_step": 447015, "epoch": 2660} {"train_loss": -12.422220230102539, "global_step": 447016, "epoch": 2660} {"train_loss": -11.026276588439941, "global_step": 447017, "epoch": 2660} {"train_loss": -10.162677764892578, "global_step": 447018, "epoch": 2660} {"train_loss": -11.066704750061035, "global_step": 447019, "epoch": 2660} {"train_loss": -11.90682601928711, "global_step": 447020, "epoch": 2660} {"train_loss": -11.507773399353027, "global_step": 447021, "epoch": 2660} {"train_loss": -11.76190185546875, "global_step": 447022, "epoch": 2660} {"train_loss": -10.114142417907715, "global_step": 447023, "epoch": 2660} {"train_loss": -12.015235900878906, "global_step": 447024, "epoch": 2660} {"train_loss": -10.084039688110352, "global_step": 447025, "epoch": 2660} {"train_loss": -10.094406127929688, "global_step": 447026, "epoch": 2660} {"train_loss": -11.926648139953613, "global_step": 447027, "epoch": 2660} {"train_loss": -9.532445907592773, "global_step": 447028, "epoch": 2660} {"train_loss": -10.845632553100586, "global_step": 447029, "epoch": 2660} {"train_loss": -9.489277839660645, "global_step": 447030, "epoch": 2660} {"train_loss": -10.689775466918945, "global_step": 447031, "epoch": 2660} {"train_loss": -9.50909423828125, "global_step": 447032, "epoch": 2660} {"train_loss": -9.497964859008789, "global_step": 447033, "epoch": 2660} {"train_loss": -8.730472564697266, "global_step": 447034, "epoch": 2660} {"train_loss": -8.560118675231934, "global_step": 447035, "epoch": 2660} {"train_loss": -10.471288681030273, "global_step": 447036, "epoch": 2660} {"train_loss": -9.947168350219727, "global_step": 447037, "epoch": 2660} {"train_loss": -10.143640518188477, "global_step": 447038, "epoch": 2660} {"train_loss": -10.499222755432129, "global_step": 447039, "epoch": 2660} {"train_loss": -10.520808219909668, "global_step": 447040, "epoch": 2660} {"train_loss": -11.96950912475586, "global_step": 447041, "epoch": 2660} {"train_loss": -11.179357528686523, "global_step": 447042, "epoch": 2660} {"train_loss": -11.756311416625977, "global_step": 447043, "epoch": 2660} {"train_loss": -11.455888748168945, "global_step": 447044, "epoch": 2660} {"train_loss": -10.874931335449219, "global_step": 447045, "epoch": 2660} {"train_loss": -12.010248184204102, "global_step": 447046, "epoch": 2660} {"train_loss": -11.918621063232422, "global_step": 447047, "epoch": 2660, "val_loss": 309657.59375, "train_action_mse_error": 1.7715073823928833} {"train_loss": -12.18846321105957, "global_step": 447048, "epoch": 2661} {"train_loss": -11.784322738647461, "global_step": 447049, "epoch": 2661} {"train_loss": -11.873403549194336, "global_step": 447050, "epoch": 2661} {"train_loss": -10.805002212524414, "global_step": 447051, "epoch": 2661} {"train_loss": -11.841043472290039, "global_step": 447052, "epoch": 2661} {"train_loss": -11.94654655456543, "global_step": 447053, "epoch": 2661} {"train_loss": -11.80025863647461, "global_step": 447054, "epoch": 2661} {"train_loss": -12.258623123168945, "global_step": 447055, "epoch": 2661} {"train_loss": -11.712207794189453, "global_step": 447056, "epoch": 2661} {"train_loss": -11.931334495544434, "global_step": 447057, "epoch": 2661} {"train_loss": -12.142618179321289, "global_step": 447058, "epoch": 2661} {"train_loss": -11.848665237426758, "global_step": 447059, "epoch": 2661} {"train_loss": -12.6040678024292, "global_step": 447060, "epoch": 2661} {"train_loss": -12.095708847045898, "global_step": 447061, "epoch": 2661} {"train_loss": -12.42563247680664, "global_step": 447062, "epoch": 2661} {"train_loss": -12.274270057678223, "global_step": 447063, "epoch": 2661} {"train_loss": -12.196026802062988, "global_step": 447064, "epoch": 2661} {"train_loss": -12.551462173461914, "global_step": 447065, "epoch": 2661} {"train_loss": -11.873558044433594, "global_step": 447066, "epoch": 2661} {"train_loss": -12.417512893676758, "global_step": 447067, "epoch": 2661} {"train_loss": -12.28581428527832, "global_step": 447068, "epoch": 2661} {"train_loss": -12.43510627746582, "global_step": 447069, "epoch": 2661} {"train_loss": -12.21225643157959, "global_step": 447070, "epoch": 2661} {"train_loss": -12.344865798950195, "global_step": 447071, "epoch": 2661} {"train_loss": -12.44316291809082, "global_step": 447072, "epoch": 2661} {"train_loss": -12.383674621582031, "global_step": 447073, "epoch": 2661} {"train_loss": -12.259449005126953, "global_step": 447074, "epoch": 2661} {"train_loss": -12.365548133850098, "global_step": 447075, "epoch": 2661} {"train_loss": -12.213253021240234, "global_step": 447076, "epoch": 2661} {"train_loss": -12.557807922363281, "global_step": 447077, "epoch": 2661} {"train_loss": -12.31765365600586, "global_step": 447078, "epoch": 2661} {"train_loss": -12.514994621276855, "global_step": 447079, "epoch": 2661} {"train_loss": -12.592423439025879, "global_step": 447080, "epoch": 2661} {"train_loss": -12.29696273803711, "global_step": 447081, "epoch": 2661} {"train_loss": -12.276079177856445, "global_step": 447082, "epoch": 2661} {"train_loss": -12.551619529724121, "global_step": 447083, "epoch": 2661} {"train_loss": -12.510209083557129, "global_step": 447084, "epoch": 2661} {"train_loss": -12.667933464050293, "global_step": 447085, "epoch": 2661} {"train_loss": -12.454605102539062, "global_step": 447086, "epoch": 2661} {"train_loss": -12.488525390625, "global_step": 447087, "epoch": 2661} {"train_loss": -12.372976303100586, "global_step": 447088, "epoch": 2661} {"train_loss": -12.455787658691406, "global_step": 447089, "epoch": 2661} {"train_loss": -12.572196006774902, "global_step": 447090, "epoch": 2661} {"train_loss": -12.637939453125, "global_step": 447091, "epoch": 2661} {"train_loss": -12.759454727172852, "global_step": 447092, "epoch": 2661} {"train_loss": -12.574146270751953, "global_step": 447093, "epoch": 2661} {"train_loss": -12.710298538208008, "global_step": 447094, "epoch": 2661} {"train_loss": -12.7501859664917, "global_step": 447095, "epoch": 2661} {"train_loss": -12.853131294250488, "global_step": 447096, "epoch": 2661} {"train_loss": -12.37730598449707, "global_step": 447097, "epoch": 2661} {"train_loss": -12.589546203613281, "global_step": 447098, "epoch": 2661} {"train_loss": -12.705263137817383, "global_step": 447099, "epoch": 2661} {"train_loss": -12.656925201416016, "global_step": 447100, "epoch": 2661} {"train_loss": -12.687236785888672, "global_step": 447101, "epoch": 2661} {"train_loss": -12.735173225402832, "global_step": 447102, "epoch": 2661} {"train_loss": -12.84119987487793, "global_step": 447103, "epoch": 2661} {"train_loss": -12.881820678710938, "global_step": 447104, "epoch": 2661} {"train_loss": -12.888591766357422, "global_step": 447105, "epoch": 2661} {"train_loss": -12.705761909484863, "global_step": 447106, "epoch": 2661} {"train_loss": -12.698188781738281, "global_step": 447107, "epoch": 2661} {"train_loss": -12.762372970581055, "global_step": 447108, "epoch": 2661} {"train_loss": -12.331470489501953, "global_step": 447109, "epoch": 2661} {"train_loss": -12.904340744018555, "global_step": 447110, "epoch": 2661} {"train_loss": -12.802410125732422, "global_step": 447111, "epoch": 2661} {"train_loss": -12.768514633178711, "global_step": 447112, "epoch": 2661} {"train_loss": -12.626150131225586, "global_step": 447113, "epoch": 2661} {"train_loss": -12.818013191223145, "global_step": 447114, "epoch": 2661} {"train_loss": -12.755696296691895, "global_step": 447115, "epoch": 2661} {"train_loss": -12.836406707763672, "global_step": 447116, "epoch": 2661} {"train_loss": -12.69287109375, "global_step": 447117, "epoch": 2661} {"train_loss": -12.709199905395508, "global_step": 447118, "epoch": 2661} {"train_loss": -12.594672203063965, "global_step": 447119, "epoch": 2661} {"train_loss": -12.229654312133789, "global_step": 447120, "epoch": 2661} {"train_loss": -12.331686019897461, "global_step": 447121, "epoch": 2661} {"train_loss": -12.951347351074219, "global_step": 447122, "epoch": 2661} {"train_loss": -12.322723388671875, "global_step": 447123, "epoch": 2661} {"train_loss": -12.475212097167969, "global_step": 447124, "epoch": 2661} {"train_loss": -13.005489349365234, "global_step": 447125, "epoch": 2661} {"train_loss": -12.953407287597656, "global_step": 447126, "epoch": 2661} {"train_loss": -12.400713920593262, "global_step": 447127, "epoch": 2661} {"train_loss": -12.360641479492188, "global_step": 447128, "epoch": 2661} {"train_loss": -12.891401290893555, "global_step": 447129, "epoch": 2661} {"train_loss": -12.586795806884766, "global_step": 447130, "epoch": 2661} {"train_loss": -11.802730560302734, "global_step": 447131, "epoch": 2661} {"train_loss": -12.070676803588867, "global_step": 447132, "epoch": 2661} {"train_loss": -12.81987190246582, "global_step": 447133, "epoch": 2661} {"train_loss": -12.389297485351562, "global_step": 447134, "epoch": 2661} {"train_loss": -12.234430313110352, "global_step": 447135, "epoch": 2661} {"train_loss": -12.791900634765625, "global_step": 447136, "epoch": 2661} {"train_loss": -12.067044258117676, "global_step": 447137, "epoch": 2661} {"train_loss": -11.350967407226562, "global_step": 447138, "epoch": 2661} {"train_loss": -11.797388076782227, "global_step": 447139, "epoch": 2661} {"train_loss": -12.253693580627441, "global_step": 447140, "epoch": 2661} {"train_loss": -11.328510284423828, "global_step": 447141, "epoch": 2661} {"train_loss": -12.121075630187988, "global_step": 447142, "epoch": 2661} {"train_loss": -12.417754173278809, "global_step": 447143, "epoch": 2661} {"train_loss": -11.786355972290039, "global_step": 447144, "epoch": 2661} {"train_loss": -11.731342315673828, "global_step": 447145, "epoch": 2661} {"train_loss": -11.987604141235352, "global_step": 447146, "epoch": 2661} {"train_loss": -11.964859962463379, "global_step": 447147, "epoch": 2661} {"train_loss": -11.45427131652832, "global_step": 447148, "epoch": 2661} {"train_loss": -11.02065658569336, "global_step": 447149, "epoch": 2661} {"train_loss": -11.452218055725098, "global_step": 447150, "epoch": 2661} {"train_loss": -9.428152084350586, "global_step": 447151, "epoch": 2661} {"train_loss": -9.283536911010742, "global_step": 447152, "epoch": 2661} {"train_loss": -9.472591400146484, "global_step": 447153, "epoch": 2661} {"train_loss": -10.129671096801758, "global_step": 447154, "epoch": 2661} {"train_loss": -10.0685453414917, "global_step": 447155, "epoch": 2661} {"train_loss": -9.54949951171875, "global_step": 447156, "epoch": 2661} {"train_loss": -10.545356750488281, "global_step": 447157, "epoch": 2661} {"train_loss": -10.798232078552246, "global_step": 447158, "epoch": 2661} {"train_loss": -9.949060440063477, "global_step": 447159, "epoch": 2661} {"train_loss": -10.050887107849121, "global_step": 447160, "epoch": 2661} {"train_loss": -10.682394027709961, "global_step": 447161, "epoch": 2661} {"train_loss": -11.422981262207031, "global_step": 447162, "epoch": 2661} {"train_loss": -10.857194900512695, "global_step": 447163, "epoch": 2661} {"train_loss": -10.986883163452148, "global_step": 447164, "epoch": 2661} {"train_loss": -11.3377046585083, "global_step": 447165, "epoch": 2661} {"train_loss": -11.661579132080078, "global_step": 447166, "epoch": 2661} {"train_loss": -10.409421920776367, "global_step": 447167, "epoch": 2661} {"train_loss": -11.701534271240234, "global_step": 447168, "epoch": 2661} {"train_loss": -12.018924713134766, "global_step": 447169, "epoch": 2661} {"train_loss": -11.181761741638184, "global_step": 447170, "epoch": 2661} {"train_loss": -11.104162216186523, "global_step": 447171, "epoch": 2661} {"train_loss": -11.579779624938965, "global_step": 447172, "epoch": 2661} {"train_loss": -10.252965927124023, "global_step": 447173, "epoch": 2661} {"train_loss": -11.334695816040039, "global_step": 447174, "epoch": 2661} {"train_loss": -10.029081344604492, "global_step": 447175, "epoch": 2661} {"train_loss": -10.736963272094727, "global_step": 447176, "epoch": 2661} {"train_loss": -9.64787769317627, "global_step": 447177, "epoch": 2661} {"train_loss": -11.464673042297363, "global_step": 447178, "epoch": 2661} {"train_loss": -10.290699005126953, "global_step": 447179, "epoch": 2661} {"train_loss": -11.68775749206543, "global_step": 447180, "epoch": 2661} {"train_loss": -10.408522605895996, "global_step": 447181, "epoch": 2661} {"train_loss": -11.321731567382812, "global_step": 447182, "epoch": 2661} {"train_loss": -10.880781173706055, "global_step": 447183, "epoch": 2661} {"train_loss": -10.943418502807617, "global_step": 447184, "epoch": 2661} {"train_loss": -11.078243255615234, "global_step": 447185, "epoch": 2661} {"train_loss": -11.598777770996094, "global_step": 447186, "epoch": 2661} {"train_loss": -11.618319511413574, "global_step": 447187, "epoch": 2661} {"train_loss": -11.831008911132812, "global_step": 447188, "epoch": 2661} {"train_loss": -11.757796287536621, "global_step": 447189, "epoch": 2661} {"train_loss": -11.937061309814453, "global_step": 447190, "epoch": 2661} {"train_loss": -11.910300254821777, "global_step": 447191, "epoch": 2661} {"train_loss": -12.139854431152344, "global_step": 447192, "epoch": 2661} {"train_loss": -12.054635047912598, "global_step": 447193, "epoch": 2661} {"train_loss": -12.022489547729492, "global_step": 447194, "epoch": 2661} {"train_loss": -12.334745407104492, "global_step": 447195, "epoch": 2661} {"train_loss": -12.410057067871094, "global_step": 447196, "epoch": 2661} {"train_loss": -12.10357666015625, "global_step": 447197, "epoch": 2661} {"train_loss": -12.321181297302246, "global_step": 447198, "epoch": 2661} {"train_loss": -12.569244384765625, "global_step": 447199, "epoch": 2661} {"train_loss": -12.385917663574219, "global_step": 447200, "epoch": 2661} {"train_loss": -12.408588409423828, "global_step": 447201, "epoch": 2661} {"train_loss": -12.567485809326172, "global_step": 447202, "epoch": 2661} {"train_loss": -12.453374862670898, "global_step": 447203, "epoch": 2661} {"train_loss": -12.559211730957031, "global_step": 447204, "epoch": 2661} {"train_loss": -12.382368087768555, "global_step": 447205, "epoch": 2661} {"train_loss": -12.55332088470459, "global_step": 447206, "epoch": 2661} {"train_loss": -12.38406753540039, "global_step": 447207, "epoch": 2661} {"train_loss": -12.431053161621094, "global_step": 447208, "epoch": 2661} {"train_loss": -12.684005737304688, "global_step": 447209, "epoch": 2661} {"train_loss": -12.705080032348633, "global_step": 447210, "epoch": 2661} {"train_loss": -12.470888137817383, "global_step": 447211, "epoch": 2661} {"train_loss": -12.703842163085938, "global_step": 447212, "epoch": 2661} {"train_loss": -12.524174690246582, "global_step": 447213, "epoch": 2661} {"train_loss": -12.63405990600586, "global_step": 447214, "epoch": 2661} {"train_loss": -11.99659172126225, "global_step": 447215, "epoch": 2661, "val_loss": 304763.75} {"train_loss": -12.510198593139648, "global_step": 447216, "epoch": 2662} {"train_loss": -12.457720756530762, "global_step": 447217, "epoch": 2662} {"train_loss": -12.869379043579102, "global_step": 447218, "epoch": 2662} {"train_loss": -12.565091133117676, "global_step": 447219, "epoch": 2662} {"train_loss": -12.69186019897461, "global_step": 447220, "epoch": 2662} {"train_loss": -12.66956901550293, "global_step": 447221, "epoch": 2662} {"train_loss": -12.64303207397461, "global_step": 447222, "epoch": 2662} {"train_loss": -12.641927719116211, "global_step": 447223, "epoch": 2662} {"train_loss": -12.612744331359863, "global_step": 447224, "epoch": 2662} {"train_loss": -12.677023887634277, "global_step": 447225, "epoch": 2662} {"train_loss": -12.750640869140625, "global_step": 447226, "epoch": 2662} {"train_loss": -12.485235214233398, "global_step": 447227, "epoch": 2662} {"train_loss": -12.729754447937012, "global_step": 447228, "epoch": 2662} {"train_loss": -12.758411407470703, "global_step": 447229, "epoch": 2662} {"train_loss": -12.643379211425781, "global_step": 447230, "epoch": 2662} {"train_loss": -12.622758865356445, "global_step": 447231, "epoch": 2662} {"train_loss": -12.621940612792969, "global_step": 447232, "epoch": 2662} {"train_loss": -12.674571990966797, "global_step": 447233, "epoch": 2662} {"train_loss": -12.786130905151367, "global_step": 447234, "epoch": 2662} {"train_loss": -12.712875366210938, "global_step": 447235, "epoch": 2662} {"train_loss": -12.736788749694824, "global_step": 447236, "epoch": 2662} {"train_loss": -12.595125198364258, "global_step": 447237, "epoch": 2662} {"train_loss": -12.590751647949219, "global_step": 447238, "epoch": 2662} {"train_loss": -12.648698806762695, "global_step": 447239, "epoch": 2662} {"train_loss": -12.925311088562012, "global_step": 447240, "epoch": 2662} {"train_loss": -12.85084056854248, "global_step": 447241, "epoch": 2662} {"train_loss": -12.710260391235352, "global_step": 447242, "epoch": 2662} {"train_loss": -12.711650848388672, "global_step": 447243, "epoch": 2662} {"train_loss": -12.600894927978516, "global_step": 447244, "epoch": 2662} {"train_loss": -12.73427677154541, "global_step": 447245, "epoch": 2662} {"train_loss": -12.932760238647461, "global_step": 447246, "epoch": 2662} {"train_loss": -12.909442901611328, "global_step": 447247, "epoch": 2662} {"train_loss": -12.830255508422852, "global_step": 447248, "epoch": 2662} {"train_loss": -12.802967071533203, "global_step": 447249, "epoch": 2662} {"train_loss": -12.794090270996094, "global_step": 447250, "epoch": 2662} {"train_loss": -12.68585205078125, "global_step": 447251, "epoch": 2662} {"train_loss": -12.698966026306152, "global_step": 447252, "epoch": 2662} {"train_loss": -12.846138000488281, "global_step": 447253, "epoch": 2662} {"train_loss": -12.619555473327637, "global_step": 447254, "epoch": 2662} {"train_loss": -12.862909317016602, "global_step": 447255, "epoch": 2662} {"train_loss": -12.514413833618164, "global_step": 447256, "epoch": 2662} {"train_loss": -12.784049987792969, "global_step": 447257, "epoch": 2662} {"train_loss": -12.724430084228516, "global_step": 447258, "epoch": 2662} {"train_loss": -12.64810848236084, "global_step": 447259, "epoch": 2662} {"train_loss": -12.424524307250977, "global_step": 447260, "epoch": 2662} {"train_loss": -12.346327781677246, "global_step": 447261, "epoch": 2662} {"train_loss": -12.549755096435547, "global_step": 447262, "epoch": 2662} {"train_loss": -12.57996940612793, "global_step": 447263, "epoch": 2662} {"train_loss": -12.365707397460938, "global_step": 447264, "epoch": 2662} {"train_loss": -12.413749694824219, "global_step": 447265, "epoch": 2662} {"train_loss": -12.243221282958984, "global_step": 447266, "epoch": 2662} {"train_loss": -12.709188461303711, "global_step": 447267, "epoch": 2662} {"train_loss": -12.219437599182129, "global_step": 447268, "epoch": 2662} {"train_loss": -12.912615776062012, "global_step": 447269, "epoch": 2662} {"train_loss": -12.466320991516113, "global_step": 447270, "epoch": 2662} {"train_loss": -12.192115783691406, "global_step": 447271, "epoch": 2662} {"train_loss": -11.265913009643555, "global_step": 447272, "epoch": 2662} {"train_loss": -11.484147071838379, "global_step": 447273, "epoch": 2662} {"train_loss": -12.665117263793945, "global_step": 447274, "epoch": 2662} {"train_loss": -11.152929306030273, "global_step": 447275, "epoch": 2662} {"train_loss": -10.447505950927734, "global_step": 447276, "epoch": 2662} {"train_loss": -11.151518821716309, "global_step": 447277, "epoch": 2662} {"train_loss": -11.821959495544434, "global_step": 447278, "epoch": 2662} {"train_loss": -11.937362670898438, "global_step": 447279, "epoch": 2662} {"train_loss": -10.415907859802246, "global_step": 447280, "epoch": 2662} {"train_loss": -11.709932327270508, "global_step": 447281, "epoch": 2662} {"train_loss": -10.726359367370605, "global_step": 447282, "epoch": 2662} {"train_loss": -11.227055549621582, "global_step": 447283, "epoch": 2662} {"train_loss": -11.15097427368164, "global_step": 447284, "epoch": 2662} {"train_loss": -10.776025772094727, "global_step": 447285, "epoch": 2662} {"train_loss": -11.6272611618042, "global_step": 447286, "epoch": 2662} {"train_loss": -11.072358131408691, "global_step": 447287, "epoch": 2662} {"train_loss": -11.414411544799805, "global_step": 447288, "epoch": 2662} {"train_loss": -11.20997428894043, "global_step": 447289, "epoch": 2662} {"train_loss": -10.679269790649414, "global_step": 447290, "epoch": 2662} {"train_loss": -11.479028701782227, "global_step": 447291, "epoch": 2662} {"train_loss": -11.64107894897461, "global_step": 447292, "epoch": 2662} {"train_loss": -12.097282409667969, "global_step": 447293, "epoch": 2662} {"train_loss": -11.864412307739258, "global_step": 447294, "epoch": 2662} {"train_loss": -11.521929740905762, "global_step": 447295, "epoch": 2662} {"train_loss": -11.292428970336914, "global_step": 447296, "epoch": 2662} {"train_loss": -12.486577987670898, "global_step": 447297, "epoch": 2662} {"train_loss": -11.598711013793945, "global_step": 447298, "epoch": 2662} {"train_loss": -12.048316955566406, "global_step": 447299, "epoch": 2662} {"train_loss": -12.284383773803711, "global_step": 447300, "epoch": 2662} {"train_loss": -11.94552993774414, "global_step": 447301, "epoch": 2662} {"train_loss": -11.928467750549316, "global_step": 447302, "epoch": 2662} {"train_loss": -12.201848983764648, "global_step": 447303, "epoch": 2662} {"train_loss": -12.241186141967773, "global_step": 447304, "epoch": 2662} {"train_loss": -11.929919242858887, "global_step": 447305, "epoch": 2662} {"train_loss": -11.96609878540039, "global_step": 447306, "epoch": 2662} {"train_loss": -12.092153549194336, "global_step": 447307, "epoch": 2662} {"train_loss": -12.032320022583008, "global_step": 447308, "epoch": 2662} {"train_loss": -11.90282154083252, "global_step": 447309, "epoch": 2662} {"train_loss": -12.314456939697266, "global_step": 447310, "epoch": 2662} {"train_loss": -11.258071899414062, "global_step": 447311, "epoch": 2662} {"train_loss": -12.451504707336426, "global_step": 447312, "epoch": 2662} {"train_loss": -11.435775756835938, "global_step": 447313, "epoch": 2662} {"train_loss": -11.490043640136719, "global_step": 447314, "epoch": 2662} {"train_loss": -11.559673309326172, "global_step": 447315, "epoch": 2662} {"train_loss": -12.087515830993652, "global_step": 447316, "epoch": 2662} {"train_loss": -11.726576805114746, "global_step": 447317, "epoch": 2662} {"train_loss": -11.964743614196777, "global_step": 447318, "epoch": 2662} {"train_loss": -11.702587127685547, "global_step": 447319, "epoch": 2662} {"train_loss": -12.460189819335938, "global_step": 447320, "epoch": 2662} {"train_loss": -11.540473937988281, "global_step": 447321, "epoch": 2662} {"train_loss": -12.30431842803955, "global_step": 447322, "epoch": 2662} {"train_loss": -11.88497543334961, "global_step": 447323, "epoch": 2662} {"train_loss": -11.50048542022705, "global_step": 447324, "epoch": 2662} {"train_loss": -12.049134254455566, "global_step": 447325, "epoch": 2662} {"train_loss": -12.001381874084473, "global_step": 447326, "epoch": 2662} {"train_loss": -11.748980522155762, "global_step": 447327, "epoch": 2662} {"train_loss": -12.48428726196289, "global_step": 447328, "epoch": 2662} {"train_loss": -11.314207077026367, "global_step": 447329, "epoch": 2662} {"train_loss": -12.019746780395508, "global_step": 447330, "epoch": 2662} {"train_loss": -11.81015396118164, "global_step": 447331, "epoch": 2662} {"train_loss": -11.669622421264648, "global_step": 447332, "epoch": 2662} {"train_loss": -11.51177978515625, "global_step": 447333, "epoch": 2662} {"train_loss": -12.138818740844727, "global_step": 447334, "epoch": 2662} {"train_loss": -11.454736709594727, "global_step": 447335, "epoch": 2662} {"train_loss": -11.683931350708008, "global_step": 447336, "epoch": 2662} {"train_loss": -10.766498565673828, "global_step": 447337, "epoch": 2662} {"train_loss": -11.332489967346191, "global_step": 447338, "epoch": 2662} {"train_loss": -11.931671142578125, "global_step": 447339, "epoch": 2662} {"train_loss": -11.19620132446289, "global_step": 447340, "epoch": 2662} {"train_loss": -11.475872039794922, "global_step": 447341, "epoch": 2662} {"train_loss": -11.363707542419434, "global_step": 447342, "epoch": 2662} {"train_loss": -10.886850357055664, "global_step": 447343, "epoch": 2662} {"train_loss": -11.780856132507324, "global_step": 447344, "epoch": 2662} {"train_loss": -11.791072845458984, "global_step": 447345, "epoch": 2662} {"train_loss": -10.808313369750977, "global_step": 447346, "epoch": 2662} {"train_loss": -10.457759857177734, "global_step": 447347, "epoch": 2662} {"train_loss": -11.545381546020508, "global_step": 447348, "epoch": 2662} {"train_loss": -10.777462005615234, "global_step": 447349, "epoch": 2662} {"train_loss": -12.244644165039062, "global_step": 447350, "epoch": 2662} {"train_loss": -11.482597351074219, "global_step": 447351, "epoch": 2662} {"train_loss": -11.733365058898926, "global_step": 447352, "epoch": 2662} {"train_loss": -11.893787384033203, "global_step": 447353, "epoch": 2662} {"train_loss": -11.732065200805664, "global_step": 447354, "epoch": 2662} {"train_loss": -12.198944091796875, "global_step": 447355, "epoch": 2662} {"train_loss": -11.933379173278809, "global_step": 447356, "epoch": 2662} {"train_loss": -12.159502029418945, "global_step": 447357, "epoch": 2662} {"train_loss": -12.119752883911133, "global_step": 447358, "epoch": 2662} {"train_loss": -11.826026916503906, "global_step": 447359, "epoch": 2662} {"train_loss": -12.140363693237305, "global_step": 447360, "epoch": 2662} {"train_loss": -11.819753646850586, "global_step": 447361, "epoch": 2662} {"train_loss": -12.286352157592773, "global_step": 447362, "epoch": 2662} {"train_loss": -12.055561065673828, "global_step": 447363, "epoch": 2662} {"train_loss": -12.449179649353027, "global_step": 447364, "epoch": 2662} {"train_loss": -12.315733909606934, "global_step": 447365, "epoch": 2662} {"train_loss": -12.49691104888916, "global_step": 447366, "epoch": 2662} {"train_loss": -12.432565689086914, "global_step": 447367, "epoch": 2662} {"train_loss": -12.450933456420898, "global_step": 447368, "epoch": 2662} {"train_loss": -12.579030990600586, "global_step": 447369, "epoch": 2662} {"train_loss": -12.52390193939209, "global_step": 447370, "epoch": 2662} {"train_loss": -12.377256393432617, "global_step": 447371, "epoch": 2662} {"train_loss": -12.521292686462402, "global_step": 447372, "epoch": 2662} {"train_loss": -12.388145446777344, "global_step": 447373, "epoch": 2662} {"train_loss": -12.618698120117188, "global_step": 447374, "epoch": 2662} {"train_loss": -12.372668266296387, "global_step": 447375, "epoch": 2662} {"train_loss": -12.40611743927002, "global_step": 447376, "epoch": 2662} {"train_loss": -12.695486068725586, "global_step": 447377, "epoch": 2662} {"train_loss": -12.70335865020752, "global_step": 447378, "epoch": 2662} {"train_loss": -12.71865463256836, "global_step": 447379, "epoch": 2662} {"train_loss": -12.624061584472656, "global_step": 447380, "epoch": 2662} {"train_loss": -12.69636344909668, "global_step": 447381, "epoch": 2662} {"train_loss": -12.797441482543945, "global_step": 447382, "epoch": 2662} {"train_loss": -12.100940551076617, "global_step": 447383, "epoch": 2662, "val_loss": 314794.59375} {"train_loss": -12.739904403686523, "global_step": 447384, "epoch": 2663} {"train_loss": -12.88943099975586, "global_step": 447385, "epoch": 2663} {"train_loss": -12.589984893798828, "global_step": 447386, "epoch": 2663} {"train_loss": -12.693608283996582, "global_step": 447387, "epoch": 2663} {"train_loss": -12.83981704711914, "global_step": 447388, "epoch": 2663} {"train_loss": -12.604747772216797, "global_step": 447389, "epoch": 2663} {"train_loss": -12.750786781311035, "global_step": 447390, "epoch": 2663} {"train_loss": -12.572786331176758, "global_step": 447391, "epoch": 2663} {"train_loss": -12.941730499267578, "global_step": 447392, "epoch": 2663} {"train_loss": -12.664655685424805, "global_step": 447393, "epoch": 2663} {"train_loss": -12.529146194458008, "global_step": 447394, "epoch": 2663} {"train_loss": -12.783721923828125, "global_step": 447395, "epoch": 2663} {"train_loss": -12.613290786743164, "global_step": 447396, "epoch": 2663} {"train_loss": -12.65886116027832, "global_step": 447397, "epoch": 2663} {"train_loss": -12.802811622619629, "global_step": 447398, "epoch": 2663} {"train_loss": -12.592513084411621, "global_step": 447399, "epoch": 2663} {"train_loss": -12.725252151489258, "global_step": 447400, "epoch": 2663} {"train_loss": -12.73294734954834, "global_step": 447401, "epoch": 2663} {"train_loss": -12.827627182006836, "global_step": 447402, "epoch": 2663} {"train_loss": -12.557718276977539, "global_step": 447403, "epoch": 2663} {"train_loss": -12.903987884521484, "global_step": 447404, "epoch": 2663} {"train_loss": -12.235849380493164, "global_step": 447405, "epoch": 2663} {"train_loss": -12.81008529663086, "global_step": 447406, "epoch": 2663} {"train_loss": -12.774103164672852, "global_step": 447407, "epoch": 2663} {"train_loss": -12.678308486938477, "global_step": 447408, "epoch": 2663} {"train_loss": -12.618422508239746, "global_step": 447409, "epoch": 2663} {"train_loss": -12.545953750610352, "global_step": 447410, "epoch": 2663} {"train_loss": -12.790454864501953, "global_step": 447411, "epoch": 2663} {"train_loss": -12.50745964050293, "global_step": 447412, "epoch": 2663} {"train_loss": -12.731422424316406, "global_step": 447413, "epoch": 2663} {"train_loss": -12.637075424194336, "global_step": 447414, "epoch": 2663} {"train_loss": -12.507210731506348, "global_step": 447415, "epoch": 2663} {"train_loss": -12.127496719360352, "global_step": 447416, "epoch": 2663} {"train_loss": -12.877543449401855, "global_step": 447417, "epoch": 2663} {"train_loss": -12.47649097442627, "global_step": 447418, "epoch": 2663} {"train_loss": -12.50426197052002, "global_step": 447419, "epoch": 2663} {"train_loss": -12.64647102355957, "global_step": 447420, "epoch": 2663} {"train_loss": -12.458673477172852, "global_step": 447421, "epoch": 2663} {"train_loss": -12.405794143676758, "global_step": 447422, "epoch": 2663} {"train_loss": -12.731714248657227, "global_step": 447423, "epoch": 2663} {"train_loss": -12.850561141967773, "global_step": 447424, "epoch": 2663} {"train_loss": -12.612146377563477, "global_step": 447425, "epoch": 2663} {"train_loss": -12.973838806152344, "global_step": 447426, "epoch": 2663} {"train_loss": -12.417203903198242, "global_step": 447427, "epoch": 2663} {"train_loss": -12.510223388671875, "global_step": 447428, "epoch": 2663} {"train_loss": -12.658428192138672, "global_step": 447429, "epoch": 2663} {"train_loss": -12.710888862609863, "global_step": 447430, "epoch": 2663} {"train_loss": -12.234563827514648, "global_step": 447431, "epoch": 2663} {"train_loss": -12.31047534942627, "global_step": 447432, "epoch": 2663} {"train_loss": -12.306774139404297, "global_step": 447433, "epoch": 2663} {"train_loss": -11.679443359375, "global_step": 447434, "epoch": 2663} {"train_loss": -11.536767959594727, "global_step": 447435, "epoch": 2663} {"train_loss": -12.864143371582031, "global_step": 447436, "epoch": 2663} {"train_loss": -12.007451057434082, "global_step": 447437, "epoch": 2663} {"train_loss": -11.26208782196045, "global_step": 447438, "epoch": 2663} {"train_loss": -12.345405578613281, "global_step": 447439, "epoch": 2663} {"train_loss": -11.543376922607422, "global_step": 447440, "epoch": 2663} {"train_loss": -11.882593154907227, "global_step": 447441, "epoch": 2663} {"train_loss": -12.053359985351562, "global_step": 447442, "epoch": 2663} {"train_loss": -11.730682373046875, "global_step": 447443, "epoch": 2663} {"train_loss": -11.767724990844727, "global_step": 447444, "epoch": 2663} {"train_loss": -12.150663375854492, "global_step": 447445, "epoch": 2663} {"train_loss": -12.570100784301758, "global_step": 447446, "epoch": 2663} {"train_loss": -11.680366516113281, "global_step": 447447, "epoch": 2663} {"train_loss": -11.138949394226074, "global_step": 447448, "epoch": 2663} {"train_loss": -12.354917526245117, "global_step": 447449, "epoch": 2663} {"train_loss": -11.730798721313477, "global_step": 447450, "epoch": 2663} {"train_loss": -10.644775390625, "global_step": 447451, "epoch": 2663} {"train_loss": -11.980907440185547, "global_step": 447452, "epoch": 2663} {"train_loss": -10.605891227722168, "global_step": 447453, "epoch": 2663} {"train_loss": -10.347980499267578, "global_step": 447454, "epoch": 2663} {"train_loss": -11.319411277770996, "global_step": 447455, "epoch": 2663} {"train_loss": -9.79844856262207, "global_step": 447456, "epoch": 2663} {"train_loss": -11.779254913330078, "global_step": 447457, "epoch": 2663} {"train_loss": -10.300653457641602, "global_step": 447458, "epoch": 2663} {"train_loss": -11.134559631347656, "global_step": 447459, "epoch": 2663} {"train_loss": -10.150970458984375, "global_step": 447460, "epoch": 2663} {"train_loss": -10.112163543701172, "global_step": 447461, "epoch": 2663} {"train_loss": -8.663668632507324, "global_step": 447462, "epoch": 2663} {"train_loss": -9.210869789123535, "global_step": 447463, "epoch": 2663} {"train_loss": -9.92060375213623, "global_step": 447464, "epoch": 2663} {"train_loss": -9.896783828735352, "global_step": 447465, "epoch": 2663} {"train_loss": -10.481508255004883, "global_step": 447466, "epoch": 2663} {"train_loss": -9.614315032958984, "global_step": 447467, "epoch": 2663} {"train_loss": -10.391972541809082, "global_step": 447468, "epoch": 2663} {"train_loss": -10.569290161132812, "global_step": 447469, "epoch": 2663} {"train_loss": -10.082941055297852, "global_step": 447470, "epoch": 2663} {"train_loss": -10.25200080871582, "global_step": 447471, "epoch": 2663} {"train_loss": -11.076427459716797, "global_step": 447472, "epoch": 2663} {"train_loss": -10.509743690490723, "global_step": 447473, "epoch": 2663} {"train_loss": -11.040640830993652, "global_step": 447474, "epoch": 2663} {"train_loss": -11.559297561645508, "global_step": 447475, "epoch": 2663} {"train_loss": -10.35814380645752, "global_step": 447476, "epoch": 2663} {"train_loss": -11.172690391540527, "global_step": 447477, "epoch": 2663} {"train_loss": -10.481468200683594, "global_step": 447478, "epoch": 2663} {"train_loss": -11.181001663208008, "global_step": 447479, "epoch": 2663} {"train_loss": -11.29108715057373, "global_step": 447480, "epoch": 2663} {"train_loss": -11.23039722442627, "global_step": 447481, "epoch": 2663} {"train_loss": -11.6659574508667, "global_step": 447482, "epoch": 2663} {"train_loss": -11.937898635864258, "global_step": 447483, "epoch": 2663} {"train_loss": -11.589343070983887, "global_step": 447484, "epoch": 2663} {"train_loss": -11.921350479125977, "global_step": 447485, "epoch": 2663} {"train_loss": -11.853076934814453, "global_step": 447486, "epoch": 2663} {"train_loss": -11.903657913208008, "global_step": 447487, "epoch": 2663} {"train_loss": -12.107056617736816, "global_step": 447488, "epoch": 2663} {"train_loss": -11.745980262756348, "global_step": 447489, "epoch": 2663} {"train_loss": -11.713177680969238, "global_step": 447490, "epoch": 2663} {"train_loss": -12.084392547607422, "global_step": 447491, "epoch": 2663} {"train_loss": -11.567621231079102, "global_step": 447492, "epoch": 2663} {"train_loss": -12.004204750061035, "global_step": 447493, "epoch": 2663} {"train_loss": -11.600349426269531, "global_step": 447494, "epoch": 2663} {"train_loss": -11.899100303649902, "global_step": 447495, "epoch": 2663} {"train_loss": -11.897940635681152, "global_step": 447496, "epoch": 2663} {"train_loss": -12.156248092651367, "global_step": 447497, "epoch": 2663} {"train_loss": -11.785027503967285, "global_step": 447498, "epoch": 2663} {"train_loss": -12.34622859954834, "global_step": 447499, "epoch": 2663} {"train_loss": -11.942996978759766, "global_step": 447500, "epoch": 2663} {"train_loss": -12.302143096923828, "global_step": 447501, "epoch": 2663} {"train_loss": -12.266569137573242, "global_step": 447502, "epoch": 2663} {"train_loss": -12.186651229858398, "global_step": 447503, "epoch": 2663} {"train_loss": -12.29696273803711, "global_step": 447504, "epoch": 2663} {"train_loss": -12.423456192016602, "global_step": 447505, "epoch": 2663} {"train_loss": -12.158470153808594, "global_step": 447506, "epoch": 2663} {"train_loss": -12.251422882080078, "global_step": 447507, "epoch": 2663} {"train_loss": -12.419197082519531, "global_step": 447508, "epoch": 2663} {"train_loss": -12.190783500671387, "global_step": 447509, "epoch": 2663} {"train_loss": -12.374984741210938, "global_step": 447510, "epoch": 2663} {"train_loss": -12.37468147277832, "global_step": 447511, "epoch": 2663} {"train_loss": -12.508485794067383, "global_step": 447512, "epoch": 2663} {"train_loss": -12.127016067504883, "global_step": 447513, "epoch": 2663} {"train_loss": -12.480915069580078, "global_step": 447514, "epoch": 2663} {"train_loss": -12.18334674835205, "global_step": 447515, "epoch": 2663} {"train_loss": -12.449760437011719, "global_step": 447516, "epoch": 2663} {"train_loss": -12.65302848815918, "global_step": 447517, "epoch": 2663} {"train_loss": -12.401187896728516, "global_step": 447518, "epoch": 2663} {"train_loss": -12.439554214477539, "global_step": 447519, "epoch": 2663} {"train_loss": -12.500072479248047, "global_step": 447520, "epoch": 2663} {"train_loss": -12.612874984741211, "global_step": 447521, "epoch": 2663} {"train_loss": -12.717514038085938, "global_step": 447522, "epoch": 2663} {"train_loss": -12.651132583618164, "global_step": 447523, "epoch": 2663} {"train_loss": -12.676409721374512, "global_step": 447524, "epoch": 2663} {"train_loss": -12.406501770019531, "global_step": 447525, "epoch": 2663} {"train_loss": -12.72304630279541, "global_step": 447526, "epoch": 2663} {"train_loss": -12.638279914855957, "global_step": 447527, "epoch": 2663} {"train_loss": -12.470826148986816, "global_step": 447528, "epoch": 2663} {"train_loss": -12.683381080627441, "global_step": 447529, "epoch": 2663} {"train_loss": -12.392662048339844, "global_step": 447530, "epoch": 2663} {"train_loss": -12.50130558013916, "global_step": 447531, "epoch": 2663} {"train_loss": -12.042678833007812, "global_step": 447532, "epoch": 2663} {"train_loss": -12.72425651550293, "global_step": 447533, "epoch": 2663} {"train_loss": -12.406420707702637, "global_step": 447534, "epoch": 2663} {"train_loss": -12.441337585449219, "global_step": 447535, "epoch": 2663} {"train_loss": -12.227581024169922, "global_step": 447536, "epoch": 2663} {"train_loss": -12.04222583770752, "global_step": 447537, "epoch": 2663} {"train_loss": -11.97193431854248, "global_step": 447538, "epoch": 2663} {"train_loss": -12.651430130004883, "global_step": 447539, "epoch": 2663} {"train_loss": -12.058995246887207, "global_step": 447540, "epoch": 2663} {"train_loss": -12.400142669677734, "global_step": 447541, "epoch": 2663} {"train_loss": -12.245489120483398, "global_step": 447542, "epoch": 2663} {"train_loss": -12.439939498901367, "global_step": 447543, "epoch": 2663} {"train_loss": -12.363274574279785, "global_step": 447544, "epoch": 2663} {"train_loss": -12.432029724121094, "global_step": 447545, "epoch": 2663} {"train_loss": -12.407100677490234, "global_step": 447546, "epoch": 2663} {"train_loss": -12.818624496459961, "global_step": 447547, "epoch": 2663} {"train_loss": -12.545604705810547, "global_step": 447548, "epoch": 2663} {"train_loss": -12.83073616027832, "global_step": 447549, "epoch": 2663} {"train_loss": -12.712754249572754, "global_step": 447550, "epoch": 2663} {"train_loss": -12.026738552820115, "global_step": 447551, "epoch": 2663, "val_loss": 312477.71875} {"train_loss": -12.616522789001465, "global_step": 447552, "epoch": 2664} {"train_loss": -12.567010879516602, "global_step": 447553, "epoch": 2664} {"train_loss": -12.467967987060547, "global_step": 447554, "epoch": 2664} {"train_loss": -12.211366653442383, "global_step": 447555, "epoch": 2664} {"train_loss": -12.322153091430664, "global_step": 447556, "epoch": 2664} {"train_loss": -11.78634262084961, "global_step": 447557, "epoch": 2664} {"train_loss": -12.651185989379883, "global_step": 447558, "epoch": 2664} {"train_loss": -11.987813949584961, "global_step": 447559, "epoch": 2664} {"train_loss": -12.569839477539062, "global_step": 447560, "epoch": 2664} {"train_loss": -12.483198165893555, "global_step": 447561, "epoch": 2664} {"train_loss": -12.265739440917969, "global_step": 447562, "epoch": 2664} {"train_loss": -12.594337463378906, "global_step": 447563, "epoch": 2664} {"train_loss": -12.947728157043457, "global_step": 447564, "epoch": 2664} {"train_loss": -12.4691743850708, "global_step": 447565, "epoch": 2664} {"train_loss": -12.740606307983398, "global_step": 447566, "epoch": 2664} {"train_loss": -12.531753540039062, "global_step": 447567, "epoch": 2664} {"train_loss": -12.295108795166016, "global_step": 447568, "epoch": 2664} {"train_loss": -12.363142013549805, "global_step": 447569, "epoch": 2664} {"train_loss": -12.314311981201172, "global_step": 447570, "epoch": 2664} {"train_loss": -11.623832702636719, "global_step": 447571, "epoch": 2664} {"train_loss": -11.865438461303711, "global_step": 447572, "epoch": 2664} {"train_loss": -8.903726577758789, "global_step": 447573, "epoch": 2664} {"train_loss": -10.214767456054688, "global_step": 447574, "epoch": 2664} {"train_loss": -10.477066040039062, "global_step": 447575, "epoch": 2664} {"train_loss": -11.047433853149414, "global_step": 447576, "epoch": 2664} {"train_loss": -10.774908065795898, "global_step": 447577, "epoch": 2664} {"train_loss": -11.630247116088867, "global_step": 447578, "epoch": 2664} {"train_loss": -10.83015251159668, "global_step": 447579, "epoch": 2664} {"train_loss": -11.799586296081543, "global_step": 447580, "epoch": 2664} {"train_loss": -11.418924331665039, "global_step": 447581, "epoch": 2664} {"train_loss": -11.28650188446045, "global_step": 447582, "epoch": 2664} {"train_loss": -11.870307922363281, "global_step": 447583, "epoch": 2664} {"train_loss": -11.41385269165039, "global_step": 447584, "epoch": 2664} {"train_loss": -11.87033462524414, "global_step": 447585, "epoch": 2664} {"train_loss": -12.131625175476074, "global_step": 447586, "epoch": 2664} {"train_loss": -12.061361312866211, "global_step": 447587, "epoch": 2664} {"train_loss": -11.60586166381836, "global_step": 447588, "epoch": 2664} {"train_loss": -12.150459289550781, "global_step": 447589, "epoch": 2664} {"train_loss": -12.140182495117188, "global_step": 447590, "epoch": 2664} {"train_loss": -11.58287525177002, "global_step": 447591, "epoch": 2664} {"train_loss": -12.268503189086914, "global_step": 447592, "epoch": 2664} {"train_loss": -12.102937698364258, "global_step": 447593, "epoch": 2664} {"train_loss": -12.117269515991211, "global_step": 447594, "epoch": 2664} {"train_loss": -11.537038803100586, "global_step": 447595, "epoch": 2664} {"train_loss": -12.502349853515625, "global_step": 447596, "epoch": 2664} {"train_loss": -11.925748825073242, "global_step": 447597, "epoch": 2664} {"train_loss": -12.463937759399414, "global_step": 447598, "epoch": 2664} {"train_loss": -12.001205444335938, "global_step": 447599, "epoch": 2664} {"train_loss": -12.386344909667969, "global_step": 447600, "epoch": 2664} {"train_loss": -12.248469352722168, "global_step": 447601, "epoch": 2664} {"train_loss": -12.358818054199219, "global_step": 447602, "epoch": 2664} {"train_loss": -12.60321044921875, "global_step": 447603, "epoch": 2664} {"train_loss": -12.229830741882324, "global_step": 447604, "epoch": 2664} {"train_loss": -12.685754776000977, "global_step": 447605, "epoch": 2664} {"train_loss": -11.906126022338867, "global_step": 447606, "epoch": 2664} {"train_loss": -12.440540313720703, "global_step": 447607, "epoch": 2664} {"train_loss": -12.550530433654785, "global_step": 447608, "epoch": 2664} {"train_loss": -12.413412094116211, "global_step": 447609, "epoch": 2664} {"train_loss": -12.475528717041016, "global_step": 447610, "epoch": 2664} {"train_loss": -12.291241645812988, "global_step": 447611, "epoch": 2664} {"train_loss": -12.47569751739502, "global_step": 447612, "epoch": 2664} {"train_loss": -12.155712127685547, "global_step": 447613, "epoch": 2664} {"train_loss": -12.078174591064453, "global_step": 447614, "epoch": 2664} {"train_loss": -12.279512405395508, "global_step": 447615, "epoch": 2664} {"train_loss": -12.035602569580078, "global_step": 447616, "epoch": 2664} {"train_loss": -11.896585464477539, "global_step": 447617, "epoch": 2664} {"train_loss": -12.052303314208984, "global_step": 447618, "epoch": 2664} {"train_loss": -12.321311950683594, "global_step": 447619, "epoch": 2664} {"train_loss": -12.251952171325684, "global_step": 447620, "epoch": 2664} {"train_loss": -12.283598899841309, "global_step": 447621, "epoch": 2664} {"train_loss": -12.271932601928711, "global_step": 447622, "epoch": 2664} {"train_loss": -12.446235656738281, "global_step": 447623, "epoch": 2664} {"train_loss": -12.215095520019531, "global_step": 447624, "epoch": 2664} {"train_loss": -12.261371612548828, "global_step": 447625, "epoch": 2664} {"train_loss": -12.406517028808594, "global_step": 447626, "epoch": 2664} {"train_loss": -12.228897094726562, "global_step": 447627, "epoch": 2664} {"train_loss": -12.016851425170898, "global_step": 447628, "epoch": 2664} {"train_loss": -11.970643997192383, "global_step": 447629, "epoch": 2664} {"train_loss": -12.39384937286377, "global_step": 447630, "epoch": 2664} {"train_loss": -11.435997009277344, "global_step": 447631, "epoch": 2664} {"train_loss": -12.361434936523438, "global_step": 447632, "epoch": 2664} {"train_loss": -11.544809341430664, "global_step": 447633, "epoch": 2664} {"train_loss": -11.981204986572266, "global_step": 447634, "epoch": 2664} {"train_loss": -12.146028518676758, "global_step": 447635, "epoch": 2664} {"train_loss": -11.359376907348633, "global_step": 447636, "epoch": 2664} {"train_loss": -12.314735412597656, "global_step": 447637, "epoch": 2664} {"train_loss": -11.597949028015137, "global_step": 447638, "epoch": 2664} {"train_loss": -12.631378173828125, "global_step": 447639, "epoch": 2664} {"train_loss": -12.079694747924805, "global_step": 447640, "epoch": 2664} {"train_loss": -12.303430557250977, "global_step": 447641, "epoch": 2664} {"train_loss": -12.178718566894531, "global_step": 447642, "epoch": 2664} {"train_loss": -12.111953735351562, "global_step": 447643, "epoch": 2664} {"train_loss": -12.404483795166016, "global_step": 447644, "epoch": 2664} {"train_loss": -12.54820442199707, "global_step": 447645, "epoch": 2664} {"train_loss": -12.51376724243164, "global_step": 447646, "epoch": 2664} {"train_loss": -12.710990905761719, "global_step": 447647, "epoch": 2664} {"train_loss": -12.40861988067627, "global_step": 447648, "epoch": 2664} {"train_loss": -12.813175201416016, "global_step": 447649, "epoch": 2664} {"train_loss": -12.404672622680664, "global_step": 447650, "epoch": 2664} {"train_loss": -12.55242919921875, "global_step": 447651, "epoch": 2664} {"train_loss": -12.606383323669434, "global_step": 447652, "epoch": 2664} {"train_loss": -12.714140892028809, "global_step": 447653, "epoch": 2664} {"train_loss": -12.582315444946289, "global_step": 447654, "epoch": 2664} {"train_loss": -12.316328048706055, "global_step": 447655, "epoch": 2664} {"train_loss": -12.408535957336426, "global_step": 447656, "epoch": 2664} {"train_loss": -12.413629531860352, "global_step": 447657, "epoch": 2664} {"train_loss": -12.56104850769043, "global_step": 447658, "epoch": 2664} {"train_loss": -12.492177963256836, "global_step": 447659, "epoch": 2664} {"train_loss": -12.641327857971191, "global_step": 447660, "epoch": 2664} {"train_loss": -12.338327407836914, "global_step": 447661, "epoch": 2664} {"train_loss": -12.436969757080078, "global_step": 447662, "epoch": 2664} {"train_loss": -12.047059059143066, "global_step": 447663, "epoch": 2664} {"train_loss": -12.479850769042969, "global_step": 447664, "epoch": 2664} {"train_loss": -12.080137252807617, "global_step": 447665, "epoch": 2664} {"train_loss": -12.605958938598633, "global_step": 447666, "epoch": 2664} {"train_loss": -12.128242492675781, "global_step": 447667, "epoch": 2664} {"train_loss": -12.510438919067383, "global_step": 447668, "epoch": 2664} {"train_loss": -12.424966812133789, "global_step": 447669, "epoch": 2664} {"train_loss": -12.52713394165039, "global_step": 447670, "epoch": 2664} {"train_loss": -12.330188751220703, "global_step": 447671, "epoch": 2664} {"train_loss": -12.597745895385742, "global_step": 447672, "epoch": 2664} {"train_loss": -12.005077362060547, "global_step": 447673, "epoch": 2664} {"train_loss": -12.171863555908203, "global_step": 447674, "epoch": 2664} {"train_loss": -12.091200828552246, "global_step": 447675, "epoch": 2664} {"train_loss": -11.944746017456055, "global_step": 447676, "epoch": 2664} {"train_loss": -12.41482925415039, "global_step": 447677, "epoch": 2664} {"train_loss": -12.521102905273438, "global_step": 447678, "epoch": 2664} {"train_loss": -12.491339683532715, "global_step": 447679, "epoch": 2664} {"train_loss": -12.785561561584473, "global_step": 447680, "epoch": 2664} {"train_loss": -12.727823257446289, "global_step": 447681, "epoch": 2664} {"train_loss": -12.445348739624023, "global_step": 447682, "epoch": 2664} {"train_loss": -12.425907135009766, "global_step": 447683, "epoch": 2664} {"train_loss": -12.56892204284668, "global_step": 447684, "epoch": 2664} {"train_loss": -12.220394134521484, "global_step": 447685, "epoch": 2664} {"train_loss": -12.389656066894531, "global_step": 447686, "epoch": 2664} {"train_loss": -12.402462005615234, "global_step": 447687, "epoch": 2664} {"train_loss": -12.30634880065918, "global_step": 447688, "epoch": 2664} {"train_loss": -12.038774490356445, "global_step": 447689, "epoch": 2664} {"train_loss": -12.586217880249023, "global_step": 447690, "epoch": 2664} {"train_loss": -12.084334373474121, "global_step": 447691, "epoch": 2664} {"train_loss": -12.732320785522461, "global_step": 447692, "epoch": 2664} {"train_loss": -12.319099426269531, "global_step": 447693, "epoch": 2664} {"train_loss": -12.408903121948242, "global_step": 447694, "epoch": 2664} {"train_loss": -12.62130069732666, "global_step": 447695, "epoch": 2664} {"train_loss": -12.481908798217773, "global_step": 447696, "epoch": 2664} {"train_loss": -12.272637367248535, "global_step": 447697, "epoch": 2664} {"train_loss": -12.820082664489746, "global_step": 447698, "epoch": 2664} {"train_loss": -12.580991744995117, "global_step": 447699, "epoch": 2664} {"train_loss": -12.499370574951172, "global_step": 447700, "epoch": 2664} {"train_loss": -12.550332069396973, "global_step": 447701, "epoch": 2664} {"train_loss": -12.177677154541016, "global_step": 447702, "epoch": 2664} {"train_loss": -12.301259994506836, "global_step": 447703, "epoch": 2664} {"train_loss": -12.606832504272461, "global_step": 447704, "epoch": 2664} {"train_loss": -12.468334197998047, "global_step": 447705, "epoch": 2664} {"train_loss": -12.292582511901855, "global_step": 447706, "epoch": 2664} {"train_loss": -12.275392532348633, "global_step": 447707, "epoch": 2664} {"train_loss": -12.821056365966797, "global_step": 447708, "epoch": 2664} {"train_loss": -12.13947868347168, "global_step": 447709, "epoch": 2664} {"train_loss": -12.317317962646484, "global_step": 447710, "epoch": 2664} {"train_loss": -12.140146255493164, "global_step": 447711, "epoch": 2664} {"train_loss": -12.477036476135254, "global_step": 447712, "epoch": 2664} {"train_loss": -11.89263916015625, "global_step": 447713, "epoch": 2664} {"train_loss": -12.683727264404297, "global_step": 447714, "epoch": 2664} {"train_loss": -12.313316345214844, "global_step": 447715, "epoch": 2664} {"train_loss": -12.769021987915039, "global_step": 447716, "epoch": 2664} {"train_loss": -11.87109375, "global_step": 447717, "epoch": 2664} {"train_loss": -12.578996658325195, "global_step": 447718, "epoch": 2664} {"train_loss": -12.219578095844813, "global_step": 447719, "epoch": 2664, "val_loss": 315103.09375} {"train_loss": -12.690110206604004, "global_step": 447720, "epoch": 2665} {"train_loss": -12.560958862304688, "global_step": 447721, "epoch": 2665} {"train_loss": -12.491413116455078, "global_step": 447722, "epoch": 2665} {"train_loss": -11.998483657836914, "global_step": 447723, "epoch": 2665} {"train_loss": -12.420146942138672, "global_step": 447724, "epoch": 2665} {"train_loss": -12.733875274658203, "global_step": 447725, "epoch": 2665} {"train_loss": -12.115569114685059, "global_step": 447726, "epoch": 2665} {"train_loss": -12.016141891479492, "global_step": 447727, "epoch": 2665} {"train_loss": -12.469348907470703, "global_step": 447728, "epoch": 2665} {"train_loss": -12.675190925598145, "global_step": 447729, "epoch": 2665} {"train_loss": -12.605401992797852, "global_step": 447730, "epoch": 2665} {"train_loss": -12.306291580200195, "global_step": 447731, "epoch": 2665} {"train_loss": -12.37154483795166, "global_step": 447732, "epoch": 2665} {"train_loss": -12.313617706298828, "global_step": 447733, "epoch": 2665} {"train_loss": -11.997674942016602, "global_step": 447734, "epoch": 2665} {"train_loss": -11.838756561279297, "global_step": 447735, "epoch": 2665} {"train_loss": -12.265742301940918, "global_step": 447736, "epoch": 2665} {"train_loss": -12.728109359741211, "global_step": 447737, "epoch": 2665} {"train_loss": -12.068197250366211, "global_step": 447738, "epoch": 2665} {"train_loss": -12.087158203125, "global_step": 447739, "epoch": 2665} {"train_loss": -11.591920852661133, "global_step": 447740, "epoch": 2665} {"train_loss": -10.696028709411621, "global_step": 447741, "epoch": 2665} {"train_loss": -9.8725004196167, "global_step": 447742, "epoch": 2665} {"train_loss": -12.005638122558594, "global_step": 447743, "epoch": 2665} {"train_loss": -9.150415420532227, "global_step": 447744, "epoch": 2665} {"train_loss": -10.429211616516113, "global_step": 447745, "epoch": 2665} {"train_loss": -11.388092994689941, "global_step": 447746, "epoch": 2665} {"train_loss": -10.340280532836914, "global_step": 447747, "epoch": 2665} {"train_loss": -12.106999397277832, "global_step": 447748, "epoch": 2665} {"train_loss": -10.607500076293945, "global_step": 447749, "epoch": 2665} {"train_loss": -10.427698135375977, "global_step": 447750, "epoch": 2665} {"train_loss": -12.031816482543945, "global_step": 447751, "epoch": 2665} {"train_loss": -11.931682586669922, "global_step": 447752, "epoch": 2665} {"train_loss": -11.161937713623047, "global_step": 447753, "epoch": 2665} {"train_loss": -11.810998916625977, "global_step": 447754, "epoch": 2665} {"train_loss": -11.248098373413086, "global_step": 447755, "epoch": 2665} {"train_loss": -11.706607818603516, "global_step": 447756, "epoch": 2665} {"train_loss": -12.081743240356445, "global_step": 447757, "epoch": 2665} {"train_loss": -11.780672073364258, "global_step": 447758, "epoch": 2665} {"train_loss": -11.920258522033691, "global_step": 447759, "epoch": 2665} {"train_loss": -11.94482421875, "global_step": 447760, "epoch": 2665} {"train_loss": -11.319375991821289, "global_step": 447761, "epoch": 2665} {"train_loss": -12.092174530029297, "global_step": 447762, "epoch": 2665} {"train_loss": -11.640539169311523, "global_step": 447763, "epoch": 2665} {"train_loss": -11.893035888671875, "global_step": 447764, "epoch": 2665} {"train_loss": -11.919071197509766, "global_step": 447765, "epoch": 2665} {"train_loss": -12.099102020263672, "global_step": 447766, "epoch": 2665} {"train_loss": -12.504100799560547, "global_step": 447767, "epoch": 2665} {"train_loss": -12.286495208740234, "global_step": 447768, "epoch": 2665} {"train_loss": -12.45109748840332, "global_step": 447769, "epoch": 2665} {"train_loss": -12.109527587890625, "global_step": 447770, "epoch": 2665} {"train_loss": -12.200176239013672, "global_step": 447771, "epoch": 2665} {"train_loss": -12.288434982299805, "global_step": 447772, "epoch": 2665} {"train_loss": -12.403754234313965, "global_step": 447773, "epoch": 2665} {"train_loss": -12.205516815185547, "global_step": 447774, "epoch": 2665} {"train_loss": -12.429885864257812, "global_step": 447775, "epoch": 2665} {"train_loss": -12.418405532836914, "global_step": 447776, "epoch": 2665} {"train_loss": -12.261408805847168, "global_step": 447777, "epoch": 2665} {"train_loss": -12.624530792236328, "global_step": 447778, "epoch": 2665} {"train_loss": -12.133502006530762, "global_step": 447779, "epoch": 2665} {"train_loss": -11.61601448059082, "global_step": 447780, "epoch": 2665} {"train_loss": -12.393390655517578, "global_step": 447781, "epoch": 2665} {"train_loss": -10.789493560791016, "global_step": 447782, "epoch": 2665} {"train_loss": -11.55963134765625, "global_step": 447783, "epoch": 2665} {"train_loss": -12.31873893737793, "global_step": 447784, "epoch": 2665} {"train_loss": -11.486302375793457, "global_step": 447785, "epoch": 2665} {"train_loss": -12.262750625610352, "global_step": 447786, "epoch": 2665} {"train_loss": -11.465703010559082, "global_step": 447787, "epoch": 2665} {"train_loss": -12.291370391845703, "global_step": 447788, "epoch": 2665} {"train_loss": -11.809026718139648, "global_step": 447789, "epoch": 2665} {"train_loss": -12.054737091064453, "global_step": 447790, "epoch": 2665} {"train_loss": -12.20155143737793, "global_step": 447791, "epoch": 2665} {"train_loss": -12.380958557128906, "global_step": 447792, "epoch": 2665} {"train_loss": -12.131855010986328, "global_step": 447793, "epoch": 2665} {"train_loss": -12.353269577026367, "global_step": 447794, "epoch": 2665} {"train_loss": -12.707634925842285, "global_step": 447795, "epoch": 2665} {"train_loss": -12.092493057250977, "global_step": 447796, "epoch": 2665} {"train_loss": -12.5831880569458, "global_step": 447797, "epoch": 2665} {"train_loss": -12.309517860412598, "global_step": 447798, "epoch": 2665} {"train_loss": -12.5425443649292, "global_step": 447799, "epoch": 2665} {"train_loss": -12.439019203186035, "global_step": 447800, "epoch": 2665} {"train_loss": -12.282476425170898, "global_step": 447801, "epoch": 2665} {"train_loss": -12.57027530670166, "global_step": 447802, "epoch": 2665} {"train_loss": -12.413172721862793, "global_step": 447803, "epoch": 2665} {"train_loss": -12.527313232421875, "global_step": 447804, "epoch": 2665} {"train_loss": -12.605143547058105, "global_step": 447805, "epoch": 2665} {"train_loss": -12.494266510009766, "global_step": 447806, "epoch": 2665} {"train_loss": -12.309779167175293, "global_step": 447807, "epoch": 2665} {"train_loss": -12.631111145019531, "global_step": 447808, "epoch": 2665} {"train_loss": -12.456663131713867, "global_step": 447809, "epoch": 2665} {"train_loss": -12.710926055908203, "global_step": 447810, "epoch": 2665} {"train_loss": -12.788335800170898, "global_step": 447811, "epoch": 2665} {"train_loss": -12.583287239074707, "global_step": 447812, "epoch": 2665} {"train_loss": -12.694761276245117, "global_step": 447813, "epoch": 2665} {"train_loss": -12.781301498413086, "global_step": 447814, "epoch": 2665} {"train_loss": -12.540794372558594, "global_step": 447815, "epoch": 2665} {"train_loss": -12.664915084838867, "global_step": 447816, "epoch": 2665} {"train_loss": -12.702886581420898, "global_step": 447817, "epoch": 2665} {"train_loss": -12.732051849365234, "global_step": 447818, "epoch": 2665} {"train_loss": -12.82613754272461, "global_step": 447819, "epoch": 2665} {"train_loss": -13.041786193847656, "global_step": 447820, "epoch": 2665} {"train_loss": -12.956241607666016, "global_step": 447821, "epoch": 2665} {"train_loss": -12.509713172912598, "global_step": 447822, "epoch": 2665} {"train_loss": -12.80152702331543, "global_step": 447823, "epoch": 2665} {"train_loss": -13.038507461547852, "global_step": 447824, "epoch": 2665} {"train_loss": -12.525777816772461, "global_step": 447825, "epoch": 2665} {"train_loss": -12.641706466674805, "global_step": 447826, "epoch": 2665} {"train_loss": -12.906497955322266, "global_step": 447827, "epoch": 2665} {"train_loss": -12.703685760498047, "global_step": 447828, "epoch": 2665} {"train_loss": -12.712069511413574, "global_step": 447829, "epoch": 2665} {"train_loss": -12.730030059814453, "global_step": 447830, "epoch": 2665} {"train_loss": -12.727943420410156, "global_step": 447831, "epoch": 2665} {"train_loss": -12.89542007446289, "global_step": 447832, "epoch": 2665} {"train_loss": -12.798337936401367, "global_step": 447833, "epoch": 2665} {"train_loss": -12.478048324584961, "global_step": 447834, "epoch": 2665} {"train_loss": -12.718886375427246, "global_step": 447835, "epoch": 2665} {"train_loss": -12.955577850341797, "global_step": 447836, "epoch": 2665} {"train_loss": -12.686006546020508, "global_step": 447837, "epoch": 2665} {"train_loss": -12.907331466674805, "global_step": 447838, "epoch": 2665} {"train_loss": -12.885232925415039, "global_step": 447839, "epoch": 2665} {"train_loss": -12.542013168334961, "global_step": 447840, "epoch": 2665} {"train_loss": -12.626121520996094, "global_step": 447841, "epoch": 2665} {"train_loss": -13.01296615600586, "global_step": 447842, "epoch": 2665} {"train_loss": -12.706539154052734, "global_step": 447843, "epoch": 2665} {"train_loss": -13.022207260131836, "global_step": 447844, "epoch": 2665} {"train_loss": -12.600969314575195, "global_step": 447845, "epoch": 2665} {"train_loss": -13.003076553344727, "global_step": 447846, "epoch": 2665} {"train_loss": -12.941189765930176, "global_step": 447847, "epoch": 2665} {"train_loss": -12.554954528808594, "global_step": 447848, "epoch": 2665} {"train_loss": -12.92833137512207, "global_step": 447849, "epoch": 2665} {"train_loss": -12.942891120910645, "global_step": 447850, "epoch": 2665} {"train_loss": -12.579582214355469, "global_step": 447851, "epoch": 2665} {"train_loss": -12.13497257232666, "global_step": 447852, "epoch": 2665} {"train_loss": -12.773750305175781, "global_step": 447853, "epoch": 2665} {"train_loss": -12.372169494628906, "global_step": 447854, "epoch": 2665} {"train_loss": -11.453011512756348, "global_step": 447855, "epoch": 2665} {"train_loss": -11.550511360168457, "global_step": 447856, "epoch": 2665} {"train_loss": -11.687026977539062, "global_step": 447857, "epoch": 2665} {"train_loss": -12.465314865112305, "global_step": 447858, "epoch": 2665} {"train_loss": -10.916482925415039, "global_step": 447859, "epoch": 2665} {"train_loss": -11.862691879272461, "global_step": 447860, "epoch": 2665} {"train_loss": -12.015426635742188, "global_step": 447861, "epoch": 2665} {"train_loss": -12.351953506469727, "global_step": 447862, "epoch": 2665} {"train_loss": -10.234163284301758, "global_step": 447863, "epoch": 2665} {"train_loss": -11.653032302856445, "global_step": 447864, "epoch": 2665} {"train_loss": -8.894027709960938, "global_step": 447865, "epoch": 2665} {"train_loss": -7.1783671379089355, "global_step": 447866, "epoch": 2665} {"train_loss": -7.313375949859619, "global_step": 447867, "epoch": 2665} {"train_loss": -7.839229583740234, "global_step": 447868, "epoch": 2665} {"train_loss": -8.332651138305664, "global_step": 447869, "epoch": 2665} {"train_loss": -7.946070671081543, "global_step": 447870, "epoch": 2665} {"train_loss": -7.15484619140625, "global_step": 447871, "epoch": 2665} {"train_loss": -8.870315551757812, "global_step": 447872, "epoch": 2665} {"train_loss": -8.327432632446289, "global_step": 447873, "epoch": 2665} {"train_loss": -8.680190086364746, "global_step": 447874, "epoch": 2665} {"train_loss": -8.572649955749512, "global_step": 447875, "epoch": 2665} {"train_loss": -9.261116027832031, "global_step": 447876, "epoch": 2665} {"train_loss": -9.950047492980957, "global_step": 447877, "epoch": 2665} {"train_loss": -10.13537883758545, "global_step": 447878, "epoch": 2665} {"train_loss": -10.035472869873047, "global_step": 447879, "epoch": 2665} {"train_loss": -10.72085952758789, "global_step": 447880, "epoch": 2665} {"train_loss": -10.986448287963867, "global_step": 447881, "epoch": 2665} {"train_loss": -10.623443603515625, "global_step": 447882, "epoch": 2665} {"train_loss": -11.01553726196289, "global_step": 447883, "epoch": 2665} {"train_loss": -10.175678253173828, "global_step": 447884, "epoch": 2665} {"train_loss": -10.42333984375, "global_step": 447885, "epoch": 2665} {"train_loss": -10.635355949401855, "global_step": 447886, "epoch": 2665} {"train_loss": -11.809974852062407, "global_step": 447887, "epoch": 2665, "val_loss": 314533.03125, "train_action_mse_error": 0.5128720998764038} {"train_loss": -10.348665237426758, "global_step": 447888, "epoch": 2666} {"train_loss": -10.769009590148926, "global_step": 447889, "epoch": 2666} {"train_loss": -11.479682922363281, "global_step": 447890, "epoch": 2666} {"train_loss": -11.30959701538086, "global_step": 447891, "epoch": 2666} {"train_loss": -10.214937210083008, "global_step": 447892, "epoch": 2666} {"train_loss": -10.570527076721191, "global_step": 447893, "epoch": 2666} {"train_loss": -11.692197799682617, "global_step": 447894, "epoch": 2666} {"train_loss": -10.499120712280273, "global_step": 447895, "epoch": 2666} {"train_loss": -12.027142524719238, "global_step": 447896, "epoch": 2666} {"train_loss": -11.117242813110352, "global_step": 447897, "epoch": 2666} {"train_loss": -11.935724258422852, "global_step": 447898, "epoch": 2666} {"train_loss": -11.471595764160156, "global_step": 447899, "epoch": 2666} {"train_loss": -11.120153427124023, "global_step": 447900, "epoch": 2666} {"train_loss": -11.052007675170898, "global_step": 447901, "epoch": 2666} {"train_loss": -11.683969497680664, "global_step": 447902, "epoch": 2666} {"train_loss": -10.995022773742676, "global_step": 447903, "epoch": 2666} {"train_loss": -11.589607238769531, "global_step": 447904, "epoch": 2666} {"train_loss": -11.481507301330566, "global_step": 447905, "epoch": 2666} {"train_loss": -10.660728454589844, "global_step": 447906, "epoch": 2666} {"train_loss": -10.972636222839355, "global_step": 447907, "epoch": 2666} {"train_loss": -11.608187675476074, "global_step": 447908, "epoch": 2666} {"train_loss": -11.161865234375, "global_step": 447909, "epoch": 2666} {"train_loss": -11.568922996520996, "global_step": 447910, "epoch": 2666} {"train_loss": -12.131278038024902, "global_step": 447911, "epoch": 2666} {"train_loss": -10.976176261901855, "global_step": 447912, "epoch": 2666} {"train_loss": -11.72061824798584, "global_step": 447913, "epoch": 2666} {"train_loss": -12.132842063903809, "global_step": 447914, "epoch": 2666} {"train_loss": -11.669512748718262, "global_step": 447915, "epoch": 2666} {"train_loss": -11.631124496459961, "global_step": 447916, "epoch": 2666} {"train_loss": -12.204309463500977, "global_step": 447917, "epoch": 2666} {"train_loss": -11.64594841003418, "global_step": 447918, "epoch": 2666} {"train_loss": -12.007052421569824, "global_step": 447919, "epoch": 2666} {"train_loss": -12.087163925170898, "global_step": 447920, "epoch": 2666} {"train_loss": -11.761898040771484, "global_step": 447921, "epoch": 2666} {"train_loss": -12.325679779052734, "global_step": 447922, "epoch": 2666} {"train_loss": -12.059215545654297, "global_step": 447923, "epoch": 2666} {"train_loss": -11.867868423461914, "global_step": 447924, "epoch": 2666} {"train_loss": -12.591371536254883, "global_step": 447925, "epoch": 2666} {"train_loss": -12.216007232666016, "global_step": 447926, "epoch": 2666} {"train_loss": -12.433867454528809, "global_step": 447927, "epoch": 2666} {"train_loss": -12.518054962158203, "global_step": 447928, "epoch": 2666} {"train_loss": -11.973270416259766, "global_step": 447929, "epoch": 2666} {"train_loss": -12.376622200012207, "global_step": 447930, "epoch": 2666} {"train_loss": -12.494057655334473, "global_step": 447931, "epoch": 2666} {"train_loss": -11.977237701416016, "global_step": 447932, "epoch": 2666} {"train_loss": -12.28995132446289, "global_step": 447933, "epoch": 2666} {"train_loss": -12.142498970031738, "global_step": 447934, "epoch": 2666} {"train_loss": -12.35665225982666, "global_step": 447935, "epoch": 2666} {"train_loss": -12.511249542236328, "global_step": 447936, "epoch": 2666} {"train_loss": -12.31652545928955, "global_step": 447937, "epoch": 2666} {"train_loss": -12.533353805541992, "global_step": 447938, "epoch": 2666} {"train_loss": -12.447057723999023, "global_step": 447939, "epoch": 2666} {"train_loss": -12.434892654418945, "global_step": 447940, "epoch": 2666} {"train_loss": -12.448862075805664, "global_step": 447941, "epoch": 2666} {"train_loss": -12.427364349365234, "global_step": 447942, "epoch": 2666} {"train_loss": -12.558202743530273, "global_step": 447943, "epoch": 2666} {"train_loss": -12.474530220031738, "global_step": 447944, "epoch": 2666} {"train_loss": -12.428749084472656, "global_step": 447945, "epoch": 2666} {"train_loss": -12.372801780700684, "global_step": 447946, "epoch": 2666} {"train_loss": -12.552584648132324, "global_step": 447947, "epoch": 2666} {"train_loss": -12.407352447509766, "global_step": 447948, "epoch": 2666} {"train_loss": -12.64399242401123, "global_step": 447949, "epoch": 2666} {"train_loss": -12.540822982788086, "global_step": 447950, "epoch": 2666} {"train_loss": -12.610706329345703, "global_step": 447951, "epoch": 2666} {"train_loss": -12.438003540039062, "global_step": 447952, "epoch": 2666} {"train_loss": -12.576225280761719, "global_step": 447953, "epoch": 2666} {"train_loss": -12.822954177856445, "global_step": 447954, "epoch": 2666} {"train_loss": -12.714637756347656, "global_step": 447955, "epoch": 2666} {"train_loss": -12.758447647094727, "global_step": 447956, "epoch": 2666} {"train_loss": -12.634941101074219, "global_step": 447957, "epoch": 2666} {"train_loss": -12.843236923217773, "global_step": 447958, "epoch": 2666} {"train_loss": -12.745746612548828, "global_step": 447959, "epoch": 2666} {"train_loss": -12.410502433776855, "global_step": 447960, "epoch": 2666} {"train_loss": -12.743585586547852, "global_step": 447961, "epoch": 2666} {"train_loss": -12.502152442932129, "global_step": 447962, "epoch": 2666} {"train_loss": -12.369367599487305, "global_step": 447963, "epoch": 2666} {"train_loss": -12.774993896484375, "global_step": 447964, "epoch": 2666} {"train_loss": -12.717374801635742, "global_step": 447965, "epoch": 2666} {"train_loss": -12.527563095092773, "global_step": 447966, "epoch": 2666} {"train_loss": -12.634115219116211, "global_step": 447967, "epoch": 2666} {"train_loss": -12.829975128173828, "global_step": 447968, "epoch": 2666} {"train_loss": -12.616988182067871, "global_step": 447969, "epoch": 2666} {"train_loss": -12.830317497253418, "global_step": 447970, "epoch": 2666} {"train_loss": -12.737104415893555, "global_step": 447971, "epoch": 2666} {"train_loss": -12.461919784545898, "global_step": 447972, "epoch": 2666} {"train_loss": -12.582411766052246, "global_step": 447973, "epoch": 2666} {"train_loss": -12.627484321594238, "global_step": 447974, "epoch": 2666} {"train_loss": -12.808009147644043, "global_step": 447975, "epoch": 2666} {"train_loss": -12.607138633728027, "global_step": 447976, "epoch": 2666} {"train_loss": -12.431553840637207, "global_step": 447977, "epoch": 2666} {"train_loss": -12.790878295898438, "global_step": 447978, "epoch": 2666} {"train_loss": -12.817659378051758, "global_step": 447979, "epoch": 2666} {"train_loss": -12.75190544128418, "global_step": 447980, "epoch": 2666} {"train_loss": -12.826711654663086, "global_step": 447981, "epoch": 2666} {"train_loss": -12.82846450805664, "global_step": 447982, "epoch": 2666} {"train_loss": -12.51663589477539, "global_step": 447983, "epoch": 2666} {"train_loss": -12.911518096923828, "global_step": 447984, "epoch": 2666} {"train_loss": -12.687837600708008, "global_step": 447985, "epoch": 2666} {"train_loss": -12.903520584106445, "global_step": 447986, "epoch": 2666} {"train_loss": -12.565691947937012, "global_step": 447987, "epoch": 2666} {"train_loss": -12.889379501342773, "global_step": 447988, "epoch": 2666} {"train_loss": -12.703645706176758, "global_step": 447989, "epoch": 2666} {"train_loss": -12.575352668762207, "global_step": 447990, "epoch": 2666} {"train_loss": -12.558209419250488, "global_step": 447991, "epoch": 2666} {"train_loss": -12.401803970336914, "global_step": 447992, "epoch": 2666} {"train_loss": -12.625755310058594, "global_step": 447993, "epoch": 2666} {"train_loss": -12.72546672821045, "global_step": 447994, "epoch": 2666} {"train_loss": -12.304438591003418, "global_step": 447995, "epoch": 2666} {"train_loss": -11.863171577453613, "global_step": 447996, "epoch": 2666} {"train_loss": -12.543533325195312, "global_step": 447997, "epoch": 2666} {"train_loss": -12.616598129272461, "global_step": 447998, "epoch": 2666} {"train_loss": -12.479433059692383, "global_step": 447999, "epoch": 2666} {"train_loss": -12.792766571044922, "global_step": 448000, "epoch": 2666} {"train_loss": -12.816909790039062, "global_step": 448001, "epoch": 2666} {"train_loss": -13.004652976989746, "global_step": 448002, "epoch": 2666} {"train_loss": -13.049225807189941, "global_step": 448003, "epoch": 2666} {"train_loss": -12.797122955322266, "global_step": 448004, "epoch": 2666} {"train_loss": -13.0399169921875, "global_step": 448005, "epoch": 2666} {"train_loss": -12.740060806274414, "global_step": 448006, "epoch": 2666} {"train_loss": -12.90150260925293, "global_step": 448007, "epoch": 2666} {"train_loss": -12.545684814453125, "global_step": 448008, "epoch": 2666} {"train_loss": -12.498231887817383, "global_step": 448009, "epoch": 2666} {"train_loss": -11.650197982788086, "global_step": 448010, "epoch": 2666} {"train_loss": -11.822851181030273, "global_step": 448011, "epoch": 2666} {"train_loss": -12.32668399810791, "global_step": 448012, "epoch": 2666} {"train_loss": -12.656469345092773, "global_step": 448013, "epoch": 2666} {"train_loss": -12.463645935058594, "global_step": 448014, "epoch": 2666} {"train_loss": -11.669683456420898, "global_step": 448015, "epoch": 2666} {"train_loss": -11.705148696899414, "global_step": 448016, "epoch": 2666} {"train_loss": -10.064611434936523, "global_step": 448017, "epoch": 2666} {"train_loss": -12.095443725585938, "global_step": 448018, "epoch": 2666} {"train_loss": -12.006195068359375, "global_step": 448019, "epoch": 2666} {"train_loss": -10.311315536499023, "global_step": 448020, "epoch": 2666} {"train_loss": -10.700957298278809, "global_step": 448021, "epoch": 2666} {"train_loss": -11.391936302185059, "global_step": 448022, "epoch": 2666} {"train_loss": -9.907036781311035, "global_step": 448023, "epoch": 2666} {"train_loss": -9.560623168945312, "global_step": 448024, "epoch": 2666} {"train_loss": -9.407032012939453, "global_step": 448025, "epoch": 2666} {"train_loss": -9.80574893951416, "global_step": 448026, "epoch": 2666} {"train_loss": -9.27857780456543, "global_step": 448027, "epoch": 2666} {"train_loss": -10.833086013793945, "global_step": 448028, "epoch": 2666} {"train_loss": -9.751382827758789, "global_step": 448029, "epoch": 2666} {"train_loss": -9.712074279785156, "global_step": 448030, "epoch": 2666} {"train_loss": -10.51071548461914, "global_step": 448031, "epoch": 2666} {"train_loss": -11.338113784790039, "global_step": 448032, "epoch": 2666} {"train_loss": -10.080069541931152, "global_step": 448033, "epoch": 2666} {"train_loss": -10.633872032165527, "global_step": 448034, "epoch": 2666} {"train_loss": -10.48741626739502, "global_step": 448035, "epoch": 2666} {"train_loss": -11.295723915100098, "global_step": 448036, "epoch": 2666} {"train_loss": -11.212514877319336, "global_step": 448037, "epoch": 2666} {"train_loss": -11.00864028930664, "global_step": 448038, "epoch": 2666} {"train_loss": -11.163678169250488, "global_step": 448039, "epoch": 2666} {"train_loss": -11.386222839355469, "global_step": 448040, "epoch": 2666} {"train_loss": -11.215349197387695, "global_step": 448041, "epoch": 2666} {"train_loss": -11.717913627624512, "global_step": 448042, "epoch": 2666} {"train_loss": -10.883378982543945, "global_step": 448043, "epoch": 2666} {"train_loss": -11.707497596740723, "global_step": 448044, "epoch": 2666} {"train_loss": -11.580863952636719, "global_step": 448045, "epoch": 2666} {"train_loss": -11.129127502441406, "global_step": 448046, "epoch": 2666} {"train_loss": -11.795044898986816, "global_step": 448047, "epoch": 2666} {"train_loss": -11.325366020202637, "global_step": 448048, "epoch": 2666} {"train_loss": -11.954788208007812, "global_step": 448049, "epoch": 2666} {"train_loss": -11.41700553894043, "global_step": 448050, "epoch": 2666} {"train_loss": -11.171653747558594, "global_step": 448051, "epoch": 2666} {"train_loss": -12.388903617858887, "global_step": 448052, "epoch": 2666} {"train_loss": -11.45701789855957, "global_step": 448053, "epoch": 2666} {"train_loss": -11.819364547729492, "global_step": 448054, "epoch": 2666} {"train_loss": -11.936279018719992, "global_step": 448055, "epoch": 2666, "val_loss": 313516.75} {"train_loss": -12.230154037475586, "global_step": 448056, "epoch": 2667} {"train_loss": -11.89950180053711, "global_step": 448057, "epoch": 2667} {"train_loss": -12.180075645446777, "global_step": 448058, "epoch": 2667} {"train_loss": -11.646204948425293, "global_step": 448059, "epoch": 2667} {"train_loss": -11.620980262756348, "global_step": 448060, "epoch": 2667} {"train_loss": -11.765486717224121, "global_step": 448061, "epoch": 2667} {"train_loss": -12.181467056274414, "global_step": 448062, "epoch": 2667} {"train_loss": -11.220921516418457, "global_step": 448063, "epoch": 2667} {"train_loss": -11.618441581726074, "global_step": 448064, "epoch": 2667} {"train_loss": -11.394411087036133, "global_step": 448065, "epoch": 2667} {"train_loss": -10.4851655960083, "global_step": 448066, "epoch": 2667} {"train_loss": -11.693582534790039, "global_step": 448067, "epoch": 2667} {"train_loss": -11.136945724487305, "global_step": 448068, "epoch": 2667} {"train_loss": -11.230396270751953, "global_step": 448069, "epoch": 2667} {"train_loss": -11.965019226074219, "global_step": 448070, "epoch": 2667} {"train_loss": -11.638132095336914, "global_step": 448071, "epoch": 2667} {"train_loss": -11.452408790588379, "global_step": 448072, "epoch": 2667} {"train_loss": -11.733806610107422, "global_step": 448073, "epoch": 2667} {"train_loss": -11.256952285766602, "global_step": 448074, "epoch": 2667} {"train_loss": -11.521310806274414, "global_step": 448075, "epoch": 2667} {"train_loss": -11.61604118347168, "global_step": 448076, "epoch": 2667} {"train_loss": -12.058430671691895, "global_step": 448077, "epoch": 2667} {"train_loss": -11.98745346069336, "global_step": 448078, "epoch": 2667} {"train_loss": -11.888179779052734, "global_step": 448079, "epoch": 2667} {"train_loss": -11.859046936035156, "global_step": 448080, "epoch": 2667} {"train_loss": -11.812248229980469, "global_step": 448081, "epoch": 2667} {"train_loss": -11.854424476623535, "global_step": 448082, "epoch": 2667} {"train_loss": -12.021843910217285, "global_step": 448083, "epoch": 2667} {"train_loss": -12.13421630859375, "global_step": 448084, "epoch": 2667} {"train_loss": -12.170087814331055, "global_step": 448085, "epoch": 2667} {"train_loss": -12.344269752502441, "global_step": 448086, "epoch": 2667} {"train_loss": -11.933608055114746, "global_step": 448087, "epoch": 2667} {"train_loss": -11.727607727050781, "global_step": 448088, "epoch": 2667} {"train_loss": -11.664143562316895, "global_step": 448089, "epoch": 2667} {"train_loss": -11.808477401733398, "global_step": 448090, "epoch": 2667} {"train_loss": -12.012785911560059, "global_step": 448091, "epoch": 2667} {"train_loss": -12.20905876159668, "global_step": 448092, "epoch": 2667} {"train_loss": -11.840925216674805, "global_step": 448093, "epoch": 2667} {"train_loss": -12.375749588012695, "global_step": 448094, "epoch": 2667} {"train_loss": -11.993480682373047, "global_step": 448095, "epoch": 2667} {"train_loss": -12.212677001953125, "global_step": 448096, "epoch": 2667} {"train_loss": -12.255455017089844, "global_step": 448097, "epoch": 2667} {"train_loss": -11.838142395019531, "global_step": 448098, "epoch": 2667} {"train_loss": -12.40343952178955, "global_step": 448099, "epoch": 2667} {"train_loss": -11.60654354095459, "global_step": 448100, "epoch": 2667} {"train_loss": -12.51789665222168, "global_step": 448101, "epoch": 2667} {"train_loss": -11.942195892333984, "global_step": 448102, "epoch": 2667} {"train_loss": -12.315589904785156, "global_step": 448103, "epoch": 2667} {"train_loss": -12.336816787719727, "global_step": 448104, "epoch": 2667} {"train_loss": -11.942785263061523, "global_step": 448105, "epoch": 2667} {"train_loss": -12.27811336517334, "global_step": 448106, "epoch": 2667} {"train_loss": -12.527206420898438, "global_step": 448107, "epoch": 2667} {"train_loss": -12.433880805969238, "global_step": 448108, "epoch": 2667} {"train_loss": -12.75299072265625, "global_step": 448109, "epoch": 2667} {"train_loss": -12.534229278564453, "global_step": 448110, "epoch": 2667} {"train_loss": -12.681783676147461, "global_step": 448111, "epoch": 2667} {"train_loss": -12.508545875549316, "global_step": 448112, "epoch": 2667} {"train_loss": -12.571748733520508, "global_step": 448113, "epoch": 2667} {"train_loss": -12.396787643432617, "global_step": 448114, "epoch": 2667} {"train_loss": -12.679502487182617, "global_step": 448115, "epoch": 2667} {"train_loss": -12.450984001159668, "global_step": 448116, "epoch": 2667} {"train_loss": -12.399656295776367, "global_step": 448117, "epoch": 2667} {"train_loss": -12.536890029907227, "global_step": 448118, "epoch": 2667} {"train_loss": -12.628357887268066, "global_step": 448119, "epoch": 2667} {"train_loss": -12.691388130187988, "global_step": 448120, "epoch": 2667} {"train_loss": -12.504343032836914, "global_step": 448121, "epoch": 2667} {"train_loss": -12.727928161621094, "global_step": 448122, "epoch": 2667} {"train_loss": -12.565237045288086, "global_step": 448123, "epoch": 2667} {"train_loss": -12.581968307495117, "global_step": 448124, "epoch": 2667} {"train_loss": -12.554835319519043, "global_step": 448125, "epoch": 2667} {"train_loss": -12.648126602172852, "global_step": 448126, "epoch": 2667} {"train_loss": -12.348928451538086, "global_step": 448127, "epoch": 2667} {"train_loss": -12.601264953613281, "global_step": 448128, "epoch": 2667} {"train_loss": -12.646021842956543, "global_step": 448129, "epoch": 2667} {"train_loss": -12.635530471801758, "global_step": 448130, "epoch": 2667} {"train_loss": -12.72923469543457, "global_step": 448131, "epoch": 2667} {"train_loss": -12.8983736038208, "global_step": 448132, "epoch": 2667} {"train_loss": -12.407865524291992, "global_step": 448133, "epoch": 2667} {"train_loss": -12.662476539611816, "global_step": 448134, "epoch": 2667} {"train_loss": -12.483771324157715, "global_step": 448135, "epoch": 2667} {"train_loss": -12.695667266845703, "global_step": 448136, "epoch": 2667} {"train_loss": -12.705242156982422, "global_step": 448137, "epoch": 2667} {"train_loss": -12.5695161819458, "global_step": 448138, "epoch": 2667} {"train_loss": -12.601200103759766, "global_step": 448139, "epoch": 2667} {"train_loss": -12.48953914642334, "global_step": 448140, "epoch": 2667} {"train_loss": -12.760191917419434, "global_step": 448141, "epoch": 2667} {"train_loss": -12.233559608459473, "global_step": 448142, "epoch": 2667} {"train_loss": -12.610260009765625, "global_step": 448143, "epoch": 2667} {"train_loss": -12.756149291992188, "global_step": 448144, "epoch": 2667} {"train_loss": -12.59027099609375, "global_step": 448145, "epoch": 2667} {"train_loss": -12.210713386535645, "global_step": 448146, "epoch": 2667} {"train_loss": -12.720321655273438, "global_step": 448147, "epoch": 2667} {"train_loss": -12.624031066894531, "global_step": 448148, "epoch": 2667} {"train_loss": -12.726505279541016, "global_step": 448149, "epoch": 2667} {"train_loss": -12.385332107543945, "global_step": 448150, "epoch": 2667} {"train_loss": -12.484522819519043, "global_step": 448151, "epoch": 2667} {"train_loss": -12.475629806518555, "global_step": 448152, "epoch": 2667} {"train_loss": -12.108874320983887, "global_step": 448153, "epoch": 2667} {"train_loss": -11.029220581054688, "global_step": 448154, "epoch": 2667} {"train_loss": -12.040135383605957, "global_step": 448155, "epoch": 2667} {"train_loss": -10.973522186279297, "global_step": 448156, "epoch": 2667} {"train_loss": -11.407376289367676, "global_step": 448157, "epoch": 2667} {"train_loss": -10.507251739501953, "global_step": 448158, "epoch": 2667} {"train_loss": -10.186384201049805, "global_step": 448159, "epoch": 2667} {"train_loss": -12.31895923614502, "global_step": 448160, "epoch": 2667} {"train_loss": -10.158050537109375, "global_step": 448161, "epoch": 2667} {"train_loss": -12.260774612426758, "global_step": 448162, "epoch": 2667} {"train_loss": -10.269104957580566, "global_step": 448163, "epoch": 2667} {"train_loss": -9.89987564086914, "global_step": 448164, "epoch": 2667} {"train_loss": -11.112277030944824, "global_step": 448165, "epoch": 2667} {"train_loss": -10.570568084716797, "global_step": 448166, "epoch": 2667} {"train_loss": -9.29675006866455, "global_step": 448167, "epoch": 2667} {"train_loss": -11.208450317382812, "global_step": 448168, "epoch": 2667} {"train_loss": -11.022923469543457, "global_step": 448169, "epoch": 2667} {"train_loss": -10.505523681640625, "global_step": 448170, "epoch": 2667} {"train_loss": -10.398426055908203, "global_step": 448171, "epoch": 2667} {"train_loss": -10.80119514465332, "global_step": 448172, "epoch": 2667} {"train_loss": -11.609945297241211, "global_step": 448173, "epoch": 2667} {"train_loss": -9.739486694335938, "global_step": 448174, "epoch": 2667} {"train_loss": -10.881612777709961, "global_step": 448175, "epoch": 2667} {"train_loss": -11.306389808654785, "global_step": 448176, "epoch": 2667} {"train_loss": -11.113574028015137, "global_step": 448177, "epoch": 2667} {"train_loss": -11.074995040893555, "global_step": 448178, "epoch": 2667} {"train_loss": -11.318489074707031, "global_step": 448179, "epoch": 2667} {"train_loss": -11.553840637207031, "global_step": 448180, "epoch": 2667} {"train_loss": -11.619499206542969, "global_step": 448181, "epoch": 2667} {"train_loss": -11.840475082397461, "global_step": 448182, "epoch": 2667} {"train_loss": -11.601499557495117, "global_step": 448183, "epoch": 2667} {"train_loss": -12.257182121276855, "global_step": 448184, "epoch": 2667} {"train_loss": -11.504902839660645, "global_step": 448185, "epoch": 2667} {"train_loss": -12.187214851379395, "global_step": 448186, "epoch": 2667} {"train_loss": -11.087881088256836, "global_step": 448187, "epoch": 2667} {"train_loss": -12.12149429321289, "global_step": 448188, "epoch": 2667} {"train_loss": -11.466411590576172, "global_step": 448189, "epoch": 2667} {"train_loss": -11.834840774536133, "global_step": 448190, "epoch": 2667} {"train_loss": -12.01976490020752, "global_step": 448191, "epoch": 2667} {"train_loss": -11.512514114379883, "global_step": 448192, "epoch": 2667} {"train_loss": -12.226184844970703, "global_step": 448193, "epoch": 2667} {"train_loss": -11.474358558654785, "global_step": 448194, "epoch": 2667} {"train_loss": -12.221258163452148, "global_step": 448195, "epoch": 2667} {"train_loss": -12.050593376159668, "global_step": 448196, "epoch": 2667} {"train_loss": -12.407525062561035, "global_step": 448197, "epoch": 2667} {"train_loss": -11.961183547973633, "global_step": 448198, "epoch": 2667} {"train_loss": -12.085622787475586, "global_step": 448199, "epoch": 2667} {"train_loss": -12.21910285949707, "global_step": 448200, "epoch": 2667} {"train_loss": -12.1675443649292, "global_step": 448201, "epoch": 2667} {"train_loss": -12.143462181091309, "global_step": 448202, "epoch": 2667} {"train_loss": -12.138461112976074, "global_step": 448203, "epoch": 2667} {"train_loss": -12.347024917602539, "global_step": 448204, "epoch": 2667} {"train_loss": -11.98831558227539, "global_step": 448205, "epoch": 2667} {"train_loss": -12.174657821655273, "global_step": 448206, "epoch": 2667} {"train_loss": -11.879868507385254, "global_step": 448207, "epoch": 2667} {"train_loss": -12.05154037475586, "global_step": 448208, "epoch": 2667} {"train_loss": -12.417975425720215, "global_step": 448209, "epoch": 2667} {"train_loss": -12.312673568725586, "global_step": 448210, "epoch": 2667} {"train_loss": -12.279006958007812, "global_step": 448211, "epoch": 2667} {"train_loss": -12.227596282958984, "global_step": 448212, "epoch": 2667} {"train_loss": -12.587007522583008, "global_step": 448213, "epoch": 2667} {"train_loss": -12.403422355651855, "global_step": 448214, "epoch": 2667} {"train_loss": -12.56205940246582, "global_step": 448215, "epoch": 2667} {"train_loss": -12.469289779663086, "global_step": 448216, "epoch": 2667} {"train_loss": -12.349000930786133, "global_step": 448217, "epoch": 2667} {"train_loss": -12.487537384033203, "global_step": 448218, "epoch": 2667} {"train_loss": -12.596985816955566, "global_step": 448219, "epoch": 2667} {"train_loss": -12.476566314697266, "global_step": 448220, "epoch": 2667} {"train_loss": -12.670424461364746, "global_step": 448221, "epoch": 2667} {"train_loss": -12.628616333007812, "global_step": 448222, "epoch": 2667} {"train_loss": -11.971997567585536, "global_step": 448223, "epoch": 2667, "val_loss": 314612.0} {"train_loss": -12.579130172729492, "global_step": 448224, "epoch": 2668} {"train_loss": -12.591880798339844, "global_step": 448225, "epoch": 2668} {"train_loss": -12.90611457824707, "global_step": 448226, "epoch": 2668} {"train_loss": -12.6339111328125, "global_step": 448227, "epoch": 2668} {"train_loss": -12.60812759399414, "global_step": 448228, "epoch": 2668} {"train_loss": -12.505516052246094, "global_step": 448229, "epoch": 2668} {"train_loss": -12.614209175109863, "global_step": 448230, "epoch": 2668} {"train_loss": -12.835794448852539, "global_step": 448231, "epoch": 2668} {"train_loss": -12.442926406860352, "global_step": 448232, "epoch": 2668} {"train_loss": -12.546077728271484, "global_step": 448233, "epoch": 2668} {"train_loss": -12.674263954162598, "global_step": 448234, "epoch": 2668} {"train_loss": -12.190074920654297, "global_step": 448235, "epoch": 2668} {"train_loss": -12.69896125793457, "global_step": 448236, "epoch": 2668} {"train_loss": -12.495749473571777, "global_step": 448237, "epoch": 2668} {"train_loss": -12.519120216369629, "global_step": 448238, "epoch": 2668} {"train_loss": -12.512428283691406, "global_step": 448239, "epoch": 2668} {"train_loss": -12.675475120544434, "global_step": 448240, "epoch": 2668} {"train_loss": -12.670507431030273, "global_step": 448241, "epoch": 2668} {"train_loss": -12.610816955566406, "global_step": 448242, "epoch": 2668} {"train_loss": -12.6101655960083, "global_step": 448243, "epoch": 2668} {"train_loss": -12.851249694824219, "global_step": 448244, "epoch": 2668} {"train_loss": -12.81751823425293, "global_step": 448245, "epoch": 2668} {"train_loss": -12.629549026489258, "global_step": 448246, "epoch": 2668} {"train_loss": -12.975042343139648, "global_step": 448247, "epoch": 2668} {"train_loss": -12.440020561218262, "global_step": 448248, "epoch": 2668} {"train_loss": -12.709294319152832, "global_step": 448249, "epoch": 2668} {"train_loss": -12.662128448486328, "global_step": 448250, "epoch": 2668} {"train_loss": -12.42987060546875, "global_step": 448251, "epoch": 2668} {"train_loss": -12.775779724121094, "global_step": 448252, "epoch": 2668} {"train_loss": -12.551958084106445, "global_step": 448253, "epoch": 2668} {"train_loss": -12.491125106811523, "global_step": 448254, "epoch": 2668} {"train_loss": -12.410064697265625, "global_step": 448255, "epoch": 2668} {"train_loss": -12.858833312988281, "global_step": 448256, "epoch": 2668} {"train_loss": -12.541922569274902, "global_step": 448257, "epoch": 2668} {"train_loss": -12.53348159790039, "global_step": 448258, "epoch": 2668} {"train_loss": -12.736696243286133, "global_step": 448259, "epoch": 2668} {"train_loss": -12.622140884399414, "global_step": 448260, "epoch": 2668} {"train_loss": -12.786319732666016, "global_step": 448261, "epoch": 2668} {"train_loss": -12.97917366027832, "global_step": 448262, "epoch": 2668} {"train_loss": -12.836152076721191, "global_step": 448263, "epoch": 2668} {"train_loss": -12.802982330322266, "global_step": 448264, "epoch": 2668} {"train_loss": -12.512075424194336, "global_step": 448265, "epoch": 2668} {"train_loss": -12.723613739013672, "global_step": 448266, "epoch": 2668} {"train_loss": -12.564894676208496, "global_step": 448267, "epoch": 2668} {"train_loss": -12.816222190856934, "global_step": 448268, "epoch": 2668} {"train_loss": -12.947399139404297, "global_step": 448269, "epoch": 2668} {"train_loss": -12.470541000366211, "global_step": 448270, "epoch": 2668} {"train_loss": -12.478753089904785, "global_step": 448271, "epoch": 2668} {"train_loss": -12.83445930480957, "global_step": 448272, "epoch": 2668} {"train_loss": -12.532233238220215, "global_step": 448273, "epoch": 2668} {"train_loss": -12.509173393249512, "global_step": 448274, "epoch": 2668} {"train_loss": -12.90629768371582, "global_step": 448275, "epoch": 2668} {"train_loss": -12.952704429626465, "global_step": 448276, "epoch": 2668} {"train_loss": -12.46487045288086, "global_step": 448277, "epoch": 2668} {"train_loss": -12.90599250793457, "global_step": 448278, "epoch": 2668} {"train_loss": -12.667964935302734, "global_step": 448279, "epoch": 2668} {"train_loss": -12.663774490356445, "global_step": 448280, "epoch": 2668} {"train_loss": -12.863348007202148, "global_step": 448281, "epoch": 2668} {"train_loss": -12.954513549804688, "global_step": 448282, "epoch": 2668} {"train_loss": -12.544149398803711, "global_step": 448283, "epoch": 2668} {"train_loss": -12.77903938293457, "global_step": 448284, "epoch": 2668} {"train_loss": -12.686335563659668, "global_step": 448285, "epoch": 2668} {"train_loss": -12.935609817504883, "global_step": 448286, "epoch": 2668} {"train_loss": -12.652099609375, "global_step": 448287, "epoch": 2668} {"train_loss": -12.679641723632812, "global_step": 448288, "epoch": 2668} {"train_loss": -12.87913703918457, "global_step": 448289, "epoch": 2668} {"train_loss": -12.965757369995117, "global_step": 448290, "epoch": 2668} {"train_loss": -12.55048942565918, "global_step": 448291, "epoch": 2668} {"train_loss": -12.68229866027832, "global_step": 448292, "epoch": 2668} {"train_loss": -13.019455909729004, "global_step": 448293, "epoch": 2668} {"train_loss": -12.64801025390625, "global_step": 448294, "epoch": 2668} {"train_loss": -12.34637451171875, "global_step": 448295, "epoch": 2668} {"train_loss": -12.386016845703125, "global_step": 448296, "epoch": 2668} {"train_loss": -12.631714820861816, "global_step": 448297, "epoch": 2668} {"train_loss": -12.170083999633789, "global_step": 448298, "epoch": 2668} {"train_loss": -10.678018569946289, "global_step": 448299, "epoch": 2668} {"train_loss": -12.59252643585205, "global_step": 448300, "epoch": 2668} {"train_loss": -12.195899963378906, "global_step": 448301, "epoch": 2668} {"train_loss": -11.174388885498047, "global_step": 448302, "epoch": 2668} {"train_loss": -11.782548904418945, "global_step": 448303, "epoch": 2668} {"train_loss": -12.626806259155273, "global_step": 448304, "epoch": 2668} {"train_loss": -11.985909461975098, "global_step": 448305, "epoch": 2668} {"train_loss": -11.832313537597656, "global_step": 448306, "epoch": 2668} {"train_loss": -12.092939376831055, "global_step": 448307, "epoch": 2668} {"train_loss": -12.451774597167969, "global_step": 448308, "epoch": 2668} {"train_loss": -10.99874496459961, "global_step": 448309, "epoch": 2668} {"train_loss": -10.612911224365234, "global_step": 448310, "epoch": 2668} {"train_loss": -10.887765884399414, "global_step": 448311, "epoch": 2668} {"train_loss": -11.579330444335938, "global_step": 448312, "epoch": 2668} {"train_loss": -11.321569442749023, "global_step": 448313, "epoch": 2668} {"train_loss": -10.124703407287598, "global_step": 448314, "epoch": 2668} {"train_loss": -9.379145622253418, "global_step": 448315, "epoch": 2668} {"train_loss": -9.33718490600586, "global_step": 448316, "epoch": 2668} {"train_loss": -10.535025596618652, "global_step": 448317, "epoch": 2668} {"train_loss": -10.536296844482422, "global_step": 448318, "epoch": 2668} {"train_loss": -10.635643005371094, "global_step": 448319, "epoch": 2668} {"train_loss": -9.918722152709961, "global_step": 448320, "epoch": 2668} {"train_loss": -11.807011604309082, "global_step": 448321, "epoch": 2668} {"train_loss": -10.786429405212402, "global_step": 448322, "epoch": 2668} {"train_loss": -11.034584045410156, "global_step": 448323, "epoch": 2668} {"train_loss": -11.637840270996094, "global_step": 448324, "epoch": 2668} {"train_loss": -11.121627807617188, "global_step": 448325, "epoch": 2668} {"train_loss": -11.546127319335938, "global_step": 448326, "epoch": 2668} {"train_loss": -11.865289688110352, "global_step": 448327, "epoch": 2668} {"train_loss": -11.347480773925781, "global_step": 448328, "epoch": 2668} {"train_loss": -11.85268783569336, "global_step": 448329, "epoch": 2668} {"train_loss": -11.182748794555664, "global_step": 448330, "epoch": 2668} {"train_loss": -11.558635711669922, "global_step": 448331, "epoch": 2668} {"train_loss": -11.7183256149292, "global_step": 448332, "epoch": 2668} {"train_loss": -11.442506790161133, "global_step": 448333, "epoch": 2668} {"train_loss": -11.887537002563477, "global_step": 448334, "epoch": 2668} {"train_loss": -11.265493392944336, "global_step": 448335, "epoch": 2668} {"train_loss": -11.756608963012695, "global_step": 448336, "epoch": 2668} {"train_loss": -11.494192123413086, "global_step": 448337, "epoch": 2668} {"train_loss": -11.225637435913086, "global_step": 448338, "epoch": 2668} {"train_loss": -12.09296989440918, "global_step": 448339, "epoch": 2668} {"train_loss": -11.339841842651367, "global_step": 448340, "epoch": 2668} {"train_loss": -11.5697021484375, "global_step": 448341, "epoch": 2668} {"train_loss": -10.581708908081055, "global_step": 448342, "epoch": 2668} {"train_loss": -11.131937980651855, "global_step": 448343, "epoch": 2668} {"train_loss": -10.845144271850586, "global_step": 448344, "epoch": 2668} {"train_loss": -10.776176452636719, "global_step": 448345, "epoch": 2668} {"train_loss": -10.717082977294922, "global_step": 448346, "epoch": 2668} {"train_loss": -10.573587417602539, "global_step": 448347, "epoch": 2668} {"train_loss": -10.495959281921387, "global_step": 448348, "epoch": 2668} {"train_loss": -10.233833312988281, "global_step": 448349, "epoch": 2668} {"train_loss": -11.15412712097168, "global_step": 448350, "epoch": 2668} {"train_loss": -10.005939483642578, "global_step": 448351, "epoch": 2668} {"train_loss": -11.610889434814453, "global_step": 448352, "epoch": 2668} {"train_loss": -9.481901168823242, "global_step": 448353, "epoch": 2668} {"train_loss": -9.97583293914795, "global_step": 448354, "epoch": 2668} {"train_loss": -9.963712692260742, "global_step": 448355, "epoch": 2668} {"train_loss": -11.003984451293945, "global_step": 448356, "epoch": 2668} {"train_loss": -10.117101669311523, "global_step": 448357, "epoch": 2668} {"train_loss": -10.842523574829102, "global_step": 448358, "epoch": 2668} {"train_loss": -11.114405632019043, "global_step": 448359, "epoch": 2668} {"train_loss": -10.815303802490234, "global_step": 448360, "epoch": 2668} {"train_loss": -11.575763702392578, "global_step": 448361, "epoch": 2668} {"train_loss": -10.814650535583496, "global_step": 448362, "epoch": 2668} {"train_loss": -10.704140663146973, "global_step": 448363, "epoch": 2668} {"train_loss": -11.716523170471191, "global_step": 448364, "epoch": 2668} {"train_loss": -10.819242477416992, "global_step": 448365, "epoch": 2668} {"train_loss": -10.806899070739746, "global_step": 448366, "epoch": 2668} {"train_loss": -10.425758361816406, "global_step": 448367, "epoch": 2668} {"train_loss": -11.352948188781738, "global_step": 448368, "epoch": 2668} {"train_loss": -11.058177947998047, "global_step": 448369, "epoch": 2668} {"train_loss": -11.611547470092773, "global_step": 448370, "epoch": 2668} {"train_loss": -10.875452041625977, "global_step": 448371, "epoch": 2668} {"train_loss": -10.893445014953613, "global_step": 448372, "epoch": 2668} {"train_loss": -11.673166275024414, "global_step": 448373, "epoch": 2668} {"train_loss": -10.497264862060547, "global_step": 448374, "epoch": 2668} {"train_loss": -11.218619346618652, "global_step": 448375, "epoch": 2668} {"train_loss": -11.919896125793457, "global_step": 448376, "epoch": 2668} {"train_loss": -11.581999778747559, "global_step": 448377, "epoch": 2668} {"train_loss": -11.810020446777344, "global_step": 448378, "epoch": 2668} {"train_loss": -11.855391502380371, "global_step": 448379, "epoch": 2668} {"train_loss": -11.786995887756348, "global_step": 448380, "epoch": 2668} {"train_loss": -12.043439865112305, "global_step": 448381, "epoch": 2668} {"train_loss": -11.299957275390625, "global_step": 448382, "epoch": 2668} {"train_loss": -12.208044052124023, "global_step": 448383, "epoch": 2668} {"train_loss": -11.092430114746094, "global_step": 448384, "epoch": 2668} {"train_loss": -12.003314971923828, "global_step": 448385, "epoch": 2668} {"train_loss": -11.064502716064453, "global_step": 448386, "epoch": 2668} {"train_loss": -11.605175018310547, "global_step": 448387, "epoch": 2668} {"train_loss": -11.472196578979492, "global_step": 448388, "epoch": 2668} {"train_loss": -11.567168235778809, "global_step": 448389, "epoch": 2668} {"train_loss": -11.949665069580078, "global_step": 448390, "epoch": 2668} {"train_loss": -11.850131613867623, "global_step": 448391, "epoch": 2668, "val_loss": 314446.6875} {"train_loss": -12.35998821258545, "global_step": 448392, "epoch": 2669} {"train_loss": -11.655685424804688, "global_step": 448393, "epoch": 2669} {"train_loss": -12.210714340209961, "global_step": 448394, "epoch": 2669} {"train_loss": -11.954313278198242, "global_step": 448395, "epoch": 2669} {"train_loss": -12.182212829589844, "global_step": 448396, "epoch": 2669} {"train_loss": -11.776606559753418, "global_step": 448397, "epoch": 2669} {"train_loss": -12.142789840698242, "global_step": 448398, "epoch": 2669} {"train_loss": -12.04275131225586, "global_step": 448399, "epoch": 2669} {"train_loss": -12.26241397857666, "global_step": 448400, "epoch": 2669} {"train_loss": -12.184962272644043, "global_step": 448401, "epoch": 2669} {"train_loss": -12.051918983459473, "global_step": 448402, "epoch": 2669} {"train_loss": -11.872815132141113, "global_step": 448403, "epoch": 2669} {"train_loss": -12.323655128479004, "global_step": 448404, "epoch": 2669} {"train_loss": -11.727386474609375, "global_step": 448405, "epoch": 2669} {"train_loss": -12.080780029296875, "global_step": 448406, "epoch": 2669} {"train_loss": -12.339790344238281, "global_step": 448407, "epoch": 2669} {"train_loss": -11.971839904785156, "global_step": 448408, "epoch": 2669} {"train_loss": -12.424491882324219, "global_step": 448409, "epoch": 2669} {"train_loss": -12.19847297668457, "global_step": 448410, "epoch": 2669} {"train_loss": -12.340704917907715, "global_step": 448411, "epoch": 2669} {"train_loss": -12.158321380615234, "global_step": 448412, "epoch": 2669} {"train_loss": -12.461990356445312, "global_step": 448413, "epoch": 2669} {"train_loss": -12.04141902923584, "global_step": 448414, "epoch": 2669} {"train_loss": -12.587271690368652, "global_step": 448415, "epoch": 2669} {"train_loss": -12.012079238891602, "global_step": 448416, "epoch": 2669} {"train_loss": -12.44814682006836, "global_step": 448417, "epoch": 2669} {"train_loss": -12.171012878417969, "global_step": 448418, "epoch": 2669} {"train_loss": -12.396939277648926, "global_step": 448419, "epoch": 2669} {"train_loss": -12.286308288574219, "global_step": 448420, "epoch": 2669} {"train_loss": -12.488494873046875, "global_step": 448421, "epoch": 2669} {"train_loss": -12.399203300476074, "global_step": 448422, "epoch": 2669} {"train_loss": -12.550674438476562, "global_step": 448423, "epoch": 2669} {"train_loss": -12.545401573181152, "global_step": 448424, "epoch": 2669} {"train_loss": -12.755535125732422, "global_step": 448425, "epoch": 2669} {"train_loss": -12.545173645019531, "global_step": 448426, "epoch": 2669} {"train_loss": -12.409976959228516, "global_step": 448427, "epoch": 2669} {"train_loss": -12.571809768676758, "global_step": 448428, "epoch": 2669} {"train_loss": -12.595033645629883, "global_step": 448429, "epoch": 2669} {"train_loss": -12.579009056091309, "global_step": 448430, "epoch": 2669} {"train_loss": -12.730531692504883, "global_step": 448431, "epoch": 2669} {"train_loss": -12.547240257263184, "global_step": 448432, "epoch": 2669} {"train_loss": -12.52048397064209, "global_step": 448433, "epoch": 2669} {"train_loss": -12.550776481628418, "global_step": 448434, "epoch": 2669} {"train_loss": -12.572908401489258, "global_step": 448435, "epoch": 2669} {"train_loss": -12.47979736328125, "global_step": 448436, "epoch": 2669} {"train_loss": -12.58846664428711, "global_step": 448437, "epoch": 2669} {"train_loss": -12.640623092651367, "global_step": 448438, "epoch": 2669} {"train_loss": -12.656656265258789, "global_step": 448439, "epoch": 2669} {"train_loss": -12.604334831237793, "global_step": 448440, "epoch": 2669} {"train_loss": -12.613924026489258, "global_step": 448441, "epoch": 2669} {"train_loss": -12.876489639282227, "global_step": 448442, "epoch": 2669} {"train_loss": -12.616287231445312, "global_step": 448443, "epoch": 2669} {"train_loss": -12.6143798828125, "global_step": 448444, "epoch": 2669} {"train_loss": -12.570040702819824, "global_step": 448445, "epoch": 2669} {"train_loss": -12.583590507507324, "global_step": 448446, "epoch": 2669} {"train_loss": -12.727869033813477, "global_step": 448447, "epoch": 2669} {"train_loss": -12.530694007873535, "global_step": 448448, "epoch": 2669} {"train_loss": -12.701337814331055, "global_step": 448449, "epoch": 2669} {"train_loss": -12.686962127685547, "global_step": 448450, "epoch": 2669} {"train_loss": -12.879894256591797, "global_step": 448451, "epoch": 2669} {"train_loss": -12.720221519470215, "global_step": 448452, "epoch": 2669} {"train_loss": -12.833406448364258, "global_step": 448453, "epoch": 2669} {"train_loss": -12.639518737792969, "global_step": 448454, "epoch": 2669} {"train_loss": -12.712207794189453, "global_step": 448455, "epoch": 2669} {"train_loss": -13.045842170715332, "global_step": 448456, "epoch": 2669} {"train_loss": -12.475086212158203, "global_step": 448457, "epoch": 2669} {"train_loss": -12.905302047729492, "global_step": 448458, "epoch": 2669} {"train_loss": -12.571334838867188, "global_step": 448459, "epoch": 2669} {"train_loss": -12.781397819519043, "global_step": 448460, "epoch": 2669} {"train_loss": -12.87855339050293, "global_step": 448461, "epoch": 2669} {"train_loss": -12.558296203613281, "global_step": 448462, "epoch": 2669} {"train_loss": -12.697145462036133, "global_step": 448463, "epoch": 2669} {"train_loss": -12.683711051940918, "global_step": 448464, "epoch": 2669} {"train_loss": -12.703384399414062, "global_step": 448465, "epoch": 2669} {"train_loss": -12.730205535888672, "global_step": 448466, "epoch": 2669} {"train_loss": -12.956490516662598, "global_step": 448467, "epoch": 2669} {"train_loss": -12.897764205932617, "global_step": 448468, "epoch": 2669} {"train_loss": -12.915987014770508, "global_step": 448469, "epoch": 2669} {"train_loss": -12.730966567993164, "global_step": 448470, "epoch": 2669} {"train_loss": -12.68806266784668, "global_step": 448471, "epoch": 2669} {"train_loss": -12.789971351623535, "global_step": 448472, "epoch": 2669} {"train_loss": -12.687093734741211, "global_step": 448473, "epoch": 2669} {"train_loss": -13.068519592285156, "global_step": 448474, "epoch": 2669} {"train_loss": -12.954730033874512, "global_step": 448475, "epoch": 2669} {"train_loss": -12.903706550598145, "global_step": 448476, "epoch": 2669} {"train_loss": -12.872879981994629, "global_step": 448477, "epoch": 2669} {"train_loss": -12.837024688720703, "global_step": 448478, "epoch": 2669} {"train_loss": -12.951730728149414, "global_step": 448479, "epoch": 2669} {"train_loss": -12.806909561157227, "global_step": 448480, "epoch": 2669} {"train_loss": -12.713836669921875, "global_step": 448481, "epoch": 2669} {"train_loss": -12.494356155395508, "global_step": 448482, "epoch": 2669} {"train_loss": -12.763772964477539, "global_step": 448483, "epoch": 2669} {"train_loss": -13.011537551879883, "global_step": 448484, "epoch": 2669} {"train_loss": -12.733136177062988, "global_step": 448485, "epoch": 2669} {"train_loss": -12.661107063293457, "global_step": 448486, "epoch": 2669} {"train_loss": -12.879570007324219, "global_step": 448487, "epoch": 2669} {"train_loss": -12.693166732788086, "global_step": 448488, "epoch": 2669} {"train_loss": -12.991878509521484, "global_step": 448489, "epoch": 2669} {"train_loss": -12.889412879943848, "global_step": 448490, "epoch": 2669} {"train_loss": -12.946471214294434, "global_step": 448491, "epoch": 2669} {"train_loss": -13.005426406860352, "global_step": 448492, "epoch": 2669} {"train_loss": -12.828498840332031, "global_step": 448493, "epoch": 2669} {"train_loss": -12.948896408081055, "global_step": 448494, "epoch": 2669} {"train_loss": -12.654510498046875, "global_step": 448495, "epoch": 2669} {"train_loss": -12.235782623291016, "global_step": 448496, "epoch": 2669} {"train_loss": -12.743871688842773, "global_step": 448497, "epoch": 2669} {"train_loss": -12.45752239227295, "global_step": 448498, "epoch": 2669} {"train_loss": -12.343795776367188, "global_step": 448499, "epoch": 2669} {"train_loss": -12.302495956420898, "global_step": 448500, "epoch": 2669} {"train_loss": -12.95500373840332, "global_step": 448501, "epoch": 2669} {"train_loss": -12.203231811523438, "global_step": 448502, "epoch": 2669} {"train_loss": -12.046072006225586, "global_step": 448503, "epoch": 2669} {"train_loss": -12.173130989074707, "global_step": 448504, "epoch": 2669} {"train_loss": -11.958816528320312, "global_step": 448505, "epoch": 2669} {"train_loss": -10.834441184997559, "global_step": 448506, "epoch": 2669} {"train_loss": -12.093379974365234, "global_step": 448507, "epoch": 2669} {"train_loss": -12.247166633605957, "global_step": 448508, "epoch": 2669} {"train_loss": -12.147722244262695, "global_step": 448509, "epoch": 2669} {"train_loss": -11.904970169067383, "global_step": 448510, "epoch": 2669} {"train_loss": -12.521432876586914, "global_step": 448511, "epoch": 2669} {"train_loss": -11.207396507263184, "global_step": 448512, "epoch": 2669} {"train_loss": -10.675704956054688, "global_step": 448513, "epoch": 2669} {"train_loss": -12.762117385864258, "global_step": 448514, "epoch": 2669} {"train_loss": -10.709382057189941, "global_step": 448515, "epoch": 2669} {"train_loss": -12.112587928771973, "global_step": 448516, "epoch": 2669} {"train_loss": -11.902566909790039, "global_step": 448517, "epoch": 2669} {"train_loss": -11.241593360900879, "global_step": 448518, "epoch": 2669} {"train_loss": -11.415483474731445, "global_step": 448519, "epoch": 2669} {"train_loss": -11.385194778442383, "global_step": 448520, "epoch": 2669} {"train_loss": -11.265292167663574, "global_step": 448521, "epoch": 2669} {"train_loss": -11.7550048828125, "global_step": 448522, "epoch": 2669} {"train_loss": -10.801937103271484, "global_step": 448523, "epoch": 2669} {"train_loss": -11.836006164550781, "global_step": 448524, "epoch": 2669} {"train_loss": -12.192614555358887, "global_step": 448525, "epoch": 2669} {"train_loss": -11.660837173461914, "global_step": 448526, "epoch": 2669} {"train_loss": -10.358123779296875, "global_step": 448527, "epoch": 2669} {"train_loss": -12.484569549560547, "global_step": 448528, "epoch": 2669} {"train_loss": -10.47569465637207, "global_step": 448529, "epoch": 2669} {"train_loss": -11.598384857177734, "global_step": 448530, "epoch": 2669} {"train_loss": -12.081209182739258, "global_step": 448531, "epoch": 2669} {"train_loss": -9.451807022094727, "global_step": 448532, "epoch": 2669} {"train_loss": -11.64462947845459, "global_step": 448533, "epoch": 2669} {"train_loss": -10.153074264526367, "global_step": 448534, "epoch": 2669} {"train_loss": -11.044400215148926, "global_step": 448535, "epoch": 2669} {"train_loss": -10.605870246887207, "global_step": 448536, "epoch": 2669} {"train_loss": -11.70305061340332, "global_step": 448537, "epoch": 2669} {"train_loss": -12.063521385192871, "global_step": 448538, "epoch": 2669} {"train_loss": -11.471212387084961, "global_step": 448539, "epoch": 2669} {"train_loss": -11.700124740600586, "global_step": 448540, "epoch": 2669} {"train_loss": -11.640233039855957, "global_step": 448541, "epoch": 2669} {"train_loss": -11.31263542175293, "global_step": 448542, "epoch": 2669} {"train_loss": -11.68297004699707, "global_step": 448543, "epoch": 2669} {"train_loss": -10.568367004394531, "global_step": 448544, "epoch": 2669} {"train_loss": -12.222710609436035, "global_step": 448545, "epoch": 2669} {"train_loss": -11.559803009033203, "global_step": 448546, "epoch": 2669} {"train_loss": -12.270628929138184, "global_step": 448547, "epoch": 2669} {"train_loss": -11.343732833862305, "global_step": 448548, "epoch": 2669} {"train_loss": -12.2178955078125, "global_step": 448549, "epoch": 2669} {"train_loss": -11.49395751953125, "global_step": 448550, "epoch": 2669} {"train_loss": -11.991436004638672, "global_step": 448551, "epoch": 2669} {"train_loss": -11.110858917236328, "global_step": 448552, "epoch": 2669} {"train_loss": -10.859964370727539, "global_step": 448553, "epoch": 2669} {"train_loss": -11.922725677490234, "global_step": 448554, "epoch": 2669} {"train_loss": -11.051835060119629, "global_step": 448555, "epoch": 2669} {"train_loss": -12.348122596740723, "global_step": 448556, "epoch": 2669} {"train_loss": -11.198976516723633, "global_step": 448557, "epoch": 2669} {"train_loss": -12.21651840209961, "global_step": 448558, "epoch": 2669} {"train_loss": -12.214983139719282, "global_step": 448559, "epoch": 2669, "val_loss": 314850.625} {"train_loss": -10.478109359741211, "global_step": 448560, "epoch": 2670} {"train_loss": -11.960023880004883, "global_step": 448561, "epoch": 2670} {"train_loss": -11.338226318359375, "global_step": 448562, "epoch": 2670} {"train_loss": -12.131811141967773, "global_step": 448563, "epoch": 2670} {"train_loss": -12.24551010131836, "global_step": 448564, "epoch": 2670} {"train_loss": -11.981432914733887, "global_step": 448565, "epoch": 2670} {"train_loss": -12.143506050109863, "global_step": 448566, "epoch": 2670} {"train_loss": -11.761920928955078, "global_step": 448567, "epoch": 2670} {"train_loss": -12.278961181640625, "global_step": 448568, "epoch": 2670} {"train_loss": -11.661735534667969, "global_step": 448569, "epoch": 2670} {"train_loss": -12.310510635375977, "global_step": 448570, "epoch": 2670} {"train_loss": -12.002647399902344, "global_step": 448571, "epoch": 2670} {"train_loss": -12.37301254272461, "global_step": 448572, "epoch": 2670} {"train_loss": -12.084982872009277, "global_step": 448573, "epoch": 2670} {"train_loss": -12.150816917419434, "global_step": 448574, "epoch": 2670} {"train_loss": -12.000255584716797, "global_step": 448575, "epoch": 2670} {"train_loss": -12.017393112182617, "global_step": 448576, "epoch": 2670} {"train_loss": -12.057713508605957, "global_step": 448577, "epoch": 2670} {"train_loss": -11.81820011138916, "global_step": 448578, "epoch": 2670} {"train_loss": -12.504667282104492, "global_step": 448579, "epoch": 2670} {"train_loss": -12.084056854248047, "global_step": 448580, "epoch": 2670} {"train_loss": -12.42798900604248, "global_step": 448581, "epoch": 2670} {"train_loss": -12.367034912109375, "global_step": 448582, "epoch": 2670} {"train_loss": -12.224075317382812, "global_step": 448583, "epoch": 2670} {"train_loss": -12.290257453918457, "global_step": 448584, "epoch": 2670} {"train_loss": -12.492898941040039, "global_step": 448585, "epoch": 2670} {"train_loss": -12.60702133178711, "global_step": 448586, "epoch": 2670} {"train_loss": -12.469024658203125, "global_step": 448587, "epoch": 2670} {"train_loss": -12.544471740722656, "global_step": 448588, "epoch": 2670} {"train_loss": -12.337806701660156, "global_step": 448589, "epoch": 2670} {"train_loss": -12.40255069732666, "global_step": 448590, "epoch": 2670} {"train_loss": -12.534828186035156, "global_step": 448591, "epoch": 2670} {"train_loss": -12.58956527709961, "global_step": 448592, "epoch": 2670} {"train_loss": -12.668839454650879, "global_step": 448593, "epoch": 2670} {"train_loss": -12.307273864746094, "global_step": 448594, "epoch": 2670} {"train_loss": -12.43971061706543, "global_step": 448595, "epoch": 2670} {"train_loss": -12.188868522644043, "global_step": 448596, "epoch": 2670} {"train_loss": -12.336837768554688, "global_step": 448597, "epoch": 2670} {"train_loss": -12.4810791015625, "global_step": 448598, "epoch": 2670} {"train_loss": -12.219327926635742, "global_step": 448599, "epoch": 2670} {"train_loss": -12.714792251586914, "global_step": 448600, "epoch": 2670} {"train_loss": -12.319721221923828, "global_step": 448601, "epoch": 2670} {"train_loss": -12.826343536376953, "global_step": 448602, "epoch": 2670} {"train_loss": -12.426596641540527, "global_step": 448603, "epoch": 2670} {"train_loss": -12.669838905334473, "global_step": 448604, "epoch": 2670} {"train_loss": -12.372886657714844, "global_step": 448605, "epoch": 2670} {"train_loss": -12.68752384185791, "global_step": 448606, "epoch": 2670} {"train_loss": -12.571061134338379, "global_step": 448607, "epoch": 2670} {"train_loss": -12.64422607421875, "global_step": 448608, "epoch": 2670} {"train_loss": -12.568156242370605, "global_step": 448609, "epoch": 2670} {"train_loss": -12.054864883422852, "global_step": 448610, "epoch": 2670} {"train_loss": -12.652892112731934, "global_step": 448611, "epoch": 2670} {"train_loss": -12.085710525512695, "global_step": 448612, "epoch": 2670} {"train_loss": -12.619016647338867, "global_step": 448613, "epoch": 2670} {"train_loss": -12.599687576293945, "global_step": 448614, "epoch": 2670} {"train_loss": -12.10079574584961, "global_step": 448615, "epoch": 2670} {"train_loss": -12.640461921691895, "global_step": 448616, "epoch": 2670} {"train_loss": -12.36029052734375, "global_step": 448617, "epoch": 2670} {"train_loss": -12.577648162841797, "global_step": 448618, "epoch": 2670} {"train_loss": -12.584811210632324, "global_step": 448619, "epoch": 2670} {"train_loss": -11.66218376159668, "global_step": 448620, "epoch": 2670} {"train_loss": -12.129434585571289, "global_step": 448621, "epoch": 2670} {"train_loss": -11.763283729553223, "global_step": 448622, "epoch": 2670} {"train_loss": -11.404458999633789, "global_step": 448623, "epoch": 2670} {"train_loss": -12.669305801391602, "global_step": 448624, "epoch": 2670} {"train_loss": -11.728386878967285, "global_step": 448625, "epoch": 2670} {"train_loss": -12.545244216918945, "global_step": 448626, "epoch": 2670} {"train_loss": -12.389405250549316, "global_step": 448627, "epoch": 2670} {"train_loss": -12.665142059326172, "global_step": 448628, "epoch": 2670} {"train_loss": -12.528547286987305, "global_step": 448629, "epoch": 2670} {"train_loss": -12.502252578735352, "global_step": 448630, "epoch": 2670} {"train_loss": -12.678318977355957, "global_step": 448631, "epoch": 2670} {"train_loss": -12.40185546875, "global_step": 448632, "epoch": 2670} {"train_loss": -12.603038787841797, "global_step": 448633, "epoch": 2670} {"train_loss": -12.513477325439453, "global_step": 448634, "epoch": 2670} {"train_loss": -12.76481819152832, "global_step": 448635, "epoch": 2670} {"train_loss": -12.52507209777832, "global_step": 448636, "epoch": 2670} {"train_loss": -12.572678565979004, "global_step": 448637, "epoch": 2670} {"train_loss": -12.645172119140625, "global_step": 448638, "epoch": 2670} {"train_loss": -12.198083877563477, "global_step": 448639, "epoch": 2670} {"train_loss": -12.867146492004395, "global_step": 448640, "epoch": 2670} {"train_loss": -12.551210403442383, "global_step": 448641, "epoch": 2670} {"train_loss": -12.914688110351562, "global_step": 448642, "epoch": 2670} {"train_loss": -12.600379943847656, "global_step": 448643, "epoch": 2670} {"train_loss": -12.523309707641602, "global_step": 448644, "epoch": 2670} {"train_loss": -12.655766487121582, "global_step": 448645, "epoch": 2670} {"train_loss": -12.656990051269531, "global_step": 448646, "epoch": 2670} {"train_loss": -12.819568634033203, "global_step": 448647, "epoch": 2670} {"train_loss": -12.50802230834961, "global_step": 448648, "epoch": 2670} {"train_loss": -12.62137508392334, "global_step": 448649, "epoch": 2670} {"train_loss": -12.687992095947266, "global_step": 448650, "epoch": 2670} {"train_loss": -12.195113182067871, "global_step": 448651, "epoch": 2670} {"train_loss": -12.085748672485352, "global_step": 448652, "epoch": 2670} {"train_loss": -12.440698623657227, "global_step": 448653, "epoch": 2670} {"train_loss": -12.313488006591797, "global_step": 448654, "epoch": 2670} {"train_loss": -11.438344955444336, "global_step": 448655, "epoch": 2670} {"train_loss": -11.914794921875, "global_step": 448656, "epoch": 2670} {"train_loss": -11.242083549499512, "global_step": 448657, "epoch": 2670} {"train_loss": -12.30034351348877, "global_step": 448658, "epoch": 2670} {"train_loss": -11.803503036499023, "global_step": 448659, "epoch": 2670} {"train_loss": -12.146320343017578, "global_step": 448660, "epoch": 2670} {"train_loss": -12.189476013183594, "global_step": 448661, "epoch": 2670} {"train_loss": -11.305604934692383, "global_step": 448662, "epoch": 2670} {"train_loss": -11.720382690429688, "global_step": 448663, "epoch": 2670} {"train_loss": -11.663679122924805, "global_step": 448664, "epoch": 2670} {"train_loss": -12.286355018615723, "global_step": 448665, "epoch": 2670} {"train_loss": -12.075265884399414, "global_step": 448666, "epoch": 2670} {"train_loss": -12.192727088928223, "global_step": 448667, "epoch": 2670} {"train_loss": -11.881156921386719, "global_step": 448668, "epoch": 2670} {"train_loss": -11.616684913635254, "global_step": 448669, "epoch": 2670} {"train_loss": -12.571293830871582, "global_step": 448670, "epoch": 2670} {"train_loss": -11.679221153259277, "global_step": 448671, "epoch": 2670} {"train_loss": -12.046306610107422, "global_step": 448672, "epoch": 2670} {"train_loss": -11.641108512878418, "global_step": 448673, "epoch": 2670} {"train_loss": -12.278173446655273, "global_step": 448674, "epoch": 2670} {"train_loss": -12.493817329406738, "global_step": 448675, "epoch": 2670} {"train_loss": -12.109209060668945, "global_step": 448676, "epoch": 2670} {"train_loss": -12.282125473022461, "global_step": 448677, "epoch": 2670} {"train_loss": -12.759814262390137, "global_step": 448678, "epoch": 2670} {"train_loss": -12.200973510742188, "global_step": 448679, "epoch": 2670} {"train_loss": -12.027189254760742, "global_step": 448680, "epoch": 2670} {"train_loss": -12.080053329467773, "global_step": 448681, "epoch": 2670} {"train_loss": -12.898696899414062, "global_step": 448682, "epoch": 2670} {"train_loss": -12.444780349731445, "global_step": 448683, "epoch": 2670} {"train_loss": -12.155224800109863, "global_step": 448684, "epoch": 2670} {"train_loss": -12.639979362487793, "global_step": 448685, "epoch": 2670} {"train_loss": -12.430282592773438, "global_step": 448686, "epoch": 2670} {"train_loss": -12.038662910461426, "global_step": 448687, "epoch": 2670} {"train_loss": -12.501119613647461, "global_step": 448688, "epoch": 2670} {"train_loss": -12.380789756774902, "global_step": 448689, "epoch": 2670} {"train_loss": -12.195510864257812, "global_step": 448690, "epoch": 2670} {"train_loss": -12.508646965026855, "global_step": 448691, "epoch": 2670} {"train_loss": -12.143211364746094, "global_step": 448692, "epoch": 2670} {"train_loss": -12.323341369628906, "global_step": 448693, "epoch": 2670} {"train_loss": -11.967917442321777, "global_step": 448694, "epoch": 2670} {"train_loss": -12.428494453430176, "global_step": 448695, "epoch": 2670} {"train_loss": -11.218994140625, "global_step": 448696, "epoch": 2670} {"train_loss": -12.698936462402344, "global_step": 448697, "epoch": 2670} {"train_loss": -12.286531448364258, "global_step": 448698, "epoch": 2670} {"train_loss": -12.37021255493164, "global_step": 448699, "epoch": 2670} {"train_loss": -12.519012451171875, "global_step": 448700, "epoch": 2670} {"train_loss": -12.125871658325195, "global_step": 448701, "epoch": 2670} {"train_loss": -12.532327651977539, "global_step": 448702, "epoch": 2670} {"train_loss": -11.9585542678833, "global_step": 448703, "epoch": 2670} {"train_loss": -12.592934608459473, "global_step": 448704, "epoch": 2670} {"train_loss": -12.05798053741455, "global_step": 448705, "epoch": 2670} {"train_loss": -12.61080265045166, "global_step": 448706, "epoch": 2670} {"train_loss": -11.900574684143066, "global_step": 448707, "epoch": 2670} {"train_loss": -12.334171295166016, "global_step": 448708, "epoch": 2670} {"train_loss": -11.98575210571289, "global_step": 448709, "epoch": 2670} {"train_loss": -11.301362991333008, "global_step": 448710, "epoch": 2670} {"train_loss": -12.089133262634277, "global_step": 448711, "epoch": 2670} {"train_loss": -12.319953918457031, "global_step": 448712, "epoch": 2670} {"train_loss": -11.70456600189209, "global_step": 448713, "epoch": 2670} {"train_loss": -12.759635925292969, "global_step": 448714, "epoch": 2670} {"train_loss": -11.703392028808594, "global_step": 448715, "epoch": 2670} {"train_loss": -12.274151802062988, "global_step": 448716, "epoch": 2670} {"train_loss": -12.34834098815918, "global_step": 448717, "epoch": 2670} {"train_loss": -12.343181610107422, "global_step": 448718, "epoch": 2670} {"train_loss": -12.098655700683594, "global_step": 448719, "epoch": 2670} {"train_loss": -12.299331665039062, "global_step": 448720, "epoch": 2670} {"train_loss": -10.70655632019043, "global_step": 448721, "epoch": 2670} {"train_loss": -12.164578437805176, "global_step": 448722, "epoch": 2670} {"train_loss": -11.705286979675293, "global_step": 448723, "epoch": 2670} {"train_loss": -10.829463958740234, "global_step": 448724, "epoch": 2670} {"train_loss": -12.39204216003418, "global_step": 448725, "epoch": 2670} {"train_loss": -10.820959091186523, "global_step": 448726, "epoch": 2670} {"train_loss": -12.227979546501523, "global_step": 448727, "epoch": 2670, "val_loss": 313567.9375, "train_action_mse_error": 1.181621789932251} {"train_loss": -10.116533279418945, "global_step": 448728, "epoch": 2671} {"train_loss": -11.940324783325195, "global_step": 448729, "epoch": 2671} {"train_loss": -10.7178955078125, "global_step": 448730, "epoch": 2671} {"train_loss": -11.427446365356445, "global_step": 448731, "epoch": 2671} {"train_loss": -10.77642822265625, "global_step": 448732, "epoch": 2671} {"train_loss": -11.692231178283691, "global_step": 448733, "epoch": 2671} {"train_loss": -11.352840423583984, "global_step": 448734, "epoch": 2671} {"train_loss": -11.016898155212402, "global_step": 448735, "epoch": 2671} {"train_loss": -11.805448532104492, "global_step": 448736, "epoch": 2671} {"train_loss": -9.405440330505371, "global_step": 448737, "epoch": 2671} {"train_loss": -11.142033576965332, "global_step": 448738, "epoch": 2671} {"train_loss": -9.94129753112793, "global_step": 448739, "epoch": 2671} {"train_loss": -11.548747062683105, "global_step": 448740, "epoch": 2671} {"train_loss": -9.793739318847656, "global_step": 448741, "epoch": 2671} {"train_loss": -10.904905319213867, "global_step": 448742, "epoch": 2671} {"train_loss": -9.576778411865234, "global_step": 448743, "epoch": 2671} {"train_loss": -7.744852066040039, "global_step": 448744, "epoch": 2671} {"train_loss": -9.506136894226074, "global_step": 448745, "epoch": 2671} {"train_loss": -8.856411933898926, "global_step": 448746, "epoch": 2671} {"train_loss": -11.091598510742188, "global_step": 448747, "epoch": 2671} {"train_loss": -8.865760803222656, "global_step": 448748, "epoch": 2671} {"train_loss": -10.227736473083496, "global_step": 448749, "epoch": 2671} {"train_loss": -9.294027328491211, "global_step": 448750, "epoch": 2671} {"train_loss": -9.465991973876953, "global_step": 448751, "epoch": 2671} {"train_loss": -8.430561065673828, "global_step": 448752, "epoch": 2671} {"train_loss": -10.210697174072266, "global_step": 448753, "epoch": 2671} {"train_loss": -10.291622161865234, "global_step": 448754, "epoch": 2671} {"train_loss": -7.895077705383301, "global_step": 448755, "epoch": 2671} {"train_loss": -9.905372619628906, "global_step": 448756, "epoch": 2671} {"train_loss": -9.877168655395508, "global_step": 448757, "epoch": 2671} {"train_loss": -9.177845001220703, "global_step": 448758, "epoch": 2671} {"train_loss": -8.394290924072266, "global_step": 448759, "epoch": 2671} {"train_loss": -9.840093612670898, "global_step": 448760, "epoch": 2671} {"train_loss": -10.998662948608398, "global_step": 448761, "epoch": 2671} {"train_loss": -10.378556251525879, "global_step": 448762, "epoch": 2671} {"train_loss": -9.7030668258667, "global_step": 448763, "epoch": 2671} {"train_loss": -10.031462669372559, "global_step": 448764, "epoch": 2671} {"train_loss": -11.155645370483398, "global_step": 448765, "epoch": 2671} {"train_loss": -10.54666519165039, "global_step": 448766, "epoch": 2671} {"train_loss": -11.493400573730469, "global_step": 448767, "epoch": 2671} {"train_loss": -11.295140266418457, "global_step": 448768, "epoch": 2671} {"train_loss": -11.11953067779541, "global_step": 448769, "epoch": 2671} {"train_loss": -11.669498443603516, "global_step": 448770, "epoch": 2671} {"train_loss": -11.557172775268555, "global_step": 448771, "epoch": 2671} {"train_loss": -11.330093383789062, "global_step": 448772, "epoch": 2671} {"train_loss": -11.595208168029785, "global_step": 448773, "epoch": 2671} {"train_loss": -11.948883056640625, "global_step": 448774, "epoch": 2671} {"train_loss": -11.353046417236328, "global_step": 448775, "epoch": 2671} {"train_loss": -11.951108932495117, "global_step": 448776, "epoch": 2671} {"train_loss": -11.789778709411621, "global_step": 448777, "epoch": 2671} {"train_loss": -11.992470741271973, "global_step": 448778, "epoch": 2671} {"train_loss": -11.903376579284668, "global_step": 448779, "epoch": 2671} {"train_loss": -12.181266784667969, "global_step": 448780, "epoch": 2671} {"train_loss": -11.892827987670898, "global_step": 448781, "epoch": 2671} {"train_loss": -11.803712844848633, "global_step": 448782, "epoch": 2671} {"train_loss": -12.154382705688477, "global_step": 448783, "epoch": 2671} {"train_loss": -11.84157943725586, "global_step": 448784, "epoch": 2671} {"train_loss": -12.300750732421875, "global_step": 448785, "epoch": 2671} {"train_loss": -12.242510795593262, "global_step": 448786, "epoch": 2671} {"train_loss": -12.122779846191406, "global_step": 448787, "epoch": 2671} {"train_loss": -12.156217575073242, "global_step": 448788, "epoch": 2671} {"train_loss": -12.190828323364258, "global_step": 448789, "epoch": 2671} {"train_loss": -12.385805130004883, "global_step": 448790, "epoch": 2671} {"train_loss": -12.429567337036133, "global_step": 448791, "epoch": 2671} {"train_loss": -12.19066333770752, "global_step": 448792, "epoch": 2671} {"train_loss": -12.304482460021973, "global_step": 448793, "epoch": 2671} {"train_loss": -12.25007438659668, "global_step": 448794, "epoch": 2671} {"train_loss": -12.312641143798828, "global_step": 448795, "epoch": 2671} {"train_loss": -12.436134338378906, "global_step": 448796, "epoch": 2671} {"train_loss": -12.37679672241211, "global_step": 448797, "epoch": 2671} {"train_loss": -12.46009635925293, "global_step": 448798, "epoch": 2671} {"train_loss": -12.15652847290039, "global_step": 448799, "epoch": 2671} {"train_loss": -12.391884803771973, "global_step": 448800, "epoch": 2671} {"train_loss": -12.328914642333984, "global_step": 448801, "epoch": 2671} {"train_loss": -12.40024185180664, "global_step": 448802, "epoch": 2671} {"train_loss": -12.513711929321289, "global_step": 448803, "epoch": 2671} {"train_loss": -12.276508331298828, "global_step": 448804, "epoch": 2671} {"train_loss": -12.560890197753906, "global_step": 448805, "epoch": 2671} {"train_loss": -12.377828598022461, "global_step": 448806, "epoch": 2671} {"train_loss": -12.418338775634766, "global_step": 448807, "epoch": 2671} {"train_loss": -12.645477294921875, "global_step": 448808, "epoch": 2671} {"train_loss": -12.466222763061523, "global_step": 448809, "epoch": 2671} {"train_loss": -12.528070449829102, "global_step": 448810, "epoch": 2671} {"train_loss": -12.25428581237793, "global_step": 448811, "epoch": 2671} {"train_loss": -12.488409042358398, "global_step": 448812, "epoch": 2671} {"train_loss": -12.589069366455078, "global_step": 448813, "epoch": 2671} {"train_loss": -12.567094802856445, "global_step": 448814, "epoch": 2671} {"train_loss": -12.614097595214844, "global_step": 448815, "epoch": 2671} {"train_loss": -12.472084045410156, "global_step": 448816, "epoch": 2671} {"train_loss": -12.697530746459961, "global_step": 448817, "epoch": 2671} {"train_loss": -12.728686332702637, "global_step": 448818, "epoch": 2671} {"train_loss": -12.674260139465332, "global_step": 448819, "epoch": 2671} {"train_loss": -12.79658031463623, "global_step": 448820, "epoch": 2671} {"train_loss": -12.585912704467773, "global_step": 448821, "epoch": 2671} {"train_loss": -12.532930374145508, "global_step": 448822, "epoch": 2671} {"train_loss": -12.738605499267578, "global_step": 448823, "epoch": 2671} {"train_loss": -12.921772956848145, "global_step": 448824, "epoch": 2671} {"train_loss": -12.64023494720459, "global_step": 448825, "epoch": 2671} {"train_loss": -12.661952018737793, "global_step": 448826, "epoch": 2671} {"train_loss": -12.627775192260742, "global_step": 448827, "epoch": 2671} {"train_loss": -12.764667510986328, "global_step": 448828, "epoch": 2671} {"train_loss": -12.647387504577637, "global_step": 448829, "epoch": 2671} {"train_loss": -12.61379623413086, "global_step": 448830, "epoch": 2671} {"train_loss": -12.732151985168457, "global_step": 448831, "epoch": 2671} {"train_loss": -12.654876708984375, "global_step": 448832, "epoch": 2671} {"train_loss": -12.681427001953125, "global_step": 448833, "epoch": 2671} {"train_loss": -12.624298095703125, "global_step": 448834, "epoch": 2671} {"train_loss": -12.597638130187988, "global_step": 448835, "epoch": 2671} {"train_loss": -12.739043235778809, "global_step": 448836, "epoch": 2671} {"train_loss": -12.734052658081055, "global_step": 448837, "epoch": 2671} {"train_loss": -12.770310401916504, "global_step": 448838, "epoch": 2671} {"train_loss": -12.730537414550781, "global_step": 448839, "epoch": 2671} {"train_loss": -12.951942443847656, "global_step": 448840, "epoch": 2671} {"train_loss": -12.81568717956543, "global_step": 448841, "epoch": 2671} {"train_loss": -12.891533851623535, "global_step": 448842, "epoch": 2671} {"train_loss": -12.754462242126465, "global_step": 448843, "epoch": 2671} {"train_loss": -12.808805465698242, "global_step": 448844, "epoch": 2671} {"train_loss": -12.62525749206543, "global_step": 448845, "epoch": 2671} {"train_loss": -12.83746337890625, "global_step": 448846, "epoch": 2671} {"train_loss": -12.656929016113281, "global_step": 448847, "epoch": 2671} {"train_loss": -12.898200035095215, "global_step": 448848, "epoch": 2671} {"train_loss": -12.566028594970703, "global_step": 448849, "epoch": 2671} {"train_loss": -12.726978302001953, "global_step": 448850, "epoch": 2671} {"train_loss": -12.82441520690918, "global_step": 448851, "epoch": 2671} {"train_loss": -12.482463836669922, "global_step": 448852, "epoch": 2671} {"train_loss": -12.732963562011719, "global_step": 448853, "epoch": 2671} {"train_loss": -12.660757064819336, "global_step": 448854, "epoch": 2671} {"train_loss": -12.448720932006836, "global_step": 448855, "epoch": 2671} {"train_loss": -12.858402252197266, "global_step": 448856, "epoch": 2671} {"train_loss": -12.651325225830078, "global_step": 448857, "epoch": 2671} {"train_loss": -12.804161071777344, "global_step": 448858, "epoch": 2671} {"train_loss": -12.716567993164062, "global_step": 448859, "epoch": 2671} {"train_loss": -12.910956382751465, "global_step": 448860, "epoch": 2671} {"train_loss": -12.814994812011719, "global_step": 448861, "epoch": 2671} {"train_loss": -12.977080345153809, "global_step": 448862, "epoch": 2671} {"train_loss": -12.821163177490234, "global_step": 448863, "epoch": 2671} {"train_loss": -12.63907241821289, "global_step": 448864, "epoch": 2671} {"train_loss": -12.877436637878418, "global_step": 448865, "epoch": 2671} {"train_loss": -12.783111572265625, "global_step": 448866, "epoch": 2671} {"train_loss": -12.933666229248047, "global_step": 448867, "epoch": 2671} {"train_loss": -12.719831466674805, "global_step": 448868, "epoch": 2671} {"train_loss": -12.97768497467041, "global_step": 448869, "epoch": 2671} {"train_loss": -12.685789108276367, "global_step": 448870, "epoch": 2671} {"train_loss": -13.030702590942383, "global_step": 448871, "epoch": 2671} {"train_loss": -12.857364654541016, "global_step": 448872, "epoch": 2671} {"train_loss": -12.747722625732422, "global_step": 448873, "epoch": 2671} {"train_loss": -12.827177047729492, "global_step": 448874, "epoch": 2671} {"train_loss": -12.808433532714844, "global_step": 448875, "epoch": 2671} {"train_loss": -12.884185791015625, "global_step": 448876, "epoch": 2671} {"train_loss": -12.916328430175781, "global_step": 448877, "epoch": 2671} {"train_loss": -12.926949501037598, "global_step": 448878, "epoch": 2671} {"train_loss": -13.059436798095703, "global_step": 448879, "epoch": 2671} {"train_loss": -12.934688568115234, "global_step": 448880, "epoch": 2671} {"train_loss": -12.954795837402344, "global_step": 448881, "epoch": 2671} {"train_loss": -12.614890098571777, "global_step": 448882, "epoch": 2671} {"train_loss": -13.10582447052002, "global_step": 448883, "epoch": 2671} {"train_loss": -12.949743270874023, "global_step": 448884, "epoch": 2671} {"train_loss": -12.689709663391113, "global_step": 448885, "epoch": 2671} {"train_loss": -12.855140686035156, "global_step": 448886, "epoch": 2671} {"train_loss": -12.908203125, "global_step": 448887, "epoch": 2671} {"train_loss": -12.854092597961426, "global_step": 448888, "epoch": 2671} {"train_loss": -12.967679977416992, "global_step": 448889, "epoch": 2671} {"train_loss": -12.776898384094238, "global_step": 448890, "epoch": 2671} {"train_loss": -13.120523452758789, "global_step": 448891, "epoch": 2671} {"train_loss": -12.511544227600098, "global_step": 448892, "epoch": 2671} {"train_loss": -11.536844253540039, "global_step": 448893, "epoch": 2671} {"train_loss": -10.831938743591309, "global_step": 448894, "epoch": 2671} {"train_loss": -11.950697274435134, "global_step": 448895, "epoch": 2671, "val_loss": 313278.46875} {"train_loss": -11.752032279968262, "global_step": 448896, "epoch": 2672} {"train_loss": -12.323553085327148, "global_step": 448897, "epoch": 2672} {"train_loss": -11.299938201904297, "global_step": 448898, "epoch": 2672} {"train_loss": -11.897472381591797, "global_step": 448899, "epoch": 2672} {"train_loss": -10.971875190734863, "global_step": 448900, "epoch": 2672} {"train_loss": -12.015460968017578, "global_step": 448901, "epoch": 2672} {"train_loss": -11.392566680908203, "global_step": 448902, "epoch": 2672} {"train_loss": -10.72989273071289, "global_step": 448903, "epoch": 2672} {"train_loss": -11.472851753234863, "global_step": 448904, "epoch": 2672} {"train_loss": -10.809972763061523, "global_step": 448905, "epoch": 2672} {"train_loss": -11.70622444152832, "global_step": 448906, "epoch": 2672} {"train_loss": -10.48015022277832, "global_step": 448907, "epoch": 2672} {"train_loss": -11.64980697631836, "global_step": 448908, "epoch": 2672} {"train_loss": -12.138256072998047, "global_step": 448909, "epoch": 2672} {"train_loss": -9.871735572814941, "global_step": 448910, "epoch": 2672} {"train_loss": -11.776071548461914, "global_step": 448911, "epoch": 2672} {"train_loss": -9.421957015991211, "global_step": 448912, "epoch": 2672} {"train_loss": -11.420830726623535, "global_step": 448913, "epoch": 2672} {"train_loss": -9.600430488586426, "global_step": 448914, "epoch": 2672} {"train_loss": -11.28183364868164, "global_step": 448915, "epoch": 2672} {"train_loss": -11.642484664916992, "global_step": 448916, "epoch": 2672} {"train_loss": -9.603470802307129, "global_step": 448917, "epoch": 2672} {"train_loss": -11.308277130126953, "global_step": 448918, "epoch": 2672} {"train_loss": -8.933309555053711, "global_step": 448919, "epoch": 2672} {"train_loss": -10.631087303161621, "global_step": 448920, "epoch": 2672} {"train_loss": -10.02122688293457, "global_step": 448921, "epoch": 2672} {"train_loss": -10.263931274414062, "global_step": 448922, "epoch": 2672} {"train_loss": -10.518022537231445, "global_step": 448923, "epoch": 2672} {"train_loss": -11.018684387207031, "global_step": 448924, "epoch": 2672} {"train_loss": -10.746769905090332, "global_step": 448925, "epoch": 2672} {"train_loss": -11.218122482299805, "global_step": 448926, "epoch": 2672} {"train_loss": -10.684757232666016, "global_step": 448927, "epoch": 2672} {"train_loss": -11.087297439575195, "global_step": 448928, "epoch": 2672} {"train_loss": -11.147150039672852, "global_step": 448929, "epoch": 2672} {"train_loss": -11.145868301391602, "global_step": 448930, "epoch": 2672} {"train_loss": -11.320338249206543, "global_step": 448931, "epoch": 2672} {"train_loss": -11.519702911376953, "global_step": 448932, "epoch": 2672} {"train_loss": -11.654966354370117, "global_step": 448933, "epoch": 2672} {"train_loss": -11.89333438873291, "global_step": 448934, "epoch": 2672} {"train_loss": -12.070708274841309, "global_step": 448935, "epoch": 2672} {"train_loss": -11.735639572143555, "global_step": 448936, "epoch": 2672} {"train_loss": -12.160322189331055, "global_step": 448937, "epoch": 2672} {"train_loss": -12.007116317749023, "global_step": 448938, "epoch": 2672} {"train_loss": -12.012821197509766, "global_step": 448939, "epoch": 2672} {"train_loss": -12.077692031860352, "global_step": 448940, "epoch": 2672} {"train_loss": -11.858278274536133, "global_step": 448941, "epoch": 2672} {"train_loss": -12.516338348388672, "global_step": 448942, "epoch": 2672} {"train_loss": -12.042362213134766, "global_step": 448943, "epoch": 2672} {"train_loss": -12.212058067321777, "global_step": 448944, "epoch": 2672} {"train_loss": -12.234576225280762, "global_step": 448945, "epoch": 2672} {"train_loss": -12.251893997192383, "global_step": 448946, "epoch": 2672} {"train_loss": -12.311132431030273, "global_step": 448947, "epoch": 2672} {"train_loss": -12.345719337463379, "global_step": 448948, "epoch": 2672} {"train_loss": -12.159875869750977, "global_step": 448949, "epoch": 2672} {"train_loss": -12.283102035522461, "global_step": 448950, "epoch": 2672} {"train_loss": -12.508382797241211, "global_step": 448951, "epoch": 2672} {"train_loss": -12.412792205810547, "global_step": 448952, "epoch": 2672} {"train_loss": -12.413589477539062, "global_step": 448953, "epoch": 2672} {"train_loss": -12.547125816345215, "global_step": 448954, "epoch": 2672} {"train_loss": -12.6276216506958, "global_step": 448955, "epoch": 2672} {"train_loss": -12.473827362060547, "global_step": 448956, "epoch": 2672} {"train_loss": -12.39320182800293, "global_step": 448957, "epoch": 2672} {"train_loss": -12.147455215454102, "global_step": 448958, "epoch": 2672} {"train_loss": -12.492136001586914, "global_step": 448959, "epoch": 2672} {"train_loss": -12.50955867767334, "global_step": 448960, "epoch": 2672} {"train_loss": -12.345307350158691, "global_step": 448961, "epoch": 2672} {"train_loss": -12.545780181884766, "global_step": 448962, "epoch": 2672} {"train_loss": -12.297318458557129, "global_step": 448963, "epoch": 2672} {"train_loss": -12.658891677856445, "global_step": 448964, "epoch": 2672} {"train_loss": -12.507806777954102, "global_step": 448965, "epoch": 2672} {"train_loss": -12.478745460510254, "global_step": 448966, "epoch": 2672} {"train_loss": -12.613605499267578, "global_step": 448967, "epoch": 2672} {"train_loss": -12.711518287658691, "global_step": 448968, "epoch": 2672} {"train_loss": -12.704904556274414, "global_step": 448969, "epoch": 2672} {"train_loss": -12.516357421875, "global_step": 448970, "epoch": 2672} {"train_loss": -12.62443733215332, "global_step": 448971, "epoch": 2672} {"train_loss": -12.694175720214844, "global_step": 448972, "epoch": 2672} {"train_loss": -12.562498092651367, "global_step": 448973, "epoch": 2672} {"train_loss": -12.64773941040039, "global_step": 448974, "epoch": 2672} {"train_loss": -12.454058647155762, "global_step": 448975, "epoch": 2672} {"train_loss": -12.525228500366211, "global_step": 448976, "epoch": 2672} {"train_loss": -12.520121574401855, "global_step": 448977, "epoch": 2672} {"train_loss": -12.447100639343262, "global_step": 448978, "epoch": 2672} {"train_loss": -12.67361831665039, "global_step": 448979, "epoch": 2672} {"train_loss": -12.571367263793945, "global_step": 448980, "epoch": 2672} {"train_loss": -12.532205581665039, "global_step": 448981, "epoch": 2672} {"train_loss": -12.610482215881348, "global_step": 448982, "epoch": 2672} {"train_loss": -12.022772789001465, "global_step": 448983, "epoch": 2672} {"train_loss": -12.389410018920898, "global_step": 448984, "epoch": 2672} {"train_loss": -12.509885787963867, "global_step": 448985, "epoch": 2672} {"train_loss": -12.017333984375, "global_step": 448986, "epoch": 2672} {"train_loss": -12.498360633850098, "global_step": 448987, "epoch": 2672} {"train_loss": -11.76755142211914, "global_step": 448988, "epoch": 2672} {"train_loss": -11.867648124694824, "global_step": 448989, "epoch": 2672} {"train_loss": -11.448445320129395, "global_step": 448990, "epoch": 2672} {"train_loss": -11.666708946228027, "global_step": 448991, "epoch": 2672} {"train_loss": -11.569109916687012, "global_step": 448992, "epoch": 2672} {"train_loss": -10.273008346557617, "global_step": 448993, "epoch": 2672} {"train_loss": -12.287530899047852, "global_step": 448994, "epoch": 2672} {"train_loss": -10.267536163330078, "global_step": 448995, "epoch": 2672} {"train_loss": -9.725908279418945, "global_step": 448996, "epoch": 2672} {"train_loss": -10.93118667602539, "global_step": 448997, "epoch": 2672} {"train_loss": -12.14289665222168, "global_step": 448998, "epoch": 2672} {"train_loss": -9.856070518493652, "global_step": 448999, "epoch": 2672} {"train_loss": -11.181575775146484, "global_step": 449000, "epoch": 2672} {"train_loss": -10.506792068481445, "global_step": 449001, "epoch": 2672} {"train_loss": -9.897523880004883, "global_step": 449002, "epoch": 2672} {"train_loss": -11.579425811767578, "global_step": 449003, "epoch": 2672} {"train_loss": -10.25112533569336, "global_step": 449004, "epoch": 2672} {"train_loss": -11.000608444213867, "global_step": 449005, "epoch": 2672} {"train_loss": -10.90498161315918, "global_step": 449006, "epoch": 2672} {"train_loss": -10.592998504638672, "global_step": 449007, "epoch": 2672} {"train_loss": -11.039056777954102, "global_step": 449008, "epoch": 2672} {"train_loss": -11.825153350830078, "global_step": 449009, "epoch": 2672} {"train_loss": -10.647510528564453, "global_step": 449010, "epoch": 2672} {"train_loss": -11.895646095275879, "global_step": 449011, "epoch": 2672} {"train_loss": -10.742053985595703, "global_step": 449012, "epoch": 2672} {"train_loss": -10.868766784667969, "global_step": 449013, "epoch": 2672} {"train_loss": -12.046728134155273, "global_step": 449014, "epoch": 2672} {"train_loss": -11.321455001831055, "global_step": 449015, "epoch": 2672} {"train_loss": -11.306070327758789, "global_step": 449016, "epoch": 2672} {"train_loss": -11.657597541809082, "global_step": 449017, "epoch": 2672} {"train_loss": -11.22603702545166, "global_step": 449018, "epoch": 2672} {"train_loss": -12.177885055541992, "global_step": 449019, "epoch": 2672} {"train_loss": -11.07928466796875, "global_step": 449020, "epoch": 2672} {"train_loss": -11.906192779541016, "global_step": 449021, "epoch": 2672} {"train_loss": -11.537364959716797, "global_step": 449022, "epoch": 2672} {"train_loss": -11.524169921875, "global_step": 449023, "epoch": 2672} {"train_loss": -11.842344284057617, "global_step": 449024, "epoch": 2672} {"train_loss": -12.112934112548828, "global_step": 449025, "epoch": 2672} {"train_loss": -11.887996673583984, "global_step": 449026, "epoch": 2672} {"train_loss": -12.270217895507812, "global_step": 449027, "epoch": 2672} {"train_loss": -11.77524185180664, "global_step": 449028, "epoch": 2672} {"train_loss": -12.265678405761719, "global_step": 449029, "epoch": 2672} {"train_loss": -12.085715293884277, "global_step": 449030, "epoch": 2672} {"train_loss": -12.211149215698242, "global_step": 449031, "epoch": 2672} {"train_loss": -12.058293342590332, "global_step": 449032, "epoch": 2672} {"train_loss": -12.04850959777832, "global_step": 449033, "epoch": 2672} {"train_loss": -11.935001373291016, "global_step": 449034, "epoch": 2672} {"train_loss": -12.138640403747559, "global_step": 449035, "epoch": 2672} {"train_loss": -11.714588165283203, "global_step": 449036, "epoch": 2672} {"train_loss": -12.426278114318848, "global_step": 449037, "epoch": 2672} {"train_loss": -11.521339416503906, "global_step": 449038, "epoch": 2672} {"train_loss": -12.522214889526367, "global_step": 449039, "epoch": 2672} {"train_loss": -12.158062934875488, "global_step": 449040, "epoch": 2672} {"train_loss": -12.063533782958984, "global_step": 449041, "epoch": 2672} {"train_loss": -12.521478652954102, "global_step": 449042, "epoch": 2672} {"train_loss": -12.500606536865234, "global_step": 449043, "epoch": 2672} {"train_loss": -12.3257474899292, "global_step": 449044, "epoch": 2672} {"train_loss": -12.52855110168457, "global_step": 449045, "epoch": 2672} {"train_loss": -12.236383438110352, "global_step": 449046, "epoch": 2672} {"train_loss": -12.76353645324707, "global_step": 449047, "epoch": 2672} {"train_loss": -12.452539443969727, "global_step": 449048, "epoch": 2672} {"train_loss": -12.741701126098633, "global_step": 449049, "epoch": 2672} {"train_loss": -12.722946166992188, "global_step": 449050, "epoch": 2672} {"train_loss": -12.483343124389648, "global_step": 449051, "epoch": 2672} {"train_loss": -12.392779350280762, "global_step": 449052, "epoch": 2672} {"train_loss": -12.54953670501709, "global_step": 449053, "epoch": 2672} {"train_loss": -12.714418411254883, "global_step": 449054, "epoch": 2672} {"train_loss": -12.413482666015625, "global_step": 449055, "epoch": 2672} {"train_loss": -12.542974472045898, "global_step": 449056, "epoch": 2672} {"train_loss": -12.585541725158691, "global_step": 449057, "epoch": 2672} {"train_loss": -12.776018142700195, "global_step": 449058, "epoch": 2672} {"train_loss": -12.557764053344727, "global_step": 449059, "epoch": 2672} {"train_loss": -12.533267974853516, "global_step": 449060, "epoch": 2672} {"train_loss": -12.480062484741211, "global_step": 449061, "epoch": 2672} {"train_loss": -12.505768775939941, "global_step": 449062, "epoch": 2672} {"train_loss": -11.798456941332136, "global_step": 449063, "epoch": 2672, "val_loss": 308388.46875} {"train_loss": -12.523538589477539, "global_step": 449064, "epoch": 2673} {"train_loss": -12.401912689208984, "global_step": 449065, "epoch": 2673} {"train_loss": -12.504814147949219, "global_step": 449066, "epoch": 2673} {"train_loss": -12.464529037475586, "global_step": 449067, "epoch": 2673} {"train_loss": -12.119427680969238, "global_step": 449068, "epoch": 2673} {"train_loss": -12.26534652709961, "global_step": 449069, "epoch": 2673} {"train_loss": -12.176453590393066, "global_step": 449070, "epoch": 2673} {"train_loss": -11.712822914123535, "global_step": 449071, "epoch": 2673} {"train_loss": -12.346964836120605, "global_step": 449072, "epoch": 2673} {"train_loss": -12.017143249511719, "global_step": 449073, "epoch": 2673} {"train_loss": -10.835250854492188, "global_step": 449074, "epoch": 2673} {"train_loss": -12.23065185546875, "global_step": 449075, "epoch": 2673} {"train_loss": -10.686649322509766, "global_step": 449076, "epoch": 2673} {"train_loss": -11.117088317871094, "global_step": 449077, "epoch": 2673} {"train_loss": -12.230260848999023, "global_step": 449078, "epoch": 2673} {"train_loss": -10.766075134277344, "global_step": 449079, "epoch": 2673} {"train_loss": -11.982769966125488, "global_step": 449080, "epoch": 2673} {"train_loss": -11.289127349853516, "global_step": 449081, "epoch": 2673} {"train_loss": -11.327079772949219, "global_step": 449082, "epoch": 2673} {"train_loss": -11.847513198852539, "global_step": 449083, "epoch": 2673} {"train_loss": -10.783699035644531, "global_step": 449084, "epoch": 2673} {"train_loss": -11.077642440795898, "global_step": 449085, "epoch": 2673} {"train_loss": -11.04499626159668, "global_step": 449086, "epoch": 2673} {"train_loss": -10.766114234924316, "global_step": 449087, "epoch": 2673} {"train_loss": -11.101629257202148, "global_step": 449088, "epoch": 2673} {"train_loss": -11.606292724609375, "global_step": 449089, "epoch": 2673} {"train_loss": -11.175326347351074, "global_step": 449090, "epoch": 2673} {"train_loss": -11.42827033996582, "global_step": 449091, "epoch": 2673} {"train_loss": -11.39532470703125, "global_step": 449092, "epoch": 2673} {"train_loss": -11.444792747497559, "global_step": 449093, "epoch": 2673} {"train_loss": -12.330456733703613, "global_step": 449094, "epoch": 2673} {"train_loss": -11.787483215332031, "global_step": 449095, "epoch": 2673} {"train_loss": -11.879508972167969, "global_step": 449096, "epoch": 2673} {"train_loss": -12.093685150146484, "global_step": 449097, "epoch": 2673} {"train_loss": -11.611637115478516, "global_step": 449098, "epoch": 2673} {"train_loss": -12.321840286254883, "global_step": 449099, "epoch": 2673} {"train_loss": -11.840633392333984, "global_step": 449100, "epoch": 2673} {"train_loss": -12.373331069946289, "global_step": 449101, "epoch": 2673} {"train_loss": -12.032692909240723, "global_step": 449102, "epoch": 2673} {"train_loss": -12.069526672363281, "global_step": 449103, "epoch": 2673} {"train_loss": -12.36562442779541, "global_step": 449104, "epoch": 2673} {"train_loss": -12.128374099731445, "global_step": 449105, "epoch": 2673} {"train_loss": -12.328069686889648, "global_step": 449106, "epoch": 2673} {"train_loss": -12.05925464630127, "global_step": 449107, "epoch": 2673} {"train_loss": -12.045371055603027, "global_step": 449108, "epoch": 2673} {"train_loss": -12.460558891296387, "global_step": 449109, "epoch": 2673} {"train_loss": -12.185444831848145, "global_step": 449110, "epoch": 2673} {"train_loss": -12.473312377929688, "global_step": 449111, "epoch": 2673} {"train_loss": -12.181224822998047, "global_step": 449112, "epoch": 2673} {"train_loss": -12.482797622680664, "global_step": 449113, "epoch": 2673} {"train_loss": -12.48408317565918, "global_step": 449114, "epoch": 2673} {"train_loss": -12.490095138549805, "global_step": 449115, "epoch": 2673} {"train_loss": -12.391372680664062, "global_step": 449116, "epoch": 2673} {"train_loss": -12.605880737304688, "global_step": 449117, "epoch": 2673} {"train_loss": -12.327934265136719, "global_step": 449118, "epoch": 2673} {"train_loss": -12.488992691040039, "global_step": 449119, "epoch": 2673} {"train_loss": -12.417956352233887, "global_step": 449120, "epoch": 2673} {"train_loss": -12.503643035888672, "global_step": 449121, "epoch": 2673} {"train_loss": -12.588136672973633, "global_step": 449122, "epoch": 2673} {"train_loss": -12.538910865783691, "global_step": 449123, "epoch": 2673} {"train_loss": -12.547586441040039, "global_step": 449124, "epoch": 2673} {"train_loss": -12.432361602783203, "global_step": 449125, "epoch": 2673} {"train_loss": -12.361407279968262, "global_step": 449126, "epoch": 2673} {"train_loss": -12.351624488830566, "global_step": 449127, "epoch": 2673} {"train_loss": -12.493947982788086, "global_step": 449128, "epoch": 2673} {"train_loss": -12.404783248901367, "global_step": 449129, "epoch": 2673} {"train_loss": -12.517393112182617, "global_step": 449130, "epoch": 2673} {"train_loss": -12.435513496398926, "global_step": 449131, "epoch": 2673} {"train_loss": -12.378605842590332, "global_step": 449132, "epoch": 2673} {"train_loss": -12.383041381835938, "global_step": 449133, "epoch": 2673} {"train_loss": -12.560784339904785, "global_step": 449134, "epoch": 2673} {"train_loss": -12.598928451538086, "global_step": 449135, "epoch": 2673} {"train_loss": -12.33914852142334, "global_step": 449136, "epoch": 2673} {"train_loss": -12.509188652038574, "global_step": 449137, "epoch": 2673} {"train_loss": -12.510437965393066, "global_step": 449138, "epoch": 2673} {"train_loss": -12.510824203491211, "global_step": 449139, "epoch": 2673} {"train_loss": -12.511640548706055, "global_step": 449140, "epoch": 2673} {"train_loss": -12.434826850891113, "global_step": 449141, "epoch": 2673} {"train_loss": -12.71555233001709, "global_step": 449142, "epoch": 2673} {"train_loss": -12.354415893554688, "global_step": 449143, "epoch": 2673} {"train_loss": -12.724882125854492, "global_step": 449144, "epoch": 2673} {"train_loss": -12.341222763061523, "global_step": 449145, "epoch": 2673} {"train_loss": -12.696548461914062, "global_step": 449146, "epoch": 2673} {"train_loss": -12.616765975952148, "global_step": 449147, "epoch": 2673} {"train_loss": -12.805851936340332, "global_step": 449148, "epoch": 2673} {"train_loss": -12.469793319702148, "global_step": 449149, "epoch": 2673} {"train_loss": -12.765746116638184, "global_step": 449150, "epoch": 2673} {"train_loss": -12.770763397216797, "global_step": 449151, "epoch": 2673} {"train_loss": -12.691892623901367, "global_step": 449152, "epoch": 2673} {"train_loss": -12.789161682128906, "global_step": 449153, "epoch": 2673} {"train_loss": -12.8424654006958, "global_step": 449154, "epoch": 2673} {"train_loss": -12.562010765075684, "global_step": 449155, "epoch": 2673} {"train_loss": -12.800058364868164, "global_step": 449156, "epoch": 2673} {"train_loss": -12.918160438537598, "global_step": 449157, "epoch": 2673} {"train_loss": -12.735517501831055, "global_step": 449158, "epoch": 2673} {"train_loss": -12.981160163879395, "global_step": 449159, "epoch": 2673} {"train_loss": -12.944964408874512, "global_step": 449160, "epoch": 2673} {"train_loss": -13.013010025024414, "global_step": 449161, "epoch": 2673} {"train_loss": -12.948290824890137, "global_step": 449162, "epoch": 2673} {"train_loss": -13.013961791992188, "global_step": 449163, "epoch": 2673} {"train_loss": -12.893363952636719, "global_step": 449164, "epoch": 2673} {"train_loss": -12.72980785369873, "global_step": 449165, "epoch": 2673} {"train_loss": -12.834478378295898, "global_step": 449166, "epoch": 2673} {"train_loss": -12.9546480178833, "global_step": 449167, "epoch": 2673} {"train_loss": -12.802104949951172, "global_step": 449168, "epoch": 2673} {"train_loss": -13.047446250915527, "global_step": 449169, "epoch": 2673} {"train_loss": -13.068954467773438, "global_step": 449170, "epoch": 2673} {"train_loss": -12.755769729614258, "global_step": 449171, "epoch": 2673} {"train_loss": -12.96591567993164, "global_step": 449172, "epoch": 2673} {"train_loss": -12.90328598022461, "global_step": 449173, "epoch": 2673} {"train_loss": -12.870391845703125, "global_step": 449174, "epoch": 2673} {"train_loss": -12.881927490234375, "global_step": 449175, "epoch": 2673} {"train_loss": -12.861554145812988, "global_step": 449176, "epoch": 2673} {"train_loss": -12.901002883911133, "global_step": 449177, "epoch": 2673} {"train_loss": -13.044267654418945, "global_step": 449178, "epoch": 2673} {"train_loss": -12.918821334838867, "global_step": 449179, "epoch": 2673} {"train_loss": -12.993464469909668, "global_step": 449180, "epoch": 2673} {"train_loss": -12.950721740722656, "global_step": 449181, "epoch": 2673} {"train_loss": -12.820910453796387, "global_step": 449182, "epoch": 2673} {"train_loss": -12.335882186889648, "global_step": 449183, "epoch": 2673} {"train_loss": -12.218746185302734, "global_step": 449184, "epoch": 2673} {"train_loss": -12.059917449951172, "global_step": 449185, "epoch": 2673} {"train_loss": -12.295814514160156, "global_step": 449186, "epoch": 2673} {"train_loss": -12.960249900817871, "global_step": 449187, "epoch": 2673} {"train_loss": -12.733697891235352, "global_step": 449188, "epoch": 2673} {"train_loss": -12.466520309448242, "global_step": 449189, "epoch": 2673} {"train_loss": -12.259133338928223, "global_step": 449190, "epoch": 2673} {"train_loss": -12.852469444274902, "global_step": 449191, "epoch": 2673} {"train_loss": -12.735036849975586, "global_step": 449192, "epoch": 2673} {"train_loss": -12.590967178344727, "global_step": 449193, "epoch": 2673} {"train_loss": -12.507074356079102, "global_step": 449194, "epoch": 2673} {"train_loss": -12.7511568069458, "global_step": 449195, "epoch": 2673} {"train_loss": -12.571001052856445, "global_step": 449196, "epoch": 2673} {"train_loss": -12.597246170043945, "global_step": 449197, "epoch": 2673} {"train_loss": -12.356282234191895, "global_step": 449198, "epoch": 2673} {"train_loss": -12.334861755371094, "global_step": 449199, "epoch": 2673} {"train_loss": -12.652448654174805, "global_step": 449200, "epoch": 2673} {"train_loss": -12.689605712890625, "global_step": 449201, "epoch": 2673} {"train_loss": -12.367090225219727, "global_step": 449202, "epoch": 2673} {"train_loss": -11.868553161621094, "global_step": 449203, "epoch": 2673} {"train_loss": -11.616019248962402, "global_step": 449204, "epoch": 2673} {"train_loss": -12.374703407287598, "global_step": 449205, "epoch": 2673} {"train_loss": -12.40666389465332, "global_step": 449206, "epoch": 2673} {"train_loss": -12.167496681213379, "global_step": 449207, "epoch": 2673} {"train_loss": -11.88161849975586, "global_step": 449208, "epoch": 2673} {"train_loss": -11.552555084228516, "global_step": 449209, "epoch": 2673} {"train_loss": -12.627706527709961, "global_step": 449210, "epoch": 2673} {"train_loss": -11.547041893005371, "global_step": 449211, "epoch": 2673} {"train_loss": -11.334247589111328, "global_step": 449212, "epoch": 2673} {"train_loss": -10.909194946289062, "global_step": 449213, "epoch": 2673} {"train_loss": -12.174899101257324, "global_step": 449214, "epoch": 2673} {"train_loss": -12.369754791259766, "global_step": 449215, "epoch": 2673} {"train_loss": -11.580150604248047, "global_step": 449216, "epoch": 2673} {"train_loss": -12.481204986572266, "global_step": 449217, "epoch": 2673} {"train_loss": -12.210837364196777, "global_step": 449218, "epoch": 2673} {"train_loss": -12.176591873168945, "global_step": 449219, "epoch": 2673} {"train_loss": -12.116268157958984, "global_step": 449220, "epoch": 2673} {"train_loss": -12.258201599121094, "global_step": 449221, "epoch": 2673} {"train_loss": -12.505099296569824, "global_step": 449222, "epoch": 2673} {"train_loss": -12.287707328796387, "global_step": 449223, "epoch": 2673} {"train_loss": -12.35787582397461, "global_step": 449224, "epoch": 2673} {"train_loss": -12.63991641998291, "global_step": 449225, "epoch": 2673} {"train_loss": -12.561027526855469, "global_step": 449226, "epoch": 2673} {"train_loss": -11.639862060546875, "global_step": 449227, "epoch": 2673} {"train_loss": -12.009693145751953, "global_step": 449228, "epoch": 2673} {"train_loss": -12.425403594970703, "global_step": 449229, "epoch": 2673} {"train_loss": -11.785447120666504, "global_step": 449230, "epoch": 2673} {"train_loss": -12.303241843268985, "global_step": 449231, "epoch": 2673, "val_loss": 312639.96875} {"train_loss": -11.938638687133789, "global_step": 449232, "epoch": 2674} {"train_loss": -10.891072273254395, "global_step": 449233, "epoch": 2674} {"train_loss": -11.990517616271973, "global_step": 449234, "epoch": 2674} {"train_loss": -12.154352188110352, "global_step": 449235, "epoch": 2674} {"train_loss": -10.523917198181152, "global_step": 449236, "epoch": 2674} {"train_loss": -11.684164047241211, "global_step": 449237, "epoch": 2674} {"train_loss": -12.458341598510742, "global_step": 449238, "epoch": 2674} {"train_loss": -12.397867202758789, "global_step": 449239, "epoch": 2674} {"train_loss": -12.588613510131836, "global_step": 449240, "epoch": 2674} {"train_loss": -12.590238571166992, "global_step": 449241, "epoch": 2674} {"train_loss": -12.53802490234375, "global_step": 449242, "epoch": 2674} {"train_loss": -12.14122200012207, "global_step": 449243, "epoch": 2674} {"train_loss": -11.90679931640625, "global_step": 449244, "epoch": 2674} {"train_loss": -12.507833480834961, "global_step": 449245, "epoch": 2674} {"train_loss": -11.896358489990234, "global_step": 449246, "epoch": 2674} {"train_loss": -11.980568885803223, "global_step": 449247, "epoch": 2674} {"train_loss": -12.33820915222168, "global_step": 449248, "epoch": 2674} {"train_loss": -11.829961776733398, "global_step": 449249, "epoch": 2674} {"train_loss": -11.105752944946289, "global_step": 449250, "epoch": 2674} {"train_loss": -12.457962036132812, "global_step": 449251, "epoch": 2674} {"train_loss": -12.08146858215332, "global_step": 449252, "epoch": 2674} {"train_loss": -11.626350402832031, "global_step": 449253, "epoch": 2674} {"train_loss": -12.21327018737793, "global_step": 449254, "epoch": 2674} {"train_loss": -12.231595993041992, "global_step": 449255, "epoch": 2674} {"train_loss": -12.11213493347168, "global_step": 449256, "epoch": 2674} {"train_loss": -12.387531280517578, "global_step": 449257, "epoch": 2674} {"train_loss": -12.33747673034668, "global_step": 449258, "epoch": 2674} {"train_loss": -12.357766151428223, "global_step": 449259, "epoch": 2674} {"train_loss": -12.096902847290039, "global_step": 449260, "epoch": 2674} {"train_loss": -12.37800407409668, "global_step": 449261, "epoch": 2674} {"train_loss": -12.31965446472168, "global_step": 449262, "epoch": 2674} {"train_loss": -12.125389099121094, "global_step": 449263, "epoch": 2674} {"train_loss": -12.075359344482422, "global_step": 449264, "epoch": 2674} {"train_loss": -12.241876602172852, "global_step": 449265, "epoch": 2674} {"train_loss": -12.68428897857666, "global_step": 449266, "epoch": 2674} {"train_loss": -12.565877914428711, "global_step": 449267, "epoch": 2674} {"train_loss": -11.994380950927734, "global_step": 449268, "epoch": 2674} {"train_loss": -12.370226860046387, "global_step": 449269, "epoch": 2674} {"train_loss": -12.623044967651367, "global_step": 449270, "epoch": 2674} {"train_loss": -12.286035537719727, "global_step": 449271, "epoch": 2674} {"train_loss": -12.22116470336914, "global_step": 449272, "epoch": 2674} {"train_loss": -12.591885566711426, "global_step": 449273, "epoch": 2674} {"train_loss": -12.230974197387695, "global_step": 449274, "epoch": 2674} {"train_loss": -12.299843788146973, "global_step": 449275, "epoch": 2674} {"train_loss": -12.368908882141113, "global_step": 449276, "epoch": 2674} {"train_loss": -12.317466735839844, "global_step": 449277, "epoch": 2674} {"train_loss": -12.682432174682617, "global_step": 449278, "epoch": 2674} {"train_loss": -12.593236923217773, "global_step": 449279, "epoch": 2674} {"train_loss": -12.229133605957031, "global_step": 449280, "epoch": 2674} {"train_loss": -12.335100173950195, "global_step": 449281, "epoch": 2674} {"train_loss": -12.31804084777832, "global_step": 449282, "epoch": 2674} {"train_loss": -12.116334915161133, "global_step": 449283, "epoch": 2674} {"train_loss": -12.363804817199707, "global_step": 449284, "epoch": 2674} {"train_loss": -12.204753875732422, "global_step": 449285, "epoch": 2674} {"train_loss": -12.126684188842773, "global_step": 449286, "epoch": 2674} {"train_loss": -12.606620788574219, "global_step": 449287, "epoch": 2674} {"train_loss": -11.97468376159668, "global_step": 449288, "epoch": 2674} {"train_loss": -11.950889587402344, "global_step": 449289, "epoch": 2674} {"train_loss": -12.188366889953613, "global_step": 449290, "epoch": 2674} {"train_loss": -12.275174140930176, "global_step": 449291, "epoch": 2674} {"train_loss": -12.223052024841309, "global_step": 449292, "epoch": 2674} {"train_loss": -12.167726516723633, "global_step": 449293, "epoch": 2674} {"train_loss": -11.979836463928223, "global_step": 449294, "epoch": 2674} {"train_loss": -12.507514953613281, "global_step": 449295, "epoch": 2674} {"train_loss": -11.119568824768066, "global_step": 449296, "epoch": 2674} {"train_loss": -12.38998794555664, "global_step": 449297, "epoch": 2674} {"train_loss": -12.128530502319336, "global_step": 449298, "epoch": 2674} {"train_loss": -12.170387268066406, "global_step": 449299, "epoch": 2674} {"train_loss": -12.14202880859375, "global_step": 449300, "epoch": 2674} {"train_loss": -12.357452392578125, "global_step": 449301, "epoch": 2674} {"train_loss": -11.586360931396484, "global_step": 449302, "epoch": 2674} {"train_loss": -12.537912368774414, "global_step": 449303, "epoch": 2674} {"train_loss": -12.46657943725586, "global_step": 449304, "epoch": 2674} {"train_loss": -12.02801513671875, "global_step": 449305, "epoch": 2674} {"train_loss": -12.189762115478516, "global_step": 449306, "epoch": 2674} {"train_loss": -11.872897148132324, "global_step": 449307, "epoch": 2674} {"train_loss": -12.258588790893555, "global_step": 449308, "epoch": 2674} {"train_loss": -12.5144624710083, "global_step": 449309, "epoch": 2674} {"train_loss": -12.452569961547852, "global_step": 449310, "epoch": 2674} {"train_loss": -12.56663703918457, "global_step": 449311, "epoch": 2674} {"train_loss": -12.411687850952148, "global_step": 449312, "epoch": 2674} {"train_loss": -12.689313888549805, "global_step": 449313, "epoch": 2674} {"train_loss": -12.316146850585938, "global_step": 449314, "epoch": 2674} {"train_loss": -12.354772567749023, "global_step": 449315, "epoch": 2674} {"train_loss": -12.032123565673828, "global_step": 449316, "epoch": 2674} {"train_loss": -12.233219146728516, "global_step": 449317, "epoch": 2674} {"train_loss": -12.12767219543457, "global_step": 449318, "epoch": 2674} {"train_loss": -12.22880744934082, "global_step": 449319, "epoch": 2674} {"train_loss": -11.938004493713379, "global_step": 449320, "epoch": 2674} {"train_loss": -12.608552932739258, "global_step": 449321, "epoch": 2674} {"train_loss": -11.537187576293945, "global_step": 449322, "epoch": 2674} {"train_loss": -10.768239974975586, "global_step": 449323, "epoch": 2674} {"train_loss": -11.792978286743164, "global_step": 449324, "epoch": 2674} {"train_loss": -11.63221549987793, "global_step": 449325, "epoch": 2674} {"train_loss": -12.336187362670898, "global_step": 449326, "epoch": 2674} {"train_loss": -12.044210433959961, "global_step": 449327, "epoch": 2674} {"train_loss": -11.62405014038086, "global_step": 449328, "epoch": 2674} {"train_loss": -12.441551208496094, "global_step": 449329, "epoch": 2674} {"train_loss": -11.305837631225586, "global_step": 449330, "epoch": 2674} {"train_loss": -12.542003631591797, "global_step": 449331, "epoch": 2674} {"train_loss": -11.749025344848633, "global_step": 449332, "epoch": 2674} {"train_loss": -11.488138198852539, "global_step": 449333, "epoch": 2674} {"train_loss": -11.781109809875488, "global_step": 449334, "epoch": 2674} {"train_loss": -11.551170349121094, "global_step": 449335, "epoch": 2674} {"train_loss": -11.993987083435059, "global_step": 449336, "epoch": 2674} {"train_loss": -12.220148086547852, "global_step": 449337, "epoch": 2674} {"train_loss": -11.530948638916016, "global_step": 449338, "epoch": 2674} {"train_loss": -12.279857635498047, "global_step": 449339, "epoch": 2674} {"train_loss": -11.527687072753906, "global_step": 449340, "epoch": 2674} {"train_loss": -11.755706787109375, "global_step": 449341, "epoch": 2674} {"train_loss": -12.329648971557617, "global_step": 449342, "epoch": 2674} {"train_loss": -12.226251602172852, "global_step": 449343, "epoch": 2674} {"train_loss": -11.838743209838867, "global_step": 449344, "epoch": 2674} {"train_loss": -12.417539596557617, "global_step": 449345, "epoch": 2674} {"train_loss": -11.769073486328125, "global_step": 449346, "epoch": 2674} {"train_loss": -12.444913864135742, "global_step": 449347, "epoch": 2674} {"train_loss": -11.808797836303711, "global_step": 449348, "epoch": 2674} {"train_loss": -12.389701843261719, "global_step": 449349, "epoch": 2674} {"train_loss": -12.051530838012695, "global_step": 449350, "epoch": 2674} {"train_loss": -12.576177597045898, "global_step": 449351, "epoch": 2674} {"train_loss": -12.375391006469727, "global_step": 449352, "epoch": 2674} {"train_loss": -12.219766616821289, "global_step": 449353, "epoch": 2674} {"train_loss": -12.121113777160645, "global_step": 449354, "epoch": 2674} {"train_loss": -12.512028694152832, "global_step": 449355, "epoch": 2674} {"train_loss": -12.356097221374512, "global_step": 449356, "epoch": 2674} {"train_loss": -12.435725212097168, "global_step": 449357, "epoch": 2674} {"train_loss": -12.599806785583496, "global_step": 449358, "epoch": 2674} {"train_loss": -12.008071899414062, "global_step": 449359, "epoch": 2674} {"train_loss": -12.69442367553711, "global_step": 449360, "epoch": 2674} {"train_loss": -12.466410636901855, "global_step": 449361, "epoch": 2674} {"train_loss": -12.432611465454102, "global_step": 449362, "epoch": 2674} {"train_loss": -12.38068675994873, "global_step": 449363, "epoch": 2674} {"train_loss": -11.838232040405273, "global_step": 449364, "epoch": 2674} {"train_loss": -12.085103988647461, "global_step": 449365, "epoch": 2674} {"train_loss": -12.228582382202148, "global_step": 449366, "epoch": 2674} {"train_loss": -12.095585823059082, "global_step": 449367, "epoch": 2674} {"train_loss": -12.345747947692871, "global_step": 449368, "epoch": 2674} {"train_loss": -12.380918502807617, "global_step": 449369, "epoch": 2674} {"train_loss": -12.181032180786133, "global_step": 449370, "epoch": 2674} {"train_loss": -11.852373123168945, "global_step": 449371, "epoch": 2674} {"train_loss": -12.46088981628418, "global_step": 449372, "epoch": 2674} {"train_loss": -11.902231216430664, "global_step": 449373, "epoch": 2674} {"train_loss": -12.547025680541992, "global_step": 449374, "epoch": 2674} {"train_loss": -12.605997085571289, "global_step": 449375, "epoch": 2674} {"train_loss": -12.097291946411133, "global_step": 449376, "epoch": 2674} {"train_loss": -12.553120613098145, "global_step": 449377, "epoch": 2674} {"train_loss": -11.830184936523438, "global_step": 449378, "epoch": 2674} {"train_loss": -12.527027130126953, "global_step": 449379, "epoch": 2674} {"train_loss": -12.01664924621582, "global_step": 449380, "epoch": 2674} {"train_loss": -11.601816177368164, "global_step": 449381, "epoch": 2674} {"train_loss": -12.11532211303711, "global_step": 449382, "epoch": 2674} {"train_loss": -11.71197509765625, "global_step": 449383, "epoch": 2674} {"train_loss": -11.922769546508789, "global_step": 449384, "epoch": 2674} {"train_loss": -11.990927696228027, "global_step": 449385, "epoch": 2674} {"train_loss": -11.423667907714844, "global_step": 449386, "epoch": 2674} {"train_loss": -12.307978630065918, "global_step": 449387, "epoch": 2674} {"train_loss": -12.289642333984375, "global_step": 449388, "epoch": 2674} {"train_loss": -12.488186836242676, "global_step": 449389, "epoch": 2674} {"train_loss": -12.211481094360352, "global_step": 449390, "epoch": 2674} {"train_loss": -12.257402420043945, "global_step": 449391, "epoch": 2674} {"train_loss": -12.25466251373291, "global_step": 449392, "epoch": 2674} {"train_loss": -12.5247802734375, "global_step": 449393, "epoch": 2674} {"train_loss": -11.792312622070312, "global_step": 449394, "epoch": 2674} {"train_loss": -12.134922981262207, "global_step": 449395, "epoch": 2674} {"train_loss": -12.613605499267578, "global_step": 449396, "epoch": 2674} {"train_loss": -11.763723373413086, "global_step": 449397, "epoch": 2674} {"train_loss": -12.668006896972656, "global_step": 449398, "epoch": 2674} {"train_loss": -12.154336021060036, "global_step": 449399, "epoch": 2674, "val_loss": 315743.5} {"train_loss": -12.822490692138672, "global_step": 449400, "epoch": 2675} {"train_loss": -12.050186157226562, "global_step": 449401, "epoch": 2675} {"train_loss": -11.887897491455078, "global_step": 449402, "epoch": 2675} {"train_loss": -12.417509078979492, "global_step": 449403, "epoch": 2675} {"train_loss": -11.839945793151855, "global_step": 449404, "epoch": 2675} {"train_loss": -12.13261604309082, "global_step": 449405, "epoch": 2675} {"train_loss": -12.252866744995117, "global_step": 449406, "epoch": 2675} {"train_loss": -10.855634689331055, "global_step": 449407, "epoch": 2675} {"train_loss": -11.405517578125, "global_step": 449408, "epoch": 2675} {"train_loss": -10.856913566589355, "global_step": 449409, "epoch": 2675} {"train_loss": -10.332903861999512, "global_step": 449410, "epoch": 2675} {"train_loss": -9.907264709472656, "global_step": 449411, "epoch": 2675} {"train_loss": -11.116004943847656, "global_step": 449412, "epoch": 2675} {"train_loss": -10.831310272216797, "global_step": 449413, "epoch": 2675} {"train_loss": -11.846451759338379, "global_step": 449414, "epoch": 2675} {"train_loss": -10.302831649780273, "global_step": 449415, "epoch": 2675} {"train_loss": -11.666433334350586, "global_step": 449416, "epoch": 2675} {"train_loss": -10.709239959716797, "global_step": 449417, "epoch": 2675} {"train_loss": -11.239782333374023, "global_step": 449418, "epoch": 2675} {"train_loss": -10.690559387207031, "global_step": 449419, "epoch": 2675} {"train_loss": -10.234310150146484, "global_step": 449420, "epoch": 2675} {"train_loss": -12.054119110107422, "global_step": 449421, "epoch": 2675} {"train_loss": -10.939698219299316, "global_step": 449422, "epoch": 2675} {"train_loss": -10.185718536376953, "global_step": 449423, "epoch": 2675} {"train_loss": -10.751670837402344, "global_step": 449424, "epoch": 2675} {"train_loss": -11.7645263671875, "global_step": 449425, "epoch": 2675} {"train_loss": -10.939547538757324, "global_step": 449426, "epoch": 2675} {"train_loss": -11.315351486206055, "global_step": 449427, "epoch": 2675} {"train_loss": -11.833789825439453, "global_step": 449428, "epoch": 2675} {"train_loss": -10.652053833007812, "global_step": 449429, "epoch": 2675} {"train_loss": -11.007201194763184, "global_step": 449430, "epoch": 2675} {"train_loss": -11.748941421508789, "global_step": 449431, "epoch": 2675} {"train_loss": -11.66114330291748, "global_step": 449432, "epoch": 2675} {"train_loss": -11.351354598999023, "global_step": 449433, "epoch": 2675} {"train_loss": -11.443795204162598, "global_step": 449434, "epoch": 2675} {"train_loss": -11.40010929107666, "global_step": 449435, "epoch": 2675} {"train_loss": -11.350384712219238, "global_step": 449436, "epoch": 2675} {"train_loss": -12.21621322631836, "global_step": 449437, "epoch": 2675} {"train_loss": -11.038810729980469, "global_step": 449438, "epoch": 2675} {"train_loss": -11.596358299255371, "global_step": 449439, "epoch": 2675} {"train_loss": -12.094711303710938, "global_step": 449440, "epoch": 2675} {"train_loss": -11.659309387207031, "global_step": 449441, "epoch": 2675} {"train_loss": -12.00762939453125, "global_step": 449442, "epoch": 2675} {"train_loss": -11.900447845458984, "global_step": 449443, "epoch": 2675} {"train_loss": -11.449079513549805, "global_step": 449444, "epoch": 2675} {"train_loss": -11.453197479248047, "global_step": 449445, "epoch": 2675} {"train_loss": -11.795684814453125, "global_step": 449446, "epoch": 2675} {"train_loss": -12.064470291137695, "global_step": 449447, "epoch": 2675} {"train_loss": -11.912569046020508, "global_step": 449448, "epoch": 2675} {"train_loss": -12.081647872924805, "global_step": 449449, "epoch": 2675} {"train_loss": -12.099675178527832, "global_step": 449450, "epoch": 2675} {"train_loss": -11.739681243896484, "global_step": 449451, "epoch": 2675} {"train_loss": -12.369630813598633, "global_step": 449452, "epoch": 2675} {"train_loss": -11.615640640258789, "global_step": 449453, "epoch": 2675} {"train_loss": -12.56535816192627, "global_step": 449454, "epoch": 2675} {"train_loss": -12.275323867797852, "global_step": 449455, "epoch": 2675} {"train_loss": -12.30119514465332, "global_step": 449456, "epoch": 2675} {"train_loss": -12.318306922912598, "global_step": 449457, "epoch": 2675} {"train_loss": -12.537347793579102, "global_step": 449458, "epoch": 2675} {"train_loss": -12.370281219482422, "global_step": 449459, "epoch": 2675} {"train_loss": -12.521236419677734, "global_step": 449460, "epoch": 2675} {"train_loss": -12.51270866394043, "global_step": 449461, "epoch": 2675} {"train_loss": -12.658327102661133, "global_step": 449462, "epoch": 2675} {"train_loss": -12.49298095703125, "global_step": 449463, "epoch": 2675} {"train_loss": -12.555013656616211, "global_step": 449464, "epoch": 2675} {"train_loss": -12.331130981445312, "global_step": 449465, "epoch": 2675} {"train_loss": -12.376971244812012, "global_step": 449466, "epoch": 2675} {"train_loss": -12.571105003356934, "global_step": 449467, "epoch": 2675} {"train_loss": -12.68182373046875, "global_step": 449468, "epoch": 2675} {"train_loss": -12.602426528930664, "global_step": 449469, "epoch": 2675} {"train_loss": -12.771133422851562, "global_step": 449470, "epoch": 2675} {"train_loss": -12.473308563232422, "global_step": 449471, "epoch": 2675} {"train_loss": -12.34846019744873, "global_step": 449472, "epoch": 2675} {"train_loss": -12.599920272827148, "global_step": 449473, "epoch": 2675} {"train_loss": -12.447159767150879, "global_step": 449474, "epoch": 2675} {"train_loss": -12.73508071899414, "global_step": 449475, "epoch": 2675} {"train_loss": -12.653773307800293, "global_step": 449476, "epoch": 2675} {"train_loss": -12.756231307983398, "global_step": 449477, "epoch": 2675} {"train_loss": -12.756616592407227, "global_step": 449478, "epoch": 2675} {"train_loss": -12.335172653198242, "global_step": 449479, "epoch": 2675} {"train_loss": -12.53195571899414, "global_step": 449480, "epoch": 2675} {"train_loss": -12.644845962524414, "global_step": 449481, "epoch": 2675} {"train_loss": -12.575769424438477, "global_step": 449482, "epoch": 2675} {"train_loss": -12.731335639953613, "global_step": 449483, "epoch": 2675} {"train_loss": -12.768555641174316, "global_step": 449484, "epoch": 2675} {"train_loss": -12.69791030883789, "global_step": 449485, "epoch": 2675} {"train_loss": -12.947402000427246, "global_step": 449486, "epoch": 2675} {"train_loss": -12.78121566772461, "global_step": 449487, "epoch": 2675} {"train_loss": -12.678468704223633, "global_step": 449488, "epoch": 2675} {"train_loss": -12.809779167175293, "global_step": 449489, "epoch": 2675} {"train_loss": -12.79627513885498, "global_step": 449490, "epoch": 2675} {"train_loss": -12.669870376586914, "global_step": 449491, "epoch": 2675} {"train_loss": -12.662052154541016, "global_step": 449492, "epoch": 2675} {"train_loss": -12.564496994018555, "global_step": 449493, "epoch": 2675} {"train_loss": -12.637298583984375, "global_step": 449494, "epoch": 2675} {"train_loss": -12.61492919921875, "global_step": 449495, "epoch": 2675} {"train_loss": -12.707914352416992, "global_step": 449496, "epoch": 2675} {"train_loss": -12.578088760375977, "global_step": 449497, "epoch": 2675} {"train_loss": -12.703775405883789, "global_step": 449498, "epoch": 2675} {"train_loss": -12.475564956665039, "global_step": 449499, "epoch": 2675} {"train_loss": -12.412557601928711, "global_step": 449500, "epoch": 2675} {"train_loss": -12.724648475646973, "global_step": 449501, "epoch": 2675} {"train_loss": -12.675945281982422, "global_step": 449502, "epoch": 2675} {"train_loss": -11.90262508392334, "global_step": 449503, "epoch": 2675} {"train_loss": -12.686151504516602, "global_step": 449504, "epoch": 2675} {"train_loss": -12.476594924926758, "global_step": 449505, "epoch": 2675} {"train_loss": -12.61459732055664, "global_step": 449506, "epoch": 2675} {"train_loss": -12.460878372192383, "global_step": 449507, "epoch": 2675} {"train_loss": -12.693159103393555, "global_step": 449508, "epoch": 2675} {"train_loss": -12.84774398803711, "global_step": 449509, "epoch": 2675} {"train_loss": -12.819294929504395, "global_step": 449510, "epoch": 2675} {"train_loss": -12.838982582092285, "global_step": 449511, "epoch": 2675} {"train_loss": -12.59211254119873, "global_step": 449512, "epoch": 2675} {"train_loss": -12.723945617675781, "global_step": 449513, "epoch": 2675} {"train_loss": -12.514961242675781, "global_step": 449514, "epoch": 2675} {"train_loss": -12.28532600402832, "global_step": 449515, "epoch": 2675} {"train_loss": -11.983043670654297, "global_step": 449516, "epoch": 2675} {"train_loss": -12.100750923156738, "global_step": 449517, "epoch": 2675} {"train_loss": -12.765178680419922, "global_step": 449518, "epoch": 2675} {"train_loss": -11.406658172607422, "global_step": 449519, "epoch": 2675} {"train_loss": -11.453201293945312, "global_step": 449520, "epoch": 2675} {"train_loss": -12.125558853149414, "global_step": 449521, "epoch": 2675} {"train_loss": -12.72806453704834, "global_step": 449522, "epoch": 2675} {"train_loss": -12.503154754638672, "global_step": 449523, "epoch": 2675} {"train_loss": -12.519340515136719, "global_step": 449524, "epoch": 2675} {"train_loss": -12.615190505981445, "global_step": 449525, "epoch": 2675} {"train_loss": -12.63394832611084, "global_step": 449526, "epoch": 2675} {"train_loss": -12.710111618041992, "global_step": 449527, "epoch": 2675} {"train_loss": -12.356724739074707, "global_step": 449528, "epoch": 2675} {"train_loss": -12.315729141235352, "global_step": 449529, "epoch": 2675} {"train_loss": -11.852033615112305, "global_step": 449530, "epoch": 2675} {"train_loss": -12.844470977783203, "global_step": 449531, "epoch": 2675} {"train_loss": -12.33352279663086, "global_step": 449532, "epoch": 2675} {"train_loss": -12.568480491638184, "global_step": 449533, "epoch": 2675} {"train_loss": -12.057785987854004, "global_step": 449534, "epoch": 2675} {"train_loss": -12.704605102539062, "global_step": 449535, "epoch": 2675} {"train_loss": -12.084993362426758, "global_step": 449536, "epoch": 2675} {"train_loss": -11.55955696105957, "global_step": 449537, "epoch": 2675} {"train_loss": -11.571746826171875, "global_step": 449538, "epoch": 2675} {"train_loss": -11.556326866149902, "global_step": 449539, "epoch": 2675} {"train_loss": -10.650907516479492, "global_step": 449540, "epoch": 2675} {"train_loss": -12.32281494140625, "global_step": 449541, "epoch": 2675} {"train_loss": -10.117391586303711, "global_step": 449542, "epoch": 2675} {"train_loss": -10.41439151763916, "global_step": 449543, "epoch": 2675} {"train_loss": -9.465805053710938, "global_step": 449544, "epoch": 2675} {"train_loss": -10.578153610229492, "global_step": 449545, "epoch": 2675} {"train_loss": -10.273707389831543, "global_step": 449546, "epoch": 2675} {"train_loss": -11.135893821716309, "global_step": 449547, "epoch": 2675} {"train_loss": -10.281244277954102, "global_step": 449548, "epoch": 2675} {"train_loss": -11.323997497558594, "global_step": 449549, "epoch": 2675} {"train_loss": -11.836813926696777, "global_step": 449550, "epoch": 2675} {"train_loss": -11.093149185180664, "global_step": 449551, "epoch": 2675} {"train_loss": -11.670021057128906, "global_step": 449552, "epoch": 2675} {"train_loss": -11.713141441345215, "global_step": 449553, "epoch": 2675} {"train_loss": -11.175971984863281, "global_step": 449554, "epoch": 2675} {"train_loss": -11.454919815063477, "global_step": 449555, "epoch": 2675} {"train_loss": -11.59908390045166, "global_step": 449556, "epoch": 2675} {"train_loss": -12.042769432067871, "global_step": 449557, "epoch": 2675} {"train_loss": -12.045337677001953, "global_step": 449558, "epoch": 2675} {"train_loss": -12.196535110473633, "global_step": 449559, "epoch": 2675} {"train_loss": -12.631492614746094, "global_step": 449560, "epoch": 2675} {"train_loss": -12.356239318847656, "global_step": 449561, "epoch": 2675} {"train_loss": -12.296082496643066, "global_step": 449562, "epoch": 2675} {"train_loss": -12.54731559753418, "global_step": 449563, "epoch": 2675} {"train_loss": -12.515119552612305, "global_step": 449564, "epoch": 2675} {"train_loss": -12.199451446533203, "global_step": 449565, "epoch": 2675} {"train_loss": -12.041276931762695, "global_step": 449566, "epoch": 2675} {"train_loss": -11.993841579982213, "global_step": 449567, "epoch": 2675, "val_loss": 312595.625, "train_action_mse_error": 0.9199537038803101} {"train_loss": -12.145305633544922, "global_step": 449568, "epoch": 2676} {"train_loss": -11.715994834899902, "global_step": 449569, "epoch": 2676} {"train_loss": -12.33319091796875, "global_step": 449570, "epoch": 2676} {"train_loss": -11.53437614440918, "global_step": 449571, "epoch": 2676} {"train_loss": -12.55948257446289, "global_step": 449572, "epoch": 2676} {"train_loss": -11.701404571533203, "global_step": 449573, "epoch": 2676} {"train_loss": -11.700784683227539, "global_step": 449574, "epoch": 2676} {"train_loss": -12.414743423461914, "global_step": 449575, "epoch": 2676} {"train_loss": -11.446989059448242, "global_step": 449576, "epoch": 2676} {"train_loss": -11.947722434997559, "global_step": 449577, "epoch": 2676} {"train_loss": -12.136295318603516, "global_step": 449578, "epoch": 2676} {"train_loss": -11.940498352050781, "global_step": 449579, "epoch": 2676} {"train_loss": -11.547262191772461, "global_step": 449580, "epoch": 2676} {"train_loss": -12.010200500488281, "global_step": 449581, "epoch": 2676} {"train_loss": -12.189338684082031, "global_step": 449582, "epoch": 2676} {"train_loss": -12.03299617767334, "global_step": 449583, "epoch": 2676} {"train_loss": -11.95941162109375, "global_step": 449584, "epoch": 2676} {"train_loss": -12.156278610229492, "global_step": 449585, "epoch": 2676} {"train_loss": -12.082392692565918, "global_step": 449586, "epoch": 2676} {"train_loss": -12.562370300292969, "global_step": 449587, "epoch": 2676} {"train_loss": -12.215755462646484, "global_step": 449588, "epoch": 2676} {"train_loss": -12.375670433044434, "global_step": 449589, "epoch": 2676} {"train_loss": -12.415746688842773, "global_step": 449590, "epoch": 2676} {"train_loss": -12.08635139465332, "global_step": 449591, "epoch": 2676} {"train_loss": -12.602729797363281, "global_step": 449592, "epoch": 2676} {"train_loss": -12.372248649597168, "global_step": 449593, "epoch": 2676} {"train_loss": -12.785846710205078, "global_step": 449594, "epoch": 2676} {"train_loss": -12.616888046264648, "global_step": 449595, "epoch": 2676} {"train_loss": -12.656461715698242, "global_step": 449596, "epoch": 2676} {"train_loss": -12.683561325073242, "global_step": 449597, "epoch": 2676} {"train_loss": -12.264723777770996, "global_step": 449598, "epoch": 2676} {"train_loss": -12.69151496887207, "global_step": 449599, "epoch": 2676} {"train_loss": -12.228904724121094, "global_step": 449600, "epoch": 2676} {"train_loss": -12.309059143066406, "global_step": 449601, "epoch": 2676} {"train_loss": -12.408245086669922, "global_step": 449602, "epoch": 2676} {"train_loss": -12.255538940429688, "global_step": 449603, "epoch": 2676} {"train_loss": -12.682355880737305, "global_step": 449604, "epoch": 2676} {"train_loss": -12.238725662231445, "global_step": 449605, "epoch": 2676} {"train_loss": -12.721925735473633, "global_step": 449606, "epoch": 2676} {"train_loss": -12.442461013793945, "global_step": 449607, "epoch": 2676} {"train_loss": -12.77630615234375, "global_step": 449608, "epoch": 2676} {"train_loss": -12.548786163330078, "global_step": 449609, "epoch": 2676} {"train_loss": -12.668977737426758, "global_step": 449610, "epoch": 2676} {"train_loss": -12.572465896606445, "global_step": 449611, "epoch": 2676} {"train_loss": -12.306612014770508, "global_step": 449612, "epoch": 2676} {"train_loss": -12.462215423583984, "global_step": 449613, "epoch": 2676} {"train_loss": -11.977224349975586, "global_step": 449614, "epoch": 2676} {"train_loss": -12.601298332214355, "global_step": 449615, "epoch": 2676} {"train_loss": -12.493682861328125, "global_step": 449616, "epoch": 2676} {"train_loss": -12.316558837890625, "global_step": 449617, "epoch": 2676} {"train_loss": -12.458795547485352, "global_step": 449618, "epoch": 2676} {"train_loss": -12.097671508789062, "global_step": 449619, "epoch": 2676} {"train_loss": -12.32375717163086, "global_step": 449620, "epoch": 2676} {"train_loss": -12.380937576293945, "global_step": 449621, "epoch": 2676} {"train_loss": -12.523258209228516, "global_step": 449622, "epoch": 2676} {"train_loss": -12.36476993560791, "global_step": 449623, "epoch": 2676} {"train_loss": -11.840578079223633, "global_step": 449624, "epoch": 2676} {"train_loss": -12.213421821594238, "global_step": 449625, "epoch": 2676} {"train_loss": -12.749056816101074, "global_step": 449626, "epoch": 2676} {"train_loss": -11.33407974243164, "global_step": 449627, "epoch": 2676} {"train_loss": -11.986600875854492, "global_step": 449628, "epoch": 2676} {"train_loss": -12.427433013916016, "global_step": 449629, "epoch": 2676} {"train_loss": -11.981712341308594, "global_step": 449630, "epoch": 2676} {"train_loss": -12.08863639831543, "global_step": 449631, "epoch": 2676} {"train_loss": -12.619625091552734, "global_step": 449632, "epoch": 2676} {"train_loss": -12.323770523071289, "global_step": 449633, "epoch": 2676} {"train_loss": -12.298778533935547, "global_step": 449634, "epoch": 2676} {"train_loss": -12.417512893676758, "global_step": 449635, "epoch": 2676} {"train_loss": -12.104391098022461, "global_step": 449636, "epoch": 2676} {"train_loss": -12.198545455932617, "global_step": 449637, "epoch": 2676} {"train_loss": -12.370330810546875, "global_step": 449638, "epoch": 2676} {"train_loss": -12.428406715393066, "global_step": 449639, "epoch": 2676} {"train_loss": -12.036493301391602, "global_step": 449640, "epoch": 2676} {"train_loss": -12.486522674560547, "global_step": 449641, "epoch": 2676} {"train_loss": -12.333870887756348, "global_step": 449642, "epoch": 2676} {"train_loss": -12.210007667541504, "global_step": 449643, "epoch": 2676} {"train_loss": -12.2653169631958, "global_step": 449644, "epoch": 2676} {"train_loss": -12.54309368133545, "global_step": 449645, "epoch": 2676} {"train_loss": -12.445436477661133, "global_step": 449646, "epoch": 2676} {"train_loss": -12.759419441223145, "global_step": 449647, "epoch": 2676} {"train_loss": -12.468671798706055, "global_step": 449648, "epoch": 2676} {"train_loss": -11.996480941772461, "global_step": 449649, "epoch": 2676} {"train_loss": -12.905656814575195, "global_step": 449650, "epoch": 2676} {"train_loss": -12.757811546325684, "global_step": 449651, "epoch": 2676} {"train_loss": -12.239665985107422, "global_step": 449652, "epoch": 2676} {"train_loss": -12.769355773925781, "global_step": 449653, "epoch": 2676} {"train_loss": -12.619634628295898, "global_step": 449654, "epoch": 2676} {"train_loss": -12.508987426757812, "global_step": 449655, "epoch": 2676} {"train_loss": -12.709489822387695, "global_step": 449656, "epoch": 2676} {"train_loss": -12.668601989746094, "global_step": 449657, "epoch": 2676} {"train_loss": -12.376394271850586, "global_step": 449658, "epoch": 2676} {"train_loss": -12.600631713867188, "global_step": 449659, "epoch": 2676} {"train_loss": -12.596149444580078, "global_step": 449660, "epoch": 2676} {"train_loss": -12.351845741271973, "global_step": 449661, "epoch": 2676} {"train_loss": -12.179950714111328, "global_step": 449662, "epoch": 2676} {"train_loss": -12.857858657836914, "global_step": 449663, "epoch": 2676} {"train_loss": -12.417243957519531, "global_step": 449664, "epoch": 2676} {"train_loss": -12.787883758544922, "global_step": 449665, "epoch": 2676} {"train_loss": -12.680387496948242, "global_step": 449666, "epoch": 2676} {"train_loss": -12.74889087677002, "global_step": 449667, "epoch": 2676} {"train_loss": -12.339712142944336, "global_step": 449668, "epoch": 2676} {"train_loss": -12.423944473266602, "global_step": 449669, "epoch": 2676} {"train_loss": -12.718305587768555, "global_step": 449670, "epoch": 2676} {"train_loss": -12.20943832397461, "global_step": 449671, "epoch": 2676} {"train_loss": -12.473345756530762, "global_step": 449672, "epoch": 2676} {"train_loss": -12.4767484664917, "global_step": 449673, "epoch": 2676} {"train_loss": -12.484075546264648, "global_step": 449674, "epoch": 2676} {"train_loss": -12.664407730102539, "global_step": 449675, "epoch": 2676} {"train_loss": -12.885566711425781, "global_step": 449676, "epoch": 2676} {"train_loss": -12.557193756103516, "global_step": 449677, "epoch": 2676} {"train_loss": -12.32956314086914, "global_step": 449678, "epoch": 2676} {"train_loss": -13.04317855834961, "global_step": 449679, "epoch": 2676} {"train_loss": -12.549111366271973, "global_step": 449680, "epoch": 2676} {"train_loss": -12.666584014892578, "global_step": 449681, "epoch": 2676} {"train_loss": -12.866896629333496, "global_step": 449682, "epoch": 2676} {"train_loss": -12.935243606567383, "global_step": 449683, "epoch": 2676} {"train_loss": -12.822436332702637, "global_step": 449684, "epoch": 2676} {"train_loss": -12.857345581054688, "global_step": 449685, "epoch": 2676} {"train_loss": -12.766281127929688, "global_step": 449686, "epoch": 2676} {"train_loss": -12.818891525268555, "global_step": 449687, "epoch": 2676} {"train_loss": -12.790976524353027, "global_step": 449688, "epoch": 2676} {"train_loss": -12.480514526367188, "global_step": 449689, "epoch": 2676} {"train_loss": -12.764856338500977, "global_step": 449690, "epoch": 2676} {"train_loss": -12.650371551513672, "global_step": 449691, "epoch": 2676} {"train_loss": -12.646146774291992, "global_step": 449692, "epoch": 2676} {"train_loss": -12.548181533813477, "global_step": 449693, "epoch": 2676} {"train_loss": -12.616266250610352, "global_step": 449694, "epoch": 2676} {"train_loss": -12.555234909057617, "global_step": 449695, "epoch": 2676} {"train_loss": -12.808832168579102, "global_step": 449696, "epoch": 2676} {"train_loss": -12.370292663574219, "global_step": 449697, "epoch": 2676} {"train_loss": -12.767553329467773, "global_step": 449698, "epoch": 2676} {"train_loss": -12.273740768432617, "global_step": 449699, "epoch": 2676} {"train_loss": -11.862508773803711, "global_step": 449700, "epoch": 2676} {"train_loss": -12.131895065307617, "global_step": 449701, "epoch": 2676} {"train_loss": -11.920661926269531, "global_step": 449702, "epoch": 2676} {"train_loss": -11.975113868713379, "global_step": 449703, "epoch": 2676} {"train_loss": -12.429637908935547, "global_step": 449704, "epoch": 2676} {"train_loss": -11.757153511047363, "global_step": 449705, "epoch": 2676} {"train_loss": -12.39254379272461, "global_step": 449706, "epoch": 2676} {"train_loss": -12.671643257141113, "global_step": 449707, "epoch": 2676} {"train_loss": -12.164518356323242, "global_step": 449708, "epoch": 2676} {"train_loss": -12.758134841918945, "global_step": 449709, "epoch": 2676} {"train_loss": -12.238595962524414, "global_step": 449710, "epoch": 2676} {"train_loss": -12.757282257080078, "global_step": 449711, "epoch": 2676} {"train_loss": -12.302722930908203, "global_step": 449712, "epoch": 2676} {"train_loss": -12.503141403198242, "global_step": 449713, "epoch": 2676} {"train_loss": -12.364025115966797, "global_step": 449714, "epoch": 2676} {"train_loss": -12.729694366455078, "global_step": 449715, "epoch": 2676} {"train_loss": -12.271974563598633, "global_step": 449716, "epoch": 2676} {"train_loss": -12.672262191772461, "global_step": 449717, "epoch": 2676} {"train_loss": -12.525131225585938, "global_step": 449718, "epoch": 2676} {"train_loss": -12.493511199951172, "global_step": 449719, "epoch": 2676} {"train_loss": -12.43101692199707, "global_step": 449720, "epoch": 2676} {"train_loss": -11.924055099487305, "global_step": 449721, "epoch": 2676} {"train_loss": -12.472610473632812, "global_step": 449722, "epoch": 2676} {"train_loss": -13.001425743103027, "global_step": 449723, "epoch": 2676} {"train_loss": -12.412466049194336, "global_step": 449724, "epoch": 2676} {"train_loss": -12.383646011352539, "global_step": 449725, "epoch": 2676} {"train_loss": -12.59473705291748, "global_step": 449726, "epoch": 2676} {"train_loss": -12.134856224060059, "global_step": 449727, "epoch": 2676} {"train_loss": -10.986905097961426, "global_step": 449728, "epoch": 2676} {"train_loss": -12.467214584350586, "global_step": 449729, "epoch": 2676} {"train_loss": -10.974481582641602, "global_step": 449730, "epoch": 2676} {"train_loss": -11.091287612915039, "global_step": 449731, "epoch": 2676} {"train_loss": -11.679805755615234, "global_step": 449732, "epoch": 2676} {"train_loss": -9.8056640625, "global_step": 449733, "epoch": 2676} {"train_loss": -11.548517227172852, "global_step": 449734, "epoch": 2676} {"train_loss": -12.348152410416375, "global_step": 449735, "epoch": 2676, "val_loss": 316476.875} {"train_loss": -10.740675926208496, "global_step": 449736, "epoch": 2677} {"train_loss": -12.492658615112305, "global_step": 449737, "epoch": 2677} {"train_loss": -10.691336631774902, "global_step": 449738, "epoch": 2677} {"train_loss": -11.556042671203613, "global_step": 449739, "epoch": 2677} {"train_loss": -11.484024047851562, "global_step": 449740, "epoch": 2677} {"train_loss": -11.073413848876953, "global_step": 449741, "epoch": 2677} {"train_loss": -11.678023338317871, "global_step": 449742, "epoch": 2677} {"train_loss": -11.567586898803711, "global_step": 449743, "epoch": 2677} {"train_loss": -10.440308570861816, "global_step": 449744, "epoch": 2677} {"train_loss": -11.801292419433594, "global_step": 449745, "epoch": 2677} {"train_loss": -11.088701248168945, "global_step": 449746, "epoch": 2677} {"train_loss": -10.580055236816406, "global_step": 449747, "epoch": 2677} {"train_loss": -12.054584503173828, "global_step": 449748, "epoch": 2677} {"train_loss": -11.440189361572266, "global_step": 449749, "epoch": 2677} {"train_loss": -11.543272018432617, "global_step": 449750, "epoch": 2677} {"train_loss": -12.314441680908203, "global_step": 449751, "epoch": 2677} {"train_loss": -10.695455551147461, "global_step": 449752, "epoch": 2677} {"train_loss": -12.166763305664062, "global_step": 449753, "epoch": 2677} {"train_loss": -11.484365463256836, "global_step": 449754, "epoch": 2677} {"train_loss": -12.011675834655762, "global_step": 449755, "epoch": 2677} {"train_loss": -11.815996170043945, "global_step": 449756, "epoch": 2677} {"train_loss": -11.90658950805664, "global_step": 449757, "epoch": 2677} {"train_loss": -12.148759841918945, "global_step": 449758, "epoch": 2677} {"train_loss": -12.138618469238281, "global_step": 449759, "epoch": 2677} {"train_loss": -12.14202880859375, "global_step": 449760, "epoch": 2677} {"train_loss": -12.419053077697754, "global_step": 449761, "epoch": 2677} {"train_loss": -12.130760192871094, "global_step": 449762, "epoch": 2677} {"train_loss": -12.0065279006958, "global_step": 449763, "epoch": 2677} {"train_loss": -11.976106643676758, "global_step": 449764, "epoch": 2677} {"train_loss": -12.302309036254883, "global_step": 449765, "epoch": 2677} {"train_loss": -11.880038261413574, "global_step": 449766, "epoch": 2677} {"train_loss": -11.901437759399414, "global_step": 449767, "epoch": 2677} {"train_loss": -12.344144821166992, "global_step": 449768, "epoch": 2677} {"train_loss": -12.146907806396484, "global_step": 449769, "epoch": 2677} {"train_loss": -12.311824798583984, "global_step": 449770, "epoch": 2677} {"train_loss": -11.75395393371582, "global_step": 449771, "epoch": 2677} {"train_loss": -12.161712646484375, "global_step": 449772, "epoch": 2677} {"train_loss": -12.307413101196289, "global_step": 449773, "epoch": 2677} {"train_loss": -12.213617324829102, "global_step": 449774, "epoch": 2677} {"train_loss": -12.123664855957031, "global_step": 449775, "epoch": 2677} {"train_loss": -12.26742172241211, "global_step": 449776, "epoch": 2677} {"train_loss": -12.008769989013672, "global_step": 449777, "epoch": 2677} {"train_loss": -11.783674240112305, "global_step": 449778, "epoch": 2677} {"train_loss": -11.403599739074707, "global_step": 449779, "epoch": 2677} {"train_loss": -12.25357723236084, "global_step": 449780, "epoch": 2677} {"train_loss": -11.448007583618164, "global_step": 449781, "epoch": 2677} {"train_loss": -12.270713806152344, "global_step": 449782, "epoch": 2677} {"train_loss": -12.56578540802002, "global_step": 449783, "epoch": 2677} {"train_loss": -12.095279693603516, "global_step": 449784, "epoch": 2677} {"train_loss": -11.763252258300781, "global_step": 449785, "epoch": 2677} {"train_loss": -12.27708911895752, "global_step": 449786, "epoch": 2677} {"train_loss": -11.836811065673828, "global_step": 449787, "epoch": 2677} {"train_loss": -12.39871883392334, "global_step": 449788, "epoch": 2677} {"train_loss": -12.069916725158691, "global_step": 449789, "epoch": 2677} {"train_loss": -12.56513500213623, "global_step": 449790, "epoch": 2677} {"train_loss": -12.13901138305664, "global_step": 449791, "epoch": 2677} {"train_loss": -12.167394638061523, "global_step": 449792, "epoch": 2677} {"train_loss": -12.422927856445312, "global_step": 449793, "epoch": 2677} {"train_loss": -11.946521759033203, "global_step": 449794, "epoch": 2677} {"train_loss": -12.501041412353516, "global_step": 449795, "epoch": 2677} {"train_loss": -12.172914505004883, "global_step": 449796, "epoch": 2677} {"train_loss": -12.572243690490723, "global_step": 449797, "epoch": 2677} {"train_loss": -12.015382766723633, "global_step": 449798, "epoch": 2677} {"train_loss": -12.20094108581543, "global_step": 449799, "epoch": 2677} {"train_loss": -12.451212882995605, "global_step": 449800, "epoch": 2677} {"train_loss": -11.928740501403809, "global_step": 449801, "epoch": 2677} {"train_loss": -12.164932250976562, "global_step": 449802, "epoch": 2677} {"train_loss": -12.2907133102417, "global_step": 449803, "epoch": 2677} {"train_loss": -12.561315536499023, "global_step": 449804, "epoch": 2677} {"train_loss": -12.116510391235352, "global_step": 449805, "epoch": 2677} {"train_loss": -12.62015438079834, "global_step": 449806, "epoch": 2677} {"train_loss": -12.362665176391602, "global_step": 449807, "epoch": 2677} {"train_loss": -12.022747039794922, "global_step": 449808, "epoch": 2677} {"train_loss": -12.448079109191895, "global_step": 449809, "epoch": 2677} {"train_loss": -12.759805679321289, "global_step": 449810, "epoch": 2677} {"train_loss": -12.343490600585938, "global_step": 449811, "epoch": 2677} {"train_loss": -12.67457389831543, "global_step": 449812, "epoch": 2677} {"train_loss": -12.522651672363281, "global_step": 449813, "epoch": 2677} {"train_loss": -12.427262306213379, "global_step": 449814, "epoch": 2677} {"train_loss": -12.675413131713867, "global_step": 449815, "epoch": 2677} {"train_loss": -12.645395278930664, "global_step": 449816, "epoch": 2677} {"train_loss": -12.540332794189453, "global_step": 449817, "epoch": 2677} {"train_loss": -12.044387817382812, "global_step": 449818, "epoch": 2677} {"train_loss": -11.802871704101562, "global_step": 449819, "epoch": 2677} {"train_loss": -12.2201509475708, "global_step": 449820, "epoch": 2677} {"train_loss": -11.70262622833252, "global_step": 449821, "epoch": 2677} {"train_loss": -11.754154205322266, "global_step": 449822, "epoch": 2677} {"train_loss": -11.458637237548828, "global_step": 449823, "epoch": 2677} {"train_loss": -11.281698226928711, "global_step": 449824, "epoch": 2677} {"train_loss": -11.978095054626465, "global_step": 449825, "epoch": 2677} {"train_loss": -12.071995735168457, "global_step": 449826, "epoch": 2677} {"train_loss": -10.5220308303833, "global_step": 449827, "epoch": 2677} {"train_loss": -11.798398971557617, "global_step": 449828, "epoch": 2677} {"train_loss": -11.37447738647461, "global_step": 449829, "epoch": 2677} {"train_loss": -12.08171558380127, "global_step": 449830, "epoch": 2677} {"train_loss": -12.325616836547852, "global_step": 449831, "epoch": 2677} {"train_loss": -12.454805374145508, "global_step": 449832, "epoch": 2677} {"train_loss": -12.019640922546387, "global_step": 449833, "epoch": 2677} {"train_loss": -12.537153244018555, "global_step": 449834, "epoch": 2677} {"train_loss": -12.69151782989502, "global_step": 449835, "epoch": 2677} {"train_loss": -12.581324577331543, "global_step": 449836, "epoch": 2677} {"train_loss": -12.41650390625, "global_step": 449837, "epoch": 2677} {"train_loss": -12.642236709594727, "global_step": 449838, "epoch": 2677} {"train_loss": -12.487157821655273, "global_step": 449839, "epoch": 2677} {"train_loss": -12.38631820678711, "global_step": 449840, "epoch": 2677} {"train_loss": -12.323184967041016, "global_step": 449841, "epoch": 2677} {"train_loss": -12.569607734680176, "global_step": 449842, "epoch": 2677} {"train_loss": -11.801079750061035, "global_step": 449843, "epoch": 2677} {"train_loss": -12.245988845825195, "global_step": 449844, "epoch": 2677} {"train_loss": -12.077289581298828, "global_step": 449845, "epoch": 2677} {"train_loss": -12.520668029785156, "global_step": 449846, "epoch": 2677} {"train_loss": -11.816770553588867, "global_step": 449847, "epoch": 2677} {"train_loss": -12.668327331542969, "global_step": 449848, "epoch": 2677} {"train_loss": -11.561070442199707, "global_step": 449849, "epoch": 2677} {"train_loss": -12.059976577758789, "global_step": 449850, "epoch": 2677} {"train_loss": -12.349056243896484, "global_step": 449851, "epoch": 2677} {"train_loss": -12.204354286193848, "global_step": 449852, "epoch": 2677} {"train_loss": -12.468111991882324, "global_step": 449853, "epoch": 2677} {"train_loss": -12.303500175476074, "global_step": 449854, "epoch": 2677} {"train_loss": -12.328041076660156, "global_step": 449855, "epoch": 2677} {"train_loss": -12.365907669067383, "global_step": 449856, "epoch": 2677} {"train_loss": -12.615283966064453, "global_step": 449857, "epoch": 2677} {"train_loss": -11.920001983642578, "global_step": 449858, "epoch": 2677} {"train_loss": -12.278951644897461, "global_step": 449859, "epoch": 2677} {"train_loss": -11.974759101867676, "global_step": 449860, "epoch": 2677} {"train_loss": -12.503854751586914, "global_step": 449861, "epoch": 2677} {"train_loss": -12.29973030090332, "global_step": 449862, "epoch": 2677} {"train_loss": -12.156283378601074, "global_step": 449863, "epoch": 2677} {"train_loss": -12.384810447692871, "global_step": 449864, "epoch": 2677} {"train_loss": -12.481366157531738, "global_step": 449865, "epoch": 2677} {"train_loss": -12.250194549560547, "global_step": 449866, "epoch": 2677} {"train_loss": -11.970054626464844, "global_step": 449867, "epoch": 2677} {"train_loss": -12.427799224853516, "global_step": 449868, "epoch": 2677} {"train_loss": -12.175060272216797, "global_step": 449869, "epoch": 2677} {"train_loss": -12.210175514221191, "global_step": 449870, "epoch": 2677} {"train_loss": -12.072264671325684, "global_step": 449871, "epoch": 2677} {"train_loss": -12.127830505371094, "global_step": 449872, "epoch": 2677} {"train_loss": -11.503229141235352, "global_step": 449873, "epoch": 2677} {"train_loss": -12.209405899047852, "global_step": 449874, "epoch": 2677} {"train_loss": -11.925271034240723, "global_step": 449875, "epoch": 2677} {"train_loss": -12.376367568969727, "global_step": 449876, "epoch": 2677} {"train_loss": -12.37894058227539, "global_step": 449877, "epoch": 2677} {"train_loss": -12.224088668823242, "global_step": 449878, "epoch": 2677} {"train_loss": -12.18582534790039, "global_step": 449879, "epoch": 2677} {"train_loss": -12.027778625488281, "global_step": 449880, "epoch": 2677} {"train_loss": -12.106181144714355, "global_step": 449881, "epoch": 2677} {"train_loss": -12.00733757019043, "global_step": 449882, "epoch": 2677} {"train_loss": -11.840167999267578, "global_step": 449883, "epoch": 2677} {"train_loss": -11.58694076538086, "global_step": 449884, "epoch": 2677} {"train_loss": -11.87065315246582, "global_step": 449885, "epoch": 2677} {"train_loss": -12.263471603393555, "global_step": 449886, "epoch": 2677} {"train_loss": -12.13774585723877, "global_step": 449887, "epoch": 2677} {"train_loss": -11.459999084472656, "global_step": 449888, "epoch": 2677} {"train_loss": -11.467631340026855, "global_step": 449889, "epoch": 2677} {"train_loss": -11.85750961303711, "global_step": 449890, "epoch": 2677} {"train_loss": -11.791796684265137, "global_step": 449891, "epoch": 2677} {"train_loss": -12.358661651611328, "global_step": 449892, "epoch": 2677} {"train_loss": -11.442442893981934, "global_step": 449893, "epoch": 2677} {"train_loss": -11.789527893066406, "global_step": 449894, "epoch": 2677} {"train_loss": -11.951786041259766, "global_step": 449895, "epoch": 2677} {"train_loss": -11.859663009643555, "global_step": 449896, "epoch": 2677} {"train_loss": -12.172201156616211, "global_step": 449897, "epoch": 2677} {"train_loss": -11.811817169189453, "global_step": 449898, "epoch": 2677} {"train_loss": -11.959858894348145, "global_step": 449899, "epoch": 2677} {"train_loss": -12.440423011779785, "global_step": 449900, "epoch": 2677} {"train_loss": -12.00892448425293, "global_step": 449901, "epoch": 2677} {"train_loss": -12.322433471679688, "global_step": 449902, "epoch": 2677} {"train_loss": -12.057137608528137, "global_step": 449903, "epoch": 2677, "val_loss": 313334.28125} {"train_loss": -11.902588844299316, "global_step": 449904, "epoch": 2678} {"train_loss": -11.785293579101562, "global_step": 449905, "epoch": 2678} {"train_loss": -11.20882797241211, "global_step": 449906, "epoch": 2678} {"train_loss": -12.179408073425293, "global_step": 449907, "epoch": 2678} {"train_loss": -12.027313232421875, "global_step": 449908, "epoch": 2678} {"train_loss": -11.715299606323242, "global_step": 449909, "epoch": 2678} {"train_loss": -12.235027313232422, "global_step": 449910, "epoch": 2678} {"train_loss": -11.97414779663086, "global_step": 449911, "epoch": 2678} {"train_loss": -12.392065048217773, "global_step": 449912, "epoch": 2678} {"train_loss": -12.365470886230469, "global_step": 449913, "epoch": 2678} {"train_loss": -12.470709800720215, "global_step": 449914, "epoch": 2678} {"train_loss": -12.498292922973633, "global_step": 449915, "epoch": 2678} {"train_loss": -12.371152877807617, "global_step": 449916, "epoch": 2678} {"train_loss": -12.702396392822266, "global_step": 449917, "epoch": 2678} {"train_loss": -12.613547325134277, "global_step": 449918, "epoch": 2678} {"train_loss": -12.688247680664062, "global_step": 449919, "epoch": 2678} {"train_loss": -12.629903793334961, "global_step": 449920, "epoch": 2678} {"train_loss": -12.420477867126465, "global_step": 449921, "epoch": 2678} {"train_loss": -12.536301612854004, "global_step": 449922, "epoch": 2678} {"train_loss": -12.44983196258545, "global_step": 449923, "epoch": 2678} {"train_loss": -12.41161060333252, "global_step": 449924, "epoch": 2678} {"train_loss": -12.514225959777832, "global_step": 449925, "epoch": 2678} {"train_loss": -12.56873607635498, "global_step": 449926, "epoch": 2678} {"train_loss": -12.514559745788574, "global_step": 449927, "epoch": 2678} {"train_loss": -12.256105422973633, "global_step": 449928, "epoch": 2678} {"train_loss": -12.710445404052734, "global_step": 449929, "epoch": 2678} {"train_loss": -12.539207458496094, "global_step": 449930, "epoch": 2678} {"train_loss": -12.60096549987793, "global_step": 449931, "epoch": 2678} {"train_loss": -12.263856887817383, "global_step": 449932, "epoch": 2678} {"train_loss": -12.722357749938965, "global_step": 449933, "epoch": 2678} {"train_loss": -12.575448989868164, "global_step": 449934, "epoch": 2678} {"train_loss": -12.200090408325195, "global_step": 449935, "epoch": 2678} {"train_loss": -12.844985961914062, "global_step": 449936, "epoch": 2678} {"train_loss": -12.604681968688965, "global_step": 449937, "epoch": 2678} {"train_loss": -12.50596809387207, "global_step": 449938, "epoch": 2678} {"train_loss": -12.381607055664062, "global_step": 449939, "epoch": 2678} {"train_loss": -12.790416717529297, "global_step": 449940, "epoch": 2678} {"train_loss": -12.663394927978516, "global_step": 449941, "epoch": 2678} {"train_loss": -12.840461730957031, "global_step": 449942, "epoch": 2678} {"train_loss": -12.682979583740234, "global_step": 449943, "epoch": 2678} {"train_loss": -12.94540023803711, "global_step": 449944, "epoch": 2678} {"train_loss": -12.76541519165039, "global_step": 449945, "epoch": 2678} {"train_loss": -12.812114715576172, "global_step": 449946, "epoch": 2678} {"train_loss": -12.681044578552246, "global_step": 449947, "epoch": 2678} {"train_loss": -12.69232177734375, "global_step": 449948, "epoch": 2678} {"train_loss": -12.831972122192383, "global_step": 449949, "epoch": 2678} {"train_loss": -12.499088287353516, "global_step": 449950, "epoch": 2678} {"train_loss": -12.36678695678711, "global_step": 449951, "epoch": 2678} {"train_loss": -11.884882926940918, "global_step": 449952, "epoch": 2678} {"train_loss": -12.68369197845459, "global_step": 449953, "epoch": 2678} {"train_loss": -12.730816841125488, "global_step": 449954, "epoch": 2678} {"train_loss": -12.53193473815918, "global_step": 449955, "epoch": 2678} {"train_loss": -12.434673309326172, "global_step": 449956, "epoch": 2678} {"train_loss": -12.670022964477539, "global_step": 449957, "epoch": 2678} {"train_loss": -12.579961776733398, "global_step": 449958, "epoch": 2678} {"train_loss": -12.631324768066406, "global_step": 449959, "epoch": 2678} {"train_loss": -12.078214645385742, "global_step": 449960, "epoch": 2678} {"train_loss": -12.828737258911133, "global_step": 449961, "epoch": 2678} {"train_loss": -12.40989875793457, "global_step": 449962, "epoch": 2678} {"train_loss": -12.282905578613281, "global_step": 449963, "epoch": 2678} {"train_loss": -12.718704223632812, "global_step": 449964, "epoch": 2678} {"train_loss": -12.624883651733398, "global_step": 449965, "epoch": 2678} {"train_loss": -12.751774787902832, "global_step": 449966, "epoch": 2678} {"train_loss": -12.626930236816406, "global_step": 449967, "epoch": 2678} {"train_loss": -12.619767189025879, "global_step": 449968, "epoch": 2678} {"train_loss": -12.613655090332031, "global_step": 449969, "epoch": 2678} {"train_loss": -12.557212829589844, "global_step": 449970, "epoch": 2678} {"train_loss": -12.87899112701416, "global_step": 449971, "epoch": 2678} {"train_loss": -12.678592681884766, "global_step": 449972, "epoch": 2678} {"train_loss": -12.621042251586914, "global_step": 449973, "epoch": 2678} {"train_loss": -12.556489944458008, "global_step": 449974, "epoch": 2678} {"train_loss": -12.907683372497559, "global_step": 449975, "epoch": 2678} {"train_loss": -12.62739372253418, "global_step": 449976, "epoch": 2678} {"train_loss": -12.725093841552734, "global_step": 449977, "epoch": 2678} {"train_loss": -12.6235933303833, "global_step": 449978, "epoch": 2678} {"train_loss": -12.934286117553711, "global_step": 449979, "epoch": 2678} {"train_loss": -12.880457878112793, "global_step": 449980, "epoch": 2678} {"train_loss": -13.068199157714844, "global_step": 449981, "epoch": 2678} {"train_loss": -12.754631996154785, "global_step": 449982, "epoch": 2678} {"train_loss": -12.877118110656738, "global_step": 449983, "epoch": 2678} {"train_loss": -12.917074203491211, "global_step": 449984, "epoch": 2678} {"train_loss": -12.949895858764648, "global_step": 449985, "epoch": 2678} {"train_loss": -12.753724098205566, "global_step": 449986, "epoch": 2678} {"train_loss": -12.641019821166992, "global_step": 449987, "epoch": 2678} {"train_loss": -12.346349716186523, "global_step": 449988, "epoch": 2678} {"train_loss": -12.838519096374512, "global_step": 449989, "epoch": 2678} {"train_loss": -12.353628158569336, "global_step": 449990, "epoch": 2678} {"train_loss": -12.22793197631836, "global_step": 449991, "epoch": 2678} {"train_loss": -12.31155014038086, "global_step": 449992, "epoch": 2678} {"train_loss": -12.548391342163086, "global_step": 449993, "epoch": 2678} {"train_loss": -12.077552795410156, "global_step": 449994, "epoch": 2678} {"train_loss": -12.04434585571289, "global_step": 449995, "epoch": 2678} {"train_loss": -11.427227020263672, "global_step": 449996, "epoch": 2678} {"train_loss": -11.09118938446045, "global_step": 449997, "epoch": 2678} {"train_loss": -9.605499267578125, "global_step": 449998, "epoch": 2678} {"train_loss": -10.427078247070312, "global_step": 449999, "epoch": 2678} {"train_loss": -11.179841995239258, "global_step": 450000, "epoch": 2678} {"train_loss": -8.823944091796875, "global_step": 450001, "epoch": 2678} {"train_loss": -8.762420654296875, "global_step": 450002, "epoch": 2678} {"train_loss": -11.11011791229248, "global_step": 450003, "epoch": 2678} {"train_loss": -8.46668815612793, "global_step": 450004, "epoch": 2678} {"train_loss": -9.299186706542969, "global_step": 450005, "epoch": 2678} {"train_loss": -8.475700378417969, "global_step": 450006, "epoch": 2678} {"train_loss": -9.186007499694824, "global_step": 450007, "epoch": 2678} {"train_loss": -9.723237991333008, "global_step": 450008, "epoch": 2678} {"train_loss": -9.933037757873535, "global_step": 450009, "epoch": 2678} {"train_loss": -9.75112533569336, "global_step": 450010, "epoch": 2678} {"train_loss": -8.402158737182617, "global_step": 450011, "epoch": 2678} {"train_loss": -10.887752532958984, "global_step": 450012, "epoch": 2678} {"train_loss": -10.070588111877441, "global_step": 450013, "epoch": 2678} {"train_loss": -10.097040176391602, "global_step": 450014, "epoch": 2678} {"train_loss": -9.971088409423828, "global_step": 450015, "epoch": 2678} {"train_loss": -10.322122573852539, "global_step": 450016, "epoch": 2678} {"train_loss": -10.429302215576172, "global_step": 450017, "epoch": 2678} {"train_loss": -10.322895050048828, "global_step": 450018, "epoch": 2678} {"train_loss": -10.312646865844727, "global_step": 450019, "epoch": 2678} {"train_loss": -11.221879959106445, "global_step": 450020, "epoch": 2678} {"train_loss": -10.84056282043457, "global_step": 450021, "epoch": 2678} {"train_loss": -10.501436233520508, "global_step": 450022, "epoch": 2678} {"train_loss": -11.140609741210938, "global_step": 450023, "epoch": 2678} {"train_loss": -10.74669361114502, "global_step": 450024, "epoch": 2678} {"train_loss": -10.70442008972168, "global_step": 450025, "epoch": 2678} {"train_loss": -10.859155654907227, "global_step": 450026, "epoch": 2678} {"train_loss": -11.360983848571777, "global_step": 450027, "epoch": 2678} {"train_loss": -10.967194557189941, "global_step": 450028, "epoch": 2678} {"train_loss": -11.36928653717041, "global_step": 450029, "epoch": 2678} {"train_loss": -11.448663711547852, "global_step": 450030, "epoch": 2678} {"train_loss": -11.366704940795898, "global_step": 450031, "epoch": 2678} {"train_loss": -11.476648330688477, "global_step": 450032, "epoch": 2678} {"train_loss": -11.583650588989258, "global_step": 450033, "epoch": 2678} {"train_loss": -11.074236869812012, "global_step": 450034, "epoch": 2678} {"train_loss": -12.064178466796875, "global_step": 450035, "epoch": 2678} {"train_loss": -11.30931568145752, "global_step": 450036, "epoch": 2678} {"train_loss": -11.869421005249023, "global_step": 450037, "epoch": 2678} {"train_loss": -11.99260139465332, "global_step": 450038, "epoch": 2678} {"train_loss": -11.420633316040039, "global_step": 450039, "epoch": 2678} {"train_loss": -11.887510299682617, "global_step": 450040, "epoch": 2678} {"train_loss": -11.827278137207031, "global_step": 450041, "epoch": 2678} {"train_loss": -12.063225746154785, "global_step": 450042, "epoch": 2678} {"train_loss": -11.873578071594238, "global_step": 450043, "epoch": 2678} {"train_loss": -11.882917404174805, "global_step": 450044, "epoch": 2678} {"train_loss": -11.746124267578125, "global_step": 450045, "epoch": 2678} {"train_loss": -11.854509353637695, "global_step": 450046, "epoch": 2678} {"train_loss": -12.18985366821289, "global_step": 450047, "epoch": 2678} {"train_loss": -12.220163345336914, "global_step": 450048, "epoch": 2678} {"train_loss": -11.971982955932617, "global_step": 450049, "epoch": 2678} {"train_loss": -12.364383697509766, "global_step": 450050, "epoch": 2678} {"train_loss": -12.097204208374023, "global_step": 450051, "epoch": 2678} {"train_loss": -12.453073501586914, "global_step": 450052, "epoch": 2678} {"train_loss": -12.206766128540039, "global_step": 450053, "epoch": 2678} {"train_loss": -12.458641052246094, "global_step": 450054, "epoch": 2678} {"train_loss": -12.098733901977539, "global_step": 450055, "epoch": 2678} {"train_loss": -12.514200210571289, "global_step": 450056, "epoch": 2678} {"train_loss": -12.139952659606934, "global_step": 450057, "epoch": 2678} {"train_loss": -12.358409881591797, "global_step": 450058, "epoch": 2678} {"train_loss": -12.207978248596191, "global_step": 450059, "epoch": 2678} {"train_loss": -12.669326782226562, "global_step": 450060, "epoch": 2678} {"train_loss": -12.502639770507812, "global_step": 450061, "epoch": 2678} {"train_loss": -12.624103546142578, "global_step": 450062, "epoch": 2678} {"train_loss": -12.269257545471191, "global_step": 450063, "epoch": 2678} {"train_loss": -12.532058715820312, "global_step": 450064, "epoch": 2678} {"train_loss": -12.38804817199707, "global_step": 450065, "epoch": 2678} {"train_loss": -12.562448501586914, "global_step": 450066, "epoch": 2678} {"train_loss": -12.505290985107422, "global_step": 450067, "epoch": 2678} {"train_loss": -12.437214851379395, "global_step": 450068, "epoch": 2678} {"train_loss": -12.743620872497559, "global_step": 450069, "epoch": 2678} {"train_loss": -12.580009460449219, "global_step": 450070, "epoch": 2678} {"train_loss": -11.95671352318355, "global_step": 450071, "epoch": 2678, "val_loss": 314270.28125} {"train_loss": -12.684160232543945, "global_step": 450072, "epoch": 2679} {"train_loss": -12.600704193115234, "global_step": 450073, "epoch": 2679} {"train_loss": -12.692683219909668, "global_step": 450074, "epoch": 2679} {"train_loss": -12.472143173217773, "global_step": 450075, "epoch": 2679} {"train_loss": -12.564889907836914, "global_step": 450076, "epoch": 2679} {"train_loss": -12.659221649169922, "global_step": 450077, "epoch": 2679} {"train_loss": -12.651668548583984, "global_step": 450078, "epoch": 2679} {"train_loss": -12.626070022583008, "global_step": 450079, "epoch": 2679} {"train_loss": -12.759416580200195, "global_step": 450080, "epoch": 2679} {"train_loss": -12.630561828613281, "global_step": 450081, "epoch": 2679} {"train_loss": -12.888252258300781, "global_step": 450082, "epoch": 2679} {"train_loss": -12.762491226196289, "global_step": 450083, "epoch": 2679} {"train_loss": -12.542622566223145, "global_step": 450084, "epoch": 2679} {"train_loss": -12.800539016723633, "global_step": 450085, "epoch": 2679} {"train_loss": -12.7100248336792, "global_step": 450086, "epoch": 2679} {"train_loss": -12.687870979309082, "global_step": 450087, "epoch": 2679} {"train_loss": -12.801329612731934, "global_step": 450088, "epoch": 2679} {"train_loss": -12.768320083618164, "global_step": 450089, "epoch": 2679} {"train_loss": -12.693979263305664, "global_step": 450090, "epoch": 2679} {"train_loss": -12.770345687866211, "global_step": 450091, "epoch": 2679} {"train_loss": -12.92254638671875, "global_step": 450092, "epoch": 2679} {"train_loss": -12.820779800415039, "global_step": 450093, "epoch": 2679} {"train_loss": -12.790148735046387, "global_step": 450094, "epoch": 2679} {"train_loss": -12.58682918548584, "global_step": 450095, "epoch": 2679} {"train_loss": -12.884260177612305, "global_step": 450096, "epoch": 2679} {"train_loss": -11.772870063781738, "global_step": 450097, "epoch": 2679} {"train_loss": -12.739259719848633, "global_step": 450098, "epoch": 2679} {"train_loss": -12.40254020690918, "global_step": 450099, "epoch": 2679} {"train_loss": -12.53575611114502, "global_step": 450100, "epoch": 2679} {"train_loss": -12.687897682189941, "global_step": 450101, "epoch": 2679} {"train_loss": -12.17956829071045, "global_step": 450102, "epoch": 2679} {"train_loss": -12.392881393432617, "global_step": 450103, "epoch": 2679} {"train_loss": -12.435125350952148, "global_step": 450104, "epoch": 2679} {"train_loss": -11.764832496643066, "global_step": 450105, "epoch": 2679} {"train_loss": -12.039437294006348, "global_step": 450106, "epoch": 2679} {"train_loss": -11.823492050170898, "global_step": 450107, "epoch": 2679} {"train_loss": -12.607879638671875, "global_step": 450108, "epoch": 2679} {"train_loss": -11.558820724487305, "global_step": 450109, "epoch": 2679} {"train_loss": -12.337035179138184, "global_step": 450110, "epoch": 2679} {"train_loss": -10.745768547058105, "global_step": 450111, "epoch": 2679} {"train_loss": -12.409385681152344, "global_step": 450112, "epoch": 2679} {"train_loss": -11.975525856018066, "global_step": 450113, "epoch": 2679} {"train_loss": -12.218217849731445, "global_step": 450114, "epoch": 2679} {"train_loss": -12.077951431274414, "global_step": 450115, "epoch": 2679} {"train_loss": -12.29992389678955, "global_step": 450116, "epoch": 2679} {"train_loss": -11.912725448608398, "global_step": 450117, "epoch": 2679} {"train_loss": -12.00163745880127, "global_step": 450118, "epoch": 2679} {"train_loss": -12.375296592712402, "global_step": 450119, "epoch": 2679} {"train_loss": -12.13228702545166, "global_step": 450120, "epoch": 2679} {"train_loss": -12.327308654785156, "global_step": 450121, "epoch": 2679} {"train_loss": -11.616819381713867, "global_step": 450122, "epoch": 2679} {"train_loss": -12.605291366577148, "global_step": 450123, "epoch": 2679} {"train_loss": -11.828958511352539, "global_step": 450124, "epoch": 2679} {"train_loss": -12.682781219482422, "global_step": 450125, "epoch": 2679} {"train_loss": -11.93349838256836, "global_step": 450126, "epoch": 2679} {"train_loss": -12.24156665802002, "global_step": 450127, "epoch": 2679} {"train_loss": -12.374517440795898, "global_step": 450128, "epoch": 2679} {"train_loss": -11.886028289794922, "global_step": 450129, "epoch": 2679} {"train_loss": -12.670951843261719, "global_step": 450130, "epoch": 2679} {"train_loss": -12.314964294433594, "global_step": 450131, "epoch": 2679} {"train_loss": -12.349547386169434, "global_step": 450132, "epoch": 2679} {"train_loss": -12.685672760009766, "global_step": 450133, "epoch": 2679} {"train_loss": -12.054628372192383, "global_step": 450134, "epoch": 2679} {"train_loss": -12.365631103515625, "global_step": 450135, "epoch": 2679} {"train_loss": -12.336010932922363, "global_step": 450136, "epoch": 2679} {"train_loss": -12.575498580932617, "global_step": 450137, "epoch": 2679} {"train_loss": -12.564849853515625, "global_step": 450138, "epoch": 2679} {"train_loss": -12.539911270141602, "global_step": 450139, "epoch": 2679} {"train_loss": -12.303295135498047, "global_step": 450140, "epoch": 2679} {"train_loss": -12.45156192779541, "global_step": 450141, "epoch": 2679} {"train_loss": -12.429341316223145, "global_step": 450142, "epoch": 2679} {"train_loss": -12.650197982788086, "global_step": 450143, "epoch": 2679} {"train_loss": -12.401420593261719, "global_step": 450144, "epoch": 2679} {"train_loss": -12.303337097167969, "global_step": 450145, "epoch": 2679} {"train_loss": -12.616127014160156, "global_step": 450146, "epoch": 2679} {"train_loss": -12.475574493408203, "global_step": 450147, "epoch": 2679} {"train_loss": -12.540664672851562, "global_step": 450148, "epoch": 2679} {"train_loss": -13.0128812789917, "global_step": 450149, "epoch": 2679} {"train_loss": -12.526522636413574, "global_step": 450150, "epoch": 2679} {"train_loss": -12.461109161376953, "global_step": 450151, "epoch": 2679} {"train_loss": -12.533221244812012, "global_step": 450152, "epoch": 2679} {"train_loss": -12.338645935058594, "global_step": 450153, "epoch": 2679} {"train_loss": -12.689613342285156, "global_step": 450154, "epoch": 2679} {"train_loss": -12.583452224731445, "global_step": 450155, "epoch": 2679} {"train_loss": -12.534855842590332, "global_step": 450156, "epoch": 2679} {"train_loss": -12.645210266113281, "global_step": 450157, "epoch": 2679} {"train_loss": -12.266736030578613, "global_step": 450158, "epoch": 2679} {"train_loss": -12.596534729003906, "global_step": 450159, "epoch": 2679} {"train_loss": -12.349258422851562, "global_step": 450160, "epoch": 2679} {"train_loss": -12.737154960632324, "global_step": 450161, "epoch": 2679} {"train_loss": -12.509098052978516, "global_step": 450162, "epoch": 2679} {"train_loss": -12.796545028686523, "global_step": 450163, "epoch": 2679} {"train_loss": -12.65988540649414, "global_step": 450164, "epoch": 2679} {"train_loss": -12.525470733642578, "global_step": 450165, "epoch": 2679} {"train_loss": -12.516149520874023, "global_step": 450166, "epoch": 2679} {"train_loss": -12.455228805541992, "global_step": 450167, "epoch": 2679} {"train_loss": -12.074211120605469, "global_step": 450168, "epoch": 2679} {"train_loss": -12.924150466918945, "global_step": 450169, "epoch": 2679} {"train_loss": -12.34353256225586, "global_step": 450170, "epoch": 2679} {"train_loss": -12.292856216430664, "global_step": 450171, "epoch": 2679} {"train_loss": -12.384827613830566, "global_step": 450172, "epoch": 2679} {"train_loss": -12.625619888305664, "global_step": 450173, "epoch": 2679} {"train_loss": -11.684240341186523, "global_step": 450174, "epoch": 2679} {"train_loss": -12.062141418457031, "global_step": 450175, "epoch": 2679} {"train_loss": -12.786327362060547, "global_step": 450176, "epoch": 2679} {"train_loss": -12.011783599853516, "global_step": 450177, "epoch": 2679} {"train_loss": -11.610159873962402, "global_step": 450178, "epoch": 2679} {"train_loss": -12.810784339904785, "global_step": 450179, "epoch": 2679} {"train_loss": -12.058084487915039, "global_step": 450180, "epoch": 2679} {"train_loss": -11.656089782714844, "global_step": 450181, "epoch": 2679} {"train_loss": -12.522558212280273, "global_step": 450182, "epoch": 2679} {"train_loss": -12.443683624267578, "global_step": 450183, "epoch": 2679} {"train_loss": -11.556406021118164, "global_step": 450184, "epoch": 2679} {"train_loss": -12.424339294433594, "global_step": 450185, "epoch": 2679} {"train_loss": -12.539904594421387, "global_step": 450186, "epoch": 2679} {"train_loss": -12.224115371704102, "global_step": 450187, "epoch": 2679} {"train_loss": -12.65994644165039, "global_step": 450188, "epoch": 2679} {"train_loss": -12.760730743408203, "global_step": 450189, "epoch": 2679} {"train_loss": -12.00397777557373, "global_step": 450190, "epoch": 2679} {"train_loss": -11.93160629272461, "global_step": 450191, "epoch": 2679} {"train_loss": -12.285240173339844, "global_step": 450192, "epoch": 2679} {"train_loss": -12.36839485168457, "global_step": 450193, "epoch": 2679} {"train_loss": -11.607136726379395, "global_step": 450194, "epoch": 2679} {"train_loss": -11.925838470458984, "global_step": 450195, "epoch": 2679} {"train_loss": -12.114767074584961, "global_step": 450196, "epoch": 2679} {"train_loss": -11.571327209472656, "global_step": 450197, "epoch": 2679} {"train_loss": -11.017147064208984, "global_step": 450198, "epoch": 2679} {"train_loss": -11.207657814025879, "global_step": 450199, "epoch": 2679} {"train_loss": -11.516955375671387, "global_step": 450200, "epoch": 2679} {"train_loss": -10.525739669799805, "global_step": 450201, "epoch": 2679} {"train_loss": -12.005425453186035, "global_step": 450202, "epoch": 2679} {"train_loss": -11.664874076843262, "global_step": 450203, "epoch": 2679} {"train_loss": -11.258115768432617, "global_step": 450204, "epoch": 2679} {"train_loss": -12.375679016113281, "global_step": 450205, "epoch": 2679} {"train_loss": -11.357336044311523, "global_step": 450206, "epoch": 2679} {"train_loss": -11.99083137512207, "global_step": 450207, "epoch": 2679} {"train_loss": -11.26681900024414, "global_step": 450208, "epoch": 2679} {"train_loss": -12.135663986206055, "global_step": 450209, "epoch": 2679} {"train_loss": -11.615459442138672, "global_step": 450210, "epoch": 2679} {"train_loss": -11.820257186889648, "global_step": 450211, "epoch": 2679} {"train_loss": -11.77393913269043, "global_step": 450212, "epoch": 2679} {"train_loss": -11.410421371459961, "global_step": 450213, "epoch": 2679} {"train_loss": -12.158112525939941, "global_step": 450214, "epoch": 2679} {"train_loss": -11.286020278930664, "global_step": 450215, "epoch": 2679} {"train_loss": -11.479080200195312, "global_step": 450216, "epoch": 2679} {"train_loss": -12.055133819580078, "global_step": 450217, "epoch": 2679} {"train_loss": -11.706096649169922, "global_step": 450218, "epoch": 2679} {"train_loss": -12.13919448852539, "global_step": 450219, "epoch": 2679} {"train_loss": -11.492593765258789, "global_step": 450220, "epoch": 2679} {"train_loss": -11.86788272857666, "global_step": 450221, "epoch": 2679} {"train_loss": -11.124893188476562, "global_step": 450222, "epoch": 2679} {"train_loss": -11.79678726196289, "global_step": 450223, "epoch": 2679} {"train_loss": -12.005620956420898, "global_step": 450224, "epoch": 2679} {"train_loss": -11.43313217163086, "global_step": 450225, "epoch": 2679} {"train_loss": -11.718568801879883, "global_step": 450226, "epoch": 2679} {"train_loss": -11.438592910766602, "global_step": 450227, "epoch": 2679} {"train_loss": -12.189445495605469, "global_step": 450228, "epoch": 2679} {"train_loss": -11.907916069030762, "global_step": 450229, "epoch": 2679} {"train_loss": -12.380756378173828, "global_step": 450230, "epoch": 2679} {"train_loss": -11.822320938110352, "global_step": 450231, "epoch": 2679} {"train_loss": -12.342018127441406, "global_step": 450232, "epoch": 2679} {"train_loss": -12.308090209960938, "global_step": 450233, "epoch": 2679} {"train_loss": -12.192216873168945, "global_step": 450234, "epoch": 2679} {"train_loss": -12.400749206542969, "global_step": 450235, "epoch": 2679} {"train_loss": -12.401565551757812, "global_step": 450236, "epoch": 2679} {"train_loss": -12.34078598022461, "global_step": 450237, "epoch": 2679} {"train_loss": -12.374523162841797, "global_step": 450238, "epoch": 2679} {"train_loss": -12.237799604733786, "global_step": 450239, "epoch": 2679, "val_loss": 314937.125} {"train_loss": -12.062601089477539, "global_step": 450240, "epoch": 2680} {"train_loss": -12.451960563659668, "global_step": 450241, "epoch": 2680} {"train_loss": -12.448867797851562, "global_step": 450242, "epoch": 2680} {"train_loss": -12.346470832824707, "global_step": 450243, "epoch": 2680} {"train_loss": -12.008064270019531, "global_step": 450244, "epoch": 2680} {"train_loss": -11.734212875366211, "global_step": 450245, "epoch": 2680} {"train_loss": -12.840736389160156, "global_step": 450246, "epoch": 2680} {"train_loss": -12.010480880737305, "global_step": 450247, "epoch": 2680} {"train_loss": -12.112564086914062, "global_step": 450248, "epoch": 2680} {"train_loss": -12.463427543640137, "global_step": 450249, "epoch": 2680} {"train_loss": -11.846373558044434, "global_step": 450250, "epoch": 2680} {"train_loss": -11.93669319152832, "global_step": 450251, "epoch": 2680} {"train_loss": -12.628320693969727, "global_step": 450252, "epoch": 2680} {"train_loss": -12.035871505737305, "global_step": 450253, "epoch": 2680} {"train_loss": -12.1929292678833, "global_step": 450254, "epoch": 2680} {"train_loss": -12.343740463256836, "global_step": 450255, "epoch": 2680} {"train_loss": -12.220523834228516, "global_step": 450256, "epoch": 2680} {"train_loss": -12.210053443908691, "global_step": 450257, "epoch": 2680} {"train_loss": -12.52927303314209, "global_step": 450258, "epoch": 2680} {"train_loss": -11.728595733642578, "global_step": 450259, "epoch": 2680} {"train_loss": -11.399971008300781, "global_step": 450260, "epoch": 2680} {"train_loss": -12.68994426727295, "global_step": 450261, "epoch": 2680} {"train_loss": -12.064549446105957, "global_step": 450262, "epoch": 2680} {"train_loss": -12.373870849609375, "global_step": 450263, "epoch": 2680} {"train_loss": -12.361828804016113, "global_step": 450264, "epoch": 2680} {"train_loss": -12.508495330810547, "global_step": 450265, "epoch": 2680} {"train_loss": -12.634917259216309, "global_step": 450266, "epoch": 2680} {"train_loss": -12.610803604125977, "global_step": 450267, "epoch": 2680} {"train_loss": -12.707538604736328, "global_step": 450268, "epoch": 2680} {"train_loss": -12.677001953125, "global_step": 450269, "epoch": 2680} {"train_loss": -12.634941101074219, "global_step": 450270, "epoch": 2680} {"train_loss": -12.706607818603516, "global_step": 450271, "epoch": 2680} {"train_loss": -12.606517791748047, "global_step": 450272, "epoch": 2680} {"train_loss": -12.707270622253418, "global_step": 450273, "epoch": 2680} {"train_loss": -12.851272583007812, "global_step": 450274, "epoch": 2680} {"train_loss": -12.468191146850586, "global_step": 450275, "epoch": 2680} {"train_loss": -12.608060836791992, "global_step": 450276, "epoch": 2680} {"train_loss": -12.708355903625488, "global_step": 450277, "epoch": 2680} {"train_loss": -12.734834671020508, "global_step": 450278, "epoch": 2680} {"train_loss": -12.691360473632812, "global_step": 450279, "epoch": 2680} {"train_loss": -12.772735595703125, "global_step": 450280, "epoch": 2680} {"train_loss": -12.928735733032227, "global_step": 450281, "epoch": 2680} {"train_loss": -12.8480224609375, "global_step": 450282, "epoch": 2680} {"train_loss": -12.841915130615234, "global_step": 450283, "epoch": 2680} {"train_loss": -12.794073104858398, "global_step": 450284, "epoch": 2680} {"train_loss": -12.626863479614258, "global_step": 450285, "epoch": 2680} {"train_loss": -12.867995262145996, "global_step": 450286, "epoch": 2680} {"train_loss": -12.624521255493164, "global_step": 450287, "epoch": 2680} {"train_loss": -12.454748153686523, "global_step": 450288, "epoch": 2680} {"train_loss": -12.165199279785156, "global_step": 450289, "epoch": 2680} {"train_loss": -12.815381050109863, "global_step": 450290, "epoch": 2680} {"train_loss": -12.277262687683105, "global_step": 450291, "epoch": 2680} {"train_loss": -12.739237785339355, "global_step": 450292, "epoch": 2680} {"train_loss": -12.08662223815918, "global_step": 450293, "epoch": 2680} {"train_loss": -12.264469146728516, "global_step": 450294, "epoch": 2680} {"train_loss": -12.376007080078125, "global_step": 450295, "epoch": 2680} {"train_loss": -12.288432121276855, "global_step": 450296, "epoch": 2680} {"train_loss": -12.368717193603516, "global_step": 450297, "epoch": 2680} {"train_loss": -12.237739562988281, "global_step": 450298, "epoch": 2680} {"train_loss": -12.65110969543457, "global_step": 450299, "epoch": 2680} {"train_loss": -12.483062744140625, "global_step": 450300, "epoch": 2680} {"train_loss": -12.480581283569336, "global_step": 450301, "epoch": 2680} {"train_loss": -12.406426429748535, "global_step": 450302, "epoch": 2680} {"train_loss": -12.473379135131836, "global_step": 450303, "epoch": 2680} {"train_loss": -12.54279613494873, "global_step": 450304, "epoch": 2680} {"train_loss": -12.134138107299805, "global_step": 450305, "epoch": 2680} {"train_loss": -12.864462852478027, "global_step": 450306, "epoch": 2680} {"train_loss": -11.98560905456543, "global_step": 450307, "epoch": 2680} {"train_loss": -12.198066711425781, "global_step": 450308, "epoch": 2680} {"train_loss": -11.76787281036377, "global_step": 450309, "epoch": 2680} {"train_loss": -12.407451629638672, "global_step": 450310, "epoch": 2680} {"train_loss": -11.738720893859863, "global_step": 450311, "epoch": 2680} {"train_loss": -11.094499588012695, "global_step": 450312, "epoch": 2680} {"train_loss": -12.189313888549805, "global_step": 450313, "epoch": 2680} {"train_loss": -11.4962739944458, "global_step": 450314, "epoch": 2680} {"train_loss": -11.522087097167969, "global_step": 450315, "epoch": 2680} {"train_loss": -12.357378005981445, "global_step": 450316, "epoch": 2680} {"train_loss": -10.850323677062988, "global_step": 450317, "epoch": 2680} {"train_loss": -11.249713897705078, "global_step": 450318, "epoch": 2680} {"train_loss": -12.037765502929688, "global_step": 450319, "epoch": 2680} {"train_loss": -12.124967575073242, "global_step": 450320, "epoch": 2680} {"train_loss": -11.256500244140625, "global_step": 450321, "epoch": 2680} {"train_loss": -12.217880249023438, "global_step": 450322, "epoch": 2680} {"train_loss": -11.399210929870605, "global_step": 450323, "epoch": 2680} {"train_loss": -12.013230323791504, "global_step": 450324, "epoch": 2680} {"train_loss": -11.770448684692383, "global_step": 450325, "epoch": 2680} {"train_loss": -10.77329158782959, "global_step": 450326, "epoch": 2680} {"train_loss": -11.087841033935547, "global_step": 450327, "epoch": 2680} {"train_loss": -12.002420425415039, "global_step": 450328, "epoch": 2680} {"train_loss": -10.11957836151123, "global_step": 450329, "epoch": 2680} {"train_loss": -11.551111221313477, "global_step": 450330, "epoch": 2680} {"train_loss": -9.750438690185547, "global_step": 450331, "epoch": 2680} {"train_loss": -11.32894515991211, "global_step": 450332, "epoch": 2680} {"train_loss": -11.405132293701172, "global_step": 450333, "epoch": 2680} {"train_loss": -10.508038520812988, "global_step": 450334, "epoch": 2680} {"train_loss": -10.476055145263672, "global_step": 450335, "epoch": 2680} {"train_loss": -10.365764617919922, "global_step": 450336, "epoch": 2680} {"train_loss": -10.997591018676758, "global_step": 450337, "epoch": 2680} {"train_loss": -9.987663269042969, "global_step": 450338, "epoch": 2680} {"train_loss": -10.478399276733398, "global_step": 450339, "epoch": 2680} {"train_loss": -9.573097229003906, "global_step": 450340, "epoch": 2680} {"train_loss": -11.384003639221191, "global_step": 450341, "epoch": 2680} {"train_loss": -9.362004280090332, "global_step": 450342, "epoch": 2680} {"train_loss": -10.58670425415039, "global_step": 450343, "epoch": 2680} {"train_loss": -10.91748046875, "global_step": 450344, "epoch": 2680} {"train_loss": -11.176231384277344, "global_step": 450345, "epoch": 2680} {"train_loss": -10.715644836425781, "global_step": 450346, "epoch": 2680} {"train_loss": -12.16295051574707, "global_step": 450347, "epoch": 2680} {"train_loss": -10.76254653930664, "global_step": 450348, "epoch": 2680} {"train_loss": -11.287708282470703, "global_step": 450349, "epoch": 2680} {"train_loss": -11.66623592376709, "global_step": 450350, "epoch": 2680} {"train_loss": -10.717658996582031, "global_step": 450351, "epoch": 2680} {"train_loss": -12.269987106323242, "global_step": 450352, "epoch": 2680} {"train_loss": -11.434593200683594, "global_step": 450353, "epoch": 2680} {"train_loss": -11.735335350036621, "global_step": 450354, "epoch": 2680} {"train_loss": -11.332477569580078, "global_step": 450355, "epoch": 2680} {"train_loss": -11.077108383178711, "global_step": 450356, "epoch": 2680} {"train_loss": -11.767475128173828, "global_step": 450357, "epoch": 2680} {"train_loss": -11.701133728027344, "global_step": 450358, "epoch": 2680} {"train_loss": -11.88265609741211, "global_step": 450359, "epoch": 2680} {"train_loss": -12.236028671264648, "global_step": 450360, "epoch": 2680} {"train_loss": -11.9413423538208, "global_step": 450361, "epoch": 2680} {"train_loss": -12.047056198120117, "global_step": 450362, "epoch": 2680} {"train_loss": -12.153221130371094, "global_step": 450363, "epoch": 2680} {"train_loss": -12.221226692199707, "global_step": 450364, "epoch": 2680} {"train_loss": -12.018144607543945, "global_step": 450365, "epoch": 2680} {"train_loss": -11.885357856750488, "global_step": 450366, "epoch": 2680} {"train_loss": -12.180728912353516, "global_step": 450367, "epoch": 2680} {"train_loss": -12.211344718933105, "global_step": 450368, "epoch": 2680} {"train_loss": -11.985158920288086, "global_step": 450369, "epoch": 2680} {"train_loss": -12.2655668258667, "global_step": 450370, "epoch": 2680} {"train_loss": -12.228031158447266, "global_step": 450371, "epoch": 2680} {"train_loss": -12.279706954956055, "global_step": 450372, "epoch": 2680} {"train_loss": -12.533246040344238, "global_step": 450373, "epoch": 2680} {"train_loss": -12.34503173828125, "global_step": 450374, "epoch": 2680} {"train_loss": -12.191499710083008, "global_step": 450375, "epoch": 2680} {"train_loss": -12.506734848022461, "global_step": 450376, "epoch": 2680} {"train_loss": -12.29681396484375, "global_step": 450377, "epoch": 2680} {"train_loss": -12.387273788452148, "global_step": 450378, "epoch": 2680} {"train_loss": -12.44609260559082, "global_step": 450379, "epoch": 2680} {"train_loss": -12.608981132507324, "global_step": 450380, "epoch": 2680} {"train_loss": -12.392032623291016, "global_step": 450381, "epoch": 2680} {"train_loss": -12.443450927734375, "global_step": 450382, "epoch": 2680} {"train_loss": -12.549802780151367, "global_step": 450383, "epoch": 2680} {"train_loss": -12.429011344909668, "global_step": 450384, "epoch": 2680} {"train_loss": -12.453282356262207, "global_step": 450385, "epoch": 2680} {"train_loss": -12.599968910217285, "global_step": 450386, "epoch": 2680} {"train_loss": -12.515830993652344, "global_step": 450387, "epoch": 2680} {"train_loss": -12.681171417236328, "global_step": 450388, "epoch": 2680} {"train_loss": -12.66408920288086, "global_step": 450389, "epoch": 2680} {"train_loss": -12.639959335327148, "global_step": 450390, "epoch": 2680} {"train_loss": -12.455519676208496, "global_step": 450391, "epoch": 2680} {"train_loss": -12.50076675415039, "global_step": 450392, "epoch": 2680} {"train_loss": -12.677722930908203, "global_step": 450393, "epoch": 2680} {"train_loss": -12.553529739379883, "global_step": 450394, "epoch": 2680} {"train_loss": -12.74306583404541, "global_step": 450395, "epoch": 2680} {"train_loss": -12.661794662475586, "global_step": 450396, "epoch": 2680} {"train_loss": -12.693683624267578, "global_step": 450397, "epoch": 2680} {"train_loss": -12.66195297241211, "global_step": 450398, "epoch": 2680} {"train_loss": -12.76626968383789, "global_step": 450399, "epoch": 2680} {"train_loss": -12.671416282653809, "global_step": 450400, "epoch": 2680} {"train_loss": -12.704366683959961, "global_step": 450401, "epoch": 2680} {"train_loss": -12.663690567016602, "global_step": 450402, "epoch": 2680} {"train_loss": -12.662355422973633, "global_step": 450403, "epoch": 2680} {"train_loss": -12.859321594238281, "global_step": 450404, "epoch": 2680} {"train_loss": -12.715627670288086, "global_step": 450405, "epoch": 2680} {"train_loss": -12.936342239379883, "global_step": 450406, "epoch": 2680} {"train_loss": -12.079316945303054, "global_step": 450407, "epoch": 2680, "val_loss": 311779.875, "train_action_mse_error": 1.2188512086868286} {"train_loss": -12.555859565734863, "global_step": 450408, "epoch": 2681} {"train_loss": -12.862020492553711, "global_step": 450409, "epoch": 2681} {"train_loss": -12.829018592834473, "global_step": 450410, "epoch": 2681} {"train_loss": -12.611984252929688, "global_step": 450411, "epoch": 2681} {"train_loss": -12.548198699951172, "global_step": 450412, "epoch": 2681} {"train_loss": -12.877335548400879, "global_step": 450413, "epoch": 2681} {"train_loss": -12.706664085388184, "global_step": 450414, "epoch": 2681} {"train_loss": -12.854369163513184, "global_step": 450415, "epoch": 2681} {"train_loss": -12.774134635925293, "global_step": 450416, "epoch": 2681} {"train_loss": -12.746357917785645, "global_step": 450417, "epoch": 2681} {"train_loss": -12.680305480957031, "global_step": 450418, "epoch": 2681} {"train_loss": -12.722858428955078, "global_step": 450419, "epoch": 2681} {"train_loss": -12.889999389648438, "global_step": 450420, "epoch": 2681} {"train_loss": -12.931246757507324, "global_step": 450421, "epoch": 2681} {"train_loss": -12.83719253540039, "global_step": 450422, "epoch": 2681} {"train_loss": -12.701713562011719, "global_step": 450423, "epoch": 2681} {"train_loss": -12.991864204406738, "global_step": 450424, "epoch": 2681} {"train_loss": -12.84339714050293, "global_step": 450425, "epoch": 2681} {"train_loss": -12.844467163085938, "global_step": 450426, "epoch": 2681} {"train_loss": -12.89879322052002, "global_step": 450427, "epoch": 2681} {"train_loss": -12.990621566772461, "global_step": 450428, "epoch": 2681} {"train_loss": -12.773868560791016, "global_step": 450429, "epoch": 2681} {"train_loss": -12.890332221984863, "global_step": 450430, "epoch": 2681} {"train_loss": -12.578913688659668, "global_step": 450431, "epoch": 2681} {"train_loss": -12.506556510925293, "global_step": 450432, "epoch": 2681} {"train_loss": -12.958548545837402, "global_step": 450433, "epoch": 2681} {"train_loss": -12.708853721618652, "global_step": 450434, "epoch": 2681} {"train_loss": -13.060510635375977, "global_step": 450435, "epoch": 2681} {"train_loss": -12.866043090820312, "global_step": 450436, "epoch": 2681} {"train_loss": -12.925697326660156, "global_step": 450437, "epoch": 2681} {"train_loss": -12.930803298950195, "global_step": 450438, "epoch": 2681} {"train_loss": -13.0383939743042, "global_step": 450439, "epoch": 2681} {"train_loss": -12.98926830291748, "global_step": 450440, "epoch": 2681} {"train_loss": -12.764034271240234, "global_step": 450441, "epoch": 2681} {"train_loss": -12.550105094909668, "global_step": 450442, "epoch": 2681} {"train_loss": -12.79659652709961, "global_step": 450443, "epoch": 2681} {"train_loss": -12.808082580566406, "global_step": 450444, "epoch": 2681} {"train_loss": -12.357954025268555, "global_step": 450445, "epoch": 2681} {"train_loss": -12.419123649597168, "global_step": 450446, "epoch": 2681} {"train_loss": -13.027371406555176, "global_step": 450447, "epoch": 2681} {"train_loss": -12.353118896484375, "global_step": 450448, "epoch": 2681} {"train_loss": -12.239303588867188, "global_step": 450449, "epoch": 2681} {"train_loss": -12.74358081817627, "global_step": 450450, "epoch": 2681} {"train_loss": -12.376462936401367, "global_step": 450451, "epoch": 2681} {"train_loss": -10.439947128295898, "global_step": 450452, "epoch": 2681} {"train_loss": -11.173704147338867, "global_step": 450453, "epoch": 2681} {"train_loss": -12.289654731750488, "global_step": 450454, "epoch": 2681} {"train_loss": -12.660207748413086, "global_step": 450455, "epoch": 2681} {"train_loss": -12.063431739807129, "global_step": 450456, "epoch": 2681} {"train_loss": -11.803625106811523, "global_step": 450457, "epoch": 2681} {"train_loss": -11.773175239562988, "global_step": 450458, "epoch": 2681} {"train_loss": -12.393695831298828, "global_step": 450459, "epoch": 2681} {"train_loss": -12.437919616699219, "global_step": 450460, "epoch": 2681} {"train_loss": -12.341357231140137, "global_step": 450461, "epoch": 2681} {"train_loss": -12.08683967590332, "global_step": 450462, "epoch": 2681} {"train_loss": -12.155684471130371, "global_step": 450463, "epoch": 2681} {"train_loss": -12.165422439575195, "global_step": 450464, "epoch": 2681} {"train_loss": -12.692083358764648, "global_step": 450465, "epoch": 2681} {"train_loss": -11.969747543334961, "global_step": 450466, "epoch": 2681} {"train_loss": -12.412772178649902, "global_step": 450467, "epoch": 2681} {"train_loss": -11.685858726501465, "global_step": 450468, "epoch": 2681} {"train_loss": -12.026824951171875, "global_step": 450469, "epoch": 2681} {"train_loss": -9.618834495544434, "global_step": 450470, "epoch": 2681} {"train_loss": -11.183035850524902, "global_step": 450471, "epoch": 2681} {"train_loss": -7.703524112701416, "global_step": 450472, "epoch": 2681} {"train_loss": -7.827855110168457, "global_step": 450473, "epoch": 2681} {"train_loss": -6.951230049133301, "global_step": 450474, "epoch": 2681} {"train_loss": -6.9292192459106445, "global_step": 450475, "epoch": 2681} {"train_loss": -7.111994743347168, "global_step": 450476, "epoch": 2681} {"train_loss": -7.001599311828613, "global_step": 450477, "epoch": 2681} {"train_loss": -6.398509979248047, "global_step": 450478, "epoch": 2681} {"train_loss": -6.834104537963867, "global_step": 450479, "epoch": 2681} {"train_loss": -6.987478256225586, "global_step": 450480, "epoch": 2681} {"train_loss": -6.865784645080566, "global_step": 450481, "epoch": 2681} {"train_loss": -6.79583740234375, "global_step": 450482, "epoch": 2681} {"train_loss": -7.255767822265625, "global_step": 450483, "epoch": 2681} {"train_loss": -7.334961891174316, "global_step": 450484, "epoch": 2681} {"train_loss": -7.04854679107666, "global_step": 450485, "epoch": 2681} {"train_loss": -7.891016006469727, "global_step": 450486, "epoch": 2681} {"train_loss": -7.680431365966797, "global_step": 450487, "epoch": 2681} {"train_loss": -7.503186225891113, "global_step": 450488, "epoch": 2681} {"train_loss": -7.847594261169434, "global_step": 450489, "epoch": 2681} {"train_loss": -8.024791717529297, "global_step": 450490, "epoch": 2681} {"train_loss": -8.239347457885742, "global_step": 450491, "epoch": 2681} {"train_loss": -8.440767288208008, "global_step": 450492, "epoch": 2681} {"train_loss": -9.411937713623047, "global_step": 450493, "epoch": 2681} {"train_loss": -9.410590171813965, "global_step": 450494, "epoch": 2681} {"train_loss": -9.19021987915039, "global_step": 450495, "epoch": 2681} {"train_loss": -9.738950729370117, "global_step": 450496, "epoch": 2681} {"train_loss": -9.395072937011719, "global_step": 450497, "epoch": 2681} {"train_loss": -9.966175079345703, "global_step": 450498, "epoch": 2681} {"train_loss": -10.285074234008789, "global_step": 450499, "epoch": 2681} {"train_loss": -10.304760932922363, "global_step": 450500, "epoch": 2681} {"train_loss": -10.586404800415039, "global_step": 450501, "epoch": 2681} {"train_loss": -10.666213989257812, "global_step": 450502, "epoch": 2681} {"train_loss": -10.582687377929688, "global_step": 450503, "epoch": 2681} {"train_loss": -10.830625534057617, "global_step": 450504, "epoch": 2681} {"train_loss": -11.092483520507812, "global_step": 450505, "epoch": 2681} {"train_loss": -11.29696273803711, "global_step": 450506, "epoch": 2681} {"train_loss": -11.441017150878906, "global_step": 450507, "epoch": 2681} {"train_loss": -11.747457504272461, "global_step": 450508, "epoch": 2681} {"train_loss": -11.49110221862793, "global_step": 450509, "epoch": 2681} {"train_loss": -11.548755645751953, "global_step": 450510, "epoch": 2681} {"train_loss": -11.48271656036377, "global_step": 450511, "epoch": 2681} {"train_loss": -11.701444625854492, "global_step": 450512, "epoch": 2681} {"train_loss": -11.158899307250977, "global_step": 450513, "epoch": 2681} {"train_loss": -11.79830551147461, "global_step": 450514, "epoch": 2681} {"train_loss": -11.775484085083008, "global_step": 450515, "epoch": 2681} {"train_loss": -11.969085693359375, "global_step": 450516, "epoch": 2681} {"train_loss": -11.901725769042969, "global_step": 450517, "epoch": 2681} {"train_loss": -12.377676963806152, "global_step": 450518, "epoch": 2681} {"train_loss": -11.804330825805664, "global_step": 450519, "epoch": 2681} {"train_loss": -11.906564712524414, "global_step": 450520, "epoch": 2681} {"train_loss": -12.0867919921875, "global_step": 450521, "epoch": 2681} {"train_loss": -12.019309997558594, "global_step": 450522, "epoch": 2681} {"train_loss": -11.953458786010742, "global_step": 450523, "epoch": 2681} {"train_loss": -11.871092796325684, "global_step": 450524, "epoch": 2681} {"train_loss": -11.936367988586426, "global_step": 450525, "epoch": 2681} {"train_loss": -12.113965034484863, "global_step": 450526, "epoch": 2681} {"train_loss": -12.220178604125977, "global_step": 450527, "epoch": 2681} {"train_loss": -11.775745391845703, "global_step": 450528, "epoch": 2681} {"train_loss": -12.179274559020996, "global_step": 450529, "epoch": 2681} {"train_loss": -11.535991668701172, "global_step": 450530, "epoch": 2681} {"train_loss": -12.169942855834961, "global_step": 450531, "epoch": 2681} {"train_loss": -11.538323402404785, "global_step": 450532, "epoch": 2681} {"train_loss": -11.760190963745117, "global_step": 450533, "epoch": 2681} {"train_loss": -12.016538619995117, "global_step": 450534, "epoch": 2681} {"train_loss": -11.76656436920166, "global_step": 450535, "epoch": 2681} {"train_loss": -12.299166679382324, "global_step": 450536, "epoch": 2681} {"train_loss": -11.83616828918457, "global_step": 450537, "epoch": 2681} {"train_loss": -12.187047958374023, "global_step": 450538, "epoch": 2681} {"train_loss": -11.944181442260742, "global_step": 450539, "epoch": 2681} {"train_loss": -12.34476089477539, "global_step": 450540, "epoch": 2681} {"train_loss": -12.078324317932129, "global_step": 450541, "epoch": 2681} {"train_loss": -12.205098152160645, "global_step": 450542, "epoch": 2681} {"train_loss": -11.647466659545898, "global_step": 450543, "epoch": 2681} {"train_loss": -12.519584655761719, "global_step": 450544, "epoch": 2681} {"train_loss": -12.241172790527344, "global_step": 450545, "epoch": 2681} {"train_loss": -12.231864929199219, "global_step": 450546, "epoch": 2681} {"train_loss": -12.349164962768555, "global_step": 450547, "epoch": 2681} {"train_loss": -11.769403457641602, "global_step": 450548, "epoch": 2681} {"train_loss": -12.386320114135742, "global_step": 450549, "epoch": 2681} {"train_loss": -12.171590805053711, "global_step": 450550, "epoch": 2681} {"train_loss": -12.19912338256836, "global_step": 450551, "epoch": 2681} {"train_loss": -12.065069198608398, "global_step": 450552, "epoch": 2681} {"train_loss": -12.221555709838867, "global_step": 450553, "epoch": 2681} {"train_loss": -12.327932357788086, "global_step": 450554, "epoch": 2681} {"train_loss": -12.7089204788208, "global_step": 450555, "epoch": 2681} {"train_loss": -12.576154708862305, "global_step": 450556, "epoch": 2681} {"train_loss": -12.238576889038086, "global_step": 450557, "epoch": 2681} {"train_loss": -12.465203285217285, "global_step": 450558, "epoch": 2681} {"train_loss": -12.588417053222656, "global_step": 450559, "epoch": 2681} {"train_loss": -12.518865585327148, "global_step": 450560, "epoch": 2681} {"train_loss": -12.364913940429688, "global_step": 450561, "epoch": 2681} {"train_loss": -12.412755012512207, "global_step": 450562, "epoch": 2681} {"train_loss": -12.704668045043945, "global_step": 450563, "epoch": 2681} {"train_loss": -12.445140838623047, "global_step": 450564, "epoch": 2681} {"train_loss": -12.629166603088379, "global_step": 450565, "epoch": 2681} {"train_loss": -12.316408157348633, "global_step": 450566, "epoch": 2681} {"train_loss": -12.587495803833008, "global_step": 450567, "epoch": 2681} {"train_loss": -12.518953323364258, "global_step": 450568, "epoch": 2681} {"train_loss": -12.623940467834473, "global_step": 450569, "epoch": 2681} {"train_loss": -12.60766887664795, "global_step": 450570, "epoch": 2681} {"train_loss": -12.589102745056152, "global_step": 450571, "epoch": 2681} {"train_loss": -12.707192420959473, "global_step": 450572, "epoch": 2681} {"train_loss": -12.482561111450195, "global_step": 450573, "epoch": 2681} {"train_loss": -12.53522777557373, "global_step": 450574, "epoch": 2681} {"train_loss": -11.51014673993701, "global_step": 450575, "epoch": 2681, "val_loss": 314056.5625} {"train_loss": -12.390607833862305, "global_step": 450576, "epoch": 2682} {"train_loss": -12.668705940246582, "global_step": 450577, "epoch": 2682} {"train_loss": -12.519571304321289, "global_step": 450578, "epoch": 2682} {"train_loss": -12.580211639404297, "global_step": 450579, "epoch": 2682} {"train_loss": -12.146917343139648, "global_step": 450580, "epoch": 2682} {"train_loss": -12.495119094848633, "global_step": 450581, "epoch": 2682} {"train_loss": -12.420594215393066, "global_step": 450582, "epoch": 2682} {"train_loss": -12.557119369506836, "global_step": 450583, "epoch": 2682} {"train_loss": -12.504632949829102, "global_step": 450584, "epoch": 2682} {"train_loss": -12.50644588470459, "global_step": 450585, "epoch": 2682} {"train_loss": -12.425971984863281, "global_step": 450586, "epoch": 2682} {"train_loss": -12.418577194213867, "global_step": 450587, "epoch": 2682} {"train_loss": -12.052900314331055, "global_step": 450588, "epoch": 2682} {"train_loss": -12.79627799987793, "global_step": 450589, "epoch": 2682} {"train_loss": -12.142970085144043, "global_step": 450590, "epoch": 2682} {"train_loss": -11.251049041748047, "global_step": 450591, "epoch": 2682} {"train_loss": -12.687883377075195, "global_step": 450592, "epoch": 2682} {"train_loss": -10.611318588256836, "global_step": 450593, "epoch": 2682} {"train_loss": -10.825017929077148, "global_step": 450594, "epoch": 2682} {"train_loss": -12.719303131103516, "global_step": 450595, "epoch": 2682} {"train_loss": -10.9991455078125, "global_step": 450596, "epoch": 2682} {"train_loss": -12.136341094970703, "global_step": 450597, "epoch": 2682} {"train_loss": -12.199207305908203, "global_step": 450598, "epoch": 2682} {"train_loss": -11.786490440368652, "global_step": 450599, "epoch": 2682} {"train_loss": -11.597797393798828, "global_step": 450600, "epoch": 2682} {"train_loss": -12.255643844604492, "global_step": 450601, "epoch": 2682} {"train_loss": -11.53182601928711, "global_step": 450602, "epoch": 2682} {"train_loss": -12.539587020874023, "global_step": 450603, "epoch": 2682} {"train_loss": -12.211282730102539, "global_step": 450604, "epoch": 2682} {"train_loss": -11.9599027633667, "global_step": 450605, "epoch": 2682} {"train_loss": -12.263223648071289, "global_step": 450606, "epoch": 2682} {"train_loss": -12.426311492919922, "global_step": 450607, "epoch": 2682} {"train_loss": -12.093973159790039, "global_step": 450608, "epoch": 2682} {"train_loss": -12.252290725708008, "global_step": 450609, "epoch": 2682} {"train_loss": -12.443206787109375, "global_step": 450610, "epoch": 2682} {"train_loss": -12.217758178710938, "global_step": 450611, "epoch": 2682} {"train_loss": -12.555597305297852, "global_step": 450612, "epoch": 2682} {"train_loss": -12.214905738830566, "global_step": 450613, "epoch": 2682} {"train_loss": -12.456509590148926, "global_step": 450614, "epoch": 2682} {"train_loss": -12.669717788696289, "global_step": 450615, "epoch": 2682} {"train_loss": -12.71302604675293, "global_step": 450616, "epoch": 2682} {"train_loss": -12.422141075134277, "global_step": 450617, "epoch": 2682} {"train_loss": -12.429868698120117, "global_step": 450618, "epoch": 2682} {"train_loss": -12.303333282470703, "global_step": 450619, "epoch": 2682} {"train_loss": -12.181539535522461, "global_step": 450620, "epoch": 2682} {"train_loss": -12.682854652404785, "global_step": 450621, "epoch": 2682} {"train_loss": -12.222150802612305, "global_step": 450622, "epoch": 2682} {"train_loss": -12.652131080627441, "global_step": 450623, "epoch": 2682} {"train_loss": -12.593141555786133, "global_step": 450624, "epoch": 2682} {"train_loss": -12.214613914489746, "global_step": 450625, "epoch": 2682} {"train_loss": -12.367183685302734, "global_step": 450626, "epoch": 2682} {"train_loss": -12.539251327514648, "global_step": 450627, "epoch": 2682} {"train_loss": -12.275705337524414, "global_step": 450628, "epoch": 2682} {"train_loss": -12.510873794555664, "global_step": 450629, "epoch": 2682} {"train_loss": -12.617441177368164, "global_step": 450630, "epoch": 2682} {"train_loss": -11.969250679016113, "global_step": 450631, "epoch": 2682} {"train_loss": -12.436704635620117, "global_step": 450632, "epoch": 2682} {"train_loss": -12.542972564697266, "global_step": 450633, "epoch": 2682} {"train_loss": -12.241209983825684, "global_step": 450634, "epoch": 2682} {"train_loss": -12.238012313842773, "global_step": 450635, "epoch": 2682} {"train_loss": -12.458648681640625, "global_step": 450636, "epoch": 2682} {"train_loss": -12.713130950927734, "global_step": 450637, "epoch": 2682} {"train_loss": -12.505792617797852, "global_step": 450638, "epoch": 2682} {"train_loss": -12.615758895874023, "global_step": 450639, "epoch": 2682} {"train_loss": -12.576244354248047, "global_step": 450640, "epoch": 2682} {"train_loss": -12.799602508544922, "global_step": 450641, "epoch": 2682} {"train_loss": -12.369280815124512, "global_step": 450642, "epoch": 2682} {"train_loss": -12.533010482788086, "global_step": 450643, "epoch": 2682} {"train_loss": -12.723734855651855, "global_step": 450644, "epoch": 2682} {"train_loss": -12.301340103149414, "global_step": 450645, "epoch": 2682} {"train_loss": -11.860504150390625, "global_step": 450646, "epoch": 2682} {"train_loss": -12.157906532287598, "global_step": 450647, "epoch": 2682} {"train_loss": -11.550065994262695, "global_step": 450648, "epoch": 2682} {"train_loss": -12.343286514282227, "global_step": 450649, "epoch": 2682} {"train_loss": -11.4218111038208, "global_step": 450650, "epoch": 2682} {"train_loss": -11.61587905883789, "global_step": 450651, "epoch": 2682} {"train_loss": -12.33268928527832, "global_step": 450652, "epoch": 2682} {"train_loss": -11.528456687927246, "global_step": 450653, "epoch": 2682} {"train_loss": -12.24494743347168, "global_step": 450654, "epoch": 2682} {"train_loss": -12.198792457580566, "global_step": 450655, "epoch": 2682} {"train_loss": -12.110503196716309, "global_step": 450656, "epoch": 2682} {"train_loss": -12.539993286132812, "global_step": 450657, "epoch": 2682} {"train_loss": -11.872315406799316, "global_step": 450658, "epoch": 2682} {"train_loss": -12.467595100402832, "global_step": 450659, "epoch": 2682} {"train_loss": -12.214685440063477, "global_step": 450660, "epoch": 2682} {"train_loss": -12.494041442871094, "global_step": 450661, "epoch": 2682} {"train_loss": -12.21426010131836, "global_step": 450662, "epoch": 2682} {"train_loss": -12.605828285217285, "global_step": 450663, "epoch": 2682} {"train_loss": -12.548748016357422, "global_step": 450664, "epoch": 2682} {"train_loss": -12.117169380187988, "global_step": 450665, "epoch": 2682} {"train_loss": -12.385156631469727, "global_step": 450666, "epoch": 2682} {"train_loss": -12.404415130615234, "global_step": 450667, "epoch": 2682} {"train_loss": -12.45773983001709, "global_step": 450668, "epoch": 2682} {"train_loss": -12.424860000610352, "global_step": 450669, "epoch": 2682} {"train_loss": -12.61201000213623, "global_step": 450670, "epoch": 2682} {"train_loss": -12.243219375610352, "global_step": 450671, "epoch": 2682} {"train_loss": -12.451120376586914, "global_step": 450672, "epoch": 2682} {"train_loss": -12.65417766571045, "global_step": 450673, "epoch": 2682} {"train_loss": -11.607063293457031, "global_step": 450674, "epoch": 2682} {"train_loss": -12.403993606567383, "global_step": 450675, "epoch": 2682} {"train_loss": -12.602602005004883, "global_step": 450676, "epoch": 2682} {"train_loss": -12.065276145935059, "global_step": 450677, "epoch": 2682} {"train_loss": -12.029073715209961, "global_step": 450678, "epoch": 2682} {"train_loss": -12.296598434448242, "global_step": 450679, "epoch": 2682} {"train_loss": -12.182474136352539, "global_step": 450680, "epoch": 2682} {"train_loss": -11.987922668457031, "global_step": 450681, "epoch": 2682} {"train_loss": -12.280126571655273, "global_step": 450682, "epoch": 2682} {"train_loss": -11.74884033203125, "global_step": 450683, "epoch": 2682} {"train_loss": -12.215742111206055, "global_step": 450684, "epoch": 2682} {"train_loss": -11.917182922363281, "global_step": 450685, "epoch": 2682} {"train_loss": -12.627038955688477, "global_step": 450686, "epoch": 2682} {"train_loss": -12.546333312988281, "global_step": 450687, "epoch": 2682} {"train_loss": -12.345666885375977, "global_step": 450688, "epoch": 2682} {"train_loss": -12.322765350341797, "global_step": 450689, "epoch": 2682} {"train_loss": -11.864431381225586, "global_step": 450690, "epoch": 2682} {"train_loss": -12.264680862426758, "global_step": 450691, "epoch": 2682} {"train_loss": -12.389751434326172, "global_step": 450692, "epoch": 2682} {"train_loss": -11.920808792114258, "global_step": 450693, "epoch": 2682} {"train_loss": -11.876428604125977, "global_step": 450694, "epoch": 2682} {"train_loss": -12.422830581665039, "global_step": 450695, "epoch": 2682} {"train_loss": -11.637014389038086, "global_step": 450696, "epoch": 2682} {"train_loss": -12.051651000976562, "global_step": 450697, "epoch": 2682} {"train_loss": -12.306222915649414, "global_step": 450698, "epoch": 2682} {"train_loss": -12.5916166305542, "global_step": 450699, "epoch": 2682} {"train_loss": -12.25901985168457, "global_step": 450700, "epoch": 2682} {"train_loss": -12.634031295776367, "global_step": 450701, "epoch": 2682} {"train_loss": -11.765424728393555, "global_step": 450702, "epoch": 2682} {"train_loss": -12.457929611206055, "global_step": 450703, "epoch": 2682} {"train_loss": -11.338144302368164, "global_step": 450704, "epoch": 2682} {"train_loss": -11.594151496887207, "global_step": 450705, "epoch": 2682} {"train_loss": -11.741726875305176, "global_step": 450706, "epoch": 2682} {"train_loss": -11.195158004760742, "global_step": 450707, "epoch": 2682} {"train_loss": -11.57320785522461, "global_step": 450708, "epoch": 2682} {"train_loss": -11.568138122558594, "global_step": 450709, "epoch": 2682} {"train_loss": -11.391763687133789, "global_step": 450710, "epoch": 2682} {"train_loss": -12.58869743347168, "global_step": 450711, "epoch": 2682} {"train_loss": -11.35713005065918, "global_step": 450712, "epoch": 2682} {"train_loss": -12.347214698791504, "global_step": 450713, "epoch": 2682} {"train_loss": -11.690107345581055, "global_step": 450714, "epoch": 2682} {"train_loss": -9.829496383666992, "global_step": 450715, "epoch": 2682} {"train_loss": -11.900001525878906, "global_step": 450716, "epoch": 2682} {"train_loss": -11.24073600769043, "global_step": 450717, "epoch": 2682} {"train_loss": -11.641586303710938, "global_step": 450718, "epoch": 2682} {"train_loss": -11.595090866088867, "global_step": 450719, "epoch": 2682} {"train_loss": -11.613704681396484, "global_step": 450720, "epoch": 2682} {"train_loss": -11.578365325927734, "global_step": 450721, "epoch": 2682} {"train_loss": -11.459644317626953, "global_step": 450722, "epoch": 2682} {"train_loss": -11.54725456237793, "global_step": 450723, "epoch": 2682} {"train_loss": -10.483963966369629, "global_step": 450724, "epoch": 2682} {"train_loss": -11.405289649963379, "global_step": 450725, "epoch": 2682} {"train_loss": -11.993886947631836, "global_step": 450726, "epoch": 2682} {"train_loss": -9.855485916137695, "global_step": 450727, "epoch": 2682} {"train_loss": -11.549300193786621, "global_step": 450728, "epoch": 2682} {"train_loss": -10.326518058776855, "global_step": 450729, "epoch": 2682} {"train_loss": -10.014530181884766, "global_step": 450730, "epoch": 2682} {"train_loss": -10.932109832763672, "global_step": 450731, "epoch": 2682} {"train_loss": -9.65437126159668, "global_step": 450732, "epoch": 2682} {"train_loss": -11.382804870605469, "global_step": 450733, "epoch": 2682} {"train_loss": -9.964516639709473, "global_step": 450734, "epoch": 2682} {"train_loss": -11.847467422485352, "global_step": 450735, "epoch": 2682} {"train_loss": -10.594937324523926, "global_step": 450736, "epoch": 2682} {"train_loss": -11.077317237854004, "global_step": 450737, "epoch": 2682} {"train_loss": -11.507123947143555, "global_step": 450738, "epoch": 2682} {"train_loss": -10.749418258666992, "global_step": 450739, "epoch": 2682} {"train_loss": -11.061365127563477, "global_step": 450740, "epoch": 2682} {"train_loss": -11.197517395019531, "global_step": 450741, "epoch": 2682} {"train_loss": -10.03451919555664, "global_step": 450742, "epoch": 2682} {"train_loss": -12.003845913069588, "global_step": 450743, "epoch": 2682, "val_loss": 313975.25} {"train_loss": -10.000134468078613, "global_step": 450744, "epoch": 2683} {"train_loss": -10.177607536315918, "global_step": 450745, "epoch": 2683} {"train_loss": -11.280791282653809, "global_step": 450746, "epoch": 2683} {"train_loss": -10.290154457092285, "global_step": 450747, "epoch": 2683} {"train_loss": -10.141813278198242, "global_step": 450748, "epoch": 2683} {"train_loss": -11.389179229736328, "global_step": 450749, "epoch": 2683} {"train_loss": -10.812238693237305, "global_step": 450750, "epoch": 2683} {"train_loss": -11.513204574584961, "global_step": 450751, "epoch": 2683} {"train_loss": -11.733579635620117, "global_step": 450752, "epoch": 2683} {"train_loss": -11.730450630187988, "global_step": 450753, "epoch": 2683} {"train_loss": -11.164769172668457, "global_step": 450754, "epoch": 2683} {"train_loss": -11.523815155029297, "global_step": 450755, "epoch": 2683} {"train_loss": -10.731602668762207, "global_step": 450756, "epoch": 2683} {"train_loss": -11.982905387878418, "global_step": 450757, "epoch": 2683} {"train_loss": -10.913179397583008, "global_step": 450758, "epoch": 2683} {"train_loss": -11.527093887329102, "global_step": 450759, "epoch": 2683} {"train_loss": -11.727684020996094, "global_step": 450760, "epoch": 2683} {"train_loss": -12.147224426269531, "global_step": 450761, "epoch": 2683} {"train_loss": -11.631537437438965, "global_step": 450762, "epoch": 2683} {"train_loss": -10.962478637695312, "global_step": 450763, "epoch": 2683} {"train_loss": -11.713383674621582, "global_step": 450764, "epoch": 2683} {"train_loss": -10.88711166381836, "global_step": 450765, "epoch": 2683} {"train_loss": -11.443380355834961, "global_step": 450766, "epoch": 2683} {"train_loss": -11.620418548583984, "global_step": 450767, "epoch": 2683} {"train_loss": -11.186964988708496, "global_step": 450768, "epoch": 2683} {"train_loss": -11.262772560119629, "global_step": 450769, "epoch": 2683} {"train_loss": -11.369224548339844, "global_step": 450770, "epoch": 2683} {"train_loss": -11.061606407165527, "global_step": 450771, "epoch": 2683} {"train_loss": -12.096221923828125, "global_step": 450772, "epoch": 2683} {"train_loss": -11.434904098510742, "global_step": 450773, "epoch": 2683} {"train_loss": -11.945571899414062, "global_step": 450774, "epoch": 2683} {"train_loss": -11.895081520080566, "global_step": 450775, "epoch": 2683} {"train_loss": -11.569847106933594, "global_step": 450776, "epoch": 2683} {"train_loss": -11.959585189819336, "global_step": 450777, "epoch": 2683} {"train_loss": -12.127269744873047, "global_step": 450778, "epoch": 2683} {"train_loss": -11.829357147216797, "global_step": 450779, "epoch": 2683} {"train_loss": -12.018623352050781, "global_step": 450780, "epoch": 2683} {"train_loss": -11.585487365722656, "global_step": 450781, "epoch": 2683} {"train_loss": -12.309709548950195, "global_step": 450782, "epoch": 2683} {"train_loss": -12.081680297851562, "global_step": 450783, "epoch": 2683} {"train_loss": -12.345964431762695, "global_step": 450784, "epoch": 2683} {"train_loss": -12.191810607910156, "global_step": 450785, "epoch": 2683} {"train_loss": -12.052373886108398, "global_step": 450786, "epoch": 2683} {"train_loss": -12.379522323608398, "global_step": 450787, "epoch": 2683} {"train_loss": -12.397050857543945, "global_step": 450788, "epoch": 2683} {"train_loss": -12.178606033325195, "global_step": 450789, "epoch": 2683} {"train_loss": -12.571501731872559, "global_step": 450790, "epoch": 2683} {"train_loss": -12.453401565551758, "global_step": 450791, "epoch": 2683} {"train_loss": -12.449485778808594, "global_step": 450792, "epoch": 2683} {"train_loss": -12.369827270507812, "global_step": 450793, "epoch": 2683} {"train_loss": -12.5789794921875, "global_step": 450794, "epoch": 2683} {"train_loss": -12.603255271911621, "global_step": 450795, "epoch": 2683} {"train_loss": -12.567548751831055, "global_step": 450796, "epoch": 2683} {"train_loss": -12.425760269165039, "global_step": 450797, "epoch": 2683} {"train_loss": -12.479019165039062, "global_step": 450798, "epoch": 2683} {"train_loss": -12.713890075683594, "global_step": 450799, "epoch": 2683} {"train_loss": -12.645694732666016, "global_step": 450800, "epoch": 2683} {"train_loss": -12.52287769317627, "global_step": 450801, "epoch": 2683} {"train_loss": -12.523494720458984, "global_step": 450802, "epoch": 2683} {"train_loss": -12.645578384399414, "global_step": 450803, "epoch": 2683} {"train_loss": -12.6482572555542, "global_step": 450804, "epoch": 2683} {"train_loss": -12.67082691192627, "global_step": 450805, "epoch": 2683} {"train_loss": -12.482604026794434, "global_step": 450806, "epoch": 2683} {"train_loss": -12.517364501953125, "global_step": 450807, "epoch": 2683} {"train_loss": -12.624374389648438, "global_step": 450808, "epoch": 2683} {"train_loss": -12.646587371826172, "global_step": 450809, "epoch": 2683} {"train_loss": -12.541555404663086, "global_step": 450810, "epoch": 2683} {"train_loss": -12.434595108032227, "global_step": 450811, "epoch": 2683} {"train_loss": -12.60268497467041, "global_step": 450812, "epoch": 2683} {"train_loss": -12.422779083251953, "global_step": 450813, "epoch": 2683} {"train_loss": -12.736089706420898, "global_step": 450814, "epoch": 2683} {"train_loss": -12.689383506774902, "global_step": 450815, "epoch": 2683} {"train_loss": -12.847885131835938, "global_step": 450816, "epoch": 2683} {"train_loss": -12.650456428527832, "global_step": 450817, "epoch": 2683} {"train_loss": -12.641305923461914, "global_step": 450818, "epoch": 2683} {"train_loss": -12.523591995239258, "global_step": 450819, "epoch": 2683} {"train_loss": -12.803507804870605, "global_step": 450820, "epoch": 2683} {"train_loss": -12.630449295043945, "global_step": 450821, "epoch": 2683} {"train_loss": -12.711931228637695, "global_step": 450822, "epoch": 2683} {"train_loss": -12.669163703918457, "global_step": 450823, "epoch": 2683} {"train_loss": -12.675276756286621, "global_step": 450824, "epoch": 2683} {"train_loss": -12.651253700256348, "global_step": 450825, "epoch": 2683} {"train_loss": -12.688173294067383, "global_step": 450826, "epoch": 2683} {"train_loss": -12.719868659973145, "global_step": 450827, "epoch": 2683} {"train_loss": -12.651169776916504, "global_step": 450828, "epoch": 2683} {"train_loss": -12.790294647216797, "global_step": 450829, "epoch": 2683} {"train_loss": -12.514461517333984, "global_step": 450830, "epoch": 2683} {"train_loss": -12.76945686340332, "global_step": 450831, "epoch": 2683} {"train_loss": -12.807112693786621, "global_step": 450832, "epoch": 2683} {"train_loss": -12.813549995422363, "global_step": 450833, "epoch": 2683} {"train_loss": -12.725196838378906, "global_step": 450834, "epoch": 2683} {"train_loss": -12.764528274536133, "global_step": 450835, "epoch": 2683} {"train_loss": -12.758910179138184, "global_step": 450836, "epoch": 2683} {"train_loss": -12.548620223999023, "global_step": 450837, "epoch": 2683} {"train_loss": -12.321357727050781, "global_step": 450838, "epoch": 2683} {"train_loss": -12.626626014709473, "global_step": 450839, "epoch": 2683} {"train_loss": -12.730628967285156, "global_step": 450840, "epoch": 2683} {"train_loss": -11.84421157836914, "global_step": 450841, "epoch": 2683} {"train_loss": -12.0986909866333, "global_step": 450842, "epoch": 2683} {"train_loss": -12.875726699829102, "global_step": 450843, "epoch": 2683} {"train_loss": -12.017297744750977, "global_step": 450844, "epoch": 2683} {"train_loss": -12.640252113342285, "global_step": 450845, "epoch": 2683} {"train_loss": -12.650514602661133, "global_step": 450846, "epoch": 2683} {"train_loss": -12.527502059936523, "global_step": 450847, "epoch": 2683} {"train_loss": -12.555747985839844, "global_step": 450848, "epoch": 2683} {"train_loss": -12.693353652954102, "global_step": 450849, "epoch": 2683} {"train_loss": -12.659217834472656, "global_step": 450850, "epoch": 2683} {"train_loss": -12.519876480102539, "global_step": 450851, "epoch": 2683} {"train_loss": -12.205535888671875, "global_step": 450852, "epoch": 2683} {"train_loss": -12.629236221313477, "global_step": 450853, "epoch": 2683} {"train_loss": -12.346572875976562, "global_step": 450854, "epoch": 2683} {"train_loss": -12.518636703491211, "global_step": 450855, "epoch": 2683} {"train_loss": -12.254114151000977, "global_step": 450856, "epoch": 2683} {"train_loss": -12.653477668762207, "global_step": 450857, "epoch": 2683} {"train_loss": -12.517894744873047, "global_step": 450858, "epoch": 2683} {"train_loss": -12.69944953918457, "global_step": 450859, "epoch": 2683} {"train_loss": -12.517411231994629, "global_step": 450860, "epoch": 2683} {"train_loss": -12.200246810913086, "global_step": 450861, "epoch": 2683} {"train_loss": -12.605040550231934, "global_step": 450862, "epoch": 2683} {"train_loss": -12.764850616455078, "global_step": 450863, "epoch": 2683} {"train_loss": -12.422231674194336, "global_step": 450864, "epoch": 2683} {"train_loss": -12.027084350585938, "global_step": 450865, "epoch": 2683} {"train_loss": -12.396848678588867, "global_step": 450866, "epoch": 2683} {"train_loss": -12.473936080932617, "global_step": 450867, "epoch": 2683} {"train_loss": -12.495040893554688, "global_step": 450868, "epoch": 2683} {"train_loss": -12.719078063964844, "global_step": 450869, "epoch": 2683} {"train_loss": -12.163286209106445, "global_step": 450870, "epoch": 2683} {"train_loss": -12.860316276550293, "global_step": 450871, "epoch": 2683} {"train_loss": -12.2684907913208, "global_step": 450872, "epoch": 2683} {"train_loss": -12.567426681518555, "global_step": 450873, "epoch": 2683} {"train_loss": -12.574922561645508, "global_step": 450874, "epoch": 2683} {"train_loss": -12.491678237915039, "global_step": 450875, "epoch": 2683} {"train_loss": -12.324050903320312, "global_step": 450876, "epoch": 2683} {"train_loss": -12.868929862976074, "global_step": 450877, "epoch": 2683} {"train_loss": -12.748512268066406, "global_step": 450878, "epoch": 2683} {"train_loss": -12.703554153442383, "global_step": 450879, "epoch": 2683} {"train_loss": -12.643692016601562, "global_step": 450880, "epoch": 2683} {"train_loss": -12.722549438476562, "global_step": 450881, "epoch": 2683} {"train_loss": -12.605293273925781, "global_step": 450882, "epoch": 2683} {"train_loss": -12.82105827331543, "global_step": 450883, "epoch": 2683} {"train_loss": -12.827768325805664, "global_step": 450884, "epoch": 2683} {"train_loss": -12.986928939819336, "global_step": 450885, "epoch": 2683} {"train_loss": -12.671682357788086, "global_step": 450886, "epoch": 2683} {"train_loss": -13.077848434448242, "global_step": 450887, "epoch": 2683} {"train_loss": -12.557708740234375, "global_step": 450888, "epoch": 2683} {"train_loss": -12.51706314086914, "global_step": 450889, "epoch": 2683} {"train_loss": -13.016061782836914, "global_step": 450890, "epoch": 2683} {"train_loss": -12.41653060913086, "global_step": 450891, "epoch": 2683} {"train_loss": -12.730304718017578, "global_step": 450892, "epoch": 2683} {"train_loss": -12.54703426361084, "global_step": 450893, "epoch": 2683} {"train_loss": -12.768436431884766, "global_step": 450894, "epoch": 2683} {"train_loss": -12.320107460021973, "global_step": 450895, "epoch": 2683} {"train_loss": -12.56896686553955, "global_step": 450896, "epoch": 2683} {"train_loss": -12.324724197387695, "global_step": 450897, "epoch": 2683} {"train_loss": -12.693181037902832, "global_step": 450898, "epoch": 2683} {"train_loss": -11.35693359375, "global_step": 450899, "epoch": 2683} {"train_loss": -11.798370361328125, "global_step": 450900, "epoch": 2683} {"train_loss": -12.313276290893555, "global_step": 450901, "epoch": 2683} {"train_loss": -12.301698684692383, "global_step": 450902, "epoch": 2683} {"train_loss": -12.320880889892578, "global_step": 450903, "epoch": 2683} {"train_loss": -11.731819152832031, "global_step": 450904, "epoch": 2683} {"train_loss": -12.255123138427734, "global_step": 450905, "epoch": 2683} {"train_loss": -11.912287712097168, "global_step": 450906, "epoch": 2683} {"train_loss": -11.14391040802002, "global_step": 450907, "epoch": 2683} {"train_loss": -12.055233001708984, "global_step": 450908, "epoch": 2683} {"train_loss": -10.096830368041992, "global_step": 450909, "epoch": 2683} {"train_loss": -12.134247779846191, "global_step": 450910, "epoch": 2683} {"train_loss": -12.228741055443173, "global_step": 450911, "epoch": 2683, "val_loss": 312473.46875} {"train_loss": -11.798686981201172, "global_step": 450912, "epoch": 2684} {"train_loss": -10.502838134765625, "global_step": 450913, "epoch": 2684} {"train_loss": -10.165792465209961, "global_step": 450914, "epoch": 2684} {"train_loss": -10.069668769836426, "global_step": 450915, "epoch": 2684} {"train_loss": -8.482563972473145, "global_step": 450916, "epoch": 2684} {"train_loss": -9.661993026733398, "global_step": 450917, "epoch": 2684} {"train_loss": -9.80336856842041, "global_step": 450918, "epoch": 2684} {"train_loss": -9.472648620605469, "global_step": 450919, "epoch": 2684} {"train_loss": -9.879693031311035, "global_step": 450920, "epoch": 2684} {"train_loss": -9.390995979309082, "global_step": 450921, "epoch": 2684} {"train_loss": -10.052274703979492, "global_step": 450922, "epoch": 2684} {"train_loss": -10.399225234985352, "global_step": 450923, "epoch": 2684} {"train_loss": -10.442138671875, "global_step": 450924, "epoch": 2684} {"train_loss": -9.970122337341309, "global_step": 450925, "epoch": 2684} {"train_loss": -10.326618194580078, "global_step": 450926, "epoch": 2684} {"train_loss": -10.233718872070312, "global_step": 450927, "epoch": 2684} {"train_loss": -10.09183120727539, "global_step": 450928, "epoch": 2684} {"train_loss": -10.871753692626953, "global_step": 450929, "epoch": 2684} {"train_loss": -11.39877700805664, "global_step": 450930, "epoch": 2684} {"train_loss": -11.300318717956543, "global_step": 450931, "epoch": 2684} {"train_loss": -11.941733360290527, "global_step": 450932, "epoch": 2684} {"train_loss": -10.839603424072266, "global_step": 450933, "epoch": 2684} {"train_loss": -11.644201278686523, "global_step": 450934, "epoch": 2684} {"train_loss": -11.159010887145996, "global_step": 450935, "epoch": 2684} {"train_loss": -11.578248977661133, "global_step": 450936, "epoch": 2684} {"train_loss": -12.056116104125977, "global_step": 450937, "epoch": 2684} {"train_loss": -11.637150764465332, "global_step": 450938, "epoch": 2684} {"train_loss": -11.856033325195312, "global_step": 450939, "epoch": 2684} {"train_loss": -11.030847549438477, "global_step": 450940, "epoch": 2684} {"train_loss": -11.363965034484863, "global_step": 450941, "epoch": 2684} {"train_loss": -10.097034454345703, "global_step": 450942, "epoch": 2684} {"train_loss": -10.942654609680176, "global_step": 450943, "epoch": 2684} {"train_loss": -10.026325225830078, "global_step": 450944, "epoch": 2684} {"train_loss": -10.353948593139648, "global_step": 450945, "epoch": 2684} {"train_loss": -11.411735534667969, "global_step": 450946, "epoch": 2684} {"train_loss": -11.63175106048584, "global_step": 450947, "epoch": 2684} {"train_loss": -10.20612621307373, "global_step": 450948, "epoch": 2684} {"train_loss": -11.521126747131348, "global_step": 450949, "epoch": 2684} {"train_loss": -11.135774612426758, "global_step": 450950, "epoch": 2684} {"train_loss": -11.101325988769531, "global_step": 450951, "epoch": 2684} {"train_loss": -11.963468551635742, "global_step": 450952, "epoch": 2684} {"train_loss": -11.463157653808594, "global_step": 450953, "epoch": 2684} {"train_loss": -11.825338363647461, "global_step": 450954, "epoch": 2684} {"train_loss": -12.030827522277832, "global_step": 450955, "epoch": 2684} {"train_loss": -11.422172546386719, "global_step": 450956, "epoch": 2684} {"train_loss": -11.784588813781738, "global_step": 450957, "epoch": 2684} {"train_loss": -11.513320922851562, "global_step": 450958, "epoch": 2684} {"train_loss": -11.734993934631348, "global_step": 450959, "epoch": 2684} {"train_loss": -11.659637451171875, "global_step": 450960, "epoch": 2684} {"train_loss": -12.094064712524414, "global_step": 450961, "epoch": 2684} {"train_loss": -11.894941329956055, "global_step": 450962, "epoch": 2684} {"train_loss": -12.049591064453125, "global_step": 450963, "epoch": 2684} {"train_loss": -11.901455879211426, "global_step": 450964, "epoch": 2684} {"train_loss": -11.773164749145508, "global_step": 450965, "epoch": 2684} {"train_loss": -12.384873390197754, "global_step": 450966, "epoch": 2684} {"train_loss": -12.205806732177734, "global_step": 450967, "epoch": 2684} {"train_loss": -12.434456825256348, "global_step": 450968, "epoch": 2684} {"train_loss": -12.425500869750977, "global_step": 450969, "epoch": 2684} {"train_loss": -12.479510307312012, "global_step": 450970, "epoch": 2684} {"train_loss": -12.50484561920166, "global_step": 450971, "epoch": 2684} {"train_loss": -12.457408905029297, "global_step": 450972, "epoch": 2684} {"train_loss": -12.564789772033691, "global_step": 450973, "epoch": 2684} {"train_loss": -12.27334976196289, "global_step": 450974, "epoch": 2684} {"train_loss": -12.545637130737305, "global_step": 450975, "epoch": 2684} {"train_loss": -12.353254318237305, "global_step": 450976, "epoch": 2684} {"train_loss": -12.586759567260742, "global_step": 450977, "epoch": 2684} {"train_loss": -12.355069160461426, "global_step": 450978, "epoch": 2684} {"train_loss": -12.451908111572266, "global_step": 450979, "epoch": 2684} {"train_loss": -12.502004623413086, "global_step": 450980, "epoch": 2684} {"train_loss": -12.579181671142578, "global_step": 450981, "epoch": 2684} {"train_loss": -12.4158296585083, "global_step": 450982, "epoch": 2684} {"train_loss": -12.609537124633789, "global_step": 450983, "epoch": 2684} {"train_loss": -12.523136138916016, "global_step": 450984, "epoch": 2684} {"train_loss": -12.666205406188965, "global_step": 450985, "epoch": 2684} {"train_loss": -12.69946575164795, "global_step": 450986, "epoch": 2684} {"train_loss": -12.640514373779297, "global_step": 450987, "epoch": 2684} {"train_loss": -12.563899993896484, "global_step": 450988, "epoch": 2684} {"train_loss": -12.650858879089355, "global_step": 450989, "epoch": 2684} {"train_loss": -12.662349700927734, "global_step": 450990, "epoch": 2684} {"train_loss": -12.67678451538086, "global_step": 450991, "epoch": 2684} {"train_loss": -12.66270923614502, "global_step": 450992, "epoch": 2684} {"train_loss": -12.611328125, "global_step": 450993, "epoch": 2684} {"train_loss": -12.72918701171875, "global_step": 450994, "epoch": 2684} {"train_loss": -12.617990493774414, "global_step": 450995, "epoch": 2684} {"train_loss": -12.612771987915039, "global_step": 450996, "epoch": 2684} {"train_loss": -12.637641906738281, "global_step": 450997, "epoch": 2684} {"train_loss": -12.57258129119873, "global_step": 450998, "epoch": 2684} {"train_loss": -12.83213996887207, "global_step": 450999, "epoch": 2684} {"train_loss": -12.544851303100586, "global_step": 451000, "epoch": 2684} {"train_loss": -12.711854934692383, "global_step": 451001, "epoch": 2684} {"train_loss": -12.694849967956543, "global_step": 451002, "epoch": 2684} {"train_loss": -12.490200996398926, "global_step": 451003, "epoch": 2684} {"train_loss": -12.892679214477539, "global_step": 451004, "epoch": 2684} {"train_loss": -12.736297607421875, "global_step": 451005, "epoch": 2684} {"train_loss": -12.620498657226562, "global_step": 451006, "epoch": 2684} {"train_loss": -12.735259056091309, "global_step": 451007, "epoch": 2684} {"train_loss": -12.86817741394043, "global_step": 451008, "epoch": 2684} {"train_loss": -12.594249725341797, "global_step": 451009, "epoch": 2684} {"train_loss": -12.729795455932617, "global_step": 451010, "epoch": 2684} {"train_loss": -12.783236503601074, "global_step": 451011, "epoch": 2684} {"train_loss": -12.596662521362305, "global_step": 451012, "epoch": 2684} {"train_loss": -12.53957748413086, "global_step": 451013, "epoch": 2684} {"train_loss": -12.572845458984375, "global_step": 451014, "epoch": 2684} {"train_loss": -12.63943862915039, "global_step": 451015, "epoch": 2684} {"train_loss": -12.774652481079102, "global_step": 451016, "epoch": 2684} {"train_loss": -12.745928764343262, "global_step": 451017, "epoch": 2684} {"train_loss": -12.69533920288086, "global_step": 451018, "epoch": 2684} {"train_loss": -12.645864486694336, "global_step": 451019, "epoch": 2684} {"train_loss": -12.718425750732422, "global_step": 451020, "epoch": 2684} {"train_loss": -12.948616981506348, "global_step": 451021, "epoch": 2684} {"train_loss": -12.779376983642578, "global_step": 451022, "epoch": 2684} {"train_loss": -12.698843955993652, "global_step": 451023, "epoch": 2684} {"train_loss": -12.843379974365234, "global_step": 451024, "epoch": 2684} {"train_loss": -12.685139656066895, "global_step": 451025, "epoch": 2684} {"train_loss": -12.745607376098633, "global_step": 451026, "epoch": 2684} {"train_loss": -12.985404968261719, "global_step": 451027, "epoch": 2684} {"train_loss": -12.937172889709473, "global_step": 451028, "epoch": 2684} {"train_loss": -12.856463432312012, "global_step": 451029, "epoch": 2684} {"train_loss": -12.88319206237793, "global_step": 451030, "epoch": 2684} {"train_loss": -12.853826522827148, "global_step": 451031, "epoch": 2684} {"train_loss": -12.809154510498047, "global_step": 451032, "epoch": 2684} {"train_loss": -12.72690486907959, "global_step": 451033, "epoch": 2684} {"train_loss": -12.77943229675293, "global_step": 451034, "epoch": 2684} {"train_loss": -12.794227600097656, "global_step": 451035, "epoch": 2684} {"train_loss": -12.9022798538208, "global_step": 451036, "epoch": 2684} {"train_loss": -13.10043716430664, "global_step": 451037, "epoch": 2684} {"train_loss": -12.673643112182617, "global_step": 451038, "epoch": 2684} {"train_loss": -12.463617324829102, "global_step": 451039, "epoch": 2684} {"train_loss": -12.794569969177246, "global_step": 451040, "epoch": 2684} {"train_loss": -13.140762329101562, "global_step": 451041, "epoch": 2684} {"train_loss": -12.825201034545898, "global_step": 451042, "epoch": 2684} {"train_loss": -12.790336608886719, "global_step": 451043, "epoch": 2684} {"train_loss": -12.889593124389648, "global_step": 451044, "epoch": 2684} {"train_loss": -12.947298049926758, "global_step": 451045, "epoch": 2684} {"train_loss": -12.07950210571289, "global_step": 451046, "epoch": 2684} {"train_loss": -12.026097297668457, "global_step": 451047, "epoch": 2684} {"train_loss": -11.861442565917969, "global_step": 451048, "epoch": 2684} {"train_loss": -12.568845748901367, "global_step": 451049, "epoch": 2684} {"train_loss": -12.247037887573242, "global_step": 451050, "epoch": 2684} {"train_loss": -12.285425186157227, "global_step": 451051, "epoch": 2684} {"train_loss": -11.432229995727539, "global_step": 451052, "epoch": 2684} {"train_loss": -11.609831809997559, "global_step": 451053, "epoch": 2684} {"train_loss": -12.613527297973633, "global_step": 451054, "epoch": 2684} {"train_loss": -11.831299781799316, "global_step": 451055, "epoch": 2684} {"train_loss": -9.681702613830566, "global_step": 451056, "epoch": 2684} {"train_loss": -11.573034286499023, "global_step": 451057, "epoch": 2684} {"train_loss": -12.078245162963867, "global_step": 451058, "epoch": 2684} {"train_loss": -11.718520164489746, "global_step": 451059, "epoch": 2684} {"train_loss": -11.641439437866211, "global_step": 451060, "epoch": 2684} {"train_loss": -12.291557312011719, "global_step": 451061, "epoch": 2684} {"train_loss": -10.496374130249023, "global_step": 451062, "epoch": 2684} {"train_loss": -12.132957458496094, "global_step": 451063, "epoch": 2684} {"train_loss": -11.891489028930664, "global_step": 451064, "epoch": 2684} {"train_loss": -12.260319709777832, "global_step": 451065, "epoch": 2684} {"train_loss": -11.475820541381836, "global_step": 451066, "epoch": 2684} {"train_loss": -12.185701370239258, "global_step": 451067, "epoch": 2684} {"train_loss": -12.069618225097656, "global_step": 451068, "epoch": 2684} {"train_loss": -11.855443954467773, "global_step": 451069, "epoch": 2684} {"train_loss": -11.377128601074219, "global_step": 451070, "epoch": 2684} {"train_loss": -11.819334030151367, "global_step": 451071, "epoch": 2684} {"train_loss": -11.116286277770996, "global_step": 451072, "epoch": 2684} {"train_loss": -10.002143859863281, "global_step": 451073, "epoch": 2684} {"train_loss": -12.340879440307617, "global_step": 451074, "epoch": 2684} {"train_loss": -10.498235702514648, "global_step": 451075, "epoch": 2684} {"train_loss": -10.713229179382324, "global_step": 451076, "epoch": 2684} {"train_loss": -11.930959701538086, "global_step": 451077, "epoch": 2684} {"train_loss": -10.31692123413086, "global_step": 451078, "epoch": 2684} {"train_loss": -11.917652601287479, "global_step": 451079, "epoch": 2684, "val_loss": 312251.09375} {"train_loss": -10.996121406555176, "global_step": 451080, "epoch": 2685} {"train_loss": -10.650053024291992, "global_step": 451081, "epoch": 2685} {"train_loss": -12.244993209838867, "global_step": 451082, "epoch": 2685} {"train_loss": -10.587261199951172, "global_step": 451083, "epoch": 2685} {"train_loss": -12.077444076538086, "global_step": 451084, "epoch": 2685} {"train_loss": -12.058517456054688, "global_step": 451085, "epoch": 2685} {"train_loss": -11.241042137145996, "global_step": 451086, "epoch": 2685} {"train_loss": -12.247309684753418, "global_step": 451087, "epoch": 2685} {"train_loss": -11.487998962402344, "global_step": 451088, "epoch": 2685} {"train_loss": -11.683034896850586, "global_step": 451089, "epoch": 2685} {"train_loss": -12.236446380615234, "global_step": 451090, "epoch": 2685} {"train_loss": -11.953887939453125, "global_step": 451091, "epoch": 2685} {"train_loss": -12.303892135620117, "global_step": 451092, "epoch": 2685} {"train_loss": -12.301575660705566, "global_step": 451093, "epoch": 2685} {"train_loss": -12.030344009399414, "global_step": 451094, "epoch": 2685} {"train_loss": -12.09170150756836, "global_step": 451095, "epoch": 2685} {"train_loss": -12.235190391540527, "global_step": 451096, "epoch": 2685} {"train_loss": -11.665332794189453, "global_step": 451097, "epoch": 2685} {"train_loss": -12.416753768920898, "global_step": 451098, "epoch": 2685} {"train_loss": -11.580320358276367, "global_step": 451099, "epoch": 2685} {"train_loss": -12.510202407836914, "global_step": 451100, "epoch": 2685} {"train_loss": -12.26051139831543, "global_step": 451101, "epoch": 2685} {"train_loss": -12.241113662719727, "global_step": 451102, "epoch": 2685} {"train_loss": -12.436245918273926, "global_step": 451103, "epoch": 2685} {"train_loss": -12.302234649658203, "global_step": 451104, "epoch": 2685} {"train_loss": -12.251834869384766, "global_step": 451105, "epoch": 2685} {"train_loss": -12.42127799987793, "global_step": 451106, "epoch": 2685} {"train_loss": -12.11099624633789, "global_step": 451107, "epoch": 2685} {"train_loss": -12.332966804504395, "global_step": 451108, "epoch": 2685} {"train_loss": -12.267942428588867, "global_step": 451109, "epoch": 2685} {"train_loss": -12.181571960449219, "global_step": 451110, "epoch": 2685} {"train_loss": -12.487604141235352, "global_step": 451111, "epoch": 2685} {"train_loss": -12.305402755737305, "global_step": 451112, "epoch": 2685} {"train_loss": -12.589425086975098, "global_step": 451113, "epoch": 2685} {"train_loss": -12.434175491333008, "global_step": 451114, "epoch": 2685} {"train_loss": -12.422833442687988, "global_step": 451115, "epoch": 2685} {"train_loss": -12.49155330657959, "global_step": 451116, "epoch": 2685} {"train_loss": -12.4921293258667, "global_step": 451117, "epoch": 2685} {"train_loss": -12.255370140075684, "global_step": 451118, "epoch": 2685} {"train_loss": -12.394466400146484, "global_step": 451119, "epoch": 2685} {"train_loss": -12.677841186523438, "global_step": 451120, "epoch": 2685} {"train_loss": -12.152383804321289, "global_step": 451121, "epoch": 2685} {"train_loss": -12.647136688232422, "global_step": 451122, "epoch": 2685} {"train_loss": -12.580713272094727, "global_step": 451123, "epoch": 2685} {"train_loss": -12.787376403808594, "global_step": 451124, "epoch": 2685} {"train_loss": -12.715713500976562, "global_step": 451125, "epoch": 2685} {"train_loss": -12.751200675964355, "global_step": 451126, "epoch": 2685} {"train_loss": -12.567354202270508, "global_step": 451127, "epoch": 2685} {"train_loss": -12.714991569519043, "global_step": 451128, "epoch": 2685} {"train_loss": -12.530571937561035, "global_step": 451129, "epoch": 2685} {"train_loss": -12.647354125976562, "global_step": 451130, "epoch": 2685} {"train_loss": -12.610183715820312, "global_step": 451131, "epoch": 2685} {"train_loss": -12.732650756835938, "global_step": 451132, "epoch": 2685} {"train_loss": -12.65113639831543, "global_step": 451133, "epoch": 2685} {"train_loss": -12.835517883300781, "global_step": 451134, "epoch": 2685} {"train_loss": -12.645584106445312, "global_step": 451135, "epoch": 2685} {"train_loss": -12.831073760986328, "global_step": 451136, "epoch": 2685} {"train_loss": -12.874073028564453, "global_step": 451137, "epoch": 2685} {"train_loss": -12.94395637512207, "global_step": 451138, "epoch": 2685} {"train_loss": -12.843449592590332, "global_step": 451139, "epoch": 2685} {"train_loss": -12.859726905822754, "global_step": 451140, "epoch": 2685} {"train_loss": -12.858657836914062, "global_step": 451141, "epoch": 2685} {"train_loss": -12.776298522949219, "global_step": 451142, "epoch": 2685} {"train_loss": -12.67327880859375, "global_step": 451143, "epoch": 2685} {"train_loss": -12.962236404418945, "global_step": 451144, "epoch": 2685} {"train_loss": -12.665998458862305, "global_step": 451145, "epoch": 2685} {"train_loss": -12.959585189819336, "global_step": 451146, "epoch": 2685} {"train_loss": -12.861981391906738, "global_step": 451147, "epoch": 2685} {"train_loss": -12.90289306640625, "global_step": 451148, "epoch": 2685} {"train_loss": -12.631343841552734, "global_step": 451149, "epoch": 2685} {"train_loss": -12.799718856811523, "global_step": 451150, "epoch": 2685} {"train_loss": -12.71470832824707, "global_step": 451151, "epoch": 2685} {"train_loss": -12.84669303894043, "global_step": 451152, "epoch": 2685} {"train_loss": -12.749679565429688, "global_step": 451153, "epoch": 2685} {"train_loss": -12.675130844116211, "global_step": 451154, "epoch": 2685} {"train_loss": -12.993368148803711, "global_step": 451155, "epoch": 2685} {"train_loss": -12.596002578735352, "global_step": 451156, "epoch": 2685} {"train_loss": -12.718843460083008, "global_step": 451157, "epoch": 2685} {"train_loss": -12.75114917755127, "global_step": 451158, "epoch": 2685} {"train_loss": -12.7451753616333, "global_step": 451159, "epoch": 2685} {"train_loss": -13.056371688842773, "global_step": 451160, "epoch": 2685} {"train_loss": -12.964584350585938, "global_step": 451161, "epoch": 2685} {"train_loss": -12.864002227783203, "global_step": 451162, "epoch": 2685} {"train_loss": -12.83461856842041, "global_step": 451163, "epoch": 2685} {"train_loss": -12.770122528076172, "global_step": 451164, "epoch": 2685} {"train_loss": -12.549628257751465, "global_step": 451165, "epoch": 2685} {"train_loss": -12.414206504821777, "global_step": 451166, "epoch": 2685} {"train_loss": -12.723794937133789, "global_step": 451167, "epoch": 2685} {"train_loss": -12.443521499633789, "global_step": 451168, "epoch": 2685} {"train_loss": -12.617981910705566, "global_step": 451169, "epoch": 2685} {"train_loss": -12.470403671264648, "global_step": 451170, "epoch": 2685} {"train_loss": -12.655210494995117, "global_step": 451171, "epoch": 2685} {"train_loss": -12.554018020629883, "global_step": 451172, "epoch": 2685} {"train_loss": -12.646858215332031, "global_step": 451173, "epoch": 2685} {"train_loss": -12.88682746887207, "global_step": 451174, "epoch": 2685} {"train_loss": -12.787949562072754, "global_step": 451175, "epoch": 2685} {"train_loss": -12.88194751739502, "global_step": 451176, "epoch": 2685} {"train_loss": -12.720060348510742, "global_step": 451177, "epoch": 2685} {"train_loss": -12.561997413635254, "global_step": 451178, "epoch": 2685} {"train_loss": -12.367578506469727, "global_step": 451179, "epoch": 2685} {"train_loss": -12.883907318115234, "global_step": 451180, "epoch": 2685} {"train_loss": -12.674373626708984, "global_step": 451181, "epoch": 2685} {"train_loss": -12.999156951904297, "global_step": 451182, "epoch": 2685} {"train_loss": -12.565544128417969, "global_step": 451183, "epoch": 2685} {"train_loss": -11.925288200378418, "global_step": 451184, "epoch": 2685} {"train_loss": -12.135858535766602, "global_step": 451185, "epoch": 2685} {"train_loss": -12.641745567321777, "global_step": 451186, "epoch": 2685} {"train_loss": -12.46860122680664, "global_step": 451187, "epoch": 2685} {"train_loss": -11.222877502441406, "global_step": 451188, "epoch": 2685} {"train_loss": -11.429876327514648, "global_step": 451189, "epoch": 2685} {"train_loss": -11.440899848937988, "global_step": 451190, "epoch": 2685} {"train_loss": -10.903644561767578, "global_step": 451191, "epoch": 2685} {"train_loss": -11.977989196777344, "global_step": 451192, "epoch": 2685} {"train_loss": -11.396960258483887, "global_step": 451193, "epoch": 2685} {"train_loss": -11.838607788085938, "global_step": 451194, "epoch": 2685} {"train_loss": -11.325030326843262, "global_step": 451195, "epoch": 2685} {"train_loss": -11.848526954650879, "global_step": 451196, "epoch": 2685} {"train_loss": -9.800209045410156, "global_step": 451197, "epoch": 2685} {"train_loss": -9.85582447052002, "global_step": 451198, "epoch": 2685} {"train_loss": -10.499131202697754, "global_step": 451199, "epoch": 2685} {"train_loss": -11.327502250671387, "global_step": 451200, "epoch": 2685} {"train_loss": -10.066441535949707, "global_step": 451201, "epoch": 2685} {"train_loss": -9.616900444030762, "global_step": 451202, "epoch": 2685} {"train_loss": -8.908651351928711, "global_step": 451203, "epoch": 2685} {"train_loss": -11.486963272094727, "global_step": 451204, "epoch": 2685} {"train_loss": -8.275352478027344, "global_step": 451205, "epoch": 2685} {"train_loss": -10.235799789428711, "global_step": 451206, "epoch": 2685} {"train_loss": -9.030653953552246, "global_step": 451207, "epoch": 2685} {"train_loss": -8.131013870239258, "global_step": 451208, "epoch": 2685} {"train_loss": -7.410791873931885, "global_step": 451209, "epoch": 2685} {"train_loss": -7.762848377227783, "global_step": 451210, "epoch": 2685} {"train_loss": -7.69182014465332, "global_step": 451211, "epoch": 2685} {"train_loss": -7.447924613952637, "global_step": 451212, "epoch": 2685} {"train_loss": -7.953711986541748, "global_step": 451213, "epoch": 2685} {"train_loss": -7.877079010009766, "global_step": 451214, "epoch": 2685} {"train_loss": -8.145544052124023, "global_step": 451215, "epoch": 2685} {"train_loss": -8.230936050415039, "global_step": 451216, "epoch": 2685} {"train_loss": -7.863022804260254, "global_step": 451217, "epoch": 2685} {"train_loss": -7.842081069946289, "global_step": 451218, "epoch": 2685} {"train_loss": -8.604776382446289, "global_step": 451219, "epoch": 2685} {"train_loss": -8.274328231811523, "global_step": 451220, "epoch": 2685} {"train_loss": -9.016740798950195, "global_step": 451221, "epoch": 2685} {"train_loss": -8.998403549194336, "global_step": 451222, "epoch": 2685} {"train_loss": -9.005133628845215, "global_step": 451223, "epoch": 2685} {"train_loss": -8.326005935668945, "global_step": 451224, "epoch": 2685} {"train_loss": -8.829399108886719, "global_step": 451225, "epoch": 2685} {"train_loss": -9.206876754760742, "global_step": 451226, "epoch": 2685} {"train_loss": -9.350180625915527, "global_step": 451227, "epoch": 2685} {"train_loss": -9.295109748840332, "global_step": 451228, "epoch": 2685} {"train_loss": -9.147416114807129, "global_step": 451229, "epoch": 2685} {"train_loss": -9.185495376586914, "global_step": 451230, "epoch": 2685} {"train_loss": -9.381156921386719, "global_step": 451231, "epoch": 2685} {"train_loss": -9.813152313232422, "global_step": 451232, "epoch": 2685} {"train_loss": -10.30086898803711, "global_step": 451233, "epoch": 2685} {"train_loss": -9.919599533081055, "global_step": 451234, "epoch": 2685} {"train_loss": -9.46451187133789, "global_step": 451235, "epoch": 2685} {"train_loss": -9.683187484741211, "global_step": 451236, "epoch": 2685} {"train_loss": -9.889534950256348, "global_step": 451237, "epoch": 2685} {"train_loss": -9.561456680297852, "global_step": 451238, "epoch": 2685} {"train_loss": -9.989950180053711, "global_step": 451239, "epoch": 2685} {"train_loss": -10.197031021118164, "global_step": 451240, "epoch": 2685} {"train_loss": -10.684012413024902, "global_step": 451241, "epoch": 2685} {"train_loss": -10.516107559204102, "global_step": 451242, "epoch": 2685} {"train_loss": -10.401994705200195, "global_step": 451243, "epoch": 2685} {"train_loss": -10.54258918762207, "global_step": 451244, "epoch": 2685} {"train_loss": -10.749208450317383, "global_step": 451245, "epoch": 2685} {"train_loss": -10.178102493286133, "global_step": 451246, "epoch": 2685} {"train_loss": -11.454626841204506, "global_step": 451247, "epoch": 2685, "val_loss": 308568.21875, "train_action_mse_error": 2.798034191131592} {"train_loss": -10.562512397766113, "global_step": 451248, "epoch": 2686} {"train_loss": -10.358394622802734, "global_step": 451249, "epoch": 2686} {"train_loss": -10.726884841918945, "global_step": 451250, "epoch": 2686} {"train_loss": -10.521493911743164, "global_step": 451251, "epoch": 2686} {"train_loss": -10.769407272338867, "global_step": 451252, "epoch": 2686} {"train_loss": -10.829010009765625, "global_step": 451253, "epoch": 2686} {"train_loss": -11.320344924926758, "global_step": 451254, "epoch": 2686} {"train_loss": -10.982645034790039, "global_step": 451255, "epoch": 2686} {"train_loss": -10.940231323242188, "global_step": 451256, "epoch": 2686} {"train_loss": -10.587827682495117, "global_step": 451257, "epoch": 2686} {"train_loss": -10.684038162231445, "global_step": 451258, "epoch": 2686} {"train_loss": -11.296163558959961, "global_step": 451259, "epoch": 2686} {"train_loss": -11.208709716796875, "global_step": 451260, "epoch": 2686} {"train_loss": -11.269193649291992, "global_step": 451261, "epoch": 2686} {"train_loss": -11.45947265625, "global_step": 451262, "epoch": 2686} {"train_loss": -11.591928482055664, "global_step": 451263, "epoch": 2686} {"train_loss": -11.498563766479492, "global_step": 451264, "epoch": 2686} {"train_loss": -11.14547348022461, "global_step": 451265, "epoch": 2686} {"train_loss": -11.50564956665039, "global_step": 451266, "epoch": 2686} {"train_loss": -11.602315902709961, "global_step": 451267, "epoch": 2686} {"train_loss": -11.921747207641602, "global_step": 451268, "epoch": 2686} {"train_loss": -11.272113800048828, "global_step": 451269, "epoch": 2686} {"train_loss": -11.224344253540039, "global_step": 451270, "epoch": 2686} {"train_loss": -11.239618301391602, "global_step": 451271, "epoch": 2686} {"train_loss": -10.38132095336914, "global_step": 451272, "epoch": 2686} {"train_loss": -11.48138427734375, "global_step": 451273, "epoch": 2686} {"train_loss": -9.451431274414062, "global_step": 451274, "epoch": 2686} {"train_loss": -9.387984275817871, "global_step": 451275, "epoch": 2686} {"train_loss": -9.907893180847168, "global_step": 451276, "epoch": 2686} {"train_loss": -9.817590713500977, "global_step": 451277, "epoch": 2686} {"train_loss": -11.16235065460205, "global_step": 451278, "epoch": 2686} {"train_loss": -10.619778633117676, "global_step": 451279, "epoch": 2686} {"train_loss": -10.096534729003906, "global_step": 451280, "epoch": 2686} {"train_loss": -10.329391479492188, "global_step": 451281, "epoch": 2686} {"train_loss": -10.596172332763672, "global_step": 451282, "epoch": 2686} {"train_loss": -10.88323974609375, "global_step": 451283, "epoch": 2686} {"train_loss": -10.560216903686523, "global_step": 451284, "epoch": 2686} {"train_loss": -10.655569076538086, "global_step": 451285, "epoch": 2686} {"train_loss": -11.280641555786133, "global_step": 451286, "epoch": 2686} {"train_loss": -10.737792015075684, "global_step": 451287, "epoch": 2686} {"train_loss": -10.798635482788086, "global_step": 451288, "epoch": 2686} {"train_loss": -11.422196388244629, "global_step": 451289, "epoch": 2686} {"train_loss": -11.079041481018066, "global_step": 451290, "epoch": 2686} {"train_loss": -11.406448364257812, "global_step": 451291, "epoch": 2686} {"train_loss": -12.085159301757812, "global_step": 451292, "epoch": 2686} {"train_loss": -11.417076110839844, "global_step": 451293, "epoch": 2686} {"train_loss": -12.17449951171875, "global_step": 451294, "epoch": 2686} {"train_loss": -11.557140350341797, "global_step": 451295, "epoch": 2686} {"train_loss": -12.081811904907227, "global_step": 451296, "epoch": 2686} {"train_loss": -11.708160400390625, "global_step": 451297, "epoch": 2686} {"train_loss": -10.826902389526367, "global_step": 451298, "epoch": 2686} {"train_loss": -11.063756942749023, "global_step": 451299, "epoch": 2686} {"train_loss": -11.946922302246094, "global_step": 451300, "epoch": 2686} {"train_loss": -11.045576095581055, "global_step": 451301, "epoch": 2686} {"train_loss": -11.855792999267578, "global_step": 451302, "epoch": 2686} {"train_loss": -11.192023277282715, "global_step": 451303, "epoch": 2686} {"train_loss": -11.644010543823242, "global_step": 451304, "epoch": 2686} {"train_loss": -11.680495262145996, "global_step": 451305, "epoch": 2686} {"train_loss": -11.743513107299805, "global_step": 451306, "epoch": 2686} {"train_loss": -11.315922737121582, "global_step": 451307, "epoch": 2686} {"train_loss": -11.927648544311523, "global_step": 451308, "epoch": 2686} {"train_loss": -11.588085174560547, "global_step": 451309, "epoch": 2686} {"train_loss": -12.404001235961914, "global_step": 451310, "epoch": 2686} {"train_loss": -11.93719482421875, "global_step": 451311, "epoch": 2686} {"train_loss": -11.641854286193848, "global_step": 451312, "epoch": 2686} {"train_loss": -11.844696044921875, "global_step": 451313, "epoch": 2686} {"train_loss": -11.517027854919434, "global_step": 451314, "epoch": 2686} {"train_loss": -11.595661163330078, "global_step": 451315, "epoch": 2686} {"train_loss": -11.793283462524414, "global_step": 451316, "epoch": 2686} {"train_loss": -12.012301445007324, "global_step": 451317, "epoch": 2686} {"train_loss": -11.788922309875488, "global_step": 451318, "epoch": 2686} {"train_loss": -11.746391296386719, "global_step": 451319, "epoch": 2686} {"train_loss": -11.732990264892578, "global_step": 451320, "epoch": 2686} {"train_loss": -11.91196060180664, "global_step": 451321, "epoch": 2686} {"train_loss": -11.296180725097656, "global_step": 451322, "epoch": 2686} {"train_loss": -12.028676986694336, "global_step": 451323, "epoch": 2686} {"train_loss": -11.54012680053711, "global_step": 451324, "epoch": 2686} {"train_loss": -12.062793731689453, "global_step": 451325, "epoch": 2686} {"train_loss": -11.927396774291992, "global_step": 451326, "epoch": 2686} {"train_loss": -12.007890701293945, "global_step": 451327, "epoch": 2686} {"train_loss": -11.88114070892334, "global_step": 451328, "epoch": 2686} {"train_loss": -11.997994422912598, "global_step": 451329, "epoch": 2686} {"train_loss": -11.978449821472168, "global_step": 451330, "epoch": 2686} {"train_loss": -12.07656478881836, "global_step": 451331, "epoch": 2686} {"train_loss": -12.211833953857422, "global_step": 451332, "epoch": 2686} {"train_loss": -11.831531524658203, "global_step": 451333, "epoch": 2686} {"train_loss": -12.2919921875, "global_step": 451334, "epoch": 2686} {"train_loss": -11.826924324035645, "global_step": 451335, "epoch": 2686} {"train_loss": -12.138489723205566, "global_step": 451336, "epoch": 2686} {"train_loss": -12.164396286010742, "global_step": 451337, "epoch": 2686} {"train_loss": -12.170133590698242, "global_step": 451338, "epoch": 2686} {"train_loss": -12.102250099182129, "global_step": 451339, "epoch": 2686} {"train_loss": -12.19352912902832, "global_step": 451340, "epoch": 2686} {"train_loss": -12.266820907592773, "global_step": 451341, "epoch": 2686} {"train_loss": -12.139934539794922, "global_step": 451342, "epoch": 2686} {"train_loss": -12.54778003692627, "global_step": 451343, "epoch": 2686} {"train_loss": -12.287253379821777, "global_step": 451344, "epoch": 2686} {"train_loss": -12.103689193725586, "global_step": 451345, "epoch": 2686} {"train_loss": -12.395678520202637, "global_step": 451346, "epoch": 2686} {"train_loss": -12.209693908691406, "global_step": 451347, "epoch": 2686} {"train_loss": -12.31714153289795, "global_step": 451348, "epoch": 2686} {"train_loss": -12.155240058898926, "global_step": 451349, "epoch": 2686} {"train_loss": -12.397628784179688, "global_step": 451350, "epoch": 2686} {"train_loss": -12.541152954101562, "global_step": 451351, "epoch": 2686} {"train_loss": -12.643884658813477, "global_step": 451352, "epoch": 2686} {"train_loss": -12.75949478149414, "global_step": 451353, "epoch": 2686} {"train_loss": -12.404071807861328, "global_step": 451354, "epoch": 2686} {"train_loss": -12.508203506469727, "global_step": 451355, "epoch": 2686} {"train_loss": -12.439720153808594, "global_step": 451356, "epoch": 2686} {"train_loss": -12.573269844055176, "global_step": 451357, "epoch": 2686} {"train_loss": -12.631977081298828, "global_step": 451358, "epoch": 2686} {"train_loss": -12.720788955688477, "global_step": 451359, "epoch": 2686} {"train_loss": -12.720808029174805, "global_step": 451360, "epoch": 2686} {"train_loss": -12.406778335571289, "global_step": 451361, "epoch": 2686} {"train_loss": -12.639857292175293, "global_step": 451362, "epoch": 2686} {"train_loss": -12.425949096679688, "global_step": 451363, "epoch": 2686} {"train_loss": -12.714431762695312, "global_step": 451364, "epoch": 2686} {"train_loss": -12.475568771362305, "global_step": 451365, "epoch": 2686} {"train_loss": -12.762453079223633, "global_step": 451366, "epoch": 2686} {"train_loss": -12.792806625366211, "global_step": 451367, "epoch": 2686} {"train_loss": -12.522626876831055, "global_step": 451368, "epoch": 2686} {"train_loss": -12.656061172485352, "global_step": 451369, "epoch": 2686} {"train_loss": -12.749837875366211, "global_step": 451370, "epoch": 2686} {"train_loss": -12.70059871673584, "global_step": 451371, "epoch": 2686} {"train_loss": -12.77596664428711, "global_step": 451372, "epoch": 2686} {"train_loss": -12.654483795166016, "global_step": 451373, "epoch": 2686} {"train_loss": -12.657712936401367, "global_step": 451374, "epoch": 2686} {"train_loss": -12.590362548828125, "global_step": 451375, "epoch": 2686} {"train_loss": -12.737432479858398, "global_step": 451376, "epoch": 2686} {"train_loss": -12.788321495056152, "global_step": 451377, "epoch": 2686} {"train_loss": -12.720416069030762, "global_step": 451378, "epoch": 2686} {"train_loss": -12.568163871765137, "global_step": 451379, "epoch": 2686} {"train_loss": -12.86400032043457, "global_step": 451380, "epoch": 2686} {"train_loss": -12.535712242126465, "global_step": 451381, "epoch": 2686} {"train_loss": -12.665319442749023, "global_step": 451382, "epoch": 2686} {"train_loss": -12.80056381225586, "global_step": 451383, "epoch": 2686} {"train_loss": -12.858918190002441, "global_step": 451384, "epoch": 2686} {"train_loss": -12.634750366210938, "global_step": 451385, "epoch": 2686} {"train_loss": -12.985645294189453, "global_step": 451386, "epoch": 2686} {"train_loss": -12.895824432373047, "global_step": 451387, "epoch": 2686} {"train_loss": -12.971089363098145, "global_step": 451388, "epoch": 2686} {"train_loss": -12.612295150756836, "global_step": 451389, "epoch": 2686} {"train_loss": -12.801056861877441, "global_step": 451390, "epoch": 2686} {"train_loss": -12.934528350830078, "global_step": 451391, "epoch": 2686} {"train_loss": -12.491739273071289, "global_step": 451392, "epoch": 2686} {"train_loss": -12.594816207885742, "global_step": 451393, "epoch": 2686} {"train_loss": -12.481315612792969, "global_step": 451394, "epoch": 2686} {"train_loss": -12.34980583190918, "global_step": 451395, "epoch": 2686} {"train_loss": -12.545124053955078, "global_step": 451396, "epoch": 2686} {"train_loss": -12.646364212036133, "global_step": 451397, "epoch": 2686} {"train_loss": -12.812889099121094, "global_step": 451398, "epoch": 2686} {"train_loss": -12.769437789916992, "global_step": 451399, "epoch": 2686} {"train_loss": -12.52711296081543, "global_step": 451400, "epoch": 2686} {"train_loss": -12.809967041015625, "global_step": 451401, "epoch": 2686} {"train_loss": -12.859046936035156, "global_step": 451402, "epoch": 2686} {"train_loss": -12.760269165039062, "global_step": 451403, "epoch": 2686} {"train_loss": -12.492368698120117, "global_step": 451404, "epoch": 2686} {"train_loss": -12.873430252075195, "global_step": 451405, "epoch": 2686} {"train_loss": -12.82771110534668, "global_step": 451406, "epoch": 2686} {"train_loss": -12.74794864654541, "global_step": 451407, "epoch": 2686} {"train_loss": -12.485641479492188, "global_step": 451408, "epoch": 2686} {"train_loss": -12.832962036132812, "global_step": 451409, "epoch": 2686} {"train_loss": -12.733793258666992, "global_step": 451410, "epoch": 2686} {"train_loss": -12.744549751281738, "global_step": 451411, "epoch": 2686} {"train_loss": -12.639826774597168, "global_step": 451412, "epoch": 2686} {"train_loss": -12.36485481262207, "global_step": 451413, "epoch": 2686} {"train_loss": -12.725265502929688, "global_step": 451414, "epoch": 2686} {"train_loss": -11.925699018296742, "global_step": 451415, "epoch": 2686, "val_loss": 313925.59375} {"train_loss": -12.205098152160645, "global_step": 451416, "epoch": 2687} {"train_loss": -11.988276481628418, "global_step": 451417, "epoch": 2687} {"train_loss": -12.56263256072998, "global_step": 451418, "epoch": 2687} {"train_loss": -12.88994026184082, "global_step": 451419, "epoch": 2687} {"train_loss": -12.015373229980469, "global_step": 451420, "epoch": 2687} {"train_loss": -12.296669006347656, "global_step": 451421, "epoch": 2687} {"train_loss": -12.233325958251953, "global_step": 451422, "epoch": 2687} {"train_loss": -12.327680587768555, "global_step": 451423, "epoch": 2687} {"train_loss": -11.92875862121582, "global_step": 451424, "epoch": 2687} {"train_loss": -12.507623672485352, "global_step": 451425, "epoch": 2687} {"train_loss": -12.588132858276367, "global_step": 451426, "epoch": 2687} {"train_loss": -12.013666152954102, "global_step": 451427, "epoch": 2687} {"train_loss": -12.426547050476074, "global_step": 451428, "epoch": 2687} {"train_loss": -11.859983444213867, "global_step": 451429, "epoch": 2687} {"train_loss": -11.943480491638184, "global_step": 451430, "epoch": 2687} {"train_loss": -12.21419906616211, "global_step": 451431, "epoch": 2687} {"train_loss": -12.585630416870117, "global_step": 451432, "epoch": 2687} {"train_loss": -12.357952117919922, "global_step": 451433, "epoch": 2687} {"train_loss": -12.053654670715332, "global_step": 451434, "epoch": 2687} {"train_loss": -11.843708038330078, "global_step": 451435, "epoch": 2687} {"train_loss": -12.150508880615234, "global_step": 451436, "epoch": 2687} {"train_loss": -12.127787590026855, "global_step": 451437, "epoch": 2687} {"train_loss": -12.322259902954102, "global_step": 451438, "epoch": 2687} {"train_loss": -11.737603187561035, "global_step": 451439, "epoch": 2687} {"train_loss": -12.425201416015625, "global_step": 451440, "epoch": 2687} {"train_loss": -12.24984073638916, "global_step": 451441, "epoch": 2687} {"train_loss": -12.461652755737305, "global_step": 451442, "epoch": 2687} {"train_loss": -12.239233016967773, "global_step": 451443, "epoch": 2687} {"train_loss": -11.145126342773438, "global_step": 451444, "epoch": 2687} {"train_loss": -12.571035385131836, "global_step": 451445, "epoch": 2687} {"train_loss": -11.784709930419922, "global_step": 451446, "epoch": 2687} {"train_loss": -11.10869026184082, "global_step": 451447, "epoch": 2687} {"train_loss": -12.720645904541016, "global_step": 451448, "epoch": 2687} {"train_loss": -10.456602096557617, "global_step": 451449, "epoch": 2687} {"train_loss": -11.364648818969727, "global_step": 451450, "epoch": 2687} {"train_loss": -10.623177528381348, "global_step": 451451, "epoch": 2687} {"train_loss": -10.967981338500977, "global_step": 451452, "epoch": 2687} {"train_loss": -11.299647331237793, "global_step": 451453, "epoch": 2687} {"train_loss": -11.430373191833496, "global_step": 451454, "epoch": 2687} {"train_loss": -10.024352073669434, "global_step": 451455, "epoch": 2687} {"train_loss": -11.936291694641113, "global_step": 451456, "epoch": 2687} {"train_loss": -11.184799194335938, "global_step": 451457, "epoch": 2687} {"train_loss": -12.341337203979492, "global_step": 451458, "epoch": 2687} {"train_loss": -11.785982131958008, "global_step": 451459, "epoch": 2687} {"train_loss": -11.975360870361328, "global_step": 451460, "epoch": 2687} {"train_loss": -12.019527435302734, "global_step": 451461, "epoch": 2687} {"train_loss": -12.058828353881836, "global_step": 451462, "epoch": 2687} {"train_loss": -12.387392044067383, "global_step": 451463, "epoch": 2687} {"train_loss": -12.205238342285156, "global_step": 451464, "epoch": 2687} {"train_loss": -11.648178100585938, "global_step": 451465, "epoch": 2687} {"train_loss": -12.061543464660645, "global_step": 451466, "epoch": 2687} {"train_loss": -12.021101951599121, "global_step": 451467, "epoch": 2687} {"train_loss": -12.049243927001953, "global_step": 451468, "epoch": 2687} {"train_loss": -11.927698135375977, "global_step": 451469, "epoch": 2687} {"train_loss": -11.846567153930664, "global_step": 451470, "epoch": 2687} {"train_loss": -11.94194221496582, "global_step": 451471, "epoch": 2687} {"train_loss": -11.722539901733398, "global_step": 451472, "epoch": 2687} {"train_loss": -12.368390083312988, "global_step": 451473, "epoch": 2687} {"train_loss": -12.08327865600586, "global_step": 451474, "epoch": 2687} {"train_loss": -12.119401931762695, "global_step": 451475, "epoch": 2687} {"train_loss": -12.126020431518555, "global_step": 451476, "epoch": 2687} {"train_loss": -12.20926284790039, "global_step": 451477, "epoch": 2687} {"train_loss": -11.864742279052734, "global_step": 451478, "epoch": 2687} {"train_loss": -11.823434829711914, "global_step": 451479, "epoch": 2687} {"train_loss": -12.029146194458008, "global_step": 451480, "epoch": 2687} {"train_loss": -12.169717788696289, "global_step": 451481, "epoch": 2687} {"train_loss": -11.988265991210938, "global_step": 451482, "epoch": 2687} {"train_loss": -12.347023010253906, "global_step": 451483, "epoch": 2687} {"train_loss": -12.229219436645508, "global_step": 451484, "epoch": 2687} {"train_loss": -12.24820327758789, "global_step": 451485, "epoch": 2687} {"train_loss": -12.129690170288086, "global_step": 451486, "epoch": 2687} {"train_loss": -12.240242004394531, "global_step": 451487, "epoch": 2687} {"train_loss": -11.97143268585205, "global_step": 451488, "epoch": 2687} {"train_loss": -11.957990646362305, "global_step": 451489, "epoch": 2687} {"train_loss": -12.665763854980469, "global_step": 451490, "epoch": 2687} {"train_loss": -12.341536521911621, "global_step": 451491, "epoch": 2687} {"train_loss": -12.463922500610352, "global_step": 451492, "epoch": 2687} {"train_loss": -12.384086608886719, "global_step": 451493, "epoch": 2687} {"train_loss": -12.5103120803833, "global_step": 451494, "epoch": 2687} {"train_loss": -12.547449111938477, "global_step": 451495, "epoch": 2687} {"train_loss": -12.591769218444824, "global_step": 451496, "epoch": 2687} {"train_loss": -12.207904815673828, "global_step": 451497, "epoch": 2687} {"train_loss": -12.720062255859375, "global_step": 451498, "epoch": 2687} {"train_loss": -11.60279655456543, "global_step": 451499, "epoch": 2687} {"train_loss": -12.520809173583984, "global_step": 451500, "epoch": 2687} {"train_loss": -12.403584480285645, "global_step": 451501, "epoch": 2687} {"train_loss": -11.932520866394043, "global_step": 451502, "epoch": 2687} {"train_loss": -12.565266609191895, "global_step": 451503, "epoch": 2687} {"train_loss": -12.340898513793945, "global_step": 451504, "epoch": 2687} {"train_loss": -12.008198738098145, "global_step": 451505, "epoch": 2687} {"train_loss": -12.412044525146484, "global_step": 451506, "epoch": 2687} {"train_loss": -12.32961654663086, "global_step": 451507, "epoch": 2687} {"train_loss": -12.00588321685791, "global_step": 451508, "epoch": 2687} {"train_loss": -11.952522277832031, "global_step": 451509, "epoch": 2687} {"train_loss": -12.156726837158203, "global_step": 451510, "epoch": 2687} {"train_loss": -12.249436378479004, "global_step": 451511, "epoch": 2687} {"train_loss": -11.837451934814453, "global_step": 451512, "epoch": 2687} {"train_loss": -12.654007911682129, "global_step": 451513, "epoch": 2687} {"train_loss": -11.963722229003906, "global_step": 451514, "epoch": 2687} {"train_loss": -11.725639343261719, "global_step": 451515, "epoch": 2687} {"train_loss": -12.648767471313477, "global_step": 451516, "epoch": 2687} {"train_loss": -10.872184753417969, "global_step": 451517, "epoch": 2687} {"train_loss": -11.896021842956543, "global_step": 451518, "epoch": 2687} {"train_loss": -11.490628242492676, "global_step": 451519, "epoch": 2687} {"train_loss": -10.319067001342773, "global_step": 451520, "epoch": 2687} {"train_loss": -9.915364265441895, "global_step": 451521, "epoch": 2687} {"train_loss": -11.942876815795898, "global_step": 451522, "epoch": 2687} {"train_loss": -8.722509384155273, "global_step": 451523, "epoch": 2687} {"train_loss": -8.306652069091797, "global_step": 451524, "epoch": 2687} {"train_loss": -8.594449996948242, "global_step": 451525, "epoch": 2687} {"train_loss": -9.560375213623047, "global_step": 451526, "epoch": 2687} {"train_loss": -9.735466957092285, "global_step": 451527, "epoch": 2687} {"train_loss": -11.490564346313477, "global_step": 451528, "epoch": 2687} {"train_loss": -10.628501892089844, "global_step": 451529, "epoch": 2687} {"train_loss": -12.030599594116211, "global_step": 451530, "epoch": 2687} {"train_loss": -10.445123672485352, "global_step": 451531, "epoch": 2687} {"train_loss": -11.385891914367676, "global_step": 451532, "epoch": 2687} {"train_loss": -8.438888549804688, "global_step": 451533, "epoch": 2687} {"train_loss": -9.630526542663574, "global_step": 451534, "epoch": 2687} {"train_loss": -10.77828598022461, "global_step": 451535, "epoch": 2687} {"train_loss": -9.713476181030273, "global_step": 451536, "epoch": 2687} {"train_loss": -9.014726638793945, "global_step": 451537, "epoch": 2687} {"train_loss": -11.454912185668945, "global_step": 451538, "epoch": 2687} {"train_loss": -9.36699390411377, "global_step": 451539, "epoch": 2687} {"train_loss": -10.92098617553711, "global_step": 451540, "epoch": 2687} {"train_loss": -10.092855453491211, "global_step": 451541, "epoch": 2687} {"train_loss": -10.012654304504395, "global_step": 451542, "epoch": 2687} {"train_loss": -10.403377532958984, "global_step": 451543, "epoch": 2687} {"train_loss": -10.844035148620605, "global_step": 451544, "epoch": 2687} {"train_loss": -11.3388671875, "global_step": 451545, "epoch": 2687} {"train_loss": -11.30162239074707, "global_step": 451546, "epoch": 2687} {"train_loss": -11.566177368164062, "global_step": 451547, "epoch": 2687} {"train_loss": -11.251578330993652, "global_step": 451548, "epoch": 2687} {"train_loss": -11.106189727783203, "global_step": 451549, "epoch": 2687} {"train_loss": -11.886356353759766, "global_step": 451550, "epoch": 2687} {"train_loss": -11.54964828491211, "global_step": 451551, "epoch": 2687} {"train_loss": -11.709430694580078, "global_step": 451552, "epoch": 2687} {"train_loss": -11.898752212524414, "global_step": 451553, "epoch": 2687} {"train_loss": -11.837051391601562, "global_step": 451554, "epoch": 2687} {"train_loss": -11.908148765563965, "global_step": 451555, "epoch": 2687} {"train_loss": -11.817517280578613, "global_step": 451556, "epoch": 2687} {"train_loss": -12.030274391174316, "global_step": 451557, "epoch": 2687} {"train_loss": -12.150044441223145, "global_step": 451558, "epoch": 2687} {"train_loss": -12.054353713989258, "global_step": 451559, "epoch": 2687} {"train_loss": -12.16987419128418, "global_step": 451560, "epoch": 2687} {"train_loss": -12.307242393493652, "global_step": 451561, "epoch": 2687} {"train_loss": -12.164276123046875, "global_step": 451562, "epoch": 2687} {"train_loss": -12.376446723937988, "global_step": 451563, "epoch": 2687} {"train_loss": -12.012646675109863, "global_step": 451564, "epoch": 2687} {"train_loss": -12.379124641418457, "global_step": 451565, "epoch": 2687} {"train_loss": -11.890501022338867, "global_step": 451566, "epoch": 2687} {"train_loss": -12.207071304321289, "global_step": 451567, "epoch": 2687} {"train_loss": -12.381143569946289, "global_step": 451568, "epoch": 2687} {"train_loss": -12.061399459838867, "global_step": 451569, "epoch": 2687} {"train_loss": -12.021655082702637, "global_step": 451570, "epoch": 2687} {"train_loss": -12.20553970336914, "global_step": 451571, "epoch": 2687} {"train_loss": -12.2844877243042, "global_step": 451572, "epoch": 2687} {"train_loss": -12.418107032775879, "global_step": 451573, "epoch": 2687} {"train_loss": -11.921598434448242, "global_step": 451574, "epoch": 2687} {"train_loss": -12.27147388458252, "global_step": 451575, "epoch": 2687} {"train_loss": -12.150665283203125, "global_step": 451576, "epoch": 2687} {"train_loss": -12.203285217285156, "global_step": 451577, "epoch": 2687} {"train_loss": -12.416879653930664, "global_step": 451578, "epoch": 2687} {"train_loss": -12.228825569152832, "global_step": 451579, "epoch": 2687} {"train_loss": -12.441078186035156, "global_step": 451580, "epoch": 2687} {"train_loss": -11.9503173828125, "global_step": 451581, "epoch": 2687} {"train_loss": -12.215811729431152, "global_step": 451582, "epoch": 2687} {"train_loss": -11.753170098577227, "global_step": 451583, "epoch": 2687, "val_loss": 307191.84375} {"train_loss": -12.428297996520996, "global_step": 451584, "epoch": 2688} {"train_loss": -12.068754196166992, "global_step": 451585, "epoch": 2688} {"train_loss": -11.729754447937012, "global_step": 451586, "epoch": 2688} {"train_loss": -12.344146728515625, "global_step": 451587, "epoch": 2688} {"train_loss": -11.799798965454102, "global_step": 451588, "epoch": 2688} {"train_loss": -12.674006462097168, "global_step": 451589, "epoch": 2688} {"train_loss": -12.297513008117676, "global_step": 451590, "epoch": 2688} {"train_loss": -12.343945503234863, "global_step": 451591, "epoch": 2688} {"train_loss": -12.2457275390625, "global_step": 451592, "epoch": 2688} {"train_loss": -12.412504196166992, "global_step": 451593, "epoch": 2688} {"train_loss": -12.532232284545898, "global_step": 451594, "epoch": 2688} {"train_loss": -12.318323135375977, "global_step": 451595, "epoch": 2688} {"train_loss": -12.524382591247559, "global_step": 451596, "epoch": 2688} {"train_loss": -12.43111515045166, "global_step": 451597, "epoch": 2688} {"train_loss": -12.099065780639648, "global_step": 451598, "epoch": 2688} {"train_loss": -12.329540252685547, "global_step": 451599, "epoch": 2688} {"train_loss": -12.39971923828125, "global_step": 451600, "epoch": 2688} {"train_loss": -12.092071533203125, "global_step": 451601, "epoch": 2688} {"train_loss": -12.283124923706055, "global_step": 451602, "epoch": 2688} {"train_loss": -12.156037330627441, "global_step": 451603, "epoch": 2688} {"train_loss": -11.976577758789062, "global_step": 451604, "epoch": 2688} {"train_loss": -12.070140838623047, "global_step": 451605, "epoch": 2688} {"train_loss": -12.273885726928711, "global_step": 451606, "epoch": 2688} {"train_loss": -11.510663032531738, "global_step": 451607, "epoch": 2688} {"train_loss": -12.38007640838623, "global_step": 451608, "epoch": 2688} {"train_loss": -12.2823486328125, "global_step": 451609, "epoch": 2688} {"train_loss": -12.167398452758789, "global_step": 451610, "epoch": 2688} {"train_loss": -12.188497543334961, "global_step": 451611, "epoch": 2688} {"train_loss": -12.333399772644043, "global_step": 451612, "epoch": 2688} {"train_loss": -12.470702171325684, "global_step": 451613, "epoch": 2688} {"train_loss": -12.374451637268066, "global_step": 451614, "epoch": 2688} {"train_loss": -12.246877670288086, "global_step": 451615, "epoch": 2688} {"train_loss": -12.12259292602539, "global_step": 451616, "epoch": 2688} {"train_loss": -12.220279693603516, "global_step": 451617, "epoch": 2688} {"train_loss": -12.388697624206543, "global_step": 451618, "epoch": 2688} {"train_loss": -12.378660202026367, "global_step": 451619, "epoch": 2688} {"train_loss": -12.11314582824707, "global_step": 451620, "epoch": 2688} {"train_loss": -12.14008903503418, "global_step": 451621, "epoch": 2688} {"train_loss": -11.991011619567871, "global_step": 451622, "epoch": 2688} {"train_loss": -12.186010360717773, "global_step": 451623, "epoch": 2688} {"train_loss": -11.916306495666504, "global_step": 451624, "epoch": 2688} {"train_loss": -12.23109245300293, "global_step": 451625, "epoch": 2688} {"train_loss": -11.900830268859863, "global_step": 451626, "epoch": 2688} {"train_loss": -12.629369735717773, "global_step": 451627, "epoch": 2688} {"train_loss": -12.39567756652832, "global_step": 451628, "epoch": 2688} {"train_loss": -12.469650268554688, "global_step": 451629, "epoch": 2688} {"train_loss": -12.13843822479248, "global_step": 451630, "epoch": 2688} {"train_loss": -12.080887794494629, "global_step": 451631, "epoch": 2688} {"train_loss": -12.652178764343262, "global_step": 451632, "epoch": 2688} {"train_loss": -12.212775230407715, "global_step": 451633, "epoch": 2688} {"train_loss": -12.519651412963867, "global_step": 451634, "epoch": 2688} {"train_loss": -12.078889846801758, "global_step": 451635, "epoch": 2688} {"train_loss": -11.451881408691406, "global_step": 451636, "epoch": 2688} {"train_loss": -11.81362533569336, "global_step": 451637, "epoch": 2688} {"train_loss": -12.181370735168457, "global_step": 451638, "epoch": 2688} {"train_loss": -12.080150604248047, "global_step": 451639, "epoch": 2688} {"train_loss": -11.798295974731445, "global_step": 451640, "epoch": 2688} {"train_loss": -12.12435531616211, "global_step": 451641, "epoch": 2688} {"train_loss": -11.49585247039795, "global_step": 451642, "epoch": 2688} {"train_loss": -11.478815078735352, "global_step": 451643, "epoch": 2688} {"train_loss": -12.694339752197266, "global_step": 451644, "epoch": 2688} {"train_loss": -11.537063598632812, "global_step": 451645, "epoch": 2688} {"train_loss": -12.175564765930176, "global_step": 451646, "epoch": 2688} {"train_loss": -11.947690963745117, "global_step": 451647, "epoch": 2688} {"train_loss": -11.97105598449707, "global_step": 451648, "epoch": 2688} {"train_loss": -12.174519538879395, "global_step": 451649, "epoch": 2688} {"train_loss": -12.136119842529297, "global_step": 451650, "epoch": 2688} {"train_loss": -12.114197731018066, "global_step": 451651, "epoch": 2688} {"train_loss": -12.3987455368042, "global_step": 451652, "epoch": 2688} {"train_loss": -11.644922256469727, "global_step": 451653, "epoch": 2688} {"train_loss": -12.205863952636719, "global_step": 451654, "epoch": 2688} {"train_loss": -12.345236778259277, "global_step": 451655, "epoch": 2688} {"train_loss": -11.881526947021484, "global_step": 451656, "epoch": 2688} {"train_loss": -12.258158683776855, "global_step": 451657, "epoch": 2688} {"train_loss": -12.041533470153809, "global_step": 451658, "epoch": 2688} {"train_loss": -10.981428146362305, "global_step": 451659, "epoch": 2688} {"train_loss": -10.306978225708008, "global_step": 451660, "epoch": 2688} {"train_loss": -10.58228874206543, "global_step": 451661, "epoch": 2688} {"train_loss": -11.464947700500488, "global_step": 451662, "epoch": 2688} {"train_loss": -10.859914779663086, "global_step": 451663, "epoch": 2688} {"train_loss": -11.594755172729492, "global_step": 451664, "epoch": 2688} {"train_loss": -11.22305679321289, "global_step": 451665, "epoch": 2688} {"train_loss": -11.419395446777344, "global_step": 451666, "epoch": 2688} {"train_loss": -10.934231758117676, "global_step": 451667, "epoch": 2688} {"train_loss": -12.172589302062988, "global_step": 451668, "epoch": 2688} {"train_loss": -11.4955472946167, "global_step": 451669, "epoch": 2688} {"train_loss": -11.337209701538086, "global_step": 451670, "epoch": 2688} {"train_loss": -11.770841598510742, "global_step": 451671, "epoch": 2688} {"train_loss": -11.258378982543945, "global_step": 451672, "epoch": 2688} {"train_loss": -11.950836181640625, "global_step": 451673, "epoch": 2688} {"train_loss": -11.203702926635742, "global_step": 451674, "epoch": 2688} {"train_loss": -12.093908309936523, "global_step": 451675, "epoch": 2688} {"train_loss": -11.4158296585083, "global_step": 451676, "epoch": 2688} {"train_loss": -11.900175094604492, "global_step": 451677, "epoch": 2688} {"train_loss": -11.714286804199219, "global_step": 451678, "epoch": 2688} {"train_loss": -11.479511260986328, "global_step": 451679, "epoch": 2688} {"train_loss": -12.408329010009766, "global_step": 451680, "epoch": 2688} {"train_loss": -11.920653343200684, "global_step": 451681, "epoch": 2688} {"train_loss": -12.263813972473145, "global_step": 451682, "epoch": 2688} {"train_loss": -11.640179634094238, "global_step": 451683, "epoch": 2688} {"train_loss": -11.84485149383545, "global_step": 451684, "epoch": 2688} {"train_loss": -11.711652755737305, "global_step": 451685, "epoch": 2688} {"train_loss": -12.21497917175293, "global_step": 451686, "epoch": 2688} {"train_loss": -11.914274215698242, "global_step": 451687, "epoch": 2688} {"train_loss": -12.098146438598633, "global_step": 451688, "epoch": 2688} {"train_loss": -12.1045560836792, "global_step": 451689, "epoch": 2688} {"train_loss": -12.148073196411133, "global_step": 451690, "epoch": 2688} {"train_loss": -12.31779670715332, "global_step": 451691, "epoch": 2688} {"train_loss": -12.009130477905273, "global_step": 451692, "epoch": 2688} {"train_loss": -12.088823318481445, "global_step": 451693, "epoch": 2688} {"train_loss": -12.09296703338623, "global_step": 451694, "epoch": 2688} {"train_loss": -12.022594451904297, "global_step": 451695, "epoch": 2688} {"train_loss": -12.323101043701172, "global_step": 451696, "epoch": 2688} {"train_loss": -11.974223136901855, "global_step": 451697, "epoch": 2688} {"train_loss": -12.370231628417969, "global_step": 451698, "epoch": 2688} {"train_loss": -11.96591567993164, "global_step": 451699, "epoch": 2688} {"train_loss": -12.213332176208496, "global_step": 451700, "epoch": 2688} {"train_loss": -11.946565628051758, "global_step": 451701, "epoch": 2688} {"train_loss": -12.135753631591797, "global_step": 451702, "epoch": 2688} {"train_loss": -11.858166694641113, "global_step": 451703, "epoch": 2688} {"train_loss": -11.75936222076416, "global_step": 451704, "epoch": 2688} {"train_loss": -12.027180671691895, "global_step": 451705, "epoch": 2688} {"train_loss": -10.997419357299805, "global_step": 451706, "epoch": 2688} {"train_loss": -11.707858085632324, "global_step": 451707, "epoch": 2688} {"train_loss": -11.23741340637207, "global_step": 451708, "epoch": 2688} {"train_loss": -11.82046890258789, "global_step": 451709, "epoch": 2688} {"train_loss": -11.56301498413086, "global_step": 451710, "epoch": 2688} {"train_loss": -11.767717361450195, "global_step": 451711, "epoch": 2688} {"train_loss": -11.788753509521484, "global_step": 451712, "epoch": 2688} {"train_loss": -11.909900665283203, "global_step": 451713, "epoch": 2688} {"train_loss": -11.834253311157227, "global_step": 451714, "epoch": 2688} {"train_loss": -11.884858131408691, "global_step": 451715, "epoch": 2688} {"train_loss": -12.037428855895996, "global_step": 451716, "epoch": 2688} {"train_loss": -12.119460105895996, "global_step": 451717, "epoch": 2688} {"train_loss": -12.484609603881836, "global_step": 451718, "epoch": 2688} {"train_loss": -11.925497055053711, "global_step": 451719, "epoch": 2688} {"train_loss": -12.430523872375488, "global_step": 451720, "epoch": 2688} {"train_loss": -11.67791748046875, "global_step": 451721, "epoch": 2688} {"train_loss": -12.090672492980957, "global_step": 451722, "epoch": 2688} {"train_loss": -12.14940357208252, "global_step": 451723, "epoch": 2688} {"train_loss": -11.987667083740234, "global_step": 451724, "epoch": 2688} {"train_loss": -12.122135162353516, "global_step": 451725, "epoch": 2688} {"train_loss": -11.970024108886719, "global_step": 451726, "epoch": 2688} {"train_loss": -12.478031158447266, "global_step": 451727, "epoch": 2688} {"train_loss": -12.119900703430176, "global_step": 451728, "epoch": 2688} {"train_loss": -12.295646667480469, "global_step": 451729, "epoch": 2688} {"train_loss": -12.136436462402344, "global_step": 451730, "epoch": 2688} {"train_loss": -12.251678466796875, "global_step": 451731, "epoch": 2688} {"train_loss": -12.19596004486084, "global_step": 451732, "epoch": 2688} {"train_loss": -11.94019889831543, "global_step": 451733, "epoch": 2688} {"train_loss": -12.166675567626953, "global_step": 451734, "epoch": 2688} {"train_loss": -12.058631896972656, "global_step": 451735, "epoch": 2688} {"train_loss": -12.267772674560547, "global_step": 451736, "epoch": 2688} {"train_loss": -12.267971992492676, "global_step": 451737, "epoch": 2688} {"train_loss": -11.941213607788086, "global_step": 451738, "epoch": 2688} {"train_loss": -11.999978065490723, "global_step": 451739, "epoch": 2688} {"train_loss": -11.938526153564453, "global_step": 451740, "epoch": 2688} {"train_loss": -12.28262710571289, "global_step": 451741, "epoch": 2688} {"train_loss": -12.099411964416504, "global_step": 451742, "epoch": 2688} {"train_loss": -12.330327987670898, "global_step": 451743, "epoch": 2688} {"train_loss": -11.913021087646484, "global_step": 451744, "epoch": 2688} {"train_loss": -12.234554290771484, "global_step": 451745, "epoch": 2688} {"train_loss": -11.718267440795898, "global_step": 451746, "epoch": 2688} {"train_loss": -12.282397270202637, "global_step": 451747, "epoch": 2688} {"train_loss": -12.18001937866211, "global_step": 451748, "epoch": 2688} {"train_loss": -12.113418579101562, "global_step": 451749, "epoch": 2688} {"train_loss": -12.146968841552734, "global_step": 451750, "epoch": 2688} {"train_loss": -12.012907073611306, "global_step": 451751, "epoch": 2688, "val_loss": 307206.0} {"train_loss": -12.354957580566406, "global_step": 451752, "epoch": 2689} {"train_loss": -12.290741920471191, "global_step": 451753, "epoch": 2689} {"train_loss": -12.01829719543457, "global_step": 451754, "epoch": 2689} {"train_loss": -11.891353607177734, "global_step": 451755, "epoch": 2689} {"train_loss": -11.473844528198242, "global_step": 451756, "epoch": 2689} {"train_loss": -12.195789337158203, "global_step": 451757, "epoch": 2689} {"train_loss": -11.715103149414062, "global_step": 451758, "epoch": 2689} {"train_loss": -11.917228698730469, "global_step": 451759, "epoch": 2689} {"train_loss": -12.369193077087402, "global_step": 451760, "epoch": 2689} {"train_loss": -12.279972076416016, "global_step": 451761, "epoch": 2689} {"train_loss": -12.220611572265625, "global_step": 451762, "epoch": 2689} {"train_loss": -12.15986442565918, "global_step": 451763, "epoch": 2689} {"train_loss": -12.22938346862793, "global_step": 451764, "epoch": 2689} {"train_loss": -11.710774421691895, "global_step": 451765, "epoch": 2689} {"train_loss": -11.943559646606445, "global_step": 451766, "epoch": 2689} {"train_loss": -11.973390579223633, "global_step": 451767, "epoch": 2689} {"train_loss": -11.58493423461914, "global_step": 451768, "epoch": 2689} {"train_loss": -12.59412956237793, "global_step": 451769, "epoch": 2689} {"train_loss": -11.909025192260742, "global_step": 451770, "epoch": 2689} {"train_loss": -12.248497009277344, "global_step": 451771, "epoch": 2689} {"train_loss": -12.304084777832031, "global_step": 451772, "epoch": 2689} {"train_loss": -12.234042167663574, "global_step": 451773, "epoch": 2689} {"train_loss": -12.415154457092285, "global_step": 451774, "epoch": 2689} {"train_loss": -12.191581726074219, "global_step": 451775, "epoch": 2689} {"train_loss": -12.491966247558594, "global_step": 451776, "epoch": 2689} {"train_loss": -12.461440086364746, "global_step": 451777, "epoch": 2689} {"train_loss": -12.313314437866211, "global_step": 451778, "epoch": 2689} {"train_loss": -12.804727554321289, "global_step": 451779, "epoch": 2689} {"train_loss": -12.495466232299805, "global_step": 451780, "epoch": 2689} {"train_loss": -12.560884475708008, "global_step": 451781, "epoch": 2689} {"train_loss": -12.400629043579102, "global_step": 451782, "epoch": 2689} {"train_loss": -12.643173217773438, "global_step": 451783, "epoch": 2689} {"train_loss": -12.755441665649414, "global_step": 451784, "epoch": 2689} {"train_loss": -12.5525541305542, "global_step": 451785, "epoch": 2689} {"train_loss": -12.71731185913086, "global_step": 451786, "epoch": 2689} {"train_loss": -12.472997665405273, "global_step": 451787, "epoch": 2689} {"train_loss": -12.31037712097168, "global_step": 451788, "epoch": 2689} {"train_loss": -12.476338386535645, "global_step": 451789, "epoch": 2689} {"train_loss": -12.367021560668945, "global_step": 451790, "epoch": 2689} {"train_loss": -12.568695068359375, "global_step": 451791, "epoch": 2689} {"train_loss": -12.474679946899414, "global_step": 451792, "epoch": 2689} {"train_loss": -12.545930862426758, "global_step": 451793, "epoch": 2689} {"train_loss": -12.465755462646484, "global_step": 451794, "epoch": 2689} {"train_loss": -12.661147117614746, "global_step": 451795, "epoch": 2689} {"train_loss": -12.626810073852539, "global_step": 451796, "epoch": 2689} {"train_loss": -12.584428787231445, "global_step": 451797, "epoch": 2689} {"train_loss": -12.424848556518555, "global_step": 451798, "epoch": 2689} {"train_loss": -12.644246101379395, "global_step": 451799, "epoch": 2689} {"train_loss": -12.686173439025879, "global_step": 451800, "epoch": 2689} {"train_loss": -12.685466766357422, "global_step": 451801, "epoch": 2689} {"train_loss": -12.84929084777832, "global_step": 451802, "epoch": 2689} {"train_loss": -12.759307861328125, "global_step": 451803, "epoch": 2689} {"train_loss": -12.670315742492676, "global_step": 451804, "epoch": 2689} {"train_loss": -12.906508445739746, "global_step": 451805, "epoch": 2689} {"train_loss": -12.72891616821289, "global_step": 451806, "epoch": 2689} {"train_loss": -12.549636840820312, "global_step": 451807, "epoch": 2689} {"train_loss": -12.75172233581543, "global_step": 451808, "epoch": 2689} {"train_loss": -12.459218978881836, "global_step": 451809, "epoch": 2689} {"train_loss": -12.779440879821777, "global_step": 451810, "epoch": 2689} {"train_loss": -12.322118759155273, "global_step": 451811, "epoch": 2689} {"train_loss": -12.882831573486328, "global_step": 451812, "epoch": 2689} {"train_loss": -12.801427841186523, "global_step": 451813, "epoch": 2689} {"train_loss": -12.667940139770508, "global_step": 451814, "epoch": 2689} {"train_loss": -12.81789493560791, "global_step": 451815, "epoch": 2689} {"train_loss": -12.635009765625, "global_step": 451816, "epoch": 2689} {"train_loss": -12.736967086791992, "global_step": 451817, "epoch": 2689} {"train_loss": -12.648134231567383, "global_step": 451818, "epoch": 2689} {"train_loss": -12.783432006835938, "global_step": 451819, "epoch": 2689} {"train_loss": -12.45301342010498, "global_step": 451820, "epoch": 2689} {"train_loss": -12.7760009765625, "global_step": 451821, "epoch": 2689} {"train_loss": -12.486021041870117, "global_step": 451822, "epoch": 2689} {"train_loss": -12.721940994262695, "global_step": 451823, "epoch": 2689} {"train_loss": -12.700613021850586, "global_step": 451824, "epoch": 2689} {"train_loss": -12.894184112548828, "global_step": 451825, "epoch": 2689} {"train_loss": -12.510894775390625, "global_step": 451826, "epoch": 2689} {"train_loss": -12.698080062866211, "global_step": 451827, "epoch": 2689} {"train_loss": -12.438016891479492, "global_step": 451828, "epoch": 2689} {"train_loss": -12.856987953186035, "global_step": 451829, "epoch": 2689} {"train_loss": -12.330536842346191, "global_step": 451830, "epoch": 2689} {"train_loss": -12.628341674804688, "global_step": 451831, "epoch": 2689} {"train_loss": -12.462095260620117, "global_step": 451832, "epoch": 2689} {"train_loss": -12.882913589477539, "global_step": 451833, "epoch": 2689} {"train_loss": -12.65707015991211, "global_step": 451834, "epoch": 2689} {"train_loss": -12.311079978942871, "global_step": 451835, "epoch": 2689} {"train_loss": -12.51339054107666, "global_step": 451836, "epoch": 2689} {"train_loss": -12.533723831176758, "global_step": 451837, "epoch": 2689} {"train_loss": -12.85588264465332, "global_step": 451838, "epoch": 2689} {"train_loss": -12.341836929321289, "global_step": 451839, "epoch": 2689} {"train_loss": -12.52119255065918, "global_step": 451840, "epoch": 2689} {"train_loss": -12.363828659057617, "global_step": 451841, "epoch": 2689} {"train_loss": -12.492441177368164, "global_step": 451842, "epoch": 2689} {"train_loss": -12.684993743896484, "global_step": 451843, "epoch": 2689} {"train_loss": -12.47182846069336, "global_step": 451844, "epoch": 2689} {"train_loss": -12.86840534210205, "global_step": 451845, "epoch": 2689} {"train_loss": -12.149173736572266, "global_step": 451846, "epoch": 2689} {"train_loss": -12.44488525390625, "global_step": 451847, "epoch": 2689} {"train_loss": -12.223676681518555, "global_step": 451848, "epoch": 2689} {"train_loss": -12.199798583984375, "global_step": 451849, "epoch": 2689} {"train_loss": -12.385662078857422, "global_step": 451850, "epoch": 2689} {"train_loss": -12.178176879882812, "global_step": 451851, "epoch": 2689} {"train_loss": -11.570246696472168, "global_step": 451852, "epoch": 2689} {"train_loss": -12.225927352905273, "global_step": 451853, "epoch": 2689} {"train_loss": -12.346195220947266, "global_step": 451854, "epoch": 2689} {"train_loss": -11.604787826538086, "global_step": 451855, "epoch": 2689} {"train_loss": -12.298105239868164, "global_step": 451856, "epoch": 2689} {"train_loss": -11.787178039550781, "global_step": 451857, "epoch": 2689} {"train_loss": -11.2736177444458, "global_step": 451858, "epoch": 2689} {"train_loss": -11.562335968017578, "global_step": 451859, "epoch": 2689} {"train_loss": -11.849225997924805, "global_step": 451860, "epoch": 2689} {"train_loss": -10.341632843017578, "global_step": 451861, "epoch": 2689} {"train_loss": -11.867746353149414, "global_step": 451862, "epoch": 2689} {"train_loss": -10.466148376464844, "global_step": 451863, "epoch": 2689} {"train_loss": -10.315338134765625, "global_step": 451864, "epoch": 2689} {"train_loss": -11.164536476135254, "global_step": 451865, "epoch": 2689} {"train_loss": -9.391339302062988, "global_step": 451866, "epoch": 2689} {"train_loss": -11.09126091003418, "global_step": 451867, "epoch": 2689} {"train_loss": -11.237926483154297, "global_step": 451868, "epoch": 2689} {"train_loss": -11.16301155090332, "global_step": 451869, "epoch": 2689} {"train_loss": -10.769530296325684, "global_step": 451870, "epoch": 2689} {"train_loss": -10.341558456420898, "global_step": 451871, "epoch": 2689} {"train_loss": -11.390071868896484, "global_step": 451872, "epoch": 2689} {"train_loss": -11.274235725402832, "global_step": 451873, "epoch": 2689} {"train_loss": -10.169071197509766, "global_step": 451874, "epoch": 2689} {"train_loss": -9.166009902954102, "global_step": 451875, "epoch": 2689} {"train_loss": -11.023099899291992, "global_step": 451876, "epoch": 2689} {"train_loss": -9.950687408447266, "global_step": 451877, "epoch": 2689} {"train_loss": -6.620941162109375, "global_step": 451878, "epoch": 2689} {"train_loss": -10.520240783691406, "global_step": 451879, "epoch": 2689} {"train_loss": -9.816211700439453, "global_step": 451880, "epoch": 2689} {"train_loss": -10.258358001708984, "global_step": 451881, "epoch": 2689} {"train_loss": -7.343411445617676, "global_step": 451882, "epoch": 2689} {"train_loss": -8.942846298217773, "global_step": 451883, "epoch": 2689} {"train_loss": -10.181907653808594, "global_step": 451884, "epoch": 2689} {"train_loss": -10.500954627990723, "global_step": 451885, "epoch": 2689} {"train_loss": -9.65512466430664, "global_step": 451886, "epoch": 2689} {"train_loss": -10.328227996826172, "global_step": 451887, "epoch": 2689} {"train_loss": -11.252066612243652, "global_step": 451888, "epoch": 2689} {"train_loss": -10.235427856445312, "global_step": 451889, "epoch": 2689} {"train_loss": -10.484190940856934, "global_step": 451890, "epoch": 2689} {"train_loss": -10.905462265014648, "global_step": 451891, "epoch": 2689} {"train_loss": -11.005688667297363, "global_step": 451892, "epoch": 2689} {"train_loss": -10.634283065795898, "global_step": 451893, "epoch": 2689} {"train_loss": -11.176850318908691, "global_step": 451894, "epoch": 2689} {"train_loss": -11.066274642944336, "global_step": 451895, "epoch": 2689} {"train_loss": -11.575458526611328, "global_step": 451896, "epoch": 2689} {"train_loss": -11.11846923828125, "global_step": 451897, "epoch": 2689} {"train_loss": -11.718485832214355, "global_step": 451898, "epoch": 2689} {"train_loss": -11.977593421936035, "global_step": 451899, "epoch": 2689} {"train_loss": -11.474849700927734, "global_step": 451900, "epoch": 2689} {"train_loss": -11.48452377319336, "global_step": 451901, "epoch": 2689} {"train_loss": -11.68394947052002, "global_step": 451902, "epoch": 2689} {"train_loss": -11.818639755249023, "global_step": 451903, "epoch": 2689} {"train_loss": -11.55439567565918, "global_step": 451904, "epoch": 2689} {"train_loss": -12.228557586669922, "global_step": 451905, "epoch": 2689} {"train_loss": -11.554523468017578, "global_step": 451906, "epoch": 2689} {"train_loss": -12.007535934448242, "global_step": 451907, "epoch": 2689} {"train_loss": -11.924123764038086, "global_step": 451908, "epoch": 2689} {"train_loss": -11.90873908996582, "global_step": 451909, "epoch": 2689} {"train_loss": -12.186545372009277, "global_step": 451910, "epoch": 2689} {"train_loss": -12.05810260772705, "global_step": 451911, "epoch": 2689} {"train_loss": -11.984525680541992, "global_step": 451912, "epoch": 2689} {"train_loss": -12.43995475769043, "global_step": 451913, "epoch": 2689} {"train_loss": -12.292552947998047, "global_step": 451914, "epoch": 2689} {"train_loss": -12.193145751953125, "global_step": 451915, "epoch": 2689} {"train_loss": -12.265922546386719, "global_step": 451916, "epoch": 2689} {"train_loss": -12.348743438720703, "global_step": 451917, "epoch": 2689} {"train_loss": -12.158132553100586, "global_step": 451918, "epoch": 2689} {"train_loss": -11.910502297537667, "global_step": 451919, "epoch": 2689, "val_loss": 311559.0} {"train_loss": -12.181266784667969, "global_step": 451920, "epoch": 2690} {"train_loss": -12.44621467590332, "global_step": 451921, "epoch": 2690} {"train_loss": -12.083688735961914, "global_step": 451922, "epoch": 2690} {"train_loss": -12.290558815002441, "global_step": 451923, "epoch": 2690} {"train_loss": -12.2685546875, "global_step": 451924, "epoch": 2690} {"train_loss": -12.238399505615234, "global_step": 451925, "epoch": 2690} {"train_loss": -12.305408477783203, "global_step": 451926, "epoch": 2690} {"train_loss": -12.501592636108398, "global_step": 451927, "epoch": 2690} {"train_loss": -12.532251358032227, "global_step": 451928, "epoch": 2690} {"train_loss": -12.489636421203613, "global_step": 451929, "epoch": 2690} {"train_loss": -12.529830932617188, "global_step": 451930, "epoch": 2690} {"train_loss": -12.58108901977539, "global_step": 451931, "epoch": 2690} {"train_loss": -12.262075424194336, "global_step": 451932, "epoch": 2690} {"train_loss": -12.446154594421387, "global_step": 451933, "epoch": 2690} {"train_loss": -12.339376449584961, "global_step": 451934, "epoch": 2690} {"train_loss": -12.441875457763672, "global_step": 451935, "epoch": 2690} {"train_loss": -12.689118385314941, "global_step": 451936, "epoch": 2690} {"train_loss": -12.595121383666992, "global_step": 451937, "epoch": 2690} {"train_loss": -12.450140953063965, "global_step": 451938, "epoch": 2690} {"train_loss": -12.624545097351074, "global_step": 451939, "epoch": 2690} {"train_loss": -12.467973709106445, "global_step": 451940, "epoch": 2690} {"train_loss": -12.54446792602539, "global_step": 451941, "epoch": 2690} {"train_loss": -12.750242233276367, "global_step": 451942, "epoch": 2690} {"train_loss": -12.455951690673828, "global_step": 451943, "epoch": 2690} {"train_loss": -12.642220497131348, "global_step": 451944, "epoch": 2690} {"train_loss": -12.60154914855957, "global_step": 451945, "epoch": 2690} {"train_loss": -12.586861610412598, "global_step": 451946, "epoch": 2690} {"train_loss": -12.548981666564941, "global_step": 451947, "epoch": 2690} {"train_loss": -12.791107177734375, "global_step": 451948, "epoch": 2690} {"train_loss": -12.602437019348145, "global_step": 451949, "epoch": 2690} {"train_loss": -12.708314895629883, "global_step": 451950, "epoch": 2690} {"train_loss": -12.717991828918457, "global_step": 451951, "epoch": 2690} {"train_loss": -12.609394073486328, "global_step": 451952, "epoch": 2690} {"train_loss": -12.76732063293457, "global_step": 451953, "epoch": 2690} {"train_loss": -12.783012390136719, "global_step": 451954, "epoch": 2690} {"train_loss": -12.961017608642578, "global_step": 451955, "epoch": 2690} {"train_loss": -12.700029373168945, "global_step": 451956, "epoch": 2690} {"train_loss": -12.955143928527832, "global_step": 451957, "epoch": 2690} {"train_loss": -12.549080848693848, "global_step": 451958, "epoch": 2690} {"train_loss": -12.817092895507812, "global_step": 451959, "epoch": 2690} {"train_loss": -12.518251419067383, "global_step": 451960, "epoch": 2690} {"train_loss": -12.66231918334961, "global_step": 451961, "epoch": 2690} {"train_loss": -12.504079818725586, "global_step": 451962, "epoch": 2690} {"train_loss": -12.791899681091309, "global_step": 451963, "epoch": 2690} {"train_loss": -12.682517051696777, "global_step": 451964, "epoch": 2690} {"train_loss": -12.664199829101562, "global_step": 451965, "epoch": 2690} {"train_loss": -12.85270881652832, "global_step": 451966, "epoch": 2690} {"train_loss": -12.576016426086426, "global_step": 451967, "epoch": 2690} {"train_loss": -12.922378540039062, "global_step": 451968, "epoch": 2690} {"train_loss": -12.597932815551758, "global_step": 451969, "epoch": 2690} {"train_loss": -12.69308853149414, "global_step": 451970, "epoch": 2690} {"train_loss": -12.67623519897461, "global_step": 451971, "epoch": 2690} {"train_loss": -12.602176666259766, "global_step": 451972, "epoch": 2690} {"train_loss": -12.838920593261719, "global_step": 451973, "epoch": 2690} {"train_loss": -12.647781372070312, "global_step": 451974, "epoch": 2690} {"train_loss": -12.859247207641602, "global_step": 451975, "epoch": 2690} {"train_loss": -12.625816345214844, "global_step": 451976, "epoch": 2690} {"train_loss": -12.63625431060791, "global_step": 451977, "epoch": 2690} {"train_loss": -12.705178260803223, "global_step": 451978, "epoch": 2690} {"train_loss": -12.548301696777344, "global_step": 451979, "epoch": 2690} {"train_loss": -12.387210845947266, "global_step": 451980, "epoch": 2690} {"train_loss": -12.907154083251953, "global_step": 451981, "epoch": 2690} {"train_loss": -12.483871459960938, "global_step": 451982, "epoch": 2690} {"train_loss": -12.641834259033203, "global_step": 451983, "epoch": 2690} {"train_loss": -12.39511775970459, "global_step": 451984, "epoch": 2690} {"train_loss": -12.878488540649414, "global_step": 451985, "epoch": 2690} {"train_loss": -12.625682830810547, "global_step": 451986, "epoch": 2690} {"train_loss": -12.771805763244629, "global_step": 451987, "epoch": 2690} {"train_loss": -12.419025421142578, "global_step": 451988, "epoch": 2690} {"train_loss": -12.556646347045898, "global_step": 451989, "epoch": 2690} {"train_loss": -12.921820640563965, "global_step": 451990, "epoch": 2690} {"train_loss": -12.73055362701416, "global_step": 451991, "epoch": 2690} {"train_loss": -11.797691345214844, "global_step": 451992, "epoch": 2690} {"train_loss": -12.385584831237793, "global_step": 451993, "epoch": 2690} {"train_loss": -12.416243553161621, "global_step": 451994, "epoch": 2690} {"train_loss": -12.012794494628906, "global_step": 451995, "epoch": 2690} {"train_loss": -11.128351211547852, "global_step": 451996, "epoch": 2690} {"train_loss": -12.827157974243164, "global_step": 451997, "epoch": 2690} {"train_loss": -11.491182327270508, "global_step": 451998, "epoch": 2690} {"train_loss": -11.603100776672363, "global_step": 451999, "epoch": 2690} {"train_loss": -12.646361351013184, "global_step": 452000, "epoch": 2690} {"train_loss": -12.469132423400879, "global_step": 452001, "epoch": 2690} {"train_loss": -10.75406265258789, "global_step": 452002, "epoch": 2690} {"train_loss": -11.724358558654785, "global_step": 452003, "epoch": 2690} {"train_loss": -11.840267181396484, "global_step": 452004, "epoch": 2690} {"train_loss": -11.615957260131836, "global_step": 452005, "epoch": 2690} {"train_loss": -11.559794425964355, "global_step": 452006, "epoch": 2690} {"train_loss": -12.309247016906738, "global_step": 452007, "epoch": 2690} {"train_loss": -11.475619316101074, "global_step": 452008, "epoch": 2690} {"train_loss": -10.701786041259766, "global_step": 452009, "epoch": 2690} {"train_loss": -12.577583312988281, "global_step": 452010, "epoch": 2690} {"train_loss": -11.547628402709961, "global_step": 452011, "epoch": 2690} {"train_loss": -12.363201141357422, "global_step": 452012, "epoch": 2690} {"train_loss": -11.499452590942383, "global_step": 452013, "epoch": 2690} {"train_loss": -12.374393463134766, "global_step": 452014, "epoch": 2690} {"train_loss": -12.334218978881836, "global_step": 452015, "epoch": 2690} {"train_loss": -12.294938087463379, "global_step": 452016, "epoch": 2690} {"train_loss": -12.501382827758789, "global_step": 452017, "epoch": 2690} {"train_loss": -11.863164901733398, "global_step": 452018, "epoch": 2690} {"train_loss": -12.209123611450195, "global_step": 452019, "epoch": 2690} {"train_loss": -12.456257820129395, "global_step": 452020, "epoch": 2690} {"train_loss": -11.953083038330078, "global_step": 452021, "epoch": 2690} {"train_loss": -11.429045677185059, "global_step": 452022, "epoch": 2690} {"train_loss": -12.467550277709961, "global_step": 452023, "epoch": 2690} {"train_loss": -12.201659202575684, "global_step": 452024, "epoch": 2690} {"train_loss": -12.46065902709961, "global_step": 452025, "epoch": 2690} {"train_loss": -12.082399368286133, "global_step": 452026, "epoch": 2690} {"train_loss": -12.166524887084961, "global_step": 452027, "epoch": 2690} {"train_loss": -12.550212860107422, "global_step": 452028, "epoch": 2690} {"train_loss": -12.29544448852539, "global_step": 452029, "epoch": 2690} {"train_loss": -12.633454322814941, "global_step": 452030, "epoch": 2690} {"train_loss": -11.993318557739258, "global_step": 452031, "epoch": 2690} {"train_loss": -12.495285034179688, "global_step": 452032, "epoch": 2690} {"train_loss": -12.279096603393555, "global_step": 452033, "epoch": 2690} {"train_loss": -11.804819107055664, "global_step": 452034, "epoch": 2690} {"train_loss": -11.778753280639648, "global_step": 452035, "epoch": 2690} {"train_loss": -12.345739364624023, "global_step": 452036, "epoch": 2690} {"train_loss": -12.068127632141113, "global_step": 452037, "epoch": 2690} {"train_loss": -12.427268981933594, "global_step": 452038, "epoch": 2690} {"train_loss": -12.593122482299805, "global_step": 452039, "epoch": 2690} {"train_loss": -12.07900619506836, "global_step": 452040, "epoch": 2690} {"train_loss": -12.476948738098145, "global_step": 452041, "epoch": 2690} {"train_loss": -12.502630233764648, "global_step": 452042, "epoch": 2690} {"train_loss": -12.28303337097168, "global_step": 452043, "epoch": 2690} {"train_loss": -12.085838317871094, "global_step": 452044, "epoch": 2690} {"train_loss": -12.716327667236328, "global_step": 452045, "epoch": 2690} {"train_loss": -12.040313720703125, "global_step": 452046, "epoch": 2690} {"train_loss": -12.672239303588867, "global_step": 452047, "epoch": 2690} {"train_loss": -12.361714363098145, "global_step": 452048, "epoch": 2690} {"train_loss": -12.702957153320312, "global_step": 452049, "epoch": 2690} {"train_loss": -12.328146934509277, "global_step": 452050, "epoch": 2690} {"train_loss": -12.695409774780273, "global_step": 452051, "epoch": 2690} {"train_loss": -12.267110824584961, "global_step": 452052, "epoch": 2690} {"train_loss": -11.892547607421875, "global_step": 452053, "epoch": 2690} {"train_loss": -12.624813079833984, "global_step": 452054, "epoch": 2690} {"train_loss": -11.868707656860352, "global_step": 452055, "epoch": 2690} {"train_loss": -12.300056457519531, "global_step": 452056, "epoch": 2690} {"train_loss": -11.887097358703613, "global_step": 452057, "epoch": 2690} {"train_loss": -11.780527114868164, "global_step": 452058, "epoch": 2690} {"train_loss": -12.089950561523438, "global_step": 452059, "epoch": 2690} {"train_loss": -11.353355407714844, "global_step": 452060, "epoch": 2690} {"train_loss": -12.523324966430664, "global_step": 452061, "epoch": 2690} {"train_loss": -11.898744583129883, "global_step": 452062, "epoch": 2690} {"train_loss": -12.192100524902344, "global_step": 452063, "epoch": 2690} {"train_loss": -12.436010360717773, "global_step": 452064, "epoch": 2690} {"train_loss": -11.136249542236328, "global_step": 452065, "epoch": 2690} {"train_loss": -12.414432525634766, "global_step": 452066, "epoch": 2690} {"train_loss": -12.025150299072266, "global_step": 452067, "epoch": 2690} {"train_loss": -12.462119102478027, "global_step": 452068, "epoch": 2690} {"train_loss": -12.395296096801758, "global_step": 452069, "epoch": 2690} {"train_loss": -12.416278839111328, "global_step": 452070, "epoch": 2690} {"train_loss": -12.626386642456055, "global_step": 452071, "epoch": 2690} {"train_loss": -12.451753616333008, "global_step": 452072, "epoch": 2690} {"train_loss": -12.5404052734375, "global_step": 452073, "epoch": 2690} {"train_loss": -12.828557968139648, "global_step": 452074, "epoch": 2690} {"train_loss": -12.717264175415039, "global_step": 452075, "epoch": 2690} {"train_loss": -12.504648208618164, "global_step": 452076, "epoch": 2690} {"train_loss": -12.784475326538086, "global_step": 452077, "epoch": 2690} {"train_loss": -12.40957260131836, "global_step": 452078, "epoch": 2690} {"train_loss": -12.46217155456543, "global_step": 452079, "epoch": 2690} {"train_loss": -12.533075332641602, "global_step": 452080, "epoch": 2690} {"train_loss": -12.609443664550781, "global_step": 452081, "epoch": 2690} {"train_loss": -12.210411071777344, "global_step": 452082, "epoch": 2690} {"train_loss": -12.239936828613281, "global_step": 452083, "epoch": 2690} {"train_loss": -12.186134338378906, "global_step": 452084, "epoch": 2690} {"train_loss": -12.605971336364746, "global_step": 452085, "epoch": 2690} {"train_loss": -11.926871299743652, "global_step": 452086, "epoch": 2690} {"train_loss": -12.361762608800616, "global_step": 452087, "epoch": 2690, "val_loss": 314688.90625, "train_action_mse_error": 1.943185567855835} {"train_loss": -12.525496482849121, "global_step": 452088, "epoch": 2691} {"train_loss": -12.042742729187012, "global_step": 452089, "epoch": 2691} {"train_loss": -11.451323509216309, "global_step": 452090, "epoch": 2691} {"train_loss": -11.924005508422852, "global_step": 452091, "epoch": 2691} {"train_loss": -12.287505149841309, "global_step": 452092, "epoch": 2691} {"train_loss": -10.324592590332031, "global_step": 452093, "epoch": 2691} {"train_loss": -12.141769409179688, "global_step": 452094, "epoch": 2691} {"train_loss": -9.860197067260742, "global_step": 452095, "epoch": 2691} {"train_loss": -11.097349166870117, "global_step": 452096, "epoch": 2691} {"train_loss": -11.497580528259277, "global_step": 452097, "epoch": 2691} {"train_loss": -9.090651512145996, "global_step": 452098, "epoch": 2691} {"train_loss": -9.38602066040039, "global_step": 452099, "epoch": 2691} {"train_loss": -9.313289642333984, "global_step": 452100, "epoch": 2691} {"train_loss": -11.218925476074219, "global_step": 452101, "epoch": 2691} {"train_loss": -10.277776718139648, "global_step": 452102, "epoch": 2691} {"train_loss": -8.801843643188477, "global_step": 452103, "epoch": 2691} {"train_loss": -10.435464859008789, "global_step": 452104, "epoch": 2691} {"train_loss": -10.216972351074219, "global_step": 452105, "epoch": 2691} {"train_loss": -10.601993560791016, "global_step": 452106, "epoch": 2691} {"train_loss": -10.428998947143555, "global_step": 452107, "epoch": 2691} {"train_loss": -11.63191032409668, "global_step": 452108, "epoch": 2691} {"train_loss": -10.6619873046875, "global_step": 452109, "epoch": 2691} {"train_loss": -11.019855499267578, "global_step": 452110, "epoch": 2691} {"train_loss": -11.36701774597168, "global_step": 452111, "epoch": 2691} {"train_loss": -10.036219596862793, "global_step": 452112, "epoch": 2691} {"train_loss": -11.203710556030273, "global_step": 452113, "epoch": 2691} {"train_loss": -11.536019325256348, "global_step": 452114, "epoch": 2691} {"train_loss": -11.506939888000488, "global_step": 452115, "epoch": 2691} {"train_loss": -11.69709300994873, "global_step": 452116, "epoch": 2691} {"train_loss": -12.154631614685059, "global_step": 452117, "epoch": 2691} {"train_loss": -12.123855590820312, "global_step": 452118, "epoch": 2691} {"train_loss": -11.703275680541992, "global_step": 452119, "epoch": 2691} {"train_loss": -11.877492904663086, "global_step": 452120, "epoch": 2691} {"train_loss": -11.129498481750488, "global_step": 452121, "epoch": 2691} {"train_loss": -12.180635452270508, "global_step": 452122, "epoch": 2691} {"train_loss": -11.484832763671875, "global_step": 452123, "epoch": 2691} {"train_loss": -11.478196144104004, "global_step": 452124, "epoch": 2691} {"train_loss": -11.954835891723633, "global_step": 452125, "epoch": 2691} {"train_loss": -10.719581604003906, "global_step": 452126, "epoch": 2691} {"train_loss": -12.15261459350586, "global_step": 452127, "epoch": 2691} {"train_loss": -10.493507385253906, "global_step": 452128, "epoch": 2691} {"train_loss": -11.32539176940918, "global_step": 452129, "epoch": 2691} {"train_loss": -10.667217254638672, "global_step": 452130, "epoch": 2691} {"train_loss": -10.943674087524414, "global_step": 452131, "epoch": 2691} {"train_loss": -10.723894119262695, "global_step": 452132, "epoch": 2691} {"train_loss": -11.315317153930664, "global_step": 452133, "epoch": 2691} {"train_loss": -10.986831665039062, "global_step": 452134, "epoch": 2691} {"train_loss": -11.237741470336914, "global_step": 452135, "epoch": 2691} {"train_loss": -11.937532424926758, "global_step": 452136, "epoch": 2691} {"train_loss": -11.65240478515625, "global_step": 452137, "epoch": 2691} {"train_loss": -12.377481460571289, "global_step": 452138, "epoch": 2691} {"train_loss": -11.676021575927734, "global_step": 452139, "epoch": 2691} {"train_loss": -12.427804946899414, "global_step": 452140, "epoch": 2691} {"train_loss": -11.815771102905273, "global_step": 452141, "epoch": 2691} {"train_loss": -12.105627059936523, "global_step": 452142, "epoch": 2691} {"train_loss": -12.266130447387695, "global_step": 452143, "epoch": 2691} {"train_loss": -12.036317825317383, "global_step": 452144, "epoch": 2691} {"train_loss": -12.052597045898438, "global_step": 452145, "epoch": 2691} {"train_loss": -12.095252990722656, "global_step": 452146, "epoch": 2691} {"train_loss": -11.982427597045898, "global_step": 452147, "epoch": 2691} {"train_loss": -12.411101341247559, "global_step": 452148, "epoch": 2691} {"train_loss": -12.019149780273438, "global_step": 452149, "epoch": 2691} {"train_loss": -12.245532989501953, "global_step": 452150, "epoch": 2691} {"train_loss": -12.137235641479492, "global_step": 452151, "epoch": 2691} {"train_loss": -12.286101341247559, "global_step": 452152, "epoch": 2691} {"train_loss": -12.293720245361328, "global_step": 452153, "epoch": 2691} {"train_loss": -12.03135871887207, "global_step": 452154, "epoch": 2691} {"train_loss": -12.344558715820312, "global_step": 452155, "epoch": 2691} {"train_loss": -12.205732345581055, "global_step": 452156, "epoch": 2691} {"train_loss": -12.20309829711914, "global_step": 452157, "epoch": 2691} {"train_loss": -12.248984336853027, "global_step": 452158, "epoch": 2691} {"train_loss": -12.298295974731445, "global_step": 452159, "epoch": 2691} {"train_loss": -12.39881706237793, "global_step": 452160, "epoch": 2691} {"train_loss": -12.323955535888672, "global_step": 452161, "epoch": 2691} {"train_loss": -12.536746978759766, "global_step": 452162, "epoch": 2691} {"train_loss": -12.2796630859375, "global_step": 452163, "epoch": 2691} {"train_loss": -12.411094665527344, "global_step": 452164, "epoch": 2691} {"train_loss": -12.226672172546387, "global_step": 452165, "epoch": 2691} {"train_loss": -12.533864974975586, "global_step": 452166, "epoch": 2691} {"train_loss": -12.452037811279297, "global_step": 452167, "epoch": 2691} {"train_loss": -12.512462615966797, "global_step": 452168, "epoch": 2691} {"train_loss": -12.444872856140137, "global_step": 452169, "epoch": 2691} {"train_loss": -12.704330444335938, "global_step": 452170, "epoch": 2691} {"train_loss": -12.480243682861328, "global_step": 452171, "epoch": 2691} {"train_loss": -12.465799331665039, "global_step": 452172, "epoch": 2691} {"train_loss": -12.646100997924805, "global_step": 452173, "epoch": 2691} {"train_loss": -12.437373161315918, "global_step": 452174, "epoch": 2691} {"train_loss": -12.655693054199219, "global_step": 452175, "epoch": 2691} {"train_loss": -12.489428520202637, "global_step": 452176, "epoch": 2691} {"train_loss": -12.85792350769043, "global_step": 452177, "epoch": 2691} {"train_loss": -12.675363540649414, "global_step": 452178, "epoch": 2691} {"train_loss": -12.566786766052246, "global_step": 452179, "epoch": 2691} {"train_loss": -12.529184341430664, "global_step": 452180, "epoch": 2691} {"train_loss": -12.407421112060547, "global_step": 452181, "epoch": 2691} {"train_loss": -12.61112117767334, "global_step": 452182, "epoch": 2691} {"train_loss": -12.719160079956055, "global_step": 452183, "epoch": 2691} {"train_loss": -12.671060562133789, "global_step": 452184, "epoch": 2691} {"train_loss": -12.556836128234863, "global_step": 452185, "epoch": 2691} {"train_loss": -12.634354591369629, "global_step": 452186, "epoch": 2691} {"train_loss": -12.710089683532715, "global_step": 452187, "epoch": 2691} {"train_loss": -12.750893592834473, "global_step": 452188, "epoch": 2691} {"train_loss": -12.855744361877441, "global_step": 452189, "epoch": 2691} {"train_loss": -12.76015853881836, "global_step": 452190, "epoch": 2691} {"train_loss": -12.769538879394531, "global_step": 452191, "epoch": 2691} {"train_loss": -12.620931625366211, "global_step": 452192, "epoch": 2691} {"train_loss": -12.625960350036621, "global_step": 452193, "epoch": 2691} {"train_loss": -12.363344192504883, "global_step": 452194, "epoch": 2691} {"train_loss": -12.553430557250977, "global_step": 452195, "epoch": 2691} {"train_loss": -12.33317756652832, "global_step": 452196, "epoch": 2691} {"train_loss": -12.94487190246582, "global_step": 452197, "epoch": 2691} {"train_loss": -12.477767944335938, "global_step": 452198, "epoch": 2691} {"train_loss": -12.760908126831055, "global_step": 452199, "epoch": 2691} {"train_loss": -12.66993522644043, "global_step": 452200, "epoch": 2691} {"train_loss": -12.549317359924316, "global_step": 452201, "epoch": 2691} {"train_loss": -12.629921913146973, "global_step": 452202, "epoch": 2691} {"train_loss": -12.380792617797852, "global_step": 452203, "epoch": 2691} {"train_loss": -12.46019172668457, "global_step": 452204, "epoch": 2691} {"train_loss": -12.566666603088379, "global_step": 452205, "epoch": 2691} {"train_loss": -12.438484191894531, "global_step": 452206, "epoch": 2691} {"train_loss": -12.54270076751709, "global_step": 452207, "epoch": 2691} {"train_loss": -12.549020767211914, "global_step": 452208, "epoch": 2691} {"train_loss": -12.688538551330566, "global_step": 452209, "epoch": 2691} {"train_loss": -12.343897819519043, "global_step": 452210, "epoch": 2691} {"train_loss": -12.842292785644531, "global_step": 452211, "epoch": 2691} {"train_loss": -12.43313217163086, "global_step": 452212, "epoch": 2691} {"train_loss": -12.765209197998047, "global_step": 452213, "epoch": 2691} {"train_loss": -12.457754135131836, "global_step": 452214, "epoch": 2691} {"train_loss": -12.870355606079102, "global_step": 452215, "epoch": 2691} {"train_loss": -12.424083709716797, "global_step": 452216, "epoch": 2691} {"train_loss": -12.867332458496094, "global_step": 452217, "epoch": 2691} {"train_loss": -12.563626289367676, "global_step": 452218, "epoch": 2691} {"train_loss": -12.725786209106445, "global_step": 452219, "epoch": 2691} {"train_loss": -12.389957427978516, "global_step": 452220, "epoch": 2691} {"train_loss": -12.735357284545898, "global_step": 452221, "epoch": 2691} {"train_loss": -12.68276596069336, "global_step": 452222, "epoch": 2691} {"train_loss": -12.24807357788086, "global_step": 452223, "epoch": 2691} {"train_loss": -12.353973388671875, "global_step": 452224, "epoch": 2691} {"train_loss": -12.445100784301758, "global_step": 452225, "epoch": 2691} {"train_loss": -12.146650314331055, "global_step": 452226, "epoch": 2691} {"train_loss": -12.465744018554688, "global_step": 452227, "epoch": 2691} {"train_loss": -12.33651351928711, "global_step": 452228, "epoch": 2691} {"train_loss": -12.046502113342285, "global_step": 452229, "epoch": 2691} {"train_loss": -12.355417251586914, "global_step": 452230, "epoch": 2691} {"train_loss": -12.198795318603516, "global_step": 452231, "epoch": 2691} {"train_loss": -11.841486930847168, "global_step": 452232, "epoch": 2691} {"train_loss": -11.212728500366211, "global_step": 452233, "epoch": 2691} {"train_loss": -11.405534744262695, "global_step": 452234, "epoch": 2691} {"train_loss": -11.091686248779297, "global_step": 452235, "epoch": 2691} {"train_loss": -10.219690322875977, "global_step": 452236, "epoch": 2691} {"train_loss": -12.047529220581055, "global_step": 452237, "epoch": 2691} {"train_loss": -11.04294490814209, "global_step": 452238, "epoch": 2691} {"train_loss": -11.989048957824707, "global_step": 452239, "epoch": 2691} {"train_loss": -11.586431503295898, "global_step": 452240, "epoch": 2691} {"train_loss": -11.901362419128418, "global_step": 452241, "epoch": 2691} {"train_loss": -11.795024871826172, "global_step": 452242, "epoch": 2691} {"train_loss": -11.918577194213867, "global_step": 452243, "epoch": 2691} {"train_loss": -12.229211807250977, "global_step": 452244, "epoch": 2691} {"train_loss": -12.242975234985352, "global_step": 452245, "epoch": 2691} {"train_loss": -12.288651466369629, "global_step": 452246, "epoch": 2691} {"train_loss": -11.815018653869629, "global_step": 452247, "epoch": 2691} {"train_loss": -12.543802261352539, "global_step": 452248, "epoch": 2691} {"train_loss": -11.946669578552246, "global_step": 452249, "epoch": 2691} {"train_loss": -12.031621932983398, "global_step": 452250, "epoch": 2691} {"train_loss": -12.237064361572266, "global_step": 452251, "epoch": 2691} {"train_loss": -12.294591903686523, "global_step": 452252, "epoch": 2691} {"train_loss": -11.398881912231445, "global_step": 452253, "epoch": 2691} {"train_loss": -12.21430778503418, "global_step": 452254, "epoch": 2691} {"train_loss": -11.960377142542885, "global_step": 452255, "epoch": 2691, "val_loss": 313818.0625} {"train_loss": -11.761100769042969, "global_step": 452256, "epoch": 2692} {"train_loss": -12.6153564453125, "global_step": 452257, "epoch": 2692} {"train_loss": -11.656229019165039, "global_step": 452258, "epoch": 2692} {"train_loss": -11.723539352416992, "global_step": 452259, "epoch": 2692} {"train_loss": -12.119043350219727, "global_step": 452260, "epoch": 2692} {"train_loss": -11.444927215576172, "global_step": 452261, "epoch": 2692} {"train_loss": -12.301384925842285, "global_step": 452262, "epoch": 2692} {"train_loss": -11.393933296203613, "global_step": 452263, "epoch": 2692} {"train_loss": -11.74195671081543, "global_step": 452264, "epoch": 2692} {"train_loss": -11.597469329833984, "global_step": 452265, "epoch": 2692} {"train_loss": -11.149453163146973, "global_step": 452266, "epoch": 2692} {"train_loss": -11.036233901977539, "global_step": 452267, "epoch": 2692} {"train_loss": -11.67984390258789, "global_step": 452268, "epoch": 2692} {"train_loss": -11.387157440185547, "global_step": 452269, "epoch": 2692} {"train_loss": -10.944316864013672, "global_step": 452270, "epoch": 2692} {"train_loss": -11.62033462524414, "global_step": 452271, "epoch": 2692} {"train_loss": -11.799110412597656, "global_step": 452272, "epoch": 2692} {"train_loss": -10.916120529174805, "global_step": 452273, "epoch": 2692} {"train_loss": -12.04992961883545, "global_step": 452274, "epoch": 2692} {"train_loss": -11.440414428710938, "global_step": 452275, "epoch": 2692} {"train_loss": -11.489190101623535, "global_step": 452276, "epoch": 2692} {"train_loss": -12.016100883483887, "global_step": 452277, "epoch": 2692} {"train_loss": -11.854646682739258, "global_step": 452278, "epoch": 2692} {"train_loss": -12.431163787841797, "global_step": 452279, "epoch": 2692} {"train_loss": -11.586965560913086, "global_step": 452280, "epoch": 2692} {"train_loss": -12.207576751708984, "global_step": 452281, "epoch": 2692} {"train_loss": -11.861928939819336, "global_step": 452282, "epoch": 2692} {"train_loss": -12.109902381896973, "global_step": 452283, "epoch": 2692} {"train_loss": -11.909597396850586, "global_step": 452284, "epoch": 2692} {"train_loss": -12.010629653930664, "global_step": 452285, "epoch": 2692} {"train_loss": -12.241182327270508, "global_step": 452286, "epoch": 2692} {"train_loss": -11.672680854797363, "global_step": 452287, "epoch": 2692} {"train_loss": -12.28787612915039, "global_step": 452288, "epoch": 2692} {"train_loss": -12.489762306213379, "global_step": 452289, "epoch": 2692} {"train_loss": -11.732377052307129, "global_step": 452290, "epoch": 2692} {"train_loss": -12.421541213989258, "global_step": 452291, "epoch": 2692} {"train_loss": -11.97622299194336, "global_step": 452292, "epoch": 2692} {"train_loss": -12.468884468078613, "global_step": 452293, "epoch": 2692} {"train_loss": -12.291910171508789, "global_step": 452294, "epoch": 2692} {"train_loss": -12.368770599365234, "global_step": 452295, "epoch": 2692} {"train_loss": -12.054885864257812, "global_step": 452296, "epoch": 2692} {"train_loss": -12.127114295959473, "global_step": 452297, "epoch": 2692} {"train_loss": -12.396035194396973, "global_step": 452298, "epoch": 2692} {"train_loss": -12.205772399902344, "global_step": 452299, "epoch": 2692} {"train_loss": -12.226236343383789, "global_step": 452300, "epoch": 2692} {"train_loss": -12.023681640625, "global_step": 452301, "epoch": 2692} {"train_loss": -12.427481651306152, "global_step": 452302, "epoch": 2692} {"train_loss": -12.361854553222656, "global_step": 452303, "epoch": 2692} {"train_loss": -12.108888626098633, "global_step": 452304, "epoch": 2692} {"train_loss": -12.418500900268555, "global_step": 452305, "epoch": 2692} {"train_loss": -12.183267593383789, "global_step": 452306, "epoch": 2692} {"train_loss": -12.118864059448242, "global_step": 452307, "epoch": 2692} {"train_loss": -12.614727973937988, "global_step": 452308, "epoch": 2692} {"train_loss": -12.386295318603516, "global_step": 452309, "epoch": 2692} {"train_loss": -12.535472869873047, "global_step": 452310, "epoch": 2692} {"train_loss": -12.12479019165039, "global_step": 452311, "epoch": 2692} {"train_loss": -12.496943473815918, "global_step": 452312, "epoch": 2692} {"train_loss": -12.09907341003418, "global_step": 452313, "epoch": 2692} {"train_loss": -12.567767143249512, "global_step": 452314, "epoch": 2692} {"train_loss": -12.218002319335938, "global_step": 452315, "epoch": 2692} {"train_loss": -12.458856582641602, "global_step": 452316, "epoch": 2692} {"train_loss": -12.642308235168457, "global_step": 452317, "epoch": 2692} {"train_loss": -11.94472885131836, "global_step": 452318, "epoch": 2692} {"train_loss": -12.432926177978516, "global_step": 452319, "epoch": 2692} {"train_loss": -12.149539947509766, "global_step": 452320, "epoch": 2692} {"train_loss": -11.961545944213867, "global_step": 452321, "epoch": 2692} {"train_loss": -12.246749877929688, "global_step": 452322, "epoch": 2692} {"train_loss": -12.46339225769043, "global_step": 452323, "epoch": 2692} {"train_loss": -12.553016662597656, "global_step": 452324, "epoch": 2692} {"train_loss": -12.168802261352539, "global_step": 452325, "epoch": 2692} {"train_loss": -12.641962051391602, "global_step": 452326, "epoch": 2692} {"train_loss": -11.594467163085938, "global_step": 452327, "epoch": 2692} {"train_loss": -12.432121276855469, "global_step": 452328, "epoch": 2692} {"train_loss": -12.111955642700195, "global_step": 452329, "epoch": 2692} {"train_loss": -12.265989303588867, "global_step": 452330, "epoch": 2692} {"train_loss": -12.471349716186523, "global_step": 452331, "epoch": 2692} {"train_loss": -12.407598495483398, "global_step": 452332, "epoch": 2692} {"train_loss": -12.078983306884766, "global_step": 452333, "epoch": 2692} {"train_loss": -12.180736541748047, "global_step": 452334, "epoch": 2692} {"train_loss": -12.137514114379883, "global_step": 452335, "epoch": 2692} {"train_loss": -12.529029846191406, "global_step": 452336, "epoch": 2692} {"train_loss": -11.98343276977539, "global_step": 452337, "epoch": 2692} {"train_loss": -12.492216110229492, "global_step": 452338, "epoch": 2692} {"train_loss": -12.443070411682129, "global_step": 452339, "epoch": 2692} {"train_loss": -12.132492065429688, "global_step": 452340, "epoch": 2692} {"train_loss": -11.910250663757324, "global_step": 452341, "epoch": 2692} {"train_loss": -12.696887969970703, "global_step": 452342, "epoch": 2692} {"train_loss": -12.367136001586914, "global_step": 452343, "epoch": 2692} {"train_loss": -12.61463737487793, "global_step": 452344, "epoch": 2692} {"train_loss": -12.43830394744873, "global_step": 452345, "epoch": 2692} {"train_loss": -12.918941497802734, "global_step": 452346, "epoch": 2692} {"train_loss": -12.290567398071289, "global_step": 452347, "epoch": 2692} {"train_loss": -12.672204971313477, "global_step": 452348, "epoch": 2692} {"train_loss": -12.523017883300781, "global_step": 452349, "epoch": 2692} {"train_loss": -12.527104377746582, "global_step": 452350, "epoch": 2692} {"train_loss": -11.708377838134766, "global_step": 452351, "epoch": 2692} {"train_loss": -12.581707000732422, "global_step": 452352, "epoch": 2692} {"train_loss": -12.120030403137207, "global_step": 452353, "epoch": 2692} {"train_loss": -12.307052612304688, "global_step": 452354, "epoch": 2692} {"train_loss": -11.896492958068848, "global_step": 452355, "epoch": 2692} {"train_loss": -12.182929992675781, "global_step": 452356, "epoch": 2692} {"train_loss": -11.799055099487305, "global_step": 452357, "epoch": 2692} {"train_loss": -12.319611549377441, "global_step": 452358, "epoch": 2692} {"train_loss": -12.699840545654297, "global_step": 452359, "epoch": 2692} {"train_loss": -12.502412796020508, "global_step": 452360, "epoch": 2692} {"train_loss": -12.269073486328125, "global_step": 452361, "epoch": 2692} {"train_loss": -12.541937828063965, "global_step": 452362, "epoch": 2692} {"train_loss": -12.400979995727539, "global_step": 452363, "epoch": 2692} {"train_loss": -12.714007377624512, "global_step": 452364, "epoch": 2692} {"train_loss": -12.814913749694824, "global_step": 452365, "epoch": 2692} {"train_loss": -12.647916793823242, "global_step": 452366, "epoch": 2692} {"train_loss": -12.32679557800293, "global_step": 452367, "epoch": 2692} {"train_loss": -12.855754852294922, "global_step": 452368, "epoch": 2692} {"train_loss": -12.360095977783203, "global_step": 452369, "epoch": 2692} {"train_loss": -12.866795539855957, "global_step": 452370, "epoch": 2692} {"train_loss": -12.387513160705566, "global_step": 452371, "epoch": 2692} {"train_loss": -12.531147003173828, "global_step": 452372, "epoch": 2692} {"train_loss": -12.761165618896484, "global_step": 452373, "epoch": 2692} {"train_loss": -12.454219818115234, "global_step": 452374, "epoch": 2692} {"train_loss": -12.008550643920898, "global_step": 452375, "epoch": 2692} {"train_loss": -12.608041763305664, "global_step": 452376, "epoch": 2692} {"train_loss": -12.47016716003418, "global_step": 452377, "epoch": 2692} {"train_loss": -12.358407974243164, "global_step": 452378, "epoch": 2692} {"train_loss": -12.567951202392578, "global_step": 452379, "epoch": 2692} {"train_loss": -12.802302360534668, "global_step": 452380, "epoch": 2692} {"train_loss": -12.901490211486816, "global_step": 452381, "epoch": 2692} {"train_loss": -12.746349334716797, "global_step": 452382, "epoch": 2692} {"train_loss": -12.74466323852539, "global_step": 452383, "epoch": 2692} {"train_loss": -12.834213256835938, "global_step": 452384, "epoch": 2692} {"train_loss": -12.707696914672852, "global_step": 452385, "epoch": 2692} {"train_loss": -12.881916046142578, "global_step": 452386, "epoch": 2692} {"train_loss": -12.844470024108887, "global_step": 452387, "epoch": 2692} {"train_loss": -12.641386032104492, "global_step": 452388, "epoch": 2692} {"train_loss": -12.805537223815918, "global_step": 452389, "epoch": 2692} {"train_loss": -12.727002143859863, "global_step": 452390, "epoch": 2692} {"train_loss": -12.677912712097168, "global_step": 452391, "epoch": 2692} {"train_loss": -12.900325775146484, "global_step": 452392, "epoch": 2692} {"train_loss": -12.930419921875, "global_step": 452393, "epoch": 2692} {"train_loss": -12.825883865356445, "global_step": 452394, "epoch": 2692} {"train_loss": -12.773031234741211, "global_step": 452395, "epoch": 2692} {"train_loss": -12.442795753479004, "global_step": 452396, "epoch": 2692} {"train_loss": -12.860380172729492, "global_step": 452397, "epoch": 2692} {"train_loss": -12.819555282592773, "global_step": 452398, "epoch": 2692} {"train_loss": -12.851592063903809, "global_step": 452399, "epoch": 2692} {"train_loss": -12.515581130981445, "global_step": 452400, "epoch": 2692} {"train_loss": -12.56503963470459, "global_step": 452401, "epoch": 2692} {"train_loss": -12.624061584472656, "global_step": 452402, "epoch": 2692} {"train_loss": -12.777115821838379, "global_step": 452403, "epoch": 2692} {"train_loss": -12.52375316619873, "global_step": 452404, "epoch": 2692} {"train_loss": -12.85158920288086, "global_step": 452405, "epoch": 2692} {"train_loss": -12.805168151855469, "global_step": 452406, "epoch": 2692} {"train_loss": -12.66627311706543, "global_step": 452407, "epoch": 2692} {"train_loss": -12.428128242492676, "global_step": 452408, "epoch": 2692} {"train_loss": -12.595035552978516, "global_step": 452409, "epoch": 2692} {"train_loss": -12.081846237182617, "global_step": 452410, "epoch": 2692} {"train_loss": -11.573620796203613, "global_step": 452411, "epoch": 2692} {"train_loss": -11.552549362182617, "global_step": 452412, "epoch": 2692} {"train_loss": -12.404065132141113, "global_step": 452413, "epoch": 2692} {"train_loss": -12.608616828918457, "global_step": 452414, "epoch": 2692} {"train_loss": -11.120293617248535, "global_step": 452415, "epoch": 2692} {"train_loss": -11.667961120605469, "global_step": 452416, "epoch": 2692} {"train_loss": -11.951837539672852, "global_step": 452417, "epoch": 2692} {"train_loss": -11.469863891601562, "global_step": 452418, "epoch": 2692} {"train_loss": -11.703563690185547, "global_step": 452419, "epoch": 2692} {"train_loss": -12.265915870666504, "global_step": 452420, "epoch": 2692} {"train_loss": -12.282849311828613, "global_step": 452421, "epoch": 2692} {"train_loss": -12.14406967163086, "global_step": 452422, "epoch": 2692} {"train_loss": -12.26611834480649, "global_step": 452423, "epoch": 2692, "val_loss": 317053.65625} {"train_loss": -12.2095308303833, "global_step": 452424, "epoch": 2693} {"train_loss": -12.452617645263672, "global_step": 452425, "epoch": 2693} {"train_loss": -12.017062187194824, "global_step": 452426, "epoch": 2693} {"train_loss": -12.178998947143555, "global_step": 452427, "epoch": 2693} {"train_loss": -11.650352478027344, "global_step": 452428, "epoch": 2693} {"train_loss": -12.52481746673584, "global_step": 452429, "epoch": 2693} {"train_loss": -11.977418899536133, "global_step": 452430, "epoch": 2693} {"train_loss": -12.131488800048828, "global_step": 452431, "epoch": 2693} {"train_loss": -11.411080360412598, "global_step": 452432, "epoch": 2693} {"train_loss": -11.379617691040039, "global_step": 452433, "epoch": 2693} {"train_loss": -11.63923454284668, "global_step": 452434, "epoch": 2693} {"train_loss": -12.414803504943848, "global_step": 452435, "epoch": 2693} {"train_loss": -11.341133117675781, "global_step": 452436, "epoch": 2693} {"train_loss": -11.873132705688477, "global_step": 452437, "epoch": 2693} {"train_loss": -11.960655212402344, "global_step": 452438, "epoch": 2693} {"train_loss": -11.778278350830078, "global_step": 452439, "epoch": 2693} {"train_loss": -11.62451171875, "global_step": 452440, "epoch": 2693} {"train_loss": -11.825468063354492, "global_step": 452441, "epoch": 2693} {"train_loss": -11.944061279296875, "global_step": 452442, "epoch": 2693} {"train_loss": -11.72607421875, "global_step": 452443, "epoch": 2693} {"train_loss": -11.664291381835938, "global_step": 452444, "epoch": 2693} {"train_loss": -11.495315551757812, "global_step": 452445, "epoch": 2693} {"train_loss": -11.77203369140625, "global_step": 452446, "epoch": 2693} {"train_loss": -12.160147666931152, "global_step": 452447, "epoch": 2693} {"train_loss": -12.016709327697754, "global_step": 452448, "epoch": 2693} {"train_loss": -11.924762725830078, "global_step": 452449, "epoch": 2693} {"train_loss": -12.191366195678711, "global_step": 452450, "epoch": 2693} {"train_loss": -11.765630722045898, "global_step": 452451, "epoch": 2693} {"train_loss": -12.362689018249512, "global_step": 452452, "epoch": 2693} {"train_loss": -11.787471771240234, "global_step": 452453, "epoch": 2693} {"train_loss": -11.551935195922852, "global_step": 452454, "epoch": 2693} {"train_loss": -11.707813262939453, "global_step": 452455, "epoch": 2693} {"train_loss": -10.16464900970459, "global_step": 452456, "epoch": 2693} {"train_loss": -11.86660385131836, "global_step": 452457, "epoch": 2693} {"train_loss": -10.72157096862793, "global_step": 452458, "epoch": 2693} {"train_loss": -11.358510971069336, "global_step": 452459, "epoch": 2693} {"train_loss": -12.195486068725586, "global_step": 452460, "epoch": 2693} {"train_loss": -11.702005386352539, "global_step": 452461, "epoch": 2693} {"train_loss": -11.913922309875488, "global_step": 452462, "epoch": 2693} {"train_loss": -11.147329330444336, "global_step": 452463, "epoch": 2693} {"train_loss": -11.996590614318848, "global_step": 452464, "epoch": 2693} {"train_loss": -11.107431411743164, "global_step": 452465, "epoch": 2693} {"train_loss": -11.733776092529297, "global_step": 452466, "epoch": 2693} {"train_loss": -11.82780647277832, "global_step": 452467, "epoch": 2693} {"train_loss": -11.240510940551758, "global_step": 452468, "epoch": 2693} {"train_loss": -11.888407707214355, "global_step": 452469, "epoch": 2693} {"train_loss": -11.44163703918457, "global_step": 452470, "epoch": 2693} {"train_loss": -10.996003150939941, "global_step": 452471, "epoch": 2693} {"train_loss": -9.916707992553711, "global_step": 452472, "epoch": 2693} {"train_loss": -11.45565128326416, "global_step": 452473, "epoch": 2693} {"train_loss": -9.348596572875977, "global_step": 452474, "epoch": 2693} {"train_loss": -11.279899597167969, "global_step": 452475, "epoch": 2693} {"train_loss": -10.516684532165527, "global_step": 452476, "epoch": 2693} {"train_loss": -10.90035629272461, "global_step": 452477, "epoch": 2693} {"train_loss": -11.094040870666504, "global_step": 452478, "epoch": 2693} {"train_loss": -10.789607048034668, "global_step": 452479, "epoch": 2693} {"train_loss": -9.804384231567383, "global_step": 452480, "epoch": 2693} {"train_loss": -11.81557846069336, "global_step": 452481, "epoch": 2693} {"train_loss": -10.364208221435547, "global_step": 452482, "epoch": 2693} {"train_loss": -10.790719985961914, "global_step": 452483, "epoch": 2693} {"train_loss": -10.998506546020508, "global_step": 452484, "epoch": 2693} {"train_loss": -10.292057037353516, "global_step": 452485, "epoch": 2693} {"train_loss": -11.20808219909668, "global_step": 452486, "epoch": 2693} {"train_loss": -11.324939727783203, "global_step": 452487, "epoch": 2693} {"train_loss": -10.972869873046875, "global_step": 452488, "epoch": 2693} {"train_loss": -12.132997512817383, "global_step": 452489, "epoch": 2693} {"train_loss": -10.642532348632812, "global_step": 452490, "epoch": 2693} {"train_loss": -11.174901962280273, "global_step": 452491, "epoch": 2693} {"train_loss": -11.422536849975586, "global_step": 452492, "epoch": 2693} {"train_loss": -11.64350700378418, "global_step": 452493, "epoch": 2693} {"train_loss": -11.907340049743652, "global_step": 452494, "epoch": 2693} {"train_loss": -11.839570045471191, "global_step": 452495, "epoch": 2693} {"train_loss": -11.191816329956055, "global_step": 452496, "epoch": 2693} {"train_loss": -11.105616569519043, "global_step": 452497, "epoch": 2693} {"train_loss": -11.524469375610352, "global_step": 452498, "epoch": 2693} {"train_loss": -11.289738655090332, "global_step": 452499, "epoch": 2693} {"train_loss": -11.44836711883545, "global_step": 452500, "epoch": 2693} {"train_loss": -11.018745422363281, "global_step": 452501, "epoch": 2693} {"train_loss": -11.63559341430664, "global_step": 452502, "epoch": 2693} {"train_loss": -11.419002532958984, "global_step": 452503, "epoch": 2693} {"train_loss": -11.880804061889648, "global_step": 452504, "epoch": 2693} {"train_loss": -11.291868209838867, "global_step": 452505, "epoch": 2693} {"train_loss": -12.099231719970703, "global_step": 452506, "epoch": 2693} {"train_loss": -11.430124282836914, "global_step": 452507, "epoch": 2693} {"train_loss": -12.120651245117188, "global_step": 452508, "epoch": 2693} {"train_loss": -11.578460693359375, "global_step": 452509, "epoch": 2693} {"train_loss": -11.917106628417969, "global_step": 452510, "epoch": 2693} {"train_loss": -12.280376434326172, "global_step": 452511, "epoch": 2693} {"train_loss": -11.726318359375, "global_step": 452512, "epoch": 2693} {"train_loss": -12.232149124145508, "global_step": 452513, "epoch": 2693} {"train_loss": -11.733203887939453, "global_step": 452514, "epoch": 2693} {"train_loss": -11.739481925964355, "global_step": 452515, "epoch": 2693} {"train_loss": -11.730989456176758, "global_step": 452516, "epoch": 2693} {"train_loss": -11.624637603759766, "global_step": 452517, "epoch": 2693} {"train_loss": -11.934795379638672, "global_step": 452518, "epoch": 2693} {"train_loss": -11.503711700439453, "global_step": 452519, "epoch": 2693} {"train_loss": -11.08853530883789, "global_step": 452520, "epoch": 2693} {"train_loss": -11.361665725708008, "global_step": 452521, "epoch": 2693} {"train_loss": -11.72574520111084, "global_step": 452522, "epoch": 2693} {"train_loss": -11.629911422729492, "global_step": 452523, "epoch": 2693} {"train_loss": -11.385590553283691, "global_step": 452524, "epoch": 2693} {"train_loss": -12.501382827758789, "global_step": 452525, "epoch": 2693} {"train_loss": -12.026888847351074, "global_step": 452526, "epoch": 2693} {"train_loss": -12.091423034667969, "global_step": 452527, "epoch": 2693} {"train_loss": -12.017378807067871, "global_step": 452528, "epoch": 2693} {"train_loss": -12.073417663574219, "global_step": 452529, "epoch": 2693} {"train_loss": -12.093379974365234, "global_step": 452530, "epoch": 2693} {"train_loss": -12.388401985168457, "global_step": 452531, "epoch": 2693} {"train_loss": -12.142194747924805, "global_step": 452532, "epoch": 2693} {"train_loss": -12.072616577148438, "global_step": 452533, "epoch": 2693} {"train_loss": -12.073164939880371, "global_step": 452534, "epoch": 2693} {"train_loss": -12.136091232299805, "global_step": 452535, "epoch": 2693} {"train_loss": -12.275131225585938, "global_step": 452536, "epoch": 2693} {"train_loss": -11.936805725097656, "global_step": 452537, "epoch": 2693} {"train_loss": -11.852680206298828, "global_step": 452538, "epoch": 2693} {"train_loss": -12.352109909057617, "global_step": 452539, "epoch": 2693} {"train_loss": -12.03010368347168, "global_step": 452540, "epoch": 2693} {"train_loss": -12.36779499053955, "global_step": 452541, "epoch": 2693} {"train_loss": -11.951133728027344, "global_step": 452542, "epoch": 2693} {"train_loss": -11.899223327636719, "global_step": 452543, "epoch": 2693} {"train_loss": -11.35659408569336, "global_step": 452544, "epoch": 2693} {"train_loss": -11.946598052978516, "global_step": 452545, "epoch": 2693} {"train_loss": -11.492185592651367, "global_step": 452546, "epoch": 2693} {"train_loss": -12.253702163696289, "global_step": 452547, "epoch": 2693} {"train_loss": -11.59293270111084, "global_step": 452548, "epoch": 2693} {"train_loss": -11.888932228088379, "global_step": 452549, "epoch": 2693} {"train_loss": -11.946651458740234, "global_step": 452550, "epoch": 2693} {"train_loss": -12.21692180633545, "global_step": 452551, "epoch": 2693} {"train_loss": -12.101740837097168, "global_step": 452552, "epoch": 2693} {"train_loss": -12.308106422424316, "global_step": 452553, "epoch": 2693} {"train_loss": -12.44757080078125, "global_step": 452554, "epoch": 2693} {"train_loss": -12.197748184204102, "global_step": 452555, "epoch": 2693} {"train_loss": -12.375141143798828, "global_step": 452556, "epoch": 2693} {"train_loss": -12.263402938842773, "global_step": 452557, "epoch": 2693} {"train_loss": -11.989908218383789, "global_step": 452558, "epoch": 2693} {"train_loss": -12.500777244567871, "global_step": 452559, "epoch": 2693} {"train_loss": -11.822538375854492, "global_step": 452560, "epoch": 2693} {"train_loss": -12.486543655395508, "global_step": 452561, "epoch": 2693} {"train_loss": -11.907530784606934, "global_step": 452562, "epoch": 2693} {"train_loss": -12.207932472229004, "global_step": 452563, "epoch": 2693} {"train_loss": -12.35007381439209, "global_step": 452564, "epoch": 2693} {"train_loss": -12.123418807983398, "global_step": 452565, "epoch": 2693} {"train_loss": -12.48868179321289, "global_step": 452566, "epoch": 2693} {"train_loss": -12.116518020629883, "global_step": 452567, "epoch": 2693} {"train_loss": -12.538491249084473, "global_step": 452568, "epoch": 2693} {"train_loss": -12.233148574829102, "global_step": 452569, "epoch": 2693} {"train_loss": -12.554062843322754, "global_step": 452570, "epoch": 2693} {"train_loss": -12.276254653930664, "global_step": 452571, "epoch": 2693} {"train_loss": -11.955741882324219, "global_step": 452572, "epoch": 2693} {"train_loss": -11.977855682373047, "global_step": 452573, "epoch": 2693} {"train_loss": -12.290572166442871, "global_step": 452574, "epoch": 2693} {"train_loss": -11.621208190917969, "global_step": 452575, "epoch": 2693} {"train_loss": -12.664129257202148, "global_step": 452576, "epoch": 2693} {"train_loss": -11.837800979614258, "global_step": 452577, "epoch": 2693} {"train_loss": -12.127002716064453, "global_step": 452578, "epoch": 2693} {"train_loss": -12.306583404541016, "global_step": 452579, "epoch": 2693} {"train_loss": -12.196398735046387, "global_step": 452580, "epoch": 2693} {"train_loss": -12.34615421295166, "global_step": 452581, "epoch": 2693} {"train_loss": -12.396059036254883, "global_step": 452582, "epoch": 2693} {"train_loss": -11.708927154541016, "global_step": 452583, "epoch": 2693} {"train_loss": -12.526561737060547, "global_step": 452584, "epoch": 2693} {"train_loss": -11.890288352966309, "global_step": 452585, "epoch": 2693} {"train_loss": -12.58448600769043, "global_step": 452586, "epoch": 2693} {"train_loss": -12.119182586669922, "global_step": 452587, "epoch": 2693} {"train_loss": -12.535394668579102, "global_step": 452588, "epoch": 2693} {"train_loss": -12.026996612548828, "global_step": 452589, "epoch": 2693} {"train_loss": -12.430392265319824, "global_step": 452590, "epoch": 2693} {"train_loss": -11.771170337994894, "global_step": 452591, "epoch": 2693, "val_loss": 315991.28125} {"train_loss": -12.561586380004883, "global_step": 452592, "epoch": 2694} {"train_loss": -11.946568489074707, "global_step": 452593, "epoch": 2694} {"train_loss": -12.314240455627441, "global_step": 452594, "epoch": 2694} {"train_loss": -11.934616088867188, "global_step": 452595, "epoch": 2694} {"train_loss": -12.206469535827637, "global_step": 452596, "epoch": 2694} {"train_loss": -12.231095314025879, "global_step": 452597, "epoch": 2694} {"train_loss": -11.961872100830078, "global_step": 452598, "epoch": 2694} {"train_loss": -11.846148490905762, "global_step": 452599, "epoch": 2694} {"train_loss": -11.846091270446777, "global_step": 452600, "epoch": 2694} {"train_loss": -11.725031852722168, "global_step": 452601, "epoch": 2694} {"train_loss": -12.028780937194824, "global_step": 452602, "epoch": 2694} {"train_loss": -12.022756576538086, "global_step": 452603, "epoch": 2694} {"train_loss": -12.053752899169922, "global_step": 452604, "epoch": 2694} {"train_loss": -12.263582229614258, "global_step": 452605, "epoch": 2694} {"train_loss": -12.13482666015625, "global_step": 452606, "epoch": 2694} {"train_loss": -12.284252166748047, "global_step": 452607, "epoch": 2694} {"train_loss": -11.819734573364258, "global_step": 452608, "epoch": 2694} {"train_loss": -12.042162895202637, "global_step": 452609, "epoch": 2694} {"train_loss": -12.294060707092285, "global_step": 452610, "epoch": 2694} {"train_loss": -11.618667602539062, "global_step": 452611, "epoch": 2694} {"train_loss": -12.363363265991211, "global_step": 452612, "epoch": 2694} {"train_loss": -12.04006576538086, "global_step": 452613, "epoch": 2694} {"train_loss": -12.282025337219238, "global_step": 452614, "epoch": 2694} {"train_loss": -12.169473648071289, "global_step": 452615, "epoch": 2694} {"train_loss": -11.985946655273438, "global_step": 452616, "epoch": 2694} {"train_loss": -12.339790344238281, "global_step": 452617, "epoch": 2694} {"train_loss": -11.898283004760742, "global_step": 452618, "epoch": 2694} {"train_loss": -12.588760375976562, "global_step": 452619, "epoch": 2694} {"train_loss": -12.531147003173828, "global_step": 452620, "epoch": 2694} {"train_loss": -12.212247848510742, "global_step": 452621, "epoch": 2694} {"train_loss": -12.216277122497559, "global_step": 452622, "epoch": 2694} {"train_loss": -12.405570983886719, "global_step": 452623, "epoch": 2694} {"train_loss": -12.467458724975586, "global_step": 452624, "epoch": 2694} {"train_loss": -12.669024467468262, "global_step": 452625, "epoch": 2694} {"train_loss": -12.070783615112305, "global_step": 452626, "epoch": 2694} {"train_loss": -11.991965293884277, "global_step": 452627, "epoch": 2694} {"train_loss": -12.609889030456543, "global_step": 452628, "epoch": 2694} {"train_loss": -12.312774658203125, "global_step": 452629, "epoch": 2694} {"train_loss": -12.586390495300293, "global_step": 452630, "epoch": 2694} {"train_loss": -12.135971069335938, "global_step": 452631, "epoch": 2694} {"train_loss": -12.38753890991211, "global_step": 452632, "epoch": 2694} {"train_loss": -12.258674621582031, "global_step": 452633, "epoch": 2694} {"train_loss": -12.374313354492188, "global_step": 452634, "epoch": 2694} {"train_loss": -12.566900253295898, "global_step": 452635, "epoch": 2694} {"train_loss": -12.309698104858398, "global_step": 452636, "epoch": 2694} {"train_loss": -12.225770950317383, "global_step": 452637, "epoch": 2694} {"train_loss": -12.384623527526855, "global_step": 452638, "epoch": 2694} {"train_loss": -12.21908950805664, "global_step": 452639, "epoch": 2694} {"train_loss": -12.673343658447266, "global_step": 452640, "epoch": 2694} {"train_loss": -12.367449760437012, "global_step": 452641, "epoch": 2694} {"train_loss": -12.593914031982422, "global_step": 452642, "epoch": 2694} {"train_loss": -12.546195983886719, "global_step": 452643, "epoch": 2694} {"train_loss": -12.688364028930664, "global_step": 452644, "epoch": 2694} {"train_loss": -12.583624839782715, "global_step": 452645, "epoch": 2694} {"train_loss": -12.662907600402832, "global_step": 452646, "epoch": 2694} {"train_loss": -12.604379653930664, "global_step": 452647, "epoch": 2694} {"train_loss": -12.57313346862793, "global_step": 452648, "epoch": 2694} {"train_loss": -12.612344741821289, "global_step": 452649, "epoch": 2694} {"train_loss": -12.45682144165039, "global_step": 452650, "epoch": 2694} {"train_loss": -12.702970504760742, "global_step": 452651, "epoch": 2694} {"train_loss": -12.78879165649414, "global_step": 452652, "epoch": 2694} {"train_loss": -12.703596115112305, "global_step": 452653, "epoch": 2694} {"train_loss": -12.63128662109375, "global_step": 452654, "epoch": 2694} {"train_loss": -12.755928039550781, "global_step": 452655, "epoch": 2694} {"train_loss": -12.855552673339844, "global_step": 452656, "epoch": 2694} {"train_loss": -12.870330810546875, "global_step": 452657, "epoch": 2694} {"train_loss": -12.633724212646484, "global_step": 452658, "epoch": 2694} {"train_loss": -12.672477722167969, "global_step": 452659, "epoch": 2694} {"train_loss": -12.832742691040039, "global_step": 452660, "epoch": 2694} {"train_loss": -12.492544174194336, "global_step": 452661, "epoch": 2694} {"train_loss": -12.603494644165039, "global_step": 452662, "epoch": 2694} {"train_loss": -12.919021606445312, "global_step": 452663, "epoch": 2694} {"train_loss": -12.63072395324707, "global_step": 452664, "epoch": 2694} {"train_loss": -12.72049331665039, "global_step": 452665, "epoch": 2694} {"train_loss": -12.970731735229492, "global_step": 452666, "epoch": 2694} {"train_loss": -12.447566986083984, "global_step": 452667, "epoch": 2694} {"train_loss": -12.88089370727539, "global_step": 452668, "epoch": 2694} {"train_loss": -12.783281326293945, "global_step": 452669, "epoch": 2694} {"train_loss": -12.574701309204102, "global_step": 452670, "epoch": 2694} {"train_loss": -12.83021354675293, "global_step": 452671, "epoch": 2694} {"train_loss": -12.540885925292969, "global_step": 452672, "epoch": 2694} {"train_loss": -12.5352144241333, "global_step": 452673, "epoch": 2694} {"train_loss": -12.671971321105957, "global_step": 452674, "epoch": 2694} {"train_loss": -12.688982963562012, "global_step": 452675, "epoch": 2694} {"train_loss": -12.8214111328125, "global_step": 452676, "epoch": 2694} {"train_loss": -12.951550483703613, "global_step": 452677, "epoch": 2694} {"train_loss": -12.857534408569336, "global_step": 452678, "epoch": 2694} {"train_loss": -12.936978340148926, "global_step": 452679, "epoch": 2694} {"train_loss": -12.798274040222168, "global_step": 452680, "epoch": 2694} {"train_loss": -12.914592742919922, "global_step": 452681, "epoch": 2694} {"train_loss": -13.035709381103516, "global_step": 452682, "epoch": 2694} {"train_loss": -12.98462963104248, "global_step": 452683, "epoch": 2694} {"train_loss": -12.72184944152832, "global_step": 452684, "epoch": 2694} {"train_loss": -12.983444213867188, "global_step": 452685, "epoch": 2694} {"train_loss": -12.744794845581055, "global_step": 452686, "epoch": 2694} {"train_loss": -13.093517303466797, "global_step": 452687, "epoch": 2694} {"train_loss": -12.831872940063477, "global_step": 452688, "epoch": 2694} {"train_loss": -12.700462341308594, "global_step": 452689, "epoch": 2694} {"train_loss": -12.860074043273926, "global_step": 452690, "epoch": 2694} {"train_loss": -12.606059074401855, "global_step": 452691, "epoch": 2694} {"train_loss": -12.470447540283203, "global_step": 452692, "epoch": 2694} {"train_loss": -12.575927734375, "global_step": 452693, "epoch": 2694} {"train_loss": -12.387969970703125, "global_step": 452694, "epoch": 2694} {"train_loss": -12.455497741699219, "global_step": 452695, "epoch": 2694} {"train_loss": -12.223894119262695, "global_step": 452696, "epoch": 2694} {"train_loss": -12.774534225463867, "global_step": 452697, "epoch": 2694} {"train_loss": -11.742413520812988, "global_step": 452698, "epoch": 2694} {"train_loss": -12.284101486206055, "global_step": 452699, "epoch": 2694} {"train_loss": -12.465415000915527, "global_step": 452700, "epoch": 2694} {"train_loss": -12.655536651611328, "global_step": 452701, "epoch": 2694} {"train_loss": -11.77541732788086, "global_step": 452702, "epoch": 2694} {"train_loss": -12.45674991607666, "global_step": 452703, "epoch": 2694} {"train_loss": -12.628353118896484, "global_step": 452704, "epoch": 2694} {"train_loss": -11.764877319335938, "global_step": 452705, "epoch": 2694} {"train_loss": -11.465715408325195, "global_step": 452706, "epoch": 2694} {"train_loss": -12.571821212768555, "global_step": 452707, "epoch": 2694} {"train_loss": -11.723989486694336, "global_step": 452708, "epoch": 2694} {"train_loss": -11.65206527709961, "global_step": 452709, "epoch": 2694} {"train_loss": -12.339967727661133, "global_step": 452710, "epoch": 2694} {"train_loss": -11.38990592956543, "global_step": 452711, "epoch": 2694} {"train_loss": -12.16073989868164, "global_step": 452712, "epoch": 2694} {"train_loss": -12.088356018066406, "global_step": 452713, "epoch": 2694} {"train_loss": -12.467638969421387, "global_step": 452714, "epoch": 2694} {"train_loss": -11.51823616027832, "global_step": 452715, "epoch": 2694} {"train_loss": -12.667914390563965, "global_step": 452716, "epoch": 2694} {"train_loss": -11.627972602844238, "global_step": 452717, "epoch": 2694} {"train_loss": -12.098587036132812, "global_step": 452718, "epoch": 2694} {"train_loss": -11.710477828979492, "global_step": 452719, "epoch": 2694} {"train_loss": -12.387351989746094, "global_step": 452720, "epoch": 2694} {"train_loss": -12.273706436157227, "global_step": 452721, "epoch": 2694} {"train_loss": -11.959487915039062, "global_step": 452722, "epoch": 2694} {"train_loss": -12.400917053222656, "global_step": 452723, "epoch": 2694} {"train_loss": -11.554450035095215, "global_step": 452724, "epoch": 2694} {"train_loss": -12.525588989257812, "global_step": 452725, "epoch": 2694} {"train_loss": -12.043161392211914, "global_step": 452726, "epoch": 2694} {"train_loss": -12.403278350830078, "global_step": 452727, "epoch": 2694} {"train_loss": -10.929866790771484, "global_step": 452728, "epoch": 2694} {"train_loss": -12.301091194152832, "global_step": 452729, "epoch": 2694} {"train_loss": -10.889853477478027, "global_step": 452730, "epoch": 2694} {"train_loss": -12.222429275512695, "global_step": 452731, "epoch": 2694} {"train_loss": -11.631088256835938, "global_step": 452732, "epoch": 2694} {"train_loss": -11.335554122924805, "global_step": 452733, "epoch": 2694} {"train_loss": -12.039260864257812, "global_step": 452734, "epoch": 2694} {"train_loss": -11.391948699951172, "global_step": 452735, "epoch": 2694} {"train_loss": -11.656909942626953, "global_step": 452736, "epoch": 2694} {"train_loss": -11.02216911315918, "global_step": 452737, "epoch": 2694} {"train_loss": -11.809436798095703, "global_step": 452738, "epoch": 2694} {"train_loss": -11.819181442260742, "global_step": 452739, "epoch": 2694} {"train_loss": -11.218695640563965, "global_step": 452740, "epoch": 2694} {"train_loss": -11.62507152557373, "global_step": 452741, "epoch": 2694} {"train_loss": -11.321080207824707, "global_step": 452742, "epoch": 2694} {"train_loss": -11.132582664489746, "global_step": 452743, "epoch": 2694} {"train_loss": -11.100736618041992, "global_step": 452744, "epoch": 2694} {"train_loss": -11.409524917602539, "global_step": 452745, "epoch": 2694} {"train_loss": -10.465709686279297, "global_step": 452746, "epoch": 2694} {"train_loss": -9.734882354736328, "global_step": 452747, "epoch": 2694} {"train_loss": -11.171171188354492, "global_step": 452748, "epoch": 2694} {"train_loss": -11.075719833374023, "global_step": 452749, "epoch": 2694} {"train_loss": -10.994061470031738, "global_step": 452750, "epoch": 2694} {"train_loss": -11.582182884216309, "global_step": 452751, "epoch": 2694} {"train_loss": -11.8265380859375, "global_step": 452752, "epoch": 2694} {"train_loss": -11.657713890075684, "global_step": 452753, "epoch": 2694} {"train_loss": -12.040630340576172, "global_step": 452754, "epoch": 2694} {"train_loss": -11.69478988647461, "global_step": 452755, "epoch": 2694} {"train_loss": -11.602821350097656, "global_step": 452756, "epoch": 2694} {"train_loss": -11.688302993774414, "global_step": 452757, "epoch": 2694} {"train_loss": -12.0576171875, "global_step": 452758, "epoch": 2694} {"train_loss": -12.20684077626183, "global_step": 452759, "epoch": 2694, "val_loss": 312806.46875} {"train_loss": -12.216283798217773, "global_step": 452760, "epoch": 2695} {"train_loss": -11.392361640930176, "global_step": 452761, "epoch": 2695} {"train_loss": -11.92146110534668, "global_step": 452762, "epoch": 2695} {"train_loss": -11.397146224975586, "global_step": 452763, "epoch": 2695} {"train_loss": -11.437456130981445, "global_step": 452764, "epoch": 2695} {"train_loss": -12.135438919067383, "global_step": 452765, "epoch": 2695} {"train_loss": -11.474313735961914, "global_step": 452766, "epoch": 2695} {"train_loss": -11.663631439208984, "global_step": 452767, "epoch": 2695} {"train_loss": -11.784058570861816, "global_step": 452768, "epoch": 2695} {"train_loss": -11.568525314331055, "global_step": 452769, "epoch": 2695} {"train_loss": -11.934041976928711, "global_step": 452770, "epoch": 2695} {"train_loss": -11.853559494018555, "global_step": 452771, "epoch": 2695} {"train_loss": -11.98771858215332, "global_step": 452772, "epoch": 2695} {"train_loss": -12.12669563293457, "global_step": 452773, "epoch": 2695} {"train_loss": -12.023418426513672, "global_step": 452774, "epoch": 2695} {"train_loss": -12.06356430053711, "global_step": 452775, "epoch": 2695} {"train_loss": -12.526754379272461, "global_step": 452776, "epoch": 2695} {"train_loss": -11.942770004272461, "global_step": 452777, "epoch": 2695} {"train_loss": -12.2017822265625, "global_step": 452778, "epoch": 2695} {"train_loss": -12.292816162109375, "global_step": 452779, "epoch": 2695} {"train_loss": -12.320552825927734, "global_step": 452780, "epoch": 2695} {"train_loss": -12.20532512664795, "global_step": 452781, "epoch": 2695} {"train_loss": -12.49787712097168, "global_step": 452782, "epoch": 2695} {"train_loss": -12.459344863891602, "global_step": 452783, "epoch": 2695} {"train_loss": -12.491731643676758, "global_step": 452784, "epoch": 2695} {"train_loss": -12.415992736816406, "global_step": 452785, "epoch": 2695} {"train_loss": -12.088103294372559, "global_step": 452786, "epoch": 2695} {"train_loss": -12.578436851501465, "global_step": 452787, "epoch": 2695} {"train_loss": -12.369356155395508, "global_step": 452788, "epoch": 2695} {"train_loss": -12.387763977050781, "global_step": 452789, "epoch": 2695} {"train_loss": -12.297412872314453, "global_step": 452790, "epoch": 2695} {"train_loss": -12.388006210327148, "global_step": 452791, "epoch": 2695} {"train_loss": -12.321481704711914, "global_step": 452792, "epoch": 2695} {"train_loss": -12.445381164550781, "global_step": 452793, "epoch": 2695} {"train_loss": -12.368305206298828, "global_step": 452794, "epoch": 2695} {"train_loss": -12.700166702270508, "global_step": 452795, "epoch": 2695} {"train_loss": -12.224687576293945, "global_step": 452796, "epoch": 2695} {"train_loss": -12.580109596252441, "global_step": 452797, "epoch": 2695} {"train_loss": -12.391860961914062, "global_step": 452798, "epoch": 2695} {"train_loss": -12.58813762664795, "global_step": 452799, "epoch": 2695} {"train_loss": -12.277543067932129, "global_step": 452800, "epoch": 2695} {"train_loss": -12.453834533691406, "global_step": 452801, "epoch": 2695} {"train_loss": -12.409429550170898, "global_step": 452802, "epoch": 2695} {"train_loss": -12.076265335083008, "global_step": 452803, "epoch": 2695} {"train_loss": -12.534923553466797, "global_step": 452804, "epoch": 2695} {"train_loss": -11.391843795776367, "global_step": 452805, "epoch": 2695} {"train_loss": -12.414615631103516, "global_step": 452806, "epoch": 2695} {"train_loss": -12.120087623596191, "global_step": 452807, "epoch": 2695} {"train_loss": -12.200305938720703, "global_step": 452808, "epoch": 2695} {"train_loss": -12.252617835998535, "global_step": 452809, "epoch": 2695} {"train_loss": -11.938142776489258, "global_step": 452810, "epoch": 2695} {"train_loss": -11.260570526123047, "global_step": 452811, "epoch": 2695} {"train_loss": -11.429817199707031, "global_step": 452812, "epoch": 2695} {"train_loss": -12.028432846069336, "global_step": 452813, "epoch": 2695} {"train_loss": -10.92185115814209, "global_step": 452814, "epoch": 2695} {"train_loss": -11.34156608581543, "global_step": 452815, "epoch": 2695} {"train_loss": -11.33511734008789, "global_step": 452816, "epoch": 2695} {"train_loss": -11.944358825683594, "global_step": 452817, "epoch": 2695} {"train_loss": -11.180378913879395, "global_step": 452818, "epoch": 2695} {"train_loss": -11.768942832946777, "global_step": 452819, "epoch": 2695} {"train_loss": -10.893911361694336, "global_step": 452820, "epoch": 2695} {"train_loss": -10.866265296936035, "global_step": 452821, "epoch": 2695} {"train_loss": -10.906201362609863, "global_step": 452822, "epoch": 2695} {"train_loss": -10.680793762207031, "global_step": 452823, "epoch": 2695} {"train_loss": -10.385613441467285, "global_step": 452824, "epoch": 2695} {"train_loss": -10.785848617553711, "global_step": 452825, "epoch": 2695} {"train_loss": -10.78860092163086, "global_step": 452826, "epoch": 2695} {"train_loss": -11.731112480163574, "global_step": 452827, "epoch": 2695} {"train_loss": -10.495626449584961, "global_step": 452828, "epoch": 2695} {"train_loss": -11.690797805786133, "global_step": 452829, "epoch": 2695} {"train_loss": -11.18038558959961, "global_step": 452830, "epoch": 2695} {"train_loss": -11.164389610290527, "global_step": 452831, "epoch": 2695} {"train_loss": -11.727029800415039, "global_step": 452832, "epoch": 2695} {"train_loss": -10.977399826049805, "global_step": 452833, "epoch": 2695} {"train_loss": -10.869757652282715, "global_step": 452834, "epoch": 2695} {"train_loss": -11.46044921875, "global_step": 452835, "epoch": 2695} {"train_loss": -11.80876636505127, "global_step": 452836, "epoch": 2695} {"train_loss": -12.285039901733398, "global_step": 452837, "epoch": 2695} {"train_loss": -11.28612232208252, "global_step": 452838, "epoch": 2695} {"train_loss": -12.264053344726562, "global_step": 452839, "epoch": 2695} {"train_loss": -11.270989418029785, "global_step": 452840, "epoch": 2695} {"train_loss": -11.799373626708984, "global_step": 452841, "epoch": 2695} {"train_loss": -11.542421340942383, "global_step": 452842, "epoch": 2695} {"train_loss": -12.258675575256348, "global_step": 452843, "epoch": 2695} {"train_loss": -11.72457218170166, "global_step": 452844, "epoch": 2695} {"train_loss": -12.313966751098633, "global_step": 452845, "epoch": 2695} {"train_loss": -11.683055877685547, "global_step": 452846, "epoch": 2695} {"train_loss": -12.306538581848145, "global_step": 452847, "epoch": 2695} {"train_loss": -12.229511260986328, "global_step": 452848, "epoch": 2695} {"train_loss": -12.41059684753418, "global_step": 452849, "epoch": 2695} {"train_loss": -12.159469604492188, "global_step": 452850, "epoch": 2695} {"train_loss": -12.137105941772461, "global_step": 452851, "epoch": 2695} {"train_loss": -12.34693717956543, "global_step": 452852, "epoch": 2695} {"train_loss": -12.225790023803711, "global_step": 452853, "epoch": 2695} {"train_loss": -12.465108871459961, "global_step": 452854, "epoch": 2695} {"train_loss": -12.659689903259277, "global_step": 452855, "epoch": 2695} {"train_loss": -12.50398063659668, "global_step": 452856, "epoch": 2695} {"train_loss": -12.416024208068848, "global_step": 452857, "epoch": 2695} {"train_loss": -12.296379089355469, "global_step": 452858, "epoch": 2695} {"train_loss": -12.302835464477539, "global_step": 452859, "epoch": 2695} {"train_loss": -12.276862144470215, "global_step": 452860, "epoch": 2695} {"train_loss": -12.535913467407227, "global_step": 452861, "epoch": 2695} {"train_loss": -12.433034896850586, "global_step": 452862, "epoch": 2695} {"train_loss": -12.440458297729492, "global_step": 452863, "epoch": 2695} {"train_loss": -12.464296340942383, "global_step": 452864, "epoch": 2695} {"train_loss": -12.294488906860352, "global_step": 452865, "epoch": 2695} {"train_loss": -12.35323429107666, "global_step": 452866, "epoch": 2695} {"train_loss": -12.505590438842773, "global_step": 452867, "epoch": 2695} {"train_loss": -12.59827995300293, "global_step": 452868, "epoch": 2695} {"train_loss": -12.650447845458984, "global_step": 452869, "epoch": 2695} {"train_loss": -12.529861450195312, "global_step": 452870, "epoch": 2695} {"train_loss": -12.673784255981445, "global_step": 452871, "epoch": 2695} {"train_loss": -12.746748924255371, "global_step": 452872, "epoch": 2695} {"train_loss": -12.534551620483398, "global_step": 452873, "epoch": 2695} {"train_loss": -12.456393241882324, "global_step": 452874, "epoch": 2695} {"train_loss": -12.770517349243164, "global_step": 452875, "epoch": 2695} {"train_loss": -12.688240051269531, "global_step": 452876, "epoch": 2695} {"train_loss": -12.751638412475586, "global_step": 452877, "epoch": 2695} {"train_loss": -12.617521286010742, "global_step": 452878, "epoch": 2695} {"train_loss": -12.682271003723145, "global_step": 452879, "epoch": 2695} {"train_loss": -12.347089767456055, "global_step": 452880, "epoch": 2695} {"train_loss": -12.545985221862793, "global_step": 452881, "epoch": 2695} {"train_loss": -12.778280258178711, "global_step": 452882, "epoch": 2695} {"train_loss": -12.429102897644043, "global_step": 452883, "epoch": 2695} {"train_loss": -12.898844718933105, "global_step": 452884, "epoch": 2695} {"train_loss": -12.581460952758789, "global_step": 452885, "epoch": 2695} {"train_loss": -12.637415885925293, "global_step": 452886, "epoch": 2695} {"train_loss": -12.50848388671875, "global_step": 452887, "epoch": 2695} {"train_loss": -12.466876029968262, "global_step": 452888, "epoch": 2695} {"train_loss": -12.485273361206055, "global_step": 452889, "epoch": 2695} {"train_loss": -12.721272468566895, "global_step": 452890, "epoch": 2695} {"train_loss": -12.498689651489258, "global_step": 452891, "epoch": 2695} {"train_loss": -12.538026809692383, "global_step": 452892, "epoch": 2695} {"train_loss": -12.809503555297852, "global_step": 452893, "epoch": 2695} {"train_loss": -12.978923797607422, "global_step": 452894, "epoch": 2695} {"train_loss": -12.91619873046875, "global_step": 452895, "epoch": 2695} {"train_loss": -12.634846687316895, "global_step": 452896, "epoch": 2695} {"train_loss": -12.697263717651367, "global_step": 452897, "epoch": 2695} {"train_loss": -12.876720428466797, "global_step": 452898, "epoch": 2695} {"train_loss": -12.624446868896484, "global_step": 452899, "epoch": 2695} {"train_loss": -12.894830703735352, "global_step": 452900, "epoch": 2695} {"train_loss": -12.654387474060059, "global_step": 452901, "epoch": 2695} {"train_loss": -12.644359588623047, "global_step": 452902, "epoch": 2695} {"train_loss": -12.611513137817383, "global_step": 452903, "epoch": 2695} {"train_loss": -12.798116683959961, "global_step": 452904, "epoch": 2695} {"train_loss": -12.687620162963867, "global_step": 452905, "epoch": 2695} {"train_loss": -12.837907791137695, "global_step": 452906, "epoch": 2695} {"train_loss": -12.575263977050781, "global_step": 452907, "epoch": 2695} {"train_loss": -12.755106925964355, "global_step": 452908, "epoch": 2695} {"train_loss": -12.630534172058105, "global_step": 452909, "epoch": 2695} {"train_loss": -12.672703742980957, "global_step": 452910, "epoch": 2695} {"train_loss": -12.973628997802734, "global_step": 452911, "epoch": 2695} {"train_loss": -12.784284591674805, "global_step": 452912, "epoch": 2695} {"train_loss": -12.886322021484375, "global_step": 452913, "epoch": 2695} {"train_loss": -12.8173828125, "global_step": 452914, "epoch": 2695} {"train_loss": -12.747568130493164, "global_step": 452915, "epoch": 2695} {"train_loss": -12.304033279418945, "global_step": 452916, "epoch": 2695} {"train_loss": -12.281106948852539, "global_step": 452917, "epoch": 2695} {"train_loss": -12.945793151855469, "global_step": 452918, "epoch": 2695} {"train_loss": -12.068628311157227, "global_step": 452919, "epoch": 2695} {"train_loss": -11.441925048828125, "global_step": 452920, "epoch": 2695} {"train_loss": -12.242400169372559, "global_step": 452921, "epoch": 2695} {"train_loss": -12.111492156982422, "global_step": 452922, "epoch": 2695} {"train_loss": -12.578664779663086, "global_step": 452923, "epoch": 2695} {"train_loss": -12.481016159057617, "global_step": 452924, "epoch": 2695} {"train_loss": -12.481013298034668, "global_step": 452925, "epoch": 2695} {"train_loss": -11.9188232421875, "global_step": 452926, "epoch": 2695} {"train_loss": -12.179600488571893, "global_step": 452927, "epoch": 2695, "val_loss": 313101.71875, "train_action_mse_error": 1.8852711915969849} {"train_loss": -12.108437538146973, "global_step": 452928, "epoch": 2696} {"train_loss": -12.722664833068848, "global_step": 452929, "epoch": 2696} {"train_loss": -12.202816009521484, "global_step": 452930, "epoch": 2696} {"train_loss": -12.58144760131836, "global_step": 452931, "epoch": 2696} {"train_loss": -11.99206829071045, "global_step": 452932, "epoch": 2696} {"train_loss": -12.296120643615723, "global_step": 452933, "epoch": 2696} {"train_loss": -12.10366153717041, "global_step": 452934, "epoch": 2696} {"train_loss": -12.414948463439941, "global_step": 452935, "epoch": 2696} {"train_loss": -12.319669723510742, "global_step": 452936, "epoch": 2696} {"train_loss": -12.765183448791504, "global_step": 452937, "epoch": 2696} {"train_loss": -12.523641586303711, "global_step": 452938, "epoch": 2696} {"train_loss": -12.506366729736328, "global_step": 452939, "epoch": 2696} {"train_loss": -12.218360900878906, "global_step": 452940, "epoch": 2696} {"train_loss": -12.50620174407959, "global_step": 452941, "epoch": 2696} {"train_loss": -12.392295837402344, "global_step": 452942, "epoch": 2696} {"train_loss": -12.313278198242188, "global_step": 452943, "epoch": 2696} {"train_loss": -12.207015991210938, "global_step": 452944, "epoch": 2696} {"train_loss": -12.572030067443848, "global_step": 452945, "epoch": 2696} {"train_loss": -12.312395095825195, "global_step": 452946, "epoch": 2696} {"train_loss": -12.374557495117188, "global_step": 452947, "epoch": 2696} {"train_loss": -12.484106063842773, "global_step": 452948, "epoch": 2696} {"train_loss": -12.426496505737305, "global_step": 452949, "epoch": 2696} {"train_loss": -12.369646072387695, "global_step": 452950, "epoch": 2696} {"train_loss": -12.155961036682129, "global_step": 452951, "epoch": 2696} {"train_loss": -11.953153610229492, "global_step": 452952, "epoch": 2696} {"train_loss": -11.546931266784668, "global_step": 452953, "epoch": 2696} {"train_loss": -11.862850189208984, "global_step": 452954, "epoch": 2696} {"train_loss": -11.978499412536621, "global_step": 452955, "epoch": 2696} {"train_loss": -12.419422149658203, "global_step": 452956, "epoch": 2696} {"train_loss": -12.412351608276367, "global_step": 452957, "epoch": 2696} {"train_loss": -11.928258895874023, "global_step": 452958, "epoch": 2696} {"train_loss": -12.478368759155273, "global_step": 452959, "epoch": 2696} {"train_loss": -11.956844329833984, "global_step": 452960, "epoch": 2696} {"train_loss": -12.462213516235352, "global_step": 452961, "epoch": 2696} {"train_loss": -11.795292854309082, "global_step": 452962, "epoch": 2696} {"train_loss": -12.27629280090332, "global_step": 452963, "epoch": 2696} {"train_loss": -11.74050235748291, "global_step": 452964, "epoch": 2696} {"train_loss": -12.295902252197266, "global_step": 452965, "epoch": 2696} {"train_loss": -12.336734771728516, "global_step": 452966, "epoch": 2696} {"train_loss": -12.124979972839355, "global_step": 452967, "epoch": 2696} {"train_loss": -12.525014877319336, "global_step": 452968, "epoch": 2696} {"train_loss": -12.131268501281738, "global_step": 452969, "epoch": 2696} {"train_loss": -12.33449935913086, "global_step": 452970, "epoch": 2696} {"train_loss": -11.977405548095703, "global_step": 452971, "epoch": 2696} {"train_loss": -11.622116088867188, "global_step": 452972, "epoch": 2696} {"train_loss": -10.910720825195312, "global_step": 452973, "epoch": 2696} {"train_loss": -11.7643404006958, "global_step": 452974, "epoch": 2696} {"train_loss": -12.181127548217773, "global_step": 452975, "epoch": 2696} {"train_loss": -10.924785614013672, "global_step": 452976, "epoch": 2696} {"train_loss": -12.548057556152344, "global_step": 452977, "epoch": 2696} {"train_loss": -11.328353881835938, "global_step": 452978, "epoch": 2696} {"train_loss": -11.041707992553711, "global_step": 452979, "epoch": 2696} {"train_loss": -12.284263610839844, "global_step": 452980, "epoch": 2696} {"train_loss": -11.924140930175781, "global_step": 452981, "epoch": 2696} {"train_loss": -12.062458992004395, "global_step": 452982, "epoch": 2696} {"train_loss": -11.751250267028809, "global_step": 452983, "epoch": 2696} {"train_loss": -12.184616088867188, "global_step": 452984, "epoch": 2696} {"train_loss": -11.834505081176758, "global_step": 452985, "epoch": 2696} {"train_loss": -11.155876159667969, "global_step": 452986, "epoch": 2696} {"train_loss": -12.597053527832031, "global_step": 452987, "epoch": 2696} {"train_loss": -11.074899673461914, "global_step": 452988, "epoch": 2696} {"train_loss": -12.128215789794922, "global_step": 452989, "epoch": 2696} {"train_loss": -12.308128356933594, "global_step": 452990, "epoch": 2696} {"train_loss": -11.799774169921875, "global_step": 452991, "epoch": 2696} {"train_loss": -12.545849800109863, "global_step": 452992, "epoch": 2696} {"train_loss": -12.218425750732422, "global_step": 452993, "epoch": 2696} {"train_loss": -11.316493034362793, "global_step": 452994, "epoch": 2696} {"train_loss": -12.608192443847656, "global_step": 452995, "epoch": 2696} {"train_loss": -11.525216102600098, "global_step": 452996, "epoch": 2696} {"train_loss": -11.80533218383789, "global_step": 452997, "epoch": 2696} {"train_loss": -12.471633911132812, "global_step": 452998, "epoch": 2696} {"train_loss": -11.239051818847656, "global_step": 452999, "epoch": 2696} {"train_loss": -12.195615768432617, "global_step": 453000, "epoch": 2696} {"train_loss": -12.17646598815918, "global_step": 453001, "epoch": 2696} {"train_loss": -11.941423416137695, "global_step": 453002, "epoch": 2696} {"train_loss": -12.297042846679688, "global_step": 453003, "epoch": 2696} {"train_loss": -12.37175178527832, "global_step": 453004, "epoch": 2696} {"train_loss": -12.196855545043945, "global_step": 453005, "epoch": 2696} {"train_loss": -12.208207130432129, "global_step": 453006, "epoch": 2696} {"train_loss": -12.137032508850098, "global_step": 453007, "epoch": 2696} {"train_loss": -12.453390121459961, "global_step": 453008, "epoch": 2696} {"train_loss": -12.313209533691406, "global_step": 453009, "epoch": 2696} {"train_loss": -12.752857208251953, "global_step": 453010, "epoch": 2696} {"train_loss": -12.72041130065918, "global_step": 453011, "epoch": 2696} {"train_loss": -12.573812484741211, "global_step": 453012, "epoch": 2696} {"train_loss": -12.336454391479492, "global_step": 453013, "epoch": 2696} {"train_loss": -12.508058547973633, "global_step": 453014, "epoch": 2696} {"train_loss": -12.475994110107422, "global_step": 453015, "epoch": 2696} {"train_loss": -12.353092193603516, "global_step": 453016, "epoch": 2696} {"train_loss": -12.63243293762207, "global_step": 453017, "epoch": 2696} {"train_loss": -12.211013793945312, "global_step": 453018, "epoch": 2696} {"train_loss": -12.736373901367188, "global_step": 453019, "epoch": 2696} {"train_loss": -12.114044189453125, "global_step": 453020, "epoch": 2696} {"train_loss": -12.531246185302734, "global_step": 453021, "epoch": 2696} {"train_loss": -12.519169807434082, "global_step": 453022, "epoch": 2696} {"train_loss": -12.467584609985352, "global_step": 453023, "epoch": 2696} {"train_loss": -12.372781753540039, "global_step": 453024, "epoch": 2696} {"train_loss": -11.449681282043457, "global_step": 453025, "epoch": 2696} {"train_loss": -11.927825927734375, "global_step": 453026, "epoch": 2696} {"train_loss": -11.011582374572754, "global_step": 453027, "epoch": 2696} {"train_loss": -11.93959903717041, "global_step": 453028, "epoch": 2696} {"train_loss": -12.073759078979492, "global_step": 453029, "epoch": 2696} {"train_loss": -11.35300064086914, "global_step": 453030, "epoch": 2696} {"train_loss": -12.332747459411621, "global_step": 453031, "epoch": 2696} {"train_loss": -11.607707977294922, "global_step": 453032, "epoch": 2696} {"train_loss": -12.162506103515625, "global_step": 453033, "epoch": 2696} {"train_loss": -11.727363586425781, "global_step": 453034, "epoch": 2696} {"train_loss": -11.486336708068848, "global_step": 453035, "epoch": 2696} {"train_loss": -11.748871803283691, "global_step": 453036, "epoch": 2696} {"train_loss": -11.334903717041016, "global_step": 453037, "epoch": 2696} {"train_loss": -11.61258602142334, "global_step": 453038, "epoch": 2696} {"train_loss": -11.29432201385498, "global_step": 453039, "epoch": 2696} {"train_loss": -11.687386512756348, "global_step": 453040, "epoch": 2696} {"train_loss": -11.97174072265625, "global_step": 453041, "epoch": 2696} {"train_loss": -12.126535415649414, "global_step": 453042, "epoch": 2696} {"train_loss": -12.071349143981934, "global_step": 453043, "epoch": 2696} {"train_loss": -12.255939483642578, "global_step": 453044, "epoch": 2696} {"train_loss": -11.818893432617188, "global_step": 453045, "epoch": 2696} {"train_loss": -12.310881614685059, "global_step": 453046, "epoch": 2696} {"train_loss": -12.093436241149902, "global_step": 453047, "epoch": 2696} {"train_loss": -12.231470108032227, "global_step": 453048, "epoch": 2696} {"train_loss": -12.298952102661133, "global_step": 453049, "epoch": 2696} {"train_loss": -11.649222373962402, "global_step": 453050, "epoch": 2696} {"train_loss": -12.28512954711914, "global_step": 453051, "epoch": 2696} {"train_loss": -11.342689514160156, "global_step": 453052, "epoch": 2696} {"train_loss": -11.963740348815918, "global_step": 453053, "epoch": 2696} {"train_loss": -11.525918006896973, "global_step": 453054, "epoch": 2696} {"train_loss": -11.55770206451416, "global_step": 453055, "epoch": 2696} {"train_loss": -11.3626708984375, "global_step": 453056, "epoch": 2696} {"train_loss": -11.812259674072266, "global_step": 453057, "epoch": 2696} {"train_loss": -12.4873685836792, "global_step": 453058, "epoch": 2696} {"train_loss": -11.436685562133789, "global_step": 453059, "epoch": 2696} {"train_loss": -11.834059715270996, "global_step": 453060, "epoch": 2696} {"train_loss": -12.121383666992188, "global_step": 453061, "epoch": 2696} {"train_loss": -11.82175064086914, "global_step": 453062, "epoch": 2696} {"train_loss": -12.155876159667969, "global_step": 453063, "epoch": 2696} {"train_loss": -11.904197692871094, "global_step": 453064, "epoch": 2696} {"train_loss": -12.39388370513916, "global_step": 453065, "epoch": 2696} {"train_loss": -12.125638961791992, "global_step": 453066, "epoch": 2696} {"train_loss": -12.445119857788086, "global_step": 453067, "epoch": 2696} {"train_loss": -11.795280456542969, "global_step": 453068, "epoch": 2696} {"train_loss": -12.458355903625488, "global_step": 453069, "epoch": 2696} {"train_loss": -12.302727699279785, "global_step": 453070, "epoch": 2696} {"train_loss": -12.453628540039062, "global_step": 453071, "epoch": 2696} {"train_loss": -12.357950210571289, "global_step": 453072, "epoch": 2696} {"train_loss": -12.535467147827148, "global_step": 453073, "epoch": 2696} {"train_loss": -12.439998626708984, "global_step": 453074, "epoch": 2696} {"train_loss": -12.755716323852539, "global_step": 453075, "epoch": 2696} {"train_loss": -12.383014678955078, "global_step": 453076, "epoch": 2696} {"train_loss": -12.812044143676758, "global_step": 453077, "epoch": 2696} {"train_loss": -12.438933372497559, "global_step": 453078, "epoch": 2696} {"train_loss": -12.797920227050781, "global_step": 453079, "epoch": 2696} {"train_loss": -12.723193168640137, "global_step": 453080, "epoch": 2696} {"train_loss": -12.542743682861328, "global_step": 453081, "epoch": 2696} {"train_loss": -12.75687026977539, "global_step": 453082, "epoch": 2696} {"train_loss": -12.44847583770752, "global_step": 453083, "epoch": 2696} {"train_loss": -12.720087051391602, "global_step": 453084, "epoch": 2696} {"train_loss": -12.64985466003418, "global_step": 453085, "epoch": 2696} {"train_loss": -12.768190383911133, "global_step": 453086, "epoch": 2696} {"train_loss": -12.395265579223633, "global_step": 453087, "epoch": 2696} {"train_loss": -12.86606216430664, "global_step": 453088, "epoch": 2696} {"train_loss": -12.640897750854492, "global_step": 453089, "epoch": 2696} {"train_loss": -12.667101860046387, "global_step": 453090, "epoch": 2696} {"train_loss": -12.738336563110352, "global_step": 453091, "epoch": 2696} {"train_loss": -12.556577682495117, "global_step": 453092, "epoch": 2696} {"train_loss": -12.645431518554688, "global_step": 453093, "epoch": 2696} {"train_loss": -12.717544555664062, "global_step": 453094, "epoch": 2696} {"train_loss": -12.157096590314593, "global_step": 453095, "epoch": 2696, "val_loss": 315706.15625} {"train_loss": -12.512414932250977, "global_step": 453096, "epoch": 2697} {"train_loss": -12.854636192321777, "global_step": 453097, "epoch": 2697} {"train_loss": -12.68091869354248, "global_step": 453098, "epoch": 2697} {"train_loss": -12.487322807312012, "global_step": 453099, "epoch": 2697} {"train_loss": -12.840408325195312, "global_step": 453100, "epoch": 2697} {"train_loss": -12.64249038696289, "global_step": 453101, "epoch": 2697} {"train_loss": -12.688608169555664, "global_step": 453102, "epoch": 2697} {"train_loss": -12.745514869689941, "global_step": 453103, "epoch": 2697} {"train_loss": -12.469648361206055, "global_step": 453104, "epoch": 2697} {"train_loss": -12.775840759277344, "global_step": 453105, "epoch": 2697} {"train_loss": -12.583309173583984, "global_step": 453106, "epoch": 2697} {"train_loss": -12.584087371826172, "global_step": 453107, "epoch": 2697} {"train_loss": -12.602746963500977, "global_step": 453108, "epoch": 2697} {"train_loss": -12.767416000366211, "global_step": 453109, "epoch": 2697} {"train_loss": -12.242523193359375, "global_step": 453110, "epoch": 2697} {"train_loss": -12.004793167114258, "global_step": 453111, "epoch": 2697} {"train_loss": -11.840982437133789, "global_step": 453112, "epoch": 2697} {"train_loss": -12.732851028442383, "global_step": 453113, "epoch": 2697} {"train_loss": -11.974053382873535, "global_step": 453114, "epoch": 2697} {"train_loss": -11.091795921325684, "global_step": 453115, "epoch": 2697} {"train_loss": -12.29035758972168, "global_step": 453116, "epoch": 2697} {"train_loss": -12.331371307373047, "global_step": 453117, "epoch": 2697} {"train_loss": -11.587664604187012, "global_step": 453118, "epoch": 2697} {"train_loss": -12.669187545776367, "global_step": 453119, "epoch": 2697} {"train_loss": -11.752730369567871, "global_step": 453120, "epoch": 2697} {"train_loss": -11.578296661376953, "global_step": 453121, "epoch": 2697} {"train_loss": -12.299331665039062, "global_step": 453122, "epoch": 2697} {"train_loss": -12.037286758422852, "global_step": 453123, "epoch": 2697} {"train_loss": -11.484013557434082, "global_step": 453124, "epoch": 2697} {"train_loss": -12.172811508178711, "global_step": 453125, "epoch": 2697} {"train_loss": -10.795500755310059, "global_step": 453126, "epoch": 2697} {"train_loss": -11.596370697021484, "global_step": 453127, "epoch": 2697} {"train_loss": -11.812784194946289, "global_step": 453128, "epoch": 2697} {"train_loss": -10.461766242980957, "global_step": 453129, "epoch": 2697} {"train_loss": -10.740314483642578, "global_step": 453130, "epoch": 2697} {"train_loss": -10.299651145935059, "global_step": 453131, "epoch": 2697} {"train_loss": -11.388392448425293, "global_step": 453132, "epoch": 2697} {"train_loss": -9.289669036865234, "global_step": 453133, "epoch": 2697} {"train_loss": -10.432234764099121, "global_step": 453134, "epoch": 2697} {"train_loss": -9.432832717895508, "global_step": 453135, "epoch": 2697} {"train_loss": -11.31037712097168, "global_step": 453136, "epoch": 2697} {"train_loss": -9.021089553833008, "global_step": 453137, "epoch": 2697} {"train_loss": -10.978402137756348, "global_step": 453138, "epoch": 2697} {"train_loss": -9.66356372833252, "global_step": 453139, "epoch": 2697} {"train_loss": -10.997196197509766, "global_step": 453140, "epoch": 2697} {"train_loss": -10.006195068359375, "global_step": 453141, "epoch": 2697} {"train_loss": -11.045228004455566, "global_step": 453142, "epoch": 2697} {"train_loss": -10.935663223266602, "global_step": 453143, "epoch": 2697} {"train_loss": -10.488225936889648, "global_step": 453144, "epoch": 2697} {"train_loss": -11.41646671295166, "global_step": 453145, "epoch": 2697} {"train_loss": -10.576417922973633, "global_step": 453146, "epoch": 2697} {"train_loss": -11.391237258911133, "global_step": 453147, "epoch": 2697} {"train_loss": -11.297266006469727, "global_step": 453148, "epoch": 2697} {"train_loss": -11.811055183410645, "global_step": 453149, "epoch": 2697} {"train_loss": -12.060921669006348, "global_step": 453150, "epoch": 2697} {"train_loss": -11.094804763793945, "global_step": 453151, "epoch": 2697} {"train_loss": -12.23241901397705, "global_step": 453152, "epoch": 2697} {"train_loss": -11.666203498840332, "global_step": 453153, "epoch": 2697} {"train_loss": -11.85892105102539, "global_step": 453154, "epoch": 2697} {"train_loss": -11.832653999328613, "global_step": 453155, "epoch": 2697} {"train_loss": -11.658267974853516, "global_step": 453156, "epoch": 2697} {"train_loss": -12.260726928710938, "global_step": 453157, "epoch": 2697} {"train_loss": -11.786478042602539, "global_step": 453158, "epoch": 2697} {"train_loss": -12.196855545043945, "global_step": 453159, "epoch": 2697} {"train_loss": -11.991178512573242, "global_step": 453160, "epoch": 2697} {"train_loss": -12.01196575164795, "global_step": 453161, "epoch": 2697} {"train_loss": -11.917953491210938, "global_step": 453162, "epoch": 2697} {"train_loss": -11.393314361572266, "global_step": 453163, "epoch": 2697} {"train_loss": -11.817731857299805, "global_step": 453164, "epoch": 2697} {"train_loss": -12.32094955444336, "global_step": 453165, "epoch": 2697} {"train_loss": -11.281492233276367, "global_step": 453166, "epoch": 2697} {"train_loss": -12.230077743530273, "global_step": 453167, "epoch": 2697} {"train_loss": -11.5575532913208, "global_step": 453168, "epoch": 2697} {"train_loss": -12.017228126525879, "global_step": 453169, "epoch": 2697} {"train_loss": -12.315771102905273, "global_step": 453170, "epoch": 2697} {"train_loss": -12.113624572753906, "global_step": 453171, "epoch": 2697} {"train_loss": -12.382214546203613, "global_step": 453172, "epoch": 2697} {"train_loss": -12.22089958190918, "global_step": 453173, "epoch": 2697} {"train_loss": -11.946783065795898, "global_step": 453174, "epoch": 2697} {"train_loss": -12.065890312194824, "global_step": 453175, "epoch": 2697} {"train_loss": -11.682657241821289, "global_step": 453176, "epoch": 2697} {"train_loss": -12.282064437866211, "global_step": 453177, "epoch": 2697} {"train_loss": -12.29343032836914, "global_step": 453178, "epoch": 2697} {"train_loss": -12.010486602783203, "global_step": 453179, "epoch": 2697} {"train_loss": -12.273919105529785, "global_step": 453180, "epoch": 2697} {"train_loss": -12.26291275024414, "global_step": 453181, "epoch": 2697} {"train_loss": -11.944140434265137, "global_step": 453182, "epoch": 2697} {"train_loss": -12.054986953735352, "global_step": 453183, "epoch": 2697} {"train_loss": -12.106302261352539, "global_step": 453184, "epoch": 2697} {"train_loss": -12.037339210510254, "global_step": 453185, "epoch": 2697} {"train_loss": -12.504480361938477, "global_step": 453186, "epoch": 2697} {"train_loss": -12.198427200317383, "global_step": 453187, "epoch": 2697} {"train_loss": -12.520157814025879, "global_step": 453188, "epoch": 2697} {"train_loss": -12.46319580078125, "global_step": 453189, "epoch": 2697} {"train_loss": -12.193436622619629, "global_step": 453190, "epoch": 2697} {"train_loss": -12.377378463745117, "global_step": 453191, "epoch": 2697} {"train_loss": -12.4761381149292, "global_step": 453192, "epoch": 2697} {"train_loss": -12.574088096618652, "global_step": 453193, "epoch": 2697} {"train_loss": -12.569293975830078, "global_step": 453194, "epoch": 2697} {"train_loss": -12.483840942382812, "global_step": 453195, "epoch": 2697} {"train_loss": -12.659029006958008, "global_step": 453196, "epoch": 2697} {"train_loss": -12.355497360229492, "global_step": 453197, "epoch": 2697} {"train_loss": -12.689277648925781, "global_step": 453198, "epoch": 2697} {"train_loss": -12.732165336608887, "global_step": 453199, "epoch": 2697} {"train_loss": -12.451473236083984, "global_step": 453200, "epoch": 2697} {"train_loss": -12.589733123779297, "global_step": 453201, "epoch": 2697} {"train_loss": -12.675437927246094, "global_step": 453202, "epoch": 2697} {"train_loss": -12.382305145263672, "global_step": 453203, "epoch": 2697} {"train_loss": -12.650103569030762, "global_step": 453204, "epoch": 2697} {"train_loss": -12.732085227966309, "global_step": 453205, "epoch": 2697} {"train_loss": -12.533233642578125, "global_step": 453206, "epoch": 2697} {"train_loss": -12.759743690490723, "global_step": 453207, "epoch": 2697} {"train_loss": -12.500589370727539, "global_step": 453208, "epoch": 2697} {"train_loss": -12.643308639526367, "global_step": 453209, "epoch": 2697} {"train_loss": -12.750761032104492, "global_step": 453210, "epoch": 2697} {"train_loss": -12.652700424194336, "global_step": 453211, "epoch": 2697} {"train_loss": -12.502484321594238, "global_step": 453212, "epoch": 2697} {"train_loss": -12.604997634887695, "global_step": 453213, "epoch": 2697} {"train_loss": -12.49307918548584, "global_step": 453214, "epoch": 2697} {"train_loss": -12.610830307006836, "global_step": 453215, "epoch": 2697} {"train_loss": -12.817276000976562, "global_step": 453216, "epoch": 2697} {"train_loss": -12.547922134399414, "global_step": 453217, "epoch": 2697} {"train_loss": -12.610092163085938, "global_step": 453218, "epoch": 2697} {"train_loss": -12.275947570800781, "global_step": 453219, "epoch": 2697} {"train_loss": -12.585798263549805, "global_step": 453220, "epoch": 2697} {"train_loss": -12.600448608398438, "global_step": 453221, "epoch": 2697} {"train_loss": -12.488261222839355, "global_step": 453222, "epoch": 2697} {"train_loss": -12.238590240478516, "global_step": 453223, "epoch": 2697} {"train_loss": -12.597620010375977, "global_step": 453224, "epoch": 2697} {"train_loss": -12.437131881713867, "global_step": 453225, "epoch": 2697} {"train_loss": -12.510684967041016, "global_step": 453226, "epoch": 2697} {"train_loss": -12.551591873168945, "global_step": 453227, "epoch": 2697} {"train_loss": -12.196128845214844, "global_step": 453228, "epoch": 2697} {"train_loss": -12.735254287719727, "global_step": 453229, "epoch": 2697} {"train_loss": -12.825010299682617, "global_step": 453230, "epoch": 2697} {"train_loss": -12.66578197479248, "global_step": 453231, "epoch": 2697} {"train_loss": -12.79347038269043, "global_step": 453232, "epoch": 2697} {"train_loss": -12.690299034118652, "global_step": 453233, "epoch": 2697} {"train_loss": -12.7671480178833, "global_step": 453234, "epoch": 2697} {"train_loss": -12.85693645477295, "global_step": 453235, "epoch": 2697} {"train_loss": -12.51779842376709, "global_step": 453236, "epoch": 2697} {"train_loss": -12.940329551696777, "global_step": 453237, "epoch": 2697} {"train_loss": -12.657218933105469, "global_step": 453238, "epoch": 2697} {"train_loss": -12.840853691101074, "global_step": 453239, "epoch": 2697} {"train_loss": -12.771278381347656, "global_step": 453240, "epoch": 2697} {"train_loss": -12.63891887664795, "global_step": 453241, "epoch": 2697} {"train_loss": -12.691953659057617, "global_step": 453242, "epoch": 2697} {"train_loss": -12.868243217468262, "global_step": 453243, "epoch": 2697} {"train_loss": -12.631444931030273, "global_step": 453244, "epoch": 2697} {"train_loss": -12.741373062133789, "global_step": 453245, "epoch": 2697} {"train_loss": -12.80499267578125, "global_step": 453246, "epoch": 2697} {"train_loss": -12.433727264404297, "global_step": 453247, "epoch": 2697} {"train_loss": -12.584856033325195, "global_step": 453248, "epoch": 2697} {"train_loss": -12.432024955749512, "global_step": 453249, "epoch": 2697} {"train_loss": -11.96853256225586, "global_step": 453250, "epoch": 2697} {"train_loss": -12.458052635192871, "global_step": 453251, "epoch": 2697} {"train_loss": -12.81052017211914, "global_step": 453252, "epoch": 2697} {"train_loss": -12.508875846862793, "global_step": 453253, "epoch": 2697} {"train_loss": -11.667596817016602, "global_step": 453254, "epoch": 2697} {"train_loss": -12.25283432006836, "global_step": 453255, "epoch": 2697} {"train_loss": -12.633886337280273, "global_step": 453256, "epoch": 2697} {"train_loss": -11.76993179321289, "global_step": 453257, "epoch": 2697} {"train_loss": -11.314830780029297, "global_step": 453258, "epoch": 2697} {"train_loss": -12.665121078491211, "global_step": 453259, "epoch": 2697} {"train_loss": -10.947103500366211, "global_step": 453260, "epoch": 2697} {"train_loss": -11.924201011657715, "global_step": 453261, "epoch": 2697} {"train_loss": -12.592818260192871, "global_step": 453262, "epoch": 2697} {"train_loss": -12.103517594791594, "global_step": 453263, "epoch": 2697, "val_loss": 312020.75} {"train_loss": -11.845480918884277, "global_step": 453264, "epoch": 2698} {"train_loss": -12.110687255859375, "global_step": 453265, "epoch": 2698} {"train_loss": -12.369220733642578, "global_step": 453266, "epoch": 2698} {"train_loss": -12.191267967224121, "global_step": 453267, "epoch": 2698} {"train_loss": -12.032038688659668, "global_step": 453268, "epoch": 2698} {"train_loss": -12.515576362609863, "global_step": 453269, "epoch": 2698} {"train_loss": -12.413156509399414, "global_step": 453270, "epoch": 2698} {"train_loss": -12.408910751342773, "global_step": 453271, "epoch": 2698} {"train_loss": -12.752187728881836, "global_step": 453272, "epoch": 2698} {"train_loss": -12.321562767028809, "global_step": 453273, "epoch": 2698} {"train_loss": -12.52393913269043, "global_step": 453274, "epoch": 2698} {"train_loss": -12.433837890625, "global_step": 453275, "epoch": 2698} {"train_loss": -12.673303604125977, "global_step": 453276, "epoch": 2698} {"train_loss": -12.326101303100586, "global_step": 453277, "epoch": 2698} {"train_loss": -12.787124633789062, "global_step": 453278, "epoch": 2698} {"train_loss": -12.432013511657715, "global_step": 453279, "epoch": 2698} {"train_loss": -12.247617721557617, "global_step": 453280, "epoch": 2698} {"train_loss": -12.184277534484863, "global_step": 453281, "epoch": 2698} {"train_loss": -12.402250289916992, "global_step": 453282, "epoch": 2698} {"train_loss": -12.479177474975586, "global_step": 453283, "epoch": 2698} {"train_loss": -12.890047073364258, "global_step": 453284, "epoch": 2698} {"train_loss": -12.086531639099121, "global_step": 453285, "epoch": 2698} {"train_loss": -11.304434776306152, "global_step": 453286, "epoch": 2698} {"train_loss": -12.686467170715332, "global_step": 453287, "epoch": 2698} {"train_loss": -12.065685272216797, "global_step": 453288, "epoch": 2698} {"train_loss": -12.85403823852539, "global_step": 453289, "epoch": 2698} {"train_loss": -12.6585111618042, "global_step": 453290, "epoch": 2698} {"train_loss": -12.711529731750488, "global_step": 453291, "epoch": 2698} {"train_loss": -12.770647048950195, "global_step": 453292, "epoch": 2698} {"train_loss": -12.871660232543945, "global_step": 453293, "epoch": 2698} {"train_loss": -12.839911460876465, "global_step": 453294, "epoch": 2698} {"train_loss": -12.706228256225586, "global_step": 453295, "epoch": 2698} {"train_loss": -12.637113571166992, "global_step": 453296, "epoch": 2698} {"train_loss": -12.781623840332031, "global_step": 453297, "epoch": 2698} {"train_loss": -12.858972549438477, "global_step": 453298, "epoch": 2698} {"train_loss": -12.468008041381836, "global_step": 453299, "epoch": 2698} {"train_loss": -12.687372207641602, "global_step": 453300, "epoch": 2698} {"train_loss": -12.546880722045898, "global_step": 453301, "epoch": 2698} {"train_loss": -12.333619117736816, "global_step": 453302, "epoch": 2698} {"train_loss": -12.033437728881836, "global_step": 453303, "epoch": 2698} {"train_loss": -11.793715476989746, "global_step": 453304, "epoch": 2698} {"train_loss": -12.781413078308105, "global_step": 453305, "epoch": 2698} {"train_loss": -12.363067626953125, "global_step": 453306, "epoch": 2698} {"train_loss": -12.022378921508789, "global_step": 453307, "epoch": 2698} {"train_loss": -11.326780319213867, "global_step": 453308, "epoch": 2698} {"train_loss": -11.713590621948242, "global_step": 453309, "epoch": 2698} {"train_loss": -11.88380241394043, "global_step": 453310, "epoch": 2698} {"train_loss": -11.787656784057617, "global_step": 453311, "epoch": 2698} {"train_loss": -10.677740097045898, "global_step": 453312, "epoch": 2698} {"train_loss": -11.910236358642578, "global_step": 453313, "epoch": 2698} {"train_loss": -9.781100273132324, "global_step": 453314, "epoch": 2698} {"train_loss": -9.815038681030273, "global_step": 453315, "epoch": 2698} {"train_loss": -10.989080429077148, "global_step": 453316, "epoch": 2698} {"train_loss": -11.429250717163086, "global_step": 453317, "epoch": 2698} {"train_loss": -10.759246826171875, "global_step": 453318, "epoch": 2698} {"train_loss": -11.50461196899414, "global_step": 453319, "epoch": 2698} {"train_loss": -10.802627563476562, "global_step": 453320, "epoch": 2698} {"train_loss": -11.363664627075195, "global_step": 453321, "epoch": 2698} {"train_loss": -11.252914428710938, "global_step": 453322, "epoch": 2698} {"train_loss": -10.850884437561035, "global_step": 453323, "epoch": 2698} {"train_loss": -11.428834915161133, "global_step": 453324, "epoch": 2698} {"train_loss": -11.423877716064453, "global_step": 453325, "epoch": 2698} {"train_loss": -10.235113143920898, "global_step": 453326, "epoch": 2698} {"train_loss": -11.062429428100586, "global_step": 453327, "epoch": 2698} {"train_loss": -11.239452362060547, "global_step": 453328, "epoch": 2698} {"train_loss": -10.657761573791504, "global_step": 453329, "epoch": 2698} {"train_loss": -11.608173370361328, "global_step": 453330, "epoch": 2698} {"train_loss": -11.114212036132812, "global_step": 453331, "epoch": 2698} {"train_loss": -11.357756614685059, "global_step": 453332, "epoch": 2698} {"train_loss": -11.635337829589844, "global_step": 453333, "epoch": 2698} {"train_loss": -11.955209732055664, "global_step": 453334, "epoch": 2698} {"train_loss": -12.200772285461426, "global_step": 453335, "epoch": 2698} {"train_loss": -11.214786529541016, "global_step": 453336, "epoch": 2698} {"train_loss": -12.351065635681152, "global_step": 453337, "epoch": 2698} {"train_loss": -11.789551734924316, "global_step": 453338, "epoch": 2698} {"train_loss": -12.360344886779785, "global_step": 453339, "epoch": 2698} {"train_loss": -12.40128231048584, "global_step": 453340, "epoch": 2698} {"train_loss": -12.150921821594238, "global_step": 453341, "epoch": 2698} {"train_loss": -12.377155303955078, "global_step": 453342, "epoch": 2698} {"train_loss": -12.016109466552734, "global_step": 453343, "epoch": 2698} {"train_loss": -12.483943939208984, "global_step": 453344, "epoch": 2698} {"train_loss": -12.122173309326172, "global_step": 453345, "epoch": 2698} {"train_loss": -12.295125007629395, "global_step": 453346, "epoch": 2698} {"train_loss": -12.272924423217773, "global_step": 453347, "epoch": 2698} {"train_loss": -12.211450576782227, "global_step": 453348, "epoch": 2698} {"train_loss": -12.32291030883789, "global_step": 453349, "epoch": 2698} {"train_loss": -12.40744400024414, "global_step": 453350, "epoch": 2698} {"train_loss": -12.497100830078125, "global_step": 453351, "epoch": 2698} {"train_loss": -12.162437438964844, "global_step": 453352, "epoch": 2698} {"train_loss": -12.535131454467773, "global_step": 453353, "epoch": 2698} {"train_loss": -12.064435958862305, "global_step": 453354, "epoch": 2698} {"train_loss": -12.345972061157227, "global_step": 453355, "epoch": 2698} {"train_loss": -12.100391387939453, "global_step": 453356, "epoch": 2698} {"train_loss": -12.565169334411621, "global_step": 453357, "epoch": 2698} {"train_loss": -12.1348876953125, "global_step": 453358, "epoch": 2698} {"train_loss": -12.193584442138672, "global_step": 453359, "epoch": 2698} {"train_loss": -11.364513397216797, "global_step": 453360, "epoch": 2698} {"train_loss": -11.585382461547852, "global_step": 453361, "epoch": 2698} {"train_loss": -10.628911972045898, "global_step": 453362, "epoch": 2698} {"train_loss": -12.138923645019531, "global_step": 453363, "epoch": 2698} {"train_loss": -11.512777328491211, "global_step": 453364, "epoch": 2698} {"train_loss": -12.04020881652832, "global_step": 453365, "epoch": 2698} {"train_loss": -11.250993728637695, "global_step": 453366, "epoch": 2698} {"train_loss": -12.444756507873535, "global_step": 453367, "epoch": 2698} {"train_loss": -11.31901741027832, "global_step": 453368, "epoch": 2698} {"train_loss": -11.954961776733398, "global_step": 453369, "epoch": 2698} {"train_loss": -11.692519187927246, "global_step": 453370, "epoch": 2698} {"train_loss": -11.691766738891602, "global_step": 453371, "epoch": 2698} {"train_loss": -12.114263534545898, "global_step": 453372, "epoch": 2698} {"train_loss": -11.636167526245117, "global_step": 453373, "epoch": 2698} {"train_loss": -11.91380500793457, "global_step": 453374, "epoch": 2698} {"train_loss": -11.900016784667969, "global_step": 453375, "epoch": 2698} {"train_loss": -12.133543014526367, "global_step": 453376, "epoch": 2698} {"train_loss": -11.664346694946289, "global_step": 453377, "epoch": 2698} {"train_loss": -12.26048469543457, "global_step": 453378, "epoch": 2698} {"train_loss": -11.799620628356934, "global_step": 453379, "epoch": 2698} {"train_loss": -12.349746704101562, "global_step": 453380, "epoch": 2698} {"train_loss": -12.138351440429688, "global_step": 453381, "epoch": 2698} {"train_loss": -12.173089981079102, "global_step": 453382, "epoch": 2698} {"train_loss": -12.457259178161621, "global_step": 453383, "epoch": 2698} {"train_loss": -12.300813674926758, "global_step": 453384, "epoch": 2698} {"train_loss": -12.391845703125, "global_step": 453385, "epoch": 2698} {"train_loss": -12.439897537231445, "global_step": 453386, "epoch": 2698} {"train_loss": -12.450862884521484, "global_step": 453387, "epoch": 2698} {"train_loss": -12.468147277832031, "global_step": 453388, "epoch": 2698} {"train_loss": -12.663797378540039, "global_step": 453389, "epoch": 2698} {"train_loss": -12.484593391418457, "global_step": 453390, "epoch": 2698} {"train_loss": -12.383888244628906, "global_step": 453391, "epoch": 2698} {"train_loss": -12.675909042358398, "global_step": 453392, "epoch": 2698} {"train_loss": -12.236610412597656, "global_step": 453393, "epoch": 2698} {"train_loss": -12.729280471801758, "global_step": 453394, "epoch": 2698} {"train_loss": -12.529038429260254, "global_step": 453395, "epoch": 2698} {"train_loss": -12.580677032470703, "global_step": 453396, "epoch": 2698} {"train_loss": -12.601095199584961, "global_step": 453397, "epoch": 2698} {"train_loss": -12.385318756103516, "global_step": 453398, "epoch": 2698} {"train_loss": -12.608555793762207, "global_step": 453399, "epoch": 2698} {"train_loss": -12.34803581237793, "global_step": 453400, "epoch": 2698} {"train_loss": -12.853328704833984, "global_step": 453401, "epoch": 2698} {"train_loss": -12.457801818847656, "global_step": 453402, "epoch": 2698} {"train_loss": -12.513229370117188, "global_step": 453403, "epoch": 2698} {"train_loss": -12.678596496582031, "global_step": 453404, "epoch": 2698} {"train_loss": -12.619430541992188, "global_step": 453405, "epoch": 2698} {"train_loss": -12.626392364501953, "global_step": 453406, "epoch": 2698} {"train_loss": -12.534407615661621, "global_step": 453407, "epoch": 2698} {"train_loss": -12.47641658782959, "global_step": 453408, "epoch": 2698} {"train_loss": -12.580282211303711, "global_step": 453409, "epoch": 2698} {"train_loss": -12.154760360717773, "global_step": 453410, "epoch": 2698} {"train_loss": -12.644100189208984, "global_step": 453411, "epoch": 2698} {"train_loss": -12.60568618774414, "global_step": 453412, "epoch": 2698} {"train_loss": -12.234142303466797, "global_step": 453413, "epoch": 2698} {"train_loss": -11.865692138671875, "global_step": 453414, "epoch": 2698} {"train_loss": -12.576465606689453, "global_step": 453415, "epoch": 2698} {"train_loss": -12.090319633483887, "global_step": 453416, "epoch": 2698} {"train_loss": -11.70815372467041, "global_step": 453417, "epoch": 2698} {"train_loss": -12.312376022338867, "global_step": 453418, "epoch": 2698} {"train_loss": -12.271272659301758, "global_step": 453419, "epoch": 2698} {"train_loss": -11.079314231872559, "global_step": 453420, "epoch": 2698} {"train_loss": -12.364919662475586, "global_step": 453421, "epoch": 2698} {"train_loss": -10.605731964111328, "global_step": 453422, "epoch": 2698} {"train_loss": -12.190108299255371, "global_step": 453423, "epoch": 2698} {"train_loss": -11.643133163452148, "global_step": 453424, "epoch": 2698} {"train_loss": -11.875313758850098, "global_step": 453425, "epoch": 2698} {"train_loss": -12.006242752075195, "global_step": 453426, "epoch": 2698} {"train_loss": -11.778360366821289, "global_step": 453427, "epoch": 2698} {"train_loss": -12.445305824279785, "global_step": 453428, "epoch": 2698} {"train_loss": -11.56314468383789, "global_step": 453429, "epoch": 2698} {"train_loss": -12.663599014282227, "global_step": 453430, "epoch": 2698} {"train_loss": -12.07320158822196, "global_step": 453431, "epoch": 2698, "val_loss": 308459.78125} {"train_loss": -12.25736141204834, "global_step": 453432, "epoch": 2699} {"train_loss": -11.670413970947266, "global_step": 453433, "epoch": 2699} {"train_loss": -11.80134391784668, "global_step": 453434, "epoch": 2699} {"train_loss": -12.258772850036621, "global_step": 453435, "epoch": 2699} {"train_loss": -11.872512817382812, "global_step": 453436, "epoch": 2699} {"train_loss": -11.935708999633789, "global_step": 453437, "epoch": 2699} {"train_loss": -12.219136238098145, "global_step": 453438, "epoch": 2699} {"train_loss": -11.978205680847168, "global_step": 453439, "epoch": 2699} {"train_loss": -12.346214294433594, "global_step": 453440, "epoch": 2699} {"train_loss": -12.228458404541016, "global_step": 453441, "epoch": 2699} {"train_loss": -11.600702285766602, "global_step": 453442, "epoch": 2699} {"train_loss": -12.384398460388184, "global_step": 453443, "epoch": 2699} {"train_loss": -11.014156341552734, "global_step": 453444, "epoch": 2699} {"train_loss": -12.164344787597656, "global_step": 453445, "epoch": 2699} {"train_loss": -11.998863220214844, "global_step": 453446, "epoch": 2699} {"train_loss": -11.668451309204102, "global_step": 453447, "epoch": 2699} {"train_loss": -12.362431526184082, "global_step": 453448, "epoch": 2699} {"train_loss": -10.825800895690918, "global_step": 453449, "epoch": 2699} {"train_loss": -12.316028594970703, "global_step": 453450, "epoch": 2699} {"train_loss": -10.809653282165527, "global_step": 453451, "epoch": 2699} {"train_loss": -11.527460098266602, "global_step": 453452, "epoch": 2699} {"train_loss": -12.026073455810547, "global_step": 453453, "epoch": 2699} {"train_loss": -11.71153450012207, "global_step": 453454, "epoch": 2699} {"train_loss": -11.857847213745117, "global_step": 453455, "epoch": 2699} {"train_loss": -11.899534225463867, "global_step": 453456, "epoch": 2699} {"train_loss": -12.400591850280762, "global_step": 453457, "epoch": 2699} {"train_loss": -12.624289512634277, "global_step": 453458, "epoch": 2699} {"train_loss": -12.289484977722168, "global_step": 453459, "epoch": 2699} {"train_loss": -12.613512992858887, "global_step": 453460, "epoch": 2699} {"train_loss": -12.556612014770508, "global_step": 453461, "epoch": 2699} {"train_loss": -12.42226791381836, "global_step": 453462, "epoch": 2699} {"train_loss": -12.354581832885742, "global_step": 453463, "epoch": 2699} {"train_loss": -12.357906341552734, "global_step": 453464, "epoch": 2699} {"train_loss": -12.451051712036133, "global_step": 453465, "epoch": 2699} {"train_loss": -12.728957176208496, "global_step": 453466, "epoch": 2699} {"train_loss": -12.435493469238281, "global_step": 453467, "epoch": 2699} {"train_loss": -12.25929069519043, "global_step": 453468, "epoch": 2699} {"train_loss": -12.75288200378418, "global_step": 453469, "epoch": 2699} {"train_loss": -12.521430969238281, "global_step": 453470, "epoch": 2699} {"train_loss": -12.723152160644531, "global_step": 453471, "epoch": 2699} {"train_loss": -12.807701110839844, "global_step": 453472, "epoch": 2699} {"train_loss": -12.45018482208252, "global_step": 453473, "epoch": 2699} {"train_loss": -12.73321533203125, "global_step": 453474, "epoch": 2699} {"train_loss": -12.320154190063477, "global_step": 453475, "epoch": 2699} {"train_loss": -12.738326072692871, "global_step": 453476, "epoch": 2699} {"train_loss": -12.637109756469727, "global_step": 453477, "epoch": 2699} {"train_loss": -12.696207046508789, "global_step": 453478, "epoch": 2699} {"train_loss": -12.569526672363281, "global_step": 453479, "epoch": 2699} {"train_loss": -12.691793441772461, "global_step": 453480, "epoch": 2699} {"train_loss": -12.943403244018555, "global_step": 453481, "epoch": 2699} {"train_loss": -12.62771987915039, "global_step": 453482, "epoch": 2699} {"train_loss": -12.752287864685059, "global_step": 453483, "epoch": 2699} {"train_loss": -12.875202178955078, "global_step": 453484, "epoch": 2699} {"train_loss": -12.603124618530273, "global_step": 453485, "epoch": 2699} {"train_loss": -12.685513496398926, "global_step": 453486, "epoch": 2699} {"train_loss": -12.672079086303711, "global_step": 453487, "epoch": 2699} {"train_loss": -12.922012329101562, "global_step": 453488, "epoch": 2699} {"train_loss": -12.638766288757324, "global_step": 453489, "epoch": 2699} {"train_loss": -12.530134201049805, "global_step": 453490, "epoch": 2699} {"train_loss": -12.812080383300781, "global_step": 453491, "epoch": 2699} {"train_loss": -12.813375473022461, "global_step": 453492, "epoch": 2699} {"train_loss": -12.731244087219238, "global_step": 453493, "epoch": 2699} {"train_loss": -12.650285720825195, "global_step": 453494, "epoch": 2699} {"train_loss": -12.393598556518555, "global_step": 453495, "epoch": 2699} {"train_loss": -12.86355209350586, "global_step": 453496, "epoch": 2699} {"train_loss": -12.426223754882812, "global_step": 453497, "epoch": 2699} {"train_loss": -12.773645401000977, "global_step": 453498, "epoch": 2699} {"train_loss": -12.421594619750977, "global_step": 453499, "epoch": 2699} {"train_loss": -12.738290786743164, "global_step": 453500, "epoch": 2699} {"train_loss": -12.85593032836914, "global_step": 453501, "epoch": 2699} {"train_loss": -12.547208786010742, "global_step": 453502, "epoch": 2699} {"train_loss": -12.71603775024414, "global_step": 453503, "epoch": 2699} {"train_loss": -12.680305480957031, "global_step": 453504, "epoch": 2699} {"train_loss": -12.235467910766602, "global_step": 453505, "epoch": 2699} {"train_loss": -12.662118911743164, "global_step": 453506, "epoch": 2699} {"train_loss": -12.564159393310547, "global_step": 453507, "epoch": 2699} {"train_loss": -12.4335298538208, "global_step": 453508, "epoch": 2699} {"train_loss": -13.00084400177002, "global_step": 453509, "epoch": 2699} {"train_loss": -12.404985427856445, "global_step": 453510, "epoch": 2699} {"train_loss": -12.388063430786133, "global_step": 453511, "epoch": 2699} {"train_loss": -12.731019020080566, "global_step": 453512, "epoch": 2699} {"train_loss": -12.83328628540039, "global_step": 453513, "epoch": 2699} {"train_loss": -12.534067153930664, "global_step": 453514, "epoch": 2699} {"train_loss": -12.759257316589355, "global_step": 453515, "epoch": 2699} {"train_loss": -12.815987586975098, "global_step": 453516, "epoch": 2699} {"train_loss": -12.683370590209961, "global_step": 453517, "epoch": 2699} {"train_loss": -12.794171333312988, "global_step": 453518, "epoch": 2699} {"train_loss": -12.393071174621582, "global_step": 453519, "epoch": 2699} {"train_loss": -11.727577209472656, "global_step": 453520, "epoch": 2699} {"train_loss": -12.011220932006836, "global_step": 453521, "epoch": 2699} {"train_loss": -12.497024536132812, "global_step": 453522, "epoch": 2699} {"train_loss": -12.725839614868164, "global_step": 453523, "epoch": 2699} {"train_loss": -12.502119064331055, "global_step": 453524, "epoch": 2699} {"train_loss": -11.75967788696289, "global_step": 453525, "epoch": 2699} {"train_loss": -12.265752792358398, "global_step": 453526, "epoch": 2699} {"train_loss": -12.259896278381348, "global_step": 453527, "epoch": 2699} {"train_loss": -11.699263572692871, "global_step": 453528, "epoch": 2699} {"train_loss": -12.384834289550781, "global_step": 453529, "epoch": 2699} {"train_loss": -11.594325065612793, "global_step": 453530, "epoch": 2699} {"train_loss": -12.233474731445312, "global_step": 453531, "epoch": 2699} {"train_loss": -11.436120986938477, "global_step": 453532, "epoch": 2699} {"train_loss": -10.351806640625, "global_step": 453533, "epoch": 2699} {"train_loss": -9.996602058410645, "global_step": 453534, "epoch": 2699} {"train_loss": -10.973859786987305, "global_step": 453535, "epoch": 2699} {"train_loss": -10.26557445526123, "global_step": 453536, "epoch": 2699} {"train_loss": -10.22525405883789, "global_step": 453537, "epoch": 2699} {"train_loss": -10.951072692871094, "global_step": 453538, "epoch": 2699} {"train_loss": -10.368785858154297, "global_step": 453539, "epoch": 2699} {"train_loss": -11.883492469787598, "global_step": 453540, "epoch": 2699} {"train_loss": -11.694328308105469, "global_step": 453541, "epoch": 2699} {"train_loss": -11.639252662658691, "global_step": 453542, "epoch": 2699} {"train_loss": -11.51382827758789, "global_step": 453543, "epoch": 2699} {"train_loss": -11.090494155883789, "global_step": 453544, "epoch": 2699} {"train_loss": -11.869294166564941, "global_step": 453545, "epoch": 2699} {"train_loss": -11.735124588012695, "global_step": 453546, "epoch": 2699} {"train_loss": -12.107128143310547, "global_step": 453547, "epoch": 2699} {"train_loss": -11.393516540527344, "global_step": 453548, "epoch": 2699} {"train_loss": -11.949729919433594, "global_step": 453549, "epoch": 2699} {"train_loss": -10.893004417419434, "global_step": 453550, "epoch": 2699} {"train_loss": -12.189925193786621, "global_step": 453551, "epoch": 2699} {"train_loss": -10.86623477935791, "global_step": 453552, "epoch": 2699} {"train_loss": -11.65185546875, "global_step": 453553, "epoch": 2699} {"train_loss": -11.70458984375, "global_step": 453554, "epoch": 2699} {"train_loss": -11.627853393554688, "global_step": 453555, "epoch": 2699} {"train_loss": -11.818512916564941, "global_step": 453556, "epoch": 2699} {"train_loss": -11.900264739990234, "global_step": 453557, "epoch": 2699} {"train_loss": -11.263284683227539, "global_step": 453558, "epoch": 2699} {"train_loss": -10.561264991760254, "global_step": 453559, "epoch": 2699} {"train_loss": -11.730332374572754, "global_step": 453560, "epoch": 2699} {"train_loss": -11.115897178649902, "global_step": 453561, "epoch": 2699} {"train_loss": -11.684280395507812, "global_step": 453562, "epoch": 2699} {"train_loss": -11.416236877441406, "global_step": 453563, "epoch": 2699} {"train_loss": -11.687155723571777, "global_step": 453564, "epoch": 2699} {"train_loss": -12.027338981628418, "global_step": 453565, "epoch": 2699} {"train_loss": -11.378171920776367, "global_step": 453566, "epoch": 2699} {"train_loss": -12.168277740478516, "global_step": 453567, "epoch": 2699} {"train_loss": -11.707672119140625, "global_step": 453568, "epoch": 2699} {"train_loss": -11.987691879272461, "global_step": 453569, "epoch": 2699} {"train_loss": -11.252294540405273, "global_step": 453570, "epoch": 2699} {"train_loss": -12.126056671142578, "global_step": 453571, "epoch": 2699} {"train_loss": -11.553155899047852, "global_step": 453572, "epoch": 2699} {"train_loss": -12.314191818237305, "global_step": 453573, "epoch": 2699} {"train_loss": -11.66061019897461, "global_step": 453574, "epoch": 2699} {"train_loss": -12.151893615722656, "global_step": 453575, "epoch": 2699} {"train_loss": -11.55398941040039, "global_step": 453576, "epoch": 2699} {"train_loss": -12.174428939819336, "global_step": 453577, "epoch": 2699} {"train_loss": -11.550760269165039, "global_step": 453578, "epoch": 2699} {"train_loss": -11.760845184326172, "global_step": 453579, "epoch": 2699} {"train_loss": -11.974128723144531, "global_step": 453580, "epoch": 2699} {"train_loss": -11.690589904785156, "global_step": 453581, "epoch": 2699} {"train_loss": -12.31350040435791, "global_step": 453582, "epoch": 2699} {"train_loss": -11.848320960998535, "global_step": 453583, "epoch": 2699} {"train_loss": -12.09063720703125, "global_step": 453584, "epoch": 2699} {"train_loss": -12.128907203674316, "global_step": 453585, "epoch": 2699} {"train_loss": -11.541421890258789, "global_step": 453586, "epoch": 2699} {"train_loss": -12.490738868713379, "global_step": 453587, "epoch": 2699} {"train_loss": -11.961379051208496, "global_step": 453588, "epoch": 2699} {"train_loss": -12.421324729919434, "global_step": 453589, "epoch": 2699} {"train_loss": -12.042142868041992, "global_step": 453590, "epoch": 2699} {"train_loss": -12.123039245605469, "global_step": 453591, "epoch": 2699} {"train_loss": -11.91702651977539, "global_step": 453592, "epoch": 2699} {"train_loss": -12.545976638793945, "global_step": 453593, "epoch": 2699} {"train_loss": -12.040300369262695, "global_step": 453594, "epoch": 2699} {"train_loss": -12.202869415283203, "global_step": 453595, "epoch": 2699} {"train_loss": -12.185169219970703, "global_step": 453596, "epoch": 2699} {"train_loss": -11.421621322631836, "global_step": 453597, "epoch": 2699} {"train_loss": -11.868926048278809, "global_step": 453598, "epoch": 2699} {"train_loss": -12.077872741790046, "global_step": 453599, "epoch": 2699, "val_loss": 312211.9375} {"train_loss": -10.763782501220703, "global_step": 453600, "epoch": 2700} {"train_loss": -12.194513320922852, "global_step": 453601, "epoch": 2700} {"train_loss": -10.983306884765625, "global_step": 453602, "epoch": 2700} {"train_loss": -11.88337230682373, "global_step": 453603, "epoch": 2700} {"train_loss": -9.875528335571289, "global_step": 453604, "epoch": 2700} {"train_loss": -11.346731185913086, "global_step": 453605, "epoch": 2700} {"train_loss": -8.959959030151367, "global_step": 453606, "epoch": 2700} {"train_loss": -10.980213165283203, "global_step": 453607, "epoch": 2700} {"train_loss": -9.378252983093262, "global_step": 453608, "epoch": 2700} {"train_loss": -10.762858390808105, "global_step": 453609, "epoch": 2700} {"train_loss": -10.418401718139648, "global_step": 453610, "epoch": 2700} {"train_loss": -10.883155822753906, "global_step": 453611, "epoch": 2700} {"train_loss": -11.670866012573242, "global_step": 453612, "epoch": 2700} {"train_loss": -11.360063552856445, "global_step": 453613, "epoch": 2700} {"train_loss": -11.62232780456543, "global_step": 453614, "epoch": 2700} {"train_loss": -11.232964515686035, "global_step": 453615, "epoch": 2700} {"train_loss": -12.27982234954834, "global_step": 453616, "epoch": 2700} {"train_loss": -11.887819290161133, "global_step": 453617, "epoch": 2700} {"train_loss": -11.423012733459473, "global_step": 453618, "epoch": 2700} {"train_loss": -11.54664421081543, "global_step": 453619, "epoch": 2700} {"train_loss": -11.350566864013672, "global_step": 453620, "epoch": 2700} {"train_loss": -11.668550491333008, "global_step": 453621, "epoch": 2700} {"train_loss": -12.099967002868652, "global_step": 453622, "epoch": 2700} {"train_loss": -11.700901985168457, "global_step": 453623, "epoch": 2700} {"train_loss": -11.892016410827637, "global_step": 453624, "epoch": 2700} {"train_loss": -11.78528881072998, "global_step": 453625, "epoch": 2700} {"train_loss": -11.774188041687012, "global_step": 453626, "epoch": 2700} {"train_loss": -12.07102108001709, "global_step": 453627, "epoch": 2700} {"train_loss": -11.64787483215332, "global_step": 453628, "epoch": 2700} {"train_loss": -11.998212814331055, "global_step": 453629, "epoch": 2700} {"train_loss": -12.07155990600586, "global_step": 453630, "epoch": 2700} {"train_loss": -11.978374481201172, "global_step": 453631, "epoch": 2700} {"train_loss": -12.200862884521484, "global_step": 453632, "epoch": 2700} {"train_loss": -11.791891098022461, "global_step": 453633, "epoch": 2700} {"train_loss": -12.061859130859375, "global_step": 453634, "epoch": 2700} {"train_loss": -12.155052185058594, "global_step": 453635, "epoch": 2700} {"train_loss": -11.984729766845703, "global_step": 453636, "epoch": 2700} {"train_loss": -12.406661987304688, "global_step": 453637, "epoch": 2700} {"train_loss": -11.882255554199219, "global_step": 453638, "epoch": 2700} {"train_loss": -12.184403419494629, "global_step": 453639, "epoch": 2700} {"train_loss": -12.423791885375977, "global_step": 453640, "epoch": 2700} {"train_loss": -12.100011825561523, "global_step": 453641, "epoch": 2700} {"train_loss": -12.387767791748047, "global_step": 453642, "epoch": 2700} {"train_loss": -12.488125801086426, "global_step": 453643, "epoch": 2700} {"train_loss": -12.462663650512695, "global_step": 453644, "epoch": 2700} {"train_loss": -12.672370910644531, "global_step": 453645, "epoch": 2700} {"train_loss": -12.382261276245117, "global_step": 453646, "epoch": 2700} {"train_loss": -12.551359176635742, "global_step": 453647, "epoch": 2700} {"train_loss": -12.357673645019531, "global_step": 453648, "epoch": 2700} {"train_loss": -12.460371017456055, "global_step": 453649, "epoch": 2700} {"train_loss": -12.55955696105957, "global_step": 453650, "epoch": 2700} {"train_loss": -12.360820770263672, "global_step": 453651, "epoch": 2700} {"train_loss": -12.568936347961426, "global_step": 453652, "epoch": 2700} {"train_loss": -12.495141983032227, "global_step": 453653, "epoch": 2700} {"train_loss": -12.441078186035156, "global_step": 453654, "epoch": 2700} {"train_loss": -12.651222229003906, "global_step": 453655, "epoch": 2700} {"train_loss": -12.51867389678955, "global_step": 453656, "epoch": 2700} {"train_loss": -12.575413703918457, "global_step": 453657, "epoch": 2700} {"train_loss": -12.509055137634277, "global_step": 453658, "epoch": 2700} {"train_loss": -12.61442756652832, "global_step": 453659, "epoch": 2700} {"train_loss": -12.271724700927734, "global_step": 453660, "epoch": 2700} {"train_loss": -12.732805252075195, "global_step": 453661, "epoch": 2700} {"train_loss": -12.621541976928711, "global_step": 453662, "epoch": 2700} {"train_loss": -12.663379669189453, "global_step": 453663, "epoch": 2700} {"train_loss": -12.672407150268555, "global_step": 453664, "epoch": 2700} {"train_loss": -12.741390228271484, "global_step": 453665, "epoch": 2700} {"train_loss": -12.7780122756958, "global_step": 453666, "epoch": 2700} {"train_loss": -12.671063423156738, "global_step": 453667, "epoch": 2700} {"train_loss": -12.559236526489258, "global_step": 453668, "epoch": 2700} {"train_loss": -12.314640045166016, "global_step": 453669, "epoch": 2700} {"train_loss": -12.7498779296875, "global_step": 453670, "epoch": 2700} {"train_loss": -12.941549301147461, "global_step": 453671, "epoch": 2700} {"train_loss": -12.649526596069336, "global_step": 453672, "epoch": 2700} {"train_loss": -12.731042861938477, "global_step": 453673, "epoch": 2700} {"train_loss": -12.82199764251709, "global_step": 453674, "epoch": 2700} {"train_loss": -12.723727226257324, "global_step": 453675, "epoch": 2700} {"train_loss": -12.779359817504883, "global_step": 453676, "epoch": 2700} {"train_loss": -12.658330917358398, "global_step": 453677, "epoch": 2700} {"train_loss": -12.938943862915039, "global_step": 453678, "epoch": 2700} {"train_loss": -12.664314270019531, "global_step": 453679, "epoch": 2700} {"train_loss": -12.806716918945312, "global_step": 453680, "epoch": 2700} {"train_loss": -12.558565139770508, "global_step": 453681, "epoch": 2700} {"train_loss": -12.806817054748535, "global_step": 453682, "epoch": 2700} {"train_loss": -12.723621368408203, "global_step": 453683, "epoch": 2700} {"train_loss": -12.507643699645996, "global_step": 453684, "epoch": 2700} {"train_loss": -12.897468566894531, "global_step": 453685, "epoch": 2700} {"train_loss": -12.458995819091797, "global_step": 453686, "epoch": 2700} {"train_loss": -12.649168014526367, "global_step": 453687, "epoch": 2700} {"train_loss": -12.753719329833984, "global_step": 453688, "epoch": 2700} {"train_loss": -12.178346633911133, "global_step": 453689, "epoch": 2700} {"train_loss": -12.60450553894043, "global_step": 453690, "epoch": 2700} {"train_loss": -11.944560050964355, "global_step": 453691, "epoch": 2700} {"train_loss": -12.218847274780273, "global_step": 453692, "epoch": 2700} {"train_loss": -12.227035522460938, "global_step": 453693, "epoch": 2700} {"train_loss": -12.602689743041992, "global_step": 453694, "epoch": 2700} {"train_loss": -12.185432434082031, "global_step": 453695, "epoch": 2700} {"train_loss": -12.455541610717773, "global_step": 453696, "epoch": 2700} {"train_loss": -12.546908378601074, "global_step": 453697, "epoch": 2700} {"train_loss": -12.534523010253906, "global_step": 453698, "epoch": 2700} {"train_loss": -12.470571517944336, "global_step": 453699, "epoch": 2700} {"train_loss": -12.374164581298828, "global_step": 453700, "epoch": 2700} {"train_loss": -12.380413055419922, "global_step": 453701, "epoch": 2700} {"train_loss": -12.501058578491211, "global_step": 453702, "epoch": 2700} {"train_loss": -12.699966430664062, "global_step": 453703, "epoch": 2700} {"train_loss": -12.140432357788086, "global_step": 453704, "epoch": 2700} {"train_loss": -12.674912452697754, "global_step": 453705, "epoch": 2700} {"train_loss": -12.69680404663086, "global_step": 453706, "epoch": 2700} {"train_loss": -12.343267440795898, "global_step": 453707, "epoch": 2700} {"train_loss": -12.520347595214844, "global_step": 453708, "epoch": 2700} {"train_loss": -12.13686752319336, "global_step": 453709, "epoch": 2700} {"train_loss": -12.85407829284668, "global_step": 453710, "epoch": 2700} {"train_loss": -12.415428161621094, "global_step": 453711, "epoch": 2700} {"train_loss": -12.604973793029785, "global_step": 453712, "epoch": 2700} {"train_loss": -12.633692741394043, "global_step": 453713, "epoch": 2700} {"train_loss": -12.477640151977539, "global_step": 453714, "epoch": 2700} {"train_loss": -12.121286392211914, "global_step": 453715, "epoch": 2700} {"train_loss": -12.264634132385254, "global_step": 453716, "epoch": 2700} {"train_loss": -12.489163398742676, "global_step": 453717, "epoch": 2700} {"train_loss": -12.298858642578125, "global_step": 453718, "epoch": 2700} {"train_loss": -12.65403938293457, "global_step": 453719, "epoch": 2700} {"train_loss": -12.224184036254883, "global_step": 453720, "epoch": 2700} {"train_loss": -12.580202102661133, "global_step": 453721, "epoch": 2700} {"train_loss": -12.456279754638672, "global_step": 453722, "epoch": 2700} {"train_loss": -12.145638465881348, "global_step": 453723, "epoch": 2700} {"train_loss": -12.160581588745117, "global_step": 453724, "epoch": 2700} {"train_loss": -12.363173484802246, "global_step": 453725, "epoch": 2700} {"train_loss": -12.695863723754883, "global_step": 453726, "epoch": 2700} {"train_loss": -12.326254844665527, "global_step": 453727, "epoch": 2700} {"train_loss": -12.513504028320312, "global_step": 453728, "epoch": 2700} {"train_loss": -12.693840026855469, "global_step": 453729, "epoch": 2700} {"train_loss": -12.404531478881836, "global_step": 453730, "epoch": 2700} {"train_loss": -12.588878631591797, "global_step": 453731, "epoch": 2700} {"train_loss": -12.345924377441406, "global_step": 453732, "epoch": 2700} {"train_loss": -12.559015274047852, "global_step": 453733, "epoch": 2700} {"train_loss": -12.869768142700195, "global_step": 453734, "epoch": 2700} {"train_loss": -12.547112464904785, "global_step": 453735, "epoch": 2700} {"train_loss": -12.986398696899414, "global_step": 453736, "epoch": 2700} {"train_loss": -12.34892463684082, "global_step": 453737, "epoch": 2700} {"train_loss": -12.580387115478516, "global_step": 453738, "epoch": 2700} {"train_loss": -12.613876342773438, "global_step": 453739, "epoch": 2700} {"train_loss": -12.630668640136719, "global_step": 453740, "epoch": 2700} {"train_loss": -12.805505752563477, "global_step": 453741, "epoch": 2700} {"train_loss": -12.67818832397461, "global_step": 453742, "epoch": 2700} {"train_loss": -12.388500213623047, "global_step": 453743, "epoch": 2700} {"train_loss": -12.645432472229004, "global_step": 453744, "epoch": 2700} {"train_loss": -12.59227466583252, "global_step": 453745, "epoch": 2700} {"train_loss": -12.479723930358887, "global_step": 453746, "epoch": 2700} {"train_loss": -12.632293701171875, "global_step": 453747, "epoch": 2700} {"train_loss": -12.810117721557617, "global_step": 453748, "epoch": 2700} {"train_loss": -12.577648162841797, "global_step": 453749, "epoch": 2700} {"train_loss": -12.283933639526367, "global_step": 453750, "epoch": 2700} {"train_loss": -12.670018196105957, "global_step": 453751, "epoch": 2700} {"train_loss": -12.750524520874023, "global_step": 453752, "epoch": 2700} {"train_loss": -12.664413452148438, "global_step": 453753, "epoch": 2700} {"train_loss": -12.885887145996094, "global_step": 453754, "epoch": 2700} {"train_loss": -12.609903335571289, "global_step": 453755, "epoch": 2700} {"train_loss": -12.58469009399414, "global_step": 453756, "epoch": 2700} {"train_loss": -12.543275833129883, "global_step": 453757, "epoch": 2700} {"train_loss": -12.637584686279297, "global_step": 453758, "epoch": 2700} {"train_loss": -12.540241241455078, "global_step": 453759, "epoch": 2700} {"train_loss": -11.91062068939209, "global_step": 453760, "epoch": 2700} {"train_loss": -11.093589782714844, "global_step": 453761, "epoch": 2700} {"train_loss": -12.836280822753906, "global_step": 453762, "epoch": 2700} {"train_loss": -10.907970428466797, "global_step": 453763, "epoch": 2700} {"train_loss": -10.64790153503418, "global_step": 453764, "epoch": 2700} {"train_loss": -12.423423767089844, "global_step": 453765, "epoch": 2700} {"train_loss": -10.929349899291992, "global_step": 453766, "epoch": 2700} {"train_loss": -12.239519136292595, "global_step": 453767, "epoch": 2700, "train/sim_max_reward_0": 0.6916452758798064, "train/sim_max_reward_1": 0.9739591707601848, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.18039375080601233, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.5386345209693093, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.39758876759724815, "test/sim_max_reward_4400002": 0.20019946833244354, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.5078275375675384, "test/sim_max_reward_4400005": 0.9616077115160574, "test/sim_max_reward_4400006": 0.9383806389331221, "test/sim_max_reward_4400007": 0.547722111087503, "test/sim_max_reward_4400008": 0.619665550395375, "test/sim_max_reward_4400009": 0.03500506192459271, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 0.3358764655711159, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 0.7090256856989867, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.08045226365117034, "test/sim_max_reward_4400018": 0.9881134772300277, "test/sim_max_reward_4400019": 0.6283415043821722, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.9278645541823518, "test/sim_max_reward_4400022": 0.9960512639454896, "test/sim_max_reward_4400023": 0.13776260824450076, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.523214516395814, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.42967268118364643, "test/sim_max_reward_4400028": 0.7226338422691687, "test/sim_max_reward_4400029": 0.9742989095913546, "test/sim_max_reward_4400030": 0.9681933495880967, "test/sim_max_reward_4400031": 0.9468397548650782, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 1.0, "test/sim_max_reward_4400034": 1.0, "test/sim_max_reward_4400035": 0.41733266231670585, "test/sim_max_reward_4400036": 0.3617076861119238, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.0, "test/sim_max_reward_4400039": 1.0, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.18226000321311261, "test/sim_max_reward_4400042": 0.4390551574798449, "test/sim_max_reward_4400043": 0.3159550664314296, "test/sim_max_reward_4400044": 0.29767619203909546, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.9741848892492186, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.33197082393089794, "train/mean_score": 0.5641054530692188, "test/mean_score": 0.5779338126106282, "val_loss": 316590.96875, "train_action_mse_error": 1.5915350914001465} {"train_loss": -10.009361267089844, "global_step": 453768, "epoch": 2701} {"train_loss": -9.803461074829102, "global_step": 453769, "epoch": 2701} {"train_loss": -10.709382057189941, "global_step": 453770, "epoch": 2701} {"train_loss": -9.631433486938477, "global_step": 453771, "epoch": 2701} {"train_loss": -9.970348358154297, "global_step": 453772, "epoch": 2701} {"train_loss": -11.983014106750488, "global_step": 453773, "epoch": 2701} {"train_loss": -10.151927947998047, "global_step": 453774, "epoch": 2701} {"train_loss": -10.673893928527832, "global_step": 453775, "epoch": 2701} {"train_loss": -8.62891960144043, "global_step": 453776, "epoch": 2701} {"train_loss": -8.550249099731445, "global_step": 453777, "epoch": 2701} {"train_loss": -9.745962142944336, "global_step": 453778, "epoch": 2701} {"train_loss": -11.332927703857422, "global_step": 453779, "epoch": 2701} {"train_loss": -8.143841743469238, "global_step": 453780, "epoch": 2701} {"train_loss": -9.28500747680664, "global_step": 453781, "epoch": 2701} {"train_loss": -9.48183822631836, "global_step": 453782, "epoch": 2701} {"train_loss": -10.432367324829102, "global_step": 453783, "epoch": 2701} {"train_loss": -9.948800086975098, "global_step": 453784, "epoch": 2701} {"train_loss": -10.162092208862305, "global_step": 453785, "epoch": 2701} {"train_loss": -9.961687088012695, "global_step": 453786, "epoch": 2701} {"train_loss": -9.628504753112793, "global_step": 453787, "epoch": 2701} {"train_loss": -9.598045349121094, "global_step": 453788, "epoch": 2701} {"train_loss": -9.853728294372559, "global_step": 453789, "epoch": 2701} {"train_loss": -9.13210391998291, "global_step": 453790, "epoch": 2701} {"train_loss": -9.191436767578125, "global_step": 453791, "epoch": 2701} {"train_loss": -10.078733444213867, "global_step": 453792, "epoch": 2701} {"train_loss": -9.99476432800293, "global_step": 453793, "epoch": 2701} {"train_loss": -10.719976425170898, "global_step": 453794, "epoch": 2701} {"train_loss": -9.242853164672852, "global_step": 453795, "epoch": 2701} {"train_loss": -9.66744613647461, "global_step": 453796, "epoch": 2701} {"train_loss": -11.596162796020508, "global_step": 453797, "epoch": 2701} {"train_loss": -10.623096466064453, "global_step": 453798, "epoch": 2701} {"train_loss": -10.261061668395996, "global_step": 453799, "epoch": 2701} {"train_loss": -11.229506492614746, "global_step": 453800, "epoch": 2701} {"train_loss": -10.58746337890625, "global_step": 453801, "epoch": 2701} {"train_loss": -11.213260650634766, "global_step": 453802, "epoch": 2701} {"train_loss": -10.869598388671875, "global_step": 453803, "epoch": 2701} {"train_loss": -11.156584739685059, "global_step": 453804, "epoch": 2701} {"train_loss": -11.684417724609375, "global_step": 453805, "epoch": 2701} {"train_loss": -11.619071960449219, "global_step": 453806, "epoch": 2701} {"train_loss": -11.518909454345703, "global_step": 453807, "epoch": 2701} {"train_loss": -11.222003936767578, "global_step": 453808, "epoch": 2701} {"train_loss": -11.778999328613281, "global_step": 453809, "epoch": 2701} {"train_loss": -11.529191017150879, "global_step": 453810, "epoch": 2701} {"train_loss": -11.328903198242188, "global_step": 453811, "epoch": 2701} {"train_loss": -12.026439666748047, "global_step": 453812, "epoch": 2701} {"train_loss": -12.107391357421875, "global_step": 453813, "epoch": 2701} {"train_loss": -11.427389144897461, "global_step": 453814, "epoch": 2701} {"train_loss": -12.02697467803955, "global_step": 453815, "epoch": 2701} {"train_loss": -11.791364669799805, "global_step": 453816, "epoch": 2701} {"train_loss": -11.962218284606934, "global_step": 453817, "epoch": 2701} {"train_loss": -11.999439239501953, "global_step": 453818, "epoch": 2701} {"train_loss": -12.018850326538086, "global_step": 453819, "epoch": 2701} {"train_loss": -12.25369644165039, "global_step": 453820, "epoch": 2701} {"train_loss": -11.91015338897705, "global_step": 453821, "epoch": 2701} {"train_loss": -11.659209251403809, "global_step": 453822, "epoch": 2701} {"train_loss": -12.003460884094238, "global_step": 453823, "epoch": 2701} {"train_loss": -11.871053695678711, "global_step": 453824, "epoch": 2701} {"train_loss": -12.273520469665527, "global_step": 453825, "epoch": 2701} {"train_loss": -12.258384704589844, "global_step": 453826, "epoch": 2701} {"train_loss": -12.072633743286133, "global_step": 453827, "epoch": 2701} {"train_loss": -12.345412254333496, "global_step": 453828, "epoch": 2701} {"train_loss": -12.271078109741211, "global_step": 453829, "epoch": 2701} {"train_loss": -12.091078758239746, "global_step": 453830, "epoch": 2701} {"train_loss": -12.304045677185059, "global_step": 453831, "epoch": 2701} {"train_loss": -12.013814926147461, "global_step": 453832, "epoch": 2701} {"train_loss": -12.341514587402344, "global_step": 453833, "epoch": 2701} {"train_loss": -12.474649429321289, "global_step": 453834, "epoch": 2701} {"train_loss": -12.375551223754883, "global_step": 453835, "epoch": 2701} {"train_loss": -12.442700386047363, "global_step": 453836, "epoch": 2701} {"train_loss": -12.321723937988281, "global_step": 453837, "epoch": 2701} {"train_loss": -12.585837364196777, "global_step": 453838, "epoch": 2701} {"train_loss": -12.540843963623047, "global_step": 453839, "epoch": 2701} {"train_loss": -12.371088981628418, "global_step": 453840, "epoch": 2701} {"train_loss": -12.193314552307129, "global_step": 453841, "epoch": 2701} {"train_loss": -12.315328598022461, "global_step": 453842, "epoch": 2701} {"train_loss": -12.260944366455078, "global_step": 453843, "epoch": 2701} {"train_loss": -12.293241500854492, "global_step": 453844, "epoch": 2701} {"train_loss": -12.48550796508789, "global_step": 453845, "epoch": 2701} {"train_loss": -12.169356346130371, "global_step": 453846, "epoch": 2701} {"train_loss": -12.481544494628906, "global_step": 453847, "epoch": 2701} {"train_loss": -12.358853340148926, "global_step": 453848, "epoch": 2701} {"train_loss": -12.301985740661621, "global_step": 453849, "epoch": 2701} {"train_loss": -12.581979751586914, "global_step": 453850, "epoch": 2701} {"train_loss": -12.341442108154297, "global_step": 453851, "epoch": 2701} {"train_loss": -12.495113372802734, "global_step": 453852, "epoch": 2701} {"train_loss": -12.400444030761719, "global_step": 453853, "epoch": 2701} {"train_loss": -12.667972564697266, "global_step": 453854, "epoch": 2701} {"train_loss": -12.166751861572266, "global_step": 453855, "epoch": 2701} {"train_loss": -12.63102912902832, "global_step": 453856, "epoch": 2701} {"train_loss": -12.44088077545166, "global_step": 453857, "epoch": 2701} {"train_loss": -12.431609153747559, "global_step": 453858, "epoch": 2701} {"train_loss": -12.5947904586792, "global_step": 453859, "epoch": 2701} {"train_loss": -12.043291091918945, "global_step": 453860, "epoch": 2701} {"train_loss": -12.447853088378906, "global_step": 453861, "epoch": 2701} {"train_loss": -12.36370849609375, "global_step": 453862, "epoch": 2701} {"train_loss": -11.819318771362305, "global_step": 453863, "epoch": 2701} {"train_loss": -12.503173828125, "global_step": 453864, "epoch": 2701} {"train_loss": -12.139833450317383, "global_step": 453865, "epoch": 2701} {"train_loss": -11.774431228637695, "global_step": 453866, "epoch": 2701} {"train_loss": -12.623234748840332, "global_step": 453867, "epoch": 2701} {"train_loss": -11.480880737304688, "global_step": 453868, "epoch": 2701} {"train_loss": -12.387374877929688, "global_step": 453869, "epoch": 2701} {"train_loss": -12.330570220947266, "global_step": 453870, "epoch": 2701} {"train_loss": -11.03045654296875, "global_step": 453871, "epoch": 2701} {"train_loss": -12.001802444458008, "global_step": 453872, "epoch": 2701} {"train_loss": -12.486085891723633, "global_step": 453873, "epoch": 2701} {"train_loss": -12.36919116973877, "global_step": 453874, "epoch": 2701} {"train_loss": -12.00773811340332, "global_step": 453875, "epoch": 2701} {"train_loss": -11.567361831665039, "global_step": 453876, "epoch": 2701} {"train_loss": -11.14777660369873, "global_step": 453877, "epoch": 2701} {"train_loss": -12.076560974121094, "global_step": 453878, "epoch": 2701} {"train_loss": -10.43582534790039, "global_step": 453879, "epoch": 2701} {"train_loss": -12.387992858886719, "global_step": 453880, "epoch": 2701} {"train_loss": -10.152620315551758, "global_step": 453881, "epoch": 2701} {"train_loss": -10.997928619384766, "global_step": 453882, "epoch": 2701} {"train_loss": -11.924810409545898, "global_step": 453883, "epoch": 2701} {"train_loss": -9.942609786987305, "global_step": 453884, "epoch": 2701} {"train_loss": -11.464067459106445, "global_step": 453885, "epoch": 2701} {"train_loss": -11.247933387756348, "global_step": 453886, "epoch": 2701} {"train_loss": -11.731464385986328, "global_step": 453887, "epoch": 2701} {"train_loss": -12.013076782226562, "global_step": 453888, "epoch": 2701} {"train_loss": -11.515661239624023, "global_step": 453889, "epoch": 2701} {"train_loss": -12.200420379638672, "global_step": 453890, "epoch": 2701} {"train_loss": -11.797054290771484, "global_step": 453891, "epoch": 2701} {"train_loss": -12.137250900268555, "global_step": 453892, "epoch": 2701} {"train_loss": -12.544612884521484, "global_step": 453893, "epoch": 2701} {"train_loss": -11.983715057373047, "global_step": 453894, "epoch": 2701} {"train_loss": -12.244750022888184, "global_step": 453895, "epoch": 2701} {"train_loss": -12.364964485168457, "global_step": 453896, "epoch": 2701} {"train_loss": -12.15252685546875, "global_step": 453897, "epoch": 2701} {"train_loss": -12.544670104980469, "global_step": 453898, "epoch": 2701} {"train_loss": -12.183372497558594, "global_step": 453899, "epoch": 2701} {"train_loss": -12.25869369506836, "global_step": 453900, "epoch": 2701} {"train_loss": -12.35676097869873, "global_step": 453901, "epoch": 2701} {"train_loss": -12.289891242980957, "global_step": 453902, "epoch": 2701} {"train_loss": -12.362627029418945, "global_step": 453903, "epoch": 2701} {"train_loss": -12.341907501220703, "global_step": 453904, "epoch": 2701} {"train_loss": -12.136959075927734, "global_step": 453905, "epoch": 2701} {"train_loss": -12.385164260864258, "global_step": 453906, "epoch": 2701} {"train_loss": -12.148245811462402, "global_step": 453907, "epoch": 2701} {"train_loss": -12.558736801147461, "global_step": 453908, "epoch": 2701} {"train_loss": -11.717239379882812, "global_step": 453909, "epoch": 2701} {"train_loss": -12.443061828613281, "global_step": 453910, "epoch": 2701} {"train_loss": -11.905500411987305, "global_step": 453911, "epoch": 2701} {"train_loss": -12.158615112304688, "global_step": 453912, "epoch": 2701} {"train_loss": -12.318495750427246, "global_step": 453913, "epoch": 2701} {"train_loss": -12.432064056396484, "global_step": 453914, "epoch": 2701} {"train_loss": -12.590736389160156, "global_step": 453915, "epoch": 2701} {"train_loss": -12.520647048950195, "global_step": 453916, "epoch": 2701} {"train_loss": -12.484773635864258, "global_step": 453917, "epoch": 2701} {"train_loss": -12.582778930664062, "global_step": 453918, "epoch": 2701} {"train_loss": -12.549174308776855, "global_step": 453919, "epoch": 2701} {"train_loss": -12.704031944274902, "global_step": 453920, "epoch": 2701} {"train_loss": -12.48331069946289, "global_step": 453921, "epoch": 2701} {"train_loss": -12.716093063354492, "global_step": 453922, "epoch": 2701} {"train_loss": -12.669614791870117, "global_step": 453923, "epoch": 2701} {"train_loss": -12.477062225341797, "global_step": 453924, "epoch": 2701} {"train_loss": -12.560579299926758, "global_step": 453925, "epoch": 2701} {"train_loss": -12.736696243286133, "global_step": 453926, "epoch": 2701} {"train_loss": -12.673334121704102, "global_step": 453927, "epoch": 2701} {"train_loss": -12.556305885314941, "global_step": 453928, "epoch": 2701} {"train_loss": -12.70508098602295, "global_step": 453929, "epoch": 2701} {"train_loss": -12.697402954101562, "global_step": 453930, "epoch": 2701} {"train_loss": -12.630501747131348, "global_step": 453931, "epoch": 2701} {"train_loss": -12.933578491210938, "global_step": 453932, "epoch": 2701} {"train_loss": -12.33011245727539, "global_step": 453933, "epoch": 2701} {"train_loss": -12.760974884033203, "global_step": 453934, "epoch": 2701} {"train_loss": -11.697259937013898, "global_step": 453935, "epoch": 2701, "val_loss": 315374.6875} {"train_loss": -12.587275505065918, "global_step": 453936, "epoch": 2702} {"train_loss": -12.404478073120117, "global_step": 453937, "epoch": 2702} {"train_loss": -12.413219451904297, "global_step": 453938, "epoch": 2702} {"train_loss": -12.540396690368652, "global_step": 453939, "epoch": 2702} {"train_loss": -12.654088973999023, "global_step": 453940, "epoch": 2702} {"train_loss": -12.306726455688477, "global_step": 453941, "epoch": 2702} {"train_loss": -12.609694480895996, "global_step": 453942, "epoch": 2702} {"train_loss": -12.825550079345703, "global_step": 453943, "epoch": 2702} {"train_loss": -12.787964820861816, "global_step": 453944, "epoch": 2702} {"train_loss": -12.516575813293457, "global_step": 453945, "epoch": 2702} {"train_loss": -12.709647178649902, "global_step": 453946, "epoch": 2702} {"train_loss": -12.85249137878418, "global_step": 453947, "epoch": 2702} {"train_loss": -12.683271408081055, "global_step": 453948, "epoch": 2702} {"train_loss": -12.492314338684082, "global_step": 453949, "epoch": 2702} {"train_loss": -12.534485816955566, "global_step": 453950, "epoch": 2702} {"train_loss": -12.846954345703125, "global_step": 453951, "epoch": 2702} {"train_loss": -12.713581085205078, "global_step": 453952, "epoch": 2702} {"train_loss": -12.198965072631836, "global_step": 453953, "epoch": 2702} {"train_loss": -12.921981811523438, "global_step": 453954, "epoch": 2702} {"train_loss": -12.76335334777832, "global_step": 453955, "epoch": 2702} {"train_loss": -12.238753318786621, "global_step": 453956, "epoch": 2702} {"train_loss": -12.334066390991211, "global_step": 453957, "epoch": 2702} {"train_loss": -12.557441711425781, "global_step": 453958, "epoch": 2702} {"train_loss": -12.540200233459473, "global_step": 453959, "epoch": 2702} {"train_loss": -12.554140090942383, "global_step": 453960, "epoch": 2702} {"train_loss": -12.815522193908691, "global_step": 453961, "epoch": 2702} {"train_loss": -12.75473690032959, "global_step": 453962, "epoch": 2702} {"train_loss": -12.809103965759277, "global_step": 453963, "epoch": 2702} {"train_loss": -12.531281471252441, "global_step": 453964, "epoch": 2702} {"train_loss": -12.869467735290527, "global_step": 453965, "epoch": 2702} {"train_loss": -12.59054946899414, "global_step": 453966, "epoch": 2702} {"train_loss": -12.749554634094238, "global_step": 453967, "epoch": 2702} {"train_loss": -12.41331958770752, "global_step": 453968, "epoch": 2702} {"train_loss": -12.777050971984863, "global_step": 453969, "epoch": 2702} {"train_loss": -12.881111145019531, "global_step": 453970, "epoch": 2702} {"train_loss": -12.892888069152832, "global_step": 453971, "epoch": 2702} {"train_loss": -12.538562774658203, "global_step": 453972, "epoch": 2702} {"train_loss": -12.685157775878906, "global_step": 453973, "epoch": 2702} {"train_loss": -12.857852935791016, "global_step": 453974, "epoch": 2702} {"train_loss": -12.341268539428711, "global_step": 453975, "epoch": 2702} {"train_loss": -12.699090957641602, "global_step": 453976, "epoch": 2702} {"train_loss": -12.972352981567383, "global_step": 453977, "epoch": 2702} {"train_loss": -12.705850601196289, "global_step": 453978, "epoch": 2702} {"train_loss": -12.28802490234375, "global_step": 453979, "epoch": 2702} {"train_loss": -12.778255462646484, "global_step": 453980, "epoch": 2702} {"train_loss": -12.806035041809082, "global_step": 453981, "epoch": 2702} {"train_loss": -12.360372543334961, "global_step": 453982, "epoch": 2702} {"train_loss": -12.029934883117676, "global_step": 453983, "epoch": 2702} {"train_loss": -11.808806419372559, "global_step": 453984, "epoch": 2702} {"train_loss": -12.367828369140625, "global_step": 453985, "epoch": 2702} {"train_loss": -12.67176628112793, "global_step": 453986, "epoch": 2702} {"train_loss": -12.785486221313477, "global_step": 453987, "epoch": 2702} {"train_loss": -12.788763999938965, "global_step": 453988, "epoch": 2702} {"train_loss": -12.805877685546875, "global_step": 453989, "epoch": 2702} {"train_loss": -12.09759521484375, "global_step": 453990, "epoch": 2702} {"train_loss": -12.271621704101562, "global_step": 453991, "epoch": 2702} {"train_loss": -12.279336929321289, "global_step": 453992, "epoch": 2702} {"train_loss": -12.665138244628906, "global_step": 453993, "epoch": 2702} {"train_loss": -12.310586929321289, "global_step": 453994, "epoch": 2702} {"train_loss": -12.25831127166748, "global_step": 453995, "epoch": 2702} {"train_loss": -12.095209121704102, "global_step": 453996, "epoch": 2702} {"train_loss": -12.319416999816895, "global_step": 453997, "epoch": 2702} {"train_loss": -11.864048957824707, "global_step": 453998, "epoch": 2702} {"train_loss": -12.289586067199707, "global_step": 453999, "epoch": 2702} {"train_loss": -11.717065811157227, "global_step": 454000, "epoch": 2702} {"train_loss": -12.177751541137695, "global_step": 454001, "epoch": 2702} {"train_loss": -11.821100234985352, "global_step": 454002, "epoch": 2702} {"train_loss": -12.247936248779297, "global_step": 454003, "epoch": 2702} {"train_loss": -12.218353271484375, "global_step": 454004, "epoch": 2702} {"train_loss": -11.486003875732422, "global_step": 454005, "epoch": 2702} {"train_loss": -11.688212394714355, "global_step": 454006, "epoch": 2702} {"train_loss": -12.205791473388672, "global_step": 454007, "epoch": 2702} {"train_loss": -12.162732124328613, "global_step": 454008, "epoch": 2702} {"train_loss": -10.825889587402344, "global_step": 454009, "epoch": 2702} {"train_loss": -11.520999908447266, "global_step": 454010, "epoch": 2702} {"train_loss": -10.65024185180664, "global_step": 454011, "epoch": 2702} {"train_loss": -11.44517993927002, "global_step": 454012, "epoch": 2702} {"train_loss": -11.620176315307617, "global_step": 454013, "epoch": 2702} {"train_loss": -8.7893648147583, "global_step": 454014, "epoch": 2702} {"train_loss": -9.28803825378418, "global_step": 454015, "epoch": 2702} {"train_loss": -9.340063095092773, "global_step": 454016, "epoch": 2702} {"train_loss": -9.707595825195312, "global_step": 454017, "epoch": 2702} {"train_loss": -9.377495765686035, "global_step": 454018, "epoch": 2702} {"train_loss": -10.589067459106445, "global_step": 454019, "epoch": 2702} {"train_loss": -9.615468978881836, "global_step": 454020, "epoch": 2702} {"train_loss": -9.59292984008789, "global_step": 454021, "epoch": 2702} {"train_loss": -9.729998588562012, "global_step": 454022, "epoch": 2702} {"train_loss": -9.03227424621582, "global_step": 454023, "epoch": 2702} {"train_loss": -7.800828456878662, "global_step": 454024, "epoch": 2702} {"train_loss": -8.947019577026367, "global_step": 454025, "epoch": 2702} {"train_loss": -9.120168685913086, "global_step": 454026, "epoch": 2702} {"train_loss": -10.330693244934082, "global_step": 454027, "epoch": 2702} {"train_loss": -8.998326301574707, "global_step": 454028, "epoch": 2702} {"train_loss": -9.005799293518066, "global_step": 454029, "epoch": 2702} {"train_loss": -10.834315299987793, "global_step": 454030, "epoch": 2702} {"train_loss": -10.276264190673828, "global_step": 454031, "epoch": 2702} {"train_loss": -10.608479499816895, "global_step": 454032, "epoch": 2702} {"train_loss": -10.95848274230957, "global_step": 454033, "epoch": 2702} {"train_loss": -10.589614868164062, "global_step": 454034, "epoch": 2702} {"train_loss": -11.7513427734375, "global_step": 454035, "epoch": 2702} {"train_loss": -11.32742977142334, "global_step": 454036, "epoch": 2702} {"train_loss": -11.373214721679688, "global_step": 454037, "epoch": 2702} {"train_loss": -11.308417320251465, "global_step": 454038, "epoch": 2702} {"train_loss": -11.193111419677734, "global_step": 454039, "epoch": 2702} {"train_loss": -11.74703311920166, "global_step": 454040, "epoch": 2702} {"train_loss": -11.272786140441895, "global_step": 454041, "epoch": 2702} {"train_loss": -11.607061386108398, "global_step": 454042, "epoch": 2702} {"train_loss": -11.551826477050781, "global_step": 454043, "epoch": 2702} {"train_loss": -12.137381553649902, "global_step": 454044, "epoch": 2702} {"train_loss": -11.493725776672363, "global_step": 454045, "epoch": 2702} {"train_loss": -11.794553756713867, "global_step": 454046, "epoch": 2702} {"train_loss": -11.971027374267578, "global_step": 454047, "epoch": 2702} {"train_loss": -11.897974014282227, "global_step": 454048, "epoch": 2702} {"train_loss": -11.688658714294434, "global_step": 454049, "epoch": 2702} {"train_loss": -12.175935745239258, "global_step": 454050, "epoch": 2702} {"train_loss": -12.148695945739746, "global_step": 454051, "epoch": 2702} {"train_loss": -11.718488693237305, "global_step": 454052, "epoch": 2702} {"train_loss": -12.269699096679688, "global_step": 454053, "epoch": 2702} {"train_loss": -12.389219284057617, "global_step": 454054, "epoch": 2702} {"train_loss": -12.270447731018066, "global_step": 454055, "epoch": 2702} {"train_loss": -12.295774459838867, "global_step": 454056, "epoch": 2702} {"train_loss": -12.299505233764648, "global_step": 454057, "epoch": 2702} {"train_loss": -12.275947570800781, "global_step": 454058, "epoch": 2702} {"train_loss": -12.380165100097656, "global_step": 454059, "epoch": 2702} {"train_loss": -12.475607872009277, "global_step": 454060, "epoch": 2702} {"train_loss": -12.364923477172852, "global_step": 454061, "epoch": 2702} {"train_loss": -12.515422821044922, "global_step": 454062, "epoch": 2702} {"train_loss": -12.267264366149902, "global_step": 454063, "epoch": 2702} {"train_loss": -12.208490371704102, "global_step": 454064, "epoch": 2702} {"train_loss": -12.070819854736328, "global_step": 454065, "epoch": 2702} {"train_loss": -12.232779502868652, "global_step": 454066, "epoch": 2702} {"train_loss": -12.392268180847168, "global_step": 454067, "epoch": 2702} {"train_loss": -12.365010261535645, "global_step": 454068, "epoch": 2702} {"train_loss": -12.289312362670898, "global_step": 454069, "epoch": 2702} {"train_loss": -12.163461685180664, "global_step": 454070, "epoch": 2702} {"train_loss": -12.469679832458496, "global_step": 454071, "epoch": 2702} {"train_loss": -11.968072891235352, "global_step": 454072, "epoch": 2702} {"train_loss": -12.284492492675781, "global_step": 454073, "epoch": 2702} {"train_loss": -12.531196594238281, "global_step": 454074, "epoch": 2702} {"train_loss": -11.869621276855469, "global_step": 454075, "epoch": 2702} {"train_loss": -12.575504302978516, "global_step": 454076, "epoch": 2702} {"train_loss": -12.317342758178711, "global_step": 454077, "epoch": 2702} {"train_loss": -12.200714111328125, "global_step": 454078, "epoch": 2702} {"train_loss": -12.432233810424805, "global_step": 454079, "epoch": 2702} {"train_loss": -12.771634101867676, "global_step": 454080, "epoch": 2702} {"train_loss": -12.73205852508545, "global_step": 454081, "epoch": 2702} {"train_loss": -12.304319381713867, "global_step": 454082, "epoch": 2702} {"train_loss": -12.734210968017578, "global_step": 454083, "epoch": 2702} {"train_loss": -12.509790420532227, "global_step": 454084, "epoch": 2702} {"train_loss": -12.424219131469727, "global_step": 454085, "epoch": 2702} {"train_loss": -12.731610298156738, "global_step": 454086, "epoch": 2702} {"train_loss": -12.567392349243164, "global_step": 454087, "epoch": 2702} {"train_loss": -12.516185760498047, "global_step": 454088, "epoch": 2702} {"train_loss": -12.770827293395996, "global_step": 454089, "epoch": 2702} {"train_loss": -12.498345375061035, "global_step": 454090, "epoch": 2702} {"train_loss": -12.70289421081543, "global_step": 454091, "epoch": 2702} {"train_loss": -12.436016082763672, "global_step": 454092, "epoch": 2702} {"train_loss": -12.623529434204102, "global_step": 454093, "epoch": 2702} {"train_loss": -12.626431465148926, "global_step": 454094, "epoch": 2702} {"train_loss": -12.654870986938477, "global_step": 454095, "epoch": 2702} {"train_loss": -12.534357070922852, "global_step": 454096, "epoch": 2702} {"train_loss": -12.781636238098145, "global_step": 454097, "epoch": 2702} {"train_loss": -12.760347366333008, "global_step": 454098, "epoch": 2702} {"train_loss": -12.678045272827148, "global_step": 454099, "epoch": 2702} {"train_loss": -12.714205741882324, "global_step": 454100, "epoch": 2702} {"train_loss": -12.50184154510498, "global_step": 454101, "epoch": 2702} {"train_loss": -12.59514045715332, "global_step": 454102, "epoch": 2702} {"train_loss": -11.994168522812071, "global_step": 454103, "epoch": 2702, "val_loss": 313772.5625} {"train_loss": -12.191776275634766, "global_step": 454104, "epoch": 2703} {"train_loss": -12.604828834533691, "global_step": 454105, "epoch": 2703} {"train_loss": -12.751289367675781, "global_step": 454106, "epoch": 2703} {"train_loss": -12.545251846313477, "global_step": 454107, "epoch": 2703} {"train_loss": -12.449935913085938, "global_step": 454108, "epoch": 2703} {"train_loss": -12.701244354248047, "global_step": 454109, "epoch": 2703} {"train_loss": -12.841289520263672, "global_step": 454110, "epoch": 2703} {"train_loss": -12.592984199523926, "global_step": 454111, "epoch": 2703} {"train_loss": -12.530202865600586, "global_step": 454112, "epoch": 2703} {"train_loss": -12.913885116577148, "global_step": 454113, "epoch": 2703} {"train_loss": -12.782509803771973, "global_step": 454114, "epoch": 2703} {"train_loss": -12.744854927062988, "global_step": 454115, "epoch": 2703} {"train_loss": -12.727373123168945, "global_step": 454116, "epoch": 2703} {"train_loss": -12.667744636535645, "global_step": 454117, "epoch": 2703} {"train_loss": -12.297523498535156, "global_step": 454118, "epoch": 2703} {"train_loss": -12.779833793640137, "global_step": 454119, "epoch": 2703} {"train_loss": -12.16291332244873, "global_step": 454120, "epoch": 2703} {"train_loss": -11.771514892578125, "global_step": 454121, "epoch": 2703} {"train_loss": -12.178306579589844, "global_step": 454122, "epoch": 2703} {"train_loss": -12.597299575805664, "global_step": 454123, "epoch": 2703} {"train_loss": -12.543659210205078, "global_step": 454124, "epoch": 2703} {"train_loss": -12.442472457885742, "global_step": 454125, "epoch": 2703} {"train_loss": -12.669705390930176, "global_step": 454126, "epoch": 2703} {"train_loss": -11.585697174072266, "global_step": 454127, "epoch": 2703} {"train_loss": -12.180233001708984, "global_step": 454128, "epoch": 2703} {"train_loss": -12.719005584716797, "global_step": 454129, "epoch": 2703} {"train_loss": -12.500011444091797, "global_step": 454130, "epoch": 2703} {"train_loss": -12.433185577392578, "global_step": 454131, "epoch": 2703} {"train_loss": -12.524353981018066, "global_step": 454132, "epoch": 2703} {"train_loss": -12.506122589111328, "global_step": 454133, "epoch": 2703} {"train_loss": -12.4572114944458, "global_step": 454134, "epoch": 2703} {"train_loss": -12.281620025634766, "global_step": 454135, "epoch": 2703} {"train_loss": -12.072181701660156, "global_step": 454136, "epoch": 2703} {"train_loss": -12.497605323791504, "global_step": 454137, "epoch": 2703} {"train_loss": -12.335516929626465, "global_step": 454138, "epoch": 2703} {"train_loss": -12.325006484985352, "global_step": 454139, "epoch": 2703} {"train_loss": -12.483261108398438, "global_step": 454140, "epoch": 2703} {"train_loss": -12.212923049926758, "global_step": 454141, "epoch": 2703} {"train_loss": -12.26275634765625, "global_step": 454142, "epoch": 2703} {"train_loss": -12.453083038330078, "global_step": 454143, "epoch": 2703} {"train_loss": -12.352418899536133, "global_step": 454144, "epoch": 2703} {"train_loss": -12.755130767822266, "global_step": 454145, "epoch": 2703} {"train_loss": -12.06169319152832, "global_step": 454146, "epoch": 2703} {"train_loss": -11.966363906860352, "global_step": 454147, "epoch": 2703} {"train_loss": -12.229640007019043, "global_step": 454148, "epoch": 2703} {"train_loss": -11.841287612915039, "global_step": 454149, "epoch": 2703} {"train_loss": -12.146078109741211, "global_step": 454150, "epoch": 2703} {"train_loss": -11.404348373413086, "global_step": 454151, "epoch": 2703} {"train_loss": -12.607137680053711, "global_step": 454152, "epoch": 2703} {"train_loss": -11.742814064025879, "global_step": 454153, "epoch": 2703} {"train_loss": -12.15212631225586, "global_step": 454154, "epoch": 2703} {"train_loss": -11.765863418579102, "global_step": 454155, "epoch": 2703} {"train_loss": -11.888734817504883, "global_step": 454156, "epoch": 2703} {"train_loss": -11.783294677734375, "global_step": 454157, "epoch": 2703} {"train_loss": -12.349063873291016, "global_step": 454158, "epoch": 2703} {"train_loss": -11.639867782592773, "global_step": 454159, "epoch": 2703} {"train_loss": -11.711051940917969, "global_step": 454160, "epoch": 2703} {"train_loss": -11.888046264648438, "global_step": 454161, "epoch": 2703} {"train_loss": -12.336868286132812, "global_step": 454162, "epoch": 2703} {"train_loss": -11.194506645202637, "global_step": 454163, "epoch": 2703} {"train_loss": -11.927810668945312, "global_step": 454164, "epoch": 2703} {"train_loss": -12.014130592346191, "global_step": 454165, "epoch": 2703} {"train_loss": -11.128655433654785, "global_step": 454166, "epoch": 2703} {"train_loss": -11.910468101501465, "global_step": 454167, "epoch": 2703} {"train_loss": -10.74268627166748, "global_step": 454168, "epoch": 2703} {"train_loss": -12.428353309631348, "global_step": 454169, "epoch": 2703} {"train_loss": -11.187808990478516, "global_step": 454170, "epoch": 2703} {"train_loss": -10.958599090576172, "global_step": 454171, "epoch": 2703} {"train_loss": -11.883853912353516, "global_step": 454172, "epoch": 2703} {"train_loss": -11.560395240783691, "global_step": 454173, "epoch": 2703} {"train_loss": -10.584857940673828, "global_step": 454174, "epoch": 2703} {"train_loss": -12.488927841186523, "global_step": 454175, "epoch": 2703} {"train_loss": -11.178506851196289, "global_step": 454176, "epoch": 2703} {"train_loss": -11.593006134033203, "global_step": 454177, "epoch": 2703} {"train_loss": -11.451264381408691, "global_step": 454178, "epoch": 2703} {"train_loss": -11.460678100585938, "global_step": 454179, "epoch": 2703} {"train_loss": -11.128900527954102, "global_step": 454180, "epoch": 2703} {"train_loss": -10.963878631591797, "global_step": 454181, "epoch": 2703} {"train_loss": -10.485918045043945, "global_step": 454182, "epoch": 2703} {"train_loss": -11.813697814941406, "global_step": 454183, "epoch": 2703} {"train_loss": -10.081514358520508, "global_step": 454184, "epoch": 2703} {"train_loss": -11.932034492492676, "global_step": 454185, "epoch": 2703} {"train_loss": -10.42949104309082, "global_step": 454186, "epoch": 2703} {"train_loss": -11.532886505126953, "global_step": 454187, "epoch": 2703} {"train_loss": -9.923097610473633, "global_step": 454188, "epoch": 2703} {"train_loss": -11.874873161315918, "global_step": 454189, "epoch": 2703} {"train_loss": -10.508369445800781, "global_step": 454190, "epoch": 2703} {"train_loss": -12.349647521972656, "global_step": 454191, "epoch": 2703} {"train_loss": -11.655797958374023, "global_step": 454192, "epoch": 2703} {"train_loss": -11.543891906738281, "global_step": 454193, "epoch": 2703} {"train_loss": -11.835708618164062, "global_step": 454194, "epoch": 2703} {"train_loss": -11.837319374084473, "global_step": 454195, "epoch": 2703} {"train_loss": -12.203462600708008, "global_step": 454196, "epoch": 2703} {"train_loss": -11.906057357788086, "global_step": 454197, "epoch": 2703} {"train_loss": -11.94333267211914, "global_step": 454198, "epoch": 2703} {"train_loss": -11.758973121643066, "global_step": 454199, "epoch": 2703} {"train_loss": -12.099662780761719, "global_step": 454200, "epoch": 2703} {"train_loss": -11.370044708251953, "global_step": 454201, "epoch": 2703} {"train_loss": -12.460559844970703, "global_step": 454202, "epoch": 2703} {"train_loss": -11.561517715454102, "global_step": 454203, "epoch": 2703} {"train_loss": -11.619941711425781, "global_step": 454204, "epoch": 2703} {"train_loss": -11.996857643127441, "global_step": 454205, "epoch": 2703} {"train_loss": -11.798530578613281, "global_step": 454206, "epoch": 2703} {"train_loss": -12.461965560913086, "global_step": 454207, "epoch": 2703} {"train_loss": -11.69151496887207, "global_step": 454208, "epoch": 2703} {"train_loss": -12.432769775390625, "global_step": 454209, "epoch": 2703} {"train_loss": -12.040410995483398, "global_step": 454210, "epoch": 2703} {"train_loss": -12.490388870239258, "global_step": 454211, "epoch": 2703} {"train_loss": -12.054438591003418, "global_step": 454212, "epoch": 2703} {"train_loss": -12.287376403808594, "global_step": 454213, "epoch": 2703} {"train_loss": -12.158395767211914, "global_step": 454214, "epoch": 2703} {"train_loss": -12.265951156616211, "global_step": 454215, "epoch": 2703} {"train_loss": -12.418371200561523, "global_step": 454216, "epoch": 2703} {"train_loss": -12.243098258972168, "global_step": 454217, "epoch": 2703} {"train_loss": -12.484302520751953, "global_step": 454218, "epoch": 2703} {"train_loss": -12.35634708404541, "global_step": 454219, "epoch": 2703} {"train_loss": -12.637411117553711, "global_step": 454220, "epoch": 2703} {"train_loss": -12.372834205627441, "global_step": 454221, "epoch": 2703} {"train_loss": -12.429584503173828, "global_step": 454222, "epoch": 2703} {"train_loss": -12.391637802124023, "global_step": 454223, "epoch": 2703} {"train_loss": -12.658329010009766, "global_step": 454224, "epoch": 2703} {"train_loss": -12.475273132324219, "global_step": 454225, "epoch": 2703} {"train_loss": -12.478694915771484, "global_step": 454226, "epoch": 2703} {"train_loss": -12.461494445800781, "global_step": 454227, "epoch": 2703} {"train_loss": -12.595043182373047, "global_step": 454228, "epoch": 2703} {"train_loss": -12.249567985534668, "global_step": 454229, "epoch": 2703} {"train_loss": -12.569103240966797, "global_step": 454230, "epoch": 2703} {"train_loss": -12.480310440063477, "global_step": 454231, "epoch": 2703} {"train_loss": -12.351919174194336, "global_step": 454232, "epoch": 2703} {"train_loss": -12.406597137451172, "global_step": 454233, "epoch": 2703} {"train_loss": -11.944243431091309, "global_step": 454234, "epoch": 2703} {"train_loss": -12.662551879882812, "global_step": 454235, "epoch": 2703} {"train_loss": -12.091638565063477, "global_step": 454236, "epoch": 2703} {"train_loss": -12.458808898925781, "global_step": 454237, "epoch": 2703} {"train_loss": -12.179733276367188, "global_step": 454238, "epoch": 2703} {"train_loss": -11.993885040283203, "global_step": 454239, "epoch": 2703} {"train_loss": -12.131759643554688, "global_step": 454240, "epoch": 2703} {"train_loss": -12.081896781921387, "global_step": 454241, "epoch": 2703} {"train_loss": -12.454132080078125, "global_step": 454242, "epoch": 2703} {"train_loss": -12.464744567871094, "global_step": 454243, "epoch": 2703} {"train_loss": -12.52602481842041, "global_step": 454244, "epoch": 2703} {"train_loss": -12.429924011230469, "global_step": 454245, "epoch": 2703} {"train_loss": -12.43191909790039, "global_step": 454246, "epoch": 2703} {"train_loss": -12.260002136230469, "global_step": 454247, "epoch": 2703} {"train_loss": -12.52888298034668, "global_step": 454248, "epoch": 2703} {"train_loss": -12.26373291015625, "global_step": 454249, "epoch": 2703} {"train_loss": -12.653558731079102, "global_step": 454250, "epoch": 2703} {"train_loss": -12.323480606079102, "global_step": 454251, "epoch": 2703} {"train_loss": -12.268560409545898, "global_step": 454252, "epoch": 2703} {"train_loss": -12.22212028503418, "global_step": 454253, "epoch": 2703} {"train_loss": -12.54106330871582, "global_step": 454254, "epoch": 2703} {"train_loss": -12.508708953857422, "global_step": 454255, "epoch": 2703} {"train_loss": -12.389355659484863, "global_step": 454256, "epoch": 2703} {"train_loss": -12.609182357788086, "global_step": 454257, "epoch": 2703} {"train_loss": -12.18493366241455, "global_step": 454258, "epoch": 2703} {"train_loss": -12.616893768310547, "global_step": 454259, "epoch": 2703} {"train_loss": -12.176362037658691, "global_step": 454260, "epoch": 2703} {"train_loss": -12.364829063415527, "global_step": 454261, "epoch": 2703} {"train_loss": -11.830471992492676, "global_step": 454262, "epoch": 2703} {"train_loss": -12.435256958007812, "global_step": 454263, "epoch": 2703} {"train_loss": -11.680200576782227, "global_step": 454264, "epoch": 2703} {"train_loss": -11.573129653930664, "global_step": 454265, "epoch": 2703} {"train_loss": -12.34257984161377, "global_step": 454266, "epoch": 2703} {"train_loss": -12.29182243347168, "global_step": 454267, "epoch": 2703} {"train_loss": -12.122251510620117, "global_step": 454268, "epoch": 2703} {"train_loss": -11.805854797363281, "global_step": 454269, "epoch": 2703} {"train_loss": -12.313711166381836, "global_step": 454270, "epoch": 2703} {"train_loss": -12.102340272494725, "global_step": 454271, "epoch": 2703, "val_loss": 313004.25} {"train_loss": -11.971083641052246, "global_step": 454272, "epoch": 2704} {"train_loss": -12.238250732421875, "global_step": 454273, "epoch": 2704} {"train_loss": -12.563852310180664, "global_step": 454274, "epoch": 2704} {"train_loss": -12.347151756286621, "global_step": 454275, "epoch": 2704} {"train_loss": -11.81112289428711, "global_step": 454276, "epoch": 2704} {"train_loss": -12.258240699768066, "global_step": 454277, "epoch": 2704} {"train_loss": -12.528585433959961, "global_step": 454278, "epoch": 2704} {"train_loss": -12.672704696655273, "global_step": 454279, "epoch": 2704} {"train_loss": -12.499696731567383, "global_step": 454280, "epoch": 2704} {"train_loss": -12.725157737731934, "global_step": 454281, "epoch": 2704} {"train_loss": -12.428619384765625, "global_step": 454282, "epoch": 2704} {"train_loss": -12.377893447875977, "global_step": 454283, "epoch": 2704} {"train_loss": -11.546137809753418, "global_step": 454284, "epoch": 2704} {"train_loss": -11.667733192443848, "global_step": 454285, "epoch": 2704} {"train_loss": -11.661107063293457, "global_step": 454286, "epoch": 2704} {"train_loss": -10.386775970458984, "global_step": 454287, "epoch": 2704} {"train_loss": -10.996002197265625, "global_step": 454288, "epoch": 2704} {"train_loss": -11.61193561553955, "global_step": 454289, "epoch": 2704} {"train_loss": -11.695829391479492, "global_step": 454290, "epoch": 2704} {"train_loss": -12.26846694946289, "global_step": 454291, "epoch": 2704} {"train_loss": -11.987421035766602, "global_step": 454292, "epoch": 2704} {"train_loss": -12.037457466125488, "global_step": 454293, "epoch": 2704} {"train_loss": -12.164875030517578, "global_step": 454294, "epoch": 2704} {"train_loss": -11.871875762939453, "global_step": 454295, "epoch": 2704} {"train_loss": -11.464778900146484, "global_step": 454296, "epoch": 2704} {"train_loss": -11.87584400177002, "global_step": 454297, "epoch": 2704} {"train_loss": -11.63007926940918, "global_step": 454298, "epoch": 2704} {"train_loss": -12.385750770568848, "global_step": 454299, "epoch": 2704} {"train_loss": -11.795848846435547, "global_step": 454300, "epoch": 2704} {"train_loss": -11.89921760559082, "global_step": 454301, "epoch": 2704} {"train_loss": -12.218313217163086, "global_step": 454302, "epoch": 2704} {"train_loss": -12.350686073303223, "global_step": 454303, "epoch": 2704} {"train_loss": -11.49952507019043, "global_step": 454304, "epoch": 2704} {"train_loss": -11.961037635803223, "global_step": 454305, "epoch": 2704} {"train_loss": -12.281289100646973, "global_step": 454306, "epoch": 2704} {"train_loss": -11.93100643157959, "global_step": 454307, "epoch": 2704} {"train_loss": -12.409523963928223, "global_step": 454308, "epoch": 2704} {"train_loss": -12.160585403442383, "global_step": 454309, "epoch": 2704} {"train_loss": -11.655010223388672, "global_step": 454310, "epoch": 2704} {"train_loss": -12.277801513671875, "global_step": 454311, "epoch": 2704} {"train_loss": -12.264755249023438, "global_step": 454312, "epoch": 2704} {"train_loss": -12.070355415344238, "global_step": 454313, "epoch": 2704} {"train_loss": -12.515003204345703, "global_step": 454314, "epoch": 2704} {"train_loss": -11.920036315917969, "global_step": 454315, "epoch": 2704} {"train_loss": -12.498099327087402, "global_step": 454316, "epoch": 2704} {"train_loss": -12.394122123718262, "global_step": 454317, "epoch": 2704} {"train_loss": -12.393965721130371, "global_step": 454318, "epoch": 2704} {"train_loss": -12.537678718566895, "global_step": 454319, "epoch": 2704} {"train_loss": -11.670631408691406, "global_step": 454320, "epoch": 2704} {"train_loss": -12.427051544189453, "global_step": 454321, "epoch": 2704} {"train_loss": -11.880044937133789, "global_step": 454322, "epoch": 2704} {"train_loss": -11.87198257446289, "global_step": 454323, "epoch": 2704} {"train_loss": -11.829374313354492, "global_step": 454324, "epoch": 2704} {"train_loss": -11.68043327331543, "global_step": 454325, "epoch": 2704} {"train_loss": -12.256205558776855, "global_step": 454326, "epoch": 2704} {"train_loss": -11.563796997070312, "global_step": 454327, "epoch": 2704} {"train_loss": -12.671205520629883, "global_step": 454328, "epoch": 2704} {"train_loss": -11.744815826416016, "global_step": 454329, "epoch": 2704} {"train_loss": -12.268227577209473, "global_step": 454330, "epoch": 2704} {"train_loss": -12.209742546081543, "global_step": 454331, "epoch": 2704} {"train_loss": -12.508106231689453, "global_step": 454332, "epoch": 2704} {"train_loss": -12.293065071105957, "global_step": 454333, "epoch": 2704} {"train_loss": -12.479626655578613, "global_step": 454334, "epoch": 2704} {"train_loss": -12.417058944702148, "global_step": 454335, "epoch": 2704} {"train_loss": -12.536269187927246, "global_step": 454336, "epoch": 2704} {"train_loss": -12.501252174377441, "global_step": 454337, "epoch": 2704} {"train_loss": -12.6533784866333, "global_step": 454338, "epoch": 2704} {"train_loss": -12.60009765625, "global_step": 454339, "epoch": 2704} {"train_loss": -12.656005859375, "global_step": 454340, "epoch": 2704} {"train_loss": -12.221246719360352, "global_step": 454341, "epoch": 2704} {"train_loss": -12.630767822265625, "global_step": 454342, "epoch": 2704} {"train_loss": -12.42042350769043, "global_step": 454343, "epoch": 2704} {"train_loss": -11.887962341308594, "global_step": 454344, "epoch": 2704} {"train_loss": -12.500734329223633, "global_step": 454345, "epoch": 2704} {"train_loss": -12.253777503967285, "global_step": 454346, "epoch": 2704} {"train_loss": -12.223665237426758, "global_step": 454347, "epoch": 2704} {"train_loss": -12.799988746643066, "global_step": 454348, "epoch": 2704} {"train_loss": -12.200630187988281, "global_step": 454349, "epoch": 2704} {"train_loss": -12.668084144592285, "global_step": 454350, "epoch": 2704} {"train_loss": -12.37407398223877, "global_step": 454351, "epoch": 2704} {"train_loss": -12.645980834960938, "global_step": 454352, "epoch": 2704} {"train_loss": -12.303473472595215, "global_step": 454353, "epoch": 2704} {"train_loss": -12.464509010314941, "global_step": 454354, "epoch": 2704} {"train_loss": -12.691671371459961, "global_step": 454355, "epoch": 2704} {"train_loss": -12.121881484985352, "global_step": 454356, "epoch": 2704} {"train_loss": -12.373566627502441, "global_step": 454357, "epoch": 2704} {"train_loss": -12.414161682128906, "global_step": 454358, "epoch": 2704} {"train_loss": -12.146195411682129, "global_step": 454359, "epoch": 2704} {"train_loss": -12.526312828063965, "global_step": 454360, "epoch": 2704} {"train_loss": -11.938312530517578, "global_step": 454361, "epoch": 2704} {"train_loss": -12.639537811279297, "global_step": 454362, "epoch": 2704} {"train_loss": -12.196532249450684, "global_step": 454363, "epoch": 2704} {"train_loss": -12.176079750061035, "global_step": 454364, "epoch": 2704} {"train_loss": -12.261405944824219, "global_step": 454365, "epoch": 2704} {"train_loss": -12.138691902160645, "global_step": 454366, "epoch": 2704} {"train_loss": -12.39976692199707, "global_step": 454367, "epoch": 2704} {"train_loss": -12.114131927490234, "global_step": 454368, "epoch": 2704} {"train_loss": -12.457531929016113, "global_step": 454369, "epoch": 2704} {"train_loss": -12.333324432373047, "global_step": 454370, "epoch": 2704} {"train_loss": -12.311903953552246, "global_step": 454371, "epoch": 2704} {"train_loss": -12.469806671142578, "global_step": 454372, "epoch": 2704} {"train_loss": -12.473970413208008, "global_step": 454373, "epoch": 2704} {"train_loss": -12.607536315917969, "global_step": 454374, "epoch": 2704} {"train_loss": -12.65562629699707, "global_step": 454375, "epoch": 2704} {"train_loss": -12.601515769958496, "global_step": 454376, "epoch": 2704} {"train_loss": -12.428285598754883, "global_step": 454377, "epoch": 2704} {"train_loss": -12.620522499084473, "global_step": 454378, "epoch": 2704} {"train_loss": -12.428704261779785, "global_step": 454379, "epoch": 2704} {"train_loss": -11.937725067138672, "global_step": 454380, "epoch": 2704} {"train_loss": -12.862829208374023, "global_step": 454381, "epoch": 2704} {"train_loss": -12.473686218261719, "global_step": 454382, "epoch": 2704} {"train_loss": -12.283851623535156, "global_step": 454383, "epoch": 2704} {"train_loss": -12.413482666015625, "global_step": 454384, "epoch": 2704} {"train_loss": -12.919892311096191, "global_step": 454385, "epoch": 2704} {"train_loss": -12.632291793823242, "global_step": 454386, "epoch": 2704} {"train_loss": -12.485301971435547, "global_step": 454387, "epoch": 2704} {"train_loss": -12.57585334777832, "global_step": 454388, "epoch": 2704} {"train_loss": -12.868497848510742, "global_step": 454389, "epoch": 2704} {"train_loss": -11.97613525390625, "global_step": 454390, "epoch": 2704} {"train_loss": -11.583709716796875, "global_step": 454391, "epoch": 2704} {"train_loss": -12.219697952270508, "global_step": 454392, "epoch": 2704} {"train_loss": -13.073360443115234, "global_step": 454393, "epoch": 2704} {"train_loss": -12.522777557373047, "global_step": 454394, "epoch": 2704} {"train_loss": -12.601165771484375, "global_step": 454395, "epoch": 2704} {"train_loss": -12.704833030700684, "global_step": 454396, "epoch": 2704} {"train_loss": -12.677152633666992, "global_step": 454397, "epoch": 2704} {"train_loss": -12.809865951538086, "global_step": 454398, "epoch": 2704} {"train_loss": -12.806204795837402, "global_step": 454399, "epoch": 2704} {"train_loss": -12.794780731201172, "global_step": 454400, "epoch": 2704} {"train_loss": -12.902256965637207, "global_step": 454401, "epoch": 2704} {"train_loss": -12.839405059814453, "global_step": 454402, "epoch": 2704} {"train_loss": -12.866689682006836, "global_step": 454403, "epoch": 2704} {"train_loss": -12.66435718536377, "global_step": 454404, "epoch": 2704} {"train_loss": -12.753856658935547, "global_step": 454405, "epoch": 2704} {"train_loss": -12.60795783996582, "global_step": 454406, "epoch": 2704} {"train_loss": -12.714454650878906, "global_step": 454407, "epoch": 2704} {"train_loss": -12.51496696472168, "global_step": 454408, "epoch": 2704} {"train_loss": -12.457247734069824, "global_step": 454409, "epoch": 2704} {"train_loss": -12.786746978759766, "global_step": 454410, "epoch": 2704} {"train_loss": -12.68900203704834, "global_step": 454411, "epoch": 2704} {"train_loss": -12.651050567626953, "global_step": 454412, "epoch": 2704} {"train_loss": -12.91542911529541, "global_step": 454413, "epoch": 2704} {"train_loss": -13.036672592163086, "global_step": 454414, "epoch": 2704} {"train_loss": -12.302605628967285, "global_step": 454415, "epoch": 2704} {"train_loss": -11.914609909057617, "global_step": 454416, "epoch": 2704} {"train_loss": -11.972757339477539, "global_step": 454417, "epoch": 2704} {"train_loss": -12.434402465820312, "global_step": 454418, "epoch": 2704} {"train_loss": -11.39087200164795, "global_step": 454419, "epoch": 2704} {"train_loss": -10.537263870239258, "global_step": 454420, "epoch": 2704} {"train_loss": -12.602381706237793, "global_step": 454421, "epoch": 2704} {"train_loss": -9.42576789855957, "global_step": 454422, "epoch": 2704} {"train_loss": -12.046708106994629, "global_step": 454423, "epoch": 2704} {"train_loss": -11.95793628692627, "global_step": 454424, "epoch": 2704} {"train_loss": -12.184240341186523, "global_step": 454425, "epoch": 2704} {"train_loss": -12.511576652526855, "global_step": 454426, "epoch": 2704} {"train_loss": -12.406930923461914, "global_step": 454427, "epoch": 2704} {"train_loss": -12.466480255126953, "global_step": 454428, "epoch": 2704} {"train_loss": -12.35757827758789, "global_step": 454429, "epoch": 2704} {"train_loss": -12.408684730529785, "global_step": 454430, "epoch": 2704} {"train_loss": -11.517261505126953, "global_step": 454431, "epoch": 2704} {"train_loss": -11.763157844543457, "global_step": 454432, "epoch": 2704} {"train_loss": -12.640894889831543, "global_step": 454433, "epoch": 2704} {"train_loss": -12.036404609680176, "global_step": 454434, "epoch": 2704} {"train_loss": -11.344432830810547, "global_step": 454435, "epoch": 2704} {"train_loss": -12.111889839172363, "global_step": 454436, "epoch": 2704} {"train_loss": -12.087196350097656, "global_step": 454437, "epoch": 2704} {"train_loss": -11.601921081542969, "global_step": 454438, "epoch": 2704} {"train_loss": -12.252067838396345, "global_step": 454439, "epoch": 2704, "val_loss": 312896.78125} {"train_loss": -11.973540306091309, "global_step": 454440, "epoch": 2705} {"train_loss": -11.673192977905273, "global_step": 454441, "epoch": 2705} {"train_loss": -11.535452842712402, "global_step": 454442, "epoch": 2705} {"train_loss": -12.578861236572266, "global_step": 454443, "epoch": 2705} {"train_loss": -11.709280014038086, "global_step": 454444, "epoch": 2705} {"train_loss": -11.926042556762695, "global_step": 454445, "epoch": 2705} {"train_loss": -12.050646781921387, "global_step": 454446, "epoch": 2705} {"train_loss": -11.732086181640625, "global_step": 454447, "epoch": 2705} {"train_loss": -11.556671142578125, "global_step": 454448, "epoch": 2705} {"train_loss": -12.813594818115234, "global_step": 454449, "epoch": 2705} {"train_loss": -11.864335060119629, "global_step": 454450, "epoch": 2705} {"train_loss": -11.500511169433594, "global_step": 454451, "epoch": 2705} {"train_loss": -12.435323715209961, "global_step": 454452, "epoch": 2705} {"train_loss": -12.486748695373535, "global_step": 454453, "epoch": 2705} {"train_loss": -11.912796020507812, "global_step": 454454, "epoch": 2705} {"train_loss": -12.859614372253418, "global_step": 454455, "epoch": 2705} {"train_loss": -12.380928993225098, "global_step": 454456, "epoch": 2705} {"train_loss": -12.393198013305664, "global_step": 454457, "epoch": 2705} {"train_loss": -12.513877868652344, "global_step": 454458, "epoch": 2705} {"train_loss": -12.250215530395508, "global_step": 454459, "epoch": 2705} {"train_loss": -11.98987865447998, "global_step": 454460, "epoch": 2705} {"train_loss": -12.576353073120117, "global_step": 454461, "epoch": 2705} {"train_loss": -11.72363567352295, "global_step": 454462, "epoch": 2705} {"train_loss": -12.418380737304688, "global_step": 454463, "epoch": 2705} {"train_loss": -11.316781997680664, "global_step": 454464, "epoch": 2705} {"train_loss": -11.562154769897461, "global_step": 454465, "epoch": 2705} {"train_loss": -11.786914825439453, "global_step": 454466, "epoch": 2705} {"train_loss": -10.263191223144531, "global_step": 454467, "epoch": 2705} {"train_loss": -11.604890823364258, "global_step": 454468, "epoch": 2705} {"train_loss": -11.59862232208252, "global_step": 454469, "epoch": 2705} {"train_loss": -11.329130172729492, "global_step": 454470, "epoch": 2705} {"train_loss": -11.727141380310059, "global_step": 454471, "epoch": 2705} {"train_loss": -11.459798812866211, "global_step": 454472, "epoch": 2705} {"train_loss": -11.434717178344727, "global_step": 454473, "epoch": 2705} {"train_loss": -12.080987930297852, "global_step": 454474, "epoch": 2705} {"train_loss": -11.886216163635254, "global_step": 454475, "epoch": 2705} {"train_loss": -12.18928337097168, "global_step": 454476, "epoch": 2705} {"train_loss": -11.941007614135742, "global_step": 454477, "epoch": 2705} {"train_loss": -12.122777938842773, "global_step": 454478, "epoch": 2705} {"train_loss": -12.624062538146973, "global_step": 454479, "epoch": 2705} {"train_loss": -12.30540943145752, "global_step": 454480, "epoch": 2705} {"train_loss": -12.552363395690918, "global_step": 454481, "epoch": 2705} {"train_loss": -12.512201309204102, "global_step": 454482, "epoch": 2705} {"train_loss": -12.507731437683105, "global_step": 454483, "epoch": 2705} {"train_loss": -12.391758918762207, "global_step": 454484, "epoch": 2705} {"train_loss": -12.666653633117676, "global_step": 454485, "epoch": 2705} {"train_loss": -12.634587287902832, "global_step": 454486, "epoch": 2705} {"train_loss": -12.484659194946289, "global_step": 454487, "epoch": 2705} {"train_loss": -12.700634002685547, "global_step": 454488, "epoch": 2705} {"train_loss": -12.743549346923828, "global_step": 454489, "epoch": 2705} {"train_loss": -12.767507553100586, "global_step": 454490, "epoch": 2705} {"train_loss": -12.238040924072266, "global_step": 454491, "epoch": 2705} {"train_loss": -12.504276275634766, "global_step": 454492, "epoch": 2705} {"train_loss": -12.718597412109375, "global_step": 454493, "epoch": 2705} {"train_loss": -12.222698211669922, "global_step": 454494, "epoch": 2705} {"train_loss": -12.338386535644531, "global_step": 454495, "epoch": 2705} {"train_loss": -12.735847473144531, "global_step": 454496, "epoch": 2705} {"train_loss": -12.430585861206055, "global_step": 454497, "epoch": 2705} {"train_loss": -12.792854309082031, "global_step": 454498, "epoch": 2705} {"train_loss": -12.429683685302734, "global_step": 454499, "epoch": 2705} {"train_loss": -12.68031120300293, "global_step": 454500, "epoch": 2705} {"train_loss": -12.348919868469238, "global_step": 454501, "epoch": 2705} {"train_loss": -12.441264152526855, "global_step": 454502, "epoch": 2705} {"train_loss": -12.558670043945312, "global_step": 454503, "epoch": 2705} {"train_loss": -12.632579803466797, "global_step": 454504, "epoch": 2705} {"train_loss": -12.581944465637207, "global_step": 454505, "epoch": 2705} {"train_loss": -12.619486808776855, "global_step": 454506, "epoch": 2705} {"train_loss": -12.69729232788086, "global_step": 454507, "epoch": 2705} {"train_loss": -12.691230773925781, "global_step": 454508, "epoch": 2705} {"train_loss": -12.538175582885742, "global_step": 454509, "epoch": 2705} {"train_loss": -11.617236137390137, "global_step": 454510, "epoch": 2705} {"train_loss": -12.09821605682373, "global_step": 454511, "epoch": 2705} {"train_loss": -12.784014701843262, "global_step": 454512, "epoch": 2705} {"train_loss": -12.10384750366211, "global_step": 454513, "epoch": 2705} {"train_loss": -11.004079818725586, "global_step": 454514, "epoch": 2705} {"train_loss": -12.332324981689453, "global_step": 454515, "epoch": 2705} {"train_loss": -12.22810173034668, "global_step": 454516, "epoch": 2705} {"train_loss": -11.588068008422852, "global_step": 454517, "epoch": 2705} {"train_loss": -11.741615295410156, "global_step": 454518, "epoch": 2705} {"train_loss": -12.365912437438965, "global_step": 454519, "epoch": 2705} {"train_loss": -12.428955078125, "global_step": 454520, "epoch": 2705} {"train_loss": -12.059661865234375, "global_step": 454521, "epoch": 2705} {"train_loss": -12.565187454223633, "global_step": 454522, "epoch": 2705} {"train_loss": -12.197601318359375, "global_step": 454523, "epoch": 2705} {"train_loss": -12.795744895935059, "global_step": 454524, "epoch": 2705} {"train_loss": -12.539355278015137, "global_step": 454525, "epoch": 2705} {"train_loss": -12.614385604858398, "global_step": 454526, "epoch": 2705} {"train_loss": -12.575122833251953, "global_step": 454527, "epoch": 2705} {"train_loss": -12.823162078857422, "global_step": 454528, "epoch": 2705} {"train_loss": -12.645153045654297, "global_step": 454529, "epoch": 2705} {"train_loss": -12.70533561706543, "global_step": 454530, "epoch": 2705} {"train_loss": -12.641729354858398, "global_step": 454531, "epoch": 2705} {"train_loss": -13.02137565612793, "global_step": 454532, "epoch": 2705} {"train_loss": -12.876302719116211, "global_step": 454533, "epoch": 2705} {"train_loss": -12.8983154296875, "global_step": 454534, "epoch": 2705} {"train_loss": -12.961774826049805, "global_step": 454535, "epoch": 2705} {"train_loss": -12.816499710083008, "global_step": 454536, "epoch": 2705} {"train_loss": -12.389999389648438, "global_step": 454537, "epoch": 2705} {"train_loss": -12.7326078414917, "global_step": 454538, "epoch": 2705} {"train_loss": -12.951627731323242, "global_step": 454539, "epoch": 2705} {"train_loss": -12.372416496276855, "global_step": 454540, "epoch": 2705} {"train_loss": -12.599444389343262, "global_step": 454541, "epoch": 2705} {"train_loss": -12.819276809692383, "global_step": 454542, "epoch": 2705} {"train_loss": -12.538269996643066, "global_step": 454543, "epoch": 2705} {"train_loss": -12.37857437133789, "global_step": 454544, "epoch": 2705} {"train_loss": -12.657183647155762, "global_step": 454545, "epoch": 2705} {"train_loss": -12.80416488647461, "global_step": 454546, "epoch": 2705} {"train_loss": -12.305620193481445, "global_step": 454547, "epoch": 2705} {"train_loss": -11.985240936279297, "global_step": 454548, "epoch": 2705} {"train_loss": -12.69808292388916, "global_step": 454549, "epoch": 2705} {"train_loss": -11.96925163269043, "global_step": 454550, "epoch": 2705} {"train_loss": -11.599808692932129, "global_step": 454551, "epoch": 2705} {"train_loss": -12.22568130493164, "global_step": 454552, "epoch": 2705} {"train_loss": -12.483634948730469, "global_step": 454553, "epoch": 2705} {"train_loss": -11.618362426757812, "global_step": 454554, "epoch": 2705} {"train_loss": -12.26744556427002, "global_step": 454555, "epoch": 2705} {"train_loss": -12.189027786254883, "global_step": 454556, "epoch": 2705} {"train_loss": -12.414340019226074, "global_step": 454557, "epoch": 2705} {"train_loss": -11.68613052368164, "global_step": 454558, "epoch": 2705} {"train_loss": -12.66931438446045, "global_step": 454559, "epoch": 2705} {"train_loss": -12.506080627441406, "global_step": 454560, "epoch": 2705} {"train_loss": -12.307668685913086, "global_step": 454561, "epoch": 2705} {"train_loss": -12.553901672363281, "global_step": 454562, "epoch": 2705} {"train_loss": -12.746489524841309, "global_step": 454563, "epoch": 2705} {"train_loss": -12.529586791992188, "global_step": 454564, "epoch": 2705} {"train_loss": -12.302752494812012, "global_step": 454565, "epoch": 2705} {"train_loss": -12.441606521606445, "global_step": 454566, "epoch": 2705} {"train_loss": -12.73689079284668, "global_step": 454567, "epoch": 2705} {"train_loss": -12.436986923217773, "global_step": 454568, "epoch": 2705} {"train_loss": -12.664825439453125, "global_step": 454569, "epoch": 2705} {"train_loss": -12.796513557434082, "global_step": 454570, "epoch": 2705} {"train_loss": -12.505484580993652, "global_step": 454571, "epoch": 2705} {"train_loss": -12.402702331542969, "global_step": 454572, "epoch": 2705} {"train_loss": -12.563089370727539, "global_step": 454573, "epoch": 2705} {"train_loss": -12.693620681762695, "global_step": 454574, "epoch": 2705} {"train_loss": -12.144347190856934, "global_step": 454575, "epoch": 2705} {"train_loss": -11.681770324707031, "global_step": 454576, "epoch": 2705} {"train_loss": -12.13230037689209, "global_step": 454577, "epoch": 2705} {"train_loss": -12.603675842285156, "global_step": 454578, "epoch": 2705} {"train_loss": -11.762835502624512, "global_step": 454579, "epoch": 2705} {"train_loss": -11.818864822387695, "global_step": 454580, "epoch": 2705} {"train_loss": -12.583651542663574, "global_step": 454581, "epoch": 2705} {"train_loss": -11.280132293701172, "global_step": 454582, "epoch": 2705} {"train_loss": -11.503641128540039, "global_step": 454583, "epoch": 2705} {"train_loss": -11.670623779296875, "global_step": 454584, "epoch": 2705} {"train_loss": -9.647286415100098, "global_step": 454585, "epoch": 2705} {"train_loss": -10.60804557800293, "global_step": 454586, "epoch": 2705} {"train_loss": -10.729785919189453, "global_step": 454587, "epoch": 2705} {"train_loss": -9.693658828735352, "global_step": 454588, "epoch": 2705} {"train_loss": -9.291093826293945, "global_step": 454589, "epoch": 2705} {"train_loss": -10.647682189941406, "global_step": 454590, "epoch": 2705} {"train_loss": -9.224794387817383, "global_step": 454591, "epoch": 2705} {"train_loss": -10.340309143066406, "global_step": 454592, "epoch": 2705} {"train_loss": -10.808822631835938, "global_step": 454593, "epoch": 2705} {"train_loss": -10.417200088500977, "global_step": 454594, "epoch": 2705} {"train_loss": -11.125570297241211, "global_step": 454595, "epoch": 2705} {"train_loss": -9.95009708404541, "global_step": 454596, "epoch": 2705} {"train_loss": -10.073031425476074, "global_step": 454597, "epoch": 2705} {"train_loss": -10.310460090637207, "global_step": 454598, "epoch": 2705} {"train_loss": -10.78153133392334, "global_step": 454599, "epoch": 2705} {"train_loss": -10.855846405029297, "global_step": 454600, "epoch": 2705} {"train_loss": -11.073503494262695, "global_step": 454601, "epoch": 2705} {"train_loss": -11.559537887573242, "global_step": 454602, "epoch": 2705} {"train_loss": -11.906927108764648, "global_step": 454603, "epoch": 2705} {"train_loss": -11.471126556396484, "global_step": 454604, "epoch": 2705} {"train_loss": -11.924347877502441, "global_step": 454605, "epoch": 2705} {"train_loss": -11.146490097045898, "global_step": 454606, "epoch": 2705} {"train_loss": -12.06017670177278, "global_step": 454607, "epoch": 2705, "val_loss": 314221.125, "train_action_mse_error": 0.3867247998714447} {"train_loss": -12.028772354125977, "global_step": 454608, "epoch": 2706} {"train_loss": -12.055473327636719, "global_step": 454609, "epoch": 2706} {"train_loss": -12.073208808898926, "global_step": 454610, "epoch": 2706} {"train_loss": -11.853458404541016, "global_step": 454611, "epoch": 2706} {"train_loss": -11.960921287536621, "global_step": 454612, "epoch": 2706} {"train_loss": -11.906609535217285, "global_step": 454613, "epoch": 2706} {"train_loss": -12.173648834228516, "global_step": 454614, "epoch": 2706} {"train_loss": -11.906490325927734, "global_step": 454615, "epoch": 2706} {"train_loss": -11.82412338256836, "global_step": 454616, "epoch": 2706} {"train_loss": -12.23093032836914, "global_step": 454617, "epoch": 2706} {"train_loss": -11.804729461669922, "global_step": 454618, "epoch": 2706} {"train_loss": -11.996460914611816, "global_step": 454619, "epoch": 2706} {"train_loss": -12.063687324523926, "global_step": 454620, "epoch": 2706} {"train_loss": -11.957353591918945, "global_step": 454621, "epoch": 2706} {"train_loss": -12.26408576965332, "global_step": 454622, "epoch": 2706} {"train_loss": -12.304204940795898, "global_step": 454623, "epoch": 2706} {"train_loss": -12.242216110229492, "global_step": 454624, "epoch": 2706} {"train_loss": -12.069459915161133, "global_step": 454625, "epoch": 2706} {"train_loss": -12.294028282165527, "global_step": 454626, "epoch": 2706} {"train_loss": -12.095829963684082, "global_step": 454627, "epoch": 2706} {"train_loss": -12.399541854858398, "global_step": 454628, "epoch": 2706} {"train_loss": -12.368319511413574, "global_step": 454629, "epoch": 2706} {"train_loss": -12.465740203857422, "global_step": 454630, "epoch": 2706} {"train_loss": -12.600103378295898, "global_step": 454631, "epoch": 2706} {"train_loss": -12.401873588562012, "global_step": 454632, "epoch": 2706} {"train_loss": -12.680914878845215, "global_step": 454633, "epoch": 2706} {"train_loss": -12.59360408782959, "global_step": 454634, "epoch": 2706} {"train_loss": -12.557315826416016, "global_step": 454635, "epoch": 2706} {"train_loss": -12.164450645446777, "global_step": 454636, "epoch": 2706} {"train_loss": -12.54035758972168, "global_step": 454637, "epoch": 2706} {"train_loss": -12.059335708618164, "global_step": 454638, "epoch": 2706} {"train_loss": -12.173738479614258, "global_step": 454639, "epoch": 2706} {"train_loss": -12.264993667602539, "global_step": 454640, "epoch": 2706} {"train_loss": -12.319063186645508, "global_step": 454641, "epoch": 2706} {"train_loss": -12.284503936767578, "global_step": 454642, "epoch": 2706} {"train_loss": -11.970539093017578, "global_step": 454643, "epoch": 2706} {"train_loss": -12.5984468460083, "global_step": 454644, "epoch": 2706} {"train_loss": -11.902172088623047, "global_step": 454645, "epoch": 2706} {"train_loss": -12.078126907348633, "global_step": 454646, "epoch": 2706} {"train_loss": -12.49879264831543, "global_step": 454647, "epoch": 2706} {"train_loss": -12.397104263305664, "global_step": 454648, "epoch": 2706} {"train_loss": -12.586849212646484, "global_step": 454649, "epoch": 2706} {"train_loss": -12.407014846801758, "global_step": 454650, "epoch": 2706} {"train_loss": -12.374561309814453, "global_step": 454651, "epoch": 2706} {"train_loss": -12.22439193725586, "global_step": 454652, "epoch": 2706} {"train_loss": -12.480255126953125, "global_step": 454653, "epoch": 2706} {"train_loss": -11.941640853881836, "global_step": 454654, "epoch": 2706} {"train_loss": -12.087104797363281, "global_step": 454655, "epoch": 2706} {"train_loss": -12.465904235839844, "global_step": 454656, "epoch": 2706} {"train_loss": -11.39676284790039, "global_step": 454657, "epoch": 2706} {"train_loss": -12.175052642822266, "global_step": 454658, "epoch": 2706} {"train_loss": -11.742391586303711, "global_step": 454659, "epoch": 2706} {"train_loss": -11.509317398071289, "global_step": 454660, "epoch": 2706} {"train_loss": -10.876712799072266, "global_step": 454661, "epoch": 2706} {"train_loss": -12.271282196044922, "global_step": 454662, "epoch": 2706} {"train_loss": -11.601633071899414, "global_step": 454663, "epoch": 2706} {"train_loss": -11.967708587646484, "global_step": 454664, "epoch": 2706} {"train_loss": -11.833793640136719, "global_step": 454665, "epoch": 2706} {"train_loss": -12.302506446838379, "global_step": 454666, "epoch": 2706} {"train_loss": -11.491870880126953, "global_step": 454667, "epoch": 2706} {"train_loss": -12.23340892791748, "global_step": 454668, "epoch": 2706} {"train_loss": -11.86156940460205, "global_step": 454669, "epoch": 2706} {"train_loss": -12.00792121887207, "global_step": 454670, "epoch": 2706} {"train_loss": -11.939007759094238, "global_step": 454671, "epoch": 2706} {"train_loss": -12.171582221984863, "global_step": 454672, "epoch": 2706} {"train_loss": -11.937942504882812, "global_step": 454673, "epoch": 2706} {"train_loss": -11.828296661376953, "global_step": 454674, "epoch": 2706} {"train_loss": -12.306663513183594, "global_step": 454675, "epoch": 2706} {"train_loss": -11.737504959106445, "global_step": 454676, "epoch": 2706} {"train_loss": -12.134218215942383, "global_step": 454677, "epoch": 2706} {"train_loss": -11.156356811523438, "global_step": 454678, "epoch": 2706} {"train_loss": -12.119606018066406, "global_step": 454679, "epoch": 2706} {"train_loss": -10.82559585571289, "global_step": 454680, "epoch": 2706} {"train_loss": -11.273807525634766, "global_step": 454681, "epoch": 2706} {"train_loss": -10.152037620544434, "global_step": 454682, "epoch": 2706} {"train_loss": -10.335874557495117, "global_step": 454683, "epoch": 2706} {"train_loss": -10.166553497314453, "global_step": 454684, "epoch": 2706} {"train_loss": -10.539587020874023, "global_step": 454685, "epoch": 2706} {"train_loss": -10.295988082885742, "global_step": 454686, "epoch": 2706} {"train_loss": -10.123590469360352, "global_step": 454687, "epoch": 2706} {"train_loss": -11.229336738586426, "global_step": 454688, "epoch": 2706} {"train_loss": -11.163663864135742, "global_step": 454689, "epoch": 2706} {"train_loss": -11.640022277832031, "global_step": 454690, "epoch": 2706} {"train_loss": -11.418439865112305, "global_step": 454691, "epoch": 2706} {"train_loss": -11.878173828125, "global_step": 454692, "epoch": 2706} {"train_loss": -11.569713592529297, "global_step": 454693, "epoch": 2706} {"train_loss": -11.41618537902832, "global_step": 454694, "epoch": 2706} {"train_loss": -11.588098526000977, "global_step": 454695, "epoch": 2706} {"train_loss": -11.629541397094727, "global_step": 454696, "epoch": 2706} {"train_loss": -11.893418312072754, "global_step": 454697, "epoch": 2706} {"train_loss": -12.017346382141113, "global_step": 454698, "epoch": 2706} {"train_loss": -11.727622032165527, "global_step": 454699, "epoch": 2706} {"train_loss": -12.099319458007812, "global_step": 454700, "epoch": 2706} {"train_loss": -11.523773193359375, "global_step": 454701, "epoch": 2706} {"train_loss": -12.249104499816895, "global_step": 454702, "epoch": 2706} {"train_loss": -12.342763900756836, "global_step": 454703, "epoch": 2706} {"train_loss": -12.439802169799805, "global_step": 454704, "epoch": 2706} {"train_loss": -12.297256469726562, "global_step": 454705, "epoch": 2706} {"train_loss": -11.904430389404297, "global_step": 454706, "epoch": 2706} {"train_loss": -12.192840576171875, "global_step": 454707, "epoch": 2706} {"train_loss": -12.304564476013184, "global_step": 454708, "epoch": 2706} {"train_loss": -12.231926918029785, "global_step": 454709, "epoch": 2706} {"train_loss": -12.140790939331055, "global_step": 454710, "epoch": 2706} {"train_loss": -12.384632110595703, "global_step": 454711, "epoch": 2706} {"train_loss": -11.902925491333008, "global_step": 454712, "epoch": 2706} {"train_loss": -12.321876525878906, "global_step": 454713, "epoch": 2706} {"train_loss": -12.107213973999023, "global_step": 454714, "epoch": 2706} {"train_loss": -12.446452140808105, "global_step": 454715, "epoch": 2706} {"train_loss": -12.420024871826172, "global_step": 454716, "epoch": 2706} {"train_loss": -12.381619453430176, "global_step": 454717, "epoch": 2706} {"train_loss": -12.733724594116211, "global_step": 454718, "epoch": 2706} {"train_loss": -12.31191635131836, "global_step": 454719, "epoch": 2706} {"train_loss": -12.480669021606445, "global_step": 454720, "epoch": 2706} {"train_loss": -12.343339920043945, "global_step": 454721, "epoch": 2706} {"train_loss": -12.452274322509766, "global_step": 454722, "epoch": 2706} {"train_loss": -12.54926872253418, "global_step": 454723, "epoch": 2706} {"train_loss": -12.600567817687988, "global_step": 454724, "epoch": 2706} {"train_loss": -12.339296340942383, "global_step": 454725, "epoch": 2706} {"train_loss": -12.665504455566406, "global_step": 454726, "epoch": 2706} {"train_loss": -12.267269134521484, "global_step": 454727, "epoch": 2706} {"train_loss": -12.647262573242188, "global_step": 454728, "epoch": 2706} {"train_loss": -12.653884887695312, "global_step": 454729, "epoch": 2706} {"train_loss": -12.599112510681152, "global_step": 454730, "epoch": 2706} {"train_loss": -12.503643035888672, "global_step": 454731, "epoch": 2706} {"train_loss": -12.248438835144043, "global_step": 454732, "epoch": 2706} {"train_loss": -12.695984840393066, "global_step": 454733, "epoch": 2706} {"train_loss": -12.689281463623047, "global_step": 454734, "epoch": 2706} {"train_loss": -12.841607093811035, "global_step": 454735, "epoch": 2706} {"train_loss": -12.796046257019043, "global_step": 454736, "epoch": 2706} {"train_loss": -12.744260787963867, "global_step": 454737, "epoch": 2706} {"train_loss": -12.760069847106934, "global_step": 454738, "epoch": 2706} {"train_loss": -12.681197166442871, "global_step": 454739, "epoch": 2706} {"train_loss": -12.740779876708984, "global_step": 454740, "epoch": 2706} {"train_loss": -12.761215209960938, "global_step": 454741, "epoch": 2706} {"train_loss": -12.797089576721191, "global_step": 454742, "epoch": 2706} {"train_loss": -12.625205993652344, "global_step": 454743, "epoch": 2706} {"train_loss": -12.763359069824219, "global_step": 454744, "epoch": 2706} {"train_loss": -12.569487571716309, "global_step": 454745, "epoch": 2706} {"train_loss": -12.651941299438477, "global_step": 454746, "epoch": 2706} {"train_loss": -12.72298812866211, "global_step": 454747, "epoch": 2706} {"train_loss": -12.677175521850586, "global_step": 454748, "epoch": 2706} {"train_loss": -12.837333679199219, "global_step": 454749, "epoch": 2706} {"train_loss": -12.603391647338867, "global_step": 454750, "epoch": 2706} {"train_loss": -12.881577491760254, "global_step": 454751, "epoch": 2706} {"train_loss": -12.681151390075684, "global_step": 454752, "epoch": 2706} {"train_loss": -13.008203506469727, "global_step": 454753, "epoch": 2706} {"train_loss": -12.88673210144043, "global_step": 454754, "epoch": 2706} {"train_loss": -12.870508193969727, "global_step": 454755, "epoch": 2706} {"train_loss": -13.04738712310791, "global_step": 454756, "epoch": 2706} {"train_loss": -12.812786102294922, "global_step": 454757, "epoch": 2706} {"train_loss": -13.017532348632812, "global_step": 454758, "epoch": 2706} {"train_loss": -12.858282089233398, "global_step": 454759, "epoch": 2706} {"train_loss": -12.806442260742188, "global_step": 454760, "epoch": 2706} {"train_loss": -12.794647216796875, "global_step": 454761, "epoch": 2706} {"train_loss": -12.858264923095703, "global_step": 454762, "epoch": 2706} {"train_loss": -12.990339279174805, "global_step": 454763, "epoch": 2706} {"train_loss": -13.021526336669922, "global_step": 454764, "epoch": 2706} {"train_loss": -12.99960708618164, "global_step": 454765, "epoch": 2706} {"train_loss": -12.867931365966797, "global_step": 454766, "epoch": 2706} {"train_loss": -12.876017570495605, "global_step": 454767, "epoch": 2706} {"train_loss": -12.790595054626465, "global_step": 454768, "epoch": 2706} {"train_loss": -12.762052536010742, "global_step": 454769, "epoch": 2706} {"train_loss": -12.688539505004883, "global_step": 454770, "epoch": 2706} {"train_loss": -12.869979858398438, "global_step": 454771, "epoch": 2706} {"train_loss": -12.753925323486328, "global_step": 454772, "epoch": 2706} {"train_loss": -12.841277122497559, "global_step": 454773, "epoch": 2706} {"train_loss": -12.59909725189209, "global_step": 454774, "epoch": 2706} {"train_loss": -12.21491083077022, "global_step": 454775, "epoch": 2706, "val_loss": 313807.53125} {"train_loss": -12.958242416381836, "global_step": 454776, "epoch": 2707} {"train_loss": -12.971927642822266, "global_step": 454777, "epoch": 2707} {"train_loss": -12.834922790527344, "global_step": 454778, "epoch": 2707} {"train_loss": -13.1765718460083, "global_step": 454779, "epoch": 2707} {"train_loss": -12.840775489807129, "global_step": 454780, "epoch": 2707} {"train_loss": -12.616122245788574, "global_step": 454781, "epoch": 2707} {"train_loss": -11.834856033325195, "global_step": 454782, "epoch": 2707} {"train_loss": -11.16500473022461, "global_step": 454783, "epoch": 2707} {"train_loss": -12.531120300292969, "global_step": 454784, "epoch": 2707} {"train_loss": -11.877218246459961, "global_step": 454785, "epoch": 2707} {"train_loss": -9.981949806213379, "global_step": 454786, "epoch": 2707} {"train_loss": -11.727743148803711, "global_step": 454787, "epoch": 2707} {"train_loss": -11.55817699432373, "global_step": 454788, "epoch": 2707} {"train_loss": -11.935089111328125, "global_step": 454789, "epoch": 2707} {"train_loss": -11.790641784667969, "global_step": 454790, "epoch": 2707} {"train_loss": -11.975370407104492, "global_step": 454791, "epoch": 2707} {"train_loss": -10.968969345092773, "global_step": 454792, "epoch": 2707} {"train_loss": -10.90650749206543, "global_step": 454793, "epoch": 2707} {"train_loss": -11.724722862243652, "global_step": 454794, "epoch": 2707} {"train_loss": -11.680801391601562, "global_step": 454795, "epoch": 2707} {"train_loss": -11.481684684753418, "global_step": 454796, "epoch": 2707} {"train_loss": -11.413409233093262, "global_step": 454797, "epoch": 2707} {"train_loss": -11.200549125671387, "global_step": 454798, "epoch": 2707} {"train_loss": -12.25451374053955, "global_step": 454799, "epoch": 2707} {"train_loss": -10.428742408752441, "global_step": 454800, "epoch": 2707} {"train_loss": -10.531471252441406, "global_step": 454801, "epoch": 2707} {"train_loss": -10.59262466430664, "global_step": 454802, "epoch": 2707} {"train_loss": -9.174054145812988, "global_step": 454803, "epoch": 2707} {"train_loss": -11.188129425048828, "global_step": 454804, "epoch": 2707} {"train_loss": -8.880607604980469, "global_step": 454805, "epoch": 2707} {"train_loss": -11.807901382446289, "global_step": 454806, "epoch": 2707} {"train_loss": -7.8436384201049805, "global_step": 454807, "epoch": 2707} {"train_loss": -9.320785522460938, "global_step": 454808, "epoch": 2707} {"train_loss": -9.324609756469727, "global_step": 454809, "epoch": 2707} {"train_loss": -11.229528427124023, "global_step": 454810, "epoch": 2707} {"train_loss": -9.734474182128906, "global_step": 454811, "epoch": 2707} {"train_loss": -11.622299194335938, "global_step": 454812, "epoch": 2707} {"train_loss": -9.111288070678711, "global_step": 454813, "epoch": 2707} {"train_loss": -9.595409393310547, "global_step": 454814, "epoch": 2707} {"train_loss": -7.953060626983643, "global_step": 454815, "epoch": 2707} {"train_loss": -8.229865074157715, "global_step": 454816, "epoch": 2707} {"train_loss": -9.845977783203125, "global_step": 454817, "epoch": 2707} {"train_loss": -9.467763900756836, "global_step": 454818, "epoch": 2707} {"train_loss": -10.552742004394531, "global_step": 454819, "epoch": 2707} {"train_loss": -9.857698440551758, "global_step": 454820, "epoch": 2707} {"train_loss": -10.39041519165039, "global_step": 454821, "epoch": 2707} {"train_loss": -10.574575424194336, "global_step": 454822, "epoch": 2707} {"train_loss": -12.020625114440918, "global_step": 454823, "epoch": 2707} {"train_loss": -11.650405883789062, "global_step": 454824, "epoch": 2707} {"train_loss": -12.250782012939453, "global_step": 454825, "epoch": 2707} {"train_loss": -11.646135330200195, "global_step": 454826, "epoch": 2707} {"train_loss": -11.633709907531738, "global_step": 454827, "epoch": 2707} {"train_loss": -11.456997871398926, "global_step": 454828, "epoch": 2707} {"train_loss": -12.07951831817627, "global_step": 454829, "epoch": 2707} {"train_loss": -12.048501968383789, "global_step": 454830, "epoch": 2707} {"train_loss": -12.114432334899902, "global_step": 454831, "epoch": 2707} {"train_loss": -11.722404479980469, "global_step": 454832, "epoch": 2707} {"train_loss": -11.928727149963379, "global_step": 454833, "epoch": 2707} {"train_loss": -11.967080116271973, "global_step": 454834, "epoch": 2707} {"train_loss": -11.785115242004395, "global_step": 454835, "epoch": 2707} {"train_loss": -11.902044296264648, "global_step": 454836, "epoch": 2707} {"train_loss": -11.90001106262207, "global_step": 454837, "epoch": 2707} {"train_loss": -12.124418258666992, "global_step": 454838, "epoch": 2707} {"train_loss": -12.154640197753906, "global_step": 454839, "epoch": 2707} {"train_loss": -12.177349090576172, "global_step": 454840, "epoch": 2707} {"train_loss": -12.24970817565918, "global_step": 454841, "epoch": 2707} {"train_loss": -12.286149024963379, "global_step": 454842, "epoch": 2707} {"train_loss": -12.160989761352539, "global_step": 454843, "epoch": 2707} {"train_loss": -12.047107696533203, "global_step": 454844, "epoch": 2707} {"train_loss": -12.237001419067383, "global_step": 454845, "epoch": 2707} {"train_loss": -12.458566665649414, "global_step": 454846, "epoch": 2707} {"train_loss": -12.019275665283203, "global_step": 454847, "epoch": 2707} {"train_loss": -12.400611877441406, "global_step": 454848, "epoch": 2707} {"train_loss": -12.024991989135742, "global_step": 454849, "epoch": 2707} {"train_loss": -12.211848258972168, "global_step": 454850, "epoch": 2707} {"train_loss": -12.502283096313477, "global_step": 454851, "epoch": 2707} {"train_loss": -11.9014253616333, "global_step": 454852, "epoch": 2707} {"train_loss": -12.262945175170898, "global_step": 454853, "epoch": 2707} {"train_loss": -12.014900207519531, "global_step": 454854, "epoch": 2707} {"train_loss": -12.50986099243164, "global_step": 454855, "epoch": 2707} {"train_loss": -12.379849433898926, "global_step": 454856, "epoch": 2707} {"train_loss": -12.206916809082031, "global_step": 454857, "epoch": 2707} {"train_loss": -12.37978744506836, "global_step": 454858, "epoch": 2707} {"train_loss": -12.31649112701416, "global_step": 454859, "epoch": 2707} {"train_loss": -12.361148834228516, "global_step": 454860, "epoch": 2707} {"train_loss": -12.247589111328125, "global_step": 454861, "epoch": 2707} {"train_loss": -12.507600784301758, "global_step": 454862, "epoch": 2707} {"train_loss": -12.442428588867188, "global_step": 454863, "epoch": 2707} {"train_loss": -12.494095802307129, "global_step": 454864, "epoch": 2707} {"train_loss": -12.15107536315918, "global_step": 454865, "epoch": 2707} {"train_loss": -12.540181159973145, "global_step": 454866, "epoch": 2707} {"train_loss": -12.339642524719238, "global_step": 454867, "epoch": 2707} {"train_loss": -12.617271423339844, "global_step": 454868, "epoch": 2707} {"train_loss": -12.435949325561523, "global_step": 454869, "epoch": 2707} {"train_loss": -12.587295532226562, "global_step": 454870, "epoch": 2707} {"train_loss": -12.202134132385254, "global_step": 454871, "epoch": 2707} {"train_loss": -12.512496948242188, "global_step": 454872, "epoch": 2707} {"train_loss": -12.522750854492188, "global_step": 454873, "epoch": 2707} {"train_loss": -12.286545753479004, "global_step": 454874, "epoch": 2707} {"train_loss": -12.720405578613281, "global_step": 454875, "epoch": 2707} {"train_loss": -12.37260627746582, "global_step": 454876, "epoch": 2707} {"train_loss": -12.603204727172852, "global_step": 454877, "epoch": 2707} {"train_loss": -12.162543296813965, "global_step": 454878, "epoch": 2707} {"train_loss": -12.39778995513916, "global_step": 454879, "epoch": 2707} {"train_loss": -12.527976989746094, "global_step": 454880, "epoch": 2707} {"train_loss": -12.375327110290527, "global_step": 454881, "epoch": 2707} {"train_loss": -12.602560043334961, "global_step": 454882, "epoch": 2707} {"train_loss": -12.262276649475098, "global_step": 454883, "epoch": 2707} {"train_loss": -12.459423065185547, "global_step": 454884, "epoch": 2707} {"train_loss": -12.358749389648438, "global_step": 454885, "epoch": 2707} {"train_loss": -11.98762321472168, "global_step": 454886, "epoch": 2707} {"train_loss": -12.33557415008545, "global_step": 454887, "epoch": 2707} {"train_loss": -12.05877685546875, "global_step": 454888, "epoch": 2707} {"train_loss": -12.607172966003418, "global_step": 454889, "epoch": 2707} {"train_loss": -12.343942642211914, "global_step": 454890, "epoch": 2707} {"train_loss": -12.473976135253906, "global_step": 454891, "epoch": 2707} {"train_loss": -12.232877731323242, "global_step": 454892, "epoch": 2707} {"train_loss": -11.872915267944336, "global_step": 454893, "epoch": 2707} {"train_loss": -12.357810974121094, "global_step": 454894, "epoch": 2707} {"train_loss": -11.80943775177002, "global_step": 454895, "epoch": 2707} {"train_loss": -11.637256622314453, "global_step": 454896, "epoch": 2707} {"train_loss": -12.271162033081055, "global_step": 454897, "epoch": 2707} {"train_loss": -12.006591796875, "global_step": 454898, "epoch": 2707} {"train_loss": -12.25381088256836, "global_step": 454899, "epoch": 2707} {"train_loss": -12.388607025146484, "global_step": 454900, "epoch": 2707} {"train_loss": -12.330981254577637, "global_step": 454901, "epoch": 2707} {"train_loss": -12.494991302490234, "global_step": 454902, "epoch": 2707} {"train_loss": -12.803300857543945, "global_step": 454903, "epoch": 2707} {"train_loss": -12.579804420471191, "global_step": 454904, "epoch": 2707} {"train_loss": -12.759689331054688, "global_step": 454905, "epoch": 2707} {"train_loss": -12.783711433410645, "global_step": 454906, "epoch": 2707} {"train_loss": -12.573953628540039, "global_step": 454907, "epoch": 2707} {"train_loss": -12.49760913848877, "global_step": 454908, "epoch": 2707} {"train_loss": -12.714471817016602, "global_step": 454909, "epoch": 2707} {"train_loss": -12.54153823852539, "global_step": 454910, "epoch": 2707} {"train_loss": -12.608882904052734, "global_step": 454911, "epoch": 2707} {"train_loss": -12.723777770996094, "global_step": 454912, "epoch": 2707} {"train_loss": -12.62452507019043, "global_step": 454913, "epoch": 2707} {"train_loss": -12.358344078063965, "global_step": 454914, "epoch": 2707} {"train_loss": -12.520051002502441, "global_step": 454915, "epoch": 2707} {"train_loss": -12.52469253540039, "global_step": 454916, "epoch": 2707} {"train_loss": -12.478784561157227, "global_step": 454917, "epoch": 2707} {"train_loss": -12.474841117858887, "global_step": 454918, "epoch": 2707} {"train_loss": -12.352234840393066, "global_step": 454919, "epoch": 2707} {"train_loss": -12.833318710327148, "global_step": 454920, "epoch": 2707} {"train_loss": -12.638816833496094, "global_step": 454921, "epoch": 2707} {"train_loss": -12.558490753173828, "global_step": 454922, "epoch": 2707} {"train_loss": -12.567697525024414, "global_step": 454923, "epoch": 2707} {"train_loss": -12.741987228393555, "global_step": 454924, "epoch": 2707} {"train_loss": -12.801124572753906, "global_step": 454925, "epoch": 2707} {"train_loss": -12.835919380187988, "global_step": 454926, "epoch": 2707} {"train_loss": -12.788101196289062, "global_step": 454927, "epoch": 2707} {"train_loss": -12.922637939453125, "global_step": 454928, "epoch": 2707} {"train_loss": -12.733491897583008, "global_step": 454929, "epoch": 2707} {"train_loss": -12.712329864501953, "global_step": 454930, "epoch": 2707} {"train_loss": -12.771594047546387, "global_step": 454931, "epoch": 2707} {"train_loss": -12.969595909118652, "global_step": 454932, "epoch": 2707} {"train_loss": -12.740425109863281, "global_step": 454933, "epoch": 2707} {"train_loss": -12.596244812011719, "global_step": 454934, "epoch": 2707} {"train_loss": -12.820087432861328, "global_step": 454935, "epoch": 2707} {"train_loss": -12.955477714538574, "global_step": 454936, "epoch": 2707} {"train_loss": -12.675134658813477, "global_step": 454937, "epoch": 2707} {"train_loss": -12.701089859008789, "global_step": 454938, "epoch": 2707} {"train_loss": -12.91713809967041, "global_step": 454939, "epoch": 2707} {"train_loss": -12.57235050201416, "global_step": 454940, "epoch": 2707} {"train_loss": -12.297725677490234, "global_step": 454941, "epoch": 2707} {"train_loss": -12.001477241516113, "global_step": 454942, "epoch": 2707} {"train_loss": -11.957763998281388, "global_step": 454943, "epoch": 2707, "val_loss": 314104.21875} {"train_loss": -12.896020889282227, "global_step": 454944, "epoch": 2708} {"train_loss": -12.563804626464844, "global_step": 454945, "epoch": 2708} {"train_loss": -12.725936889648438, "global_step": 454946, "epoch": 2708} {"train_loss": -12.660282135009766, "global_step": 454947, "epoch": 2708} {"train_loss": -12.477194786071777, "global_step": 454948, "epoch": 2708} {"train_loss": -12.77767562866211, "global_step": 454949, "epoch": 2708} {"train_loss": -11.961088180541992, "global_step": 454950, "epoch": 2708} {"train_loss": -10.843358993530273, "global_step": 454951, "epoch": 2708} {"train_loss": -11.90725040435791, "global_step": 454952, "epoch": 2708} {"train_loss": -12.712519645690918, "global_step": 454953, "epoch": 2708} {"train_loss": -12.564697265625, "global_step": 454954, "epoch": 2708} {"train_loss": -12.442879676818848, "global_step": 454955, "epoch": 2708} {"train_loss": -12.751981735229492, "global_step": 454956, "epoch": 2708} {"train_loss": -12.860746383666992, "global_step": 454957, "epoch": 2708} {"train_loss": -12.714278221130371, "global_step": 454958, "epoch": 2708} {"train_loss": -12.938100814819336, "global_step": 454959, "epoch": 2708} {"train_loss": -12.339054107666016, "global_step": 454960, "epoch": 2708} {"train_loss": -12.416614532470703, "global_step": 454961, "epoch": 2708} {"train_loss": -12.23896598815918, "global_step": 454962, "epoch": 2708} {"train_loss": -12.219430923461914, "global_step": 454963, "epoch": 2708} {"train_loss": -12.45614242553711, "global_step": 454964, "epoch": 2708} {"train_loss": -11.639287948608398, "global_step": 454965, "epoch": 2708} {"train_loss": -12.16598892211914, "global_step": 454966, "epoch": 2708} {"train_loss": -11.70871353149414, "global_step": 454967, "epoch": 2708} {"train_loss": -12.460328102111816, "global_step": 454968, "epoch": 2708} {"train_loss": -10.500774383544922, "global_step": 454969, "epoch": 2708} {"train_loss": -12.432846069335938, "global_step": 454970, "epoch": 2708} {"train_loss": -11.574813842773438, "global_step": 454971, "epoch": 2708} {"train_loss": -11.674020767211914, "global_step": 454972, "epoch": 2708} {"train_loss": -11.92782211303711, "global_step": 454973, "epoch": 2708} {"train_loss": -11.341672897338867, "global_step": 454974, "epoch": 2708} {"train_loss": -11.549135208129883, "global_step": 454975, "epoch": 2708} {"train_loss": -11.222172737121582, "global_step": 454976, "epoch": 2708} {"train_loss": -12.573460578918457, "global_step": 454977, "epoch": 2708} {"train_loss": -10.354186058044434, "global_step": 454978, "epoch": 2708} {"train_loss": -11.937737464904785, "global_step": 454979, "epoch": 2708} {"train_loss": -11.659063339233398, "global_step": 454980, "epoch": 2708} {"train_loss": -11.616280555725098, "global_step": 454981, "epoch": 2708} {"train_loss": -12.662694931030273, "global_step": 454982, "epoch": 2708} {"train_loss": -11.228175163269043, "global_step": 454983, "epoch": 2708} {"train_loss": -10.55356216430664, "global_step": 454984, "epoch": 2708} {"train_loss": -12.174038887023926, "global_step": 454985, "epoch": 2708} {"train_loss": -11.111713409423828, "global_step": 454986, "epoch": 2708} {"train_loss": -11.051922798156738, "global_step": 454987, "epoch": 2708} {"train_loss": -12.233026504516602, "global_step": 454988, "epoch": 2708} {"train_loss": -11.056451797485352, "global_step": 454989, "epoch": 2708} {"train_loss": -11.382820129394531, "global_step": 454990, "epoch": 2708} {"train_loss": -12.070714950561523, "global_step": 454991, "epoch": 2708} {"train_loss": -11.989961624145508, "global_step": 454992, "epoch": 2708} {"train_loss": -11.887057304382324, "global_step": 454993, "epoch": 2708} {"train_loss": -11.596504211425781, "global_step": 454994, "epoch": 2708} {"train_loss": -12.212051391601562, "global_step": 454995, "epoch": 2708} {"train_loss": -11.201254844665527, "global_step": 454996, "epoch": 2708} {"train_loss": -11.222517967224121, "global_step": 454997, "epoch": 2708} {"train_loss": -11.883930206298828, "global_step": 454998, "epoch": 2708} {"train_loss": -11.151873588562012, "global_step": 454999, "epoch": 2708} {"train_loss": -11.573122024536133, "global_step": 455000, "epoch": 2708} {"train_loss": -10.643284797668457, "global_step": 455001, "epoch": 2708} {"train_loss": -9.762018203735352, "global_step": 455002, "epoch": 2708} {"train_loss": -11.365848541259766, "global_step": 455003, "epoch": 2708} {"train_loss": -11.067458152770996, "global_step": 455004, "epoch": 2708} {"train_loss": -10.778291702270508, "global_step": 455005, "epoch": 2708} {"train_loss": -11.694982528686523, "global_step": 455006, "epoch": 2708} {"train_loss": -11.520076751708984, "global_step": 455007, "epoch": 2708} {"train_loss": -11.671846389770508, "global_step": 455008, "epoch": 2708} {"train_loss": -11.747455596923828, "global_step": 455009, "epoch": 2708} {"train_loss": -11.77511978149414, "global_step": 455010, "epoch": 2708} {"train_loss": -12.214336395263672, "global_step": 455011, "epoch": 2708} {"train_loss": -11.666733741760254, "global_step": 455012, "epoch": 2708} {"train_loss": -12.20659065246582, "global_step": 455013, "epoch": 2708} {"train_loss": -11.500272750854492, "global_step": 455014, "epoch": 2708} {"train_loss": -12.340557098388672, "global_step": 455015, "epoch": 2708} {"train_loss": -12.010346412658691, "global_step": 455016, "epoch": 2708} {"train_loss": -11.92668628692627, "global_step": 455017, "epoch": 2708} {"train_loss": -11.924877166748047, "global_step": 455018, "epoch": 2708} {"train_loss": -11.949969291687012, "global_step": 455019, "epoch": 2708} {"train_loss": -12.265581130981445, "global_step": 455020, "epoch": 2708} {"train_loss": -11.499368667602539, "global_step": 455021, "epoch": 2708} {"train_loss": -12.278013229370117, "global_step": 455022, "epoch": 2708} {"train_loss": -11.308095932006836, "global_step": 455023, "epoch": 2708} {"train_loss": -12.155464172363281, "global_step": 455024, "epoch": 2708} {"train_loss": -11.604595184326172, "global_step": 455025, "epoch": 2708} {"train_loss": -12.117820739746094, "global_step": 455026, "epoch": 2708} {"train_loss": -11.333576202392578, "global_step": 455027, "epoch": 2708} {"train_loss": -11.555432319641113, "global_step": 455028, "epoch": 2708} {"train_loss": -12.062475204467773, "global_step": 455029, "epoch": 2708} {"train_loss": -12.108114242553711, "global_step": 455030, "epoch": 2708} {"train_loss": -11.888606071472168, "global_step": 455031, "epoch": 2708} {"train_loss": -11.462738037109375, "global_step": 455032, "epoch": 2708} {"train_loss": -12.296960830688477, "global_step": 455033, "epoch": 2708} {"train_loss": -11.745879173278809, "global_step": 455034, "epoch": 2708} {"train_loss": -12.42868423461914, "global_step": 455035, "epoch": 2708} {"train_loss": -11.54557991027832, "global_step": 455036, "epoch": 2708} {"train_loss": -12.07595157623291, "global_step": 455037, "epoch": 2708} {"train_loss": -12.036491394042969, "global_step": 455038, "epoch": 2708} {"train_loss": -12.239877700805664, "global_step": 455039, "epoch": 2708} {"train_loss": -11.90454387664795, "global_step": 455040, "epoch": 2708} {"train_loss": -11.84256649017334, "global_step": 455041, "epoch": 2708} {"train_loss": -11.927254676818848, "global_step": 455042, "epoch": 2708} {"train_loss": -11.024338722229004, "global_step": 455043, "epoch": 2708} {"train_loss": -12.610759735107422, "global_step": 455044, "epoch": 2708} {"train_loss": -11.817524909973145, "global_step": 455045, "epoch": 2708} {"train_loss": -12.07419204711914, "global_step": 455046, "epoch": 2708} {"train_loss": -11.28343391418457, "global_step": 455047, "epoch": 2708} {"train_loss": -12.11142349243164, "global_step": 455048, "epoch": 2708} {"train_loss": -11.15782356262207, "global_step": 455049, "epoch": 2708} {"train_loss": -12.188421249389648, "global_step": 455050, "epoch": 2708} {"train_loss": -11.282095909118652, "global_step": 455051, "epoch": 2708} {"train_loss": -11.999313354492188, "global_step": 455052, "epoch": 2708} {"train_loss": -12.108631134033203, "global_step": 455053, "epoch": 2708} {"train_loss": -11.784510612487793, "global_step": 455054, "epoch": 2708} {"train_loss": -12.336734771728516, "global_step": 455055, "epoch": 2708} {"train_loss": -11.717238426208496, "global_step": 455056, "epoch": 2708} {"train_loss": -12.073780059814453, "global_step": 455057, "epoch": 2708} {"train_loss": -12.13698959350586, "global_step": 455058, "epoch": 2708} {"train_loss": -11.890085220336914, "global_step": 455059, "epoch": 2708} {"train_loss": -11.795515060424805, "global_step": 455060, "epoch": 2708} {"train_loss": -12.084634780883789, "global_step": 455061, "epoch": 2708} {"train_loss": -11.884750366210938, "global_step": 455062, "epoch": 2708} {"train_loss": -12.033475875854492, "global_step": 455063, "epoch": 2708} {"train_loss": -11.765023231506348, "global_step": 455064, "epoch": 2708} {"train_loss": -12.236963272094727, "global_step": 455065, "epoch": 2708} {"train_loss": -11.720746994018555, "global_step": 455066, "epoch": 2708} {"train_loss": -12.410987854003906, "global_step": 455067, "epoch": 2708} {"train_loss": -12.119474411010742, "global_step": 455068, "epoch": 2708} {"train_loss": -11.892428398132324, "global_step": 455069, "epoch": 2708} {"train_loss": -11.709226608276367, "global_step": 455070, "epoch": 2708} {"train_loss": -11.84934139251709, "global_step": 455071, "epoch": 2708} {"train_loss": -11.067720413208008, "global_step": 455072, "epoch": 2708} {"train_loss": -11.619236946105957, "global_step": 455073, "epoch": 2708} {"train_loss": -10.896551132202148, "global_step": 455074, "epoch": 2708} {"train_loss": -11.413345336914062, "global_step": 455075, "epoch": 2708} {"train_loss": -11.114786148071289, "global_step": 455076, "epoch": 2708} {"train_loss": -11.532440185546875, "global_step": 455077, "epoch": 2708} {"train_loss": -11.943039894104004, "global_step": 455078, "epoch": 2708} {"train_loss": -11.421334266662598, "global_step": 455079, "epoch": 2708} {"train_loss": -11.75984001159668, "global_step": 455080, "epoch": 2708} {"train_loss": -11.390339851379395, "global_step": 455081, "epoch": 2708} {"train_loss": -12.013639450073242, "global_step": 455082, "epoch": 2708} {"train_loss": -11.64655876159668, "global_step": 455083, "epoch": 2708} {"train_loss": -12.01176929473877, "global_step": 455084, "epoch": 2708} {"train_loss": -12.171929359436035, "global_step": 455085, "epoch": 2708} {"train_loss": -12.321163177490234, "global_step": 455086, "epoch": 2708} {"train_loss": -11.878053665161133, "global_step": 455087, "epoch": 2708} {"train_loss": -12.270816802978516, "global_step": 455088, "epoch": 2708} {"train_loss": -11.818127632141113, "global_step": 455089, "epoch": 2708} {"train_loss": -12.117212295532227, "global_step": 455090, "epoch": 2708} {"train_loss": -12.2072172164917, "global_step": 455091, "epoch": 2708} {"train_loss": -12.183752059936523, "global_step": 455092, "epoch": 2708} {"train_loss": -11.992464065551758, "global_step": 455093, "epoch": 2708} {"train_loss": -12.060537338256836, "global_step": 455094, "epoch": 2708} {"train_loss": -11.932295799255371, "global_step": 455095, "epoch": 2708} {"train_loss": -12.139017105102539, "global_step": 455096, "epoch": 2708} {"train_loss": -12.067583084106445, "global_step": 455097, "epoch": 2708} {"train_loss": -12.267068862915039, "global_step": 455098, "epoch": 2708} {"train_loss": -12.304494857788086, "global_step": 455099, "epoch": 2708} {"train_loss": -12.463651657104492, "global_step": 455100, "epoch": 2708} {"train_loss": -12.231664657592773, "global_step": 455101, "epoch": 2708} {"train_loss": -12.384553909301758, "global_step": 455102, "epoch": 2708} {"train_loss": -12.264623641967773, "global_step": 455103, "epoch": 2708} {"train_loss": -12.42660903930664, "global_step": 455104, "epoch": 2708} {"train_loss": -12.116086959838867, "global_step": 455105, "epoch": 2708} {"train_loss": -12.581053733825684, "global_step": 455106, "epoch": 2708} {"train_loss": -12.73507308959961, "global_step": 455107, "epoch": 2708} {"train_loss": -12.503238677978516, "global_step": 455108, "epoch": 2708} {"train_loss": -12.62865161895752, "global_step": 455109, "epoch": 2708} {"train_loss": -12.66498851776123, "global_step": 455110, "epoch": 2708} {"train_loss": -11.903018576758248, "global_step": 455111, "epoch": 2708, "val_loss": 313067.0625} {"train_loss": -12.571020126342773, "global_step": 455112, "epoch": 2709} {"train_loss": -12.620084762573242, "global_step": 455113, "epoch": 2709} {"train_loss": -12.803121566772461, "global_step": 455114, "epoch": 2709} {"train_loss": -12.610008239746094, "global_step": 455115, "epoch": 2709} {"train_loss": -12.673945426940918, "global_step": 455116, "epoch": 2709} {"train_loss": -12.649391174316406, "global_step": 455117, "epoch": 2709} {"train_loss": -12.577479362487793, "global_step": 455118, "epoch": 2709} {"train_loss": -12.637096405029297, "global_step": 455119, "epoch": 2709} {"train_loss": -12.638542175292969, "global_step": 455120, "epoch": 2709} {"train_loss": -12.711406707763672, "global_step": 455121, "epoch": 2709} {"train_loss": -12.549460411071777, "global_step": 455122, "epoch": 2709} {"train_loss": -12.658970832824707, "global_step": 455123, "epoch": 2709} {"train_loss": -12.802627563476562, "global_step": 455124, "epoch": 2709} {"train_loss": -12.714274406433105, "global_step": 455125, "epoch": 2709} {"train_loss": -12.766874313354492, "global_step": 455126, "epoch": 2709} {"train_loss": -12.816963195800781, "global_step": 455127, "epoch": 2709} {"train_loss": -12.791803359985352, "global_step": 455128, "epoch": 2709} {"train_loss": -12.675148963928223, "global_step": 455129, "epoch": 2709} {"train_loss": -12.928890228271484, "global_step": 455130, "epoch": 2709} {"train_loss": -13.075494766235352, "global_step": 455131, "epoch": 2709} {"train_loss": -12.792953491210938, "global_step": 455132, "epoch": 2709} {"train_loss": -12.887432098388672, "global_step": 455133, "epoch": 2709} {"train_loss": -12.801836013793945, "global_step": 455134, "epoch": 2709} {"train_loss": -12.673284530639648, "global_step": 455135, "epoch": 2709} {"train_loss": -12.800901412963867, "global_step": 455136, "epoch": 2709} {"train_loss": -12.94373893737793, "global_step": 455137, "epoch": 2709} {"train_loss": -12.79010009765625, "global_step": 455138, "epoch": 2709} {"train_loss": -13.007634162902832, "global_step": 455139, "epoch": 2709} {"train_loss": -12.81932258605957, "global_step": 455140, "epoch": 2709} {"train_loss": -12.816411018371582, "global_step": 455141, "epoch": 2709} {"train_loss": -12.835896492004395, "global_step": 455142, "epoch": 2709} {"train_loss": -12.839337348937988, "global_step": 455143, "epoch": 2709} {"train_loss": -12.821615219116211, "global_step": 455144, "epoch": 2709} {"train_loss": -12.88127326965332, "global_step": 455145, "epoch": 2709} {"train_loss": -12.581624031066895, "global_step": 455146, "epoch": 2709} {"train_loss": -12.647056579589844, "global_step": 455147, "epoch": 2709} {"train_loss": -12.596906661987305, "global_step": 455148, "epoch": 2709} {"train_loss": -12.350767135620117, "global_step": 455149, "epoch": 2709} {"train_loss": -12.547487258911133, "global_step": 455150, "epoch": 2709} {"train_loss": -12.761115074157715, "global_step": 455151, "epoch": 2709} {"train_loss": -12.41438102722168, "global_step": 455152, "epoch": 2709} {"train_loss": -12.929381370544434, "global_step": 455153, "epoch": 2709} {"train_loss": -12.4735689163208, "global_step": 455154, "epoch": 2709} {"train_loss": -12.187593460083008, "global_step": 455155, "epoch": 2709} {"train_loss": -12.844354629516602, "global_step": 455156, "epoch": 2709} {"train_loss": -12.94709587097168, "global_step": 455157, "epoch": 2709} {"train_loss": -12.621626853942871, "global_step": 455158, "epoch": 2709} {"train_loss": -12.754311561584473, "global_step": 455159, "epoch": 2709} {"train_loss": -12.860706329345703, "global_step": 455160, "epoch": 2709} {"train_loss": -13.01054859161377, "global_step": 455161, "epoch": 2709} {"train_loss": -12.85664176940918, "global_step": 455162, "epoch": 2709} {"train_loss": -13.105756759643555, "global_step": 455163, "epoch": 2709} {"train_loss": -12.924493789672852, "global_step": 455164, "epoch": 2709} {"train_loss": -12.723302841186523, "global_step": 455165, "epoch": 2709} {"train_loss": -12.772493362426758, "global_step": 455166, "epoch": 2709} {"train_loss": -13.024532318115234, "global_step": 455167, "epoch": 2709} {"train_loss": -12.670467376708984, "global_step": 455168, "epoch": 2709} {"train_loss": -12.507789611816406, "global_step": 455169, "epoch": 2709} {"train_loss": -11.218189239501953, "global_step": 455170, "epoch": 2709} {"train_loss": -12.234525680541992, "global_step": 455171, "epoch": 2709} {"train_loss": -12.724464416503906, "global_step": 455172, "epoch": 2709} {"train_loss": -11.806342124938965, "global_step": 455173, "epoch": 2709} {"train_loss": -10.417363166809082, "global_step": 455174, "epoch": 2709} {"train_loss": -12.125417709350586, "global_step": 455175, "epoch": 2709} {"train_loss": -12.498289108276367, "global_step": 455176, "epoch": 2709} {"train_loss": -11.751860618591309, "global_step": 455177, "epoch": 2709} {"train_loss": -11.205822944641113, "global_step": 455178, "epoch": 2709} {"train_loss": -12.00741958618164, "global_step": 455179, "epoch": 2709} {"train_loss": -12.133964538574219, "global_step": 455180, "epoch": 2709} {"train_loss": -11.412458419799805, "global_step": 455181, "epoch": 2709} {"train_loss": -11.144363403320312, "global_step": 455182, "epoch": 2709} {"train_loss": -11.643165588378906, "global_step": 455183, "epoch": 2709} {"train_loss": -11.496917724609375, "global_step": 455184, "epoch": 2709} {"train_loss": -10.256178855895996, "global_step": 455185, "epoch": 2709} {"train_loss": -11.398490905761719, "global_step": 455186, "epoch": 2709} {"train_loss": -9.754058837890625, "global_step": 455187, "epoch": 2709} {"train_loss": -10.169256210327148, "global_step": 455188, "epoch": 2709} {"train_loss": -8.032310485839844, "global_step": 455189, "epoch": 2709} {"train_loss": -8.765722274780273, "global_step": 455190, "epoch": 2709} {"train_loss": -8.831331253051758, "global_step": 455191, "epoch": 2709} {"train_loss": -8.949530601501465, "global_step": 455192, "epoch": 2709} {"train_loss": -11.031768798828125, "global_step": 455193, "epoch": 2709} {"train_loss": -9.207353591918945, "global_step": 455194, "epoch": 2709} {"train_loss": -9.587068557739258, "global_step": 455195, "epoch": 2709} {"train_loss": -11.274109840393066, "global_step": 455196, "epoch": 2709} {"train_loss": -10.078176498413086, "global_step": 455197, "epoch": 2709} {"train_loss": -9.460617065429688, "global_step": 455198, "epoch": 2709} {"train_loss": -11.227303504943848, "global_step": 455199, "epoch": 2709} {"train_loss": -10.935155868530273, "global_step": 455200, "epoch": 2709} {"train_loss": -11.57370376586914, "global_step": 455201, "epoch": 2709} {"train_loss": -11.335884094238281, "global_step": 455202, "epoch": 2709} {"train_loss": -10.920516967773438, "global_step": 455203, "epoch": 2709} {"train_loss": -11.656364440917969, "global_step": 455204, "epoch": 2709} {"train_loss": -11.080121994018555, "global_step": 455205, "epoch": 2709} {"train_loss": -11.510981559753418, "global_step": 455206, "epoch": 2709} {"train_loss": -11.765865325927734, "global_step": 455207, "epoch": 2709} {"train_loss": -11.596389770507812, "global_step": 455208, "epoch": 2709} {"train_loss": -11.998540878295898, "global_step": 455209, "epoch": 2709} {"train_loss": -11.404657363891602, "global_step": 455210, "epoch": 2709} {"train_loss": -11.653360366821289, "global_step": 455211, "epoch": 2709} {"train_loss": -12.035102844238281, "global_step": 455212, "epoch": 2709} {"train_loss": -11.885846138000488, "global_step": 455213, "epoch": 2709} {"train_loss": -12.369379997253418, "global_step": 455214, "epoch": 2709} {"train_loss": -12.192270278930664, "global_step": 455215, "epoch": 2709} {"train_loss": -12.29053020477295, "global_step": 455216, "epoch": 2709} {"train_loss": -12.267129898071289, "global_step": 455217, "epoch": 2709} {"train_loss": -12.32809829711914, "global_step": 455218, "epoch": 2709} {"train_loss": -12.131352424621582, "global_step": 455219, "epoch": 2709} {"train_loss": -11.684013366699219, "global_step": 455220, "epoch": 2709} {"train_loss": -12.360095024108887, "global_step": 455221, "epoch": 2709} {"train_loss": -11.815051078796387, "global_step": 455222, "epoch": 2709} {"train_loss": -12.562986373901367, "global_step": 455223, "epoch": 2709} {"train_loss": -12.267707824707031, "global_step": 455224, "epoch": 2709} {"train_loss": -12.35594654083252, "global_step": 455225, "epoch": 2709} {"train_loss": -12.327807426452637, "global_step": 455226, "epoch": 2709} {"train_loss": -12.506620407104492, "global_step": 455227, "epoch": 2709} {"train_loss": -12.551206588745117, "global_step": 455228, "epoch": 2709} {"train_loss": -12.423154830932617, "global_step": 455229, "epoch": 2709} {"train_loss": -12.267284393310547, "global_step": 455230, "epoch": 2709} {"train_loss": -12.509729385375977, "global_step": 455231, "epoch": 2709} {"train_loss": -12.566640853881836, "global_step": 455232, "epoch": 2709} {"train_loss": -12.607107162475586, "global_step": 455233, "epoch": 2709} {"train_loss": -12.541378021240234, "global_step": 455234, "epoch": 2709} {"train_loss": -12.58243179321289, "global_step": 455235, "epoch": 2709} {"train_loss": -12.568069458007812, "global_step": 455236, "epoch": 2709} {"train_loss": -12.45890998840332, "global_step": 455237, "epoch": 2709} {"train_loss": -12.760823249816895, "global_step": 455238, "epoch": 2709} {"train_loss": -12.48675537109375, "global_step": 455239, "epoch": 2709} {"train_loss": -12.617252349853516, "global_step": 455240, "epoch": 2709} {"train_loss": -12.404791831970215, "global_step": 455241, "epoch": 2709} {"train_loss": -12.748466491699219, "global_step": 455242, "epoch": 2709} {"train_loss": -12.537836074829102, "global_step": 455243, "epoch": 2709} {"train_loss": -12.656421661376953, "global_step": 455244, "epoch": 2709} {"train_loss": -12.71444320678711, "global_step": 455245, "epoch": 2709} {"train_loss": -12.659555435180664, "global_step": 455246, "epoch": 2709} {"train_loss": -12.873245239257812, "global_step": 455247, "epoch": 2709} {"train_loss": -12.534141540527344, "global_step": 455248, "epoch": 2709} {"train_loss": -12.792461395263672, "global_step": 455249, "epoch": 2709} {"train_loss": -12.682077407836914, "global_step": 455250, "epoch": 2709} {"train_loss": -12.51247787475586, "global_step": 455251, "epoch": 2709} {"train_loss": -12.756406784057617, "global_step": 455252, "epoch": 2709} {"train_loss": -12.713088989257812, "global_step": 455253, "epoch": 2709} {"train_loss": -12.85861587524414, "global_step": 455254, "epoch": 2709} {"train_loss": -12.644177436828613, "global_step": 455255, "epoch": 2709} {"train_loss": -12.776043891906738, "global_step": 455256, "epoch": 2709} {"train_loss": -12.604362487792969, "global_step": 455257, "epoch": 2709} {"train_loss": -12.922496795654297, "global_step": 455258, "epoch": 2709} {"train_loss": -12.930896759033203, "global_step": 455259, "epoch": 2709} {"train_loss": -12.904974937438965, "global_step": 455260, "epoch": 2709} {"train_loss": -12.674391746520996, "global_step": 455261, "epoch": 2709} {"train_loss": -12.92508316040039, "global_step": 455262, "epoch": 2709} {"train_loss": -12.744762420654297, "global_step": 455263, "epoch": 2709} {"train_loss": -12.949816703796387, "global_step": 455264, "epoch": 2709} {"train_loss": -12.851887702941895, "global_step": 455265, "epoch": 2709} {"train_loss": -12.944849967956543, "global_step": 455266, "epoch": 2709} {"train_loss": -12.928421974182129, "global_step": 455267, "epoch": 2709} {"train_loss": -12.80086898803711, "global_step": 455268, "epoch": 2709} {"train_loss": -12.971506118774414, "global_step": 455269, "epoch": 2709} {"train_loss": -12.737713813781738, "global_step": 455270, "epoch": 2709} {"train_loss": -12.906983375549316, "global_step": 455271, "epoch": 2709} {"train_loss": -12.935458183288574, "global_step": 455272, "epoch": 2709} {"train_loss": -12.988025665283203, "global_step": 455273, "epoch": 2709} {"train_loss": -13.084784507751465, "global_step": 455274, "epoch": 2709} {"train_loss": -13.023292541503906, "global_step": 455275, "epoch": 2709} {"train_loss": -12.83541488647461, "global_step": 455276, "epoch": 2709} {"train_loss": -12.710254669189453, "global_step": 455277, "epoch": 2709} {"train_loss": -12.964776992797852, "global_step": 455278, "epoch": 2709} {"train_loss": -12.24952709107172, "global_step": 455279, "epoch": 2709, "val_loss": 314623.5625} {"train_loss": -12.723871231079102, "global_step": 455280, "epoch": 2710} {"train_loss": -12.668304443359375, "global_step": 455281, "epoch": 2710} {"train_loss": -12.959304809570312, "global_step": 455282, "epoch": 2710} {"train_loss": -12.74117660522461, "global_step": 455283, "epoch": 2710} {"train_loss": -12.497161865234375, "global_step": 455284, "epoch": 2710} {"train_loss": -12.61804485321045, "global_step": 455285, "epoch": 2710} {"train_loss": -12.915998458862305, "global_step": 455286, "epoch": 2710} {"train_loss": -12.54573917388916, "global_step": 455287, "epoch": 2710} {"train_loss": -12.077969551086426, "global_step": 455288, "epoch": 2710} {"train_loss": -12.280532836914062, "global_step": 455289, "epoch": 2710} {"train_loss": -12.672744750976562, "global_step": 455290, "epoch": 2710} {"train_loss": -12.477601051330566, "global_step": 455291, "epoch": 2710} {"train_loss": -12.690030097961426, "global_step": 455292, "epoch": 2710} {"train_loss": -12.878218650817871, "global_step": 455293, "epoch": 2710} {"train_loss": -12.69133472442627, "global_step": 455294, "epoch": 2710} {"train_loss": -12.498690605163574, "global_step": 455295, "epoch": 2710} {"train_loss": -12.874574661254883, "global_step": 455296, "epoch": 2710} {"train_loss": -12.688764572143555, "global_step": 455297, "epoch": 2710} {"train_loss": -12.832908630371094, "global_step": 455298, "epoch": 2710} {"train_loss": -12.57284164428711, "global_step": 455299, "epoch": 2710} {"train_loss": -12.497659683227539, "global_step": 455300, "epoch": 2710} {"train_loss": -12.840874671936035, "global_step": 455301, "epoch": 2710} {"train_loss": -12.767651557922363, "global_step": 455302, "epoch": 2710} {"train_loss": -12.6414794921875, "global_step": 455303, "epoch": 2710} {"train_loss": -12.973993301391602, "global_step": 455304, "epoch": 2710} {"train_loss": -12.762231826782227, "global_step": 455305, "epoch": 2710} {"train_loss": -12.346163749694824, "global_step": 455306, "epoch": 2710} {"train_loss": -12.635896682739258, "global_step": 455307, "epoch": 2710} {"train_loss": -12.735002517700195, "global_step": 455308, "epoch": 2710} {"train_loss": -12.352964401245117, "global_step": 455309, "epoch": 2710} {"train_loss": -12.43209457397461, "global_step": 455310, "epoch": 2710} {"train_loss": -13.119757652282715, "global_step": 455311, "epoch": 2710} {"train_loss": -12.646427154541016, "global_step": 455312, "epoch": 2710} {"train_loss": -12.608354568481445, "global_step": 455313, "epoch": 2710} {"train_loss": -12.87605094909668, "global_step": 455314, "epoch": 2710} {"train_loss": -12.995718002319336, "global_step": 455315, "epoch": 2710} {"train_loss": -12.562060356140137, "global_step": 455316, "epoch": 2710} {"train_loss": -12.43514633178711, "global_step": 455317, "epoch": 2710} {"train_loss": -11.550737380981445, "global_step": 455318, "epoch": 2710} {"train_loss": -12.457014083862305, "global_step": 455319, "epoch": 2710} {"train_loss": -12.50888442993164, "global_step": 455320, "epoch": 2710} {"train_loss": -12.209115982055664, "global_step": 455321, "epoch": 2710} {"train_loss": -11.3326416015625, "global_step": 455322, "epoch": 2710} {"train_loss": -12.924504280090332, "global_step": 455323, "epoch": 2710} {"train_loss": -12.565485000610352, "global_step": 455324, "epoch": 2710} {"train_loss": -12.077617645263672, "global_step": 455325, "epoch": 2710} {"train_loss": -10.766985893249512, "global_step": 455326, "epoch": 2710} {"train_loss": -12.262825012207031, "global_step": 455327, "epoch": 2710} {"train_loss": -12.107344627380371, "global_step": 455328, "epoch": 2710} {"train_loss": -12.013944625854492, "global_step": 455329, "epoch": 2710} {"train_loss": -11.938535690307617, "global_step": 455330, "epoch": 2710} {"train_loss": -12.617382049560547, "global_step": 455331, "epoch": 2710} {"train_loss": -12.256586074829102, "global_step": 455332, "epoch": 2710} {"train_loss": -12.589725494384766, "global_step": 455333, "epoch": 2710} {"train_loss": -12.032206535339355, "global_step": 455334, "epoch": 2710} {"train_loss": -12.883103370666504, "global_step": 455335, "epoch": 2710} {"train_loss": -12.019338607788086, "global_step": 455336, "epoch": 2710} {"train_loss": -11.523011207580566, "global_step": 455337, "epoch": 2710} {"train_loss": -11.146806716918945, "global_step": 455338, "epoch": 2710} {"train_loss": -12.098428726196289, "global_step": 455339, "epoch": 2710} {"train_loss": -12.518978118896484, "global_step": 455340, "epoch": 2710} {"train_loss": -10.842926025390625, "global_step": 455341, "epoch": 2710} {"train_loss": -10.788726806640625, "global_step": 455342, "epoch": 2710} {"train_loss": -11.669057846069336, "global_step": 455343, "epoch": 2710} {"train_loss": -12.025396347045898, "global_step": 455344, "epoch": 2710} {"train_loss": -11.06318473815918, "global_step": 455345, "epoch": 2710} {"train_loss": -12.051528930664062, "global_step": 455346, "epoch": 2710} {"train_loss": -12.181631088256836, "global_step": 455347, "epoch": 2710} {"train_loss": -10.979665756225586, "global_step": 455348, "epoch": 2710} {"train_loss": -12.141812324523926, "global_step": 455349, "epoch": 2710} {"train_loss": -11.876699447631836, "global_step": 455350, "epoch": 2710} {"train_loss": -11.472841262817383, "global_step": 455351, "epoch": 2710} {"train_loss": -11.064081192016602, "global_step": 455352, "epoch": 2710} {"train_loss": -11.701532363891602, "global_step": 455353, "epoch": 2710} {"train_loss": -10.107802391052246, "global_step": 455354, "epoch": 2710} {"train_loss": -10.054383277893066, "global_step": 455355, "epoch": 2710} {"train_loss": -11.717755317687988, "global_step": 455356, "epoch": 2710} {"train_loss": -10.187393188476562, "global_step": 455357, "epoch": 2710} {"train_loss": -9.083740234375, "global_step": 455358, "epoch": 2710} {"train_loss": -8.750032424926758, "global_step": 455359, "epoch": 2710} {"train_loss": -9.465548515319824, "global_step": 455360, "epoch": 2710} {"train_loss": -10.265094757080078, "global_step": 455361, "epoch": 2710} {"train_loss": -10.386188507080078, "global_step": 455362, "epoch": 2710} {"train_loss": -10.159744262695312, "global_step": 455363, "epoch": 2710} {"train_loss": -10.19798755645752, "global_step": 455364, "epoch": 2710} {"train_loss": -10.315858840942383, "global_step": 455365, "epoch": 2710} {"train_loss": -11.46328067779541, "global_step": 455366, "epoch": 2710} {"train_loss": -10.754647254943848, "global_step": 455367, "epoch": 2710} {"train_loss": -11.280943870544434, "global_step": 455368, "epoch": 2710} {"train_loss": -10.902055740356445, "global_step": 455369, "epoch": 2710} {"train_loss": -10.9465913772583, "global_step": 455370, "epoch": 2710} {"train_loss": -9.98281192779541, "global_step": 455371, "epoch": 2710} {"train_loss": -11.037687301635742, "global_step": 455372, "epoch": 2710} {"train_loss": -11.618627548217773, "global_step": 455373, "epoch": 2710} {"train_loss": -10.68139934539795, "global_step": 455374, "epoch": 2710} {"train_loss": -10.62165641784668, "global_step": 455375, "epoch": 2710} {"train_loss": -11.808960914611816, "global_step": 455376, "epoch": 2710} {"train_loss": -11.079364776611328, "global_step": 455377, "epoch": 2710} {"train_loss": -12.165627479553223, "global_step": 455378, "epoch": 2710} {"train_loss": -11.101375579833984, "global_step": 455379, "epoch": 2710} {"train_loss": -11.310140609741211, "global_step": 455380, "epoch": 2710} {"train_loss": -10.976160049438477, "global_step": 455381, "epoch": 2710} {"train_loss": -11.817642211914062, "global_step": 455382, "epoch": 2710} {"train_loss": -11.653909683227539, "global_step": 455383, "epoch": 2710} {"train_loss": -12.0147123336792, "global_step": 455384, "epoch": 2710} {"train_loss": -11.657919883728027, "global_step": 455385, "epoch": 2710} {"train_loss": -12.349525451660156, "global_step": 455386, "epoch": 2710} {"train_loss": -11.796262741088867, "global_step": 455387, "epoch": 2710} {"train_loss": -12.55301284790039, "global_step": 455388, "epoch": 2710} {"train_loss": -12.135899543762207, "global_step": 455389, "epoch": 2710} {"train_loss": -12.479434967041016, "global_step": 455390, "epoch": 2710} {"train_loss": -12.194854736328125, "global_step": 455391, "epoch": 2710} {"train_loss": -12.19162654876709, "global_step": 455392, "epoch": 2710} {"train_loss": -12.29769515991211, "global_step": 455393, "epoch": 2710} {"train_loss": -12.15606689453125, "global_step": 455394, "epoch": 2710} {"train_loss": -12.257391929626465, "global_step": 455395, "epoch": 2710} {"train_loss": -12.491615295410156, "global_step": 455396, "epoch": 2710} {"train_loss": -12.364578247070312, "global_step": 455397, "epoch": 2710} {"train_loss": -12.265357971191406, "global_step": 455398, "epoch": 2710} {"train_loss": -12.53799819946289, "global_step": 455399, "epoch": 2710} {"train_loss": -12.321630477905273, "global_step": 455400, "epoch": 2710} {"train_loss": -12.462325096130371, "global_step": 455401, "epoch": 2710} {"train_loss": -12.176666259765625, "global_step": 455402, "epoch": 2710} {"train_loss": -12.426687240600586, "global_step": 455403, "epoch": 2710} {"train_loss": -12.630946159362793, "global_step": 455404, "epoch": 2710} {"train_loss": -12.279991149902344, "global_step": 455405, "epoch": 2710} {"train_loss": -12.628028869628906, "global_step": 455406, "epoch": 2710} {"train_loss": -12.534170150756836, "global_step": 455407, "epoch": 2710} {"train_loss": -12.67193603515625, "global_step": 455408, "epoch": 2710} {"train_loss": -12.607913970947266, "global_step": 455409, "epoch": 2710} {"train_loss": -12.594913482666016, "global_step": 455410, "epoch": 2710} {"train_loss": -12.691741943359375, "global_step": 455411, "epoch": 2710} {"train_loss": -12.665473937988281, "global_step": 455412, "epoch": 2710} {"train_loss": -12.579388618469238, "global_step": 455413, "epoch": 2710} {"train_loss": -12.51174259185791, "global_step": 455414, "epoch": 2710} {"train_loss": -12.629948616027832, "global_step": 455415, "epoch": 2710} {"train_loss": -12.36182689666748, "global_step": 455416, "epoch": 2710} {"train_loss": -12.916091918945312, "global_step": 455417, "epoch": 2710} {"train_loss": -12.699481964111328, "global_step": 455418, "epoch": 2710} {"train_loss": -12.707704544067383, "global_step": 455419, "epoch": 2710} {"train_loss": -12.914813995361328, "global_step": 455420, "epoch": 2710} {"train_loss": -12.581171035766602, "global_step": 455421, "epoch": 2710} {"train_loss": -12.547405242919922, "global_step": 455422, "epoch": 2710} {"train_loss": -12.286174774169922, "global_step": 455423, "epoch": 2710} {"train_loss": -12.9071626663208, "global_step": 455424, "epoch": 2710} {"train_loss": -12.568330764770508, "global_step": 455425, "epoch": 2710} {"train_loss": -12.86878776550293, "global_step": 455426, "epoch": 2710} {"train_loss": -12.732504844665527, "global_step": 455427, "epoch": 2710} {"train_loss": -13.003901481628418, "global_step": 455428, "epoch": 2710} {"train_loss": -12.745916366577148, "global_step": 455429, "epoch": 2710} {"train_loss": -13.005749702453613, "global_step": 455430, "epoch": 2710} {"train_loss": -12.871095657348633, "global_step": 455431, "epoch": 2710} {"train_loss": -12.82373332977295, "global_step": 455432, "epoch": 2710} {"train_loss": -12.66545581817627, "global_step": 455433, "epoch": 2710} {"train_loss": -12.725091934204102, "global_step": 455434, "epoch": 2710} {"train_loss": -12.654945373535156, "global_step": 455435, "epoch": 2710} {"train_loss": -12.89542293548584, "global_step": 455436, "epoch": 2710} {"train_loss": -12.333822250366211, "global_step": 455437, "epoch": 2710} {"train_loss": -12.709756851196289, "global_step": 455438, "epoch": 2710} {"train_loss": -12.746891975402832, "global_step": 455439, "epoch": 2710} {"train_loss": -12.163872718811035, "global_step": 455440, "epoch": 2710} {"train_loss": -12.772668838500977, "global_step": 455441, "epoch": 2710} {"train_loss": -12.564236640930176, "global_step": 455442, "epoch": 2710} {"train_loss": -12.140230178833008, "global_step": 455443, "epoch": 2710} {"train_loss": -12.69894027709961, "global_step": 455444, "epoch": 2710} {"train_loss": -12.73847770690918, "global_step": 455445, "epoch": 2710} {"train_loss": -12.498287200927734, "global_step": 455446, "epoch": 2710} {"train_loss": -12.10343701498849, "global_step": 455447, "epoch": 2710, "val_loss": 313877.65625, "train_action_mse_error": 1.0286880731582642} {"train_loss": -12.034229278564453, "global_step": 455448, "epoch": 2711} {"train_loss": -12.178800582885742, "global_step": 455449, "epoch": 2711} {"train_loss": -12.821195602416992, "global_step": 455450, "epoch": 2711} {"train_loss": -12.15323257446289, "global_step": 455451, "epoch": 2711} {"train_loss": -12.298957824707031, "global_step": 455452, "epoch": 2711} {"train_loss": -12.890522003173828, "global_step": 455453, "epoch": 2711} {"train_loss": -12.143402099609375, "global_step": 455454, "epoch": 2711} {"train_loss": -11.672698974609375, "global_step": 455455, "epoch": 2711} {"train_loss": -12.606802940368652, "global_step": 455456, "epoch": 2711} {"train_loss": -12.660075187683105, "global_step": 455457, "epoch": 2711} {"train_loss": -11.842851638793945, "global_step": 455458, "epoch": 2711} {"train_loss": -12.73876667022705, "global_step": 455459, "epoch": 2711} {"train_loss": -12.621673583984375, "global_step": 455460, "epoch": 2711} {"train_loss": -12.36416244506836, "global_step": 455461, "epoch": 2711} {"train_loss": -12.79439640045166, "global_step": 455462, "epoch": 2711} {"train_loss": -12.771271705627441, "global_step": 455463, "epoch": 2711} {"train_loss": -12.45224666595459, "global_step": 455464, "epoch": 2711} {"train_loss": -12.429003715515137, "global_step": 455465, "epoch": 2711} {"train_loss": -12.466755867004395, "global_step": 455466, "epoch": 2711} {"train_loss": -12.603643417358398, "global_step": 455467, "epoch": 2711} {"train_loss": -11.8284273147583, "global_step": 455468, "epoch": 2711} {"train_loss": -12.274126052856445, "global_step": 455469, "epoch": 2711} {"train_loss": -12.335944175720215, "global_step": 455470, "epoch": 2711} {"train_loss": -12.192323684692383, "global_step": 455471, "epoch": 2711} {"train_loss": -12.316539764404297, "global_step": 455472, "epoch": 2711} {"train_loss": -12.295857429504395, "global_step": 455473, "epoch": 2711} {"train_loss": -11.433294296264648, "global_step": 455474, "epoch": 2711} {"train_loss": -12.663390159606934, "global_step": 455475, "epoch": 2711} {"train_loss": -11.792411804199219, "global_step": 455476, "epoch": 2711} {"train_loss": -11.61862564086914, "global_step": 455477, "epoch": 2711} {"train_loss": -12.67214298248291, "global_step": 455478, "epoch": 2711} {"train_loss": -11.972118377685547, "global_step": 455479, "epoch": 2711} {"train_loss": -11.508955001831055, "global_step": 455480, "epoch": 2711} {"train_loss": -12.503972053527832, "global_step": 455481, "epoch": 2711} {"train_loss": -12.31151008605957, "global_step": 455482, "epoch": 2711} {"train_loss": -11.924964904785156, "global_step": 455483, "epoch": 2711} {"train_loss": -12.016855239868164, "global_step": 455484, "epoch": 2711} {"train_loss": -10.512873649597168, "global_step": 455485, "epoch": 2711} {"train_loss": -11.479514122009277, "global_step": 455486, "epoch": 2711} {"train_loss": -8.971616744995117, "global_step": 455487, "epoch": 2711} {"train_loss": -7.797761917114258, "global_step": 455488, "epoch": 2711} {"train_loss": -8.21673583984375, "global_step": 455489, "epoch": 2711} {"train_loss": -8.564697265625, "global_step": 455490, "epoch": 2711} {"train_loss": -8.868413925170898, "global_step": 455491, "epoch": 2711} {"train_loss": -10.437926292419434, "global_step": 455492, "epoch": 2711} {"train_loss": -9.921698570251465, "global_step": 455493, "epoch": 2711} {"train_loss": -11.094049453735352, "global_step": 455494, "epoch": 2711} {"train_loss": -10.00969123840332, "global_step": 455495, "epoch": 2711} {"train_loss": -11.50613021850586, "global_step": 455496, "epoch": 2711} {"train_loss": -11.558966636657715, "global_step": 455497, "epoch": 2711} {"train_loss": -11.46261978149414, "global_step": 455498, "epoch": 2711} {"train_loss": -11.332462310791016, "global_step": 455499, "epoch": 2711} {"train_loss": -11.368600845336914, "global_step": 455500, "epoch": 2711} {"train_loss": -11.30667495727539, "global_step": 455501, "epoch": 2711} {"train_loss": -12.026369094848633, "global_step": 455502, "epoch": 2711} {"train_loss": -12.096846580505371, "global_step": 455503, "epoch": 2711} {"train_loss": -12.174328804016113, "global_step": 455504, "epoch": 2711} {"train_loss": -12.020204544067383, "global_step": 455505, "epoch": 2711} {"train_loss": -11.605815887451172, "global_step": 455506, "epoch": 2711} {"train_loss": -11.650160789489746, "global_step": 455507, "epoch": 2711} {"train_loss": -12.14177131652832, "global_step": 455508, "epoch": 2711} {"train_loss": -11.849668502807617, "global_step": 455509, "epoch": 2711} {"train_loss": -11.760841369628906, "global_step": 455510, "epoch": 2711} {"train_loss": -11.96150016784668, "global_step": 455511, "epoch": 2711} {"train_loss": -11.98532772064209, "global_step": 455512, "epoch": 2711} {"train_loss": -12.250221252441406, "global_step": 455513, "epoch": 2711} {"train_loss": -12.225957870483398, "global_step": 455514, "epoch": 2711} {"train_loss": -12.56522274017334, "global_step": 455515, "epoch": 2711} {"train_loss": -12.145278930664062, "global_step": 455516, "epoch": 2711} {"train_loss": -12.119049072265625, "global_step": 455517, "epoch": 2711} {"train_loss": -12.34489631652832, "global_step": 455518, "epoch": 2711} {"train_loss": -11.990791320800781, "global_step": 455519, "epoch": 2711} {"train_loss": -12.3065824508667, "global_step": 455520, "epoch": 2711} {"train_loss": -12.543746948242188, "global_step": 455521, "epoch": 2711} {"train_loss": -12.513477325439453, "global_step": 455522, "epoch": 2711} {"train_loss": -12.63132095336914, "global_step": 455523, "epoch": 2711} {"train_loss": -12.234777450561523, "global_step": 455524, "epoch": 2711} {"train_loss": -12.601223945617676, "global_step": 455525, "epoch": 2711} {"train_loss": -12.23031997680664, "global_step": 455526, "epoch": 2711} {"train_loss": -12.063762664794922, "global_step": 455527, "epoch": 2711} {"train_loss": -12.523340225219727, "global_step": 455528, "epoch": 2711} {"train_loss": -12.493751525878906, "global_step": 455529, "epoch": 2711} {"train_loss": -12.578018188476562, "global_step": 455530, "epoch": 2711} {"train_loss": -12.454440116882324, "global_step": 455531, "epoch": 2711} {"train_loss": -12.58975887298584, "global_step": 455532, "epoch": 2711} {"train_loss": -12.296092987060547, "global_step": 455533, "epoch": 2711} {"train_loss": -12.572999954223633, "global_step": 455534, "epoch": 2711} {"train_loss": -12.521856307983398, "global_step": 455535, "epoch": 2711} {"train_loss": -12.343486785888672, "global_step": 455536, "epoch": 2711} {"train_loss": -12.589506149291992, "global_step": 455537, "epoch": 2711} {"train_loss": -11.968706130981445, "global_step": 455538, "epoch": 2711} {"train_loss": -12.651132583618164, "global_step": 455539, "epoch": 2711} {"train_loss": -12.430110931396484, "global_step": 455540, "epoch": 2711} {"train_loss": -12.371285438537598, "global_step": 455541, "epoch": 2711} {"train_loss": -12.646021842956543, "global_step": 455542, "epoch": 2711} {"train_loss": -12.421791076660156, "global_step": 455543, "epoch": 2711} {"train_loss": -12.567483901977539, "global_step": 455544, "epoch": 2711} {"train_loss": -12.618297576904297, "global_step": 455545, "epoch": 2711} {"train_loss": -12.606266975402832, "global_step": 455546, "epoch": 2711} {"train_loss": -12.394659996032715, "global_step": 455547, "epoch": 2711} {"train_loss": -12.607765197753906, "global_step": 455548, "epoch": 2711} {"train_loss": -12.927488327026367, "global_step": 455549, "epoch": 2711} {"train_loss": -12.74134635925293, "global_step": 455550, "epoch": 2711} {"train_loss": -12.766922950744629, "global_step": 455551, "epoch": 2711} {"train_loss": -12.932616233825684, "global_step": 455552, "epoch": 2711} {"train_loss": -12.662734985351562, "global_step": 455553, "epoch": 2711} {"train_loss": -12.68808364868164, "global_step": 455554, "epoch": 2711} {"train_loss": -12.750516891479492, "global_step": 455555, "epoch": 2711} {"train_loss": -12.68098258972168, "global_step": 455556, "epoch": 2711} {"train_loss": -12.698905944824219, "global_step": 455557, "epoch": 2711} {"train_loss": -12.62691879272461, "global_step": 455558, "epoch": 2711} {"train_loss": -12.63325309753418, "global_step": 455559, "epoch": 2711} {"train_loss": -12.86118221282959, "global_step": 455560, "epoch": 2711} {"train_loss": -12.617751121520996, "global_step": 455561, "epoch": 2711} {"train_loss": -12.705940246582031, "global_step": 455562, "epoch": 2711} {"train_loss": -12.642135620117188, "global_step": 455563, "epoch": 2711} {"train_loss": -12.828861236572266, "global_step": 455564, "epoch": 2711} {"train_loss": -12.456256866455078, "global_step": 455565, "epoch": 2711} {"train_loss": -12.973411560058594, "global_step": 455566, "epoch": 2711} {"train_loss": -12.919538497924805, "global_step": 455567, "epoch": 2711} {"train_loss": -12.80966854095459, "global_step": 455568, "epoch": 2711} {"train_loss": -12.667186737060547, "global_step": 455569, "epoch": 2711} {"train_loss": -12.917579650878906, "global_step": 455570, "epoch": 2711} {"train_loss": -12.6825590133667, "global_step": 455571, "epoch": 2711} {"train_loss": -12.746015548706055, "global_step": 455572, "epoch": 2711} {"train_loss": -12.372608184814453, "global_step": 455573, "epoch": 2711} {"train_loss": -12.54776668548584, "global_step": 455574, "epoch": 2711} {"train_loss": -12.806385040283203, "global_step": 455575, "epoch": 2711} {"train_loss": -12.513639450073242, "global_step": 455576, "epoch": 2711} {"train_loss": -12.81959342956543, "global_step": 455577, "epoch": 2711} {"train_loss": -12.583800315856934, "global_step": 455578, "epoch": 2711} {"train_loss": -12.36522102355957, "global_step": 455579, "epoch": 2711} {"train_loss": -12.45357894897461, "global_step": 455580, "epoch": 2711} {"train_loss": -12.791641235351562, "global_step": 455581, "epoch": 2711} {"train_loss": -12.211665153503418, "global_step": 455582, "epoch": 2711} {"train_loss": -12.059167861938477, "global_step": 455583, "epoch": 2711} {"train_loss": -12.415881156921387, "global_step": 455584, "epoch": 2711} {"train_loss": -12.693147659301758, "global_step": 455585, "epoch": 2711} {"train_loss": -12.888063430786133, "global_step": 455586, "epoch": 2711} {"train_loss": -12.5030517578125, "global_step": 455587, "epoch": 2711} {"train_loss": -12.687721252441406, "global_step": 455588, "epoch": 2711} {"train_loss": -12.510029792785645, "global_step": 455589, "epoch": 2711} {"train_loss": -12.89258098602295, "global_step": 455590, "epoch": 2711} {"train_loss": -12.378076553344727, "global_step": 455591, "epoch": 2711} {"train_loss": -12.103750228881836, "global_step": 455592, "epoch": 2711} {"train_loss": -11.924368858337402, "global_step": 455593, "epoch": 2711} {"train_loss": -12.008959770202637, "global_step": 455594, "epoch": 2711} {"train_loss": -12.813567161560059, "global_step": 455595, "epoch": 2711} {"train_loss": -12.396720886230469, "global_step": 455596, "epoch": 2711} {"train_loss": -11.617246627807617, "global_step": 455597, "epoch": 2711} {"train_loss": -11.706470489501953, "global_step": 455598, "epoch": 2711} {"train_loss": -12.092981338500977, "global_step": 455599, "epoch": 2711} {"train_loss": -11.67219352722168, "global_step": 455600, "epoch": 2711} {"train_loss": -12.503547668457031, "global_step": 455601, "epoch": 2711} {"train_loss": -12.796747207641602, "global_step": 455602, "epoch": 2711} {"train_loss": -12.301069259643555, "global_step": 455603, "epoch": 2711} {"train_loss": -12.370016098022461, "global_step": 455604, "epoch": 2711} {"train_loss": -12.61978530883789, "global_step": 455605, "epoch": 2711} {"train_loss": -12.775282859802246, "global_step": 455606, "epoch": 2711} {"train_loss": -11.151039123535156, "global_step": 455607, "epoch": 2711} {"train_loss": -11.05797290802002, "global_step": 455608, "epoch": 2711} {"train_loss": -11.320128440856934, "global_step": 455609, "epoch": 2711} {"train_loss": -12.763875007629395, "global_step": 455610, "epoch": 2711} {"train_loss": -11.894868850708008, "global_step": 455611, "epoch": 2711} {"train_loss": -12.71955394744873, "global_step": 455612, "epoch": 2711} {"train_loss": -12.069896697998047, "global_step": 455613, "epoch": 2711} {"train_loss": -12.435100555419922, "global_step": 455614, "epoch": 2711} {"train_loss": -12.1607890242622, "global_step": 455615, "epoch": 2711, "val_loss": 309611.3125} {"train_loss": -12.630888938903809, "global_step": 455616, "epoch": 2712} {"train_loss": -12.212084770202637, "global_step": 455617, "epoch": 2712} {"train_loss": -12.390357971191406, "global_step": 455618, "epoch": 2712} {"train_loss": -12.006511688232422, "global_step": 455619, "epoch": 2712} {"train_loss": -12.403936386108398, "global_step": 455620, "epoch": 2712} {"train_loss": -12.429594993591309, "global_step": 455621, "epoch": 2712} {"train_loss": -12.591330528259277, "global_step": 455622, "epoch": 2712} {"train_loss": -12.486079216003418, "global_step": 455623, "epoch": 2712} {"train_loss": -12.569812774658203, "global_step": 455624, "epoch": 2712} {"train_loss": -12.495450973510742, "global_step": 455625, "epoch": 2712} {"train_loss": -12.460537910461426, "global_step": 455626, "epoch": 2712} {"train_loss": -12.503395080566406, "global_step": 455627, "epoch": 2712} {"train_loss": -12.115249633789062, "global_step": 455628, "epoch": 2712} {"train_loss": -12.59843635559082, "global_step": 455629, "epoch": 2712} {"train_loss": -12.798799514770508, "global_step": 455630, "epoch": 2712} {"train_loss": -12.4948091506958, "global_step": 455631, "epoch": 2712} {"train_loss": -12.68410587310791, "global_step": 455632, "epoch": 2712} {"train_loss": -12.645162582397461, "global_step": 455633, "epoch": 2712} {"train_loss": -12.662137985229492, "global_step": 455634, "epoch": 2712} {"train_loss": -12.242435455322266, "global_step": 455635, "epoch": 2712} {"train_loss": -12.434871673583984, "global_step": 455636, "epoch": 2712} {"train_loss": -12.64162540435791, "global_step": 455637, "epoch": 2712} {"train_loss": -12.053041458129883, "global_step": 455638, "epoch": 2712} {"train_loss": -12.01211166381836, "global_step": 455639, "epoch": 2712} {"train_loss": -12.407148361206055, "global_step": 455640, "epoch": 2712} {"train_loss": -12.15395736694336, "global_step": 455641, "epoch": 2712} {"train_loss": -10.649299621582031, "global_step": 455642, "epoch": 2712} {"train_loss": -11.615152359008789, "global_step": 455643, "epoch": 2712} {"train_loss": -11.80021858215332, "global_step": 455644, "epoch": 2712} {"train_loss": -11.81887435913086, "global_step": 455645, "epoch": 2712} {"train_loss": -11.010092735290527, "global_step": 455646, "epoch": 2712} {"train_loss": -11.795944213867188, "global_step": 455647, "epoch": 2712} {"train_loss": -11.151517868041992, "global_step": 455648, "epoch": 2712} {"train_loss": -12.117786407470703, "global_step": 455649, "epoch": 2712} {"train_loss": -11.661996841430664, "global_step": 455650, "epoch": 2712} {"train_loss": -12.289590835571289, "global_step": 455651, "epoch": 2712} {"train_loss": -12.155548095703125, "global_step": 455652, "epoch": 2712} {"train_loss": -12.205862045288086, "global_step": 455653, "epoch": 2712} {"train_loss": -11.600146293640137, "global_step": 455654, "epoch": 2712} {"train_loss": -12.290251731872559, "global_step": 455655, "epoch": 2712} {"train_loss": -11.545846939086914, "global_step": 455656, "epoch": 2712} {"train_loss": -12.122869491577148, "global_step": 455657, "epoch": 2712} {"train_loss": -11.39805793762207, "global_step": 455658, "epoch": 2712} {"train_loss": -11.803506851196289, "global_step": 455659, "epoch": 2712} {"train_loss": -11.654176712036133, "global_step": 455660, "epoch": 2712} {"train_loss": -12.009215354919434, "global_step": 455661, "epoch": 2712} {"train_loss": -12.517147064208984, "global_step": 455662, "epoch": 2712} {"train_loss": -12.041688919067383, "global_step": 455663, "epoch": 2712} {"train_loss": -12.486250877380371, "global_step": 455664, "epoch": 2712} {"train_loss": -12.073360443115234, "global_step": 455665, "epoch": 2712} {"train_loss": -12.170965194702148, "global_step": 455666, "epoch": 2712} {"train_loss": -11.511346817016602, "global_step": 455667, "epoch": 2712} {"train_loss": -12.047687530517578, "global_step": 455668, "epoch": 2712} {"train_loss": -12.31756591796875, "global_step": 455669, "epoch": 2712} {"train_loss": -12.082796096801758, "global_step": 455670, "epoch": 2712} {"train_loss": -12.022788047790527, "global_step": 455671, "epoch": 2712} {"train_loss": -11.819087028503418, "global_step": 455672, "epoch": 2712} {"train_loss": -12.403995513916016, "global_step": 455673, "epoch": 2712} {"train_loss": -11.889774322509766, "global_step": 455674, "epoch": 2712} {"train_loss": -12.46543025970459, "global_step": 455675, "epoch": 2712} {"train_loss": -12.224405288696289, "global_step": 455676, "epoch": 2712} {"train_loss": -12.388823509216309, "global_step": 455677, "epoch": 2712} {"train_loss": -12.127398490905762, "global_step": 455678, "epoch": 2712} {"train_loss": -12.076925277709961, "global_step": 455679, "epoch": 2712} {"train_loss": -12.402019500732422, "global_step": 455680, "epoch": 2712} {"train_loss": -12.255108833312988, "global_step": 455681, "epoch": 2712} {"train_loss": -12.372023582458496, "global_step": 455682, "epoch": 2712} {"train_loss": -12.183151245117188, "global_step": 455683, "epoch": 2712} {"train_loss": -12.347545623779297, "global_step": 455684, "epoch": 2712} {"train_loss": -12.51357364654541, "global_step": 455685, "epoch": 2712} {"train_loss": -11.432714462280273, "global_step": 455686, "epoch": 2712} {"train_loss": -12.025005340576172, "global_step": 455687, "epoch": 2712} {"train_loss": -12.273855209350586, "global_step": 455688, "epoch": 2712} {"train_loss": -11.588178634643555, "global_step": 455689, "epoch": 2712} {"train_loss": -11.860441207885742, "global_step": 455690, "epoch": 2712} {"train_loss": -12.334861755371094, "global_step": 455691, "epoch": 2712} {"train_loss": -11.845504760742188, "global_step": 455692, "epoch": 2712} {"train_loss": -12.023752212524414, "global_step": 455693, "epoch": 2712} {"train_loss": -11.609720230102539, "global_step": 455694, "epoch": 2712} {"train_loss": -12.478200912475586, "global_step": 455695, "epoch": 2712} {"train_loss": -12.174434661865234, "global_step": 455696, "epoch": 2712} {"train_loss": -12.22651195526123, "global_step": 455697, "epoch": 2712} {"train_loss": -12.64100456237793, "global_step": 455698, "epoch": 2712} {"train_loss": -12.084273338317871, "global_step": 455699, "epoch": 2712} {"train_loss": -12.096525192260742, "global_step": 455700, "epoch": 2712} {"train_loss": -12.247015953063965, "global_step": 455701, "epoch": 2712} {"train_loss": -12.000816345214844, "global_step": 455702, "epoch": 2712} {"train_loss": -12.473426818847656, "global_step": 455703, "epoch": 2712} {"train_loss": -12.102415084838867, "global_step": 455704, "epoch": 2712} {"train_loss": -12.432735443115234, "global_step": 455705, "epoch": 2712} {"train_loss": -12.361766815185547, "global_step": 455706, "epoch": 2712} {"train_loss": -12.161297798156738, "global_step": 455707, "epoch": 2712} {"train_loss": -12.3168306350708, "global_step": 455708, "epoch": 2712} {"train_loss": -12.569446563720703, "global_step": 455709, "epoch": 2712} {"train_loss": -12.058913230895996, "global_step": 455710, "epoch": 2712} {"train_loss": -12.428606033325195, "global_step": 455711, "epoch": 2712} {"train_loss": -12.559602737426758, "global_step": 455712, "epoch": 2712} {"train_loss": -12.210775375366211, "global_step": 455713, "epoch": 2712} {"train_loss": -12.72914981842041, "global_step": 455714, "epoch": 2712} {"train_loss": -12.446746826171875, "global_step": 455715, "epoch": 2712} {"train_loss": -12.70901870727539, "global_step": 455716, "epoch": 2712} {"train_loss": -12.42414379119873, "global_step": 455717, "epoch": 2712} {"train_loss": -12.252471923828125, "global_step": 455718, "epoch": 2712} {"train_loss": -12.637249946594238, "global_step": 455719, "epoch": 2712} {"train_loss": -12.42680549621582, "global_step": 455720, "epoch": 2712} {"train_loss": -12.548526763916016, "global_step": 455721, "epoch": 2712} {"train_loss": -12.697657585144043, "global_step": 455722, "epoch": 2712} {"train_loss": -12.381805419921875, "global_step": 455723, "epoch": 2712} {"train_loss": -12.436531066894531, "global_step": 455724, "epoch": 2712} {"train_loss": -12.273212432861328, "global_step": 455725, "epoch": 2712} {"train_loss": -12.791092872619629, "global_step": 455726, "epoch": 2712} {"train_loss": -12.414739608764648, "global_step": 455727, "epoch": 2712} {"train_loss": -12.566346168518066, "global_step": 455728, "epoch": 2712} {"train_loss": -12.342883110046387, "global_step": 455729, "epoch": 2712} {"train_loss": -12.475776672363281, "global_step": 455730, "epoch": 2712} {"train_loss": -12.643022537231445, "global_step": 455731, "epoch": 2712} {"train_loss": -12.012344360351562, "global_step": 455732, "epoch": 2712} {"train_loss": -11.948297500610352, "global_step": 455733, "epoch": 2712} {"train_loss": -12.229090690612793, "global_step": 455734, "epoch": 2712} {"train_loss": -12.224798202514648, "global_step": 455735, "epoch": 2712} {"train_loss": -12.092031478881836, "global_step": 455736, "epoch": 2712} {"train_loss": -12.193581581115723, "global_step": 455737, "epoch": 2712} {"train_loss": -11.88332462310791, "global_step": 455738, "epoch": 2712} {"train_loss": -11.954277038574219, "global_step": 455739, "epoch": 2712} {"train_loss": -11.942514419555664, "global_step": 455740, "epoch": 2712} {"train_loss": -12.140786170959473, "global_step": 455741, "epoch": 2712} {"train_loss": -12.38133430480957, "global_step": 455742, "epoch": 2712} {"train_loss": -12.266067504882812, "global_step": 455743, "epoch": 2712} {"train_loss": -12.142963409423828, "global_step": 455744, "epoch": 2712} {"train_loss": -12.225666046142578, "global_step": 455745, "epoch": 2712} {"train_loss": -12.245594024658203, "global_step": 455746, "epoch": 2712} {"train_loss": -12.730327606201172, "global_step": 455747, "epoch": 2712} {"train_loss": -11.856739044189453, "global_step": 455748, "epoch": 2712} {"train_loss": -12.799997329711914, "global_step": 455749, "epoch": 2712} {"train_loss": -12.20570182800293, "global_step": 455750, "epoch": 2712} {"train_loss": -12.64065170288086, "global_step": 455751, "epoch": 2712} {"train_loss": -12.259279251098633, "global_step": 455752, "epoch": 2712} {"train_loss": -12.252235412597656, "global_step": 455753, "epoch": 2712} {"train_loss": -12.35245418548584, "global_step": 455754, "epoch": 2712} {"train_loss": -12.436861038208008, "global_step": 455755, "epoch": 2712} {"train_loss": -12.41651439666748, "global_step": 455756, "epoch": 2712} {"train_loss": -12.07658576965332, "global_step": 455757, "epoch": 2712} {"train_loss": -12.64459228515625, "global_step": 455758, "epoch": 2712} {"train_loss": -11.573357582092285, "global_step": 455759, "epoch": 2712} {"train_loss": -12.44703197479248, "global_step": 455760, "epoch": 2712} {"train_loss": -11.987751007080078, "global_step": 455761, "epoch": 2712} {"train_loss": -12.50378704071045, "global_step": 455762, "epoch": 2712} {"train_loss": -12.007660865783691, "global_step": 455763, "epoch": 2712} {"train_loss": -11.989622116088867, "global_step": 455764, "epoch": 2712} {"train_loss": -12.40068244934082, "global_step": 455765, "epoch": 2712} {"train_loss": -12.176706314086914, "global_step": 455766, "epoch": 2712} {"train_loss": -12.595036506652832, "global_step": 455767, "epoch": 2712} {"train_loss": -12.497580528259277, "global_step": 455768, "epoch": 2712} {"train_loss": -12.29826545715332, "global_step": 455769, "epoch": 2712} {"train_loss": -12.096120834350586, "global_step": 455770, "epoch": 2712} {"train_loss": -12.112150192260742, "global_step": 455771, "epoch": 2712} {"train_loss": -12.20782470703125, "global_step": 455772, "epoch": 2712} {"train_loss": -12.574395179748535, "global_step": 455773, "epoch": 2712} {"train_loss": -12.477659225463867, "global_step": 455774, "epoch": 2712} {"train_loss": -12.614140510559082, "global_step": 455775, "epoch": 2712} {"train_loss": -12.433897972106934, "global_step": 455776, "epoch": 2712} {"train_loss": -12.74592399597168, "global_step": 455777, "epoch": 2712} {"train_loss": -11.81634521484375, "global_step": 455778, "epoch": 2712} {"train_loss": -12.5296630859375, "global_step": 455779, "epoch": 2712} {"train_loss": -12.629361152648926, "global_step": 455780, "epoch": 2712} {"train_loss": -12.216165542602539, "global_step": 455781, "epoch": 2712} {"train_loss": -12.66274356842041, "global_step": 455782, "epoch": 2712} {"train_loss": -12.23202375570933, "global_step": 455783, "epoch": 2712, "val_loss": 309582.0625} {"train_loss": -12.010421752929688, "global_step": 455784, "epoch": 2713} {"train_loss": -12.14286994934082, "global_step": 455785, "epoch": 2713} {"train_loss": -12.721830368041992, "global_step": 455786, "epoch": 2713} {"train_loss": -12.101658821105957, "global_step": 455787, "epoch": 2713} {"train_loss": -12.177157402038574, "global_step": 455788, "epoch": 2713} {"train_loss": -11.422523498535156, "global_step": 455789, "epoch": 2713} {"train_loss": -12.085760116577148, "global_step": 455790, "epoch": 2713} {"train_loss": -12.313243865966797, "global_step": 455791, "epoch": 2713} {"train_loss": -12.485998153686523, "global_step": 455792, "epoch": 2713} {"train_loss": -12.086568832397461, "global_step": 455793, "epoch": 2713} {"train_loss": -12.666872024536133, "global_step": 455794, "epoch": 2713} {"train_loss": -12.273030281066895, "global_step": 455795, "epoch": 2713} {"train_loss": -12.368833541870117, "global_step": 455796, "epoch": 2713} {"train_loss": -12.517818450927734, "global_step": 455797, "epoch": 2713} {"train_loss": -12.829310417175293, "global_step": 455798, "epoch": 2713} {"train_loss": -12.641716957092285, "global_step": 455799, "epoch": 2713} {"train_loss": -12.122713088989258, "global_step": 455800, "epoch": 2713} {"train_loss": -12.390655517578125, "global_step": 455801, "epoch": 2713} {"train_loss": -11.852737426757812, "global_step": 455802, "epoch": 2713} {"train_loss": -12.420841217041016, "global_step": 455803, "epoch": 2713} {"train_loss": -12.20462417602539, "global_step": 455804, "epoch": 2713} {"train_loss": -11.651973724365234, "global_step": 455805, "epoch": 2713} {"train_loss": -12.145668029785156, "global_step": 455806, "epoch": 2713} {"train_loss": -12.68290901184082, "global_step": 455807, "epoch": 2713} {"train_loss": -12.370735168457031, "global_step": 455808, "epoch": 2713} {"train_loss": -12.378215789794922, "global_step": 455809, "epoch": 2713} {"train_loss": -12.319356918334961, "global_step": 455810, "epoch": 2713} {"train_loss": -12.552942276000977, "global_step": 455811, "epoch": 2713} {"train_loss": -12.659870147705078, "global_step": 455812, "epoch": 2713} {"train_loss": -12.42165470123291, "global_step": 455813, "epoch": 2713} {"train_loss": -12.59729290008545, "global_step": 455814, "epoch": 2713} {"train_loss": -12.2864990234375, "global_step": 455815, "epoch": 2713} {"train_loss": -12.373895645141602, "global_step": 455816, "epoch": 2713} {"train_loss": -12.28544807434082, "global_step": 455817, "epoch": 2713} {"train_loss": -12.101268768310547, "global_step": 455818, "epoch": 2713} {"train_loss": -12.524739265441895, "global_step": 455819, "epoch": 2713} {"train_loss": -11.670320510864258, "global_step": 455820, "epoch": 2713} {"train_loss": -12.433384895324707, "global_step": 455821, "epoch": 2713} {"train_loss": -12.41275405883789, "global_step": 455822, "epoch": 2713} {"train_loss": -12.604145050048828, "global_step": 455823, "epoch": 2713} {"train_loss": -12.377961158752441, "global_step": 455824, "epoch": 2713} {"train_loss": -12.41114330291748, "global_step": 455825, "epoch": 2713} {"train_loss": -12.70934772491455, "global_step": 455826, "epoch": 2713} {"train_loss": -12.447586059570312, "global_step": 455827, "epoch": 2713} {"train_loss": -12.15831184387207, "global_step": 455828, "epoch": 2713} {"train_loss": -12.23753547668457, "global_step": 455829, "epoch": 2713} {"train_loss": -12.094378471374512, "global_step": 455830, "epoch": 2713} {"train_loss": -12.20502758026123, "global_step": 455831, "epoch": 2713} {"train_loss": -12.330721855163574, "global_step": 455832, "epoch": 2713} {"train_loss": -12.454904556274414, "global_step": 455833, "epoch": 2713} {"train_loss": -11.847186088562012, "global_step": 455834, "epoch": 2713} {"train_loss": -11.870292663574219, "global_step": 455835, "epoch": 2713} {"train_loss": -12.780240058898926, "global_step": 455836, "epoch": 2713} {"train_loss": -12.023948669433594, "global_step": 455837, "epoch": 2713} {"train_loss": -12.405500411987305, "global_step": 455838, "epoch": 2713} {"train_loss": -12.63198471069336, "global_step": 455839, "epoch": 2713} {"train_loss": -12.408101081848145, "global_step": 455840, "epoch": 2713} {"train_loss": -12.234739303588867, "global_step": 455841, "epoch": 2713} {"train_loss": -12.503573417663574, "global_step": 455842, "epoch": 2713} {"train_loss": -11.93875503540039, "global_step": 455843, "epoch": 2713} {"train_loss": -11.922966003417969, "global_step": 455844, "epoch": 2713} {"train_loss": -12.60835075378418, "global_step": 455845, "epoch": 2713} {"train_loss": -11.785036087036133, "global_step": 455846, "epoch": 2713} {"train_loss": -11.971260070800781, "global_step": 455847, "epoch": 2713} {"train_loss": -12.122331619262695, "global_step": 455848, "epoch": 2713} {"train_loss": -12.403131484985352, "global_step": 455849, "epoch": 2713} {"train_loss": -12.200115203857422, "global_step": 455850, "epoch": 2713} {"train_loss": -12.151101112365723, "global_step": 455851, "epoch": 2713} {"train_loss": -12.379343032836914, "global_step": 455852, "epoch": 2713} {"train_loss": -12.083887100219727, "global_step": 455853, "epoch": 2713} {"train_loss": -12.17093276977539, "global_step": 455854, "epoch": 2713} {"train_loss": -12.639262199401855, "global_step": 455855, "epoch": 2713} {"train_loss": -11.95205307006836, "global_step": 455856, "epoch": 2713} {"train_loss": -12.118937492370605, "global_step": 455857, "epoch": 2713} {"train_loss": -12.08479118347168, "global_step": 455858, "epoch": 2713} {"train_loss": -12.778619766235352, "global_step": 455859, "epoch": 2713} {"train_loss": -12.387849807739258, "global_step": 455860, "epoch": 2713} {"train_loss": -12.823305130004883, "global_step": 455861, "epoch": 2713} {"train_loss": -12.37998104095459, "global_step": 455862, "epoch": 2713} {"train_loss": -12.543996810913086, "global_step": 455863, "epoch": 2713} {"train_loss": -12.194201469421387, "global_step": 455864, "epoch": 2713} {"train_loss": -12.301473617553711, "global_step": 455865, "epoch": 2713} {"train_loss": -12.461894989013672, "global_step": 455866, "epoch": 2713} {"train_loss": -12.510660171508789, "global_step": 455867, "epoch": 2713} {"train_loss": -11.999664306640625, "global_step": 455868, "epoch": 2713} {"train_loss": -12.531926155090332, "global_step": 455869, "epoch": 2713} {"train_loss": -11.038661003112793, "global_step": 455870, "epoch": 2713} {"train_loss": -11.273260116577148, "global_step": 455871, "epoch": 2713} {"train_loss": -12.47605037689209, "global_step": 455872, "epoch": 2713} {"train_loss": -11.17335319519043, "global_step": 455873, "epoch": 2713} {"train_loss": -11.629032135009766, "global_step": 455874, "epoch": 2713} {"train_loss": -12.474233627319336, "global_step": 455875, "epoch": 2713} {"train_loss": -11.589958190917969, "global_step": 455876, "epoch": 2713} {"train_loss": -12.614229202270508, "global_step": 455877, "epoch": 2713} {"train_loss": -11.790811538696289, "global_step": 455878, "epoch": 2713} {"train_loss": -12.278976440429688, "global_step": 455879, "epoch": 2713} {"train_loss": -12.151933670043945, "global_step": 455880, "epoch": 2713} {"train_loss": -12.229532241821289, "global_step": 455881, "epoch": 2713} {"train_loss": -11.775520324707031, "global_step": 455882, "epoch": 2713} {"train_loss": -12.522883415222168, "global_step": 455883, "epoch": 2713} {"train_loss": -11.975322723388672, "global_step": 455884, "epoch": 2713} {"train_loss": -12.786855697631836, "global_step": 455885, "epoch": 2713} {"train_loss": -12.060161590576172, "global_step": 455886, "epoch": 2713} {"train_loss": -11.94239616394043, "global_step": 455887, "epoch": 2713} {"train_loss": -12.531591415405273, "global_step": 455888, "epoch": 2713} {"train_loss": -12.24290657043457, "global_step": 455889, "epoch": 2713} {"train_loss": -12.314620971679688, "global_step": 455890, "epoch": 2713} {"train_loss": -12.227958679199219, "global_step": 455891, "epoch": 2713} {"train_loss": -12.541038513183594, "global_step": 455892, "epoch": 2713} {"train_loss": -12.559301376342773, "global_step": 455893, "epoch": 2713} {"train_loss": -11.935664176940918, "global_step": 455894, "epoch": 2713} {"train_loss": -11.881998062133789, "global_step": 455895, "epoch": 2713} {"train_loss": -11.780230522155762, "global_step": 455896, "epoch": 2713} {"train_loss": -12.52003288269043, "global_step": 455897, "epoch": 2713} {"train_loss": -11.525384902954102, "global_step": 455898, "epoch": 2713} {"train_loss": -12.530216217041016, "global_step": 455899, "epoch": 2713} {"train_loss": -11.981701850891113, "global_step": 455900, "epoch": 2713} {"train_loss": -12.122045516967773, "global_step": 455901, "epoch": 2713} {"train_loss": -12.372607231140137, "global_step": 455902, "epoch": 2713} {"train_loss": -11.80526351928711, "global_step": 455903, "epoch": 2713} {"train_loss": -11.793205261230469, "global_step": 455904, "epoch": 2713} {"train_loss": -11.7247953414917, "global_step": 455905, "epoch": 2713} {"train_loss": -11.80976390838623, "global_step": 455906, "epoch": 2713} {"train_loss": -12.246246337890625, "global_step": 455907, "epoch": 2713} {"train_loss": -11.949114799499512, "global_step": 455908, "epoch": 2713} {"train_loss": -12.282669067382812, "global_step": 455909, "epoch": 2713} {"train_loss": -11.954902648925781, "global_step": 455910, "epoch": 2713} {"train_loss": -11.902225494384766, "global_step": 455911, "epoch": 2713} {"train_loss": -12.174444198608398, "global_step": 455912, "epoch": 2713} {"train_loss": -12.073878288269043, "global_step": 455913, "epoch": 2713} {"train_loss": -11.79913330078125, "global_step": 455914, "epoch": 2713} {"train_loss": -12.144187927246094, "global_step": 455915, "epoch": 2713} {"train_loss": -12.473966598510742, "global_step": 455916, "epoch": 2713} {"train_loss": -10.840463638305664, "global_step": 455917, "epoch": 2713} {"train_loss": -12.436286926269531, "global_step": 455918, "epoch": 2713} {"train_loss": -12.123699188232422, "global_step": 455919, "epoch": 2713} {"train_loss": -12.020316123962402, "global_step": 455920, "epoch": 2713} {"train_loss": -12.517204284667969, "global_step": 455921, "epoch": 2713} {"train_loss": -11.944595336914062, "global_step": 455922, "epoch": 2713} {"train_loss": -12.26513957977295, "global_step": 455923, "epoch": 2713} {"train_loss": -12.13840103149414, "global_step": 455924, "epoch": 2713} {"train_loss": -12.649515151977539, "global_step": 455925, "epoch": 2713} {"train_loss": -12.567132949829102, "global_step": 455926, "epoch": 2713} {"train_loss": -11.788365364074707, "global_step": 455927, "epoch": 2713} {"train_loss": -12.563581466674805, "global_step": 455928, "epoch": 2713} {"train_loss": -12.704208374023438, "global_step": 455929, "epoch": 2713} {"train_loss": -12.133636474609375, "global_step": 455930, "epoch": 2713} {"train_loss": -12.743931770324707, "global_step": 455931, "epoch": 2713} {"train_loss": -12.317538261413574, "global_step": 455932, "epoch": 2713} {"train_loss": -12.25235366821289, "global_step": 455933, "epoch": 2713} {"train_loss": -12.283748626708984, "global_step": 455934, "epoch": 2713} {"train_loss": -12.09007740020752, "global_step": 455935, "epoch": 2713} {"train_loss": -12.389320373535156, "global_step": 455936, "epoch": 2713} {"train_loss": -12.404891014099121, "global_step": 455937, "epoch": 2713} {"train_loss": -11.580848693847656, "global_step": 455938, "epoch": 2713} {"train_loss": -12.202982902526855, "global_step": 455939, "epoch": 2713} {"train_loss": -11.91683292388916, "global_step": 455940, "epoch": 2713} {"train_loss": -11.640878677368164, "global_step": 455941, "epoch": 2713} {"train_loss": -12.196348190307617, "global_step": 455942, "epoch": 2713} {"train_loss": -11.592649459838867, "global_step": 455943, "epoch": 2713} {"train_loss": -12.633901596069336, "global_step": 455944, "epoch": 2713} {"train_loss": -12.059164047241211, "global_step": 455945, "epoch": 2713} {"train_loss": -12.161674499511719, "global_step": 455946, "epoch": 2713} {"train_loss": -11.83966064453125, "global_step": 455947, "epoch": 2713} {"train_loss": -12.240401268005371, "global_step": 455948, "epoch": 2713} {"train_loss": -11.892642974853516, "global_step": 455949, "epoch": 2713} {"train_loss": -12.237760543823242, "global_step": 455950, "epoch": 2713} {"train_loss": -12.205606057530357, "global_step": 455951, "epoch": 2713, "val_loss": 313151.6875} {"train_loss": -12.264238357543945, "global_step": 455952, "epoch": 2714} {"train_loss": -12.353387832641602, "global_step": 455953, "epoch": 2714} {"train_loss": -12.545921325683594, "global_step": 455954, "epoch": 2714} {"train_loss": -12.226659774780273, "global_step": 455955, "epoch": 2714} {"train_loss": -12.339942932128906, "global_step": 455956, "epoch": 2714} {"train_loss": -11.230716705322266, "global_step": 455957, "epoch": 2714} {"train_loss": -12.24992561340332, "global_step": 455958, "epoch": 2714} {"train_loss": -12.034690856933594, "global_step": 455959, "epoch": 2714} {"train_loss": -12.196237564086914, "global_step": 455960, "epoch": 2714} {"train_loss": -12.279518127441406, "global_step": 455961, "epoch": 2714} {"train_loss": -11.808786392211914, "global_step": 455962, "epoch": 2714} {"train_loss": -11.934917449951172, "global_step": 455963, "epoch": 2714} {"train_loss": -11.258607864379883, "global_step": 455964, "epoch": 2714} {"train_loss": -12.291779518127441, "global_step": 455965, "epoch": 2714} {"train_loss": -11.01099681854248, "global_step": 455966, "epoch": 2714} {"train_loss": -10.757566452026367, "global_step": 455967, "epoch": 2714} {"train_loss": -11.597469329833984, "global_step": 455968, "epoch": 2714} {"train_loss": -11.35851764678955, "global_step": 455969, "epoch": 2714} {"train_loss": -12.053801536560059, "global_step": 455970, "epoch": 2714} {"train_loss": -11.048717498779297, "global_step": 455971, "epoch": 2714} {"train_loss": -12.402307510375977, "global_step": 455972, "epoch": 2714} {"train_loss": -10.875996589660645, "global_step": 455973, "epoch": 2714} {"train_loss": -12.10198974609375, "global_step": 455974, "epoch": 2714} {"train_loss": -11.648768424987793, "global_step": 455975, "epoch": 2714} {"train_loss": -11.881032943725586, "global_step": 455976, "epoch": 2714} {"train_loss": -12.174896240234375, "global_step": 455977, "epoch": 2714} {"train_loss": -11.855215072631836, "global_step": 455978, "epoch": 2714} {"train_loss": -12.058295249938965, "global_step": 455979, "epoch": 2714} {"train_loss": -10.838970184326172, "global_step": 455980, "epoch": 2714} {"train_loss": -11.63543701171875, "global_step": 455981, "epoch": 2714} {"train_loss": -11.410664558410645, "global_step": 455982, "epoch": 2714} {"train_loss": -11.725892066955566, "global_step": 455983, "epoch": 2714} {"train_loss": -10.02243423461914, "global_step": 455984, "epoch": 2714} {"train_loss": -11.690799713134766, "global_step": 455985, "epoch": 2714} {"train_loss": -10.597249984741211, "global_step": 455986, "epoch": 2714} {"train_loss": -10.82087230682373, "global_step": 455987, "epoch": 2714} {"train_loss": -10.636993408203125, "global_step": 455988, "epoch": 2714} {"train_loss": -11.362979888916016, "global_step": 455989, "epoch": 2714} {"train_loss": -10.324153900146484, "global_step": 455990, "epoch": 2714} {"train_loss": -11.516988754272461, "global_step": 455991, "epoch": 2714} {"train_loss": -10.810144424438477, "global_step": 455992, "epoch": 2714} {"train_loss": -10.677165985107422, "global_step": 455993, "epoch": 2714} {"train_loss": -11.806991577148438, "global_step": 455994, "epoch": 2714} {"train_loss": -10.077312469482422, "global_step": 455995, "epoch": 2714} {"train_loss": -11.94627857208252, "global_step": 455996, "epoch": 2714} {"train_loss": -11.03905200958252, "global_step": 455997, "epoch": 2714} {"train_loss": -11.308324813842773, "global_step": 455998, "epoch": 2714} {"train_loss": -11.738973617553711, "global_step": 455999, "epoch": 2714} {"train_loss": -11.928060531616211, "global_step": 456000, "epoch": 2714} {"train_loss": -11.74948501586914, "global_step": 456001, "epoch": 2714} {"train_loss": -11.533949851989746, "global_step": 456002, "epoch": 2714} {"train_loss": -11.907312393188477, "global_step": 456003, "epoch": 2714} {"train_loss": -11.528735160827637, "global_step": 456004, "epoch": 2714} {"train_loss": -12.143688201904297, "global_step": 456005, "epoch": 2714} {"train_loss": -11.77166748046875, "global_step": 456006, "epoch": 2714} {"train_loss": -11.827634811401367, "global_step": 456007, "epoch": 2714} {"train_loss": -11.355642318725586, "global_step": 456008, "epoch": 2714} {"train_loss": -12.280619621276855, "global_step": 456009, "epoch": 2714} {"train_loss": -11.637056350708008, "global_step": 456010, "epoch": 2714} {"train_loss": -11.95280933380127, "global_step": 456011, "epoch": 2714} {"train_loss": -11.751903533935547, "global_step": 456012, "epoch": 2714} {"train_loss": -12.037755966186523, "global_step": 456013, "epoch": 2714} {"train_loss": -12.22348690032959, "global_step": 456014, "epoch": 2714} {"train_loss": -11.934138298034668, "global_step": 456015, "epoch": 2714} {"train_loss": -12.213552474975586, "global_step": 456016, "epoch": 2714} {"train_loss": -12.298137664794922, "global_step": 456017, "epoch": 2714} {"train_loss": -11.846251487731934, "global_step": 456018, "epoch": 2714} {"train_loss": -11.971250534057617, "global_step": 456019, "epoch": 2714} {"train_loss": -11.81457805633545, "global_step": 456020, "epoch": 2714} {"train_loss": -12.133054733276367, "global_step": 456021, "epoch": 2714} {"train_loss": -12.035360336303711, "global_step": 456022, "epoch": 2714} {"train_loss": -12.43474292755127, "global_step": 456023, "epoch": 2714} {"train_loss": -12.33454418182373, "global_step": 456024, "epoch": 2714} {"train_loss": -11.917398452758789, "global_step": 456025, "epoch": 2714} {"train_loss": -12.128751754760742, "global_step": 456026, "epoch": 2714} {"train_loss": -12.314090728759766, "global_step": 456027, "epoch": 2714} {"train_loss": -12.653177261352539, "global_step": 456028, "epoch": 2714} {"train_loss": -12.461620330810547, "global_step": 456029, "epoch": 2714} {"train_loss": -12.41482925415039, "global_step": 456030, "epoch": 2714} {"train_loss": -12.41716194152832, "global_step": 456031, "epoch": 2714} {"train_loss": -12.5440092086792, "global_step": 456032, "epoch": 2714} {"train_loss": -12.46457290649414, "global_step": 456033, "epoch": 2714} {"train_loss": -12.458881378173828, "global_step": 456034, "epoch": 2714} {"train_loss": -12.614995956420898, "global_step": 456035, "epoch": 2714} {"train_loss": -12.682747840881348, "global_step": 456036, "epoch": 2714} {"train_loss": -12.615488052368164, "global_step": 456037, "epoch": 2714} {"train_loss": -12.413543701171875, "global_step": 456038, "epoch": 2714} {"train_loss": -12.525148391723633, "global_step": 456039, "epoch": 2714} {"train_loss": -12.478495597839355, "global_step": 456040, "epoch": 2714} {"train_loss": -12.499421119689941, "global_step": 456041, "epoch": 2714} {"train_loss": -12.496795654296875, "global_step": 456042, "epoch": 2714} {"train_loss": -12.547464370727539, "global_step": 456043, "epoch": 2714} {"train_loss": -12.616888046264648, "global_step": 456044, "epoch": 2714} {"train_loss": -12.77261734008789, "global_step": 456045, "epoch": 2714} {"train_loss": -12.764413833618164, "global_step": 456046, "epoch": 2714} {"train_loss": -12.713380813598633, "global_step": 456047, "epoch": 2714} {"train_loss": -12.534741401672363, "global_step": 456048, "epoch": 2714} {"train_loss": -12.720367431640625, "global_step": 456049, "epoch": 2714} {"train_loss": -12.86951732635498, "global_step": 456050, "epoch": 2714} {"train_loss": -12.591801643371582, "global_step": 456051, "epoch": 2714} {"train_loss": -12.76740550994873, "global_step": 456052, "epoch": 2714} {"train_loss": -12.541055679321289, "global_step": 456053, "epoch": 2714} {"train_loss": -12.614530563354492, "global_step": 456054, "epoch": 2714} {"train_loss": -12.758743286132812, "global_step": 456055, "epoch": 2714} {"train_loss": -12.538578033447266, "global_step": 456056, "epoch": 2714} {"train_loss": -12.508223533630371, "global_step": 456057, "epoch": 2714} {"train_loss": -12.571029663085938, "global_step": 456058, "epoch": 2714} {"train_loss": -12.581063270568848, "global_step": 456059, "epoch": 2714} {"train_loss": -12.824807167053223, "global_step": 456060, "epoch": 2714} {"train_loss": -12.738288879394531, "global_step": 456061, "epoch": 2714} {"train_loss": -12.769218444824219, "global_step": 456062, "epoch": 2714} {"train_loss": -12.863495826721191, "global_step": 456063, "epoch": 2714} {"train_loss": -12.732221603393555, "global_step": 456064, "epoch": 2714} {"train_loss": -12.84882640838623, "global_step": 456065, "epoch": 2714} {"train_loss": -12.888289451599121, "global_step": 456066, "epoch": 2714} {"train_loss": -12.875940322875977, "global_step": 456067, "epoch": 2714} {"train_loss": -12.694644927978516, "global_step": 456068, "epoch": 2714} {"train_loss": -12.550829887390137, "global_step": 456069, "epoch": 2714} {"train_loss": -12.930463790893555, "global_step": 456070, "epoch": 2714} {"train_loss": -12.581464767456055, "global_step": 456071, "epoch": 2714} {"train_loss": -12.628448486328125, "global_step": 456072, "epoch": 2714} {"train_loss": -12.774481773376465, "global_step": 456073, "epoch": 2714} {"train_loss": -12.641539573669434, "global_step": 456074, "epoch": 2714} {"train_loss": -12.711442947387695, "global_step": 456075, "epoch": 2714} {"train_loss": -12.656702041625977, "global_step": 456076, "epoch": 2714} {"train_loss": -12.84682846069336, "global_step": 456077, "epoch": 2714} {"train_loss": -12.675910949707031, "global_step": 456078, "epoch": 2714} {"train_loss": -12.772675514221191, "global_step": 456079, "epoch": 2714} {"train_loss": -12.776914596557617, "global_step": 456080, "epoch": 2714} {"train_loss": -12.644844055175781, "global_step": 456081, "epoch": 2714} {"train_loss": -12.971592903137207, "global_step": 456082, "epoch": 2714} {"train_loss": -12.960466384887695, "global_step": 456083, "epoch": 2714} {"train_loss": -12.899520874023438, "global_step": 456084, "epoch": 2714} {"train_loss": -12.74996566772461, "global_step": 456085, "epoch": 2714} {"train_loss": -12.330419540405273, "global_step": 456086, "epoch": 2714} {"train_loss": -12.526140213012695, "global_step": 456087, "epoch": 2714} {"train_loss": -12.44349479675293, "global_step": 456088, "epoch": 2714} {"train_loss": -12.90078067779541, "global_step": 456089, "epoch": 2714} {"train_loss": -12.20730209350586, "global_step": 456090, "epoch": 2714} {"train_loss": -12.42418098449707, "global_step": 456091, "epoch": 2714} {"train_loss": -12.572433471679688, "global_step": 456092, "epoch": 2714} {"train_loss": -12.691107749938965, "global_step": 456093, "epoch": 2714} {"train_loss": -12.95119857788086, "global_step": 456094, "epoch": 2714} {"train_loss": -12.63016128540039, "global_step": 456095, "epoch": 2714} {"train_loss": -12.992035865783691, "global_step": 456096, "epoch": 2714} {"train_loss": -12.564362525939941, "global_step": 456097, "epoch": 2714} {"train_loss": -12.823423385620117, "global_step": 456098, "epoch": 2714} {"train_loss": -12.696969032287598, "global_step": 456099, "epoch": 2714} {"train_loss": -12.431215286254883, "global_step": 456100, "epoch": 2714} {"train_loss": -12.236955642700195, "global_step": 456101, "epoch": 2714} {"train_loss": -12.365714073181152, "global_step": 456102, "epoch": 2714} {"train_loss": -12.603947639465332, "global_step": 456103, "epoch": 2714} {"train_loss": -12.175243377685547, "global_step": 456104, "epoch": 2714} {"train_loss": -12.283160209655762, "global_step": 456105, "epoch": 2714} {"train_loss": -12.687068939208984, "global_step": 456106, "epoch": 2714} {"train_loss": -12.665323257446289, "global_step": 456107, "epoch": 2714} {"train_loss": -12.396303176879883, "global_step": 456108, "epoch": 2714} {"train_loss": -12.714261054992676, "global_step": 456109, "epoch": 2714} {"train_loss": -12.57740306854248, "global_step": 456110, "epoch": 2714} {"train_loss": -12.295408248901367, "global_step": 456111, "epoch": 2714} {"train_loss": -12.030298233032227, "global_step": 456112, "epoch": 2714} {"train_loss": -12.396785736083984, "global_step": 456113, "epoch": 2714} {"train_loss": -11.84129524230957, "global_step": 456114, "epoch": 2714} {"train_loss": -12.699163436889648, "global_step": 456115, "epoch": 2714} {"train_loss": -12.241326332092285, "global_step": 456116, "epoch": 2714} {"train_loss": -11.654890060424805, "global_step": 456117, "epoch": 2714} {"train_loss": -11.432671546936035, "global_step": 456118, "epoch": 2714} {"train_loss": -12.172150055567423, "global_step": 456119, "epoch": 2714, "val_loss": 312401.90625} {"train_loss": -12.621978759765625, "global_step": 456120, "epoch": 2715} {"train_loss": -11.035670280456543, "global_step": 456121, "epoch": 2715} {"train_loss": -9.915874481201172, "global_step": 456122, "epoch": 2715} {"train_loss": -12.537934303283691, "global_step": 456123, "epoch": 2715} {"train_loss": -10.809998512268066, "global_step": 456124, "epoch": 2715} {"train_loss": -11.373555183410645, "global_step": 456125, "epoch": 2715} {"train_loss": -12.484752655029297, "global_step": 456126, "epoch": 2715} {"train_loss": -11.120330810546875, "global_step": 456127, "epoch": 2715} {"train_loss": -11.405467987060547, "global_step": 456128, "epoch": 2715} {"train_loss": -12.135576248168945, "global_step": 456129, "epoch": 2715} {"train_loss": -10.877033233642578, "global_step": 456130, "epoch": 2715} {"train_loss": -10.240316390991211, "global_step": 456131, "epoch": 2715} {"train_loss": -12.495844841003418, "global_step": 456132, "epoch": 2715} {"train_loss": -9.690814971923828, "global_step": 456133, "epoch": 2715} {"train_loss": -11.6299467086792, "global_step": 456134, "epoch": 2715} {"train_loss": -11.732677459716797, "global_step": 456135, "epoch": 2715} {"train_loss": -11.25078010559082, "global_step": 456136, "epoch": 2715} {"train_loss": -11.300710678100586, "global_step": 456137, "epoch": 2715} {"train_loss": -11.914887428283691, "global_step": 456138, "epoch": 2715} {"train_loss": -11.463254928588867, "global_step": 456139, "epoch": 2715} {"train_loss": -11.766668319702148, "global_step": 456140, "epoch": 2715} {"train_loss": -12.115625381469727, "global_step": 456141, "epoch": 2715} {"train_loss": -11.889122009277344, "global_step": 456142, "epoch": 2715} {"train_loss": -11.613120079040527, "global_step": 456143, "epoch": 2715} {"train_loss": -11.487687110900879, "global_step": 456144, "epoch": 2715} {"train_loss": -12.477457046508789, "global_step": 456145, "epoch": 2715} {"train_loss": -11.748567581176758, "global_step": 456146, "epoch": 2715} {"train_loss": -12.482786178588867, "global_step": 456147, "epoch": 2715} {"train_loss": -12.136048316955566, "global_step": 456148, "epoch": 2715} {"train_loss": -12.321710586547852, "global_step": 456149, "epoch": 2715} {"train_loss": -12.024200439453125, "global_step": 456150, "epoch": 2715} {"train_loss": -12.48206901550293, "global_step": 456151, "epoch": 2715} {"train_loss": -12.045524597167969, "global_step": 456152, "epoch": 2715} {"train_loss": -12.483951568603516, "global_step": 456153, "epoch": 2715} {"train_loss": -12.143166542053223, "global_step": 456154, "epoch": 2715} {"train_loss": -12.160344123840332, "global_step": 456155, "epoch": 2715} {"train_loss": -11.571365356445312, "global_step": 456156, "epoch": 2715} {"train_loss": -12.113821029663086, "global_step": 456157, "epoch": 2715} {"train_loss": -12.052448272705078, "global_step": 456158, "epoch": 2715} {"train_loss": -12.198675155639648, "global_step": 456159, "epoch": 2715} {"train_loss": -12.371526718139648, "global_step": 456160, "epoch": 2715} {"train_loss": -12.123205184936523, "global_step": 456161, "epoch": 2715} {"train_loss": -12.377296447753906, "global_step": 456162, "epoch": 2715} {"train_loss": -11.818809509277344, "global_step": 456163, "epoch": 2715} {"train_loss": -12.53750228881836, "global_step": 456164, "epoch": 2715} {"train_loss": -12.019063949584961, "global_step": 456165, "epoch": 2715} {"train_loss": -12.75197696685791, "global_step": 456166, "epoch": 2715} {"train_loss": -12.07737922668457, "global_step": 456167, "epoch": 2715} {"train_loss": -12.370397567749023, "global_step": 456168, "epoch": 2715} {"train_loss": -12.392581939697266, "global_step": 456169, "epoch": 2715} {"train_loss": -12.22419548034668, "global_step": 456170, "epoch": 2715} {"train_loss": -12.831783294677734, "global_step": 456171, "epoch": 2715} {"train_loss": -12.419451713562012, "global_step": 456172, "epoch": 2715} {"train_loss": -12.497396469116211, "global_step": 456173, "epoch": 2715} {"train_loss": -12.666360855102539, "global_step": 456174, "epoch": 2715} {"train_loss": -12.17926025390625, "global_step": 456175, "epoch": 2715} {"train_loss": -12.564862251281738, "global_step": 456176, "epoch": 2715} {"train_loss": -11.976095199584961, "global_step": 456177, "epoch": 2715} {"train_loss": -12.281682014465332, "global_step": 456178, "epoch": 2715} {"train_loss": -12.733827590942383, "global_step": 456179, "epoch": 2715} {"train_loss": -12.118674278259277, "global_step": 456180, "epoch": 2715} {"train_loss": -12.71232795715332, "global_step": 456181, "epoch": 2715} {"train_loss": -12.284551620483398, "global_step": 456182, "epoch": 2715} {"train_loss": -12.610722541809082, "global_step": 456183, "epoch": 2715} {"train_loss": -12.359180450439453, "global_step": 456184, "epoch": 2715} {"train_loss": -12.34028148651123, "global_step": 456185, "epoch": 2715} {"train_loss": -12.558488845825195, "global_step": 456186, "epoch": 2715} {"train_loss": -12.564743995666504, "global_step": 456187, "epoch": 2715} {"train_loss": -12.504984855651855, "global_step": 456188, "epoch": 2715} {"train_loss": -12.363260269165039, "global_step": 456189, "epoch": 2715} {"train_loss": -12.752952575683594, "global_step": 456190, "epoch": 2715} {"train_loss": -12.465858459472656, "global_step": 456191, "epoch": 2715} {"train_loss": -12.509781837463379, "global_step": 456192, "epoch": 2715} {"train_loss": -12.684727668762207, "global_step": 456193, "epoch": 2715} {"train_loss": -12.569348335266113, "global_step": 456194, "epoch": 2715} {"train_loss": -12.802999496459961, "global_step": 456195, "epoch": 2715} {"train_loss": -12.682886123657227, "global_step": 456196, "epoch": 2715} {"train_loss": -12.789045333862305, "global_step": 456197, "epoch": 2715} {"train_loss": -12.805261611938477, "global_step": 456198, "epoch": 2715} {"train_loss": -12.724617004394531, "global_step": 456199, "epoch": 2715} {"train_loss": -12.86166763305664, "global_step": 456200, "epoch": 2715} {"train_loss": -12.63420295715332, "global_step": 456201, "epoch": 2715} {"train_loss": -12.978883743286133, "global_step": 456202, "epoch": 2715} {"train_loss": -12.749601364135742, "global_step": 456203, "epoch": 2715} {"train_loss": -12.83797836303711, "global_step": 456204, "epoch": 2715} {"train_loss": -12.794565200805664, "global_step": 456205, "epoch": 2715} {"train_loss": -12.844888687133789, "global_step": 456206, "epoch": 2715} {"train_loss": -12.385172843933105, "global_step": 456207, "epoch": 2715} {"train_loss": -12.9041166305542, "global_step": 456208, "epoch": 2715} {"train_loss": -12.537776947021484, "global_step": 456209, "epoch": 2715} {"train_loss": -12.636869430541992, "global_step": 456210, "epoch": 2715} {"train_loss": -12.958233833312988, "global_step": 456211, "epoch": 2715} {"train_loss": -12.618767738342285, "global_step": 456212, "epoch": 2715} {"train_loss": -12.753010749816895, "global_step": 456213, "epoch": 2715} {"train_loss": -12.812870025634766, "global_step": 456214, "epoch": 2715} {"train_loss": -12.697100639343262, "global_step": 456215, "epoch": 2715} {"train_loss": -12.897994995117188, "global_step": 456216, "epoch": 2715} {"train_loss": -12.768077850341797, "global_step": 456217, "epoch": 2715} {"train_loss": -12.83795166015625, "global_step": 456218, "epoch": 2715} {"train_loss": -12.758153915405273, "global_step": 456219, "epoch": 2715} {"train_loss": -12.594886779785156, "global_step": 456220, "epoch": 2715} {"train_loss": -12.572807312011719, "global_step": 456221, "epoch": 2715} {"train_loss": -12.309011459350586, "global_step": 456222, "epoch": 2715} {"train_loss": -12.475654602050781, "global_step": 456223, "epoch": 2715} {"train_loss": -12.861470222473145, "global_step": 456224, "epoch": 2715} {"train_loss": -12.57576847076416, "global_step": 456225, "epoch": 2715} {"train_loss": -12.578978538513184, "global_step": 456226, "epoch": 2715} {"train_loss": -12.293012619018555, "global_step": 456227, "epoch": 2715} {"train_loss": -12.459854125976562, "global_step": 456228, "epoch": 2715} {"train_loss": -12.420843124389648, "global_step": 456229, "epoch": 2715} {"train_loss": -12.58572006225586, "global_step": 456230, "epoch": 2715} {"train_loss": -12.284183502197266, "global_step": 456231, "epoch": 2715} {"train_loss": -12.961822509765625, "global_step": 456232, "epoch": 2715} {"train_loss": -12.861413955688477, "global_step": 456233, "epoch": 2715} {"train_loss": -12.49002742767334, "global_step": 456234, "epoch": 2715} {"train_loss": -12.346855163574219, "global_step": 456235, "epoch": 2715} {"train_loss": -12.828794479370117, "global_step": 456236, "epoch": 2715} {"train_loss": -12.670730590820312, "global_step": 456237, "epoch": 2715} {"train_loss": -12.952596664428711, "global_step": 456238, "epoch": 2715} {"train_loss": -12.349803924560547, "global_step": 456239, "epoch": 2715} {"train_loss": -11.844669342041016, "global_step": 456240, "epoch": 2715} {"train_loss": -12.350638389587402, "global_step": 456241, "epoch": 2715} {"train_loss": -12.838374137878418, "global_step": 456242, "epoch": 2715} {"train_loss": -12.802401542663574, "global_step": 456243, "epoch": 2715} {"train_loss": -12.79340934753418, "global_step": 456244, "epoch": 2715} {"train_loss": -12.747384071350098, "global_step": 456245, "epoch": 2715} {"train_loss": -12.739669799804688, "global_step": 456246, "epoch": 2715} {"train_loss": -12.437776565551758, "global_step": 456247, "epoch": 2715} {"train_loss": -12.192831993103027, "global_step": 456248, "epoch": 2715} {"train_loss": -12.524423599243164, "global_step": 456249, "epoch": 2715} {"train_loss": -12.67264175415039, "global_step": 456250, "epoch": 2715} {"train_loss": -12.934764862060547, "global_step": 456251, "epoch": 2715} {"train_loss": -12.847884178161621, "global_step": 456252, "epoch": 2715} {"train_loss": -12.506410598754883, "global_step": 456253, "epoch": 2715} {"train_loss": -12.828304290771484, "global_step": 456254, "epoch": 2715} {"train_loss": -12.724034309387207, "global_step": 456255, "epoch": 2715} {"train_loss": -12.463497161865234, "global_step": 456256, "epoch": 2715} {"train_loss": -12.10350513458252, "global_step": 456257, "epoch": 2715} {"train_loss": -12.766777038574219, "global_step": 456258, "epoch": 2715} {"train_loss": -12.175684928894043, "global_step": 456259, "epoch": 2715} {"train_loss": -11.300651550292969, "global_step": 456260, "epoch": 2715} {"train_loss": -12.215993881225586, "global_step": 456261, "epoch": 2715} {"train_loss": -12.936948776245117, "global_step": 456262, "epoch": 2715} {"train_loss": -12.177064895629883, "global_step": 456263, "epoch": 2715} {"train_loss": -11.279546737670898, "global_step": 456264, "epoch": 2715} {"train_loss": -11.596044540405273, "global_step": 456265, "epoch": 2715} {"train_loss": -12.614067077636719, "global_step": 456266, "epoch": 2715} {"train_loss": -12.591432571411133, "global_step": 456267, "epoch": 2715} {"train_loss": -12.562593460083008, "global_step": 456268, "epoch": 2715} {"train_loss": -12.576316833496094, "global_step": 456269, "epoch": 2715} {"train_loss": -12.640249252319336, "global_step": 456270, "epoch": 2715} {"train_loss": -12.149032592773438, "global_step": 456271, "epoch": 2715} {"train_loss": -12.696903228759766, "global_step": 456272, "epoch": 2715} {"train_loss": -12.631767272949219, "global_step": 456273, "epoch": 2715} {"train_loss": -12.74403190612793, "global_step": 456274, "epoch": 2715} {"train_loss": -12.625876426696777, "global_step": 456275, "epoch": 2715} {"train_loss": -12.379968643188477, "global_step": 456276, "epoch": 2715} {"train_loss": -12.308029174804688, "global_step": 456277, "epoch": 2715} {"train_loss": -11.375924110412598, "global_step": 456278, "epoch": 2715} {"train_loss": -11.967376708984375, "global_step": 456279, "epoch": 2715} {"train_loss": -12.135808944702148, "global_step": 456280, "epoch": 2715} {"train_loss": -11.804637908935547, "global_step": 456281, "epoch": 2715} {"train_loss": -12.64468765258789, "global_step": 456282, "epoch": 2715} {"train_loss": -12.477851867675781, "global_step": 456283, "epoch": 2715} {"train_loss": -12.166229248046875, "global_step": 456284, "epoch": 2715} {"train_loss": -12.464778900146484, "global_step": 456285, "epoch": 2715} {"train_loss": -12.574183464050293, "global_step": 456286, "epoch": 2715} {"train_loss": -12.32230525925046, "global_step": 456287, "epoch": 2715, "val_loss": 314669.1875, "train_action_mse_error": 1.1574461460113525} {"train_loss": -12.769994735717773, "global_step": 456288, "epoch": 2716} {"train_loss": -12.656728744506836, "global_step": 456289, "epoch": 2716} {"train_loss": -12.39030647277832, "global_step": 456290, "epoch": 2716} {"train_loss": -12.640020370483398, "global_step": 456291, "epoch": 2716} {"train_loss": -11.987630844116211, "global_step": 456292, "epoch": 2716} {"train_loss": -11.413931846618652, "global_step": 456293, "epoch": 2716} {"train_loss": -11.733068466186523, "global_step": 456294, "epoch": 2716} {"train_loss": -11.737574577331543, "global_step": 456295, "epoch": 2716} {"train_loss": -11.563377380371094, "global_step": 456296, "epoch": 2716} {"train_loss": -12.532934188842773, "global_step": 456297, "epoch": 2716} {"train_loss": -11.994362831115723, "global_step": 456298, "epoch": 2716} {"train_loss": -12.624218940734863, "global_step": 456299, "epoch": 2716} {"train_loss": -12.090158462524414, "global_step": 456300, "epoch": 2716} {"train_loss": -12.145076751708984, "global_step": 456301, "epoch": 2716} {"train_loss": -12.157261848449707, "global_step": 456302, "epoch": 2716} {"train_loss": -12.072468757629395, "global_step": 456303, "epoch": 2716} {"train_loss": -12.549905776977539, "global_step": 456304, "epoch": 2716} {"train_loss": -12.575745582580566, "global_step": 456305, "epoch": 2716} {"train_loss": -12.15580940246582, "global_step": 456306, "epoch": 2716} {"train_loss": -12.336783409118652, "global_step": 456307, "epoch": 2716} {"train_loss": -12.493446350097656, "global_step": 456308, "epoch": 2716} {"train_loss": -12.458065032958984, "global_step": 456309, "epoch": 2716} {"train_loss": -12.306783676147461, "global_step": 456310, "epoch": 2716} {"train_loss": -12.153435707092285, "global_step": 456311, "epoch": 2716} {"train_loss": -12.016990661621094, "global_step": 456312, "epoch": 2716} {"train_loss": -11.184255599975586, "global_step": 456313, "epoch": 2716} {"train_loss": -11.310507774353027, "global_step": 456314, "epoch": 2716} {"train_loss": -11.800775527954102, "global_step": 456315, "epoch": 2716} {"train_loss": -11.354131698608398, "global_step": 456316, "epoch": 2716} {"train_loss": -11.87851333618164, "global_step": 456317, "epoch": 2716} {"train_loss": -11.273000717163086, "global_step": 456318, "epoch": 2716} {"train_loss": -11.703747749328613, "global_step": 456319, "epoch": 2716} {"train_loss": -11.858221054077148, "global_step": 456320, "epoch": 2716} {"train_loss": -11.16754150390625, "global_step": 456321, "epoch": 2716} {"train_loss": -11.726423263549805, "global_step": 456322, "epoch": 2716} {"train_loss": -11.429884910583496, "global_step": 456323, "epoch": 2716} {"train_loss": -12.165769577026367, "global_step": 456324, "epoch": 2716} {"train_loss": -10.87468147277832, "global_step": 456325, "epoch": 2716} {"train_loss": -11.47961139678955, "global_step": 456326, "epoch": 2716} {"train_loss": -11.686429977416992, "global_step": 456327, "epoch": 2716} {"train_loss": -11.096832275390625, "global_step": 456328, "epoch": 2716} {"train_loss": -10.324386596679688, "global_step": 456329, "epoch": 2716} {"train_loss": -11.738137245178223, "global_step": 456330, "epoch": 2716} {"train_loss": -10.823272705078125, "global_step": 456331, "epoch": 2716} {"train_loss": -11.938308715820312, "global_step": 456332, "epoch": 2716} {"train_loss": -11.422621726989746, "global_step": 456333, "epoch": 2716} {"train_loss": -9.493703842163086, "global_step": 456334, "epoch": 2716} {"train_loss": -10.98074722290039, "global_step": 456335, "epoch": 2716} {"train_loss": -9.556510925292969, "global_step": 456336, "epoch": 2716} {"train_loss": -12.038032531738281, "global_step": 456337, "epoch": 2716} {"train_loss": -10.897383689880371, "global_step": 456338, "epoch": 2716} {"train_loss": -12.08916187286377, "global_step": 456339, "epoch": 2716} {"train_loss": -11.78781795501709, "global_step": 456340, "epoch": 2716} {"train_loss": -11.94533920288086, "global_step": 456341, "epoch": 2716} {"train_loss": -11.085013389587402, "global_step": 456342, "epoch": 2716} {"train_loss": -10.940546989440918, "global_step": 456343, "epoch": 2716} {"train_loss": -10.540454864501953, "global_step": 456344, "epoch": 2716} {"train_loss": -10.210241317749023, "global_step": 456345, "epoch": 2716} {"train_loss": -11.629120826721191, "global_step": 456346, "epoch": 2716} {"train_loss": -10.377412796020508, "global_step": 456347, "epoch": 2716} {"train_loss": -10.582239151000977, "global_step": 456348, "epoch": 2716} {"train_loss": -10.02410888671875, "global_step": 456349, "epoch": 2716} {"train_loss": -10.242790222167969, "global_step": 456350, "epoch": 2716} {"train_loss": -10.248472213745117, "global_step": 456351, "epoch": 2716} {"train_loss": -10.09023666381836, "global_step": 456352, "epoch": 2716} {"train_loss": -9.948841094970703, "global_step": 456353, "epoch": 2716} {"train_loss": -9.42534065246582, "global_step": 456354, "epoch": 2716} {"train_loss": -11.204961776733398, "global_step": 456355, "epoch": 2716} {"train_loss": -10.916458129882812, "global_step": 456356, "epoch": 2716} {"train_loss": -10.64761734008789, "global_step": 456357, "epoch": 2716} {"train_loss": -11.489644050598145, "global_step": 456358, "epoch": 2716} {"train_loss": -10.962814331054688, "global_step": 456359, "epoch": 2716} {"train_loss": -10.999174118041992, "global_step": 456360, "epoch": 2716} {"train_loss": -11.108745574951172, "global_step": 456361, "epoch": 2716} {"train_loss": -11.748250961303711, "global_step": 456362, "epoch": 2716} {"train_loss": -11.491640090942383, "global_step": 456363, "epoch": 2716} {"train_loss": -11.937325477600098, "global_step": 456364, "epoch": 2716} {"train_loss": -11.531656265258789, "global_step": 456365, "epoch": 2716} {"train_loss": -11.949926376342773, "global_step": 456366, "epoch": 2716} {"train_loss": -11.557886123657227, "global_step": 456367, "epoch": 2716} {"train_loss": -12.046907424926758, "global_step": 456368, "epoch": 2716} {"train_loss": -11.108946800231934, "global_step": 456369, "epoch": 2716} {"train_loss": -11.701044082641602, "global_step": 456370, "epoch": 2716} {"train_loss": -11.765161514282227, "global_step": 456371, "epoch": 2716} {"train_loss": -11.55947494506836, "global_step": 456372, "epoch": 2716} {"train_loss": -11.876058578491211, "global_step": 456373, "epoch": 2716} {"train_loss": -11.547374725341797, "global_step": 456374, "epoch": 2716} {"train_loss": -12.305804252624512, "global_step": 456375, "epoch": 2716} {"train_loss": -11.791635513305664, "global_step": 456376, "epoch": 2716} {"train_loss": -11.945039749145508, "global_step": 456377, "epoch": 2716} {"train_loss": -12.097098350524902, "global_step": 456378, "epoch": 2716} {"train_loss": -11.628046035766602, "global_step": 456379, "epoch": 2716} {"train_loss": -12.494256973266602, "global_step": 456380, "epoch": 2716} {"train_loss": -12.212246894836426, "global_step": 456381, "epoch": 2716} {"train_loss": -11.959453582763672, "global_step": 456382, "epoch": 2716} {"train_loss": -12.383328437805176, "global_step": 456383, "epoch": 2716} {"train_loss": -12.019170761108398, "global_step": 456384, "epoch": 2716} {"train_loss": -12.119556427001953, "global_step": 456385, "epoch": 2716} {"train_loss": -12.305763244628906, "global_step": 456386, "epoch": 2716} {"train_loss": -12.253290176391602, "global_step": 456387, "epoch": 2716} {"train_loss": -12.620109558105469, "global_step": 456388, "epoch": 2716} {"train_loss": -12.08944034576416, "global_step": 456389, "epoch": 2716} {"train_loss": -12.260099411010742, "global_step": 456390, "epoch": 2716} {"train_loss": -12.192495346069336, "global_step": 456391, "epoch": 2716} {"train_loss": -12.403908729553223, "global_step": 456392, "epoch": 2716} {"train_loss": -12.142594337463379, "global_step": 456393, "epoch": 2716} {"train_loss": -12.518211364746094, "global_step": 456394, "epoch": 2716} {"train_loss": -12.478599548339844, "global_step": 456395, "epoch": 2716} {"train_loss": -12.4899263381958, "global_step": 456396, "epoch": 2716} {"train_loss": -12.62312126159668, "global_step": 456397, "epoch": 2716} {"train_loss": -12.29853343963623, "global_step": 456398, "epoch": 2716} {"train_loss": -12.48875617980957, "global_step": 456399, "epoch": 2716} {"train_loss": -12.39718246459961, "global_step": 456400, "epoch": 2716} {"train_loss": -12.401514053344727, "global_step": 456401, "epoch": 2716} {"train_loss": -12.4181489944458, "global_step": 456402, "epoch": 2716} {"train_loss": -12.298775672912598, "global_step": 456403, "epoch": 2716} {"train_loss": -12.504487037658691, "global_step": 456404, "epoch": 2716} {"train_loss": -12.464035034179688, "global_step": 456405, "epoch": 2716} {"train_loss": -12.374746322631836, "global_step": 456406, "epoch": 2716} {"train_loss": -12.490190505981445, "global_step": 456407, "epoch": 2716} {"train_loss": -12.580977439880371, "global_step": 456408, "epoch": 2716} {"train_loss": -12.355443954467773, "global_step": 456409, "epoch": 2716} {"train_loss": -12.435483932495117, "global_step": 456410, "epoch": 2716} {"train_loss": -12.76620101928711, "global_step": 456411, "epoch": 2716} {"train_loss": -12.580132484436035, "global_step": 456412, "epoch": 2716} {"train_loss": -12.596851348876953, "global_step": 456413, "epoch": 2716} {"train_loss": -12.725261688232422, "global_step": 456414, "epoch": 2716} {"train_loss": -12.639318466186523, "global_step": 456415, "epoch": 2716} {"train_loss": -12.662425994873047, "global_step": 456416, "epoch": 2716} {"train_loss": -12.664787292480469, "global_step": 456417, "epoch": 2716} {"train_loss": -12.615715980529785, "global_step": 456418, "epoch": 2716} {"train_loss": -12.609790802001953, "global_step": 456419, "epoch": 2716} {"train_loss": -12.935489654541016, "global_step": 456420, "epoch": 2716} {"train_loss": -12.819067001342773, "global_step": 456421, "epoch": 2716} {"train_loss": -12.908812522888184, "global_step": 456422, "epoch": 2716} {"train_loss": -12.918035507202148, "global_step": 456423, "epoch": 2716} {"train_loss": -12.779991149902344, "global_step": 456424, "epoch": 2716} {"train_loss": -12.824782371520996, "global_step": 456425, "epoch": 2716} {"train_loss": -12.702348709106445, "global_step": 456426, "epoch": 2716} {"train_loss": -12.67570972442627, "global_step": 456427, "epoch": 2716} {"train_loss": -12.703012466430664, "global_step": 456428, "epoch": 2716} {"train_loss": -12.75311279296875, "global_step": 456429, "epoch": 2716} {"train_loss": -12.753307342529297, "global_step": 456430, "epoch": 2716} {"train_loss": -12.50739574432373, "global_step": 456431, "epoch": 2716} {"train_loss": -12.989701271057129, "global_step": 456432, "epoch": 2716} {"train_loss": -12.31350326538086, "global_step": 456433, "epoch": 2716} {"train_loss": -12.579351425170898, "global_step": 456434, "epoch": 2716} {"train_loss": -12.36124038696289, "global_step": 456435, "epoch": 2716} {"train_loss": -11.951924324035645, "global_step": 456436, "epoch": 2716} {"train_loss": -12.540731430053711, "global_step": 456437, "epoch": 2716} {"train_loss": -11.596864700317383, "global_step": 456438, "epoch": 2716} {"train_loss": -11.357918739318848, "global_step": 456439, "epoch": 2716} {"train_loss": -12.144217491149902, "global_step": 456440, "epoch": 2716} {"train_loss": -11.438665390014648, "global_step": 456441, "epoch": 2716} {"train_loss": -11.244277954101562, "global_step": 456442, "epoch": 2716} {"train_loss": -12.178569793701172, "global_step": 456443, "epoch": 2716} {"train_loss": -11.599886894226074, "global_step": 456444, "epoch": 2716} {"train_loss": -10.379287719726562, "global_step": 456445, "epoch": 2716} {"train_loss": -11.851982116699219, "global_step": 456446, "epoch": 2716} {"train_loss": -11.594892501831055, "global_step": 456447, "epoch": 2716} {"train_loss": -11.050098419189453, "global_step": 456448, "epoch": 2716} {"train_loss": -12.281030654907227, "global_step": 456449, "epoch": 2716} {"train_loss": -11.9514741897583, "global_step": 456450, "epoch": 2716} {"train_loss": -11.718069076538086, "global_step": 456451, "epoch": 2716} {"train_loss": -11.669415473937988, "global_step": 456452, "epoch": 2716} {"train_loss": -11.834394454956055, "global_step": 456453, "epoch": 2716} {"train_loss": -12.043320655822754, "global_step": 456454, "epoch": 2716} {"train_loss": -11.866313701584225, "global_step": 456455, "epoch": 2716, "val_loss": 311586.28125} {"train_loss": -12.191638946533203, "global_step": 456456, "epoch": 2717} {"train_loss": -11.66690444946289, "global_step": 456457, "epoch": 2717} {"train_loss": -12.169811248779297, "global_step": 456458, "epoch": 2717} {"train_loss": -11.475025177001953, "global_step": 456459, "epoch": 2717} {"train_loss": -10.785750389099121, "global_step": 456460, "epoch": 2717} {"train_loss": -12.008073806762695, "global_step": 456461, "epoch": 2717} {"train_loss": -11.294919967651367, "global_step": 456462, "epoch": 2717} {"train_loss": -12.258415222167969, "global_step": 456463, "epoch": 2717} {"train_loss": -10.750570297241211, "global_step": 456464, "epoch": 2717} {"train_loss": -12.270188331604004, "global_step": 456465, "epoch": 2717} {"train_loss": -11.389034271240234, "global_step": 456466, "epoch": 2717} {"train_loss": -12.046210289001465, "global_step": 456467, "epoch": 2717} {"train_loss": -12.03040885925293, "global_step": 456468, "epoch": 2717} {"train_loss": -12.172900199890137, "global_step": 456469, "epoch": 2717} {"train_loss": -11.862926483154297, "global_step": 456470, "epoch": 2717} {"train_loss": -12.316177368164062, "global_step": 456471, "epoch": 2717} {"train_loss": -12.312853813171387, "global_step": 456472, "epoch": 2717} {"train_loss": -12.30706787109375, "global_step": 456473, "epoch": 2717} {"train_loss": -11.953575134277344, "global_step": 456474, "epoch": 2717} {"train_loss": -12.161691665649414, "global_step": 456475, "epoch": 2717} {"train_loss": -12.105493545532227, "global_step": 456476, "epoch": 2717} {"train_loss": -12.238262176513672, "global_step": 456477, "epoch": 2717} {"train_loss": -12.561046600341797, "global_step": 456478, "epoch": 2717} {"train_loss": -12.02345085144043, "global_step": 456479, "epoch": 2717} {"train_loss": -12.464284896850586, "global_step": 456480, "epoch": 2717} {"train_loss": -12.036638259887695, "global_step": 456481, "epoch": 2717} {"train_loss": -11.905183792114258, "global_step": 456482, "epoch": 2717} {"train_loss": -12.367919921875, "global_step": 456483, "epoch": 2717} {"train_loss": -12.063612937927246, "global_step": 456484, "epoch": 2717} {"train_loss": -11.867779731750488, "global_step": 456485, "epoch": 2717} {"train_loss": -12.456369400024414, "global_step": 456486, "epoch": 2717} {"train_loss": -11.923216819763184, "global_step": 456487, "epoch": 2717} {"train_loss": -12.435686111450195, "global_step": 456488, "epoch": 2717} {"train_loss": -12.51388931274414, "global_step": 456489, "epoch": 2717} {"train_loss": -11.61605453491211, "global_step": 456490, "epoch": 2717} {"train_loss": -12.298938751220703, "global_step": 456491, "epoch": 2717} {"train_loss": -11.919136047363281, "global_step": 456492, "epoch": 2717} {"train_loss": -12.494037628173828, "global_step": 456493, "epoch": 2717} {"train_loss": -11.833711624145508, "global_step": 456494, "epoch": 2717} {"train_loss": -12.322456359863281, "global_step": 456495, "epoch": 2717} {"train_loss": -12.307268142700195, "global_step": 456496, "epoch": 2717} {"train_loss": -12.252130508422852, "global_step": 456497, "epoch": 2717} {"train_loss": -11.704882621765137, "global_step": 456498, "epoch": 2717} {"train_loss": -12.592954635620117, "global_step": 456499, "epoch": 2717} {"train_loss": -11.597230911254883, "global_step": 456500, "epoch": 2717} {"train_loss": -12.563772201538086, "global_step": 456501, "epoch": 2717} {"train_loss": -11.425605773925781, "global_step": 456502, "epoch": 2717} {"train_loss": -12.404146194458008, "global_step": 456503, "epoch": 2717} {"train_loss": -11.956681251525879, "global_step": 456504, "epoch": 2717} {"train_loss": -12.226751327514648, "global_step": 456505, "epoch": 2717} {"train_loss": -12.050239562988281, "global_step": 456506, "epoch": 2717} {"train_loss": -12.016688346862793, "global_step": 456507, "epoch": 2717} {"train_loss": -11.864070892333984, "global_step": 456508, "epoch": 2717} {"train_loss": -12.003582000732422, "global_step": 456509, "epoch": 2717} {"train_loss": -11.718294143676758, "global_step": 456510, "epoch": 2717} {"train_loss": -12.069479942321777, "global_step": 456511, "epoch": 2717} {"train_loss": -11.839946746826172, "global_step": 456512, "epoch": 2717} {"train_loss": -11.760374069213867, "global_step": 456513, "epoch": 2717} {"train_loss": -12.1541748046875, "global_step": 456514, "epoch": 2717} {"train_loss": -11.341609954833984, "global_step": 456515, "epoch": 2717} {"train_loss": -12.360984802246094, "global_step": 456516, "epoch": 2717} {"train_loss": -11.911201477050781, "global_step": 456517, "epoch": 2717} {"train_loss": -11.901388168334961, "global_step": 456518, "epoch": 2717} {"train_loss": -12.481842041015625, "global_step": 456519, "epoch": 2717} {"train_loss": -12.228803634643555, "global_step": 456520, "epoch": 2717} {"train_loss": -12.375384330749512, "global_step": 456521, "epoch": 2717} {"train_loss": -12.43589973449707, "global_step": 456522, "epoch": 2717} {"train_loss": -11.933833122253418, "global_step": 456523, "epoch": 2717} {"train_loss": -12.420049667358398, "global_step": 456524, "epoch": 2717} {"train_loss": -12.271930694580078, "global_step": 456525, "epoch": 2717} {"train_loss": -12.169046401977539, "global_step": 456526, "epoch": 2717} {"train_loss": -12.466211318969727, "global_step": 456527, "epoch": 2717} {"train_loss": -12.276323318481445, "global_step": 456528, "epoch": 2717} {"train_loss": -12.662216186523438, "global_step": 456529, "epoch": 2717} {"train_loss": -12.151222229003906, "global_step": 456530, "epoch": 2717} {"train_loss": -11.908218383789062, "global_step": 456531, "epoch": 2717} {"train_loss": -12.053592681884766, "global_step": 456532, "epoch": 2717} {"train_loss": -12.46348762512207, "global_step": 456533, "epoch": 2717} {"train_loss": -12.274300575256348, "global_step": 456534, "epoch": 2717} {"train_loss": -12.273107528686523, "global_step": 456535, "epoch": 2717} {"train_loss": -12.159687042236328, "global_step": 456536, "epoch": 2717} {"train_loss": -12.132314682006836, "global_step": 456537, "epoch": 2717} {"train_loss": -12.487150192260742, "global_step": 456538, "epoch": 2717} {"train_loss": -11.82863712310791, "global_step": 456539, "epoch": 2717} {"train_loss": -12.186626434326172, "global_step": 456540, "epoch": 2717} {"train_loss": -11.899871826171875, "global_step": 456541, "epoch": 2717} {"train_loss": -12.481281280517578, "global_step": 456542, "epoch": 2717} {"train_loss": -12.175627708435059, "global_step": 456543, "epoch": 2717} {"train_loss": -12.443365097045898, "global_step": 456544, "epoch": 2717} {"train_loss": -12.368545532226562, "global_step": 456545, "epoch": 2717} {"train_loss": -12.376321792602539, "global_step": 456546, "epoch": 2717} {"train_loss": -12.68022346496582, "global_step": 456547, "epoch": 2717} {"train_loss": -12.395225524902344, "global_step": 456548, "epoch": 2717} {"train_loss": -12.314205169677734, "global_step": 456549, "epoch": 2717} {"train_loss": -12.427725791931152, "global_step": 456550, "epoch": 2717} {"train_loss": -11.91185188293457, "global_step": 456551, "epoch": 2717} {"train_loss": -12.364490509033203, "global_step": 456552, "epoch": 2717} {"train_loss": -12.045196533203125, "global_step": 456553, "epoch": 2717} {"train_loss": -12.085331916809082, "global_step": 456554, "epoch": 2717} {"train_loss": -12.875602722167969, "global_step": 456555, "epoch": 2717} {"train_loss": -12.446285247802734, "global_step": 456556, "epoch": 2717} {"train_loss": -12.631050109863281, "global_step": 456557, "epoch": 2717} {"train_loss": -12.483663558959961, "global_step": 456558, "epoch": 2717} {"train_loss": -12.649368286132812, "global_step": 456559, "epoch": 2717} {"train_loss": -12.612987518310547, "global_step": 456560, "epoch": 2717} {"train_loss": -12.712374687194824, "global_step": 456561, "epoch": 2717} {"train_loss": -12.586064338684082, "global_step": 456562, "epoch": 2717} {"train_loss": -12.528020858764648, "global_step": 456563, "epoch": 2717} {"train_loss": -12.65267562866211, "global_step": 456564, "epoch": 2717} {"train_loss": -12.652877807617188, "global_step": 456565, "epoch": 2717} {"train_loss": -12.41628646850586, "global_step": 456566, "epoch": 2717} {"train_loss": -12.677656173706055, "global_step": 456567, "epoch": 2717} {"train_loss": -12.651268005371094, "global_step": 456568, "epoch": 2717} {"train_loss": -12.542783737182617, "global_step": 456569, "epoch": 2717} {"train_loss": -12.553594589233398, "global_step": 456570, "epoch": 2717} {"train_loss": -12.82260513305664, "global_step": 456571, "epoch": 2717} {"train_loss": -12.400857925415039, "global_step": 456572, "epoch": 2717} {"train_loss": -12.566673278808594, "global_step": 456573, "epoch": 2717} {"train_loss": -12.447059631347656, "global_step": 456574, "epoch": 2717} {"train_loss": -12.802775382995605, "global_step": 456575, "epoch": 2717} {"train_loss": -12.576345443725586, "global_step": 456576, "epoch": 2717} {"train_loss": -12.842133522033691, "global_step": 456577, "epoch": 2717} {"train_loss": -12.790382385253906, "global_step": 456578, "epoch": 2717} {"train_loss": -12.650324821472168, "global_step": 456579, "epoch": 2717} {"train_loss": -12.78133773803711, "global_step": 456580, "epoch": 2717} {"train_loss": -12.770963668823242, "global_step": 456581, "epoch": 2717} {"train_loss": -12.590629577636719, "global_step": 456582, "epoch": 2717} {"train_loss": -12.647499084472656, "global_step": 456583, "epoch": 2717} {"train_loss": -12.97066879272461, "global_step": 456584, "epoch": 2717} {"train_loss": -12.898839950561523, "global_step": 456585, "epoch": 2717} {"train_loss": -12.798112869262695, "global_step": 456586, "epoch": 2717} {"train_loss": -12.753252983093262, "global_step": 456587, "epoch": 2717} {"train_loss": -12.712974548339844, "global_step": 456588, "epoch": 2717} {"train_loss": -12.748540878295898, "global_step": 456589, "epoch": 2717} {"train_loss": -12.898653984069824, "global_step": 456590, "epoch": 2717} {"train_loss": -12.723320007324219, "global_step": 456591, "epoch": 2717} {"train_loss": -12.772119522094727, "global_step": 456592, "epoch": 2717} {"train_loss": -12.838980674743652, "global_step": 456593, "epoch": 2717} {"train_loss": -12.919236183166504, "global_step": 456594, "epoch": 2717} {"train_loss": -12.887386322021484, "global_step": 456595, "epoch": 2717} {"train_loss": -12.599724769592285, "global_step": 456596, "epoch": 2717} {"train_loss": -13.167440414428711, "global_step": 456597, "epoch": 2717} {"train_loss": -12.899909973144531, "global_step": 456598, "epoch": 2717} {"train_loss": -12.629555702209473, "global_step": 456599, "epoch": 2717} {"train_loss": -12.496040344238281, "global_step": 456600, "epoch": 2717} {"train_loss": -11.995524406433105, "global_step": 456601, "epoch": 2717} {"train_loss": -12.412799835205078, "global_step": 456602, "epoch": 2717} {"train_loss": -11.522615432739258, "global_step": 456603, "epoch": 2717} {"train_loss": -11.495149612426758, "global_step": 456604, "epoch": 2717} {"train_loss": -11.745643615722656, "global_step": 456605, "epoch": 2717} {"train_loss": -11.274736404418945, "global_step": 456606, "epoch": 2717} {"train_loss": -11.958793640136719, "global_step": 456607, "epoch": 2717} {"train_loss": -12.441662788391113, "global_step": 456608, "epoch": 2717} {"train_loss": -12.605040550231934, "global_step": 456609, "epoch": 2717} {"train_loss": -12.470356941223145, "global_step": 456610, "epoch": 2717} {"train_loss": -12.768348693847656, "global_step": 456611, "epoch": 2717} {"train_loss": -12.802603721618652, "global_step": 456612, "epoch": 2717} {"train_loss": -12.879426956176758, "global_step": 456613, "epoch": 2717} {"train_loss": -12.676010131835938, "global_step": 456614, "epoch": 2717} {"train_loss": -12.481122016906738, "global_step": 456615, "epoch": 2717} {"train_loss": -12.384292602539062, "global_step": 456616, "epoch": 2717} {"train_loss": -12.315064430236816, "global_step": 456617, "epoch": 2717} {"train_loss": -12.498510360717773, "global_step": 456618, "epoch": 2717} {"train_loss": -12.293956756591797, "global_step": 456619, "epoch": 2717} {"train_loss": -12.033173561096191, "global_step": 456620, "epoch": 2717} {"train_loss": -12.43214225769043, "global_step": 456621, "epoch": 2717} {"train_loss": -11.828171730041504, "global_step": 456622, "epoch": 2717} {"train_loss": -12.284535578319005, "global_step": 456623, "epoch": 2717, "val_loss": 314715.09375} {"train_loss": -11.987457275390625, "global_step": 456624, "epoch": 2718} {"train_loss": -11.782675743103027, "global_step": 456625, "epoch": 2718} {"train_loss": -12.051431655883789, "global_step": 456626, "epoch": 2718} {"train_loss": -12.38754653930664, "global_step": 456627, "epoch": 2718} {"train_loss": -12.045570373535156, "global_step": 456628, "epoch": 2718} {"train_loss": -12.238039016723633, "global_step": 456629, "epoch": 2718} {"train_loss": -12.414044380187988, "global_step": 456630, "epoch": 2718} {"train_loss": -12.073419570922852, "global_step": 456631, "epoch": 2718} {"train_loss": -12.42147159576416, "global_step": 456632, "epoch": 2718} {"train_loss": -11.941493034362793, "global_step": 456633, "epoch": 2718} {"train_loss": -12.624048233032227, "global_step": 456634, "epoch": 2718} {"train_loss": -12.212369918823242, "global_step": 456635, "epoch": 2718} {"train_loss": -12.406726837158203, "global_step": 456636, "epoch": 2718} {"train_loss": -12.239214897155762, "global_step": 456637, "epoch": 2718} {"train_loss": -12.462610244750977, "global_step": 456638, "epoch": 2718} {"train_loss": -12.307194709777832, "global_step": 456639, "epoch": 2718} {"train_loss": -11.51533317565918, "global_step": 456640, "epoch": 2718} {"train_loss": -11.186189651489258, "global_step": 456641, "epoch": 2718} {"train_loss": -12.612974166870117, "global_step": 456642, "epoch": 2718} {"train_loss": -11.54214859008789, "global_step": 456643, "epoch": 2718} {"train_loss": -10.846233367919922, "global_step": 456644, "epoch": 2718} {"train_loss": -11.872629165649414, "global_step": 456645, "epoch": 2718} {"train_loss": -12.52145767211914, "global_step": 456646, "epoch": 2718} {"train_loss": -11.629837036132812, "global_step": 456647, "epoch": 2718} {"train_loss": -12.556825637817383, "global_step": 456648, "epoch": 2718} {"train_loss": -12.253094673156738, "global_step": 456649, "epoch": 2718} {"train_loss": -11.953392028808594, "global_step": 456650, "epoch": 2718} {"train_loss": -12.525032043457031, "global_step": 456651, "epoch": 2718} {"train_loss": -12.090999603271484, "global_step": 456652, "epoch": 2718} {"train_loss": -12.232775688171387, "global_step": 456653, "epoch": 2718} {"train_loss": -12.480554580688477, "global_step": 456654, "epoch": 2718} {"train_loss": -11.581750869750977, "global_step": 456655, "epoch": 2718} {"train_loss": -12.151689529418945, "global_step": 456656, "epoch": 2718} {"train_loss": -12.168863296508789, "global_step": 456657, "epoch": 2718} {"train_loss": -10.834554672241211, "global_step": 456658, "epoch": 2718} {"train_loss": -11.74903678894043, "global_step": 456659, "epoch": 2718} {"train_loss": -12.034252166748047, "global_step": 456660, "epoch": 2718} {"train_loss": -11.269063949584961, "global_step": 456661, "epoch": 2718} {"train_loss": -12.462606430053711, "global_step": 456662, "epoch": 2718} {"train_loss": -11.421391487121582, "global_step": 456663, "epoch": 2718} {"train_loss": -11.972616195678711, "global_step": 456664, "epoch": 2718} {"train_loss": -12.005996704101562, "global_step": 456665, "epoch": 2718} {"train_loss": -11.862080574035645, "global_step": 456666, "epoch": 2718} {"train_loss": -12.539543151855469, "global_step": 456667, "epoch": 2718} {"train_loss": -11.971644401550293, "global_step": 456668, "epoch": 2718} {"train_loss": -12.175823211669922, "global_step": 456669, "epoch": 2718} {"train_loss": -11.69406795501709, "global_step": 456670, "epoch": 2718} {"train_loss": -12.631723403930664, "global_step": 456671, "epoch": 2718} {"train_loss": -12.220474243164062, "global_step": 456672, "epoch": 2718} {"train_loss": -11.827345848083496, "global_step": 456673, "epoch": 2718} {"train_loss": -12.290566444396973, "global_step": 456674, "epoch": 2718} {"train_loss": -12.025554656982422, "global_step": 456675, "epoch": 2718} {"train_loss": -12.197675704956055, "global_step": 456676, "epoch": 2718} {"train_loss": -11.838888168334961, "global_step": 456677, "epoch": 2718} {"train_loss": -12.150404930114746, "global_step": 456678, "epoch": 2718} {"train_loss": -11.692953109741211, "global_step": 456679, "epoch": 2718} {"train_loss": -12.154841423034668, "global_step": 456680, "epoch": 2718} {"train_loss": -11.785602569580078, "global_step": 456681, "epoch": 2718} {"train_loss": -12.031545639038086, "global_step": 456682, "epoch": 2718} {"train_loss": -12.385293006896973, "global_step": 456683, "epoch": 2718} {"train_loss": -11.103925704956055, "global_step": 456684, "epoch": 2718} {"train_loss": -11.034931182861328, "global_step": 456685, "epoch": 2718} {"train_loss": -12.196895599365234, "global_step": 456686, "epoch": 2718} {"train_loss": -11.622496604919434, "global_step": 456687, "epoch": 2718} {"train_loss": -11.92026138305664, "global_step": 456688, "epoch": 2718} {"train_loss": -12.047306060791016, "global_step": 456689, "epoch": 2718} {"train_loss": -11.538738250732422, "global_step": 456690, "epoch": 2718} {"train_loss": -12.034489631652832, "global_step": 456691, "epoch": 2718} {"train_loss": -12.239874839782715, "global_step": 456692, "epoch": 2718} {"train_loss": -11.471039772033691, "global_step": 456693, "epoch": 2718} {"train_loss": -12.04241943359375, "global_step": 456694, "epoch": 2718} {"train_loss": -11.709144592285156, "global_step": 456695, "epoch": 2718} {"train_loss": -11.935495376586914, "global_step": 456696, "epoch": 2718} {"train_loss": -11.800933837890625, "global_step": 456697, "epoch": 2718} {"train_loss": -12.07603645324707, "global_step": 456698, "epoch": 2718} {"train_loss": -12.066347122192383, "global_step": 456699, "epoch": 2718} {"train_loss": -12.085261344909668, "global_step": 456700, "epoch": 2718} {"train_loss": -11.901093482971191, "global_step": 456701, "epoch": 2718} {"train_loss": -11.943304061889648, "global_step": 456702, "epoch": 2718} {"train_loss": -12.005683898925781, "global_step": 456703, "epoch": 2718} {"train_loss": -11.527461051940918, "global_step": 456704, "epoch": 2718} {"train_loss": -11.887683868408203, "global_step": 456705, "epoch": 2718} {"train_loss": -12.432966232299805, "global_step": 456706, "epoch": 2718} {"train_loss": -12.066296577453613, "global_step": 456707, "epoch": 2718} {"train_loss": -12.008272171020508, "global_step": 456708, "epoch": 2718} {"train_loss": -11.523788452148438, "global_step": 456709, "epoch": 2718} {"train_loss": -11.846498489379883, "global_step": 456710, "epoch": 2718} {"train_loss": -12.045512199401855, "global_step": 456711, "epoch": 2718} {"train_loss": -11.343714714050293, "global_step": 456712, "epoch": 2718} {"train_loss": -11.883647918701172, "global_step": 456713, "epoch": 2718} {"train_loss": -11.565204620361328, "global_step": 456714, "epoch": 2718} {"train_loss": -12.54897403717041, "global_step": 456715, "epoch": 2718} {"train_loss": -12.040157318115234, "global_step": 456716, "epoch": 2718} {"train_loss": -12.232870101928711, "global_step": 456717, "epoch": 2718} {"train_loss": -12.07050895690918, "global_step": 456718, "epoch": 2718} {"train_loss": -12.72846794128418, "global_step": 456719, "epoch": 2718} {"train_loss": -12.511220932006836, "global_step": 456720, "epoch": 2718} {"train_loss": -12.466714859008789, "global_step": 456721, "epoch": 2718} {"train_loss": -12.587743759155273, "global_step": 456722, "epoch": 2718} {"train_loss": -12.447457313537598, "global_step": 456723, "epoch": 2718} {"train_loss": -12.459692001342773, "global_step": 456724, "epoch": 2718} {"train_loss": -12.202861785888672, "global_step": 456725, "epoch": 2718} {"train_loss": -12.795097351074219, "global_step": 456726, "epoch": 2718} {"train_loss": -12.465657234191895, "global_step": 456727, "epoch": 2718} {"train_loss": -12.743343353271484, "global_step": 456728, "epoch": 2718} {"train_loss": -12.545368194580078, "global_step": 456729, "epoch": 2718} {"train_loss": -12.20406723022461, "global_step": 456730, "epoch": 2718} {"train_loss": -12.610522270202637, "global_step": 456731, "epoch": 2718} {"train_loss": -12.111373901367188, "global_step": 456732, "epoch": 2718} {"train_loss": -12.738397598266602, "global_step": 456733, "epoch": 2718} {"train_loss": -12.646703720092773, "global_step": 456734, "epoch": 2718} {"train_loss": -12.586359024047852, "global_step": 456735, "epoch": 2718} {"train_loss": -12.426521301269531, "global_step": 456736, "epoch": 2718} {"train_loss": -12.649247169494629, "global_step": 456737, "epoch": 2718} {"train_loss": -12.756061553955078, "global_step": 456738, "epoch": 2718} {"train_loss": -12.85311508178711, "global_step": 456739, "epoch": 2718} {"train_loss": -12.834131240844727, "global_step": 456740, "epoch": 2718} {"train_loss": -12.941102027893066, "global_step": 456741, "epoch": 2718} {"train_loss": -12.769073486328125, "global_step": 456742, "epoch": 2718} {"train_loss": -12.694268226623535, "global_step": 456743, "epoch": 2718} {"train_loss": -12.822694778442383, "global_step": 456744, "epoch": 2718} {"train_loss": -12.885112762451172, "global_step": 456745, "epoch": 2718} {"train_loss": -12.843790054321289, "global_step": 456746, "epoch": 2718} {"train_loss": -12.97802448272705, "global_step": 456747, "epoch": 2718} {"train_loss": -12.742460250854492, "global_step": 456748, "epoch": 2718} {"train_loss": -12.847122192382812, "global_step": 456749, "epoch": 2718} {"train_loss": -12.680828094482422, "global_step": 456750, "epoch": 2718} {"train_loss": -12.928443908691406, "global_step": 456751, "epoch": 2718} {"train_loss": -12.985176086425781, "global_step": 456752, "epoch": 2718} {"train_loss": -12.986234664916992, "global_step": 456753, "epoch": 2718} {"train_loss": -13.129802703857422, "global_step": 456754, "epoch": 2718} {"train_loss": -12.866374015808105, "global_step": 456755, "epoch": 2718} {"train_loss": -13.083158493041992, "global_step": 456756, "epoch": 2718} {"train_loss": -12.725858688354492, "global_step": 456757, "epoch": 2718} {"train_loss": -12.974843978881836, "global_step": 456758, "epoch": 2718} {"train_loss": -12.928430557250977, "global_step": 456759, "epoch": 2718} {"train_loss": -12.763702392578125, "global_step": 456760, "epoch": 2718} {"train_loss": -12.730091094970703, "global_step": 456761, "epoch": 2718} {"train_loss": -12.884857177734375, "global_step": 456762, "epoch": 2718} {"train_loss": -12.495410919189453, "global_step": 456763, "epoch": 2718} {"train_loss": -12.65266227722168, "global_step": 456764, "epoch": 2718} {"train_loss": -12.891314506530762, "global_step": 456765, "epoch": 2718} {"train_loss": -12.919994354248047, "global_step": 456766, "epoch": 2718} {"train_loss": -13.035211563110352, "global_step": 456767, "epoch": 2718} {"train_loss": -13.101542472839355, "global_step": 456768, "epoch": 2718} {"train_loss": -12.90853500366211, "global_step": 456769, "epoch": 2718} {"train_loss": -12.789764404296875, "global_step": 456770, "epoch": 2718} {"train_loss": -13.176176071166992, "global_step": 456771, "epoch": 2718} {"train_loss": -12.892110824584961, "global_step": 456772, "epoch": 2718} {"train_loss": -12.302600860595703, "global_step": 456773, "epoch": 2718} {"train_loss": -11.922157287597656, "global_step": 456774, "epoch": 2718} {"train_loss": -12.59784984588623, "global_step": 456775, "epoch": 2718} {"train_loss": -12.94087028503418, "global_step": 456776, "epoch": 2718} {"train_loss": -12.155038833618164, "global_step": 456777, "epoch": 2718} {"train_loss": -12.273416519165039, "global_step": 456778, "epoch": 2718} {"train_loss": -12.807502746582031, "global_step": 456779, "epoch": 2718} {"train_loss": -12.832137107849121, "global_step": 456780, "epoch": 2718} {"train_loss": -12.632427215576172, "global_step": 456781, "epoch": 2718} {"train_loss": -12.548653602600098, "global_step": 456782, "epoch": 2718} {"train_loss": -12.842340469360352, "global_step": 456783, "epoch": 2718} {"train_loss": -12.433309555053711, "global_step": 456784, "epoch": 2718} {"train_loss": -12.52193546295166, "global_step": 456785, "epoch": 2718} {"train_loss": -12.161328315734863, "global_step": 456786, "epoch": 2718} {"train_loss": -12.7068452835083, "global_step": 456787, "epoch": 2718} {"train_loss": -12.836265563964844, "global_step": 456788, "epoch": 2718} {"train_loss": -12.78503704071045, "global_step": 456789, "epoch": 2718} {"train_loss": -12.765050888061523, "global_step": 456790, "epoch": 2718} {"train_loss": -12.295606896990822, "global_step": 456791, "epoch": 2718, "val_loss": 314341.75} {"train_loss": -12.765289306640625, "global_step": 456792, "epoch": 2719} {"train_loss": -12.706170082092285, "global_step": 456793, "epoch": 2719} {"train_loss": -12.825096130371094, "global_step": 456794, "epoch": 2719} {"train_loss": -12.831063270568848, "global_step": 456795, "epoch": 2719} {"train_loss": -12.753110885620117, "global_step": 456796, "epoch": 2719} {"train_loss": -12.879047393798828, "global_step": 456797, "epoch": 2719} {"train_loss": -12.72603988647461, "global_step": 456798, "epoch": 2719} {"train_loss": -12.754499435424805, "global_step": 456799, "epoch": 2719} {"train_loss": -12.9013090133667, "global_step": 456800, "epoch": 2719} {"train_loss": -12.779354095458984, "global_step": 456801, "epoch": 2719} {"train_loss": -12.66308879852295, "global_step": 456802, "epoch": 2719} {"train_loss": -12.950277328491211, "global_step": 456803, "epoch": 2719} {"train_loss": -12.602815628051758, "global_step": 456804, "epoch": 2719} {"train_loss": -12.636709213256836, "global_step": 456805, "epoch": 2719} {"train_loss": -12.493122100830078, "global_step": 456806, "epoch": 2719} {"train_loss": -12.604402542114258, "global_step": 456807, "epoch": 2719} {"train_loss": -12.620250701904297, "global_step": 456808, "epoch": 2719} {"train_loss": -12.708892822265625, "global_step": 456809, "epoch": 2719} {"train_loss": -12.092687606811523, "global_step": 456810, "epoch": 2719} {"train_loss": -12.084081649780273, "global_step": 456811, "epoch": 2719} {"train_loss": -12.023735046386719, "global_step": 456812, "epoch": 2719} {"train_loss": -12.757223129272461, "global_step": 456813, "epoch": 2719} {"train_loss": -12.126012802124023, "global_step": 456814, "epoch": 2719} {"train_loss": -12.264880180358887, "global_step": 456815, "epoch": 2719} {"train_loss": -11.965205192565918, "global_step": 456816, "epoch": 2719} {"train_loss": -11.928502082824707, "global_step": 456817, "epoch": 2719} {"train_loss": -11.671709060668945, "global_step": 456818, "epoch": 2719} {"train_loss": -12.84937572479248, "global_step": 456819, "epoch": 2719} {"train_loss": -11.55093002319336, "global_step": 456820, "epoch": 2719} {"train_loss": -10.61436653137207, "global_step": 456821, "epoch": 2719} {"train_loss": -11.823064804077148, "global_step": 456822, "epoch": 2719} {"train_loss": -10.419328689575195, "global_step": 456823, "epoch": 2719} {"train_loss": -10.307719230651855, "global_step": 456824, "epoch": 2719} {"train_loss": -11.472200393676758, "global_step": 456825, "epoch": 2719} {"train_loss": -10.690261840820312, "global_step": 456826, "epoch": 2719} {"train_loss": -10.151423454284668, "global_step": 456827, "epoch": 2719} {"train_loss": -10.359347343444824, "global_step": 456828, "epoch": 2719} {"train_loss": -11.420416831970215, "global_step": 456829, "epoch": 2719} {"train_loss": -10.964258193969727, "global_step": 456830, "epoch": 2719} {"train_loss": -11.118999481201172, "global_step": 456831, "epoch": 2719} {"train_loss": -11.09642219543457, "global_step": 456832, "epoch": 2719} {"train_loss": -9.973599433898926, "global_step": 456833, "epoch": 2719} {"train_loss": -9.390876770019531, "global_step": 456834, "epoch": 2719} {"train_loss": -10.459184646606445, "global_step": 456835, "epoch": 2719} {"train_loss": -11.035002708435059, "global_step": 456836, "epoch": 2719} {"train_loss": -9.69108772277832, "global_step": 456837, "epoch": 2719} {"train_loss": -9.259647369384766, "global_step": 456838, "epoch": 2719} {"train_loss": -9.59134292602539, "global_step": 456839, "epoch": 2719} {"train_loss": -8.207996368408203, "global_step": 456840, "epoch": 2719} {"train_loss": -8.1296968460083, "global_step": 456841, "epoch": 2719} {"train_loss": -8.725022315979004, "global_step": 456842, "epoch": 2719} {"train_loss": -8.722103118896484, "global_step": 456843, "epoch": 2719} {"train_loss": -9.289839744567871, "global_step": 456844, "epoch": 2719} {"train_loss": -10.488636016845703, "global_step": 456845, "epoch": 2719} {"train_loss": -9.772287368774414, "global_step": 456846, "epoch": 2719} {"train_loss": -10.904763221740723, "global_step": 456847, "epoch": 2719} {"train_loss": -10.167764663696289, "global_step": 456848, "epoch": 2719} {"train_loss": -10.944032669067383, "global_step": 456849, "epoch": 2719} {"train_loss": -10.747686386108398, "global_step": 456850, "epoch": 2719} {"train_loss": -10.958858489990234, "global_step": 456851, "epoch": 2719} {"train_loss": -10.290817260742188, "global_step": 456852, "epoch": 2719} {"train_loss": -11.657966613769531, "global_step": 456853, "epoch": 2719} {"train_loss": -11.275177955627441, "global_step": 456854, "epoch": 2719} {"train_loss": -11.49614143371582, "global_step": 456855, "epoch": 2719} {"train_loss": -9.836345672607422, "global_step": 456856, "epoch": 2719} {"train_loss": -10.39322566986084, "global_step": 456857, "epoch": 2719} {"train_loss": -10.529119491577148, "global_step": 456858, "epoch": 2719} {"train_loss": -11.879128456115723, "global_step": 456859, "epoch": 2719} {"train_loss": -11.504974365234375, "global_step": 456860, "epoch": 2719} {"train_loss": -11.833030700683594, "global_step": 456861, "epoch": 2719} {"train_loss": -11.683621406555176, "global_step": 456862, "epoch": 2719} {"train_loss": -11.874503135681152, "global_step": 456863, "epoch": 2719} {"train_loss": -11.838458061218262, "global_step": 456864, "epoch": 2719} {"train_loss": -11.34643268585205, "global_step": 456865, "epoch": 2719} {"train_loss": -11.918877601623535, "global_step": 456866, "epoch": 2719} {"train_loss": -11.786582946777344, "global_step": 456867, "epoch": 2719} {"train_loss": -12.067346572875977, "global_step": 456868, "epoch": 2719} {"train_loss": -11.949129104614258, "global_step": 456869, "epoch": 2719} {"train_loss": -12.112083435058594, "global_step": 456870, "epoch": 2719} {"train_loss": -11.969711303710938, "global_step": 456871, "epoch": 2719} {"train_loss": -12.181865692138672, "global_step": 456872, "epoch": 2719} {"train_loss": -12.213884353637695, "global_step": 456873, "epoch": 2719} {"train_loss": -12.187650680541992, "global_step": 456874, "epoch": 2719} {"train_loss": -12.399845123291016, "global_step": 456875, "epoch": 2719} {"train_loss": -12.149123191833496, "global_step": 456876, "epoch": 2719} {"train_loss": -12.509899139404297, "global_step": 456877, "epoch": 2719} {"train_loss": -12.514579772949219, "global_step": 456878, "epoch": 2719} {"train_loss": -12.187610626220703, "global_step": 456879, "epoch": 2719} {"train_loss": -12.6268892288208, "global_step": 456880, "epoch": 2719} {"train_loss": -12.213340759277344, "global_step": 456881, "epoch": 2719} {"train_loss": -12.5004243850708, "global_step": 456882, "epoch": 2719} {"train_loss": -12.467477798461914, "global_step": 456883, "epoch": 2719} {"train_loss": -12.481484413146973, "global_step": 456884, "epoch": 2719} {"train_loss": -12.603961944580078, "global_step": 456885, "epoch": 2719} {"train_loss": -12.480628967285156, "global_step": 456886, "epoch": 2719} {"train_loss": -12.506195068359375, "global_step": 456887, "epoch": 2719} {"train_loss": -12.581843376159668, "global_step": 456888, "epoch": 2719} {"train_loss": -12.472637176513672, "global_step": 456889, "epoch": 2719} {"train_loss": -12.525150299072266, "global_step": 456890, "epoch": 2719} {"train_loss": -12.390237808227539, "global_step": 456891, "epoch": 2719} {"train_loss": -12.001445770263672, "global_step": 456892, "epoch": 2719} {"train_loss": -12.436193466186523, "global_step": 456893, "epoch": 2719} {"train_loss": -12.247566223144531, "global_step": 456894, "epoch": 2719} {"train_loss": -12.383713722229004, "global_step": 456895, "epoch": 2719} {"train_loss": -12.499017715454102, "global_step": 456896, "epoch": 2719} {"train_loss": -12.64077377319336, "global_step": 456897, "epoch": 2719} {"train_loss": -12.576075553894043, "global_step": 456898, "epoch": 2719} {"train_loss": -12.447879791259766, "global_step": 456899, "epoch": 2719} {"train_loss": -12.483671188354492, "global_step": 456900, "epoch": 2719} {"train_loss": -12.855196952819824, "global_step": 456901, "epoch": 2719} {"train_loss": -12.592188835144043, "global_step": 456902, "epoch": 2719} {"train_loss": -12.533342361450195, "global_step": 456903, "epoch": 2719} {"train_loss": -12.696285247802734, "global_step": 456904, "epoch": 2719} {"train_loss": -12.769577980041504, "global_step": 456905, "epoch": 2719} {"train_loss": -12.670223236083984, "global_step": 456906, "epoch": 2719} {"train_loss": -12.71973991394043, "global_step": 456907, "epoch": 2719} {"train_loss": -12.51308536529541, "global_step": 456908, "epoch": 2719} {"train_loss": -12.607006072998047, "global_step": 456909, "epoch": 2719} {"train_loss": -12.62850284576416, "global_step": 456910, "epoch": 2719} {"train_loss": -12.840801239013672, "global_step": 456911, "epoch": 2719} {"train_loss": -12.691709518432617, "global_step": 456912, "epoch": 2719} {"train_loss": -12.629814147949219, "global_step": 456913, "epoch": 2719} {"train_loss": -12.743413925170898, "global_step": 456914, "epoch": 2719} {"train_loss": -12.31700611114502, "global_step": 456915, "epoch": 2719} {"train_loss": -12.694414138793945, "global_step": 456916, "epoch": 2719} {"train_loss": -12.717000961303711, "global_step": 456917, "epoch": 2719} {"train_loss": -12.68655776977539, "global_step": 456918, "epoch": 2719} {"train_loss": -12.693826675415039, "global_step": 456919, "epoch": 2719} {"train_loss": -12.74949836730957, "global_step": 456920, "epoch": 2719} {"train_loss": -12.8323335647583, "global_step": 456921, "epoch": 2719} {"train_loss": -12.626476287841797, "global_step": 456922, "epoch": 2719} {"train_loss": -12.458145141601562, "global_step": 456923, "epoch": 2719} {"train_loss": -12.71436882019043, "global_step": 456924, "epoch": 2719} {"train_loss": -12.696950912475586, "global_step": 456925, "epoch": 2719} {"train_loss": -12.72494125366211, "global_step": 456926, "epoch": 2719} {"train_loss": -12.73708724975586, "global_step": 456927, "epoch": 2719} {"train_loss": -12.740633010864258, "global_step": 456928, "epoch": 2719} {"train_loss": -12.908709526062012, "global_step": 456929, "epoch": 2719} {"train_loss": -12.841024398803711, "global_step": 456930, "epoch": 2719} {"train_loss": -12.788721084594727, "global_step": 456931, "epoch": 2719} {"train_loss": -12.770620346069336, "global_step": 456932, "epoch": 2719} {"train_loss": -12.817584991455078, "global_step": 456933, "epoch": 2719} {"train_loss": -12.8148832321167, "global_step": 456934, "epoch": 2719} {"train_loss": -12.702676773071289, "global_step": 456935, "epoch": 2719} {"train_loss": -12.794120788574219, "global_step": 456936, "epoch": 2719} {"train_loss": -12.707521438598633, "global_step": 456937, "epoch": 2719} {"train_loss": -12.56655216217041, "global_step": 456938, "epoch": 2719} {"train_loss": -12.66440486907959, "global_step": 456939, "epoch": 2719} {"train_loss": -12.66942024230957, "global_step": 456940, "epoch": 2719} {"train_loss": -11.58564567565918, "global_step": 456941, "epoch": 2719} {"train_loss": -12.2515230178833, "global_step": 456942, "epoch": 2719} {"train_loss": -12.801461219787598, "global_step": 456943, "epoch": 2719} {"train_loss": -11.836274147033691, "global_step": 456944, "epoch": 2719} {"train_loss": -12.679792404174805, "global_step": 456945, "epoch": 2719} {"train_loss": -12.564335823059082, "global_step": 456946, "epoch": 2719} {"train_loss": -12.340642929077148, "global_step": 456947, "epoch": 2719} {"train_loss": -13.118331909179688, "global_step": 456948, "epoch": 2719} {"train_loss": -12.509066581726074, "global_step": 456949, "epoch": 2719} {"train_loss": -12.924240112304688, "global_step": 456950, "epoch": 2719} {"train_loss": -12.790929794311523, "global_step": 456951, "epoch": 2719} {"train_loss": -12.968639373779297, "global_step": 456952, "epoch": 2719} {"train_loss": -12.61101245880127, "global_step": 456953, "epoch": 2719} {"train_loss": -12.77318000793457, "global_step": 456954, "epoch": 2719} {"train_loss": -12.35560417175293, "global_step": 456955, "epoch": 2719} {"train_loss": -12.709209442138672, "global_step": 456956, "epoch": 2719} {"train_loss": -12.470314025878906, "global_step": 456957, "epoch": 2719} {"train_loss": -12.531139373779297, "global_step": 456958, "epoch": 2719} {"train_loss": -11.994784514109293, "global_step": 456959, "epoch": 2719, "val_loss": 312206.28125} {"train_loss": -11.951775550842285, "global_step": 456960, "epoch": 2720} {"train_loss": -12.632485389709473, "global_step": 456961, "epoch": 2720} {"train_loss": -12.557967185974121, "global_step": 456962, "epoch": 2720} {"train_loss": -12.725799560546875, "global_step": 456963, "epoch": 2720} {"train_loss": -12.802716255187988, "global_step": 456964, "epoch": 2720} {"train_loss": -12.677011489868164, "global_step": 456965, "epoch": 2720} {"train_loss": -12.693958282470703, "global_step": 456966, "epoch": 2720} {"train_loss": -12.586099624633789, "global_step": 456967, "epoch": 2720} {"train_loss": -12.756473541259766, "global_step": 456968, "epoch": 2720} {"train_loss": -12.73011589050293, "global_step": 456969, "epoch": 2720} {"train_loss": -12.3675537109375, "global_step": 456970, "epoch": 2720} {"train_loss": -12.699257850646973, "global_step": 456971, "epoch": 2720} {"train_loss": -12.576839447021484, "global_step": 456972, "epoch": 2720} {"train_loss": -12.284521102905273, "global_step": 456973, "epoch": 2720} {"train_loss": -12.648831367492676, "global_step": 456974, "epoch": 2720} {"train_loss": -11.9835205078125, "global_step": 456975, "epoch": 2720} {"train_loss": -12.0765962600708, "global_step": 456976, "epoch": 2720} {"train_loss": -12.753950119018555, "global_step": 456977, "epoch": 2720} {"train_loss": -11.507984161376953, "global_step": 456978, "epoch": 2720} {"train_loss": -10.694337844848633, "global_step": 456979, "epoch": 2720} {"train_loss": -12.925520896911621, "global_step": 456980, "epoch": 2720} {"train_loss": -9.965316772460938, "global_step": 456981, "epoch": 2720} {"train_loss": -11.620637893676758, "global_step": 456982, "epoch": 2720} {"train_loss": -11.310091018676758, "global_step": 456983, "epoch": 2720} {"train_loss": -8.751282691955566, "global_step": 456984, "epoch": 2720} {"train_loss": -10.540582656860352, "global_step": 456985, "epoch": 2720} {"train_loss": -11.623443603515625, "global_step": 456986, "epoch": 2720} {"train_loss": -10.150659561157227, "global_step": 456987, "epoch": 2720} {"train_loss": -9.894481658935547, "global_step": 456988, "epoch": 2720} {"train_loss": -9.833045959472656, "global_step": 456989, "epoch": 2720} {"train_loss": -9.53826904296875, "global_step": 456990, "epoch": 2720} {"train_loss": -11.596355438232422, "global_step": 456991, "epoch": 2720} {"train_loss": -9.568368911743164, "global_step": 456992, "epoch": 2720} {"train_loss": -11.375398635864258, "global_step": 456993, "epoch": 2720} {"train_loss": -10.873992919921875, "global_step": 456994, "epoch": 2720} {"train_loss": -11.920680046081543, "global_step": 456995, "epoch": 2720} {"train_loss": -11.319581985473633, "global_step": 456996, "epoch": 2720} {"train_loss": -11.503053665161133, "global_step": 456997, "epoch": 2720} {"train_loss": -11.470787048339844, "global_step": 456998, "epoch": 2720} {"train_loss": -12.202491760253906, "global_step": 456999, "epoch": 2720} {"train_loss": -10.936775207519531, "global_step": 457000, "epoch": 2720} {"train_loss": -10.865421295166016, "global_step": 457001, "epoch": 2720} {"train_loss": -11.911672592163086, "global_step": 457002, "epoch": 2720} {"train_loss": -11.034120559692383, "global_step": 457003, "epoch": 2720} {"train_loss": -10.319695472717285, "global_step": 457004, "epoch": 2720} {"train_loss": -11.154542922973633, "global_step": 457005, "epoch": 2720} {"train_loss": -11.019481658935547, "global_step": 457006, "epoch": 2720} {"train_loss": -10.893598556518555, "global_step": 457007, "epoch": 2720} {"train_loss": -10.991193771362305, "global_step": 457008, "epoch": 2720} {"train_loss": -10.462556838989258, "global_step": 457009, "epoch": 2720} {"train_loss": -11.43307113647461, "global_step": 457010, "epoch": 2720} {"train_loss": -11.680170059204102, "global_step": 457011, "epoch": 2720} {"train_loss": -11.718994140625, "global_step": 457012, "epoch": 2720} {"train_loss": -11.100334167480469, "global_step": 457013, "epoch": 2720} {"train_loss": -11.298995971679688, "global_step": 457014, "epoch": 2720} {"train_loss": -12.022357940673828, "global_step": 457015, "epoch": 2720} {"train_loss": -11.874645233154297, "global_step": 457016, "epoch": 2720} {"train_loss": -12.044235229492188, "global_step": 457017, "epoch": 2720} {"train_loss": -12.036131858825684, "global_step": 457018, "epoch": 2720} {"train_loss": -12.239572525024414, "global_step": 457019, "epoch": 2720} {"train_loss": -11.988720893859863, "global_step": 457020, "epoch": 2720} {"train_loss": -12.418607711791992, "global_step": 457021, "epoch": 2720} {"train_loss": -12.253002166748047, "global_step": 457022, "epoch": 2720} {"train_loss": -11.958005905151367, "global_step": 457023, "epoch": 2720} {"train_loss": -12.244085311889648, "global_step": 457024, "epoch": 2720} {"train_loss": -11.770235061645508, "global_step": 457025, "epoch": 2720} {"train_loss": -12.500638961791992, "global_step": 457026, "epoch": 2720} {"train_loss": -11.881027221679688, "global_step": 457027, "epoch": 2720} {"train_loss": -12.362953186035156, "global_step": 457028, "epoch": 2720} {"train_loss": -11.93467903137207, "global_step": 457029, "epoch": 2720} {"train_loss": -12.091874122619629, "global_step": 457030, "epoch": 2720} {"train_loss": -12.21277904510498, "global_step": 457031, "epoch": 2720} {"train_loss": -12.008735656738281, "global_step": 457032, "epoch": 2720} {"train_loss": -12.025116920471191, "global_step": 457033, "epoch": 2720} {"train_loss": -12.425172805786133, "global_step": 457034, "epoch": 2720} {"train_loss": -11.680305480957031, "global_step": 457035, "epoch": 2720} {"train_loss": -12.43819808959961, "global_step": 457036, "epoch": 2720} {"train_loss": -12.093513488769531, "global_step": 457037, "epoch": 2720} {"train_loss": -12.10300064086914, "global_step": 457038, "epoch": 2720} {"train_loss": -12.140584945678711, "global_step": 457039, "epoch": 2720} {"train_loss": -12.25632095336914, "global_step": 457040, "epoch": 2720} {"train_loss": -12.007843017578125, "global_step": 457041, "epoch": 2720} {"train_loss": -12.777073860168457, "global_step": 457042, "epoch": 2720} {"train_loss": -12.124773025512695, "global_step": 457043, "epoch": 2720} {"train_loss": -12.44051456451416, "global_step": 457044, "epoch": 2720} {"train_loss": -12.182851791381836, "global_step": 457045, "epoch": 2720} {"train_loss": -12.372169494628906, "global_step": 457046, "epoch": 2720} {"train_loss": -12.599363327026367, "global_step": 457047, "epoch": 2720} {"train_loss": -12.037906646728516, "global_step": 457048, "epoch": 2720} {"train_loss": -12.262439727783203, "global_step": 457049, "epoch": 2720} {"train_loss": -12.553292274475098, "global_step": 457050, "epoch": 2720} {"train_loss": -12.123428344726562, "global_step": 457051, "epoch": 2720} {"train_loss": -12.706195831298828, "global_step": 457052, "epoch": 2720} {"train_loss": -12.232329368591309, "global_step": 457053, "epoch": 2720} {"train_loss": -12.334823608398438, "global_step": 457054, "epoch": 2720} {"train_loss": -12.394201278686523, "global_step": 457055, "epoch": 2720} {"train_loss": -12.357976913452148, "global_step": 457056, "epoch": 2720} {"train_loss": -12.473965644836426, "global_step": 457057, "epoch": 2720} {"train_loss": -12.612748146057129, "global_step": 457058, "epoch": 2720} {"train_loss": -12.19041633605957, "global_step": 457059, "epoch": 2720} {"train_loss": -12.74722957611084, "global_step": 457060, "epoch": 2720} {"train_loss": -12.236143112182617, "global_step": 457061, "epoch": 2720} {"train_loss": -12.12756061553955, "global_step": 457062, "epoch": 2720} {"train_loss": -12.762097358703613, "global_step": 457063, "epoch": 2720} {"train_loss": -12.288179397583008, "global_step": 457064, "epoch": 2720} {"train_loss": -12.619638442993164, "global_step": 457065, "epoch": 2720} {"train_loss": -12.53062629699707, "global_step": 457066, "epoch": 2720} {"train_loss": -12.148849487304688, "global_step": 457067, "epoch": 2720} {"train_loss": -11.943853378295898, "global_step": 457068, "epoch": 2720} {"train_loss": -12.033332824707031, "global_step": 457069, "epoch": 2720} {"train_loss": -11.928314208984375, "global_step": 457070, "epoch": 2720} {"train_loss": -11.977989196777344, "global_step": 457071, "epoch": 2720} {"train_loss": -12.157520294189453, "global_step": 457072, "epoch": 2720} {"train_loss": -11.954119682312012, "global_step": 457073, "epoch": 2720} {"train_loss": -12.620233535766602, "global_step": 457074, "epoch": 2720} {"train_loss": -11.48036003112793, "global_step": 457075, "epoch": 2720} {"train_loss": -12.205045700073242, "global_step": 457076, "epoch": 2720} {"train_loss": -12.143776893615723, "global_step": 457077, "epoch": 2720} {"train_loss": -11.894035339355469, "global_step": 457078, "epoch": 2720} {"train_loss": -12.17398452758789, "global_step": 457079, "epoch": 2720} {"train_loss": -11.854372024536133, "global_step": 457080, "epoch": 2720} {"train_loss": -12.019927024841309, "global_step": 457081, "epoch": 2720} {"train_loss": -12.464299201965332, "global_step": 457082, "epoch": 2720} {"train_loss": -12.316167831420898, "global_step": 457083, "epoch": 2720} {"train_loss": -12.354393005371094, "global_step": 457084, "epoch": 2720} {"train_loss": -12.560380935668945, "global_step": 457085, "epoch": 2720} {"train_loss": -11.966184616088867, "global_step": 457086, "epoch": 2720} {"train_loss": -12.596762657165527, "global_step": 457087, "epoch": 2720} {"train_loss": -12.114933967590332, "global_step": 457088, "epoch": 2720} {"train_loss": -12.579878807067871, "global_step": 457089, "epoch": 2720} {"train_loss": -12.386308670043945, "global_step": 457090, "epoch": 2720} {"train_loss": -12.358019828796387, "global_step": 457091, "epoch": 2720} {"train_loss": -12.907537460327148, "global_step": 457092, "epoch": 2720} {"train_loss": -12.480062484741211, "global_step": 457093, "epoch": 2720} {"train_loss": -12.681178092956543, "global_step": 457094, "epoch": 2720} {"train_loss": -12.553377151489258, "global_step": 457095, "epoch": 2720} {"train_loss": -12.677062034606934, "global_step": 457096, "epoch": 2720} {"train_loss": -12.881753921508789, "global_step": 457097, "epoch": 2720} {"train_loss": -12.507999420166016, "global_step": 457098, "epoch": 2720} {"train_loss": -12.577377319335938, "global_step": 457099, "epoch": 2720} {"train_loss": -12.748846054077148, "global_step": 457100, "epoch": 2720} {"train_loss": -12.605125427246094, "global_step": 457101, "epoch": 2720} {"train_loss": -12.370765686035156, "global_step": 457102, "epoch": 2720} {"train_loss": -12.538171768188477, "global_step": 457103, "epoch": 2720} {"train_loss": -12.327642440795898, "global_step": 457104, "epoch": 2720} {"train_loss": -12.578741073608398, "global_step": 457105, "epoch": 2720} {"train_loss": -12.686715126037598, "global_step": 457106, "epoch": 2720} {"train_loss": -12.673198699951172, "global_step": 457107, "epoch": 2720} {"train_loss": -12.768165588378906, "global_step": 457108, "epoch": 2720} {"train_loss": -12.740842819213867, "global_step": 457109, "epoch": 2720} {"train_loss": -12.787921905517578, "global_step": 457110, "epoch": 2720} {"train_loss": -12.827433586120605, "global_step": 457111, "epoch": 2720} {"train_loss": -12.688102722167969, "global_step": 457112, "epoch": 2720} {"train_loss": -12.951637268066406, "global_step": 457113, "epoch": 2720} {"train_loss": -12.860336303710938, "global_step": 457114, "epoch": 2720} {"train_loss": -13.040088653564453, "global_step": 457115, "epoch": 2720} {"train_loss": -12.6165771484375, "global_step": 457116, "epoch": 2720} {"train_loss": -12.613680839538574, "global_step": 457117, "epoch": 2720} {"train_loss": -12.990653991699219, "global_step": 457118, "epoch": 2720} {"train_loss": -12.641203880310059, "global_step": 457119, "epoch": 2720} {"train_loss": -12.419609069824219, "global_step": 457120, "epoch": 2720} {"train_loss": -12.3731689453125, "global_step": 457121, "epoch": 2720} {"train_loss": -12.558753967285156, "global_step": 457122, "epoch": 2720} {"train_loss": -12.71499252319336, "global_step": 457123, "epoch": 2720} {"train_loss": -11.980168342590332, "global_step": 457124, "epoch": 2720} {"train_loss": -12.047040939331055, "global_step": 457125, "epoch": 2720} {"train_loss": -11.741954803466797, "global_step": 457126, "epoch": 2720} {"train_loss": -12.066504841759091, "global_step": 457127, "epoch": 2720, "val_loss": 313334.4375, "train_action_mse_error": 1.7364221811294556} {"train_loss": -12.517849922180176, "global_step": 457128, "epoch": 2721} {"train_loss": -12.364593505859375, "global_step": 457129, "epoch": 2721} {"train_loss": -12.80429744720459, "global_step": 457130, "epoch": 2721} {"train_loss": -11.91294002532959, "global_step": 457131, "epoch": 2721} {"train_loss": -12.576372146606445, "global_step": 457132, "epoch": 2721} {"train_loss": -12.241411209106445, "global_step": 457133, "epoch": 2721} {"train_loss": -11.457149505615234, "global_step": 457134, "epoch": 2721} {"train_loss": -12.208861351013184, "global_step": 457135, "epoch": 2721} {"train_loss": -12.257176399230957, "global_step": 457136, "epoch": 2721} {"train_loss": -11.500328063964844, "global_step": 457137, "epoch": 2721} {"train_loss": -11.876361846923828, "global_step": 457138, "epoch": 2721} {"train_loss": -11.770135879516602, "global_step": 457139, "epoch": 2721} {"train_loss": -12.025846481323242, "global_step": 457140, "epoch": 2721} {"train_loss": -12.075152397155762, "global_step": 457141, "epoch": 2721} {"train_loss": -12.831389427185059, "global_step": 457142, "epoch": 2721} {"train_loss": -11.988910675048828, "global_step": 457143, "epoch": 2721} {"train_loss": -11.498966217041016, "global_step": 457144, "epoch": 2721} {"train_loss": -12.53624439239502, "global_step": 457145, "epoch": 2721} {"train_loss": -12.628931045532227, "global_step": 457146, "epoch": 2721} {"train_loss": -12.518157958984375, "global_step": 457147, "epoch": 2721} {"train_loss": -12.312803268432617, "global_step": 457148, "epoch": 2721} {"train_loss": -12.577492713928223, "global_step": 457149, "epoch": 2721} {"train_loss": -12.337800979614258, "global_step": 457150, "epoch": 2721} {"train_loss": -12.611547470092773, "global_step": 457151, "epoch": 2721} {"train_loss": -12.056536674499512, "global_step": 457152, "epoch": 2721} {"train_loss": -12.336639404296875, "global_step": 457153, "epoch": 2721} {"train_loss": -12.524867057800293, "global_step": 457154, "epoch": 2721} {"train_loss": -12.444784164428711, "global_step": 457155, "epoch": 2721} {"train_loss": -12.326815605163574, "global_step": 457156, "epoch": 2721} {"train_loss": -11.979865074157715, "global_step": 457157, "epoch": 2721} {"train_loss": -12.428390502929688, "global_step": 457158, "epoch": 2721} {"train_loss": -12.49080753326416, "global_step": 457159, "epoch": 2721} {"train_loss": -12.084566116333008, "global_step": 457160, "epoch": 2721} {"train_loss": -12.135992050170898, "global_step": 457161, "epoch": 2721} {"train_loss": -12.713447570800781, "global_step": 457162, "epoch": 2721} {"train_loss": -12.42331600189209, "global_step": 457163, "epoch": 2721} {"train_loss": -12.489638328552246, "global_step": 457164, "epoch": 2721} {"train_loss": -12.847822189331055, "global_step": 457165, "epoch": 2721} {"train_loss": -12.754307746887207, "global_step": 457166, "epoch": 2721} {"train_loss": -12.591140747070312, "global_step": 457167, "epoch": 2721} {"train_loss": -12.849393844604492, "global_step": 457168, "epoch": 2721} {"train_loss": -12.587738990783691, "global_step": 457169, "epoch": 2721} {"train_loss": -11.662995338439941, "global_step": 457170, "epoch": 2721} {"train_loss": -12.837442398071289, "global_step": 457171, "epoch": 2721} {"train_loss": -12.482133865356445, "global_step": 457172, "epoch": 2721} {"train_loss": -12.105020523071289, "global_step": 457173, "epoch": 2721} {"train_loss": -12.787739753723145, "global_step": 457174, "epoch": 2721} {"train_loss": -12.987508773803711, "global_step": 457175, "epoch": 2721} {"train_loss": -12.605903625488281, "global_step": 457176, "epoch": 2721} {"train_loss": -12.798870086669922, "global_step": 457177, "epoch": 2721} {"train_loss": -12.663505554199219, "global_step": 457178, "epoch": 2721} {"train_loss": -12.564227104187012, "global_step": 457179, "epoch": 2721} {"train_loss": -12.736305236816406, "global_step": 457180, "epoch": 2721} {"train_loss": -12.724616050720215, "global_step": 457181, "epoch": 2721} {"train_loss": -12.729963302612305, "global_step": 457182, "epoch": 2721} {"train_loss": -12.874863624572754, "global_step": 457183, "epoch": 2721} {"train_loss": -13.063591003417969, "global_step": 457184, "epoch": 2721} {"train_loss": -12.940479278564453, "global_step": 457185, "epoch": 2721} {"train_loss": -12.961368560791016, "global_step": 457186, "epoch": 2721} {"train_loss": -12.98999309539795, "global_step": 457187, "epoch": 2721} {"train_loss": -12.785242080688477, "global_step": 457188, "epoch": 2721} {"train_loss": -12.843944549560547, "global_step": 457189, "epoch": 2721} {"train_loss": -12.844345092773438, "global_step": 457190, "epoch": 2721} {"train_loss": -12.908329010009766, "global_step": 457191, "epoch": 2721} {"train_loss": -12.717342376708984, "global_step": 457192, "epoch": 2721} {"train_loss": -12.686430931091309, "global_step": 457193, "epoch": 2721} {"train_loss": -12.950952529907227, "global_step": 457194, "epoch": 2721} {"train_loss": -12.71093463897705, "global_step": 457195, "epoch": 2721} {"train_loss": -12.723241806030273, "global_step": 457196, "epoch": 2721} {"train_loss": -12.768939971923828, "global_step": 457197, "epoch": 2721} {"train_loss": -12.918018341064453, "global_step": 457198, "epoch": 2721} {"train_loss": -12.91241455078125, "global_step": 457199, "epoch": 2721} {"train_loss": -12.890243530273438, "global_step": 457200, "epoch": 2721} {"train_loss": -12.661090850830078, "global_step": 457201, "epoch": 2721} {"train_loss": -12.819718360900879, "global_step": 457202, "epoch": 2721} {"train_loss": -13.036266326904297, "global_step": 457203, "epoch": 2721} {"train_loss": -12.97121810913086, "global_step": 457204, "epoch": 2721} {"train_loss": -12.7623872756958, "global_step": 457205, "epoch": 2721} {"train_loss": -12.92091178894043, "global_step": 457206, "epoch": 2721} {"train_loss": -12.970455169677734, "global_step": 457207, "epoch": 2721} {"train_loss": -12.615029335021973, "global_step": 457208, "epoch": 2721} {"train_loss": -12.774465560913086, "global_step": 457209, "epoch": 2721} {"train_loss": -12.845020294189453, "global_step": 457210, "epoch": 2721} {"train_loss": -12.983318328857422, "global_step": 457211, "epoch": 2721} {"train_loss": -12.003849029541016, "global_step": 457212, "epoch": 2721} {"train_loss": -11.722394943237305, "global_step": 457213, "epoch": 2721} {"train_loss": -11.640121459960938, "global_step": 457214, "epoch": 2721} {"train_loss": -12.568230628967285, "global_step": 457215, "epoch": 2721} {"train_loss": -12.871192932128906, "global_step": 457216, "epoch": 2721} {"train_loss": -11.615883827209473, "global_step": 457217, "epoch": 2721} {"train_loss": -10.029071807861328, "global_step": 457218, "epoch": 2721} {"train_loss": -11.32049560546875, "global_step": 457219, "epoch": 2721} {"train_loss": -8.513238906860352, "global_step": 457220, "epoch": 2721} {"train_loss": -9.085958480834961, "global_step": 457221, "epoch": 2721} {"train_loss": -7.807954788208008, "global_step": 457222, "epoch": 2721} {"train_loss": -8.99550724029541, "global_step": 457223, "epoch": 2721} {"train_loss": -8.240875244140625, "global_step": 457224, "epoch": 2721} {"train_loss": -7.762420654296875, "global_step": 457225, "epoch": 2721} {"train_loss": -10.370405197143555, "global_step": 457226, "epoch": 2721} {"train_loss": -9.581192016601562, "global_step": 457227, "epoch": 2721} {"train_loss": -9.501180648803711, "global_step": 457228, "epoch": 2721} {"train_loss": -9.35551643371582, "global_step": 457229, "epoch": 2721} {"train_loss": -9.345062255859375, "global_step": 457230, "epoch": 2721} {"train_loss": -8.525575637817383, "global_step": 457231, "epoch": 2721} {"train_loss": -10.900425910949707, "global_step": 457232, "epoch": 2721} {"train_loss": -9.42558479309082, "global_step": 457233, "epoch": 2721} {"train_loss": -10.38532543182373, "global_step": 457234, "epoch": 2721} {"train_loss": -10.412696838378906, "global_step": 457235, "epoch": 2721} {"train_loss": -10.27725601196289, "global_step": 457236, "epoch": 2721} {"train_loss": -10.256014823913574, "global_step": 457237, "epoch": 2721} {"train_loss": -8.79503059387207, "global_step": 457238, "epoch": 2721} {"train_loss": -7.4066314697265625, "global_step": 457239, "epoch": 2721} {"train_loss": -8.582454681396484, "global_step": 457240, "epoch": 2721} {"train_loss": -10.117871284484863, "global_step": 457241, "epoch": 2721} {"train_loss": -9.134960174560547, "global_step": 457242, "epoch": 2721} {"train_loss": -9.483320236206055, "global_step": 457243, "epoch": 2721} {"train_loss": -10.888799667358398, "global_step": 457244, "epoch": 2721} {"train_loss": -8.723280906677246, "global_step": 457245, "epoch": 2721} {"train_loss": -10.340401649475098, "global_step": 457246, "epoch": 2721} {"train_loss": -10.77064323425293, "global_step": 457247, "epoch": 2721} {"train_loss": -9.144338607788086, "global_step": 457248, "epoch": 2721} {"train_loss": -11.794302940368652, "global_step": 457249, "epoch": 2721} {"train_loss": -9.545734405517578, "global_step": 457250, "epoch": 2721} {"train_loss": -9.551008224487305, "global_step": 457251, "epoch": 2721} {"train_loss": -11.006142616271973, "global_step": 457252, "epoch": 2721} {"train_loss": -10.277128219604492, "global_step": 457253, "epoch": 2721} {"train_loss": -9.369503021240234, "global_step": 457254, "epoch": 2721} {"train_loss": -11.109503746032715, "global_step": 457255, "epoch": 2721} {"train_loss": -9.42706298828125, "global_step": 457256, "epoch": 2721} {"train_loss": -11.294917106628418, "global_step": 457257, "epoch": 2721} {"train_loss": -10.695155143737793, "global_step": 457258, "epoch": 2721} {"train_loss": -10.84395980834961, "global_step": 457259, "epoch": 2721} {"train_loss": -10.783228874206543, "global_step": 457260, "epoch": 2721} {"train_loss": -10.6903076171875, "global_step": 457261, "epoch": 2721} {"train_loss": -10.702460289001465, "global_step": 457262, "epoch": 2721} {"train_loss": -10.132269859313965, "global_step": 457263, "epoch": 2721} {"train_loss": -10.095075607299805, "global_step": 457264, "epoch": 2721} {"train_loss": -8.763641357421875, "global_step": 457265, "epoch": 2721} {"train_loss": -10.679866790771484, "global_step": 457266, "epoch": 2721} {"train_loss": -10.44501781463623, "global_step": 457267, "epoch": 2721} {"train_loss": -10.355112075805664, "global_step": 457268, "epoch": 2721} {"train_loss": -10.86324405670166, "global_step": 457269, "epoch": 2721} {"train_loss": -11.029779434204102, "global_step": 457270, "epoch": 2721} {"train_loss": -11.609220504760742, "global_step": 457271, "epoch": 2721} {"train_loss": -11.486257553100586, "global_step": 457272, "epoch": 2721} {"train_loss": -11.628376007080078, "global_step": 457273, "epoch": 2721} {"train_loss": -11.484216690063477, "global_step": 457274, "epoch": 2721} {"train_loss": -11.7298583984375, "global_step": 457275, "epoch": 2721} {"train_loss": -11.757413864135742, "global_step": 457276, "epoch": 2721} {"train_loss": -11.566513061523438, "global_step": 457277, "epoch": 2721} {"train_loss": -11.782563209533691, "global_step": 457278, "epoch": 2721} {"train_loss": -12.003314971923828, "global_step": 457279, "epoch": 2721} {"train_loss": -11.994921684265137, "global_step": 457280, "epoch": 2721} {"train_loss": -11.727031707763672, "global_step": 457281, "epoch": 2721} {"train_loss": -11.986340522766113, "global_step": 457282, "epoch": 2721} {"train_loss": -12.023492813110352, "global_step": 457283, "epoch": 2721} {"train_loss": -11.570301055908203, "global_step": 457284, "epoch": 2721} {"train_loss": -12.041747093200684, "global_step": 457285, "epoch": 2721} {"train_loss": -11.632610321044922, "global_step": 457286, "epoch": 2721} {"train_loss": -11.81451416015625, "global_step": 457287, "epoch": 2721} {"train_loss": -11.985859870910645, "global_step": 457288, "epoch": 2721} {"train_loss": -11.972460746765137, "global_step": 457289, "epoch": 2721} {"train_loss": -12.154655456542969, "global_step": 457290, "epoch": 2721} {"train_loss": -11.903229713439941, "global_step": 457291, "epoch": 2721} {"train_loss": -12.097528457641602, "global_step": 457292, "epoch": 2721} {"train_loss": -11.783714294433594, "global_step": 457293, "epoch": 2721} {"train_loss": -12.265745162963867, "global_step": 457294, "epoch": 2721} {"train_loss": -11.579097446941194, "global_step": 457295, "epoch": 2721, "val_loss": 311356.46875} {"train_loss": -12.125751495361328, "global_step": 457296, "epoch": 2722} {"train_loss": -12.07776927947998, "global_step": 457297, "epoch": 2722} {"train_loss": -11.989144325256348, "global_step": 457298, "epoch": 2722} {"train_loss": -12.117565155029297, "global_step": 457299, "epoch": 2722} {"train_loss": -12.16469955444336, "global_step": 457300, "epoch": 2722} {"train_loss": -12.157901763916016, "global_step": 457301, "epoch": 2722} {"train_loss": -12.179971694946289, "global_step": 457302, "epoch": 2722} {"train_loss": -12.275848388671875, "global_step": 457303, "epoch": 2722} {"train_loss": -12.164852142333984, "global_step": 457304, "epoch": 2722} {"train_loss": -12.343658447265625, "global_step": 457305, "epoch": 2722} {"train_loss": -12.277544021606445, "global_step": 457306, "epoch": 2722} {"train_loss": -12.212132453918457, "global_step": 457307, "epoch": 2722} {"train_loss": -12.248761177062988, "global_step": 457308, "epoch": 2722} {"train_loss": -12.498141288757324, "global_step": 457309, "epoch": 2722} {"train_loss": -12.299468040466309, "global_step": 457310, "epoch": 2722} {"train_loss": -12.400521278381348, "global_step": 457311, "epoch": 2722} {"train_loss": -12.127677917480469, "global_step": 457312, "epoch": 2722} {"train_loss": -12.306035041809082, "global_step": 457313, "epoch": 2722} {"train_loss": -12.459966659545898, "global_step": 457314, "epoch": 2722} {"train_loss": -12.434781074523926, "global_step": 457315, "epoch": 2722} {"train_loss": -12.454258918762207, "global_step": 457316, "epoch": 2722} {"train_loss": -12.430157661437988, "global_step": 457317, "epoch": 2722} {"train_loss": -12.351924896240234, "global_step": 457318, "epoch": 2722} {"train_loss": -12.458821296691895, "global_step": 457319, "epoch": 2722} {"train_loss": -12.52478313446045, "global_step": 457320, "epoch": 2722} {"train_loss": -12.263238906860352, "global_step": 457321, "epoch": 2722} {"train_loss": -12.484715461730957, "global_step": 457322, "epoch": 2722} {"train_loss": -12.318290710449219, "global_step": 457323, "epoch": 2722} {"train_loss": -12.20070743560791, "global_step": 457324, "epoch": 2722} {"train_loss": -12.43535041809082, "global_step": 457325, "epoch": 2722} {"train_loss": -12.590517044067383, "global_step": 457326, "epoch": 2722} {"train_loss": -12.3651762008667, "global_step": 457327, "epoch": 2722} {"train_loss": -12.745811462402344, "global_step": 457328, "epoch": 2722} {"train_loss": -12.523405075073242, "global_step": 457329, "epoch": 2722} {"train_loss": -12.547223091125488, "global_step": 457330, "epoch": 2722} {"train_loss": -12.520986557006836, "global_step": 457331, "epoch": 2722} {"train_loss": -12.416088104248047, "global_step": 457332, "epoch": 2722} {"train_loss": -12.34975814819336, "global_step": 457333, "epoch": 2722} {"train_loss": -12.708314895629883, "global_step": 457334, "epoch": 2722} {"train_loss": -12.653517723083496, "global_step": 457335, "epoch": 2722} {"train_loss": -12.629127502441406, "global_step": 457336, "epoch": 2722} {"train_loss": -12.857034683227539, "global_step": 457337, "epoch": 2722} {"train_loss": -12.488908767700195, "global_step": 457338, "epoch": 2722} {"train_loss": -12.612021446228027, "global_step": 457339, "epoch": 2722} {"train_loss": -12.555953025817871, "global_step": 457340, "epoch": 2722} {"train_loss": -12.590254783630371, "global_step": 457341, "epoch": 2722} {"train_loss": -12.478787422180176, "global_step": 457342, "epoch": 2722} {"train_loss": -12.719284057617188, "global_step": 457343, "epoch": 2722} {"train_loss": -12.742486953735352, "global_step": 457344, "epoch": 2722} {"train_loss": -12.300056457519531, "global_step": 457345, "epoch": 2722} {"train_loss": -12.626638412475586, "global_step": 457346, "epoch": 2722} {"train_loss": -12.489241600036621, "global_step": 457347, "epoch": 2722} {"train_loss": -12.673151016235352, "global_step": 457348, "epoch": 2722} {"train_loss": -12.49034309387207, "global_step": 457349, "epoch": 2722} {"train_loss": -12.650306701660156, "global_step": 457350, "epoch": 2722} {"train_loss": -12.518383026123047, "global_step": 457351, "epoch": 2722} {"train_loss": -12.611989974975586, "global_step": 457352, "epoch": 2722} {"train_loss": -12.50822925567627, "global_step": 457353, "epoch": 2722} {"train_loss": -12.656291961669922, "global_step": 457354, "epoch": 2722} {"train_loss": -12.677886962890625, "global_step": 457355, "epoch": 2722} {"train_loss": -12.912435531616211, "global_step": 457356, "epoch": 2722} {"train_loss": -12.828376770019531, "global_step": 457357, "epoch": 2722} {"train_loss": -12.63494873046875, "global_step": 457358, "epoch": 2722} {"train_loss": -12.58731746673584, "global_step": 457359, "epoch": 2722} {"train_loss": -12.616962432861328, "global_step": 457360, "epoch": 2722} {"train_loss": -12.721480369567871, "global_step": 457361, "epoch": 2722} {"train_loss": -12.841465950012207, "global_step": 457362, "epoch": 2722} {"train_loss": -12.86884880065918, "global_step": 457363, "epoch": 2722} {"train_loss": -12.778708457946777, "global_step": 457364, "epoch": 2722} {"train_loss": -12.702259063720703, "global_step": 457365, "epoch": 2722} {"train_loss": -12.683357238769531, "global_step": 457366, "epoch": 2722} {"train_loss": -12.666714668273926, "global_step": 457367, "epoch": 2722} {"train_loss": -12.7753324508667, "global_step": 457368, "epoch": 2722} {"train_loss": -12.830474853515625, "global_step": 457369, "epoch": 2722} {"train_loss": -12.803596496582031, "global_step": 457370, "epoch": 2722} {"train_loss": -12.863521575927734, "global_step": 457371, "epoch": 2722} {"train_loss": -12.76051139831543, "global_step": 457372, "epoch": 2722} {"train_loss": -12.949535369873047, "global_step": 457373, "epoch": 2722} {"train_loss": -12.481412887573242, "global_step": 457374, "epoch": 2722} {"train_loss": -12.668365478515625, "global_step": 457375, "epoch": 2722} {"train_loss": -12.547430992126465, "global_step": 457376, "epoch": 2722} {"train_loss": -12.55057430267334, "global_step": 457377, "epoch": 2722} {"train_loss": -12.746408462524414, "global_step": 457378, "epoch": 2722} {"train_loss": -12.859344482421875, "global_step": 457379, "epoch": 2722} {"train_loss": -12.49045181274414, "global_step": 457380, "epoch": 2722} {"train_loss": -12.597003936767578, "global_step": 457381, "epoch": 2722} {"train_loss": -12.903076171875, "global_step": 457382, "epoch": 2722} {"train_loss": -13.00920581817627, "global_step": 457383, "epoch": 2722} {"train_loss": -12.869084358215332, "global_step": 457384, "epoch": 2722} {"train_loss": -12.808298110961914, "global_step": 457385, "epoch": 2722} {"train_loss": -13.032218933105469, "global_step": 457386, "epoch": 2722} {"train_loss": -13.061704635620117, "global_step": 457387, "epoch": 2722} {"train_loss": -12.94276237487793, "global_step": 457388, "epoch": 2722} {"train_loss": -12.975589752197266, "global_step": 457389, "epoch": 2722} {"train_loss": -12.863037109375, "global_step": 457390, "epoch": 2722} {"train_loss": -12.713823318481445, "global_step": 457391, "epoch": 2722} {"train_loss": -12.839599609375, "global_step": 457392, "epoch": 2722} {"train_loss": -12.960803985595703, "global_step": 457393, "epoch": 2722} {"train_loss": -12.907251358032227, "global_step": 457394, "epoch": 2722} {"train_loss": -12.913562774658203, "global_step": 457395, "epoch": 2722} {"train_loss": -13.109275817871094, "global_step": 457396, "epoch": 2722} {"train_loss": -12.99729061126709, "global_step": 457397, "epoch": 2722} {"train_loss": -12.938190460205078, "global_step": 457398, "epoch": 2722} {"train_loss": -13.16110610961914, "global_step": 457399, "epoch": 2722} {"train_loss": -12.650965690612793, "global_step": 457400, "epoch": 2722} {"train_loss": -12.996994018554688, "global_step": 457401, "epoch": 2722} {"train_loss": -12.951634407043457, "global_step": 457402, "epoch": 2722} {"train_loss": -13.113648414611816, "global_step": 457403, "epoch": 2722} {"train_loss": -13.225482940673828, "global_step": 457404, "epoch": 2722} {"train_loss": -12.941657066345215, "global_step": 457405, "epoch": 2722} {"train_loss": -12.990949630737305, "global_step": 457406, "epoch": 2722} {"train_loss": -13.234102249145508, "global_step": 457407, "epoch": 2722} {"train_loss": -12.782522201538086, "global_step": 457408, "epoch": 2722} {"train_loss": -13.035616874694824, "global_step": 457409, "epoch": 2722} {"train_loss": -12.62856388092041, "global_step": 457410, "epoch": 2722} {"train_loss": -12.543377876281738, "global_step": 457411, "epoch": 2722} {"train_loss": -12.780793190002441, "global_step": 457412, "epoch": 2722} {"train_loss": -12.878066062927246, "global_step": 457413, "epoch": 2722} {"train_loss": -12.975014686584473, "global_step": 457414, "epoch": 2722} {"train_loss": -12.908367156982422, "global_step": 457415, "epoch": 2722} {"train_loss": -12.770590782165527, "global_step": 457416, "epoch": 2722} {"train_loss": -12.78333854675293, "global_step": 457417, "epoch": 2722} {"train_loss": -12.417709350585938, "global_step": 457418, "epoch": 2722} {"train_loss": -12.946718215942383, "global_step": 457419, "epoch": 2722} {"train_loss": -12.544519424438477, "global_step": 457420, "epoch": 2722} {"train_loss": -12.416671752929688, "global_step": 457421, "epoch": 2722} {"train_loss": -11.82911491394043, "global_step": 457422, "epoch": 2722} {"train_loss": -12.138761520385742, "global_step": 457423, "epoch": 2722} {"train_loss": -11.964214324951172, "global_step": 457424, "epoch": 2722} {"train_loss": -12.751577377319336, "global_step": 457425, "epoch": 2722} {"train_loss": -12.683095932006836, "global_step": 457426, "epoch": 2722} {"train_loss": -12.83297348022461, "global_step": 457427, "epoch": 2722} {"train_loss": -12.63143253326416, "global_step": 457428, "epoch": 2722} {"train_loss": -12.087121963500977, "global_step": 457429, "epoch": 2722} {"train_loss": -12.364082336425781, "global_step": 457430, "epoch": 2722} {"train_loss": -12.201126098632812, "global_step": 457431, "epoch": 2722} {"train_loss": -10.848222732543945, "global_step": 457432, "epoch": 2722} {"train_loss": -11.460065841674805, "global_step": 457433, "epoch": 2722} {"train_loss": -12.119440078735352, "global_step": 457434, "epoch": 2722} {"train_loss": -10.152097702026367, "global_step": 457435, "epoch": 2722} {"train_loss": -10.335041046142578, "global_step": 457436, "epoch": 2722} {"train_loss": -11.502103805541992, "global_step": 457437, "epoch": 2722} {"train_loss": -11.672002792358398, "global_step": 457438, "epoch": 2722} {"train_loss": -10.805898666381836, "global_step": 457439, "epoch": 2722} {"train_loss": -10.258848190307617, "global_step": 457440, "epoch": 2722} {"train_loss": -12.212478637695312, "global_step": 457441, "epoch": 2722} {"train_loss": -10.862632751464844, "global_step": 457442, "epoch": 2722} {"train_loss": -11.202877044677734, "global_step": 457443, "epoch": 2722} {"train_loss": -11.735437393188477, "global_step": 457444, "epoch": 2722} {"train_loss": -11.479084014892578, "global_step": 457445, "epoch": 2722} {"train_loss": -10.967853546142578, "global_step": 457446, "epoch": 2722} {"train_loss": -11.93557357788086, "global_step": 457447, "epoch": 2722} {"train_loss": -10.171148300170898, "global_step": 457448, "epoch": 2722} {"train_loss": -11.416217803955078, "global_step": 457449, "epoch": 2722} {"train_loss": -11.82658576965332, "global_step": 457450, "epoch": 2722} {"train_loss": -10.376794815063477, "global_step": 457451, "epoch": 2722} {"train_loss": -11.821674346923828, "global_step": 457452, "epoch": 2722} {"train_loss": -11.257559776306152, "global_step": 457453, "epoch": 2722} {"train_loss": -11.78797435760498, "global_step": 457454, "epoch": 2722} {"train_loss": -11.629997253417969, "global_step": 457455, "epoch": 2722} {"train_loss": -11.0433349609375, "global_step": 457456, "epoch": 2722} {"train_loss": -11.959569931030273, "global_step": 457457, "epoch": 2722} {"train_loss": -11.035418510437012, "global_step": 457458, "epoch": 2722} {"train_loss": -11.772998809814453, "global_step": 457459, "epoch": 2722} {"train_loss": -11.707901954650879, "global_step": 457460, "epoch": 2722} {"train_loss": -11.926301956176758, "global_step": 457461, "epoch": 2722} {"train_loss": -11.64255428314209, "global_step": 457462, "epoch": 2722} {"train_loss": -12.374174407550267, "global_step": 457463, "epoch": 2722, "val_loss": 313048.0} {"train_loss": -11.439620971679688, "global_step": 457464, "epoch": 2723} {"train_loss": -11.541203498840332, "global_step": 457465, "epoch": 2723} {"train_loss": -11.051589965820312, "global_step": 457466, "epoch": 2723} {"train_loss": -11.596733093261719, "global_step": 457467, "epoch": 2723} {"train_loss": -10.876934051513672, "global_step": 457468, "epoch": 2723} {"train_loss": -11.037445068359375, "global_step": 457469, "epoch": 2723} {"train_loss": -10.919005393981934, "global_step": 457470, "epoch": 2723} {"train_loss": -11.617912292480469, "global_step": 457471, "epoch": 2723} {"train_loss": -10.466777801513672, "global_step": 457472, "epoch": 2723} {"train_loss": -11.009360313415527, "global_step": 457473, "epoch": 2723} {"train_loss": -10.779292106628418, "global_step": 457474, "epoch": 2723} {"train_loss": -11.204020500183105, "global_step": 457475, "epoch": 2723} {"train_loss": -11.192888259887695, "global_step": 457476, "epoch": 2723} {"train_loss": -12.016838073730469, "global_step": 457477, "epoch": 2723} {"train_loss": -11.461389541625977, "global_step": 457478, "epoch": 2723} {"train_loss": -11.838664054870605, "global_step": 457479, "epoch": 2723} {"train_loss": -12.063645362854004, "global_step": 457480, "epoch": 2723} {"train_loss": -11.780287742614746, "global_step": 457481, "epoch": 2723} {"train_loss": -11.404254913330078, "global_step": 457482, "epoch": 2723} {"train_loss": -12.094676971435547, "global_step": 457483, "epoch": 2723} {"train_loss": -11.38308334350586, "global_step": 457484, "epoch": 2723} {"train_loss": -12.35301399230957, "global_step": 457485, "epoch": 2723} {"train_loss": -11.838586807250977, "global_step": 457486, "epoch": 2723} {"train_loss": -12.20329475402832, "global_step": 457487, "epoch": 2723} {"train_loss": -12.060144424438477, "global_step": 457488, "epoch": 2723} {"train_loss": -12.009078979492188, "global_step": 457489, "epoch": 2723} {"train_loss": -12.311715126037598, "global_step": 457490, "epoch": 2723} {"train_loss": -12.003049850463867, "global_step": 457491, "epoch": 2723} {"train_loss": -12.463830947875977, "global_step": 457492, "epoch": 2723} {"train_loss": -12.313573837280273, "global_step": 457493, "epoch": 2723} {"train_loss": -12.274507522583008, "global_step": 457494, "epoch": 2723} {"train_loss": -12.417240142822266, "global_step": 457495, "epoch": 2723} {"train_loss": -12.39099407196045, "global_step": 457496, "epoch": 2723} {"train_loss": -12.192647933959961, "global_step": 457497, "epoch": 2723} {"train_loss": -12.30798625946045, "global_step": 457498, "epoch": 2723} {"train_loss": -12.412663459777832, "global_step": 457499, "epoch": 2723} {"train_loss": -12.513103485107422, "global_step": 457500, "epoch": 2723} {"train_loss": -12.592399597167969, "global_step": 457501, "epoch": 2723} {"train_loss": -12.446014404296875, "global_step": 457502, "epoch": 2723} {"train_loss": -12.694414138793945, "global_step": 457503, "epoch": 2723} {"train_loss": -12.397316932678223, "global_step": 457504, "epoch": 2723} {"train_loss": -12.515462875366211, "global_step": 457505, "epoch": 2723} {"train_loss": -12.317801475524902, "global_step": 457506, "epoch": 2723} {"train_loss": -12.362456321716309, "global_step": 457507, "epoch": 2723} {"train_loss": -12.403202056884766, "global_step": 457508, "epoch": 2723} {"train_loss": -12.070965766906738, "global_step": 457509, "epoch": 2723} {"train_loss": -12.427169799804688, "global_step": 457510, "epoch": 2723} {"train_loss": -11.956236839294434, "global_step": 457511, "epoch": 2723} {"train_loss": -12.236072540283203, "global_step": 457512, "epoch": 2723} {"train_loss": -12.19344425201416, "global_step": 457513, "epoch": 2723} {"train_loss": -12.08598518371582, "global_step": 457514, "epoch": 2723} {"train_loss": -12.585164070129395, "global_step": 457515, "epoch": 2723} {"train_loss": -11.853096008300781, "global_step": 457516, "epoch": 2723} {"train_loss": -12.001930236816406, "global_step": 457517, "epoch": 2723} {"train_loss": -11.927837371826172, "global_step": 457518, "epoch": 2723} {"train_loss": -12.013362884521484, "global_step": 457519, "epoch": 2723} {"train_loss": -12.508575439453125, "global_step": 457520, "epoch": 2723} {"train_loss": -12.002370834350586, "global_step": 457521, "epoch": 2723} {"train_loss": -12.046810150146484, "global_step": 457522, "epoch": 2723} {"train_loss": -12.010866165161133, "global_step": 457523, "epoch": 2723} {"train_loss": -11.820205688476562, "global_step": 457524, "epoch": 2723} {"train_loss": -12.384439468383789, "global_step": 457525, "epoch": 2723} {"train_loss": -11.553844451904297, "global_step": 457526, "epoch": 2723} {"train_loss": -11.696269989013672, "global_step": 457527, "epoch": 2723} {"train_loss": -12.375146865844727, "global_step": 457528, "epoch": 2723} {"train_loss": -12.088191986083984, "global_step": 457529, "epoch": 2723} {"train_loss": -12.308560371398926, "global_step": 457530, "epoch": 2723} {"train_loss": -11.85329532623291, "global_step": 457531, "epoch": 2723} {"train_loss": -12.103229522705078, "global_step": 457532, "epoch": 2723} {"train_loss": -11.999181747436523, "global_step": 457533, "epoch": 2723} {"train_loss": -11.744221687316895, "global_step": 457534, "epoch": 2723} {"train_loss": -12.158026695251465, "global_step": 457535, "epoch": 2723} {"train_loss": -11.797201156616211, "global_step": 457536, "epoch": 2723} {"train_loss": -11.936320304870605, "global_step": 457537, "epoch": 2723} {"train_loss": -12.155466079711914, "global_step": 457538, "epoch": 2723} {"train_loss": -11.940433502197266, "global_step": 457539, "epoch": 2723} {"train_loss": -12.182886123657227, "global_step": 457540, "epoch": 2723} {"train_loss": -11.826471328735352, "global_step": 457541, "epoch": 2723} {"train_loss": -12.298896789550781, "global_step": 457542, "epoch": 2723} {"train_loss": -11.831464767456055, "global_step": 457543, "epoch": 2723} {"train_loss": -11.714727401733398, "global_step": 457544, "epoch": 2723} {"train_loss": -12.419160842895508, "global_step": 457545, "epoch": 2723} {"train_loss": -12.28434944152832, "global_step": 457546, "epoch": 2723} {"train_loss": -12.558805465698242, "global_step": 457547, "epoch": 2723} {"train_loss": -12.173986434936523, "global_step": 457548, "epoch": 2723} {"train_loss": -12.234527587890625, "global_step": 457549, "epoch": 2723} {"train_loss": -12.552947998046875, "global_step": 457550, "epoch": 2723} {"train_loss": -12.420936584472656, "global_step": 457551, "epoch": 2723} {"train_loss": -12.424423217773438, "global_step": 457552, "epoch": 2723} {"train_loss": -12.663839340209961, "global_step": 457553, "epoch": 2723} {"train_loss": -12.322301864624023, "global_step": 457554, "epoch": 2723} {"train_loss": -12.415873527526855, "global_step": 457555, "epoch": 2723} {"train_loss": -12.676095962524414, "global_step": 457556, "epoch": 2723} {"train_loss": -12.415742874145508, "global_step": 457557, "epoch": 2723} {"train_loss": -12.523641586303711, "global_step": 457558, "epoch": 2723} {"train_loss": -12.151866912841797, "global_step": 457559, "epoch": 2723} {"train_loss": -12.620494842529297, "global_step": 457560, "epoch": 2723} {"train_loss": -12.412005424499512, "global_step": 457561, "epoch": 2723} {"train_loss": -12.683098793029785, "global_step": 457562, "epoch": 2723} {"train_loss": -12.614591598510742, "global_step": 457563, "epoch": 2723} {"train_loss": -12.6416015625, "global_step": 457564, "epoch": 2723} {"train_loss": -12.633955001831055, "global_step": 457565, "epoch": 2723} {"train_loss": -12.689112663269043, "global_step": 457566, "epoch": 2723} {"train_loss": -12.551301956176758, "global_step": 457567, "epoch": 2723} {"train_loss": -12.526225090026855, "global_step": 457568, "epoch": 2723} {"train_loss": -12.714715957641602, "global_step": 457569, "epoch": 2723} {"train_loss": -12.899917602539062, "global_step": 457570, "epoch": 2723} {"train_loss": -12.643918991088867, "global_step": 457571, "epoch": 2723} {"train_loss": -12.786382675170898, "global_step": 457572, "epoch": 2723} {"train_loss": -12.584757804870605, "global_step": 457573, "epoch": 2723} {"train_loss": -12.678369522094727, "global_step": 457574, "epoch": 2723} {"train_loss": -12.691147804260254, "global_step": 457575, "epoch": 2723} {"train_loss": -12.709616661071777, "global_step": 457576, "epoch": 2723} {"train_loss": -12.712284088134766, "global_step": 457577, "epoch": 2723} {"train_loss": -12.87015438079834, "global_step": 457578, "epoch": 2723} {"train_loss": -12.662117004394531, "global_step": 457579, "epoch": 2723} {"train_loss": -13.10089111328125, "global_step": 457580, "epoch": 2723} {"train_loss": -12.684240341186523, "global_step": 457581, "epoch": 2723} {"train_loss": -12.854410171508789, "global_step": 457582, "epoch": 2723} {"train_loss": -12.606220245361328, "global_step": 457583, "epoch": 2723} {"train_loss": -12.525245666503906, "global_step": 457584, "epoch": 2723} {"train_loss": -12.874216079711914, "global_step": 457585, "epoch": 2723} {"train_loss": -12.536872863769531, "global_step": 457586, "epoch": 2723} {"train_loss": -12.949172973632812, "global_step": 457587, "epoch": 2723} {"train_loss": -12.41135025024414, "global_step": 457588, "epoch": 2723} {"train_loss": -12.570100784301758, "global_step": 457589, "epoch": 2723} {"train_loss": -12.562650680541992, "global_step": 457590, "epoch": 2723} {"train_loss": -12.56363296508789, "global_step": 457591, "epoch": 2723} {"train_loss": -11.576645851135254, "global_step": 457592, "epoch": 2723} {"train_loss": -13.029821395874023, "global_step": 457593, "epoch": 2723} {"train_loss": -11.81983757019043, "global_step": 457594, "epoch": 2723} {"train_loss": -12.41749382019043, "global_step": 457595, "epoch": 2723} {"train_loss": -11.960359573364258, "global_step": 457596, "epoch": 2723} {"train_loss": -12.210441589355469, "global_step": 457597, "epoch": 2723} {"train_loss": -12.548336029052734, "global_step": 457598, "epoch": 2723} {"train_loss": -12.465730667114258, "global_step": 457599, "epoch": 2723} {"train_loss": -12.746078491210938, "global_step": 457600, "epoch": 2723} {"train_loss": -12.581536293029785, "global_step": 457601, "epoch": 2723} {"train_loss": -11.96638298034668, "global_step": 457602, "epoch": 2723} {"train_loss": -12.416912078857422, "global_step": 457603, "epoch": 2723} {"train_loss": -12.08396053314209, "global_step": 457604, "epoch": 2723} {"train_loss": -12.476497650146484, "global_step": 457605, "epoch": 2723} {"train_loss": -11.973163604736328, "global_step": 457606, "epoch": 2723} {"train_loss": -12.592229843139648, "global_step": 457607, "epoch": 2723} {"train_loss": -12.696998596191406, "global_step": 457608, "epoch": 2723} {"train_loss": -12.557290077209473, "global_step": 457609, "epoch": 2723} {"train_loss": -11.786202430725098, "global_step": 457610, "epoch": 2723} {"train_loss": -12.20698070526123, "global_step": 457611, "epoch": 2723} {"train_loss": -12.622462272644043, "global_step": 457612, "epoch": 2723} {"train_loss": -12.357463836669922, "global_step": 457613, "epoch": 2723} {"train_loss": -12.613500595092773, "global_step": 457614, "epoch": 2723} {"train_loss": -12.29649543762207, "global_step": 457615, "epoch": 2723} {"train_loss": -12.406671524047852, "global_step": 457616, "epoch": 2723} {"train_loss": -12.443374633789062, "global_step": 457617, "epoch": 2723} {"train_loss": -12.121078491210938, "global_step": 457618, "epoch": 2723} {"train_loss": -12.304615020751953, "global_step": 457619, "epoch": 2723} {"train_loss": -12.731868743896484, "global_step": 457620, "epoch": 2723} {"train_loss": -12.448943138122559, "global_step": 457621, "epoch": 2723} {"train_loss": -12.510086059570312, "global_step": 457622, "epoch": 2723} {"train_loss": -12.475860595703125, "global_step": 457623, "epoch": 2723} {"train_loss": -12.219657897949219, "global_step": 457624, "epoch": 2723} {"train_loss": -11.499077796936035, "global_step": 457625, "epoch": 2723} {"train_loss": -12.704265594482422, "global_step": 457626, "epoch": 2723} {"train_loss": -11.093289375305176, "global_step": 457627, "epoch": 2723} {"train_loss": -11.940741539001465, "global_step": 457628, "epoch": 2723} {"train_loss": -12.148059844970703, "global_step": 457629, "epoch": 2723} {"train_loss": -11.232505798339844, "global_step": 457630, "epoch": 2723} {"train_loss": -12.203155341602507, "global_step": 457631, "epoch": 2723, "val_loss": 316891.34375} {"train_loss": -11.199955940246582, "global_step": 457632, "epoch": 2724} {"train_loss": -9.880898475646973, "global_step": 457633, "epoch": 2724} {"train_loss": -10.754081726074219, "global_step": 457634, "epoch": 2724} {"train_loss": -9.999672889709473, "global_step": 457635, "epoch": 2724} {"train_loss": -10.973167419433594, "global_step": 457636, "epoch": 2724} {"train_loss": -9.660839080810547, "global_step": 457637, "epoch": 2724} {"train_loss": -11.155546188354492, "global_step": 457638, "epoch": 2724} {"train_loss": -9.501814842224121, "global_step": 457639, "epoch": 2724} {"train_loss": -11.907684326171875, "global_step": 457640, "epoch": 2724} {"train_loss": -9.29323959350586, "global_step": 457641, "epoch": 2724} {"train_loss": -10.870372772216797, "global_step": 457642, "epoch": 2724} {"train_loss": -10.127941131591797, "global_step": 457643, "epoch": 2724} {"train_loss": -11.015076637268066, "global_step": 457644, "epoch": 2724} {"train_loss": -10.506372451782227, "global_step": 457645, "epoch": 2724} {"train_loss": -10.43026351928711, "global_step": 457646, "epoch": 2724} {"train_loss": -10.181845664978027, "global_step": 457647, "epoch": 2724} {"train_loss": -11.823040008544922, "global_step": 457648, "epoch": 2724} {"train_loss": -11.421876907348633, "global_step": 457649, "epoch": 2724} {"train_loss": -11.938169479370117, "global_step": 457650, "epoch": 2724} {"train_loss": -11.646700859069824, "global_step": 457651, "epoch": 2724} {"train_loss": -12.1747407913208, "global_step": 457652, "epoch": 2724} {"train_loss": -11.982510566711426, "global_step": 457653, "epoch": 2724} {"train_loss": -11.162664413452148, "global_step": 457654, "epoch": 2724} {"train_loss": -12.068960189819336, "global_step": 457655, "epoch": 2724} {"train_loss": -11.843921661376953, "global_step": 457656, "epoch": 2724} {"train_loss": -11.011455535888672, "global_step": 457657, "epoch": 2724} {"train_loss": -11.52167797088623, "global_step": 457658, "epoch": 2724} {"train_loss": -11.201309204101562, "global_step": 457659, "epoch": 2724} {"train_loss": -12.071606636047363, "global_step": 457660, "epoch": 2724} {"train_loss": -10.961447715759277, "global_step": 457661, "epoch": 2724} {"train_loss": -12.192232131958008, "global_step": 457662, "epoch": 2724} {"train_loss": -11.336162567138672, "global_step": 457663, "epoch": 2724} {"train_loss": -12.129318237304688, "global_step": 457664, "epoch": 2724} {"train_loss": -11.945402145385742, "global_step": 457665, "epoch": 2724} {"train_loss": -12.282637596130371, "global_step": 457666, "epoch": 2724} {"train_loss": -11.9320707321167, "global_step": 457667, "epoch": 2724} {"train_loss": -12.115181922912598, "global_step": 457668, "epoch": 2724} {"train_loss": -11.584688186645508, "global_step": 457669, "epoch": 2724} {"train_loss": -11.863000869750977, "global_step": 457670, "epoch": 2724} {"train_loss": -12.408621788024902, "global_step": 457671, "epoch": 2724} {"train_loss": -11.398873329162598, "global_step": 457672, "epoch": 2724} {"train_loss": -12.194520950317383, "global_step": 457673, "epoch": 2724} {"train_loss": -11.966422080993652, "global_step": 457674, "epoch": 2724} {"train_loss": -11.805044174194336, "global_step": 457675, "epoch": 2724} {"train_loss": -12.351861953735352, "global_step": 457676, "epoch": 2724} {"train_loss": -12.322969436645508, "global_step": 457677, "epoch": 2724} {"train_loss": -12.043668746948242, "global_step": 457678, "epoch": 2724} {"train_loss": -12.26358413696289, "global_step": 457679, "epoch": 2724} {"train_loss": -12.07673168182373, "global_step": 457680, "epoch": 2724} {"train_loss": -12.360188484191895, "global_step": 457681, "epoch": 2724} {"train_loss": -11.774079322814941, "global_step": 457682, "epoch": 2724} {"train_loss": -12.509992599487305, "global_step": 457683, "epoch": 2724} {"train_loss": -11.788724899291992, "global_step": 457684, "epoch": 2724} {"train_loss": -12.332491874694824, "global_step": 457685, "epoch": 2724} {"train_loss": -12.420731544494629, "global_step": 457686, "epoch": 2724} {"train_loss": -12.195591926574707, "global_step": 457687, "epoch": 2724} {"train_loss": -12.482683181762695, "global_step": 457688, "epoch": 2724} {"train_loss": -12.551836013793945, "global_step": 457689, "epoch": 2724} {"train_loss": -12.21178913116455, "global_step": 457690, "epoch": 2724} {"train_loss": -12.59029483795166, "global_step": 457691, "epoch": 2724} {"train_loss": -12.236184120178223, "global_step": 457692, "epoch": 2724} {"train_loss": -12.215219497680664, "global_step": 457693, "epoch": 2724} {"train_loss": -12.235300064086914, "global_step": 457694, "epoch": 2724} {"train_loss": -12.284337997436523, "global_step": 457695, "epoch": 2724} {"train_loss": -12.035558700561523, "global_step": 457696, "epoch": 2724} {"train_loss": -12.54116153717041, "global_step": 457697, "epoch": 2724} {"train_loss": -12.174434661865234, "global_step": 457698, "epoch": 2724} {"train_loss": -12.752110481262207, "global_step": 457699, "epoch": 2724} {"train_loss": -12.377756118774414, "global_step": 457700, "epoch": 2724} {"train_loss": -12.313522338867188, "global_step": 457701, "epoch": 2724} {"train_loss": -12.27318000793457, "global_step": 457702, "epoch": 2724} {"train_loss": -12.49765396118164, "global_step": 457703, "epoch": 2724} {"train_loss": -12.589595794677734, "global_step": 457704, "epoch": 2724} {"train_loss": -12.438776016235352, "global_step": 457705, "epoch": 2724} {"train_loss": -12.741519927978516, "global_step": 457706, "epoch": 2724} {"train_loss": -12.18452262878418, "global_step": 457707, "epoch": 2724} {"train_loss": -12.65926742553711, "global_step": 457708, "epoch": 2724} {"train_loss": -12.373114585876465, "global_step": 457709, "epoch": 2724} {"train_loss": -12.605003356933594, "global_step": 457710, "epoch": 2724} {"train_loss": -12.753555297851562, "global_step": 457711, "epoch": 2724} {"train_loss": -12.398736953735352, "global_step": 457712, "epoch": 2724} {"train_loss": -12.636862754821777, "global_step": 457713, "epoch": 2724} {"train_loss": -12.478456497192383, "global_step": 457714, "epoch": 2724} {"train_loss": -12.735137939453125, "global_step": 457715, "epoch": 2724} {"train_loss": -12.608539581298828, "global_step": 457716, "epoch": 2724} {"train_loss": -12.822259902954102, "global_step": 457717, "epoch": 2724} {"train_loss": -12.69721508026123, "global_step": 457718, "epoch": 2724} {"train_loss": -12.855010986328125, "global_step": 457719, "epoch": 2724} {"train_loss": -12.928531646728516, "global_step": 457720, "epoch": 2724} {"train_loss": -12.90195083618164, "global_step": 457721, "epoch": 2724} {"train_loss": -12.786670684814453, "global_step": 457722, "epoch": 2724} {"train_loss": -12.821810722351074, "global_step": 457723, "epoch": 2724} {"train_loss": -12.719741821289062, "global_step": 457724, "epoch": 2724} {"train_loss": -12.797880172729492, "global_step": 457725, "epoch": 2724} {"train_loss": -12.837566375732422, "global_step": 457726, "epoch": 2724} {"train_loss": -12.838751792907715, "global_step": 457727, "epoch": 2724} {"train_loss": -12.79458999633789, "global_step": 457728, "epoch": 2724} {"train_loss": -12.841839790344238, "global_step": 457729, "epoch": 2724} {"train_loss": -12.837728500366211, "global_step": 457730, "epoch": 2724} {"train_loss": -12.869512557983398, "global_step": 457731, "epoch": 2724} {"train_loss": -12.982339859008789, "global_step": 457732, "epoch": 2724} {"train_loss": -12.689872741699219, "global_step": 457733, "epoch": 2724} {"train_loss": -12.802079200744629, "global_step": 457734, "epoch": 2724} {"train_loss": -12.908077239990234, "global_step": 457735, "epoch": 2724} {"train_loss": -12.89619255065918, "global_step": 457736, "epoch": 2724} {"train_loss": -12.835501670837402, "global_step": 457737, "epoch": 2724} {"train_loss": -12.922816276550293, "global_step": 457738, "epoch": 2724} {"train_loss": -12.886190414428711, "global_step": 457739, "epoch": 2724} {"train_loss": -13.02376651763916, "global_step": 457740, "epoch": 2724} {"train_loss": -13.025324821472168, "global_step": 457741, "epoch": 2724} {"train_loss": -12.76948356628418, "global_step": 457742, "epoch": 2724} {"train_loss": -12.922045707702637, "global_step": 457743, "epoch": 2724} {"train_loss": -12.972434997558594, "global_step": 457744, "epoch": 2724} {"train_loss": -12.771923065185547, "global_step": 457745, "epoch": 2724} {"train_loss": -12.790874481201172, "global_step": 457746, "epoch": 2724} {"train_loss": -12.7487154006958, "global_step": 457747, "epoch": 2724} {"train_loss": -13.090739250183105, "global_step": 457748, "epoch": 2724} {"train_loss": -13.033700942993164, "global_step": 457749, "epoch": 2724} {"train_loss": -12.928516387939453, "global_step": 457750, "epoch": 2724} {"train_loss": -13.02328872680664, "global_step": 457751, "epoch": 2724} {"train_loss": -12.841371536254883, "global_step": 457752, "epoch": 2724} {"train_loss": -12.755300521850586, "global_step": 457753, "epoch": 2724} {"train_loss": -12.793216705322266, "global_step": 457754, "epoch": 2724} {"train_loss": -12.733293533325195, "global_step": 457755, "epoch": 2724} {"train_loss": -12.57111930847168, "global_step": 457756, "epoch": 2724} {"train_loss": -12.917705535888672, "global_step": 457757, "epoch": 2724} {"train_loss": -12.585514068603516, "global_step": 457758, "epoch": 2724} {"train_loss": -11.43353271484375, "global_step": 457759, "epoch": 2724} {"train_loss": -11.284147262573242, "global_step": 457760, "epoch": 2724} {"train_loss": -12.649534225463867, "global_step": 457761, "epoch": 2724} {"train_loss": -12.715693473815918, "global_step": 457762, "epoch": 2724} {"train_loss": -12.205949783325195, "global_step": 457763, "epoch": 2724} {"train_loss": -10.735904693603516, "global_step": 457764, "epoch": 2724} {"train_loss": -11.882508277893066, "global_step": 457765, "epoch": 2724} {"train_loss": -12.348714828491211, "global_step": 457766, "epoch": 2724} {"train_loss": -11.405384063720703, "global_step": 457767, "epoch": 2724} {"train_loss": -11.456367492675781, "global_step": 457768, "epoch": 2724} {"train_loss": -11.958300590515137, "global_step": 457769, "epoch": 2724} {"train_loss": -12.468764305114746, "global_step": 457770, "epoch": 2724} {"train_loss": -10.655536651611328, "global_step": 457771, "epoch": 2724} {"train_loss": -12.283447265625, "global_step": 457772, "epoch": 2724} {"train_loss": -11.390569686889648, "global_step": 457773, "epoch": 2724} {"train_loss": -11.27975082397461, "global_step": 457774, "epoch": 2724} {"train_loss": -12.689477920532227, "global_step": 457775, "epoch": 2724} {"train_loss": -11.751020431518555, "global_step": 457776, "epoch": 2724} {"train_loss": -11.450780868530273, "global_step": 457777, "epoch": 2724} {"train_loss": -11.426244735717773, "global_step": 457778, "epoch": 2724} {"train_loss": -11.712711334228516, "global_step": 457779, "epoch": 2724} {"train_loss": -12.034226417541504, "global_step": 457780, "epoch": 2724} {"train_loss": -12.081015586853027, "global_step": 457781, "epoch": 2724} {"train_loss": -11.24957275390625, "global_step": 457782, "epoch": 2724} {"train_loss": -11.961867332458496, "global_step": 457783, "epoch": 2724} {"train_loss": -11.55972671508789, "global_step": 457784, "epoch": 2724} {"train_loss": -10.56495475769043, "global_step": 457785, "epoch": 2724} {"train_loss": -9.927814483642578, "global_step": 457786, "epoch": 2724} {"train_loss": -11.22508430480957, "global_step": 457787, "epoch": 2724} {"train_loss": -11.618804931640625, "global_step": 457788, "epoch": 2724} {"train_loss": -11.731471061706543, "global_step": 457789, "epoch": 2724} {"train_loss": -12.06118392944336, "global_step": 457790, "epoch": 2724} {"train_loss": -12.008813858032227, "global_step": 457791, "epoch": 2724} {"train_loss": -12.329376220703125, "global_step": 457792, "epoch": 2724} {"train_loss": -12.009766578674316, "global_step": 457793, "epoch": 2724} {"train_loss": -12.596237182617188, "global_step": 457794, "epoch": 2724} {"train_loss": -12.35891342163086, "global_step": 457795, "epoch": 2724} {"train_loss": -12.230539321899414, "global_step": 457796, "epoch": 2724} {"train_loss": -12.542738914489746, "global_step": 457797, "epoch": 2724} {"train_loss": -12.34299087524414, "global_step": 457798, "epoch": 2724} {"train_loss": -12.073643985248747, "global_step": 457799, "epoch": 2724, "val_loss": 313119.34375} {"train_loss": -12.37131118774414, "global_step": 457800, "epoch": 2725} {"train_loss": -12.544501304626465, "global_step": 457801, "epoch": 2725} {"train_loss": -12.398687362670898, "global_step": 457802, "epoch": 2725} {"train_loss": -12.464966773986816, "global_step": 457803, "epoch": 2725} {"train_loss": -12.335283279418945, "global_step": 457804, "epoch": 2725} {"train_loss": -12.611172676086426, "global_step": 457805, "epoch": 2725} {"train_loss": -12.432241439819336, "global_step": 457806, "epoch": 2725} {"train_loss": -12.806386947631836, "global_step": 457807, "epoch": 2725} {"train_loss": -12.345359802246094, "global_step": 457808, "epoch": 2725} {"train_loss": -12.605140686035156, "global_step": 457809, "epoch": 2725} {"train_loss": -12.69656753540039, "global_step": 457810, "epoch": 2725} {"train_loss": -12.806354522705078, "global_step": 457811, "epoch": 2725} {"train_loss": -12.525546073913574, "global_step": 457812, "epoch": 2725} {"train_loss": -12.837312698364258, "global_step": 457813, "epoch": 2725} {"train_loss": -12.689485549926758, "global_step": 457814, "epoch": 2725} {"train_loss": -12.768238067626953, "global_step": 457815, "epoch": 2725} {"train_loss": -12.8092622756958, "global_step": 457816, "epoch": 2725} {"train_loss": -12.734395027160645, "global_step": 457817, "epoch": 2725} {"train_loss": -12.855716705322266, "global_step": 457818, "epoch": 2725} {"train_loss": -12.735483169555664, "global_step": 457819, "epoch": 2725} {"train_loss": -12.380892753601074, "global_step": 457820, "epoch": 2725} {"train_loss": -12.222243309020996, "global_step": 457821, "epoch": 2725} {"train_loss": -12.845972061157227, "global_step": 457822, "epoch": 2725} {"train_loss": -12.538334846496582, "global_step": 457823, "epoch": 2725} {"train_loss": -12.844179153442383, "global_step": 457824, "epoch": 2725} {"train_loss": -12.644585609436035, "global_step": 457825, "epoch": 2725} {"train_loss": -12.665231704711914, "global_step": 457826, "epoch": 2725} {"train_loss": -12.876385688781738, "global_step": 457827, "epoch": 2725} {"train_loss": -12.65388298034668, "global_step": 457828, "epoch": 2725} {"train_loss": -12.755802154541016, "global_step": 457829, "epoch": 2725} {"train_loss": -12.883106231689453, "global_step": 457830, "epoch": 2725} {"train_loss": -12.746112823486328, "global_step": 457831, "epoch": 2725} {"train_loss": -12.842353820800781, "global_step": 457832, "epoch": 2725} {"train_loss": -12.604592323303223, "global_step": 457833, "epoch": 2725} {"train_loss": -12.820466041564941, "global_step": 457834, "epoch": 2725} {"train_loss": -12.951987266540527, "global_step": 457835, "epoch": 2725} {"train_loss": -12.786086082458496, "global_step": 457836, "epoch": 2725} {"train_loss": -12.594987869262695, "global_step": 457837, "epoch": 2725} {"train_loss": -12.831502914428711, "global_step": 457838, "epoch": 2725} {"train_loss": -12.84260368347168, "global_step": 457839, "epoch": 2725} {"train_loss": -12.824899673461914, "global_step": 457840, "epoch": 2725} {"train_loss": -12.808895111083984, "global_step": 457841, "epoch": 2725} {"train_loss": -12.908199310302734, "global_step": 457842, "epoch": 2725} {"train_loss": -12.907073974609375, "global_step": 457843, "epoch": 2725} {"train_loss": -12.934771537780762, "global_step": 457844, "epoch": 2725} {"train_loss": -12.478422164916992, "global_step": 457845, "epoch": 2725} {"train_loss": -12.324886322021484, "global_step": 457846, "epoch": 2725} {"train_loss": -12.929777145385742, "global_step": 457847, "epoch": 2725} {"train_loss": -12.412534713745117, "global_step": 457848, "epoch": 2725} {"train_loss": -11.058534622192383, "global_step": 457849, "epoch": 2725} {"train_loss": -12.265369415283203, "global_step": 457850, "epoch": 2725} {"train_loss": -12.722196578979492, "global_step": 457851, "epoch": 2725} {"train_loss": -12.500368118286133, "global_step": 457852, "epoch": 2725} {"train_loss": -12.496363639831543, "global_step": 457853, "epoch": 2725} {"train_loss": -12.214547157287598, "global_step": 457854, "epoch": 2725} {"train_loss": -12.736719131469727, "global_step": 457855, "epoch": 2725} {"train_loss": -12.00183391571045, "global_step": 457856, "epoch": 2725} {"train_loss": -12.395102500915527, "global_step": 457857, "epoch": 2725} {"train_loss": -12.828022956848145, "global_step": 457858, "epoch": 2725} {"train_loss": -12.824056625366211, "global_step": 457859, "epoch": 2725} {"train_loss": -12.118419647216797, "global_step": 457860, "epoch": 2725} {"train_loss": -11.787666320800781, "global_step": 457861, "epoch": 2725} {"train_loss": -11.81607437133789, "global_step": 457862, "epoch": 2725} {"train_loss": -12.625585556030273, "global_step": 457863, "epoch": 2725} {"train_loss": -12.314900398254395, "global_step": 457864, "epoch": 2725} {"train_loss": -11.516407012939453, "global_step": 457865, "epoch": 2725} {"train_loss": -11.997180938720703, "global_step": 457866, "epoch": 2725} {"train_loss": -11.33798885345459, "global_step": 457867, "epoch": 2725} {"train_loss": -11.030165672302246, "global_step": 457868, "epoch": 2725} {"train_loss": -12.081801414489746, "global_step": 457869, "epoch": 2725} {"train_loss": -9.45248031616211, "global_step": 457870, "epoch": 2725} {"train_loss": -10.245498657226562, "global_step": 457871, "epoch": 2725} {"train_loss": -10.81309700012207, "global_step": 457872, "epoch": 2725} {"train_loss": -8.97665023803711, "global_step": 457873, "epoch": 2725} {"train_loss": -10.80181884765625, "global_step": 457874, "epoch": 2725} {"train_loss": -10.774630546569824, "global_step": 457875, "epoch": 2725} {"train_loss": -10.047985076904297, "global_step": 457876, "epoch": 2725} {"train_loss": -9.279840469360352, "global_step": 457877, "epoch": 2725} {"train_loss": -10.004085540771484, "global_step": 457878, "epoch": 2725} {"train_loss": -10.083663940429688, "global_step": 457879, "epoch": 2725} {"train_loss": -9.713521003723145, "global_step": 457880, "epoch": 2725} {"train_loss": -10.946306228637695, "global_step": 457881, "epoch": 2725} {"train_loss": -10.005522727966309, "global_step": 457882, "epoch": 2725} {"train_loss": -10.1470365524292, "global_step": 457883, "epoch": 2725} {"train_loss": -10.78148078918457, "global_step": 457884, "epoch": 2725} {"train_loss": -10.794368743896484, "global_step": 457885, "epoch": 2725} {"train_loss": -10.571962356567383, "global_step": 457886, "epoch": 2725} {"train_loss": -11.404677391052246, "global_step": 457887, "epoch": 2725} {"train_loss": -10.546797752380371, "global_step": 457888, "epoch": 2725} {"train_loss": -10.773642539978027, "global_step": 457889, "epoch": 2725} {"train_loss": -10.430355072021484, "global_step": 457890, "epoch": 2725} {"train_loss": -11.30107307434082, "global_step": 457891, "epoch": 2725} {"train_loss": -10.54415512084961, "global_step": 457892, "epoch": 2725} {"train_loss": -11.92213249206543, "global_step": 457893, "epoch": 2725} {"train_loss": -10.6176118850708, "global_step": 457894, "epoch": 2725} {"train_loss": -11.268031120300293, "global_step": 457895, "epoch": 2725} {"train_loss": -11.592616081237793, "global_step": 457896, "epoch": 2725} {"train_loss": -11.305732727050781, "global_step": 457897, "epoch": 2725} {"train_loss": -11.646127700805664, "global_step": 457898, "epoch": 2725} {"train_loss": -11.03866958618164, "global_step": 457899, "epoch": 2725} {"train_loss": -11.768879890441895, "global_step": 457900, "epoch": 2725} {"train_loss": -11.00452995300293, "global_step": 457901, "epoch": 2725} {"train_loss": -11.86976432800293, "global_step": 457902, "epoch": 2725} {"train_loss": -11.329304695129395, "global_step": 457903, "epoch": 2725} {"train_loss": -12.150148391723633, "global_step": 457904, "epoch": 2725} {"train_loss": -11.891213417053223, "global_step": 457905, "epoch": 2725} {"train_loss": -11.971148490905762, "global_step": 457906, "epoch": 2725} {"train_loss": -11.868635177612305, "global_step": 457907, "epoch": 2725} {"train_loss": -11.965801239013672, "global_step": 457908, "epoch": 2725} {"train_loss": -12.19636344909668, "global_step": 457909, "epoch": 2725} {"train_loss": -11.524410247802734, "global_step": 457910, "epoch": 2725} {"train_loss": -12.282402038574219, "global_step": 457911, "epoch": 2725} {"train_loss": -11.829879760742188, "global_step": 457912, "epoch": 2725} {"train_loss": -11.954133987426758, "global_step": 457913, "epoch": 2725} {"train_loss": -12.013861656188965, "global_step": 457914, "epoch": 2725} {"train_loss": -12.143409729003906, "global_step": 457915, "epoch": 2725} {"train_loss": -11.73102855682373, "global_step": 457916, "epoch": 2725} {"train_loss": -11.65382194519043, "global_step": 457917, "epoch": 2725} {"train_loss": -12.177511215209961, "global_step": 457918, "epoch": 2725} {"train_loss": -11.83498764038086, "global_step": 457919, "epoch": 2725} {"train_loss": -12.216592788696289, "global_step": 457920, "epoch": 2725} {"train_loss": -12.052654266357422, "global_step": 457921, "epoch": 2725} {"train_loss": -12.117976188659668, "global_step": 457922, "epoch": 2725} {"train_loss": -12.398014068603516, "global_step": 457923, "epoch": 2725} {"train_loss": -12.167801856994629, "global_step": 457924, "epoch": 2725} {"train_loss": -12.201879501342773, "global_step": 457925, "epoch": 2725} {"train_loss": -12.136907577514648, "global_step": 457926, "epoch": 2725} {"train_loss": -12.484045028686523, "global_step": 457927, "epoch": 2725} {"train_loss": -12.650118827819824, "global_step": 457928, "epoch": 2725} {"train_loss": -11.964771270751953, "global_step": 457929, "epoch": 2725} {"train_loss": -12.542927742004395, "global_step": 457930, "epoch": 2725} {"train_loss": -12.483804702758789, "global_step": 457931, "epoch": 2725} {"train_loss": -12.458877563476562, "global_step": 457932, "epoch": 2725} {"train_loss": -12.4755277633667, "global_step": 457933, "epoch": 2725} {"train_loss": -12.481847763061523, "global_step": 457934, "epoch": 2725} {"train_loss": -12.59816837310791, "global_step": 457935, "epoch": 2725} {"train_loss": -12.461766242980957, "global_step": 457936, "epoch": 2725} {"train_loss": -12.334250450134277, "global_step": 457937, "epoch": 2725} {"train_loss": -12.505071640014648, "global_step": 457938, "epoch": 2725} {"train_loss": -12.80544662475586, "global_step": 457939, "epoch": 2725} {"train_loss": -12.542722702026367, "global_step": 457940, "epoch": 2725} {"train_loss": -12.667217254638672, "global_step": 457941, "epoch": 2725} {"train_loss": -12.600022315979004, "global_step": 457942, "epoch": 2725} {"train_loss": -12.727291107177734, "global_step": 457943, "epoch": 2725} {"train_loss": -12.659711837768555, "global_step": 457944, "epoch": 2725} {"train_loss": -12.508140563964844, "global_step": 457945, "epoch": 2725} {"train_loss": -12.572148323059082, "global_step": 457946, "epoch": 2725} {"train_loss": -12.636571884155273, "global_step": 457947, "epoch": 2725} {"train_loss": -12.724105834960938, "global_step": 457948, "epoch": 2725} {"train_loss": -12.52330493927002, "global_step": 457949, "epoch": 2725} {"train_loss": -12.496299743652344, "global_step": 457950, "epoch": 2725} {"train_loss": -12.605293273925781, "global_step": 457951, "epoch": 2725} {"train_loss": -12.62048625946045, "global_step": 457952, "epoch": 2725} {"train_loss": -12.299261093139648, "global_step": 457953, "epoch": 2725} {"train_loss": -12.361385345458984, "global_step": 457954, "epoch": 2725} {"train_loss": -12.302534103393555, "global_step": 457955, "epoch": 2725} {"train_loss": -11.768880844116211, "global_step": 457956, "epoch": 2725} {"train_loss": -12.601318359375, "global_step": 457957, "epoch": 2725} {"train_loss": -12.331048965454102, "global_step": 457958, "epoch": 2725} {"train_loss": -12.622934341430664, "global_step": 457959, "epoch": 2725} {"train_loss": -12.42772388458252, "global_step": 457960, "epoch": 2725} {"train_loss": -12.496931076049805, "global_step": 457961, "epoch": 2725} {"train_loss": -12.796162605285645, "global_step": 457962, "epoch": 2725} {"train_loss": -12.113729476928711, "global_step": 457963, "epoch": 2725} {"train_loss": -12.891407012939453, "global_step": 457964, "epoch": 2725} {"train_loss": -12.187931060791016, "global_step": 457965, "epoch": 2725} {"train_loss": -12.536205291748047, "global_step": 457966, "epoch": 2725} {"train_loss": -12.076206241335187, "global_step": 457967, "epoch": 2725, "val_loss": 316479.9375, "train_action_mse_error": 1.3514689207077026} {"train_loss": -12.498933792114258, "global_step": 457968, "epoch": 2726} {"train_loss": -12.534954071044922, "global_step": 457969, "epoch": 2726} {"train_loss": -12.541236877441406, "global_step": 457970, "epoch": 2726} {"train_loss": -12.743561744689941, "global_step": 457971, "epoch": 2726} {"train_loss": -12.733617782592773, "global_step": 457972, "epoch": 2726} {"train_loss": -12.483960151672363, "global_step": 457973, "epoch": 2726} {"train_loss": -12.230804443359375, "global_step": 457974, "epoch": 2726} {"train_loss": -12.413354873657227, "global_step": 457975, "epoch": 2726} {"train_loss": -12.616378784179688, "global_step": 457976, "epoch": 2726} {"train_loss": -12.577068328857422, "global_step": 457977, "epoch": 2726} {"train_loss": -12.61874771118164, "global_step": 457978, "epoch": 2726} {"train_loss": -12.572282791137695, "global_step": 457979, "epoch": 2726} {"train_loss": -12.932540893554688, "global_step": 457980, "epoch": 2726} {"train_loss": -12.738321304321289, "global_step": 457981, "epoch": 2726} {"train_loss": -12.78325080871582, "global_step": 457982, "epoch": 2726} {"train_loss": -12.989652633666992, "global_step": 457983, "epoch": 2726} {"train_loss": -12.640935897827148, "global_step": 457984, "epoch": 2726} {"train_loss": -12.675065994262695, "global_step": 457985, "epoch": 2726} {"train_loss": -12.959051132202148, "global_step": 457986, "epoch": 2726} {"train_loss": -12.788190841674805, "global_step": 457987, "epoch": 2726} {"train_loss": -12.87005615234375, "global_step": 457988, "epoch": 2726} {"train_loss": -12.91273307800293, "global_step": 457989, "epoch": 2726} {"train_loss": -12.898455619812012, "global_step": 457990, "epoch": 2726} {"train_loss": -12.605173110961914, "global_step": 457991, "epoch": 2726} {"train_loss": -12.78386116027832, "global_step": 457992, "epoch": 2726} {"train_loss": -12.735700607299805, "global_step": 457993, "epoch": 2726} {"train_loss": -12.800334930419922, "global_step": 457994, "epoch": 2726} {"train_loss": -12.712099075317383, "global_step": 457995, "epoch": 2726} {"train_loss": -13.132966995239258, "global_step": 457996, "epoch": 2726} {"train_loss": -12.667463302612305, "global_step": 457997, "epoch": 2726} {"train_loss": -12.69107437133789, "global_step": 457998, "epoch": 2726} {"train_loss": -12.680350303649902, "global_step": 457999, "epoch": 2726} {"train_loss": -12.7849760055542, "global_step": 458000, "epoch": 2726} {"train_loss": -12.834817886352539, "global_step": 458001, "epoch": 2726} {"train_loss": -12.703060150146484, "global_step": 458002, "epoch": 2726} {"train_loss": -12.751626968383789, "global_step": 458003, "epoch": 2726} {"train_loss": -12.661477088928223, "global_step": 458004, "epoch": 2726} {"train_loss": -12.798974990844727, "global_step": 458005, "epoch": 2726} {"train_loss": -12.483665466308594, "global_step": 458006, "epoch": 2726} {"train_loss": -12.751595497131348, "global_step": 458007, "epoch": 2726} {"train_loss": -12.47944450378418, "global_step": 458008, "epoch": 2726} {"train_loss": -12.673107147216797, "global_step": 458009, "epoch": 2726} {"train_loss": -12.513778686523438, "global_step": 458010, "epoch": 2726} {"train_loss": -12.395044326782227, "global_step": 458011, "epoch": 2726} {"train_loss": -12.141152381896973, "global_step": 458012, "epoch": 2726} {"train_loss": -11.864762306213379, "global_step": 458013, "epoch": 2726} {"train_loss": -12.668665885925293, "global_step": 458014, "epoch": 2726} {"train_loss": -11.665925979614258, "global_step": 458015, "epoch": 2726} {"train_loss": -12.4224271774292, "global_step": 458016, "epoch": 2726} {"train_loss": -12.118337631225586, "global_step": 458017, "epoch": 2726} {"train_loss": -11.522456169128418, "global_step": 458018, "epoch": 2726} {"train_loss": -11.968280792236328, "global_step": 458019, "epoch": 2726} {"train_loss": -10.914270401000977, "global_step": 458020, "epoch": 2726} {"train_loss": -10.942848205566406, "global_step": 458021, "epoch": 2726} {"train_loss": -11.215486526489258, "global_step": 458022, "epoch": 2726} {"train_loss": -11.644292831420898, "global_step": 458023, "epoch": 2726} {"train_loss": -10.853723526000977, "global_step": 458024, "epoch": 2726} {"train_loss": -12.21524429321289, "global_step": 458025, "epoch": 2726} {"train_loss": -11.26739501953125, "global_step": 458026, "epoch": 2726} {"train_loss": -12.386283874511719, "global_step": 458027, "epoch": 2726} {"train_loss": -11.505928039550781, "global_step": 458028, "epoch": 2726} {"train_loss": -11.494810104370117, "global_step": 458029, "epoch": 2726} {"train_loss": -11.710970878601074, "global_step": 458030, "epoch": 2726} {"train_loss": -11.749120712280273, "global_step": 458031, "epoch": 2726} {"train_loss": -11.809743881225586, "global_step": 458032, "epoch": 2726} {"train_loss": -10.661294937133789, "global_step": 458033, "epoch": 2726} {"train_loss": -11.869607925415039, "global_step": 458034, "epoch": 2726} {"train_loss": -11.764286041259766, "global_step": 458035, "epoch": 2726} {"train_loss": -11.723031997680664, "global_step": 458036, "epoch": 2726} {"train_loss": -11.791455268859863, "global_step": 458037, "epoch": 2726} {"train_loss": -12.103805541992188, "global_step": 458038, "epoch": 2726} {"train_loss": -11.219271659851074, "global_step": 458039, "epoch": 2726} {"train_loss": -11.588369369506836, "global_step": 458040, "epoch": 2726} {"train_loss": -11.9487943649292, "global_step": 458041, "epoch": 2726} {"train_loss": -11.932941436767578, "global_step": 458042, "epoch": 2726} {"train_loss": -12.078332901000977, "global_step": 458043, "epoch": 2726} {"train_loss": -12.637921333312988, "global_step": 458044, "epoch": 2726} {"train_loss": -11.749658584594727, "global_step": 458045, "epoch": 2726} {"train_loss": -12.409708023071289, "global_step": 458046, "epoch": 2726} {"train_loss": -11.876352310180664, "global_step": 458047, "epoch": 2726} {"train_loss": -12.40267276763916, "global_step": 458048, "epoch": 2726} {"train_loss": -12.313484191894531, "global_step": 458049, "epoch": 2726} {"train_loss": -11.733159065246582, "global_step": 458050, "epoch": 2726} {"train_loss": -11.933162689208984, "global_step": 458051, "epoch": 2726} {"train_loss": -12.654419898986816, "global_step": 458052, "epoch": 2726} {"train_loss": -12.286266326904297, "global_step": 458053, "epoch": 2726} {"train_loss": -12.379959106445312, "global_step": 458054, "epoch": 2726} {"train_loss": -12.24409294128418, "global_step": 458055, "epoch": 2726} {"train_loss": -11.828566551208496, "global_step": 458056, "epoch": 2726} {"train_loss": -12.240710258483887, "global_step": 458057, "epoch": 2726} {"train_loss": -12.333797454833984, "global_step": 458058, "epoch": 2726} {"train_loss": -12.064083099365234, "global_step": 458059, "epoch": 2726} {"train_loss": -11.744877815246582, "global_step": 458060, "epoch": 2726} {"train_loss": -12.348448753356934, "global_step": 458061, "epoch": 2726} {"train_loss": -12.177141189575195, "global_step": 458062, "epoch": 2726} {"train_loss": -12.13737964630127, "global_step": 458063, "epoch": 2726} {"train_loss": -12.457195281982422, "global_step": 458064, "epoch": 2726} {"train_loss": -12.535465240478516, "global_step": 458065, "epoch": 2726} {"train_loss": -12.560912132263184, "global_step": 458066, "epoch": 2726} {"train_loss": -12.468439102172852, "global_step": 458067, "epoch": 2726} {"train_loss": -12.241897583007812, "global_step": 458068, "epoch": 2726} {"train_loss": -12.409029006958008, "global_step": 458069, "epoch": 2726} {"train_loss": -12.515583038330078, "global_step": 458070, "epoch": 2726} {"train_loss": -12.490194320678711, "global_step": 458071, "epoch": 2726} {"train_loss": -12.553167343139648, "global_step": 458072, "epoch": 2726} {"train_loss": -12.221607208251953, "global_step": 458073, "epoch": 2726} {"train_loss": -12.507335662841797, "global_step": 458074, "epoch": 2726} {"train_loss": -12.719830513000488, "global_step": 458075, "epoch": 2726} {"train_loss": -12.562047004699707, "global_step": 458076, "epoch": 2726} {"train_loss": -12.816267013549805, "global_step": 458077, "epoch": 2726} {"train_loss": -12.47332763671875, "global_step": 458078, "epoch": 2726} {"train_loss": -12.414048194885254, "global_step": 458079, "epoch": 2726} {"train_loss": -12.6980562210083, "global_step": 458080, "epoch": 2726} {"train_loss": -12.126581192016602, "global_step": 458081, "epoch": 2726} {"train_loss": -12.426722526550293, "global_step": 458082, "epoch": 2726} {"train_loss": -12.639673233032227, "global_step": 458083, "epoch": 2726} {"train_loss": -12.32870101928711, "global_step": 458084, "epoch": 2726} {"train_loss": -12.462570190429688, "global_step": 458085, "epoch": 2726} {"train_loss": -12.904809951782227, "global_step": 458086, "epoch": 2726} {"train_loss": -12.457337379455566, "global_step": 458087, "epoch": 2726} {"train_loss": -12.683048248291016, "global_step": 458088, "epoch": 2726} {"train_loss": -12.80188274383545, "global_step": 458089, "epoch": 2726} {"train_loss": -12.724536895751953, "global_step": 458090, "epoch": 2726} {"train_loss": -12.793912887573242, "global_step": 458091, "epoch": 2726} {"train_loss": -12.658906936645508, "global_step": 458092, "epoch": 2726} {"train_loss": -12.72817611694336, "global_step": 458093, "epoch": 2726} {"train_loss": -12.803984642028809, "global_step": 458094, "epoch": 2726} {"train_loss": -12.921841621398926, "global_step": 458095, "epoch": 2726} {"train_loss": -12.45307731628418, "global_step": 458096, "epoch": 2726} {"train_loss": -12.663557052612305, "global_step": 458097, "epoch": 2726} {"train_loss": -12.78571891784668, "global_step": 458098, "epoch": 2726} {"train_loss": -12.520111083984375, "global_step": 458099, "epoch": 2726} {"train_loss": -12.395322799682617, "global_step": 458100, "epoch": 2726} {"train_loss": -12.418968200683594, "global_step": 458101, "epoch": 2726} {"train_loss": -12.118221282958984, "global_step": 458102, "epoch": 2726} {"train_loss": -12.425034523010254, "global_step": 458103, "epoch": 2726} {"train_loss": -12.701618194580078, "global_step": 458104, "epoch": 2726} {"train_loss": -12.040558815002441, "global_step": 458105, "epoch": 2726} {"train_loss": -12.378467559814453, "global_step": 458106, "epoch": 2726} {"train_loss": -12.762981414794922, "global_step": 458107, "epoch": 2726} {"train_loss": -12.499422073364258, "global_step": 458108, "epoch": 2726} {"train_loss": -12.57512378692627, "global_step": 458109, "epoch": 2726} {"train_loss": -12.49788761138916, "global_step": 458110, "epoch": 2726} {"train_loss": -12.02511978149414, "global_step": 458111, "epoch": 2726} {"train_loss": -12.278778076171875, "global_step": 458112, "epoch": 2726} {"train_loss": -12.505233764648438, "global_step": 458113, "epoch": 2726} {"train_loss": -12.475629806518555, "global_step": 458114, "epoch": 2726} {"train_loss": -12.364280700683594, "global_step": 458115, "epoch": 2726} {"train_loss": -12.445379257202148, "global_step": 458116, "epoch": 2726} {"train_loss": -12.518600463867188, "global_step": 458117, "epoch": 2726} {"train_loss": -12.632911682128906, "global_step": 458118, "epoch": 2726} {"train_loss": -12.154373168945312, "global_step": 458119, "epoch": 2726} {"train_loss": -12.579951286315918, "global_step": 458120, "epoch": 2726} {"train_loss": -12.676811218261719, "global_step": 458121, "epoch": 2726} {"train_loss": -12.780754089355469, "global_step": 458122, "epoch": 2726} {"train_loss": -12.369720458984375, "global_step": 458123, "epoch": 2726} {"train_loss": -12.550573348999023, "global_step": 458124, "epoch": 2726} {"train_loss": -12.532964706420898, "global_step": 458125, "epoch": 2726} {"train_loss": -12.701186180114746, "global_step": 458126, "epoch": 2726} {"train_loss": -12.331774711608887, "global_step": 458127, "epoch": 2726} {"train_loss": -12.461441040039062, "global_step": 458128, "epoch": 2726} {"train_loss": -12.672289848327637, "global_step": 458129, "epoch": 2726} {"train_loss": -12.548171997070312, "global_step": 458130, "epoch": 2726} {"train_loss": -12.874984741210938, "global_step": 458131, "epoch": 2726} {"train_loss": -12.488991737365723, "global_step": 458132, "epoch": 2726} {"train_loss": -12.773701667785645, "global_step": 458133, "epoch": 2726} {"train_loss": -12.70492172241211, "global_step": 458134, "epoch": 2726} {"train_loss": -12.376456584249224, "global_step": 458135, "epoch": 2726, "val_loss": 314947.09375} {"train_loss": -12.814077377319336, "global_step": 458136, "epoch": 2727} {"train_loss": -12.587383270263672, "global_step": 458137, "epoch": 2727} {"train_loss": -12.696008682250977, "global_step": 458138, "epoch": 2727} {"train_loss": -12.299221992492676, "global_step": 458139, "epoch": 2727} {"train_loss": -12.19157600402832, "global_step": 458140, "epoch": 2727} {"train_loss": -12.512534141540527, "global_step": 458141, "epoch": 2727} {"train_loss": -12.931137084960938, "global_step": 458142, "epoch": 2727} {"train_loss": -12.359781265258789, "global_step": 458143, "epoch": 2727} {"train_loss": -12.234109878540039, "global_step": 458144, "epoch": 2727} {"train_loss": -12.680146217346191, "global_step": 458145, "epoch": 2727} {"train_loss": -12.514256477355957, "global_step": 458146, "epoch": 2727} {"train_loss": -12.10131549835205, "global_step": 458147, "epoch": 2727} {"train_loss": -11.696325302124023, "global_step": 458148, "epoch": 2727} {"train_loss": -12.256630897521973, "global_step": 458149, "epoch": 2727} {"train_loss": -12.522695541381836, "global_step": 458150, "epoch": 2727} {"train_loss": -12.151641845703125, "global_step": 458151, "epoch": 2727} {"train_loss": -11.702741622924805, "global_step": 458152, "epoch": 2727} {"train_loss": -12.849376678466797, "global_step": 458153, "epoch": 2727} {"train_loss": -12.328330039978027, "global_step": 458154, "epoch": 2727} {"train_loss": -12.178472518920898, "global_step": 458155, "epoch": 2727} {"train_loss": -12.006179809570312, "global_step": 458156, "epoch": 2727} {"train_loss": -12.57020378112793, "global_step": 458157, "epoch": 2727} {"train_loss": -12.844919204711914, "global_step": 458158, "epoch": 2727} {"train_loss": -12.362339973449707, "global_step": 458159, "epoch": 2727} {"train_loss": -12.43192195892334, "global_step": 458160, "epoch": 2727} {"train_loss": -12.771544456481934, "global_step": 458161, "epoch": 2727} {"train_loss": -12.62759780883789, "global_step": 458162, "epoch": 2727} {"train_loss": -12.915840148925781, "global_step": 458163, "epoch": 2727} {"train_loss": -12.681747436523438, "global_step": 458164, "epoch": 2727} {"train_loss": -12.561887741088867, "global_step": 458165, "epoch": 2727} {"train_loss": -12.636474609375, "global_step": 458166, "epoch": 2727} {"train_loss": -12.72177791595459, "global_step": 458167, "epoch": 2727} {"train_loss": -12.412725448608398, "global_step": 458168, "epoch": 2727} {"train_loss": -12.77225112915039, "global_step": 458169, "epoch": 2727} {"train_loss": -12.706905364990234, "global_step": 458170, "epoch": 2727} {"train_loss": -12.71696662902832, "global_step": 458171, "epoch": 2727} {"train_loss": -12.568340301513672, "global_step": 458172, "epoch": 2727} {"train_loss": -12.706337928771973, "global_step": 458173, "epoch": 2727} {"train_loss": -12.706140518188477, "global_step": 458174, "epoch": 2727} {"train_loss": -12.907183647155762, "global_step": 458175, "epoch": 2727} {"train_loss": -12.488262176513672, "global_step": 458176, "epoch": 2727} {"train_loss": -12.694271087646484, "global_step": 458177, "epoch": 2727} {"train_loss": -12.507725715637207, "global_step": 458178, "epoch": 2727} {"train_loss": -11.508371353149414, "global_step": 458179, "epoch": 2727} {"train_loss": -12.53618335723877, "global_step": 458180, "epoch": 2727} {"train_loss": -10.507320404052734, "global_step": 458181, "epoch": 2727} {"train_loss": -12.335498809814453, "global_step": 458182, "epoch": 2727} {"train_loss": -11.682151794433594, "global_step": 458183, "epoch": 2727} {"train_loss": -11.657681465148926, "global_step": 458184, "epoch": 2727} {"train_loss": -11.8292236328125, "global_step": 458185, "epoch": 2727} {"train_loss": -10.376245498657227, "global_step": 458186, "epoch": 2727} {"train_loss": -10.5485200881958, "global_step": 458187, "epoch": 2727} {"train_loss": -9.787530899047852, "global_step": 458188, "epoch": 2727} {"train_loss": -11.351452827453613, "global_step": 458189, "epoch": 2727} {"train_loss": -10.048959732055664, "global_step": 458190, "epoch": 2727} {"train_loss": -9.504793167114258, "global_step": 458191, "epoch": 2727} {"train_loss": -10.492066383361816, "global_step": 458192, "epoch": 2727} {"train_loss": -9.554830551147461, "global_step": 458193, "epoch": 2727} {"train_loss": -10.242414474487305, "global_step": 458194, "epoch": 2727} {"train_loss": -11.284269332885742, "global_step": 458195, "epoch": 2727} {"train_loss": -10.850051879882812, "global_step": 458196, "epoch": 2727} {"train_loss": -11.542268753051758, "global_step": 458197, "epoch": 2727} {"train_loss": -11.099401473999023, "global_step": 458198, "epoch": 2727} {"train_loss": -10.139100074768066, "global_step": 458199, "epoch": 2727} {"train_loss": -11.143507957458496, "global_step": 458200, "epoch": 2727} {"train_loss": -10.206001281738281, "global_step": 458201, "epoch": 2727} {"train_loss": -11.65412712097168, "global_step": 458202, "epoch": 2727} {"train_loss": -10.829510688781738, "global_step": 458203, "epoch": 2727} {"train_loss": -11.535844802856445, "global_step": 458204, "epoch": 2727} {"train_loss": -11.739831924438477, "global_step": 458205, "epoch": 2727} {"train_loss": -11.91296672821045, "global_step": 458206, "epoch": 2727} {"train_loss": -11.753952026367188, "global_step": 458207, "epoch": 2727} {"train_loss": -11.955171585083008, "global_step": 458208, "epoch": 2727} {"train_loss": -11.833767890930176, "global_step": 458209, "epoch": 2727} {"train_loss": -11.982351303100586, "global_step": 458210, "epoch": 2727} {"train_loss": -12.047744750976562, "global_step": 458211, "epoch": 2727} {"train_loss": -11.472478866577148, "global_step": 458212, "epoch": 2727} {"train_loss": -12.233125686645508, "global_step": 458213, "epoch": 2727} {"train_loss": -12.034830093383789, "global_step": 458214, "epoch": 2727} {"train_loss": -11.287042617797852, "global_step": 458215, "epoch": 2727} {"train_loss": -12.150217056274414, "global_step": 458216, "epoch": 2727} {"train_loss": -11.48740291595459, "global_step": 458217, "epoch": 2727} {"train_loss": -12.03244400024414, "global_step": 458218, "epoch": 2727} {"train_loss": -12.113889694213867, "global_step": 458219, "epoch": 2727} {"train_loss": -11.895662307739258, "global_step": 458220, "epoch": 2727} {"train_loss": -12.054759979248047, "global_step": 458221, "epoch": 2727} {"train_loss": -12.141728401184082, "global_step": 458222, "epoch": 2727} {"train_loss": -12.260881423950195, "global_step": 458223, "epoch": 2727} {"train_loss": -12.128217697143555, "global_step": 458224, "epoch": 2727} {"train_loss": -12.407208442687988, "global_step": 458225, "epoch": 2727} {"train_loss": -12.131206512451172, "global_step": 458226, "epoch": 2727} {"train_loss": -12.164660453796387, "global_step": 458227, "epoch": 2727} {"train_loss": -12.154314041137695, "global_step": 458228, "epoch": 2727} {"train_loss": -12.036747932434082, "global_step": 458229, "epoch": 2727} {"train_loss": -11.934735298156738, "global_step": 458230, "epoch": 2727} {"train_loss": -11.870927810668945, "global_step": 458231, "epoch": 2727} {"train_loss": -12.457744598388672, "global_step": 458232, "epoch": 2727} {"train_loss": -11.841255187988281, "global_step": 458233, "epoch": 2727} {"train_loss": -12.499411582946777, "global_step": 458234, "epoch": 2727} {"train_loss": -11.776866912841797, "global_step": 458235, "epoch": 2727} {"train_loss": -12.4407958984375, "global_step": 458236, "epoch": 2727} {"train_loss": -11.492198944091797, "global_step": 458237, "epoch": 2727} {"train_loss": -12.385052680969238, "global_step": 458238, "epoch": 2727} {"train_loss": -11.775535583496094, "global_step": 458239, "epoch": 2727} {"train_loss": -12.330846786499023, "global_step": 458240, "epoch": 2727} {"train_loss": -12.058475494384766, "global_step": 458241, "epoch": 2727} {"train_loss": -12.18185043334961, "global_step": 458242, "epoch": 2727} {"train_loss": -12.244277954101562, "global_step": 458243, "epoch": 2727} {"train_loss": -12.243656158447266, "global_step": 458244, "epoch": 2727} {"train_loss": -12.257373809814453, "global_step": 458245, "epoch": 2727} {"train_loss": -12.145304679870605, "global_step": 458246, "epoch": 2727} {"train_loss": -12.095062255859375, "global_step": 458247, "epoch": 2727} {"train_loss": -11.95826244354248, "global_step": 458248, "epoch": 2727} {"train_loss": -12.411147117614746, "global_step": 458249, "epoch": 2727} {"train_loss": -12.524978637695312, "global_step": 458250, "epoch": 2727} {"train_loss": -12.267682075500488, "global_step": 458251, "epoch": 2727} {"train_loss": -12.181310653686523, "global_step": 458252, "epoch": 2727} {"train_loss": -12.591377258300781, "global_step": 458253, "epoch": 2727} {"train_loss": -12.42512321472168, "global_step": 458254, "epoch": 2727} {"train_loss": -12.260836601257324, "global_step": 458255, "epoch": 2727} {"train_loss": -12.36552619934082, "global_step": 458256, "epoch": 2727} {"train_loss": -12.01317310333252, "global_step": 458257, "epoch": 2727} {"train_loss": -12.42172622680664, "global_step": 458258, "epoch": 2727} {"train_loss": -12.436532974243164, "global_step": 458259, "epoch": 2727} {"train_loss": -12.358556747436523, "global_step": 458260, "epoch": 2727} {"train_loss": -12.601187705993652, "global_step": 458261, "epoch": 2727} {"train_loss": -12.283391952514648, "global_step": 458262, "epoch": 2727} {"train_loss": -12.662469863891602, "global_step": 458263, "epoch": 2727} {"train_loss": -12.449311256408691, "global_step": 458264, "epoch": 2727} {"train_loss": -12.609783172607422, "global_step": 458265, "epoch": 2727} {"train_loss": -12.406585693359375, "global_step": 458266, "epoch": 2727} {"train_loss": -12.379693984985352, "global_step": 458267, "epoch": 2727} {"train_loss": -12.75322151184082, "global_step": 458268, "epoch": 2727} {"train_loss": -12.590046882629395, "global_step": 458269, "epoch": 2727} {"train_loss": -12.474382400512695, "global_step": 458270, "epoch": 2727} {"train_loss": -12.575641632080078, "global_step": 458271, "epoch": 2727} {"train_loss": -12.527750015258789, "global_step": 458272, "epoch": 2727} {"train_loss": -12.449416160583496, "global_step": 458273, "epoch": 2727} {"train_loss": -12.619474411010742, "global_step": 458274, "epoch": 2727} {"train_loss": -12.39959716796875, "global_step": 458275, "epoch": 2727} {"train_loss": -12.725605010986328, "global_step": 458276, "epoch": 2727} {"train_loss": -12.512486457824707, "global_step": 458277, "epoch": 2727} {"train_loss": -12.461633682250977, "global_step": 458278, "epoch": 2727} {"train_loss": -12.773561477661133, "global_step": 458279, "epoch": 2727} {"train_loss": -12.615748405456543, "global_step": 458280, "epoch": 2727} {"train_loss": -12.913105964660645, "global_step": 458281, "epoch": 2727} {"train_loss": -12.604120254516602, "global_step": 458282, "epoch": 2727} {"train_loss": -12.541278839111328, "global_step": 458283, "epoch": 2727} {"train_loss": -12.593454360961914, "global_step": 458284, "epoch": 2727} {"train_loss": -12.478805541992188, "global_step": 458285, "epoch": 2727} {"train_loss": -12.265973091125488, "global_step": 458286, "epoch": 2727} {"train_loss": -12.451807022094727, "global_step": 458287, "epoch": 2727} {"train_loss": -11.935111999511719, "global_step": 458288, "epoch": 2727} {"train_loss": -12.461616516113281, "global_step": 458289, "epoch": 2727} {"train_loss": -12.421778678894043, "global_step": 458290, "epoch": 2727} {"train_loss": -12.367009162902832, "global_step": 458291, "epoch": 2727} {"train_loss": -12.457439422607422, "global_step": 458292, "epoch": 2727} {"train_loss": -12.898419380187988, "global_step": 458293, "epoch": 2727} {"train_loss": -12.544990539550781, "global_step": 458294, "epoch": 2727} {"train_loss": -12.783225059509277, "global_step": 458295, "epoch": 2727} {"train_loss": -12.411641120910645, "global_step": 458296, "epoch": 2727} {"train_loss": -12.459131240844727, "global_step": 458297, "epoch": 2727} {"train_loss": -12.74937629699707, "global_step": 458298, "epoch": 2727} {"train_loss": -12.621496200561523, "global_step": 458299, "epoch": 2727} {"train_loss": -12.752538681030273, "global_step": 458300, "epoch": 2727} {"train_loss": -12.867269515991211, "global_step": 458301, "epoch": 2727} {"train_loss": -12.436361312866211, "global_step": 458302, "epoch": 2727} {"train_loss": -12.140004050163995, "global_step": 458303, "epoch": 2727, "val_loss": 315922.875} {"train_loss": -12.710054397583008, "global_step": 458304, "epoch": 2728} {"train_loss": -12.535006523132324, "global_step": 458305, "epoch": 2728} {"train_loss": -12.726228713989258, "global_step": 458306, "epoch": 2728} {"train_loss": -12.590892791748047, "global_step": 458307, "epoch": 2728} {"train_loss": -12.839521408081055, "global_step": 458308, "epoch": 2728} {"train_loss": -12.451803207397461, "global_step": 458309, "epoch": 2728} {"train_loss": -12.731680870056152, "global_step": 458310, "epoch": 2728} {"train_loss": -12.724287033081055, "global_step": 458311, "epoch": 2728} {"train_loss": -12.403092384338379, "global_step": 458312, "epoch": 2728} {"train_loss": -12.837066650390625, "global_step": 458313, "epoch": 2728} {"train_loss": -12.572803497314453, "global_step": 458314, "epoch": 2728} {"train_loss": -12.540708541870117, "global_step": 458315, "epoch": 2728} {"train_loss": -12.665292739868164, "global_step": 458316, "epoch": 2728} {"train_loss": -12.372891426086426, "global_step": 458317, "epoch": 2728} {"train_loss": -12.666767120361328, "global_step": 458318, "epoch": 2728} {"train_loss": -12.679638862609863, "global_step": 458319, "epoch": 2728} {"train_loss": -12.40640640258789, "global_step": 458320, "epoch": 2728} {"train_loss": -12.827919006347656, "global_step": 458321, "epoch": 2728} {"train_loss": -12.831496238708496, "global_step": 458322, "epoch": 2728} {"train_loss": -12.306873321533203, "global_step": 458323, "epoch": 2728} {"train_loss": -12.12160873413086, "global_step": 458324, "epoch": 2728} {"train_loss": -12.567733764648438, "global_step": 458325, "epoch": 2728} {"train_loss": -12.23017692565918, "global_step": 458326, "epoch": 2728} {"train_loss": -12.400092124938965, "global_step": 458327, "epoch": 2728} {"train_loss": -11.881969451904297, "global_step": 458328, "epoch": 2728} {"train_loss": -12.234650611877441, "global_step": 458329, "epoch": 2728} {"train_loss": -12.24271011352539, "global_step": 458330, "epoch": 2728} {"train_loss": -11.362265586853027, "global_step": 458331, "epoch": 2728} {"train_loss": -11.465679168701172, "global_step": 458332, "epoch": 2728} {"train_loss": -12.842175483703613, "global_step": 458333, "epoch": 2728} {"train_loss": -10.726340293884277, "global_step": 458334, "epoch": 2728} {"train_loss": -11.644454956054688, "global_step": 458335, "epoch": 2728} {"train_loss": -11.785265922546387, "global_step": 458336, "epoch": 2728} {"train_loss": -10.918492317199707, "global_step": 458337, "epoch": 2728} {"train_loss": -11.657217025756836, "global_step": 458338, "epoch": 2728} {"train_loss": -9.008853912353516, "global_step": 458339, "epoch": 2728} {"train_loss": -10.873257637023926, "global_step": 458340, "epoch": 2728} {"train_loss": -10.076059341430664, "global_step": 458341, "epoch": 2728} {"train_loss": -12.063714981079102, "global_step": 458342, "epoch": 2728} {"train_loss": -9.493561744689941, "global_step": 458343, "epoch": 2728} {"train_loss": -11.423901557922363, "global_step": 458344, "epoch": 2728} {"train_loss": -9.983848571777344, "global_step": 458345, "epoch": 2728} {"train_loss": -11.226139068603516, "global_step": 458346, "epoch": 2728} {"train_loss": -9.525411605834961, "global_step": 458347, "epoch": 2728} {"train_loss": -8.766698837280273, "global_step": 458348, "epoch": 2728} {"train_loss": -9.956554412841797, "global_step": 458349, "epoch": 2728} {"train_loss": -11.244014739990234, "global_step": 458350, "epoch": 2728} {"train_loss": -9.108396530151367, "global_step": 458351, "epoch": 2728} {"train_loss": -9.592106819152832, "global_step": 458352, "epoch": 2728} {"train_loss": -10.591943740844727, "global_step": 458353, "epoch": 2728} {"train_loss": -9.245223045349121, "global_step": 458354, "epoch": 2728} {"train_loss": -10.123337745666504, "global_step": 458355, "epoch": 2728} {"train_loss": -11.162094116210938, "global_step": 458356, "epoch": 2728} {"train_loss": -9.425105094909668, "global_step": 458357, "epoch": 2728} {"train_loss": -10.960504531860352, "global_step": 458358, "epoch": 2728} {"train_loss": -11.197633743286133, "global_step": 458359, "epoch": 2728} {"train_loss": -10.80592155456543, "global_step": 458360, "epoch": 2728} {"train_loss": -11.3164644241333, "global_step": 458361, "epoch": 2728} {"train_loss": -11.448934555053711, "global_step": 458362, "epoch": 2728} {"train_loss": -11.940324783325195, "global_step": 458363, "epoch": 2728} {"train_loss": -11.329780578613281, "global_step": 458364, "epoch": 2728} {"train_loss": -11.603409767150879, "global_step": 458365, "epoch": 2728} {"train_loss": -11.890768051147461, "global_step": 458366, "epoch": 2728} {"train_loss": -11.80093002319336, "global_step": 458367, "epoch": 2728} {"train_loss": -11.525130271911621, "global_step": 458368, "epoch": 2728} {"train_loss": -11.671276092529297, "global_step": 458369, "epoch": 2728} {"train_loss": -11.31205940246582, "global_step": 458370, "epoch": 2728} {"train_loss": -11.524691581726074, "global_step": 458371, "epoch": 2728} {"train_loss": -11.610712051391602, "global_step": 458372, "epoch": 2728} {"train_loss": -11.527278900146484, "global_step": 458373, "epoch": 2728} {"train_loss": -12.3277587890625, "global_step": 458374, "epoch": 2728} {"train_loss": -11.371522903442383, "global_step": 458375, "epoch": 2728} {"train_loss": -12.231193542480469, "global_step": 458376, "epoch": 2728} {"train_loss": -11.825617790222168, "global_step": 458377, "epoch": 2728} {"train_loss": -12.237466812133789, "global_step": 458378, "epoch": 2728} {"train_loss": -11.815664291381836, "global_step": 458379, "epoch": 2728} {"train_loss": -12.454636573791504, "global_step": 458380, "epoch": 2728} {"train_loss": -12.107518196105957, "global_step": 458381, "epoch": 2728} {"train_loss": -12.03793716430664, "global_step": 458382, "epoch": 2728} {"train_loss": -11.926868438720703, "global_step": 458383, "epoch": 2728} {"train_loss": -12.30247688293457, "global_step": 458384, "epoch": 2728} {"train_loss": -12.300865173339844, "global_step": 458385, "epoch": 2728} {"train_loss": -12.183486938476562, "global_step": 458386, "epoch": 2728} {"train_loss": -12.033195495605469, "global_step": 458387, "epoch": 2728} {"train_loss": -12.413224220275879, "global_step": 458388, "epoch": 2728} {"train_loss": -12.458332061767578, "global_step": 458389, "epoch": 2728} {"train_loss": -12.61934757232666, "global_step": 458390, "epoch": 2728} {"train_loss": -12.212562561035156, "global_step": 458391, "epoch": 2728} {"train_loss": -12.385089874267578, "global_step": 458392, "epoch": 2728} {"train_loss": -11.8712158203125, "global_step": 458393, "epoch": 2728} {"train_loss": -12.475996971130371, "global_step": 458394, "epoch": 2728} {"train_loss": -11.971083641052246, "global_step": 458395, "epoch": 2728} {"train_loss": -11.821563720703125, "global_step": 458396, "epoch": 2728} {"train_loss": -12.27220630645752, "global_step": 458397, "epoch": 2728} {"train_loss": -11.907255172729492, "global_step": 458398, "epoch": 2728} {"train_loss": -11.429931640625, "global_step": 458399, "epoch": 2728} {"train_loss": -12.437101364135742, "global_step": 458400, "epoch": 2728} {"train_loss": -11.582683563232422, "global_step": 458401, "epoch": 2728} {"train_loss": -12.342089653015137, "global_step": 458402, "epoch": 2728} {"train_loss": -11.787304878234863, "global_step": 458403, "epoch": 2728} {"train_loss": -12.115340232849121, "global_step": 458404, "epoch": 2728} {"train_loss": -12.059947967529297, "global_step": 458405, "epoch": 2728} {"train_loss": -12.155027389526367, "global_step": 458406, "epoch": 2728} {"train_loss": -12.293425559997559, "global_step": 458407, "epoch": 2728} {"train_loss": -12.366737365722656, "global_step": 458408, "epoch": 2728} {"train_loss": -11.793927192687988, "global_step": 458409, "epoch": 2728} {"train_loss": -12.241537094116211, "global_step": 458410, "epoch": 2728} {"train_loss": -11.781255722045898, "global_step": 458411, "epoch": 2728} {"train_loss": -12.329551696777344, "global_step": 458412, "epoch": 2728} {"train_loss": -12.42891788482666, "global_step": 458413, "epoch": 2728} {"train_loss": -12.570119857788086, "global_step": 458414, "epoch": 2728} {"train_loss": -12.407918930053711, "global_step": 458415, "epoch": 2728} {"train_loss": -12.437158584594727, "global_step": 458416, "epoch": 2728} {"train_loss": -12.298816680908203, "global_step": 458417, "epoch": 2728} {"train_loss": -12.429779052734375, "global_step": 458418, "epoch": 2728} {"train_loss": -12.16470718383789, "global_step": 458419, "epoch": 2728} {"train_loss": -12.553991317749023, "global_step": 458420, "epoch": 2728} {"train_loss": -12.210071563720703, "global_step": 458421, "epoch": 2728} {"train_loss": -12.525346755981445, "global_step": 458422, "epoch": 2728} {"train_loss": -12.500317573547363, "global_step": 458423, "epoch": 2728} {"train_loss": -12.319175720214844, "global_step": 458424, "epoch": 2728} {"train_loss": -12.770442962646484, "global_step": 458425, "epoch": 2728} {"train_loss": -12.75878620147705, "global_step": 458426, "epoch": 2728} {"train_loss": -12.617589950561523, "global_step": 458427, "epoch": 2728} {"train_loss": -12.652860641479492, "global_step": 458428, "epoch": 2728} {"train_loss": -12.593244552612305, "global_step": 458429, "epoch": 2728} {"train_loss": -12.690287590026855, "global_step": 458430, "epoch": 2728} {"train_loss": -12.753661155700684, "global_step": 458431, "epoch": 2728} {"train_loss": -12.560222625732422, "global_step": 458432, "epoch": 2728} {"train_loss": -12.669594764709473, "global_step": 458433, "epoch": 2728} {"train_loss": -12.798404693603516, "global_step": 458434, "epoch": 2728} {"train_loss": -12.743082046508789, "global_step": 458435, "epoch": 2728} {"train_loss": -12.647499084472656, "global_step": 458436, "epoch": 2728} {"train_loss": -12.719666481018066, "global_step": 458437, "epoch": 2728} {"train_loss": -12.664228439331055, "global_step": 458438, "epoch": 2728} {"train_loss": -12.691837310791016, "global_step": 458439, "epoch": 2728} {"train_loss": -12.572613716125488, "global_step": 458440, "epoch": 2728} {"train_loss": -12.705615997314453, "global_step": 458441, "epoch": 2728} {"train_loss": -12.64647102355957, "global_step": 458442, "epoch": 2728} {"train_loss": -12.617948532104492, "global_step": 458443, "epoch": 2728} {"train_loss": -12.586057662963867, "global_step": 458444, "epoch": 2728} {"train_loss": -12.782002449035645, "global_step": 458445, "epoch": 2728} {"train_loss": -12.58731460571289, "global_step": 458446, "epoch": 2728} {"train_loss": -12.5784273147583, "global_step": 458447, "epoch": 2728} {"train_loss": -12.797957420349121, "global_step": 458448, "epoch": 2728} {"train_loss": -12.446670532226562, "global_step": 458449, "epoch": 2728} {"train_loss": -12.64077377319336, "global_step": 458450, "epoch": 2728} {"train_loss": -12.428900718688965, "global_step": 458451, "epoch": 2728} {"train_loss": -12.74769115447998, "global_step": 458452, "epoch": 2728} {"train_loss": -12.283287048339844, "global_step": 458453, "epoch": 2728} {"train_loss": -12.619441032409668, "global_step": 458454, "epoch": 2728} {"train_loss": -12.927001953125, "global_step": 458455, "epoch": 2728} {"train_loss": -12.75611686706543, "global_step": 458456, "epoch": 2728} {"train_loss": -12.67504596710205, "global_step": 458457, "epoch": 2728} {"train_loss": -12.805400848388672, "global_step": 458458, "epoch": 2728} {"train_loss": -12.504950523376465, "global_step": 458459, "epoch": 2728} {"train_loss": -12.847272872924805, "global_step": 458460, "epoch": 2728} {"train_loss": -12.744152069091797, "global_step": 458461, "epoch": 2728} {"train_loss": -12.781600952148438, "global_step": 458462, "epoch": 2728} {"train_loss": -12.523743629455566, "global_step": 458463, "epoch": 2728} {"train_loss": -12.478127479553223, "global_step": 458464, "epoch": 2728} {"train_loss": -12.829669952392578, "global_step": 458465, "epoch": 2728} {"train_loss": -12.938359260559082, "global_step": 458466, "epoch": 2728} {"train_loss": -12.847494125366211, "global_step": 458467, "epoch": 2728} {"train_loss": -12.540912628173828, "global_step": 458468, "epoch": 2728} {"train_loss": -12.345247268676758, "global_step": 458469, "epoch": 2728} {"train_loss": -12.584817886352539, "global_step": 458470, "epoch": 2728} {"train_loss": -12.042473997388567, "global_step": 458471, "epoch": 2728, "val_loss": 305788.5625} {"train_loss": -12.571958541870117, "global_step": 458472, "epoch": 2729} {"train_loss": -12.402875900268555, "global_step": 458473, "epoch": 2729} {"train_loss": -12.184736251831055, "global_step": 458474, "epoch": 2729} {"train_loss": -12.546497344970703, "global_step": 458475, "epoch": 2729} {"train_loss": -12.443870544433594, "global_step": 458476, "epoch": 2729} {"train_loss": -12.681831359863281, "global_step": 458477, "epoch": 2729} {"train_loss": -12.625957489013672, "global_step": 458478, "epoch": 2729} {"train_loss": -12.396713256835938, "global_step": 458479, "epoch": 2729} {"train_loss": -12.270347595214844, "global_step": 458480, "epoch": 2729} {"train_loss": -12.792211532592773, "global_step": 458481, "epoch": 2729} {"train_loss": -12.498113632202148, "global_step": 458482, "epoch": 2729} {"train_loss": -11.931137084960938, "global_step": 458483, "epoch": 2729} {"train_loss": -12.202839851379395, "global_step": 458484, "epoch": 2729} {"train_loss": -12.834174156188965, "global_step": 458485, "epoch": 2729} {"train_loss": -12.569673538208008, "global_step": 458486, "epoch": 2729} {"train_loss": -12.237098693847656, "global_step": 458487, "epoch": 2729} {"train_loss": -12.682697296142578, "global_step": 458488, "epoch": 2729} {"train_loss": -12.512678146362305, "global_step": 458489, "epoch": 2729} {"train_loss": -12.613081932067871, "global_step": 458490, "epoch": 2729} {"train_loss": -12.396038055419922, "global_step": 458491, "epoch": 2729} {"train_loss": -12.79937744140625, "global_step": 458492, "epoch": 2729} {"train_loss": -12.731826782226562, "global_step": 458493, "epoch": 2729} {"train_loss": -11.714814186096191, "global_step": 458494, "epoch": 2729} {"train_loss": -12.205060958862305, "global_step": 458495, "epoch": 2729} {"train_loss": -12.015281677246094, "global_step": 458496, "epoch": 2729} {"train_loss": -11.930334091186523, "global_step": 458497, "epoch": 2729} {"train_loss": -11.701370239257812, "global_step": 458498, "epoch": 2729} {"train_loss": -11.736994743347168, "global_step": 458499, "epoch": 2729} {"train_loss": -12.048006057739258, "global_step": 458500, "epoch": 2729} {"train_loss": -12.34097671508789, "global_step": 458501, "epoch": 2729} {"train_loss": -11.499088287353516, "global_step": 458502, "epoch": 2729} {"train_loss": -11.710070610046387, "global_step": 458503, "epoch": 2729} {"train_loss": -12.301673889160156, "global_step": 458504, "epoch": 2729} {"train_loss": -11.46885871887207, "global_step": 458505, "epoch": 2729} {"train_loss": -11.409473419189453, "global_step": 458506, "epoch": 2729} {"train_loss": -10.777837753295898, "global_step": 458507, "epoch": 2729} {"train_loss": -12.139577865600586, "global_step": 458508, "epoch": 2729} {"train_loss": -10.979040145874023, "global_step": 458509, "epoch": 2729} {"train_loss": -10.45833969116211, "global_step": 458510, "epoch": 2729} {"train_loss": -11.53309440612793, "global_step": 458511, "epoch": 2729} {"train_loss": -9.513511657714844, "global_step": 458512, "epoch": 2729} {"train_loss": -11.385698318481445, "global_step": 458513, "epoch": 2729} {"train_loss": -9.189875602722168, "global_step": 458514, "epoch": 2729} {"train_loss": -9.60019302368164, "global_step": 458515, "epoch": 2729} {"train_loss": -9.245609283447266, "global_step": 458516, "epoch": 2729} {"train_loss": -10.089003562927246, "global_step": 458517, "epoch": 2729} {"train_loss": -10.220457077026367, "global_step": 458518, "epoch": 2729} {"train_loss": -9.036888122558594, "global_step": 458519, "epoch": 2729} {"train_loss": -8.078758239746094, "global_step": 458520, "epoch": 2729} {"train_loss": -8.571399688720703, "global_step": 458521, "epoch": 2729} {"train_loss": -8.158230781555176, "global_step": 458522, "epoch": 2729} {"train_loss": -9.266060829162598, "global_step": 458523, "epoch": 2729} {"train_loss": -9.741958618164062, "global_step": 458524, "epoch": 2729} {"train_loss": -10.015748977661133, "global_step": 458525, "epoch": 2729} {"train_loss": -8.60593032836914, "global_step": 458526, "epoch": 2729} {"train_loss": -9.373161315917969, "global_step": 458527, "epoch": 2729} {"train_loss": -9.75179672241211, "global_step": 458528, "epoch": 2729} {"train_loss": -10.176509857177734, "global_step": 458529, "epoch": 2729} {"train_loss": -10.52552318572998, "global_step": 458530, "epoch": 2729} {"train_loss": -10.826555252075195, "global_step": 458531, "epoch": 2729} {"train_loss": -10.698053359985352, "global_step": 458532, "epoch": 2729} {"train_loss": -11.153812408447266, "global_step": 458533, "epoch": 2729} {"train_loss": -10.135112762451172, "global_step": 458534, "epoch": 2729} {"train_loss": -9.985143661499023, "global_step": 458535, "epoch": 2729} {"train_loss": -9.919529914855957, "global_step": 458536, "epoch": 2729} {"train_loss": -10.73517894744873, "global_step": 458537, "epoch": 2729} {"train_loss": -10.937357902526855, "global_step": 458538, "epoch": 2729} {"train_loss": -11.399015426635742, "global_step": 458539, "epoch": 2729} {"train_loss": -11.266672134399414, "global_step": 458540, "epoch": 2729} {"train_loss": -11.73726749420166, "global_step": 458541, "epoch": 2729} {"train_loss": -11.297916412353516, "global_step": 458542, "epoch": 2729} {"train_loss": -11.42750358581543, "global_step": 458543, "epoch": 2729} {"train_loss": -11.501678466796875, "global_step": 458544, "epoch": 2729} {"train_loss": -11.290071487426758, "global_step": 458545, "epoch": 2729} {"train_loss": -11.492691993713379, "global_step": 458546, "epoch": 2729} {"train_loss": -10.745323181152344, "global_step": 458547, "epoch": 2729} {"train_loss": -11.653082847595215, "global_step": 458548, "epoch": 2729} {"train_loss": -11.104389190673828, "global_step": 458549, "epoch": 2729} {"train_loss": -11.245431900024414, "global_step": 458550, "epoch": 2729} {"train_loss": -11.075817108154297, "global_step": 458551, "epoch": 2729} {"train_loss": -10.829574584960938, "global_step": 458552, "epoch": 2729} {"train_loss": -11.618585586547852, "global_step": 458553, "epoch": 2729} {"train_loss": -11.40355110168457, "global_step": 458554, "epoch": 2729} {"train_loss": -11.977928161621094, "global_step": 458555, "epoch": 2729} {"train_loss": -11.358665466308594, "global_step": 458556, "epoch": 2729} {"train_loss": -11.93270492553711, "global_step": 458557, "epoch": 2729} {"train_loss": -11.773788452148438, "global_step": 458558, "epoch": 2729} {"train_loss": -12.069380760192871, "global_step": 458559, "epoch": 2729} {"train_loss": -11.93964958190918, "global_step": 458560, "epoch": 2729} {"train_loss": -11.765382766723633, "global_step": 458561, "epoch": 2729} {"train_loss": -12.137248039245605, "global_step": 458562, "epoch": 2729} {"train_loss": -11.982129096984863, "global_step": 458563, "epoch": 2729} {"train_loss": -11.879337310791016, "global_step": 458564, "epoch": 2729} {"train_loss": -12.00762939453125, "global_step": 458565, "epoch": 2729} {"train_loss": -11.768608093261719, "global_step": 458566, "epoch": 2729} {"train_loss": -11.843542098999023, "global_step": 458567, "epoch": 2729} {"train_loss": -12.1033353805542, "global_step": 458568, "epoch": 2729} {"train_loss": -12.19097900390625, "global_step": 458569, "epoch": 2729} {"train_loss": -12.272806167602539, "global_step": 458570, "epoch": 2729} {"train_loss": -12.240653991699219, "global_step": 458571, "epoch": 2729} {"train_loss": -12.0974702835083, "global_step": 458572, "epoch": 2729} {"train_loss": -11.984869956970215, "global_step": 458573, "epoch": 2729} {"train_loss": -12.521949768066406, "global_step": 458574, "epoch": 2729} {"train_loss": -11.902442932128906, "global_step": 458575, "epoch": 2729} {"train_loss": -12.218429565429688, "global_step": 458576, "epoch": 2729} {"train_loss": -12.382707595825195, "global_step": 458577, "epoch": 2729} {"train_loss": -12.499835968017578, "global_step": 458578, "epoch": 2729} {"train_loss": -12.36604118347168, "global_step": 458579, "epoch": 2729} {"train_loss": -12.355742454528809, "global_step": 458580, "epoch": 2729} {"train_loss": -12.506949424743652, "global_step": 458581, "epoch": 2729} {"train_loss": -12.455020904541016, "global_step": 458582, "epoch": 2729} {"train_loss": -12.512800216674805, "global_step": 458583, "epoch": 2729} {"train_loss": -12.688095092773438, "global_step": 458584, "epoch": 2729} {"train_loss": -12.569452285766602, "global_step": 458585, "epoch": 2729} {"train_loss": -12.545642852783203, "global_step": 458586, "epoch": 2729} {"train_loss": -12.678875923156738, "global_step": 458587, "epoch": 2729} {"train_loss": -12.446639060974121, "global_step": 458588, "epoch": 2729} {"train_loss": -12.493064880371094, "global_step": 458589, "epoch": 2729} {"train_loss": -12.550552368164062, "global_step": 458590, "epoch": 2729} {"train_loss": -12.433115005493164, "global_step": 458591, "epoch": 2729} {"train_loss": -12.5248441696167, "global_step": 458592, "epoch": 2729} {"train_loss": -12.433135986328125, "global_step": 458593, "epoch": 2729} {"train_loss": -12.648771286010742, "global_step": 458594, "epoch": 2729} {"train_loss": -12.41508960723877, "global_step": 458595, "epoch": 2729} {"train_loss": -12.627338409423828, "global_step": 458596, "epoch": 2729} {"train_loss": -12.49968433380127, "global_step": 458597, "epoch": 2729} {"train_loss": -12.672670364379883, "global_step": 458598, "epoch": 2729} {"train_loss": -12.564835548400879, "global_step": 458599, "epoch": 2729} {"train_loss": -12.72526741027832, "global_step": 458600, "epoch": 2729} {"train_loss": -12.467456817626953, "global_step": 458601, "epoch": 2729} {"train_loss": -12.643245697021484, "global_step": 458602, "epoch": 2729} {"train_loss": -12.647897720336914, "global_step": 458603, "epoch": 2729} {"train_loss": -12.728256225585938, "global_step": 458604, "epoch": 2729} {"train_loss": -12.62434196472168, "global_step": 458605, "epoch": 2729} {"train_loss": -12.683019638061523, "global_step": 458606, "epoch": 2729} {"train_loss": -12.697189331054688, "global_step": 458607, "epoch": 2729} {"train_loss": -12.672229766845703, "global_step": 458608, "epoch": 2729} {"train_loss": -12.562782287597656, "global_step": 458609, "epoch": 2729} {"train_loss": -12.669147491455078, "global_step": 458610, "epoch": 2729} {"train_loss": -12.329010009765625, "global_step": 458611, "epoch": 2729} {"train_loss": -12.789019584655762, "global_step": 458612, "epoch": 2729} {"train_loss": -12.662857055664062, "global_step": 458613, "epoch": 2729} {"train_loss": -12.720012664794922, "global_step": 458614, "epoch": 2729} {"train_loss": -12.643939018249512, "global_step": 458615, "epoch": 2729} {"train_loss": -12.499479293823242, "global_step": 458616, "epoch": 2729} {"train_loss": -12.681657791137695, "global_step": 458617, "epoch": 2729} {"train_loss": -12.80830192565918, "global_step": 458618, "epoch": 2729} {"train_loss": -12.681038856506348, "global_step": 458619, "epoch": 2729} {"train_loss": -12.656737327575684, "global_step": 458620, "epoch": 2729} {"train_loss": -12.707776069641113, "global_step": 458621, "epoch": 2729} {"train_loss": -12.859582901000977, "global_step": 458622, "epoch": 2729} {"train_loss": -12.751382827758789, "global_step": 458623, "epoch": 2729} {"train_loss": -12.76717758178711, "global_step": 458624, "epoch": 2729} {"train_loss": -12.921561241149902, "global_step": 458625, "epoch": 2729} {"train_loss": -12.725672721862793, "global_step": 458626, "epoch": 2729} {"train_loss": -12.866296768188477, "global_step": 458627, "epoch": 2729} {"train_loss": -12.971158981323242, "global_step": 458628, "epoch": 2729} {"train_loss": -12.99709701538086, "global_step": 458629, "epoch": 2729} {"train_loss": -12.763023376464844, "global_step": 458630, "epoch": 2729} {"train_loss": -12.995193481445312, "global_step": 458631, "epoch": 2729} {"train_loss": -12.749114990234375, "global_step": 458632, "epoch": 2729} {"train_loss": -12.957114219665527, "global_step": 458633, "epoch": 2729} {"train_loss": -12.912323951721191, "global_step": 458634, "epoch": 2729} {"train_loss": -12.90323257446289, "global_step": 458635, "epoch": 2729} {"train_loss": -12.908334732055664, "global_step": 458636, "epoch": 2729} {"train_loss": -12.94256591796875, "global_step": 458637, "epoch": 2729} {"train_loss": -12.607177734375, "global_step": 458638, "epoch": 2729} {"train_loss": -11.858923775809151, "global_step": 458639, "epoch": 2729, "val_loss": 313085.3125} {"train_loss": -12.788888931274414, "global_step": 458640, "epoch": 2730} {"train_loss": -12.871912956237793, "global_step": 458641, "epoch": 2730} {"train_loss": -12.930034637451172, "global_step": 458642, "epoch": 2730} {"train_loss": -12.720001220703125, "global_step": 458643, "epoch": 2730} {"train_loss": -12.846724510192871, "global_step": 458644, "epoch": 2730} {"train_loss": -12.808990478515625, "global_step": 458645, "epoch": 2730} {"train_loss": -12.561477661132812, "global_step": 458646, "epoch": 2730} {"train_loss": -12.83077621459961, "global_step": 458647, "epoch": 2730} {"train_loss": -12.94778060913086, "global_step": 458648, "epoch": 2730} {"train_loss": -12.740522384643555, "global_step": 458649, "epoch": 2730} {"train_loss": -12.771368026733398, "global_step": 458650, "epoch": 2730} {"train_loss": -12.755962371826172, "global_step": 458651, "epoch": 2730} {"train_loss": -13.024835586547852, "global_step": 458652, "epoch": 2730} {"train_loss": -12.85550308227539, "global_step": 458653, "epoch": 2730} {"train_loss": -12.712250709533691, "global_step": 458654, "epoch": 2730} {"train_loss": -12.610356330871582, "global_step": 458655, "epoch": 2730} {"train_loss": -12.766013145446777, "global_step": 458656, "epoch": 2730} {"train_loss": -12.766393661499023, "global_step": 458657, "epoch": 2730} {"train_loss": -13.010602951049805, "global_step": 458658, "epoch": 2730} {"train_loss": -12.681623458862305, "global_step": 458659, "epoch": 2730} {"train_loss": -12.663328170776367, "global_step": 458660, "epoch": 2730} {"train_loss": -12.341243743896484, "global_step": 458661, "epoch": 2730} {"train_loss": -13.01705551147461, "global_step": 458662, "epoch": 2730} {"train_loss": -12.549565315246582, "global_step": 458663, "epoch": 2730} {"train_loss": -13.034978866577148, "global_step": 458664, "epoch": 2730} {"train_loss": -12.995927810668945, "global_step": 458665, "epoch": 2730} {"train_loss": -12.718822479248047, "global_step": 458666, "epoch": 2730} {"train_loss": -12.912824630737305, "global_step": 458667, "epoch": 2730} {"train_loss": -12.44160270690918, "global_step": 458668, "epoch": 2730} {"train_loss": -12.922042846679688, "global_step": 458669, "epoch": 2730} {"train_loss": -12.51734447479248, "global_step": 458670, "epoch": 2730} {"train_loss": -12.544578552246094, "global_step": 458671, "epoch": 2730} {"train_loss": -12.253816604614258, "global_step": 458672, "epoch": 2730} {"train_loss": -12.51583480834961, "global_step": 458673, "epoch": 2730} {"train_loss": -12.901927947998047, "global_step": 458674, "epoch": 2730} {"train_loss": -12.406295776367188, "global_step": 458675, "epoch": 2730} {"train_loss": -12.71356201171875, "global_step": 458676, "epoch": 2730} {"train_loss": -11.87059211730957, "global_step": 458677, "epoch": 2730} {"train_loss": -11.617369651794434, "global_step": 458678, "epoch": 2730} {"train_loss": -10.652149200439453, "global_step": 458679, "epoch": 2730} {"train_loss": -12.266914367675781, "global_step": 458680, "epoch": 2730} {"train_loss": -11.91907787322998, "global_step": 458681, "epoch": 2730} {"train_loss": -10.005578994750977, "global_step": 458682, "epoch": 2730} {"train_loss": -11.57414722442627, "global_step": 458683, "epoch": 2730} {"train_loss": -11.714797019958496, "global_step": 458684, "epoch": 2730} {"train_loss": -11.090316772460938, "global_step": 458685, "epoch": 2730} {"train_loss": -10.522356986999512, "global_step": 458686, "epoch": 2730} {"train_loss": -11.399900436401367, "global_step": 458687, "epoch": 2730} {"train_loss": -8.706279754638672, "global_step": 458688, "epoch": 2730} {"train_loss": -10.237527847290039, "global_step": 458689, "epoch": 2730} {"train_loss": -8.126605033874512, "global_step": 458690, "epoch": 2730} {"train_loss": -9.81462574005127, "global_step": 458691, "epoch": 2730} {"train_loss": -8.04098892211914, "global_step": 458692, "epoch": 2730} {"train_loss": -10.705353736877441, "global_step": 458693, "epoch": 2730} {"train_loss": -9.117552757263184, "global_step": 458694, "epoch": 2730} {"train_loss": -9.802192687988281, "global_step": 458695, "epoch": 2730} {"train_loss": -9.379100799560547, "global_step": 458696, "epoch": 2730} {"train_loss": -9.15712833404541, "global_step": 458697, "epoch": 2730} {"train_loss": -9.439817428588867, "global_step": 458698, "epoch": 2730} {"train_loss": -9.726847648620605, "global_step": 458699, "epoch": 2730} {"train_loss": -9.951114654541016, "global_step": 458700, "epoch": 2730} {"train_loss": -10.168399810791016, "global_step": 458701, "epoch": 2730} {"train_loss": -10.430703163146973, "global_step": 458702, "epoch": 2730} {"train_loss": -10.512487411499023, "global_step": 458703, "epoch": 2730} {"train_loss": -10.250139236450195, "global_step": 458704, "epoch": 2730} {"train_loss": -10.1494722366333, "global_step": 458705, "epoch": 2730} {"train_loss": -10.745288848876953, "global_step": 458706, "epoch": 2730} {"train_loss": -10.140369415283203, "global_step": 458707, "epoch": 2730} {"train_loss": -11.708916664123535, "global_step": 458708, "epoch": 2730} {"train_loss": -11.754806518554688, "global_step": 458709, "epoch": 2730} {"train_loss": -10.675455093383789, "global_step": 458710, "epoch": 2730} {"train_loss": -10.904723167419434, "global_step": 458711, "epoch": 2730} {"train_loss": -10.603858947753906, "global_step": 458712, "epoch": 2730} {"train_loss": -11.808956146240234, "global_step": 458713, "epoch": 2730} {"train_loss": -11.028438568115234, "global_step": 458714, "epoch": 2730} {"train_loss": -11.396480560302734, "global_step": 458715, "epoch": 2730} {"train_loss": -10.969429969787598, "global_step": 458716, "epoch": 2730} {"train_loss": -11.408647537231445, "global_step": 458717, "epoch": 2730} {"train_loss": -11.616413116455078, "global_step": 458718, "epoch": 2730} {"train_loss": -11.862366676330566, "global_step": 458719, "epoch": 2730} {"train_loss": -12.019388198852539, "global_step": 458720, "epoch": 2730} {"train_loss": -12.078855514526367, "global_step": 458721, "epoch": 2730} {"train_loss": -11.79452896118164, "global_step": 458722, "epoch": 2730} {"train_loss": -12.236830711364746, "global_step": 458723, "epoch": 2730} {"train_loss": -11.78310775756836, "global_step": 458724, "epoch": 2730} {"train_loss": -12.016904830932617, "global_step": 458725, "epoch": 2730} {"train_loss": -11.82186222076416, "global_step": 458726, "epoch": 2730} {"train_loss": -11.866752624511719, "global_step": 458727, "epoch": 2730} {"train_loss": -12.266103744506836, "global_step": 458728, "epoch": 2730} {"train_loss": -11.548505783081055, "global_step": 458729, "epoch": 2730} {"train_loss": -12.209188461303711, "global_step": 458730, "epoch": 2730} {"train_loss": -12.053525924682617, "global_step": 458731, "epoch": 2730} {"train_loss": -12.109091758728027, "global_step": 458732, "epoch": 2730} {"train_loss": -12.00722599029541, "global_step": 458733, "epoch": 2730} {"train_loss": -12.23111343383789, "global_step": 458734, "epoch": 2730} {"train_loss": -12.230049133300781, "global_step": 458735, "epoch": 2730} {"train_loss": -11.958866119384766, "global_step": 458736, "epoch": 2730} {"train_loss": -12.466676712036133, "global_step": 458737, "epoch": 2730} {"train_loss": -12.438047409057617, "global_step": 458738, "epoch": 2730} {"train_loss": -12.362630844116211, "global_step": 458739, "epoch": 2730} {"train_loss": -11.9708833694458, "global_step": 458740, "epoch": 2730} {"train_loss": -12.544017791748047, "global_step": 458741, "epoch": 2730} {"train_loss": -12.554094314575195, "global_step": 458742, "epoch": 2730} {"train_loss": -12.229164123535156, "global_step": 458743, "epoch": 2730} {"train_loss": -12.430420875549316, "global_step": 458744, "epoch": 2730} {"train_loss": -12.343116760253906, "global_step": 458745, "epoch": 2730} {"train_loss": -12.310521125793457, "global_step": 458746, "epoch": 2730} {"train_loss": -12.429755210876465, "global_step": 458747, "epoch": 2730} {"train_loss": -12.480074882507324, "global_step": 458748, "epoch": 2730} {"train_loss": -12.446379661560059, "global_step": 458749, "epoch": 2730} {"train_loss": -12.188270568847656, "global_step": 458750, "epoch": 2730} {"train_loss": -12.29659652709961, "global_step": 458751, "epoch": 2730} {"train_loss": -12.504721641540527, "global_step": 458752, "epoch": 2730} {"train_loss": -12.038285255432129, "global_step": 458753, "epoch": 2730} {"train_loss": -11.939659118652344, "global_step": 458754, "epoch": 2730} {"train_loss": -11.788202285766602, "global_step": 458755, "epoch": 2730} {"train_loss": -11.841756820678711, "global_step": 458756, "epoch": 2730} {"train_loss": -11.337482452392578, "global_step": 458757, "epoch": 2730} {"train_loss": -12.054526329040527, "global_step": 458758, "epoch": 2730} {"train_loss": -11.82503890991211, "global_step": 458759, "epoch": 2730} {"train_loss": -12.098921775817871, "global_step": 458760, "epoch": 2730} {"train_loss": -12.176655769348145, "global_step": 458761, "epoch": 2730} {"train_loss": -11.898881912231445, "global_step": 458762, "epoch": 2730} {"train_loss": -12.142691612243652, "global_step": 458763, "epoch": 2730} {"train_loss": -11.763228416442871, "global_step": 458764, "epoch": 2730} {"train_loss": -12.415209770202637, "global_step": 458765, "epoch": 2730} {"train_loss": -11.789566040039062, "global_step": 458766, "epoch": 2730} {"train_loss": -12.391637802124023, "global_step": 458767, "epoch": 2730} {"train_loss": -12.14599609375, "global_step": 458768, "epoch": 2730} {"train_loss": -12.070029258728027, "global_step": 458769, "epoch": 2730} {"train_loss": -11.595142364501953, "global_step": 458770, "epoch": 2730} {"train_loss": -11.682663917541504, "global_step": 458771, "epoch": 2730} {"train_loss": -12.059046745300293, "global_step": 458772, "epoch": 2730} {"train_loss": -11.298441886901855, "global_step": 458773, "epoch": 2730} {"train_loss": -11.900598526000977, "global_step": 458774, "epoch": 2730} {"train_loss": -11.311371803283691, "global_step": 458775, "epoch": 2730} {"train_loss": -11.789257049560547, "global_step": 458776, "epoch": 2730} {"train_loss": -12.083792686462402, "global_step": 458777, "epoch": 2730} {"train_loss": -11.584726333618164, "global_step": 458778, "epoch": 2730} {"train_loss": -12.764418601989746, "global_step": 458779, "epoch": 2730} {"train_loss": -11.143433570861816, "global_step": 458780, "epoch": 2730} {"train_loss": -12.50611686706543, "global_step": 458781, "epoch": 2730} {"train_loss": -11.445711135864258, "global_step": 458782, "epoch": 2730} {"train_loss": -12.277259826660156, "global_step": 458783, "epoch": 2730} {"train_loss": -11.804298400878906, "global_step": 458784, "epoch": 2730} {"train_loss": -11.494365692138672, "global_step": 458785, "epoch": 2730} {"train_loss": -12.39750862121582, "global_step": 458786, "epoch": 2730} {"train_loss": -12.02296257019043, "global_step": 458787, "epoch": 2730} {"train_loss": -11.950209617614746, "global_step": 458788, "epoch": 2730} {"train_loss": -11.92989730834961, "global_step": 458789, "epoch": 2730} {"train_loss": -12.176982879638672, "global_step": 458790, "epoch": 2730} {"train_loss": -12.272237777709961, "global_step": 458791, "epoch": 2730} {"train_loss": -11.70234489440918, "global_step": 458792, "epoch": 2730} {"train_loss": -12.076021194458008, "global_step": 458793, "epoch": 2730} {"train_loss": -12.223101615905762, "global_step": 458794, "epoch": 2730} {"train_loss": -11.845394134521484, "global_step": 458795, "epoch": 2730} {"train_loss": -12.099634170532227, "global_step": 458796, "epoch": 2730} {"train_loss": -12.084311485290527, "global_step": 458797, "epoch": 2730} {"train_loss": -12.231273651123047, "global_step": 458798, "epoch": 2730} {"train_loss": -12.437142372131348, "global_step": 458799, "epoch": 2730} {"train_loss": -12.171958923339844, "global_step": 458800, "epoch": 2730} {"train_loss": -12.368789672851562, "global_step": 458801, "epoch": 2730} {"train_loss": -12.414905548095703, "global_step": 458802, "epoch": 2730} {"train_loss": -12.460343360900879, "global_step": 458803, "epoch": 2730} {"train_loss": -12.150693893432617, "global_step": 458804, "epoch": 2730} {"train_loss": -12.273000717163086, "global_step": 458805, "epoch": 2730} {"train_loss": -12.440988540649414, "global_step": 458806, "epoch": 2730} {"train_loss": -11.8408332268397, "global_step": 458807, "epoch": 2730, "val_loss": 313882.34375, "train_action_mse_error": 1.8863173723220825} {"train_loss": -12.101058959960938, "global_step": 458808, "epoch": 2731} {"train_loss": -12.478195190429688, "global_step": 458809, "epoch": 2731} {"train_loss": -12.131065368652344, "global_step": 458810, "epoch": 2731} {"train_loss": -11.453781127929688, "global_step": 458811, "epoch": 2731} {"train_loss": -12.14579963684082, "global_step": 458812, "epoch": 2731} {"train_loss": -11.866012573242188, "global_step": 458813, "epoch": 2731} {"train_loss": -12.369209289550781, "global_step": 458814, "epoch": 2731} {"train_loss": -12.143869400024414, "global_step": 458815, "epoch": 2731} {"train_loss": -12.39448356628418, "global_step": 458816, "epoch": 2731} {"train_loss": -12.013426780700684, "global_step": 458817, "epoch": 2731} {"train_loss": -12.380216598510742, "global_step": 458818, "epoch": 2731} {"train_loss": -12.219504356384277, "global_step": 458819, "epoch": 2731} {"train_loss": -12.081369400024414, "global_step": 458820, "epoch": 2731} {"train_loss": -12.15670394897461, "global_step": 458821, "epoch": 2731} {"train_loss": -12.20096206665039, "global_step": 458822, "epoch": 2731} {"train_loss": -11.934163093566895, "global_step": 458823, "epoch": 2731} {"train_loss": -12.352989196777344, "global_step": 458824, "epoch": 2731} {"train_loss": -12.728796005249023, "global_step": 458825, "epoch": 2731} {"train_loss": -12.033049583435059, "global_step": 458826, "epoch": 2731} {"train_loss": -12.6730375289917, "global_step": 458827, "epoch": 2731} {"train_loss": -12.062997817993164, "global_step": 458828, "epoch": 2731} {"train_loss": -11.971932411193848, "global_step": 458829, "epoch": 2731} {"train_loss": -12.330551147460938, "global_step": 458830, "epoch": 2731} {"train_loss": -11.91469955444336, "global_step": 458831, "epoch": 2731} {"train_loss": -12.699657440185547, "global_step": 458832, "epoch": 2731} {"train_loss": -12.096189498901367, "global_step": 458833, "epoch": 2731} {"train_loss": -12.370234489440918, "global_step": 458834, "epoch": 2731} {"train_loss": -12.54661750793457, "global_step": 458835, "epoch": 2731} {"train_loss": -12.104175567626953, "global_step": 458836, "epoch": 2731} {"train_loss": -12.670663833618164, "global_step": 458837, "epoch": 2731} {"train_loss": -12.325218200683594, "global_step": 458838, "epoch": 2731} {"train_loss": -12.02577018737793, "global_step": 458839, "epoch": 2731} {"train_loss": -12.405203819274902, "global_step": 458840, "epoch": 2731} {"train_loss": -12.478668212890625, "global_step": 458841, "epoch": 2731} {"train_loss": -12.400541305541992, "global_step": 458842, "epoch": 2731} {"train_loss": -12.354835510253906, "global_step": 458843, "epoch": 2731} {"train_loss": -12.351783752441406, "global_step": 458844, "epoch": 2731} {"train_loss": -12.678811073303223, "global_step": 458845, "epoch": 2731} {"train_loss": -12.360820770263672, "global_step": 458846, "epoch": 2731} {"train_loss": -12.439811706542969, "global_step": 458847, "epoch": 2731} {"train_loss": -12.36859130859375, "global_step": 458848, "epoch": 2731} {"train_loss": -12.601984977722168, "global_step": 458849, "epoch": 2731} {"train_loss": -12.5495023727417, "global_step": 458850, "epoch": 2731} {"train_loss": -12.688065528869629, "global_step": 458851, "epoch": 2731} {"train_loss": -12.18437671661377, "global_step": 458852, "epoch": 2731} {"train_loss": -12.833221435546875, "global_step": 458853, "epoch": 2731} {"train_loss": -12.771528244018555, "global_step": 458854, "epoch": 2731} {"train_loss": -12.646371841430664, "global_step": 458855, "epoch": 2731} {"train_loss": -12.956003189086914, "global_step": 458856, "epoch": 2731} {"train_loss": -12.806356430053711, "global_step": 458857, "epoch": 2731} {"train_loss": -12.52052116394043, "global_step": 458858, "epoch": 2731} {"train_loss": -12.631303787231445, "global_step": 458859, "epoch": 2731} {"train_loss": -12.531597137451172, "global_step": 458860, "epoch": 2731} {"train_loss": -12.350208282470703, "global_step": 458861, "epoch": 2731} {"train_loss": -12.41459846496582, "global_step": 458862, "epoch": 2731} {"train_loss": -12.44823169708252, "global_step": 458863, "epoch": 2731} {"train_loss": -12.292067527770996, "global_step": 458864, "epoch": 2731} {"train_loss": -12.893574714660645, "global_step": 458865, "epoch": 2731} {"train_loss": -12.560615539550781, "global_step": 458866, "epoch": 2731} {"train_loss": -12.22075366973877, "global_step": 458867, "epoch": 2731} {"train_loss": -12.76600170135498, "global_step": 458868, "epoch": 2731} {"train_loss": -12.279059410095215, "global_step": 458869, "epoch": 2731} {"train_loss": -12.363216400146484, "global_step": 458870, "epoch": 2731} {"train_loss": -12.537911415100098, "global_step": 458871, "epoch": 2731} {"train_loss": -12.14719009399414, "global_step": 458872, "epoch": 2731} {"train_loss": -12.454421043395996, "global_step": 458873, "epoch": 2731} {"train_loss": -12.823009490966797, "global_step": 458874, "epoch": 2731} {"train_loss": -12.556561470031738, "global_step": 458875, "epoch": 2731} {"train_loss": -12.47341537475586, "global_step": 458876, "epoch": 2731} {"train_loss": -12.676957130432129, "global_step": 458877, "epoch": 2731} {"train_loss": -12.496054649353027, "global_step": 458878, "epoch": 2731} {"train_loss": -12.647880554199219, "global_step": 458879, "epoch": 2731} {"train_loss": -12.545431137084961, "global_step": 458880, "epoch": 2731} {"train_loss": -12.313191413879395, "global_step": 458881, "epoch": 2731} {"train_loss": -12.718914985656738, "global_step": 458882, "epoch": 2731} {"train_loss": -12.544452667236328, "global_step": 458883, "epoch": 2731} {"train_loss": -12.623544692993164, "global_step": 458884, "epoch": 2731} {"train_loss": -12.70534896850586, "global_step": 458885, "epoch": 2731} {"train_loss": -12.594401359558105, "global_step": 458886, "epoch": 2731} {"train_loss": -12.674251556396484, "global_step": 458887, "epoch": 2731} {"train_loss": -12.741597175598145, "global_step": 458888, "epoch": 2731} {"train_loss": -12.585800170898438, "global_step": 458889, "epoch": 2731} {"train_loss": -12.867517471313477, "global_step": 458890, "epoch": 2731} {"train_loss": -12.51259994506836, "global_step": 458891, "epoch": 2731} {"train_loss": -12.727893829345703, "global_step": 458892, "epoch": 2731} {"train_loss": -12.702763557434082, "global_step": 458893, "epoch": 2731} {"train_loss": -12.5232572555542, "global_step": 458894, "epoch": 2731} {"train_loss": -12.425336837768555, "global_step": 458895, "epoch": 2731} {"train_loss": -12.543777465820312, "global_step": 458896, "epoch": 2731} {"train_loss": -13.011663436889648, "global_step": 458897, "epoch": 2731} {"train_loss": -12.602351188659668, "global_step": 458898, "epoch": 2731} {"train_loss": -13.028812408447266, "global_step": 458899, "epoch": 2731} {"train_loss": -12.802591323852539, "global_step": 458900, "epoch": 2731} {"train_loss": -12.872225761413574, "global_step": 458901, "epoch": 2731} {"train_loss": -12.780150413513184, "global_step": 458902, "epoch": 2731} {"train_loss": -12.930044174194336, "global_step": 458903, "epoch": 2731} {"train_loss": -12.566177368164062, "global_step": 458904, "epoch": 2731} {"train_loss": -12.627195358276367, "global_step": 458905, "epoch": 2731} {"train_loss": -12.66585922241211, "global_step": 458906, "epoch": 2731} {"train_loss": -12.430292129516602, "global_step": 458907, "epoch": 2731} {"train_loss": -12.030088424682617, "global_step": 458908, "epoch": 2731} {"train_loss": -12.611320495605469, "global_step": 458909, "epoch": 2731} {"train_loss": -12.346956253051758, "global_step": 458910, "epoch": 2731} {"train_loss": -13.057809829711914, "global_step": 458911, "epoch": 2731} {"train_loss": -11.778328895568848, "global_step": 458912, "epoch": 2731} {"train_loss": -11.298652648925781, "global_step": 458913, "epoch": 2731} {"train_loss": -11.92714786529541, "global_step": 458914, "epoch": 2731} {"train_loss": -11.711980819702148, "global_step": 458915, "epoch": 2731} {"train_loss": -8.496725082397461, "global_step": 458916, "epoch": 2731} {"train_loss": -9.7594633102417, "global_step": 458917, "epoch": 2731} {"train_loss": -9.010536193847656, "global_step": 458918, "epoch": 2731} {"train_loss": -9.549077033996582, "global_step": 458919, "epoch": 2731} {"train_loss": -11.511795043945312, "global_step": 458920, "epoch": 2731} {"train_loss": -8.94472599029541, "global_step": 458921, "epoch": 2731} {"train_loss": -9.011463165283203, "global_step": 458922, "epoch": 2731} {"train_loss": -10.320146560668945, "global_step": 458923, "epoch": 2731} {"train_loss": -10.803977966308594, "global_step": 458924, "epoch": 2731} {"train_loss": -9.097193717956543, "global_step": 458925, "epoch": 2731} {"train_loss": -11.061612129211426, "global_step": 458926, "epoch": 2731} {"train_loss": -11.06794548034668, "global_step": 458927, "epoch": 2731} {"train_loss": -9.955684661865234, "global_step": 458928, "epoch": 2731} {"train_loss": -9.656089782714844, "global_step": 458929, "epoch": 2731} {"train_loss": -11.469259262084961, "global_step": 458930, "epoch": 2731} {"train_loss": -10.746504783630371, "global_step": 458931, "epoch": 2731} {"train_loss": -11.201327323913574, "global_step": 458932, "epoch": 2731} {"train_loss": -11.4664306640625, "global_step": 458933, "epoch": 2731} {"train_loss": -11.423171997070312, "global_step": 458934, "epoch": 2731} {"train_loss": -11.299999237060547, "global_step": 458935, "epoch": 2731} {"train_loss": -12.111202239990234, "global_step": 458936, "epoch": 2731} {"train_loss": -10.639307022094727, "global_step": 458937, "epoch": 2731} {"train_loss": -11.676826477050781, "global_step": 458938, "epoch": 2731} {"train_loss": -11.219525337219238, "global_step": 458939, "epoch": 2731} {"train_loss": -11.312705993652344, "global_step": 458940, "epoch": 2731} {"train_loss": -11.339059829711914, "global_step": 458941, "epoch": 2731} {"train_loss": -11.249781608581543, "global_step": 458942, "epoch": 2731} {"train_loss": -11.133872985839844, "global_step": 458943, "epoch": 2731} {"train_loss": -11.970776557922363, "global_step": 458944, "epoch": 2731} {"train_loss": -10.875226974487305, "global_step": 458945, "epoch": 2731} {"train_loss": -11.987746238708496, "global_step": 458946, "epoch": 2731} {"train_loss": -12.106955528259277, "global_step": 458947, "epoch": 2731} {"train_loss": -11.759960174560547, "global_step": 458948, "epoch": 2731} {"train_loss": -12.080787658691406, "global_step": 458949, "epoch": 2731} {"train_loss": -12.019989967346191, "global_step": 458950, "epoch": 2731} {"train_loss": -11.911961555480957, "global_step": 458951, "epoch": 2731} {"train_loss": -11.660622596740723, "global_step": 458952, "epoch": 2731} {"train_loss": -11.65682601928711, "global_step": 458953, "epoch": 2731} {"train_loss": -12.03913688659668, "global_step": 458954, "epoch": 2731} {"train_loss": -11.733195304870605, "global_step": 458955, "epoch": 2731} {"train_loss": -11.965600967407227, "global_step": 458956, "epoch": 2731} {"train_loss": -12.29682731628418, "global_step": 458957, "epoch": 2731} {"train_loss": -11.796425819396973, "global_step": 458958, "epoch": 2731} {"train_loss": -12.22647762298584, "global_step": 458959, "epoch": 2731} {"train_loss": -12.485357284545898, "global_step": 458960, "epoch": 2731} {"train_loss": -12.31617259979248, "global_step": 458961, "epoch": 2731} {"train_loss": -12.438848495483398, "global_step": 458962, "epoch": 2731} {"train_loss": -12.070537567138672, "global_step": 458963, "epoch": 2731} {"train_loss": -12.532355308532715, "global_step": 458964, "epoch": 2731} {"train_loss": -12.085742950439453, "global_step": 458965, "epoch": 2731} {"train_loss": -12.328524589538574, "global_step": 458966, "epoch": 2731} {"train_loss": -12.423460006713867, "global_step": 458967, "epoch": 2731} {"train_loss": -12.06860637664795, "global_step": 458968, "epoch": 2731} {"train_loss": -12.587762832641602, "global_step": 458969, "epoch": 2731} {"train_loss": -12.162759780883789, "global_step": 458970, "epoch": 2731} {"train_loss": -12.481058120727539, "global_step": 458971, "epoch": 2731} {"train_loss": -12.420979499816895, "global_step": 458972, "epoch": 2731} {"train_loss": -12.473745346069336, "global_step": 458973, "epoch": 2731} {"train_loss": -12.506510734558105, "global_step": 458974, "epoch": 2731} {"train_loss": -12.070097378322057, "global_step": 458975, "epoch": 2731, "val_loss": 313765.21875} {"train_loss": -12.288875579833984, "global_step": 458976, "epoch": 2732} {"train_loss": -12.235568046569824, "global_step": 458977, "epoch": 2732} {"train_loss": -11.962404251098633, "global_step": 458978, "epoch": 2732} {"train_loss": -12.343925476074219, "global_step": 458979, "epoch": 2732} {"train_loss": -12.241891860961914, "global_step": 458980, "epoch": 2732} {"train_loss": -12.098540306091309, "global_step": 458981, "epoch": 2732} {"train_loss": -12.501511573791504, "global_step": 458982, "epoch": 2732} {"train_loss": -12.23805046081543, "global_step": 458983, "epoch": 2732} {"train_loss": -12.454797744750977, "global_step": 458984, "epoch": 2732} {"train_loss": -12.392446517944336, "global_step": 458985, "epoch": 2732} {"train_loss": -12.194986343383789, "global_step": 458986, "epoch": 2732} {"train_loss": -12.574954986572266, "global_step": 458987, "epoch": 2732} {"train_loss": -12.286139488220215, "global_step": 458988, "epoch": 2732} {"train_loss": -11.653404235839844, "global_step": 458989, "epoch": 2732} {"train_loss": -12.581646919250488, "global_step": 458990, "epoch": 2732} {"train_loss": -12.04247760772705, "global_step": 458991, "epoch": 2732} {"train_loss": -12.312692642211914, "global_step": 458992, "epoch": 2732} {"train_loss": -12.237454414367676, "global_step": 458993, "epoch": 2732} {"train_loss": -12.406532287597656, "global_step": 458994, "epoch": 2732} {"train_loss": -12.202165603637695, "global_step": 458995, "epoch": 2732} {"train_loss": -11.81999397277832, "global_step": 458996, "epoch": 2732} {"train_loss": -12.141107559204102, "global_step": 458997, "epoch": 2732} {"train_loss": -11.6099853515625, "global_step": 458998, "epoch": 2732} {"train_loss": -11.622406959533691, "global_step": 458999, "epoch": 2732} {"train_loss": -12.446685791015625, "global_step": 459000, "epoch": 2732} {"train_loss": -11.711997032165527, "global_step": 459001, "epoch": 2732} {"train_loss": -11.947866439819336, "global_step": 459002, "epoch": 2732} {"train_loss": -11.62481689453125, "global_step": 459003, "epoch": 2732} {"train_loss": -11.759032249450684, "global_step": 459004, "epoch": 2732} {"train_loss": -12.273752212524414, "global_step": 459005, "epoch": 2732} {"train_loss": -11.931049346923828, "global_step": 459006, "epoch": 2732} {"train_loss": -12.274443626403809, "global_step": 459007, "epoch": 2732} {"train_loss": -12.03416633605957, "global_step": 459008, "epoch": 2732} {"train_loss": -12.287286758422852, "global_step": 459009, "epoch": 2732} {"train_loss": -12.188736915588379, "global_step": 459010, "epoch": 2732} {"train_loss": -12.124656677246094, "global_step": 459011, "epoch": 2732} {"train_loss": -12.057107925415039, "global_step": 459012, "epoch": 2732} {"train_loss": -12.001075744628906, "global_step": 459013, "epoch": 2732} {"train_loss": -12.253396987915039, "global_step": 459014, "epoch": 2732} {"train_loss": -12.105384826660156, "global_step": 459015, "epoch": 2732} {"train_loss": -11.971939086914062, "global_step": 459016, "epoch": 2732} {"train_loss": -12.22158432006836, "global_step": 459017, "epoch": 2732} {"train_loss": -12.155527114868164, "global_step": 459018, "epoch": 2732} {"train_loss": -12.53740119934082, "global_step": 459019, "epoch": 2732} {"train_loss": -12.351137161254883, "global_step": 459020, "epoch": 2732} {"train_loss": -12.355703353881836, "global_step": 459021, "epoch": 2732} {"train_loss": -11.361770629882812, "global_step": 459022, "epoch": 2732} {"train_loss": -12.043779373168945, "global_step": 459023, "epoch": 2732} {"train_loss": -11.682882308959961, "global_step": 459024, "epoch": 2732} {"train_loss": -11.461996078491211, "global_step": 459025, "epoch": 2732} {"train_loss": -12.422353744506836, "global_step": 459026, "epoch": 2732} {"train_loss": -11.279250144958496, "global_step": 459027, "epoch": 2732} {"train_loss": -12.381353378295898, "global_step": 459028, "epoch": 2732} {"train_loss": -11.970442771911621, "global_step": 459029, "epoch": 2732} {"train_loss": -11.315902709960938, "global_step": 459030, "epoch": 2732} {"train_loss": -11.97547721862793, "global_step": 459031, "epoch": 2732} {"train_loss": -11.918825149536133, "global_step": 459032, "epoch": 2732} {"train_loss": -11.897414207458496, "global_step": 459033, "epoch": 2732} {"train_loss": -12.25464153289795, "global_step": 459034, "epoch": 2732} {"train_loss": -11.683491706848145, "global_step": 459035, "epoch": 2732} {"train_loss": -12.34203815460205, "global_step": 459036, "epoch": 2732} {"train_loss": -12.317622184753418, "global_step": 459037, "epoch": 2732} {"train_loss": -11.952194213867188, "global_step": 459038, "epoch": 2732} {"train_loss": -12.072867393493652, "global_step": 459039, "epoch": 2732} {"train_loss": -12.061661720275879, "global_step": 459040, "epoch": 2732} {"train_loss": -12.415048599243164, "global_step": 459041, "epoch": 2732} {"train_loss": -12.514043807983398, "global_step": 459042, "epoch": 2732} {"train_loss": -12.435680389404297, "global_step": 459043, "epoch": 2732} {"train_loss": -12.5811767578125, "global_step": 459044, "epoch": 2732} {"train_loss": -12.396071434020996, "global_step": 459045, "epoch": 2732} {"train_loss": -12.328479766845703, "global_step": 459046, "epoch": 2732} {"train_loss": -12.435951232910156, "global_step": 459047, "epoch": 2732} {"train_loss": -12.5341157913208, "global_step": 459048, "epoch": 2732} {"train_loss": -12.332196235656738, "global_step": 459049, "epoch": 2732} {"train_loss": -12.555807113647461, "global_step": 459050, "epoch": 2732} {"train_loss": -12.185331344604492, "global_step": 459051, "epoch": 2732} {"train_loss": -12.593202590942383, "global_step": 459052, "epoch": 2732} {"train_loss": -12.549817085266113, "global_step": 459053, "epoch": 2732} {"train_loss": -12.35733413696289, "global_step": 459054, "epoch": 2732} {"train_loss": -12.48706340789795, "global_step": 459055, "epoch": 2732} {"train_loss": -12.329278945922852, "global_step": 459056, "epoch": 2732} {"train_loss": -12.600225448608398, "global_step": 459057, "epoch": 2732} {"train_loss": -12.597419738769531, "global_step": 459058, "epoch": 2732} {"train_loss": -12.230020523071289, "global_step": 459059, "epoch": 2732} {"train_loss": -12.712547302246094, "global_step": 459060, "epoch": 2732} {"train_loss": -12.485751152038574, "global_step": 459061, "epoch": 2732} {"train_loss": -12.538862228393555, "global_step": 459062, "epoch": 2732} {"train_loss": -12.591726303100586, "global_step": 459063, "epoch": 2732} {"train_loss": -12.004890441894531, "global_step": 459064, "epoch": 2732} {"train_loss": -12.081670761108398, "global_step": 459065, "epoch": 2732} {"train_loss": -11.957378387451172, "global_step": 459066, "epoch": 2732} {"train_loss": -12.456826210021973, "global_step": 459067, "epoch": 2732} {"train_loss": -12.387970924377441, "global_step": 459068, "epoch": 2732} {"train_loss": -12.277982711791992, "global_step": 459069, "epoch": 2732} {"train_loss": -12.454595565795898, "global_step": 459070, "epoch": 2732} {"train_loss": -12.164982795715332, "global_step": 459071, "epoch": 2732} {"train_loss": -11.786404609680176, "global_step": 459072, "epoch": 2732} {"train_loss": -12.44163703918457, "global_step": 459073, "epoch": 2732} {"train_loss": -12.172830581665039, "global_step": 459074, "epoch": 2732} {"train_loss": -12.490076065063477, "global_step": 459075, "epoch": 2732} {"train_loss": -12.503561973571777, "global_step": 459076, "epoch": 2732} {"train_loss": -12.123600959777832, "global_step": 459077, "epoch": 2732} {"train_loss": -12.333858489990234, "global_step": 459078, "epoch": 2732} {"train_loss": -12.527132034301758, "global_step": 459079, "epoch": 2732} {"train_loss": -12.413642883300781, "global_step": 459080, "epoch": 2732} {"train_loss": -12.680466651916504, "global_step": 459081, "epoch": 2732} {"train_loss": -12.219230651855469, "global_step": 459082, "epoch": 2732} {"train_loss": -12.635641098022461, "global_step": 459083, "epoch": 2732} {"train_loss": -12.329245567321777, "global_step": 459084, "epoch": 2732} {"train_loss": -12.516051292419434, "global_step": 459085, "epoch": 2732} {"train_loss": -12.378599166870117, "global_step": 459086, "epoch": 2732} {"train_loss": -12.442808151245117, "global_step": 459087, "epoch": 2732} {"train_loss": -12.333830833435059, "global_step": 459088, "epoch": 2732} {"train_loss": -12.399657249450684, "global_step": 459089, "epoch": 2732} {"train_loss": -12.244099617004395, "global_step": 459090, "epoch": 2732} {"train_loss": -12.487563133239746, "global_step": 459091, "epoch": 2732} {"train_loss": -12.390819549560547, "global_step": 459092, "epoch": 2732} {"train_loss": -12.06236457824707, "global_step": 459093, "epoch": 2732} {"train_loss": -12.192792892456055, "global_step": 459094, "epoch": 2732} {"train_loss": -12.27291488647461, "global_step": 459095, "epoch": 2732} {"train_loss": -12.172812461853027, "global_step": 459096, "epoch": 2732} {"train_loss": -12.371705055236816, "global_step": 459097, "epoch": 2732} {"train_loss": -12.144020080566406, "global_step": 459098, "epoch": 2732} {"train_loss": -12.40645980834961, "global_step": 459099, "epoch": 2732} {"train_loss": -12.494745254516602, "global_step": 459100, "epoch": 2732} {"train_loss": -12.1376953125, "global_step": 459101, "epoch": 2732} {"train_loss": -12.416682243347168, "global_step": 459102, "epoch": 2732} {"train_loss": -12.523470878601074, "global_step": 459103, "epoch": 2732} {"train_loss": -12.44573974609375, "global_step": 459104, "epoch": 2732} {"train_loss": -12.487903594970703, "global_step": 459105, "epoch": 2732} {"train_loss": -12.71881103515625, "global_step": 459106, "epoch": 2732} {"train_loss": -12.683350563049316, "global_step": 459107, "epoch": 2732} {"train_loss": -12.626688957214355, "global_step": 459108, "epoch": 2732} {"train_loss": -12.677746772766113, "global_step": 459109, "epoch": 2732} {"train_loss": -12.792166709899902, "global_step": 459110, "epoch": 2732} {"train_loss": -12.582435607910156, "global_step": 459111, "epoch": 2732} {"train_loss": -12.818349838256836, "global_step": 459112, "epoch": 2732} {"train_loss": -12.558135986328125, "global_step": 459113, "epoch": 2732} {"train_loss": -12.555248260498047, "global_step": 459114, "epoch": 2732} {"train_loss": -12.608121871948242, "global_step": 459115, "epoch": 2732} {"train_loss": -12.717262268066406, "global_step": 459116, "epoch": 2732} {"train_loss": -12.714381217956543, "global_step": 459117, "epoch": 2732} {"train_loss": -12.637173652648926, "global_step": 459118, "epoch": 2732} {"train_loss": -12.645936965942383, "global_step": 459119, "epoch": 2732} {"train_loss": -13.024027824401855, "global_step": 459120, "epoch": 2732} {"train_loss": -12.862092971801758, "global_step": 459121, "epoch": 2732} {"train_loss": -12.805706024169922, "global_step": 459122, "epoch": 2732} {"train_loss": -12.826109886169434, "global_step": 459123, "epoch": 2732} {"train_loss": -12.795074462890625, "global_step": 459124, "epoch": 2732} {"train_loss": -12.64436149597168, "global_step": 459125, "epoch": 2732} {"train_loss": -12.62801456451416, "global_step": 459126, "epoch": 2732} {"train_loss": -12.799015045166016, "global_step": 459127, "epoch": 2732} {"train_loss": -12.705918312072754, "global_step": 459128, "epoch": 2732} {"train_loss": -12.20926284790039, "global_step": 459129, "epoch": 2732} {"train_loss": -12.589834213256836, "global_step": 459130, "epoch": 2732} {"train_loss": -12.635129928588867, "global_step": 459131, "epoch": 2732} {"train_loss": -12.057428359985352, "global_step": 459132, "epoch": 2732} {"train_loss": -12.37509536743164, "global_step": 459133, "epoch": 2732} {"train_loss": -12.408803939819336, "global_step": 459134, "epoch": 2732} {"train_loss": -12.216144561767578, "global_step": 459135, "epoch": 2732} {"train_loss": -12.075764656066895, "global_step": 459136, "epoch": 2732} {"train_loss": -12.590591430664062, "global_step": 459137, "epoch": 2732} {"train_loss": -11.306150436401367, "global_step": 459138, "epoch": 2732} {"train_loss": -12.355578422546387, "global_step": 459139, "epoch": 2732} {"train_loss": -12.562418937683105, "global_step": 459140, "epoch": 2732} {"train_loss": -11.772098541259766, "global_step": 459141, "epoch": 2732} {"train_loss": -12.243677139282227, "global_step": 459142, "epoch": 2732} {"train_loss": -12.29970515909649, "global_step": 459143, "epoch": 2732, "val_loss": 314763.0625} {"train_loss": -11.324616432189941, "global_step": 459144, "epoch": 2733} {"train_loss": -11.83980941772461, "global_step": 459145, "epoch": 2733} {"train_loss": -12.064798355102539, "global_step": 459146, "epoch": 2733} {"train_loss": -10.979575157165527, "global_step": 459147, "epoch": 2733} {"train_loss": -11.791635513305664, "global_step": 459148, "epoch": 2733} {"train_loss": -11.533060073852539, "global_step": 459149, "epoch": 2733} {"train_loss": -10.977827072143555, "global_step": 459150, "epoch": 2733} {"train_loss": -10.642433166503906, "global_step": 459151, "epoch": 2733} {"train_loss": -11.480853080749512, "global_step": 459152, "epoch": 2733} {"train_loss": -11.152383804321289, "global_step": 459153, "epoch": 2733} {"train_loss": -12.01075553894043, "global_step": 459154, "epoch": 2733} {"train_loss": -11.326286315917969, "global_step": 459155, "epoch": 2733} {"train_loss": -11.773221969604492, "global_step": 459156, "epoch": 2733} {"train_loss": -11.505281448364258, "global_step": 459157, "epoch": 2733} {"train_loss": -11.739021301269531, "global_step": 459158, "epoch": 2733} {"train_loss": -12.05524730682373, "global_step": 459159, "epoch": 2733} {"train_loss": -12.328230857849121, "global_step": 459160, "epoch": 2733} {"train_loss": -11.550424575805664, "global_step": 459161, "epoch": 2733} {"train_loss": -12.741479873657227, "global_step": 459162, "epoch": 2733} {"train_loss": -12.024588584899902, "global_step": 459163, "epoch": 2733} {"train_loss": -12.070333480834961, "global_step": 459164, "epoch": 2733} {"train_loss": -12.404716491699219, "global_step": 459165, "epoch": 2733} {"train_loss": -11.401619911193848, "global_step": 459166, "epoch": 2733} {"train_loss": -11.845529556274414, "global_step": 459167, "epoch": 2733} {"train_loss": -12.286246299743652, "global_step": 459168, "epoch": 2733} {"train_loss": -12.261981964111328, "global_step": 459169, "epoch": 2733} {"train_loss": -12.36739444732666, "global_step": 459170, "epoch": 2733} {"train_loss": -12.411665916442871, "global_step": 459171, "epoch": 2733} {"train_loss": -12.284382820129395, "global_step": 459172, "epoch": 2733} {"train_loss": -12.090749740600586, "global_step": 459173, "epoch": 2733} {"train_loss": -12.2909574508667, "global_step": 459174, "epoch": 2733} {"train_loss": -12.421257019042969, "global_step": 459175, "epoch": 2733} {"train_loss": -12.514392852783203, "global_step": 459176, "epoch": 2733} {"train_loss": -11.699277877807617, "global_step": 459177, "epoch": 2733} {"train_loss": -12.543964385986328, "global_step": 459178, "epoch": 2733} {"train_loss": -11.587844848632812, "global_step": 459179, "epoch": 2733} {"train_loss": -12.511966705322266, "global_step": 459180, "epoch": 2733} {"train_loss": -11.402275085449219, "global_step": 459181, "epoch": 2733} {"train_loss": -11.686630249023438, "global_step": 459182, "epoch": 2733} {"train_loss": -11.856653213500977, "global_step": 459183, "epoch": 2733} {"train_loss": -11.836009979248047, "global_step": 459184, "epoch": 2733} {"train_loss": -11.173561096191406, "global_step": 459185, "epoch": 2733} {"train_loss": -12.637649536132812, "global_step": 459186, "epoch": 2733} {"train_loss": -11.080368995666504, "global_step": 459187, "epoch": 2733} {"train_loss": -12.5562744140625, "global_step": 459188, "epoch": 2733} {"train_loss": -10.498376846313477, "global_step": 459189, "epoch": 2733} {"train_loss": -12.557819366455078, "global_step": 459190, "epoch": 2733} {"train_loss": -11.82778549194336, "global_step": 459191, "epoch": 2733} {"train_loss": -11.767532348632812, "global_step": 459192, "epoch": 2733} {"train_loss": -12.676239013671875, "global_step": 459193, "epoch": 2733} {"train_loss": -11.625398635864258, "global_step": 459194, "epoch": 2733} {"train_loss": -12.543328285217285, "global_step": 459195, "epoch": 2733} {"train_loss": -11.798867225646973, "global_step": 459196, "epoch": 2733} {"train_loss": -11.725626945495605, "global_step": 459197, "epoch": 2733} {"train_loss": -12.04615306854248, "global_step": 459198, "epoch": 2733} {"train_loss": -11.83795166015625, "global_step": 459199, "epoch": 2733} {"train_loss": -12.57853889465332, "global_step": 459200, "epoch": 2733} {"train_loss": -11.608427047729492, "global_step": 459201, "epoch": 2733} {"train_loss": -12.423446655273438, "global_step": 459202, "epoch": 2733} {"train_loss": -12.194311141967773, "global_step": 459203, "epoch": 2733} {"train_loss": -12.441299438476562, "global_step": 459204, "epoch": 2733} {"train_loss": -12.213470458984375, "global_step": 459205, "epoch": 2733} {"train_loss": -12.159761428833008, "global_step": 459206, "epoch": 2733} {"train_loss": -12.648287773132324, "global_step": 459207, "epoch": 2733} {"train_loss": -12.266738891601562, "global_step": 459208, "epoch": 2733} {"train_loss": -12.590660095214844, "global_step": 459209, "epoch": 2733} {"train_loss": -12.402999877929688, "global_step": 459210, "epoch": 2733} {"train_loss": -12.39159870147705, "global_step": 459211, "epoch": 2733} {"train_loss": -12.605001449584961, "global_step": 459212, "epoch": 2733} {"train_loss": -12.482810020446777, "global_step": 459213, "epoch": 2733} {"train_loss": -12.744426727294922, "global_step": 459214, "epoch": 2733} {"train_loss": -12.406805992126465, "global_step": 459215, "epoch": 2733} {"train_loss": -11.917745590209961, "global_step": 459216, "epoch": 2733} {"train_loss": -12.617262840270996, "global_step": 459217, "epoch": 2733} {"train_loss": -11.623846054077148, "global_step": 459218, "epoch": 2733} {"train_loss": -12.488933563232422, "global_step": 459219, "epoch": 2733} {"train_loss": -11.94404411315918, "global_step": 459220, "epoch": 2733} {"train_loss": -12.04508113861084, "global_step": 459221, "epoch": 2733} {"train_loss": -12.449507713317871, "global_step": 459222, "epoch": 2733} {"train_loss": -11.737372398376465, "global_step": 459223, "epoch": 2733} {"train_loss": -12.546358108520508, "global_step": 459224, "epoch": 2733} {"train_loss": -12.011200904846191, "global_step": 459225, "epoch": 2733} {"train_loss": -12.381129264831543, "global_step": 459226, "epoch": 2733} {"train_loss": -12.548866271972656, "global_step": 459227, "epoch": 2733} {"train_loss": -12.372669219970703, "global_step": 459228, "epoch": 2733} {"train_loss": -12.728548049926758, "global_step": 459229, "epoch": 2733} {"train_loss": -12.575791358947754, "global_step": 459230, "epoch": 2733} {"train_loss": -12.423983573913574, "global_step": 459231, "epoch": 2733} {"train_loss": -12.356221199035645, "global_step": 459232, "epoch": 2733} {"train_loss": -12.405620574951172, "global_step": 459233, "epoch": 2733} {"train_loss": -12.502256393432617, "global_step": 459234, "epoch": 2733} {"train_loss": -12.761397361755371, "global_step": 459235, "epoch": 2733} {"train_loss": -12.744492530822754, "global_step": 459236, "epoch": 2733} {"train_loss": -12.547029495239258, "global_step": 459237, "epoch": 2733} {"train_loss": -12.686712265014648, "global_step": 459238, "epoch": 2733} {"train_loss": -12.167121887207031, "global_step": 459239, "epoch": 2733} {"train_loss": -12.390504837036133, "global_step": 459240, "epoch": 2733} {"train_loss": -12.176166534423828, "global_step": 459241, "epoch": 2733} {"train_loss": -12.233026504516602, "global_step": 459242, "epoch": 2733} {"train_loss": -12.32522201538086, "global_step": 459243, "epoch": 2733} {"train_loss": -11.643993377685547, "global_step": 459244, "epoch": 2733} {"train_loss": -12.582305908203125, "global_step": 459245, "epoch": 2733} {"train_loss": -12.056071281433105, "global_step": 459246, "epoch": 2733} {"train_loss": -12.117077827453613, "global_step": 459247, "epoch": 2733} {"train_loss": -11.973653793334961, "global_step": 459248, "epoch": 2733} {"train_loss": -12.193849563598633, "global_step": 459249, "epoch": 2733} {"train_loss": -12.594411849975586, "global_step": 459250, "epoch": 2733} {"train_loss": -12.07982349395752, "global_step": 459251, "epoch": 2733} {"train_loss": -12.24448013305664, "global_step": 459252, "epoch": 2733} {"train_loss": -12.787151336669922, "global_step": 459253, "epoch": 2733} {"train_loss": -12.340190887451172, "global_step": 459254, "epoch": 2733} {"train_loss": -12.302486419677734, "global_step": 459255, "epoch": 2733} {"train_loss": -12.576135635375977, "global_step": 459256, "epoch": 2733} {"train_loss": -12.149221420288086, "global_step": 459257, "epoch": 2733} {"train_loss": -12.32204818725586, "global_step": 459258, "epoch": 2733} {"train_loss": -12.121919631958008, "global_step": 459259, "epoch": 2733} {"train_loss": -12.374475479125977, "global_step": 459260, "epoch": 2733} {"train_loss": -12.271438598632812, "global_step": 459261, "epoch": 2733} {"train_loss": -12.736015319824219, "global_step": 459262, "epoch": 2733} {"train_loss": -12.220893859863281, "global_step": 459263, "epoch": 2733} {"train_loss": -12.331367492675781, "global_step": 459264, "epoch": 2733} {"train_loss": -12.459423065185547, "global_step": 459265, "epoch": 2733} {"train_loss": -12.317657470703125, "global_step": 459266, "epoch": 2733} {"train_loss": -12.18034839630127, "global_step": 459267, "epoch": 2733} {"train_loss": -12.658748626708984, "global_step": 459268, "epoch": 2733} {"train_loss": -12.63199520111084, "global_step": 459269, "epoch": 2733} {"train_loss": -12.61083984375, "global_step": 459270, "epoch": 2733} {"train_loss": -12.480791091918945, "global_step": 459271, "epoch": 2733} {"train_loss": -12.436285018920898, "global_step": 459272, "epoch": 2733} {"train_loss": -11.867502212524414, "global_step": 459273, "epoch": 2733} {"train_loss": -12.68577766418457, "global_step": 459274, "epoch": 2733} {"train_loss": -12.639455795288086, "global_step": 459275, "epoch": 2733} {"train_loss": -12.556986808776855, "global_step": 459276, "epoch": 2733} {"train_loss": -12.082785606384277, "global_step": 459277, "epoch": 2733} {"train_loss": -12.610076904296875, "global_step": 459278, "epoch": 2733} {"train_loss": -12.001968383789062, "global_step": 459279, "epoch": 2733} {"train_loss": -12.2861909866333, "global_step": 459280, "epoch": 2733} {"train_loss": -12.320104598999023, "global_step": 459281, "epoch": 2733} {"train_loss": -12.403322219848633, "global_step": 459282, "epoch": 2733} {"train_loss": -12.160706520080566, "global_step": 459283, "epoch": 2733} {"train_loss": -12.729696273803711, "global_step": 459284, "epoch": 2733} {"train_loss": -11.864053726196289, "global_step": 459285, "epoch": 2733} {"train_loss": -12.48974609375, "global_step": 459286, "epoch": 2733} {"train_loss": -12.63521957397461, "global_step": 459287, "epoch": 2733} {"train_loss": -12.598058700561523, "global_step": 459288, "epoch": 2733} {"train_loss": -12.479694366455078, "global_step": 459289, "epoch": 2733} {"train_loss": -12.483999252319336, "global_step": 459290, "epoch": 2733} {"train_loss": -12.260417938232422, "global_step": 459291, "epoch": 2733} {"train_loss": -12.725414276123047, "global_step": 459292, "epoch": 2733} {"train_loss": -12.468917846679688, "global_step": 459293, "epoch": 2733} {"train_loss": -12.676411628723145, "global_step": 459294, "epoch": 2733} {"train_loss": -12.321508407592773, "global_step": 459295, "epoch": 2733} {"train_loss": -12.545654296875, "global_step": 459296, "epoch": 2733} {"train_loss": -12.721407890319824, "global_step": 459297, "epoch": 2733} {"train_loss": -12.73342514038086, "global_step": 459298, "epoch": 2733} {"train_loss": -12.619185447692871, "global_step": 459299, "epoch": 2733} {"train_loss": -12.379777908325195, "global_step": 459300, "epoch": 2733} {"train_loss": -12.085912704467773, "global_step": 459301, "epoch": 2733} {"train_loss": -12.241496086120605, "global_step": 459302, "epoch": 2733} {"train_loss": -12.69807243347168, "global_step": 459303, "epoch": 2733} {"train_loss": -11.524298667907715, "global_step": 459304, "epoch": 2733} {"train_loss": -12.37475299835205, "global_step": 459305, "epoch": 2733} {"train_loss": -12.25092887878418, "global_step": 459306, "epoch": 2733} {"train_loss": -12.738733291625977, "global_step": 459307, "epoch": 2733} {"train_loss": -12.492623329162598, "global_step": 459308, "epoch": 2733} {"train_loss": -12.319375991821289, "global_step": 459309, "epoch": 2733} {"train_loss": -12.350236892700195, "global_step": 459310, "epoch": 2733} {"train_loss": -12.204331040382385, "global_step": 459311, "epoch": 2733, "val_loss": 313114.875} {"train_loss": -12.028731346130371, "global_step": 459312, "epoch": 2734} {"train_loss": -12.347509384155273, "global_step": 459313, "epoch": 2734} {"train_loss": -12.40178108215332, "global_step": 459314, "epoch": 2734} {"train_loss": -11.819742202758789, "global_step": 459315, "epoch": 2734} {"train_loss": -12.366317749023438, "global_step": 459316, "epoch": 2734} {"train_loss": -12.243352890014648, "global_step": 459317, "epoch": 2734} {"train_loss": -12.07181167602539, "global_step": 459318, "epoch": 2734} {"train_loss": -12.537900924682617, "global_step": 459319, "epoch": 2734} {"train_loss": -12.410650253295898, "global_step": 459320, "epoch": 2734} {"train_loss": -12.28587532043457, "global_step": 459321, "epoch": 2734} {"train_loss": -12.153875350952148, "global_step": 459322, "epoch": 2734} {"train_loss": -12.512613296508789, "global_step": 459323, "epoch": 2734} {"train_loss": -12.168696403503418, "global_step": 459324, "epoch": 2734} {"train_loss": -12.226024627685547, "global_step": 459325, "epoch": 2734} {"train_loss": -12.240676879882812, "global_step": 459326, "epoch": 2734} {"train_loss": -11.719350814819336, "global_step": 459327, "epoch": 2734} {"train_loss": -11.347980499267578, "global_step": 459328, "epoch": 2734} {"train_loss": -12.48379898071289, "global_step": 459329, "epoch": 2734} {"train_loss": -12.333189964294434, "global_step": 459330, "epoch": 2734} {"train_loss": -11.374282836914062, "global_step": 459331, "epoch": 2734} {"train_loss": -11.92689037322998, "global_step": 459332, "epoch": 2734} {"train_loss": -12.349325180053711, "global_step": 459333, "epoch": 2734} {"train_loss": -11.523590087890625, "global_step": 459334, "epoch": 2734} {"train_loss": -11.353126525878906, "global_step": 459335, "epoch": 2734} {"train_loss": -11.945062637329102, "global_step": 459336, "epoch": 2734} {"train_loss": -12.565390586853027, "global_step": 459337, "epoch": 2734} {"train_loss": -11.948139190673828, "global_step": 459338, "epoch": 2734} {"train_loss": -12.112306594848633, "global_step": 459339, "epoch": 2734} {"train_loss": -11.680622100830078, "global_step": 459340, "epoch": 2734} {"train_loss": -12.06413745880127, "global_step": 459341, "epoch": 2734} {"train_loss": -12.314563751220703, "global_step": 459342, "epoch": 2734} {"train_loss": -11.764693260192871, "global_step": 459343, "epoch": 2734} {"train_loss": -12.345897674560547, "global_step": 459344, "epoch": 2734} {"train_loss": -11.995256423950195, "global_step": 459345, "epoch": 2734} {"train_loss": -11.630277633666992, "global_step": 459346, "epoch": 2734} {"train_loss": -12.278884887695312, "global_step": 459347, "epoch": 2734} {"train_loss": -12.035276412963867, "global_step": 459348, "epoch": 2734} {"train_loss": -12.43096923828125, "global_step": 459349, "epoch": 2734} {"train_loss": -12.111236572265625, "global_step": 459350, "epoch": 2734} {"train_loss": -12.352123260498047, "global_step": 459351, "epoch": 2734} {"train_loss": -12.291158676147461, "global_step": 459352, "epoch": 2734} {"train_loss": -11.488372802734375, "global_step": 459353, "epoch": 2734} {"train_loss": -12.427956581115723, "global_step": 459354, "epoch": 2734} {"train_loss": -11.427803993225098, "global_step": 459355, "epoch": 2734} {"train_loss": -12.523853302001953, "global_step": 459356, "epoch": 2734} {"train_loss": -11.963536262512207, "global_step": 459357, "epoch": 2734} {"train_loss": -12.160867691040039, "global_step": 459358, "epoch": 2734} {"train_loss": -11.910747528076172, "global_step": 459359, "epoch": 2734} {"train_loss": -12.047530174255371, "global_step": 459360, "epoch": 2734} {"train_loss": -11.73854923248291, "global_step": 459361, "epoch": 2734} {"train_loss": -12.093400955200195, "global_step": 459362, "epoch": 2734} {"train_loss": -11.754894256591797, "global_step": 459363, "epoch": 2734} {"train_loss": -11.42212963104248, "global_step": 459364, "epoch": 2734} {"train_loss": -12.298243522644043, "global_step": 459365, "epoch": 2734} {"train_loss": -10.979402542114258, "global_step": 459366, "epoch": 2734} {"train_loss": -12.472528457641602, "global_step": 459367, "epoch": 2734} {"train_loss": -11.25521469116211, "global_step": 459368, "epoch": 2734} {"train_loss": -12.026055335998535, "global_step": 459369, "epoch": 2734} {"train_loss": -12.203539848327637, "global_step": 459370, "epoch": 2734} {"train_loss": -11.194360733032227, "global_step": 459371, "epoch": 2734} {"train_loss": -12.441689491271973, "global_step": 459372, "epoch": 2734} {"train_loss": -11.531637191772461, "global_step": 459373, "epoch": 2734} {"train_loss": -12.035212516784668, "global_step": 459374, "epoch": 2734} {"train_loss": -11.096464157104492, "global_step": 459375, "epoch": 2734} {"train_loss": -11.937458038330078, "global_step": 459376, "epoch": 2734} {"train_loss": -11.760503768920898, "global_step": 459377, "epoch": 2734} {"train_loss": -12.098833084106445, "global_step": 459378, "epoch": 2734} {"train_loss": -11.811295509338379, "global_step": 459379, "epoch": 2734} {"train_loss": -11.48031997680664, "global_step": 459380, "epoch": 2734} {"train_loss": -12.597421646118164, "global_step": 459381, "epoch": 2734} {"train_loss": -11.167370796203613, "global_step": 459382, "epoch": 2734} {"train_loss": -11.850812911987305, "global_step": 459383, "epoch": 2734} {"train_loss": -11.56165599822998, "global_step": 459384, "epoch": 2734} {"train_loss": -11.86514663696289, "global_step": 459385, "epoch": 2734} {"train_loss": -11.384801864624023, "global_step": 459386, "epoch": 2734} {"train_loss": -12.390512466430664, "global_step": 459387, "epoch": 2734} {"train_loss": -11.604941368103027, "global_step": 459388, "epoch": 2734} {"train_loss": -12.209253311157227, "global_step": 459389, "epoch": 2734} {"train_loss": -12.173675537109375, "global_step": 459390, "epoch": 2734} {"train_loss": -11.725841522216797, "global_step": 459391, "epoch": 2734} {"train_loss": -12.299287796020508, "global_step": 459392, "epoch": 2734} {"train_loss": -12.208379745483398, "global_step": 459393, "epoch": 2734} {"train_loss": -12.083784103393555, "global_step": 459394, "epoch": 2734} {"train_loss": -12.174661636352539, "global_step": 459395, "epoch": 2734} {"train_loss": -12.225711822509766, "global_step": 459396, "epoch": 2734} {"train_loss": -11.486316680908203, "global_step": 459397, "epoch": 2734} {"train_loss": -12.272697448730469, "global_step": 459398, "epoch": 2734} {"train_loss": -11.771204948425293, "global_step": 459399, "epoch": 2734} {"train_loss": -12.541328430175781, "global_step": 459400, "epoch": 2734} {"train_loss": -12.084508895874023, "global_step": 459401, "epoch": 2734} {"train_loss": -11.983808517456055, "global_step": 459402, "epoch": 2734} {"train_loss": -12.432624816894531, "global_step": 459403, "epoch": 2734} {"train_loss": -12.370073318481445, "global_step": 459404, "epoch": 2734} {"train_loss": -12.565505981445312, "global_step": 459405, "epoch": 2734} {"train_loss": -12.612594604492188, "global_step": 459406, "epoch": 2734} {"train_loss": -12.218290328979492, "global_step": 459407, "epoch": 2734} {"train_loss": -12.338152885437012, "global_step": 459408, "epoch": 2734} {"train_loss": -12.238313674926758, "global_step": 459409, "epoch": 2734} {"train_loss": -12.602033615112305, "global_step": 459410, "epoch": 2734} {"train_loss": -11.610082626342773, "global_step": 459411, "epoch": 2734} {"train_loss": -12.130987167358398, "global_step": 459412, "epoch": 2734} {"train_loss": -12.148797988891602, "global_step": 459413, "epoch": 2734} {"train_loss": -11.783601760864258, "global_step": 459414, "epoch": 2734} {"train_loss": -12.546125411987305, "global_step": 459415, "epoch": 2734} {"train_loss": -11.596965789794922, "global_step": 459416, "epoch": 2734} {"train_loss": -12.645125389099121, "global_step": 459417, "epoch": 2734} {"train_loss": -12.217198371887207, "global_step": 459418, "epoch": 2734} {"train_loss": -12.489291191101074, "global_step": 459419, "epoch": 2734} {"train_loss": -12.58460807800293, "global_step": 459420, "epoch": 2734} {"train_loss": -12.325723648071289, "global_step": 459421, "epoch": 2734} {"train_loss": -12.112384796142578, "global_step": 459422, "epoch": 2734} {"train_loss": -12.65185832977295, "global_step": 459423, "epoch": 2734} {"train_loss": -12.315262794494629, "global_step": 459424, "epoch": 2734} {"train_loss": -12.229442596435547, "global_step": 459425, "epoch": 2734} {"train_loss": -12.560564041137695, "global_step": 459426, "epoch": 2734} {"train_loss": -12.25219440460205, "global_step": 459427, "epoch": 2734} {"train_loss": -12.224088668823242, "global_step": 459428, "epoch": 2734} {"train_loss": -12.425542831420898, "global_step": 459429, "epoch": 2734} {"train_loss": -11.839895248413086, "global_step": 459430, "epoch": 2734} {"train_loss": -12.189353942871094, "global_step": 459431, "epoch": 2734} {"train_loss": -12.328508377075195, "global_step": 459432, "epoch": 2734} {"train_loss": -11.882762908935547, "global_step": 459433, "epoch": 2734} {"train_loss": -12.859969139099121, "global_step": 459434, "epoch": 2734} {"train_loss": -12.044273376464844, "global_step": 459435, "epoch": 2734} {"train_loss": -12.470916748046875, "global_step": 459436, "epoch": 2734} {"train_loss": -12.026586532592773, "global_step": 459437, "epoch": 2734} {"train_loss": -12.60285758972168, "global_step": 459438, "epoch": 2734} {"train_loss": -12.304848670959473, "global_step": 459439, "epoch": 2734} {"train_loss": -12.509105682373047, "global_step": 459440, "epoch": 2734} {"train_loss": -12.059350967407227, "global_step": 459441, "epoch": 2734} {"train_loss": -12.637585639953613, "global_step": 459442, "epoch": 2734} {"train_loss": -11.707316398620605, "global_step": 459443, "epoch": 2734} {"train_loss": -11.958332061767578, "global_step": 459444, "epoch": 2734} {"train_loss": -12.60708236694336, "global_step": 459445, "epoch": 2734} {"train_loss": -12.054672241210938, "global_step": 459446, "epoch": 2734} {"train_loss": -12.519744873046875, "global_step": 459447, "epoch": 2734} {"train_loss": -12.723309516906738, "global_step": 459448, "epoch": 2734} {"train_loss": -12.078117370605469, "global_step": 459449, "epoch": 2734} {"train_loss": -12.032873153686523, "global_step": 459450, "epoch": 2734} {"train_loss": -12.817081451416016, "global_step": 459451, "epoch": 2734} {"train_loss": -11.998773574829102, "global_step": 459452, "epoch": 2734} {"train_loss": -12.494430541992188, "global_step": 459453, "epoch": 2734} {"train_loss": -12.607328414916992, "global_step": 459454, "epoch": 2734} {"train_loss": -12.578590393066406, "global_step": 459455, "epoch": 2734} {"train_loss": -12.727876663208008, "global_step": 459456, "epoch": 2734} {"train_loss": -12.588302612304688, "global_step": 459457, "epoch": 2734} {"train_loss": -12.71027946472168, "global_step": 459458, "epoch": 2734} {"train_loss": -12.683748245239258, "global_step": 459459, "epoch": 2734} {"train_loss": -12.795232772827148, "global_step": 459460, "epoch": 2734} {"train_loss": -12.736907958984375, "global_step": 459461, "epoch": 2734} {"train_loss": -12.896303176879883, "global_step": 459462, "epoch": 2734} {"train_loss": -12.589821815490723, "global_step": 459463, "epoch": 2734} {"train_loss": -12.847663879394531, "global_step": 459464, "epoch": 2734} {"train_loss": -12.88015365600586, "global_step": 459465, "epoch": 2734} {"train_loss": -12.691784858703613, "global_step": 459466, "epoch": 2734} {"train_loss": -12.741568565368652, "global_step": 459467, "epoch": 2734} {"train_loss": -12.795520782470703, "global_step": 459468, "epoch": 2734} {"train_loss": -12.891386032104492, "global_step": 459469, "epoch": 2734} {"train_loss": -12.728782653808594, "global_step": 459470, "epoch": 2734} {"train_loss": -12.747652053833008, "global_step": 459471, "epoch": 2734} {"train_loss": -12.819157600402832, "global_step": 459472, "epoch": 2734} {"train_loss": -12.820793151855469, "global_step": 459473, "epoch": 2734} {"train_loss": -13.014161109924316, "global_step": 459474, "epoch": 2734} {"train_loss": -12.887725830078125, "global_step": 459475, "epoch": 2734} {"train_loss": -12.81461238861084, "global_step": 459476, "epoch": 2734} {"train_loss": -12.912864685058594, "global_step": 459477, "epoch": 2734} {"train_loss": -12.887042045593262, "global_step": 459478, "epoch": 2734} {"train_loss": -12.206841048740205, "global_step": 459479, "epoch": 2734, "val_loss": 315618.34375} {"train_loss": -13.000530242919922, "global_step": 459480, "epoch": 2735} {"train_loss": -13.02017593383789, "global_step": 459481, "epoch": 2735} {"train_loss": -12.931976318359375, "global_step": 459482, "epoch": 2735} {"train_loss": -12.732685089111328, "global_step": 459483, "epoch": 2735} {"train_loss": -12.7720947265625, "global_step": 459484, "epoch": 2735} {"train_loss": -13.074345588684082, "global_step": 459485, "epoch": 2735} {"train_loss": -12.838171005249023, "global_step": 459486, "epoch": 2735} {"train_loss": -12.84232234954834, "global_step": 459487, "epoch": 2735} {"train_loss": -12.842599868774414, "global_step": 459488, "epoch": 2735} {"train_loss": -12.678451538085938, "global_step": 459489, "epoch": 2735} {"train_loss": -12.256538391113281, "global_step": 459490, "epoch": 2735} {"train_loss": -12.646138191223145, "global_step": 459491, "epoch": 2735} {"train_loss": -12.969701766967773, "global_step": 459492, "epoch": 2735} {"train_loss": -12.321210861206055, "global_step": 459493, "epoch": 2735} {"train_loss": -12.340686798095703, "global_step": 459494, "epoch": 2735} {"train_loss": -12.73475456237793, "global_step": 459495, "epoch": 2735} {"train_loss": -12.529718399047852, "global_step": 459496, "epoch": 2735} {"train_loss": -12.45972728729248, "global_step": 459497, "epoch": 2735} {"train_loss": -12.679740905761719, "global_step": 459498, "epoch": 2735} {"train_loss": -12.693387985229492, "global_step": 459499, "epoch": 2735} {"train_loss": -12.465426445007324, "global_step": 459500, "epoch": 2735} {"train_loss": -12.371526718139648, "global_step": 459501, "epoch": 2735} {"train_loss": -11.632564544677734, "global_step": 459502, "epoch": 2735} {"train_loss": -11.930179595947266, "global_step": 459503, "epoch": 2735} {"train_loss": -12.294483184814453, "global_step": 459504, "epoch": 2735} {"train_loss": -11.54861831665039, "global_step": 459505, "epoch": 2735} {"train_loss": -11.656134605407715, "global_step": 459506, "epoch": 2735} {"train_loss": -12.451754570007324, "global_step": 459507, "epoch": 2735} {"train_loss": -12.436470031738281, "global_step": 459508, "epoch": 2735} {"train_loss": -11.826334953308105, "global_step": 459509, "epoch": 2735} {"train_loss": -12.287896156311035, "global_step": 459510, "epoch": 2735} {"train_loss": -12.20474624633789, "global_step": 459511, "epoch": 2735} {"train_loss": -12.236080169677734, "global_step": 459512, "epoch": 2735} {"train_loss": -11.871011734008789, "global_step": 459513, "epoch": 2735} {"train_loss": -12.551494598388672, "global_step": 459514, "epoch": 2735} {"train_loss": -12.349266052246094, "global_step": 459515, "epoch": 2735} {"train_loss": -12.308446884155273, "global_step": 459516, "epoch": 2735} {"train_loss": -12.353666305541992, "global_step": 459517, "epoch": 2735} {"train_loss": -12.35762882232666, "global_step": 459518, "epoch": 2735} {"train_loss": -11.764444351196289, "global_step": 459519, "epoch": 2735} {"train_loss": -12.094679832458496, "global_step": 459520, "epoch": 2735} {"train_loss": -11.793858528137207, "global_step": 459521, "epoch": 2735} {"train_loss": -11.845390319824219, "global_step": 459522, "epoch": 2735} {"train_loss": -12.431966781616211, "global_step": 459523, "epoch": 2735} {"train_loss": -11.594367980957031, "global_step": 459524, "epoch": 2735} {"train_loss": -12.520101547241211, "global_step": 459525, "epoch": 2735} {"train_loss": -11.903806686401367, "global_step": 459526, "epoch": 2735} {"train_loss": -12.865945816040039, "global_step": 459527, "epoch": 2735} {"train_loss": -12.186355590820312, "global_step": 459528, "epoch": 2735} {"train_loss": -12.38300895690918, "global_step": 459529, "epoch": 2735} {"train_loss": -12.048954010009766, "global_step": 459530, "epoch": 2735} {"train_loss": -12.265254974365234, "global_step": 459531, "epoch": 2735} {"train_loss": -12.149985313415527, "global_step": 459532, "epoch": 2735} {"train_loss": -11.188029289245605, "global_step": 459533, "epoch": 2735} {"train_loss": -10.027063369750977, "global_step": 459534, "epoch": 2735} {"train_loss": -12.297637939453125, "global_step": 459535, "epoch": 2735} {"train_loss": -8.893001556396484, "global_step": 459536, "epoch": 2735} {"train_loss": -8.908241271972656, "global_step": 459537, "epoch": 2735} {"train_loss": -10.553018569946289, "global_step": 459538, "epoch": 2735} {"train_loss": -11.532252311706543, "global_step": 459539, "epoch": 2735} {"train_loss": -10.765253067016602, "global_step": 459540, "epoch": 2735} {"train_loss": -10.335060119628906, "global_step": 459541, "epoch": 2735} {"train_loss": -12.057815551757812, "global_step": 459542, "epoch": 2735} {"train_loss": -10.007813453674316, "global_step": 459543, "epoch": 2735} {"train_loss": -11.197610855102539, "global_step": 459544, "epoch": 2735} {"train_loss": -11.762186050415039, "global_step": 459545, "epoch": 2735} {"train_loss": -10.494586944580078, "global_step": 459546, "epoch": 2735} {"train_loss": -12.094354629516602, "global_step": 459547, "epoch": 2735} {"train_loss": -11.82522964477539, "global_step": 459548, "epoch": 2735} {"train_loss": -11.305940628051758, "global_step": 459549, "epoch": 2735} {"train_loss": -11.646564483642578, "global_step": 459550, "epoch": 2735} {"train_loss": -11.82712459564209, "global_step": 459551, "epoch": 2735} {"train_loss": -11.68077278137207, "global_step": 459552, "epoch": 2735} {"train_loss": -12.265670776367188, "global_step": 459553, "epoch": 2735} {"train_loss": -11.739150047302246, "global_step": 459554, "epoch": 2735} {"train_loss": -12.057332992553711, "global_step": 459555, "epoch": 2735} {"train_loss": -12.463733673095703, "global_step": 459556, "epoch": 2735} {"train_loss": -12.13547420501709, "global_step": 459557, "epoch": 2735} {"train_loss": -11.975486755371094, "global_step": 459558, "epoch": 2735} {"train_loss": -11.948308944702148, "global_step": 459559, "epoch": 2735} {"train_loss": -12.161818504333496, "global_step": 459560, "epoch": 2735} {"train_loss": -12.024611473083496, "global_step": 459561, "epoch": 2735} {"train_loss": -10.774478912353516, "global_step": 459562, "epoch": 2735} {"train_loss": -11.644344329833984, "global_step": 459563, "epoch": 2735} {"train_loss": -11.072112083435059, "global_step": 459564, "epoch": 2735} {"train_loss": -11.33481216430664, "global_step": 459565, "epoch": 2735} {"train_loss": -11.444931030273438, "global_step": 459566, "epoch": 2735} {"train_loss": -11.233448028564453, "global_step": 459567, "epoch": 2735} {"train_loss": -11.604022979736328, "global_step": 459568, "epoch": 2735} {"train_loss": -11.711648941040039, "global_step": 459569, "epoch": 2735} {"train_loss": -11.628959655761719, "global_step": 459570, "epoch": 2735} {"train_loss": -12.040281295776367, "global_step": 459571, "epoch": 2735} {"train_loss": -11.494646072387695, "global_step": 459572, "epoch": 2735} {"train_loss": -12.195707321166992, "global_step": 459573, "epoch": 2735} {"train_loss": -12.3419771194458, "global_step": 459574, "epoch": 2735} {"train_loss": -12.19471549987793, "global_step": 459575, "epoch": 2735} {"train_loss": -12.066984176635742, "global_step": 459576, "epoch": 2735} {"train_loss": -11.901121139526367, "global_step": 459577, "epoch": 2735} {"train_loss": -12.73514461517334, "global_step": 459578, "epoch": 2735} {"train_loss": -11.842913627624512, "global_step": 459579, "epoch": 2735} {"train_loss": -12.257929801940918, "global_step": 459580, "epoch": 2735} {"train_loss": -12.057210922241211, "global_step": 459581, "epoch": 2735} {"train_loss": -11.946596145629883, "global_step": 459582, "epoch": 2735} {"train_loss": -11.89765739440918, "global_step": 459583, "epoch": 2735} {"train_loss": -12.00947380065918, "global_step": 459584, "epoch": 2735} {"train_loss": -12.457886695861816, "global_step": 459585, "epoch": 2735} {"train_loss": -11.98398208618164, "global_step": 459586, "epoch": 2735} {"train_loss": -11.99579906463623, "global_step": 459587, "epoch": 2735} {"train_loss": -11.042107582092285, "global_step": 459588, "epoch": 2735} {"train_loss": -12.459534645080566, "global_step": 459589, "epoch": 2735} {"train_loss": -11.606231689453125, "global_step": 459590, "epoch": 2735} {"train_loss": -12.466073989868164, "global_step": 459591, "epoch": 2735} {"train_loss": -11.881742477416992, "global_step": 459592, "epoch": 2735} {"train_loss": -12.130743026733398, "global_step": 459593, "epoch": 2735} {"train_loss": -12.296453475952148, "global_step": 459594, "epoch": 2735} {"train_loss": -11.733707427978516, "global_step": 459595, "epoch": 2735} {"train_loss": -12.706252098083496, "global_step": 459596, "epoch": 2735} {"train_loss": -12.115768432617188, "global_step": 459597, "epoch": 2735} {"train_loss": -12.51396369934082, "global_step": 459598, "epoch": 2735} {"train_loss": -12.484922409057617, "global_step": 459599, "epoch": 2735} {"train_loss": -12.21676254272461, "global_step": 459600, "epoch": 2735} {"train_loss": -12.582566261291504, "global_step": 459601, "epoch": 2735} {"train_loss": -12.294076919555664, "global_step": 459602, "epoch": 2735} {"train_loss": -12.672358512878418, "global_step": 459603, "epoch": 2735} {"train_loss": -12.45970630645752, "global_step": 459604, "epoch": 2735} {"train_loss": -12.502525329589844, "global_step": 459605, "epoch": 2735} {"train_loss": -12.519031524658203, "global_step": 459606, "epoch": 2735} {"train_loss": -12.717353820800781, "global_step": 459607, "epoch": 2735} {"train_loss": -12.499776840209961, "global_step": 459608, "epoch": 2735} {"train_loss": -12.402947425842285, "global_step": 459609, "epoch": 2735} {"train_loss": -12.757392883300781, "global_step": 459610, "epoch": 2735} {"train_loss": -12.441886901855469, "global_step": 459611, "epoch": 2735} {"train_loss": -12.579874038696289, "global_step": 459612, "epoch": 2735} {"train_loss": -12.273090362548828, "global_step": 459613, "epoch": 2735} {"train_loss": -12.5447998046875, "global_step": 459614, "epoch": 2735} {"train_loss": -12.666872024536133, "global_step": 459615, "epoch": 2735} {"train_loss": -12.50483512878418, "global_step": 459616, "epoch": 2735} {"train_loss": -12.659872055053711, "global_step": 459617, "epoch": 2735} {"train_loss": -12.427679061889648, "global_step": 459618, "epoch": 2735} {"train_loss": -12.737789154052734, "global_step": 459619, "epoch": 2735} {"train_loss": -12.575661659240723, "global_step": 459620, "epoch": 2735} {"train_loss": -12.710471153259277, "global_step": 459621, "epoch": 2735} {"train_loss": -12.707357406616211, "global_step": 459622, "epoch": 2735} {"train_loss": -12.9532470703125, "global_step": 459623, "epoch": 2735} {"train_loss": -12.68526840209961, "global_step": 459624, "epoch": 2735} {"train_loss": -12.90416145324707, "global_step": 459625, "epoch": 2735} {"train_loss": -12.753908157348633, "global_step": 459626, "epoch": 2735} {"train_loss": -12.862080574035645, "global_step": 459627, "epoch": 2735} {"train_loss": -12.714717864990234, "global_step": 459628, "epoch": 2735} {"train_loss": -12.867891311645508, "global_step": 459629, "epoch": 2735} {"train_loss": -12.985156059265137, "global_step": 459630, "epoch": 2735} {"train_loss": -12.795774459838867, "global_step": 459631, "epoch": 2735} {"train_loss": -12.77690601348877, "global_step": 459632, "epoch": 2735} {"train_loss": -12.696020126342773, "global_step": 459633, "epoch": 2735} {"train_loss": -12.753012657165527, "global_step": 459634, "epoch": 2735} {"train_loss": -12.419002532958984, "global_step": 459635, "epoch": 2735} {"train_loss": -12.760842323303223, "global_step": 459636, "epoch": 2735} {"train_loss": -12.353155136108398, "global_step": 459637, "epoch": 2735} {"train_loss": -12.542867660522461, "global_step": 459638, "epoch": 2735} {"train_loss": -12.764474868774414, "global_step": 459639, "epoch": 2735} {"train_loss": -12.555205345153809, "global_step": 459640, "epoch": 2735} {"train_loss": -12.692183494567871, "global_step": 459641, "epoch": 2735} {"train_loss": -12.566644668579102, "global_step": 459642, "epoch": 2735} {"train_loss": -12.496360778808594, "global_step": 459643, "epoch": 2735} {"train_loss": -12.840299606323242, "global_step": 459644, "epoch": 2735} {"train_loss": -12.643909454345703, "global_step": 459645, "epoch": 2735} {"train_loss": -12.036218643188477, "global_step": 459646, "epoch": 2735} {"train_loss": -12.164862797373818, "global_step": 459647, "epoch": 2735, "val_loss": 312363.96875, "train_action_mse_error": 1.1888608932495117} {"train_loss": -11.940616607666016, "global_step": 459648, "epoch": 2736} {"train_loss": -12.58322525024414, "global_step": 459649, "epoch": 2736} {"train_loss": -12.132356643676758, "global_step": 459650, "epoch": 2736} {"train_loss": -12.210742950439453, "global_step": 459651, "epoch": 2736} {"train_loss": -11.893838882446289, "global_step": 459652, "epoch": 2736} {"train_loss": -12.35261344909668, "global_step": 459653, "epoch": 2736} {"train_loss": -12.412649154663086, "global_step": 459654, "epoch": 2736} {"train_loss": -12.207473754882812, "global_step": 459655, "epoch": 2736} {"train_loss": -12.63330078125, "global_step": 459656, "epoch": 2736} {"train_loss": -12.414546012878418, "global_step": 459657, "epoch": 2736} {"train_loss": -12.50149154663086, "global_step": 459658, "epoch": 2736} {"train_loss": -12.467752456665039, "global_step": 459659, "epoch": 2736} {"train_loss": -12.506224632263184, "global_step": 459660, "epoch": 2736} {"train_loss": -12.20740795135498, "global_step": 459661, "epoch": 2736} {"train_loss": -12.542882919311523, "global_step": 459662, "epoch": 2736} {"train_loss": -12.591729164123535, "global_step": 459663, "epoch": 2736} {"train_loss": -12.641447067260742, "global_step": 459664, "epoch": 2736} {"train_loss": -12.677217483520508, "global_step": 459665, "epoch": 2736} {"train_loss": -12.75429630279541, "global_step": 459666, "epoch": 2736} {"train_loss": -12.393757820129395, "global_step": 459667, "epoch": 2736} {"train_loss": -12.472705841064453, "global_step": 459668, "epoch": 2736} {"train_loss": -12.51126480102539, "global_step": 459669, "epoch": 2736} {"train_loss": -12.133386611938477, "global_step": 459670, "epoch": 2736} {"train_loss": -12.464765548706055, "global_step": 459671, "epoch": 2736} {"train_loss": -12.053646087646484, "global_step": 459672, "epoch": 2736} {"train_loss": -11.964729309082031, "global_step": 459673, "epoch": 2736} {"train_loss": -12.331096649169922, "global_step": 459674, "epoch": 2736} {"train_loss": -11.412399291992188, "global_step": 459675, "epoch": 2736} {"train_loss": -12.10273265838623, "global_step": 459676, "epoch": 2736} {"train_loss": -12.182199478149414, "global_step": 459677, "epoch": 2736} {"train_loss": -10.40582275390625, "global_step": 459678, "epoch": 2736} {"train_loss": -11.71040153503418, "global_step": 459679, "epoch": 2736} {"train_loss": -11.784603118896484, "global_step": 459680, "epoch": 2736} {"train_loss": -11.098834991455078, "global_step": 459681, "epoch": 2736} {"train_loss": -11.931755065917969, "global_step": 459682, "epoch": 2736} {"train_loss": -11.687997817993164, "global_step": 459683, "epoch": 2736} {"train_loss": -10.173151016235352, "global_step": 459684, "epoch": 2736} {"train_loss": -11.85224437713623, "global_step": 459685, "epoch": 2736} {"train_loss": -8.92399787902832, "global_step": 459686, "epoch": 2736} {"train_loss": -11.127927780151367, "global_step": 459687, "epoch": 2736} {"train_loss": -10.224750518798828, "global_step": 459688, "epoch": 2736} {"train_loss": -9.171255111694336, "global_step": 459689, "epoch": 2736} {"train_loss": -9.38640022277832, "global_step": 459690, "epoch": 2736} {"train_loss": -10.555865287780762, "global_step": 459691, "epoch": 2736} {"train_loss": -11.411529541015625, "global_step": 459692, "epoch": 2736} {"train_loss": -10.446155548095703, "global_step": 459693, "epoch": 2736} {"train_loss": -9.124794006347656, "global_step": 459694, "epoch": 2736} {"train_loss": -9.445318222045898, "global_step": 459695, "epoch": 2736} {"train_loss": -10.573602676391602, "global_step": 459696, "epoch": 2736} {"train_loss": -10.776755332946777, "global_step": 459697, "epoch": 2736} {"train_loss": -10.233781814575195, "global_step": 459698, "epoch": 2736} {"train_loss": -11.368741989135742, "global_step": 459699, "epoch": 2736} {"train_loss": -11.804996490478516, "global_step": 459700, "epoch": 2736} {"train_loss": -11.194818496704102, "global_step": 459701, "epoch": 2736} {"train_loss": -11.569620132446289, "global_step": 459702, "epoch": 2736} {"train_loss": -11.12334156036377, "global_step": 459703, "epoch": 2736} {"train_loss": -11.719497680664062, "global_step": 459704, "epoch": 2736} {"train_loss": -11.209717750549316, "global_step": 459705, "epoch": 2736} {"train_loss": -11.086748123168945, "global_step": 459706, "epoch": 2736} {"train_loss": -11.653726577758789, "global_step": 459707, "epoch": 2736} {"train_loss": -11.362966537475586, "global_step": 459708, "epoch": 2736} {"train_loss": -11.233932495117188, "global_step": 459709, "epoch": 2736} {"train_loss": -10.580808639526367, "global_step": 459710, "epoch": 2736} {"train_loss": -11.78473949432373, "global_step": 459711, "epoch": 2736} {"train_loss": -10.378216743469238, "global_step": 459712, "epoch": 2736} {"train_loss": -10.153955459594727, "global_step": 459713, "epoch": 2736} {"train_loss": -11.380123138427734, "global_step": 459714, "epoch": 2736} {"train_loss": -10.77802848815918, "global_step": 459715, "epoch": 2736} {"train_loss": -11.208938598632812, "global_step": 459716, "epoch": 2736} {"train_loss": -11.301051139831543, "global_step": 459717, "epoch": 2736} {"train_loss": -10.748204231262207, "global_step": 459718, "epoch": 2736} {"train_loss": -11.58758544921875, "global_step": 459719, "epoch": 2736} {"train_loss": -10.547627449035645, "global_step": 459720, "epoch": 2736} {"train_loss": -11.239336013793945, "global_step": 459721, "epoch": 2736} {"train_loss": -11.291027069091797, "global_step": 459722, "epoch": 2736} {"train_loss": -11.113509178161621, "global_step": 459723, "epoch": 2736} {"train_loss": -11.0624418258667, "global_step": 459724, "epoch": 2736} {"train_loss": -11.867754936218262, "global_step": 459725, "epoch": 2736} {"train_loss": -11.505805969238281, "global_step": 459726, "epoch": 2736} {"train_loss": -11.687670707702637, "global_step": 459727, "epoch": 2736} {"train_loss": -11.677234649658203, "global_step": 459728, "epoch": 2736} {"train_loss": -10.950313568115234, "global_step": 459729, "epoch": 2736} {"train_loss": -11.697881698608398, "global_step": 459730, "epoch": 2736} {"train_loss": -11.71261978149414, "global_step": 459731, "epoch": 2736} {"train_loss": -11.187129974365234, "global_step": 459732, "epoch": 2736} {"train_loss": -12.278788566589355, "global_step": 459733, "epoch": 2736} {"train_loss": -11.591007232666016, "global_step": 459734, "epoch": 2736} {"train_loss": -11.843660354614258, "global_step": 459735, "epoch": 2736} {"train_loss": -12.282472610473633, "global_step": 459736, "epoch": 2736} {"train_loss": -11.471870422363281, "global_step": 459737, "epoch": 2736} {"train_loss": -11.474860191345215, "global_step": 459738, "epoch": 2736} {"train_loss": -12.15365219116211, "global_step": 459739, "epoch": 2736} {"train_loss": -11.409538269042969, "global_step": 459740, "epoch": 2736} {"train_loss": -11.936189651489258, "global_step": 459741, "epoch": 2736} {"train_loss": -12.270915985107422, "global_step": 459742, "epoch": 2736} {"train_loss": -11.638919830322266, "global_step": 459743, "epoch": 2736} {"train_loss": -11.924071311950684, "global_step": 459744, "epoch": 2736} {"train_loss": -11.917304992675781, "global_step": 459745, "epoch": 2736} {"train_loss": -11.807543754577637, "global_step": 459746, "epoch": 2736} {"train_loss": -12.312294006347656, "global_step": 459747, "epoch": 2736} {"train_loss": -12.231738090515137, "global_step": 459748, "epoch": 2736} {"train_loss": -12.097823143005371, "global_step": 459749, "epoch": 2736} {"train_loss": -12.19331169128418, "global_step": 459750, "epoch": 2736} {"train_loss": -12.267017364501953, "global_step": 459751, "epoch": 2736} {"train_loss": -12.266115188598633, "global_step": 459752, "epoch": 2736} {"train_loss": -12.36368179321289, "global_step": 459753, "epoch": 2736} {"train_loss": -12.109874725341797, "global_step": 459754, "epoch": 2736} {"train_loss": -12.246277809143066, "global_step": 459755, "epoch": 2736} {"train_loss": -12.470174789428711, "global_step": 459756, "epoch": 2736} {"train_loss": -12.191137313842773, "global_step": 459757, "epoch": 2736} {"train_loss": -12.320587158203125, "global_step": 459758, "epoch": 2736} {"train_loss": -12.377628326416016, "global_step": 459759, "epoch": 2736} {"train_loss": -12.427117347717285, "global_step": 459760, "epoch": 2736} {"train_loss": -12.418745040893555, "global_step": 459761, "epoch": 2736} {"train_loss": -12.420201301574707, "global_step": 459762, "epoch": 2736} {"train_loss": -12.394673347473145, "global_step": 459763, "epoch": 2736} {"train_loss": -12.589585304260254, "global_step": 459764, "epoch": 2736} {"train_loss": -12.440021514892578, "global_step": 459765, "epoch": 2736} {"train_loss": -12.683391571044922, "global_step": 459766, "epoch": 2736} {"train_loss": -12.550169944763184, "global_step": 459767, "epoch": 2736} {"train_loss": -12.758136749267578, "global_step": 459768, "epoch": 2736} {"train_loss": -12.765028953552246, "global_step": 459769, "epoch": 2736} {"train_loss": -12.791308403015137, "global_step": 459770, "epoch": 2736} {"train_loss": -12.392890930175781, "global_step": 459771, "epoch": 2736} {"train_loss": -12.298894882202148, "global_step": 459772, "epoch": 2736} {"train_loss": -12.583984375, "global_step": 459773, "epoch": 2736} {"train_loss": -12.459762573242188, "global_step": 459774, "epoch": 2736} {"train_loss": -12.590940475463867, "global_step": 459775, "epoch": 2736} {"train_loss": -12.594061851501465, "global_step": 459776, "epoch": 2736} {"train_loss": -12.330392837524414, "global_step": 459777, "epoch": 2736} {"train_loss": -12.763959884643555, "global_step": 459778, "epoch": 2736} {"train_loss": -12.58302116394043, "global_step": 459779, "epoch": 2736} {"train_loss": -12.699132919311523, "global_step": 459780, "epoch": 2736} {"train_loss": -12.642311096191406, "global_step": 459781, "epoch": 2736} {"train_loss": -12.50821304321289, "global_step": 459782, "epoch": 2736} {"train_loss": -12.510144233703613, "global_step": 459783, "epoch": 2736} {"train_loss": -12.342994689941406, "global_step": 459784, "epoch": 2736} {"train_loss": -12.62165355682373, "global_step": 459785, "epoch": 2736} {"train_loss": -12.540035247802734, "global_step": 459786, "epoch": 2736} {"train_loss": -12.76848030090332, "global_step": 459787, "epoch": 2736} {"train_loss": -12.429697036743164, "global_step": 459788, "epoch": 2736} {"train_loss": -12.837363243103027, "global_step": 459789, "epoch": 2736} {"train_loss": -12.738701820373535, "global_step": 459790, "epoch": 2736} {"train_loss": -12.64440631866455, "global_step": 459791, "epoch": 2736} {"train_loss": -12.703554153442383, "global_step": 459792, "epoch": 2736} {"train_loss": -12.681671142578125, "global_step": 459793, "epoch": 2736} {"train_loss": -12.757537841796875, "global_step": 459794, "epoch": 2736} {"train_loss": -12.715339660644531, "global_step": 459795, "epoch": 2736} {"train_loss": -12.758548736572266, "global_step": 459796, "epoch": 2736} {"train_loss": -12.816787719726562, "global_step": 459797, "epoch": 2736} {"train_loss": -12.880144119262695, "global_step": 459798, "epoch": 2736} {"train_loss": -12.803277969360352, "global_step": 459799, "epoch": 2736} {"train_loss": -12.695615768432617, "global_step": 459800, "epoch": 2736} {"train_loss": -12.835762023925781, "global_step": 459801, "epoch": 2736} {"train_loss": -12.792672157287598, "global_step": 459802, "epoch": 2736} {"train_loss": -12.738242149353027, "global_step": 459803, "epoch": 2736} {"train_loss": -12.629834175109863, "global_step": 459804, "epoch": 2736} {"train_loss": -12.614978790283203, "global_step": 459805, "epoch": 2736} {"train_loss": -12.066221237182617, "global_step": 459806, "epoch": 2736} {"train_loss": -12.86007308959961, "global_step": 459807, "epoch": 2736} {"train_loss": -12.242472648620605, "global_step": 459808, "epoch": 2736} {"train_loss": -12.259017944335938, "global_step": 459809, "epoch": 2736} {"train_loss": -12.804788589477539, "global_step": 459810, "epoch": 2736} {"train_loss": -12.64603328704834, "global_step": 459811, "epoch": 2736} {"train_loss": -12.694833755493164, "global_step": 459812, "epoch": 2736} {"train_loss": -12.782464981079102, "global_step": 459813, "epoch": 2736} {"train_loss": -12.810744285583496, "global_step": 459814, "epoch": 2736} {"train_loss": -11.941141968681698, "global_step": 459815, "epoch": 2736, "val_loss": 312920.875} {"train_loss": -12.454435348510742, "global_step": 459816, "epoch": 2737} {"train_loss": -13.036505699157715, "global_step": 459817, "epoch": 2737} {"train_loss": -12.273239135742188, "global_step": 459818, "epoch": 2737} {"train_loss": -12.565193176269531, "global_step": 459819, "epoch": 2737} {"train_loss": -12.485404968261719, "global_step": 459820, "epoch": 2737} {"train_loss": -11.60856819152832, "global_step": 459821, "epoch": 2737} {"train_loss": -12.37368106842041, "global_step": 459822, "epoch": 2737} {"train_loss": -10.800004005432129, "global_step": 459823, "epoch": 2737} {"train_loss": -12.097944259643555, "global_step": 459824, "epoch": 2737} {"train_loss": -11.623226165771484, "global_step": 459825, "epoch": 2737} {"train_loss": -9.451600074768066, "global_step": 459826, "epoch": 2737} {"train_loss": -12.298140525817871, "global_step": 459827, "epoch": 2737} {"train_loss": -11.53631591796875, "global_step": 459828, "epoch": 2737} {"train_loss": -11.605509757995605, "global_step": 459829, "epoch": 2737} {"train_loss": -11.85358715057373, "global_step": 459830, "epoch": 2737} {"train_loss": -11.039019584655762, "global_step": 459831, "epoch": 2737} {"train_loss": -11.359739303588867, "global_step": 459832, "epoch": 2737} {"train_loss": -11.059183120727539, "global_step": 459833, "epoch": 2737} {"train_loss": -11.905906677246094, "global_step": 459834, "epoch": 2737} {"train_loss": -10.74917984008789, "global_step": 459835, "epoch": 2737} {"train_loss": -11.831727981567383, "global_step": 459836, "epoch": 2737} {"train_loss": -11.372062683105469, "global_step": 459837, "epoch": 2737} {"train_loss": -11.239039421081543, "global_step": 459838, "epoch": 2737} {"train_loss": -11.884902000427246, "global_step": 459839, "epoch": 2737} {"train_loss": -11.01247787475586, "global_step": 459840, "epoch": 2737} {"train_loss": -11.884077072143555, "global_step": 459841, "epoch": 2737} {"train_loss": -10.589254379272461, "global_step": 459842, "epoch": 2737} {"train_loss": -12.310091018676758, "global_step": 459843, "epoch": 2737} {"train_loss": -10.029842376708984, "global_step": 459844, "epoch": 2737} {"train_loss": -11.867630004882812, "global_step": 459845, "epoch": 2737} {"train_loss": -11.336544036865234, "global_step": 459846, "epoch": 2737} {"train_loss": -11.088233947753906, "global_step": 459847, "epoch": 2737} {"train_loss": -11.641711235046387, "global_step": 459848, "epoch": 2737} {"train_loss": -10.893138885498047, "global_step": 459849, "epoch": 2737} {"train_loss": -11.287307739257812, "global_step": 459850, "epoch": 2737} {"train_loss": -10.830204010009766, "global_step": 459851, "epoch": 2737} {"train_loss": -11.270711898803711, "global_step": 459852, "epoch": 2737} {"train_loss": -11.250249862670898, "global_step": 459853, "epoch": 2737} {"train_loss": -11.633703231811523, "global_step": 459854, "epoch": 2737} {"train_loss": -11.498568534851074, "global_step": 459855, "epoch": 2737} {"train_loss": -12.072439193725586, "global_step": 459856, "epoch": 2737} {"train_loss": -10.999393463134766, "global_step": 459857, "epoch": 2737} {"train_loss": -11.56520938873291, "global_step": 459858, "epoch": 2737} {"train_loss": -10.94632339477539, "global_step": 459859, "epoch": 2737} {"train_loss": -11.042747497558594, "global_step": 459860, "epoch": 2737} {"train_loss": -11.80589485168457, "global_step": 459861, "epoch": 2737} {"train_loss": -10.979730606079102, "global_step": 459862, "epoch": 2737} {"train_loss": -10.951415061950684, "global_step": 459863, "epoch": 2737} {"train_loss": -10.790250778198242, "global_step": 459864, "epoch": 2737} {"train_loss": -11.374101638793945, "global_step": 459865, "epoch": 2737} {"train_loss": -11.427857398986816, "global_step": 459866, "epoch": 2737} {"train_loss": -11.838312149047852, "global_step": 459867, "epoch": 2737} {"train_loss": -11.179557800292969, "global_step": 459868, "epoch": 2737} {"train_loss": -12.086618423461914, "global_step": 459869, "epoch": 2737} {"train_loss": -11.588948249816895, "global_step": 459870, "epoch": 2737} {"train_loss": -11.853507995605469, "global_step": 459871, "epoch": 2737} {"train_loss": -11.874002456665039, "global_step": 459872, "epoch": 2737} {"train_loss": -12.175576210021973, "global_step": 459873, "epoch": 2737} {"train_loss": -12.085647583007812, "global_step": 459874, "epoch": 2737} {"train_loss": -12.261091232299805, "global_step": 459875, "epoch": 2737} {"train_loss": -11.891997337341309, "global_step": 459876, "epoch": 2737} {"train_loss": -12.493887901306152, "global_step": 459877, "epoch": 2737} {"train_loss": -12.04806900024414, "global_step": 459878, "epoch": 2737} {"train_loss": -12.181110382080078, "global_step": 459879, "epoch": 2737} {"train_loss": -12.11219310760498, "global_step": 459880, "epoch": 2737} {"train_loss": -12.300468444824219, "global_step": 459881, "epoch": 2737} {"train_loss": -12.324054718017578, "global_step": 459882, "epoch": 2737} {"train_loss": -12.16609001159668, "global_step": 459883, "epoch": 2737} {"train_loss": -12.15902328491211, "global_step": 459884, "epoch": 2737} {"train_loss": -12.561355590820312, "global_step": 459885, "epoch": 2737} {"train_loss": -12.186979293823242, "global_step": 459886, "epoch": 2737} {"train_loss": -12.19908332824707, "global_step": 459887, "epoch": 2737} {"train_loss": -12.124616622924805, "global_step": 459888, "epoch": 2737} {"train_loss": -12.368897438049316, "global_step": 459889, "epoch": 2737} {"train_loss": -12.238158226013184, "global_step": 459890, "epoch": 2737} {"train_loss": -12.478950500488281, "global_step": 459891, "epoch": 2737} {"train_loss": -12.307123184204102, "global_step": 459892, "epoch": 2737} {"train_loss": -12.46656608581543, "global_step": 459893, "epoch": 2737} {"train_loss": -12.505555152893066, "global_step": 459894, "epoch": 2737} {"train_loss": -12.12331771850586, "global_step": 459895, "epoch": 2737} {"train_loss": -12.358473777770996, "global_step": 459896, "epoch": 2737} {"train_loss": -12.437434196472168, "global_step": 459897, "epoch": 2737} {"train_loss": -12.464080810546875, "global_step": 459898, "epoch": 2737} {"train_loss": -12.505860328674316, "global_step": 459899, "epoch": 2737} {"train_loss": -12.337878227233887, "global_step": 459900, "epoch": 2737} {"train_loss": -12.451364517211914, "global_step": 459901, "epoch": 2737} {"train_loss": -12.551528930664062, "global_step": 459902, "epoch": 2737} {"train_loss": -12.587991714477539, "global_step": 459903, "epoch": 2737} {"train_loss": -12.531913757324219, "global_step": 459904, "epoch": 2737} {"train_loss": -12.631967544555664, "global_step": 459905, "epoch": 2737} {"train_loss": -12.76402759552002, "global_step": 459906, "epoch": 2737} {"train_loss": -12.543315887451172, "global_step": 459907, "epoch": 2737} {"train_loss": -12.512852668762207, "global_step": 459908, "epoch": 2737} {"train_loss": -12.41944694519043, "global_step": 459909, "epoch": 2737} {"train_loss": -12.506250381469727, "global_step": 459910, "epoch": 2737} {"train_loss": -12.383780479431152, "global_step": 459911, "epoch": 2737} {"train_loss": -12.672100067138672, "global_step": 459912, "epoch": 2737} {"train_loss": -12.290069580078125, "global_step": 459913, "epoch": 2737} {"train_loss": -12.359746932983398, "global_step": 459914, "epoch": 2737} {"train_loss": -12.49071979522705, "global_step": 459915, "epoch": 2737} {"train_loss": -12.848926544189453, "global_step": 459916, "epoch": 2737} {"train_loss": -12.578184127807617, "global_step": 459917, "epoch": 2737} {"train_loss": -12.411637306213379, "global_step": 459918, "epoch": 2737} {"train_loss": -12.711686134338379, "global_step": 459919, "epoch": 2737} {"train_loss": -12.327489852905273, "global_step": 459920, "epoch": 2737} {"train_loss": -12.481565475463867, "global_step": 459921, "epoch": 2737} {"train_loss": -12.28765869140625, "global_step": 459922, "epoch": 2737} {"train_loss": -12.488186836242676, "global_step": 459923, "epoch": 2737} {"train_loss": -12.430049896240234, "global_step": 459924, "epoch": 2737} {"train_loss": -12.58261489868164, "global_step": 459925, "epoch": 2737} {"train_loss": -12.57463264465332, "global_step": 459926, "epoch": 2737} {"train_loss": -12.520730972290039, "global_step": 459927, "epoch": 2737} {"train_loss": -12.154865264892578, "global_step": 459928, "epoch": 2737} {"train_loss": -12.62103271484375, "global_step": 459929, "epoch": 2737} {"train_loss": -12.653968811035156, "global_step": 459930, "epoch": 2737} {"train_loss": -12.363744735717773, "global_step": 459931, "epoch": 2737} {"train_loss": -12.725876808166504, "global_step": 459932, "epoch": 2737} {"train_loss": -12.117875099182129, "global_step": 459933, "epoch": 2737} {"train_loss": -12.662986755371094, "global_step": 459934, "epoch": 2737} {"train_loss": -11.914125442504883, "global_step": 459935, "epoch": 2737} {"train_loss": -12.527551651000977, "global_step": 459936, "epoch": 2737} {"train_loss": -12.460552215576172, "global_step": 459937, "epoch": 2737} {"train_loss": -12.394968032836914, "global_step": 459938, "epoch": 2737} {"train_loss": -12.653596878051758, "global_step": 459939, "epoch": 2737} {"train_loss": -12.340255737304688, "global_step": 459940, "epoch": 2737} {"train_loss": -12.357728958129883, "global_step": 459941, "epoch": 2737} {"train_loss": -12.351680755615234, "global_step": 459942, "epoch": 2737} {"train_loss": -12.557754516601562, "global_step": 459943, "epoch": 2737} {"train_loss": -12.603668212890625, "global_step": 459944, "epoch": 2737} {"train_loss": -12.378031730651855, "global_step": 459945, "epoch": 2737} {"train_loss": -12.608134269714355, "global_step": 459946, "epoch": 2737} {"train_loss": -12.470409393310547, "global_step": 459947, "epoch": 2737} {"train_loss": -12.346968650817871, "global_step": 459948, "epoch": 2737} {"train_loss": -12.465961456298828, "global_step": 459949, "epoch": 2737} {"train_loss": -12.352130889892578, "global_step": 459950, "epoch": 2737} {"train_loss": -12.07949161529541, "global_step": 459951, "epoch": 2737} {"train_loss": -12.761899948120117, "global_step": 459952, "epoch": 2737} {"train_loss": -11.92016887664795, "global_step": 459953, "epoch": 2737} {"train_loss": -12.675548553466797, "global_step": 459954, "epoch": 2737} {"train_loss": -12.242105484008789, "global_step": 459955, "epoch": 2737} {"train_loss": -12.616233825683594, "global_step": 459956, "epoch": 2737} {"train_loss": -12.704418182373047, "global_step": 459957, "epoch": 2737} {"train_loss": -12.399940490722656, "global_step": 459958, "epoch": 2737} {"train_loss": -12.542348861694336, "global_step": 459959, "epoch": 2737} {"train_loss": -12.468507766723633, "global_step": 459960, "epoch": 2737} {"train_loss": -12.256548881530762, "global_step": 459961, "epoch": 2737} {"train_loss": -11.587705612182617, "global_step": 459962, "epoch": 2737} {"train_loss": -12.171753883361816, "global_step": 459963, "epoch": 2737} {"train_loss": -12.19601821899414, "global_step": 459964, "epoch": 2737} {"train_loss": -11.946649551391602, "global_step": 459965, "epoch": 2737} {"train_loss": -11.85262393951416, "global_step": 459966, "epoch": 2737} {"train_loss": -12.431242942810059, "global_step": 459967, "epoch": 2737} {"train_loss": -12.307774543762207, "global_step": 459968, "epoch": 2737} {"train_loss": -11.688233375549316, "global_step": 459969, "epoch": 2737} {"train_loss": -12.120447158813477, "global_step": 459970, "epoch": 2737} {"train_loss": -12.395984649658203, "global_step": 459971, "epoch": 2737} {"train_loss": -11.770882606506348, "global_step": 459972, "epoch": 2737} {"train_loss": -12.267868041992188, "global_step": 459973, "epoch": 2737} {"train_loss": -11.371615409851074, "global_step": 459974, "epoch": 2737} {"train_loss": -11.583694458007812, "global_step": 459975, "epoch": 2737} {"train_loss": -11.854009628295898, "global_step": 459976, "epoch": 2737} {"train_loss": -11.935091018676758, "global_step": 459977, "epoch": 2737} {"train_loss": -11.514785766601562, "global_step": 459978, "epoch": 2737} {"train_loss": -12.09822940826416, "global_step": 459979, "epoch": 2737} {"train_loss": -12.22728157043457, "global_step": 459980, "epoch": 2737} {"train_loss": -11.371118545532227, "global_step": 459981, "epoch": 2737} {"train_loss": -12.292030334472656, "global_step": 459982, "epoch": 2737} {"train_loss": -12.033932430403572, "global_step": 459983, "epoch": 2737, "val_loss": 315283.75} {"train_loss": -12.442133903503418, "global_step": 459984, "epoch": 2738} {"train_loss": -10.806245803833008, "global_step": 459985, "epoch": 2738} {"train_loss": -11.802438735961914, "global_step": 459986, "epoch": 2738} {"train_loss": -12.016667366027832, "global_step": 459987, "epoch": 2738} {"train_loss": -11.408074378967285, "global_step": 459988, "epoch": 2738} {"train_loss": -11.624799728393555, "global_step": 459989, "epoch": 2738} {"train_loss": -12.131269454956055, "global_step": 459990, "epoch": 2738} {"train_loss": -11.325212478637695, "global_step": 459991, "epoch": 2738} {"train_loss": -12.225293159484863, "global_step": 459992, "epoch": 2738} {"train_loss": -11.509119033813477, "global_step": 459993, "epoch": 2738} {"train_loss": -12.434606552124023, "global_step": 459994, "epoch": 2738} {"train_loss": -12.145694732666016, "global_step": 459995, "epoch": 2738} {"train_loss": -11.739896774291992, "global_step": 459996, "epoch": 2738} {"train_loss": -12.170003890991211, "global_step": 459997, "epoch": 2738} {"train_loss": -10.981950759887695, "global_step": 459998, "epoch": 2738} {"train_loss": -11.219837188720703, "global_step": 459999, "epoch": 2738} {"train_loss": -11.350513458251953, "global_step": 460000, "epoch": 2738} {"train_loss": -11.562156677246094, "global_step": 460001, "epoch": 2738} {"train_loss": -11.51850700378418, "global_step": 460002, "epoch": 2738} {"train_loss": -12.085962295532227, "global_step": 460003, "epoch": 2738} {"train_loss": -11.918313980102539, "global_step": 460004, "epoch": 2738} {"train_loss": -12.127446174621582, "global_step": 460005, "epoch": 2738} {"train_loss": -12.177974700927734, "global_step": 460006, "epoch": 2738} {"train_loss": -12.169753074645996, "global_step": 460007, "epoch": 2738} {"train_loss": -12.066903114318848, "global_step": 460008, "epoch": 2738} {"train_loss": -12.589564323425293, "global_step": 460009, "epoch": 2738} {"train_loss": -12.007287979125977, "global_step": 460010, "epoch": 2738} {"train_loss": -12.05771541595459, "global_step": 460011, "epoch": 2738} {"train_loss": -12.318107604980469, "global_step": 460012, "epoch": 2738} {"train_loss": -12.048973083496094, "global_step": 460013, "epoch": 2738} {"train_loss": -12.589235305786133, "global_step": 460014, "epoch": 2738} {"train_loss": -12.3046293258667, "global_step": 460015, "epoch": 2738} {"train_loss": -12.322476387023926, "global_step": 460016, "epoch": 2738} {"train_loss": -12.44399356842041, "global_step": 460017, "epoch": 2738} {"train_loss": -12.375897407531738, "global_step": 460018, "epoch": 2738} {"train_loss": -12.353255271911621, "global_step": 460019, "epoch": 2738} {"train_loss": -12.316587448120117, "global_step": 460020, "epoch": 2738} {"train_loss": -11.87833023071289, "global_step": 460021, "epoch": 2738} {"train_loss": -12.261880874633789, "global_step": 460022, "epoch": 2738} {"train_loss": -12.152807235717773, "global_step": 460023, "epoch": 2738} {"train_loss": -12.458333969116211, "global_step": 460024, "epoch": 2738} {"train_loss": -12.187609672546387, "global_step": 460025, "epoch": 2738} {"train_loss": -12.28053092956543, "global_step": 460026, "epoch": 2738} {"train_loss": -12.361898422241211, "global_step": 460027, "epoch": 2738} {"train_loss": -12.38852596282959, "global_step": 460028, "epoch": 2738} {"train_loss": -12.338899612426758, "global_step": 460029, "epoch": 2738} {"train_loss": -12.350836753845215, "global_step": 460030, "epoch": 2738} {"train_loss": -12.226791381835938, "global_step": 460031, "epoch": 2738} {"train_loss": -12.323590278625488, "global_step": 460032, "epoch": 2738} {"train_loss": -11.776796340942383, "global_step": 460033, "epoch": 2738} {"train_loss": -11.04384708404541, "global_step": 460034, "epoch": 2738} {"train_loss": -12.128621101379395, "global_step": 460035, "epoch": 2738} {"train_loss": -10.439038276672363, "global_step": 460036, "epoch": 2738} {"train_loss": -12.253055572509766, "global_step": 460037, "epoch": 2738} {"train_loss": -11.970338821411133, "global_step": 460038, "epoch": 2738} {"train_loss": -11.506124496459961, "global_step": 460039, "epoch": 2738} {"train_loss": -12.443694114685059, "global_step": 460040, "epoch": 2738} {"train_loss": -11.572680473327637, "global_step": 460041, "epoch": 2738} {"train_loss": -12.409320831298828, "global_step": 460042, "epoch": 2738} {"train_loss": -11.446099281311035, "global_step": 460043, "epoch": 2738} {"train_loss": -12.333913803100586, "global_step": 460044, "epoch": 2738} {"train_loss": -11.351329803466797, "global_step": 460045, "epoch": 2738} {"train_loss": -11.832137107849121, "global_step": 460046, "epoch": 2738} {"train_loss": -11.461759567260742, "global_step": 460047, "epoch": 2738} {"train_loss": -12.245929718017578, "global_step": 460048, "epoch": 2738} {"train_loss": -11.357315063476562, "global_step": 460049, "epoch": 2738} {"train_loss": -11.141498565673828, "global_step": 460050, "epoch": 2738} {"train_loss": -11.52783489227295, "global_step": 460051, "epoch": 2738} {"train_loss": -11.442580223083496, "global_step": 460052, "epoch": 2738} {"train_loss": -11.123923301696777, "global_step": 460053, "epoch": 2738} {"train_loss": -12.137371063232422, "global_step": 460054, "epoch": 2738} {"train_loss": -11.707500457763672, "global_step": 460055, "epoch": 2738} {"train_loss": -11.864770889282227, "global_step": 460056, "epoch": 2738} {"train_loss": -12.264141082763672, "global_step": 460057, "epoch": 2738} {"train_loss": -11.784361839294434, "global_step": 460058, "epoch": 2738} {"train_loss": -12.25425910949707, "global_step": 460059, "epoch": 2738} {"train_loss": -11.758330345153809, "global_step": 460060, "epoch": 2738} {"train_loss": -11.792460441589355, "global_step": 460061, "epoch": 2738} {"train_loss": -12.059925079345703, "global_step": 460062, "epoch": 2738} {"train_loss": -11.522491455078125, "global_step": 460063, "epoch": 2738} {"train_loss": -12.226988792419434, "global_step": 460064, "epoch": 2738} {"train_loss": -11.99144172668457, "global_step": 460065, "epoch": 2738} {"train_loss": -11.844789505004883, "global_step": 460066, "epoch": 2738} {"train_loss": -12.293619155883789, "global_step": 460067, "epoch": 2738} {"train_loss": -12.004758834838867, "global_step": 460068, "epoch": 2738} {"train_loss": -12.20516586303711, "global_step": 460069, "epoch": 2738} {"train_loss": -11.856689453125, "global_step": 460070, "epoch": 2738} {"train_loss": -12.18655014038086, "global_step": 460071, "epoch": 2738} {"train_loss": -11.908023834228516, "global_step": 460072, "epoch": 2738} {"train_loss": -11.990078926086426, "global_step": 460073, "epoch": 2738} {"train_loss": -11.853677749633789, "global_step": 460074, "epoch": 2738} {"train_loss": -12.243081092834473, "global_step": 460075, "epoch": 2738} {"train_loss": -11.703094482421875, "global_step": 460076, "epoch": 2738} {"train_loss": -11.683353424072266, "global_step": 460077, "epoch": 2738} {"train_loss": -11.708356857299805, "global_step": 460078, "epoch": 2738} {"train_loss": -11.388127326965332, "global_step": 460079, "epoch": 2738} {"train_loss": -11.942115783691406, "global_step": 460080, "epoch": 2738} {"train_loss": -11.789205551147461, "global_step": 460081, "epoch": 2738} {"train_loss": -12.159109115600586, "global_step": 460082, "epoch": 2738} {"train_loss": -12.148258209228516, "global_step": 460083, "epoch": 2738} {"train_loss": -12.03734016418457, "global_step": 460084, "epoch": 2738} {"train_loss": -11.709367752075195, "global_step": 460085, "epoch": 2738} {"train_loss": -12.382678031921387, "global_step": 460086, "epoch": 2738} {"train_loss": -11.88136100769043, "global_step": 460087, "epoch": 2738} {"train_loss": -12.406030654907227, "global_step": 460088, "epoch": 2738} {"train_loss": -11.087732315063477, "global_step": 460089, "epoch": 2738} {"train_loss": -12.552841186523438, "global_step": 460090, "epoch": 2738} {"train_loss": -11.954541206359863, "global_step": 460091, "epoch": 2738} {"train_loss": -12.096867561340332, "global_step": 460092, "epoch": 2738} {"train_loss": -11.861034393310547, "global_step": 460093, "epoch": 2738} {"train_loss": -11.459709167480469, "global_step": 460094, "epoch": 2738} {"train_loss": -12.398065567016602, "global_step": 460095, "epoch": 2738} {"train_loss": -11.846561431884766, "global_step": 460096, "epoch": 2738} {"train_loss": -12.447811126708984, "global_step": 460097, "epoch": 2738} {"train_loss": -12.078454971313477, "global_step": 460098, "epoch": 2738} {"train_loss": -12.412040710449219, "global_step": 460099, "epoch": 2738} {"train_loss": -12.139167785644531, "global_step": 460100, "epoch": 2738} {"train_loss": -12.372952461242676, "global_step": 460101, "epoch": 2738} {"train_loss": -12.497213363647461, "global_step": 460102, "epoch": 2738} {"train_loss": -12.348236083984375, "global_step": 460103, "epoch": 2738} {"train_loss": -12.438570022583008, "global_step": 460104, "epoch": 2738} {"train_loss": -12.584023475646973, "global_step": 460105, "epoch": 2738} {"train_loss": -12.569860458374023, "global_step": 460106, "epoch": 2738} {"train_loss": -12.647751808166504, "global_step": 460107, "epoch": 2738} {"train_loss": -12.550995826721191, "global_step": 460108, "epoch": 2738} {"train_loss": -12.457437515258789, "global_step": 460109, "epoch": 2738} {"train_loss": -12.566320419311523, "global_step": 460110, "epoch": 2738} {"train_loss": -12.402961730957031, "global_step": 460111, "epoch": 2738} {"train_loss": -12.837345123291016, "global_step": 460112, "epoch": 2738} {"train_loss": -12.556690216064453, "global_step": 460113, "epoch": 2738} {"train_loss": -12.692955017089844, "global_step": 460114, "epoch": 2738} {"train_loss": -12.688169479370117, "global_step": 460115, "epoch": 2738} {"train_loss": -12.544904708862305, "global_step": 460116, "epoch": 2738} {"train_loss": -12.62309741973877, "global_step": 460117, "epoch": 2738} {"train_loss": -12.576885223388672, "global_step": 460118, "epoch": 2738} {"train_loss": -12.604951858520508, "global_step": 460119, "epoch": 2738} {"train_loss": -12.718154907226562, "global_step": 460120, "epoch": 2738} {"train_loss": -12.762746810913086, "global_step": 460121, "epoch": 2738} {"train_loss": -12.804651260375977, "global_step": 460122, "epoch": 2738} {"train_loss": -12.771429061889648, "global_step": 460123, "epoch": 2738} {"train_loss": -12.620491027832031, "global_step": 460124, "epoch": 2738} {"train_loss": -12.690430641174316, "global_step": 460125, "epoch": 2738} {"train_loss": -12.797195434570312, "global_step": 460126, "epoch": 2738} {"train_loss": -12.746466636657715, "global_step": 460127, "epoch": 2738} {"train_loss": -12.783440589904785, "global_step": 460128, "epoch": 2738} {"train_loss": -12.720600128173828, "global_step": 460129, "epoch": 2738} {"train_loss": -12.87258529663086, "global_step": 460130, "epoch": 2738} {"train_loss": -12.893418312072754, "global_step": 460131, "epoch": 2738} {"train_loss": -12.83862018585205, "global_step": 460132, "epoch": 2738} {"train_loss": -12.962689399719238, "global_step": 460133, "epoch": 2738} {"train_loss": -12.771527290344238, "global_step": 460134, "epoch": 2738} {"train_loss": -12.913936614990234, "global_step": 460135, "epoch": 2738} {"train_loss": -12.747228622436523, "global_step": 460136, "epoch": 2738} {"train_loss": -12.893416404724121, "global_step": 460137, "epoch": 2738} {"train_loss": -12.801639556884766, "global_step": 460138, "epoch": 2738} {"train_loss": -12.933845520019531, "global_step": 460139, "epoch": 2738} {"train_loss": -12.880854606628418, "global_step": 460140, "epoch": 2738} {"train_loss": -12.849318504333496, "global_step": 460141, "epoch": 2738} {"train_loss": -12.648908615112305, "global_step": 460142, "epoch": 2738} {"train_loss": -12.902628898620605, "global_step": 460143, "epoch": 2738} {"train_loss": -12.77559757232666, "global_step": 460144, "epoch": 2738} {"train_loss": -12.544249534606934, "global_step": 460145, "epoch": 2738} {"train_loss": -12.836512565612793, "global_step": 460146, "epoch": 2738} {"train_loss": -12.647516250610352, "global_step": 460147, "epoch": 2738} {"train_loss": -13.073516845703125, "global_step": 460148, "epoch": 2738} {"train_loss": -12.807820320129395, "global_step": 460149, "epoch": 2738} {"train_loss": -12.508301734924316, "global_step": 460150, "epoch": 2738} {"train_loss": -12.174763560295105, "global_step": 460151, "epoch": 2738, "val_loss": 314889.65625} {"train_loss": -12.874614715576172, "global_step": 460152, "epoch": 2739} {"train_loss": -12.512765884399414, "global_step": 460153, "epoch": 2739} {"train_loss": -12.8482027053833, "global_step": 460154, "epoch": 2739} {"train_loss": -12.844165802001953, "global_step": 460155, "epoch": 2739} {"train_loss": -12.576835632324219, "global_step": 460156, "epoch": 2739} {"train_loss": -12.527511596679688, "global_step": 460157, "epoch": 2739} {"train_loss": -12.907730102539062, "global_step": 460158, "epoch": 2739} {"train_loss": -12.900243759155273, "global_step": 460159, "epoch": 2739} {"train_loss": -12.721020698547363, "global_step": 460160, "epoch": 2739} {"train_loss": -13.052011489868164, "global_step": 460161, "epoch": 2739} {"train_loss": -12.777894973754883, "global_step": 460162, "epoch": 2739} {"train_loss": -12.41374397277832, "global_step": 460163, "epoch": 2739} {"train_loss": -12.624217987060547, "global_step": 460164, "epoch": 2739} {"train_loss": -12.982357025146484, "global_step": 460165, "epoch": 2739} {"train_loss": -12.826982498168945, "global_step": 460166, "epoch": 2739} {"train_loss": -12.838615417480469, "global_step": 460167, "epoch": 2739} {"train_loss": -12.721012115478516, "global_step": 460168, "epoch": 2739} {"train_loss": -12.888258934020996, "global_step": 460169, "epoch": 2739} {"train_loss": -12.478231430053711, "global_step": 460170, "epoch": 2739} {"train_loss": -12.798492431640625, "global_step": 460171, "epoch": 2739} {"train_loss": -12.817705154418945, "global_step": 460172, "epoch": 2739} {"train_loss": -12.699164390563965, "global_step": 460173, "epoch": 2739} {"train_loss": -12.898778915405273, "global_step": 460174, "epoch": 2739} {"train_loss": -12.686321258544922, "global_step": 460175, "epoch": 2739} {"train_loss": -13.085789680480957, "global_step": 460176, "epoch": 2739} {"train_loss": -12.9757080078125, "global_step": 460177, "epoch": 2739} {"train_loss": -12.590928077697754, "global_step": 460178, "epoch": 2739} {"train_loss": -12.83987808227539, "global_step": 460179, "epoch": 2739} {"train_loss": -12.540502548217773, "global_step": 460180, "epoch": 2739} {"train_loss": -12.636258125305176, "global_step": 460181, "epoch": 2739} {"train_loss": -12.187823295593262, "global_step": 460182, "epoch": 2739} {"train_loss": -12.215510368347168, "global_step": 460183, "epoch": 2739} {"train_loss": -12.431812286376953, "global_step": 460184, "epoch": 2739} {"train_loss": -12.798293113708496, "global_step": 460185, "epoch": 2739} {"train_loss": -12.347972869873047, "global_step": 460186, "epoch": 2739} {"train_loss": -12.364347457885742, "global_step": 460187, "epoch": 2739} {"train_loss": -12.301881790161133, "global_step": 460188, "epoch": 2739} {"train_loss": -12.731218338012695, "global_step": 460189, "epoch": 2739} {"train_loss": -12.417655944824219, "global_step": 460190, "epoch": 2739} {"train_loss": -12.283110618591309, "global_step": 460191, "epoch": 2739} {"train_loss": -12.312880516052246, "global_step": 460192, "epoch": 2739} {"train_loss": -12.0634126663208, "global_step": 460193, "epoch": 2739} {"train_loss": -11.997934341430664, "global_step": 460194, "epoch": 2739} {"train_loss": -11.309520721435547, "global_step": 460195, "epoch": 2739} {"train_loss": -12.408802032470703, "global_step": 460196, "epoch": 2739} {"train_loss": -11.985265731811523, "global_step": 460197, "epoch": 2739} {"train_loss": -12.412126541137695, "global_step": 460198, "epoch": 2739} {"train_loss": -11.976441383361816, "global_step": 460199, "epoch": 2739} {"train_loss": -12.31852912902832, "global_step": 460200, "epoch": 2739} {"train_loss": -12.639453887939453, "global_step": 460201, "epoch": 2739} {"train_loss": -11.903383255004883, "global_step": 460202, "epoch": 2739} {"train_loss": -11.986785888671875, "global_step": 460203, "epoch": 2739} {"train_loss": -12.277726173400879, "global_step": 460204, "epoch": 2739} {"train_loss": -10.946407318115234, "global_step": 460205, "epoch": 2739} {"train_loss": -10.30630111694336, "global_step": 460206, "epoch": 2739} {"train_loss": -9.369890213012695, "global_step": 460207, "epoch": 2739} {"train_loss": -11.457666397094727, "global_step": 460208, "epoch": 2739} {"train_loss": -8.93874740600586, "global_step": 460209, "epoch": 2739} {"train_loss": -10.200422286987305, "global_step": 460210, "epoch": 2739} {"train_loss": -11.976297378540039, "global_step": 460211, "epoch": 2739} {"train_loss": -9.644641876220703, "global_step": 460212, "epoch": 2739} {"train_loss": -11.029657363891602, "global_step": 460213, "epoch": 2739} {"train_loss": -11.61761474609375, "global_step": 460214, "epoch": 2739} {"train_loss": -10.21822452545166, "global_step": 460215, "epoch": 2739} {"train_loss": -9.963155746459961, "global_step": 460216, "epoch": 2739} {"train_loss": -11.3360595703125, "global_step": 460217, "epoch": 2739} {"train_loss": -10.682766914367676, "global_step": 460218, "epoch": 2739} {"train_loss": -11.819287300109863, "global_step": 460219, "epoch": 2739} {"train_loss": -10.464139938354492, "global_step": 460220, "epoch": 2739} {"train_loss": -9.50131607055664, "global_step": 460221, "epoch": 2739} {"train_loss": -10.42955207824707, "global_step": 460222, "epoch": 2739} {"train_loss": -10.362350463867188, "global_step": 460223, "epoch": 2739} {"train_loss": -9.778003692626953, "global_step": 460224, "epoch": 2739} {"train_loss": -10.815275192260742, "global_step": 460225, "epoch": 2739} {"train_loss": -11.274528503417969, "global_step": 460226, "epoch": 2739} {"train_loss": -11.302552223205566, "global_step": 460227, "epoch": 2739} {"train_loss": -10.739898681640625, "global_step": 460228, "epoch": 2739} {"train_loss": -11.069171905517578, "global_step": 460229, "epoch": 2739} {"train_loss": -11.103309631347656, "global_step": 460230, "epoch": 2739} {"train_loss": -11.096603393554688, "global_step": 460231, "epoch": 2739} {"train_loss": -11.876975059509277, "global_step": 460232, "epoch": 2739} {"train_loss": -11.313552856445312, "global_step": 460233, "epoch": 2739} {"train_loss": -11.637338638305664, "global_step": 460234, "epoch": 2739} {"train_loss": -11.608467102050781, "global_step": 460235, "epoch": 2739} {"train_loss": -11.817550659179688, "global_step": 460236, "epoch": 2739} {"train_loss": -11.915996551513672, "global_step": 460237, "epoch": 2739} {"train_loss": -11.5674467086792, "global_step": 460238, "epoch": 2739} {"train_loss": -12.094589233398438, "global_step": 460239, "epoch": 2739} {"train_loss": -12.009054183959961, "global_step": 460240, "epoch": 2739} {"train_loss": -12.025419235229492, "global_step": 460241, "epoch": 2739} {"train_loss": -12.23975944519043, "global_step": 460242, "epoch": 2739} {"train_loss": -11.773637771606445, "global_step": 460243, "epoch": 2739} {"train_loss": -12.361889839172363, "global_step": 460244, "epoch": 2739} {"train_loss": -12.104913711547852, "global_step": 460245, "epoch": 2739} {"train_loss": -12.01121711730957, "global_step": 460246, "epoch": 2739} {"train_loss": -12.211233139038086, "global_step": 460247, "epoch": 2739} {"train_loss": -12.10097885131836, "global_step": 460248, "epoch": 2739} {"train_loss": -12.372929573059082, "global_step": 460249, "epoch": 2739} {"train_loss": -12.165372848510742, "global_step": 460250, "epoch": 2739} {"train_loss": -12.16673469543457, "global_step": 460251, "epoch": 2739} {"train_loss": -12.323380470275879, "global_step": 460252, "epoch": 2739} {"train_loss": -11.744305610656738, "global_step": 460253, "epoch": 2739} {"train_loss": -12.501157760620117, "global_step": 460254, "epoch": 2739} {"train_loss": -12.07178783416748, "global_step": 460255, "epoch": 2739} {"train_loss": -12.367904663085938, "global_step": 460256, "epoch": 2739} {"train_loss": -12.300938606262207, "global_step": 460257, "epoch": 2739} {"train_loss": -12.058456420898438, "global_step": 460258, "epoch": 2739} {"train_loss": -12.371724128723145, "global_step": 460259, "epoch": 2739} {"train_loss": -11.963632583618164, "global_step": 460260, "epoch": 2739} {"train_loss": -12.577312469482422, "global_step": 460261, "epoch": 2739} {"train_loss": -12.095088958740234, "global_step": 460262, "epoch": 2739} {"train_loss": -12.386611938476562, "global_step": 460263, "epoch": 2739} {"train_loss": -12.280939102172852, "global_step": 460264, "epoch": 2739} {"train_loss": -12.108269691467285, "global_step": 460265, "epoch": 2739} {"train_loss": -12.606315612792969, "global_step": 460266, "epoch": 2739} {"train_loss": -12.298431396484375, "global_step": 460267, "epoch": 2739} {"train_loss": -12.183369636535645, "global_step": 460268, "epoch": 2739} {"train_loss": -12.454120635986328, "global_step": 460269, "epoch": 2739} {"train_loss": -11.973121643066406, "global_step": 460270, "epoch": 2739} {"train_loss": -12.81411075592041, "global_step": 460271, "epoch": 2739} {"train_loss": -12.426008224487305, "global_step": 460272, "epoch": 2739} {"train_loss": -12.398685455322266, "global_step": 460273, "epoch": 2739} {"train_loss": -12.741415023803711, "global_step": 460274, "epoch": 2739} {"train_loss": -12.644715309143066, "global_step": 460275, "epoch": 2739} {"train_loss": -12.676279067993164, "global_step": 460276, "epoch": 2739} {"train_loss": -12.679179191589355, "global_step": 460277, "epoch": 2739} {"train_loss": -12.502235412597656, "global_step": 460278, "epoch": 2739} {"train_loss": -12.543977737426758, "global_step": 460279, "epoch": 2739} {"train_loss": -12.759990692138672, "global_step": 460280, "epoch": 2739} {"train_loss": -12.865833282470703, "global_step": 460281, "epoch": 2739} {"train_loss": -12.642498016357422, "global_step": 460282, "epoch": 2739} {"train_loss": -12.938461303710938, "global_step": 460283, "epoch": 2739} {"train_loss": -12.472657203674316, "global_step": 460284, "epoch": 2739} {"train_loss": -12.588107109069824, "global_step": 460285, "epoch": 2739} {"train_loss": -12.641645431518555, "global_step": 460286, "epoch": 2739} {"train_loss": -12.873733520507812, "global_step": 460287, "epoch": 2739} {"train_loss": -12.653186798095703, "global_step": 460288, "epoch": 2739} {"train_loss": -12.822647094726562, "global_step": 460289, "epoch": 2739} {"train_loss": -12.731727600097656, "global_step": 460290, "epoch": 2739} {"train_loss": -12.628374099731445, "global_step": 460291, "epoch": 2739} {"train_loss": -12.683860778808594, "global_step": 460292, "epoch": 2739} {"train_loss": -12.624237060546875, "global_step": 460293, "epoch": 2739} {"train_loss": -12.655394554138184, "global_step": 460294, "epoch": 2739} {"train_loss": -12.756034851074219, "global_step": 460295, "epoch": 2739} {"train_loss": -12.725859642028809, "global_step": 460296, "epoch": 2739} {"train_loss": -12.505302429199219, "global_step": 460297, "epoch": 2739} {"train_loss": -12.986610412597656, "global_step": 460298, "epoch": 2739} {"train_loss": -12.794307708740234, "global_step": 460299, "epoch": 2739} {"train_loss": -12.54583740234375, "global_step": 460300, "epoch": 2739} {"train_loss": -12.936044692993164, "global_step": 460301, "epoch": 2739} {"train_loss": -12.814935684204102, "global_step": 460302, "epoch": 2739} {"train_loss": -12.940964698791504, "global_step": 460303, "epoch": 2739} {"train_loss": -12.860989570617676, "global_step": 460304, "epoch": 2739} {"train_loss": -12.762919425964355, "global_step": 460305, "epoch": 2739} {"train_loss": -12.983650207519531, "global_step": 460306, "epoch": 2739} {"train_loss": -12.83584976196289, "global_step": 460307, "epoch": 2739} {"train_loss": -12.85200023651123, "global_step": 460308, "epoch": 2739} {"train_loss": -12.873855590820312, "global_step": 460309, "epoch": 2739} {"train_loss": -12.90176010131836, "global_step": 460310, "epoch": 2739} {"train_loss": -12.819507598876953, "global_step": 460311, "epoch": 2739} {"train_loss": -13.058433532714844, "global_step": 460312, "epoch": 2739} {"train_loss": -12.854146957397461, "global_step": 460313, "epoch": 2739} {"train_loss": -13.061347961425781, "global_step": 460314, "epoch": 2739} {"train_loss": -12.798822402954102, "global_step": 460315, "epoch": 2739} {"train_loss": -13.15772819519043, "global_step": 460316, "epoch": 2739} {"train_loss": -13.011293411254883, "global_step": 460317, "epoch": 2739} {"train_loss": -13.033432006835938, "global_step": 460318, "epoch": 2739} {"train_loss": -12.201906045277914, "global_step": 460319, "epoch": 2739, "val_loss": 310145.0} {"train_loss": -12.987777709960938, "global_step": 460320, "epoch": 2740} {"train_loss": -13.095183372497559, "global_step": 460321, "epoch": 2740} {"train_loss": -12.987615585327148, "global_step": 460322, "epoch": 2740} {"train_loss": -13.094444274902344, "global_step": 460323, "epoch": 2740} {"train_loss": -13.078922271728516, "global_step": 460324, "epoch": 2740} {"train_loss": -12.983489036560059, "global_step": 460325, "epoch": 2740} {"train_loss": -12.900211334228516, "global_step": 460326, "epoch": 2740} {"train_loss": -12.999151229858398, "global_step": 460327, "epoch": 2740} {"train_loss": -13.037145614624023, "global_step": 460328, "epoch": 2740} {"train_loss": -12.840059280395508, "global_step": 460329, "epoch": 2740} {"train_loss": -12.913585662841797, "global_step": 460330, "epoch": 2740} {"train_loss": -12.746917724609375, "global_step": 460331, "epoch": 2740} {"train_loss": -13.037227630615234, "global_step": 460332, "epoch": 2740} {"train_loss": -12.773749351501465, "global_step": 460333, "epoch": 2740} {"train_loss": -12.90597152709961, "global_step": 460334, "epoch": 2740} {"train_loss": -12.905430793762207, "global_step": 460335, "epoch": 2740} {"train_loss": -12.518774032592773, "global_step": 460336, "epoch": 2740} {"train_loss": -12.444879531860352, "global_step": 460337, "epoch": 2740} {"train_loss": -12.25357437133789, "global_step": 460338, "epoch": 2740} {"train_loss": -12.208049774169922, "global_step": 460339, "epoch": 2740} {"train_loss": -11.054852485656738, "global_step": 460340, "epoch": 2740} {"train_loss": -12.45840072631836, "global_step": 460341, "epoch": 2740} {"train_loss": -10.276506423950195, "global_step": 460342, "epoch": 2740} {"train_loss": -10.257852554321289, "global_step": 460343, "epoch": 2740} {"train_loss": -11.807661056518555, "global_step": 460344, "epoch": 2740} {"train_loss": -9.203989028930664, "global_step": 460345, "epoch": 2740} {"train_loss": -10.174903869628906, "global_step": 460346, "epoch": 2740} {"train_loss": -12.264131546020508, "global_step": 460347, "epoch": 2740} {"train_loss": -10.241235733032227, "global_step": 460348, "epoch": 2740} {"train_loss": -12.067652702331543, "global_step": 460349, "epoch": 2740} {"train_loss": -10.05040454864502, "global_step": 460350, "epoch": 2740} {"train_loss": -12.211389541625977, "global_step": 460351, "epoch": 2740} {"train_loss": -10.745532035827637, "global_step": 460352, "epoch": 2740} {"train_loss": -9.294279098510742, "global_step": 460353, "epoch": 2740} {"train_loss": -8.249250411987305, "global_step": 460354, "epoch": 2740} {"train_loss": -9.504410743713379, "global_step": 460355, "epoch": 2740} {"train_loss": -6.212311744689941, "global_step": 460356, "epoch": 2740} {"train_loss": -5.895247459411621, "global_step": 460357, "epoch": 2740} {"train_loss": -4.118541717529297, "global_step": 460358, "epoch": 2740} {"train_loss": -4.6070146560668945, "global_step": 460359, "epoch": 2740} {"train_loss": -5.851612091064453, "global_step": 460360, "epoch": 2740} {"train_loss": -6.199831008911133, "global_step": 460361, "epoch": 2740} {"train_loss": -7.046600818634033, "global_step": 460362, "epoch": 2740} {"train_loss": -6.400688171386719, "global_step": 460363, "epoch": 2740} {"train_loss": -6.470119476318359, "global_step": 460364, "epoch": 2740} {"train_loss": -6.7339348793029785, "global_step": 460365, "epoch": 2740} {"train_loss": -6.695322513580322, "global_step": 460366, "epoch": 2740} {"train_loss": -6.565089225769043, "global_step": 460367, "epoch": 2740} {"train_loss": -7.033603668212891, "global_step": 460368, "epoch": 2740} {"train_loss": -7.562595367431641, "global_step": 460369, "epoch": 2740} {"train_loss": -6.622550964355469, "global_step": 460370, "epoch": 2740} {"train_loss": -7.458840370178223, "global_step": 460371, "epoch": 2740} {"train_loss": -7.8582353591918945, "global_step": 460372, "epoch": 2740} {"train_loss": -7.942259788513184, "global_step": 460373, "epoch": 2740} {"train_loss": -7.421347618103027, "global_step": 460374, "epoch": 2740} {"train_loss": -8.095169067382812, "global_step": 460375, "epoch": 2740} {"train_loss": -8.302436828613281, "global_step": 460376, "epoch": 2740} {"train_loss": -8.52729320526123, "global_step": 460377, "epoch": 2740} {"train_loss": -9.030248641967773, "global_step": 460378, "epoch": 2740} {"train_loss": -9.44808578491211, "global_step": 460379, "epoch": 2740} {"train_loss": -9.55129623413086, "global_step": 460380, "epoch": 2740} {"train_loss": -9.666753768920898, "global_step": 460381, "epoch": 2740} {"train_loss": -9.717811584472656, "global_step": 460382, "epoch": 2740} {"train_loss": -9.648702621459961, "global_step": 460383, "epoch": 2740} {"train_loss": -9.677167892456055, "global_step": 460384, "epoch": 2740} {"train_loss": -9.869389533996582, "global_step": 460385, "epoch": 2740} {"train_loss": -10.4502534866333, "global_step": 460386, "epoch": 2740} {"train_loss": -10.778446197509766, "global_step": 460387, "epoch": 2740} {"train_loss": -10.524934768676758, "global_step": 460388, "epoch": 2740} {"train_loss": -10.465822219848633, "global_step": 460389, "epoch": 2740} {"train_loss": -10.536197662353516, "global_step": 460390, "epoch": 2740} {"train_loss": -11.155349731445312, "global_step": 460391, "epoch": 2740} {"train_loss": -10.826227188110352, "global_step": 460392, "epoch": 2740} {"train_loss": -11.181373596191406, "global_step": 460393, "epoch": 2740} {"train_loss": -11.077239990234375, "global_step": 460394, "epoch": 2740} {"train_loss": -11.361942291259766, "global_step": 460395, "epoch": 2740} {"train_loss": -11.325579643249512, "global_step": 460396, "epoch": 2740} {"train_loss": -11.390129089355469, "global_step": 460397, "epoch": 2740} {"train_loss": -11.49421501159668, "global_step": 460398, "epoch": 2740} {"train_loss": -11.411918640136719, "global_step": 460399, "epoch": 2740} {"train_loss": -11.648235321044922, "global_step": 460400, "epoch": 2740} {"train_loss": -11.781569480895996, "global_step": 460401, "epoch": 2740} {"train_loss": -11.389328002929688, "global_step": 460402, "epoch": 2740} {"train_loss": -11.823455810546875, "global_step": 460403, "epoch": 2740} {"train_loss": -11.864063262939453, "global_step": 460404, "epoch": 2740} {"train_loss": -11.620424270629883, "global_step": 460405, "epoch": 2740} {"train_loss": -12.204940795898438, "global_step": 460406, "epoch": 2740} {"train_loss": -11.826764106750488, "global_step": 460407, "epoch": 2740} {"train_loss": -11.574295043945312, "global_step": 460408, "epoch": 2740} {"train_loss": -12.088525772094727, "global_step": 460409, "epoch": 2740} {"train_loss": -11.578425407409668, "global_step": 460410, "epoch": 2740} {"train_loss": -11.850406646728516, "global_step": 460411, "epoch": 2740} {"train_loss": -11.729169845581055, "global_step": 460412, "epoch": 2740} {"train_loss": -11.706977844238281, "global_step": 460413, "epoch": 2740} {"train_loss": -11.433557510375977, "global_step": 460414, "epoch": 2740} {"train_loss": -11.693519592285156, "global_step": 460415, "epoch": 2740} {"train_loss": -11.664434432983398, "global_step": 460416, "epoch": 2740} {"train_loss": -11.984027862548828, "global_step": 460417, "epoch": 2740} {"train_loss": -11.937715530395508, "global_step": 460418, "epoch": 2740} {"train_loss": -11.68685531616211, "global_step": 460419, "epoch": 2740} {"train_loss": -11.991680145263672, "global_step": 460420, "epoch": 2740} {"train_loss": -12.004953384399414, "global_step": 460421, "epoch": 2740} {"train_loss": -11.6517333984375, "global_step": 460422, "epoch": 2740} {"train_loss": -12.368091583251953, "global_step": 460423, "epoch": 2740} {"train_loss": -11.952291488647461, "global_step": 460424, "epoch": 2740} {"train_loss": -12.347813606262207, "global_step": 460425, "epoch": 2740} {"train_loss": -11.980244636535645, "global_step": 460426, "epoch": 2740} {"train_loss": -12.368429183959961, "global_step": 460427, "epoch": 2740} {"train_loss": -11.668243408203125, "global_step": 460428, "epoch": 2740} {"train_loss": -12.189011573791504, "global_step": 460429, "epoch": 2740} {"train_loss": -11.956398010253906, "global_step": 460430, "epoch": 2740} {"train_loss": -12.301950454711914, "global_step": 460431, "epoch": 2740} {"train_loss": -12.356910705566406, "global_step": 460432, "epoch": 2740} {"train_loss": -12.133859634399414, "global_step": 460433, "epoch": 2740} {"train_loss": -12.351733207702637, "global_step": 460434, "epoch": 2740} {"train_loss": -11.99699592590332, "global_step": 460435, "epoch": 2740} {"train_loss": -12.539896965026855, "global_step": 460436, "epoch": 2740} {"train_loss": -12.196847915649414, "global_step": 460437, "epoch": 2740} {"train_loss": -12.323476791381836, "global_step": 460438, "epoch": 2740} {"train_loss": -12.397268295288086, "global_step": 460439, "epoch": 2740} {"train_loss": -12.266927719116211, "global_step": 460440, "epoch": 2740} {"train_loss": -12.376075744628906, "global_step": 460441, "epoch": 2740} {"train_loss": -12.405723571777344, "global_step": 460442, "epoch": 2740} {"train_loss": -12.238042831420898, "global_step": 460443, "epoch": 2740} {"train_loss": -12.499526977539062, "global_step": 460444, "epoch": 2740} {"train_loss": -12.464133262634277, "global_step": 460445, "epoch": 2740} {"train_loss": -12.433615684509277, "global_step": 460446, "epoch": 2740} {"train_loss": -12.322687149047852, "global_step": 460447, "epoch": 2740} {"train_loss": -12.462236404418945, "global_step": 460448, "epoch": 2740} {"train_loss": -12.829044342041016, "global_step": 460449, "epoch": 2740} {"train_loss": -12.538620948791504, "global_step": 460450, "epoch": 2740} {"train_loss": -12.439037322998047, "global_step": 460451, "epoch": 2740} {"train_loss": -12.676441192626953, "global_step": 460452, "epoch": 2740} {"train_loss": -12.612176895141602, "global_step": 460453, "epoch": 2740} {"train_loss": -12.580937385559082, "global_step": 460454, "epoch": 2740} {"train_loss": -12.424727439880371, "global_step": 460455, "epoch": 2740} {"train_loss": -12.525806427001953, "global_step": 460456, "epoch": 2740} {"train_loss": -12.745315551757812, "global_step": 460457, "epoch": 2740} {"train_loss": -12.640999794006348, "global_step": 460458, "epoch": 2740} {"train_loss": -12.74189567565918, "global_step": 460459, "epoch": 2740} {"train_loss": -12.698988914489746, "global_step": 460460, "epoch": 2740} {"train_loss": -12.704999923706055, "global_step": 460461, "epoch": 2740} {"train_loss": -12.594575881958008, "global_step": 460462, "epoch": 2740} {"train_loss": -12.66893196105957, "global_step": 460463, "epoch": 2740} {"train_loss": -12.718060493469238, "global_step": 460464, "epoch": 2740} {"train_loss": -12.666669845581055, "global_step": 460465, "epoch": 2740} {"train_loss": -12.670875549316406, "global_step": 460466, "epoch": 2740} {"train_loss": -12.548845291137695, "global_step": 460467, "epoch": 2740} {"train_loss": -12.683588027954102, "global_step": 460468, "epoch": 2740} {"train_loss": -12.664657592773438, "global_step": 460469, "epoch": 2740} {"train_loss": -12.275003433227539, "global_step": 460470, "epoch": 2740} {"train_loss": -12.527692794799805, "global_step": 460471, "epoch": 2740} {"train_loss": -12.535554885864258, "global_step": 460472, "epoch": 2740} {"train_loss": -11.508956909179688, "global_step": 460473, "epoch": 2740} {"train_loss": -11.842872619628906, "global_step": 460474, "epoch": 2740} {"train_loss": -12.776846885681152, "global_step": 460475, "epoch": 2740} {"train_loss": -11.653963088989258, "global_step": 460476, "epoch": 2740} {"train_loss": -12.661396026611328, "global_step": 460477, "epoch": 2740} {"train_loss": -12.26925277709961, "global_step": 460478, "epoch": 2740} {"train_loss": -11.592588424682617, "global_step": 460479, "epoch": 2740} {"train_loss": -12.872711181640625, "global_step": 460480, "epoch": 2740} {"train_loss": -12.194239616394043, "global_step": 460481, "epoch": 2740} {"train_loss": -10.814535140991211, "global_step": 460482, "epoch": 2740} {"train_loss": -12.627580642700195, "global_step": 460483, "epoch": 2740} {"train_loss": -9.561147689819336, "global_step": 460484, "epoch": 2740} {"train_loss": -11.687370300292969, "global_step": 460485, "epoch": 2740} {"train_loss": -10.564061164855957, "global_step": 460486, "epoch": 2740} {"train_loss": -11.15989620628811, "global_step": 460487, "epoch": 2740, "val_loss": 313333.375, "train_action_mse_error": 3.0552546977996826} {"train_loss": -9.849466323852539, "global_step": 460488, "epoch": 2741} {"train_loss": -12.169637680053711, "global_step": 460489, "epoch": 2741} {"train_loss": -11.518762588500977, "global_step": 460490, "epoch": 2741} {"train_loss": -11.254106521606445, "global_step": 460491, "epoch": 2741} {"train_loss": -11.989137649536133, "global_step": 460492, "epoch": 2741} {"train_loss": -9.828020095825195, "global_step": 460493, "epoch": 2741} {"train_loss": -11.939764022827148, "global_step": 460494, "epoch": 2741} {"train_loss": -11.041955947875977, "global_step": 460495, "epoch": 2741} {"train_loss": -10.739774703979492, "global_step": 460496, "epoch": 2741} {"train_loss": -10.491403579711914, "global_step": 460497, "epoch": 2741} {"train_loss": -10.20351791381836, "global_step": 460498, "epoch": 2741} {"train_loss": -10.258865356445312, "global_step": 460499, "epoch": 2741} {"train_loss": -11.961281776428223, "global_step": 460500, "epoch": 2741} {"train_loss": -10.54857063293457, "global_step": 460501, "epoch": 2741} {"train_loss": -11.687789916992188, "global_step": 460502, "epoch": 2741} {"train_loss": -11.064196586608887, "global_step": 460503, "epoch": 2741} {"train_loss": -11.700738906860352, "global_step": 460504, "epoch": 2741} {"train_loss": -11.806447982788086, "global_step": 460505, "epoch": 2741} {"train_loss": -11.653337478637695, "global_step": 460506, "epoch": 2741} {"train_loss": -11.804193496704102, "global_step": 460507, "epoch": 2741} {"train_loss": -11.938058853149414, "global_step": 460508, "epoch": 2741} {"train_loss": -11.870107650756836, "global_step": 460509, "epoch": 2741} {"train_loss": -12.290369033813477, "global_step": 460510, "epoch": 2741} {"train_loss": -11.541833877563477, "global_step": 460511, "epoch": 2741} {"train_loss": -11.720863342285156, "global_step": 460512, "epoch": 2741} {"train_loss": -11.717266082763672, "global_step": 460513, "epoch": 2741} {"train_loss": -11.081172943115234, "global_step": 460514, "epoch": 2741} {"train_loss": -11.930767059326172, "global_step": 460515, "epoch": 2741} {"train_loss": -11.602191925048828, "global_step": 460516, "epoch": 2741} {"train_loss": -11.525715827941895, "global_step": 460517, "epoch": 2741} {"train_loss": -11.990880966186523, "global_step": 460518, "epoch": 2741} {"train_loss": -11.933294296264648, "global_step": 460519, "epoch": 2741} {"train_loss": -11.100088119506836, "global_step": 460520, "epoch": 2741} {"train_loss": -11.76165771484375, "global_step": 460521, "epoch": 2741} {"train_loss": -11.645263671875, "global_step": 460522, "epoch": 2741} {"train_loss": -11.319275856018066, "global_step": 460523, "epoch": 2741} {"train_loss": -11.676603317260742, "global_step": 460524, "epoch": 2741} {"train_loss": -12.011848449707031, "global_step": 460525, "epoch": 2741} {"train_loss": -11.692635536193848, "global_step": 460526, "epoch": 2741} {"train_loss": -11.955289840698242, "global_step": 460527, "epoch": 2741} {"train_loss": -11.390438079833984, "global_step": 460528, "epoch": 2741} {"train_loss": -11.581893920898438, "global_step": 460529, "epoch": 2741} {"train_loss": -11.597394943237305, "global_step": 460530, "epoch": 2741} {"train_loss": -11.909818649291992, "global_step": 460531, "epoch": 2741} {"train_loss": -11.521469116210938, "global_step": 460532, "epoch": 2741} {"train_loss": -11.965818405151367, "global_step": 460533, "epoch": 2741} {"train_loss": -11.719544410705566, "global_step": 460534, "epoch": 2741} {"train_loss": -12.038488388061523, "global_step": 460535, "epoch": 2741} {"train_loss": -12.122679710388184, "global_step": 460536, "epoch": 2741} {"train_loss": -11.88840103149414, "global_step": 460537, "epoch": 2741} {"train_loss": -12.49449348449707, "global_step": 460538, "epoch": 2741} {"train_loss": -12.008495330810547, "global_step": 460539, "epoch": 2741} {"train_loss": -12.288053512573242, "global_step": 460540, "epoch": 2741} {"train_loss": -12.220060348510742, "global_step": 460541, "epoch": 2741} {"train_loss": -12.248308181762695, "global_step": 460542, "epoch": 2741} {"train_loss": -12.448575019836426, "global_step": 460543, "epoch": 2741} {"train_loss": -12.444768905639648, "global_step": 460544, "epoch": 2741} {"train_loss": -12.557361602783203, "global_step": 460545, "epoch": 2741} {"train_loss": -12.280064582824707, "global_step": 460546, "epoch": 2741} {"train_loss": -12.302350997924805, "global_step": 460547, "epoch": 2741} {"train_loss": -12.355390548706055, "global_step": 460548, "epoch": 2741} {"train_loss": -12.484479904174805, "global_step": 460549, "epoch": 2741} {"train_loss": -12.626361846923828, "global_step": 460550, "epoch": 2741} {"train_loss": -12.604938507080078, "global_step": 460551, "epoch": 2741} {"train_loss": -12.557552337646484, "global_step": 460552, "epoch": 2741} {"train_loss": -12.534912109375, "global_step": 460553, "epoch": 2741} {"train_loss": -12.590486526489258, "global_step": 460554, "epoch": 2741} {"train_loss": -12.674161911010742, "global_step": 460555, "epoch": 2741} {"train_loss": -12.823665618896484, "global_step": 460556, "epoch": 2741} {"train_loss": -12.708707809448242, "global_step": 460557, "epoch": 2741} {"train_loss": -12.684669494628906, "global_step": 460558, "epoch": 2741} {"train_loss": -12.725496292114258, "global_step": 460559, "epoch": 2741} {"train_loss": -12.742693901062012, "global_step": 460560, "epoch": 2741} {"train_loss": -12.617462158203125, "global_step": 460561, "epoch": 2741} {"train_loss": -12.753846168518066, "global_step": 460562, "epoch": 2741} {"train_loss": -12.715152740478516, "global_step": 460563, "epoch": 2741} {"train_loss": -12.78135871887207, "global_step": 460564, "epoch": 2741} {"train_loss": -12.843119621276855, "global_step": 460565, "epoch": 2741} {"train_loss": -12.783224105834961, "global_step": 460566, "epoch": 2741} {"train_loss": -12.755016326904297, "global_step": 460567, "epoch": 2741} {"train_loss": -12.707258224487305, "global_step": 460568, "epoch": 2741} {"train_loss": -12.83581256866455, "global_step": 460569, "epoch": 2741} {"train_loss": -12.755781173706055, "global_step": 460570, "epoch": 2741} {"train_loss": -12.954164505004883, "global_step": 460571, "epoch": 2741} {"train_loss": -12.572832107543945, "global_step": 460572, "epoch": 2741} {"train_loss": -12.625993728637695, "global_step": 460573, "epoch": 2741} {"train_loss": -12.770563125610352, "global_step": 460574, "epoch": 2741} {"train_loss": -12.893730163574219, "global_step": 460575, "epoch": 2741} {"train_loss": -12.580862998962402, "global_step": 460576, "epoch": 2741} {"train_loss": -12.687662124633789, "global_step": 460577, "epoch": 2741} {"train_loss": -12.835023880004883, "global_step": 460578, "epoch": 2741} {"train_loss": -12.57261848449707, "global_step": 460579, "epoch": 2741} {"train_loss": -12.754793167114258, "global_step": 460580, "epoch": 2741} {"train_loss": -12.715102195739746, "global_step": 460581, "epoch": 2741} {"train_loss": -13.002623558044434, "global_step": 460582, "epoch": 2741} {"train_loss": -12.646865844726562, "global_step": 460583, "epoch": 2741} {"train_loss": -12.924735069274902, "global_step": 460584, "epoch": 2741} {"train_loss": -12.73221492767334, "global_step": 460585, "epoch": 2741} {"train_loss": -12.78399658203125, "global_step": 460586, "epoch": 2741} {"train_loss": -12.855018615722656, "global_step": 460587, "epoch": 2741} {"train_loss": -12.61793327331543, "global_step": 460588, "epoch": 2741} {"train_loss": -12.361659049987793, "global_step": 460589, "epoch": 2741} {"train_loss": -12.792779922485352, "global_step": 460590, "epoch": 2741} {"train_loss": -12.520196914672852, "global_step": 460591, "epoch": 2741} {"train_loss": -12.958410263061523, "global_step": 460592, "epoch": 2741} {"train_loss": -12.309450149536133, "global_step": 460593, "epoch": 2741} {"train_loss": -12.605168342590332, "global_step": 460594, "epoch": 2741} {"train_loss": -12.742621421813965, "global_step": 460595, "epoch": 2741} {"train_loss": -12.594282150268555, "global_step": 460596, "epoch": 2741} {"train_loss": -12.276700973510742, "global_step": 460597, "epoch": 2741} {"train_loss": -12.69218635559082, "global_step": 460598, "epoch": 2741} {"train_loss": -12.634756088256836, "global_step": 460599, "epoch": 2741} {"train_loss": -13.007030487060547, "global_step": 460600, "epoch": 2741} {"train_loss": -12.531333923339844, "global_step": 460601, "epoch": 2741} {"train_loss": -12.074014663696289, "global_step": 460602, "epoch": 2741} {"train_loss": -12.578533172607422, "global_step": 460603, "epoch": 2741} {"train_loss": -12.634950637817383, "global_step": 460604, "epoch": 2741} {"train_loss": -11.991907119750977, "global_step": 460605, "epoch": 2741} {"train_loss": -12.316036224365234, "global_step": 460606, "epoch": 2741} {"train_loss": -10.746522903442383, "global_step": 460607, "epoch": 2741} {"train_loss": -11.9431791305542, "global_step": 460608, "epoch": 2741} {"train_loss": -11.937808990478516, "global_step": 460609, "epoch": 2741} {"train_loss": -9.794711112976074, "global_step": 460610, "epoch": 2741} {"train_loss": -11.813770294189453, "global_step": 460611, "epoch": 2741} {"train_loss": -12.459590911865234, "global_step": 460612, "epoch": 2741} {"train_loss": -11.37397289276123, "global_step": 460613, "epoch": 2741} {"train_loss": -11.748580932617188, "global_step": 460614, "epoch": 2741} {"train_loss": -10.374144554138184, "global_step": 460615, "epoch": 2741} {"train_loss": -12.311345100402832, "global_step": 460616, "epoch": 2741} {"train_loss": -11.2600736618042, "global_step": 460617, "epoch": 2741} {"train_loss": -12.076983451843262, "global_step": 460618, "epoch": 2741} {"train_loss": -12.052114486694336, "global_step": 460619, "epoch": 2741} {"train_loss": -11.501566886901855, "global_step": 460620, "epoch": 2741} {"train_loss": -12.354918479919434, "global_step": 460621, "epoch": 2741} {"train_loss": -11.893699645996094, "global_step": 460622, "epoch": 2741} {"train_loss": -11.980836868286133, "global_step": 460623, "epoch": 2741} {"train_loss": -12.311895370483398, "global_step": 460624, "epoch": 2741} {"train_loss": -11.998080253601074, "global_step": 460625, "epoch": 2741} {"train_loss": -11.916720390319824, "global_step": 460626, "epoch": 2741} {"train_loss": -12.125052452087402, "global_step": 460627, "epoch": 2741} {"train_loss": -11.800086975097656, "global_step": 460628, "epoch": 2741} {"train_loss": -11.91452693939209, "global_step": 460629, "epoch": 2741} {"train_loss": -12.522274017333984, "global_step": 460630, "epoch": 2741} {"train_loss": -11.767354011535645, "global_step": 460631, "epoch": 2741} {"train_loss": -12.36424446105957, "global_step": 460632, "epoch": 2741} {"train_loss": -12.407655715942383, "global_step": 460633, "epoch": 2741} {"train_loss": -12.149266242980957, "global_step": 460634, "epoch": 2741} {"train_loss": -12.63563060760498, "global_step": 460635, "epoch": 2741} {"train_loss": -11.946647644042969, "global_step": 460636, "epoch": 2741} {"train_loss": -12.344884872436523, "global_step": 460637, "epoch": 2741} {"train_loss": -12.371219635009766, "global_step": 460638, "epoch": 2741} {"train_loss": -12.090486526489258, "global_step": 460639, "epoch": 2741} {"train_loss": -12.482338905334473, "global_step": 460640, "epoch": 2741} {"train_loss": -12.273483276367188, "global_step": 460641, "epoch": 2741} {"train_loss": -11.668561935424805, "global_step": 460642, "epoch": 2741} {"train_loss": -12.668926239013672, "global_step": 460643, "epoch": 2741} {"train_loss": -12.24180793762207, "global_step": 460644, "epoch": 2741} {"train_loss": -12.156673431396484, "global_step": 460645, "epoch": 2741} {"train_loss": -11.76390266418457, "global_step": 460646, "epoch": 2741} {"train_loss": -11.209463119506836, "global_step": 460647, "epoch": 2741} {"train_loss": -12.421339988708496, "global_step": 460648, "epoch": 2741} {"train_loss": -11.698458671569824, "global_step": 460649, "epoch": 2741} {"train_loss": -11.246988296508789, "global_step": 460650, "epoch": 2741} {"train_loss": -11.690073013305664, "global_step": 460651, "epoch": 2741} {"train_loss": -11.997008323669434, "global_step": 460652, "epoch": 2741} {"train_loss": -12.385883331298828, "global_step": 460653, "epoch": 2741} {"train_loss": -11.906496047973633, "global_step": 460654, "epoch": 2741} {"train_loss": -12.085336100487481, "global_step": 460655, "epoch": 2741, "val_loss": 313854.71875} {"train_loss": -12.732084274291992, "global_step": 460656, "epoch": 2742} {"train_loss": -11.853611946105957, "global_step": 460657, "epoch": 2742} {"train_loss": -12.225929260253906, "global_step": 460658, "epoch": 2742} {"train_loss": -12.352046012878418, "global_step": 460659, "epoch": 2742} {"train_loss": -11.165142059326172, "global_step": 460660, "epoch": 2742} {"train_loss": -11.762943267822266, "global_step": 460661, "epoch": 2742} {"train_loss": -12.005989074707031, "global_step": 460662, "epoch": 2742} {"train_loss": -11.777173042297363, "global_step": 460663, "epoch": 2742} {"train_loss": -11.488624572753906, "global_step": 460664, "epoch": 2742} {"train_loss": -11.483477592468262, "global_step": 460665, "epoch": 2742} {"train_loss": -12.34056282043457, "global_step": 460666, "epoch": 2742} {"train_loss": -11.97320556640625, "global_step": 460667, "epoch": 2742} {"train_loss": -11.749373435974121, "global_step": 460668, "epoch": 2742} {"train_loss": -11.884584426879883, "global_step": 460669, "epoch": 2742} {"train_loss": -11.44593620300293, "global_step": 460670, "epoch": 2742} {"train_loss": -11.718954086303711, "global_step": 460671, "epoch": 2742} {"train_loss": -11.387332916259766, "global_step": 460672, "epoch": 2742} {"train_loss": -12.151063919067383, "global_step": 460673, "epoch": 2742} {"train_loss": -12.177854537963867, "global_step": 460674, "epoch": 2742} {"train_loss": -11.618350982666016, "global_step": 460675, "epoch": 2742} {"train_loss": -12.370599746704102, "global_step": 460676, "epoch": 2742} {"train_loss": -11.791879653930664, "global_step": 460677, "epoch": 2742} {"train_loss": -12.017284393310547, "global_step": 460678, "epoch": 2742} {"train_loss": -12.416387557983398, "global_step": 460679, "epoch": 2742} {"train_loss": -12.40027904510498, "global_step": 460680, "epoch": 2742} {"train_loss": -12.593488693237305, "global_step": 460681, "epoch": 2742} {"train_loss": -12.388727188110352, "global_step": 460682, "epoch": 2742} {"train_loss": -12.797765731811523, "global_step": 460683, "epoch": 2742} {"train_loss": -12.473898887634277, "global_step": 460684, "epoch": 2742} {"train_loss": -12.640270233154297, "global_step": 460685, "epoch": 2742} {"train_loss": -12.276569366455078, "global_step": 460686, "epoch": 2742} {"train_loss": -12.700634002685547, "global_step": 460687, "epoch": 2742} {"train_loss": -12.429412841796875, "global_step": 460688, "epoch": 2742} {"train_loss": -12.29519271850586, "global_step": 460689, "epoch": 2742} {"train_loss": -12.545326232910156, "global_step": 460690, "epoch": 2742} {"train_loss": -12.237489700317383, "global_step": 460691, "epoch": 2742} {"train_loss": -12.52065372467041, "global_step": 460692, "epoch": 2742} {"train_loss": -11.973243713378906, "global_step": 460693, "epoch": 2742} {"train_loss": -12.639312744140625, "global_step": 460694, "epoch": 2742} {"train_loss": -12.523788452148438, "global_step": 460695, "epoch": 2742} {"train_loss": -12.185455322265625, "global_step": 460696, "epoch": 2742} {"train_loss": -12.686910629272461, "global_step": 460697, "epoch": 2742} {"train_loss": -12.291980743408203, "global_step": 460698, "epoch": 2742} {"train_loss": -12.79996395111084, "global_step": 460699, "epoch": 2742} {"train_loss": -12.458998680114746, "global_step": 460700, "epoch": 2742} {"train_loss": -12.622062683105469, "global_step": 460701, "epoch": 2742} {"train_loss": -12.523558616638184, "global_step": 460702, "epoch": 2742} {"train_loss": -12.325002670288086, "global_step": 460703, "epoch": 2742} {"train_loss": -12.39915657043457, "global_step": 460704, "epoch": 2742} {"train_loss": -12.433492660522461, "global_step": 460705, "epoch": 2742} {"train_loss": -12.509239196777344, "global_step": 460706, "epoch": 2742} {"train_loss": -12.307317733764648, "global_step": 460707, "epoch": 2742} {"train_loss": -12.149490356445312, "global_step": 460708, "epoch": 2742} {"train_loss": -12.20802116394043, "global_step": 460709, "epoch": 2742} {"train_loss": -12.360738754272461, "global_step": 460710, "epoch": 2742} {"train_loss": -12.33802604675293, "global_step": 460711, "epoch": 2742} {"train_loss": -12.181897163391113, "global_step": 460712, "epoch": 2742} {"train_loss": -12.526243209838867, "global_step": 460713, "epoch": 2742} {"train_loss": -12.359724044799805, "global_step": 460714, "epoch": 2742} {"train_loss": -12.512168884277344, "global_step": 460715, "epoch": 2742} {"train_loss": -12.463991165161133, "global_step": 460716, "epoch": 2742} {"train_loss": -12.01751708984375, "global_step": 460717, "epoch": 2742} {"train_loss": -12.916092872619629, "global_step": 460718, "epoch": 2742} {"train_loss": -12.263022422790527, "global_step": 460719, "epoch": 2742} {"train_loss": -12.533032417297363, "global_step": 460720, "epoch": 2742} {"train_loss": -12.43902587890625, "global_step": 460721, "epoch": 2742} {"train_loss": -12.8101224899292, "global_step": 460722, "epoch": 2742} {"train_loss": -12.518097877502441, "global_step": 460723, "epoch": 2742} {"train_loss": -12.513578414916992, "global_step": 460724, "epoch": 2742} {"train_loss": -12.672496795654297, "global_step": 460725, "epoch": 2742} {"train_loss": -12.440374374389648, "global_step": 460726, "epoch": 2742} {"train_loss": -12.486291885375977, "global_step": 460727, "epoch": 2742} {"train_loss": -12.537063598632812, "global_step": 460728, "epoch": 2742} {"train_loss": -12.49302864074707, "global_step": 460729, "epoch": 2742} {"train_loss": -12.243965148925781, "global_step": 460730, "epoch": 2742} {"train_loss": -12.333742141723633, "global_step": 460731, "epoch": 2742} {"train_loss": -12.146705627441406, "global_step": 460732, "epoch": 2742} {"train_loss": -11.316232681274414, "global_step": 460733, "epoch": 2742} {"train_loss": -12.102224349975586, "global_step": 460734, "epoch": 2742} {"train_loss": -12.567113876342773, "global_step": 460735, "epoch": 2742} {"train_loss": -12.031100273132324, "global_step": 460736, "epoch": 2742} {"train_loss": -12.442708969116211, "global_step": 460737, "epoch": 2742} {"train_loss": -12.648530960083008, "global_step": 460738, "epoch": 2742} {"train_loss": -11.809469223022461, "global_step": 460739, "epoch": 2742} {"train_loss": -12.085350036621094, "global_step": 460740, "epoch": 2742} {"train_loss": -11.861998558044434, "global_step": 460741, "epoch": 2742} {"train_loss": -12.232065200805664, "global_step": 460742, "epoch": 2742} {"train_loss": -11.768540382385254, "global_step": 460743, "epoch": 2742} {"train_loss": -12.216891288757324, "global_step": 460744, "epoch": 2742} {"train_loss": -12.079811096191406, "global_step": 460745, "epoch": 2742} {"train_loss": -12.399408340454102, "global_step": 460746, "epoch": 2742} {"train_loss": -11.98216438293457, "global_step": 460747, "epoch": 2742} {"train_loss": -12.713842391967773, "global_step": 460748, "epoch": 2742} {"train_loss": -12.227948188781738, "global_step": 460749, "epoch": 2742} {"train_loss": -12.119161605834961, "global_step": 460750, "epoch": 2742} {"train_loss": -11.825566291809082, "global_step": 460751, "epoch": 2742} {"train_loss": -12.406526565551758, "global_step": 460752, "epoch": 2742} {"train_loss": -11.992647171020508, "global_step": 460753, "epoch": 2742} {"train_loss": -10.979972839355469, "global_step": 460754, "epoch": 2742} {"train_loss": -12.033171653747559, "global_step": 460755, "epoch": 2742} {"train_loss": -11.45036792755127, "global_step": 460756, "epoch": 2742} {"train_loss": -9.828855514526367, "global_step": 460757, "epoch": 2742} {"train_loss": -10.8388671875, "global_step": 460758, "epoch": 2742} {"train_loss": -9.863831520080566, "global_step": 460759, "epoch": 2742} {"train_loss": -11.265671730041504, "global_step": 460760, "epoch": 2742} {"train_loss": -10.242470741271973, "global_step": 460761, "epoch": 2742} {"train_loss": -8.870367050170898, "global_step": 460762, "epoch": 2742} {"train_loss": -8.818016052246094, "global_step": 460763, "epoch": 2742} {"train_loss": -9.963502883911133, "global_step": 460764, "epoch": 2742} {"train_loss": -10.343856811523438, "global_step": 460765, "epoch": 2742} {"train_loss": -9.638594627380371, "global_step": 460766, "epoch": 2742} {"train_loss": -9.324390411376953, "global_step": 460767, "epoch": 2742} {"train_loss": -9.666486740112305, "global_step": 460768, "epoch": 2742} {"train_loss": -9.417512893676758, "global_step": 460769, "epoch": 2742} {"train_loss": -9.843915939331055, "global_step": 460770, "epoch": 2742} {"train_loss": -11.023722648620605, "global_step": 460771, "epoch": 2742} {"train_loss": -9.821771621704102, "global_step": 460772, "epoch": 2742} {"train_loss": -10.915834426879883, "global_step": 460773, "epoch": 2742} {"train_loss": -10.606279373168945, "global_step": 460774, "epoch": 2742} {"train_loss": -10.482987403869629, "global_step": 460775, "epoch": 2742} {"train_loss": -10.566181182861328, "global_step": 460776, "epoch": 2742} {"train_loss": -11.703914642333984, "global_step": 460777, "epoch": 2742} {"train_loss": -10.922359466552734, "global_step": 460778, "epoch": 2742} {"train_loss": -11.623218536376953, "global_step": 460779, "epoch": 2742} {"train_loss": -11.833719253540039, "global_step": 460780, "epoch": 2742} {"train_loss": -11.356457710266113, "global_step": 460781, "epoch": 2742} {"train_loss": -12.198678970336914, "global_step": 460782, "epoch": 2742} {"train_loss": -11.188155174255371, "global_step": 460783, "epoch": 2742} {"train_loss": -10.66037368774414, "global_step": 460784, "epoch": 2742} {"train_loss": -12.06696891784668, "global_step": 460785, "epoch": 2742} {"train_loss": -11.020573616027832, "global_step": 460786, "epoch": 2742} {"train_loss": -11.502092361450195, "global_step": 460787, "epoch": 2742} {"train_loss": -11.850433349609375, "global_step": 460788, "epoch": 2742} {"train_loss": -11.022726058959961, "global_step": 460789, "epoch": 2742} {"train_loss": -11.597820281982422, "global_step": 460790, "epoch": 2742} {"train_loss": -12.0916748046875, "global_step": 460791, "epoch": 2742} {"train_loss": -11.727397918701172, "global_step": 460792, "epoch": 2742} {"train_loss": -12.013520240783691, "global_step": 460793, "epoch": 2742} {"train_loss": -11.490449905395508, "global_step": 460794, "epoch": 2742} {"train_loss": -12.007672309875488, "global_step": 460795, "epoch": 2742} {"train_loss": -11.553722381591797, "global_step": 460796, "epoch": 2742} {"train_loss": -12.10374927520752, "global_step": 460797, "epoch": 2742} {"train_loss": -12.041341781616211, "global_step": 460798, "epoch": 2742} {"train_loss": -12.173641204833984, "global_step": 460799, "epoch": 2742} {"train_loss": -11.70724105834961, "global_step": 460800, "epoch": 2742} {"train_loss": -11.885528564453125, "global_step": 460801, "epoch": 2742} {"train_loss": -12.07204818725586, "global_step": 460802, "epoch": 2742} {"train_loss": -11.820028305053711, "global_step": 460803, "epoch": 2742} {"train_loss": -11.844002723693848, "global_step": 460804, "epoch": 2742} {"train_loss": -11.948840141296387, "global_step": 460805, "epoch": 2742} {"train_loss": -11.843791007995605, "global_step": 460806, "epoch": 2742} {"train_loss": -11.9047269821167, "global_step": 460807, "epoch": 2742} {"train_loss": -12.15978717803955, "global_step": 460808, "epoch": 2742} {"train_loss": -11.823736190795898, "global_step": 460809, "epoch": 2742} {"train_loss": -11.757891654968262, "global_step": 460810, "epoch": 2742} {"train_loss": -12.105621337890625, "global_step": 460811, "epoch": 2742} {"train_loss": -11.424100875854492, "global_step": 460812, "epoch": 2742} {"train_loss": -12.256591796875, "global_step": 460813, "epoch": 2742} {"train_loss": -11.802233695983887, "global_step": 460814, "epoch": 2742} {"train_loss": -11.97774600982666, "global_step": 460815, "epoch": 2742} {"train_loss": -12.158943176269531, "global_step": 460816, "epoch": 2742} {"train_loss": -11.602251052856445, "global_step": 460817, "epoch": 2742} {"train_loss": -12.208639144897461, "global_step": 460818, "epoch": 2742} {"train_loss": -11.780574798583984, "global_step": 460819, "epoch": 2742} {"train_loss": -12.279053688049316, "global_step": 460820, "epoch": 2742} {"train_loss": -12.100086212158203, "global_step": 460821, "epoch": 2742} {"train_loss": -11.74692153930664, "global_step": 460822, "epoch": 2742} {"train_loss": -11.846454898516336, "global_step": 460823, "epoch": 2742, "val_loss": 315205.71875} {"train_loss": -11.465166091918945, "global_step": 460824, "epoch": 2743} {"train_loss": -12.33981704711914, "global_step": 460825, "epoch": 2743} {"train_loss": -11.298251152038574, "global_step": 460826, "epoch": 2743} {"train_loss": -11.913541793823242, "global_step": 460827, "epoch": 2743} {"train_loss": -12.306543350219727, "global_step": 460828, "epoch": 2743} {"train_loss": -11.89189338684082, "global_step": 460829, "epoch": 2743} {"train_loss": -12.448925018310547, "global_step": 460830, "epoch": 2743} {"train_loss": -11.914146423339844, "global_step": 460831, "epoch": 2743} {"train_loss": -12.304391860961914, "global_step": 460832, "epoch": 2743} {"train_loss": -12.541206359863281, "global_step": 460833, "epoch": 2743} {"train_loss": -12.156814575195312, "global_step": 460834, "epoch": 2743} {"train_loss": -12.084928512573242, "global_step": 460835, "epoch": 2743} {"train_loss": -12.466403007507324, "global_step": 460836, "epoch": 2743} {"train_loss": -12.470062255859375, "global_step": 460837, "epoch": 2743} {"train_loss": -12.154555320739746, "global_step": 460838, "epoch": 2743} {"train_loss": -12.35488510131836, "global_step": 460839, "epoch": 2743} {"train_loss": -12.263256072998047, "global_step": 460840, "epoch": 2743} {"train_loss": -12.322994232177734, "global_step": 460841, "epoch": 2743} {"train_loss": -12.388007164001465, "global_step": 460842, "epoch": 2743} {"train_loss": -12.391429901123047, "global_step": 460843, "epoch": 2743} {"train_loss": -12.50082778930664, "global_step": 460844, "epoch": 2743} {"train_loss": -12.329134941101074, "global_step": 460845, "epoch": 2743} {"train_loss": -12.539600372314453, "global_step": 460846, "epoch": 2743} {"train_loss": -12.301223754882812, "global_step": 460847, "epoch": 2743} {"train_loss": -12.571386337280273, "global_step": 460848, "epoch": 2743} {"train_loss": -12.567227363586426, "global_step": 460849, "epoch": 2743} {"train_loss": -12.31404972076416, "global_step": 460850, "epoch": 2743} {"train_loss": -12.416869163513184, "global_step": 460851, "epoch": 2743} {"train_loss": -12.22619915008545, "global_step": 460852, "epoch": 2743} {"train_loss": -12.635708808898926, "global_step": 460853, "epoch": 2743} {"train_loss": -12.230270385742188, "global_step": 460854, "epoch": 2743} {"train_loss": -12.645520210266113, "global_step": 460855, "epoch": 2743} {"train_loss": -12.361249923706055, "global_step": 460856, "epoch": 2743} {"train_loss": -12.335145950317383, "global_step": 460857, "epoch": 2743} {"train_loss": -12.591760635375977, "global_step": 460858, "epoch": 2743} {"train_loss": -11.97648811340332, "global_step": 460859, "epoch": 2743} {"train_loss": -12.641490936279297, "global_step": 460860, "epoch": 2743} {"train_loss": -12.342554092407227, "global_step": 460861, "epoch": 2743} {"train_loss": -12.61500072479248, "global_step": 460862, "epoch": 2743} {"train_loss": -12.349127769470215, "global_step": 460863, "epoch": 2743} {"train_loss": -12.658391952514648, "global_step": 460864, "epoch": 2743} {"train_loss": -12.48385238647461, "global_step": 460865, "epoch": 2743} {"train_loss": -12.730947494506836, "global_step": 460866, "epoch": 2743} {"train_loss": -12.633134841918945, "global_step": 460867, "epoch": 2743} {"train_loss": -12.784940719604492, "global_step": 460868, "epoch": 2743} {"train_loss": -12.623573303222656, "global_step": 460869, "epoch": 2743} {"train_loss": -12.642696380615234, "global_step": 460870, "epoch": 2743} {"train_loss": -12.572441101074219, "global_step": 460871, "epoch": 2743} {"train_loss": -12.585918426513672, "global_step": 460872, "epoch": 2743} {"train_loss": -12.493206977844238, "global_step": 460873, "epoch": 2743} {"train_loss": -12.61028003692627, "global_step": 460874, "epoch": 2743} {"train_loss": -12.461893081665039, "global_step": 460875, "epoch": 2743} {"train_loss": -12.831907272338867, "global_step": 460876, "epoch": 2743} {"train_loss": -12.80716323852539, "global_step": 460877, "epoch": 2743} {"train_loss": -12.288881301879883, "global_step": 460878, "epoch": 2743} {"train_loss": -12.472289085388184, "global_step": 460879, "epoch": 2743} {"train_loss": -12.543561935424805, "global_step": 460880, "epoch": 2743} {"train_loss": -12.683343887329102, "global_step": 460881, "epoch": 2743} {"train_loss": -12.651838302612305, "global_step": 460882, "epoch": 2743} {"train_loss": -12.56462287902832, "global_step": 460883, "epoch": 2743} {"train_loss": -12.580413818359375, "global_step": 460884, "epoch": 2743} {"train_loss": -12.503338813781738, "global_step": 460885, "epoch": 2743} {"train_loss": -12.480753898620605, "global_step": 460886, "epoch": 2743} {"train_loss": -12.246705055236816, "global_step": 460887, "epoch": 2743} {"train_loss": -12.495461463928223, "global_step": 460888, "epoch": 2743} {"train_loss": -12.159107208251953, "global_step": 460889, "epoch": 2743} {"train_loss": -12.855042457580566, "global_step": 460890, "epoch": 2743} {"train_loss": -12.4517822265625, "global_step": 460891, "epoch": 2743} {"train_loss": -12.826445579528809, "global_step": 460892, "epoch": 2743} {"train_loss": -12.649116516113281, "global_step": 460893, "epoch": 2743} {"train_loss": -12.63471508026123, "global_step": 460894, "epoch": 2743} {"train_loss": -12.576260566711426, "global_step": 460895, "epoch": 2743} {"train_loss": -12.71916675567627, "global_step": 460896, "epoch": 2743} {"train_loss": -12.55657958984375, "global_step": 460897, "epoch": 2743} {"train_loss": -12.699593544006348, "global_step": 460898, "epoch": 2743} {"train_loss": -12.483406066894531, "global_step": 460899, "epoch": 2743} {"train_loss": -12.622401237487793, "global_step": 460900, "epoch": 2743} {"train_loss": -12.809183120727539, "global_step": 460901, "epoch": 2743} {"train_loss": -12.981210708618164, "global_step": 460902, "epoch": 2743} {"train_loss": -12.456184387207031, "global_step": 460903, "epoch": 2743} {"train_loss": -12.324082374572754, "global_step": 460904, "epoch": 2743} {"train_loss": -12.275453567504883, "global_step": 460905, "epoch": 2743} {"train_loss": -12.232633590698242, "global_step": 460906, "epoch": 2743} {"train_loss": -12.72606086730957, "global_step": 460907, "epoch": 2743} {"train_loss": -12.440631866455078, "global_step": 460908, "epoch": 2743} {"train_loss": -12.077360153198242, "global_step": 460909, "epoch": 2743} {"train_loss": -12.665285110473633, "global_step": 460910, "epoch": 2743} {"train_loss": -12.01341438293457, "global_step": 460911, "epoch": 2743} {"train_loss": -12.415767669677734, "global_step": 460912, "epoch": 2743} {"train_loss": -12.552347183227539, "global_step": 460913, "epoch": 2743} {"train_loss": -12.47596549987793, "global_step": 460914, "epoch": 2743} {"train_loss": -11.602463722229004, "global_step": 460915, "epoch": 2743} {"train_loss": -11.405252456665039, "global_step": 460916, "epoch": 2743} {"train_loss": -11.031648635864258, "global_step": 460917, "epoch": 2743} {"train_loss": -12.754839897155762, "global_step": 460918, "epoch": 2743} {"train_loss": -11.750913619995117, "global_step": 460919, "epoch": 2743} {"train_loss": -12.226624488830566, "global_step": 460920, "epoch": 2743} {"train_loss": -12.02488899230957, "global_step": 460921, "epoch": 2743} {"train_loss": -12.300625801086426, "global_step": 460922, "epoch": 2743} {"train_loss": -11.913639068603516, "global_step": 460923, "epoch": 2743} {"train_loss": -12.326560974121094, "global_step": 460924, "epoch": 2743} {"train_loss": -11.547401428222656, "global_step": 460925, "epoch": 2743} {"train_loss": -12.393856048583984, "global_step": 460926, "epoch": 2743} {"train_loss": -12.045648574829102, "global_step": 460927, "epoch": 2743} {"train_loss": -11.848799705505371, "global_step": 460928, "epoch": 2743} {"train_loss": -12.372060775756836, "global_step": 460929, "epoch": 2743} {"train_loss": -12.120393753051758, "global_step": 460930, "epoch": 2743} {"train_loss": -12.558992385864258, "global_step": 460931, "epoch": 2743} {"train_loss": -12.650761604309082, "global_step": 460932, "epoch": 2743} {"train_loss": -12.30803108215332, "global_step": 460933, "epoch": 2743} {"train_loss": -12.918144226074219, "global_step": 460934, "epoch": 2743} {"train_loss": -12.452871322631836, "global_step": 460935, "epoch": 2743} {"train_loss": -12.358489990234375, "global_step": 460936, "epoch": 2743} {"train_loss": -12.091729164123535, "global_step": 460937, "epoch": 2743} {"train_loss": -12.553781509399414, "global_step": 460938, "epoch": 2743} {"train_loss": -11.055891036987305, "global_step": 460939, "epoch": 2743} {"train_loss": -12.039841651916504, "global_step": 460940, "epoch": 2743} {"train_loss": -11.227535247802734, "global_step": 460941, "epoch": 2743} {"train_loss": -12.394163131713867, "global_step": 460942, "epoch": 2743} {"train_loss": -9.979143142700195, "global_step": 460943, "epoch": 2743} {"train_loss": -11.706864356994629, "global_step": 460944, "epoch": 2743} {"train_loss": -10.38762378692627, "global_step": 460945, "epoch": 2743} {"train_loss": -11.968955993652344, "global_step": 460946, "epoch": 2743} {"train_loss": -11.932042121887207, "global_step": 460947, "epoch": 2743} {"train_loss": -10.397924423217773, "global_step": 460948, "epoch": 2743} {"train_loss": -12.390392303466797, "global_step": 460949, "epoch": 2743} {"train_loss": -11.407885551452637, "global_step": 460950, "epoch": 2743} {"train_loss": -11.90291976928711, "global_step": 460951, "epoch": 2743} {"train_loss": -11.775331497192383, "global_step": 460952, "epoch": 2743} {"train_loss": -11.439896583557129, "global_step": 460953, "epoch": 2743} {"train_loss": -12.016852378845215, "global_step": 460954, "epoch": 2743} {"train_loss": -11.580779075622559, "global_step": 460955, "epoch": 2743} {"train_loss": -11.496938705444336, "global_step": 460956, "epoch": 2743} {"train_loss": -11.947915077209473, "global_step": 460957, "epoch": 2743} {"train_loss": -11.719112396240234, "global_step": 460958, "epoch": 2743} {"train_loss": -12.043722152709961, "global_step": 460959, "epoch": 2743} {"train_loss": -11.163193702697754, "global_step": 460960, "epoch": 2743} {"train_loss": -11.838018417358398, "global_step": 460961, "epoch": 2743} {"train_loss": -11.870152473449707, "global_step": 460962, "epoch": 2743} {"train_loss": -12.287938117980957, "global_step": 460963, "epoch": 2743} {"train_loss": -12.139598846435547, "global_step": 460964, "epoch": 2743} {"train_loss": -12.306097030639648, "global_step": 460965, "epoch": 2743} {"train_loss": -12.09735107421875, "global_step": 460966, "epoch": 2743} {"train_loss": -12.706331253051758, "global_step": 460967, "epoch": 2743} {"train_loss": -12.167828559875488, "global_step": 460968, "epoch": 2743} {"train_loss": -12.631156921386719, "global_step": 460969, "epoch": 2743} {"train_loss": -12.090755462646484, "global_step": 460970, "epoch": 2743} {"train_loss": -12.382179260253906, "global_step": 460971, "epoch": 2743} {"train_loss": -11.968961715698242, "global_step": 460972, "epoch": 2743} {"train_loss": -12.367737770080566, "global_step": 460973, "epoch": 2743} {"train_loss": -11.93480396270752, "global_step": 460974, "epoch": 2743} {"train_loss": -12.437546730041504, "global_step": 460975, "epoch": 2743} {"train_loss": -11.99939250946045, "global_step": 460976, "epoch": 2743} {"train_loss": -12.267383575439453, "global_step": 460977, "epoch": 2743} {"train_loss": -12.241422653198242, "global_step": 460978, "epoch": 2743} {"train_loss": -12.228036880493164, "global_step": 460979, "epoch": 2743} {"train_loss": -12.672014236450195, "global_step": 460980, "epoch": 2743} {"train_loss": -12.361186027526855, "global_step": 460981, "epoch": 2743} {"train_loss": -12.440410614013672, "global_step": 460982, "epoch": 2743} {"train_loss": -12.105981826782227, "global_step": 460983, "epoch": 2743} {"train_loss": -12.58913803100586, "global_step": 460984, "epoch": 2743} {"train_loss": -11.98286247253418, "global_step": 460985, "epoch": 2743} {"train_loss": -12.600448608398438, "global_step": 460986, "epoch": 2743} {"train_loss": -12.53510856628418, "global_step": 460987, "epoch": 2743} {"train_loss": -12.314729690551758, "global_step": 460988, "epoch": 2743} {"train_loss": -12.379739761352539, "global_step": 460989, "epoch": 2743} {"train_loss": -12.704235076904297, "global_step": 460990, "epoch": 2743} {"train_loss": -12.252048248336429, "global_step": 460991, "epoch": 2743, "val_loss": 315563.15625} {"train_loss": -12.029871940612793, "global_step": 460992, "epoch": 2744} {"train_loss": -12.309820175170898, "global_step": 460993, "epoch": 2744} {"train_loss": -12.22385311126709, "global_step": 460994, "epoch": 2744} {"train_loss": -12.486432075500488, "global_step": 460995, "epoch": 2744} {"train_loss": -12.309446334838867, "global_step": 460996, "epoch": 2744} {"train_loss": -12.412651062011719, "global_step": 460997, "epoch": 2744} {"train_loss": -11.675968170166016, "global_step": 460998, "epoch": 2744} {"train_loss": -12.273224830627441, "global_step": 460999, "epoch": 2744} {"train_loss": -11.931258201599121, "global_step": 461000, "epoch": 2744} {"train_loss": -11.978073120117188, "global_step": 461001, "epoch": 2744} {"train_loss": -12.138604164123535, "global_step": 461002, "epoch": 2744} {"train_loss": -11.990856170654297, "global_step": 461003, "epoch": 2744} {"train_loss": -12.602615356445312, "global_step": 461004, "epoch": 2744} {"train_loss": -12.314233779907227, "global_step": 461005, "epoch": 2744} {"train_loss": -12.395378112792969, "global_step": 461006, "epoch": 2744} {"train_loss": -12.43478775024414, "global_step": 461007, "epoch": 2744} {"train_loss": -12.129361152648926, "global_step": 461008, "epoch": 2744} {"train_loss": -12.396015167236328, "global_step": 461009, "epoch": 2744} {"train_loss": -12.683076858520508, "global_step": 461010, "epoch": 2744} {"train_loss": -12.198482513427734, "global_step": 461011, "epoch": 2744} {"train_loss": -12.60750961303711, "global_step": 461012, "epoch": 2744} {"train_loss": -12.03822135925293, "global_step": 461013, "epoch": 2744} {"train_loss": -12.574618339538574, "global_step": 461014, "epoch": 2744} {"train_loss": -12.352434158325195, "global_step": 461015, "epoch": 2744} {"train_loss": -12.64957332611084, "global_step": 461016, "epoch": 2744} {"train_loss": -12.635677337646484, "global_step": 461017, "epoch": 2744} {"train_loss": -12.723640441894531, "global_step": 461018, "epoch": 2744} {"train_loss": -12.511817932128906, "global_step": 461019, "epoch": 2744} {"train_loss": -12.615534782409668, "global_step": 461020, "epoch": 2744} {"train_loss": -12.724191665649414, "global_step": 461021, "epoch": 2744} {"train_loss": -12.584737777709961, "global_step": 461022, "epoch": 2744} {"train_loss": -12.544748306274414, "global_step": 461023, "epoch": 2744} {"train_loss": -12.336038589477539, "global_step": 461024, "epoch": 2744} {"train_loss": -12.493999481201172, "global_step": 461025, "epoch": 2744} {"train_loss": -12.60926342010498, "global_step": 461026, "epoch": 2744} {"train_loss": -12.740410804748535, "global_step": 461027, "epoch": 2744} {"train_loss": -12.847131729125977, "global_step": 461028, "epoch": 2744} {"train_loss": -12.684040069580078, "global_step": 461029, "epoch": 2744} {"train_loss": -12.709556579589844, "global_step": 461030, "epoch": 2744} {"train_loss": -12.014087677001953, "global_step": 461031, "epoch": 2744} {"train_loss": -12.470617294311523, "global_step": 461032, "epoch": 2744} {"train_loss": -12.560091018676758, "global_step": 461033, "epoch": 2744} {"train_loss": -12.629283905029297, "global_step": 461034, "epoch": 2744} {"train_loss": -12.610437393188477, "global_step": 461035, "epoch": 2744} {"train_loss": -12.341744422912598, "global_step": 461036, "epoch": 2744} {"train_loss": -12.47681999206543, "global_step": 461037, "epoch": 2744} {"train_loss": -12.3797607421875, "global_step": 461038, "epoch": 2744} {"train_loss": -12.799894332885742, "global_step": 461039, "epoch": 2744} {"train_loss": -12.252681732177734, "global_step": 461040, "epoch": 2744} {"train_loss": -12.836485862731934, "global_step": 461041, "epoch": 2744} {"train_loss": -12.534185409545898, "global_step": 461042, "epoch": 2744} {"train_loss": -12.633691787719727, "global_step": 461043, "epoch": 2744} {"train_loss": -12.39134407043457, "global_step": 461044, "epoch": 2744} {"train_loss": -11.500031471252441, "global_step": 461045, "epoch": 2744} {"train_loss": -12.471860885620117, "global_step": 461046, "epoch": 2744} {"train_loss": -12.55506706237793, "global_step": 461047, "epoch": 2744} {"train_loss": -11.500615119934082, "global_step": 461048, "epoch": 2744} {"train_loss": -12.169182777404785, "global_step": 461049, "epoch": 2744} {"train_loss": -10.764291763305664, "global_step": 461050, "epoch": 2744} {"train_loss": -11.073125839233398, "global_step": 461051, "epoch": 2744} {"train_loss": -11.99919319152832, "global_step": 461052, "epoch": 2744} {"train_loss": -10.406883239746094, "global_step": 461053, "epoch": 2744} {"train_loss": -10.709819793701172, "global_step": 461054, "epoch": 2744} {"train_loss": -10.946910858154297, "global_step": 461055, "epoch": 2744} {"train_loss": -11.734088897705078, "global_step": 461056, "epoch": 2744} {"train_loss": -11.258932113647461, "global_step": 461057, "epoch": 2744} {"train_loss": -11.127574920654297, "global_step": 461058, "epoch": 2744} {"train_loss": -9.270535469055176, "global_step": 461059, "epoch": 2744} {"train_loss": -12.132625579833984, "global_step": 461060, "epoch": 2744} {"train_loss": -9.724284172058105, "global_step": 461061, "epoch": 2744} {"train_loss": -11.7783842086792, "global_step": 461062, "epoch": 2744} {"train_loss": -10.522849082946777, "global_step": 461063, "epoch": 2744} {"train_loss": -9.87204360961914, "global_step": 461064, "epoch": 2744} {"train_loss": -9.840717315673828, "global_step": 461065, "epoch": 2744} {"train_loss": -9.999906539916992, "global_step": 461066, "epoch": 2744} {"train_loss": -11.63310432434082, "global_step": 461067, "epoch": 2744} {"train_loss": -10.750357627868652, "global_step": 461068, "epoch": 2744} {"train_loss": -11.17215633392334, "global_step": 461069, "epoch": 2744} {"train_loss": -11.288877487182617, "global_step": 461070, "epoch": 2744} {"train_loss": -11.443556785583496, "global_step": 461071, "epoch": 2744} {"train_loss": -11.112236976623535, "global_step": 461072, "epoch": 2744} {"train_loss": -11.298086166381836, "global_step": 461073, "epoch": 2744} {"train_loss": -11.511600494384766, "global_step": 461074, "epoch": 2744} {"train_loss": -11.452646255493164, "global_step": 461075, "epoch": 2744} {"train_loss": -11.622812271118164, "global_step": 461076, "epoch": 2744} {"train_loss": -11.266409873962402, "global_step": 461077, "epoch": 2744} {"train_loss": -11.111185073852539, "global_step": 461078, "epoch": 2744} {"train_loss": -12.162857055664062, "global_step": 461079, "epoch": 2744} {"train_loss": -11.907676696777344, "global_step": 461080, "epoch": 2744} {"train_loss": -12.214250564575195, "global_step": 461081, "epoch": 2744} {"train_loss": -12.30420970916748, "global_step": 461082, "epoch": 2744} {"train_loss": -11.640815734863281, "global_step": 461083, "epoch": 2744} {"train_loss": -12.397799491882324, "global_step": 461084, "epoch": 2744} {"train_loss": -11.775032997131348, "global_step": 461085, "epoch": 2744} {"train_loss": -12.394168853759766, "global_step": 461086, "epoch": 2744} {"train_loss": -12.146770477294922, "global_step": 461087, "epoch": 2744} {"train_loss": -12.287439346313477, "global_step": 461088, "epoch": 2744} {"train_loss": -12.478757858276367, "global_step": 461089, "epoch": 2744} {"train_loss": -12.565129280090332, "global_step": 461090, "epoch": 2744} {"train_loss": -12.732181549072266, "global_step": 461091, "epoch": 2744} {"train_loss": -12.484640121459961, "global_step": 461092, "epoch": 2744} {"train_loss": -12.426284790039062, "global_step": 461093, "epoch": 2744} {"train_loss": -12.529306411743164, "global_step": 461094, "epoch": 2744} {"train_loss": -12.497611045837402, "global_step": 461095, "epoch": 2744} {"train_loss": -12.66002082824707, "global_step": 461096, "epoch": 2744} {"train_loss": -12.484291076660156, "global_step": 461097, "epoch": 2744} {"train_loss": -12.600118637084961, "global_step": 461098, "epoch": 2744} {"train_loss": -12.60218620300293, "global_step": 461099, "epoch": 2744} {"train_loss": -12.548301696777344, "global_step": 461100, "epoch": 2744} {"train_loss": -12.802674293518066, "global_step": 461101, "epoch": 2744} {"train_loss": -12.52051067352295, "global_step": 461102, "epoch": 2744} {"train_loss": -12.790243148803711, "global_step": 461103, "epoch": 2744} {"train_loss": -12.647454261779785, "global_step": 461104, "epoch": 2744} {"train_loss": -12.603928565979004, "global_step": 461105, "epoch": 2744} {"train_loss": -12.510702133178711, "global_step": 461106, "epoch": 2744} {"train_loss": -12.584545135498047, "global_step": 461107, "epoch": 2744} {"train_loss": -12.586809158325195, "global_step": 461108, "epoch": 2744} {"train_loss": -12.41357707977295, "global_step": 461109, "epoch": 2744} {"train_loss": -12.46343994140625, "global_step": 461110, "epoch": 2744} {"train_loss": -12.795270919799805, "global_step": 461111, "epoch": 2744} {"train_loss": -12.817041397094727, "global_step": 461112, "epoch": 2744} {"train_loss": -12.694327354431152, "global_step": 461113, "epoch": 2744} {"train_loss": -12.752517700195312, "global_step": 461114, "epoch": 2744} {"train_loss": -12.67304515838623, "global_step": 461115, "epoch": 2744} {"train_loss": -12.723640441894531, "global_step": 461116, "epoch": 2744} {"train_loss": -12.68050765991211, "global_step": 461117, "epoch": 2744} {"train_loss": -12.486083030700684, "global_step": 461118, "epoch": 2744} {"train_loss": -12.620237350463867, "global_step": 461119, "epoch": 2744} {"train_loss": -12.66714859008789, "global_step": 461120, "epoch": 2744} {"train_loss": -11.372507095336914, "global_step": 461121, "epoch": 2744} {"train_loss": -12.053716659545898, "global_step": 461122, "epoch": 2744} {"train_loss": -12.520151138305664, "global_step": 461123, "epoch": 2744} {"train_loss": -11.914751052856445, "global_step": 461124, "epoch": 2744} {"train_loss": -10.759262084960938, "global_step": 461125, "epoch": 2744} {"train_loss": -11.757768630981445, "global_step": 461126, "epoch": 2744} {"train_loss": -12.392243385314941, "global_step": 461127, "epoch": 2744} {"train_loss": -12.471684455871582, "global_step": 461128, "epoch": 2744} {"train_loss": -11.977117538452148, "global_step": 461129, "epoch": 2744} {"train_loss": -12.58517837524414, "global_step": 461130, "epoch": 2744} {"train_loss": -12.21761417388916, "global_step": 461131, "epoch": 2744} {"train_loss": -12.497251510620117, "global_step": 461132, "epoch": 2744} {"train_loss": -11.189738273620605, "global_step": 461133, "epoch": 2744} {"train_loss": -12.876822471618652, "global_step": 461134, "epoch": 2744} {"train_loss": -11.697771072387695, "global_step": 461135, "epoch": 2744} {"train_loss": -12.430755615234375, "global_step": 461136, "epoch": 2744} {"train_loss": -10.700041770935059, "global_step": 461137, "epoch": 2744} {"train_loss": -11.425275802612305, "global_step": 461138, "epoch": 2744} {"train_loss": -12.412500381469727, "global_step": 461139, "epoch": 2744} {"train_loss": -10.788873672485352, "global_step": 461140, "epoch": 2744} {"train_loss": -12.338626861572266, "global_step": 461141, "epoch": 2744} {"train_loss": -11.614595413208008, "global_step": 461142, "epoch": 2744} {"train_loss": -12.489897727966309, "global_step": 461143, "epoch": 2744} {"train_loss": -11.49599838256836, "global_step": 461144, "epoch": 2744} {"train_loss": -12.330490112304688, "global_step": 461145, "epoch": 2744} {"train_loss": -11.852672576904297, "global_step": 461146, "epoch": 2744} {"train_loss": -12.250137329101562, "global_step": 461147, "epoch": 2744} {"train_loss": -11.852537155151367, "global_step": 461148, "epoch": 2744} {"train_loss": -11.332439422607422, "global_step": 461149, "epoch": 2744} {"train_loss": -12.211779594421387, "global_step": 461150, "epoch": 2744} {"train_loss": -11.204425811767578, "global_step": 461151, "epoch": 2744} {"train_loss": -12.021682739257812, "global_step": 461152, "epoch": 2744} {"train_loss": -11.616373062133789, "global_step": 461153, "epoch": 2744} {"train_loss": -12.251523971557617, "global_step": 461154, "epoch": 2744} {"train_loss": -11.514059066772461, "global_step": 461155, "epoch": 2744} {"train_loss": -12.273137092590332, "global_step": 461156, "epoch": 2744} {"train_loss": -11.419211387634277, "global_step": 461157, "epoch": 2744} {"train_loss": -12.371431350708008, "global_step": 461158, "epoch": 2744} {"train_loss": -12.06277156443823, "global_step": 461159, "epoch": 2744, "val_loss": 315942.09375} {"train_loss": -11.697893142700195, "global_step": 461160, "epoch": 2745} {"train_loss": -10.621684074401855, "global_step": 461161, "epoch": 2745} {"train_loss": -11.102225303649902, "global_step": 461162, "epoch": 2745} {"train_loss": -11.660880088806152, "global_step": 461163, "epoch": 2745} {"train_loss": -11.099603652954102, "global_step": 461164, "epoch": 2745} {"train_loss": -11.540586471557617, "global_step": 461165, "epoch": 2745} {"train_loss": -11.435455322265625, "global_step": 461166, "epoch": 2745} {"train_loss": -11.137741088867188, "global_step": 461167, "epoch": 2745} {"train_loss": -10.527717590332031, "global_step": 461168, "epoch": 2745} {"train_loss": -9.756744384765625, "global_step": 461169, "epoch": 2745} {"train_loss": -10.45323371887207, "global_step": 461170, "epoch": 2745} {"train_loss": -10.557500839233398, "global_step": 461171, "epoch": 2745} {"train_loss": -9.836971282958984, "global_step": 461172, "epoch": 2745} {"train_loss": -9.896206855773926, "global_step": 461173, "epoch": 2745} {"train_loss": -9.500223159790039, "global_step": 461174, "epoch": 2745} {"train_loss": -10.018699645996094, "global_step": 461175, "epoch": 2745} {"train_loss": -10.028885841369629, "global_step": 461176, "epoch": 2745} {"train_loss": -10.260165214538574, "global_step": 461177, "epoch": 2745} {"train_loss": -10.80612564086914, "global_step": 461178, "epoch": 2745} {"train_loss": -11.60915470123291, "global_step": 461179, "epoch": 2745} {"train_loss": -10.954357147216797, "global_step": 461180, "epoch": 2745} {"train_loss": -11.250711441040039, "global_step": 461181, "epoch": 2745} {"train_loss": -11.22804069519043, "global_step": 461182, "epoch": 2745} {"train_loss": -11.367116928100586, "global_step": 461183, "epoch": 2745} {"train_loss": -11.05257797241211, "global_step": 461184, "epoch": 2745} {"train_loss": -11.312670707702637, "global_step": 461185, "epoch": 2745} {"train_loss": -10.748527526855469, "global_step": 461186, "epoch": 2745} {"train_loss": -11.526815414428711, "global_step": 461187, "epoch": 2745} {"train_loss": -11.83470344543457, "global_step": 461188, "epoch": 2745} {"train_loss": -11.981688499450684, "global_step": 461189, "epoch": 2745} {"train_loss": -12.033026695251465, "global_step": 461190, "epoch": 2745} {"train_loss": -11.470449447631836, "global_step": 461191, "epoch": 2745} {"train_loss": -11.660758972167969, "global_step": 461192, "epoch": 2745} {"train_loss": -11.220680236816406, "global_step": 461193, "epoch": 2745} {"train_loss": -11.969680786132812, "global_step": 461194, "epoch": 2745} {"train_loss": -12.130526542663574, "global_step": 461195, "epoch": 2745} {"train_loss": -12.103758811950684, "global_step": 461196, "epoch": 2745} {"train_loss": -12.162322044372559, "global_step": 461197, "epoch": 2745} {"train_loss": -11.954385757446289, "global_step": 461198, "epoch": 2745} {"train_loss": -11.949138641357422, "global_step": 461199, "epoch": 2745} {"train_loss": -12.391204833984375, "global_step": 461200, "epoch": 2745} {"train_loss": -12.101736068725586, "global_step": 461201, "epoch": 2745} {"train_loss": -12.404611587524414, "global_step": 461202, "epoch": 2745} {"train_loss": -12.559516906738281, "global_step": 461203, "epoch": 2745} {"train_loss": -12.41999626159668, "global_step": 461204, "epoch": 2745} {"train_loss": -12.575309753417969, "global_step": 461205, "epoch": 2745} {"train_loss": -12.41112995147705, "global_step": 461206, "epoch": 2745} {"train_loss": -12.442154884338379, "global_step": 461207, "epoch": 2745} {"train_loss": -12.629016876220703, "global_step": 461208, "epoch": 2745} {"train_loss": -12.38827896118164, "global_step": 461209, "epoch": 2745} {"train_loss": -12.380180358886719, "global_step": 461210, "epoch": 2745} {"train_loss": -12.216970443725586, "global_step": 461211, "epoch": 2745} {"train_loss": -12.397748947143555, "global_step": 461212, "epoch": 2745} {"train_loss": -12.431023597717285, "global_step": 461213, "epoch": 2745} {"train_loss": -12.524730682373047, "global_step": 461214, "epoch": 2745} {"train_loss": -12.364849090576172, "global_step": 461215, "epoch": 2745} {"train_loss": -12.501026153564453, "global_step": 461216, "epoch": 2745} {"train_loss": -12.456488609313965, "global_step": 461217, "epoch": 2745} {"train_loss": -12.569517135620117, "global_step": 461218, "epoch": 2745} {"train_loss": -12.48135757446289, "global_step": 461219, "epoch": 2745} {"train_loss": -12.410323143005371, "global_step": 461220, "epoch": 2745} {"train_loss": -12.367136001586914, "global_step": 461221, "epoch": 2745} {"train_loss": -12.27912712097168, "global_step": 461222, "epoch": 2745} {"train_loss": -12.435450553894043, "global_step": 461223, "epoch": 2745} {"train_loss": -12.351822853088379, "global_step": 461224, "epoch": 2745} {"train_loss": -12.48481273651123, "global_step": 461225, "epoch": 2745} {"train_loss": -12.50552749633789, "global_step": 461226, "epoch": 2745} {"train_loss": -12.196889877319336, "global_step": 461227, "epoch": 2745} {"train_loss": -12.661384582519531, "global_step": 461228, "epoch": 2745} {"train_loss": -12.288328170776367, "global_step": 461229, "epoch": 2745} {"train_loss": -12.566075325012207, "global_step": 461230, "epoch": 2745} {"train_loss": -11.977439880371094, "global_step": 461231, "epoch": 2745} {"train_loss": -12.637840270996094, "global_step": 461232, "epoch": 2745} {"train_loss": -12.355182647705078, "global_step": 461233, "epoch": 2745} {"train_loss": -12.550491333007812, "global_step": 461234, "epoch": 2745} {"train_loss": -12.727280616760254, "global_step": 461235, "epoch": 2745} {"train_loss": -12.418050765991211, "global_step": 461236, "epoch": 2745} {"train_loss": -12.627470016479492, "global_step": 461237, "epoch": 2745} {"train_loss": -12.732787132263184, "global_step": 461238, "epoch": 2745} {"train_loss": -12.707071304321289, "global_step": 461239, "epoch": 2745} {"train_loss": -12.753175735473633, "global_step": 461240, "epoch": 2745} {"train_loss": -12.486024856567383, "global_step": 461241, "epoch": 2745} {"train_loss": -12.554410934448242, "global_step": 461242, "epoch": 2745} {"train_loss": -12.745537757873535, "global_step": 461243, "epoch": 2745} {"train_loss": -12.30340576171875, "global_step": 461244, "epoch": 2745} {"train_loss": -12.8429594039917, "global_step": 461245, "epoch": 2745} {"train_loss": -12.329965591430664, "global_step": 461246, "epoch": 2745} {"train_loss": -12.305441856384277, "global_step": 461247, "epoch": 2745} {"train_loss": -12.547534942626953, "global_step": 461248, "epoch": 2745} {"train_loss": -12.44671630859375, "global_step": 461249, "epoch": 2745} {"train_loss": -12.610518455505371, "global_step": 461250, "epoch": 2745} {"train_loss": -12.616774559020996, "global_step": 461251, "epoch": 2745} {"train_loss": -12.458721160888672, "global_step": 461252, "epoch": 2745} {"train_loss": -12.272041320800781, "global_step": 461253, "epoch": 2745} {"train_loss": -12.583574295043945, "global_step": 461254, "epoch": 2745} {"train_loss": -12.520755767822266, "global_step": 461255, "epoch": 2745} {"train_loss": -12.757033348083496, "global_step": 461256, "epoch": 2745} {"train_loss": -12.37326431274414, "global_step": 461257, "epoch": 2745} {"train_loss": -12.625993728637695, "global_step": 461258, "epoch": 2745} {"train_loss": -12.585921287536621, "global_step": 461259, "epoch": 2745} {"train_loss": -12.516952514648438, "global_step": 461260, "epoch": 2745} {"train_loss": -12.070228576660156, "global_step": 461261, "epoch": 2745} {"train_loss": -12.449052810668945, "global_step": 461262, "epoch": 2745} {"train_loss": -12.614205360412598, "global_step": 461263, "epoch": 2745} {"train_loss": -11.896859169006348, "global_step": 461264, "epoch": 2745} {"train_loss": -11.837373733520508, "global_step": 461265, "epoch": 2745} {"train_loss": -12.71995735168457, "global_step": 461266, "epoch": 2745} {"train_loss": -12.189191818237305, "global_step": 461267, "epoch": 2745} {"train_loss": -12.061681747436523, "global_step": 461268, "epoch": 2745} {"train_loss": -12.442989349365234, "global_step": 461269, "epoch": 2745} {"train_loss": -12.325854301452637, "global_step": 461270, "epoch": 2745} {"train_loss": -12.612003326416016, "global_step": 461271, "epoch": 2745} {"train_loss": -12.442170143127441, "global_step": 461272, "epoch": 2745} {"train_loss": -12.767991065979004, "global_step": 461273, "epoch": 2745} {"train_loss": -12.585580825805664, "global_step": 461274, "epoch": 2745} {"train_loss": -12.712564468383789, "global_step": 461275, "epoch": 2745} {"train_loss": -12.935873985290527, "global_step": 461276, "epoch": 2745} {"train_loss": -12.5872802734375, "global_step": 461277, "epoch": 2745} {"train_loss": -12.398174285888672, "global_step": 461278, "epoch": 2745} {"train_loss": -12.55734920501709, "global_step": 461279, "epoch": 2745} {"train_loss": -12.700787544250488, "global_step": 461280, "epoch": 2745} {"train_loss": -12.547539710998535, "global_step": 461281, "epoch": 2745} {"train_loss": -12.562671661376953, "global_step": 461282, "epoch": 2745} {"train_loss": -12.771440505981445, "global_step": 461283, "epoch": 2745} {"train_loss": -12.643613815307617, "global_step": 461284, "epoch": 2745} {"train_loss": -11.886978149414062, "global_step": 461285, "epoch": 2745} {"train_loss": -11.9239501953125, "global_step": 461286, "epoch": 2745} {"train_loss": -11.962390899658203, "global_step": 461287, "epoch": 2745} {"train_loss": -12.781574249267578, "global_step": 461288, "epoch": 2745} {"train_loss": -12.591046333312988, "global_step": 461289, "epoch": 2745} {"train_loss": -12.535947799682617, "global_step": 461290, "epoch": 2745} {"train_loss": -12.680850982666016, "global_step": 461291, "epoch": 2745} {"train_loss": -12.807589530944824, "global_step": 461292, "epoch": 2745} {"train_loss": -12.371767044067383, "global_step": 461293, "epoch": 2745} {"train_loss": -12.41579818725586, "global_step": 461294, "epoch": 2745} {"train_loss": -12.053311347961426, "global_step": 461295, "epoch": 2745} {"train_loss": -11.978500366210938, "global_step": 461296, "epoch": 2745} {"train_loss": -11.808011054992676, "global_step": 461297, "epoch": 2745} {"train_loss": -12.911553382873535, "global_step": 461298, "epoch": 2745} {"train_loss": -11.976873397827148, "global_step": 461299, "epoch": 2745} {"train_loss": -12.602957725524902, "global_step": 461300, "epoch": 2745} {"train_loss": -12.041218757629395, "global_step": 461301, "epoch": 2745} {"train_loss": -12.270709991455078, "global_step": 461302, "epoch": 2745} {"train_loss": -11.376848220825195, "global_step": 461303, "epoch": 2745} {"train_loss": -12.197265625, "global_step": 461304, "epoch": 2745} {"train_loss": -12.15246868133545, "global_step": 461305, "epoch": 2745} {"train_loss": -11.146291732788086, "global_step": 461306, "epoch": 2745} {"train_loss": -11.250856399536133, "global_step": 461307, "epoch": 2745} {"train_loss": -11.235713005065918, "global_step": 461308, "epoch": 2745} {"train_loss": -11.500073432922363, "global_step": 461309, "epoch": 2745} {"train_loss": -11.647833824157715, "global_step": 461310, "epoch": 2745} {"train_loss": -11.197382926940918, "global_step": 461311, "epoch": 2745} {"train_loss": -10.969842910766602, "global_step": 461312, "epoch": 2745} {"train_loss": -9.980131149291992, "global_step": 461313, "epoch": 2745} {"train_loss": -11.253182411193848, "global_step": 461314, "epoch": 2745} {"train_loss": -10.51921272277832, "global_step": 461315, "epoch": 2745} {"train_loss": -11.454523086547852, "global_step": 461316, "epoch": 2745} {"train_loss": -11.90128231048584, "global_step": 461317, "epoch": 2745} {"train_loss": -11.32365608215332, "global_step": 461318, "epoch": 2745} {"train_loss": -11.693772315979004, "global_step": 461319, "epoch": 2745} {"train_loss": -11.375986099243164, "global_step": 461320, "epoch": 2745} {"train_loss": -12.465394020080566, "global_step": 461321, "epoch": 2745} {"train_loss": -11.216582298278809, "global_step": 461322, "epoch": 2745} {"train_loss": -11.708822250366211, "global_step": 461323, "epoch": 2745} {"train_loss": -11.981132507324219, "global_step": 461324, "epoch": 2745} {"train_loss": -11.423604965209961, "global_step": 461325, "epoch": 2745} {"train_loss": -11.416626930236816, "global_step": 461326, "epoch": 2745} {"train_loss": -11.989419556799389, "global_step": 461327, "epoch": 2745, "val_loss": 314233.96875, "train_action_mse_error": 1.175581932067871} {"train_loss": -12.143141746520996, "global_step": 461328, "epoch": 2746} {"train_loss": -12.329227447509766, "global_step": 461329, "epoch": 2746} {"train_loss": -12.388519287109375, "global_step": 461330, "epoch": 2746} {"train_loss": -11.834205627441406, "global_step": 461331, "epoch": 2746} {"train_loss": -12.378131866455078, "global_step": 461332, "epoch": 2746} {"train_loss": -12.139945983886719, "global_step": 461333, "epoch": 2746} {"train_loss": -12.18425178527832, "global_step": 461334, "epoch": 2746} {"train_loss": -12.360756874084473, "global_step": 461335, "epoch": 2746} {"train_loss": -12.327777862548828, "global_step": 461336, "epoch": 2746} {"train_loss": -12.19057559967041, "global_step": 461337, "epoch": 2746} {"train_loss": -12.411123275756836, "global_step": 461338, "epoch": 2746} {"train_loss": -12.345516204833984, "global_step": 461339, "epoch": 2746} {"train_loss": -12.419239044189453, "global_step": 461340, "epoch": 2746} {"train_loss": -12.224777221679688, "global_step": 461341, "epoch": 2746} {"train_loss": -12.268548011779785, "global_step": 461342, "epoch": 2746} {"train_loss": -12.09463882446289, "global_step": 461343, "epoch": 2746} {"train_loss": -12.25185489654541, "global_step": 461344, "epoch": 2746} {"train_loss": -12.388731002807617, "global_step": 461345, "epoch": 2746} {"train_loss": -12.181485176086426, "global_step": 461346, "epoch": 2746} {"train_loss": -12.368685722351074, "global_step": 461347, "epoch": 2746} {"train_loss": -12.384284019470215, "global_step": 461348, "epoch": 2746} {"train_loss": -12.348974227905273, "global_step": 461349, "epoch": 2746} {"train_loss": -12.38010025024414, "global_step": 461350, "epoch": 2746} {"train_loss": -12.340675354003906, "global_step": 461351, "epoch": 2746} {"train_loss": -12.487081527709961, "global_step": 461352, "epoch": 2746} {"train_loss": -12.420723915100098, "global_step": 461353, "epoch": 2746} {"train_loss": -12.540626525878906, "global_step": 461354, "epoch": 2746} {"train_loss": -12.621103286743164, "global_step": 461355, "epoch": 2746} {"train_loss": -12.621835708618164, "global_step": 461356, "epoch": 2746} {"train_loss": -12.723516464233398, "global_step": 461357, "epoch": 2746} {"train_loss": -12.67768669128418, "global_step": 461358, "epoch": 2746} {"train_loss": -12.492923736572266, "global_step": 461359, "epoch": 2746} {"train_loss": -12.245748519897461, "global_step": 461360, "epoch": 2746} {"train_loss": -12.76083755493164, "global_step": 461361, "epoch": 2746} {"train_loss": -12.436563491821289, "global_step": 461362, "epoch": 2746} {"train_loss": -12.422652244567871, "global_step": 461363, "epoch": 2746} {"train_loss": -12.836703300476074, "global_step": 461364, "epoch": 2746} {"train_loss": -12.531095504760742, "global_step": 461365, "epoch": 2746} {"train_loss": -12.498636245727539, "global_step": 461366, "epoch": 2746} {"train_loss": -12.794729232788086, "global_step": 461367, "epoch": 2746} {"train_loss": -12.563603401184082, "global_step": 461368, "epoch": 2746} {"train_loss": -12.693650245666504, "global_step": 461369, "epoch": 2746} {"train_loss": -12.137575149536133, "global_step": 461370, "epoch": 2746} {"train_loss": -12.084502220153809, "global_step": 461371, "epoch": 2746} {"train_loss": -12.246929168701172, "global_step": 461372, "epoch": 2746} {"train_loss": -12.392905235290527, "global_step": 461373, "epoch": 2746} {"train_loss": -11.802131652832031, "global_step": 461374, "epoch": 2746} {"train_loss": -12.134998321533203, "global_step": 461375, "epoch": 2746} {"train_loss": -12.47114372253418, "global_step": 461376, "epoch": 2746} {"train_loss": -12.176654815673828, "global_step": 461377, "epoch": 2746} {"train_loss": -12.309432983398438, "global_step": 461378, "epoch": 2746} {"train_loss": -12.541629791259766, "global_step": 461379, "epoch": 2746} {"train_loss": -12.241022109985352, "global_step": 461380, "epoch": 2746} {"train_loss": -12.439872741699219, "global_step": 461381, "epoch": 2746} {"train_loss": -12.510786056518555, "global_step": 461382, "epoch": 2746} {"train_loss": -12.311376571655273, "global_step": 461383, "epoch": 2746} {"train_loss": -12.633769035339355, "global_step": 461384, "epoch": 2746} {"train_loss": -12.414606094360352, "global_step": 461385, "epoch": 2746} {"train_loss": -12.570144653320312, "global_step": 461386, "epoch": 2746} {"train_loss": -12.039299011230469, "global_step": 461387, "epoch": 2746} {"train_loss": -12.53898811340332, "global_step": 461388, "epoch": 2746} {"train_loss": -12.325490951538086, "global_step": 461389, "epoch": 2746} {"train_loss": -12.64130973815918, "global_step": 461390, "epoch": 2746} {"train_loss": -12.40986156463623, "global_step": 461391, "epoch": 2746} {"train_loss": -12.114389419555664, "global_step": 461392, "epoch": 2746} {"train_loss": -12.556112289428711, "global_step": 461393, "epoch": 2746} {"train_loss": -12.577207565307617, "global_step": 461394, "epoch": 2746} {"train_loss": -11.650555610656738, "global_step": 461395, "epoch": 2746} {"train_loss": -12.858745574951172, "global_step": 461396, "epoch": 2746} {"train_loss": -11.454132080078125, "global_step": 461397, "epoch": 2746} {"train_loss": -12.189716339111328, "global_step": 461398, "epoch": 2746} {"train_loss": -12.45351791381836, "global_step": 461399, "epoch": 2746} {"train_loss": -10.840970993041992, "global_step": 461400, "epoch": 2746} {"train_loss": -12.764093399047852, "global_step": 461401, "epoch": 2746} {"train_loss": -11.223301887512207, "global_step": 461402, "epoch": 2746} {"train_loss": -12.5706148147583, "global_step": 461403, "epoch": 2746} {"train_loss": -12.202840805053711, "global_step": 461404, "epoch": 2746} {"train_loss": -12.327308654785156, "global_step": 461405, "epoch": 2746} {"train_loss": -12.397090911865234, "global_step": 461406, "epoch": 2746} {"train_loss": -12.398756980895996, "global_step": 461407, "epoch": 2746} {"train_loss": -12.356292724609375, "global_step": 461408, "epoch": 2746} {"train_loss": -12.548264503479004, "global_step": 461409, "epoch": 2746} {"train_loss": -12.223365783691406, "global_step": 461410, "epoch": 2746} {"train_loss": -12.02206802368164, "global_step": 461411, "epoch": 2746} {"train_loss": -12.482991218566895, "global_step": 461412, "epoch": 2746} {"train_loss": -11.82229995727539, "global_step": 461413, "epoch": 2746} {"train_loss": -12.408571243286133, "global_step": 461414, "epoch": 2746} {"train_loss": -12.431175231933594, "global_step": 461415, "epoch": 2746} {"train_loss": -12.444972038269043, "global_step": 461416, "epoch": 2746} {"train_loss": -12.05610179901123, "global_step": 461417, "epoch": 2746} {"train_loss": -12.503133773803711, "global_step": 461418, "epoch": 2746} {"train_loss": -11.984573364257812, "global_step": 461419, "epoch": 2746} {"train_loss": -11.894075393676758, "global_step": 461420, "epoch": 2746} {"train_loss": -12.148473739624023, "global_step": 461421, "epoch": 2746} {"train_loss": -12.17821979522705, "global_step": 461422, "epoch": 2746} {"train_loss": -11.11442756652832, "global_step": 461423, "epoch": 2746} {"train_loss": -12.142244338989258, "global_step": 461424, "epoch": 2746} {"train_loss": -11.99802303314209, "global_step": 461425, "epoch": 2746} {"train_loss": -11.365056991577148, "global_step": 461426, "epoch": 2746} {"train_loss": -12.60706615447998, "global_step": 461427, "epoch": 2746} {"train_loss": -11.270998001098633, "global_step": 461428, "epoch": 2746} {"train_loss": -10.79624080657959, "global_step": 461429, "epoch": 2746} {"train_loss": -11.479631423950195, "global_step": 461430, "epoch": 2746} {"train_loss": -9.174214363098145, "global_step": 461431, "epoch": 2746} {"train_loss": -11.153564453125, "global_step": 461432, "epoch": 2746} {"train_loss": -8.980533599853516, "global_step": 461433, "epoch": 2746} {"train_loss": -9.969690322875977, "global_step": 461434, "epoch": 2746} {"train_loss": -10.865067481994629, "global_step": 461435, "epoch": 2746} {"train_loss": -11.262056350708008, "global_step": 461436, "epoch": 2746} {"train_loss": -10.68539810180664, "global_step": 461437, "epoch": 2746} {"train_loss": -10.552748680114746, "global_step": 461438, "epoch": 2746} {"train_loss": -12.068259239196777, "global_step": 461439, "epoch": 2746} {"train_loss": -10.568620681762695, "global_step": 461440, "epoch": 2746} {"train_loss": -11.180633544921875, "global_step": 461441, "epoch": 2746} {"train_loss": -10.915740013122559, "global_step": 461442, "epoch": 2746} {"train_loss": -10.890740394592285, "global_step": 461443, "epoch": 2746} {"train_loss": -11.847959518432617, "global_step": 461444, "epoch": 2746} {"train_loss": -11.85102653503418, "global_step": 461445, "epoch": 2746} {"train_loss": -11.913318634033203, "global_step": 461446, "epoch": 2746} {"train_loss": -10.98910140991211, "global_step": 461447, "epoch": 2746} {"train_loss": -12.316519737243652, "global_step": 461448, "epoch": 2746} {"train_loss": -11.642738342285156, "global_step": 461449, "epoch": 2746} {"train_loss": -12.20509147644043, "global_step": 461450, "epoch": 2746} {"train_loss": -11.957178115844727, "global_step": 461451, "epoch": 2746} {"train_loss": -12.268574714660645, "global_step": 461452, "epoch": 2746} {"train_loss": -12.074527740478516, "global_step": 461453, "epoch": 2746} {"train_loss": -12.393497467041016, "global_step": 461454, "epoch": 2746} {"train_loss": -12.181985855102539, "global_step": 461455, "epoch": 2746} {"train_loss": -12.256399154663086, "global_step": 461456, "epoch": 2746} {"train_loss": -12.26721477508545, "global_step": 461457, "epoch": 2746} {"train_loss": -12.246932983398438, "global_step": 461458, "epoch": 2746} {"train_loss": -12.566614151000977, "global_step": 461459, "epoch": 2746} {"train_loss": -12.363572120666504, "global_step": 461460, "epoch": 2746} {"train_loss": -12.097339630126953, "global_step": 461461, "epoch": 2746} {"train_loss": -12.197057723999023, "global_step": 461462, "epoch": 2746} {"train_loss": -12.339103698730469, "global_step": 461463, "epoch": 2746} {"train_loss": -12.55571460723877, "global_step": 461464, "epoch": 2746} {"train_loss": -12.274328231811523, "global_step": 461465, "epoch": 2746} {"train_loss": -12.3388671875, "global_step": 461466, "epoch": 2746} {"train_loss": -12.202184677124023, "global_step": 461467, "epoch": 2746} {"train_loss": -12.577411651611328, "global_step": 461468, "epoch": 2746} {"train_loss": -12.064920425415039, "global_step": 461469, "epoch": 2746} {"train_loss": -12.24444580078125, "global_step": 461470, "epoch": 2746} {"train_loss": -12.565978050231934, "global_step": 461471, "epoch": 2746} {"train_loss": -12.138727188110352, "global_step": 461472, "epoch": 2746} {"train_loss": -12.366812705993652, "global_step": 461473, "epoch": 2746} {"train_loss": -12.27593994140625, "global_step": 461474, "epoch": 2746} {"train_loss": -12.442007064819336, "global_step": 461475, "epoch": 2746} {"train_loss": -12.12054443359375, "global_step": 461476, "epoch": 2746} {"train_loss": -12.553606986999512, "global_step": 461477, "epoch": 2746} {"train_loss": -12.24040699005127, "global_step": 461478, "epoch": 2746} {"train_loss": -12.049262046813965, "global_step": 461479, "epoch": 2746} {"train_loss": -12.623443603515625, "global_step": 461480, "epoch": 2746} {"train_loss": -12.121212005615234, "global_step": 461481, "epoch": 2746} {"train_loss": -12.474230766296387, "global_step": 461482, "epoch": 2746} {"train_loss": -12.442626953125, "global_step": 461483, "epoch": 2746} {"train_loss": -12.36695384979248, "global_step": 461484, "epoch": 2746} {"train_loss": -12.809099197387695, "global_step": 461485, "epoch": 2746} {"train_loss": -12.24322509765625, "global_step": 461486, "epoch": 2746} {"train_loss": -12.67564582824707, "global_step": 461487, "epoch": 2746} {"train_loss": -12.321989059448242, "global_step": 461488, "epoch": 2746} {"train_loss": -12.759490013122559, "global_step": 461489, "epoch": 2746} {"train_loss": -12.626575469970703, "global_step": 461490, "epoch": 2746} {"train_loss": -12.632795333862305, "global_step": 461491, "epoch": 2746} {"train_loss": -12.487432479858398, "global_step": 461492, "epoch": 2746} {"train_loss": -12.498376846313477, "global_step": 461493, "epoch": 2746} {"train_loss": -12.401317596435547, "global_step": 461494, "epoch": 2746} {"train_loss": -12.1454865137736, "global_step": 461495, "epoch": 2746, "val_loss": 316931.0} {"train_loss": -12.827144622802734, "global_step": 461496, "epoch": 2747} {"train_loss": -12.396869659423828, "global_step": 461497, "epoch": 2747} {"train_loss": -12.520779609680176, "global_step": 461498, "epoch": 2747} {"train_loss": -12.543028831481934, "global_step": 461499, "epoch": 2747} {"train_loss": -12.611871719360352, "global_step": 461500, "epoch": 2747} {"train_loss": -12.777427673339844, "global_step": 461501, "epoch": 2747} {"train_loss": -12.86958122253418, "global_step": 461502, "epoch": 2747} {"train_loss": -12.360515594482422, "global_step": 461503, "epoch": 2747} {"train_loss": -12.867059707641602, "global_step": 461504, "epoch": 2747} {"train_loss": -12.477404594421387, "global_step": 461505, "epoch": 2747} {"train_loss": -12.168673515319824, "global_step": 461506, "epoch": 2747} {"train_loss": -12.442100524902344, "global_step": 461507, "epoch": 2747} {"train_loss": -12.689382553100586, "global_step": 461508, "epoch": 2747} {"train_loss": -12.65150260925293, "global_step": 461509, "epoch": 2747} {"train_loss": -12.754386901855469, "global_step": 461510, "epoch": 2747} {"train_loss": -12.43889045715332, "global_step": 461511, "epoch": 2747} {"train_loss": -12.756555557250977, "global_step": 461512, "epoch": 2747} {"train_loss": -11.984939575195312, "global_step": 461513, "epoch": 2747} {"train_loss": -11.95224380493164, "global_step": 461514, "epoch": 2747} {"train_loss": -12.162579536437988, "global_step": 461515, "epoch": 2747} {"train_loss": -11.128593444824219, "global_step": 461516, "epoch": 2747} {"train_loss": -12.006482124328613, "global_step": 461517, "epoch": 2747} {"train_loss": -9.507472038269043, "global_step": 461518, "epoch": 2747} {"train_loss": -11.241142272949219, "global_step": 461519, "epoch": 2747} {"train_loss": -9.951041221618652, "global_step": 461520, "epoch": 2747} {"train_loss": -9.190713882446289, "global_step": 461521, "epoch": 2747} {"train_loss": -8.714164733886719, "global_step": 461522, "epoch": 2747} {"train_loss": -8.850214004516602, "global_step": 461523, "epoch": 2747} {"train_loss": -10.192943572998047, "global_step": 461524, "epoch": 2747} {"train_loss": -9.160919189453125, "global_step": 461525, "epoch": 2747} {"train_loss": -10.95012092590332, "global_step": 461526, "epoch": 2747} {"train_loss": -9.86288070678711, "global_step": 461527, "epoch": 2747} {"train_loss": -10.463706016540527, "global_step": 461528, "epoch": 2747} {"train_loss": -10.61280632019043, "global_step": 461529, "epoch": 2747} {"train_loss": -10.177742004394531, "global_step": 461530, "epoch": 2747} {"train_loss": -10.46683406829834, "global_step": 461531, "epoch": 2747} {"train_loss": -9.420994758605957, "global_step": 461532, "epoch": 2747} {"train_loss": -11.023731231689453, "global_step": 461533, "epoch": 2747} {"train_loss": -10.135171890258789, "global_step": 461534, "epoch": 2747} {"train_loss": -10.940958023071289, "global_step": 461535, "epoch": 2747} {"train_loss": -11.088231086730957, "global_step": 461536, "epoch": 2747} {"train_loss": -10.72502613067627, "global_step": 461537, "epoch": 2747} {"train_loss": -10.957942962646484, "global_step": 461538, "epoch": 2747} {"train_loss": -12.296977996826172, "global_step": 461539, "epoch": 2747} {"train_loss": -9.740520477294922, "global_step": 461540, "epoch": 2747} {"train_loss": -11.68270492553711, "global_step": 461541, "epoch": 2747} {"train_loss": -11.463186264038086, "global_step": 461542, "epoch": 2747} {"train_loss": -10.95333480834961, "global_step": 461543, "epoch": 2747} {"train_loss": -12.099021911621094, "global_step": 461544, "epoch": 2747} {"train_loss": -11.492271423339844, "global_step": 461545, "epoch": 2747} {"train_loss": -11.889728546142578, "global_step": 461546, "epoch": 2747} {"train_loss": -11.937346458435059, "global_step": 461547, "epoch": 2747} {"train_loss": -11.783367156982422, "global_step": 461548, "epoch": 2747} {"train_loss": -11.613981246948242, "global_step": 461549, "epoch": 2747} {"train_loss": -11.908323287963867, "global_step": 461550, "epoch": 2747} {"train_loss": -11.94040298461914, "global_step": 461551, "epoch": 2747} {"train_loss": -11.938785552978516, "global_step": 461552, "epoch": 2747} {"train_loss": -12.202001571655273, "global_step": 461553, "epoch": 2747} {"train_loss": -12.090822219848633, "global_step": 461554, "epoch": 2747} {"train_loss": -12.144546508789062, "global_step": 461555, "epoch": 2747} {"train_loss": -12.338144302368164, "global_step": 461556, "epoch": 2747} {"train_loss": -12.217004776000977, "global_step": 461557, "epoch": 2747} {"train_loss": -12.126680374145508, "global_step": 461558, "epoch": 2747} {"train_loss": -12.481943130493164, "global_step": 461559, "epoch": 2747} {"train_loss": -12.497300148010254, "global_step": 461560, "epoch": 2747} {"train_loss": -12.189839363098145, "global_step": 461561, "epoch": 2747} {"train_loss": -12.472209930419922, "global_step": 461562, "epoch": 2747} {"train_loss": -12.354644775390625, "global_step": 461563, "epoch": 2747} {"train_loss": -12.542793273925781, "global_step": 461564, "epoch": 2747} {"train_loss": -12.443021774291992, "global_step": 461565, "epoch": 2747} {"train_loss": -12.623802185058594, "global_step": 461566, "epoch": 2747} {"train_loss": -12.453208923339844, "global_step": 461567, "epoch": 2747} {"train_loss": -12.61376953125, "global_step": 461568, "epoch": 2747} {"train_loss": -12.496330261230469, "global_step": 461569, "epoch": 2747} {"train_loss": -12.406728744506836, "global_step": 461570, "epoch": 2747} {"train_loss": -12.566627502441406, "global_step": 461571, "epoch": 2747} {"train_loss": -12.634563446044922, "global_step": 461572, "epoch": 2747} {"train_loss": -12.502131462097168, "global_step": 461573, "epoch": 2747} {"train_loss": -12.711517333984375, "global_step": 461574, "epoch": 2747} {"train_loss": -12.243602752685547, "global_step": 461575, "epoch": 2747} {"train_loss": -12.458662033081055, "global_step": 461576, "epoch": 2747} {"train_loss": -12.354473114013672, "global_step": 461577, "epoch": 2747} {"train_loss": -12.322155952453613, "global_step": 461578, "epoch": 2747} {"train_loss": -12.652064323425293, "global_step": 461579, "epoch": 2747} {"train_loss": -12.61750316619873, "global_step": 461580, "epoch": 2747} {"train_loss": -12.60295581817627, "global_step": 461581, "epoch": 2747} {"train_loss": -12.924661636352539, "global_step": 461582, "epoch": 2747} {"train_loss": -12.624906539916992, "global_step": 461583, "epoch": 2747} {"train_loss": -12.706120491027832, "global_step": 461584, "epoch": 2747} {"train_loss": -12.814460754394531, "global_step": 461585, "epoch": 2747} {"train_loss": -12.513012886047363, "global_step": 461586, "epoch": 2747} {"train_loss": -12.752259254455566, "global_step": 461587, "epoch": 2747} {"train_loss": -12.560844421386719, "global_step": 461588, "epoch": 2747} {"train_loss": -12.737272262573242, "global_step": 461589, "epoch": 2747} {"train_loss": -12.77842903137207, "global_step": 461590, "epoch": 2747} {"train_loss": -12.365961074829102, "global_step": 461591, "epoch": 2747} {"train_loss": -12.567648887634277, "global_step": 461592, "epoch": 2747} {"train_loss": -12.560811996459961, "global_step": 461593, "epoch": 2747} {"train_loss": -12.096431732177734, "global_step": 461594, "epoch": 2747} {"train_loss": -12.201553344726562, "global_step": 461595, "epoch": 2747} {"train_loss": -11.46670150756836, "global_step": 461596, "epoch": 2747} {"train_loss": -11.71406078338623, "global_step": 461597, "epoch": 2747} {"train_loss": -12.381746292114258, "global_step": 461598, "epoch": 2747} {"train_loss": -11.743773460388184, "global_step": 461599, "epoch": 2747} {"train_loss": -12.545705795288086, "global_step": 461600, "epoch": 2747} {"train_loss": -11.855463027954102, "global_step": 461601, "epoch": 2747} {"train_loss": -12.395837783813477, "global_step": 461602, "epoch": 2747} {"train_loss": -12.176076889038086, "global_step": 461603, "epoch": 2747} {"train_loss": -11.479743957519531, "global_step": 461604, "epoch": 2747} {"train_loss": -12.443208694458008, "global_step": 461605, "epoch": 2747} {"train_loss": -12.171496391296387, "global_step": 461606, "epoch": 2747} {"train_loss": -11.6279296875, "global_step": 461607, "epoch": 2747} {"train_loss": -12.579887390136719, "global_step": 461608, "epoch": 2747} {"train_loss": -11.960954666137695, "global_step": 461609, "epoch": 2747} {"train_loss": -12.465215682983398, "global_step": 461610, "epoch": 2747} {"train_loss": -12.374857902526855, "global_step": 461611, "epoch": 2747} {"train_loss": -12.646841049194336, "global_step": 461612, "epoch": 2747} {"train_loss": -12.349210739135742, "global_step": 461613, "epoch": 2747} {"train_loss": -12.662212371826172, "global_step": 461614, "epoch": 2747} {"train_loss": -12.592999458312988, "global_step": 461615, "epoch": 2747} {"train_loss": -12.36417293548584, "global_step": 461616, "epoch": 2747} {"train_loss": -12.348069190979004, "global_step": 461617, "epoch": 2747} {"train_loss": -12.058547973632812, "global_step": 461618, "epoch": 2747} {"train_loss": -12.79056167602539, "global_step": 461619, "epoch": 2747} {"train_loss": -12.062305450439453, "global_step": 461620, "epoch": 2747} {"train_loss": -12.65512466430664, "global_step": 461621, "epoch": 2747} {"train_loss": -12.374199867248535, "global_step": 461622, "epoch": 2747} {"train_loss": -12.799985885620117, "global_step": 461623, "epoch": 2747} {"train_loss": -12.685026168823242, "global_step": 461624, "epoch": 2747} {"train_loss": -12.41675853729248, "global_step": 461625, "epoch": 2747} {"train_loss": -12.462369918823242, "global_step": 461626, "epoch": 2747} {"train_loss": -12.736772537231445, "global_step": 461627, "epoch": 2747} {"train_loss": -12.67408561706543, "global_step": 461628, "epoch": 2747} {"train_loss": -12.71561336517334, "global_step": 461629, "epoch": 2747} {"train_loss": -12.553964614868164, "global_step": 461630, "epoch": 2747} {"train_loss": -12.979504585266113, "global_step": 461631, "epoch": 2747} {"train_loss": -12.665748596191406, "global_step": 461632, "epoch": 2747} {"train_loss": -12.843538284301758, "global_step": 461633, "epoch": 2747} {"train_loss": -12.592142105102539, "global_step": 461634, "epoch": 2747} {"train_loss": -12.697896957397461, "global_step": 461635, "epoch": 2747} {"train_loss": -12.323554992675781, "global_step": 461636, "epoch": 2747} {"train_loss": -12.314409255981445, "global_step": 461637, "epoch": 2747} {"train_loss": -12.343196868896484, "global_step": 461638, "epoch": 2747} {"train_loss": -12.750526428222656, "global_step": 461639, "epoch": 2747} {"train_loss": -12.079514503479004, "global_step": 461640, "epoch": 2747} {"train_loss": -12.738719940185547, "global_step": 461641, "epoch": 2747} {"train_loss": -12.429279327392578, "global_step": 461642, "epoch": 2747} {"train_loss": -12.401466369628906, "global_step": 461643, "epoch": 2747} {"train_loss": -12.336946487426758, "global_step": 461644, "epoch": 2747} {"train_loss": -12.681421279907227, "global_step": 461645, "epoch": 2747} {"train_loss": -12.75097942352295, "global_step": 461646, "epoch": 2747} {"train_loss": -12.775480270385742, "global_step": 461647, "epoch": 2747} {"train_loss": -12.614336013793945, "global_step": 461648, "epoch": 2747} {"train_loss": -12.612724304199219, "global_step": 461649, "epoch": 2747} {"train_loss": -12.470252990722656, "global_step": 461650, "epoch": 2747} {"train_loss": -12.682435989379883, "global_step": 461651, "epoch": 2747} {"train_loss": -12.753640174865723, "global_step": 461652, "epoch": 2747} {"train_loss": -12.661003112792969, "global_step": 461653, "epoch": 2747} {"train_loss": -12.884615898132324, "global_step": 461654, "epoch": 2747} {"train_loss": -12.820852279663086, "global_step": 461655, "epoch": 2747} {"train_loss": -12.559903144836426, "global_step": 461656, "epoch": 2747} {"train_loss": -12.893370628356934, "global_step": 461657, "epoch": 2747} {"train_loss": -12.531034469604492, "global_step": 461658, "epoch": 2747} {"train_loss": -12.958789825439453, "global_step": 461659, "epoch": 2747} {"train_loss": -12.598583221435547, "global_step": 461660, "epoch": 2747} {"train_loss": -12.611992835998535, "global_step": 461661, "epoch": 2747} {"train_loss": -12.727771759033203, "global_step": 461662, "epoch": 2747} {"train_loss": -12.10895231791905, "global_step": 461663, "epoch": 2747, "val_loss": 313610.09375} {"train_loss": -12.377549171447754, "global_step": 461664, "epoch": 2748} {"train_loss": -12.710389137268066, "global_step": 461665, "epoch": 2748} {"train_loss": -12.716744422912598, "global_step": 461666, "epoch": 2748} {"train_loss": -12.732070922851562, "global_step": 461667, "epoch": 2748} {"train_loss": -13.121663093566895, "global_step": 461668, "epoch": 2748} {"train_loss": -12.870941162109375, "global_step": 461669, "epoch": 2748} {"train_loss": -12.964944839477539, "global_step": 461670, "epoch": 2748} {"train_loss": -12.993228912353516, "global_step": 461671, "epoch": 2748} {"train_loss": -12.507946968078613, "global_step": 461672, "epoch": 2748} {"train_loss": -12.617572784423828, "global_step": 461673, "epoch": 2748} {"train_loss": -12.326166152954102, "global_step": 461674, "epoch": 2748} {"train_loss": -12.577614784240723, "global_step": 461675, "epoch": 2748} {"train_loss": -12.8224458694458, "global_step": 461676, "epoch": 2748} {"train_loss": -12.565855026245117, "global_step": 461677, "epoch": 2748} {"train_loss": -13.001777648925781, "global_step": 461678, "epoch": 2748} {"train_loss": -12.590747833251953, "global_step": 461679, "epoch": 2748} {"train_loss": -12.271455764770508, "global_step": 461680, "epoch": 2748} {"train_loss": -12.271379470825195, "global_step": 461681, "epoch": 2748} {"train_loss": -12.761998176574707, "global_step": 461682, "epoch": 2748} {"train_loss": -11.957328796386719, "global_step": 461683, "epoch": 2748} {"train_loss": -11.935125350952148, "global_step": 461684, "epoch": 2748} {"train_loss": -12.081789016723633, "global_step": 461685, "epoch": 2748} {"train_loss": -11.868986129760742, "global_step": 461686, "epoch": 2748} {"train_loss": -9.963955879211426, "global_step": 461687, "epoch": 2748} {"train_loss": -11.726158142089844, "global_step": 461688, "epoch": 2748} {"train_loss": -11.471090316772461, "global_step": 461689, "epoch": 2748} {"train_loss": -11.692743301391602, "global_step": 461690, "epoch": 2748} {"train_loss": -11.411664009094238, "global_step": 461691, "epoch": 2748} {"train_loss": -11.85533332824707, "global_step": 461692, "epoch": 2748} {"train_loss": -12.315999031066895, "global_step": 461693, "epoch": 2748} {"train_loss": -11.438186645507812, "global_step": 461694, "epoch": 2748} {"train_loss": -12.400252342224121, "global_step": 461695, "epoch": 2748} {"train_loss": -12.059666633605957, "global_step": 461696, "epoch": 2748} {"train_loss": -12.23448657989502, "global_step": 461697, "epoch": 2748} {"train_loss": -12.404645919799805, "global_step": 461698, "epoch": 2748} {"train_loss": -12.3489990234375, "global_step": 461699, "epoch": 2748} {"train_loss": -11.74842643737793, "global_step": 461700, "epoch": 2748} {"train_loss": -11.722281455993652, "global_step": 461701, "epoch": 2748} {"train_loss": -12.222493171691895, "global_step": 461702, "epoch": 2748} {"train_loss": -10.736096382141113, "global_step": 461703, "epoch": 2748} {"train_loss": -11.882962226867676, "global_step": 461704, "epoch": 2748} {"train_loss": -10.964849472045898, "global_step": 461705, "epoch": 2748} {"train_loss": -11.477254867553711, "global_step": 461706, "epoch": 2748} {"train_loss": -11.505712509155273, "global_step": 461707, "epoch": 2748} {"train_loss": -10.760774612426758, "global_step": 461708, "epoch": 2748} {"train_loss": -11.995908737182617, "global_step": 461709, "epoch": 2748} {"train_loss": -10.5064697265625, "global_step": 461710, "epoch": 2748} {"train_loss": -10.867950439453125, "global_step": 461711, "epoch": 2748} {"train_loss": -10.601457595825195, "global_step": 461712, "epoch": 2748} {"train_loss": -9.269947052001953, "global_step": 461713, "epoch": 2748} {"train_loss": -8.318304061889648, "global_step": 461714, "epoch": 2748} {"train_loss": -8.24185562133789, "global_step": 461715, "epoch": 2748} {"train_loss": -8.944477081298828, "global_step": 461716, "epoch": 2748} {"train_loss": -9.070788383483887, "global_step": 461717, "epoch": 2748} {"train_loss": -10.09105110168457, "global_step": 461718, "epoch": 2748} {"train_loss": -8.999381065368652, "global_step": 461719, "epoch": 2748} {"train_loss": -9.568381309509277, "global_step": 461720, "epoch": 2748} {"train_loss": -10.854860305786133, "global_step": 461721, "epoch": 2748} {"train_loss": -9.843809127807617, "global_step": 461722, "epoch": 2748} {"train_loss": -10.508077621459961, "global_step": 461723, "epoch": 2748} {"train_loss": -11.085063934326172, "global_step": 461724, "epoch": 2748} {"train_loss": -10.352909088134766, "global_step": 461725, "epoch": 2748} {"train_loss": -11.454985618591309, "global_step": 461726, "epoch": 2748} {"train_loss": -10.018671035766602, "global_step": 461727, "epoch": 2748} {"train_loss": -11.549360275268555, "global_step": 461728, "epoch": 2748} {"train_loss": -10.397773742675781, "global_step": 461729, "epoch": 2748} {"train_loss": -11.591530799865723, "global_step": 461730, "epoch": 2748} {"train_loss": -10.69975757598877, "global_step": 461731, "epoch": 2748} {"train_loss": -11.340492248535156, "global_step": 461732, "epoch": 2748} {"train_loss": -11.503671646118164, "global_step": 461733, "epoch": 2748} {"train_loss": -11.60778522491455, "global_step": 461734, "epoch": 2748} {"train_loss": -10.70693588256836, "global_step": 461735, "epoch": 2748} {"train_loss": -11.863576889038086, "global_step": 461736, "epoch": 2748} {"train_loss": -11.063688278198242, "global_step": 461737, "epoch": 2748} {"train_loss": -11.49968147277832, "global_step": 461738, "epoch": 2748} {"train_loss": -11.809295654296875, "global_step": 461739, "epoch": 2748} {"train_loss": -11.68326187133789, "global_step": 461740, "epoch": 2748} {"train_loss": -11.555434226989746, "global_step": 461741, "epoch": 2748} {"train_loss": -11.916656494140625, "global_step": 461742, "epoch": 2748} {"train_loss": -11.52924633026123, "global_step": 461743, "epoch": 2748} {"train_loss": -12.245136260986328, "global_step": 461744, "epoch": 2748} {"train_loss": -11.841837882995605, "global_step": 461745, "epoch": 2748} {"train_loss": -12.097193717956543, "global_step": 461746, "epoch": 2748} {"train_loss": -12.268272399902344, "global_step": 461747, "epoch": 2748} {"train_loss": -12.151790618896484, "global_step": 461748, "epoch": 2748} {"train_loss": -12.388394355773926, "global_step": 461749, "epoch": 2748} {"train_loss": -12.185413360595703, "global_step": 461750, "epoch": 2748} {"train_loss": -12.238203048706055, "global_step": 461751, "epoch": 2748} {"train_loss": -12.046741485595703, "global_step": 461752, "epoch": 2748} {"train_loss": -12.496981620788574, "global_step": 461753, "epoch": 2748} {"train_loss": -12.267724990844727, "global_step": 461754, "epoch": 2748} {"train_loss": -12.2135648727417, "global_step": 461755, "epoch": 2748} {"train_loss": -12.12745189666748, "global_step": 461756, "epoch": 2748} {"train_loss": -11.86640453338623, "global_step": 461757, "epoch": 2748} {"train_loss": -12.345975875854492, "global_step": 461758, "epoch": 2748} {"train_loss": -12.159852981567383, "global_step": 461759, "epoch": 2748} {"train_loss": -12.252481460571289, "global_step": 461760, "epoch": 2748} {"train_loss": -11.985122680664062, "global_step": 461761, "epoch": 2748} {"train_loss": -12.552541732788086, "global_step": 461762, "epoch": 2748} {"train_loss": -11.949930191040039, "global_step": 461763, "epoch": 2748} {"train_loss": -12.457819938659668, "global_step": 461764, "epoch": 2748} {"train_loss": -12.178398132324219, "global_step": 461765, "epoch": 2748} {"train_loss": -12.477314949035645, "global_step": 461766, "epoch": 2748} {"train_loss": -11.997598648071289, "global_step": 461767, "epoch": 2748} {"train_loss": -12.597139358520508, "global_step": 461768, "epoch": 2748} {"train_loss": -12.373239517211914, "global_step": 461769, "epoch": 2748} {"train_loss": -12.438800811767578, "global_step": 461770, "epoch": 2748} {"train_loss": -12.179744720458984, "global_step": 461771, "epoch": 2748} {"train_loss": -12.491840362548828, "global_step": 461772, "epoch": 2748} {"train_loss": -12.36690902709961, "global_step": 461773, "epoch": 2748} {"train_loss": -12.594427108764648, "global_step": 461774, "epoch": 2748} {"train_loss": -12.419777870178223, "global_step": 461775, "epoch": 2748} {"train_loss": -12.484081268310547, "global_step": 461776, "epoch": 2748} {"train_loss": -12.46799373626709, "global_step": 461777, "epoch": 2748} {"train_loss": -12.578523635864258, "global_step": 461778, "epoch": 2748} {"train_loss": -12.48337459564209, "global_step": 461779, "epoch": 2748} {"train_loss": -12.339493751525879, "global_step": 461780, "epoch": 2748} {"train_loss": -12.392922401428223, "global_step": 461781, "epoch": 2748} {"train_loss": -12.44028377532959, "global_step": 461782, "epoch": 2748} {"train_loss": -12.666040420532227, "global_step": 461783, "epoch": 2748} {"train_loss": -12.742647171020508, "global_step": 461784, "epoch": 2748} {"train_loss": -12.798532485961914, "global_step": 461785, "epoch": 2748} {"train_loss": -12.709525108337402, "global_step": 461786, "epoch": 2748} {"train_loss": -12.72659683227539, "global_step": 461787, "epoch": 2748} {"train_loss": -12.477044105529785, "global_step": 461788, "epoch": 2748} {"train_loss": -12.49717903137207, "global_step": 461789, "epoch": 2748} {"train_loss": -12.485834121704102, "global_step": 461790, "epoch": 2748} {"train_loss": -12.842016220092773, "global_step": 461791, "epoch": 2748} {"train_loss": -12.548624038696289, "global_step": 461792, "epoch": 2748} {"train_loss": -12.646543502807617, "global_step": 461793, "epoch": 2748} {"train_loss": -12.751792907714844, "global_step": 461794, "epoch": 2748} {"train_loss": -12.668155670166016, "global_step": 461795, "epoch": 2748} {"train_loss": -12.676021575927734, "global_step": 461796, "epoch": 2748} {"train_loss": -12.516866683959961, "global_step": 461797, "epoch": 2748} {"train_loss": -12.565418243408203, "global_step": 461798, "epoch": 2748} {"train_loss": -12.531009674072266, "global_step": 461799, "epoch": 2748} {"train_loss": -12.596290588378906, "global_step": 461800, "epoch": 2748} {"train_loss": -12.491534233093262, "global_step": 461801, "epoch": 2748} {"train_loss": -12.384622573852539, "global_step": 461802, "epoch": 2748} {"train_loss": -11.621560096740723, "global_step": 461803, "epoch": 2748} {"train_loss": -12.233713150024414, "global_step": 461804, "epoch": 2748} {"train_loss": -12.470083236694336, "global_step": 461805, "epoch": 2748} {"train_loss": -11.763345718383789, "global_step": 461806, "epoch": 2748} {"train_loss": -12.56663703918457, "global_step": 461807, "epoch": 2748} {"train_loss": -11.914960861206055, "global_step": 461808, "epoch": 2748} {"train_loss": -10.919227600097656, "global_step": 461809, "epoch": 2748} {"train_loss": -12.526556015014648, "global_step": 461810, "epoch": 2748} {"train_loss": -11.44180679321289, "global_step": 461811, "epoch": 2748} {"train_loss": -11.355844497680664, "global_step": 461812, "epoch": 2748} {"train_loss": -12.047904968261719, "global_step": 461813, "epoch": 2748} {"train_loss": -12.515050888061523, "global_step": 461814, "epoch": 2748} {"train_loss": -11.499316215515137, "global_step": 461815, "epoch": 2748} {"train_loss": -11.958901405334473, "global_step": 461816, "epoch": 2748} {"train_loss": -11.826118469238281, "global_step": 461817, "epoch": 2748} {"train_loss": -12.301603317260742, "global_step": 461818, "epoch": 2748} {"train_loss": -11.790536880493164, "global_step": 461819, "epoch": 2748} {"train_loss": -12.18362808227539, "global_step": 461820, "epoch": 2748} {"train_loss": -11.998711585998535, "global_step": 461821, "epoch": 2748} {"train_loss": -12.604978561401367, "global_step": 461822, "epoch": 2748} {"train_loss": -12.185897827148438, "global_step": 461823, "epoch": 2748} {"train_loss": -12.362415313720703, "global_step": 461824, "epoch": 2748} {"train_loss": -12.286667823791504, "global_step": 461825, "epoch": 2748} {"train_loss": -12.429314613342285, "global_step": 461826, "epoch": 2748} {"train_loss": -12.35405445098877, "global_step": 461827, "epoch": 2748} {"train_loss": -11.891408920288086, "global_step": 461828, "epoch": 2748} {"train_loss": -12.369152069091797, "global_step": 461829, "epoch": 2748} {"train_loss": -11.956476211547852, "global_step": 461830, "epoch": 2748} {"train_loss": -11.900901221093678, "global_step": 461831, "epoch": 2748, "val_loss": 317969.59375} {"train_loss": -12.428277969360352, "global_step": 461832, "epoch": 2749} {"train_loss": -12.137985229492188, "global_step": 461833, "epoch": 2749} {"train_loss": -12.137201309204102, "global_step": 461834, "epoch": 2749} {"train_loss": -12.614127159118652, "global_step": 461835, "epoch": 2749} {"train_loss": -12.493509292602539, "global_step": 461836, "epoch": 2749} {"train_loss": -12.405220031738281, "global_step": 461837, "epoch": 2749} {"train_loss": -12.695886611938477, "global_step": 461838, "epoch": 2749} {"train_loss": -12.419376373291016, "global_step": 461839, "epoch": 2749} {"train_loss": -12.746122360229492, "global_step": 461840, "epoch": 2749} {"train_loss": -12.341936111450195, "global_step": 461841, "epoch": 2749} {"train_loss": -12.51984977722168, "global_step": 461842, "epoch": 2749} {"train_loss": -12.508132934570312, "global_step": 461843, "epoch": 2749} {"train_loss": -12.587984085083008, "global_step": 461844, "epoch": 2749} {"train_loss": -12.728004455566406, "global_step": 461845, "epoch": 2749} {"train_loss": -12.5693359375, "global_step": 461846, "epoch": 2749} {"train_loss": -11.759868621826172, "global_step": 461847, "epoch": 2749} {"train_loss": -11.859063148498535, "global_step": 461848, "epoch": 2749} {"train_loss": -12.421430587768555, "global_step": 461849, "epoch": 2749} {"train_loss": -12.353178977966309, "global_step": 461850, "epoch": 2749} {"train_loss": -12.222392082214355, "global_step": 461851, "epoch": 2749} {"train_loss": -12.64226245880127, "global_step": 461852, "epoch": 2749} {"train_loss": -12.664298057556152, "global_step": 461853, "epoch": 2749} {"train_loss": -12.505143165588379, "global_step": 461854, "epoch": 2749} {"train_loss": -12.83145809173584, "global_step": 461855, "epoch": 2749} {"train_loss": -12.369231224060059, "global_step": 461856, "epoch": 2749} {"train_loss": -12.370414733886719, "global_step": 461857, "epoch": 2749} {"train_loss": -12.303619384765625, "global_step": 461858, "epoch": 2749} {"train_loss": -11.901338577270508, "global_step": 461859, "epoch": 2749} {"train_loss": -12.371417045593262, "global_step": 461860, "epoch": 2749} {"train_loss": -12.356061935424805, "global_step": 461861, "epoch": 2749} {"train_loss": -12.523933410644531, "global_step": 461862, "epoch": 2749} {"train_loss": -12.273630142211914, "global_step": 461863, "epoch": 2749} {"train_loss": -12.74519157409668, "global_step": 461864, "epoch": 2749} {"train_loss": -12.429779052734375, "global_step": 461865, "epoch": 2749} {"train_loss": -12.531538009643555, "global_step": 461866, "epoch": 2749} {"train_loss": -12.561573028564453, "global_step": 461867, "epoch": 2749} {"train_loss": -12.586088180541992, "global_step": 461868, "epoch": 2749} {"train_loss": -12.06582260131836, "global_step": 461869, "epoch": 2749} {"train_loss": -12.426383972167969, "global_step": 461870, "epoch": 2749} {"train_loss": -12.567773818969727, "global_step": 461871, "epoch": 2749} {"train_loss": -12.696475982666016, "global_step": 461872, "epoch": 2749} {"train_loss": -12.614595413208008, "global_step": 461873, "epoch": 2749} {"train_loss": -12.68187427520752, "global_step": 461874, "epoch": 2749} {"train_loss": -12.498661041259766, "global_step": 461875, "epoch": 2749} {"train_loss": -12.428153991699219, "global_step": 461876, "epoch": 2749} {"train_loss": -12.420241355895996, "global_step": 461877, "epoch": 2749} {"train_loss": -12.089662551879883, "global_step": 461878, "epoch": 2749} {"train_loss": -12.481683731079102, "global_step": 461879, "epoch": 2749} {"train_loss": -12.553098678588867, "global_step": 461880, "epoch": 2749} {"train_loss": -11.77234172821045, "global_step": 461881, "epoch": 2749} {"train_loss": -12.179740905761719, "global_step": 461882, "epoch": 2749} {"train_loss": -12.547341346740723, "global_step": 461883, "epoch": 2749} {"train_loss": -12.47981071472168, "global_step": 461884, "epoch": 2749} {"train_loss": -12.202340126037598, "global_step": 461885, "epoch": 2749} {"train_loss": -12.691545486450195, "global_step": 461886, "epoch": 2749} {"train_loss": -12.74521255493164, "global_step": 461887, "epoch": 2749} {"train_loss": -12.667861938476562, "global_step": 461888, "epoch": 2749} {"train_loss": -12.506866455078125, "global_step": 461889, "epoch": 2749} {"train_loss": -12.796388626098633, "global_step": 461890, "epoch": 2749} {"train_loss": -12.678325653076172, "global_step": 461891, "epoch": 2749} {"train_loss": -12.060038566589355, "global_step": 461892, "epoch": 2749} {"train_loss": -12.584301948547363, "global_step": 461893, "epoch": 2749} {"train_loss": -12.792488098144531, "global_step": 461894, "epoch": 2749} {"train_loss": -12.11888313293457, "global_step": 461895, "epoch": 2749} {"train_loss": -12.272940635681152, "global_step": 461896, "epoch": 2749} {"train_loss": -12.127988815307617, "global_step": 461897, "epoch": 2749} {"train_loss": -12.330791473388672, "global_step": 461898, "epoch": 2749} {"train_loss": -10.657516479492188, "global_step": 461899, "epoch": 2749} {"train_loss": -12.578583717346191, "global_step": 461900, "epoch": 2749} {"train_loss": -10.957143783569336, "global_step": 461901, "epoch": 2749} {"train_loss": -11.916634559631348, "global_step": 461902, "epoch": 2749} {"train_loss": -11.345192909240723, "global_step": 461903, "epoch": 2749} {"train_loss": -11.066330909729004, "global_step": 461904, "epoch": 2749} {"train_loss": -11.070720672607422, "global_step": 461905, "epoch": 2749} {"train_loss": -11.923559188842773, "global_step": 461906, "epoch": 2749} {"train_loss": -11.424230575561523, "global_step": 461907, "epoch": 2749} {"train_loss": -11.260000228881836, "global_step": 461908, "epoch": 2749} {"train_loss": -12.359651565551758, "global_step": 461909, "epoch": 2749} {"train_loss": -11.710746765136719, "global_step": 461910, "epoch": 2749} {"train_loss": -12.090728759765625, "global_step": 461911, "epoch": 2749} {"train_loss": -11.725255966186523, "global_step": 461912, "epoch": 2749} {"train_loss": -11.935790061950684, "global_step": 461913, "epoch": 2749} {"train_loss": -12.141115188598633, "global_step": 461914, "epoch": 2749} {"train_loss": -12.010533332824707, "global_step": 461915, "epoch": 2749} {"train_loss": -12.188461303710938, "global_step": 461916, "epoch": 2749} {"train_loss": -12.148992538452148, "global_step": 461917, "epoch": 2749} {"train_loss": -11.202343940734863, "global_step": 461918, "epoch": 2749} {"train_loss": -12.10107707977295, "global_step": 461919, "epoch": 2749} {"train_loss": -12.21235466003418, "global_step": 461920, "epoch": 2749} {"train_loss": -12.588396072387695, "global_step": 461921, "epoch": 2749} {"train_loss": -12.157478332519531, "global_step": 461922, "epoch": 2749} {"train_loss": -12.599823951721191, "global_step": 461923, "epoch": 2749} {"train_loss": -11.972980499267578, "global_step": 461924, "epoch": 2749} {"train_loss": -12.334668159484863, "global_step": 461925, "epoch": 2749} {"train_loss": -11.733349800109863, "global_step": 461926, "epoch": 2749} {"train_loss": -12.307676315307617, "global_step": 461927, "epoch": 2749} {"train_loss": -11.71307373046875, "global_step": 461928, "epoch": 2749} {"train_loss": -12.296469688415527, "global_step": 461929, "epoch": 2749} {"train_loss": -11.755578994750977, "global_step": 461930, "epoch": 2749} {"train_loss": -12.50732135772705, "global_step": 461931, "epoch": 2749} {"train_loss": -12.03782844543457, "global_step": 461932, "epoch": 2749} {"train_loss": -12.20208740234375, "global_step": 461933, "epoch": 2749} {"train_loss": -11.762263298034668, "global_step": 461934, "epoch": 2749} {"train_loss": -12.226608276367188, "global_step": 461935, "epoch": 2749} {"train_loss": -11.57199478149414, "global_step": 461936, "epoch": 2749} {"train_loss": -12.131072998046875, "global_step": 461937, "epoch": 2749} {"train_loss": -11.960546493530273, "global_step": 461938, "epoch": 2749} {"train_loss": -12.047857284545898, "global_step": 461939, "epoch": 2749} {"train_loss": -12.30522346496582, "global_step": 461940, "epoch": 2749} {"train_loss": -12.087913513183594, "global_step": 461941, "epoch": 2749} {"train_loss": -12.35738754272461, "global_step": 461942, "epoch": 2749} {"train_loss": -12.344923973083496, "global_step": 461943, "epoch": 2749} {"train_loss": -12.140625953674316, "global_step": 461944, "epoch": 2749} {"train_loss": -12.525315284729004, "global_step": 461945, "epoch": 2749} {"train_loss": -12.131986618041992, "global_step": 461946, "epoch": 2749} {"train_loss": -12.561102867126465, "global_step": 461947, "epoch": 2749} {"train_loss": -12.295690536499023, "global_step": 461948, "epoch": 2749} {"train_loss": -12.53172492980957, "global_step": 461949, "epoch": 2749} {"train_loss": -12.564273834228516, "global_step": 461950, "epoch": 2749} {"train_loss": -12.537618637084961, "global_step": 461951, "epoch": 2749} {"train_loss": -12.251492500305176, "global_step": 461952, "epoch": 2749} {"train_loss": -12.389914512634277, "global_step": 461953, "epoch": 2749} {"train_loss": -12.046302795410156, "global_step": 461954, "epoch": 2749} {"train_loss": -12.491739273071289, "global_step": 461955, "epoch": 2749} {"train_loss": -12.176586151123047, "global_step": 461956, "epoch": 2749} {"train_loss": -12.237062454223633, "global_step": 461957, "epoch": 2749} {"train_loss": -12.355862617492676, "global_step": 461958, "epoch": 2749} {"train_loss": -12.07929801940918, "global_step": 461959, "epoch": 2749} {"train_loss": -12.430915832519531, "global_step": 461960, "epoch": 2749} {"train_loss": -12.11734390258789, "global_step": 461961, "epoch": 2749} {"train_loss": -12.200716018676758, "global_step": 461962, "epoch": 2749} {"train_loss": -12.214863777160645, "global_step": 461963, "epoch": 2749} {"train_loss": -11.517377853393555, "global_step": 461964, "epoch": 2749} {"train_loss": -12.30632209777832, "global_step": 461965, "epoch": 2749} {"train_loss": -11.659782409667969, "global_step": 461966, "epoch": 2749} {"train_loss": -11.353158950805664, "global_step": 461967, "epoch": 2749} {"train_loss": -12.204328536987305, "global_step": 461968, "epoch": 2749} {"train_loss": -10.642708778381348, "global_step": 461969, "epoch": 2749} {"train_loss": -12.451563835144043, "global_step": 461970, "epoch": 2749} {"train_loss": -11.225364685058594, "global_step": 461971, "epoch": 2749} {"train_loss": -11.004790306091309, "global_step": 461972, "epoch": 2749} {"train_loss": -11.922508239746094, "global_step": 461973, "epoch": 2749} {"train_loss": -10.845476150512695, "global_step": 461974, "epoch": 2749} {"train_loss": -11.754318237304688, "global_step": 461975, "epoch": 2749} {"train_loss": -9.776721954345703, "global_step": 461976, "epoch": 2749} {"train_loss": -11.003349304199219, "global_step": 461977, "epoch": 2749} {"train_loss": -10.103326797485352, "global_step": 461978, "epoch": 2749} {"train_loss": -9.508886337280273, "global_step": 461979, "epoch": 2749} {"train_loss": -9.82774543762207, "global_step": 461980, "epoch": 2749} {"train_loss": -10.789077758789062, "global_step": 461981, "epoch": 2749} {"train_loss": -9.499103546142578, "global_step": 461982, "epoch": 2749} {"train_loss": -10.328827857971191, "global_step": 461983, "epoch": 2749} {"train_loss": -10.758749008178711, "global_step": 461984, "epoch": 2749} {"train_loss": -10.618916511535645, "global_step": 461985, "epoch": 2749} {"train_loss": -9.980606079101562, "global_step": 461986, "epoch": 2749} {"train_loss": -10.565982818603516, "global_step": 461987, "epoch": 2749} {"train_loss": -10.897835731506348, "global_step": 461988, "epoch": 2749} {"train_loss": -10.322835922241211, "global_step": 461989, "epoch": 2749} {"train_loss": -9.596317291259766, "global_step": 461990, "epoch": 2749} {"train_loss": -11.254968643188477, "global_step": 461991, "epoch": 2749} {"train_loss": -10.07234001159668, "global_step": 461992, "epoch": 2749} {"train_loss": -10.422674179077148, "global_step": 461993, "epoch": 2749} {"train_loss": -11.590442657470703, "global_step": 461994, "epoch": 2749} {"train_loss": -11.009645462036133, "global_step": 461995, "epoch": 2749} {"train_loss": -11.184257507324219, "global_step": 461996, "epoch": 2749} {"train_loss": -11.540842056274414, "global_step": 461997, "epoch": 2749} {"train_loss": -10.908380508422852, "global_step": 461998, "epoch": 2749} {"train_loss": -11.952795732588996, "global_step": 461999, "epoch": 2749, "val_loss": 310836.59375} {"train_loss": -11.283685684204102, "global_step": 462000, "epoch": 2750} {"train_loss": -10.903923034667969, "global_step": 462001, "epoch": 2750} {"train_loss": -11.273426055908203, "global_step": 462002, "epoch": 2750} {"train_loss": -11.48872184753418, "global_step": 462003, "epoch": 2750} {"train_loss": -11.264785766601562, "global_step": 462004, "epoch": 2750} {"train_loss": -11.054376602172852, "global_step": 462005, "epoch": 2750} {"train_loss": -11.693950653076172, "global_step": 462006, "epoch": 2750} {"train_loss": -11.169379234313965, "global_step": 462007, "epoch": 2750} {"train_loss": -11.536003112792969, "global_step": 462008, "epoch": 2750} {"train_loss": -11.512134552001953, "global_step": 462009, "epoch": 2750} {"train_loss": -11.790721893310547, "global_step": 462010, "epoch": 2750} {"train_loss": -11.561455726623535, "global_step": 462011, "epoch": 2750} {"train_loss": -11.826915740966797, "global_step": 462012, "epoch": 2750} {"train_loss": -11.490160942077637, "global_step": 462013, "epoch": 2750} {"train_loss": -11.588079452514648, "global_step": 462014, "epoch": 2750} {"train_loss": -11.861152648925781, "global_step": 462015, "epoch": 2750} {"train_loss": -11.356870651245117, "global_step": 462016, "epoch": 2750} {"train_loss": -11.67048454284668, "global_step": 462017, "epoch": 2750} {"train_loss": -12.012601852416992, "global_step": 462018, "epoch": 2750} {"train_loss": -11.663030624389648, "global_step": 462019, "epoch": 2750} {"train_loss": -12.214003562927246, "global_step": 462020, "epoch": 2750} {"train_loss": -11.97951889038086, "global_step": 462021, "epoch": 2750} {"train_loss": -11.747596740722656, "global_step": 462022, "epoch": 2750} {"train_loss": -12.251253128051758, "global_step": 462023, "epoch": 2750} {"train_loss": -11.953880310058594, "global_step": 462024, "epoch": 2750} {"train_loss": -11.826614379882812, "global_step": 462025, "epoch": 2750} {"train_loss": -12.391365051269531, "global_step": 462026, "epoch": 2750} {"train_loss": -11.455208778381348, "global_step": 462027, "epoch": 2750} {"train_loss": -12.076536178588867, "global_step": 462028, "epoch": 2750} {"train_loss": -12.218086242675781, "global_step": 462029, "epoch": 2750} {"train_loss": -11.729787826538086, "global_step": 462030, "epoch": 2750} {"train_loss": -12.287264823913574, "global_step": 462031, "epoch": 2750} {"train_loss": -12.370244979858398, "global_step": 462032, "epoch": 2750} {"train_loss": -12.013936996459961, "global_step": 462033, "epoch": 2750} {"train_loss": -12.376709938049316, "global_step": 462034, "epoch": 2750} {"train_loss": -12.28310489654541, "global_step": 462035, "epoch": 2750} {"train_loss": -12.005701065063477, "global_step": 462036, "epoch": 2750} {"train_loss": -12.411508560180664, "global_step": 462037, "epoch": 2750} {"train_loss": -12.398783683776855, "global_step": 462038, "epoch": 2750} {"train_loss": -12.125080108642578, "global_step": 462039, "epoch": 2750} {"train_loss": -12.316667556762695, "global_step": 462040, "epoch": 2750} {"train_loss": -12.493488311767578, "global_step": 462041, "epoch": 2750} {"train_loss": -12.140962600708008, "global_step": 462042, "epoch": 2750} {"train_loss": -12.349502563476562, "global_step": 462043, "epoch": 2750} {"train_loss": -12.423383712768555, "global_step": 462044, "epoch": 2750} {"train_loss": -12.395240783691406, "global_step": 462045, "epoch": 2750} {"train_loss": -12.436457633972168, "global_step": 462046, "epoch": 2750} {"train_loss": -12.450587272644043, "global_step": 462047, "epoch": 2750} {"train_loss": -12.625350952148438, "global_step": 462048, "epoch": 2750} {"train_loss": -12.390501022338867, "global_step": 462049, "epoch": 2750} {"train_loss": -12.741472244262695, "global_step": 462050, "epoch": 2750} {"train_loss": -12.69572639465332, "global_step": 462051, "epoch": 2750} {"train_loss": -12.12632942199707, "global_step": 462052, "epoch": 2750} {"train_loss": -12.48921012878418, "global_step": 462053, "epoch": 2750} {"train_loss": -12.403157234191895, "global_step": 462054, "epoch": 2750} {"train_loss": -12.543664932250977, "global_step": 462055, "epoch": 2750} {"train_loss": -12.312362670898438, "global_step": 462056, "epoch": 2750} {"train_loss": -12.261241912841797, "global_step": 462057, "epoch": 2750} {"train_loss": -12.524044036865234, "global_step": 462058, "epoch": 2750} {"train_loss": -12.21685791015625, "global_step": 462059, "epoch": 2750} {"train_loss": -12.387222290039062, "global_step": 462060, "epoch": 2750} {"train_loss": -11.642507553100586, "global_step": 462061, "epoch": 2750} {"train_loss": -12.542818069458008, "global_step": 462062, "epoch": 2750} {"train_loss": -11.673194885253906, "global_step": 462063, "epoch": 2750} {"train_loss": -12.543264389038086, "global_step": 462064, "epoch": 2750} {"train_loss": -11.948921203613281, "global_step": 462065, "epoch": 2750} {"train_loss": -12.147404670715332, "global_step": 462066, "epoch": 2750} {"train_loss": -12.725900650024414, "global_step": 462067, "epoch": 2750} {"train_loss": -12.237710952758789, "global_step": 462068, "epoch": 2750} {"train_loss": -12.56576919555664, "global_step": 462069, "epoch": 2750} {"train_loss": -11.954431533813477, "global_step": 462070, "epoch": 2750} {"train_loss": -12.362419128417969, "global_step": 462071, "epoch": 2750} {"train_loss": -12.215856552124023, "global_step": 462072, "epoch": 2750} {"train_loss": -12.523656845092773, "global_step": 462073, "epoch": 2750} {"train_loss": -12.235420227050781, "global_step": 462074, "epoch": 2750} {"train_loss": -12.597637176513672, "global_step": 462075, "epoch": 2750} {"train_loss": -12.653124809265137, "global_step": 462076, "epoch": 2750} {"train_loss": -12.69961929321289, "global_step": 462077, "epoch": 2750} {"train_loss": -12.495871543884277, "global_step": 462078, "epoch": 2750} {"train_loss": -12.539189338684082, "global_step": 462079, "epoch": 2750} {"train_loss": -12.281376838684082, "global_step": 462080, "epoch": 2750} {"train_loss": -12.560843467712402, "global_step": 462081, "epoch": 2750} {"train_loss": -12.682840347290039, "global_step": 462082, "epoch": 2750} {"train_loss": -12.39804458618164, "global_step": 462083, "epoch": 2750} {"train_loss": -12.645844459533691, "global_step": 462084, "epoch": 2750} {"train_loss": -12.508551597595215, "global_step": 462085, "epoch": 2750} {"train_loss": -12.499917984008789, "global_step": 462086, "epoch": 2750} {"train_loss": -12.58481216430664, "global_step": 462087, "epoch": 2750} {"train_loss": -12.357051849365234, "global_step": 462088, "epoch": 2750} {"train_loss": -12.50687026977539, "global_step": 462089, "epoch": 2750} {"train_loss": -12.559690475463867, "global_step": 462090, "epoch": 2750} {"train_loss": -12.642627716064453, "global_step": 462091, "epoch": 2750} {"train_loss": -12.464860916137695, "global_step": 462092, "epoch": 2750} {"train_loss": -12.408197402954102, "global_step": 462093, "epoch": 2750} {"train_loss": -12.366217613220215, "global_step": 462094, "epoch": 2750} {"train_loss": -12.560041427612305, "global_step": 462095, "epoch": 2750} {"train_loss": -12.236167907714844, "global_step": 462096, "epoch": 2750} {"train_loss": -12.445722579956055, "global_step": 462097, "epoch": 2750} {"train_loss": -12.4674072265625, "global_step": 462098, "epoch": 2750} {"train_loss": -12.494000434875488, "global_step": 462099, "epoch": 2750} {"train_loss": -12.485322952270508, "global_step": 462100, "epoch": 2750} {"train_loss": -12.361438751220703, "global_step": 462101, "epoch": 2750} {"train_loss": -12.529783248901367, "global_step": 462102, "epoch": 2750} {"train_loss": -12.360395431518555, "global_step": 462103, "epoch": 2750} {"train_loss": -12.042596817016602, "global_step": 462104, "epoch": 2750} {"train_loss": -12.82149600982666, "global_step": 462105, "epoch": 2750} {"train_loss": -11.771599769592285, "global_step": 462106, "epoch": 2750} {"train_loss": -12.201234817504883, "global_step": 462107, "epoch": 2750} {"train_loss": -12.214239120483398, "global_step": 462108, "epoch": 2750} {"train_loss": -11.956205368041992, "global_step": 462109, "epoch": 2750} {"train_loss": -10.774612426757812, "global_step": 462110, "epoch": 2750} {"train_loss": -12.51020622253418, "global_step": 462111, "epoch": 2750} {"train_loss": -11.85310173034668, "global_step": 462112, "epoch": 2750} {"train_loss": -12.168076515197754, "global_step": 462113, "epoch": 2750} {"train_loss": -12.058122634887695, "global_step": 462114, "epoch": 2750} {"train_loss": -11.914918899536133, "global_step": 462115, "epoch": 2750} {"train_loss": -12.079610824584961, "global_step": 462116, "epoch": 2750} {"train_loss": -12.482168197631836, "global_step": 462117, "epoch": 2750} {"train_loss": -12.230238914489746, "global_step": 462118, "epoch": 2750} {"train_loss": -12.433621406555176, "global_step": 462119, "epoch": 2750} {"train_loss": -12.36579704284668, "global_step": 462120, "epoch": 2750} {"train_loss": -12.243789672851562, "global_step": 462121, "epoch": 2750} {"train_loss": -12.348943710327148, "global_step": 462122, "epoch": 2750} {"train_loss": -12.228242874145508, "global_step": 462123, "epoch": 2750} {"train_loss": -12.50616455078125, "global_step": 462124, "epoch": 2750} {"train_loss": -12.501588821411133, "global_step": 462125, "epoch": 2750} {"train_loss": -12.37606143951416, "global_step": 462126, "epoch": 2750} {"train_loss": -11.816347122192383, "global_step": 462127, "epoch": 2750} {"train_loss": -11.574483871459961, "global_step": 462128, "epoch": 2750} {"train_loss": -12.458057403564453, "global_step": 462129, "epoch": 2750} {"train_loss": -11.29941463470459, "global_step": 462130, "epoch": 2750} {"train_loss": -12.244691848754883, "global_step": 462131, "epoch": 2750} {"train_loss": -12.009428024291992, "global_step": 462132, "epoch": 2750} {"train_loss": -9.46030044555664, "global_step": 462133, "epoch": 2750} {"train_loss": -12.292878150939941, "global_step": 462134, "epoch": 2750} {"train_loss": -10.76219654083252, "global_step": 462135, "epoch": 2750} {"train_loss": -10.904769897460938, "global_step": 462136, "epoch": 2750} {"train_loss": -11.66608715057373, "global_step": 462137, "epoch": 2750} {"train_loss": -11.144495010375977, "global_step": 462138, "epoch": 2750} {"train_loss": -11.188334465026855, "global_step": 462139, "epoch": 2750} {"train_loss": -11.583819389343262, "global_step": 462140, "epoch": 2750} {"train_loss": -11.996991157531738, "global_step": 462141, "epoch": 2750} {"train_loss": -11.646272659301758, "global_step": 462142, "epoch": 2750} {"train_loss": -12.022100448608398, "global_step": 462143, "epoch": 2750} {"train_loss": -12.104269981384277, "global_step": 462144, "epoch": 2750} {"train_loss": -11.713752746582031, "global_step": 462145, "epoch": 2750} {"train_loss": -12.031221389770508, "global_step": 462146, "epoch": 2750} {"train_loss": -11.335577011108398, "global_step": 462147, "epoch": 2750} {"train_loss": -12.296453475952148, "global_step": 462148, "epoch": 2750} {"train_loss": -11.908538818359375, "global_step": 462149, "epoch": 2750} {"train_loss": -12.03250503540039, "global_step": 462150, "epoch": 2750} {"train_loss": -12.046034812927246, "global_step": 462151, "epoch": 2750} {"train_loss": -12.074342727661133, "global_step": 462152, "epoch": 2750} {"train_loss": -12.585071563720703, "global_step": 462153, "epoch": 2750} {"train_loss": -12.01036262512207, "global_step": 462154, "epoch": 2750} {"train_loss": -11.788795471191406, "global_step": 462155, "epoch": 2750} {"train_loss": -12.071675300598145, "global_step": 462156, "epoch": 2750} {"train_loss": -12.227783203125, "global_step": 462157, "epoch": 2750} {"train_loss": -12.228649139404297, "global_step": 462158, "epoch": 2750} {"train_loss": -12.456562042236328, "global_step": 462159, "epoch": 2750} {"train_loss": -12.405359268188477, "global_step": 462160, "epoch": 2750} {"train_loss": -12.406946182250977, "global_step": 462161, "epoch": 2750} {"train_loss": -12.255105018615723, "global_step": 462162, "epoch": 2750} {"train_loss": -12.354092597961426, "global_step": 462163, "epoch": 2750} {"train_loss": -12.431941986083984, "global_step": 462164, "epoch": 2750} {"train_loss": -12.440218925476074, "global_step": 462165, "epoch": 2750} {"train_loss": -12.360831260681152, "global_step": 462166, "epoch": 2750} {"train_loss": -12.111013043494452, "global_step": 462167, "epoch": 2750, "train/sim_max_reward_0": 0.982900464071351, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.0014233853938151004, "train/sim_max_reward_3": 0.9508088231307725, "train/sim_max_reward_4": 0.9433797142012587, "train/sim_max_reward_5": 0.5890004733397135, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.3696759703830264, "test/sim_max_reward_4400002": 0.18481550674586553, "test/sim_max_reward_4400003": 0.5795619575110226, "test/sim_max_reward_4400004": 0.47496653648130766, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 0.9818107122973485, "test/sim_max_reward_4400007": 0.7101267742183004, "test/sim_max_reward_4400008": 0.6054149027788731, "test/sim_max_reward_4400009": 0.3895080024634373, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.27272288167786346, "test/sim_max_reward_4400012": 0.14110722128947978, "test/sim_max_reward_4400013": 0.8315376909686364, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 0.001733107399104781, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.973160535815228, "test/sim_max_reward_4400019": 0.4054768061327317, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.6541053326074454, "test/sim_max_reward_4400022": 0.9971790781896355, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.9753522962044425, "test/sim_max_reward_4400025": 0.7275221821288649, "test/sim_max_reward_4400026": 0.4120621834597376, "test/sim_max_reward_4400027": 0.43434573702256574, "test/sim_max_reward_4400028": 0.7085181758988792, "test/sim_max_reward_4400029": 0.440138996014243, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.983287566186438, "test/sim_max_reward_4400032": 0.1601803892806574, "test/sim_max_reward_4400033": 0.6888513178920735, "test/sim_max_reward_4400034": 0.5171089471876582, "test/sim_max_reward_4400035": 0.8849719766791061, "test/sim_max_reward_4400036": 0.36591755486405597, "test/sim_max_reward_4400037": 0.961129563287064, "test/sim_max_reward_4400038": 0.9605708338544902, "test/sim_max_reward_4400039": 0.968114366861438, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.15733761443141228, "test/sim_max_reward_4400042": 1.0, "test/sim_max_reward_4400043": 1.0, "test/sim_max_reward_4400044": 0.0818106567058431, "test/sim_max_reward_4400045": 0.9760554196097869, "test/sim_max_reward_4400046": 0.31509392986014034, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.744585476689485, "test/mean_score": 0.5480181492282993, "val_loss": 316204.40625, "train_action_mse_error": 1.2692079544067383} {"train_loss": -12.378447532653809, "global_step": 462168, "epoch": 2751} {"train_loss": -12.45250129699707, "global_step": 462169, "epoch": 2751} {"train_loss": -12.507450103759766, "global_step": 462170, "epoch": 2751} {"train_loss": -12.043342590332031, "global_step": 462171, "epoch": 2751} {"train_loss": -12.686393737792969, "global_step": 462172, "epoch": 2751} {"train_loss": -12.436668395996094, "global_step": 462173, "epoch": 2751} {"train_loss": -12.48891830444336, "global_step": 462174, "epoch": 2751} {"train_loss": -12.338518142700195, "global_step": 462175, "epoch": 2751} {"train_loss": -12.36417293548584, "global_step": 462176, "epoch": 2751} {"train_loss": -12.616962432861328, "global_step": 462177, "epoch": 2751} {"train_loss": -12.3469820022583, "global_step": 462178, "epoch": 2751} {"train_loss": -12.703400611877441, "global_step": 462179, "epoch": 2751} {"train_loss": -12.771613121032715, "global_step": 462180, "epoch": 2751} {"train_loss": -12.703165054321289, "global_step": 462181, "epoch": 2751} {"train_loss": -12.560463905334473, "global_step": 462182, "epoch": 2751} {"train_loss": -12.602591514587402, "global_step": 462183, "epoch": 2751} {"train_loss": -12.803910255432129, "global_step": 462184, "epoch": 2751} {"train_loss": -12.594578742980957, "global_step": 462185, "epoch": 2751} {"train_loss": -12.942729949951172, "global_step": 462186, "epoch": 2751} {"train_loss": -12.932393074035645, "global_step": 462187, "epoch": 2751} {"train_loss": -12.647146224975586, "global_step": 462188, "epoch": 2751} {"train_loss": -12.707246780395508, "global_step": 462189, "epoch": 2751} {"train_loss": -12.676457405090332, "global_step": 462190, "epoch": 2751} {"train_loss": -12.7371187210083, "global_step": 462191, "epoch": 2751} {"train_loss": -12.689664840698242, "global_step": 462192, "epoch": 2751} {"train_loss": -12.680641174316406, "global_step": 462193, "epoch": 2751} {"train_loss": -12.685455322265625, "global_step": 462194, "epoch": 2751} {"train_loss": -12.971067428588867, "global_step": 462195, "epoch": 2751} {"train_loss": -12.753978729248047, "global_step": 462196, "epoch": 2751} {"train_loss": -12.666019439697266, "global_step": 462197, "epoch": 2751} {"train_loss": -12.692185401916504, "global_step": 462198, "epoch": 2751} {"train_loss": -12.804295539855957, "global_step": 462199, "epoch": 2751} {"train_loss": -12.704660415649414, "global_step": 462200, "epoch": 2751} {"train_loss": -12.775686264038086, "global_step": 462201, "epoch": 2751} {"train_loss": -12.720491409301758, "global_step": 462202, "epoch": 2751} {"train_loss": -12.593931198120117, "global_step": 462203, "epoch": 2751} {"train_loss": -12.637054443359375, "global_step": 462204, "epoch": 2751} {"train_loss": -12.828882217407227, "global_step": 462205, "epoch": 2751} {"train_loss": -12.607059478759766, "global_step": 462206, "epoch": 2751} {"train_loss": -12.792625427246094, "global_step": 462207, "epoch": 2751} {"train_loss": -12.78754997253418, "global_step": 462208, "epoch": 2751} {"train_loss": -12.530387878417969, "global_step": 462209, "epoch": 2751} {"train_loss": -12.727352142333984, "global_step": 462210, "epoch": 2751} {"train_loss": -12.928825378417969, "global_step": 462211, "epoch": 2751} {"train_loss": -12.514738082885742, "global_step": 462212, "epoch": 2751} {"train_loss": -12.682369232177734, "global_step": 462213, "epoch": 2751} {"train_loss": -12.545055389404297, "global_step": 462214, "epoch": 2751} {"train_loss": -12.76416301727295, "global_step": 462215, "epoch": 2751} {"train_loss": -12.800907135009766, "global_step": 462216, "epoch": 2751} {"train_loss": -12.894670486450195, "global_step": 462217, "epoch": 2751} {"train_loss": -12.574101448059082, "global_step": 462218, "epoch": 2751} {"train_loss": -12.296485900878906, "global_step": 462219, "epoch": 2751} {"train_loss": -12.391729354858398, "global_step": 462220, "epoch": 2751} {"train_loss": -11.665489196777344, "global_step": 462221, "epoch": 2751} {"train_loss": -12.472006797790527, "global_step": 462222, "epoch": 2751} {"train_loss": -12.620591163635254, "global_step": 462223, "epoch": 2751} {"train_loss": -12.768774032592773, "global_step": 462224, "epoch": 2751} {"train_loss": -12.807912826538086, "global_step": 462225, "epoch": 2751} {"train_loss": -12.340356826782227, "global_step": 462226, "epoch": 2751} {"train_loss": -12.72605037689209, "global_step": 462227, "epoch": 2751} {"train_loss": -12.807108879089355, "global_step": 462228, "epoch": 2751} {"train_loss": -12.346449851989746, "global_step": 462229, "epoch": 2751} {"train_loss": -12.526678085327148, "global_step": 462230, "epoch": 2751} {"train_loss": -12.477436065673828, "global_step": 462231, "epoch": 2751} {"train_loss": -12.39955997467041, "global_step": 462232, "epoch": 2751} {"train_loss": -12.336897850036621, "global_step": 462233, "epoch": 2751} {"train_loss": -12.590730667114258, "global_step": 462234, "epoch": 2751} {"train_loss": -12.135703086853027, "global_step": 462235, "epoch": 2751} {"train_loss": -12.162172317504883, "global_step": 462236, "epoch": 2751} {"train_loss": -12.684202194213867, "global_step": 462237, "epoch": 2751} {"train_loss": -12.382905960083008, "global_step": 462238, "epoch": 2751} {"train_loss": -11.830551147460938, "global_step": 462239, "epoch": 2751} {"train_loss": -12.569177627563477, "global_step": 462240, "epoch": 2751} {"train_loss": -12.477460861206055, "global_step": 462241, "epoch": 2751} {"train_loss": -11.722799301147461, "global_step": 462242, "epoch": 2751} {"train_loss": -12.242923736572266, "global_step": 462243, "epoch": 2751} {"train_loss": -12.83770751953125, "global_step": 462244, "epoch": 2751} {"train_loss": -12.116860389709473, "global_step": 462245, "epoch": 2751} {"train_loss": -11.744314193725586, "global_step": 462246, "epoch": 2751} {"train_loss": -12.220519065856934, "global_step": 462247, "epoch": 2751} {"train_loss": -12.598682403564453, "global_step": 462248, "epoch": 2751} {"train_loss": -12.40037727355957, "global_step": 462249, "epoch": 2751} {"train_loss": -12.085183143615723, "global_step": 462250, "epoch": 2751} {"train_loss": -12.23924732208252, "global_step": 462251, "epoch": 2751} {"train_loss": -11.732095718383789, "global_step": 462252, "epoch": 2751} {"train_loss": -11.859518051147461, "global_step": 462253, "epoch": 2751} {"train_loss": -12.273125648498535, "global_step": 462254, "epoch": 2751} {"train_loss": -10.874058723449707, "global_step": 462255, "epoch": 2751} {"train_loss": -10.16463565826416, "global_step": 462256, "epoch": 2751} {"train_loss": -10.805770874023438, "global_step": 462257, "epoch": 2751} {"train_loss": -12.22578239440918, "global_step": 462258, "epoch": 2751} {"train_loss": -10.384809494018555, "global_step": 462259, "epoch": 2751} {"train_loss": -10.94019603729248, "global_step": 462260, "epoch": 2751} {"train_loss": -11.736221313476562, "global_step": 462261, "epoch": 2751} {"train_loss": -11.522272109985352, "global_step": 462262, "epoch": 2751} {"train_loss": -11.333196640014648, "global_step": 462263, "epoch": 2751} {"train_loss": -12.133684158325195, "global_step": 462264, "epoch": 2751} {"train_loss": -11.801488876342773, "global_step": 462265, "epoch": 2751} {"train_loss": -11.471647262573242, "global_step": 462266, "epoch": 2751} {"train_loss": -12.133987426757812, "global_step": 462267, "epoch": 2751} {"train_loss": -11.719080924987793, "global_step": 462268, "epoch": 2751} {"train_loss": -12.578577995300293, "global_step": 462269, "epoch": 2751} {"train_loss": -11.661821365356445, "global_step": 462270, "epoch": 2751} {"train_loss": -12.462237358093262, "global_step": 462271, "epoch": 2751} {"train_loss": -12.127041816711426, "global_step": 462272, "epoch": 2751} {"train_loss": -11.74775218963623, "global_step": 462273, "epoch": 2751} {"train_loss": -12.384076118469238, "global_step": 462274, "epoch": 2751} {"train_loss": -12.242703437805176, "global_step": 462275, "epoch": 2751} {"train_loss": -12.420217514038086, "global_step": 462276, "epoch": 2751} {"train_loss": -12.767295837402344, "global_step": 462277, "epoch": 2751} {"train_loss": -12.302772521972656, "global_step": 462278, "epoch": 2751} {"train_loss": -12.508293151855469, "global_step": 462279, "epoch": 2751} {"train_loss": -12.518743515014648, "global_step": 462280, "epoch": 2751} {"train_loss": -12.713689804077148, "global_step": 462281, "epoch": 2751} {"train_loss": -12.324626922607422, "global_step": 462282, "epoch": 2751} {"train_loss": -12.408636093139648, "global_step": 462283, "epoch": 2751} {"train_loss": -12.465445518493652, "global_step": 462284, "epoch": 2751} {"train_loss": -12.54458236694336, "global_step": 462285, "epoch": 2751} {"train_loss": -12.461305618286133, "global_step": 462286, "epoch": 2751} {"train_loss": -12.333992958068848, "global_step": 462287, "epoch": 2751} {"train_loss": -12.471714973449707, "global_step": 462288, "epoch": 2751} {"train_loss": -12.60573673248291, "global_step": 462289, "epoch": 2751} {"train_loss": -12.18638801574707, "global_step": 462290, "epoch": 2751} {"train_loss": -12.829904556274414, "global_step": 462291, "epoch": 2751} {"train_loss": -12.197675704956055, "global_step": 462292, "epoch": 2751} {"train_loss": -11.904047966003418, "global_step": 462293, "epoch": 2751} {"train_loss": -12.673524856567383, "global_step": 462294, "epoch": 2751} {"train_loss": -12.668519020080566, "global_step": 462295, "epoch": 2751} {"train_loss": -12.440587043762207, "global_step": 462296, "epoch": 2751} {"train_loss": -12.623332023620605, "global_step": 462297, "epoch": 2751} {"train_loss": -12.909749984741211, "global_step": 462298, "epoch": 2751} {"train_loss": -12.583385467529297, "global_step": 462299, "epoch": 2751} {"train_loss": -12.504866600036621, "global_step": 462300, "epoch": 2751} {"train_loss": -12.582386016845703, "global_step": 462301, "epoch": 2751} {"train_loss": -12.730449676513672, "global_step": 462302, "epoch": 2751} {"train_loss": -12.774900436401367, "global_step": 462303, "epoch": 2751} {"train_loss": -12.507331848144531, "global_step": 462304, "epoch": 2751} {"train_loss": -12.990326881408691, "global_step": 462305, "epoch": 2751} {"train_loss": -12.239749908447266, "global_step": 462306, "epoch": 2751} {"train_loss": -12.687128067016602, "global_step": 462307, "epoch": 2751} {"train_loss": -12.68034839630127, "global_step": 462308, "epoch": 2751} {"train_loss": -12.769481658935547, "global_step": 462309, "epoch": 2751} {"train_loss": -12.526643753051758, "global_step": 462310, "epoch": 2751} {"train_loss": -12.532697677612305, "global_step": 462311, "epoch": 2751} {"train_loss": -12.690879821777344, "global_step": 462312, "epoch": 2751} {"train_loss": -12.574631690979004, "global_step": 462313, "epoch": 2751} {"train_loss": -12.187629699707031, "global_step": 462314, "epoch": 2751} {"train_loss": -12.5189847946167, "global_step": 462315, "epoch": 2751} {"train_loss": -12.431192398071289, "global_step": 462316, "epoch": 2751} {"train_loss": -12.731197357177734, "global_step": 462317, "epoch": 2751} {"train_loss": -13.039482116699219, "global_step": 462318, "epoch": 2751} {"train_loss": -12.66473388671875, "global_step": 462319, "epoch": 2751} {"train_loss": -12.838302612304688, "global_step": 462320, "epoch": 2751} {"train_loss": -12.575560569763184, "global_step": 462321, "epoch": 2751} {"train_loss": -12.809036254882812, "global_step": 462322, "epoch": 2751} {"train_loss": -12.634873390197754, "global_step": 462323, "epoch": 2751} {"train_loss": -12.76646614074707, "global_step": 462324, "epoch": 2751} {"train_loss": -12.838242530822754, "global_step": 462325, "epoch": 2751} {"train_loss": -12.7329740524292, "global_step": 462326, "epoch": 2751} {"train_loss": -12.85867977142334, "global_step": 462327, "epoch": 2751} {"train_loss": -12.408509254455566, "global_step": 462328, "epoch": 2751} {"train_loss": -12.066638946533203, "global_step": 462329, "epoch": 2751} {"train_loss": -12.068317413330078, "global_step": 462330, "epoch": 2751} {"train_loss": -12.369073867797852, "global_step": 462331, "epoch": 2751} {"train_loss": -12.323372840881348, "global_step": 462332, "epoch": 2751} {"train_loss": -12.835960388183594, "global_step": 462333, "epoch": 2751} {"train_loss": -12.757312774658203, "global_step": 462334, "epoch": 2751} {"train_loss": -12.420969071842375, "global_step": 462335, "epoch": 2751, "val_loss": 317496.59375} {"train_loss": -12.72835636138916, "global_step": 462336, "epoch": 2752} {"train_loss": -12.003803253173828, "global_step": 462337, "epoch": 2752} {"train_loss": -11.951640129089355, "global_step": 462338, "epoch": 2752} {"train_loss": -11.641729354858398, "global_step": 462339, "epoch": 2752} {"train_loss": -12.063236236572266, "global_step": 462340, "epoch": 2752} {"train_loss": -12.555946350097656, "global_step": 462341, "epoch": 2752} {"train_loss": -12.012699127197266, "global_step": 462342, "epoch": 2752} {"train_loss": -12.536262512207031, "global_step": 462343, "epoch": 2752} {"train_loss": -12.35763168334961, "global_step": 462344, "epoch": 2752} {"train_loss": -11.992152214050293, "global_step": 462345, "epoch": 2752} {"train_loss": -11.791089057922363, "global_step": 462346, "epoch": 2752} {"train_loss": -12.504947662353516, "global_step": 462347, "epoch": 2752} {"train_loss": -11.900140762329102, "global_step": 462348, "epoch": 2752} {"train_loss": -11.923500061035156, "global_step": 462349, "epoch": 2752} {"train_loss": -12.330549240112305, "global_step": 462350, "epoch": 2752} {"train_loss": -11.888336181640625, "global_step": 462351, "epoch": 2752} {"train_loss": -12.121942520141602, "global_step": 462352, "epoch": 2752} {"train_loss": -11.842432975769043, "global_step": 462353, "epoch": 2752} {"train_loss": -11.465958595275879, "global_step": 462354, "epoch": 2752} {"train_loss": -12.013161659240723, "global_step": 462355, "epoch": 2752} {"train_loss": -11.787864685058594, "global_step": 462356, "epoch": 2752} {"train_loss": -12.326557159423828, "global_step": 462357, "epoch": 2752} {"train_loss": -12.42647647857666, "global_step": 462358, "epoch": 2752} {"train_loss": -12.227876663208008, "global_step": 462359, "epoch": 2752} {"train_loss": -11.947778701782227, "global_step": 462360, "epoch": 2752} {"train_loss": -11.94222354888916, "global_step": 462361, "epoch": 2752} {"train_loss": -11.708864212036133, "global_step": 462362, "epoch": 2752} {"train_loss": -11.280376434326172, "global_step": 462363, "epoch": 2752} {"train_loss": -11.60052490234375, "global_step": 462364, "epoch": 2752} {"train_loss": -10.744078636169434, "global_step": 462365, "epoch": 2752} {"train_loss": -11.245552062988281, "global_step": 462366, "epoch": 2752} {"train_loss": -10.89760971069336, "global_step": 462367, "epoch": 2752} {"train_loss": -10.459403038024902, "global_step": 462368, "epoch": 2752} {"train_loss": -11.91994857788086, "global_step": 462369, "epoch": 2752} {"train_loss": -9.767196655273438, "global_step": 462370, "epoch": 2752} {"train_loss": -9.306211471557617, "global_step": 462371, "epoch": 2752} {"train_loss": -10.255348205566406, "global_step": 462372, "epoch": 2752} {"train_loss": -9.93954849243164, "global_step": 462373, "epoch": 2752} {"train_loss": -10.690519332885742, "global_step": 462374, "epoch": 2752} {"train_loss": -9.398721694946289, "global_step": 462375, "epoch": 2752} {"train_loss": -9.660419464111328, "global_step": 462376, "epoch": 2752} {"train_loss": -11.197210311889648, "global_step": 462377, "epoch": 2752} {"train_loss": -11.178474426269531, "global_step": 462378, "epoch": 2752} {"train_loss": -11.153708457946777, "global_step": 462379, "epoch": 2752} {"train_loss": -11.741537094116211, "global_step": 462380, "epoch": 2752} {"train_loss": -11.227224349975586, "global_step": 462381, "epoch": 2752} {"train_loss": -11.692306518554688, "global_step": 462382, "epoch": 2752} {"train_loss": -10.824075698852539, "global_step": 462383, "epoch": 2752} {"train_loss": -11.000433921813965, "global_step": 462384, "epoch": 2752} {"train_loss": -11.328834533691406, "global_step": 462385, "epoch": 2752} {"train_loss": -11.755173683166504, "global_step": 462386, "epoch": 2752} {"train_loss": -10.54963493347168, "global_step": 462387, "epoch": 2752} {"train_loss": -10.91792106628418, "global_step": 462388, "epoch": 2752} {"train_loss": -11.51887321472168, "global_step": 462389, "epoch": 2752} {"train_loss": -11.444022178649902, "global_step": 462390, "epoch": 2752} {"train_loss": -11.834094047546387, "global_step": 462391, "epoch": 2752} {"train_loss": -11.507991790771484, "global_step": 462392, "epoch": 2752} {"train_loss": -11.922398567199707, "global_step": 462393, "epoch": 2752} {"train_loss": -11.493799209594727, "global_step": 462394, "epoch": 2752} {"train_loss": -11.729591369628906, "global_step": 462395, "epoch": 2752} {"train_loss": -11.998926162719727, "global_step": 462396, "epoch": 2752} {"train_loss": -11.715278625488281, "global_step": 462397, "epoch": 2752} {"train_loss": -12.153648376464844, "global_step": 462398, "epoch": 2752} {"train_loss": -11.481210708618164, "global_step": 462399, "epoch": 2752} {"train_loss": -11.953996658325195, "global_step": 462400, "epoch": 2752} {"train_loss": -11.924529075622559, "global_step": 462401, "epoch": 2752} {"train_loss": -12.326705932617188, "global_step": 462402, "epoch": 2752} {"train_loss": -12.191561698913574, "global_step": 462403, "epoch": 2752} {"train_loss": -12.143649101257324, "global_step": 462404, "epoch": 2752} {"train_loss": -12.224361419677734, "global_step": 462405, "epoch": 2752} {"train_loss": -12.161863327026367, "global_step": 462406, "epoch": 2752} {"train_loss": -12.358808517456055, "global_step": 462407, "epoch": 2752} {"train_loss": -12.484926223754883, "global_step": 462408, "epoch": 2752} {"train_loss": -12.078363418579102, "global_step": 462409, "epoch": 2752} {"train_loss": -12.358802795410156, "global_step": 462410, "epoch": 2752} {"train_loss": -12.315969467163086, "global_step": 462411, "epoch": 2752} {"train_loss": -12.067541122436523, "global_step": 462412, "epoch": 2752} {"train_loss": -12.335542678833008, "global_step": 462413, "epoch": 2752} {"train_loss": -12.157678604125977, "global_step": 462414, "epoch": 2752} {"train_loss": -12.552828788757324, "global_step": 462415, "epoch": 2752} {"train_loss": -12.141475677490234, "global_step": 462416, "epoch": 2752} {"train_loss": -12.416321754455566, "global_step": 462417, "epoch": 2752} {"train_loss": -12.023042678833008, "global_step": 462418, "epoch": 2752} {"train_loss": -12.204839706420898, "global_step": 462419, "epoch": 2752} {"train_loss": -12.154956817626953, "global_step": 462420, "epoch": 2752} {"train_loss": -12.370699882507324, "global_step": 462421, "epoch": 2752} {"train_loss": -12.39350700378418, "global_step": 462422, "epoch": 2752} {"train_loss": -12.702352523803711, "global_step": 462423, "epoch": 2752} {"train_loss": -12.52552318572998, "global_step": 462424, "epoch": 2752} {"train_loss": -12.563472747802734, "global_step": 462425, "epoch": 2752} {"train_loss": -12.543079376220703, "global_step": 462426, "epoch": 2752} {"train_loss": -12.474720001220703, "global_step": 462427, "epoch": 2752} {"train_loss": -12.735041618347168, "global_step": 462428, "epoch": 2752} {"train_loss": -12.630865097045898, "global_step": 462429, "epoch": 2752} {"train_loss": -12.700665473937988, "global_step": 462430, "epoch": 2752} {"train_loss": -12.78509521484375, "global_step": 462431, "epoch": 2752} {"train_loss": -12.70374584197998, "global_step": 462432, "epoch": 2752} {"train_loss": -12.561178207397461, "global_step": 462433, "epoch": 2752} {"train_loss": -12.501863479614258, "global_step": 462434, "epoch": 2752} {"train_loss": -12.637504577636719, "global_step": 462435, "epoch": 2752} {"train_loss": -12.883892059326172, "global_step": 462436, "epoch": 2752} {"train_loss": -12.604537963867188, "global_step": 462437, "epoch": 2752} {"train_loss": -12.644824981689453, "global_step": 462438, "epoch": 2752} {"train_loss": -12.598217010498047, "global_step": 462439, "epoch": 2752} {"train_loss": -12.65778923034668, "global_step": 462440, "epoch": 2752} {"train_loss": -12.785064697265625, "global_step": 462441, "epoch": 2752} {"train_loss": -12.441047668457031, "global_step": 462442, "epoch": 2752} {"train_loss": -12.699872970581055, "global_step": 462443, "epoch": 2752} {"train_loss": -12.561212539672852, "global_step": 462444, "epoch": 2752} {"train_loss": -12.840116500854492, "global_step": 462445, "epoch": 2752} {"train_loss": -12.669495582580566, "global_step": 462446, "epoch": 2752} {"train_loss": -12.576807022094727, "global_step": 462447, "epoch": 2752} {"train_loss": -12.827167510986328, "global_step": 462448, "epoch": 2752} {"train_loss": -12.708976745605469, "global_step": 462449, "epoch": 2752} {"train_loss": -12.38895034790039, "global_step": 462450, "epoch": 2752} {"train_loss": -12.618765830993652, "global_step": 462451, "epoch": 2752} {"train_loss": -12.642614364624023, "global_step": 462452, "epoch": 2752} {"train_loss": -12.288280487060547, "global_step": 462453, "epoch": 2752} {"train_loss": -12.602045059204102, "global_step": 462454, "epoch": 2752} {"train_loss": -12.921624183654785, "global_step": 462455, "epoch": 2752} {"train_loss": -12.559313774108887, "global_step": 462456, "epoch": 2752} {"train_loss": -12.729580879211426, "global_step": 462457, "epoch": 2752} {"train_loss": -12.52241325378418, "global_step": 462458, "epoch": 2752} {"train_loss": -12.735240936279297, "global_step": 462459, "epoch": 2752} {"train_loss": -12.589886665344238, "global_step": 462460, "epoch": 2752} {"train_loss": -12.83319091796875, "global_step": 462461, "epoch": 2752} {"train_loss": -12.64658260345459, "global_step": 462462, "epoch": 2752} {"train_loss": -12.976053237915039, "global_step": 462463, "epoch": 2752} {"train_loss": -12.667550086975098, "global_step": 462464, "epoch": 2752} {"train_loss": -12.749523162841797, "global_step": 462465, "epoch": 2752} {"train_loss": -12.819007873535156, "global_step": 462466, "epoch": 2752} {"train_loss": -12.773604393005371, "global_step": 462467, "epoch": 2752} {"train_loss": -12.783912658691406, "global_step": 462468, "epoch": 2752} {"train_loss": -12.707462310791016, "global_step": 462469, "epoch": 2752} {"train_loss": -12.847322463989258, "global_step": 462470, "epoch": 2752} {"train_loss": -12.857690811157227, "global_step": 462471, "epoch": 2752} {"train_loss": -12.68502426147461, "global_step": 462472, "epoch": 2752} {"train_loss": -12.943107604980469, "global_step": 462473, "epoch": 2752} {"train_loss": -12.588125228881836, "global_step": 462474, "epoch": 2752} {"train_loss": -12.359220504760742, "global_step": 462475, "epoch": 2752} {"train_loss": -12.156108856201172, "global_step": 462476, "epoch": 2752} {"train_loss": -12.164813995361328, "global_step": 462477, "epoch": 2752} {"train_loss": -12.725689888000488, "global_step": 462478, "epoch": 2752} {"train_loss": -12.55341911315918, "global_step": 462479, "epoch": 2752} {"train_loss": -12.48379135131836, "global_step": 462480, "epoch": 2752} {"train_loss": -12.514471054077148, "global_step": 462481, "epoch": 2752} {"train_loss": -12.729256629943848, "global_step": 462482, "epoch": 2752} {"train_loss": -12.874629974365234, "global_step": 462483, "epoch": 2752} {"train_loss": -12.913991928100586, "global_step": 462484, "epoch": 2752} {"train_loss": -12.841785430908203, "global_step": 462485, "epoch": 2752} {"train_loss": -13.13839340209961, "global_step": 462486, "epoch": 2752} {"train_loss": -12.589632034301758, "global_step": 462487, "epoch": 2752} {"train_loss": -12.679254531860352, "global_step": 462488, "epoch": 2752} {"train_loss": -12.43307113647461, "global_step": 462489, "epoch": 2752} {"train_loss": -12.574308395385742, "global_step": 462490, "epoch": 2752} {"train_loss": -13.069589614868164, "global_step": 462491, "epoch": 2752} {"train_loss": -12.138294219970703, "global_step": 462492, "epoch": 2752} {"train_loss": -12.132997512817383, "global_step": 462493, "epoch": 2752} {"train_loss": -12.483487129211426, "global_step": 462494, "epoch": 2752} {"train_loss": -12.750223159790039, "global_step": 462495, "epoch": 2752} {"train_loss": -12.806046485900879, "global_step": 462496, "epoch": 2752} {"train_loss": -12.82383918762207, "global_step": 462497, "epoch": 2752} {"train_loss": -12.722633361816406, "global_step": 462498, "epoch": 2752} {"train_loss": -12.865496635437012, "global_step": 462499, "epoch": 2752} {"train_loss": -12.622864723205566, "global_step": 462500, "epoch": 2752} {"train_loss": -12.594049453735352, "global_step": 462501, "epoch": 2752} {"train_loss": -11.641082763671875, "global_step": 462502, "epoch": 2752} {"train_loss": -12.150803974696569, "global_step": 462503, "epoch": 2752, "val_loss": 311438.6875} {"train_loss": -11.012837409973145, "global_step": 462504, "epoch": 2753} {"train_loss": -12.859308242797852, "global_step": 462505, "epoch": 2753} {"train_loss": -11.081645965576172, "global_step": 462506, "epoch": 2753} {"train_loss": -9.85315227508545, "global_step": 462507, "epoch": 2753} {"train_loss": -11.823735237121582, "global_step": 462508, "epoch": 2753} {"train_loss": -11.373252868652344, "global_step": 462509, "epoch": 2753} {"train_loss": -9.641096115112305, "global_step": 462510, "epoch": 2753} {"train_loss": -9.032179832458496, "global_step": 462511, "epoch": 2753} {"train_loss": -8.9273099899292, "global_step": 462512, "epoch": 2753} {"train_loss": -8.247929573059082, "global_step": 462513, "epoch": 2753} {"train_loss": -9.732839584350586, "global_step": 462514, "epoch": 2753} {"train_loss": -9.558815002441406, "global_step": 462515, "epoch": 2753} {"train_loss": -9.880863189697266, "global_step": 462516, "epoch": 2753} {"train_loss": -8.619789123535156, "global_step": 462517, "epoch": 2753} {"train_loss": -9.020036697387695, "global_step": 462518, "epoch": 2753} {"train_loss": -9.634974479675293, "global_step": 462519, "epoch": 2753} {"train_loss": -9.337727546691895, "global_step": 462520, "epoch": 2753} {"train_loss": -9.533153533935547, "global_step": 462521, "epoch": 2753} {"train_loss": -10.260396003723145, "global_step": 462522, "epoch": 2753} {"train_loss": -10.422325134277344, "global_step": 462523, "epoch": 2753} {"train_loss": -10.197903633117676, "global_step": 462524, "epoch": 2753} {"train_loss": -10.368999481201172, "global_step": 462525, "epoch": 2753} {"train_loss": -10.534444808959961, "global_step": 462526, "epoch": 2753} {"train_loss": -10.588516235351562, "global_step": 462527, "epoch": 2753} {"train_loss": -10.897686004638672, "global_step": 462528, "epoch": 2753} {"train_loss": -10.968782424926758, "global_step": 462529, "epoch": 2753} {"train_loss": -10.580330848693848, "global_step": 462530, "epoch": 2753} {"train_loss": -10.897283554077148, "global_step": 462531, "epoch": 2753} {"train_loss": -10.960943222045898, "global_step": 462532, "epoch": 2753} {"train_loss": -10.401230812072754, "global_step": 462533, "epoch": 2753} {"train_loss": -10.513908386230469, "global_step": 462534, "epoch": 2753} {"train_loss": -11.483304977416992, "global_step": 462535, "epoch": 2753} {"train_loss": -10.028550148010254, "global_step": 462536, "epoch": 2753} {"train_loss": -11.648109436035156, "global_step": 462537, "epoch": 2753} {"train_loss": -10.804317474365234, "global_step": 462538, "epoch": 2753} {"train_loss": -11.436220169067383, "global_step": 462539, "epoch": 2753} {"train_loss": -10.724855422973633, "global_step": 462540, "epoch": 2753} {"train_loss": -12.106588363647461, "global_step": 462541, "epoch": 2753} {"train_loss": -11.32475757598877, "global_step": 462542, "epoch": 2753} {"train_loss": -12.136103630065918, "global_step": 462543, "epoch": 2753} {"train_loss": -11.464000701904297, "global_step": 462544, "epoch": 2753} {"train_loss": -12.089827537536621, "global_step": 462545, "epoch": 2753} {"train_loss": -11.834118843078613, "global_step": 462546, "epoch": 2753} {"train_loss": -11.978410720825195, "global_step": 462547, "epoch": 2753} {"train_loss": -11.467617988586426, "global_step": 462548, "epoch": 2753} {"train_loss": -12.064902305603027, "global_step": 462549, "epoch": 2753} {"train_loss": -11.909440994262695, "global_step": 462550, "epoch": 2753} {"train_loss": -11.703031539916992, "global_step": 462551, "epoch": 2753} {"train_loss": -12.48354721069336, "global_step": 462552, "epoch": 2753} {"train_loss": -12.180895805358887, "global_step": 462553, "epoch": 2753} {"train_loss": -12.084457397460938, "global_step": 462554, "epoch": 2753} {"train_loss": -12.028560638427734, "global_step": 462555, "epoch": 2753} {"train_loss": -12.060550689697266, "global_step": 462556, "epoch": 2753} {"train_loss": -11.908072471618652, "global_step": 462557, "epoch": 2753} {"train_loss": -12.097023010253906, "global_step": 462558, "epoch": 2753} {"train_loss": -12.281522750854492, "global_step": 462559, "epoch": 2753} {"train_loss": -12.147185325622559, "global_step": 462560, "epoch": 2753} {"train_loss": -12.320047378540039, "global_step": 462561, "epoch": 2753} {"train_loss": -12.133916854858398, "global_step": 462562, "epoch": 2753} {"train_loss": -12.094526290893555, "global_step": 462563, "epoch": 2753} {"train_loss": -12.42953872680664, "global_step": 462564, "epoch": 2753} {"train_loss": -12.023050308227539, "global_step": 462565, "epoch": 2753} {"train_loss": -12.320111274719238, "global_step": 462566, "epoch": 2753} {"train_loss": -12.288850784301758, "global_step": 462567, "epoch": 2753} {"train_loss": -12.516969680786133, "global_step": 462568, "epoch": 2753} {"train_loss": -12.397046089172363, "global_step": 462569, "epoch": 2753} {"train_loss": -12.408271789550781, "global_step": 462570, "epoch": 2753} {"train_loss": -12.303083419799805, "global_step": 462571, "epoch": 2753} {"train_loss": -12.145159721374512, "global_step": 462572, "epoch": 2753} {"train_loss": -11.91831111907959, "global_step": 462573, "epoch": 2753} {"train_loss": -12.40140151977539, "global_step": 462574, "epoch": 2753} {"train_loss": -12.1353759765625, "global_step": 462575, "epoch": 2753} {"train_loss": -12.488901138305664, "global_step": 462576, "epoch": 2753} {"train_loss": -12.333646774291992, "global_step": 462577, "epoch": 2753} {"train_loss": -12.483247756958008, "global_step": 462578, "epoch": 2753} {"train_loss": -12.546785354614258, "global_step": 462579, "epoch": 2753} {"train_loss": -12.50558853149414, "global_step": 462580, "epoch": 2753} {"train_loss": -12.642627716064453, "global_step": 462581, "epoch": 2753} {"train_loss": -12.771100997924805, "global_step": 462582, "epoch": 2753} {"train_loss": -12.604653358459473, "global_step": 462583, "epoch": 2753} {"train_loss": -12.576959609985352, "global_step": 462584, "epoch": 2753} {"train_loss": -12.55575942993164, "global_step": 462585, "epoch": 2753} {"train_loss": -12.67421817779541, "global_step": 462586, "epoch": 2753} {"train_loss": -12.67827320098877, "global_step": 462587, "epoch": 2753} {"train_loss": -12.5139741897583, "global_step": 462588, "epoch": 2753} {"train_loss": -12.778006553649902, "global_step": 462589, "epoch": 2753} {"train_loss": -12.629781723022461, "global_step": 462590, "epoch": 2753} {"train_loss": -12.848855018615723, "global_step": 462591, "epoch": 2753} {"train_loss": -12.648787498474121, "global_step": 462592, "epoch": 2753} {"train_loss": -12.676793098449707, "global_step": 462593, "epoch": 2753} {"train_loss": -12.532240867614746, "global_step": 462594, "epoch": 2753} {"train_loss": -12.672395706176758, "global_step": 462595, "epoch": 2753} {"train_loss": -12.774593353271484, "global_step": 462596, "epoch": 2753} {"train_loss": -12.668388366699219, "global_step": 462597, "epoch": 2753} {"train_loss": -12.652883529663086, "global_step": 462598, "epoch": 2753} {"train_loss": -12.679939270019531, "global_step": 462599, "epoch": 2753} {"train_loss": -12.718265533447266, "global_step": 462600, "epoch": 2753} {"train_loss": -12.52381420135498, "global_step": 462601, "epoch": 2753} {"train_loss": -12.692161560058594, "global_step": 462602, "epoch": 2753} {"train_loss": -12.688323974609375, "global_step": 462603, "epoch": 2753} {"train_loss": -12.906673431396484, "global_step": 462604, "epoch": 2753} {"train_loss": -12.39458179473877, "global_step": 462605, "epoch": 2753} {"train_loss": -12.675838470458984, "global_step": 462606, "epoch": 2753} {"train_loss": -12.683528900146484, "global_step": 462607, "epoch": 2753} {"train_loss": -12.80754280090332, "global_step": 462608, "epoch": 2753} {"train_loss": -12.789525985717773, "global_step": 462609, "epoch": 2753} {"train_loss": -12.557662963867188, "global_step": 462610, "epoch": 2753} {"train_loss": -13.051961898803711, "global_step": 462611, "epoch": 2753} {"train_loss": -12.499744415283203, "global_step": 462612, "epoch": 2753} {"train_loss": -12.481538772583008, "global_step": 462613, "epoch": 2753} {"train_loss": -12.688785552978516, "global_step": 462614, "epoch": 2753} {"train_loss": -12.742345809936523, "global_step": 462615, "epoch": 2753} {"train_loss": -12.768339157104492, "global_step": 462616, "epoch": 2753} {"train_loss": -12.849092483520508, "global_step": 462617, "epoch": 2753} {"train_loss": -12.749682426452637, "global_step": 462618, "epoch": 2753} {"train_loss": -12.613601684570312, "global_step": 462619, "epoch": 2753} {"train_loss": -12.865782737731934, "global_step": 462620, "epoch": 2753} {"train_loss": -12.91567325592041, "global_step": 462621, "epoch": 2753} {"train_loss": -12.595513343811035, "global_step": 462622, "epoch": 2753} {"train_loss": -12.468361854553223, "global_step": 462623, "epoch": 2753} {"train_loss": -12.779480934143066, "global_step": 462624, "epoch": 2753} {"train_loss": -12.374555587768555, "global_step": 462625, "epoch": 2753} {"train_loss": -11.663005828857422, "global_step": 462626, "epoch": 2753} {"train_loss": -12.630155563354492, "global_step": 462627, "epoch": 2753} {"train_loss": -12.248588562011719, "global_step": 462628, "epoch": 2753} {"train_loss": -11.993242263793945, "global_step": 462629, "epoch": 2753} {"train_loss": -11.364877700805664, "global_step": 462630, "epoch": 2753} {"train_loss": -11.93274974822998, "global_step": 462631, "epoch": 2753} {"train_loss": -11.143415451049805, "global_step": 462632, "epoch": 2753} {"train_loss": -11.410826683044434, "global_step": 462633, "epoch": 2753} {"train_loss": -10.322577476501465, "global_step": 462634, "epoch": 2753} {"train_loss": -10.723679542541504, "global_step": 462635, "epoch": 2753} {"train_loss": -11.54296875, "global_step": 462636, "epoch": 2753} {"train_loss": -10.988130569458008, "global_step": 462637, "epoch": 2753} {"train_loss": -11.325809478759766, "global_step": 462638, "epoch": 2753} {"train_loss": -11.168333053588867, "global_step": 462639, "epoch": 2753} {"train_loss": -11.410016059875488, "global_step": 462640, "epoch": 2753} {"train_loss": -12.071502685546875, "global_step": 462641, "epoch": 2753} {"train_loss": -10.796394348144531, "global_step": 462642, "epoch": 2753} {"train_loss": -11.87807846069336, "global_step": 462643, "epoch": 2753} {"train_loss": -11.462605476379395, "global_step": 462644, "epoch": 2753} {"train_loss": -11.237176895141602, "global_step": 462645, "epoch": 2753} {"train_loss": -12.056300163269043, "global_step": 462646, "epoch": 2753} {"train_loss": -11.921520233154297, "global_step": 462647, "epoch": 2753} {"train_loss": -11.622049331665039, "global_step": 462648, "epoch": 2753} {"train_loss": -11.080259323120117, "global_step": 462649, "epoch": 2753} {"train_loss": -11.545684814453125, "global_step": 462650, "epoch": 2753} {"train_loss": -11.663457870483398, "global_step": 462651, "epoch": 2753} {"train_loss": -11.317486763000488, "global_step": 462652, "epoch": 2753} {"train_loss": -11.642840385437012, "global_step": 462653, "epoch": 2753} {"train_loss": -11.404914855957031, "global_step": 462654, "epoch": 2753} {"train_loss": -11.555387496948242, "global_step": 462655, "epoch": 2753} {"train_loss": -11.762012481689453, "global_step": 462656, "epoch": 2753} {"train_loss": -11.350652694702148, "global_step": 462657, "epoch": 2753} {"train_loss": -12.518655776977539, "global_step": 462658, "epoch": 2753} {"train_loss": -11.093645095825195, "global_step": 462659, "epoch": 2753} {"train_loss": -11.76774787902832, "global_step": 462660, "epoch": 2753} {"train_loss": -11.585176467895508, "global_step": 462661, "epoch": 2753} {"train_loss": -11.050307273864746, "global_step": 462662, "epoch": 2753} {"train_loss": -11.97057819366455, "global_step": 462663, "epoch": 2753} {"train_loss": -11.46286678314209, "global_step": 462664, "epoch": 2753} {"train_loss": -12.282890319824219, "global_step": 462665, "epoch": 2753} {"train_loss": -11.827280044555664, "global_step": 462666, "epoch": 2753} {"train_loss": -11.716304779052734, "global_step": 462667, "epoch": 2753} {"train_loss": -12.390764236450195, "global_step": 462668, "epoch": 2753} {"train_loss": -12.143671035766602, "global_step": 462669, "epoch": 2753} {"train_loss": -12.515356063842773, "global_step": 462670, "epoch": 2753} {"train_loss": -11.748560383206321, "global_step": 462671, "epoch": 2753, "val_loss": 312023.1875} {"train_loss": -11.810901641845703, "global_step": 462672, "epoch": 2754} {"train_loss": -11.914627075195312, "global_step": 462673, "epoch": 2754} {"train_loss": -12.003320693969727, "global_step": 462674, "epoch": 2754} {"train_loss": -11.96021842956543, "global_step": 462675, "epoch": 2754} {"train_loss": -12.062644004821777, "global_step": 462676, "epoch": 2754} {"train_loss": -12.345494270324707, "global_step": 462677, "epoch": 2754} {"train_loss": -12.31281566619873, "global_step": 462678, "epoch": 2754} {"train_loss": -12.414579391479492, "global_step": 462679, "epoch": 2754} {"train_loss": -12.080944061279297, "global_step": 462680, "epoch": 2754} {"train_loss": -12.49652099609375, "global_step": 462681, "epoch": 2754} {"train_loss": -12.419042587280273, "global_step": 462682, "epoch": 2754} {"train_loss": -12.35224437713623, "global_step": 462683, "epoch": 2754} {"train_loss": -12.362874984741211, "global_step": 462684, "epoch": 2754} {"train_loss": -12.109491348266602, "global_step": 462685, "epoch": 2754} {"train_loss": -12.279748916625977, "global_step": 462686, "epoch": 2754} {"train_loss": -12.244832992553711, "global_step": 462687, "epoch": 2754} {"train_loss": -12.156126976013184, "global_step": 462688, "epoch": 2754} {"train_loss": -12.233846664428711, "global_step": 462689, "epoch": 2754} {"train_loss": -12.332868576049805, "global_step": 462690, "epoch": 2754} {"train_loss": -12.32231616973877, "global_step": 462691, "epoch": 2754} {"train_loss": -12.40046501159668, "global_step": 462692, "epoch": 2754} {"train_loss": -12.628211975097656, "global_step": 462693, "epoch": 2754} {"train_loss": -12.526063919067383, "global_step": 462694, "epoch": 2754} {"train_loss": -12.501808166503906, "global_step": 462695, "epoch": 2754} {"train_loss": -12.426238059997559, "global_step": 462696, "epoch": 2754} {"train_loss": -12.385927200317383, "global_step": 462697, "epoch": 2754} {"train_loss": -12.490681648254395, "global_step": 462698, "epoch": 2754} {"train_loss": -12.448144912719727, "global_step": 462699, "epoch": 2754} {"train_loss": -12.424331665039062, "global_step": 462700, "epoch": 2754} {"train_loss": -12.358465194702148, "global_step": 462701, "epoch": 2754} {"train_loss": -12.619836807250977, "global_step": 462702, "epoch": 2754} {"train_loss": -12.528785705566406, "global_step": 462703, "epoch": 2754} {"train_loss": -12.506214141845703, "global_step": 462704, "epoch": 2754} {"train_loss": -12.563541412353516, "global_step": 462705, "epoch": 2754} {"train_loss": -11.998700141906738, "global_step": 462706, "epoch": 2754} {"train_loss": -12.739303588867188, "global_step": 462707, "epoch": 2754} {"train_loss": -12.564697265625, "global_step": 462708, "epoch": 2754} {"train_loss": -12.541179656982422, "global_step": 462709, "epoch": 2754} {"train_loss": -12.558815002441406, "global_step": 462710, "epoch": 2754} {"train_loss": -12.530338287353516, "global_step": 462711, "epoch": 2754} {"train_loss": -12.658743858337402, "global_step": 462712, "epoch": 2754} {"train_loss": -12.464483261108398, "global_step": 462713, "epoch": 2754} {"train_loss": -12.38752555847168, "global_step": 462714, "epoch": 2754} {"train_loss": -12.830276489257812, "global_step": 462715, "epoch": 2754} {"train_loss": -12.643709182739258, "global_step": 462716, "epoch": 2754} {"train_loss": -12.755528450012207, "global_step": 462717, "epoch": 2754} {"train_loss": -12.636833190917969, "global_step": 462718, "epoch": 2754} {"train_loss": -12.6023530960083, "global_step": 462719, "epoch": 2754} {"train_loss": -12.718628883361816, "global_step": 462720, "epoch": 2754} {"train_loss": -12.806890487670898, "global_step": 462721, "epoch": 2754} {"train_loss": -12.752054214477539, "global_step": 462722, "epoch": 2754} {"train_loss": -12.87662410736084, "global_step": 462723, "epoch": 2754} {"train_loss": -12.575003623962402, "global_step": 462724, "epoch": 2754} {"train_loss": -12.630494117736816, "global_step": 462725, "epoch": 2754} {"train_loss": -12.524073600769043, "global_step": 462726, "epoch": 2754} {"train_loss": -12.625971794128418, "global_step": 462727, "epoch": 2754} {"train_loss": -12.855062484741211, "global_step": 462728, "epoch": 2754} {"train_loss": -12.720405578613281, "global_step": 462729, "epoch": 2754} {"train_loss": -12.724346160888672, "global_step": 462730, "epoch": 2754} {"train_loss": -12.57144546508789, "global_step": 462731, "epoch": 2754} {"train_loss": -12.684128761291504, "global_step": 462732, "epoch": 2754} {"train_loss": -12.50481128692627, "global_step": 462733, "epoch": 2754} {"train_loss": -12.685443878173828, "global_step": 462734, "epoch": 2754} {"train_loss": -12.495870590209961, "global_step": 462735, "epoch": 2754} {"train_loss": -12.841768264770508, "global_step": 462736, "epoch": 2754} {"train_loss": -12.632039070129395, "global_step": 462737, "epoch": 2754} {"train_loss": -12.255678176879883, "global_step": 462738, "epoch": 2754} {"train_loss": -12.873064041137695, "global_step": 462739, "epoch": 2754} {"train_loss": -12.437232971191406, "global_step": 462740, "epoch": 2754} {"train_loss": -12.496284484863281, "global_step": 462741, "epoch": 2754} {"train_loss": -12.432531356811523, "global_step": 462742, "epoch": 2754} {"train_loss": -12.50506591796875, "global_step": 462743, "epoch": 2754} {"train_loss": -12.252908706665039, "global_step": 462744, "epoch": 2754} {"train_loss": -12.457481384277344, "global_step": 462745, "epoch": 2754} {"train_loss": -12.17172622680664, "global_step": 462746, "epoch": 2754} {"train_loss": -12.212100982666016, "global_step": 462747, "epoch": 2754} {"train_loss": -11.720998764038086, "global_step": 462748, "epoch": 2754} {"train_loss": -11.999423027038574, "global_step": 462749, "epoch": 2754} {"train_loss": -12.387076377868652, "global_step": 462750, "epoch": 2754} {"train_loss": -11.953035354614258, "global_step": 462751, "epoch": 2754} {"train_loss": -11.665532112121582, "global_step": 462752, "epoch": 2754} {"train_loss": -12.514392852783203, "global_step": 462753, "epoch": 2754} {"train_loss": -12.53731918334961, "global_step": 462754, "epoch": 2754} {"train_loss": -12.537904739379883, "global_step": 462755, "epoch": 2754} {"train_loss": -12.772491455078125, "global_step": 462756, "epoch": 2754} {"train_loss": -12.677291870117188, "global_step": 462757, "epoch": 2754} {"train_loss": -12.408618927001953, "global_step": 462758, "epoch": 2754} {"train_loss": -12.569806098937988, "global_step": 462759, "epoch": 2754} {"train_loss": -12.352616310119629, "global_step": 462760, "epoch": 2754} {"train_loss": -12.35785961151123, "global_step": 462761, "epoch": 2754} {"train_loss": -12.438553810119629, "global_step": 462762, "epoch": 2754} {"train_loss": -12.530681610107422, "global_step": 462763, "epoch": 2754} {"train_loss": -12.57957935333252, "global_step": 462764, "epoch": 2754} {"train_loss": -12.032238960266113, "global_step": 462765, "epoch": 2754} {"train_loss": -10.798206329345703, "global_step": 462766, "epoch": 2754} {"train_loss": -12.36600112915039, "global_step": 462767, "epoch": 2754} {"train_loss": -12.278186798095703, "global_step": 462768, "epoch": 2754} {"train_loss": -10.893454551696777, "global_step": 462769, "epoch": 2754} {"train_loss": -10.766475677490234, "global_step": 462770, "epoch": 2754} {"train_loss": -11.856682777404785, "global_step": 462771, "epoch": 2754} {"train_loss": -11.536968231201172, "global_step": 462772, "epoch": 2754} {"train_loss": -11.121578216552734, "global_step": 462773, "epoch": 2754} {"train_loss": -12.166431427001953, "global_step": 462774, "epoch": 2754} {"train_loss": -10.509151458740234, "global_step": 462775, "epoch": 2754} {"train_loss": -12.014287948608398, "global_step": 462776, "epoch": 2754} {"train_loss": -11.898173332214355, "global_step": 462777, "epoch": 2754} {"train_loss": -11.20602035522461, "global_step": 462778, "epoch": 2754} {"train_loss": -12.337568283081055, "global_step": 462779, "epoch": 2754} {"train_loss": -11.810552597045898, "global_step": 462780, "epoch": 2754} {"train_loss": -10.910209655761719, "global_step": 462781, "epoch": 2754} {"train_loss": -12.53718090057373, "global_step": 462782, "epoch": 2754} {"train_loss": -11.068782806396484, "global_step": 462783, "epoch": 2754} {"train_loss": -11.959826469421387, "global_step": 462784, "epoch": 2754} {"train_loss": -12.034637451171875, "global_step": 462785, "epoch": 2754} {"train_loss": -10.538557052612305, "global_step": 462786, "epoch": 2754} {"train_loss": -12.265705108642578, "global_step": 462787, "epoch": 2754} {"train_loss": -11.814605712890625, "global_step": 462788, "epoch": 2754} {"train_loss": -11.29649543762207, "global_step": 462789, "epoch": 2754} {"train_loss": -12.103354454040527, "global_step": 462790, "epoch": 2754} {"train_loss": -11.5100679397583, "global_step": 462791, "epoch": 2754} {"train_loss": -12.127225875854492, "global_step": 462792, "epoch": 2754} {"train_loss": -12.243616104125977, "global_step": 462793, "epoch": 2754} {"train_loss": -12.173310279846191, "global_step": 462794, "epoch": 2754} {"train_loss": -12.685303688049316, "global_step": 462795, "epoch": 2754} {"train_loss": -12.109066009521484, "global_step": 462796, "epoch": 2754} {"train_loss": -12.371583938598633, "global_step": 462797, "epoch": 2754} {"train_loss": -12.103460311889648, "global_step": 462798, "epoch": 2754} {"train_loss": -11.54210090637207, "global_step": 462799, "epoch": 2754} {"train_loss": -12.525725364685059, "global_step": 462800, "epoch": 2754} {"train_loss": -11.652647018432617, "global_step": 462801, "epoch": 2754} {"train_loss": -12.446870803833008, "global_step": 462802, "epoch": 2754} {"train_loss": -12.078695297241211, "global_step": 462803, "epoch": 2754} {"train_loss": -11.924615859985352, "global_step": 462804, "epoch": 2754} {"train_loss": -12.35372257232666, "global_step": 462805, "epoch": 2754} {"train_loss": -12.255136489868164, "global_step": 462806, "epoch": 2754} {"train_loss": -12.35003662109375, "global_step": 462807, "epoch": 2754} {"train_loss": -12.259407043457031, "global_step": 462808, "epoch": 2754} {"train_loss": -12.470209121704102, "global_step": 462809, "epoch": 2754} {"train_loss": -12.590895652770996, "global_step": 462810, "epoch": 2754} {"train_loss": -11.847561836242676, "global_step": 462811, "epoch": 2754} {"train_loss": -12.537487030029297, "global_step": 462812, "epoch": 2754} {"train_loss": -11.303732872009277, "global_step": 462813, "epoch": 2754} {"train_loss": -12.585216522216797, "global_step": 462814, "epoch": 2754} {"train_loss": -11.43781852722168, "global_step": 462815, "epoch": 2754} {"train_loss": -11.20356559753418, "global_step": 462816, "epoch": 2754} {"train_loss": -12.267693519592285, "global_step": 462817, "epoch": 2754} {"train_loss": -11.093019485473633, "global_step": 462818, "epoch": 2754} {"train_loss": -12.208539962768555, "global_step": 462819, "epoch": 2754} {"train_loss": -12.421674728393555, "global_step": 462820, "epoch": 2754} {"train_loss": -11.854493141174316, "global_step": 462821, "epoch": 2754} {"train_loss": -11.991742134094238, "global_step": 462822, "epoch": 2754} {"train_loss": -11.402669906616211, "global_step": 462823, "epoch": 2754} {"train_loss": -12.328625679016113, "global_step": 462824, "epoch": 2754} {"train_loss": -11.990880966186523, "global_step": 462825, "epoch": 2754} {"train_loss": -11.453595161437988, "global_step": 462826, "epoch": 2754} {"train_loss": -11.876911163330078, "global_step": 462827, "epoch": 2754} {"train_loss": -11.722657203674316, "global_step": 462828, "epoch": 2754} {"train_loss": -11.648573875427246, "global_step": 462829, "epoch": 2754} {"train_loss": -12.155364036560059, "global_step": 462830, "epoch": 2754} {"train_loss": -12.141046524047852, "global_step": 462831, "epoch": 2754} {"train_loss": -11.930285453796387, "global_step": 462832, "epoch": 2754} {"train_loss": -12.1744384765625, "global_step": 462833, "epoch": 2754} {"train_loss": -11.748636245727539, "global_step": 462834, "epoch": 2754} {"train_loss": -12.067253112792969, "global_step": 462835, "epoch": 2754} {"train_loss": -11.964922904968262, "global_step": 462836, "epoch": 2754} {"train_loss": -12.222219467163086, "global_step": 462837, "epoch": 2754} {"train_loss": -11.873669624328613, "global_step": 462838, "epoch": 2754} {"train_loss": -12.197306536492848, "global_step": 462839, "epoch": 2754, "val_loss": 316198.0} {"train_loss": -12.309497833251953, "global_step": 462840, "epoch": 2755} {"train_loss": -12.489994049072266, "global_step": 462841, "epoch": 2755} {"train_loss": -12.409152030944824, "global_step": 462842, "epoch": 2755} {"train_loss": -12.271400451660156, "global_step": 462843, "epoch": 2755} {"train_loss": -12.683564186096191, "global_step": 462844, "epoch": 2755} {"train_loss": -11.998954772949219, "global_step": 462845, "epoch": 2755} {"train_loss": -11.841529846191406, "global_step": 462846, "epoch": 2755} {"train_loss": -11.46905517578125, "global_step": 462847, "epoch": 2755} {"train_loss": -12.196855545043945, "global_step": 462848, "epoch": 2755} {"train_loss": -11.684287071228027, "global_step": 462849, "epoch": 2755} {"train_loss": -11.341358184814453, "global_step": 462850, "epoch": 2755} {"train_loss": -12.417579650878906, "global_step": 462851, "epoch": 2755} {"train_loss": -12.248163223266602, "global_step": 462852, "epoch": 2755} {"train_loss": -12.213692665100098, "global_step": 462853, "epoch": 2755} {"train_loss": -12.568496704101562, "global_step": 462854, "epoch": 2755} {"train_loss": -11.681278228759766, "global_step": 462855, "epoch": 2755} {"train_loss": -12.576461791992188, "global_step": 462856, "epoch": 2755} {"train_loss": -12.307828903198242, "global_step": 462857, "epoch": 2755} {"train_loss": -12.041991233825684, "global_step": 462858, "epoch": 2755} {"train_loss": -12.680927276611328, "global_step": 462859, "epoch": 2755} {"train_loss": -12.099629402160645, "global_step": 462860, "epoch": 2755} {"train_loss": -12.672310829162598, "global_step": 462861, "epoch": 2755} {"train_loss": -12.534751892089844, "global_step": 462862, "epoch": 2755} {"train_loss": -12.549959182739258, "global_step": 462863, "epoch": 2755} {"train_loss": -12.615524291992188, "global_step": 462864, "epoch": 2755} {"train_loss": -12.369054794311523, "global_step": 462865, "epoch": 2755} {"train_loss": -12.49826717376709, "global_step": 462866, "epoch": 2755} {"train_loss": -12.327303886413574, "global_step": 462867, "epoch": 2755} {"train_loss": -12.474376678466797, "global_step": 462868, "epoch": 2755} {"train_loss": -12.542154312133789, "global_step": 462869, "epoch": 2755} {"train_loss": -12.53071117401123, "global_step": 462870, "epoch": 2755} {"train_loss": -12.144737243652344, "global_step": 462871, "epoch": 2755} {"train_loss": -11.971579551696777, "global_step": 462872, "epoch": 2755} {"train_loss": -12.638232231140137, "global_step": 462873, "epoch": 2755} {"train_loss": -12.133258819580078, "global_step": 462874, "epoch": 2755} {"train_loss": -11.85206127166748, "global_step": 462875, "epoch": 2755} {"train_loss": -12.461799621582031, "global_step": 462876, "epoch": 2755} {"train_loss": -10.564123153686523, "global_step": 462877, "epoch": 2755} {"train_loss": -12.784416198730469, "global_step": 462878, "epoch": 2755} {"train_loss": -11.204081535339355, "global_step": 462879, "epoch": 2755} {"train_loss": -11.288559913635254, "global_step": 462880, "epoch": 2755} {"train_loss": -10.852128982543945, "global_step": 462881, "epoch": 2755} {"train_loss": -11.307690620422363, "global_step": 462882, "epoch": 2755} {"train_loss": -10.577930450439453, "global_step": 462883, "epoch": 2755} {"train_loss": -12.172463417053223, "global_step": 462884, "epoch": 2755} {"train_loss": -10.70143985748291, "global_step": 462885, "epoch": 2755} {"train_loss": -11.946925163269043, "global_step": 462886, "epoch": 2755} {"train_loss": -11.677896499633789, "global_step": 462887, "epoch": 2755} {"train_loss": -11.801942825317383, "global_step": 462888, "epoch": 2755} {"train_loss": -12.211793899536133, "global_step": 462889, "epoch": 2755} {"train_loss": -10.962289810180664, "global_step": 462890, "epoch": 2755} {"train_loss": -12.266942977905273, "global_step": 462891, "epoch": 2755} {"train_loss": -11.621999740600586, "global_step": 462892, "epoch": 2755} {"train_loss": -12.021507263183594, "global_step": 462893, "epoch": 2755} {"train_loss": -11.471514701843262, "global_step": 462894, "epoch": 2755} {"train_loss": -11.918960571289062, "global_step": 462895, "epoch": 2755} {"train_loss": -11.943355560302734, "global_step": 462896, "epoch": 2755} {"train_loss": -11.732667922973633, "global_step": 462897, "epoch": 2755} {"train_loss": -12.402229309082031, "global_step": 462898, "epoch": 2755} {"train_loss": -12.106757164001465, "global_step": 462899, "epoch": 2755} {"train_loss": -11.892193794250488, "global_step": 462900, "epoch": 2755} {"train_loss": -12.441263198852539, "global_step": 462901, "epoch": 2755} {"train_loss": -11.37913703918457, "global_step": 462902, "epoch": 2755} {"train_loss": -12.313125610351562, "global_step": 462903, "epoch": 2755} {"train_loss": -11.728099822998047, "global_step": 462904, "epoch": 2755} {"train_loss": -12.064306259155273, "global_step": 462905, "epoch": 2755} {"train_loss": -11.892251968383789, "global_step": 462906, "epoch": 2755} {"train_loss": -11.404603004455566, "global_step": 462907, "epoch": 2755} {"train_loss": -11.196073532104492, "global_step": 462908, "epoch": 2755} {"train_loss": -11.81687068939209, "global_step": 462909, "epoch": 2755} {"train_loss": -11.45030689239502, "global_step": 462910, "epoch": 2755} {"train_loss": -10.430115699768066, "global_step": 462911, "epoch": 2755} {"train_loss": -11.382294654846191, "global_step": 462912, "epoch": 2755} {"train_loss": -11.773524284362793, "global_step": 462913, "epoch": 2755} {"train_loss": -11.20283317565918, "global_step": 462914, "epoch": 2755} {"train_loss": -11.471226692199707, "global_step": 462915, "epoch": 2755} {"train_loss": -12.038047790527344, "global_step": 462916, "epoch": 2755} {"train_loss": -11.771392822265625, "global_step": 462917, "epoch": 2755} {"train_loss": -12.14200210571289, "global_step": 462918, "epoch": 2755} {"train_loss": -11.5267915725708, "global_step": 462919, "epoch": 2755} {"train_loss": -12.098791122436523, "global_step": 462920, "epoch": 2755} {"train_loss": -12.13344955444336, "global_step": 462921, "epoch": 2755} {"train_loss": -12.032119750976562, "global_step": 462922, "epoch": 2755} {"train_loss": -12.417693138122559, "global_step": 462923, "epoch": 2755} {"train_loss": -11.987282752990723, "global_step": 462924, "epoch": 2755} {"train_loss": -12.30922794342041, "global_step": 462925, "epoch": 2755} {"train_loss": -11.419365882873535, "global_step": 462926, "epoch": 2755} {"train_loss": -11.828621864318848, "global_step": 462927, "epoch": 2755} {"train_loss": -11.230547904968262, "global_step": 462928, "epoch": 2755} {"train_loss": -11.926058769226074, "global_step": 462929, "epoch": 2755} {"train_loss": -11.684295654296875, "global_step": 462930, "epoch": 2755} {"train_loss": -12.173816680908203, "global_step": 462931, "epoch": 2755} {"train_loss": -11.170648574829102, "global_step": 462932, "epoch": 2755} {"train_loss": -12.51585578918457, "global_step": 462933, "epoch": 2755} {"train_loss": -12.044174194335938, "global_step": 462934, "epoch": 2755} {"train_loss": -12.270759582519531, "global_step": 462935, "epoch": 2755} {"train_loss": -12.419904708862305, "global_step": 462936, "epoch": 2755} {"train_loss": -12.17001724243164, "global_step": 462937, "epoch": 2755} {"train_loss": -12.22586727142334, "global_step": 462938, "epoch": 2755} {"train_loss": -12.415939331054688, "global_step": 462939, "epoch": 2755} {"train_loss": -12.315106391906738, "global_step": 462940, "epoch": 2755} {"train_loss": -12.665143966674805, "global_step": 462941, "epoch": 2755} {"train_loss": -12.537515640258789, "global_step": 462942, "epoch": 2755} {"train_loss": -12.633403778076172, "global_step": 462943, "epoch": 2755} {"train_loss": -12.5982084274292, "global_step": 462944, "epoch": 2755} {"train_loss": -12.544197082519531, "global_step": 462945, "epoch": 2755} {"train_loss": -12.577829360961914, "global_step": 462946, "epoch": 2755} {"train_loss": -12.765287399291992, "global_step": 462947, "epoch": 2755} {"train_loss": -12.532615661621094, "global_step": 462948, "epoch": 2755} {"train_loss": -12.754316329956055, "global_step": 462949, "epoch": 2755} {"train_loss": -12.645397186279297, "global_step": 462950, "epoch": 2755} {"train_loss": -12.743820190429688, "global_step": 462951, "epoch": 2755} {"train_loss": -12.614103317260742, "global_step": 462952, "epoch": 2755} {"train_loss": -12.911848068237305, "global_step": 462953, "epoch": 2755} {"train_loss": -12.749834060668945, "global_step": 462954, "epoch": 2755} {"train_loss": -12.697233200073242, "global_step": 462955, "epoch": 2755} {"train_loss": -12.696993827819824, "global_step": 462956, "epoch": 2755} {"train_loss": -12.703320503234863, "global_step": 462957, "epoch": 2755} {"train_loss": -12.74826431274414, "global_step": 462958, "epoch": 2755} {"train_loss": -12.66557502746582, "global_step": 462959, "epoch": 2755} {"train_loss": -12.890863418579102, "global_step": 462960, "epoch": 2755} {"train_loss": -12.680137634277344, "global_step": 462961, "epoch": 2755} {"train_loss": -12.70928955078125, "global_step": 462962, "epoch": 2755} {"train_loss": -12.72520923614502, "global_step": 462963, "epoch": 2755} {"train_loss": -12.713062286376953, "global_step": 462964, "epoch": 2755} {"train_loss": -12.848223686218262, "global_step": 462965, "epoch": 2755} {"train_loss": -12.778848648071289, "global_step": 462966, "epoch": 2755} {"train_loss": -12.872734069824219, "global_step": 462967, "epoch": 2755} {"train_loss": -12.789238929748535, "global_step": 462968, "epoch": 2755} {"train_loss": -12.829370498657227, "global_step": 462969, "epoch": 2755} {"train_loss": -12.822282791137695, "global_step": 462970, "epoch": 2755} {"train_loss": -12.778247833251953, "global_step": 462971, "epoch": 2755} {"train_loss": -12.596813201904297, "global_step": 462972, "epoch": 2755} {"train_loss": -12.958078384399414, "global_step": 462973, "epoch": 2755} {"train_loss": -12.584823608398438, "global_step": 462974, "epoch": 2755} {"train_loss": -12.847745895385742, "global_step": 462975, "epoch": 2755} {"train_loss": -12.913370132446289, "global_step": 462976, "epoch": 2755} {"train_loss": -12.614648818969727, "global_step": 462977, "epoch": 2755} {"train_loss": -12.834575653076172, "global_step": 462978, "epoch": 2755} {"train_loss": -12.633722305297852, "global_step": 462979, "epoch": 2755} {"train_loss": -13.000792503356934, "global_step": 462980, "epoch": 2755} {"train_loss": -12.806224822998047, "global_step": 462981, "epoch": 2755} {"train_loss": -12.595170974731445, "global_step": 462982, "epoch": 2755} {"train_loss": -12.884678840637207, "global_step": 462983, "epoch": 2755} {"train_loss": -13.017742156982422, "global_step": 462984, "epoch": 2755} {"train_loss": -12.820907592773438, "global_step": 462985, "epoch": 2755} {"train_loss": -12.833490371704102, "global_step": 462986, "epoch": 2755} {"train_loss": -12.711393356323242, "global_step": 462987, "epoch": 2755} {"train_loss": -12.82735824584961, "global_step": 462988, "epoch": 2755} {"train_loss": -12.966527938842773, "global_step": 462989, "epoch": 2755} {"train_loss": -12.721617698669434, "global_step": 462990, "epoch": 2755} {"train_loss": -12.678318977355957, "global_step": 462991, "epoch": 2755} {"train_loss": -12.907346725463867, "global_step": 462992, "epoch": 2755} {"train_loss": -12.613759994506836, "global_step": 462993, "epoch": 2755} {"train_loss": -12.534462928771973, "global_step": 462994, "epoch": 2755} {"train_loss": -12.325772285461426, "global_step": 462995, "epoch": 2755} {"train_loss": -12.894521713256836, "global_step": 462996, "epoch": 2755} {"train_loss": -11.75312614440918, "global_step": 462997, "epoch": 2755} {"train_loss": -12.876803398132324, "global_step": 462998, "epoch": 2755} {"train_loss": -11.784281730651855, "global_step": 462999, "epoch": 2755} {"train_loss": -12.063511848449707, "global_step": 463000, "epoch": 2755} {"train_loss": -12.462373733520508, "global_step": 463001, "epoch": 2755} {"train_loss": -12.760372161865234, "global_step": 463002, "epoch": 2755} {"train_loss": -12.694154739379883, "global_step": 463003, "epoch": 2755} {"train_loss": -12.520995140075684, "global_step": 463004, "epoch": 2755} {"train_loss": -12.472797393798828, "global_step": 463005, "epoch": 2755} {"train_loss": -13.043825149536133, "global_step": 463006, "epoch": 2755} {"train_loss": -12.24766324815296, "global_step": 463007, "epoch": 2755, "val_loss": 316450.8125, "train_action_mse_error": 1.9064056873321533} {"train_loss": -11.877195358276367, "global_step": 463008, "epoch": 2756} {"train_loss": -12.319085121154785, "global_step": 463009, "epoch": 2756} {"train_loss": -12.242228507995605, "global_step": 463010, "epoch": 2756} {"train_loss": -12.119562149047852, "global_step": 463011, "epoch": 2756} {"train_loss": -12.774317741394043, "global_step": 463012, "epoch": 2756} {"train_loss": -12.17509651184082, "global_step": 463013, "epoch": 2756} {"train_loss": -12.409225463867188, "global_step": 463014, "epoch": 2756} {"train_loss": -12.541006088256836, "global_step": 463015, "epoch": 2756} {"train_loss": -12.395177841186523, "global_step": 463016, "epoch": 2756} {"train_loss": -12.36263656616211, "global_step": 463017, "epoch": 2756} {"train_loss": -12.120260238647461, "global_step": 463018, "epoch": 2756} {"train_loss": -12.630256652832031, "global_step": 463019, "epoch": 2756} {"train_loss": -12.390238761901855, "global_step": 463020, "epoch": 2756} {"train_loss": -12.407153129577637, "global_step": 463021, "epoch": 2756} {"train_loss": -12.731070518493652, "global_step": 463022, "epoch": 2756} {"train_loss": -12.703622817993164, "global_step": 463023, "epoch": 2756} {"train_loss": -12.72321605682373, "global_step": 463024, "epoch": 2756} {"train_loss": -11.553628921508789, "global_step": 463025, "epoch": 2756} {"train_loss": -12.102087020874023, "global_step": 463026, "epoch": 2756} {"train_loss": -12.63182544708252, "global_step": 463027, "epoch": 2756} {"train_loss": -12.62790584564209, "global_step": 463028, "epoch": 2756} {"train_loss": -12.163318634033203, "global_step": 463029, "epoch": 2756} {"train_loss": -12.069111824035645, "global_step": 463030, "epoch": 2756} {"train_loss": -12.380767822265625, "global_step": 463031, "epoch": 2756} {"train_loss": -12.84858512878418, "global_step": 463032, "epoch": 2756} {"train_loss": -11.907822608947754, "global_step": 463033, "epoch": 2756} {"train_loss": -12.07669448852539, "global_step": 463034, "epoch": 2756} {"train_loss": -12.171485900878906, "global_step": 463035, "epoch": 2756} {"train_loss": -11.497276306152344, "global_step": 463036, "epoch": 2756} {"train_loss": -11.659614562988281, "global_step": 463037, "epoch": 2756} {"train_loss": -12.274477005004883, "global_step": 463038, "epoch": 2756} {"train_loss": -12.629865646362305, "global_step": 463039, "epoch": 2756} {"train_loss": -12.216066360473633, "global_step": 463040, "epoch": 2756} {"train_loss": -12.345331192016602, "global_step": 463041, "epoch": 2756} {"train_loss": -12.255008697509766, "global_step": 463042, "epoch": 2756} {"train_loss": -12.509624481201172, "global_step": 463043, "epoch": 2756} {"train_loss": -12.447702407836914, "global_step": 463044, "epoch": 2756} {"train_loss": -12.177233695983887, "global_step": 463045, "epoch": 2756} {"train_loss": -12.491632461547852, "global_step": 463046, "epoch": 2756} {"train_loss": -12.036420822143555, "global_step": 463047, "epoch": 2756} {"train_loss": -12.086505889892578, "global_step": 463048, "epoch": 2756} {"train_loss": -12.20278549194336, "global_step": 463049, "epoch": 2756} {"train_loss": -12.25008773803711, "global_step": 463050, "epoch": 2756} {"train_loss": -12.220044136047363, "global_step": 463051, "epoch": 2756} {"train_loss": -12.200071334838867, "global_step": 463052, "epoch": 2756} {"train_loss": -11.741437911987305, "global_step": 463053, "epoch": 2756} {"train_loss": -11.847684860229492, "global_step": 463054, "epoch": 2756} {"train_loss": -12.30695915222168, "global_step": 463055, "epoch": 2756} {"train_loss": -11.693868637084961, "global_step": 463056, "epoch": 2756} {"train_loss": -11.589068412780762, "global_step": 463057, "epoch": 2756} {"train_loss": -12.268646240234375, "global_step": 463058, "epoch": 2756} {"train_loss": -11.329916000366211, "global_step": 463059, "epoch": 2756} {"train_loss": -11.033720016479492, "global_step": 463060, "epoch": 2756} {"train_loss": -12.199493408203125, "global_step": 463061, "epoch": 2756} {"train_loss": -11.375532150268555, "global_step": 463062, "epoch": 2756} {"train_loss": -12.09621810913086, "global_step": 463063, "epoch": 2756} {"train_loss": -11.83450984954834, "global_step": 463064, "epoch": 2756} {"train_loss": -11.447343826293945, "global_step": 463065, "epoch": 2756} {"train_loss": -11.625142097473145, "global_step": 463066, "epoch": 2756} {"train_loss": -12.025862693786621, "global_step": 463067, "epoch": 2756} {"train_loss": -11.327198028564453, "global_step": 463068, "epoch": 2756} {"train_loss": -12.219244003295898, "global_step": 463069, "epoch": 2756} {"train_loss": -12.008607864379883, "global_step": 463070, "epoch": 2756} {"train_loss": -12.289196014404297, "global_step": 463071, "epoch": 2756} {"train_loss": -12.344542503356934, "global_step": 463072, "epoch": 2756} {"train_loss": -12.403861999511719, "global_step": 463073, "epoch": 2756} {"train_loss": -11.953271865844727, "global_step": 463074, "epoch": 2756} {"train_loss": -12.118353843688965, "global_step": 463075, "epoch": 2756} {"train_loss": -12.423603057861328, "global_step": 463076, "epoch": 2756} {"train_loss": -12.48260498046875, "global_step": 463077, "epoch": 2756} {"train_loss": -12.322303771972656, "global_step": 463078, "epoch": 2756} {"train_loss": -12.583290100097656, "global_step": 463079, "epoch": 2756} {"train_loss": -12.138219833374023, "global_step": 463080, "epoch": 2756} {"train_loss": -12.056100845336914, "global_step": 463081, "epoch": 2756} {"train_loss": -12.292583465576172, "global_step": 463082, "epoch": 2756} {"train_loss": -12.220344543457031, "global_step": 463083, "epoch": 2756} {"train_loss": -11.906827926635742, "global_step": 463084, "epoch": 2756} {"train_loss": -12.384739875793457, "global_step": 463085, "epoch": 2756} {"train_loss": -12.181829452514648, "global_step": 463086, "epoch": 2756} {"train_loss": -12.436973571777344, "global_step": 463087, "epoch": 2756} {"train_loss": -12.260171890258789, "global_step": 463088, "epoch": 2756} {"train_loss": -12.496784210205078, "global_step": 463089, "epoch": 2756} {"train_loss": -12.57058048248291, "global_step": 463090, "epoch": 2756} {"train_loss": -12.163540840148926, "global_step": 463091, "epoch": 2756} {"train_loss": -12.345233917236328, "global_step": 463092, "epoch": 2756} {"train_loss": -12.501691818237305, "global_step": 463093, "epoch": 2756} {"train_loss": -11.456010818481445, "global_step": 463094, "epoch": 2756} {"train_loss": -12.424691200256348, "global_step": 463095, "epoch": 2756} {"train_loss": -12.35051155090332, "global_step": 463096, "epoch": 2756} {"train_loss": -11.239412307739258, "global_step": 463097, "epoch": 2756} {"train_loss": -12.392862319946289, "global_step": 463098, "epoch": 2756} {"train_loss": -11.812456130981445, "global_step": 463099, "epoch": 2756} {"train_loss": -11.720949172973633, "global_step": 463100, "epoch": 2756} {"train_loss": -12.503305435180664, "global_step": 463101, "epoch": 2756} {"train_loss": -11.549242973327637, "global_step": 463102, "epoch": 2756} {"train_loss": -11.9986572265625, "global_step": 463103, "epoch": 2756} {"train_loss": -12.571487426757812, "global_step": 463104, "epoch": 2756} {"train_loss": -11.441868782043457, "global_step": 463105, "epoch": 2756} {"train_loss": -12.185022354125977, "global_step": 463106, "epoch": 2756} {"train_loss": -12.20372486114502, "global_step": 463107, "epoch": 2756} {"train_loss": -12.35207748413086, "global_step": 463108, "epoch": 2756} {"train_loss": -11.958627700805664, "global_step": 463109, "epoch": 2756} {"train_loss": -12.046733856201172, "global_step": 463110, "epoch": 2756} {"train_loss": -12.551387786865234, "global_step": 463111, "epoch": 2756} {"train_loss": -12.156662940979004, "global_step": 463112, "epoch": 2756} {"train_loss": -12.287353515625, "global_step": 463113, "epoch": 2756} {"train_loss": -12.294851303100586, "global_step": 463114, "epoch": 2756} {"train_loss": -12.299856185913086, "global_step": 463115, "epoch": 2756} {"train_loss": -12.453176498413086, "global_step": 463116, "epoch": 2756} {"train_loss": -12.043343544006348, "global_step": 463117, "epoch": 2756} {"train_loss": -12.632210731506348, "global_step": 463118, "epoch": 2756} {"train_loss": -12.50628662109375, "global_step": 463119, "epoch": 2756} {"train_loss": -12.588805198669434, "global_step": 463120, "epoch": 2756} {"train_loss": -12.618906021118164, "global_step": 463121, "epoch": 2756} {"train_loss": -12.439594268798828, "global_step": 463122, "epoch": 2756} {"train_loss": -12.971942901611328, "global_step": 463123, "epoch": 2756} {"train_loss": -12.380550384521484, "global_step": 463124, "epoch": 2756} {"train_loss": -12.875844955444336, "global_step": 463125, "epoch": 2756} {"train_loss": -12.480118751525879, "global_step": 463126, "epoch": 2756} {"train_loss": -12.873054504394531, "global_step": 463127, "epoch": 2756} {"train_loss": -12.482139587402344, "global_step": 463128, "epoch": 2756} {"train_loss": -12.780052185058594, "global_step": 463129, "epoch": 2756} {"train_loss": -12.714271545410156, "global_step": 463130, "epoch": 2756} {"train_loss": -12.85684585571289, "global_step": 463131, "epoch": 2756} {"train_loss": -12.622852325439453, "global_step": 463132, "epoch": 2756} {"train_loss": -12.679240226745605, "global_step": 463133, "epoch": 2756} {"train_loss": -12.378296852111816, "global_step": 463134, "epoch": 2756} {"train_loss": -12.755630493164062, "global_step": 463135, "epoch": 2756} {"train_loss": -12.65321159362793, "global_step": 463136, "epoch": 2756} {"train_loss": -12.819181442260742, "global_step": 463137, "epoch": 2756} {"train_loss": -12.847254753112793, "global_step": 463138, "epoch": 2756} {"train_loss": -12.893241882324219, "global_step": 463139, "epoch": 2756} {"train_loss": -12.835868835449219, "global_step": 463140, "epoch": 2756} {"train_loss": -12.994989395141602, "global_step": 463141, "epoch": 2756} {"train_loss": -12.52780532836914, "global_step": 463142, "epoch": 2756} {"train_loss": -12.6196928024292, "global_step": 463143, "epoch": 2756} {"train_loss": -12.951176643371582, "global_step": 463144, "epoch": 2756} {"train_loss": -12.501199722290039, "global_step": 463145, "epoch": 2756} {"train_loss": -12.789459228515625, "global_step": 463146, "epoch": 2756} {"train_loss": -12.718719482421875, "global_step": 463147, "epoch": 2756} {"train_loss": -12.806619644165039, "global_step": 463148, "epoch": 2756} {"train_loss": -12.453384399414062, "global_step": 463149, "epoch": 2756} {"train_loss": -12.696585655212402, "global_step": 463150, "epoch": 2756} {"train_loss": -12.3910551071167, "global_step": 463151, "epoch": 2756} {"train_loss": -11.504144668579102, "global_step": 463152, "epoch": 2756} {"train_loss": -11.52775764465332, "global_step": 463153, "epoch": 2756} {"train_loss": -12.585639953613281, "global_step": 463154, "epoch": 2756} {"train_loss": -11.869277000427246, "global_step": 463155, "epoch": 2756} {"train_loss": -11.77212905883789, "global_step": 463156, "epoch": 2756} {"train_loss": -12.2788724899292, "global_step": 463157, "epoch": 2756} {"train_loss": -11.79224681854248, "global_step": 463158, "epoch": 2756} {"train_loss": -11.469306945800781, "global_step": 463159, "epoch": 2756} {"train_loss": -12.346040725708008, "global_step": 463160, "epoch": 2756} {"train_loss": -11.642763137817383, "global_step": 463161, "epoch": 2756} {"train_loss": -12.413063049316406, "global_step": 463162, "epoch": 2756} {"train_loss": -12.236329078674316, "global_step": 463163, "epoch": 2756} {"train_loss": -11.822386741638184, "global_step": 463164, "epoch": 2756} {"train_loss": -12.473531723022461, "global_step": 463165, "epoch": 2756} {"train_loss": -12.222271919250488, "global_step": 463166, "epoch": 2756} {"train_loss": -11.190364837646484, "global_step": 463167, "epoch": 2756} {"train_loss": -11.789752960205078, "global_step": 463168, "epoch": 2756} {"train_loss": -11.836578369140625, "global_step": 463169, "epoch": 2756} {"train_loss": -10.961053848266602, "global_step": 463170, "epoch": 2756} {"train_loss": -11.952505111694336, "global_step": 463171, "epoch": 2756} {"train_loss": -11.50984001159668, "global_step": 463172, "epoch": 2756} {"train_loss": -11.730195999145508, "global_step": 463173, "epoch": 2756} {"train_loss": -11.783019065856934, "global_step": 463174, "epoch": 2756} {"train_loss": -12.226934807641166, "global_step": 463175, "epoch": 2756, "val_loss": 318852.65625} {"train_loss": -11.240534782409668, "global_step": 463176, "epoch": 2757} {"train_loss": -10.915192604064941, "global_step": 463177, "epoch": 2757} {"train_loss": -11.882889747619629, "global_step": 463178, "epoch": 2757} {"train_loss": -11.144379615783691, "global_step": 463179, "epoch": 2757} {"train_loss": -11.44847297668457, "global_step": 463180, "epoch": 2757} {"train_loss": -11.864401817321777, "global_step": 463181, "epoch": 2757} {"train_loss": -11.815899848937988, "global_step": 463182, "epoch": 2757} {"train_loss": -12.130149841308594, "global_step": 463183, "epoch": 2757} {"train_loss": -12.396280288696289, "global_step": 463184, "epoch": 2757} {"train_loss": -11.206571578979492, "global_step": 463185, "epoch": 2757} {"train_loss": -12.003438949584961, "global_step": 463186, "epoch": 2757} {"train_loss": -11.438009262084961, "global_step": 463187, "epoch": 2757} {"train_loss": -11.576742172241211, "global_step": 463188, "epoch": 2757} {"train_loss": -12.162059783935547, "global_step": 463189, "epoch": 2757} {"train_loss": -10.976966857910156, "global_step": 463190, "epoch": 2757} {"train_loss": -11.313122749328613, "global_step": 463191, "epoch": 2757} {"train_loss": -10.815004348754883, "global_step": 463192, "epoch": 2757} {"train_loss": -11.073381423950195, "global_step": 463193, "epoch": 2757} {"train_loss": -11.497237205505371, "global_step": 463194, "epoch": 2757} {"train_loss": -10.903417587280273, "global_step": 463195, "epoch": 2757} {"train_loss": -11.977306365966797, "global_step": 463196, "epoch": 2757} {"train_loss": -11.450384140014648, "global_step": 463197, "epoch": 2757} {"train_loss": -12.398506164550781, "global_step": 463198, "epoch": 2757} {"train_loss": -11.381446838378906, "global_step": 463199, "epoch": 2757} {"train_loss": -12.300088882446289, "global_step": 463200, "epoch": 2757} {"train_loss": -12.177751541137695, "global_step": 463201, "epoch": 2757} {"train_loss": -11.95796012878418, "global_step": 463202, "epoch": 2757} {"train_loss": -12.026958465576172, "global_step": 463203, "epoch": 2757} {"train_loss": -12.008044242858887, "global_step": 463204, "epoch": 2757} {"train_loss": -12.10236644744873, "global_step": 463205, "epoch": 2757} {"train_loss": -11.820486068725586, "global_step": 463206, "epoch": 2757} {"train_loss": -11.31645679473877, "global_step": 463207, "epoch": 2757} {"train_loss": -12.359125137329102, "global_step": 463208, "epoch": 2757} {"train_loss": -11.726509094238281, "global_step": 463209, "epoch": 2757} {"train_loss": -11.985848426818848, "global_step": 463210, "epoch": 2757} {"train_loss": -11.767261505126953, "global_step": 463211, "epoch": 2757} {"train_loss": -12.130966186523438, "global_step": 463212, "epoch": 2757} {"train_loss": -12.071601867675781, "global_step": 463213, "epoch": 2757} {"train_loss": -11.446999549865723, "global_step": 463214, "epoch": 2757} {"train_loss": -11.510848999023438, "global_step": 463215, "epoch": 2757} {"train_loss": -11.75629997253418, "global_step": 463216, "epoch": 2757} {"train_loss": -11.790700912475586, "global_step": 463217, "epoch": 2757} {"train_loss": -11.879453659057617, "global_step": 463218, "epoch": 2757} {"train_loss": -11.538309097290039, "global_step": 463219, "epoch": 2757} {"train_loss": -12.035155296325684, "global_step": 463220, "epoch": 2757} {"train_loss": -12.081562995910645, "global_step": 463221, "epoch": 2757} {"train_loss": -12.30593490600586, "global_step": 463222, "epoch": 2757} {"train_loss": -12.250804901123047, "global_step": 463223, "epoch": 2757} {"train_loss": -12.01856803894043, "global_step": 463224, "epoch": 2757} {"train_loss": -12.12735652923584, "global_step": 463225, "epoch": 2757} {"train_loss": -11.692305564880371, "global_step": 463226, "epoch": 2757} {"train_loss": -11.98485279083252, "global_step": 463227, "epoch": 2757} {"train_loss": -11.900772094726562, "global_step": 463228, "epoch": 2757} {"train_loss": -12.124090194702148, "global_step": 463229, "epoch": 2757} {"train_loss": -11.53626823425293, "global_step": 463230, "epoch": 2757} {"train_loss": -11.28693675994873, "global_step": 463231, "epoch": 2757} {"train_loss": -11.738162994384766, "global_step": 463232, "epoch": 2757} {"train_loss": -11.947334289550781, "global_step": 463233, "epoch": 2757} {"train_loss": -12.08430290222168, "global_step": 463234, "epoch": 2757} {"train_loss": -11.884361267089844, "global_step": 463235, "epoch": 2757} {"train_loss": -12.327596664428711, "global_step": 463236, "epoch": 2757} {"train_loss": -12.143045425415039, "global_step": 463237, "epoch": 2757} {"train_loss": -11.779926300048828, "global_step": 463238, "epoch": 2757} {"train_loss": -12.049964904785156, "global_step": 463239, "epoch": 2757} {"train_loss": -12.156839370727539, "global_step": 463240, "epoch": 2757} {"train_loss": -11.943946838378906, "global_step": 463241, "epoch": 2757} {"train_loss": -11.974767684936523, "global_step": 463242, "epoch": 2757} {"train_loss": -12.355052947998047, "global_step": 463243, "epoch": 2757} {"train_loss": -12.30607795715332, "global_step": 463244, "epoch": 2757} {"train_loss": -12.305386543273926, "global_step": 463245, "epoch": 2757} {"train_loss": -12.087543487548828, "global_step": 463246, "epoch": 2757} {"train_loss": -12.437922477722168, "global_step": 463247, "epoch": 2757} {"train_loss": -12.426158905029297, "global_step": 463248, "epoch": 2757} {"train_loss": -12.503057479858398, "global_step": 463249, "epoch": 2757} {"train_loss": -12.530242919921875, "global_step": 463250, "epoch": 2757} {"train_loss": -12.491071701049805, "global_step": 463251, "epoch": 2757} {"train_loss": -12.368131637573242, "global_step": 463252, "epoch": 2757} {"train_loss": -12.635334014892578, "global_step": 463253, "epoch": 2757} {"train_loss": -12.302169799804688, "global_step": 463254, "epoch": 2757} {"train_loss": -12.46713638305664, "global_step": 463255, "epoch": 2757} {"train_loss": -12.314743041992188, "global_step": 463256, "epoch": 2757} {"train_loss": -12.584099769592285, "global_step": 463257, "epoch": 2757} {"train_loss": -12.312129020690918, "global_step": 463258, "epoch": 2757} {"train_loss": -12.543025970458984, "global_step": 463259, "epoch": 2757} {"train_loss": -12.639607429504395, "global_step": 463260, "epoch": 2757} {"train_loss": -12.735751152038574, "global_step": 463261, "epoch": 2757} {"train_loss": -12.440784454345703, "global_step": 463262, "epoch": 2757} {"train_loss": -12.709297180175781, "global_step": 463263, "epoch": 2757} {"train_loss": -12.55518627166748, "global_step": 463264, "epoch": 2757} {"train_loss": -12.520503997802734, "global_step": 463265, "epoch": 2757} {"train_loss": -12.502439498901367, "global_step": 463266, "epoch": 2757} {"train_loss": -12.591407775878906, "global_step": 463267, "epoch": 2757} {"train_loss": -12.57066535949707, "global_step": 463268, "epoch": 2757} {"train_loss": -12.550801277160645, "global_step": 463269, "epoch": 2757} {"train_loss": -12.728092193603516, "global_step": 463270, "epoch": 2757} {"train_loss": -12.734953880310059, "global_step": 463271, "epoch": 2757} {"train_loss": -12.810102462768555, "global_step": 463272, "epoch": 2757} {"train_loss": -12.816343307495117, "global_step": 463273, "epoch": 2757} {"train_loss": -12.675907135009766, "global_step": 463274, "epoch": 2757} {"train_loss": -12.879901885986328, "global_step": 463275, "epoch": 2757} {"train_loss": -12.829514503479004, "global_step": 463276, "epoch": 2757} {"train_loss": -12.847749710083008, "global_step": 463277, "epoch": 2757} {"train_loss": -12.692142486572266, "global_step": 463278, "epoch": 2757} {"train_loss": -13.010957717895508, "global_step": 463279, "epoch": 2757} {"train_loss": -12.78790283203125, "global_step": 463280, "epoch": 2757} {"train_loss": -12.668476104736328, "global_step": 463281, "epoch": 2757} {"train_loss": -12.759242057800293, "global_step": 463282, "epoch": 2757} {"train_loss": -12.912473678588867, "global_step": 463283, "epoch": 2757} {"train_loss": -12.535594940185547, "global_step": 463284, "epoch": 2757} {"train_loss": -12.866996765136719, "global_step": 463285, "epoch": 2757} {"train_loss": -12.705541610717773, "global_step": 463286, "epoch": 2757} {"train_loss": -12.031631469726562, "global_step": 463287, "epoch": 2757} {"train_loss": -12.380802154541016, "global_step": 463288, "epoch": 2757} {"train_loss": -12.68533706665039, "global_step": 463289, "epoch": 2757} {"train_loss": -12.720208168029785, "global_step": 463290, "epoch": 2757} {"train_loss": -12.413253784179688, "global_step": 463291, "epoch": 2757} {"train_loss": -12.684538841247559, "global_step": 463292, "epoch": 2757} {"train_loss": -12.10853385925293, "global_step": 463293, "epoch": 2757} {"train_loss": -12.256956100463867, "global_step": 463294, "epoch": 2757} {"train_loss": -12.842113494873047, "global_step": 463295, "epoch": 2757} {"train_loss": -12.745933532714844, "global_step": 463296, "epoch": 2757} {"train_loss": -12.903677940368652, "global_step": 463297, "epoch": 2757} {"train_loss": -12.93795108795166, "global_step": 463298, "epoch": 2757} {"train_loss": -12.825826644897461, "global_step": 463299, "epoch": 2757} {"train_loss": -12.819710731506348, "global_step": 463300, "epoch": 2757} {"train_loss": -12.537628173828125, "global_step": 463301, "epoch": 2757} {"train_loss": -12.535674095153809, "global_step": 463302, "epoch": 2757} {"train_loss": -12.581668853759766, "global_step": 463303, "epoch": 2757} {"train_loss": -12.69749641418457, "global_step": 463304, "epoch": 2757} {"train_loss": -12.369693756103516, "global_step": 463305, "epoch": 2757} {"train_loss": -12.896240234375, "global_step": 463306, "epoch": 2757} {"train_loss": -12.713279724121094, "global_step": 463307, "epoch": 2757} {"train_loss": -12.644890785217285, "global_step": 463308, "epoch": 2757} {"train_loss": -12.49980354309082, "global_step": 463309, "epoch": 2757} {"train_loss": -13.00478744506836, "global_step": 463310, "epoch": 2757} {"train_loss": -12.342582702636719, "global_step": 463311, "epoch": 2757} {"train_loss": -12.584327697753906, "global_step": 463312, "epoch": 2757} {"train_loss": -12.651941299438477, "global_step": 463313, "epoch": 2757} {"train_loss": -12.805562019348145, "global_step": 463314, "epoch": 2757} {"train_loss": -12.322479248046875, "global_step": 463315, "epoch": 2757} {"train_loss": -12.782905578613281, "global_step": 463316, "epoch": 2757} {"train_loss": -12.77957534790039, "global_step": 463317, "epoch": 2757} {"train_loss": -12.311283111572266, "global_step": 463318, "epoch": 2757} {"train_loss": -12.48569393157959, "global_step": 463319, "epoch": 2757} {"train_loss": -12.896851539611816, "global_step": 463320, "epoch": 2757} {"train_loss": -12.720839500427246, "global_step": 463321, "epoch": 2757} {"train_loss": -12.542478561401367, "global_step": 463322, "epoch": 2757} {"train_loss": -12.905111312866211, "global_step": 463323, "epoch": 2757} {"train_loss": -12.740674018859863, "global_step": 463324, "epoch": 2757} {"train_loss": -12.645995140075684, "global_step": 463325, "epoch": 2757} {"train_loss": -12.648524284362793, "global_step": 463326, "epoch": 2757} {"train_loss": -12.45094108581543, "global_step": 463327, "epoch": 2757} {"train_loss": -12.900887489318848, "global_step": 463328, "epoch": 2757} {"train_loss": -12.68921184539795, "global_step": 463329, "epoch": 2757} {"train_loss": -12.417606353759766, "global_step": 463330, "epoch": 2757} {"train_loss": -12.516990661621094, "global_step": 463331, "epoch": 2757} {"train_loss": -13.077820777893066, "global_step": 463332, "epoch": 2757} {"train_loss": -12.561248779296875, "global_step": 463333, "epoch": 2757} {"train_loss": -12.6795072555542, "global_step": 463334, "epoch": 2757} {"train_loss": -12.574837684631348, "global_step": 463335, "epoch": 2757} {"train_loss": -12.246965408325195, "global_step": 463336, "epoch": 2757} {"train_loss": -11.307653427124023, "global_step": 463337, "epoch": 2757} {"train_loss": -12.231437683105469, "global_step": 463338, "epoch": 2757} {"train_loss": -12.82874870300293, "global_step": 463339, "epoch": 2757} {"train_loss": -11.277482986450195, "global_step": 463340, "epoch": 2757} {"train_loss": -12.506810188293457, "global_step": 463341, "epoch": 2757} {"train_loss": -12.347742080688477, "global_step": 463342, "epoch": 2757} {"train_loss": -12.263845188277108, "global_step": 463343, "epoch": 2757, "val_loss": 315621.40625} {"train_loss": -12.450336456298828, "global_step": 463344, "epoch": 2758} {"train_loss": -12.473960876464844, "global_step": 463345, "epoch": 2758} {"train_loss": -12.358871459960938, "global_step": 463346, "epoch": 2758} {"train_loss": -11.47335433959961, "global_step": 463347, "epoch": 2758} {"train_loss": -11.998676300048828, "global_step": 463348, "epoch": 2758} {"train_loss": -12.003698348999023, "global_step": 463349, "epoch": 2758} {"train_loss": -11.13656997680664, "global_step": 463350, "epoch": 2758} {"train_loss": -11.196499824523926, "global_step": 463351, "epoch": 2758} {"train_loss": -11.64245891571045, "global_step": 463352, "epoch": 2758} {"train_loss": -8.872360229492188, "global_step": 463353, "epoch": 2758} {"train_loss": -10.909444808959961, "global_step": 463354, "epoch": 2758} {"train_loss": -10.214546203613281, "global_step": 463355, "epoch": 2758} {"train_loss": -9.200410842895508, "global_step": 463356, "epoch": 2758} {"train_loss": -9.62583065032959, "global_step": 463357, "epoch": 2758} {"train_loss": -11.559381484985352, "global_step": 463358, "epoch": 2758} {"train_loss": -11.094018936157227, "global_step": 463359, "epoch": 2758} {"train_loss": -11.286540985107422, "global_step": 463360, "epoch": 2758} {"train_loss": -11.666460037231445, "global_step": 463361, "epoch": 2758} {"train_loss": -10.827874183654785, "global_step": 463362, "epoch": 2758} {"train_loss": -11.642695426940918, "global_step": 463363, "epoch": 2758} {"train_loss": -9.02587890625, "global_step": 463364, "epoch": 2758} {"train_loss": -9.54359245300293, "global_step": 463365, "epoch": 2758} {"train_loss": -10.859716415405273, "global_step": 463366, "epoch": 2758} {"train_loss": -9.756219863891602, "global_step": 463367, "epoch": 2758} {"train_loss": -8.33065414428711, "global_step": 463368, "epoch": 2758} {"train_loss": -8.365762710571289, "global_step": 463369, "epoch": 2758} {"train_loss": -8.765735626220703, "global_step": 463370, "epoch": 2758} {"train_loss": -9.29208755493164, "global_step": 463371, "epoch": 2758} {"train_loss": -9.212303161621094, "global_step": 463372, "epoch": 2758} {"train_loss": -8.610101699829102, "global_step": 463373, "epoch": 2758} {"train_loss": -8.448576927185059, "global_step": 463374, "epoch": 2758} {"train_loss": -9.302145004272461, "global_step": 463375, "epoch": 2758} {"train_loss": -9.351398468017578, "global_step": 463376, "epoch": 2758} {"train_loss": -9.65992259979248, "global_step": 463377, "epoch": 2758} {"train_loss": -9.766154289245605, "global_step": 463378, "epoch": 2758} {"train_loss": -10.190672874450684, "global_step": 463379, "epoch": 2758} {"train_loss": -10.231731414794922, "global_step": 463380, "epoch": 2758} {"train_loss": -10.237407684326172, "global_step": 463381, "epoch": 2758} {"train_loss": -10.750367164611816, "global_step": 463382, "epoch": 2758} {"train_loss": -10.987112998962402, "global_step": 463383, "epoch": 2758} {"train_loss": -10.858694076538086, "global_step": 463384, "epoch": 2758} {"train_loss": -10.881326675415039, "global_step": 463385, "epoch": 2758} {"train_loss": -10.93587875366211, "global_step": 463386, "epoch": 2758} {"train_loss": -11.474567413330078, "global_step": 463387, "epoch": 2758} {"train_loss": -11.397513389587402, "global_step": 463388, "epoch": 2758} {"train_loss": -11.133816719055176, "global_step": 463389, "epoch": 2758} {"train_loss": -11.586478233337402, "global_step": 463390, "epoch": 2758} {"train_loss": -11.185507774353027, "global_step": 463391, "epoch": 2758} {"train_loss": -11.923300743103027, "global_step": 463392, "epoch": 2758} {"train_loss": -11.718170166015625, "global_step": 463393, "epoch": 2758} {"train_loss": -11.765498161315918, "global_step": 463394, "epoch": 2758} {"train_loss": -11.494016647338867, "global_step": 463395, "epoch": 2758} {"train_loss": -11.735517501831055, "global_step": 463396, "epoch": 2758} {"train_loss": -12.236825942993164, "global_step": 463397, "epoch": 2758} {"train_loss": -11.936920166015625, "global_step": 463398, "epoch": 2758} {"train_loss": -11.911012649536133, "global_step": 463399, "epoch": 2758} {"train_loss": -12.357906341552734, "global_step": 463400, "epoch": 2758} {"train_loss": -11.903704643249512, "global_step": 463401, "epoch": 2758} {"train_loss": -12.063056945800781, "global_step": 463402, "epoch": 2758} {"train_loss": -12.261208534240723, "global_step": 463403, "epoch": 2758} {"train_loss": -11.656761169433594, "global_step": 463404, "epoch": 2758} {"train_loss": -12.134014129638672, "global_step": 463405, "epoch": 2758} {"train_loss": -11.959716796875, "global_step": 463406, "epoch": 2758} {"train_loss": -12.275426864624023, "global_step": 463407, "epoch": 2758} {"train_loss": -12.162556648254395, "global_step": 463408, "epoch": 2758} {"train_loss": -12.014991760253906, "global_step": 463409, "epoch": 2758} {"train_loss": -12.377020835876465, "global_step": 463410, "epoch": 2758} {"train_loss": -12.428735733032227, "global_step": 463411, "epoch": 2758} {"train_loss": -12.472358703613281, "global_step": 463412, "epoch": 2758} {"train_loss": -12.510889053344727, "global_step": 463413, "epoch": 2758} {"train_loss": -12.435151100158691, "global_step": 463414, "epoch": 2758} {"train_loss": -12.389863967895508, "global_step": 463415, "epoch": 2758} {"train_loss": -12.16356372833252, "global_step": 463416, "epoch": 2758} {"train_loss": -12.485990524291992, "global_step": 463417, "epoch": 2758} {"train_loss": -12.293582916259766, "global_step": 463418, "epoch": 2758} {"train_loss": -12.416801452636719, "global_step": 463419, "epoch": 2758} {"train_loss": -12.752010345458984, "global_step": 463420, "epoch": 2758} {"train_loss": -12.69249439239502, "global_step": 463421, "epoch": 2758} {"train_loss": -12.671875, "global_step": 463422, "epoch": 2758} {"train_loss": -12.50632095336914, "global_step": 463423, "epoch": 2758} {"train_loss": -12.681920051574707, "global_step": 463424, "epoch": 2758} {"train_loss": -12.57204818725586, "global_step": 463425, "epoch": 2758} {"train_loss": -12.676408767700195, "global_step": 463426, "epoch": 2758} {"train_loss": -12.736123085021973, "global_step": 463427, "epoch": 2758} {"train_loss": -12.624540328979492, "global_step": 463428, "epoch": 2758} {"train_loss": -12.545833587646484, "global_step": 463429, "epoch": 2758} {"train_loss": -12.654988288879395, "global_step": 463430, "epoch": 2758} {"train_loss": -12.566742897033691, "global_step": 463431, "epoch": 2758} {"train_loss": -12.701244354248047, "global_step": 463432, "epoch": 2758} {"train_loss": -12.570104598999023, "global_step": 463433, "epoch": 2758} {"train_loss": -12.749628067016602, "global_step": 463434, "epoch": 2758} {"train_loss": -12.830530166625977, "global_step": 463435, "epoch": 2758} {"train_loss": -12.598623275756836, "global_step": 463436, "epoch": 2758} {"train_loss": -12.578433990478516, "global_step": 463437, "epoch": 2758} {"train_loss": -12.742260932922363, "global_step": 463438, "epoch": 2758} {"train_loss": -12.218259811401367, "global_step": 463439, "epoch": 2758} {"train_loss": -12.626957893371582, "global_step": 463440, "epoch": 2758} {"train_loss": -12.370564460754395, "global_step": 463441, "epoch": 2758} {"train_loss": -12.62894058227539, "global_step": 463442, "epoch": 2758} {"train_loss": -12.185895919799805, "global_step": 463443, "epoch": 2758} {"train_loss": -12.64871597290039, "global_step": 463444, "epoch": 2758} {"train_loss": -12.510417938232422, "global_step": 463445, "epoch": 2758} {"train_loss": -12.636809349060059, "global_step": 463446, "epoch": 2758} {"train_loss": -12.581985473632812, "global_step": 463447, "epoch": 2758} {"train_loss": -12.548221588134766, "global_step": 463448, "epoch": 2758} {"train_loss": -11.810464859008789, "global_step": 463449, "epoch": 2758} {"train_loss": -12.405284881591797, "global_step": 463450, "epoch": 2758} {"train_loss": -12.344643592834473, "global_step": 463451, "epoch": 2758} {"train_loss": -12.130351066589355, "global_step": 463452, "epoch": 2758} {"train_loss": -11.807832717895508, "global_step": 463453, "epoch": 2758} {"train_loss": -12.639068603515625, "global_step": 463454, "epoch": 2758} {"train_loss": -10.860918998718262, "global_step": 463455, "epoch": 2758} {"train_loss": -11.773958206176758, "global_step": 463456, "epoch": 2758} {"train_loss": -11.326221466064453, "global_step": 463457, "epoch": 2758} {"train_loss": -12.216848373413086, "global_step": 463458, "epoch": 2758} {"train_loss": -12.473876953125, "global_step": 463459, "epoch": 2758} {"train_loss": -11.559908866882324, "global_step": 463460, "epoch": 2758} {"train_loss": -12.418916702270508, "global_step": 463461, "epoch": 2758} {"train_loss": -11.195491790771484, "global_step": 463462, "epoch": 2758} {"train_loss": -12.238712310791016, "global_step": 463463, "epoch": 2758} {"train_loss": -11.865446090698242, "global_step": 463464, "epoch": 2758} {"train_loss": -12.381304740905762, "global_step": 463465, "epoch": 2758} {"train_loss": -11.317994117736816, "global_step": 463466, "epoch": 2758} {"train_loss": -11.94422721862793, "global_step": 463467, "epoch": 2758} {"train_loss": -11.901582717895508, "global_step": 463468, "epoch": 2758} {"train_loss": -11.769054412841797, "global_step": 463469, "epoch": 2758} {"train_loss": -11.835277557373047, "global_step": 463470, "epoch": 2758} {"train_loss": -12.295272827148438, "global_step": 463471, "epoch": 2758} {"train_loss": -11.892995834350586, "global_step": 463472, "epoch": 2758} {"train_loss": -11.508085250854492, "global_step": 463473, "epoch": 2758} {"train_loss": -12.264166831970215, "global_step": 463474, "epoch": 2758} {"train_loss": -11.937915802001953, "global_step": 463475, "epoch": 2758} {"train_loss": -11.475725173950195, "global_step": 463476, "epoch": 2758} {"train_loss": -12.16625690460205, "global_step": 463477, "epoch": 2758} {"train_loss": -11.613436698913574, "global_step": 463478, "epoch": 2758} {"train_loss": -12.398548126220703, "global_step": 463479, "epoch": 2758} {"train_loss": -11.289867401123047, "global_step": 463480, "epoch": 2758} {"train_loss": -11.518254280090332, "global_step": 463481, "epoch": 2758} {"train_loss": -12.216773986816406, "global_step": 463482, "epoch": 2758} {"train_loss": -10.391999244689941, "global_step": 463483, "epoch": 2758} {"train_loss": -11.323474884033203, "global_step": 463484, "epoch": 2758} {"train_loss": -10.587621688842773, "global_step": 463485, "epoch": 2758} {"train_loss": -10.975637435913086, "global_step": 463486, "epoch": 2758} {"train_loss": -10.56885051727295, "global_step": 463487, "epoch": 2758} {"train_loss": -11.852408409118652, "global_step": 463488, "epoch": 2758} {"train_loss": -11.616327285766602, "global_step": 463489, "epoch": 2758} {"train_loss": -11.781420707702637, "global_step": 463490, "epoch": 2758} {"train_loss": -11.759565353393555, "global_step": 463491, "epoch": 2758} {"train_loss": -10.196622848510742, "global_step": 463492, "epoch": 2758} {"train_loss": -11.695018768310547, "global_step": 463493, "epoch": 2758} {"train_loss": -11.312719345092773, "global_step": 463494, "epoch": 2758} {"train_loss": -12.21101188659668, "global_step": 463495, "epoch": 2758} {"train_loss": -11.920098304748535, "global_step": 463496, "epoch": 2758} {"train_loss": -12.449390411376953, "global_step": 463497, "epoch": 2758} {"train_loss": -12.453557968139648, "global_step": 463498, "epoch": 2758} {"train_loss": -12.029191970825195, "global_step": 463499, "epoch": 2758} {"train_loss": -12.568524360656738, "global_step": 463500, "epoch": 2758} {"train_loss": -12.221832275390625, "global_step": 463501, "epoch": 2758} {"train_loss": -12.469864845275879, "global_step": 463502, "epoch": 2758} {"train_loss": -12.438626289367676, "global_step": 463503, "epoch": 2758} {"train_loss": -12.449203491210938, "global_step": 463504, "epoch": 2758} {"train_loss": -12.705702781677246, "global_step": 463505, "epoch": 2758} {"train_loss": -12.656798362731934, "global_step": 463506, "epoch": 2758} {"train_loss": -12.462398529052734, "global_step": 463507, "epoch": 2758} {"train_loss": -12.699629783630371, "global_step": 463508, "epoch": 2758} {"train_loss": -12.548117637634277, "global_step": 463509, "epoch": 2758} {"train_loss": -12.54252815246582, "global_step": 463510, "epoch": 2758} {"train_loss": -11.65972105662028, "global_step": 463511, "epoch": 2758, "val_loss": 317980.34375} {"train_loss": -12.66669750213623, "global_step": 463512, "epoch": 2759} {"train_loss": -12.46689510345459, "global_step": 463513, "epoch": 2759} {"train_loss": -12.573665618896484, "global_step": 463514, "epoch": 2759} {"train_loss": -12.430318832397461, "global_step": 463515, "epoch": 2759} {"train_loss": -12.475340843200684, "global_step": 463516, "epoch": 2759} {"train_loss": -12.807819366455078, "global_step": 463517, "epoch": 2759} {"train_loss": -12.45236873626709, "global_step": 463518, "epoch": 2759} {"train_loss": -12.562849044799805, "global_step": 463519, "epoch": 2759} {"train_loss": -12.300657272338867, "global_step": 463520, "epoch": 2759} {"train_loss": -12.608866691589355, "global_step": 463521, "epoch": 2759} {"train_loss": -12.759638786315918, "global_step": 463522, "epoch": 2759} {"train_loss": -12.807405471801758, "global_step": 463523, "epoch": 2759} {"train_loss": -12.595707893371582, "global_step": 463524, "epoch": 2759} {"train_loss": -12.454462051391602, "global_step": 463525, "epoch": 2759} {"train_loss": -12.546031951904297, "global_step": 463526, "epoch": 2759} {"train_loss": -12.912691116333008, "global_step": 463527, "epoch": 2759} {"train_loss": -12.633556365966797, "global_step": 463528, "epoch": 2759} {"train_loss": -12.90071964263916, "global_step": 463529, "epoch": 2759} {"train_loss": -12.563594818115234, "global_step": 463530, "epoch": 2759} {"train_loss": -12.768203735351562, "global_step": 463531, "epoch": 2759} {"train_loss": -12.66682243347168, "global_step": 463532, "epoch": 2759} {"train_loss": -12.692543983459473, "global_step": 463533, "epoch": 2759} {"train_loss": -12.691177368164062, "global_step": 463534, "epoch": 2759} {"train_loss": -12.695863723754883, "global_step": 463535, "epoch": 2759} {"train_loss": -12.469970703125, "global_step": 463536, "epoch": 2759} {"train_loss": -12.967203140258789, "global_step": 463537, "epoch": 2759} {"train_loss": -12.446396827697754, "global_step": 463538, "epoch": 2759} {"train_loss": -12.741985321044922, "global_step": 463539, "epoch": 2759} {"train_loss": -12.63625431060791, "global_step": 463540, "epoch": 2759} {"train_loss": -12.771581649780273, "global_step": 463541, "epoch": 2759} {"train_loss": -12.517389297485352, "global_step": 463542, "epoch": 2759} {"train_loss": -12.782062530517578, "global_step": 463543, "epoch": 2759} {"train_loss": -12.740160942077637, "global_step": 463544, "epoch": 2759} {"train_loss": -12.557487487792969, "global_step": 463545, "epoch": 2759} {"train_loss": -12.43841552734375, "global_step": 463546, "epoch": 2759} {"train_loss": -12.737754821777344, "global_step": 463547, "epoch": 2759} {"train_loss": -12.461883544921875, "global_step": 463548, "epoch": 2759} {"train_loss": -12.04581069946289, "global_step": 463549, "epoch": 2759} {"train_loss": -12.810582160949707, "global_step": 463550, "epoch": 2759} {"train_loss": -12.564250946044922, "global_step": 463551, "epoch": 2759} {"train_loss": -12.170637130737305, "global_step": 463552, "epoch": 2759} {"train_loss": -12.658921241760254, "global_step": 463553, "epoch": 2759} {"train_loss": -11.78693675994873, "global_step": 463554, "epoch": 2759} {"train_loss": -12.150873184204102, "global_step": 463555, "epoch": 2759} {"train_loss": -12.831032752990723, "global_step": 463556, "epoch": 2759} {"train_loss": -11.906425476074219, "global_step": 463557, "epoch": 2759} {"train_loss": -12.748087882995605, "global_step": 463558, "epoch": 2759} {"train_loss": -12.126167297363281, "global_step": 463559, "epoch": 2759} {"train_loss": -11.877092361450195, "global_step": 463560, "epoch": 2759} {"train_loss": -12.191167831420898, "global_step": 463561, "epoch": 2759} {"train_loss": -12.323282241821289, "global_step": 463562, "epoch": 2759} {"train_loss": -12.076695442199707, "global_step": 463563, "epoch": 2759} {"train_loss": -12.463208198547363, "global_step": 463564, "epoch": 2759} {"train_loss": -11.608930587768555, "global_step": 463565, "epoch": 2759} {"train_loss": -11.983348846435547, "global_step": 463566, "epoch": 2759} {"train_loss": -12.082696914672852, "global_step": 463567, "epoch": 2759} {"train_loss": -12.362936019897461, "global_step": 463568, "epoch": 2759} {"train_loss": -11.803314208984375, "global_step": 463569, "epoch": 2759} {"train_loss": -10.988082885742188, "global_step": 463570, "epoch": 2759} {"train_loss": -11.988473892211914, "global_step": 463571, "epoch": 2759} {"train_loss": -11.353408813476562, "global_step": 463572, "epoch": 2759} {"train_loss": -10.733894348144531, "global_step": 463573, "epoch": 2759} {"train_loss": -11.572528839111328, "global_step": 463574, "epoch": 2759} {"train_loss": -11.545787811279297, "global_step": 463575, "epoch": 2759} {"train_loss": -12.258353233337402, "global_step": 463576, "epoch": 2759} {"train_loss": -11.536260604858398, "global_step": 463577, "epoch": 2759} {"train_loss": -11.399419784545898, "global_step": 463578, "epoch": 2759} {"train_loss": -12.153583526611328, "global_step": 463579, "epoch": 2759} {"train_loss": -10.658315658569336, "global_step": 463580, "epoch": 2759} {"train_loss": -12.10810661315918, "global_step": 463581, "epoch": 2759} {"train_loss": -11.235584259033203, "global_step": 463582, "epoch": 2759} {"train_loss": -11.240363121032715, "global_step": 463583, "epoch": 2759} {"train_loss": -11.173768997192383, "global_step": 463584, "epoch": 2759} {"train_loss": -11.647717475891113, "global_step": 463585, "epoch": 2759} {"train_loss": -11.512161254882812, "global_step": 463586, "epoch": 2759} {"train_loss": -11.88656234741211, "global_step": 463587, "epoch": 2759} {"train_loss": -11.516654968261719, "global_step": 463588, "epoch": 2759} {"train_loss": -11.740817070007324, "global_step": 463589, "epoch": 2759} {"train_loss": -12.342199325561523, "global_step": 463590, "epoch": 2759} {"train_loss": -11.924249649047852, "global_step": 463591, "epoch": 2759} {"train_loss": -12.26093578338623, "global_step": 463592, "epoch": 2759} {"train_loss": -12.470471382141113, "global_step": 463593, "epoch": 2759} {"train_loss": -12.010732650756836, "global_step": 463594, "epoch": 2759} {"train_loss": -12.386540412902832, "global_step": 463595, "epoch": 2759} {"train_loss": -12.245412826538086, "global_step": 463596, "epoch": 2759} {"train_loss": -11.129095077514648, "global_step": 463597, "epoch": 2759} {"train_loss": -12.446056365966797, "global_step": 463598, "epoch": 2759} {"train_loss": -11.5511474609375, "global_step": 463599, "epoch": 2759} {"train_loss": -12.106754302978516, "global_step": 463600, "epoch": 2759} {"train_loss": -12.183049201965332, "global_step": 463601, "epoch": 2759} {"train_loss": -12.033899307250977, "global_step": 463602, "epoch": 2759} {"train_loss": -12.662332534790039, "global_step": 463603, "epoch": 2759} {"train_loss": -11.420452117919922, "global_step": 463604, "epoch": 2759} {"train_loss": -11.904932022094727, "global_step": 463605, "epoch": 2759} {"train_loss": -11.599149703979492, "global_step": 463606, "epoch": 2759} {"train_loss": -11.815668106079102, "global_step": 463607, "epoch": 2759} {"train_loss": -10.888490676879883, "global_step": 463608, "epoch": 2759} {"train_loss": -11.23314094543457, "global_step": 463609, "epoch": 2759} {"train_loss": -11.366263389587402, "global_step": 463610, "epoch": 2759} {"train_loss": -10.245689392089844, "global_step": 463611, "epoch": 2759} {"train_loss": -11.11108112335205, "global_step": 463612, "epoch": 2759} {"train_loss": -11.59376335144043, "global_step": 463613, "epoch": 2759} {"train_loss": -10.50857925415039, "global_step": 463614, "epoch": 2759} {"train_loss": -11.388219833374023, "global_step": 463615, "epoch": 2759} {"train_loss": -11.779885292053223, "global_step": 463616, "epoch": 2759} {"train_loss": -10.814765930175781, "global_step": 463617, "epoch": 2759} {"train_loss": -11.609914779663086, "global_step": 463618, "epoch": 2759} {"train_loss": -11.990537643432617, "global_step": 463619, "epoch": 2759} {"train_loss": -11.806096076965332, "global_step": 463620, "epoch": 2759} {"train_loss": -12.220077514648438, "global_step": 463621, "epoch": 2759} {"train_loss": -11.849722862243652, "global_step": 463622, "epoch": 2759} {"train_loss": -11.2677583694458, "global_step": 463623, "epoch": 2759} {"train_loss": -11.533670425415039, "global_step": 463624, "epoch": 2759} {"train_loss": -10.963505744934082, "global_step": 463625, "epoch": 2759} {"train_loss": -10.781679153442383, "global_step": 463626, "epoch": 2759} {"train_loss": -11.868806838989258, "global_step": 463627, "epoch": 2759} {"train_loss": -11.00900650024414, "global_step": 463628, "epoch": 2759} {"train_loss": -11.600374221801758, "global_step": 463629, "epoch": 2759} {"train_loss": -11.221630096435547, "global_step": 463630, "epoch": 2759} {"train_loss": -11.385345458984375, "global_step": 463631, "epoch": 2759} {"train_loss": -11.434297561645508, "global_step": 463632, "epoch": 2759} {"train_loss": -11.538307189941406, "global_step": 463633, "epoch": 2759} {"train_loss": -12.087316513061523, "global_step": 463634, "epoch": 2759} {"train_loss": -11.951791763305664, "global_step": 463635, "epoch": 2759} {"train_loss": -11.732712745666504, "global_step": 463636, "epoch": 2759} {"train_loss": -11.888327598571777, "global_step": 463637, "epoch": 2759} {"train_loss": -12.173791885375977, "global_step": 463638, "epoch": 2759} {"train_loss": -12.05654525756836, "global_step": 463639, "epoch": 2759} {"train_loss": -11.82202434539795, "global_step": 463640, "epoch": 2759} {"train_loss": -12.12233829498291, "global_step": 463641, "epoch": 2759} {"train_loss": -11.844440460205078, "global_step": 463642, "epoch": 2759} {"train_loss": -12.416953086853027, "global_step": 463643, "epoch": 2759} {"train_loss": -11.51848030090332, "global_step": 463644, "epoch": 2759} {"train_loss": -12.154351234436035, "global_step": 463645, "epoch": 2759} {"train_loss": -12.183367729187012, "global_step": 463646, "epoch": 2759} {"train_loss": -12.055032730102539, "global_step": 463647, "epoch": 2759} {"train_loss": -12.525634765625, "global_step": 463648, "epoch": 2759} {"train_loss": -12.40053653717041, "global_step": 463649, "epoch": 2759} {"train_loss": -12.404865264892578, "global_step": 463650, "epoch": 2759} {"train_loss": -12.585527420043945, "global_step": 463651, "epoch": 2759} {"train_loss": -12.246116638183594, "global_step": 463652, "epoch": 2759} {"train_loss": -12.180447578430176, "global_step": 463653, "epoch": 2759} {"train_loss": -12.184694290161133, "global_step": 463654, "epoch": 2759} {"train_loss": -11.744020462036133, "global_step": 463655, "epoch": 2759} {"train_loss": -12.385785102844238, "global_step": 463656, "epoch": 2759} {"train_loss": -11.896974563598633, "global_step": 463657, "epoch": 2759} {"train_loss": -11.721075057983398, "global_step": 463658, "epoch": 2759} {"train_loss": -12.246633529663086, "global_step": 463659, "epoch": 2759} {"train_loss": -11.497014999389648, "global_step": 463660, "epoch": 2759} {"train_loss": -12.250657081604004, "global_step": 463661, "epoch": 2759} {"train_loss": -11.685834884643555, "global_step": 463662, "epoch": 2759} {"train_loss": -12.03884506225586, "global_step": 463663, "epoch": 2759} {"train_loss": -11.742013931274414, "global_step": 463664, "epoch": 2759} {"train_loss": -12.24091911315918, "global_step": 463665, "epoch": 2759} {"train_loss": -11.890111923217773, "global_step": 463666, "epoch": 2759} {"train_loss": -12.145318031311035, "global_step": 463667, "epoch": 2759} {"train_loss": -12.090412139892578, "global_step": 463668, "epoch": 2759} {"train_loss": -11.81295394897461, "global_step": 463669, "epoch": 2759} {"train_loss": -12.41142749786377, "global_step": 463670, "epoch": 2759} {"train_loss": -11.748700141906738, "global_step": 463671, "epoch": 2759} {"train_loss": -12.277591705322266, "global_step": 463672, "epoch": 2759} {"train_loss": -12.397834777832031, "global_step": 463673, "epoch": 2759} {"train_loss": -12.245909690856934, "global_step": 463674, "epoch": 2759} {"train_loss": -12.047388076782227, "global_step": 463675, "epoch": 2759} {"train_loss": -12.538990020751953, "global_step": 463676, "epoch": 2759} {"train_loss": -11.78902530670166, "global_step": 463677, "epoch": 2759} {"train_loss": -12.616283416748047, "global_step": 463678, "epoch": 2759} {"train_loss": -12.034346188817706, "global_step": 463679, "epoch": 2759, "val_loss": 317906.25} {"train_loss": -12.119417190551758, "global_step": 463680, "epoch": 2760} {"train_loss": -12.510992050170898, "global_step": 463681, "epoch": 2760} {"train_loss": -12.322815895080566, "global_step": 463682, "epoch": 2760} {"train_loss": -12.67684268951416, "global_step": 463683, "epoch": 2760} {"train_loss": -12.485876083374023, "global_step": 463684, "epoch": 2760} {"train_loss": -12.569684982299805, "global_step": 463685, "epoch": 2760} {"train_loss": -12.647850036621094, "global_step": 463686, "epoch": 2760} {"train_loss": -12.320358276367188, "global_step": 463687, "epoch": 2760} {"train_loss": -12.699851036071777, "global_step": 463688, "epoch": 2760} {"train_loss": -12.554838180541992, "global_step": 463689, "epoch": 2760} {"train_loss": -12.30396556854248, "global_step": 463690, "epoch": 2760} {"train_loss": -12.480825424194336, "global_step": 463691, "epoch": 2760} {"train_loss": -12.563514709472656, "global_step": 463692, "epoch": 2760} {"train_loss": -12.63874626159668, "global_step": 463693, "epoch": 2760} {"train_loss": -12.487690925598145, "global_step": 463694, "epoch": 2760} {"train_loss": -12.551555633544922, "global_step": 463695, "epoch": 2760} {"train_loss": -12.67556381225586, "global_step": 463696, "epoch": 2760} {"train_loss": -12.743942260742188, "global_step": 463697, "epoch": 2760} {"train_loss": -12.48436164855957, "global_step": 463698, "epoch": 2760} {"train_loss": -12.678611755371094, "global_step": 463699, "epoch": 2760} {"train_loss": -12.552173614501953, "global_step": 463700, "epoch": 2760} {"train_loss": -12.609040260314941, "global_step": 463701, "epoch": 2760} {"train_loss": -12.665143966674805, "global_step": 463702, "epoch": 2760} {"train_loss": -12.524641990661621, "global_step": 463703, "epoch": 2760} {"train_loss": -12.588787078857422, "global_step": 463704, "epoch": 2760} {"train_loss": -12.615318298339844, "global_step": 463705, "epoch": 2760} {"train_loss": -12.790875434875488, "global_step": 463706, "epoch": 2760} {"train_loss": -12.682350158691406, "global_step": 463707, "epoch": 2760} {"train_loss": -12.716708183288574, "global_step": 463708, "epoch": 2760} {"train_loss": -12.843542098999023, "global_step": 463709, "epoch": 2760} {"train_loss": -12.740375518798828, "global_step": 463710, "epoch": 2760} {"train_loss": -12.937597274780273, "global_step": 463711, "epoch": 2760} {"train_loss": -13.069188117980957, "global_step": 463712, "epoch": 2760} {"train_loss": -12.670036315917969, "global_step": 463713, "epoch": 2760} {"train_loss": -12.747026443481445, "global_step": 463714, "epoch": 2760} {"train_loss": -12.764792442321777, "global_step": 463715, "epoch": 2760} {"train_loss": -12.663690567016602, "global_step": 463716, "epoch": 2760} {"train_loss": -12.924424171447754, "global_step": 463717, "epoch": 2760} {"train_loss": -12.63426399230957, "global_step": 463718, "epoch": 2760} {"train_loss": -12.594690322875977, "global_step": 463719, "epoch": 2760} {"train_loss": -13.069379806518555, "global_step": 463720, "epoch": 2760} {"train_loss": -12.696235656738281, "global_step": 463721, "epoch": 2760} {"train_loss": -12.74152946472168, "global_step": 463722, "epoch": 2760} {"train_loss": -12.69552993774414, "global_step": 463723, "epoch": 2760} {"train_loss": -12.275369644165039, "global_step": 463724, "epoch": 2760} {"train_loss": -12.592723846435547, "global_step": 463725, "epoch": 2760} {"train_loss": -11.941104888916016, "global_step": 463726, "epoch": 2760} {"train_loss": -11.978120803833008, "global_step": 463727, "epoch": 2760} {"train_loss": -12.302899360656738, "global_step": 463728, "epoch": 2760} {"train_loss": -12.116523742675781, "global_step": 463729, "epoch": 2760} {"train_loss": -11.98759937286377, "global_step": 463730, "epoch": 2760} {"train_loss": -12.440180778503418, "global_step": 463731, "epoch": 2760} {"train_loss": -11.751155853271484, "global_step": 463732, "epoch": 2760} {"train_loss": -12.38499927520752, "global_step": 463733, "epoch": 2760} {"train_loss": -11.783401489257812, "global_step": 463734, "epoch": 2760} {"train_loss": -12.496126174926758, "global_step": 463735, "epoch": 2760} {"train_loss": -12.169292449951172, "global_step": 463736, "epoch": 2760} {"train_loss": -11.989300727844238, "global_step": 463737, "epoch": 2760} {"train_loss": -12.544441223144531, "global_step": 463738, "epoch": 2760} {"train_loss": -11.919520378112793, "global_step": 463739, "epoch": 2760} {"train_loss": -12.567693710327148, "global_step": 463740, "epoch": 2760} {"train_loss": -12.642308235168457, "global_step": 463741, "epoch": 2760} {"train_loss": -12.356931686401367, "global_step": 463742, "epoch": 2760} {"train_loss": -12.395081520080566, "global_step": 463743, "epoch": 2760} {"train_loss": -12.763269424438477, "global_step": 463744, "epoch": 2760} {"train_loss": -11.910017013549805, "global_step": 463745, "epoch": 2760} {"train_loss": -12.68387222290039, "global_step": 463746, "epoch": 2760} {"train_loss": -12.296918869018555, "global_step": 463747, "epoch": 2760} {"train_loss": -12.145576477050781, "global_step": 463748, "epoch": 2760} {"train_loss": -12.56416130065918, "global_step": 463749, "epoch": 2760} {"train_loss": -12.158981323242188, "global_step": 463750, "epoch": 2760} {"train_loss": -12.737714767456055, "global_step": 463751, "epoch": 2760} {"train_loss": -11.890216827392578, "global_step": 463752, "epoch": 2760} {"train_loss": -12.133893966674805, "global_step": 463753, "epoch": 2760} {"train_loss": -12.733010292053223, "global_step": 463754, "epoch": 2760} {"train_loss": -12.381118774414062, "global_step": 463755, "epoch": 2760} {"train_loss": -12.194839477539062, "global_step": 463756, "epoch": 2760} {"train_loss": -12.555980682373047, "global_step": 463757, "epoch": 2760} {"train_loss": -12.38150691986084, "global_step": 463758, "epoch": 2760} {"train_loss": -12.217227935791016, "global_step": 463759, "epoch": 2760} {"train_loss": -12.933481216430664, "global_step": 463760, "epoch": 2760} {"train_loss": -12.632161140441895, "global_step": 463761, "epoch": 2760} {"train_loss": -12.403558731079102, "global_step": 463762, "epoch": 2760} {"train_loss": -12.71435546875, "global_step": 463763, "epoch": 2760} {"train_loss": -12.612396240234375, "global_step": 463764, "epoch": 2760} {"train_loss": -12.373712539672852, "global_step": 463765, "epoch": 2760} {"train_loss": -12.43874740600586, "global_step": 463766, "epoch": 2760} {"train_loss": -12.61059284210205, "global_step": 463767, "epoch": 2760} {"train_loss": -12.54580020904541, "global_step": 463768, "epoch": 2760} {"train_loss": -12.366305351257324, "global_step": 463769, "epoch": 2760} {"train_loss": -12.642468452453613, "global_step": 463770, "epoch": 2760} {"train_loss": -12.653135299682617, "global_step": 463771, "epoch": 2760} {"train_loss": -12.599913597106934, "global_step": 463772, "epoch": 2760} {"train_loss": -13.013996124267578, "global_step": 463773, "epoch": 2760} {"train_loss": -12.67557144165039, "global_step": 463774, "epoch": 2760} {"train_loss": -12.577413558959961, "global_step": 463775, "epoch": 2760} {"train_loss": -12.767332077026367, "global_step": 463776, "epoch": 2760} {"train_loss": -12.638154983520508, "global_step": 463777, "epoch": 2760} {"train_loss": -12.672590255737305, "global_step": 463778, "epoch": 2760} {"train_loss": -12.430673599243164, "global_step": 463779, "epoch": 2760} {"train_loss": -12.631311416625977, "global_step": 463780, "epoch": 2760} {"train_loss": -12.539154052734375, "global_step": 463781, "epoch": 2760} {"train_loss": -12.521761894226074, "global_step": 463782, "epoch": 2760} {"train_loss": -12.685480117797852, "global_step": 463783, "epoch": 2760} {"train_loss": -12.806716918945312, "global_step": 463784, "epoch": 2760} {"train_loss": -12.533233642578125, "global_step": 463785, "epoch": 2760} {"train_loss": -12.354747772216797, "global_step": 463786, "epoch": 2760} {"train_loss": -12.782807350158691, "global_step": 463787, "epoch": 2760} {"train_loss": -11.913135528564453, "global_step": 463788, "epoch": 2760} {"train_loss": -12.316621780395508, "global_step": 463789, "epoch": 2760} {"train_loss": -12.73402214050293, "global_step": 463790, "epoch": 2760} {"train_loss": -12.134586334228516, "global_step": 463791, "epoch": 2760} {"train_loss": -12.817875862121582, "global_step": 463792, "epoch": 2760} {"train_loss": -12.604290008544922, "global_step": 463793, "epoch": 2760} {"train_loss": -12.895565032958984, "global_step": 463794, "epoch": 2760} {"train_loss": -12.895285606384277, "global_step": 463795, "epoch": 2760} {"train_loss": -12.656753540039062, "global_step": 463796, "epoch": 2760} {"train_loss": -12.71337890625, "global_step": 463797, "epoch": 2760} {"train_loss": -12.822864532470703, "global_step": 463798, "epoch": 2760} {"train_loss": -12.776493072509766, "global_step": 463799, "epoch": 2760} {"train_loss": -12.38848876953125, "global_step": 463800, "epoch": 2760} {"train_loss": -12.702960968017578, "global_step": 463801, "epoch": 2760} {"train_loss": -12.743639945983887, "global_step": 463802, "epoch": 2760} {"train_loss": -12.709063529968262, "global_step": 463803, "epoch": 2760} {"train_loss": -12.630866050720215, "global_step": 463804, "epoch": 2760} {"train_loss": -12.524934768676758, "global_step": 463805, "epoch": 2760} {"train_loss": -12.691533088684082, "global_step": 463806, "epoch": 2760} {"train_loss": -12.547601699829102, "global_step": 463807, "epoch": 2760} {"train_loss": -12.523396492004395, "global_step": 463808, "epoch": 2760} {"train_loss": -11.924607276916504, "global_step": 463809, "epoch": 2760} {"train_loss": -11.797844886779785, "global_step": 463810, "epoch": 2760} {"train_loss": -11.777935028076172, "global_step": 463811, "epoch": 2760} {"train_loss": -11.662668228149414, "global_step": 463812, "epoch": 2760} {"train_loss": -12.399063110351562, "global_step": 463813, "epoch": 2760} {"train_loss": -11.880727767944336, "global_step": 463814, "epoch": 2760} {"train_loss": -12.190500259399414, "global_step": 463815, "epoch": 2760} {"train_loss": -12.324068069458008, "global_step": 463816, "epoch": 2760} {"train_loss": -11.133306503295898, "global_step": 463817, "epoch": 2760} {"train_loss": -12.299919128417969, "global_step": 463818, "epoch": 2760} {"train_loss": -11.098970413208008, "global_step": 463819, "epoch": 2760} {"train_loss": -11.661596298217773, "global_step": 463820, "epoch": 2760} {"train_loss": -11.688304901123047, "global_step": 463821, "epoch": 2760} {"train_loss": -11.26893424987793, "global_step": 463822, "epoch": 2760} {"train_loss": -10.967583656311035, "global_step": 463823, "epoch": 2760} {"train_loss": -11.384758949279785, "global_step": 463824, "epoch": 2760} {"train_loss": -11.226842880249023, "global_step": 463825, "epoch": 2760} {"train_loss": -11.786933898925781, "global_step": 463826, "epoch": 2760} {"train_loss": -11.688478469848633, "global_step": 463827, "epoch": 2760} {"train_loss": -11.392410278320312, "global_step": 463828, "epoch": 2760} {"train_loss": -11.623379707336426, "global_step": 463829, "epoch": 2760} {"train_loss": -10.83455753326416, "global_step": 463830, "epoch": 2760} {"train_loss": -11.763843536376953, "global_step": 463831, "epoch": 2760} {"train_loss": -11.600217819213867, "global_step": 463832, "epoch": 2760} {"train_loss": -11.28222942352295, "global_step": 463833, "epoch": 2760} {"train_loss": -12.06241512298584, "global_step": 463834, "epoch": 2760} {"train_loss": -11.430171966552734, "global_step": 463835, "epoch": 2760} {"train_loss": -12.04908275604248, "global_step": 463836, "epoch": 2760} {"train_loss": -12.105112075805664, "global_step": 463837, "epoch": 2760} {"train_loss": -12.625068664550781, "global_step": 463838, "epoch": 2760} {"train_loss": -11.926985740661621, "global_step": 463839, "epoch": 2760} {"train_loss": -12.034351348876953, "global_step": 463840, "epoch": 2760} {"train_loss": -12.568437576293945, "global_step": 463841, "epoch": 2760} {"train_loss": -11.682514190673828, "global_step": 463842, "epoch": 2760} {"train_loss": -11.888609886169434, "global_step": 463843, "epoch": 2760} {"train_loss": -12.39709186553955, "global_step": 463844, "epoch": 2760} {"train_loss": -12.241533279418945, "global_step": 463845, "epoch": 2760} {"train_loss": -12.455387115478516, "global_step": 463846, "epoch": 2760} {"train_loss": -12.361371971312023, "global_step": 463847, "epoch": 2760, "val_loss": 314535.46875, "train_action_mse_error": 0.36803627014160156} {"train_loss": -12.329607009887695, "global_step": 463848, "epoch": 2761} {"train_loss": -12.151551246643066, "global_step": 463849, "epoch": 2761} {"train_loss": -11.329217910766602, "global_step": 463850, "epoch": 2761} {"train_loss": -11.724136352539062, "global_step": 463851, "epoch": 2761} {"train_loss": -11.688365936279297, "global_step": 463852, "epoch": 2761} {"train_loss": -11.951953887939453, "global_step": 463853, "epoch": 2761} {"train_loss": -11.508413314819336, "global_step": 463854, "epoch": 2761} {"train_loss": -11.238967895507812, "global_step": 463855, "epoch": 2761} {"train_loss": -11.909090042114258, "global_step": 463856, "epoch": 2761} {"train_loss": -11.83153247833252, "global_step": 463857, "epoch": 2761} {"train_loss": -10.69309139251709, "global_step": 463858, "epoch": 2761} {"train_loss": -11.416576385498047, "global_step": 463859, "epoch": 2761} {"train_loss": -10.49582576751709, "global_step": 463860, "epoch": 2761} {"train_loss": -11.243962287902832, "global_step": 463861, "epoch": 2761} {"train_loss": -10.096075057983398, "global_step": 463862, "epoch": 2761} {"train_loss": -11.6422119140625, "global_step": 463863, "epoch": 2761} {"train_loss": -11.995823860168457, "global_step": 463864, "epoch": 2761} {"train_loss": -10.760441780090332, "global_step": 463865, "epoch": 2761} {"train_loss": -11.498472213745117, "global_step": 463866, "epoch": 2761} {"train_loss": -11.80429458618164, "global_step": 463867, "epoch": 2761} {"train_loss": -12.205366134643555, "global_step": 463868, "epoch": 2761} {"train_loss": -11.592304229736328, "global_step": 463869, "epoch": 2761} {"train_loss": -12.232443809509277, "global_step": 463870, "epoch": 2761} {"train_loss": -11.957321166992188, "global_step": 463871, "epoch": 2761} {"train_loss": -11.49154281616211, "global_step": 463872, "epoch": 2761} {"train_loss": -12.13117504119873, "global_step": 463873, "epoch": 2761} {"train_loss": -11.66008186340332, "global_step": 463874, "epoch": 2761} {"train_loss": -12.061312675476074, "global_step": 463875, "epoch": 2761} {"train_loss": -11.611528396606445, "global_step": 463876, "epoch": 2761} {"train_loss": -12.381763458251953, "global_step": 463877, "epoch": 2761} {"train_loss": -11.728181838989258, "global_step": 463878, "epoch": 2761} {"train_loss": -12.440909385681152, "global_step": 463879, "epoch": 2761} {"train_loss": -11.816171646118164, "global_step": 463880, "epoch": 2761} {"train_loss": -12.272621154785156, "global_step": 463881, "epoch": 2761} {"train_loss": -12.089990615844727, "global_step": 463882, "epoch": 2761} {"train_loss": -12.441789627075195, "global_step": 463883, "epoch": 2761} {"train_loss": -11.985836029052734, "global_step": 463884, "epoch": 2761} {"train_loss": -12.623027801513672, "global_step": 463885, "epoch": 2761} {"train_loss": -11.838507652282715, "global_step": 463886, "epoch": 2761} {"train_loss": -12.054325103759766, "global_step": 463887, "epoch": 2761} {"train_loss": -12.164017677307129, "global_step": 463888, "epoch": 2761} {"train_loss": -12.257412910461426, "global_step": 463889, "epoch": 2761} {"train_loss": -12.115068435668945, "global_step": 463890, "epoch": 2761} {"train_loss": -11.868813514709473, "global_step": 463891, "epoch": 2761} {"train_loss": -12.339601516723633, "global_step": 463892, "epoch": 2761} {"train_loss": -11.601728439331055, "global_step": 463893, "epoch": 2761} {"train_loss": -12.337566375732422, "global_step": 463894, "epoch": 2761} {"train_loss": -11.897499084472656, "global_step": 463895, "epoch": 2761} {"train_loss": -12.355612754821777, "global_step": 463896, "epoch": 2761} {"train_loss": -12.193981170654297, "global_step": 463897, "epoch": 2761} {"train_loss": -11.20649528503418, "global_step": 463898, "epoch": 2761} {"train_loss": -12.11900520324707, "global_step": 463899, "epoch": 2761} {"train_loss": -11.518783569335938, "global_step": 463900, "epoch": 2761} {"train_loss": -12.374551773071289, "global_step": 463901, "epoch": 2761} {"train_loss": -11.80663776397705, "global_step": 463902, "epoch": 2761} {"train_loss": -12.203195571899414, "global_step": 463903, "epoch": 2761} {"train_loss": -12.31680965423584, "global_step": 463904, "epoch": 2761} {"train_loss": -11.964441299438477, "global_step": 463905, "epoch": 2761} {"train_loss": -12.333144187927246, "global_step": 463906, "epoch": 2761} {"train_loss": -12.31009292602539, "global_step": 463907, "epoch": 2761} {"train_loss": -11.69769287109375, "global_step": 463908, "epoch": 2761} {"train_loss": -12.298574447631836, "global_step": 463909, "epoch": 2761} {"train_loss": -12.207479476928711, "global_step": 463910, "epoch": 2761} {"train_loss": -11.92989730834961, "global_step": 463911, "epoch": 2761} {"train_loss": -12.355951309204102, "global_step": 463912, "epoch": 2761} {"train_loss": -11.828706741333008, "global_step": 463913, "epoch": 2761} {"train_loss": -12.249963760375977, "global_step": 463914, "epoch": 2761} {"train_loss": -12.15031909942627, "global_step": 463915, "epoch": 2761} {"train_loss": -12.325698852539062, "global_step": 463916, "epoch": 2761} {"train_loss": -12.606430053710938, "global_step": 463917, "epoch": 2761} {"train_loss": -12.345582962036133, "global_step": 463918, "epoch": 2761} {"train_loss": -11.896100044250488, "global_step": 463919, "epoch": 2761} {"train_loss": -12.56617546081543, "global_step": 463920, "epoch": 2761} {"train_loss": -12.106172561645508, "global_step": 463921, "epoch": 2761} {"train_loss": -12.238041877746582, "global_step": 463922, "epoch": 2761} {"train_loss": -12.519899368286133, "global_step": 463923, "epoch": 2761} {"train_loss": -12.489532470703125, "global_step": 463924, "epoch": 2761} {"train_loss": -12.244243621826172, "global_step": 463925, "epoch": 2761} {"train_loss": -12.380112648010254, "global_step": 463926, "epoch": 2761} {"train_loss": -12.3778715133667, "global_step": 463927, "epoch": 2761} {"train_loss": -12.364507675170898, "global_step": 463928, "epoch": 2761} {"train_loss": -12.501290321350098, "global_step": 463929, "epoch": 2761} {"train_loss": -12.57652473449707, "global_step": 463930, "epoch": 2761} {"train_loss": -12.599508285522461, "global_step": 463931, "epoch": 2761} {"train_loss": -12.43971061706543, "global_step": 463932, "epoch": 2761} {"train_loss": -12.549095153808594, "global_step": 463933, "epoch": 2761} {"train_loss": -12.564802169799805, "global_step": 463934, "epoch": 2761} {"train_loss": -12.778634071350098, "global_step": 463935, "epoch": 2761} {"train_loss": -12.721824645996094, "global_step": 463936, "epoch": 2761} {"train_loss": -12.79677677154541, "global_step": 463937, "epoch": 2761} {"train_loss": -12.787384033203125, "global_step": 463938, "epoch": 2761} {"train_loss": -12.803715705871582, "global_step": 463939, "epoch": 2761} {"train_loss": -12.88630199432373, "global_step": 463940, "epoch": 2761} {"train_loss": -12.634954452514648, "global_step": 463941, "epoch": 2761} {"train_loss": -12.842439651489258, "global_step": 463942, "epoch": 2761} {"train_loss": -12.746771812438965, "global_step": 463943, "epoch": 2761} {"train_loss": -12.877480506896973, "global_step": 463944, "epoch": 2761} {"train_loss": -12.893802642822266, "global_step": 463945, "epoch": 2761} {"train_loss": -12.78939437866211, "global_step": 463946, "epoch": 2761} {"train_loss": -12.563186645507812, "global_step": 463947, "epoch": 2761} {"train_loss": -12.863343238830566, "global_step": 463948, "epoch": 2761} {"train_loss": -12.992053985595703, "global_step": 463949, "epoch": 2761} {"train_loss": -12.942314147949219, "global_step": 463950, "epoch": 2761} {"train_loss": -12.850004196166992, "global_step": 463951, "epoch": 2761} {"train_loss": -12.99437141418457, "global_step": 463952, "epoch": 2761} {"train_loss": -12.87142276763916, "global_step": 463953, "epoch": 2761} {"train_loss": -12.93478775024414, "global_step": 463954, "epoch": 2761} {"train_loss": -12.914935111999512, "global_step": 463955, "epoch": 2761} {"train_loss": -12.717742919921875, "global_step": 463956, "epoch": 2761} {"train_loss": -12.946037292480469, "global_step": 463957, "epoch": 2761} {"train_loss": -12.945456504821777, "global_step": 463958, "epoch": 2761} {"train_loss": -12.962955474853516, "global_step": 463959, "epoch": 2761} {"train_loss": -13.059596061706543, "global_step": 463960, "epoch": 2761} {"train_loss": -12.798116683959961, "global_step": 463961, "epoch": 2761} {"train_loss": -12.959760665893555, "global_step": 463962, "epoch": 2761} {"train_loss": -12.7647705078125, "global_step": 463963, "epoch": 2761} {"train_loss": -12.721942901611328, "global_step": 463964, "epoch": 2761} {"train_loss": -13.067520141601562, "global_step": 463965, "epoch": 2761} {"train_loss": -12.61855697631836, "global_step": 463966, "epoch": 2761} {"train_loss": -12.649328231811523, "global_step": 463967, "epoch": 2761} {"train_loss": -12.894420623779297, "global_step": 463968, "epoch": 2761} {"train_loss": -12.922051429748535, "global_step": 463969, "epoch": 2761} {"train_loss": -12.813614845275879, "global_step": 463970, "epoch": 2761} {"train_loss": -12.967967987060547, "global_step": 463971, "epoch": 2761} {"train_loss": -12.832206726074219, "global_step": 463972, "epoch": 2761} {"train_loss": -12.956748008728027, "global_step": 463973, "epoch": 2761} {"train_loss": -12.813422203063965, "global_step": 463974, "epoch": 2761} {"train_loss": -13.050963401794434, "global_step": 463975, "epoch": 2761} {"train_loss": -12.84227180480957, "global_step": 463976, "epoch": 2761} {"train_loss": -13.192360877990723, "global_step": 463977, "epoch": 2761} {"train_loss": -13.073495864868164, "global_step": 463978, "epoch": 2761} {"train_loss": -13.079659461975098, "global_step": 463979, "epoch": 2761} {"train_loss": -12.921186447143555, "global_step": 463980, "epoch": 2761} {"train_loss": -12.980561256408691, "global_step": 463981, "epoch": 2761} {"train_loss": -13.163578033447266, "global_step": 463982, "epoch": 2761} {"train_loss": -12.873871803283691, "global_step": 463983, "epoch": 2761} {"train_loss": -12.706930160522461, "global_step": 463984, "epoch": 2761} {"train_loss": -13.125715255737305, "global_step": 463985, "epoch": 2761} {"train_loss": -12.730628967285156, "global_step": 463986, "epoch": 2761} {"train_loss": -12.850425720214844, "global_step": 463987, "epoch": 2761} {"train_loss": -12.516661643981934, "global_step": 463988, "epoch": 2761} {"train_loss": -12.87961196899414, "global_step": 463989, "epoch": 2761} {"train_loss": -12.96925163269043, "global_step": 463990, "epoch": 2761} {"train_loss": -12.556804656982422, "global_step": 463991, "epoch": 2761} {"train_loss": -11.93379020690918, "global_step": 463992, "epoch": 2761} {"train_loss": -10.745805740356445, "global_step": 463993, "epoch": 2761} {"train_loss": -11.455768585205078, "global_step": 463994, "epoch": 2761} {"train_loss": -12.413775444030762, "global_step": 463995, "epoch": 2761} {"train_loss": -12.633094787597656, "global_step": 463996, "epoch": 2761} {"train_loss": -12.631218910217285, "global_step": 463997, "epoch": 2761} {"train_loss": -11.518510818481445, "global_step": 463998, "epoch": 2761} {"train_loss": -11.94082260131836, "global_step": 463999, "epoch": 2761} {"train_loss": -13.121161460876465, "global_step": 464000, "epoch": 2761} {"train_loss": -11.164499282836914, "global_step": 464001, "epoch": 2761} {"train_loss": -10.135770797729492, "global_step": 464002, "epoch": 2761} {"train_loss": -12.500588417053223, "global_step": 464003, "epoch": 2761} {"train_loss": -11.426291465759277, "global_step": 464004, "epoch": 2761} {"train_loss": -10.12999153137207, "global_step": 464005, "epoch": 2761} {"train_loss": -10.098787307739258, "global_step": 464006, "epoch": 2761} {"train_loss": -10.402711868286133, "global_step": 464007, "epoch": 2761} {"train_loss": -9.845048904418945, "global_step": 464008, "epoch": 2761} {"train_loss": -9.425376892089844, "global_step": 464009, "epoch": 2761} {"train_loss": -9.987059593200684, "global_step": 464010, "epoch": 2761} {"train_loss": -12.072400093078613, "global_step": 464011, "epoch": 2761} {"train_loss": -9.82064437866211, "global_step": 464012, "epoch": 2761} {"train_loss": -9.692432403564453, "global_step": 464013, "epoch": 2761} {"train_loss": -11.43173599243164, "global_step": 464014, "epoch": 2761} {"train_loss": -12.168476706459408, "global_step": 464015, "epoch": 2761, "val_loss": 311148.75} {"train_loss": -9.621684074401855, "global_step": 464016, "epoch": 2762} {"train_loss": -12.018999099731445, "global_step": 464017, "epoch": 2762} {"train_loss": -10.692855834960938, "global_step": 464018, "epoch": 2762} {"train_loss": -7.664206027984619, "global_step": 464019, "epoch": 2762} {"train_loss": -9.751544952392578, "global_step": 464020, "epoch": 2762} {"train_loss": -10.807390213012695, "global_step": 464021, "epoch": 2762} {"train_loss": -10.028520584106445, "global_step": 464022, "epoch": 2762} {"train_loss": -9.901766777038574, "global_step": 464023, "epoch": 2762} {"train_loss": -11.094398498535156, "global_step": 464024, "epoch": 2762} {"train_loss": -11.303418159484863, "global_step": 464025, "epoch": 2762} {"train_loss": -11.673171997070312, "global_step": 464026, "epoch": 2762} {"train_loss": -12.013261795043945, "global_step": 464027, "epoch": 2762} {"train_loss": -11.936351776123047, "global_step": 464028, "epoch": 2762} {"train_loss": -11.504119873046875, "global_step": 464029, "epoch": 2762} {"train_loss": -11.63415813446045, "global_step": 464030, "epoch": 2762} {"train_loss": -11.809168815612793, "global_step": 464031, "epoch": 2762} {"train_loss": -12.16329288482666, "global_step": 464032, "epoch": 2762} {"train_loss": -12.2174711227417, "global_step": 464033, "epoch": 2762} {"train_loss": -12.237447738647461, "global_step": 464034, "epoch": 2762} {"train_loss": -12.231292724609375, "global_step": 464035, "epoch": 2762} {"train_loss": -12.362617492675781, "global_step": 464036, "epoch": 2762} {"train_loss": -12.419326782226562, "global_step": 464037, "epoch": 2762} {"train_loss": -12.291849136352539, "global_step": 464038, "epoch": 2762} {"train_loss": -12.460721969604492, "global_step": 464039, "epoch": 2762} {"train_loss": -11.9912109375, "global_step": 464040, "epoch": 2762} {"train_loss": -12.270682334899902, "global_step": 464041, "epoch": 2762} {"train_loss": -12.275198936462402, "global_step": 464042, "epoch": 2762} {"train_loss": -11.501877784729004, "global_step": 464043, "epoch": 2762} {"train_loss": -11.514981269836426, "global_step": 464044, "epoch": 2762} {"train_loss": -12.206876754760742, "global_step": 464045, "epoch": 2762} {"train_loss": -11.782519340515137, "global_step": 464046, "epoch": 2762} {"train_loss": -12.427328109741211, "global_step": 464047, "epoch": 2762} {"train_loss": -12.050251007080078, "global_step": 464048, "epoch": 2762} {"train_loss": -11.16506290435791, "global_step": 464049, "epoch": 2762} {"train_loss": -11.038105010986328, "global_step": 464050, "epoch": 2762} {"train_loss": -11.417023658752441, "global_step": 464051, "epoch": 2762} {"train_loss": -9.871395111083984, "global_step": 464052, "epoch": 2762} {"train_loss": -11.368486404418945, "global_step": 464053, "epoch": 2762} {"train_loss": -10.239381790161133, "global_step": 464054, "epoch": 2762} {"train_loss": -11.642505645751953, "global_step": 464055, "epoch": 2762} {"train_loss": -10.589151382446289, "global_step": 464056, "epoch": 2762} {"train_loss": -11.36233901977539, "global_step": 464057, "epoch": 2762} {"train_loss": -10.999496459960938, "global_step": 464058, "epoch": 2762} {"train_loss": -11.412294387817383, "global_step": 464059, "epoch": 2762} {"train_loss": -11.855714797973633, "global_step": 464060, "epoch": 2762} {"train_loss": -11.032800674438477, "global_step": 464061, "epoch": 2762} {"train_loss": -12.08152961730957, "global_step": 464062, "epoch": 2762} {"train_loss": -11.705299377441406, "global_step": 464063, "epoch": 2762} {"train_loss": -11.745386123657227, "global_step": 464064, "epoch": 2762} {"train_loss": -12.179974555969238, "global_step": 464065, "epoch": 2762} {"train_loss": -11.721531867980957, "global_step": 464066, "epoch": 2762} {"train_loss": -11.90649127960205, "global_step": 464067, "epoch": 2762} {"train_loss": -11.675065994262695, "global_step": 464068, "epoch": 2762} {"train_loss": -11.698070526123047, "global_step": 464069, "epoch": 2762} {"train_loss": -12.384414672851562, "global_step": 464070, "epoch": 2762} {"train_loss": -11.974095344543457, "global_step": 464071, "epoch": 2762} {"train_loss": -11.674776077270508, "global_step": 464072, "epoch": 2762} {"train_loss": -12.292505264282227, "global_step": 464073, "epoch": 2762} {"train_loss": -12.195117950439453, "global_step": 464074, "epoch": 2762} {"train_loss": -12.340973854064941, "global_step": 464075, "epoch": 2762} {"train_loss": -12.266813278198242, "global_step": 464076, "epoch": 2762} {"train_loss": -11.88496208190918, "global_step": 464077, "epoch": 2762} {"train_loss": -12.069064140319824, "global_step": 464078, "epoch": 2762} {"train_loss": -11.992761611938477, "global_step": 464079, "epoch": 2762} {"train_loss": -11.793045043945312, "global_step": 464080, "epoch": 2762} {"train_loss": -11.255521774291992, "global_step": 464081, "epoch": 2762} {"train_loss": -11.89554214477539, "global_step": 464082, "epoch": 2762} {"train_loss": -11.595067977905273, "global_step": 464083, "epoch": 2762} {"train_loss": -11.240117073059082, "global_step": 464084, "epoch": 2762} {"train_loss": -11.91627025604248, "global_step": 464085, "epoch": 2762} {"train_loss": -11.470848083496094, "global_step": 464086, "epoch": 2762} {"train_loss": -10.740965843200684, "global_step": 464087, "epoch": 2762} {"train_loss": -11.363119125366211, "global_step": 464088, "epoch": 2762} {"train_loss": -10.875631332397461, "global_step": 464089, "epoch": 2762} {"train_loss": -11.372888565063477, "global_step": 464090, "epoch": 2762} {"train_loss": -11.165611267089844, "global_step": 464091, "epoch": 2762} {"train_loss": -12.11371898651123, "global_step": 464092, "epoch": 2762} {"train_loss": -11.40929889678955, "global_step": 464093, "epoch": 2762} {"train_loss": -12.173254013061523, "global_step": 464094, "epoch": 2762} {"train_loss": -11.638383865356445, "global_step": 464095, "epoch": 2762} {"train_loss": -11.98251724243164, "global_step": 464096, "epoch": 2762} {"train_loss": -12.010040283203125, "global_step": 464097, "epoch": 2762} {"train_loss": -11.998758316040039, "global_step": 464098, "epoch": 2762} {"train_loss": -12.163025856018066, "global_step": 464099, "epoch": 2762} {"train_loss": -12.13022232055664, "global_step": 464100, "epoch": 2762} {"train_loss": -12.390172004699707, "global_step": 464101, "epoch": 2762} {"train_loss": -11.894948959350586, "global_step": 464102, "epoch": 2762} {"train_loss": -12.361921310424805, "global_step": 464103, "epoch": 2762} {"train_loss": -12.145159721374512, "global_step": 464104, "epoch": 2762} {"train_loss": -12.268014907836914, "global_step": 464105, "epoch": 2762} {"train_loss": -11.884665489196777, "global_step": 464106, "epoch": 2762} {"train_loss": -12.391733169555664, "global_step": 464107, "epoch": 2762} {"train_loss": -12.273988723754883, "global_step": 464108, "epoch": 2762} {"train_loss": -12.338388442993164, "global_step": 464109, "epoch": 2762} {"train_loss": -12.296502113342285, "global_step": 464110, "epoch": 2762} {"train_loss": -12.182271003723145, "global_step": 464111, "epoch": 2762} {"train_loss": -12.124504089355469, "global_step": 464112, "epoch": 2762} {"train_loss": -12.448439598083496, "global_step": 464113, "epoch": 2762} {"train_loss": -12.316854476928711, "global_step": 464114, "epoch": 2762} {"train_loss": -12.478500366210938, "global_step": 464115, "epoch": 2762} {"train_loss": -12.519407272338867, "global_step": 464116, "epoch": 2762} {"train_loss": -12.539228439331055, "global_step": 464117, "epoch": 2762} {"train_loss": -12.457046508789062, "global_step": 464118, "epoch": 2762} {"train_loss": -12.54000473022461, "global_step": 464119, "epoch": 2762} {"train_loss": -12.305109024047852, "global_step": 464120, "epoch": 2762} {"train_loss": -12.464120864868164, "global_step": 464121, "epoch": 2762} {"train_loss": -12.531347274780273, "global_step": 464122, "epoch": 2762} {"train_loss": -12.559379577636719, "global_step": 464123, "epoch": 2762} {"train_loss": -12.781965255737305, "global_step": 464124, "epoch": 2762} {"train_loss": -12.457612991333008, "global_step": 464125, "epoch": 2762} {"train_loss": -12.765615463256836, "global_step": 464126, "epoch": 2762} {"train_loss": -12.179068565368652, "global_step": 464127, "epoch": 2762} {"train_loss": -12.568269729614258, "global_step": 464128, "epoch": 2762} {"train_loss": -12.740877151489258, "global_step": 464129, "epoch": 2762} {"train_loss": -12.351285934448242, "global_step": 464130, "epoch": 2762} {"train_loss": -12.795463562011719, "global_step": 464131, "epoch": 2762} {"train_loss": -12.53669261932373, "global_step": 464132, "epoch": 2762} {"train_loss": -12.353182792663574, "global_step": 464133, "epoch": 2762} {"train_loss": -12.472661972045898, "global_step": 464134, "epoch": 2762} {"train_loss": -11.894740104675293, "global_step": 464135, "epoch": 2762} {"train_loss": -12.425050735473633, "global_step": 464136, "epoch": 2762} {"train_loss": -12.605770111083984, "global_step": 464137, "epoch": 2762} {"train_loss": -12.278520584106445, "global_step": 464138, "epoch": 2762} {"train_loss": -12.76744270324707, "global_step": 464139, "epoch": 2762} {"train_loss": -12.637804985046387, "global_step": 464140, "epoch": 2762} {"train_loss": -12.368642807006836, "global_step": 464141, "epoch": 2762} {"train_loss": -12.581719398498535, "global_step": 464142, "epoch": 2762} {"train_loss": -12.45832633972168, "global_step": 464143, "epoch": 2762} {"train_loss": -12.630680084228516, "global_step": 464144, "epoch": 2762} {"train_loss": -12.671825408935547, "global_step": 464145, "epoch": 2762} {"train_loss": -12.689382553100586, "global_step": 464146, "epoch": 2762} {"train_loss": -12.547605514526367, "global_step": 464147, "epoch": 2762} {"train_loss": -12.803227424621582, "global_step": 464148, "epoch": 2762} {"train_loss": -12.555374145507812, "global_step": 464149, "epoch": 2762} {"train_loss": -12.763053894042969, "global_step": 464150, "epoch": 2762} {"train_loss": -12.524620056152344, "global_step": 464151, "epoch": 2762} {"train_loss": -12.954113006591797, "global_step": 464152, "epoch": 2762} {"train_loss": -12.704975128173828, "global_step": 464153, "epoch": 2762} {"train_loss": -12.372978210449219, "global_step": 464154, "epoch": 2762} {"train_loss": -12.809966087341309, "global_step": 464155, "epoch": 2762} {"train_loss": -12.794422149658203, "global_step": 464156, "epoch": 2762} {"train_loss": -12.643794059753418, "global_step": 464157, "epoch": 2762} {"train_loss": -12.543257713317871, "global_step": 464158, "epoch": 2762} {"train_loss": -13.038843154907227, "global_step": 464159, "epoch": 2762} {"train_loss": -12.814127922058105, "global_step": 464160, "epoch": 2762} {"train_loss": -12.726361274719238, "global_step": 464161, "epoch": 2762} {"train_loss": -12.972736358642578, "global_step": 464162, "epoch": 2762} {"train_loss": -12.936174392700195, "global_step": 464163, "epoch": 2762} {"train_loss": -12.92449951171875, "global_step": 464164, "epoch": 2762} {"train_loss": -12.708707809448242, "global_step": 464165, "epoch": 2762} {"train_loss": -12.748563766479492, "global_step": 464166, "epoch": 2762} {"train_loss": -12.416460990905762, "global_step": 464167, "epoch": 2762} {"train_loss": -12.642367362976074, "global_step": 464168, "epoch": 2762} {"train_loss": -12.861326217651367, "global_step": 464169, "epoch": 2762} {"train_loss": -12.617469787597656, "global_step": 464170, "epoch": 2762} {"train_loss": -12.354991912841797, "global_step": 464171, "epoch": 2762} {"train_loss": -12.99264907836914, "global_step": 464172, "epoch": 2762} {"train_loss": -12.144939422607422, "global_step": 464173, "epoch": 2762} {"train_loss": -12.595643997192383, "global_step": 464174, "epoch": 2762} {"train_loss": -12.32206916809082, "global_step": 464175, "epoch": 2762} {"train_loss": -12.762478828430176, "global_step": 464176, "epoch": 2762} {"train_loss": -12.34890365600586, "global_step": 464177, "epoch": 2762} {"train_loss": -12.714022636413574, "global_step": 464178, "epoch": 2762} {"train_loss": -12.022061347961426, "global_step": 464179, "epoch": 2762} {"train_loss": -12.765793800354004, "global_step": 464180, "epoch": 2762} {"train_loss": -12.370551109313965, "global_step": 464181, "epoch": 2762} {"train_loss": -12.571381568908691, "global_step": 464182, "epoch": 2762} {"train_loss": -12.045130437328702, "global_step": 464183, "epoch": 2762, "val_loss": 316572.0} {"train_loss": -12.345473289489746, "global_step": 464184, "epoch": 2763} {"train_loss": -12.26333999633789, "global_step": 464185, "epoch": 2763} {"train_loss": -12.301807403564453, "global_step": 464186, "epoch": 2763} {"train_loss": -12.226171493530273, "global_step": 464187, "epoch": 2763} {"train_loss": -12.359417915344238, "global_step": 464188, "epoch": 2763} {"train_loss": -12.651898384094238, "global_step": 464189, "epoch": 2763} {"train_loss": -12.475971221923828, "global_step": 464190, "epoch": 2763} {"train_loss": -12.532341003417969, "global_step": 464191, "epoch": 2763} {"train_loss": -12.485306739807129, "global_step": 464192, "epoch": 2763} {"train_loss": -12.347196578979492, "global_step": 464193, "epoch": 2763} {"train_loss": -12.505729675292969, "global_step": 464194, "epoch": 2763} {"train_loss": -12.812540054321289, "global_step": 464195, "epoch": 2763} {"train_loss": -12.546581268310547, "global_step": 464196, "epoch": 2763} {"train_loss": -12.456743240356445, "global_step": 464197, "epoch": 2763} {"train_loss": -12.234010696411133, "global_step": 464198, "epoch": 2763} {"train_loss": -12.469356536865234, "global_step": 464199, "epoch": 2763} {"train_loss": -11.985713958740234, "global_step": 464200, "epoch": 2763} {"train_loss": -12.49237060546875, "global_step": 464201, "epoch": 2763} {"train_loss": -11.567831039428711, "global_step": 464202, "epoch": 2763} {"train_loss": -12.296527862548828, "global_step": 464203, "epoch": 2763} {"train_loss": -11.525324821472168, "global_step": 464204, "epoch": 2763} {"train_loss": -12.521167755126953, "global_step": 464205, "epoch": 2763} {"train_loss": -11.958951950073242, "global_step": 464206, "epoch": 2763} {"train_loss": -11.16710090637207, "global_step": 464207, "epoch": 2763} {"train_loss": -10.691862106323242, "global_step": 464208, "epoch": 2763} {"train_loss": -10.769538879394531, "global_step": 464209, "epoch": 2763} {"train_loss": -12.037954330444336, "global_step": 464210, "epoch": 2763} {"train_loss": -11.389627456665039, "global_step": 464211, "epoch": 2763} {"train_loss": -12.386188507080078, "global_step": 464212, "epoch": 2763} {"train_loss": -10.942461013793945, "global_step": 464213, "epoch": 2763} {"train_loss": -10.950582504272461, "global_step": 464214, "epoch": 2763} {"train_loss": -11.995927810668945, "global_step": 464215, "epoch": 2763} {"train_loss": -10.899298667907715, "global_step": 464216, "epoch": 2763} {"train_loss": -11.954967498779297, "global_step": 464217, "epoch": 2763} {"train_loss": -11.14635181427002, "global_step": 464218, "epoch": 2763} {"train_loss": -11.11935043334961, "global_step": 464219, "epoch": 2763} {"train_loss": -11.514689445495605, "global_step": 464220, "epoch": 2763} {"train_loss": -12.358415603637695, "global_step": 464221, "epoch": 2763} {"train_loss": -11.058249473571777, "global_step": 464222, "epoch": 2763} {"train_loss": -11.678801536560059, "global_step": 464223, "epoch": 2763} {"train_loss": -10.48543930053711, "global_step": 464224, "epoch": 2763} {"train_loss": -11.506319046020508, "global_step": 464225, "epoch": 2763} {"train_loss": -11.78161907196045, "global_step": 464226, "epoch": 2763} {"train_loss": -10.062015533447266, "global_step": 464227, "epoch": 2763} {"train_loss": -12.25551986694336, "global_step": 464228, "epoch": 2763} {"train_loss": -9.936373710632324, "global_step": 464229, "epoch": 2763} {"train_loss": -11.61927604675293, "global_step": 464230, "epoch": 2763} {"train_loss": -10.339519500732422, "global_step": 464231, "epoch": 2763} {"train_loss": -10.520362854003906, "global_step": 464232, "epoch": 2763} {"train_loss": -10.335107803344727, "global_step": 464233, "epoch": 2763} {"train_loss": -10.590360641479492, "global_step": 464234, "epoch": 2763} {"train_loss": -9.687660217285156, "global_step": 464235, "epoch": 2763} {"train_loss": -10.348851203918457, "global_step": 464236, "epoch": 2763} {"train_loss": -11.223051071166992, "global_step": 464237, "epoch": 2763} {"train_loss": -10.923215866088867, "global_step": 464238, "epoch": 2763} {"train_loss": -10.867182731628418, "global_step": 464239, "epoch": 2763} {"train_loss": -11.685047149658203, "global_step": 464240, "epoch": 2763} {"train_loss": -11.21902847290039, "global_step": 464241, "epoch": 2763} {"train_loss": -11.199457168579102, "global_step": 464242, "epoch": 2763} {"train_loss": -10.964162826538086, "global_step": 464243, "epoch": 2763} {"train_loss": -10.953874588012695, "global_step": 464244, "epoch": 2763} {"train_loss": -10.587844848632812, "global_step": 464245, "epoch": 2763} {"train_loss": -11.226905822753906, "global_step": 464246, "epoch": 2763} {"train_loss": -10.850781440734863, "global_step": 464247, "epoch": 2763} {"train_loss": -11.582904815673828, "global_step": 464248, "epoch": 2763} {"train_loss": -10.643213272094727, "global_step": 464249, "epoch": 2763} {"train_loss": -11.635478973388672, "global_step": 464250, "epoch": 2763} {"train_loss": -11.101800918579102, "global_step": 464251, "epoch": 2763} {"train_loss": -10.709970474243164, "global_step": 464252, "epoch": 2763} {"train_loss": -11.019430160522461, "global_step": 464253, "epoch": 2763} {"train_loss": -8.90606689453125, "global_step": 464254, "epoch": 2763} {"train_loss": -10.894050598144531, "global_step": 464255, "epoch": 2763} {"train_loss": -10.689271926879883, "global_step": 464256, "epoch": 2763} {"train_loss": -10.962225914001465, "global_step": 464257, "epoch": 2763} {"train_loss": -10.374780654907227, "global_step": 464258, "epoch": 2763} {"train_loss": -10.777007102966309, "global_step": 464259, "epoch": 2763} {"train_loss": -10.622640609741211, "global_step": 464260, "epoch": 2763} {"train_loss": -11.180322647094727, "global_step": 464261, "epoch": 2763} {"train_loss": -11.450679779052734, "global_step": 464262, "epoch": 2763} {"train_loss": -10.506651878356934, "global_step": 464263, "epoch": 2763} {"train_loss": -11.473176956176758, "global_step": 464264, "epoch": 2763} {"train_loss": -11.006178855895996, "global_step": 464265, "epoch": 2763} {"train_loss": -11.091289520263672, "global_step": 464266, "epoch": 2763} {"train_loss": -11.702195167541504, "global_step": 464267, "epoch": 2763} {"train_loss": -11.629823684692383, "global_step": 464268, "epoch": 2763} {"train_loss": -11.58105754852295, "global_step": 464269, "epoch": 2763} {"train_loss": -11.756340980529785, "global_step": 464270, "epoch": 2763} {"train_loss": -12.057014465332031, "global_step": 464271, "epoch": 2763} {"train_loss": -11.632953643798828, "global_step": 464272, "epoch": 2763} {"train_loss": -12.065898895263672, "global_step": 464273, "epoch": 2763} {"train_loss": -11.558631896972656, "global_step": 464274, "epoch": 2763} {"train_loss": -11.902961730957031, "global_step": 464275, "epoch": 2763} {"train_loss": -12.289369583129883, "global_step": 464276, "epoch": 2763} {"train_loss": -11.804872512817383, "global_step": 464277, "epoch": 2763} {"train_loss": -12.183796882629395, "global_step": 464278, "epoch": 2763} {"train_loss": -12.230521202087402, "global_step": 464279, "epoch": 2763} {"train_loss": -12.37826919555664, "global_step": 464280, "epoch": 2763} {"train_loss": -12.34019660949707, "global_step": 464281, "epoch": 2763} {"train_loss": -12.346136093139648, "global_step": 464282, "epoch": 2763} {"train_loss": -12.290997505187988, "global_step": 464283, "epoch": 2763} {"train_loss": -12.286410331726074, "global_step": 464284, "epoch": 2763} {"train_loss": -12.305182456970215, "global_step": 464285, "epoch": 2763} {"train_loss": -12.219675064086914, "global_step": 464286, "epoch": 2763} {"train_loss": -12.112838745117188, "global_step": 464287, "epoch": 2763} {"train_loss": -12.38930892944336, "global_step": 464288, "epoch": 2763} {"train_loss": -12.595013618469238, "global_step": 464289, "epoch": 2763} {"train_loss": -12.455142974853516, "global_step": 464290, "epoch": 2763} {"train_loss": -12.354442596435547, "global_step": 464291, "epoch": 2763} {"train_loss": -12.357987403869629, "global_step": 464292, "epoch": 2763} {"train_loss": -12.40656852722168, "global_step": 464293, "epoch": 2763} {"train_loss": -12.557563781738281, "global_step": 464294, "epoch": 2763} {"train_loss": -12.610506057739258, "global_step": 464295, "epoch": 2763} {"train_loss": -12.590413093566895, "global_step": 464296, "epoch": 2763} {"train_loss": -12.573314666748047, "global_step": 464297, "epoch": 2763} {"train_loss": -12.625516891479492, "global_step": 464298, "epoch": 2763} {"train_loss": -12.26797103881836, "global_step": 464299, "epoch": 2763} {"train_loss": -12.61856460571289, "global_step": 464300, "epoch": 2763} {"train_loss": -12.489986419677734, "global_step": 464301, "epoch": 2763} {"train_loss": -12.671306610107422, "global_step": 464302, "epoch": 2763} {"train_loss": -12.264440536499023, "global_step": 464303, "epoch": 2763} {"train_loss": -12.623265266418457, "global_step": 464304, "epoch": 2763} {"train_loss": -12.666830062866211, "global_step": 464305, "epoch": 2763} {"train_loss": -12.632782936096191, "global_step": 464306, "epoch": 2763} {"train_loss": -12.530191421508789, "global_step": 464307, "epoch": 2763} {"train_loss": -12.630318641662598, "global_step": 464308, "epoch": 2763} {"train_loss": -12.352304458618164, "global_step": 464309, "epoch": 2763} {"train_loss": -12.74301528930664, "global_step": 464310, "epoch": 2763} {"train_loss": -12.612915992736816, "global_step": 464311, "epoch": 2763} {"train_loss": -12.529853820800781, "global_step": 464312, "epoch": 2763} {"train_loss": -12.760400772094727, "global_step": 464313, "epoch": 2763} {"train_loss": -12.70284652709961, "global_step": 464314, "epoch": 2763} {"train_loss": -12.81030559539795, "global_step": 464315, "epoch": 2763} {"train_loss": -12.643080711364746, "global_step": 464316, "epoch": 2763} {"train_loss": -12.870942115783691, "global_step": 464317, "epoch": 2763} {"train_loss": -12.631595611572266, "global_step": 464318, "epoch": 2763} {"train_loss": -12.529691696166992, "global_step": 464319, "epoch": 2763} {"train_loss": -12.630655288696289, "global_step": 464320, "epoch": 2763} {"train_loss": -12.743741989135742, "global_step": 464321, "epoch": 2763} {"train_loss": -12.659233093261719, "global_step": 464322, "epoch": 2763} {"train_loss": -12.526617050170898, "global_step": 464323, "epoch": 2763} {"train_loss": -12.648595809936523, "global_step": 464324, "epoch": 2763} {"train_loss": -12.625003814697266, "global_step": 464325, "epoch": 2763} {"train_loss": -12.690166473388672, "global_step": 464326, "epoch": 2763} {"train_loss": -12.389060974121094, "global_step": 464327, "epoch": 2763} {"train_loss": -12.753545761108398, "global_step": 464328, "epoch": 2763} {"train_loss": -12.44550895690918, "global_step": 464329, "epoch": 2763} {"train_loss": -12.47836685180664, "global_step": 464330, "epoch": 2763} {"train_loss": -12.534997940063477, "global_step": 464331, "epoch": 2763} {"train_loss": -12.597273826599121, "global_step": 464332, "epoch": 2763} {"train_loss": -12.38562297821045, "global_step": 464333, "epoch": 2763} {"train_loss": -13.052818298339844, "global_step": 464334, "epoch": 2763} {"train_loss": -12.818902969360352, "global_step": 464335, "epoch": 2763} {"train_loss": -12.781692504882812, "global_step": 464336, "epoch": 2763} {"train_loss": -12.662193298339844, "global_step": 464337, "epoch": 2763} {"train_loss": -12.618537902832031, "global_step": 464338, "epoch": 2763} {"train_loss": -12.864986419677734, "global_step": 464339, "epoch": 2763} {"train_loss": -12.754032135009766, "global_step": 464340, "epoch": 2763} {"train_loss": -12.852315902709961, "global_step": 464341, "epoch": 2763} {"train_loss": -12.685087203979492, "global_step": 464342, "epoch": 2763} {"train_loss": -13.018383979797363, "global_step": 464343, "epoch": 2763} {"train_loss": -12.56251335144043, "global_step": 464344, "epoch": 2763} {"train_loss": -12.852731704711914, "global_step": 464345, "epoch": 2763} {"train_loss": -13.089820861816406, "global_step": 464346, "epoch": 2763} {"train_loss": -12.863822937011719, "global_step": 464347, "epoch": 2763} {"train_loss": -12.78170394897461, "global_step": 464348, "epoch": 2763} {"train_loss": -13.005383491516113, "global_step": 464349, "epoch": 2763} {"train_loss": -13.062074661254883, "global_step": 464350, "epoch": 2763} {"train_loss": -11.948027917316981, "global_step": 464351, "epoch": 2763, "val_loss": 317094.6875} {"train_loss": -12.951766967773438, "global_step": 464352, "epoch": 2764} {"train_loss": -13.074064254760742, "global_step": 464353, "epoch": 2764} {"train_loss": -13.05556869506836, "global_step": 464354, "epoch": 2764} {"train_loss": -12.751543998718262, "global_step": 464355, "epoch": 2764} {"train_loss": -13.001291275024414, "global_step": 464356, "epoch": 2764} {"train_loss": -12.950542449951172, "global_step": 464357, "epoch": 2764} {"train_loss": -12.979103088378906, "global_step": 464358, "epoch": 2764} {"train_loss": -12.76226806640625, "global_step": 464359, "epoch": 2764} {"train_loss": -12.662887573242188, "global_step": 464360, "epoch": 2764} {"train_loss": -12.826805114746094, "global_step": 464361, "epoch": 2764} {"train_loss": -12.854076385498047, "global_step": 464362, "epoch": 2764} {"train_loss": -12.34299373626709, "global_step": 464363, "epoch": 2764} {"train_loss": -11.445878982543945, "global_step": 464364, "epoch": 2764} {"train_loss": -12.420044898986816, "global_step": 464365, "epoch": 2764} {"train_loss": -12.2880859375, "global_step": 464366, "epoch": 2764} {"train_loss": -10.81161117553711, "global_step": 464367, "epoch": 2764} {"train_loss": -10.264286994934082, "global_step": 464368, "epoch": 2764} {"train_loss": -10.453746795654297, "global_step": 464369, "epoch": 2764} {"train_loss": -12.124401092529297, "global_step": 464370, "epoch": 2764} {"train_loss": -8.304006576538086, "global_step": 464371, "epoch": 2764} {"train_loss": -8.135590553283691, "global_step": 464372, "epoch": 2764} {"train_loss": -11.336524963378906, "global_step": 464373, "epoch": 2764} {"train_loss": -11.178792953491211, "global_step": 464374, "epoch": 2764} {"train_loss": -8.234949111938477, "global_step": 464375, "epoch": 2764} {"train_loss": -8.059465408325195, "global_step": 464376, "epoch": 2764} {"train_loss": -11.173358917236328, "global_step": 464377, "epoch": 2764} {"train_loss": -9.517152786254883, "global_step": 464378, "epoch": 2764} {"train_loss": -10.740152359008789, "global_step": 464379, "epoch": 2764} {"train_loss": -9.8368558883667, "global_step": 464380, "epoch": 2764} {"train_loss": -8.374641418457031, "global_step": 464381, "epoch": 2764} {"train_loss": -10.005693435668945, "global_step": 464382, "epoch": 2764} {"train_loss": -10.242198944091797, "global_step": 464383, "epoch": 2764} {"train_loss": -9.472774505615234, "global_step": 464384, "epoch": 2764} {"train_loss": -9.824605941772461, "global_step": 464385, "epoch": 2764} {"train_loss": -10.288862228393555, "global_step": 464386, "epoch": 2764} {"train_loss": -10.084430694580078, "global_step": 464387, "epoch": 2764} {"train_loss": -10.736970901489258, "global_step": 464388, "epoch": 2764} {"train_loss": -11.605559349060059, "global_step": 464389, "epoch": 2764} {"train_loss": -9.866069793701172, "global_step": 464390, "epoch": 2764} {"train_loss": -10.956441879272461, "global_step": 464391, "epoch": 2764} {"train_loss": -9.379645347595215, "global_step": 464392, "epoch": 2764} {"train_loss": -9.22903823852539, "global_step": 464393, "epoch": 2764} {"train_loss": -10.775619506835938, "global_step": 464394, "epoch": 2764} {"train_loss": -11.11933708190918, "global_step": 464395, "epoch": 2764} {"train_loss": -10.867692947387695, "global_step": 464396, "epoch": 2764} {"train_loss": -11.66943359375, "global_step": 464397, "epoch": 2764} {"train_loss": -11.129915237426758, "global_step": 464398, "epoch": 2764} {"train_loss": -11.703652381896973, "global_step": 464399, "epoch": 2764} {"train_loss": -11.353805541992188, "global_step": 464400, "epoch": 2764} {"train_loss": -11.47741413116455, "global_step": 464401, "epoch": 2764} {"train_loss": -12.20963191986084, "global_step": 464402, "epoch": 2764} {"train_loss": -11.669585227966309, "global_step": 464403, "epoch": 2764} {"train_loss": -11.713455200195312, "global_step": 464404, "epoch": 2764} {"train_loss": -11.960800170898438, "global_step": 464405, "epoch": 2764} {"train_loss": -11.464433670043945, "global_step": 464406, "epoch": 2764} {"train_loss": -11.873231887817383, "global_step": 464407, "epoch": 2764} {"train_loss": -11.937613487243652, "global_step": 464408, "epoch": 2764} {"train_loss": -11.784515380859375, "global_step": 464409, "epoch": 2764} {"train_loss": -12.587434768676758, "global_step": 464410, "epoch": 2764} {"train_loss": -12.082101821899414, "global_step": 464411, "epoch": 2764} {"train_loss": -12.427865028381348, "global_step": 464412, "epoch": 2764} {"train_loss": -12.380823135375977, "global_step": 464413, "epoch": 2764} {"train_loss": -11.839649200439453, "global_step": 464414, "epoch": 2764} {"train_loss": -12.3206787109375, "global_step": 464415, "epoch": 2764} {"train_loss": -12.060026168823242, "global_step": 464416, "epoch": 2764} {"train_loss": -12.41884994506836, "global_step": 464417, "epoch": 2764} {"train_loss": -12.283246994018555, "global_step": 464418, "epoch": 2764} {"train_loss": -12.158166885375977, "global_step": 464419, "epoch": 2764} {"train_loss": -12.369077682495117, "global_step": 464420, "epoch": 2764} {"train_loss": -12.13476848602295, "global_step": 464421, "epoch": 2764} {"train_loss": -12.352082252502441, "global_step": 464422, "epoch": 2764} {"train_loss": -12.406920433044434, "global_step": 464423, "epoch": 2764} {"train_loss": -12.288534164428711, "global_step": 464424, "epoch": 2764} {"train_loss": -12.261405944824219, "global_step": 464425, "epoch": 2764} {"train_loss": -12.177745819091797, "global_step": 464426, "epoch": 2764} {"train_loss": -12.147342681884766, "global_step": 464427, "epoch": 2764} {"train_loss": -12.540620803833008, "global_step": 464428, "epoch": 2764} {"train_loss": -12.282661437988281, "global_step": 464429, "epoch": 2764} {"train_loss": -12.524310111999512, "global_step": 464430, "epoch": 2764} {"train_loss": -12.233123779296875, "global_step": 464431, "epoch": 2764} {"train_loss": -12.188968658447266, "global_step": 464432, "epoch": 2764} {"train_loss": -12.083620071411133, "global_step": 464433, "epoch": 2764} {"train_loss": -12.47694206237793, "global_step": 464434, "epoch": 2764} {"train_loss": -12.644521713256836, "global_step": 464435, "epoch": 2764} {"train_loss": -12.514198303222656, "global_step": 464436, "epoch": 2764} {"train_loss": -12.353801727294922, "global_step": 464437, "epoch": 2764} {"train_loss": -12.387897491455078, "global_step": 464438, "epoch": 2764} {"train_loss": -12.521461486816406, "global_step": 464439, "epoch": 2764} {"train_loss": -12.686456680297852, "global_step": 464440, "epoch": 2764} {"train_loss": -12.331733703613281, "global_step": 464441, "epoch": 2764} {"train_loss": -12.421483039855957, "global_step": 464442, "epoch": 2764} {"train_loss": -12.686649322509766, "global_step": 464443, "epoch": 2764} {"train_loss": -12.14842414855957, "global_step": 464444, "epoch": 2764} {"train_loss": -12.518930435180664, "global_step": 464445, "epoch": 2764} {"train_loss": -12.2188720703125, "global_step": 464446, "epoch": 2764} {"train_loss": -12.602214813232422, "global_step": 464447, "epoch": 2764} {"train_loss": -12.59876537322998, "global_step": 464448, "epoch": 2764} {"train_loss": -12.691354751586914, "global_step": 464449, "epoch": 2764} {"train_loss": -12.631673812866211, "global_step": 464450, "epoch": 2764} {"train_loss": -12.193244934082031, "global_step": 464451, "epoch": 2764} {"train_loss": -12.297172546386719, "global_step": 464452, "epoch": 2764} {"train_loss": -12.684085845947266, "global_step": 464453, "epoch": 2764} {"train_loss": -12.39434814453125, "global_step": 464454, "epoch": 2764} {"train_loss": -12.722627639770508, "global_step": 464455, "epoch": 2764} {"train_loss": -12.72055435180664, "global_step": 464456, "epoch": 2764} {"train_loss": -12.531000137329102, "global_step": 464457, "epoch": 2764} {"train_loss": -12.730502128601074, "global_step": 464458, "epoch": 2764} {"train_loss": -12.68237590789795, "global_step": 464459, "epoch": 2764} {"train_loss": -12.563358306884766, "global_step": 464460, "epoch": 2764} {"train_loss": -12.573324203491211, "global_step": 464461, "epoch": 2764} {"train_loss": -12.565918922424316, "global_step": 464462, "epoch": 2764} {"train_loss": -12.265605926513672, "global_step": 464463, "epoch": 2764} {"train_loss": -12.607704162597656, "global_step": 464464, "epoch": 2764} {"train_loss": -12.440075874328613, "global_step": 464465, "epoch": 2764} {"train_loss": -12.739032745361328, "global_step": 464466, "epoch": 2764} {"train_loss": -12.620874404907227, "global_step": 464467, "epoch": 2764} {"train_loss": -12.759719848632812, "global_step": 464468, "epoch": 2764} {"train_loss": -12.477273941040039, "global_step": 464469, "epoch": 2764} {"train_loss": -12.323163032531738, "global_step": 464470, "epoch": 2764} {"train_loss": -12.559146881103516, "global_step": 464471, "epoch": 2764} {"train_loss": -12.835123062133789, "global_step": 464472, "epoch": 2764} {"train_loss": -12.798593521118164, "global_step": 464473, "epoch": 2764} {"train_loss": -12.45832347869873, "global_step": 464474, "epoch": 2764} {"train_loss": -12.735827445983887, "global_step": 464475, "epoch": 2764} {"train_loss": -12.535237312316895, "global_step": 464476, "epoch": 2764} {"train_loss": -12.688234329223633, "global_step": 464477, "epoch": 2764} {"train_loss": -12.709640502929688, "global_step": 464478, "epoch": 2764} {"train_loss": -12.590136528015137, "global_step": 464479, "epoch": 2764} {"train_loss": -12.58994197845459, "global_step": 464480, "epoch": 2764} {"train_loss": -12.482423782348633, "global_step": 464481, "epoch": 2764} {"train_loss": -12.347701072692871, "global_step": 464482, "epoch": 2764} {"train_loss": -12.31830883026123, "global_step": 464483, "epoch": 2764} {"train_loss": -12.10421371459961, "global_step": 464484, "epoch": 2764} {"train_loss": -12.022607803344727, "global_step": 464485, "epoch": 2764} {"train_loss": -12.841737747192383, "global_step": 464486, "epoch": 2764} {"train_loss": -12.32514476776123, "global_step": 464487, "epoch": 2764} {"train_loss": -12.728226661682129, "global_step": 464488, "epoch": 2764} {"train_loss": -12.476727485656738, "global_step": 464489, "epoch": 2764} {"train_loss": -11.979145050048828, "global_step": 464490, "epoch": 2764} {"train_loss": -12.535015106201172, "global_step": 464491, "epoch": 2764} {"train_loss": -11.961553573608398, "global_step": 464492, "epoch": 2764} {"train_loss": -12.856271743774414, "global_step": 464493, "epoch": 2764} {"train_loss": -12.510775566101074, "global_step": 464494, "epoch": 2764} {"train_loss": -12.158477783203125, "global_step": 464495, "epoch": 2764} {"train_loss": -12.854323387145996, "global_step": 464496, "epoch": 2764} {"train_loss": -12.681421279907227, "global_step": 464497, "epoch": 2764} {"train_loss": -12.859915733337402, "global_step": 464498, "epoch": 2764} {"train_loss": -12.804252624511719, "global_step": 464499, "epoch": 2764} {"train_loss": -12.590288162231445, "global_step": 464500, "epoch": 2764} {"train_loss": -12.84758186340332, "global_step": 464501, "epoch": 2764} {"train_loss": -12.752378463745117, "global_step": 464502, "epoch": 2764} {"train_loss": -12.317418098449707, "global_step": 464503, "epoch": 2764} {"train_loss": -12.80942153930664, "global_step": 464504, "epoch": 2764} {"train_loss": -12.620107650756836, "global_step": 464505, "epoch": 2764} {"train_loss": -12.81296443939209, "global_step": 464506, "epoch": 2764} {"train_loss": -12.569048881530762, "global_step": 464507, "epoch": 2764} {"train_loss": -12.742682456970215, "global_step": 464508, "epoch": 2764} {"train_loss": -12.888204574584961, "global_step": 464509, "epoch": 2764} {"train_loss": -12.700639724731445, "global_step": 464510, "epoch": 2764} {"train_loss": -12.37198543548584, "global_step": 464511, "epoch": 2764} {"train_loss": -12.787137031555176, "global_step": 464512, "epoch": 2764} {"train_loss": -12.589509963989258, "global_step": 464513, "epoch": 2764} {"train_loss": -12.744346618652344, "global_step": 464514, "epoch": 2764} {"train_loss": -12.930513381958008, "global_step": 464515, "epoch": 2764} {"train_loss": -12.806020736694336, "global_step": 464516, "epoch": 2764} {"train_loss": -12.574092864990234, "global_step": 464517, "epoch": 2764} {"train_loss": -12.466375350952148, "global_step": 464518, "epoch": 2764} {"train_loss": -12.023160281635466, "global_step": 464519, "epoch": 2764, "val_loss": 314480.40625} {"train_loss": -12.748451232910156, "global_step": 464520, "epoch": 2765} {"train_loss": -12.950784683227539, "global_step": 464521, "epoch": 2765} {"train_loss": -12.661970138549805, "global_step": 464522, "epoch": 2765} {"train_loss": -12.44804573059082, "global_step": 464523, "epoch": 2765} {"train_loss": -11.425578117370605, "global_step": 464524, "epoch": 2765} {"train_loss": -12.727519989013672, "global_step": 464525, "epoch": 2765} {"train_loss": -12.651371955871582, "global_step": 464526, "epoch": 2765} {"train_loss": -12.288695335388184, "global_step": 464527, "epoch": 2765} {"train_loss": -11.581197738647461, "global_step": 464528, "epoch": 2765} {"train_loss": -11.3392333984375, "global_step": 464529, "epoch": 2765} {"train_loss": -11.660504341125488, "global_step": 464530, "epoch": 2765} {"train_loss": -11.536221504211426, "global_step": 464531, "epoch": 2765} {"train_loss": -11.29011058807373, "global_step": 464532, "epoch": 2765} {"train_loss": -11.671794891357422, "global_step": 464533, "epoch": 2765} {"train_loss": -12.473724365234375, "global_step": 464534, "epoch": 2765} {"train_loss": -12.243886947631836, "global_step": 464535, "epoch": 2765} {"train_loss": -12.318586349487305, "global_step": 464536, "epoch": 2765} {"train_loss": -12.063023567199707, "global_step": 464537, "epoch": 2765} {"train_loss": -12.269233703613281, "global_step": 464538, "epoch": 2765} {"train_loss": -12.311235427856445, "global_step": 464539, "epoch": 2765} {"train_loss": -12.648200035095215, "global_step": 464540, "epoch": 2765} {"train_loss": -11.881889343261719, "global_step": 464541, "epoch": 2765} {"train_loss": -11.929330825805664, "global_step": 464542, "epoch": 2765} {"train_loss": -12.061260223388672, "global_step": 464543, "epoch": 2765} {"train_loss": -11.903448104858398, "global_step": 464544, "epoch": 2765} {"train_loss": -11.79029369354248, "global_step": 464545, "epoch": 2765} {"train_loss": -11.773685455322266, "global_step": 464546, "epoch": 2765} {"train_loss": -12.332819938659668, "global_step": 464547, "epoch": 2765} {"train_loss": -12.185868263244629, "global_step": 464548, "epoch": 2765} {"train_loss": -12.083154678344727, "global_step": 464549, "epoch": 2765} {"train_loss": -12.130449295043945, "global_step": 464550, "epoch": 2765} {"train_loss": -11.395589828491211, "global_step": 464551, "epoch": 2765} {"train_loss": -11.790486335754395, "global_step": 464552, "epoch": 2765} {"train_loss": -12.359833717346191, "global_step": 464553, "epoch": 2765} {"train_loss": -11.707260131835938, "global_step": 464554, "epoch": 2765} {"train_loss": -12.49521255493164, "global_step": 464555, "epoch": 2765} {"train_loss": -11.339311599731445, "global_step": 464556, "epoch": 2765} {"train_loss": -12.653450012207031, "global_step": 464557, "epoch": 2765} {"train_loss": -11.212691307067871, "global_step": 464558, "epoch": 2765} {"train_loss": -12.184475898742676, "global_step": 464559, "epoch": 2765} {"train_loss": -11.897658348083496, "global_step": 464560, "epoch": 2765} {"train_loss": -12.184133529663086, "global_step": 464561, "epoch": 2765} {"train_loss": -11.936666488647461, "global_step": 464562, "epoch": 2765} {"train_loss": -12.183135032653809, "global_step": 464563, "epoch": 2765} {"train_loss": -11.532785415649414, "global_step": 464564, "epoch": 2765} {"train_loss": -12.216987609863281, "global_step": 464565, "epoch": 2765} {"train_loss": -11.341175079345703, "global_step": 464566, "epoch": 2765} {"train_loss": -12.260467529296875, "global_step": 464567, "epoch": 2765} {"train_loss": -11.736797332763672, "global_step": 464568, "epoch": 2765} {"train_loss": -12.410137176513672, "global_step": 464569, "epoch": 2765} {"train_loss": -11.960042953491211, "global_step": 464570, "epoch": 2765} {"train_loss": -12.536093711853027, "global_step": 464571, "epoch": 2765} {"train_loss": -11.916475296020508, "global_step": 464572, "epoch": 2765} {"train_loss": -12.405794143676758, "global_step": 464573, "epoch": 2765} {"train_loss": -12.348523139953613, "global_step": 464574, "epoch": 2765} {"train_loss": -12.661762237548828, "global_step": 464575, "epoch": 2765} {"train_loss": -12.340498924255371, "global_step": 464576, "epoch": 2765} {"train_loss": -12.22892951965332, "global_step": 464577, "epoch": 2765} {"train_loss": -12.170805931091309, "global_step": 464578, "epoch": 2765} {"train_loss": -12.247357368469238, "global_step": 464579, "epoch": 2765} {"train_loss": -12.333471298217773, "global_step": 464580, "epoch": 2765} {"train_loss": -12.322102546691895, "global_step": 464581, "epoch": 2765} {"train_loss": -11.955442428588867, "global_step": 464582, "epoch": 2765} {"train_loss": -12.284971237182617, "global_step": 464583, "epoch": 2765} {"train_loss": -11.915336608886719, "global_step": 464584, "epoch": 2765} {"train_loss": -12.355660438537598, "global_step": 464585, "epoch": 2765} {"train_loss": -11.80184555053711, "global_step": 464586, "epoch": 2765} {"train_loss": -11.904727935791016, "global_step": 464587, "epoch": 2765} {"train_loss": -12.313310623168945, "global_step": 464588, "epoch": 2765} {"train_loss": -12.00816535949707, "global_step": 464589, "epoch": 2765} {"train_loss": -12.577035903930664, "global_step": 464590, "epoch": 2765} {"train_loss": -12.20430850982666, "global_step": 464591, "epoch": 2765} {"train_loss": -12.457963943481445, "global_step": 464592, "epoch": 2765} {"train_loss": -12.223569869995117, "global_step": 464593, "epoch": 2765} {"train_loss": -12.126301765441895, "global_step": 464594, "epoch": 2765} {"train_loss": -12.397323608398438, "global_step": 464595, "epoch": 2765} {"train_loss": -11.887016296386719, "global_step": 464596, "epoch": 2765} {"train_loss": -12.445792198181152, "global_step": 464597, "epoch": 2765} {"train_loss": -12.260189056396484, "global_step": 464598, "epoch": 2765} {"train_loss": -12.449780464172363, "global_step": 464599, "epoch": 2765} {"train_loss": -11.622328758239746, "global_step": 464600, "epoch": 2765} {"train_loss": -12.642626762390137, "global_step": 464601, "epoch": 2765} {"train_loss": -12.017141342163086, "global_step": 464602, "epoch": 2765} {"train_loss": -12.24240779876709, "global_step": 464603, "epoch": 2765} {"train_loss": -11.856834411621094, "global_step": 464604, "epoch": 2765} {"train_loss": -11.914955139160156, "global_step": 464605, "epoch": 2765} {"train_loss": -12.053519248962402, "global_step": 464606, "epoch": 2765} {"train_loss": -12.067641258239746, "global_step": 464607, "epoch": 2765} {"train_loss": -12.477669715881348, "global_step": 464608, "epoch": 2765} {"train_loss": -12.047768592834473, "global_step": 464609, "epoch": 2765} {"train_loss": -12.328978538513184, "global_step": 464610, "epoch": 2765} {"train_loss": -12.25638198852539, "global_step": 464611, "epoch": 2765} {"train_loss": -12.296356201171875, "global_step": 464612, "epoch": 2765} {"train_loss": -12.101813316345215, "global_step": 464613, "epoch": 2765} {"train_loss": -12.462645530700684, "global_step": 464614, "epoch": 2765} {"train_loss": -12.19107437133789, "global_step": 464615, "epoch": 2765} {"train_loss": -11.957284927368164, "global_step": 464616, "epoch": 2765} {"train_loss": -12.162948608398438, "global_step": 464617, "epoch": 2765} {"train_loss": -11.434120178222656, "global_step": 464618, "epoch": 2765} {"train_loss": -12.286883354187012, "global_step": 464619, "epoch": 2765} {"train_loss": -11.505725860595703, "global_step": 464620, "epoch": 2765} {"train_loss": -12.366640090942383, "global_step": 464621, "epoch": 2765} {"train_loss": -11.875452995300293, "global_step": 464622, "epoch": 2765} {"train_loss": -11.883121490478516, "global_step": 464623, "epoch": 2765} {"train_loss": -12.130504608154297, "global_step": 464624, "epoch": 2765} {"train_loss": -11.310308456420898, "global_step": 464625, "epoch": 2765} {"train_loss": -11.901604652404785, "global_step": 464626, "epoch": 2765} {"train_loss": -11.134435653686523, "global_step": 464627, "epoch": 2765} {"train_loss": -11.815010070800781, "global_step": 464628, "epoch": 2765} {"train_loss": -11.498292922973633, "global_step": 464629, "epoch": 2765} {"train_loss": -11.740869522094727, "global_step": 464630, "epoch": 2765} {"train_loss": -10.979771614074707, "global_step": 464631, "epoch": 2765} {"train_loss": -12.031893730163574, "global_step": 464632, "epoch": 2765} {"train_loss": -11.69482707977295, "global_step": 464633, "epoch": 2765} {"train_loss": -11.899887084960938, "global_step": 464634, "epoch": 2765} {"train_loss": -12.222169876098633, "global_step": 464635, "epoch": 2765} {"train_loss": -11.729034423828125, "global_step": 464636, "epoch": 2765} {"train_loss": -12.200361251831055, "global_step": 464637, "epoch": 2765} {"train_loss": -11.931480407714844, "global_step": 464638, "epoch": 2765} {"train_loss": -12.111156463623047, "global_step": 464639, "epoch": 2765} {"train_loss": -12.114063262939453, "global_step": 464640, "epoch": 2765} {"train_loss": -11.953893661499023, "global_step": 464641, "epoch": 2765} {"train_loss": -12.302511215209961, "global_step": 464642, "epoch": 2765} {"train_loss": -12.267581939697266, "global_step": 464643, "epoch": 2765} {"train_loss": -12.219526290893555, "global_step": 464644, "epoch": 2765} {"train_loss": -12.247289657592773, "global_step": 464645, "epoch": 2765} {"train_loss": -11.984797477722168, "global_step": 464646, "epoch": 2765} {"train_loss": -12.54464054107666, "global_step": 464647, "epoch": 2765} {"train_loss": -11.847434997558594, "global_step": 464648, "epoch": 2765} {"train_loss": -12.185449600219727, "global_step": 464649, "epoch": 2765} {"train_loss": -11.853252410888672, "global_step": 464650, "epoch": 2765} {"train_loss": -12.38814640045166, "global_step": 464651, "epoch": 2765} {"train_loss": -12.208938598632812, "global_step": 464652, "epoch": 2765} {"train_loss": -12.22713851928711, "global_step": 464653, "epoch": 2765} {"train_loss": -12.515880584716797, "global_step": 464654, "epoch": 2765} {"train_loss": -11.837547302246094, "global_step": 464655, "epoch": 2765} {"train_loss": -12.546483993530273, "global_step": 464656, "epoch": 2765} {"train_loss": -12.34302043914795, "global_step": 464657, "epoch": 2765} {"train_loss": -12.254676818847656, "global_step": 464658, "epoch": 2765} {"train_loss": -12.542396545410156, "global_step": 464659, "epoch": 2765} {"train_loss": -12.344076156616211, "global_step": 464660, "epoch": 2765} {"train_loss": -12.147724151611328, "global_step": 464661, "epoch": 2765} {"train_loss": -12.167783737182617, "global_step": 464662, "epoch": 2765} {"train_loss": -11.728195190429688, "global_step": 464663, "epoch": 2765} {"train_loss": -12.604120254516602, "global_step": 464664, "epoch": 2765} {"train_loss": -12.257556915283203, "global_step": 464665, "epoch": 2765} {"train_loss": -12.444357872009277, "global_step": 464666, "epoch": 2765} {"train_loss": -12.74746322631836, "global_step": 464667, "epoch": 2765} {"train_loss": -12.50921630859375, "global_step": 464668, "epoch": 2765} {"train_loss": -12.569873809814453, "global_step": 464669, "epoch": 2765} {"train_loss": -12.462109565734863, "global_step": 464670, "epoch": 2765} {"train_loss": -12.52781867980957, "global_step": 464671, "epoch": 2765} {"train_loss": -12.863870620727539, "global_step": 464672, "epoch": 2765} {"train_loss": -12.687484741210938, "global_step": 464673, "epoch": 2765} {"train_loss": -12.538389205932617, "global_step": 464674, "epoch": 2765} {"train_loss": -12.696730613708496, "global_step": 464675, "epoch": 2765} {"train_loss": -12.643634796142578, "global_step": 464676, "epoch": 2765} {"train_loss": -12.541749000549316, "global_step": 464677, "epoch": 2765} {"train_loss": -12.848470687866211, "global_step": 464678, "epoch": 2765} {"train_loss": -12.69660758972168, "global_step": 464679, "epoch": 2765} {"train_loss": -12.632521629333496, "global_step": 464680, "epoch": 2765} {"train_loss": -12.599237442016602, "global_step": 464681, "epoch": 2765} {"train_loss": -12.506691932678223, "global_step": 464682, "epoch": 2765} {"train_loss": -12.66836929321289, "global_step": 464683, "epoch": 2765} {"train_loss": -12.544866561889648, "global_step": 464684, "epoch": 2765} {"train_loss": -12.753912925720215, "global_step": 464685, "epoch": 2765} {"train_loss": -11.658533096313477, "global_step": 464686, "epoch": 2765} {"train_loss": -12.151213980856395, "global_step": 464687, "epoch": 2765, "val_loss": 317126.09375, "train_action_mse_error": 1.4734963178634644} {"train_loss": -12.584457397460938, "global_step": 464688, "epoch": 2766} {"train_loss": -12.263195037841797, "global_step": 464689, "epoch": 2766} {"train_loss": -12.154243469238281, "global_step": 464690, "epoch": 2766} {"train_loss": -12.726423263549805, "global_step": 464691, "epoch": 2766} {"train_loss": -12.279729843139648, "global_step": 464692, "epoch": 2766} {"train_loss": -11.65566635131836, "global_step": 464693, "epoch": 2766} {"train_loss": -12.601036071777344, "global_step": 464694, "epoch": 2766} {"train_loss": -11.934288024902344, "global_step": 464695, "epoch": 2766} {"train_loss": -11.185696601867676, "global_step": 464696, "epoch": 2766} {"train_loss": -12.569456100463867, "global_step": 464697, "epoch": 2766} {"train_loss": -10.741771697998047, "global_step": 464698, "epoch": 2766} {"train_loss": -11.50282096862793, "global_step": 464699, "epoch": 2766} {"train_loss": -11.722269058227539, "global_step": 464700, "epoch": 2766} {"train_loss": -10.198287963867188, "global_step": 464701, "epoch": 2766} {"train_loss": -11.013669967651367, "global_step": 464702, "epoch": 2766} {"train_loss": -11.66110897064209, "global_step": 464703, "epoch": 2766} {"train_loss": -10.655081748962402, "global_step": 464704, "epoch": 2766} {"train_loss": -9.585565567016602, "global_step": 464705, "epoch": 2766} {"train_loss": -10.917959213256836, "global_step": 464706, "epoch": 2766} {"train_loss": -10.87729263305664, "global_step": 464707, "epoch": 2766} {"train_loss": -10.953144073486328, "global_step": 464708, "epoch": 2766} {"train_loss": -10.569849967956543, "global_step": 464709, "epoch": 2766} {"train_loss": -11.705589294433594, "global_step": 464710, "epoch": 2766} {"train_loss": -10.896292686462402, "global_step": 464711, "epoch": 2766} {"train_loss": -10.92105484008789, "global_step": 464712, "epoch": 2766} {"train_loss": -10.603189468383789, "global_step": 464713, "epoch": 2766} {"train_loss": -10.67880630493164, "global_step": 464714, "epoch": 2766} {"train_loss": -11.126492500305176, "global_step": 464715, "epoch": 2766} {"train_loss": -10.541524887084961, "global_step": 464716, "epoch": 2766} {"train_loss": -11.130428314208984, "global_step": 464717, "epoch": 2766} {"train_loss": -11.658219337463379, "global_step": 464718, "epoch": 2766} {"train_loss": -10.7656888961792, "global_step": 464719, "epoch": 2766} {"train_loss": -11.059354782104492, "global_step": 464720, "epoch": 2766} {"train_loss": -10.758462905883789, "global_step": 464721, "epoch": 2766} {"train_loss": -11.8875732421875, "global_step": 464722, "epoch": 2766} {"train_loss": -11.705511093139648, "global_step": 464723, "epoch": 2766} {"train_loss": -11.549666404724121, "global_step": 464724, "epoch": 2766} {"train_loss": -11.293939590454102, "global_step": 464725, "epoch": 2766} {"train_loss": -12.042036056518555, "global_step": 464726, "epoch": 2766} {"train_loss": -11.21354866027832, "global_step": 464727, "epoch": 2766} {"train_loss": -11.699827194213867, "global_step": 464728, "epoch": 2766} {"train_loss": -11.760108947753906, "global_step": 464729, "epoch": 2766} {"train_loss": -11.979119300842285, "global_step": 464730, "epoch": 2766} {"train_loss": -11.73355484008789, "global_step": 464731, "epoch": 2766} {"train_loss": -11.803332328796387, "global_step": 464732, "epoch": 2766} {"train_loss": -12.195473670959473, "global_step": 464733, "epoch": 2766} {"train_loss": -11.7694730758667, "global_step": 464734, "epoch": 2766} {"train_loss": -12.049521446228027, "global_step": 464735, "epoch": 2766} {"train_loss": -11.764554023742676, "global_step": 464736, "epoch": 2766} {"train_loss": -11.802153587341309, "global_step": 464737, "epoch": 2766} {"train_loss": -11.62451457977295, "global_step": 464738, "epoch": 2766} {"train_loss": -11.905539512634277, "global_step": 464739, "epoch": 2766} {"train_loss": -11.51085090637207, "global_step": 464740, "epoch": 2766} {"train_loss": -12.427379608154297, "global_step": 464741, "epoch": 2766} {"train_loss": -11.486413955688477, "global_step": 464742, "epoch": 2766} {"train_loss": -12.108391761779785, "global_step": 464743, "epoch": 2766} {"train_loss": -11.883453369140625, "global_step": 464744, "epoch": 2766} {"train_loss": -12.024938583374023, "global_step": 464745, "epoch": 2766} {"train_loss": -12.173851013183594, "global_step": 464746, "epoch": 2766} {"train_loss": -11.993011474609375, "global_step": 464747, "epoch": 2766} {"train_loss": -12.15378189086914, "global_step": 464748, "epoch": 2766} {"train_loss": -11.794015884399414, "global_step": 464749, "epoch": 2766} {"train_loss": -11.716148376464844, "global_step": 464750, "epoch": 2766} {"train_loss": -12.138800621032715, "global_step": 464751, "epoch": 2766} {"train_loss": -11.69488525390625, "global_step": 464752, "epoch": 2766} {"train_loss": -12.303024291992188, "global_step": 464753, "epoch": 2766} {"train_loss": -11.795327186584473, "global_step": 464754, "epoch": 2766} {"train_loss": -12.420563697814941, "global_step": 464755, "epoch": 2766} {"train_loss": -11.954229354858398, "global_step": 464756, "epoch": 2766} {"train_loss": -12.448026657104492, "global_step": 464757, "epoch": 2766} {"train_loss": -12.278905868530273, "global_step": 464758, "epoch": 2766} {"train_loss": -12.319595336914062, "global_step": 464759, "epoch": 2766} {"train_loss": -11.792535781860352, "global_step": 464760, "epoch": 2766} {"train_loss": -12.106269836425781, "global_step": 464761, "epoch": 2766} {"train_loss": -12.192422866821289, "global_step": 464762, "epoch": 2766} {"train_loss": -12.267942428588867, "global_step": 464763, "epoch": 2766} {"train_loss": -12.30887508392334, "global_step": 464764, "epoch": 2766} {"train_loss": -12.251502990722656, "global_step": 464765, "epoch": 2766} {"train_loss": -12.342195510864258, "global_step": 464766, "epoch": 2766} {"train_loss": -11.788780212402344, "global_step": 464767, "epoch": 2766} {"train_loss": -12.444724082946777, "global_step": 464768, "epoch": 2766} {"train_loss": -11.80183219909668, "global_step": 464769, "epoch": 2766} {"train_loss": -12.210018157958984, "global_step": 464770, "epoch": 2766} {"train_loss": -12.111469268798828, "global_step": 464771, "epoch": 2766} {"train_loss": -12.341207504272461, "global_step": 464772, "epoch": 2766} {"train_loss": -12.114252090454102, "global_step": 464773, "epoch": 2766} {"train_loss": -12.416718482971191, "global_step": 464774, "epoch": 2766} {"train_loss": -12.146347045898438, "global_step": 464775, "epoch": 2766} {"train_loss": -12.251859664916992, "global_step": 464776, "epoch": 2766} {"train_loss": -11.878961563110352, "global_step": 464777, "epoch": 2766} {"train_loss": -12.21216106414795, "global_step": 464778, "epoch": 2766} {"train_loss": -11.686187744140625, "global_step": 464779, "epoch": 2766} {"train_loss": -12.01524829864502, "global_step": 464780, "epoch": 2766} {"train_loss": -11.797607421875, "global_step": 464781, "epoch": 2766} {"train_loss": -12.031638145446777, "global_step": 464782, "epoch": 2766} {"train_loss": -12.441783905029297, "global_step": 464783, "epoch": 2766} {"train_loss": -11.706193923950195, "global_step": 464784, "epoch": 2766} {"train_loss": -12.489387512207031, "global_step": 464785, "epoch": 2766} {"train_loss": -11.805883407592773, "global_step": 464786, "epoch": 2766} {"train_loss": -12.4260892868042, "global_step": 464787, "epoch": 2766} {"train_loss": -11.960948944091797, "global_step": 464788, "epoch": 2766} {"train_loss": -12.293523788452148, "global_step": 464789, "epoch": 2766} {"train_loss": -11.864702224731445, "global_step": 464790, "epoch": 2766} {"train_loss": -12.14328384399414, "global_step": 464791, "epoch": 2766} {"train_loss": -12.307672500610352, "global_step": 464792, "epoch": 2766} {"train_loss": -12.087677001953125, "global_step": 464793, "epoch": 2766} {"train_loss": -12.320891380310059, "global_step": 464794, "epoch": 2766} {"train_loss": -11.7041015625, "global_step": 464795, "epoch": 2766} {"train_loss": -12.285404205322266, "global_step": 464796, "epoch": 2766} {"train_loss": -12.499202728271484, "global_step": 464797, "epoch": 2766} {"train_loss": -12.26412296295166, "global_step": 464798, "epoch": 2766} {"train_loss": -12.323419570922852, "global_step": 464799, "epoch": 2766} {"train_loss": -12.383488655090332, "global_step": 464800, "epoch": 2766} {"train_loss": -12.490752220153809, "global_step": 464801, "epoch": 2766} {"train_loss": -12.512235641479492, "global_step": 464802, "epoch": 2766} {"train_loss": -12.341180801391602, "global_step": 464803, "epoch": 2766} {"train_loss": -12.545899391174316, "global_step": 464804, "epoch": 2766} {"train_loss": -12.642523765563965, "global_step": 464805, "epoch": 2766} {"train_loss": -12.66170597076416, "global_step": 464806, "epoch": 2766} {"train_loss": -12.545013427734375, "global_step": 464807, "epoch": 2766} {"train_loss": -12.654317855834961, "global_step": 464808, "epoch": 2766} {"train_loss": -12.570011138916016, "global_step": 464809, "epoch": 2766} {"train_loss": -12.776420593261719, "global_step": 464810, "epoch": 2766} {"train_loss": -12.665968894958496, "global_step": 464811, "epoch": 2766} {"train_loss": -12.702695846557617, "global_step": 464812, "epoch": 2766} {"train_loss": -12.801898002624512, "global_step": 464813, "epoch": 2766} {"train_loss": -12.627016067504883, "global_step": 464814, "epoch": 2766} {"train_loss": -12.757984161376953, "global_step": 464815, "epoch": 2766} {"train_loss": -12.798774719238281, "global_step": 464816, "epoch": 2766} {"train_loss": -12.75198745727539, "global_step": 464817, "epoch": 2766} {"train_loss": -12.757814407348633, "global_step": 464818, "epoch": 2766} {"train_loss": -12.429398536682129, "global_step": 464819, "epoch": 2766} {"train_loss": -12.91400146484375, "global_step": 464820, "epoch": 2766} {"train_loss": -12.470085144042969, "global_step": 464821, "epoch": 2766} {"train_loss": -12.69662857055664, "global_step": 464822, "epoch": 2766} {"train_loss": -12.988393783569336, "global_step": 464823, "epoch": 2766} {"train_loss": -12.521978378295898, "global_step": 464824, "epoch": 2766} {"train_loss": -12.788713455200195, "global_step": 464825, "epoch": 2766} {"train_loss": -12.684038162231445, "global_step": 464826, "epoch": 2766} {"train_loss": -12.663047790527344, "global_step": 464827, "epoch": 2766} {"train_loss": -12.793281555175781, "global_step": 464828, "epoch": 2766} {"train_loss": -12.543573379516602, "global_step": 464829, "epoch": 2766} {"train_loss": -12.46181869506836, "global_step": 464830, "epoch": 2766} {"train_loss": -11.776740074157715, "global_step": 464831, "epoch": 2766} {"train_loss": -12.959972381591797, "global_step": 464832, "epoch": 2766} {"train_loss": -12.33198070526123, "global_step": 464833, "epoch": 2766} {"train_loss": -12.423081398010254, "global_step": 464834, "epoch": 2766} {"train_loss": -12.553714752197266, "global_step": 464835, "epoch": 2766} {"train_loss": -12.18441104888916, "global_step": 464836, "epoch": 2766} {"train_loss": -12.702856063842773, "global_step": 464837, "epoch": 2766} {"train_loss": -12.387422561645508, "global_step": 464838, "epoch": 2766} {"train_loss": -12.488753318786621, "global_step": 464839, "epoch": 2766} {"train_loss": -12.522392272949219, "global_step": 464840, "epoch": 2766} {"train_loss": -12.677845001220703, "global_step": 464841, "epoch": 2766} {"train_loss": -12.246864318847656, "global_step": 464842, "epoch": 2766} {"train_loss": -12.725653648376465, "global_step": 464843, "epoch": 2766} {"train_loss": -12.657976150512695, "global_step": 464844, "epoch": 2766} {"train_loss": -12.74063491821289, "global_step": 464845, "epoch": 2766} {"train_loss": -12.917662620544434, "global_step": 464846, "epoch": 2766} {"train_loss": -12.843738555908203, "global_step": 464847, "epoch": 2766} {"train_loss": -12.348281860351562, "global_step": 464848, "epoch": 2766} {"train_loss": -12.861459732055664, "global_step": 464849, "epoch": 2766} {"train_loss": -12.398195266723633, "global_step": 464850, "epoch": 2766} {"train_loss": -12.376592636108398, "global_step": 464851, "epoch": 2766} {"train_loss": -11.967569351196289, "global_step": 464852, "epoch": 2766} {"train_loss": -12.558507919311523, "global_step": 464853, "epoch": 2766} {"train_loss": -11.636491775512695, "global_step": 464854, "epoch": 2766} {"train_loss": -12.059489528338114, "global_step": 464855, "epoch": 2766, "val_loss": 315618.625} {"train_loss": -12.002799987792969, "global_step": 464856, "epoch": 2767} {"train_loss": -12.58198356628418, "global_step": 464857, "epoch": 2767} {"train_loss": -12.119980812072754, "global_step": 464858, "epoch": 2767} {"train_loss": -12.469016075134277, "global_step": 464859, "epoch": 2767} {"train_loss": -12.160152435302734, "global_step": 464860, "epoch": 2767} {"train_loss": -12.259208679199219, "global_step": 464861, "epoch": 2767} {"train_loss": -12.014537811279297, "global_step": 464862, "epoch": 2767} {"train_loss": -12.988523483276367, "global_step": 464863, "epoch": 2767} {"train_loss": -11.586437225341797, "global_step": 464864, "epoch": 2767} {"train_loss": -12.334985733032227, "global_step": 464865, "epoch": 2767} {"train_loss": -11.883234977722168, "global_step": 464866, "epoch": 2767} {"train_loss": -12.29132080078125, "global_step": 464867, "epoch": 2767} {"train_loss": -11.47764778137207, "global_step": 464868, "epoch": 2767} {"train_loss": -12.307229995727539, "global_step": 464869, "epoch": 2767} {"train_loss": -11.5115327835083, "global_step": 464870, "epoch": 2767} {"train_loss": -12.332427978515625, "global_step": 464871, "epoch": 2767} {"train_loss": -12.264963150024414, "global_step": 464872, "epoch": 2767} {"train_loss": -11.392974853515625, "global_step": 464873, "epoch": 2767} {"train_loss": -11.730612754821777, "global_step": 464874, "epoch": 2767} {"train_loss": -12.105927467346191, "global_step": 464875, "epoch": 2767} {"train_loss": -10.978255271911621, "global_step": 464876, "epoch": 2767} {"train_loss": -12.33067512512207, "global_step": 464877, "epoch": 2767} {"train_loss": -11.563263893127441, "global_step": 464878, "epoch": 2767} {"train_loss": -12.138805389404297, "global_step": 464879, "epoch": 2767} {"train_loss": -12.1119966506958, "global_step": 464880, "epoch": 2767} {"train_loss": -11.830057144165039, "global_step": 464881, "epoch": 2767} {"train_loss": -12.357391357421875, "global_step": 464882, "epoch": 2767} {"train_loss": -12.203901290893555, "global_step": 464883, "epoch": 2767} {"train_loss": -12.281907081604004, "global_step": 464884, "epoch": 2767} {"train_loss": -12.23817253112793, "global_step": 464885, "epoch": 2767} {"train_loss": -12.801974296569824, "global_step": 464886, "epoch": 2767} {"train_loss": -11.912145614624023, "global_step": 464887, "epoch": 2767} {"train_loss": -12.419880867004395, "global_step": 464888, "epoch": 2767} {"train_loss": -11.392560005187988, "global_step": 464889, "epoch": 2767} {"train_loss": -11.65969181060791, "global_step": 464890, "epoch": 2767} {"train_loss": -11.941974639892578, "global_step": 464891, "epoch": 2767} {"train_loss": -12.466009140014648, "global_step": 464892, "epoch": 2767} {"train_loss": -12.518537521362305, "global_step": 464893, "epoch": 2767} {"train_loss": -12.260675430297852, "global_step": 464894, "epoch": 2767} {"train_loss": -12.063715934753418, "global_step": 464895, "epoch": 2767} {"train_loss": -12.491039276123047, "global_step": 464896, "epoch": 2767} {"train_loss": -12.465880393981934, "global_step": 464897, "epoch": 2767} {"train_loss": -12.597131729125977, "global_step": 464898, "epoch": 2767} {"train_loss": -12.54959774017334, "global_step": 464899, "epoch": 2767} {"train_loss": -12.305038452148438, "global_step": 464900, "epoch": 2767} {"train_loss": -12.495621681213379, "global_step": 464901, "epoch": 2767} {"train_loss": -12.68122673034668, "global_step": 464902, "epoch": 2767} {"train_loss": -12.251609802246094, "global_step": 464903, "epoch": 2767} {"train_loss": -12.51967716217041, "global_step": 464904, "epoch": 2767} {"train_loss": -12.285642623901367, "global_step": 464905, "epoch": 2767} {"train_loss": -12.100529670715332, "global_step": 464906, "epoch": 2767} {"train_loss": -12.28083610534668, "global_step": 464907, "epoch": 2767} {"train_loss": -12.251861572265625, "global_step": 464908, "epoch": 2767} {"train_loss": -12.317995071411133, "global_step": 464909, "epoch": 2767} {"train_loss": -12.867121696472168, "global_step": 464910, "epoch": 2767} {"train_loss": -11.930996894836426, "global_step": 464911, "epoch": 2767} {"train_loss": -12.458858489990234, "global_step": 464912, "epoch": 2767} {"train_loss": -12.035807609558105, "global_step": 464913, "epoch": 2767} {"train_loss": -11.887626647949219, "global_step": 464914, "epoch": 2767} {"train_loss": -11.538381576538086, "global_step": 464915, "epoch": 2767} {"train_loss": -12.270208358764648, "global_step": 464916, "epoch": 2767} {"train_loss": -11.86945915222168, "global_step": 464917, "epoch": 2767} {"train_loss": -12.208100318908691, "global_step": 464918, "epoch": 2767} {"train_loss": -11.367498397827148, "global_step": 464919, "epoch": 2767} {"train_loss": -12.175803184509277, "global_step": 464920, "epoch": 2767} {"train_loss": -11.569910049438477, "global_step": 464921, "epoch": 2767} {"train_loss": -11.190727233886719, "global_step": 464922, "epoch": 2767} {"train_loss": -11.686059951782227, "global_step": 464923, "epoch": 2767} {"train_loss": -11.7821683883667, "global_step": 464924, "epoch": 2767} {"train_loss": -11.836662292480469, "global_step": 464925, "epoch": 2767} {"train_loss": -12.070322036743164, "global_step": 464926, "epoch": 2767} {"train_loss": -11.972259521484375, "global_step": 464927, "epoch": 2767} {"train_loss": -12.431097984313965, "global_step": 464928, "epoch": 2767} {"train_loss": -11.5181884765625, "global_step": 464929, "epoch": 2767} {"train_loss": -12.136656761169434, "global_step": 464930, "epoch": 2767} {"train_loss": -12.06765079498291, "global_step": 464931, "epoch": 2767} {"train_loss": -11.240690231323242, "global_step": 464932, "epoch": 2767} {"train_loss": -12.436769485473633, "global_step": 464933, "epoch": 2767} {"train_loss": -10.637927055358887, "global_step": 464934, "epoch": 2767} {"train_loss": -9.73691177368164, "global_step": 464935, "epoch": 2767} {"train_loss": -11.416452407836914, "global_step": 464936, "epoch": 2767} {"train_loss": -10.689040184020996, "global_step": 464937, "epoch": 2767} {"train_loss": -10.088441848754883, "global_step": 464938, "epoch": 2767} {"train_loss": -11.555621147155762, "global_step": 464939, "epoch": 2767} {"train_loss": -10.358233451843262, "global_step": 464940, "epoch": 2767} {"train_loss": -11.528075218200684, "global_step": 464941, "epoch": 2767} {"train_loss": -10.536611557006836, "global_step": 464942, "epoch": 2767} {"train_loss": -11.439388275146484, "global_step": 464943, "epoch": 2767} {"train_loss": -10.787370681762695, "global_step": 464944, "epoch": 2767} {"train_loss": -11.000980377197266, "global_step": 464945, "epoch": 2767} {"train_loss": -10.125720977783203, "global_step": 464946, "epoch": 2767} {"train_loss": -11.43642807006836, "global_step": 464947, "epoch": 2767} {"train_loss": -10.353744506835938, "global_step": 464948, "epoch": 2767} {"train_loss": -10.177560806274414, "global_step": 464949, "epoch": 2767} {"train_loss": -10.789554595947266, "global_step": 464950, "epoch": 2767} {"train_loss": -10.413017272949219, "global_step": 464951, "epoch": 2767} {"train_loss": -9.97459602355957, "global_step": 464952, "epoch": 2767} {"train_loss": -9.865203857421875, "global_step": 464953, "epoch": 2767} {"train_loss": -9.431692123413086, "global_step": 464954, "epoch": 2767} {"train_loss": -9.167268753051758, "global_step": 464955, "epoch": 2767} {"train_loss": -11.07143783569336, "global_step": 464956, "epoch": 2767} {"train_loss": -10.34298324584961, "global_step": 464957, "epoch": 2767} {"train_loss": -9.645516395568848, "global_step": 464958, "epoch": 2767} {"train_loss": -11.236278533935547, "global_step": 464959, "epoch": 2767} {"train_loss": -10.835896492004395, "global_step": 464960, "epoch": 2767} {"train_loss": -10.576862335205078, "global_step": 464961, "epoch": 2767} {"train_loss": -11.898811340332031, "global_step": 464962, "epoch": 2767} {"train_loss": -11.096664428710938, "global_step": 464963, "epoch": 2767} {"train_loss": -10.60872745513916, "global_step": 464964, "epoch": 2767} {"train_loss": -11.496737480163574, "global_step": 464965, "epoch": 2767} {"train_loss": -10.766555786132812, "global_step": 464966, "epoch": 2767} {"train_loss": -10.331775665283203, "global_step": 464967, "epoch": 2767} {"train_loss": -11.585365295410156, "global_step": 464968, "epoch": 2767} {"train_loss": -10.593392372131348, "global_step": 464969, "epoch": 2767} {"train_loss": -11.78770637512207, "global_step": 464970, "epoch": 2767} {"train_loss": -10.619599342346191, "global_step": 464971, "epoch": 2767} {"train_loss": -11.922372817993164, "global_step": 464972, "epoch": 2767} {"train_loss": -10.93954086303711, "global_step": 464973, "epoch": 2767} {"train_loss": -11.723091125488281, "global_step": 464974, "epoch": 2767} {"train_loss": -11.425973892211914, "global_step": 464975, "epoch": 2767} {"train_loss": -11.692014694213867, "global_step": 464976, "epoch": 2767} {"train_loss": -12.161161422729492, "global_step": 464977, "epoch": 2767} {"train_loss": -11.699634552001953, "global_step": 464978, "epoch": 2767} {"train_loss": -11.883506774902344, "global_step": 464979, "epoch": 2767} {"train_loss": -11.547733306884766, "global_step": 464980, "epoch": 2767} {"train_loss": -11.918197631835938, "global_step": 464981, "epoch": 2767} {"train_loss": -11.737030029296875, "global_step": 464982, "epoch": 2767} {"train_loss": -12.120718002319336, "global_step": 464983, "epoch": 2767} {"train_loss": -11.915334701538086, "global_step": 464984, "epoch": 2767} {"train_loss": -11.992500305175781, "global_step": 464985, "epoch": 2767} {"train_loss": -12.411690711975098, "global_step": 464986, "epoch": 2767} {"train_loss": -11.67702865600586, "global_step": 464987, "epoch": 2767} {"train_loss": -12.041593551635742, "global_step": 464988, "epoch": 2767} {"train_loss": -12.273460388183594, "global_step": 464989, "epoch": 2767} {"train_loss": -12.144587516784668, "global_step": 464990, "epoch": 2767} {"train_loss": -12.067205429077148, "global_step": 464991, "epoch": 2767} {"train_loss": -12.005826950073242, "global_step": 464992, "epoch": 2767} {"train_loss": -12.110956192016602, "global_step": 464993, "epoch": 2767} {"train_loss": -12.348737716674805, "global_step": 464994, "epoch": 2767} {"train_loss": -12.198488235473633, "global_step": 464995, "epoch": 2767} {"train_loss": -12.617986679077148, "global_step": 464996, "epoch": 2767} {"train_loss": -12.281238555908203, "global_step": 464997, "epoch": 2767} {"train_loss": -12.338150024414062, "global_step": 464998, "epoch": 2767} {"train_loss": -12.401391983032227, "global_step": 464999, "epoch": 2767} {"train_loss": -12.40284538269043, "global_step": 465000, "epoch": 2767} {"train_loss": -12.387648582458496, "global_step": 465001, "epoch": 2767} {"train_loss": -12.014154434204102, "global_step": 465002, "epoch": 2767} {"train_loss": -12.345100402832031, "global_step": 465003, "epoch": 2767} {"train_loss": -12.448629379272461, "global_step": 465004, "epoch": 2767} {"train_loss": -12.289115905761719, "global_step": 465005, "epoch": 2767} {"train_loss": -12.21122932434082, "global_step": 465006, "epoch": 2767} {"train_loss": -12.593438148498535, "global_step": 465007, "epoch": 2767} {"train_loss": -12.389013290405273, "global_step": 465008, "epoch": 2767} {"train_loss": -12.50489330291748, "global_step": 465009, "epoch": 2767} {"train_loss": -12.556817054748535, "global_step": 465010, "epoch": 2767} {"train_loss": -12.502115249633789, "global_step": 465011, "epoch": 2767} {"train_loss": -12.566566467285156, "global_step": 465012, "epoch": 2767} {"train_loss": -12.500020027160645, "global_step": 465013, "epoch": 2767} {"train_loss": -12.113960266113281, "global_step": 465014, "epoch": 2767} {"train_loss": -12.367114067077637, "global_step": 465015, "epoch": 2767} {"train_loss": -12.619266510009766, "global_step": 465016, "epoch": 2767} {"train_loss": -12.413039207458496, "global_step": 465017, "epoch": 2767} {"train_loss": -12.608190536499023, "global_step": 465018, "epoch": 2767} {"train_loss": -12.469823837280273, "global_step": 465019, "epoch": 2767} {"train_loss": -12.579151153564453, "global_step": 465020, "epoch": 2767} {"train_loss": -12.573654174804688, "global_step": 465021, "epoch": 2767} {"train_loss": -12.382075309753418, "global_step": 465022, "epoch": 2767} {"train_loss": -11.805714618592035, "global_step": 465023, "epoch": 2767, "val_loss": 312511.84375} {"train_loss": -12.447110176086426, "global_step": 465024, "epoch": 2768} {"train_loss": -12.633203506469727, "global_step": 465025, "epoch": 2768} {"train_loss": -12.631270408630371, "global_step": 465026, "epoch": 2768} {"train_loss": -12.724342346191406, "global_step": 465027, "epoch": 2768} {"train_loss": -12.666274070739746, "global_step": 465028, "epoch": 2768} {"train_loss": -12.586939811706543, "global_step": 465029, "epoch": 2768} {"train_loss": -12.237256050109863, "global_step": 465030, "epoch": 2768} {"train_loss": -12.522961616516113, "global_step": 465031, "epoch": 2768} {"train_loss": -12.778145790100098, "global_step": 465032, "epoch": 2768} {"train_loss": -12.718817710876465, "global_step": 465033, "epoch": 2768} {"train_loss": -12.606114387512207, "global_step": 465034, "epoch": 2768} {"train_loss": -12.474684715270996, "global_step": 465035, "epoch": 2768} {"train_loss": -12.131404876708984, "global_step": 465036, "epoch": 2768} {"train_loss": -12.654085159301758, "global_step": 465037, "epoch": 2768} {"train_loss": -12.421001434326172, "global_step": 465038, "epoch": 2768} {"train_loss": -12.505992889404297, "global_step": 465039, "epoch": 2768} {"train_loss": -12.689014434814453, "global_step": 465040, "epoch": 2768} {"train_loss": -12.719829559326172, "global_step": 465041, "epoch": 2768} {"train_loss": -12.68966293334961, "global_step": 465042, "epoch": 2768} {"train_loss": -12.71656608581543, "global_step": 465043, "epoch": 2768} {"train_loss": -12.581344604492188, "global_step": 465044, "epoch": 2768} {"train_loss": -12.597270965576172, "global_step": 465045, "epoch": 2768} {"train_loss": -12.707260131835938, "global_step": 465046, "epoch": 2768} {"train_loss": -12.553365707397461, "global_step": 465047, "epoch": 2768} {"train_loss": -12.493175506591797, "global_step": 465048, "epoch": 2768} {"train_loss": -12.57779312133789, "global_step": 465049, "epoch": 2768} {"train_loss": -12.811599731445312, "global_step": 465050, "epoch": 2768} {"train_loss": -12.642376899719238, "global_step": 465051, "epoch": 2768} {"train_loss": -12.9965238571167, "global_step": 465052, "epoch": 2768} {"train_loss": -12.700498580932617, "global_step": 465053, "epoch": 2768} {"train_loss": -12.768959045410156, "global_step": 465054, "epoch": 2768} {"train_loss": -12.722454071044922, "global_step": 465055, "epoch": 2768} {"train_loss": -12.747444152832031, "global_step": 465056, "epoch": 2768} {"train_loss": -12.495153427124023, "global_step": 465057, "epoch": 2768} {"train_loss": -12.671270370483398, "global_step": 465058, "epoch": 2768} {"train_loss": -12.71388053894043, "global_step": 465059, "epoch": 2768} {"train_loss": -12.84049129486084, "global_step": 465060, "epoch": 2768} {"train_loss": -12.779059410095215, "global_step": 465061, "epoch": 2768} {"train_loss": -12.853821754455566, "global_step": 465062, "epoch": 2768} {"train_loss": -12.782183647155762, "global_step": 465063, "epoch": 2768} {"train_loss": -12.655126571655273, "global_step": 465064, "epoch": 2768} {"train_loss": -12.94573974609375, "global_step": 465065, "epoch": 2768} {"train_loss": -12.840092658996582, "global_step": 465066, "epoch": 2768} {"train_loss": -12.89828872680664, "global_step": 465067, "epoch": 2768} {"train_loss": -12.799022674560547, "global_step": 465068, "epoch": 2768} {"train_loss": -12.649768829345703, "global_step": 465069, "epoch": 2768} {"train_loss": -12.92138671875, "global_step": 465070, "epoch": 2768} {"train_loss": -12.794561386108398, "global_step": 465071, "epoch": 2768} {"train_loss": -12.902364730834961, "global_step": 465072, "epoch": 2768} {"train_loss": -12.577194213867188, "global_step": 465073, "epoch": 2768} {"train_loss": -12.837413787841797, "global_step": 465074, "epoch": 2768} {"train_loss": -12.570387840270996, "global_step": 465075, "epoch": 2768} {"train_loss": -12.679666519165039, "global_step": 465076, "epoch": 2768} {"train_loss": -12.254674911499023, "global_step": 465077, "epoch": 2768} {"train_loss": -12.637042999267578, "global_step": 465078, "epoch": 2768} {"train_loss": -12.94137954711914, "global_step": 465079, "epoch": 2768} {"train_loss": -12.612568855285645, "global_step": 465080, "epoch": 2768} {"train_loss": -12.564537048339844, "global_step": 465081, "epoch": 2768} {"train_loss": -12.793655395507812, "global_step": 465082, "epoch": 2768} {"train_loss": -12.800775527954102, "global_step": 465083, "epoch": 2768} {"train_loss": -11.57274341583252, "global_step": 465084, "epoch": 2768} {"train_loss": -12.487369537353516, "global_step": 465085, "epoch": 2768} {"train_loss": -12.559042930603027, "global_step": 465086, "epoch": 2768} {"train_loss": -11.626462936401367, "global_step": 465087, "epoch": 2768} {"train_loss": -10.75307846069336, "global_step": 465088, "epoch": 2768} {"train_loss": -11.8068265914917, "global_step": 465089, "epoch": 2768} {"train_loss": -11.487886428833008, "global_step": 465090, "epoch": 2768} {"train_loss": -10.090620040893555, "global_step": 465091, "epoch": 2768} {"train_loss": -11.598384857177734, "global_step": 465092, "epoch": 2768} {"train_loss": -11.679500579833984, "global_step": 465093, "epoch": 2768} {"train_loss": -11.255121231079102, "global_step": 465094, "epoch": 2768} {"train_loss": -11.117234230041504, "global_step": 465095, "epoch": 2768} {"train_loss": -11.70217227935791, "global_step": 465096, "epoch": 2768} {"train_loss": -10.675118446350098, "global_step": 465097, "epoch": 2768} {"train_loss": -11.963196754455566, "global_step": 465098, "epoch": 2768} {"train_loss": -11.422867774963379, "global_step": 465099, "epoch": 2768} {"train_loss": -11.542089462280273, "global_step": 465100, "epoch": 2768} {"train_loss": -11.654224395751953, "global_step": 465101, "epoch": 2768} {"train_loss": -12.096321105957031, "global_step": 465102, "epoch": 2768} {"train_loss": -11.814698219299316, "global_step": 465103, "epoch": 2768} {"train_loss": -11.762296676635742, "global_step": 465104, "epoch": 2768} {"train_loss": -10.955554962158203, "global_step": 465105, "epoch": 2768} {"train_loss": -11.775463104248047, "global_step": 465106, "epoch": 2768} {"train_loss": -11.07154655456543, "global_step": 465107, "epoch": 2768} {"train_loss": -11.668741226196289, "global_step": 465108, "epoch": 2768} {"train_loss": -11.257378578186035, "global_step": 465109, "epoch": 2768} {"train_loss": -11.385970115661621, "global_step": 465110, "epoch": 2768} {"train_loss": -10.041120529174805, "global_step": 465111, "epoch": 2768} {"train_loss": -11.025796890258789, "global_step": 465112, "epoch": 2768} {"train_loss": -12.07819652557373, "global_step": 465113, "epoch": 2768} {"train_loss": -11.345863342285156, "global_step": 465114, "epoch": 2768} {"train_loss": -10.515838623046875, "global_step": 465115, "epoch": 2768} {"train_loss": -11.568975448608398, "global_step": 465116, "epoch": 2768} {"train_loss": -10.464672088623047, "global_step": 465117, "epoch": 2768} {"train_loss": -11.73222541809082, "global_step": 465118, "epoch": 2768} {"train_loss": -11.216089248657227, "global_step": 465119, "epoch": 2768} {"train_loss": -10.216995239257812, "global_step": 465120, "epoch": 2768} {"train_loss": -11.885051727294922, "global_step": 465121, "epoch": 2768} {"train_loss": -10.197253227233887, "global_step": 465122, "epoch": 2768} {"train_loss": -11.112495422363281, "global_step": 465123, "epoch": 2768} {"train_loss": -10.784405708312988, "global_step": 465124, "epoch": 2768} {"train_loss": -11.188830375671387, "global_step": 465125, "epoch": 2768} {"train_loss": -10.264945983886719, "global_step": 465126, "epoch": 2768} {"train_loss": -11.207230567932129, "global_step": 465127, "epoch": 2768} {"train_loss": -11.221109390258789, "global_step": 465128, "epoch": 2768} {"train_loss": -11.764913558959961, "global_step": 465129, "epoch": 2768} {"train_loss": -11.359023094177246, "global_step": 465130, "epoch": 2768} {"train_loss": -11.56606674194336, "global_step": 465131, "epoch": 2768} {"train_loss": -11.59639835357666, "global_step": 465132, "epoch": 2768} {"train_loss": -11.500090599060059, "global_step": 465133, "epoch": 2768} {"train_loss": -10.363199234008789, "global_step": 465134, "epoch": 2768} {"train_loss": -11.911553382873535, "global_step": 465135, "epoch": 2768} {"train_loss": -11.060846328735352, "global_step": 465136, "epoch": 2768} {"train_loss": -11.388116836547852, "global_step": 465137, "epoch": 2768} {"train_loss": -12.149593353271484, "global_step": 465138, "epoch": 2768} {"train_loss": -10.786869049072266, "global_step": 465139, "epoch": 2768} {"train_loss": -12.314335823059082, "global_step": 465140, "epoch": 2768} {"train_loss": -11.47161865234375, "global_step": 465141, "epoch": 2768} {"train_loss": -12.058698654174805, "global_step": 465142, "epoch": 2768} {"train_loss": -11.586894989013672, "global_step": 465143, "epoch": 2768} {"train_loss": -11.662412643432617, "global_step": 465144, "epoch": 2768} {"train_loss": -11.949712753295898, "global_step": 465145, "epoch": 2768} {"train_loss": -11.996322631835938, "global_step": 465146, "epoch": 2768} {"train_loss": -12.334855079650879, "global_step": 465147, "epoch": 2768} {"train_loss": -12.020683288574219, "global_step": 465148, "epoch": 2768} {"train_loss": -12.1870698928833, "global_step": 465149, "epoch": 2768} {"train_loss": -11.92594051361084, "global_step": 465150, "epoch": 2768} {"train_loss": -12.411154747009277, "global_step": 465151, "epoch": 2768} {"train_loss": -12.260286331176758, "global_step": 465152, "epoch": 2768} {"train_loss": -12.329278945922852, "global_step": 465153, "epoch": 2768} {"train_loss": -12.167289733886719, "global_step": 465154, "epoch": 2768} {"train_loss": -12.506404876708984, "global_step": 465155, "epoch": 2768} {"train_loss": -12.408370971679688, "global_step": 465156, "epoch": 2768} {"train_loss": -12.26903247833252, "global_step": 465157, "epoch": 2768} {"train_loss": -12.353456497192383, "global_step": 465158, "epoch": 2768} {"train_loss": -12.202186584472656, "global_step": 465159, "epoch": 2768} {"train_loss": -12.312986373901367, "global_step": 465160, "epoch": 2768} {"train_loss": -12.098919868469238, "global_step": 465161, "epoch": 2768} {"train_loss": -12.497777938842773, "global_step": 465162, "epoch": 2768} {"train_loss": -12.349629402160645, "global_step": 465163, "epoch": 2768} {"train_loss": -12.113147735595703, "global_step": 465164, "epoch": 2768} {"train_loss": -12.505060195922852, "global_step": 465165, "epoch": 2768} {"train_loss": -12.039934158325195, "global_step": 465166, "epoch": 2768} {"train_loss": -12.313688278198242, "global_step": 465167, "epoch": 2768} {"train_loss": -12.302872657775879, "global_step": 465168, "epoch": 2768} {"train_loss": -12.26041030883789, "global_step": 465169, "epoch": 2768} {"train_loss": -12.368642807006836, "global_step": 465170, "epoch": 2768} {"train_loss": -12.143878936767578, "global_step": 465171, "epoch": 2768} {"train_loss": -12.156362533569336, "global_step": 465172, "epoch": 2768} {"train_loss": -12.1088285446167, "global_step": 465173, "epoch": 2768} {"train_loss": -12.107382774353027, "global_step": 465174, "epoch": 2768} {"train_loss": -12.473920822143555, "global_step": 465175, "epoch": 2768} {"train_loss": -12.315624237060547, "global_step": 465176, "epoch": 2768} {"train_loss": -12.087930679321289, "global_step": 465177, "epoch": 2768} {"train_loss": -12.207962036132812, "global_step": 465178, "epoch": 2768} {"train_loss": -12.244100570678711, "global_step": 465179, "epoch": 2768} {"train_loss": -11.728482246398926, "global_step": 465180, "epoch": 2768} {"train_loss": -12.32219123840332, "global_step": 465181, "epoch": 2768} {"train_loss": -11.396350860595703, "global_step": 465182, "epoch": 2768} {"train_loss": -12.117244720458984, "global_step": 465183, "epoch": 2768} {"train_loss": -12.208566665649414, "global_step": 465184, "epoch": 2768} {"train_loss": -12.281465530395508, "global_step": 465185, "epoch": 2768} {"train_loss": -12.236978530883789, "global_step": 465186, "epoch": 2768} {"train_loss": -12.3369140625, "global_step": 465187, "epoch": 2768} {"train_loss": -12.340819358825684, "global_step": 465188, "epoch": 2768} {"train_loss": -12.520508766174316, "global_step": 465189, "epoch": 2768} {"train_loss": -12.575030326843262, "global_step": 465190, "epoch": 2768} {"train_loss": -12.07129388763791, "global_step": 465191, "epoch": 2768, "val_loss": 317682.78125} {"train_loss": -12.459921836853027, "global_step": 465192, "epoch": 2769} {"train_loss": -12.193368911743164, "global_step": 465193, "epoch": 2769} {"train_loss": -12.499151229858398, "global_step": 465194, "epoch": 2769} {"train_loss": -12.296257019042969, "global_step": 465195, "epoch": 2769} {"train_loss": -12.224563598632812, "global_step": 465196, "epoch": 2769} {"train_loss": -12.61573600769043, "global_step": 465197, "epoch": 2769} {"train_loss": -12.507341384887695, "global_step": 465198, "epoch": 2769} {"train_loss": -12.592536926269531, "global_step": 465199, "epoch": 2769} {"train_loss": -12.621175765991211, "global_step": 465200, "epoch": 2769} {"train_loss": -12.70567798614502, "global_step": 465201, "epoch": 2769} {"train_loss": -12.723026275634766, "global_step": 465202, "epoch": 2769} {"train_loss": -12.562540054321289, "global_step": 465203, "epoch": 2769} {"train_loss": -12.64102840423584, "global_step": 465204, "epoch": 2769} {"train_loss": -12.414114952087402, "global_step": 465205, "epoch": 2769} {"train_loss": -12.638452529907227, "global_step": 465206, "epoch": 2769} {"train_loss": -12.662306785583496, "global_step": 465207, "epoch": 2769} {"train_loss": -12.675069808959961, "global_step": 465208, "epoch": 2769} {"train_loss": -12.619842529296875, "global_step": 465209, "epoch": 2769} {"train_loss": -12.62409496307373, "global_step": 465210, "epoch": 2769} {"train_loss": -12.700214385986328, "global_step": 465211, "epoch": 2769} {"train_loss": -12.941495895385742, "global_step": 465212, "epoch": 2769} {"train_loss": -12.510566711425781, "global_step": 465213, "epoch": 2769} {"train_loss": -12.788532257080078, "global_step": 465214, "epoch": 2769} {"train_loss": -12.820064544677734, "global_step": 465215, "epoch": 2769} {"train_loss": -12.834911346435547, "global_step": 465216, "epoch": 2769} {"train_loss": -12.727580070495605, "global_step": 465217, "epoch": 2769} {"train_loss": -12.606355667114258, "global_step": 465218, "epoch": 2769} {"train_loss": -12.759195327758789, "global_step": 465219, "epoch": 2769} {"train_loss": -12.735549926757812, "global_step": 465220, "epoch": 2769} {"train_loss": -12.793119430541992, "global_step": 465221, "epoch": 2769} {"train_loss": -12.917482376098633, "global_step": 465222, "epoch": 2769} {"train_loss": -12.695145606994629, "global_step": 465223, "epoch": 2769} {"train_loss": -12.886467933654785, "global_step": 465224, "epoch": 2769} {"train_loss": -12.658134460449219, "global_step": 465225, "epoch": 2769} {"train_loss": -12.532888412475586, "global_step": 465226, "epoch": 2769} {"train_loss": -12.708579063415527, "global_step": 465227, "epoch": 2769} {"train_loss": -12.560585021972656, "global_step": 465228, "epoch": 2769} {"train_loss": -12.874753952026367, "global_step": 465229, "epoch": 2769} {"train_loss": -12.791206359863281, "global_step": 465230, "epoch": 2769} {"train_loss": -12.095869064331055, "global_step": 465231, "epoch": 2769} {"train_loss": -12.19723129272461, "global_step": 465232, "epoch": 2769} {"train_loss": -12.24724006652832, "global_step": 465233, "epoch": 2769} {"train_loss": -11.102291107177734, "global_step": 465234, "epoch": 2769} {"train_loss": -12.564681053161621, "global_step": 465235, "epoch": 2769} {"train_loss": -11.709188461303711, "global_step": 465236, "epoch": 2769} {"train_loss": -12.060802459716797, "global_step": 465237, "epoch": 2769} {"train_loss": -12.274173736572266, "global_step": 465238, "epoch": 2769} {"train_loss": -11.152629852294922, "global_step": 465239, "epoch": 2769} {"train_loss": -11.75222110748291, "global_step": 465240, "epoch": 2769} {"train_loss": -11.946501731872559, "global_step": 465241, "epoch": 2769} {"train_loss": -10.91640567779541, "global_step": 465242, "epoch": 2769} {"train_loss": -12.168956756591797, "global_step": 465243, "epoch": 2769} {"train_loss": -10.863344192504883, "global_step": 465244, "epoch": 2769} {"train_loss": -11.902083396911621, "global_step": 465245, "epoch": 2769} {"train_loss": -12.487678527832031, "global_step": 465246, "epoch": 2769} {"train_loss": -11.263580322265625, "global_step": 465247, "epoch": 2769} {"train_loss": -12.275630950927734, "global_step": 465248, "epoch": 2769} {"train_loss": -12.604206085205078, "global_step": 465249, "epoch": 2769} {"train_loss": -11.139336585998535, "global_step": 465250, "epoch": 2769} {"train_loss": -12.603102684020996, "global_step": 465251, "epoch": 2769} {"train_loss": -11.528645515441895, "global_step": 465252, "epoch": 2769} {"train_loss": -12.330499649047852, "global_step": 465253, "epoch": 2769} {"train_loss": -12.546096801757812, "global_step": 465254, "epoch": 2769} {"train_loss": -12.234567642211914, "global_step": 465255, "epoch": 2769} {"train_loss": -12.619114875793457, "global_step": 465256, "epoch": 2769} {"train_loss": -12.259729385375977, "global_step": 465257, "epoch": 2769} {"train_loss": -12.166019439697266, "global_step": 465258, "epoch": 2769} {"train_loss": -12.574701309204102, "global_step": 465259, "epoch": 2769} {"train_loss": -12.388420104980469, "global_step": 465260, "epoch": 2769} {"train_loss": -12.231205940246582, "global_step": 465261, "epoch": 2769} {"train_loss": -12.415449142456055, "global_step": 465262, "epoch": 2769} {"train_loss": -12.817219734191895, "global_step": 465263, "epoch": 2769} {"train_loss": -12.239810943603516, "global_step": 465264, "epoch": 2769} {"train_loss": -12.52930736541748, "global_step": 465265, "epoch": 2769} {"train_loss": -12.667669296264648, "global_step": 465266, "epoch": 2769} {"train_loss": -12.296157836914062, "global_step": 465267, "epoch": 2769} {"train_loss": -12.638500213623047, "global_step": 465268, "epoch": 2769} {"train_loss": -12.305797576904297, "global_step": 465269, "epoch": 2769} {"train_loss": -12.275768280029297, "global_step": 465270, "epoch": 2769} {"train_loss": -12.473396301269531, "global_step": 465271, "epoch": 2769} {"train_loss": -11.975125312805176, "global_step": 465272, "epoch": 2769} {"train_loss": -12.048051834106445, "global_step": 465273, "epoch": 2769} {"train_loss": -12.729880332946777, "global_step": 465274, "epoch": 2769} {"train_loss": -12.083086967468262, "global_step": 465275, "epoch": 2769} {"train_loss": -12.059637069702148, "global_step": 465276, "epoch": 2769} {"train_loss": -12.656993865966797, "global_step": 465277, "epoch": 2769} {"train_loss": -12.187549591064453, "global_step": 465278, "epoch": 2769} {"train_loss": -12.395306587219238, "global_step": 465279, "epoch": 2769} {"train_loss": -12.322394371032715, "global_step": 465280, "epoch": 2769} {"train_loss": -11.71466064453125, "global_step": 465281, "epoch": 2769} {"train_loss": -12.142267227172852, "global_step": 465282, "epoch": 2769} {"train_loss": -12.619730949401855, "global_step": 465283, "epoch": 2769} {"train_loss": -11.831085205078125, "global_step": 465284, "epoch": 2769} {"train_loss": -12.481828689575195, "global_step": 465285, "epoch": 2769} {"train_loss": -12.628951072692871, "global_step": 465286, "epoch": 2769} {"train_loss": -12.237229347229004, "global_step": 465287, "epoch": 2769} {"train_loss": -12.631695747375488, "global_step": 465288, "epoch": 2769} {"train_loss": -12.684198379516602, "global_step": 465289, "epoch": 2769} {"train_loss": -11.8914213180542, "global_step": 465290, "epoch": 2769} {"train_loss": -12.508796691894531, "global_step": 465291, "epoch": 2769} {"train_loss": -12.474727630615234, "global_step": 465292, "epoch": 2769} {"train_loss": -11.829702377319336, "global_step": 465293, "epoch": 2769} {"train_loss": -11.958978652954102, "global_step": 465294, "epoch": 2769} {"train_loss": -12.66690444946289, "global_step": 465295, "epoch": 2769} {"train_loss": -12.568742752075195, "global_step": 465296, "epoch": 2769} {"train_loss": -12.298418045043945, "global_step": 465297, "epoch": 2769} {"train_loss": -12.440908432006836, "global_step": 465298, "epoch": 2769} {"train_loss": -12.420637130737305, "global_step": 465299, "epoch": 2769} {"train_loss": -12.893045425415039, "global_step": 465300, "epoch": 2769} {"train_loss": -12.228724479675293, "global_step": 465301, "epoch": 2769} {"train_loss": -12.756625175476074, "global_step": 465302, "epoch": 2769} {"train_loss": -12.6904935836792, "global_step": 465303, "epoch": 2769} {"train_loss": -12.586156845092773, "global_step": 465304, "epoch": 2769} {"train_loss": -12.655563354492188, "global_step": 465305, "epoch": 2769} {"train_loss": -12.836872100830078, "global_step": 465306, "epoch": 2769} {"train_loss": -12.668373107910156, "global_step": 465307, "epoch": 2769} {"train_loss": -12.939634323120117, "global_step": 465308, "epoch": 2769} {"train_loss": -12.69542407989502, "global_step": 465309, "epoch": 2769} {"train_loss": -12.583328247070312, "global_step": 465310, "epoch": 2769} {"train_loss": -12.818748474121094, "global_step": 465311, "epoch": 2769} {"train_loss": -12.792974472045898, "global_step": 465312, "epoch": 2769} {"train_loss": -12.664773941040039, "global_step": 465313, "epoch": 2769} {"train_loss": -12.634586334228516, "global_step": 465314, "epoch": 2769} {"train_loss": -12.88797664642334, "global_step": 465315, "epoch": 2769} {"train_loss": -12.76772689819336, "global_step": 465316, "epoch": 2769} {"train_loss": -12.460655212402344, "global_step": 465317, "epoch": 2769} {"train_loss": -12.967729568481445, "global_step": 465318, "epoch": 2769} {"train_loss": -12.577348709106445, "global_step": 465319, "epoch": 2769} {"train_loss": -12.740385055541992, "global_step": 465320, "epoch": 2769} {"train_loss": -12.735955238342285, "global_step": 465321, "epoch": 2769} {"train_loss": -12.616170883178711, "global_step": 465322, "epoch": 2769} {"train_loss": -12.192838668823242, "global_step": 465323, "epoch": 2769} {"train_loss": -12.905207633972168, "global_step": 465324, "epoch": 2769} {"train_loss": -12.402910232543945, "global_step": 465325, "epoch": 2769} {"train_loss": -12.057844161987305, "global_step": 465326, "epoch": 2769} {"train_loss": -12.250102996826172, "global_step": 465327, "epoch": 2769} {"train_loss": -12.029003143310547, "global_step": 465328, "epoch": 2769} {"train_loss": -11.594231605529785, "global_step": 465329, "epoch": 2769} {"train_loss": -13.03841781616211, "global_step": 465330, "epoch": 2769} {"train_loss": -11.807705879211426, "global_step": 465331, "epoch": 2769} {"train_loss": -12.5306396484375, "global_step": 465332, "epoch": 2769} {"train_loss": -11.678581237792969, "global_step": 465333, "epoch": 2769} {"train_loss": -12.101962089538574, "global_step": 465334, "epoch": 2769} {"train_loss": -11.85069465637207, "global_step": 465335, "epoch": 2769} {"train_loss": -12.05567741394043, "global_step": 465336, "epoch": 2769} {"train_loss": -11.563976287841797, "global_step": 465337, "epoch": 2769} {"train_loss": -11.863114356994629, "global_step": 465338, "epoch": 2769} {"train_loss": -11.656661987304688, "global_step": 465339, "epoch": 2769} {"train_loss": -11.688228607177734, "global_step": 465340, "epoch": 2769} {"train_loss": -12.326166152954102, "global_step": 465341, "epoch": 2769} {"train_loss": -11.717394828796387, "global_step": 465342, "epoch": 2769} {"train_loss": -12.527559280395508, "global_step": 465343, "epoch": 2769} {"train_loss": -12.113876342773438, "global_step": 465344, "epoch": 2769} {"train_loss": -12.672365188598633, "global_step": 465345, "epoch": 2769} {"train_loss": -12.580081939697266, "global_step": 465346, "epoch": 2769} {"train_loss": -12.690500259399414, "global_step": 465347, "epoch": 2769} {"train_loss": -12.472965240478516, "global_step": 465348, "epoch": 2769} {"train_loss": -12.25654411315918, "global_step": 465349, "epoch": 2769} {"train_loss": -12.214434623718262, "global_step": 465350, "epoch": 2769} {"train_loss": -12.005989074707031, "global_step": 465351, "epoch": 2769} {"train_loss": -12.373713493347168, "global_step": 465352, "epoch": 2769} {"train_loss": -11.667215347290039, "global_step": 465353, "epoch": 2769} {"train_loss": -12.122276306152344, "global_step": 465354, "epoch": 2769} {"train_loss": -11.740875244140625, "global_step": 465355, "epoch": 2769} {"train_loss": -12.497566223144531, "global_step": 465356, "epoch": 2769} {"train_loss": -11.592958450317383, "global_step": 465357, "epoch": 2769} {"train_loss": -12.544901847839355, "global_step": 465358, "epoch": 2769} {"train_loss": -12.35484272525424, "global_step": 465359, "epoch": 2769, "val_loss": 314365.1875} {"train_loss": -12.314101219177246, "global_step": 465360, "epoch": 2770} {"train_loss": -11.684240341186523, "global_step": 465361, "epoch": 2770} {"train_loss": -12.438411712646484, "global_step": 465362, "epoch": 2770} {"train_loss": -12.346992492675781, "global_step": 465363, "epoch": 2770} {"train_loss": -12.253393173217773, "global_step": 465364, "epoch": 2770} {"train_loss": -12.139866828918457, "global_step": 465365, "epoch": 2770} {"train_loss": -12.151251792907715, "global_step": 465366, "epoch": 2770} {"train_loss": -12.658721923828125, "global_step": 465367, "epoch": 2770} {"train_loss": -11.91300106048584, "global_step": 465368, "epoch": 2770} {"train_loss": -12.204338073730469, "global_step": 465369, "epoch": 2770} {"train_loss": -12.549474716186523, "global_step": 465370, "epoch": 2770} {"train_loss": -12.241283416748047, "global_step": 465371, "epoch": 2770} {"train_loss": -12.365785598754883, "global_step": 465372, "epoch": 2770} {"train_loss": -12.366929054260254, "global_step": 465373, "epoch": 2770} {"train_loss": -12.594789505004883, "global_step": 465374, "epoch": 2770} {"train_loss": -12.348970413208008, "global_step": 465375, "epoch": 2770} {"train_loss": -12.545495986938477, "global_step": 465376, "epoch": 2770} {"train_loss": -12.317975997924805, "global_step": 465377, "epoch": 2770} {"train_loss": -12.92183780670166, "global_step": 465378, "epoch": 2770} {"train_loss": -12.237480163574219, "global_step": 465379, "epoch": 2770} {"train_loss": -12.398983001708984, "global_step": 465380, "epoch": 2770} {"train_loss": -11.736824035644531, "global_step": 465381, "epoch": 2770} {"train_loss": -12.40987491607666, "global_step": 465382, "epoch": 2770} {"train_loss": -11.931913375854492, "global_step": 465383, "epoch": 2770} {"train_loss": -12.450693130493164, "global_step": 465384, "epoch": 2770} {"train_loss": -11.863519668579102, "global_step": 465385, "epoch": 2770} {"train_loss": -12.010239601135254, "global_step": 465386, "epoch": 2770} {"train_loss": -12.446935653686523, "global_step": 465387, "epoch": 2770} {"train_loss": -11.401144981384277, "global_step": 465388, "epoch": 2770} {"train_loss": -12.401872634887695, "global_step": 465389, "epoch": 2770} {"train_loss": -12.45305061340332, "global_step": 465390, "epoch": 2770} {"train_loss": -12.47507095336914, "global_step": 465391, "epoch": 2770} {"train_loss": -12.385635375976562, "global_step": 465392, "epoch": 2770} {"train_loss": -12.310995101928711, "global_step": 465393, "epoch": 2770} {"train_loss": -12.223251342773438, "global_step": 465394, "epoch": 2770} {"train_loss": -12.427892684936523, "global_step": 465395, "epoch": 2770} {"train_loss": -12.383932113647461, "global_step": 465396, "epoch": 2770} {"train_loss": -12.340396881103516, "global_step": 465397, "epoch": 2770} {"train_loss": -12.397037506103516, "global_step": 465398, "epoch": 2770} {"train_loss": -12.214866638183594, "global_step": 465399, "epoch": 2770} {"train_loss": -12.476001739501953, "global_step": 465400, "epoch": 2770} {"train_loss": -12.124848365783691, "global_step": 465401, "epoch": 2770} {"train_loss": -12.427252769470215, "global_step": 465402, "epoch": 2770} {"train_loss": -11.5825777053833, "global_step": 465403, "epoch": 2770} {"train_loss": -12.610828399658203, "global_step": 465404, "epoch": 2770} {"train_loss": -12.393196105957031, "global_step": 465405, "epoch": 2770} {"train_loss": -11.842750549316406, "global_step": 465406, "epoch": 2770} {"train_loss": -12.329225540161133, "global_step": 465407, "epoch": 2770} {"train_loss": -12.403066635131836, "global_step": 465408, "epoch": 2770} {"train_loss": -12.474587440490723, "global_step": 465409, "epoch": 2770} {"train_loss": -12.132530212402344, "global_step": 465410, "epoch": 2770} {"train_loss": -12.778253555297852, "global_step": 465411, "epoch": 2770} {"train_loss": -12.57241439819336, "global_step": 465412, "epoch": 2770} {"train_loss": -12.560781478881836, "global_step": 465413, "epoch": 2770} {"train_loss": -12.018312454223633, "global_step": 465414, "epoch": 2770} {"train_loss": -11.687934875488281, "global_step": 465415, "epoch": 2770} {"train_loss": -11.143281936645508, "global_step": 465416, "epoch": 2770} {"train_loss": -11.876015663146973, "global_step": 465417, "epoch": 2770} {"train_loss": -12.549142837524414, "global_step": 465418, "epoch": 2770} {"train_loss": -12.263995170593262, "global_step": 465419, "epoch": 2770} {"train_loss": -12.771044731140137, "global_step": 465420, "epoch": 2770} {"train_loss": -12.192556381225586, "global_step": 465421, "epoch": 2770} {"train_loss": -12.723403930664062, "global_step": 465422, "epoch": 2770} {"train_loss": -12.574222564697266, "global_step": 465423, "epoch": 2770} {"train_loss": -12.57773208618164, "global_step": 465424, "epoch": 2770} {"train_loss": -12.45341682434082, "global_step": 465425, "epoch": 2770} {"train_loss": -12.875293731689453, "global_step": 465426, "epoch": 2770} {"train_loss": -12.605452537536621, "global_step": 465427, "epoch": 2770} {"train_loss": -12.774876594543457, "global_step": 465428, "epoch": 2770} {"train_loss": -12.762670516967773, "global_step": 465429, "epoch": 2770} {"train_loss": -12.558591842651367, "global_step": 465430, "epoch": 2770} {"train_loss": -12.872824668884277, "global_step": 465431, "epoch": 2770} {"train_loss": -12.663408279418945, "global_step": 465432, "epoch": 2770} {"train_loss": -12.732610702514648, "global_step": 465433, "epoch": 2770} {"train_loss": -13.024184226989746, "global_step": 465434, "epoch": 2770} {"train_loss": -12.63962173461914, "global_step": 465435, "epoch": 2770} {"train_loss": -12.643451690673828, "global_step": 465436, "epoch": 2770} {"train_loss": -12.644865989685059, "global_step": 465437, "epoch": 2770} {"train_loss": -12.283135414123535, "global_step": 465438, "epoch": 2770} {"train_loss": -12.116785049438477, "global_step": 465439, "epoch": 2770} {"train_loss": -12.747770309448242, "global_step": 465440, "epoch": 2770} {"train_loss": -12.47481632232666, "global_step": 465441, "epoch": 2770} {"train_loss": -12.125768661499023, "global_step": 465442, "epoch": 2770} {"train_loss": -11.809944152832031, "global_step": 465443, "epoch": 2770} {"train_loss": -12.508868217468262, "global_step": 465444, "epoch": 2770} {"train_loss": -12.4246826171875, "global_step": 465445, "epoch": 2770} {"train_loss": -11.856651306152344, "global_step": 465446, "epoch": 2770} {"train_loss": -11.726715087890625, "global_step": 465447, "epoch": 2770} {"train_loss": -12.730992317199707, "global_step": 465448, "epoch": 2770} {"train_loss": -12.105003356933594, "global_step": 465449, "epoch": 2770} {"train_loss": -11.941831588745117, "global_step": 465450, "epoch": 2770} {"train_loss": -11.851873397827148, "global_step": 465451, "epoch": 2770} {"train_loss": -12.890070915222168, "global_step": 465452, "epoch": 2770} {"train_loss": -11.92675495147705, "global_step": 465453, "epoch": 2770} {"train_loss": -12.209284782409668, "global_step": 465454, "epoch": 2770} {"train_loss": -12.376649856567383, "global_step": 465455, "epoch": 2770} {"train_loss": -12.451957702636719, "global_step": 465456, "epoch": 2770} {"train_loss": -12.165045738220215, "global_step": 465457, "epoch": 2770} {"train_loss": -12.392016410827637, "global_step": 465458, "epoch": 2770} {"train_loss": -12.552362442016602, "global_step": 465459, "epoch": 2770} {"train_loss": -11.830093383789062, "global_step": 465460, "epoch": 2770} {"train_loss": -12.268379211425781, "global_step": 465461, "epoch": 2770} {"train_loss": -12.265122413635254, "global_step": 465462, "epoch": 2770} {"train_loss": -11.992597579956055, "global_step": 465463, "epoch": 2770} {"train_loss": -11.931852340698242, "global_step": 465464, "epoch": 2770} {"train_loss": -12.392844200134277, "global_step": 465465, "epoch": 2770} {"train_loss": -12.334933280944824, "global_step": 465466, "epoch": 2770} {"train_loss": -12.567558288574219, "global_step": 465467, "epoch": 2770} {"train_loss": -12.380447387695312, "global_step": 465468, "epoch": 2770} {"train_loss": -12.461677551269531, "global_step": 465469, "epoch": 2770} {"train_loss": -11.64262580871582, "global_step": 465470, "epoch": 2770} {"train_loss": -11.3571195602417, "global_step": 465471, "epoch": 2770} {"train_loss": -12.402445793151855, "global_step": 465472, "epoch": 2770} {"train_loss": -11.45753288269043, "global_step": 465473, "epoch": 2770} {"train_loss": -11.002424240112305, "global_step": 465474, "epoch": 2770} {"train_loss": -11.77292251586914, "global_step": 465475, "epoch": 2770} {"train_loss": -11.136697769165039, "global_step": 465476, "epoch": 2770} {"train_loss": -11.942782402038574, "global_step": 465477, "epoch": 2770} {"train_loss": -11.748617172241211, "global_step": 465478, "epoch": 2770} {"train_loss": -12.25123119354248, "global_step": 465479, "epoch": 2770} {"train_loss": -11.823118209838867, "global_step": 465480, "epoch": 2770} {"train_loss": -12.320684432983398, "global_step": 465481, "epoch": 2770} {"train_loss": -11.516315460205078, "global_step": 465482, "epoch": 2770} {"train_loss": -12.022685050964355, "global_step": 465483, "epoch": 2770} {"train_loss": -10.888171195983887, "global_step": 465484, "epoch": 2770} {"train_loss": -11.629777908325195, "global_step": 465485, "epoch": 2770} {"train_loss": -11.759870529174805, "global_step": 465486, "epoch": 2770} {"train_loss": -12.047136306762695, "global_step": 465487, "epoch": 2770} {"train_loss": -12.122451782226562, "global_step": 465488, "epoch": 2770} {"train_loss": -12.212722778320312, "global_step": 465489, "epoch": 2770} {"train_loss": -12.174946784973145, "global_step": 465490, "epoch": 2770} {"train_loss": -12.074846267700195, "global_step": 465491, "epoch": 2770} {"train_loss": -11.770078659057617, "global_step": 465492, "epoch": 2770} {"train_loss": -12.199186325073242, "global_step": 465493, "epoch": 2770} {"train_loss": -11.81280517578125, "global_step": 465494, "epoch": 2770} {"train_loss": -12.193368911743164, "global_step": 465495, "epoch": 2770} {"train_loss": -12.03459358215332, "global_step": 465496, "epoch": 2770} {"train_loss": -12.344884872436523, "global_step": 465497, "epoch": 2770} {"train_loss": -12.327336311340332, "global_step": 465498, "epoch": 2770} {"train_loss": -11.98930835723877, "global_step": 465499, "epoch": 2770} {"train_loss": -12.315483093261719, "global_step": 465500, "epoch": 2770} {"train_loss": -12.177142143249512, "global_step": 465501, "epoch": 2770} {"train_loss": -12.415521621704102, "global_step": 465502, "epoch": 2770} {"train_loss": -12.463640213012695, "global_step": 465503, "epoch": 2770} {"train_loss": -11.095443725585938, "global_step": 465504, "epoch": 2770} {"train_loss": -11.894474029541016, "global_step": 465505, "epoch": 2770} {"train_loss": -12.0620698928833, "global_step": 465506, "epoch": 2770} {"train_loss": -11.118494033813477, "global_step": 465507, "epoch": 2770} {"train_loss": -12.454595565795898, "global_step": 465508, "epoch": 2770} {"train_loss": -12.493791580200195, "global_step": 465509, "epoch": 2770} {"train_loss": -12.22688102722168, "global_step": 465510, "epoch": 2770} {"train_loss": -12.367645263671875, "global_step": 465511, "epoch": 2770} {"train_loss": -12.16341781616211, "global_step": 465512, "epoch": 2770} {"train_loss": -12.274255752563477, "global_step": 465513, "epoch": 2770} {"train_loss": -12.246885299682617, "global_step": 465514, "epoch": 2770} {"train_loss": -12.306988716125488, "global_step": 465515, "epoch": 2770} {"train_loss": -12.266718864440918, "global_step": 465516, "epoch": 2770} {"train_loss": -12.543228149414062, "global_step": 465517, "epoch": 2770} {"train_loss": -12.45000171661377, "global_step": 465518, "epoch": 2770} {"train_loss": -12.140935897827148, "global_step": 465519, "epoch": 2770} {"train_loss": -12.48948860168457, "global_step": 465520, "epoch": 2770} {"train_loss": -12.216768264770508, "global_step": 465521, "epoch": 2770} {"train_loss": -12.864752769470215, "global_step": 465522, "epoch": 2770} {"train_loss": -12.410493850708008, "global_step": 465523, "epoch": 2770} {"train_loss": -12.670969009399414, "global_step": 465524, "epoch": 2770} {"train_loss": -12.545848846435547, "global_step": 465525, "epoch": 2770} {"train_loss": -12.319374084472656, "global_step": 465526, "epoch": 2770} {"train_loss": -12.232825182733082, "global_step": 465527, "epoch": 2770, "val_loss": 316103.71875, "train_action_mse_error": 1.397538185119629} {"train_loss": -12.496131896972656, "global_step": 465528, "epoch": 2771} {"train_loss": -12.821836471557617, "global_step": 465529, "epoch": 2771} {"train_loss": -12.757059097290039, "global_step": 465530, "epoch": 2771} {"train_loss": -12.702085494995117, "global_step": 465531, "epoch": 2771} {"train_loss": -12.583041191101074, "global_step": 465532, "epoch": 2771} {"train_loss": -12.704357147216797, "global_step": 465533, "epoch": 2771} {"train_loss": -12.791305541992188, "global_step": 465534, "epoch": 2771} {"train_loss": -12.709589004516602, "global_step": 465535, "epoch": 2771} {"train_loss": -12.88494873046875, "global_step": 465536, "epoch": 2771} {"train_loss": -12.716211318969727, "global_step": 465537, "epoch": 2771} {"train_loss": -12.483718872070312, "global_step": 465538, "epoch": 2771} {"train_loss": -12.813339233398438, "global_step": 465539, "epoch": 2771} {"train_loss": -12.748414039611816, "global_step": 465540, "epoch": 2771} {"train_loss": -12.705221176147461, "global_step": 465541, "epoch": 2771} {"train_loss": -12.796738624572754, "global_step": 465542, "epoch": 2771} {"train_loss": -12.419339179992676, "global_step": 465543, "epoch": 2771} {"train_loss": -12.643600463867188, "global_step": 465544, "epoch": 2771} {"train_loss": -12.853986740112305, "global_step": 465545, "epoch": 2771} {"train_loss": -12.455068588256836, "global_step": 465546, "epoch": 2771} {"train_loss": -12.87647819519043, "global_step": 465547, "epoch": 2771} {"train_loss": -12.798833847045898, "global_step": 465548, "epoch": 2771} {"train_loss": -12.694958686828613, "global_step": 465549, "epoch": 2771} {"train_loss": -12.803309440612793, "global_step": 465550, "epoch": 2771} {"train_loss": -12.872774124145508, "global_step": 465551, "epoch": 2771} {"train_loss": -12.49454402923584, "global_step": 465552, "epoch": 2771} {"train_loss": -12.748102188110352, "global_step": 465553, "epoch": 2771} {"train_loss": -12.504316329956055, "global_step": 465554, "epoch": 2771} {"train_loss": -12.62928581237793, "global_step": 465555, "epoch": 2771} {"train_loss": -12.493441581726074, "global_step": 465556, "epoch": 2771} {"train_loss": -12.593145370483398, "global_step": 465557, "epoch": 2771} {"train_loss": -12.945363998413086, "global_step": 465558, "epoch": 2771} {"train_loss": -12.256753921508789, "global_step": 465559, "epoch": 2771} {"train_loss": -12.544036865234375, "global_step": 465560, "epoch": 2771} {"train_loss": -12.562296867370605, "global_step": 465561, "epoch": 2771} {"train_loss": -12.749892234802246, "global_step": 465562, "epoch": 2771} {"train_loss": -12.556978225708008, "global_step": 465563, "epoch": 2771} {"train_loss": -12.572264671325684, "global_step": 465564, "epoch": 2771} {"train_loss": -12.477550506591797, "global_step": 465565, "epoch": 2771} {"train_loss": -12.815418243408203, "global_step": 465566, "epoch": 2771} {"train_loss": -12.617856979370117, "global_step": 465567, "epoch": 2771} {"train_loss": -12.67975902557373, "global_step": 465568, "epoch": 2771} {"train_loss": -12.694297790527344, "global_step": 465569, "epoch": 2771} {"train_loss": -12.368006706237793, "global_step": 465570, "epoch": 2771} {"train_loss": -12.076093673706055, "global_step": 465571, "epoch": 2771} {"train_loss": -12.683952331542969, "global_step": 465572, "epoch": 2771} {"train_loss": -12.14932918548584, "global_step": 465573, "epoch": 2771} {"train_loss": -12.085958480834961, "global_step": 465574, "epoch": 2771} {"train_loss": -12.542703628540039, "global_step": 465575, "epoch": 2771} {"train_loss": -12.521303176879883, "global_step": 465576, "epoch": 2771} {"train_loss": -12.225971221923828, "global_step": 465577, "epoch": 2771} {"train_loss": -12.246603012084961, "global_step": 465578, "epoch": 2771} {"train_loss": -12.890645980834961, "global_step": 465579, "epoch": 2771} {"train_loss": -11.772263526916504, "global_step": 465580, "epoch": 2771} {"train_loss": -11.641178131103516, "global_step": 465581, "epoch": 2771} {"train_loss": -12.354751586914062, "global_step": 465582, "epoch": 2771} {"train_loss": -12.757465362548828, "global_step": 465583, "epoch": 2771} {"train_loss": -11.887371063232422, "global_step": 465584, "epoch": 2771} {"train_loss": -11.907585144042969, "global_step": 465585, "epoch": 2771} {"train_loss": -12.602590560913086, "global_step": 465586, "epoch": 2771} {"train_loss": -12.3971529006958, "global_step": 465587, "epoch": 2771} {"train_loss": -12.399860382080078, "global_step": 465588, "epoch": 2771} {"train_loss": -12.376800537109375, "global_step": 465589, "epoch": 2771} {"train_loss": -12.409276962280273, "global_step": 465590, "epoch": 2771} {"train_loss": -12.126635551452637, "global_step": 465591, "epoch": 2771} {"train_loss": -12.221853256225586, "global_step": 465592, "epoch": 2771} {"train_loss": -11.866439819335938, "global_step": 465593, "epoch": 2771} {"train_loss": -11.438138008117676, "global_step": 465594, "epoch": 2771} {"train_loss": -12.413330078125, "global_step": 465595, "epoch": 2771} {"train_loss": -11.756919860839844, "global_step": 465596, "epoch": 2771} {"train_loss": -11.042732238769531, "global_step": 465597, "epoch": 2771} {"train_loss": -11.652555465698242, "global_step": 465598, "epoch": 2771} {"train_loss": -11.192694664001465, "global_step": 465599, "epoch": 2771} {"train_loss": -12.045416831970215, "global_step": 465600, "epoch": 2771} {"train_loss": -11.601811408996582, "global_step": 465601, "epoch": 2771} {"train_loss": -10.734464645385742, "global_step": 465602, "epoch": 2771} {"train_loss": -12.110965728759766, "global_step": 465603, "epoch": 2771} {"train_loss": -12.07887077331543, "global_step": 465604, "epoch": 2771} {"train_loss": -11.663714408874512, "global_step": 465605, "epoch": 2771} {"train_loss": -12.091375350952148, "global_step": 465606, "epoch": 2771} {"train_loss": -12.395466804504395, "global_step": 465607, "epoch": 2771} {"train_loss": -11.725570678710938, "global_step": 465608, "epoch": 2771} {"train_loss": -12.222373008728027, "global_step": 465609, "epoch": 2771} {"train_loss": -11.666157722473145, "global_step": 465610, "epoch": 2771} {"train_loss": -11.953058242797852, "global_step": 465611, "epoch": 2771} {"train_loss": -11.690757751464844, "global_step": 465612, "epoch": 2771} {"train_loss": -11.956344604492188, "global_step": 465613, "epoch": 2771} {"train_loss": -12.083070755004883, "global_step": 465614, "epoch": 2771} {"train_loss": -11.337474822998047, "global_step": 465615, "epoch": 2771} {"train_loss": -11.891439437866211, "global_step": 465616, "epoch": 2771} {"train_loss": -12.363619804382324, "global_step": 465617, "epoch": 2771} {"train_loss": -11.886425971984863, "global_step": 465618, "epoch": 2771} {"train_loss": -11.754013061523438, "global_step": 465619, "epoch": 2771} {"train_loss": -11.90916919708252, "global_step": 465620, "epoch": 2771} {"train_loss": -11.531145095825195, "global_step": 465621, "epoch": 2771} {"train_loss": -12.066436767578125, "global_step": 465622, "epoch": 2771} {"train_loss": -11.997264862060547, "global_step": 465623, "epoch": 2771} {"train_loss": -11.44997787475586, "global_step": 465624, "epoch": 2771} {"train_loss": -12.616737365722656, "global_step": 465625, "epoch": 2771} {"train_loss": -11.948609352111816, "global_step": 465626, "epoch": 2771} {"train_loss": -12.30583381652832, "global_step": 465627, "epoch": 2771} {"train_loss": -12.151763916015625, "global_step": 465628, "epoch": 2771} {"train_loss": -12.100411415100098, "global_step": 465629, "epoch": 2771} {"train_loss": -12.373456954956055, "global_step": 465630, "epoch": 2771} {"train_loss": -12.271783828735352, "global_step": 465631, "epoch": 2771} {"train_loss": -12.453177452087402, "global_step": 465632, "epoch": 2771} {"train_loss": -12.439875602722168, "global_step": 465633, "epoch": 2771} {"train_loss": -12.218793869018555, "global_step": 465634, "epoch": 2771} {"train_loss": -12.689142227172852, "global_step": 465635, "epoch": 2771} {"train_loss": -12.262622833251953, "global_step": 465636, "epoch": 2771} {"train_loss": -12.75981330871582, "global_step": 465637, "epoch": 2771} {"train_loss": -12.469244003295898, "global_step": 465638, "epoch": 2771} {"train_loss": -12.515862464904785, "global_step": 465639, "epoch": 2771} {"train_loss": -12.327444076538086, "global_step": 465640, "epoch": 2771} {"train_loss": -12.460250854492188, "global_step": 465641, "epoch": 2771} {"train_loss": -12.574884414672852, "global_step": 465642, "epoch": 2771} {"train_loss": -12.674574851989746, "global_step": 465643, "epoch": 2771} {"train_loss": -12.102807998657227, "global_step": 465644, "epoch": 2771} {"train_loss": -12.035346984863281, "global_step": 465645, "epoch": 2771} {"train_loss": -12.564798355102539, "global_step": 465646, "epoch": 2771} {"train_loss": -11.89605712890625, "global_step": 465647, "epoch": 2771} {"train_loss": -12.807212829589844, "global_step": 465648, "epoch": 2771} {"train_loss": -12.601672172546387, "global_step": 465649, "epoch": 2771} {"train_loss": -12.172637939453125, "global_step": 465650, "epoch": 2771} {"train_loss": -12.42452621459961, "global_step": 465651, "epoch": 2771} {"train_loss": -12.736085891723633, "global_step": 465652, "epoch": 2771} {"train_loss": -12.251957893371582, "global_step": 465653, "epoch": 2771} {"train_loss": -12.281779289245605, "global_step": 465654, "epoch": 2771} {"train_loss": -12.539013862609863, "global_step": 465655, "epoch": 2771} {"train_loss": -12.16288948059082, "global_step": 465656, "epoch": 2771} {"train_loss": -12.569053649902344, "global_step": 465657, "epoch": 2771} {"train_loss": -12.162666320800781, "global_step": 465658, "epoch": 2771} {"train_loss": -12.646200180053711, "global_step": 465659, "epoch": 2771} {"train_loss": -12.043378829956055, "global_step": 465660, "epoch": 2771} {"train_loss": -12.732080459594727, "global_step": 465661, "epoch": 2771} {"train_loss": -12.29029655456543, "global_step": 465662, "epoch": 2771} {"train_loss": -12.418471336364746, "global_step": 465663, "epoch": 2771} {"train_loss": -12.814923286437988, "global_step": 465664, "epoch": 2771} {"train_loss": -12.163165092468262, "global_step": 465665, "epoch": 2771} {"train_loss": -11.635415077209473, "global_step": 465666, "epoch": 2771} {"train_loss": -12.085158348083496, "global_step": 465667, "epoch": 2771} {"train_loss": -11.743824005126953, "global_step": 465668, "epoch": 2771} {"train_loss": -11.668896675109863, "global_step": 465669, "epoch": 2771} {"train_loss": -12.400382995605469, "global_step": 465670, "epoch": 2771} {"train_loss": -11.315914154052734, "global_step": 465671, "epoch": 2771} {"train_loss": -12.418932914733887, "global_step": 465672, "epoch": 2771} {"train_loss": -11.934789657592773, "global_step": 465673, "epoch": 2771} {"train_loss": -12.320951461791992, "global_step": 465674, "epoch": 2771} {"train_loss": -11.340286254882812, "global_step": 465675, "epoch": 2771} {"train_loss": -11.728622436523438, "global_step": 465676, "epoch": 2771} {"train_loss": -11.104290962219238, "global_step": 465677, "epoch": 2771} {"train_loss": -10.620790481567383, "global_step": 465678, "epoch": 2771} {"train_loss": -12.175935745239258, "global_step": 465679, "epoch": 2771} {"train_loss": -11.012389183044434, "global_step": 465680, "epoch": 2771} {"train_loss": -10.745808601379395, "global_step": 465681, "epoch": 2771} {"train_loss": -11.900782585144043, "global_step": 465682, "epoch": 2771} {"train_loss": -11.5640869140625, "global_step": 465683, "epoch": 2771} {"train_loss": -11.896480560302734, "global_step": 465684, "epoch": 2771} {"train_loss": -12.259523391723633, "global_step": 465685, "epoch": 2771} {"train_loss": -11.894037246704102, "global_step": 465686, "epoch": 2771} {"train_loss": -12.200060844421387, "global_step": 465687, "epoch": 2771} {"train_loss": -11.864338874816895, "global_step": 465688, "epoch": 2771} {"train_loss": -12.23652458190918, "global_step": 465689, "epoch": 2771} {"train_loss": -12.554000854492188, "global_step": 465690, "epoch": 2771} {"train_loss": -12.46844482421875, "global_step": 465691, "epoch": 2771} {"train_loss": -12.329358100891113, "global_step": 465692, "epoch": 2771} {"train_loss": -12.580671310424805, "global_step": 465693, "epoch": 2771} {"train_loss": -12.046022415161133, "global_step": 465694, "epoch": 2771} {"train_loss": -12.2439843245915, "global_step": 465695, "epoch": 2771, "val_loss": 317334.09375} {"train_loss": -12.153986930847168, "global_step": 465696, "epoch": 2772} {"train_loss": -12.700124740600586, "global_step": 465697, "epoch": 2772} {"train_loss": -12.375656127929688, "global_step": 465698, "epoch": 2772} {"train_loss": -12.64236068725586, "global_step": 465699, "epoch": 2772} {"train_loss": -12.44391918182373, "global_step": 465700, "epoch": 2772} {"train_loss": -12.648221969604492, "global_step": 465701, "epoch": 2772} {"train_loss": -12.707514762878418, "global_step": 465702, "epoch": 2772} {"train_loss": -12.716333389282227, "global_step": 465703, "epoch": 2772} {"train_loss": -12.677410125732422, "global_step": 465704, "epoch": 2772} {"train_loss": -12.719209671020508, "global_step": 465705, "epoch": 2772} {"train_loss": -12.89844036102295, "global_step": 465706, "epoch": 2772} {"train_loss": -12.646148681640625, "global_step": 465707, "epoch": 2772} {"train_loss": -12.900100708007812, "global_step": 465708, "epoch": 2772} {"train_loss": -12.890677452087402, "global_step": 465709, "epoch": 2772} {"train_loss": -12.586030006408691, "global_step": 465710, "epoch": 2772} {"train_loss": -12.772078514099121, "global_step": 465711, "epoch": 2772} {"train_loss": -12.540708541870117, "global_step": 465712, "epoch": 2772} {"train_loss": -12.801215171813965, "global_step": 465713, "epoch": 2772} {"train_loss": -12.986207962036133, "global_step": 465714, "epoch": 2772} {"train_loss": -12.961645126342773, "global_step": 465715, "epoch": 2772} {"train_loss": -12.884645462036133, "global_step": 465716, "epoch": 2772} {"train_loss": -12.726656913757324, "global_step": 465717, "epoch": 2772} {"train_loss": -12.827348709106445, "global_step": 465718, "epoch": 2772} {"train_loss": -12.672109603881836, "global_step": 465719, "epoch": 2772} {"train_loss": -12.397953033447266, "global_step": 465720, "epoch": 2772} {"train_loss": -12.968805313110352, "global_step": 465721, "epoch": 2772} {"train_loss": -11.832183837890625, "global_step": 465722, "epoch": 2772} {"train_loss": -12.07757568359375, "global_step": 465723, "epoch": 2772} {"train_loss": -12.893180847167969, "global_step": 465724, "epoch": 2772} {"train_loss": -12.390060424804688, "global_step": 465725, "epoch": 2772} {"train_loss": -11.955171585083008, "global_step": 465726, "epoch": 2772} {"train_loss": -13.003744125366211, "global_step": 465727, "epoch": 2772} {"train_loss": -12.3424072265625, "global_step": 465728, "epoch": 2772} {"train_loss": -12.260944366455078, "global_step": 465729, "epoch": 2772} {"train_loss": -12.979528427124023, "global_step": 465730, "epoch": 2772} {"train_loss": -12.705655097961426, "global_step": 465731, "epoch": 2772} {"train_loss": -12.666296005249023, "global_step": 465732, "epoch": 2772} {"train_loss": -12.671875953674316, "global_step": 465733, "epoch": 2772} {"train_loss": -12.760427474975586, "global_step": 465734, "epoch": 2772} {"train_loss": -12.959957122802734, "global_step": 465735, "epoch": 2772} {"train_loss": -12.810311317443848, "global_step": 465736, "epoch": 2772} {"train_loss": -12.979299545288086, "global_step": 465737, "epoch": 2772} {"train_loss": -12.861639022827148, "global_step": 465738, "epoch": 2772} {"train_loss": -12.655248641967773, "global_step": 465739, "epoch": 2772} {"train_loss": -12.824633598327637, "global_step": 465740, "epoch": 2772} {"train_loss": -12.53155517578125, "global_step": 465741, "epoch": 2772} {"train_loss": -12.875402450561523, "global_step": 465742, "epoch": 2772} {"train_loss": -12.775137901306152, "global_step": 465743, "epoch": 2772} {"train_loss": -12.8512601852417, "global_step": 465744, "epoch": 2772} {"train_loss": -12.257863998413086, "global_step": 465745, "epoch": 2772} {"train_loss": -12.100589752197266, "global_step": 465746, "epoch": 2772} {"train_loss": -12.679712295532227, "global_step": 465747, "epoch": 2772} {"train_loss": -12.851044654846191, "global_step": 465748, "epoch": 2772} {"train_loss": -12.660690307617188, "global_step": 465749, "epoch": 2772} {"train_loss": -12.905440330505371, "global_step": 465750, "epoch": 2772} {"train_loss": -12.94542121887207, "global_step": 465751, "epoch": 2772} {"train_loss": -12.665695190429688, "global_step": 465752, "epoch": 2772} {"train_loss": -12.91458797454834, "global_step": 465753, "epoch": 2772} {"train_loss": -12.909423828125, "global_step": 465754, "epoch": 2772} {"train_loss": -12.942605018615723, "global_step": 465755, "epoch": 2772} {"train_loss": -12.694294929504395, "global_step": 465756, "epoch": 2772} {"train_loss": -12.847275733947754, "global_step": 465757, "epoch": 2772} {"train_loss": -12.807849884033203, "global_step": 465758, "epoch": 2772} {"train_loss": -12.466602325439453, "global_step": 465759, "epoch": 2772} {"train_loss": -12.722898483276367, "global_step": 465760, "epoch": 2772} {"train_loss": -12.212946891784668, "global_step": 465761, "epoch": 2772} {"train_loss": -12.708728790283203, "global_step": 465762, "epoch": 2772} {"train_loss": -12.018028259277344, "global_step": 465763, "epoch": 2772} {"train_loss": -12.756855964660645, "global_step": 465764, "epoch": 2772} {"train_loss": -12.10000228881836, "global_step": 465765, "epoch": 2772} {"train_loss": -12.533546447753906, "global_step": 465766, "epoch": 2772} {"train_loss": -12.220990180969238, "global_step": 465767, "epoch": 2772} {"train_loss": -12.742277145385742, "global_step": 465768, "epoch": 2772} {"train_loss": -11.833856582641602, "global_step": 465769, "epoch": 2772} {"train_loss": -12.174793243408203, "global_step": 465770, "epoch": 2772} {"train_loss": -12.041171073913574, "global_step": 465771, "epoch": 2772} {"train_loss": -12.628755569458008, "global_step": 465772, "epoch": 2772} {"train_loss": -12.334219932556152, "global_step": 465773, "epoch": 2772} {"train_loss": -12.839681625366211, "global_step": 465774, "epoch": 2772} {"train_loss": -11.787090301513672, "global_step": 465775, "epoch": 2772} {"train_loss": -11.810087203979492, "global_step": 465776, "epoch": 2772} {"train_loss": -12.115195274353027, "global_step": 465777, "epoch": 2772} {"train_loss": -12.221766471862793, "global_step": 465778, "epoch": 2772} {"train_loss": -12.114416122436523, "global_step": 465779, "epoch": 2772} {"train_loss": -12.428788185119629, "global_step": 465780, "epoch": 2772} {"train_loss": -12.18714714050293, "global_step": 465781, "epoch": 2772} {"train_loss": -12.468199729919434, "global_step": 465782, "epoch": 2772} {"train_loss": -12.718221664428711, "global_step": 465783, "epoch": 2772} {"train_loss": -12.332281112670898, "global_step": 465784, "epoch": 2772} {"train_loss": -11.680900573730469, "global_step": 465785, "epoch": 2772} {"train_loss": -10.116491317749023, "global_step": 465786, "epoch": 2772} {"train_loss": -11.092992782592773, "global_step": 465787, "epoch": 2772} {"train_loss": -11.373245239257812, "global_step": 465788, "epoch": 2772} {"train_loss": -10.88481330871582, "global_step": 465789, "epoch": 2772} {"train_loss": -8.309731483459473, "global_step": 465790, "epoch": 2772} {"train_loss": -10.519561767578125, "global_step": 465791, "epoch": 2772} {"train_loss": -6.561448097229004, "global_step": 465792, "epoch": 2772} {"train_loss": -7.953506946563721, "global_step": 465793, "epoch": 2772} {"train_loss": -6.346963882446289, "global_step": 465794, "epoch": 2772} {"train_loss": -5.824013710021973, "global_step": 465795, "epoch": 2772} {"train_loss": -6.826559543609619, "global_step": 465796, "epoch": 2772} {"train_loss": -6.94757080078125, "global_step": 465797, "epoch": 2772} {"train_loss": -7.041201591491699, "global_step": 465798, "epoch": 2772} {"train_loss": -7.888896942138672, "global_step": 465799, "epoch": 2772} {"train_loss": -7.710651874542236, "global_step": 465800, "epoch": 2772} {"train_loss": -7.212615489959717, "global_step": 465801, "epoch": 2772} {"train_loss": -7.487410545349121, "global_step": 465802, "epoch": 2772} {"train_loss": -8.340351104736328, "global_step": 465803, "epoch": 2772} {"train_loss": -8.443170547485352, "global_step": 465804, "epoch": 2772} {"train_loss": -8.491357803344727, "global_step": 465805, "epoch": 2772} {"train_loss": -8.225666046142578, "global_step": 465806, "epoch": 2772} {"train_loss": -8.707925796508789, "global_step": 465807, "epoch": 2772} {"train_loss": -8.865686416625977, "global_step": 465808, "epoch": 2772} {"train_loss": -8.165124893188477, "global_step": 465809, "epoch": 2772} {"train_loss": -9.473261833190918, "global_step": 465810, "epoch": 2772} {"train_loss": -9.79202938079834, "global_step": 465811, "epoch": 2772} {"train_loss": -9.74630069732666, "global_step": 465812, "epoch": 2772} {"train_loss": -9.452507019042969, "global_step": 465813, "epoch": 2772} {"train_loss": -10.162017822265625, "global_step": 465814, "epoch": 2772} {"train_loss": -10.974878311157227, "global_step": 465815, "epoch": 2772} {"train_loss": -10.715685844421387, "global_step": 465816, "epoch": 2772} {"train_loss": -10.73202133178711, "global_step": 465817, "epoch": 2772} {"train_loss": -11.233181953430176, "global_step": 465818, "epoch": 2772} {"train_loss": -11.408891677856445, "global_step": 465819, "epoch": 2772} {"train_loss": -11.148170471191406, "global_step": 465820, "epoch": 2772} {"train_loss": -11.533413887023926, "global_step": 465821, "epoch": 2772} {"train_loss": -11.199280738830566, "global_step": 465822, "epoch": 2772} {"train_loss": -12.126070022583008, "global_step": 465823, "epoch": 2772} {"train_loss": -11.63595199584961, "global_step": 465824, "epoch": 2772} {"train_loss": -12.165487289428711, "global_step": 465825, "epoch": 2772} {"train_loss": -11.810750007629395, "global_step": 465826, "epoch": 2772} {"train_loss": -11.580904006958008, "global_step": 465827, "epoch": 2772} {"train_loss": -12.006057739257812, "global_step": 465828, "epoch": 2772} {"train_loss": -11.944936752319336, "global_step": 465829, "epoch": 2772} {"train_loss": -12.122143745422363, "global_step": 465830, "epoch": 2772} {"train_loss": -12.116106033325195, "global_step": 465831, "epoch": 2772} {"train_loss": -12.204719543457031, "global_step": 465832, "epoch": 2772} {"train_loss": -11.844709396362305, "global_step": 465833, "epoch": 2772} {"train_loss": -12.102624893188477, "global_step": 465834, "epoch": 2772} {"train_loss": -12.22479248046875, "global_step": 465835, "epoch": 2772} {"train_loss": -12.18916130065918, "global_step": 465836, "epoch": 2772} {"train_loss": -12.543072700500488, "global_step": 465837, "epoch": 2772} {"train_loss": -12.163980484008789, "global_step": 465838, "epoch": 2772} {"train_loss": -12.36063003540039, "global_step": 465839, "epoch": 2772} {"train_loss": -12.150821685791016, "global_step": 465840, "epoch": 2772} {"train_loss": -12.035805702209473, "global_step": 465841, "epoch": 2772} {"train_loss": -12.21119499206543, "global_step": 465842, "epoch": 2772} {"train_loss": -12.070793151855469, "global_step": 465843, "epoch": 2772} {"train_loss": -11.822273254394531, "global_step": 465844, "epoch": 2772} {"train_loss": -12.614624977111816, "global_step": 465845, "epoch": 2772} {"train_loss": -12.518525123596191, "global_step": 465846, "epoch": 2772} {"train_loss": -12.406351089477539, "global_step": 465847, "epoch": 2772} {"train_loss": -12.185640335083008, "global_step": 465848, "epoch": 2772} {"train_loss": -12.06735610961914, "global_step": 465849, "epoch": 2772} {"train_loss": -12.64177131652832, "global_step": 465850, "epoch": 2772} {"train_loss": -12.054924011230469, "global_step": 465851, "epoch": 2772} {"train_loss": -12.377409934997559, "global_step": 465852, "epoch": 2772} {"train_loss": -12.290815353393555, "global_step": 465853, "epoch": 2772} {"train_loss": -11.979181289672852, "global_step": 465854, "epoch": 2772} {"train_loss": -12.41676139831543, "global_step": 465855, "epoch": 2772} {"train_loss": -12.277076721191406, "global_step": 465856, "epoch": 2772} {"train_loss": -12.240901947021484, "global_step": 465857, "epoch": 2772} {"train_loss": -12.285123825073242, "global_step": 465858, "epoch": 2772} {"train_loss": -12.460649490356445, "global_step": 465859, "epoch": 2772} {"train_loss": -12.386987686157227, "global_step": 465860, "epoch": 2772} {"train_loss": -12.399288177490234, "global_step": 465861, "epoch": 2772} {"train_loss": -12.221419334411621, "global_step": 465862, "epoch": 2772} {"train_loss": -11.71350329830533, "global_step": 465863, "epoch": 2772, "val_loss": 312542.9375} {"train_loss": -12.105981826782227, "global_step": 465864, "epoch": 2773} {"train_loss": -12.381349563598633, "global_step": 465865, "epoch": 2773} {"train_loss": -12.442567825317383, "global_step": 465866, "epoch": 2773} {"train_loss": -12.093262672424316, "global_step": 465867, "epoch": 2773} {"train_loss": -12.358699798583984, "global_step": 465868, "epoch": 2773} {"train_loss": -12.123275756835938, "global_step": 465869, "epoch": 2773} {"train_loss": -11.809548377990723, "global_step": 465870, "epoch": 2773} {"train_loss": -12.801605224609375, "global_step": 465871, "epoch": 2773} {"train_loss": -12.10342788696289, "global_step": 465872, "epoch": 2773} {"train_loss": -12.443801879882812, "global_step": 465873, "epoch": 2773} {"train_loss": -12.444314002990723, "global_step": 465874, "epoch": 2773} {"train_loss": -11.722404479980469, "global_step": 465875, "epoch": 2773} {"train_loss": -12.432151794433594, "global_step": 465876, "epoch": 2773} {"train_loss": -11.559677124023438, "global_step": 465877, "epoch": 2773} {"train_loss": -12.20145034790039, "global_step": 465878, "epoch": 2773} {"train_loss": -12.189647674560547, "global_step": 465879, "epoch": 2773} {"train_loss": -12.595647811889648, "global_step": 465880, "epoch": 2773} {"train_loss": -12.294929504394531, "global_step": 465881, "epoch": 2773} {"train_loss": -12.368415832519531, "global_step": 465882, "epoch": 2773} {"train_loss": -12.465802192687988, "global_step": 465883, "epoch": 2773} {"train_loss": -12.615888595581055, "global_step": 465884, "epoch": 2773} {"train_loss": -12.31987476348877, "global_step": 465885, "epoch": 2773} {"train_loss": -12.115577697753906, "global_step": 465886, "epoch": 2773} {"train_loss": -12.424678802490234, "global_step": 465887, "epoch": 2773} {"train_loss": -12.027929306030273, "global_step": 465888, "epoch": 2773} {"train_loss": -11.913209915161133, "global_step": 465889, "epoch": 2773} {"train_loss": -11.838440895080566, "global_step": 465890, "epoch": 2773} {"train_loss": -12.39572525024414, "global_step": 465891, "epoch": 2773} {"train_loss": -11.94786548614502, "global_step": 465892, "epoch": 2773} {"train_loss": -12.538535118103027, "global_step": 465893, "epoch": 2773} {"train_loss": -11.994441032409668, "global_step": 465894, "epoch": 2773} {"train_loss": -12.677289009094238, "global_step": 465895, "epoch": 2773} {"train_loss": -12.207791328430176, "global_step": 465896, "epoch": 2773} {"train_loss": -12.582880020141602, "global_step": 465897, "epoch": 2773} {"train_loss": -12.356107711791992, "global_step": 465898, "epoch": 2773} {"train_loss": -12.565340042114258, "global_step": 465899, "epoch": 2773} {"train_loss": -12.223869323730469, "global_step": 465900, "epoch": 2773} {"train_loss": -12.550610542297363, "global_step": 465901, "epoch": 2773} {"train_loss": -12.331382751464844, "global_step": 465902, "epoch": 2773} {"train_loss": -12.65896987915039, "global_step": 465903, "epoch": 2773} {"train_loss": -12.80274772644043, "global_step": 465904, "epoch": 2773} {"train_loss": -12.338096618652344, "global_step": 465905, "epoch": 2773} {"train_loss": -12.620126724243164, "global_step": 465906, "epoch": 2773} {"train_loss": -12.46838092803955, "global_step": 465907, "epoch": 2773} {"train_loss": -12.658032417297363, "global_step": 465908, "epoch": 2773} {"train_loss": -12.639808654785156, "global_step": 465909, "epoch": 2773} {"train_loss": -12.560890197753906, "global_step": 465910, "epoch": 2773} {"train_loss": -12.752599716186523, "global_step": 465911, "epoch": 2773} {"train_loss": -12.357641220092773, "global_step": 465912, "epoch": 2773} {"train_loss": -12.75288200378418, "global_step": 465913, "epoch": 2773} {"train_loss": -12.572872161865234, "global_step": 465914, "epoch": 2773} {"train_loss": -12.833492279052734, "global_step": 465915, "epoch": 2773} {"train_loss": -12.620576858520508, "global_step": 465916, "epoch": 2773} {"train_loss": -12.464540481567383, "global_step": 465917, "epoch": 2773} {"train_loss": -11.422972679138184, "global_step": 465918, "epoch": 2773} {"train_loss": -12.493819236755371, "global_step": 465919, "epoch": 2773} {"train_loss": -12.40305233001709, "global_step": 465920, "epoch": 2773} {"train_loss": -11.570390701293945, "global_step": 465921, "epoch": 2773} {"train_loss": -12.217373847961426, "global_step": 465922, "epoch": 2773} {"train_loss": -12.202978134155273, "global_step": 465923, "epoch": 2773} {"train_loss": -11.97260856628418, "global_step": 465924, "epoch": 2773} {"train_loss": -11.655128479003906, "global_step": 465925, "epoch": 2773} {"train_loss": -12.687910079956055, "global_step": 465926, "epoch": 2773} {"train_loss": -11.621999740600586, "global_step": 465927, "epoch": 2773} {"train_loss": -12.32046127319336, "global_step": 465928, "epoch": 2773} {"train_loss": -12.20223331451416, "global_step": 465929, "epoch": 2773} {"train_loss": -12.061336517333984, "global_step": 465930, "epoch": 2773} {"train_loss": -11.857358932495117, "global_step": 465931, "epoch": 2773} {"train_loss": -10.117300033569336, "global_step": 465932, "epoch": 2773} {"train_loss": -12.401607513427734, "global_step": 465933, "epoch": 2773} {"train_loss": -10.68232536315918, "global_step": 465934, "epoch": 2773} {"train_loss": -10.80615234375, "global_step": 465935, "epoch": 2773} {"train_loss": -12.294351577758789, "global_step": 465936, "epoch": 2773} {"train_loss": -10.394716262817383, "global_step": 465937, "epoch": 2773} {"train_loss": -10.300420761108398, "global_step": 465938, "epoch": 2773} {"train_loss": -11.770987510681152, "global_step": 465939, "epoch": 2773} {"train_loss": -10.896652221679688, "global_step": 465940, "epoch": 2773} {"train_loss": -11.268943786621094, "global_step": 465941, "epoch": 2773} {"train_loss": -10.2537202835083, "global_step": 465942, "epoch": 2773} {"train_loss": -10.285604476928711, "global_step": 465943, "epoch": 2773} {"train_loss": -10.75879192352295, "global_step": 465944, "epoch": 2773} {"train_loss": -11.83653736114502, "global_step": 465945, "epoch": 2773} {"train_loss": -11.857370376586914, "global_step": 465946, "epoch": 2773} {"train_loss": -12.429431915283203, "global_step": 465947, "epoch": 2773} {"train_loss": -11.802412986755371, "global_step": 465948, "epoch": 2773} {"train_loss": -12.509344100952148, "global_step": 465949, "epoch": 2773} {"train_loss": -11.763504981994629, "global_step": 465950, "epoch": 2773} {"train_loss": -12.042731285095215, "global_step": 465951, "epoch": 2773} {"train_loss": -12.326188087463379, "global_step": 465952, "epoch": 2773} {"train_loss": -12.162552833557129, "global_step": 465953, "epoch": 2773} {"train_loss": -12.488397598266602, "global_step": 465954, "epoch": 2773} {"train_loss": -11.918108940124512, "global_step": 465955, "epoch": 2773} {"train_loss": -12.222785949707031, "global_step": 465956, "epoch": 2773} {"train_loss": -12.291269302368164, "global_step": 465957, "epoch": 2773} {"train_loss": -12.345681190490723, "global_step": 465958, "epoch": 2773} {"train_loss": -12.312620162963867, "global_step": 465959, "epoch": 2773} {"train_loss": -12.228597640991211, "global_step": 465960, "epoch": 2773} {"train_loss": -12.687199592590332, "global_step": 465961, "epoch": 2773} {"train_loss": -12.079829216003418, "global_step": 465962, "epoch": 2773} {"train_loss": -12.499898910522461, "global_step": 465963, "epoch": 2773} {"train_loss": -12.260655403137207, "global_step": 465964, "epoch": 2773} {"train_loss": -12.563312530517578, "global_step": 465965, "epoch": 2773} {"train_loss": -12.352386474609375, "global_step": 465966, "epoch": 2773} {"train_loss": -12.44140911102295, "global_step": 465967, "epoch": 2773} {"train_loss": -12.691062927246094, "global_step": 465968, "epoch": 2773} {"train_loss": -12.317566871643066, "global_step": 465969, "epoch": 2773} {"train_loss": -12.644760131835938, "global_step": 465970, "epoch": 2773} {"train_loss": -12.746694564819336, "global_step": 465971, "epoch": 2773} {"train_loss": -12.451156616210938, "global_step": 465972, "epoch": 2773} {"train_loss": -12.730039596557617, "global_step": 465973, "epoch": 2773} {"train_loss": -12.720885276794434, "global_step": 465974, "epoch": 2773} {"train_loss": -12.813931465148926, "global_step": 465975, "epoch": 2773} {"train_loss": -12.971336364746094, "global_step": 465976, "epoch": 2773} {"train_loss": -12.802007675170898, "global_step": 465977, "epoch": 2773} {"train_loss": -12.906808853149414, "global_step": 465978, "epoch": 2773} {"train_loss": -12.816771507263184, "global_step": 465979, "epoch": 2773} {"train_loss": -12.919365882873535, "global_step": 465980, "epoch": 2773} {"train_loss": -12.765393257141113, "global_step": 465981, "epoch": 2773} {"train_loss": -12.88996696472168, "global_step": 465982, "epoch": 2773} {"train_loss": -12.759425163269043, "global_step": 465983, "epoch": 2773} {"train_loss": -12.907859802246094, "global_step": 465984, "epoch": 2773} {"train_loss": -13.038191795349121, "global_step": 465985, "epoch": 2773} {"train_loss": -12.892789840698242, "global_step": 465986, "epoch": 2773} {"train_loss": -12.879671096801758, "global_step": 465987, "epoch": 2773} {"train_loss": -12.84425163269043, "global_step": 465988, "epoch": 2773} {"train_loss": -13.005629539489746, "global_step": 465989, "epoch": 2773} {"train_loss": -12.85996150970459, "global_step": 465990, "epoch": 2773} {"train_loss": -12.961374282836914, "global_step": 465991, "epoch": 2773} {"train_loss": -12.887811660766602, "global_step": 465992, "epoch": 2773} {"train_loss": -12.705816268920898, "global_step": 465993, "epoch": 2773} {"train_loss": -13.065624237060547, "global_step": 465994, "epoch": 2773} {"train_loss": -12.765792846679688, "global_step": 465995, "epoch": 2773} {"train_loss": -12.774249076843262, "global_step": 465996, "epoch": 2773} {"train_loss": -12.857481002807617, "global_step": 465997, "epoch": 2773} {"train_loss": -12.857677459716797, "global_step": 465998, "epoch": 2773} {"train_loss": -12.759953498840332, "global_step": 465999, "epoch": 2773} {"train_loss": -12.874622344970703, "global_step": 466000, "epoch": 2773} {"train_loss": -13.05514907836914, "global_step": 466001, "epoch": 2773} {"train_loss": -12.915836334228516, "global_step": 466002, "epoch": 2773} {"train_loss": -12.912906646728516, "global_step": 466003, "epoch": 2773} {"train_loss": -12.7808198928833, "global_step": 466004, "epoch": 2773} {"train_loss": -13.108811378479004, "global_step": 466005, "epoch": 2773} {"train_loss": -12.994569778442383, "global_step": 466006, "epoch": 2773} {"train_loss": -12.892572402954102, "global_step": 466007, "epoch": 2773} {"train_loss": -12.839329719543457, "global_step": 466008, "epoch": 2773} {"train_loss": -12.798721313476562, "global_step": 466009, "epoch": 2773} {"train_loss": -12.822795867919922, "global_step": 466010, "epoch": 2773} {"train_loss": -12.877782821655273, "global_step": 466011, "epoch": 2773} {"train_loss": -12.992262840270996, "global_step": 466012, "epoch": 2773} {"train_loss": -12.949315071105957, "global_step": 466013, "epoch": 2773} {"train_loss": -12.720518112182617, "global_step": 466014, "epoch": 2773} {"train_loss": -12.85572624206543, "global_step": 466015, "epoch": 2773} {"train_loss": -13.050882339477539, "global_step": 466016, "epoch": 2773} {"train_loss": -12.757295608520508, "global_step": 466017, "epoch": 2773} {"train_loss": -12.418313026428223, "global_step": 466018, "epoch": 2773} {"train_loss": -12.682901382446289, "global_step": 466019, "epoch": 2773} {"train_loss": -13.134294509887695, "global_step": 466020, "epoch": 2773} {"train_loss": -12.802310943603516, "global_step": 466021, "epoch": 2773} {"train_loss": -11.971864700317383, "global_step": 466022, "epoch": 2773} {"train_loss": -12.41595458984375, "global_step": 466023, "epoch": 2773} {"train_loss": -12.418079376220703, "global_step": 466024, "epoch": 2773} {"train_loss": -12.24793815612793, "global_step": 466025, "epoch": 2773} {"train_loss": -12.257080078125, "global_step": 466026, "epoch": 2773} {"train_loss": -12.104642868041992, "global_step": 466027, "epoch": 2773} {"train_loss": -11.506669044494629, "global_step": 466028, "epoch": 2773} {"train_loss": -11.908231735229492, "global_step": 466029, "epoch": 2773} {"train_loss": -12.127260208129883, "global_step": 466030, "epoch": 2773} {"train_loss": -12.346412982259478, "global_step": 466031, "epoch": 2773, "val_loss": 315815.25} {"train_loss": -12.402334213256836, "global_step": 466032, "epoch": 2774} {"train_loss": -12.471668243408203, "global_step": 466033, "epoch": 2774} {"train_loss": -11.21738052368164, "global_step": 466034, "epoch": 2774} {"train_loss": -11.884466171264648, "global_step": 466035, "epoch": 2774} {"train_loss": -12.685585975646973, "global_step": 466036, "epoch": 2774} {"train_loss": -12.08381462097168, "global_step": 466037, "epoch": 2774} {"train_loss": -12.134435653686523, "global_step": 466038, "epoch": 2774} {"train_loss": -12.639963150024414, "global_step": 466039, "epoch": 2774} {"train_loss": -12.420907974243164, "global_step": 466040, "epoch": 2774} {"train_loss": -11.76957893371582, "global_step": 466041, "epoch": 2774} {"train_loss": -12.4871244430542, "global_step": 466042, "epoch": 2774} {"train_loss": -12.569282531738281, "global_step": 466043, "epoch": 2774} {"train_loss": -12.499863624572754, "global_step": 466044, "epoch": 2774} {"train_loss": -12.60262680053711, "global_step": 466045, "epoch": 2774} {"train_loss": -12.230840682983398, "global_step": 466046, "epoch": 2774} {"train_loss": -12.723660469055176, "global_step": 466047, "epoch": 2774} {"train_loss": -12.401066780090332, "global_step": 466048, "epoch": 2774} {"train_loss": -12.61785888671875, "global_step": 466049, "epoch": 2774} {"train_loss": -12.175615310668945, "global_step": 466050, "epoch": 2774} {"train_loss": -12.505560874938965, "global_step": 466051, "epoch": 2774} {"train_loss": -12.092353820800781, "global_step": 466052, "epoch": 2774} {"train_loss": -11.852073669433594, "global_step": 466053, "epoch": 2774} {"train_loss": -12.697275161743164, "global_step": 466054, "epoch": 2774} {"train_loss": -11.463281631469727, "global_step": 466055, "epoch": 2774} {"train_loss": -12.103271484375, "global_step": 466056, "epoch": 2774} {"train_loss": -12.639344215393066, "global_step": 466057, "epoch": 2774} {"train_loss": -12.608302116394043, "global_step": 466058, "epoch": 2774} {"train_loss": -11.559097290039062, "global_step": 466059, "epoch": 2774} {"train_loss": -11.955423355102539, "global_step": 466060, "epoch": 2774} {"train_loss": -11.289251327514648, "global_step": 466061, "epoch": 2774} {"train_loss": -11.341903686523438, "global_step": 466062, "epoch": 2774} {"train_loss": -11.558868408203125, "global_step": 466063, "epoch": 2774} {"train_loss": -11.37082290649414, "global_step": 466064, "epoch": 2774} {"train_loss": -11.835639953613281, "global_step": 466065, "epoch": 2774} {"train_loss": -12.177181243896484, "global_step": 466066, "epoch": 2774} {"train_loss": -11.988029479980469, "global_step": 466067, "epoch": 2774} {"train_loss": -11.114395141601562, "global_step": 466068, "epoch": 2774} {"train_loss": -12.203639030456543, "global_step": 466069, "epoch": 2774} {"train_loss": -11.217909812927246, "global_step": 466070, "epoch": 2774} {"train_loss": -11.500426292419434, "global_step": 466071, "epoch": 2774} {"train_loss": -11.919923782348633, "global_step": 466072, "epoch": 2774} {"train_loss": -11.521781921386719, "global_step": 466073, "epoch": 2774} {"train_loss": -12.086889266967773, "global_step": 466074, "epoch": 2774} {"train_loss": -10.893835067749023, "global_step": 466075, "epoch": 2774} {"train_loss": -12.430618286132812, "global_step": 466076, "epoch": 2774} {"train_loss": -10.455224990844727, "global_step": 466077, "epoch": 2774} {"train_loss": -11.53765869140625, "global_step": 466078, "epoch": 2774} {"train_loss": -9.83102798461914, "global_step": 466079, "epoch": 2774} {"train_loss": -8.245302200317383, "global_step": 466080, "epoch": 2774} {"train_loss": -8.972074508666992, "global_step": 466081, "epoch": 2774} {"train_loss": -10.289134979248047, "global_step": 466082, "epoch": 2774} {"train_loss": -11.278182029724121, "global_step": 466083, "epoch": 2774} {"train_loss": -7.329558372497559, "global_step": 466084, "epoch": 2774} {"train_loss": -8.419897079467773, "global_step": 466085, "epoch": 2774} {"train_loss": -11.398780822753906, "global_step": 466086, "epoch": 2774} {"train_loss": -8.12004566192627, "global_step": 466087, "epoch": 2774} {"train_loss": -9.076656341552734, "global_step": 466088, "epoch": 2774} {"train_loss": -10.460021018981934, "global_step": 466089, "epoch": 2774} {"train_loss": -9.96395206451416, "global_step": 466090, "epoch": 2774} {"train_loss": -9.795255661010742, "global_step": 466091, "epoch": 2774} {"train_loss": -10.928272247314453, "global_step": 466092, "epoch": 2774} {"train_loss": -10.122669219970703, "global_step": 466093, "epoch": 2774} {"train_loss": -10.945584297180176, "global_step": 466094, "epoch": 2774} {"train_loss": -9.778915405273438, "global_step": 466095, "epoch": 2774} {"train_loss": -10.700864791870117, "global_step": 466096, "epoch": 2774} {"train_loss": -9.611028671264648, "global_step": 466097, "epoch": 2774} {"train_loss": -11.020346641540527, "global_step": 466098, "epoch": 2774} {"train_loss": -9.428441047668457, "global_step": 466099, "epoch": 2774} {"train_loss": -11.388871192932129, "global_step": 466100, "epoch": 2774} {"train_loss": -9.405919075012207, "global_step": 466101, "epoch": 2774} {"train_loss": -11.802434921264648, "global_step": 466102, "epoch": 2774} {"train_loss": -10.035980224609375, "global_step": 466103, "epoch": 2774} {"train_loss": -11.10512924194336, "global_step": 466104, "epoch": 2774} {"train_loss": -11.177608489990234, "global_step": 466105, "epoch": 2774} {"train_loss": -11.411958694458008, "global_step": 466106, "epoch": 2774} {"train_loss": -11.666379928588867, "global_step": 466107, "epoch": 2774} {"train_loss": -10.822627067565918, "global_step": 466108, "epoch": 2774} {"train_loss": -12.210126876831055, "global_step": 466109, "epoch": 2774} {"train_loss": -10.988428115844727, "global_step": 466110, "epoch": 2774} {"train_loss": -12.016357421875, "global_step": 466111, "epoch": 2774} {"train_loss": -11.332338333129883, "global_step": 466112, "epoch": 2774} {"train_loss": -11.070535659790039, "global_step": 466113, "epoch": 2774} {"train_loss": -11.194605827331543, "global_step": 466114, "epoch": 2774} {"train_loss": -11.575353622436523, "global_step": 466115, "epoch": 2774} {"train_loss": -10.436077117919922, "global_step": 466116, "epoch": 2774} {"train_loss": -11.964554786682129, "global_step": 466117, "epoch": 2774} {"train_loss": -10.749090194702148, "global_step": 466118, "epoch": 2774} {"train_loss": -11.536067008972168, "global_step": 466119, "epoch": 2774} {"train_loss": -11.026566505432129, "global_step": 466120, "epoch": 2774} {"train_loss": -11.162416458129883, "global_step": 466121, "epoch": 2774} {"train_loss": -10.589999198913574, "global_step": 466122, "epoch": 2774} {"train_loss": -12.000786781311035, "global_step": 466123, "epoch": 2774} {"train_loss": -10.752537727355957, "global_step": 466124, "epoch": 2774} {"train_loss": -11.123003959655762, "global_step": 466125, "epoch": 2774} {"train_loss": -11.25363540649414, "global_step": 466126, "epoch": 2774} {"train_loss": -11.311717987060547, "global_step": 466127, "epoch": 2774} {"train_loss": -11.262245178222656, "global_step": 466128, "epoch": 2774} {"train_loss": -11.803366661071777, "global_step": 466129, "epoch": 2774} {"train_loss": -11.753698348999023, "global_step": 466130, "epoch": 2774} {"train_loss": -10.93217945098877, "global_step": 466131, "epoch": 2774} {"train_loss": -12.054030418395996, "global_step": 466132, "epoch": 2774} {"train_loss": -11.406518936157227, "global_step": 466133, "epoch": 2774} {"train_loss": -11.51038646697998, "global_step": 466134, "epoch": 2774} {"train_loss": -11.51197624206543, "global_step": 466135, "epoch": 2774} {"train_loss": -12.125341415405273, "global_step": 466136, "epoch": 2774} {"train_loss": -11.495450973510742, "global_step": 466137, "epoch": 2774} {"train_loss": -11.934606552124023, "global_step": 466138, "epoch": 2774} {"train_loss": -11.611793518066406, "global_step": 466139, "epoch": 2774} {"train_loss": -11.51809310913086, "global_step": 466140, "epoch": 2774} {"train_loss": -12.06089973449707, "global_step": 466141, "epoch": 2774} {"train_loss": -11.531085968017578, "global_step": 466142, "epoch": 2774} {"train_loss": -11.761821746826172, "global_step": 466143, "epoch": 2774} {"train_loss": -11.733716011047363, "global_step": 466144, "epoch": 2774} {"train_loss": -12.208842277526855, "global_step": 466145, "epoch": 2774} {"train_loss": -11.93270492553711, "global_step": 466146, "epoch": 2774} {"train_loss": -12.084860801696777, "global_step": 466147, "epoch": 2774} {"train_loss": -11.953774452209473, "global_step": 466148, "epoch": 2774} {"train_loss": -12.159318923950195, "global_step": 466149, "epoch": 2774} {"train_loss": -12.24818229675293, "global_step": 466150, "epoch": 2774} {"train_loss": -12.198320388793945, "global_step": 466151, "epoch": 2774} {"train_loss": -12.173957824707031, "global_step": 466152, "epoch": 2774} {"train_loss": -12.299840927124023, "global_step": 466153, "epoch": 2774} {"train_loss": -12.29973030090332, "global_step": 466154, "epoch": 2774} {"train_loss": -11.836320877075195, "global_step": 466155, "epoch": 2774} {"train_loss": -12.358787536621094, "global_step": 466156, "epoch": 2774} {"train_loss": -12.259931564331055, "global_step": 466157, "epoch": 2774} {"train_loss": -12.464706420898438, "global_step": 466158, "epoch": 2774} {"train_loss": -12.16961669921875, "global_step": 466159, "epoch": 2774} {"train_loss": -12.490493774414062, "global_step": 466160, "epoch": 2774} {"train_loss": -12.576221466064453, "global_step": 466161, "epoch": 2774} {"train_loss": -12.51807975769043, "global_step": 466162, "epoch": 2774} {"train_loss": -12.518976211547852, "global_step": 466163, "epoch": 2774} {"train_loss": -12.49162483215332, "global_step": 466164, "epoch": 2774} {"train_loss": -12.628626823425293, "global_step": 466165, "epoch": 2774} {"train_loss": -12.381623268127441, "global_step": 466166, "epoch": 2774} {"train_loss": -12.41862964630127, "global_step": 466167, "epoch": 2774} {"train_loss": -12.504572868347168, "global_step": 466168, "epoch": 2774} {"train_loss": -12.713447570800781, "global_step": 466169, "epoch": 2774} {"train_loss": -12.460748672485352, "global_step": 466170, "epoch": 2774} {"train_loss": -12.561698913574219, "global_step": 466171, "epoch": 2774} {"train_loss": -12.386507987976074, "global_step": 466172, "epoch": 2774} {"train_loss": -12.802669525146484, "global_step": 466173, "epoch": 2774} {"train_loss": -12.434263229370117, "global_step": 466174, "epoch": 2774} {"train_loss": -12.645666122436523, "global_step": 466175, "epoch": 2774} {"train_loss": -12.74321460723877, "global_step": 466176, "epoch": 2774} {"train_loss": -12.524887084960938, "global_step": 466177, "epoch": 2774} {"train_loss": -12.598735809326172, "global_step": 466178, "epoch": 2774} {"train_loss": -12.66740608215332, "global_step": 466179, "epoch": 2774} {"train_loss": -12.405743598937988, "global_step": 466180, "epoch": 2774} {"train_loss": -12.516155242919922, "global_step": 466181, "epoch": 2774} {"train_loss": -12.570646286010742, "global_step": 466182, "epoch": 2774} {"train_loss": -12.530572891235352, "global_step": 466183, "epoch": 2774} {"train_loss": -12.788665771484375, "global_step": 466184, "epoch": 2774} {"train_loss": -12.576690673828125, "global_step": 466185, "epoch": 2774} {"train_loss": -12.536678314208984, "global_step": 466186, "epoch": 2774} {"train_loss": -12.594852447509766, "global_step": 466187, "epoch": 2774} {"train_loss": -12.666272163391113, "global_step": 466188, "epoch": 2774} {"train_loss": -12.805779457092285, "global_step": 466189, "epoch": 2774} {"train_loss": -12.852447509765625, "global_step": 466190, "epoch": 2774} {"train_loss": -12.832850456237793, "global_step": 466191, "epoch": 2774} {"train_loss": -12.674901962280273, "global_step": 466192, "epoch": 2774} {"train_loss": -12.605615615844727, "global_step": 466193, "epoch": 2774} {"train_loss": -12.68404769897461, "global_step": 466194, "epoch": 2774} {"train_loss": -12.64640998840332, "global_step": 466195, "epoch": 2774} {"train_loss": -12.703367233276367, "global_step": 466196, "epoch": 2774} {"train_loss": -12.740653991699219, "global_step": 466197, "epoch": 2774} {"train_loss": -12.762146949768066, "global_step": 466198, "epoch": 2774} {"train_loss": -11.712130540893192, "global_step": 466199, "epoch": 2774, "val_loss": 309495.9375} {"train_loss": -12.680316925048828, "global_step": 466200, "epoch": 2775} {"train_loss": -12.727867126464844, "global_step": 466201, "epoch": 2775} {"train_loss": -12.698091506958008, "global_step": 466202, "epoch": 2775} {"train_loss": -12.831077575683594, "global_step": 466203, "epoch": 2775} {"train_loss": -12.900285720825195, "global_step": 466204, "epoch": 2775} {"train_loss": -12.86729621887207, "global_step": 466205, "epoch": 2775} {"train_loss": -12.795971870422363, "global_step": 466206, "epoch": 2775} {"train_loss": -12.736509323120117, "global_step": 466207, "epoch": 2775} {"train_loss": -12.783172607421875, "global_step": 466208, "epoch": 2775} {"train_loss": -12.971610069274902, "global_step": 466209, "epoch": 2775} {"train_loss": -13.058077812194824, "global_step": 466210, "epoch": 2775} {"train_loss": -12.762649536132812, "global_step": 466211, "epoch": 2775} {"train_loss": -12.878206253051758, "global_step": 466212, "epoch": 2775} {"train_loss": -12.860894203186035, "global_step": 466213, "epoch": 2775} {"train_loss": -12.724392890930176, "global_step": 466214, "epoch": 2775} {"train_loss": -12.710699081420898, "global_step": 466215, "epoch": 2775} {"train_loss": -12.826601028442383, "global_step": 466216, "epoch": 2775} {"train_loss": -12.961791038513184, "global_step": 466217, "epoch": 2775} {"train_loss": -12.647186279296875, "global_step": 466218, "epoch": 2775} {"train_loss": -12.675117492675781, "global_step": 466219, "epoch": 2775} {"train_loss": -12.935526847839355, "global_step": 466220, "epoch": 2775} {"train_loss": -12.684091567993164, "global_step": 466221, "epoch": 2775} {"train_loss": -12.761761665344238, "global_step": 466222, "epoch": 2775} {"train_loss": -12.640077590942383, "global_step": 466223, "epoch": 2775} {"train_loss": -12.936219215393066, "global_step": 466224, "epoch": 2775} {"train_loss": -12.680667877197266, "global_step": 466225, "epoch": 2775} {"train_loss": -12.989202499389648, "global_step": 466226, "epoch": 2775} {"train_loss": -12.809600830078125, "global_step": 466227, "epoch": 2775} {"train_loss": -13.055925369262695, "global_step": 466228, "epoch": 2775} {"train_loss": -12.756109237670898, "global_step": 466229, "epoch": 2775} {"train_loss": -12.78512191772461, "global_step": 466230, "epoch": 2775} {"train_loss": -12.678855895996094, "global_step": 466231, "epoch": 2775} {"train_loss": -12.998021125793457, "global_step": 466232, "epoch": 2775} {"train_loss": -12.633638381958008, "global_step": 466233, "epoch": 2775} {"train_loss": -11.936575889587402, "global_step": 466234, "epoch": 2775} {"train_loss": -12.596771240234375, "global_step": 466235, "epoch": 2775} {"train_loss": -13.01652717590332, "global_step": 466236, "epoch": 2775} {"train_loss": -12.168047904968262, "global_step": 466237, "epoch": 2775} {"train_loss": -11.553915977478027, "global_step": 466238, "epoch": 2775} {"train_loss": -12.634126663208008, "global_step": 466239, "epoch": 2775} {"train_loss": -11.699861526489258, "global_step": 466240, "epoch": 2775} {"train_loss": -12.423320770263672, "global_step": 466241, "epoch": 2775} {"train_loss": -11.787792205810547, "global_step": 466242, "epoch": 2775} {"train_loss": -12.0784330368042, "global_step": 466243, "epoch": 2775} {"train_loss": -11.906847953796387, "global_step": 466244, "epoch": 2775} {"train_loss": -12.25942611694336, "global_step": 466245, "epoch": 2775} {"train_loss": -11.96232795715332, "global_step": 466246, "epoch": 2775} {"train_loss": -11.65024471282959, "global_step": 466247, "epoch": 2775} {"train_loss": -11.685928344726562, "global_step": 466248, "epoch": 2775} {"train_loss": -11.848461151123047, "global_step": 466249, "epoch": 2775} {"train_loss": -11.704227447509766, "global_step": 466250, "epoch": 2775} {"train_loss": -11.935528755187988, "global_step": 466251, "epoch": 2775} {"train_loss": -11.415789604187012, "global_step": 466252, "epoch": 2775} {"train_loss": -11.591205596923828, "global_step": 466253, "epoch": 2775} {"train_loss": -11.980035781860352, "global_step": 466254, "epoch": 2775} {"train_loss": -11.55517864227295, "global_step": 466255, "epoch": 2775} {"train_loss": -11.372621536254883, "global_step": 466256, "epoch": 2775} {"train_loss": -12.122838020324707, "global_step": 466257, "epoch": 2775} {"train_loss": -10.944456100463867, "global_step": 466258, "epoch": 2775} {"train_loss": -12.149486541748047, "global_step": 466259, "epoch": 2775} {"train_loss": -11.669649124145508, "global_step": 466260, "epoch": 2775} {"train_loss": -11.482542991638184, "global_step": 466261, "epoch": 2775} {"train_loss": -11.46977424621582, "global_step": 466262, "epoch": 2775} {"train_loss": -12.424253463745117, "global_step": 466263, "epoch": 2775} {"train_loss": -11.249849319458008, "global_step": 466264, "epoch": 2775} {"train_loss": -12.263065338134766, "global_step": 466265, "epoch": 2775} {"train_loss": -11.038214683532715, "global_step": 466266, "epoch": 2775} {"train_loss": -11.953218460083008, "global_step": 466267, "epoch": 2775} {"train_loss": -11.624762535095215, "global_step": 466268, "epoch": 2775} {"train_loss": -11.293964385986328, "global_step": 466269, "epoch": 2775} {"train_loss": -11.016440391540527, "global_step": 466270, "epoch": 2775} {"train_loss": -11.509760856628418, "global_step": 466271, "epoch": 2775} {"train_loss": -10.705650329589844, "global_step": 466272, "epoch": 2775} {"train_loss": -11.423770904541016, "global_step": 466273, "epoch": 2775} {"train_loss": -11.55758285522461, "global_step": 466274, "epoch": 2775} {"train_loss": -10.582391738891602, "global_step": 466275, "epoch": 2775} {"train_loss": -11.710187911987305, "global_step": 466276, "epoch": 2775} {"train_loss": -10.562824249267578, "global_step": 466277, "epoch": 2775} {"train_loss": -11.239127159118652, "global_step": 466278, "epoch": 2775} {"train_loss": -11.50473403930664, "global_step": 466279, "epoch": 2775} {"train_loss": -10.27873420715332, "global_step": 466280, "epoch": 2775} {"train_loss": -12.118576049804688, "global_step": 466281, "epoch": 2775} {"train_loss": -11.005752563476562, "global_step": 466282, "epoch": 2775} {"train_loss": -12.263336181640625, "global_step": 466283, "epoch": 2775} {"train_loss": -11.32246208190918, "global_step": 466284, "epoch": 2775} {"train_loss": -12.361589431762695, "global_step": 466285, "epoch": 2775} {"train_loss": -11.560331344604492, "global_step": 466286, "epoch": 2775} {"train_loss": -12.151747703552246, "global_step": 466287, "epoch": 2775} {"train_loss": -12.084243774414062, "global_step": 466288, "epoch": 2775} {"train_loss": -11.802879333496094, "global_step": 466289, "epoch": 2775} {"train_loss": -11.906386375427246, "global_step": 466290, "epoch": 2775} {"train_loss": -12.142173767089844, "global_step": 466291, "epoch": 2775} {"train_loss": -12.048189163208008, "global_step": 466292, "epoch": 2775} {"train_loss": -11.370710372924805, "global_step": 466293, "epoch": 2775} {"train_loss": -12.081544876098633, "global_step": 466294, "epoch": 2775} {"train_loss": -11.728328704833984, "global_step": 466295, "epoch": 2775} {"train_loss": -12.24825668334961, "global_step": 466296, "epoch": 2775} {"train_loss": -11.786722183227539, "global_step": 466297, "epoch": 2775} {"train_loss": -11.960293769836426, "global_step": 466298, "epoch": 2775} {"train_loss": -12.3289794921875, "global_step": 466299, "epoch": 2775} {"train_loss": -11.992677688598633, "global_step": 466300, "epoch": 2775} {"train_loss": -12.352315902709961, "global_step": 466301, "epoch": 2775} {"train_loss": -11.959345817565918, "global_step": 466302, "epoch": 2775} {"train_loss": -12.588888168334961, "global_step": 466303, "epoch": 2775} {"train_loss": -11.758526802062988, "global_step": 466304, "epoch": 2775} {"train_loss": -11.893224716186523, "global_step": 466305, "epoch": 2775} {"train_loss": -12.027231216430664, "global_step": 466306, "epoch": 2775} {"train_loss": -11.72685432434082, "global_step": 466307, "epoch": 2775} {"train_loss": -12.302734375, "global_step": 466308, "epoch": 2775} {"train_loss": -12.160697937011719, "global_step": 466309, "epoch": 2775} {"train_loss": -12.393815994262695, "global_step": 466310, "epoch": 2775} {"train_loss": -11.92910385131836, "global_step": 466311, "epoch": 2775} {"train_loss": -12.077133178710938, "global_step": 466312, "epoch": 2775} {"train_loss": -12.076911926269531, "global_step": 466313, "epoch": 2775} {"train_loss": -12.085151672363281, "global_step": 466314, "epoch": 2775} {"train_loss": -12.424654960632324, "global_step": 466315, "epoch": 2775} {"train_loss": -11.763660430908203, "global_step": 466316, "epoch": 2775} {"train_loss": -12.46929931640625, "global_step": 466317, "epoch": 2775} {"train_loss": -11.988767623901367, "global_step": 466318, "epoch": 2775} {"train_loss": -11.173757553100586, "global_step": 466319, "epoch": 2775} {"train_loss": -11.245185852050781, "global_step": 466320, "epoch": 2775} {"train_loss": -11.290786743164062, "global_step": 466321, "epoch": 2775} {"train_loss": -11.814170837402344, "global_step": 466322, "epoch": 2775} {"train_loss": -11.647454261779785, "global_step": 466323, "epoch": 2775} {"train_loss": -12.329605102539062, "global_step": 466324, "epoch": 2775} {"train_loss": -11.678621292114258, "global_step": 466325, "epoch": 2775} {"train_loss": -11.918603897094727, "global_step": 466326, "epoch": 2775} {"train_loss": -11.877559661865234, "global_step": 466327, "epoch": 2775} {"train_loss": -11.793848037719727, "global_step": 466328, "epoch": 2775} {"train_loss": -11.795642852783203, "global_step": 466329, "epoch": 2775} {"train_loss": -11.99342155456543, "global_step": 466330, "epoch": 2775} {"train_loss": -11.689285278320312, "global_step": 466331, "epoch": 2775} {"train_loss": -12.261159896850586, "global_step": 466332, "epoch": 2775} {"train_loss": -11.854537010192871, "global_step": 466333, "epoch": 2775} {"train_loss": -12.024676322937012, "global_step": 466334, "epoch": 2775} {"train_loss": -11.941929817199707, "global_step": 466335, "epoch": 2775} {"train_loss": -12.000459671020508, "global_step": 466336, "epoch": 2775} {"train_loss": -12.080694198608398, "global_step": 466337, "epoch": 2775} {"train_loss": -12.179037094116211, "global_step": 466338, "epoch": 2775} {"train_loss": -12.153444290161133, "global_step": 466339, "epoch": 2775} {"train_loss": -12.209355354309082, "global_step": 466340, "epoch": 2775} {"train_loss": -12.371505737304688, "global_step": 466341, "epoch": 2775} {"train_loss": -12.262596130371094, "global_step": 466342, "epoch": 2775} {"train_loss": -12.099693298339844, "global_step": 466343, "epoch": 2775} {"train_loss": -12.236885070800781, "global_step": 466344, "epoch": 2775} {"train_loss": -11.737608909606934, "global_step": 466345, "epoch": 2775} {"train_loss": -12.021759033203125, "global_step": 466346, "epoch": 2775} {"train_loss": -12.026565551757812, "global_step": 466347, "epoch": 2775} {"train_loss": -11.794473648071289, "global_step": 466348, "epoch": 2775} {"train_loss": -12.319677352905273, "global_step": 466349, "epoch": 2775} {"train_loss": -11.882375717163086, "global_step": 466350, "epoch": 2775} {"train_loss": -12.042837142944336, "global_step": 466351, "epoch": 2775} {"train_loss": -12.556562423706055, "global_step": 466352, "epoch": 2775} {"train_loss": -12.126983642578125, "global_step": 466353, "epoch": 2775} {"train_loss": -12.226839065551758, "global_step": 466354, "epoch": 2775} {"train_loss": -12.004351615905762, "global_step": 466355, "epoch": 2775} {"train_loss": -12.409905433654785, "global_step": 466356, "epoch": 2775} {"train_loss": -12.391252517700195, "global_step": 466357, "epoch": 2775} {"train_loss": -12.097469329833984, "global_step": 466358, "epoch": 2775} {"train_loss": -12.243005752563477, "global_step": 466359, "epoch": 2775} {"train_loss": -12.277753829956055, "global_step": 466360, "epoch": 2775} {"train_loss": -12.417512893676758, "global_step": 466361, "epoch": 2775} {"train_loss": -12.032428741455078, "global_step": 466362, "epoch": 2775} {"train_loss": -12.173238754272461, "global_step": 466363, "epoch": 2775} {"train_loss": -11.686015129089355, "global_step": 466364, "epoch": 2775} {"train_loss": -12.558921813964844, "global_step": 466365, "epoch": 2775} {"train_loss": -12.024934768676758, "global_step": 466366, "epoch": 2775} {"train_loss": -12.081506808598837, "global_step": 466367, "epoch": 2775, "val_loss": 310597.71875, "train_action_mse_error": 1.2937602996826172} {"train_loss": -12.708536148071289, "global_step": 466368, "epoch": 2776} {"train_loss": -12.227933883666992, "global_step": 466369, "epoch": 2776} {"train_loss": -12.506450653076172, "global_step": 466370, "epoch": 2776} {"train_loss": -11.894804954528809, "global_step": 466371, "epoch": 2776} {"train_loss": -12.307010650634766, "global_step": 466372, "epoch": 2776} {"train_loss": -12.39311408996582, "global_step": 466373, "epoch": 2776} {"train_loss": -12.48145580291748, "global_step": 466374, "epoch": 2776} {"train_loss": -12.258264541625977, "global_step": 466375, "epoch": 2776} {"train_loss": -12.499267578125, "global_step": 466376, "epoch": 2776} {"train_loss": -12.446975708007812, "global_step": 466377, "epoch": 2776} {"train_loss": -12.303085327148438, "global_step": 466378, "epoch": 2776} {"train_loss": -12.766023635864258, "global_step": 466379, "epoch": 2776} {"train_loss": -12.429878234863281, "global_step": 466380, "epoch": 2776} {"train_loss": -12.522640228271484, "global_step": 466381, "epoch": 2776} {"train_loss": -12.732223510742188, "global_step": 466382, "epoch": 2776} {"train_loss": -12.627969741821289, "global_step": 466383, "epoch": 2776} {"train_loss": -12.613114356994629, "global_step": 466384, "epoch": 2776} {"train_loss": -12.52708625793457, "global_step": 466385, "epoch": 2776} {"train_loss": -12.517269134521484, "global_step": 466386, "epoch": 2776} {"train_loss": -12.453534126281738, "global_step": 466387, "epoch": 2776} {"train_loss": -12.403892517089844, "global_step": 466388, "epoch": 2776} {"train_loss": -12.175727844238281, "global_step": 466389, "epoch": 2776} {"train_loss": -12.117166519165039, "global_step": 466390, "epoch": 2776} {"train_loss": -12.323232650756836, "global_step": 466391, "epoch": 2776} {"train_loss": -12.454635620117188, "global_step": 466392, "epoch": 2776} {"train_loss": -12.230647087097168, "global_step": 466393, "epoch": 2776} {"train_loss": -12.161226272583008, "global_step": 466394, "epoch": 2776} {"train_loss": -12.498779296875, "global_step": 466395, "epoch": 2776} {"train_loss": -12.35780143737793, "global_step": 466396, "epoch": 2776} {"train_loss": -12.645751953125, "global_step": 466397, "epoch": 2776} {"train_loss": -11.817749977111816, "global_step": 466398, "epoch": 2776} {"train_loss": -12.577746391296387, "global_step": 466399, "epoch": 2776} {"train_loss": -12.42427921295166, "global_step": 466400, "epoch": 2776} {"train_loss": -12.446463584899902, "global_step": 466401, "epoch": 2776} {"train_loss": -12.501602172851562, "global_step": 466402, "epoch": 2776} {"train_loss": -12.678621292114258, "global_step": 466403, "epoch": 2776} {"train_loss": -12.513718605041504, "global_step": 466404, "epoch": 2776} {"train_loss": -12.376527786254883, "global_step": 466405, "epoch": 2776} {"train_loss": -12.504858016967773, "global_step": 466406, "epoch": 2776} {"train_loss": -12.124817848205566, "global_step": 466407, "epoch": 2776} {"train_loss": -12.035605430603027, "global_step": 466408, "epoch": 2776} {"train_loss": -12.018308639526367, "global_step": 466409, "epoch": 2776} {"train_loss": -12.11555290222168, "global_step": 466410, "epoch": 2776} {"train_loss": -12.301936149597168, "global_step": 466411, "epoch": 2776} {"train_loss": -12.272918701171875, "global_step": 466412, "epoch": 2776} {"train_loss": -11.619830131530762, "global_step": 466413, "epoch": 2776} {"train_loss": -12.34007453918457, "global_step": 466414, "epoch": 2776} {"train_loss": -12.001840591430664, "global_step": 466415, "epoch": 2776} {"train_loss": -12.64086627960205, "global_step": 466416, "epoch": 2776} {"train_loss": -11.805143356323242, "global_step": 466417, "epoch": 2776} {"train_loss": -12.42300796508789, "global_step": 466418, "epoch": 2776} {"train_loss": -12.151187896728516, "global_step": 466419, "epoch": 2776} {"train_loss": -12.48557186126709, "global_step": 466420, "epoch": 2776} {"train_loss": -12.289718627929688, "global_step": 466421, "epoch": 2776} {"train_loss": -12.26468563079834, "global_step": 466422, "epoch": 2776} {"train_loss": -12.289859771728516, "global_step": 466423, "epoch": 2776} {"train_loss": -12.70331859588623, "global_step": 466424, "epoch": 2776} {"train_loss": -11.91928768157959, "global_step": 466425, "epoch": 2776} {"train_loss": -12.051309585571289, "global_step": 466426, "epoch": 2776} {"train_loss": -12.531240463256836, "global_step": 466427, "epoch": 2776} {"train_loss": -12.421135902404785, "global_step": 466428, "epoch": 2776} {"train_loss": -11.852034568786621, "global_step": 466429, "epoch": 2776} {"train_loss": -12.236065864562988, "global_step": 466430, "epoch": 2776} {"train_loss": -12.494481086730957, "global_step": 466431, "epoch": 2776} {"train_loss": -12.673090934753418, "global_step": 466432, "epoch": 2776} {"train_loss": -11.971026420593262, "global_step": 466433, "epoch": 2776} {"train_loss": -12.745091438293457, "global_step": 466434, "epoch": 2776} {"train_loss": -12.266630172729492, "global_step": 466435, "epoch": 2776} {"train_loss": -12.496115684509277, "global_step": 466436, "epoch": 2776} {"train_loss": -12.414104461669922, "global_step": 466437, "epoch": 2776} {"train_loss": -12.668096542358398, "global_step": 466438, "epoch": 2776} {"train_loss": -12.156484603881836, "global_step": 466439, "epoch": 2776} {"train_loss": -12.792976379394531, "global_step": 466440, "epoch": 2776} {"train_loss": -12.201234817504883, "global_step": 466441, "epoch": 2776} {"train_loss": -12.430093765258789, "global_step": 466442, "epoch": 2776} {"train_loss": -12.17951774597168, "global_step": 466443, "epoch": 2776} {"train_loss": -12.355779647827148, "global_step": 466444, "epoch": 2776} {"train_loss": -12.431800842285156, "global_step": 466445, "epoch": 2776} {"train_loss": -12.682100296020508, "global_step": 466446, "epoch": 2776} {"train_loss": -12.27218246459961, "global_step": 466447, "epoch": 2776} {"train_loss": -12.311384201049805, "global_step": 466448, "epoch": 2776} {"train_loss": -12.110804557800293, "global_step": 466449, "epoch": 2776} {"train_loss": -12.023605346679688, "global_step": 466450, "epoch": 2776} {"train_loss": -11.730375289916992, "global_step": 466451, "epoch": 2776} {"train_loss": -12.405193328857422, "global_step": 466452, "epoch": 2776} {"train_loss": -11.802316665649414, "global_step": 466453, "epoch": 2776} {"train_loss": -11.279950141906738, "global_step": 466454, "epoch": 2776} {"train_loss": -11.337613105773926, "global_step": 466455, "epoch": 2776} {"train_loss": -12.231319427490234, "global_step": 466456, "epoch": 2776} {"train_loss": -12.360206604003906, "global_step": 466457, "epoch": 2776} {"train_loss": -12.800947189331055, "global_step": 466458, "epoch": 2776} {"train_loss": -12.694040298461914, "global_step": 466459, "epoch": 2776} {"train_loss": -12.506341934204102, "global_step": 466460, "epoch": 2776} {"train_loss": -12.476831436157227, "global_step": 466461, "epoch": 2776} {"train_loss": -12.255690574645996, "global_step": 466462, "epoch": 2776} {"train_loss": -12.472782135009766, "global_step": 466463, "epoch": 2776} {"train_loss": -12.081276893615723, "global_step": 466464, "epoch": 2776} {"train_loss": -11.852816581726074, "global_step": 466465, "epoch": 2776} {"train_loss": -12.219327926635742, "global_step": 466466, "epoch": 2776} {"train_loss": -12.18567943572998, "global_step": 466467, "epoch": 2776} {"train_loss": -12.079660415649414, "global_step": 466468, "epoch": 2776} {"train_loss": -12.181463241577148, "global_step": 466469, "epoch": 2776} {"train_loss": -11.885324478149414, "global_step": 466470, "epoch": 2776} {"train_loss": -12.184979438781738, "global_step": 466471, "epoch": 2776} {"train_loss": -12.338956832885742, "global_step": 466472, "epoch": 2776} {"train_loss": -11.74402904510498, "global_step": 466473, "epoch": 2776} {"train_loss": -12.149455070495605, "global_step": 466474, "epoch": 2776} {"train_loss": -11.83096981048584, "global_step": 466475, "epoch": 2776} {"train_loss": -12.043560028076172, "global_step": 466476, "epoch": 2776} {"train_loss": -11.39365005493164, "global_step": 466477, "epoch": 2776} {"train_loss": -11.690739631652832, "global_step": 466478, "epoch": 2776} {"train_loss": -10.62086296081543, "global_step": 466479, "epoch": 2776} {"train_loss": -11.727889060974121, "global_step": 466480, "epoch": 2776} {"train_loss": -11.6873779296875, "global_step": 466481, "epoch": 2776} {"train_loss": -12.020181655883789, "global_step": 466482, "epoch": 2776} {"train_loss": -11.602848052978516, "global_step": 466483, "epoch": 2776} {"train_loss": -10.886600494384766, "global_step": 466484, "epoch": 2776} {"train_loss": -12.06721305847168, "global_step": 466485, "epoch": 2776} {"train_loss": -9.602727890014648, "global_step": 466486, "epoch": 2776} {"train_loss": -11.987473487854004, "global_step": 466487, "epoch": 2776} {"train_loss": -10.28642463684082, "global_step": 466488, "epoch": 2776} {"train_loss": -9.981840133666992, "global_step": 466489, "epoch": 2776} {"train_loss": -11.222127914428711, "global_step": 466490, "epoch": 2776} {"train_loss": -9.818758010864258, "global_step": 466491, "epoch": 2776} {"train_loss": -10.901371955871582, "global_step": 466492, "epoch": 2776} {"train_loss": -10.45694351196289, "global_step": 466493, "epoch": 2776} {"train_loss": -11.787357330322266, "global_step": 466494, "epoch": 2776} {"train_loss": -10.89358139038086, "global_step": 466495, "epoch": 2776} {"train_loss": -11.363542556762695, "global_step": 466496, "epoch": 2776} {"train_loss": -11.807571411132812, "global_step": 466497, "epoch": 2776} {"train_loss": -11.588984489440918, "global_step": 466498, "epoch": 2776} {"train_loss": -11.574066162109375, "global_step": 466499, "epoch": 2776} {"train_loss": -10.847681999206543, "global_step": 466500, "epoch": 2776} {"train_loss": -12.283456802368164, "global_step": 466501, "epoch": 2776} {"train_loss": -11.395796775817871, "global_step": 466502, "epoch": 2776} {"train_loss": -12.149596214294434, "global_step": 466503, "epoch": 2776} {"train_loss": -11.24694538116455, "global_step": 466504, "epoch": 2776} {"train_loss": -11.791744232177734, "global_step": 466505, "epoch": 2776} {"train_loss": -10.825645446777344, "global_step": 466506, "epoch": 2776} {"train_loss": -12.227622032165527, "global_step": 466507, "epoch": 2776} {"train_loss": -11.505265235900879, "global_step": 466508, "epoch": 2776} {"train_loss": -12.366052627563477, "global_step": 466509, "epoch": 2776} {"train_loss": -11.638911247253418, "global_step": 466510, "epoch": 2776} {"train_loss": -12.166634559631348, "global_step": 466511, "epoch": 2776} {"train_loss": -11.097393035888672, "global_step": 466512, "epoch": 2776} {"train_loss": -11.527435302734375, "global_step": 466513, "epoch": 2776} {"train_loss": -10.802230834960938, "global_step": 466514, "epoch": 2776} {"train_loss": -11.810202598571777, "global_step": 466515, "epoch": 2776} {"train_loss": -11.138542175292969, "global_step": 466516, "epoch": 2776} {"train_loss": -11.512248992919922, "global_step": 466517, "epoch": 2776} {"train_loss": -11.656591415405273, "global_step": 466518, "epoch": 2776} {"train_loss": -10.982575416564941, "global_step": 466519, "epoch": 2776} {"train_loss": -10.1502685546875, "global_step": 466520, "epoch": 2776} {"train_loss": -11.391371726989746, "global_step": 466521, "epoch": 2776} {"train_loss": -10.916345596313477, "global_step": 466522, "epoch": 2776} {"train_loss": -10.54241943359375, "global_step": 466523, "epoch": 2776} {"train_loss": -10.877252578735352, "global_step": 466524, "epoch": 2776} {"train_loss": -9.728286743164062, "global_step": 466525, "epoch": 2776} {"train_loss": -11.527339935302734, "global_step": 466526, "epoch": 2776} {"train_loss": -10.099486351013184, "global_step": 466527, "epoch": 2776} {"train_loss": -11.332351684570312, "global_step": 466528, "epoch": 2776} {"train_loss": -10.783182144165039, "global_step": 466529, "epoch": 2776} {"train_loss": -11.57110595703125, "global_step": 466530, "epoch": 2776} {"train_loss": -11.262763977050781, "global_step": 466531, "epoch": 2776} {"train_loss": -11.797083854675293, "global_step": 466532, "epoch": 2776} {"train_loss": -11.488178253173828, "global_step": 466533, "epoch": 2776} {"train_loss": -11.319347381591797, "global_step": 466534, "epoch": 2776} {"train_loss": -11.93452677272615, "global_step": 466535, "epoch": 2776, "val_loss": 313362.8125} {"train_loss": -11.433449745178223, "global_step": 466536, "epoch": 2777} {"train_loss": -12.456594467163086, "global_step": 466537, "epoch": 2777} {"train_loss": -11.3634672164917, "global_step": 466538, "epoch": 2777} {"train_loss": -12.167814254760742, "global_step": 466539, "epoch": 2777} {"train_loss": -11.759319305419922, "global_step": 466540, "epoch": 2777} {"train_loss": -11.830535888671875, "global_step": 466541, "epoch": 2777} {"train_loss": -12.155388832092285, "global_step": 466542, "epoch": 2777} {"train_loss": -12.088395118713379, "global_step": 466543, "epoch": 2777} {"train_loss": -11.949417114257812, "global_step": 466544, "epoch": 2777} {"train_loss": -11.708940505981445, "global_step": 466545, "epoch": 2777} {"train_loss": -12.152067184448242, "global_step": 466546, "epoch": 2777} {"train_loss": -12.083475112915039, "global_step": 466547, "epoch": 2777} {"train_loss": -11.970193862915039, "global_step": 466548, "epoch": 2777} {"train_loss": -12.283641815185547, "global_step": 466549, "epoch": 2777} {"train_loss": -11.85311508178711, "global_step": 466550, "epoch": 2777} {"train_loss": -12.21723747253418, "global_step": 466551, "epoch": 2777} {"train_loss": -12.0089693069458, "global_step": 466552, "epoch": 2777} {"train_loss": -12.004571914672852, "global_step": 466553, "epoch": 2777} {"train_loss": -12.167380332946777, "global_step": 466554, "epoch": 2777} {"train_loss": -12.228693008422852, "global_step": 466555, "epoch": 2777} {"train_loss": -12.342385292053223, "global_step": 466556, "epoch": 2777} {"train_loss": -12.21347427368164, "global_step": 466557, "epoch": 2777} {"train_loss": -12.320868492126465, "global_step": 466558, "epoch": 2777} {"train_loss": -12.273551940917969, "global_step": 466559, "epoch": 2777} {"train_loss": -12.236274719238281, "global_step": 466560, "epoch": 2777} {"train_loss": -12.519302368164062, "global_step": 466561, "epoch": 2777} {"train_loss": -12.293317794799805, "global_step": 466562, "epoch": 2777} {"train_loss": -12.432195663452148, "global_step": 466563, "epoch": 2777} {"train_loss": -12.558662414550781, "global_step": 466564, "epoch": 2777} {"train_loss": -12.25623893737793, "global_step": 466565, "epoch": 2777} {"train_loss": -12.65086841583252, "global_step": 466566, "epoch": 2777} {"train_loss": -12.353707313537598, "global_step": 466567, "epoch": 2777} {"train_loss": -12.488601684570312, "global_step": 466568, "epoch": 2777} {"train_loss": -12.648700714111328, "global_step": 466569, "epoch": 2777} {"train_loss": -12.408531188964844, "global_step": 466570, "epoch": 2777} {"train_loss": -12.6212158203125, "global_step": 466571, "epoch": 2777} {"train_loss": -12.606136322021484, "global_step": 466572, "epoch": 2777} {"train_loss": -12.650285720825195, "global_step": 466573, "epoch": 2777} {"train_loss": -12.6444091796875, "global_step": 466574, "epoch": 2777} {"train_loss": -12.565921783447266, "global_step": 466575, "epoch": 2777} {"train_loss": -12.57246208190918, "global_step": 466576, "epoch": 2777} {"train_loss": -12.576186180114746, "global_step": 466577, "epoch": 2777} {"train_loss": -12.619720458984375, "global_step": 466578, "epoch": 2777} {"train_loss": -12.434596061706543, "global_step": 466579, "epoch": 2777} {"train_loss": -12.557140350341797, "global_step": 466580, "epoch": 2777} {"train_loss": -12.303397178649902, "global_step": 466581, "epoch": 2777} {"train_loss": -12.444225311279297, "global_step": 466582, "epoch": 2777} {"train_loss": -12.477399826049805, "global_step": 466583, "epoch": 2777} {"train_loss": -12.460836410522461, "global_step": 466584, "epoch": 2777} {"train_loss": -12.561470031738281, "global_step": 466585, "epoch": 2777} {"train_loss": -12.621856689453125, "global_step": 466586, "epoch": 2777} {"train_loss": -12.53628921508789, "global_step": 466587, "epoch": 2777} {"train_loss": -12.156722068786621, "global_step": 466588, "epoch": 2777} {"train_loss": -12.738698959350586, "global_step": 466589, "epoch": 2777} {"train_loss": -12.08102035522461, "global_step": 466590, "epoch": 2777} {"train_loss": -12.68353271484375, "global_step": 466591, "epoch": 2777} {"train_loss": -12.42274284362793, "global_step": 466592, "epoch": 2777} {"train_loss": -12.614480972290039, "global_step": 466593, "epoch": 2777} {"train_loss": -12.067153930664062, "global_step": 466594, "epoch": 2777} {"train_loss": -12.412700653076172, "global_step": 466595, "epoch": 2777} {"train_loss": -12.66854190826416, "global_step": 466596, "epoch": 2777} {"train_loss": -11.782448768615723, "global_step": 466597, "epoch": 2777} {"train_loss": -12.240818977355957, "global_step": 466598, "epoch": 2777} {"train_loss": -12.423831939697266, "global_step": 466599, "epoch": 2777} {"train_loss": -11.991476058959961, "global_step": 466600, "epoch": 2777} {"train_loss": -12.661409378051758, "global_step": 466601, "epoch": 2777} {"train_loss": -12.333600997924805, "global_step": 466602, "epoch": 2777} {"train_loss": -12.333076477050781, "global_step": 466603, "epoch": 2777} {"train_loss": -12.69593620300293, "global_step": 466604, "epoch": 2777} {"train_loss": -12.551790237426758, "global_step": 466605, "epoch": 2777} {"train_loss": -12.590778350830078, "global_step": 466606, "epoch": 2777} {"train_loss": -12.686531066894531, "global_step": 466607, "epoch": 2777} {"train_loss": -12.534687995910645, "global_step": 466608, "epoch": 2777} {"train_loss": -12.612203598022461, "global_step": 466609, "epoch": 2777} {"train_loss": -12.720550537109375, "global_step": 466610, "epoch": 2777} {"train_loss": -12.622794151306152, "global_step": 466611, "epoch": 2777} {"train_loss": -12.598794937133789, "global_step": 466612, "epoch": 2777} {"train_loss": -12.734094619750977, "global_step": 466613, "epoch": 2777} {"train_loss": -12.606727600097656, "global_step": 466614, "epoch": 2777} {"train_loss": -12.793384552001953, "global_step": 466615, "epoch": 2777} {"train_loss": -12.586021423339844, "global_step": 466616, "epoch": 2777} {"train_loss": -12.828439712524414, "global_step": 466617, "epoch": 2777} {"train_loss": -12.673794746398926, "global_step": 466618, "epoch": 2777} {"train_loss": -12.942827224731445, "global_step": 466619, "epoch": 2777} {"train_loss": -12.809774398803711, "global_step": 466620, "epoch": 2777} {"train_loss": -12.878519058227539, "global_step": 466621, "epoch": 2777} {"train_loss": -12.818029403686523, "global_step": 466622, "epoch": 2777} {"train_loss": -12.935718536376953, "global_step": 466623, "epoch": 2777} {"train_loss": -12.678718566894531, "global_step": 466624, "epoch": 2777} {"train_loss": -12.597726821899414, "global_step": 466625, "epoch": 2777} {"train_loss": -12.840323448181152, "global_step": 466626, "epoch": 2777} {"train_loss": -12.645498275756836, "global_step": 466627, "epoch": 2777} {"train_loss": -12.781160354614258, "global_step": 466628, "epoch": 2777} {"train_loss": -13.023306846618652, "global_step": 466629, "epoch": 2777} {"train_loss": -12.851593017578125, "global_step": 466630, "epoch": 2777} {"train_loss": -12.814046859741211, "global_step": 466631, "epoch": 2777} {"train_loss": -12.809385299682617, "global_step": 466632, "epoch": 2777} {"train_loss": -12.505224227905273, "global_step": 466633, "epoch": 2777} {"train_loss": -12.685053825378418, "global_step": 466634, "epoch": 2777} {"train_loss": -12.938830375671387, "global_step": 466635, "epoch": 2777} {"train_loss": -12.8533353805542, "global_step": 466636, "epoch": 2777} {"train_loss": -12.92935848236084, "global_step": 466637, "epoch": 2777} {"train_loss": -12.804340362548828, "global_step": 466638, "epoch": 2777} {"train_loss": -12.76880931854248, "global_step": 466639, "epoch": 2777} {"train_loss": -12.746227264404297, "global_step": 466640, "epoch": 2777} {"train_loss": -12.753124237060547, "global_step": 466641, "epoch": 2777} {"train_loss": -12.977773666381836, "global_step": 466642, "epoch": 2777} {"train_loss": -12.710155487060547, "global_step": 466643, "epoch": 2777} {"train_loss": -13.052253723144531, "global_step": 466644, "epoch": 2777} {"train_loss": -12.452842712402344, "global_step": 466645, "epoch": 2777} {"train_loss": -12.315656661987305, "global_step": 466646, "epoch": 2777} {"train_loss": -11.61759090423584, "global_step": 466647, "epoch": 2777} {"train_loss": -11.527639389038086, "global_step": 466648, "epoch": 2777} {"train_loss": -11.315467834472656, "global_step": 466649, "epoch": 2777} {"train_loss": -11.371984481811523, "global_step": 466650, "epoch": 2777} {"train_loss": -11.388619422912598, "global_step": 466651, "epoch": 2777} {"train_loss": -10.920095443725586, "global_step": 466652, "epoch": 2777} {"train_loss": -11.240127563476562, "global_step": 466653, "epoch": 2777} {"train_loss": -10.613022804260254, "global_step": 466654, "epoch": 2777} {"train_loss": -7.857126235961914, "global_step": 466655, "epoch": 2777} {"train_loss": -11.679977416992188, "global_step": 466656, "epoch": 2777} {"train_loss": -9.886242866516113, "global_step": 466657, "epoch": 2777} {"train_loss": -9.794894218444824, "global_step": 466658, "epoch": 2777} {"train_loss": -11.210182189941406, "global_step": 466659, "epoch": 2777} {"train_loss": -9.184769630432129, "global_step": 466660, "epoch": 2777} {"train_loss": -10.749619483947754, "global_step": 466661, "epoch": 2777} {"train_loss": -10.386219024658203, "global_step": 466662, "epoch": 2777} {"train_loss": -10.04339599609375, "global_step": 466663, "epoch": 2777} {"train_loss": -9.678735733032227, "global_step": 466664, "epoch": 2777} {"train_loss": -11.113250732421875, "global_step": 466665, "epoch": 2777} {"train_loss": -10.382054328918457, "global_step": 466666, "epoch": 2777} {"train_loss": -11.05311107635498, "global_step": 466667, "epoch": 2777} {"train_loss": -11.447802543640137, "global_step": 466668, "epoch": 2777} {"train_loss": -11.371259689331055, "global_step": 466669, "epoch": 2777} {"train_loss": -11.024413108825684, "global_step": 466670, "epoch": 2777} {"train_loss": -11.39885139465332, "global_step": 466671, "epoch": 2777} {"train_loss": -11.765098571777344, "global_step": 466672, "epoch": 2777} {"train_loss": -11.121813774108887, "global_step": 466673, "epoch": 2777} {"train_loss": -11.251413345336914, "global_step": 466674, "epoch": 2777} {"train_loss": -11.55935001373291, "global_step": 466675, "epoch": 2777} {"train_loss": -11.710756301879883, "global_step": 466676, "epoch": 2777} {"train_loss": -11.652519226074219, "global_step": 466677, "epoch": 2777} {"train_loss": -10.98519515991211, "global_step": 466678, "epoch": 2777} {"train_loss": -11.466634750366211, "global_step": 466679, "epoch": 2777} {"train_loss": -11.273465156555176, "global_step": 466680, "epoch": 2777} {"train_loss": -11.749778747558594, "global_step": 466681, "epoch": 2777} {"train_loss": -11.911478042602539, "global_step": 466682, "epoch": 2777} {"train_loss": -11.187702178955078, "global_step": 466683, "epoch": 2777} {"train_loss": -11.723367691040039, "global_step": 466684, "epoch": 2777} {"train_loss": -11.346179962158203, "global_step": 466685, "epoch": 2777} {"train_loss": -11.716846466064453, "global_step": 466686, "epoch": 2777} {"train_loss": -11.729059219360352, "global_step": 466687, "epoch": 2777} {"train_loss": -11.233431816101074, "global_step": 466688, "epoch": 2777} {"train_loss": -11.832565307617188, "global_step": 466689, "epoch": 2777} {"train_loss": -11.269485473632812, "global_step": 466690, "epoch": 2777} {"train_loss": -11.77839469909668, "global_step": 466691, "epoch": 2777} {"train_loss": -12.215399742126465, "global_step": 466692, "epoch": 2777} {"train_loss": -11.963104248046875, "global_step": 466693, "epoch": 2777} {"train_loss": -12.359085083007812, "global_step": 466694, "epoch": 2777} {"train_loss": -12.311423301696777, "global_step": 466695, "epoch": 2777} {"train_loss": -12.105110168457031, "global_step": 466696, "epoch": 2777} {"train_loss": -12.32767391204834, "global_step": 466697, "epoch": 2777} {"train_loss": -12.158740997314453, "global_step": 466698, "epoch": 2777} {"train_loss": -12.372295379638672, "global_step": 466699, "epoch": 2777} {"train_loss": -12.517245292663574, "global_step": 466700, "epoch": 2777} {"train_loss": -12.088875770568848, "global_step": 466701, "epoch": 2777} {"train_loss": -12.07502555847168, "global_step": 466702, "epoch": 2777} {"train_loss": -12.078730912435622, "global_step": 466703, "epoch": 2777, "val_loss": 315331.78125} {"train_loss": -12.249663352966309, "global_step": 466704, "epoch": 2778} {"train_loss": -12.466083526611328, "global_step": 466705, "epoch": 2778} {"train_loss": -11.968223571777344, "global_step": 466706, "epoch": 2778} {"train_loss": -11.803668022155762, "global_step": 466707, "epoch": 2778} {"train_loss": -12.161376953125, "global_step": 466708, "epoch": 2778} {"train_loss": -11.902767181396484, "global_step": 466709, "epoch": 2778} {"train_loss": -12.028276443481445, "global_step": 466710, "epoch": 2778} {"train_loss": -11.776741027832031, "global_step": 466711, "epoch": 2778} {"train_loss": -12.174027442932129, "global_step": 466712, "epoch": 2778} {"train_loss": -11.978975296020508, "global_step": 466713, "epoch": 2778} {"train_loss": -12.0316743850708, "global_step": 466714, "epoch": 2778} {"train_loss": -12.028358459472656, "global_step": 466715, "epoch": 2778} {"train_loss": -12.308194160461426, "global_step": 466716, "epoch": 2778} {"train_loss": -11.798988342285156, "global_step": 466717, "epoch": 2778} {"train_loss": -12.289451599121094, "global_step": 466718, "epoch": 2778} {"train_loss": -12.111495971679688, "global_step": 466719, "epoch": 2778} {"train_loss": -12.239143371582031, "global_step": 466720, "epoch": 2778} {"train_loss": -12.076784133911133, "global_step": 466721, "epoch": 2778} {"train_loss": -11.850532531738281, "global_step": 466722, "epoch": 2778} {"train_loss": -12.471120834350586, "global_step": 466723, "epoch": 2778} {"train_loss": -12.217498779296875, "global_step": 466724, "epoch": 2778} {"train_loss": -12.406457901000977, "global_step": 466725, "epoch": 2778} {"train_loss": -11.943412780761719, "global_step": 466726, "epoch": 2778} {"train_loss": -12.315849304199219, "global_step": 466727, "epoch": 2778} {"train_loss": -12.093438148498535, "global_step": 466728, "epoch": 2778} {"train_loss": -12.251401901245117, "global_step": 466729, "epoch": 2778} {"train_loss": -12.375717163085938, "global_step": 466730, "epoch": 2778} {"train_loss": -12.337686538696289, "global_step": 466731, "epoch": 2778} {"train_loss": -11.826193809509277, "global_step": 466732, "epoch": 2778} {"train_loss": -12.422550201416016, "global_step": 466733, "epoch": 2778} {"train_loss": -12.273880958557129, "global_step": 466734, "epoch": 2778} {"train_loss": -12.378412246704102, "global_step": 466735, "epoch": 2778} {"train_loss": -12.426275253295898, "global_step": 466736, "epoch": 2778} {"train_loss": -12.473851203918457, "global_step": 466737, "epoch": 2778} {"train_loss": -12.3134183883667, "global_step": 466738, "epoch": 2778} {"train_loss": -12.171408653259277, "global_step": 466739, "epoch": 2778} {"train_loss": -12.409561157226562, "global_step": 466740, "epoch": 2778} {"train_loss": -11.85545539855957, "global_step": 466741, "epoch": 2778} {"train_loss": -12.65471363067627, "global_step": 466742, "epoch": 2778} {"train_loss": -12.340890884399414, "global_step": 466743, "epoch": 2778} {"train_loss": -12.54279899597168, "global_step": 466744, "epoch": 2778} {"train_loss": -12.336935997009277, "global_step": 466745, "epoch": 2778} {"train_loss": -12.428750991821289, "global_step": 466746, "epoch": 2778} {"train_loss": -12.607824325561523, "global_step": 466747, "epoch": 2778} {"train_loss": -12.737634658813477, "global_step": 466748, "epoch": 2778} {"train_loss": -12.63340950012207, "global_step": 466749, "epoch": 2778} {"train_loss": -12.71019172668457, "global_step": 466750, "epoch": 2778} {"train_loss": -12.600781440734863, "global_step": 466751, "epoch": 2778} {"train_loss": -12.65738296508789, "global_step": 466752, "epoch": 2778} {"train_loss": -12.709915161132812, "global_step": 466753, "epoch": 2778} {"train_loss": -12.640478134155273, "global_step": 466754, "epoch": 2778} {"train_loss": -12.717425346374512, "global_step": 466755, "epoch": 2778} {"train_loss": -12.579963684082031, "global_step": 466756, "epoch": 2778} {"train_loss": -12.646123886108398, "global_step": 466757, "epoch": 2778} {"train_loss": -12.98130989074707, "global_step": 466758, "epoch": 2778} {"train_loss": -12.95560359954834, "global_step": 466759, "epoch": 2778} {"train_loss": -12.73831558227539, "global_step": 466760, "epoch": 2778} {"train_loss": -12.639509201049805, "global_step": 466761, "epoch": 2778} {"train_loss": -12.631425857543945, "global_step": 466762, "epoch": 2778} {"train_loss": -12.571897506713867, "global_step": 466763, "epoch": 2778} {"train_loss": -12.694448471069336, "global_step": 466764, "epoch": 2778} {"train_loss": -12.993053436279297, "global_step": 466765, "epoch": 2778} {"train_loss": -12.752394676208496, "global_step": 466766, "epoch": 2778} {"train_loss": -12.593896865844727, "global_step": 466767, "epoch": 2778} {"train_loss": -12.797965049743652, "global_step": 466768, "epoch": 2778} {"train_loss": -12.733407974243164, "global_step": 466769, "epoch": 2778} {"train_loss": -12.80747127532959, "global_step": 466770, "epoch": 2778} {"train_loss": -12.815786361694336, "global_step": 466771, "epoch": 2778} {"train_loss": -12.979598999023438, "global_step": 466772, "epoch": 2778} {"train_loss": -12.595853805541992, "global_step": 466773, "epoch": 2778} {"train_loss": -12.8565092086792, "global_step": 466774, "epoch": 2778} {"train_loss": -12.859907150268555, "global_step": 466775, "epoch": 2778} {"train_loss": -12.463798522949219, "global_step": 466776, "epoch": 2778} {"train_loss": -12.673114776611328, "global_step": 466777, "epoch": 2778} {"train_loss": -12.693178176879883, "global_step": 466778, "epoch": 2778} {"train_loss": -12.342025756835938, "global_step": 466779, "epoch": 2778} {"train_loss": -12.642997741699219, "global_step": 466780, "epoch": 2778} {"train_loss": -12.907625198364258, "global_step": 466781, "epoch": 2778} {"train_loss": -12.023672103881836, "global_step": 466782, "epoch": 2778} {"train_loss": -11.718822479248047, "global_step": 466783, "epoch": 2778} {"train_loss": -12.84649658203125, "global_step": 466784, "epoch": 2778} {"train_loss": -11.8046293258667, "global_step": 466785, "epoch": 2778} {"train_loss": -12.529558181762695, "global_step": 466786, "epoch": 2778} {"train_loss": -12.265182495117188, "global_step": 466787, "epoch": 2778} {"train_loss": -11.759140014648438, "global_step": 466788, "epoch": 2778} {"train_loss": -12.331524848937988, "global_step": 466789, "epoch": 2778} {"train_loss": -11.52203369140625, "global_step": 466790, "epoch": 2778} {"train_loss": -11.545635223388672, "global_step": 466791, "epoch": 2778} {"train_loss": -11.94699478149414, "global_step": 466792, "epoch": 2778} {"train_loss": -10.337041854858398, "global_step": 466793, "epoch": 2778} {"train_loss": -12.964792251586914, "global_step": 466794, "epoch": 2778} {"train_loss": -10.620655059814453, "global_step": 466795, "epoch": 2778} {"train_loss": -11.44076919555664, "global_step": 466796, "epoch": 2778} {"train_loss": -12.171545028686523, "global_step": 466797, "epoch": 2778} {"train_loss": -10.7880859375, "global_step": 466798, "epoch": 2778} {"train_loss": -12.661844253540039, "global_step": 466799, "epoch": 2778} {"train_loss": -11.500860214233398, "global_step": 466800, "epoch": 2778} {"train_loss": -10.819365501403809, "global_step": 466801, "epoch": 2778} {"train_loss": -12.305691719055176, "global_step": 466802, "epoch": 2778} {"train_loss": -11.426718711853027, "global_step": 466803, "epoch": 2778} {"train_loss": -11.57137393951416, "global_step": 466804, "epoch": 2778} {"train_loss": -12.379809379577637, "global_step": 466805, "epoch": 2778} {"train_loss": -11.480785369873047, "global_step": 466806, "epoch": 2778} {"train_loss": -11.465131759643555, "global_step": 466807, "epoch": 2778} {"train_loss": -12.42092514038086, "global_step": 466808, "epoch": 2778} {"train_loss": -11.933493614196777, "global_step": 466809, "epoch": 2778} {"train_loss": -11.957921981811523, "global_step": 466810, "epoch": 2778} {"train_loss": -12.333285331726074, "global_step": 466811, "epoch": 2778} {"train_loss": -11.743131637573242, "global_step": 466812, "epoch": 2778} {"train_loss": -12.275718688964844, "global_step": 466813, "epoch": 2778} {"train_loss": -11.931373596191406, "global_step": 466814, "epoch": 2778} {"train_loss": -12.03335189819336, "global_step": 466815, "epoch": 2778} {"train_loss": -12.096270561218262, "global_step": 466816, "epoch": 2778} {"train_loss": -11.967157363891602, "global_step": 466817, "epoch": 2778} {"train_loss": -12.478166580200195, "global_step": 466818, "epoch": 2778} {"train_loss": -11.920692443847656, "global_step": 466819, "epoch": 2778} {"train_loss": -12.22283935546875, "global_step": 466820, "epoch": 2778} {"train_loss": -11.804744720458984, "global_step": 466821, "epoch": 2778} {"train_loss": -12.450014114379883, "global_step": 466822, "epoch": 2778} {"train_loss": -12.39018440246582, "global_step": 466823, "epoch": 2778} {"train_loss": -12.351123809814453, "global_step": 466824, "epoch": 2778} {"train_loss": -11.936034202575684, "global_step": 466825, "epoch": 2778} {"train_loss": -12.431103706359863, "global_step": 466826, "epoch": 2778} {"train_loss": -12.507894515991211, "global_step": 466827, "epoch": 2778} {"train_loss": -12.58560562133789, "global_step": 466828, "epoch": 2778} {"train_loss": -12.391502380371094, "global_step": 466829, "epoch": 2778} {"train_loss": -12.44464111328125, "global_step": 466830, "epoch": 2778} {"train_loss": -12.189472198486328, "global_step": 466831, "epoch": 2778} {"train_loss": -12.432507514953613, "global_step": 466832, "epoch": 2778} {"train_loss": -12.611795425415039, "global_step": 466833, "epoch": 2778} {"train_loss": -12.618916511535645, "global_step": 466834, "epoch": 2778} {"train_loss": -12.476290702819824, "global_step": 466835, "epoch": 2778} {"train_loss": -12.43989086151123, "global_step": 466836, "epoch": 2778} {"train_loss": -12.753866195678711, "global_step": 466837, "epoch": 2778} {"train_loss": -12.695712089538574, "global_step": 466838, "epoch": 2778} {"train_loss": -12.44610595703125, "global_step": 466839, "epoch": 2778} {"train_loss": -12.653759002685547, "global_step": 466840, "epoch": 2778} {"train_loss": -12.67734146118164, "global_step": 466841, "epoch": 2778} {"train_loss": -12.435689926147461, "global_step": 466842, "epoch": 2778} {"train_loss": -12.422796249389648, "global_step": 466843, "epoch": 2778} {"train_loss": -12.250846862792969, "global_step": 466844, "epoch": 2778} {"train_loss": -10.865557670593262, "global_step": 466845, "epoch": 2778} {"train_loss": -11.89461612701416, "global_step": 466846, "epoch": 2778} {"train_loss": -11.109909057617188, "global_step": 466847, "epoch": 2778} {"train_loss": -10.999293327331543, "global_step": 466848, "epoch": 2778} {"train_loss": -11.564743995666504, "global_step": 466849, "epoch": 2778} {"train_loss": -9.41562271118164, "global_step": 466850, "epoch": 2778} {"train_loss": -10.69406795501709, "global_step": 466851, "epoch": 2778} {"train_loss": -11.068603515625, "global_step": 466852, "epoch": 2778} {"train_loss": -9.81495189666748, "global_step": 466853, "epoch": 2778} {"train_loss": -10.554682731628418, "global_step": 466854, "epoch": 2778} {"train_loss": -11.463911056518555, "global_step": 466855, "epoch": 2778} {"train_loss": -10.913871765136719, "global_step": 466856, "epoch": 2778} {"train_loss": -9.517871856689453, "global_step": 466857, "epoch": 2778} {"train_loss": -10.323874473571777, "global_step": 466858, "epoch": 2778} {"train_loss": -10.242803573608398, "global_step": 466859, "epoch": 2778} {"train_loss": -10.427363395690918, "global_step": 466860, "epoch": 2778} {"train_loss": -10.302014350891113, "global_step": 466861, "epoch": 2778} {"train_loss": -10.961941719055176, "global_step": 466862, "epoch": 2778} {"train_loss": -11.265485763549805, "global_step": 466863, "epoch": 2778} {"train_loss": -11.642345428466797, "global_step": 466864, "epoch": 2778} {"train_loss": -10.603745460510254, "global_step": 466865, "epoch": 2778} {"train_loss": -12.202815055847168, "global_step": 466866, "epoch": 2778} {"train_loss": -10.985797882080078, "global_step": 466867, "epoch": 2778} {"train_loss": -11.83365249633789, "global_step": 466868, "epoch": 2778} {"train_loss": -11.09717082977295, "global_step": 466869, "epoch": 2778} {"train_loss": -11.221927642822266, "global_step": 466870, "epoch": 2778} {"train_loss": -12.059661342984153, "global_step": 466871, "epoch": 2778, "val_loss": 308383.25} {"train_loss": -11.926331520080566, "global_step": 466872, "epoch": 2779} {"train_loss": -11.91602897644043, "global_step": 466873, "epoch": 2779} {"train_loss": -11.589545249938965, "global_step": 466874, "epoch": 2779} {"train_loss": -11.869404792785645, "global_step": 466875, "epoch": 2779} {"train_loss": -10.864118576049805, "global_step": 466876, "epoch": 2779} {"train_loss": -12.036681175231934, "global_step": 466877, "epoch": 2779} {"train_loss": -11.530181884765625, "global_step": 466878, "epoch": 2779} {"train_loss": -10.815997123718262, "global_step": 466879, "epoch": 2779} {"train_loss": -12.275294303894043, "global_step": 466880, "epoch": 2779} {"train_loss": -11.380902290344238, "global_step": 466881, "epoch": 2779} {"train_loss": -12.262153625488281, "global_step": 466882, "epoch": 2779} {"train_loss": -10.734189987182617, "global_step": 466883, "epoch": 2779} {"train_loss": -11.711108207702637, "global_step": 466884, "epoch": 2779} {"train_loss": -11.48307991027832, "global_step": 466885, "epoch": 2779} {"train_loss": -12.17245101928711, "global_step": 466886, "epoch": 2779} {"train_loss": -11.985442161560059, "global_step": 466887, "epoch": 2779} {"train_loss": -11.44968032836914, "global_step": 466888, "epoch": 2779} {"train_loss": -11.657081604003906, "global_step": 466889, "epoch": 2779} {"train_loss": -11.535564422607422, "global_step": 466890, "epoch": 2779} {"train_loss": -12.225576400756836, "global_step": 466891, "epoch": 2779} {"train_loss": -12.006248474121094, "global_step": 466892, "epoch": 2779} {"train_loss": -11.973610877990723, "global_step": 466893, "epoch": 2779} {"train_loss": -12.246192932128906, "global_step": 466894, "epoch": 2779} {"train_loss": -12.208419799804688, "global_step": 466895, "epoch": 2779} {"train_loss": -12.324394226074219, "global_step": 466896, "epoch": 2779} {"train_loss": -12.440764427185059, "global_step": 466897, "epoch": 2779} {"train_loss": -12.25327205657959, "global_step": 466898, "epoch": 2779} {"train_loss": -12.36433219909668, "global_step": 466899, "epoch": 2779} {"train_loss": -12.354974746704102, "global_step": 466900, "epoch": 2779} {"train_loss": -12.459068298339844, "global_step": 466901, "epoch": 2779} {"train_loss": -12.537984848022461, "global_step": 466902, "epoch": 2779} {"train_loss": -12.47317123413086, "global_step": 466903, "epoch": 2779} {"train_loss": -12.765276908874512, "global_step": 466904, "epoch": 2779} {"train_loss": -12.551861763000488, "global_step": 466905, "epoch": 2779} {"train_loss": -12.47225284576416, "global_step": 466906, "epoch": 2779} {"train_loss": -12.617332458496094, "global_step": 466907, "epoch": 2779} {"train_loss": -12.538596153259277, "global_step": 466908, "epoch": 2779} {"train_loss": -12.487326622009277, "global_step": 466909, "epoch": 2779} {"train_loss": -12.418455123901367, "global_step": 466910, "epoch": 2779} {"train_loss": -12.173341751098633, "global_step": 466911, "epoch": 2779} {"train_loss": -12.210926055908203, "global_step": 466912, "epoch": 2779} {"train_loss": -12.447999000549316, "global_step": 466913, "epoch": 2779} {"train_loss": -12.613120079040527, "global_step": 466914, "epoch": 2779} {"train_loss": -12.429205894470215, "global_step": 466915, "epoch": 2779} {"train_loss": -12.296812057495117, "global_step": 466916, "epoch": 2779} {"train_loss": -12.430089950561523, "global_step": 466917, "epoch": 2779} {"train_loss": -12.684267044067383, "global_step": 466918, "epoch": 2779} {"train_loss": -12.423345565795898, "global_step": 466919, "epoch": 2779} {"train_loss": -12.676873207092285, "global_step": 466920, "epoch": 2779} {"train_loss": -12.648176193237305, "global_step": 466921, "epoch": 2779} {"train_loss": -12.383224487304688, "global_step": 466922, "epoch": 2779} {"train_loss": -12.806938171386719, "global_step": 466923, "epoch": 2779} {"train_loss": -12.430206298828125, "global_step": 466924, "epoch": 2779} {"train_loss": -12.569818496704102, "global_step": 466925, "epoch": 2779} {"train_loss": -12.597635269165039, "global_step": 466926, "epoch": 2779} {"train_loss": -12.697212219238281, "global_step": 466927, "epoch": 2779} {"train_loss": -12.712562561035156, "global_step": 466928, "epoch": 2779} {"train_loss": -12.57846450805664, "global_step": 466929, "epoch": 2779} {"train_loss": -12.64578914642334, "global_step": 466930, "epoch": 2779} {"train_loss": -12.533452033996582, "global_step": 466931, "epoch": 2779} {"train_loss": -12.792279243469238, "global_step": 466932, "epoch": 2779} {"train_loss": -12.507833480834961, "global_step": 466933, "epoch": 2779} {"train_loss": -12.673495292663574, "global_step": 466934, "epoch": 2779} {"train_loss": -12.73728084564209, "global_step": 466935, "epoch": 2779} {"train_loss": -12.690444946289062, "global_step": 466936, "epoch": 2779} {"train_loss": -12.76278018951416, "global_step": 466937, "epoch": 2779} {"train_loss": -12.733345031738281, "global_step": 466938, "epoch": 2779} {"train_loss": -12.629420280456543, "global_step": 466939, "epoch": 2779} {"train_loss": -12.875627517700195, "global_step": 466940, "epoch": 2779} {"train_loss": -12.755229949951172, "global_step": 466941, "epoch": 2779} {"train_loss": -12.534788131713867, "global_step": 466942, "epoch": 2779} {"train_loss": -12.67886734008789, "global_step": 466943, "epoch": 2779} {"train_loss": -12.681673049926758, "global_step": 466944, "epoch": 2779} {"train_loss": -12.61596393585205, "global_step": 466945, "epoch": 2779} {"train_loss": -12.370363235473633, "global_step": 466946, "epoch": 2779} {"train_loss": -12.527849197387695, "global_step": 466947, "epoch": 2779} {"train_loss": -12.56229019165039, "global_step": 466948, "epoch": 2779} {"train_loss": -12.405999183654785, "global_step": 466949, "epoch": 2779} {"train_loss": -12.717245101928711, "global_step": 466950, "epoch": 2779} {"train_loss": -12.537952423095703, "global_step": 466951, "epoch": 2779} {"train_loss": -12.857769966125488, "global_step": 466952, "epoch": 2779} {"train_loss": -12.545822143554688, "global_step": 466953, "epoch": 2779} {"train_loss": -12.761697769165039, "global_step": 466954, "epoch": 2779} {"train_loss": -12.703702926635742, "global_step": 466955, "epoch": 2779} {"train_loss": -12.613017082214355, "global_step": 466956, "epoch": 2779} {"train_loss": -12.985118865966797, "global_step": 466957, "epoch": 2779} {"train_loss": -12.805885314941406, "global_step": 466958, "epoch": 2779} {"train_loss": -12.527978897094727, "global_step": 466959, "epoch": 2779} {"train_loss": -12.538268089294434, "global_step": 466960, "epoch": 2779} {"train_loss": -12.55487060546875, "global_step": 466961, "epoch": 2779} {"train_loss": -12.48056411743164, "global_step": 466962, "epoch": 2779} {"train_loss": -12.895645141601562, "global_step": 466963, "epoch": 2779} {"train_loss": -12.69904899597168, "global_step": 466964, "epoch": 2779} {"train_loss": -12.868352890014648, "global_step": 466965, "epoch": 2779} {"train_loss": -12.695571899414062, "global_step": 466966, "epoch": 2779} {"train_loss": -12.620479583740234, "global_step": 466967, "epoch": 2779} {"train_loss": -12.576308250427246, "global_step": 466968, "epoch": 2779} {"train_loss": -13.144990921020508, "global_step": 466969, "epoch": 2779} {"train_loss": -12.600811958312988, "global_step": 466970, "epoch": 2779} {"train_loss": -12.988995552062988, "global_step": 466971, "epoch": 2779} {"train_loss": -12.684082984924316, "global_step": 466972, "epoch": 2779} {"train_loss": -12.836978912353516, "global_step": 466973, "epoch": 2779} {"train_loss": -12.685896873474121, "global_step": 466974, "epoch": 2779} {"train_loss": -12.388711929321289, "global_step": 466975, "epoch": 2779} {"train_loss": -12.622262954711914, "global_step": 466976, "epoch": 2779} {"train_loss": -12.901302337646484, "global_step": 466977, "epoch": 2779} {"train_loss": -12.573814392089844, "global_step": 466978, "epoch": 2779} {"train_loss": -12.461040496826172, "global_step": 466979, "epoch": 2779} {"train_loss": -12.916982650756836, "global_step": 466980, "epoch": 2779} {"train_loss": -12.658434867858887, "global_step": 466981, "epoch": 2779} {"train_loss": -12.749103546142578, "global_step": 466982, "epoch": 2779} {"train_loss": -12.92776107788086, "global_step": 466983, "epoch": 2779} {"train_loss": -12.650754928588867, "global_step": 466984, "epoch": 2779} {"train_loss": -12.459977149963379, "global_step": 466985, "epoch": 2779} {"train_loss": -12.673335075378418, "global_step": 466986, "epoch": 2779} {"train_loss": -13.057657241821289, "global_step": 466987, "epoch": 2779} {"train_loss": -12.494717597961426, "global_step": 466988, "epoch": 2779} {"train_loss": -12.646717071533203, "global_step": 466989, "epoch": 2779} {"train_loss": -12.909411430358887, "global_step": 466990, "epoch": 2779} {"train_loss": -12.694584846496582, "global_step": 466991, "epoch": 2779} {"train_loss": -12.41033935546875, "global_step": 466992, "epoch": 2779} {"train_loss": -12.717708587646484, "global_step": 466993, "epoch": 2779} {"train_loss": -12.560761451721191, "global_step": 466994, "epoch": 2779} {"train_loss": -12.482967376708984, "global_step": 466995, "epoch": 2779} {"train_loss": -12.952666282653809, "global_step": 466996, "epoch": 2779} {"train_loss": -12.771381378173828, "global_step": 466997, "epoch": 2779} {"train_loss": -12.310237884521484, "global_step": 466998, "epoch": 2779} {"train_loss": -12.922369003295898, "global_step": 466999, "epoch": 2779} {"train_loss": -12.367971420288086, "global_step": 467000, "epoch": 2779} {"train_loss": -11.761829376220703, "global_step": 467001, "epoch": 2779} {"train_loss": -12.187769889831543, "global_step": 467002, "epoch": 2779} {"train_loss": -12.752176284790039, "global_step": 467003, "epoch": 2779} {"train_loss": -11.711389541625977, "global_step": 467004, "epoch": 2779} {"train_loss": -12.111775398254395, "global_step": 467005, "epoch": 2779} {"train_loss": -11.2459077835083, "global_step": 467006, "epoch": 2779} {"train_loss": -9.018250465393066, "global_step": 467007, "epoch": 2779} {"train_loss": -12.43746566772461, "global_step": 467008, "epoch": 2779} {"train_loss": -9.549781799316406, "global_step": 467009, "epoch": 2779} {"train_loss": -12.043437004089355, "global_step": 467010, "epoch": 2779} {"train_loss": -9.416084289550781, "global_step": 467011, "epoch": 2779} {"train_loss": -11.448884963989258, "global_step": 467012, "epoch": 2779} {"train_loss": -9.974555969238281, "global_step": 467013, "epoch": 2779} {"train_loss": -9.738999366760254, "global_step": 467014, "epoch": 2779} {"train_loss": -8.085530281066895, "global_step": 467015, "epoch": 2779} {"train_loss": -11.211586952209473, "global_step": 467016, "epoch": 2779} {"train_loss": -6.667571544647217, "global_step": 467017, "epoch": 2779} {"train_loss": -9.383054733276367, "global_step": 467018, "epoch": 2779} {"train_loss": -8.416976928710938, "global_step": 467019, "epoch": 2779} {"train_loss": -9.747379302978516, "global_step": 467020, "epoch": 2779} {"train_loss": -10.220830917358398, "global_step": 467021, "epoch": 2779} {"train_loss": -7.624844074249268, "global_step": 467022, "epoch": 2779} {"train_loss": -7.734692573547363, "global_step": 467023, "epoch": 2779} {"train_loss": -8.349212646484375, "global_step": 467024, "epoch": 2779} {"train_loss": -9.629585266113281, "global_step": 467025, "epoch": 2779} {"train_loss": -10.039251327514648, "global_step": 467026, "epoch": 2779} {"train_loss": -9.618374824523926, "global_step": 467027, "epoch": 2779} {"train_loss": -9.256706237792969, "global_step": 467028, "epoch": 2779} {"train_loss": -11.139392852783203, "global_step": 467029, "epoch": 2779} {"train_loss": -9.77169418334961, "global_step": 467030, "epoch": 2779} {"train_loss": -11.388420104980469, "global_step": 467031, "epoch": 2779} {"train_loss": -10.457511901855469, "global_step": 467032, "epoch": 2779} {"train_loss": -10.384659767150879, "global_step": 467033, "epoch": 2779} {"train_loss": -10.27402114868164, "global_step": 467034, "epoch": 2779} {"train_loss": -11.302960395812988, "global_step": 467035, "epoch": 2779} {"train_loss": -10.37136173248291, "global_step": 467036, "epoch": 2779} {"train_loss": -10.113452911376953, "global_step": 467037, "epoch": 2779} {"train_loss": -11.12123966217041, "global_step": 467038, "epoch": 2779} {"train_loss": -11.929939661707197, "global_step": 467039, "epoch": 2779, "val_loss": 302324.0625} {"train_loss": -10.604959487915039, "global_step": 467040, "epoch": 2780} {"train_loss": -10.058756828308105, "global_step": 467041, "epoch": 2780} {"train_loss": -10.813438415527344, "global_step": 467042, "epoch": 2780} {"train_loss": -10.71658706665039, "global_step": 467043, "epoch": 2780} {"train_loss": -11.747982025146484, "global_step": 467044, "epoch": 2780} {"train_loss": -11.441099166870117, "global_step": 467045, "epoch": 2780} {"train_loss": -11.792254447937012, "global_step": 467046, "epoch": 2780} {"train_loss": -11.757108688354492, "global_step": 467047, "epoch": 2780} {"train_loss": -11.923196792602539, "global_step": 467048, "epoch": 2780} {"train_loss": -11.787168502807617, "global_step": 467049, "epoch": 2780} {"train_loss": -11.8405122756958, "global_step": 467050, "epoch": 2780} {"train_loss": -11.952733039855957, "global_step": 467051, "epoch": 2780} {"train_loss": -11.815650939941406, "global_step": 467052, "epoch": 2780} {"train_loss": -12.11893081665039, "global_step": 467053, "epoch": 2780} {"train_loss": -11.872467041015625, "global_step": 467054, "epoch": 2780} {"train_loss": -12.077573776245117, "global_step": 467055, "epoch": 2780} {"train_loss": -12.291122436523438, "global_step": 467056, "epoch": 2780} {"train_loss": -12.069779396057129, "global_step": 467057, "epoch": 2780} {"train_loss": -12.2377347946167, "global_step": 467058, "epoch": 2780} {"train_loss": -11.942255973815918, "global_step": 467059, "epoch": 2780} {"train_loss": -12.341922760009766, "global_step": 467060, "epoch": 2780} {"train_loss": -12.077140808105469, "global_step": 467061, "epoch": 2780} {"train_loss": -12.49955940246582, "global_step": 467062, "epoch": 2780} {"train_loss": -12.370049476623535, "global_step": 467063, "epoch": 2780} {"train_loss": -12.29555606842041, "global_step": 467064, "epoch": 2780} {"train_loss": -12.102821350097656, "global_step": 467065, "epoch": 2780} {"train_loss": -12.421428680419922, "global_step": 467066, "epoch": 2780} {"train_loss": -12.269468307495117, "global_step": 467067, "epoch": 2780} {"train_loss": -12.440025329589844, "global_step": 467068, "epoch": 2780} {"train_loss": -12.353979110717773, "global_step": 467069, "epoch": 2780} {"train_loss": -12.423693656921387, "global_step": 467070, "epoch": 2780} {"train_loss": -12.4396333694458, "global_step": 467071, "epoch": 2780} {"train_loss": -12.287934303283691, "global_step": 467072, "epoch": 2780} {"train_loss": -12.334901809692383, "global_step": 467073, "epoch": 2780} {"train_loss": -12.49879264831543, "global_step": 467074, "epoch": 2780} {"train_loss": -12.258354187011719, "global_step": 467075, "epoch": 2780} {"train_loss": -12.373884201049805, "global_step": 467076, "epoch": 2780} {"train_loss": -12.58428955078125, "global_step": 467077, "epoch": 2780} {"train_loss": -12.235847473144531, "global_step": 467078, "epoch": 2780} {"train_loss": -12.557308197021484, "global_step": 467079, "epoch": 2780} {"train_loss": -12.532173156738281, "global_step": 467080, "epoch": 2780} {"train_loss": -12.663459777832031, "global_step": 467081, "epoch": 2780} {"train_loss": -12.267560005187988, "global_step": 467082, "epoch": 2780} {"train_loss": -12.343290328979492, "global_step": 467083, "epoch": 2780} {"train_loss": -12.283380508422852, "global_step": 467084, "epoch": 2780} {"train_loss": -12.344854354858398, "global_step": 467085, "epoch": 2780} {"train_loss": -12.488334655761719, "global_step": 467086, "epoch": 2780} {"train_loss": -12.422070503234863, "global_step": 467087, "epoch": 2780} {"train_loss": -12.365028381347656, "global_step": 467088, "epoch": 2780} {"train_loss": -12.401336669921875, "global_step": 467089, "epoch": 2780} {"train_loss": -12.354581832885742, "global_step": 467090, "epoch": 2780} {"train_loss": -12.402944564819336, "global_step": 467091, "epoch": 2780} {"train_loss": -12.349343299865723, "global_step": 467092, "epoch": 2780} {"train_loss": -12.4399995803833, "global_step": 467093, "epoch": 2780} {"train_loss": -12.302433013916016, "global_step": 467094, "epoch": 2780} {"train_loss": -12.593111991882324, "global_step": 467095, "epoch": 2780} {"train_loss": -12.386507987976074, "global_step": 467096, "epoch": 2780} {"train_loss": -12.46457290649414, "global_step": 467097, "epoch": 2780} {"train_loss": -12.5425443649292, "global_step": 467098, "epoch": 2780} {"train_loss": -12.534448623657227, "global_step": 467099, "epoch": 2780} {"train_loss": -12.436699867248535, "global_step": 467100, "epoch": 2780} {"train_loss": -12.728187561035156, "global_step": 467101, "epoch": 2780} {"train_loss": -12.384774208068848, "global_step": 467102, "epoch": 2780} {"train_loss": -12.522905349731445, "global_step": 467103, "epoch": 2780} {"train_loss": -12.351264953613281, "global_step": 467104, "epoch": 2780} {"train_loss": -12.419464111328125, "global_step": 467105, "epoch": 2780} {"train_loss": -12.618983268737793, "global_step": 467106, "epoch": 2780} {"train_loss": -12.632543563842773, "global_step": 467107, "epoch": 2780} {"train_loss": -12.44202709197998, "global_step": 467108, "epoch": 2780} {"train_loss": -12.437210083007812, "global_step": 467109, "epoch": 2780} {"train_loss": -12.460811614990234, "global_step": 467110, "epoch": 2780} {"train_loss": -12.401371002197266, "global_step": 467111, "epoch": 2780} {"train_loss": -12.53027629852295, "global_step": 467112, "epoch": 2780} {"train_loss": -12.590506553649902, "global_step": 467113, "epoch": 2780} {"train_loss": -12.232250213623047, "global_step": 467114, "epoch": 2780} {"train_loss": -12.723125457763672, "global_step": 467115, "epoch": 2780} {"train_loss": -12.368249893188477, "global_step": 467116, "epoch": 2780} {"train_loss": -12.71485710144043, "global_step": 467117, "epoch": 2780} {"train_loss": -12.701360702514648, "global_step": 467118, "epoch": 2780} {"train_loss": -12.857139587402344, "global_step": 467119, "epoch": 2780} {"train_loss": -12.430577278137207, "global_step": 467120, "epoch": 2780} {"train_loss": -12.490518569946289, "global_step": 467121, "epoch": 2780} {"train_loss": -12.49940013885498, "global_step": 467122, "epoch": 2780} {"train_loss": -12.446290969848633, "global_step": 467123, "epoch": 2780} {"train_loss": -12.115718841552734, "global_step": 467124, "epoch": 2780} {"train_loss": -12.596989631652832, "global_step": 467125, "epoch": 2780} {"train_loss": -12.515515327453613, "global_step": 467126, "epoch": 2780} {"train_loss": -12.525659561157227, "global_step": 467127, "epoch": 2780} {"train_loss": -12.258280754089355, "global_step": 467128, "epoch": 2780} {"train_loss": -12.280671119689941, "global_step": 467129, "epoch": 2780} {"train_loss": -11.753653526306152, "global_step": 467130, "epoch": 2780} {"train_loss": -12.50594711303711, "global_step": 467131, "epoch": 2780} {"train_loss": -12.543296813964844, "global_step": 467132, "epoch": 2780} {"train_loss": -12.591547966003418, "global_step": 467133, "epoch": 2780} {"train_loss": -12.48538589477539, "global_step": 467134, "epoch": 2780} {"train_loss": -12.527443885803223, "global_step": 467135, "epoch": 2780} {"train_loss": -12.23241138458252, "global_step": 467136, "epoch": 2780} {"train_loss": -12.23358154296875, "global_step": 467137, "epoch": 2780} {"train_loss": -12.183418273925781, "global_step": 467138, "epoch": 2780} {"train_loss": -11.953180313110352, "global_step": 467139, "epoch": 2780} {"train_loss": -12.31591796875, "global_step": 467140, "epoch": 2780} {"train_loss": -11.765386581420898, "global_step": 467141, "epoch": 2780} {"train_loss": -12.471856117248535, "global_step": 467142, "epoch": 2780} {"train_loss": -12.028038024902344, "global_step": 467143, "epoch": 2780} {"train_loss": -9.981830596923828, "global_step": 467144, "epoch": 2780} {"train_loss": -10.179244995117188, "global_step": 467145, "epoch": 2780} {"train_loss": -12.203056335449219, "global_step": 467146, "epoch": 2780} {"train_loss": -10.603324890136719, "global_step": 467147, "epoch": 2780} {"train_loss": -12.184141159057617, "global_step": 467148, "epoch": 2780} {"train_loss": -11.330370903015137, "global_step": 467149, "epoch": 2780} {"train_loss": -11.432703018188477, "global_step": 467150, "epoch": 2780} {"train_loss": -11.951848983764648, "global_step": 467151, "epoch": 2780} {"train_loss": -11.018884658813477, "global_step": 467152, "epoch": 2780} {"train_loss": -9.894433975219727, "global_step": 467153, "epoch": 2780} {"train_loss": -10.21609878540039, "global_step": 467154, "epoch": 2780} {"train_loss": -11.401017189025879, "global_step": 467155, "epoch": 2780} {"train_loss": -9.464529037475586, "global_step": 467156, "epoch": 2780} {"train_loss": -11.14404296875, "global_step": 467157, "epoch": 2780} {"train_loss": -8.93674087524414, "global_step": 467158, "epoch": 2780} {"train_loss": -9.714764595031738, "global_step": 467159, "epoch": 2780} {"train_loss": -11.566823959350586, "global_step": 467160, "epoch": 2780} {"train_loss": -10.054089546203613, "global_step": 467161, "epoch": 2780} {"train_loss": -9.551019668579102, "global_step": 467162, "epoch": 2780} {"train_loss": -11.693548202514648, "global_step": 467163, "epoch": 2780} {"train_loss": -10.112101554870605, "global_step": 467164, "epoch": 2780} {"train_loss": -11.440093994140625, "global_step": 467165, "epoch": 2780} {"train_loss": -10.940496444702148, "global_step": 467166, "epoch": 2780} {"train_loss": -10.450423240661621, "global_step": 467167, "epoch": 2780} {"train_loss": -11.74328899383545, "global_step": 467168, "epoch": 2780} {"train_loss": -10.963343620300293, "global_step": 467169, "epoch": 2780} {"train_loss": -12.113719940185547, "global_step": 467170, "epoch": 2780} {"train_loss": -11.560602188110352, "global_step": 467171, "epoch": 2780} {"train_loss": -11.142681121826172, "global_step": 467172, "epoch": 2780} {"train_loss": -12.106977462768555, "global_step": 467173, "epoch": 2780} {"train_loss": -11.311026573181152, "global_step": 467174, "epoch": 2780} {"train_loss": -11.731229782104492, "global_step": 467175, "epoch": 2780} {"train_loss": -11.620870590209961, "global_step": 467176, "epoch": 2780} {"train_loss": -11.123268127441406, "global_step": 467177, "epoch": 2780} {"train_loss": -11.559489250183105, "global_step": 467178, "epoch": 2780} {"train_loss": -11.507028579711914, "global_step": 467179, "epoch": 2780} {"train_loss": -11.479728698730469, "global_step": 467180, "epoch": 2780} {"train_loss": -12.03549575805664, "global_step": 467181, "epoch": 2780} {"train_loss": -10.767647743225098, "global_step": 467182, "epoch": 2780} {"train_loss": -11.933385848999023, "global_step": 467183, "epoch": 2780} {"train_loss": -11.491552352905273, "global_step": 467184, "epoch": 2780} {"train_loss": -10.652292251586914, "global_step": 467185, "epoch": 2780} {"train_loss": -11.63947868347168, "global_step": 467186, "epoch": 2780} {"train_loss": -10.329745292663574, "global_step": 467187, "epoch": 2780} {"train_loss": -11.356022834777832, "global_step": 467188, "epoch": 2780} {"train_loss": -11.502317428588867, "global_step": 467189, "epoch": 2780} {"train_loss": -11.37039566040039, "global_step": 467190, "epoch": 2780} {"train_loss": -12.27634048461914, "global_step": 467191, "epoch": 2780} {"train_loss": -11.611287117004395, "global_step": 467192, "epoch": 2780} {"train_loss": -12.181394577026367, "global_step": 467193, "epoch": 2780} {"train_loss": -11.581210136413574, "global_step": 467194, "epoch": 2780} {"train_loss": -11.82603645324707, "global_step": 467195, "epoch": 2780} {"train_loss": -11.864635467529297, "global_step": 467196, "epoch": 2780} {"train_loss": -12.091395378112793, "global_step": 467197, "epoch": 2780} {"train_loss": -11.310226440429688, "global_step": 467198, "epoch": 2780} {"train_loss": -12.14797592163086, "global_step": 467199, "epoch": 2780} {"train_loss": -12.134622573852539, "global_step": 467200, "epoch": 2780} {"train_loss": -11.926355361938477, "global_step": 467201, "epoch": 2780} {"train_loss": -11.944964408874512, "global_step": 467202, "epoch": 2780} {"train_loss": -12.059178352355957, "global_step": 467203, "epoch": 2780} {"train_loss": -12.157448768615723, "global_step": 467204, "epoch": 2780} {"train_loss": -12.264554977416992, "global_step": 467205, "epoch": 2780} {"train_loss": -12.353988647460938, "global_step": 467206, "epoch": 2780} {"train_loss": -11.898954374449593, "global_step": 467207, "epoch": 2780, "val_loss": 308444.96875, "train_action_mse_error": 1.526377558708191} {"train_loss": -12.294017791748047, "global_step": 467208, "epoch": 2781} {"train_loss": -12.139436721801758, "global_step": 467209, "epoch": 2781} {"train_loss": -12.170660972595215, "global_step": 467210, "epoch": 2781} {"train_loss": -12.658039093017578, "global_step": 467211, "epoch": 2781} {"train_loss": -12.075662612915039, "global_step": 467212, "epoch": 2781} {"train_loss": -12.246636390686035, "global_step": 467213, "epoch": 2781} {"train_loss": -12.44017219543457, "global_step": 467214, "epoch": 2781} {"train_loss": -11.725797653198242, "global_step": 467215, "epoch": 2781} {"train_loss": -12.383136749267578, "global_step": 467216, "epoch": 2781} {"train_loss": -12.459033966064453, "global_step": 467217, "epoch": 2781} {"train_loss": -11.95656967163086, "global_step": 467218, "epoch": 2781} {"train_loss": -12.514208793640137, "global_step": 467219, "epoch": 2781} {"train_loss": -12.49110221862793, "global_step": 467220, "epoch": 2781} {"train_loss": -12.42312240600586, "global_step": 467221, "epoch": 2781} {"train_loss": -12.300113677978516, "global_step": 467222, "epoch": 2781} {"train_loss": -12.385391235351562, "global_step": 467223, "epoch": 2781} {"train_loss": -12.222734451293945, "global_step": 467224, "epoch": 2781} {"train_loss": -12.544807434082031, "global_step": 467225, "epoch": 2781} {"train_loss": -12.615459442138672, "global_step": 467226, "epoch": 2781} {"train_loss": -12.380159378051758, "global_step": 467227, "epoch": 2781} {"train_loss": -12.65234375, "global_step": 467228, "epoch": 2781} {"train_loss": -12.525226593017578, "global_step": 467229, "epoch": 2781} {"train_loss": -12.308552742004395, "global_step": 467230, "epoch": 2781} {"train_loss": -12.353260040283203, "global_step": 467231, "epoch": 2781} {"train_loss": -12.492452621459961, "global_step": 467232, "epoch": 2781} {"train_loss": -11.920373916625977, "global_step": 467233, "epoch": 2781} {"train_loss": -11.990372657775879, "global_step": 467234, "epoch": 2781} {"train_loss": -12.28249740600586, "global_step": 467235, "epoch": 2781} {"train_loss": -12.670228004455566, "global_step": 467236, "epoch": 2781} {"train_loss": -12.323548316955566, "global_step": 467237, "epoch": 2781} {"train_loss": -12.608288764953613, "global_step": 467238, "epoch": 2781} {"train_loss": -12.143997192382812, "global_step": 467239, "epoch": 2781} {"train_loss": -12.463769912719727, "global_step": 467240, "epoch": 2781} {"train_loss": -12.385744094848633, "global_step": 467241, "epoch": 2781} {"train_loss": -12.541687965393066, "global_step": 467242, "epoch": 2781} {"train_loss": -12.375384330749512, "global_step": 467243, "epoch": 2781} {"train_loss": -12.261859893798828, "global_step": 467244, "epoch": 2781} {"train_loss": -12.626189231872559, "global_step": 467245, "epoch": 2781} {"train_loss": -12.230255126953125, "global_step": 467246, "epoch": 2781} {"train_loss": -12.410140991210938, "global_step": 467247, "epoch": 2781} {"train_loss": -12.465940475463867, "global_step": 467248, "epoch": 2781} {"train_loss": -12.395177841186523, "global_step": 467249, "epoch": 2781} {"train_loss": -12.215330123901367, "global_step": 467250, "epoch": 2781} {"train_loss": -12.655312538146973, "global_step": 467251, "epoch": 2781} {"train_loss": -12.768893241882324, "global_step": 467252, "epoch": 2781} {"train_loss": -12.0676851272583, "global_step": 467253, "epoch": 2781} {"train_loss": -12.657441139221191, "global_step": 467254, "epoch": 2781} {"train_loss": -12.012371063232422, "global_step": 467255, "epoch": 2781} {"train_loss": -12.476455688476562, "global_step": 467256, "epoch": 2781} {"train_loss": -12.426228523254395, "global_step": 467257, "epoch": 2781} {"train_loss": -12.48056411743164, "global_step": 467258, "epoch": 2781} {"train_loss": -12.393960952758789, "global_step": 467259, "epoch": 2781} {"train_loss": -12.259956359863281, "global_step": 467260, "epoch": 2781} {"train_loss": -12.721395492553711, "global_step": 467261, "epoch": 2781} {"train_loss": -12.3058500289917, "global_step": 467262, "epoch": 2781} {"train_loss": -12.698720932006836, "global_step": 467263, "epoch": 2781} {"train_loss": -12.288167953491211, "global_step": 467264, "epoch": 2781} {"train_loss": -12.592636108398438, "global_step": 467265, "epoch": 2781} {"train_loss": -12.365233421325684, "global_step": 467266, "epoch": 2781} {"train_loss": -12.648635864257812, "global_step": 467267, "epoch": 2781} {"train_loss": -12.252565383911133, "global_step": 467268, "epoch": 2781} {"train_loss": -12.522209167480469, "global_step": 467269, "epoch": 2781} {"train_loss": -12.62496566772461, "global_step": 467270, "epoch": 2781} {"train_loss": -12.400491714477539, "global_step": 467271, "epoch": 2781} {"train_loss": -12.454513549804688, "global_step": 467272, "epoch": 2781} {"train_loss": -12.835172653198242, "global_step": 467273, "epoch": 2781} {"train_loss": -12.487933158874512, "global_step": 467274, "epoch": 2781} {"train_loss": -12.461907386779785, "global_step": 467275, "epoch": 2781} {"train_loss": -11.9866304397583, "global_step": 467276, "epoch": 2781} {"train_loss": -12.686187744140625, "global_step": 467277, "epoch": 2781} {"train_loss": -12.154688835144043, "global_step": 467278, "epoch": 2781} {"train_loss": -12.768543243408203, "global_step": 467279, "epoch": 2781} {"train_loss": -12.596476554870605, "global_step": 467280, "epoch": 2781} {"train_loss": -12.856792449951172, "global_step": 467281, "epoch": 2781} {"train_loss": -12.478059768676758, "global_step": 467282, "epoch": 2781} {"train_loss": -12.763960838317871, "global_step": 467283, "epoch": 2781} {"train_loss": -12.586259841918945, "global_step": 467284, "epoch": 2781} {"train_loss": -12.377742767333984, "global_step": 467285, "epoch": 2781} {"train_loss": -12.488619804382324, "global_step": 467286, "epoch": 2781} {"train_loss": -12.617209434509277, "global_step": 467287, "epoch": 2781} {"train_loss": -12.397964477539062, "global_step": 467288, "epoch": 2781} {"train_loss": -12.447914123535156, "global_step": 467289, "epoch": 2781} {"train_loss": -11.983101844787598, "global_step": 467290, "epoch": 2781} {"train_loss": -12.346427917480469, "global_step": 467291, "epoch": 2781} {"train_loss": -12.629745483398438, "global_step": 467292, "epoch": 2781} {"train_loss": -12.122993469238281, "global_step": 467293, "epoch": 2781} {"train_loss": -12.081886291503906, "global_step": 467294, "epoch": 2781} {"train_loss": -12.713215827941895, "global_step": 467295, "epoch": 2781} {"train_loss": -12.25407886505127, "global_step": 467296, "epoch": 2781} {"train_loss": -12.8333158493042, "global_step": 467297, "epoch": 2781} {"train_loss": -12.291021347045898, "global_step": 467298, "epoch": 2781} {"train_loss": -12.138956069946289, "global_step": 467299, "epoch": 2781} {"train_loss": -12.641375541687012, "global_step": 467300, "epoch": 2781} {"train_loss": -12.284225463867188, "global_step": 467301, "epoch": 2781} {"train_loss": -12.581901550292969, "global_step": 467302, "epoch": 2781} {"train_loss": -12.528666496276855, "global_step": 467303, "epoch": 2781} {"train_loss": -12.535306930541992, "global_step": 467304, "epoch": 2781} {"train_loss": -12.01302719116211, "global_step": 467305, "epoch": 2781} {"train_loss": -12.163002014160156, "global_step": 467306, "epoch": 2781} {"train_loss": -10.626470565795898, "global_step": 467307, "epoch": 2781} {"train_loss": -11.435722351074219, "global_step": 467308, "epoch": 2781} {"train_loss": -11.85627555847168, "global_step": 467309, "epoch": 2781} {"train_loss": -11.566566467285156, "global_step": 467310, "epoch": 2781} {"train_loss": -12.039429664611816, "global_step": 467311, "epoch": 2781} {"train_loss": -11.101402282714844, "global_step": 467312, "epoch": 2781} {"train_loss": -12.33137321472168, "global_step": 467313, "epoch": 2781} {"train_loss": -11.631850242614746, "global_step": 467314, "epoch": 2781} {"train_loss": -12.831235885620117, "global_step": 467315, "epoch": 2781} {"train_loss": -11.265464782714844, "global_step": 467316, "epoch": 2781} {"train_loss": -12.556720733642578, "global_step": 467317, "epoch": 2781} {"train_loss": -12.279799461364746, "global_step": 467318, "epoch": 2781} {"train_loss": -12.786800384521484, "global_step": 467319, "epoch": 2781} {"train_loss": -11.883447647094727, "global_step": 467320, "epoch": 2781} {"train_loss": -12.506603240966797, "global_step": 467321, "epoch": 2781} {"train_loss": -12.016839981079102, "global_step": 467322, "epoch": 2781} {"train_loss": -11.62860107421875, "global_step": 467323, "epoch": 2781} {"train_loss": -12.359667778015137, "global_step": 467324, "epoch": 2781} {"train_loss": -11.822463989257812, "global_step": 467325, "epoch": 2781} {"train_loss": -12.473803520202637, "global_step": 467326, "epoch": 2781} {"train_loss": -12.167902946472168, "global_step": 467327, "epoch": 2781} {"train_loss": -12.335238456726074, "global_step": 467328, "epoch": 2781} {"train_loss": -12.388553619384766, "global_step": 467329, "epoch": 2781} {"train_loss": -11.908576965332031, "global_step": 467330, "epoch": 2781} {"train_loss": -12.031545639038086, "global_step": 467331, "epoch": 2781} {"train_loss": -11.375391960144043, "global_step": 467332, "epoch": 2781} {"train_loss": -10.862556457519531, "global_step": 467333, "epoch": 2781} {"train_loss": -11.776247024536133, "global_step": 467334, "epoch": 2781} {"train_loss": -11.109521865844727, "global_step": 467335, "epoch": 2781} {"train_loss": -11.998527526855469, "global_step": 467336, "epoch": 2781} {"train_loss": -10.941080093383789, "global_step": 467337, "epoch": 2781} {"train_loss": -11.762429237365723, "global_step": 467338, "epoch": 2781} {"train_loss": -11.195178985595703, "global_step": 467339, "epoch": 2781} {"train_loss": -11.196248054504395, "global_step": 467340, "epoch": 2781} {"train_loss": -11.580784797668457, "global_step": 467341, "epoch": 2781} {"train_loss": -11.31710433959961, "global_step": 467342, "epoch": 2781} {"train_loss": -11.561422348022461, "global_step": 467343, "epoch": 2781} {"train_loss": -11.17273998260498, "global_step": 467344, "epoch": 2781} {"train_loss": -12.397759437561035, "global_step": 467345, "epoch": 2781} {"train_loss": -10.664172172546387, "global_step": 467346, "epoch": 2781} {"train_loss": -11.804706573486328, "global_step": 467347, "epoch": 2781} {"train_loss": -10.653829574584961, "global_step": 467348, "epoch": 2781} {"train_loss": -11.796624183654785, "global_step": 467349, "epoch": 2781} {"train_loss": -10.607877731323242, "global_step": 467350, "epoch": 2781} {"train_loss": -11.458524703979492, "global_step": 467351, "epoch": 2781} {"train_loss": -11.761390686035156, "global_step": 467352, "epoch": 2781} {"train_loss": -11.37125015258789, "global_step": 467353, "epoch": 2781} {"train_loss": -11.983013153076172, "global_step": 467354, "epoch": 2781} {"train_loss": -11.147974014282227, "global_step": 467355, "epoch": 2781} {"train_loss": -11.745011329650879, "global_step": 467356, "epoch": 2781} {"train_loss": -11.2514009475708, "global_step": 467357, "epoch": 2781} {"train_loss": -11.562299728393555, "global_step": 467358, "epoch": 2781} {"train_loss": -12.036590576171875, "global_step": 467359, "epoch": 2781} {"train_loss": -11.712808609008789, "global_step": 467360, "epoch": 2781} {"train_loss": -12.187421798706055, "global_step": 467361, "epoch": 2781} {"train_loss": -11.343501091003418, "global_step": 467362, "epoch": 2781} {"train_loss": -12.359050750732422, "global_step": 467363, "epoch": 2781} {"train_loss": -11.614776611328125, "global_step": 467364, "epoch": 2781} {"train_loss": -11.728046417236328, "global_step": 467365, "epoch": 2781} {"train_loss": -11.737898826599121, "global_step": 467366, "epoch": 2781} {"train_loss": -11.75808048248291, "global_step": 467367, "epoch": 2781} {"train_loss": -12.009354591369629, "global_step": 467368, "epoch": 2781} {"train_loss": -12.052928924560547, "global_step": 467369, "epoch": 2781} {"train_loss": -11.923385620117188, "global_step": 467370, "epoch": 2781} {"train_loss": -11.837186813354492, "global_step": 467371, "epoch": 2781} {"train_loss": -11.847616195678711, "global_step": 467372, "epoch": 2781} {"train_loss": -11.889039993286133, "global_step": 467373, "epoch": 2781} {"train_loss": -12.117956161499023, "global_step": 467374, "epoch": 2781} {"train_loss": -12.136265618460518, "global_step": 467375, "epoch": 2781, "val_loss": 313987.875} {"train_loss": -12.216346740722656, "global_step": 467376, "epoch": 2782} {"train_loss": -12.014832496643066, "global_step": 467377, "epoch": 2782} {"train_loss": -12.496199607849121, "global_step": 467378, "epoch": 2782} {"train_loss": -12.36343765258789, "global_step": 467379, "epoch": 2782} {"train_loss": -12.2592191696167, "global_step": 467380, "epoch": 2782} {"train_loss": -12.566057205200195, "global_step": 467381, "epoch": 2782} {"train_loss": -12.110893249511719, "global_step": 467382, "epoch": 2782} {"train_loss": -12.551332473754883, "global_step": 467383, "epoch": 2782} {"train_loss": -12.27035140991211, "global_step": 467384, "epoch": 2782} {"train_loss": -12.520309448242188, "global_step": 467385, "epoch": 2782} {"train_loss": -12.146108627319336, "global_step": 467386, "epoch": 2782} {"train_loss": -12.471017837524414, "global_step": 467387, "epoch": 2782} {"train_loss": -12.41869831085205, "global_step": 467388, "epoch": 2782} {"train_loss": -12.421804428100586, "global_step": 467389, "epoch": 2782} {"train_loss": -12.648387908935547, "global_step": 467390, "epoch": 2782} {"train_loss": -12.633219718933105, "global_step": 467391, "epoch": 2782} {"train_loss": -12.470287322998047, "global_step": 467392, "epoch": 2782} {"train_loss": -12.593062400817871, "global_step": 467393, "epoch": 2782} {"train_loss": -12.650252342224121, "global_step": 467394, "epoch": 2782} {"train_loss": -12.285154342651367, "global_step": 467395, "epoch": 2782} {"train_loss": -12.64787483215332, "global_step": 467396, "epoch": 2782} {"train_loss": -12.485322952270508, "global_step": 467397, "epoch": 2782} {"train_loss": -12.584881782531738, "global_step": 467398, "epoch": 2782} {"train_loss": -12.42384147644043, "global_step": 467399, "epoch": 2782} {"train_loss": -12.403478622436523, "global_step": 467400, "epoch": 2782} {"train_loss": -12.500316619873047, "global_step": 467401, "epoch": 2782} {"train_loss": -12.45906925201416, "global_step": 467402, "epoch": 2782} {"train_loss": -12.4817533493042, "global_step": 467403, "epoch": 2782} {"train_loss": -12.393683433532715, "global_step": 467404, "epoch": 2782} {"train_loss": -12.672996520996094, "global_step": 467405, "epoch": 2782} {"train_loss": -12.434633255004883, "global_step": 467406, "epoch": 2782} {"train_loss": -12.443558692932129, "global_step": 467407, "epoch": 2782} {"train_loss": -12.453124046325684, "global_step": 467408, "epoch": 2782} {"train_loss": -12.437397956848145, "global_step": 467409, "epoch": 2782} {"train_loss": -12.36343765258789, "global_step": 467410, "epoch": 2782} {"train_loss": -12.6535062789917, "global_step": 467411, "epoch": 2782} {"train_loss": -12.201953887939453, "global_step": 467412, "epoch": 2782} {"train_loss": -12.644164085388184, "global_step": 467413, "epoch": 2782} {"train_loss": -12.637893676757812, "global_step": 467414, "epoch": 2782} {"train_loss": -12.523666381835938, "global_step": 467415, "epoch": 2782} {"train_loss": -12.591474533081055, "global_step": 467416, "epoch": 2782} {"train_loss": -11.967376708984375, "global_step": 467417, "epoch": 2782} {"train_loss": -12.779245376586914, "global_step": 467418, "epoch": 2782} {"train_loss": -12.130550384521484, "global_step": 467419, "epoch": 2782} {"train_loss": -12.41868782043457, "global_step": 467420, "epoch": 2782} {"train_loss": -12.276409149169922, "global_step": 467421, "epoch": 2782} {"train_loss": -12.108145713806152, "global_step": 467422, "epoch": 2782} {"train_loss": -12.494738578796387, "global_step": 467423, "epoch": 2782} {"train_loss": -12.267227172851562, "global_step": 467424, "epoch": 2782} {"train_loss": -12.446382522583008, "global_step": 467425, "epoch": 2782} {"train_loss": -12.14632797241211, "global_step": 467426, "epoch": 2782} {"train_loss": -11.602365493774414, "global_step": 467427, "epoch": 2782} {"train_loss": -12.542451858520508, "global_step": 467428, "epoch": 2782} {"train_loss": -12.324105262756348, "global_step": 467429, "epoch": 2782} {"train_loss": -12.368310928344727, "global_step": 467430, "epoch": 2782} {"train_loss": -12.449499130249023, "global_step": 467431, "epoch": 2782} {"train_loss": -11.977487564086914, "global_step": 467432, "epoch": 2782} {"train_loss": -12.714479446411133, "global_step": 467433, "epoch": 2782} {"train_loss": -12.085311889648438, "global_step": 467434, "epoch": 2782} {"train_loss": -12.727972030639648, "global_step": 467435, "epoch": 2782} {"train_loss": -11.934846878051758, "global_step": 467436, "epoch": 2782} {"train_loss": -12.734768867492676, "global_step": 467437, "epoch": 2782} {"train_loss": -12.084495544433594, "global_step": 467438, "epoch": 2782} {"train_loss": -12.277090072631836, "global_step": 467439, "epoch": 2782} {"train_loss": -12.460824966430664, "global_step": 467440, "epoch": 2782} {"train_loss": -12.035444259643555, "global_step": 467441, "epoch": 2782} {"train_loss": -12.777908325195312, "global_step": 467442, "epoch": 2782} {"train_loss": -11.90674114227295, "global_step": 467443, "epoch": 2782} {"train_loss": -12.672876358032227, "global_step": 467444, "epoch": 2782} {"train_loss": -11.953813552856445, "global_step": 467445, "epoch": 2782} {"train_loss": -12.637757301330566, "global_step": 467446, "epoch": 2782} {"train_loss": -12.282474517822266, "global_step": 467447, "epoch": 2782} {"train_loss": -12.645474433898926, "global_step": 467448, "epoch": 2782} {"train_loss": -12.79003620147705, "global_step": 467449, "epoch": 2782} {"train_loss": -12.206494331359863, "global_step": 467450, "epoch": 2782} {"train_loss": -12.912188529968262, "global_step": 467451, "epoch": 2782} {"train_loss": -12.304096221923828, "global_step": 467452, "epoch": 2782} {"train_loss": -12.641439437866211, "global_step": 467453, "epoch": 2782} {"train_loss": -12.380191802978516, "global_step": 467454, "epoch": 2782} {"train_loss": -12.651138305664062, "global_step": 467455, "epoch": 2782} {"train_loss": -12.474123001098633, "global_step": 467456, "epoch": 2782} {"train_loss": -12.231402397155762, "global_step": 467457, "epoch": 2782} {"train_loss": -12.816463470458984, "global_step": 467458, "epoch": 2782} {"train_loss": -12.293712615966797, "global_step": 467459, "epoch": 2782} {"train_loss": -12.691917419433594, "global_step": 467460, "epoch": 2782} {"train_loss": -12.178207397460938, "global_step": 467461, "epoch": 2782} {"train_loss": -12.54114055633545, "global_step": 467462, "epoch": 2782} {"train_loss": -12.276697158813477, "global_step": 467463, "epoch": 2782} {"train_loss": -12.459135055541992, "global_step": 467464, "epoch": 2782} {"train_loss": -12.469226837158203, "global_step": 467465, "epoch": 2782} {"train_loss": -12.4503173828125, "global_step": 467466, "epoch": 2782} {"train_loss": -12.400186538696289, "global_step": 467467, "epoch": 2782} {"train_loss": -12.47372055053711, "global_step": 467468, "epoch": 2782} {"train_loss": -12.371112823486328, "global_step": 467469, "epoch": 2782} {"train_loss": -12.894824981689453, "global_step": 467470, "epoch": 2782} {"train_loss": -12.282947540283203, "global_step": 467471, "epoch": 2782} {"train_loss": -12.264592170715332, "global_step": 467472, "epoch": 2782} {"train_loss": -12.236028671264648, "global_step": 467473, "epoch": 2782} {"train_loss": -12.345508575439453, "global_step": 467474, "epoch": 2782} {"train_loss": -11.430012702941895, "global_step": 467475, "epoch": 2782} {"train_loss": -11.724531173706055, "global_step": 467476, "epoch": 2782} {"train_loss": -11.667888641357422, "global_step": 467477, "epoch": 2782} {"train_loss": -12.086040496826172, "global_step": 467478, "epoch": 2782} {"train_loss": -11.803838729858398, "global_step": 467479, "epoch": 2782} {"train_loss": -11.62913703918457, "global_step": 467480, "epoch": 2782} {"train_loss": -11.767236709594727, "global_step": 467481, "epoch": 2782} {"train_loss": -11.979879379272461, "global_step": 467482, "epoch": 2782} {"train_loss": -12.000945091247559, "global_step": 467483, "epoch": 2782} {"train_loss": -11.651664733886719, "global_step": 467484, "epoch": 2782} {"train_loss": -11.851237297058105, "global_step": 467485, "epoch": 2782} {"train_loss": -11.622150421142578, "global_step": 467486, "epoch": 2782} {"train_loss": -12.185323715209961, "global_step": 467487, "epoch": 2782} {"train_loss": -11.201467514038086, "global_step": 467488, "epoch": 2782} {"train_loss": -12.727787017822266, "global_step": 467489, "epoch": 2782} {"train_loss": -11.679311752319336, "global_step": 467490, "epoch": 2782} {"train_loss": -12.556364059448242, "global_step": 467491, "epoch": 2782} {"train_loss": -11.702585220336914, "global_step": 467492, "epoch": 2782} {"train_loss": -12.639195442199707, "global_step": 467493, "epoch": 2782} {"train_loss": -11.993377685546875, "global_step": 467494, "epoch": 2782} {"train_loss": -12.440290451049805, "global_step": 467495, "epoch": 2782} {"train_loss": -11.403145790100098, "global_step": 467496, "epoch": 2782} {"train_loss": -12.10302734375, "global_step": 467497, "epoch": 2782} {"train_loss": -12.112367630004883, "global_step": 467498, "epoch": 2782} {"train_loss": -12.158506393432617, "global_step": 467499, "epoch": 2782} {"train_loss": -12.089815139770508, "global_step": 467500, "epoch": 2782} {"train_loss": -12.326980590820312, "global_step": 467501, "epoch": 2782} {"train_loss": -12.391024589538574, "global_step": 467502, "epoch": 2782} {"train_loss": -12.268463134765625, "global_step": 467503, "epoch": 2782} {"train_loss": -12.514932632446289, "global_step": 467504, "epoch": 2782} {"train_loss": -12.124191284179688, "global_step": 467505, "epoch": 2782} {"train_loss": -12.716983795166016, "global_step": 467506, "epoch": 2782} {"train_loss": -12.805573463439941, "global_step": 467507, "epoch": 2782} {"train_loss": -12.505595207214355, "global_step": 467508, "epoch": 2782} {"train_loss": -12.686915397644043, "global_step": 467509, "epoch": 2782} {"train_loss": -12.583330154418945, "global_step": 467510, "epoch": 2782} {"train_loss": -12.70704460144043, "global_step": 467511, "epoch": 2782} {"train_loss": -12.666888236999512, "global_step": 467512, "epoch": 2782} {"train_loss": -12.326648712158203, "global_step": 467513, "epoch": 2782} {"train_loss": -12.741242408752441, "global_step": 467514, "epoch": 2782} {"train_loss": -12.345717430114746, "global_step": 467515, "epoch": 2782} {"train_loss": -12.755945205688477, "global_step": 467516, "epoch": 2782} {"train_loss": -12.53055191040039, "global_step": 467517, "epoch": 2782} {"train_loss": -12.403936386108398, "global_step": 467518, "epoch": 2782} {"train_loss": -12.564200401306152, "global_step": 467519, "epoch": 2782} {"train_loss": -12.478706359863281, "global_step": 467520, "epoch": 2782} {"train_loss": -12.678129196166992, "global_step": 467521, "epoch": 2782} {"train_loss": -12.592399597167969, "global_step": 467522, "epoch": 2782} {"train_loss": -12.797698020935059, "global_step": 467523, "epoch": 2782} {"train_loss": -12.538567543029785, "global_step": 467524, "epoch": 2782} {"train_loss": -12.633702278137207, "global_step": 467525, "epoch": 2782} {"train_loss": -12.679911613464355, "global_step": 467526, "epoch": 2782} {"train_loss": -12.395142555236816, "global_step": 467527, "epoch": 2782} {"train_loss": -12.647459030151367, "global_step": 467528, "epoch": 2782} {"train_loss": -12.647950172424316, "global_step": 467529, "epoch": 2782} {"train_loss": -12.67540168762207, "global_step": 467530, "epoch": 2782} {"train_loss": -12.703939437866211, "global_step": 467531, "epoch": 2782} {"train_loss": -12.948505401611328, "global_step": 467532, "epoch": 2782} {"train_loss": -12.603336334228516, "global_step": 467533, "epoch": 2782} {"train_loss": -13.008079528808594, "global_step": 467534, "epoch": 2782} {"train_loss": -12.647860527038574, "global_step": 467535, "epoch": 2782} {"train_loss": -12.87981128692627, "global_step": 467536, "epoch": 2782} {"train_loss": -12.972925186157227, "global_step": 467537, "epoch": 2782} {"train_loss": -12.826908111572266, "global_step": 467538, "epoch": 2782} {"train_loss": -12.883718490600586, "global_step": 467539, "epoch": 2782} {"train_loss": -12.721747398376465, "global_step": 467540, "epoch": 2782} {"train_loss": -12.893972396850586, "global_step": 467541, "epoch": 2782} {"train_loss": -12.802200317382812, "global_step": 467542, "epoch": 2782} {"train_loss": -12.39552470615932, "global_step": 467543, "epoch": 2782, "val_loss": 312984.25} {"train_loss": -12.515033721923828, "global_step": 467544, "epoch": 2783} {"train_loss": -12.572320938110352, "global_step": 467545, "epoch": 2783} {"train_loss": -12.826601028442383, "global_step": 467546, "epoch": 2783} {"train_loss": -12.690157890319824, "global_step": 467547, "epoch": 2783} {"train_loss": -12.819086074829102, "global_step": 467548, "epoch": 2783} {"train_loss": -12.919404029846191, "global_step": 467549, "epoch": 2783} {"train_loss": -12.832901000976562, "global_step": 467550, "epoch": 2783} {"train_loss": -12.494623184204102, "global_step": 467551, "epoch": 2783} {"train_loss": -12.60916519165039, "global_step": 467552, "epoch": 2783} {"train_loss": -12.457025527954102, "global_step": 467553, "epoch": 2783} {"train_loss": -12.21613597869873, "global_step": 467554, "epoch": 2783} {"train_loss": -12.336856842041016, "global_step": 467555, "epoch": 2783} {"train_loss": -12.724903106689453, "global_step": 467556, "epoch": 2783} {"train_loss": -12.958837509155273, "global_step": 467557, "epoch": 2783} {"train_loss": -12.439962387084961, "global_step": 467558, "epoch": 2783} {"train_loss": -12.511375427246094, "global_step": 467559, "epoch": 2783} {"train_loss": -12.808115005493164, "global_step": 467560, "epoch": 2783} {"train_loss": -12.717451095581055, "global_step": 467561, "epoch": 2783} {"train_loss": -12.543342590332031, "global_step": 467562, "epoch": 2783} {"train_loss": -12.754888534545898, "global_step": 467563, "epoch": 2783} {"train_loss": -12.209815979003906, "global_step": 467564, "epoch": 2783} {"train_loss": -11.899654388427734, "global_step": 467565, "epoch": 2783} {"train_loss": -11.931171417236328, "global_step": 467566, "epoch": 2783} {"train_loss": -12.15806770324707, "global_step": 467567, "epoch": 2783} {"train_loss": -12.550265312194824, "global_step": 467568, "epoch": 2783} {"train_loss": -12.109026908874512, "global_step": 467569, "epoch": 2783} {"train_loss": -11.475969314575195, "global_step": 467570, "epoch": 2783} {"train_loss": -12.025514602661133, "global_step": 467571, "epoch": 2783} {"train_loss": -12.678487777709961, "global_step": 467572, "epoch": 2783} {"train_loss": -11.90298080444336, "global_step": 467573, "epoch": 2783} {"train_loss": -11.752898216247559, "global_step": 467574, "epoch": 2783} {"train_loss": -12.366323471069336, "global_step": 467575, "epoch": 2783} {"train_loss": -12.03813362121582, "global_step": 467576, "epoch": 2783} {"train_loss": -12.324085235595703, "global_step": 467577, "epoch": 2783} {"train_loss": -11.351641654968262, "global_step": 467578, "epoch": 2783} {"train_loss": -12.231521606445312, "global_step": 467579, "epoch": 2783} {"train_loss": -12.071052551269531, "global_step": 467580, "epoch": 2783} {"train_loss": -11.860681533813477, "global_step": 467581, "epoch": 2783} {"train_loss": -12.152694702148438, "global_step": 467582, "epoch": 2783} {"train_loss": -11.021463394165039, "global_step": 467583, "epoch": 2783} {"train_loss": -10.882291793823242, "global_step": 467584, "epoch": 2783} {"train_loss": -12.075945854187012, "global_step": 467585, "epoch": 2783} {"train_loss": -10.125858306884766, "global_step": 467586, "epoch": 2783} {"train_loss": -12.006453514099121, "global_step": 467587, "epoch": 2783} {"train_loss": -10.719608306884766, "global_step": 467588, "epoch": 2783} {"train_loss": -11.804476737976074, "global_step": 467589, "epoch": 2783} {"train_loss": -9.993785858154297, "global_step": 467590, "epoch": 2783} {"train_loss": -10.646928787231445, "global_step": 467591, "epoch": 2783} {"train_loss": -11.653772354125977, "global_step": 467592, "epoch": 2783} {"train_loss": -9.731328964233398, "global_step": 467593, "epoch": 2783} {"train_loss": -10.806804656982422, "global_step": 467594, "epoch": 2783} {"train_loss": -8.316262245178223, "global_step": 467595, "epoch": 2783} {"train_loss": -9.311442375183105, "global_step": 467596, "epoch": 2783} {"train_loss": -8.615497589111328, "global_step": 467597, "epoch": 2783} {"train_loss": -7.602865695953369, "global_step": 467598, "epoch": 2783} {"train_loss": -8.437408447265625, "global_step": 467599, "epoch": 2783} {"train_loss": -10.321107864379883, "global_step": 467600, "epoch": 2783} {"train_loss": -8.714193344116211, "global_step": 467601, "epoch": 2783} {"train_loss": -9.557405471801758, "global_step": 467602, "epoch": 2783} {"train_loss": -9.158391952514648, "global_step": 467603, "epoch": 2783} {"train_loss": -10.26727294921875, "global_step": 467604, "epoch": 2783} {"train_loss": -10.135181427001953, "global_step": 467605, "epoch": 2783} {"train_loss": -11.439895629882812, "global_step": 467606, "epoch": 2783} {"train_loss": -10.748891830444336, "global_step": 467607, "epoch": 2783} {"train_loss": -10.354475975036621, "global_step": 467608, "epoch": 2783} {"train_loss": -11.574764251708984, "global_step": 467609, "epoch": 2783} {"train_loss": -11.366060256958008, "global_step": 467610, "epoch": 2783} {"train_loss": -11.851846694946289, "global_step": 467611, "epoch": 2783} {"train_loss": -11.942089080810547, "global_step": 467612, "epoch": 2783} {"train_loss": -11.697954177856445, "global_step": 467613, "epoch": 2783} {"train_loss": -12.15239143371582, "global_step": 467614, "epoch": 2783} {"train_loss": -11.708805084228516, "global_step": 467615, "epoch": 2783} {"train_loss": -11.974759101867676, "global_step": 467616, "epoch": 2783} {"train_loss": -11.838441848754883, "global_step": 467617, "epoch": 2783} {"train_loss": -12.196752548217773, "global_step": 467618, "epoch": 2783} {"train_loss": -11.94014835357666, "global_step": 467619, "epoch": 2783} {"train_loss": -11.755657196044922, "global_step": 467620, "epoch": 2783} {"train_loss": -11.975785255432129, "global_step": 467621, "epoch": 2783} {"train_loss": -11.98531723022461, "global_step": 467622, "epoch": 2783} {"train_loss": -12.429141998291016, "global_step": 467623, "epoch": 2783} {"train_loss": -12.07929801940918, "global_step": 467624, "epoch": 2783} {"train_loss": -12.53911018371582, "global_step": 467625, "epoch": 2783} {"train_loss": -12.106163024902344, "global_step": 467626, "epoch": 2783} {"train_loss": -12.34896469116211, "global_step": 467627, "epoch": 2783} {"train_loss": -12.367209434509277, "global_step": 467628, "epoch": 2783} {"train_loss": -12.44007682800293, "global_step": 467629, "epoch": 2783} {"train_loss": -12.253728866577148, "global_step": 467630, "epoch": 2783} {"train_loss": -12.198967933654785, "global_step": 467631, "epoch": 2783} {"train_loss": -12.361437797546387, "global_step": 467632, "epoch": 2783} {"train_loss": -12.312651634216309, "global_step": 467633, "epoch": 2783} {"train_loss": -12.235507011413574, "global_step": 467634, "epoch": 2783} {"train_loss": -12.379919052124023, "global_step": 467635, "epoch": 2783} {"train_loss": -12.615196228027344, "global_step": 467636, "epoch": 2783} {"train_loss": -12.441106796264648, "global_step": 467637, "epoch": 2783} {"train_loss": -12.482882499694824, "global_step": 467638, "epoch": 2783} {"train_loss": -12.38464069366455, "global_step": 467639, "epoch": 2783} {"train_loss": -12.415925979614258, "global_step": 467640, "epoch": 2783} {"train_loss": -12.435243606567383, "global_step": 467641, "epoch": 2783} {"train_loss": -12.002558708190918, "global_step": 467642, "epoch": 2783} {"train_loss": -12.517890930175781, "global_step": 467643, "epoch": 2783} {"train_loss": -12.179117202758789, "global_step": 467644, "epoch": 2783} {"train_loss": -12.590198516845703, "global_step": 467645, "epoch": 2783} {"train_loss": -11.93517017364502, "global_step": 467646, "epoch": 2783} {"train_loss": -12.543497085571289, "global_step": 467647, "epoch": 2783} {"train_loss": -12.367806434631348, "global_step": 467648, "epoch": 2783} {"train_loss": -12.103009223937988, "global_step": 467649, "epoch": 2783} {"train_loss": -12.480428695678711, "global_step": 467650, "epoch": 2783} {"train_loss": -12.3035888671875, "global_step": 467651, "epoch": 2783} {"train_loss": -12.471850395202637, "global_step": 467652, "epoch": 2783} {"train_loss": -12.478629112243652, "global_step": 467653, "epoch": 2783} {"train_loss": -12.16933822631836, "global_step": 467654, "epoch": 2783} {"train_loss": -12.624490737915039, "global_step": 467655, "epoch": 2783} {"train_loss": -12.238130569458008, "global_step": 467656, "epoch": 2783} {"train_loss": -12.47558879852295, "global_step": 467657, "epoch": 2783} {"train_loss": -12.534313201904297, "global_step": 467658, "epoch": 2783} {"train_loss": -12.207769393920898, "global_step": 467659, "epoch": 2783} {"train_loss": -12.248435974121094, "global_step": 467660, "epoch": 2783} {"train_loss": -12.41352653503418, "global_step": 467661, "epoch": 2783} {"train_loss": -12.0612211227417, "global_step": 467662, "epoch": 2783} {"train_loss": -12.137975692749023, "global_step": 467663, "epoch": 2783} {"train_loss": -12.100593566894531, "global_step": 467664, "epoch": 2783} {"train_loss": -12.120199203491211, "global_step": 467665, "epoch": 2783} {"train_loss": -12.293754577636719, "global_step": 467666, "epoch": 2783} {"train_loss": -12.141127586364746, "global_step": 467667, "epoch": 2783} {"train_loss": -12.628209114074707, "global_step": 467668, "epoch": 2783} {"train_loss": -12.199825286865234, "global_step": 467669, "epoch": 2783} {"train_loss": -12.41617202758789, "global_step": 467670, "epoch": 2783} {"train_loss": -12.114775657653809, "global_step": 467671, "epoch": 2783} {"train_loss": -12.60198974609375, "global_step": 467672, "epoch": 2783} {"train_loss": -12.458990097045898, "global_step": 467673, "epoch": 2783} {"train_loss": -12.061417579650879, "global_step": 467674, "epoch": 2783} {"train_loss": -12.308337211608887, "global_step": 467675, "epoch": 2783} {"train_loss": -12.024430274963379, "global_step": 467676, "epoch": 2783} {"train_loss": -12.31940746307373, "global_step": 467677, "epoch": 2783} {"train_loss": -12.558176040649414, "global_step": 467678, "epoch": 2783} {"train_loss": -11.781469345092773, "global_step": 467679, "epoch": 2783} {"train_loss": -12.44876480102539, "global_step": 467680, "epoch": 2783} {"train_loss": -12.55068588256836, "global_step": 467681, "epoch": 2783} {"train_loss": -12.505510330200195, "global_step": 467682, "epoch": 2783} {"train_loss": -12.476045608520508, "global_step": 467683, "epoch": 2783} {"train_loss": -12.445022583007812, "global_step": 467684, "epoch": 2783} {"train_loss": -12.558012962341309, "global_step": 467685, "epoch": 2783} {"train_loss": -12.39754867553711, "global_step": 467686, "epoch": 2783} {"train_loss": -12.517470359802246, "global_step": 467687, "epoch": 2783} {"train_loss": -12.461965560913086, "global_step": 467688, "epoch": 2783} {"train_loss": -12.195091247558594, "global_step": 467689, "epoch": 2783} {"train_loss": -12.447568893432617, "global_step": 467690, "epoch": 2783} {"train_loss": -12.1757230758667, "global_step": 467691, "epoch": 2783} {"train_loss": -12.372482299804688, "global_step": 467692, "epoch": 2783} {"train_loss": -12.369393348693848, "global_step": 467693, "epoch": 2783} {"train_loss": -12.249443054199219, "global_step": 467694, "epoch": 2783} {"train_loss": -12.342723846435547, "global_step": 467695, "epoch": 2783} {"train_loss": -12.7474946975708, "global_step": 467696, "epoch": 2783} {"train_loss": -12.699934005737305, "global_step": 467697, "epoch": 2783} {"train_loss": -12.822491645812988, "global_step": 467698, "epoch": 2783} {"train_loss": -12.380910873413086, "global_step": 467699, "epoch": 2783} {"train_loss": -12.56754207611084, "global_step": 467700, "epoch": 2783} {"train_loss": -11.997357368469238, "global_step": 467701, "epoch": 2783} {"train_loss": -12.449681282043457, "global_step": 467702, "epoch": 2783} {"train_loss": -12.239137649536133, "global_step": 467703, "epoch": 2783} {"train_loss": -12.085861206054688, "global_step": 467704, "epoch": 2783} {"train_loss": -12.29037857055664, "global_step": 467705, "epoch": 2783} {"train_loss": -12.18340015411377, "global_step": 467706, "epoch": 2783} {"train_loss": -12.27409553527832, "global_step": 467707, "epoch": 2783} {"train_loss": -11.39957332611084, "global_step": 467708, "epoch": 2783} {"train_loss": -12.172004699707031, "global_step": 467709, "epoch": 2783} {"train_loss": -11.424127578735352, "global_step": 467710, "epoch": 2783} {"train_loss": -11.954124850886208, "global_step": 467711, "epoch": 2783, "val_loss": 317656.34375} {"train_loss": -10.701480865478516, "global_step": 467712, "epoch": 2784} {"train_loss": -10.708724975585938, "global_step": 467713, "epoch": 2784} {"train_loss": -12.168659210205078, "global_step": 467714, "epoch": 2784} {"train_loss": -11.308913230895996, "global_step": 467715, "epoch": 2784} {"train_loss": -11.24356746673584, "global_step": 467716, "epoch": 2784} {"train_loss": -11.978904724121094, "global_step": 467717, "epoch": 2784} {"train_loss": -10.685880661010742, "global_step": 467718, "epoch": 2784} {"train_loss": -11.495203018188477, "global_step": 467719, "epoch": 2784} {"train_loss": -12.00474739074707, "global_step": 467720, "epoch": 2784} {"train_loss": -10.121685981750488, "global_step": 467721, "epoch": 2784} {"train_loss": -12.596482276916504, "global_step": 467722, "epoch": 2784} {"train_loss": -11.7133150100708, "global_step": 467723, "epoch": 2784} {"train_loss": -11.678433418273926, "global_step": 467724, "epoch": 2784} {"train_loss": -12.623873710632324, "global_step": 467725, "epoch": 2784} {"train_loss": -11.256132125854492, "global_step": 467726, "epoch": 2784} {"train_loss": -12.122812271118164, "global_step": 467727, "epoch": 2784} {"train_loss": -12.000662803649902, "global_step": 467728, "epoch": 2784} {"train_loss": -12.022966384887695, "global_step": 467729, "epoch": 2784} {"train_loss": -12.34939193725586, "global_step": 467730, "epoch": 2784} {"train_loss": -12.264732360839844, "global_step": 467731, "epoch": 2784} {"train_loss": -12.255168914794922, "global_step": 467732, "epoch": 2784} {"train_loss": -12.078350067138672, "global_step": 467733, "epoch": 2784} {"train_loss": -12.061954498291016, "global_step": 467734, "epoch": 2784} {"train_loss": -12.367015838623047, "global_step": 467735, "epoch": 2784} {"train_loss": -12.239654541015625, "global_step": 467736, "epoch": 2784} {"train_loss": -12.6064453125, "global_step": 467737, "epoch": 2784} {"train_loss": -12.427478790283203, "global_step": 467738, "epoch": 2784} {"train_loss": -12.7967529296875, "global_step": 467739, "epoch": 2784} {"train_loss": -12.553962707519531, "global_step": 467740, "epoch": 2784} {"train_loss": -12.35694408416748, "global_step": 467741, "epoch": 2784} {"train_loss": -12.527591705322266, "global_step": 467742, "epoch": 2784} {"train_loss": -12.314111709594727, "global_step": 467743, "epoch": 2784} {"train_loss": -12.657389640808105, "global_step": 467744, "epoch": 2784} {"train_loss": -12.760030746459961, "global_step": 467745, "epoch": 2784} {"train_loss": -12.631179809570312, "global_step": 467746, "epoch": 2784} {"train_loss": -12.441956520080566, "global_step": 467747, "epoch": 2784} {"train_loss": -12.749320983886719, "global_step": 467748, "epoch": 2784} {"train_loss": -12.678499221801758, "global_step": 467749, "epoch": 2784} {"train_loss": -12.786733627319336, "global_step": 467750, "epoch": 2784} {"train_loss": -12.264853477478027, "global_step": 467751, "epoch": 2784} {"train_loss": -12.66955280303955, "global_step": 467752, "epoch": 2784} {"train_loss": -12.630839347839355, "global_step": 467753, "epoch": 2784} {"train_loss": -12.645259857177734, "global_step": 467754, "epoch": 2784} {"train_loss": -12.668986320495605, "global_step": 467755, "epoch": 2784} {"train_loss": -12.634912490844727, "global_step": 467756, "epoch": 2784} {"train_loss": -12.689204216003418, "global_step": 467757, "epoch": 2784} {"train_loss": -12.817630767822266, "global_step": 467758, "epoch": 2784} {"train_loss": -12.75900650024414, "global_step": 467759, "epoch": 2784} {"train_loss": -12.818647384643555, "global_step": 467760, "epoch": 2784} {"train_loss": -12.923412322998047, "global_step": 467761, "epoch": 2784} {"train_loss": -12.669718742370605, "global_step": 467762, "epoch": 2784} {"train_loss": -12.78647232055664, "global_step": 467763, "epoch": 2784} {"train_loss": -12.471246719360352, "global_step": 467764, "epoch": 2784} {"train_loss": -12.193821907043457, "global_step": 467765, "epoch": 2784} {"train_loss": -12.715479850769043, "global_step": 467766, "epoch": 2784} {"train_loss": -12.608022689819336, "global_step": 467767, "epoch": 2784} {"train_loss": -12.544395446777344, "global_step": 467768, "epoch": 2784} {"train_loss": -12.784608840942383, "global_step": 467769, "epoch": 2784} {"train_loss": -12.226608276367188, "global_step": 467770, "epoch": 2784} {"train_loss": -12.576610565185547, "global_step": 467771, "epoch": 2784} {"train_loss": -11.7952880859375, "global_step": 467772, "epoch": 2784} {"train_loss": -11.624680519104004, "global_step": 467773, "epoch": 2784} {"train_loss": -12.547880172729492, "global_step": 467774, "epoch": 2784} {"train_loss": -11.627470970153809, "global_step": 467775, "epoch": 2784} {"train_loss": -11.292327880859375, "global_step": 467776, "epoch": 2784} {"train_loss": -12.16537857055664, "global_step": 467777, "epoch": 2784} {"train_loss": -9.827600479125977, "global_step": 467778, "epoch": 2784} {"train_loss": -11.261658668518066, "global_step": 467779, "epoch": 2784} {"train_loss": -11.50046157836914, "global_step": 467780, "epoch": 2784} {"train_loss": -11.401171684265137, "global_step": 467781, "epoch": 2784} {"train_loss": -11.571109771728516, "global_step": 467782, "epoch": 2784} {"train_loss": -11.561561584472656, "global_step": 467783, "epoch": 2784} {"train_loss": -11.677263259887695, "global_step": 467784, "epoch": 2784} {"train_loss": -10.354409217834473, "global_step": 467785, "epoch": 2784} {"train_loss": -11.864316940307617, "global_step": 467786, "epoch": 2784} {"train_loss": -9.296754837036133, "global_step": 467787, "epoch": 2784} {"train_loss": -12.487553596496582, "global_step": 467788, "epoch": 2784} {"train_loss": -10.0587158203125, "global_step": 467789, "epoch": 2784} {"train_loss": -11.963813781738281, "global_step": 467790, "epoch": 2784} {"train_loss": -10.93213176727295, "global_step": 467791, "epoch": 2784} {"train_loss": -10.307502746582031, "global_step": 467792, "epoch": 2784} {"train_loss": -11.701204299926758, "global_step": 467793, "epoch": 2784} {"train_loss": -10.011314392089844, "global_step": 467794, "epoch": 2784} {"train_loss": -11.817054748535156, "global_step": 467795, "epoch": 2784} {"train_loss": -10.21252155303955, "global_step": 467796, "epoch": 2784} {"train_loss": -10.583401679992676, "global_step": 467797, "epoch": 2784} {"train_loss": -11.617816925048828, "global_step": 467798, "epoch": 2784} {"train_loss": -10.960733413696289, "global_step": 467799, "epoch": 2784} {"train_loss": -11.259284973144531, "global_step": 467800, "epoch": 2784} {"train_loss": -11.390857696533203, "global_step": 467801, "epoch": 2784} {"train_loss": -10.512587547302246, "global_step": 467802, "epoch": 2784} {"train_loss": -11.61063003540039, "global_step": 467803, "epoch": 2784} {"train_loss": -11.144318580627441, "global_step": 467804, "epoch": 2784} {"train_loss": -11.798362731933594, "global_step": 467805, "epoch": 2784} {"train_loss": -11.809436798095703, "global_step": 467806, "epoch": 2784} {"train_loss": -11.945685386657715, "global_step": 467807, "epoch": 2784} {"train_loss": -11.583274841308594, "global_step": 467808, "epoch": 2784} {"train_loss": -11.720715522766113, "global_step": 467809, "epoch": 2784} {"train_loss": -11.882452964782715, "global_step": 467810, "epoch": 2784} {"train_loss": -11.493509292602539, "global_step": 467811, "epoch": 2784} {"train_loss": -12.100555419921875, "global_step": 467812, "epoch": 2784} {"train_loss": -12.323556900024414, "global_step": 467813, "epoch": 2784} {"train_loss": -12.401318550109863, "global_step": 467814, "epoch": 2784} {"train_loss": -11.978386878967285, "global_step": 467815, "epoch": 2784} {"train_loss": -12.16048812866211, "global_step": 467816, "epoch": 2784} {"train_loss": -12.165992736816406, "global_step": 467817, "epoch": 2784} {"train_loss": -12.34239387512207, "global_step": 467818, "epoch": 2784} {"train_loss": -12.53506088256836, "global_step": 467819, "epoch": 2784} {"train_loss": -12.358663558959961, "global_step": 467820, "epoch": 2784} {"train_loss": -11.657833099365234, "global_step": 467821, "epoch": 2784} {"train_loss": -12.413665771484375, "global_step": 467822, "epoch": 2784} {"train_loss": -12.1754150390625, "global_step": 467823, "epoch": 2784} {"train_loss": -12.679770469665527, "global_step": 467824, "epoch": 2784} {"train_loss": -12.48544692993164, "global_step": 467825, "epoch": 2784} {"train_loss": -12.408333778381348, "global_step": 467826, "epoch": 2784} {"train_loss": -12.20146369934082, "global_step": 467827, "epoch": 2784} {"train_loss": -12.432001113891602, "global_step": 467828, "epoch": 2784} {"train_loss": -12.572339057922363, "global_step": 467829, "epoch": 2784} {"train_loss": -12.382586479187012, "global_step": 467830, "epoch": 2784} {"train_loss": -12.518960952758789, "global_step": 467831, "epoch": 2784} {"train_loss": -12.528255462646484, "global_step": 467832, "epoch": 2784} {"train_loss": -12.671728134155273, "global_step": 467833, "epoch": 2784} {"train_loss": -12.397550582885742, "global_step": 467834, "epoch": 2784} {"train_loss": -12.638460159301758, "global_step": 467835, "epoch": 2784} {"train_loss": -12.387447357177734, "global_step": 467836, "epoch": 2784} {"train_loss": -12.452926635742188, "global_step": 467837, "epoch": 2784} {"train_loss": -12.723320007324219, "global_step": 467838, "epoch": 2784} {"train_loss": -12.777594566345215, "global_step": 467839, "epoch": 2784} {"train_loss": -12.921016693115234, "global_step": 467840, "epoch": 2784} {"train_loss": -12.44115161895752, "global_step": 467841, "epoch": 2784} {"train_loss": -12.814065933227539, "global_step": 467842, "epoch": 2784} {"train_loss": -12.777825355529785, "global_step": 467843, "epoch": 2784} {"train_loss": -12.607141494750977, "global_step": 467844, "epoch": 2784} {"train_loss": -12.800159454345703, "global_step": 467845, "epoch": 2784} {"train_loss": -12.68381118774414, "global_step": 467846, "epoch": 2784} {"train_loss": -12.747096061706543, "global_step": 467847, "epoch": 2784} {"train_loss": -12.717510223388672, "global_step": 467848, "epoch": 2784} {"train_loss": -12.704334259033203, "global_step": 467849, "epoch": 2784} {"train_loss": -12.746267318725586, "global_step": 467850, "epoch": 2784} {"train_loss": -12.85054874420166, "global_step": 467851, "epoch": 2784} {"train_loss": -12.681049346923828, "global_step": 467852, "epoch": 2784} {"train_loss": -12.8502836227417, "global_step": 467853, "epoch": 2784} {"train_loss": -12.81312084197998, "global_step": 467854, "epoch": 2784} {"train_loss": -12.922821044921875, "global_step": 467855, "epoch": 2784} {"train_loss": -12.716139793395996, "global_step": 467856, "epoch": 2784} {"train_loss": -12.917794227600098, "global_step": 467857, "epoch": 2784} {"train_loss": -12.779712677001953, "global_step": 467858, "epoch": 2784} {"train_loss": -12.699849128723145, "global_step": 467859, "epoch": 2784} {"train_loss": -12.698958396911621, "global_step": 467860, "epoch": 2784} {"train_loss": -12.811370849609375, "global_step": 467861, "epoch": 2784} {"train_loss": -12.988751411437988, "global_step": 467862, "epoch": 2784} {"train_loss": -12.702468872070312, "global_step": 467863, "epoch": 2784} {"train_loss": -12.47715950012207, "global_step": 467864, "epoch": 2784} {"train_loss": -12.762598037719727, "global_step": 467865, "epoch": 2784} {"train_loss": -12.99481201171875, "global_step": 467866, "epoch": 2784} {"train_loss": -12.926416397094727, "global_step": 467867, "epoch": 2784} {"train_loss": -12.682828903198242, "global_step": 467868, "epoch": 2784} {"train_loss": -12.75556755065918, "global_step": 467869, "epoch": 2784} {"train_loss": -12.626166343688965, "global_step": 467870, "epoch": 2784} {"train_loss": -12.705533027648926, "global_step": 467871, "epoch": 2784} {"train_loss": -12.909271240234375, "global_step": 467872, "epoch": 2784} {"train_loss": -12.662553787231445, "global_step": 467873, "epoch": 2784} {"train_loss": -12.949003219604492, "global_step": 467874, "epoch": 2784} {"train_loss": -12.73363208770752, "global_step": 467875, "epoch": 2784} {"train_loss": -12.600735664367676, "global_step": 467876, "epoch": 2784} {"train_loss": -12.624612808227539, "global_step": 467877, "epoch": 2784} {"train_loss": -12.569112777709961, "global_step": 467878, "epoch": 2784} {"train_loss": -12.16684739362626, "global_step": 467879, "epoch": 2784, "val_loss": 315569.5625} {"train_loss": -12.461673736572266, "global_step": 467880, "epoch": 2785} {"train_loss": -12.279520988464355, "global_step": 467881, "epoch": 2785} {"train_loss": -12.30141830444336, "global_step": 467882, "epoch": 2785} {"train_loss": -12.43524169921875, "global_step": 467883, "epoch": 2785} {"train_loss": -11.836156845092773, "global_step": 467884, "epoch": 2785} {"train_loss": -12.36518383026123, "global_step": 467885, "epoch": 2785} {"train_loss": -12.586552619934082, "global_step": 467886, "epoch": 2785} {"train_loss": -12.246099472045898, "global_step": 467887, "epoch": 2785} {"train_loss": -12.556502342224121, "global_step": 467888, "epoch": 2785} {"train_loss": -12.856077194213867, "global_step": 467889, "epoch": 2785} {"train_loss": -12.248504638671875, "global_step": 467890, "epoch": 2785} {"train_loss": -12.111886978149414, "global_step": 467891, "epoch": 2785} {"train_loss": -12.113046646118164, "global_step": 467892, "epoch": 2785} {"train_loss": -12.373900413513184, "global_step": 467893, "epoch": 2785} {"train_loss": -11.587080001831055, "global_step": 467894, "epoch": 2785} {"train_loss": -11.966432571411133, "global_step": 467895, "epoch": 2785} {"train_loss": -12.044675827026367, "global_step": 467896, "epoch": 2785} {"train_loss": -11.734416007995605, "global_step": 467897, "epoch": 2785} {"train_loss": -12.195646286010742, "global_step": 467898, "epoch": 2785} {"train_loss": -11.414000511169434, "global_step": 467899, "epoch": 2785} {"train_loss": -11.789097785949707, "global_step": 467900, "epoch": 2785} {"train_loss": -12.073332786560059, "global_step": 467901, "epoch": 2785} {"train_loss": -10.839325904846191, "global_step": 467902, "epoch": 2785} {"train_loss": -12.00397777557373, "global_step": 467903, "epoch": 2785} {"train_loss": -11.652793884277344, "global_step": 467904, "epoch": 2785} {"train_loss": -12.424077987670898, "global_step": 467905, "epoch": 2785} {"train_loss": -12.409812927246094, "global_step": 467906, "epoch": 2785} {"train_loss": -11.767173767089844, "global_step": 467907, "epoch": 2785} {"train_loss": -12.353483200073242, "global_step": 467908, "epoch": 2785} {"train_loss": -12.159683227539062, "global_step": 467909, "epoch": 2785} {"train_loss": -11.177729606628418, "global_step": 467910, "epoch": 2785} {"train_loss": -12.548627853393555, "global_step": 467911, "epoch": 2785} {"train_loss": -11.083761215209961, "global_step": 467912, "epoch": 2785} {"train_loss": -11.52663803100586, "global_step": 467913, "epoch": 2785} {"train_loss": -12.271743774414062, "global_step": 467914, "epoch": 2785} {"train_loss": -10.70429801940918, "global_step": 467915, "epoch": 2785} {"train_loss": -11.310529708862305, "global_step": 467916, "epoch": 2785} {"train_loss": -10.521591186523438, "global_step": 467917, "epoch": 2785} {"train_loss": -10.739530563354492, "global_step": 467918, "epoch": 2785} {"train_loss": -11.443075180053711, "global_step": 467919, "epoch": 2785} {"train_loss": -10.273003578186035, "global_step": 467920, "epoch": 2785} {"train_loss": -10.606267929077148, "global_step": 467921, "epoch": 2785} {"train_loss": -11.310990333557129, "global_step": 467922, "epoch": 2785} {"train_loss": -9.69659423828125, "global_step": 467923, "epoch": 2785} {"train_loss": -11.256357192993164, "global_step": 467924, "epoch": 2785} {"train_loss": -9.85871696472168, "global_step": 467925, "epoch": 2785} {"train_loss": -9.823661804199219, "global_step": 467926, "epoch": 2785} {"train_loss": -10.501423835754395, "global_step": 467927, "epoch": 2785} {"train_loss": -11.266351699829102, "global_step": 467928, "epoch": 2785} {"train_loss": -10.71247673034668, "global_step": 467929, "epoch": 2785} {"train_loss": -9.926774024963379, "global_step": 467930, "epoch": 2785} {"train_loss": -10.79597282409668, "global_step": 467931, "epoch": 2785} {"train_loss": -11.55707836151123, "global_step": 467932, "epoch": 2785} {"train_loss": -11.567449569702148, "global_step": 467933, "epoch": 2785} {"train_loss": -11.804924011230469, "global_step": 467934, "epoch": 2785} {"train_loss": -11.675806999206543, "global_step": 467935, "epoch": 2785} {"train_loss": -10.833674430847168, "global_step": 467936, "epoch": 2785} {"train_loss": -11.433509826660156, "global_step": 467937, "epoch": 2785} {"train_loss": -11.330074310302734, "global_step": 467938, "epoch": 2785} {"train_loss": -11.280056953430176, "global_step": 467939, "epoch": 2785} {"train_loss": -12.114320755004883, "global_step": 467940, "epoch": 2785} {"train_loss": -11.619878768920898, "global_step": 467941, "epoch": 2785} {"train_loss": -11.661517143249512, "global_step": 467942, "epoch": 2785} {"train_loss": -11.793262481689453, "global_step": 467943, "epoch": 2785} {"train_loss": -11.699820518493652, "global_step": 467944, "epoch": 2785} {"train_loss": -12.075738906860352, "global_step": 467945, "epoch": 2785} {"train_loss": -11.74612045288086, "global_step": 467946, "epoch": 2785} {"train_loss": -12.498929023742676, "global_step": 467947, "epoch": 2785} {"train_loss": -12.046783447265625, "global_step": 467948, "epoch": 2785} {"train_loss": -12.292855262756348, "global_step": 467949, "epoch": 2785} {"train_loss": -12.289117813110352, "global_step": 467950, "epoch": 2785} {"train_loss": -12.318815231323242, "global_step": 467951, "epoch": 2785} {"train_loss": -12.4420747756958, "global_step": 467952, "epoch": 2785} {"train_loss": -12.427543640136719, "global_step": 467953, "epoch": 2785} {"train_loss": -12.530174255371094, "global_step": 467954, "epoch": 2785} {"train_loss": -12.504912376403809, "global_step": 467955, "epoch": 2785} {"train_loss": -12.53302001953125, "global_step": 467956, "epoch": 2785} {"train_loss": -12.303495407104492, "global_step": 467957, "epoch": 2785} {"train_loss": -12.522527694702148, "global_step": 467958, "epoch": 2785} {"train_loss": -12.71664810180664, "global_step": 467959, "epoch": 2785} {"train_loss": -12.582914352416992, "global_step": 467960, "epoch": 2785} {"train_loss": -12.519548416137695, "global_step": 467961, "epoch": 2785} {"train_loss": -12.81734561920166, "global_step": 467962, "epoch": 2785} {"train_loss": -12.582728385925293, "global_step": 467963, "epoch": 2785} {"train_loss": -12.705041885375977, "global_step": 467964, "epoch": 2785} {"train_loss": -12.423040390014648, "global_step": 467965, "epoch": 2785} {"train_loss": -12.308334350585938, "global_step": 467966, "epoch": 2785} {"train_loss": -12.454193115234375, "global_step": 467967, "epoch": 2785} {"train_loss": -12.601404190063477, "global_step": 467968, "epoch": 2785} {"train_loss": -12.485695838928223, "global_step": 467969, "epoch": 2785} {"train_loss": -12.73481559753418, "global_step": 467970, "epoch": 2785} {"train_loss": -12.449284553527832, "global_step": 467971, "epoch": 2785} {"train_loss": -12.73033332824707, "global_step": 467972, "epoch": 2785} {"train_loss": -12.37453842163086, "global_step": 467973, "epoch": 2785} {"train_loss": -12.670037269592285, "global_step": 467974, "epoch": 2785} {"train_loss": -12.606849670410156, "global_step": 467975, "epoch": 2785} {"train_loss": -12.671064376831055, "global_step": 467976, "epoch": 2785} {"train_loss": -12.76068115234375, "global_step": 467977, "epoch": 2785} {"train_loss": -12.658727645874023, "global_step": 467978, "epoch": 2785} {"train_loss": -12.516597747802734, "global_step": 467979, "epoch": 2785} {"train_loss": -12.741729736328125, "global_step": 467980, "epoch": 2785} {"train_loss": -12.683938980102539, "global_step": 467981, "epoch": 2785} {"train_loss": -12.712966918945312, "global_step": 467982, "epoch": 2785} {"train_loss": -12.42884635925293, "global_step": 467983, "epoch": 2785} {"train_loss": -12.774421691894531, "global_step": 467984, "epoch": 2785} {"train_loss": -12.672122955322266, "global_step": 467985, "epoch": 2785} {"train_loss": -12.782602310180664, "global_step": 467986, "epoch": 2785} {"train_loss": -12.549636840820312, "global_step": 467987, "epoch": 2785} {"train_loss": -13.030097961425781, "global_step": 467988, "epoch": 2785} {"train_loss": -12.464437484741211, "global_step": 467989, "epoch": 2785} {"train_loss": -12.837635040283203, "global_step": 467990, "epoch": 2785} {"train_loss": -12.673242568969727, "global_step": 467991, "epoch": 2785} {"train_loss": -12.690975189208984, "global_step": 467992, "epoch": 2785} {"train_loss": -12.641193389892578, "global_step": 467993, "epoch": 2785} {"train_loss": -12.841985702514648, "global_step": 467994, "epoch": 2785} {"train_loss": -12.838031768798828, "global_step": 467995, "epoch": 2785} {"train_loss": -12.317002296447754, "global_step": 467996, "epoch": 2785} {"train_loss": -12.04944896697998, "global_step": 467997, "epoch": 2785} {"train_loss": -12.698480606079102, "global_step": 467998, "epoch": 2785} {"train_loss": -12.618520736694336, "global_step": 467999, "epoch": 2785} {"train_loss": -12.092458724975586, "global_step": 468000, "epoch": 2785} {"train_loss": -12.402179718017578, "global_step": 468001, "epoch": 2785} {"train_loss": -12.36842155456543, "global_step": 468002, "epoch": 2785} {"train_loss": -12.626049041748047, "global_step": 468003, "epoch": 2785} {"train_loss": -12.23830795288086, "global_step": 468004, "epoch": 2785} {"train_loss": -12.550369262695312, "global_step": 468005, "epoch": 2785} {"train_loss": -12.110584259033203, "global_step": 468006, "epoch": 2785} {"train_loss": -12.334614753723145, "global_step": 468007, "epoch": 2785} {"train_loss": -12.723020553588867, "global_step": 468008, "epoch": 2785} {"train_loss": -12.32180404663086, "global_step": 468009, "epoch": 2785} {"train_loss": -12.702974319458008, "global_step": 468010, "epoch": 2785} {"train_loss": -12.851238250732422, "global_step": 468011, "epoch": 2785} {"train_loss": -12.56619644165039, "global_step": 468012, "epoch": 2785} {"train_loss": -12.29952621459961, "global_step": 468013, "epoch": 2785} {"train_loss": -12.534812927246094, "global_step": 468014, "epoch": 2785} {"train_loss": -12.181459426879883, "global_step": 468015, "epoch": 2785} {"train_loss": -12.274801254272461, "global_step": 468016, "epoch": 2785} {"train_loss": -11.97541332244873, "global_step": 468017, "epoch": 2785} {"train_loss": -12.809556007385254, "global_step": 468018, "epoch": 2785} {"train_loss": -12.368432998657227, "global_step": 468019, "epoch": 2785} {"train_loss": -12.144195556640625, "global_step": 468020, "epoch": 2785} {"train_loss": -12.330791473388672, "global_step": 468021, "epoch": 2785} {"train_loss": -12.64141845703125, "global_step": 468022, "epoch": 2785} {"train_loss": -12.145835876464844, "global_step": 468023, "epoch": 2785} {"train_loss": -12.181619644165039, "global_step": 468024, "epoch": 2785} {"train_loss": -11.862876892089844, "global_step": 468025, "epoch": 2785} {"train_loss": -12.144058227539062, "global_step": 468026, "epoch": 2785} {"train_loss": -11.521341323852539, "global_step": 468027, "epoch": 2785} {"train_loss": -12.057071685791016, "global_step": 468028, "epoch": 2785} {"train_loss": -12.415705680847168, "global_step": 468029, "epoch": 2785} {"train_loss": -12.054680824279785, "global_step": 468030, "epoch": 2785} {"train_loss": -11.97142219543457, "global_step": 468031, "epoch": 2785} {"train_loss": -12.34259033203125, "global_step": 468032, "epoch": 2785} {"train_loss": -12.395047187805176, "global_step": 468033, "epoch": 2785} {"train_loss": -12.010517120361328, "global_step": 468034, "epoch": 2785} {"train_loss": -11.8693265914917, "global_step": 468035, "epoch": 2785} {"train_loss": -11.804034233093262, "global_step": 468036, "epoch": 2785} {"train_loss": -10.92623233795166, "global_step": 468037, "epoch": 2785} {"train_loss": -11.804727554321289, "global_step": 468038, "epoch": 2785} {"train_loss": -11.434765815734863, "global_step": 468039, "epoch": 2785} {"train_loss": -11.677774429321289, "global_step": 468040, "epoch": 2785} {"train_loss": -11.92418098449707, "global_step": 468041, "epoch": 2785} {"train_loss": -11.694816589355469, "global_step": 468042, "epoch": 2785} {"train_loss": -11.642565727233887, "global_step": 468043, "epoch": 2785} {"train_loss": -12.811410903930664, "global_step": 468044, "epoch": 2785} {"train_loss": -11.321070671081543, "global_step": 468045, "epoch": 2785} {"train_loss": -12.509134292602539, "global_step": 468046, "epoch": 2785} {"train_loss": -12.063246199062892, "global_step": 468047, "epoch": 2785, "val_loss": 313524.84375, "train_action_mse_error": 1.383443832397461} {"train_loss": -11.548940658569336, "global_step": 468048, "epoch": 2786} {"train_loss": -12.506771087646484, "global_step": 468049, "epoch": 2786} {"train_loss": -11.336792945861816, "global_step": 468050, "epoch": 2786} {"train_loss": -11.263978004455566, "global_step": 468051, "epoch": 2786} {"train_loss": -10.507495880126953, "global_step": 468052, "epoch": 2786} {"train_loss": -11.57858657836914, "global_step": 468053, "epoch": 2786} {"train_loss": -10.970523834228516, "global_step": 468054, "epoch": 2786} {"train_loss": -11.904960632324219, "global_step": 468055, "epoch": 2786} {"train_loss": -11.722220420837402, "global_step": 468056, "epoch": 2786} {"train_loss": -10.538649559020996, "global_step": 468057, "epoch": 2786} {"train_loss": -12.121207237243652, "global_step": 468058, "epoch": 2786} {"train_loss": -11.619470596313477, "global_step": 468059, "epoch": 2786} {"train_loss": -11.148348808288574, "global_step": 468060, "epoch": 2786} {"train_loss": -10.856001853942871, "global_step": 468061, "epoch": 2786} {"train_loss": -11.59711742401123, "global_step": 468062, "epoch": 2786} {"train_loss": -10.473737716674805, "global_step": 468063, "epoch": 2786} {"train_loss": -10.267891883850098, "global_step": 468064, "epoch": 2786} {"train_loss": -10.952054977416992, "global_step": 468065, "epoch": 2786} {"train_loss": -11.241089820861816, "global_step": 468066, "epoch": 2786} {"train_loss": -9.964067459106445, "global_step": 468067, "epoch": 2786} {"train_loss": -9.609050750732422, "global_step": 468068, "epoch": 2786} {"train_loss": -10.559833526611328, "global_step": 468069, "epoch": 2786} {"train_loss": -9.922285079956055, "global_step": 468070, "epoch": 2786} {"train_loss": -10.570170402526855, "global_step": 468071, "epoch": 2786} {"train_loss": -9.89687728881836, "global_step": 468072, "epoch": 2786} {"train_loss": -10.937995910644531, "global_step": 468073, "epoch": 2786} {"train_loss": -10.99148178100586, "global_step": 468074, "epoch": 2786} {"train_loss": -11.96990966796875, "global_step": 468075, "epoch": 2786} {"train_loss": -11.369682312011719, "global_step": 468076, "epoch": 2786} {"train_loss": -11.684795379638672, "global_step": 468077, "epoch": 2786} {"train_loss": -11.360837936401367, "global_step": 468078, "epoch": 2786} {"train_loss": -11.53349494934082, "global_step": 468079, "epoch": 2786} {"train_loss": -11.184906005859375, "global_step": 468080, "epoch": 2786} {"train_loss": -11.585107803344727, "global_step": 468081, "epoch": 2786} {"train_loss": -11.378825187683105, "global_step": 468082, "epoch": 2786} {"train_loss": -11.50417423248291, "global_step": 468083, "epoch": 2786} {"train_loss": -11.671228408813477, "global_step": 468084, "epoch": 2786} {"train_loss": -12.19265079498291, "global_step": 468085, "epoch": 2786} {"train_loss": -11.738480567932129, "global_step": 468086, "epoch": 2786} {"train_loss": -12.270795822143555, "global_step": 468087, "epoch": 2786} {"train_loss": -11.83841323852539, "global_step": 468088, "epoch": 2786} {"train_loss": -11.837166786193848, "global_step": 468089, "epoch": 2786} {"train_loss": -12.253181457519531, "global_step": 468090, "epoch": 2786} {"train_loss": -11.380241394042969, "global_step": 468091, "epoch": 2786} {"train_loss": -12.134733200073242, "global_step": 468092, "epoch": 2786} {"train_loss": -11.795331954956055, "global_step": 468093, "epoch": 2786} {"train_loss": -12.088945388793945, "global_step": 468094, "epoch": 2786} {"train_loss": -12.277341842651367, "global_step": 468095, "epoch": 2786} {"train_loss": -11.550274848937988, "global_step": 468096, "epoch": 2786} {"train_loss": -12.402276039123535, "global_step": 468097, "epoch": 2786} {"train_loss": -11.982416152954102, "global_step": 468098, "epoch": 2786} {"train_loss": -12.063202857971191, "global_step": 468099, "epoch": 2786} {"train_loss": -12.321807861328125, "global_step": 468100, "epoch": 2786} {"train_loss": -11.938426971435547, "global_step": 468101, "epoch": 2786} {"train_loss": -12.375703811645508, "global_step": 468102, "epoch": 2786} {"train_loss": -12.182378768920898, "global_step": 468103, "epoch": 2786} {"train_loss": -12.299736022949219, "global_step": 468104, "epoch": 2786} {"train_loss": -12.348556518554688, "global_step": 468105, "epoch": 2786} {"train_loss": -12.350131034851074, "global_step": 468106, "epoch": 2786} {"train_loss": -12.779962539672852, "global_step": 468107, "epoch": 2786} {"train_loss": -12.526151657104492, "global_step": 468108, "epoch": 2786} {"train_loss": -12.823169708251953, "global_step": 468109, "epoch": 2786} {"train_loss": -12.538755416870117, "global_step": 468110, "epoch": 2786} {"train_loss": -12.678343772888184, "global_step": 468111, "epoch": 2786} {"train_loss": -12.542889595031738, "global_step": 468112, "epoch": 2786} {"train_loss": -12.585887908935547, "global_step": 468113, "epoch": 2786} {"train_loss": -12.804098129272461, "global_step": 468114, "epoch": 2786} {"train_loss": -12.797231674194336, "global_step": 468115, "epoch": 2786} {"train_loss": -12.531129837036133, "global_step": 468116, "epoch": 2786} {"train_loss": -12.704568862915039, "global_step": 468117, "epoch": 2786} {"train_loss": -12.521200180053711, "global_step": 468118, "epoch": 2786} {"train_loss": -12.241921424865723, "global_step": 468119, "epoch": 2786} {"train_loss": -12.473960876464844, "global_step": 468120, "epoch": 2786} {"train_loss": -12.391786575317383, "global_step": 468121, "epoch": 2786} {"train_loss": -12.79172134399414, "global_step": 468122, "epoch": 2786} {"train_loss": -12.405281066894531, "global_step": 468123, "epoch": 2786} {"train_loss": -12.678436279296875, "global_step": 468124, "epoch": 2786} {"train_loss": -12.4971923828125, "global_step": 468125, "epoch": 2786} {"train_loss": -12.624866485595703, "global_step": 468126, "epoch": 2786} {"train_loss": -12.54146957397461, "global_step": 468127, "epoch": 2786} {"train_loss": -12.614466667175293, "global_step": 468128, "epoch": 2786} {"train_loss": -12.844533920288086, "global_step": 468129, "epoch": 2786} {"train_loss": -12.041948318481445, "global_step": 468130, "epoch": 2786} {"train_loss": -12.713163375854492, "global_step": 468131, "epoch": 2786} {"train_loss": -12.51453971862793, "global_step": 468132, "epoch": 2786} {"train_loss": -12.623255729675293, "global_step": 468133, "epoch": 2786} {"train_loss": -12.87054443359375, "global_step": 468134, "epoch": 2786} {"train_loss": -12.388648986816406, "global_step": 468135, "epoch": 2786} {"train_loss": -12.647875785827637, "global_step": 468136, "epoch": 2786} {"train_loss": -12.581512451171875, "global_step": 468137, "epoch": 2786} {"train_loss": -12.77702808380127, "global_step": 468138, "epoch": 2786} {"train_loss": -12.915630340576172, "global_step": 468139, "epoch": 2786} {"train_loss": -12.609886169433594, "global_step": 468140, "epoch": 2786} {"train_loss": -12.694879531860352, "global_step": 468141, "epoch": 2786} {"train_loss": -12.530455589294434, "global_step": 468142, "epoch": 2786} {"train_loss": -12.504404067993164, "global_step": 468143, "epoch": 2786} {"train_loss": -12.71912956237793, "global_step": 468144, "epoch": 2786} {"train_loss": -12.53194808959961, "global_step": 468145, "epoch": 2786} {"train_loss": -12.797637939453125, "global_step": 468146, "epoch": 2786} {"train_loss": -12.297205924987793, "global_step": 468147, "epoch": 2786} {"train_loss": -12.653726577758789, "global_step": 468148, "epoch": 2786} {"train_loss": -12.556327819824219, "global_step": 468149, "epoch": 2786} {"train_loss": -12.728533744812012, "global_step": 468150, "epoch": 2786} {"train_loss": -12.495620727539062, "global_step": 468151, "epoch": 2786} {"train_loss": -12.639678001403809, "global_step": 468152, "epoch": 2786} {"train_loss": -12.522388458251953, "global_step": 468153, "epoch": 2786} {"train_loss": -12.47993278503418, "global_step": 468154, "epoch": 2786} {"train_loss": -12.614664077758789, "global_step": 468155, "epoch": 2786} {"train_loss": -12.651676177978516, "global_step": 468156, "epoch": 2786} {"train_loss": -12.656376838684082, "global_step": 468157, "epoch": 2786} {"train_loss": -12.886590957641602, "global_step": 468158, "epoch": 2786} {"train_loss": -12.717063903808594, "global_step": 468159, "epoch": 2786} {"train_loss": -12.68867015838623, "global_step": 468160, "epoch": 2786} {"train_loss": -12.654461860656738, "global_step": 468161, "epoch": 2786} {"train_loss": -12.797858238220215, "global_step": 468162, "epoch": 2786} {"train_loss": -12.72833251953125, "global_step": 468163, "epoch": 2786} {"train_loss": -12.8517484664917, "global_step": 468164, "epoch": 2786} {"train_loss": -13.10753059387207, "global_step": 468165, "epoch": 2786} {"train_loss": -12.754390716552734, "global_step": 468166, "epoch": 2786} {"train_loss": -12.6798095703125, "global_step": 468167, "epoch": 2786} {"train_loss": -12.795524597167969, "global_step": 468168, "epoch": 2786} {"train_loss": -12.858161926269531, "global_step": 468169, "epoch": 2786} {"train_loss": -12.80894660949707, "global_step": 468170, "epoch": 2786} {"train_loss": -13.025239944458008, "global_step": 468171, "epoch": 2786} {"train_loss": -12.744699478149414, "global_step": 468172, "epoch": 2786} {"train_loss": -12.87069320678711, "global_step": 468173, "epoch": 2786} {"train_loss": -12.707676887512207, "global_step": 468174, "epoch": 2786} {"train_loss": -12.877969741821289, "global_step": 468175, "epoch": 2786} {"train_loss": -13.057908058166504, "global_step": 468176, "epoch": 2786} {"train_loss": -12.550752639770508, "global_step": 468177, "epoch": 2786} {"train_loss": -12.737353324890137, "global_step": 468178, "epoch": 2786} {"train_loss": -12.745113372802734, "global_step": 468179, "epoch": 2786} {"train_loss": -12.762956619262695, "global_step": 468180, "epoch": 2786} {"train_loss": -13.07676887512207, "global_step": 468181, "epoch": 2786} {"train_loss": -12.727453231811523, "global_step": 468182, "epoch": 2786} {"train_loss": -12.792479515075684, "global_step": 468183, "epoch": 2786} {"train_loss": -12.937417030334473, "global_step": 468184, "epoch": 2786} {"train_loss": -12.59432601928711, "global_step": 468185, "epoch": 2786} {"train_loss": -12.884481430053711, "global_step": 468186, "epoch": 2786} {"train_loss": -12.803049087524414, "global_step": 468187, "epoch": 2786} {"train_loss": -12.74436092376709, "global_step": 468188, "epoch": 2786} {"train_loss": -12.30194091796875, "global_step": 468189, "epoch": 2786} {"train_loss": -12.300932884216309, "global_step": 468190, "epoch": 2786} {"train_loss": -12.232580184936523, "global_step": 468191, "epoch": 2786} {"train_loss": -13.124269485473633, "global_step": 468192, "epoch": 2786} {"train_loss": -12.62940502166748, "global_step": 468193, "epoch": 2786} {"train_loss": -12.985641479492188, "global_step": 468194, "epoch": 2786} {"train_loss": -12.74464225769043, "global_step": 468195, "epoch": 2786} {"train_loss": -12.265634536743164, "global_step": 468196, "epoch": 2786} {"train_loss": -12.032394409179688, "global_step": 468197, "epoch": 2786} {"train_loss": -12.470178604125977, "global_step": 468198, "epoch": 2786} {"train_loss": -12.238053321838379, "global_step": 468199, "epoch": 2786} {"train_loss": -12.223684310913086, "global_step": 468200, "epoch": 2786} {"train_loss": -12.60558795928955, "global_step": 468201, "epoch": 2786} {"train_loss": -11.199970245361328, "global_step": 468202, "epoch": 2786} {"train_loss": -11.8121919631958, "global_step": 468203, "epoch": 2786} {"train_loss": -12.917827606201172, "global_step": 468204, "epoch": 2786} {"train_loss": -11.380438804626465, "global_step": 468205, "epoch": 2786} {"train_loss": -11.822518348693848, "global_step": 468206, "epoch": 2786} {"train_loss": -12.459671020507812, "global_step": 468207, "epoch": 2786} {"train_loss": -12.153587341308594, "global_step": 468208, "epoch": 2786} {"train_loss": -11.94573974609375, "global_step": 468209, "epoch": 2786} {"train_loss": -12.091026306152344, "global_step": 468210, "epoch": 2786} {"train_loss": -11.029151916503906, "global_step": 468211, "epoch": 2786} {"train_loss": -11.38680648803711, "global_step": 468212, "epoch": 2786} {"train_loss": -12.298299789428711, "global_step": 468213, "epoch": 2786} {"train_loss": -11.506202697753906, "global_step": 468214, "epoch": 2786} {"train_loss": -12.173485120137533, "global_step": 468215, "epoch": 2786, "val_loss": 315142.25} {"train_loss": -12.54450798034668, "global_step": 468216, "epoch": 2787} {"train_loss": -12.479658126831055, "global_step": 468217, "epoch": 2787} {"train_loss": -11.74705696105957, "global_step": 468218, "epoch": 2787} {"train_loss": -12.284645080566406, "global_step": 468219, "epoch": 2787} {"train_loss": -12.506113052368164, "global_step": 468220, "epoch": 2787} {"train_loss": -12.380682945251465, "global_step": 468221, "epoch": 2787} {"train_loss": -12.374563217163086, "global_step": 468222, "epoch": 2787} {"train_loss": -12.730045318603516, "global_step": 468223, "epoch": 2787} {"train_loss": -12.247358322143555, "global_step": 468224, "epoch": 2787} {"train_loss": -12.246271133422852, "global_step": 468225, "epoch": 2787} {"train_loss": -12.715418815612793, "global_step": 468226, "epoch": 2787} {"train_loss": -12.359015464782715, "global_step": 468227, "epoch": 2787} {"train_loss": -12.42607307434082, "global_step": 468228, "epoch": 2787} {"train_loss": -12.263599395751953, "global_step": 468229, "epoch": 2787} {"train_loss": -12.721343040466309, "global_step": 468230, "epoch": 2787} {"train_loss": -12.106138229370117, "global_step": 468231, "epoch": 2787} {"train_loss": -12.37604808807373, "global_step": 468232, "epoch": 2787} {"train_loss": -11.721148490905762, "global_step": 468233, "epoch": 2787} {"train_loss": -12.508801460266113, "global_step": 468234, "epoch": 2787} {"train_loss": -11.81277084350586, "global_step": 468235, "epoch": 2787} {"train_loss": -11.702166557312012, "global_step": 468236, "epoch": 2787} {"train_loss": -11.831365585327148, "global_step": 468237, "epoch": 2787} {"train_loss": -11.70309066772461, "global_step": 468238, "epoch": 2787} {"train_loss": -11.70981216430664, "global_step": 468239, "epoch": 2787} {"train_loss": -11.7353515625, "global_step": 468240, "epoch": 2787} {"train_loss": -12.05533218383789, "global_step": 468241, "epoch": 2787} {"train_loss": -12.104256629943848, "global_step": 468242, "epoch": 2787} {"train_loss": -12.189582824707031, "global_step": 468243, "epoch": 2787} {"train_loss": -12.41071605682373, "global_step": 468244, "epoch": 2787} {"train_loss": -12.312213897705078, "global_step": 468245, "epoch": 2787} {"train_loss": -12.331598281860352, "global_step": 468246, "epoch": 2787} {"train_loss": -12.409531593322754, "global_step": 468247, "epoch": 2787} {"train_loss": -12.459956169128418, "global_step": 468248, "epoch": 2787} {"train_loss": -12.552955627441406, "global_step": 468249, "epoch": 2787} {"train_loss": -12.526721954345703, "global_step": 468250, "epoch": 2787} {"train_loss": -12.417375564575195, "global_step": 468251, "epoch": 2787} {"train_loss": -12.434906005859375, "global_step": 468252, "epoch": 2787} {"train_loss": -12.392793655395508, "global_step": 468253, "epoch": 2787} {"train_loss": -12.3295259475708, "global_step": 468254, "epoch": 2787} {"train_loss": -12.32101821899414, "global_step": 468255, "epoch": 2787} {"train_loss": -12.311346054077148, "global_step": 468256, "epoch": 2787} {"train_loss": -12.58503532409668, "global_step": 468257, "epoch": 2787} {"train_loss": -12.493879318237305, "global_step": 468258, "epoch": 2787} {"train_loss": -12.568838119506836, "global_step": 468259, "epoch": 2787} {"train_loss": -12.707138061523438, "global_step": 468260, "epoch": 2787} {"train_loss": -12.8158540725708, "global_step": 468261, "epoch": 2787} {"train_loss": -12.272815704345703, "global_step": 468262, "epoch": 2787} {"train_loss": -12.690838813781738, "global_step": 468263, "epoch": 2787} {"train_loss": -12.59686279296875, "global_step": 468264, "epoch": 2787} {"train_loss": -12.008466720581055, "global_step": 468265, "epoch": 2787} {"train_loss": -12.416788101196289, "global_step": 468266, "epoch": 2787} {"train_loss": -12.472785949707031, "global_step": 468267, "epoch": 2787} {"train_loss": -11.323589324951172, "global_step": 468268, "epoch": 2787} {"train_loss": -12.204410552978516, "global_step": 468269, "epoch": 2787} {"train_loss": -12.27619743347168, "global_step": 468270, "epoch": 2787} {"train_loss": -12.183113098144531, "global_step": 468271, "epoch": 2787} {"train_loss": -11.632145881652832, "global_step": 468272, "epoch": 2787} {"train_loss": -12.181526184082031, "global_step": 468273, "epoch": 2787} {"train_loss": -10.470342636108398, "global_step": 468274, "epoch": 2787} {"train_loss": -12.777077674865723, "global_step": 468275, "epoch": 2787} {"train_loss": -10.97688102722168, "global_step": 468276, "epoch": 2787} {"train_loss": -11.404317855834961, "global_step": 468277, "epoch": 2787} {"train_loss": -12.417831420898438, "global_step": 468278, "epoch": 2787} {"train_loss": -10.915849685668945, "global_step": 468279, "epoch": 2787} {"train_loss": -11.333873748779297, "global_step": 468280, "epoch": 2787} {"train_loss": -11.238292694091797, "global_step": 468281, "epoch": 2787} {"train_loss": -10.683748245239258, "global_step": 468282, "epoch": 2787} {"train_loss": -10.327438354492188, "global_step": 468283, "epoch": 2787} {"train_loss": -11.52611255645752, "global_step": 468284, "epoch": 2787} {"train_loss": -10.23583984375, "global_step": 468285, "epoch": 2787} {"train_loss": -11.013630867004395, "global_step": 468286, "epoch": 2787} {"train_loss": -11.076753616333008, "global_step": 468287, "epoch": 2787} {"train_loss": -10.713937759399414, "global_step": 468288, "epoch": 2787} {"train_loss": -11.666128158569336, "global_step": 468289, "epoch": 2787} {"train_loss": -9.944945335388184, "global_step": 468290, "epoch": 2787} {"train_loss": -10.91295051574707, "global_step": 468291, "epoch": 2787} {"train_loss": -11.18588638305664, "global_step": 468292, "epoch": 2787} {"train_loss": -10.831510543823242, "global_step": 468293, "epoch": 2787} {"train_loss": -11.60396671295166, "global_step": 468294, "epoch": 2787} {"train_loss": -11.39162826538086, "global_step": 468295, "epoch": 2787} {"train_loss": -11.335014343261719, "global_step": 468296, "epoch": 2787} {"train_loss": -11.218856811523438, "global_step": 468297, "epoch": 2787} {"train_loss": -11.525984764099121, "global_step": 468298, "epoch": 2787} {"train_loss": -12.386531829833984, "global_step": 468299, "epoch": 2787} {"train_loss": -11.384354591369629, "global_step": 468300, "epoch": 2787} {"train_loss": -12.173723220825195, "global_step": 468301, "epoch": 2787} {"train_loss": -11.763525009155273, "global_step": 468302, "epoch": 2787} {"train_loss": -12.25568962097168, "global_step": 468303, "epoch": 2787} {"train_loss": -12.180244445800781, "global_step": 468304, "epoch": 2787} {"train_loss": -12.277446746826172, "global_step": 468305, "epoch": 2787} {"train_loss": -12.458813667297363, "global_step": 468306, "epoch": 2787} {"train_loss": -11.827652931213379, "global_step": 468307, "epoch": 2787} {"train_loss": -11.955364227294922, "global_step": 468308, "epoch": 2787} {"train_loss": -12.281598091125488, "global_step": 468309, "epoch": 2787} {"train_loss": -12.391712188720703, "global_step": 468310, "epoch": 2787} {"train_loss": -12.217720031738281, "global_step": 468311, "epoch": 2787} {"train_loss": -12.265578269958496, "global_step": 468312, "epoch": 2787} {"train_loss": -12.296571731567383, "global_step": 468313, "epoch": 2787} {"train_loss": -12.346452713012695, "global_step": 468314, "epoch": 2787} {"train_loss": -12.43985652923584, "global_step": 468315, "epoch": 2787} {"train_loss": -12.034660339355469, "global_step": 468316, "epoch": 2787} {"train_loss": -12.153593063354492, "global_step": 468317, "epoch": 2787} {"train_loss": -11.745534896850586, "global_step": 468318, "epoch": 2787} {"train_loss": -11.946444511413574, "global_step": 468319, "epoch": 2787} {"train_loss": -12.054200172424316, "global_step": 468320, "epoch": 2787} {"train_loss": -11.878216743469238, "global_step": 468321, "epoch": 2787} {"train_loss": -11.698721885681152, "global_step": 468322, "epoch": 2787} {"train_loss": -12.530491828918457, "global_step": 468323, "epoch": 2787} {"train_loss": -11.38078498840332, "global_step": 468324, "epoch": 2787} {"train_loss": -12.551979064941406, "global_step": 468325, "epoch": 2787} {"train_loss": -11.554088592529297, "global_step": 468326, "epoch": 2787} {"train_loss": -12.02424430847168, "global_step": 468327, "epoch": 2787} {"train_loss": -12.36362075805664, "global_step": 468328, "epoch": 2787} {"train_loss": -11.419979095458984, "global_step": 468329, "epoch": 2787} {"train_loss": -12.7310791015625, "global_step": 468330, "epoch": 2787} {"train_loss": -11.695232391357422, "global_step": 468331, "epoch": 2787} {"train_loss": -12.250020027160645, "global_step": 468332, "epoch": 2787} {"train_loss": -12.18237590789795, "global_step": 468333, "epoch": 2787} {"train_loss": -12.186820983886719, "global_step": 468334, "epoch": 2787} {"train_loss": -12.62501049041748, "global_step": 468335, "epoch": 2787} {"train_loss": -12.190322875976562, "global_step": 468336, "epoch": 2787} {"train_loss": -12.517546653747559, "global_step": 468337, "epoch": 2787} {"train_loss": -12.595819473266602, "global_step": 468338, "epoch": 2787} {"train_loss": -12.52922248840332, "global_step": 468339, "epoch": 2787} {"train_loss": -12.705306053161621, "global_step": 468340, "epoch": 2787} {"train_loss": -12.557554244995117, "global_step": 468341, "epoch": 2787} {"train_loss": -12.55433464050293, "global_step": 468342, "epoch": 2787} {"train_loss": -12.656545639038086, "global_step": 468343, "epoch": 2787} {"train_loss": -12.57058048248291, "global_step": 468344, "epoch": 2787} {"train_loss": -12.670093536376953, "global_step": 468345, "epoch": 2787} {"train_loss": -12.45654010772705, "global_step": 468346, "epoch": 2787} {"train_loss": -12.648427963256836, "global_step": 468347, "epoch": 2787} {"train_loss": -12.460336685180664, "global_step": 468348, "epoch": 2787} {"train_loss": -12.750572204589844, "global_step": 468349, "epoch": 2787} {"train_loss": -12.559213638305664, "global_step": 468350, "epoch": 2787} {"train_loss": -12.68136215209961, "global_step": 468351, "epoch": 2787} {"train_loss": -12.398040771484375, "global_step": 468352, "epoch": 2787} {"train_loss": -12.784666061401367, "global_step": 468353, "epoch": 2787} {"train_loss": -12.402008056640625, "global_step": 468354, "epoch": 2787} {"train_loss": -12.53767204284668, "global_step": 468355, "epoch": 2787} {"train_loss": -12.455036163330078, "global_step": 468356, "epoch": 2787} {"train_loss": -12.418100357055664, "global_step": 468357, "epoch": 2787} {"train_loss": -12.701751708984375, "global_step": 468358, "epoch": 2787} {"train_loss": -12.681129455566406, "global_step": 468359, "epoch": 2787} {"train_loss": -12.75671100616455, "global_step": 468360, "epoch": 2787} {"train_loss": -12.70394515991211, "global_step": 468361, "epoch": 2787} {"train_loss": -12.660797119140625, "global_step": 468362, "epoch": 2787} {"train_loss": -12.646337509155273, "global_step": 468363, "epoch": 2787} {"train_loss": -12.836437225341797, "global_step": 468364, "epoch": 2787} {"train_loss": -12.754823684692383, "global_step": 468365, "epoch": 2787} {"train_loss": -12.812176704406738, "global_step": 468366, "epoch": 2787} {"train_loss": -12.756114959716797, "global_step": 468367, "epoch": 2787} {"train_loss": -12.78807544708252, "global_step": 468368, "epoch": 2787} {"train_loss": -12.756362915039062, "global_step": 468369, "epoch": 2787} {"train_loss": -12.654650688171387, "global_step": 468370, "epoch": 2787} {"train_loss": -12.801959037780762, "global_step": 468371, "epoch": 2787} {"train_loss": -12.872725486755371, "global_step": 468372, "epoch": 2787} {"train_loss": -12.935742378234863, "global_step": 468373, "epoch": 2787} {"train_loss": -12.82771110534668, "global_step": 468374, "epoch": 2787} {"train_loss": -12.751482963562012, "global_step": 468375, "epoch": 2787} {"train_loss": -12.710760116577148, "global_step": 468376, "epoch": 2787} {"train_loss": -12.895014762878418, "global_step": 468377, "epoch": 2787} {"train_loss": -12.773504257202148, "global_step": 468378, "epoch": 2787} {"train_loss": -12.696165084838867, "global_step": 468379, "epoch": 2787} {"train_loss": -12.955584526062012, "global_step": 468380, "epoch": 2787} {"train_loss": -12.623406410217285, "global_step": 468381, "epoch": 2787} {"train_loss": -12.828590393066406, "global_step": 468382, "epoch": 2787} {"train_loss": -12.185039361317953, "global_step": 468383, "epoch": 2787, "val_loss": 314507.46875} {"train_loss": -12.631193161010742, "global_step": 468384, "epoch": 2788} {"train_loss": -12.476978302001953, "global_step": 468385, "epoch": 2788} {"train_loss": -12.73104190826416, "global_step": 468386, "epoch": 2788} {"train_loss": -12.429010391235352, "global_step": 468387, "epoch": 2788} {"train_loss": -12.762990951538086, "global_step": 468388, "epoch": 2788} {"train_loss": -12.544349670410156, "global_step": 468389, "epoch": 2788} {"train_loss": -12.879631996154785, "global_step": 468390, "epoch": 2788} {"train_loss": -12.262005805969238, "global_step": 468391, "epoch": 2788} {"train_loss": -12.400050163269043, "global_step": 468392, "epoch": 2788} {"train_loss": -12.75263500213623, "global_step": 468393, "epoch": 2788} {"train_loss": -12.059549331665039, "global_step": 468394, "epoch": 2788} {"train_loss": -12.389548301696777, "global_step": 468395, "epoch": 2788} {"train_loss": -12.39614486694336, "global_step": 468396, "epoch": 2788} {"train_loss": -12.449752807617188, "global_step": 468397, "epoch": 2788} {"train_loss": -12.582676887512207, "global_step": 468398, "epoch": 2788} {"train_loss": -12.809316635131836, "global_step": 468399, "epoch": 2788} {"train_loss": -12.485062599182129, "global_step": 468400, "epoch": 2788} {"train_loss": -12.181840896606445, "global_step": 468401, "epoch": 2788} {"train_loss": -12.126541137695312, "global_step": 468402, "epoch": 2788} {"train_loss": -12.739094734191895, "global_step": 468403, "epoch": 2788} {"train_loss": -12.20329475402832, "global_step": 468404, "epoch": 2788} {"train_loss": -12.731245040893555, "global_step": 468405, "epoch": 2788} {"train_loss": -12.429994583129883, "global_step": 468406, "epoch": 2788} {"train_loss": -12.590542793273926, "global_step": 468407, "epoch": 2788} {"train_loss": -12.260406494140625, "global_step": 468408, "epoch": 2788} {"train_loss": -13.004204750061035, "global_step": 468409, "epoch": 2788} {"train_loss": -12.34467601776123, "global_step": 468410, "epoch": 2788} {"train_loss": -12.610915184020996, "global_step": 468411, "epoch": 2788} {"train_loss": -11.755318641662598, "global_step": 468412, "epoch": 2788} {"train_loss": -11.930683135986328, "global_step": 468413, "epoch": 2788} {"train_loss": -12.153264999389648, "global_step": 468414, "epoch": 2788} {"train_loss": -12.059732437133789, "global_step": 468415, "epoch": 2788} {"train_loss": -11.165971755981445, "global_step": 468416, "epoch": 2788} {"train_loss": -12.491767883300781, "global_step": 468417, "epoch": 2788} {"train_loss": -10.948087692260742, "global_step": 468418, "epoch": 2788} {"train_loss": -12.012224197387695, "global_step": 468419, "epoch": 2788} {"train_loss": -11.937651634216309, "global_step": 468420, "epoch": 2788} {"train_loss": -10.711427688598633, "global_step": 468421, "epoch": 2788} {"train_loss": -12.216573715209961, "global_step": 468422, "epoch": 2788} {"train_loss": -10.665519714355469, "global_step": 468423, "epoch": 2788} {"train_loss": -10.78385066986084, "global_step": 468424, "epoch": 2788} {"train_loss": -9.919906616210938, "global_step": 468425, "epoch": 2788} {"train_loss": -10.895998001098633, "global_step": 468426, "epoch": 2788} {"train_loss": -11.41114330291748, "global_step": 468427, "epoch": 2788} {"train_loss": -10.560861587524414, "global_step": 468428, "epoch": 2788} {"train_loss": -12.094343185424805, "global_step": 468429, "epoch": 2788} {"train_loss": -10.93834400177002, "global_step": 468430, "epoch": 2788} {"train_loss": -12.229106903076172, "global_step": 468431, "epoch": 2788} {"train_loss": -10.247011184692383, "global_step": 468432, "epoch": 2788} {"train_loss": -11.508538246154785, "global_step": 468433, "epoch": 2788} {"train_loss": -11.622386932373047, "global_step": 468434, "epoch": 2788} {"train_loss": -10.860713005065918, "global_step": 468435, "epoch": 2788} {"train_loss": -11.471281051635742, "global_step": 468436, "epoch": 2788} {"train_loss": -11.301846504211426, "global_step": 468437, "epoch": 2788} {"train_loss": -11.473367691040039, "global_step": 468438, "epoch": 2788} {"train_loss": -10.378229141235352, "global_step": 468439, "epoch": 2788} {"train_loss": -11.030744552612305, "global_step": 468440, "epoch": 2788} {"train_loss": -9.423797607421875, "global_step": 468441, "epoch": 2788} {"train_loss": -9.537620544433594, "global_step": 468442, "epoch": 2788} {"train_loss": -9.495532989501953, "global_step": 468443, "epoch": 2788} {"train_loss": -10.449226379394531, "global_step": 468444, "epoch": 2788} {"train_loss": -10.247343063354492, "global_step": 468445, "epoch": 2788} {"train_loss": -11.724531173706055, "global_step": 468446, "epoch": 2788} {"train_loss": -10.293355941772461, "global_step": 468447, "epoch": 2788} {"train_loss": -11.746813774108887, "global_step": 468448, "epoch": 2788} {"train_loss": -10.516434669494629, "global_step": 468449, "epoch": 2788} {"train_loss": -10.689704895019531, "global_step": 468450, "epoch": 2788} {"train_loss": -11.647793769836426, "global_step": 468451, "epoch": 2788} {"train_loss": -10.696391105651855, "global_step": 468452, "epoch": 2788} {"train_loss": -11.47732925415039, "global_step": 468453, "epoch": 2788} {"train_loss": -11.831214904785156, "global_step": 468454, "epoch": 2788} {"train_loss": -10.990564346313477, "global_step": 468455, "epoch": 2788} {"train_loss": -10.971796989440918, "global_step": 468456, "epoch": 2788} {"train_loss": -11.78718090057373, "global_step": 468457, "epoch": 2788} {"train_loss": -10.948808670043945, "global_step": 468458, "epoch": 2788} {"train_loss": -11.36961555480957, "global_step": 468459, "epoch": 2788} {"train_loss": -10.914666175842285, "global_step": 468460, "epoch": 2788} {"train_loss": -11.890504837036133, "global_step": 468461, "epoch": 2788} {"train_loss": -11.032596588134766, "global_step": 468462, "epoch": 2788} {"train_loss": -11.625877380371094, "global_step": 468463, "epoch": 2788} {"train_loss": -11.731199264526367, "global_step": 468464, "epoch": 2788} {"train_loss": -11.650158882141113, "global_step": 468465, "epoch": 2788} {"train_loss": -11.914118766784668, "global_step": 468466, "epoch": 2788} {"train_loss": -11.59007453918457, "global_step": 468467, "epoch": 2788} {"train_loss": -12.31704330444336, "global_step": 468468, "epoch": 2788} {"train_loss": -12.180727005004883, "global_step": 468469, "epoch": 2788} {"train_loss": -12.019728660583496, "global_step": 468470, "epoch": 2788} {"train_loss": -12.25544548034668, "global_step": 468471, "epoch": 2788} {"train_loss": -11.878092765808105, "global_step": 468472, "epoch": 2788} {"train_loss": -12.202497482299805, "global_step": 468473, "epoch": 2788} {"train_loss": -12.242605209350586, "global_step": 468474, "epoch": 2788} {"train_loss": -12.327312469482422, "global_step": 468475, "epoch": 2788} {"train_loss": -12.56712532043457, "global_step": 468476, "epoch": 2788} {"train_loss": -12.10212516784668, "global_step": 468477, "epoch": 2788} {"train_loss": -12.287721633911133, "global_step": 468478, "epoch": 2788} {"train_loss": -12.570295333862305, "global_step": 468479, "epoch": 2788} {"train_loss": -12.191458702087402, "global_step": 468480, "epoch": 2788} {"train_loss": -12.370038986206055, "global_step": 468481, "epoch": 2788} {"train_loss": -12.49758529663086, "global_step": 468482, "epoch": 2788} {"train_loss": -11.956871032714844, "global_step": 468483, "epoch": 2788} {"train_loss": -12.214390754699707, "global_step": 468484, "epoch": 2788} {"train_loss": -12.444862365722656, "global_step": 468485, "epoch": 2788} {"train_loss": -12.358987808227539, "global_step": 468486, "epoch": 2788} {"train_loss": -12.376304626464844, "global_step": 468487, "epoch": 2788} {"train_loss": -12.417411804199219, "global_step": 468488, "epoch": 2788} {"train_loss": -12.531768798828125, "global_step": 468489, "epoch": 2788} {"train_loss": -12.76977252960205, "global_step": 468490, "epoch": 2788} {"train_loss": -12.549850463867188, "global_step": 468491, "epoch": 2788} {"train_loss": -12.757747650146484, "global_step": 468492, "epoch": 2788} {"train_loss": -12.450765609741211, "global_step": 468493, "epoch": 2788} {"train_loss": -12.466451644897461, "global_step": 468494, "epoch": 2788} {"train_loss": -12.510587692260742, "global_step": 468495, "epoch": 2788} {"train_loss": -12.65518569946289, "global_step": 468496, "epoch": 2788} {"train_loss": -12.355655670166016, "global_step": 468497, "epoch": 2788} {"train_loss": -12.612788200378418, "global_step": 468498, "epoch": 2788} {"train_loss": -12.564338684082031, "global_step": 468499, "epoch": 2788} {"train_loss": -12.717041015625, "global_step": 468500, "epoch": 2788} {"train_loss": -12.654559135437012, "global_step": 468501, "epoch": 2788} {"train_loss": -12.588451385498047, "global_step": 468502, "epoch": 2788} {"train_loss": -12.657878875732422, "global_step": 468503, "epoch": 2788} {"train_loss": -12.680171966552734, "global_step": 468504, "epoch": 2788} {"train_loss": -12.90063762664795, "global_step": 468505, "epoch": 2788} {"train_loss": -12.75796890258789, "global_step": 468506, "epoch": 2788} {"train_loss": -12.923635482788086, "global_step": 468507, "epoch": 2788} {"train_loss": -12.663542747497559, "global_step": 468508, "epoch": 2788} {"train_loss": -12.946508407592773, "global_step": 468509, "epoch": 2788} {"train_loss": -12.74490737915039, "global_step": 468510, "epoch": 2788} {"train_loss": -12.737258911132812, "global_step": 468511, "epoch": 2788} {"train_loss": -12.77195930480957, "global_step": 468512, "epoch": 2788} {"train_loss": -12.562246322631836, "global_step": 468513, "epoch": 2788} {"train_loss": -12.645893096923828, "global_step": 468514, "epoch": 2788} {"train_loss": -12.60157585144043, "global_step": 468515, "epoch": 2788} {"train_loss": -12.716645240783691, "global_step": 468516, "epoch": 2788} {"train_loss": -12.588313102722168, "global_step": 468517, "epoch": 2788} {"train_loss": -12.768847465515137, "global_step": 468518, "epoch": 2788} {"train_loss": -12.549439430236816, "global_step": 468519, "epoch": 2788} {"train_loss": -12.753578186035156, "global_step": 468520, "epoch": 2788} {"train_loss": -12.861239433288574, "global_step": 468521, "epoch": 2788} {"train_loss": -12.40705680847168, "global_step": 468522, "epoch": 2788} {"train_loss": -13.028217315673828, "global_step": 468523, "epoch": 2788} {"train_loss": -12.586737632751465, "global_step": 468524, "epoch": 2788} {"train_loss": -12.634830474853516, "global_step": 468525, "epoch": 2788} {"train_loss": -12.906184196472168, "global_step": 468526, "epoch": 2788} {"train_loss": -12.545433044433594, "global_step": 468527, "epoch": 2788} {"train_loss": -12.872864723205566, "global_step": 468528, "epoch": 2788} {"train_loss": -12.613117218017578, "global_step": 468529, "epoch": 2788} {"train_loss": -12.934492111206055, "global_step": 468530, "epoch": 2788} {"train_loss": -12.792583465576172, "global_step": 468531, "epoch": 2788} {"train_loss": -12.916326522827148, "global_step": 468532, "epoch": 2788} {"train_loss": -12.928701400756836, "global_step": 468533, "epoch": 2788} {"train_loss": -12.73128890991211, "global_step": 468534, "epoch": 2788} {"train_loss": -12.834779739379883, "global_step": 468535, "epoch": 2788} {"train_loss": -12.955740928649902, "global_step": 468536, "epoch": 2788} {"train_loss": -12.928322792053223, "global_step": 468537, "epoch": 2788} {"train_loss": -12.757152557373047, "global_step": 468538, "epoch": 2788} {"train_loss": -12.87620735168457, "global_step": 468539, "epoch": 2788} {"train_loss": -12.920161247253418, "global_step": 468540, "epoch": 2788} {"train_loss": -12.76662540435791, "global_step": 468541, "epoch": 2788} {"train_loss": -12.769569396972656, "global_step": 468542, "epoch": 2788} {"train_loss": -12.974405288696289, "global_step": 468543, "epoch": 2788} {"train_loss": -12.847869873046875, "global_step": 468544, "epoch": 2788} {"train_loss": -12.82894515991211, "global_step": 468545, "epoch": 2788} {"train_loss": -12.694272994995117, "global_step": 468546, "epoch": 2788} {"train_loss": -11.903362274169922, "global_step": 468547, "epoch": 2788} {"train_loss": -11.474231719970703, "global_step": 468548, "epoch": 2788} {"train_loss": -12.29914665222168, "global_step": 468549, "epoch": 2788} {"train_loss": -12.807109832763672, "global_step": 468550, "epoch": 2788} {"train_loss": -12.107306139809745, "global_step": 468551, "epoch": 2788, "val_loss": 315646.0625} {"train_loss": -12.676599502563477, "global_step": 468552, "epoch": 2789} {"train_loss": -12.52048110961914, "global_step": 468553, "epoch": 2789} {"train_loss": -12.722892761230469, "global_step": 468554, "epoch": 2789} {"train_loss": -12.688703536987305, "global_step": 468555, "epoch": 2789} {"train_loss": -12.581135749816895, "global_step": 468556, "epoch": 2789} {"train_loss": -12.311623573303223, "global_step": 468557, "epoch": 2789} {"train_loss": -12.59315013885498, "global_step": 468558, "epoch": 2789} {"train_loss": -12.541465759277344, "global_step": 468559, "epoch": 2789} {"train_loss": -12.69982624053955, "global_step": 468560, "epoch": 2789} {"train_loss": -12.652050018310547, "global_step": 468561, "epoch": 2789} {"train_loss": -12.551349639892578, "global_step": 468562, "epoch": 2789} {"train_loss": -12.79715633392334, "global_step": 468563, "epoch": 2789} {"train_loss": -12.20892333984375, "global_step": 468564, "epoch": 2789} {"train_loss": -12.281234741210938, "global_step": 468565, "epoch": 2789} {"train_loss": -12.801197052001953, "global_step": 468566, "epoch": 2789} {"train_loss": -11.764871597290039, "global_step": 468567, "epoch": 2789} {"train_loss": -12.610376358032227, "global_step": 468568, "epoch": 2789} {"train_loss": -11.95534896850586, "global_step": 468569, "epoch": 2789} {"train_loss": -11.630332946777344, "global_step": 468570, "epoch": 2789} {"train_loss": -10.79448127746582, "global_step": 468571, "epoch": 2789} {"train_loss": -11.807368278503418, "global_step": 468572, "epoch": 2789} {"train_loss": -10.560297012329102, "global_step": 468573, "epoch": 2789} {"train_loss": -10.835939407348633, "global_step": 468574, "epoch": 2789} {"train_loss": -10.754203796386719, "global_step": 468575, "epoch": 2789} {"train_loss": -9.974159240722656, "global_step": 468576, "epoch": 2789} {"train_loss": -10.315361976623535, "global_step": 468577, "epoch": 2789} {"train_loss": -9.137447357177734, "global_step": 468578, "epoch": 2789} {"train_loss": -10.769001007080078, "global_step": 468579, "epoch": 2789} {"train_loss": -10.855432510375977, "global_step": 468580, "epoch": 2789} {"train_loss": -8.312018394470215, "global_step": 468581, "epoch": 2789} {"train_loss": -11.753341674804688, "global_step": 468582, "epoch": 2789} {"train_loss": -10.989973068237305, "global_step": 468583, "epoch": 2789} {"train_loss": -9.198832511901855, "global_step": 468584, "epoch": 2789} {"train_loss": -10.508952140808105, "global_step": 468585, "epoch": 2789} {"train_loss": -10.97633171081543, "global_step": 468586, "epoch": 2789} {"train_loss": -10.745660781860352, "global_step": 468587, "epoch": 2789} {"train_loss": -10.213861465454102, "global_step": 468588, "epoch": 2789} {"train_loss": -11.488791465759277, "global_step": 468589, "epoch": 2789} {"train_loss": -9.95022201538086, "global_step": 468590, "epoch": 2789} {"train_loss": -11.317325592041016, "global_step": 468591, "epoch": 2789} {"train_loss": -10.2154541015625, "global_step": 468592, "epoch": 2789} {"train_loss": -9.767634391784668, "global_step": 468593, "epoch": 2789} {"train_loss": -11.620774269104004, "global_step": 468594, "epoch": 2789} {"train_loss": -11.286340713500977, "global_step": 468595, "epoch": 2789} {"train_loss": -11.90225601196289, "global_step": 468596, "epoch": 2789} {"train_loss": -10.979100227355957, "global_step": 468597, "epoch": 2789} {"train_loss": -11.836296081542969, "global_step": 468598, "epoch": 2789} {"train_loss": -11.574542999267578, "global_step": 468599, "epoch": 2789} {"train_loss": -11.825258255004883, "global_step": 468600, "epoch": 2789} {"train_loss": -11.091869354248047, "global_step": 468601, "epoch": 2789} {"train_loss": -12.088006973266602, "global_step": 468602, "epoch": 2789} {"train_loss": -11.736837387084961, "global_step": 468603, "epoch": 2789} {"train_loss": -11.778826713562012, "global_step": 468604, "epoch": 2789} {"train_loss": -11.941493034362793, "global_step": 468605, "epoch": 2789} {"train_loss": -11.96328353881836, "global_step": 468606, "epoch": 2789} {"train_loss": -11.864778518676758, "global_step": 468607, "epoch": 2789} {"train_loss": -11.744686126708984, "global_step": 468608, "epoch": 2789} {"train_loss": -11.882745742797852, "global_step": 468609, "epoch": 2789} {"train_loss": -11.854659080505371, "global_step": 468610, "epoch": 2789} {"train_loss": -11.754973411560059, "global_step": 468611, "epoch": 2789} {"train_loss": -12.047920227050781, "global_step": 468612, "epoch": 2789} {"train_loss": -11.77853012084961, "global_step": 468613, "epoch": 2789} {"train_loss": -12.283323287963867, "global_step": 468614, "epoch": 2789} {"train_loss": -11.628805160522461, "global_step": 468615, "epoch": 2789} {"train_loss": -11.755131721496582, "global_step": 468616, "epoch": 2789} {"train_loss": -11.854413032531738, "global_step": 468617, "epoch": 2789} {"train_loss": -11.249351501464844, "global_step": 468618, "epoch": 2789} {"train_loss": -12.491632461547852, "global_step": 468619, "epoch": 2789} {"train_loss": -11.817562103271484, "global_step": 468620, "epoch": 2789} {"train_loss": -12.168469429016113, "global_step": 468621, "epoch": 2789} {"train_loss": -12.307419776916504, "global_step": 468622, "epoch": 2789} {"train_loss": -11.9205322265625, "global_step": 468623, "epoch": 2789} {"train_loss": -12.381180763244629, "global_step": 468624, "epoch": 2789} {"train_loss": -11.842994689941406, "global_step": 468625, "epoch": 2789} {"train_loss": -12.471750259399414, "global_step": 468626, "epoch": 2789} {"train_loss": -11.961285591125488, "global_step": 468627, "epoch": 2789} {"train_loss": -12.2689208984375, "global_step": 468628, "epoch": 2789} {"train_loss": -11.734956741333008, "global_step": 468629, "epoch": 2789} {"train_loss": -11.783121109008789, "global_step": 468630, "epoch": 2789} {"train_loss": -12.319280624389648, "global_step": 468631, "epoch": 2789} {"train_loss": -11.585128784179688, "global_step": 468632, "epoch": 2789} {"train_loss": -12.024726867675781, "global_step": 468633, "epoch": 2789} {"train_loss": -12.437379837036133, "global_step": 468634, "epoch": 2789} {"train_loss": -12.525556564331055, "global_step": 468635, "epoch": 2789} {"train_loss": -12.394436836242676, "global_step": 468636, "epoch": 2789} {"train_loss": -12.334406852722168, "global_step": 468637, "epoch": 2789} {"train_loss": -12.4896240234375, "global_step": 468638, "epoch": 2789} {"train_loss": -12.458222389221191, "global_step": 468639, "epoch": 2789} {"train_loss": -12.603912353515625, "global_step": 468640, "epoch": 2789} {"train_loss": -12.426717758178711, "global_step": 468641, "epoch": 2789} {"train_loss": -12.65571403503418, "global_step": 468642, "epoch": 2789} {"train_loss": -12.399499893188477, "global_step": 468643, "epoch": 2789} {"train_loss": -12.422760009765625, "global_step": 468644, "epoch": 2789} {"train_loss": -12.739775657653809, "global_step": 468645, "epoch": 2789} {"train_loss": -12.393080711364746, "global_step": 468646, "epoch": 2789} {"train_loss": -12.422381401062012, "global_step": 468647, "epoch": 2789} {"train_loss": -12.712299346923828, "global_step": 468648, "epoch": 2789} {"train_loss": -12.653036117553711, "global_step": 468649, "epoch": 2789} {"train_loss": -12.681695938110352, "global_step": 468650, "epoch": 2789} {"train_loss": -12.742809295654297, "global_step": 468651, "epoch": 2789} {"train_loss": -12.778907775878906, "global_step": 468652, "epoch": 2789} {"train_loss": -12.678767204284668, "global_step": 468653, "epoch": 2789} {"train_loss": -12.599173545837402, "global_step": 468654, "epoch": 2789} {"train_loss": -12.958721160888672, "global_step": 468655, "epoch": 2789} {"train_loss": -12.453750610351562, "global_step": 468656, "epoch": 2789} {"train_loss": -12.747364044189453, "global_step": 468657, "epoch": 2789} {"train_loss": -12.66533374786377, "global_step": 468658, "epoch": 2789} {"train_loss": -12.882268905639648, "global_step": 468659, "epoch": 2789} {"train_loss": -12.895102500915527, "global_step": 468660, "epoch": 2789} {"train_loss": -12.738653182983398, "global_step": 468661, "epoch": 2789} {"train_loss": -12.741912841796875, "global_step": 468662, "epoch": 2789} {"train_loss": -13.012762069702148, "global_step": 468663, "epoch": 2789} {"train_loss": -12.854238510131836, "global_step": 468664, "epoch": 2789} {"train_loss": -12.920425415039062, "global_step": 468665, "epoch": 2789} {"train_loss": -12.914753913879395, "global_step": 468666, "epoch": 2789} {"train_loss": -12.76636028289795, "global_step": 468667, "epoch": 2789} {"train_loss": -12.896404266357422, "global_step": 468668, "epoch": 2789} {"train_loss": -12.802823066711426, "global_step": 468669, "epoch": 2789} {"train_loss": -12.79944133758545, "global_step": 468670, "epoch": 2789} {"train_loss": -12.805468559265137, "global_step": 468671, "epoch": 2789} {"train_loss": -13.000131607055664, "global_step": 468672, "epoch": 2789} {"train_loss": -12.836129188537598, "global_step": 468673, "epoch": 2789} {"train_loss": -13.036094665527344, "global_step": 468674, "epoch": 2789} {"train_loss": -12.68723201751709, "global_step": 468675, "epoch": 2789} {"train_loss": -12.921131134033203, "global_step": 468676, "epoch": 2789} {"train_loss": -12.96856689453125, "global_step": 468677, "epoch": 2789} {"train_loss": -12.803998947143555, "global_step": 468678, "epoch": 2789} {"train_loss": -12.835515975952148, "global_step": 468679, "epoch": 2789} {"train_loss": -13.055549621582031, "global_step": 468680, "epoch": 2789} {"train_loss": -12.827908515930176, "global_step": 468681, "epoch": 2789} {"train_loss": -12.928007125854492, "global_step": 468682, "epoch": 2789} {"train_loss": -13.070110321044922, "global_step": 468683, "epoch": 2789} {"train_loss": -12.89477825164795, "global_step": 468684, "epoch": 2789} {"train_loss": -12.86806583404541, "global_step": 468685, "epoch": 2789} {"train_loss": -13.04440975189209, "global_step": 468686, "epoch": 2789} {"train_loss": -13.087607383728027, "global_step": 468687, "epoch": 2789} {"train_loss": -12.977590560913086, "global_step": 468688, "epoch": 2789} {"train_loss": -12.846786499023438, "global_step": 468689, "epoch": 2789} {"train_loss": -12.818865776062012, "global_step": 468690, "epoch": 2789} {"train_loss": -12.999829292297363, "global_step": 468691, "epoch": 2789} {"train_loss": -12.89688491821289, "global_step": 468692, "epoch": 2789} {"train_loss": -12.927223205566406, "global_step": 468693, "epoch": 2789} {"train_loss": -12.851808547973633, "global_step": 468694, "epoch": 2789} {"train_loss": -12.961963653564453, "global_step": 468695, "epoch": 2789} {"train_loss": -12.974594116210938, "global_step": 468696, "epoch": 2789} {"train_loss": -12.970416069030762, "global_step": 468697, "epoch": 2789} {"train_loss": -12.81437873840332, "global_step": 468698, "epoch": 2789} {"train_loss": -12.70776653289795, "global_step": 468699, "epoch": 2789} {"train_loss": -12.972565650939941, "global_step": 468700, "epoch": 2789} {"train_loss": -12.999473571777344, "global_step": 468701, "epoch": 2789} {"train_loss": -13.022339820861816, "global_step": 468702, "epoch": 2789} {"train_loss": -12.893875122070312, "global_step": 468703, "epoch": 2789} {"train_loss": -12.234081268310547, "global_step": 468704, "epoch": 2789} {"train_loss": -10.498847961425781, "global_step": 468705, "epoch": 2789} {"train_loss": -11.14974594116211, "global_step": 468706, "epoch": 2789} {"train_loss": -8.84660530090332, "global_step": 468707, "epoch": 2789} {"train_loss": -11.453014373779297, "global_step": 468708, "epoch": 2789} {"train_loss": -9.623210906982422, "global_step": 468709, "epoch": 2789} {"train_loss": -10.89065933227539, "global_step": 468710, "epoch": 2789} {"train_loss": -10.934432029724121, "global_step": 468711, "epoch": 2789} {"train_loss": -11.029563903808594, "global_step": 468712, "epoch": 2789} {"train_loss": -10.700384140014648, "global_step": 468713, "epoch": 2789} {"train_loss": -11.906429290771484, "global_step": 468714, "epoch": 2789} {"train_loss": -9.886947631835938, "global_step": 468715, "epoch": 2789} {"train_loss": -9.284890174865723, "global_step": 468716, "epoch": 2789} {"train_loss": -11.356023788452148, "global_step": 468717, "epoch": 2789} {"train_loss": -11.051856994628906, "global_step": 468718, "epoch": 2789} {"train_loss": -12.019965046928043, "global_step": 468719, "epoch": 2789, "val_loss": 313916.03125} {"train_loss": -11.40699291229248, "global_step": 468720, "epoch": 2790} {"train_loss": -11.058210372924805, "global_step": 468721, "epoch": 2790} {"train_loss": -10.672794342041016, "global_step": 468722, "epoch": 2790} {"train_loss": -9.861955642700195, "global_step": 468723, "epoch": 2790} {"train_loss": -11.43904972076416, "global_step": 468724, "epoch": 2790} {"train_loss": -11.28526496887207, "global_step": 468725, "epoch": 2790} {"train_loss": -11.428372383117676, "global_step": 468726, "epoch": 2790} {"train_loss": -11.2427339553833, "global_step": 468727, "epoch": 2790} {"train_loss": -11.722312927246094, "global_step": 468728, "epoch": 2790} {"train_loss": -10.658193588256836, "global_step": 468729, "epoch": 2790} {"train_loss": -12.277880668640137, "global_step": 468730, "epoch": 2790} {"train_loss": -11.606767654418945, "global_step": 468731, "epoch": 2790} {"train_loss": -11.59051513671875, "global_step": 468732, "epoch": 2790} {"train_loss": -11.7669677734375, "global_step": 468733, "epoch": 2790} {"train_loss": -11.476598739624023, "global_step": 468734, "epoch": 2790} {"train_loss": -12.119257926940918, "global_step": 468735, "epoch": 2790} {"train_loss": -11.04092788696289, "global_step": 468736, "epoch": 2790} {"train_loss": -11.601152420043945, "global_step": 468737, "epoch": 2790} {"train_loss": -10.95637035369873, "global_step": 468738, "epoch": 2790} {"train_loss": -12.232068061828613, "global_step": 468739, "epoch": 2790} {"train_loss": -11.66537094116211, "global_step": 468740, "epoch": 2790} {"train_loss": -11.772167205810547, "global_step": 468741, "epoch": 2790} {"train_loss": -11.76461124420166, "global_step": 468742, "epoch": 2790} {"train_loss": -12.34537410736084, "global_step": 468743, "epoch": 2790} {"train_loss": -11.971685409545898, "global_step": 468744, "epoch": 2790} {"train_loss": -11.777097702026367, "global_step": 468745, "epoch": 2790} {"train_loss": -11.66016960144043, "global_step": 468746, "epoch": 2790} {"train_loss": -11.369752883911133, "global_step": 468747, "epoch": 2790} {"train_loss": -12.298134803771973, "global_step": 468748, "epoch": 2790} {"train_loss": -11.385854721069336, "global_step": 468749, "epoch": 2790} {"train_loss": -12.16444206237793, "global_step": 468750, "epoch": 2790} {"train_loss": -11.654336929321289, "global_step": 468751, "epoch": 2790} {"train_loss": -11.691665649414062, "global_step": 468752, "epoch": 2790} {"train_loss": -11.535998344421387, "global_step": 468753, "epoch": 2790} {"train_loss": -11.616619110107422, "global_step": 468754, "epoch": 2790} {"train_loss": -10.752713203430176, "global_step": 468755, "epoch": 2790} {"train_loss": -11.158092498779297, "global_step": 468756, "epoch": 2790} {"train_loss": -11.084962844848633, "global_step": 468757, "epoch": 2790} {"train_loss": -9.25493335723877, "global_step": 468758, "epoch": 2790} {"train_loss": -11.560871124267578, "global_step": 468759, "epoch": 2790} {"train_loss": -8.180339813232422, "global_step": 468760, "epoch": 2790} {"train_loss": -10.218862533569336, "global_step": 468761, "epoch": 2790} {"train_loss": -9.844453811645508, "global_step": 468762, "epoch": 2790} {"train_loss": -10.07077693939209, "global_step": 468763, "epoch": 2790} {"train_loss": -8.886927604675293, "global_step": 468764, "epoch": 2790} {"train_loss": -9.345317840576172, "global_step": 468765, "epoch": 2790} {"train_loss": -11.422863006591797, "global_step": 468766, "epoch": 2790} {"train_loss": -9.688343048095703, "global_step": 468767, "epoch": 2790} {"train_loss": -10.542476654052734, "global_step": 468768, "epoch": 2790} {"train_loss": -10.352090835571289, "global_step": 468769, "epoch": 2790} {"train_loss": -11.639601707458496, "global_step": 468770, "epoch": 2790} {"train_loss": -10.551054000854492, "global_step": 468771, "epoch": 2790} {"train_loss": -10.80760383605957, "global_step": 468772, "epoch": 2790} {"train_loss": -11.470659255981445, "global_step": 468773, "epoch": 2790} {"train_loss": -10.946203231811523, "global_step": 468774, "epoch": 2790} {"train_loss": -11.247369766235352, "global_step": 468775, "epoch": 2790} {"train_loss": -11.51815128326416, "global_step": 468776, "epoch": 2790} {"train_loss": -11.258410453796387, "global_step": 468777, "epoch": 2790} {"train_loss": -10.457322120666504, "global_step": 468778, "epoch": 2790} {"train_loss": -11.794473648071289, "global_step": 468779, "epoch": 2790} {"train_loss": -11.405485153198242, "global_step": 468780, "epoch": 2790} {"train_loss": -11.326231956481934, "global_step": 468781, "epoch": 2790} {"train_loss": -11.635028839111328, "global_step": 468782, "epoch": 2790} {"train_loss": -11.634279251098633, "global_step": 468783, "epoch": 2790} {"train_loss": -11.217582702636719, "global_step": 468784, "epoch": 2790} {"train_loss": -11.711066246032715, "global_step": 468785, "epoch": 2790} {"train_loss": -11.479557037353516, "global_step": 468786, "epoch": 2790} {"train_loss": -11.145378112792969, "global_step": 468787, "epoch": 2790} {"train_loss": -11.139564514160156, "global_step": 468788, "epoch": 2790} {"train_loss": -11.594023704528809, "global_step": 468789, "epoch": 2790} {"train_loss": -11.106803894042969, "global_step": 468790, "epoch": 2790} {"train_loss": -11.496906280517578, "global_step": 468791, "epoch": 2790} {"train_loss": -11.835954666137695, "global_step": 468792, "epoch": 2790} {"train_loss": -11.445150375366211, "global_step": 468793, "epoch": 2790} {"train_loss": -11.968778610229492, "global_step": 468794, "epoch": 2790} {"train_loss": -12.07551383972168, "global_step": 468795, "epoch": 2790} {"train_loss": -11.692689895629883, "global_step": 468796, "epoch": 2790} {"train_loss": -12.345199584960938, "global_step": 468797, "epoch": 2790} {"train_loss": -11.969184875488281, "global_step": 468798, "epoch": 2790} {"train_loss": -12.258116722106934, "global_step": 468799, "epoch": 2790} {"train_loss": -11.918554306030273, "global_step": 468800, "epoch": 2790} {"train_loss": -12.120800018310547, "global_step": 468801, "epoch": 2790} {"train_loss": -12.190204620361328, "global_step": 468802, "epoch": 2790} {"train_loss": -11.927193641662598, "global_step": 468803, "epoch": 2790} {"train_loss": -12.364378929138184, "global_step": 468804, "epoch": 2790} {"train_loss": -12.327410697937012, "global_step": 468805, "epoch": 2790} {"train_loss": -12.344610214233398, "global_step": 468806, "epoch": 2790} {"train_loss": -12.309026718139648, "global_step": 468807, "epoch": 2790} {"train_loss": -12.475204467773438, "global_step": 468808, "epoch": 2790} {"train_loss": -12.447015762329102, "global_step": 468809, "epoch": 2790} {"train_loss": -12.445952415466309, "global_step": 468810, "epoch": 2790} {"train_loss": -12.440285682678223, "global_step": 468811, "epoch": 2790} {"train_loss": -12.444491386413574, "global_step": 468812, "epoch": 2790} {"train_loss": -12.521409034729004, "global_step": 468813, "epoch": 2790} {"train_loss": -12.385054588317871, "global_step": 468814, "epoch": 2790} {"train_loss": -12.430042266845703, "global_step": 468815, "epoch": 2790} {"train_loss": -12.38797378540039, "global_step": 468816, "epoch": 2790} {"train_loss": -12.57805347442627, "global_step": 468817, "epoch": 2790} {"train_loss": -12.42109489440918, "global_step": 468818, "epoch": 2790} {"train_loss": -12.22110366821289, "global_step": 468819, "epoch": 2790} {"train_loss": -12.744773864746094, "global_step": 468820, "epoch": 2790} {"train_loss": -12.58738899230957, "global_step": 468821, "epoch": 2790} {"train_loss": -12.314851760864258, "global_step": 468822, "epoch": 2790} {"train_loss": -12.594697952270508, "global_step": 468823, "epoch": 2790} {"train_loss": -12.679594039916992, "global_step": 468824, "epoch": 2790} {"train_loss": -12.737741470336914, "global_step": 468825, "epoch": 2790} {"train_loss": -12.755636215209961, "global_step": 468826, "epoch": 2790} {"train_loss": -12.502811431884766, "global_step": 468827, "epoch": 2790} {"train_loss": -12.738414764404297, "global_step": 468828, "epoch": 2790} {"train_loss": -12.498023986816406, "global_step": 468829, "epoch": 2790} {"train_loss": -12.787276268005371, "global_step": 468830, "epoch": 2790} {"train_loss": -12.799104690551758, "global_step": 468831, "epoch": 2790} {"train_loss": -12.749225616455078, "global_step": 468832, "epoch": 2790} {"train_loss": -12.830987930297852, "global_step": 468833, "epoch": 2790} {"train_loss": -12.846443176269531, "global_step": 468834, "epoch": 2790} {"train_loss": -12.741498947143555, "global_step": 468835, "epoch": 2790} {"train_loss": -12.587291717529297, "global_step": 468836, "epoch": 2790} {"train_loss": -12.850894927978516, "global_step": 468837, "epoch": 2790} {"train_loss": -12.535587310791016, "global_step": 468838, "epoch": 2790} {"train_loss": -12.608381271362305, "global_step": 468839, "epoch": 2790} {"train_loss": -12.791290283203125, "global_step": 468840, "epoch": 2790} {"train_loss": -12.900087356567383, "global_step": 468841, "epoch": 2790} {"train_loss": -12.851675987243652, "global_step": 468842, "epoch": 2790} {"train_loss": -12.750791549682617, "global_step": 468843, "epoch": 2790} {"train_loss": -12.593341827392578, "global_step": 468844, "epoch": 2790} {"train_loss": -12.78889274597168, "global_step": 468845, "epoch": 2790} {"train_loss": -12.614611625671387, "global_step": 468846, "epoch": 2790} {"train_loss": -12.768009185791016, "global_step": 468847, "epoch": 2790} {"train_loss": -12.597585678100586, "global_step": 468848, "epoch": 2790} {"train_loss": -12.760026931762695, "global_step": 468849, "epoch": 2790} {"train_loss": -12.688650131225586, "global_step": 468850, "epoch": 2790} {"train_loss": -12.582479476928711, "global_step": 468851, "epoch": 2790} {"train_loss": -12.760997772216797, "global_step": 468852, "epoch": 2790} {"train_loss": -12.713619232177734, "global_step": 468853, "epoch": 2790} {"train_loss": -12.561220169067383, "global_step": 468854, "epoch": 2790} {"train_loss": -12.803606033325195, "global_step": 468855, "epoch": 2790} {"train_loss": -12.798446655273438, "global_step": 468856, "epoch": 2790} {"train_loss": -12.678030014038086, "global_step": 468857, "epoch": 2790} {"train_loss": -12.691885948181152, "global_step": 468858, "epoch": 2790} {"train_loss": -12.823539733886719, "global_step": 468859, "epoch": 2790} {"train_loss": -12.660787582397461, "global_step": 468860, "epoch": 2790} {"train_loss": -12.646413803100586, "global_step": 468861, "epoch": 2790} {"train_loss": -12.660839080810547, "global_step": 468862, "epoch": 2790} {"train_loss": -12.155848503112793, "global_step": 468863, "epoch": 2790} {"train_loss": -12.643451690673828, "global_step": 468864, "epoch": 2790} {"train_loss": -12.430334091186523, "global_step": 468865, "epoch": 2790} {"train_loss": -12.712074279785156, "global_step": 468866, "epoch": 2790} {"train_loss": -12.658294677734375, "global_step": 468867, "epoch": 2790} {"train_loss": -12.46479320526123, "global_step": 468868, "epoch": 2790} {"train_loss": -12.759791374206543, "global_step": 468869, "epoch": 2790} {"train_loss": -12.432494163513184, "global_step": 468870, "epoch": 2790} {"train_loss": -12.703886032104492, "global_step": 468871, "epoch": 2790} {"train_loss": -12.560672760009766, "global_step": 468872, "epoch": 2790} {"train_loss": -12.34499740600586, "global_step": 468873, "epoch": 2790} {"train_loss": -12.673006057739258, "global_step": 468874, "epoch": 2790} {"train_loss": -12.071428298950195, "global_step": 468875, "epoch": 2790} {"train_loss": -12.383353233337402, "global_step": 468876, "epoch": 2790} {"train_loss": -12.387496948242188, "global_step": 468877, "epoch": 2790} {"train_loss": -12.103517532348633, "global_step": 468878, "epoch": 2790} {"train_loss": -12.716968536376953, "global_step": 468879, "epoch": 2790} {"train_loss": -12.159324645996094, "global_step": 468880, "epoch": 2790} {"train_loss": -12.457507133483887, "global_step": 468881, "epoch": 2790} {"train_loss": -12.501504898071289, "global_step": 468882, "epoch": 2790} {"train_loss": -11.998031616210938, "global_step": 468883, "epoch": 2790} {"train_loss": -11.590127944946289, "global_step": 468884, "epoch": 2790} {"train_loss": -12.375909805297852, "global_step": 468885, "epoch": 2790} {"train_loss": -11.846649169921875, "global_step": 468886, "epoch": 2790} {"train_loss": -11.918015145120167, "global_step": 468887, "epoch": 2790, "val_loss": 315221.40625, "train_action_mse_error": 1.6380069255828857} {"train_loss": -12.499500274658203, "global_step": 468888, "epoch": 2791} {"train_loss": -11.806796073913574, "global_step": 468889, "epoch": 2791} {"train_loss": -12.252775192260742, "global_step": 468890, "epoch": 2791} {"train_loss": -12.030837059020996, "global_step": 468891, "epoch": 2791} {"train_loss": -11.12809944152832, "global_step": 468892, "epoch": 2791} {"train_loss": -11.900247573852539, "global_step": 468893, "epoch": 2791} {"train_loss": -12.166692733764648, "global_step": 468894, "epoch": 2791} {"train_loss": -11.714885711669922, "global_step": 468895, "epoch": 2791} {"train_loss": -12.317537307739258, "global_step": 468896, "epoch": 2791} {"train_loss": -11.378988265991211, "global_step": 468897, "epoch": 2791} {"train_loss": -11.595804214477539, "global_step": 468898, "epoch": 2791} {"train_loss": -10.589564323425293, "global_step": 468899, "epoch": 2791} {"train_loss": -10.32349967956543, "global_step": 468900, "epoch": 2791} {"train_loss": -10.540781021118164, "global_step": 468901, "epoch": 2791} {"train_loss": -10.44206428527832, "global_step": 468902, "epoch": 2791} {"train_loss": -9.068964004516602, "global_step": 468903, "epoch": 2791} {"train_loss": -9.29964828491211, "global_step": 468904, "epoch": 2791} {"train_loss": -10.018077850341797, "global_step": 468905, "epoch": 2791} {"train_loss": -10.058658599853516, "global_step": 468906, "epoch": 2791} {"train_loss": -9.380099296569824, "global_step": 468907, "epoch": 2791} {"train_loss": -8.737363815307617, "global_step": 468908, "epoch": 2791} {"train_loss": -8.596526145935059, "global_step": 468909, "epoch": 2791} {"train_loss": -10.283961296081543, "global_step": 468910, "epoch": 2791} {"train_loss": -10.059383392333984, "global_step": 468911, "epoch": 2791} {"train_loss": -10.35757827758789, "global_step": 468912, "epoch": 2791} {"train_loss": -10.428983688354492, "global_step": 468913, "epoch": 2791} {"train_loss": -10.589115142822266, "global_step": 468914, "epoch": 2791} {"train_loss": -11.707234382629395, "global_step": 468915, "epoch": 2791} {"train_loss": -11.125542640686035, "global_step": 468916, "epoch": 2791} {"train_loss": -11.501744270324707, "global_step": 468917, "epoch": 2791} {"train_loss": -11.558399200439453, "global_step": 468918, "epoch": 2791} {"train_loss": -11.309257507324219, "global_step": 468919, "epoch": 2791} {"train_loss": -11.113975524902344, "global_step": 468920, "epoch": 2791} {"train_loss": -11.194870948791504, "global_step": 468921, "epoch": 2791} {"train_loss": -11.299046516418457, "global_step": 468922, "epoch": 2791} {"train_loss": -11.165393829345703, "global_step": 468923, "epoch": 2791} {"train_loss": -11.225862503051758, "global_step": 468924, "epoch": 2791} {"train_loss": -11.157642364501953, "global_step": 468925, "epoch": 2791} {"train_loss": -11.443130493164062, "global_step": 468926, "epoch": 2791} {"train_loss": -11.856559753417969, "global_step": 468927, "epoch": 2791} {"train_loss": -11.508770942687988, "global_step": 468928, "epoch": 2791} {"train_loss": -11.795008659362793, "global_step": 468929, "epoch": 2791} {"train_loss": -11.900473594665527, "global_step": 468930, "epoch": 2791} {"train_loss": -11.81662368774414, "global_step": 468931, "epoch": 2791} {"train_loss": -11.555316925048828, "global_step": 468932, "epoch": 2791} {"train_loss": -11.411487579345703, "global_step": 468933, "epoch": 2791} {"train_loss": -11.663152694702148, "global_step": 468934, "epoch": 2791} {"train_loss": -11.889286994934082, "global_step": 468935, "epoch": 2791} {"train_loss": -11.801263809204102, "global_step": 468936, "epoch": 2791} {"train_loss": -11.981590270996094, "global_step": 468937, "epoch": 2791} {"train_loss": -12.074702262878418, "global_step": 468938, "epoch": 2791} {"train_loss": -11.993255615234375, "global_step": 468939, "epoch": 2791} {"train_loss": -12.019563674926758, "global_step": 468940, "epoch": 2791} {"train_loss": -12.040398597717285, "global_step": 468941, "epoch": 2791} {"train_loss": -12.093206405639648, "global_step": 468942, "epoch": 2791} {"train_loss": -12.132366180419922, "global_step": 468943, "epoch": 2791} {"train_loss": -12.077116012573242, "global_step": 468944, "epoch": 2791} {"train_loss": -12.051888465881348, "global_step": 468945, "epoch": 2791} {"train_loss": -12.332941055297852, "global_step": 468946, "epoch": 2791} {"train_loss": -12.1836519241333, "global_step": 468947, "epoch": 2791} {"train_loss": -12.350851058959961, "global_step": 468948, "epoch": 2791} {"train_loss": -12.483163833618164, "global_step": 468949, "epoch": 2791} {"train_loss": -12.280121803283691, "global_step": 468950, "epoch": 2791} {"train_loss": -12.552675247192383, "global_step": 468951, "epoch": 2791} {"train_loss": -12.44976806640625, "global_step": 468952, "epoch": 2791} {"train_loss": -12.264392852783203, "global_step": 468953, "epoch": 2791} {"train_loss": -12.541808128356934, "global_step": 468954, "epoch": 2791} {"train_loss": -12.294646263122559, "global_step": 468955, "epoch": 2791} {"train_loss": -12.419163703918457, "global_step": 468956, "epoch": 2791} {"train_loss": -12.481132507324219, "global_step": 468957, "epoch": 2791} {"train_loss": -12.31577205657959, "global_step": 468958, "epoch": 2791} {"train_loss": -12.413803100585938, "global_step": 468959, "epoch": 2791} {"train_loss": -12.116172790527344, "global_step": 468960, "epoch": 2791} {"train_loss": -12.515008926391602, "global_step": 468961, "epoch": 2791} {"train_loss": -12.035664558410645, "global_step": 468962, "epoch": 2791} {"train_loss": -12.505807876586914, "global_step": 468963, "epoch": 2791} {"train_loss": -12.60334587097168, "global_step": 468964, "epoch": 2791} {"train_loss": -12.428109169006348, "global_step": 468965, "epoch": 2791} {"train_loss": -12.48465347290039, "global_step": 468966, "epoch": 2791} {"train_loss": -12.637285232543945, "global_step": 468967, "epoch": 2791} {"train_loss": -12.256082534790039, "global_step": 468968, "epoch": 2791} {"train_loss": -12.475189208984375, "global_step": 468969, "epoch": 2791} {"train_loss": -12.291078567504883, "global_step": 468970, "epoch": 2791} {"train_loss": -12.594855308532715, "global_step": 468971, "epoch": 2791} {"train_loss": -12.435911178588867, "global_step": 468972, "epoch": 2791} {"train_loss": -12.095001220703125, "global_step": 468973, "epoch": 2791} {"train_loss": -12.610248565673828, "global_step": 468974, "epoch": 2791} {"train_loss": -12.52352523803711, "global_step": 468975, "epoch": 2791} {"train_loss": -12.866382598876953, "global_step": 468976, "epoch": 2791} {"train_loss": -12.528844833374023, "global_step": 468977, "epoch": 2791} {"train_loss": -12.646265029907227, "global_step": 468978, "epoch": 2791} {"train_loss": -12.646357536315918, "global_step": 468979, "epoch": 2791} {"train_loss": -12.713769912719727, "global_step": 468980, "epoch": 2791} {"train_loss": -12.63874340057373, "global_step": 468981, "epoch": 2791} {"train_loss": -12.739204406738281, "global_step": 468982, "epoch": 2791} {"train_loss": -12.93303108215332, "global_step": 468983, "epoch": 2791} {"train_loss": -12.678431510925293, "global_step": 468984, "epoch": 2791} {"train_loss": -12.68819522857666, "global_step": 468985, "epoch": 2791} {"train_loss": -12.941160202026367, "global_step": 468986, "epoch": 2791} {"train_loss": -12.774534225463867, "global_step": 468987, "epoch": 2791} {"train_loss": -12.867609024047852, "global_step": 468988, "epoch": 2791} {"train_loss": -12.673223495483398, "global_step": 468989, "epoch": 2791} {"train_loss": -12.798798561096191, "global_step": 468990, "epoch": 2791} {"train_loss": -12.75698471069336, "global_step": 468991, "epoch": 2791} {"train_loss": -12.7965087890625, "global_step": 468992, "epoch": 2791} {"train_loss": -12.938535690307617, "global_step": 468993, "epoch": 2791} {"train_loss": -12.627557754516602, "global_step": 468994, "epoch": 2791} {"train_loss": -12.935501098632812, "global_step": 468995, "epoch": 2791} {"train_loss": -12.8199462890625, "global_step": 468996, "epoch": 2791} {"train_loss": -12.759729385375977, "global_step": 468997, "epoch": 2791} {"train_loss": -12.882193565368652, "global_step": 468998, "epoch": 2791} {"train_loss": -12.909366607666016, "global_step": 468999, "epoch": 2791} {"train_loss": -12.885308265686035, "global_step": 469000, "epoch": 2791} {"train_loss": -12.763982772827148, "global_step": 469001, "epoch": 2791} {"train_loss": -12.728281021118164, "global_step": 469002, "epoch": 2791} {"train_loss": -12.469901084899902, "global_step": 469003, "epoch": 2791} {"train_loss": -12.856668472290039, "global_step": 469004, "epoch": 2791} {"train_loss": -12.650952339172363, "global_step": 469005, "epoch": 2791} {"train_loss": -12.89932918548584, "global_step": 469006, "epoch": 2791} {"train_loss": -12.840149879455566, "global_step": 469007, "epoch": 2791} {"train_loss": -12.834160804748535, "global_step": 469008, "epoch": 2791} {"train_loss": -12.663759231567383, "global_step": 469009, "epoch": 2791} {"train_loss": -12.685152053833008, "global_step": 469010, "epoch": 2791} {"train_loss": -12.454206466674805, "global_step": 469011, "epoch": 2791} {"train_loss": -12.941547393798828, "global_step": 469012, "epoch": 2791} {"train_loss": -12.832258224487305, "global_step": 469013, "epoch": 2791} {"train_loss": -13.023015022277832, "global_step": 469014, "epoch": 2791} {"train_loss": -12.764432907104492, "global_step": 469015, "epoch": 2791} {"train_loss": -12.653787612915039, "global_step": 469016, "epoch": 2791} {"train_loss": -12.976337432861328, "global_step": 469017, "epoch": 2791} {"train_loss": -12.923554420471191, "global_step": 469018, "epoch": 2791} {"train_loss": -12.960538864135742, "global_step": 469019, "epoch": 2791} {"train_loss": -12.983116149902344, "global_step": 469020, "epoch": 2791} {"train_loss": -12.682197570800781, "global_step": 469021, "epoch": 2791} {"train_loss": -12.599702835083008, "global_step": 469022, "epoch": 2791} {"train_loss": -12.408735275268555, "global_step": 469023, "epoch": 2791} {"train_loss": -12.830976486206055, "global_step": 469024, "epoch": 2791} {"train_loss": -12.636041641235352, "global_step": 469025, "epoch": 2791} {"train_loss": -12.317505836486816, "global_step": 469026, "epoch": 2791} {"train_loss": -11.470898628234863, "global_step": 469027, "epoch": 2791} {"train_loss": -12.054817199707031, "global_step": 469028, "epoch": 2791} {"train_loss": -12.444368362426758, "global_step": 469029, "epoch": 2791} {"train_loss": -12.403022766113281, "global_step": 469030, "epoch": 2791} {"train_loss": -12.737794876098633, "global_step": 469031, "epoch": 2791} {"train_loss": -12.016533851623535, "global_step": 469032, "epoch": 2791} {"train_loss": -12.866842269897461, "global_step": 469033, "epoch": 2791} {"train_loss": -12.299478530883789, "global_step": 469034, "epoch": 2791} {"train_loss": -12.558713912963867, "global_step": 469035, "epoch": 2791} {"train_loss": -11.697856903076172, "global_step": 469036, "epoch": 2791} {"train_loss": -11.806915283203125, "global_step": 469037, "epoch": 2791} {"train_loss": -12.87700080871582, "global_step": 469038, "epoch": 2791} {"train_loss": -12.079096794128418, "global_step": 469039, "epoch": 2791} {"train_loss": -11.67898941040039, "global_step": 469040, "epoch": 2791} {"train_loss": -13.076505661010742, "global_step": 469041, "epoch": 2791} {"train_loss": -11.896295547485352, "global_step": 469042, "epoch": 2791} {"train_loss": -12.007345199584961, "global_step": 469043, "epoch": 2791} {"train_loss": -12.71656322479248, "global_step": 469044, "epoch": 2791} {"train_loss": -12.820940971374512, "global_step": 469045, "epoch": 2791} {"train_loss": -12.768277168273926, "global_step": 469046, "epoch": 2791} {"train_loss": -12.79228687286377, "global_step": 469047, "epoch": 2791} {"train_loss": -12.831291198730469, "global_step": 469048, "epoch": 2791} {"train_loss": -12.662673950195312, "global_step": 469049, "epoch": 2791} {"train_loss": -12.737253189086914, "global_step": 469050, "epoch": 2791} {"train_loss": -13.124185562133789, "global_step": 469051, "epoch": 2791} {"train_loss": -12.43541145324707, "global_step": 469052, "epoch": 2791} {"train_loss": -12.445428848266602, "global_step": 469053, "epoch": 2791} {"train_loss": -12.699423789978027, "global_step": 469054, "epoch": 2791} {"train_loss": -12.109812560535612, "global_step": 469055, "epoch": 2791, "val_loss": 317295.40625} {"train_loss": -12.767502784729004, "global_step": 469056, "epoch": 2792} {"train_loss": -12.634161949157715, "global_step": 469057, "epoch": 2792} {"train_loss": -12.307296752929688, "global_step": 469058, "epoch": 2792} {"train_loss": -12.455519676208496, "global_step": 469059, "epoch": 2792} {"train_loss": -12.513652801513672, "global_step": 469060, "epoch": 2792} {"train_loss": -12.913588523864746, "global_step": 469061, "epoch": 2792} {"train_loss": -12.235930442810059, "global_step": 469062, "epoch": 2792} {"train_loss": -11.940387725830078, "global_step": 469063, "epoch": 2792} {"train_loss": -12.056217193603516, "global_step": 469064, "epoch": 2792} {"train_loss": -12.13435173034668, "global_step": 469065, "epoch": 2792} {"train_loss": -12.532797813415527, "global_step": 469066, "epoch": 2792} {"train_loss": -12.598331451416016, "global_step": 469067, "epoch": 2792} {"train_loss": -12.640946388244629, "global_step": 469068, "epoch": 2792} {"train_loss": -12.041227340698242, "global_step": 469069, "epoch": 2792} {"train_loss": -12.554971694946289, "global_step": 469070, "epoch": 2792} {"train_loss": -12.446425437927246, "global_step": 469071, "epoch": 2792} {"train_loss": -12.314203262329102, "global_step": 469072, "epoch": 2792} {"train_loss": -12.352718353271484, "global_step": 469073, "epoch": 2792} {"train_loss": -12.363910675048828, "global_step": 469074, "epoch": 2792} {"train_loss": -12.177248001098633, "global_step": 469075, "epoch": 2792} {"train_loss": -11.758313179016113, "global_step": 469076, "epoch": 2792} {"train_loss": -12.48010540008545, "global_step": 469077, "epoch": 2792} {"train_loss": -12.018146514892578, "global_step": 469078, "epoch": 2792} {"train_loss": -12.426591873168945, "global_step": 469079, "epoch": 2792} {"train_loss": -12.349987030029297, "global_step": 469080, "epoch": 2792} {"train_loss": -11.477374076843262, "global_step": 469081, "epoch": 2792} {"train_loss": -11.970005989074707, "global_step": 469082, "epoch": 2792} {"train_loss": -11.779674530029297, "global_step": 469083, "epoch": 2792} {"train_loss": -11.893884658813477, "global_step": 469084, "epoch": 2792} {"train_loss": -11.255426406860352, "global_step": 469085, "epoch": 2792} {"train_loss": -10.565451622009277, "global_step": 469086, "epoch": 2792} {"train_loss": -11.685590744018555, "global_step": 469087, "epoch": 2792} {"train_loss": -11.131311416625977, "global_step": 469088, "epoch": 2792} {"train_loss": -11.176027297973633, "global_step": 469089, "epoch": 2792} {"train_loss": -11.469077110290527, "global_step": 469090, "epoch": 2792} {"train_loss": -11.764310836791992, "global_step": 469091, "epoch": 2792} {"train_loss": -11.951591491699219, "global_step": 469092, "epoch": 2792} {"train_loss": -11.618842124938965, "global_step": 469093, "epoch": 2792} {"train_loss": -11.83488655090332, "global_step": 469094, "epoch": 2792} {"train_loss": -11.388774871826172, "global_step": 469095, "epoch": 2792} {"train_loss": -12.21847915649414, "global_step": 469096, "epoch": 2792} {"train_loss": -11.466611862182617, "global_step": 469097, "epoch": 2792} {"train_loss": -11.695840835571289, "global_step": 469098, "epoch": 2792} {"train_loss": -11.240129470825195, "global_step": 469099, "epoch": 2792} {"train_loss": -12.516352653503418, "global_step": 469100, "epoch": 2792} {"train_loss": -11.797586441040039, "global_step": 469101, "epoch": 2792} {"train_loss": -11.924352645874023, "global_step": 469102, "epoch": 2792} {"train_loss": -10.922220230102539, "global_step": 469103, "epoch": 2792} {"train_loss": -10.86247444152832, "global_step": 469104, "epoch": 2792} {"train_loss": -12.095531463623047, "global_step": 469105, "epoch": 2792} {"train_loss": -10.630634307861328, "global_step": 469106, "epoch": 2792} {"train_loss": -11.098444938659668, "global_step": 469107, "epoch": 2792} {"train_loss": -11.46737289428711, "global_step": 469108, "epoch": 2792} {"train_loss": -11.202102661132812, "global_step": 469109, "epoch": 2792} {"train_loss": -10.343852996826172, "global_step": 469110, "epoch": 2792} {"train_loss": -11.784663200378418, "global_step": 469111, "epoch": 2792} {"train_loss": -10.053417205810547, "global_step": 469112, "epoch": 2792} {"train_loss": -11.239046096801758, "global_step": 469113, "epoch": 2792} {"train_loss": -10.673360824584961, "global_step": 469114, "epoch": 2792} {"train_loss": -11.66555404663086, "global_step": 469115, "epoch": 2792} {"train_loss": -11.262407302856445, "global_step": 469116, "epoch": 2792} {"train_loss": -11.33254623413086, "global_step": 469117, "epoch": 2792} {"train_loss": -11.667710304260254, "global_step": 469118, "epoch": 2792} {"train_loss": -11.378520011901855, "global_step": 469119, "epoch": 2792} {"train_loss": -12.058183670043945, "global_step": 469120, "epoch": 2792} {"train_loss": -11.557657241821289, "global_step": 469121, "epoch": 2792} {"train_loss": -11.666777610778809, "global_step": 469122, "epoch": 2792} {"train_loss": -10.918725967407227, "global_step": 469123, "epoch": 2792} {"train_loss": -11.544764518737793, "global_step": 469124, "epoch": 2792} {"train_loss": -11.631352424621582, "global_step": 469125, "epoch": 2792} {"train_loss": -10.445727348327637, "global_step": 469126, "epoch": 2792} {"train_loss": -11.072184562683105, "global_step": 469127, "epoch": 2792} {"train_loss": -10.924105644226074, "global_step": 469128, "epoch": 2792} {"train_loss": -10.876867294311523, "global_step": 469129, "epoch": 2792} {"train_loss": -10.598434448242188, "global_step": 469130, "epoch": 2792} {"train_loss": -11.987569808959961, "global_step": 469131, "epoch": 2792} {"train_loss": -10.281291961669922, "global_step": 469132, "epoch": 2792} {"train_loss": -11.854955673217773, "global_step": 469133, "epoch": 2792} {"train_loss": -11.883794784545898, "global_step": 469134, "epoch": 2792} {"train_loss": -11.387723922729492, "global_step": 469135, "epoch": 2792} {"train_loss": -11.404731750488281, "global_step": 469136, "epoch": 2792} {"train_loss": -12.428646087646484, "global_step": 469137, "epoch": 2792} {"train_loss": -11.381500244140625, "global_step": 469138, "epoch": 2792} {"train_loss": -12.078741073608398, "global_step": 469139, "epoch": 2792} {"train_loss": -11.885075569152832, "global_step": 469140, "epoch": 2792} {"train_loss": -11.719125747680664, "global_step": 469141, "epoch": 2792} {"train_loss": -12.521821975708008, "global_step": 469142, "epoch": 2792} {"train_loss": -12.408225059509277, "global_step": 469143, "epoch": 2792} {"train_loss": -12.22687816619873, "global_step": 469144, "epoch": 2792} {"train_loss": -12.353082656860352, "global_step": 469145, "epoch": 2792} {"train_loss": -12.097408294677734, "global_step": 469146, "epoch": 2792} {"train_loss": -11.879524230957031, "global_step": 469147, "epoch": 2792} {"train_loss": -12.577259063720703, "global_step": 469148, "epoch": 2792} {"train_loss": -11.564981460571289, "global_step": 469149, "epoch": 2792} {"train_loss": -12.332797050476074, "global_step": 469150, "epoch": 2792} {"train_loss": -11.746976852416992, "global_step": 469151, "epoch": 2792} {"train_loss": -11.92570686340332, "global_step": 469152, "epoch": 2792} {"train_loss": -11.97264289855957, "global_step": 469153, "epoch": 2792} {"train_loss": -12.013147354125977, "global_step": 469154, "epoch": 2792} {"train_loss": -12.05197811126709, "global_step": 469155, "epoch": 2792} {"train_loss": -12.125276565551758, "global_step": 469156, "epoch": 2792} {"train_loss": -12.061119079589844, "global_step": 469157, "epoch": 2792} {"train_loss": -12.01680850982666, "global_step": 469158, "epoch": 2792} {"train_loss": -12.197202682495117, "global_step": 469159, "epoch": 2792} {"train_loss": -11.906331062316895, "global_step": 469160, "epoch": 2792} {"train_loss": -12.377849578857422, "global_step": 469161, "epoch": 2792} {"train_loss": -12.074536323547363, "global_step": 469162, "epoch": 2792} {"train_loss": -12.261273384094238, "global_step": 469163, "epoch": 2792} {"train_loss": -12.121627807617188, "global_step": 469164, "epoch": 2792} {"train_loss": -12.352167129516602, "global_step": 469165, "epoch": 2792} {"train_loss": -12.194058418273926, "global_step": 469166, "epoch": 2792} {"train_loss": -12.328737258911133, "global_step": 469167, "epoch": 2792} {"train_loss": -11.957491874694824, "global_step": 469168, "epoch": 2792} {"train_loss": -11.974859237670898, "global_step": 469169, "epoch": 2792} {"train_loss": -12.188045501708984, "global_step": 469170, "epoch": 2792} {"train_loss": -12.195101737976074, "global_step": 469171, "epoch": 2792} {"train_loss": -12.285538673400879, "global_step": 469172, "epoch": 2792} {"train_loss": -12.281801223754883, "global_step": 469173, "epoch": 2792} {"train_loss": -12.361146926879883, "global_step": 469174, "epoch": 2792} {"train_loss": -12.519613265991211, "global_step": 469175, "epoch": 2792} {"train_loss": -12.688189506530762, "global_step": 469176, "epoch": 2792} {"train_loss": -12.501338005065918, "global_step": 469177, "epoch": 2792} {"train_loss": -12.395841598510742, "global_step": 469178, "epoch": 2792} {"train_loss": -12.57023811340332, "global_step": 469179, "epoch": 2792} {"train_loss": -12.507741928100586, "global_step": 469180, "epoch": 2792} {"train_loss": -12.638673782348633, "global_step": 469181, "epoch": 2792} {"train_loss": -12.603867530822754, "global_step": 469182, "epoch": 2792} {"train_loss": -12.674036979675293, "global_step": 469183, "epoch": 2792} {"train_loss": -12.531722068786621, "global_step": 469184, "epoch": 2792} {"train_loss": -12.795113563537598, "global_step": 469185, "epoch": 2792} {"train_loss": -12.371322631835938, "global_step": 469186, "epoch": 2792} {"train_loss": -12.680436134338379, "global_step": 469187, "epoch": 2792} {"train_loss": -12.695155143737793, "global_step": 469188, "epoch": 2792} {"train_loss": -12.38788890838623, "global_step": 469189, "epoch": 2792} {"train_loss": -12.538504600524902, "global_step": 469190, "epoch": 2792} {"train_loss": -12.6099271774292, "global_step": 469191, "epoch": 2792} {"train_loss": -12.74854564666748, "global_step": 469192, "epoch": 2792} {"train_loss": -12.14086627960205, "global_step": 469193, "epoch": 2792} {"train_loss": -11.677664756774902, "global_step": 469194, "epoch": 2792} {"train_loss": -12.515002250671387, "global_step": 469195, "epoch": 2792} {"train_loss": -12.336614608764648, "global_step": 469196, "epoch": 2792} {"train_loss": -11.765083312988281, "global_step": 469197, "epoch": 2792} {"train_loss": -12.550207138061523, "global_step": 469198, "epoch": 2792} {"train_loss": -12.343714714050293, "global_step": 469199, "epoch": 2792} {"train_loss": -12.264519691467285, "global_step": 469200, "epoch": 2792} {"train_loss": -12.609631538391113, "global_step": 469201, "epoch": 2792} {"train_loss": -12.429951667785645, "global_step": 469202, "epoch": 2792} {"train_loss": -12.541034698486328, "global_step": 469203, "epoch": 2792} {"train_loss": -12.663323402404785, "global_step": 469204, "epoch": 2792} {"train_loss": -12.809991836547852, "global_step": 469205, "epoch": 2792} {"train_loss": -12.61276626586914, "global_step": 469206, "epoch": 2792} {"train_loss": -12.85728645324707, "global_step": 469207, "epoch": 2792} {"train_loss": -12.735250473022461, "global_step": 469208, "epoch": 2792} {"train_loss": -12.752989768981934, "global_step": 469209, "epoch": 2792} {"train_loss": -12.610595703125, "global_step": 469210, "epoch": 2792} {"train_loss": -12.787773132324219, "global_step": 469211, "epoch": 2792} {"train_loss": -12.642160415649414, "global_step": 469212, "epoch": 2792} {"train_loss": -12.841039657592773, "global_step": 469213, "epoch": 2792} {"train_loss": -12.871833801269531, "global_step": 469214, "epoch": 2792} {"train_loss": -12.914506912231445, "global_step": 469215, "epoch": 2792} {"train_loss": -12.847476959228516, "global_step": 469216, "epoch": 2792} {"train_loss": -12.741846084594727, "global_step": 469217, "epoch": 2792} {"train_loss": -12.627656936645508, "global_step": 469218, "epoch": 2792} {"train_loss": -12.676610946655273, "global_step": 469219, "epoch": 2792} {"train_loss": -12.936691284179688, "global_step": 469220, "epoch": 2792} {"train_loss": -12.709901809692383, "global_step": 469221, "epoch": 2792} {"train_loss": -12.719362258911133, "global_step": 469222, "epoch": 2792} {"train_loss": -12.047794801848275, "global_step": 469223, "epoch": 2792, "val_loss": 316534.8125} {"train_loss": -12.670934677124023, "global_step": 469224, "epoch": 2793} {"train_loss": -12.665497779846191, "global_step": 469225, "epoch": 2793} {"train_loss": -12.903097152709961, "global_step": 469226, "epoch": 2793} {"train_loss": -12.808572769165039, "global_step": 469227, "epoch": 2793} {"train_loss": -12.989480018615723, "global_step": 469228, "epoch": 2793} {"train_loss": -12.818132400512695, "global_step": 469229, "epoch": 2793} {"train_loss": -12.920775413513184, "global_step": 469230, "epoch": 2793} {"train_loss": -12.871454238891602, "global_step": 469231, "epoch": 2793} {"train_loss": -12.867574691772461, "global_step": 469232, "epoch": 2793} {"train_loss": -12.834444046020508, "global_step": 469233, "epoch": 2793} {"train_loss": -12.859989166259766, "global_step": 469234, "epoch": 2793} {"train_loss": -13.038896560668945, "global_step": 469235, "epoch": 2793} {"train_loss": -12.838678359985352, "global_step": 469236, "epoch": 2793} {"train_loss": -12.877267837524414, "global_step": 469237, "epoch": 2793} {"train_loss": -12.793058395385742, "global_step": 469238, "epoch": 2793} {"train_loss": -13.035638809204102, "global_step": 469239, "epoch": 2793} {"train_loss": -12.853185653686523, "global_step": 469240, "epoch": 2793} {"train_loss": -12.411067008972168, "global_step": 469241, "epoch": 2793} {"train_loss": -12.672343254089355, "global_step": 469242, "epoch": 2793} {"train_loss": -13.007871627807617, "global_step": 469243, "epoch": 2793} {"train_loss": -12.393743515014648, "global_step": 469244, "epoch": 2793} {"train_loss": -11.884900093078613, "global_step": 469245, "epoch": 2793} {"train_loss": -11.314085006713867, "global_step": 469246, "epoch": 2793} {"train_loss": -11.243894577026367, "global_step": 469247, "epoch": 2793} {"train_loss": -12.123924255371094, "global_step": 469248, "epoch": 2793} {"train_loss": -10.444960594177246, "global_step": 469249, "epoch": 2793} {"train_loss": -12.289400100708008, "global_step": 469250, "epoch": 2793} {"train_loss": -10.256760597229004, "global_step": 469251, "epoch": 2793} {"train_loss": -11.842203140258789, "global_step": 469252, "epoch": 2793} {"train_loss": -11.670902252197266, "global_step": 469253, "epoch": 2793} {"train_loss": -11.228372573852539, "global_step": 469254, "epoch": 2793} {"train_loss": -11.20941162109375, "global_step": 469255, "epoch": 2793} {"train_loss": -12.00239372253418, "global_step": 469256, "epoch": 2793} {"train_loss": -11.75958251953125, "global_step": 469257, "epoch": 2793} {"train_loss": -11.041292190551758, "global_step": 469258, "epoch": 2793} {"train_loss": -10.56959056854248, "global_step": 469259, "epoch": 2793} {"train_loss": -11.226997375488281, "global_step": 469260, "epoch": 2793} {"train_loss": -11.29179573059082, "global_step": 469261, "epoch": 2793} {"train_loss": -11.724966049194336, "global_step": 469262, "epoch": 2793} {"train_loss": -11.503580093383789, "global_step": 469263, "epoch": 2793} {"train_loss": -11.869248390197754, "global_step": 469264, "epoch": 2793} {"train_loss": -11.429698944091797, "global_step": 469265, "epoch": 2793} {"train_loss": -11.033462524414062, "global_step": 469266, "epoch": 2793} {"train_loss": -11.456974029541016, "global_step": 469267, "epoch": 2793} {"train_loss": -10.671178817749023, "global_step": 469268, "epoch": 2793} {"train_loss": -11.810063362121582, "global_step": 469269, "epoch": 2793} {"train_loss": -9.209503173828125, "global_step": 469270, "epoch": 2793} {"train_loss": -9.964550971984863, "global_step": 469271, "epoch": 2793} {"train_loss": -10.084005355834961, "global_step": 469272, "epoch": 2793} {"train_loss": -11.528183937072754, "global_step": 469273, "epoch": 2793} {"train_loss": -11.118921279907227, "global_step": 469274, "epoch": 2793} {"train_loss": -9.54655933380127, "global_step": 469275, "epoch": 2793} {"train_loss": -9.394134521484375, "global_step": 469276, "epoch": 2793} {"train_loss": -9.270092010498047, "global_step": 469277, "epoch": 2793} {"train_loss": -10.351418495178223, "global_step": 469278, "epoch": 2793} {"train_loss": -10.017416954040527, "global_step": 469279, "epoch": 2793} {"train_loss": -10.090263366699219, "global_step": 469280, "epoch": 2793} {"train_loss": -10.877080917358398, "global_step": 469281, "epoch": 2793} {"train_loss": -11.069740295410156, "global_step": 469282, "epoch": 2793} {"train_loss": -10.804463386535645, "global_step": 469283, "epoch": 2793} {"train_loss": -11.705488204956055, "global_step": 469284, "epoch": 2793} {"train_loss": -11.472674369812012, "global_step": 469285, "epoch": 2793} {"train_loss": -11.340838432312012, "global_step": 469286, "epoch": 2793} {"train_loss": -11.437923431396484, "global_step": 469287, "epoch": 2793} {"train_loss": -10.993487358093262, "global_step": 469288, "epoch": 2793} {"train_loss": -11.488250732421875, "global_step": 469289, "epoch": 2793} {"train_loss": -11.401947021484375, "global_step": 469290, "epoch": 2793} {"train_loss": -11.206984519958496, "global_step": 469291, "epoch": 2793} {"train_loss": -11.516411781311035, "global_step": 469292, "epoch": 2793} {"train_loss": -11.6353120803833, "global_step": 469293, "epoch": 2793} {"train_loss": -11.523380279541016, "global_step": 469294, "epoch": 2793} {"train_loss": -11.06834602355957, "global_step": 469295, "epoch": 2793} {"train_loss": -11.558614730834961, "global_step": 469296, "epoch": 2793} {"train_loss": -11.696212768554688, "global_step": 469297, "epoch": 2793} {"train_loss": -11.339096069335938, "global_step": 469298, "epoch": 2793} {"train_loss": -11.867000579833984, "global_step": 469299, "epoch": 2793} {"train_loss": -11.775968551635742, "global_step": 469300, "epoch": 2793} {"train_loss": -11.999824523925781, "global_step": 469301, "epoch": 2793} {"train_loss": -12.355449676513672, "global_step": 469302, "epoch": 2793} {"train_loss": -11.914152145385742, "global_step": 469303, "epoch": 2793} {"train_loss": -12.047294616699219, "global_step": 469304, "epoch": 2793} {"train_loss": -12.302401542663574, "global_step": 469305, "epoch": 2793} {"train_loss": -11.700384140014648, "global_step": 469306, "epoch": 2793} {"train_loss": -11.683341979980469, "global_step": 469307, "epoch": 2793} {"train_loss": -12.154008865356445, "global_step": 469308, "epoch": 2793} {"train_loss": -11.67101001739502, "global_step": 469309, "epoch": 2793} {"train_loss": -11.960180282592773, "global_step": 469310, "epoch": 2793} {"train_loss": -11.960319519042969, "global_step": 469311, "epoch": 2793} {"train_loss": -12.253422737121582, "global_step": 469312, "epoch": 2793} {"train_loss": -11.767240524291992, "global_step": 469313, "epoch": 2793} {"train_loss": -11.766090393066406, "global_step": 469314, "epoch": 2793} {"train_loss": -12.297364234924316, "global_step": 469315, "epoch": 2793} {"train_loss": -12.111580848693848, "global_step": 469316, "epoch": 2793} {"train_loss": -12.131572723388672, "global_step": 469317, "epoch": 2793} {"train_loss": -11.693286895751953, "global_step": 469318, "epoch": 2793} {"train_loss": -12.40456771850586, "global_step": 469319, "epoch": 2793} {"train_loss": -11.628387451171875, "global_step": 469320, "epoch": 2793} {"train_loss": -12.227502822875977, "global_step": 469321, "epoch": 2793} {"train_loss": -11.3910551071167, "global_step": 469322, "epoch": 2793} {"train_loss": -12.369483947753906, "global_step": 469323, "epoch": 2793} {"train_loss": -11.862987518310547, "global_step": 469324, "epoch": 2793} {"train_loss": -12.199189186096191, "global_step": 469325, "epoch": 2793} {"train_loss": -12.113340377807617, "global_step": 469326, "epoch": 2793} {"train_loss": -12.405526161193848, "global_step": 469327, "epoch": 2793} {"train_loss": -12.369383811950684, "global_step": 469328, "epoch": 2793} {"train_loss": -12.20236587524414, "global_step": 469329, "epoch": 2793} {"train_loss": -12.449016571044922, "global_step": 469330, "epoch": 2793} {"train_loss": -12.47590446472168, "global_step": 469331, "epoch": 2793} {"train_loss": -12.400278091430664, "global_step": 469332, "epoch": 2793} {"train_loss": -12.594548225402832, "global_step": 469333, "epoch": 2793} {"train_loss": -12.438879013061523, "global_step": 469334, "epoch": 2793} {"train_loss": -12.568021774291992, "global_step": 469335, "epoch": 2793} {"train_loss": -12.471782684326172, "global_step": 469336, "epoch": 2793} {"train_loss": -12.744197845458984, "global_step": 469337, "epoch": 2793} {"train_loss": -12.483502388000488, "global_step": 469338, "epoch": 2793} {"train_loss": -12.850698471069336, "global_step": 469339, "epoch": 2793} {"train_loss": -12.6066255569458, "global_step": 469340, "epoch": 2793} {"train_loss": -12.781896591186523, "global_step": 469341, "epoch": 2793} {"train_loss": -12.433770179748535, "global_step": 469342, "epoch": 2793} {"train_loss": -12.647333145141602, "global_step": 469343, "epoch": 2793} {"train_loss": -12.708198547363281, "global_step": 469344, "epoch": 2793} {"train_loss": -12.888648986816406, "global_step": 469345, "epoch": 2793} {"train_loss": -12.795377731323242, "global_step": 469346, "epoch": 2793} {"train_loss": -12.910348892211914, "global_step": 469347, "epoch": 2793} {"train_loss": -12.779438018798828, "global_step": 469348, "epoch": 2793} {"train_loss": -12.844476699829102, "global_step": 469349, "epoch": 2793} {"train_loss": -12.632668495178223, "global_step": 469350, "epoch": 2793} {"train_loss": -12.868316650390625, "global_step": 469351, "epoch": 2793} {"train_loss": -12.566484451293945, "global_step": 469352, "epoch": 2793} {"train_loss": -12.531854629516602, "global_step": 469353, "epoch": 2793} {"train_loss": -12.811779022216797, "global_step": 469354, "epoch": 2793} {"train_loss": -12.734525680541992, "global_step": 469355, "epoch": 2793} {"train_loss": -12.793755531311035, "global_step": 469356, "epoch": 2793} {"train_loss": -12.753108978271484, "global_step": 469357, "epoch": 2793} {"train_loss": -12.777326583862305, "global_step": 469358, "epoch": 2793} {"train_loss": -12.847587585449219, "global_step": 469359, "epoch": 2793} {"train_loss": -12.951504707336426, "global_step": 469360, "epoch": 2793} {"train_loss": -12.839301109313965, "global_step": 469361, "epoch": 2793} {"train_loss": -13.010293960571289, "global_step": 469362, "epoch": 2793} {"train_loss": -12.674360275268555, "global_step": 469363, "epoch": 2793} {"train_loss": -12.857379913330078, "global_step": 469364, "epoch": 2793} {"train_loss": -12.956844329833984, "global_step": 469365, "epoch": 2793} {"train_loss": -12.904548645019531, "global_step": 469366, "epoch": 2793} {"train_loss": -12.736808776855469, "global_step": 469367, "epoch": 2793} {"train_loss": -12.94720458984375, "global_step": 469368, "epoch": 2793} {"train_loss": -12.911386489868164, "global_step": 469369, "epoch": 2793} {"train_loss": -12.876426696777344, "global_step": 469370, "epoch": 2793} {"train_loss": -12.871222496032715, "global_step": 469371, "epoch": 2793} {"train_loss": -12.76041316986084, "global_step": 469372, "epoch": 2793} {"train_loss": -12.545058250427246, "global_step": 469373, "epoch": 2793} {"train_loss": -12.510124206542969, "global_step": 469374, "epoch": 2793} {"train_loss": -13.015958786010742, "global_step": 469375, "epoch": 2793} {"train_loss": -12.400887489318848, "global_step": 469376, "epoch": 2793} {"train_loss": -12.701055526733398, "global_step": 469377, "epoch": 2793} {"train_loss": -12.8650541305542, "global_step": 469378, "epoch": 2793} {"train_loss": -12.701604843139648, "global_step": 469379, "epoch": 2793} {"train_loss": -12.584113121032715, "global_step": 469380, "epoch": 2793} {"train_loss": -12.660926818847656, "global_step": 469381, "epoch": 2793} {"train_loss": -12.92240047454834, "global_step": 469382, "epoch": 2793} {"train_loss": -13.002446174621582, "global_step": 469383, "epoch": 2793} {"train_loss": -12.645735740661621, "global_step": 469384, "epoch": 2793} {"train_loss": -12.69456958770752, "global_step": 469385, "epoch": 2793} {"train_loss": -12.973041534423828, "global_step": 469386, "epoch": 2793} {"train_loss": -12.832257270812988, "global_step": 469387, "epoch": 2793} {"train_loss": -12.882387161254883, "global_step": 469388, "epoch": 2793} {"train_loss": -12.687801361083984, "global_step": 469389, "epoch": 2793} {"train_loss": -12.83825397491455, "global_step": 469390, "epoch": 2793} {"train_loss": -12.089541963168553, "global_step": 469391, "epoch": 2793, "val_loss": 317312.15625} {"train_loss": -12.772872924804688, "global_step": 469392, "epoch": 2794} {"train_loss": -13.083581924438477, "global_step": 469393, "epoch": 2794} {"train_loss": -13.02484130859375, "global_step": 469394, "epoch": 2794} {"train_loss": -12.787755966186523, "global_step": 469395, "epoch": 2794} {"train_loss": -12.918922424316406, "global_step": 469396, "epoch": 2794} {"train_loss": -12.959848403930664, "global_step": 469397, "epoch": 2794} {"train_loss": -12.39881706237793, "global_step": 469398, "epoch": 2794} {"train_loss": -12.764873504638672, "global_step": 469399, "epoch": 2794} {"train_loss": -12.82400894165039, "global_step": 469400, "epoch": 2794} {"train_loss": -12.946941375732422, "global_step": 469401, "epoch": 2794} {"train_loss": -12.897285461425781, "global_step": 469402, "epoch": 2794} {"train_loss": -13.08737564086914, "global_step": 469403, "epoch": 2794} {"train_loss": -12.782491683959961, "global_step": 469404, "epoch": 2794} {"train_loss": -12.668593406677246, "global_step": 469405, "epoch": 2794} {"train_loss": -12.75912094116211, "global_step": 469406, "epoch": 2794} {"train_loss": -12.918925285339355, "global_step": 469407, "epoch": 2794} {"train_loss": -12.730106353759766, "global_step": 469408, "epoch": 2794} {"train_loss": -12.514583587646484, "global_step": 469409, "epoch": 2794} {"train_loss": -11.960406303405762, "global_step": 469410, "epoch": 2794} {"train_loss": -11.733076095581055, "global_step": 469411, "epoch": 2794} {"train_loss": -12.313823699951172, "global_step": 469412, "epoch": 2794} {"train_loss": -12.24833869934082, "global_step": 469413, "epoch": 2794} {"train_loss": -11.36306095123291, "global_step": 469414, "epoch": 2794} {"train_loss": -9.721416473388672, "global_step": 469415, "epoch": 2794} {"train_loss": -10.564624786376953, "global_step": 469416, "epoch": 2794} {"train_loss": -12.582378387451172, "global_step": 469417, "epoch": 2794} {"train_loss": -9.539258003234863, "global_step": 469418, "epoch": 2794} {"train_loss": -11.1821870803833, "global_step": 469419, "epoch": 2794} {"train_loss": -10.674383163452148, "global_step": 469420, "epoch": 2794} {"train_loss": -9.378618240356445, "global_step": 469421, "epoch": 2794} {"train_loss": -12.348270416259766, "global_step": 469422, "epoch": 2794} {"train_loss": -9.604743957519531, "global_step": 469423, "epoch": 2794} {"train_loss": -10.555492401123047, "global_step": 469424, "epoch": 2794} {"train_loss": -11.749747276306152, "global_step": 469425, "epoch": 2794} {"train_loss": -10.074528694152832, "global_step": 469426, "epoch": 2794} {"train_loss": -11.251029014587402, "global_step": 469427, "epoch": 2794} {"train_loss": -11.438417434692383, "global_step": 469428, "epoch": 2794} {"train_loss": -10.658857345581055, "global_step": 469429, "epoch": 2794} {"train_loss": -10.569093704223633, "global_step": 469430, "epoch": 2794} {"train_loss": -8.736701965332031, "global_step": 469431, "epoch": 2794} {"train_loss": -7.883788585662842, "global_step": 469432, "epoch": 2794} {"train_loss": -9.209593772888184, "global_step": 469433, "epoch": 2794} {"train_loss": -9.459293365478516, "global_step": 469434, "epoch": 2794} {"train_loss": -9.007614135742188, "global_step": 469435, "epoch": 2794} {"train_loss": -8.981554985046387, "global_step": 469436, "epoch": 2794} {"train_loss": -10.28927993774414, "global_step": 469437, "epoch": 2794} {"train_loss": -9.634208679199219, "global_step": 469438, "epoch": 2794} {"train_loss": -11.506213188171387, "global_step": 469439, "epoch": 2794} {"train_loss": -11.274553298950195, "global_step": 469440, "epoch": 2794} {"train_loss": -10.816234588623047, "global_step": 469441, "epoch": 2794} {"train_loss": -11.645456314086914, "global_step": 469442, "epoch": 2794} {"train_loss": -10.973320007324219, "global_step": 469443, "epoch": 2794} {"train_loss": -11.413439750671387, "global_step": 469444, "epoch": 2794} {"train_loss": -11.363040924072266, "global_step": 469445, "epoch": 2794} {"train_loss": -11.355031967163086, "global_step": 469446, "epoch": 2794} {"train_loss": -11.72571086883545, "global_step": 469447, "epoch": 2794} {"train_loss": -11.818342208862305, "global_step": 469448, "epoch": 2794} {"train_loss": -11.264104843139648, "global_step": 469449, "epoch": 2794} {"train_loss": -11.114603042602539, "global_step": 469450, "epoch": 2794} {"train_loss": -11.192142486572266, "global_step": 469451, "epoch": 2794} {"train_loss": -11.007408142089844, "global_step": 469452, "epoch": 2794} {"train_loss": -12.066024780273438, "global_step": 469453, "epoch": 2794} {"train_loss": -10.926271438598633, "global_step": 469454, "epoch": 2794} {"train_loss": -11.169733047485352, "global_step": 469455, "epoch": 2794} {"train_loss": -11.559713363647461, "global_step": 469456, "epoch": 2794} {"train_loss": -11.053287506103516, "global_step": 469457, "epoch": 2794} {"train_loss": -11.76388931274414, "global_step": 469458, "epoch": 2794} {"train_loss": -11.426223754882812, "global_step": 469459, "epoch": 2794} {"train_loss": -11.657588005065918, "global_step": 469460, "epoch": 2794} {"train_loss": -11.478194236755371, "global_step": 469461, "epoch": 2794} {"train_loss": -11.640195846557617, "global_step": 469462, "epoch": 2794} {"train_loss": -11.449504852294922, "global_step": 469463, "epoch": 2794} {"train_loss": -11.202281951904297, "global_step": 469464, "epoch": 2794} {"train_loss": -11.19478702545166, "global_step": 469465, "epoch": 2794} {"train_loss": -11.452510833740234, "global_step": 469466, "epoch": 2794} {"train_loss": -10.555486679077148, "global_step": 469467, "epoch": 2794} {"train_loss": -10.69951057434082, "global_step": 469468, "epoch": 2794} {"train_loss": -11.641148567199707, "global_step": 469469, "epoch": 2794} {"train_loss": -10.99258804321289, "global_step": 469470, "epoch": 2794} {"train_loss": -11.005475997924805, "global_step": 469471, "epoch": 2794} {"train_loss": -11.31837272644043, "global_step": 469472, "epoch": 2794} {"train_loss": -11.168787002563477, "global_step": 469473, "epoch": 2794} {"train_loss": -11.552927017211914, "global_step": 469474, "epoch": 2794} {"train_loss": -11.643417358398438, "global_step": 469475, "epoch": 2794} {"train_loss": -11.544031143188477, "global_step": 469476, "epoch": 2794} {"train_loss": -11.74022102355957, "global_step": 469477, "epoch": 2794} {"train_loss": -11.019916534423828, "global_step": 469478, "epoch": 2794} {"train_loss": -11.833967208862305, "global_step": 469479, "epoch": 2794} {"train_loss": -12.132941246032715, "global_step": 469480, "epoch": 2794} {"train_loss": -11.944034576416016, "global_step": 469481, "epoch": 2794} {"train_loss": -12.138934135437012, "global_step": 469482, "epoch": 2794} {"train_loss": -12.218713760375977, "global_step": 469483, "epoch": 2794} {"train_loss": -12.022224426269531, "global_step": 469484, "epoch": 2794} {"train_loss": -12.2471342086792, "global_step": 469485, "epoch": 2794} {"train_loss": -11.790340423583984, "global_step": 469486, "epoch": 2794} {"train_loss": -12.354427337646484, "global_step": 469487, "epoch": 2794} {"train_loss": -12.03126335144043, "global_step": 469488, "epoch": 2794} {"train_loss": -12.163923263549805, "global_step": 469489, "epoch": 2794} {"train_loss": -11.540777206420898, "global_step": 469490, "epoch": 2794} {"train_loss": -11.632146835327148, "global_step": 469491, "epoch": 2794} {"train_loss": -11.404417037963867, "global_step": 469492, "epoch": 2794} {"train_loss": -12.00120735168457, "global_step": 469493, "epoch": 2794} {"train_loss": -11.7686185836792, "global_step": 469494, "epoch": 2794} {"train_loss": -12.296066284179688, "global_step": 469495, "epoch": 2794} {"train_loss": -11.491464614868164, "global_step": 469496, "epoch": 2794} {"train_loss": -12.180146217346191, "global_step": 469497, "epoch": 2794} {"train_loss": -11.692522048950195, "global_step": 469498, "epoch": 2794} {"train_loss": -12.410812377929688, "global_step": 469499, "epoch": 2794} {"train_loss": -11.739058494567871, "global_step": 469500, "epoch": 2794} {"train_loss": -11.933180809020996, "global_step": 469501, "epoch": 2794} {"train_loss": -11.54018783569336, "global_step": 469502, "epoch": 2794} {"train_loss": -11.958858489990234, "global_step": 469503, "epoch": 2794} {"train_loss": -11.884840965270996, "global_step": 469504, "epoch": 2794} {"train_loss": -11.999711990356445, "global_step": 469505, "epoch": 2794} {"train_loss": -11.955371856689453, "global_step": 469506, "epoch": 2794} {"train_loss": -11.969085693359375, "global_step": 469507, "epoch": 2794} {"train_loss": -12.209220886230469, "global_step": 469508, "epoch": 2794} {"train_loss": -12.212533950805664, "global_step": 469509, "epoch": 2794} {"train_loss": -12.601852416992188, "global_step": 469510, "epoch": 2794} {"train_loss": -12.091455459594727, "global_step": 469511, "epoch": 2794} {"train_loss": -12.423230171203613, "global_step": 469512, "epoch": 2794} {"train_loss": -12.18656063079834, "global_step": 469513, "epoch": 2794} {"train_loss": -12.209298133850098, "global_step": 469514, "epoch": 2794} {"train_loss": -12.156441688537598, "global_step": 469515, "epoch": 2794} {"train_loss": -12.393943786621094, "global_step": 469516, "epoch": 2794} {"train_loss": -12.441669464111328, "global_step": 469517, "epoch": 2794} {"train_loss": -12.472639083862305, "global_step": 469518, "epoch": 2794} {"train_loss": -12.186564445495605, "global_step": 469519, "epoch": 2794} {"train_loss": -12.678914070129395, "global_step": 469520, "epoch": 2794} {"train_loss": -12.277687072753906, "global_step": 469521, "epoch": 2794} {"train_loss": -12.421951293945312, "global_step": 469522, "epoch": 2794} {"train_loss": -12.471866607666016, "global_step": 469523, "epoch": 2794} {"train_loss": -12.395223617553711, "global_step": 469524, "epoch": 2794} {"train_loss": -12.363983154296875, "global_step": 469525, "epoch": 2794} {"train_loss": -12.507944107055664, "global_step": 469526, "epoch": 2794} {"train_loss": -12.316845893859863, "global_step": 469527, "epoch": 2794} {"train_loss": -12.58546257019043, "global_step": 469528, "epoch": 2794} {"train_loss": -12.510688781738281, "global_step": 469529, "epoch": 2794} {"train_loss": -12.566194534301758, "global_step": 469530, "epoch": 2794} {"train_loss": -12.519942283630371, "global_step": 469531, "epoch": 2794} {"train_loss": -12.714305877685547, "global_step": 469532, "epoch": 2794} {"train_loss": -12.34154987335205, "global_step": 469533, "epoch": 2794} {"train_loss": -12.61501693725586, "global_step": 469534, "epoch": 2794} {"train_loss": -12.55052375793457, "global_step": 469535, "epoch": 2794} {"train_loss": -12.884597778320312, "global_step": 469536, "epoch": 2794} {"train_loss": -12.54455852508545, "global_step": 469537, "epoch": 2794} {"train_loss": -12.29386043548584, "global_step": 469538, "epoch": 2794} {"train_loss": -12.608004570007324, "global_step": 469539, "epoch": 2794} {"train_loss": -12.725940704345703, "global_step": 469540, "epoch": 2794} {"train_loss": -12.744467735290527, "global_step": 469541, "epoch": 2794} {"train_loss": -12.58085823059082, "global_step": 469542, "epoch": 2794} {"train_loss": -12.606637954711914, "global_step": 469543, "epoch": 2794} {"train_loss": -12.55793285369873, "global_step": 469544, "epoch": 2794} {"train_loss": -12.54895305633545, "global_step": 469545, "epoch": 2794} {"train_loss": -12.520471572875977, "global_step": 469546, "epoch": 2794} {"train_loss": -12.620689392089844, "global_step": 469547, "epoch": 2794} {"train_loss": -12.808271408081055, "global_step": 469548, "epoch": 2794} {"train_loss": -12.614673614501953, "global_step": 469549, "epoch": 2794} {"train_loss": -12.541179656982422, "global_step": 469550, "epoch": 2794} {"train_loss": -12.773944854736328, "global_step": 469551, "epoch": 2794} {"train_loss": -12.508659362792969, "global_step": 469552, "epoch": 2794} {"train_loss": -12.544662475585938, "global_step": 469553, "epoch": 2794} {"train_loss": -12.81010627746582, "global_step": 469554, "epoch": 2794} {"train_loss": -12.224589347839355, "global_step": 469555, "epoch": 2794} {"train_loss": -12.680301666259766, "global_step": 469556, "epoch": 2794} {"train_loss": -12.751241683959961, "global_step": 469557, "epoch": 2794} {"train_loss": -12.808292388916016, "global_step": 469558, "epoch": 2794} {"train_loss": -11.81887358994711, "global_step": 469559, "epoch": 2794, "val_loss": 314361.40625} {"train_loss": -12.770073890686035, "global_step": 469560, "epoch": 2795} {"train_loss": -12.644033432006836, "global_step": 469561, "epoch": 2795} {"train_loss": -12.891683578491211, "global_step": 469562, "epoch": 2795} {"train_loss": -12.574493408203125, "global_step": 469563, "epoch": 2795} {"train_loss": -12.581581115722656, "global_step": 469564, "epoch": 2795} {"train_loss": -12.717306137084961, "global_step": 469565, "epoch": 2795} {"train_loss": -12.794811248779297, "global_step": 469566, "epoch": 2795} {"train_loss": -12.882524490356445, "global_step": 469567, "epoch": 2795} {"train_loss": -12.585235595703125, "global_step": 469568, "epoch": 2795} {"train_loss": -12.816526412963867, "global_step": 469569, "epoch": 2795} {"train_loss": -13.06474494934082, "global_step": 469570, "epoch": 2795} {"train_loss": -12.870296478271484, "global_step": 469571, "epoch": 2795} {"train_loss": -12.849366188049316, "global_step": 469572, "epoch": 2795} {"train_loss": -12.959991455078125, "global_step": 469573, "epoch": 2795} {"train_loss": -12.897405624389648, "global_step": 469574, "epoch": 2795} {"train_loss": -12.934246063232422, "global_step": 469575, "epoch": 2795} {"train_loss": -13.118524551391602, "global_step": 469576, "epoch": 2795} {"train_loss": -12.811888694763184, "global_step": 469577, "epoch": 2795} {"train_loss": -12.916986465454102, "global_step": 469578, "epoch": 2795} {"train_loss": -13.169859886169434, "global_step": 469579, "epoch": 2795} {"train_loss": -12.942440032958984, "global_step": 469580, "epoch": 2795} {"train_loss": -12.915806770324707, "global_step": 469581, "epoch": 2795} {"train_loss": -12.380176544189453, "global_step": 469582, "epoch": 2795} {"train_loss": -12.770837783813477, "global_step": 469583, "epoch": 2795} {"train_loss": -12.83731460571289, "global_step": 469584, "epoch": 2795} {"train_loss": -12.607294082641602, "global_step": 469585, "epoch": 2795} {"train_loss": -12.803550720214844, "global_step": 469586, "epoch": 2795} {"train_loss": -13.022980690002441, "global_step": 469587, "epoch": 2795} {"train_loss": -12.970808982849121, "global_step": 469588, "epoch": 2795} {"train_loss": -13.083074569702148, "global_step": 469589, "epoch": 2795} {"train_loss": -12.42557144165039, "global_step": 469590, "epoch": 2795} {"train_loss": -12.978330612182617, "global_step": 469591, "epoch": 2795} {"train_loss": -12.893465995788574, "global_step": 469592, "epoch": 2795} {"train_loss": -12.806665420532227, "global_step": 469593, "epoch": 2795} {"train_loss": -12.93639087677002, "global_step": 469594, "epoch": 2795} {"train_loss": -13.037991523742676, "global_step": 469595, "epoch": 2795} {"train_loss": -12.888404846191406, "global_step": 469596, "epoch": 2795} {"train_loss": -12.962430953979492, "global_step": 469597, "epoch": 2795} {"train_loss": -12.942817687988281, "global_step": 469598, "epoch": 2795} {"train_loss": -12.84600830078125, "global_step": 469599, "epoch": 2795} {"train_loss": -12.550736427307129, "global_step": 469600, "epoch": 2795} {"train_loss": -12.973352432250977, "global_step": 469601, "epoch": 2795} {"train_loss": -12.890857696533203, "global_step": 469602, "epoch": 2795} {"train_loss": -12.847322463989258, "global_step": 469603, "epoch": 2795} {"train_loss": -12.739952087402344, "global_step": 469604, "epoch": 2795} {"train_loss": -12.790689468383789, "global_step": 469605, "epoch": 2795} {"train_loss": -12.594144821166992, "global_step": 469606, "epoch": 2795} {"train_loss": -12.810794830322266, "global_step": 469607, "epoch": 2795} {"train_loss": -12.830574035644531, "global_step": 469608, "epoch": 2795} {"train_loss": -13.064973831176758, "global_step": 469609, "epoch": 2795} {"train_loss": -11.58869743347168, "global_step": 469610, "epoch": 2795} {"train_loss": -12.474740982055664, "global_step": 469611, "epoch": 2795} {"train_loss": -12.677816390991211, "global_step": 469612, "epoch": 2795} {"train_loss": -12.781075477600098, "global_step": 469613, "epoch": 2795} {"train_loss": -12.015432357788086, "global_step": 469614, "epoch": 2795} {"train_loss": -12.426097869873047, "global_step": 469615, "epoch": 2795} {"train_loss": -12.896368980407715, "global_step": 469616, "epoch": 2795} {"train_loss": -12.181941986083984, "global_step": 469617, "epoch": 2795} {"train_loss": -9.96679973602295, "global_step": 469618, "epoch": 2795} {"train_loss": -12.311973571777344, "global_step": 469619, "epoch": 2795} {"train_loss": -8.629167556762695, "global_step": 469620, "epoch": 2795} {"train_loss": -7.436692237854004, "global_step": 469621, "epoch": 2795} {"train_loss": -8.072525978088379, "global_step": 469622, "epoch": 2795} {"train_loss": -9.316110610961914, "global_step": 469623, "epoch": 2795} {"train_loss": -8.87423324584961, "global_step": 469624, "epoch": 2795} {"train_loss": -9.493603706359863, "global_step": 469625, "epoch": 2795} {"train_loss": -9.171799659729004, "global_step": 469626, "epoch": 2795} {"train_loss": -9.221025466918945, "global_step": 469627, "epoch": 2795} {"train_loss": -10.529775619506836, "global_step": 469628, "epoch": 2795} {"train_loss": -10.55866527557373, "global_step": 469629, "epoch": 2795} {"train_loss": -8.884834289550781, "global_step": 469630, "epoch": 2795} {"train_loss": -9.722375869750977, "global_step": 469631, "epoch": 2795} {"train_loss": -7.003174781799316, "global_step": 469632, "epoch": 2795} {"train_loss": -7.71044921875, "global_step": 469633, "epoch": 2795} {"train_loss": -7.117890357971191, "global_step": 469634, "epoch": 2795} {"train_loss": -7.4714460372924805, "global_step": 469635, "epoch": 2795} {"train_loss": -6.550053119659424, "global_step": 469636, "epoch": 2795} {"train_loss": -7.26792573928833, "global_step": 469637, "epoch": 2795} {"train_loss": -7.177221298217773, "global_step": 469638, "epoch": 2795} {"train_loss": -7.209311485290527, "global_step": 469639, "epoch": 2795} {"train_loss": -7.682270050048828, "global_step": 469640, "epoch": 2795} {"train_loss": -7.752007484436035, "global_step": 469641, "epoch": 2795} {"train_loss": -7.3245158195495605, "global_step": 469642, "epoch": 2795} {"train_loss": -7.567095756530762, "global_step": 469643, "epoch": 2795} {"train_loss": -7.95245885848999, "global_step": 469644, "epoch": 2795} {"train_loss": -8.121391296386719, "global_step": 469645, "epoch": 2795} {"train_loss": -8.35418701171875, "global_step": 469646, "epoch": 2795} {"train_loss": -8.249549865722656, "global_step": 469647, "epoch": 2795} {"train_loss": -8.135278701782227, "global_step": 469648, "epoch": 2795} {"train_loss": -8.504423141479492, "global_step": 469649, "epoch": 2795} {"train_loss": -8.927764892578125, "global_step": 469650, "epoch": 2795} {"train_loss": -8.606634140014648, "global_step": 469651, "epoch": 2795} {"train_loss": -8.535663604736328, "global_step": 469652, "epoch": 2795} {"train_loss": -8.81741714477539, "global_step": 469653, "epoch": 2795} {"train_loss": -9.012948989868164, "global_step": 469654, "epoch": 2795} {"train_loss": -9.402478218078613, "global_step": 469655, "epoch": 2795} {"train_loss": -9.292247772216797, "global_step": 469656, "epoch": 2795} {"train_loss": -10.403643608093262, "global_step": 469657, "epoch": 2795} {"train_loss": -9.842150688171387, "global_step": 469658, "epoch": 2795} {"train_loss": -9.951102256774902, "global_step": 469659, "epoch": 2795} {"train_loss": -10.097085952758789, "global_step": 469660, "epoch": 2795} {"train_loss": -10.547103881835938, "global_step": 469661, "epoch": 2795} {"train_loss": -10.652267456054688, "global_step": 469662, "epoch": 2795} {"train_loss": -10.427602767944336, "global_step": 469663, "epoch": 2795} {"train_loss": -10.257472038269043, "global_step": 469664, "epoch": 2795} {"train_loss": -10.760147094726562, "global_step": 469665, "epoch": 2795} {"train_loss": -10.641471862792969, "global_step": 469666, "epoch": 2795} {"train_loss": -10.969797134399414, "global_step": 469667, "epoch": 2795} {"train_loss": -10.936594009399414, "global_step": 469668, "epoch": 2795} {"train_loss": -11.152889251708984, "global_step": 469669, "epoch": 2795} {"train_loss": -11.30859088897705, "global_step": 469670, "epoch": 2795} {"train_loss": -11.168403625488281, "global_step": 469671, "epoch": 2795} {"train_loss": -11.669525146484375, "global_step": 469672, "epoch": 2795} {"train_loss": -11.41926383972168, "global_step": 469673, "epoch": 2795} {"train_loss": -11.521099090576172, "global_step": 469674, "epoch": 2795} {"train_loss": -11.664770126342773, "global_step": 469675, "epoch": 2795} {"train_loss": -11.588237762451172, "global_step": 469676, "epoch": 2795} {"train_loss": -11.821126937866211, "global_step": 469677, "epoch": 2795} {"train_loss": -11.879911422729492, "global_step": 469678, "epoch": 2795} {"train_loss": -11.891925811767578, "global_step": 469679, "epoch": 2795} {"train_loss": -12.05550479888916, "global_step": 469680, "epoch": 2795} {"train_loss": -12.119871139526367, "global_step": 469681, "epoch": 2795} {"train_loss": -12.045974731445312, "global_step": 469682, "epoch": 2795} {"train_loss": -11.894858360290527, "global_step": 469683, "epoch": 2795} {"train_loss": -12.077714920043945, "global_step": 469684, "epoch": 2795} {"train_loss": -12.022417068481445, "global_step": 469685, "epoch": 2795} {"train_loss": -12.00285530090332, "global_step": 469686, "epoch": 2795} {"train_loss": -12.140619277954102, "global_step": 469687, "epoch": 2795} {"train_loss": -12.092384338378906, "global_step": 469688, "epoch": 2795} {"train_loss": -12.307228088378906, "global_step": 469689, "epoch": 2795} {"train_loss": -12.416261672973633, "global_step": 469690, "epoch": 2795} {"train_loss": -12.261899948120117, "global_step": 469691, "epoch": 2795} {"train_loss": -12.374259948730469, "global_step": 469692, "epoch": 2795} {"train_loss": -12.331750869750977, "global_step": 469693, "epoch": 2795} {"train_loss": -12.17611312866211, "global_step": 469694, "epoch": 2795} {"train_loss": -12.538131713867188, "global_step": 469695, "epoch": 2795} {"train_loss": -12.404884338378906, "global_step": 469696, "epoch": 2795} {"train_loss": -12.292913436889648, "global_step": 469697, "epoch": 2795} {"train_loss": -12.468727111816406, "global_step": 469698, "epoch": 2795} {"train_loss": -12.556410789489746, "global_step": 469699, "epoch": 2795} {"train_loss": -12.567039489746094, "global_step": 469700, "epoch": 2795} {"train_loss": -12.381488800048828, "global_step": 469701, "epoch": 2795} {"train_loss": -12.472503662109375, "global_step": 469702, "epoch": 2795} {"train_loss": -12.447153091430664, "global_step": 469703, "epoch": 2795} {"train_loss": -12.424956321716309, "global_step": 469704, "epoch": 2795} {"train_loss": -12.290569305419922, "global_step": 469705, "epoch": 2795} {"train_loss": -12.410593032836914, "global_step": 469706, "epoch": 2795} {"train_loss": -12.387632369995117, "global_step": 469707, "epoch": 2795} {"train_loss": -12.22199821472168, "global_step": 469708, "epoch": 2795} {"train_loss": -12.497172355651855, "global_step": 469709, "epoch": 2795} {"train_loss": -12.289396286010742, "global_step": 469710, "epoch": 2795} {"train_loss": -12.578695297241211, "global_step": 469711, "epoch": 2795} {"train_loss": -12.47714614868164, "global_step": 469712, "epoch": 2795} {"train_loss": -12.558833122253418, "global_step": 469713, "epoch": 2795} {"train_loss": -12.353994369506836, "global_step": 469714, "epoch": 2795} {"train_loss": -12.406070709228516, "global_step": 469715, "epoch": 2795} {"train_loss": -12.618618965148926, "global_step": 469716, "epoch": 2795} {"train_loss": -12.478221893310547, "global_step": 469717, "epoch": 2795} {"train_loss": -12.459220886230469, "global_step": 469718, "epoch": 2795} {"train_loss": -12.598260879516602, "global_step": 469719, "epoch": 2795} {"train_loss": -12.597856521606445, "global_step": 469720, "epoch": 2795} {"train_loss": -12.593807220458984, "global_step": 469721, "epoch": 2795} {"train_loss": -12.306697845458984, "global_step": 469722, "epoch": 2795} {"train_loss": -12.055334091186523, "global_step": 469723, "epoch": 2795} {"train_loss": -12.484169006347656, "global_step": 469724, "epoch": 2795} {"train_loss": -12.74232292175293, "global_step": 469725, "epoch": 2795} {"train_loss": -12.584599494934082, "global_step": 469726, "epoch": 2795} {"train_loss": -11.423324794996352, "global_step": 469727, "epoch": 2795, "val_loss": 316971.09375, "train_action_mse_error": 1.9530807733535767} {"train_loss": -12.671235084533691, "global_step": 469728, "epoch": 2796} {"train_loss": -12.63072681427002, "global_step": 469729, "epoch": 2796} {"train_loss": -12.75794792175293, "global_step": 469730, "epoch": 2796} {"train_loss": -12.695487022399902, "global_step": 469731, "epoch": 2796} {"train_loss": -12.670989990234375, "global_step": 469732, "epoch": 2796} {"train_loss": -12.69125747680664, "global_step": 469733, "epoch": 2796} {"train_loss": -12.480463981628418, "global_step": 469734, "epoch": 2796} {"train_loss": -12.221683502197266, "global_step": 469735, "epoch": 2796} {"train_loss": -12.365234375, "global_step": 469736, "epoch": 2796} {"train_loss": -12.726058959960938, "global_step": 469737, "epoch": 2796} {"train_loss": -12.447399139404297, "global_step": 469738, "epoch": 2796} {"train_loss": -12.510797500610352, "global_step": 469739, "epoch": 2796} {"train_loss": -12.895822525024414, "global_step": 469740, "epoch": 2796} {"train_loss": -12.054561614990234, "global_step": 469741, "epoch": 2796} {"train_loss": -11.826072692871094, "global_step": 469742, "epoch": 2796} {"train_loss": -12.754924774169922, "global_step": 469743, "epoch": 2796} {"train_loss": -11.49614143371582, "global_step": 469744, "epoch": 2796} {"train_loss": -12.733673095703125, "global_step": 469745, "epoch": 2796} {"train_loss": -12.185376167297363, "global_step": 469746, "epoch": 2796} {"train_loss": -12.538724899291992, "global_step": 469747, "epoch": 2796} {"train_loss": -12.677295684814453, "global_step": 469748, "epoch": 2796} {"train_loss": -11.367557525634766, "global_step": 469749, "epoch": 2796} {"train_loss": -12.08615493774414, "global_step": 469750, "epoch": 2796} {"train_loss": -12.495219230651855, "global_step": 469751, "epoch": 2796} {"train_loss": -11.984979629516602, "global_step": 469752, "epoch": 2796} {"train_loss": -12.426495552062988, "global_step": 469753, "epoch": 2796} {"train_loss": -12.799677848815918, "global_step": 469754, "epoch": 2796} {"train_loss": -12.539825439453125, "global_step": 469755, "epoch": 2796} {"train_loss": -12.530525207519531, "global_step": 469756, "epoch": 2796} {"train_loss": -12.420937538146973, "global_step": 469757, "epoch": 2796} {"train_loss": -12.322041511535645, "global_step": 469758, "epoch": 2796} {"train_loss": -12.434364318847656, "global_step": 469759, "epoch": 2796} {"train_loss": -12.66360092163086, "global_step": 469760, "epoch": 2796} {"train_loss": -12.429943084716797, "global_step": 469761, "epoch": 2796} {"train_loss": -12.702714920043945, "global_step": 469762, "epoch": 2796} {"train_loss": -12.402402877807617, "global_step": 469763, "epoch": 2796} {"train_loss": -12.230998039245605, "global_step": 469764, "epoch": 2796} {"train_loss": -12.847017288208008, "global_step": 469765, "epoch": 2796} {"train_loss": -12.082985877990723, "global_step": 469766, "epoch": 2796} {"train_loss": -12.27065658569336, "global_step": 469767, "epoch": 2796} {"train_loss": -12.737757682800293, "global_step": 469768, "epoch": 2796} {"train_loss": -12.237472534179688, "global_step": 469769, "epoch": 2796} {"train_loss": -12.429779052734375, "global_step": 469770, "epoch": 2796} {"train_loss": -12.845476150512695, "global_step": 469771, "epoch": 2796} {"train_loss": -11.932550430297852, "global_step": 469772, "epoch": 2796} {"train_loss": -12.369688034057617, "global_step": 469773, "epoch": 2796} {"train_loss": -12.397130012512207, "global_step": 469774, "epoch": 2796} {"train_loss": -12.692808151245117, "global_step": 469775, "epoch": 2796} {"train_loss": -12.806791305541992, "global_step": 469776, "epoch": 2796} {"train_loss": -12.28188705444336, "global_step": 469777, "epoch": 2796} {"train_loss": -12.805904388427734, "global_step": 469778, "epoch": 2796} {"train_loss": -12.604982376098633, "global_step": 469779, "epoch": 2796} {"train_loss": -12.948650360107422, "global_step": 469780, "epoch": 2796} {"train_loss": -12.495790481567383, "global_step": 469781, "epoch": 2796} {"train_loss": -12.708724975585938, "global_step": 469782, "epoch": 2796} {"train_loss": -12.805559158325195, "global_step": 469783, "epoch": 2796} {"train_loss": -12.663542747497559, "global_step": 469784, "epoch": 2796} {"train_loss": -12.686494827270508, "global_step": 469785, "epoch": 2796} {"train_loss": -12.481679916381836, "global_step": 469786, "epoch": 2796} {"train_loss": -12.99674129486084, "global_step": 469787, "epoch": 2796} {"train_loss": -12.476841926574707, "global_step": 469788, "epoch": 2796} {"train_loss": -12.147968292236328, "global_step": 469789, "epoch": 2796} {"train_loss": -11.36551284790039, "global_step": 469790, "epoch": 2796} {"train_loss": -12.491636276245117, "global_step": 469791, "epoch": 2796} {"train_loss": -11.273685455322266, "global_step": 469792, "epoch": 2796} {"train_loss": -12.076394081115723, "global_step": 469793, "epoch": 2796} {"train_loss": -9.445245742797852, "global_step": 469794, "epoch": 2796} {"train_loss": -8.639493942260742, "global_step": 469795, "epoch": 2796} {"train_loss": -9.965165138244629, "global_step": 469796, "epoch": 2796} {"train_loss": -10.354412078857422, "global_step": 469797, "epoch": 2796} {"train_loss": -10.443994522094727, "global_step": 469798, "epoch": 2796} {"train_loss": -9.409796714782715, "global_step": 469799, "epoch": 2796} {"train_loss": -9.629293441772461, "global_step": 469800, "epoch": 2796} {"train_loss": -10.140732765197754, "global_step": 469801, "epoch": 2796} {"train_loss": -10.45347785949707, "global_step": 469802, "epoch": 2796} {"train_loss": -9.481605529785156, "global_step": 469803, "epoch": 2796} {"train_loss": -9.812278747558594, "global_step": 469804, "epoch": 2796} {"train_loss": -9.801843643188477, "global_step": 469805, "epoch": 2796} {"train_loss": -9.659728050231934, "global_step": 469806, "epoch": 2796} {"train_loss": -10.734635353088379, "global_step": 469807, "epoch": 2796} {"train_loss": -9.603687286376953, "global_step": 469808, "epoch": 2796} {"train_loss": -10.279582023620605, "global_step": 469809, "epoch": 2796} {"train_loss": -9.319759368896484, "global_step": 469810, "epoch": 2796} {"train_loss": -9.516700744628906, "global_step": 469811, "epoch": 2796} {"train_loss": -10.181869506835938, "global_step": 469812, "epoch": 2796} {"train_loss": -9.99681568145752, "global_step": 469813, "epoch": 2796} {"train_loss": -10.538322448730469, "global_step": 469814, "epoch": 2796} {"train_loss": -9.745718955993652, "global_step": 469815, "epoch": 2796} {"train_loss": -9.894857406616211, "global_step": 469816, "epoch": 2796} {"train_loss": -10.721939086914062, "global_step": 469817, "epoch": 2796} {"train_loss": -10.632781028747559, "global_step": 469818, "epoch": 2796} {"train_loss": -10.185050964355469, "global_step": 469819, "epoch": 2796} {"train_loss": -11.32533073425293, "global_step": 469820, "epoch": 2796} {"train_loss": -10.835819244384766, "global_step": 469821, "epoch": 2796} {"train_loss": -10.742630004882812, "global_step": 469822, "epoch": 2796} {"train_loss": -10.751728057861328, "global_step": 469823, "epoch": 2796} {"train_loss": -11.463441848754883, "global_step": 469824, "epoch": 2796} {"train_loss": -10.808660507202148, "global_step": 469825, "epoch": 2796} {"train_loss": -11.805353164672852, "global_step": 469826, "epoch": 2796} {"train_loss": -11.545980453491211, "global_step": 469827, "epoch": 2796} {"train_loss": -11.571111679077148, "global_step": 469828, "epoch": 2796} {"train_loss": -11.75893783569336, "global_step": 469829, "epoch": 2796} {"train_loss": -11.279203414916992, "global_step": 469830, "epoch": 2796} {"train_loss": -11.9365816116333, "global_step": 469831, "epoch": 2796} {"train_loss": -11.739376068115234, "global_step": 469832, "epoch": 2796} {"train_loss": -11.832324981689453, "global_step": 469833, "epoch": 2796} {"train_loss": -12.105931282043457, "global_step": 469834, "epoch": 2796} {"train_loss": -11.403874397277832, "global_step": 469835, "epoch": 2796} {"train_loss": -12.259520530700684, "global_step": 469836, "epoch": 2796} {"train_loss": -11.783016204833984, "global_step": 469837, "epoch": 2796} {"train_loss": -11.78788948059082, "global_step": 469838, "epoch": 2796} {"train_loss": -12.219390869140625, "global_step": 469839, "epoch": 2796} {"train_loss": -11.770417213439941, "global_step": 469840, "epoch": 2796} {"train_loss": -12.27194881439209, "global_step": 469841, "epoch": 2796} {"train_loss": -12.200691223144531, "global_step": 469842, "epoch": 2796} {"train_loss": -11.934502601623535, "global_step": 469843, "epoch": 2796} {"train_loss": -12.212510108947754, "global_step": 469844, "epoch": 2796} {"train_loss": -11.812576293945312, "global_step": 469845, "epoch": 2796} {"train_loss": -11.86639404296875, "global_step": 469846, "epoch": 2796} {"train_loss": -11.632335662841797, "global_step": 469847, "epoch": 2796} {"train_loss": -12.11122989654541, "global_step": 469848, "epoch": 2796} {"train_loss": -12.365137100219727, "global_step": 469849, "epoch": 2796} {"train_loss": -12.308128356933594, "global_step": 469850, "epoch": 2796} {"train_loss": -12.247093200683594, "global_step": 469851, "epoch": 2796} {"train_loss": -12.226845741271973, "global_step": 469852, "epoch": 2796} {"train_loss": -12.634023666381836, "global_step": 469853, "epoch": 2796} {"train_loss": -11.764984130859375, "global_step": 469854, "epoch": 2796} {"train_loss": -12.280884742736816, "global_step": 469855, "epoch": 2796} {"train_loss": -12.155826568603516, "global_step": 469856, "epoch": 2796} {"train_loss": -12.237541198730469, "global_step": 469857, "epoch": 2796} {"train_loss": -12.496894836425781, "global_step": 469858, "epoch": 2796} {"train_loss": -12.541566848754883, "global_step": 469859, "epoch": 2796} {"train_loss": -12.416683197021484, "global_step": 469860, "epoch": 2796} {"train_loss": -12.60954761505127, "global_step": 469861, "epoch": 2796} {"train_loss": -12.48481559753418, "global_step": 469862, "epoch": 2796} {"train_loss": -12.55558967590332, "global_step": 469863, "epoch": 2796} {"train_loss": -12.478726387023926, "global_step": 469864, "epoch": 2796} {"train_loss": -12.480935096740723, "global_step": 469865, "epoch": 2796} {"train_loss": -12.539446830749512, "global_step": 469866, "epoch": 2796} {"train_loss": -12.229686737060547, "global_step": 469867, "epoch": 2796} {"train_loss": -12.415121078491211, "global_step": 469868, "epoch": 2796} {"train_loss": -12.445287704467773, "global_step": 469869, "epoch": 2796} {"train_loss": -12.401419639587402, "global_step": 469870, "epoch": 2796} {"train_loss": -12.445764541625977, "global_step": 469871, "epoch": 2796} {"train_loss": -12.520797729492188, "global_step": 469872, "epoch": 2796} {"train_loss": -12.667133331298828, "global_step": 469873, "epoch": 2796} {"train_loss": -12.543964385986328, "global_step": 469874, "epoch": 2796} {"train_loss": -12.778282165527344, "global_step": 469875, "epoch": 2796} {"train_loss": -12.512796401977539, "global_step": 469876, "epoch": 2796} {"train_loss": -12.710309982299805, "global_step": 469877, "epoch": 2796} {"train_loss": -12.568893432617188, "global_step": 469878, "epoch": 2796} {"train_loss": -12.72223949432373, "global_step": 469879, "epoch": 2796} {"train_loss": -12.529743194580078, "global_step": 469880, "epoch": 2796} {"train_loss": -12.606510162353516, "global_step": 469881, "epoch": 2796} {"train_loss": -12.429302215576172, "global_step": 469882, "epoch": 2796} {"train_loss": -12.469491958618164, "global_step": 469883, "epoch": 2796} {"train_loss": -12.757469177246094, "global_step": 469884, "epoch": 2796} {"train_loss": -12.436513900756836, "global_step": 469885, "epoch": 2796} {"train_loss": -12.518814086914062, "global_step": 469886, "epoch": 2796} {"train_loss": -12.862740516662598, "global_step": 469887, "epoch": 2796} {"train_loss": -12.707185745239258, "global_step": 469888, "epoch": 2796} {"train_loss": -12.639619827270508, "global_step": 469889, "epoch": 2796} {"train_loss": -12.711033821105957, "global_step": 469890, "epoch": 2796} {"train_loss": -12.669319152832031, "global_step": 469891, "epoch": 2796} {"train_loss": -12.782712936401367, "global_step": 469892, "epoch": 2796} {"train_loss": -12.652624130249023, "global_step": 469893, "epoch": 2796} {"train_loss": -12.57430362701416, "global_step": 469894, "epoch": 2796} {"train_loss": -11.940902437482562, "global_step": 469895, "epoch": 2796, "val_loss": 313980.46875} {"train_loss": -12.593013763427734, "global_step": 469896, "epoch": 2797} {"train_loss": -12.841567993164062, "global_step": 469897, "epoch": 2797} {"train_loss": -12.687234878540039, "global_step": 469898, "epoch": 2797} {"train_loss": -12.820295333862305, "global_step": 469899, "epoch": 2797} {"train_loss": -12.739179611206055, "global_step": 469900, "epoch": 2797} {"train_loss": -12.937187194824219, "global_step": 469901, "epoch": 2797} {"train_loss": -12.809589385986328, "global_step": 469902, "epoch": 2797} {"train_loss": -12.941522598266602, "global_step": 469903, "epoch": 2797} {"train_loss": -12.715078353881836, "global_step": 469904, "epoch": 2797} {"train_loss": -12.68376350402832, "global_step": 469905, "epoch": 2797} {"train_loss": -12.921314239501953, "global_step": 469906, "epoch": 2797} {"train_loss": -12.728483200073242, "global_step": 469907, "epoch": 2797} {"train_loss": -12.921823501586914, "global_step": 469908, "epoch": 2797} {"train_loss": -12.872038841247559, "global_step": 469909, "epoch": 2797} {"train_loss": -12.732754707336426, "global_step": 469910, "epoch": 2797} {"train_loss": -12.704977035522461, "global_step": 469911, "epoch": 2797} {"train_loss": -12.867629051208496, "global_step": 469912, "epoch": 2797} {"train_loss": -12.926177978515625, "global_step": 469913, "epoch": 2797} {"train_loss": -12.803094863891602, "global_step": 469914, "epoch": 2797} {"train_loss": -12.91263198852539, "global_step": 469915, "epoch": 2797} {"train_loss": -12.744563102722168, "global_step": 469916, "epoch": 2797} {"train_loss": -12.870359420776367, "global_step": 469917, "epoch": 2797} {"train_loss": -12.839494705200195, "global_step": 469918, "epoch": 2797} {"train_loss": -12.859535217285156, "global_step": 469919, "epoch": 2797} {"train_loss": -12.625951766967773, "global_step": 469920, "epoch": 2797} {"train_loss": -12.979177474975586, "global_step": 469921, "epoch": 2797} {"train_loss": -12.94919490814209, "global_step": 469922, "epoch": 2797} {"train_loss": -12.84316635131836, "global_step": 469923, "epoch": 2797} {"train_loss": -12.754507064819336, "global_step": 469924, "epoch": 2797} {"train_loss": -12.33953857421875, "global_step": 469925, "epoch": 2797} {"train_loss": -12.595941543579102, "global_step": 469926, "epoch": 2797} {"train_loss": -12.90301513671875, "global_step": 469927, "epoch": 2797} {"train_loss": -12.722755432128906, "global_step": 469928, "epoch": 2797} {"train_loss": -12.69550609588623, "global_step": 469929, "epoch": 2797} {"train_loss": -12.657464027404785, "global_step": 469930, "epoch": 2797} {"train_loss": -12.659116744995117, "global_step": 469931, "epoch": 2797} {"train_loss": -12.776019096374512, "global_step": 469932, "epoch": 2797} {"train_loss": -12.78909969329834, "global_step": 469933, "epoch": 2797} {"train_loss": -12.733535766601562, "global_step": 469934, "epoch": 2797} {"train_loss": -12.633207321166992, "global_step": 469935, "epoch": 2797} {"train_loss": -11.820094108581543, "global_step": 469936, "epoch": 2797} {"train_loss": -11.931376457214355, "global_step": 469937, "epoch": 2797} {"train_loss": -12.727476119995117, "global_step": 469938, "epoch": 2797} {"train_loss": -12.767539978027344, "global_step": 469939, "epoch": 2797} {"train_loss": -11.130766868591309, "global_step": 469940, "epoch": 2797} {"train_loss": -11.691768646240234, "global_step": 469941, "epoch": 2797} {"train_loss": -12.013690948486328, "global_step": 469942, "epoch": 2797} {"train_loss": -11.196134567260742, "global_step": 469943, "epoch": 2797} {"train_loss": -11.933563232421875, "global_step": 469944, "epoch": 2797} {"train_loss": -11.044059753417969, "global_step": 469945, "epoch": 2797} {"train_loss": -11.022184371948242, "global_step": 469946, "epoch": 2797} {"train_loss": -12.354623794555664, "global_step": 469947, "epoch": 2797} {"train_loss": -11.46822452545166, "global_step": 469948, "epoch": 2797} {"train_loss": -11.450803756713867, "global_step": 469949, "epoch": 2797} {"train_loss": -12.023263931274414, "global_step": 469950, "epoch": 2797} {"train_loss": -11.924610137939453, "global_step": 469951, "epoch": 2797} {"train_loss": -11.260730743408203, "global_step": 469952, "epoch": 2797} {"train_loss": -12.443456649780273, "global_step": 469953, "epoch": 2797} {"train_loss": -11.302286148071289, "global_step": 469954, "epoch": 2797} {"train_loss": -11.235860824584961, "global_step": 469955, "epoch": 2797} {"train_loss": -11.697147369384766, "global_step": 469956, "epoch": 2797} {"train_loss": -10.500776290893555, "global_step": 469957, "epoch": 2797} {"train_loss": -10.426493644714355, "global_step": 469958, "epoch": 2797} {"train_loss": -11.234230041503906, "global_step": 469959, "epoch": 2797} {"train_loss": -10.766853332519531, "global_step": 469960, "epoch": 2797} {"train_loss": -11.870044708251953, "global_step": 469961, "epoch": 2797} {"train_loss": -10.637404441833496, "global_step": 469962, "epoch": 2797} {"train_loss": -12.101668357849121, "global_step": 469963, "epoch": 2797} {"train_loss": -10.431377410888672, "global_step": 469964, "epoch": 2797} {"train_loss": -10.276809692382812, "global_step": 469965, "epoch": 2797} {"train_loss": -11.712508201599121, "global_step": 469966, "epoch": 2797} {"train_loss": -9.76700210571289, "global_step": 469967, "epoch": 2797} {"train_loss": -11.668340682983398, "global_step": 469968, "epoch": 2797} {"train_loss": -10.942245483398438, "global_step": 469969, "epoch": 2797} {"train_loss": -11.689064025878906, "global_step": 469970, "epoch": 2797} {"train_loss": -10.992913246154785, "global_step": 469971, "epoch": 2797} {"train_loss": -11.328530311584473, "global_step": 469972, "epoch": 2797} {"train_loss": -11.151159286499023, "global_step": 469973, "epoch": 2797} {"train_loss": -11.230101585388184, "global_step": 469974, "epoch": 2797} {"train_loss": -11.503763198852539, "global_step": 469975, "epoch": 2797} {"train_loss": -10.980910301208496, "global_step": 469976, "epoch": 2797} {"train_loss": -12.062199592590332, "global_step": 469977, "epoch": 2797} {"train_loss": -11.20806884765625, "global_step": 469978, "epoch": 2797} {"train_loss": -12.108470916748047, "global_step": 469979, "epoch": 2797} {"train_loss": -11.141287803649902, "global_step": 469980, "epoch": 2797} {"train_loss": -11.701180458068848, "global_step": 469981, "epoch": 2797} {"train_loss": -11.639017105102539, "global_step": 469982, "epoch": 2797} {"train_loss": -12.024645805358887, "global_step": 469983, "epoch": 2797} {"train_loss": -11.602102279663086, "global_step": 469984, "epoch": 2797} {"train_loss": -11.592836380004883, "global_step": 469985, "epoch": 2797} {"train_loss": -11.352368354797363, "global_step": 469986, "epoch": 2797} {"train_loss": -12.209701538085938, "global_step": 469987, "epoch": 2797} {"train_loss": -11.539684295654297, "global_step": 469988, "epoch": 2797} {"train_loss": -12.203712463378906, "global_step": 469989, "epoch": 2797} {"train_loss": -11.416248321533203, "global_step": 469990, "epoch": 2797} {"train_loss": -11.246175765991211, "global_step": 469991, "epoch": 2797} {"train_loss": -11.18316650390625, "global_step": 469992, "epoch": 2797} {"train_loss": -11.494680404663086, "global_step": 469993, "epoch": 2797} {"train_loss": -10.788286209106445, "global_step": 469994, "epoch": 2797} {"train_loss": -12.044187545776367, "global_step": 469995, "epoch": 2797} {"train_loss": -11.61111831665039, "global_step": 469996, "epoch": 2797} {"train_loss": -11.25229263305664, "global_step": 469997, "epoch": 2797} {"train_loss": -11.650094985961914, "global_step": 469998, "epoch": 2797} {"train_loss": -11.638601303100586, "global_step": 469999, "epoch": 2797} {"train_loss": -11.142705917358398, "global_step": 470000, "epoch": 2797} {"train_loss": -11.73542594909668, "global_step": 470001, "epoch": 2797} {"train_loss": -11.33895492553711, "global_step": 470002, "epoch": 2797} {"train_loss": -10.963062286376953, "global_step": 470003, "epoch": 2797} {"train_loss": -11.780893325805664, "global_step": 470004, "epoch": 2797} {"train_loss": -11.76341438293457, "global_step": 470005, "epoch": 2797} {"train_loss": -10.98089599609375, "global_step": 470006, "epoch": 2797} {"train_loss": -11.936480522155762, "global_step": 470007, "epoch": 2797} {"train_loss": -12.01553726196289, "global_step": 470008, "epoch": 2797} {"train_loss": -11.721412658691406, "global_step": 470009, "epoch": 2797} {"train_loss": -12.151495933532715, "global_step": 470010, "epoch": 2797} {"train_loss": -12.010490417480469, "global_step": 470011, "epoch": 2797} {"train_loss": -12.02083969116211, "global_step": 470012, "epoch": 2797} {"train_loss": -12.311119079589844, "global_step": 470013, "epoch": 2797} {"train_loss": -12.061470031738281, "global_step": 470014, "epoch": 2797} {"train_loss": -12.519472122192383, "global_step": 470015, "epoch": 2797} {"train_loss": -12.135614395141602, "global_step": 470016, "epoch": 2797} {"train_loss": -12.369150161743164, "global_step": 470017, "epoch": 2797} {"train_loss": -12.40041732788086, "global_step": 470018, "epoch": 2797} {"train_loss": -12.468324661254883, "global_step": 470019, "epoch": 2797} {"train_loss": -12.22606372833252, "global_step": 470020, "epoch": 2797} {"train_loss": -12.390649795532227, "global_step": 470021, "epoch": 2797} {"train_loss": -12.466460227966309, "global_step": 470022, "epoch": 2797} {"train_loss": -12.459933280944824, "global_step": 470023, "epoch": 2797} {"train_loss": -12.3202486038208, "global_step": 470024, "epoch": 2797} {"train_loss": -12.296527862548828, "global_step": 470025, "epoch": 2797} {"train_loss": -11.831329345703125, "global_step": 470026, "epoch": 2797} {"train_loss": -12.088542938232422, "global_step": 470027, "epoch": 2797} {"train_loss": -12.177070617675781, "global_step": 470028, "epoch": 2797} {"train_loss": -12.03567886352539, "global_step": 470029, "epoch": 2797} {"train_loss": -12.289277076721191, "global_step": 470030, "epoch": 2797} {"train_loss": -12.182804107666016, "global_step": 470031, "epoch": 2797} {"train_loss": -12.030064582824707, "global_step": 470032, "epoch": 2797} {"train_loss": -12.237617492675781, "global_step": 470033, "epoch": 2797} {"train_loss": -12.450738906860352, "global_step": 470034, "epoch": 2797} {"train_loss": -12.145270347595215, "global_step": 470035, "epoch": 2797} {"train_loss": -12.66779899597168, "global_step": 470036, "epoch": 2797} {"train_loss": -12.27716064453125, "global_step": 470037, "epoch": 2797} {"train_loss": -12.496628761291504, "global_step": 470038, "epoch": 2797} {"train_loss": -12.31826114654541, "global_step": 470039, "epoch": 2797} {"train_loss": -12.259842872619629, "global_step": 470040, "epoch": 2797} {"train_loss": -12.674537658691406, "global_step": 470041, "epoch": 2797} {"train_loss": -12.04369831085205, "global_step": 470042, "epoch": 2797} {"train_loss": -12.591028213500977, "global_step": 470043, "epoch": 2797} {"train_loss": -12.302513122558594, "global_step": 470044, "epoch": 2797} {"train_loss": -12.230813980102539, "global_step": 470045, "epoch": 2797} {"train_loss": -12.390209197998047, "global_step": 470046, "epoch": 2797} {"train_loss": -12.641961097717285, "global_step": 470047, "epoch": 2797} {"train_loss": -12.142950057983398, "global_step": 470048, "epoch": 2797} {"train_loss": -12.186363220214844, "global_step": 470049, "epoch": 2797} {"train_loss": -12.348077774047852, "global_step": 470050, "epoch": 2797} {"train_loss": -11.872990608215332, "global_step": 470051, "epoch": 2797} {"train_loss": -12.040849685668945, "global_step": 470052, "epoch": 2797} {"train_loss": -12.5184326171875, "global_step": 470053, "epoch": 2797} {"train_loss": -12.476622581481934, "global_step": 470054, "epoch": 2797} {"train_loss": -11.5426025390625, "global_step": 470055, "epoch": 2797} {"train_loss": -12.088671684265137, "global_step": 470056, "epoch": 2797} {"train_loss": -12.044147491455078, "global_step": 470057, "epoch": 2797} {"train_loss": -10.742962837219238, "global_step": 470058, "epoch": 2797} {"train_loss": -11.868404388427734, "global_step": 470059, "epoch": 2797} {"train_loss": -10.607973098754883, "global_step": 470060, "epoch": 2797} {"train_loss": -11.25881576538086, "global_step": 470061, "epoch": 2797} {"train_loss": -11.011741638183594, "global_step": 470062, "epoch": 2797} {"train_loss": -11.99855243024372, "global_step": 470063, "epoch": 2797, "val_loss": 318174.71875} {"train_loss": -11.915338516235352, "global_step": 470064, "epoch": 2798} {"train_loss": -11.647140502929688, "global_step": 470065, "epoch": 2798} {"train_loss": -11.748327255249023, "global_step": 470066, "epoch": 2798} {"train_loss": -11.558263778686523, "global_step": 470067, "epoch": 2798} {"train_loss": -11.359107971191406, "global_step": 470068, "epoch": 2798} {"train_loss": -12.00810432434082, "global_step": 470069, "epoch": 2798} {"train_loss": -10.763629913330078, "global_step": 470070, "epoch": 2798} {"train_loss": -12.314308166503906, "global_step": 470071, "epoch": 2798} {"train_loss": -11.531288146972656, "global_step": 470072, "epoch": 2798} {"train_loss": -11.352373123168945, "global_step": 470073, "epoch": 2798} {"train_loss": -11.149640083312988, "global_step": 470074, "epoch": 2798} {"train_loss": -11.209127426147461, "global_step": 470075, "epoch": 2798} {"train_loss": -11.046507835388184, "global_step": 470076, "epoch": 2798} {"train_loss": -11.229466438293457, "global_step": 470077, "epoch": 2798} {"train_loss": -10.410441398620605, "global_step": 470078, "epoch": 2798} {"train_loss": -12.525805473327637, "global_step": 470079, "epoch": 2798} {"train_loss": -11.074865341186523, "global_step": 470080, "epoch": 2798} {"train_loss": -11.364107131958008, "global_step": 470081, "epoch": 2798} {"train_loss": -11.454734802246094, "global_step": 470082, "epoch": 2798} {"train_loss": -11.44038200378418, "global_step": 470083, "epoch": 2798} {"train_loss": -11.531158447265625, "global_step": 470084, "epoch": 2798} {"train_loss": -11.043437957763672, "global_step": 470085, "epoch": 2798} {"train_loss": -10.987682342529297, "global_step": 470086, "epoch": 2798} {"train_loss": -11.925683975219727, "global_step": 470087, "epoch": 2798} {"train_loss": -10.47872543334961, "global_step": 470088, "epoch": 2798} {"train_loss": -10.83238410949707, "global_step": 470089, "epoch": 2798} {"train_loss": -10.880353927612305, "global_step": 470090, "epoch": 2798} {"train_loss": -10.551336288452148, "global_step": 470091, "epoch": 2798} {"train_loss": -10.31882095336914, "global_step": 470092, "epoch": 2798} {"train_loss": -11.433113098144531, "global_step": 470093, "epoch": 2798} {"train_loss": -10.787761688232422, "global_step": 470094, "epoch": 2798} {"train_loss": -9.593236923217773, "global_step": 470095, "epoch": 2798} {"train_loss": -9.815078735351562, "global_step": 470096, "epoch": 2798} {"train_loss": -11.846386909484863, "global_step": 470097, "epoch": 2798} {"train_loss": -9.963630676269531, "global_step": 470098, "epoch": 2798} {"train_loss": -10.524961471557617, "global_step": 470099, "epoch": 2798} {"train_loss": -9.342249870300293, "global_step": 470100, "epoch": 2798} {"train_loss": -9.852295875549316, "global_step": 470101, "epoch": 2798} {"train_loss": -11.028223037719727, "global_step": 470102, "epoch": 2798} {"train_loss": -9.419974327087402, "global_step": 470103, "epoch": 2798} {"train_loss": -11.020423889160156, "global_step": 470104, "epoch": 2798} {"train_loss": -9.899002075195312, "global_step": 470105, "epoch": 2798} {"train_loss": -9.92780590057373, "global_step": 470106, "epoch": 2798} {"train_loss": -10.461000442504883, "global_step": 470107, "epoch": 2798} {"train_loss": -10.785204887390137, "global_step": 470108, "epoch": 2798} {"train_loss": -11.655721664428711, "global_step": 470109, "epoch": 2798} {"train_loss": -10.759570121765137, "global_step": 470110, "epoch": 2798} {"train_loss": -11.471050262451172, "global_step": 470111, "epoch": 2798} {"train_loss": -11.178018569946289, "global_step": 470112, "epoch": 2798} {"train_loss": -11.265704154968262, "global_step": 470113, "epoch": 2798} {"train_loss": -11.660163879394531, "global_step": 470114, "epoch": 2798} {"train_loss": -11.362311363220215, "global_step": 470115, "epoch": 2798} {"train_loss": -11.020275115966797, "global_step": 470116, "epoch": 2798} {"train_loss": -11.229158401489258, "global_step": 470117, "epoch": 2798} {"train_loss": -11.454047203063965, "global_step": 470118, "epoch": 2798} {"train_loss": -11.438604354858398, "global_step": 470119, "epoch": 2798} {"train_loss": -12.166210174560547, "global_step": 470120, "epoch": 2798} {"train_loss": -11.77983570098877, "global_step": 470121, "epoch": 2798} {"train_loss": -11.51300048828125, "global_step": 470122, "epoch": 2798} {"train_loss": -12.070513725280762, "global_step": 470123, "epoch": 2798} {"train_loss": -11.783222198486328, "global_step": 470124, "epoch": 2798} {"train_loss": -12.225061416625977, "global_step": 470125, "epoch": 2798} {"train_loss": -12.182110786437988, "global_step": 470126, "epoch": 2798} {"train_loss": -12.132935523986816, "global_step": 470127, "epoch": 2798} {"train_loss": -12.057638168334961, "global_step": 470128, "epoch": 2798} {"train_loss": -12.104820251464844, "global_step": 470129, "epoch": 2798} {"train_loss": -12.152732849121094, "global_step": 470130, "epoch": 2798} {"train_loss": -12.305553436279297, "global_step": 470131, "epoch": 2798} {"train_loss": -12.147012710571289, "global_step": 470132, "epoch": 2798} {"train_loss": -12.435319900512695, "global_step": 470133, "epoch": 2798} {"train_loss": -12.364147186279297, "global_step": 470134, "epoch": 2798} {"train_loss": -12.340751647949219, "global_step": 470135, "epoch": 2798} {"train_loss": -12.39864730834961, "global_step": 470136, "epoch": 2798} {"train_loss": -12.391876220703125, "global_step": 470137, "epoch": 2798} {"train_loss": -12.328941345214844, "global_step": 470138, "epoch": 2798} {"train_loss": -12.224644660949707, "global_step": 470139, "epoch": 2798} {"train_loss": -12.328900337219238, "global_step": 470140, "epoch": 2798} {"train_loss": -12.289761543273926, "global_step": 470141, "epoch": 2798} {"train_loss": -12.482185363769531, "global_step": 470142, "epoch": 2798} {"train_loss": -12.328336715698242, "global_step": 470143, "epoch": 2798} {"train_loss": -12.511960983276367, "global_step": 470144, "epoch": 2798} {"train_loss": -12.500394821166992, "global_step": 470145, "epoch": 2798} {"train_loss": -12.537158966064453, "global_step": 470146, "epoch": 2798} {"train_loss": -12.459138870239258, "global_step": 470147, "epoch": 2798} {"train_loss": -12.565224647521973, "global_step": 470148, "epoch": 2798} {"train_loss": -12.349167823791504, "global_step": 470149, "epoch": 2798} {"train_loss": -12.381074905395508, "global_step": 470150, "epoch": 2798} {"train_loss": -12.609749794006348, "global_step": 470151, "epoch": 2798} {"train_loss": -12.612313270568848, "global_step": 470152, "epoch": 2798} {"train_loss": -12.698333740234375, "global_step": 470153, "epoch": 2798} {"train_loss": -12.727733612060547, "global_step": 470154, "epoch": 2798} {"train_loss": -12.610077857971191, "global_step": 470155, "epoch": 2798} {"train_loss": -12.61430549621582, "global_step": 470156, "epoch": 2798} {"train_loss": -12.797449111938477, "global_step": 470157, "epoch": 2798} {"train_loss": -12.602025985717773, "global_step": 470158, "epoch": 2798} {"train_loss": -12.586679458618164, "global_step": 470159, "epoch": 2798} {"train_loss": -12.617596626281738, "global_step": 470160, "epoch": 2798} {"train_loss": -12.529285430908203, "global_step": 470161, "epoch": 2798} {"train_loss": -12.64719009399414, "global_step": 470162, "epoch": 2798} {"train_loss": -12.52562141418457, "global_step": 470163, "epoch": 2798} {"train_loss": -12.662153244018555, "global_step": 470164, "epoch": 2798} {"train_loss": -12.885953903198242, "global_step": 470165, "epoch": 2798} {"train_loss": -12.71790885925293, "global_step": 470166, "epoch": 2798} {"train_loss": -12.853523254394531, "global_step": 470167, "epoch": 2798} {"train_loss": -12.441386222839355, "global_step": 470168, "epoch": 2798} {"train_loss": -12.854524612426758, "global_step": 470169, "epoch": 2798} {"train_loss": -12.472851753234863, "global_step": 470170, "epoch": 2798} {"train_loss": -12.704118728637695, "global_step": 470171, "epoch": 2798} {"train_loss": -12.506974220275879, "global_step": 470172, "epoch": 2798} {"train_loss": -12.765857696533203, "global_step": 470173, "epoch": 2798} {"train_loss": -12.587162017822266, "global_step": 470174, "epoch": 2798} {"train_loss": -12.761696815490723, "global_step": 470175, "epoch": 2798} {"train_loss": -12.776089668273926, "global_step": 470176, "epoch": 2798} {"train_loss": -12.719805717468262, "global_step": 470177, "epoch": 2798} {"train_loss": -12.687963485717773, "global_step": 470178, "epoch": 2798} {"train_loss": -12.544170379638672, "global_step": 470179, "epoch": 2798} {"train_loss": -12.613216400146484, "global_step": 470180, "epoch": 2798} {"train_loss": -12.782696723937988, "global_step": 470181, "epoch": 2798} {"train_loss": -12.86572265625, "global_step": 470182, "epoch": 2798} {"train_loss": -12.914138793945312, "global_step": 470183, "epoch": 2798} {"train_loss": -12.736676216125488, "global_step": 470184, "epoch": 2798} {"train_loss": -12.641578674316406, "global_step": 470185, "epoch": 2798} {"train_loss": -12.81212043762207, "global_step": 470186, "epoch": 2798} {"train_loss": -12.535686492919922, "global_step": 470187, "epoch": 2798} {"train_loss": -12.272125244140625, "global_step": 470188, "epoch": 2798} {"train_loss": -12.859821319580078, "global_step": 470189, "epoch": 2798} {"train_loss": -12.725747108459473, "global_step": 470190, "epoch": 2798} {"train_loss": -12.478181838989258, "global_step": 470191, "epoch": 2798} {"train_loss": -12.860832214355469, "global_step": 470192, "epoch": 2798} {"train_loss": -12.410529136657715, "global_step": 470193, "epoch": 2798} {"train_loss": -11.952347755432129, "global_step": 470194, "epoch": 2798} {"train_loss": -12.194686889648438, "global_step": 470195, "epoch": 2798} {"train_loss": -12.323099136352539, "global_step": 470196, "epoch": 2798} {"train_loss": -12.60854721069336, "global_step": 470197, "epoch": 2798} {"train_loss": -12.321414947509766, "global_step": 470198, "epoch": 2798} {"train_loss": -12.633450508117676, "global_step": 470199, "epoch": 2798} {"train_loss": -12.392175674438477, "global_step": 470200, "epoch": 2798} {"train_loss": -12.677196502685547, "global_step": 470201, "epoch": 2798} {"train_loss": -12.479291915893555, "global_step": 470202, "epoch": 2798} {"train_loss": -12.507087707519531, "global_step": 470203, "epoch": 2798} {"train_loss": -12.612428665161133, "global_step": 470204, "epoch": 2798} {"train_loss": -12.393136978149414, "global_step": 470205, "epoch": 2798} {"train_loss": -12.450916290283203, "global_step": 470206, "epoch": 2798} {"train_loss": -12.648896217346191, "global_step": 470207, "epoch": 2798} {"train_loss": -12.627504348754883, "global_step": 470208, "epoch": 2798} {"train_loss": -12.619647979736328, "global_step": 470209, "epoch": 2798} {"train_loss": -12.859087944030762, "global_step": 470210, "epoch": 2798} {"train_loss": -12.566802024841309, "global_step": 470211, "epoch": 2798} {"train_loss": -12.762609481811523, "global_step": 470212, "epoch": 2798} {"train_loss": -12.502718925476074, "global_step": 470213, "epoch": 2798} {"train_loss": -12.75826644897461, "global_step": 470214, "epoch": 2798} {"train_loss": -12.926286697387695, "global_step": 470215, "epoch": 2798} {"train_loss": -12.739669799804688, "global_step": 470216, "epoch": 2798} {"train_loss": -12.655131340026855, "global_step": 470217, "epoch": 2798} {"train_loss": -12.904363632202148, "global_step": 470218, "epoch": 2798} {"train_loss": -13.097073554992676, "global_step": 470219, "epoch": 2798} {"train_loss": -12.749479293823242, "global_step": 470220, "epoch": 2798} {"train_loss": -13.081700325012207, "global_step": 470221, "epoch": 2798} {"train_loss": -12.809885025024414, "global_step": 470222, "epoch": 2798} {"train_loss": -12.586424827575684, "global_step": 470223, "epoch": 2798} {"train_loss": -12.747126579284668, "global_step": 470224, "epoch": 2798} {"train_loss": -12.697747230529785, "global_step": 470225, "epoch": 2798} {"train_loss": -12.596418380737305, "global_step": 470226, "epoch": 2798} {"train_loss": -12.59531021118164, "global_step": 470227, "epoch": 2798} {"train_loss": -12.477253913879395, "global_step": 470228, "epoch": 2798} {"train_loss": -12.731927871704102, "global_step": 470229, "epoch": 2798} {"train_loss": -12.410263061523438, "global_step": 470230, "epoch": 2798} {"train_loss": -12.034409500303722, "global_step": 470231, "epoch": 2798, "val_loss": 313174.625} {"train_loss": -12.316411018371582, "global_step": 470232, "epoch": 2799} {"train_loss": -12.928690910339355, "global_step": 470233, "epoch": 2799} {"train_loss": -12.345460891723633, "global_step": 470234, "epoch": 2799} {"train_loss": -12.885723114013672, "global_step": 470235, "epoch": 2799} {"train_loss": -12.385198593139648, "global_step": 470236, "epoch": 2799} {"train_loss": -12.72690200805664, "global_step": 470237, "epoch": 2799} {"train_loss": -12.023214340209961, "global_step": 470238, "epoch": 2799} {"train_loss": -12.448701858520508, "global_step": 470239, "epoch": 2799} {"train_loss": -12.07923698425293, "global_step": 470240, "epoch": 2799} {"train_loss": -12.4609375, "global_step": 470241, "epoch": 2799} {"train_loss": -11.996313095092773, "global_step": 470242, "epoch": 2799} {"train_loss": -11.67774772644043, "global_step": 470243, "epoch": 2799} {"train_loss": -11.065042495727539, "global_step": 470244, "epoch": 2799} {"train_loss": -12.887201309204102, "global_step": 470245, "epoch": 2799} {"train_loss": -11.285730361938477, "global_step": 470246, "epoch": 2799} {"train_loss": -10.419013023376465, "global_step": 470247, "epoch": 2799} {"train_loss": -10.838619232177734, "global_step": 470248, "epoch": 2799} {"train_loss": -11.577812194824219, "global_step": 470249, "epoch": 2799} {"train_loss": -11.021552085876465, "global_step": 470250, "epoch": 2799} {"train_loss": -10.16229248046875, "global_step": 470251, "epoch": 2799} {"train_loss": -10.980128288269043, "global_step": 470252, "epoch": 2799} {"train_loss": -10.150381088256836, "global_step": 470253, "epoch": 2799} {"train_loss": -9.5813570022583, "global_step": 470254, "epoch": 2799} {"train_loss": -10.957298278808594, "global_step": 470255, "epoch": 2799} {"train_loss": -10.768672943115234, "global_step": 470256, "epoch": 2799} {"train_loss": -10.346961975097656, "global_step": 470257, "epoch": 2799} {"train_loss": -9.415546417236328, "global_step": 470258, "epoch": 2799} {"train_loss": -9.753275871276855, "global_step": 470259, "epoch": 2799} {"train_loss": -10.887733459472656, "global_step": 470260, "epoch": 2799} {"train_loss": -10.32345199584961, "global_step": 470261, "epoch": 2799} {"train_loss": -10.522490501403809, "global_step": 470262, "epoch": 2799} {"train_loss": -9.276273727416992, "global_step": 470263, "epoch": 2799} {"train_loss": -10.331296920776367, "global_step": 470264, "epoch": 2799} {"train_loss": -11.123077392578125, "global_step": 470265, "epoch": 2799} {"train_loss": -10.763046264648438, "global_step": 470266, "epoch": 2799} {"train_loss": -11.418649673461914, "global_step": 470267, "epoch": 2799} {"train_loss": -11.66348648071289, "global_step": 470268, "epoch": 2799} {"train_loss": -11.040043830871582, "global_step": 470269, "epoch": 2799} {"train_loss": -11.816112518310547, "global_step": 470270, "epoch": 2799} {"train_loss": -11.12420654296875, "global_step": 470271, "epoch": 2799} {"train_loss": -11.905976295471191, "global_step": 470272, "epoch": 2799} {"train_loss": -11.086984634399414, "global_step": 470273, "epoch": 2799} {"train_loss": -11.783836364746094, "global_step": 470274, "epoch": 2799} {"train_loss": -11.715147972106934, "global_step": 470275, "epoch": 2799} {"train_loss": -11.835824966430664, "global_step": 470276, "epoch": 2799} {"train_loss": -12.320223808288574, "global_step": 470277, "epoch": 2799} {"train_loss": -10.984354972839355, "global_step": 470278, "epoch": 2799} {"train_loss": -12.032549858093262, "global_step": 470279, "epoch": 2799} {"train_loss": -11.684739112854004, "global_step": 470280, "epoch": 2799} {"train_loss": -11.71888542175293, "global_step": 470281, "epoch": 2799} {"train_loss": -11.774139404296875, "global_step": 470282, "epoch": 2799} {"train_loss": -11.536113739013672, "global_step": 470283, "epoch": 2799} {"train_loss": -12.249446868896484, "global_step": 470284, "epoch": 2799} {"train_loss": -11.643913269042969, "global_step": 470285, "epoch": 2799} {"train_loss": -12.056154251098633, "global_step": 470286, "epoch": 2799} {"train_loss": -11.855276107788086, "global_step": 470287, "epoch": 2799} {"train_loss": -11.664592742919922, "global_step": 470288, "epoch": 2799} {"train_loss": -11.8115816116333, "global_step": 470289, "epoch": 2799} {"train_loss": -11.38549518585205, "global_step": 470290, "epoch": 2799} {"train_loss": -12.0228271484375, "global_step": 470291, "epoch": 2799} {"train_loss": -11.730463027954102, "global_step": 470292, "epoch": 2799} {"train_loss": -12.31584358215332, "global_step": 470293, "epoch": 2799} {"train_loss": -12.532909393310547, "global_step": 470294, "epoch": 2799} {"train_loss": -11.869548797607422, "global_step": 470295, "epoch": 2799} {"train_loss": -12.232379913330078, "global_step": 470296, "epoch": 2799} {"train_loss": -12.246315002441406, "global_step": 470297, "epoch": 2799} {"train_loss": -12.194733619689941, "global_step": 470298, "epoch": 2799} {"train_loss": -12.326947212219238, "global_step": 470299, "epoch": 2799} {"train_loss": -12.516258239746094, "global_step": 470300, "epoch": 2799} {"train_loss": -12.143783569335938, "global_step": 470301, "epoch": 2799} {"train_loss": -12.284483909606934, "global_step": 470302, "epoch": 2799} {"train_loss": -12.15902328491211, "global_step": 470303, "epoch": 2799} {"train_loss": -12.396561622619629, "global_step": 470304, "epoch": 2799} {"train_loss": -12.432839393615723, "global_step": 470305, "epoch": 2799} {"train_loss": -12.515701293945312, "global_step": 470306, "epoch": 2799} {"train_loss": -12.49069595336914, "global_step": 470307, "epoch": 2799} {"train_loss": -12.307332038879395, "global_step": 470308, "epoch": 2799} {"train_loss": -12.566844940185547, "global_step": 470309, "epoch": 2799} {"train_loss": -12.31036376953125, "global_step": 470310, "epoch": 2799} {"train_loss": -12.610515594482422, "global_step": 470311, "epoch": 2799} {"train_loss": -12.413837432861328, "global_step": 470312, "epoch": 2799} {"train_loss": -12.668193817138672, "global_step": 470313, "epoch": 2799} {"train_loss": -12.47166633605957, "global_step": 470314, "epoch": 2799} {"train_loss": -12.509256362915039, "global_step": 470315, "epoch": 2799} {"train_loss": -12.335457801818848, "global_step": 470316, "epoch": 2799} {"train_loss": -12.430366516113281, "global_step": 470317, "epoch": 2799} {"train_loss": -12.816841125488281, "global_step": 470318, "epoch": 2799} {"train_loss": -12.349944114685059, "global_step": 470319, "epoch": 2799} {"train_loss": -12.512540817260742, "global_step": 470320, "epoch": 2799} {"train_loss": -12.617855072021484, "global_step": 470321, "epoch": 2799} {"train_loss": -12.664056777954102, "global_step": 470322, "epoch": 2799} {"train_loss": -12.791248321533203, "global_step": 470323, "epoch": 2799} {"train_loss": -12.644624710083008, "global_step": 470324, "epoch": 2799} {"train_loss": -12.625597953796387, "global_step": 470325, "epoch": 2799} {"train_loss": -12.687393188476562, "global_step": 470326, "epoch": 2799} {"train_loss": -12.726478576660156, "global_step": 470327, "epoch": 2799} {"train_loss": -12.596458435058594, "global_step": 470328, "epoch": 2799} {"train_loss": -12.485330581665039, "global_step": 470329, "epoch": 2799} {"train_loss": -12.647737503051758, "global_step": 470330, "epoch": 2799} {"train_loss": -12.899007797241211, "global_step": 470331, "epoch": 2799} {"train_loss": -12.810333251953125, "global_step": 470332, "epoch": 2799} {"train_loss": -12.79012680053711, "global_step": 470333, "epoch": 2799} {"train_loss": -12.744754791259766, "global_step": 470334, "epoch": 2799} {"train_loss": -12.59615421295166, "global_step": 470335, "epoch": 2799} {"train_loss": -12.816734313964844, "global_step": 470336, "epoch": 2799} {"train_loss": -12.908758163452148, "global_step": 470337, "epoch": 2799} {"train_loss": -12.740713119506836, "global_step": 470338, "epoch": 2799} {"train_loss": -12.840681076049805, "global_step": 470339, "epoch": 2799} {"train_loss": -12.503612518310547, "global_step": 470340, "epoch": 2799} {"train_loss": -12.490242958068848, "global_step": 470341, "epoch": 2799} {"train_loss": -12.38160514831543, "global_step": 470342, "epoch": 2799} {"train_loss": -12.873605728149414, "global_step": 470343, "epoch": 2799} {"train_loss": -12.613310813903809, "global_step": 470344, "epoch": 2799} {"train_loss": -12.45850944519043, "global_step": 470345, "epoch": 2799} {"train_loss": -12.647217750549316, "global_step": 470346, "epoch": 2799} {"train_loss": -12.690673828125, "global_step": 470347, "epoch": 2799} {"train_loss": -12.069509506225586, "global_step": 470348, "epoch": 2799} {"train_loss": -12.555482864379883, "global_step": 470349, "epoch": 2799} {"train_loss": -12.849674224853516, "global_step": 470350, "epoch": 2799} {"train_loss": -12.824867248535156, "global_step": 470351, "epoch": 2799} {"train_loss": -12.092035293579102, "global_step": 470352, "epoch": 2799} {"train_loss": -12.267532348632812, "global_step": 470353, "epoch": 2799} {"train_loss": -12.632377624511719, "global_step": 470354, "epoch": 2799} {"train_loss": -12.704456329345703, "global_step": 470355, "epoch": 2799} {"train_loss": -12.726495742797852, "global_step": 470356, "epoch": 2799} {"train_loss": -12.225284576416016, "global_step": 470357, "epoch": 2799} {"train_loss": -12.389403343200684, "global_step": 470358, "epoch": 2799} {"train_loss": -12.68057632446289, "global_step": 470359, "epoch": 2799} {"train_loss": -12.6895751953125, "global_step": 470360, "epoch": 2799} {"train_loss": -12.104990005493164, "global_step": 470361, "epoch": 2799} {"train_loss": -12.58934211730957, "global_step": 470362, "epoch": 2799} {"train_loss": -12.801689147949219, "global_step": 470363, "epoch": 2799} {"train_loss": -12.699834823608398, "global_step": 470364, "epoch": 2799} {"train_loss": -12.041318893432617, "global_step": 470365, "epoch": 2799} {"train_loss": -11.898547172546387, "global_step": 470366, "epoch": 2799} {"train_loss": -12.452783584594727, "global_step": 470367, "epoch": 2799} {"train_loss": -12.68875789642334, "global_step": 470368, "epoch": 2799} {"train_loss": -12.509603500366211, "global_step": 470369, "epoch": 2799} {"train_loss": -12.705114364624023, "global_step": 470370, "epoch": 2799} {"train_loss": -11.95311450958252, "global_step": 470371, "epoch": 2799} {"train_loss": -12.26194953918457, "global_step": 470372, "epoch": 2799} {"train_loss": -11.828651428222656, "global_step": 470373, "epoch": 2799} {"train_loss": -12.277679443359375, "global_step": 470374, "epoch": 2799} {"train_loss": -11.398778915405273, "global_step": 470375, "epoch": 2799} {"train_loss": -12.006834983825684, "global_step": 470376, "epoch": 2799} {"train_loss": -12.400199890136719, "global_step": 470377, "epoch": 2799} {"train_loss": -12.057587623596191, "global_step": 470378, "epoch": 2799} {"train_loss": -11.278614044189453, "global_step": 470379, "epoch": 2799} {"train_loss": -11.884855270385742, "global_step": 470380, "epoch": 2799} {"train_loss": -12.578493118286133, "global_step": 470381, "epoch": 2799} {"train_loss": -11.37910270690918, "global_step": 470382, "epoch": 2799} {"train_loss": -11.939516067504883, "global_step": 470383, "epoch": 2799} {"train_loss": -12.273399353027344, "global_step": 470384, "epoch": 2799} {"train_loss": -11.986227035522461, "global_step": 470385, "epoch": 2799} {"train_loss": -11.64883041381836, "global_step": 470386, "epoch": 2799} {"train_loss": -12.23189926147461, "global_step": 470387, "epoch": 2799} {"train_loss": -12.31463623046875, "global_step": 470388, "epoch": 2799} {"train_loss": -12.289660453796387, "global_step": 470389, "epoch": 2799} {"train_loss": -12.546747207641602, "global_step": 470390, "epoch": 2799} {"train_loss": -12.285324096679688, "global_step": 470391, "epoch": 2799} {"train_loss": -11.353765487670898, "global_step": 470392, "epoch": 2799} {"train_loss": -11.708386421203613, "global_step": 470393, "epoch": 2799} {"train_loss": -12.34221363067627, "global_step": 470394, "epoch": 2799} {"train_loss": -10.616777420043945, "global_step": 470395, "epoch": 2799} {"train_loss": -12.077488899230957, "global_step": 470396, "epoch": 2799} {"train_loss": -9.606731414794922, "global_step": 470397, "epoch": 2799} {"train_loss": -11.196723937988281, "global_step": 470398, "epoch": 2799} {"train_loss": -11.995736553555442, "global_step": 470399, "epoch": 2799, "val_loss": 313252.53125} {"train_loss": -9.941604614257812, "global_step": 470400, "epoch": 2800} {"train_loss": -8.716219902038574, "global_step": 470401, "epoch": 2800} {"train_loss": -11.516315460205078, "global_step": 470402, "epoch": 2800} {"train_loss": -7.797947883605957, "global_step": 470403, "epoch": 2800} {"train_loss": -8.82143783569336, "global_step": 470404, "epoch": 2800} {"train_loss": -9.828120231628418, "global_step": 470405, "epoch": 2800} {"train_loss": -9.085373878479004, "global_step": 470406, "epoch": 2800} {"train_loss": -10.681295394897461, "global_step": 470407, "epoch": 2800} {"train_loss": -8.413463592529297, "global_step": 470408, "epoch": 2800} {"train_loss": -8.100728988647461, "global_step": 470409, "epoch": 2800} {"train_loss": -9.045381546020508, "global_step": 470410, "epoch": 2800} {"train_loss": -9.139430046081543, "global_step": 470411, "epoch": 2800} {"train_loss": -9.845394134521484, "global_step": 470412, "epoch": 2800} {"train_loss": -10.27254867553711, "global_step": 470413, "epoch": 2800} {"train_loss": -9.841120719909668, "global_step": 470414, "epoch": 2800} {"train_loss": -9.497411727905273, "global_step": 470415, "epoch": 2800} {"train_loss": -10.330206871032715, "global_step": 470416, "epoch": 2800} {"train_loss": -10.310566902160645, "global_step": 470417, "epoch": 2800} {"train_loss": -9.6834716796875, "global_step": 470418, "epoch": 2800} {"train_loss": -9.335684776306152, "global_step": 470419, "epoch": 2800} {"train_loss": -10.300786018371582, "global_step": 470420, "epoch": 2800} {"train_loss": -11.166287422180176, "global_step": 470421, "epoch": 2800} {"train_loss": -10.224148750305176, "global_step": 470422, "epoch": 2800} {"train_loss": -10.290781021118164, "global_step": 470423, "epoch": 2800} {"train_loss": -9.597052574157715, "global_step": 470424, "epoch": 2800} {"train_loss": -10.422654151916504, "global_step": 470425, "epoch": 2800} {"train_loss": -11.189903259277344, "global_step": 470426, "epoch": 2800} {"train_loss": -10.162751197814941, "global_step": 470427, "epoch": 2800} {"train_loss": -11.050361633300781, "global_step": 470428, "epoch": 2800} {"train_loss": -10.551054000854492, "global_step": 470429, "epoch": 2800} {"train_loss": -11.444530487060547, "global_step": 470430, "epoch": 2800} {"train_loss": -10.123044967651367, "global_step": 470431, "epoch": 2800} {"train_loss": -11.450725555419922, "global_step": 470432, "epoch": 2800} {"train_loss": -11.258901596069336, "global_step": 470433, "epoch": 2800} {"train_loss": -11.245944023132324, "global_step": 470434, "epoch": 2800} {"train_loss": -11.65446662902832, "global_step": 470435, "epoch": 2800} {"train_loss": -11.474000930786133, "global_step": 470436, "epoch": 2800} {"train_loss": -11.626315116882324, "global_step": 470437, "epoch": 2800} {"train_loss": -11.71658706665039, "global_step": 470438, "epoch": 2800} {"train_loss": -11.802138328552246, "global_step": 470439, "epoch": 2800} {"train_loss": -11.516889572143555, "global_step": 470440, "epoch": 2800} {"train_loss": -12.151104927062988, "global_step": 470441, "epoch": 2800} {"train_loss": -11.50643539428711, "global_step": 470442, "epoch": 2800} {"train_loss": -12.041314125061035, "global_step": 470443, "epoch": 2800} {"train_loss": -11.685553550720215, "global_step": 470444, "epoch": 2800} {"train_loss": -11.697038650512695, "global_step": 470445, "epoch": 2800} {"train_loss": -11.679673194885254, "global_step": 470446, "epoch": 2800} {"train_loss": -11.335309028625488, "global_step": 470447, "epoch": 2800} {"train_loss": -11.795761108398438, "global_step": 470448, "epoch": 2800} {"train_loss": -12.041397094726562, "global_step": 470449, "epoch": 2800} {"train_loss": -11.750274658203125, "global_step": 470450, "epoch": 2800} {"train_loss": -11.794981002807617, "global_step": 470451, "epoch": 2800} {"train_loss": -12.07856559753418, "global_step": 470452, "epoch": 2800} {"train_loss": -11.61635971069336, "global_step": 470453, "epoch": 2800} {"train_loss": -11.91313362121582, "global_step": 470454, "epoch": 2800} {"train_loss": -11.564018249511719, "global_step": 470455, "epoch": 2800} {"train_loss": -12.46987533569336, "global_step": 470456, "epoch": 2800} {"train_loss": -11.595907211303711, "global_step": 470457, "epoch": 2800} {"train_loss": -12.347627639770508, "global_step": 470458, "epoch": 2800} {"train_loss": -12.01658821105957, "global_step": 470459, "epoch": 2800} {"train_loss": -12.383909225463867, "global_step": 470460, "epoch": 2800} {"train_loss": -12.178325653076172, "global_step": 470461, "epoch": 2800} {"train_loss": -12.491655349731445, "global_step": 470462, "epoch": 2800} {"train_loss": -12.369375228881836, "global_step": 470463, "epoch": 2800} {"train_loss": -12.462931632995605, "global_step": 470464, "epoch": 2800} {"train_loss": -12.296021461486816, "global_step": 470465, "epoch": 2800} {"train_loss": -12.189142227172852, "global_step": 470466, "epoch": 2800} {"train_loss": -12.31693172454834, "global_step": 470467, "epoch": 2800} {"train_loss": -12.087898254394531, "global_step": 470468, "epoch": 2800} {"train_loss": -12.424430847167969, "global_step": 470469, "epoch": 2800} {"train_loss": -12.384740829467773, "global_step": 470470, "epoch": 2800} {"train_loss": -12.331382751464844, "global_step": 470471, "epoch": 2800} {"train_loss": -12.36764144897461, "global_step": 470472, "epoch": 2800} {"train_loss": -12.347973823547363, "global_step": 470473, "epoch": 2800} {"train_loss": -12.391717910766602, "global_step": 470474, "epoch": 2800} {"train_loss": -12.382406234741211, "global_step": 470475, "epoch": 2800} {"train_loss": -12.328254699707031, "global_step": 470476, "epoch": 2800} {"train_loss": -12.535765647888184, "global_step": 470477, "epoch": 2800} {"train_loss": -12.376480102539062, "global_step": 470478, "epoch": 2800} {"train_loss": -12.316314697265625, "global_step": 470479, "epoch": 2800} {"train_loss": -12.417879104614258, "global_step": 470480, "epoch": 2800} {"train_loss": -12.366447448730469, "global_step": 470481, "epoch": 2800} {"train_loss": -12.554224967956543, "global_step": 470482, "epoch": 2800} {"train_loss": -12.383536338806152, "global_step": 470483, "epoch": 2800} {"train_loss": -12.542738914489746, "global_step": 470484, "epoch": 2800} {"train_loss": -12.429922103881836, "global_step": 470485, "epoch": 2800} {"train_loss": -12.476980209350586, "global_step": 470486, "epoch": 2800} {"train_loss": -12.279422760009766, "global_step": 470487, "epoch": 2800} {"train_loss": -12.51779556274414, "global_step": 470488, "epoch": 2800} {"train_loss": -12.422316551208496, "global_step": 470489, "epoch": 2800} {"train_loss": -12.694995880126953, "global_step": 470490, "epoch": 2800} {"train_loss": -12.485971450805664, "global_step": 470491, "epoch": 2800} {"train_loss": -12.484045028686523, "global_step": 470492, "epoch": 2800} {"train_loss": -12.566802024841309, "global_step": 470493, "epoch": 2800} {"train_loss": -12.643917083740234, "global_step": 470494, "epoch": 2800} {"train_loss": -12.674463272094727, "global_step": 470495, "epoch": 2800} {"train_loss": -12.721285820007324, "global_step": 470496, "epoch": 2800} {"train_loss": -12.635562896728516, "global_step": 470497, "epoch": 2800} {"train_loss": -12.774568557739258, "global_step": 470498, "epoch": 2800} {"train_loss": -12.780271530151367, "global_step": 470499, "epoch": 2800} {"train_loss": -12.78570556640625, "global_step": 470500, "epoch": 2800} {"train_loss": -12.799276351928711, "global_step": 470501, "epoch": 2800} {"train_loss": -12.881444931030273, "global_step": 470502, "epoch": 2800} {"train_loss": -12.693138122558594, "global_step": 470503, "epoch": 2800} {"train_loss": -12.656373977661133, "global_step": 470504, "epoch": 2800} {"train_loss": -12.535385131835938, "global_step": 470505, "epoch": 2800} {"train_loss": -12.713401794433594, "global_step": 470506, "epoch": 2800} {"train_loss": -12.596826553344727, "global_step": 470507, "epoch": 2800} {"train_loss": -12.561178207397461, "global_step": 470508, "epoch": 2800} {"train_loss": -12.626640319824219, "global_step": 470509, "epoch": 2800} {"train_loss": -12.742973327636719, "global_step": 470510, "epoch": 2800} {"train_loss": -12.671125411987305, "global_step": 470511, "epoch": 2800} {"train_loss": -12.563085556030273, "global_step": 470512, "epoch": 2800} {"train_loss": -12.789438247680664, "global_step": 470513, "epoch": 2800} {"train_loss": -12.77873706817627, "global_step": 470514, "epoch": 2800} {"train_loss": -12.638468742370605, "global_step": 470515, "epoch": 2800} {"train_loss": -12.791139602661133, "global_step": 470516, "epoch": 2800} {"train_loss": -12.557165145874023, "global_step": 470517, "epoch": 2800} {"train_loss": -12.802282333374023, "global_step": 470518, "epoch": 2800} {"train_loss": -12.394782066345215, "global_step": 470519, "epoch": 2800} {"train_loss": -13.111214637756348, "global_step": 470520, "epoch": 2800} {"train_loss": -12.707669258117676, "global_step": 470521, "epoch": 2800} {"train_loss": -12.622495651245117, "global_step": 470522, "epoch": 2800} {"train_loss": -12.944729804992676, "global_step": 470523, "epoch": 2800} {"train_loss": -12.471851348876953, "global_step": 470524, "epoch": 2800} {"train_loss": -12.544233322143555, "global_step": 470525, "epoch": 2800} {"train_loss": -12.86689567565918, "global_step": 470526, "epoch": 2800} {"train_loss": -12.685693740844727, "global_step": 470527, "epoch": 2800} {"train_loss": -12.567344665527344, "global_step": 470528, "epoch": 2800} {"train_loss": -12.853214263916016, "global_step": 470529, "epoch": 2800} {"train_loss": -12.88216781616211, "global_step": 470530, "epoch": 2800} {"train_loss": -12.84528636932373, "global_step": 470531, "epoch": 2800} {"train_loss": -12.813143730163574, "global_step": 470532, "epoch": 2800} {"train_loss": -12.932378768920898, "global_step": 470533, "epoch": 2800} {"train_loss": -12.846452713012695, "global_step": 470534, "epoch": 2800} {"train_loss": -12.828898429870605, "global_step": 470535, "epoch": 2800} {"train_loss": -12.459526062011719, "global_step": 470536, "epoch": 2800} {"train_loss": -12.757603645324707, "global_step": 470537, "epoch": 2800} {"train_loss": -12.81222915649414, "global_step": 470538, "epoch": 2800} {"train_loss": -12.328113555908203, "global_step": 470539, "epoch": 2800} {"train_loss": -12.481534004211426, "global_step": 470540, "epoch": 2800} {"train_loss": -12.843706130981445, "global_step": 470541, "epoch": 2800} {"train_loss": -12.174922943115234, "global_step": 470542, "epoch": 2800} {"train_loss": -11.503547668457031, "global_step": 470543, "epoch": 2800} {"train_loss": -10.956558227539062, "global_step": 470544, "epoch": 2800} {"train_loss": -12.49474811553955, "global_step": 470545, "epoch": 2800} {"train_loss": -11.73158073425293, "global_step": 470546, "epoch": 2800} {"train_loss": -12.26470947265625, "global_step": 470547, "epoch": 2800} {"train_loss": -10.863946914672852, "global_step": 470548, "epoch": 2800} {"train_loss": -12.851997375488281, "global_step": 470549, "epoch": 2800} {"train_loss": -11.760726928710938, "global_step": 470550, "epoch": 2800} {"train_loss": -12.703529357910156, "global_step": 470551, "epoch": 2800} {"train_loss": -12.187268257141113, "global_step": 470552, "epoch": 2800} {"train_loss": -12.27723503112793, "global_step": 470553, "epoch": 2800} {"train_loss": -12.564108848571777, "global_step": 470554, "epoch": 2800} {"train_loss": -12.632987976074219, "global_step": 470555, "epoch": 2800} {"train_loss": -12.358829498291016, "global_step": 470556, "epoch": 2800} {"train_loss": -12.207307815551758, "global_step": 470557, "epoch": 2800} {"train_loss": -12.620984077453613, "global_step": 470558, "epoch": 2800} {"train_loss": -12.147972106933594, "global_step": 470559, "epoch": 2800} {"train_loss": -11.758804321289062, "global_step": 470560, "epoch": 2800} {"train_loss": -12.16522216796875, "global_step": 470561, "epoch": 2800} {"train_loss": -12.768941879272461, "global_step": 470562, "epoch": 2800} {"train_loss": -11.848454475402832, "global_step": 470563, "epoch": 2800} {"train_loss": -11.753210067749023, "global_step": 470564, "epoch": 2800} {"train_loss": -12.549612045288086, "global_step": 470565, "epoch": 2800} {"train_loss": -12.188047409057617, "global_step": 470566, "epoch": 2800} {"train_loss": -11.858343436604454, "global_step": 470567, "epoch": 2800, "train/sim_max_reward_0": 0.9661883089952304, "train/sim_max_reward_1": 0.9740154230986803, "train/sim_max_reward_2": 0.010220101185939133, "train/sim_max_reward_3": 0.9903900285114584, "train/sim_max_reward_4": 0.9954242983347943, "train/sim_max_reward_5": 0.9538088779459318, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.37264795390205385, "test/sim_max_reward_4400002": 0.38157683218838034, "test/sim_max_reward_4400003": 0.29025578738900304, "test/sim_max_reward_4400004": 0.45824440996632987, "test/sim_max_reward_4400005": 0.9801503368362486, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.5079562096744125, "test/sim_max_reward_4400008": 0.590571979603581, "test/sim_max_reward_4400009": 0.37984272945645814, "test/sim_max_reward_4400010": 0.6830595029587002, "test/sim_max_reward_4400011": 0.5212018045611804, "test/sim_max_reward_4400012": 0.9348248190444561, "test/sim_max_reward_4400013": 0.6273958401668541, "test/sim_max_reward_4400014": 0.6138073777964355, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.10213108926081868, "test/sim_max_reward_4400018": 0.9964690438311807, "test/sim_max_reward_4400019": 0.3430903298058805, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.6868732159734513, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.09830664682164232, "test/sim_max_reward_4400025": 0.5394118332730102, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.41880979153606207, "test/sim_max_reward_4400028": 0.6710179797220805, "test/sim_max_reward_4400029": 0.7074930686726076, "test/sim_max_reward_4400030": 0.9654976332391657, "test/sim_max_reward_4400031": 0.5867932877930847, "test/sim_max_reward_4400032": 0.1559472612624738, "test/sim_max_reward_4400033": 0.5823259466961334, "test/sim_max_reward_4400034": 0.44999870845165807, "test/sim_max_reward_4400035": 0.5709301630995051, "test/sim_max_reward_4400036": 0.35679807165097127, "test/sim_max_reward_4400037": 0.9797159689929297, "test/sim_max_reward_4400038": 1.0, "test/sim_max_reward_4400039": 0.41168222469845567, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 1.0, "test/sim_max_reward_4400042": 0.031979760844644524, "test/sim_max_reward_4400043": 0.024860084988166994, "test/sim_max_reward_4400044": 0.9592631696708931, "test/sim_max_reward_4400045": 0.42131265841958077, "test/sim_max_reward_4400046": 0.7302820554130839, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.8150078396786723, "test/mean_score": 0.5026547200653579, "val_loss": 316675.0, "train_action_mse_error": 2.127493143081665} {"train_loss": -12.669390678405762, "global_step": 470568, "epoch": 2801} {"train_loss": -12.22078800201416, "global_step": 470569, "epoch": 2801} {"train_loss": -11.768306732177734, "global_step": 470570, "epoch": 2801} {"train_loss": -12.109884262084961, "global_step": 470571, "epoch": 2801} {"train_loss": -12.376348495483398, "global_step": 470572, "epoch": 2801} {"train_loss": -11.888524055480957, "global_step": 470573, "epoch": 2801} {"train_loss": -12.289981842041016, "global_step": 470574, "epoch": 2801} {"train_loss": -11.75177001953125, "global_step": 470575, "epoch": 2801} {"train_loss": -12.171632766723633, "global_step": 470576, "epoch": 2801} {"train_loss": -11.807757377624512, "global_step": 470577, "epoch": 2801} {"train_loss": -11.882844924926758, "global_step": 470578, "epoch": 2801} {"train_loss": -11.961503982543945, "global_step": 470579, "epoch": 2801} {"train_loss": -12.380850791931152, "global_step": 470580, "epoch": 2801} {"train_loss": -11.480539321899414, "global_step": 470581, "epoch": 2801} {"train_loss": -12.551492691040039, "global_step": 470582, "epoch": 2801} {"train_loss": -11.709818840026855, "global_step": 470583, "epoch": 2801} {"train_loss": -11.646156311035156, "global_step": 470584, "epoch": 2801} {"train_loss": -11.18149185180664, "global_step": 470585, "epoch": 2801} {"train_loss": -11.917919158935547, "global_step": 470586, "epoch": 2801} {"train_loss": -10.667213439941406, "global_step": 470587, "epoch": 2801} {"train_loss": -12.587348937988281, "global_step": 470588, "epoch": 2801} {"train_loss": -11.737939834594727, "global_step": 470589, "epoch": 2801} {"train_loss": -11.94345760345459, "global_step": 470590, "epoch": 2801} {"train_loss": -12.120018005371094, "global_step": 470591, "epoch": 2801} {"train_loss": -12.43828010559082, "global_step": 470592, "epoch": 2801} {"train_loss": -11.910316467285156, "global_step": 470593, "epoch": 2801} {"train_loss": -12.098030090332031, "global_step": 470594, "epoch": 2801} {"train_loss": -12.232409477233887, "global_step": 470595, "epoch": 2801} {"train_loss": -12.120098114013672, "global_step": 470596, "epoch": 2801} {"train_loss": -12.006355285644531, "global_step": 470597, "epoch": 2801} {"train_loss": -12.229787826538086, "global_step": 470598, "epoch": 2801} {"train_loss": -11.841951370239258, "global_step": 470599, "epoch": 2801} {"train_loss": -12.152753829956055, "global_step": 470600, "epoch": 2801} {"train_loss": -11.705907821655273, "global_step": 470601, "epoch": 2801} {"train_loss": -11.130720138549805, "global_step": 470602, "epoch": 2801} {"train_loss": -11.54623031616211, "global_step": 470603, "epoch": 2801} {"train_loss": -10.385567665100098, "global_step": 470604, "epoch": 2801} {"train_loss": -11.312024116516113, "global_step": 470605, "epoch": 2801} {"train_loss": -10.960922241210938, "global_step": 470606, "epoch": 2801} {"train_loss": -11.58485221862793, "global_step": 470607, "epoch": 2801} {"train_loss": -12.100400924682617, "global_step": 470608, "epoch": 2801} {"train_loss": -11.316555976867676, "global_step": 470609, "epoch": 2801} {"train_loss": -11.813591003417969, "global_step": 470610, "epoch": 2801} {"train_loss": -11.861724853515625, "global_step": 470611, "epoch": 2801} {"train_loss": -11.583106994628906, "global_step": 470612, "epoch": 2801} {"train_loss": -11.645002365112305, "global_step": 470613, "epoch": 2801} {"train_loss": -12.223821640014648, "global_step": 470614, "epoch": 2801} {"train_loss": -12.340394973754883, "global_step": 470615, "epoch": 2801} {"train_loss": -12.355938911437988, "global_step": 470616, "epoch": 2801} {"train_loss": -12.400808334350586, "global_step": 470617, "epoch": 2801} {"train_loss": -12.203567504882812, "global_step": 470618, "epoch": 2801} {"train_loss": -12.26148796081543, "global_step": 470619, "epoch": 2801} {"train_loss": -12.187511444091797, "global_step": 470620, "epoch": 2801} {"train_loss": -12.032515525817871, "global_step": 470621, "epoch": 2801} {"train_loss": -12.257856369018555, "global_step": 470622, "epoch": 2801} {"train_loss": -12.149049758911133, "global_step": 470623, "epoch": 2801} {"train_loss": -12.164070129394531, "global_step": 470624, "epoch": 2801} {"train_loss": -11.996206283569336, "global_step": 470625, "epoch": 2801} {"train_loss": -11.737716674804688, "global_step": 470626, "epoch": 2801} {"train_loss": -12.168828964233398, "global_step": 470627, "epoch": 2801} {"train_loss": -11.649750709533691, "global_step": 470628, "epoch": 2801} {"train_loss": -12.088606834411621, "global_step": 470629, "epoch": 2801} {"train_loss": -12.333356857299805, "global_step": 470630, "epoch": 2801} {"train_loss": -11.76797866821289, "global_step": 470631, "epoch": 2801} {"train_loss": -12.4048490524292, "global_step": 470632, "epoch": 2801} {"train_loss": -12.305048942565918, "global_step": 470633, "epoch": 2801} {"train_loss": -12.3197021484375, "global_step": 470634, "epoch": 2801} {"train_loss": -11.953414916992188, "global_step": 470635, "epoch": 2801} {"train_loss": -12.287761688232422, "global_step": 470636, "epoch": 2801} {"train_loss": -12.156192779541016, "global_step": 470637, "epoch": 2801} {"train_loss": -12.276043891906738, "global_step": 470638, "epoch": 2801} {"train_loss": -12.36570930480957, "global_step": 470639, "epoch": 2801} {"train_loss": -12.200905799865723, "global_step": 470640, "epoch": 2801} {"train_loss": -12.504776954650879, "global_step": 470641, "epoch": 2801} {"train_loss": -11.986442565917969, "global_step": 470642, "epoch": 2801} {"train_loss": -12.34377670288086, "global_step": 470643, "epoch": 2801} {"train_loss": -11.87037467956543, "global_step": 470644, "epoch": 2801} {"train_loss": -12.342519760131836, "global_step": 470645, "epoch": 2801} {"train_loss": -12.594526290893555, "global_step": 470646, "epoch": 2801} {"train_loss": -11.039681434631348, "global_step": 470647, "epoch": 2801} {"train_loss": -12.732820510864258, "global_step": 470648, "epoch": 2801} {"train_loss": -12.370582580566406, "global_step": 470649, "epoch": 2801} {"train_loss": -11.834869384765625, "global_step": 470650, "epoch": 2801} {"train_loss": -12.551254272460938, "global_step": 470651, "epoch": 2801} {"train_loss": -11.971794128417969, "global_step": 470652, "epoch": 2801} {"train_loss": -12.016042709350586, "global_step": 470653, "epoch": 2801} {"train_loss": -12.386005401611328, "global_step": 470654, "epoch": 2801} {"train_loss": -11.944583892822266, "global_step": 470655, "epoch": 2801} {"train_loss": -12.227007865905762, "global_step": 470656, "epoch": 2801} {"train_loss": -12.712835311889648, "global_step": 470657, "epoch": 2801} {"train_loss": -12.413253784179688, "global_step": 470658, "epoch": 2801} {"train_loss": -12.455878257751465, "global_step": 470659, "epoch": 2801} {"train_loss": -12.420446395874023, "global_step": 470660, "epoch": 2801} {"train_loss": -11.996940612792969, "global_step": 470661, "epoch": 2801} {"train_loss": -12.347970962524414, "global_step": 470662, "epoch": 2801} {"train_loss": -11.710034370422363, "global_step": 470663, "epoch": 2801} {"train_loss": -11.937500953674316, "global_step": 470664, "epoch": 2801} {"train_loss": -12.43668270111084, "global_step": 470665, "epoch": 2801} {"train_loss": -12.441082000732422, "global_step": 470666, "epoch": 2801} {"train_loss": -12.267372131347656, "global_step": 470667, "epoch": 2801} {"train_loss": -12.332992553710938, "global_step": 470668, "epoch": 2801} {"train_loss": -11.672374725341797, "global_step": 470669, "epoch": 2801} {"train_loss": -11.956671714782715, "global_step": 470670, "epoch": 2801} {"train_loss": -12.152490615844727, "global_step": 470671, "epoch": 2801} {"train_loss": -11.42854118347168, "global_step": 470672, "epoch": 2801} {"train_loss": -12.050168991088867, "global_step": 470673, "epoch": 2801} {"train_loss": -11.777791976928711, "global_step": 470674, "epoch": 2801} {"train_loss": -12.59570026397705, "global_step": 470675, "epoch": 2801} {"train_loss": -12.187779426574707, "global_step": 470676, "epoch": 2801} {"train_loss": -12.391212463378906, "global_step": 470677, "epoch": 2801} {"train_loss": -12.367616653442383, "global_step": 470678, "epoch": 2801} {"train_loss": -12.432762145996094, "global_step": 470679, "epoch": 2801} {"train_loss": -12.310644149780273, "global_step": 470680, "epoch": 2801} {"train_loss": -12.144760131835938, "global_step": 470681, "epoch": 2801} {"train_loss": -12.377500534057617, "global_step": 470682, "epoch": 2801} {"train_loss": -12.614542007446289, "global_step": 470683, "epoch": 2801} {"train_loss": -12.515829086303711, "global_step": 470684, "epoch": 2801} {"train_loss": -12.592058181762695, "global_step": 470685, "epoch": 2801} {"train_loss": -12.401809692382812, "global_step": 470686, "epoch": 2801} {"train_loss": -12.648900985717773, "global_step": 470687, "epoch": 2801} {"train_loss": -12.520530700683594, "global_step": 470688, "epoch": 2801} {"train_loss": -12.469205856323242, "global_step": 470689, "epoch": 2801} {"train_loss": -12.546651840209961, "global_step": 470690, "epoch": 2801} {"train_loss": -12.766855239868164, "global_step": 470691, "epoch": 2801} {"train_loss": -12.130979537963867, "global_step": 470692, "epoch": 2801} {"train_loss": -12.631629943847656, "global_step": 470693, "epoch": 2801} {"train_loss": -12.496471405029297, "global_step": 470694, "epoch": 2801} {"train_loss": -12.344054222106934, "global_step": 470695, "epoch": 2801} {"train_loss": -12.454577445983887, "global_step": 470696, "epoch": 2801} {"train_loss": -12.25943374633789, "global_step": 470697, "epoch": 2801} {"train_loss": -11.81886100769043, "global_step": 470698, "epoch": 2801} {"train_loss": -12.52088737487793, "global_step": 470699, "epoch": 2801} {"train_loss": -12.069820404052734, "global_step": 470700, "epoch": 2801} {"train_loss": -12.018832206726074, "global_step": 470701, "epoch": 2801} {"train_loss": -12.184285163879395, "global_step": 470702, "epoch": 2801} {"train_loss": -11.579689025878906, "global_step": 470703, "epoch": 2801} {"train_loss": -12.661979675292969, "global_step": 470704, "epoch": 2801} {"train_loss": -11.797462463378906, "global_step": 470705, "epoch": 2801} {"train_loss": -11.977961540222168, "global_step": 470706, "epoch": 2801} {"train_loss": -12.379158020019531, "global_step": 470707, "epoch": 2801} {"train_loss": -12.001583099365234, "global_step": 470708, "epoch": 2801} {"train_loss": -11.378676414489746, "global_step": 470709, "epoch": 2801} {"train_loss": -12.277769088745117, "global_step": 470710, "epoch": 2801} {"train_loss": -12.087451934814453, "global_step": 470711, "epoch": 2801} {"train_loss": -12.248455047607422, "global_step": 470712, "epoch": 2801} {"train_loss": -12.294862747192383, "global_step": 470713, "epoch": 2801} {"train_loss": -11.794014930725098, "global_step": 470714, "epoch": 2801} {"train_loss": -11.627166748046875, "global_step": 470715, "epoch": 2801} {"train_loss": -12.556163787841797, "global_step": 470716, "epoch": 2801} {"train_loss": -12.037022590637207, "global_step": 470717, "epoch": 2801} {"train_loss": -12.28395938873291, "global_step": 470718, "epoch": 2801} {"train_loss": -12.212443351745605, "global_step": 470719, "epoch": 2801} {"train_loss": -11.020965576171875, "global_step": 470720, "epoch": 2801} {"train_loss": -11.711971282958984, "global_step": 470721, "epoch": 2801} {"train_loss": -11.210891723632812, "global_step": 470722, "epoch": 2801} {"train_loss": -10.781513214111328, "global_step": 470723, "epoch": 2801} {"train_loss": -11.915218353271484, "global_step": 470724, "epoch": 2801} {"train_loss": -11.538934707641602, "global_step": 470725, "epoch": 2801} {"train_loss": -11.57841682434082, "global_step": 470726, "epoch": 2801} {"train_loss": -11.081083297729492, "global_step": 470727, "epoch": 2801} {"train_loss": -9.839653015136719, "global_step": 470728, "epoch": 2801} {"train_loss": -10.479384422302246, "global_step": 470729, "epoch": 2801} {"train_loss": -10.882709503173828, "global_step": 470730, "epoch": 2801} {"train_loss": -9.945364952087402, "global_step": 470731, "epoch": 2801} {"train_loss": -9.007257461547852, "global_step": 470732, "epoch": 2801} {"train_loss": -10.492287635803223, "global_step": 470733, "epoch": 2801} {"train_loss": -9.314119338989258, "global_step": 470734, "epoch": 2801} {"train_loss": -11.952325610887437, "global_step": 470735, "epoch": 2801, "val_loss": 316580.46875} {"train_loss": -9.263921737670898, "global_step": 470736, "epoch": 2802} {"train_loss": -8.889790534973145, "global_step": 470737, "epoch": 2802} {"train_loss": -9.5238037109375, "global_step": 470738, "epoch": 2802} {"train_loss": -10.727914810180664, "global_step": 470739, "epoch": 2802} {"train_loss": -10.32912826538086, "global_step": 470740, "epoch": 2802} {"train_loss": -10.595643043518066, "global_step": 470741, "epoch": 2802} {"train_loss": -10.810214042663574, "global_step": 470742, "epoch": 2802} {"train_loss": -11.164313316345215, "global_step": 470743, "epoch": 2802} {"train_loss": -9.962185859680176, "global_step": 470744, "epoch": 2802} {"train_loss": -10.596887588500977, "global_step": 470745, "epoch": 2802} {"train_loss": -10.862396240234375, "global_step": 470746, "epoch": 2802} {"train_loss": -10.98355770111084, "global_step": 470747, "epoch": 2802} {"train_loss": -10.399585723876953, "global_step": 470748, "epoch": 2802} {"train_loss": -11.998700141906738, "global_step": 470749, "epoch": 2802} {"train_loss": -10.254659652709961, "global_step": 470750, "epoch": 2802} {"train_loss": -11.214244842529297, "global_step": 470751, "epoch": 2802} {"train_loss": -10.927411079406738, "global_step": 470752, "epoch": 2802} {"train_loss": -10.755901336669922, "global_step": 470753, "epoch": 2802} {"train_loss": -11.440155029296875, "global_step": 470754, "epoch": 2802} {"train_loss": -11.323403358459473, "global_step": 470755, "epoch": 2802} {"train_loss": -10.932344436645508, "global_step": 470756, "epoch": 2802} {"train_loss": -11.836799621582031, "global_step": 470757, "epoch": 2802} {"train_loss": -10.808268547058105, "global_step": 470758, "epoch": 2802} {"train_loss": -12.194761276245117, "global_step": 470759, "epoch": 2802} {"train_loss": -11.205663681030273, "global_step": 470760, "epoch": 2802} {"train_loss": -11.88213062286377, "global_step": 470761, "epoch": 2802} {"train_loss": -11.537734031677246, "global_step": 470762, "epoch": 2802} {"train_loss": -11.728852272033691, "global_step": 470763, "epoch": 2802} {"train_loss": -11.63792896270752, "global_step": 470764, "epoch": 2802} {"train_loss": -11.4006929397583, "global_step": 470765, "epoch": 2802} {"train_loss": -12.02857780456543, "global_step": 470766, "epoch": 2802} {"train_loss": -11.938638687133789, "global_step": 470767, "epoch": 2802} {"train_loss": -12.18875789642334, "global_step": 470768, "epoch": 2802} {"train_loss": -11.945243835449219, "global_step": 470769, "epoch": 2802} {"train_loss": -12.245969772338867, "global_step": 470770, "epoch": 2802} {"train_loss": -11.78994369506836, "global_step": 470771, "epoch": 2802} {"train_loss": -11.974817276000977, "global_step": 470772, "epoch": 2802} {"train_loss": -11.71302604675293, "global_step": 470773, "epoch": 2802} {"train_loss": -12.238876342773438, "global_step": 470774, "epoch": 2802} {"train_loss": -11.975605010986328, "global_step": 470775, "epoch": 2802} {"train_loss": -12.207538604736328, "global_step": 470776, "epoch": 2802} {"train_loss": -12.17858600616455, "global_step": 470777, "epoch": 2802} {"train_loss": -12.237606048583984, "global_step": 470778, "epoch": 2802} {"train_loss": -12.456117630004883, "global_step": 470779, "epoch": 2802} {"train_loss": -12.188247680664062, "global_step": 470780, "epoch": 2802} {"train_loss": -12.450002670288086, "global_step": 470781, "epoch": 2802} {"train_loss": -12.185410499572754, "global_step": 470782, "epoch": 2802} {"train_loss": -12.495611190795898, "global_step": 470783, "epoch": 2802} {"train_loss": -12.140031814575195, "global_step": 470784, "epoch": 2802} {"train_loss": -12.437387466430664, "global_step": 470785, "epoch": 2802} {"train_loss": -12.11799144744873, "global_step": 470786, "epoch": 2802} {"train_loss": -12.392053604125977, "global_step": 470787, "epoch": 2802} {"train_loss": -12.413997650146484, "global_step": 470788, "epoch": 2802} {"train_loss": -12.520734786987305, "global_step": 470789, "epoch": 2802} {"train_loss": -12.395137786865234, "global_step": 470790, "epoch": 2802} {"train_loss": -12.494851112365723, "global_step": 470791, "epoch": 2802} {"train_loss": -12.556215286254883, "global_step": 470792, "epoch": 2802} {"train_loss": -12.50369930267334, "global_step": 470793, "epoch": 2802} {"train_loss": -12.615570068359375, "global_step": 470794, "epoch": 2802} {"train_loss": -12.520919799804688, "global_step": 470795, "epoch": 2802} {"train_loss": -12.59525203704834, "global_step": 470796, "epoch": 2802} {"train_loss": -12.507844924926758, "global_step": 470797, "epoch": 2802} {"train_loss": -12.468168258666992, "global_step": 470798, "epoch": 2802} {"train_loss": -12.752941131591797, "global_step": 470799, "epoch": 2802} {"train_loss": -12.679786682128906, "global_step": 470800, "epoch": 2802} {"train_loss": -12.475288391113281, "global_step": 470801, "epoch": 2802} {"train_loss": -12.409759521484375, "global_step": 470802, "epoch": 2802} {"train_loss": -12.74756145477295, "global_step": 470803, "epoch": 2802} {"train_loss": -12.56142807006836, "global_step": 470804, "epoch": 2802} {"train_loss": -12.597929000854492, "global_step": 470805, "epoch": 2802} {"train_loss": -12.615445137023926, "global_step": 470806, "epoch": 2802} {"train_loss": -12.718281745910645, "global_step": 470807, "epoch": 2802} {"train_loss": -12.740344047546387, "global_step": 470808, "epoch": 2802} {"train_loss": -12.749753952026367, "global_step": 470809, "epoch": 2802} {"train_loss": -12.680891036987305, "global_step": 470810, "epoch": 2802} {"train_loss": -12.81397533416748, "global_step": 470811, "epoch": 2802} {"train_loss": -12.896833419799805, "global_step": 470812, "epoch": 2802} {"train_loss": -12.738779067993164, "global_step": 470813, "epoch": 2802} {"train_loss": -12.823500633239746, "global_step": 470814, "epoch": 2802} {"train_loss": -12.794833183288574, "global_step": 470815, "epoch": 2802} {"train_loss": -12.752361297607422, "global_step": 470816, "epoch": 2802} {"train_loss": -12.882568359375, "global_step": 470817, "epoch": 2802} {"train_loss": -12.768152236938477, "global_step": 470818, "epoch": 2802} {"train_loss": -12.877474784851074, "global_step": 470819, "epoch": 2802} {"train_loss": -12.655869483947754, "global_step": 470820, "epoch": 2802} {"train_loss": -12.912894248962402, "global_step": 470821, "epoch": 2802} {"train_loss": -12.950023651123047, "global_step": 470822, "epoch": 2802} {"train_loss": -12.767866134643555, "global_step": 470823, "epoch": 2802} {"train_loss": -12.938304901123047, "global_step": 470824, "epoch": 2802} {"train_loss": -12.612459182739258, "global_step": 470825, "epoch": 2802} {"train_loss": -12.716236114501953, "global_step": 470826, "epoch": 2802} {"train_loss": -12.910476684570312, "global_step": 470827, "epoch": 2802} {"train_loss": -12.969449043273926, "global_step": 470828, "epoch": 2802} {"train_loss": -12.891225814819336, "global_step": 470829, "epoch": 2802} {"train_loss": -12.775863647460938, "global_step": 470830, "epoch": 2802} {"train_loss": -12.951371192932129, "global_step": 470831, "epoch": 2802} {"train_loss": -12.882515907287598, "global_step": 470832, "epoch": 2802} {"train_loss": -13.063285827636719, "global_step": 470833, "epoch": 2802} {"train_loss": -13.113545417785645, "global_step": 470834, "epoch": 2802} {"train_loss": -12.829357147216797, "global_step": 470835, "epoch": 2802} {"train_loss": -12.779474258422852, "global_step": 470836, "epoch": 2802} {"train_loss": -12.919607162475586, "global_step": 470837, "epoch": 2802} {"train_loss": -12.792717933654785, "global_step": 470838, "epoch": 2802} {"train_loss": -12.869470596313477, "global_step": 470839, "epoch": 2802} {"train_loss": -12.83871841430664, "global_step": 470840, "epoch": 2802} {"train_loss": -12.877986907958984, "global_step": 470841, "epoch": 2802} {"train_loss": -13.043497085571289, "global_step": 470842, "epoch": 2802} {"train_loss": -13.026287078857422, "global_step": 470843, "epoch": 2802} {"train_loss": -13.114590644836426, "global_step": 470844, "epoch": 2802} {"train_loss": -12.880203247070312, "global_step": 470845, "epoch": 2802} {"train_loss": -12.989625930786133, "global_step": 470846, "epoch": 2802} {"train_loss": -13.245584487915039, "global_step": 470847, "epoch": 2802} {"train_loss": -13.033946990966797, "global_step": 470848, "epoch": 2802} {"train_loss": -13.045684814453125, "global_step": 470849, "epoch": 2802} {"train_loss": -12.985458374023438, "global_step": 470850, "epoch": 2802} {"train_loss": -12.989300727844238, "global_step": 470851, "epoch": 2802} {"train_loss": -13.065135955810547, "global_step": 470852, "epoch": 2802} {"train_loss": -13.066328048706055, "global_step": 470853, "epoch": 2802} {"train_loss": -12.955289840698242, "global_step": 470854, "epoch": 2802} {"train_loss": -12.97044563293457, "global_step": 470855, "epoch": 2802} {"train_loss": -12.892931938171387, "global_step": 470856, "epoch": 2802} {"train_loss": -12.807693481445312, "global_step": 470857, "epoch": 2802} {"train_loss": -12.940532684326172, "global_step": 470858, "epoch": 2802} {"train_loss": -12.968873977661133, "global_step": 470859, "epoch": 2802} {"train_loss": -12.295829772949219, "global_step": 470860, "epoch": 2802} {"train_loss": -12.886878967285156, "global_step": 470861, "epoch": 2802} {"train_loss": -13.070159912109375, "global_step": 470862, "epoch": 2802} {"train_loss": -12.328333854675293, "global_step": 470863, "epoch": 2802} {"train_loss": -12.51303768157959, "global_step": 470864, "epoch": 2802} {"train_loss": -12.34257698059082, "global_step": 470865, "epoch": 2802} {"train_loss": -12.621402740478516, "global_step": 470866, "epoch": 2802} {"train_loss": -12.681636810302734, "global_step": 470867, "epoch": 2802} {"train_loss": -12.312042236328125, "global_step": 470868, "epoch": 2802} {"train_loss": -11.791471481323242, "global_step": 470869, "epoch": 2802} {"train_loss": -12.320581436157227, "global_step": 470870, "epoch": 2802} {"train_loss": -11.43824291229248, "global_step": 470871, "epoch": 2802} {"train_loss": -9.666725158691406, "global_step": 470872, "epoch": 2802} {"train_loss": -10.7595853805542, "global_step": 470873, "epoch": 2802} {"train_loss": -9.504226684570312, "global_step": 470874, "epoch": 2802} {"train_loss": -11.300941467285156, "global_step": 470875, "epoch": 2802} {"train_loss": -9.653648376464844, "global_step": 470876, "epoch": 2802} {"train_loss": -11.884502410888672, "global_step": 470877, "epoch": 2802} {"train_loss": -10.042889595031738, "global_step": 470878, "epoch": 2802} {"train_loss": -10.573861122131348, "global_step": 470879, "epoch": 2802} {"train_loss": -12.106488227844238, "global_step": 470880, "epoch": 2802} {"train_loss": -10.369260787963867, "global_step": 470881, "epoch": 2802} {"train_loss": -11.623617172241211, "global_step": 470882, "epoch": 2802} {"train_loss": -11.41189956665039, "global_step": 470883, "epoch": 2802} {"train_loss": -11.082403182983398, "global_step": 470884, "epoch": 2802} {"train_loss": -11.871169090270996, "global_step": 470885, "epoch": 2802} {"train_loss": -10.365171432495117, "global_step": 470886, "epoch": 2802} {"train_loss": -10.863525390625, "global_step": 470887, "epoch": 2802} {"train_loss": -11.218194961547852, "global_step": 470888, "epoch": 2802} {"train_loss": -10.225709915161133, "global_step": 470889, "epoch": 2802} {"train_loss": -11.40898323059082, "global_step": 470890, "epoch": 2802} {"train_loss": -11.593316078186035, "global_step": 470891, "epoch": 2802} {"train_loss": -11.46030330657959, "global_step": 470892, "epoch": 2802} {"train_loss": -11.998751640319824, "global_step": 470893, "epoch": 2802} {"train_loss": -11.751327514648438, "global_step": 470894, "epoch": 2802} {"train_loss": -11.894227981567383, "global_step": 470895, "epoch": 2802} {"train_loss": -12.045490264892578, "global_step": 470896, "epoch": 2802} {"train_loss": -11.895599365234375, "global_step": 470897, "epoch": 2802} {"train_loss": -11.738058090209961, "global_step": 470898, "epoch": 2802} {"train_loss": -12.190595626831055, "global_step": 470899, "epoch": 2802} {"train_loss": -12.072164535522461, "global_step": 470900, "epoch": 2802} {"train_loss": -12.373204231262207, "global_step": 470901, "epoch": 2802} {"train_loss": -11.976325988769531, "global_step": 470902, "epoch": 2802} {"train_loss": -12.062122027079264, "global_step": 470903, "epoch": 2802, "val_loss": 313693.75} {"train_loss": -11.998641967773438, "global_step": 470904, "epoch": 2803} {"train_loss": -12.34054183959961, "global_step": 470905, "epoch": 2803} {"train_loss": -12.448108673095703, "global_step": 470906, "epoch": 2803} {"train_loss": -12.365157127380371, "global_step": 470907, "epoch": 2803} {"train_loss": -12.684549331665039, "global_step": 470908, "epoch": 2803} {"train_loss": -12.674609184265137, "global_step": 470909, "epoch": 2803} {"train_loss": -12.225301742553711, "global_step": 470910, "epoch": 2803} {"train_loss": -12.55858325958252, "global_step": 470911, "epoch": 2803} {"train_loss": -12.244422912597656, "global_step": 470912, "epoch": 2803} {"train_loss": -12.349798202514648, "global_step": 470913, "epoch": 2803} {"train_loss": -12.596348762512207, "global_step": 470914, "epoch": 2803} {"train_loss": -12.155035972595215, "global_step": 470915, "epoch": 2803} {"train_loss": -12.419981002807617, "global_step": 470916, "epoch": 2803} {"train_loss": -12.514410972595215, "global_step": 470917, "epoch": 2803} {"train_loss": -12.135786056518555, "global_step": 470918, "epoch": 2803} {"train_loss": -12.137935638427734, "global_step": 470919, "epoch": 2803} {"train_loss": -12.473148345947266, "global_step": 470920, "epoch": 2803} {"train_loss": -12.4100341796875, "global_step": 470921, "epoch": 2803} {"train_loss": -11.13037395477295, "global_step": 470922, "epoch": 2803} {"train_loss": -12.119983673095703, "global_step": 470923, "epoch": 2803} {"train_loss": -11.590205192565918, "global_step": 470924, "epoch": 2803} {"train_loss": -12.188152313232422, "global_step": 470925, "epoch": 2803} {"train_loss": -11.627727508544922, "global_step": 470926, "epoch": 2803} {"train_loss": -12.32253646850586, "global_step": 470927, "epoch": 2803} {"train_loss": -12.060628890991211, "global_step": 470928, "epoch": 2803} {"train_loss": -12.240056037902832, "global_step": 470929, "epoch": 2803} {"train_loss": -12.107828140258789, "global_step": 470930, "epoch": 2803} {"train_loss": -12.334003448486328, "global_step": 470931, "epoch": 2803} {"train_loss": -11.9469575881958, "global_step": 470932, "epoch": 2803} {"train_loss": -11.696942329406738, "global_step": 470933, "epoch": 2803} {"train_loss": -12.451702117919922, "global_step": 470934, "epoch": 2803} {"train_loss": -12.245989799499512, "global_step": 470935, "epoch": 2803} {"train_loss": -12.737974166870117, "global_step": 470936, "epoch": 2803} {"train_loss": -12.176739692687988, "global_step": 470937, "epoch": 2803} {"train_loss": -12.139358520507812, "global_step": 470938, "epoch": 2803} {"train_loss": -12.393178939819336, "global_step": 470939, "epoch": 2803} {"train_loss": -11.9199857711792, "global_step": 470940, "epoch": 2803} {"train_loss": -12.200835227966309, "global_step": 470941, "epoch": 2803} {"train_loss": -12.477546691894531, "global_step": 470942, "epoch": 2803} {"train_loss": -11.99146556854248, "global_step": 470943, "epoch": 2803} {"train_loss": -11.601324081420898, "global_step": 470944, "epoch": 2803} {"train_loss": -12.162534713745117, "global_step": 470945, "epoch": 2803} {"train_loss": -12.222942352294922, "global_step": 470946, "epoch": 2803} {"train_loss": -12.173797607421875, "global_step": 470947, "epoch": 2803} {"train_loss": -12.387660026550293, "global_step": 470948, "epoch": 2803} {"train_loss": -12.206222534179688, "global_step": 470949, "epoch": 2803} {"train_loss": -11.913984298706055, "global_step": 470950, "epoch": 2803} {"train_loss": -12.405765533447266, "global_step": 470951, "epoch": 2803} {"train_loss": -12.394390106201172, "global_step": 470952, "epoch": 2803} {"train_loss": -12.240736961364746, "global_step": 470953, "epoch": 2803} {"train_loss": -12.031832695007324, "global_step": 470954, "epoch": 2803} {"train_loss": -12.563390731811523, "global_step": 470955, "epoch": 2803} {"train_loss": -12.747407913208008, "global_step": 470956, "epoch": 2803} {"train_loss": -11.88247299194336, "global_step": 470957, "epoch": 2803} {"train_loss": -12.190759658813477, "global_step": 470958, "epoch": 2803} {"train_loss": -12.76711654663086, "global_step": 470959, "epoch": 2803} {"train_loss": -12.383567810058594, "global_step": 470960, "epoch": 2803} {"train_loss": -12.258979797363281, "global_step": 470961, "epoch": 2803} {"train_loss": -12.555135726928711, "global_step": 470962, "epoch": 2803} {"train_loss": -12.356705665588379, "global_step": 470963, "epoch": 2803} {"train_loss": -11.951632499694824, "global_step": 470964, "epoch": 2803} {"train_loss": -12.778356552124023, "global_step": 470965, "epoch": 2803} {"train_loss": -12.190327644348145, "global_step": 470966, "epoch": 2803} {"train_loss": -12.625171661376953, "global_step": 470967, "epoch": 2803} {"train_loss": -12.453450202941895, "global_step": 470968, "epoch": 2803} {"train_loss": -12.418577194213867, "global_step": 470969, "epoch": 2803} {"train_loss": -12.50776195526123, "global_step": 470970, "epoch": 2803} {"train_loss": -12.418733596801758, "global_step": 470971, "epoch": 2803} {"train_loss": -12.073822975158691, "global_step": 470972, "epoch": 2803} {"train_loss": -12.303997039794922, "global_step": 470973, "epoch": 2803} {"train_loss": -12.866744041442871, "global_step": 470974, "epoch": 2803} {"train_loss": -12.293865203857422, "global_step": 470975, "epoch": 2803} {"train_loss": -11.983400344848633, "global_step": 470976, "epoch": 2803} {"train_loss": -12.588078498840332, "global_step": 470977, "epoch": 2803} {"train_loss": -12.429340362548828, "global_step": 470978, "epoch": 2803} {"train_loss": -11.280552864074707, "global_step": 470979, "epoch": 2803} {"train_loss": -12.662605285644531, "global_step": 470980, "epoch": 2803} {"train_loss": -12.448714256286621, "global_step": 470981, "epoch": 2803} {"train_loss": -11.39024829864502, "global_step": 470982, "epoch": 2803} {"train_loss": -11.392141342163086, "global_step": 470983, "epoch": 2803} {"train_loss": -12.19490909576416, "global_step": 470984, "epoch": 2803} {"train_loss": -10.412517547607422, "global_step": 470985, "epoch": 2803} {"train_loss": -11.884748458862305, "global_step": 470986, "epoch": 2803} {"train_loss": -12.09646987915039, "global_step": 470987, "epoch": 2803} {"train_loss": -11.706077575683594, "global_step": 470988, "epoch": 2803} {"train_loss": -11.44751262664795, "global_step": 470989, "epoch": 2803} {"train_loss": -11.191262245178223, "global_step": 470990, "epoch": 2803} {"train_loss": -11.472233772277832, "global_step": 470991, "epoch": 2803} {"train_loss": -12.134319305419922, "global_step": 470992, "epoch": 2803} {"train_loss": -10.686126708984375, "global_step": 470993, "epoch": 2803} {"train_loss": -12.392610549926758, "global_step": 470994, "epoch": 2803} {"train_loss": -10.66369915008545, "global_step": 470995, "epoch": 2803} {"train_loss": -12.483051300048828, "global_step": 470996, "epoch": 2803} {"train_loss": -11.677191734313965, "global_step": 470997, "epoch": 2803} {"train_loss": -11.87997817993164, "global_step": 470998, "epoch": 2803} {"train_loss": -11.765556335449219, "global_step": 470999, "epoch": 2803} {"train_loss": -11.449438095092773, "global_step": 471000, "epoch": 2803} {"train_loss": -12.367115020751953, "global_step": 471001, "epoch": 2803} {"train_loss": -11.941534042358398, "global_step": 471002, "epoch": 2803} {"train_loss": -11.944347381591797, "global_step": 471003, "epoch": 2803} {"train_loss": -12.530512809753418, "global_step": 471004, "epoch": 2803} {"train_loss": -11.918245315551758, "global_step": 471005, "epoch": 2803} {"train_loss": -12.263385772705078, "global_step": 471006, "epoch": 2803} {"train_loss": -12.199235916137695, "global_step": 471007, "epoch": 2803} {"train_loss": -11.860816955566406, "global_step": 471008, "epoch": 2803} {"train_loss": -12.592254638671875, "global_step": 471009, "epoch": 2803} {"train_loss": -12.140436172485352, "global_step": 471010, "epoch": 2803} {"train_loss": -12.652416229248047, "global_step": 471011, "epoch": 2803} {"train_loss": -12.12009048461914, "global_step": 471012, "epoch": 2803} {"train_loss": -12.161968231201172, "global_step": 471013, "epoch": 2803} {"train_loss": -12.429941177368164, "global_step": 471014, "epoch": 2803} {"train_loss": -11.661234855651855, "global_step": 471015, "epoch": 2803} {"train_loss": -11.810501098632812, "global_step": 471016, "epoch": 2803} {"train_loss": -12.32042121887207, "global_step": 471017, "epoch": 2803} {"train_loss": -11.814908981323242, "global_step": 471018, "epoch": 2803} {"train_loss": -12.454639434814453, "global_step": 471019, "epoch": 2803} {"train_loss": -12.153314590454102, "global_step": 471020, "epoch": 2803} {"train_loss": -12.576884269714355, "global_step": 471021, "epoch": 2803} {"train_loss": -12.274580001831055, "global_step": 471022, "epoch": 2803} {"train_loss": -12.050673484802246, "global_step": 471023, "epoch": 2803} {"train_loss": -12.623241424560547, "global_step": 471024, "epoch": 2803} {"train_loss": -11.727069854736328, "global_step": 471025, "epoch": 2803} {"train_loss": -12.65445327758789, "global_step": 471026, "epoch": 2803} {"train_loss": -12.138782501220703, "global_step": 471027, "epoch": 2803} {"train_loss": -12.129287719726562, "global_step": 471028, "epoch": 2803} {"train_loss": -12.437698364257812, "global_step": 471029, "epoch": 2803} {"train_loss": -12.181529998779297, "global_step": 471030, "epoch": 2803} {"train_loss": -12.148775100708008, "global_step": 471031, "epoch": 2803} {"train_loss": -12.645116806030273, "global_step": 471032, "epoch": 2803} {"train_loss": -12.467918395996094, "global_step": 471033, "epoch": 2803} {"train_loss": -12.293987274169922, "global_step": 471034, "epoch": 2803} {"train_loss": -12.387690544128418, "global_step": 471035, "epoch": 2803} {"train_loss": -12.175821304321289, "global_step": 471036, "epoch": 2803} {"train_loss": -12.529949188232422, "global_step": 471037, "epoch": 2803} {"train_loss": -12.167354583740234, "global_step": 471038, "epoch": 2803} {"train_loss": -12.843597412109375, "global_step": 471039, "epoch": 2803} {"train_loss": -12.514062881469727, "global_step": 471040, "epoch": 2803} {"train_loss": -12.534059524536133, "global_step": 471041, "epoch": 2803} {"train_loss": -12.44039249420166, "global_step": 471042, "epoch": 2803} {"train_loss": -12.655671119689941, "global_step": 471043, "epoch": 2803} {"train_loss": -12.569758415222168, "global_step": 471044, "epoch": 2803} {"train_loss": -12.526420593261719, "global_step": 471045, "epoch": 2803} {"train_loss": -12.632583618164062, "global_step": 471046, "epoch": 2803} {"train_loss": -12.4384765625, "global_step": 471047, "epoch": 2803} {"train_loss": -12.245355606079102, "global_step": 471048, "epoch": 2803} {"train_loss": -12.477397918701172, "global_step": 471049, "epoch": 2803} {"train_loss": -12.639638900756836, "global_step": 471050, "epoch": 2803} {"train_loss": -12.530975341796875, "global_step": 471051, "epoch": 2803} {"train_loss": -12.658735275268555, "global_step": 471052, "epoch": 2803} {"train_loss": -12.717785835266113, "global_step": 471053, "epoch": 2803} {"train_loss": -12.666336059570312, "global_step": 471054, "epoch": 2803} {"train_loss": -12.606367111206055, "global_step": 471055, "epoch": 2803} {"train_loss": -12.608404159545898, "global_step": 471056, "epoch": 2803} {"train_loss": -12.682918548583984, "global_step": 471057, "epoch": 2803} {"train_loss": -12.917845726013184, "global_step": 471058, "epoch": 2803} {"train_loss": -12.685628890991211, "global_step": 471059, "epoch": 2803} {"train_loss": -12.753242492675781, "global_step": 471060, "epoch": 2803} {"train_loss": -12.506464004516602, "global_step": 471061, "epoch": 2803} {"train_loss": -12.647990226745605, "global_step": 471062, "epoch": 2803} {"train_loss": -12.844564437866211, "global_step": 471063, "epoch": 2803} {"train_loss": -12.703285217285156, "global_step": 471064, "epoch": 2803} {"train_loss": -12.644219398498535, "global_step": 471065, "epoch": 2803} {"train_loss": -12.774263381958008, "global_step": 471066, "epoch": 2803} {"train_loss": -12.35179328918457, "global_step": 471067, "epoch": 2803} {"train_loss": -12.637338638305664, "global_step": 471068, "epoch": 2803} {"train_loss": -12.560678482055664, "global_step": 471069, "epoch": 2803} {"train_loss": -12.70987319946289, "global_step": 471070, "epoch": 2803} {"train_loss": -12.251358656656175, "global_step": 471071, "epoch": 2803, "val_loss": 318734.6875} {"train_loss": -12.860715866088867, "global_step": 471072, "epoch": 2804} {"train_loss": -12.668209075927734, "global_step": 471073, "epoch": 2804} {"train_loss": -12.909828186035156, "global_step": 471074, "epoch": 2804} {"train_loss": -12.875899314880371, "global_step": 471075, "epoch": 2804} {"train_loss": -12.720203399658203, "global_step": 471076, "epoch": 2804} {"train_loss": -12.509565353393555, "global_step": 471077, "epoch": 2804} {"train_loss": -12.563798904418945, "global_step": 471078, "epoch": 2804} {"train_loss": -12.550707817077637, "global_step": 471079, "epoch": 2804} {"train_loss": -12.784013748168945, "global_step": 471080, "epoch": 2804} {"train_loss": -12.669918060302734, "global_step": 471081, "epoch": 2804} {"train_loss": -12.616474151611328, "global_step": 471082, "epoch": 2804} {"train_loss": -12.353086471557617, "global_step": 471083, "epoch": 2804} {"train_loss": -12.619619369506836, "global_step": 471084, "epoch": 2804} {"train_loss": -12.488401412963867, "global_step": 471085, "epoch": 2804} {"train_loss": -12.24496078491211, "global_step": 471086, "epoch": 2804} {"train_loss": -12.637535095214844, "global_step": 471087, "epoch": 2804} {"train_loss": -12.601993560791016, "global_step": 471088, "epoch": 2804} {"train_loss": -12.70651912689209, "global_step": 471089, "epoch": 2804} {"train_loss": -12.891167640686035, "global_step": 471090, "epoch": 2804} {"train_loss": -12.345020294189453, "global_step": 471091, "epoch": 2804} {"train_loss": -12.643571853637695, "global_step": 471092, "epoch": 2804} {"train_loss": -12.172868728637695, "global_step": 471093, "epoch": 2804} {"train_loss": -12.667903900146484, "global_step": 471094, "epoch": 2804} {"train_loss": -12.81317138671875, "global_step": 471095, "epoch": 2804} {"train_loss": -12.383193969726562, "global_step": 471096, "epoch": 2804} {"train_loss": -12.594156265258789, "global_step": 471097, "epoch": 2804} {"train_loss": -11.760754585266113, "global_step": 471098, "epoch": 2804} {"train_loss": -12.327367782592773, "global_step": 471099, "epoch": 2804} {"train_loss": -12.708805084228516, "global_step": 471100, "epoch": 2804} {"train_loss": -12.38525104522705, "global_step": 471101, "epoch": 2804} {"train_loss": -12.839765548706055, "global_step": 471102, "epoch": 2804} {"train_loss": -11.608036041259766, "global_step": 471103, "epoch": 2804} {"train_loss": -12.913644790649414, "global_step": 471104, "epoch": 2804} {"train_loss": -11.954676628112793, "global_step": 471105, "epoch": 2804} {"train_loss": -12.286540985107422, "global_step": 471106, "epoch": 2804} {"train_loss": -12.66132926940918, "global_step": 471107, "epoch": 2804} {"train_loss": -11.977677345275879, "global_step": 471108, "epoch": 2804} {"train_loss": -12.414031982421875, "global_step": 471109, "epoch": 2804} {"train_loss": -12.356863021850586, "global_step": 471110, "epoch": 2804} {"train_loss": -12.130334854125977, "global_step": 471111, "epoch": 2804} {"train_loss": -11.836099624633789, "global_step": 471112, "epoch": 2804} {"train_loss": -10.350686073303223, "global_step": 471113, "epoch": 2804} {"train_loss": -10.849284172058105, "global_step": 471114, "epoch": 2804} {"train_loss": -12.369976043701172, "global_step": 471115, "epoch": 2804} {"train_loss": -10.097528457641602, "global_step": 471116, "epoch": 2804} {"train_loss": -10.834049224853516, "global_step": 471117, "epoch": 2804} {"train_loss": -10.498369216918945, "global_step": 471118, "epoch": 2804} {"train_loss": -11.287232398986816, "global_step": 471119, "epoch": 2804} {"train_loss": -10.592397689819336, "global_step": 471120, "epoch": 2804} {"train_loss": -11.512264251708984, "global_step": 471121, "epoch": 2804} {"train_loss": -10.723138809204102, "global_step": 471122, "epoch": 2804} {"train_loss": -10.723077774047852, "global_step": 471123, "epoch": 2804} {"train_loss": -10.620752334594727, "global_step": 471124, "epoch": 2804} {"train_loss": -10.16425895690918, "global_step": 471125, "epoch": 2804} {"train_loss": -11.728866577148438, "global_step": 471126, "epoch": 2804} {"train_loss": -9.722314834594727, "global_step": 471127, "epoch": 2804} {"train_loss": -11.43838882446289, "global_step": 471128, "epoch": 2804} {"train_loss": -11.263916969299316, "global_step": 471129, "epoch": 2804} {"train_loss": -11.066984176635742, "global_step": 471130, "epoch": 2804} {"train_loss": -11.766382217407227, "global_step": 471131, "epoch": 2804} {"train_loss": -10.330543518066406, "global_step": 471132, "epoch": 2804} {"train_loss": -12.093684196472168, "global_step": 471133, "epoch": 2804} {"train_loss": -11.026219367980957, "global_step": 471134, "epoch": 2804} {"train_loss": -11.353458404541016, "global_step": 471135, "epoch": 2804} {"train_loss": -11.06875228881836, "global_step": 471136, "epoch": 2804} {"train_loss": -9.761195182800293, "global_step": 471137, "epoch": 2804} {"train_loss": -10.201231956481934, "global_step": 471138, "epoch": 2804} {"train_loss": -11.862313270568848, "global_step": 471139, "epoch": 2804} {"train_loss": -11.05028247833252, "global_step": 471140, "epoch": 2804} {"train_loss": -10.355451583862305, "global_step": 471141, "epoch": 2804} {"train_loss": -11.893379211425781, "global_step": 471142, "epoch": 2804} {"train_loss": -10.592950820922852, "global_step": 471143, "epoch": 2804} {"train_loss": -11.10747241973877, "global_step": 471144, "epoch": 2804} {"train_loss": -11.472654342651367, "global_step": 471145, "epoch": 2804} {"train_loss": -11.639880180358887, "global_step": 471146, "epoch": 2804} {"train_loss": -11.899874687194824, "global_step": 471147, "epoch": 2804} {"train_loss": -12.1210355758667, "global_step": 471148, "epoch": 2804} {"train_loss": -11.422381401062012, "global_step": 471149, "epoch": 2804} {"train_loss": -11.982097625732422, "global_step": 471150, "epoch": 2804} {"train_loss": -11.764209747314453, "global_step": 471151, "epoch": 2804} {"train_loss": -11.400411605834961, "global_step": 471152, "epoch": 2804} {"train_loss": -12.091184616088867, "global_step": 471153, "epoch": 2804} {"train_loss": -11.698410034179688, "global_step": 471154, "epoch": 2804} {"train_loss": -11.884866714477539, "global_step": 471155, "epoch": 2804} {"train_loss": -12.0860595703125, "global_step": 471156, "epoch": 2804} {"train_loss": -11.644309043884277, "global_step": 471157, "epoch": 2804} {"train_loss": -12.359926223754883, "global_step": 471158, "epoch": 2804} {"train_loss": -11.668241500854492, "global_step": 471159, "epoch": 2804} {"train_loss": -12.193994522094727, "global_step": 471160, "epoch": 2804} {"train_loss": -12.209710121154785, "global_step": 471161, "epoch": 2804} {"train_loss": -12.026063919067383, "global_step": 471162, "epoch": 2804} {"train_loss": -12.299683570861816, "global_step": 471163, "epoch": 2804} {"train_loss": -11.959346771240234, "global_step": 471164, "epoch": 2804} {"train_loss": -12.155677795410156, "global_step": 471165, "epoch": 2804} {"train_loss": -12.121319770812988, "global_step": 471166, "epoch": 2804} {"train_loss": -11.890275955200195, "global_step": 471167, "epoch": 2804} {"train_loss": -12.574564933776855, "global_step": 471168, "epoch": 2804} {"train_loss": -12.198158264160156, "global_step": 471169, "epoch": 2804} {"train_loss": -11.885515213012695, "global_step": 471170, "epoch": 2804} {"train_loss": -12.36600399017334, "global_step": 471171, "epoch": 2804} {"train_loss": -12.098579406738281, "global_step": 471172, "epoch": 2804} {"train_loss": -12.300050735473633, "global_step": 471173, "epoch": 2804} {"train_loss": -11.731324195861816, "global_step": 471174, "epoch": 2804} {"train_loss": -11.964391708374023, "global_step": 471175, "epoch": 2804} {"train_loss": -11.516398429870605, "global_step": 471176, "epoch": 2804} {"train_loss": -12.223944664001465, "global_step": 471177, "epoch": 2804} {"train_loss": -12.1636962890625, "global_step": 471178, "epoch": 2804} {"train_loss": -12.163640975952148, "global_step": 471179, "epoch": 2804} {"train_loss": -12.13375473022461, "global_step": 471180, "epoch": 2804} {"train_loss": -11.563820838928223, "global_step": 471181, "epoch": 2804} {"train_loss": -12.067634582519531, "global_step": 471182, "epoch": 2804} {"train_loss": -11.784765243530273, "global_step": 471183, "epoch": 2804} {"train_loss": -11.88235855102539, "global_step": 471184, "epoch": 2804} {"train_loss": -11.936528205871582, "global_step": 471185, "epoch": 2804} {"train_loss": -11.806766510009766, "global_step": 471186, "epoch": 2804} {"train_loss": -11.904632568359375, "global_step": 471187, "epoch": 2804} {"train_loss": -12.38357162475586, "global_step": 471188, "epoch": 2804} {"train_loss": -12.110921859741211, "global_step": 471189, "epoch": 2804} {"train_loss": -12.221429824829102, "global_step": 471190, "epoch": 2804} {"train_loss": -12.159880638122559, "global_step": 471191, "epoch": 2804} {"train_loss": -12.153486251831055, "global_step": 471192, "epoch": 2804} {"train_loss": -12.164456367492676, "global_step": 471193, "epoch": 2804} {"train_loss": -11.818925857543945, "global_step": 471194, "epoch": 2804} {"train_loss": -12.622173309326172, "global_step": 471195, "epoch": 2804} {"train_loss": -12.125011444091797, "global_step": 471196, "epoch": 2804} {"train_loss": -12.561939239501953, "global_step": 471197, "epoch": 2804} {"train_loss": -12.02499008178711, "global_step": 471198, "epoch": 2804} {"train_loss": -12.35750961303711, "global_step": 471199, "epoch": 2804} {"train_loss": -12.070760726928711, "global_step": 471200, "epoch": 2804} {"train_loss": -12.081754684448242, "global_step": 471201, "epoch": 2804} {"train_loss": -12.300532341003418, "global_step": 471202, "epoch": 2804} {"train_loss": -12.072212219238281, "global_step": 471203, "epoch": 2804} {"train_loss": -12.568130493164062, "global_step": 471204, "epoch": 2804} {"train_loss": -12.393730163574219, "global_step": 471205, "epoch": 2804} {"train_loss": -12.577021598815918, "global_step": 471206, "epoch": 2804} {"train_loss": -12.66482925415039, "global_step": 471207, "epoch": 2804} {"train_loss": -12.491312026977539, "global_step": 471208, "epoch": 2804} {"train_loss": -12.444931983947754, "global_step": 471209, "epoch": 2804} {"train_loss": -12.489830017089844, "global_step": 471210, "epoch": 2804} {"train_loss": -12.365917205810547, "global_step": 471211, "epoch": 2804} {"train_loss": -12.566169738769531, "global_step": 471212, "epoch": 2804} {"train_loss": -12.666106224060059, "global_step": 471213, "epoch": 2804} {"train_loss": -12.764616012573242, "global_step": 471214, "epoch": 2804} {"train_loss": -12.56793212890625, "global_step": 471215, "epoch": 2804} {"train_loss": -12.616250991821289, "global_step": 471216, "epoch": 2804} {"train_loss": -12.709283828735352, "global_step": 471217, "epoch": 2804} {"train_loss": -12.608556747436523, "global_step": 471218, "epoch": 2804} {"train_loss": -12.507414817810059, "global_step": 471219, "epoch": 2804} {"train_loss": -12.388880729675293, "global_step": 471220, "epoch": 2804} {"train_loss": -12.549097061157227, "global_step": 471221, "epoch": 2804} {"train_loss": -12.795217514038086, "global_step": 471222, "epoch": 2804} {"train_loss": -12.78378677368164, "global_step": 471223, "epoch": 2804} {"train_loss": -12.89457893371582, "global_step": 471224, "epoch": 2804} {"train_loss": -12.604609489440918, "global_step": 471225, "epoch": 2804} {"train_loss": -12.60488510131836, "global_step": 471226, "epoch": 2804} {"train_loss": -12.804023742675781, "global_step": 471227, "epoch": 2804} {"train_loss": -12.947320938110352, "global_step": 471228, "epoch": 2804} {"train_loss": -12.485158920288086, "global_step": 471229, "epoch": 2804} {"train_loss": -12.7302885055542, "global_step": 471230, "epoch": 2804} {"train_loss": -12.665704727172852, "global_step": 471231, "epoch": 2804} {"train_loss": -12.519047737121582, "global_step": 471232, "epoch": 2804} {"train_loss": -12.645298957824707, "global_step": 471233, "epoch": 2804} {"train_loss": -12.682710647583008, "global_step": 471234, "epoch": 2804} {"train_loss": -12.860029220581055, "global_step": 471235, "epoch": 2804} {"train_loss": -12.746329307556152, "global_step": 471236, "epoch": 2804} {"train_loss": -12.753194808959961, "global_step": 471237, "epoch": 2804} {"train_loss": -12.802112579345703, "global_step": 471238, "epoch": 2804} {"train_loss": -12.062858513423375, "global_step": 471239, "epoch": 2804, "val_loss": 318600.71875} {"train_loss": -12.913528442382812, "global_step": 471240, "epoch": 2805} {"train_loss": -12.592029571533203, "global_step": 471241, "epoch": 2805} {"train_loss": -12.53807544708252, "global_step": 471242, "epoch": 2805} {"train_loss": -12.866009712219238, "global_step": 471243, "epoch": 2805} {"train_loss": -12.498640060424805, "global_step": 471244, "epoch": 2805} {"train_loss": -12.897247314453125, "global_step": 471245, "epoch": 2805} {"train_loss": -12.302386283874512, "global_step": 471246, "epoch": 2805} {"train_loss": -12.231374740600586, "global_step": 471247, "epoch": 2805} {"train_loss": -12.852614402770996, "global_step": 471248, "epoch": 2805} {"train_loss": -12.157331466674805, "global_step": 471249, "epoch": 2805} {"train_loss": -12.333246231079102, "global_step": 471250, "epoch": 2805} {"train_loss": -12.445167541503906, "global_step": 471251, "epoch": 2805} {"train_loss": -11.242890357971191, "global_step": 471252, "epoch": 2805} {"train_loss": -12.325176239013672, "global_step": 471253, "epoch": 2805} {"train_loss": -11.863384246826172, "global_step": 471254, "epoch": 2805} {"train_loss": -12.238205909729004, "global_step": 471255, "epoch": 2805} {"train_loss": -12.80235481262207, "global_step": 471256, "epoch": 2805} {"train_loss": -12.346870422363281, "global_step": 471257, "epoch": 2805} {"train_loss": -12.913763046264648, "global_step": 471258, "epoch": 2805} {"train_loss": -12.195823669433594, "global_step": 471259, "epoch": 2805} {"train_loss": -12.48056411743164, "global_step": 471260, "epoch": 2805} {"train_loss": -12.925996780395508, "global_step": 471261, "epoch": 2805} {"train_loss": -12.66225814819336, "global_step": 471262, "epoch": 2805} {"train_loss": -12.434942245483398, "global_step": 471263, "epoch": 2805} {"train_loss": -12.66989803314209, "global_step": 471264, "epoch": 2805} {"train_loss": -12.002734184265137, "global_step": 471265, "epoch": 2805} {"train_loss": -12.494598388671875, "global_step": 471266, "epoch": 2805} {"train_loss": -12.594523429870605, "global_step": 471267, "epoch": 2805} {"train_loss": -12.674470901489258, "global_step": 471268, "epoch": 2805} {"train_loss": -12.471553802490234, "global_step": 471269, "epoch": 2805} {"train_loss": -12.253437042236328, "global_step": 471270, "epoch": 2805} {"train_loss": -12.348640441894531, "global_step": 471271, "epoch": 2805} {"train_loss": -12.72005844116211, "global_step": 471272, "epoch": 2805} {"train_loss": -12.555401802062988, "global_step": 471273, "epoch": 2805} {"train_loss": -12.509943962097168, "global_step": 471274, "epoch": 2805} {"train_loss": -12.474119186401367, "global_step": 471275, "epoch": 2805} {"train_loss": -12.866039276123047, "global_step": 471276, "epoch": 2805} {"train_loss": -12.452320098876953, "global_step": 471277, "epoch": 2805} {"train_loss": -12.636189460754395, "global_step": 471278, "epoch": 2805} {"train_loss": -12.306381225585938, "global_step": 471279, "epoch": 2805} {"train_loss": -12.385699272155762, "global_step": 471280, "epoch": 2805} {"train_loss": -12.694252014160156, "global_step": 471281, "epoch": 2805} {"train_loss": -12.245908737182617, "global_step": 471282, "epoch": 2805} {"train_loss": -12.603484153747559, "global_step": 471283, "epoch": 2805} {"train_loss": -12.371545791625977, "global_step": 471284, "epoch": 2805} {"train_loss": -10.811661720275879, "global_step": 471285, "epoch": 2805} {"train_loss": -11.894426345825195, "global_step": 471286, "epoch": 2805} {"train_loss": -11.76552963256836, "global_step": 471287, "epoch": 2805} {"train_loss": -10.761908531188965, "global_step": 471288, "epoch": 2805} {"train_loss": -11.174086570739746, "global_step": 471289, "epoch": 2805} {"train_loss": -10.161784172058105, "global_step": 471290, "epoch": 2805} {"train_loss": -11.334688186645508, "global_step": 471291, "epoch": 2805} {"train_loss": -10.357585906982422, "global_step": 471292, "epoch": 2805} {"train_loss": -11.909500122070312, "global_step": 471293, "epoch": 2805} {"train_loss": -10.602699279785156, "global_step": 471294, "epoch": 2805} {"train_loss": -11.735862731933594, "global_step": 471295, "epoch": 2805} {"train_loss": -11.599739074707031, "global_step": 471296, "epoch": 2805} {"train_loss": -10.863724708557129, "global_step": 471297, "epoch": 2805} {"train_loss": -12.086591720581055, "global_step": 471298, "epoch": 2805} {"train_loss": -10.887866973876953, "global_step": 471299, "epoch": 2805} {"train_loss": -11.80398178100586, "global_step": 471300, "epoch": 2805} {"train_loss": -11.398458480834961, "global_step": 471301, "epoch": 2805} {"train_loss": -11.322376251220703, "global_step": 471302, "epoch": 2805} {"train_loss": -11.703617095947266, "global_step": 471303, "epoch": 2805} {"train_loss": -9.981578826904297, "global_step": 471304, "epoch": 2805} {"train_loss": -11.475395202636719, "global_step": 471305, "epoch": 2805} {"train_loss": -10.780729293823242, "global_step": 471306, "epoch": 2805} {"train_loss": -11.247190475463867, "global_step": 471307, "epoch": 2805} {"train_loss": -10.992758750915527, "global_step": 471308, "epoch": 2805} {"train_loss": -11.550544738769531, "global_step": 471309, "epoch": 2805} {"train_loss": -11.831380844116211, "global_step": 471310, "epoch": 2805} {"train_loss": -11.005471229553223, "global_step": 471311, "epoch": 2805} {"train_loss": -11.81583023071289, "global_step": 471312, "epoch": 2805} {"train_loss": -12.478564262390137, "global_step": 471313, "epoch": 2805} {"train_loss": -11.836230278015137, "global_step": 471314, "epoch": 2805} {"train_loss": -12.577930450439453, "global_step": 471315, "epoch": 2805} {"train_loss": -12.393268585205078, "global_step": 471316, "epoch": 2805} {"train_loss": -12.596232414245605, "global_step": 471317, "epoch": 2805} {"train_loss": -12.360052108764648, "global_step": 471318, "epoch": 2805} {"train_loss": -12.442975997924805, "global_step": 471319, "epoch": 2805} {"train_loss": -12.489399909973145, "global_step": 471320, "epoch": 2805} {"train_loss": -12.381454467773438, "global_step": 471321, "epoch": 2805} {"train_loss": -12.4339017868042, "global_step": 471322, "epoch": 2805} {"train_loss": -12.157732009887695, "global_step": 471323, "epoch": 2805} {"train_loss": -12.38887882232666, "global_step": 471324, "epoch": 2805} {"train_loss": -12.510086059570312, "global_step": 471325, "epoch": 2805} {"train_loss": -12.526531219482422, "global_step": 471326, "epoch": 2805} {"train_loss": -12.403164863586426, "global_step": 471327, "epoch": 2805} {"train_loss": -12.71045970916748, "global_step": 471328, "epoch": 2805} {"train_loss": -12.495647430419922, "global_step": 471329, "epoch": 2805} {"train_loss": -12.583491325378418, "global_step": 471330, "epoch": 2805} {"train_loss": -12.585210800170898, "global_step": 471331, "epoch": 2805} {"train_loss": -12.682412147521973, "global_step": 471332, "epoch": 2805} {"train_loss": -12.794541358947754, "global_step": 471333, "epoch": 2805} {"train_loss": -12.594277381896973, "global_step": 471334, "epoch": 2805} {"train_loss": -12.691518783569336, "global_step": 471335, "epoch": 2805} {"train_loss": -12.780977249145508, "global_step": 471336, "epoch": 2805} {"train_loss": -12.411340713500977, "global_step": 471337, "epoch": 2805} {"train_loss": -12.593218803405762, "global_step": 471338, "epoch": 2805} {"train_loss": -12.44355583190918, "global_step": 471339, "epoch": 2805} {"train_loss": -12.821690559387207, "global_step": 471340, "epoch": 2805} {"train_loss": -12.676312446594238, "global_step": 471341, "epoch": 2805} {"train_loss": -12.676746368408203, "global_step": 471342, "epoch": 2805} {"train_loss": -12.730077743530273, "global_step": 471343, "epoch": 2805} {"train_loss": -12.401531219482422, "global_step": 471344, "epoch": 2805} {"train_loss": -12.647104263305664, "global_step": 471345, "epoch": 2805} {"train_loss": -12.538839340209961, "global_step": 471346, "epoch": 2805} {"train_loss": -12.67851734161377, "global_step": 471347, "epoch": 2805} {"train_loss": -12.581634521484375, "global_step": 471348, "epoch": 2805} {"train_loss": -12.864119529724121, "global_step": 471349, "epoch": 2805} {"train_loss": -12.876932144165039, "global_step": 471350, "epoch": 2805} {"train_loss": -12.700031280517578, "global_step": 471351, "epoch": 2805} {"train_loss": -12.748077392578125, "global_step": 471352, "epoch": 2805} {"train_loss": -12.465161323547363, "global_step": 471353, "epoch": 2805} {"train_loss": -12.325695037841797, "global_step": 471354, "epoch": 2805} {"train_loss": -12.427408218383789, "global_step": 471355, "epoch": 2805} {"train_loss": -12.690338134765625, "global_step": 471356, "epoch": 2805} {"train_loss": -12.942903518676758, "global_step": 471357, "epoch": 2805} {"train_loss": -12.467538833618164, "global_step": 471358, "epoch": 2805} {"train_loss": -12.612532615661621, "global_step": 471359, "epoch": 2805} {"train_loss": -12.42708969116211, "global_step": 471360, "epoch": 2805} {"train_loss": -12.69253158569336, "global_step": 471361, "epoch": 2805} {"train_loss": -12.318241119384766, "global_step": 471362, "epoch": 2805} {"train_loss": -12.049690246582031, "global_step": 471363, "epoch": 2805} {"train_loss": -12.43769645690918, "global_step": 471364, "epoch": 2805} {"train_loss": -12.494226455688477, "global_step": 471365, "epoch": 2805} {"train_loss": -12.073546409606934, "global_step": 471366, "epoch": 2805} {"train_loss": -11.946627616882324, "global_step": 471367, "epoch": 2805} {"train_loss": -12.623785018920898, "global_step": 471368, "epoch": 2805} {"train_loss": -12.669733047485352, "global_step": 471369, "epoch": 2805} {"train_loss": -12.381800651550293, "global_step": 471370, "epoch": 2805} {"train_loss": -12.71566104888916, "global_step": 471371, "epoch": 2805} {"train_loss": -12.807555198669434, "global_step": 471372, "epoch": 2805} {"train_loss": -12.503942489624023, "global_step": 471373, "epoch": 2805} {"train_loss": -12.278057098388672, "global_step": 471374, "epoch": 2805} {"train_loss": -12.323417663574219, "global_step": 471375, "epoch": 2805} {"train_loss": -12.27063274383545, "global_step": 471376, "epoch": 2805} {"train_loss": -12.15738296508789, "global_step": 471377, "epoch": 2805} {"train_loss": -12.746753692626953, "global_step": 471378, "epoch": 2805} {"train_loss": -12.26428508758545, "global_step": 471379, "epoch": 2805} {"train_loss": -12.769207000732422, "global_step": 471380, "epoch": 2805} {"train_loss": -11.764008522033691, "global_step": 471381, "epoch": 2805} {"train_loss": -12.281628608703613, "global_step": 471382, "epoch": 2805} {"train_loss": -12.502496719360352, "global_step": 471383, "epoch": 2805} {"train_loss": -12.139228820800781, "global_step": 471384, "epoch": 2805} {"train_loss": -12.447593688964844, "global_step": 471385, "epoch": 2805} {"train_loss": -11.241809844970703, "global_step": 471386, "epoch": 2805} {"train_loss": -12.231847763061523, "global_step": 471387, "epoch": 2805} {"train_loss": -11.582845687866211, "global_step": 471388, "epoch": 2805} {"train_loss": -11.801641464233398, "global_step": 471389, "epoch": 2805} {"train_loss": -9.048044204711914, "global_step": 471390, "epoch": 2805} {"train_loss": -11.707164764404297, "global_step": 471391, "epoch": 2805} {"train_loss": -8.957571983337402, "global_step": 471392, "epoch": 2805} {"train_loss": -10.52529525756836, "global_step": 471393, "epoch": 2805} {"train_loss": -9.9257173538208, "global_step": 471394, "epoch": 2805} {"train_loss": -9.83411979675293, "global_step": 471395, "epoch": 2805} {"train_loss": -9.983007431030273, "global_step": 471396, "epoch": 2805} {"train_loss": -9.169183731079102, "global_step": 471397, "epoch": 2805} {"train_loss": -9.323802947998047, "global_step": 471398, "epoch": 2805} {"train_loss": -9.383867263793945, "global_step": 471399, "epoch": 2805} {"train_loss": -11.113670349121094, "global_step": 471400, "epoch": 2805} {"train_loss": -10.961284637451172, "global_step": 471401, "epoch": 2805} {"train_loss": -8.371969223022461, "global_step": 471402, "epoch": 2805} {"train_loss": -9.415007591247559, "global_step": 471403, "epoch": 2805} {"train_loss": -10.644927978515625, "global_step": 471404, "epoch": 2805} {"train_loss": -10.1514892578125, "global_step": 471405, "epoch": 2805} {"train_loss": -9.667850494384766, "global_step": 471406, "epoch": 2805} {"train_loss": -11.985764424006144, "global_step": 471407, "epoch": 2805, "val_loss": 313956.59375, "train_action_mse_error": 1.84517502784729} {"train_loss": -10.510316848754883, "global_step": 471408, "epoch": 2806} {"train_loss": -11.125007629394531, "global_step": 471409, "epoch": 2806} {"train_loss": -9.557419776916504, "global_step": 471410, "epoch": 2806} {"train_loss": -9.777815818786621, "global_step": 471411, "epoch": 2806} {"train_loss": -9.228540420532227, "global_step": 471412, "epoch": 2806} {"train_loss": -10.523883819580078, "global_step": 471413, "epoch": 2806} {"train_loss": -10.090200424194336, "global_step": 471414, "epoch": 2806} {"train_loss": -10.582172393798828, "global_step": 471415, "epoch": 2806} {"train_loss": -11.376614570617676, "global_step": 471416, "epoch": 2806} {"train_loss": -11.487831115722656, "global_step": 471417, "epoch": 2806} {"train_loss": -11.280765533447266, "global_step": 471418, "epoch": 2806} {"train_loss": -11.451971054077148, "global_step": 471419, "epoch": 2806} {"train_loss": -11.724300384521484, "global_step": 471420, "epoch": 2806} {"train_loss": -11.653048515319824, "global_step": 471421, "epoch": 2806} {"train_loss": -11.665658950805664, "global_step": 471422, "epoch": 2806} {"train_loss": -11.827130317687988, "global_step": 471423, "epoch": 2806} {"train_loss": -12.108367919921875, "global_step": 471424, "epoch": 2806} {"train_loss": -11.787397384643555, "global_step": 471425, "epoch": 2806} {"train_loss": -12.097434997558594, "global_step": 471426, "epoch": 2806} {"train_loss": -12.038753509521484, "global_step": 471427, "epoch": 2806} {"train_loss": -12.020605087280273, "global_step": 471428, "epoch": 2806} {"train_loss": -11.724708557128906, "global_step": 471429, "epoch": 2806} {"train_loss": -12.138581275939941, "global_step": 471430, "epoch": 2806} {"train_loss": -12.204069137573242, "global_step": 471431, "epoch": 2806} {"train_loss": -12.510791778564453, "global_step": 471432, "epoch": 2806} {"train_loss": -11.650686264038086, "global_step": 471433, "epoch": 2806} {"train_loss": -12.427699089050293, "global_step": 471434, "epoch": 2806} {"train_loss": -12.15863037109375, "global_step": 471435, "epoch": 2806} {"train_loss": -12.037569046020508, "global_step": 471436, "epoch": 2806} {"train_loss": -12.322364807128906, "global_step": 471437, "epoch": 2806} {"train_loss": -12.145601272583008, "global_step": 471438, "epoch": 2806} {"train_loss": -12.105621337890625, "global_step": 471439, "epoch": 2806} {"train_loss": -12.01753044128418, "global_step": 471440, "epoch": 2806} {"train_loss": -12.130420684814453, "global_step": 471441, "epoch": 2806} {"train_loss": -12.165533065795898, "global_step": 471442, "epoch": 2806} {"train_loss": -12.266729354858398, "global_step": 471443, "epoch": 2806} {"train_loss": -12.458393096923828, "global_step": 471444, "epoch": 2806} {"train_loss": -12.356203079223633, "global_step": 471445, "epoch": 2806} {"train_loss": -12.360715866088867, "global_step": 471446, "epoch": 2806} {"train_loss": -12.291868209838867, "global_step": 471447, "epoch": 2806} {"train_loss": -11.903051376342773, "global_step": 471448, "epoch": 2806} {"train_loss": -12.471264839172363, "global_step": 471449, "epoch": 2806} {"train_loss": -12.614333152770996, "global_step": 471450, "epoch": 2806} {"train_loss": -12.5427827835083, "global_step": 471451, "epoch": 2806} {"train_loss": -12.083831787109375, "global_step": 471452, "epoch": 2806} {"train_loss": -11.953468322753906, "global_step": 471453, "epoch": 2806} {"train_loss": -12.54281997680664, "global_step": 471454, "epoch": 2806} {"train_loss": -12.2303466796875, "global_step": 471455, "epoch": 2806} {"train_loss": -12.56207275390625, "global_step": 471456, "epoch": 2806} {"train_loss": -12.121830940246582, "global_step": 471457, "epoch": 2806} {"train_loss": -12.652227401733398, "global_step": 471458, "epoch": 2806} {"train_loss": -12.525640487670898, "global_step": 471459, "epoch": 2806} {"train_loss": -12.512792587280273, "global_step": 471460, "epoch": 2806} {"train_loss": -12.470366477966309, "global_step": 471461, "epoch": 2806} {"train_loss": -12.535245895385742, "global_step": 471462, "epoch": 2806} {"train_loss": -12.440613746643066, "global_step": 471463, "epoch": 2806} {"train_loss": -12.545003890991211, "global_step": 471464, "epoch": 2806} {"train_loss": -12.414144515991211, "global_step": 471465, "epoch": 2806} {"train_loss": -12.795607566833496, "global_step": 471466, "epoch": 2806} {"train_loss": -12.533578872680664, "global_step": 471467, "epoch": 2806} {"train_loss": -12.7398099899292, "global_step": 471468, "epoch": 2806} {"train_loss": -12.579261779785156, "global_step": 471469, "epoch": 2806} {"train_loss": -12.722084045410156, "global_step": 471470, "epoch": 2806} {"train_loss": -12.648433685302734, "global_step": 471471, "epoch": 2806} {"train_loss": -12.616004943847656, "global_step": 471472, "epoch": 2806} {"train_loss": -12.632829666137695, "global_step": 471473, "epoch": 2806} {"train_loss": -12.586687088012695, "global_step": 471474, "epoch": 2806} {"train_loss": -12.733060836791992, "global_step": 471475, "epoch": 2806} {"train_loss": -12.759521484375, "global_step": 471476, "epoch": 2806} {"train_loss": -12.735912322998047, "global_step": 471477, "epoch": 2806} {"train_loss": -12.703234672546387, "global_step": 471478, "epoch": 2806} {"train_loss": -12.884333610534668, "global_step": 471479, "epoch": 2806} {"train_loss": -12.812784194946289, "global_step": 471480, "epoch": 2806} {"train_loss": -12.958345413208008, "global_step": 471481, "epoch": 2806} {"train_loss": -12.732011795043945, "global_step": 471482, "epoch": 2806} {"train_loss": -12.945999145507812, "global_step": 471483, "epoch": 2806} {"train_loss": -12.807596206665039, "global_step": 471484, "epoch": 2806} {"train_loss": -12.695316314697266, "global_step": 471485, "epoch": 2806} {"train_loss": -12.595861434936523, "global_step": 471486, "epoch": 2806} {"train_loss": -12.756579399108887, "global_step": 471487, "epoch": 2806} {"train_loss": -12.719032287597656, "global_step": 471488, "epoch": 2806} {"train_loss": -12.916336059570312, "global_step": 471489, "epoch": 2806} {"train_loss": -12.832186698913574, "global_step": 471490, "epoch": 2806} {"train_loss": -12.874231338500977, "global_step": 471491, "epoch": 2806} {"train_loss": -12.682016372680664, "global_step": 471492, "epoch": 2806} {"train_loss": -13.008480072021484, "global_step": 471493, "epoch": 2806} {"train_loss": -12.657459259033203, "global_step": 471494, "epoch": 2806} {"train_loss": -12.814325332641602, "global_step": 471495, "epoch": 2806} {"train_loss": -12.82037353515625, "global_step": 471496, "epoch": 2806} {"train_loss": -12.827421188354492, "global_step": 471497, "epoch": 2806} {"train_loss": -12.736513137817383, "global_step": 471498, "epoch": 2806} {"train_loss": -12.862028121948242, "global_step": 471499, "epoch": 2806} {"train_loss": -12.944801330566406, "global_step": 471500, "epoch": 2806} {"train_loss": -12.690719604492188, "global_step": 471501, "epoch": 2806} {"train_loss": -12.37562084197998, "global_step": 471502, "epoch": 2806} {"train_loss": -12.768773078918457, "global_step": 471503, "epoch": 2806} {"train_loss": -12.818681716918945, "global_step": 471504, "epoch": 2806} {"train_loss": -12.820450782775879, "global_step": 471505, "epoch": 2806} {"train_loss": -12.852104187011719, "global_step": 471506, "epoch": 2806} {"train_loss": -12.762415885925293, "global_step": 471507, "epoch": 2806} {"train_loss": -12.694723129272461, "global_step": 471508, "epoch": 2806} {"train_loss": -12.386330604553223, "global_step": 471509, "epoch": 2806} {"train_loss": -12.49387264251709, "global_step": 471510, "epoch": 2806} {"train_loss": -12.273408889770508, "global_step": 471511, "epoch": 2806} {"train_loss": -12.375492095947266, "global_step": 471512, "epoch": 2806} {"train_loss": -10.998053550720215, "global_step": 471513, "epoch": 2806} {"train_loss": -12.640928268432617, "global_step": 471514, "epoch": 2806} {"train_loss": -12.13890266418457, "global_step": 471515, "epoch": 2806} {"train_loss": -11.850561141967773, "global_step": 471516, "epoch": 2806} {"train_loss": -12.145975112915039, "global_step": 471517, "epoch": 2806} {"train_loss": -12.224305152893066, "global_step": 471518, "epoch": 2806} {"train_loss": -11.344544410705566, "global_step": 471519, "epoch": 2806} {"train_loss": -12.785717010498047, "global_step": 471520, "epoch": 2806} {"train_loss": -12.56379508972168, "global_step": 471521, "epoch": 2806} {"train_loss": -12.610618591308594, "global_step": 471522, "epoch": 2806} {"train_loss": -12.335566520690918, "global_step": 471523, "epoch": 2806} {"train_loss": -12.247836112976074, "global_step": 471524, "epoch": 2806} {"train_loss": -12.300024032592773, "global_step": 471525, "epoch": 2806} {"train_loss": -12.409860610961914, "global_step": 471526, "epoch": 2806} {"train_loss": -11.625227928161621, "global_step": 471527, "epoch": 2806} {"train_loss": -12.307306289672852, "global_step": 471528, "epoch": 2806} {"train_loss": -11.483396530151367, "global_step": 471529, "epoch": 2806} {"train_loss": -12.470802307128906, "global_step": 471530, "epoch": 2806} {"train_loss": -11.985644340515137, "global_step": 471531, "epoch": 2806} {"train_loss": -11.546348571777344, "global_step": 471532, "epoch": 2806} {"train_loss": -12.123039245605469, "global_step": 471533, "epoch": 2806} {"train_loss": -11.504288673400879, "global_step": 471534, "epoch": 2806} {"train_loss": -12.194835662841797, "global_step": 471535, "epoch": 2806} {"train_loss": -11.503047943115234, "global_step": 471536, "epoch": 2806} {"train_loss": -11.385584831237793, "global_step": 471537, "epoch": 2806} {"train_loss": -11.038091659545898, "global_step": 471538, "epoch": 2806} {"train_loss": -11.852424621582031, "global_step": 471539, "epoch": 2806} {"train_loss": -11.894596099853516, "global_step": 471540, "epoch": 2806} {"train_loss": -9.96693229675293, "global_step": 471541, "epoch": 2806} {"train_loss": -12.277172088623047, "global_step": 471542, "epoch": 2806} {"train_loss": -11.332756042480469, "global_step": 471543, "epoch": 2806} {"train_loss": -11.503019332885742, "global_step": 471544, "epoch": 2806} {"train_loss": -10.881868362426758, "global_step": 471545, "epoch": 2806} {"train_loss": -11.471312522888184, "global_step": 471546, "epoch": 2806} {"train_loss": -11.353864669799805, "global_step": 471547, "epoch": 2806} {"train_loss": -11.45140266418457, "global_step": 471548, "epoch": 2806} {"train_loss": -10.49509048461914, "global_step": 471549, "epoch": 2806} {"train_loss": -11.579967498779297, "global_step": 471550, "epoch": 2806} {"train_loss": -10.332230567932129, "global_step": 471551, "epoch": 2806} {"train_loss": -10.872831344604492, "global_step": 471552, "epoch": 2806} {"train_loss": -11.282364845275879, "global_step": 471553, "epoch": 2806} {"train_loss": -9.702963829040527, "global_step": 471554, "epoch": 2806} {"train_loss": -12.084487915039062, "global_step": 471555, "epoch": 2806} {"train_loss": -10.051356315612793, "global_step": 471556, "epoch": 2806} {"train_loss": -10.782514572143555, "global_step": 471557, "epoch": 2806} {"train_loss": -11.47337532043457, "global_step": 471558, "epoch": 2806} {"train_loss": -10.036945343017578, "global_step": 471559, "epoch": 2806} {"train_loss": -10.967150688171387, "global_step": 471560, "epoch": 2806} {"train_loss": -10.336688995361328, "global_step": 471561, "epoch": 2806} {"train_loss": -9.72557258605957, "global_step": 471562, "epoch": 2806} {"train_loss": -11.203116416931152, "global_step": 471563, "epoch": 2806} {"train_loss": -9.824605941772461, "global_step": 471564, "epoch": 2806} {"train_loss": -10.314303398132324, "global_step": 471565, "epoch": 2806} {"train_loss": -10.985498428344727, "global_step": 471566, "epoch": 2806} {"train_loss": -11.318916320800781, "global_step": 471567, "epoch": 2806} {"train_loss": -10.939393043518066, "global_step": 471568, "epoch": 2806} {"train_loss": -10.184221267700195, "global_step": 471569, "epoch": 2806} {"train_loss": -11.503089904785156, "global_step": 471570, "epoch": 2806} {"train_loss": -10.869909286499023, "global_step": 471571, "epoch": 2806} {"train_loss": -10.738161087036133, "global_step": 471572, "epoch": 2806} {"train_loss": -10.947339057922363, "global_step": 471573, "epoch": 2806} {"train_loss": -10.500226974487305, "global_step": 471574, "epoch": 2806} {"train_loss": -11.91641236486889, "global_step": 471575, "epoch": 2806, "val_loss": 315651.59375} {"train_loss": -10.508550643920898, "global_step": 471576, "epoch": 2807} {"train_loss": -10.667818069458008, "global_step": 471577, "epoch": 2807} {"train_loss": -10.163026809692383, "global_step": 471578, "epoch": 2807} {"train_loss": -11.594524383544922, "global_step": 471579, "epoch": 2807} {"train_loss": -9.420373916625977, "global_step": 471580, "epoch": 2807} {"train_loss": -11.315216064453125, "global_step": 471581, "epoch": 2807} {"train_loss": -10.437058448791504, "global_step": 471582, "epoch": 2807} {"train_loss": -10.582117080688477, "global_step": 471583, "epoch": 2807} {"train_loss": -11.3731689453125, "global_step": 471584, "epoch": 2807} {"train_loss": -11.108949661254883, "global_step": 471585, "epoch": 2807} {"train_loss": -11.23008918762207, "global_step": 471586, "epoch": 2807} {"train_loss": -12.012338638305664, "global_step": 471587, "epoch": 2807} {"train_loss": -11.249515533447266, "global_step": 471588, "epoch": 2807} {"train_loss": -12.005699157714844, "global_step": 471589, "epoch": 2807} {"train_loss": -11.720762252807617, "global_step": 471590, "epoch": 2807} {"train_loss": -11.344524383544922, "global_step": 471591, "epoch": 2807} {"train_loss": -12.211446762084961, "global_step": 471592, "epoch": 2807} {"train_loss": -11.696507453918457, "global_step": 471593, "epoch": 2807} {"train_loss": -11.807872772216797, "global_step": 471594, "epoch": 2807} {"train_loss": -11.981367111206055, "global_step": 471595, "epoch": 2807} {"train_loss": -11.980596542358398, "global_step": 471596, "epoch": 2807} {"train_loss": -12.18336296081543, "global_step": 471597, "epoch": 2807} {"train_loss": -12.005001068115234, "global_step": 471598, "epoch": 2807} {"train_loss": -12.224578857421875, "global_step": 471599, "epoch": 2807} {"train_loss": -12.065790176391602, "global_step": 471600, "epoch": 2807} {"train_loss": -12.454395294189453, "global_step": 471601, "epoch": 2807} {"train_loss": -12.14101791381836, "global_step": 471602, "epoch": 2807} {"train_loss": -12.40213394165039, "global_step": 471603, "epoch": 2807} {"train_loss": -12.013547897338867, "global_step": 471604, "epoch": 2807} {"train_loss": -12.3095064163208, "global_step": 471605, "epoch": 2807} {"train_loss": -11.883760452270508, "global_step": 471606, "epoch": 2807} {"train_loss": -12.342174530029297, "global_step": 471607, "epoch": 2807} {"train_loss": -12.481555938720703, "global_step": 471608, "epoch": 2807} {"train_loss": -12.249948501586914, "global_step": 471609, "epoch": 2807} {"train_loss": -12.235021591186523, "global_step": 471610, "epoch": 2807} {"train_loss": -12.348548889160156, "global_step": 471611, "epoch": 2807} {"train_loss": -12.062288284301758, "global_step": 471612, "epoch": 2807} {"train_loss": -12.382402420043945, "global_step": 471613, "epoch": 2807} {"train_loss": -12.201374053955078, "global_step": 471614, "epoch": 2807} {"train_loss": -12.577661514282227, "global_step": 471615, "epoch": 2807} {"train_loss": -12.38543701171875, "global_step": 471616, "epoch": 2807} {"train_loss": -12.33792495727539, "global_step": 471617, "epoch": 2807} {"train_loss": -12.294844627380371, "global_step": 471618, "epoch": 2807} {"train_loss": -12.44886589050293, "global_step": 471619, "epoch": 2807} {"train_loss": -12.373298645019531, "global_step": 471620, "epoch": 2807} {"train_loss": -12.305395126342773, "global_step": 471621, "epoch": 2807} {"train_loss": -12.083863258361816, "global_step": 471622, "epoch": 2807} {"train_loss": -12.418691635131836, "global_step": 471623, "epoch": 2807} {"train_loss": -11.986515045166016, "global_step": 471624, "epoch": 2807} {"train_loss": -12.414360046386719, "global_step": 471625, "epoch": 2807} {"train_loss": -12.433490753173828, "global_step": 471626, "epoch": 2807} {"train_loss": -12.273238182067871, "global_step": 471627, "epoch": 2807} {"train_loss": -12.374689102172852, "global_step": 471628, "epoch": 2807} {"train_loss": -12.40871810913086, "global_step": 471629, "epoch": 2807} {"train_loss": -12.475035667419434, "global_step": 471630, "epoch": 2807} {"train_loss": -12.644393920898438, "global_step": 471631, "epoch": 2807} {"train_loss": -12.41826057434082, "global_step": 471632, "epoch": 2807} {"train_loss": -12.684473037719727, "global_step": 471633, "epoch": 2807} {"train_loss": -12.369222640991211, "global_step": 471634, "epoch": 2807} {"train_loss": -12.658567428588867, "global_step": 471635, "epoch": 2807} {"train_loss": -12.706602096557617, "global_step": 471636, "epoch": 2807} {"train_loss": -12.38355541229248, "global_step": 471637, "epoch": 2807} {"train_loss": -12.621938705444336, "global_step": 471638, "epoch": 2807} {"train_loss": -12.371028900146484, "global_step": 471639, "epoch": 2807} {"train_loss": -12.424461364746094, "global_step": 471640, "epoch": 2807} {"train_loss": -12.683382034301758, "global_step": 471641, "epoch": 2807} {"train_loss": -12.5377197265625, "global_step": 471642, "epoch": 2807} {"train_loss": -12.544027328491211, "global_step": 471643, "epoch": 2807} {"train_loss": -12.673195838928223, "global_step": 471644, "epoch": 2807} {"train_loss": -12.70798110961914, "global_step": 471645, "epoch": 2807} {"train_loss": -12.737375259399414, "global_step": 471646, "epoch": 2807} {"train_loss": -12.608146667480469, "global_step": 471647, "epoch": 2807} {"train_loss": -12.945992469787598, "global_step": 471648, "epoch": 2807} {"train_loss": -12.650847434997559, "global_step": 471649, "epoch": 2807} {"train_loss": -12.798039436340332, "global_step": 471650, "epoch": 2807} {"train_loss": -12.911148071289062, "global_step": 471651, "epoch": 2807} {"train_loss": -12.545921325683594, "global_step": 471652, "epoch": 2807} {"train_loss": -12.73232650756836, "global_step": 471653, "epoch": 2807} {"train_loss": -12.863139152526855, "global_step": 471654, "epoch": 2807} {"train_loss": -12.707996368408203, "global_step": 471655, "epoch": 2807} {"train_loss": -12.779825210571289, "global_step": 471656, "epoch": 2807} {"train_loss": -12.7059326171875, "global_step": 471657, "epoch": 2807} {"train_loss": -12.740620613098145, "global_step": 471658, "epoch": 2807} {"train_loss": -12.888099670410156, "global_step": 471659, "epoch": 2807} {"train_loss": -12.78148365020752, "global_step": 471660, "epoch": 2807} {"train_loss": -12.886941909790039, "global_step": 471661, "epoch": 2807} {"train_loss": -12.856212615966797, "global_step": 471662, "epoch": 2807} {"train_loss": -12.58239459991455, "global_step": 471663, "epoch": 2807} {"train_loss": -12.736906051635742, "global_step": 471664, "epoch": 2807} {"train_loss": -12.832667350769043, "global_step": 471665, "epoch": 2807} {"train_loss": -12.622532844543457, "global_step": 471666, "epoch": 2807} {"train_loss": -12.847633361816406, "global_step": 471667, "epoch": 2807} {"train_loss": -12.653083801269531, "global_step": 471668, "epoch": 2807} {"train_loss": -12.857328414916992, "global_step": 471669, "epoch": 2807} {"train_loss": -12.878625869750977, "global_step": 471670, "epoch": 2807} {"train_loss": -12.704553604125977, "global_step": 471671, "epoch": 2807} {"train_loss": -12.817781448364258, "global_step": 471672, "epoch": 2807} {"train_loss": -12.881635665893555, "global_step": 471673, "epoch": 2807} {"train_loss": -13.024869918823242, "global_step": 471674, "epoch": 2807} {"train_loss": -12.906091690063477, "global_step": 471675, "epoch": 2807} {"train_loss": -12.998775482177734, "global_step": 471676, "epoch": 2807} {"train_loss": -13.096627235412598, "global_step": 471677, "epoch": 2807} {"train_loss": -13.060298919677734, "global_step": 471678, "epoch": 2807} {"train_loss": -12.87525749206543, "global_step": 471679, "epoch": 2807} {"train_loss": -12.756271362304688, "global_step": 471680, "epoch": 2807} {"train_loss": -12.897555351257324, "global_step": 471681, "epoch": 2807} {"train_loss": -12.910575866699219, "global_step": 471682, "epoch": 2807} {"train_loss": -12.851455688476562, "global_step": 471683, "epoch": 2807} {"train_loss": -12.94528579711914, "global_step": 471684, "epoch": 2807} {"train_loss": -12.850234985351562, "global_step": 471685, "epoch": 2807} {"train_loss": -12.877185821533203, "global_step": 471686, "epoch": 2807} {"train_loss": -13.115558624267578, "global_step": 471687, "epoch": 2807} {"train_loss": -13.027698516845703, "global_step": 471688, "epoch": 2807} {"train_loss": -12.705723762512207, "global_step": 471689, "epoch": 2807} {"train_loss": -12.980291366577148, "global_step": 471690, "epoch": 2807} {"train_loss": -13.078851699829102, "global_step": 471691, "epoch": 2807} {"train_loss": -12.818748474121094, "global_step": 471692, "epoch": 2807} {"train_loss": -13.019784927368164, "global_step": 471693, "epoch": 2807} {"train_loss": -12.542250633239746, "global_step": 471694, "epoch": 2807} {"train_loss": -13.00069808959961, "global_step": 471695, "epoch": 2807} {"train_loss": -12.69216537475586, "global_step": 471696, "epoch": 2807} {"train_loss": -13.002620697021484, "global_step": 471697, "epoch": 2807} {"train_loss": -13.018739700317383, "global_step": 471698, "epoch": 2807} {"train_loss": -13.217170715332031, "global_step": 471699, "epoch": 2807} {"train_loss": -12.992928504943848, "global_step": 471700, "epoch": 2807} {"train_loss": -13.023725509643555, "global_step": 471701, "epoch": 2807} {"train_loss": -12.957212448120117, "global_step": 471702, "epoch": 2807} {"train_loss": -12.800884246826172, "global_step": 471703, "epoch": 2807} {"train_loss": -13.317663192749023, "global_step": 471704, "epoch": 2807} {"train_loss": -12.983354568481445, "global_step": 471705, "epoch": 2807} {"train_loss": -12.817503929138184, "global_step": 471706, "epoch": 2807} {"train_loss": -12.611927032470703, "global_step": 471707, "epoch": 2807} {"train_loss": -12.43527603149414, "global_step": 471708, "epoch": 2807} {"train_loss": -12.75857162475586, "global_step": 471709, "epoch": 2807} {"train_loss": -12.649044036865234, "global_step": 471710, "epoch": 2807} {"train_loss": -12.225226402282715, "global_step": 471711, "epoch": 2807} {"train_loss": -12.597012519836426, "global_step": 471712, "epoch": 2807} {"train_loss": -12.187183380126953, "global_step": 471713, "epoch": 2807} {"train_loss": -12.274551391601562, "global_step": 471714, "epoch": 2807} {"train_loss": -12.665042877197266, "global_step": 471715, "epoch": 2807} {"train_loss": -12.691900253295898, "global_step": 471716, "epoch": 2807} {"train_loss": -12.711307525634766, "global_step": 471717, "epoch": 2807} {"train_loss": -12.7327299118042, "global_step": 471718, "epoch": 2807} {"train_loss": -12.833992004394531, "global_step": 471719, "epoch": 2807} {"train_loss": -13.055498123168945, "global_step": 471720, "epoch": 2807} {"train_loss": -12.702436447143555, "global_step": 471721, "epoch": 2807} {"train_loss": -12.6196928024292, "global_step": 471722, "epoch": 2807} {"train_loss": -12.617171287536621, "global_step": 471723, "epoch": 2807} {"train_loss": -12.46474552154541, "global_step": 471724, "epoch": 2807} {"train_loss": -12.864992141723633, "global_step": 471725, "epoch": 2807} {"train_loss": -12.601239204406738, "global_step": 471726, "epoch": 2807} {"train_loss": -11.861002922058105, "global_step": 471727, "epoch": 2807} {"train_loss": -10.693038940429688, "global_step": 471728, "epoch": 2807} {"train_loss": -12.013853073120117, "global_step": 471729, "epoch": 2807} {"train_loss": -12.287193298339844, "global_step": 471730, "epoch": 2807} {"train_loss": -11.118843078613281, "global_step": 471731, "epoch": 2807} {"train_loss": -11.154254913330078, "global_step": 471732, "epoch": 2807} {"train_loss": -11.266569137573242, "global_step": 471733, "epoch": 2807} {"train_loss": -10.841304779052734, "global_step": 471734, "epoch": 2807} {"train_loss": -11.14672565460205, "global_step": 471735, "epoch": 2807} {"train_loss": -11.579166412353516, "global_step": 471736, "epoch": 2807} {"train_loss": -11.742830276489258, "global_step": 471737, "epoch": 2807} {"train_loss": -11.393754959106445, "global_step": 471738, "epoch": 2807} {"train_loss": -11.757936477661133, "global_step": 471739, "epoch": 2807} {"train_loss": -10.589252471923828, "global_step": 471740, "epoch": 2807} {"train_loss": -10.742100715637207, "global_step": 471741, "epoch": 2807} {"train_loss": -11.496795654296875, "global_step": 471742, "epoch": 2807} {"train_loss": -12.33461738768078, "global_step": 471743, "epoch": 2807, "val_loss": 313744.34375} {"train_loss": -11.115804672241211, "global_step": 471744, "epoch": 2808} {"train_loss": -11.522369384765625, "global_step": 471745, "epoch": 2808} {"train_loss": -11.85128116607666, "global_step": 471746, "epoch": 2808} {"train_loss": -11.562555313110352, "global_step": 471747, "epoch": 2808} {"train_loss": -11.28359317779541, "global_step": 471748, "epoch": 2808} {"train_loss": -11.383819580078125, "global_step": 471749, "epoch": 2808} {"train_loss": -11.990607261657715, "global_step": 471750, "epoch": 2808} {"train_loss": -11.385775566101074, "global_step": 471751, "epoch": 2808} {"train_loss": -9.99151611328125, "global_step": 471752, "epoch": 2808} {"train_loss": -11.543825149536133, "global_step": 471753, "epoch": 2808} {"train_loss": -11.23324203491211, "global_step": 471754, "epoch": 2808} {"train_loss": -11.75128173828125, "global_step": 471755, "epoch": 2808} {"train_loss": -11.587543487548828, "global_step": 471756, "epoch": 2808} {"train_loss": -11.28283405303955, "global_step": 471757, "epoch": 2808} {"train_loss": -11.846413612365723, "global_step": 471758, "epoch": 2808} {"train_loss": -11.86124324798584, "global_step": 471759, "epoch": 2808} {"train_loss": -12.092742919921875, "global_step": 471760, "epoch": 2808} {"train_loss": -11.636992454528809, "global_step": 471761, "epoch": 2808} {"train_loss": -11.726253509521484, "global_step": 471762, "epoch": 2808} {"train_loss": -11.586179733276367, "global_step": 471763, "epoch": 2808} {"train_loss": -11.69362735748291, "global_step": 471764, "epoch": 2808} {"train_loss": -11.136024475097656, "global_step": 471765, "epoch": 2808} {"train_loss": -10.553688049316406, "global_step": 471766, "epoch": 2808} {"train_loss": -10.822540283203125, "global_step": 471767, "epoch": 2808} {"train_loss": -9.817949295043945, "global_step": 471768, "epoch": 2808} {"train_loss": -9.370809555053711, "global_step": 471769, "epoch": 2808} {"train_loss": -9.872690200805664, "global_step": 471770, "epoch": 2808} {"train_loss": -9.66748046875, "global_step": 471771, "epoch": 2808} {"train_loss": -10.700727462768555, "global_step": 471772, "epoch": 2808} {"train_loss": -10.208673477172852, "global_step": 471773, "epoch": 2808} {"train_loss": -10.241130828857422, "global_step": 471774, "epoch": 2808} {"train_loss": -10.044702529907227, "global_step": 471775, "epoch": 2808} {"train_loss": -10.118348121643066, "global_step": 471776, "epoch": 2808} {"train_loss": -11.291587829589844, "global_step": 471777, "epoch": 2808} {"train_loss": -11.479537963867188, "global_step": 471778, "epoch": 2808} {"train_loss": -11.29172420501709, "global_step": 471779, "epoch": 2808} {"train_loss": -11.773799896240234, "global_step": 471780, "epoch": 2808} {"train_loss": -11.097951889038086, "global_step": 471781, "epoch": 2808} {"train_loss": -11.907452583312988, "global_step": 471782, "epoch": 2808} {"train_loss": -11.466079711914062, "global_step": 471783, "epoch": 2808} {"train_loss": -11.900609970092773, "global_step": 471784, "epoch": 2808} {"train_loss": -11.766735076904297, "global_step": 471785, "epoch": 2808} {"train_loss": -11.888922691345215, "global_step": 471786, "epoch": 2808} {"train_loss": -11.340551376342773, "global_step": 471787, "epoch": 2808} {"train_loss": -11.612884521484375, "global_step": 471788, "epoch": 2808} {"train_loss": -12.096540451049805, "global_step": 471789, "epoch": 2808} {"train_loss": -12.128547668457031, "global_step": 471790, "epoch": 2808} {"train_loss": -12.016948699951172, "global_step": 471791, "epoch": 2808} {"train_loss": -11.9986572265625, "global_step": 471792, "epoch": 2808} {"train_loss": -12.228694915771484, "global_step": 471793, "epoch": 2808} {"train_loss": -12.09154224395752, "global_step": 471794, "epoch": 2808} {"train_loss": -12.039166450500488, "global_step": 471795, "epoch": 2808} {"train_loss": -12.064151763916016, "global_step": 471796, "epoch": 2808} {"train_loss": -12.195911407470703, "global_step": 471797, "epoch": 2808} {"train_loss": -12.064152717590332, "global_step": 471798, "epoch": 2808} {"train_loss": -12.17325210571289, "global_step": 471799, "epoch": 2808} {"train_loss": -12.027643203735352, "global_step": 471800, "epoch": 2808} {"train_loss": -11.880449295043945, "global_step": 471801, "epoch": 2808} {"train_loss": -12.174394607543945, "global_step": 471802, "epoch": 2808} {"train_loss": -12.046243667602539, "global_step": 471803, "epoch": 2808} {"train_loss": -12.542703628540039, "global_step": 471804, "epoch": 2808} {"train_loss": -12.146976470947266, "global_step": 471805, "epoch": 2808} {"train_loss": -12.254638671875, "global_step": 471806, "epoch": 2808} {"train_loss": -12.24282169342041, "global_step": 471807, "epoch": 2808} {"train_loss": -11.954265594482422, "global_step": 471808, "epoch": 2808} {"train_loss": -12.390176773071289, "global_step": 471809, "epoch": 2808} {"train_loss": -12.308210372924805, "global_step": 471810, "epoch": 2808} {"train_loss": -12.075860023498535, "global_step": 471811, "epoch": 2808} {"train_loss": -12.499515533447266, "global_step": 471812, "epoch": 2808} {"train_loss": -12.326335906982422, "global_step": 471813, "epoch": 2808} {"train_loss": -12.464073181152344, "global_step": 471814, "epoch": 2808} {"train_loss": -12.52039909362793, "global_step": 471815, "epoch": 2808} {"train_loss": -12.508800506591797, "global_step": 471816, "epoch": 2808} {"train_loss": -12.460137367248535, "global_step": 471817, "epoch": 2808} {"train_loss": -12.54045295715332, "global_step": 471818, "epoch": 2808} {"train_loss": -12.30486011505127, "global_step": 471819, "epoch": 2808} {"train_loss": -12.224255561828613, "global_step": 471820, "epoch": 2808} {"train_loss": -12.557510375976562, "global_step": 471821, "epoch": 2808} {"train_loss": -12.305489540100098, "global_step": 471822, "epoch": 2808} {"train_loss": -12.93725872039795, "global_step": 471823, "epoch": 2808} {"train_loss": -12.519598007202148, "global_step": 471824, "epoch": 2808} {"train_loss": -12.537347793579102, "global_step": 471825, "epoch": 2808} {"train_loss": -12.661109924316406, "global_step": 471826, "epoch": 2808} {"train_loss": -12.384960174560547, "global_step": 471827, "epoch": 2808} {"train_loss": -12.587480545043945, "global_step": 471828, "epoch": 2808} {"train_loss": -12.542919158935547, "global_step": 471829, "epoch": 2808} {"train_loss": -12.833483695983887, "global_step": 471830, "epoch": 2808} {"train_loss": -12.566547393798828, "global_step": 471831, "epoch": 2808} {"train_loss": -12.649603843688965, "global_step": 471832, "epoch": 2808} {"train_loss": -12.642302513122559, "global_step": 471833, "epoch": 2808} {"train_loss": -12.607977867126465, "global_step": 471834, "epoch": 2808} {"train_loss": -13.004646301269531, "global_step": 471835, "epoch": 2808} {"train_loss": -12.745673179626465, "global_step": 471836, "epoch": 2808} {"train_loss": -12.706656455993652, "global_step": 471837, "epoch": 2808} {"train_loss": -12.957084655761719, "global_step": 471838, "epoch": 2808} {"train_loss": -12.617295265197754, "global_step": 471839, "epoch": 2808} {"train_loss": -12.711629867553711, "global_step": 471840, "epoch": 2808} {"train_loss": -12.60712718963623, "global_step": 471841, "epoch": 2808} {"train_loss": -12.67112922668457, "global_step": 471842, "epoch": 2808} {"train_loss": -12.934823036193848, "global_step": 471843, "epoch": 2808} {"train_loss": -12.43450927734375, "global_step": 471844, "epoch": 2808} {"train_loss": -12.563164710998535, "global_step": 471845, "epoch": 2808} {"train_loss": -12.71376895904541, "global_step": 471846, "epoch": 2808} {"train_loss": -12.740201950073242, "global_step": 471847, "epoch": 2808} {"train_loss": -12.823272705078125, "global_step": 471848, "epoch": 2808} {"train_loss": -12.70290756225586, "global_step": 471849, "epoch": 2808} {"train_loss": -12.834218978881836, "global_step": 471850, "epoch": 2808} {"train_loss": -12.867301940917969, "global_step": 471851, "epoch": 2808} {"train_loss": -12.581854820251465, "global_step": 471852, "epoch": 2808} {"train_loss": -12.76097583770752, "global_step": 471853, "epoch": 2808} {"train_loss": -12.516426086425781, "global_step": 471854, "epoch": 2808} {"train_loss": -12.737043380737305, "global_step": 471855, "epoch": 2808} {"train_loss": -12.89708137512207, "global_step": 471856, "epoch": 2808} {"train_loss": -12.869451522827148, "global_step": 471857, "epoch": 2808} {"train_loss": -12.368508338928223, "global_step": 471858, "epoch": 2808} {"train_loss": -12.366952896118164, "global_step": 471859, "epoch": 2808} {"train_loss": -12.662171363830566, "global_step": 471860, "epoch": 2808} {"train_loss": -12.514030456542969, "global_step": 471861, "epoch": 2808} {"train_loss": -12.557149887084961, "global_step": 471862, "epoch": 2808} {"train_loss": -12.289892196655273, "global_step": 471863, "epoch": 2808} {"train_loss": -12.670357704162598, "global_step": 471864, "epoch": 2808} {"train_loss": -12.5606689453125, "global_step": 471865, "epoch": 2808} {"train_loss": -12.692021369934082, "global_step": 471866, "epoch": 2808} {"train_loss": -12.67741584777832, "global_step": 471867, "epoch": 2808} {"train_loss": -13.008428573608398, "global_step": 471868, "epoch": 2808} {"train_loss": -12.744022369384766, "global_step": 471869, "epoch": 2808} {"train_loss": -12.595199584960938, "global_step": 471870, "epoch": 2808} {"train_loss": -12.488369941711426, "global_step": 471871, "epoch": 2808} {"train_loss": -12.940515518188477, "global_step": 471872, "epoch": 2808} {"train_loss": -12.144050598144531, "global_step": 471873, "epoch": 2808} {"train_loss": -12.248028755187988, "global_step": 471874, "epoch": 2808} {"train_loss": -12.666635513305664, "global_step": 471875, "epoch": 2808} {"train_loss": -12.304763793945312, "global_step": 471876, "epoch": 2808} {"train_loss": -10.356494903564453, "global_step": 471877, "epoch": 2808} {"train_loss": -12.337614059448242, "global_step": 471878, "epoch": 2808} {"train_loss": -12.601140975952148, "global_step": 471879, "epoch": 2808} {"train_loss": -11.585431098937988, "global_step": 471880, "epoch": 2808} {"train_loss": -11.164544105529785, "global_step": 471881, "epoch": 2808} {"train_loss": -12.787910461425781, "global_step": 471882, "epoch": 2808} {"train_loss": -11.9906644821167, "global_step": 471883, "epoch": 2808} {"train_loss": -11.16739559173584, "global_step": 471884, "epoch": 2808} {"train_loss": -11.602306365966797, "global_step": 471885, "epoch": 2808} {"train_loss": -12.48087215423584, "global_step": 471886, "epoch": 2808} {"train_loss": -11.18882942199707, "global_step": 471887, "epoch": 2808} {"train_loss": -11.148622512817383, "global_step": 471888, "epoch": 2808} {"train_loss": -12.723666191101074, "global_step": 471889, "epoch": 2808} {"train_loss": -10.052966117858887, "global_step": 471890, "epoch": 2808} {"train_loss": -11.747346878051758, "global_step": 471891, "epoch": 2808} {"train_loss": -12.185897827148438, "global_step": 471892, "epoch": 2808} {"train_loss": -11.264274597167969, "global_step": 471893, "epoch": 2808} {"train_loss": -12.09475326538086, "global_step": 471894, "epoch": 2808} {"train_loss": -12.028963088989258, "global_step": 471895, "epoch": 2808} {"train_loss": -11.793442726135254, "global_step": 471896, "epoch": 2808} {"train_loss": -12.467743873596191, "global_step": 471897, "epoch": 2808} {"train_loss": -12.614923477172852, "global_step": 471898, "epoch": 2808} {"train_loss": -12.013535499572754, "global_step": 471899, "epoch": 2808} {"train_loss": -12.562244415283203, "global_step": 471900, "epoch": 2808} {"train_loss": -12.537826538085938, "global_step": 471901, "epoch": 2808} {"train_loss": -11.98111629486084, "global_step": 471902, "epoch": 2808} {"train_loss": -12.683475494384766, "global_step": 471903, "epoch": 2808} {"train_loss": -11.954224586486816, "global_step": 471904, "epoch": 2808} {"train_loss": -12.546751022338867, "global_step": 471905, "epoch": 2808} {"train_loss": -12.115249633789062, "global_step": 471906, "epoch": 2808} {"train_loss": -12.100436210632324, "global_step": 471907, "epoch": 2808} {"train_loss": -12.112457275390625, "global_step": 471908, "epoch": 2808} {"train_loss": -12.075736045837402, "global_step": 471909, "epoch": 2808} {"train_loss": -11.591291427612305, "global_step": 471910, "epoch": 2808} {"train_loss": -12.023897165343875, "global_step": 471911, "epoch": 2808, "val_loss": 315834.09375} {"train_loss": -11.492971420288086, "global_step": 471912, "epoch": 2809} {"train_loss": -12.058571815490723, "global_step": 471913, "epoch": 2809} {"train_loss": -12.107085227966309, "global_step": 471914, "epoch": 2809} {"train_loss": -11.398365020751953, "global_step": 471915, "epoch": 2809} {"train_loss": -12.076693534851074, "global_step": 471916, "epoch": 2809} {"train_loss": -11.822890281677246, "global_step": 471917, "epoch": 2809} {"train_loss": -11.867657661437988, "global_step": 471918, "epoch": 2809} {"train_loss": -11.620588302612305, "global_step": 471919, "epoch": 2809} {"train_loss": -12.053901672363281, "global_step": 471920, "epoch": 2809} {"train_loss": -11.82962417602539, "global_step": 471921, "epoch": 2809} {"train_loss": -10.89177131652832, "global_step": 471922, "epoch": 2809} {"train_loss": -11.512018203735352, "global_step": 471923, "epoch": 2809} {"train_loss": -12.031526565551758, "global_step": 471924, "epoch": 2809} {"train_loss": -11.692688941955566, "global_step": 471925, "epoch": 2809} {"train_loss": -11.516622543334961, "global_step": 471926, "epoch": 2809} {"train_loss": -12.003437995910645, "global_step": 471927, "epoch": 2809} {"train_loss": -11.707263946533203, "global_step": 471928, "epoch": 2809} {"train_loss": -11.698912620544434, "global_step": 471929, "epoch": 2809} {"train_loss": -12.52467155456543, "global_step": 471930, "epoch": 2809} {"train_loss": -10.9175386428833, "global_step": 471931, "epoch": 2809} {"train_loss": -12.317792892456055, "global_step": 471932, "epoch": 2809} {"train_loss": -11.40913200378418, "global_step": 471933, "epoch": 2809} {"train_loss": -12.09347915649414, "global_step": 471934, "epoch": 2809} {"train_loss": -11.796215057373047, "global_step": 471935, "epoch": 2809} {"train_loss": -12.145798683166504, "global_step": 471936, "epoch": 2809} {"train_loss": -11.80994987487793, "global_step": 471937, "epoch": 2809} {"train_loss": -12.184008598327637, "global_step": 471938, "epoch": 2809} {"train_loss": -12.074625015258789, "global_step": 471939, "epoch": 2809} {"train_loss": -11.78585433959961, "global_step": 471940, "epoch": 2809} {"train_loss": -11.973976135253906, "global_step": 471941, "epoch": 2809} {"train_loss": -12.142723083496094, "global_step": 471942, "epoch": 2809} {"train_loss": -11.234153747558594, "global_step": 471943, "epoch": 2809} {"train_loss": -12.326107025146484, "global_step": 471944, "epoch": 2809} {"train_loss": -12.086808204650879, "global_step": 471945, "epoch": 2809} {"train_loss": -11.966402053833008, "global_step": 471946, "epoch": 2809} {"train_loss": -12.174379348754883, "global_step": 471947, "epoch": 2809} {"train_loss": -12.092304229736328, "global_step": 471948, "epoch": 2809} {"train_loss": -12.65270709991455, "global_step": 471949, "epoch": 2809} {"train_loss": -11.762542724609375, "global_step": 471950, "epoch": 2809} {"train_loss": -12.690945625305176, "global_step": 471951, "epoch": 2809} {"train_loss": -12.017935752868652, "global_step": 471952, "epoch": 2809} {"train_loss": -12.454806327819824, "global_step": 471953, "epoch": 2809} {"train_loss": -11.96220588684082, "global_step": 471954, "epoch": 2809} {"train_loss": -12.337051391601562, "global_step": 471955, "epoch": 2809} {"train_loss": -12.05313777923584, "global_step": 471956, "epoch": 2809} {"train_loss": -12.063861846923828, "global_step": 471957, "epoch": 2809} {"train_loss": -11.988054275512695, "global_step": 471958, "epoch": 2809} {"train_loss": -11.96058464050293, "global_step": 471959, "epoch": 2809} {"train_loss": -11.343428611755371, "global_step": 471960, "epoch": 2809} {"train_loss": -12.072541236877441, "global_step": 471961, "epoch": 2809} {"train_loss": -11.862418174743652, "global_step": 471962, "epoch": 2809} {"train_loss": -11.730610847473145, "global_step": 471963, "epoch": 2809} {"train_loss": -12.60886001586914, "global_step": 471964, "epoch": 2809} {"train_loss": -11.613073348999023, "global_step": 471965, "epoch": 2809} {"train_loss": -12.14584732055664, "global_step": 471966, "epoch": 2809} {"train_loss": -10.754352569580078, "global_step": 471967, "epoch": 2809} {"train_loss": -11.630221366882324, "global_step": 471968, "epoch": 2809} {"train_loss": -11.676002502441406, "global_step": 471969, "epoch": 2809} {"train_loss": -11.93539810180664, "global_step": 471970, "epoch": 2809} {"train_loss": -12.232912063598633, "global_step": 471971, "epoch": 2809} {"train_loss": -12.40107536315918, "global_step": 471972, "epoch": 2809} {"train_loss": -12.123306274414062, "global_step": 471973, "epoch": 2809} {"train_loss": -12.508878707885742, "global_step": 471974, "epoch": 2809} {"train_loss": -11.808598518371582, "global_step": 471975, "epoch": 2809} {"train_loss": -12.607816696166992, "global_step": 471976, "epoch": 2809} {"train_loss": -12.26696491241455, "global_step": 471977, "epoch": 2809} {"train_loss": -12.567964553833008, "global_step": 471978, "epoch": 2809} {"train_loss": -12.462897300720215, "global_step": 471979, "epoch": 2809} {"train_loss": -12.72610092163086, "global_step": 471980, "epoch": 2809} {"train_loss": -12.701742172241211, "global_step": 471981, "epoch": 2809} {"train_loss": -12.265477180480957, "global_step": 471982, "epoch": 2809} {"train_loss": -12.588075637817383, "global_step": 471983, "epoch": 2809} {"train_loss": -12.732189178466797, "global_step": 471984, "epoch": 2809} {"train_loss": -12.570510864257812, "global_step": 471985, "epoch": 2809} {"train_loss": -12.414566040039062, "global_step": 471986, "epoch": 2809} {"train_loss": -12.640106201171875, "global_step": 471987, "epoch": 2809} {"train_loss": -12.801750183105469, "global_step": 471988, "epoch": 2809} {"train_loss": -12.57786750793457, "global_step": 471989, "epoch": 2809} {"train_loss": -12.641572952270508, "global_step": 471990, "epoch": 2809} {"train_loss": -12.579500198364258, "global_step": 471991, "epoch": 2809} {"train_loss": -12.719379425048828, "global_step": 471992, "epoch": 2809} {"train_loss": -12.451364517211914, "global_step": 471993, "epoch": 2809} {"train_loss": -12.536087036132812, "global_step": 471994, "epoch": 2809} {"train_loss": -12.361852645874023, "global_step": 471995, "epoch": 2809} {"train_loss": -12.27993392944336, "global_step": 471996, "epoch": 2809} {"train_loss": -12.759506225585938, "global_step": 471997, "epoch": 2809} {"train_loss": -12.597156524658203, "global_step": 471998, "epoch": 2809} {"train_loss": -12.691795349121094, "global_step": 471999, "epoch": 2809} {"train_loss": -12.521261215209961, "global_step": 472000, "epoch": 2809} {"train_loss": -12.847512245178223, "global_step": 472001, "epoch": 2809} {"train_loss": -12.711523056030273, "global_step": 472002, "epoch": 2809} {"train_loss": -12.544291496276855, "global_step": 472003, "epoch": 2809} {"train_loss": -12.46107006072998, "global_step": 472004, "epoch": 2809} {"train_loss": -12.651968955993652, "global_step": 472005, "epoch": 2809} {"train_loss": -12.767855644226074, "global_step": 472006, "epoch": 2809} {"train_loss": -12.642751693725586, "global_step": 472007, "epoch": 2809} {"train_loss": -12.617406845092773, "global_step": 472008, "epoch": 2809} {"train_loss": -12.608817100524902, "global_step": 472009, "epoch": 2809} {"train_loss": -12.628700256347656, "global_step": 472010, "epoch": 2809} {"train_loss": -12.751670837402344, "global_step": 472011, "epoch": 2809} {"train_loss": -12.903387069702148, "global_step": 472012, "epoch": 2809} {"train_loss": -12.662208557128906, "global_step": 472013, "epoch": 2809} {"train_loss": -12.869839668273926, "global_step": 472014, "epoch": 2809} {"train_loss": -12.514986038208008, "global_step": 472015, "epoch": 2809} {"train_loss": -12.499114990234375, "global_step": 472016, "epoch": 2809} {"train_loss": -12.283681869506836, "global_step": 472017, "epoch": 2809} {"train_loss": -12.77020263671875, "global_step": 472018, "epoch": 2809} {"train_loss": -12.791804313659668, "global_step": 472019, "epoch": 2809} {"train_loss": -12.907316207885742, "global_step": 472020, "epoch": 2809} {"train_loss": -12.442453384399414, "global_step": 472021, "epoch": 2809} {"train_loss": -12.729604721069336, "global_step": 472022, "epoch": 2809} {"train_loss": -12.78325080871582, "global_step": 472023, "epoch": 2809} {"train_loss": -12.782052040100098, "global_step": 472024, "epoch": 2809} {"train_loss": -13.021615028381348, "global_step": 472025, "epoch": 2809} {"train_loss": -12.544486999511719, "global_step": 472026, "epoch": 2809} {"train_loss": -12.152593612670898, "global_step": 472027, "epoch": 2809} {"train_loss": -12.275627136230469, "global_step": 472028, "epoch": 2809} {"train_loss": -12.810686111450195, "global_step": 472029, "epoch": 2809} {"train_loss": -12.073810577392578, "global_step": 472030, "epoch": 2809} {"train_loss": -12.214680671691895, "global_step": 472031, "epoch": 2809} {"train_loss": -12.451251029968262, "global_step": 472032, "epoch": 2809} {"train_loss": -12.505029678344727, "global_step": 472033, "epoch": 2809} {"train_loss": -11.804166793823242, "global_step": 472034, "epoch": 2809} {"train_loss": -11.970926284790039, "global_step": 472035, "epoch": 2809} {"train_loss": -12.011045455932617, "global_step": 472036, "epoch": 2809} {"train_loss": -10.391801834106445, "global_step": 472037, "epoch": 2809} {"train_loss": -11.253684043884277, "global_step": 472038, "epoch": 2809} {"train_loss": -11.618854522705078, "global_step": 472039, "epoch": 2809} {"train_loss": -11.50167179107666, "global_step": 472040, "epoch": 2809} {"train_loss": -10.00072956085205, "global_step": 472041, "epoch": 2809} {"train_loss": -12.009624481201172, "global_step": 472042, "epoch": 2809} {"train_loss": -12.434135437011719, "global_step": 472043, "epoch": 2809} {"train_loss": -11.201685905456543, "global_step": 472044, "epoch": 2809} {"train_loss": -12.146909713745117, "global_step": 472045, "epoch": 2809} {"train_loss": -12.38534164428711, "global_step": 472046, "epoch": 2809} {"train_loss": -10.623437881469727, "global_step": 472047, "epoch": 2809} {"train_loss": -11.286094665527344, "global_step": 472048, "epoch": 2809} {"train_loss": -11.39006233215332, "global_step": 472049, "epoch": 2809} {"train_loss": -9.195982933044434, "global_step": 472050, "epoch": 2809} {"train_loss": -9.464693069458008, "global_step": 472051, "epoch": 2809} {"train_loss": -11.046377182006836, "global_step": 472052, "epoch": 2809} {"train_loss": -10.966630935668945, "global_step": 472053, "epoch": 2809} {"train_loss": -9.48460865020752, "global_step": 472054, "epoch": 2809} {"train_loss": -10.815488815307617, "global_step": 472055, "epoch": 2809} {"train_loss": -11.01546573638916, "global_step": 472056, "epoch": 2809} {"train_loss": -11.73519515991211, "global_step": 472057, "epoch": 2809} {"train_loss": -11.459335327148438, "global_step": 472058, "epoch": 2809} {"train_loss": -11.619718551635742, "global_step": 472059, "epoch": 2809} {"train_loss": -12.081439018249512, "global_step": 472060, "epoch": 2809} {"train_loss": -11.066904067993164, "global_step": 472061, "epoch": 2809} {"train_loss": -10.685246467590332, "global_step": 472062, "epoch": 2809} {"train_loss": -10.728530883789062, "global_step": 472063, "epoch": 2809} {"train_loss": -9.946102142333984, "global_step": 472064, "epoch": 2809} {"train_loss": -10.561834335327148, "global_step": 472065, "epoch": 2809} {"train_loss": -11.756523132324219, "global_step": 472066, "epoch": 2809} {"train_loss": -11.097532272338867, "global_step": 472067, "epoch": 2809} {"train_loss": -12.098688125610352, "global_step": 472068, "epoch": 2809} {"train_loss": -11.149243354797363, "global_step": 472069, "epoch": 2809} {"train_loss": -11.63361930847168, "global_step": 472070, "epoch": 2809} {"train_loss": -11.664041519165039, "global_step": 472071, "epoch": 2809} {"train_loss": -11.448233604431152, "global_step": 472072, "epoch": 2809} {"train_loss": -11.923896789550781, "global_step": 472073, "epoch": 2809} {"train_loss": -11.078506469726562, "global_step": 472074, "epoch": 2809} {"train_loss": -12.308114051818848, "global_step": 472075, "epoch": 2809} {"train_loss": -11.26032829284668, "global_step": 472076, "epoch": 2809} {"train_loss": -11.5643310546875, "global_step": 472077, "epoch": 2809} {"train_loss": -11.595769882202148, "global_step": 472078, "epoch": 2809} {"train_loss": -11.970733767464047, "global_step": 472079, "epoch": 2809, "val_loss": 306361.03125} {"train_loss": -10.834507942199707, "global_step": 472080, "epoch": 2810} {"train_loss": -11.119255065917969, "global_step": 472081, "epoch": 2810} {"train_loss": -11.432182312011719, "global_step": 472082, "epoch": 2810} {"train_loss": -11.038362503051758, "global_step": 472083, "epoch": 2810} {"train_loss": -11.80340576171875, "global_step": 472084, "epoch": 2810} {"train_loss": -11.503196716308594, "global_step": 472085, "epoch": 2810} {"train_loss": -11.922189712524414, "global_step": 472086, "epoch": 2810} {"train_loss": -11.349908828735352, "global_step": 472087, "epoch": 2810} {"train_loss": -12.028653144836426, "global_step": 472088, "epoch": 2810} {"train_loss": -11.735233306884766, "global_step": 472089, "epoch": 2810} {"train_loss": -11.973928451538086, "global_step": 472090, "epoch": 2810} {"train_loss": -11.913846969604492, "global_step": 472091, "epoch": 2810} {"train_loss": -12.014625549316406, "global_step": 472092, "epoch": 2810} {"train_loss": -12.104290008544922, "global_step": 472093, "epoch": 2810} {"train_loss": -11.566583633422852, "global_step": 472094, "epoch": 2810} {"train_loss": -11.577162742614746, "global_step": 472095, "epoch": 2810} {"train_loss": -11.62867546081543, "global_step": 472096, "epoch": 2810} {"train_loss": -11.775649070739746, "global_step": 472097, "epoch": 2810} {"train_loss": -11.717920303344727, "global_step": 472098, "epoch": 2810} {"train_loss": -11.63318920135498, "global_step": 472099, "epoch": 2810} {"train_loss": -11.257397651672363, "global_step": 472100, "epoch": 2810} {"train_loss": -11.296814918518066, "global_step": 472101, "epoch": 2810} {"train_loss": -11.347177505493164, "global_step": 472102, "epoch": 2810} {"train_loss": -11.088491439819336, "global_step": 472103, "epoch": 2810} {"train_loss": -10.92306137084961, "global_step": 472104, "epoch": 2810} {"train_loss": -11.610251426696777, "global_step": 472105, "epoch": 2810} {"train_loss": -10.60418701171875, "global_step": 472106, "epoch": 2810} {"train_loss": -12.188879013061523, "global_step": 472107, "epoch": 2810} {"train_loss": -11.754608154296875, "global_step": 472108, "epoch": 2810} {"train_loss": -12.2064790725708, "global_step": 472109, "epoch": 2810} {"train_loss": -11.826969146728516, "global_step": 472110, "epoch": 2810} {"train_loss": -11.922069549560547, "global_step": 472111, "epoch": 2810} {"train_loss": -11.896732330322266, "global_step": 472112, "epoch": 2810} {"train_loss": -12.198062896728516, "global_step": 472113, "epoch": 2810} {"train_loss": -12.035845756530762, "global_step": 472114, "epoch": 2810} {"train_loss": -12.330110549926758, "global_step": 472115, "epoch": 2810} {"train_loss": -12.29779052734375, "global_step": 472116, "epoch": 2810} {"train_loss": -11.952838897705078, "global_step": 472117, "epoch": 2810} {"train_loss": -12.386303901672363, "global_step": 472118, "epoch": 2810} {"train_loss": -12.294646263122559, "global_step": 472119, "epoch": 2810} {"train_loss": -12.405357360839844, "global_step": 472120, "epoch": 2810} {"train_loss": -12.102265357971191, "global_step": 472121, "epoch": 2810} {"train_loss": -12.130109786987305, "global_step": 472122, "epoch": 2810} {"train_loss": -12.256753921508789, "global_step": 472123, "epoch": 2810} {"train_loss": -12.495269775390625, "global_step": 472124, "epoch": 2810} {"train_loss": -12.494805335998535, "global_step": 472125, "epoch": 2810} {"train_loss": -12.5792818069458, "global_step": 472126, "epoch": 2810} {"train_loss": -12.269038200378418, "global_step": 472127, "epoch": 2810} {"train_loss": -12.387028694152832, "global_step": 472128, "epoch": 2810} {"train_loss": -12.466458320617676, "global_step": 472129, "epoch": 2810} {"train_loss": -12.296250343322754, "global_step": 472130, "epoch": 2810} {"train_loss": -12.310684204101562, "global_step": 472131, "epoch": 2810} {"train_loss": -12.609230041503906, "global_step": 472132, "epoch": 2810} {"train_loss": -12.375240325927734, "global_step": 472133, "epoch": 2810} {"train_loss": -12.469770431518555, "global_step": 472134, "epoch": 2810} {"train_loss": -12.417908668518066, "global_step": 472135, "epoch": 2810} {"train_loss": -12.725688934326172, "global_step": 472136, "epoch": 2810} {"train_loss": -12.665422439575195, "global_step": 472137, "epoch": 2810} {"train_loss": -12.771763801574707, "global_step": 472138, "epoch": 2810} {"train_loss": -12.634143829345703, "global_step": 472139, "epoch": 2810} {"train_loss": -12.425426483154297, "global_step": 472140, "epoch": 2810} {"train_loss": -12.589324951171875, "global_step": 472141, "epoch": 2810} {"train_loss": -12.568254470825195, "global_step": 472142, "epoch": 2810} {"train_loss": -12.63615608215332, "global_step": 472143, "epoch": 2810} {"train_loss": -12.635984420776367, "global_step": 472144, "epoch": 2810} {"train_loss": -12.56724739074707, "global_step": 472145, "epoch": 2810} {"train_loss": -12.589396476745605, "global_step": 472146, "epoch": 2810} {"train_loss": -12.603019714355469, "global_step": 472147, "epoch": 2810} {"train_loss": -12.554922103881836, "global_step": 472148, "epoch": 2810} {"train_loss": -12.673601150512695, "global_step": 472149, "epoch": 2810} {"train_loss": -12.519648551940918, "global_step": 472150, "epoch": 2810} {"train_loss": -12.388225555419922, "global_step": 472151, "epoch": 2810} {"train_loss": -12.575359344482422, "global_step": 472152, "epoch": 2810} {"train_loss": -12.64925765991211, "global_step": 472153, "epoch": 2810} {"train_loss": -12.637449264526367, "global_step": 472154, "epoch": 2810} {"train_loss": -12.753551483154297, "global_step": 472155, "epoch": 2810} {"train_loss": -12.802634239196777, "global_step": 472156, "epoch": 2810} {"train_loss": -12.6532564163208, "global_step": 472157, "epoch": 2810} {"train_loss": -12.779254913330078, "global_step": 472158, "epoch": 2810} {"train_loss": -12.543601989746094, "global_step": 472159, "epoch": 2810} {"train_loss": -12.624523162841797, "global_step": 472160, "epoch": 2810} {"train_loss": -12.800949096679688, "global_step": 472161, "epoch": 2810} {"train_loss": -12.616151809692383, "global_step": 472162, "epoch": 2810} {"train_loss": -12.7400541305542, "global_step": 472163, "epoch": 2810} {"train_loss": -12.648492813110352, "global_step": 472164, "epoch": 2810} {"train_loss": -12.595701217651367, "global_step": 472165, "epoch": 2810} {"train_loss": -12.721362113952637, "global_step": 472166, "epoch": 2810} {"train_loss": -12.733968734741211, "global_step": 472167, "epoch": 2810} {"train_loss": -12.874723434448242, "global_step": 472168, "epoch": 2810} {"train_loss": -12.698297500610352, "global_step": 472169, "epoch": 2810} {"train_loss": -12.663812637329102, "global_step": 472170, "epoch": 2810} {"train_loss": -12.791351318359375, "global_step": 472171, "epoch": 2810} {"train_loss": -12.971115112304688, "global_step": 472172, "epoch": 2810} {"train_loss": -12.591106414794922, "global_step": 472173, "epoch": 2810} {"train_loss": -12.993611335754395, "global_step": 472174, "epoch": 2810} {"train_loss": -12.517227172851562, "global_step": 472175, "epoch": 2810} {"train_loss": -12.801593780517578, "global_step": 472176, "epoch": 2810} {"train_loss": -12.811470031738281, "global_step": 472177, "epoch": 2810} {"train_loss": -12.492208480834961, "global_step": 472178, "epoch": 2810} {"train_loss": -12.932955741882324, "global_step": 472179, "epoch": 2810} {"train_loss": -12.53919792175293, "global_step": 472180, "epoch": 2810} {"train_loss": -12.59447956085205, "global_step": 472181, "epoch": 2810} {"train_loss": -12.795492172241211, "global_step": 472182, "epoch": 2810} {"train_loss": -12.491775512695312, "global_step": 472183, "epoch": 2810} {"train_loss": -12.830901145935059, "global_step": 472184, "epoch": 2810} {"train_loss": -13.16289234161377, "global_step": 472185, "epoch": 2810} {"train_loss": -12.85263442993164, "global_step": 472186, "epoch": 2810} {"train_loss": -12.954829216003418, "global_step": 472187, "epoch": 2810} {"train_loss": -12.629512786865234, "global_step": 472188, "epoch": 2810} {"train_loss": -12.523513793945312, "global_step": 472189, "epoch": 2810} {"train_loss": -12.947346687316895, "global_step": 472190, "epoch": 2810} {"train_loss": -12.676485061645508, "global_step": 472191, "epoch": 2810} {"train_loss": -12.511251449584961, "global_step": 472192, "epoch": 2810} {"train_loss": -12.866094589233398, "global_step": 472193, "epoch": 2810} {"train_loss": -12.816591262817383, "global_step": 472194, "epoch": 2810} {"train_loss": -12.785524368286133, "global_step": 472195, "epoch": 2810} {"train_loss": -12.68439769744873, "global_step": 472196, "epoch": 2810} {"train_loss": -12.610538482666016, "global_step": 472197, "epoch": 2810} {"train_loss": -12.883310317993164, "global_step": 472198, "epoch": 2810} {"train_loss": -12.724557876586914, "global_step": 472199, "epoch": 2810} {"train_loss": -12.847405433654785, "global_step": 472200, "epoch": 2810} {"train_loss": -12.835323333740234, "global_step": 472201, "epoch": 2810} {"train_loss": -12.571605682373047, "global_step": 472202, "epoch": 2810} {"train_loss": -12.905631065368652, "global_step": 472203, "epoch": 2810} {"train_loss": -12.70149040222168, "global_step": 472204, "epoch": 2810} {"train_loss": -12.896194458007812, "global_step": 472205, "epoch": 2810} {"train_loss": -12.600975036621094, "global_step": 472206, "epoch": 2810} {"train_loss": -12.407733917236328, "global_step": 472207, "epoch": 2810} {"train_loss": -12.647136688232422, "global_step": 472208, "epoch": 2810} {"train_loss": -12.767621040344238, "global_step": 472209, "epoch": 2810} {"train_loss": -12.604378700256348, "global_step": 472210, "epoch": 2810} {"train_loss": -12.725872039794922, "global_step": 472211, "epoch": 2810} {"train_loss": -12.479541778564453, "global_step": 472212, "epoch": 2810} {"train_loss": -12.656009674072266, "global_step": 472213, "epoch": 2810} {"train_loss": -12.52979850769043, "global_step": 472214, "epoch": 2810} {"train_loss": -12.779443740844727, "global_step": 472215, "epoch": 2810} {"train_loss": -12.42870044708252, "global_step": 472216, "epoch": 2810} {"train_loss": -11.97611141204834, "global_step": 472217, "epoch": 2810} {"train_loss": -12.46346664428711, "global_step": 472218, "epoch": 2810} {"train_loss": -12.323990821838379, "global_step": 472219, "epoch": 2810} {"train_loss": -12.699296951293945, "global_step": 472220, "epoch": 2810} {"train_loss": -12.896319389343262, "global_step": 472221, "epoch": 2810} {"train_loss": -12.060498237609863, "global_step": 472222, "epoch": 2810} {"train_loss": -11.618450164794922, "global_step": 472223, "epoch": 2810} {"train_loss": -11.360544204711914, "global_step": 472224, "epoch": 2810} {"train_loss": -12.080198287963867, "global_step": 472225, "epoch": 2810} {"train_loss": -10.652984619140625, "global_step": 472226, "epoch": 2810} {"train_loss": -11.064966201782227, "global_step": 472227, "epoch": 2810} {"train_loss": -12.364316940307617, "global_step": 472228, "epoch": 2810} {"train_loss": -9.754457473754883, "global_step": 472229, "epoch": 2810} {"train_loss": -10.328214645385742, "global_step": 472230, "epoch": 2810} {"train_loss": -11.545585632324219, "global_step": 472231, "epoch": 2810} {"train_loss": -9.385443687438965, "global_step": 472232, "epoch": 2810} {"train_loss": -11.344921112060547, "global_step": 472233, "epoch": 2810} {"train_loss": -4.8040900230407715, "global_step": 472234, "epoch": 2810} {"train_loss": -8.39334487915039, "global_step": 472235, "epoch": 2810} {"train_loss": -6.042411804199219, "global_step": 472236, "epoch": 2810} {"train_loss": -6.739373207092285, "global_step": 472237, "epoch": 2810} {"train_loss": -7.397830009460449, "global_step": 472238, "epoch": 2810} {"train_loss": -7.373580455780029, "global_step": 472239, "epoch": 2810} {"train_loss": -7.244668006896973, "global_step": 472240, "epoch": 2810} {"train_loss": -6.949367523193359, "global_step": 472241, "epoch": 2810} {"train_loss": -6.956526756286621, "global_step": 472242, "epoch": 2810} {"train_loss": -7.249295234680176, "global_step": 472243, "epoch": 2810} {"train_loss": -8.279684066772461, "global_step": 472244, "epoch": 2810} {"train_loss": -8.981618881225586, "global_step": 472245, "epoch": 2810} {"train_loss": -8.809480667114258, "global_step": 472246, "epoch": 2810} {"train_loss": -11.876595457394918, "global_step": 472247, "epoch": 2810, "val_loss": 311020.6875, "train_action_mse_error": 2.32718563079834} {"train_loss": -9.28706169128418, "global_step": 472248, "epoch": 2811} {"train_loss": -9.67662239074707, "global_step": 472249, "epoch": 2811} {"train_loss": -10.473776817321777, "global_step": 472250, "epoch": 2811} {"train_loss": -10.497359275817871, "global_step": 472251, "epoch": 2811} {"train_loss": -10.590896606445312, "global_step": 472252, "epoch": 2811} {"train_loss": -10.356491088867188, "global_step": 472253, "epoch": 2811} {"train_loss": -10.542102813720703, "global_step": 472254, "epoch": 2811} {"train_loss": -11.091360092163086, "global_step": 472255, "epoch": 2811} {"train_loss": -9.922264099121094, "global_step": 472256, "epoch": 2811} {"train_loss": -10.850118637084961, "global_step": 472257, "epoch": 2811} {"train_loss": -10.951018333435059, "global_step": 472258, "epoch": 2811} {"train_loss": -11.47604751586914, "global_step": 472259, "epoch": 2811} {"train_loss": -11.619463920593262, "global_step": 472260, "epoch": 2811} {"train_loss": -10.70843505859375, "global_step": 472261, "epoch": 2811} {"train_loss": -11.045631408691406, "global_step": 472262, "epoch": 2811} {"train_loss": -11.323086738586426, "global_step": 472263, "epoch": 2811} {"train_loss": -11.173048973083496, "global_step": 472264, "epoch": 2811} {"train_loss": -11.29258918762207, "global_step": 472265, "epoch": 2811} {"train_loss": -11.400784492492676, "global_step": 472266, "epoch": 2811} {"train_loss": -10.997133255004883, "global_step": 472267, "epoch": 2811} {"train_loss": -11.345120429992676, "global_step": 472268, "epoch": 2811} {"train_loss": -11.101762771606445, "global_step": 472269, "epoch": 2811} {"train_loss": -11.52036190032959, "global_step": 472270, "epoch": 2811} {"train_loss": -11.282058715820312, "global_step": 472271, "epoch": 2811} {"train_loss": -12.022359848022461, "global_step": 472272, "epoch": 2811} {"train_loss": -11.435813903808594, "global_step": 472273, "epoch": 2811} {"train_loss": -12.17873764038086, "global_step": 472274, "epoch": 2811} {"train_loss": -11.74150562286377, "global_step": 472275, "epoch": 2811} {"train_loss": -11.79530143737793, "global_step": 472276, "epoch": 2811} {"train_loss": -12.215487480163574, "global_step": 472277, "epoch": 2811} {"train_loss": -11.605186462402344, "global_step": 472278, "epoch": 2811} {"train_loss": -12.242643356323242, "global_step": 472279, "epoch": 2811} {"train_loss": -11.871930122375488, "global_step": 472280, "epoch": 2811} {"train_loss": -11.597219467163086, "global_step": 472281, "epoch": 2811} {"train_loss": -11.800117492675781, "global_step": 472282, "epoch": 2811} {"train_loss": -12.100127220153809, "global_step": 472283, "epoch": 2811} {"train_loss": -11.911582946777344, "global_step": 472284, "epoch": 2811} {"train_loss": -12.230796813964844, "global_step": 472285, "epoch": 2811} {"train_loss": -11.498208999633789, "global_step": 472286, "epoch": 2811} {"train_loss": -12.378667831420898, "global_step": 472287, "epoch": 2811} {"train_loss": -11.688331604003906, "global_step": 472288, "epoch": 2811} {"train_loss": -11.843226432800293, "global_step": 472289, "epoch": 2811} {"train_loss": -11.393346786499023, "global_step": 472290, "epoch": 2811} {"train_loss": -12.124073028564453, "global_step": 472291, "epoch": 2811} {"train_loss": -12.127610206604004, "global_step": 472292, "epoch": 2811} {"train_loss": -12.061697959899902, "global_step": 472293, "epoch": 2811} {"train_loss": -12.001569747924805, "global_step": 472294, "epoch": 2811} {"train_loss": -12.272486686706543, "global_step": 472295, "epoch": 2811} {"train_loss": -11.810531616210938, "global_step": 472296, "epoch": 2811} {"train_loss": -12.025543212890625, "global_step": 472297, "epoch": 2811} {"train_loss": -11.889483451843262, "global_step": 472298, "epoch": 2811} {"train_loss": -12.398964881896973, "global_step": 472299, "epoch": 2811} {"train_loss": -12.039369583129883, "global_step": 472300, "epoch": 2811} {"train_loss": -12.433366775512695, "global_step": 472301, "epoch": 2811} {"train_loss": -12.156993865966797, "global_step": 472302, "epoch": 2811} {"train_loss": -12.443716049194336, "global_step": 472303, "epoch": 2811} {"train_loss": -12.375057220458984, "global_step": 472304, "epoch": 2811} {"train_loss": -12.43062973022461, "global_step": 472305, "epoch": 2811} {"train_loss": -12.49852466583252, "global_step": 472306, "epoch": 2811} {"train_loss": -12.395386695861816, "global_step": 472307, "epoch": 2811} {"train_loss": -12.485608100891113, "global_step": 472308, "epoch": 2811} {"train_loss": -12.64300537109375, "global_step": 472309, "epoch": 2811} {"train_loss": -12.508696556091309, "global_step": 472310, "epoch": 2811} {"train_loss": -12.431089401245117, "global_step": 472311, "epoch": 2811} {"train_loss": -12.659795761108398, "global_step": 472312, "epoch": 2811} {"train_loss": -12.38772201538086, "global_step": 472313, "epoch": 2811} {"train_loss": -12.672405242919922, "global_step": 472314, "epoch": 2811} {"train_loss": -12.396210670471191, "global_step": 472315, "epoch": 2811} {"train_loss": -12.548245429992676, "global_step": 472316, "epoch": 2811} {"train_loss": -12.522573471069336, "global_step": 472317, "epoch": 2811} {"train_loss": -12.41496753692627, "global_step": 472318, "epoch": 2811} {"train_loss": -12.401869773864746, "global_step": 472319, "epoch": 2811} {"train_loss": -12.329971313476562, "global_step": 472320, "epoch": 2811} {"train_loss": -12.683154106140137, "global_step": 472321, "epoch": 2811} {"train_loss": -12.456504821777344, "global_step": 472322, "epoch": 2811} {"train_loss": -12.250093460083008, "global_step": 472323, "epoch": 2811} {"train_loss": -12.540517807006836, "global_step": 472324, "epoch": 2811} {"train_loss": -12.312675476074219, "global_step": 472325, "epoch": 2811} {"train_loss": -12.104019165039062, "global_step": 472326, "epoch": 2811} {"train_loss": -12.608346939086914, "global_step": 472327, "epoch": 2811} {"train_loss": -12.120576858520508, "global_step": 472328, "epoch": 2811} {"train_loss": -12.623004913330078, "global_step": 472329, "epoch": 2811} {"train_loss": -12.39512825012207, "global_step": 472330, "epoch": 2811} {"train_loss": -12.40643310546875, "global_step": 472331, "epoch": 2811} {"train_loss": -12.2823486328125, "global_step": 472332, "epoch": 2811} {"train_loss": -12.261592864990234, "global_step": 472333, "epoch": 2811} {"train_loss": -12.250978469848633, "global_step": 472334, "epoch": 2811} {"train_loss": -12.236896514892578, "global_step": 472335, "epoch": 2811} {"train_loss": -11.693338394165039, "global_step": 472336, "epoch": 2811} {"train_loss": -12.38055419921875, "global_step": 472337, "epoch": 2811} {"train_loss": -11.956092834472656, "global_step": 472338, "epoch": 2811} {"train_loss": -12.32963752746582, "global_step": 472339, "epoch": 2811} {"train_loss": -12.331878662109375, "global_step": 472340, "epoch": 2811} {"train_loss": -11.685224533081055, "global_step": 472341, "epoch": 2811} {"train_loss": -12.339710235595703, "global_step": 472342, "epoch": 2811} {"train_loss": -12.462703704833984, "global_step": 472343, "epoch": 2811} {"train_loss": -12.39933967590332, "global_step": 472344, "epoch": 2811} {"train_loss": -12.693435668945312, "global_step": 472345, "epoch": 2811} {"train_loss": -12.525253295898438, "global_step": 472346, "epoch": 2811} {"train_loss": -12.647703170776367, "global_step": 472347, "epoch": 2811} {"train_loss": -12.390154838562012, "global_step": 472348, "epoch": 2811} {"train_loss": -12.417783737182617, "global_step": 472349, "epoch": 2811} {"train_loss": -12.53311538696289, "global_step": 472350, "epoch": 2811} {"train_loss": -11.704927444458008, "global_step": 472351, "epoch": 2811} {"train_loss": -12.43634033203125, "global_step": 472352, "epoch": 2811} {"train_loss": -12.37014389038086, "global_step": 472353, "epoch": 2811} {"train_loss": -12.617685317993164, "global_step": 472354, "epoch": 2811} {"train_loss": -12.661423683166504, "global_step": 472355, "epoch": 2811} {"train_loss": -12.737306594848633, "global_step": 472356, "epoch": 2811} {"train_loss": -12.793478965759277, "global_step": 472357, "epoch": 2811} {"train_loss": -12.778800010681152, "global_step": 472358, "epoch": 2811} {"train_loss": -12.590627670288086, "global_step": 472359, "epoch": 2811} {"train_loss": -12.81895923614502, "global_step": 472360, "epoch": 2811} {"train_loss": -12.886139869689941, "global_step": 472361, "epoch": 2811} {"train_loss": -12.665454864501953, "global_step": 472362, "epoch": 2811} {"train_loss": -12.618566513061523, "global_step": 472363, "epoch": 2811} {"train_loss": -12.646062850952148, "global_step": 472364, "epoch": 2811} {"train_loss": -12.64628791809082, "global_step": 472365, "epoch": 2811} {"train_loss": -12.672155380249023, "global_step": 472366, "epoch": 2811} {"train_loss": -12.578337669372559, "global_step": 472367, "epoch": 2811} {"train_loss": -12.841501235961914, "global_step": 472368, "epoch": 2811} {"train_loss": -12.658063888549805, "global_step": 472369, "epoch": 2811} {"train_loss": -12.7994384765625, "global_step": 472370, "epoch": 2811} {"train_loss": -12.69898509979248, "global_step": 472371, "epoch": 2811} {"train_loss": -12.60746955871582, "global_step": 472372, "epoch": 2811} {"train_loss": -12.855620384216309, "global_step": 472373, "epoch": 2811} {"train_loss": -12.773006439208984, "global_step": 472374, "epoch": 2811} {"train_loss": -12.73337459564209, "global_step": 472375, "epoch": 2811} {"train_loss": -12.916117668151855, "global_step": 472376, "epoch": 2811} {"train_loss": -12.774211883544922, "global_step": 472377, "epoch": 2811} {"train_loss": -12.766417503356934, "global_step": 472378, "epoch": 2811} {"train_loss": -12.725320816040039, "global_step": 472379, "epoch": 2811} {"train_loss": -12.709531784057617, "global_step": 472380, "epoch": 2811} {"train_loss": -12.874725341796875, "global_step": 472381, "epoch": 2811} {"train_loss": -12.718469619750977, "global_step": 472382, "epoch": 2811} {"train_loss": -12.816368103027344, "global_step": 472383, "epoch": 2811} {"train_loss": -12.908224105834961, "global_step": 472384, "epoch": 2811} {"train_loss": -12.765496253967285, "global_step": 472385, "epoch": 2811} {"train_loss": -12.919576644897461, "global_step": 472386, "epoch": 2811} {"train_loss": -12.91048526763916, "global_step": 472387, "epoch": 2811} {"train_loss": -12.699053764343262, "global_step": 472388, "epoch": 2811} {"train_loss": -12.851630210876465, "global_step": 472389, "epoch": 2811} {"train_loss": -12.910112380981445, "global_step": 472390, "epoch": 2811} {"train_loss": -12.833919525146484, "global_step": 472391, "epoch": 2811} {"train_loss": -12.927986145019531, "global_step": 472392, "epoch": 2811} {"train_loss": -12.920694351196289, "global_step": 472393, "epoch": 2811} {"train_loss": -13.002718925476074, "global_step": 472394, "epoch": 2811} {"train_loss": -13.052162170410156, "global_step": 472395, "epoch": 2811} {"train_loss": -12.762228012084961, "global_step": 472396, "epoch": 2811} {"train_loss": -12.783685684204102, "global_step": 472397, "epoch": 2811} {"train_loss": -12.866523742675781, "global_step": 472398, "epoch": 2811} {"train_loss": -12.989265441894531, "global_step": 472399, "epoch": 2811} {"train_loss": -12.887105941772461, "global_step": 472400, "epoch": 2811} {"train_loss": -13.021740913391113, "global_step": 472401, "epoch": 2811} {"train_loss": -12.877704620361328, "global_step": 472402, "epoch": 2811} {"train_loss": -12.722211837768555, "global_step": 472403, "epoch": 2811} {"train_loss": -12.796104431152344, "global_step": 472404, "epoch": 2811} {"train_loss": -12.770915985107422, "global_step": 472405, "epoch": 2811} {"train_loss": -12.185476303100586, "global_step": 472406, "epoch": 2811} {"train_loss": -13.052694320678711, "global_step": 472407, "epoch": 2811} {"train_loss": -12.658370971679688, "global_step": 472408, "epoch": 2811} {"train_loss": -12.360782623291016, "global_step": 472409, "epoch": 2811} {"train_loss": -12.668710708618164, "global_step": 472410, "epoch": 2811} {"train_loss": -12.419740676879883, "global_step": 472411, "epoch": 2811} {"train_loss": -12.385177612304688, "global_step": 472412, "epoch": 2811} {"train_loss": -12.503178596496582, "global_step": 472413, "epoch": 2811} {"train_loss": -12.934820175170898, "global_step": 472414, "epoch": 2811} {"train_loss": -12.224923792339506, "global_step": 472415, "epoch": 2811, "val_loss": 312835.96875} {"train_loss": -12.50214958190918, "global_step": 472416, "epoch": 2812} {"train_loss": -12.84328842163086, "global_step": 472417, "epoch": 2812} {"train_loss": -12.638379096984863, "global_step": 472418, "epoch": 2812} {"train_loss": -12.614439010620117, "global_step": 472419, "epoch": 2812} {"train_loss": -12.647537231445312, "global_step": 472420, "epoch": 2812} {"train_loss": -12.687311172485352, "global_step": 472421, "epoch": 2812} {"train_loss": -12.505767822265625, "global_step": 472422, "epoch": 2812} {"train_loss": -12.398331642150879, "global_step": 472423, "epoch": 2812} {"train_loss": -11.799853324890137, "global_step": 472424, "epoch": 2812} {"train_loss": -12.07186508178711, "global_step": 472425, "epoch": 2812} {"train_loss": -11.438289642333984, "global_step": 472426, "epoch": 2812} {"train_loss": -10.604772567749023, "global_step": 472427, "epoch": 2812} {"train_loss": -12.245805740356445, "global_step": 472428, "epoch": 2812} {"train_loss": -10.77486801147461, "global_step": 472429, "epoch": 2812} {"train_loss": -11.193055152893066, "global_step": 472430, "epoch": 2812} {"train_loss": -10.767823219299316, "global_step": 472431, "epoch": 2812} {"train_loss": -12.054426193237305, "global_step": 472432, "epoch": 2812} {"train_loss": -10.970298767089844, "global_step": 472433, "epoch": 2812} {"train_loss": -11.1864652633667, "global_step": 472434, "epoch": 2812} {"train_loss": -11.417379379272461, "global_step": 472435, "epoch": 2812} {"train_loss": -11.338407516479492, "global_step": 472436, "epoch": 2812} {"train_loss": -11.426839828491211, "global_step": 472437, "epoch": 2812} {"train_loss": -11.261109352111816, "global_step": 472438, "epoch": 2812} {"train_loss": -12.361629486083984, "global_step": 472439, "epoch": 2812} {"train_loss": -10.921890258789062, "global_step": 472440, "epoch": 2812} {"train_loss": -11.313488006591797, "global_step": 472441, "epoch": 2812} {"train_loss": -11.704059600830078, "global_step": 472442, "epoch": 2812} {"train_loss": -11.48297119140625, "global_step": 472443, "epoch": 2812} {"train_loss": -12.170955657958984, "global_step": 472444, "epoch": 2812} {"train_loss": -10.145484924316406, "global_step": 472445, "epoch": 2812} {"train_loss": -10.656637191772461, "global_step": 472446, "epoch": 2812} {"train_loss": -10.231807708740234, "global_step": 472447, "epoch": 2812} {"train_loss": -11.507080078125, "global_step": 472448, "epoch": 2812} {"train_loss": -10.80329704284668, "global_step": 472449, "epoch": 2812} {"train_loss": -11.764248847961426, "global_step": 472450, "epoch": 2812} {"train_loss": -9.89805793762207, "global_step": 472451, "epoch": 2812} {"train_loss": -10.886966705322266, "global_step": 472452, "epoch": 2812} {"train_loss": -11.768924713134766, "global_step": 472453, "epoch": 2812} {"train_loss": -10.81804370880127, "global_step": 472454, "epoch": 2812} {"train_loss": -11.59447193145752, "global_step": 472455, "epoch": 2812} {"train_loss": -11.200919151306152, "global_step": 472456, "epoch": 2812} {"train_loss": -11.37852668762207, "global_step": 472457, "epoch": 2812} {"train_loss": -11.964807510375977, "global_step": 472458, "epoch": 2812} {"train_loss": -11.247859001159668, "global_step": 472459, "epoch": 2812} {"train_loss": -12.023592948913574, "global_step": 472460, "epoch": 2812} {"train_loss": -11.373842239379883, "global_step": 472461, "epoch": 2812} {"train_loss": -12.322856903076172, "global_step": 472462, "epoch": 2812} {"train_loss": -11.620823860168457, "global_step": 472463, "epoch": 2812} {"train_loss": -11.508734703063965, "global_step": 472464, "epoch": 2812} {"train_loss": -12.147737503051758, "global_step": 472465, "epoch": 2812} {"train_loss": -11.456226348876953, "global_step": 472466, "epoch": 2812} {"train_loss": -12.25552749633789, "global_step": 472467, "epoch": 2812} {"train_loss": -11.882745742797852, "global_step": 472468, "epoch": 2812} {"train_loss": -11.822795867919922, "global_step": 472469, "epoch": 2812} {"train_loss": -12.002115249633789, "global_step": 472470, "epoch": 2812} {"train_loss": -11.779928207397461, "global_step": 472471, "epoch": 2812} {"train_loss": -12.18471908569336, "global_step": 472472, "epoch": 2812} {"train_loss": -12.109831809997559, "global_step": 472473, "epoch": 2812} {"train_loss": -11.90229606628418, "global_step": 472474, "epoch": 2812} {"train_loss": -11.560468673706055, "global_step": 472475, "epoch": 2812} {"train_loss": -10.68678092956543, "global_step": 472476, "epoch": 2812} {"train_loss": -11.847556114196777, "global_step": 472477, "epoch": 2812} {"train_loss": -10.978906631469727, "global_step": 472478, "epoch": 2812} {"train_loss": -11.08458423614502, "global_step": 472479, "epoch": 2812} {"train_loss": -11.142190933227539, "global_step": 472480, "epoch": 2812} {"train_loss": -11.488448143005371, "global_step": 472481, "epoch": 2812} {"train_loss": -10.160398483276367, "global_step": 472482, "epoch": 2812} {"train_loss": -12.154715538024902, "global_step": 472483, "epoch": 2812} {"train_loss": -10.421239852905273, "global_step": 472484, "epoch": 2812} {"train_loss": -10.322609901428223, "global_step": 472485, "epoch": 2812} {"train_loss": -10.691469192504883, "global_step": 472486, "epoch": 2812} {"train_loss": -11.510530471801758, "global_step": 472487, "epoch": 2812} {"train_loss": -10.738737106323242, "global_step": 472488, "epoch": 2812} {"train_loss": -9.403465270996094, "global_step": 472489, "epoch": 2812} {"train_loss": -11.424200057983398, "global_step": 472490, "epoch": 2812} {"train_loss": -10.488483428955078, "global_step": 472491, "epoch": 2812} {"train_loss": -9.831731796264648, "global_step": 472492, "epoch": 2812} {"train_loss": -10.728635787963867, "global_step": 472493, "epoch": 2812} {"train_loss": -10.691666603088379, "global_step": 472494, "epoch": 2812} {"train_loss": -10.321481704711914, "global_step": 472495, "epoch": 2812} {"train_loss": -10.262588500976562, "global_step": 472496, "epoch": 2812} {"train_loss": -10.283284187316895, "global_step": 472497, "epoch": 2812} {"train_loss": -10.916988372802734, "global_step": 472498, "epoch": 2812} {"train_loss": -9.890870094299316, "global_step": 472499, "epoch": 2812} {"train_loss": -11.497536659240723, "global_step": 472500, "epoch": 2812} {"train_loss": -10.880526542663574, "global_step": 472501, "epoch": 2812} {"train_loss": -11.62365436553955, "global_step": 472502, "epoch": 2812} {"train_loss": -11.791950225830078, "global_step": 472503, "epoch": 2812} {"train_loss": -11.736648559570312, "global_step": 472504, "epoch": 2812} {"train_loss": -11.968528747558594, "global_step": 472505, "epoch": 2812} {"train_loss": -11.749963760375977, "global_step": 472506, "epoch": 2812} {"train_loss": -11.512463569641113, "global_step": 472507, "epoch": 2812} {"train_loss": -12.286285400390625, "global_step": 472508, "epoch": 2812} {"train_loss": -11.764793395996094, "global_step": 472509, "epoch": 2812} {"train_loss": -11.966264724731445, "global_step": 472510, "epoch": 2812} {"train_loss": -11.861343383789062, "global_step": 472511, "epoch": 2812} {"train_loss": -11.8037691116333, "global_step": 472512, "epoch": 2812} {"train_loss": -12.268190383911133, "global_step": 472513, "epoch": 2812} {"train_loss": -11.755303382873535, "global_step": 472514, "epoch": 2812} {"train_loss": -11.913626670837402, "global_step": 472515, "epoch": 2812} {"train_loss": -12.006842613220215, "global_step": 472516, "epoch": 2812} {"train_loss": -12.225658416748047, "global_step": 472517, "epoch": 2812} {"train_loss": -11.891814231872559, "global_step": 472518, "epoch": 2812} {"train_loss": -12.16727066040039, "global_step": 472519, "epoch": 2812} {"train_loss": -11.165735244750977, "global_step": 472520, "epoch": 2812} {"train_loss": -12.221410751342773, "global_step": 472521, "epoch": 2812} {"train_loss": -12.087532997131348, "global_step": 472522, "epoch": 2812} {"train_loss": -12.470674514770508, "global_step": 472523, "epoch": 2812} {"train_loss": -12.013082504272461, "global_step": 472524, "epoch": 2812} {"train_loss": -12.286209106445312, "global_step": 472525, "epoch": 2812} {"train_loss": -12.128633499145508, "global_step": 472526, "epoch": 2812} {"train_loss": -12.128393173217773, "global_step": 472527, "epoch": 2812} {"train_loss": -12.252401351928711, "global_step": 472528, "epoch": 2812} {"train_loss": -11.83355712890625, "global_step": 472529, "epoch": 2812} {"train_loss": -12.148000717163086, "global_step": 472530, "epoch": 2812} {"train_loss": -11.973684310913086, "global_step": 472531, "epoch": 2812} {"train_loss": -12.38349437713623, "global_step": 472532, "epoch": 2812} {"train_loss": -12.058632850646973, "global_step": 472533, "epoch": 2812} {"train_loss": -12.43923568725586, "global_step": 472534, "epoch": 2812} {"train_loss": -12.479039192199707, "global_step": 472535, "epoch": 2812} {"train_loss": -12.281793594360352, "global_step": 472536, "epoch": 2812} {"train_loss": -12.183835983276367, "global_step": 472537, "epoch": 2812} {"train_loss": -12.405241966247559, "global_step": 472538, "epoch": 2812} {"train_loss": -12.287824630737305, "global_step": 472539, "epoch": 2812} {"train_loss": -11.921128273010254, "global_step": 472540, "epoch": 2812} {"train_loss": -12.572124481201172, "global_step": 472541, "epoch": 2812} {"train_loss": -12.167976379394531, "global_step": 472542, "epoch": 2812} {"train_loss": -12.404312133789062, "global_step": 472543, "epoch": 2812} {"train_loss": -12.235956192016602, "global_step": 472544, "epoch": 2812} {"train_loss": -12.256084442138672, "global_step": 472545, "epoch": 2812} {"train_loss": -12.31978988647461, "global_step": 472546, "epoch": 2812} {"train_loss": -12.490233421325684, "global_step": 472547, "epoch": 2812} {"train_loss": -12.442554473876953, "global_step": 472548, "epoch": 2812} {"train_loss": -12.554828643798828, "global_step": 472549, "epoch": 2812} {"train_loss": -12.329801559448242, "global_step": 472550, "epoch": 2812} {"train_loss": -12.52505874633789, "global_step": 472551, "epoch": 2812} {"train_loss": -12.482327461242676, "global_step": 472552, "epoch": 2812} {"train_loss": -12.2512845993042, "global_step": 472553, "epoch": 2812} {"train_loss": -12.582611083984375, "global_step": 472554, "epoch": 2812} {"train_loss": -12.402257919311523, "global_step": 472555, "epoch": 2812} {"train_loss": -12.302726745605469, "global_step": 472556, "epoch": 2812} {"train_loss": -12.411312103271484, "global_step": 472557, "epoch": 2812} {"train_loss": -12.371782302856445, "global_step": 472558, "epoch": 2812} {"train_loss": -12.368083000183105, "global_step": 472559, "epoch": 2812} {"train_loss": -12.666362762451172, "global_step": 472560, "epoch": 2812} {"train_loss": -12.588603019714355, "global_step": 472561, "epoch": 2812} {"train_loss": -12.41441535949707, "global_step": 472562, "epoch": 2812} {"train_loss": -12.388967514038086, "global_step": 472563, "epoch": 2812} {"train_loss": -12.671615600585938, "global_step": 472564, "epoch": 2812} {"train_loss": -12.750847816467285, "global_step": 472565, "epoch": 2812} {"train_loss": -12.723993301391602, "global_step": 472566, "epoch": 2812} {"train_loss": -12.437450408935547, "global_step": 472567, "epoch": 2812} {"train_loss": -12.684255599975586, "global_step": 472568, "epoch": 2812} {"train_loss": -12.555606842041016, "global_step": 472569, "epoch": 2812} {"train_loss": -12.726322174072266, "global_step": 472570, "epoch": 2812} {"train_loss": -12.665128707885742, "global_step": 472571, "epoch": 2812} {"train_loss": -12.677881240844727, "global_step": 472572, "epoch": 2812} {"train_loss": -12.822259902954102, "global_step": 472573, "epoch": 2812} {"train_loss": -12.71497917175293, "global_step": 472574, "epoch": 2812} {"train_loss": -12.617720603942871, "global_step": 472575, "epoch": 2812} {"train_loss": -12.630664825439453, "global_step": 472576, "epoch": 2812} {"train_loss": -12.873215675354004, "global_step": 472577, "epoch": 2812} {"train_loss": -12.699441909790039, "global_step": 472578, "epoch": 2812} {"train_loss": -12.633049011230469, "global_step": 472579, "epoch": 2812} {"train_loss": -12.766026496887207, "global_step": 472580, "epoch": 2812} {"train_loss": -12.807632446289062, "global_step": 472581, "epoch": 2812} {"train_loss": -12.869730949401855, "global_step": 472582, "epoch": 2812} {"train_loss": -11.820431158656167, "global_step": 472583, "epoch": 2812, "val_loss": 318069.125} {"train_loss": -12.844388961791992, "global_step": 472584, "epoch": 2813} {"train_loss": -12.757906913757324, "global_step": 472585, "epoch": 2813} {"train_loss": -12.52001667022705, "global_step": 472586, "epoch": 2813} {"train_loss": -12.746953964233398, "global_step": 472587, "epoch": 2813} {"train_loss": -12.557806015014648, "global_step": 472588, "epoch": 2813} {"train_loss": -12.408557891845703, "global_step": 472589, "epoch": 2813} {"train_loss": -12.7310791015625, "global_step": 472590, "epoch": 2813} {"train_loss": -12.359391212463379, "global_step": 472591, "epoch": 2813} {"train_loss": -12.679529190063477, "global_step": 472592, "epoch": 2813} {"train_loss": -12.391813278198242, "global_step": 472593, "epoch": 2813} {"train_loss": -12.34927749633789, "global_step": 472594, "epoch": 2813} {"train_loss": -12.702861785888672, "global_step": 472595, "epoch": 2813} {"train_loss": -12.364699363708496, "global_step": 472596, "epoch": 2813} {"train_loss": -12.879690170288086, "global_step": 472597, "epoch": 2813} {"train_loss": -12.503768920898438, "global_step": 472598, "epoch": 2813} {"train_loss": -12.722644805908203, "global_step": 472599, "epoch": 2813} {"train_loss": -12.490038871765137, "global_step": 472600, "epoch": 2813} {"train_loss": -12.407632827758789, "global_step": 472601, "epoch": 2813} {"train_loss": -12.728967666625977, "global_step": 472602, "epoch": 2813} {"train_loss": -12.846395492553711, "global_step": 472603, "epoch": 2813} {"train_loss": -12.885271072387695, "global_step": 472604, "epoch": 2813} {"train_loss": -12.740555763244629, "global_step": 472605, "epoch": 2813} {"train_loss": -12.772746086120605, "global_step": 472606, "epoch": 2813} {"train_loss": -12.868406295776367, "global_step": 472607, "epoch": 2813} {"train_loss": -12.894298553466797, "global_step": 472608, "epoch": 2813} {"train_loss": -12.480804443359375, "global_step": 472609, "epoch": 2813} {"train_loss": -11.327142715454102, "global_step": 472610, "epoch": 2813} {"train_loss": -11.868707656860352, "global_step": 472611, "epoch": 2813} {"train_loss": -12.875158309936523, "global_step": 472612, "epoch": 2813} {"train_loss": -11.736361503601074, "global_step": 472613, "epoch": 2813} {"train_loss": -11.25547981262207, "global_step": 472614, "epoch": 2813} {"train_loss": -11.575928688049316, "global_step": 472615, "epoch": 2813} {"train_loss": -11.842630386352539, "global_step": 472616, "epoch": 2813} {"train_loss": -12.644514083862305, "global_step": 472617, "epoch": 2813} {"train_loss": -11.053081512451172, "global_step": 472618, "epoch": 2813} {"train_loss": -12.13149356842041, "global_step": 472619, "epoch": 2813} {"train_loss": -12.111612319946289, "global_step": 472620, "epoch": 2813} {"train_loss": -12.474984169006348, "global_step": 472621, "epoch": 2813} {"train_loss": -11.458629608154297, "global_step": 472622, "epoch": 2813} {"train_loss": -12.796480178833008, "global_step": 472623, "epoch": 2813} {"train_loss": -11.51591682434082, "global_step": 472624, "epoch": 2813} {"train_loss": -11.783141136169434, "global_step": 472625, "epoch": 2813} {"train_loss": -12.666199684143066, "global_step": 472626, "epoch": 2813} {"train_loss": -11.84666633605957, "global_step": 472627, "epoch": 2813} {"train_loss": -11.838180541992188, "global_step": 472628, "epoch": 2813} {"train_loss": -12.476072311401367, "global_step": 472629, "epoch": 2813} {"train_loss": -11.246988296508789, "global_step": 472630, "epoch": 2813} {"train_loss": -11.925457000732422, "global_step": 472631, "epoch": 2813} {"train_loss": -12.538209915161133, "global_step": 472632, "epoch": 2813} {"train_loss": -11.993337631225586, "global_step": 472633, "epoch": 2813} {"train_loss": -12.844690322875977, "global_step": 472634, "epoch": 2813} {"train_loss": -11.846242904663086, "global_step": 472635, "epoch": 2813} {"train_loss": -12.164896011352539, "global_step": 472636, "epoch": 2813} {"train_loss": -11.5956449508667, "global_step": 472637, "epoch": 2813} {"train_loss": -12.865351676940918, "global_step": 472638, "epoch": 2813} {"train_loss": -11.973443984985352, "global_step": 472639, "epoch": 2813} {"train_loss": -12.457673072814941, "global_step": 472640, "epoch": 2813} {"train_loss": -12.409928321838379, "global_step": 472641, "epoch": 2813} {"train_loss": -12.318199157714844, "global_step": 472642, "epoch": 2813} {"train_loss": -12.098859786987305, "global_step": 472643, "epoch": 2813} {"train_loss": -11.856870651245117, "global_step": 472644, "epoch": 2813} {"train_loss": -12.050453186035156, "global_step": 472645, "epoch": 2813} {"train_loss": -11.669930458068848, "global_step": 472646, "epoch": 2813} {"train_loss": -12.320377349853516, "global_step": 472647, "epoch": 2813} {"train_loss": -11.387228012084961, "global_step": 472648, "epoch": 2813} {"train_loss": -12.790119171142578, "global_step": 472649, "epoch": 2813} {"train_loss": -11.700623512268066, "global_step": 472650, "epoch": 2813} {"train_loss": -12.382795333862305, "global_step": 472651, "epoch": 2813} {"train_loss": -11.475190162658691, "global_step": 472652, "epoch": 2813} {"train_loss": -12.447288513183594, "global_step": 472653, "epoch": 2813} {"train_loss": -12.057280540466309, "global_step": 472654, "epoch": 2813} {"train_loss": -12.020967483520508, "global_step": 472655, "epoch": 2813} {"train_loss": -12.620189666748047, "global_step": 472656, "epoch": 2813} {"train_loss": -11.603409767150879, "global_step": 472657, "epoch": 2813} {"train_loss": -12.819219589233398, "global_step": 472658, "epoch": 2813} {"train_loss": -12.029525756835938, "global_step": 472659, "epoch": 2813} {"train_loss": -12.50827407836914, "global_step": 472660, "epoch": 2813} {"train_loss": -12.685285568237305, "global_step": 472661, "epoch": 2813} {"train_loss": -12.11379623413086, "global_step": 472662, "epoch": 2813} {"train_loss": -12.625753402709961, "global_step": 472663, "epoch": 2813} {"train_loss": -11.722444534301758, "global_step": 472664, "epoch": 2813} {"train_loss": -12.611895561218262, "global_step": 472665, "epoch": 2813} {"train_loss": -12.288656234741211, "global_step": 472666, "epoch": 2813} {"train_loss": -12.108043670654297, "global_step": 472667, "epoch": 2813} {"train_loss": -11.8787260055542, "global_step": 472668, "epoch": 2813} {"train_loss": -11.751408576965332, "global_step": 472669, "epoch": 2813} {"train_loss": -12.05984878540039, "global_step": 472670, "epoch": 2813} {"train_loss": -11.584285736083984, "global_step": 472671, "epoch": 2813} {"train_loss": -12.238252639770508, "global_step": 472672, "epoch": 2813} {"train_loss": -12.258403778076172, "global_step": 472673, "epoch": 2813} {"train_loss": -11.123625755310059, "global_step": 472674, "epoch": 2813} {"train_loss": -11.196019172668457, "global_step": 472675, "epoch": 2813} {"train_loss": -12.290872573852539, "global_step": 472676, "epoch": 2813} {"train_loss": -11.702817916870117, "global_step": 472677, "epoch": 2813} {"train_loss": -10.938192367553711, "global_step": 472678, "epoch": 2813} {"train_loss": -11.759838104248047, "global_step": 472679, "epoch": 2813} {"train_loss": -10.208345413208008, "global_step": 472680, "epoch": 2813} {"train_loss": -11.563525199890137, "global_step": 472681, "epoch": 2813} {"train_loss": -10.82009220123291, "global_step": 472682, "epoch": 2813} {"train_loss": -10.625690460205078, "global_step": 472683, "epoch": 2813} {"train_loss": -11.575091361999512, "global_step": 472684, "epoch": 2813} {"train_loss": -11.355079650878906, "global_step": 472685, "epoch": 2813} {"train_loss": -12.061482429504395, "global_step": 472686, "epoch": 2813} {"train_loss": -12.106855392456055, "global_step": 472687, "epoch": 2813} {"train_loss": -12.254655838012695, "global_step": 472688, "epoch": 2813} {"train_loss": -12.06941032409668, "global_step": 472689, "epoch": 2813} {"train_loss": -12.174483299255371, "global_step": 472690, "epoch": 2813} {"train_loss": -11.948652267456055, "global_step": 472691, "epoch": 2813} {"train_loss": -12.591690063476562, "global_step": 472692, "epoch": 2813} {"train_loss": -12.08302116394043, "global_step": 472693, "epoch": 2813} {"train_loss": -12.06325912475586, "global_step": 472694, "epoch": 2813} {"train_loss": -12.090662002563477, "global_step": 472695, "epoch": 2813} {"train_loss": -11.686798095703125, "global_step": 472696, "epoch": 2813} {"train_loss": -11.328607559204102, "global_step": 472697, "epoch": 2813} {"train_loss": -12.117177963256836, "global_step": 472698, "epoch": 2813} {"train_loss": -11.913604736328125, "global_step": 472699, "epoch": 2813} {"train_loss": -12.420341491699219, "global_step": 472700, "epoch": 2813} {"train_loss": -11.780378341674805, "global_step": 472701, "epoch": 2813} {"train_loss": -12.253166198730469, "global_step": 472702, "epoch": 2813} {"train_loss": -12.075057983398438, "global_step": 472703, "epoch": 2813} {"train_loss": -12.39608383178711, "global_step": 472704, "epoch": 2813} {"train_loss": -12.392799377441406, "global_step": 472705, "epoch": 2813} {"train_loss": -12.402735710144043, "global_step": 472706, "epoch": 2813} {"train_loss": -12.66388988494873, "global_step": 472707, "epoch": 2813} {"train_loss": -12.173891067504883, "global_step": 472708, "epoch": 2813} {"train_loss": -12.456960678100586, "global_step": 472709, "epoch": 2813} {"train_loss": -12.365575790405273, "global_step": 472710, "epoch": 2813} {"train_loss": -12.330408096313477, "global_step": 472711, "epoch": 2813} {"train_loss": -12.36165714263916, "global_step": 472712, "epoch": 2813} {"train_loss": -12.126764297485352, "global_step": 472713, "epoch": 2813} {"train_loss": -12.345136642456055, "global_step": 472714, "epoch": 2813} {"train_loss": -12.22315502166748, "global_step": 472715, "epoch": 2813} {"train_loss": -12.308987617492676, "global_step": 472716, "epoch": 2813} {"train_loss": -12.388965606689453, "global_step": 472717, "epoch": 2813} {"train_loss": -12.604742050170898, "global_step": 472718, "epoch": 2813} {"train_loss": -12.212356567382812, "global_step": 472719, "epoch": 2813} {"train_loss": -12.19835090637207, "global_step": 472720, "epoch": 2813} {"train_loss": -12.387531280517578, "global_step": 472721, "epoch": 2813} {"train_loss": -11.74951457977295, "global_step": 472722, "epoch": 2813} {"train_loss": -12.336673736572266, "global_step": 472723, "epoch": 2813} {"train_loss": -11.542407035827637, "global_step": 472724, "epoch": 2813} {"train_loss": -12.179911613464355, "global_step": 472725, "epoch": 2813} {"train_loss": -11.999629974365234, "global_step": 472726, "epoch": 2813} {"train_loss": -12.414040565490723, "global_step": 472727, "epoch": 2813} {"train_loss": -12.394359588623047, "global_step": 472728, "epoch": 2813} {"train_loss": -11.945405006408691, "global_step": 472729, "epoch": 2813} {"train_loss": -12.655356407165527, "global_step": 472730, "epoch": 2813} {"train_loss": -11.983417510986328, "global_step": 472731, "epoch": 2813} {"train_loss": -12.321247100830078, "global_step": 472732, "epoch": 2813} {"train_loss": -12.254880905151367, "global_step": 472733, "epoch": 2813} {"train_loss": -12.05789566040039, "global_step": 472734, "epoch": 2813} {"train_loss": -12.49616813659668, "global_step": 472735, "epoch": 2813} {"train_loss": -12.608091354370117, "global_step": 472736, "epoch": 2813} {"train_loss": -12.492573738098145, "global_step": 472737, "epoch": 2813} {"train_loss": -12.422639846801758, "global_step": 472738, "epoch": 2813} {"train_loss": -12.430213928222656, "global_step": 472739, "epoch": 2813} {"train_loss": -12.09554672241211, "global_step": 472740, "epoch": 2813} {"train_loss": -12.610432624816895, "global_step": 472741, "epoch": 2813} {"train_loss": -12.442975044250488, "global_step": 472742, "epoch": 2813} {"train_loss": -11.770711898803711, "global_step": 472743, "epoch": 2813} {"train_loss": -12.767913818359375, "global_step": 472744, "epoch": 2813} {"train_loss": -11.641433715820312, "global_step": 472745, "epoch": 2813} {"train_loss": -12.323278427124023, "global_step": 472746, "epoch": 2813} {"train_loss": -12.267589569091797, "global_step": 472747, "epoch": 2813} {"train_loss": -11.678655624389648, "global_step": 472748, "epoch": 2813} {"train_loss": -12.552916526794434, "global_step": 472749, "epoch": 2813} {"train_loss": -12.333356857299805, "global_step": 472750, "epoch": 2813} {"train_loss": -12.164938869930449, "global_step": 472751, "epoch": 2813, "val_loss": 317014.46875} {"train_loss": -12.111730575561523, "global_step": 472752, "epoch": 2814} {"train_loss": -12.356746673583984, "global_step": 472753, "epoch": 2814} {"train_loss": -12.054007530212402, "global_step": 472754, "epoch": 2814} {"train_loss": -12.564645767211914, "global_step": 472755, "epoch": 2814} {"train_loss": -12.442127227783203, "global_step": 472756, "epoch": 2814} {"train_loss": -12.197125434875488, "global_step": 472757, "epoch": 2814} {"train_loss": -12.581633567810059, "global_step": 472758, "epoch": 2814} {"train_loss": -12.103837966918945, "global_step": 472759, "epoch": 2814} {"train_loss": -12.543140411376953, "global_step": 472760, "epoch": 2814} {"train_loss": -11.47081184387207, "global_step": 472761, "epoch": 2814} {"train_loss": -12.11575698852539, "global_step": 472762, "epoch": 2814} {"train_loss": -12.5779447555542, "global_step": 472763, "epoch": 2814} {"train_loss": -11.42195987701416, "global_step": 472764, "epoch": 2814} {"train_loss": -12.22779369354248, "global_step": 472765, "epoch": 2814} {"train_loss": -11.892330169677734, "global_step": 472766, "epoch": 2814} {"train_loss": -11.860160827636719, "global_step": 472767, "epoch": 2814} {"train_loss": -12.613040924072266, "global_step": 472768, "epoch": 2814} {"train_loss": -12.319153785705566, "global_step": 472769, "epoch": 2814} {"train_loss": -12.546501159667969, "global_step": 472770, "epoch": 2814} {"train_loss": -12.477950096130371, "global_step": 472771, "epoch": 2814} {"train_loss": -12.501157760620117, "global_step": 472772, "epoch": 2814} {"train_loss": -12.290321350097656, "global_step": 472773, "epoch": 2814} {"train_loss": -12.62547492980957, "global_step": 472774, "epoch": 2814} {"train_loss": -12.52935791015625, "global_step": 472775, "epoch": 2814} {"train_loss": -12.296625137329102, "global_step": 472776, "epoch": 2814} {"train_loss": -12.594783782958984, "global_step": 472777, "epoch": 2814} {"train_loss": -11.98331069946289, "global_step": 472778, "epoch": 2814} {"train_loss": -12.330848693847656, "global_step": 472779, "epoch": 2814} {"train_loss": -12.466978073120117, "global_step": 472780, "epoch": 2814} {"train_loss": -12.43748664855957, "global_step": 472781, "epoch": 2814} {"train_loss": -11.917516708374023, "global_step": 472782, "epoch": 2814} {"train_loss": -12.077603340148926, "global_step": 472783, "epoch": 2814} {"train_loss": -12.230598449707031, "global_step": 472784, "epoch": 2814} {"train_loss": -11.887002944946289, "global_step": 472785, "epoch": 2814} {"train_loss": -12.252996444702148, "global_step": 472786, "epoch": 2814} {"train_loss": -12.247440338134766, "global_step": 472787, "epoch": 2814} {"train_loss": -12.509242057800293, "global_step": 472788, "epoch": 2814} {"train_loss": -11.797450065612793, "global_step": 472789, "epoch": 2814} {"train_loss": -12.545150756835938, "global_step": 472790, "epoch": 2814} {"train_loss": -11.876578330993652, "global_step": 472791, "epoch": 2814} {"train_loss": -12.419241905212402, "global_step": 472792, "epoch": 2814} {"train_loss": -12.091469764709473, "global_step": 472793, "epoch": 2814} {"train_loss": -12.395540237426758, "global_step": 472794, "epoch": 2814} {"train_loss": -12.344720840454102, "global_step": 472795, "epoch": 2814} {"train_loss": -11.495996475219727, "global_step": 472796, "epoch": 2814} {"train_loss": -12.630552291870117, "global_step": 472797, "epoch": 2814} {"train_loss": -11.422760963439941, "global_step": 472798, "epoch": 2814} {"train_loss": -12.688492774963379, "global_step": 472799, "epoch": 2814} {"train_loss": -11.978279113769531, "global_step": 472800, "epoch": 2814} {"train_loss": -12.170769691467285, "global_step": 472801, "epoch": 2814} {"train_loss": -12.394186973571777, "global_step": 472802, "epoch": 2814} {"train_loss": -12.52309799194336, "global_step": 472803, "epoch": 2814} {"train_loss": -12.329036712646484, "global_step": 472804, "epoch": 2814} {"train_loss": -12.345130920410156, "global_step": 472805, "epoch": 2814} {"train_loss": -12.567946434020996, "global_step": 472806, "epoch": 2814} {"train_loss": -12.317148208618164, "global_step": 472807, "epoch": 2814} {"train_loss": -12.790092468261719, "global_step": 472808, "epoch": 2814} {"train_loss": -12.638104438781738, "global_step": 472809, "epoch": 2814} {"train_loss": -12.432978630065918, "global_step": 472810, "epoch": 2814} {"train_loss": -12.69577407836914, "global_step": 472811, "epoch": 2814} {"train_loss": -12.510808944702148, "global_step": 472812, "epoch": 2814} {"train_loss": -12.761767387390137, "global_step": 472813, "epoch": 2814} {"train_loss": -12.566620826721191, "global_step": 472814, "epoch": 2814} {"train_loss": -12.618413925170898, "global_step": 472815, "epoch": 2814} {"train_loss": -12.485725402832031, "global_step": 472816, "epoch": 2814} {"train_loss": -12.538209915161133, "global_step": 472817, "epoch": 2814} {"train_loss": -12.56671142578125, "global_step": 472818, "epoch": 2814} {"train_loss": -12.836831092834473, "global_step": 472819, "epoch": 2814} {"train_loss": -12.362213134765625, "global_step": 472820, "epoch": 2814} {"train_loss": -12.773996353149414, "global_step": 472821, "epoch": 2814} {"train_loss": -12.646016120910645, "global_step": 472822, "epoch": 2814} {"train_loss": -12.720924377441406, "global_step": 472823, "epoch": 2814} {"train_loss": -12.336568832397461, "global_step": 472824, "epoch": 2814} {"train_loss": -12.70542049407959, "global_step": 472825, "epoch": 2814} {"train_loss": -12.604795455932617, "global_step": 472826, "epoch": 2814} {"train_loss": -12.765125274658203, "global_step": 472827, "epoch": 2814} {"train_loss": -12.737991333007812, "global_step": 472828, "epoch": 2814} {"train_loss": -12.805266380310059, "global_step": 472829, "epoch": 2814} {"train_loss": -12.62273120880127, "global_step": 472830, "epoch": 2814} {"train_loss": -12.754826545715332, "global_step": 472831, "epoch": 2814} {"train_loss": -12.213149070739746, "global_step": 472832, "epoch": 2814} {"train_loss": -12.762580871582031, "global_step": 472833, "epoch": 2814} {"train_loss": -12.735161781311035, "global_step": 472834, "epoch": 2814} {"train_loss": -12.685953140258789, "global_step": 472835, "epoch": 2814} {"train_loss": -12.890829086303711, "global_step": 472836, "epoch": 2814} {"train_loss": -12.502424240112305, "global_step": 472837, "epoch": 2814} {"train_loss": -12.70281982421875, "global_step": 472838, "epoch": 2814} {"train_loss": -12.685379028320312, "global_step": 472839, "epoch": 2814} {"train_loss": -12.705022811889648, "global_step": 472840, "epoch": 2814} {"train_loss": -12.437318801879883, "global_step": 472841, "epoch": 2814} {"train_loss": -12.552587509155273, "global_step": 472842, "epoch": 2814} {"train_loss": -12.451187133789062, "global_step": 472843, "epoch": 2814} {"train_loss": -12.825691223144531, "global_step": 472844, "epoch": 2814} {"train_loss": -12.394190788269043, "global_step": 472845, "epoch": 2814} {"train_loss": -12.639350891113281, "global_step": 472846, "epoch": 2814} {"train_loss": -12.19743537902832, "global_step": 472847, "epoch": 2814} {"train_loss": -12.936989784240723, "global_step": 472848, "epoch": 2814} {"train_loss": -12.318944931030273, "global_step": 472849, "epoch": 2814} {"train_loss": -12.66554069519043, "global_step": 472850, "epoch": 2814} {"train_loss": -12.41712760925293, "global_step": 472851, "epoch": 2814} {"train_loss": -12.372312545776367, "global_step": 472852, "epoch": 2814} {"train_loss": -12.556957244873047, "global_step": 472853, "epoch": 2814} {"train_loss": -12.609668731689453, "global_step": 472854, "epoch": 2814} {"train_loss": -12.377695083618164, "global_step": 472855, "epoch": 2814} {"train_loss": -11.887153625488281, "global_step": 472856, "epoch": 2814} {"train_loss": -10.751404762268066, "global_step": 472857, "epoch": 2814} {"train_loss": -11.023353576660156, "global_step": 472858, "epoch": 2814} {"train_loss": -11.640321731567383, "global_step": 472859, "epoch": 2814} {"train_loss": -9.98985481262207, "global_step": 472860, "epoch": 2814} {"train_loss": -11.883563995361328, "global_step": 472861, "epoch": 2814} {"train_loss": -11.032247543334961, "global_step": 472862, "epoch": 2814} {"train_loss": -12.071194648742676, "global_step": 472863, "epoch": 2814} {"train_loss": -11.742587089538574, "global_step": 472864, "epoch": 2814} {"train_loss": -11.684171676635742, "global_step": 472865, "epoch": 2814} {"train_loss": -11.135292053222656, "global_step": 472866, "epoch": 2814} {"train_loss": -10.980714797973633, "global_step": 472867, "epoch": 2814} {"train_loss": -11.682999610900879, "global_step": 472868, "epoch": 2814} {"train_loss": -11.192756652832031, "global_step": 472869, "epoch": 2814} {"train_loss": -11.668930053710938, "global_step": 472870, "epoch": 2814} {"train_loss": -11.547616004943848, "global_step": 472871, "epoch": 2814} {"train_loss": -10.427131652832031, "global_step": 472872, "epoch": 2814} {"train_loss": -11.346761703491211, "global_step": 472873, "epoch": 2814} {"train_loss": -10.770002365112305, "global_step": 472874, "epoch": 2814} {"train_loss": -11.44626522064209, "global_step": 472875, "epoch": 2814} {"train_loss": -10.866676330566406, "global_step": 472876, "epoch": 2814} {"train_loss": -10.997359275817871, "global_step": 472877, "epoch": 2814} {"train_loss": -11.168098449707031, "global_step": 472878, "epoch": 2814} {"train_loss": -10.768213272094727, "global_step": 472879, "epoch": 2814} {"train_loss": -10.464876174926758, "global_step": 472880, "epoch": 2814} {"train_loss": -11.607857704162598, "global_step": 472881, "epoch": 2814} {"train_loss": -10.871617317199707, "global_step": 472882, "epoch": 2814} {"train_loss": -9.44273567199707, "global_step": 472883, "epoch": 2814} {"train_loss": -11.672576904296875, "global_step": 472884, "epoch": 2814} {"train_loss": -10.771428108215332, "global_step": 472885, "epoch": 2814} {"train_loss": -12.038278579711914, "global_step": 472886, "epoch": 2814} {"train_loss": -10.927051544189453, "global_step": 472887, "epoch": 2814} {"train_loss": -11.70170783996582, "global_step": 472888, "epoch": 2814} {"train_loss": -12.29023265838623, "global_step": 472889, "epoch": 2814} {"train_loss": -11.674395561218262, "global_step": 472890, "epoch": 2814} {"train_loss": -12.367691993713379, "global_step": 472891, "epoch": 2814} {"train_loss": -11.833952903747559, "global_step": 472892, "epoch": 2814} {"train_loss": -12.163087844848633, "global_step": 472893, "epoch": 2814} {"train_loss": -12.007553100585938, "global_step": 472894, "epoch": 2814} {"train_loss": -12.383420944213867, "global_step": 472895, "epoch": 2814} {"train_loss": -12.011926651000977, "global_step": 472896, "epoch": 2814} {"train_loss": -12.441165924072266, "global_step": 472897, "epoch": 2814} {"train_loss": -11.855876922607422, "global_step": 472898, "epoch": 2814} {"train_loss": -12.32082748413086, "global_step": 472899, "epoch": 2814} {"train_loss": -12.54782485961914, "global_step": 472900, "epoch": 2814} {"train_loss": -11.90374755859375, "global_step": 472901, "epoch": 2814} {"train_loss": -12.459239959716797, "global_step": 472902, "epoch": 2814} {"train_loss": -11.926612854003906, "global_step": 472903, "epoch": 2814} {"train_loss": -12.370193481445312, "global_step": 472904, "epoch": 2814} {"train_loss": -12.425246238708496, "global_step": 472905, "epoch": 2814} {"train_loss": -11.951086044311523, "global_step": 472906, "epoch": 2814} {"train_loss": -11.916959762573242, "global_step": 472907, "epoch": 2814} {"train_loss": -12.775182723999023, "global_step": 472908, "epoch": 2814} {"train_loss": -12.446576118469238, "global_step": 472909, "epoch": 2814} {"train_loss": -12.421638488769531, "global_step": 472910, "epoch": 2814} {"train_loss": -12.457802772521973, "global_step": 472911, "epoch": 2814} {"train_loss": -12.728006362915039, "global_step": 472912, "epoch": 2814} {"train_loss": -12.631481170654297, "global_step": 472913, "epoch": 2814} {"train_loss": -12.577685356140137, "global_step": 472914, "epoch": 2814} {"train_loss": -12.720710754394531, "global_step": 472915, "epoch": 2814} {"train_loss": -12.6031494140625, "global_step": 472916, "epoch": 2814} {"train_loss": -12.867935180664062, "global_step": 472917, "epoch": 2814} {"train_loss": -12.317970275878906, "global_step": 472918, "epoch": 2814} {"train_loss": -12.154841496830894, "global_step": 472919, "epoch": 2814, "val_loss": 316605.53125} {"train_loss": -12.561019897460938, "global_step": 472920, "epoch": 2815} {"train_loss": -12.17684268951416, "global_step": 472921, "epoch": 2815} {"train_loss": -12.614513397216797, "global_step": 472922, "epoch": 2815} {"train_loss": -12.51236343383789, "global_step": 472923, "epoch": 2815} {"train_loss": -11.867105484008789, "global_step": 472924, "epoch": 2815} {"train_loss": -12.728759765625, "global_step": 472925, "epoch": 2815} {"train_loss": -12.075901985168457, "global_step": 472926, "epoch": 2815} {"train_loss": -11.993240356445312, "global_step": 472927, "epoch": 2815} {"train_loss": -12.728338241577148, "global_step": 472928, "epoch": 2815} {"train_loss": -11.980780601501465, "global_step": 472929, "epoch": 2815} {"train_loss": -12.571950912475586, "global_step": 472930, "epoch": 2815} {"train_loss": -12.433467864990234, "global_step": 472931, "epoch": 2815} {"train_loss": -12.25694751739502, "global_step": 472932, "epoch": 2815} {"train_loss": -12.805107116699219, "global_step": 472933, "epoch": 2815} {"train_loss": -12.421096801757812, "global_step": 472934, "epoch": 2815} {"train_loss": -12.338294982910156, "global_step": 472935, "epoch": 2815} {"train_loss": -12.579934120178223, "global_step": 472936, "epoch": 2815} {"train_loss": -12.33156967163086, "global_step": 472937, "epoch": 2815} {"train_loss": -12.492365837097168, "global_step": 472938, "epoch": 2815} {"train_loss": -12.899575233459473, "global_step": 472939, "epoch": 2815} {"train_loss": -12.426630020141602, "global_step": 472940, "epoch": 2815} {"train_loss": -12.35249137878418, "global_step": 472941, "epoch": 2815} {"train_loss": -12.693584442138672, "global_step": 472942, "epoch": 2815} {"train_loss": -12.649030685424805, "global_step": 472943, "epoch": 2815} {"train_loss": -12.537212371826172, "global_step": 472944, "epoch": 2815} {"train_loss": -12.469449996948242, "global_step": 472945, "epoch": 2815} {"train_loss": -12.825257301330566, "global_step": 472946, "epoch": 2815} {"train_loss": -12.55601978302002, "global_step": 472947, "epoch": 2815} {"train_loss": -12.766623497009277, "global_step": 472948, "epoch": 2815} {"train_loss": -12.505077362060547, "global_step": 472949, "epoch": 2815} {"train_loss": -13.007551193237305, "global_step": 472950, "epoch": 2815} {"train_loss": -12.595793724060059, "global_step": 472951, "epoch": 2815} {"train_loss": -12.632386207580566, "global_step": 472952, "epoch": 2815} {"train_loss": -12.792519569396973, "global_step": 472953, "epoch": 2815} {"train_loss": -12.683241844177246, "global_step": 472954, "epoch": 2815} {"train_loss": -12.603035926818848, "global_step": 472955, "epoch": 2815} {"train_loss": -12.969151496887207, "global_step": 472956, "epoch": 2815} {"train_loss": -12.375030517578125, "global_step": 472957, "epoch": 2815} {"train_loss": -12.787583351135254, "global_step": 472958, "epoch": 2815} {"train_loss": -12.42011833190918, "global_step": 472959, "epoch": 2815} {"train_loss": -12.748315811157227, "global_step": 472960, "epoch": 2815} {"train_loss": -12.616945266723633, "global_step": 472961, "epoch": 2815} {"train_loss": -12.017960548400879, "global_step": 472962, "epoch": 2815} {"train_loss": -12.374063491821289, "global_step": 472963, "epoch": 2815} {"train_loss": -12.845755577087402, "global_step": 472964, "epoch": 2815} {"train_loss": -12.464178085327148, "global_step": 472965, "epoch": 2815} {"train_loss": -12.418219566345215, "global_step": 472966, "epoch": 2815} {"train_loss": -12.675381660461426, "global_step": 472967, "epoch": 2815} {"train_loss": -12.866361618041992, "global_step": 472968, "epoch": 2815} {"train_loss": -12.43370246887207, "global_step": 472969, "epoch": 2815} {"train_loss": -12.556807518005371, "global_step": 472970, "epoch": 2815} {"train_loss": -12.865110397338867, "global_step": 472971, "epoch": 2815} {"train_loss": -12.910828590393066, "global_step": 472972, "epoch": 2815} {"train_loss": -12.678976058959961, "global_step": 472973, "epoch": 2815} {"train_loss": -12.60867691040039, "global_step": 472974, "epoch": 2815} {"train_loss": -12.83356761932373, "global_step": 472975, "epoch": 2815} {"train_loss": -12.630096435546875, "global_step": 472976, "epoch": 2815} {"train_loss": -12.44886589050293, "global_step": 472977, "epoch": 2815} {"train_loss": -12.54582405090332, "global_step": 472978, "epoch": 2815} {"train_loss": -12.530393600463867, "global_step": 472979, "epoch": 2815} {"train_loss": -12.407115936279297, "global_step": 472980, "epoch": 2815} {"train_loss": -12.1053466796875, "global_step": 472981, "epoch": 2815} {"train_loss": -12.80038833618164, "global_step": 472982, "epoch": 2815} {"train_loss": -12.437707901000977, "global_step": 472983, "epoch": 2815} {"train_loss": -12.452598571777344, "global_step": 472984, "epoch": 2815} {"train_loss": -12.118367195129395, "global_step": 472985, "epoch": 2815} {"train_loss": -12.55728530883789, "global_step": 472986, "epoch": 2815} {"train_loss": -12.144417762756348, "global_step": 472987, "epoch": 2815} {"train_loss": -12.658092498779297, "global_step": 472988, "epoch": 2815} {"train_loss": -12.626502990722656, "global_step": 472989, "epoch": 2815} {"train_loss": -12.077363967895508, "global_step": 472990, "epoch": 2815} {"train_loss": -11.859634399414062, "global_step": 472991, "epoch": 2815} {"train_loss": -12.804082870483398, "global_step": 472992, "epoch": 2815} {"train_loss": -12.232505798339844, "global_step": 472993, "epoch": 2815} {"train_loss": -12.69294548034668, "global_step": 472994, "epoch": 2815} {"train_loss": -12.261711120605469, "global_step": 472995, "epoch": 2815} {"train_loss": -12.745138168334961, "global_step": 472996, "epoch": 2815} {"train_loss": -12.382001876831055, "global_step": 472997, "epoch": 2815} {"train_loss": -12.097765922546387, "global_step": 472998, "epoch": 2815} {"train_loss": -12.538185119628906, "global_step": 472999, "epoch": 2815} {"train_loss": -12.894701957702637, "global_step": 473000, "epoch": 2815} {"train_loss": -12.958738327026367, "global_step": 473001, "epoch": 2815} {"train_loss": -12.687426567077637, "global_step": 473002, "epoch": 2815} {"train_loss": -12.150215148925781, "global_step": 473003, "epoch": 2815} {"train_loss": -11.800094604492188, "global_step": 473004, "epoch": 2815} {"train_loss": -12.705011367797852, "global_step": 473005, "epoch": 2815} {"train_loss": -12.887904167175293, "global_step": 473006, "epoch": 2815} {"train_loss": -11.93597412109375, "global_step": 473007, "epoch": 2815} {"train_loss": -11.1895751953125, "global_step": 473008, "epoch": 2815} {"train_loss": -12.341642379760742, "global_step": 473009, "epoch": 2815} {"train_loss": -11.126626968383789, "global_step": 473010, "epoch": 2815} {"train_loss": -10.90833854675293, "global_step": 473011, "epoch": 2815} {"train_loss": -12.452503204345703, "global_step": 473012, "epoch": 2815} {"train_loss": -10.212292671203613, "global_step": 473013, "epoch": 2815} {"train_loss": -12.106792449951172, "global_step": 473014, "epoch": 2815} {"train_loss": -12.038219451904297, "global_step": 473015, "epoch": 2815} {"train_loss": -11.678442001342773, "global_step": 473016, "epoch": 2815} {"train_loss": -10.465108871459961, "global_step": 473017, "epoch": 2815} {"train_loss": -11.638528823852539, "global_step": 473018, "epoch": 2815} {"train_loss": -9.858537673950195, "global_step": 473019, "epoch": 2815} {"train_loss": -8.613212585449219, "global_step": 473020, "epoch": 2815} {"train_loss": -10.510401725769043, "global_step": 473021, "epoch": 2815} {"train_loss": -9.462457656860352, "global_step": 473022, "epoch": 2815} {"train_loss": -9.337791442871094, "global_step": 473023, "epoch": 2815} {"train_loss": -9.614767074584961, "global_step": 473024, "epoch": 2815} {"train_loss": -8.652166366577148, "global_step": 473025, "epoch": 2815} {"train_loss": -9.493152618408203, "global_step": 473026, "epoch": 2815} {"train_loss": -9.20417594909668, "global_step": 473027, "epoch": 2815} {"train_loss": -8.240701675415039, "global_step": 473028, "epoch": 2815} {"train_loss": -8.195601463317871, "global_step": 473029, "epoch": 2815} {"train_loss": -8.629133224487305, "global_step": 473030, "epoch": 2815} {"train_loss": -8.112464904785156, "global_step": 473031, "epoch": 2815} {"train_loss": -8.709012031555176, "global_step": 473032, "epoch": 2815} {"train_loss": -8.703662872314453, "global_step": 473033, "epoch": 2815} {"train_loss": -9.785435676574707, "global_step": 473034, "epoch": 2815} {"train_loss": -10.215980529785156, "global_step": 473035, "epoch": 2815} {"train_loss": -10.717679023742676, "global_step": 473036, "epoch": 2815} {"train_loss": -10.024374961853027, "global_step": 473037, "epoch": 2815} {"train_loss": -10.575750350952148, "global_step": 473038, "epoch": 2815} {"train_loss": -10.215022087097168, "global_step": 473039, "epoch": 2815} {"train_loss": -11.071496963500977, "global_step": 473040, "epoch": 2815} {"train_loss": -10.173609733581543, "global_step": 473041, "epoch": 2815} {"train_loss": -11.442338943481445, "global_step": 473042, "epoch": 2815} {"train_loss": -10.826229095458984, "global_step": 473043, "epoch": 2815} {"train_loss": -11.66681957244873, "global_step": 473044, "epoch": 2815} {"train_loss": -11.13890266418457, "global_step": 473045, "epoch": 2815} {"train_loss": -11.672271728515625, "global_step": 473046, "epoch": 2815} {"train_loss": -10.597070693969727, "global_step": 473047, "epoch": 2815} {"train_loss": -11.113481521606445, "global_step": 473048, "epoch": 2815} {"train_loss": -11.472232818603516, "global_step": 473049, "epoch": 2815} {"train_loss": -11.284972190856934, "global_step": 473050, "epoch": 2815} {"train_loss": -11.540933609008789, "global_step": 473051, "epoch": 2815} {"train_loss": -11.865081787109375, "global_step": 473052, "epoch": 2815} {"train_loss": -10.640682220458984, "global_step": 473053, "epoch": 2815} {"train_loss": -12.048604011535645, "global_step": 473054, "epoch": 2815} {"train_loss": -10.0126953125, "global_step": 473055, "epoch": 2815} {"train_loss": -12.037768363952637, "global_step": 473056, "epoch": 2815} {"train_loss": -11.12775993347168, "global_step": 473057, "epoch": 2815} {"train_loss": -11.45461654663086, "global_step": 473058, "epoch": 2815} {"train_loss": -11.164148330688477, "global_step": 473059, "epoch": 2815} {"train_loss": -11.686752319335938, "global_step": 473060, "epoch": 2815} {"train_loss": -11.39615249633789, "global_step": 473061, "epoch": 2815} {"train_loss": -11.9143648147583, "global_step": 473062, "epoch": 2815} {"train_loss": -11.78369140625, "global_step": 473063, "epoch": 2815} {"train_loss": -12.042096138000488, "global_step": 473064, "epoch": 2815} {"train_loss": -11.642441749572754, "global_step": 473065, "epoch": 2815} {"train_loss": -11.61799144744873, "global_step": 473066, "epoch": 2815} {"train_loss": -12.008010864257812, "global_step": 473067, "epoch": 2815} {"train_loss": -11.513203620910645, "global_step": 473068, "epoch": 2815} {"train_loss": -11.839919090270996, "global_step": 473069, "epoch": 2815} {"train_loss": -11.95224380493164, "global_step": 473070, "epoch": 2815} {"train_loss": -11.799308776855469, "global_step": 473071, "epoch": 2815} {"train_loss": -11.687628746032715, "global_step": 473072, "epoch": 2815} {"train_loss": -11.998130798339844, "global_step": 473073, "epoch": 2815} {"train_loss": -11.39516830444336, "global_step": 473074, "epoch": 2815} {"train_loss": -12.235501289367676, "global_step": 473075, "epoch": 2815} {"train_loss": -11.616687774658203, "global_step": 473076, "epoch": 2815} {"train_loss": -12.106805801391602, "global_step": 473077, "epoch": 2815} {"train_loss": -11.978139877319336, "global_step": 473078, "epoch": 2815} {"train_loss": -12.151485443115234, "global_step": 473079, "epoch": 2815} {"train_loss": -11.645652770996094, "global_step": 473080, "epoch": 2815} {"train_loss": -12.40613842010498, "global_step": 473081, "epoch": 2815} {"train_loss": -11.97702407836914, "global_step": 473082, "epoch": 2815} {"train_loss": -12.288270950317383, "global_step": 473083, "epoch": 2815} {"train_loss": -12.14864444732666, "global_step": 473084, "epoch": 2815} {"train_loss": -12.384065628051758, "global_step": 473085, "epoch": 2815} {"train_loss": -12.373149871826172, "global_step": 473086, "epoch": 2815} {"train_loss": -11.800869243485588, "global_step": 473087, "epoch": 2815, "val_loss": 309003.09375, "train_action_mse_error": 1.9222922325134277} {"train_loss": -12.453958511352539, "global_step": 473088, "epoch": 2816} {"train_loss": -12.395711898803711, "global_step": 473089, "epoch": 2816} {"train_loss": -12.536253929138184, "global_step": 473090, "epoch": 2816} {"train_loss": -12.400225639343262, "global_step": 473091, "epoch": 2816} {"train_loss": -12.541923522949219, "global_step": 473092, "epoch": 2816} {"train_loss": -12.341164588928223, "global_step": 473093, "epoch": 2816} {"train_loss": -12.5243501663208, "global_step": 473094, "epoch": 2816} {"train_loss": -12.525716781616211, "global_step": 473095, "epoch": 2816} {"train_loss": -12.701844215393066, "global_step": 473096, "epoch": 2816} {"train_loss": -12.555208206176758, "global_step": 473097, "epoch": 2816} {"train_loss": -12.550825119018555, "global_step": 473098, "epoch": 2816} {"train_loss": -12.451740264892578, "global_step": 473099, "epoch": 2816} {"train_loss": -12.556833267211914, "global_step": 473100, "epoch": 2816} {"train_loss": -12.553688049316406, "global_step": 473101, "epoch": 2816} {"train_loss": -12.677565574645996, "global_step": 473102, "epoch": 2816} {"train_loss": -12.581793785095215, "global_step": 473103, "epoch": 2816} {"train_loss": -12.747777938842773, "global_step": 473104, "epoch": 2816} {"train_loss": -12.493664741516113, "global_step": 473105, "epoch": 2816} {"train_loss": -12.64150619506836, "global_step": 473106, "epoch": 2816} {"train_loss": -12.468198776245117, "global_step": 473107, "epoch": 2816} {"train_loss": -12.594425201416016, "global_step": 473108, "epoch": 2816} {"train_loss": -12.190561294555664, "global_step": 473109, "epoch": 2816} {"train_loss": -12.659708976745605, "global_step": 473110, "epoch": 2816} {"train_loss": -12.524950981140137, "global_step": 473111, "epoch": 2816} {"train_loss": -12.548868179321289, "global_step": 473112, "epoch": 2816} {"train_loss": -12.502647399902344, "global_step": 473113, "epoch": 2816} {"train_loss": -12.296070098876953, "global_step": 473114, "epoch": 2816} {"train_loss": -12.623857498168945, "global_step": 473115, "epoch": 2816} {"train_loss": -12.441106796264648, "global_step": 473116, "epoch": 2816} {"train_loss": -12.620328903198242, "global_step": 473117, "epoch": 2816} {"train_loss": -12.599502563476562, "global_step": 473118, "epoch": 2816} {"train_loss": -12.61696720123291, "global_step": 473119, "epoch": 2816} {"train_loss": -12.70344352722168, "global_step": 473120, "epoch": 2816} {"train_loss": -12.63534164428711, "global_step": 473121, "epoch": 2816} {"train_loss": -12.44307804107666, "global_step": 473122, "epoch": 2816} {"train_loss": -12.617120742797852, "global_step": 473123, "epoch": 2816} {"train_loss": -12.517280578613281, "global_step": 473124, "epoch": 2816} {"train_loss": -12.589777946472168, "global_step": 473125, "epoch": 2816} {"train_loss": -12.401069641113281, "global_step": 473126, "epoch": 2816} {"train_loss": -12.54037094116211, "global_step": 473127, "epoch": 2816} {"train_loss": -12.16919994354248, "global_step": 473128, "epoch": 2816} {"train_loss": -12.384533882141113, "global_step": 473129, "epoch": 2816} {"train_loss": -12.636468887329102, "global_step": 473130, "epoch": 2816} {"train_loss": -12.689154624938965, "global_step": 473131, "epoch": 2816} {"train_loss": -12.566500663757324, "global_step": 473132, "epoch": 2816} {"train_loss": -12.641647338867188, "global_step": 473133, "epoch": 2816} {"train_loss": -12.592844009399414, "global_step": 473134, "epoch": 2816} {"train_loss": -12.608561515808105, "global_step": 473135, "epoch": 2816} {"train_loss": -12.832340240478516, "global_step": 473136, "epoch": 2816} {"train_loss": -12.754779815673828, "global_step": 473137, "epoch": 2816} {"train_loss": -12.474701881408691, "global_step": 473138, "epoch": 2816} {"train_loss": -12.826339721679688, "global_step": 473139, "epoch": 2816} {"train_loss": -12.63565444946289, "global_step": 473140, "epoch": 2816} {"train_loss": -12.501388549804688, "global_step": 473141, "epoch": 2816} {"train_loss": -12.733110427856445, "global_step": 473142, "epoch": 2816} {"train_loss": -12.726343154907227, "global_step": 473143, "epoch": 2816} {"train_loss": -12.529467582702637, "global_step": 473144, "epoch": 2816} {"train_loss": -12.55756664276123, "global_step": 473145, "epoch": 2816} {"train_loss": -12.104021072387695, "global_step": 473146, "epoch": 2816} {"train_loss": -12.923957824707031, "global_step": 473147, "epoch": 2816} {"train_loss": -12.420421600341797, "global_step": 473148, "epoch": 2816} {"train_loss": -12.087944030761719, "global_step": 473149, "epoch": 2816} {"train_loss": -11.646071434020996, "global_step": 473150, "epoch": 2816} {"train_loss": -12.833230972290039, "global_step": 473151, "epoch": 2816} {"train_loss": -11.385824203491211, "global_step": 473152, "epoch": 2816} {"train_loss": -12.232196807861328, "global_step": 473153, "epoch": 2816} {"train_loss": -12.47603988647461, "global_step": 473154, "epoch": 2816} {"train_loss": -11.521295547485352, "global_step": 473155, "epoch": 2816} {"train_loss": -12.16275405883789, "global_step": 473156, "epoch": 2816} {"train_loss": -11.951719284057617, "global_step": 473157, "epoch": 2816} {"train_loss": -11.694608688354492, "global_step": 473158, "epoch": 2816} {"train_loss": -12.075723648071289, "global_step": 473159, "epoch": 2816} {"train_loss": -11.662416458129883, "global_step": 473160, "epoch": 2816} {"train_loss": -11.875062942504883, "global_step": 473161, "epoch": 2816} {"train_loss": -11.406606674194336, "global_step": 473162, "epoch": 2816} {"train_loss": -11.929265975952148, "global_step": 473163, "epoch": 2816} {"train_loss": -11.508637428283691, "global_step": 473164, "epoch": 2816} {"train_loss": -12.445247650146484, "global_step": 473165, "epoch": 2816} {"train_loss": -11.877359390258789, "global_step": 473166, "epoch": 2816} {"train_loss": -12.27957820892334, "global_step": 473167, "epoch": 2816} {"train_loss": -12.514073371887207, "global_step": 473168, "epoch": 2816} {"train_loss": -11.592767715454102, "global_step": 473169, "epoch": 2816} {"train_loss": -12.173219680786133, "global_step": 473170, "epoch": 2816} {"train_loss": -12.580244064331055, "global_step": 473171, "epoch": 2816} {"train_loss": -11.670406341552734, "global_step": 473172, "epoch": 2816} {"train_loss": -12.685179710388184, "global_step": 473173, "epoch": 2816} {"train_loss": -11.942224502563477, "global_step": 473174, "epoch": 2816} {"train_loss": -12.812352180480957, "global_step": 473175, "epoch": 2816} {"train_loss": -12.099271774291992, "global_step": 473176, "epoch": 2816} {"train_loss": -12.456867218017578, "global_step": 473177, "epoch": 2816} {"train_loss": -11.554906845092773, "global_step": 473178, "epoch": 2816} {"train_loss": -12.63428020477295, "global_step": 473179, "epoch": 2816} {"train_loss": -11.978309631347656, "global_step": 473180, "epoch": 2816} {"train_loss": -12.435922622680664, "global_step": 473181, "epoch": 2816} {"train_loss": -12.211073875427246, "global_step": 473182, "epoch": 2816} {"train_loss": -12.367975234985352, "global_step": 473183, "epoch": 2816} {"train_loss": -12.42182731628418, "global_step": 473184, "epoch": 2816} {"train_loss": -12.108964920043945, "global_step": 473185, "epoch": 2816} {"train_loss": -12.69216251373291, "global_step": 473186, "epoch": 2816} {"train_loss": -12.268792152404785, "global_step": 473187, "epoch": 2816} {"train_loss": -12.469402313232422, "global_step": 473188, "epoch": 2816} {"train_loss": -12.385834693908691, "global_step": 473189, "epoch": 2816} {"train_loss": -12.779327392578125, "global_step": 473190, "epoch": 2816} {"train_loss": -12.631723403930664, "global_step": 473191, "epoch": 2816} {"train_loss": -12.680939674377441, "global_step": 473192, "epoch": 2816} {"train_loss": -12.4199857711792, "global_step": 473193, "epoch": 2816} {"train_loss": -12.866852760314941, "global_step": 473194, "epoch": 2816} {"train_loss": -12.682313919067383, "global_step": 473195, "epoch": 2816} {"train_loss": -12.68935489654541, "global_step": 473196, "epoch": 2816} {"train_loss": -12.58051872253418, "global_step": 473197, "epoch": 2816} {"train_loss": -12.692075729370117, "global_step": 473198, "epoch": 2816} {"train_loss": -12.608592987060547, "global_step": 473199, "epoch": 2816} {"train_loss": -12.753305435180664, "global_step": 473200, "epoch": 2816} {"train_loss": -12.539273262023926, "global_step": 473201, "epoch": 2816} {"train_loss": -12.22775650024414, "global_step": 473202, "epoch": 2816} {"train_loss": -12.440858840942383, "global_step": 473203, "epoch": 2816} {"train_loss": -12.703849792480469, "global_step": 473204, "epoch": 2816} {"train_loss": -12.717761993408203, "global_step": 473205, "epoch": 2816} {"train_loss": -12.407421112060547, "global_step": 473206, "epoch": 2816} {"train_loss": -12.368075370788574, "global_step": 473207, "epoch": 2816} {"train_loss": -12.646209716796875, "global_step": 473208, "epoch": 2816} {"train_loss": -12.527591705322266, "global_step": 473209, "epoch": 2816} {"train_loss": -12.473437309265137, "global_step": 473210, "epoch": 2816} {"train_loss": -12.577093124389648, "global_step": 473211, "epoch": 2816} {"train_loss": -12.402559280395508, "global_step": 473212, "epoch": 2816} {"train_loss": -12.58209228515625, "global_step": 473213, "epoch": 2816} {"train_loss": -12.636777877807617, "global_step": 473214, "epoch": 2816} {"train_loss": -12.642707824707031, "global_step": 473215, "epoch": 2816} {"train_loss": -12.753528594970703, "global_step": 473216, "epoch": 2816} {"train_loss": -12.896986961364746, "global_step": 473217, "epoch": 2816} {"train_loss": -12.670278549194336, "global_step": 473218, "epoch": 2816} {"train_loss": -12.62071418762207, "global_step": 473219, "epoch": 2816} {"train_loss": -12.77326774597168, "global_step": 473220, "epoch": 2816} {"train_loss": -13.05000114440918, "global_step": 473221, "epoch": 2816} {"train_loss": -12.940387725830078, "global_step": 473222, "epoch": 2816} {"train_loss": -13.017327308654785, "global_step": 473223, "epoch": 2816} {"train_loss": -12.715435981750488, "global_step": 473224, "epoch": 2816} {"train_loss": -12.904645919799805, "global_step": 473225, "epoch": 2816} {"train_loss": -12.922736167907715, "global_step": 473226, "epoch": 2816} {"train_loss": -12.557175636291504, "global_step": 473227, "epoch": 2816} {"train_loss": -12.320371627807617, "global_step": 473228, "epoch": 2816} {"train_loss": -12.693668365478516, "global_step": 473229, "epoch": 2816} {"train_loss": -12.590893745422363, "global_step": 473230, "epoch": 2816} {"train_loss": -11.826974868774414, "global_step": 473231, "epoch": 2816} {"train_loss": -11.827713012695312, "global_step": 473232, "epoch": 2816} {"train_loss": -12.257094383239746, "global_step": 473233, "epoch": 2816} {"train_loss": -12.250588417053223, "global_step": 473234, "epoch": 2816} {"train_loss": -10.064658164978027, "global_step": 473235, "epoch": 2816} {"train_loss": -12.650903701782227, "global_step": 473236, "epoch": 2816} {"train_loss": -11.62374496459961, "global_step": 473237, "epoch": 2816} {"train_loss": -10.298957824707031, "global_step": 473238, "epoch": 2816} {"train_loss": -12.519242286682129, "global_step": 473239, "epoch": 2816} {"train_loss": -9.180168151855469, "global_step": 473240, "epoch": 2816} {"train_loss": -10.348929405212402, "global_step": 473241, "epoch": 2816} {"train_loss": -9.976801872253418, "global_step": 473242, "epoch": 2816} {"train_loss": -9.550369262695312, "global_step": 473243, "epoch": 2816} {"train_loss": -11.568873405456543, "global_step": 473244, "epoch": 2816} {"train_loss": -10.326072692871094, "global_step": 473245, "epoch": 2816} {"train_loss": -9.527814865112305, "global_step": 473246, "epoch": 2816} {"train_loss": -10.393049240112305, "global_step": 473247, "epoch": 2816} {"train_loss": -11.477725982666016, "global_step": 473248, "epoch": 2816} {"train_loss": -11.844586372375488, "global_step": 473249, "epoch": 2816} {"train_loss": -11.657724380493164, "global_step": 473250, "epoch": 2816} {"train_loss": -11.744924545288086, "global_step": 473251, "epoch": 2816} {"train_loss": -11.568367004394531, "global_step": 473252, "epoch": 2816} {"train_loss": -11.815960884094238, "global_step": 473253, "epoch": 2816} {"train_loss": -11.568704605102539, "global_step": 473254, "epoch": 2816} {"train_loss": -12.267760844457717, "global_step": 473255, "epoch": 2816, "val_loss": 311452.8125} {"train_loss": -12.256002426147461, "global_step": 473256, "epoch": 2817} {"train_loss": -11.368896484375, "global_step": 473257, "epoch": 2817} {"train_loss": -11.512689590454102, "global_step": 473258, "epoch": 2817} {"train_loss": -12.050586700439453, "global_step": 473259, "epoch": 2817} {"train_loss": -10.272476196289062, "global_step": 473260, "epoch": 2817} {"train_loss": -11.84183120727539, "global_step": 473261, "epoch": 2817} {"train_loss": -11.290297508239746, "global_step": 473262, "epoch": 2817} {"train_loss": -11.71405029296875, "global_step": 473263, "epoch": 2817} {"train_loss": -12.064725875854492, "global_step": 473264, "epoch": 2817} {"train_loss": -11.47839641571045, "global_step": 473265, "epoch": 2817} {"train_loss": -11.700965881347656, "global_step": 473266, "epoch": 2817} {"train_loss": -11.97096061706543, "global_step": 473267, "epoch": 2817} {"train_loss": -12.230859756469727, "global_step": 473268, "epoch": 2817} {"train_loss": -11.761754989624023, "global_step": 473269, "epoch": 2817} {"train_loss": -12.036238670349121, "global_step": 473270, "epoch": 2817} {"train_loss": -11.581982612609863, "global_step": 473271, "epoch": 2817} {"train_loss": -11.69495964050293, "global_step": 473272, "epoch": 2817} {"train_loss": -11.763574600219727, "global_step": 473273, "epoch": 2817} {"train_loss": -11.325654029846191, "global_step": 473274, "epoch": 2817} {"train_loss": -12.00808334350586, "global_step": 473275, "epoch": 2817} {"train_loss": -12.285467147827148, "global_step": 473276, "epoch": 2817} {"train_loss": -12.331634521484375, "global_step": 473277, "epoch": 2817} {"train_loss": -12.13795280456543, "global_step": 473278, "epoch": 2817} {"train_loss": -11.843704223632812, "global_step": 473279, "epoch": 2817} {"train_loss": -11.625947952270508, "global_step": 473280, "epoch": 2817} {"train_loss": -12.179482460021973, "global_step": 473281, "epoch": 2817} {"train_loss": -11.90492057800293, "global_step": 473282, "epoch": 2817} {"train_loss": -12.2772855758667, "global_step": 473283, "epoch": 2817} {"train_loss": -11.915973663330078, "global_step": 473284, "epoch": 2817} {"train_loss": -12.473397254943848, "global_step": 473285, "epoch": 2817} {"train_loss": -12.147954940795898, "global_step": 473286, "epoch": 2817} {"train_loss": -12.448263168334961, "global_step": 473287, "epoch": 2817} {"train_loss": -12.005683898925781, "global_step": 473288, "epoch": 2817} {"train_loss": -12.509153366088867, "global_step": 473289, "epoch": 2817} {"train_loss": -12.414464950561523, "global_step": 473290, "epoch": 2817} {"train_loss": -12.59616756439209, "global_step": 473291, "epoch": 2817} {"train_loss": -12.298028945922852, "global_step": 473292, "epoch": 2817} {"train_loss": -12.432485580444336, "global_step": 473293, "epoch": 2817} {"train_loss": -12.669429779052734, "global_step": 473294, "epoch": 2817} {"train_loss": -12.18143081665039, "global_step": 473295, "epoch": 2817} {"train_loss": -12.656473159790039, "global_step": 473296, "epoch": 2817} {"train_loss": -12.315542221069336, "global_step": 473297, "epoch": 2817} {"train_loss": -12.33076000213623, "global_step": 473298, "epoch": 2817} {"train_loss": -12.379148483276367, "global_step": 473299, "epoch": 2817} {"train_loss": -12.164225578308105, "global_step": 473300, "epoch": 2817} {"train_loss": -12.37756633758545, "global_step": 473301, "epoch": 2817} {"train_loss": -12.416528701782227, "global_step": 473302, "epoch": 2817} {"train_loss": -12.392816543579102, "global_step": 473303, "epoch": 2817} {"train_loss": -12.225996017456055, "global_step": 473304, "epoch": 2817} {"train_loss": -12.435623168945312, "global_step": 473305, "epoch": 2817} {"train_loss": -12.598146438598633, "global_step": 473306, "epoch": 2817} {"train_loss": -12.704327583312988, "global_step": 473307, "epoch": 2817} {"train_loss": -12.71413516998291, "global_step": 473308, "epoch": 2817} {"train_loss": -12.731752395629883, "global_step": 473309, "epoch": 2817} {"train_loss": -12.453211784362793, "global_step": 473310, "epoch": 2817} {"train_loss": -12.444730758666992, "global_step": 473311, "epoch": 2817} {"train_loss": -12.600589752197266, "global_step": 473312, "epoch": 2817} {"train_loss": -12.801188468933105, "global_step": 473313, "epoch": 2817} {"train_loss": -12.665576934814453, "global_step": 473314, "epoch": 2817} {"train_loss": -12.715484619140625, "global_step": 473315, "epoch": 2817} {"train_loss": -12.8638916015625, "global_step": 473316, "epoch": 2817} {"train_loss": -12.756309509277344, "global_step": 473317, "epoch": 2817} {"train_loss": -12.728730201721191, "global_step": 473318, "epoch": 2817} {"train_loss": -12.680477142333984, "global_step": 473319, "epoch": 2817} {"train_loss": -12.67480182647705, "global_step": 473320, "epoch": 2817} {"train_loss": -12.71574592590332, "global_step": 473321, "epoch": 2817} {"train_loss": -12.771797180175781, "global_step": 473322, "epoch": 2817} {"train_loss": -12.632123947143555, "global_step": 473323, "epoch": 2817} {"train_loss": -12.584228515625, "global_step": 473324, "epoch": 2817} {"train_loss": -12.837207794189453, "global_step": 473325, "epoch": 2817} {"train_loss": -12.610349655151367, "global_step": 473326, "epoch": 2817} {"train_loss": -12.383306503295898, "global_step": 473327, "epoch": 2817} {"train_loss": -12.350273132324219, "global_step": 473328, "epoch": 2817} {"train_loss": -12.86355209350586, "global_step": 473329, "epoch": 2817} {"train_loss": -12.785622596740723, "global_step": 473330, "epoch": 2817} {"train_loss": -12.560365676879883, "global_step": 473331, "epoch": 2817} {"train_loss": -12.890642166137695, "global_step": 473332, "epoch": 2817} {"train_loss": -12.865653991699219, "global_step": 473333, "epoch": 2817} {"train_loss": -12.620550155639648, "global_step": 473334, "epoch": 2817} {"train_loss": -12.610709190368652, "global_step": 473335, "epoch": 2817} {"train_loss": -12.624090194702148, "global_step": 473336, "epoch": 2817} {"train_loss": -12.665750503540039, "global_step": 473337, "epoch": 2817} {"train_loss": -12.595090866088867, "global_step": 473338, "epoch": 2817} {"train_loss": -12.748669624328613, "global_step": 473339, "epoch": 2817} {"train_loss": -12.376340866088867, "global_step": 473340, "epoch": 2817} {"train_loss": -12.567296981811523, "global_step": 473341, "epoch": 2817} {"train_loss": -12.482418060302734, "global_step": 473342, "epoch": 2817} {"train_loss": -12.70545768737793, "global_step": 473343, "epoch": 2817} {"train_loss": -12.555702209472656, "global_step": 473344, "epoch": 2817} {"train_loss": -12.530485153198242, "global_step": 473345, "epoch": 2817} {"train_loss": -13.054811477661133, "global_step": 473346, "epoch": 2817} {"train_loss": -12.345480918884277, "global_step": 473347, "epoch": 2817} {"train_loss": -12.367088317871094, "global_step": 473348, "epoch": 2817} {"train_loss": -12.551980972290039, "global_step": 473349, "epoch": 2817} {"train_loss": -12.237881660461426, "global_step": 473350, "epoch": 2817} {"train_loss": -12.22628402709961, "global_step": 473351, "epoch": 2817} {"train_loss": -11.865067481994629, "global_step": 473352, "epoch": 2817} {"train_loss": -11.426180839538574, "global_step": 473353, "epoch": 2817} {"train_loss": -12.349408149719238, "global_step": 473354, "epoch": 2817} {"train_loss": -11.713085174560547, "global_step": 473355, "epoch": 2817} {"train_loss": -11.448413848876953, "global_step": 473356, "epoch": 2817} {"train_loss": -12.225285530090332, "global_step": 473357, "epoch": 2817} {"train_loss": -11.800987243652344, "global_step": 473358, "epoch": 2817} {"train_loss": -10.49205493927002, "global_step": 473359, "epoch": 2817} {"train_loss": -11.522845268249512, "global_step": 473360, "epoch": 2817} {"train_loss": -11.943913459777832, "global_step": 473361, "epoch": 2817} {"train_loss": -12.115829467773438, "global_step": 473362, "epoch": 2817} {"train_loss": -12.075295448303223, "global_step": 473363, "epoch": 2817} {"train_loss": -11.844122886657715, "global_step": 473364, "epoch": 2817} {"train_loss": -12.433443069458008, "global_step": 473365, "epoch": 2817} {"train_loss": -12.246103286743164, "global_step": 473366, "epoch": 2817} {"train_loss": -12.231398582458496, "global_step": 473367, "epoch": 2817} {"train_loss": -12.57313346862793, "global_step": 473368, "epoch": 2817} {"train_loss": -12.235223770141602, "global_step": 473369, "epoch": 2817} {"train_loss": -12.26063346862793, "global_step": 473370, "epoch": 2817} {"train_loss": -12.59280776977539, "global_step": 473371, "epoch": 2817} {"train_loss": -12.308316230773926, "global_step": 473372, "epoch": 2817} {"train_loss": -12.455605506896973, "global_step": 473373, "epoch": 2817} {"train_loss": -12.378020286560059, "global_step": 473374, "epoch": 2817} {"train_loss": -12.338141441345215, "global_step": 473375, "epoch": 2817} {"train_loss": -11.88668441772461, "global_step": 473376, "epoch": 2817} {"train_loss": -12.213794708251953, "global_step": 473377, "epoch": 2817} {"train_loss": -11.958094596862793, "global_step": 473378, "epoch": 2817} {"train_loss": -11.529962539672852, "global_step": 473379, "epoch": 2817} {"train_loss": -12.41092300415039, "global_step": 473380, "epoch": 2817} {"train_loss": -11.602106094360352, "global_step": 473381, "epoch": 2817} {"train_loss": -12.113990783691406, "global_step": 473382, "epoch": 2817} {"train_loss": -11.59720516204834, "global_step": 473383, "epoch": 2817} {"train_loss": -12.047189712524414, "global_step": 473384, "epoch": 2817} {"train_loss": -11.904420852661133, "global_step": 473385, "epoch": 2817} {"train_loss": -12.190934181213379, "global_step": 473386, "epoch": 2817} {"train_loss": -12.070758819580078, "global_step": 473387, "epoch": 2817} {"train_loss": -12.270686149597168, "global_step": 473388, "epoch": 2817} {"train_loss": -12.336336135864258, "global_step": 473389, "epoch": 2817} {"train_loss": -12.552532196044922, "global_step": 473390, "epoch": 2817} {"train_loss": -12.358799934387207, "global_step": 473391, "epoch": 2817} {"train_loss": -12.66416072845459, "global_step": 473392, "epoch": 2817} {"train_loss": -12.506832122802734, "global_step": 473393, "epoch": 2817} {"train_loss": -13.082329750061035, "global_step": 473394, "epoch": 2817} {"train_loss": -12.487710952758789, "global_step": 473395, "epoch": 2817} {"train_loss": -12.562326431274414, "global_step": 473396, "epoch": 2817} {"train_loss": -12.647761344909668, "global_step": 473397, "epoch": 2817} {"train_loss": -12.645721435546875, "global_step": 473398, "epoch": 2817} {"train_loss": -12.333826065063477, "global_step": 473399, "epoch": 2817} {"train_loss": -12.426156997680664, "global_step": 473400, "epoch": 2817} {"train_loss": -12.52491569519043, "global_step": 473401, "epoch": 2817} {"train_loss": -12.211324691772461, "global_step": 473402, "epoch": 2817} {"train_loss": -12.01380443572998, "global_step": 473403, "epoch": 2817} {"train_loss": -12.296653747558594, "global_step": 473404, "epoch": 2817} {"train_loss": -12.314048767089844, "global_step": 473405, "epoch": 2817} {"train_loss": -12.003421783447266, "global_step": 473406, "epoch": 2817} {"train_loss": -12.256147384643555, "global_step": 473407, "epoch": 2817} {"train_loss": -11.794677734375, "global_step": 473408, "epoch": 2817} {"train_loss": -11.788738250732422, "global_step": 473409, "epoch": 2817} {"train_loss": -12.216593742370605, "global_step": 473410, "epoch": 2817} {"train_loss": -12.446229934692383, "global_step": 473411, "epoch": 2817} {"train_loss": -11.406899452209473, "global_step": 473412, "epoch": 2817} {"train_loss": -12.44029426574707, "global_step": 473413, "epoch": 2817} {"train_loss": -12.108039855957031, "global_step": 473414, "epoch": 2817} {"train_loss": -11.471370697021484, "global_step": 473415, "epoch": 2817} {"train_loss": -10.843772888183594, "global_step": 473416, "epoch": 2817} {"train_loss": -12.12535285949707, "global_step": 473417, "epoch": 2817} {"train_loss": -11.195854187011719, "global_step": 473418, "epoch": 2817} {"train_loss": -11.883976936340332, "global_step": 473419, "epoch": 2817} {"train_loss": -10.741809844970703, "global_step": 473420, "epoch": 2817} {"train_loss": -11.139242172241211, "global_step": 473421, "epoch": 2817} {"train_loss": -10.05257797241211, "global_step": 473422, "epoch": 2817} {"train_loss": -12.201329884074983, "global_step": 473423, "epoch": 2817, "val_loss": 310124.40625} {"train_loss": -10.922863006591797, "global_step": 473424, "epoch": 2818} {"train_loss": -12.219209671020508, "global_step": 473425, "epoch": 2818} {"train_loss": -11.607011795043945, "global_step": 473426, "epoch": 2818} {"train_loss": -12.351032257080078, "global_step": 473427, "epoch": 2818} {"train_loss": -11.51171875, "global_step": 473428, "epoch": 2818} {"train_loss": -12.638033866882324, "global_step": 473429, "epoch": 2818} {"train_loss": -12.133995056152344, "global_step": 473430, "epoch": 2818} {"train_loss": -12.262504577636719, "global_step": 473431, "epoch": 2818} {"train_loss": -12.209382057189941, "global_step": 473432, "epoch": 2818} {"train_loss": -12.257204055786133, "global_step": 473433, "epoch": 2818} {"train_loss": -12.026227951049805, "global_step": 473434, "epoch": 2818} {"train_loss": -12.009918212890625, "global_step": 473435, "epoch": 2818} {"train_loss": -12.185811996459961, "global_step": 473436, "epoch": 2818} {"train_loss": -12.530811309814453, "global_step": 473437, "epoch": 2818} {"train_loss": -12.16305923461914, "global_step": 473438, "epoch": 2818} {"train_loss": -12.375720977783203, "global_step": 473439, "epoch": 2818} {"train_loss": -12.483634948730469, "global_step": 473440, "epoch": 2818} {"train_loss": -12.100180625915527, "global_step": 473441, "epoch": 2818} {"train_loss": -12.430397033691406, "global_step": 473442, "epoch": 2818} {"train_loss": -12.137168884277344, "global_step": 473443, "epoch": 2818} {"train_loss": -12.635826110839844, "global_step": 473444, "epoch": 2818} {"train_loss": -12.336421012878418, "global_step": 473445, "epoch": 2818} {"train_loss": -12.525390625, "global_step": 473446, "epoch": 2818} {"train_loss": -12.679386138916016, "global_step": 473447, "epoch": 2818} {"train_loss": -12.636879920959473, "global_step": 473448, "epoch": 2818} {"train_loss": -12.603399276733398, "global_step": 473449, "epoch": 2818} {"train_loss": -12.58263111114502, "global_step": 473450, "epoch": 2818} {"train_loss": -12.486705780029297, "global_step": 473451, "epoch": 2818} {"train_loss": -12.603075981140137, "global_step": 473452, "epoch": 2818} {"train_loss": -12.494550704956055, "global_step": 473453, "epoch": 2818} {"train_loss": -12.44723129272461, "global_step": 473454, "epoch": 2818} {"train_loss": -12.467580795288086, "global_step": 473455, "epoch": 2818} {"train_loss": -12.67077350616455, "global_step": 473456, "epoch": 2818} {"train_loss": -12.629495620727539, "global_step": 473457, "epoch": 2818} {"train_loss": -12.402604103088379, "global_step": 473458, "epoch": 2818} {"train_loss": -12.466259956359863, "global_step": 473459, "epoch": 2818} {"train_loss": -12.450910568237305, "global_step": 473460, "epoch": 2818} {"train_loss": -12.527820587158203, "global_step": 473461, "epoch": 2818} {"train_loss": -12.474736213684082, "global_step": 473462, "epoch": 2818} {"train_loss": -12.451940536499023, "global_step": 473463, "epoch": 2818} {"train_loss": -12.554325103759766, "global_step": 473464, "epoch": 2818} {"train_loss": -12.285383224487305, "global_step": 473465, "epoch": 2818} {"train_loss": -12.792842864990234, "global_step": 473466, "epoch": 2818} {"train_loss": -12.83057975769043, "global_step": 473467, "epoch": 2818} {"train_loss": -12.443721771240234, "global_step": 473468, "epoch": 2818} {"train_loss": -12.740347862243652, "global_step": 473469, "epoch": 2818} {"train_loss": -12.621259689331055, "global_step": 473470, "epoch": 2818} {"train_loss": -12.578206062316895, "global_step": 473471, "epoch": 2818} {"train_loss": -12.77767276763916, "global_step": 473472, "epoch": 2818} {"train_loss": -12.550191879272461, "global_step": 473473, "epoch": 2818} {"train_loss": -12.569923400878906, "global_step": 473474, "epoch": 2818} {"train_loss": -12.694159507751465, "global_step": 473475, "epoch": 2818} {"train_loss": -12.582724571228027, "global_step": 473476, "epoch": 2818} {"train_loss": -12.74673080444336, "global_step": 473477, "epoch": 2818} {"train_loss": -12.406160354614258, "global_step": 473478, "epoch": 2818} {"train_loss": -12.473381042480469, "global_step": 473479, "epoch": 2818} {"train_loss": -12.856622695922852, "global_step": 473480, "epoch": 2818} {"train_loss": -12.691122055053711, "global_step": 473481, "epoch": 2818} {"train_loss": -12.510113716125488, "global_step": 473482, "epoch": 2818} {"train_loss": -12.781012535095215, "global_step": 473483, "epoch": 2818} {"train_loss": -12.628166198730469, "global_step": 473484, "epoch": 2818} {"train_loss": -11.889287948608398, "global_step": 473485, "epoch": 2818} {"train_loss": -10.47740364074707, "global_step": 473486, "epoch": 2818} {"train_loss": -12.554442405700684, "global_step": 473487, "epoch": 2818} {"train_loss": -12.22618293762207, "global_step": 473488, "epoch": 2818} {"train_loss": -11.454618453979492, "global_step": 473489, "epoch": 2818} {"train_loss": -12.567811012268066, "global_step": 473490, "epoch": 2818} {"train_loss": -11.985756874084473, "global_step": 473491, "epoch": 2818} {"train_loss": -10.899137496948242, "global_step": 473492, "epoch": 2818} {"train_loss": -12.550239562988281, "global_step": 473493, "epoch": 2818} {"train_loss": -11.816056251525879, "global_step": 473494, "epoch": 2818} {"train_loss": -11.348798751831055, "global_step": 473495, "epoch": 2818} {"train_loss": -12.56700325012207, "global_step": 473496, "epoch": 2818} {"train_loss": -11.49874210357666, "global_step": 473497, "epoch": 2818} {"train_loss": -11.363116264343262, "global_step": 473498, "epoch": 2818} {"train_loss": -11.645172119140625, "global_step": 473499, "epoch": 2818} {"train_loss": -9.2089204788208, "global_step": 473500, "epoch": 2818} {"train_loss": -12.19473648071289, "global_step": 473501, "epoch": 2818} {"train_loss": -10.277445793151855, "global_step": 473502, "epoch": 2818} {"train_loss": -10.940352439880371, "global_step": 473503, "epoch": 2818} {"train_loss": -11.923712730407715, "global_step": 473504, "epoch": 2818} {"train_loss": -11.0745849609375, "global_step": 473505, "epoch": 2818} {"train_loss": -12.086613655090332, "global_step": 473506, "epoch": 2818} {"train_loss": -10.381229400634766, "global_step": 473507, "epoch": 2818} {"train_loss": -11.93579387664795, "global_step": 473508, "epoch": 2818} {"train_loss": -10.902227401733398, "global_step": 473509, "epoch": 2818} {"train_loss": -11.930074691772461, "global_step": 473510, "epoch": 2818} {"train_loss": -11.916715621948242, "global_step": 473511, "epoch": 2818} {"train_loss": -11.67119026184082, "global_step": 473512, "epoch": 2818} {"train_loss": -12.487564086914062, "global_step": 473513, "epoch": 2818} {"train_loss": -11.671850204467773, "global_step": 473514, "epoch": 2818} {"train_loss": -12.17498779296875, "global_step": 473515, "epoch": 2818} {"train_loss": -12.517029762268066, "global_step": 473516, "epoch": 2818} {"train_loss": -12.08279037475586, "global_step": 473517, "epoch": 2818} {"train_loss": -12.624259948730469, "global_step": 473518, "epoch": 2818} {"train_loss": -12.431848526000977, "global_step": 473519, "epoch": 2818} {"train_loss": -11.966264724731445, "global_step": 473520, "epoch": 2818} {"train_loss": -11.902276039123535, "global_step": 473521, "epoch": 2818} {"train_loss": -12.007696151733398, "global_step": 473522, "epoch": 2818} {"train_loss": -11.67519760131836, "global_step": 473523, "epoch": 2818} {"train_loss": -11.91153335571289, "global_step": 473524, "epoch": 2818} {"train_loss": -12.266071319580078, "global_step": 473525, "epoch": 2818} {"train_loss": -12.140358924865723, "global_step": 473526, "epoch": 2818} {"train_loss": -11.743709564208984, "global_step": 473527, "epoch": 2818} {"train_loss": -12.026517868041992, "global_step": 473528, "epoch": 2818} {"train_loss": -11.41589069366455, "global_step": 473529, "epoch": 2818} {"train_loss": -12.474088668823242, "global_step": 473530, "epoch": 2818} {"train_loss": -10.945793151855469, "global_step": 473531, "epoch": 2818} {"train_loss": -11.271772384643555, "global_step": 473532, "epoch": 2818} {"train_loss": -10.193876266479492, "global_step": 473533, "epoch": 2818} {"train_loss": -10.464409828186035, "global_step": 473534, "epoch": 2818} {"train_loss": -11.54803466796875, "global_step": 473535, "epoch": 2818} {"train_loss": -11.836204528808594, "global_step": 473536, "epoch": 2818} {"train_loss": -11.551437377929688, "global_step": 473537, "epoch": 2818} {"train_loss": -12.592828750610352, "global_step": 473538, "epoch": 2818} {"train_loss": -11.595900535583496, "global_step": 473539, "epoch": 2818} {"train_loss": -11.552654266357422, "global_step": 473540, "epoch": 2818} {"train_loss": -11.867403030395508, "global_step": 473541, "epoch": 2818} {"train_loss": -11.470152854919434, "global_step": 473542, "epoch": 2818} {"train_loss": -11.614755630493164, "global_step": 473543, "epoch": 2818} {"train_loss": -11.546979904174805, "global_step": 473544, "epoch": 2818} {"train_loss": -11.60474681854248, "global_step": 473545, "epoch": 2818} {"train_loss": -11.995144844055176, "global_step": 473546, "epoch": 2818} {"train_loss": -11.374244689941406, "global_step": 473547, "epoch": 2818} {"train_loss": -11.624595642089844, "global_step": 473548, "epoch": 2818} {"train_loss": -11.603031158447266, "global_step": 473549, "epoch": 2818} {"train_loss": -11.563374519348145, "global_step": 473550, "epoch": 2818} {"train_loss": -11.92191219329834, "global_step": 473551, "epoch": 2818} {"train_loss": -11.217987060546875, "global_step": 473552, "epoch": 2818} {"train_loss": -12.608268737792969, "global_step": 473553, "epoch": 2818} {"train_loss": -11.56123161315918, "global_step": 473554, "epoch": 2818} {"train_loss": -12.534688949584961, "global_step": 473555, "epoch": 2818} {"train_loss": -12.105301856994629, "global_step": 473556, "epoch": 2818} {"train_loss": -12.20986557006836, "global_step": 473557, "epoch": 2818} {"train_loss": -12.34369945526123, "global_step": 473558, "epoch": 2818} {"train_loss": -12.052002906799316, "global_step": 473559, "epoch": 2818} {"train_loss": -12.263628005981445, "global_step": 473560, "epoch": 2818} {"train_loss": -12.191722869873047, "global_step": 473561, "epoch": 2818} {"train_loss": -11.784001350402832, "global_step": 473562, "epoch": 2818} {"train_loss": -12.403881072998047, "global_step": 473563, "epoch": 2818} {"train_loss": -11.76475715637207, "global_step": 473564, "epoch": 2818} {"train_loss": -11.953208923339844, "global_step": 473565, "epoch": 2818} {"train_loss": -12.239328384399414, "global_step": 473566, "epoch": 2818} {"train_loss": -11.63720703125, "global_step": 473567, "epoch": 2818} {"train_loss": -11.919464111328125, "global_step": 473568, "epoch": 2818} {"train_loss": -11.786127090454102, "global_step": 473569, "epoch": 2818} {"train_loss": -12.24610710144043, "global_step": 473570, "epoch": 2818} {"train_loss": -11.865325927734375, "global_step": 473571, "epoch": 2818} {"train_loss": -12.295768737792969, "global_step": 473572, "epoch": 2818} {"train_loss": -11.399977684020996, "global_step": 473573, "epoch": 2818} {"train_loss": -11.979791641235352, "global_step": 473574, "epoch": 2818} {"train_loss": -11.912394523620605, "global_step": 473575, "epoch": 2818} {"train_loss": -12.319659233093262, "global_step": 473576, "epoch": 2818} {"train_loss": -12.14733600616455, "global_step": 473577, "epoch": 2818} {"train_loss": -12.340846061706543, "global_step": 473578, "epoch": 2818} {"train_loss": -12.23890209197998, "global_step": 473579, "epoch": 2818} {"train_loss": -12.434185028076172, "global_step": 473580, "epoch": 2818} {"train_loss": -12.212713241577148, "global_step": 473581, "epoch": 2818} {"train_loss": -12.330976486206055, "global_step": 473582, "epoch": 2818} {"train_loss": -12.331972122192383, "global_step": 473583, "epoch": 2818} {"train_loss": -12.333497047424316, "global_step": 473584, "epoch": 2818} {"train_loss": -12.513843536376953, "global_step": 473585, "epoch": 2818} {"train_loss": -12.595195770263672, "global_step": 473586, "epoch": 2818} {"train_loss": -12.527056694030762, "global_step": 473587, "epoch": 2818} {"train_loss": -12.5146484375, "global_step": 473588, "epoch": 2818} {"train_loss": -12.66491413116455, "global_step": 473589, "epoch": 2818} {"train_loss": -12.570576667785645, "global_step": 473590, "epoch": 2818} {"train_loss": -12.068820107550849, "global_step": 473591, "epoch": 2818, "val_loss": 314575.84375} {"train_loss": -12.373394012451172, "global_step": 473592, "epoch": 2819} {"train_loss": -12.484642028808594, "global_step": 473593, "epoch": 2819} {"train_loss": -12.65693473815918, "global_step": 473594, "epoch": 2819} {"train_loss": -12.509343147277832, "global_step": 473595, "epoch": 2819} {"train_loss": -12.816530227661133, "global_step": 473596, "epoch": 2819} {"train_loss": -12.545883178710938, "global_step": 473597, "epoch": 2819} {"train_loss": -12.668350219726562, "global_step": 473598, "epoch": 2819} {"train_loss": -12.531464576721191, "global_step": 473599, "epoch": 2819} {"train_loss": -12.531789779663086, "global_step": 473600, "epoch": 2819} {"train_loss": -12.734830856323242, "global_step": 473601, "epoch": 2819} {"train_loss": -12.57968807220459, "global_step": 473602, "epoch": 2819} {"train_loss": -12.665508270263672, "global_step": 473603, "epoch": 2819} {"train_loss": -12.54568862915039, "global_step": 473604, "epoch": 2819} {"train_loss": -12.566061019897461, "global_step": 473605, "epoch": 2819} {"train_loss": -12.658927917480469, "global_step": 473606, "epoch": 2819} {"train_loss": -12.586662292480469, "global_step": 473607, "epoch": 2819} {"train_loss": -12.789738655090332, "global_step": 473608, "epoch": 2819} {"train_loss": -12.787717819213867, "global_step": 473609, "epoch": 2819} {"train_loss": -12.776350021362305, "global_step": 473610, "epoch": 2819} {"train_loss": -12.741902351379395, "global_step": 473611, "epoch": 2819} {"train_loss": -12.625357627868652, "global_step": 473612, "epoch": 2819} {"train_loss": -12.728706359863281, "global_step": 473613, "epoch": 2819} {"train_loss": -12.73733139038086, "global_step": 473614, "epoch": 2819} {"train_loss": -12.884252548217773, "global_step": 473615, "epoch": 2819} {"train_loss": -12.963431358337402, "global_step": 473616, "epoch": 2819} {"train_loss": -12.892019271850586, "global_step": 473617, "epoch": 2819} {"train_loss": -12.765840530395508, "global_step": 473618, "epoch": 2819} {"train_loss": -12.741655349731445, "global_step": 473619, "epoch": 2819} {"train_loss": -12.824281692504883, "global_step": 473620, "epoch": 2819} {"train_loss": -12.977533340454102, "global_step": 473621, "epoch": 2819} {"train_loss": -12.923803329467773, "global_step": 473622, "epoch": 2819} {"train_loss": -12.855403900146484, "global_step": 473623, "epoch": 2819} {"train_loss": -12.81181812286377, "global_step": 473624, "epoch": 2819} {"train_loss": -12.877517700195312, "global_step": 473625, "epoch": 2819} {"train_loss": -12.844703674316406, "global_step": 473626, "epoch": 2819} {"train_loss": -13.031392097473145, "global_step": 473627, "epoch": 2819} {"train_loss": -12.964207649230957, "global_step": 473628, "epoch": 2819} {"train_loss": -12.694652557373047, "global_step": 473629, "epoch": 2819} {"train_loss": -12.656700134277344, "global_step": 473630, "epoch": 2819} {"train_loss": -13.097925186157227, "global_step": 473631, "epoch": 2819} {"train_loss": -12.923330307006836, "global_step": 473632, "epoch": 2819} {"train_loss": -12.523736953735352, "global_step": 473633, "epoch": 2819} {"train_loss": -12.594783782958984, "global_step": 473634, "epoch": 2819} {"train_loss": -12.697845458984375, "global_step": 473635, "epoch": 2819} {"train_loss": -12.69759750366211, "global_step": 473636, "epoch": 2819} {"train_loss": -12.51108169555664, "global_step": 473637, "epoch": 2819} {"train_loss": -12.376712799072266, "global_step": 473638, "epoch": 2819} {"train_loss": -12.754358291625977, "global_step": 473639, "epoch": 2819} {"train_loss": -12.379023551940918, "global_step": 473640, "epoch": 2819} {"train_loss": -12.12876033782959, "global_step": 473641, "epoch": 2819} {"train_loss": -11.70707893371582, "global_step": 473642, "epoch": 2819} {"train_loss": -12.369928359985352, "global_step": 473643, "epoch": 2819} {"train_loss": -9.78983211517334, "global_step": 473644, "epoch": 2819} {"train_loss": -11.117439270019531, "global_step": 473645, "epoch": 2819} {"train_loss": -12.55429744720459, "global_step": 473646, "epoch": 2819} {"train_loss": -11.355154991149902, "global_step": 473647, "epoch": 2819} {"train_loss": -10.674766540527344, "global_step": 473648, "epoch": 2819} {"train_loss": -11.97977066040039, "global_step": 473649, "epoch": 2819} {"train_loss": -11.268501281738281, "global_step": 473650, "epoch": 2819} {"train_loss": -9.426868438720703, "global_step": 473651, "epoch": 2819} {"train_loss": -12.231827735900879, "global_step": 473652, "epoch": 2819} {"train_loss": -10.08911418914795, "global_step": 473653, "epoch": 2819} {"train_loss": -12.276956558227539, "global_step": 473654, "epoch": 2819} {"train_loss": -11.27248764038086, "global_step": 473655, "epoch": 2819} {"train_loss": -11.09982681274414, "global_step": 473656, "epoch": 2819} {"train_loss": -12.533540725708008, "global_step": 473657, "epoch": 2819} {"train_loss": -10.76872444152832, "global_step": 473658, "epoch": 2819} {"train_loss": -12.357569694519043, "global_step": 473659, "epoch": 2819} {"train_loss": -11.742246627807617, "global_step": 473660, "epoch": 2819} {"train_loss": -11.075263023376465, "global_step": 473661, "epoch": 2819} {"train_loss": -12.402769088745117, "global_step": 473662, "epoch": 2819} {"train_loss": -10.940522193908691, "global_step": 473663, "epoch": 2819} {"train_loss": -12.101911544799805, "global_step": 473664, "epoch": 2819} {"train_loss": -10.883645057678223, "global_step": 473665, "epoch": 2819} {"train_loss": -11.183238983154297, "global_step": 473666, "epoch": 2819} {"train_loss": -10.40985107421875, "global_step": 473667, "epoch": 2819} {"train_loss": -11.12509536743164, "global_step": 473668, "epoch": 2819} {"train_loss": -10.357830047607422, "global_step": 473669, "epoch": 2819} {"train_loss": -10.536885261535645, "global_step": 473670, "epoch": 2819} {"train_loss": -10.627912521362305, "global_step": 473671, "epoch": 2819} {"train_loss": -11.21694278717041, "global_step": 473672, "epoch": 2819} {"train_loss": -10.960536003112793, "global_step": 473673, "epoch": 2819} {"train_loss": -11.968709945678711, "global_step": 473674, "epoch": 2819} {"train_loss": -11.595109939575195, "global_step": 473675, "epoch": 2819} {"train_loss": -11.681171417236328, "global_step": 473676, "epoch": 2819} {"train_loss": -12.034588813781738, "global_step": 473677, "epoch": 2819} {"train_loss": -10.688043594360352, "global_step": 473678, "epoch": 2819} {"train_loss": -11.988944053649902, "global_step": 473679, "epoch": 2819} {"train_loss": -11.102056503295898, "global_step": 473680, "epoch": 2819} {"train_loss": -12.410261154174805, "global_step": 473681, "epoch": 2819} {"train_loss": -11.379326820373535, "global_step": 473682, "epoch": 2819} {"train_loss": -12.045263290405273, "global_step": 473683, "epoch": 2819} {"train_loss": -12.282910346984863, "global_step": 473684, "epoch": 2819} {"train_loss": -11.857797622680664, "global_step": 473685, "epoch": 2819} {"train_loss": -12.343929290771484, "global_step": 473686, "epoch": 2819} {"train_loss": -12.034271240234375, "global_step": 473687, "epoch": 2819} {"train_loss": -12.532831192016602, "global_step": 473688, "epoch": 2819} {"train_loss": -12.277771949768066, "global_step": 473689, "epoch": 2819} {"train_loss": -12.29820728302002, "global_step": 473690, "epoch": 2819} {"train_loss": -12.378488540649414, "global_step": 473691, "epoch": 2819} {"train_loss": -12.087408065795898, "global_step": 473692, "epoch": 2819} {"train_loss": -12.239526748657227, "global_step": 473693, "epoch": 2819} {"train_loss": -12.342545509338379, "global_step": 473694, "epoch": 2819} {"train_loss": -12.264472007751465, "global_step": 473695, "epoch": 2819} {"train_loss": -12.371963500976562, "global_step": 473696, "epoch": 2819} {"train_loss": -12.324660301208496, "global_step": 473697, "epoch": 2819} {"train_loss": -12.674850463867188, "global_step": 473698, "epoch": 2819} {"train_loss": -12.382948875427246, "global_step": 473699, "epoch": 2819} {"train_loss": -12.525115966796875, "global_step": 473700, "epoch": 2819} {"train_loss": -12.116127014160156, "global_step": 473701, "epoch": 2819} {"train_loss": -12.608654022216797, "global_step": 473702, "epoch": 2819} {"train_loss": -12.46100902557373, "global_step": 473703, "epoch": 2819} {"train_loss": -12.72765827178955, "global_step": 473704, "epoch": 2819} {"train_loss": -12.223586082458496, "global_step": 473705, "epoch": 2819} {"train_loss": -12.269245147705078, "global_step": 473706, "epoch": 2819} {"train_loss": -12.498973846435547, "global_step": 473707, "epoch": 2819} {"train_loss": -12.632264137268066, "global_step": 473708, "epoch": 2819} {"train_loss": -12.386962890625, "global_step": 473709, "epoch": 2819} {"train_loss": -12.677618026733398, "global_step": 473710, "epoch": 2819} {"train_loss": -12.656793594360352, "global_step": 473711, "epoch": 2819} {"train_loss": -12.789685249328613, "global_step": 473712, "epoch": 2819} {"train_loss": -12.705831527709961, "global_step": 473713, "epoch": 2819} {"train_loss": -12.605927467346191, "global_step": 473714, "epoch": 2819} {"train_loss": -12.502306938171387, "global_step": 473715, "epoch": 2819} {"train_loss": -12.469633102416992, "global_step": 473716, "epoch": 2819} {"train_loss": -12.484329223632812, "global_step": 473717, "epoch": 2819} {"train_loss": -12.513694763183594, "global_step": 473718, "epoch": 2819} {"train_loss": -12.852838516235352, "global_step": 473719, "epoch": 2819} {"train_loss": -12.534220695495605, "global_step": 473720, "epoch": 2819} {"train_loss": -12.412007331848145, "global_step": 473721, "epoch": 2819} {"train_loss": -12.571250915527344, "global_step": 473722, "epoch": 2819} {"train_loss": -12.405320167541504, "global_step": 473723, "epoch": 2819} {"train_loss": -12.499070167541504, "global_step": 473724, "epoch": 2819} {"train_loss": -12.634025573730469, "global_step": 473725, "epoch": 2819} {"train_loss": -12.531906127929688, "global_step": 473726, "epoch": 2819} {"train_loss": -12.714312553405762, "global_step": 473727, "epoch": 2819} {"train_loss": -12.000904083251953, "global_step": 473728, "epoch": 2819} {"train_loss": -12.043024063110352, "global_step": 473729, "epoch": 2819} {"train_loss": -12.289851188659668, "global_step": 473730, "epoch": 2819} {"train_loss": -12.284984588623047, "global_step": 473731, "epoch": 2819} {"train_loss": -12.390989303588867, "global_step": 473732, "epoch": 2819} {"train_loss": -12.350741386413574, "global_step": 473733, "epoch": 2819} {"train_loss": -12.90936279296875, "global_step": 473734, "epoch": 2819} {"train_loss": -12.407760620117188, "global_step": 473735, "epoch": 2819} {"train_loss": -12.654520034790039, "global_step": 473736, "epoch": 2819} {"train_loss": -12.753595352172852, "global_step": 473737, "epoch": 2819} {"train_loss": -12.884834289550781, "global_step": 473738, "epoch": 2819} {"train_loss": -12.676448822021484, "global_step": 473739, "epoch": 2819} {"train_loss": -12.7028226852417, "global_step": 473740, "epoch": 2819} {"train_loss": -12.924686431884766, "global_step": 473741, "epoch": 2819} {"train_loss": -12.624824523925781, "global_step": 473742, "epoch": 2819} {"train_loss": -12.70828628540039, "global_step": 473743, "epoch": 2819} {"train_loss": -12.799369812011719, "global_step": 473744, "epoch": 2819} {"train_loss": -12.783300399780273, "global_step": 473745, "epoch": 2819} {"train_loss": -12.328600883483887, "global_step": 473746, "epoch": 2819} {"train_loss": -12.20242691040039, "global_step": 473747, "epoch": 2819} {"train_loss": -12.802574157714844, "global_step": 473748, "epoch": 2819} {"train_loss": -12.430931091308594, "global_step": 473749, "epoch": 2819} {"train_loss": -12.317312240600586, "global_step": 473750, "epoch": 2819} {"train_loss": -12.415508270263672, "global_step": 473751, "epoch": 2819} {"train_loss": -11.869638442993164, "global_step": 473752, "epoch": 2819} {"train_loss": -10.932502746582031, "global_step": 473753, "epoch": 2819} {"train_loss": -12.632816314697266, "global_step": 473754, "epoch": 2819} {"train_loss": -11.141913414001465, "global_step": 473755, "epoch": 2819} {"train_loss": -12.348247528076172, "global_step": 473756, "epoch": 2819} {"train_loss": -11.768106460571289, "global_step": 473757, "epoch": 2819} {"train_loss": -11.923118591308594, "global_step": 473758, "epoch": 2819} {"train_loss": -12.236287412189302, "global_step": 473759, "epoch": 2819, "val_loss": 313206.53125} {"train_loss": -12.401435852050781, "global_step": 473760, "epoch": 2820} {"train_loss": -11.563262939453125, "global_step": 473761, "epoch": 2820} {"train_loss": -11.382404327392578, "global_step": 473762, "epoch": 2820} {"train_loss": -11.860520362854004, "global_step": 473763, "epoch": 2820} {"train_loss": -12.471759796142578, "global_step": 473764, "epoch": 2820} {"train_loss": -11.236719131469727, "global_step": 473765, "epoch": 2820} {"train_loss": -10.774923324584961, "global_step": 473766, "epoch": 2820} {"train_loss": -11.168954849243164, "global_step": 473767, "epoch": 2820} {"train_loss": -9.994918823242188, "global_step": 473768, "epoch": 2820} {"train_loss": -11.349954605102539, "global_step": 473769, "epoch": 2820} {"train_loss": -10.711823463439941, "global_step": 473770, "epoch": 2820} {"train_loss": -11.174488067626953, "global_step": 473771, "epoch": 2820} {"train_loss": -12.21152114868164, "global_step": 473772, "epoch": 2820} {"train_loss": -10.641155242919922, "global_step": 473773, "epoch": 2820} {"train_loss": -12.331012725830078, "global_step": 473774, "epoch": 2820} {"train_loss": -10.981109619140625, "global_step": 473775, "epoch": 2820} {"train_loss": -11.467462539672852, "global_step": 473776, "epoch": 2820} {"train_loss": -11.877015113830566, "global_step": 473777, "epoch": 2820} {"train_loss": -12.123056411743164, "global_step": 473778, "epoch": 2820} {"train_loss": -12.247838020324707, "global_step": 473779, "epoch": 2820} {"train_loss": -12.37721061706543, "global_step": 473780, "epoch": 2820} {"train_loss": -11.705072402954102, "global_step": 473781, "epoch": 2820} {"train_loss": -12.434814453125, "global_step": 473782, "epoch": 2820} {"train_loss": -12.178216934204102, "global_step": 473783, "epoch": 2820} {"train_loss": -12.27725601196289, "global_step": 473784, "epoch": 2820} {"train_loss": -12.446791648864746, "global_step": 473785, "epoch": 2820} {"train_loss": -12.02112102508545, "global_step": 473786, "epoch": 2820} {"train_loss": -12.478605270385742, "global_step": 473787, "epoch": 2820} {"train_loss": -12.028572082519531, "global_step": 473788, "epoch": 2820} {"train_loss": -12.557632446289062, "global_step": 473789, "epoch": 2820} {"train_loss": -12.066272735595703, "global_step": 473790, "epoch": 2820} {"train_loss": -12.190984725952148, "global_step": 473791, "epoch": 2820} {"train_loss": -12.342605590820312, "global_step": 473792, "epoch": 2820} {"train_loss": -12.21557331085205, "global_step": 473793, "epoch": 2820} {"train_loss": -12.384113311767578, "global_step": 473794, "epoch": 2820} {"train_loss": -11.947517395019531, "global_step": 473795, "epoch": 2820} {"train_loss": -12.185611724853516, "global_step": 473796, "epoch": 2820} {"train_loss": -12.681045532226562, "global_step": 473797, "epoch": 2820} {"train_loss": -12.427759170532227, "global_step": 473798, "epoch": 2820} {"train_loss": -12.662878036499023, "global_step": 473799, "epoch": 2820} {"train_loss": -12.498296737670898, "global_step": 473800, "epoch": 2820} {"train_loss": -12.435723304748535, "global_step": 473801, "epoch": 2820} {"train_loss": -12.61578369140625, "global_step": 473802, "epoch": 2820} {"train_loss": -12.239011764526367, "global_step": 473803, "epoch": 2820} {"train_loss": -12.773340225219727, "global_step": 473804, "epoch": 2820} {"train_loss": -12.468941688537598, "global_step": 473805, "epoch": 2820} {"train_loss": -11.90099048614502, "global_step": 473806, "epoch": 2820} {"train_loss": -12.392030715942383, "global_step": 473807, "epoch": 2820} {"train_loss": -12.082540512084961, "global_step": 473808, "epoch": 2820} {"train_loss": -12.39683723449707, "global_step": 473809, "epoch": 2820} {"train_loss": -12.335074424743652, "global_step": 473810, "epoch": 2820} {"train_loss": -12.347673416137695, "global_step": 473811, "epoch": 2820} {"train_loss": -12.4121675491333, "global_step": 473812, "epoch": 2820} {"train_loss": -11.870054244995117, "global_step": 473813, "epoch": 2820} {"train_loss": -12.491565704345703, "global_step": 473814, "epoch": 2820} {"train_loss": -12.048700332641602, "global_step": 473815, "epoch": 2820} {"train_loss": -11.610157012939453, "global_step": 473816, "epoch": 2820} {"train_loss": -12.367517471313477, "global_step": 473817, "epoch": 2820} {"train_loss": -11.94412899017334, "global_step": 473818, "epoch": 2820} {"train_loss": -12.170938491821289, "global_step": 473819, "epoch": 2820} {"train_loss": -12.388646125793457, "global_step": 473820, "epoch": 2820} {"train_loss": -11.985467910766602, "global_step": 473821, "epoch": 2820} {"train_loss": -12.3507080078125, "global_step": 473822, "epoch": 2820} {"train_loss": -12.523797988891602, "global_step": 473823, "epoch": 2820} {"train_loss": -11.997075080871582, "global_step": 473824, "epoch": 2820} {"train_loss": -11.64232063293457, "global_step": 473825, "epoch": 2820} {"train_loss": -12.21230697631836, "global_step": 473826, "epoch": 2820} {"train_loss": -11.294801712036133, "global_step": 473827, "epoch": 2820} {"train_loss": -11.673454284667969, "global_step": 473828, "epoch": 2820} {"train_loss": -10.751646995544434, "global_step": 473829, "epoch": 2820} {"train_loss": -11.361016273498535, "global_step": 473830, "epoch": 2820} {"train_loss": -11.587428092956543, "global_step": 473831, "epoch": 2820} {"train_loss": -10.12608528137207, "global_step": 473832, "epoch": 2820} {"train_loss": -11.273618698120117, "global_step": 473833, "epoch": 2820} {"train_loss": -11.508480072021484, "global_step": 473834, "epoch": 2820} {"train_loss": -9.861629486083984, "global_step": 473835, "epoch": 2820} {"train_loss": -12.177371978759766, "global_step": 473836, "epoch": 2820} {"train_loss": -10.576799392700195, "global_step": 473837, "epoch": 2820} {"train_loss": -11.758865356445312, "global_step": 473838, "epoch": 2820} {"train_loss": -10.462739944458008, "global_step": 473839, "epoch": 2820} {"train_loss": -11.559011459350586, "global_step": 473840, "epoch": 2820} {"train_loss": -11.672889709472656, "global_step": 473841, "epoch": 2820} {"train_loss": -11.53924560546875, "global_step": 473842, "epoch": 2820} {"train_loss": -11.034317016601562, "global_step": 473843, "epoch": 2820} {"train_loss": -11.620397567749023, "global_step": 473844, "epoch": 2820} {"train_loss": -11.515459060668945, "global_step": 473845, "epoch": 2820} {"train_loss": -11.827186584472656, "global_step": 473846, "epoch": 2820} {"train_loss": -11.62263011932373, "global_step": 473847, "epoch": 2820} {"train_loss": -12.05424690246582, "global_step": 473848, "epoch": 2820} {"train_loss": -11.039582252502441, "global_step": 473849, "epoch": 2820} {"train_loss": -12.034127235412598, "global_step": 473850, "epoch": 2820} {"train_loss": -11.243581771850586, "global_step": 473851, "epoch": 2820} {"train_loss": -12.09561538696289, "global_step": 473852, "epoch": 2820} {"train_loss": -11.619518280029297, "global_step": 473853, "epoch": 2820} {"train_loss": -11.941650390625, "global_step": 473854, "epoch": 2820} {"train_loss": -11.910311698913574, "global_step": 473855, "epoch": 2820} {"train_loss": -12.041958808898926, "global_step": 473856, "epoch": 2820} {"train_loss": -11.838379859924316, "global_step": 473857, "epoch": 2820} {"train_loss": -12.314901351928711, "global_step": 473858, "epoch": 2820} {"train_loss": -11.482446670532227, "global_step": 473859, "epoch": 2820} {"train_loss": -12.208041191101074, "global_step": 473860, "epoch": 2820} {"train_loss": -11.888848304748535, "global_step": 473861, "epoch": 2820} {"train_loss": -12.232425689697266, "global_step": 473862, "epoch": 2820} {"train_loss": -12.052579879760742, "global_step": 473863, "epoch": 2820} {"train_loss": -12.176469802856445, "global_step": 473864, "epoch": 2820} {"train_loss": -11.845857620239258, "global_step": 473865, "epoch": 2820} {"train_loss": -12.63811206817627, "global_step": 473866, "epoch": 2820} {"train_loss": -11.934720993041992, "global_step": 473867, "epoch": 2820} {"train_loss": -12.620006561279297, "global_step": 473868, "epoch": 2820} {"train_loss": -11.968095779418945, "global_step": 473869, "epoch": 2820} {"train_loss": -12.34205436706543, "global_step": 473870, "epoch": 2820} {"train_loss": -12.27369213104248, "global_step": 473871, "epoch": 2820} {"train_loss": -12.38266658782959, "global_step": 473872, "epoch": 2820} {"train_loss": -12.041204452514648, "global_step": 473873, "epoch": 2820} {"train_loss": -12.612282752990723, "global_step": 473874, "epoch": 2820} {"train_loss": -12.146206855773926, "global_step": 473875, "epoch": 2820} {"train_loss": -12.566126823425293, "global_step": 473876, "epoch": 2820} {"train_loss": -12.36350154876709, "global_step": 473877, "epoch": 2820} {"train_loss": -12.655620574951172, "global_step": 473878, "epoch": 2820} {"train_loss": -12.375070571899414, "global_step": 473879, "epoch": 2820} {"train_loss": -12.534939765930176, "global_step": 473880, "epoch": 2820} {"train_loss": -12.347244262695312, "global_step": 473881, "epoch": 2820} {"train_loss": -12.552395820617676, "global_step": 473882, "epoch": 2820} {"train_loss": -12.523883819580078, "global_step": 473883, "epoch": 2820} {"train_loss": -12.519495010375977, "global_step": 473884, "epoch": 2820} {"train_loss": -12.455852508544922, "global_step": 473885, "epoch": 2820} {"train_loss": -12.511032104492188, "global_step": 473886, "epoch": 2820} {"train_loss": -12.486621856689453, "global_step": 473887, "epoch": 2820} {"train_loss": -12.368385314941406, "global_step": 473888, "epoch": 2820} {"train_loss": -12.543333053588867, "global_step": 473889, "epoch": 2820} {"train_loss": -12.797117233276367, "global_step": 473890, "epoch": 2820} {"train_loss": -12.549686431884766, "global_step": 473891, "epoch": 2820} {"train_loss": -12.737778663635254, "global_step": 473892, "epoch": 2820} {"train_loss": -12.629692077636719, "global_step": 473893, "epoch": 2820} {"train_loss": -12.45211410522461, "global_step": 473894, "epoch": 2820} {"train_loss": -12.92593765258789, "global_step": 473895, "epoch": 2820} {"train_loss": -12.564348220825195, "global_step": 473896, "epoch": 2820} {"train_loss": -12.60861873626709, "global_step": 473897, "epoch": 2820} {"train_loss": -12.779447555541992, "global_step": 473898, "epoch": 2820} {"train_loss": -12.639781951904297, "global_step": 473899, "epoch": 2820} {"train_loss": -12.807600021362305, "global_step": 473900, "epoch": 2820} {"train_loss": -12.814737319946289, "global_step": 473901, "epoch": 2820} {"train_loss": -12.66602897644043, "global_step": 473902, "epoch": 2820} {"train_loss": -12.939374923706055, "global_step": 473903, "epoch": 2820} {"train_loss": -12.791915893554688, "global_step": 473904, "epoch": 2820} {"train_loss": -12.771358489990234, "global_step": 473905, "epoch": 2820} {"train_loss": -12.702346801757812, "global_step": 473906, "epoch": 2820} {"train_loss": -12.840803146362305, "global_step": 473907, "epoch": 2820} {"train_loss": -12.671367645263672, "global_step": 473908, "epoch": 2820} {"train_loss": -12.584041595458984, "global_step": 473909, "epoch": 2820} {"train_loss": -12.911161422729492, "global_step": 473910, "epoch": 2820} {"train_loss": -12.850252151489258, "global_step": 473911, "epoch": 2820} {"train_loss": -12.914575576782227, "global_step": 473912, "epoch": 2820} {"train_loss": -12.891441345214844, "global_step": 473913, "epoch": 2820} {"train_loss": -12.904924392700195, "global_step": 473914, "epoch": 2820} {"train_loss": -12.69182014465332, "global_step": 473915, "epoch": 2820} {"train_loss": -12.902511596679688, "global_step": 473916, "epoch": 2820} {"train_loss": -12.704201698303223, "global_step": 473917, "epoch": 2820} {"train_loss": -12.760747909545898, "global_step": 473918, "epoch": 2820} {"train_loss": -12.75020694732666, "global_step": 473919, "epoch": 2820} {"train_loss": -12.86415958404541, "global_step": 473920, "epoch": 2820} {"train_loss": -12.697940826416016, "global_step": 473921, "epoch": 2820} {"train_loss": -13.128986358642578, "global_step": 473922, "epoch": 2820} {"train_loss": -12.888141632080078, "global_step": 473923, "epoch": 2820} {"train_loss": -12.40318489074707, "global_step": 473924, "epoch": 2820} {"train_loss": -12.252878189086914, "global_step": 473925, "epoch": 2820} {"train_loss": -12.78981876373291, "global_step": 473926, "epoch": 2820} {"train_loss": -12.136840564864022, "global_step": 473927, "epoch": 2820, "val_loss": 310971.15625, "train_action_mse_error": 2.046494245529175} {"train_loss": -12.341572761535645, "global_step": 473928, "epoch": 2821} {"train_loss": -12.047771453857422, "global_step": 473929, "epoch": 2821} {"train_loss": -12.814254760742188, "global_step": 473930, "epoch": 2821} {"train_loss": -12.48587417602539, "global_step": 473931, "epoch": 2821} {"train_loss": -12.350366592407227, "global_step": 473932, "epoch": 2821} {"train_loss": -11.626358032226562, "global_step": 473933, "epoch": 2821} {"train_loss": -12.379232406616211, "global_step": 473934, "epoch": 2821} {"train_loss": -12.444774627685547, "global_step": 473935, "epoch": 2821} {"train_loss": -11.883617401123047, "global_step": 473936, "epoch": 2821} {"train_loss": -12.319746017456055, "global_step": 473937, "epoch": 2821} {"train_loss": -12.434974670410156, "global_step": 473938, "epoch": 2821} {"train_loss": -11.541359901428223, "global_step": 473939, "epoch": 2821} {"train_loss": -12.324281692504883, "global_step": 473940, "epoch": 2821} {"train_loss": -11.748981475830078, "global_step": 473941, "epoch": 2821} {"train_loss": -11.150426864624023, "global_step": 473942, "epoch": 2821} {"train_loss": -11.386104583740234, "global_step": 473943, "epoch": 2821} {"train_loss": -11.677059173583984, "global_step": 473944, "epoch": 2821} {"train_loss": -11.363785743713379, "global_step": 473945, "epoch": 2821} {"train_loss": -11.707003593444824, "global_step": 473946, "epoch": 2821} {"train_loss": -11.960909843444824, "global_step": 473947, "epoch": 2821} {"train_loss": -12.412893295288086, "global_step": 473948, "epoch": 2821} {"train_loss": -11.909910202026367, "global_step": 473949, "epoch": 2821} {"train_loss": -12.2950439453125, "global_step": 473950, "epoch": 2821} {"train_loss": -11.816591262817383, "global_step": 473951, "epoch": 2821} {"train_loss": -12.19455337524414, "global_step": 473952, "epoch": 2821} {"train_loss": -11.839550018310547, "global_step": 473953, "epoch": 2821} {"train_loss": -10.700183868408203, "global_step": 473954, "epoch": 2821} {"train_loss": -10.952727317810059, "global_step": 473955, "epoch": 2821} {"train_loss": -11.09400749206543, "global_step": 473956, "epoch": 2821} {"train_loss": -11.507311820983887, "global_step": 473957, "epoch": 2821} {"train_loss": -11.106582641601562, "global_step": 473958, "epoch": 2821} {"train_loss": -12.260607719421387, "global_step": 473959, "epoch": 2821} {"train_loss": -11.707530975341797, "global_step": 473960, "epoch": 2821} {"train_loss": -12.068925857543945, "global_step": 473961, "epoch": 2821} {"train_loss": -11.45401382446289, "global_step": 473962, "epoch": 2821} {"train_loss": -11.326526641845703, "global_step": 473963, "epoch": 2821} {"train_loss": -12.227851867675781, "global_step": 473964, "epoch": 2821} {"train_loss": -11.662837982177734, "global_step": 473965, "epoch": 2821} {"train_loss": -11.33142375946045, "global_step": 473966, "epoch": 2821} {"train_loss": -11.72825813293457, "global_step": 473967, "epoch": 2821} {"train_loss": -11.4217529296875, "global_step": 473968, "epoch": 2821} {"train_loss": -12.142951965332031, "global_step": 473969, "epoch": 2821} {"train_loss": -11.140403747558594, "global_step": 473970, "epoch": 2821} {"train_loss": -12.275840759277344, "global_step": 473971, "epoch": 2821} {"train_loss": -11.510726928710938, "global_step": 473972, "epoch": 2821} {"train_loss": -12.090797424316406, "global_step": 473973, "epoch": 2821} {"train_loss": -12.257696151733398, "global_step": 473974, "epoch": 2821} {"train_loss": -12.001150131225586, "global_step": 473975, "epoch": 2821} {"train_loss": -12.231205940246582, "global_step": 473976, "epoch": 2821} {"train_loss": -11.785469055175781, "global_step": 473977, "epoch": 2821} {"train_loss": -11.665411949157715, "global_step": 473978, "epoch": 2821} {"train_loss": -11.954131126403809, "global_step": 473979, "epoch": 2821} {"train_loss": -11.359630584716797, "global_step": 473980, "epoch": 2821} {"train_loss": -12.360347747802734, "global_step": 473981, "epoch": 2821} {"train_loss": -11.626547813415527, "global_step": 473982, "epoch": 2821} {"train_loss": -12.408604621887207, "global_step": 473983, "epoch": 2821} {"train_loss": -11.607244491577148, "global_step": 473984, "epoch": 2821} {"train_loss": -11.632591247558594, "global_step": 473985, "epoch": 2821} {"train_loss": -12.20813274383545, "global_step": 473986, "epoch": 2821} {"train_loss": -11.467716217041016, "global_step": 473987, "epoch": 2821} {"train_loss": -12.302040100097656, "global_step": 473988, "epoch": 2821} {"train_loss": -12.07433032989502, "global_step": 473989, "epoch": 2821} {"train_loss": -11.959354400634766, "global_step": 473990, "epoch": 2821} {"train_loss": -11.87034797668457, "global_step": 473991, "epoch": 2821} {"train_loss": -12.103261947631836, "global_step": 473992, "epoch": 2821} {"train_loss": -12.141532897949219, "global_step": 473993, "epoch": 2821} {"train_loss": -11.554269790649414, "global_step": 473994, "epoch": 2821} {"train_loss": -12.371572494506836, "global_step": 473995, "epoch": 2821} {"train_loss": -11.763387680053711, "global_step": 473996, "epoch": 2821} {"train_loss": -11.964862823486328, "global_step": 473997, "epoch": 2821} {"train_loss": -12.037428855895996, "global_step": 473998, "epoch": 2821} {"train_loss": -11.579778671264648, "global_step": 473999, "epoch": 2821} {"train_loss": -12.13174057006836, "global_step": 474000, "epoch": 2821} {"train_loss": -11.206631660461426, "global_step": 474001, "epoch": 2821} {"train_loss": -11.624181747436523, "global_step": 474002, "epoch": 2821} {"train_loss": -10.54484748840332, "global_step": 474003, "epoch": 2821} {"train_loss": -11.600354194641113, "global_step": 474004, "epoch": 2821} {"train_loss": -10.176916122436523, "global_step": 474005, "epoch": 2821} {"train_loss": -10.436504364013672, "global_step": 474006, "epoch": 2821} {"train_loss": -11.012823104858398, "global_step": 474007, "epoch": 2821} {"train_loss": -10.40835952758789, "global_step": 474008, "epoch": 2821} {"train_loss": -9.68958568572998, "global_step": 474009, "epoch": 2821} {"train_loss": -9.486729621887207, "global_step": 474010, "epoch": 2821} {"train_loss": -11.495399475097656, "global_step": 474011, "epoch": 2821} {"train_loss": -9.737038612365723, "global_step": 474012, "epoch": 2821} {"train_loss": -10.56697940826416, "global_step": 474013, "epoch": 2821} {"train_loss": -9.950621604919434, "global_step": 474014, "epoch": 2821} {"train_loss": -10.451343536376953, "global_step": 474015, "epoch": 2821} {"train_loss": -10.082033157348633, "global_step": 474016, "epoch": 2821} {"train_loss": -12.033442497253418, "global_step": 474017, "epoch": 2821} {"train_loss": -10.415489196777344, "global_step": 474018, "epoch": 2821} {"train_loss": -10.0970458984375, "global_step": 474019, "epoch": 2821} {"train_loss": -11.844108581542969, "global_step": 474020, "epoch": 2821} {"train_loss": -10.250469207763672, "global_step": 474021, "epoch": 2821} {"train_loss": -10.21311092376709, "global_step": 474022, "epoch": 2821} {"train_loss": -11.653913497924805, "global_step": 474023, "epoch": 2821} {"train_loss": -11.73978042602539, "global_step": 474024, "epoch": 2821} {"train_loss": -11.297388076782227, "global_step": 474025, "epoch": 2821} {"train_loss": -11.950464248657227, "global_step": 474026, "epoch": 2821} {"train_loss": -11.844146728515625, "global_step": 474027, "epoch": 2821} {"train_loss": -11.108621597290039, "global_step": 474028, "epoch": 2821} {"train_loss": -12.030532836914062, "global_step": 474029, "epoch": 2821} {"train_loss": -11.871524810791016, "global_step": 474030, "epoch": 2821} {"train_loss": -11.592923164367676, "global_step": 474031, "epoch": 2821} {"train_loss": -12.28636360168457, "global_step": 474032, "epoch": 2821} {"train_loss": -11.552057266235352, "global_step": 474033, "epoch": 2821} {"train_loss": -12.129022598266602, "global_step": 474034, "epoch": 2821} {"train_loss": -12.19986629486084, "global_step": 474035, "epoch": 2821} {"train_loss": -12.328717231750488, "global_step": 474036, "epoch": 2821} {"train_loss": -11.973246574401855, "global_step": 474037, "epoch": 2821} {"train_loss": -12.388204574584961, "global_step": 474038, "epoch": 2821} {"train_loss": -12.134721755981445, "global_step": 474039, "epoch": 2821} {"train_loss": -12.091923713684082, "global_step": 474040, "epoch": 2821} {"train_loss": -12.241554260253906, "global_step": 474041, "epoch": 2821} {"train_loss": -11.928868293762207, "global_step": 474042, "epoch": 2821} {"train_loss": -12.22785758972168, "global_step": 474043, "epoch": 2821} {"train_loss": -12.52010726928711, "global_step": 474044, "epoch": 2821} {"train_loss": -12.321895599365234, "global_step": 474045, "epoch": 2821} {"train_loss": -12.39723014831543, "global_step": 474046, "epoch": 2821} {"train_loss": -12.269821166992188, "global_step": 474047, "epoch": 2821} {"train_loss": -12.584587097167969, "global_step": 474048, "epoch": 2821} {"train_loss": -12.357880592346191, "global_step": 474049, "epoch": 2821} {"train_loss": -12.553533554077148, "global_step": 474050, "epoch": 2821} {"train_loss": -12.354873657226562, "global_step": 474051, "epoch": 2821} {"train_loss": -12.411243438720703, "global_step": 474052, "epoch": 2821} {"train_loss": -12.526015281677246, "global_step": 474053, "epoch": 2821} {"train_loss": -12.604780197143555, "global_step": 474054, "epoch": 2821} {"train_loss": -12.413846015930176, "global_step": 474055, "epoch": 2821} {"train_loss": -12.679527282714844, "global_step": 474056, "epoch": 2821} {"train_loss": -12.476613998413086, "global_step": 474057, "epoch": 2821} {"train_loss": -12.441566467285156, "global_step": 474058, "epoch": 2821} {"train_loss": -12.48316764831543, "global_step": 474059, "epoch": 2821} {"train_loss": -12.655830383300781, "global_step": 474060, "epoch": 2821} {"train_loss": -12.650724411010742, "global_step": 474061, "epoch": 2821} {"train_loss": -12.5003662109375, "global_step": 474062, "epoch": 2821} {"train_loss": -12.658262252807617, "global_step": 474063, "epoch": 2821} {"train_loss": -12.601639747619629, "global_step": 474064, "epoch": 2821} {"train_loss": -12.580202102661133, "global_step": 474065, "epoch": 2821} {"train_loss": -12.757851600646973, "global_step": 474066, "epoch": 2821} {"train_loss": -12.798564910888672, "global_step": 474067, "epoch": 2821} {"train_loss": -12.679644584655762, "global_step": 474068, "epoch": 2821} {"train_loss": -12.75224494934082, "global_step": 474069, "epoch": 2821} {"train_loss": -12.555490493774414, "global_step": 474070, "epoch": 2821} {"train_loss": -12.778947830200195, "global_step": 474071, "epoch": 2821} {"train_loss": -12.776077270507812, "global_step": 474072, "epoch": 2821} {"train_loss": -12.672639846801758, "global_step": 474073, "epoch": 2821} {"train_loss": -12.84565544128418, "global_step": 474074, "epoch": 2821} {"train_loss": -12.771535873413086, "global_step": 474075, "epoch": 2821} {"train_loss": -12.886882781982422, "global_step": 474076, "epoch": 2821} {"train_loss": -12.795783042907715, "global_step": 474077, "epoch": 2821} {"train_loss": -12.79011344909668, "global_step": 474078, "epoch": 2821} {"train_loss": -12.746750831604004, "global_step": 474079, "epoch": 2821} {"train_loss": -12.679214477539062, "global_step": 474080, "epoch": 2821} {"train_loss": -12.686634063720703, "global_step": 474081, "epoch": 2821} {"train_loss": -12.579303741455078, "global_step": 474082, "epoch": 2821} {"train_loss": -12.577674865722656, "global_step": 474083, "epoch": 2821} {"train_loss": -12.921688079833984, "global_step": 474084, "epoch": 2821} {"train_loss": -12.697807312011719, "global_step": 474085, "epoch": 2821} {"train_loss": -12.476778030395508, "global_step": 474086, "epoch": 2821} {"train_loss": -12.825788497924805, "global_step": 474087, "epoch": 2821} {"train_loss": -12.701653480529785, "global_step": 474088, "epoch": 2821} {"train_loss": -12.584083557128906, "global_step": 474089, "epoch": 2821} {"train_loss": -12.822153091430664, "global_step": 474090, "epoch": 2821} {"train_loss": -12.38560676574707, "global_step": 474091, "epoch": 2821} {"train_loss": -12.984725952148438, "global_step": 474092, "epoch": 2821} {"train_loss": -12.973104476928711, "global_step": 474093, "epoch": 2821} {"train_loss": -12.62231159210205, "global_step": 474094, "epoch": 2821} {"train_loss": -11.950610870406742, "global_step": 474095, "epoch": 2821, "val_loss": 315790.75} {"train_loss": -12.283441543579102, "global_step": 474096, "epoch": 2822} {"train_loss": -12.596890449523926, "global_step": 474097, "epoch": 2822} {"train_loss": -12.928245544433594, "global_step": 474098, "epoch": 2822} {"train_loss": -12.73161792755127, "global_step": 474099, "epoch": 2822} {"train_loss": -12.658906936645508, "global_step": 474100, "epoch": 2822} {"train_loss": -12.425174713134766, "global_step": 474101, "epoch": 2822} {"train_loss": -12.935906410217285, "global_step": 474102, "epoch": 2822} {"train_loss": -12.596819877624512, "global_step": 474103, "epoch": 2822} {"train_loss": -12.645293235778809, "global_step": 474104, "epoch": 2822} {"train_loss": -13.128023147583008, "global_step": 474105, "epoch": 2822} {"train_loss": -12.84176254272461, "global_step": 474106, "epoch": 2822} {"train_loss": -12.681169509887695, "global_step": 474107, "epoch": 2822} {"train_loss": -12.530488014221191, "global_step": 474108, "epoch": 2822} {"train_loss": -12.917223930358887, "global_step": 474109, "epoch": 2822} {"train_loss": -12.653125762939453, "global_step": 474110, "epoch": 2822} {"train_loss": -12.75680923461914, "global_step": 474111, "epoch": 2822} {"train_loss": -12.866376876831055, "global_step": 474112, "epoch": 2822} {"train_loss": -12.789833068847656, "global_step": 474113, "epoch": 2822} {"train_loss": -12.880783081054688, "global_step": 474114, "epoch": 2822} {"train_loss": -12.714263916015625, "global_step": 474115, "epoch": 2822} {"train_loss": -12.752816200256348, "global_step": 474116, "epoch": 2822} {"train_loss": -12.51419448852539, "global_step": 474117, "epoch": 2822} {"train_loss": -12.778854370117188, "global_step": 474118, "epoch": 2822} {"train_loss": -12.898823738098145, "global_step": 474119, "epoch": 2822} {"train_loss": -12.498527526855469, "global_step": 474120, "epoch": 2822} {"train_loss": -12.5277681350708, "global_step": 474121, "epoch": 2822} {"train_loss": -12.295615196228027, "global_step": 474122, "epoch": 2822} {"train_loss": -12.150997161865234, "global_step": 474123, "epoch": 2822} {"train_loss": -12.601495742797852, "global_step": 474124, "epoch": 2822} {"train_loss": -12.297128677368164, "global_step": 474125, "epoch": 2822} {"train_loss": -11.573945999145508, "global_step": 474126, "epoch": 2822} {"train_loss": -11.246601104736328, "global_step": 474127, "epoch": 2822} {"train_loss": -11.842513084411621, "global_step": 474128, "epoch": 2822} {"train_loss": -12.82177448272705, "global_step": 474129, "epoch": 2822} {"train_loss": -12.31704044342041, "global_step": 474130, "epoch": 2822} {"train_loss": -12.086701393127441, "global_step": 474131, "epoch": 2822} {"train_loss": -12.388803482055664, "global_step": 474132, "epoch": 2822} {"train_loss": -12.055809020996094, "global_step": 474133, "epoch": 2822} {"train_loss": -11.733444213867188, "global_step": 474134, "epoch": 2822} {"train_loss": -12.469649314880371, "global_step": 474135, "epoch": 2822} {"train_loss": -11.783411979675293, "global_step": 474136, "epoch": 2822} {"train_loss": -11.845306396484375, "global_step": 474137, "epoch": 2822} {"train_loss": -12.481670379638672, "global_step": 474138, "epoch": 2822} {"train_loss": -11.34075927734375, "global_step": 474139, "epoch": 2822} {"train_loss": -11.348623275756836, "global_step": 474140, "epoch": 2822} {"train_loss": -12.706916809082031, "global_step": 474141, "epoch": 2822} {"train_loss": -11.765192985534668, "global_step": 474142, "epoch": 2822} {"train_loss": -11.934581756591797, "global_step": 474143, "epoch": 2822} {"train_loss": -12.198141098022461, "global_step": 474144, "epoch": 2822} {"train_loss": -12.389517784118652, "global_step": 474145, "epoch": 2822} {"train_loss": -11.772586822509766, "global_step": 474146, "epoch": 2822} {"train_loss": -12.21640396118164, "global_step": 474147, "epoch": 2822} {"train_loss": -12.785516738891602, "global_step": 474148, "epoch": 2822} {"train_loss": -12.00067138671875, "global_step": 474149, "epoch": 2822} {"train_loss": -11.543206214904785, "global_step": 474150, "epoch": 2822} {"train_loss": -12.468111038208008, "global_step": 474151, "epoch": 2822} {"train_loss": -12.11742115020752, "global_step": 474152, "epoch": 2822} {"train_loss": -11.692214965820312, "global_step": 474153, "epoch": 2822} {"train_loss": -12.378572463989258, "global_step": 474154, "epoch": 2822} {"train_loss": -12.058639526367188, "global_step": 474155, "epoch": 2822} {"train_loss": -11.895549774169922, "global_step": 474156, "epoch": 2822} {"train_loss": -12.638509750366211, "global_step": 474157, "epoch": 2822} {"train_loss": -11.08894157409668, "global_step": 474158, "epoch": 2822} {"train_loss": -11.28671646118164, "global_step": 474159, "epoch": 2822} {"train_loss": -12.262327194213867, "global_step": 474160, "epoch": 2822} {"train_loss": -11.697473526000977, "global_step": 474161, "epoch": 2822} {"train_loss": -11.825492858886719, "global_step": 474162, "epoch": 2822} {"train_loss": -10.487340927124023, "global_step": 474163, "epoch": 2822} {"train_loss": -10.384092330932617, "global_step": 474164, "epoch": 2822} {"train_loss": -11.579046249389648, "global_step": 474165, "epoch": 2822} {"train_loss": -11.111019134521484, "global_step": 474166, "epoch": 2822} {"train_loss": -11.835941314697266, "global_step": 474167, "epoch": 2822} {"train_loss": -11.031118392944336, "global_step": 474168, "epoch": 2822} {"train_loss": -10.781661987304688, "global_step": 474169, "epoch": 2822} {"train_loss": -9.628740310668945, "global_step": 474170, "epoch": 2822} {"train_loss": -10.62248706817627, "global_step": 474171, "epoch": 2822} {"train_loss": -11.691994667053223, "global_step": 474172, "epoch": 2822} {"train_loss": -10.15989875793457, "global_step": 474173, "epoch": 2822} {"train_loss": -12.020008087158203, "global_step": 474174, "epoch": 2822} {"train_loss": -11.312543869018555, "global_step": 474175, "epoch": 2822} {"train_loss": -11.47273063659668, "global_step": 474176, "epoch": 2822} {"train_loss": -11.52299690246582, "global_step": 474177, "epoch": 2822} {"train_loss": -11.81982421875, "global_step": 474178, "epoch": 2822} {"train_loss": -12.397406578063965, "global_step": 474179, "epoch": 2822} {"train_loss": -11.783853530883789, "global_step": 474180, "epoch": 2822} {"train_loss": -12.383134841918945, "global_step": 474181, "epoch": 2822} {"train_loss": -12.115010261535645, "global_step": 474182, "epoch": 2822} {"train_loss": -12.062764167785645, "global_step": 474183, "epoch": 2822} {"train_loss": -11.971616744995117, "global_step": 474184, "epoch": 2822} {"train_loss": -12.238752365112305, "global_step": 474185, "epoch": 2822} {"train_loss": -12.159154891967773, "global_step": 474186, "epoch": 2822} {"train_loss": -12.066484451293945, "global_step": 474187, "epoch": 2822} {"train_loss": -12.14431381225586, "global_step": 474188, "epoch": 2822} {"train_loss": -12.201921463012695, "global_step": 474189, "epoch": 2822} {"train_loss": -12.204536437988281, "global_step": 474190, "epoch": 2822} {"train_loss": -12.217506408691406, "global_step": 474191, "epoch": 2822} {"train_loss": -12.706489562988281, "global_step": 474192, "epoch": 2822} {"train_loss": -12.127713203430176, "global_step": 474193, "epoch": 2822} {"train_loss": -12.273407936096191, "global_step": 474194, "epoch": 2822} {"train_loss": -12.076513290405273, "global_step": 474195, "epoch": 2822} {"train_loss": -12.44751262664795, "global_step": 474196, "epoch": 2822} {"train_loss": -11.982095718383789, "global_step": 474197, "epoch": 2822} {"train_loss": -12.124136924743652, "global_step": 474198, "epoch": 2822} {"train_loss": -12.112582206726074, "global_step": 474199, "epoch": 2822} {"train_loss": -11.543656349182129, "global_step": 474200, "epoch": 2822} {"train_loss": -12.167627334594727, "global_step": 474201, "epoch": 2822} {"train_loss": -11.92265510559082, "global_step": 474202, "epoch": 2822} {"train_loss": -12.26318645477295, "global_step": 474203, "epoch": 2822} {"train_loss": -11.716622352600098, "global_step": 474204, "epoch": 2822} {"train_loss": -12.32510757446289, "global_step": 474205, "epoch": 2822} {"train_loss": -12.447002410888672, "global_step": 474206, "epoch": 2822} {"train_loss": -11.961545944213867, "global_step": 474207, "epoch": 2822} {"train_loss": -12.646051406860352, "global_step": 474208, "epoch": 2822} {"train_loss": -12.07400894165039, "global_step": 474209, "epoch": 2822} {"train_loss": -11.973737716674805, "global_step": 474210, "epoch": 2822} {"train_loss": -12.451190948486328, "global_step": 474211, "epoch": 2822} {"train_loss": -11.868165969848633, "global_step": 474212, "epoch": 2822} {"train_loss": -11.676435470581055, "global_step": 474213, "epoch": 2822} {"train_loss": -12.284470558166504, "global_step": 474214, "epoch": 2822} {"train_loss": -11.727005004882812, "global_step": 474215, "epoch": 2822} {"train_loss": -12.267959594726562, "global_step": 474216, "epoch": 2822} {"train_loss": -12.147638320922852, "global_step": 474217, "epoch": 2822} {"train_loss": -11.290493965148926, "global_step": 474218, "epoch": 2822} {"train_loss": -12.566747665405273, "global_step": 474219, "epoch": 2822} {"train_loss": -11.461007118225098, "global_step": 474220, "epoch": 2822} {"train_loss": -11.539081573486328, "global_step": 474221, "epoch": 2822} {"train_loss": -12.051958084106445, "global_step": 474222, "epoch": 2822} {"train_loss": -11.191537857055664, "global_step": 474223, "epoch": 2822} {"train_loss": -12.40578842163086, "global_step": 474224, "epoch": 2822} {"train_loss": -11.671737670898438, "global_step": 474225, "epoch": 2822} {"train_loss": -11.501151084899902, "global_step": 474226, "epoch": 2822} {"train_loss": -11.6707763671875, "global_step": 474227, "epoch": 2822} {"train_loss": -11.952698707580566, "global_step": 474228, "epoch": 2822} {"train_loss": -11.650858879089355, "global_step": 474229, "epoch": 2822} {"train_loss": -12.120566368103027, "global_step": 474230, "epoch": 2822} {"train_loss": -11.668478012084961, "global_step": 474231, "epoch": 2822} {"train_loss": -11.374284744262695, "global_step": 474232, "epoch": 2822} {"train_loss": -12.120206832885742, "global_step": 474233, "epoch": 2822} {"train_loss": -11.922332763671875, "global_step": 474234, "epoch": 2822} {"train_loss": -12.137414932250977, "global_step": 474235, "epoch": 2822} {"train_loss": -11.912683486938477, "global_step": 474236, "epoch": 2822} {"train_loss": -12.221094131469727, "global_step": 474237, "epoch": 2822} {"train_loss": -11.874659538269043, "global_step": 474238, "epoch": 2822} {"train_loss": -12.440227508544922, "global_step": 474239, "epoch": 2822} {"train_loss": -11.868326187133789, "global_step": 474240, "epoch": 2822} {"train_loss": -12.247912406921387, "global_step": 474241, "epoch": 2822} {"train_loss": -12.216032028198242, "global_step": 474242, "epoch": 2822} {"train_loss": -12.617603302001953, "global_step": 474243, "epoch": 2822} {"train_loss": -12.267544746398926, "global_step": 474244, "epoch": 2822} {"train_loss": -12.422460556030273, "global_step": 474245, "epoch": 2822} {"train_loss": -12.107702255249023, "global_step": 474246, "epoch": 2822} {"train_loss": -12.249748229980469, "global_step": 474247, "epoch": 2822} {"train_loss": -12.330192565917969, "global_step": 474248, "epoch": 2822} {"train_loss": -12.409027099609375, "global_step": 474249, "epoch": 2822} {"train_loss": -12.644909858703613, "global_step": 474250, "epoch": 2822} {"train_loss": -12.528295516967773, "global_step": 474251, "epoch": 2822} {"train_loss": -12.344348907470703, "global_step": 474252, "epoch": 2822} {"train_loss": -12.472986221313477, "global_step": 474253, "epoch": 2822} {"train_loss": -12.704290390014648, "global_step": 474254, "epoch": 2822} {"train_loss": -12.652084350585938, "global_step": 474255, "epoch": 2822} {"train_loss": -12.46937370300293, "global_step": 474256, "epoch": 2822} {"train_loss": -12.69841480255127, "global_step": 474257, "epoch": 2822} {"train_loss": -12.35176944732666, "global_step": 474258, "epoch": 2822} {"train_loss": -12.650846481323242, "global_step": 474259, "epoch": 2822} {"train_loss": -12.38673210144043, "global_step": 474260, "epoch": 2822} {"train_loss": -12.729240417480469, "global_step": 474261, "epoch": 2822} {"train_loss": -12.234809875488281, "global_step": 474262, "epoch": 2822} {"train_loss": -12.102479633830843, "global_step": 474263, "epoch": 2822, "val_loss": 312563.40625} {"train_loss": -12.435302734375, "global_step": 474264, "epoch": 2823} {"train_loss": -12.469615936279297, "global_step": 474265, "epoch": 2823} {"train_loss": -12.58928108215332, "global_step": 474266, "epoch": 2823} {"train_loss": -12.484977722167969, "global_step": 474267, "epoch": 2823} {"train_loss": -12.617259979248047, "global_step": 474268, "epoch": 2823} {"train_loss": -12.339746475219727, "global_step": 474269, "epoch": 2823} {"train_loss": -12.413946151733398, "global_step": 474270, "epoch": 2823} {"train_loss": -12.915206909179688, "global_step": 474271, "epoch": 2823} {"train_loss": -12.5092134475708, "global_step": 474272, "epoch": 2823} {"train_loss": -12.558573722839355, "global_step": 474273, "epoch": 2823} {"train_loss": -12.43824291229248, "global_step": 474274, "epoch": 2823} {"train_loss": -12.494525909423828, "global_step": 474275, "epoch": 2823} {"train_loss": -12.604504585266113, "global_step": 474276, "epoch": 2823} {"train_loss": -12.704544067382812, "global_step": 474277, "epoch": 2823} {"train_loss": -12.158896446228027, "global_step": 474278, "epoch": 2823} {"train_loss": -12.882040023803711, "global_step": 474279, "epoch": 2823} {"train_loss": -12.42852783203125, "global_step": 474280, "epoch": 2823} {"train_loss": -12.778094291687012, "global_step": 474281, "epoch": 2823} {"train_loss": -12.766912460327148, "global_step": 474282, "epoch": 2823} {"train_loss": -11.984918594360352, "global_step": 474283, "epoch": 2823} {"train_loss": -12.31606674194336, "global_step": 474284, "epoch": 2823} {"train_loss": -12.630805015563965, "global_step": 474285, "epoch": 2823} {"train_loss": -12.518206596374512, "global_step": 474286, "epoch": 2823} {"train_loss": -12.11705493927002, "global_step": 474287, "epoch": 2823} {"train_loss": -12.103737831115723, "global_step": 474288, "epoch": 2823} {"train_loss": -12.635747909545898, "global_step": 474289, "epoch": 2823} {"train_loss": -12.084653854370117, "global_step": 474290, "epoch": 2823} {"train_loss": -12.147953987121582, "global_step": 474291, "epoch": 2823} {"train_loss": -11.989705085754395, "global_step": 474292, "epoch": 2823} {"train_loss": -12.254353523254395, "global_step": 474293, "epoch": 2823} {"train_loss": -12.21693229675293, "global_step": 474294, "epoch": 2823} {"train_loss": -12.690454483032227, "global_step": 474295, "epoch": 2823} {"train_loss": -11.985289573669434, "global_step": 474296, "epoch": 2823} {"train_loss": -12.438573837280273, "global_step": 474297, "epoch": 2823} {"train_loss": -12.07518482208252, "global_step": 474298, "epoch": 2823} {"train_loss": -12.712514877319336, "global_step": 474299, "epoch": 2823} {"train_loss": -12.052000045776367, "global_step": 474300, "epoch": 2823} {"train_loss": -12.380231857299805, "global_step": 474301, "epoch": 2823} {"train_loss": -12.544759750366211, "global_step": 474302, "epoch": 2823} {"train_loss": -11.719524383544922, "global_step": 474303, "epoch": 2823} {"train_loss": -12.315879821777344, "global_step": 474304, "epoch": 2823} {"train_loss": -11.909706115722656, "global_step": 474305, "epoch": 2823} {"train_loss": -12.290135383605957, "global_step": 474306, "epoch": 2823} {"train_loss": -12.234609603881836, "global_step": 474307, "epoch": 2823} {"train_loss": -12.328706741333008, "global_step": 474308, "epoch": 2823} {"train_loss": -12.014810562133789, "global_step": 474309, "epoch": 2823} {"train_loss": -12.405996322631836, "global_step": 474310, "epoch": 2823} {"train_loss": -12.108516693115234, "global_step": 474311, "epoch": 2823} {"train_loss": -12.550382614135742, "global_step": 474312, "epoch": 2823} {"train_loss": -12.089337348937988, "global_step": 474313, "epoch": 2823} {"train_loss": -12.550596237182617, "global_step": 474314, "epoch": 2823} {"train_loss": -12.208874702453613, "global_step": 474315, "epoch": 2823} {"train_loss": -12.44156265258789, "global_step": 474316, "epoch": 2823} {"train_loss": -12.458000183105469, "global_step": 474317, "epoch": 2823} {"train_loss": -12.065553665161133, "global_step": 474318, "epoch": 2823} {"train_loss": -12.393006324768066, "global_step": 474319, "epoch": 2823} {"train_loss": -12.635693550109863, "global_step": 474320, "epoch": 2823} {"train_loss": -12.349533081054688, "global_step": 474321, "epoch": 2823} {"train_loss": -11.943689346313477, "global_step": 474322, "epoch": 2823} {"train_loss": -12.516852378845215, "global_step": 474323, "epoch": 2823} {"train_loss": -12.694326400756836, "global_step": 474324, "epoch": 2823} {"train_loss": -12.429753303527832, "global_step": 474325, "epoch": 2823} {"train_loss": -12.559391021728516, "global_step": 474326, "epoch": 2823} {"train_loss": -12.467164993286133, "global_step": 474327, "epoch": 2823} {"train_loss": -12.524409294128418, "global_step": 474328, "epoch": 2823} {"train_loss": -12.685653686523438, "global_step": 474329, "epoch": 2823} {"train_loss": -12.49978256225586, "global_step": 474330, "epoch": 2823} {"train_loss": -12.653461456298828, "global_step": 474331, "epoch": 2823} {"train_loss": -12.551651954650879, "global_step": 474332, "epoch": 2823} {"train_loss": -12.475117683410645, "global_step": 474333, "epoch": 2823} {"train_loss": -12.80259895324707, "global_step": 474334, "epoch": 2823} {"train_loss": -12.554457664489746, "global_step": 474335, "epoch": 2823} {"train_loss": -12.420320510864258, "global_step": 474336, "epoch": 2823} {"train_loss": -12.967489242553711, "global_step": 474337, "epoch": 2823} {"train_loss": -12.669037818908691, "global_step": 474338, "epoch": 2823} {"train_loss": -12.635615348815918, "global_step": 474339, "epoch": 2823} {"train_loss": -12.676498413085938, "global_step": 474340, "epoch": 2823} {"train_loss": -12.442815780639648, "global_step": 474341, "epoch": 2823} {"train_loss": -12.465664863586426, "global_step": 474342, "epoch": 2823} {"train_loss": -12.406251907348633, "global_step": 474343, "epoch": 2823} {"train_loss": -11.84817886352539, "global_step": 474344, "epoch": 2823} {"train_loss": -11.332128524780273, "global_step": 474345, "epoch": 2823} {"train_loss": -12.608929634094238, "global_step": 474346, "epoch": 2823} {"train_loss": -12.13840103149414, "global_step": 474347, "epoch": 2823} {"train_loss": -11.446609497070312, "global_step": 474348, "epoch": 2823} {"train_loss": -12.450479507446289, "global_step": 474349, "epoch": 2823} {"train_loss": -11.930493354797363, "global_step": 474350, "epoch": 2823} {"train_loss": -11.973175048828125, "global_step": 474351, "epoch": 2823} {"train_loss": -12.270870208740234, "global_step": 474352, "epoch": 2823} {"train_loss": -11.277612686157227, "global_step": 474353, "epoch": 2823} {"train_loss": -11.870734214782715, "global_step": 474354, "epoch": 2823} {"train_loss": -11.684192657470703, "global_step": 474355, "epoch": 2823} {"train_loss": -12.514225006103516, "global_step": 474356, "epoch": 2823} {"train_loss": -12.04265308380127, "global_step": 474357, "epoch": 2823} {"train_loss": -12.412313461303711, "global_step": 474358, "epoch": 2823} {"train_loss": -12.250015258789062, "global_step": 474359, "epoch": 2823} {"train_loss": -12.504377365112305, "global_step": 474360, "epoch": 2823} {"train_loss": -12.322025299072266, "global_step": 474361, "epoch": 2823} {"train_loss": -12.544767379760742, "global_step": 474362, "epoch": 2823} {"train_loss": -12.15168571472168, "global_step": 474363, "epoch": 2823} {"train_loss": -12.525588035583496, "global_step": 474364, "epoch": 2823} {"train_loss": -12.145666122436523, "global_step": 474365, "epoch": 2823} {"train_loss": -12.654462814331055, "global_step": 474366, "epoch": 2823} {"train_loss": -12.094332695007324, "global_step": 474367, "epoch": 2823} {"train_loss": -11.924951553344727, "global_step": 474368, "epoch": 2823} {"train_loss": -11.687829971313477, "global_step": 474369, "epoch": 2823} {"train_loss": -11.648796081542969, "global_step": 474370, "epoch": 2823} {"train_loss": -9.959787368774414, "global_step": 474371, "epoch": 2823} {"train_loss": -11.058984756469727, "global_step": 474372, "epoch": 2823} {"train_loss": -11.200494766235352, "global_step": 474373, "epoch": 2823} {"train_loss": -11.065164566040039, "global_step": 474374, "epoch": 2823} {"train_loss": -11.178067207336426, "global_step": 474375, "epoch": 2823} {"train_loss": -11.894624710083008, "global_step": 474376, "epoch": 2823} {"train_loss": -12.166215896606445, "global_step": 474377, "epoch": 2823} {"train_loss": -12.566534996032715, "global_step": 474378, "epoch": 2823} {"train_loss": -12.526092529296875, "global_step": 474379, "epoch": 2823} {"train_loss": -12.48382568359375, "global_step": 474380, "epoch": 2823} {"train_loss": -12.801494598388672, "global_step": 474381, "epoch": 2823} {"train_loss": -12.528238296508789, "global_step": 474382, "epoch": 2823} {"train_loss": -12.640779495239258, "global_step": 474383, "epoch": 2823} {"train_loss": -12.587034225463867, "global_step": 474384, "epoch": 2823} {"train_loss": -12.379112243652344, "global_step": 474385, "epoch": 2823} {"train_loss": -12.310815811157227, "global_step": 474386, "epoch": 2823} {"train_loss": -12.739959716796875, "global_step": 474387, "epoch": 2823} {"train_loss": -12.117643356323242, "global_step": 474388, "epoch": 2823} {"train_loss": -11.832880020141602, "global_step": 474389, "epoch": 2823} {"train_loss": -12.258410453796387, "global_step": 474390, "epoch": 2823} {"train_loss": -12.086803436279297, "global_step": 474391, "epoch": 2823} {"train_loss": -11.463479995727539, "global_step": 474392, "epoch": 2823} {"train_loss": -11.746307373046875, "global_step": 474393, "epoch": 2823} {"train_loss": -11.863958358764648, "global_step": 474394, "epoch": 2823} {"train_loss": -11.85523796081543, "global_step": 474395, "epoch": 2823} {"train_loss": -12.109742164611816, "global_step": 474396, "epoch": 2823} {"train_loss": -12.042913436889648, "global_step": 474397, "epoch": 2823} {"train_loss": -11.957805633544922, "global_step": 474398, "epoch": 2823} {"train_loss": -12.144511222839355, "global_step": 474399, "epoch": 2823} {"train_loss": -11.947185516357422, "global_step": 474400, "epoch": 2823} {"train_loss": -11.66637897491455, "global_step": 474401, "epoch": 2823} {"train_loss": -11.887112617492676, "global_step": 474402, "epoch": 2823} {"train_loss": -11.801570892333984, "global_step": 474403, "epoch": 2823} {"train_loss": -11.553004264831543, "global_step": 474404, "epoch": 2823} {"train_loss": -12.460182189941406, "global_step": 474405, "epoch": 2823} {"train_loss": -11.718709945678711, "global_step": 474406, "epoch": 2823} {"train_loss": -12.201932907104492, "global_step": 474407, "epoch": 2823} {"train_loss": -12.34750747680664, "global_step": 474408, "epoch": 2823} {"train_loss": -12.14069938659668, "global_step": 474409, "epoch": 2823} {"train_loss": -11.831100463867188, "global_step": 474410, "epoch": 2823} {"train_loss": -11.823498725891113, "global_step": 474411, "epoch": 2823} {"train_loss": -11.924217224121094, "global_step": 474412, "epoch": 2823} {"train_loss": -11.878080368041992, "global_step": 474413, "epoch": 2823} {"train_loss": -12.187077522277832, "global_step": 474414, "epoch": 2823} {"train_loss": -12.014202117919922, "global_step": 474415, "epoch": 2823} {"train_loss": -11.581164360046387, "global_step": 474416, "epoch": 2823} {"train_loss": -12.249229431152344, "global_step": 474417, "epoch": 2823} {"train_loss": -10.713335037231445, "global_step": 474418, "epoch": 2823} {"train_loss": -11.830779075622559, "global_step": 474419, "epoch": 2823} {"train_loss": -10.151935577392578, "global_step": 474420, "epoch": 2823} {"train_loss": -11.033402442932129, "global_step": 474421, "epoch": 2823} {"train_loss": -10.998720169067383, "global_step": 474422, "epoch": 2823} {"train_loss": -11.044607162475586, "global_step": 474423, "epoch": 2823} {"train_loss": -11.90638256072998, "global_step": 474424, "epoch": 2823} {"train_loss": -10.780616760253906, "global_step": 474425, "epoch": 2823} {"train_loss": -11.819292068481445, "global_step": 474426, "epoch": 2823} {"train_loss": -11.349296569824219, "global_step": 474427, "epoch": 2823} {"train_loss": -11.490779876708984, "global_step": 474428, "epoch": 2823} {"train_loss": -12.170442581176758, "global_step": 474429, "epoch": 2823} {"train_loss": -11.303918838500977, "global_step": 474430, "epoch": 2823} {"train_loss": -12.150975323858715, "global_step": 474431, "epoch": 2823, "val_loss": 313687.0625} {"train_loss": -11.161178588867188, "global_step": 474432, "epoch": 2824} {"train_loss": -11.510454177856445, "global_step": 474433, "epoch": 2824} {"train_loss": -11.123678207397461, "global_step": 474434, "epoch": 2824} {"train_loss": -11.978968620300293, "global_step": 474435, "epoch": 2824} {"train_loss": -11.44127082824707, "global_step": 474436, "epoch": 2824} {"train_loss": -11.803069114685059, "global_step": 474437, "epoch": 2824} {"train_loss": -11.639181137084961, "global_step": 474438, "epoch": 2824} {"train_loss": -12.312064170837402, "global_step": 474439, "epoch": 2824} {"train_loss": -11.956623077392578, "global_step": 474440, "epoch": 2824} {"train_loss": -12.066972732543945, "global_step": 474441, "epoch": 2824} {"train_loss": -12.11833381652832, "global_step": 474442, "epoch": 2824} {"train_loss": -11.748332023620605, "global_step": 474443, "epoch": 2824} {"train_loss": -11.917171478271484, "global_step": 474444, "epoch": 2824} {"train_loss": -12.07809829711914, "global_step": 474445, "epoch": 2824} {"train_loss": -11.93366813659668, "global_step": 474446, "epoch": 2824} {"train_loss": -12.338579177856445, "global_step": 474447, "epoch": 2824} {"train_loss": -12.334321975708008, "global_step": 474448, "epoch": 2824} {"train_loss": -12.019925117492676, "global_step": 474449, "epoch": 2824} {"train_loss": -12.29500675201416, "global_step": 474450, "epoch": 2824} {"train_loss": -12.532835006713867, "global_step": 474451, "epoch": 2824} {"train_loss": -12.555423736572266, "global_step": 474452, "epoch": 2824} {"train_loss": -12.036367416381836, "global_step": 474453, "epoch": 2824} {"train_loss": -12.526390075683594, "global_step": 474454, "epoch": 2824} {"train_loss": -12.44247055053711, "global_step": 474455, "epoch": 2824} {"train_loss": -12.399872779846191, "global_step": 474456, "epoch": 2824} {"train_loss": -12.09503173828125, "global_step": 474457, "epoch": 2824} {"train_loss": -12.438057899475098, "global_step": 474458, "epoch": 2824} {"train_loss": -12.28281021118164, "global_step": 474459, "epoch": 2824} {"train_loss": -11.990589141845703, "global_step": 474460, "epoch": 2824} {"train_loss": -12.520614624023438, "global_step": 474461, "epoch": 2824} {"train_loss": -12.278911590576172, "global_step": 474462, "epoch": 2824} {"train_loss": -12.383357048034668, "global_step": 474463, "epoch": 2824} {"train_loss": -12.053309440612793, "global_step": 474464, "epoch": 2824} {"train_loss": -12.22049331665039, "global_step": 474465, "epoch": 2824} {"train_loss": -12.042316436767578, "global_step": 474466, "epoch": 2824} {"train_loss": -12.296745300292969, "global_step": 474467, "epoch": 2824} {"train_loss": -12.321327209472656, "global_step": 474468, "epoch": 2824} {"train_loss": -12.504512786865234, "global_step": 474469, "epoch": 2824} {"train_loss": -12.43585205078125, "global_step": 474470, "epoch": 2824} {"train_loss": -12.404195785522461, "global_step": 474471, "epoch": 2824} {"train_loss": -12.568038940429688, "global_step": 474472, "epoch": 2824} {"train_loss": -12.56344223022461, "global_step": 474473, "epoch": 2824} {"train_loss": -12.482640266418457, "global_step": 474474, "epoch": 2824} {"train_loss": -12.565431594848633, "global_step": 474475, "epoch": 2824} {"train_loss": -12.157524108886719, "global_step": 474476, "epoch": 2824} {"train_loss": -12.102816581726074, "global_step": 474477, "epoch": 2824} {"train_loss": -12.41867446899414, "global_step": 474478, "epoch": 2824} {"train_loss": -12.626723289489746, "global_step": 474479, "epoch": 2824} {"train_loss": -12.578962326049805, "global_step": 474480, "epoch": 2824} {"train_loss": -12.637656211853027, "global_step": 474481, "epoch": 2824} {"train_loss": -12.566463470458984, "global_step": 474482, "epoch": 2824} {"train_loss": -12.583608627319336, "global_step": 474483, "epoch": 2824} {"train_loss": -12.468158721923828, "global_step": 474484, "epoch": 2824} {"train_loss": -12.726615905761719, "global_step": 474485, "epoch": 2824} {"train_loss": -12.334799766540527, "global_step": 474486, "epoch": 2824} {"train_loss": -12.468841552734375, "global_step": 474487, "epoch": 2824} {"train_loss": -12.532615661621094, "global_step": 474488, "epoch": 2824} {"train_loss": -12.853479385375977, "global_step": 474489, "epoch": 2824} {"train_loss": -12.770269393920898, "global_step": 474490, "epoch": 2824} {"train_loss": -12.613055229187012, "global_step": 474491, "epoch": 2824} {"train_loss": -12.788592338562012, "global_step": 474492, "epoch": 2824} {"train_loss": -12.704833030700684, "global_step": 474493, "epoch": 2824} {"train_loss": -12.633743286132812, "global_step": 474494, "epoch": 2824} {"train_loss": -12.50335693359375, "global_step": 474495, "epoch": 2824} {"train_loss": -12.574808120727539, "global_step": 474496, "epoch": 2824} {"train_loss": -12.544904708862305, "global_step": 474497, "epoch": 2824} {"train_loss": -12.461980819702148, "global_step": 474498, "epoch": 2824} {"train_loss": -12.909761428833008, "global_step": 474499, "epoch": 2824} {"train_loss": -12.625842094421387, "global_step": 474500, "epoch": 2824} {"train_loss": -12.700241088867188, "global_step": 474501, "epoch": 2824} {"train_loss": -12.486129760742188, "global_step": 474502, "epoch": 2824} {"train_loss": -12.594940185546875, "global_step": 474503, "epoch": 2824} {"train_loss": -12.631326675415039, "global_step": 474504, "epoch": 2824} {"train_loss": -12.890250205993652, "global_step": 474505, "epoch": 2824} {"train_loss": -12.421592712402344, "global_step": 474506, "epoch": 2824} {"train_loss": -12.70626449584961, "global_step": 474507, "epoch": 2824} {"train_loss": -12.695180892944336, "global_step": 474508, "epoch": 2824} {"train_loss": -12.601325035095215, "global_step": 474509, "epoch": 2824} {"train_loss": -12.912099838256836, "global_step": 474510, "epoch": 2824} {"train_loss": -12.777189254760742, "global_step": 474511, "epoch": 2824} {"train_loss": -12.641471862792969, "global_step": 474512, "epoch": 2824} {"train_loss": -12.776299476623535, "global_step": 474513, "epoch": 2824} {"train_loss": -12.715399742126465, "global_step": 474514, "epoch": 2824} {"train_loss": -12.813533782958984, "global_step": 474515, "epoch": 2824} {"train_loss": -12.441635131835938, "global_step": 474516, "epoch": 2824} {"train_loss": -13.007098197937012, "global_step": 474517, "epoch": 2824} {"train_loss": -12.48190975189209, "global_step": 474518, "epoch": 2824} {"train_loss": -12.818267822265625, "global_step": 474519, "epoch": 2824} {"train_loss": -12.916305541992188, "global_step": 474520, "epoch": 2824} {"train_loss": -12.806648254394531, "global_step": 474521, "epoch": 2824} {"train_loss": -12.612345695495605, "global_step": 474522, "epoch": 2824} {"train_loss": -12.838859558105469, "global_step": 474523, "epoch": 2824} {"train_loss": -12.559316635131836, "global_step": 474524, "epoch": 2824} {"train_loss": -12.714275360107422, "global_step": 474525, "epoch": 2824} {"train_loss": -12.60733699798584, "global_step": 474526, "epoch": 2824} {"train_loss": -12.629249572753906, "global_step": 474527, "epoch": 2824} {"train_loss": -12.922534942626953, "global_step": 474528, "epoch": 2824} {"train_loss": -12.616195678710938, "global_step": 474529, "epoch": 2824} {"train_loss": -12.348881721496582, "global_step": 474530, "epoch": 2824} {"train_loss": -12.339803695678711, "global_step": 474531, "epoch": 2824} {"train_loss": -12.942869186401367, "global_step": 474532, "epoch": 2824} {"train_loss": -11.701626777648926, "global_step": 474533, "epoch": 2824} {"train_loss": -11.993492126464844, "global_step": 474534, "epoch": 2824} {"train_loss": -12.770295143127441, "global_step": 474535, "epoch": 2824} {"train_loss": -11.84536361694336, "global_step": 474536, "epoch": 2824} {"train_loss": -9.81991958618164, "global_step": 474537, "epoch": 2824} {"train_loss": -12.697122573852539, "global_step": 474538, "epoch": 2824} {"train_loss": -9.903459548950195, "global_step": 474539, "epoch": 2824} {"train_loss": -11.25941276550293, "global_step": 474540, "epoch": 2824} {"train_loss": -12.055416107177734, "global_step": 474541, "epoch": 2824} {"train_loss": -10.956428527832031, "global_step": 474542, "epoch": 2824} {"train_loss": -11.861125946044922, "global_step": 474543, "epoch": 2824} {"train_loss": -10.003202438354492, "global_step": 474544, "epoch": 2824} {"train_loss": -10.556049346923828, "global_step": 474545, "epoch": 2824} {"train_loss": -10.085132598876953, "global_step": 474546, "epoch": 2824} {"train_loss": -10.515053749084473, "global_step": 474547, "epoch": 2824} {"train_loss": -8.970059394836426, "global_step": 474548, "epoch": 2824} {"train_loss": -9.963044166564941, "global_step": 474549, "epoch": 2824} {"train_loss": -9.357937812805176, "global_step": 474550, "epoch": 2824} {"train_loss": -8.481891632080078, "global_step": 474551, "epoch": 2824} {"train_loss": -8.699418067932129, "global_step": 474552, "epoch": 2824} {"train_loss": -9.800806999206543, "global_step": 474553, "epoch": 2824} {"train_loss": -10.007674217224121, "global_step": 474554, "epoch": 2824} {"train_loss": -9.942296981811523, "global_step": 474555, "epoch": 2824} {"train_loss": -9.690677642822266, "global_step": 474556, "epoch": 2824} {"train_loss": -10.078413963317871, "global_step": 474557, "epoch": 2824} {"train_loss": -10.065435409545898, "global_step": 474558, "epoch": 2824} {"train_loss": -10.289318084716797, "global_step": 474559, "epoch": 2824} {"train_loss": -11.176385879516602, "global_step": 474560, "epoch": 2824} {"train_loss": -10.911462783813477, "global_step": 474561, "epoch": 2824} {"train_loss": -11.753019332885742, "global_step": 474562, "epoch": 2824} {"train_loss": -11.120416641235352, "global_step": 474563, "epoch": 2824} {"train_loss": -11.199359893798828, "global_step": 474564, "epoch": 2824} {"train_loss": -11.394002914428711, "global_step": 474565, "epoch": 2824} {"train_loss": -11.238252639770508, "global_step": 474566, "epoch": 2824} {"train_loss": -11.82983112335205, "global_step": 474567, "epoch": 2824} {"train_loss": -11.472085952758789, "global_step": 474568, "epoch": 2824} {"train_loss": -11.689125061035156, "global_step": 474569, "epoch": 2824} {"train_loss": -11.357443809509277, "global_step": 474570, "epoch": 2824} {"train_loss": -11.30283260345459, "global_step": 474571, "epoch": 2824} {"train_loss": -10.99612808227539, "global_step": 474572, "epoch": 2824} {"train_loss": -11.12337875366211, "global_step": 474573, "epoch": 2824} {"train_loss": -11.717459678649902, "global_step": 474574, "epoch": 2824} {"train_loss": -11.03201961517334, "global_step": 474575, "epoch": 2824} {"train_loss": -12.187732696533203, "global_step": 474576, "epoch": 2824} {"train_loss": -10.950882911682129, "global_step": 474577, "epoch": 2824} {"train_loss": -11.815147399902344, "global_step": 474578, "epoch": 2824} {"train_loss": -11.76723861694336, "global_step": 474579, "epoch": 2824} {"train_loss": -11.747047424316406, "global_step": 474580, "epoch": 2824} {"train_loss": -11.636348724365234, "global_step": 474581, "epoch": 2824} {"train_loss": -11.206350326538086, "global_step": 474582, "epoch": 2824} {"train_loss": -12.102096557617188, "global_step": 474583, "epoch": 2824} {"train_loss": -11.166755676269531, "global_step": 474584, "epoch": 2824} {"train_loss": -12.003791809082031, "global_step": 474585, "epoch": 2824} {"train_loss": -12.133769035339355, "global_step": 474586, "epoch": 2824} {"train_loss": -11.680032730102539, "global_step": 474587, "epoch": 2824} {"train_loss": -12.557025909423828, "global_step": 474588, "epoch": 2824} {"train_loss": -12.07758903503418, "global_step": 474589, "epoch": 2824} {"train_loss": -12.27713394165039, "global_step": 474590, "epoch": 2824} {"train_loss": -11.8964204788208, "global_step": 474591, "epoch": 2824} {"train_loss": -12.149955749511719, "global_step": 474592, "epoch": 2824} {"train_loss": -12.248895645141602, "global_step": 474593, "epoch": 2824} {"train_loss": -12.281963348388672, "global_step": 474594, "epoch": 2824} {"train_loss": -12.11845874786377, "global_step": 474595, "epoch": 2824} {"train_loss": -12.213761329650879, "global_step": 474596, "epoch": 2824} {"train_loss": -12.394137382507324, "global_step": 474597, "epoch": 2824} {"train_loss": -12.444632530212402, "global_step": 474598, "epoch": 2824} {"train_loss": -11.945644509224664, "global_step": 474599, "epoch": 2824, "val_loss": 316722.09375} {"train_loss": -12.342930793762207, "global_step": 474600, "epoch": 2825} {"train_loss": -12.592252731323242, "global_step": 474601, "epoch": 2825} {"train_loss": -12.313898086547852, "global_step": 474602, "epoch": 2825} {"train_loss": -12.451560974121094, "global_step": 474603, "epoch": 2825} {"train_loss": -12.591094970703125, "global_step": 474604, "epoch": 2825} {"train_loss": -12.540868759155273, "global_step": 474605, "epoch": 2825} {"train_loss": -12.665868759155273, "global_step": 474606, "epoch": 2825} {"train_loss": -12.549215316772461, "global_step": 474607, "epoch": 2825} {"train_loss": -12.537694931030273, "global_step": 474608, "epoch": 2825} {"train_loss": -12.790163040161133, "global_step": 474609, "epoch": 2825} {"train_loss": -12.726152420043945, "global_step": 474610, "epoch": 2825} {"train_loss": -12.744674682617188, "global_step": 474611, "epoch": 2825} {"train_loss": -12.430817604064941, "global_step": 474612, "epoch": 2825} {"train_loss": -12.60123062133789, "global_step": 474613, "epoch": 2825} {"train_loss": -12.093061447143555, "global_step": 474614, "epoch": 2825} {"train_loss": -12.542854309082031, "global_step": 474615, "epoch": 2825} {"train_loss": -12.145648956298828, "global_step": 474616, "epoch": 2825} {"train_loss": -12.384902954101562, "global_step": 474617, "epoch": 2825} {"train_loss": -12.444036483764648, "global_step": 474618, "epoch": 2825} {"train_loss": -12.278619766235352, "global_step": 474619, "epoch": 2825} {"train_loss": -12.689814567565918, "global_step": 474620, "epoch": 2825} {"train_loss": -12.636955261230469, "global_step": 474621, "epoch": 2825} {"train_loss": -12.51192569732666, "global_step": 474622, "epoch": 2825} {"train_loss": -12.53438949584961, "global_step": 474623, "epoch": 2825} {"train_loss": -12.29318618774414, "global_step": 474624, "epoch": 2825} {"train_loss": -12.669507026672363, "global_step": 474625, "epoch": 2825} {"train_loss": -12.67380428314209, "global_step": 474626, "epoch": 2825} {"train_loss": -12.427507400512695, "global_step": 474627, "epoch": 2825} {"train_loss": -12.463363647460938, "global_step": 474628, "epoch": 2825} {"train_loss": -12.672712326049805, "global_step": 474629, "epoch": 2825} {"train_loss": -12.672179222106934, "global_step": 474630, "epoch": 2825} {"train_loss": -12.752645492553711, "global_step": 474631, "epoch": 2825} {"train_loss": -12.240336418151855, "global_step": 474632, "epoch": 2825} {"train_loss": -12.516572952270508, "global_step": 474633, "epoch": 2825} {"train_loss": -12.801139831542969, "global_step": 474634, "epoch": 2825} {"train_loss": -12.543978691101074, "global_step": 474635, "epoch": 2825} {"train_loss": -12.509270668029785, "global_step": 474636, "epoch": 2825} {"train_loss": -12.329061508178711, "global_step": 474637, "epoch": 2825} {"train_loss": -11.725777626037598, "global_step": 474638, "epoch": 2825} {"train_loss": -12.444620132446289, "global_step": 474639, "epoch": 2825} {"train_loss": -11.57994270324707, "global_step": 474640, "epoch": 2825} {"train_loss": -12.542174339294434, "global_step": 474641, "epoch": 2825} {"train_loss": -12.527312278747559, "global_step": 474642, "epoch": 2825} {"train_loss": -11.099218368530273, "global_step": 474643, "epoch": 2825} {"train_loss": -12.770627975463867, "global_step": 474644, "epoch": 2825} {"train_loss": -11.477872848510742, "global_step": 474645, "epoch": 2825} {"train_loss": -12.067689895629883, "global_step": 474646, "epoch": 2825} {"train_loss": -12.467470169067383, "global_step": 474647, "epoch": 2825} {"train_loss": -11.277915000915527, "global_step": 474648, "epoch": 2825} {"train_loss": -12.621688842773438, "global_step": 474649, "epoch": 2825} {"train_loss": -11.89910888671875, "global_step": 474650, "epoch": 2825} {"train_loss": -12.688863754272461, "global_step": 474651, "epoch": 2825} {"train_loss": -12.401410102844238, "global_step": 474652, "epoch": 2825} {"train_loss": -12.461301803588867, "global_step": 474653, "epoch": 2825} {"train_loss": -12.651524543762207, "global_step": 474654, "epoch": 2825} {"train_loss": -12.198409080505371, "global_step": 474655, "epoch": 2825} {"train_loss": -12.269124984741211, "global_step": 474656, "epoch": 2825} {"train_loss": -12.362174034118652, "global_step": 474657, "epoch": 2825} {"train_loss": -11.947063446044922, "global_step": 474658, "epoch": 2825} {"train_loss": -11.784269332885742, "global_step": 474659, "epoch": 2825} {"train_loss": -12.303266525268555, "global_step": 474660, "epoch": 2825} {"train_loss": -12.389503479003906, "global_step": 474661, "epoch": 2825} {"train_loss": -12.144515991210938, "global_step": 474662, "epoch": 2825} {"train_loss": -12.258651733398438, "global_step": 474663, "epoch": 2825} {"train_loss": -12.118148803710938, "global_step": 474664, "epoch": 2825} {"train_loss": -12.613818168640137, "global_step": 474665, "epoch": 2825} {"train_loss": -12.440296173095703, "global_step": 474666, "epoch": 2825} {"train_loss": -12.473909378051758, "global_step": 474667, "epoch": 2825} {"train_loss": -12.72254753112793, "global_step": 474668, "epoch": 2825} {"train_loss": -12.665295600891113, "global_step": 474669, "epoch": 2825} {"train_loss": -12.635013580322266, "global_step": 474670, "epoch": 2825} {"train_loss": -12.395783424377441, "global_step": 474671, "epoch": 2825} {"train_loss": -12.590620040893555, "global_step": 474672, "epoch": 2825} {"train_loss": -12.494436264038086, "global_step": 474673, "epoch": 2825} {"train_loss": -12.634330749511719, "global_step": 474674, "epoch": 2825} {"train_loss": -12.761737823486328, "global_step": 474675, "epoch": 2825} {"train_loss": -12.612310409545898, "global_step": 474676, "epoch": 2825} {"train_loss": -12.702934265136719, "global_step": 474677, "epoch": 2825} {"train_loss": -12.713879585266113, "global_step": 474678, "epoch": 2825} {"train_loss": -12.529186248779297, "global_step": 474679, "epoch": 2825} {"train_loss": -12.532469749450684, "global_step": 474680, "epoch": 2825} {"train_loss": -12.48970890045166, "global_step": 474681, "epoch": 2825} {"train_loss": -12.4732666015625, "global_step": 474682, "epoch": 2825} {"train_loss": -12.385168075561523, "global_step": 474683, "epoch": 2825} {"train_loss": -12.659194946289062, "global_step": 474684, "epoch": 2825} {"train_loss": -12.562971115112305, "global_step": 474685, "epoch": 2825} {"train_loss": -12.623405456542969, "global_step": 474686, "epoch": 2825} {"train_loss": -12.435890197753906, "global_step": 474687, "epoch": 2825} {"train_loss": -12.786676406860352, "global_step": 474688, "epoch": 2825} {"train_loss": -12.534351348876953, "global_step": 474689, "epoch": 2825} {"train_loss": -12.64115047454834, "global_step": 474690, "epoch": 2825} {"train_loss": -12.244463920593262, "global_step": 474691, "epoch": 2825} {"train_loss": -12.683717727661133, "global_step": 474692, "epoch": 2825} {"train_loss": -12.519420623779297, "global_step": 474693, "epoch": 2825} {"train_loss": -12.497314453125, "global_step": 474694, "epoch": 2825} {"train_loss": -12.712224960327148, "global_step": 474695, "epoch": 2825} {"train_loss": -12.82126522064209, "global_step": 474696, "epoch": 2825} {"train_loss": -12.529757499694824, "global_step": 474697, "epoch": 2825} {"train_loss": -12.80246353149414, "global_step": 474698, "epoch": 2825} {"train_loss": -12.841386795043945, "global_step": 474699, "epoch": 2825} {"train_loss": -12.828845024108887, "global_step": 474700, "epoch": 2825} {"train_loss": -12.488612174987793, "global_step": 474701, "epoch": 2825} {"train_loss": -13.043506622314453, "global_step": 474702, "epoch": 2825} {"train_loss": -12.450318336486816, "global_step": 474703, "epoch": 2825} {"train_loss": -12.747037887573242, "global_step": 474704, "epoch": 2825} {"train_loss": -12.483810424804688, "global_step": 474705, "epoch": 2825} {"train_loss": -12.871732711791992, "global_step": 474706, "epoch": 2825} {"train_loss": -12.74016284942627, "global_step": 474707, "epoch": 2825} {"train_loss": -12.768301010131836, "global_step": 474708, "epoch": 2825} {"train_loss": -12.76253604888916, "global_step": 474709, "epoch": 2825} {"train_loss": -12.784991264343262, "global_step": 474710, "epoch": 2825} {"train_loss": -12.704814910888672, "global_step": 474711, "epoch": 2825} {"train_loss": -12.929903030395508, "global_step": 474712, "epoch": 2825} {"train_loss": -12.85807991027832, "global_step": 474713, "epoch": 2825} {"train_loss": -12.749810218811035, "global_step": 474714, "epoch": 2825} {"train_loss": -12.743850708007812, "global_step": 474715, "epoch": 2825} {"train_loss": -12.938033103942871, "global_step": 474716, "epoch": 2825} {"train_loss": -13.063488960266113, "global_step": 474717, "epoch": 2825} {"train_loss": -12.682456970214844, "global_step": 474718, "epoch": 2825} {"train_loss": -12.823125839233398, "global_step": 474719, "epoch": 2825} {"train_loss": -12.866321563720703, "global_step": 474720, "epoch": 2825} {"train_loss": -12.901102066040039, "global_step": 474721, "epoch": 2825} {"train_loss": -12.631219863891602, "global_step": 474722, "epoch": 2825} {"train_loss": -12.98831558227539, "global_step": 474723, "epoch": 2825} {"train_loss": -13.103734970092773, "global_step": 474724, "epoch": 2825} {"train_loss": -12.617452621459961, "global_step": 474725, "epoch": 2825} {"train_loss": -12.548833847045898, "global_step": 474726, "epoch": 2825} {"train_loss": -12.582206726074219, "global_step": 474727, "epoch": 2825} {"train_loss": -12.580015182495117, "global_step": 474728, "epoch": 2825} {"train_loss": -12.4586181640625, "global_step": 474729, "epoch": 2825} {"train_loss": -12.839191436767578, "global_step": 474730, "epoch": 2825} {"train_loss": -12.722819328308105, "global_step": 474731, "epoch": 2825} {"train_loss": -11.742411613464355, "global_step": 474732, "epoch": 2825} {"train_loss": -12.349918365478516, "global_step": 474733, "epoch": 2825} {"train_loss": -12.751574516296387, "global_step": 474734, "epoch": 2825} {"train_loss": -12.133407592773438, "global_step": 474735, "epoch": 2825} {"train_loss": -11.939885139465332, "global_step": 474736, "epoch": 2825} {"train_loss": -11.912210464477539, "global_step": 474737, "epoch": 2825} {"train_loss": -12.936822891235352, "global_step": 474738, "epoch": 2825} {"train_loss": -11.627504348754883, "global_step": 474739, "epoch": 2825} {"train_loss": -11.529144287109375, "global_step": 474740, "epoch": 2825} {"train_loss": -11.04440689086914, "global_step": 474741, "epoch": 2825} {"train_loss": -12.645500183105469, "global_step": 474742, "epoch": 2825} {"train_loss": -8.997138977050781, "global_step": 474743, "epoch": 2825} {"train_loss": -11.492286682128906, "global_step": 474744, "epoch": 2825} {"train_loss": -10.807962417602539, "global_step": 474745, "epoch": 2825} {"train_loss": -9.6033296585083, "global_step": 474746, "epoch": 2825} {"train_loss": -9.830490112304688, "global_step": 474747, "epoch": 2825} {"train_loss": -9.528899192810059, "global_step": 474748, "epoch": 2825} {"train_loss": -12.076107025146484, "global_step": 474749, "epoch": 2825} {"train_loss": -9.503227233886719, "global_step": 474750, "epoch": 2825} {"train_loss": -11.508331298828125, "global_step": 474751, "epoch": 2825} {"train_loss": -10.833623886108398, "global_step": 474752, "epoch": 2825} {"train_loss": -9.536600112915039, "global_step": 474753, "epoch": 2825} {"train_loss": -12.156881332397461, "global_step": 474754, "epoch": 2825} {"train_loss": -9.761076927185059, "global_step": 474755, "epoch": 2825} {"train_loss": -10.992149353027344, "global_step": 474756, "epoch": 2825} {"train_loss": -10.721657752990723, "global_step": 474757, "epoch": 2825} {"train_loss": -9.980772972106934, "global_step": 474758, "epoch": 2825} {"train_loss": -11.559755325317383, "global_step": 474759, "epoch": 2825} {"train_loss": -10.036556243896484, "global_step": 474760, "epoch": 2825} {"train_loss": -10.989608764648438, "global_step": 474761, "epoch": 2825} {"train_loss": -10.509794235229492, "global_step": 474762, "epoch": 2825} {"train_loss": -11.697481155395508, "global_step": 474763, "epoch": 2825} {"train_loss": -11.35792350769043, "global_step": 474764, "epoch": 2825} {"train_loss": -11.19314193725586, "global_step": 474765, "epoch": 2825} {"train_loss": -11.372178077697754, "global_step": 474766, "epoch": 2825} {"train_loss": -12.222322026888529, "global_step": 474767, "epoch": 2825, "val_loss": 315022.96875, "train_action_mse_error": 0.8420184254646301} {"train_loss": -11.074522018432617, "global_step": 474768, "epoch": 2826} {"train_loss": -12.378726959228516, "global_step": 474769, "epoch": 2826} {"train_loss": -11.562273025512695, "global_step": 474770, "epoch": 2826} {"train_loss": -11.875154495239258, "global_step": 474771, "epoch": 2826} {"train_loss": -12.024232864379883, "global_step": 474772, "epoch": 2826} {"train_loss": -11.796394348144531, "global_step": 474773, "epoch": 2826} {"train_loss": -11.740232467651367, "global_step": 474774, "epoch": 2826} {"train_loss": -11.81151294708252, "global_step": 474775, "epoch": 2826} {"train_loss": -11.836601257324219, "global_step": 474776, "epoch": 2826} {"train_loss": -11.60628890991211, "global_step": 474777, "epoch": 2826} {"train_loss": -12.26341438293457, "global_step": 474778, "epoch": 2826} {"train_loss": -11.669439315795898, "global_step": 474779, "epoch": 2826} {"train_loss": -11.95478630065918, "global_step": 474780, "epoch": 2826} {"train_loss": -11.890911102294922, "global_step": 474781, "epoch": 2826} {"train_loss": -11.828271865844727, "global_step": 474782, "epoch": 2826} {"train_loss": -11.867560386657715, "global_step": 474783, "epoch": 2826} {"train_loss": -12.12226676940918, "global_step": 474784, "epoch": 2826} {"train_loss": -12.257009506225586, "global_step": 474785, "epoch": 2826} {"train_loss": -12.256717681884766, "global_step": 474786, "epoch": 2826} {"train_loss": -12.223268508911133, "global_step": 474787, "epoch": 2826} {"train_loss": -12.514686584472656, "global_step": 474788, "epoch": 2826} {"train_loss": -12.455920219421387, "global_step": 474789, "epoch": 2826} {"train_loss": -12.110208511352539, "global_step": 474790, "epoch": 2826} {"train_loss": -12.451333999633789, "global_step": 474791, "epoch": 2826} {"train_loss": -12.353311538696289, "global_step": 474792, "epoch": 2826} {"train_loss": -12.683216094970703, "global_step": 474793, "epoch": 2826} {"train_loss": -12.022394180297852, "global_step": 474794, "epoch": 2826} {"train_loss": -12.400283813476562, "global_step": 474795, "epoch": 2826} {"train_loss": -12.282672882080078, "global_step": 474796, "epoch": 2826} {"train_loss": -12.691181182861328, "global_step": 474797, "epoch": 2826} {"train_loss": -12.416276931762695, "global_step": 474798, "epoch": 2826} {"train_loss": -12.515247344970703, "global_step": 474799, "epoch": 2826} {"train_loss": -12.589983940124512, "global_step": 474800, "epoch": 2826} {"train_loss": -12.59981632232666, "global_step": 474801, "epoch": 2826} {"train_loss": -12.716985702514648, "global_step": 474802, "epoch": 2826} {"train_loss": -12.404879570007324, "global_step": 474803, "epoch": 2826} {"train_loss": -12.718313217163086, "global_step": 474804, "epoch": 2826} {"train_loss": -12.56002426147461, "global_step": 474805, "epoch": 2826} {"train_loss": -12.702845573425293, "global_step": 474806, "epoch": 2826} {"train_loss": -12.464836120605469, "global_step": 474807, "epoch": 2826} {"train_loss": -12.640701293945312, "global_step": 474808, "epoch": 2826} {"train_loss": -12.435526847839355, "global_step": 474809, "epoch": 2826} {"train_loss": -12.509370803833008, "global_step": 474810, "epoch": 2826} {"train_loss": -12.468433380126953, "global_step": 474811, "epoch": 2826} {"train_loss": -12.353001594543457, "global_step": 474812, "epoch": 2826} {"train_loss": -12.523486137390137, "global_step": 474813, "epoch": 2826} {"train_loss": -12.789571762084961, "global_step": 474814, "epoch": 2826} {"train_loss": -12.292764663696289, "global_step": 474815, "epoch": 2826} {"train_loss": -12.337163925170898, "global_step": 474816, "epoch": 2826} {"train_loss": -12.698446273803711, "global_step": 474817, "epoch": 2826} {"train_loss": -12.641780853271484, "global_step": 474818, "epoch": 2826} {"train_loss": -12.725826263427734, "global_step": 474819, "epoch": 2826} {"train_loss": -12.912351608276367, "global_step": 474820, "epoch": 2826} {"train_loss": -12.676420211791992, "global_step": 474821, "epoch": 2826} {"train_loss": -12.827936172485352, "global_step": 474822, "epoch": 2826} {"train_loss": -12.689973831176758, "global_step": 474823, "epoch": 2826} {"train_loss": -12.778706550598145, "global_step": 474824, "epoch": 2826} {"train_loss": -12.593287467956543, "global_step": 474825, "epoch": 2826} {"train_loss": -12.440893173217773, "global_step": 474826, "epoch": 2826} {"train_loss": -12.773232460021973, "global_step": 474827, "epoch": 2826} {"train_loss": -12.753175735473633, "global_step": 474828, "epoch": 2826} {"train_loss": -12.425804138183594, "global_step": 474829, "epoch": 2826} {"train_loss": -12.812248229980469, "global_step": 474830, "epoch": 2826} {"train_loss": -12.711243629455566, "global_step": 474831, "epoch": 2826} {"train_loss": -12.642060279846191, "global_step": 474832, "epoch": 2826} {"train_loss": -12.550056457519531, "global_step": 474833, "epoch": 2826} {"train_loss": -12.754959106445312, "global_step": 474834, "epoch": 2826} {"train_loss": -12.509855270385742, "global_step": 474835, "epoch": 2826} {"train_loss": -12.739076614379883, "global_step": 474836, "epoch": 2826} {"train_loss": -12.879016876220703, "global_step": 474837, "epoch": 2826} {"train_loss": -12.670082092285156, "global_step": 474838, "epoch": 2826} {"train_loss": -12.797050476074219, "global_step": 474839, "epoch": 2826} {"train_loss": -12.930137634277344, "global_step": 474840, "epoch": 2826} {"train_loss": -12.923141479492188, "global_step": 474841, "epoch": 2826} {"train_loss": -12.52286148071289, "global_step": 474842, "epoch": 2826} {"train_loss": -13.074735641479492, "global_step": 474843, "epoch": 2826} {"train_loss": -12.721384048461914, "global_step": 474844, "epoch": 2826} {"train_loss": -12.856761932373047, "global_step": 474845, "epoch": 2826} {"train_loss": -12.97496509552002, "global_step": 474846, "epoch": 2826} {"train_loss": -12.926095962524414, "global_step": 474847, "epoch": 2826} {"train_loss": -12.866094589233398, "global_step": 474848, "epoch": 2826} {"train_loss": -12.850737571716309, "global_step": 474849, "epoch": 2826} {"train_loss": -12.839778900146484, "global_step": 474850, "epoch": 2826} {"train_loss": -12.305205345153809, "global_step": 474851, "epoch": 2826} {"train_loss": -12.79127311706543, "global_step": 474852, "epoch": 2826} {"train_loss": -12.648799896240234, "global_step": 474853, "epoch": 2826} {"train_loss": -12.723474502563477, "global_step": 474854, "epoch": 2826} {"train_loss": -12.461577415466309, "global_step": 474855, "epoch": 2826} {"train_loss": -12.717488288879395, "global_step": 474856, "epoch": 2826} {"train_loss": -12.421753883361816, "global_step": 474857, "epoch": 2826} {"train_loss": -12.516164779663086, "global_step": 474858, "epoch": 2826} {"train_loss": -12.373529434204102, "global_step": 474859, "epoch": 2826} {"train_loss": -12.386503219604492, "global_step": 474860, "epoch": 2826} {"train_loss": -12.304948806762695, "global_step": 474861, "epoch": 2826} {"train_loss": -11.553237915039062, "global_step": 474862, "epoch": 2826} {"train_loss": -11.519432067871094, "global_step": 474863, "epoch": 2826} {"train_loss": -12.634971618652344, "global_step": 474864, "epoch": 2826} {"train_loss": -11.54623031616211, "global_step": 474865, "epoch": 2826} {"train_loss": -10.046411514282227, "global_step": 474866, "epoch": 2826} {"train_loss": -12.31183910369873, "global_step": 474867, "epoch": 2826} {"train_loss": -10.20886516571045, "global_step": 474868, "epoch": 2826} {"train_loss": -11.78935718536377, "global_step": 474869, "epoch": 2826} {"train_loss": -11.643956184387207, "global_step": 474870, "epoch": 2826} {"train_loss": -10.238639831542969, "global_step": 474871, "epoch": 2826} {"train_loss": -12.432196617126465, "global_step": 474872, "epoch": 2826} {"train_loss": -11.51720142364502, "global_step": 474873, "epoch": 2826} {"train_loss": -10.279970169067383, "global_step": 474874, "epoch": 2826} {"train_loss": -12.003170013427734, "global_step": 474875, "epoch": 2826} {"train_loss": -11.87094497680664, "global_step": 474876, "epoch": 2826} {"train_loss": -11.791097640991211, "global_step": 474877, "epoch": 2826} {"train_loss": -12.249954223632812, "global_step": 474878, "epoch": 2826} {"train_loss": -11.542539596557617, "global_step": 474879, "epoch": 2826} {"train_loss": -12.081558227539062, "global_step": 474880, "epoch": 2826} {"train_loss": -11.984885215759277, "global_step": 474881, "epoch": 2826} {"train_loss": -11.776115417480469, "global_step": 474882, "epoch": 2826} {"train_loss": -11.66346549987793, "global_step": 474883, "epoch": 2826} {"train_loss": -11.957674980163574, "global_step": 474884, "epoch": 2826} {"train_loss": -11.195172309875488, "global_step": 474885, "epoch": 2826} {"train_loss": -11.463815689086914, "global_step": 474886, "epoch": 2826} {"train_loss": -11.454963684082031, "global_step": 474887, "epoch": 2826} {"train_loss": -11.545511245727539, "global_step": 474888, "epoch": 2826} {"train_loss": -12.136009216308594, "global_step": 474889, "epoch": 2826} {"train_loss": -11.827425003051758, "global_step": 474890, "epoch": 2826} {"train_loss": -12.155899047851562, "global_step": 474891, "epoch": 2826} {"train_loss": -11.986370086669922, "global_step": 474892, "epoch": 2826} {"train_loss": -12.099960327148438, "global_step": 474893, "epoch": 2826} {"train_loss": -11.8613862991333, "global_step": 474894, "epoch": 2826} {"train_loss": -12.186894416809082, "global_step": 474895, "epoch": 2826} {"train_loss": -11.306951522827148, "global_step": 474896, "epoch": 2826} {"train_loss": -11.917825698852539, "global_step": 474897, "epoch": 2826} {"train_loss": -12.319839477539062, "global_step": 474898, "epoch": 2826} {"train_loss": -12.303718566894531, "global_step": 474899, "epoch": 2826} {"train_loss": -12.086593627929688, "global_step": 474900, "epoch": 2826} {"train_loss": -12.107722282409668, "global_step": 474901, "epoch": 2826} {"train_loss": -12.52058219909668, "global_step": 474902, "epoch": 2826} {"train_loss": -12.425899505615234, "global_step": 474903, "epoch": 2826} {"train_loss": -12.373562812805176, "global_step": 474904, "epoch": 2826} {"train_loss": -12.525093078613281, "global_step": 474905, "epoch": 2826} {"train_loss": -12.204200744628906, "global_step": 474906, "epoch": 2826} {"train_loss": -12.362544059753418, "global_step": 474907, "epoch": 2826} {"train_loss": -12.55013656616211, "global_step": 474908, "epoch": 2826} {"train_loss": -11.936214447021484, "global_step": 474909, "epoch": 2826} {"train_loss": -11.78886604309082, "global_step": 474910, "epoch": 2826} {"train_loss": -12.062439918518066, "global_step": 474911, "epoch": 2826} {"train_loss": -12.237968444824219, "global_step": 474912, "epoch": 2826} {"train_loss": -10.945693969726562, "global_step": 474913, "epoch": 2826} {"train_loss": -12.029745101928711, "global_step": 474914, "epoch": 2826} {"train_loss": -11.771631240844727, "global_step": 474915, "epoch": 2826} {"train_loss": -11.910263061523438, "global_step": 474916, "epoch": 2826} {"train_loss": -12.424127578735352, "global_step": 474917, "epoch": 2826} {"train_loss": -11.327902793884277, "global_step": 474918, "epoch": 2826} {"train_loss": -12.206108093261719, "global_step": 474919, "epoch": 2826} {"train_loss": -11.468367576599121, "global_step": 474920, "epoch": 2826} {"train_loss": -11.252756118774414, "global_step": 474921, "epoch": 2826} {"train_loss": -12.53266716003418, "global_step": 474922, "epoch": 2826} {"train_loss": -10.983062744140625, "global_step": 474923, "epoch": 2826} {"train_loss": -12.168591499328613, "global_step": 474924, "epoch": 2826} {"train_loss": -10.293325424194336, "global_step": 474925, "epoch": 2826} {"train_loss": -11.012246131896973, "global_step": 474926, "epoch": 2826} {"train_loss": -11.261667251586914, "global_step": 474927, "epoch": 2826} {"train_loss": -11.153308868408203, "global_step": 474928, "epoch": 2826} {"train_loss": -11.000256538391113, "global_step": 474929, "epoch": 2826} {"train_loss": -12.048548698425293, "global_step": 474930, "epoch": 2826} {"train_loss": -11.444711685180664, "global_step": 474931, "epoch": 2826} {"train_loss": -12.42739486694336, "global_step": 474932, "epoch": 2826} {"train_loss": -11.191123962402344, "global_step": 474933, "epoch": 2826} {"train_loss": -11.831745147705078, "global_step": 474934, "epoch": 2826} {"train_loss": -12.151401922816323, "global_step": 474935, "epoch": 2826, "val_loss": 316365.75} {"train_loss": -11.658827781677246, "global_step": 474936, "epoch": 2827} {"train_loss": -11.984502792358398, "global_step": 474937, "epoch": 2827} {"train_loss": -10.950589179992676, "global_step": 474938, "epoch": 2827} {"train_loss": -12.161369323730469, "global_step": 474939, "epoch": 2827} {"train_loss": -11.8328275680542, "global_step": 474940, "epoch": 2827} {"train_loss": -11.803201675415039, "global_step": 474941, "epoch": 2827} {"train_loss": -11.863929748535156, "global_step": 474942, "epoch": 2827} {"train_loss": -12.32370662689209, "global_step": 474943, "epoch": 2827} {"train_loss": -11.619269371032715, "global_step": 474944, "epoch": 2827} {"train_loss": -12.442510604858398, "global_step": 474945, "epoch": 2827} {"train_loss": -11.872323989868164, "global_step": 474946, "epoch": 2827} {"train_loss": -12.451745986938477, "global_step": 474947, "epoch": 2827} {"train_loss": -12.18358039855957, "global_step": 474948, "epoch": 2827} {"train_loss": -12.031718254089355, "global_step": 474949, "epoch": 2827} {"train_loss": -12.342079162597656, "global_step": 474950, "epoch": 2827} {"train_loss": -12.040521621704102, "global_step": 474951, "epoch": 2827} {"train_loss": -12.101116180419922, "global_step": 474952, "epoch": 2827} {"train_loss": -11.967391967773438, "global_step": 474953, "epoch": 2827} {"train_loss": -12.290782928466797, "global_step": 474954, "epoch": 2827} {"train_loss": -12.27483081817627, "global_step": 474955, "epoch": 2827} {"train_loss": -12.137703895568848, "global_step": 474956, "epoch": 2827} {"train_loss": -12.691391944885254, "global_step": 474957, "epoch": 2827} {"train_loss": -12.12407112121582, "global_step": 474958, "epoch": 2827} {"train_loss": -12.412919044494629, "global_step": 474959, "epoch": 2827} {"train_loss": -12.275712966918945, "global_step": 474960, "epoch": 2827} {"train_loss": -12.288761138916016, "global_step": 474961, "epoch": 2827} {"train_loss": -12.5335111618042, "global_step": 474962, "epoch": 2827} {"train_loss": -11.892894744873047, "global_step": 474963, "epoch": 2827} {"train_loss": -12.463134765625, "global_step": 474964, "epoch": 2827} {"train_loss": -12.522075653076172, "global_step": 474965, "epoch": 2827} {"train_loss": -12.459978103637695, "global_step": 474966, "epoch": 2827} {"train_loss": -12.746030807495117, "global_step": 474967, "epoch": 2827} {"train_loss": -12.516447067260742, "global_step": 474968, "epoch": 2827} {"train_loss": -12.598742485046387, "global_step": 474969, "epoch": 2827} {"train_loss": -12.477245330810547, "global_step": 474970, "epoch": 2827} {"train_loss": -12.662627220153809, "global_step": 474971, "epoch": 2827} {"train_loss": -12.368316650390625, "global_step": 474972, "epoch": 2827} {"train_loss": -12.594317436218262, "global_step": 474973, "epoch": 2827} {"train_loss": -12.502021789550781, "global_step": 474974, "epoch": 2827} {"train_loss": -12.508420944213867, "global_step": 474975, "epoch": 2827} {"train_loss": -12.413581848144531, "global_step": 474976, "epoch": 2827} {"train_loss": -12.364398002624512, "global_step": 474977, "epoch": 2827} {"train_loss": -12.59410285949707, "global_step": 474978, "epoch": 2827} {"train_loss": -12.501081466674805, "global_step": 474979, "epoch": 2827} {"train_loss": -12.77871322631836, "global_step": 474980, "epoch": 2827} {"train_loss": -12.343631744384766, "global_step": 474981, "epoch": 2827} {"train_loss": -12.65852165222168, "global_step": 474982, "epoch": 2827} {"train_loss": -12.586153984069824, "global_step": 474983, "epoch": 2827} {"train_loss": -12.920132637023926, "global_step": 474984, "epoch": 2827} {"train_loss": -12.899247169494629, "global_step": 474985, "epoch": 2827} {"train_loss": -12.600132942199707, "global_step": 474986, "epoch": 2827} {"train_loss": -12.924705505371094, "global_step": 474987, "epoch": 2827} {"train_loss": -12.74293327331543, "global_step": 474988, "epoch": 2827} {"train_loss": -12.671070098876953, "global_step": 474989, "epoch": 2827} {"train_loss": -12.991632461547852, "global_step": 474990, "epoch": 2827} {"train_loss": -12.77902603149414, "global_step": 474991, "epoch": 2827} {"train_loss": -12.999876022338867, "global_step": 474992, "epoch": 2827} {"train_loss": -12.862710952758789, "global_step": 474993, "epoch": 2827} {"train_loss": -12.793270111083984, "global_step": 474994, "epoch": 2827} {"train_loss": -13.047861099243164, "global_step": 474995, "epoch": 2827} {"train_loss": -12.759210586547852, "global_step": 474996, "epoch": 2827} {"train_loss": -12.884310722351074, "global_step": 474997, "epoch": 2827} {"train_loss": -12.757871627807617, "global_step": 474998, "epoch": 2827} {"train_loss": -12.868886947631836, "global_step": 474999, "epoch": 2827} {"train_loss": -12.831560134887695, "global_step": 475000, "epoch": 2827} {"train_loss": -12.939863204956055, "global_step": 475001, "epoch": 2827} {"train_loss": -12.841069221496582, "global_step": 475002, "epoch": 2827} {"train_loss": -13.027643203735352, "global_step": 475003, "epoch": 2827} {"train_loss": -12.867927551269531, "global_step": 475004, "epoch": 2827} {"train_loss": -13.077071189880371, "global_step": 475005, "epoch": 2827} {"train_loss": -13.131339073181152, "global_step": 475006, "epoch": 2827} {"train_loss": -12.918252944946289, "global_step": 475007, "epoch": 2827} {"train_loss": -12.981205940246582, "global_step": 475008, "epoch": 2827} {"train_loss": -13.059467315673828, "global_step": 475009, "epoch": 2827} {"train_loss": -12.844976425170898, "global_step": 475010, "epoch": 2827} {"train_loss": -12.566204071044922, "global_step": 475011, "epoch": 2827} {"train_loss": -12.720975875854492, "global_step": 475012, "epoch": 2827} {"train_loss": -12.933298110961914, "global_step": 475013, "epoch": 2827} {"train_loss": -12.67559814453125, "global_step": 475014, "epoch": 2827} {"train_loss": -12.95341682434082, "global_step": 475015, "epoch": 2827} {"train_loss": -12.841243743896484, "global_step": 475016, "epoch": 2827} {"train_loss": -13.087389945983887, "global_step": 475017, "epoch": 2827} {"train_loss": -12.938494682312012, "global_step": 475018, "epoch": 2827} {"train_loss": -12.997344017028809, "global_step": 475019, "epoch": 2827} {"train_loss": -12.794527053833008, "global_step": 475020, "epoch": 2827} {"train_loss": -12.753570556640625, "global_step": 475021, "epoch": 2827} {"train_loss": -12.986194610595703, "global_step": 475022, "epoch": 2827} {"train_loss": -12.745035171508789, "global_step": 475023, "epoch": 2827} {"train_loss": -12.522457122802734, "global_step": 475024, "epoch": 2827} {"train_loss": -12.954036712646484, "global_step": 475025, "epoch": 2827} {"train_loss": -12.36484432220459, "global_step": 475026, "epoch": 2827} {"train_loss": -12.050528526306152, "global_step": 475027, "epoch": 2827} {"train_loss": -12.616411209106445, "global_step": 475028, "epoch": 2827} {"train_loss": -12.842453002929688, "global_step": 475029, "epoch": 2827} {"train_loss": -11.672752380371094, "global_step": 475030, "epoch": 2827} {"train_loss": -11.848251342773438, "global_step": 475031, "epoch": 2827} {"train_loss": -12.678403854370117, "global_step": 475032, "epoch": 2827} {"train_loss": -11.277502059936523, "global_step": 475033, "epoch": 2827} {"train_loss": -11.559757232666016, "global_step": 475034, "epoch": 2827} {"train_loss": -12.004034042358398, "global_step": 475035, "epoch": 2827} {"train_loss": -11.611631393432617, "global_step": 475036, "epoch": 2827} {"train_loss": -11.880378723144531, "global_step": 475037, "epoch": 2827} {"train_loss": -12.183921813964844, "global_step": 475038, "epoch": 2827} {"train_loss": -11.531471252441406, "global_step": 475039, "epoch": 2827} {"train_loss": -12.00013542175293, "global_step": 475040, "epoch": 2827} {"train_loss": -12.052875518798828, "global_step": 475041, "epoch": 2827} {"train_loss": -11.974857330322266, "global_step": 475042, "epoch": 2827} {"train_loss": -11.688718795776367, "global_step": 475043, "epoch": 2827} {"train_loss": -11.623001098632812, "global_step": 475044, "epoch": 2827} {"train_loss": -10.513395309448242, "global_step": 475045, "epoch": 2827} {"train_loss": -11.118696212768555, "global_step": 475046, "epoch": 2827} {"train_loss": -11.890609741210938, "global_step": 475047, "epoch": 2827} {"train_loss": -11.077372550964355, "global_step": 475048, "epoch": 2827} {"train_loss": -11.5367431640625, "global_step": 475049, "epoch": 2827} {"train_loss": -11.958218574523926, "global_step": 475050, "epoch": 2827} {"train_loss": -11.777989387512207, "global_step": 475051, "epoch": 2827} {"train_loss": -11.794717788696289, "global_step": 475052, "epoch": 2827} {"train_loss": -12.627432823181152, "global_step": 475053, "epoch": 2827} {"train_loss": -11.96870231628418, "global_step": 475054, "epoch": 2827} {"train_loss": -11.628840446472168, "global_step": 475055, "epoch": 2827} {"train_loss": -11.830855369567871, "global_step": 475056, "epoch": 2827} {"train_loss": -11.721122741699219, "global_step": 475057, "epoch": 2827} {"train_loss": -11.935096740722656, "global_step": 475058, "epoch": 2827} {"train_loss": -11.867267608642578, "global_step": 475059, "epoch": 2827} {"train_loss": -11.274605751037598, "global_step": 475060, "epoch": 2827} {"train_loss": -11.901448249816895, "global_step": 475061, "epoch": 2827} {"train_loss": -10.982905387878418, "global_step": 475062, "epoch": 2827} {"train_loss": -11.497049331665039, "global_step": 475063, "epoch": 2827} {"train_loss": -11.555400848388672, "global_step": 475064, "epoch": 2827} {"train_loss": -11.62797737121582, "global_step": 475065, "epoch": 2827} {"train_loss": -12.102080345153809, "global_step": 475066, "epoch": 2827} {"train_loss": -11.88337230682373, "global_step": 475067, "epoch": 2827} {"train_loss": -12.338160514831543, "global_step": 475068, "epoch": 2827} {"train_loss": -12.018806457519531, "global_step": 475069, "epoch": 2827} {"train_loss": -12.123590469360352, "global_step": 475070, "epoch": 2827} {"train_loss": -11.778692245483398, "global_step": 475071, "epoch": 2827} {"train_loss": -12.23752212524414, "global_step": 475072, "epoch": 2827} {"train_loss": -12.101089477539062, "global_step": 475073, "epoch": 2827} {"train_loss": -12.535858154296875, "global_step": 475074, "epoch": 2827} {"train_loss": -12.523067474365234, "global_step": 475075, "epoch": 2827} {"train_loss": -12.102148056030273, "global_step": 475076, "epoch": 2827} {"train_loss": -12.655525207519531, "global_step": 475077, "epoch": 2827} {"train_loss": -12.556403160095215, "global_step": 475078, "epoch": 2827} {"train_loss": -12.724034309387207, "global_step": 475079, "epoch": 2827} {"train_loss": -12.362987518310547, "global_step": 475080, "epoch": 2827} {"train_loss": -12.623997688293457, "global_step": 475081, "epoch": 2827} {"train_loss": -12.484816551208496, "global_step": 475082, "epoch": 2827} {"train_loss": -12.477405548095703, "global_step": 475083, "epoch": 2827} {"train_loss": -12.732129096984863, "global_step": 475084, "epoch": 2827} {"train_loss": -12.643321990966797, "global_step": 475085, "epoch": 2827} {"train_loss": -12.760782241821289, "global_step": 475086, "epoch": 2827} {"train_loss": -12.680316925048828, "global_step": 475087, "epoch": 2827} {"train_loss": -12.59682559967041, "global_step": 475088, "epoch": 2827} {"train_loss": -12.911975860595703, "global_step": 475089, "epoch": 2827} {"train_loss": -12.448568344116211, "global_step": 475090, "epoch": 2827} {"train_loss": -12.672765731811523, "global_step": 475091, "epoch": 2827} {"train_loss": -12.436676025390625, "global_step": 475092, "epoch": 2827} {"train_loss": -12.676185607910156, "global_step": 475093, "epoch": 2827} {"train_loss": -12.767936706542969, "global_step": 475094, "epoch": 2827} {"train_loss": -12.714908599853516, "global_step": 475095, "epoch": 2827} {"train_loss": -12.76838493347168, "global_step": 475096, "epoch": 2827} {"train_loss": -12.832939147949219, "global_step": 475097, "epoch": 2827} {"train_loss": -12.696147918701172, "global_step": 475098, "epoch": 2827} {"train_loss": -12.987399101257324, "global_step": 475099, "epoch": 2827} {"train_loss": -12.724891662597656, "global_step": 475100, "epoch": 2827} {"train_loss": -12.354496002197266, "global_step": 475101, "epoch": 2827} {"train_loss": -12.315835952758789, "global_step": 475102, "epoch": 2827} {"train_loss": -12.36100839433216, "global_step": 475103, "epoch": 2827, "val_loss": 316252.1875} {"train_loss": -12.690165519714355, "global_step": 475104, "epoch": 2828} {"train_loss": -12.982986450195312, "global_step": 475105, "epoch": 2828} {"train_loss": -12.310506820678711, "global_step": 475106, "epoch": 2828} {"train_loss": -12.705169677734375, "global_step": 475107, "epoch": 2828} {"train_loss": -12.601003646850586, "global_step": 475108, "epoch": 2828} {"train_loss": -12.301250457763672, "global_step": 475109, "epoch": 2828} {"train_loss": -12.68605899810791, "global_step": 475110, "epoch": 2828} {"train_loss": -12.151203155517578, "global_step": 475111, "epoch": 2828} {"train_loss": -12.2442045211792, "global_step": 475112, "epoch": 2828} {"train_loss": -12.614611625671387, "global_step": 475113, "epoch": 2828} {"train_loss": -12.86515998840332, "global_step": 475114, "epoch": 2828} {"train_loss": -12.561958312988281, "global_step": 475115, "epoch": 2828} {"train_loss": -12.878357887268066, "global_step": 475116, "epoch": 2828} {"train_loss": -12.603755950927734, "global_step": 475117, "epoch": 2828} {"train_loss": -12.990415573120117, "global_step": 475118, "epoch": 2828} {"train_loss": -12.588748931884766, "global_step": 475119, "epoch": 2828} {"train_loss": -12.632111549377441, "global_step": 475120, "epoch": 2828} {"train_loss": -12.69407844543457, "global_step": 475121, "epoch": 2828} {"train_loss": -12.53144645690918, "global_step": 475122, "epoch": 2828} {"train_loss": -12.859186172485352, "global_step": 475123, "epoch": 2828} {"train_loss": -12.525766372680664, "global_step": 475124, "epoch": 2828} {"train_loss": -12.6290864944458, "global_step": 475125, "epoch": 2828} {"train_loss": -12.589377403259277, "global_step": 475126, "epoch": 2828} {"train_loss": -12.760003089904785, "global_step": 475127, "epoch": 2828} {"train_loss": -12.018135070800781, "global_step": 475128, "epoch": 2828} {"train_loss": -11.64760684967041, "global_step": 475129, "epoch": 2828} {"train_loss": -12.395326614379883, "global_step": 475130, "epoch": 2828} {"train_loss": -12.12124252319336, "global_step": 475131, "epoch": 2828} {"train_loss": -11.178657531738281, "global_step": 475132, "epoch": 2828} {"train_loss": -10.462218284606934, "global_step": 475133, "epoch": 2828} {"train_loss": -11.4892578125, "global_step": 475134, "epoch": 2828} {"train_loss": -12.255706787109375, "global_step": 475135, "epoch": 2828} {"train_loss": -10.385808944702148, "global_step": 475136, "epoch": 2828} {"train_loss": -11.951862335205078, "global_step": 475137, "epoch": 2828} {"train_loss": -9.943182945251465, "global_step": 475138, "epoch": 2828} {"train_loss": -10.340252876281738, "global_step": 475139, "epoch": 2828} {"train_loss": -8.770055770874023, "global_step": 475140, "epoch": 2828} {"train_loss": -7.619719505310059, "global_step": 475141, "epoch": 2828} {"train_loss": -8.198179244995117, "global_step": 475142, "epoch": 2828} {"train_loss": -8.208944320678711, "global_step": 475143, "epoch": 2828} {"train_loss": -7.767706394195557, "global_step": 475144, "epoch": 2828} {"train_loss": -8.381866455078125, "global_step": 475145, "epoch": 2828} {"train_loss": -8.644301414489746, "global_step": 475146, "epoch": 2828} {"train_loss": -8.573278427124023, "global_step": 475147, "epoch": 2828} {"train_loss": -8.792155265808105, "global_step": 475148, "epoch": 2828} {"train_loss": -8.554586410522461, "global_step": 475149, "epoch": 2828} {"train_loss": -9.27513313293457, "global_step": 475150, "epoch": 2828} {"train_loss": -9.009989738464355, "global_step": 475151, "epoch": 2828} {"train_loss": -9.070186614990234, "global_step": 475152, "epoch": 2828} {"train_loss": -9.421578407287598, "global_step": 475153, "epoch": 2828} {"train_loss": -9.455181121826172, "global_step": 475154, "epoch": 2828} {"train_loss": -9.612068176269531, "global_step": 475155, "epoch": 2828} {"train_loss": -9.25695514678955, "global_step": 475156, "epoch": 2828} {"train_loss": -10.502180099487305, "global_step": 475157, "epoch": 2828} {"train_loss": -10.076945304870605, "global_step": 475158, "epoch": 2828} {"train_loss": -10.543149948120117, "global_step": 475159, "epoch": 2828} {"train_loss": -10.896787643432617, "global_step": 475160, "epoch": 2828} {"train_loss": -10.582647323608398, "global_step": 475161, "epoch": 2828} {"train_loss": -10.616762161254883, "global_step": 475162, "epoch": 2828} {"train_loss": -10.821587562561035, "global_step": 475163, "epoch": 2828} {"train_loss": -10.49211597442627, "global_step": 475164, "epoch": 2828} {"train_loss": -11.669496536254883, "global_step": 475165, "epoch": 2828} {"train_loss": -11.300007820129395, "global_step": 475166, "epoch": 2828} {"train_loss": -11.653244972229004, "global_step": 475167, "epoch": 2828} {"train_loss": -11.719804763793945, "global_step": 475168, "epoch": 2828} {"train_loss": -11.19206428527832, "global_step": 475169, "epoch": 2828} {"train_loss": -11.920251846313477, "global_step": 475170, "epoch": 2828} {"train_loss": -11.735767364501953, "global_step": 475171, "epoch": 2828} {"train_loss": -12.200296401977539, "global_step": 475172, "epoch": 2828} {"train_loss": -12.134038925170898, "global_step": 475173, "epoch": 2828} {"train_loss": -11.794561386108398, "global_step": 475174, "epoch": 2828} {"train_loss": -12.152298927307129, "global_step": 475175, "epoch": 2828} {"train_loss": -11.723483085632324, "global_step": 475176, "epoch": 2828} {"train_loss": -12.056707382202148, "global_step": 475177, "epoch": 2828} {"train_loss": -11.976419448852539, "global_step": 475178, "epoch": 2828} {"train_loss": -12.10915756225586, "global_step": 475179, "epoch": 2828} {"train_loss": -12.106159210205078, "global_step": 475180, "epoch": 2828} {"train_loss": -12.109981536865234, "global_step": 475181, "epoch": 2828} {"train_loss": -12.453819274902344, "global_step": 475182, "epoch": 2828} {"train_loss": -12.178860664367676, "global_step": 475183, "epoch": 2828} {"train_loss": -12.175981521606445, "global_step": 475184, "epoch": 2828} {"train_loss": -12.271299362182617, "global_step": 475185, "epoch": 2828} {"train_loss": -12.507301330566406, "global_step": 475186, "epoch": 2828} {"train_loss": -12.292000770568848, "global_step": 475187, "epoch": 2828} {"train_loss": -12.467159271240234, "global_step": 475188, "epoch": 2828} {"train_loss": -12.616459846496582, "global_step": 475189, "epoch": 2828} {"train_loss": -12.393000602722168, "global_step": 475190, "epoch": 2828} {"train_loss": -12.584409713745117, "global_step": 475191, "epoch": 2828} {"train_loss": -12.25497817993164, "global_step": 475192, "epoch": 2828} {"train_loss": -12.410653114318848, "global_step": 475193, "epoch": 2828} {"train_loss": -12.497724533081055, "global_step": 475194, "epoch": 2828} {"train_loss": -12.467775344848633, "global_step": 475195, "epoch": 2828} {"train_loss": -12.60145378112793, "global_step": 475196, "epoch": 2828} {"train_loss": -12.415934562683105, "global_step": 475197, "epoch": 2828} {"train_loss": -12.603313446044922, "global_step": 475198, "epoch": 2828} {"train_loss": -12.827914237976074, "global_step": 475199, "epoch": 2828} {"train_loss": -12.694555282592773, "global_step": 475200, "epoch": 2828} {"train_loss": -12.87614631652832, "global_step": 475201, "epoch": 2828} {"train_loss": -12.496538162231445, "global_step": 475202, "epoch": 2828} {"train_loss": -12.980239868164062, "global_step": 475203, "epoch": 2828} {"train_loss": -12.781848907470703, "global_step": 475204, "epoch": 2828} {"train_loss": -12.749127388000488, "global_step": 475205, "epoch": 2828} {"train_loss": -12.676474571228027, "global_step": 475206, "epoch": 2828} {"train_loss": -12.693999290466309, "global_step": 475207, "epoch": 2828} {"train_loss": -12.787117958068848, "global_step": 475208, "epoch": 2828} {"train_loss": -12.886796951293945, "global_step": 475209, "epoch": 2828} {"train_loss": -12.700742721557617, "global_step": 475210, "epoch": 2828} {"train_loss": -12.83842658996582, "global_step": 475211, "epoch": 2828} {"train_loss": -12.78465461730957, "global_step": 475212, "epoch": 2828} {"train_loss": -12.801898002624512, "global_step": 475213, "epoch": 2828} {"train_loss": -12.753522872924805, "global_step": 475214, "epoch": 2828} {"train_loss": -12.715925216674805, "global_step": 475215, "epoch": 2828} {"train_loss": -12.853803634643555, "global_step": 475216, "epoch": 2828} {"train_loss": -12.990456581115723, "global_step": 475217, "epoch": 2828} {"train_loss": -12.471636772155762, "global_step": 475218, "epoch": 2828} {"train_loss": -12.906075477600098, "global_step": 475219, "epoch": 2828} {"train_loss": -12.860307693481445, "global_step": 475220, "epoch": 2828} {"train_loss": -12.933980941772461, "global_step": 475221, "epoch": 2828} {"train_loss": -12.941001892089844, "global_step": 475222, "epoch": 2828} {"train_loss": -13.063043594360352, "global_step": 475223, "epoch": 2828} {"train_loss": -12.959941864013672, "global_step": 475224, "epoch": 2828} {"train_loss": -12.93387222290039, "global_step": 475225, "epoch": 2828} {"train_loss": -12.957098007202148, "global_step": 475226, "epoch": 2828} {"train_loss": -13.002859115600586, "global_step": 475227, "epoch": 2828} {"train_loss": -13.004512786865234, "global_step": 475228, "epoch": 2828} {"train_loss": -12.760412216186523, "global_step": 475229, "epoch": 2828} {"train_loss": -13.008005142211914, "global_step": 475230, "epoch": 2828} {"train_loss": -13.007698059082031, "global_step": 475231, "epoch": 2828} {"train_loss": -12.77446174621582, "global_step": 475232, "epoch": 2828} {"train_loss": -12.680160522460938, "global_step": 475233, "epoch": 2828} {"train_loss": -12.914220809936523, "global_step": 475234, "epoch": 2828} {"train_loss": -12.843021392822266, "global_step": 475235, "epoch": 2828} {"train_loss": -12.260643005371094, "global_step": 475236, "epoch": 2828} {"train_loss": -12.206741333007812, "global_step": 475237, "epoch": 2828} {"train_loss": -12.790075302124023, "global_step": 475238, "epoch": 2828} {"train_loss": -10.861847877502441, "global_step": 475239, "epoch": 2828} {"train_loss": -10.956998825073242, "global_step": 475240, "epoch": 2828} {"train_loss": -12.215333938598633, "global_step": 475241, "epoch": 2828} {"train_loss": -10.89816665649414, "global_step": 475242, "epoch": 2828} {"train_loss": -10.452718734741211, "global_step": 475243, "epoch": 2828} {"train_loss": -10.396219253540039, "global_step": 475244, "epoch": 2828} {"train_loss": -12.633674621582031, "global_step": 475245, "epoch": 2828} {"train_loss": -10.649145126342773, "global_step": 475246, "epoch": 2828} {"train_loss": -12.659024238586426, "global_step": 475247, "epoch": 2828} {"train_loss": -11.603349685668945, "global_step": 475248, "epoch": 2828} {"train_loss": -11.445952415466309, "global_step": 475249, "epoch": 2828} {"train_loss": -10.661355018615723, "global_step": 475250, "epoch": 2828} {"train_loss": -9.388288497924805, "global_step": 475251, "epoch": 2828} {"train_loss": -10.23157787322998, "global_step": 475252, "epoch": 2828} {"train_loss": -11.655613899230957, "global_step": 475253, "epoch": 2828} {"train_loss": -9.934069633483887, "global_step": 475254, "epoch": 2828} {"train_loss": -10.903629302978516, "global_step": 475255, "epoch": 2828} {"train_loss": -10.959257125854492, "global_step": 475256, "epoch": 2828} {"train_loss": -11.580577850341797, "global_step": 475257, "epoch": 2828} {"train_loss": -10.858370780944824, "global_step": 475258, "epoch": 2828} {"train_loss": -11.543604850769043, "global_step": 475259, "epoch": 2828} {"train_loss": -11.998018264770508, "global_step": 475260, "epoch": 2828} {"train_loss": -11.384323120117188, "global_step": 475261, "epoch": 2828} {"train_loss": -11.815811157226562, "global_step": 475262, "epoch": 2828} {"train_loss": -11.526126861572266, "global_step": 475263, "epoch": 2828} {"train_loss": -12.106768608093262, "global_step": 475264, "epoch": 2828} {"train_loss": -11.71330451965332, "global_step": 475265, "epoch": 2828} {"train_loss": -11.824179649353027, "global_step": 475266, "epoch": 2828} {"train_loss": -11.73522663116455, "global_step": 475267, "epoch": 2828} {"train_loss": -12.148211479187012, "global_step": 475268, "epoch": 2828} {"train_loss": -11.589447021484375, "global_step": 475269, "epoch": 2828} {"train_loss": -12.12150764465332, "global_step": 475270, "epoch": 2828} {"train_loss": -11.735943626789819, "global_step": 475271, "epoch": 2828, "val_loss": 309999.78125} {"train_loss": -12.065082550048828, "global_step": 475272, "epoch": 2829} {"train_loss": -11.721307754516602, "global_step": 475273, "epoch": 2829} {"train_loss": -11.670464515686035, "global_step": 475274, "epoch": 2829} {"train_loss": -11.46164321899414, "global_step": 475275, "epoch": 2829} {"train_loss": -11.10638427734375, "global_step": 475276, "epoch": 2829} {"train_loss": -11.768290519714355, "global_step": 475277, "epoch": 2829} {"train_loss": -11.8192720413208, "global_step": 475278, "epoch": 2829} {"train_loss": -11.387463569641113, "global_step": 475279, "epoch": 2829} {"train_loss": -12.491683006286621, "global_step": 475280, "epoch": 2829} {"train_loss": -10.951711654663086, "global_step": 475281, "epoch": 2829} {"train_loss": -12.196395874023438, "global_step": 475282, "epoch": 2829} {"train_loss": -12.199054718017578, "global_step": 475283, "epoch": 2829} {"train_loss": -12.09263801574707, "global_step": 475284, "epoch": 2829} {"train_loss": -12.51147174835205, "global_step": 475285, "epoch": 2829} {"train_loss": -11.874235153198242, "global_step": 475286, "epoch": 2829} {"train_loss": -12.420185089111328, "global_step": 475287, "epoch": 2829} {"train_loss": -12.271388053894043, "global_step": 475288, "epoch": 2829} {"train_loss": -12.576854705810547, "global_step": 475289, "epoch": 2829} {"train_loss": -12.254877090454102, "global_step": 475290, "epoch": 2829} {"train_loss": -11.854748725891113, "global_step": 475291, "epoch": 2829} {"train_loss": -12.295902252197266, "global_step": 475292, "epoch": 2829} {"train_loss": -11.624814987182617, "global_step": 475293, "epoch": 2829} {"train_loss": -11.77376937866211, "global_step": 475294, "epoch": 2829} {"train_loss": -12.062576293945312, "global_step": 475295, "epoch": 2829} {"train_loss": -12.187337875366211, "global_step": 475296, "epoch": 2829} {"train_loss": -12.488166809082031, "global_step": 475297, "epoch": 2829} {"train_loss": -12.03530502319336, "global_step": 475298, "epoch": 2829} {"train_loss": -12.568571090698242, "global_step": 475299, "epoch": 2829} {"train_loss": -12.405010223388672, "global_step": 475300, "epoch": 2829} {"train_loss": -12.466230392456055, "global_step": 475301, "epoch": 2829} {"train_loss": -12.515092849731445, "global_step": 475302, "epoch": 2829} {"train_loss": -12.532116889953613, "global_step": 475303, "epoch": 2829} {"train_loss": -12.827144622802734, "global_step": 475304, "epoch": 2829} {"train_loss": -12.200331687927246, "global_step": 475305, "epoch": 2829} {"train_loss": -12.837709426879883, "global_step": 475306, "epoch": 2829} {"train_loss": -12.143074035644531, "global_step": 475307, "epoch": 2829} {"train_loss": -12.281349182128906, "global_step": 475308, "epoch": 2829} {"train_loss": -12.473581314086914, "global_step": 475309, "epoch": 2829} {"train_loss": -11.721012115478516, "global_step": 475310, "epoch": 2829} {"train_loss": -12.885688781738281, "global_step": 475311, "epoch": 2829} {"train_loss": -11.662412643432617, "global_step": 475312, "epoch": 2829} {"train_loss": -12.243470191955566, "global_step": 475313, "epoch": 2829} {"train_loss": -12.135988235473633, "global_step": 475314, "epoch": 2829} {"train_loss": -12.056844711303711, "global_step": 475315, "epoch": 2829} {"train_loss": -12.225507736206055, "global_step": 475316, "epoch": 2829} {"train_loss": -12.060443878173828, "global_step": 475317, "epoch": 2829} {"train_loss": -12.64796257019043, "global_step": 475318, "epoch": 2829} {"train_loss": -11.920099258422852, "global_step": 475319, "epoch": 2829} {"train_loss": -12.252923965454102, "global_step": 475320, "epoch": 2829} {"train_loss": -12.334217071533203, "global_step": 475321, "epoch": 2829} {"train_loss": -12.06814193725586, "global_step": 475322, "epoch": 2829} {"train_loss": -12.502309799194336, "global_step": 475323, "epoch": 2829} {"train_loss": -11.386601448059082, "global_step": 475324, "epoch": 2829} {"train_loss": -12.25103759765625, "global_step": 475325, "epoch": 2829} {"train_loss": -11.590974807739258, "global_step": 475326, "epoch": 2829} {"train_loss": -11.690492630004883, "global_step": 475327, "epoch": 2829} {"train_loss": -11.379404067993164, "global_step": 475328, "epoch": 2829} {"train_loss": -12.237289428710938, "global_step": 475329, "epoch": 2829} {"train_loss": -11.53648853302002, "global_step": 475330, "epoch": 2829} {"train_loss": -12.343679428100586, "global_step": 475331, "epoch": 2829} {"train_loss": -11.638212203979492, "global_step": 475332, "epoch": 2829} {"train_loss": -11.698871612548828, "global_step": 475333, "epoch": 2829} {"train_loss": -12.555116653442383, "global_step": 475334, "epoch": 2829} {"train_loss": -11.281270027160645, "global_step": 475335, "epoch": 2829} {"train_loss": -11.846760749816895, "global_step": 475336, "epoch": 2829} {"train_loss": -11.824892044067383, "global_step": 475337, "epoch": 2829} {"train_loss": -12.075413703918457, "global_step": 475338, "epoch": 2829} {"train_loss": -11.463753700256348, "global_step": 475339, "epoch": 2829} {"train_loss": -11.41254997253418, "global_step": 475340, "epoch": 2829} {"train_loss": -12.108665466308594, "global_step": 475341, "epoch": 2829} {"train_loss": -11.355457305908203, "global_step": 475342, "epoch": 2829} {"train_loss": -12.602214813232422, "global_step": 475343, "epoch": 2829} {"train_loss": -11.687889099121094, "global_step": 475344, "epoch": 2829} {"train_loss": -12.470135688781738, "global_step": 475345, "epoch": 2829} {"train_loss": -12.417189598083496, "global_step": 475346, "epoch": 2829} {"train_loss": -12.251611709594727, "global_step": 475347, "epoch": 2829} {"train_loss": -12.624115943908691, "global_step": 475348, "epoch": 2829} {"train_loss": -12.12460994720459, "global_step": 475349, "epoch": 2829} {"train_loss": -11.951969146728516, "global_step": 475350, "epoch": 2829} {"train_loss": -12.425848960876465, "global_step": 475351, "epoch": 2829} {"train_loss": -11.622442245483398, "global_step": 475352, "epoch": 2829} {"train_loss": -12.608368873596191, "global_step": 475353, "epoch": 2829} {"train_loss": -11.942813873291016, "global_step": 475354, "epoch": 2829} {"train_loss": -12.598949432373047, "global_step": 475355, "epoch": 2829} {"train_loss": -12.149686813354492, "global_step": 475356, "epoch": 2829} {"train_loss": -12.696520805358887, "global_step": 475357, "epoch": 2829} {"train_loss": -12.286310195922852, "global_step": 475358, "epoch": 2829} {"train_loss": -12.50607681274414, "global_step": 475359, "epoch": 2829} {"train_loss": -12.46554946899414, "global_step": 475360, "epoch": 2829} {"train_loss": -12.544072151184082, "global_step": 475361, "epoch": 2829} {"train_loss": -12.493799209594727, "global_step": 475362, "epoch": 2829} {"train_loss": -12.750335693359375, "global_step": 475363, "epoch": 2829} {"train_loss": -12.377153396606445, "global_step": 475364, "epoch": 2829} {"train_loss": -12.599797248840332, "global_step": 475365, "epoch": 2829} {"train_loss": -12.498298645019531, "global_step": 475366, "epoch": 2829} {"train_loss": -12.68255615234375, "global_step": 475367, "epoch": 2829} {"train_loss": -12.347273826599121, "global_step": 475368, "epoch": 2829} {"train_loss": -12.51298713684082, "global_step": 475369, "epoch": 2829} {"train_loss": -12.505846977233887, "global_step": 475370, "epoch": 2829} {"train_loss": -12.470890045166016, "global_step": 475371, "epoch": 2829} {"train_loss": -12.612049102783203, "global_step": 475372, "epoch": 2829} {"train_loss": -12.328888893127441, "global_step": 475373, "epoch": 2829} {"train_loss": -12.698408126831055, "global_step": 475374, "epoch": 2829} {"train_loss": -12.443964004516602, "global_step": 475375, "epoch": 2829} {"train_loss": -12.719072341918945, "global_step": 475376, "epoch": 2829} {"train_loss": -12.489181518554688, "global_step": 475377, "epoch": 2829} {"train_loss": -12.901632308959961, "global_step": 475378, "epoch": 2829} {"train_loss": -12.49341106414795, "global_step": 475379, "epoch": 2829} {"train_loss": -12.537437438964844, "global_step": 475380, "epoch": 2829} {"train_loss": -12.741691589355469, "global_step": 475381, "epoch": 2829} {"train_loss": -12.864294052124023, "global_step": 475382, "epoch": 2829} {"train_loss": -12.748141288757324, "global_step": 475383, "epoch": 2829} {"train_loss": -12.700276374816895, "global_step": 475384, "epoch": 2829} {"train_loss": -12.820108413696289, "global_step": 475385, "epoch": 2829} {"train_loss": -12.707120895385742, "global_step": 475386, "epoch": 2829} {"train_loss": -12.91275691986084, "global_step": 475387, "epoch": 2829} {"train_loss": -12.589563369750977, "global_step": 475388, "epoch": 2829} {"train_loss": -12.743086814880371, "global_step": 475389, "epoch": 2829} {"train_loss": -12.515176773071289, "global_step": 475390, "epoch": 2829} {"train_loss": -12.50590705871582, "global_step": 475391, "epoch": 2829} {"train_loss": -12.770822525024414, "global_step": 475392, "epoch": 2829} {"train_loss": -12.74262809753418, "global_step": 475393, "epoch": 2829} {"train_loss": -13.014142990112305, "global_step": 475394, "epoch": 2829} {"train_loss": -12.742265701293945, "global_step": 475395, "epoch": 2829} {"train_loss": -12.727338790893555, "global_step": 475396, "epoch": 2829} {"train_loss": -12.640983581542969, "global_step": 475397, "epoch": 2829} {"train_loss": -12.66757869720459, "global_step": 475398, "epoch": 2829} {"train_loss": -12.655405044555664, "global_step": 475399, "epoch": 2829} {"train_loss": -12.340934753417969, "global_step": 475400, "epoch": 2829} {"train_loss": -12.90217399597168, "global_step": 475401, "epoch": 2829} {"train_loss": -12.768058776855469, "global_step": 475402, "epoch": 2829} {"train_loss": -12.852254867553711, "global_step": 475403, "epoch": 2829} {"train_loss": -12.305036544799805, "global_step": 475404, "epoch": 2829} {"train_loss": -12.19283390045166, "global_step": 475405, "epoch": 2829} {"train_loss": -12.255914688110352, "global_step": 475406, "epoch": 2829} {"train_loss": -12.31674575805664, "global_step": 475407, "epoch": 2829} {"train_loss": -12.517072677612305, "global_step": 475408, "epoch": 2829} {"train_loss": -12.192073822021484, "global_step": 475409, "epoch": 2829} {"train_loss": -12.717284202575684, "global_step": 475410, "epoch": 2829} {"train_loss": -11.642547607421875, "global_step": 475411, "epoch": 2829} {"train_loss": -12.503447532653809, "global_step": 475412, "epoch": 2829} {"train_loss": -11.304588317871094, "global_step": 475413, "epoch": 2829} {"train_loss": -10.509958267211914, "global_step": 475414, "epoch": 2829} {"train_loss": -11.045989990234375, "global_step": 475415, "epoch": 2829} {"train_loss": -10.2684907913208, "global_step": 475416, "epoch": 2829} {"train_loss": -8.627275466918945, "global_step": 475417, "epoch": 2829} {"train_loss": -9.153614044189453, "global_step": 475418, "epoch": 2829} {"train_loss": -9.029061317443848, "global_step": 475419, "epoch": 2829} {"train_loss": -9.668546676635742, "global_step": 475420, "epoch": 2829} {"train_loss": -9.367168426513672, "global_step": 475421, "epoch": 2829} {"train_loss": -10.470634460449219, "global_step": 475422, "epoch": 2829} {"train_loss": -10.16059684753418, "global_step": 475423, "epoch": 2829} {"train_loss": -9.946708679199219, "global_step": 475424, "epoch": 2829} {"train_loss": -10.257336616516113, "global_step": 475425, "epoch": 2829} {"train_loss": -9.4339599609375, "global_step": 475426, "epoch": 2829} {"train_loss": -10.299884796142578, "global_step": 475427, "epoch": 2829} {"train_loss": -9.575551986694336, "global_step": 475428, "epoch": 2829} {"train_loss": -9.698901176452637, "global_step": 475429, "epoch": 2829} {"train_loss": -10.599815368652344, "global_step": 475430, "epoch": 2829} {"train_loss": -11.396663665771484, "global_step": 475431, "epoch": 2829} {"train_loss": -10.915630340576172, "global_step": 475432, "epoch": 2829} {"train_loss": -11.839917182922363, "global_step": 475433, "epoch": 2829} {"train_loss": -11.744949340820312, "global_step": 475434, "epoch": 2829} {"train_loss": -12.082232475280762, "global_step": 475435, "epoch": 2829} {"train_loss": -11.648768424987793, "global_step": 475436, "epoch": 2829} {"train_loss": -11.356582641601562, "global_step": 475437, "epoch": 2829} {"train_loss": -10.996399879455566, "global_step": 475438, "epoch": 2829} {"train_loss": -11.983331782477242, "global_step": 475439, "epoch": 2829, "val_loss": 311100.875} {"train_loss": -11.331010818481445, "global_step": 475440, "epoch": 2830} {"train_loss": -10.842121124267578, "global_step": 475441, "epoch": 2830} {"train_loss": -11.508424758911133, "global_step": 475442, "epoch": 2830} {"train_loss": -10.438340187072754, "global_step": 475443, "epoch": 2830} {"train_loss": -11.591594696044922, "global_step": 475444, "epoch": 2830} {"train_loss": -10.744087219238281, "global_step": 475445, "epoch": 2830} {"train_loss": -10.32196044921875, "global_step": 475446, "epoch": 2830} {"train_loss": -11.826166152954102, "global_step": 475447, "epoch": 2830} {"train_loss": -11.949286460876465, "global_step": 475448, "epoch": 2830} {"train_loss": -10.878366470336914, "global_step": 475449, "epoch": 2830} {"train_loss": -11.767260551452637, "global_step": 475450, "epoch": 2830} {"train_loss": -11.208359718322754, "global_step": 475451, "epoch": 2830} {"train_loss": -11.41153335571289, "global_step": 475452, "epoch": 2830} {"train_loss": -12.01806926727295, "global_step": 475453, "epoch": 2830} {"train_loss": -11.271404266357422, "global_step": 475454, "epoch": 2830} {"train_loss": -11.292468070983887, "global_step": 475455, "epoch": 2830} {"train_loss": -10.780668258666992, "global_step": 475456, "epoch": 2830} {"train_loss": -10.992037773132324, "global_step": 475457, "epoch": 2830} {"train_loss": -12.300880432128906, "global_step": 475458, "epoch": 2830} {"train_loss": -11.027202606201172, "global_step": 475459, "epoch": 2830} {"train_loss": -11.706894874572754, "global_step": 475460, "epoch": 2830} {"train_loss": -11.235273361206055, "global_step": 475461, "epoch": 2830} {"train_loss": -11.56105899810791, "global_step": 475462, "epoch": 2830} {"train_loss": -11.836626052856445, "global_step": 475463, "epoch": 2830} {"train_loss": -11.82978630065918, "global_step": 475464, "epoch": 2830} {"train_loss": -12.026873588562012, "global_step": 475465, "epoch": 2830} {"train_loss": -11.38776683807373, "global_step": 475466, "epoch": 2830} {"train_loss": -11.722108840942383, "global_step": 475467, "epoch": 2830} {"train_loss": -12.412303924560547, "global_step": 475468, "epoch": 2830} {"train_loss": -12.065185546875, "global_step": 475469, "epoch": 2830} {"train_loss": -11.807882308959961, "global_step": 475470, "epoch": 2830} {"train_loss": -11.842323303222656, "global_step": 475471, "epoch": 2830} {"train_loss": -12.110118865966797, "global_step": 475472, "epoch": 2830} {"train_loss": -12.382782936096191, "global_step": 475473, "epoch": 2830} {"train_loss": -11.927677154541016, "global_step": 475474, "epoch": 2830} {"train_loss": -12.02781867980957, "global_step": 475475, "epoch": 2830} {"train_loss": -12.46783447265625, "global_step": 475476, "epoch": 2830} {"train_loss": -12.299274444580078, "global_step": 475477, "epoch": 2830} {"train_loss": -12.505115509033203, "global_step": 475478, "epoch": 2830} {"train_loss": -12.453166961669922, "global_step": 475479, "epoch": 2830} {"train_loss": -12.177776336669922, "global_step": 475480, "epoch": 2830} {"train_loss": -12.446911811828613, "global_step": 475481, "epoch": 2830} {"train_loss": -12.386350631713867, "global_step": 475482, "epoch": 2830} {"train_loss": -12.316802978515625, "global_step": 475483, "epoch": 2830} {"train_loss": -12.423746109008789, "global_step": 475484, "epoch": 2830} {"train_loss": -12.441234588623047, "global_step": 475485, "epoch": 2830} {"train_loss": -12.162742614746094, "global_step": 475486, "epoch": 2830} {"train_loss": -12.42635726928711, "global_step": 475487, "epoch": 2830} {"train_loss": -12.33697509765625, "global_step": 475488, "epoch": 2830} {"train_loss": -12.514646530151367, "global_step": 475489, "epoch": 2830} {"train_loss": -12.500066757202148, "global_step": 475490, "epoch": 2830} {"train_loss": -12.491350173950195, "global_step": 475491, "epoch": 2830} {"train_loss": -12.442042350769043, "global_step": 475492, "epoch": 2830} {"train_loss": -12.620702743530273, "global_step": 475493, "epoch": 2830} {"train_loss": -12.560443878173828, "global_step": 475494, "epoch": 2830} {"train_loss": -12.539657592773438, "global_step": 475495, "epoch": 2830} {"train_loss": -12.712672233581543, "global_step": 475496, "epoch": 2830} {"train_loss": -12.771669387817383, "global_step": 475497, "epoch": 2830} {"train_loss": -12.68862533569336, "global_step": 475498, "epoch": 2830} {"train_loss": -12.84587287902832, "global_step": 475499, "epoch": 2830} {"train_loss": -12.648917198181152, "global_step": 475500, "epoch": 2830} {"train_loss": -12.725563049316406, "global_step": 475501, "epoch": 2830} {"train_loss": -12.94999885559082, "global_step": 475502, "epoch": 2830} {"train_loss": -12.834917068481445, "global_step": 475503, "epoch": 2830} {"train_loss": -12.651611328125, "global_step": 475504, "epoch": 2830} {"train_loss": -12.630569458007812, "global_step": 475505, "epoch": 2830} {"train_loss": -12.488090515136719, "global_step": 475506, "epoch": 2830} {"train_loss": -12.843719482421875, "global_step": 475507, "epoch": 2830} {"train_loss": -12.715404510498047, "global_step": 475508, "epoch": 2830} {"train_loss": -12.493906021118164, "global_step": 475509, "epoch": 2830} {"train_loss": -12.926980972290039, "global_step": 475510, "epoch": 2830} {"train_loss": -12.466087341308594, "global_step": 475511, "epoch": 2830} {"train_loss": -12.660466194152832, "global_step": 475512, "epoch": 2830} {"train_loss": -12.554938316345215, "global_step": 475513, "epoch": 2830} {"train_loss": -12.566533088684082, "global_step": 475514, "epoch": 2830} {"train_loss": -12.619209289550781, "global_step": 475515, "epoch": 2830} {"train_loss": -13.03162956237793, "global_step": 475516, "epoch": 2830} {"train_loss": -12.604390144348145, "global_step": 475517, "epoch": 2830} {"train_loss": -12.801054000854492, "global_step": 475518, "epoch": 2830} {"train_loss": -12.728662490844727, "global_step": 475519, "epoch": 2830} {"train_loss": -12.890859603881836, "global_step": 475520, "epoch": 2830} {"train_loss": -12.928313255310059, "global_step": 475521, "epoch": 2830} {"train_loss": -12.581306457519531, "global_step": 475522, "epoch": 2830} {"train_loss": -12.69119644165039, "global_step": 475523, "epoch": 2830} {"train_loss": -12.876460075378418, "global_step": 475524, "epoch": 2830} {"train_loss": -12.87773609161377, "global_step": 475525, "epoch": 2830} {"train_loss": -12.526200294494629, "global_step": 475526, "epoch": 2830} {"train_loss": -12.954471588134766, "global_step": 475527, "epoch": 2830} {"train_loss": -12.78523063659668, "global_step": 475528, "epoch": 2830} {"train_loss": -12.749470710754395, "global_step": 475529, "epoch": 2830} {"train_loss": -12.814298629760742, "global_step": 475530, "epoch": 2830} {"train_loss": -12.52022933959961, "global_step": 475531, "epoch": 2830} {"train_loss": -12.567261695861816, "global_step": 475532, "epoch": 2830} {"train_loss": -12.69314193725586, "global_step": 475533, "epoch": 2830} {"train_loss": -12.714217185974121, "global_step": 475534, "epoch": 2830} {"train_loss": -12.885577201843262, "global_step": 475535, "epoch": 2830} {"train_loss": -12.828508377075195, "global_step": 475536, "epoch": 2830} {"train_loss": -12.783388137817383, "global_step": 475537, "epoch": 2830} {"train_loss": -12.119446754455566, "global_step": 475538, "epoch": 2830} {"train_loss": -12.732911109924316, "global_step": 475539, "epoch": 2830} {"train_loss": -12.3349609375, "global_step": 475540, "epoch": 2830} {"train_loss": -12.898740768432617, "global_step": 475541, "epoch": 2830} {"train_loss": -12.664905548095703, "global_step": 475542, "epoch": 2830} {"train_loss": -12.631685256958008, "global_step": 475543, "epoch": 2830} {"train_loss": -12.52787971496582, "global_step": 475544, "epoch": 2830} {"train_loss": -12.774038314819336, "global_step": 475545, "epoch": 2830} {"train_loss": -12.402641296386719, "global_step": 475546, "epoch": 2830} {"train_loss": -12.372200012207031, "global_step": 475547, "epoch": 2830} {"train_loss": -12.580839157104492, "global_step": 475548, "epoch": 2830} {"train_loss": -12.866056442260742, "global_step": 475549, "epoch": 2830} {"train_loss": -12.705557823181152, "global_step": 475550, "epoch": 2830} {"train_loss": -12.72542667388916, "global_step": 475551, "epoch": 2830} {"train_loss": -12.810511589050293, "global_step": 475552, "epoch": 2830} {"train_loss": -12.916595458984375, "global_step": 475553, "epoch": 2830} {"train_loss": -12.662809371948242, "global_step": 475554, "epoch": 2830} {"train_loss": -12.808208465576172, "global_step": 475555, "epoch": 2830} {"train_loss": -12.394289016723633, "global_step": 475556, "epoch": 2830} {"train_loss": -12.676026344299316, "global_step": 475557, "epoch": 2830} {"train_loss": -11.89339542388916, "global_step": 475558, "epoch": 2830} {"train_loss": -12.104496002197266, "global_step": 475559, "epoch": 2830} {"train_loss": -12.022104263305664, "global_step": 475560, "epoch": 2830} {"train_loss": -11.684033393859863, "global_step": 475561, "epoch": 2830} {"train_loss": -11.414628028869629, "global_step": 475562, "epoch": 2830} {"train_loss": -12.706464767456055, "global_step": 475563, "epoch": 2830} {"train_loss": -12.07608413696289, "global_step": 475564, "epoch": 2830} {"train_loss": -11.577018737792969, "global_step": 475565, "epoch": 2830} {"train_loss": -11.55592155456543, "global_step": 475566, "epoch": 2830} {"train_loss": -12.061175346374512, "global_step": 475567, "epoch": 2830} {"train_loss": -11.618951797485352, "global_step": 475568, "epoch": 2830} {"train_loss": -11.960208892822266, "global_step": 475569, "epoch": 2830} {"train_loss": -11.734939575195312, "global_step": 475570, "epoch": 2830} {"train_loss": -11.339578628540039, "global_step": 475571, "epoch": 2830} {"train_loss": -11.45161247253418, "global_step": 475572, "epoch": 2830} {"train_loss": -12.171745300292969, "global_step": 475573, "epoch": 2830} {"train_loss": -11.555968284606934, "global_step": 475574, "epoch": 2830} {"train_loss": -11.618766784667969, "global_step": 475575, "epoch": 2830} {"train_loss": -12.126367568969727, "global_step": 475576, "epoch": 2830} {"train_loss": -10.905610084533691, "global_step": 475577, "epoch": 2830} {"train_loss": -11.616960525512695, "global_step": 475578, "epoch": 2830} {"train_loss": -11.731826782226562, "global_step": 475579, "epoch": 2830} {"train_loss": -10.815444946289062, "global_step": 475580, "epoch": 2830} {"train_loss": -11.891478538513184, "global_step": 475581, "epoch": 2830} {"train_loss": -11.410621643066406, "global_step": 475582, "epoch": 2830} {"train_loss": -11.449481964111328, "global_step": 475583, "epoch": 2830} {"train_loss": -10.69817066192627, "global_step": 475584, "epoch": 2830} {"train_loss": -11.193017959594727, "global_step": 475585, "epoch": 2830} {"train_loss": -11.654816627502441, "global_step": 475586, "epoch": 2830} {"train_loss": -10.755132675170898, "global_step": 475587, "epoch": 2830} {"train_loss": -11.404985427856445, "global_step": 475588, "epoch": 2830} {"train_loss": -10.518074989318848, "global_step": 475589, "epoch": 2830} {"train_loss": -10.93077278137207, "global_step": 475590, "epoch": 2830} {"train_loss": -11.558778762817383, "global_step": 475591, "epoch": 2830} {"train_loss": -10.403966903686523, "global_step": 475592, "epoch": 2830} {"train_loss": -12.491830825805664, "global_step": 475593, "epoch": 2830} {"train_loss": -11.19939136505127, "global_step": 475594, "epoch": 2830} {"train_loss": -10.860089302062988, "global_step": 475595, "epoch": 2830} {"train_loss": -12.063981056213379, "global_step": 475596, "epoch": 2830} {"train_loss": -11.539194107055664, "global_step": 475597, "epoch": 2830} {"train_loss": -11.698356628417969, "global_step": 475598, "epoch": 2830} {"train_loss": -11.983243942260742, "global_step": 475599, "epoch": 2830} {"train_loss": -11.2091064453125, "global_step": 475600, "epoch": 2830} {"train_loss": -11.704263687133789, "global_step": 475601, "epoch": 2830} {"train_loss": -11.918516159057617, "global_step": 475602, "epoch": 2830} {"train_loss": -11.875114440917969, "global_step": 475603, "epoch": 2830} {"train_loss": -12.028369903564453, "global_step": 475604, "epoch": 2830} {"train_loss": -12.327995300292969, "global_step": 475605, "epoch": 2830} {"train_loss": -11.739803314208984, "global_step": 475606, "epoch": 2830} {"train_loss": -12.09051665805635, "global_step": 475607, "epoch": 2830, "val_loss": 319648.03125, "train_action_mse_error": 1.4208253622055054} {"train_loss": -11.3037109375, "global_step": 475608, "epoch": 2831} {"train_loss": -11.781761169433594, "global_step": 475609, "epoch": 2831} {"train_loss": -11.17123031616211, "global_step": 475610, "epoch": 2831} {"train_loss": -12.108256340026855, "global_step": 475611, "epoch": 2831} {"train_loss": -11.891075134277344, "global_step": 475612, "epoch": 2831} {"train_loss": -11.973447799682617, "global_step": 475613, "epoch": 2831} {"train_loss": -11.503079414367676, "global_step": 475614, "epoch": 2831} {"train_loss": -11.898298263549805, "global_step": 475615, "epoch": 2831} {"train_loss": -11.312093734741211, "global_step": 475616, "epoch": 2831} {"train_loss": -11.485548973083496, "global_step": 475617, "epoch": 2831} {"train_loss": -11.799520492553711, "global_step": 475618, "epoch": 2831} {"train_loss": -12.011338233947754, "global_step": 475619, "epoch": 2831} {"train_loss": -12.249332427978516, "global_step": 475620, "epoch": 2831} {"train_loss": -12.486349105834961, "global_step": 475621, "epoch": 2831} {"train_loss": -12.205650329589844, "global_step": 475622, "epoch": 2831} {"train_loss": -12.25375747680664, "global_step": 475623, "epoch": 2831} {"train_loss": -11.974088668823242, "global_step": 475624, "epoch": 2831} {"train_loss": -12.354921340942383, "global_step": 475625, "epoch": 2831} {"train_loss": -12.199610710144043, "global_step": 475626, "epoch": 2831} {"train_loss": -12.483978271484375, "global_step": 475627, "epoch": 2831} {"train_loss": -12.363179206848145, "global_step": 475628, "epoch": 2831} {"train_loss": -12.52822494506836, "global_step": 475629, "epoch": 2831} {"train_loss": -12.394084930419922, "global_step": 475630, "epoch": 2831} {"train_loss": -12.52354621887207, "global_step": 475631, "epoch": 2831} {"train_loss": -12.307977676391602, "global_step": 475632, "epoch": 2831} {"train_loss": -12.812891006469727, "global_step": 475633, "epoch": 2831} {"train_loss": -11.951181411743164, "global_step": 475634, "epoch": 2831} {"train_loss": -12.461740493774414, "global_step": 475635, "epoch": 2831} {"train_loss": -12.097017288208008, "global_step": 475636, "epoch": 2831} {"train_loss": -12.404901504516602, "global_step": 475637, "epoch": 2831} {"train_loss": -11.59200382232666, "global_step": 475638, "epoch": 2831} {"train_loss": -11.954060554504395, "global_step": 475639, "epoch": 2831} {"train_loss": -12.117149353027344, "global_step": 475640, "epoch": 2831} {"train_loss": -11.382606506347656, "global_step": 475641, "epoch": 2831} {"train_loss": -12.266019821166992, "global_step": 475642, "epoch": 2831} {"train_loss": -11.826679229736328, "global_step": 475643, "epoch": 2831} {"train_loss": -12.132978439331055, "global_step": 475644, "epoch": 2831} {"train_loss": -11.747488021850586, "global_step": 475645, "epoch": 2831} {"train_loss": -12.284612655639648, "global_step": 475646, "epoch": 2831} {"train_loss": -12.430824279785156, "global_step": 475647, "epoch": 2831} {"train_loss": -12.344627380371094, "global_step": 475648, "epoch": 2831} {"train_loss": -12.224233627319336, "global_step": 475649, "epoch": 2831} {"train_loss": -12.317525863647461, "global_step": 475650, "epoch": 2831} {"train_loss": -12.286354064941406, "global_step": 475651, "epoch": 2831} {"train_loss": -12.36655044555664, "global_step": 475652, "epoch": 2831} {"train_loss": -11.986472129821777, "global_step": 475653, "epoch": 2831} {"train_loss": -12.535316467285156, "global_step": 475654, "epoch": 2831} {"train_loss": -12.428091049194336, "global_step": 475655, "epoch": 2831} {"train_loss": -12.310526847839355, "global_step": 475656, "epoch": 2831} {"train_loss": -12.690163612365723, "global_step": 475657, "epoch": 2831} {"train_loss": -12.23597526550293, "global_step": 475658, "epoch": 2831} {"train_loss": -12.535149574279785, "global_step": 475659, "epoch": 2831} {"train_loss": -12.049318313598633, "global_step": 475660, "epoch": 2831} {"train_loss": -12.47786808013916, "global_step": 475661, "epoch": 2831} {"train_loss": -12.449565887451172, "global_step": 475662, "epoch": 2831} {"train_loss": -12.138129234313965, "global_step": 475663, "epoch": 2831} {"train_loss": -12.734542846679688, "global_step": 475664, "epoch": 2831} {"train_loss": -12.082805633544922, "global_step": 475665, "epoch": 2831} {"train_loss": -12.480666160583496, "global_step": 475666, "epoch": 2831} {"train_loss": -12.243629455566406, "global_step": 475667, "epoch": 2831} {"train_loss": -11.979450225830078, "global_step": 475668, "epoch": 2831} {"train_loss": -12.536161422729492, "global_step": 475669, "epoch": 2831} {"train_loss": -12.337337493896484, "global_step": 475670, "epoch": 2831} {"train_loss": -12.054153442382812, "global_step": 475671, "epoch": 2831} {"train_loss": -12.180508613586426, "global_step": 475672, "epoch": 2831} {"train_loss": -12.436387062072754, "global_step": 475673, "epoch": 2831} {"train_loss": -12.318880081176758, "global_step": 475674, "epoch": 2831} {"train_loss": -12.567329406738281, "global_step": 475675, "epoch": 2831} {"train_loss": -12.41446304321289, "global_step": 475676, "epoch": 2831} {"train_loss": -12.47551155090332, "global_step": 475677, "epoch": 2831} {"train_loss": -12.048995971679688, "global_step": 475678, "epoch": 2831} {"train_loss": -12.827147483825684, "global_step": 475679, "epoch": 2831} {"train_loss": -12.321025848388672, "global_step": 475680, "epoch": 2831} {"train_loss": -12.493919372558594, "global_step": 475681, "epoch": 2831} {"train_loss": -12.305353164672852, "global_step": 475682, "epoch": 2831} {"train_loss": -11.675008773803711, "global_step": 475683, "epoch": 2831} {"train_loss": -12.265586853027344, "global_step": 475684, "epoch": 2831} {"train_loss": -12.244548797607422, "global_step": 475685, "epoch": 2831} {"train_loss": -12.045536041259766, "global_step": 475686, "epoch": 2831} {"train_loss": -12.296034812927246, "global_step": 475687, "epoch": 2831} {"train_loss": -12.440195083618164, "global_step": 475688, "epoch": 2831} {"train_loss": -12.17077922821045, "global_step": 475689, "epoch": 2831} {"train_loss": -12.458166122436523, "global_step": 475690, "epoch": 2831} {"train_loss": -12.487472534179688, "global_step": 475691, "epoch": 2831} {"train_loss": -12.340230941772461, "global_step": 475692, "epoch": 2831} {"train_loss": -12.35801887512207, "global_step": 475693, "epoch": 2831} {"train_loss": -12.430766105651855, "global_step": 475694, "epoch": 2831} {"train_loss": -11.861392974853516, "global_step": 475695, "epoch": 2831} {"train_loss": -12.599775314331055, "global_step": 475696, "epoch": 2831} {"train_loss": -12.466371536254883, "global_step": 475697, "epoch": 2831} {"train_loss": -11.462627410888672, "global_step": 475698, "epoch": 2831} {"train_loss": -12.723055839538574, "global_step": 475699, "epoch": 2831} {"train_loss": -12.059477806091309, "global_step": 475700, "epoch": 2831} {"train_loss": -12.217824935913086, "global_step": 475701, "epoch": 2831} {"train_loss": -12.384912490844727, "global_step": 475702, "epoch": 2831} {"train_loss": -11.263248443603516, "global_step": 475703, "epoch": 2831} {"train_loss": -12.188074111938477, "global_step": 475704, "epoch": 2831} {"train_loss": -11.634510040283203, "global_step": 475705, "epoch": 2831} {"train_loss": -11.287908554077148, "global_step": 475706, "epoch": 2831} {"train_loss": -12.402202606201172, "global_step": 475707, "epoch": 2831} {"train_loss": -10.63448715209961, "global_step": 475708, "epoch": 2831} {"train_loss": -12.54134750366211, "global_step": 475709, "epoch": 2831} {"train_loss": -11.715165138244629, "global_step": 475710, "epoch": 2831} {"train_loss": -11.724977493286133, "global_step": 475711, "epoch": 2831} {"train_loss": -11.765430450439453, "global_step": 475712, "epoch": 2831} {"train_loss": -11.6156005859375, "global_step": 475713, "epoch": 2831} {"train_loss": -12.531936645507812, "global_step": 475714, "epoch": 2831} {"train_loss": -11.778517723083496, "global_step": 475715, "epoch": 2831} {"train_loss": -12.547158241271973, "global_step": 475716, "epoch": 2831} {"train_loss": -12.017278671264648, "global_step": 475717, "epoch": 2831} {"train_loss": -10.955842971801758, "global_step": 475718, "epoch": 2831} {"train_loss": -12.289859771728516, "global_step": 475719, "epoch": 2831} {"train_loss": -11.857595443725586, "global_step": 475720, "epoch": 2831} {"train_loss": -11.834064483642578, "global_step": 475721, "epoch": 2831} {"train_loss": -11.755868911743164, "global_step": 475722, "epoch": 2831} {"train_loss": -11.543304443359375, "global_step": 475723, "epoch": 2831} {"train_loss": -11.60389518737793, "global_step": 475724, "epoch": 2831} {"train_loss": -11.88325309753418, "global_step": 475725, "epoch": 2831} {"train_loss": -11.850994110107422, "global_step": 475726, "epoch": 2831} {"train_loss": -10.997498512268066, "global_step": 475727, "epoch": 2831} {"train_loss": -10.849796295166016, "global_step": 475728, "epoch": 2831} {"train_loss": -11.055896759033203, "global_step": 475729, "epoch": 2831} {"train_loss": -11.333819389343262, "global_step": 475730, "epoch": 2831} {"train_loss": -11.79831314086914, "global_step": 475731, "epoch": 2831} {"train_loss": -11.318794250488281, "global_step": 475732, "epoch": 2831} {"train_loss": -11.596168518066406, "global_step": 475733, "epoch": 2831} {"train_loss": -11.510857582092285, "global_step": 475734, "epoch": 2831} {"train_loss": -11.759653091430664, "global_step": 475735, "epoch": 2831} {"train_loss": -10.968668937683105, "global_step": 475736, "epoch": 2831} {"train_loss": -11.949790000915527, "global_step": 475737, "epoch": 2831} {"train_loss": -11.707317352294922, "global_step": 475738, "epoch": 2831} {"train_loss": -11.712748527526855, "global_step": 475739, "epoch": 2831} {"train_loss": -12.076704978942871, "global_step": 475740, "epoch": 2831} {"train_loss": -11.977056503295898, "global_step": 475741, "epoch": 2831} {"train_loss": -12.104808807373047, "global_step": 475742, "epoch": 2831} {"train_loss": -12.336792945861816, "global_step": 475743, "epoch": 2831} {"train_loss": -12.029986381530762, "global_step": 475744, "epoch": 2831} {"train_loss": -12.136194229125977, "global_step": 475745, "epoch": 2831} {"train_loss": -12.195446014404297, "global_step": 475746, "epoch": 2831} {"train_loss": -12.187027931213379, "global_step": 475747, "epoch": 2831} {"train_loss": -12.439434051513672, "global_step": 475748, "epoch": 2831} {"train_loss": -12.559549331665039, "global_step": 475749, "epoch": 2831} {"train_loss": -12.236383438110352, "global_step": 475750, "epoch": 2831} {"train_loss": -12.367971420288086, "global_step": 475751, "epoch": 2831} {"train_loss": -12.175750732421875, "global_step": 475752, "epoch": 2831} {"train_loss": -12.340253829956055, "global_step": 475753, "epoch": 2831} {"train_loss": -12.719064712524414, "global_step": 475754, "epoch": 2831} {"train_loss": -12.268342971801758, "global_step": 475755, "epoch": 2831} {"train_loss": -12.525455474853516, "global_step": 475756, "epoch": 2831} {"train_loss": -12.016143798828125, "global_step": 475757, "epoch": 2831} {"train_loss": -12.312965393066406, "global_step": 475758, "epoch": 2831} {"train_loss": -12.59129524230957, "global_step": 475759, "epoch": 2831} {"train_loss": -12.249164581298828, "global_step": 475760, "epoch": 2831} {"train_loss": -12.250985145568848, "global_step": 475761, "epoch": 2831} {"train_loss": -12.372149467468262, "global_step": 475762, "epoch": 2831} {"train_loss": -12.171579360961914, "global_step": 475763, "epoch": 2831} {"train_loss": -12.359067916870117, "global_step": 475764, "epoch": 2831} {"train_loss": -12.500377655029297, "global_step": 475765, "epoch": 2831} {"train_loss": -12.074556350708008, "global_step": 475766, "epoch": 2831} {"train_loss": -12.59525203704834, "global_step": 475767, "epoch": 2831} {"train_loss": -12.531916618347168, "global_step": 475768, "epoch": 2831} {"train_loss": -12.531518936157227, "global_step": 475769, "epoch": 2831} {"train_loss": -12.989356994628906, "global_step": 475770, "epoch": 2831} {"train_loss": -12.48554801940918, "global_step": 475771, "epoch": 2831} {"train_loss": -12.660459518432617, "global_step": 475772, "epoch": 2831} {"train_loss": -12.851737022399902, "global_step": 475773, "epoch": 2831} {"train_loss": -12.59602165222168, "global_step": 475774, "epoch": 2831} {"train_loss": -12.123716853913807, "global_step": 475775, "epoch": 2831, "val_loss": 316074.65625} {"train_loss": -12.563796043395996, "global_step": 475776, "epoch": 2832} {"train_loss": -12.524187088012695, "global_step": 475777, "epoch": 2832} {"train_loss": -12.570805549621582, "global_step": 475778, "epoch": 2832} {"train_loss": -12.757678985595703, "global_step": 475779, "epoch": 2832} {"train_loss": -12.647064208984375, "global_step": 475780, "epoch": 2832} {"train_loss": -12.67715835571289, "global_step": 475781, "epoch": 2832} {"train_loss": -12.691424369812012, "global_step": 475782, "epoch": 2832} {"train_loss": -12.706710815429688, "global_step": 475783, "epoch": 2832} {"train_loss": -12.71986198425293, "global_step": 475784, "epoch": 2832} {"train_loss": -12.685522079467773, "global_step": 475785, "epoch": 2832} {"train_loss": -12.839138984680176, "global_step": 475786, "epoch": 2832} {"train_loss": -12.757613182067871, "global_step": 475787, "epoch": 2832} {"train_loss": -12.588279724121094, "global_step": 475788, "epoch": 2832} {"train_loss": -12.782085418701172, "global_step": 475789, "epoch": 2832} {"train_loss": -12.689579010009766, "global_step": 475790, "epoch": 2832} {"train_loss": -12.816486358642578, "global_step": 475791, "epoch": 2832} {"train_loss": -12.852949142456055, "global_step": 475792, "epoch": 2832} {"train_loss": -12.653634071350098, "global_step": 475793, "epoch": 2832} {"train_loss": -12.836357116699219, "global_step": 475794, "epoch": 2832} {"train_loss": -12.696746826171875, "global_step": 475795, "epoch": 2832} {"train_loss": -13.04311752319336, "global_step": 475796, "epoch": 2832} {"train_loss": -12.838996887207031, "global_step": 475797, "epoch": 2832} {"train_loss": -12.823060989379883, "global_step": 475798, "epoch": 2832} {"train_loss": -12.952169418334961, "global_step": 475799, "epoch": 2832} {"train_loss": -13.005356788635254, "global_step": 475800, "epoch": 2832} {"train_loss": -12.912720680236816, "global_step": 475801, "epoch": 2832} {"train_loss": -12.828425407409668, "global_step": 475802, "epoch": 2832} {"train_loss": -12.632614135742188, "global_step": 475803, "epoch": 2832} {"train_loss": -12.830854415893555, "global_step": 475804, "epoch": 2832} {"train_loss": -12.760791778564453, "global_step": 475805, "epoch": 2832} {"train_loss": -12.669913291931152, "global_step": 475806, "epoch": 2832} {"train_loss": -12.904305458068848, "global_step": 475807, "epoch": 2832} {"train_loss": -12.744894027709961, "global_step": 475808, "epoch": 2832} {"train_loss": -13.045675277709961, "global_step": 475809, "epoch": 2832} {"train_loss": -12.811857223510742, "global_step": 475810, "epoch": 2832} {"train_loss": -12.669387817382812, "global_step": 475811, "epoch": 2832} {"train_loss": -12.958839416503906, "global_step": 475812, "epoch": 2832} {"train_loss": -13.068904876708984, "global_step": 475813, "epoch": 2832} {"train_loss": -12.919632911682129, "global_step": 475814, "epoch": 2832} {"train_loss": -12.792016983032227, "global_step": 475815, "epoch": 2832} {"train_loss": -13.038751602172852, "global_step": 475816, "epoch": 2832} {"train_loss": -12.930461883544922, "global_step": 475817, "epoch": 2832} {"train_loss": -13.08765983581543, "global_step": 475818, "epoch": 2832} {"train_loss": -13.033860206604004, "global_step": 475819, "epoch": 2832} {"train_loss": -12.872579574584961, "global_step": 475820, "epoch": 2832} {"train_loss": -12.968622207641602, "global_step": 475821, "epoch": 2832} {"train_loss": -13.098943710327148, "global_step": 475822, "epoch": 2832} {"train_loss": -12.772027969360352, "global_step": 475823, "epoch": 2832} {"train_loss": -13.138650894165039, "global_step": 475824, "epoch": 2832} {"train_loss": -12.835588455200195, "global_step": 475825, "epoch": 2832} {"train_loss": -12.721899032592773, "global_step": 475826, "epoch": 2832} {"train_loss": -13.09736442565918, "global_step": 475827, "epoch": 2832} {"train_loss": -12.854212760925293, "global_step": 475828, "epoch": 2832} {"train_loss": -12.839523315429688, "global_step": 475829, "epoch": 2832} {"train_loss": -12.683685302734375, "global_step": 475830, "epoch": 2832} {"train_loss": -13.206334114074707, "global_step": 475831, "epoch": 2832} {"train_loss": -12.753074645996094, "global_step": 475832, "epoch": 2832} {"train_loss": -13.05127239227295, "global_step": 475833, "epoch": 2832} {"train_loss": -13.162797927856445, "global_step": 475834, "epoch": 2832} {"train_loss": -13.135238647460938, "global_step": 475835, "epoch": 2832} {"train_loss": -12.995706558227539, "global_step": 475836, "epoch": 2832} {"train_loss": -13.070521354675293, "global_step": 475837, "epoch": 2832} {"train_loss": -13.224119186401367, "global_step": 475838, "epoch": 2832} {"train_loss": -12.881422996520996, "global_step": 475839, "epoch": 2832} {"train_loss": -12.793668746948242, "global_step": 475840, "epoch": 2832} {"train_loss": -12.826797485351562, "global_step": 475841, "epoch": 2832} {"train_loss": -12.985177993774414, "global_step": 475842, "epoch": 2832} {"train_loss": -12.058032989501953, "global_step": 475843, "epoch": 2832} {"train_loss": -10.181507110595703, "global_step": 475844, "epoch": 2832} {"train_loss": -11.466453552246094, "global_step": 475845, "epoch": 2832} {"train_loss": -11.018904685974121, "global_step": 475846, "epoch": 2832} {"train_loss": -11.38853645324707, "global_step": 475847, "epoch": 2832} {"train_loss": -10.725035667419434, "global_step": 475848, "epoch": 2832} {"train_loss": -7.987884521484375, "global_step": 475849, "epoch": 2832} {"train_loss": -8.516817092895508, "global_step": 475850, "epoch": 2832} {"train_loss": -8.574146270751953, "global_step": 475851, "epoch": 2832} {"train_loss": -7.85923433303833, "global_step": 475852, "epoch": 2832} {"train_loss": -9.304913520812988, "global_step": 475853, "epoch": 2832} {"train_loss": -9.269247055053711, "global_step": 475854, "epoch": 2832} {"train_loss": -10.420866966247559, "global_step": 475855, "epoch": 2832} {"train_loss": -9.437520980834961, "global_step": 475856, "epoch": 2832} {"train_loss": -9.570159912109375, "global_step": 475857, "epoch": 2832} {"train_loss": -9.275354385375977, "global_step": 475858, "epoch": 2832} {"train_loss": -9.881702423095703, "global_step": 475859, "epoch": 2832} {"train_loss": -10.336349487304688, "global_step": 475860, "epoch": 2832} {"train_loss": -9.15898323059082, "global_step": 475861, "epoch": 2832} {"train_loss": -10.686384201049805, "global_step": 475862, "epoch": 2832} {"train_loss": -11.484572410583496, "global_step": 475863, "epoch": 2832} {"train_loss": -10.370819091796875, "global_step": 475864, "epoch": 2832} {"train_loss": -10.775035858154297, "global_step": 475865, "epoch": 2832} {"train_loss": -11.27696418762207, "global_step": 475866, "epoch": 2832} {"train_loss": -10.444345474243164, "global_step": 475867, "epoch": 2832} {"train_loss": -10.50804328918457, "global_step": 475868, "epoch": 2832} {"train_loss": -11.380284309387207, "global_step": 475869, "epoch": 2832} {"train_loss": -12.091498374938965, "global_step": 475870, "epoch": 2832} {"train_loss": -11.453144073486328, "global_step": 475871, "epoch": 2832} {"train_loss": -11.15475845336914, "global_step": 475872, "epoch": 2832} {"train_loss": -11.733896255493164, "global_step": 475873, "epoch": 2832} {"train_loss": -11.561517715454102, "global_step": 475874, "epoch": 2832} {"train_loss": -11.135692596435547, "global_step": 475875, "epoch": 2832} {"train_loss": -12.156791687011719, "global_step": 475876, "epoch": 2832} {"train_loss": -11.646787643432617, "global_step": 475877, "epoch": 2832} {"train_loss": -11.79554557800293, "global_step": 475878, "epoch": 2832} {"train_loss": -12.041959762573242, "global_step": 475879, "epoch": 2832} {"train_loss": -11.915149688720703, "global_step": 475880, "epoch": 2832} {"train_loss": -12.117777824401855, "global_step": 475881, "epoch": 2832} {"train_loss": -11.865583419799805, "global_step": 475882, "epoch": 2832} {"train_loss": -12.080395698547363, "global_step": 475883, "epoch": 2832} {"train_loss": -11.82286262512207, "global_step": 475884, "epoch": 2832} {"train_loss": -12.111577033996582, "global_step": 475885, "epoch": 2832} {"train_loss": -12.403261184692383, "global_step": 475886, "epoch": 2832} {"train_loss": -12.143941879272461, "global_step": 475887, "epoch": 2832} {"train_loss": -12.200119972229004, "global_step": 475888, "epoch": 2832} {"train_loss": -12.3073091506958, "global_step": 475889, "epoch": 2832} {"train_loss": -12.033788681030273, "global_step": 475890, "epoch": 2832} {"train_loss": -12.25986099243164, "global_step": 475891, "epoch": 2832} {"train_loss": -11.749044418334961, "global_step": 475892, "epoch": 2832} {"train_loss": -12.062522888183594, "global_step": 475893, "epoch": 2832} {"train_loss": -12.220705032348633, "global_step": 475894, "epoch": 2832} {"train_loss": -12.284685134887695, "global_step": 475895, "epoch": 2832} {"train_loss": -12.399410247802734, "global_step": 475896, "epoch": 2832} {"train_loss": -12.556673049926758, "global_step": 475897, "epoch": 2832} {"train_loss": -12.209880828857422, "global_step": 475898, "epoch": 2832} {"train_loss": -12.298776626586914, "global_step": 475899, "epoch": 2832} {"train_loss": -12.200995445251465, "global_step": 475900, "epoch": 2832} {"train_loss": -12.46566104888916, "global_step": 475901, "epoch": 2832} {"train_loss": -12.575550079345703, "global_step": 475902, "epoch": 2832} {"train_loss": -12.321061134338379, "global_step": 475903, "epoch": 2832} {"train_loss": -12.521978378295898, "global_step": 475904, "epoch": 2832} {"train_loss": -12.653648376464844, "global_step": 475905, "epoch": 2832} {"train_loss": -12.522924423217773, "global_step": 475906, "epoch": 2832} {"train_loss": -12.529613494873047, "global_step": 475907, "epoch": 2832} {"train_loss": -12.25556468963623, "global_step": 475908, "epoch": 2832} {"train_loss": -12.882837295532227, "global_step": 475909, "epoch": 2832} {"train_loss": -12.570066452026367, "global_step": 475910, "epoch": 2832} {"train_loss": -12.458466529846191, "global_step": 475911, "epoch": 2832} {"train_loss": -12.608455657958984, "global_step": 475912, "epoch": 2832} {"train_loss": -12.669234275817871, "global_step": 475913, "epoch": 2832} {"train_loss": -12.559394836425781, "global_step": 475914, "epoch": 2832} {"train_loss": -12.797416687011719, "global_step": 475915, "epoch": 2832} {"train_loss": -12.663568496704102, "global_step": 475916, "epoch": 2832} {"train_loss": -12.862310409545898, "global_step": 475917, "epoch": 2832} {"train_loss": -12.70407485961914, "global_step": 475918, "epoch": 2832} {"train_loss": -12.720531463623047, "global_step": 475919, "epoch": 2832} {"train_loss": -12.803657531738281, "global_step": 475920, "epoch": 2832} {"train_loss": -12.737509727478027, "global_step": 475921, "epoch": 2832} {"train_loss": -12.543365478515625, "global_step": 475922, "epoch": 2832} {"train_loss": -12.717766761779785, "global_step": 475923, "epoch": 2832} {"train_loss": -12.760331153869629, "global_step": 475924, "epoch": 2832} {"train_loss": -12.730228424072266, "global_step": 475925, "epoch": 2832} {"train_loss": -12.772649765014648, "global_step": 475926, "epoch": 2832} {"train_loss": -12.831705093383789, "global_step": 475927, "epoch": 2832} {"train_loss": -12.861740112304688, "global_step": 475928, "epoch": 2832} {"train_loss": -12.678686141967773, "global_step": 475929, "epoch": 2832} {"train_loss": -12.882184982299805, "global_step": 475930, "epoch": 2832} {"train_loss": -12.718952178955078, "global_step": 475931, "epoch": 2832} {"train_loss": -12.899596214294434, "global_step": 475932, "epoch": 2832} {"train_loss": -12.722689628601074, "global_step": 475933, "epoch": 2832} {"train_loss": -12.48157024383545, "global_step": 475934, "epoch": 2832} {"train_loss": -12.765579223632812, "global_step": 475935, "epoch": 2832} {"train_loss": -12.872414588928223, "global_step": 475936, "epoch": 2832} {"train_loss": -12.403045654296875, "global_step": 475937, "epoch": 2832} {"train_loss": -12.667991638183594, "global_step": 475938, "epoch": 2832} {"train_loss": -12.817892074584961, "global_step": 475939, "epoch": 2832} {"train_loss": -12.555517196655273, "global_step": 475940, "epoch": 2832} {"train_loss": -12.491500854492188, "global_step": 475941, "epoch": 2832} {"train_loss": -12.654703140258789, "global_step": 475942, "epoch": 2832} {"train_loss": -12.207975589093708, "global_step": 475943, "epoch": 2832, "val_loss": 316798.6875} {"train_loss": -11.46318244934082, "global_step": 475944, "epoch": 2833} {"train_loss": -11.036264419555664, "global_step": 475945, "epoch": 2833} {"train_loss": -11.552095413208008, "global_step": 475946, "epoch": 2833} {"train_loss": -12.677533149719238, "global_step": 475947, "epoch": 2833} {"train_loss": -10.55811882019043, "global_step": 475948, "epoch": 2833} {"train_loss": -12.285321235656738, "global_step": 475949, "epoch": 2833} {"train_loss": -11.30716323852539, "global_step": 475950, "epoch": 2833} {"train_loss": -10.69612979888916, "global_step": 475951, "epoch": 2833} {"train_loss": -11.110904693603516, "global_step": 475952, "epoch": 2833} {"train_loss": -10.547045707702637, "global_step": 475953, "epoch": 2833} {"train_loss": -11.512834548950195, "global_step": 475954, "epoch": 2833} {"train_loss": -10.15916633605957, "global_step": 475955, "epoch": 2833} {"train_loss": -9.921632766723633, "global_step": 475956, "epoch": 2833} {"train_loss": -10.670894622802734, "global_step": 475957, "epoch": 2833} {"train_loss": -11.576957702636719, "global_step": 475958, "epoch": 2833} {"train_loss": -11.641227722167969, "global_step": 475959, "epoch": 2833} {"train_loss": -11.151689529418945, "global_step": 475960, "epoch": 2833} {"train_loss": -11.233955383300781, "global_step": 475961, "epoch": 2833} {"train_loss": -9.562346458435059, "global_step": 475962, "epoch": 2833} {"train_loss": -12.130243301391602, "global_step": 475963, "epoch": 2833} {"train_loss": -9.992586135864258, "global_step": 475964, "epoch": 2833} {"train_loss": -9.28615951538086, "global_step": 475965, "epoch": 2833} {"train_loss": -11.361671447753906, "global_step": 475966, "epoch": 2833} {"train_loss": -9.372346878051758, "global_step": 475967, "epoch": 2833} {"train_loss": -9.41236400604248, "global_step": 475968, "epoch": 2833} {"train_loss": -9.152477264404297, "global_step": 475969, "epoch": 2833} {"train_loss": -11.260784149169922, "global_step": 475970, "epoch": 2833} {"train_loss": -9.682579040527344, "global_step": 475971, "epoch": 2833} {"train_loss": -11.508621215820312, "global_step": 475972, "epoch": 2833} {"train_loss": -9.654090881347656, "global_step": 475973, "epoch": 2833} {"train_loss": -11.126668930053711, "global_step": 475974, "epoch": 2833} {"train_loss": -11.431625366210938, "global_step": 475975, "epoch": 2833} {"train_loss": -11.068185806274414, "global_step": 475976, "epoch": 2833} {"train_loss": -11.949106216430664, "global_step": 475977, "epoch": 2833} {"train_loss": -11.156366348266602, "global_step": 475978, "epoch": 2833} {"train_loss": -11.319704055786133, "global_step": 475979, "epoch": 2833} {"train_loss": -11.25168514251709, "global_step": 475980, "epoch": 2833} {"train_loss": -11.295923233032227, "global_step": 475981, "epoch": 2833} {"train_loss": -11.704977035522461, "global_step": 475982, "epoch": 2833} {"train_loss": -11.764528274536133, "global_step": 475983, "epoch": 2833} {"train_loss": -12.202985763549805, "global_step": 475984, "epoch": 2833} {"train_loss": -11.04112720489502, "global_step": 475985, "epoch": 2833} {"train_loss": -11.957990646362305, "global_step": 475986, "epoch": 2833} {"train_loss": -10.44212532043457, "global_step": 475987, "epoch": 2833} {"train_loss": -11.863143920898438, "global_step": 475988, "epoch": 2833} {"train_loss": -11.189249038696289, "global_step": 475989, "epoch": 2833} {"train_loss": -11.441844940185547, "global_step": 475990, "epoch": 2833} {"train_loss": -11.935298919677734, "global_step": 475991, "epoch": 2833} {"train_loss": -11.021071434020996, "global_step": 475992, "epoch": 2833} {"train_loss": -11.71385669708252, "global_step": 475993, "epoch": 2833} {"train_loss": -12.31357192993164, "global_step": 475994, "epoch": 2833} {"train_loss": -11.702655792236328, "global_step": 475995, "epoch": 2833} {"train_loss": -12.235660552978516, "global_step": 475996, "epoch": 2833} {"train_loss": -12.006620407104492, "global_step": 475997, "epoch": 2833} {"train_loss": -12.095232009887695, "global_step": 475998, "epoch": 2833} {"train_loss": -12.37946891784668, "global_step": 475999, "epoch": 2833} {"train_loss": -12.153205871582031, "global_step": 476000, "epoch": 2833} {"train_loss": -12.394768714904785, "global_step": 476001, "epoch": 2833} {"train_loss": -12.330018997192383, "global_step": 476002, "epoch": 2833} {"train_loss": -12.1693754196167, "global_step": 476003, "epoch": 2833} {"train_loss": -12.330329895019531, "global_step": 476004, "epoch": 2833} {"train_loss": -12.157127380371094, "global_step": 476005, "epoch": 2833} {"train_loss": -12.45090103149414, "global_step": 476006, "epoch": 2833} {"train_loss": -12.398256301879883, "global_step": 476007, "epoch": 2833} {"train_loss": -12.155600547790527, "global_step": 476008, "epoch": 2833} {"train_loss": -12.53326416015625, "global_step": 476009, "epoch": 2833} {"train_loss": -12.281330108642578, "global_step": 476010, "epoch": 2833} {"train_loss": -12.255016326904297, "global_step": 476011, "epoch": 2833} {"train_loss": -12.210443496704102, "global_step": 476012, "epoch": 2833} {"train_loss": -12.157094955444336, "global_step": 476013, "epoch": 2833} {"train_loss": -12.429511070251465, "global_step": 476014, "epoch": 2833} {"train_loss": -12.170711517333984, "global_step": 476015, "epoch": 2833} {"train_loss": -12.398771286010742, "global_step": 476016, "epoch": 2833} {"train_loss": -12.477733612060547, "global_step": 476017, "epoch": 2833} {"train_loss": -12.392559051513672, "global_step": 476018, "epoch": 2833} {"train_loss": -12.324121475219727, "global_step": 476019, "epoch": 2833} {"train_loss": -12.109224319458008, "global_step": 476020, "epoch": 2833} {"train_loss": -12.506078720092773, "global_step": 476021, "epoch": 2833} {"train_loss": -12.165037155151367, "global_step": 476022, "epoch": 2833} {"train_loss": -12.525106430053711, "global_step": 476023, "epoch": 2833} {"train_loss": -12.160115242004395, "global_step": 476024, "epoch": 2833} {"train_loss": -12.408515930175781, "global_step": 476025, "epoch": 2833} {"train_loss": -12.166236877441406, "global_step": 476026, "epoch": 2833} {"train_loss": -12.607444763183594, "global_step": 476027, "epoch": 2833} {"train_loss": -12.16170597076416, "global_step": 476028, "epoch": 2833} {"train_loss": -12.426513671875, "global_step": 476029, "epoch": 2833} {"train_loss": -12.456859588623047, "global_step": 476030, "epoch": 2833} {"train_loss": -12.041194915771484, "global_step": 476031, "epoch": 2833} {"train_loss": -12.600813865661621, "global_step": 476032, "epoch": 2833} {"train_loss": -11.998739242553711, "global_step": 476033, "epoch": 2833} {"train_loss": -12.33696174621582, "global_step": 476034, "epoch": 2833} {"train_loss": -12.557268142700195, "global_step": 476035, "epoch": 2833} {"train_loss": -12.55681037902832, "global_step": 476036, "epoch": 2833} {"train_loss": -12.140079498291016, "global_step": 476037, "epoch": 2833} {"train_loss": -12.77048110961914, "global_step": 476038, "epoch": 2833} {"train_loss": -12.536018371582031, "global_step": 476039, "epoch": 2833} {"train_loss": -12.45102596282959, "global_step": 476040, "epoch": 2833} {"train_loss": -12.559651374816895, "global_step": 476041, "epoch": 2833} {"train_loss": -12.712006568908691, "global_step": 476042, "epoch": 2833} {"train_loss": -12.74044418334961, "global_step": 476043, "epoch": 2833} {"train_loss": -12.41031265258789, "global_step": 476044, "epoch": 2833} {"train_loss": -12.710330963134766, "global_step": 476045, "epoch": 2833} {"train_loss": -12.523065567016602, "global_step": 476046, "epoch": 2833} {"train_loss": -12.557883262634277, "global_step": 476047, "epoch": 2833} {"train_loss": -12.328241348266602, "global_step": 476048, "epoch": 2833} {"train_loss": -12.507048606872559, "global_step": 476049, "epoch": 2833} {"train_loss": -12.66610336303711, "global_step": 476050, "epoch": 2833} {"train_loss": -12.527841567993164, "global_step": 476051, "epoch": 2833} {"train_loss": -11.994366645812988, "global_step": 476052, "epoch": 2833} {"train_loss": -12.611120223999023, "global_step": 476053, "epoch": 2833} {"train_loss": -12.543136596679688, "global_step": 476054, "epoch": 2833} {"train_loss": -12.221780776977539, "global_step": 476055, "epoch": 2833} {"train_loss": -12.467015266418457, "global_step": 476056, "epoch": 2833} {"train_loss": -12.348532676696777, "global_step": 476057, "epoch": 2833} {"train_loss": -12.786957740783691, "global_step": 476058, "epoch": 2833} {"train_loss": -12.696572303771973, "global_step": 476059, "epoch": 2833} {"train_loss": -12.377240180969238, "global_step": 476060, "epoch": 2833} {"train_loss": -12.129865646362305, "global_step": 476061, "epoch": 2833} {"train_loss": -11.854072570800781, "global_step": 476062, "epoch": 2833} {"train_loss": -11.637297630310059, "global_step": 476063, "epoch": 2833} {"train_loss": -11.863788604736328, "global_step": 476064, "epoch": 2833} {"train_loss": -12.007160186767578, "global_step": 476065, "epoch": 2833} {"train_loss": -11.924139022827148, "global_step": 476066, "epoch": 2833} {"train_loss": -11.998306274414062, "global_step": 476067, "epoch": 2833} {"train_loss": -12.42347526550293, "global_step": 476068, "epoch": 2833} {"train_loss": -12.351333618164062, "global_step": 476069, "epoch": 2833} {"train_loss": -11.707294464111328, "global_step": 476070, "epoch": 2833} {"train_loss": -11.807974815368652, "global_step": 476071, "epoch": 2833} {"train_loss": -12.402690887451172, "global_step": 476072, "epoch": 2833} {"train_loss": -12.293392181396484, "global_step": 476073, "epoch": 2833} {"train_loss": -11.847908020019531, "global_step": 476074, "epoch": 2833} {"train_loss": -12.267301559448242, "global_step": 476075, "epoch": 2833} {"train_loss": -12.300789833068848, "global_step": 476076, "epoch": 2833} {"train_loss": -12.346461296081543, "global_step": 476077, "epoch": 2833} {"train_loss": -12.663339614868164, "global_step": 476078, "epoch": 2833} {"train_loss": -12.218585968017578, "global_step": 476079, "epoch": 2833} {"train_loss": -12.41663932800293, "global_step": 476080, "epoch": 2833} {"train_loss": -12.309774398803711, "global_step": 476081, "epoch": 2833} {"train_loss": -12.431709289550781, "global_step": 476082, "epoch": 2833} {"train_loss": -12.712373733520508, "global_step": 476083, "epoch": 2833} {"train_loss": -12.385063171386719, "global_step": 476084, "epoch": 2833} {"train_loss": -12.445091247558594, "global_step": 476085, "epoch": 2833} {"train_loss": -12.292533874511719, "global_step": 476086, "epoch": 2833} {"train_loss": -12.357841491699219, "global_step": 476087, "epoch": 2833} {"train_loss": -12.379669189453125, "global_step": 476088, "epoch": 2833} {"train_loss": -12.482454299926758, "global_step": 476089, "epoch": 2833} {"train_loss": -12.324291229248047, "global_step": 476090, "epoch": 2833} {"train_loss": -12.651884078979492, "global_step": 476091, "epoch": 2833} {"train_loss": -12.68390941619873, "global_step": 476092, "epoch": 2833} {"train_loss": -12.800684928894043, "global_step": 476093, "epoch": 2833} {"train_loss": -12.824807167053223, "global_step": 476094, "epoch": 2833} {"train_loss": -12.200389862060547, "global_step": 476095, "epoch": 2833} {"train_loss": -11.98887825012207, "global_step": 476096, "epoch": 2833} {"train_loss": -12.646012306213379, "global_step": 476097, "epoch": 2833} {"train_loss": -12.743070602416992, "global_step": 476098, "epoch": 2833} {"train_loss": -12.33204174041748, "global_step": 476099, "epoch": 2833} {"train_loss": -12.717039108276367, "global_step": 476100, "epoch": 2833} {"train_loss": -12.527933120727539, "global_step": 476101, "epoch": 2833} {"train_loss": -12.756233215332031, "global_step": 476102, "epoch": 2833} {"train_loss": -12.709732055664062, "global_step": 476103, "epoch": 2833} {"train_loss": -12.558571815490723, "global_step": 476104, "epoch": 2833} {"train_loss": -12.596362113952637, "global_step": 476105, "epoch": 2833} {"train_loss": -12.220504760742188, "global_step": 476106, "epoch": 2833} {"train_loss": -12.71918773651123, "global_step": 476107, "epoch": 2833} {"train_loss": -12.630538940429688, "global_step": 476108, "epoch": 2833} {"train_loss": -12.053258895874023, "global_step": 476109, "epoch": 2833} {"train_loss": -11.640433311462402, "global_step": 476110, "epoch": 2833} {"train_loss": -11.966221985362825, "global_step": 476111, "epoch": 2833, "val_loss": 315450.0} {"train_loss": -12.319292068481445, "global_step": 476112, "epoch": 2834} {"train_loss": -11.769235610961914, "global_step": 476113, "epoch": 2834} {"train_loss": -12.275561332702637, "global_step": 476114, "epoch": 2834} {"train_loss": -12.49374008178711, "global_step": 476115, "epoch": 2834} {"train_loss": -11.617015838623047, "global_step": 476116, "epoch": 2834} {"train_loss": -12.446956634521484, "global_step": 476117, "epoch": 2834} {"train_loss": -11.953857421875, "global_step": 476118, "epoch": 2834} {"train_loss": -12.355804443359375, "global_step": 476119, "epoch": 2834} {"train_loss": -12.282356262207031, "global_step": 476120, "epoch": 2834} {"train_loss": -12.642704963684082, "global_step": 476121, "epoch": 2834} {"train_loss": -12.394750595092773, "global_step": 476122, "epoch": 2834} {"train_loss": -12.765922546386719, "global_step": 476123, "epoch": 2834} {"train_loss": -12.45722484588623, "global_step": 476124, "epoch": 2834} {"train_loss": -12.501177787780762, "global_step": 476125, "epoch": 2834} {"train_loss": -12.527019500732422, "global_step": 476126, "epoch": 2834} {"train_loss": -12.873795509338379, "global_step": 476127, "epoch": 2834} {"train_loss": -12.636289596557617, "global_step": 476128, "epoch": 2834} {"train_loss": -12.514318466186523, "global_step": 476129, "epoch": 2834} {"train_loss": -12.525710105895996, "global_step": 476130, "epoch": 2834} {"train_loss": -12.685489654541016, "global_step": 476131, "epoch": 2834} {"train_loss": -12.464971542358398, "global_step": 476132, "epoch": 2834} {"train_loss": -12.501884460449219, "global_step": 476133, "epoch": 2834} {"train_loss": -12.411185264587402, "global_step": 476134, "epoch": 2834} {"train_loss": -11.973045349121094, "global_step": 476135, "epoch": 2834} {"train_loss": -12.428094863891602, "global_step": 476136, "epoch": 2834} {"train_loss": -12.170526504516602, "global_step": 476137, "epoch": 2834} {"train_loss": -12.747016906738281, "global_step": 476138, "epoch": 2834} {"train_loss": -12.00021743774414, "global_step": 476139, "epoch": 2834} {"train_loss": -12.247014999389648, "global_step": 476140, "epoch": 2834} {"train_loss": -12.505867958068848, "global_step": 476141, "epoch": 2834} {"train_loss": -12.319441795349121, "global_step": 476142, "epoch": 2834} {"train_loss": -12.55638313293457, "global_step": 476143, "epoch": 2834} {"train_loss": -12.202672958374023, "global_step": 476144, "epoch": 2834} {"train_loss": -12.312206268310547, "global_step": 476145, "epoch": 2834} {"train_loss": -12.61455249786377, "global_step": 476146, "epoch": 2834} {"train_loss": -12.411334037780762, "global_step": 476147, "epoch": 2834} {"train_loss": -12.894006729125977, "global_step": 476148, "epoch": 2834} {"train_loss": -12.151105880737305, "global_step": 476149, "epoch": 2834} {"train_loss": -11.854450225830078, "global_step": 476150, "epoch": 2834} {"train_loss": -12.283988952636719, "global_step": 476151, "epoch": 2834} {"train_loss": -11.779054641723633, "global_step": 476152, "epoch": 2834} {"train_loss": -11.466261863708496, "global_step": 476153, "epoch": 2834} {"train_loss": -12.559053421020508, "global_step": 476154, "epoch": 2834} {"train_loss": -12.426420211791992, "global_step": 476155, "epoch": 2834} {"train_loss": -12.677118301391602, "global_step": 476156, "epoch": 2834} {"train_loss": -12.533207893371582, "global_step": 476157, "epoch": 2834} {"train_loss": -12.475495338439941, "global_step": 476158, "epoch": 2834} {"train_loss": -12.729093551635742, "global_step": 476159, "epoch": 2834} {"train_loss": -12.231467247009277, "global_step": 476160, "epoch": 2834} {"train_loss": -12.189155578613281, "global_step": 476161, "epoch": 2834} {"train_loss": -12.44743537902832, "global_step": 476162, "epoch": 2834} {"train_loss": -12.359277725219727, "global_step": 476163, "epoch": 2834} {"train_loss": -12.05402946472168, "global_step": 476164, "epoch": 2834} {"train_loss": -12.390504837036133, "global_step": 476165, "epoch": 2834} {"train_loss": -12.299983024597168, "global_step": 476166, "epoch": 2834} {"train_loss": -12.378498077392578, "global_step": 476167, "epoch": 2834} {"train_loss": -12.290040016174316, "global_step": 476168, "epoch": 2834} {"train_loss": -12.354679107666016, "global_step": 476169, "epoch": 2834} {"train_loss": -12.368843078613281, "global_step": 476170, "epoch": 2834} {"train_loss": -12.562333106994629, "global_step": 476171, "epoch": 2834} {"train_loss": -12.178878784179688, "global_step": 476172, "epoch": 2834} {"train_loss": -12.66193675994873, "global_step": 476173, "epoch": 2834} {"train_loss": -12.2307710647583, "global_step": 476174, "epoch": 2834} {"train_loss": -12.574247360229492, "global_step": 476175, "epoch": 2834} {"train_loss": -12.880206108093262, "global_step": 476176, "epoch": 2834} {"train_loss": -12.786632537841797, "global_step": 476177, "epoch": 2834} {"train_loss": -12.570442199707031, "global_step": 476178, "epoch": 2834} {"train_loss": -12.780181884765625, "global_step": 476179, "epoch": 2834} {"train_loss": -12.675032615661621, "global_step": 476180, "epoch": 2834} {"train_loss": -12.66675090789795, "global_step": 476181, "epoch": 2834} {"train_loss": -12.748051643371582, "global_step": 476182, "epoch": 2834} {"train_loss": -12.585997581481934, "global_step": 476183, "epoch": 2834} {"train_loss": -12.82241439819336, "global_step": 476184, "epoch": 2834} {"train_loss": -12.69096565246582, "global_step": 476185, "epoch": 2834} {"train_loss": -12.919322967529297, "global_step": 476186, "epoch": 2834} {"train_loss": -12.539268493652344, "global_step": 476187, "epoch": 2834} {"train_loss": -12.9361572265625, "global_step": 476188, "epoch": 2834} {"train_loss": -12.654375076293945, "global_step": 476189, "epoch": 2834} {"train_loss": -12.716853141784668, "global_step": 476190, "epoch": 2834} {"train_loss": -12.814669609069824, "global_step": 476191, "epoch": 2834} {"train_loss": -12.662891387939453, "global_step": 476192, "epoch": 2834} {"train_loss": -12.667734146118164, "global_step": 476193, "epoch": 2834} {"train_loss": -12.602264404296875, "global_step": 476194, "epoch": 2834} {"train_loss": -12.801379203796387, "global_step": 476195, "epoch": 2834} {"train_loss": -12.933059692382812, "global_step": 476196, "epoch": 2834} {"train_loss": -12.70877456665039, "global_step": 476197, "epoch": 2834} {"train_loss": -12.767576217651367, "global_step": 476198, "epoch": 2834} {"train_loss": -12.802444458007812, "global_step": 476199, "epoch": 2834} {"train_loss": -12.871968269348145, "global_step": 476200, "epoch": 2834} {"train_loss": -12.40854549407959, "global_step": 476201, "epoch": 2834} {"train_loss": -12.819066047668457, "global_step": 476202, "epoch": 2834} {"train_loss": -12.747795104980469, "global_step": 476203, "epoch": 2834} {"train_loss": -12.061634063720703, "global_step": 476204, "epoch": 2834} {"train_loss": -11.736591339111328, "global_step": 476205, "epoch": 2834} {"train_loss": -12.482439994812012, "global_step": 476206, "epoch": 2834} {"train_loss": -12.861398696899414, "global_step": 476207, "epoch": 2834} {"train_loss": -12.294882774353027, "global_step": 476208, "epoch": 2834} {"train_loss": -12.699128150939941, "global_step": 476209, "epoch": 2834} {"train_loss": -12.891552925109863, "global_step": 476210, "epoch": 2834} {"train_loss": -12.991350173950195, "global_step": 476211, "epoch": 2834} {"train_loss": -12.452507019042969, "global_step": 476212, "epoch": 2834} {"train_loss": -12.39105224609375, "global_step": 476213, "epoch": 2834} {"train_loss": -12.759763717651367, "global_step": 476214, "epoch": 2834} {"train_loss": -12.45601749420166, "global_step": 476215, "epoch": 2834} {"train_loss": -12.936020851135254, "global_step": 476216, "epoch": 2834} {"train_loss": -12.141976356506348, "global_step": 476217, "epoch": 2834} {"train_loss": -12.200582504272461, "global_step": 476218, "epoch": 2834} {"train_loss": -12.62252426147461, "global_step": 476219, "epoch": 2834} {"train_loss": -11.667235374450684, "global_step": 476220, "epoch": 2834} {"train_loss": -12.182573318481445, "global_step": 476221, "epoch": 2834} {"train_loss": -11.183547973632812, "global_step": 476222, "epoch": 2834} {"train_loss": -12.45854377746582, "global_step": 476223, "epoch": 2834} {"train_loss": -11.766630172729492, "global_step": 476224, "epoch": 2834} {"train_loss": -12.350485801696777, "global_step": 476225, "epoch": 2834} {"train_loss": -11.565868377685547, "global_step": 476226, "epoch": 2834} {"train_loss": -12.340336799621582, "global_step": 476227, "epoch": 2834} {"train_loss": -10.854158401489258, "global_step": 476228, "epoch": 2834} {"train_loss": -12.585371017456055, "global_step": 476229, "epoch": 2834} {"train_loss": -10.917916297912598, "global_step": 476230, "epoch": 2834} {"train_loss": -12.027295112609863, "global_step": 476231, "epoch": 2834} {"train_loss": -10.70852279663086, "global_step": 476232, "epoch": 2834} {"train_loss": -10.886992454528809, "global_step": 476233, "epoch": 2834} {"train_loss": -11.841028213500977, "global_step": 476234, "epoch": 2834} {"train_loss": -9.399099349975586, "global_step": 476235, "epoch": 2834} {"train_loss": -9.538558006286621, "global_step": 476236, "epoch": 2834} {"train_loss": -11.791640281677246, "global_step": 476237, "epoch": 2834} {"train_loss": -9.886281967163086, "global_step": 476238, "epoch": 2834} {"train_loss": -9.10999584197998, "global_step": 476239, "epoch": 2834} {"train_loss": -9.137983322143555, "global_step": 476240, "epoch": 2834} {"train_loss": -11.360138893127441, "global_step": 476241, "epoch": 2834} {"train_loss": -8.385329246520996, "global_step": 476242, "epoch": 2834} {"train_loss": -10.047837257385254, "global_step": 476243, "epoch": 2834} {"train_loss": -10.7811918258667, "global_step": 476244, "epoch": 2834} {"train_loss": -9.902596473693848, "global_step": 476245, "epoch": 2834} {"train_loss": -10.246831893920898, "global_step": 476246, "epoch": 2834} {"train_loss": -11.038304328918457, "global_step": 476247, "epoch": 2834} {"train_loss": -10.815589904785156, "global_step": 476248, "epoch": 2834} {"train_loss": -11.949188232421875, "global_step": 476249, "epoch": 2834} {"train_loss": -11.576482772827148, "global_step": 476250, "epoch": 2834} {"train_loss": -9.892934799194336, "global_step": 476251, "epoch": 2834} {"train_loss": -12.114603996276855, "global_step": 476252, "epoch": 2834} {"train_loss": -10.98225212097168, "global_step": 476253, "epoch": 2834} {"train_loss": -10.503185272216797, "global_step": 476254, "epoch": 2834} {"train_loss": -11.726428985595703, "global_step": 476255, "epoch": 2834} {"train_loss": -10.885200500488281, "global_step": 476256, "epoch": 2834} {"train_loss": -10.296789169311523, "global_step": 476257, "epoch": 2834} {"train_loss": -11.57386589050293, "global_step": 476258, "epoch": 2834} {"train_loss": -11.744160652160645, "global_step": 476259, "epoch": 2834} {"train_loss": -10.93310546875, "global_step": 476260, "epoch": 2834} {"train_loss": -12.213730812072754, "global_step": 476261, "epoch": 2834} {"train_loss": -11.208561897277832, "global_step": 476262, "epoch": 2834} {"train_loss": -11.562784194946289, "global_step": 476263, "epoch": 2834} {"train_loss": -11.826265335083008, "global_step": 476264, "epoch": 2834} {"train_loss": -11.071002960205078, "global_step": 476265, "epoch": 2834} {"train_loss": -11.985713005065918, "global_step": 476266, "epoch": 2834} {"train_loss": -11.849127769470215, "global_step": 476267, "epoch": 2834} {"train_loss": -11.913467407226562, "global_step": 476268, "epoch": 2834} {"train_loss": -12.217399597167969, "global_step": 476269, "epoch": 2834} {"train_loss": -11.808591842651367, "global_step": 476270, "epoch": 2834} {"train_loss": -12.408863067626953, "global_step": 476271, "epoch": 2834} {"train_loss": -12.06928825378418, "global_step": 476272, "epoch": 2834} {"train_loss": -11.482892990112305, "global_step": 476273, "epoch": 2834} {"train_loss": -12.26657485961914, "global_step": 476274, "epoch": 2834} {"train_loss": -11.666610717773438, "global_step": 476275, "epoch": 2834} {"train_loss": -11.892842292785645, "global_step": 476276, "epoch": 2834} {"train_loss": -12.16101360321045, "global_step": 476277, "epoch": 2834} {"train_loss": -11.49717903137207, "global_step": 476278, "epoch": 2834} {"train_loss": -12.046567831720624, "global_step": 476279, "epoch": 2834, "val_loss": 311304.65625} {"train_loss": -11.778861999511719, "global_step": 476280, "epoch": 2835} {"train_loss": -12.145069122314453, "global_step": 476281, "epoch": 2835} {"train_loss": -11.95290756225586, "global_step": 476282, "epoch": 2835} {"train_loss": -12.312540054321289, "global_step": 476283, "epoch": 2835} {"train_loss": -12.084861755371094, "global_step": 476284, "epoch": 2835} {"train_loss": -12.292859077453613, "global_step": 476285, "epoch": 2835} {"train_loss": -12.033140182495117, "global_step": 476286, "epoch": 2835} {"train_loss": -12.20967960357666, "global_step": 476287, "epoch": 2835} {"train_loss": -12.338741302490234, "global_step": 476288, "epoch": 2835} {"train_loss": -12.328388214111328, "global_step": 476289, "epoch": 2835} {"train_loss": -11.854878425598145, "global_step": 476290, "epoch": 2835} {"train_loss": -12.252235412597656, "global_step": 476291, "epoch": 2835} {"train_loss": -12.089910507202148, "global_step": 476292, "epoch": 2835} {"train_loss": -12.354987144470215, "global_step": 476293, "epoch": 2835} {"train_loss": -12.330392837524414, "global_step": 476294, "epoch": 2835} {"train_loss": -11.844595909118652, "global_step": 476295, "epoch": 2835} {"train_loss": -12.566217422485352, "global_step": 476296, "epoch": 2835} {"train_loss": -12.131963729858398, "global_step": 476297, "epoch": 2835} {"train_loss": -12.494555473327637, "global_step": 476298, "epoch": 2835} {"train_loss": -11.88033676147461, "global_step": 476299, "epoch": 2835} {"train_loss": -12.438297271728516, "global_step": 476300, "epoch": 2835} {"train_loss": -12.11181640625, "global_step": 476301, "epoch": 2835} {"train_loss": -12.108341217041016, "global_step": 476302, "epoch": 2835} {"train_loss": -12.496527671813965, "global_step": 476303, "epoch": 2835} {"train_loss": -11.3300142288208, "global_step": 476304, "epoch": 2835} {"train_loss": -11.717195510864258, "global_step": 476305, "epoch": 2835} {"train_loss": -12.154022216796875, "global_step": 476306, "epoch": 2835} {"train_loss": -12.139230728149414, "global_step": 476307, "epoch": 2835} {"train_loss": -12.095250129699707, "global_step": 476308, "epoch": 2835} {"train_loss": -11.820228576660156, "global_step": 476309, "epoch": 2835} {"train_loss": -11.9189453125, "global_step": 476310, "epoch": 2835} {"train_loss": -11.744384765625, "global_step": 476311, "epoch": 2835} {"train_loss": -11.308406829833984, "global_step": 476312, "epoch": 2835} {"train_loss": -11.725479125976562, "global_step": 476313, "epoch": 2835} {"train_loss": -10.655218124389648, "global_step": 476314, "epoch": 2835} {"train_loss": -10.85527229309082, "global_step": 476315, "epoch": 2835} {"train_loss": -12.354033470153809, "global_step": 476316, "epoch": 2835} {"train_loss": -10.850360870361328, "global_step": 476317, "epoch": 2835} {"train_loss": -12.333900451660156, "global_step": 476318, "epoch": 2835} {"train_loss": -11.341625213623047, "global_step": 476319, "epoch": 2835} {"train_loss": -11.061737060546875, "global_step": 476320, "epoch": 2835} {"train_loss": -12.53311538696289, "global_step": 476321, "epoch": 2835} {"train_loss": -11.277210235595703, "global_step": 476322, "epoch": 2835} {"train_loss": -12.574719429016113, "global_step": 476323, "epoch": 2835} {"train_loss": -11.882655143737793, "global_step": 476324, "epoch": 2835} {"train_loss": -11.601776123046875, "global_step": 476325, "epoch": 2835} {"train_loss": -12.372733116149902, "global_step": 476326, "epoch": 2835} {"train_loss": -11.67466926574707, "global_step": 476327, "epoch": 2835} {"train_loss": -11.578197479248047, "global_step": 476328, "epoch": 2835} {"train_loss": -12.48193645477295, "global_step": 476329, "epoch": 2835} {"train_loss": -11.653696060180664, "global_step": 476330, "epoch": 2835} {"train_loss": -12.42390251159668, "global_step": 476331, "epoch": 2835} {"train_loss": -11.599607467651367, "global_step": 476332, "epoch": 2835} {"train_loss": -11.857649803161621, "global_step": 476333, "epoch": 2835} {"train_loss": -11.941059112548828, "global_step": 476334, "epoch": 2835} {"train_loss": -10.835831642150879, "global_step": 476335, "epoch": 2835} {"train_loss": -11.927650451660156, "global_step": 476336, "epoch": 2835} {"train_loss": -12.03905963897705, "global_step": 476337, "epoch": 2835} {"train_loss": -12.007011413574219, "global_step": 476338, "epoch": 2835} {"train_loss": -11.908343315124512, "global_step": 476339, "epoch": 2835} {"train_loss": -12.018402099609375, "global_step": 476340, "epoch": 2835} {"train_loss": -12.190967559814453, "global_step": 476341, "epoch": 2835} {"train_loss": -11.757438659667969, "global_step": 476342, "epoch": 2835} {"train_loss": -11.969348907470703, "global_step": 476343, "epoch": 2835} {"train_loss": -11.961752891540527, "global_step": 476344, "epoch": 2835} {"train_loss": -12.042308807373047, "global_step": 476345, "epoch": 2835} {"train_loss": -11.806249618530273, "global_step": 476346, "epoch": 2835} {"train_loss": -12.452617645263672, "global_step": 476347, "epoch": 2835} {"train_loss": -11.875158309936523, "global_step": 476348, "epoch": 2835} {"train_loss": -11.988176345825195, "global_step": 476349, "epoch": 2835} {"train_loss": -12.380598068237305, "global_step": 476350, "epoch": 2835} {"train_loss": -12.09676742553711, "global_step": 476351, "epoch": 2835} {"train_loss": -12.570491790771484, "global_step": 476352, "epoch": 2835} {"train_loss": -12.060184478759766, "global_step": 476353, "epoch": 2835} {"train_loss": -12.207777976989746, "global_step": 476354, "epoch": 2835} {"train_loss": -12.443771362304688, "global_step": 476355, "epoch": 2835} {"train_loss": -12.07662582397461, "global_step": 476356, "epoch": 2835} {"train_loss": -12.632760047912598, "global_step": 476357, "epoch": 2835} {"train_loss": -12.305670738220215, "global_step": 476358, "epoch": 2835} {"train_loss": -12.544349670410156, "global_step": 476359, "epoch": 2835} {"train_loss": -12.356197357177734, "global_step": 476360, "epoch": 2835} {"train_loss": -12.436829566955566, "global_step": 476361, "epoch": 2835} {"train_loss": -12.277032852172852, "global_step": 476362, "epoch": 2835} {"train_loss": -12.334110260009766, "global_step": 476363, "epoch": 2835} {"train_loss": -12.505362510681152, "global_step": 476364, "epoch": 2835} {"train_loss": -12.405486106872559, "global_step": 476365, "epoch": 2835} {"train_loss": -12.674898147583008, "global_step": 476366, "epoch": 2835} {"train_loss": -12.306346893310547, "global_step": 476367, "epoch": 2835} {"train_loss": -12.871349334716797, "global_step": 476368, "epoch": 2835} {"train_loss": -12.522241592407227, "global_step": 476369, "epoch": 2835} {"train_loss": -12.68893814086914, "global_step": 476370, "epoch": 2835} {"train_loss": -12.592265129089355, "global_step": 476371, "epoch": 2835} {"train_loss": -12.507848739624023, "global_step": 476372, "epoch": 2835} {"train_loss": -12.765846252441406, "global_step": 476373, "epoch": 2835} {"train_loss": -12.769905090332031, "global_step": 476374, "epoch": 2835} {"train_loss": -12.737627983093262, "global_step": 476375, "epoch": 2835} {"train_loss": -12.757240295410156, "global_step": 476376, "epoch": 2835} {"train_loss": -12.770918846130371, "global_step": 476377, "epoch": 2835} {"train_loss": -12.802997589111328, "global_step": 476378, "epoch": 2835} {"train_loss": -12.755118370056152, "global_step": 476379, "epoch": 2835} {"train_loss": -12.851278305053711, "global_step": 476380, "epoch": 2835} {"train_loss": -12.856843948364258, "global_step": 476381, "epoch": 2835} {"train_loss": -12.526840209960938, "global_step": 476382, "epoch": 2835} {"train_loss": -12.743766784667969, "global_step": 476383, "epoch": 2835} {"train_loss": -12.76417350769043, "global_step": 476384, "epoch": 2835} {"train_loss": -12.738640785217285, "global_step": 476385, "epoch": 2835} {"train_loss": -12.830011367797852, "global_step": 476386, "epoch": 2835} {"train_loss": -12.800506591796875, "global_step": 476387, "epoch": 2835} {"train_loss": -12.914100646972656, "global_step": 476388, "epoch": 2835} {"train_loss": -12.710794448852539, "global_step": 476389, "epoch": 2835} {"train_loss": -12.568735122680664, "global_step": 476390, "epoch": 2835} {"train_loss": -12.979720115661621, "global_step": 476391, "epoch": 2835} {"train_loss": -12.6400146484375, "global_step": 476392, "epoch": 2835} {"train_loss": -12.761898040771484, "global_step": 476393, "epoch": 2835} {"train_loss": -12.531732559204102, "global_step": 476394, "epoch": 2835} {"train_loss": -12.818941116333008, "global_step": 476395, "epoch": 2835} {"train_loss": -12.711130142211914, "global_step": 476396, "epoch": 2835} {"train_loss": -12.787941932678223, "global_step": 476397, "epoch": 2835} {"train_loss": -12.55282211303711, "global_step": 476398, "epoch": 2835} {"train_loss": -12.592986106872559, "global_step": 476399, "epoch": 2835} {"train_loss": -12.601313591003418, "global_step": 476400, "epoch": 2835} {"train_loss": -12.653458595275879, "global_step": 476401, "epoch": 2835} {"train_loss": -12.699992179870605, "global_step": 476402, "epoch": 2835} {"train_loss": -12.706888198852539, "global_step": 476403, "epoch": 2835} {"train_loss": -12.786569595336914, "global_step": 476404, "epoch": 2835} {"train_loss": -12.973596572875977, "global_step": 476405, "epoch": 2835} {"train_loss": -12.75737190246582, "global_step": 476406, "epoch": 2835} {"train_loss": -12.667842864990234, "global_step": 476407, "epoch": 2835} {"train_loss": -12.774432182312012, "global_step": 476408, "epoch": 2835} {"train_loss": -12.787179946899414, "global_step": 476409, "epoch": 2835} {"train_loss": -12.777315139770508, "global_step": 476410, "epoch": 2835} {"train_loss": -12.604878425598145, "global_step": 476411, "epoch": 2835} {"train_loss": -12.74171257019043, "global_step": 476412, "epoch": 2835} {"train_loss": -12.542989730834961, "global_step": 476413, "epoch": 2835} {"train_loss": -12.658803939819336, "global_step": 476414, "epoch": 2835} {"train_loss": -12.693954467773438, "global_step": 476415, "epoch": 2835} {"train_loss": -12.701471328735352, "global_step": 476416, "epoch": 2835} {"train_loss": -12.245271682739258, "global_step": 476417, "epoch": 2835} {"train_loss": -12.9386568069458, "global_step": 476418, "epoch": 2835} {"train_loss": -12.17214584350586, "global_step": 476419, "epoch": 2835} {"train_loss": -12.359716415405273, "global_step": 476420, "epoch": 2835} {"train_loss": -12.420696258544922, "global_step": 476421, "epoch": 2835} {"train_loss": -12.93970012664795, "global_step": 476422, "epoch": 2835} {"train_loss": -12.72374153137207, "global_step": 476423, "epoch": 2835} {"train_loss": -12.519657135009766, "global_step": 476424, "epoch": 2835} {"train_loss": -12.546231269836426, "global_step": 476425, "epoch": 2835} {"train_loss": -12.85781192779541, "global_step": 476426, "epoch": 2835} {"train_loss": -12.8349027633667, "global_step": 476427, "epoch": 2835} {"train_loss": -12.980348587036133, "global_step": 476428, "epoch": 2835} {"train_loss": -12.915420532226562, "global_step": 476429, "epoch": 2835} {"train_loss": -12.692878723144531, "global_step": 476430, "epoch": 2835} {"train_loss": -12.792139053344727, "global_step": 476431, "epoch": 2835} {"train_loss": -12.160416603088379, "global_step": 476432, "epoch": 2835} {"train_loss": -12.031721115112305, "global_step": 476433, "epoch": 2835} {"train_loss": -12.359798431396484, "global_step": 476434, "epoch": 2835} {"train_loss": -12.212750434875488, "global_step": 476435, "epoch": 2835} {"train_loss": -11.404264450073242, "global_step": 476436, "epoch": 2835} {"train_loss": -12.70923900604248, "global_step": 476437, "epoch": 2835} {"train_loss": -12.038576126098633, "global_step": 476438, "epoch": 2835} {"train_loss": -10.76773452758789, "global_step": 476439, "epoch": 2835} {"train_loss": -12.739595413208008, "global_step": 476440, "epoch": 2835} {"train_loss": -10.832408905029297, "global_step": 476441, "epoch": 2835} {"train_loss": -9.819513320922852, "global_step": 476442, "epoch": 2835} {"train_loss": -11.279657363891602, "global_step": 476443, "epoch": 2835} {"train_loss": -7.648115158081055, "global_step": 476444, "epoch": 2835} {"train_loss": -7.937142372131348, "global_step": 476445, "epoch": 2835} {"train_loss": -8.844688415527344, "global_step": 476446, "epoch": 2835} {"train_loss": -12.165066071919032, "global_step": 476447, "epoch": 2835, "val_loss": 314463.3125, "train_action_mse_error": 2.776259422302246} {"train_loss": -6.812312126159668, "global_step": 476448, "epoch": 2836} {"train_loss": -8.560432434082031, "global_step": 476449, "epoch": 2836} {"train_loss": -8.187957763671875, "global_step": 476450, "epoch": 2836} {"train_loss": -8.909917831420898, "global_step": 476451, "epoch": 2836} {"train_loss": -8.388399124145508, "global_step": 476452, "epoch": 2836} {"train_loss": -10.096034049987793, "global_step": 476453, "epoch": 2836} {"train_loss": -10.201252937316895, "global_step": 476454, "epoch": 2836} {"train_loss": -9.743213653564453, "global_step": 476455, "epoch": 2836} {"train_loss": -9.618759155273438, "global_step": 476456, "epoch": 2836} {"train_loss": -10.034372329711914, "global_step": 476457, "epoch": 2836} {"train_loss": -11.34450912475586, "global_step": 476458, "epoch": 2836} {"train_loss": -10.973440170288086, "global_step": 476459, "epoch": 2836} {"train_loss": -11.38906478881836, "global_step": 476460, "epoch": 2836} {"train_loss": -10.750429153442383, "global_step": 476461, "epoch": 2836} {"train_loss": -10.937265396118164, "global_step": 476462, "epoch": 2836} {"train_loss": -11.414899826049805, "global_step": 476463, "epoch": 2836} {"train_loss": -10.073551177978516, "global_step": 476464, "epoch": 2836} {"train_loss": -10.819587707519531, "global_step": 476465, "epoch": 2836} {"train_loss": -10.656657218933105, "global_step": 476466, "epoch": 2836} {"train_loss": -10.532200813293457, "global_step": 476467, "epoch": 2836} {"train_loss": -11.76029109954834, "global_step": 476468, "epoch": 2836} {"train_loss": -11.400181770324707, "global_step": 476469, "epoch": 2836} {"train_loss": -11.127584457397461, "global_step": 476470, "epoch": 2836} {"train_loss": -11.694549560546875, "global_step": 476471, "epoch": 2836} {"train_loss": -11.447408676147461, "global_step": 476472, "epoch": 2836} {"train_loss": -11.387182235717773, "global_step": 476473, "epoch": 2836} {"train_loss": -11.535440444946289, "global_step": 476474, "epoch": 2836} {"train_loss": -12.088858604431152, "global_step": 476475, "epoch": 2836} {"train_loss": -11.132044792175293, "global_step": 476476, "epoch": 2836} {"train_loss": -11.998366355895996, "global_step": 476477, "epoch": 2836} {"train_loss": -11.618059158325195, "global_step": 476478, "epoch": 2836} {"train_loss": -11.61712646484375, "global_step": 476479, "epoch": 2836} {"train_loss": -12.234400749206543, "global_step": 476480, "epoch": 2836} {"train_loss": -11.455598831176758, "global_step": 476481, "epoch": 2836} {"train_loss": -12.246328353881836, "global_step": 476482, "epoch": 2836} {"train_loss": -11.174018859863281, "global_step": 476483, "epoch": 2836} {"train_loss": -11.845154762268066, "global_step": 476484, "epoch": 2836} {"train_loss": -12.068069458007812, "global_step": 476485, "epoch": 2836} {"train_loss": -11.52898120880127, "global_step": 476486, "epoch": 2836} {"train_loss": -12.172076225280762, "global_step": 476487, "epoch": 2836} {"train_loss": -11.87656021118164, "global_step": 476488, "epoch": 2836} {"train_loss": -12.153675079345703, "global_step": 476489, "epoch": 2836} {"train_loss": -12.225790023803711, "global_step": 476490, "epoch": 2836} {"train_loss": -12.182021141052246, "global_step": 476491, "epoch": 2836} {"train_loss": -12.165579795837402, "global_step": 476492, "epoch": 2836} {"train_loss": -12.261979103088379, "global_step": 476493, "epoch": 2836} {"train_loss": -12.345139503479004, "global_step": 476494, "epoch": 2836} {"train_loss": -12.459932327270508, "global_step": 476495, "epoch": 2836} {"train_loss": -11.80863094329834, "global_step": 476496, "epoch": 2836} {"train_loss": -12.555546760559082, "global_step": 476497, "epoch": 2836} {"train_loss": -12.375036239624023, "global_step": 476498, "epoch": 2836} {"train_loss": -12.629610061645508, "global_step": 476499, "epoch": 2836} {"train_loss": -12.569889068603516, "global_step": 476500, "epoch": 2836} {"train_loss": -12.282550811767578, "global_step": 476501, "epoch": 2836} {"train_loss": -12.7142333984375, "global_step": 476502, "epoch": 2836} {"train_loss": -12.319931030273438, "global_step": 476503, "epoch": 2836} {"train_loss": -12.618356704711914, "global_step": 476504, "epoch": 2836} {"train_loss": -12.500709533691406, "global_step": 476505, "epoch": 2836} {"train_loss": -12.484526634216309, "global_step": 476506, "epoch": 2836} {"train_loss": -12.517986297607422, "global_step": 476507, "epoch": 2836} {"train_loss": -12.42850112915039, "global_step": 476508, "epoch": 2836} {"train_loss": -12.621614456176758, "global_step": 476509, "epoch": 2836} {"train_loss": -12.260889053344727, "global_step": 476510, "epoch": 2836} {"train_loss": -12.652725219726562, "global_step": 476511, "epoch": 2836} {"train_loss": -12.619430541992188, "global_step": 476512, "epoch": 2836} {"train_loss": -12.709721565246582, "global_step": 476513, "epoch": 2836} {"train_loss": -12.647717475891113, "global_step": 476514, "epoch": 2836} {"train_loss": -12.513334274291992, "global_step": 476515, "epoch": 2836} {"train_loss": -12.563657760620117, "global_step": 476516, "epoch": 2836} {"train_loss": -12.577693939208984, "global_step": 476517, "epoch": 2836} {"train_loss": -12.585453033447266, "global_step": 476518, "epoch": 2836} {"train_loss": -12.447542190551758, "global_step": 476519, "epoch": 2836} {"train_loss": -12.207756042480469, "global_step": 476520, "epoch": 2836} {"train_loss": -12.75010871887207, "global_step": 476521, "epoch": 2836} {"train_loss": -12.587708473205566, "global_step": 476522, "epoch": 2836} {"train_loss": -12.795543670654297, "global_step": 476523, "epoch": 2836} {"train_loss": -12.729291915893555, "global_step": 476524, "epoch": 2836} {"train_loss": -12.761042594909668, "global_step": 476525, "epoch": 2836} {"train_loss": -12.576797485351562, "global_step": 476526, "epoch": 2836} {"train_loss": -12.86312484741211, "global_step": 476527, "epoch": 2836} {"train_loss": -12.71146297454834, "global_step": 476528, "epoch": 2836} {"train_loss": -12.761360168457031, "global_step": 476529, "epoch": 2836} {"train_loss": -12.587797164916992, "global_step": 476530, "epoch": 2836} {"train_loss": -12.617005348205566, "global_step": 476531, "epoch": 2836} {"train_loss": -12.930587768554688, "global_step": 476532, "epoch": 2836} {"train_loss": -12.557304382324219, "global_step": 476533, "epoch": 2836} {"train_loss": -12.849187850952148, "global_step": 476534, "epoch": 2836} {"train_loss": -12.597309112548828, "global_step": 476535, "epoch": 2836} {"train_loss": -12.860848426818848, "global_step": 476536, "epoch": 2836} {"train_loss": -12.780298233032227, "global_step": 476537, "epoch": 2836} {"train_loss": -12.802602767944336, "global_step": 476538, "epoch": 2836} {"train_loss": -12.798981666564941, "global_step": 476539, "epoch": 2836} {"train_loss": -12.73869514465332, "global_step": 476540, "epoch": 2836} {"train_loss": -12.715190887451172, "global_step": 476541, "epoch": 2836} {"train_loss": -12.68459415435791, "global_step": 476542, "epoch": 2836} {"train_loss": -12.57847785949707, "global_step": 476543, "epoch": 2836} {"train_loss": -12.766128540039062, "global_step": 476544, "epoch": 2836} {"train_loss": -12.61268424987793, "global_step": 476545, "epoch": 2836} {"train_loss": -12.917903900146484, "global_step": 476546, "epoch": 2836} {"train_loss": -12.620579719543457, "global_step": 476547, "epoch": 2836} {"train_loss": -12.713796615600586, "global_step": 476548, "epoch": 2836} {"train_loss": -12.607044219970703, "global_step": 476549, "epoch": 2836} {"train_loss": -12.89077091217041, "global_step": 476550, "epoch": 2836} {"train_loss": -12.652482986450195, "global_step": 476551, "epoch": 2836} {"train_loss": -12.938945770263672, "global_step": 476552, "epoch": 2836} {"train_loss": -12.627630233764648, "global_step": 476553, "epoch": 2836} {"train_loss": -12.904539108276367, "global_step": 476554, "epoch": 2836} {"train_loss": -12.97665786743164, "global_step": 476555, "epoch": 2836} {"train_loss": -12.794322967529297, "global_step": 476556, "epoch": 2836} {"train_loss": -12.76577377319336, "global_step": 476557, "epoch": 2836} {"train_loss": -12.533554077148438, "global_step": 476558, "epoch": 2836} {"train_loss": -12.630401611328125, "global_step": 476559, "epoch": 2836} {"train_loss": -12.642284393310547, "global_step": 476560, "epoch": 2836} {"train_loss": -12.742557525634766, "global_step": 476561, "epoch": 2836} {"train_loss": -12.927002906799316, "global_step": 476562, "epoch": 2836} {"train_loss": -12.879350662231445, "global_step": 476563, "epoch": 2836} {"train_loss": -12.563495635986328, "global_step": 476564, "epoch": 2836} {"train_loss": -12.681678771972656, "global_step": 476565, "epoch": 2836} {"train_loss": -12.815336227416992, "global_step": 476566, "epoch": 2836} {"train_loss": -12.628355979919434, "global_step": 476567, "epoch": 2836} {"train_loss": -12.6721773147583, "global_step": 476568, "epoch": 2836} {"train_loss": -12.395565032958984, "global_step": 476569, "epoch": 2836} {"train_loss": -12.752235412597656, "global_step": 476570, "epoch": 2836} {"train_loss": -12.664495468139648, "global_step": 476571, "epoch": 2836} {"train_loss": -12.555420875549316, "global_step": 476572, "epoch": 2836} {"train_loss": -12.518329620361328, "global_step": 476573, "epoch": 2836} {"train_loss": -12.243450164794922, "global_step": 476574, "epoch": 2836} {"train_loss": -12.55516529083252, "global_step": 476575, "epoch": 2836} {"train_loss": -12.589839935302734, "global_step": 476576, "epoch": 2836} {"train_loss": -11.311765670776367, "global_step": 476577, "epoch": 2836} {"train_loss": -8.690876007080078, "global_step": 476578, "epoch": 2836} {"train_loss": -10.328786849975586, "global_step": 476579, "epoch": 2836} {"train_loss": -11.014867782592773, "global_step": 476580, "epoch": 2836} {"train_loss": -11.193792343139648, "global_step": 476581, "epoch": 2836} {"train_loss": -10.636253356933594, "global_step": 476582, "epoch": 2836} {"train_loss": -12.328076362609863, "global_step": 476583, "epoch": 2836} {"train_loss": -11.457008361816406, "global_step": 476584, "epoch": 2836} {"train_loss": -11.036561012268066, "global_step": 476585, "epoch": 2836} {"train_loss": -10.290738105773926, "global_step": 476586, "epoch": 2836} {"train_loss": -12.213918685913086, "global_step": 476587, "epoch": 2836} {"train_loss": -11.274171829223633, "global_step": 476588, "epoch": 2836} {"train_loss": -11.122965812683105, "global_step": 476589, "epoch": 2836} {"train_loss": -10.894689559936523, "global_step": 476590, "epoch": 2836} {"train_loss": -11.002189636230469, "global_step": 476591, "epoch": 2836} {"train_loss": -11.085441589355469, "global_step": 476592, "epoch": 2836} {"train_loss": -10.447944641113281, "global_step": 476593, "epoch": 2836} {"train_loss": -10.011151313781738, "global_step": 476594, "epoch": 2836} {"train_loss": -11.441978454589844, "global_step": 476595, "epoch": 2836} {"train_loss": -10.829336166381836, "global_step": 476596, "epoch": 2836} {"train_loss": -9.77888298034668, "global_step": 476597, "epoch": 2836} {"train_loss": -11.32706069946289, "global_step": 476598, "epoch": 2836} {"train_loss": -9.954606056213379, "global_step": 476599, "epoch": 2836} {"train_loss": -9.174690246582031, "global_step": 476600, "epoch": 2836} {"train_loss": -9.935100555419922, "global_step": 476601, "epoch": 2836} {"train_loss": -10.166825294494629, "global_step": 476602, "epoch": 2836} {"train_loss": -11.223861694335938, "global_step": 476603, "epoch": 2836} {"train_loss": -11.201895713806152, "global_step": 476604, "epoch": 2836} {"train_loss": -11.504514694213867, "global_step": 476605, "epoch": 2836} {"train_loss": -12.18871021270752, "global_step": 476606, "epoch": 2836} {"train_loss": -10.97325611114502, "global_step": 476607, "epoch": 2836} {"train_loss": -12.160906791687012, "global_step": 476608, "epoch": 2836} {"train_loss": -12.086313247680664, "global_step": 476609, "epoch": 2836} {"train_loss": -12.225436210632324, "global_step": 476610, "epoch": 2836} {"train_loss": -12.157662391662598, "global_step": 476611, "epoch": 2836} {"train_loss": -12.378191947937012, "global_step": 476612, "epoch": 2836} {"train_loss": -12.384052276611328, "global_step": 476613, "epoch": 2836} {"train_loss": -12.263355255126953, "global_step": 476614, "epoch": 2836} {"train_loss": -11.835277648199172, "global_step": 476615, "epoch": 2836, "val_loss": 314421.21875} {"train_loss": -12.19271469116211, "global_step": 476616, "epoch": 2837} {"train_loss": -12.10268783569336, "global_step": 476617, "epoch": 2837} {"train_loss": -12.280909538269043, "global_step": 476618, "epoch": 2837} {"train_loss": -11.571802139282227, "global_step": 476619, "epoch": 2837} {"train_loss": -12.523082733154297, "global_step": 476620, "epoch": 2837} {"train_loss": -11.938131332397461, "global_step": 476621, "epoch": 2837} {"train_loss": -12.684894561767578, "global_step": 476622, "epoch": 2837} {"train_loss": -12.144533157348633, "global_step": 476623, "epoch": 2837} {"train_loss": -12.439567565917969, "global_step": 476624, "epoch": 2837} {"train_loss": -12.2572021484375, "global_step": 476625, "epoch": 2837} {"train_loss": -12.046822547912598, "global_step": 476626, "epoch": 2837} {"train_loss": -12.271075248718262, "global_step": 476627, "epoch": 2837} {"train_loss": -12.550436019897461, "global_step": 476628, "epoch": 2837} {"train_loss": -12.474270820617676, "global_step": 476629, "epoch": 2837} {"train_loss": -12.28485107421875, "global_step": 476630, "epoch": 2837} {"train_loss": -12.606136322021484, "global_step": 476631, "epoch": 2837} {"train_loss": -12.363377571105957, "global_step": 476632, "epoch": 2837} {"train_loss": -12.631134986877441, "global_step": 476633, "epoch": 2837} {"train_loss": -12.538766860961914, "global_step": 476634, "epoch": 2837} {"train_loss": -12.724584579467773, "global_step": 476635, "epoch": 2837} {"train_loss": -12.597234725952148, "global_step": 476636, "epoch": 2837} {"train_loss": -12.51539421081543, "global_step": 476637, "epoch": 2837} {"train_loss": -12.723319053649902, "global_step": 476638, "epoch": 2837} {"train_loss": -12.617639541625977, "global_step": 476639, "epoch": 2837} {"train_loss": -12.615767478942871, "global_step": 476640, "epoch": 2837} {"train_loss": -12.600440979003906, "global_step": 476641, "epoch": 2837} {"train_loss": -12.688104629516602, "global_step": 476642, "epoch": 2837} {"train_loss": -12.4974365234375, "global_step": 476643, "epoch": 2837} {"train_loss": -12.760618209838867, "global_step": 476644, "epoch": 2837} {"train_loss": -12.54124641418457, "global_step": 476645, "epoch": 2837} {"train_loss": -12.917218208312988, "global_step": 476646, "epoch": 2837} {"train_loss": -12.545124053955078, "global_step": 476647, "epoch": 2837} {"train_loss": -12.749307632446289, "global_step": 476648, "epoch": 2837} {"train_loss": -12.816274642944336, "global_step": 476649, "epoch": 2837} {"train_loss": -12.818936347961426, "global_step": 476650, "epoch": 2837} {"train_loss": -12.590581893920898, "global_step": 476651, "epoch": 2837} {"train_loss": -12.824559211730957, "global_step": 476652, "epoch": 2837} {"train_loss": -12.852651596069336, "global_step": 476653, "epoch": 2837} {"train_loss": -12.766936302185059, "global_step": 476654, "epoch": 2837} {"train_loss": -12.7296724319458, "global_step": 476655, "epoch": 2837} {"train_loss": -12.884041786193848, "global_step": 476656, "epoch": 2837} {"train_loss": -12.729328155517578, "global_step": 476657, "epoch": 2837} {"train_loss": -12.796854019165039, "global_step": 476658, "epoch": 2837} {"train_loss": -12.906339645385742, "global_step": 476659, "epoch": 2837} {"train_loss": -12.49501895904541, "global_step": 476660, "epoch": 2837} {"train_loss": -12.512502670288086, "global_step": 476661, "epoch": 2837} {"train_loss": -12.920063018798828, "global_step": 476662, "epoch": 2837} {"train_loss": -12.54049301147461, "global_step": 476663, "epoch": 2837} {"train_loss": -12.948087692260742, "global_step": 476664, "epoch": 2837} {"train_loss": -12.859613418579102, "global_step": 476665, "epoch": 2837} {"train_loss": -12.804595947265625, "global_step": 476666, "epoch": 2837} {"train_loss": -12.848941802978516, "global_step": 476667, "epoch": 2837} {"train_loss": -12.68271255493164, "global_step": 476668, "epoch": 2837} {"train_loss": -12.929559707641602, "global_step": 476669, "epoch": 2837} {"train_loss": -12.739396095275879, "global_step": 476670, "epoch": 2837} {"train_loss": -12.608682632446289, "global_step": 476671, "epoch": 2837} {"train_loss": -12.711095809936523, "global_step": 476672, "epoch": 2837} {"train_loss": -13.051138877868652, "global_step": 476673, "epoch": 2837} {"train_loss": -12.538619995117188, "global_step": 476674, "epoch": 2837} {"train_loss": -12.437576293945312, "global_step": 476675, "epoch": 2837} {"train_loss": -12.562154769897461, "global_step": 476676, "epoch": 2837} {"train_loss": -12.456390380859375, "global_step": 476677, "epoch": 2837} {"train_loss": -12.561859130859375, "global_step": 476678, "epoch": 2837} {"train_loss": -12.437829971313477, "global_step": 476679, "epoch": 2837} {"train_loss": -12.517915725708008, "global_step": 476680, "epoch": 2837} {"train_loss": -11.18385124206543, "global_step": 476681, "epoch": 2837} {"train_loss": -11.846004486083984, "global_step": 476682, "epoch": 2837} {"train_loss": -11.002689361572266, "global_step": 476683, "epoch": 2837} {"train_loss": -11.291776657104492, "global_step": 476684, "epoch": 2837} {"train_loss": -11.278097152709961, "global_step": 476685, "epoch": 2837} {"train_loss": -11.642054557800293, "global_step": 476686, "epoch": 2837} {"train_loss": -10.887319564819336, "global_step": 476687, "epoch": 2837} {"train_loss": -12.221905708312988, "global_step": 476688, "epoch": 2837} {"train_loss": -11.118184089660645, "global_step": 476689, "epoch": 2837} {"train_loss": -11.602466583251953, "global_step": 476690, "epoch": 2837} {"train_loss": -9.70234489440918, "global_step": 476691, "epoch": 2837} {"train_loss": -11.88956069946289, "global_step": 476692, "epoch": 2837} {"train_loss": -9.81927490234375, "global_step": 476693, "epoch": 2837} {"train_loss": -10.140853881835938, "global_step": 476694, "epoch": 2837} {"train_loss": -10.792351722717285, "global_step": 476695, "epoch": 2837} {"train_loss": -10.062585830688477, "global_step": 476696, "epoch": 2837} {"train_loss": -11.60841178894043, "global_step": 476697, "epoch": 2837} {"train_loss": -10.457155227661133, "global_step": 476698, "epoch": 2837} {"train_loss": -11.849201202392578, "global_step": 476699, "epoch": 2837} {"train_loss": -10.830509185791016, "global_step": 476700, "epoch": 2837} {"train_loss": -11.40992259979248, "global_step": 476701, "epoch": 2837} {"train_loss": -10.382148742675781, "global_step": 476702, "epoch": 2837} {"train_loss": -11.459517478942871, "global_step": 476703, "epoch": 2837} {"train_loss": -11.28681755065918, "global_step": 476704, "epoch": 2837} {"train_loss": -11.047310829162598, "global_step": 476705, "epoch": 2837} {"train_loss": -11.752920150756836, "global_step": 476706, "epoch": 2837} {"train_loss": -10.482980728149414, "global_step": 476707, "epoch": 2837} {"train_loss": -11.235429763793945, "global_step": 476708, "epoch": 2837} {"train_loss": -11.85738468170166, "global_step": 476709, "epoch": 2837} {"train_loss": -11.156024932861328, "global_step": 476710, "epoch": 2837} {"train_loss": -11.348727226257324, "global_step": 476711, "epoch": 2837} {"train_loss": -12.007257461547852, "global_step": 476712, "epoch": 2837} {"train_loss": -11.266971588134766, "global_step": 476713, "epoch": 2837} {"train_loss": -10.84388542175293, "global_step": 476714, "epoch": 2837} {"train_loss": -12.16379165649414, "global_step": 476715, "epoch": 2837} {"train_loss": -10.827638626098633, "global_step": 476716, "epoch": 2837} {"train_loss": -11.42823600769043, "global_step": 476717, "epoch": 2837} {"train_loss": -11.746803283691406, "global_step": 476718, "epoch": 2837} {"train_loss": -10.732479095458984, "global_step": 476719, "epoch": 2837} {"train_loss": -12.087900161743164, "global_step": 476720, "epoch": 2837} {"train_loss": -11.306243896484375, "global_step": 476721, "epoch": 2837} {"train_loss": -11.392818450927734, "global_step": 476722, "epoch": 2837} {"train_loss": -12.392583847045898, "global_step": 476723, "epoch": 2837} {"train_loss": -11.914382934570312, "global_step": 476724, "epoch": 2837} {"train_loss": -11.565009117126465, "global_step": 476725, "epoch": 2837} {"train_loss": -12.591760635375977, "global_step": 476726, "epoch": 2837} {"train_loss": -11.614140510559082, "global_step": 476727, "epoch": 2837} {"train_loss": -12.489800453186035, "global_step": 476728, "epoch": 2837} {"train_loss": -12.257285118103027, "global_step": 476729, "epoch": 2837} {"train_loss": -12.293869018554688, "global_step": 476730, "epoch": 2837} {"train_loss": -12.333151817321777, "global_step": 476731, "epoch": 2837} {"train_loss": -12.374103546142578, "global_step": 476732, "epoch": 2837} {"train_loss": -12.109016418457031, "global_step": 476733, "epoch": 2837} {"train_loss": -12.522794723510742, "global_step": 476734, "epoch": 2837} {"train_loss": -12.374120712280273, "global_step": 476735, "epoch": 2837} {"train_loss": -12.470475196838379, "global_step": 476736, "epoch": 2837} {"train_loss": -12.770960807800293, "global_step": 476737, "epoch": 2837} {"train_loss": -12.349946975708008, "global_step": 476738, "epoch": 2837} {"train_loss": -12.476417541503906, "global_step": 476739, "epoch": 2837} {"train_loss": -12.535374641418457, "global_step": 476740, "epoch": 2837} {"train_loss": -12.492731094360352, "global_step": 476741, "epoch": 2837} {"train_loss": -11.849821090698242, "global_step": 476742, "epoch": 2837} {"train_loss": -12.483254432678223, "global_step": 476743, "epoch": 2837} {"train_loss": -12.075618743896484, "global_step": 476744, "epoch": 2837} {"train_loss": -12.149049758911133, "global_step": 476745, "epoch": 2837} {"train_loss": -12.138835906982422, "global_step": 476746, "epoch": 2837} {"train_loss": -12.47854232788086, "global_step": 476747, "epoch": 2837} {"train_loss": -12.038212776184082, "global_step": 476748, "epoch": 2837} {"train_loss": -12.614655494689941, "global_step": 476749, "epoch": 2837} {"train_loss": -12.329776763916016, "global_step": 476750, "epoch": 2837} {"train_loss": -12.323509216308594, "global_step": 476751, "epoch": 2837} {"train_loss": -12.488052368164062, "global_step": 476752, "epoch": 2837} {"train_loss": -12.270939826965332, "global_step": 476753, "epoch": 2837} {"train_loss": -12.390215873718262, "global_step": 476754, "epoch": 2837} {"train_loss": -11.934174537658691, "global_step": 476755, "epoch": 2837} {"train_loss": -12.246413230895996, "global_step": 476756, "epoch": 2837} {"train_loss": -11.737544059753418, "global_step": 476757, "epoch": 2837} {"train_loss": -12.640195846557617, "global_step": 476758, "epoch": 2837} {"train_loss": -11.954166412353516, "global_step": 476759, "epoch": 2837} {"train_loss": -12.49429702758789, "global_step": 476760, "epoch": 2837} {"train_loss": -12.49582576751709, "global_step": 476761, "epoch": 2837} {"train_loss": -12.58857536315918, "global_step": 476762, "epoch": 2837} {"train_loss": -12.651390075683594, "global_step": 476763, "epoch": 2837} {"train_loss": -12.484055519104004, "global_step": 476764, "epoch": 2837} {"train_loss": -12.692634582519531, "global_step": 476765, "epoch": 2837} {"train_loss": -12.568212509155273, "global_step": 476766, "epoch": 2837} {"train_loss": -12.425955772399902, "global_step": 476767, "epoch": 2837} {"train_loss": -12.684503555297852, "global_step": 476768, "epoch": 2837} {"train_loss": -12.68709945678711, "global_step": 476769, "epoch": 2837} {"train_loss": -12.61373519897461, "global_step": 476770, "epoch": 2837} {"train_loss": -12.664590835571289, "global_step": 476771, "epoch": 2837} {"train_loss": -12.83393669128418, "global_step": 476772, "epoch": 2837} {"train_loss": -12.77798843383789, "global_step": 476773, "epoch": 2837} {"train_loss": -12.701555252075195, "global_step": 476774, "epoch": 2837} {"train_loss": -12.74213981628418, "global_step": 476775, "epoch": 2837} {"train_loss": -12.849325180053711, "global_step": 476776, "epoch": 2837} {"train_loss": -12.748786926269531, "global_step": 476777, "epoch": 2837} {"train_loss": -12.915580749511719, "global_step": 476778, "epoch": 2837} {"train_loss": -12.572319030761719, "global_step": 476779, "epoch": 2837} {"train_loss": -12.658084869384766, "global_step": 476780, "epoch": 2837} {"train_loss": -12.616828918457031, "global_step": 476781, "epoch": 2837} {"train_loss": -12.520687103271484, "global_step": 476782, "epoch": 2837} {"train_loss": -12.18034365063622, "global_step": 476783, "epoch": 2837, "val_loss": 314762.53125} {"train_loss": -12.52001953125, "global_step": 476784, "epoch": 2838} {"train_loss": -12.505819320678711, "global_step": 476785, "epoch": 2838} {"train_loss": -12.247597694396973, "global_step": 476786, "epoch": 2838} {"train_loss": -12.446349143981934, "global_step": 476787, "epoch": 2838} {"train_loss": -12.51595687866211, "global_step": 476788, "epoch": 2838} {"train_loss": -12.744100570678711, "global_step": 476789, "epoch": 2838} {"train_loss": -12.768898010253906, "global_step": 476790, "epoch": 2838} {"train_loss": -12.710432052612305, "global_step": 476791, "epoch": 2838} {"train_loss": -12.532867431640625, "global_step": 476792, "epoch": 2838} {"train_loss": -12.81776237487793, "global_step": 476793, "epoch": 2838} {"train_loss": -12.805087089538574, "global_step": 476794, "epoch": 2838} {"train_loss": -12.712827682495117, "global_step": 476795, "epoch": 2838} {"train_loss": -12.548124313354492, "global_step": 476796, "epoch": 2838} {"train_loss": -12.701593399047852, "global_step": 476797, "epoch": 2838} {"train_loss": -12.696955680847168, "global_step": 476798, "epoch": 2838} {"train_loss": -12.731889724731445, "global_step": 476799, "epoch": 2838} {"train_loss": -12.660993576049805, "global_step": 476800, "epoch": 2838} {"train_loss": -12.819710731506348, "global_step": 476801, "epoch": 2838} {"train_loss": -12.823929786682129, "global_step": 476802, "epoch": 2838} {"train_loss": -12.56945514678955, "global_step": 476803, "epoch": 2838} {"train_loss": -12.795010566711426, "global_step": 476804, "epoch": 2838} {"train_loss": -12.681316375732422, "global_step": 476805, "epoch": 2838} {"train_loss": -12.853292465209961, "global_step": 476806, "epoch": 2838} {"train_loss": -13.058419227600098, "global_step": 476807, "epoch": 2838} {"train_loss": -12.827346801757812, "global_step": 476808, "epoch": 2838} {"train_loss": -12.323564529418945, "global_step": 476809, "epoch": 2838} {"train_loss": -11.884521484375, "global_step": 476810, "epoch": 2838} {"train_loss": -11.825312614440918, "global_step": 476811, "epoch": 2838} {"train_loss": -12.1625337600708, "global_step": 476812, "epoch": 2838} {"train_loss": -12.006074905395508, "global_step": 476813, "epoch": 2838} {"train_loss": -12.812607765197754, "global_step": 476814, "epoch": 2838} {"train_loss": -12.2127685546875, "global_step": 476815, "epoch": 2838} {"train_loss": -12.405511856079102, "global_step": 476816, "epoch": 2838} {"train_loss": -12.457351684570312, "global_step": 476817, "epoch": 2838} {"train_loss": -12.843783378601074, "global_step": 476818, "epoch": 2838} {"train_loss": -11.857446670532227, "global_step": 476819, "epoch": 2838} {"train_loss": -12.150354385375977, "global_step": 476820, "epoch": 2838} {"train_loss": -11.808547973632812, "global_step": 476821, "epoch": 2838} {"train_loss": -12.386937141418457, "global_step": 476822, "epoch": 2838} {"train_loss": -12.710528373718262, "global_step": 476823, "epoch": 2838} {"train_loss": -12.514067649841309, "global_step": 476824, "epoch": 2838} {"train_loss": -12.687664985656738, "global_step": 476825, "epoch": 2838} {"train_loss": -12.337035179138184, "global_step": 476826, "epoch": 2838} {"train_loss": -12.77505874633789, "global_step": 476827, "epoch": 2838} {"train_loss": -12.191621780395508, "global_step": 476828, "epoch": 2838} {"train_loss": -12.430858612060547, "global_step": 476829, "epoch": 2838} {"train_loss": -12.394661903381348, "global_step": 476830, "epoch": 2838} {"train_loss": -12.745499610900879, "global_step": 476831, "epoch": 2838} {"train_loss": -12.234580039978027, "global_step": 476832, "epoch": 2838} {"train_loss": -12.582377433776855, "global_step": 476833, "epoch": 2838} {"train_loss": -12.326467514038086, "global_step": 476834, "epoch": 2838} {"train_loss": -12.763250350952148, "global_step": 476835, "epoch": 2838} {"train_loss": -12.342203140258789, "global_step": 476836, "epoch": 2838} {"train_loss": -12.466242790222168, "global_step": 476837, "epoch": 2838} {"train_loss": -12.775467872619629, "global_step": 476838, "epoch": 2838} {"train_loss": -12.779092788696289, "global_step": 476839, "epoch": 2838} {"train_loss": -12.490133285522461, "global_step": 476840, "epoch": 2838} {"train_loss": -11.401474952697754, "global_step": 476841, "epoch": 2838} {"train_loss": -10.477128982543945, "global_step": 476842, "epoch": 2838} {"train_loss": -12.27081298828125, "global_step": 476843, "epoch": 2838} {"train_loss": -12.680215835571289, "global_step": 476844, "epoch": 2838} {"train_loss": -12.574990272521973, "global_step": 476845, "epoch": 2838} {"train_loss": -12.201887130737305, "global_step": 476846, "epoch": 2838} {"train_loss": -12.401128768920898, "global_step": 476847, "epoch": 2838} {"train_loss": -11.633066177368164, "global_step": 476848, "epoch": 2838} {"train_loss": -12.880069732666016, "global_step": 476849, "epoch": 2838} {"train_loss": -12.071966171264648, "global_step": 476850, "epoch": 2838} {"train_loss": -11.717848777770996, "global_step": 476851, "epoch": 2838} {"train_loss": -12.223146438598633, "global_step": 476852, "epoch": 2838} {"train_loss": -11.758209228515625, "global_step": 476853, "epoch": 2838} {"train_loss": -11.269378662109375, "global_step": 476854, "epoch": 2838} {"train_loss": -12.751623153686523, "global_step": 476855, "epoch": 2838} {"train_loss": -11.51469612121582, "global_step": 476856, "epoch": 2838} {"train_loss": -12.312533378601074, "global_step": 476857, "epoch": 2838} {"train_loss": -12.459428787231445, "global_step": 476858, "epoch": 2838} {"train_loss": -12.71558952331543, "global_step": 476859, "epoch": 2838} {"train_loss": -12.45341968536377, "global_step": 476860, "epoch": 2838} {"train_loss": -12.810311317443848, "global_step": 476861, "epoch": 2838} {"train_loss": -12.553075790405273, "global_step": 476862, "epoch": 2838} {"train_loss": -12.521711349487305, "global_step": 476863, "epoch": 2838} {"train_loss": -12.571755409240723, "global_step": 476864, "epoch": 2838} {"train_loss": -12.805729866027832, "global_step": 476865, "epoch": 2838} {"train_loss": -12.326577186584473, "global_step": 476866, "epoch": 2838} {"train_loss": -12.651358604431152, "global_step": 476867, "epoch": 2838} {"train_loss": -12.322595596313477, "global_step": 476868, "epoch": 2838} {"train_loss": -12.519250869750977, "global_step": 476869, "epoch": 2838} {"train_loss": -12.503827095031738, "global_step": 476870, "epoch": 2838} {"train_loss": -12.352242469787598, "global_step": 476871, "epoch": 2838} {"train_loss": -11.91889762878418, "global_step": 476872, "epoch": 2838} {"train_loss": -12.30905532836914, "global_step": 476873, "epoch": 2838} {"train_loss": -12.142722129821777, "global_step": 476874, "epoch": 2838} {"train_loss": -11.950370788574219, "global_step": 476875, "epoch": 2838} {"train_loss": -12.261616706848145, "global_step": 476876, "epoch": 2838} {"train_loss": -11.618314743041992, "global_step": 476877, "epoch": 2838} {"train_loss": -11.365267753601074, "global_step": 476878, "epoch": 2838} {"train_loss": -11.247627258300781, "global_step": 476879, "epoch": 2838} {"train_loss": -11.839499473571777, "global_step": 476880, "epoch": 2838} {"train_loss": -9.685632705688477, "global_step": 476881, "epoch": 2838} {"train_loss": -11.127055168151855, "global_step": 476882, "epoch": 2838} {"train_loss": -10.923517227172852, "global_step": 476883, "epoch": 2838} {"train_loss": -11.371402740478516, "global_step": 476884, "epoch": 2838} {"train_loss": -11.927552223205566, "global_step": 476885, "epoch": 2838} {"train_loss": -10.464616775512695, "global_step": 476886, "epoch": 2838} {"train_loss": -10.128599166870117, "global_step": 476887, "epoch": 2838} {"train_loss": -10.713308334350586, "global_step": 476888, "epoch": 2838} {"train_loss": -11.260169982910156, "global_step": 476889, "epoch": 2838} {"train_loss": -11.194482803344727, "global_step": 476890, "epoch": 2838} {"train_loss": -11.611381530761719, "global_step": 476891, "epoch": 2838} {"train_loss": -12.484535217285156, "global_step": 476892, "epoch": 2838} {"train_loss": -12.056973457336426, "global_step": 476893, "epoch": 2838} {"train_loss": -11.778963088989258, "global_step": 476894, "epoch": 2838} {"train_loss": -12.421546936035156, "global_step": 476895, "epoch": 2838} {"train_loss": -11.578080177307129, "global_step": 476896, "epoch": 2838} {"train_loss": -11.742828369140625, "global_step": 476897, "epoch": 2838} {"train_loss": -11.73348331451416, "global_step": 476898, "epoch": 2838} {"train_loss": -12.192639350891113, "global_step": 476899, "epoch": 2838} {"train_loss": -11.887338638305664, "global_step": 476900, "epoch": 2838} {"train_loss": -12.405220031738281, "global_step": 476901, "epoch": 2838} {"train_loss": -12.098893165588379, "global_step": 476902, "epoch": 2838} {"train_loss": -12.194137573242188, "global_step": 476903, "epoch": 2838} {"train_loss": -12.372010231018066, "global_step": 476904, "epoch": 2838} {"train_loss": -11.952997207641602, "global_step": 476905, "epoch": 2838} {"train_loss": -12.37919807434082, "global_step": 476906, "epoch": 2838} {"train_loss": -12.564168930053711, "global_step": 476907, "epoch": 2838} {"train_loss": -12.684867858886719, "global_step": 476908, "epoch": 2838} {"train_loss": -12.634071350097656, "global_step": 476909, "epoch": 2838} {"train_loss": -12.576007843017578, "global_step": 476910, "epoch": 2838} {"train_loss": -12.596975326538086, "global_step": 476911, "epoch": 2838} {"train_loss": -12.167888641357422, "global_step": 476912, "epoch": 2838} {"train_loss": -12.279644012451172, "global_step": 476913, "epoch": 2838} {"train_loss": -12.221396446228027, "global_step": 476914, "epoch": 2838} {"train_loss": -11.731122016906738, "global_step": 476915, "epoch": 2838} {"train_loss": -12.530807495117188, "global_step": 476916, "epoch": 2838} {"train_loss": -12.049598693847656, "global_step": 476917, "epoch": 2838} {"train_loss": -11.834431648254395, "global_step": 476918, "epoch": 2838} {"train_loss": -12.440829277038574, "global_step": 476919, "epoch": 2838} {"train_loss": -12.0398588180542, "global_step": 476920, "epoch": 2838} {"train_loss": -11.83803939819336, "global_step": 476921, "epoch": 2838} {"train_loss": -12.533357620239258, "global_step": 476922, "epoch": 2838} {"train_loss": -12.206384658813477, "global_step": 476923, "epoch": 2838} {"train_loss": -12.271271705627441, "global_step": 476924, "epoch": 2838} {"train_loss": -12.50823974609375, "global_step": 476925, "epoch": 2838} {"train_loss": -12.21595287322998, "global_step": 476926, "epoch": 2838} {"train_loss": -12.263921737670898, "global_step": 476927, "epoch": 2838} {"train_loss": -12.586252212524414, "global_step": 476928, "epoch": 2838} {"train_loss": -12.190544128417969, "global_step": 476929, "epoch": 2838} {"train_loss": -12.191967964172363, "global_step": 476930, "epoch": 2838} {"train_loss": -12.832416534423828, "global_step": 476931, "epoch": 2838} {"train_loss": -12.469783782958984, "global_step": 476932, "epoch": 2838} {"train_loss": -12.611928939819336, "global_step": 476933, "epoch": 2838} {"train_loss": -12.687984466552734, "global_step": 476934, "epoch": 2838} {"train_loss": -12.550607681274414, "global_step": 476935, "epoch": 2838} {"train_loss": -12.90986442565918, "global_step": 476936, "epoch": 2838} {"train_loss": -12.546501159667969, "global_step": 476937, "epoch": 2838} {"train_loss": -12.64715576171875, "global_step": 476938, "epoch": 2838} {"train_loss": -12.75891399383545, "global_step": 476939, "epoch": 2838} {"train_loss": -12.60993766784668, "global_step": 476940, "epoch": 2838} {"train_loss": -12.675838470458984, "global_step": 476941, "epoch": 2838} {"train_loss": -12.741135597229004, "global_step": 476942, "epoch": 2838} {"train_loss": -12.654594421386719, "global_step": 476943, "epoch": 2838} {"train_loss": -12.859067916870117, "global_step": 476944, "epoch": 2838} {"train_loss": -12.897089004516602, "global_step": 476945, "epoch": 2838} {"train_loss": -12.678635597229004, "global_step": 476946, "epoch": 2838} {"train_loss": -12.764007568359375, "global_step": 476947, "epoch": 2838} {"train_loss": -12.83149528503418, "global_step": 476948, "epoch": 2838} {"train_loss": -12.483352661132812, "global_step": 476949, "epoch": 2838} {"train_loss": -12.686784744262695, "global_step": 476950, "epoch": 2838} {"train_loss": -12.282216679482232, "global_step": 476951, "epoch": 2838, "val_loss": 318519.28125} {"train_loss": -12.786700248718262, "global_step": 476952, "epoch": 2839} {"train_loss": -12.69316291809082, "global_step": 476953, "epoch": 2839} {"train_loss": -12.607059478759766, "global_step": 476954, "epoch": 2839} {"train_loss": -12.796834945678711, "global_step": 476955, "epoch": 2839} {"train_loss": -12.822534561157227, "global_step": 476956, "epoch": 2839} {"train_loss": -12.5911283493042, "global_step": 476957, "epoch": 2839} {"train_loss": -12.684480667114258, "global_step": 476958, "epoch": 2839} {"train_loss": -12.320442199707031, "global_step": 476959, "epoch": 2839} {"train_loss": -12.866254806518555, "global_step": 476960, "epoch": 2839} {"train_loss": -12.639519691467285, "global_step": 476961, "epoch": 2839} {"train_loss": -12.401548385620117, "global_step": 476962, "epoch": 2839} {"train_loss": -12.732738494873047, "global_step": 476963, "epoch": 2839} {"train_loss": -12.862725257873535, "global_step": 476964, "epoch": 2839} {"train_loss": -11.94261646270752, "global_step": 476965, "epoch": 2839} {"train_loss": -11.580928802490234, "global_step": 476966, "epoch": 2839} {"train_loss": -11.895145416259766, "global_step": 476967, "epoch": 2839} {"train_loss": -12.178573608398438, "global_step": 476968, "epoch": 2839} {"train_loss": -10.867757797241211, "global_step": 476969, "epoch": 2839} {"train_loss": -12.328542709350586, "global_step": 476970, "epoch": 2839} {"train_loss": -11.762046813964844, "global_step": 476971, "epoch": 2839} {"train_loss": -12.231864929199219, "global_step": 476972, "epoch": 2839} {"train_loss": -11.488470077514648, "global_step": 476973, "epoch": 2839} {"train_loss": -11.91006851196289, "global_step": 476974, "epoch": 2839} {"train_loss": -11.53068733215332, "global_step": 476975, "epoch": 2839} {"train_loss": -12.546839714050293, "global_step": 476976, "epoch": 2839} {"train_loss": -11.63235855102539, "global_step": 476977, "epoch": 2839} {"train_loss": -11.883089065551758, "global_step": 476978, "epoch": 2839} {"train_loss": -12.076647758483887, "global_step": 476979, "epoch": 2839} {"train_loss": -12.108538627624512, "global_step": 476980, "epoch": 2839} {"train_loss": -12.302451133728027, "global_step": 476981, "epoch": 2839} {"train_loss": -11.94416618347168, "global_step": 476982, "epoch": 2839} {"train_loss": -12.19832992553711, "global_step": 476983, "epoch": 2839} {"train_loss": -12.270609855651855, "global_step": 476984, "epoch": 2839} {"train_loss": -12.170432090759277, "global_step": 476985, "epoch": 2839} {"train_loss": -12.248930931091309, "global_step": 476986, "epoch": 2839} {"train_loss": -11.490232467651367, "global_step": 476987, "epoch": 2839} {"train_loss": -12.306503295898438, "global_step": 476988, "epoch": 2839} {"train_loss": -11.800076484680176, "global_step": 476989, "epoch": 2839} {"train_loss": -12.018138885498047, "global_step": 476990, "epoch": 2839} {"train_loss": -12.202423095703125, "global_step": 476991, "epoch": 2839} {"train_loss": -12.44279670715332, "global_step": 476992, "epoch": 2839} {"train_loss": -12.306309700012207, "global_step": 476993, "epoch": 2839} {"train_loss": -12.30788803100586, "global_step": 476994, "epoch": 2839} {"train_loss": -12.429622650146484, "global_step": 476995, "epoch": 2839} {"train_loss": -12.253612518310547, "global_step": 476996, "epoch": 2839} {"train_loss": -12.589092254638672, "global_step": 476997, "epoch": 2839} {"train_loss": -12.11375617980957, "global_step": 476998, "epoch": 2839} {"train_loss": -11.920743942260742, "global_step": 476999, "epoch": 2839} {"train_loss": -12.041412353515625, "global_step": 477000, "epoch": 2839} {"train_loss": -12.518697738647461, "global_step": 477001, "epoch": 2839} {"train_loss": -11.84610366821289, "global_step": 477002, "epoch": 2839} {"train_loss": -12.28814697265625, "global_step": 477003, "epoch": 2839} {"train_loss": -12.051589012145996, "global_step": 477004, "epoch": 2839} {"train_loss": -12.153644561767578, "global_step": 477005, "epoch": 2839} {"train_loss": -12.608834266662598, "global_step": 477006, "epoch": 2839} {"train_loss": -12.607463836669922, "global_step": 477007, "epoch": 2839} {"train_loss": -12.036515235900879, "global_step": 477008, "epoch": 2839} {"train_loss": -12.579025268554688, "global_step": 477009, "epoch": 2839} {"train_loss": -12.105398178100586, "global_step": 477010, "epoch": 2839} {"train_loss": -12.069112777709961, "global_step": 477011, "epoch": 2839} {"train_loss": -12.3336820602417, "global_step": 477012, "epoch": 2839} {"train_loss": -12.4142484664917, "global_step": 477013, "epoch": 2839} {"train_loss": -12.193185806274414, "global_step": 477014, "epoch": 2839} {"train_loss": -11.977682113647461, "global_step": 477015, "epoch": 2839} {"train_loss": -11.827981948852539, "global_step": 477016, "epoch": 2839} {"train_loss": -11.96572494506836, "global_step": 477017, "epoch": 2839} {"train_loss": -11.450370788574219, "global_step": 477018, "epoch": 2839} {"train_loss": -11.268905639648438, "global_step": 477019, "epoch": 2839} {"train_loss": -11.511472702026367, "global_step": 477020, "epoch": 2839} {"train_loss": -11.489884376525879, "global_step": 477021, "epoch": 2839} {"train_loss": -12.269956588745117, "global_step": 477022, "epoch": 2839} {"train_loss": -11.921308517456055, "global_step": 477023, "epoch": 2839} {"train_loss": -12.015097618103027, "global_step": 477024, "epoch": 2839} {"train_loss": -10.902559280395508, "global_step": 477025, "epoch": 2839} {"train_loss": -12.273386001586914, "global_step": 477026, "epoch": 2839} {"train_loss": -10.8148832321167, "global_step": 477027, "epoch": 2839} {"train_loss": -11.169797897338867, "global_step": 477028, "epoch": 2839} {"train_loss": -11.46236801147461, "global_step": 477029, "epoch": 2839} {"train_loss": -10.862154960632324, "global_step": 477030, "epoch": 2839} {"train_loss": -11.806304931640625, "global_step": 477031, "epoch": 2839} {"train_loss": -11.560568809509277, "global_step": 477032, "epoch": 2839} {"train_loss": -11.824861526489258, "global_step": 477033, "epoch": 2839} {"train_loss": -11.119142532348633, "global_step": 477034, "epoch": 2839} {"train_loss": -11.78105640411377, "global_step": 477035, "epoch": 2839} {"train_loss": -11.814458847045898, "global_step": 477036, "epoch": 2839} {"train_loss": -11.204580307006836, "global_step": 477037, "epoch": 2839} {"train_loss": -12.117447853088379, "global_step": 477038, "epoch": 2839} {"train_loss": -11.136092185974121, "global_step": 477039, "epoch": 2839} {"train_loss": -11.52419662475586, "global_step": 477040, "epoch": 2839} {"train_loss": -12.047237396240234, "global_step": 477041, "epoch": 2839} {"train_loss": -11.708276748657227, "global_step": 477042, "epoch": 2839} {"train_loss": -11.96843147277832, "global_step": 477043, "epoch": 2839} {"train_loss": -12.110645294189453, "global_step": 477044, "epoch": 2839} {"train_loss": -12.093010902404785, "global_step": 477045, "epoch": 2839} {"train_loss": -11.330073356628418, "global_step": 477046, "epoch": 2839} {"train_loss": -11.483051300048828, "global_step": 477047, "epoch": 2839} {"train_loss": -11.507065773010254, "global_step": 477048, "epoch": 2839} {"train_loss": -12.264431953430176, "global_step": 477049, "epoch": 2839} {"train_loss": -11.846077919006348, "global_step": 477050, "epoch": 2839} {"train_loss": -12.072663307189941, "global_step": 477051, "epoch": 2839} {"train_loss": -12.449207305908203, "global_step": 477052, "epoch": 2839} {"train_loss": -12.11715316772461, "global_step": 477053, "epoch": 2839} {"train_loss": -12.282301902770996, "global_step": 477054, "epoch": 2839} {"train_loss": -12.120080947875977, "global_step": 477055, "epoch": 2839} {"train_loss": -12.158937454223633, "global_step": 477056, "epoch": 2839} {"train_loss": -11.48234748840332, "global_step": 477057, "epoch": 2839} {"train_loss": -11.790124893188477, "global_step": 477058, "epoch": 2839} {"train_loss": -11.711820602416992, "global_step": 477059, "epoch": 2839} {"train_loss": -11.799225807189941, "global_step": 477060, "epoch": 2839} {"train_loss": -11.291678428649902, "global_step": 477061, "epoch": 2839} {"train_loss": -11.539104461669922, "global_step": 477062, "epoch": 2839} {"train_loss": -11.871979713439941, "global_step": 477063, "epoch": 2839} {"train_loss": -11.9364013671875, "global_step": 477064, "epoch": 2839} {"train_loss": -12.44148063659668, "global_step": 477065, "epoch": 2839} {"train_loss": -11.214557647705078, "global_step": 477066, "epoch": 2839} {"train_loss": -11.879608154296875, "global_step": 477067, "epoch": 2839} {"train_loss": -12.368515014648438, "global_step": 477068, "epoch": 2839} {"train_loss": -11.934015274047852, "global_step": 477069, "epoch": 2839} {"train_loss": -12.26061725616455, "global_step": 477070, "epoch": 2839} {"train_loss": -12.140524864196777, "global_step": 477071, "epoch": 2839} {"train_loss": -12.224740028381348, "global_step": 477072, "epoch": 2839} {"train_loss": -12.583864212036133, "global_step": 477073, "epoch": 2839} {"train_loss": -12.298789024353027, "global_step": 477074, "epoch": 2839} {"train_loss": -12.446161270141602, "global_step": 477075, "epoch": 2839} {"train_loss": -12.34190845489502, "global_step": 477076, "epoch": 2839} {"train_loss": -12.651710510253906, "global_step": 477077, "epoch": 2839} {"train_loss": -12.412667274475098, "global_step": 477078, "epoch": 2839} {"train_loss": -12.367172241210938, "global_step": 477079, "epoch": 2839} {"train_loss": -12.310364723205566, "global_step": 477080, "epoch": 2839} {"train_loss": -12.573870658874512, "global_step": 477081, "epoch": 2839} {"train_loss": -12.498023986816406, "global_step": 477082, "epoch": 2839} {"train_loss": -12.173059463500977, "global_step": 477083, "epoch": 2839} {"train_loss": -12.493249893188477, "global_step": 477084, "epoch": 2839} {"train_loss": -12.14803695678711, "global_step": 477085, "epoch": 2839} {"train_loss": -12.63577651977539, "global_step": 477086, "epoch": 2839} {"train_loss": -11.881271362304688, "global_step": 477087, "epoch": 2839} {"train_loss": -12.353339195251465, "global_step": 477088, "epoch": 2839} {"train_loss": -12.055566787719727, "global_step": 477089, "epoch": 2839} {"train_loss": -11.856796264648438, "global_step": 477090, "epoch": 2839} {"train_loss": -12.104755401611328, "global_step": 477091, "epoch": 2839} {"train_loss": -12.091469764709473, "global_step": 477092, "epoch": 2839} {"train_loss": -12.125215530395508, "global_step": 477093, "epoch": 2839} {"train_loss": -12.490194320678711, "global_step": 477094, "epoch": 2839} {"train_loss": -11.712212562561035, "global_step": 477095, "epoch": 2839} {"train_loss": -12.436408996582031, "global_step": 477096, "epoch": 2839} {"train_loss": -11.68954849243164, "global_step": 477097, "epoch": 2839} {"train_loss": -12.415159225463867, "global_step": 477098, "epoch": 2839} {"train_loss": -12.43661117553711, "global_step": 477099, "epoch": 2839} {"train_loss": -12.072376251220703, "global_step": 477100, "epoch": 2839} {"train_loss": -12.494356155395508, "global_step": 477101, "epoch": 2839} {"train_loss": -12.185213088989258, "global_step": 477102, "epoch": 2839} {"train_loss": -12.06167984008789, "global_step": 477103, "epoch": 2839} {"train_loss": -12.728202819824219, "global_step": 477104, "epoch": 2839} {"train_loss": -12.271060943603516, "global_step": 477105, "epoch": 2839} {"train_loss": -12.328007698059082, "global_step": 477106, "epoch": 2839} {"train_loss": -12.469966888427734, "global_step": 477107, "epoch": 2839} {"train_loss": -12.311841011047363, "global_step": 477108, "epoch": 2839} {"train_loss": -12.481422424316406, "global_step": 477109, "epoch": 2839} {"train_loss": -12.338052749633789, "global_step": 477110, "epoch": 2839} {"train_loss": -12.307698249816895, "global_step": 477111, "epoch": 2839} {"train_loss": -12.048967361450195, "global_step": 477112, "epoch": 2839} {"train_loss": -12.395194053649902, "global_step": 477113, "epoch": 2839} {"train_loss": -12.370030403137207, "global_step": 477114, "epoch": 2839} {"train_loss": -12.762739181518555, "global_step": 477115, "epoch": 2839} {"train_loss": -12.176780700683594, "global_step": 477116, "epoch": 2839} {"train_loss": -12.765878677368164, "global_step": 477117, "epoch": 2839} {"train_loss": -12.428535461425781, "global_step": 477118, "epoch": 2839} {"train_loss": -12.092952943983532, "global_step": 477119, "epoch": 2839, "val_loss": 317775.6875} {"train_loss": -12.70737075805664, "global_step": 477120, "epoch": 2840} {"train_loss": -12.246715545654297, "global_step": 477121, "epoch": 2840} {"train_loss": -12.818792343139648, "global_step": 477122, "epoch": 2840} {"train_loss": -12.578149795532227, "global_step": 477123, "epoch": 2840} {"train_loss": -12.70869255065918, "global_step": 477124, "epoch": 2840} {"train_loss": -12.557645797729492, "global_step": 477125, "epoch": 2840} {"train_loss": -12.500446319580078, "global_step": 477126, "epoch": 2840} {"train_loss": -12.770650863647461, "global_step": 477127, "epoch": 2840} {"train_loss": -12.721284866333008, "global_step": 477128, "epoch": 2840} {"train_loss": -12.719121932983398, "global_step": 477129, "epoch": 2840} {"train_loss": -12.667440414428711, "global_step": 477130, "epoch": 2840} {"train_loss": -12.593944549560547, "global_step": 477131, "epoch": 2840} {"train_loss": -12.665949821472168, "global_step": 477132, "epoch": 2840} {"train_loss": -12.429585456848145, "global_step": 477133, "epoch": 2840} {"train_loss": -12.429500579833984, "global_step": 477134, "epoch": 2840} {"train_loss": -12.667522430419922, "global_step": 477135, "epoch": 2840} {"train_loss": -12.644523620605469, "global_step": 477136, "epoch": 2840} {"train_loss": -12.569660186767578, "global_step": 477137, "epoch": 2840} {"train_loss": -12.81008529663086, "global_step": 477138, "epoch": 2840} {"train_loss": -12.53515625, "global_step": 477139, "epoch": 2840} {"train_loss": -12.496444702148438, "global_step": 477140, "epoch": 2840} {"train_loss": -12.55904483795166, "global_step": 477141, "epoch": 2840} {"train_loss": -12.518845558166504, "global_step": 477142, "epoch": 2840} {"train_loss": -12.145355224609375, "global_step": 477143, "epoch": 2840} {"train_loss": -12.525318145751953, "global_step": 477144, "epoch": 2840} {"train_loss": -12.087665557861328, "global_step": 477145, "epoch": 2840} {"train_loss": -12.42507266998291, "global_step": 477146, "epoch": 2840} {"train_loss": -12.69155502319336, "global_step": 477147, "epoch": 2840} {"train_loss": -12.097878456115723, "global_step": 477148, "epoch": 2840} {"train_loss": -12.545568466186523, "global_step": 477149, "epoch": 2840} {"train_loss": -12.49703598022461, "global_step": 477150, "epoch": 2840} {"train_loss": -11.997733116149902, "global_step": 477151, "epoch": 2840} {"train_loss": -12.373080253601074, "global_step": 477152, "epoch": 2840} {"train_loss": -12.846827507019043, "global_step": 477153, "epoch": 2840} {"train_loss": -12.270478248596191, "global_step": 477154, "epoch": 2840} {"train_loss": -12.297219276428223, "global_step": 477155, "epoch": 2840} {"train_loss": -12.888315200805664, "global_step": 477156, "epoch": 2840} {"train_loss": -12.284997940063477, "global_step": 477157, "epoch": 2840} {"train_loss": -12.407815933227539, "global_step": 477158, "epoch": 2840} {"train_loss": -12.770532608032227, "global_step": 477159, "epoch": 2840} {"train_loss": -12.726699829101562, "global_step": 477160, "epoch": 2840} {"train_loss": -12.485757827758789, "global_step": 477161, "epoch": 2840} {"train_loss": -12.721776008605957, "global_step": 477162, "epoch": 2840} {"train_loss": -12.943524360656738, "global_step": 477163, "epoch": 2840} {"train_loss": -12.883920669555664, "global_step": 477164, "epoch": 2840} {"train_loss": -12.826103210449219, "global_step": 477165, "epoch": 2840} {"train_loss": -12.706827163696289, "global_step": 477166, "epoch": 2840} {"train_loss": -12.830912590026855, "global_step": 477167, "epoch": 2840} {"train_loss": -12.767400741577148, "global_step": 477168, "epoch": 2840} {"train_loss": -12.992965698242188, "global_step": 477169, "epoch": 2840} {"train_loss": -13.033329010009766, "global_step": 477170, "epoch": 2840} {"train_loss": -12.993650436401367, "global_step": 477171, "epoch": 2840} {"train_loss": -12.92365550994873, "global_step": 477172, "epoch": 2840} {"train_loss": -12.976759910583496, "global_step": 477173, "epoch": 2840} {"train_loss": -13.043880462646484, "global_step": 477174, "epoch": 2840} {"train_loss": -12.874954223632812, "global_step": 477175, "epoch": 2840} {"train_loss": -12.902416229248047, "global_step": 477176, "epoch": 2840} {"train_loss": -12.856729507446289, "global_step": 477177, "epoch": 2840} {"train_loss": -13.002769470214844, "global_step": 477178, "epoch": 2840} {"train_loss": -12.88261604309082, "global_step": 477179, "epoch": 2840} {"train_loss": -12.952654838562012, "global_step": 477180, "epoch": 2840} {"train_loss": -13.099357604980469, "global_step": 477181, "epoch": 2840} {"train_loss": -13.1196928024292, "global_step": 477182, "epoch": 2840} {"train_loss": -13.091939926147461, "global_step": 477183, "epoch": 2840} {"train_loss": -13.069079399108887, "global_step": 477184, "epoch": 2840} {"train_loss": -12.729228973388672, "global_step": 477185, "epoch": 2840} {"train_loss": -12.873435974121094, "global_step": 477186, "epoch": 2840} {"train_loss": -13.00212574005127, "global_step": 477187, "epoch": 2840} {"train_loss": -13.013345718383789, "global_step": 477188, "epoch": 2840} {"train_loss": -12.577667236328125, "global_step": 477189, "epoch": 2840} {"train_loss": -12.235677719116211, "global_step": 477190, "epoch": 2840} {"train_loss": -12.267672538757324, "global_step": 477191, "epoch": 2840} {"train_loss": -12.588077545166016, "global_step": 477192, "epoch": 2840} {"train_loss": -12.62401294708252, "global_step": 477193, "epoch": 2840} {"train_loss": -12.968476295471191, "global_step": 477194, "epoch": 2840} {"train_loss": -12.473286628723145, "global_step": 477195, "epoch": 2840} {"train_loss": -12.077495574951172, "global_step": 477196, "epoch": 2840} {"train_loss": -11.871315002441406, "global_step": 477197, "epoch": 2840} {"train_loss": -12.671480178833008, "global_step": 477198, "epoch": 2840} {"train_loss": -12.440910339355469, "global_step": 477199, "epoch": 2840} {"train_loss": -12.013420104980469, "global_step": 477200, "epoch": 2840} {"train_loss": -10.958582878112793, "global_step": 477201, "epoch": 2840} {"train_loss": -11.990802764892578, "global_step": 477202, "epoch": 2840} {"train_loss": -11.684686660766602, "global_step": 477203, "epoch": 2840} {"train_loss": -10.961601257324219, "global_step": 477204, "epoch": 2840} {"train_loss": -11.333723068237305, "global_step": 477205, "epoch": 2840} {"train_loss": -12.416120529174805, "global_step": 477206, "epoch": 2840} {"train_loss": -12.134498596191406, "global_step": 477207, "epoch": 2840} {"train_loss": -12.287652015686035, "global_step": 477208, "epoch": 2840} {"train_loss": -12.313051223754883, "global_step": 477209, "epoch": 2840} {"train_loss": -12.64929485321045, "global_step": 477210, "epoch": 2840} {"train_loss": -12.526594161987305, "global_step": 477211, "epoch": 2840} {"train_loss": -12.295585632324219, "global_step": 477212, "epoch": 2840} {"train_loss": -12.605890274047852, "global_step": 477213, "epoch": 2840} {"train_loss": -12.049601554870605, "global_step": 477214, "epoch": 2840} {"train_loss": -12.789533615112305, "global_step": 477215, "epoch": 2840} {"train_loss": -12.409832000732422, "global_step": 477216, "epoch": 2840} {"train_loss": -12.276344299316406, "global_step": 477217, "epoch": 2840} {"train_loss": -11.72111701965332, "global_step": 477218, "epoch": 2840} {"train_loss": -12.323731422424316, "global_step": 477219, "epoch": 2840} {"train_loss": -11.747737884521484, "global_step": 477220, "epoch": 2840} {"train_loss": -11.12971019744873, "global_step": 477221, "epoch": 2840} {"train_loss": -11.07080078125, "global_step": 477222, "epoch": 2840} {"train_loss": -11.043218612670898, "global_step": 477223, "epoch": 2840} {"train_loss": -11.227259635925293, "global_step": 477224, "epoch": 2840} {"train_loss": -11.838401794433594, "global_step": 477225, "epoch": 2840} {"train_loss": -11.683820724487305, "global_step": 477226, "epoch": 2840} {"train_loss": -10.186531066894531, "global_step": 477227, "epoch": 2840} {"train_loss": -11.387526512145996, "global_step": 477228, "epoch": 2840} {"train_loss": -11.492142677307129, "global_step": 477229, "epoch": 2840} {"train_loss": -10.784530639648438, "global_step": 477230, "epoch": 2840} {"train_loss": -10.901774406433105, "global_step": 477231, "epoch": 2840} {"train_loss": -10.257298469543457, "global_step": 477232, "epoch": 2840} {"train_loss": -10.382760047912598, "global_step": 477233, "epoch": 2840} {"train_loss": -10.93095588684082, "global_step": 477234, "epoch": 2840} {"train_loss": -9.666702270507812, "global_step": 477235, "epoch": 2840} {"train_loss": -10.091514587402344, "global_step": 477236, "epoch": 2840} {"train_loss": -9.139579772949219, "global_step": 477237, "epoch": 2840} {"train_loss": -9.457952499389648, "global_step": 477238, "epoch": 2840} {"train_loss": -9.948490142822266, "global_step": 477239, "epoch": 2840} {"train_loss": -9.613932609558105, "global_step": 477240, "epoch": 2840} {"train_loss": -9.928581237792969, "global_step": 477241, "epoch": 2840} {"train_loss": -11.032511711120605, "global_step": 477242, "epoch": 2840} {"train_loss": -10.018735885620117, "global_step": 477243, "epoch": 2840} {"train_loss": -9.658330917358398, "global_step": 477244, "epoch": 2840} {"train_loss": -11.588458061218262, "global_step": 477245, "epoch": 2840} {"train_loss": -9.919265747070312, "global_step": 477246, "epoch": 2840} {"train_loss": -10.952089309692383, "global_step": 477247, "epoch": 2840} {"train_loss": -11.291272163391113, "global_step": 477248, "epoch": 2840} {"train_loss": -11.219651222229004, "global_step": 477249, "epoch": 2840} {"train_loss": -11.009988784790039, "global_step": 477250, "epoch": 2840} {"train_loss": -11.283618927001953, "global_step": 477251, "epoch": 2840} {"train_loss": -11.673648834228516, "global_step": 477252, "epoch": 2840} {"train_loss": -11.031208038330078, "global_step": 477253, "epoch": 2840} {"train_loss": -11.68618392944336, "global_step": 477254, "epoch": 2840} {"train_loss": -11.076299667358398, "global_step": 477255, "epoch": 2840} {"train_loss": -11.644271850585938, "global_step": 477256, "epoch": 2840} {"train_loss": -11.245543479919434, "global_step": 477257, "epoch": 2840} {"train_loss": -11.70732307434082, "global_step": 477258, "epoch": 2840} {"train_loss": -12.132734298706055, "global_step": 477259, "epoch": 2840} {"train_loss": -11.370122909545898, "global_step": 477260, "epoch": 2840} {"train_loss": -11.655133247375488, "global_step": 477261, "epoch": 2840} {"train_loss": -11.788707733154297, "global_step": 477262, "epoch": 2840} {"train_loss": -11.656940460205078, "global_step": 477263, "epoch": 2840} {"train_loss": -11.05324935913086, "global_step": 477264, "epoch": 2840} {"train_loss": -12.098254203796387, "global_step": 477265, "epoch": 2840} {"train_loss": -11.337315559387207, "global_step": 477266, "epoch": 2840} {"train_loss": -11.695444107055664, "global_step": 477267, "epoch": 2840} {"train_loss": -11.58523178100586, "global_step": 477268, "epoch": 2840} {"train_loss": -11.932394027709961, "global_step": 477269, "epoch": 2840} {"train_loss": -11.271833419799805, "global_step": 477270, "epoch": 2840} {"train_loss": -12.15147590637207, "global_step": 477271, "epoch": 2840} {"train_loss": -11.49534797668457, "global_step": 477272, "epoch": 2840} {"train_loss": -12.456600189208984, "global_step": 477273, "epoch": 2840} {"train_loss": -11.903036117553711, "global_step": 477274, "epoch": 2840} {"train_loss": -12.171335220336914, "global_step": 477275, "epoch": 2840} {"train_loss": -12.260152816772461, "global_step": 477276, "epoch": 2840} {"train_loss": -11.757678031921387, "global_step": 477277, "epoch": 2840} {"train_loss": -12.252082824707031, "global_step": 477278, "epoch": 2840} {"train_loss": -12.18332290649414, "global_step": 477279, "epoch": 2840} {"train_loss": -12.529449462890625, "global_step": 477280, "epoch": 2840} {"train_loss": -12.17567253112793, "global_step": 477281, "epoch": 2840} {"train_loss": -12.495988845825195, "global_step": 477282, "epoch": 2840} {"train_loss": -12.155529022216797, "global_step": 477283, "epoch": 2840} {"train_loss": -12.479589462280273, "global_step": 477284, "epoch": 2840} {"train_loss": -12.098755836486816, "global_step": 477285, "epoch": 2840} {"train_loss": -12.520929336547852, "global_step": 477286, "epoch": 2840} {"train_loss": -12.041426045554024, "global_step": 477287, "epoch": 2840, "val_loss": 312197.1875, "train_action_mse_error": 1.792036533355713} {"train_loss": -12.547218322753906, "global_step": 477288, "epoch": 2841} {"train_loss": -12.34787368774414, "global_step": 477289, "epoch": 2841} {"train_loss": -12.471282958984375, "global_step": 477290, "epoch": 2841} {"train_loss": -12.388370513916016, "global_step": 477291, "epoch": 2841} {"train_loss": -12.083172798156738, "global_step": 477292, "epoch": 2841} {"train_loss": -12.5494384765625, "global_step": 477293, "epoch": 2841} {"train_loss": -12.223560333251953, "global_step": 477294, "epoch": 2841} {"train_loss": -12.506635665893555, "global_step": 477295, "epoch": 2841} {"train_loss": -12.134626388549805, "global_step": 477296, "epoch": 2841} {"train_loss": -12.586139678955078, "global_step": 477297, "epoch": 2841} {"train_loss": -12.595724105834961, "global_step": 477298, "epoch": 2841} {"train_loss": -12.448902130126953, "global_step": 477299, "epoch": 2841} {"train_loss": -12.744842529296875, "global_step": 477300, "epoch": 2841} {"train_loss": -12.700370788574219, "global_step": 477301, "epoch": 2841} {"train_loss": -12.741941452026367, "global_step": 477302, "epoch": 2841} {"train_loss": -12.574594497680664, "global_step": 477303, "epoch": 2841} {"train_loss": -12.21062183380127, "global_step": 477304, "epoch": 2841} {"train_loss": -12.74766731262207, "global_step": 477305, "epoch": 2841} {"train_loss": -12.732423782348633, "global_step": 477306, "epoch": 2841} {"train_loss": -12.637563705444336, "global_step": 477307, "epoch": 2841} {"train_loss": -12.767902374267578, "global_step": 477308, "epoch": 2841} {"train_loss": -12.57233715057373, "global_step": 477309, "epoch": 2841} {"train_loss": -12.806680679321289, "global_step": 477310, "epoch": 2841} {"train_loss": -12.66270637512207, "global_step": 477311, "epoch": 2841} {"train_loss": -12.670387268066406, "global_step": 477312, "epoch": 2841} {"train_loss": -12.933967590332031, "global_step": 477313, "epoch": 2841} {"train_loss": -12.680293083190918, "global_step": 477314, "epoch": 2841} {"train_loss": -12.66387939453125, "global_step": 477315, "epoch": 2841} {"train_loss": -12.804876327514648, "global_step": 477316, "epoch": 2841} {"train_loss": -12.731128692626953, "global_step": 477317, "epoch": 2841} {"train_loss": -12.673540115356445, "global_step": 477318, "epoch": 2841} {"train_loss": -12.85037899017334, "global_step": 477319, "epoch": 2841} {"train_loss": -12.906936645507812, "global_step": 477320, "epoch": 2841} {"train_loss": -12.63644790649414, "global_step": 477321, "epoch": 2841} {"train_loss": -12.729509353637695, "global_step": 477322, "epoch": 2841} {"train_loss": -12.570154190063477, "global_step": 477323, "epoch": 2841} {"train_loss": -12.772995948791504, "global_step": 477324, "epoch": 2841} {"train_loss": -12.659911155700684, "global_step": 477325, "epoch": 2841} {"train_loss": -12.66867446899414, "global_step": 477326, "epoch": 2841} {"train_loss": -12.902718544006348, "global_step": 477327, "epoch": 2841} {"train_loss": -12.839737892150879, "global_step": 477328, "epoch": 2841} {"train_loss": -12.275389671325684, "global_step": 477329, "epoch": 2841} {"train_loss": -12.924951553344727, "global_step": 477330, "epoch": 2841} {"train_loss": -12.877331733703613, "global_step": 477331, "epoch": 2841} {"train_loss": -12.405949592590332, "global_step": 477332, "epoch": 2841} {"train_loss": -12.743368148803711, "global_step": 477333, "epoch": 2841} {"train_loss": -12.69462776184082, "global_step": 477334, "epoch": 2841} {"train_loss": -12.313228607177734, "global_step": 477335, "epoch": 2841} {"train_loss": -12.614457130432129, "global_step": 477336, "epoch": 2841} {"train_loss": -12.242044448852539, "global_step": 477337, "epoch": 2841} {"train_loss": -12.32400894165039, "global_step": 477338, "epoch": 2841} {"train_loss": -12.79356861114502, "global_step": 477339, "epoch": 2841} {"train_loss": -12.283548355102539, "global_step": 477340, "epoch": 2841} {"train_loss": -12.094404220581055, "global_step": 477341, "epoch": 2841} {"train_loss": -12.51817512512207, "global_step": 477342, "epoch": 2841} {"train_loss": -11.849610328674316, "global_step": 477343, "epoch": 2841} {"train_loss": -12.339719772338867, "global_step": 477344, "epoch": 2841} {"train_loss": -12.278820037841797, "global_step": 477345, "epoch": 2841} {"train_loss": -12.239526748657227, "global_step": 477346, "epoch": 2841} {"train_loss": -12.496126174926758, "global_step": 477347, "epoch": 2841} {"train_loss": -12.4191255569458, "global_step": 477348, "epoch": 2841} {"train_loss": -12.45418930053711, "global_step": 477349, "epoch": 2841} {"train_loss": -12.467903137207031, "global_step": 477350, "epoch": 2841} {"train_loss": -12.454330444335938, "global_step": 477351, "epoch": 2841} {"train_loss": -12.361679077148438, "global_step": 477352, "epoch": 2841} {"train_loss": -12.24609375, "global_step": 477353, "epoch": 2841} {"train_loss": -12.617753982543945, "global_step": 477354, "epoch": 2841} {"train_loss": -12.675182342529297, "global_step": 477355, "epoch": 2841} {"train_loss": -12.313941955566406, "global_step": 477356, "epoch": 2841} {"train_loss": -12.636642456054688, "global_step": 477357, "epoch": 2841} {"train_loss": -12.290654182434082, "global_step": 477358, "epoch": 2841} {"train_loss": -12.671037673950195, "global_step": 477359, "epoch": 2841} {"train_loss": -12.204150199890137, "global_step": 477360, "epoch": 2841} {"train_loss": -11.352569580078125, "global_step": 477361, "epoch": 2841} {"train_loss": -12.736570358276367, "global_step": 477362, "epoch": 2841} {"train_loss": -12.096931457519531, "global_step": 477363, "epoch": 2841} {"train_loss": -11.995256423950195, "global_step": 477364, "epoch": 2841} {"train_loss": -12.04145622253418, "global_step": 477365, "epoch": 2841} {"train_loss": -12.05832290649414, "global_step": 477366, "epoch": 2841} {"train_loss": -11.565695762634277, "global_step": 477367, "epoch": 2841} {"train_loss": -12.399396896362305, "global_step": 477368, "epoch": 2841} {"train_loss": -12.564764022827148, "global_step": 477369, "epoch": 2841} {"train_loss": -12.290728569030762, "global_step": 477370, "epoch": 2841} {"train_loss": -12.461366653442383, "global_step": 477371, "epoch": 2841} {"train_loss": -12.664639472961426, "global_step": 477372, "epoch": 2841} {"train_loss": -12.680788040161133, "global_step": 477373, "epoch": 2841} {"train_loss": -12.213602066040039, "global_step": 477374, "epoch": 2841} {"train_loss": -12.03603744506836, "global_step": 477375, "epoch": 2841} {"train_loss": -11.923675537109375, "global_step": 477376, "epoch": 2841} {"train_loss": -12.239482879638672, "global_step": 477377, "epoch": 2841} {"train_loss": -12.16148853302002, "global_step": 477378, "epoch": 2841} {"train_loss": -10.46807861328125, "global_step": 477379, "epoch": 2841} {"train_loss": -12.042848587036133, "global_step": 477380, "epoch": 2841} {"train_loss": -11.6070556640625, "global_step": 477381, "epoch": 2841} {"train_loss": -11.347832679748535, "global_step": 477382, "epoch": 2841} {"train_loss": -12.076682090759277, "global_step": 477383, "epoch": 2841} {"train_loss": -11.668764114379883, "global_step": 477384, "epoch": 2841} {"train_loss": -12.450841903686523, "global_step": 477385, "epoch": 2841} {"train_loss": -11.741853713989258, "global_step": 477386, "epoch": 2841} {"train_loss": -11.735507011413574, "global_step": 477387, "epoch": 2841} {"train_loss": -11.49604606628418, "global_step": 477388, "epoch": 2841} {"train_loss": -12.317550659179688, "global_step": 477389, "epoch": 2841} {"train_loss": -11.934642791748047, "global_step": 477390, "epoch": 2841} {"train_loss": -12.687256813049316, "global_step": 477391, "epoch": 2841} {"train_loss": -12.167494773864746, "global_step": 477392, "epoch": 2841} {"train_loss": -12.233609199523926, "global_step": 477393, "epoch": 2841} {"train_loss": -12.243608474731445, "global_step": 477394, "epoch": 2841} {"train_loss": -11.892778396606445, "global_step": 477395, "epoch": 2841} {"train_loss": -12.564739227294922, "global_step": 477396, "epoch": 2841} {"train_loss": -12.001578330993652, "global_step": 477397, "epoch": 2841} {"train_loss": -12.519186973571777, "global_step": 477398, "epoch": 2841} {"train_loss": -12.184812545776367, "global_step": 477399, "epoch": 2841} {"train_loss": -12.72046184539795, "global_step": 477400, "epoch": 2841} {"train_loss": -12.256279945373535, "global_step": 477401, "epoch": 2841} {"train_loss": -12.537757873535156, "global_step": 477402, "epoch": 2841} {"train_loss": -12.238165855407715, "global_step": 477403, "epoch": 2841} {"train_loss": -12.532231330871582, "global_step": 477404, "epoch": 2841} {"train_loss": -12.50716495513916, "global_step": 477405, "epoch": 2841} {"train_loss": -12.214576721191406, "global_step": 477406, "epoch": 2841} {"train_loss": -12.745132446289062, "global_step": 477407, "epoch": 2841} {"train_loss": -12.514472007751465, "global_step": 477408, "epoch": 2841} {"train_loss": -12.75750732421875, "global_step": 477409, "epoch": 2841} {"train_loss": -12.468257904052734, "global_step": 477410, "epoch": 2841} {"train_loss": -12.971714973449707, "global_step": 477411, "epoch": 2841} {"train_loss": -12.512970924377441, "global_step": 477412, "epoch": 2841} {"train_loss": -12.492548942565918, "global_step": 477413, "epoch": 2841} {"train_loss": -12.424982070922852, "global_step": 477414, "epoch": 2841} {"train_loss": -12.481937408447266, "global_step": 477415, "epoch": 2841} {"train_loss": -12.634102821350098, "global_step": 477416, "epoch": 2841} {"train_loss": -12.184892654418945, "global_step": 477417, "epoch": 2841} {"train_loss": -12.434051513671875, "global_step": 477418, "epoch": 2841} {"train_loss": -12.239473342895508, "global_step": 477419, "epoch": 2841} {"train_loss": -12.012922286987305, "global_step": 477420, "epoch": 2841} {"train_loss": -12.648138046264648, "global_step": 477421, "epoch": 2841} {"train_loss": -12.326166152954102, "global_step": 477422, "epoch": 2841} {"train_loss": -12.756563186645508, "global_step": 477423, "epoch": 2841} {"train_loss": -12.479448318481445, "global_step": 477424, "epoch": 2841} {"train_loss": -12.691913604736328, "global_step": 477425, "epoch": 2841} {"train_loss": -12.577001571655273, "global_step": 477426, "epoch": 2841} {"train_loss": -12.64638900756836, "global_step": 477427, "epoch": 2841} {"train_loss": -12.391853332519531, "global_step": 477428, "epoch": 2841} {"train_loss": -12.602991104125977, "global_step": 477429, "epoch": 2841} {"train_loss": -12.117976188659668, "global_step": 477430, "epoch": 2841} {"train_loss": -12.270039558410645, "global_step": 477431, "epoch": 2841} {"train_loss": -12.404560089111328, "global_step": 477432, "epoch": 2841} {"train_loss": -11.976221084594727, "global_step": 477433, "epoch": 2841} {"train_loss": -12.575599670410156, "global_step": 477434, "epoch": 2841} {"train_loss": -12.447413444519043, "global_step": 477435, "epoch": 2841} {"train_loss": -11.154373168945312, "global_step": 477436, "epoch": 2841} {"train_loss": -12.28164291381836, "global_step": 477437, "epoch": 2841} {"train_loss": -12.732558250427246, "global_step": 477438, "epoch": 2841} {"train_loss": -11.557107925415039, "global_step": 477439, "epoch": 2841} {"train_loss": -11.779916763305664, "global_step": 477440, "epoch": 2841} {"train_loss": -12.325109481811523, "global_step": 477441, "epoch": 2841} {"train_loss": -12.918281555175781, "global_step": 477442, "epoch": 2841} {"train_loss": -12.493429183959961, "global_step": 477443, "epoch": 2841} {"train_loss": -12.745641708374023, "global_step": 477444, "epoch": 2841} {"train_loss": -12.46200180053711, "global_step": 477445, "epoch": 2841} {"train_loss": -12.393716812133789, "global_step": 477446, "epoch": 2841} {"train_loss": -12.606414794921875, "global_step": 477447, "epoch": 2841} {"train_loss": -12.156612396240234, "global_step": 477448, "epoch": 2841} {"train_loss": -11.959905624389648, "global_step": 477449, "epoch": 2841} {"train_loss": -12.089113235473633, "global_step": 477450, "epoch": 2841} {"train_loss": -12.057138442993164, "global_step": 477451, "epoch": 2841} {"train_loss": -11.588897705078125, "global_step": 477452, "epoch": 2841} {"train_loss": -12.217828750610352, "global_step": 477453, "epoch": 2841} {"train_loss": -12.161779403686523, "global_step": 477454, "epoch": 2841} {"train_loss": -12.376925491151356, "global_step": 477455, "epoch": 2841, "val_loss": 318261.9375} {"train_loss": -12.310432434082031, "global_step": 477456, "epoch": 2842} {"train_loss": -12.229018211364746, "global_step": 477457, "epoch": 2842} {"train_loss": -11.693970680236816, "global_step": 477458, "epoch": 2842} {"train_loss": -12.629814147949219, "global_step": 477459, "epoch": 2842} {"train_loss": -11.56241226196289, "global_step": 477460, "epoch": 2842} {"train_loss": -12.211135864257812, "global_step": 477461, "epoch": 2842} {"train_loss": -12.32984733581543, "global_step": 477462, "epoch": 2842} {"train_loss": -12.544881820678711, "global_step": 477463, "epoch": 2842} {"train_loss": -11.93328857421875, "global_step": 477464, "epoch": 2842} {"train_loss": -12.475589752197266, "global_step": 477465, "epoch": 2842} {"train_loss": -11.868877410888672, "global_step": 477466, "epoch": 2842} {"train_loss": -12.521894454956055, "global_step": 477467, "epoch": 2842} {"train_loss": -11.466715812683105, "global_step": 477468, "epoch": 2842} {"train_loss": -11.991844177246094, "global_step": 477469, "epoch": 2842} {"train_loss": -12.335599899291992, "global_step": 477470, "epoch": 2842} {"train_loss": -12.238460540771484, "global_step": 477471, "epoch": 2842} {"train_loss": -11.700956344604492, "global_step": 477472, "epoch": 2842} {"train_loss": -12.40821647644043, "global_step": 477473, "epoch": 2842} {"train_loss": -10.287586212158203, "global_step": 477474, "epoch": 2842} {"train_loss": -12.144586563110352, "global_step": 477475, "epoch": 2842} {"train_loss": -12.300698280334473, "global_step": 477476, "epoch": 2842} {"train_loss": -11.720012664794922, "global_step": 477477, "epoch": 2842} {"train_loss": -11.962416648864746, "global_step": 477478, "epoch": 2842} {"train_loss": -12.141767501831055, "global_step": 477479, "epoch": 2842} {"train_loss": -10.925387382507324, "global_step": 477480, "epoch": 2842} {"train_loss": -12.151351928710938, "global_step": 477481, "epoch": 2842} {"train_loss": -12.628931045532227, "global_step": 477482, "epoch": 2842} {"train_loss": -11.886717796325684, "global_step": 477483, "epoch": 2842} {"train_loss": -12.214733123779297, "global_step": 477484, "epoch": 2842} {"train_loss": -10.023366928100586, "global_step": 477485, "epoch": 2842} {"train_loss": -12.033914566040039, "global_step": 477486, "epoch": 2842} {"train_loss": -11.867597579956055, "global_step": 477487, "epoch": 2842} {"train_loss": -11.166740417480469, "global_step": 477488, "epoch": 2842} {"train_loss": -11.395208358764648, "global_step": 477489, "epoch": 2842} {"train_loss": -10.656661987304688, "global_step": 477490, "epoch": 2842} {"train_loss": -10.366094589233398, "global_step": 477491, "epoch": 2842} {"train_loss": -11.018712997436523, "global_step": 477492, "epoch": 2842} {"train_loss": -11.358341217041016, "global_step": 477493, "epoch": 2842} {"train_loss": -11.733297348022461, "global_step": 477494, "epoch": 2842} {"train_loss": -11.696516990661621, "global_step": 477495, "epoch": 2842} {"train_loss": -12.090511322021484, "global_step": 477496, "epoch": 2842} {"train_loss": -11.609455108642578, "global_step": 477497, "epoch": 2842} {"train_loss": -12.32302188873291, "global_step": 477498, "epoch": 2842} {"train_loss": -12.245489120483398, "global_step": 477499, "epoch": 2842} {"train_loss": -11.936278343200684, "global_step": 477500, "epoch": 2842} {"train_loss": -12.00388240814209, "global_step": 477501, "epoch": 2842} {"train_loss": -11.633893013000488, "global_step": 477502, "epoch": 2842} {"train_loss": -11.687070846557617, "global_step": 477503, "epoch": 2842} {"train_loss": -12.20309829711914, "global_step": 477504, "epoch": 2842} {"train_loss": -11.295249938964844, "global_step": 477505, "epoch": 2842} {"train_loss": -12.046538352966309, "global_step": 477506, "epoch": 2842} {"train_loss": -11.497925758361816, "global_step": 477507, "epoch": 2842} {"train_loss": -12.48180866241455, "global_step": 477508, "epoch": 2842} {"train_loss": -11.579025268554688, "global_step": 477509, "epoch": 2842} {"train_loss": -12.363598823547363, "global_step": 477510, "epoch": 2842} {"train_loss": -12.109838485717773, "global_step": 477511, "epoch": 2842} {"train_loss": -11.717991828918457, "global_step": 477512, "epoch": 2842} {"train_loss": -12.25383472442627, "global_step": 477513, "epoch": 2842} {"train_loss": -11.545757293701172, "global_step": 477514, "epoch": 2842} {"train_loss": -12.515226364135742, "global_step": 477515, "epoch": 2842} {"train_loss": -12.044355392456055, "global_step": 477516, "epoch": 2842} {"train_loss": -12.387822151184082, "global_step": 477517, "epoch": 2842} {"train_loss": -12.153956413269043, "global_step": 477518, "epoch": 2842} {"train_loss": -12.057294845581055, "global_step": 477519, "epoch": 2842} {"train_loss": -12.090656280517578, "global_step": 477520, "epoch": 2842} {"train_loss": -12.419998168945312, "global_step": 477521, "epoch": 2842} {"train_loss": -12.369373321533203, "global_step": 477522, "epoch": 2842} {"train_loss": -12.42503547668457, "global_step": 477523, "epoch": 2842} {"train_loss": -12.5007905960083, "global_step": 477524, "epoch": 2842} {"train_loss": -12.086902618408203, "global_step": 477525, "epoch": 2842} {"train_loss": -12.647263526916504, "global_step": 477526, "epoch": 2842} {"train_loss": -12.424341201782227, "global_step": 477527, "epoch": 2842} {"train_loss": -12.362516403198242, "global_step": 477528, "epoch": 2842} {"train_loss": -12.865309715270996, "global_step": 477529, "epoch": 2842} {"train_loss": -12.562274932861328, "global_step": 477530, "epoch": 2842} {"train_loss": -12.49233627319336, "global_step": 477531, "epoch": 2842} {"train_loss": -12.468619346618652, "global_step": 477532, "epoch": 2842} {"train_loss": -12.613191604614258, "global_step": 477533, "epoch": 2842} {"train_loss": -12.737635612487793, "global_step": 477534, "epoch": 2842} {"train_loss": -12.660375595092773, "global_step": 477535, "epoch": 2842} {"train_loss": -12.696440696716309, "global_step": 477536, "epoch": 2842} {"train_loss": -12.75979232788086, "global_step": 477537, "epoch": 2842} {"train_loss": -12.571803092956543, "global_step": 477538, "epoch": 2842} {"train_loss": -12.717517852783203, "global_step": 477539, "epoch": 2842} {"train_loss": -12.732515335083008, "global_step": 477540, "epoch": 2842} {"train_loss": -12.823928833007812, "global_step": 477541, "epoch": 2842} {"train_loss": -12.69194221496582, "global_step": 477542, "epoch": 2842} {"train_loss": -12.652190208435059, "global_step": 477543, "epoch": 2842} {"train_loss": -12.680774688720703, "global_step": 477544, "epoch": 2842} {"train_loss": -12.578614234924316, "global_step": 477545, "epoch": 2842} {"train_loss": -12.520421981811523, "global_step": 477546, "epoch": 2842} {"train_loss": -12.824982643127441, "global_step": 477547, "epoch": 2842} {"train_loss": -12.777145385742188, "global_step": 477548, "epoch": 2842} {"train_loss": -12.472553253173828, "global_step": 477549, "epoch": 2842} {"train_loss": -12.884371757507324, "global_step": 477550, "epoch": 2842} {"train_loss": -12.460586547851562, "global_step": 477551, "epoch": 2842} {"train_loss": -13.039649963378906, "global_step": 477552, "epoch": 2842} {"train_loss": -12.718608856201172, "global_step": 477553, "epoch": 2842} {"train_loss": -12.674561500549316, "global_step": 477554, "epoch": 2842} {"train_loss": -12.729272842407227, "global_step": 477555, "epoch": 2842} {"train_loss": -12.958250999450684, "global_step": 477556, "epoch": 2842} {"train_loss": -12.539949417114258, "global_step": 477557, "epoch": 2842} {"train_loss": -12.864914894104004, "global_step": 477558, "epoch": 2842} {"train_loss": -12.91649055480957, "global_step": 477559, "epoch": 2842} {"train_loss": -12.78853702545166, "global_step": 477560, "epoch": 2842} {"train_loss": -13.034440994262695, "global_step": 477561, "epoch": 2842} {"train_loss": -12.85893440246582, "global_step": 477562, "epoch": 2842} {"train_loss": -12.57995891571045, "global_step": 477563, "epoch": 2842} {"train_loss": -12.458070755004883, "global_step": 477564, "epoch": 2842} {"train_loss": -12.993046760559082, "global_step": 477565, "epoch": 2842} {"train_loss": -12.519905090332031, "global_step": 477566, "epoch": 2842} {"train_loss": -12.38642692565918, "global_step": 477567, "epoch": 2842} {"train_loss": -12.854165077209473, "global_step": 477568, "epoch": 2842} {"train_loss": -12.948344230651855, "global_step": 477569, "epoch": 2842} {"train_loss": -12.627010345458984, "global_step": 477570, "epoch": 2842} {"train_loss": -12.805488586425781, "global_step": 477571, "epoch": 2842} {"train_loss": -12.571821212768555, "global_step": 477572, "epoch": 2842} {"train_loss": -12.31386661529541, "global_step": 477573, "epoch": 2842} {"train_loss": -12.578837394714355, "global_step": 477574, "epoch": 2842} {"train_loss": -12.399988174438477, "global_step": 477575, "epoch": 2842} {"train_loss": -12.269766807556152, "global_step": 477576, "epoch": 2842} {"train_loss": -12.801334381103516, "global_step": 477577, "epoch": 2842} {"train_loss": -12.286120414733887, "global_step": 477578, "epoch": 2842} {"train_loss": -12.01129150390625, "global_step": 477579, "epoch": 2842} {"train_loss": -12.450555801391602, "global_step": 477580, "epoch": 2842} {"train_loss": -12.901352882385254, "global_step": 477581, "epoch": 2842} {"train_loss": -12.45964527130127, "global_step": 477582, "epoch": 2842} {"train_loss": -12.609214782714844, "global_step": 477583, "epoch": 2842} {"train_loss": -12.966894149780273, "global_step": 477584, "epoch": 2842} {"train_loss": -12.80125904083252, "global_step": 477585, "epoch": 2842} {"train_loss": -12.738186836242676, "global_step": 477586, "epoch": 2842} {"train_loss": -12.740765571594238, "global_step": 477587, "epoch": 2842} {"train_loss": -12.161685943603516, "global_step": 477588, "epoch": 2842} {"train_loss": -12.610431671142578, "global_step": 477589, "epoch": 2842} {"train_loss": -12.298856735229492, "global_step": 477590, "epoch": 2842} {"train_loss": -10.560365676879883, "global_step": 477591, "epoch": 2842} {"train_loss": -11.46550178527832, "global_step": 477592, "epoch": 2842} {"train_loss": -12.450352668762207, "global_step": 477593, "epoch": 2842} {"train_loss": -9.828516006469727, "global_step": 477594, "epoch": 2842} {"train_loss": -11.924469947814941, "global_step": 477595, "epoch": 2842} {"train_loss": -11.956212997436523, "global_step": 477596, "epoch": 2842} {"train_loss": -11.12098503112793, "global_step": 477597, "epoch": 2842} {"train_loss": -11.827777862548828, "global_step": 477598, "epoch": 2842} {"train_loss": -10.254486083984375, "global_step": 477599, "epoch": 2842} {"train_loss": -11.861373901367188, "global_step": 477600, "epoch": 2842} {"train_loss": -11.475954055786133, "global_step": 477601, "epoch": 2842} {"train_loss": -10.913111686706543, "global_step": 477602, "epoch": 2842} {"train_loss": -12.341832160949707, "global_step": 477603, "epoch": 2842} {"train_loss": -11.072851181030273, "global_step": 477604, "epoch": 2842} {"train_loss": -12.136245727539062, "global_step": 477605, "epoch": 2842} {"train_loss": -10.995833396911621, "global_step": 477606, "epoch": 2842} {"train_loss": -11.031149864196777, "global_step": 477607, "epoch": 2842} {"train_loss": -11.780887603759766, "global_step": 477608, "epoch": 2842} {"train_loss": -10.472883224487305, "global_step": 477609, "epoch": 2842} {"train_loss": -11.222204208374023, "global_step": 477610, "epoch": 2842} {"train_loss": -10.95465087890625, "global_step": 477611, "epoch": 2842} {"train_loss": -10.477436065673828, "global_step": 477612, "epoch": 2842} {"train_loss": -10.525298118591309, "global_step": 477613, "epoch": 2842} {"train_loss": -10.859831809997559, "global_step": 477614, "epoch": 2842} {"train_loss": -9.862930297851562, "global_step": 477615, "epoch": 2842} {"train_loss": -10.382318496704102, "global_step": 477616, "epoch": 2842} {"train_loss": -9.94480037689209, "global_step": 477617, "epoch": 2842} {"train_loss": -11.105443000793457, "global_step": 477618, "epoch": 2842} {"train_loss": -10.096185684204102, "global_step": 477619, "epoch": 2842} {"train_loss": -10.22704792022705, "global_step": 477620, "epoch": 2842} {"train_loss": -10.804794311523438, "global_step": 477621, "epoch": 2842} {"train_loss": -10.375019073486328, "global_step": 477622, "epoch": 2842} {"train_loss": -12.012262395450048, "global_step": 477623, "epoch": 2842, "val_loss": 313940.09375} {"train_loss": -11.992591857910156, "global_step": 477624, "epoch": 2843} {"train_loss": -10.64610481262207, "global_step": 477625, "epoch": 2843} {"train_loss": -11.327010154724121, "global_step": 477626, "epoch": 2843} {"train_loss": -11.720991134643555, "global_step": 477627, "epoch": 2843} {"train_loss": -11.462608337402344, "global_step": 477628, "epoch": 2843} {"train_loss": -12.021993637084961, "global_step": 477629, "epoch": 2843} {"train_loss": -11.38308334350586, "global_step": 477630, "epoch": 2843} {"train_loss": -11.224207878112793, "global_step": 477631, "epoch": 2843} {"train_loss": -12.333271980285645, "global_step": 477632, "epoch": 2843} {"train_loss": -11.278736114501953, "global_step": 477633, "epoch": 2843} {"train_loss": -12.064149856567383, "global_step": 477634, "epoch": 2843} {"train_loss": -11.606801986694336, "global_step": 477635, "epoch": 2843} {"train_loss": -11.890592575073242, "global_step": 477636, "epoch": 2843} {"train_loss": -12.221939086914062, "global_step": 477637, "epoch": 2843} {"train_loss": -12.135688781738281, "global_step": 477638, "epoch": 2843} {"train_loss": -12.351613998413086, "global_step": 477639, "epoch": 2843} {"train_loss": -12.169563293457031, "global_step": 477640, "epoch": 2843} {"train_loss": -12.303529739379883, "global_step": 477641, "epoch": 2843} {"train_loss": -11.887384414672852, "global_step": 477642, "epoch": 2843} {"train_loss": -12.299515724182129, "global_step": 477643, "epoch": 2843} {"train_loss": -12.138570785522461, "global_step": 477644, "epoch": 2843} {"train_loss": -12.177003860473633, "global_step": 477645, "epoch": 2843} {"train_loss": -11.89356803894043, "global_step": 477646, "epoch": 2843} {"train_loss": -12.288975715637207, "global_step": 477647, "epoch": 2843} {"train_loss": -12.11392593383789, "global_step": 477648, "epoch": 2843} {"train_loss": -12.221431732177734, "global_step": 477649, "epoch": 2843} {"train_loss": -12.359657287597656, "global_step": 477650, "epoch": 2843} {"train_loss": -12.226906776428223, "global_step": 477651, "epoch": 2843} {"train_loss": -12.276238441467285, "global_step": 477652, "epoch": 2843} {"train_loss": -12.46077823638916, "global_step": 477653, "epoch": 2843} {"train_loss": -12.468807220458984, "global_step": 477654, "epoch": 2843} {"train_loss": -12.665921211242676, "global_step": 477655, "epoch": 2843} {"train_loss": -12.565515518188477, "global_step": 477656, "epoch": 2843} {"train_loss": -12.41909408569336, "global_step": 477657, "epoch": 2843} {"train_loss": -12.724536895751953, "global_step": 477658, "epoch": 2843} {"train_loss": -12.379050254821777, "global_step": 477659, "epoch": 2843} {"train_loss": -12.573229789733887, "global_step": 477660, "epoch": 2843} {"train_loss": -12.475320816040039, "global_step": 477661, "epoch": 2843} {"train_loss": -12.669393539428711, "global_step": 477662, "epoch": 2843} {"train_loss": -12.569775581359863, "global_step": 477663, "epoch": 2843} {"train_loss": -12.746822357177734, "global_step": 477664, "epoch": 2843} {"train_loss": -12.675045013427734, "global_step": 477665, "epoch": 2843} {"train_loss": -12.592264175415039, "global_step": 477666, "epoch": 2843} {"train_loss": -12.578154563903809, "global_step": 477667, "epoch": 2843} {"train_loss": -12.83143138885498, "global_step": 477668, "epoch": 2843} {"train_loss": -12.415556907653809, "global_step": 477669, "epoch": 2843} {"train_loss": -12.882643699645996, "global_step": 477670, "epoch": 2843} {"train_loss": -12.817968368530273, "global_step": 477671, "epoch": 2843} {"train_loss": -12.882112503051758, "global_step": 477672, "epoch": 2843} {"train_loss": -12.795312881469727, "global_step": 477673, "epoch": 2843} {"train_loss": -12.723432540893555, "global_step": 477674, "epoch": 2843} {"train_loss": -12.835933685302734, "global_step": 477675, "epoch": 2843} {"train_loss": -12.76852035522461, "global_step": 477676, "epoch": 2843} {"train_loss": -12.738643646240234, "global_step": 477677, "epoch": 2843} {"train_loss": -13.011972427368164, "global_step": 477678, "epoch": 2843} {"train_loss": -12.840690612792969, "global_step": 477679, "epoch": 2843} {"train_loss": -12.926669120788574, "global_step": 477680, "epoch": 2843} {"train_loss": -12.739530563354492, "global_step": 477681, "epoch": 2843} {"train_loss": -12.666060447692871, "global_step": 477682, "epoch": 2843} {"train_loss": -12.890804290771484, "global_step": 477683, "epoch": 2843} {"train_loss": -12.943256378173828, "global_step": 477684, "epoch": 2843} {"train_loss": -12.891766548156738, "global_step": 477685, "epoch": 2843} {"train_loss": -12.492977142333984, "global_step": 477686, "epoch": 2843} {"train_loss": -12.704280853271484, "global_step": 477687, "epoch": 2843} {"train_loss": -13.015181541442871, "global_step": 477688, "epoch": 2843} {"train_loss": -12.627090454101562, "global_step": 477689, "epoch": 2843} {"train_loss": -12.573202133178711, "global_step": 477690, "epoch": 2843} {"train_loss": -12.665698051452637, "global_step": 477691, "epoch": 2843} {"train_loss": -12.412073135375977, "global_step": 477692, "epoch": 2843} {"train_loss": -12.421089172363281, "global_step": 477693, "epoch": 2843} {"train_loss": -12.911541938781738, "global_step": 477694, "epoch": 2843} {"train_loss": -12.385254859924316, "global_step": 477695, "epoch": 2843} {"train_loss": -11.298154830932617, "global_step": 477696, "epoch": 2843} {"train_loss": -12.437299728393555, "global_step": 477697, "epoch": 2843} {"train_loss": -12.690656661987305, "global_step": 477698, "epoch": 2843} {"train_loss": -12.259908676147461, "global_step": 477699, "epoch": 2843} {"train_loss": -12.302111625671387, "global_step": 477700, "epoch": 2843} {"train_loss": -12.545406341552734, "global_step": 477701, "epoch": 2843} {"train_loss": -12.792606353759766, "global_step": 477702, "epoch": 2843} {"train_loss": -12.698774337768555, "global_step": 477703, "epoch": 2843} {"train_loss": -12.751445770263672, "global_step": 477704, "epoch": 2843} {"train_loss": -12.901941299438477, "global_step": 477705, "epoch": 2843} {"train_loss": -12.541727066040039, "global_step": 477706, "epoch": 2843} {"train_loss": -12.131439208984375, "global_step": 477707, "epoch": 2843} {"train_loss": -12.802401542663574, "global_step": 477708, "epoch": 2843} {"train_loss": -12.807535171508789, "global_step": 477709, "epoch": 2843} {"train_loss": -12.541088104248047, "global_step": 477710, "epoch": 2843} {"train_loss": -12.997673034667969, "global_step": 477711, "epoch": 2843} {"train_loss": -12.979133605957031, "global_step": 477712, "epoch": 2843} {"train_loss": -12.717421531677246, "global_step": 477713, "epoch": 2843} {"train_loss": -12.996297836303711, "global_step": 477714, "epoch": 2843} {"train_loss": -12.579992294311523, "global_step": 477715, "epoch": 2843} {"train_loss": -12.886528015136719, "global_step": 477716, "epoch": 2843} {"train_loss": -12.267818450927734, "global_step": 477717, "epoch": 2843} {"train_loss": -12.771486282348633, "global_step": 477718, "epoch": 2843} {"train_loss": -12.78585433959961, "global_step": 477719, "epoch": 2843} {"train_loss": -12.609569549560547, "global_step": 477720, "epoch": 2843} {"train_loss": -12.859888076782227, "global_step": 477721, "epoch": 2843} {"train_loss": -12.751971244812012, "global_step": 477722, "epoch": 2843} {"train_loss": -12.801185607910156, "global_step": 477723, "epoch": 2843} {"train_loss": -12.52033519744873, "global_step": 477724, "epoch": 2843} {"train_loss": -12.474360466003418, "global_step": 477725, "epoch": 2843} {"train_loss": -12.257296562194824, "global_step": 477726, "epoch": 2843} {"train_loss": -12.709237098693848, "global_step": 477727, "epoch": 2843} {"train_loss": -12.148622512817383, "global_step": 477728, "epoch": 2843} {"train_loss": -11.894960403442383, "global_step": 477729, "epoch": 2843} {"train_loss": -12.566999435424805, "global_step": 477730, "epoch": 2843} {"train_loss": -11.708742141723633, "global_step": 477731, "epoch": 2843} {"train_loss": -12.123339653015137, "global_step": 477732, "epoch": 2843} {"train_loss": -12.678081512451172, "global_step": 477733, "epoch": 2843} {"train_loss": -12.219554901123047, "global_step": 477734, "epoch": 2843} {"train_loss": -12.493267059326172, "global_step": 477735, "epoch": 2843} {"train_loss": -12.366908073425293, "global_step": 477736, "epoch": 2843} {"train_loss": -12.689413070678711, "global_step": 477737, "epoch": 2843} {"train_loss": -12.789199829101562, "global_step": 477738, "epoch": 2843} {"train_loss": -12.927498817443848, "global_step": 477739, "epoch": 2843} {"train_loss": -12.711950302124023, "global_step": 477740, "epoch": 2843} {"train_loss": -12.6925048828125, "global_step": 477741, "epoch": 2843} {"train_loss": -12.556276321411133, "global_step": 477742, "epoch": 2843} {"train_loss": -11.914409637451172, "global_step": 477743, "epoch": 2843} {"train_loss": -12.14185905456543, "global_step": 477744, "epoch": 2843} {"train_loss": -10.891311645507812, "global_step": 477745, "epoch": 2843} {"train_loss": -11.689288139343262, "global_step": 477746, "epoch": 2843} {"train_loss": -11.665229797363281, "global_step": 477747, "epoch": 2843} {"train_loss": -10.20744800567627, "global_step": 477748, "epoch": 2843} {"train_loss": -11.88554573059082, "global_step": 477749, "epoch": 2843} {"train_loss": -10.353510856628418, "global_step": 477750, "epoch": 2843} {"train_loss": -11.063226699829102, "global_step": 477751, "epoch": 2843} {"train_loss": -11.535173416137695, "global_step": 477752, "epoch": 2843} {"train_loss": -10.751653671264648, "global_step": 477753, "epoch": 2843} {"train_loss": -11.611827850341797, "global_step": 477754, "epoch": 2843} {"train_loss": -11.294611930847168, "global_step": 477755, "epoch": 2843} {"train_loss": -11.778326034545898, "global_step": 477756, "epoch": 2843} {"train_loss": -12.023344039916992, "global_step": 477757, "epoch": 2843} {"train_loss": -11.839580535888672, "global_step": 477758, "epoch": 2843} {"train_loss": -11.896888732910156, "global_step": 477759, "epoch": 2843} {"train_loss": -12.075307846069336, "global_step": 477760, "epoch": 2843} {"train_loss": -11.492569923400879, "global_step": 477761, "epoch": 2843} {"train_loss": -12.449779510498047, "global_step": 477762, "epoch": 2843} {"train_loss": -11.753324508666992, "global_step": 477763, "epoch": 2843} {"train_loss": -12.662059783935547, "global_step": 477764, "epoch": 2843} {"train_loss": -12.243093490600586, "global_step": 477765, "epoch": 2843} {"train_loss": -12.596168518066406, "global_step": 477766, "epoch": 2843} {"train_loss": -12.038477897644043, "global_step": 477767, "epoch": 2843} {"train_loss": -12.165030479431152, "global_step": 477768, "epoch": 2843} {"train_loss": -12.158169746398926, "global_step": 477769, "epoch": 2843} {"train_loss": -12.452953338623047, "global_step": 477770, "epoch": 2843} {"train_loss": -11.91153621673584, "global_step": 477771, "epoch": 2843} {"train_loss": -12.447826385498047, "global_step": 477772, "epoch": 2843} {"train_loss": -11.955678939819336, "global_step": 477773, "epoch": 2843} {"train_loss": -12.11504077911377, "global_step": 477774, "epoch": 2843} {"train_loss": -12.447052001953125, "global_step": 477775, "epoch": 2843} {"train_loss": -12.305219650268555, "global_step": 477776, "epoch": 2843} {"train_loss": -12.30339241027832, "global_step": 477777, "epoch": 2843} {"train_loss": -12.730636596679688, "global_step": 477778, "epoch": 2843} {"train_loss": -12.217767715454102, "global_step": 477779, "epoch": 2843} {"train_loss": -12.493345260620117, "global_step": 477780, "epoch": 2843} {"train_loss": -12.766114234924316, "global_step": 477781, "epoch": 2843} {"train_loss": -12.444330215454102, "global_step": 477782, "epoch": 2843} {"train_loss": -12.393281936645508, "global_step": 477783, "epoch": 2843} {"train_loss": -12.792081832885742, "global_step": 477784, "epoch": 2843} {"train_loss": -12.055112838745117, "global_step": 477785, "epoch": 2843} {"train_loss": -12.70094108581543, "global_step": 477786, "epoch": 2843} {"train_loss": -11.998798370361328, "global_step": 477787, "epoch": 2843} {"train_loss": -11.454482078552246, "global_step": 477788, "epoch": 2843} {"train_loss": -12.184188842773438, "global_step": 477789, "epoch": 2843} {"train_loss": -11.672384262084961, "global_step": 477790, "epoch": 2843} {"train_loss": -12.299392666135516, "global_step": 477791, "epoch": 2843, "val_loss": 315843.78125} {"train_loss": -11.127080917358398, "global_step": 477792, "epoch": 2844} {"train_loss": -11.082206726074219, "global_step": 477793, "epoch": 2844} {"train_loss": -11.610845565795898, "global_step": 477794, "epoch": 2844} {"train_loss": -10.97906494140625, "global_step": 477795, "epoch": 2844} {"train_loss": -11.621370315551758, "global_step": 477796, "epoch": 2844} {"train_loss": -11.614097595214844, "global_step": 477797, "epoch": 2844} {"train_loss": -12.105100631713867, "global_step": 477798, "epoch": 2844} {"train_loss": -11.900960922241211, "global_step": 477799, "epoch": 2844} {"train_loss": -11.303832054138184, "global_step": 477800, "epoch": 2844} {"train_loss": -12.220174789428711, "global_step": 477801, "epoch": 2844} {"train_loss": -11.333030700683594, "global_step": 477802, "epoch": 2844} {"train_loss": -11.734014511108398, "global_step": 477803, "epoch": 2844} {"train_loss": -11.038697242736816, "global_step": 477804, "epoch": 2844} {"train_loss": -12.257862091064453, "global_step": 477805, "epoch": 2844} {"train_loss": -11.868515014648438, "global_step": 477806, "epoch": 2844} {"train_loss": -12.25006103515625, "global_step": 477807, "epoch": 2844} {"train_loss": -11.776102066040039, "global_step": 477808, "epoch": 2844} {"train_loss": -11.982047080993652, "global_step": 477809, "epoch": 2844} {"train_loss": -12.214481353759766, "global_step": 477810, "epoch": 2844} {"train_loss": -12.01609992980957, "global_step": 477811, "epoch": 2844} {"train_loss": -12.422443389892578, "global_step": 477812, "epoch": 2844} {"train_loss": -12.010369300842285, "global_step": 477813, "epoch": 2844} {"train_loss": -12.246515274047852, "global_step": 477814, "epoch": 2844} {"train_loss": -12.244050979614258, "global_step": 477815, "epoch": 2844} {"train_loss": -12.352328300476074, "global_step": 477816, "epoch": 2844} {"train_loss": -12.037872314453125, "global_step": 477817, "epoch": 2844} {"train_loss": -12.369634628295898, "global_step": 477818, "epoch": 2844} {"train_loss": -12.14661979675293, "global_step": 477819, "epoch": 2844} {"train_loss": -12.242868423461914, "global_step": 477820, "epoch": 2844} {"train_loss": -12.207803726196289, "global_step": 477821, "epoch": 2844} {"train_loss": -12.480104446411133, "global_step": 477822, "epoch": 2844} {"train_loss": -12.140247344970703, "global_step": 477823, "epoch": 2844} {"train_loss": -12.538484573364258, "global_step": 477824, "epoch": 2844} {"train_loss": -12.127228736877441, "global_step": 477825, "epoch": 2844} {"train_loss": -12.008176803588867, "global_step": 477826, "epoch": 2844} {"train_loss": -12.096569061279297, "global_step": 477827, "epoch": 2844} {"train_loss": -11.880937576293945, "global_step": 477828, "epoch": 2844} {"train_loss": -12.239333152770996, "global_step": 477829, "epoch": 2844} {"train_loss": -11.6210355758667, "global_step": 477830, "epoch": 2844} {"train_loss": -12.704756736755371, "global_step": 477831, "epoch": 2844} {"train_loss": -11.618465423583984, "global_step": 477832, "epoch": 2844} {"train_loss": -12.429723739624023, "global_step": 477833, "epoch": 2844} {"train_loss": -11.8994779586792, "global_step": 477834, "epoch": 2844} {"train_loss": -11.798139572143555, "global_step": 477835, "epoch": 2844} {"train_loss": -11.878650665283203, "global_step": 477836, "epoch": 2844} {"train_loss": -12.053741455078125, "global_step": 477837, "epoch": 2844} {"train_loss": -10.432559967041016, "global_step": 477838, "epoch": 2844} {"train_loss": -11.927290916442871, "global_step": 477839, "epoch": 2844} {"train_loss": -11.372281074523926, "global_step": 477840, "epoch": 2844} {"train_loss": -11.619449615478516, "global_step": 477841, "epoch": 2844} {"train_loss": -12.198715209960938, "global_step": 477842, "epoch": 2844} {"train_loss": -11.241612434387207, "global_step": 477843, "epoch": 2844} {"train_loss": -11.949949264526367, "global_step": 477844, "epoch": 2844} {"train_loss": -11.639135360717773, "global_step": 477845, "epoch": 2844} {"train_loss": -11.805414199829102, "global_step": 477846, "epoch": 2844} {"train_loss": -11.970602035522461, "global_step": 477847, "epoch": 2844} {"train_loss": -12.121478080749512, "global_step": 477848, "epoch": 2844} {"train_loss": -11.981548309326172, "global_step": 477849, "epoch": 2844} {"train_loss": -12.490153312683105, "global_step": 477850, "epoch": 2844} {"train_loss": -12.061285018920898, "global_step": 477851, "epoch": 2844} {"train_loss": -12.126802444458008, "global_step": 477852, "epoch": 2844} {"train_loss": -12.37394905090332, "global_step": 477853, "epoch": 2844} {"train_loss": -12.34385871887207, "global_step": 477854, "epoch": 2844} {"train_loss": -12.220450401306152, "global_step": 477855, "epoch": 2844} {"train_loss": -12.225849151611328, "global_step": 477856, "epoch": 2844} {"train_loss": -12.176153182983398, "global_step": 477857, "epoch": 2844} {"train_loss": -12.149564743041992, "global_step": 477858, "epoch": 2844} {"train_loss": -12.316789627075195, "global_step": 477859, "epoch": 2844} {"train_loss": -12.447061538696289, "global_step": 477860, "epoch": 2844} {"train_loss": -12.151692390441895, "global_step": 477861, "epoch": 2844} {"train_loss": -12.430723190307617, "global_step": 477862, "epoch": 2844} {"train_loss": -12.466723442077637, "global_step": 477863, "epoch": 2844} {"train_loss": -12.301918029785156, "global_step": 477864, "epoch": 2844} {"train_loss": -11.878351211547852, "global_step": 477865, "epoch": 2844} {"train_loss": -12.516220092773438, "global_step": 477866, "epoch": 2844} {"train_loss": -12.096872329711914, "global_step": 477867, "epoch": 2844} {"train_loss": -12.430593490600586, "global_step": 477868, "epoch": 2844} {"train_loss": -11.78869342803955, "global_step": 477869, "epoch": 2844} {"train_loss": -12.221410751342773, "global_step": 477870, "epoch": 2844} {"train_loss": -11.833208084106445, "global_step": 477871, "epoch": 2844} {"train_loss": -11.769411087036133, "global_step": 477872, "epoch": 2844} {"train_loss": -11.554032325744629, "global_step": 477873, "epoch": 2844} {"train_loss": -11.459325790405273, "global_step": 477874, "epoch": 2844} {"train_loss": -11.239164352416992, "global_step": 477875, "epoch": 2844} {"train_loss": -10.917896270751953, "global_step": 477876, "epoch": 2844} {"train_loss": -11.826421737670898, "global_step": 477877, "epoch": 2844} {"train_loss": -10.295758247375488, "global_step": 477878, "epoch": 2844} {"train_loss": -12.195688247680664, "global_step": 477879, "epoch": 2844} {"train_loss": -10.540714263916016, "global_step": 477880, "epoch": 2844} {"train_loss": -12.197046279907227, "global_step": 477881, "epoch": 2844} {"train_loss": -10.871356964111328, "global_step": 477882, "epoch": 2844} {"train_loss": -12.256790161132812, "global_step": 477883, "epoch": 2844} {"train_loss": -11.505155563354492, "global_step": 477884, "epoch": 2844} {"train_loss": -12.392868041992188, "global_step": 477885, "epoch": 2844} {"train_loss": -12.112344741821289, "global_step": 477886, "epoch": 2844} {"train_loss": -11.956108093261719, "global_step": 477887, "epoch": 2844} {"train_loss": -11.855956077575684, "global_step": 477888, "epoch": 2844} {"train_loss": -12.32243537902832, "global_step": 477889, "epoch": 2844} {"train_loss": -11.572422981262207, "global_step": 477890, "epoch": 2844} {"train_loss": -12.250812530517578, "global_step": 477891, "epoch": 2844} {"train_loss": -11.934853553771973, "global_step": 477892, "epoch": 2844} {"train_loss": -12.309120178222656, "global_step": 477893, "epoch": 2844} {"train_loss": -12.490933418273926, "global_step": 477894, "epoch": 2844} {"train_loss": -12.511767387390137, "global_step": 477895, "epoch": 2844} {"train_loss": -12.533205032348633, "global_step": 477896, "epoch": 2844} {"train_loss": -12.193192481994629, "global_step": 477897, "epoch": 2844} {"train_loss": -12.613003730773926, "global_step": 477898, "epoch": 2844} {"train_loss": -12.764320373535156, "global_step": 477899, "epoch": 2844} {"train_loss": -12.400941848754883, "global_step": 477900, "epoch": 2844} {"train_loss": -12.48034954071045, "global_step": 477901, "epoch": 2844} {"train_loss": -12.46613883972168, "global_step": 477902, "epoch": 2844} {"train_loss": -12.663796424865723, "global_step": 477903, "epoch": 2844} {"train_loss": -12.259710311889648, "global_step": 477904, "epoch": 2844} {"train_loss": -12.549242973327637, "global_step": 477905, "epoch": 2844} {"train_loss": -12.657703399658203, "global_step": 477906, "epoch": 2844} {"train_loss": -12.563264846801758, "global_step": 477907, "epoch": 2844} {"train_loss": -12.708948135375977, "global_step": 477908, "epoch": 2844} {"train_loss": -12.540117263793945, "global_step": 477909, "epoch": 2844} {"train_loss": -12.557464599609375, "global_step": 477910, "epoch": 2844} {"train_loss": -12.510841369628906, "global_step": 477911, "epoch": 2844} {"train_loss": -12.657176971435547, "global_step": 477912, "epoch": 2844} {"train_loss": -12.50448989868164, "global_step": 477913, "epoch": 2844} {"train_loss": -12.58426284790039, "global_step": 477914, "epoch": 2844} {"train_loss": -12.633590698242188, "global_step": 477915, "epoch": 2844} {"train_loss": -12.622880935668945, "global_step": 477916, "epoch": 2844} {"train_loss": -12.683111190795898, "global_step": 477917, "epoch": 2844} {"train_loss": -12.83588981628418, "global_step": 477918, "epoch": 2844} {"train_loss": -12.835357666015625, "global_step": 477919, "epoch": 2844} {"train_loss": -12.68894100189209, "global_step": 477920, "epoch": 2844} {"train_loss": -12.97551155090332, "global_step": 477921, "epoch": 2844} {"train_loss": -12.602720260620117, "global_step": 477922, "epoch": 2844} {"train_loss": -12.744595527648926, "global_step": 477923, "epoch": 2844} {"train_loss": -12.716448783874512, "global_step": 477924, "epoch": 2844} {"train_loss": -12.863487243652344, "global_step": 477925, "epoch": 2844} {"train_loss": -12.809226989746094, "global_step": 477926, "epoch": 2844} {"train_loss": -12.721065521240234, "global_step": 477927, "epoch": 2844} {"train_loss": -12.650364875793457, "global_step": 477928, "epoch": 2844} {"train_loss": -12.829151153564453, "global_step": 477929, "epoch": 2844} {"train_loss": -12.848834991455078, "global_step": 477930, "epoch": 2844} {"train_loss": -13.107918739318848, "global_step": 477931, "epoch": 2844} {"train_loss": -12.62271499633789, "global_step": 477932, "epoch": 2844} {"train_loss": -12.854061126708984, "global_step": 477933, "epoch": 2844} {"train_loss": -12.88548755645752, "global_step": 477934, "epoch": 2844} {"train_loss": -12.629008293151855, "global_step": 477935, "epoch": 2844} {"train_loss": -12.739730834960938, "global_step": 477936, "epoch": 2844} {"train_loss": -12.601058959960938, "global_step": 477937, "epoch": 2844} {"train_loss": -12.904132843017578, "global_step": 477938, "epoch": 2844} {"train_loss": -12.666041374206543, "global_step": 477939, "epoch": 2844} {"train_loss": -12.849286079406738, "global_step": 477940, "epoch": 2844} {"train_loss": -12.660022735595703, "global_step": 477941, "epoch": 2844} {"train_loss": -12.652871131896973, "global_step": 477942, "epoch": 2844} {"train_loss": -12.742170333862305, "global_step": 477943, "epoch": 2844} {"train_loss": -12.64362907409668, "global_step": 477944, "epoch": 2844} {"train_loss": -12.660394668579102, "global_step": 477945, "epoch": 2844} {"train_loss": -12.373098373413086, "global_step": 477946, "epoch": 2844} {"train_loss": -12.774179458618164, "global_step": 477947, "epoch": 2844} {"train_loss": -12.513829231262207, "global_step": 477948, "epoch": 2844} {"train_loss": -12.774237632751465, "global_step": 477949, "epoch": 2844} {"train_loss": -12.729440689086914, "global_step": 477950, "epoch": 2844} {"train_loss": -12.724264144897461, "global_step": 477951, "epoch": 2844} {"train_loss": -12.822857856750488, "global_step": 477952, "epoch": 2844} {"train_loss": -12.874570846557617, "global_step": 477953, "epoch": 2844} {"train_loss": -12.941352844238281, "global_step": 477954, "epoch": 2844} {"train_loss": -12.65823745727539, "global_step": 477955, "epoch": 2844} {"train_loss": -12.850970268249512, "global_step": 477956, "epoch": 2844} {"train_loss": -12.840855598449707, "global_step": 477957, "epoch": 2844} {"train_loss": -12.85036849975586, "global_step": 477958, "epoch": 2844} {"train_loss": -12.22250671613784, "global_step": 477959, "epoch": 2844, "val_loss": 319111.46875} {"train_loss": -12.253864288330078, "global_step": 477960, "epoch": 2845} {"train_loss": -12.471940040588379, "global_step": 477961, "epoch": 2845} {"train_loss": -12.802370071411133, "global_step": 477962, "epoch": 2845} {"train_loss": -11.74102783203125, "global_step": 477963, "epoch": 2845} {"train_loss": -12.825796127319336, "global_step": 477964, "epoch": 2845} {"train_loss": -12.134923934936523, "global_step": 477965, "epoch": 2845} {"train_loss": -12.46157455444336, "global_step": 477966, "epoch": 2845} {"train_loss": -12.368085861206055, "global_step": 477967, "epoch": 2845} {"train_loss": -12.243437767028809, "global_step": 477968, "epoch": 2845} {"train_loss": -12.505755424499512, "global_step": 477969, "epoch": 2845} {"train_loss": -12.821390151977539, "global_step": 477970, "epoch": 2845} {"train_loss": -12.111087799072266, "global_step": 477971, "epoch": 2845} {"train_loss": -12.424591064453125, "global_step": 477972, "epoch": 2845} {"train_loss": -12.5342378616333, "global_step": 477973, "epoch": 2845} {"train_loss": -11.87299919128418, "global_step": 477974, "epoch": 2845} {"train_loss": -12.398746490478516, "global_step": 477975, "epoch": 2845} {"train_loss": -12.222541809082031, "global_step": 477976, "epoch": 2845} {"train_loss": -11.602153778076172, "global_step": 477977, "epoch": 2845} {"train_loss": -12.602428436279297, "global_step": 477978, "epoch": 2845} {"train_loss": -12.025270462036133, "global_step": 477979, "epoch": 2845} {"train_loss": -12.082511901855469, "global_step": 477980, "epoch": 2845} {"train_loss": -11.933441162109375, "global_step": 477981, "epoch": 2845} {"train_loss": -11.45952320098877, "global_step": 477982, "epoch": 2845} {"train_loss": -12.462285041809082, "global_step": 477983, "epoch": 2845} {"train_loss": -11.39291763305664, "global_step": 477984, "epoch": 2845} {"train_loss": -12.208958625793457, "global_step": 477985, "epoch": 2845} {"train_loss": -11.297544479370117, "global_step": 477986, "epoch": 2845} {"train_loss": -10.394672393798828, "global_step": 477987, "epoch": 2845} {"train_loss": -11.864730834960938, "global_step": 477988, "epoch": 2845} {"train_loss": -10.829765319824219, "global_step": 477989, "epoch": 2845} {"train_loss": -11.580670356750488, "global_step": 477990, "epoch": 2845} {"train_loss": -10.960151672363281, "global_step": 477991, "epoch": 2845} {"train_loss": -11.573343276977539, "global_step": 477992, "epoch": 2845} {"train_loss": -10.65378475189209, "global_step": 477993, "epoch": 2845} {"train_loss": -12.241474151611328, "global_step": 477994, "epoch": 2845} {"train_loss": -11.644062042236328, "global_step": 477995, "epoch": 2845} {"train_loss": -11.664380073547363, "global_step": 477996, "epoch": 2845} {"train_loss": -12.266317367553711, "global_step": 477997, "epoch": 2845} {"train_loss": -11.636802673339844, "global_step": 477998, "epoch": 2845} {"train_loss": -11.819588661193848, "global_step": 477999, "epoch": 2845} {"train_loss": -12.063409805297852, "global_step": 478000, "epoch": 2845} {"train_loss": -12.262956619262695, "global_step": 478001, "epoch": 2845} {"train_loss": -12.11092758178711, "global_step": 478002, "epoch": 2845} {"train_loss": -12.730585098266602, "global_step": 478003, "epoch": 2845} {"train_loss": -12.332252502441406, "global_step": 478004, "epoch": 2845} {"train_loss": -12.521732330322266, "global_step": 478005, "epoch": 2845} {"train_loss": -11.913915634155273, "global_step": 478006, "epoch": 2845} {"train_loss": -12.039491653442383, "global_step": 478007, "epoch": 2845} {"train_loss": -12.213299751281738, "global_step": 478008, "epoch": 2845} {"train_loss": -11.871543884277344, "global_step": 478009, "epoch": 2845} {"train_loss": -12.172595024108887, "global_step": 478010, "epoch": 2845} {"train_loss": -12.033662796020508, "global_step": 478011, "epoch": 2845} {"train_loss": -12.17275619506836, "global_step": 478012, "epoch": 2845} {"train_loss": -11.72150993347168, "global_step": 478013, "epoch": 2845} {"train_loss": -11.94736385345459, "global_step": 478014, "epoch": 2845} {"train_loss": -12.249198913574219, "global_step": 478015, "epoch": 2845} {"train_loss": -11.35201644897461, "global_step": 478016, "epoch": 2845} {"train_loss": -11.583112716674805, "global_step": 478017, "epoch": 2845} {"train_loss": -11.83647346496582, "global_step": 478018, "epoch": 2845} {"train_loss": -11.207756042480469, "global_step": 478019, "epoch": 2845} {"train_loss": -12.501895904541016, "global_step": 478020, "epoch": 2845} {"train_loss": -11.228014945983887, "global_step": 478021, "epoch": 2845} {"train_loss": -11.700416564941406, "global_step": 478022, "epoch": 2845} {"train_loss": -11.31818675994873, "global_step": 478023, "epoch": 2845} {"train_loss": -12.429984092712402, "global_step": 478024, "epoch": 2845} {"train_loss": -11.720562934875488, "global_step": 478025, "epoch": 2845} {"train_loss": -12.524465560913086, "global_step": 478026, "epoch": 2845} {"train_loss": -11.96760368347168, "global_step": 478027, "epoch": 2845} {"train_loss": -12.327692985534668, "global_step": 478028, "epoch": 2845} {"train_loss": -11.964875221252441, "global_step": 478029, "epoch": 2845} {"train_loss": -12.197290420532227, "global_step": 478030, "epoch": 2845} {"train_loss": -12.23587417602539, "global_step": 478031, "epoch": 2845} {"train_loss": -12.03400993347168, "global_step": 478032, "epoch": 2845} {"train_loss": -12.306537628173828, "global_step": 478033, "epoch": 2845} {"train_loss": -11.802179336547852, "global_step": 478034, "epoch": 2845} {"train_loss": -10.35343074798584, "global_step": 478035, "epoch": 2845} {"train_loss": -11.993927001953125, "global_step": 478036, "epoch": 2845} {"train_loss": -11.54986572265625, "global_step": 478037, "epoch": 2845} {"train_loss": -10.912044525146484, "global_step": 478038, "epoch": 2845} {"train_loss": -12.412879943847656, "global_step": 478039, "epoch": 2845} {"train_loss": -10.57892894744873, "global_step": 478040, "epoch": 2845} {"train_loss": -12.261486053466797, "global_step": 478041, "epoch": 2845} {"train_loss": -10.817937850952148, "global_step": 478042, "epoch": 2845} {"train_loss": -11.59898567199707, "global_step": 478043, "epoch": 2845} {"train_loss": -11.972444534301758, "global_step": 478044, "epoch": 2845} {"train_loss": -11.045415878295898, "global_step": 478045, "epoch": 2845} {"train_loss": -12.46003246307373, "global_step": 478046, "epoch": 2845} {"train_loss": -11.425704002380371, "global_step": 478047, "epoch": 2845} {"train_loss": -12.246686935424805, "global_step": 478048, "epoch": 2845} {"train_loss": -11.938897132873535, "global_step": 478049, "epoch": 2845} {"train_loss": -12.033514976501465, "global_step": 478050, "epoch": 2845} {"train_loss": -12.290528297424316, "global_step": 478051, "epoch": 2845} {"train_loss": -12.03378677368164, "global_step": 478052, "epoch": 2845} {"train_loss": -11.853965759277344, "global_step": 478053, "epoch": 2845} {"train_loss": -12.073945999145508, "global_step": 478054, "epoch": 2845} {"train_loss": -12.076742172241211, "global_step": 478055, "epoch": 2845} {"train_loss": -11.93925666809082, "global_step": 478056, "epoch": 2845} {"train_loss": -11.73606014251709, "global_step": 478057, "epoch": 2845} {"train_loss": -12.309049606323242, "global_step": 478058, "epoch": 2845} {"train_loss": -11.574623107910156, "global_step": 478059, "epoch": 2845} {"train_loss": -12.09603500366211, "global_step": 478060, "epoch": 2845} {"train_loss": -12.231232643127441, "global_step": 478061, "epoch": 2845} {"train_loss": -12.263086318969727, "global_step": 478062, "epoch": 2845} {"train_loss": -11.859704971313477, "global_step": 478063, "epoch": 2845} {"train_loss": -12.414556503295898, "global_step": 478064, "epoch": 2845} {"train_loss": -12.421076774597168, "global_step": 478065, "epoch": 2845} {"train_loss": -12.341408729553223, "global_step": 478066, "epoch": 2845} {"train_loss": -12.199054718017578, "global_step": 478067, "epoch": 2845} {"train_loss": -11.862373352050781, "global_step": 478068, "epoch": 2845} {"train_loss": -12.196069717407227, "global_step": 478069, "epoch": 2845} {"train_loss": -12.349556922912598, "global_step": 478070, "epoch": 2845} {"train_loss": -12.120729446411133, "global_step": 478071, "epoch": 2845} {"train_loss": -12.540782928466797, "global_step": 478072, "epoch": 2845} {"train_loss": -12.386116981506348, "global_step": 478073, "epoch": 2845} {"train_loss": -12.421086311340332, "global_step": 478074, "epoch": 2845} {"train_loss": -12.185137748718262, "global_step": 478075, "epoch": 2845} {"train_loss": -12.801528930664062, "global_step": 478076, "epoch": 2845} {"train_loss": -12.569269180297852, "global_step": 478077, "epoch": 2845} {"train_loss": -12.518877029418945, "global_step": 478078, "epoch": 2845} {"train_loss": -12.441032409667969, "global_step": 478079, "epoch": 2845} {"train_loss": -12.659807205200195, "global_step": 478080, "epoch": 2845} {"train_loss": -12.579376220703125, "global_step": 478081, "epoch": 2845} {"train_loss": -12.558761596679688, "global_step": 478082, "epoch": 2845} {"train_loss": -12.877960205078125, "global_step": 478083, "epoch": 2845} {"train_loss": -12.273076057434082, "global_step": 478084, "epoch": 2845} {"train_loss": -12.57208251953125, "global_step": 478085, "epoch": 2845} {"train_loss": -12.629719734191895, "global_step": 478086, "epoch": 2845} {"train_loss": -12.752942085266113, "global_step": 478087, "epoch": 2845} {"train_loss": -12.71306037902832, "global_step": 478088, "epoch": 2845} {"train_loss": -12.83946704864502, "global_step": 478089, "epoch": 2845} {"train_loss": -12.890436172485352, "global_step": 478090, "epoch": 2845} {"train_loss": -12.80381965637207, "global_step": 478091, "epoch": 2845} {"train_loss": -12.965614318847656, "global_step": 478092, "epoch": 2845} {"train_loss": -12.952414512634277, "global_step": 478093, "epoch": 2845} {"train_loss": -12.743558883666992, "global_step": 478094, "epoch": 2845} {"train_loss": -12.897357940673828, "global_step": 478095, "epoch": 2845} {"train_loss": -12.640631675720215, "global_step": 478096, "epoch": 2845} {"train_loss": -12.732364654541016, "global_step": 478097, "epoch": 2845} {"train_loss": -12.827213287353516, "global_step": 478098, "epoch": 2845} {"train_loss": -12.567621231079102, "global_step": 478099, "epoch": 2845} {"train_loss": -12.6388578414917, "global_step": 478100, "epoch": 2845} {"train_loss": -12.899685859680176, "global_step": 478101, "epoch": 2845} {"train_loss": -12.782793045043945, "global_step": 478102, "epoch": 2845} {"train_loss": -12.673532485961914, "global_step": 478103, "epoch": 2845} {"train_loss": -12.745126724243164, "global_step": 478104, "epoch": 2845} {"train_loss": -12.79315185546875, "global_step": 478105, "epoch": 2845} {"train_loss": -13.160921096801758, "global_step": 478106, "epoch": 2845} {"train_loss": -12.846128463745117, "global_step": 478107, "epoch": 2845} {"train_loss": -12.769599914550781, "global_step": 478108, "epoch": 2845} {"train_loss": -12.772344589233398, "global_step": 478109, "epoch": 2845} {"train_loss": -12.572635650634766, "global_step": 478110, "epoch": 2845} {"train_loss": -12.762430191040039, "global_step": 478111, "epoch": 2845} {"train_loss": -12.467796325683594, "global_step": 478112, "epoch": 2845} {"train_loss": -12.938446998596191, "global_step": 478113, "epoch": 2845} {"train_loss": -12.691333770751953, "global_step": 478114, "epoch": 2845} {"train_loss": -12.725327491760254, "global_step": 478115, "epoch": 2845} {"train_loss": -12.719001770019531, "global_step": 478116, "epoch": 2845} {"train_loss": -12.815103530883789, "global_step": 478117, "epoch": 2845} {"train_loss": -13.014188766479492, "global_step": 478118, "epoch": 2845} {"train_loss": -12.709650039672852, "global_step": 478119, "epoch": 2845} {"train_loss": -12.767804145812988, "global_step": 478120, "epoch": 2845} {"train_loss": -12.475690841674805, "global_step": 478121, "epoch": 2845} {"train_loss": -12.175235748291016, "global_step": 478122, "epoch": 2845} {"train_loss": -12.681074142456055, "global_step": 478123, "epoch": 2845} {"train_loss": -12.815817832946777, "global_step": 478124, "epoch": 2845} {"train_loss": -12.176450729370117, "global_step": 478125, "epoch": 2845} {"train_loss": -12.600845336914062, "global_step": 478126, "epoch": 2845} {"train_loss": -12.19700204758417, "global_step": 478127, "epoch": 2845, "val_loss": 316538.125, "train_action_mse_error": 2.8381378650665283} {"train_loss": -12.011188507080078, "global_step": 478128, "epoch": 2846} {"train_loss": -12.625595092773438, "global_step": 478129, "epoch": 2846} {"train_loss": -12.210108757019043, "global_step": 478130, "epoch": 2846} {"train_loss": -11.842771530151367, "global_step": 478131, "epoch": 2846} {"train_loss": -12.729019165039062, "global_step": 478132, "epoch": 2846} {"train_loss": -11.678030014038086, "global_step": 478133, "epoch": 2846} {"train_loss": -12.548727989196777, "global_step": 478134, "epoch": 2846} {"train_loss": -12.724491119384766, "global_step": 478135, "epoch": 2846} {"train_loss": -12.723346710205078, "global_step": 478136, "epoch": 2846} {"train_loss": -12.807784080505371, "global_step": 478137, "epoch": 2846} {"train_loss": -12.75175666809082, "global_step": 478138, "epoch": 2846} {"train_loss": -12.7736177444458, "global_step": 478139, "epoch": 2846} {"train_loss": -12.762748718261719, "global_step": 478140, "epoch": 2846} {"train_loss": -12.608626365661621, "global_step": 478141, "epoch": 2846} {"train_loss": -12.56466007232666, "global_step": 478142, "epoch": 2846} {"train_loss": -12.917020797729492, "global_step": 478143, "epoch": 2846} {"train_loss": -12.665335655212402, "global_step": 478144, "epoch": 2846} {"train_loss": -12.071582794189453, "global_step": 478145, "epoch": 2846} {"train_loss": -12.242391586303711, "global_step": 478146, "epoch": 2846} {"train_loss": -12.557005882263184, "global_step": 478147, "epoch": 2846} {"train_loss": -12.26610279083252, "global_step": 478148, "epoch": 2846} {"train_loss": -12.294504165649414, "global_step": 478149, "epoch": 2846} {"train_loss": -12.838397979736328, "global_step": 478150, "epoch": 2846} {"train_loss": -12.438909530639648, "global_step": 478151, "epoch": 2846} {"train_loss": -12.44068717956543, "global_step": 478152, "epoch": 2846} {"train_loss": -12.495341300964355, "global_step": 478153, "epoch": 2846} {"train_loss": -12.071526527404785, "global_step": 478154, "epoch": 2846} {"train_loss": -12.582340240478516, "global_step": 478155, "epoch": 2846} {"train_loss": -12.72806167602539, "global_step": 478156, "epoch": 2846} {"train_loss": -12.18716049194336, "global_step": 478157, "epoch": 2846} {"train_loss": -12.733390808105469, "global_step": 478158, "epoch": 2846} {"train_loss": -12.39666748046875, "global_step": 478159, "epoch": 2846} {"train_loss": -12.704599380493164, "global_step": 478160, "epoch": 2846} {"train_loss": -12.554825782775879, "global_step": 478161, "epoch": 2846} {"train_loss": -12.209028244018555, "global_step": 478162, "epoch": 2846} {"train_loss": -12.43748664855957, "global_step": 478163, "epoch": 2846} {"train_loss": -12.097734451293945, "global_step": 478164, "epoch": 2846} {"train_loss": -12.54300308227539, "global_step": 478165, "epoch": 2846} {"train_loss": -12.594768524169922, "global_step": 478166, "epoch": 2846} {"train_loss": -12.642130851745605, "global_step": 478167, "epoch": 2846} {"train_loss": -12.876201629638672, "global_step": 478168, "epoch": 2846} {"train_loss": -12.238458633422852, "global_step": 478169, "epoch": 2846} {"train_loss": -12.872751235961914, "global_step": 478170, "epoch": 2846} {"train_loss": -12.551431655883789, "global_step": 478171, "epoch": 2846} {"train_loss": -12.234038352966309, "global_step": 478172, "epoch": 2846} {"train_loss": -12.066502571105957, "global_step": 478173, "epoch": 2846} {"train_loss": -12.985586166381836, "global_step": 478174, "epoch": 2846} {"train_loss": -12.554413795471191, "global_step": 478175, "epoch": 2846} {"train_loss": -12.698509216308594, "global_step": 478176, "epoch": 2846} {"train_loss": -12.080154418945312, "global_step": 478177, "epoch": 2846} {"train_loss": -12.155860900878906, "global_step": 478178, "epoch": 2846} {"train_loss": -11.448322296142578, "global_step": 478179, "epoch": 2846} {"train_loss": -12.569278717041016, "global_step": 478180, "epoch": 2846} {"train_loss": -11.368253707885742, "global_step": 478181, "epoch": 2846} {"train_loss": -11.389063835144043, "global_step": 478182, "epoch": 2846} {"train_loss": -11.988784790039062, "global_step": 478183, "epoch": 2846} {"train_loss": -11.277926445007324, "global_step": 478184, "epoch": 2846} {"train_loss": -11.972705841064453, "global_step": 478185, "epoch": 2846} {"train_loss": -10.19825553894043, "global_step": 478186, "epoch": 2846} {"train_loss": -10.571273803710938, "global_step": 478187, "epoch": 2846} {"train_loss": -12.192426681518555, "global_step": 478188, "epoch": 2846} {"train_loss": -9.726943969726562, "global_step": 478189, "epoch": 2846} {"train_loss": -12.457792282104492, "global_step": 478190, "epoch": 2846} {"train_loss": -11.001396179199219, "global_step": 478191, "epoch": 2846} {"train_loss": -11.178675651550293, "global_step": 478192, "epoch": 2846} {"train_loss": -11.55272388458252, "global_step": 478193, "epoch": 2846} {"train_loss": -10.340810775756836, "global_step": 478194, "epoch": 2846} {"train_loss": -11.188331604003906, "global_step": 478195, "epoch": 2846} {"train_loss": -11.827322959899902, "global_step": 478196, "epoch": 2846} {"train_loss": -11.248516082763672, "global_step": 478197, "epoch": 2846} {"train_loss": -10.418073654174805, "global_step": 478198, "epoch": 2846} {"train_loss": -11.545991897583008, "global_step": 478199, "epoch": 2846} {"train_loss": -10.637411117553711, "global_step": 478200, "epoch": 2846} {"train_loss": -11.535118103027344, "global_step": 478201, "epoch": 2846} {"train_loss": -10.4456205368042, "global_step": 478202, "epoch": 2846} {"train_loss": -11.940903663635254, "global_step": 478203, "epoch": 2846} {"train_loss": -10.018566131591797, "global_step": 478204, "epoch": 2846} {"train_loss": -9.509187698364258, "global_step": 478205, "epoch": 2846} {"train_loss": -12.07136344909668, "global_step": 478206, "epoch": 2846} {"train_loss": -10.526291847229004, "global_step": 478207, "epoch": 2846} {"train_loss": -11.815485000610352, "global_step": 478208, "epoch": 2846} {"train_loss": -11.280462265014648, "global_step": 478209, "epoch": 2846} {"train_loss": -11.381672859191895, "global_step": 478210, "epoch": 2846} {"train_loss": -11.84829330444336, "global_step": 478211, "epoch": 2846} {"train_loss": -11.281961441040039, "global_step": 478212, "epoch": 2846} {"train_loss": -12.215801239013672, "global_step": 478213, "epoch": 2846} {"train_loss": -12.169979095458984, "global_step": 478214, "epoch": 2846} {"train_loss": -11.693705558776855, "global_step": 478215, "epoch": 2846} {"train_loss": -12.35877513885498, "global_step": 478216, "epoch": 2846} {"train_loss": -11.356380462646484, "global_step": 478217, "epoch": 2846} {"train_loss": -12.403234481811523, "global_step": 478218, "epoch": 2846} {"train_loss": -11.898305892944336, "global_step": 478219, "epoch": 2846} {"train_loss": -11.749849319458008, "global_step": 478220, "epoch": 2846} {"train_loss": -12.13592529296875, "global_step": 478221, "epoch": 2846} {"train_loss": -11.867095947265625, "global_step": 478222, "epoch": 2846} {"train_loss": -12.528242111206055, "global_step": 478223, "epoch": 2846} {"train_loss": -12.092220306396484, "global_step": 478224, "epoch": 2846} {"train_loss": -12.342981338500977, "global_step": 478225, "epoch": 2846} {"train_loss": -12.386371612548828, "global_step": 478226, "epoch": 2846} {"train_loss": -12.09605884552002, "global_step": 478227, "epoch": 2846} {"train_loss": -12.416179656982422, "global_step": 478228, "epoch": 2846} {"train_loss": -11.962797164916992, "global_step": 478229, "epoch": 2846} {"train_loss": -11.931964874267578, "global_step": 478230, "epoch": 2846} {"train_loss": -12.052488327026367, "global_step": 478231, "epoch": 2846} {"train_loss": -12.128507614135742, "global_step": 478232, "epoch": 2846} {"train_loss": -12.38309097290039, "global_step": 478233, "epoch": 2846} {"train_loss": -12.038284301757812, "global_step": 478234, "epoch": 2846} {"train_loss": -12.502252578735352, "global_step": 478235, "epoch": 2846} {"train_loss": -12.56998062133789, "global_step": 478236, "epoch": 2846} {"train_loss": -12.442882537841797, "global_step": 478237, "epoch": 2846} {"train_loss": -12.3112154006958, "global_step": 478238, "epoch": 2846} {"train_loss": -12.51446533203125, "global_step": 478239, "epoch": 2846} {"train_loss": -12.642539978027344, "global_step": 478240, "epoch": 2846} {"train_loss": -12.47900390625, "global_step": 478241, "epoch": 2846} {"train_loss": -12.696839332580566, "global_step": 478242, "epoch": 2846} {"train_loss": -12.657894134521484, "global_step": 478243, "epoch": 2846} {"train_loss": -12.582301139831543, "global_step": 478244, "epoch": 2846} {"train_loss": -12.559287071228027, "global_step": 478245, "epoch": 2846} {"train_loss": -12.768259048461914, "global_step": 478246, "epoch": 2846} {"train_loss": -12.670759201049805, "global_step": 478247, "epoch": 2846} {"train_loss": -12.603960037231445, "global_step": 478248, "epoch": 2846} {"train_loss": -12.528305053710938, "global_step": 478249, "epoch": 2846} {"train_loss": -12.762365341186523, "global_step": 478250, "epoch": 2846} {"train_loss": -12.68852424621582, "global_step": 478251, "epoch": 2846} {"train_loss": -12.612165451049805, "global_step": 478252, "epoch": 2846} {"train_loss": -12.791990280151367, "global_step": 478253, "epoch": 2846} {"train_loss": -12.82673454284668, "global_step": 478254, "epoch": 2846} {"train_loss": -12.990144729614258, "global_step": 478255, "epoch": 2846} {"train_loss": -12.794962882995605, "global_step": 478256, "epoch": 2846} {"train_loss": -12.688678741455078, "global_step": 478257, "epoch": 2846} {"train_loss": -12.98854923248291, "global_step": 478258, "epoch": 2846} {"train_loss": -13.087449073791504, "global_step": 478259, "epoch": 2846} {"train_loss": -12.782584190368652, "global_step": 478260, "epoch": 2846} {"train_loss": -12.8569974899292, "global_step": 478261, "epoch": 2846} {"train_loss": -12.855621337890625, "global_step": 478262, "epoch": 2846} {"train_loss": -12.627664566040039, "global_step": 478263, "epoch": 2846} {"train_loss": -13.093305587768555, "global_step": 478264, "epoch": 2846} {"train_loss": -12.65986442565918, "global_step": 478265, "epoch": 2846} {"train_loss": -12.721020698547363, "global_step": 478266, "epoch": 2846} {"train_loss": -12.696925163269043, "global_step": 478267, "epoch": 2846} {"train_loss": -12.588020324707031, "global_step": 478268, "epoch": 2846} {"train_loss": -12.521536827087402, "global_step": 478269, "epoch": 2846} {"train_loss": -13.027681350708008, "global_step": 478270, "epoch": 2846} {"train_loss": -12.483627319335938, "global_step": 478271, "epoch": 2846} {"train_loss": -12.813493728637695, "global_step": 478272, "epoch": 2846} {"train_loss": -12.717466354370117, "global_step": 478273, "epoch": 2846} {"train_loss": -12.842538833618164, "global_step": 478274, "epoch": 2846} {"train_loss": -12.685342788696289, "global_step": 478275, "epoch": 2846} {"train_loss": -12.606734275817871, "global_step": 478276, "epoch": 2846} {"train_loss": -12.58498764038086, "global_step": 478277, "epoch": 2846} {"train_loss": -12.95988941192627, "global_step": 478278, "epoch": 2846} {"train_loss": -12.75898551940918, "global_step": 478279, "epoch": 2846} {"train_loss": -13.115440368652344, "global_step": 478280, "epoch": 2846} {"train_loss": -12.716264724731445, "global_step": 478281, "epoch": 2846} {"train_loss": -12.707509994506836, "global_step": 478282, "epoch": 2846} {"train_loss": -12.739445686340332, "global_step": 478283, "epoch": 2846} {"train_loss": -12.767936706542969, "global_step": 478284, "epoch": 2846} {"train_loss": -12.32451057434082, "global_step": 478285, "epoch": 2846} {"train_loss": -12.674477577209473, "global_step": 478286, "epoch": 2846} {"train_loss": -12.974272727966309, "global_step": 478287, "epoch": 2846} {"train_loss": -13.038576126098633, "global_step": 478288, "epoch": 2846} {"train_loss": -12.801572799682617, "global_step": 478289, "epoch": 2846} {"train_loss": -12.837080001831055, "global_step": 478290, "epoch": 2846} {"train_loss": -12.903305053710938, "global_step": 478291, "epoch": 2846} {"train_loss": -12.688232421875, "global_step": 478292, "epoch": 2846} {"train_loss": -12.455533027648926, "global_step": 478293, "epoch": 2846} {"train_loss": -12.81299114227295, "global_step": 478294, "epoch": 2846} {"train_loss": -12.259298710595994, "global_step": 478295, "epoch": 2846, "val_loss": 314189.21875} {"train_loss": -12.246817588806152, "global_step": 478296, "epoch": 2847} {"train_loss": -12.358137130737305, "global_step": 478297, "epoch": 2847} {"train_loss": -12.643829345703125, "global_step": 478298, "epoch": 2847} {"train_loss": -12.142112731933594, "global_step": 478299, "epoch": 2847} {"train_loss": -12.120668411254883, "global_step": 478300, "epoch": 2847} {"train_loss": -12.049398422241211, "global_step": 478301, "epoch": 2847} {"train_loss": -12.983476638793945, "global_step": 478302, "epoch": 2847} {"train_loss": -12.432796478271484, "global_step": 478303, "epoch": 2847} {"train_loss": -12.665910720825195, "global_step": 478304, "epoch": 2847} {"train_loss": -12.296249389648438, "global_step": 478305, "epoch": 2847} {"train_loss": -12.304409980773926, "global_step": 478306, "epoch": 2847} {"train_loss": -12.082473754882812, "global_step": 478307, "epoch": 2847} {"train_loss": -12.703519821166992, "global_step": 478308, "epoch": 2847} {"train_loss": -12.351497650146484, "global_step": 478309, "epoch": 2847} {"train_loss": -12.234491348266602, "global_step": 478310, "epoch": 2847} {"train_loss": -11.975973129272461, "global_step": 478311, "epoch": 2847} {"train_loss": -12.12949275970459, "global_step": 478312, "epoch": 2847} {"train_loss": -10.79519271850586, "global_step": 478313, "epoch": 2847} {"train_loss": -11.292556762695312, "global_step": 478314, "epoch": 2847} {"train_loss": -11.045656204223633, "global_step": 478315, "epoch": 2847} {"train_loss": -12.29831314086914, "global_step": 478316, "epoch": 2847} {"train_loss": -10.624829292297363, "global_step": 478317, "epoch": 2847} {"train_loss": -12.133018493652344, "global_step": 478318, "epoch": 2847} {"train_loss": -11.561175346374512, "global_step": 478319, "epoch": 2847} {"train_loss": -10.206124305725098, "global_step": 478320, "epoch": 2847} {"train_loss": -11.923480987548828, "global_step": 478321, "epoch": 2847} {"train_loss": -10.121658325195312, "global_step": 478322, "epoch": 2847} {"train_loss": -9.07392692565918, "global_step": 478323, "epoch": 2847} {"train_loss": -11.858329772949219, "global_step": 478324, "epoch": 2847} {"train_loss": -9.287832260131836, "global_step": 478325, "epoch": 2847} {"train_loss": -10.76839828491211, "global_step": 478326, "epoch": 2847} {"train_loss": -10.527962684631348, "global_step": 478327, "epoch": 2847} {"train_loss": -9.981466293334961, "global_step": 478328, "epoch": 2847} {"train_loss": -10.962696075439453, "global_step": 478329, "epoch": 2847} {"train_loss": -11.048282623291016, "global_step": 478330, "epoch": 2847} {"train_loss": -10.443405151367188, "global_step": 478331, "epoch": 2847} {"train_loss": -11.027515411376953, "global_step": 478332, "epoch": 2847} {"train_loss": -10.547744750976562, "global_step": 478333, "epoch": 2847} {"train_loss": -9.503595352172852, "global_step": 478334, "epoch": 2847} {"train_loss": -10.195358276367188, "global_step": 478335, "epoch": 2847} {"train_loss": -9.328479766845703, "global_step": 478336, "epoch": 2847} {"train_loss": -9.995901107788086, "global_step": 478337, "epoch": 2847} {"train_loss": -10.745438575744629, "global_step": 478338, "epoch": 2847} {"train_loss": -10.362985610961914, "global_step": 478339, "epoch": 2847} {"train_loss": -10.906652450561523, "global_step": 478340, "epoch": 2847} {"train_loss": -10.058807373046875, "global_step": 478341, "epoch": 2847} {"train_loss": -11.409592628479004, "global_step": 478342, "epoch": 2847} {"train_loss": -11.127195358276367, "global_step": 478343, "epoch": 2847} {"train_loss": -10.815884590148926, "global_step": 478344, "epoch": 2847} {"train_loss": -11.924064636230469, "global_step": 478345, "epoch": 2847} {"train_loss": -11.474715232849121, "global_step": 478346, "epoch": 2847} {"train_loss": -11.25729751586914, "global_step": 478347, "epoch": 2847} {"train_loss": -11.055471420288086, "global_step": 478348, "epoch": 2847} {"train_loss": -11.670072555541992, "global_step": 478349, "epoch": 2847} {"train_loss": -11.629728317260742, "global_step": 478350, "epoch": 2847} {"train_loss": -11.604056358337402, "global_step": 478351, "epoch": 2847} {"train_loss": -11.731903076171875, "global_step": 478352, "epoch": 2847} {"train_loss": -11.297237396240234, "global_step": 478353, "epoch": 2847} {"train_loss": -11.791213989257812, "global_step": 478354, "epoch": 2847} {"train_loss": -11.670403480529785, "global_step": 478355, "epoch": 2847} {"train_loss": -11.662723541259766, "global_step": 478356, "epoch": 2847} {"train_loss": -11.851278305053711, "global_step": 478357, "epoch": 2847} {"train_loss": -11.444621086120605, "global_step": 478358, "epoch": 2847} {"train_loss": -11.949907302856445, "global_step": 478359, "epoch": 2847} {"train_loss": -11.879427909851074, "global_step": 478360, "epoch": 2847} {"train_loss": -11.915176391601562, "global_step": 478361, "epoch": 2847} {"train_loss": -11.734889030456543, "global_step": 478362, "epoch": 2847} {"train_loss": -11.994123458862305, "global_step": 478363, "epoch": 2847} {"train_loss": -11.966026306152344, "global_step": 478364, "epoch": 2847} {"train_loss": -12.230978965759277, "global_step": 478365, "epoch": 2847} {"train_loss": -12.028694152832031, "global_step": 478366, "epoch": 2847} {"train_loss": -12.180033683776855, "global_step": 478367, "epoch": 2847} {"train_loss": -12.089447021484375, "global_step": 478368, "epoch": 2847} {"train_loss": -12.257966995239258, "global_step": 478369, "epoch": 2847} {"train_loss": -12.430413246154785, "global_step": 478370, "epoch": 2847} {"train_loss": -12.457298278808594, "global_step": 478371, "epoch": 2847} {"train_loss": -12.246254920959473, "global_step": 478372, "epoch": 2847} {"train_loss": -12.351017951965332, "global_step": 478373, "epoch": 2847} {"train_loss": -12.48187255859375, "global_step": 478374, "epoch": 2847} {"train_loss": -12.62691879272461, "global_step": 478375, "epoch": 2847} {"train_loss": -12.450523376464844, "global_step": 478376, "epoch": 2847} {"train_loss": -12.41292953491211, "global_step": 478377, "epoch": 2847} {"train_loss": -12.749643325805664, "global_step": 478378, "epoch": 2847} {"train_loss": -12.371360778808594, "global_step": 478379, "epoch": 2847} {"train_loss": -12.53645133972168, "global_step": 478380, "epoch": 2847} {"train_loss": -12.528112411499023, "global_step": 478381, "epoch": 2847} {"train_loss": -12.342784881591797, "global_step": 478382, "epoch": 2847} {"train_loss": -12.405330657958984, "global_step": 478383, "epoch": 2847} {"train_loss": -12.601343154907227, "global_step": 478384, "epoch": 2847} {"train_loss": -12.34598159790039, "global_step": 478385, "epoch": 2847} {"train_loss": -12.493474960327148, "global_step": 478386, "epoch": 2847} {"train_loss": -12.321989059448242, "global_step": 478387, "epoch": 2847} {"train_loss": -12.690155029296875, "global_step": 478388, "epoch": 2847} {"train_loss": -12.26688289642334, "global_step": 478389, "epoch": 2847} {"train_loss": -12.689691543579102, "global_step": 478390, "epoch": 2847} {"train_loss": -12.379796028137207, "global_step": 478391, "epoch": 2847} {"train_loss": -12.832216262817383, "global_step": 478392, "epoch": 2847} {"train_loss": -12.528022766113281, "global_step": 478393, "epoch": 2847} {"train_loss": -12.621017456054688, "global_step": 478394, "epoch": 2847} {"train_loss": -12.512197494506836, "global_step": 478395, "epoch": 2847} {"train_loss": -12.692920684814453, "global_step": 478396, "epoch": 2847} {"train_loss": -12.832547187805176, "global_step": 478397, "epoch": 2847} {"train_loss": -12.56338119506836, "global_step": 478398, "epoch": 2847} {"train_loss": -12.724635124206543, "global_step": 478399, "epoch": 2847} {"train_loss": -12.745767593383789, "global_step": 478400, "epoch": 2847} {"train_loss": -12.704726219177246, "global_step": 478401, "epoch": 2847} {"train_loss": -12.821311950683594, "global_step": 478402, "epoch": 2847} {"train_loss": -12.771187782287598, "global_step": 478403, "epoch": 2847} {"train_loss": -12.735791206359863, "global_step": 478404, "epoch": 2847} {"train_loss": -12.833097457885742, "global_step": 478405, "epoch": 2847} {"train_loss": -12.755630493164062, "global_step": 478406, "epoch": 2847} {"train_loss": -12.885600090026855, "global_step": 478407, "epoch": 2847} {"train_loss": -12.55888557434082, "global_step": 478408, "epoch": 2847} {"train_loss": -12.900525093078613, "global_step": 478409, "epoch": 2847} {"train_loss": -12.59984016418457, "global_step": 478410, "epoch": 2847} {"train_loss": -12.524274826049805, "global_step": 478411, "epoch": 2847} {"train_loss": -12.873289108276367, "global_step": 478412, "epoch": 2847} {"train_loss": -12.849814414978027, "global_step": 478413, "epoch": 2847} {"train_loss": -12.909650802612305, "global_step": 478414, "epoch": 2847} {"train_loss": -12.895156860351562, "global_step": 478415, "epoch": 2847} {"train_loss": -12.918907165527344, "global_step": 478416, "epoch": 2847} {"train_loss": -12.932246208190918, "global_step": 478417, "epoch": 2847} {"train_loss": -13.164942741394043, "global_step": 478418, "epoch": 2847} {"train_loss": -12.79013442993164, "global_step": 478419, "epoch": 2847} {"train_loss": -12.960477828979492, "global_step": 478420, "epoch": 2847} {"train_loss": -12.875619888305664, "global_step": 478421, "epoch": 2847} {"train_loss": -12.839019775390625, "global_step": 478422, "epoch": 2847} {"train_loss": -12.905206680297852, "global_step": 478423, "epoch": 2847} {"train_loss": -13.03902816772461, "global_step": 478424, "epoch": 2847} {"train_loss": -12.742925643920898, "global_step": 478425, "epoch": 2847} {"train_loss": -12.966071128845215, "global_step": 478426, "epoch": 2847} {"train_loss": -12.980376243591309, "global_step": 478427, "epoch": 2847} {"train_loss": -12.788627624511719, "global_step": 478428, "epoch": 2847} {"train_loss": -12.950831413269043, "global_step": 478429, "epoch": 2847} {"train_loss": -12.956418991088867, "global_step": 478430, "epoch": 2847} {"train_loss": -13.045989990234375, "global_step": 478431, "epoch": 2847} {"train_loss": -12.979255676269531, "global_step": 478432, "epoch": 2847} {"train_loss": -12.966814041137695, "global_step": 478433, "epoch": 2847} {"train_loss": -13.04768180847168, "global_step": 478434, "epoch": 2847} {"train_loss": -12.8079252243042, "global_step": 478435, "epoch": 2847} {"train_loss": -12.986298561096191, "global_step": 478436, "epoch": 2847} {"train_loss": -12.995454788208008, "global_step": 478437, "epoch": 2847} {"train_loss": -12.797215461730957, "global_step": 478438, "epoch": 2847} {"train_loss": -12.96592903137207, "global_step": 478439, "epoch": 2847} {"train_loss": -13.070074081420898, "global_step": 478440, "epoch": 2847} {"train_loss": -12.903501510620117, "global_step": 478441, "epoch": 2847} {"train_loss": -12.956037521362305, "global_step": 478442, "epoch": 2847} {"train_loss": -13.073392868041992, "global_step": 478443, "epoch": 2847} {"train_loss": -12.933612823486328, "global_step": 478444, "epoch": 2847} {"train_loss": -12.943140983581543, "global_step": 478445, "epoch": 2847} {"train_loss": -13.001728057861328, "global_step": 478446, "epoch": 2847} {"train_loss": -12.750338554382324, "global_step": 478447, "epoch": 2847} {"train_loss": -12.834486961364746, "global_step": 478448, "epoch": 2847} {"train_loss": -12.812309265136719, "global_step": 478449, "epoch": 2847} {"train_loss": -12.461748123168945, "global_step": 478450, "epoch": 2847} {"train_loss": -12.552753448486328, "global_step": 478451, "epoch": 2847} {"train_loss": -12.940628051757812, "global_step": 478452, "epoch": 2847} {"train_loss": -12.78564167022705, "global_step": 478453, "epoch": 2847} {"train_loss": -13.012703895568848, "global_step": 478454, "epoch": 2847} {"train_loss": -12.714174270629883, "global_step": 478455, "epoch": 2847} {"train_loss": -13.10153865814209, "global_step": 478456, "epoch": 2847} {"train_loss": -13.032966613769531, "global_step": 478457, "epoch": 2847} {"train_loss": -12.74125862121582, "global_step": 478458, "epoch": 2847} {"train_loss": -12.787786483764648, "global_step": 478459, "epoch": 2847} {"train_loss": -12.811742782592773, "global_step": 478460, "epoch": 2847} {"train_loss": -13.03126335144043, "global_step": 478461, "epoch": 2847} {"train_loss": -12.982004165649414, "global_step": 478462, "epoch": 2847} {"train_loss": -12.17454821722848, "global_step": 478463, "epoch": 2847, "val_loss": 315403.84375} {"train_loss": -12.488542556762695, "global_step": 478464, "epoch": 2848} {"train_loss": -12.750633239746094, "global_step": 478465, "epoch": 2848} {"train_loss": -12.70179557800293, "global_step": 478466, "epoch": 2848} {"train_loss": -11.779987335205078, "global_step": 478467, "epoch": 2848} {"train_loss": -12.000064849853516, "global_step": 478468, "epoch": 2848} {"train_loss": -12.495857238769531, "global_step": 478469, "epoch": 2848} {"train_loss": -12.547658920288086, "global_step": 478470, "epoch": 2848} {"train_loss": -12.32070541381836, "global_step": 478471, "epoch": 2848} {"train_loss": -12.479743003845215, "global_step": 478472, "epoch": 2848} {"train_loss": -12.398811340332031, "global_step": 478473, "epoch": 2848} {"train_loss": -12.284425735473633, "global_step": 478474, "epoch": 2848} {"train_loss": -12.007802963256836, "global_step": 478475, "epoch": 2848} {"train_loss": -12.337575912475586, "global_step": 478476, "epoch": 2848} {"train_loss": -12.732398986816406, "global_step": 478477, "epoch": 2848} {"train_loss": -12.098867416381836, "global_step": 478478, "epoch": 2848} {"train_loss": -12.27383804321289, "global_step": 478479, "epoch": 2848} {"train_loss": -11.879152297973633, "global_step": 478480, "epoch": 2848} {"train_loss": -11.962242126464844, "global_step": 478481, "epoch": 2848} {"train_loss": -11.877555847167969, "global_step": 478482, "epoch": 2848} {"train_loss": -9.946845054626465, "global_step": 478483, "epoch": 2848} {"train_loss": -12.477898597717285, "global_step": 478484, "epoch": 2848} {"train_loss": -10.276762962341309, "global_step": 478485, "epoch": 2848} {"train_loss": -9.014907836914062, "global_step": 478486, "epoch": 2848} {"train_loss": -12.168925285339355, "global_step": 478487, "epoch": 2848} {"train_loss": -8.361743927001953, "global_step": 478488, "epoch": 2848} {"train_loss": -10.899553298950195, "global_step": 478489, "epoch": 2848} {"train_loss": -10.118102073669434, "global_step": 478490, "epoch": 2848} {"train_loss": -10.130914688110352, "global_step": 478491, "epoch": 2848} {"train_loss": -9.417753219604492, "global_step": 478492, "epoch": 2848} {"train_loss": -8.939884185791016, "global_step": 478493, "epoch": 2848} {"train_loss": -10.253357887268066, "global_step": 478494, "epoch": 2848} {"train_loss": -8.769250869750977, "global_step": 478495, "epoch": 2848} {"train_loss": -9.882471084594727, "global_step": 478496, "epoch": 2848} {"train_loss": -8.800220489501953, "global_step": 478497, "epoch": 2848} {"train_loss": -10.468351364135742, "global_step": 478498, "epoch": 2848} {"train_loss": -10.464509010314941, "global_step": 478499, "epoch": 2848} {"train_loss": -11.990314483642578, "global_step": 478500, "epoch": 2848} {"train_loss": -10.137031555175781, "global_step": 478501, "epoch": 2848} {"train_loss": -10.950706481933594, "global_step": 478502, "epoch": 2848} {"train_loss": -11.423528671264648, "global_step": 478503, "epoch": 2848} {"train_loss": -10.886625289916992, "global_step": 478504, "epoch": 2848} {"train_loss": -11.812606811523438, "global_step": 478505, "epoch": 2848} {"train_loss": -11.14088249206543, "global_step": 478506, "epoch": 2848} {"train_loss": -12.149656295776367, "global_step": 478507, "epoch": 2848} {"train_loss": -11.495476722717285, "global_step": 478508, "epoch": 2848} {"train_loss": -11.987494468688965, "global_step": 478509, "epoch": 2848} {"train_loss": -12.165670394897461, "global_step": 478510, "epoch": 2848} {"train_loss": -11.690349578857422, "global_step": 478511, "epoch": 2848} {"train_loss": -12.110713958740234, "global_step": 478512, "epoch": 2848} {"train_loss": -12.229692459106445, "global_step": 478513, "epoch": 2848} {"train_loss": -12.121221542358398, "global_step": 478514, "epoch": 2848} {"train_loss": -12.053020477294922, "global_step": 478515, "epoch": 2848} {"train_loss": -12.061408996582031, "global_step": 478516, "epoch": 2848} {"train_loss": -12.481306076049805, "global_step": 478517, "epoch": 2848} {"train_loss": -11.920880317687988, "global_step": 478518, "epoch": 2848} {"train_loss": -12.017073631286621, "global_step": 478519, "epoch": 2848} {"train_loss": -11.934422492980957, "global_step": 478520, "epoch": 2848} {"train_loss": -12.444543838500977, "global_step": 478521, "epoch": 2848} {"train_loss": -12.51126480102539, "global_step": 478522, "epoch": 2848} {"train_loss": -12.216392517089844, "global_step": 478523, "epoch": 2848} {"train_loss": -12.216056823730469, "global_step": 478524, "epoch": 2848} {"train_loss": -12.382657051086426, "global_step": 478525, "epoch": 2848} {"train_loss": -12.523824691772461, "global_step": 478526, "epoch": 2848} {"train_loss": -12.372163772583008, "global_step": 478527, "epoch": 2848} {"train_loss": -12.191019058227539, "global_step": 478528, "epoch": 2848} {"train_loss": -12.41696548461914, "global_step": 478529, "epoch": 2848} {"train_loss": -12.35600471496582, "global_step": 478530, "epoch": 2848} {"train_loss": -12.762914657592773, "global_step": 478531, "epoch": 2848} {"train_loss": -12.150221824645996, "global_step": 478532, "epoch": 2848} {"train_loss": -12.41622543334961, "global_step": 478533, "epoch": 2848} {"train_loss": -12.447982788085938, "global_step": 478534, "epoch": 2848} {"train_loss": -12.56245231628418, "global_step": 478535, "epoch": 2848} {"train_loss": -12.538434982299805, "global_step": 478536, "epoch": 2848} {"train_loss": -12.661507606506348, "global_step": 478537, "epoch": 2848} {"train_loss": -12.663520812988281, "global_step": 478538, "epoch": 2848} {"train_loss": -12.804971694946289, "global_step": 478539, "epoch": 2848} {"train_loss": -12.594464302062988, "global_step": 478540, "epoch": 2848} {"train_loss": -12.566091537475586, "global_step": 478541, "epoch": 2848} {"train_loss": -12.46377944946289, "global_step": 478542, "epoch": 2848} {"train_loss": -12.508277893066406, "global_step": 478543, "epoch": 2848} {"train_loss": -12.56247329711914, "global_step": 478544, "epoch": 2848} {"train_loss": -12.448529243469238, "global_step": 478545, "epoch": 2848} {"train_loss": -12.559139251708984, "global_step": 478546, "epoch": 2848} {"train_loss": -12.554361343383789, "global_step": 478547, "epoch": 2848} {"train_loss": -12.575603485107422, "global_step": 478548, "epoch": 2848} {"train_loss": -12.420799255371094, "global_step": 478549, "epoch": 2848} {"train_loss": -12.660455703735352, "global_step": 478550, "epoch": 2848} {"train_loss": -12.132932662963867, "global_step": 478551, "epoch": 2848} {"train_loss": -12.664651870727539, "global_step": 478552, "epoch": 2848} {"train_loss": -12.585474014282227, "global_step": 478553, "epoch": 2848} {"train_loss": -12.582481384277344, "global_step": 478554, "epoch": 2848} {"train_loss": -12.510210037231445, "global_step": 478555, "epoch": 2848} {"train_loss": -12.71058464050293, "global_step": 478556, "epoch": 2848} {"train_loss": -12.713371276855469, "global_step": 478557, "epoch": 2848} {"train_loss": -12.663960456848145, "global_step": 478558, "epoch": 2848} {"train_loss": -12.91925048828125, "global_step": 478559, "epoch": 2848} {"train_loss": -12.716531753540039, "global_step": 478560, "epoch": 2848} {"train_loss": -12.901165008544922, "global_step": 478561, "epoch": 2848} {"train_loss": -12.602476119995117, "global_step": 478562, "epoch": 2848} {"train_loss": -12.550065040588379, "global_step": 478563, "epoch": 2848} {"train_loss": -12.744377136230469, "global_step": 478564, "epoch": 2848} {"train_loss": -12.303837776184082, "global_step": 478565, "epoch": 2848} {"train_loss": -12.726638793945312, "global_step": 478566, "epoch": 2848} {"train_loss": -12.149264335632324, "global_step": 478567, "epoch": 2848} {"train_loss": -12.658963203430176, "global_step": 478568, "epoch": 2848} {"train_loss": -12.306901931762695, "global_step": 478569, "epoch": 2848} {"train_loss": -12.127007484436035, "global_step": 478570, "epoch": 2848} {"train_loss": -11.147773742675781, "global_step": 478571, "epoch": 2848} {"train_loss": -12.490397453308105, "global_step": 478572, "epoch": 2848} {"train_loss": -11.46146011352539, "global_step": 478573, "epoch": 2848} {"train_loss": -10.557186126708984, "global_step": 478574, "epoch": 2848} {"train_loss": -11.177793502807617, "global_step": 478575, "epoch": 2848} {"train_loss": -11.692838668823242, "global_step": 478576, "epoch": 2848} {"train_loss": -10.477777481079102, "global_step": 478577, "epoch": 2848} {"train_loss": -12.404763221740723, "global_step": 478578, "epoch": 2848} {"train_loss": -11.355239868164062, "global_step": 478579, "epoch": 2848} {"train_loss": -11.484482765197754, "global_step": 478580, "epoch": 2848} {"train_loss": -12.631752967834473, "global_step": 478581, "epoch": 2848} {"train_loss": -11.166646957397461, "global_step": 478582, "epoch": 2848} {"train_loss": -12.282852172851562, "global_step": 478583, "epoch": 2848} {"train_loss": -12.162569999694824, "global_step": 478584, "epoch": 2848} {"train_loss": -11.8403902053833, "global_step": 478585, "epoch": 2848} {"train_loss": -12.363119125366211, "global_step": 478586, "epoch": 2848} {"train_loss": -11.955413818359375, "global_step": 478587, "epoch": 2848} {"train_loss": -12.500513076782227, "global_step": 478588, "epoch": 2848} {"train_loss": -12.246119499206543, "global_step": 478589, "epoch": 2848} {"train_loss": -12.32068157196045, "global_step": 478590, "epoch": 2848} {"train_loss": -12.468965530395508, "global_step": 478591, "epoch": 2848} {"train_loss": -12.238585472106934, "global_step": 478592, "epoch": 2848} {"train_loss": -12.080453872680664, "global_step": 478593, "epoch": 2848} {"train_loss": -12.339727401733398, "global_step": 478594, "epoch": 2848} {"train_loss": -12.467191696166992, "global_step": 478595, "epoch": 2848} {"train_loss": -12.522613525390625, "global_step": 478596, "epoch": 2848} {"train_loss": -11.891164779663086, "global_step": 478597, "epoch": 2848} {"train_loss": -12.486553192138672, "global_step": 478598, "epoch": 2848} {"train_loss": -12.222169876098633, "global_step": 478599, "epoch": 2848} {"train_loss": -12.644169807434082, "global_step": 478600, "epoch": 2848} {"train_loss": -12.45088005065918, "global_step": 478601, "epoch": 2848} {"train_loss": -12.455291748046875, "global_step": 478602, "epoch": 2848} {"train_loss": -11.818498611450195, "global_step": 478603, "epoch": 2848} {"train_loss": -12.658578872680664, "global_step": 478604, "epoch": 2848} {"train_loss": -11.827190399169922, "global_step": 478605, "epoch": 2848} {"train_loss": -12.152584075927734, "global_step": 478606, "epoch": 2848} {"train_loss": -12.579566955566406, "global_step": 478607, "epoch": 2848} {"train_loss": -12.374105453491211, "global_step": 478608, "epoch": 2848} {"train_loss": -12.447478294372559, "global_step": 478609, "epoch": 2848} {"train_loss": -12.400712966918945, "global_step": 478610, "epoch": 2848} {"train_loss": -12.507701873779297, "global_step": 478611, "epoch": 2848} {"train_loss": -12.388984680175781, "global_step": 478612, "epoch": 2848} {"train_loss": -12.311619758605957, "global_step": 478613, "epoch": 2848} {"train_loss": -12.242776870727539, "global_step": 478614, "epoch": 2848} {"train_loss": -12.710594177246094, "global_step": 478615, "epoch": 2848} {"train_loss": -12.213374137878418, "global_step": 478616, "epoch": 2848} {"train_loss": -12.026216506958008, "global_step": 478617, "epoch": 2848} {"train_loss": -12.108437538146973, "global_step": 478618, "epoch": 2848} {"train_loss": -12.455484390258789, "global_step": 478619, "epoch": 2848} {"train_loss": -12.151688575744629, "global_step": 478620, "epoch": 2848} {"train_loss": -12.3872709274292, "global_step": 478621, "epoch": 2848} {"train_loss": -12.528417587280273, "global_step": 478622, "epoch": 2848} {"train_loss": -12.268659591674805, "global_step": 478623, "epoch": 2848} {"train_loss": -12.332513809204102, "global_step": 478624, "epoch": 2848} {"train_loss": -12.358439445495605, "global_step": 478625, "epoch": 2848} {"train_loss": -12.258642196655273, "global_step": 478626, "epoch": 2848} {"train_loss": -11.789827346801758, "global_step": 478627, "epoch": 2848} {"train_loss": -12.517457008361816, "global_step": 478628, "epoch": 2848} {"train_loss": -11.957170486450195, "global_step": 478629, "epoch": 2848} {"train_loss": -12.162128448486328, "global_step": 478630, "epoch": 2848} {"train_loss": -12.003776317551022, "global_step": 478631, "epoch": 2848, "val_loss": 317971.84375} {"train_loss": -12.489243507385254, "global_step": 478632, "epoch": 2849} {"train_loss": -12.374933242797852, "global_step": 478633, "epoch": 2849} {"train_loss": -12.720839500427246, "global_step": 478634, "epoch": 2849} {"train_loss": -12.455699920654297, "global_step": 478635, "epoch": 2849} {"train_loss": -12.207010269165039, "global_step": 478636, "epoch": 2849} {"train_loss": -12.695741653442383, "global_step": 478637, "epoch": 2849} {"train_loss": -12.5440673828125, "global_step": 478638, "epoch": 2849} {"train_loss": -12.378874778747559, "global_step": 478639, "epoch": 2849} {"train_loss": -12.614298820495605, "global_step": 478640, "epoch": 2849} {"train_loss": -12.36541748046875, "global_step": 478641, "epoch": 2849} {"train_loss": -12.648178100585938, "global_step": 478642, "epoch": 2849} {"train_loss": -12.286457061767578, "global_step": 478643, "epoch": 2849} {"train_loss": -12.642123222351074, "global_step": 478644, "epoch": 2849} {"train_loss": -12.051076889038086, "global_step": 478645, "epoch": 2849} {"train_loss": -12.580448150634766, "global_step": 478646, "epoch": 2849} {"train_loss": -11.967870712280273, "global_step": 478647, "epoch": 2849} {"train_loss": -12.251611709594727, "global_step": 478648, "epoch": 2849} {"train_loss": -12.603004455566406, "global_step": 478649, "epoch": 2849} {"train_loss": -12.519651412963867, "global_step": 478650, "epoch": 2849} {"train_loss": -12.189981460571289, "global_step": 478651, "epoch": 2849} {"train_loss": -12.49405288696289, "global_step": 478652, "epoch": 2849} {"train_loss": -12.403900146484375, "global_step": 478653, "epoch": 2849} {"train_loss": -12.368171691894531, "global_step": 478654, "epoch": 2849} {"train_loss": -12.66140079498291, "global_step": 478655, "epoch": 2849} {"train_loss": -12.46581745147705, "global_step": 478656, "epoch": 2849} {"train_loss": -12.47610092163086, "global_step": 478657, "epoch": 2849} {"train_loss": -12.559956550598145, "global_step": 478658, "epoch": 2849} {"train_loss": -12.259876251220703, "global_step": 478659, "epoch": 2849} {"train_loss": -12.048402786254883, "global_step": 478660, "epoch": 2849} {"train_loss": -12.657336235046387, "global_step": 478661, "epoch": 2849} {"train_loss": -12.588123321533203, "global_step": 478662, "epoch": 2849} {"train_loss": -12.694801330566406, "global_step": 478663, "epoch": 2849} {"train_loss": -12.55025863647461, "global_step": 478664, "epoch": 2849} {"train_loss": -12.739839553833008, "global_step": 478665, "epoch": 2849} {"train_loss": -12.523406028747559, "global_step": 478666, "epoch": 2849} {"train_loss": -12.720643997192383, "global_step": 478667, "epoch": 2849} {"train_loss": -12.15257453918457, "global_step": 478668, "epoch": 2849} {"train_loss": -12.523508071899414, "global_step": 478669, "epoch": 2849} {"train_loss": -12.543381690979004, "global_step": 478670, "epoch": 2849} {"train_loss": -12.258899688720703, "global_step": 478671, "epoch": 2849} {"train_loss": -12.263004302978516, "global_step": 478672, "epoch": 2849} {"train_loss": -11.925451278686523, "global_step": 478673, "epoch": 2849} {"train_loss": -11.968912124633789, "global_step": 478674, "epoch": 2849} {"train_loss": -12.345248222351074, "global_step": 478675, "epoch": 2849} {"train_loss": -12.131704330444336, "global_step": 478676, "epoch": 2849} {"train_loss": -12.396025657653809, "global_step": 478677, "epoch": 2849} {"train_loss": -12.267261505126953, "global_step": 478678, "epoch": 2849} {"train_loss": -12.220520973205566, "global_step": 478679, "epoch": 2849} {"train_loss": -12.475255966186523, "global_step": 478680, "epoch": 2849} {"train_loss": -11.905111312866211, "global_step": 478681, "epoch": 2849} {"train_loss": -11.768112182617188, "global_step": 478682, "epoch": 2849} {"train_loss": -12.08997631072998, "global_step": 478683, "epoch": 2849} {"train_loss": -12.062211990356445, "global_step": 478684, "epoch": 2849} {"train_loss": -12.5737943649292, "global_step": 478685, "epoch": 2849} {"train_loss": -11.87441635131836, "global_step": 478686, "epoch": 2849} {"train_loss": -12.659046173095703, "global_step": 478687, "epoch": 2849} {"train_loss": -11.582953453063965, "global_step": 478688, "epoch": 2849} {"train_loss": -12.93562126159668, "global_step": 478689, "epoch": 2849} {"train_loss": -11.841292381286621, "global_step": 478690, "epoch": 2849} {"train_loss": -12.696378707885742, "global_step": 478691, "epoch": 2849} {"train_loss": -12.050267219543457, "global_step": 478692, "epoch": 2849} {"train_loss": -12.31994915008545, "global_step": 478693, "epoch": 2849} {"train_loss": -12.624598503112793, "global_step": 478694, "epoch": 2849} {"train_loss": -12.406877517700195, "global_step": 478695, "epoch": 2849} {"train_loss": -12.689435958862305, "global_step": 478696, "epoch": 2849} {"train_loss": -12.573009490966797, "global_step": 478697, "epoch": 2849} {"train_loss": -12.689713478088379, "global_step": 478698, "epoch": 2849} {"train_loss": -12.572439193725586, "global_step": 478699, "epoch": 2849} {"train_loss": -12.249685287475586, "global_step": 478700, "epoch": 2849} {"train_loss": -12.437527656555176, "global_step": 478701, "epoch": 2849} {"train_loss": -12.65902328491211, "global_step": 478702, "epoch": 2849} {"train_loss": -12.550113677978516, "global_step": 478703, "epoch": 2849} {"train_loss": -12.589019775390625, "global_step": 478704, "epoch": 2849} {"train_loss": -12.850334167480469, "global_step": 478705, "epoch": 2849} {"train_loss": -12.406335830688477, "global_step": 478706, "epoch": 2849} {"train_loss": -12.674553871154785, "global_step": 478707, "epoch": 2849} {"train_loss": -12.748306274414062, "global_step": 478708, "epoch": 2849} {"train_loss": -12.58839225769043, "global_step": 478709, "epoch": 2849} {"train_loss": -12.713799476623535, "global_step": 478710, "epoch": 2849} {"train_loss": -12.869476318359375, "global_step": 478711, "epoch": 2849} {"train_loss": -12.437250137329102, "global_step": 478712, "epoch": 2849} {"train_loss": -12.62250804901123, "global_step": 478713, "epoch": 2849} {"train_loss": -12.5247220993042, "global_step": 478714, "epoch": 2849} {"train_loss": -12.826009750366211, "global_step": 478715, "epoch": 2849} {"train_loss": -12.893657684326172, "global_step": 478716, "epoch": 2849} {"train_loss": -12.751214027404785, "global_step": 478717, "epoch": 2849} {"train_loss": -12.726337432861328, "global_step": 478718, "epoch": 2849} {"train_loss": -12.997196197509766, "global_step": 478719, "epoch": 2849} {"train_loss": -12.549108505249023, "global_step": 478720, "epoch": 2849} {"train_loss": -12.743372917175293, "global_step": 478721, "epoch": 2849} {"train_loss": -12.99355411529541, "global_step": 478722, "epoch": 2849} {"train_loss": -12.849651336669922, "global_step": 478723, "epoch": 2849} {"train_loss": -12.93720817565918, "global_step": 478724, "epoch": 2849} {"train_loss": -12.944150924682617, "global_step": 478725, "epoch": 2849} {"train_loss": -12.88711166381836, "global_step": 478726, "epoch": 2849} {"train_loss": -12.715909004211426, "global_step": 478727, "epoch": 2849} {"train_loss": -12.805097579956055, "global_step": 478728, "epoch": 2849} {"train_loss": -12.832303047180176, "global_step": 478729, "epoch": 2849} {"train_loss": -12.776496887207031, "global_step": 478730, "epoch": 2849} {"train_loss": -12.742145538330078, "global_step": 478731, "epoch": 2849} {"train_loss": -12.743093490600586, "global_step": 478732, "epoch": 2849} {"train_loss": -13.07203483581543, "global_step": 478733, "epoch": 2849} {"train_loss": -12.409038543701172, "global_step": 478734, "epoch": 2849} {"train_loss": -12.95855712890625, "global_step": 478735, "epoch": 2849} {"train_loss": -12.809999465942383, "global_step": 478736, "epoch": 2849} {"train_loss": -12.8814058303833, "global_step": 478737, "epoch": 2849} {"train_loss": -12.865920066833496, "global_step": 478738, "epoch": 2849} {"train_loss": -13.109172821044922, "global_step": 478739, "epoch": 2849} {"train_loss": -12.503029823303223, "global_step": 478740, "epoch": 2849} {"train_loss": -12.705795288085938, "global_step": 478741, "epoch": 2849} {"train_loss": -12.801057815551758, "global_step": 478742, "epoch": 2849} {"train_loss": -12.695355415344238, "global_step": 478743, "epoch": 2849} {"train_loss": -12.677864074707031, "global_step": 478744, "epoch": 2849} {"train_loss": -11.654424667358398, "global_step": 478745, "epoch": 2849} {"train_loss": -12.518962860107422, "global_step": 478746, "epoch": 2849} {"train_loss": -12.706308364868164, "global_step": 478747, "epoch": 2849} {"train_loss": -12.584131240844727, "global_step": 478748, "epoch": 2849} {"train_loss": -12.586130142211914, "global_step": 478749, "epoch": 2849} {"train_loss": -12.269271850585938, "global_step": 478750, "epoch": 2849} {"train_loss": -12.129182815551758, "global_step": 478751, "epoch": 2849} {"train_loss": -11.505046844482422, "global_step": 478752, "epoch": 2849} {"train_loss": -12.104534149169922, "global_step": 478753, "epoch": 2849} {"train_loss": -11.850475311279297, "global_step": 478754, "epoch": 2849} {"train_loss": -12.874589920043945, "global_step": 478755, "epoch": 2849} {"train_loss": -11.976968765258789, "global_step": 478756, "epoch": 2849} {"train_loss": -11.542530059814453, "global_step": 478757, "epoch": 2849} {"train_loss": -12.204944610595703, "global_step": 478758, "epoch": 2849} {"train_loss": -12.857498168945312, "global_step": 478759, "epoch": 2849} {"train_loss": -11.527677536010742, "global_step": 478760, "epoch": 2849} {"train_loss": -12.370180130004883, "global_step": 478761, "epoch": 2849} {"train_loss": -11.275043487548828, "global_step": 478762, "epoch": 2849} {"train_loss": -11.41163158416748, "global_step": 478763, "epoch": 2849} {"train_loss": -10.90318489074707, "global_step": 478764, "epoch": 2849} {"train_loss": -11.162734985351562, "global_step": 478765, "epoch": 2849} {"train_loss": -8.892223358154297, "global_step": 478766, "epoch": 2849} {"train_loss": -8.247160911560059, "global_step": 478767, "epoch": 2849} {"train_loss": -8.397000312805176, "global_step": 478768, "epoch": 2849} {"train_loss": -8.419053077697754, "global_step": 478769, "epoch": 2849} {"train_loss": -9.24656867980957, "global_step": 478770, "epoch": 2849} {"train_loss": -10.04311752319336, "global_step": 478771, "epoch": 2849} {"train_loss": -10.603987693786621, "global_step": 478772, "epoch": 2849} {"train_loss": -9.345483779907227, "global_step": 478773, "epoch": 2849} {"train_loss": -11.741369247436523, "global_step": 478774, "epoch": 2849} {"train_loss": -10.657281875610352, "global_step": 478775, "epoch": 2849} {"train_loss": -11.766120910644531, "global_step": 478776, "epoch": 2849} {"train_loss": -11.311726570129395, "global_step": 478777, "epoch": 2849} {"train_loss": -10.743581771850586, "global_step": 478778, "epoch": 2849} {"train_loss": -11.578346252441406, "global_step": 478779, "epoch": 2849} {"train_loss": -11.880162239074707, "global_step": 478780, "epoch": 2849} {"train_loss": -10.517589569091797, "global_step": 478781, "epoch": 2849} {"train_loss": -10.859342575073242, "global_step": 478782, "epoch": 2849} {"train_loss": -11.482246398925781, "global_step": 478783, "epoch": 2849} {"train_loss": -10.472082138061523, "global_step": 478784, "epoch": 2849} {"train_loss": -12.586307525634766, "global_step": 478785, "epoch": 2849} {"train_loss": -10.511580467224121, "global_step": 478786, "epoch": 2849} {"train_loss": -11.148775100708008, "global_step": 478787, "epoch": 2849} {"train_loss": -12.035175323486328, "global_step": 478788, "epoch": 2849} {"train_loss": -10.985459327697754, "global_step": 478789, "epoch": 2849} {"train_loss": -12.020099639892578, "global_step": 478790, "epoch": 2849} {"train_loss": -12.32145881652832, "global_step": 478791, "epoch": 2849} {"train_loss": -12.045578002929688, "global_step": 478792, "epoch": 2849} {"train_loss": -12.448921203613281, "global_step": 478793, "epoch": 2849} {"train_loss": -11.477334976196289, "global_step": 478794, "epoch": 2849} {"train_loss": -12.112017631530762, "global_step": 478795, "epoch": 2849} {"train_loss": -11.643230438232422, "global_step": 478796, "epoch": 2849} {"train_loss": -11.864192008972168, "global_step": 478797, "epoch": 2849} {"train_loss": -11.797988891601562, "global_step": 478798, "epoch": 2849} {"train_loss": -12.146908856573559, "global_step": 478799, "epoch": 2849, "val_loss": 313378.96875} {"train_loss": -11.943572998046875, "global_step": 478800, "epoch": 2850} {"train_loss": -11.382660865783691, "global_step": 478801, "epoch": 2850} {"train_loss": -12.626426696777344, "global_step": 478802, "epoch": 2850} {"train_loss": -11.428255081176758, "global_step": 478803, "epoch": 2850} {"train_loss": -12.145362854003906, "global_step": 478804, "epoch": 2850} {"train_loss": -12.38087272644043, "global_step": 478805, "epoch": 2850} {"train_loss": -11.910959243774414, "global_step": 478806, "epoch": 2850} {"train_loss": -12.417503356933594, "global_step": 478807, "epoch": 2850} {"train_loss": -11.835502624511719, "global_step": 478808, "epoch": 2850} {"train_loss": -12.151447296142578, "global_step": 478809, "epoch": 2850} {"train_loss": -12.054001808166504, "global_step": 478810, "epoch": 2850} {"train_loss": -11.616159439086914, "global_step": 478811, "epoch": 2850} {"train_loss": -12.036457061767578, "global_step": 478812, "epoch": 2850} {"train_loss": -11.637689590454102, "global_step": 478813, "epoch": 2850} {"train_loss": -11.747758865356445, "global_step": 478814, "epoch": 2850} {"train_loss": -12.206075668334961, "global_step": 478815, "epoch": 2850} {"train_loss": -11.35197925567627, "global_step": 478816, "epoch": 2850} {"train_loss": -11.818435668945312, "global_step": 478817, "epoch": 2850} {"train_loss": -11.753564834594727, "global_step": 478818, "epoch": 2850} {"train_loss": -12.336219787597656, "global_step": 478819, "epoch": 2850} {"train_loss": -12.312408447265625, "global_step": 478820, "epoch": 2850} {"train_loss": -11.840705871582031, "global_step": 478821, "epoch": 2850} {"train_loss": -12.334268569946289, "global_step": 478822, "epoch": 2850} {"train_loss": -11.357324600219727, "global_step": 478823, "epoch": 2850} {"train_loss": -12.052587509155273, "global_step": 478824, "epoch": 2850} {"train_loss": -11.906152725219727, "global_step": 478825, "epoch": 2850} {"train_loss": -11.964642524719238, "global_step": 478826, "epoch": 2850} {"train_loss": -12.11821174621582, "global_step": 478827, "epoch": 2850} {"train_loss": -11.517668724060059, "global_step": 478828, "epoch": 2850} {"train_loss": -11.512246131896973, "global_step": 478829, "epoch": 2850} {"train_loss": -12.335411071777344, "global_step": 478830, "epoch": 2850} {"train_loss": -11.657063484191895, "global_step": 478831, "epoch": 2850} {"train_loss": -12.151326179504395, "global_step": 478832, "epoch": 2850} {"train_loss": -11.781959533691406, "global_step": 478833, "epoch": 2850} {"train_loss": -11.471900939941406, "global_step": 478834, "epoch": 2850} {"train_loss": -12.618412971496582, "global_step": 478835, "epoch": 2850} {"train_loss": -11.719860076904297, "global_step": 478836, "epoch": 2850} {"train_loss": -12.448979377746582, "global_step": 478837, "epoch": 2850} {"train_loss": -12.18027114868164, "global_step": 478838, "epoch": 2850} {"train_loss": -12.234468460083008, "global_step": 478839, "epoch": 2850} {"train_loss": -12.197500228881836, "global_step": 478840, "epoch": 2850} {"train_loss": -12.408591270446777, "global_step": 478841, "epoch": 2850} {"train_loss": -12.408002853393555, "global_step": 478842, "epoch": 2850} {"train_loss": -12.592079162597656, "global_step": 478843, "epoch": 2850} {"train_loss": -12.3139066696167, "global_step": 478844, "epoch": 2850} {"train_loss": -12.671422004699707, "global_step": 478845, "epoch": 2850} {"train_loss": -12.43769645690918, "global_step": 478846, "epoch": 2850} {"train_loss": -12.392867088317871, "global_step": 478847, "epoch": 2850} {"train_loss": -12.489969253540039, "global_step": 478848, "epoch": 2850} {"train_loss": -12.507415771484375, "global_step": 478849, "epoch": 2850} {"train_loss": -12.594600677490234, "global_step": 478850, "epoch": 2850} {"train_loss": -12.50160026550293, "global_step": 478851, "epoch": 2850} {"train_loss": -12.597150802612305, "global_step": 478852, "epoch": 2850} {"train_loss": -11.891558647155762, "global_step": 478853, "epoch": 2850} {"train_loss": -12.50828742980957, "global_step": 478854, "epoch": 2850} {"train_loss": -12.201642990112305, "global_step": 478855, "epoch": 2850} {"train_loss": -12.524748802185059, "global_step": 478856, "epoch": 2850} {"train_loss": -12.325996398925781, "global_step": 478857, "epoch": 2850} {"train_loss": -12.323348999023438, "global_step": 478858, "epoch": 2850} {"train_loss": -12.603078842163086, "global_step": 478859, "epoch": 2850} {"train_loss": -12.298687934875488, "global_step": 478860, "epoch": 2850} {"train_loss": -12.408713340759277, "global_step": 478861, "epoch": 2850} {"train_loss": -12.516396522521973, "global_step": 478862, "epoch": 2850} {"train_loss": -12.635607719421387, "global_step": 478863, "epoch": 2850} {"train_loss": -12.800300598144531, "global_step": 478864, "epoch": 2850} {"train_loss": -12.558175086975098, "global_step": 478865, "epoch": 2850} {"train_loss": -12.74346923828125, "global_step": 478866, "epoch": 2850} {"train_loss": -12.686834335327148, "global_step": 478867, "epoch": 2850} {"train_loss": -12.702411651611328, "global_step": 478868, "epoch": 2850} {"train_loss": -12.841863632202148, "global_step": 478869, "epoch": 2850} {"train_loss": -12.501138687133789, "global_step": 478870, "epoch": 2850} {"train_loss": -12.516247749328613, "global_step": 478871, "epoch": 2850} {"train_loss": -12.8831205368042, "global_step": 478872, "epoch": 2850} {"train_loss": -12.568801879882812, "global_step": 478873, "epoch": 2850} {"train_loss": -12.595907211303711, "global_step": 478874, "epoch": 2850} {"train_loss": -12.525718688964844, "global_step": 478875, "epoch": 2850} {"train_loss": -12.703655242919922, "global_step": 478876, "epoch": 2850} {"train_loss": -12.76999282836914, "global_step": 478877, "epoch": 2850} {"train_loss": -12.75320053100586, "global_step": 478878, "epoch": 2850} {"train_loss": -12.766769409179688, "global_step": 478879, "epoch": 2850} {"train_loss": -12.867168426513672, "global_step": 478880, "epoch": 2850} {"train_loss": -12.87954330444336, "global_step": 478881, "epoch": 2850} {"train_loss": -12.90498161315918, "global_step": 478882, "epoch": 2850} {"train_loss": -12.504545211791992, "global_step": 478883, "epoch": 2850} {"train_loss": -12.739303588867188, "global_step": 478884, "epoch": 2850} {"train_loss": -12.833450317382812, "global_step": 478885, "epoch": 2850} {"train_loss": -12.757692337036133, "global_step": 478886, "epoch": 2850} {"train_loss": -12.84742546081543, "global_step": 478887, "epoch": 2850} {"train_loss": -12.891298294067383, "global_step": 478888, "epoch": 2850} {"train_loss": -12.607019424438477, "global_step": 478889, "epoch": 2850} {"train_loss": -12.176748275756836, "global_step": 478890, "epoch": 2850} {"train_loss": -11.994840621948242, "global_step": 478891, "epoch": 2850} {"train_loss": -12.103827476501465, "global_step": 478892, "epoch": 2850} {"train_loss": -11.908272743225098, "global_step": 478893, "epoch": 2850} {"train_loss": -12.066502571105957, "global_step": 478894, "epoch": 2850} {"train_loss": -11.774951934814453, "global_step": 478895, "epoch": 2850} {"train_loss": -12.264403343200684, "global_step": 478896, "epoch": 2850} {"train_loss": -12.124174118041992, "global_step": 478897, "epoch": 2850} {"train_loss": -11.497798919677734, "global_step": 478898, "epoch": 2850} {"train_loss": -12.25341510772705, "global_step": 478899, "epoch": 2850} {"train_loss": -12.207027435302734, "global_step": 478900, "epoch": 2850} {"train_loss": -11.362900733947754, "global_step": 478901, "epoch": 2850} {"train_loss": -11.875299453735352, "global_step": 478902, "epoch": 2850} {"train_loss": -11.500967025756836, "global_step": 478903, "epoch": 2850} {"train_loss": -10.345142364501953, "global_step": 478904, "epoch": 2850} {"train_loss": -12.733312606811523, "global_step": 478905, "epoch": 2850} {"train_loss": -10.473211288452148, "global_step": 478906, "epoch": 2850} {"train_loss": -12.104276657104492, "global_step": 478907, "epoch": 2850} {"train_loss": -12.453593254089355, "global_step": 478908, "epoch": 2850} {"train_loss": -12.03963851928711, "global_step": 478909, "epoch": 2850} {"train_loss": -12.521965980529785, "global_step": 478910, "epoch": 2850} {"train_loss": -12.188858985900879, "global_step": 478911, "epoch": 2850} {"train_loss": -12.217778205871582, "global_step": 478912, "epoch": 2850} {"train_loss": -11.749595642089844, "global_step": 478913, "epoch": 2850} {"train_loss": -12.556406021118164, "global_step": 478914, "epoch": 2850} {"train_loss": -11.947532653808594, "global_step": 478915, "epoch": 2850} {"train_loss": -12.589715003967285, "global_step": 478916, "epoch": 2850} {"train_loss": -12.680900573730469, "global_step": 478917, "epoch": 2850} {"train_loss": -12.342100143432617, "global_step": 478918, "epoch": 2850} {"train_loss": -12.004773139953613, "global_step": 478919, "epoch": 2850} {"train_loss": -12.75389289855957, "global_step": 478920, "epoch": 2850} {"train_loss": -12.670821189880371, "global_step": 478921, "epoch": 2850} {"train_loss": -12.07078742980957, "global_step": 478922, "epoch": 2850} {"train_loss": -12.238607406616211, "global_step": 478923, "epoch": 2850} {"train_loss": -12.951271057128906, "global_step": 478924, "epoch": 2850} {"train_loss": -12.201532363891602, "global_step": 478925, "epoch": 2850} {"train_loss": -12.561641693115234, "global_step": 478926, "epoch": 2850} {"train_loss": -12.705737113952637, "global_step": 478927, "epoch": 2850} {"train_loss": -12.227378845214844, "global_step": 478928, "epoch": 2850} {"train_loss": -12.583908081054688, "global_step": 478929, "epoch": 2850} {"train_loss": -12.428420066833496, "global_step": 478930, "epoch": 2850} {"train_loss": -12.026155471801758, "global_step": 478931, "epoch": 2850} {"train_loss": -12.680262565612793, "global_step": 478932, "epoch": 2850} {"train_loss": -12.136037826538086, "global_step": 478933, "epoch": 2850} {"train_loss": -12.338776588439941, "global_step": 478934, "epoch": 2850} {"train_loss": -12.169817924499512, "global_step": 478935, "epoch": 2850} {"train_loss": -12.610071182250977, "global_step": 478936, "epoch": 2850} {"train_loss": -12.211060523986816, "global_step": 478937, "epoch": 2850} {"train_loss": -11.736493110656738, "global_step": 478938, "epoch": 2850} {"train_loss": -12.339767456054688, "global_step": 478939, "epoch": 2850} {"train_loss": -10.574362754821777, "global_step": 478940, "epoch": 2850} {"train_loss": -11.836755752563477, "global_step": 478941, "epoch": 2850} {"train_loss": -11.175003051757812, "global_step": 478942, "epoch": 2850} {"train_loss": -10.900409698486328, "global_step": 478943, "epoch": 2850} {"train_loss": -9.693689346313477, "global_step": 478944, "epoch": 2850} {"train_loss": -10.260543823242188, "global_step": 478945, "epoch": 2850} {"train_loss": -9.782992362976074, "global_step": 478946, "epoch": 2850} {"train_loss": -10.704925537109375, "global_step": 478947, "epoch": 2850} {"train_loss": -10.406942367553711, "global_step": 478948, "epoch": 2850} {"train_loss": -9.812135696411133, "global_step": 478949, "epoch": 2850} {"train_loss": -11.00421142578125, "global_step": 478950, "epoch": 2850} {"train_loss": -9.541053771972656, "global_step": 478951, "epoch": 2850} {"train_loss": -9.684565544128418, "global_step": 478952, "epoch": 2850} {"train_loss": -11.25661849975586, "global_step": 478953, "epoch": 2850} {"train_loss": -10.434325218200684, "global_step": 478954, "epoch": 2850} {"train_loss": -10.471746444702148, "global_step": 478955, "epoch": 2850} {"train_loss": -11.667123794555664, "global_step": 478956, "epoch": 2850} {"train_loss": -10.252920150756836, "global_step": 478957, "epoch": 2850} {"train_loss": -11.119483947753906, "global_step": 478958, "epoch": 2850} {"train_loss": -9.955160140991211, "global_step": 478959, "epoch": 2850} {"train_loss": -10.098743438720703, "global_step": 478960, "epoch": 2850} {"train_loss": -10.06679916381836, "global_step": 478961, "epoch": 2850} {"train_loss": -12.070106506347656, "global_step": 478962, "epoch": 2850} {"train_loss": -10.680400848388672, "global_step": 478963, "epoch": 2850} {"train_loss": -10.906838417053223, "global_step": 478964, "epoch": 2850} {"train_loss": -11.933843612670898, "global_step": 478965, "epoch": 2850} {"train_loss": -11.307886123657227, "global_step": 478966, "epoch": 2850} {"train_loss": -11.987322648366293, "global_step": 478967, "epoch": 2850, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 0.9763782792860016, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.7254024367461138, "train/sim_max_reward_4": 0.961018694106263, "train/sim_max_reward_5": 0.7077363234404243, "test/sim_max_reward_4400000": 0.8245479685193334, "test/sim_max_reward_4400001": 0.34524959106572084, "test/sim_max_reward_4400002": 0.09782455886636791, "test/sim_max_reward_4400003": 0.09756925254059329, "test/sim_max_reward_4400004": 0.6431499770875544, "test/sim_max_reward_4400005": 0.9954260677289916, "test/sim_max_reward_4400006": 0.9405356995014595, "test/sim_max_reward_4400007": 0.49313120061135146, "test/sim_max_reward_4400008": 0.633425384576026, "test/sim_max_reward_4400009": 0.4059235426138988, "test/sim_max_reward_4400010": 0.2595396738118182, "test/sim_max_reward_4400011": 0.9440226308508067, "test/sim_max_reward_4400012": 0.14110722128947978, "test/sim_max_reward_4400013": 0.9901977812393463, "test/sim_max_reward_4400014": 0.5185038892198328, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9761703771241853, "test/sim_max_reward_4400019": 0.5961209303133523, "test/sim_max_reward_4400020": 2.576982773665235e-05, "test/sim_max_reward_4400021": 0.6907542422245356, "test/sim_max_reward_4400022": 0.0, "test/sim_max_reward_4400023": 0.0, "test/sim_max_reward_4400024": 0.9975756832332776, "test/sim_max_reward_4400025": 0.5215358859694778, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.9699855257419512, "test/sim_max_reward_4400028": 0.9925717081886651, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 0.9869496005889453, "test/sim_max_reward_4400031": 0.6922987917789706, "test/sim_max_reward_4400032": 0.36027243422954786, "test/sim_max_reward_4400033": 0.6707387034622546, "test/sim_max_reward_4400034": 0.6864772185794789, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.36771900390989315, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.300428709203356, "test/sim_max_reward_4400039": 0.959570571290169, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.16555849196911157, "test/sim_max_reward_4400042": 0.5182080011170447, "test/sim_max_reward_4400043": 0.2594167115293713, "test/sim_max_reward_4400044": 0.9970442947320878, "test/sim_max_reward_4400045": 0.6532449229156869, "test/sim_max_reward_4400046": 0.9932706054697406, "test/sim_max_reward_4400047": 1.0, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.33055503713539686, "train/mean_score": 0.7284226222631337, "test/mean_score": 0.5260194648885769, "val_loss": 317523.5, "train_action_mse_error": 1.6881942749023438} {"train_loss": -12.181801795959473, "global_step": 478968, "epoch": 2851} {"train_loss": -10.64954948425293, "global_step": 478969, "epoch": 2851} {"train_loss": -11.336827278137207, "global_step": 478970, "epoch": 2851} {"train_loss": -10.911754608154297, "global_step": 478971, "epoch": 2851} {"train_loss": -10.993171691894531, "global_step": 478972, "epoch": 2851} {"train_loss": -10.692675590515137, "global_step": 478973, "epoch": 2851} {"train_loss": -11.270031929016113, "global_step": 478974, "epoch": 2851} {"train_loss": -11.534666061401367, "global_step": 478975, "epoch": 2851} {"train_loss": -10.496623992919922, "global_step": 478976, "epoch": 2851} {"train_loss": -11.191217422485352, "global_step": 478977, "epoch": 2851} {"train_loss": -12.26707649230957, "global_step": 478978, "epoch": 2851} {"train_loss": -10.96769905090332, "global_step": 478979, "epoch": 2851} {"train_loss": -12.08200454711914, "global_step": 478980, "epoch": 2851} {"train_loss": -11.079445838928223, "global_step": 478981, "epoch": 2851} {"train_loss": -11.625874519348145, "global_step": 478982, "epoch": 2851} {"train_loss": -11.558156967163086, "global_step": 478983, "epoch": 2851} {"train_loss": -11.865796089172363, "global_step": 478984, "epoch": 2851} {"train_loss": -11.505151748657227, "global_step": 478985, "epoch": 2851} {"train_loss": -12.238800048828125, "global_step": 478986, "epoch": 2851} {"train_loss": -11.217247009277344, "global_step": 478987, "epoch": 2851} {"train_loss": -11.976795196533203, "global_step": 478988, "epoch": 2851} {"train_loss": -11.93498706817627, "global_step": 478989, "epoch": 2851} {"train_loss": -11.352884292602539, "global_step": 478990, "epoch": 2851} {"train_loss": -12.128389358520508, "global_step": 478991, "epoch": 2851} {"train_loss": -11.588481903076172, "global_step": 478992, "epoch": 2851} {"train_loss": -12.075382232666016, "global_step": 478993, "epoch": 2851} {"train_loss": -12.229375839233398, "global_step": 478994, "epoch": 2851} {"train_loss": -12.099523544311523, "global_step": 478995, "epoch": 2851} {"train_loss": -12.303797721862793, "global_step": 478996, "epoch": 2851} {"train_loss": -12.152082443237305, "global_step": 478997, "epoch": 2851} {"train_loss": -12.229089736938477, "global_step": 478998, "epoch": 2851} {"train_loss": -12.53462028503418, "global_step": 478999, "epoch": 2851} {"train_loss": -12.296462059020996, "global_step": 479000, "epoch": 2851} {"train_loss": -12.171218872070312, "global_step": 479001, "epoch": 2851} {"train_loss": -12.3576078414917, "global_step": 479002, "epoch": 2851} {"train_loss": -12.223068237304688, "global_step": 479003, "epoch": 2851} {"train_loss": -12.261739730834961, "global_step": 479004, "epoch": 2851} {"train_loss": -12.343814849853516, "global_step": 479005, "epoch": 2851} {"train_loss": -12.437835693359375, "global_step": 479006, "epoch": 2851} {"train_loss": -12.604940414428711, "global_step": 479007, "epoch": 2851} {"train_loss": -12.51180648803711, "global_step": 479008, "epoch": 2851} {"train_loss": -12.7232084274292, "global_step": 479009, "epoch": 2851} {"train_loss": -12.554668426513672, "global_step": 479010, "epoch": 2851} {"train_loss": -12.60361385345459, "global_step": 479011, "epoch": 2851} {"train_loss": -12.663932800292969, "global_step": 479012, "epoch": 2851} {"train_loss": -12.502789497375488, "global_step": 479013, "epoch": 2851} {"train_loss": -12.501704216003418, "global_step": 479014, "epoch": 2851} {"train_loss": -12.353553771972656, "global_step": 479015, "epoch": 2851} {"train_loss": -12.580648422241211, "global_step": 479016, "epoch": 2851} {"train_loss": -12.47443962097168, "global_step": 479017, "epoch": 2851} {"train_loss": -12.589447975158691, "global_step": 479018, "epoch": 2851} {"train_loss": -12.799188613891602, "global_step": 479019, "epoch": 2851} {"train_loss": -12.55850887298584, "global_step": 479020, "epoch": 2851} {"train_loss": -12.476583480834961, "global_step": 479021, "epoch": 2851} {"train_loss": -12.748699188232422, "global_step": 479022, "epoch": 2851} {"train_loss": -12.428560256958008, "global_step": 479023, "epoch": 2851} {"train_loss": -12.578213691711426, "global_step": 479024, "epoch": 2851} {"train_loss": -12.569332122802734, "global_step": 479025, "epoch": 2851} {"train_loss": -12.616096496582031, "global_step": 479026, "epoch": 2851} {"train_loss": -12.714081764221191, "global_step": 479027, "epoch": 2851} {"train_loss": -12.717681884765625, "global_step": 479028, "epoch": 2851} {"train_loss": -12.580385208129883, "global_step": 479029, "epoch": 2851} {"train_loss": -12.565138816833496, "global_step": 479030, "epoch": 2851} {"train_loss": -12.757333755493164, "global_step": 479031, "epoch": 2851} {"train_loss": -12.878619194030762, "global_step": 479032, "epoch": 2851} {"train_loss": -12.791125297546387, "global_step": 479033, "epoch": 2851} {"train_loss": -12.788036346435547, "global_step": 479034, "epoch": 2851} {"train_loss": -12.724733352661133, "global_step": 479035, "epoch": 2851} {"train_loss": -12.638286590576172, "global_step": 479036, "epoch": 2851} {"train_loss": -12.78129768371582, "global_step": 479037, "epoch": 2851} {"train_loss": -12.80459213256836, "global_step": 479038, "epoch": 2851} {"train_loss": -12.690973281860352, "global_step": 479039, "epoch": 2851} {"train_loss": -12.80292797088623, "global_step": 479040, "epoch": 2851} {"train_loss": -12.858378410339355, "global_step": 479041, "epoch": 2851} {"train_loss": -12.610977172851562, "global_step": 479042, "epoch": 2851} {"train_loss": -12.709463119506836, "global_step": 479043, "epoch": 2851} {"train_loss": -12.713504791259766, "global_step": 479044, "epoch": 2851} {"train_loss": -12.828941345214844, "global_step": 479045, "epoch": 2851} {"train_loss": -12.738595962524414, "global_step": 479046, "epoch": 2851} {"train_loss": -12.745416641235352, "global_step": 479047, "epoch": 2851} {"train_loss": -12.850067138671875, "global_step": 479048, "epoch": 2851} {"train_loss": -12.70828628540039, "global_step": 479049, "epoch": 2851} {"train_loss": -12.504480361938477, "global_step": 479050, "epoch": 2851} {"train_loss": -12.773300170898438, "global_step": 479051, "epoch": 2851} {"train_loss": -12.94822883605957, "global_step": 479052, "epoch": 2851} {"train_loss": -13.0148286819458, "global_step": 479053, "epoch": 2851} {"train_loss": -12.673842430114746, "global_step": 479054, "epoch": 2851} {"train_loss": -12.952259063720703, "global_step": 479055, "epoch": 2851} {"train_loss": -12.790416717529297, "global_step": 479056, "epoch": 2851} {"train_loss": -12.716899871826172, "global_step": 479057, "epoch": 2851} {"train_loss": -12.62549877166748, "global_step": 479058, "epoch": 2851} {"train_loss": -12.81722640991211, "global_step": 479059, "epoch": 2851} {"train_loss": -12.778756141662598, "global_step": 479060, "epoch": 2851} {"train_loss": -12.873516082763672, "global_step": 479061, "epoch": 2851} {"train_loss": -12.895612716674805, "global_step": 479062, "epoch": 2851} {"train_loss": -12.933527946472168, "global_step": 479063, "epoch": 2851} {"train_loss": -12.861092567443848, "global_step": 479064, "epoch": 2851} {"train_loss": -13.063282012939453, "global_step": 479065, "epoch": 2851} {"train_loss": -12.79749870300293, "global_step": 479066, "epoch": 2851} {"train_loss": -12.90660285949707, "global_step": 479067, "epoch": 2851} {"train_loss": -12.894682884216309, "global_step": 479068, "epoch": 2851} {"train_loss": -12.90371322631836, "global_step": 479069, "epoch": 2851} {"train_loss": -13.028678894042969, "global_step": 479070, "epoch": 2851} {"train_loss": -12.731637954711914, "global_step": 479071, "epoch": 2851} {"train_loss": -12.960453033447266, "global_step": 479072, "epoch": 2851} {"train_loss": -12.709503173828125, "global_step": 479073, "epoch": 2851} {"train_loss": -12.691177368164062, "global_step": 479074, "epoch": 2851} {"train_loss": -12.805163383483887, "global_step": 479075, "epoch": 2851} {"train_loss": -12.676347732543945, "global_step": 479076, "epoch": 2851} {"train_loss": -12.605222702026367, "global_step": 479077, "epoch": 2851} {"train_loss": -12.589595794677734, "global_step": 479078, "epoch": 2851} {"train_loss": -13.114913940429688, "global_step": 479079, "epoch": 2851} {"train_loss": -12.882396697998047, "global_step": 479080, "epoch": 2851} {"train_loss": -12.97868537902832, "global_step": 479081, "epoch": 2851} {"train_loss": -12.548580169677734, "global_step": 479082, "epoch": 2851} {"train_loss": -12.519073486328125, "global_step": 479083, "epoch": 2851} {"train_loss": -11.669550895690918, "global_step": 479084, "epoch": 2851} {"train_loss": -12.240829467773438, "global_step": 479085, "epoch": 2851} {"train_loss": -12.71860122680664, "global_step": 479086, "epoch": 2851} {"train_loss": -11.543022155761719, "global_step": 479087, "epoch": 2851} {"train_loss": -12.096890449523926, "global_step": 479088, "epoch": 2851} {"train_loss": -12.402482032775879, "global_step": 479089, "epoch": 2851} {"train_loss": -11.766728401184082, "global_step": 479090, "epoch": 2851} {"train_loss": -12.268169403076172, "global_step": 479091, "epoch": 2851} {"train_loss": -11.64426326751709, "global_step": 479092, "epoch": 2851} {"train_loss": -12.4436616897583, "global_step": 479093, "epoch": 2851} {"train_loss": -12.477413177490234, "global_step": 479094, "epoch": 2851} {"train_loss": -12.01390552520752, "global_step": 479095, "epoch": 2851} {"train_loss": -12.02981185913086, "global_step": 479096, "epoch": 2851} {"train_loss": -12.425949096679688, "global_step": 479097, "epoch": 2851} {"train_loss": -11.794921875, "global_step": 479098, "epoch": 2851} {"train_loss": -12.181529998779297, "global_step": 479099, "epoch": 2851} {"train_loss": -12.680976867675781, "global_step": 479100, "epoch": 2851} {"train_loss": -12.327411651611328, "global_step": 479101, "epoch": 2851} {"train_loss": -12.607611656188965, "global_step": 479102, "epoch": 2851} {"train_loss": -12.530618667602539, "global_step": 479103, "epoch": 2851} {"train_loss": -12.048904418945312, "global_step": 479104, "epoch": 2851} {"train_loss": -11.585541725158691, "global_step": 479105, "epoch": 2851} {"train_loss": -11.925516128540039, "global_step": 479106, "epoch": 2851} {"train_loss": -11.796683311462402, "global_step": 479107, "epoch": 2851} {"train_loss": -11.203640937805176, "global_step": 479108, "epoch": 2851} {"train_loss": -12.081327438354492, "global_step": 479109, "epoch": 2851} {"train_loss": -11.975173950195312, "global_step": 479110, "epoch": 2851} {"train_loss": -11.040639877319336, "global_step": 479111, "epoch": 2851} {"train_loss": -11.917712211608887, "global_step": 479112, "epoch": 2851} {"train_loss": -10.704545974731445, "global_step": 479113, "epoch": 2851} {"train_loss": -12.35566520690918, "global_step": 479114, "epoch": 2851} {"train_loss": -12.243545532226562, "global_step": 479115, "epoch": 2851} {"train_loss": -11.60008716583252, "global_step": 479116, "epoch": 2851} {"train_loss": -12.65761661529541, "global_step": 479117, "epoch": 2851} {"train_loss": -12.18339729309082, "global_step": 479118, "epoch": 2851} {"train_loss": -11.87755012512207, "global_step": 479119, "epoch": 2851} {"train_loss": -12.109172821044922, "global_step": 479120, "epoch": 2851} {"train_loss": -12.284488677978516, "global_step": 479121, "epoch": 2851} {"train_loss": -11.668233871459961, "global_step": 479122, "epoch": 2851} {"train_loss": -12.418027877807617, "global_step": 479123, "epoch": 2851} {"train_loss": -12.581706047058105, "global_step": 479124, "epoch": 2851} {"train_loss": -12.014891624450684, "global_step": 479125, "epoch": 2851} {"train_loss": -12.295631408691406, "global_step": 479126, "epoch": 2851} {"train_loss": -12.802241325378418, "global_step": 479127, "epoch": 2851} {"train_loss": -11.843172073364258, "global_step": 479128, "epoch": 2851} {"train_loss": -12.641061782836914, "global_step": 479129, "epoch": 2851} {"train_loss": -12.883749008178711, "global_step": 479130, "epoch": 2851} {"train_loss": -12.647714614868164, "global_step": 479131, "epoch": 2851} {"train_loss": -12.76959228515625, "global_step": 479132, "epoch": 2851} {"train_loss": -12.564130783081055, "global_step": 479133, "epoch": 2851} {"train_loss": -12.819341659545898, "global_step": 479134, "epoch": 2851} {"train_loss": -12.323229426429386, "global_step": 479135, "epoch": 2851, "val_loss": 316664.40625} {"train_loss": -12.751304626464844, "global_step": 479136, "epoch": 2852} {"train_loss": -12.533480644226074, "global_step": 479137, "epoch": 2852} {"train_loss": -12.22314739227295, "global_step": 479138, "epoch": 2852} {"train_loss": -12.483987808227539, "global_step": 479139, "epoch": 2852} {"train_loss": -12.266311645507812, "global_step": 479140, "epoch": 2852} {"train_loss": -12.70687198638916, "global_step": 479141, "epoch": 2852} {"train_loss": -12.53956413269043, "global_step": 479142, "epoch": 2852} {"train_loss": -12.696043014526367, "global_step": 479143, "epoch": 2852} {"train_loss": -12.907785415649414, "global_step": 479144, "epoch": 2852} {"train_loss": -12.733707427978516, "global_step": 479145, "epoch": 2852} {"train_loss": -12.299808502197266, "global_step": 479146, "epoch": 2852} {"train_loss": -12.63768196105957, "global_step": 479147, "epoch": 2852} {"train_loss": -12.811393737792969, "global_step": 479148, "epoch": 2852} {"train_loss": -12.610184669494629, "global_step": 479149, "epoch": 2852} {"train_loss": -12.774513244628906, "global_step": 479150, "epoch": 2852} {"train_loss": -12.736262321472168, "global_step": 479151, "epoch": 2852} {"train_loss": -12.635172843933105, "global_step": 479152, "epoch": 2852} {"train_loss": -12.357634544372559, "global_step": 479153, "epoch": 2852} {"train_loss": -12.756633758544922, "global_step": 479154, "epoch": 2852} {"train_loss": -12.114557266235352, "global_step": 479155, "epoch": 2852} {"train_loss": -12.210075378417969, "global_step": 479156, "epoch": 2852} {"train_loss": -12.29399299621582, "global_step": 479157, "epoch": 2852} {"train_loss": -11.458544731140137, "global_step": 479158, "epoch": 2852} {"train_loss": -10.955791473388672, "global_step": 479159, "epoch": 2852} {"train_loss": -12.570355415344238, "global_step": 479160, "epoch": 2852} {"train_loss": -11.324115753173828, "global_step": 479161, "epoch": 2852} {"train_loss": -11.194768905639648, "global_step": 479162, "epoch": 2852} {"train_loss": -12.407429695129395, "global_step": 479163, "epoch": 2852} {"train_loss": -11.744489669799805, "global_step": 479164, "epoch": 2852} {"train_loss": -11.664878845214844, "global_step": 479165, "epoch": 2852} {"train_loss": -12.511048316955566, "global_step": 479166, "epoch": 2852} {"train_loss": -11.792094230651855, "global_step": 479167, "epoch": 2852} {"train_loss": -11.678821563720703, "global_step": 479168, "epoch": 2852} {"train_loss": -12.789072036743164, "global_step": 479169, "epoch": 2852} {"train_loss": -11.62743091583252, "global_step": 479170, "epoch": 2852} {"train_loss": -12.071023941040039, "global_step": 479171, "epoch": 2852} {"train_loss": -12.112264633178711, "global_step": 479172, "epoch": 2852} {"train_loss": -12.09490966796875, "global_step": 479173, "epoch": 2852} {"train_loss": -12.086458206176758, "global_step": 479174, "epoch": 2852} {"train_loss": -12.630139350891113, "global_step": 479175, "epoch": 2852} {"train_loss": -11.521069526672363, "global_step": 479176, "epoch": 2852} {"train_loss": -12.627710342407227, "global_step": 479177, "epoch": 2852} {"train_loss": -11.85002326965332, "global_step": 479178, "epoch": 2852} {"train_loss": -12.071391105651855, "global_step": 479179, "epoch": 2852} {"train_loss": -12.497886657714844, "global_step": 479180, "epoch": 2852} {"train_loss": -12.170215606689453, "global_step": 479181, "epoch": 2852} {"train_loss": -12.622159957885742, "global_step": 479182, "epoch": 2852} {"train_loss": -12.561888694763184, "global_step": 479183, "epoch": 2852} {"train_loss": -12.691695213317871, "global_step": 479184, "epoch": 2852} {"train_loss": -12.772098541259766, "global_step": 479185, "epoch": 2852} {"train_loss": -12.439542770385742, "global_step": 479186, "epoch": 2852} {"train_loss": -12.721283912658691, "global_step": 479187, "epoch": 2852} {"train_loss": -12.315146446228027, "global_step": 479188, "epoch": 2852} {"train_loss": -12.51738166809082, "global_step": 479189, "epoch": 2852} {"train_loss": -12.812577247619629, "global_step": 479190, "epoch": 2852} {"train_loss": -12.601022720336914, "global_step": 479191, "epoch": 2852} {"train_loss": -12.635028839111328, "global_step": 479192, "epoch": 2852} {"train_loss": -12.675463676452637, "global_step": 479193, "epoch": 2852} {"train_loss": -12.845829010009766, "global_step": 479194, "epoch": 2852} {"train_loss": -12.653523445129395, "global_step": 479195, "epoch": 2852} {"train_loss": -12.97536849975586, "global_step": 479196, "epoch": 2852} {"train_loss": -12.650618553161621, "global_step": 479197, "epoch": 2852} {"train_loss": -12.849079132080078, "global_step": 479198, "epoch": 2852} {"train_loss": -12.565201759338379, "global_step": 479199, "epoch": 2852} {"train_loss": -12.639114379882812, "global_step": 479200, "epoch": 2852} {"train_loss": -12.761229515075684, "global_step": 479201, "epoch": 2852} {"train_loss": -12.804997444152832, "global_step": 479202, "epoch": 2852} {"train_loss": -12.688138961791992, "global_step": 479203, "epoch": 2852} {"train_loss": -12.559321403503418, "global_step": 479204, "epoch": 2852} {"train_loss": -12.642585754394531, "global_step": 479205, "epoch": 2852} {"train_loss": -12.769891738891602, "global_step": 479206, "epoch": 2852} {"train_loss": -12.423133850097656, "global_step": 479207, "epoch": 2852} {"train_loss": -12.875190734863281, "global_step": 479208, "epoch": 2852} {"train_loss": -12.755607604980469, "global_step": 479209, "epoch": 2852} {"train_loss": -12.793207168579102, "global_step": 479210, "epoch": 2852} {"train_loss": -12.432830810546875, "global_step": 479211, "epoch": 2852} {"train_loss": -12.821596145629883, "global_step": 479212, "epoch": 2852} {"train_loss": -12.625044822692871, "global_step": 479213, "epoch": 2852} {"train_loss": -12.280210494995117, "global_step": 479214, "epoch": 2852} {"train_loss": -12.474231719970703, "global_step": 479215, "epoch": 2852} {"train_loss": -11.958810806274414, "global_step": 479216, "epoch": 2852} {"train_loss": -11.88021183013916, "global_step": 479217, "epoch": 2852} {"train_loss": -11.479116439819336, "global_step": 479218, "epoch": 2852} {"train_loss": -11.161649703979492, "global_step": 479219, "epoch": 2852} {"train_loss": -12.15252685546875, "global_step": 479220, "epoch": 2852} {"train_loss": -9.210983276367188, "global_step": 479221, "epoch": 2852} {"train_loss": -10.466257095336914, "global_step": 479222, "epoch": 2852} {"train_loss": -11.791351318359375, "global_step": 479223, "epoch": 2852} {"train_loss": -10.869895935058594, "global_step": 479224, "epoch": 2852} {"train_loss": -11.358026504516602, "global_step": 479225, "epoch": 2852} {"train_loss": -11.254902839660645, "global_step": 479226, "epoch": 2852} {"train_loss": -11.382266998291016, "global_step": 479227, "epoch": 2852} {"train_loss": -11.065084457397461, "global_step": 479228, "epoch": 2852} {"train_loss": -10.04621696472168, "global_step": 479229, "epoch": 2852} {"train_loss": -10.68716812133789, "global_step": 479230, "epoch": 2852} {"train_loss": -11.047483444213867, "global_step": 479231, "epoch": 2852} {"train_loss": -9.742301940917969, "global_step": 479232, "epoch": 2852} {"train_loss": -11.306148529052734, "global_step": 479233, "epoch": 2852} {"train_loss": -9.395049095153809, "global_step": 479234, "epoch": 2852} {"train_loss": -11.01126480102539, "global_step": 479235, "epoch": 2852} {"train_loss": -9.598621368408203, "global_step": 479236, "epoch": 2852} {"train_loss": -10.792120933532715, "global_step": 479237, "epoch": 2852} {"train_loss": -10.323698043823242, "global_step": 479238, "epoch": 2852} {"train_loss": -11.05524730682373, "global_step": 479239, "epoch": 2852} {"train_loss": -10.537030220031738, "global_step": 479240, "epoch": 2852} {"train_loss": -10.808242797851562, "global_step": 479241, "epoch": 2852} {"train_loss": -10.296319961547852, "global_step": 479242, "epoch": 2852} {"train_loss": -11.516054153442383, "global_step": 479243, "epoch": 2852} {"train_loss": -11.360230445861816, "global_step": 479244, "epoch": 2852} {"train_loss": -11.78976821899414, "global_step": 479245, "epoch": 2852} {"train_loss": -11.382519721984863, "global_step": 479246, "epoch": 2852} {"train_loss": -11.040828704833984, "global_step": 479247, "epoch": 2852} {"train_loss": -11.527898788452148, "global_step": 479248, "epoch": 2852} {"train_loss": -11.150053977966309, "global_step": 479249, "epoch": 2852} {"train_loss": -11.881650924682617, "global_step": 479250, "epoch": 2852} {"train_loss": -11.551176071166992, "global_step": 479251, "epoch": 2852} {"train_loss": -11.893945693969727, "global_step": 479252, "epoch": 2852} {"train_loss": -11.95989990234375, "global_step": 479253, "epoch": 2852} {"train_loss": -12.15129566192627, "global_step": 479254, "epoch": 2852} {"train_loss": -11.927902221679688, "global_step": 479255, "epoch": 2852} {"train_loss": -12.02254867553711, "global_step": 479256, "epoch": 2852} {"train_loss": -12.221027374267578, "global_step": 479257, "epoch": 2852} {"train_loss": -11.958858489990234, "global_step": 479258, "epoch": 2852} {"train_loss": -12.117006301879883, "global_step": 479259, "epoch": 2852} {"train_loss": -11.757041931152344, "global_step": 479260, "epoch": 2852} {"train_loss": -12.625297546386719, "global_step": 479261, "epoch": 2852} {"train_loss": -12.068288803100586, "global_step": 479262, "epoch": 2852} {"train_loss": -12.279890060424805, "global_step": 479263, "epoch": 2852} {"train_loss": -12.477193832397461, "global_step": 479264, "epoch": 2852} {"train_loss": -12.296947479248047, "global_step": 479265, "epoch": 2852} {"train_loss": -12.342866897583008, "global_step": 479266, "epoch": 2852} {"train_loss": -12.229026794433594, "global_step": 479267, "epoch": 2852} {"train_loss": -12.13389778137207, "global_step": 479268, "epoch": 2852} {"train_loss": -11.891901016235352, "global_step": 479269, "epoch": 2852} {"train_loss": -11.987068176269531, "global_step": 479270, "epoch": 2852} {"train_loss": -12.081161499023438, "global_step": 479271, "epoch": 2852} {"train_loss": -11.947917938232422, "global_step": 479272, "epoch": 2852} {"train_loss": -12.232490539550781, "global_step": 479273, "epoch": 2852} {"train_loss": -11.611108779907227, "global_step": 479274, "epoch": 2852} {"train_loss": -11.630561828613281, "global_step": 479275, "epoch": 2852} {"train_loss": -12.035862922668457, "global_step": 479276, "epoch": 2852} {"train_loss": -11.503894805908203, "global_step": 479277, "epoch": 2852} {"train_loss": -11.588336944580078, "global_step": 479278, "epoch": 2852} {"train_loss": -10.922287940979004, "global_step": 479279, "epoch": 2852} {"train_loss": -11.368070602416992, "global_step": 479280, "epoch": 2852} {"train_loss": -11.53036880493164, "global_step": 479281, "epoch": 2852} {"train_loss": -11.903566360473633, "global_step": 479282, "epoch": 2852} {"train_loss": -10.791728019714355, "global_step": 479283, "epoch": 2852} {"train_loss": -12.545454025268555, "global_step": 479284, "epoch": 2852} {"train_loss": -11.270037651062012, "global_step": 479285, "epoch": 2852} {"train_loss": -11.84736442565918, "global_step": 479286, "epoch": 2852} {"train_loss": -11.675846099853516, "global_step": 479287, "epoch": 2852} {"train_loss": -11.121790885925293, "global_step": 479288, "epoch": 2852} {"train_loss": -11.725830078125, "global_step": 479289, "epoch": 2852} {"train_loss": -11.519832611083984, "global_step": 479290, "epoch": 2852} {"train_loss": -11.608087539672852, "global_step": 479291, "epoch": 2852} {"train_loss": -12.10285758972168, "global_step": 479292, "epoch": 2852} {"train_loss": -11.694632530212402, "global_step": 479293, "epoch": 2852} {"train_loss": -11.388707160949707, "global_step": 479294, "epoch": 2852} {"train_loss": -12.243770599365234, "global_step": 479295, "epoch": 2852} {"train_loss": -12.04184341430664, "global_step": 479296, "epoch": 2852} {"train_loss": -12.024112701416016, "global_step": 479297, "epoch": 2852} {"train_loss": -12.315513610839844, "global_step": 479298, "epoch": 2852} {"train_loss": -11.945825576782227, "global_step": 479299, "epoch": 2852} {"train_loss": -12.56710433959961, "global_step": 479300, "epoch": 2852} {"train_loss": -12.228582382202148, "global_step": 479301, "epoch": 2852} {"train_loss": -12.436004638671875, "global_step": 479302, "epoch": 2852} {"train_loss": -11.96333672886803, "global_step": 479303, "epoch": 2852, "val_loss": 319141.375} {"train_loss": -12.230372428894043, "global_step": 479304, "epoch": 2853} {"train_loss": -12.027103424072266, "global_step": 479305, "epoch": 2853} {"train_loss": -12.167707443237305, "global_step": 479306, "epoch": 2853} {"train_loss": -12.303722381591797, "global_step": 479307, "epoch": 2853} {"train_loss": -12.080520629882812, "global_step": 479308, "epoch": 2853} {"train_loss": -12.36251449584961, "global_step": 479309, "epoch": 2853} {"train_loss": -12.24612045288086, "global_step": 479310, "epoch": 2853} {"train_loss": -12.386869430541992, "global_step": 479311, "epoch": 2853} {"train_loss": -12.331279754638672, "global_step": 479312, "epoch": 2853} {"train_loss": -12.437223434448242, "global_step": 479313, "epoch": 2853} {"train_loss": -12.667142868041992, "global_step": 479314, "epoch": 2853} {"train_loss": -12.468109130859375, "global_step": 479315, "epoch": 2853} {"train_loss": -12.164302825927734, "global_step": 479316, "epoch": 2853} {"train_loss": -12.623886108398438, "global_step": 479317, "epoch": 2853} {"train_loss": -12.418668746948242, "global_step": 479318, "epoch": 2853} {"train_loss": -12.466547012329102, "global_step": 479319, "epoch": 2853} {"train_loss": -12.57748031616211, "global_step": 479320, "epoch": 2853} {"train_loss": -12.46700382232666, "global_step": 479321, "epoch": 2853} {"train_loss": -12.24523639678955, "global_step": 479322, "epoch": 2853} {"train_loss": -12.693727493286133, "global_step": 479323, "epoch": 2853} {"train_loss": -12.298370361328125, "global_step": 479324, "epoch": 2853} {"train_loss": -12.792468070983887, "global_step": 479325, "epoch": 2853} {"train_loss": -12.13825511932373, "global_step": 479326, "epoch": 2853} {"train_loss": -12.463933944702148, "global_step": 479327, "epoch": 2853} {"train_loss": -12.439823150634766, "global_step": 479328, "epoch": 2853} {"train_loss": -12.286649703979492, "global_step": 479329, "epoch": 2853} {"train_loss": -12.717605590820312, "global_step": 479330, "epoch": 2853} {"train_loss": -12.321060180664062, "global_step": 479331, "epoch": 2853} {"train_loss": -12.712684631347656, "global_step": 479332, "epoch": 2853} {"train_loss": -12.196100234985352, "global_step": 479333, "epoch": 2853} {"train_loss": -12.22813606262207, "global_step": 479334, "epoch": 2853} {"train_loss": -12.448065757751465, "global_step": 479335, "epoch": 2853} {"train_loss": -11.740612030029297, "global_step": 479336, "epoch": 2853} {"train_loss": -12.625835418701172, "global_step": 479337, "epoch": 2853} {"train_loss": -12.14509391784668, "global_step": 479338, "epoch": 2853} {"train_loss": -11.657958984375, "global_step": 479339, "epoch": 2853} {"train_loss": -12.200485229492188, "global_step": 479340, "epoch": 2853} {"train_loss": -11.008536338806152, "global_step": 479341, "epoch": 2853} {"train_loss": -11.86556339263916, "global_step": 479342, "epoch": 2853} {"train_loss": -12.449023246765137, "global_step": 479343, "epoch": 2853} {"train_loss": -11.670647621154785, "global_step": 479344, "epoch": 2853} {"train_loss": -11.612930297851562, "global_step": 479345, "epoch": 2853} {"train_loss": -12.13006591796875, "global_step": 479346, "epoch": 2853} {"train_loss": -11.57432746887207, "global_step": 479347, "epoch": 2853} {"train_loss": -12.149909973144531, "global_step": 479348, "epoch": 2853} {"train_loss": -11.794078826904297, "global_step": 479349, "epoch": 2853} {"train_loss": -12.037628173828125, "global_step": 479350, "epoch": 2853} {"train_loss": -11.655144691467285, "global_step": 479351, "epoch": 2853} {"train_loss": -12.172571182250977, "global_step": 479352, "epoch": 2853} {"train_loss": -11.171304702758789, "global_step": 479353, "epoch": 2853} {"train_loss": -12.16160774230957, "global_step": 479354, "epoch": 2853} {"train_loss": -11.747713088989258, "global_step": 479355, "epoch": 2853} {"train_loss": -11.62539291381836, "global_step": 479356, "epoch": 2853} {"train_loss": -12.101909637451172, "global_step": 479357, "epoch": 2853} {"train_loss": -11.542875289916992, "global_step": 479358, "epoch": 2853} {"train_loss": -11.201261520385742, "global_step": 479359, "epoch": 2853} {"train_loss": -12.5121488571167, "global_step": 479360, "epoch": 2853} {"train_loss": -11.678038597106934, "global_step": 479361, "epoch": 2853} {"train_loss": -12.314603805541992, "global_step": 479362, "epoch": 2853} {"train_loss": -11.862096786499023, "global_step": 479363, "epoch": 2853} {"train_loss": -12.021383285522461, "global_step": 479364, "epoch": 2853} {"train_loss": -12.130462646484375, "global_step": 479365, "epoch": 2853} {"train_loss": -11.895277976989746, "global_step": 479366, "epoch": 2853} {"train_loss": -12.621288299560547, "global_step": 479367, "epoch": 2853} {"train_loss": -11.757450103759766, "global_step": 479368, "epoch": 2853} {"train_loss": -12.419536590576172, "global_step": 479369, "epoch": 2853} {"train_loss": -12.079543113708496, "global_step": 479370, "epoch": 2853} {"train_loss": -12.421079635620117, "global_step": 479371, "epoch": 2853} {"train_loss": -12.374408721923828, "global_step": 479372, "epoch": 2853} {"train_loss": -12.507091522216797, "global_step": 479373, "epoch": 2853} {"train_loss": -12.223045349121094, "global_step": 479374, "epoch": 2853} {"train_loss": -12.372146606445312, "global_step": 479375, "epoch": 2853} {"train_loss": -12.652944564819336, "global_step": 479376, "epoch": 2853} {"train_loss": -12.410749435424805, "global_step": 479377, "epoch": 2853} {"train_loss": -12.327180862426758, "global_step": 479378, "epoch": 2853} {"train_loss": -12.026060104370117, "global_step": 479379, "epoch": 2853} {"train_loss": -12.560362815856934, "global_step": 479380, "epoch": 2853} {"train_loss": -12.38747787475586, "global_step": 479381, "epoch": 2853} {"train_loss": -12.380609512329102, "global_step": 479382, "epoch": 2853} {"train_loss": -12.68929386138916, "global_step": 479383, "epoch": 2853} {"train_loss": -12.320676803588867, "global_step": 479384, "epoch": 2853} {"train_loss": -12.56460189819336, "global_step": 479385, "epoch": 2853} {"train_loss": -12.64599609375, "global_step": 479386, "epoch": 2853} {"train_loss": -12.595739364624023, "global_step": 479387, "epoch": 2853} {"train_loss": -12.601253509521484, "global_step": 479388, "epoch": 2853} {"train_loss": -12.669344902038574, "global_step": 479389, "epoch": 2853} {"train_loss": -12.841009140014648, "global_step": 479390, "epoch": 2853} {"train_loss": -12.413750648498535, "global_step": 479391, "epoch": 2853} {"train_loss": -12.751007080078125, "global_step": 479392, "epoch": 2853} {"train_loss": -12.730799674987793, "global_step": 479393, "epoch": 2853} {"train_loss": -12.667131423950195, "global_step": 479394, "epoch": 2853} {"train_loss": -12.653139114379883, "global_step": 479395, "epoch": 2853} {"train_loss": -12.84636402130127, "global_step": 479396, "epoch": 2853} {"train_loss": -12.616137504577637, "global_step": 479397, "epoch": 2853} {"train_loss": -12.979004859924316, "global_step": 479398, "epoch": 2853} {"train_loss": -12.664989471435547, "global_step": 479399, "epoch": 2853} {"train_loss": -12.966413497924805, "global_step": 479400, "epoch": 2853} {"train_loss": -12.709978103637695, "global_step": 479401, "epoch": 2853} {"train_loss": -12.74150562286377, "global_step": 479402, "epoch": 2853} {"train_loss": -12.705371856689453, "global_step": 479403, "epoch": 2853} {"train_loss": -12.75548267364502, "global_step": 479404, "epoch": 2853} {"train_loss": -12.676309585571289, "global_step": 479405, "epoch": 2853} {"train_loss": -12.816335678100586, "global_step": 479406, "epoch": 2853} {"train_loss": -12.740809440612793, "global_step": 479407, "epoch": 2853} {"train_loss": -12.67381763458252, "global_step": 479408, "epoch": 2853} {"train_loss": -12.720479965209961, "global_step": 479409, "epoch": 2853} {"train_loss": -12.736686706542969, "global_step": 479410, "epoch": 2853} {"train_loss": -12.812051773071289, "global_step": 479411, "epoch": 2853} {"train_loss": -12.613143920898438, "global_step": 479412, "epoch": 2853} {"train_loss": -12.760664939880371, "global_step": 479413, "epoch": 2853} {"train_loss": -12.651750564575195, "global_step": 479414, "epoch": 2853} {"train_loss": -12.89089584350586, "global_step": 479415, "epoch": 2853} {"train_loss": -12.817678451538086, "global_step": 479416, "epoch": 2853} {"train_loss": -12.761041641235352, "global_step": 479417, "epoch": 2853} {"train_loss": -12.94543743133545, "global_step": 479418, "epoch": 2853} {"train_loss": -12.919809341430664, "global_step": 479419, "epoch": 2853} {"train_loss": -12.710426330566406, "global_step": 479420, "epoch": 2853} {"train_loss": -12.876775741577148, "global_step": 479421, "epoch": 2853} {"train_loss": -12.902006149291992, "global_step": 479422, "epoch": 2853} {"train_loss": -12.800963401794434, "global_step": 479423, "epoch": 2853} {"train_loss": -12.684542655944824, "global_step": 479424, "epoch": 2853} {"train_loss": -12.796941757202148, "global_step": 479425, "epoch": 2853} {"train_loss": -12.669814109802246, "global_step": 479426, "epoch": 2853} {"train_loss": -12.699506759643555, "global_step": 479427, "epoch": 2853} {"train_loss": -12.888490676879883, "global_step": 479428, "epoch": 2853} {"train_loss": -12.322632789611816, "global_step": 479429, "epoch": 2853} {"train_loss": -12.442523956298828, "global_step": 479430, "epoch": 2853} {"train_loss": -12.665031433105469, "global_step": 479431, "epoch": 2853} {"train_loss": -12.565820693969727, "global_step": 479432, "epoch": 2853} {"train_loss": -12.724176406860352, "global_step": 479433, "epoch": 2853} {"train_loss": -12.706029891967773, "global_step": 479434, "epoch": 2853} {"train_loss": -12.572498321533203, "global_step": 479435, "epoch": 2853} {"train_loss": -12.60702133178711, "global_step": 479436, "epoch": 2853} {"train_loss": -12.325078964233398, "global_step": 479437, "epoch": 2853} {"train_loss": -11.334285736083984, "global_step": 479438, "epoch": 2853} {"train_loss": -12.819829940795898, "global_step": 479439, "epoch": 2853} {"train_loss": -11.196279525756836, "global_step": 479440, "epoch": 2853} {"train_loss": -12.595979690551758, "global_step": 479441, "epoch": 2853} {"train_loss": -11.541382789611816, "global_step": 479442, "epoch": 2853} {"train_loss": -11.356582641601562, "global_step": 479443, "epoch": 2853} {"train_loss": -12.698928833007812, "global_step": 479444, "epoch": 2853} {"train_loss": -11.127843856811523, "global_step": 479445, "epoch": 2853} {"train_loss": -10.975017547607422, "global_step": 479446, "epoch": 2853} {"train_loss": -12.452829360961914, "global_step": 479447, "epoch": 2853} {"train_loss": -12.419589042663574, "global_step": 479448, "epoch": 2853} {"train_loss": -12.040885925292969, "global_step": 479449, "epoch": 2853} {"train_loss": -12.540318489074707, "global_step": 479450, "epoch": 2853} {"train_loss": -11.445064544677734, "global_step": 479451, "epoch": 2853} {"train_loss": -12.394227981567383, "global_step": 479452, "epoch": 2853} {"train_loss": -11.40888786315918, "global_step": 479453, "epoch": 2853} {"train_loss": -10.97691535949707, "global_step": 479454, "epoch": 2853} {"train_loss": -11.994977951049805, "global_step": 479455, "epoch": 2853} {"train_loss": -10.228727340698242, "global_step": 479456, "epoch": 2853} {"train_loss": -10.72036075592041, "global_step": 479457, "epoch": 2853} {"train_loss": -10.954126358032227, "global_step": 479458, "epoch": 2853} {"train_loss": -11.171003341674805, "global_step": 479459, "epoch": 2853} {"train_loss": -11.66328239440918, "global_step": 479460, "epoch": 2853} {"train_loss": -11.366132736206055, "global_step": 479461, "epoch": 2853} {"train_loss": -10.986089706420898, "global_step": 479462, "epoch": 2853} {"train_loss": -11.459471702575684, "global_step": 479463, "epoch": 2853} {"train_loss": -10.741272926330566, "global_step": 479464, "epoch": 2853} {"train_loss": -12.440691947937012, "global_step": 479465, "epoch": 2853} {"train_loss": -11.864252090454102, "global_step": 479466, "epoch": 2853} {"train_loss": -12.170158386230469, "global_step": 479467, "epoch": 2853} {"train_loss": -11.188911437988281, "global_step": 479468, "epoch": 2853} {"train_loss": -11.378974914550781, "global_step": 479469, "epoch": 2853} {"train_loss": -11.904228210449219, "global_step": 479470, "epoch": 2853} {"train_loss": -12.240339983077277, "global_step": 479471, "epoch": 2853, "val_loss": 318745.375} {"train_loss": -12.13020133972168, "global_step": 479472, "epoch": 2854} {"train_loss": -12.201120376586914, "global_step": 479473, "epoch": 2854} {"train_loss": -12.038797378540039, "global_step": 479474, "epoch": 2854} {"train_loss": -12.317459106445312, "global_step": 479475, "epoch": 2854} {"train_loss": -11.95704174041748, "global_step": 479476, "epoch": 2854} {"train_loss": -12.007020950317383, "global_step": 479477, "epoch": 2854} {"train_loss": -12.216377258300781, "global_step": 479478, "epoch": 2854} {"train_loss": -12.33514404296875, "global_step": 479479, "epoch": 2854} {"train_loss": -12.599031448364258, "global_step": 479480, "epoch": 2854} {"train_loss": -12.340795516967773, "global_step": 479481, "epoch": 2854} {"train_loss": -12.1362943649292, "global_step": 479482, "epoch": 2854} {"train_loss": -12.540457725524902, "global_step": 479483, "epoch": 2854} {"train_loss": -12.191183090209961, "global_step": 479484, "epoch": 2854} {"train_loss": -12.363737106323242, "global_step": 479485, "epoch": 2854} {"train_loss": -12.1889066696167, "global_step": 479486, "epoch": 2854} {"train_loss": -12.023303985595703, "global_step": 479487, "epoch": 2854} {"train_loss": -12.76151180267334, "global_step": 479488, "epoch": 2854} {"train_loss": -12.139320373535156, "global_step": 479489, "epoch": 2854} {"train_loss": -12.36837100982666, "global_step": 479490, "epoch": 2854} {"train_loss": -11.982452392578125, "global_step": 479491, "epoch": 2854} {"train_loss": -12.269107818603516, "global_step": 479492, "epoch": 2854} {"train_loss": -12.464956283569336, "global_step": 479493, "epoch": 2854} {"train_loss": -12.403417587280273, "global_step": 479494, "epoch": 2854} {"train_loss": -12.4273681640625, "global_step": 479495, "epoch": 2854} {"train_loss": -12.286688804626465, "global_step": 479496, "epoch": 2854} {"train_loss": -12.274948120117188, "global_step": 479497, "epoch": 2854} {"train_loss": -12.096677780151367, "global_step": 479498, "epoch": 2854} {"train_loss": -11.91387939453125, "global_step": 479499, "epoch": 2854} {"train_loss": -12.199199676513672, "global_step": 479500, "epoch": 2854} {"train_loss": -12.30098819732666, "global_step": 479501, "epoch": 2854} {"train_loss": -12.450766563415527, "global_step": 479502, "epoch": 2854} {"train_loss": -12.288660049438477, "global_step": 479503, "epoch": 2854} {"train_loss": -12.3804349899292, "global_step": 479504, "epoch": 2854} {"train_loss": -12.62797737121582, "global_step": 479505, "epoch": 2854} {"train_loss": -12.401517868041992, "global_step": 479506, "epoch": 2854} {"train_loss": -12.602558135986328, "global_step": 479507, "epoch": 2854} {"train_loss": -12.347036361694336, "global_step": 479508, "epoch": 2854} {"train_loss": -12.810287475585938, "global_step": 479509, "epoch": 2854} {"train_loss": -12.533199310302734, "global_step": 479510, "epoch": 2854} {"train_loss": -11.979982376098633, "global_step": 479511, "epoch": 2854} {"train_loss": -12.541399002075195, "global_step": 479512, "epoch": 2854} {"train_loss": -12.37794017791748, "global_step": 479513, "epoch": 2854} {"train_loss": -12.714797019958496, "global_step": 479514, "epoch": 2854} {"train_loss": -12.151638984680176, "global_step": 479515, "epoch": 2854} {"train_loss": -12.354866027832031, "global_step": 479516, "epoch": 2854} {"train_loss": -12.060857772827148, "global_step": 479517, "epoch": 2854} {"train_loss": -12.370410919189453, "global_step": 479518, "epoch": 2854} {"train_loss": -12.364526748657227, "global_step": 479519, "epoch": 2854} {"train_loss": -12.478161811828613, "global_step": 479520, "epoch": 2854} {"train_loss": -12.73713207244873, "global_step": 479521, "epoch": 2854} {"train_loss": -12.493368148803711, "global_step": 479522, "epoch": 2854} {"train_loss": -12.628073692321777, "global_step": 479523, "epoch": 2854} {"train_loss": -12.752943992614746, "global_step": 479524, "epoch": 2854} {"train_loss": -12.585657119750977, "global_step": 479525, "epoch": 2854} {"train_loss": -12.672131538391113, "global_step": 479526, "epoch": 2854} {"train_loss": -12.76894760131836, "global_step": 479527, "epoch": 2854} {"train_loss": -12.632649421691895, "global_step": 479528, "epoch": 2854} {"train_loss": -12.653709411621094, "global_step": 479529, "epoch": 2854} {"train_loss": -12.85865306854248, "global_step": 479530, "epoch": 2854} {"train_loss": -12.859590530395508, "global_step": 479531, "epoch": 2854} {"train_loss": -12.73811149597168, "global_step": 479532, "epoch": 2854} {"train_loss": -12.900678634643555, "global_step": 479533, "epoch": 2854} {"train_loss": -12.694921493530273, "global_step": 479534, "epoch": 2854} {"train_loss": -12.546712875366211, "global_step": 479535, "epoch": 2854} {"train_loss": -12.821115493774414, "global_step": 479536, "epoch": 2854} {"train_loss": -12.473296165466309, "global_step": 479537, "epoch": 2854} {"train_loss": -12.903631210327148, "global_step": 479538, "epoch": 2854} {"train_loss": -12.740281105041504, "global_step": 479539, "epoch": 2854} {"train_loss": -12.685548782348633, "global_step": 479540, "epoch": 2854} {"train_loss": -12.646501541137695, "global_step": 479541, "epoch": 2854} {"train_loss": -13.041582107543945, "global_step": 479542, "epoch": 2854} {"train_loss": -13.070047378540039, "global_step": 479543, "epoch": 2854} {"train_loss": -12.793212890625, "global_step": 479544, "epoch": 2854} {"train_loss": -12.942712783813477, "global_step": 479545, "epoch": 2854} {"train_loss": -12.86326789855957, "global_step": 479546, "epoch": 2854} {"train_loss": -12.864408493041992, "global_step": 479547, "epoch": 2854} {"train_loss": -12.86844253540039, "global_step": 479548, "epoch": 2854} {"train_loss": -12.648889541625977, "global_step": 479549, "epoch": 2854} {"train_loss": -12.588632583618164, "global_step": 479550, "epoch": 2854} {"train_loss": -12.758625984191895, "global_step": 479551, "epoch": 2854} {"train_loss": -12.925799369812012, "global_step": 479552, "epoch": 2854} {"train_loss": -12.687609672546387, "global_step": 479553, "epoch": 2854} {"train_loss": -13.014915466308594, "global_step": 479554, "epoch": 2854} {"train_loss": -12.762659072875977, "global_step": 479555, "epoch": 2854} {"train_loss": -12.649085998535156, "global_step": 479556, "epoch": 2854} {"train_loss": -12.750076293945312, "global_step": 479557, "epoch": 2854} {"train_loss": -12.865915298461914, "global_step": 479558, "epoch": 2854} {"train_loss": -13.110912322998047, "global_step": 479559, "epoch": 2854} {"train_loss": -12.912141799926758, "global_step": 479560, "epoch": 2854} {"train_loss": -12.596946716308594, "global_step": 479561, "epoch": 2854} {"train_loss": -12.601665496826172, "global_step": 479562, "epoch": 2854} {"train_loss": -12.417160034179688, "global_step": 479563, "epoch": 2854} {"train_loss": -12.825855255126953, "global_step": 479564, "epoch": 2854} {"train_loss": -12.904058456420898, "global_step": 479565, "epoch": 2854} {"train_loss": -12.827006340026855, "global_step": 479566, "epoch": 2854} {"train_loss": -12.516639709472656, "global_step": 479567, "epoch": 2854} {"train_loss": -12.696921348571777, "global_step": 479568, "epoch": 2854} {"train_loss": -13.133723258972168, "global_step": 479569, "epoch": 2854} {"train_loss": -12.67135238647461, "global_step": 479570, "epoch": 2854} {"train_loss": -12.114065170288086, "global_step": 479571, "epoch": 2854} {"train_loss": -12.155172348022461, "global_step": 479572, "epoch": 2854} {"train_loss": -12.75967788696289, "global_step": 479573, "epoch": 2854} {"train_loss": -12.679341316223145, "global_step": 479574, "epoch": 2854} {"train_loss": -12.771217346191406, "global_step": 479575, "epoch": 2854} {"train_loss": -12.639695167541504, "global_step": 479576, "epoch": 2854} {"train_loss": -13.035072326660156, "global_step": 479577, "epoch": 2854} {"train_loss": -12.767400741577148, "global_step": 479578, "epoch": 2854} {"train_loss": -12.647064208984375, "global_step": 479579, "epoch": 2854} {"train_loss": -12.77961540222168, "global_step": 479580, "epoch": 2854} {"train_loss": -12.147184371948242, "global_step": 479581, "epoch": 2854} {"train_loss": -12.193414688110352, "global_step": 479582, "epoch": 2854} {"train_loss": -10.72956371307373, "global_step": 479583, "epoch": 2854} {"train_loss": -11.595597267150879, "global_step": 479584, "epoch": 2854} {"train_loss": -11.718928337097168, "global_step": 479585, "epoch": 2854} {"train_loss": -10.851227760314941, "global_step": 479586, "epoch": 2854} {"train_loss": -10.817867279052734, "global_step": 479587, "epoch": 2854} {"train_loss": -10.126970291137695, "global_step": 479588, "epoch": 2854} {"train_loss": -12.02896499633789, "global_step": 479589, "epoch": 2854} {"train_loss": -10.939874649047852, "global_step": 479590, "epoch": 2854} {"train_loss": -9.018850326538086, "global_step": 479591, "epoch": 2854} {"train_loss": -10.4305419921875, "global_step": 479592, "epoch": 2854} {"train_loss": -10.630658149719238, "global_step": 479593, "epoch": 2854} {"train_loss": -10.944429397583008, "global_step": 479594, "epoch": 2854} {"train_loss": -10.78814697265625, "global_step": 479595, "epoch": 2854} {"train_loss": -11.906624794006348, "global_step": 479596, "epoch": 2854} {"train_loss": -11.138711929321289, "global_step": 479597, "epoch": 2854} {"train_loss": -10.871315956115723, "global_step": 479598, "epoch": 2854} {"train_loss": -10.816133499145508, "global_step": 479599, "epoch": 2854} {"train_loss": -11.253849029541016, "global_step": 479600, "epoch": 2854} {"train_loss": -10.462279319763184, "global_step": 479601, "epoch": 2854} {"train_loss": -10.901237487792969, "global_step": 479602, "epoch": 2854} {"train_loss": -10.982490539550781, "global_step": 479603, "epoch": 2854} {"train_loss": -10.161038398742676, "global_step": 479604, "epoch": 2854} {"train_loss": -11.880830764770508, "global_step": 479605, "epoch": 2854} {"train_loss": -11.345569610595703, "global_step": 479606, "epoch": 2854} {"train_loss": -11.01829719543457, "global_step": 479607, "epoch": 2854} {"train_loss": -12.161640167236328, "global_step": 479608, "epoch": 2854} {"train_loss": -11.397963523864746, "global_step": 479609, "epoch": 2854} {"train_loss": -11.82650375366211, "global_step": 479610, "epoch": 2854} {"train_loss": -12.268087387084961, "global_step": 479611, "epoch": 2854} {"train_loss": -11.743511199951172, "global_step": 479612, "epoch": 2854} {"train_loss": -11.197931289672852, "global_step": 479613, "epoch": 2854} {"train_loss": -12.305497169494629, "global_step": 479614, "epoch": 2854} {"train_loss": -11.267663955688477, "global_step": 479615, "epoch": 2854} {"train_loss": -11.197245597839355, "global_step": 479616, "epoch": 2854} {"train_loss": -11.81208324432373, "global_step": 479617, "epoch": 2854} {"train_loss": -11.204521179199219, "global_step": 479618, "epoch": 2854} {"train_loss": -11.999135971069336, "global_step": 479619, "epoch": 2854} {"train_loss": -11.979019165039062, "global_step": 479620, "epoch": 2854} {"train_loss": -12.019908905029297, "global_step": 479621, "epoch": 2854} {"train_loss": -11.49205207824707, "global_step": 479622, "epoch": 2854} {"train_loss": -12.123870849609375, "global_step": 479623, "epoch": 2854} {"train_loss": -11.86872673034668, "global_step": 479624, "epoch": 2854} {"train_loss": -12.007343292236328, "global_step": 479625, "epoch": 2854} {"train_loss": -11.837835311889648, "global_step": 479626, "epoch": 2854} {"train_loss": -11.981646537780762, "global_step": 479627, "epoch": 2854} {"train_loss": -12.034358978271484, "global_step": 479628, "epoch": 2854} {"train_loss": -11.670458793640137, "global_step": 479629, "epoch": 2854} {"train_loss": -12.321659088134766, "global_step": 479630, "epoch": 2854} {"train_loss": -11.522263526916504, "global_step": 479631, "epoch": 2854} {"train_loss": -12.2769193649292, "global_step": 479632, "epoch": 2854} {"train_loss": -11.848861694335938, "global_step": 479633, "epoch": 2854} {"train_loss": -11.903857231140137, "global_step": 479634, "epoch": 2854} {"train_loss": -11.974519729614258, "global_step": 479635, "epoch": 2854} {"train_loss": -12.002161026000977, "global_step": 479636, "epoch": 2854} {"train_loss": -11.999926567077637, "global_step": 479637, "epoch": 2854} {"train_loss": -11.86956787109375, "global_step": 479638, "epoch": 2854} {"train_loss": -12.173169561794825, "global_step": 479639, "epoch": 2854, "val_loss": 313291.09375} {"train_loss": -11.52569580078125, "global_step": 479640, "epoch": 2855} {"train_loss": -12.156007766723633, "global_step": 479641, "epoch": 2855} {"train_loss": -11.81165885925293, "global_step": 479642, "epoch": 2855} {"train_loss": -12.382476806640625, "global_step": 479643, "epoch": 2855} {"train_loss": -11.55738639831543, "global_step": 479644, "epoch": 2855} {"train_loss": -11.824070930480957, "global_step": 479645, "epoch": 2855} {"train_loss": -12.077494621276855, "global_step": 479646, "epoch": 2855} {"train_loss": -11.993938446044922, "global_step": 479647, "epoch": 2855} {"train_loss": -11.509054183959961, "global_step": 479648, "epoch": 2855} {"train_loss": -11.482269287109375, "global_step": 479649, "epoch": 2855} {"train_loss": -12.051493644714355, "global_step": 479650, "epoch": 2855} {"train_loss": -11.422607421875, "global_step": 479651, "epoch": 2855} {"train_loss": -12.006684303283691, "global_step": 479652, "epoch": 2855} {"train_loss": -10.970633506774902, "global_step": 479653, "epoch": 2855} {"train_loss": -12.155376434326172, "global_step": 479654, "epoch": 2855} {"train_loss": -11.458501815795898, "global_step": 479655, "epoch": 2855} {"train_loss": -11.648513793945312, "global_step": 479656, "epoch": 2855} {"train_loss": -10.935556411743164, "global_step": 479657, "epoch": 2855} {"train_loss": -10.703913688659668, "global_step": 479658, "epoch": 2855} {"train_loss": -11.482658386230469, "global_step": 479659, "epoch": 2855} {"train_loss": -11.310033798217773, "global_step": 479660, "epoch": 2855} {"train_loss": -11.429193496704102, "global_step": 479661, "epoch": 2855} {"train_loss": -11.828350067138672, "global_step": 479662, "epoch": 2855} {"train_loss": -11.706951141357422, "global_step": 479663, "epoch": 2855} {"train_loss": -12.32004165649414, "global_step": 479664, "epoch": 2855} {"train_loss": -11.845531463623047, "global_step": 479665, "epoch": 2855} {"train_loss": -12.432234764099121, "global_step": 479666, "epoch": 2855} {"train_loss": -11.865951538085938, "global_step": 479667, "epoch": 2855} {"train_loss": -12.25191593170166, "global_step": 479668, "epoch": 2855} {"train_loss": -12.276266098022461, "global_step": 479669, "epoch": 2855} {"train_loss": -12.067304611206055, "global_step": 479670, "epoch": 2855} {"train_loss": -12.205554962158203, "global_step": 479671, "epoch": 2855} {"train_loss": -11.80720329284668, "global_step": 479672, "epoch": 2855} {"train_loss": -12.338969230651855, "global_step": 479673, "epoch": 2855} {"train_loss": -11.484360694885254, "global_step": 479674, "epoch": 2855} {"train_loss": -11.820436477661133, "global_step": 479675, "epoch": 2855} {"train_loss": -12.195901870727539, "global_step": 479676, "epoch": 2855} {"train_loss": -12.056974411010742, "global_step": 479677, "epoch": 2855} {"train_loss": -12.325372695922852, "global_step": 479678, "epoch": 2855} {"train_loss": -12.23664665222168, "global_step": 479679, "epoch": 2855} {"train_loss": -12.513432502746582, "global_step": 479680, "epoch": 2855} {"train_loss": -12.319724082946777, "global_step": 479681, "epoch": 2855} {"train_loss": -12.348129272460938, "global_step": 479682, "epoch": 2855} {"train_loss": -12.373221397399902, "global_step": 479683, "epoch": 2855} {"train_loss": -12.282064437866211, "global_step": 479684, "epoch": 2855} {"train_loss": -12.603650093078613, "global_step": 479685, "epoch": 2855} {"train_loss": -12.341161727905273, "global_step": 479686, "epoch": 2855} {"train_loss": -12.691923141479492, "global_step": 479687, "epoch": 2855} {"train_loss": -12.531597137451172, "global_step": 479688, "epoch": 2855} {"train_loss": -12.753375053405762, "global_step": 479689, "epoch": 2855} {"train_loss": -12.652860641479492, "global_step": 479690, "epoch": 2855} {"train_loss": -12.55243968963623, "global_step": 479691, "epoch": 2855} {"train_loss": -12.707282066345215, "global_step": 479692, "epoch": 2855} {"train_loss": -12.786861419677734, "global_step": 479693, "epoch": 2855} {"train_loss": -12.454715728759766, "global_step": 479694, "epoch": 2855} {"train_loss": -12.66569995880127, "global_step": 479695, "epoch": 2855} {"train_loss": -12.747275352478027, "global_step": 479696, "epoch": 2855} {"train_loss": -12.78904914855957, "global_step": 479697, "epoch": 2855} {"train_loss": -12.865452766418457, "global_step": 479698, "epoch": 2855} {"train_loss": -12.733040809631348, "global_step": 479699, "epoch": 2855} {"train_loss": -12.74869441986084, "global_step": 479700, "epoch": 2855} {"train_loss": -12.590265274047852, "global_step": 479701, "epoch": 2855} {"train_loss": -12.73331356048584, "global_step": 479702, "epoch": 2855} {"train_loss": -12.617999076843262, "global_step": 479703, "epoch": 2855} {"train_loss": -12.624305725097656, "global_step": 479704, "epoch": 2855} {"train_loss": -12.628669738769531, "global_step": 479705, "epoch": 2855} {"train_loss": -12.588088035583496, "global_step": 479706, "epoch": 2855} {"train_loss": -12.49453353881836, "global_step": 479707, "epoch": 2855} {"train_loss": -12.45353889465332, "global_step": 479708, "epoch": 2855} {"train_loss": -12.804044723510742, "global_step": 479709, "epoch": 2855} {"train_loss": -12.43421745300293, "global_step": 479710, "epoch": 2855} {"train_loss": -12.924065589904785, "global_step": 479711, "epoch": 2855} {"train_loss": -12.7360200881958, "global_step": 479712, "epoch": 2855} {"train_loss": -12.638444900512695, "global_step": 479713, "epoch": 2855} {"train_loss": -12.70460319519043, "global_step": 479714, "epoch": 2855} {"train_loss": -12.71615982055664, "global_step": 479715, "epoch": 2855} {"train_loss": -12.680240631103516, "global_step": 479716, "epoch": 2855} {"train_loss": -12.786130905151367, "global_step": 479717, "epoch": 2855} {"train_loss": -12.653824806213379, "global_step": 479718, "epoch": 2855} {"train_loss": -12.952356338500977, "global_step": 479719, "epoch": 2855} {"train_loss": -12.693016052246094, "global_step": 479720, "epoch": 2855} {"train_loss": -12.86295223236084, "global_step": 479721, "epoch": 2855} {"train_loss": -12.50143814086914, "global_step": 479722, "epoch": 2855} {"train_loss": -12.733895301818848, "global_step": 479723, "epoch": 2855} {"train_loss": -12.64285659790039, "global_step": 479724, "epoch": 2855} {"train_loss": -12.907102584838867, "global_step": 479725, "epoch": 2855} {"train_loss": -12.651830673217773, "global_step": 479726, "epoch": 2855} {"train_loss": -12.84797191619873, "global_step": 479727, "epoch": 2855} {"train_loss": -12.782254219055176, "global_step": 479728, "epoch": 2855} {"train_loss": -12.829473495483398, "global_step": 479729, "epoch": 2855} {"train_loss": -12.874814987182617, "global_step": 479730, "epoch": 2855} {"train_loss": -12.576841354370117, "global_step": 479731, "epoch": 2855} {"train_loss": -12.924846649169922, "global_step": 479732, "epoch": 2855} {"train_loss": -12.425518989562988, "global_step": 479733, "epoch": 2855} {"train_loss": -12.826513290405273, "global_step": 479734, "epoch": 2855} {"train_loss": -12.876506805419922, "global_step": 479735, "epoch": 2855} {"train_loss": -12.853147506713867, "global_step": 479736, "epoch": 2855} {"train_loss": -12.988188743591309, "global_step": 479737, "epoch": 2855} {"train_loss": -12.703749656677246, "global_step": 479738, "epoch": 2855} {"train_loss": -12.681083679199219, "global_step": 479739, "epoch": 2855} {"train_loss": -13.040586471557617, "global_step": 479740, "epoch": 2855} {"train_loss": -12.723384857177734, "global_step": 479741, "epoch": 2855} {"train_loss": -12.928348541259766, "global_step": 479742, "epoch": 2855} {"train_loss": -12.798766136169434, "global_step": 479743, "epoch": 2855} {"train_loss": -12.628747940063477, "global_step": 479744, "epoch": 2855} {"train_loss": -12.746438980102539, "global_step": 479745, "epoch": 2855} {"train_loss": -12.684597969055176, "global_step": 479746, "epoch": 2855} {"train_loss": -13.060263633728027, "global_step": 479747, "epoch": 2855} {"train_loss": -12.699151992797852, "global_step": 479748, "epoch": 2855} {"train_loss": -12.622543334960938, "global_step": 479749, "epoch": 2855} {"train_loss": -12.959714889526367, "global_step": 479750, "epoch": 2855} {"train_loss": -12.656387329101562, "global_step": 479751, "epoch": 2855} {"train_loss": -12.927176475524902, "global_step": 479752, "epoch": 2855} {"train_loss": -11.55669116973877, "global_step": 479753, "epoch": 2855} {"train_loss": -11.807779312133789, "global_step": 479754, "epoch": 2855} {"train_loss": -12.52357292175293, "global_step": 479755, "epoch": 2855} {"train_loss": -12.347221374511719, "global_step": 479756, "epoch": 2855} {"train_loss": -12.66458797454834, "global_step": 479757, "epoch": 2855} {"train_loss": -12.175529479980469, "global_step": 479758, "epoch": 2855} {"train_loss": -12.195060729980469, "global_step": 479759, "epoch": 2855} {"train_loss": -12.838271141052246, "global_step": 479760, "epoch": 2855} {"train_loss": -12.431622505187988, "global_step": 479761, "epoch": 2855} {"train_loss": -12.602025985717773, "global_step": 479762, "epoch": 2855} {"train_loss": -12.183897018432617, "global_step": 479763, "epoch": 2855} {"train_loss": -13.000391006469727, "global_step": 479764, "epoch": 2855} {"train_loss": -12.391874313354492, "global_step": 479765, "epoch": 2855} {"train_loss": -12.27083969116211, "global_step": 479766, "epoch": 2855} {"train_loss": -13.062702178955078, "global_step": 479767, "epoch": 2855} {"train_loss": -12.571331977844238, "global_step": 479768, "epoch": 2855} {"train_loss": -12.766742706298828, "global_step": 479769, "epoch": 2855} {"train_loss": -12.587305068969727, "global_step": 479770, "epoch": 2855} {"train_loss": -12.44387435913086, "global_step": 479771, "epoch": 2855} {"train_loss": -12.598688125610352, "global_step": 479772, "epoch": 2855} {"train_loss": -12.344657897949219, "global_step": 479773, "epoch": 2855} {"train_loss": -12.423858642578125, "global_step": 479774, "epoch": 2855} {"train_loss": -12.554633140563965, "global_step": 479775, "epoch": 2855} {"train_loss": -13.007049560546875, "global_step": 479776, "epoch": 2855} {"train_loss": -12.550302505493164, "global_step": 479777, "epoch": 2855} {"train_loss": -12.380599975585938, "global_step": 479778, "epoch": 2855} {"train_loss": -12.594892501831055, "global_step": 479779, "epoch": 2855} {"train_loss": -12.137984275817871, "global_step": 479780, "epoch": 2855} {"train_loss": -11.982216835021973, "global_step": 479781, "epoch": 2855} {"train_loss": -12.897241592407227, "global_step": 479782, "epoch": 2855} {"train_loss": -12.141288757324219, "global_step": 479783, "epoch": 2855} {"train_loss": -12.471774101257324, "global_step": 479784, "epoch": 2855} {"train_loss": -12.193083763122559, "global_step": 479785, "epoch": 2855} {"train_loss": -12.79190731048584, "global_step": 479786, "epoch": 2855} {"train_loss": -12.100858688354492, "global_step": 479787, "epoch": 2855} {"train_loss": -12.540645599365234, "global_step": 479788, "epoch": 2855} {"train_loss": -11.611681938171387, "global_step": 479789, "epoch": 2855} {"train_loss": -12.3526611328125, "global_step": 479790, "epoch": 2855} {"train_loss": -12.407865524291992, "global_step": 479791, "epoch": 2855} {"train_loss": -12.465458869934082, "global_step": 479792, "epoch": 2855} {"train_loss": -11.61862564086914, "global_step": 479793, "epoch": 2855} {"train_loss": -10.435328483581543, "global_step": 479794, "epoch": 2855} {"train_loss": -11.839655876159668, "global_step": 479795, "epoch": 2855} {"train_loss": -10.612512588500977, "global_step": 479796, "epoch": 2855} {"train_loss": -11.354154586791992, "global_step": 479797, "epoch": 2855} {"train_loss": -9.764699935913086, "global_step": 479798, "epoch": 2855} {"train_loss": -11.255302429199219, "global_step": 479799, "epoch": 2855} {"train_loss": -8.476334571838379, "global_step": 479800, "epoch": 2855} {"train_loss": -10.221771240234375, "global_step": 479801, "epoch": 2855} {"train_loss": -9.472583770751953, "global_step": 479802, "epoch": 2855} {"train_loss": -8.524782180786133, "global_step": 479803, "epoch": 2855} {"train_loss": -7.953302383422852, "global_step": 479804, "epoch": 2855} {"train_loss": -8.172794342041016, "global_step": 479805, "epoch": 2855} {"train_loss": -8.103838920593262, "global_step": 479806, "epoch": 2855} {"train_loss": -12.157574679170336, "global_step": 479807, "epoch": 2855, "val_loss": 315666.9375, "train_action_mse_error": 3.951493740081787} {"train_loss": -8.288187026977539, "global_step": 479808, "epoch": 2856} {"train_loss": -7.959434509277344, "global_step": 479809, "epoch": 2856} {"train_loss": -8.36111831665039, "global_step": 479810, "epoch": 2856} {"train_loss": -7.950634479522705, "global_step": 479811, "epoch": 2856} {"train_loss": -8.444323539733887, "global_step": 479812, "epoch": 2856} {"train_loss": -8.98501205444336, "global_step": 479813, "epoch": 2856} {"train_loss": -8.899173736572266, "global_step": 479814, "epoch": 2856} {"train_loss": -9.234392166137695, "global_step": 479815, "epoch": 2856} {"train_loss": -9.02073860168457, "global_step": 479816, "epoch": 2856} {"train_loss": -9.138030052185059, "global_step": 479817, "epoch": 2856} {"train_loss": -8.702994346618652, "global_step": 479818, "epoch": 2856} {"train_loss": -9.004629135131836, "global_step": 479819, "epoch": 2856} {"train_loss": -9.13442611694336, "global_step": 479820, "epoch": 2856} {"train_loss": -9.62421989440918, "global_step": 479821, "epoch": 2856} {"train_loss": -9.946699142456055, "global_step": 479822, "epoch": 2856} {"train_loss": -10.767621994018555, "global_step": 479823, "epoch": 2856} {"train_loss": -10.765103340148926, "global_step": 479824, "epoch": 2856} {"train_loss": -10.48338508605957, "global_step": 479825, "epoch": 2856} {"train_loss": -11.346750259399414, "global_step": 479826, "epoch": 2856} {"train_loss": -11.669000625610352, "global_step": 479827, "epoch": 2856} {"train_loss": -11.217721939086914, "global_step": 479828, "epoch": 2856} {"train_loss": -10.172386169433594, "global_step": 479829, "epoch": 2856} {"train_loss": -11.012811660766602, "global_step": 479830, "epoch": 2856} {"train_loss": -11.09593391418457, "global_step": 479831, "epoch": 2856} {"train_loss": -11.099893569946289, "global_step": 479832, "epoch": 2856} {"train_loss": -11.378931045532227, "global_step": 479833, "epoch": 2856} {"train_loss": -11.468963623046875, "global_step": 479834, "epoch": 2856} {"train_loss": -10.33933162689209, "global_step": 479835, "epoch": 2856} {"train_loss": -11.187215805053711, "global_step": 479836, "epoch": 2856} {"train_loss": -10.950111389160156, "global_step": 479837, "epoch": 2856} {"train_loss": -10.516677856445312, "global_step": 479838, "epoch": 2856} {"train_loss": -11.539018630981445, "global_step": 479839, "epoch": 2856} {"train_loss": -11.301146507263184, "global_step": 479840, "epoch": 2856} {"train_loss": -11.141706466674805, "global_step": 479841, "epoch": 2856} {"train_loss": -11.236570358276367, "global_step": 479842, "epoch": 2856} {"train_loss": -11.29379653930664, "global_step": 479843, "epoch": 2856} {"train_loss": -11.796932220458984, "global_step": 479844, "epoch": 2856} {"train_loss": -12.159452438354492, "global_step": 479845, "epoch": 2856} {"train_loss": -11.226515769958496, "global_step": 479846, "epoch": 2856} {"train_loss": -11.567949295043945, "global_step": 479847, "epoch": 2856} {"train_loss": -11.50777816772461, "global_step": 479848, "epoch": 2856} {"train_loss": -11.712909698486328, "global_step": 479849, "epoch": 2856} {"train_loss": -11.721841812133789, "global_step": 479850, "epoch": 2856} {"train_loss": -11.991985321044922, "global_step": 479851, "epoch": 2856} {"train_loss": -11.468193054199219, "global_step": 479852, "epoch": 2856} {"train_loss": -11.92270278930664, "global_step": 479853, "epoch": 2856} {"train_loss": -11.814105987548828, "global_step": 479854, "epoch": 2856} {"train_loss": -12.329103469848633, "global_step": 479855, "epoch": 2856} {"train_loss": -12.340860366821289, "global_step": 479856, "epoch": 2856} {"train_loss": -12.416751861572266, "global_step": 479857, "epoch": 2856} {"train_loss": -12.344914436340332, "global_step": 479858, "epoch": 2856} {"train_loss": -12.42791748046875, "global_step": 479859, "epoch": 2856} {"train_loss": -12.194297790527344, "global_step": 479860, "epoch": 2856} {"train_loss": -12.204814910888672, "global_step": 479861, "epoch": 2856} {"train_loss": -12.368114471435547, "global_step": 479862, "epoch": 2856} {"train_loss": -12.112687110900879, "global_step": 479863, "epoch": 2856} {"train_loss": -12.660136222839355, "global_step": 479864, "epoch": 2856} {"train_loss": -12.336252212524414, "global_step": 479865, "epoch": 2856} {"train_loss": -12.188617706298828, "global_step": 479866, "epoch": 2856} {"train_loss": -12.230985641479492, "global_step": 479867, "epoch": 2856} {"train_loss": -12.43610668182373, "global_step": 479868, "epoch": 2856} {"train_loss": -12.521021842956543, "global_step": 479869, "epoch": 2856} {"train_loss": -12.447989463806152, "global_step": 479870, "epoch": 2856} {"train_loss": -12.40987777709961, "global_step": 479871, "epoch": 2856} {"train_loss": -12.532121658325195, "global_step": 479872, "epoch": 2856} {"train_loss": -12.339265823364258, "global_step": 479873, "epoch": 2856} {"train_loss": -12.505536079406738, "global_step": 479874, "epoch": 2856} {"train_loss": -12.480927467346191, "global_step": 479875, "epoch": 2856} {"train_loss": -12.727494239807129, "global_step": 479876, "epoch": 2856} {"train_loss": -12.790882110595703, "global_step": 479877, "epoch": 2856} {"train_loss": -12.545320510864258, "global_step": 479878, "epoch": 2856} {"train_loss": -12.369585037231445, "global_step": 479879, "epoch": 2856} {"train_loss": -12.785757064819336, "global_step": 479880, "epoch": 2856} {"train_loss": -12.42387866973877, "global_step": 479881, "epoch": 2856} {"train_loss": -12.804738998413086, "global_step": 479882, "epoch": 2856} {"train_loss": -12.720468521118164, "global_step": 479883, "epoch": 2856} {"train_loss": -12.479698181152344, "global_step": 479884, "epoch": 2856} {"train_loss": -12.523792266845703, "global_step": 479885, "epoch": 2856} {"train_loss": -12.516885757446289, "global_step": 479886, "epoch": 2856} {"train_loss": -12.300792694091797, "global_step": 479887, "epoch": 2856} {"train_loss": -12.346695899963379, "global_step": 479888, "epoch": 2856} {"train_loss": -12.93935775756836, "global_step": 479889, "epoch": 2856} {"train_loss": -12.489091873168945, "global_step": 479890, "epoch": 2856} {"train_loss": -12.598785400390625, "global_step": 479891, "epoch": 2856} {"train_loss": -12.300519943237305, "global_step": 479892, "epoch": 2856} {"train_loss": -12.705289840698242, "global_step": 479893, "epoch": 2856} {"train_loss": -12.532003402709961, "global_step": 479894, "epoch": 2856} {"train_loss": -12.672806739807129, "global_step": 479895, "epoch": 2856} {"train_loss": -12.632244110107422, "global_step": 479896, "epoch": 2856} {"train_loss": -12.58963680267334, "global_step": 479897, "epoch": 2856} {"train_loss": -12.845730781555176, "global_step": 479898, "epoch": 2856} {"train_loss": -12.623310089111328, "global_step": 479899, "epoch": 2856} {"train_loss": -13.017838478088379, "global_step": 479900, "epoch": 2856} {"train_loss": -12.672593116760254, "global_step": 479901, "epoch": 2856} {"train_loss": -12.733930587768555, "global_step": 479902, "epoch": 2856} {"train_loss": -12.858317375183105, "global_step": 479903, "epoch": 2856} {"train_loss": -12.727739334106445, "global_step": 479904, "epoch": 2856} {"train_loss": -12.937427520751953, "global_step": 479905, "epoch": 2856} {"train_loss": -12.714536666870117, "global_step": 479906, "epoch": 2856} {"train_loss": -12.729957580566406, "global_step": 479907, "epoch": 2856} {"train_loss": -12.697700500488281, "global_step": 479908, "epoch": 2856} {"train_loss": -12.681961059570312, "global_step": 479909, "epoch": 2856} {"train_loss": -12.866865158081055, "global_step": 479910, "epoch": 2856} {"train_loss": -12.628266334533691, "global_step": 479911, "epoch": 2856} {"train_loss": -12.646944999694824, "global_step": 479912, "epoch": 2856} {"train_loss": -12.65829849243164, "global_step": 479913, "epoch": 2856} {"train_loss": -12.599405288696289, "global_step": 479914, "epoch": 2856} {"train_loss": -12.921134948730469, "global_step": 479915, "epoch": 2856} {"train_loss": -12.789863586425781, "global_step": 479916, "epoch": 2856} {"train_loss": -12.887693405151367, "global_step": 479917, "epoch": 2856} {"train_loss": -12.839094161987305, "global_step": 479918, "epoch": 2856} {"train_loss": -12.963926315307617, "global_step": 479919, "epoch": 2856} {"train_loss": -12.638164520263672, "global_step": 479920, "epoch": 2856} {"train_loss": -12.830364227294922, "global_step": 479921, "epoch": 2856} {"train_loss": -12.4552001953125, "global_step": 479922, "epoch": 2856} {"train_loss": -12.869728088378906, "global_step": 479923, "epoch": 2856} {"train_loss": -12.915886878967285, "global_step": 479924, "epoch": 2856} {"train_loss": -12.691393852233887, "global_step": 479925, "epoch": 2856} {"train_loss": -12.77574634552002, "global_step": 479926, "epoch": 2856} {"train_loss": -12.850286483764648, "global_step": 479927, "epoch": 2856} {"train_loss": -12.829802513122559, "global_step": 479928, "epoch": 2856} {"train_loss": -12.926605224609375, "global_step": 479929, "epoch": 2856} {"train_loss": -12.821331024169922, "global_step": 479930, "epoch": 2856} {"train_loss": -12.894023895263672, "global_step": 479931, "epoch": 2856} {"train_loss": -13.004557609558105, "global_step": 479932, "epoch": 2856} {"train_loss": -12.643692016601562, "global_step": 479933, "epoch": 2856} {"train_loss": -12.613838195800781, "global_step": 479934, "epoch": 2856} {"train_loss": -12.51116943359375, "global_step": 479935, "epoch": 2856} {"train_loss": -12.562545776367188, "global_step": 479936, "epoch": 2856} {"train_loss": -12.696406364440918, "global_step": 479937, "epoch": 2856} {"train_loss": -12.585226058959961, "global_step": 479938, "epoch": 2856} {"train_loss": -12.463460922241211, "global_step": 479939, "epoch": 2856} {"train_loss": -12.93680191040039, "global_step": 479940, "epoch": 2856} {"train_loss": -12.275042533874512, "global_step": 479941, "epoch": 2856} {"train_loss": -12.628900527954102, "global_step": 479942, "epoch": 2856} {"train_loss": -12.998321533203125, "global_step": 479943, "epoch": 2856} {"train_loss": -12.603399276733398, "global_step": 479944, "epoch": 2856} {"train_loss": -12.599918365478516, "global_step": 479945, "epoch": 2856} {"train_loss": -12.766927719116211, "global_step": 479946, "epoch": 2856} {"train_loss": -12.73714828491211, "global_step": 479947, "epoch": 2856} {"train_loss": -12.593729019165039, "global_step": 479948, "epoch": 2856} {"train_loss": -12.42466926574707, "global_step": 479949, "epoch": 2856} {"train_loss": -12.507966995239258, "global_step": 479950, "epoch": 2856} {"train_loss": -11.965319633483887, "global_step": 479951, "epoch": 2856} {"train_loss": -11.987314224243164, "global_step": 479952, "epoch": 2856} {"train_loss": -12.059106826782227, "global_step": 479953, "epoch": 2856} {"train_loss": -12.62755298614502, "global_step": 479954, "epoch": 2856} {"train_loss": -11.079133987426758, "global_step": 479955, "epoch": 2856} {"train_loss": -12.771398544311523, "global_step": 479956, "epoch": 2856} {"train_loss": -11.553738594055176, "global_step": 479957, "epoch": 2856} {"train_loss": -10.166485786437988, "global_step": 479958, "epoch": 2856} {"train_loss": -12.739852905273438, "global_step": 479959, "epoch": 2856} {"train_loss": -10.795228958129883, "global_step": 479960, "epoch": 2856} {"train_loss": -11.380739212036133, "global_step": 479961, "epoch": 2856} {"train_loss": -10.810293197631836, "global_step": 479962, "epoch": 2856} {"train_loss": -10.187891006469727, "global_step": 479963, "epoch": 2856} {"train_loss": -10.539963722229004, "global_step": 479964, "epoch": 2856} {"train_loss": -12.116288185119629, "global_step": 479965, "epoch": 2856} {"train_loss": -11.741811752319336, "global_step": 479966, "epoch": 2856} {"train_loss": -11.552743911743164, "global_step": 479967, "epoch": 2856} {"train_loss": -11.97308349609375, "global_step": 479968, "epoch": 2856} {"train_loss": -11.34203052520752, "global_step": 479969, "epoch": 2856} {"train_loss": -10.67253303527832, "global_step": 479970, "epoch": 2856} {"train_loss": -11.985294342041016, "global_step": 479971, "epoch": 2856} {"train_loss": -11.100173950195312, "global_step": 479972, "epoch": 2856} {"train_loss": -9.963661193847656, "global_step": 479973, "epoch": 2856} {"train_loss": -11.822240829467773, "global_step": 479974, "epoch": 2856} {"train_loss": -11.847003468445369, "global_step": 479975, "epoch": 2856, "val_loss": 313295.40625} {"train_loss": -11.76577377319336, "global_step": 479976, "epoch": 2857} {"train_loss": -11.503752708435059, "global_step": 479977, "epoch": 2857} {"train_loss": -11.083147048950195, "global_step": 479978, "epoch": 2857} {"train_loss": -11.906044006347656, "global_step": 479979, "epoch": 2857} {"train_loss": -11.472501754760742, "global_step": 479980, "epoch": 2857} {"train_loss": -11.784406661987305, "global_step": 479981, "epoch": 2857} {"train_loss": -12.079224586486816, "global_step": 479982, "epoch": 2857} {"train_loss": -10.785602569580078, "global_step": 479983, "epoch": 2857} {"train_loss": -12.355864524841309, "global_step": 479984, "epoch": 2857} {"train_loss": -10.959814071655273, "global_step": 479985, "epoch": 2857} {"train_loss": -12.443521499633789, "global_step": 479986, "epoch": 2857} {"train_loss": -11.651590347290039, "global_step": 479987, "epoch": 2857} {"train_loss": -11.719292640686035, "global_step": 479988, "epoch": 2857} {"train_loss": -11.73917007446289, "global_step": 479989, "epoch": 2857} {"train_loss": -11.871072769165039, "global_step": 479990, "epoch": 2857} {"train_loss": -11.526229858398438, "global_step": 479991, "epoch": 2857} {"train_loss": -11.961414337158203, "global_step": 479992, "epoch": 2857} {"train_loss": -11.641839981079102, "global_step": 479993, "epoch": 2857} {"train_loss": -12.016790390014648, "global_step": 479994, "epoch": 2857} {"train_loss": -12.040069580078125, "global_step": 479995, "epoch": 2857} {"train_loss": -11.656957626342773, "global_step": 479996, "epoch": 2857} {"train_loss": -11.621114730834961, "global_step": 479997, "epoch": 2857} {"train_loss": -12.023265838623047, "global_step": 479998, "epoch": 2857} {"train_loss": -11.977413177490234, "global_step": 479999, "epoch": 2857} {"train_loss": -12.027231216430664, "global_step": 480000, "epoch": 2857} {"train_loss": -11.986322402954102, "global_step": 480001, "epoch": 2857} {"train_loss": -12.215996742248535, "global_step": 480002, "epoch": 2857} {"train_loss": -12.321414947509766, "global_step": 480003, "epoch": 2857} {"train_loss": -12.002298355102539, "global_step": 480004, "epoch": 2857} {"train_loss": -12.29435920715332, "global_step": 480005, "epoch": 2857} {"train_loss": -11.776543617248535, "global_step": 480006, "epoch": 2857} {"train_loss": -12.309089660644531, "global_step": 480007, "epoch": 2857} {"train_loss": -12.105326652526855, "global_step": 480008, "epoch": 2857} {"train_loss": -12.242695808410645, "global_step": 480009, "epoch": 2857} {"train_loss": -12.233200073242188, "global_step": 480010, "epoch": 2857} {"train_loss": -11.597410202026367, "global_step": 480011, "epoch": 2857} {"train_loss": -12.459207534790039, "global_step": 480012, "epoch": 2857} {"train_loss": -12.00460433959961, "global_step": 480013, "epoch": 2857} {"train_loss": -11.731219291687012, "global_step": 480014, "epoch": 2857} {"train_loss": -12.34482479095459, "global_step": 480015, "epoch": 2857} {"train_loss": -11.831488609313965, "global_step": 480016, "epoch": 2857} {"train_loss": -12.082937240600586, "global_step": 480017, "epoch": 2857} {"train_loss": -12.02904224395752, "global_step": 480018, "epoch": 2857} {"train_loss": -11.853063583374023, "global_step": 480019, "epoch": 2857} {"train_loss": -12.653191566467285, "global_step": 480020, "epoch": 2857} {"train_loss": -11.700526237487793, "global_step": 480021, "epoch": 2857} {"train_loss": -11.731409072875977, "global_step": 480022, "epoch": 2857} {"train_loss": -11.754438400268555, "global_step": 480023, "epoch": 2857} {"train_loss": -11.666868209838867, "global_step": 480024, "epoch": 2857} {"train_loss": -12.241195678710938, "global_step": 480025, "epoch": 2857} {"train_loss": -12.273791313171387, "global_step": 480026, "epoch": 2857} {"train_loss": -12.202218055725098, "global_step": 480027, "epoch": 2857} {"train_loss": -12.121734619140625, "global_step": 480028, "epoch": 2857} {"train_loss": -11.66019058227539, "global_step": 480029, "epoch": 2857} {"train_loss": -12.152801513671875, "global_step": 480030, "epoch": 2857} {"train_loss": -12.332975387573242, "global_step": 480031, "epoch": 2857} {"train_loss": -12.009989738464355, "global_step": 480032, "epoch": 2857} {"train_loss": -12.198405265808105, "global_step": 480033, "epoch": 2857} {"train_loss": -12.157770156860352, "global_step": 480034, "epoch": 2857} {"train_loss": -12.316336631774902, "global_step": 480035, "epoch": 2857} {"train_loss": -12.206928253173828, "global_step": 480036, "epoch": 2857} {"train_loss": -12.271392822265625, "global_step": 480037, "epoch": 2857} {"train_loss": -12.317729949951172, "global_step": 480038, "epoch": 2857} {"train_loss": -12.336414337158203, "global_step": 480039, "epoch": 2857} {"train_loss": -12.148377418518066, "global_step": 480040, "epoch": 2857} {"train_loss": -12.219953536987305, "global_step": 480041, "epoch": 2857} {"train_loss": -12.254426956176758, "global_step": 480042, "epoch": 2857} {"train_loss": -12.32695198059082, "global_step": 480043, "epoch": 2857} {"train_loss": -12.392072677612305, "global_step": 480044, "epoch": 2857} {"train_loss": -12.304972648620605, "global_step": 480045, "epoch": 2857} {"train_loss": -12.532072067260742, "global_step": 480046, "epoch": 2857} {"train_loss": -12.317172050476074, "global_step": 480047, "epoch": 2857} {"train_loss": -12.364990234375, "global_step": 480048, "epoch": 2857} {"train_loss": -12.607122421264648, "global_step": 480049, "epoch": 2857} {"train_loss": -12.381576538085938, "global_step": 480050, "epoch": 2857} {"train_loss": -12.856973648071289, "global_step": 480051, "epoch": 2857} {"train_loss": -12.66632080078125, "global_step": 480052, "epoch": 2857} {"train_loss": -12.346733093261719, "global_step": 480053, "epoch": 2857} {"train_loss": -12.309991836547852, "global_step": 480054, "epoch": 2857} {"train_loss": -12.619949340820312, "global_step": 480055, "epoch": 2857} {"train_loss": -12.433687210083008, "global_step": 480056, "epoch": 2857} {"train_loss": -12.627565383911133, "global_step": 480057, "epoch": 2857} {"train_loss": -12.28026008605957, "global_step": 480058, "epoch": 2857} {"train_loss": -12.425657272338867, "global_step": 480059, "epoch": 2857} {"train_loss": -12.870412826538086, "global_step": 480060, "epoch": 2857} {"train_loss": -12.13339614868164, "global_step": 480061, "epoch": 2857} {"train_loss": -12.660041809082031, "global_step": 480062, "epoch": 2857} {"train_loss": -12.534008026123047, "global_step": 480063, "epoch": 2857} {"train_loss": -12.260065078735352, "global_step": 480064, "epoch": 2857} {"train_loss": -12.747400283813477, "global_step": 480065, "epoch": 2857} {"train_loss": -12.269342422485352, "global_step": 480066, "epoch": 2857} {"train_loss": -12.707589149475098, "global_step": 480067, "epoch": 2857} {"train_loss": -12.375530242919922, "global_step": 480068, "epoch": 2857} {"train_loss": -12.098930358886719, "global_step": 480069, "epoch": 2857} {"train_loss": -12.600555419921875, "global_step": 480070, "epoch": 2857} {"train_loss": -12.369084358215332, "global_step": 480071, "epoch": 2857} {"train_loss": -12.235185623168945, "global_step": 480072, "epoch": 2857} {"train_loss": -12.78329086303711, "global_step": 480073, "epoch": 2857} {"train_loss": -12.40772819519043, "global_step": 480074, "epoch": 2857} {"train_loss": -12.403392791748047, "global_step": 480075, "epoch": 2857} {"train_loss": -12.479427337646484, "global_step": 480076, "epoch": 2857} {"train_loss": -12.270123481750488, "global_step": 480077, "epoch": 2857} {"train_loss": -12.003168106079102, "global_step": 480078, "epoch": 2857} {"train_loss": -12.616092681884766, "global_step": 480079, "epoch": 2857} {"train_loss": -12.3054838180542, "global_step": 480080, "epoch": 2857} {"train_loss": -12.538755416870117, "global_step": 480081, "epoch": 2857} {"train_loss": -12.315823554992676, "global_step": 480082, "epoch": 2857} {"train_loss": -12.246379852294922, "global_step": 480083, "epoch": 2857} {"train_loss": -12.505997657775879, "global_step": 480084, "epoch": 2857} {"train_loss": -12.330611228942871, "global_step": 480085, "epoch": 2857} {"train_loss": -12.63821029663086, "global_step": 480086, "epoch": 2857} {"train_loss": -12.38514518737793, "global_step": 480087, "epoch": 2857} {"train_loss": -12.509986877441406, "global_step": 480088, "epoch": 2857} {"train_loss": -12.388664245605469, "global_step": 480089, "epoch": 2857} {"train_loss": -12.053049087524414, "global_step": 480090, "epoch": 2857} {"train_loss": -11.966560363769531, "global_step": 480091, "epoch": 2857} {"train_loss": -12.240214347839355, "global_step": 480092, "epoch": 2857} {"train_loss": -12.293610572814941, "global_step": 480093, "epoch": 2857} {"train_loss": -12.233275413513184, "global_step": 480094, "epoch": 2857} {"train_loss": -12.050761222839355, "global_step": 480095, "epoch": 2857} {"train_loss": -12.180610656738281, "global_step": 480096, "epoch": 2857} {"train_loss": -12.155069351196289, "global_step": 480097, "epoch": 2857} {"train_loss": -11.572693824768066, "global_step": 480098, "epoch": 2857} {"train_loss": -12.105295181274414, "global_step": 480099, "epoch": 2857} {"train_loss": -11.631027221679688, "global_step": 480100, "epoch": 2857} {"train_loss": -11.841089248657227, "global_step": 480101, "epoch": 2857} {"train_loss": -11.55837345123291, "global_step": 480102, "epoch": 2857} {"train_loss": -11.995903015136719, "global_step": 480103, "epoch": 2857} {"train_loss": -12.103523254394531, "global_step": 480104, "epoch": 2857} {"train_loss": -11.608009338378906, "global_step": 480105, "epoch": 2857} {"train_loss": -12.18795394897461, "global_step": 480106, "epoch": 2857} {"train_loss": -12.320754051208496, "global_step": 480107, "epoch": 2857} {"train_loss": -12.418323516845703, "global_step": 480108, "epoch": 2857} {"train_loss": -11.82185173034668, "global_step": 480109, "epoch": 2857} {"train_loss": -11.657939910888672, "global_step": 480110, "epoch": 2857} {"train_loss": -12.228878021240234, "global_step": 480111, "epoch": 2857} {"train_loss": -10.57088851928711, "global_step": 480112, "epoch": 2857} {"train_loss": -11.995170593261719, "global_step": 480113, "epoch": 2857} {"train_loss": -10.341421127319336, "global_step": 480114, "epoch": 2857} {"train_loss": -10.984107971191406, "global_step": 480115, "epoch": 2857} {"train_loss": -9.254161834716797, "global_step": 480116, "epoch": 2857} {"train_loss": -11.736441612243652, "global_step": 480117, "epoch": 2857} {"train_loss": -11.343000411987305, "global_step": 480118, "epoch": 2857} {"train_loss": -11.737255096435547, "global_step": 480119, "epoch": 2857} {"train_loss": -11.440589904785156, "global_step": 480120, "epoch": 2857} {"train_loss": -10.841767311096191, "global_step": 480121, "epoch": 2857} {"train_loss": -12.584479331970215, "global_step": 480122, "epoch": 2857} {"train_loss": -10.656655311584473, "global_step": 480123, "epoch": 2857} {"train_loss": -12.30197525024414, "global_step": 480124, "epoch": 2857} {"train_loss": -11.49240493774414, "global_step": 480125, "epoch": 2857} {"train_loss": -11.987457275390625, "global_step": 480126, "epoch": 2857} {"train_loss": -12.119619369506836, "global_step": 480127, "epoch": 2857} {"train_loss": -11.511075973510742, "global_step": 480128, "epoch": 2857} {"train_loss": -12.263409614562988, "global_step": 480129, "epoch": 2857} {"train_loss": -11.432440757751465, "global_step": 480130, "epoch": 2857} {"train_loss": -12.426396369934082, "global_step": 480131, "epoch": 2857} {"train_loss": -11.372023582458496, "global_step": 480132, "epoch": 2857} {"train_loss": -12.362226486206055, "global_step": 480133, "epoch": 2857} {"train_loss": -12.138525009155273, "global_step": 480134, "epoch": 2857} {"train_loss": -12.340639114379883, "global_step": 480135, "epoch": 2857} {"train_loss": -12.402010917663574, "global_step": 480136, "epoch": 2857} {"train_loss": -12.431222915649414, "global_step": 480137, "epoch": 2857} {"train_loss": -12.430490493774414, "global_step": 480138, "epoch": 2857} {"train_loss": -12.339174270629883, "global_step": 480139, "epoch": 2857} {"train_loss": -12.300617218017578, "global_step": 480140, "epoch": 2857} {"train_loss": -12.18940544128418, "global_step": 480141, "epoch": 2857} {"train_loss": -12.387540817260742, "global_step": 480142, "epoch": 2857} {"train_loss": -12.068258592060634, "global_step": 480143, "epoch": 2857, "val_loss": 320231.78125} {"train_loss": -12.29102897644043, "global_step": 480144, "epoch": 2858} {"train_loss": -12.530130386352539, "global_step": 480145, "epoch": 2858} {"train_loss": -11.994770050048828, "global_step": 480146, "epoch": 2858} {"train_loss": -12.575318336486816, "global_step": 480147, "epoch": 2858} {"train_loss": -12.613114356994629, "global_step": 480148, "epoch": 2858} {"train_loss": -12.573567390441895, "global_step": 480149, "epoch": 2858} {"train_loss": -12.522479057312012, "global_step": 480150, "epoch": 2858} {"train_loss": -12.576316833496094, "global_step": 480151, "epoch": 2858} {"train_loss": -12.641861915588379, "global_step": 480152, "epoch": 2858} {"train_loss": -12.731178283691406, "global_step": 480153, "epoch": 2858} {"train_loss": -12.461820602416992, "global_step": 480154, "epoch": 2858} {"train_loss": -12.669502258300781, "global_step": 480155, "epoch": 2858} {"train_loss": -12.738687515258789, "global_step": 480156, "epoch": 2858} {"train_loss": -12.840362548828125, "global_step": 480157, "epoch": 2858} {"train_loss": -12.648882865905762, "global_step": 480158, "epoch": 2858} {"train_loss": -12.736032485961914, "global_step": 480159, "epoch": 2858} {"train_loss": -12.620874404907227, "global_step": 480160, "epoch": 2858} {"train_loss": -12.601446151733398, "global_step": 480161, "epoch": 2858} {"train_loss": -12.479375839233398, "global_step": 480162, "epoch": 2858} {"train_loss": -12.670812606811523, "global_step": 480163, "epoch": 2858} {"train_loss": -12.708744049072266, "global_step": 480164, "epoch": 2858} {"train_loss": -12.780500411987305, "global_step": 480165, "epoch": 2858} {"train_loss": -12.637581825256348, "global_step": 480166, "epoch": 2858} {"train_loss": -12.39527702331543, "global_step": 480167, "epoch": 2858} {"train_loss": -12.723979949951172, "global_step": 480168, "epoch": 2858} {"train_loss": -12.525033950805664, "global_step": 480169, "epoch": 2858} {"train_loss": -12.702807426452637, "global_step": 480170, "epoch": 2858} {"train_loss": -12.852685928344727, "global_step": 480171, "epoch": 2858} {"train_loss": -12.390348434448242, "global_step": 480172, "epoch": 2858} {"train_loss": -12.486945152282715, "global_step": 480173, "epoch": 2858} {"train_loss": -12.567222595214844, "global_step": 480174, "epoch": 2858} {"train_loss": -12.801029205322266, "global_step": 480175, "epoch": 2858} {"train_loss": -12.776582717895508, "global_step": 480176, "epoch": 2858} {"train_loss": -12.653088569641113, "global_step": 480177, "epoch": 2858} {"train_loss": -12.909912109375, "global_step": 480178, "epoch": 2858} {"train_loss": -12.407143592834473, "global_step": 480179, "epoch": 2858} {"train_loss": -12.807672500610352, "global_step": 480180, "epoch": 2858} {"train_loss": -12.907159805297852, "global_step": 480181, "epoch": 2858} {"train_loss": -12.802953720092773, "global_step": 480182, "epoch": 2858} {"train_loss": -12.435481071472168, "global_step": 480183, "epoch": 2858} {"train_loss": -12.8469820022583, "global_step": 480184, "epoch": 2858} {"train_loss": -12.810688018798828, "global_step": 480185, "epoch": 2858} {"train_loss": -12.918600082397461, "global_step": 480186, "epoch": 2858} {"train_loss": -12.78365421295166, "global_step": 480187, "epoch": 2858} {"train_loss": -12.716869354248047, "global_step": 480188, "epoch": 2858} {"train_loss": -12.813827514648438, "global_step": 480189, "epoch": 2858} {"train_loss": -12.682090759277344, "global_step": 480190, "epoch": 2858} {"train_loss": -12.603364944458008, "global_step": 480191, "epoch": 2858} {"train_loss": -12.781668663024902, "global_step": 480192, "epoch": 2858} {"train_loss": -12.485614776611328, "global_step": 480193, "epoch": 2858} {"train_loss": -12.616859436035156, "global_step": 480194, "epoch": 2858} {"train_loss": -12.690187454223633, "global_step": 480195, "epoch": 2858} {"train_loss": -12.833592414855957, "global_step": 480196, "epoch": 2858} {"train_loss": -12.481468200683594, "global_step": 480197, "epoch": 2858} {"train_loss": -12.704660415649414, "global_step": 480198, "epoch": 2858} {"train_loss": -12.836841583251953, "global_step": 480199, "epoch": 2858} {"train_loss": -12.053367614746094, "global_step": 480200, "epoch": 2858} {"train_loss": -12.899825096130371, "global_step": 480201, "epoch": 2858} {"train_loss": -12.51123046875, "global_step": 480202, "epoch": 2858} {"train_loss": -12.80932903289795, "global_step": 480203, "epoch": 2858} {"train_loss": -12.658243179321289, "global_step": 480204, "epoch": 2858} {"train_loss": -12.667859077453613, "global_step": 480205, "epoch": 2858} {"train_loss": -12.642288208007812, "global_step": 480206, "epoch": 2858} {"train_loss": -12.67832088470459, "global_step": 480207, "epoch": 2858} {"train_loss": -12.79162311553955, "global_step": 480208, "epoch": 2858} {"train_loss": -12.724246978759766, "global_step": 480209, "epoch": 2858} {"train_loss": -12.803573608398438, "global_step": 480210, "epoch": 2858} {"train_loss": -12.656065940856934, "global_step": 480211, "epoch": 2858} {"train_loss": -12.83687973022461, "global_step": 480212, "epoch": 2858} {"train_loss": -12.747882843017578, "global_step": 480213, "epoch": 2858} {"train_loss": -12.38892936706543, "global_step": 480214, "epoch": 2858} {"train_loss": -12.44376277923584, "global_step": 480215, "epoch": 2858} {"train_loss": -12.39091968536377, "global_step": 480216, "epoch": 2858} {"train_loss": -12.814262390136719, "global_step": 480217, "epoch": 2858} {"train_loss": -12.583253860473633, "global_step": 480218, "epoch": 2858} {"train_loss": -12.575774192810059, "global_step": 480219, "epoch": 2858} {"train_loss": -12.501117706298828, "global_step": 480220, "epoch": 2858} {"train_loss": -12.64940357208252, "global_step": 480221, "epoch": 2858} {"train_loss": -12.752326965332031, "global_step": 480222, "epoch": 2858} {"train_loss": -12.713836669921875, "global_step": 480223, "epoch": 2858} {"train_loss": -12.460147857666016, "global_step": 480224, "epoch": 2858} {"train_loss": -12.444780349731445, "global_step": 480225, "epoch": 2858} {"train_loss": -12.699728012084961, "global_step": 480226, "epoch": 2858} {"train_loss": -12.718467712402344, "global_step": 480227, "epoch": 2858} {"train_loss": -12.656793594360352, "global_step": 480228, "epoch": 2858} {"train_loss": -12.185066223144531, "global_step": 480229, "epoch": 2858} {"train_loss": -12.59062385559082, "global_step": 480230, "epoch": 2858} {"train_loss": -12.91079330444336, "global_step": 480231, "epoch": 2858} {"train_loss": -11.942935943603516, "global_step": 480232, "epoch": 2858} {"train_loss": -11.78249740600586, "global_step": 480233, "epoch": 2858} {"train_loss": -12.362251281738281, "global_step": 480234, "epoch": 2858} {"train_loss": -12.026925086975098, "global_step": 480235, "epoch": 2858} {"train_loss": -11.419212341308594, "global_step": 480236, "epoch": 2858} {"train_loss": -11.985361099243164, "global_step": 480237, "epoch": 2858} {"train_loss": -11.457571983337402, "global_step": 480238, "epoch": 2858} {"train_loss": -9.011284828186035, "global_step": 480239, "epoch": 2858} {"train_loss": -10.156526565551758, "global_step": 480240, "epoch": 2858} {"train_loss": -10.674664497375488, "global_step": 480241, "epoch": 2858} {"train_loss": -11.51531982421875, "global_step": 480242, "epoch": 2858} {"train_loss": -10.129938125610352, "global_step": 480243, "epoch": 2858} {"train_loss": -11.045052528381348, "global_step": 480244, "epoch": 2858} {"train_loss": -11.553171157836914, "global_step": 480245, "epoch": 2858} {"train_loss": -10.920820236206055, "global_step": 480246, "epoch": 2858} {"train_loss": -11.784199714660645, "global_step": 480247, "epoch": 2858} {"train_loss": -10.467086791992188, "global_step": 480248, "epoch": 2858} {"train_loss": -11.133866310119629, "global_step": 480249, "epoch": 2858} {"train_loss": -11.310142517089844, "global_step": 480250, "epoch": 2858} {"train_loss": -9.89569091796875, "global_step": 480251, "epoch": 2858} {"train_loss": -10.726591110229492, "global_step": 480252, "epoch": 2858} {"train_loss": -9.999868392944336, "global_step": 480253, "epoch": 2858} {"train_loss": -8.64000415802002, "global_step": 480254, "epoch": 2858} {"train_loss": -8.988004684448242, "global_step": 480255, "epoch": 2858} {"train_loss": -9.056234359741211, "global_step": 480256, "epoch": 2858} {"train_loss": -9.527986526489258, "global_step": 480257, "epoch": 2858} {"train_loss": -10.586965560913086, "global_step": 480258, "epoch": 2858} {"train_loss": -8.640385627746582, "global_step": 480259, "epoch": 2858} {"train_loss": -9.885486602783203, "global_step": 480260, "epoch": 2858} {"train_loss": -8.891634941101074, "global_step": 480261, "epoch": 2858} {"train_loss": -11.27754020690918, "global_step": 480262, "epoch": 2858} {"train_loss": -8.362648010253906, "global_step": 480263, "epoch": 2858} {"train_loss": -10.735193252563477, "global_step": 480264, "epoch": 2858} {"train_loss": -9.651247024536133, "global_step": 480265, "epoch": 2858} {"train_loss": -10.957151412963867, "global_step": 480266, "epoch": 2858} {"train_loss": -10.423429489135742, "global_step": 480267, "epoch": 2858} {"train_loss": -10.83314037322998, "global_step": 480268, "epoch": 2858} {"train_loss": -11.239202499389648, "global_step": 480269, "epoch": 2858} {"train_loss": -11.073932647705078, "global_step": 480270, "epoch": 2858} {"train_loss": -11.497964859008789, "global_step": 480271, "epoch": 2858} {"train_loss": -11.12310791015625, "global_step": 480272, "epoch": 2858} {"train_loss": -12.003144264221191, "global_step": 480273, "epoch": 2858} {"train_loss": -10.883033752441406, "global_step": 480274, "epoch": 2858} {"train_loss": -12.163105010986328, "global_step": 480275, "epoch": 2858} {"train_loss": -11.059900283813477, "global_step": 480276, "epoch": 2858} {"train_loss": -12.271625518798828, "global_step": 480277, "epoch": 2858} {"train_loss": -11.37175178527832, "global_step": 480278, "epoch": 2858} {"train_loss": -11.825292587280273, "global_step": 480279, "epoch": 2858} {"train_loss": -11.689613342285156, "global_step": 480280, "epoch": 2858} {"train_loss": -11.762419700622559, "global_step": 480281, "epoch": 2858} {"train_loss": -11.338760375976562, "global_step": 480282, "epoch": 2858} {"train_loss": -11.70121955871582, "global_step": 480283, "epoch": 2858} {"train_loss": -11.650978088378906, "global_step": 480284, "epoch": 2858} {"train_loss": -11.5596923828125, "global_step": 480285, "epoch": 2858} {"train_loss": -12.24875545501709, "global_step": 480286, "epoch": 2858} {"train_loss": -11.578031539916992, "global_step": 480287, "epoch": 2858} {"train_loss": -11.978445053100586, "global_step": 480288, "epoch": 2858} {"train_loss": -12.154077529907227, "global_step": 480289, "epoch": 2858} {"train_loss": -11.781858444213867, "global_step": 480290, "epoch": 2858} {"train_loss": -11.974790573120117, "global_step": 480291, "epoch": 2858} {"train_loss": -12.300090789794922, "global_step": 480292, "epoch": 2858} {"train_loss": -11.872112274169922, "global_step": 480293, "epoch": 2858} {"train_loss": -12.344085693359375, "global_step": 480294, "epoch": 2858} {"train_loss": -12.070414543151855, "global_step": 480295, "epoch": 2858} {"train_loss": -12.181417465209961, "global_step": 480296, "epoch": 2858} {"train_loss": -12.205060958862305, "global_step": 480297, "epoch": 2858} {"train_loss": -11.97816276550293, "global_step": 480298, "epoch": 2858} {"train_loss": -12.375816345214844, "global_step": 480299, "epoch": 2858} {"train_loss": -12.37322998046875, "global_step": 480300, "epoch": 2858} {"train_loss": -12.294382095336914, "global_step": 480301, "epoch": 2858} {"train_loss": -12.144351959228516, "global_step": 480302, "epoch": 2858} {"train_loss": -12.374256134033203, "global_step": 480303, "epoch": 2858} {"train_loss": -12.001124382019043, "global_step": 480304, "epoch": 2858} {"train_loss": -12.461318969726562, "global_step": 480305, "epoch": 2858} {"train_loss": -12.322665214538574, "global_step": 480306, "epoch": 2858} {"train_loss": -11.954561233520508, "global_step": 480307, "epoch": 2858} {"train_loss": -12.577749252319336, "global_step": 480308, "epoch": 2858} {"train_loss": -12.396600723266602, "global_step": 480309, "epoch": 2858} {"train_loss": -12.209573745727539, "global_step": 480310, "epoch": 2858} {"train_loss": -11.993950208028158, "global_step": 480311, "epoch": 2858, "val_loss": 320240.25} {"train_loss": -12.359426498413086, "global_step": 480312, "epoch": 2859} {"train_loss": -12.325312614440918, "global_step": 480313, "epoch": 2859} {"train_loss": -12.586488723754883, "global_step": 480314, "epoch": 2859} {"train_loss": -12.471360206604004, "global_step": 480315, "epoch": 2859} {"train_loss": -12.42878532409668, "global_step": 480316, "epoch": 2859} {"train_loss": -12.653695106506348, "global_step": 480317, "epoch": 2859} {"train_loss": -12.630393981933594, "global_step": 480318, "epoch": 2859} {"train_loss": -12.51713752746582, "global_step": 480319, "epoch": 2859} {"train_loss": -12.356101989746094, "global_step": 480320, "epoch": 2859} {"train_loss": -12.482050895690918, "global_step": 480321, "epoch": 2859} {"train_loss": -12.46615982055664, "global_step": 480322, "epoch": 2859} {"train_loss": -12.458280563354492, "global_step": 480323, "epoch": 2859} {"train_loss": -12.497108459472656, "global_step": 480324, "epoch": 2859} {"train_loss": -12.468624114990234, "global_step": 480325, "epoch": 2859} {"train_loss": -12.541357040405273, "global_step": 480326, "epoch": 2859} {"train_loss": -12.409181594848633, "global_step": 480327, "epoch": 2859} {"train_loss": -12.573728561401367, "global_step": 480328, "epoch": 2859} {"train_loss": -12.505876541137695, "global_step": 480329, "epoch": 2859} {"train_loss": -12.737428665161133, "global_step": 480330, "epoch": 2859} {"train_loss": -12.495594024658203, "global_step": 480331, "epoch": 2859} {"train_loss": -12.533203125, "global_step": 480332, "epoch": 2859} {"train_loss": -12.46439266204834, "global_step": 480333, "epoch": 2859} {"train_loss": -12.736045837402344, "global_step": 480334, "epoch": 2859} {"train_loss": -12.70888900756836, "global_step": 480335, "epoch": 2859} {"train_loss": -12.656126976013184, "global_step": 480336, "epoch": 2859} {"train_loss": -12.625040054321289, "global_step": 480337, "epoch": 2859} {"train_loss": -12.785490036010742, "global_step": 480338, "epoch": 2859} {"train_loss": -12.527006149291992, "global_step": 480339, "epoch": 2859} {"train_loss": -12.683204650878906, "global_step": 480340, "epoch": 2859} {"train_loss": -12.7717866897583, "global_step": 480341, "epoch": 2859} {"train_loss": -12.67251205444336, "global_step": 480342, "epoch": 2859} {"train_loss": -12.749106407165527, "global_step": 480343, "epoch": 2859} {"train_loss": -12.688608169555664, "global_step": 480344, "epoch": 2859} {"train_loss": -12.706527709960938, "global_step": 480345, "epoch": 2859} {"train_loss": -12.720926284790039, "global_step": 480346, "epoch": 2859} {"train_loss": -12.759385108947754, "global_step": 480347, "epoch": 2859} {"train_loss": -12.692817687988281, "global_step": 480348, "epoch": 2859} {"train_loss": -12.56673812866211, "global_step": 480349, "epoch": 2859} {"train_loss": -12.603668212890625, "global_step": 480350, "epoch": 2859} {"train_loss": -12.737312316894531, "global_step": 480351, "epoch": 2859} {"train_loss": -12.913640022277832, "global_step": 480352, "epoch": 2859} {"train_loss": -12.751814842224121, "global_step": 480353, "epoch": 2859} {"train_loss": -12.903430938720703, "global_step": 480354, "epoch": 2859} {"train_loss": -12.958076477050781, "global_step": 480355, "epoch": 2859} {"train_loss": -13.139360427856445, "global_step": 480356, "epoch": 2859} {"train_loss": -12.791720390319824, "global_step": 480357, "epoch": 2859} {"train_loss": -12.836857795715332, "global_step": 480358, "epoch": 2859} {"train_loss": -12.882555961608887, "global_step": 480359, "epoch": 2859} {"train_loss": -12.847146987915039, "global_step": 480360, "epoch": 2859} {"train_loss": -12.85597038269043, "global_step": 480361, "epoch": 2859} {"train_loss": -13.03392505645752, "global_step": 480362, "epoch": 2859} {"train_loss": -12.653695106506348, "global_step": 480363, "epoch": 2859} {"train_loss": -12.71945571899414, "global_step": 480364, "epoch": 2859} {"train_loss": -12.774131774902344, "global_step": 480365, "epoch": 2859} {"train_loss": -12.899768829345703, "global_step": 480366, "epoch": 2859} {"train_loss": -12.938285827636719, "global_step": 480367, "epoch": 2859} {"train_loss": -12.643306732177734, "global_step": 480368, "epoch": 2859} {"train_loss": -12.976242065429688, "global_step": 480369, "epoch": 2859} {"train_loss": -12.92257308959961, "global_step": 480370, "epoch": 2859} {"train_loss": -12.782615661621094, "global_step": 480371, "epoch": 2859} {"train_loss": -12.910642623901367, "global_step": 480372, "epoch": 2859} {"train_loss": -12.590120315551758, "global_step": 480373, "epoch": 2859} {"train_loss": -12.789170265197754, "global_step": 480374, "epoch": 2859} {"train_loss": -12.708077430725098, "global_step": 480375, "epoch": 2859} {"train_loss": -12.804071426391602, "global_step": 480376, "epoch": 2859} {"train_loss": -12.5845308303833, "global_step": 480377, "epoch": 2859} {"train_loss": -12.77012825012207, "global_step": 480378, "epoch": 2859} {"train_loss": -12.891205787658691, "global_step": 480379, "epoch": 2859} {"train_loss": -12.921631813049316, "global_step": 480380, "epoch": 2859} {"train_loss": -12.836735725402832, "global_step": 480381, "epoch": 2859} {"train_loss": -13.004554748535156, "global_step": 480382, "epoch": 2859} {"train_loss": -12.903030395507812, "global_step": 480383, "epoch": 2859} {"train_loss": -12.867499351501465, "global_step": 480384, "epoch": 2859} {"train_loss": -13.09597110748291, "global_step": 480385, "epoch": 2859} {"train_loss": -12.859155654907227, "global_step": 480386, "epoch": 2859} {"train_loss": -13.105840682983398, "global_step": 480387, "epoch": 2859} {"train_loss": -12.77241325378418, "global_step": 480388, "epoch": 2859} {"train_loss": -12.963811874389648, "global_step": 480389, "epoch": 2859} {"train_loss": -12.581291198730469, "global_step": 480390, "epoch": 2859} {"train_loss": -13.268019676208496, "global_step": 480391, "epoch": 2859} {"train_loss": -13.001066207885742, "global_step": 480392, "epoch": 2859} {"train_loss": -11.91423511505127, "global_step": 480393, "epoch": 2859} {"train_loss": -12.538382530212402, "global_step": 480394, "epoch": 2859} {"train_loss": -12.404289245605469, "global_step": 480395, "epoch": 2859} {"train_loss": -12.768417358398438, "global_step": 480396, "epoch": 2859} {"train_loss": -11.656712532043457, "global_step": 480397, "epoch": 2859} {"train_loss": -12.405233383178711, "global_step": 480398, "epoch": 2859} {"train_loss": -12.464273452758789, "global_step": 480399, "epoch": 2859} {"train_loss": -12.20504379272461, "global_step": 480400, "epoch": 2859} {"train_loss": -12.761377334594727, "global_step": 480401, "epoch": 2859} {"train_loss": -11.997869491577148, "global_step": 480402, "epoch": 2859} {"train_loss": -13.047818183898926, "global_step": 480403, "epoch": 2859} {"train_loss": -12.039344787597656, "global_step": 480404, "epoch": 2859} {"train_loss": -12.672561645507812, "global_step": 480405, "epoch": 2859} {"train_loss": -12.005908966064453, "global_step": 480406, "epoch": 2859} {"train_loss": -12.339738845825195, "global_step": 480407, "epoch": 2859} {"train_loss": -12.546785354614258, "global_step": 480408, "epoch": 2859} {"train_loss": -12.532114028930664, "global_step": 480409, "epoch": 2859} {"train_loss": -12.576400756835938, "global_step": 480410, "epoch": 2859} {"train_loss": -12.947378158569336, "global_step": 480411, "epoch": 2859} {"train_loss": -12.622119903564453, "global_step": 480412, "epoch": 2859} {"train_loss": -12.683633804321289, "global_step": 480413, "epoch": 2859} {"train_loss": -12.536727905273438, "global_step": 480414, "epoch": 2859} {"train_loss": -12.78177547454834, "global_step": 480415, "epoch": 2859} {"train_loss": -12.542835235595703, "global_step": 480416, "epoch": 2859} {"train_loss": -12.782470703125, "global_step": 480417, "epoch": 2859} {"train_loss": -12.28947639465332, "global_step": 480418, "epoch": 2859} {"train_loss": -12.797134399414062, "global_step": 480419, "epoch": 2859} {"train_loss": -12.119949340820312, "global_step": 480420, "epoch": 2859} {"train_loss": -12.944494247436523, "global_step": 480421, "epoch": 2859} {"train_loss": -11.620156288146973, "global_step": 480422, "epoch": 2859} {"train_loss": -12.1409273147583, "global_step": 480423, "epoch": 2859} {"train_loss": -12.439790725708008, "global_step": 480424, "epoch": 2859} {"train_loss": -11.900028228759766, "global_step": 480425, "epoch": 2859} {"train_loss": -12.017948150634766, "global_step": 480426, "epoch": 2859} {"train_loss": -11.689311981201172, "global_step": 480427, "epoch": 2859} {"train_loss": -11.503900527954102, "global_step": 480428, "epoch": 2859} {"train_loss": -10.270771026611328, "global_step": 480429, "epoch": 2859} {"train_loss": -10.638511657714844, "global_step": 480430, "epoch": 2859} {"train_loss": -9.336475372314453, "global_step": 480431, "epoch": 2859} {"train_loss": -9.482980728149414, "global_step": 480432, "epoch": 2859} {"train_loss": -9.560770034790039, "global_step": 480433, "epoch": 2859} {"train_loss": -10.907804489135742, "global_step": 480434, "epoch": 2859} {"train_loss": -9.304906845092773, "global_step": 480435, "epoch": 2859} {"train_loss": -10.800012588500977, "global_step": 480436, "epoch": 2859} {"train_loss": -11.475475311279297, "global_step": 480437, "epoch": 2859} {"train_loss": -10.948050498962402, "global_step": 480438, "epoch": 2859} {"train_loss": -10.494876861572266, "global_step": 480439, "epoch": 2859} {"train_loss": -11.57696533203125, "global_step": 480440, "epoch": 2859} {"train_loss": -10.884723663330078, "global_step": 480441, "epoch": 2859} {"train_loss": -10.641250610351562, "global_step": 480442, "epoch": 2859} {"train_loss": -11.748559951782227, "global_step": 480443, "epoch": 2859} {"train_loss": -9.831850051879883, "global_step": 480444, "epoch": 2859} {"train_loss": -11.252055168151855, "global_step": 480445, "epoch": 2859} {"train_loss": -10.396358489990234, "global_step": 480446, "epoch": 2859} {"train_loss": -9.395954132080078, "global_step": 480447, "epoch": 2859} {"train_loss": -10.232391357421875, "global_step": 480448, "epoch": 2859} {"train_loss": -11.635517120361328, "global_step": 480449, "epoch": 2859} {"train_loss": -10.631237983703613, "global_step": 480450, "epoch": 2859} {"train_loss": -11.401388168334961, "global_step": 480451, "epoch": 2859} {"train_loss": -11.069124221801758, "global_step": 480452, "epoch": 2859} {"train_loss": -11.004293441772461, "global_step": 480453, "epoch": 2859} {"train_loss": -11.790688514709473, "global_step": 480454, "epoch": 2859} {"train_loss": -10.613426208496094, "global_step": 480455, "epoch": 2859} {"train_loss": -12.252555847167969, "global_step": 480456, "epoch": 2859} {"train_loss": -11.095358848571777, "global_step": 480457, "epoch": 2859} {"train_loss": -11.84865665435791, "global_step": 480458, "epoch": 2859} {"train_loss": -11.581659317016602, "global_step": 480459, "epoch": 2859} {"train_loss": -11.575031280517578, "global_step": 480460, "epoch": 2859} {"train_loss": -11.255943298339844, "global_step": 480461, "epoch": 2859} {"train_loss": -11.564833641052246, "global_step": 480462, "epoch": 2859} {"train_loss": -11.682554244995117, "global_step": 480463, "epoch": 2859} {"train_loss": -11.506860733032227, "global_step": 480464, "epoch": 2859} {"train_loss": -10.801389694213867, "global_step": 480465, "epoch": 2859} {"train_loss": -11.470626831054688, "global_step": 480466, "epoch": 2859} {"train_loss": -11.33728313446045, "global_step": 480467, "epoch": 2859} {"train_loss": -12.267913818359375, "global_step": 480468, "epoch": 2859} {"train_loss": -11.067983627319336, "global_step": 480469, "epoch": 2859} {"train_loss": -12.072299003601074, "global_step": 480470, "epoch": 2859} {"train_loss": -12.137646675109863, "global_step": 480471, "epoch": 2859} {"train_loss": -11.957456588745117, "global_step": 480472, "epoch": 2859} {"train_loss": -12.173788070678711, "global_step": 480473, "epoch": 2859} {"train_loss": -11.806198120117188, "global_step": 480474, "epoch": 2859} {"train_loss": -11.944435119628906, "global_step": 480475, "epoch": 2859} {"train_loss": -11.99138069152832, "global_step": 480476, "epoch": 2859} {"train_loss": -12.063962936401367, "global_step": 480477, "epoch": 2859} {"train_loss": -11.974916458129883, "global_step": 480478, "epoch": 2859} {"train_loss": -12.173382571765355, "global_step": 480479, "epoch": 2859, "val_loss": 313526.71875} {"train_loss": -11.46231460571289, "global_step": 480480, "epoch": 2860} {"train_loss": -12.409706115722656, "global_step": 480481, "epoch": 2860} {"train_loss": -11.682378768920898, "global_step": 480482, "epoch": 2860} {"train_loss": -12.183189392089844, "global_step": 480483, "epoch": 2860} {"train_loss": -12.057499885559082, "global_step": 480484, "epoch": 2860} {"train_loss": -12.121953964233398, "global_step": 480485, "epoch": 2860} {"train_loss": -12.091672897338867, "global_step": 480486, "epoch": 2860} {"train_loss": -12.23333740234375, "global_step": 480487, "epoch": 2860} {"train_loss": -12.40542221069336, "global_step": 480488, "epoch": 2860} {"train_loss": -12.651403427124023, "global_step": 480489, "epoch": 2860} {"train_loss": -12.322811126708984, "global_step": 480490, "epoch": 2860} {"train_loss": -12.323780059814453, "global_step": 480491, "epoch": 2860} {"train_loss": -12.540882110595703, "global_step": 480492, "epoch": 2860} {"train_loss": -12.208717346191406, "global_step": 480493, "epoch": 2860} {"train_loss": -12.409021377563477, "global_step": 480494, "epoch": 2860} {"train_loss": -12.335152626037598, "global_step": 480495, "epoch": 2860} {"train_loss": -12.463051795959473, "global_step": 480496, "epoch": 2860} {"train_loss": -12.547961235046387, "global_step": 480497, "epoch": 2860} {"train_loss": -12.47422981262207, "global_step": 480498, "epoch": 2860} {"train_loss": -12.577408790588379, "global_step": 480499, "epoch": 2860} {"train_loss": -12.37666130065918, "global_step": 480500, "epoch": 2860} {"train_loss": -12.350790977478027, "global_step": 480501, "epoch": 2860} {"train_loss": -12.6350679397583, "global_step": 480502, "epoch": 2860} {"train_loss": -12.535529136657715, "global_step": 480503, "epoch": 2860} {"train_loss": -12.581302642822266, "global_step": 480504, "epoch": 2860} {"train_loss": -12.59873104095459, "global_step": 480505, "epoch": 2860} {"train_loss": -12.37441635131836, "global_step": 480506, "epoch": 2860} {"train_loss": -12.80561637878418, "global_step": 480507, "epoch": 2860} {"train_loss": -12.52834701538086, "global_step": 480508, "epoch": 2860} {"train_loss": -12.483977317810059, "global_step": 480509, "epoch": 2860} {"train_loss": -12.781927108764648, "global_step": 480510, "epoch": 2860} {"train_loss": -12.76591968536377, "global_step": 480511, "epoch": 2860} {"train_loss": -12.757104873657227, "global_step": 480512, "epoch": 2860} {"train_loss": -12.554767608642578, "global_step": 480513, "epoch": 2860} {"train_loss": -12.706709861755371, "global_step": 480514, "epoch": 2860} {"train_loss": -12.387174606323242, "global_step": 480515, "epoch": 2860} {"train_loss": -12.689838409423828, "global_step": 480516, "epoch": 2860} {"train_loss": -12.537565231323242, "global_step": 480517, "epoch": 2860} {"train_loss": -12.831411361694336, "global_step": 480518, "epoch": 2860} {"train_loss": -12.54659366607666, "global_step": 480519, "epoch": 2860} {"train_loss": -12.88676929473877, "global_step": 480520, "epoch": 2860} {"train_loss": -12.851223945617676, "global_step": 480521, "epoch": 2860} {"train_loss": -12.728585243225098, "global_step": 480522, "epoch": 2860} {"train_loss": -12.78569507598877, "global_step": 480523, "epoch": 2860} {"train_loss": -12.840794563293457, "global_step": 480524, "epoch": 2860} {"train_loss": -12.494839668273926, "global_step": 480525, "epoch": 2860} {"train_loss": -12.708008766174316, "global_step": 480526, "epoch": 2860} {"train_loss": -12.867744445800781, "global_step": 480527, "epoch": 2860} {"train_loss": -12.872157096862793, "global_step": 480528, "epoch": 2860} {"train_loss": -12.706340789794922, "global_step": 480529, "epoch": 2860} {"train_loss": -12.712841033935547, "global_step": 480530, "epoch": 2860} {"train_loss": -12.73331069946289, "global_step": 480531, "epoch": 2860} {"train_loss": -12.950447082519531, "global_step": 480532, "epoch": 2860} {"train_loss": -12.657079696655273, "global_step": 480533, "epoch": 2860} {"train_loss": -12.942438125610352, "global_step": 480534, "epoch": 2860} {"train_loss": -12.553781509399414, "global_step": 480535, "epoch": 2860} {"train_loss": -12.75309944152832, "global_step": 480536, "epoch": 2860} {"train_loss": -12.826034545898438, "global_step": 480537, "epoch": 2860} {"train_loss": -12.82715892791748, "global_step": 480538, "epoch": 2860} {"train_loss": -12.956449508666992, "global_step": 480539, "epoch": 2860} {"train_loss": -12.616693496704102, "global_step": 480540, "epoch": 2860} {"train_loss": -12.712797164916992, "global_step": 480541, "epoch": 2860} {"train_loss": -13.022502899169922, "global_step": 480542, "epoch": 2860} {"train_loss": -12.883601188659668, "global_step": 480543, "epoch": 2860} {"train_loss": -13.019054412841797, "global_step": 480544, "epoch": 2860} {"train_loss": -12.965193748474121, "global_step": 480545, "epoch": 2860} {"train_loss": -13.055389404296875, "global_step": 480546, "epoch": 2860} {"train_loss": -12.681621551513672, "global_step": 480547, "epoch": 2860} {"train_loss": -12.832097053527832, "global_step": 480548, "epoch": 2860} {"train_loss": -12.662044525146484, "global_step": 480549, "epoch": 2860} {"train_loss": -12.685920715332031, "global_step": 480550, "epoch": 2860} {"train_loss": -12.724225044250488, "global_step": 480551, "epoch": 2860} {"train_loss": -12.810726165771484, "global_step": 480552, "epoch": 2860} {"train_loss": -12.65628433227539, "global_step": 480553, "epoch": 2860} {"train_loss": -12.843117713928223, "global_step": 480554, "epoch": 2860} {"train_loss": -13.052122116088867, "global_step": 480555, "epoch": 2860} {"train_loss": -13.018251419067383, "global_step": 480556, "epoch": 2860} {"train_loss": -12.610538482666016, "global_step": 480557, "epoch": 2860} {"train_loss": -12.836742401123047, "global_step": 480558, "epoch": 2860} {"train_loss": -12.87890625, "global_step": 480559, "epoch": 2860} {"train_loss": -12.826356887817383, "global_step": 480560, "epoch": 2860} {"train_loss": -12.634546279907227, "global_step": 480561, "epoch": 2860} {"train_loss": -12.432836532592773, "global_step": 480562, "epoch": 2860} {"train_loss": -12.258974075317383, "global_step": 480563, "epoch": 2860} {"train_loss": -12.530511856079102, "global_step": 480564, "epoch": 2860} {"train_loss": -13.032526016235352, "global_step": 480565, "epoch": 2860} {"train_loss": -12.815969467163086, "global_step": 480566, "epoch": 2860} {"train_loss": -12.89683723449707, "global_step": 480567, "epoch": 2860} {"train_loss": -13.032081604003906, "global_step": 480568, "epoch": 2860} {"train_loss": -12.894341468811035, "global_step": 480569, "epoch": 2860} {"train_loss": -12.592962265014648, "global_step": 480570, "epoch": 2860} {"train_loss": -12.540571212768555, "global_step": 480571, "epoch": 2860} {"train_loss": -12.916055679321289, "global_step": 480572, "epoch": 2860} {"train_loss": -12.21328067779541, "global_step": 480573, "epoch": 2860} {"train_loss": -11.751090049743652, "global_step": 480574, "epoch": 2860} {"train_loss": -12.262229919433594, "global_step": 480575, "epoch": 2860} {"train_loss": -12.840051651000977, "global_step": 480576, "epoch": 2860} {"train_loss": -12.800485610961914, "global_step": 480577, "epoch": 2860} {"train_loss": -11.828556060791016, "global_step": 480578, "epoch": 2860} {"train_loss": -11.673998832702637, "global_step": 480579, "epoch": 2860} {"train_loss": -11.9530029296875, "global_step": 480580, "epoch": 2860} {"train_loss": -12.667438507080078, "global_step": 480581, "epoch": 2860} {"train_loss": -12.494527816772461, "global_step": 480582, "epoch": 2860} {"train_loss": -12.504926681518555, "global_step": 480583, "epoch": 2860} {"train_loss": -12.94825267791748, "global_step": 480584, "epoch": 2860} {"train_loss": -12.370573997497559, "global_step": 480585, "epoch": 2860} {"train_loss": -11.382360458374023, "global_step": 480586, "epoch": 2860} {"train_loss": -11.944421768188477, "global_step": 480587, "epoch": 2860} {"train_loss": -13.110450744628906, "global_step": 480588, "epoch": 2860} {"train_loss": -12.162883758544922, "global_step": 480589, "epoch": 2860} {"train_loss": -11.572453498840332, "global_step": 480590, "epoch": 2860} {"train_loss": -12.593993186950684, "global_step": 480591, "epoch": 2860} {"train_loss": -12.409112930297852, "global_step": 480592, "epoch": 2860} {"train_loss": -11.362001419067383, "global_step": 480593, "epoch": 2860} {"train_loss": -11.684006690979004, "global_step": 480594, "epoch": 2860} {"train_loss": -12.724889755249023, "global_step": 480595, "epoch": 2860} {"train_loss": -12.466495513916016, "global_step": 480596, "epoch": 2860} {"train_loss": -12.21757984161377, "global_step": 480597, "epoch": 2860} {"train_loss": -12.16279411315918, "global_step": 480598, "epoch": 2860} {"train_loss": -12.610763549804688, "global_step": 480599, "epoch": 2860} {"train_loss": -12.63119125366211, "global_step": 480600, "epoch": 2860} {"train_loss": -12.639713287353516, "global_step": 480601, "epoch": 2860} {"train_loss": -12.724897384643555, "global_step": 480602, "epoch": 2860} {"train_loss": -12.38945198059082, "global_step": 480603, "epoch": 2860} {"train_loss": -12.329668045043945, "global_step": 480604, "epoch": 2860} {"train_loss": -12.54030990600586, "global_step": 480605, "epoch": 2860} {"train_loss": -11.938243865966797, "global_step": 480606, "epoch": 2860} {"train_loss": -12.054876327514648, "global_step": 480607, "epoch": 2860} {"train_loss": -12.147134780883789, "global_step": 480608, "epoch": 2860} {"train_loss": -10.897031784057617, "global_step": 480609, "epoch": 2860} {"train_loss": -11.427204132080078, "global_step": 480610, "epoch": 2860} {"train_loss": -10.753639221191406, "global_step": 480611, "epoch": 2860} {"train_loss": -10.75286865234375, "global_step": 480612, "epoch": 2860} {"train_loss": -11.940689086914062, "global_step": 480613, "epoch": 2860} {"train_loss": -9.756038665771484, "global_step": 480614, "epoch": 2860} {"train_loss": -12.17953109741211, "global_step": 480615, "epoch": 2860} {"train_loss": -11.640535354614258, "global_step": 480616, "epoch": 2860} {"train_loss": -10.797843933105469, "global_step": 480617, "epoch": 2860} {"train_loss": -12.414976119995117, "global_step": 480618, "epoch": 2860} {"train_loss": -11.88366413116455, "global_step": 480619, "epoch": 2860} {"train_loss": -11.450759887695312, "global_step": 480620, "epoch": 2860} {"train_loss": -11.514631271362305, "global_step": 480621, "epoch": 2860} {"train_loss": -11.951616287231445, "global_step": 480622, "epoch": 2860} {"train_loss": -12.169681549072266, "global_step": 480623, "epoch": 2860} {"train_loss": -12.04429817199707, "global_step": 480624, "epoch": 2860} {"train_loss": -12.004341125488281, "global_step": 480625, "epoch": 2860} {"train_loss": -11.46861743927002, "global_step": 480626, "epoch": 2860} {"train_loss": -11.642483711242676, "global_step": 480627, "epoch": 2860} {"train_loss": -12.009166717529297, "global_step": 480628, "epoch": 2860} {"train_loss": -11.739444732666016, "global_step": 480629, "epoch": 2860} {"train_loss": -12.166263580322266, "global_step": 480630, "epoch": 2860} {"train_loss": -11.97097396850586, "global_step": 480631, "epoch": 2860} {"train_loss": -11.61044692993164, "global_step": 480632, "epoch": 2860} {"train_loss": -11.99949836730957, "global_step": 480633, "epoch": 2860} {"train_loss": -11.752300262451172, "global_step": 480634, "epoch": 2860} {"train_loss": -12.421808242797852, "global_step": 480635, "epoch": 2860} {"train_loss": -11.728858947753906, "global_step": 480636, "epoch": 2860} {"train_loss": -12.437041282653809, "global_step": 480637, "epoch": 2860} {"train_loss": -12.028009414672852, "global_step": 480638, "epoch": 2860} {"train_loss": -12.4253568649292, "global_step": 480639, "epoch": 2860} {"train_loss": -12.053363800048828, "global_step": 480640, "epoch": 2860} {"train_loss": -12.481452941894531, "global_step": 480641, "epoch": 2860} {"train_loss": -12.328232765197754, "global_step": 480642, "epoch": 2860} {"train_loss": -11.978591918945312, "global_step": 480643, "epoch": 2860} {"train_loss": -12.507877349853516, "global_step": 480644, "epoch": 2860} {"train_loss": -12.496273040771484, "global_step": 480645, "epoch": 2860} {"train_loss": -12.618803024291992, "global_step": 480646, "epoch": 2860} {"train_loss": -12.37475898152306, "global_step": 480647, "epoch": 2860, "val_loss": 313836.5625, "train_action_mse_error": 1.050759196281433} {"train_loss": -12.522101402282715, "global_step": 480648, "epoch": 2861} {"train_loss": -12.597647666931152, "global_step": 480649, "epoch": 2861} {"train_loss": -12.93276309967041, "global_step": 480650, "epoch": 2861} {"train_loss": -12.264505386352539, "global_step": 480651, "epoch": 2861} {"train_loss": -12.850801467895508, "global_step": 480652, "epoch": 2861} {"train_loss": -12.596991539001465, "global_step": 480653, "epoch": 2861} {"train_loss": -12.7679443359375, "global_step": 480654, "epoch": 2861} {"train_loss": -12.680051803588867, "global_step": 480655, "epoch": 2861} {"train_loss": -12.352411270141602, "global_step": 480656, "epoch": 2861} {"train_loss": -12.738444328308105, "global_step": 480657, "epoch": 2861} {"train_loss": -12.45451831817627, "global_step": 480658, "epoch": 2861} {"train_loss": -12.450345039367676, "global_step": 480659, "epoch": 2861} {"train_loss": -12.256567001342773, "global_step": 480660, "epoch": 2861} {"train_loss": -11.439878463745117, "global_step": 480661, "epoch": 2861} {"train_loss": -12.537108421325684, "global_step": 480662, "epoch": 2861} {"train_loss": -11.795669555664062, "global_step": 480663, "epoch": 2861} {"train_loss": -10.815389633178711, "global_step": 480664, "epoch": 2861} {"train_loss": -12.282554626464844, "global_step": 480665, "epoch": 2861} {"train_loss": -9.953472137451172, "global_step": 480666, "epoch": 2861} {"train_loss": -12.840692520141602, "global_step": 480667, "epoch": 2861} {"train_loss": -11.18451976776123, "global_step": 480668, "epoch": 2861} {"train_loss": -10.400726318359375, "global_step": 480669, "epoch": 2861} {"train_loss": -10.91220760345459, "global_step": 480670, "epoch": 2861} {"train_loss": -12.148277282714844, "global_step": 480671, "epoch": 2861} {"train_loss": -10.802882194519043, "global_step": 480672, "epoch": 2861} {"train_loss": -12.05656623840332, "global_step": 480673, "epoch": 2861} {"train_loss": -10.063163757324219, "global_step": 480674, "epoch": 2861} {"train_loss": -10.802962303161621, "global_step": 480675, "epoch": 2861} {"train_loss": -11.922310829162598, "global_step": 480676, "epoch": 2861} {"train_loss": -11.298162460327148, "global_step": 480677, "epoch": 2861} {"train_loss": -11.313092231750488, "global_step": 480678, "epoch": 2861} {"train_loss": -11.83226203918457, "global_step": 480679, "epoch": 2861} {"train_loss": -11.892992973327637, "global_step": 480680, "epoch": 2861} {"train_loss": -11.73089599609375, "global_step": 480681, "epoch": 2861} {"train_loss": -12.045303344726562, "global_step": 480682, "epoch": 2861} {"train_loss": -11.944644927978516, "global_step": 480683, "epoch": 2861} {"train_loss": -11.221034049987793, "global_step": 480684, "epoch": 2861} {"train_loss": -12.010664939880371, "global_step": 480685, "epoch": 2861} {"train_loss": -12.016336441040039, "global_step": 480686, "epoch": 2861} {"train_loss": -12.111166000366211, "global_step": 480687, "epoch": 2861} {"train_loss": -12.166741371154785, "global_step": 480688, "epoch": 2861} {"train_loss": -11.323410034179688, "global_step": 480689, "epoch": 2861} {"train_loss": -11.523092269897461, "global_step": 480690, "epoch": 2861} {"train_loss": -11.503811836242676, "global_step": 480691, "epoch": 2861} {"train_loss": -11.909154891967773, "global_step": 480692, "epoch": 2861} {"train_loss": -10.681777000427246, "global_step": 480693, "epoch": 2861} {"train_loss": -10.883113861083984, "global_step": 480694, "epoch": 2861} {"train_loss": -11.17105770111084, "global_step": 480695, "epoch": 2861} {"train_loss": -10.68913459777832, "global_step": 480696, "epoch": 2861} {"train_loss": -11.671165466308594, "global_step": 480697, "epoch": 2861} {"train_loss": -11.288761138916016, "global_step": 480698, "epoch": 2861} {"train_loss": -10.976591110229492, "global_step": 480699, "epoch": 2861} {"train_loss": -12.003464698791504, "global_step": 480700, "epoch": 2861} {"train_loss": -11.417771339416504, "global_step": 480701, "epoch": 2861} {"train_loss": -11.577033996582031, "global_step": 480702, "epoch": 2861} {"train_loss": -11.902822494506836, "global_step": 480703, "epoch": 2861} {"train_loss": -11.454029083251953, "global_step": 480704, "epoch": 2861} {"train_loss": -11.651984214782715, "global_step": 480705, "epoch": 2861} {"train_loss": -11.898756980895996, "global_step": 480706, "epoch": 2861} {"train_loss": -11.948473930358887, "global_step": 480707, "epoch": 2861} {"train_loss": -12.286140441894531, "global_step": 480708, "epoch": 2861} {"train_loss": -12.055890083312988, "global_step": 480709, "epoch": 2861} {"train_loss": -12.141361236572266, "global_step": 480710, "epoch": 2861} {"train_loss": -12.267301559448242, "global_step": 480711, "epoch": 2861} {"train_loss": -12.048700332641602, "global_step": 480712, "epoch": 2861} {"train_loss": -12.623062133789062, "global_step": 480713, "epoch": 2861} {"train_loss": -12.100932121276855, "global_step": 480714, "epoch": 2861} {"train_loss": -12.488794326782227, "global_step": 480715, "epoch": 2861} {"train_loss": -12.12083625793457, "global_step": 480716, "epoch": 2861} {"train_loss": -12.00582504272461, "global_step": 480717, "epoch": 2861} {"train_loss": -12.65638542175293, "global_step": 480718, "epoch": 2861} {"train_loss": -12.303444862365723, "global_step": 480719, "epoch": 2861} {"train_loss": -12.529223442077637, "global_step": 480720, "epoch": 2861} {"train_loss": -12.258437156677246, "global_step": 480721, "epoch": 2861} {"train_loss": -12.381012916564941, "global_step": 480722, "epoch": 2861} {"train_loss": -12.41316032409668, "global_step": 480723, "epoch": 2861} {"train_loss": -12.454099655151367, "global_step": 480724, "epoch": 2861} {"train_loss": -12.381967544555664, "global_step": 480725, "epoch": 2861} {"train_loss": -12.603804588317871, "global_step": 480726, "epoch": 2861} {"train_loss": -12.556610107421875, "global_step": 480727, "epoch": 2861} {"train_loss": -12.413835525512695, "global_step": 480728, "epoch": 2861} {"train_loss": -12.555414199829102, "global_step": 480729, "epoch": 2861} {"train_loss": -12.738550186157227, "global_step": 480730, "epoch": 2861} {"train_loss": -12.853672981262207, "global_step": 480731, "epoch": 2861} {"train_loss": -12.506904602050781, "global_step": 480732, "epoch": 2861} {"train_loss": -12.448017120361328, "global_step": 480733, "epoch": 2861} {"train_loss": -12.47615909576416, "global_step": 480734, "epoch": 2861} {"train_loss": -12.529976844787598, "global_step": 480735, "epoch": 2861} {"train_loss": -12.375136375427246, "global_step": 480736, "epoch": 2861} {"train_loss": -12.752758026123047, "global_step": 480737, "epoch": 2861} {"train_loss": -12.36583137512207, "global_step": 480738, "epoch": 2861} {"train_loss": -12.561445236206055, "global_step": 480739, "epoch": 2861} {"train_loss": -12.185657501220703, "global_step": 480740, "epoch": 2861} {"train_loss": -12.791654586791992, "global_step": 480741, "epoch": 2861} {"train_loss": -12.522712707519531, "global_step": 480742, "epoch": 2861} {"train_loss": -12.682668685913086, "global_step": 480743, "epoch": 2861} {"train_loss": -12.679059982299805, "global_step": 480744, "epoch": 2861} {"train_loss": -12.722894668579102, "global_step": 480745, "epoch": 2861} {"train_loss": -12.733077049255371, "global_step": 480746, "epoch": 2861} {"train_loss": -12.570591926574707, "global_step": 480747, "epoch": 2861} {"train_loss": -12.721318244934082, "global_step": 480748, "epoch": 2861} {"train_loss": -12.781243324279785, "global_step": 480749, "epoch": 2861} {"train_loss": -12.441191673278809, "global_step": 480750, "epoch": 2861} {"train_loss": -12.908703804016113, "global_step": 480751, "epoch": 2861} {"train_loss": -12.538444519042969, "global_step": 480752, "epoch": 2861} {"train_loss": -12.930025100708008, "global_step": 480753, "epoch": 2861} {"train_loss": -12.830707550048828, "global_step": 480754, "epoch": 2861} {"train_loss": -12.743626594543457, "global_step": 480755, "epoch": 2861} {"train_loss": -12.706352233886719, "global_step": 480756, "epoch": 2861} {"train_loss": -12.86402416229248, "global_step": 480757, "epoch": 2861} {"train_loss": -12.787252426147461, "global_step": 480758, "epoch": 2861} {"train_loss": -12.69422721862793, "global_step": 480759, "epoch": 2861} {"train_loss": -12.811599731445312, "global_step": 480760, "epoch": 2861} {"train_loss": -12.896139144897461, "global_step": 480761, "epoch": 2861} {"train_loss": -12.801262855529785, "global_step": 480762, "epoch": 2861} {"train_loss": -12.862691879272461, "global_step": 480763, "epoch": 2861} {"train_loss": -12.363388061523438, "global_step": 480764, "epoch": 2861} {"train_loss": -12.605985641479492, "global_step": 480765, "epoch": 2861} {"train_loss": -12.773602485656738, "global_step": 480766, "epoch": 2861} {"train_loss": -12.080558776855469, "global_step": 480767, "epoch": 2861} {"train_loss": -12.409538269042969, "global_step": 480768, "epoch": 2861} {"train_loss": -12.96885871887207, "global_step": 480769, "epoch": 2861} {"train_loss": -12.756939888000488, "global_step": 480770, "epoch": 2861} {"train_loss": -12.648794174194336, "global_step": 480771, "epoch": 2861} {"train_loss": -12.843437194824219, "global_step": 480772, "epoch": 2861} {"train_loss": -12.804609298706055, "global_step": 480773, "epoch": 2861} {"train_loss": -12.847189903259277, "global_step": 480774, "epoch": 2861} {"train_loss": -13.022746086120605, "global_step": 480775, "epoch": 2861} {"train_loss": -12.784807205200195, "global_step": 480776, "epoch": 2861} {"train_loss": -12.676708221435547, "global_step": 480777, "epoch": 2861} {"train_loss": -13.103948593139648, "global_step": 480778, "epoch": 2861} {"train_loss": -12.802824020385742, "global_step": 480779, "epoch": 2861} {"train_loss": -12.91370964050293, "global_step": 480780, "epoch": 2861} {"train_loss": -12.997905731201172, "global_step": 480781, "epoch": 2861} {"train_loss": -12.914936065673828, "global_step": 480782, "epoch": 2861} {"train_loss": -13.005903244018555, "global_step": 480783, "epoch": 2861} {"train_loss": -13.012290954589844, "global_step": 480784, "epoch": 2861} {"train_loss": -12.880125999450684, "global_step": 480785, "epoch": 2861} {"train_loss": -12.987152099609375, "global_step": 480786, "epoch": 2861} {"train_loss": -12.91917610168457, "global_step": 480787, "epoch": 2861} {"train_loss": -12.98379135131836, "global_step": 480788, "epoch": 2861} {"train_loss": -13.083711624145508, "global_step": 480789, "epoch": 2861} {"train_loss": -13.078710556030273, "global_step": 480790, "epoch": 2861} {"train_loss": -13.230010032653809, "global_step": 480791, "epoch": 2861} {"train_loss": -13.143917083740234, "global_step": 480792, "epoch": 2861} {"train_loss": -13.029788970947266, "global_step": 480793, "epoch": 2861} {"train_loss": -12.863057136535645, "global_step": 480794, "epoch": 2861} {"train_loss": -12.921524047851562, "global_step": 480795, "epoch": 2861} {"train_loss": -12.892210006713867, "global_step": 480796, "epoch": 2861} {"train_loss": -12.864990234375, "global_step": 480797, "epoch": 2861} {"train_loss": -13.029050827026367, "global_step": 480798, "epoch": 2861} {"train_loss": -13.097393035888672, "global_step": 480799, "epoch": 2861} {"train_loss": -12.738604545593262, "global_step": 480800, "epoch": 2861} {"train_loss": -12.979755401611328, "global_step": 480801, "epoch": 2861} {"train_loss": -13.238576889038086, "global_step": 480802, "epoch": 2861} {"train_loss": -12.84833812713623, "global_step": 480803, "epoch": 2861} {"train_loss": -12.990413665771484, "global_step": 480804, "epoch": 2861} {"train_loss": -13.259563446044922, "global_step": 480805, "epoch": 2861} {"train_loss": -12.910605430603027, "global_step": 480806, "epoch": 2861} {"train_loss": -12.95312786102295, "global_step": 480807, "epoch": 2861} {"train_loss": -12.876320838928223, "global_step": 480808, "epoch": 2861} {"train_loss": -12.885995864868164, "global_step": 480809, "epoch": 2861} {"train_loss": -12.7321195602417, "global_step": 480810, "epoch": 2861} {"train_loss": -12.978462219238281, "global_step": 480811, "epoch": 2861} {"train_loss": -12.848161697387695, "global_step": 480812, "epoch": 2861} {"train_loss": -12.30289077758789, "global_step": 480813, "epoch": 2861} {"train_loss": -11.678718566894531, "global_step": 480814, "epoch": 2861} {"train_loss": -12.349648657299223, "global_step": 480815, "epoch": 2861, "val_loss": 315673.59375} {"train_loss": -12.294731140136719, "global_step": 480816, "epoch": 2862} {"train_loss": -12.638705253601074, "global_step": 480817, "epoch": 2862} {"train_loss": -12.291397094726562, "global_step": 480818, "epoch": 2862} {"train_loss": -12.704265594482422, "global_step": 480819, "epoch": 2862} {"train_loss": -12.155806541442871, "global_step": 480820, "epoch": 2862} {"train_loss": -11.605561256408691, "global_step": 480821, "epoch": 2862} {"train_loss": -10.60928726196289, "global_step": 480822, "epoch": 2862} {"train_loss": -8.982211112976074, "global_step": 480823, "epoch": 2862} {"train_loss": -10.146771430969238, "global_step": 480824, "epoch": 2862} {"train_loss": -11.064212799072266, "global_step": 480825, "epoch": 2862} {"train_loss": -10.079710006713867, "global_step": 480826, "epoch": 2862} {"train_loss": -10.210805892944336, "global_step": 480827, "epoch": 2862} {"train_loss": -11.292035102844238, "global_step": 480828, "epoch": 2862} {"train_loss": -10.582315444946289, "global_step": 480829, "epoch": 2862} {"train_loss": -11.280536651611328, "global_step": 480830, "epoch": 2862} {"train_loss": -11.582919120788574, "global_step": 480831, "epoch": 2862} {"train_loss": -10.499979019165039, "global_step": 480832, "epoch": 2862} {"train_loss": -9.814657211303711, "global_step": 480833, "epoch": 2862} {"train_loss": -11.343218803405762, "global_step": 480834, "epoch": 2862} {"train_loss": -9.309144020080566, "global_step": 480835, "epoch": 2862} {"train_loss": -10.317903518676758, "global_step": 480836, "epoch": 2862} {"train_loss": -10.27149772644043, "global_step": 480837, "epoch": 2862} {"train_loss": -9.9657621383667, "global_step": 480838, "epoch": 2862} {"train_loss": -9.623237609863281, "global_step": 480839, "epoch": 2862} {"train_loss": -10.734975814819336, "global_step": 480840, "epoch": 2862} {"train_loss": -11.394423484802246, "global_step": 480841, "epoch": 2862} {"train_loss": -10.964762687683105, "global_step": 480842, "epoch": 2862} {"train_loss": -11.012063980102539, "global_step": 480843, "epoch": 2862} {"train_loss": -11.452966690063477, "global_step": 480844, "epoch": 2862} {"train_loss": -10.580338478088379, "global_step": 480845, "epoch": 2862} {"train_loss": -11.016459465026855, "global_step": 480846, "epoch": 2862} {"train_loss": -10.964990615844727, "global_step": 480847, "epoch": 2862} {"train_loss": -11.541556358337402, "global_step": 480848, "epoch": 2862} {"train_loss": -11.471291542053223, "global_step": 480849, "epoch": 2862} {"train_loss": -11.585012435913086, "global_step": 480850, "epoch": 2862} {"train_loss": -12.504682540893555, "global_step": 480851, "epoch": 2862} {"train_loss": -12.23475456237793, "global_step": 480852, "epoch": 2862} {"train_loss": -11.877685546875, "global_step": 480853, "epoch": 2862} {"train_loss": -11.853392601013184, "global_step": 480854, "epoch": 2862} {"train_loss": -11.890323638916016, "global_step": 480855, "epoch": 2862} {"train_loss": -12.233704566955566, "global_step": 480856, "epoch": 2862} {"train_loss": -12.148062705993652, "global_step": 480857, "epoch": 2862} {"train_loss": -12.344159126281738, "global_step": 480858, "epoch": 2862} {"train_loss": -12.055992126464844, "global_step": 480859, "epoch": 2862} {"train_loss": -11.88747501373291, "global_step": 480860, "epoch": 2862} {"train_loss": -12.11082649230957, "global_step": 480861, "epoch": 2862} {"train_loss": -12.013843536376953, "global_step": 480862, "epoch": 2862} {"train_loss": -12.304000854492188, "global_step": 480863, "epoch": 2862} {"train_loss": -11.913872718811035, "global_step": 480864, "epoch": 2862} {"train_loss": -12.343622207641602, "global_step": 480865, "epoch": 2862} {"train_loss": -12.018966674804688, "global_step": 480866, "epoch": 2862} {"train_loss": -12.793927192687988, "global_step": 480867, "epoch": 2862} {"train_loss": -12.302295684814453, "global_step": 480868, "epoch": 2862} {"train_loss": -12.568540573120117, "global_step": 480869, "epoch": 2862} {"train_loss": -12.352542877197266, "global_step": 480870, "epoch": 2862} {"train_loss": -12.262212753295898, "global_step": 480871, "epoch": 2862} {"train_loss": -12.506114959716797, "global_step": 480872, "epoch": 2862} {"train_loss": -12.317586898803711, "global_step": 480873, "epoch": 2862} {"train_loss": -12.722806930541992, "global_step": 480874, "epoch": 2862} {"train_loss": -12.423310279846191, "global_step": 480875, "epoch": 2862} {"train_loss": -12.384712219238281, "global_step": 480876, "epoch": 2862} {"train_loss": -12.383285522460938, "global_step": 480877, "epoch": 2862} {"train_loss": -12.512598037719727, "global_step": 480878, "epoch": 2862} {"train_loss": -12.541597366333008, "global_step": 480879, "epoch": 2862} {"train_loss": -12.463888168334961, "global_step": 480880, "epoch": 2862} {"train_loss": -12.643253326416016, "global_step": 480881, "epoch": 2862} {"train_loss": -12.580867767333984, "global_step": 480882, "epoch": 2862} {"train_loss": -12.79395580291748, "global_step": 480883, "epoch": 2862} {"train_loss": -12.482590675354004, "global_step": 480884, "epoch": 2862} {"train_loss": -12.63958740234375, "global_step": 480885, "epoch": 2862} {"train_loss": -12.614030838012695, "global_step": 480886, "epoch": 2862} {"train_loss": -12.611066818237305, "global_step": 480887, "epoch": 2862} {"train_loss": -12.646562576293945, "global_step": 480888, "epoch": 2862} {"train_loss": -12.680904388427734, "global_step": 480889, "epoch": 2862} {"train_loss": -12.603072166442871, "global_step": 480890, "epoch": 2862} {"train_loss": -12.562829971313477, "global_step": 480891, "epoch": 2862} {"train_loss": -12.353492736816406, "global_step": 480892, "epoch": 2862} {"train_loss": -12.641271591186523, "global_step": 480893, "epoch": 2862} {"train_loss": -12.712701797485352, "global_step": 480894, "epoch": 2862} {"train_loss": -12.370490074157715, "global_step": 480895, "epoch": 2862} {"train_loss": -12.849027633666992, "global_step": 480896, "epoch": 2862} {"train_loss": -12.770276069641113, "global_step": 480897, "epoch": 2862} {"train_loss": -12.373570442199707, "global_step": 480898, "epoch": 2862} {"train_loss": -12.656627655029297, "global_step": 480899, "epoch": 2862} {"train_loss": -12.846222877502441, "global_step": 480900, "epoch": 2862} {"train_loss": -12.385730743408203, "global_step": 480901, "epoch": 2862} {"train_loss": -12.509689331054688, "global_step": 480902, "epoch": 2862} {"train_loss": -12.354782104492188, "global_step": 480903, "epoch": 2862} {"train_loss": -12.378217697143555, "global_step": 480904, "epoch": 2862} {"train_loss": -11.976493835449219, "global_step": 480905, "epoch": 2862} {"train_loss": -12.744848251342773, "global_step": 480906, "epoch": 2862} {"train_loss": -11.7008056640625, "global_step": 480907, "epoch": 2862} {"train_loss": -11.896564483642578, "global_step": 480908, "epoch": 2862} {"train_loss": -11.969350814819336, "global_step": 480909, "epoch": 2862} {"train_loss": -11.52686882019043, "global_step": 480910, "epoch": 2862} {"train_loss": -12.834199905395508, "global_step": 480911, "epoch": 2862} {"train_loss": -11.479881286621094, "global_step": 480912, "epoch": 2862} {"train_loss": -12.503767013549805, "global_step": 480913, "epoch": 2862} {"train_loss": -12.600045204162598, "global_step": 480914, "epoch": 2862} {"train_loss": -11.545938491821289, "global_step": 480915, "epoch": 2862} {"train_loss": -12.291448593139648, "global_step": 480916, "epoch": 2862} {"train_loss": -11.740086555480957, "global_step": 480917, "epoch": 2862} {"train_loss": -11.16457748413086, "global_step": 480918, "epoch": 2862} {"train_loss": -11.780557632446289, "global_step": 480919, "epoch": 2862} {"train_loss": -12.686439514160156, "global_step": 480920, "epoch": 2862} {"train_loss": -11.527158737182617, "global_step": 480921, "epoch": 2862} {"train_loss": -12.324633598327637, "global_step": 480922, "epoch": 2862} {"train_loss": -11.992263793945312, "global_step": 480923, "epoch": 2862} {"train_loss": -11.260536193847656, "global_step": 480924, "epoch": 2862} {"train_loss": -12.644625663757324, "global_step": 480925, "epoch": 2862} {"train_loss": -11.99548053741455, "global_step": 480926, "epoch": 2862} {"train_loss": -12.166131973266602, "global_step": 480927, "epoch": 2862} {"train_loss": -12.558683395385742, "global_step": 480928, "epoch": 2862} {"train_loss": -11.915225982666016, "global_step": 480929, "epoch": 2862} {"train_loss": -12.418201446533203, "global_step": 480930, "epoch": 2862} {"train_loss": -11.914012908935547, "global_step": 480931, "epoch": 2862} {"train_loss": -11.221067428588867, "global_step": 480932, "epoch": 2862} {"train_loss": -12.399415969848633, "global_step": 480933, "epoch": 2862} {"train_loss": -11.456308364868164, "global_step": 480934, "epoch": 2862} {"train_loss": -12.206195831298828, "global_step": 480935, "epoch": 2862} {"train_loss": -12.469071388244629, "global_step": 480936, "epoch": 2862} {"train_loss": -11.896639823913574, "global_step": 480937, "epoch": 2862} {"train_loss": -12.240034103393555, "global_step": 480938, "epoch": 2862} {"train_loss": -12.027307510375977, "global_step": 480939, "epoch": 2862} {"train_loss": -11.956562042236328, "global_step": 480940, "epoch": 2862} {"train_loss": -12.458442687988281, "global_step": 480941, "epoch": 2862} {"train_loss": -11.532403945922852, "global_step": 480942, "epoch": 2862} {"train_loss": -12.475208282470703, "global_step": 480943, "epoch": 2862} {"train_loss": -12.079684257507324, "global_step": 480944, "epoch": 2862} {"train_loss": -12.554085731506348, "global_step": 480945, "epoch": 2862} {"train_loss": -12.746444702148438, "global_step": 480946, "epoch": 2862} {"train_loss": -12.198729515075684, "global_step": 480947, "epoch": 2862} {"train_loss": -12.705223083496094, "global_step": 480948, "epoch": 2862} {"train_loss": -11.931870460510254, "global_step": 480949, "epoch": 2862} {"train_loss": -12.475525856018066, "global_step": 480950, "epoch": 2862} {"train_loss": -12.51613998413086, "global_step": 480951, "epoch": 2862} {"train_loss": -12.262263298034668, "global_step": 480952, "epoch": 2862} {"train_loss": -12.331510543823242, "global_step": 480953, "epoch": 2862} {"train_loss": -12.140607833862305, "global_step": 480954, "epoch": 2862} {"train_loss": -12.259025573730469, "global_step": 480955, "epoch": 2862} {"train_loss": -12.361710548400879, "global_step": 480956, "epoch": 2862} {"train_loss": -12.445966720581055, "global_step": 480957, "epoch": 2862} {"train_loss": -12.71735668182373, "global_step": 480958, "epoch": 2862} {"train_loss": -11.987785339355469, "global_step": 480959, "epoch": 2862} {"train_loss": -12.088676452636719, "global_step": 480960, "epoch": 2862} {"train_loss": -12.54930305480957, "global_step": 480961, "epoch": 2862} {"train_loss": -12.493693351745605, "global_step": 480962, "epoch": 2862} {"train_loss": -12.533981323242188, "global_step": 480963, "epoch": 2862} {"train_loss": -12.601160049438477, "global_step": 480964, "epoch": 2862} {"train_loss": -12.227351188659668, "global_step": 480965, "epoch": 2862} {"train_loss": -12.797843933105469, "global_step": 480966, "epoch": 2862} {"train_loss": -12.617020606994629, "global_step": 480967, "epoch": 2862} {"train_loss": -12.908324241638184, "global_step": 480968, "epoch": 2862} {"train_loss": -12.544118881225586, "global_step": 480969, "epoch": 2862} {"train_loss": -12.610289573669434, "global_step": 480970, "epoch": 2862} {"train_loss": -12.76091194152832, "global_step": 480971, "epoch": 2862} {"train_loss": -12.717575073242188, "global_step": 480972, "epoch": 2862} {"train_loss": -12.511741638183594, "global_step": 480973, "epoch": 2862} {"train_loss": -12.646495819091797, "global_step": 480974, "epoch": 2862} {"train_loss": -12.714898109436035, "global_step": 480975, "epoch": 2862} {"train_loss": -12.69945240020752, "global_step": 480976, "epoch": 2862} {"train_loss": -12.878905296325684, "global_step": 480977, "epoch": 2862} {"train_loss": -12.393537521362305, "global_step": 480978, "epoch": 2862} {"train_loss": -12.81658935546875, "global_step": 480979, "epoch": 2862} {"train_loss": -12.452642440795898, "global_step": 480980, "epoch": 2862} {"train_loss": -12.70184326171875, "global_step": 480981, "epoch": 2862} {"train_loss": -12.798382759094238, "global_step": 480982, "epoch": 2862} {"train_loss": -12.044538219769796, "global_step": 480983, "epoch": 2862, "val_loss": 312200.375} {"train_loss": -12.673047065734863, "global_step": 480984, "epoch": 2863} {"train_loss": -12.252824783325195, "global_step": 480985, "epoch": 2863} {"train_loss": -12.586823463439941, "global_step": 480986, "epoch": 2863} {"train_loss": -12.32300853729248, "global_step": 480987, "epoch": 2863} {"train_loss": -12.481221199035645, "global_step": 480988, "epoch": 2863} {"train_loss": -12.667778968811035, "global_step": 480989, "epoch": 2863} {"train_loss": -12.623050689697266, "global_step": 480990, "epoch": 2863} {"train_loss": -12.393701553344727, "global_step": 480991, "epoch": 2863} {"train_loss": -12.620706558227539, "global_step": 480992, "epoch": 2863} {"train_loss": -12.506141662597656, "global_step": 480993, "epoch": 2863} {"train_loss": -12.710596084594727, "global_step": 480994, "epoch": 2863} {"train_loss": -12.278358459472656, "global_step": 480995, "epoch": 2863} {"train_loss": -12.802498817443848, "global_step": 480996, "epoch": 2863} {"train_loss": -12.344465255737305, "global_step": 480997, "epoch": 2863} {"train_loss": -12.787092208862305, "global_step": 480998, "epoch": 2863} {"train_loss": -12.802386283874512, "global_step": 480999, "epoch": 2863} {"train_loss": -12.816091537475586, "global_step": 481000, "epoch": 2863} {"train_loss": -12.746312141418457, "global_step": 481001, "epoch": 2863} {"train_loss": -12.478221893310547, "global_step": 481002, "epoch": 2863} {"train_loss": -12.797735214233398, "global_step": 481003, "epoch": 2863} {"train_loss": -12.95196533203125, "global_step": 481004, "epoch": 2863} {"train_loss": -13.01739501953125, "global_step": 481005, "epoch": 2863} {"train_loss": -12.82748031616211, "global_step": 481006, "epoch": 2863} {"train_loss": -12.837644577026367, "global_step": 481007, "epoch": 2863} {"train_loss": -12.835046768188477, "global_step": 481008, "epoch": 2863} {"train_loss": -12.946733474731445, "global_step": 481009, "epoch": 2863} {"train_loss": -12.896078109741211, "global_step": 481010, "epoch": 2863} {"train_loss": -13.090917587280273, "global_step": 481011, "epoch": 2863} {"train_loss": -12.893550872802734, "global_step": 481012, "epoch": 2863} {"train_loss": -12.880758285522461, "global_step": 481013, "epoch": 2863} {"train_loss": -12.978363037109375, "global_step": 481014, "epoch": 2863} {"train_loss": -12.893144607543945, "global_step": 481015, "epoch": 2863} {"train_loss": -12.815183639526367, "global_step": 481016, "epoch": 2863} {"train_loss": -12.983903884887695, "global_step": 481017, "epoch": 2863} {"train_loss": -12.663395881652832, "global_step": 481018, "epoch": 2863} {"train_loss": -12.908184051513672, "global_step": 481019, "epoch": 2863} {"train_loss": -12.741422653198242, "global_step": 481020, "epoch": 2863} {"train_loss": -12.784831047058105, "global_step": 481021, "epoch": 2863} {"train_loss": -12.976306915283203, "global_step": 481022, "epoch": 2863} {"train_loss": -12.903997421264648, "global_step": 481023, "epoch": 2863} {"train_loss": -12.669633865356445, "global_step": 481024, "epoch": 2863} {"train_loss": -13.007661819458008, "global_step": 481025, "epoch": 2863} {"train_loss": -12.7693510055542, "global_step": 481026, "epoch": 2863} {"train_loss": -12.834550857543945, "global_step": 481027, "epoch": 2863} {"train_loss": -12.436897277832031, "global_step": 481028, "epoch": 2863} {"train_loss": -12.667562484741211, "global_step": 481029, "epoch": 2863} {"train_loss": -12.604143142700195, "global_step": 481030, "epoch": 2863} {"train_loss": -12.662002563476562, "global_step": 481031, "epoch": 2863} {"train_loss": -12.257743835449219, "global_step": 481032, "epoch": 2863} {"train_loss": -11.911989212036133, "global_step": 481033, "epoch": 2863} {"train_loss": -12.452239036560059, "global_step": 481034, "epoch": 2863} {"train_loss": -12.23935317993164, "global_step": 481035, "epoch": 2863} {"train_loss": -11.770914077758789, "global_step": 481036, "epoch": 2863} {"train_loss": -12.91373348236084, "global_step": 481037, "epoch": 2863} {"train_loss": -12.118532180786133, "global_step": 481038, "epoch": 2863} {"train_loss": -12.650506973266602, "global_step": 481039, "epoch": 2863} {"train_loss": -12.669018745422363, "global_step": 481040, "epoch": 2863} {"train_loss": -13.175922393798828, "global_step": 481041, "epoch": 2863} {"train_loss": -12.596468925476074, "global_step": 481042, "epoch": 2863} {"train_loss": -12.590836524963379, "global_step": 481043, "epoch": 2863} {"train_loss": -12.724824905395508, "global_step": 481044, "epoch": 2863} {"train_loss": -12.203631401062012, "global_step": 481045, "epoch": 2863} {"train_loss": -12.110330581665039, "global_step": 481046, "epoch": 2863} {"train_loss": -12.181587219238281, "global_step": 481047, "epoch": 2863} {"train_loss": -12.485889434814453, "global_step": 481048, "epoch": 2863} {"train_loss": -11.734017372131348, "global_step": 481049, "epoch": 2863} {"train_loss": -11.401755332946777, "global_step": 481050, "epoch": 2863} {"train_loss": -12.175429344177246, "global_step": 481051, "epoch": 2863} {"train_loss": -11.738195419311523, "global_step": 481052, "epoch": 2863} {"train_loss": -10.853584289550781, "global_step": 481053, "epoch": 2863} {"train_loss": -10.624141693115234, "global_step": 481054, "epoch": 2863} {"train_loss": -10.118730545043945, "global_step": 481055, "epoch": 2863} {"train_loss": -11.278036117553711, "global_step": 481056, "epoch": 2863} {"train_loss": -10.467927932739258, "global_step": 481057, "epoch": 2863} {"train_loss": -9.695054054260254, "global_step": 481058, "epoch": 2863} {"train_loss": -10.356891632080078, "global_step": 481059, "epoch": 2863} {"train_loss": -9.797357559204102, "global_step": 481060, "epoch": 2863} {"train_loss": -9.588689804077148, "global_step": 481061, "epoch": 2863} {"train_loss": -8.591882705688477, "global_step": 481062, "epoch": 2863} {"train_loss": -9.776726722717285, "global_step": 481063, "epoch": 2863} {"train_loss": -10.556657791137695, "global_step": 481064, "epoch": 2863} {"train_loss": -8.671866416931152, "global_step": 481065, "epoch": 2863} {"train_loss": -8.78764820098877, "global_step": 481066, "epoch": 2863} {"train_loss": -9.755731582641602, "global_step": 481067, "epoch": 2863} {"train_loss": -10.781441688537598, "global_step": 481068, "epoch": 2863} {"train_loss": -10.111273765563965, "global_step": 481069, "epoch": 2863} {"train_loss": -11.226051330566406, "global_step": 481070, "epoch": 2863} {"train_loss": -10.700335502624512, "global_step": 481071, "epoch": 2863} {"train_loss": -11.417095184326172, "global_step": 481072, "epoch": 2863} {"train_loss": -10.7305908203125, "global_step": 481073, "epoch": 2863} {"train_loss": -11.369763374328613, "global_step": 481074, "epoch": 2863} {"train_loss": -11.316407203674316, "global_step": 481075, "epoch": 2863} {"train_loss": -11.454341888427734, "global_step": 481076, "epoch": 2863} {"train_loss": -12.451936721801758, "global_step": 481077, "epoch": 2863} {"train_loss": -11.787193298339844, "global_step": 481078, "epoch": 2863} {"train_loss": -12.052225112915039, "global_step": 481079, "epoch": 2863} {"train_loss": -12.095322608947754, "global_step": 481080, "epoch": 2863} {"train_loss": -11.898578643798828, "global_step": 481081, "epoch": 2863} {"train_loss": -11.828712463378906, "global_step": 481082, "epoch": 2863} {"train_loss": -12.340862274169922, "global_step": 481083, "epoch": 2863} {"train_loss": -12.377182960510254, "global_step": 481084, "epoch": 2863} {"train_loss": -12.232175827026367, "global_step": 481085, "epoch": 2863} {"train_loss": -12.23283576965332, "global_step": 481086, "epoch": 2863} {"train_loss": -12.2313232421875, "global_step": 481087, "epoch": 2863} {"train_loss": -12.665206909179688, "global_step": 481088, "epoch": 2863} {"train_loss": -12.513263702392578, "global_step": 481089, "epoch": 2863} {"train_loss": -12.606091499328613, "global_step": 481090, "epoch": 2863} {"train_loss": -12.594045639038086, "global_step": 481091, "epoch": 2863} {"train_loss": -12.661088943481445, "global_step": 481092, "epoch": 2863} {"train_loss": -12.61789321899414, "global_step": 481093, "epoch": 2863} {"train_loss": -12.259554862976074, "global_step": 481094, "epoch": 2863} {"train_loss": -12.540124893188477, "global_step": 481095, "epoch": 2863} {"train_loss": -12.394651412963867, "global_step": 481096, "epoch": 2863} {"train_loss": -12.451643943786621, "global_step": 481097, "epoch": 2863} {"train_loss": -12.539177894592285, "global_step": 481098, "epoch": 2863} {"train_loss": -12.391170501708984, "global_step": 481099, "epoch": 2863} {"train_loss": -12.64463996887207, "global_step": 481100, "epoch": 2863} {"train_loss": -12.413508415222168, "global_step": 481101, "epoch": 2863} {"train_loss": -12.715065956115723, "global_step": 481102, "epoch": 2863} {"train_loss": -12.326089859008789, "global_step": 481103, "epoch": 2863} {"train_loss": -12.688483238220215, "global_step": 481104, "epoch": 2863} {"train_loss": -12.55134105682373, "global_step": 481105, "epoch": 2863} {"train_loss": -12.651065826416016, "global_step": 481106, "epoch": 2863} {"train_loss": -12.741659164428711, "global_step": 481107, "epoch": 2863} {"train_loss": -12.660789489746094, "global_step": 481108, "epoch": 2863} {"train_loss": -12.815898895263672, "global_step": 481109, "epoch": 2863} {"train_loss": -12.375778198242188, "global_step": 481110, "epoch": 2863} {"train_loss": -12.8296480178833, "global_step": 481111, "epoch": 2863} {"train_loss": -12.769401550292969, "global_step": 481112, "epoch": 2863} {"train_loss": -12.676986694335938, "global_step": 481113, "epoch": 2863} {"train_loss": -12.396984100341797, "global_step": 481114, "epoch": 2863} {"train_loss": -12.710254669189453, "global_step": 481115, "epoch": 2863} {"train_loss": -12.562149047851562, "global_step": 481116, "epoch": 2863} {"train_loss": -12.596664428710938, "global_step": 481117, "epoch": 2863} {"train_loss": -12.18106460571289, "global_step": 481118, "epoch": 2863} {"train_loss": -12.708354949951172, "global_step": 481119, "epoch": 2863} {"train_loss": -12.47144889831543, "global_step": 481120, "epoch": 2863} {"train_loss": -12.625750541687012, "global_step": 481121, "epoch": 2863} {"train_loss": -12.378253936767578, "global_step": 481122, "epoch": 2863} {"train_loss": -11.713089942932129, "global_step": 481123, "epoch": 2863} {"train_loss": -11.937873840332031, "global_step": 481124, "epoch": 2863} {"train_loss": -12.178183555603027, "global_step": 481125, "epoch": 2863} {"train_loss": -12.517263412475586, "global_step": 481126, "epoch": 2863} {"train_loss": -12.366806030273438, "global_step": 481127, "epoch": 2863} {"train_loss": -12.55893611907959, "global_step": 481128, "epoch": 2863} {"train_loss": -11.449370384216309, "global_step": 481129, "epoch": 2863} {"train_loss": -12.760818481445312, "global_step": 481130, "epoch": 2863} {"train_loss": -12.425503730773926, "global_step": 481131, "epoch": 2863} {"train_loss": -12.332598686218262, "global_step": 481132, "epoch": 2863} {"train_loss": -12.442072868347168, "global_step": 481133, "epoch": 2863} {"train_loss": -11.505433082580566, "global_step": 481134, "epoch": 2863} {"train_loss": -11.560100555419922, "global_step": 481135, "epoch": 2863} {"train_loss": -12.252494812011719, "global_step": 481136, "epoch": 2863} {"train_loss": -9.569652557373047, "global_step": 481137, "epoch": 2863} {"train_loss": -10.973730087280273, "global_step": 481138, "epoch": 2863} {"train_loss": -11.63118839263916, "global_step": 481139, "epoch": 2863} {"train_loss": -11.135709762573242, "global_step": 481140, "epoch": 2863} {"train_loss": -11.152497291564941, "global_step": 481141, "epoch": 2863} {"train_loss": -10.2279052734375, "global_step": 481142, "epoch": 2863} {"train_loss": -10.764890670776367, "global_step": 481143, "epoch": 2863} {"train_loss": -9.365975379943848, "global_step": 481144, "epoch": 2863} {"train_loss": -12.010699272155762, "global_step": 481145, "epoch": 2863} {"train_loss": -10.350244522094727, "global_step": 481146, "epoch": 2863} {"train_loss": -10.182596206665039, "global_step": 481147, "epoch": 2863} {"train_loss": -9.603797912597656, "global_step": 481148, "epoch": 2863} {"train_loss": -11.371573448181152, "global_step": 481149, "epoch": 2863} {"train_loss": -10.844478607177734, "global_step": 481150, "epoch": 2863} {"train_loss": -12.02675169422513, "global_step": 481151, "epoch": 2863, "val_loss": 316092.625} {"train_loss": -11.445030212402344, "global_step": 481152, "epoch": 2864} {"train_loss": -10.570520401000977, "global_step": 481153, "epoch": 2864} {"train_loss": -11.725996971130371, "global_step": 481154, "epoch": 2864} {"train_loss": -11.064897537231445, "global_step": 481155, "epoch": 2864} {"train_loss": -11.849103927612305, "global_step": 481156, "epoch": 2864} {"train_loss": -10.03122615814209, "global_step": 481157, "epoch": 2864} {"train_loss": -11.745528221130371, "global_step": 481158, "epoch": 2864} {"train_loss": -10.9307861328125, "global_step": 481159, "epoch": 2864} {"train_loss": -11.746219635009766, "global_step": 481160, "epoch": 2864} {"train_loss": -11.135599136352539, "global_step": 481161, "epoch": 2864} {"train_loss": -11.815381050109863, "global_step": 481162, "epoch": 2864} {"train_loss": -10.730792999267578, "global_step": 481163, "epoch": 2864} {"train_loss": -12.079639434814453, "global_step": 481164, "epoch": 2864} {"train_loss": -11.012908935546875, "global_step": 481165, "epoch": 2864} {"train_loss": -11.803398132324219, "global_step": 481166, "epoch": 2864} {"train_loss": -11.830069541931152, "global_step": 481167, "epoch": 2864} {"train_loss": -11.773711204528809, "global_step": 481168, "epoch": 2864} {"train_loss": -11.835205078125, "global_step": 481169, "epoch": 2864} {"train_loss": -11.653345108032227, "global_step": 481170, "epoch": 2864} {"train_loss": -12.029770851135254, "global_step": 481171, "epoch": 2864} {"train_loss": -11.700294494628906, "global_step": 481172, "epoch": 2864} {"train_loss": -12.396747589111328, "global_step": 481173, "epoch": 2864} {"train_loss": -12.049596786499023, "global_step": 481174, "epoch": 2864} {"train_loss": -12.021625518798828, "global_step": 481175, "epoch": 2864} {"train_loss": -12.129450798034668, "global_step": 481176, "epoch": 2864} {"train_loss": -12.201959609985352, "global_step": 481177, "epoch": 2864} {"train_loss": -12.449695587158203, "global_step": 481178, "epoch": 2864} {"train_loss": -12.320152282714844, "global_step": 481179, "epoch": 2864} {"train_loss": -12.236327171325684, "global_step": 481180, "epoch": 2864} {"train_loss": -12.370214462280273, "global_step": 481181, "epoch": 2864} {"train_loss": -12.434669494628906, "global_step": 481182, "epoch": 2864} {"train_loss": -12.366104125976562, "global_step": 481183, "epoch": 2864} {"train_loss": -12.475225448608398, "global_step": 481184, "epoch": 2864} {"train_loss": -12.14859390258789, "global_step": 481185, "epoch": 2864} {"train_loss": -12.27566146850586, "global_step": 481186, "epoch": 2864} {"train_loss": -12.445547103881836, "global_step": 481187, "epoch": 2864} {"train_loss": -12.552001953125, "global_step": 481188, "epoch": 2864} {"train_loss": -12.41429328918457, "global_step": 481189, "epoch": 2864} {"train_loss": -12.170411109924316, "global_step": 481190, "epoch": 2864} {"train_loss": -12.311983108520508, "global_step": 481191, "epoch": 2864} {"train_loss": -12.39052963256836, "global_step": 481192, "epoch": 2864} {"train_loss": -12.510599136352539, "global_step": 481193, "epoch": 2864} {"train_loss": -12.275038719177246, "global_step": 481194, "epoch": 2864} {"train_loss": -12.360730171203613, "global_step": 481195, "epoch": 2864} {"train_loss": -12.117438316345215, "global_step": 481196, "epoch": 2864} {"train_loss": -12.639387130737305, "global_step": 481197, "epoch": 2864} {"train_loss": -12.03657341003418, "global_step": 481198, "epoch": 2864} {"train_loss": -12.729816436767578, "global_step": 481199, "epoch": 2864} {"train_loss": -11.782005310058594, "global_step": 481200, "epoch": 2864} {"train_loss": -12.531033515930176, "global_step": 481201, "epoch": 2864} {"train_loss": -12.208059310913086, "global_step": 481202, "epoch": 2864} {"train_loss": -12.644611358642578, "global_step": 481203, "epoch": 2864} {"train_loss": -12.424123764038086, "global_step": 481204, "epoch": 2864} {"train_loss": -12.508600234985352, "global_step": 481205, "epoch": 2864} {"train_loss": -12.625032424926758, "global_step": 481206, "epoch": 2864} {"train_loss": -12.511106491088867, "global_step": 481207, "epoch": 2864} {"train_loss": -12.780699729919434, "global_step": 481208, "epoch": 2864} {"train_loss": -12.580122947692871, "global_step": 481209, "epoch": 2864} {"train_loss": -12.817214012145996, "global_step": 481210, "epoch": 2864} {"train_loss": -12.278657913208008, "global_step": 481211, "epoch": 2864} {"train_loss": -12.654045104980469, "global_step": 481212, "epoch": 2864} {"train_loss": -12.725973129272461, "global_step": 481213, "epoch": 2864} {"train_loss": -12.697744369506836, "global_step": 481214, "epoch": 2864} {"train_loss": -12.56425666809082, "global_step": 481215, "epoch": 2864} {"train_loss": -12.4447021484375, "global_step": 481216, "epoch": 2864} {"train_loss": -12.305875778198242, "global_step": 481217, "epoch": 2864} {"train_loss": -12.499348640441895, "global_step": 481218, "epoch": 2864} {"train_loss": -12.608743667602539, "global_step": 481219, "epoch": 2864} {"train_loss": -12.374471664428711, "global_step": 481220, "epoch": 2864} {"train_loss": -12.698100090026855, "global_step": 481221, "epoch": 2864} {"train_loss": -12.625310897827148, "global_step": 481222, "epoch": 2864} {"train_loss": -12.646096229553223, "global_step": 481223, "epoch": 2864} {"train_loss": -12.712366104125977, "global_step": 481224, "epoch": 2864} {"train_loss": -12.305803298950195, "global_step": 481225, "epoch": 2864} {"train_loss": -12.589536666870117, "global_step": 481226, "epoch": 2864} {"train_loss": -12.513964653015137, "global_step": 481227, "epoch": 2864} {"train_loss": -12.857595443725586, "global_step": 481228, "epoch": 2864} {"train_loss": -12.42156982421875, "global_step": 481229, "epoch": 2864} {"train_loss": -12.76812744140625, "global_step": 481230, "epoch": 2864} {"train_loss": -12.770771026611328, "global_step": 481231, "epoch": 2864} {"train_loss": -12.688468933105469, "global_step": 481232, "epoch": 2864} {"train_loss": -12.65762996673584, "global_step": 481233, "epoch": 2864} {"train_loss": -12.614195823669434, "global_step": 481234, "epoch": 2864} {"train_loss": -12.529685020446777, "global_step": 481235, "epoch": 2864} {"train_loss": -12.64756965637207, "global_step": 481236, "epoch": 2864} {"train_loss": -12.442121505737305, "global_step": 481237, "epoch": 2864} {"train_loss": -12.650601387023926, "global_step": 481238, "epoch": 2864} {"train_loss": -12.366191864013672, "global_step": 481239, "epoch": 2864} {"train_loss": -11.682887077331543, "global_step": 481240, "epoch": 2864} {"train_loss": -12.559768676757812, "global_step": 481241, "epoch": 2864} {"train_loss": -12.671835899353027, "global_step": 481242, "epoch": 2864} {"train_loss": -12.506450653076172, "global_step": 481243, "epoch": 2864} {"train_loss": -12.907629013061523, "global_step": 481244, "epoch": 2864} {"train_loss": -12.449905395507812, "global_step": 481245, "epoch": 2864} {"train_loss": -12.834137916564941, "global_step": 481246, "epoch": 2864} {"train_loss": -12.403425216674805, "global_step": 481247, "epoch": 2864} {"train_loss": -12.36412239074707, "global_step": 481248, "epoch": 2864} {"train_loss": -12.801176071166992, "global_step": 481249, "epoch": 2864} {"train_loss": -12.428689956665039, "global_step": 481250, "epoch": 2864} {"train_loss": -12.277411460876465, "global_step": 481251, "epoch": 2864} {"train_loss": -12.74909496307373, "global_step": 481252, "epoch": 2864} {"train_loss": -12.89880084991455, "global_step": 481253, "epoch": 2864} {"train_loss": -12.478655815124512, "global_step": 481254, "epoch": 2864} {"train_loss": -12.721256256103516, "global_step": 481255, "epoch": 2864} {"train_loss": -12.597400665283203, "global_step": 481256, "epoch": 2864} {"train_loss": -12.55302906036377, "global_step": 481257, "epoch": 2864} {"train_loss": -12.65963363647461, "global_step": 481258, "epoch": 2864} {"train_loss": -12.834061622619629, "global_step": 481259, "epoch": 2864} {"train_loss": -12.40888500213623, "global_step": 481260, "epoch": 2864} {"train_loss": -12.677616119384766, "global_step": 481261, "epoch": 2864} {"train_loss": -12.10418701171875, "global_step": 481262, "epoch": 2864} {"train_loss": -12.662275314331055, "global_step": 481263, "epoch": 2864} {"train_loss": -12.459378242492676, "global_step": 481264, "epoch": 2864} {"train_loss": -12.64354133605957, "global_step": 481265, "epoch": 2864} {"train_loss": -12.64969253540039, "global_step": 481266, "epoch": 2864} {"train_loss": -12.495611190795898, "global_step": 481267, "epoch": 2864} {"train_loss": -12.03593921661377, "global_step": 481268, "epoch": 2864} {"train_loss": -12.93721866607666, "global_step": 481269, "epoch": 2864} {"train_loss": -11.979949951171875, "global_step": 481270, "epoch": 2864} {"train_loss": -12.703686714172363, "global_step": 481271, "epoch": 2864} {"train_loss": -12.568319320678711, "global_step": 481272, "epoch": 2864} {"train_loss": -12.927263259887695, "global_step": 481273, "epoch": 2864} {"train_loss": -12.7115478515625, "global_step": 481274, "epoch": 2864} {"train_loss": -12.642606735229492, "global_step": 481275, "epoch": 2864} {"train_loss": -12.749130249023438, "global_step": 481276, "epoch": 2864} {"train_loss": -12.521528244018555, "global_step": 481277, "epoch": 2864} {"train_loss": -12.709632873535156, "global_step": 481278, "epoch": 2864} {"train_loss": -12.333620071411133, "global_step": 481279, "epoch": 2864} {"train_loss": -12.573678970336914, "global_step": 481280, "epoch": 2864} {"train_loss": -12.794503211975098, "global_step": 481281, "epoch": 2864} {"train_loss": -12.443835258483887, "global_step": 481282, "epoch": 2864} {"train_loss": -12.678897857666016, "global_step": 481283, "epoch": 2864} {"train_loss": -12.801069259643555, "global_step": 481284, "epoch": 2864} {"train_loss": -12.655047416687012, "global_step": 481285, "epoch": 2864} {"train_loss": -12.557857513427734, "global_step": 481286, "epoch": 2864} {"train_loss": -12.899609565734863, "global_step": 481287, "epoch": 2864} {"train_loss": -12.849296569824219, "global_step": 481288, "epoch": 2864} {"train_loss": -13.047478675842285, "global_step": 481289, "epoch": 2864} {"train_loss": -12.685113906860352, "global_step": 481290, "epoch": 2864} {"train_loss": -12.82471752166748, "global_step": 481291, "epoch": 2864} {"train_loss": -12.799445152282715, "global_step": 481292, "epoch": 2864} {"train_loss": -12.921720504760742, "global_step": 481293, "epoch": 2864} {"train_loss": -12.763626098632812, "global_step": 481294, "epoch": 2864} {"train_loss": -12.606200218200684, "global_step": 481295, "epoch": 2864} {"train_loss": -12.852073669433594, "global_step": 481296, "epoch": 2864} {"train_loss": -12.761312484741211, "global_step": 481297, "epoch": 2864} {"train_loss": -12.545740127563477, "global_step": 481298, "epoch": 2864} {"train_loss": -12.600872039794922, "global_step": 481299, "epoch": 2864} {"train_loss": -12.741374969482422, "global_step": 481300, "epoch": 2864} {"train_loss": -12.594295501708984, "global_step": 481301, "epoch": 2864} {"train_loss": -12.27549934387207, "global_step": 481302, "epoch": 2864} {"train_loss": -11.553586959838867, "global_step": 481303, "epoch": 2864} {"train_loss": -12.191699028015137, "global_step": 481304, "epoch": 2864} {"train_loss": -11.210992813110352, "global_step": 481305, "epoch": 2864} {"train_loss": -11.649271011352539, "global_step": 481306, "epoch": 2864} {"train_loss": -10.917630195617676, "global_step": 481307, "epoch": 2864} {"train_loss": -10.700579643249512, "global_step": 481308, "epoch": 2864} {"train_loss": -12.142998695373535, "global_step": 481309, "epoch": 2864} {"train_loss": -10.694522857666016, "global_step": 481310, "epoch": 2864} {"train_loss": -9.623634338378906, "global_step": 481311, "epoch": 2864} {"train_loss": -11.359274864196777, "global_step": 481312, "epoch": 2864} {"train_loss": -11.620969772338867, "global_step": 481313, "epoch": 2864} {"train_loss": -10.114092826843262, "global_step": 481314, "epoch": 2864} {"train_loss": -10.599048614501953, "global_step": 481315, "epoch": 2864} {"train_loss": -10.917871475219727, "global_step": 481316, "epoch": 2864} {"train_loss": -11.243974685668945, "global_step": 481317, "epoch": 2864} {"train_loss": -10.631237030029297, "global_step": 481318, "epoch": 2864} {"train_loss": -12.250245037532988, "global_step": 481319, "epoch": 2864, "val_loss": 312342.09375} {"train_loss": -11.213066101074219, "global_step": 481320, "epoch": 2865} {"train_loss": -11.002297401428223, "global_step": 481321, "epoch": 2865} {"train_loss": -11.004063606262207, "global_step": 481322, "epoch": 2865} {"train_loss": -10.620458602905273, "global_step": 481323, "epoch": 2865} {"train_loss": -10.393320083618164, "global_step": 481324, "epoch": 2865} {"train_loss": -10.55966567993164, "global_step": 481325, "epoch": 2865} {"train_loss": -10.805919647216797, "global_step": 481326, "epoch": 2865} {"train_loss": -10.06729793548584, "global_step": 481327, "epoch": 2865} {"train_loss": -11.548892974853516, "global_step": 481328, "epoch": 2865} {"train_loss": -10.42387580871582, "global_step": 481329, "epoch": 2865} {"train_loss": -10.982332229614258, "global_step": 481330, "epoch": 2865} {"train_loss": -11.27778148651123, "global_step": 481331, "epoch": 2865} {"train_loss": -10.286970138549805, "global_step": 481332, "epoch": 2865} {"train_loss": -10.632158279418945, "global_step": 481333, "epoch": 2865} {"train_loss": -10.703108787536621, "global_step": 481334, "epoch": 2865} {"train_loss": -10.831308364868164, "global_step": 481335, "epoch": 2865} {"train_loss": -11.577999114990234, "global_step": 481336, "epoch": 2865} {"train_loss": -11.322530746459961, "global_step": 481337, "epoch": 2865} {"train_loss": -11.496434211730957, "global_step": 481338, "epoch": 2865} {"train_loss": -12.242551803588867, "global_step": 481339, "epoch": 2865} {"train_loss": -11.76675033569336, "global_step": 481340, "epoch": 2865} {"train_loss": -12.102359771728516, "global_step": 481341, "epoch": 2865} {"train_loss": -11.82225227355957, "global_step": 481342, "epoch": 2865} {"train_loss": -11.999322891235352, "global_step": 481343, "epoch": 2865} {"train_loss": -11.564346313476562, "global_step": 481344, "epoch": 2865} {"train_loss": -12.27704906463623, "global_step": 481345, "epoch": 2865} {"train_loss": -11.648895263671875, "global_step": 481346, "epoch": 2865} {"train_loss": -12.262582778930664, "global_step": 481347, "epoch": 2865} {"train_loss": -11.461009979248047, "global_step": 481348, "epoch": 2865} {"train_loss": -12.096151351928711, "global_step": 481349, "epoch": 2865} {"train_loss": -11.92203140258789, "global_step": 481350, "epoch": 2865} {"train_loss": -12.216614723205566, "global_step": 481351, "epoch": 2865} {"train_loss": -12.045114517211914, "global_step": 481352, "epoch": 2865} {"train_loss": -11.758066177368164, "global_step": 481353, "epoch": 2865} {"train_loss": -12.348569869995117, "global_step": 481354, "epoch": 2865} {"train_loss": -11.933052062988281, "global_step": 481355, "epoch": 2865} {"train_loss": -12.14262580871582, "global_step": 481356, "epoch": 2865} {"train_loss": -11.963111877441406, "global_step": 481357, "epoch": 2865} {"train_loss": -11.552032470703125, "global_step": 481358, "epoch": 2865} {"train_loss": -12.480400085449219, "global_step": 481359, "epoch": 2865} {"train_loss": -12.249526977539062, "global_step": 481360, "epoch": 2865} {"train_loss": -12.36989688873291, "global_step": 481361, "epoch": 2865} {"train_loss": -12.50912857055664, "global_step": 481362, "epoch": 2865} {"train_loss": -12.267168045043945, "global_step": 481363, "epoch": 2865} {"train_loss": -12.447441101074219, "global_step": 481364, "epoch": 2865} {"train_loss": -12.590709686279297, "global_step": 481365, "epoch": 2865} {"train_loss": -12.326648712158203, "global_step": 481366, "epoch": 2865} {"train_loss": -12.432186126708984, "global_step": 481367, "epoch": 2865} {"train_loss": -12.331252098083496, "global_step": 481368, "epoch": 2865} {"train_loss": -12.368268013000488, "global_step": 481369, "epoch": 2865} {"train_loss": -12.59398078918457, "global_step": 481370, "epoch": 2865} {"train_loss": -12.358474731445312, "global_step": 481371, "epoch": 2865} {"train_loss": -12.455485343933105, "global_step": 481372, "epoch": 2865} {"train_loss": -12.434700965881348, "global_step": 481373, "epoch": 2865} {"train_loss": -12.312472343444824, "global_step": 481374, "epoch": 2865} {"train_loss": -12.536165237426758, "global_step": 481375, "epoch": 2865} {"train_loss": -12.355096817016602, "global_step": 481376, "epoch": 2865} {"train_loss": -12.386984825134277, "global_step": 481377, "epoch": 2865} {"train_loss": -12.534215927124023, "global_step": 481378, "epoch": 2865} {"train_loss": -12.644547462463379, "global_step": 481379, "epoch": 2865} {"train_loss": -12.505938529968262, "global_step": 481380, "epoch": 2865} {"train_loss": -12.591806411743164, "global_step": 481381, "epoch": 2865} {"train_loss": -12.82603645324707, "global_step": 481382, "epoch": 2865} {"train_loss": -12.54133129119873, "global_step": 481383, "epoch": 2865} {"train_loss": -12.782546043395996, "global_step": 481384, "epoch": 2865} {"train_loss": -12.750307083129883, "global_step": 481385, "epoch": 2865} {"train_loss": -12.738105773925781, "global_step": 481386, "epoch": 2865} {"train_loss": -12.541749954223633, "global_step": 481387, "epoch": 2865} {"train_loss": -12.813511848449707, "global_step": 481388, "epoch": 2865} {"train_loss": -12.647380828857422, "global_step": 481389, "epoch": 2865} {"train_loss": -12.802570343017578, "global_step": 481390, "epoch": 2865} {"train_loss": -12.636153221130371, "global_step": 481391, "epoch": 2865} {"train_loss": -12.658329963684082, "global_step": 481392, "epoch": 2865} {"train_loss": -12.693805694580078, "global_step": 481393, "epoch": 2865} {"train_loss": -12.691869735717773, "global_step": 481394, "epoch": 2865} {"train_loss": -12.860625267028809, "global_step": 481395, "epoch": 2865} {"train_loss": -12.611207962036133, "global_step": 481396, "epoch": 2865} {"train_loss": -12.788294792175293, "global_step": 481397, "epoch": 2865} {"train_loss": -12.790725708007812, "global_step": 481398, "epoch": 2865} {"train_loss": -12.95291805267334, "global_step": 481399, "epoch": 2865} {"train_loss": -12.807182312011719, "global_step": 481400, "epoch": 2865} {"train_loss": -12.932373046875, "global_step": 481401, "epoch": 2865} {"train_loss": -12.931446075439453, "global_step": 481402, "epoch": 2865} {"train_loss": -12.943390846252441, "global_step": 481403, "epoch": 2865} {"train_loss": -12.820232391357422, "global_step": 481404, "epoch": 2865} {"train_loss": -12.847709655761719, "global_step": 481405, "epoch": 2865} {"train_loss": -12.744119644165039, "global_step": 481406, "epoch": 2865} {"train_loss": -12.968338012695312, "global_step": 481407, "epoch": 2865} {"train_loss": -12.777963638305664, "global_step": 481408, "epoch": 2865} {"train_loss": -12.823385238647461, "global_step": 481409, "epoch": 2865} {"train_loss": -12.783419609069824, "global_step": 481410, "epoch": 2865} {"train_loss": -12.803170204162598, "global_step": 481411, "epoch": 2865} {"train_loss": -13.030208587646484, "global_step": 481412, "epoch": 2865} {"train_loss": -12.618910789489746, "global_step": 481413, "epoch": 2865} {"train_loss": -12.86009693145752, "global_step": 481414, "epoch": 2865} {"train_loss": -12.695815086364746, "global_step": 481415, "epoch": 2865} {"train_loss": -12.465019226074219, "global_step": 481416, "epoch": 2865} {"train_loss": -12.666051864624023, "global_step": 481417, "epoch": 2865} {"train_loss": -12.782135963439941, "global_step": 481418, "epoch": 2865} {"train_loss": -12.049925804138184, "global_step": 481419, "epoch": 2865} {"train_loss": -11.756336212158203, "global_step": 481420, "epoch": 2865} {"train_loss": -12.430870056152344, "global_step": 481421, "epoch": 2865} {"train_loss": -12.059530258178711, "global_step": 481422, "epoch": 2865} {"train_loss": -12.072683334350586, "global_step": 481423, "epoch": 2865} {"train_loss": -12.090200424194336, "global_step": 481424, "epoch": 2865} {"train_loss": -12.592201232910156, "global_step": 481425, "epoch": 2865} {"train_loss": -11.536006927490234, "global_step": 481426, "epoch": 2865} {"train_loss": -11.937108993530273, "global_step": 481427, "epoch": 2865} {"train_loss": -12.524781227111816, "global_step": 481428, "epoch": 2865} {"train_loss": -12.240177154541016, "global_step": 481429, "epoch": 2865} {"train_loss": -12.447397232055664, "global_step": 481430, "epoch": 2865} {"train_loss": -12.550081253051758, "global_step": 481431, "epoch": 2865} {"train_loss": -11.548274993896484, "global_step": 481432, "epoch": 2865} {"train_loss": -11.509796142578125, "global_step": 481433, "epoch": 2865} {"train_loss": -10.363327026367188, "global_step": 481434, "epoch": 2865} {"train_loss": -11.873214721679688, "global_step": 481435, "epoch": 2865} {"train_loss": -9.505636215209961, "global_step": 481436, "epoch": 2865} {"train_loss": -10.209053039550781, "global_step": 481437, "epoch": 2865} {"train_loss": -10.016189575195312, "global_step": 481438, "epoch": 2865} {"train_loss": -12.39374828338623, "global_step": 481439, "epoch": 2865} {"train_loss": -11.456216812133789, "global_step": 481440, "epoch": 2865} {"train_loss": -11.882030487060547, "global_step": 481441, "epoch": 2865} {"train_loss": -11.880332946777344, "global_step": 481442, "epoch": 2865} {"train_loss": -11.725579261779785, "global_step": 481443, "epoch": 2865} {"train_loss": -11.849976539611816, "global_step": 481444, "epoch": 2865} {"train_loss": -10.97264289855957, "global_step": 481445, "epoch": 2865} {"train_loss": -12.082447052001953, "global_step": 481446, "epoch": 2865} {"train_loss": -11.555025100708008, "global_step": 481447, "epoch": 2865} {"train_loss": -12.079814910888672, "global_step": 481448, "epoch": 2865} {"train_loss": -10.857242584228516, "global_step": 481449, "epoch": 2865} {"train_loss": -11.978797912597656, "global_step": 481450, "epoch": 2865} {"train_loss": -11.445186614990234, "global_step": 481451, "epoch": 2865} {"train_loss": -11.140668869018555, "global_step": 481452, "epoch": 2865} {"train_loss": -12.633071899414062, "global_step": 481453, "epoch": 2865} {"train_loss": -11.415438652038574, "global_step": 481454, "epoch": 2865} {"train_loss": -11.504329681396484, "global_step": 481455, "epoch": 2865} {"train_loss": -11.031425476074219, "global_step": 481456, "epoch": 2865} {"train_loss": -12.086753845214844, "global_step": 481457, "epoch": 2865} {"train_loss": -11.585867881774902, "global_step": 481458, "epoch": 2865} {"train_loss": -12.067761421203613, "global_step": 481459, "epoch": 2865} {"train_loss": -12.01009750366211, "global_step": 481460, "epoch": 2865} {"train_loss": -11.894550323486328, "global_step": 481461, "epoch": 2865} {"train_loss": -11.697317123413086, "global_step": 481462, "epoch": 2865} {"train_loss": -12.437482833862305, "global_step": 481463, "epoch": 2865} {"train_loss": -11.295686721801758, "global_step": 481464, "epoch": 2865} {"train_loss": -11.663860321044922, "global_step": 481465, "epoch": 2865} {"train_loss": -12.137621879577637, "global_step": 481466, "epoch": 2865} {"train_loss": -11.945899963378906, "global_step": 481467, "epoch": 2865} {"train_loss": -12.126616477966309, "global_step": 481468, "epoch": 2865} {"train_loss": -11.95291805267334, "global_step": 481469, "epoch": 2865} {"train_loss": -12.397690773010254, "global_step": 481470, "epoch": 2865} {"train_loss": -11.569635391235352, "global_step": 481471, "epoch": 2865} {"train_loss": -12.538470268249512, "global_step": 481472, "epoch": 2865} {"train_loss": -11.895612716674805, "global_step": 481473, "epoch": 2865} {"train_loss": -12.366455078125, "global_step": 481474, "epoch": 2865} {"train_loss": -12.0069580078125, "global_step": 481475, "epoch": 2865} {"train_loss": -12.148687362670898, "global_step": 481476, "epoch": 2865} {"train_loss": -11.617431640625, "global_step": 481477, "epoch": 2865} {"train_loss": -12.047175407409668, "global_step": 481478, "epoch": 2865} {"train_loss": -11.464599609375, "global_step": 481479, "epoch": 2865} {"train_loss": -12.582798957824707, "global_step": 481480, "epoch": 2865} {"train_loss": -11.799703598022461, "global_step": 481481, "epoch": 2865} {"train_loss": -12.139698028564453, "global_step": 481482, "epoch": 2865} {"train_loss": -12.174330711364746, "global_step": 481483, "epoch": 2865} {"train_loss": -11.765132904052734, "global_step": 481484, "epoch": 2865} {"train_loss": -12.105743408203125, "global_step": 481485, "epoch": 2865} {"train_loss": -11.713935852050781, "global_step": 481486, "epoch": 2865} {"train_loss": -12.017334773426963, "global_step": 481487, "epoch": 2865, "val_loss": 313719.4375, "train_action_mse_error": 1.5440847873687744} {"train_loss": -12.193434715270996, "global_step": 481488, "epoch": 2866} {"train_loss": -12.134299278259277, "global_step": 481489, "epoch": 2866} {"train_loss": -11.963003158569336, "global_step": 481490, "epoch": 2866} {"train_loss": -12.56567096710205, "global_step": 481491, "epoch": 2866} {"train_loss": -11.70531940460205, "global_step": 481492, "epoch": 2866} {"train_loss": -12.789386749267578, "global_step": 481493, "epoch": 2866} {"train_loss": -11.903236389160156, "global_step": 481494, "epoch": 2866} {"train_loss": -12.318979263305664, "global_step": 481495, "epoch": 2866} {"train_loss": -12.007831573486328, "global_step": 481496, "epoch": 2866} {"train_loss": -12.062999725341797, "global_step": 481497, "epoch": 2866} {"train_loss": -12.34727668762207, "global_step": 481498, "epoch": 2866} {"train_loss": -12.39311408996582, "global_step": 481499, "epoch": 2866} {"train_loss": -12.448598861694336, "global_step": 481500, "epoch": 2866} {"train_loss": -12.571311950683594, "global_step": 481501, "epoch": 2866} {"train_loss": -12.424544334411621, "global_step": 481502, "epoch": 2866} {"train_loss": -12.745203018188477, "global_step": 481503, "epoch": 2866} {"train_loss": -12.234689712524414, "global_step": 481504, "epoch": 2866} {"train_loss": -12.563764572143555, "global_step": 481505, "epoch": 2866} {"train_loss": -12.255420684814453, "global_step": 481506, "epoch": 2866} {"train_loss": -12.58624267578125, "global_step": 481507, "epoch": 2866} {"train_loss": -12.229024887084961, "global_step": 481508, "epoch": 2866} {"train_loss": -12.802262306213379, "global_step": 481509, "epoch": 2866} {"train_loss": -12.368080139160156, "global_step": 481510, "epoch": 2866} {"train_loss": -12.568990707397461, "global_step": 481511, "epoch": 2866} {"train_loss": -12.52188491821289, "global_step": 481512, "epoch": 2866} {"train_loss": -12.487001419067383, "global_step": 481513, "epoch": 2866} {"train_loss": -12.42357063293457, "global_step": 481514, "epoch": 2866} {"train_loss": -12.574228286743164, "global_step": 481515, "epoch": 2866} {"train_loss": -12.383221626281738, "global_step": 481516, "epoch": 2866} {"train_loss": -12.660676002502441, "global_step": 481517, "epoch": 2866} {"train_loss": -12.34268569946289, "global_step": 481518, "epoch": 2866} {"train_loss": -12.510849952697754, "global_step": 481519, "epoch": 2866} {"train_loss": -12.463788032531738, "global_step": 481520, "epoch": 2866} {"train_loss": -12.7191801071167, "global_step": 481521, "epoch": 2866} {"train_loss": -12.509276390075684, "global_step": 481522, "epoch": 2866} {"train_loss": -12.479534149169922, "global_step": 481523, "epoch": 2866} {"train_loss": -12.314811706542969, "global_step": 481524, "epoch": 2866} {"train_loss": -12.300772666931152, "global_step": 481525, "epoch": 2866} {"train_loss": -12.5045804977417, "global_step": 481526, "epoch": 2866} {"train_loss": -12.551383972167969, "global_step": 481527, "epoch": 2866} {"train_loss": -12.63029670715332, "global_step": 481528, "epoch": 2866} {"train_loss": -12.73088264465332, "global_step": 481529, "epoch": 2866} {"train_loss": -12.797200202941895, "global_step": 481530, "epoch": 2866} {"train_loss": -12.47368049621582, "global_step": 481531, "epoch": 2866} {"train_loss": -12.728729248046875, "global_step": 481532, "epoch": 2866} {"train_loss": -12.62990951538086, "global_step": 481533, "epoch": 2866} {"train_loss": -12.750727653503418, "global_step": 481534, "epoch": 2866} {"train_loss": -12.8231201171875, "global_step": 481535, "epoch": 2866} {"train_loss": -13.006193161010742, "global_step": 481536, "epoch": 2866} {"train_loss": -12.534856796264648, "global_step": 481537, "epoch": 2866} {"train_loss": -12.754135131835938, "global_step": 481538, "epoch": 2866} {"train_loss": -12.654829025268555, "global_step": 481539, "epoch": 2866} {"train_loss": -12.788503646850586, "global_step": 481540, "epoch": 2866} {"train_loss": -12.746997833251953, "global_step": 481541, "epoch": 2866} {"train_loss": -12.873233795166016, "global_step": 481542, "epoch": 2866} {"train_loss": -12.750894546508789, "global_step": 481543, "epoch": 2866} {"train_loss": -13.033659934997559, "global_step": 481544, "epoch": 2866} {"train_loss": -12.765445709228516, "global_step": 481545, "epoch": 2866} {"train_loss": -12.475619316101074, "global_step": 481546, "epoch": 2866} {"train_loss": -12.405325889587402, "global_step": 481547, "epoch": 2866} {"train_loss": -12.474205017089844, "global_step": 481548, "epoch": 2866} {"train_loss": -11.94936752319336, "global_step": 481549, "epoch": 2866} {"train_loss": -10.101818084716797, "global_step": 481550, "epoch": 2866} {"train_loss": -12.3181791305542, "global_step": 481551, "epoch": 2866} {"train_loss": -11.772132873535156, "global_step": 481552, "epoch": 2866} {"train_loss": -11.156415939331055, "global_step": 481553, "epoch": 2866} {"train_loss": -10.577407836914062, "global_step": 481554, "epoch": 2866} {"train_loss": -10.023763656616211, "global_step": 481555, "epoch": 2866} {"train_loss": -11.247838020324707, "global_step": 481556, "epoch": 2866} {"train_loss": -10.807743072509766, "global_step": 481557, "epoch": 2866} {"train_loss": -11.764460563659668, "global_step": 481558, "epoch": 2866} {"train_loss": -11.78005599975586, "global_step": 481559, "epoch": 2866} {"train_loss": -11.445375442504883, "global_step": 481560, "epoch": 2866} {"train_loss": -10.07284164428711, "global_step": 481561, "epoch": 2866} {"train_loss": -11.043102264404297, "global_step": 481562, "epoch": 2866} {"train_loss": -11.485136032104492, "global_step": 481563, "epoch": 2866} {"train_loss": -10.369816780090332, "global_step": 481564, "epoch": 2866} {"train_loss": -12.133075714111328, "global_step": 481565, "epoch": 2866} {"train_loss": -10.051912307739258, "global_step": 481566, "epoch": 2866} {"train_loss": -10.969690322875977, "global_step": 481567, "epoch": 2866} {"train_loss": -11.203363418579102, "global_step": 481568, "epoch": 2866} {"train_loss": -9.226104736328125, "global_step": 481569, "epoch": 2866} {"train_loss": -11.544116020202637, "global_step": 481570, "epoch": 2866} {"train_loss": -10.402351379394531, "global_step": 481571, "epoch": 2866} {"train_loss": -10.321056365966797, "global_step": 481572, "epoch": 2866} {"train_loss": -11.620591163635254, "global_step": 481573, "epoch": 2866} {"train_loss": -10.573762893676758, "global_step": 481574, "epoch": 2866} {"train_loss": -10.315898895263672, "global_step": 481575, "epoch": 2866} {"train_loss": -10.03411865234375, "global_step": 481576, "epoch": 2866} {"train_loss": -8.965594291687012, "global_step": 481577, "epoch": 2866} {"train_loss": -10.949298858642578, "global_step": 481578, "epoch": 2866} {"train_loss": -10.50676155090332, "global_step": 481579, "epoch": 2866} {"train_loss": -9.866753578186035, "global_step": 481580, "epoch": 2866} {"train_loss": -10.325750350952148, "global_step": 481581, "epoch": 2866} {"train_loss": -10.569694519042969, "global_step": 481582, "epoch": 2866} {"train_loss": -10.82094955444336, "global_step": 481583, "epoch": 2866} {"train_loss": -10.030977249145508, "global_step": 481584, "epoch": 2866} {"train_loss": -9.8172607421875, "global_step": 481585, "epoch": 2866} {"train_loss": -10.419906616210938, "global_step": 481586, "epoch": 2866} {"train_loss": -11.090145111083984, "global_step": 481587, "epoch": 2866} {"train_loss": -11.262136459350586, "global_step": 481588, "epoch": 2866} {"train_loss": -12.044239044189453, "global_step": 481589, "epoch": 2866} {"train_loss": -11.393765449523926, "global_step": 481590, "epoch": 2866} {"train_loss": -11.894177436828613, "global_step": 481591, "epoch": 2866} {"train_loss": -11.878520965576172, "global_step": 481592, "epoch": 2866} {"train_loss": -12.080184936523438, "global_step": 481593, "epoch": 2866} {"train_loss": -12.039202690124512, "global_step": 481594, "epoch": 2866} {"train_loss": -11.566041946411133, "global_step": 481595, "epoch": 2866} {"train_loss": -12.287910461425781, "global_step": 481596, "epoch": 2866} {"train_loss": -11.98782730102539, "global_step": 481597, "epoch": 2866} {"train_loss": -12.237319946289062, "global_step": 481598, "epoch": 2866} {"train_loss": -11.564230918884277, "global_step": 481599, "epoch": 2866} {"train_loss": -12.180996894836426, "global_step": 481600, "epoch": 2866} {"train_loss": -11.983633041381836, "global_step": 481601, "epoch": 2866} {"train_loss": -11.943028450012207, "global_step": 481602, "epoch": 2866} {"train_loss": -12.297733306884766, "global_step": 481603, "epoch": 2866} {"train_loss": -12.172896385192871, "global_step": 481604, "epoch": 2866} {"train_loss": -12.390913009643555, "global_step": 481605, "epoch": 2866} {"train_loss": -12.46877384185791, "global_step": 481606, "epoch": 2866} {"train_loss": -12.180624008178711, "global_step": 481607, "epoch": 2866} {"train_loss": -12.400687217712402, "global_step": 481608, "epoch": 2866} {"train_loss": -12.334980010986328, "global_step": 481609, "epoch": 2866} {"train_loss": -12.367156982421875, "global_step": 481610, "epoch": 2866} {"train_loss": -12.384761810302734, "global_step": 481611, "epoch": 2866} {"train_loss": -12.495869636535645, "global_step": 481612, "epoch": 2866} {"train_loss": -12.581005096435547, "global_step": 481613, "epoch": 2866} {"train_loss": -12.411314010620117, "global_step": 481614, "epoch": 2866} {"train_loss": -12.384916305541992, "global_step": 481615, "epoch": 2866} {"train_loss": -12.434206008911133, "global_step": 481616, "epoch": 2866} {"train_loss": -12.319046020507812, "global_step": 481617, "epoch": 2866} {"train_loss": -12.49866008758545, "global_step": 481618, "epoch": 2866} {"train_loss": -12.529158592224121, "global_step": 481619, "epoch": 2866} {"train_loss": -12.192548751831055, "global_step": 481620, "epoch": 2866} {"train_loss": -12.306161880493164, "global_step": 481621, "epoch": 2866} {"train_loss": -12.140864372253418, "global_step": 481622, "epoch": 2866} {"train_loss": -12.698831558227539, "global_step": 481623, "epoch": 2866} {"train_loss": -12.518942832946777, "global_step": 481624, "epoch": 2866} {"train_loss": -12.281978607177734, "global_step": 481625, "epoch": 2866} {"train_loss": -12.596890449523926, "global_step": 481626, "epoch": 2866} {"train_loss": -12.45068359375, "global_step": 481627, "epoch": 2866} {"train_loss": -12.435175895690918, "global_step": 481628, "epoch": 2866} {"train_loss": -12.584615707397461, "global_step": 481629, "epoch": 2866} {"train_loss": -12.339202880859375, "global_step": 481630, "epoch": 2866} {"train_loss": -12.506118774414062, "global_step": 481631, "epoch": 2866} {"train_loss": -12.383699417114258, "global_step": 481632, "epoch": 2866} {"train_loss": -12.620515823364258, "global_step": 481633, "epoch": 2866} {"train_loss": -12.464930534362793, "global_step": 481634, "epoch": 2866} {"train_loss": -12.529370307922363, "global_step": 481635, "epoch": 2866} {"train_loss": -12.547768592834473, "global_step": 481636, "epoch": 2866} {"train_loss": -12.476775169372559, "global_step": 481637, "epoch": 2866} {"train_loss": -12.444581985473633, "global_step": 481638, "epoch": 2866} {"train_loss": -12.596576690673828, "global_step": 481639, "epoch": 2866} {"train_loss": -12.377286911010742, "global_step": 481640, "epoch": 2866} {"train_loss": -12.285822868347168, "global_step": 481641, "epoch": 2866} {"train_loss": -12.486907958984375, "global_step": 481642, "epoch": 2866} {"train_loss": -12.784099578857422, "global_step": 481643, "epoch": 2866} {"train_loss": -12.502055168151855, "global_step": 481644, "epoch": 2866} {"train_loss": -12.758659362792969, "global_step": 481645, "epoch": 2866} {"train_loss": -12.573230743408203, "global_step": 481646, "epoch": 2866} {"train_loss": -12.466161727905273, "global_step": 481647, "epoch": 2866} {"train_loss": -12.510364532470703, "global_step": 481648, "epoch": 2866} {"train_loss": -12.565784454345703, "global_step": 481649, "epoch": 2866} {"train_loss": -12.531984329223633, "global_step": 481650, "epoch": 2866} {"train_loss": -12.484764099121094, "global_step": 481651, "epoch": 2866} {"train_loss": -12.63011360168457, "global_step": 481652, "epoch": 2866} {"train_loss": -12.57424545288086, "global_step": 481653, "epoch": 2866} {"train_loss": -12.62712287902832, "global_step": 481654, "epoch": 2866} {"train_loss": -12.028463414737157, "global_step": 481655, "epoch": 2866, "val_loss": 313562.84375} {"train_loss": -12.791051864624023, "global_step": 481656, "epoch": 2867} {"train_loss": -12.432209968566895, "global_step": 481657, "epoch": 2867} {"train_loss": -12.66154670715332, "global_step": 481658, "epoch": 2867} {"train_loss": -12.590020179748535, "global_step": 481659, "epoch": 2867} {"train_loss": -12.844512939453125, "global_step": 481660, "epoch": 2867} {"train_loss": -12.300662994384766, "global_step": 481661, "epoch": 2867} {"train_loss": -12.786820411682129, "global_step": 481662, "epoch": 2867} {"train_loss": -12.840869903564453, "global_step": 481663, "epoch": 2867} {"train_loss": -12.722003936767578, "global_step": 481664, "epoch": 2867} {"train_loss": -12.717464447021484, "global_step": 481665, "epoch": 2867} {"train_loss": -12.711380004882812, "global_step": 481666, "epoch": 2867} {"train_loss": -12.773125648498535, "global_step": 481667, "epoch": 2867} {"train_loss": -12.764885902404785, "global_step": 481668, "epoch": 2867} {"train_loss": -12.659052848815918, "global_step": 481669, "epoch": 2867} {"train_loss": -12.786792755126953, "global_step": 481670, "epoch": 2867} {"train_loss": -12.776679039001465, "global_step": 481671, "epoch": 2867} {"train_loss": -12.695032119750977, "global_step": 481672, "epoch": 2867} {"train_loss": -13.005444526672363, "global_step": 481673, "epoch": 2867} {"train_loss": -12.825257301330566, "global_step": 481674, "epoch": 2867} {"train_loss": -13.049881935119629, "global_step": 481675, "epoch": 2867} {"train_loss": -12.902162551879883, "global_step": 481676, "epoch": 2867} {"train_loss": -12.802801132202148, "global_step": 481677, "epoch": 2867} {"train_loss": -12.899848937988281, "global_step": 481678, "epoch": 2867} {"train_loss": -12.976417541503906, "global_step": 481679, "epoch": 2867} {"train_loss": -12.945982933044434, "global_step": 481680, "epoch": 2867} {"train_loss": -12.85204792022705, "global_step": 481681, "epoch": 2867} {"train_loss": -13.011598587036133, "global_step": 481682, "epoch": 2867} {"train_loss": -12.965011596679688, "global_step": 481683, "epoch": 2867} {"train_loss": -12.950967788696289, "global_step": 481684, "epoch": 2867} {"train_loss": -12.912543296813965, "global_step": 481685, "epoch": 2867} {"train_loss": -12.895976066589355, "global_step": 481686, "epoch": 2867} {"train_loss": -13.077123641967773, "global_step": 481687, "epoch": 2867} {"train_loss": -12.563980102539062, "global_step": 481688, "epoch": 2867} {"train_loss": -12.983011245727539, "global_step": 481689, "epoch": 2867} {"train_loss": -12.884203910827637, "global_step": 481690, "epoch": 2867} {"train_loss": -12.973189353942871, "global_step": 481691, "epoch": 2867} {"train_loss": -12.923624038696289, "global_step": 481692, "epoch": 2867} {"train_loss": -13.004146575927734, "global_step": 481693, "epoch": 2867} {"train_loss": -12.918128967285156, "global_step": 481694, "epoch": 2867} {"train_loss": -13.03254508972168, "global_step": 481695, "epoch": 2867} {"train_loss": -12.89560604095459, "global_step": 481696, "epoch": 2867} {"train_loss": -12.879105567932129, "global_step": 481697, "epoch": 2867} {"train_loss": -12.923705101013184, "global_step": 481698, "epoch": 2867} {"train_loss": -12.49563980102539, "global_step": 481699, "epoch": 2867} {"train_loss": -12.699644088745117, "global_step": 481700, "epoch": 2867} {"train_loss": -12.88438606262207, "global_step": 481701, "epoch": 2867} {"train_loss": -12.54420280456543, "global_step": 481702, "epoch": 2867} {"train_loss": -13.001182556152344, "global_step": 481703, "epoch": 2867} {"train_loss": -12.721981048583984, "global_step": 481704, "epoch": 2867} {"train_loss": -12.553653717041016, "global_step": 481705, "epoch": 2867} {"train_loss": -12.422982215881348, "global_step": 481706, "epoch": 2867} {"train_loss": -12.428756713867188, "global_step": 481707, "epoch": 2867} {"train_loss": -12.135576248168945, "global_step": 481708, "epoch": 2867} {"train_loss": -11.97436809539795, "global_step": 481709, "epoch": 2867} {"train_loss": -11.874882698059082, "global_step": 481710, "epoch": 2867} {"train_loss": -11.692920684814453, "global_step": 481711, "epoch": 2867} {"train_loss": -12.715680122375488, "global_step": 481712, "epoch": 2867} {"train_loss": -11.368738174438477, "global_step": 481713, "epoch": 2867} {"train_loss": -12.36855697631836, "global_step": 481714, "epoch": 2867} {"train_loss": -12.346739768981934, "global_step": 481715, "epoch": 2867} {"train_loss": -11.003531455993652, "global_step": 481716, "epoch": 2867} {"train_loss": -10.625589370727539, "global_step": 481717, "epoch": 2867} {"train_loss": -10.131364822387695, "global_step": 481718, "epoch": 2867} {"train_loss": -10.001346588134766, "global_step": 481719, "epoch": 2867} {"train_loss": -10.187423706054688, "global_step": 481720, "epoch": 2867} {"train_loss": -9.347125053405762, "global_step": 481721, "epoch": 2867} {"train_loss": -10.722861289978027, "global_step": 481722, "epoch": 2867} {"train_loss": -9.527039527893066, "global_step": 481723, "epoch": 2867} {"train_loss": -10.532296180725098, "global_step": 481724, "epoch": 2867} {"train_loss": -10.161880493164062, "global_step": 481725, "epoch": 2867} {"train_loss": -10.712068557739258, "global_step": 481726, "epoch": 2867} {"train_loss": -10.79163932800293, "global_step": 481727, "epoch": 2867} {"train_loss": -11.215856552124023, "global_step": 481728, "epoch": 2867} {"train_loss": -11.095270156860352, "global_step": 481729, "epoch": 2867} {"train_loss": -10.864664077758789, "global_step": 481730, "epoch": 2867} {"train_loss": -11.718118667602539, "global_step": 481731, "epoch": 2867} {"train_loss": -11.793462753295898, "global_step": 481732, "epoch": 2867} {"train_loss": -11.413822174072266, "global_step": 481733, "epoch": 2867} {"train_loss": -10.411860466003418, "global_step": 481734, "epoch": 2867} {"train_loss": -11.538963317871094, "global_step": 481735, "epoch": 2867} {"train_loss": -10.828302383422852, "global_step": 481736, "epoch": 2867} {"train_loss": -11.806289672851562, "global_step": 481737, "epoch": 2867} {"train_loss": -11.332351684570312, "global_step": 481738, "epoch": 2867} {"train_loss": -11.211386680603027, "global_step": 481739, "epoch": 2867} {"train_loss": -11.82194709777832, "global_step": 481740, "epoch": 2867} {"train_loss": -11.54880142211914, "global_step": 481741, "epoch": 2867} {"train_loss": -11.541441917419434, "global_step": 481742, "epoch": 2867} {"train_loss": -12.018936157226562, "global_step": 481743, "epoch": 2867} {"train_loss": -11.706853866577148, "global_step": 481744, "epoch": 2867} {"train_loss": -10.725465774536133, "global_step": 481745, "epoch": 2867} {"train_loss": -10.899820327758789, "global_step": 481746, "epoch": 2867} {"train_loss": -11.142500877380371, "global_step": 481747, "epoch": 2867} {"train_loss": -11.826335906982422, "global_step": 481748, "epoch": 2867} {"train_loss": -11.365609169006348, "global_step": 481749, "epoch": 2867} {"train_loss": -11.224727630615234, "global_step": 481750, "epoch": 2867} {"train_loss": -12.052543640136719, "global_step": 481751, "epoch": 2867} {"train_loss": -11.404508590698242, "global_step": 481752, "epoch": 2867} {"train_loss": -12.37060546875, "global_step": 481753, "epoch": 2867} {"train_loss": -11.489864349365234, "global_step": 481754, "epoch": 2867} {"train_loss": -12.18210220336914, "global_step": 481755, "epoch": 2867} {"train_loss": -11.113969802856445, "global_step": 481756, "epoch": 2867} {"train_loss": -11.912649154663086, "global_step": 481757, "epoch": 2867} {"train_loss": -11.632926940917969, "global_step": 481758, "epoch": 2867} {"train_loss": -12.169132232666016, "global_step": 481759, "epoch": 2867} {"train_loss": -12.11624526977539, "global_step": 481760, "epoch": 2867} {"train_loss": -12.699825286865234, "global_step": 481761, "epoch": 2867} {"train_loss": -11.720146179199219, "global_step": 481762, "epoch": 2867} {"train_loss": -12.162348747253418, "global_step": 481763, "epoch": 2867} {"train_loss": -12.452018737792969, "global_step": 481764, "epoch": 2867} {"train_loss": -12.463235855102539, "global_step": 481765, "epoch": 2867} {"train_loss": -12.170944213867188, "global_step": 481766, "epoch": 2867} {"train_loss": -12.449968338012695, "global_step": 481767, "epoch": 2867} {"train_loss": -12.257011413574219, "global_step": 481768, "epoch": 2867} {"train_loss": -12.393993377685547, "global_step": 481769, "epoch": 2867} {"train_loss": -12.0130615234375, "global_step": 481770, "epoch": 2867} {"train_loss": -12.127008438110352, "global_step": 481771, "epoch": 2867} {"train_loss": -12.536446571350098, "global_step": 481772, "epoch": 2867} {"train_loss": -11.98286247253418, "global_step": 481773, "epoch": 2867} {"train_loss": -12.582029342651367, "global_step": 481774, "epoch": 2867} {"train_loss": -12.039867401123047, "global_step": 481775, "epoch": 2867} {"train_loss": -12.655477523803711, "global_step": 481776, "epoch": 2867} {"train_loss": -11.98452377319336, "global_step": 481777, "epoch": 2867} {"train_loss": -12.647783279418945, "global_step": 481778, "epoch": 2867} {"train_loss": -12.29616928100586, "global_step": 481779, "epoch": 2867} {"train_loss": -12.453924179077148, "global_step": 481780, "epoch": 2867} {"train_loss": -12.459198951721191, "global_step": 481781, "epoch": 2867} {"train_loss": -12.747459411621094, "global_step": 481782, "epoch": 2867} {"train_loss": -12.357734680175781, "global_step": 481783, "epoch": 2867} {"train_loss": -12.690685272216797, "global_step": 481784, "epoch": 2867} {"train_loss": -12.675004959106445, "global_step": 481785, "epoch": 2867} {"train_loss": -12.877702713012695, "global_step": 481786, "epoch": 2867} {"train_loss": -12.77222728729248, "global_step": 481787, "epoch": 2867} {"train_loss": -12.550373077392578, "global_step": 481788, "epoch": 2867} {"train_loss": -12.666473388671875, "global_step": 481789, "epoch": 2867} {"train_loss": -12.922331809997559, "global_step": 481790, "epoch": 2867} {"train_loss": -12.882328987121582, "global_step": 481791, "epoch": 2867} {"train_loss": -12.775856018066406, "global_step": 481792, "epoch": 2867} {"train_loss": -13.049762725830078, "global_step": 481793, "epoch": 2867} {"train_loss": -12.941699028015137, "global_step": 481794, "epoch": 2867} {"train_loss": -12.721012115478516, "global_step": 481795, "epoch": 2867} {"train_loss": -12.925394058227539, "global_step": 481796, "epoch": 2867} {"train_loss": -12.739850044250488, "global_step": 481797, "epoch": 2867} {"train_loss": -12.671904563903809, "global_step": 481798, "epoch": 2867} {"train_loss": -12.892173767089844, "global_step": 481799, "epoch": 2867} {"train_loss": -12.93171215057373, "global_step": 481800, "epoch": 2867} {"train_loss": -12.758121490478516, "global_step": 481801, "epoch": 2867} {"train_loss": -12.791996002197266, "global_step": 481802, "epoch": 2867} {"train_loss": -12.876233100891113, "global_step": 481803, "epoch": 2867} {"train_loss": -13.05373764038086, "global_step": 481804, "epoch": 2867} {"train_loss": -12.798020362854004, "global_step": 481805, "epoch": 2867} {"train_loss": -12.955962181091309, "global_step": 481806, "epoch": 2867} {"train_loss": -12.864404678344727, "global_step": 481807, "epoch": 2867} {"train_loss": -12.823436737060547, "global_step": 481808, "epoch": 2867} {"train_loss": -12.896711349487305, "global_step": 481809, "epoch": 2867} {"train_loss": -13.076498031616211, "global_step": 481810, "epoch": 2867} {"train_loss": -12.652263641357422, "global_step": 481811, "epoch": 2867} {"train_loss": -13.118369102478027, "global_step": 481812, "epoch": 2867} {"train_loss": -12.931520462036133, "global_step": 481813, "epoch": 2867} {"train_loss": -12.90229320526123, "global_step": 481814, "epoch": 2867} {"train_loss": -12.917893409729004, "global_step": 481815, "epoch": 2867} {"train_loss": -13.01523208618164, "global_step": 481816, "epoch": 2867} {"train_loss": -12.937702178955078, "global_step": 481817, "epoch": 2867} {"train_loss": -13.021183013916016, "global_step": 481818, "epoch": 2867} {"train_loss": -12.84316635131836, "global_step": 481819, "epoch": 2867} {"train_loss": -12.884933471679688, "global_step": 481820, "epoch": 2867} {"train_loss": -12.442648887634277, "global_step": 481821, "epoch": 2867} {"train_loss": -12.538215637207031, "global_step": 481822, "epoch": 2867} {"train_loss": -12.27770357472556, "global_step": 481823, "epoch": 2867, "val_loss": 316968.6875} {"train_loss": -12.228134155273438, "global_step": 481824, "epoch": 2868} {"train_loss": -11.016790390014648, "global_step": 481825, "epoch": 2868} {"train_loss": -11.679262161254883, "global_step": 481826, "epoch": 2868} {"train_loss": -12.190389633178711, "global_step": 481827, "epoch": 2868} {"train_loss": -12.270626068115234, "global_step": 481828, "epoch": 2868} {"train_loss": -12.813169479370117, "global_step": 481829, "epoch": 2868} {"train_loss": -12.136898040771484, "global_step": 481830, "epoch": 2868} {"train_loss": -12.589418411254883, "global_step": 481831, "epoch": 2868} {"train_loss": -12.207223892211914, "global_step": 481832, "epoch": 2868} {"train_loss": -12.740360260009766, "global_step": 481833, "epoch": 2868} {"train_loss": -12.508970260620117, "global_step": 481834, "epoch": 2868} {"train_loss": -12.589107513427734, "global_step": 481835, "epoch": 2868} {"train_loss": -12.017936706542969, "global_step": 481836, "epoch": 2868} {"train_loss": -11.641746520996094, "global_step": 481837, "epoch": 2868} {"train_loss": -11.231290817260742, "global_step": 481838, "epoch": 2868} {"train_loss": -12.004611015319824, "global_step": 481839, "epoch": 2868} {"train_loss": -11.481298446655273, "global_step": 481840, "epoch": 2868} {"train_loss": -10.199589729309082, "global_step": 481841, "epoch": 2868} {"train_loss": -11.739847183227539, "global_step": 481842, "epoch": 2868} {"train_loss": -12.795831680297852, "global_step": 481843, "epoch": 2868} {"train_loss": -12.12977409362793, "global_step": 481844, "epoch": 2868} {"train_loss": -11.695503234863281, "global_step": 481845, "epoch": 2868} {"train_loss": -12.083087921142578, "global_step": 481846, "epoch": 2868} {"train_loss": -12.620689392089844, "global_step": 481847, "epoch": 2868} {"train_loss": -11.750892639160156, "global_step": 481848, "epoch": 2868} {"train_loss": -11.395942687988281, "global_step": 481849, "epoch": 2868} {"train_loss": -12.728374481201172, "global_step": 481850, "epoch": 2868} {"train_loss": -12.026552200317383, "global_step": 481851, "epoch": 2868} {"train_loss": -11.585626602172852, "global_step": 481852, "epoch": 2868} {"train_loss": -12.236286163330078, "global_step": 481853, "epoch": 2868} {"train_loss": -12.552356719970703, "global_step": 481854, "epoch": 2868} {"train_loss": -12.344922065734863, "global_step": 481855, "epoch": 2868} {"train_loss": -12.332954406738281, "global_step": 481856, "epoch": 2868} {"train_loss": -12.733644485473633, "global_step": 481857, "epoch": 2868} {"train_loss": -12.015710830688477, "global_step": 481858, "epoch": 2868} {"train_loss": -12.437355041503906, "global_step": 481859, "epoch": 2868} {"train_loss": -12.754016876220703, "global_step": 481860, "epoch": 2868} {"train_loss": -11.988908767700195, "global_step": 481861, "epoch": 2868} {"train_loss": -12.73183536529541, "global_step": 481862, "epoch": 2868} {"train_loss": -12.603422164916992, "global_step": 481863, "epoch": 2868} {"train_loss": -12.571434020996094, "global_step": 481864, "epoch": 2868} {"train_loss": -12.597162246704102, "global_step": 481865, "epoch": 2868} {"train_loss": -12.928299903869629, "global_step": 481866, "epoch": 2868} {"train_loss": -12.314661979675293, "global_step": 481867, "epoch": 2868} {"train_loss": -12.477699279785156, "global_step": 481868, "epoch": 2868} {"train_loss": -12.571052551269531, "global_step": 481869, "epoch": 2868} {"train_loss": -12.734657287597656, "global_step": 481870, "epoch": 2868} {"train_loss": -11.923551559448242, "global_step": 481871, "epoch": 2868} {"train_loss": -12.607735633850098, "global_step": 481872, "epoch": 2868} {"train_loss": -12.602088928222656, "global_step": 481873, "epoch": 2868} {"train_loss": -12.724237442016602, "global_step": 481874, "epoch": 2868} {"train_loss": -12.414334297180176, "global_step": 481875, "epoch": 2868} {"train_loss": -12.370138168334961, "global_step": 481876, "epoch": 2868} {"train_loss": -12.468735694885254, "global_step": 481877, "epoch": 2868} {"train_loss": -12.616532325744629, "global_step": 481878, "epoch": 2868} {"train_loss": -12.783498764038086, "global_step": 481879, "epoch": 2868} {"train_loss": -12.774412155151367, "global_step": 481880, "epoch": 2868} {"train_loss": -12.275091171264648, "global_step": 481881, "epoch": 2868} {"train_loss": -12.823836326599121, "global_step": 481882, "epoch": 2868} {"train_loss": -12.693458557128906, "global_step": 481883, "epoch": 2868} {"train_loss": -12.68618106842041, "global_step": 481884, "epoch": 2868} {"train_loss": -12.460530281066895, "global_step": 481885, "epoch": 2868} {"train_loss": -12.252577781677246, "global_step": 481886, "epoch": 2868} {"train_loss": -12.593073844909668, "global_step": 481887, "epoch": 2868} {"train_loss": -11.771583557128906, "global_step": 481888, "epoch": 2868} {"train_loss": -12.782251358032227, "global_step": 481889, "epoch": 2868} {"train_loss": -12.189067840576172, "global_step": 481890, "epoch": 2868} {"train_loss": -12.232231140136719, "global_step": 481891, "epoch": 2868} {"train_loss": -11.959494590759277, "global_step": 481892, "epoch": 2868} {"train_loss": -12.61246109008789, "global_step": 481893, "epoch": 2868} {"train_loss": -12.72439193725586, "global_step": 481894, "epoch": 2868} {"train_loss": -12.683834075927734, "global_step": 481895, "epoch": 2868} {"train_loss": -12.527952194213867, "global_step": 481896, "epoch": 2868} {"train_loss": -12.624095916748047, "global_step": 481897, "epoch": 2868} {"train_loss": -11.835847854614258, "global_step": 481898, "epoch": 2868} {"train_loss": -12.182104110717773, "global_step": 481899, "epoch": 2868} {"train_loss": -11.816344261169434, "global_step": 481900, "epoch": 2868} {"train_loss": -11.801037788391113, "global_step": 481901, "epoch": 2868} {"train_loss": -11.224506378173828, "global_step": 481902, "epoch": 2868} {"train_loss": -10.959738731384277, "global_step": 481903, "epoch": 2868} {"train_loss": -11.499300003051758, "global_step": 481904, "epoch": 2868} {"train_loss": -10.746475219726562, "global_step": 481905, "epoch": 2868} {"train_loss": -11.848245620727539, "global_step": 481906, "epoch": 2868} {"train_loss": -10.672520637512207, "global_step": 481907, "epoch": 2868} {"train_loss": -11.117067337036133, "global_step": 481908, "epoch": 2868} {"train_loss": -11.469623565673828, "global_step": 481909, "epoch": 2868} {"train_loss": -11.025642395019531, "global_step": 481910, "epoch": 2868} {"train_loss": -11.046221733093262, "global_step": 481911, "epoch": 2868} {"train_loss": -10.620384216308594, "global_step": 481912, "epoch": 2868} {"train_loss": -9.915231704711914, "global_step": 481913, "epoch": 2868} {"train_loss": -12.001364707946777, "global_step": 481914, "epoch": 2868} {"train_loss": -10.471111297607422, "global_step": 481915, "epoch": 2868} {"train_loss": -11.632723808288574, "global_step": 481916, "epoch": 2868} {"train_loss": -11.796308517456055, "global_step": 481917, "epoch": 2868} {"train_loss": -11.444364547729492, "global_step": 481918, "epoch": 2868} {"train_loss": -11.812134742736816, "global_step": 481919, "epoch": 2868} {"train_loss": -11.719743728637695, "global_step": 481920, "epoch": 2868} {"train_loss": -11.729490280151367, "global_step": 481921, "epoch": 2868} {"train_loss": -11.598093032836914, "global_step": 481922, "epoch": 2868} {"train_loss": -12.019917488098145, "global_step": 481923, "epoch": 2868} {"train_loss": -12.326824188232422, "global_step": 481924, "epoch": 2868} {"train_loss": -11.510316848754883, "global_step": 481925, "epoch": 2868} {"train_loss": -12.405603408813477, "global_step": 481926, "epoch": 2868} {"train_loss": -11.761575698852539, "global_step": 481927, "epoch": 2868} {"train_loss": -12.261388778686523, "global_step": 481928, "epoch": 2868} {"train_loss": -11.789819717407227, "global_step": 481929, "epoch": 2868} {"train_loss": -12.480380058288574, "global_step": 481930, "epoch": 2868} {"train_loss": -11.983949661254883, "global_step": 481931, "epoch": 2868} {"train_loss": -11.850496292114258, "global_step": 481932, "epoch": 2868} {"train_loss": -12.03538703918457, "global_step": 481933, "epoch": 2868} {"train_loss": -12.249808311462402, "global_step": 481934, "epoch": 2868} {"train_loss": -12.456595420837402, "global_step": 481935, "epoch": 2868} {"train_loss": -12.418302536010742, "global_step": 481936, "epoch": 2868} {"train_loss": -12.378456115722656, "global_step": 481937, "epoch": 2868} {"train_loss": -12.014342308044434, "global_step": 481938, "epoch": 2868} {"train_loss": -12.254867553710938, "global_step": 481939, "epoch": 2868} {"train_loss": -12.226594924926758, "global_step": 481940, "epoch": 2868} {"train_loss": -12.525911331176758, "global_step": 481941, "epoch": 2868} {"train_loss": -12.233236312866211, "global_step": 481942, "epoch": 2868} {"train_loss": -12.376264572143555, "global_step": 481943, "epoch": 2868} {"train_loss": -12.313905715942383, "global_step": 481944, "epoch": 2868} {"train_loss": -12.672483444213867, "global_step": 481945, "epoch": 2868} {"train_loss": -12.201684951782227, "global_step": 481946, "epoch": 2868} {"train_loss": -12.25501823425293, "global_step": 481947, "epoch": 2868} {"train_loss": -12.435186386108398, "global_step": 481948, "epoch": 2868} {"train_loss": -12.356616973876953, "global_step": 481949, "epoch": 2868} {"train_loss": -12.435768127441406, "global_step": 481950, "epoch": 2868} {"train_loss": -12.696319580078125, "global_step": 481951, "epoch": 2868} {"train_loss": -12.552724838256836, "global_step": 481952, "epoch": 2868} {"train_loss": -12.431760787963867, "global_step": 481953, "epoch": 2868} {"train_loss": -12.4113130569458, "global_step": 481954, "epoch": 2868} {"train_loss": -12.394670486450195, "global_step": 481955, "epoch": 2868} {"train_loss": -12.394333839416504, "global_step": 481956, "epoch": 2868} {"train_loss": -12.438398361206055, "global_step": 481957, "epoch": 2868} {"train_loss": -12.732369422912598, "global_step": 481958, "epoch": 2868} {"train_loss": -12.367301940917969, "global_step": 481959, "epoch": 2868} {"train_loss": -12.683732986450195, "global_step": 481960, "epoch": 2868} {"train_loss": -12.23338508605957, "global_step": 481961, "epoch": 2868} {"train_loss": -12.612709045410156, "global_step": 481962, "epoch": 2868} {"train_loss": -12.852523803710938, "global_step": 481963, "epoch": 2868} {"train_loss": -12.331266403198242, "global_step": 481964, "epoch": 2868} {"train_loss": -12.631704330444336, "global_step": 481965, "epoch": 2868} {"train_loss": -12.059297561645508, "global_step": 481966, "epoch": 2868} {"train_loss": -12.442110061645508, "global_step": 481967, "epoch": 2868} {"train_loss": -12.669121742248535, "global_step": 481968, "epoch": 2868} {"train_loss": -12.339211463928223, "global_step": 481969, "epoch": 2868} {"train_loss": -12.723355293273926, "global_step": 481970, "epoch": 2868} {"train_loss": -12.789751052856445, "global_step": 481971, "epoch": 2868} {"train_loss": -12.609786987304688, "global_step": 481972, "epoch": 2868} {"train_loss": -12.763608932495117, "global_step": 481973, "epoch": 2868} {"train_loss": -12.739482879638672, "global_step": 481974, "epoch": 2868} {"train_loss": -12.680545806884766, "global_step": 481975, "epoch": 2868} {"train_loss": -12.686393737792969, "global_step": 481976, "epoch": 2868} {"train_loss": -12.503472328186035, "global_step": 481977, "epoch": 2868} {"train_loss": -12.552367210388184, "global_step": 481978, "epoch": 2868} {"train_loss": -12.629377365112305, "global_step": 481979, "epoch": 2868} {"train_loss": -12.451111793518066, "global_step": 481980, "epoch": 2868} {"train_loss": -12.65030574798584, "global_step": 481981, "epoch": 2868} {"train_loss": -12.618260383605957, "global_step": 481982, "epoch": 2868} {"train_loss": -12.634675979614258, "global_step": 481983, "epoch": 2868} {"train_loss": -12.809560775756836, "global_step": 481984, "epoch": 2868} {"train_loss": -12.389715194702148, "global_step": 481985, "epoch": 2868} {"train_loss": -12.756096839904785, "global_step": 481986, "epoch": 2868} {"train_loss": -12.53740119934082, "global_step": 481987, "epoch": 2868} {"train_loss": -12.561868667602539, "global_step": 481988, "epoch": 2868} {"train_loss": -12.802931785583496, "global_step": 481989, "epoch": 2868} {"train_loss": -12.519180297851562, "global_step": 481990, "epoch": 2868} {"train_loss": -12.214011226381574, "global_step": 481991, "epoch": 2868, "val_loss": 316793.5625} {"train_loss": -12.81076717376709, "global_step": 481992, "epoch": 2869} {"train_loss": -12.823080062866211, "global_step": 481993, "epoch": 2869} {"train_loss": -12.525955200195312, "global_step": 481994, "epoch": 2869} {"train_loss": -12.831993103027344, "global_step": 481995, "epoch": 2869} {"train_loss": -12.839284896850586, "global_step": 481996, "epoch": 2869} {"train_loss": -12.738241195678711, "global_step": 481997, "epoch": 2869} {"train_loss": -12.617826461791992, "global_step": 481998, "epoch": 2869} {"train_loss": -12.76346492767334, "global_step": 481999, "epoch": 2869} {"train_loss": -12.45888614654541, "global_step": 482000, "epoch": 2869} {"train_loss": -12.511739730834961, "global_step": 482001, "epoch": 2869} {"train_loss": -12.831896781921387, "global_step": 482002, "epoch": 2869} {"train_loss": -12.789164543151855, "global_step": 482003, "epoch": 2869} {"train_loss": -12.69344711303711, "global_step": 482004, "epoch": 2869} {"train_loss": -13.107728958129883, "global_step": 482005, "epoch": 2869} {"train_loss": -12.679808616638184, "global_step": 482006, "epoch": 2869} {"train_loss": -12.924477577209473, "global_step": 482007, "epoch": 2869} {"train_loss": -12.885808944702148, "global_step": 482008, "epoch": 2869} {"train_loss": -12.821677207946777, "global_step": 482009, "epoch": 2869} {"train_loss": -12.74627685546875, "global_step": 482010, "epoch": 2869} {"train_loss": -12.55394172668457, "global_step": 482011, "epoch": 2869} {"train_loss": -12.195764541625977, "global_step": 482012, "epoch": 2869} {"train_loss": -12.70153522491455, "global_step": 482013, "epoch": 2869} {"train_loss": -12.796052932739258, "global_step": 482014, "epoch": 2869} {"train_loss": -11.766359329223633, "global_step": 482015, "epoch": 2869} {"train_loss": -11.493268966674805, "global_step": 482016, "epoch": 2869} {"train_loss": -11.383443832397461, "global_step": 482017, "epoch": 2869} {"train_loss": -12.815701484680176, "global_step": 482018, "epoch": 2869} {"train_loss": -10.44956111907959, "global_step": 482019, "epoch": 2869} {"train_loss": -11.274259567260742, "global_step": 482020, "epoch": 2869} {"train_loss": -11.021263122558594, "global_step": 482021, "epoch": 2869} {"train_loss": -10.96484088897705, "global_step": 482022, "epoch": 2869} {"train_loss": -11.004137992858887, "global_step": 482023, "epoch": 2869} {"train_loss": -12.121610641479492, "global_step": 482024, "epoch": 2869} {"train_loss": -11.206642150878906, "global_step": 482025, "epoch": 2869} {"train_loss": -10.883269309997559, "global_step": 482026, "epoch": 2869} {"train_loss": -10.02929401397705, "global_step": 482027, "epoch": 2869} {"train_loss": -11.64715576171875, "global_step": 482028, "epoch": 2869} {"train_loss": -10.326313972473145, "global_step": 482029, "epoch": 2869} {"train_loss": -10.88364315032959, "global_step": 482030, "epoch": 2869} {"train_loss": -11.366662979125977, "global_step": 482031, "epoch": 2869} {"train_loss": -11.281614303588867, "global_step": 482032, "epoch": 2869} {"train_loss": -12.042502403259277, "global_step": 482033, "epoch": 2869} {"train_loss": -11.715044021606445, "global_step": 482034, "epoch": 2869} {"train_loss": -12.029766082763672, "global_step": 482035, "epoch": 2869} {"train_loss": -11.652633666992188, "global_step": 482036, "epoch": 2869} {"train_loss": -11.52696418762207, "global_step": 482037, "epoch": 2869} {"train_loss": -11.550066947937012, "global_step": 482038, "epoch": 2869} {"train_loss": -11.524270057678223, "global_step": 482039, "epoch": 2869} {"train_loss": -11.102357864379883, "global_step": 482040, "epoch": 2869} {"train_loss": -10.579458236694336, "global_step": 482041, "epoch": 2869} {"train_loss": -12.132745742797852, "global_step": 482042, "epoch": 2869} {"train_loss": -10.018856048583984, "global_step": 482043, "epoch": 2869} {"train_loss": -12.138612747192383, "global_step": 482044, "epoch": 2869} {"train_loss": -10.750017166137695, "global_step": 482045, "epoch": 2869} {"train_loss": -11.416680335998535, "global_step": 482046, "epoch": 2869} {"train_loss": -11.811206817626953, "global_step": 482047, "epoch": 2869} {"train_loss": -11.574195861816406, "global_step": 482048, "epoch": 2869} {"train_loss": -11.061101913452148, "global_step": 482049, "epoch": 2869} {"train_loss": -11.524230003356934, "global_step": 482050, "epoch": 2869} {"train_loss": -11.37739372253418, "global_step": 482051, "epoch": 2869} {"train_loss": -11.969483375549316, "global_step": 482052, "epoch": 2869} {"train_loss": -11.265204429626465, "global_step": 482053, "epoch": 2869} {"train_loss": -11.473709106445312, "global_step": 482054, "epoch": 2869} {"train_loss": -11.822052001953125, "global_step": 482055, "epoch": 2869} {"train_loss": -11.296747207641602, "global_step": 482056, "epoch": 2869} {"train_loss": -11.227287292480469, "global_step": 482057, "epoch": 2869} {"train_loss": -12.308670043945312, "global_step": 482058, "epoch": 2869} {"train_loss": -11.798298835754395, "global_step": 482059, "epoch": 2869} {"train_loss": -12.16360092163086, "global_step": 482060, "epoch": 2869} {"train_loss": -12.346853256225586, "global_step": 482061, "epoch": 2869} {"train_loss": -11.814467430114746, "global_step": 482062, "epoch": 2869} {"train_loss": -12.421126365661621, "global_step": 482063, "epoch": 2869} {"train_loss": -11.69145393371582, "global_step": 482064, "epoch": 2869} {"train_loss": -12.456282615661621, "global_step": 482065, "epoch": 2869} {"train_loss": -12.238951683044434, "global_step": 482066, "epoch": 2869} {"train_loss": -11.89632797241211, "global_step": 482067, "epoch": 2869} {"train_loss": -12.161030769348145, "global_step": 482068, "epoch": 2869} {"train_loss": -12.272115707397461, "global_step": 482069, "epoch": 2869} {"train_loss": -12.185434341430664, "global_step": 482070, "epoch": 2869} {"train_loss": -12.200140953063965, "global_step": 482071, "epoch": 2869} {"train_loss": -12.578811645507812, "global_step": 482072, "epoch": 2869} {"train_loss": -12.559782028198242, "global_step": 482073, "epoch": 2869} {"train_loss": -12.68359375, "global_step": 482074, "epoch": 2869} {"train_loss": -12.457944869995117, "global_step": 482075, "epoch": 2869} {"train_loss": -12.403826713562012, "global_step": 482076, "epoch": 2869} {"train_loss": -12.536550521850586, "global_step": 482077, "epoch": 2869} {"train_loss": -12.33342170715332, "global_step": 482078, "epoch": 2869} {"train_loss": -12.52688980102539, "global_step": 482079, "epoch": 2869} {"train_loss": -12.57524585723877, "global_step": 482080, "epoch": 2869} {"train_loss": -12.572864532470703, "global_step": 482081, "epoch": 2869} {"train_loss": -12.747844696044922, "global_step": 482082, "epoch": 2869} {"train_loss": -12.36108684539795, "global_step": 482083, "epoch": 2869} {"train_loss": -12.737154960632324, "global_step": 482084, "epoch": 2869} {"train_loss": -12.678077697753906, "global_step": 482085, "epoch": 2869} {"train_loss": -12.64747428894043, "global_step": 482086, "epoch": 2869} {"train_loss": -12.810558319091797, "global_step": 482087, "epoch": 2869} {"train_loss": -12.531072616577148, "global_step": 482088, "epoch": 2869} {"train_loss": -12.71723747253418, "global_step": 482089, "epoch": 2869} {"train_loss": -12.702741622924805, "global_step": 482090, "epoch": 2869} {"train_loss": -12.867975234985352, "global_step": 482091, "epoch": 2869} {"train_loss": -12.77427864074707, "global_step": 482092, "epoch": 2869} {"train_loss": -12.712940216064453, "global_step": 482093, "epoch": 2869} {"train_loss": -12.710405349731445, "global_step": 482094, "epoch": 2869} {"train_loss": -12.688741683959961, "global_step": 482095, "epoch": 2869} {"train_loss": -12.809494018554688, "global_step": 482096, "epoch": 2869} {"train_loss": -12.940135955810547, "global_step": 482097, "epoch": 2869} {"train_loss": -12.715099334716797, "global_step": 482098, "epoch": 2869} {"train_loss": -12.845487594604492, "global_step": 482099, "epoch": 2869} {"train_loss": -12.802286148071289, "global_step": 482100, "epoch": 2869} {"train_loss": -12.707130432128906, "global_step": 482101, "epoch": 2869} {"train_loss": -12.90888786315918, "global_step": 482102, "epoch": 2869} {"train_loss": -12.763978958129883, "global_step": 482103, "epoch": 2869} {"train_loss": -12.82137393951416, "global_step": 482104, "epoch": 2869} {"train_loss": -12.839498519897461, "global_step": 482105, "epoch": 2869} {"train_loss": -12.852092742919922, "global_step": 482106, "epoch": 2869} {"train_loss": -12.894898414611816, "global_step": 482107, "epoch": 2869} {"train_loss": -13.018634796142578, "global_step": 482108, "epoch": 2869} {"train_loss": -12.825827598571777, "global_step": 482109, "epoch": 2869} {"train_loss": -12.906753540039062, "global_step": 482110, "epoch": 2869} {"train_loss": -13.004964828491211, "global_step": 482111, "epoch": 2869} {"train_loss": -12.515721321105957, "global_step": 482112, "epoch": 2869} {"train_loss": -12.78985595703125, "global_step": 482113, "epoch": 2869} {"train_loss": -12.691510200500488, "global_step": 482114, "epoch": 2869} {"train_loss": -12.623961448669434, "global_step": 482115, "epoch": 2869} {"train_loss": -13.04327392578125, "global_step": 482116, "epoch": 2869} {"train_loss": -12.779525756835938, "global_step": 482117, "epoch": 2869} {"train_loss": -12.7435302734375, "global_step": 482118, "epoch": 2869} {"train_loss": -12.867804527282715, "global_step": 482119, "epoch": 2869} {"train_loss": -12.22758960723877, "global_step": 482120, "epoch": 2869} {"train_loss": -12.858234405517578, "global_step": 482121, "epoch": 2869} {"train_loss": -12.656508445739746, "global_step": 482122, "epoch": 2869} {"train_loss": -12.551450729370117, "global_step": 482123, "epoch": 2869} {"train_loss": -12.149910926818848, "global_step": 482124, "epoch": 2869} {"train_loss": -12.856159210205078, "global_step": 482125, "epoch": 2869} {"train_loss": -12.321235656738281, "global_step": 482126, "epoch": 2869} {"train_loss": -12.915231704711914, "global_step": 482127, "epoch": 2869} {"train_loss": -12.667771339416504, "global_step": 482128, "epoch": 2869} {"train_loss": -12.876019477844238, "global_step": 482129, "epoch": 2869} {"train_loss": -12.733766555786133, "global_step": 482130, "epoch": 2869} {"train_loss": -12.800857543945312, "global_step": 482131, "epoch": 2869} {"train_loss": -12.766517639160156, "global_step": 482132, "epoch": 2869} {"train_loss": -12.63142204284668, "global_step": 482133, "epoch": 2869} {"train_loss": -12.632323265075684, "global_step": 482134, "epoch": 2869} {"train_loss": -12.726667404174805, "global_step": 482135, "epoch": 2869} {"train_loss": -12.52383041381836, "global_step": 482136, "epoch": 2869} {"train_loss": -12.545042037963867, "global_step": 482137, "epoch": 2869} {"train_loss": -12.83444881439209, "global_step": 482138, "epoch": 2869} {"train_loss": -12.576041221618652, "global_step": 482139, "epoch": 2869} {"train_loss": -13.000205993652344, "global_step": 482140, "epoch": 2869} {"train_loss": -13.083537101745605, "global_step": 482141, "epoch": 2869} {"train_loss": -12.6216459274292, "global_step": 482142, "epoch": 2869} {"train_loss": -13.047122955322266, "global_step": 482143, "epoch": 2869} {"train_loss": -12.759281158447266, "global_step": 482144, "epoch": 2869} {"train_loss": -12.380857467651367, "global_step": 482145, "epoch": 2869} {"train_loss": -12.32904052734375, "global_step": 482146, "epoch": 2869} {"train_loss": -11.881089210510254, "global_step": 482147, "epoch": 2869} {"train_loss": -11.763673782348633, "global_step": 482148, "epoch": 2869} {"train_loss": -12.67447280883789, "global_step": 482149, "epoch": 2869} {"train_loss": -11.078113555908203, "global_step": 482150, "epoch": 2869} {"train_loss": -11.017560958862305, "global_step": 482151, "epoch": 2869} {"train_loss": -11.809085845947266, "global_step": 482152, "epoch": 2869} {"train_loss": -12.458057403564453, "global_step": 482153, "epoch": 2869} {"train_loss": -11.01701545715332, "global_step": 482154, "epoch": 2869} {"train_loss": -11.87674331665039, "global_step": 482155, "epoch": 2869} {"train_loss": -10.22846794128418, "global_step": 482156, "epoch": 2869} {"train_loss": -11.405405044555664, "global_step": 482157, "epoch": 2869} {"train_loss": -11.55019760131836, "global_step": 482158, "epoch": 2869} {"train_loss": -12.229820768038431, "global_step": 482159, "epoch": 2869, "val_loss": 317930.90625} {"train_loss": -11.167930603027344, "global_step": 482160, "epoch": 2870} {"train_loss": -12.683794021606445, "global_step": 482161, "epoch": 2870} {"train_loss": -11.26258659362793, "global_step": 482162, "epoch": 2870} {"train_loss": -11.763001441955566, "global_step": 482163, "epoch": 2870} {"train_loss": -11.601909637451172, "global_step": 482164, "epoch": 2870} {"train_loss": -11.959769248962402, "global_step": 482165, "epoch": 2870} {"train_loss": -11.63685417175293, "global_step": 482166, "epoch": 2870} {"train_loss": -12.527979850769043, "global_step": 482167, "epoch": 2870} {"train_loss": -12.076606750488281, "global_step": 482168, "epoch": 2870} {"train_loss": -12.437837600708008, "global_step": 482169, "epoch": 2870} {"train_loss": -11.771761894226074, "global_step": 482170, "epoch": 2870} {"train_loss": -12.49730396270752, "global_step": 482171, "epoch": 2870} {"train_loss": -11.9890718460083, "global_step": 482172, "epoch": 2870} {"train_loss": -12.491400718688965, "global_step": 482173, "epoch": 2870} {"train_loss": -11.553305625915527, "global_step": 482174, "epoch": 2870} {"train_loss": -12.307130813598633, "global_step": 482175, "epoch": 2870} {"train_loss": -12.37535285949707, "global_step": 482176, "epoch": 2870} {"train_loss": -12.57909870147705, "global_step": 482177, "epoch": 2870} {"train_loss": -12.279050827026367, "global_step": 482178, "epoch": 2870} {"train_loss": -12.898273468017578, "global_step": 482179, "epoch": 2870} {"train_loss": -12.423955917358398, "global_step": 482180, "epoch": 2870} {"train_loss": -12.553080558776855, "global_step": 482181, "epoch": 2870} {"train_loss": -11.964957237243652, "global_step": 482182, "epoch": 2870} {"train_loss": -12.588090896606445, "global_step": 482183, "epoch": 2870} {"train_loss": -12.472521781921387, "global_step": 482184, "epoch": 2870} {"train_loss": -12.267680168151855, "global_step": 482185, "epoch": 2870} {"train_loss": -12.336421966552734, "global_step": 482186, "epoch": 2870} {"train_loss": -12.113372802734375, "global_step": 482187, "epoch": 2870} {"train_loss": -11.289669036865234, "global_step": 482188, "epoch": 2870} {"train_loss": -12.578718185424805, "global_step": 482189, "epoch": 2870} {"train_loss": -11.55508041381836, "global_step": 482190, "epoch": 2870} {"train_loss": -12.129556655883789, "global_step": 482191, "epoch": 2870} {"train_loss": -12.564534187316895, "global_step": 482192, "epoch": 2870} {"train_loss": -12.034656524658203, "global_step": 482193, "epoch": 2870} {"train_loss": -12.41618537902832, "global_step": 482194, "epoch": 2870} {"train_loss": -12.126506805419922, "global_step": 482195, "epoch": 2870} {"train_loss": -12.340368270874023, "global_step": 482196, "epoch": 2870} {"train_loss": -12.469257354736328, "global_step": 482197, "epoch": 2870} {"train_loss": -12.422611236572266, "global_step": 482198, "epoch": 2870} {"train_loss": -12.615632057189941, "global_step": 482199, "epoch": 2870} {"train_loss": -12.385384559631348, "global_step": 482200, "epoch": 2870} {"train_loss": -12.356700897216797, "global_step": 482201, "epoch": 2870} {"train_loss": -12.437873840332031, "global_step": 482202, "epoch": 2870} {"train_loss": -12.660818099975586, "global_step": 482203, "epoch": 2870} {"train_loss": -12.467053413391113, "global_step": 482204, "epoch": 2870} {"train_loss": -12.476327896118164, "global_step": 482205, "epoch": 2870} {"train_loss": -12.477008819580078, "global_step": 482206, "epoch": 2870} {"train_loss": -12.580913543701172, "global_step": 482207, "epoch": 2870} {"train_loss": -12.433712005615234, "global_step": 482208, "epoch": 2870} {"train_loss": -12.594379425048828, "global_step": 482209, "epoch": 2870} {"train_loss": -12.612903594970703, "global_step": 482210, "epoch": 2870} {"train_loss": -12.517050743103027, "global_step": 482211, "epoch": 2870} {"train_loss": -12.5758056640625, "global_step": 482212, "epoch": 2870} {"train_loss": -12.561745643615723, "global_step": 482213, "epoch": 2870} {"train_loss": -12.65090560913086, "global_step": 482214, "epoch": 2870} {"train_loss": -12.495768547058105, "global_step": 482215, "epoch": 2870} {"train_loss": -12.468005180358887, "global_step": 482216, "epoch": 2870} {"train_loss": -12.774486541748047, "global_step": 482217, "epoch": 2870} {"train_loss": -12.39686393737793, "global_step": 482218, "epoch": 2870} {"train_loss": -12.820917129516602, "global_step": 482219, "epoch": 2870} {"train_loss": -12.627952575683594, "global_step": 482220, "epoch": 2870} {"train_loss": -12.423506736755371, "global_step": 482221, "epoch": 2870} {"train_loss": -12.43724250793457, "global_step": 482222, "epoch": 2870} {"train_loss": -12.175003051757812, "global_step": 482223, "epoch": 2870} {"train_loss": -12.395719528198242, "global_step": 482224, "epoch": 2870} {"train_loss": -11.959785461425781, "global_step": 482225, "epoch": 2870} {"train_loss": -12.717079162597656, "global_step": 482226, "epoch": 2870} {"train_loss": -11.806059837341309, "global_step": 482227, "epoch": 2870} {"train_loss": -12.320722579956055, "global_step": 482228, "epoch": 2870} {"train_loss": -12.31110954284668, "global_step": 482229, "epoch": 2870} {"train_loss": -12.799457550048828, "global_step": 482230, "epoch": 2870} {"train_loss": -12.393661499023438, "global_step": 482231, "epoch": 2870} {"train_loss": -12.61838150024414, "global_step": 482232, "epoch": 2870} {"train_loss": -12.49712085723877, "global_step": 482233, "epoch": 2870} {"train_loss": -12.730552673339844, "global_step": 482234, "epoch": 2870} {"train_loss": -12.412480354309082, "global_step": 482235, "epoch": 2870} {"train_loss": -11.85980224609375, "global_step": 482236, "epoch": 2870} {"train_loss": -12.223617553710938, "global_step": 482237, "epoch": 2870} {"train_loss": -12.653043746948242, "global_step": 482238, "epoch": 2870} {"train_loss": -12.099519729614258, "global_step": 482239, "epoch": 2870} {"train_loss": -12.714570045471191, "global_step": 482240, "epoch": 2870} {"train_loss": -12.321767807006836, "global_step": 482241, "epoch": 2870} {"train_loss": -12.24338150024414, "global_step": 482242, "epoch": 2870} {"train_loss": -12.327781677246094, "global_step": 482243, "epoch": 2870} {"train_loss": -12.08307933807373, "global_step": 482244, "epoch": 2870} {"train_loss": -11.606098175048828, "global_step": 482245, "epoch": 2870} {"train_loss": -12.088716506958008, "global_step": 482246, "epoch": 2870} {"train_loss": -10.418800354003906, "global_step": 482247, "epoch": 2870} {"train_loss": -11.5668306350708, "global_step": 482248, "epoch": 2870} {"train_loss": -10.15535831451416, "global_step": 482249, "epoch": 2870} {"train_loss": -10.20395565032959, "global_step": 482250, "epoch": 2870} {"train_loss": -10.714302062988281, "global_step": 482251, "epoch": 2870} {"train_loss": -10.582237243652344, "global_step": 482252, "epoch": 2870} {"train_loss": -11.801933288574219, "global_step": 482253, "epoch": 2870} {"train_loss": -11.077539443969727, "global_step": 482254, "epoch": 2870} {"train_loss": -11.586311340332031, "global_step": 482255, "epoch": 2870} {"train_loss": -10.470399856567383, "global_step": 482256, "epoch": 2870} {"train_loss": -12.043846130371094, "global_step": 482257, "epoch": 2870} {"train_loss": -10.322628021240234, "global_step": 482258, "epoch": 2870} {"train_loss": -10.84885025024414, "global_step": 482259, "epoch": 2870} {"train_loss": -10.604482650756836, "global_step": 482260, "epoch": 2870} {"train_loss": -9.914947509765625, "global_step": 482261, "epoch": 2870} {"train_loss": -10.89981460571289, "global_step": 482262, "epoch": 2870} {"train_loss": -10.483686447143555, "global_step": 482263, "epoch": 2870} {"train_loss": -11.089743614196777, "global_step": 482264, "epoch": 2870} {"train_loss": -11.04783821105957, "global_step": 482265, "epoch": 2870} {"train_loss": -11.282365798950195, "global_step": 482266, "epoch": 2870} {"train_loss": -10.577896118164062, "global_step": 482267, "epoch": 2870} {"train_loss": -10.592883110046387, "global_step": 482268, "epoch": 2870} {"train_loss": -11.81312370300293, "global_step": 482269, "epoch": 2870} {"train_loss": -11.34859848022461, "global_step": 482270, "epoch": 2870} {"train_loss": -10.755660057067871, "global_step": 482271, "epoch": 2870} {"train_loss": -12.14816665649414, "global_step": 482272, "epoch": 2870} {"train_loss": -10.496955871582031, "global_step": 482273, "epoch": 2870} {"train_loss": -11.840669631958008, "global_step": 482274, "epoch": 2870} {"train_loss": -11.248514175415039, "global_step": 482275, "epoch": 2870} {"train_loss": -11.232534408569336, "global_step": 482276, "epoch": 2870} {"train_loss": -11.736659049987793, "global_step": 482277, "epoch": 2870} {"train_loss": -11.136479377746582, "global_step": 482278, "epoch": 2870} {"train_loss": -11.954497337341309, "global_step": 482279, "epoch": 2870} {"train_loss": -12.134000778198242, "global_step": 482280, "epoch": 2870} {"train_loss": -12.078521728515625, "global_step": 482281, "epoch": 2870} {"train_loss": -11.980481147766113, "global_step": 482282, "epoch": 2870} {"train_loss": -12.080513954162598, "global_step": 482283, "epoch": 2870} {"train_loss": -11.922750473022461, "global_step": 482284, "epoch": 2870} {"train_loss": -12.225746154785156, "global_step": 482285, "epoch": 2870} {"train_loss": -11.427967071533203, "global_step": 482286, "epoch": 2870} {"train_loss": -12.365578651428223, "global_step": 482287, "epoch": 2870} {"train_loss": -11.997416496276855, "global_step": 482288, "epoch": 2870} {"train_loss": -12.446453094482422, "global_step": 482289, "epoch": 2870} {"train_loss": -11.981756210327148, "global_step": 482290, "epoch": 2870} {"train_loss": -12.418069839477539, "global_step": 482291, "epoch": 2870} {"train_loss": -11.427714347839355, "global_step": 482292, "epoch": 2870} {"train_loss": -12.11861801147461, "global_step": 482293, "epoch": 2870} {"train_loss": -11.638689041137695, "global_step": 482294, "epoch": 2870} {"train_loss": -11.872953414916992, "global_step": 482295, "epoch": 2870} {"train_loss": -12.182641983032227, "global_step": 482296, "epoch": 2870} {"train_loss": -11.60472583770752, "global_step": 482297, "epoch": 2870} {"train_loss": -12.544265747070312, "global_step": 482298, "epoch": 2870} {"train_loss": -11.602051734924316, "global_step": 482299, "epoch": 2870} {"train_loss": -12.148252487182617, "global_step": 482300, "epoch": 2870} {"train_loss": -12.233068466186523, "global_step": 482301, "epoch": 2870} {"train_loss": -12.251898765563965, "global_step": 482302, "epoch": 2870} {"train_loss": -12.07563591003418, "global_step": 482303, "epoch": 2870} {"train_loss": -12.18822956085205, "global_step": 482304, "epoch": 2870} {"train_loss": -12.000251770019531, "global_step": 482305, "epoch": 2870} {"train_loss": -12.49030876159668, "global_step": 482306, "epoch": 2870} {"train_loss": -11.84532356262207, "global_step": 482307, "epoch": 2870} {"train_loss": -12.073600769042969, "global_step": 482308, "epoch": 2870} {"train_loss": -12.007960319519043, "global_step": 482309, "epoch": 2870} {"train_loss": -12.213071823120117, "global_step": 482310, "epoch": 2870} {"train_loss": -12.156270980834961, "global_step": 482311, "epoch": 2870} {"train_loss": -12.067401885986328, "global_step": 482312, "epoch": 2870} {"train_loss": -11.77969741821289, "global_step": 482313, "epoch": 2870} {"train_loss": -11.919185638427734, "global_step": 482314, "epoch": 2870} {"train_loss": -11.818154335021973, "global_step": 482315, "epoch": 2870} {"train_loss": -12.296793937683105, "global_step": 482316, "epoch": 2870} {"train_loss": -11.997915267944336, "global_step": 482317, "epoch": 2870} {"train_loss": -12.332148551940918, "global_step": 482318, "epoch": 2870} {"train_loss": -11.920185089111328, "global_step": 482319, "epoch": 2870} {"train_loss": -12.398995399475098, "global_step": 482320, "epoch": 2870} {"train_loss": -12.631355285644531, "global_step": 482321, "epoch": 2870} {"train_loss": -12.171714782714844, "global_step": 482322, "epoch": 2870} {"train_loss": -12.730645179748535, "global_step": 482323, "epoch": 2870} {"train_loss": -12.061439514160156, "global_step": 482324, "epoch": 2870} {"train_loss": -12.667386054992676, "global_step": 482325, "epoch": 2870} {"train_loss": -12.506267547607422, "global_step": 482326, "epoch": 2870} {"train_loss": -12.000419332867576, "global_step": 482327, "epoch": 2870, "val_loss": 319476.375, "train_action_mse_error": 1.859667420387268} {"train_loss": -12.535188674926758, "global_step": 482328, "epoch": 2871} {"train_loss": -12.35389232635498, "global_step": 482329, "epoch": 2871} {"train_loss": -12.67939567565918, "global_step": 482330, "epoch": 2871} {"train_loss": -12.455398559570312, "global_step": 482331, "epoch": 2871} {"train_loss": -12.499592781066895, "global_step": 482332, "epoch": 2871} {"train_loss": -12.643718719482422, "global_step": 482333, "epoch": 2871} {"train_loss": -12.650985717773438, "global_step": 482334, "epoch": 2871} {"train_loss": -12.525327682495117, "global_step": 482335, "epoch": 2871} {"train_loss": -12.755590438842773, "global_step": 482336, "epoch": 2871} {"train_loss": -12.569836616516113, "global_step": 482337, "epoch": 2871} {"train_loss": -12.630594253540039, "global_step": 482338, "epoch": 2871} {"train_loss": -12.770088195800781, "global_step": 482339, "epoch": 2871} {"train_loss": -12.72706127166748, "global_step": 482340, "epoch": 2871} {"train_loss": -12.713827133178711, "global_step": 482341, "epoch": 2871} {"train_loss": -13.002273559570312, "global_step": 482342, "epoch": 2871} {"train_loss": -12.67310905456543, "global_step": 482343, "epoch": 2871} {"train_loss": -12.722779273986816, "global_step": 482344, "epoch": 2871} {"train_loss": -12.946477890014648, "global_step": 482345, "epoch": 2871} {"train_loss": -12.709296226501465, "global_step": 482346, "epoch": 2871} {"train_loss": -12.769796371459961, "global_step": 482347, "epoch": 2871} {"train_loss": -12.832317352294922, "global_step": 482348, "epoch": 2871} {"train_loss": -12.77702522277832, "global_step": 482349, "epoch": 2871} {"train_loss": -12.661788940429688, "global_step": 482350, "epoch": 2871} {"train_loss": -12.949645042419434, "global_step": 482351, "epoch": 2871} {"train_loss": -12.929927825927734, "global_step": 482352, "epoch": 2871} {"train_loss": -12.82284164428711, "global_step": 482353, "epoch": 2871} {"train_loss": -12.891366958618164, "global_step": 482354, "epoch": 2871} {"train_loss": -12.944087028503418, "global_step": 482355, "epoch": 2871} {"train_loss": -12.950349807739258, "global_step": 482356, "epoch": 2871} {"train_loss": -12.812084197998047, "global_step": 482357, "epoch": 2871} {"train_loss": -12.828365325927734, "global_step": 482358, "epoch": 2871} {"train_loss": -12.836140632629395, "global_step": 482359, "epoch": 2871} {"train_loss": -12.803773880004883, "global_step": 482360, "epoch": 2871} {"train_loss": -12.837236404418945, "global_step": 482361, "epoch": 2871} {"train_loss": -12.719612121582031, "global_step": 482362, "epoch": 2871} {"train_loss": -12.83870792388916, "global_step": 482363, "epoch": 2871} {"train_loss": -12.929766654968262, "global_step": 482364, "epoch": 2871} {"train_loss": -12.806270599365234, "global_step": 482365, "epoch": 2871} {"train_loss": -13.003700256347656, "global_step": 482366, "epoch": 2871} {"train_loss": -12.81488037109375, "global_step": 482367, "epoch": 2871} {"train_loss": -13.022876739501953, "global_step": 482368, "epoch": 2871} {"train_loss": -12.753839492797852, "global_step": 482369, "epoch": 2871} {"train_loss": -12.899873733520508, "global_step": 482370, "epoch": 2871} {"train_loss": -12.715804100036621, "global_step": 482371, "epoch": 2871} {"train_loss": -12.598062515258789, "global_step": 482372, "epoch": 2871} {"train_loss": -12.834052085876465, "global_step": 482373, "epoch": 2871} {"train_loss": -12.7240629196167, "global_step": 482374, "epoch": 2871} {"train_loss": -12.89626693725586, "global_step": 482375, "epoch": 2871} {"train_loss": -12.8634033203125, "global_step": 482376, "epoch": 2871} {"train_loss": -12.768889427185059, "global_step": 482377, "epoch": 2871} {"train_loss": -12.680244445800781, "global_step": 482378, "epoch": 2871} {"train_loss": -13.050798416137695, "global_step": 482379, "epoch": 2871} {"train_loss": -12.790298461914062, "global_step": 482380, "epoch": 2871} {"train_loss": -12.959083557128906, "global_step": 482381, "epoch": 2871} {"train_loss": -12.950970649719238, "global_step": 482382, "epoch": 2871} {"train_loss": -13.19320011138916, "global_step": 482383, "epoch": 2871} {"train_loss": -12.96763801574707, "global_step": 482384, "epoch": 2871} {"train_loss": -12.854778289794922, "global_step": 482385, "epoch": 2871} {"train_loss": -13.070186614990234, "global_step": 482386, "epoch": 2871} {"train_loss": -12.617441177368164, "global_step": 482387, "epoch": 2871} {"train_loss": -13.004388809204102, "global_step": 482388, "epoch": 2871} {"train_loss": -12.857012748718262, "global_step": 482389, "epoch": 2871} {"train_loss": -12.988540649414062, "global_step": 482390, "epoch": 2871} {"train_loss": -12.408439636230469, "global_step": 482391, "epoch": 2871} {"train_loss": -12.869625091552734, "global_step": 482392, "epoch": 2871} {"train_loss": -12.717612266540527, "global_step": 482393, "epoch": 2871} {"train_loss": -13.061614036560059, "global_step": 482394, "epoch": 2871} {"train_loss": -12.729639053344727, "global_step": 482395, "epoch": 2871} {"train_loss": -12.493352890014648, "global_step": 482396, "epoch": 2871} {"train_loss": -12.418153762817383, "global_step": 482397, "epoch": 2871} {"train_loss": -12.302587509155273, "global_step": 482398, "epoch": 2871} {"train_loss": -12.357573509216309, "global_step": 482399, "epoch": 2871} {"train_loss": -12.28433895111084, "global_step": 482400, "epoch": 2871} {"train_loss": -12.66677474975586, "global_step": 482401, "epoch": 2871} {"train_loss": -11.818887710571289, "global_step": 482402, "epoch": 2871} {"train_loss": -11.571986198425293, "global_step": 482403, "epoch": 2871} {"train_loss": -12.404448509216309, "global_step": 482404, "epoch": 2871} {"train_loss": -12.358993530273438, "global_step": 482405, "epoch": 2871} {"train_loss": -10.956110000610352, "global_step": 482406, "epoch": 2871} {"train_loss": -11.774589538574219, "global_step": 482407, "epoch": 2871} {"train_loss": -11.960416793823242, "global_step": 482408, "epoch": 2871} {"train_loss": -12.6326904296875, "global_step": 482409, "epoch": 2871} {"train_loss": -12.239749908447266, "global_step": 482410, "epoch": 2871} {"train_loss": -12.739177703857422, "global_step": 482411, "epoch": 2871} {"train_loss": -12.42315673828125, "global_step": 482412, "epoch": 2871} {"train_loss": -12.945473670959473, "global_step": 482413, "epoch": 2871} {"train_loss": -12.49818229675293, "global_step": 482414, "epoch": 2871} {"train_loss": -12.299905776977539, "global_step": 482415, "epoch": 2871} {"train_loss": -12.71101188659668, "global_step": 482416, "epoch": 2871} {"train_loss": -12.698240280151367, "global_step": 482417, "epoch": 2871} {"train_loss": -12.636528968811035, "global_step": 482418, "epoch": 2871} {"train_loss": -12.938960075378418, "global_step": 482419, "epoch": 2871} {"train_loss": -12.78312873840332, "global_step": 482420, "epoch": 2871} {"train_loss": -12.856767654418945, "global_step": 482421, "epoch": 2871} {"train_loss": -12.656534194946289, "global_step": 482422, "epoch": 2871} {"train_loss": -12.576488494873047, "global_step": 482423, "epoch": 2871} {"train_loss": -12.286966323852539, "global_step": 482424, "epoch": 2871} {"train_loss": -12.58892822265625, "global_step": 482425, "epoch": 2871} {"train_loss": -12.755672454833984, "global_step": 482426, "epoch": 2871} {"train_loss": -12.214042663574219, "global_step": 482427, "epoch": 2871} {"train_loss": -12.238198280334473, "global_step": 482428, "epoch": 2871} {"train_loss": -12.272284507751465, "global_step": 482429, "epoch": 2871} {"train_loss": -12.138187408447266, "global_step": 482430, "epoch": 2871} {"train_loss": -11.952735900878906, "global_step": 482431, "epoch": 2871} {"train_loss": -12.011350631713867, "global_step": 482432, "epoch": 2871} {"train_loss": -12.025141716003418, "global_step": 482433, "epoch": 2871} {"train_loss": -12.347972869873047, "global_step": 482434, "epoch": 2871} {"train_loss": -11.321364402770996, "global_step": 482435, "epoch": 2871} {"train_loss": -12.124015808105469, "global_step": 482436, "epoch": 2871} {"train_loss": -11.662365913391113, "global_step": 482437, "epoch": 2871} {"train_loss": -11.842048645019531, "global_step": 482438, "epoch": 2871} {"train_loss": -11.444276809692383, "global_step": 482439, "epoch": 2871} {"train_loss": -11.804749488830566, "global_step": 482440, "epoch": 2871} {"train_loss": -11.355408668518066, "global_step": 482441, "epoch": 2871} {"train_loss": -11.672622680664062, "global_step": 482442, "epoch": 2871} {"train_loss": -11.570085525512695, "global_step": 482443, "epoch": 2871} {"train_loss": -11.493537902832031, "global_step": 482444, "epoch": 2871} {"train_loss": -11.918752670288086, "global_step": 482445, "epoch": 2871} {"train_loss": -11.692646026611328, "global_step": 482446, "epoch": 2871} {"train_loss": -11.79500675201416, "global_step": 482447, "epoch": 2871} {"train_loss": -11.658160209655762, "global_step": 482448, "epoch": 2871} {"train_loss": -12.144216537475586, "global_step": 482449, "epoch": 2871} {"train_loss": -11.823480606079102, "global_step": 482450, "epoch": 2871} {"train_loss": -11.535168647766113, "global_step": 482451, "epoch": 2871} {"train_loss": -11.385290145874023, "global_step": 482452, "epoch": 2871} {"train_loss": -11.522626876831055, "global_step": 482453, "epoch": 2871} {"train_loss": -10.733514785766602, "global_step": 482454, "epoch": 2871} {"train_loss": -11.883222579956055, "global_step": 482455, "epoch": 2871} {"train_loss": -10.805560111999512, "global_step": 482456, "epoch": 2871} {"train_loss": -11.746914863586426, "global_step": 482457, "epoch": 2871} {"train_loss": -11.772823333740234, "global_step": 482458, "epoch": 2871} {"train_loss": -12.084199905395508, "global_step": 482459, "epoch": 2871} {"train_loss": -12.26699447631836, "global_step": 482460, "epoch": 2871} {"train_loss": -12.07512378692627, "global_step": 482461, "epoch": 2871} {"train_loss": -12.354199409484863, "global_step": 482462, "epoch": 2871} {"train_loss": -12.224162101745605, "global_step": 482463, "epoch": 2871} {"train_loss": -12.166732788085938, "global_step": 482464, "epoch": 2871} {"train_loss": -12.519240379333496, "global_step": 482465, "epoch": 2871} {"train_loss": -12.463993072509766, "global_step": 482466, "epoch": 2871} {"train_loss": -12.504528045654297, "global_step": 482467, "epoch": 2871} {"train_loss": -12.363053321838379, "global_step": 482468, "epoch": 2871} {"train_loss": -12.780463218688965, "global_step": 482469, "epoch": 2871} {"train_loss": -12.457256317138672, "global_step": 482470, "epoch": 2871} {"train_loss": -12.748262405395508, "global_step": 482471, "epoch": 2871} {"train_loss": -12.518590927124023, "global_step": 482472, "epoch": 2871} {"train_loss": -12.733807563781738, "global_step": 482473, "epoch": 2871} {"train_loss": -12.560134887695312, "global_step": 482474, "epoch": 2871} {"train_loss": -12.432154655456543, "global_step": 482475, "epoch": 2871} {"train_loss": -12.831412315368652, "global_step": 482476, "epoch": 2871} {"train_loss": -12.90773868560791, "global_step": 482477, "epoch": 2871} {"train_loss": -12.720115661621094, "global_step": 482478, "epoch": 2871} {"train_loss": -12.777347564697266, "global_step": 482479, "epoch": 2871} {"train_loss": -12.623031616210938, "global_step": 482480, "epoch": 2871} {"train_loss": -12.938772201538086, "global_step": 482481, "epoch": 2871} {"train_loss": -12.845093727111816, "global_step": 482482, "epoch": 2871} {"train_loss": -12.785918235778809, "global_step": 482483, "epoch": 2871} {"train_loss": -12.867877960205078, "global_step": 482484, "epoch": 2871} {"train_loss": -12.736464500427246, "global_step": 482485, "epoch": 2871} {"train_loss": -12.79465389251709, "global_step": 482486, "epoch": 2871} {"train_loss": -12.62225341796875, "global_step": 482487, "epoch": 2871} {"train_loss": -13.038551330566406, "global_step": 482488, "epoch": 2871} {"train_loss": -12.554462432861328, "global_step": 482489, "epoch": 2871} {"train_loss": -12.598743438720703, "global_step": 482490, "epoch": 2871} {"train_loss": -12.667694091796875, "global_step": 482491, "epoch": 2871} {"train_loss": -12.444267272949219, "global_step": 482492, "epoch": 2871} {"train_loss": -12.51202392578125, "global_step": 482493, "epoch": 2871} {"train_loss": -12.761133193969727, "global_step": 482494, "epoch": 2871} {"train_loss": -12.474058872177487, "global_step": 482495, "epoch": 2871, "val_loss": 318581.1875} {"train_loss": -11.775214195251465, "global_step": 482496, "epoch": 2872} {"train_loss": -12.328268051147461, "global_step": 482497, "epoch": 2872} {"train_loss": -12.004709243774414, "global_step": 482498, "epoch": 2872} {"train_loss": -12.131092071533203, "global_step": 482499, "epoch": 2872} {"train_loss": -11.004244804382324, "global_step": 482500, "epoch": 2872} {"train_loss": -10.54557991027832, "global_step": 482501, "epoch": 2872} {"train_loss": -11.011789321899414, "global_step": 482502, "epoch": 2872} {"train_loss": -9.54830551147461, "global_step": 482503, "epoch": 2872} {"train_loss": -11.921769142150879, "global_step": 482504, "epoch": 2872} {"train_loss": -10.16321086883545, "global_step": 482505, "epoch": 2872} {"train_loss": -12.131514549255371, "global_step": 482506, "epoch": 2872} {"train_loss": -10.535360336303711, "global_step": 482507, "epoch": 2872} {"train_loss": -11.665245056152344, "global_step": 482508, "epoch": 2872} {"train_loss": -10.409759521484375, "global_step": 482509, "epoch": 2872} {"train_loss": -10.794524192810059, "global_step": 482510, "epoch": 2872} {"train_loss": -10.900832176208496, "global_step": 482511, "epoch": 2872} {"train_loss": -11.469712257385254, "global_step": 482512, "epoch": 2872} {"train_loss": -11.926066398620605, "global_step": 482513, "epoch": 2872} {"train_loss": -12.34640884399414, "global_step": 482514, "epoch": 2872} {"train_loss": -11.28834342956543, "global_step": 482515, "epoch": 2872} {"train_loss": -11.857057571411133, "global_step": 482516, "epoch": 2872} {"train_loss": -11.53195571899414, "global_step": 482517, "epoch": 2872} {"train_loss": -12.066313743591309, "global_step": 482518, "epoch": 2872} {"train_loss": -12.71322250366211, "global_step": 482519, "epoch": 2872} {"train_loss": -11.815792083740234, "global_step": 482520, "epoch": 2872} {"train_loss": -12.327522277832031, "global_step": 482521, "epoch": 2872} {"train_loss": -12.036391258239746, "global_step": 482522, "epoch": 2872} {"train_loss": -12.491250991821289, "global_step": 482523, "epoch": 2872} {"train_loss": -12.618112564086914, "global_step": 482524, "epoch": 2872} {"train_loss": -11.908041000366211, "global_step": 482525, "epoch": 2872} {"train_loss": -12.690967559814453, "global_step": 482526, "epoch": 2872} {"train_loss": -12.215128898620605, "global_step": 482527, "epoch": 2872} {"train_loss": -12.34034538269043, "global_step": 482528, "epoch": 2872} {"train_loss": -11.803510665893555, "global_step": 482529, "epoch": 2872} {"train_loss": -12.304217338562012, "global_step": 482530, "epoch": 2872} {"train_loss": -11.709516525268555, "global_step": 482531, "epoch": 2872} {"train_loss": -12.115964889526367, "global_step": 482532, "epoch": 2872} {"train_loss": -11.790766716003418, "global_step": 482533, "epoch": 2872} {"train_loss": -11.63007926940918, "global_step": 482534, "epoch": 2872} {"train_loss": -11.501976013183594, "global_step": 482535, "epoch": 2872} {"train_loss": -11.604925155639648, "global_step": 482536, "epoch": 2872} {"train_loss": -11.8687105178833, "global_step": 482537, "epoch": 2872} {"train_loss": -11.752039909362793, "global_step": 482538, "epoch": 2872} {"train_loss": -11.298681259155273, "global_step": 482539, "epoch": 2872} {"train_loss": -12.249232292175293, "global_step": 482540, "epoch": 2872} {"train_loss": -11.6439208984375, "global_step": 482541, "epoch": 2872} {"train_loss": -11.385960578918457, "global_step": 482542, "epoch": 2872} {"train_loss": -11.714376449584961, "global_step": 482543, "epoch": 2872} {"train_loss": -11.911417007446289, "global_step": 482544, "epoch": 2872} {"train_loss": -11.642463684082031, "global_step": 482545, "epoch": 2872} {"train_loss": -12.181585311889648, "global_step": 482546, "epoch": 2872} {"train_loss": -12.07274055480957, "global_step": 482547, "epoch": 2872} {"train_loss": -11.664446830749512, "global_step": 482548, "epoch": 2872} {"train_loss": -12.075542449951172, "global_step": 482549, "epoch": 2872} {"train_loss": -12.06937026977539, "global_step": 482550, "epoch": 2872} {"train_loss": -11.60566520690918, "global_step": 482551, "epoch": 2872} {"train_loss": -12.649935722351074, "global_step": 482552, "epoch": 2872} {"train_loss": -11.92878246307373, "global_step": 482553, "epoch": 2872} {"train_loss": -12.19968032836914, "global_step": 482554, "epoch": 2872} {"train_loss": -12.449251174926758, "global_step": 482555, "epoch": 2872} {"train_loss": -12.224235534667969, "global_step": 482556, "epoch": 2872} {"train_loss": -12.416306495666504, "global_step": 482557, "epoch": 2872} {"train_loss": -12.53425407409668, "global_step": 482558, "epoch": 2872} {"train_loss": -11.752187728881836, "global_step": 482559, "epoch": 2872} {"train_loss": -12.48337173461914, "global_step": 482560, "epoch": 2872} {"train_loss": -12.043920516967773, "global_step": 482561, "epoch": 2872} {"train_loss": -12.479564666748047, "global_step": 482562, "epoch": 2872} {"train_loss": -12.184432983398438, "global_step": 482563, "epoch": 2872} {"train_loss": -12.61512565612793, "global_step": 482564, "epoch": 2872} {"train_loss": -12.33725643157959, "global_step": 482565, "epoch": 2872} {"train_loss": -12.279767036437988, "global_step": 482566, "epoch": 2872} {"train_loss": -12.301471710205078, "global_step": 482567, "epoch": 2872} {"train_loss": -12.200621604919434, "global_step": 482568, "epoch": 2872} {"train_loss": -11.71116828918457, "global_step": 482569, "epoch": 2872} {"train_loss": -12.314361572265625, "global_step": 482570, "epoch": 2872} {"train_loss": -12.11307144165039, "global_step": 482571, "epoch": 2872} {"train_loss": -12.029892921447754, "global_step": 482572, "epoch": 2872} {"train_loss": -12.351749420166016, "global_step": 482573, "epoch": 2872} {"train_loss": -11.742427825927734, "global_step": 482574, "epoch": 2872} {"train_loss": -12.576464653015137, "global_step": 482575, "epoch": 2872} {"train_loss": -11.988630294799805, "global_step": 482576, "epoch": 2872} {"train_loss": -12.338884353637695, "global_step": 482577, "epoch": 2872} {"train_loss": -11.698148727416992, "global_step": 482578, "epoch": 2872} {"train_loss": -12.21357536315918, "global_step": 482579, "epoch": 2872} {"train_loss": -12.270453453063965, "global_step": 482580, "epoch": 2872} {"train_loss": -11.981027603149414, "global_step": 482581, "epoch": 2872} {"train_loss": -12.44676685333252, "global_step": 482582, "epoch": 2872} {"train_loss": -12.408238410949707, "global_step": 482583, "epoch": 2872} {"train_loss": -12.461480140686035, "global_step": 482584, "epoch": 2872} {"train_loss": -12.708770751953125, "global_step": 482585, "epoch": 2872} {"train_loss": -12.533862113952637, "global_step": 482586, "epoch": 2872} {"train_loss": -12.689348220825195, "global_step": 482587, "epoch": 2872} {"train_loss": -12.474318504333496, "global_step": 482588, "epoch": 2872} {"train_loss": -12.647969245910645, "global_step": 482589, "epoch": 2872} {"train_loss": -12.524702072143555, "global_step": 482590, "epoch": 2872} {"train_loss": -12.422473907470703, "global_step": 482591, "epoch": 2872} {"train_loss": -12.482707023620605, "global_step": 482592, "epoch": 2872} {"train_loss": -12.678485870361328, "global_step": 482593, "epoch": 2872} {"train_loss": -12.19273567199707, "global_step": 482594, "epoch": 2872} {"train_loss": -12.750444412231445, "global_step": 482595, "epoch": 2872} {"train_loss": -12.347219467163086, "global_step": 482596, "epoch": 2872} {"train_loss": -12.37495231628418, "global_step": 482597, "epoch": 2872} {"train_loss": -12.589471817016602, "global_step": 482598, "epoch": 2872} {"train_loss": -12.201614379882812, "global_step": 482599, "epoch": 2872} {"train_loss": -12.399068832397461, "global_step": 482600, "epoch": 2872} {"train_loss": -12.42479133605957, "global_step": 482601, "epoch": 2872} {"train_loss": -12.715251922607422, "global_step": 482602, "epoch": 2872} {"train_loss": -12.76551628112793, "global_step": 482603, "epoch": 2872} {"train_loss": -12.635147094726562, "global_step": 482604, "epoch": 2872} {"train_loss": -12.927032470703125, "global_step": 482605, "epoch": 2872} {"train_loss": -12.72852611541748, "global_step": 482606, "epoch": 2872} {"train_loss": -12.755203247070312, "global_step": 482607, "epoch": 2872} {"train_loss": -12.857734680175781, "global_step": 482608, "epoch": 2872} {"train_loss": -12.590786933898926, "global_step": 482609, "epoch": 2872} {"train_loss": -12.747014045715332, "global_step": 482610, "epoch": 2872} {"train_loss": -12.507640838623047, "global_step": 482611, "epoch": 2872} {"train_loss": -12.635869979858398, "global_step": 482612, "epoch": 2872} {"train_loss": -12.720878601074219, "global_step": 482613, "epoch": 2872} {"train_loss": -12.496986389160156, "global_step": 482614, "epoch": 2872} {"train_loss": -12.572031021118164, "global_step": 482615, "epoch": 2872} {"train_loss": -12.598625183105469, "global_step": 482616, "epoch": 2872} {"train_loss": -12.371156692504883, "global_step": 482617, "epoch": 2872} {"train_loss": -12.425447463989258, "global_step": 482618, "epoch": 2872} {"train_loss": -12.560091972351074, "global_step": 482619, "epoch": 2872} {"train_loss": -12.636155128479004, "global_step": 482620, "epoch": 2872} {"train_loss": -12.738183975219727, "global_step": 482621, "epoch": 2872} {"train_loss": -12.51941204071045, "global_step": 482622, "epoch": 2872} {"train_loss": -12.687579154968262, "global_step": 482623, "epoch": 2872} {"train_loss": -12.595979690551758, "global_step": 482624, "epoch": 2872} {"train_loss": -12.61263656616211, "global_step": 482625, "epoch": 2872} {"train_loss": -13.098495483398438, "global_step": 482626, "epoch": 2872} {"train_loss": -12.79122543334961, "global_step": 482627, "epoch": 2872} {"train_loss": -12.910909652709961, "global_step": 482628, "epoch": 2872} {"train_loss": -12.608193397521973, "global_step": 482629, "epoch": 2872} {"train_loss": -12.70341682434082, "global_step": 482630, "epoch": 2872} {"train_loss": -12.574136734008789, "global_step": 482631, "epoch": 2872} {"train_loss": -12.775288581848145, "global_step": 482632, "epoch": 2872} {"train_loss": -12.669023513793945, "global_step": 482633, "epoch": 2872} {"train_loss": -12.70533561706543, "global_step": 482634, "epoch": 2872} {"train_loss": -12.961799621582031, "global_step": 482635, "epoch": 2872} {"train_loss": -12.185955047607422, "global_step": 482636, "epoch": 2872} {"train_loss": -12.804525375366211, "global_step": 482637, "epoch": 2872} {"train_loss": -12.479867935180664, "global_step": 482638, "epoch": 2872} {"train_loss": -12.465131759643555, "global_step": 482639, "epoch": 2872} {"train_loss": -12.461564064025879, "global_step": 482640, "epoch": 2872} {"train_loss": -12.725550651550293, "global_step": 482641, "epoch": 2872} {"train_loss": -12.747475624084473, "global_step": 482642, "epoch": 2872} {"train_loss": -12.27484130859375, "global_step": 482643, "epoch": 2872} {"train_loss": -12.728711128234863, "global_step": 482644, "epoch": 2872} {"train_loss": -12.530332565307617, "global_step": 482645, "epoch": 2872} {"train_loss": -12.47960090637207, "global_step": 482646, "epoch": 2872} {"train_loss": -11.808895111083984, "global_step": 482647, "epoch": 2872} {"train_loss": -12.730100631713867, "global_step": 482648, "epoch": 2872} {"train_loss": -11.762819290161133, "global_step": 482649, "epoch": 2872} {"train_loss": -12.403948783874512, "global_step": 482650, "epoch": 2872} {"train_loss": -11.977195739746094, "global_step": 482651, "epoch": 2872} {"train_loss": -11.764785766601562, "global_step": 482652, "epoch": 2872} {"train_loss": -11.593524932861328, "global_step": 482653, "epoch": 2872} {"train_loss": -10.997896194458008, "global_step": 482654, "epoch": 2872} {"train_loss": -10.699688911437988, "global_step": 482655, "epoch": 2872} {"train_loss": -10.830968856811523, "global_step": 482656, "epoch": 2872} {"train_loss": -11.855792999267578, "global_step": 482657, "epoch": 2872} {"train_loss": -11.29252815246582, "global_step": 482658, "epoch": 2872} {"train_loss": -12.133051872253418, "global_step": 482659, "epoch": 2872} {"train_loss": -10.832557678222656, "global_step": 482660, "epoch": 2872} {"train_loss": -11.82424545288086, "global_step": 482661, "epoch": 2872} {"train_loss": -11.543839454650879, "global_step": 482662, "epoch": 2872} {"train_loss": -12.137737120900836, "global_step": 482663, "epoch": 2872, "val_loss": 317053.71875} {"train_loss": -11.736772537231445, "global_step": 482664, "epoch": 2873} {"train_loss": -11.631468772888184, "global_step": 482665, "epoch": 2873} {"train_loss": -12.226968765258789, "global_step": 482666, "epoch": 2873} {"train_loss": -11.70279312133789, "global_step": 482667, "epoch": 2873} {"train_loss": -11.408575057983398, "global_step": 482668, "epoch": 2873} {"train_loss": -10.756735801696777, "global_step": 482669, "epoch": 2873} {"train_loss": -11.899059295654297, "global_step": 482670, "epoch": 2873} {"train_loss": -11.33907699584961, "global_step": 482671, "epoch": 2873} {"train_loss": -11.560172080993652, "global_step": 482672, "epoch": 2873} {"train_loss": -11.12105941772461, "global_step": 482673, "epoch": 2873} {"train_loss": -10.304447174072266, "global_step": 482674, "epoch": 2873} {"train_loss": -10.671059608459473, "global_step": 482675, "epoch": 2873} {"train_loss": -11.495874404907227, "global_step": 482676, "epoch": 2873} {"train_loss": -10.185667037963867, "global_step": 482677, "epoch": 2873} {"train_loss": -10.744455337524414, "global_step": 482678, "epoch": 2873} {"train_loss": -11.763166427612305, "global_step": 482679, "epoch": 2873} {"train_loss": -10.213940620422363, "global_step": 482680, "epoch": 2873} {"train_loss": -11.831326484680176, "global_step": 482681, "epoch": 2873} {"train_loss": -10.775324821472168, "global_step": 482682, "epoch": 2873} {"train_loss": -11.141239166259766, "global_step": 482683, "epoch": 2873} {"train_loss": -10.351198196411133, "global_step": 482684, "epoch": 2873} {"train_loss": -11.373207092285156, "global_step": 482685, "epoch": 2873} {"train_loss": -10.816893577575684, "global_step": 482686, "epoch": 2873} {"train_loss": -11.051782608032227, "global_step": 482687, "epoch": 2873} {"train_loss": -12.218666076660156, "global_step": 482688, "epoch": 2873} {"train_loss": -11.342706680297852, "global_step": 482689, "epoch": 2873} {"train_loss": -11.700969696044922, "global_step": 482690, "epoch": 2873} {"train_loss": -11.518709182739258, "global_step": 482691, "epoch": 2873} {"train_loss": -11.961624145507812, "global_step": 482692, "epoch": 2873} {"train_loss": -11.927743911743164, "global_step": 482693, "epoch": 2873} {"train_loss": -11.94331169128418, "global_step": 482694, "epoch": 2873} {"train_loss": -12.022375106811523, "global_step": 482695, "epoch": 2873} {"train_loss": -11.526402473449707, "global_step": 482696, "epoch": 2873} {"train_loss": -12.26768684387207, "global_step": 482697, "epoch": 2873} {"train_loss": -11.671463966369629, "global_step": 482698, "epoch": 2873} {"train_loss": -12.159826278686523, "global_step": 482699, "epoch": 2873} {"train_loss": -11.888232231140137, "global_step": 482700, "epoch": 2873} {"train_loss": -12.126642227172852, "global_step": 482701, "epoch": 2873} {"train_loss": -11.80077838897705, "global_step": 482702, "epoch": 2873} {"train_loss": -12.276516914367676, "global_step": 482703, "epoch": 2873} {"train_loss": -11.95020866394043, "global_step": 482704, "epoch": 2873} {"train_loss": -11.788379669189453, "global_step": 482705, "epoch": 2873} {"train_loss": -12.126453399658203, "global_step": 482706, "epoch": 2873} {"train_loss": -11.782630920410156, "global_step": 482707, "epoch": 2873} {"train_loss": -12.462991714477539, "global_step": 482708, "epoch": 2873} {"train_loss": -11.57073974609375, "global_step": 482709, "epoch": 2873} {"train_loss": -12.239090919494629, "global_step": 482710, "epoch": 2873} {"train_loss": -11.60110092163086, "global_step": 482711, "epoch": 2873} {"train_loss": -12.343807220458984, "global_step": 482712, "epoch": 2873} {"train_loss": -12.455253601074219, "global_step": 482713, "epoch": 2873} {"train_loss": -11.897390365600586, "global_step": 482714, "epoch": 2873} {"train_loss": -12.597387313842773, "global_step": 482715, "epoch": 2873} {"train_loss": -11.840178489685059, "global_step": 482716, "epoch": 2873} {"train_loss": -12.315152168273926, "global_step": 482717, "epoch": 2873} {"train_loss": -11.52071475982666, "global_step": 482718, "epoch": 2873} {"train_loss": -12.631733894348145, "global_step": 482719, "epoch": 2873} {"train_loss": -12.071216583251953, "global_step": 482720, "epoch": 2873} {"train_loss": -12.335970878601074, "global_step": 482721, "epoch": 2873} {"train_loss": -12.132110595703125, "global_step": 482722, "epoch": 2873} {"train_loss": -12.405248641967773, "global_step": 482723, "epoch": 2873} {"train_loss": -12.394498825073242, "global_step": 482724, "epoch": 2873} {"train_loss": -12.387401580810547, "global_step": 482725, "epoch": 2873} {"train_loss": -12.527396202087402, "global_step": 482726, "epoch": 2873} {"train_loss": -11.944229125976562, "global_step": 482727, "epoch": 2873} {"train_loss": -12.588043212890625, "global_step": 482728, "epoch": 2873} {"train_loss": -12.379779815673828, "global_step": 482729, "epoch": 2873} {"train_loss": -12.522073745727539, "global_step": 482730, "epoch": 2873} {"train_loss": -12.031841278076172, "global_step": 482731, "epoch": 2873} {"train_loss": -12.589241027832031, "global_step": 482732, "epoch": 2873} {"train_loss": -12.376445770263672, "global_step": 482733, "epoch": 2873} {"train_loss": -12.5744047164917, "global_step": 482734, "epoch": 2873} {"train_loss": -12.654183387756348, "global_step": 482735, "epoch": 2873} {"train_loss": -12.267389297485352, "global_step": 482736, "epoch": 2873} {"train_loss": -12.756914138793945, "global_step": 482737, "epoch": 2873} {"train_loss": -12.514348030090332, "global_step": 482738, "epoch": 2873} {"train_loss": -12.646686553955078, "global_step": 482739, "epoch": 2873} {"train_loss": -12.277098655700684, "global_step": 482740, "epoch": 2873} {"train_loss": -12.583430290222168, "global_step": 482741, "epoch": 2873} {"train_loss": -12.262457847595215, "global_step": 482742, "epoch": 2873} {"train_loss": -12.512535095214844, "global_step": 482743, "epoch": 2873} {"train_loss": -12.483238220214844, "global_step": 482744, "epoch": 2873} {"train_loss": -12.79549503326416, "global_step": 482745, "epoch": 2873} {"train_loss": -12.57158088684082, "global_step": 482746, "epoch": 2873} {"train_loss": -12.41390323638916, "global_step": 482747, "epoch": 2873} {"train_loss": -12.668045043945312, "global_step": 482748, "epoch": 2873} {"train_loss": -12.60228443145752, "global_step": 482749, "epoch": 2873} {"train_loss": -12.753894805908203, "global_step": 482750, "epoch": 2873} {"train_loss": -12.472076416015625, "global_step": 482751, "epoch": 2873} {"train_loss": -12.466913223266602, "global_step": 482752, "epoch": 2873} {"train_loss": -12.764141082763672, "global_step": 482753, "epoch": 2873} {"train_loss": -12.639455795288086, "global_step": 482754, "epoch": 2873} {"train_loss": -12.918941497802734, "global_step": 482755, "epoch": 2873} {"train_loss": -12.622425079345703, "global_step": 482756, "epoch": 2873} {"train_loss": -12.661928176879883, "global_step": 482757, "epoch": 2873} {"train_loss": -12.664979934692383, "global_step": 482758, "epoch": 2873} {"train_loss": -12.51843547821045, "global_step": 482759, "epoch": 2873} {"train_loss": -12.755663871765137, "global_step": 482760, "epoch": 2873} {"train_loss": -12.702295303344727, "global_step": 482761, "epoch": 2873} {"train_loss": -12.621776580810547, "global_step": 482762, "epoch": 2873} {"train_loss": -12.928068161010742, "global_step": 482763, "epoch": 2873} {"train_loss": -12.648046493530273, "global_step": 482764, "epoch": 2873} {"train_loss": -12.85343074798584, "global_step": 482765, "epoch": 2873} {"train_loss": -12.857627868652344, "global_step": 482766, "epoch": 2873} {"train_loss": -12.75377368927002, "global_step": 482767, "epoch": 2873} {"train_loss": -12.6914701461792, "global_step": 482768, "epoch": 2873} {"train_loss": -12.923955917358398, "global_step": 482769, "epoch": 2873} {"train_loss": -12.874825477600098, "global_step": 482770, "epoch": 2873} {"train_loss": -12.742376327514648, "global_step": 482771, "epoch": 2873} {"train_loss": -12.750120162963867, "global_step": 482772, "epoch": 2873} {"train_loss": -12.972476959228516, "global_step": 482773, "epoch": 2873} {"train_loss": -12.632295608520508, "global_step": 482774, "epoch": 2873} {"train_loss": -12.537400245666504, "global_step": 482775, "epoch": 2873} {"train_loss": -12.929303169250488, "global_step": 482776, "epoch": 2873} {"train_loss": -13.053000450134277, "global_step": 482777, "epoch": 2873} {"train_loss": -12.968490600585938, "global_step": 482778, "epoch": 2873} {"train_loss": -12.959371566772461, "global_step": 482779, "epoch": 2873} {"train_loss": -12.974485397338867, "global_step": 482780, "epoch": 2873} {"train_loss": -12.873961448669434, "global_step": 482781, "epoch": 2873} {"train_loss": -12.966909408569336, "global_step": 482782, "epoch": 2873} {"train_loss": -12.998035430908203, "global_step": 482783, "epoch": 2873} {"train_loss": -13.108834266662598, "global_step": 482784, "epoch": 2873} {"train_loss": -13.02743148803711, "global_step": 482785, "epoch": 2873} {"train_loss": -13.078248023986816, "global_step": 482786, "epoch": 2873} {"train_loss": -13.07890510559082, "global_step": 482787, "epoch": 2873} {"train_loss": -13.053787231445312, "global_step": 482788, "epoch": 2873} {"train_loss": -13.123933792114258, "global_step": 482789, "epoch": 2873} {"train_loss": -12.933990478515625, "global_step": 482790, "epoch": 2873} {"train_loss": -12.82599925994873, "global_step": 482791, "epoch": 2873} {"train_loss": -12.89655876159668, "global_step": 482792, "epoch": 2873} {"train_loss": -12.989788055419922, "global_step": 482793, "epoch": 2873} {"train_loss": -13.00838565826416, "global_step": 482794, "epoch": 2873} {"train_loss": -12.973630905151367, "global_step": 482795, "epoch": 2873} {"train_loss": -12.933303833007812, "global_step": 482796, "epoch": 2873} {"train_loss": -13.088645935058594, "global_step": 482797, "epoch": 2873} {"train_loss": -12.833736419677734, "global_step": 482798, "epoch": 2873} {"train_loss": -12.718354225158691, "global_step": 482799, "epoch": 2873} {"train_loss": -12.816527366638184, "global_step": 482800, "epoch": 2873} {"train_loss": -13.05272388458252, "global_step": 482801, "epoch": 2873} {"train_loss": -13.233331680297852, "global_step": 482802, "epoch": 2873} {"train_loss": -13.03404426574707, "global_step": 482803, "epoch": 2873} {"train_loss": -13.068798065185547, "global_step": 482804, "epoch": 2873} {"train_loss": -12.821619033813477, "global_step": 482805, "epoch": 2873} {"train_loss": -12.832889556884766, "global_step": 482806, "epoch": 2873} {"train_loss": -13.199411392211914, "global_step": 482807, "epoch": 2873} {"train_loss": -12.907379150390625, "global_step": 482808, "epoch": 2873} {"train_loss": -12.930103302001953, "global_step": 482809, "epoch": 2873} {"train_loss": -12.524311065673828, "global_step": 482810, "epoch": 2873} {"train_loss": -12.187643051147461, "global_step": 482811, "epoch": 2873} {"train_loss": -12.646851539611816, "global_step": 482812, "epoch": 2873} {"train_loss": -12.897581100463867, "global_step": 482813, "epoch": 2873} {"train_loss": -12.475906372070312, "global_step": 482814, "epoch": 2873} {"train_loss": -11.931181907653809, "global_step": 482815, "epoch": 2873} {"train_loss": -11.690381050109863, "global_step": 482816, "epoch": 2873} {"train_loss": -11.989863395690918, "global_step": 482817, "epoch": 2873} {"train_loss": -12.757793426513672, "global_step": 482818, "epoch": 2873} {"train_loss": -12.737543106079102, "global_step": 482819, "epoch": 2873} {"train_loss": -12.74954605102539, "global_step": 482820, "epoch": 2873} {"train_loss": -12.944421768188477, "global_step": 482821, "epoch": 2873} {"train_loss": -12.88661003112793, "global_step": 482822, "epoch": 2873} {"train_loss": -12.642922401428223, "global_step": 482823, "epoch": 2873} {"train_loss": -12.830154418945312, "global_step": 482824, "epoch": 2873} {"train_loss": -11.853907585144043, "global_step": 482825, "epoch": 2873} {"train_loss": -10.665006637573242, "global_step": 482826, "epoch": 2873} {"train_loss": -10.282181739807129, "global_step": 482827, "epoch": 2873} {"train_loss": -12.039812088012695, "global_step": 482828, "epoch": 2873} {"train_loss": -10.092947006225586, "global_step": 482829, "epoch": 2873} {"train_loss": -9.733375549316406, "global_step": 482830, "epoch": 2873} {"train_loss": -12.259423806553794, "global_step": 482831, "epoch": 2873, "val_loss": 317773.1875} {"train_loss": -10.8804931640625, "global_step": 482832, "epoch": 2874} {"train_loss": -9.37514877319336, "global_step": 482833, "epoch": 2874} {"train_loss": -10.639078140258789, "global_step": 482834, "epoch": 2874} {"train_loss": -10.58667278289795, "global_step": 482835, "epoch": 2874} {"train_loss": -10.947420120239258, "global_step": 482836, "epoch": 2874} {"train_loss": -12.255487442016602, "global_step": 482837, "epoch": 2874} {"train_loss": -11.178760528564453, "global_step": 482838, "epoch": 2874} {"train_loss": -10.69348430633545, "global_step": 482839, "epoch": 2874} {"train_loss": -10.698446273803711, "global_step": 482840, "epoch": 2874} {"train_loss": -10.01115608215332, "global_step": 482841, "epoch": 2874} {"train_loss": -10.251288414001465, "global_step": 482842, "epoch": 2874} {"train_loss": -9.87155818939209, "global_step": 482843, "epoch": 2874} {"train_loss": -10.095434188842773, "global_step": 482844, "epoch": 2874} {"train_loss": -11.002433776855469, "global_step": 482845, "epoch": 2874} {"train_loss": -10.09041690826416, "global_step": 482846, "epoch": 2874} {"train_loss": -9.985105514526367, "global_step": 482847, "epoch": 2874} {"train_loss": -9.957773208618164, "global_step": 482848, "epoch": 2874} {"train_loss": -9.89076042175293, "global_step": 482849, "epoch": 2874} {"train_loss": -10.663707733154297, "global_step": 482850, "epoch": 2874} {"train_loss": -9.596532821655273, "global_step": 482851, "epoch": 2874} {"train_loss": -10.421072006225586, "global_step": 482852, "epoch": 2874} {"train_loss": -8.83622932434082, "global_step": 482853, "epoch": 2874} {"train_loss": -10.849166870117188, "global_step": 482854, "epoch": 2874} {"train_loss": -9.677499771118164, "global_step": 482855, "epoch": 2874} {"train_loss": -10.276534080505371, "global_step": 482856, "epoch": 2874} {"train_loss": -8.761361122131348, "global_step": 482857, "epoch": 2874} {"train_loss": -9.454301834106445, "global_step": 482858, "epoch": 2874} {"train_loss": -11.519609451293945, "global_step": 482859, "epoch": 2874} {"train_loss": -9.515453338623047, "global_step": 482860, "epoch": 2874} {"train_loss": -11.255705833435059, "global_step": 482861, "epoch": 2874} {"train_loss": -10.134039878845215, "global_step": 482862, "epoch": 2874} {"train_loss": -11.501070976257324, "global_step": 482863, "epoch": 2874} {"train_loss": -10.319188117980957, "global_step": 482864, "epoch": 2874} {"train_loss": -11.61275577545166, "global_step": 482865, "epoch": 2874} {"train_loss": -10.696931838989258, "global_step": 482866, "epoch": 2874} {"train_loss": -11.242742538452148, "global_step": 482867, "epoch": 2874} {"train_loss": -11.241320610046387, "global_step": 482868, "epoch": 2874} {"train_loss": -11.506837844848633, "global_step": 482869, "epoch": 2874} {"train_loss": -11.623346328735352, "global_step": 482870, "epoch": 2874} {"train_loss": -11.346196174621582, "global_step": 482871, "epoch": 2874} {"train_loss": -11.670731544494629, "global_step": 482872, "epoch": 2874} {"train_loss": -10.92949104309082, "global_step": 482873, "epoch": 2874} {"train_loss": -12.296160697937012, "global_step": 482874, "epoch": 2874} {"train_loss": -11.833283424377441, "global_step": 482875, "epoch": 2874} {"train_loss": -11.75441837310791, "global_step": 482876, "epoch": 2874} {"train_loss": -11.811318397521973, "global_step": 482877, "epoch": 2874} {"train_loss": -12.12210464477539, "global_step": 482878, "epoch": 2874} {"train_loss": -11.450544357299805, "global_step": 482879, "epoch": 2874} {"train_loss": -12.413776397705078, "global_step": 482880, "epoch": 2874} {"train_loss": -11.975630760192871, "global_step": 482881, "epoch": 2874} {"train_loss": -11.75816535949707, "global_step": 482882, "epoch": 2874} {"train_loss": -12.177276611328125, "global_step": 482883, "epoch": 2874} {"train_loss": -11.945231437683105, "global_step": 482884, "epoch": 2874} {"train_loss": -12.089134216308594, "global_step": 482885, "epoch": 2874} {"train_loss": -12.193714141845703, "global_step": 482886, "epoch": 2874} {"train_loss": -12.245484352111816, "global_step": 482887, "epoch": 2874} {"train_loss": -12.276927947998047, "global_step": 482888, "epoch": 2874} {"train_loss": -12.521004676818848, "global_step": 482889, "epoch": 2874} {"train_loss": -12.285870552062988, "global_step": 482890, "epoch": 2874} {"train_loss": -12.415099143981934, "global_step": 482891, "epoch": 2874} {"train_loss": -12.366854667663574, "global_step": 482892, "epoch": 2874} {"train_loss": -12.281671524047852, "global_step": 482893, "epoch": 2874} {"train_loss": -12.348821640014648, "global_step": 482894, "epoch": 2874} {"train_loss": -12.40771484375, "global_step": 482895, "epoch": 2874} {"train_loss": -12.519914627075195, "global_step": 482896, "epoch": 2874} {"train_loss": -12.331735610961914, "global_step": 482897, "epoch": 2874} {"train_loss": -12.577095985412598, "global_step": 482898, "epoch": 2874} {"train_loss": -12.210334777832031, "global_step": 482899, "epoch": 2874} {"train_loss": -12.67839241027832, "global_step": 482900, "epoch": 2874} {"train_loss": -12.203920364379883, "global_step": 482901, "epoch": 2874} {"train_loss": -12.512863159179688, "global_step": 482902, "epoch": 2874} {"train_loss": -12.32513427734375, "global_step": 482903, "epoch": 2874} {"train_loss": -12.469257354736328, "global_step": 482904, "epoch": 2874} {"train_loss": -12.453676223754883, "global_step": 482905, "epoch": 2874} {"train_loss": -12.54023551940918, "global_step": 482906, "epoch": 2874} {"train_loss": -12.626287460327148, "global_step": 482907, "epoch": 2874} {"train_loss": -11.97518253326416, "global_step": 482908, "epoch": 2874} {"train_loss": -12.599008560180664, "global_step": 482909, "epoch": 2874} {"train_loss": -12.276969909667969, "global_step": 482910, "epoch": 2874} {"train_loss": -12.535171508789062, "global_step": 482911, "epoch": 2874} {"train_loss": -12.458900451660156, "global_step": 482912, "epoch": 2874} {"train_loss": -12.295722961425781, "global_step": 482913, "epoch": 2874} {"train_loss": -12.523663520812988, "global_step": 482914, "epoch": 2874} {"train_loss": -12.634068489074707, "global_step": 482915, "epoch": 2874} {"train_loss": -12.477334976196289, "global_step": 482916, "epoch": 2874} {"train_loss": -12.461217880249023, "global_step": 482917, "epoch": 2874} {"train_loss": -12.437658309936523, "global_step": 482918, "epoch": 2874} {"train_loss": -12.478330612182617, "global_step": 482919, "epoch": 2874} {"train_loss": -12.70101261138916, "global_step": 482920, "epoch": 2874} {"train_loss": -12.586374282836914, "global_step": 482921, "epoch": 2874} {"train_loss": -12.552373886108398, "global_step": 482922, "epoch": 2874} {"train_loss": -12.76237678527832, "global_step": 482923, "epoch": 2874} {"train_loss": -12.644729614257812, "global_step": 482924, "epoch": 2874} {"train_loss": -12.573594093322754, "global_step": 482925, "epoch": 2874} {"train_loss": -12.418750762939453, "global_step": 482926, "epoch": 2874} {"train_loss": -12.783594131469727, "global_step": 482927, "epoch": 2874} {"train_loss": -12.629158020019531, "global_step": 482928, "epoch": 2874} {"train_loss": -12.823677062988281, "global_step": 482929, "epoch": 2874} {"train_loss": -12.667452812194824, "global_step": 482930, "epoch": 2874} {"train_loss": -12.693740844726562, "global_step": 482931, "epoch": 2874} {"train_loss": -12.746212005615234, "global_step": 482932, "epoch": 2874} {"train_loss": -12.666868209838867, "global_step": 482933, "epoch": 2874} {"train_loss": -12.54684829711914, "global_step": 482934, "epoch": 2874} {"train_loss": -12.604301452636719, "global_step": 482935, "epoch": 2874} {"train_loss": -12.84626579284668, "global_step": 482936, "epoch": 2874} {"train_loss": -12.6700439453125, "global_step": 482937, "epoch": 2874} {"train_loss": -12.748359680175781, "global_step": 482938, "epoch": 2874} {"train_loss": -12.596870422363281, "global_step": 482939, "epoch": 2874} {"train_loss": -12.805614471435547, "global_step": 482940, "epoch": 2874} {"train_loss": -12.699762344360352, "global_step": 482941, "epoch": 2874} {"train_loss": -12.94802188873291, "global_step": 482942, "epoch": 2874} {"train_loss": -12.726483345031738, "global_step": 482943, "epoch": 2874} {"train_loss": -12.678239822387695, "global_step": 482944, "epoch": 2874} {"train_loss": -12.700980186462402, "global_step": 482945, "epoch": 2874} {"train_loss": -12.789322853088379, "global_step": 482946, "epoch": 2874} {"train_loss": -12.841669082641602, "global_step": 482947, "epoch": 2874} {"train_loss": -12.705766677856445, "global_step": 482948, "epoch": 2874} {"train_loss": -12.627995491027832, "global_step": 482949, "epoch": 2874} {"train_loss": -13.065155982971191, "global_step": 482950, "epoch": 2874} {"train_loss": -12.769111633300781, "global_step": 482951, "epoch": 2874} {"train_loss": -12.87492561340332, "global_step": 482952, "epoch": 2874} {"train_loss": -12.883716583251953, "global_step": 482953, "epoch": 2874} {"train_loss": -12.953962326049805, "global_step": 482954, "epoch": 2874} {"train_loss": -12.892984390258789, "global_step": 482955, "epoch": 2874} {"train_loss": -12.888664245605469, "global_step": 482956, "epoch": 2874} {"train_loss": -12.803986549377441, "global_step": 482957, "epoch": 2874} {"train_loss": -12.830524444580078, "global_step": 482958, "epoch": 2874} {"train_loss": -12.987701416015625, "global_step": 482959, "epoch": 2874} {"train_loss": -12.696823120117188, "global_step": 482960, "epoch": 2874} {"train_loss": -12.767520904541016, "global_step": 482961, "epoch": 2874} {"train_loss": -12.941766738891602, "global_step": 482962, "epoch": 2874} {"train_loss": -12.861774444580078, "global_step": 482963, "epoch": 2874} {"train_loss": -12.582913398742676, "global_step": 482964, "epoch": 2874} {"train_loss": -12.92236614227295, "global_step": 482965, "epoch": 2874} {"train_loss": -12.751140594482422, "global_step": 482966, "epoch": 2874} {"train_loss": -12.731710433959961, "global_step": 482967, "epoch": 2874} {"train_loss": -12.764140129089355, "global_step": 482968, "epoch": 2874} {"train_loss": -12.566290855407715, "global_step": 482969, "epoch": 2874} {"train_loss": -12.481622695922852, "global_step": 482970, "epoch": 2874} {"train_loss": -12.738153457641602, "global_step": 482971, "epoch": 2874} {"train_loss": -12.80521297454834, "global_step": 482972, "epoch": 2874} {"train_loss": -12.589866638183594, "global_step": 482973, "epoch": 2874} {"train_loss": -12.734628677368164, "global_step": 482974, "epoch": 2874} {"train_loss": -12.81002426147461, "global_step": 482975, "epoch": 2874} {"train_loss": -12.616362571716309, "global_step": 482976, "epoch": 2874} {"train_loss": -12.529932022094727, "global_step": 482977, "epoch": 2874} {"train_loss": -12.999276161193848, "global_step": 482978, "epoch": 2874} {"train_loss": -12.664026260375977, "global_step": 482979, "epoch": 2874} {"train_loss": -12.145770072937012, "global_step": 482980, "epoch": 2874} {"train_loss": -12.212017059326172, "global_step": 482981, "epoch": 2874} {"train_loss": -12.623024940490723, "global_step": 482982, "epoch": 2874} {"train_loss": -11.933051109313965, "global_step": 482983, "epoch": 2874} {"train_loss": -12.102334976196289, "global_step": 482984, "epoch": 2874} {"train_loss": -11.860424041748047, "global_step": 482985, "epoch": 2874} {"train_loss": -12.134742736816406, "global_step": 482986, "epoch": 2874} {"train_loss": -12.246162414550781, "global_step": 482987, "epoch": 2874} {"train_loss": -11.780801773071289, "global_step": 482988, "epoch": 2874} {"train_loss": -12.781656265258789, "global_step": 482989, "epoch": 2874} {"train_loss": -11.827859878540039, "global_step": 482990, "epoch": 2874} {"train_loss": -11.905527114868164, "global_step": 482991, "epoch": 2874} {"train_loss": -11.543527603149414, "global_step": 482992, "epoch": 2874} {"train_loss": -12.511597633361816, "global_step": 482993, "epoch": 2874} {"train_loss": -10.829887390136719, "global_step": 482994, "epoch": 2874} {"train_loss": -12.393792152404785, "global_step": 482995, "epoch": 2874} {"train_loss": -11.360565185546875, "global_step": 482996, "epoch": 2874} {"train_loss": -11.68867301940918, "global_step": 482997, "epoch": 2874} {"train_loss": -10.81240463256836, "global_step": 482998, "epoch": 2874} {"train_loss": -11.97807548727308, "global_step": 482999, "epoch": 2874, "val_loss": 318540.5} {"train_loss": -9.607752799987793, "global_step": 483000, "epoch": 2875} {"train_loss": -11.329439163208008, "global_step": 483001, "epoch": 2875} {"train_loss": -10.930767059326172, "global_step": 483002, "epoch": 2875} {"train_loss": -11.811050415039062, "global_step": 483003, "epoch": 2875} {"train_loss": -10.678641319274902, "global_step": 483004, "epoch": 2875} {"train_loss": -11.324089050292969, "global_step": 483005, "epoch": 2875} {"train_loss": -10.413393020629883, "global_step": 483006, "epoch": 2875} {"train_loss": -9.880510330200195, "global_step": 483007, "epoch": 2875} {"train_loss": -9.169268608093262, "global_step": 483008, "epoch": 2875} {"train_loss": -9.168758392333984, "global_step": 483009, "epoch": 2875} {"train_loss": -8.919103622436523, "global_step": 483010, "epoch": 2875} {"train_loss": -10.269979476928711, "global_step": 483011, "epoch": 2875} {"train_loss": -10.065893173217773, "global_step": 483012, "epoch": 2875} {"train_loss": -9.445555686950684, "global_step": 483013, "epoch": 2875} {"train_loss": -10.20147705078125, "global_step": 483014, "epoch": 2875} {"train_loss": -11.456014633178711, "global_step": 483015, "epoch": 2875} {"train_loss": -10.534429550170898, "global_step": 483016, "epoch": 2875} {"train_loss": -11.336423873901367, "global_step": 483017, "epoch": 2875} {"train_loss": -11.457301139831543, "global_step": 483018, "epoch": 2875} {"train_loss": -10.872238159179688, "global_step": 483019, "epoch": 2875} {"train_loss": -11.271829605102539, "global_step": 483020, "epoch": 2875} {"train_loss": -10.833175659179688, "global_step": 483021, "epoch": 2875} {"train_loss": -11.321977615356445, "global_step": 483022, "epoch": 2875} {"train_loss": -11.566995620727539, "global_step": 483023, "epoch": 2875} {"train_loss": -11.179193496704102, "global_step": 483024, "epoch": 2875} {"train_loss": -11.673763275146484, "global_step": 483025, "epoch": 2875} {"train_loss": -11.265425682067871, "global_step": 483026, "epoch": 2875} {"train_loss": -11.171130180358887, "global_step": 483027, "epoch": 2875} {"train_loss": -11.244523048400879, "global_step": 483028, "epoch": 2875} {"train_loss": -10.989473342895508, "global_step": 483029, "epoch": 2875} {"train_loss": -10.38355827331543, "global_step": 483030, "epoch": 2875} {"train_loss": -9.697010040283203, "global_step": 483031, "epoch": 2875} {"train_loss": -10.11130142211914, "global_step": 483032, "epoch": 2875} {"train_loss": -11.835562705993652, "global_step": 483033, "epoch": 2875} {"train_loss": -9.774247169494629, "global_step": 483034, "epoch": 2875} {"train_loss": -10.9421968460083, "global_step": 483035, "epoch": 2875} {"train_loss": -10.942028045654297, "global_step": 483036, "epoch": 2875} {"train_loss": -10.820186614990234, "global_step": 483037, "epoch": 2875} {"train_loss": -12.071701049804688, "global_step": 483038, "epoch": 2875} {"train_loss": -10.635055541992188, "global_step": 483039, "epoch": 2875} {"train_loss": -11.268413543701172, "global_step": 483040, "epoch": 2875} {"train_loss": -11.380424499511719, "global_step": 483041, "epoch": 2875} {"train_loss": -10.445134162902832, "global_step": 483042, "epoch": 2875} {"train_loss": -11.941190719604492, "global_step": 483043, "epoch": 2875} {"train_loss": -10.566600799560547, "global_step": 483044, "epoch": 2875} {"train_loss": -11.832417488098145, "global_step": 483045, "epoch": 2875} {"train_loss": -11.583942413330078, "global_step": 483046, "epoch": 2875} {"train_loss": -11.475886344909668, "global_step": 483047, "epoch": 2875} {"train_loss": -12.142183303833008, "global_step": 483048, "epoch": 2875} {"train_loss": -11.66661548614502, "global_step": 483049, "epoch": 2875} {"train_loss": -11.862058639526367, "global_step": 483050, "epoch": 2875} {"train_loss": -12.054231643676758, "global_step": 483051, "epoch": 2875} {"train_loss": -11.831308364868164, "global_step": 483052, "epoch": 2875} {"train_loss": -12.260831832885742, "global_step": 483053, "epoch": 2875} {"train_loss": -11.996269226074219, "global_step": 483054, "epoch": 2875} {"train_loss": -11.813583374023438, "global_step": 483055, "epoch": 2875} {"train_loss": -12.274652481079102, "global_step": 483056, "epoch": 2875} {"train_loss": -12.072113037109375, "global_step": 483057, "epoch": 2875} {"train_loss": -12.335067749023438, "global_step": 483058, "epoch": 2875} {"train_loss": -12.056203842163086, "global_step": 483059, "epoch": 2875} {"train_loss": -12.07745361328125, "global_step": 483060, "epoch": 2875} {"train_loss": -12.027076721191406, "global_step": 483061, "epoch": 2875} {"train_loss": -12.048738479614258, "global_step": 483062, "epoch": 2875} {"train_loss": -12.308337211608887, "global_step": 483063, "epoch": 2875} {"train_loss": -12.026815414428711, "global_step": 483064, "epoch": 2875} {"train_loss": -12.389430046081543, "global_step": 483065, "epoch": 2875} {"train_loss": -12.139139175415039, "global_step": 483066, "epoch": 2875} {"train_loss": -12.453203201293945, "global_step": 483067, "epoch": 2875} {"train_loss": -12.325738906860352, "global_step": 483068, "epoch": 2875} {"train_loss": -11.98115348815918, "global_step": 483069, "epoch": 2875} {"train_loss": -12.420740127563477, "global_step": 483070, "epoch": 2875} {"train_loss": -12.40920639038086, "global_step": 483071, "epoch": 2875} {"train_loss": -12.419210433959961, "global_step": 483072, "epoch": 2875} {"train_loss": -12.137381553649902, "global_step": 483073, "epoch": 2875} {"train_loss": -12.34837532043457, "global_step": 483074, "epoch": 2875} {"train_loss": -12.425874710083008, "global_step": 483075, "epoch": 2875} {"train_loss": -12.450630187988281, "global_step": 483076, "epoch": 2875} {"train_loss": -12.496516227722168, "global_step": 483077, "epoch": 2875} {"train_loss": -12.226896286010742, "global_step": 483078, "epoch": 2875} {"train_loss": -12.136219024658203, "global_step": 483079, "epoch": 2875} {"train_loss": -12.641035079956055, "global_step": 483080, "epoch": 2875} {"train_loss": -12.247244834899902, "global_step": 483081, "epoch": 2875} {"train_loss": -12.537161827087402, "global_step": 483082, "epoch": 2875} {"train_loss": -12.260113716125488, "global_step": 483083, "epoch": 2875} {"train_loss": -12.370223045349121, "global_step": 483084, "epoch": 2875} {"train_loss": -12.324986457824707, "global_step": 483085, "epoch": 2875} {"train_loss": -12.322759628295898, "global_step": 483086, "epoch": 2875} {"train_loss": -12.332622528076172, "global_step": 483087, "epoch": 2875} {"train_loss": -12.50046157836914, "global_step": 483088, "epoch": 2875} {"train_loss": -12.62257194519043, "global_step": 483089, "epoch": 2875} {"train_loss": -12.727931022644043, "global_step": 483090, "epoch": 2875} {"train_loss": -12.709294319152832, "global_step": 483091, "epoch": 2875} {"train_loss": -12.519926071166992, "global_step": 483092, "epoch": 2875} {"train_loss": -12.570749282836914, "global_step": 483093, "epoch": 2875} {"train_loss": -12.7575044631958, "global_step": 483094, "epoch": 2875} {"train_loss": -12.734560012817383, "global_step": 483095, "epoch": 2875} {"train_loss": -12.6246976852417, "global_step": 483096, "epoch": 2875} {"train_loss": -12.811239242553711, "global_step": 483097, "epoch": 2875} {"train_loss": -12.573982238769531, "global_step": 483098, "epoch": 2875} {"train_loss": -12.713113784790039, "global_step": 483099, "epoch": 2875} {"train_loss": -12.600403785705566, "global_step": 483100, "epoch": 2875} {"train_loss": -12.765920639038086, "global_step": 483101, "epoch": 2875} {"train_loss": -12.73918342590332, "global_step": 483102, "epoch": 2875} {"train_loss": -12.592142105102539, "global_step": 483103, "epoch": 2875} {"train_loss": -12.789552688598633, "global_step": 483104, "epoch": 2875} {"train_loss": -12.713929176330566, "global_step": 483105, "epoch": 2875} {"train_loss": -12.803874969482422, "global_step": 483106, "epoch": 2875} {"train_loss": -12.808366775512695, "global_step": 483107, "epoch": 2875} {"train_loss": -12.739262580871582, "global_step": 483108, "epoch": 2875} {"train_loss": -12.548593521118164, "global_step": 483109, "epoch": 2875} {"train_loss": -12.81836223602295, "global_step": 483110, "epoch": 2875} {"train_loss": -12.716862678527832, "global_step": 483111, "epoch": 2875} {"train_loss": -12.91115951538086, "global_step": 483112, "epoch": 2875} {"train_loss": -12.96049976348877, "global_step": 483113, "epoch": 2875} {"train_loss": -12.843408584594727, "global_step": 483114, "epoch": 2875} {"train_loss": -12.73185920715332, "global_step": 483115, "epoch": 2875} {"train_loss": -12.863468170166016, "global_step": 483116, "epoch": 2875} {"train_loss": -12.896472930908203, "global_step": 483117, "epoch": 2875} {"train_loss": -12.811389923095703, "global_step": 483118, "epoch": 2875} {"train_loss": -13.058174133300781, "global_step": 483119, "epoch": 2875} {"train_loss": -12.816530227661133, "global_step": 483120, "epoch": 2875} {"train_loss": -12.7913818359375, "global_step": 483121, "epoch": 2875} {"train_loss": -12.765640258789062, "global_step": 483122, "epoch": 2875} {"train_loss": -13.038561820983887, "global_step": 483123, "epoch": 2875} {"train_loss": -12.53430461883545, "global_step": 483124, "epoch": 2875} {"train_loss": -12.975207328796387, "global_step": 483125, "epoch": 2875} {"train_loss": -12.887038230895996, "global_step": 483126, "epoch": 2875} {"train_loss": -12.783628463745117, "global_step": 483127, "epoch": 2875} {"train_loss": -12.850910186767578, "global_step": 483128, "epoch": 2875} {"train_loss": -12.86474609375, "global_step": 483129, "epoch": 2875} {"train_loss": -12.80931282043457, "global_step": 483130, "epoch": 2875} {"train_loss": -12.788707733154297, "global_step": 483131, "epoch": 2875} {"train_loss": -12.707002639770508, "global_step": 483132, "epoch": 2875} {"train_loss": -12.958892822265625, "global_step": 483133, "epoch": 2875} {"train_loss": -12.958755493164062, "global_step": 483134, "epoch": 2875} {"train_loss": -12.732074737548828, "global_step": 483135, "epoch": 2875} {"train_loss": -12.872444152832031, "global_step": 483136, "epoch": 2875} {"train_loss": -12.955944061279297, "global_step": 483137, "epoch": 2875} {"train_loss": -12.780101776123047, "global_step": 483138, "epoch": 2875} {"train_loss": -12.679895401000977, "global_step": 483139, "epoch": 2875} {"train_loss": -13.01826286315918, "global_step": 483140, "epoch": 2875} {"train_loss": -12.76020622253418, "global_step": 483141, "epoch": 2875} {"train_loss": -12.776763916015625, "global_step": 483142, "epoch": 2875} {"train_loss": -12.83497428894043, "global_step": 483143, "epoch": 2875} {"train_loss": -12.83531379699707, "global_step": 483144, "epoch": 2875} {"train_loss": -12.818230628967285, "global_step": 483145, "epoch": 2875} {"train_loss": -12.90665054321289, "global_step": 483146, "epoch": 2875} {"train_loss": -12.827922821044922, "global_step": 483147, "epoch": 2875} {"train_loss": -12.782702445983887, "global_step": 483148, "epoch": 2875} {"train_loss": -13.013017654418945, "global_step": 483149, "epoch": 2875} {"train_loss": -12.90636920928955, "global_step": 483150, "epoch": 2875} {"train_loss": -12.768379211425781, "global_step": 483151, "epoch": 2875} {"train_loss": -12.881153106689453, "global_step": 483152, "epoch": 2875} {"train_loss": -12.818061828613281, "global_step": 483153, "epoch": 2875} {"train_loss": -13.080818176269531, "global_step": 483154, "epoch": 2875} {"train_loss": -12.942037582397461, "global_step": 483155, "epoch": 2875} {"train_loss": -12.963432312011719, "global_step": 483156, "epoch": 2875} {"train_loss": -12.652301788330078, "global_step": 483157, "epoch": 2875} {"train_loss": -12.872298240661621, "global_step": 483158, "epoch": 2875} {"train_loss": -12.86812686920166, "global_step": 483159, "epoch": 2875} {"train_loss": -12.850912094116211, "global_step": 483160, "epoch": 2875} {"train_loss": -12.96999740600586, "global_step": 483161, "epoch": 2875} {"train_loss": -13.071168899536133, "global_step": 483162, "epoch": 2875} {"train_loss": -12.868497848510742, "global_step": 483163, "epoch": 2875} {"train_loss": -12.643856048583984, "global_step": 483164, "epoch": 2875} {"train_loss": -13.020442962646484, "global_step": 483165, "epoch": 2875} {"train_loss": -12.759936332702637, "global_step": 483166, "epoch": 2875} {"train_loss": -12.094007304736547, "global_step": 483167, "epoch": 2875, "val_loss": 312827.09375, "train_action_mse_error": 1.396962285041809} {"train_loss": -11.02720832824707, "global_step": 483168, "epoch": 2876} {"train_loss": -12.624176025390625, "global_step": 483169, "epoch": 2876} {"train_loss": -12.903873443603516, "global_step": 483170, "epoch": 2876} {"train_loss": -12.598941802978516, "global_step": 483171, "epoch": 2876} {"train_loss": -12.565673828125, "global_step": 483172, "epoch": 2876} {"train_loss": -12.286861419677734, "global_step": 483173, "epoch": 2876} {"train_loss": -12.168647766113281, "global_step": 483174, "epoch": 2876} {"train_loss": -12.68150520324707, "global_step": 483175, "epoch": 2876} {"train_loss": -12.37127685546875, "global_step": 483176, "epoch": 2876} {"train_loss": -12.552603721618652, "global_step": 483177, "epoch": 2876} {"train_loss": -11.624435424804688, "global_step": 483178, "epoch": 2876} {"train_loss": -12.159638404846191, "global_step": 483179, "epoch": 2876} {"train_loss": -10.714921951293945, "global_step": 483180, "epoch": 2876} {"train_loss": -12.005464553833008, "global_step": 483181, "epoch": 2876} {"train_loss": -11.80129623413086, "global_step": 483182, "epoch": 2876} {"train_loss": -11.184915542602539, "global_step": 483183, "epoch": 2876} {"train_loss": -12.011983871459961, "global_step": 483184, "epoch": 2876} {"train_loss": -11.531295776367188, "global_step": 483185, "epoch": 2876} {"train_loss": -11.17197036743164, "global_step": 483186, "epoch": 2876} {"train_loss": -11.47722053527832, "global_step": 483187, "epoch": 2876} {"train_loss": -11.811789512634277, "global_step": 483188, "epoch": 2876} {"train_loss": -9.493486404418945, "global_step": 483189, "epoch": 2876} {"train_loss": -9.3696928024292, "global_step": 483190, "epoch": 2876} {"train_loss": -10.446138381958008, "global_step": 483191, "epoch": 2876} {"train_loss": -10.571211814880371, "global_step": 483192, "epoch": 2876} {"train_loss": -10.63492202758789, "global_step": 483193, "epoch": 2876} {"train_loss": -10.530658721923828, "global_step": 483194, "epoch": 2876} {"train_loss": -11.09196662902832, "global_step": 483195, "epoch": 2876} {"train_loss": -11.409440040588379, "global_step": 483196, "epoch": 2876} {"train_loss": -10.772808074951172, "global_step": 483197, "epoch": 2876} {"train_loss": -11.414970397949219, "global_step": 483198, "epoch": 2876} {"train_loss": -10.868570327758789, "global_step": 483199, "epoch": 2876} {"train_loss": -11.427963256835938, "global_step": 483200, "epoch": 2876} {"train_loss": -11.28439712524414, "global_step": 483201, "epoch": 2876} {"train_loss": -11.087900161743164, "global_step": 483202, "epoch": 2876} {"train_loss": -10.552347183227539, "global_step": 483203, "epoch": 2876} {"train_loss": -10.70877456665039, "global_step": 483204, "epoch": 2876} {"train_loss": -10.766165733337402, "global_step": 483205, "epoch": 2876} {"train_loss": -9.321767807006836, "global_step": 483206, "epoch": 2876} {"train_loss": -11.387864112854004, "global_step": 483207, "epoch": 2876} {"train_loss": -8.499879837036133, "global_step": 483208, "epoch": 2876} {"train_loss": -9.327234268188477, "global_step": 483209, "epoch": 2876} {"train_loss": -9.980972290039062, "global_step": 483210, "epoch": 2876} {"train_loss": -10.392435073852539, "global_step": 483211, "epoch": 2876} {"train_loss": -9.472349166870117, "global_step": 483212, "epoch": 2876} {"train_loss": -10.058314323425293, "global_step": 483213, "epoch": 2876} {"train_loss": -9.595884323120117, "global_step": 483214, "epoch": 2876} {"train_loss": -9.424291610717773, "global_step": 483215, "epoch": 2876} {"train_loss": -10.908919334411621, "global_step": 483216, "epoch": 2876} {"train_loss": -10.094748497009277, "global_step": 483217, "epoch": 2876} {"train_loss": -10.395153045654297, "global_step": 483218, "epoch": 2876} {"train_loss": -11.34496021270752, "global_step": 483219, "epoch": 2876} {"train_loss": -9.758045196533203, "global_step": 483220, "epoch": 2876} {"train_loss": -10.713836669921875, "global_step": 483221, "epoch": 2876} {"train_loss": -10.550936698913574, "global_step": 483222, "epoch": 2876} {"train_loss": -10.352558135986328, "global_step": 483223, "epoch": 2876} {"train_loss": -11.361616134643555, "global_step": 483224, "epoch": 2876} {"train_loss": -10.95511245727539, "global_step": 483225, "epoch": 2876} {"train_loss": -11.482088088989258, "global_step": 483226, "epoch": 2876} {"train_loss": -11.622697830200195, "global_step": 483227, "epoch": 2876} {"train_loss": -11.581463813781738, "global_step": 483228, "epoch": 2876} {"train_loss": -11.430658340454102, "global_step": 483229, "epoch": 2876} {"train_loss": -11.714639663696289, "global_step": 483230, "epoch": 2876} {"train_loss": -11.431598663330078, "global_step": 483231, "epoch": 2876} {"train_loss": -11.581833839416504, "global_step": 483232, "epoch": 2876} {"train_loss": -11.761795043945312, "global_step": 483233, "epoch": 2876} {"train_loss": -10.97192096710205, "global_step": 483234, "epoch": 2876} {"train_loss": -11.335832595825195, "global_step": 483235, "epoch": 2876} {"train_loss": -11.415769577026367, "global_step": 483236, "epoch": 2876} {"train_loss": -10.929325103759766, "global_step": 483237, "epoch": 2876} {"train_loss": -12.103767395019531, "global_step": 483238, "epoch": 2876} {"train_loss": -11.272321701049805, "global_step": 483239, "epoch": 2876} {"train_loss": -12.228693008422852, "global_step": 483240, "epoch": 2876} {"train_loss": -11.586305618286133, "global_step": 483241, "epoch": 2876} {"train_loss": -11.907959938049316, "global_step": 483242, "epoch": 2876} {"train_loss": -11.718338966369629, "global_step": 483243, "epoch": 2876} {"train_loss": -12.245437622070312, "global_step": 483244, "epoch": 2876} {"train_loss": -11.85584831237793, "global_step": 483245, "epoch": 2876} {"train_loss": -12.210646629333496, "global_step": 483246, "epoch": 2876} {"train_loss": -11.801837921142578, "global_step": 483247, "epoch": 2876} {"train_loss": -11.860352516174316, "global_step": 483248, "epoch": 2876} {"train_loss": -11.984806060791016, "global_step": 483249, "epoch": 2876} {"train_loss": -12.244938850402832, "global_step": 483250, "epoch": 2876} {"train_loss": -12.120296478271484, "global_step": 483251, "epoch": 2876} {"train_loss": -11.74142074584961, "global_step": 483252, "epoch": 2876} {"train_loss": -11.92597770690918, "global_step": 483253, "epoch": 2876} {"train_loss": -11.951476097106934, "global_step": 483254, "epoch": 2876} {"train_loss": -12.333511352539062, "global_step": 483255, "epoch": 2876} {"train_loss": -12.338006019592285, "global_step": 483256, "epoch": 2876} {"train_loss": -12.127335548400879, "global_step": 483257, "epoch": 2876} {"train_loss": -12.274782180786133, "global_step": 483258, "epoch": 2876} {"train_loss": -12.238569259643555, "global_step": 483259, "epoch": 2876} {"train_loss": -12.477715492248535, "global_step": 483260, "epoch": 2876} {"train_loss": -12.009828567504883, "global_step": 483261, "epoch": 2876} {"train_loss": -12.342927932739258, "global_step": 483262, "epoch": 2876} {"train_loss": -12.294923782348633, "global_step": 483263, "epoch": 2876} {"train_loss": -12.441631317138672, "global_step": 483264, "epoch": 2876} {"train_loss": -12.094254493713379, "global_step": 483265, "epoch": 2876} {"train_loss": -12.453958511352539, "global_step": 483266, "epoch": 2876} {"train_loss": -12.46803092956543, "global_step": 483267, "epoch": 2876} {"train_loss": -12.519777297973633, "global_step": 483268, "epoch": 2876} {"train_loss": -12.504194259643555, "global_step": 483269, "epoch": 2876} {"train_loss": -12.182833671569824, "global_step": 483270, "epoch": 2876} {"train_loss": -12.66054916381836, "global_step": 483271, "epoch": 2876} {"train_loss": -12.427446365356445, "global_step": 483272, "epoch": 2876} {"train_loss": -12.433745384216309, "global_step": 483273, "epoch": 2876} {"train_loss": -12.396711349487305, "global_step": 483274, "epoch": 2876} {"train_loss": -12.656370162963867, "global_step": 483275, "epoch": 2876} {"train_loss": -12.533585548400879, "global_step": 483276, "epoch": 2876} {"train_loss": -12.486446380615234, "global_step": 483277, "epoch": 2876} {"train_loss": -12.473504066467285, "global_step": 483278, "epoch": 2876} {"train_loss": -12.566323280334473, "global_step": 483279, "epoch": 2876} {"train_loss": -12.38931655883789, "global_step": 483280, "epoch": 2876} {"train_loss": -12.431936264038086, "global_step": 483281, "epoch": 2876} {"train_loss": -12.150030136108398, "global_step": 483282, "epoch": 2876} {"train_loss": -12.606714248657227, "global_step": 483283, "epoch": 2876} {"train_loss": -12.33816909790039, "global_step": 483284, "epoch": 2876} {"train_loss": -12.513604164123535, "global_step": 483285, "epoch": 2876} {"train_loss": -12.462936401367188, "global_step": 483286, "epoch": 2876} {"train_loss": -12.396446228027344, "global_step": 483287, "epoch": 2876} {"train_loss": -12.737876892089844, "global_step": 483288, "epoch": 2876} {"train_loss": -12.600223541259766, "global_step": 483289, "epoch": 2876} {"train_loss": -12.693729400634766, "global_step": 483290, "epoch": 2876} {"train_loss": -12.590276718139648, "global_step": 483291, "epoch": 2876} {"train_loss": -12.469844818115234, "global_step": 483292, "epoch": 2876} {"train_loss": -12.66200065612793, "global_step": 483293, "epoch": 2876} {"train_loss": -12.520943641662598, "global_step": 483294, "epoch": 2876} {"train_loss": -12.529048919677734, "global_step": 483295, "epoch": 2876} {"train_loss": -12.5825834274292, "global_step": 483296, "epoch": 2876} {"train_loss": -12.79109001159668, "global_step": 483297, "epoch": 2876} {"train_loss": -12.481950759887695, "global_step": 483298, "epoch": 2876} {"train_loss": -12.657930374145508, "global_step": 483299, "epoch": 2876} {"train_loss": -12.730269432067871, "global_step": 483300, "epoch": 2876} {"train_loss": -12.765352249145508, "global_step": 483301, "epoch": 2876} {"train_loss": -12.74443244934082, "global_step": 483302, "epoch": 2876} {"train_loss": -12.57421875, "global_step": 483303, "epoch": 2876} {"train_loss": -12.67375373840332, "global_step": 483304, "epoch": 2876} {"train_loss": -12.806982040405273, "global_step": 483305, "epoch": 2876} {"train_loss": -12.866317749023438, "global_step": 483306, "epoch": 2876} {"train_loss": -12.835899353027344, "global_step": 483307, "epoch": 2876} {"train_loss": -12.438105583190918, "global_step": 483308, "epoch": 2876} {"train_loss": -12.940180778503418, "global_step": 483309, "epoch": 2876} {"train_loss": -12.624238014221191, "global_step": 483310, "epoch": 2876} {"train_loss": -12.683297157287598, "global_step": 483311, "epoch": 2876} {"train_loss": -12.786523818969727, "global_step": 483312, "epoch": 2876} {"train_loss": -12.478921890258789, "global_step": 483313, "epoch": 2876} {"train_loss": -12.84305477142334, "global_step": 483314, "epoch": 2876} {"train_loss": -12.556829452514648, "global_step": 483315, "epoch": 2876} {"train_loss": -13.051886558532715, "global_step": 483316, "epoch": 2876} {"train_loss": -12.963508605957031, "global_step": 483317, "epoch": 2876} {"train_loss": -12.69239330291748, "global_step": 483318, "epoch": 2876} {"train_loss": -12.937166213989258, "global_step": 483319, "epoch": 2876} {"train_loss": -12.853548049926758, "global_step": 483320, "epoch": 2876} {"train_loss": -12.708765029907227, "global_step": 483321, "epoch": 2876} {"train_loss": -12.900650978088379, "global_step": 483322, "epoch": 2876} {"train_loss": -12.941753387451172, "global_step": 483323, "epoch": 2876} {"train_loss": -12.760072708129883, "global_step": 483324, "epoch": 2876} {"train_loss": -12.879558563232422, "global_step": 483325, "epoch": 2876} {"train_loss": -12.845922470092773, "global_step": 483326, "epoch": 2876} {"train_loss": -13.01312255859375, "global_step": 483327, "epoch": 2876} {"train_loss": -12.692888259887695, "global_step": 483328, "epoch": 2876} {"train_loss": -12.789613723754883, "global_step": 483329, "epoch": 2876} {"train_loss": -13.02203369140625, "global_step": 483330, "epoch": 2876} {"train_loss": -12.766338348388672, "global_step": 483331, "epoch": 2876} {"train_loss": -12.938812255859375, "global_step": 483332, "epoch": 2876} {"train_loss": -12.912611961364746, "global_step": 483333, "epoch": 2876} {"train_loss": -12.472159385681152, "global_step": 483334, "epoch": 2876} {"train_loss": -11.89573853924161, "global_step": 483335, "epoch": 2876, "val_loss": 315385.8125} {"train_loss": -12.637378692626953, "global_step": 483336, "epoch": 2877} {"train_loss": -12.237993240356445, "global_step": 483337, "epoch": 2877} {"train_loss": -12.935831069946289, "global_step": 483338, "epoch": 2877} {"train_loss": -12.162410736083984, "global_step": 483339, "epoch": 2877} {"train_loss": -12.314952850341797, "global_step": 483340, "epoch": 2877} {"train_loss": -11.936002731323242, "global_step": 483341, "epoch": 2877} {"train_loss": -12.44849967956543, "global_step": 483342, "epoch": 2877} {"train_loss": -11.046926498413086, "global_step": 483343, "epoch": 2877} {"train_loss": -11.305829048156738, "global_step": 483344, "epoch": 2877} {"train_loss": -11.299783706665039, "global_step": 483345, "epoch": 2877} {"train_loss": -12.027361869812012, "global_step": 483346, "epoch": 2877} {"train_loss": -12.206704139709473, "global_step": 483347, "epoch": 2877} {"train_loss": -11.459009170532227, "global_step": 483348, "epoch": 2877} {"train_loss": -12.527021408081055, "global_step": 483349, "epoch": 2877} {"train_loss": -12.102627754211426, "global_step": 483350, "epoch": 2877} {"train_loss": -12.16092300415039, "global_step": 483351, "epoch": 2877} {"train_loss": -12.676963806152344, "global_step": 483352, "epoch": 2877} {"train_loss": -12.710759162902832, "global_step": 483353, "epoch": 2877} {"train_loss": -11.93424129486084, "global_step": 483354, "epoch": 2877} {"train_loss": -12.418479919433594, "global_step": 483355, "epoch": 2877} {"train_loss": -12.418692588806152, "global_step": 483356, "epoch": 2877} {"train_loss": -12.612505912780762, "global_step": 483357, "epoch": 2877} {"train_loss": -12.882894515991211, "global_step": 483358, "epoch": 2877} {"train_loss": -12.336430549621582, "global_step": 483359, "epoch": 2877} {"train_loss": -11.816267013549805, "global_step": 483360, "epoch": 2877} {"train_loss": -12.561197280883789, "global_step": 483361, "epoch": 2877} {"train_loss": -12.391712188720703, "global_step": 483362, "epoch": 2877} {"train_loss": -12.336274147033691, "global_step": 483363, "epoch": 2877} {"train_loss": -12.198053359985352, "global_step": 483364, "epoch": 2877} {"train_loss": -11.436630249023438, "global_step": 483365, "epoch": 2877} {"train_loss": -12.298320770263672, "global_step": 483366, "epoch": 2877} {"train_loss": -12.304880142211914, "global_step": 483367, "epoch": 2877} {"train_loss": -11.933551788330078, "global_step": 483368, "epoch": 2877} {"train_loss": -12.30328369140625, "global_step": 483369, "epoch": 2877} {"train_loss": -12.19228458404541, "global_step": 483370, "epoch": 2877} {"train_loss": -11.633508682250977, "global_step": 483371, "epoch": 2877} {"train_loss": -11.91250228881836, "global_step": 483372, "epoch": 2877} {"train_loss": -12.02090835571289, "global_step": 483373, "epoch": 2877} {"train_loss": -12.206483840942383, "global_step": 483374, "epoch": 2877} {"train_loss": -11.291396141052246, "global_step": 483375, "epoch": 2877} {"train_loss": -12.28715705871582, "global_step": 483376, "epoch": 2877} {"train_loss": -11.557781219482422, "global_step": 483377, "epoch": 2877} {"train_loss": -11.068059921264648, "global_step": 483378, "epoch": 2877} {"train_loss": -12.16946029663086, "global_step": 483379, "epoch": 2877} {"train_loss": -9.696104049682617, "global_step": 483380, "epoch": 2877} {"train_loss": -10.92715072631836, "global_step": 483381, "epoch": 2877} {"train_loss": -10.764628410339355, "global_step": 483382, "epoch": 2877} {"train_loss": -10.704461097717285, "global_step": 483383, "epoch": 2877} {"train_loss": -11.677929878234863, "global_step": 483384, "epoch": 2877} {"train_loss": -11.69493579864502, "global_step": 483385, "epoch": 2877} {"train_loss": -11.709738731384277, "global_step": 483386, "epoch": 2877} {"train_loss": -11.964530944824219, "global_step": 483387, "epoch": 2877} {"train_loss": -11.470869064331055, "global_step": 483388, "epoch": 2877} {"train_loss": -12.049171447753906, "global_step": 483389, "epoch": 2877} {"train_loss": -11.607627868652344, "global_step": 483390, "epoch": 2877} {"train_loss": -11.828786849975586, "global_step": 483391, "epoch": 2877} {"train_loss": -12.010847091674805, "global_step": 483392, "epoch": 2877} {"train_loss": -11.536109924316406, "global_step": 483393, "epoch": 2877} {"train_loss": -12.15045166015625, "global_step": 483394, "epoch": 2877} {"train_loss": -11.36402416229248, "global_step": 483395, "epoch": 2877} {"train_loss": -12.588225364685059, "global_step": 483396, "epoch": 2877} {"train_loss": -11.462356567382812, "global_step": 483397, "epoch": 2877} {"train_loss": -11.52942180633545, "global_step": 483398, "epoch": 2877} {"train_loss": -11.941089630126953, "global_step": 483399, "epoch": 2877} {"train_loss": -11.905961990356445, "global_step": 483400, "epoch": 2877} {"train_loss": -11.681526184082031, "global_step": 483401, "epoch": 2877} {"train_loss": -11.678178787231445, "global_step": 483402, "epoch": 2877} {"train_loss": -12.35427188873291, "global_step": 483403, "epoch": 2877} {"train_loss": -11.636848449707031, "global_step": 483404, "epoch": 2877} {"train_loss": -12.33337116241455, "global_step": 483405, "epoch": 2877} {"train_loss": -11.30267333984375, "global_step": 483406, "epoch": 2877} {"train_loss": -12.263128280639648, "global_step": 483407, "epoch": 2877} {"train_loss": -11.883695602416992, "global_step": 483408, "epoch": 2877} {"train_loss": -11.590970993041992, "global_step": 483409, "epoch": 2877} {"train_loss": -11.968828201293945, "global_step": 483410, "epoch": 2877} {"train_loss": -12.395971298217773, "global_step": 483411, "epoch": 2877} {"train_loss": -12.085376739501953, "global_step": 483412, "epoch": 2877} {"train_loss": -12.346146583557129, "global_step": 483413, "epoch": 2877} {"train_loss": -11.510385513305664, "global_step": 483414, "epoch": 2877} {"train_loss": -12.317205429077148, "global_step": 483415, "epoch": 2877} {"train_loss": -12.057538986206055, "global_step": 483416, "epoch": 2877} {"train_loss": -12.058938980102539, "global_step": 483417, "epoch": 2877} {"train_loss": -12.29159927368164, "global_step": 483418, "epoch": 2877} {"train_loss": -12.25255012512207, "global_step": 483419, "epoch": 2877} {"train_loss": -11.453149795532227, "global_step": 483420, "epoch": 2877} {"train_loss": -12.12628173828125, "global_step": 483421, "epoch": 2877} {"train_loss": -11.34648609161377, "global_step": 483422, "epoch": 2877} {"train_loss": -12.016576766967773, "global_step": 483423, "epoch": 2877} {"train_loss": -12.18136978149414, "global_step": 483424, "epoch": 2877} {"train_loss": -11.294172286987305, "global_step": 483425, "epoch": 2877} {"train_loss": -12.580455780029297, "global_step": 483426, "epoch": 2877} {"train_loss": -11.512984275817871, "global_step": 483427, "epoch": 2877} {"train_loss": -11.971662521362305, "global_step": 483428, "epoch": 2877} {"train_loss": -11.92111587524414, "global_step": 483429, "epoch": 2877} {"train_loss": -11.998645782470703, "global_step": 483430, "epoch": 2877} {"train_loss": -12.357646942138672, "global_step": 483431, "epoch": 2877} {"train_loss": -11.70744800567627, "global_step": 483432, "epoch": 2877} {"train_loss": -12.207908630371094, "global_step": 483433, "epoch": 2877} {"train_loss": -12.160446166992188, "global_step": 483434, "epoch": 2877} {"train_loss": -12.239117622375488, "global_step": 483435, "epoch": 2877} {"train_loss": -12.705902099609375, "global_step": 483436, "epoch": 2877} {"train_loss": -12.310286521911621, "global_step": 483437, "epoch": 2877} {"train_loss": -12.560128211975098, "global_step": 483438, "epoch": 2877} {"train_loss": -12.549433708190918, "global_step": 483439, "epoch": 2877} {"train_loss": -12.706815719604492, "global_step": 483440, "epoch": 2877} {"train_loss": -12.635181427001953, "global_step": 483441, "epoch": 2877} {"train_loss": -12.624492645263672, "global_step": 483442, "epoch": 2877} {"train_loss": -12.72181510925293, "global_step": 483443, "epoch": 2877} {"train_loss": -12.860130310058594, "global_step": 483444, "epoch": 2877} {"train_loss": -12.683368682861328, "global_step": 483445, "epoch": 2877} {"train_loss": -12.80036735534668, "global_step": 483446, "epoch": 2877} {"train_loss": -12.808913230895996, "global_step": 483447, "epoch": 2877} {"train_loss": -12.696735382080078, "global_step": 483448, "epoch": 2877} {"train_loss": -12.680201530456543, "global_step": 483449, "epoch": 2877} {"train_loss": -12.801000595092773, "global_step": 483450, "epoch": 2877} {"train_loss": -12.851438522338867, "global_step": 483451, "epoch": 2877} {"train_loss": -12.8375244140625, "global_step": 483452, "epoch": 2877} {"train_loss": -12.96053695678711, "global_step": 483453, "epoch": 2877} {"train_loss": -12.774418830871582, "global_step": 483454, "epoch": 2877} {"train_loss": -12.856637954711914, "global_step": 483455, "epoch": 2877} {"train_loss": -13.020427703857422, "global_step": 483456, "epoch": 2877} {"train_loss": -13.044410705566406, "global_step": 483457, "epoch": 2877} {"train_loss": -12.89716625213623, "global_step": 483458, "epoch": 2877} {"train_loss": -12.611793518066406, "global_step": 483459, "epoch": 2877} {"train_loss": -12.98731803894043, "global_step": 483460, "epoch": 2877} {"train_loss": -12.933345794677734, "global_step": 483461, "epoch": 2877} {"train_loss": -12.905092239379883, "global_step": 483462, "epoch": 2877} {"train_loss": -12.74980354309082, "global_step": 483463, "epoch": 2877} {"train_loss": -12.623884201049805, "global_step": 483464, "epoch": 2877} {"train_loss": -12.779308319091797, "global_step": 483465, "epoch": 2877} {"train_loss": -13.025714874267578, "global_step": 483466, "epoch": 2877} {"train_loss": -12.731051445007324, "global_step": 483467, "epoch": 2877} {"train_loss": -12.940398216247559, "global_step": 483468, "epoch": 2877} {"train_loss": -12.510088920593262, "global_step": 483469, "epoch": 2877} {"train_loss": -13.033096313476562, "global_step": 483470, "epoch": 2877} {"train_loss": -13.057598114013672, "global_step": 483471, "epoch": 2877} {"train_loss": -13.012977600097656, "global_step": 483472, "epoch": 2877} {"train_loss": -12.889043807983398, "global_step": 483473, "epoch": 2877} {"train_loss": -13.088119506835938, "global_step": 483474, "epoch": 2877} {"train_loss": -12.781232833862305, "global_step": 483475, "epoch": 2877} {"train_loss": -13.087285995483398, "global_step": 483476, "epoch": 2877} {"train_loss": -12.869359970092773, "global_step": 483477, "epoch": 2877} {"train_loss": -12.836469650268555, "global_step": 483478, "epoch": 2877} {"train_loss": -12.835813522338867, "global_step": 483479, "epoch": 2877} {"train_loss": -12.83137321472168, "global_step": 483480, "epoch": 2877} {"train_loss": -12.774168014526367, "global_step": 483481, "epoch": 2877} {"train_loss": -12.851773262023926, "global_step": 483482, "epoch": 2877} {"train_loss": -12.866679191589355, "global_step": 483483, "epoch": 2877} {"train_loss": -12.840505599975586, "global_step": 483484, "epoch": 2877} {"train_loss": -12.880157470703125, "global_step": 483485, "epoch": 2877} {"train_loss": -12.895727157592773, "global_step": 483486, "epoch": 2877} {"train_loss": -12.830050468444824, "global_step": 483487, "epoch": 2877} {"train_loss": -13.009256362915039, "global_step": 483488, "epoch": 2877} {"train_loss": -12.957027435302734, "global_step": 483489, "epoch": 2877} {"train_loss": -12.772222518920898, "global_step": 483490, "epoch": 2877} {"train_loss": -12.772248268127441, "global_step": 483491, "epoch": 2877} {"train_loss": -12.799646377563477, "global_step": 483492, "epoch": 2877} {"train_loss": -12.99477767944336, "global_step": 483493, "epoch": 2877} {"train_loss": -13.050934791564941, "global_step": 483494, "epoch": 2877} {"train_loss": -13.021208763122559, "global_step": 483495, "epoch": 2877} {"train_loss": -12.791887283325195, "global_step": 483496, "epoch": 2877} {"train_loss": -12.93075942993164, "global_step": 483497, "epoch": 2877} {"train_loss": -12.861272811889648, "global_step": 483498, "epoch": 2877} {"train_loss": -13.106576919555664, "global_step": 483499, "epoch": 2877} {"train_loss": -12.896196365356445, "global_step": 483500, "epoch": 2877} {"train_loss": -12.843185424804688, "global_step": 483501, "epoch": 2877} {"train_loss": -12.897850036621094, "global_step": 483502, "epoch": 2877} {"train_loss": -12.305210976373582, "global_step": 483503, "epoch": 2877, "val_loss": 319679.15625} {"train_loss": -12.08875560760498, "global_step": 483504, "epoch": 2878} {"train_loss": -11.822035789489746, "global_step": 483505, "epoch": 2878} {"train_loss": -12.720833778381348, "global_step": 483506, "epoch": 2878} {"train_loss": -12.513445854187012, "global_step": 483507, "epoch": 2878} {"train_loss": -12.552374839782715, "global_step": 483508, "epoch": 2878} {"train_loss": -13.022720336914062, "global_step": 483509, "epoch": 2878} {"train_loss": -12.985515594482422, "global_step": 483510, "epoch": 2878} {"train_loss": -12.439849853515625, "global_step": 483511, "epoch": 2878} {"train_loss": -12.590167045593262, "global_step": 483512, "epoch": 2878} {"train_loss": -12.894344329833984, "global_step": 483513, "epoch": 2878} {"train_loss": -12.881498336791992, "global_step": 483514, "epoch": 2878} {"train_loss": -12.710468292236328, "global_step": 483515, "epoch": 2878} {"train_loss": -12.581025123596191, "global_step": 483516, "epoch": 2878} {"train_loss": -12.569514274597168, "global_step": 483517, "epoch": 2878} {"train_loss": -12.455842971801758, "global_step": 483518, "epoch": 2878} {"train_loss": -12.717863082885742, "global_step": 483519, "epoch": 2878} {"train_loss": -12.089775085449219, "global_step": 483520, "epoch": 2878} {"train_loss": -12.589021682739258, "global_step": 483521, "epoch": 2878} {"train_loss": -12.784380912780762, "global_step": 483522, "epoch": 2878} {"train_loss": -12.584975242614746, "global_step": 483523, "epoch": 2878} {"train_loss": -12.324990272521973, "global_step": 483524, "epoch": 2878} {"train_loss": -11.660408973693848, "global_step": 483525, "epoch": 2878} {"train_loss": -11.877496719360352, "global_step": 483526, "epoch": 2878} {"train_loss": -12.797338485717773, "global_step": 483527, "epoch": 2878} {"train_loss": -11.936410903930664, "global_step": 483528, "epoch": 2878} {"train_loss": -11.737970352172852, "global_step": 483529, "epoch": 2878} {"train_loss": -10.944718360900879, "global_step": 483530, "epoch": 2878} {"train_loss": -12.211454391479492, "global_step": 483531, "epoch": 2878} {"train_loss": -11.859703063964844, "global_step": 483532, "epoch": 2878} {"train_loss": -11.375718116760254, "global_step": 483533, "epoch": 2878} {"train_loss": -12.631729125976562, "global_step": 483534, "epoch": 2878} {"train_loss": -12.003402709960938, "global_step": 483535, "epoch": 2878} {"train_loss": -12.089567184448242, "global_step": 483536, "epoch": 2878} {"train_loss": -11.781922340393066, "global_step": 483537, "epoch": 2878} {"train_loss": -12.098388671875, "global_step": 483538, "epoch": 2878} {"train_loss": -11.633785247802734, "global_step": 483539, "epoch": 2878} {"train_loss": -11.65951919555664, "global_step": 483540, "epoch": 2878} {"train_loss": -10.889690399169922, "global_step": 483541, "epoch": 2878} {"train_loss": -9.709741592407227, "global_step": 483542, "epoch": 2878} {"train_loss": -11.722932815551758, "global_step": 483543, "epoch": 2878} {"train_loss": -9.690939903259277, "global_step": 483544, "epoch": 2878} {"train_loss": -9.988393783569336, "global_step": 483545, "epoch": 2878} {"train_loss": -11.646002769470215, "global_step": 483546, "epoch": 2878} {"train_loss": -8.649944305419922, "global_step": 483547, "epoch": 2878} {"train_loss": -11.467935562133789, "global_step": 483548, "epoch": 2878} {"train_loss": -10.358492851257324, "global_step": 483549, "epoch": 2878} {"train_loss": -10.720796585083008, "global_step": 483550, "epoch": 2878} {"train_loss": -11.570096969604492, "global_step": 483551, "epoch": 2878} {"train_loss": -10.664587020874023, "global_step": 483552, "epoch": 2878} {"train_loss": -11.914794921875, "global_step": 483553, "epoch": 2878} {"train_loss": -10.488716125488281, "global_step": 483554, "epoch": 2878} {"train_loss": -11.429004669189453, "global_step": 483555, "epoch": 2878} {"train_loss": -12.082647323608398, "global_step": 483556, "epoch": 2878} {"train_loss": -10.946516036987305, "global_step": 483557, "epoch": 2878} {"train_loss": -11.93838119506836, "global_step": 483558, "epoch": 2878} {"train_loss": -11.053564071655273, "global_step": 483559, "epoch": 2878} {"train_loss": -11.184453964233398, "global_step": 483560, "epoch": 2878} {"train_loss": -12.173755645751953, "global_step": 483561, "epoch": 2878} {"train_loss": -11.338247299194336, "global_step": 483562, "epoch": 2878} {"train_loss": -11.451522827148438, "global_step": 483563, "epoch": 2878} {"train_loss": -11.920053482055664, "global_step": 483564, "epoch": 2878} {"train_loss": -11.117133140563965, "global_step": 483565, "epoch": 2878} {"train_loss": -11.618520736694336, "global_step": 483566, "epoch": 2878} {"train_loss": -11.059551239013672, "global_step": 483567, "epoch": 2878} {"train_loss": -11.025922775268555, "global_step": 483568, "epoch": 2878} {"train_loss": -11.444543838500977, "global_step": 483569, "epoch": 2878} {"train_loss": -11.83180046081543, "global_step": 483570, "epoch": 2878} {"train_loss": -12.126995086669922, "global_step": 483571, "epoch": 2878} {"train_loss": -11.518182754516602, "global_step": 483572, "epoch": 2878} {"train_loss": -12.066900253295898, "global_step": 483573, "epoch": 2878} {"train_loss": -12.00449275970459, "global_step": 483574, "epoch": 2878} {"train_loss": -11.687088012695312, "global_step": 483575, "epoch": 2878} {"train_loss": -12.138081550598145, "global_step": 483576, "epoch": 2878} {"train_loss": -12.26960563659668, "global_step": 483577, "epoch": 2878} {"train_loss": -11.98896598815918, "global_step": 483578, "epoch": 2878} {"train_loss": -11.918394088745117, "global_step": 483579, "epoch": 2878} {"train_loss": -12.07746696472168, "global_step": 483580, "epoch": 2878} {"train_loss": -12.32061767578125, "global_step": 483581, "epoch": 2878} {"train_loss": -11.464876174926758, "global_step": 483582, "epoch": 2878} {"train_loss": -12.172561645507812, "global_step": 483583, "epoch": 2878} {"train_loss": -12.17856216430664, "global_step": 483584, "epoch": 2878} {"train_loss": -12.44783878326416, "global_step": 483585, "epoch": 2878} {"train_loss": -12.338889122009277, "global_step": 483586, "epoch": 2878} {"train_loss": -11.955503463745117, "global_step": 483587, "epoch": 2878} {"train_loss": -12.638294219970703, "global_step": 483588, "epoch": 2878} {"train_loss": -12.09115219116211, "global_step": 483589, "epoch": 2878} {"train_loss": -12.318126678466797, "global_step": 483590, "epoch": 2878} {"train_loss": -12.491352081298828, "global_step": 483591, "epoch": 2878} {"train_loss": -12.207672119140625, "global_step": 483592, "epoch": 2878} {"train_loss": -12.561723709106445, "global_step": 483593, "epoch": 2878} {"train_loss": -12.372138977050781, "global_step": 483594, "epoch": 2878} {"train_loss": -12.696098327636719, "global_step": 483595, "epoch": 2878} {"train_loss": -12.460681915283203, "global_step": 483596, "epoch": 2878} {"train_loss": -12.179527282714844, "global_step": 483597, "epoch": 2878} {"train_loss": -12.432799339294434, "global_step": 483598, "epoch": 2878} {"train_loss": -12.517719268798828, "global_step": 483599, "epoch": 2878} {"train_loss": -12.591545104980469, "global_step": 483600, "epoch": 2878} {"train_loss": -12.61095142364502, "global_step": 483601, "epoch": 2878} {"train_loss": -12.520383834838867, "global_step": 483602, "epoch": 2878} {"train_loss": -12.687782287597656, "global_step": 483603, "epoch": 2878} {"train_loss": -12.19688606262207, "global_step": 483604, "epoch": 2878} {"train_loss": -12.802839279174805, "global_step": 483605, "epoch": 2878} {"train_loss": -12.253740310668945, "global_step": 483606, "epoch": 2878} {"train_loss": -12.678751945495605, "global_step": 483607, "epoch": 2878} {"train_loss": -12.686413764953613, "global_step": 483608, "epoch": 2878} {"train_loss": -12.55312728881836, "global_step": 483609, "epoch": 2878} {"train_loss": -12.440549850463867, "global_step": 483610, "epoch": 2878} {"train_loss": -12.728738784790039, "global_step": 483611, "epoch": 2878} {"train_loss": -12.755938529968262, "global_step": 483612, "epoch": 2878} {"train_loss": -12.493439674377441, "global_step": 483613, "epoch": 2878} {"train_loss": -12.758525848388672, "global_step": 483614, "epoch": 2878} {"train_loss": -12.564058303833008, "global_step": 483615, "epoch": 2878} {"train_loss": -12.577119827270508, "global_step": 483616, "epoch": 2878} {"train_loss": -12.757164001464844, "global_step": 483617, "epoch": 2878} {"train_loss": -12.166125297546387, "global_step": 483618, "epoch": 2878} {"train_loss": -12.575069427490234, "global_step": 483619, "epoch": 2878} {"train_loss": -12.594734191894531, "global_step": 483620, "epoch": 2878} {"train_loss": -12.863964080810547, "global_step": 483621, "epoch": 2878} {"train_loss": -12.50545883178711, "global_step": 483622, "epoch": 2878} {"train_loss": -12.8941650390625, "global_step": 483623, "epoch": 2878} {"train_loss": -12.481740951538086, "global_step": 483624, "epoch": 2878} {"train_loss": -12.642568588256836, "global_step": 483625, "epoch": 2878} {"train_loss": -12.66723918914795, "global_step": 483626, "epoch": 2878} {"train_loss": -12.597843170166016, "global_step": 483627, "epoch": 2878} {"train_loss": -12.54460620880127, "global_step": 483628, "epoch": 2878} {"train_loss": -12.67424201965332, "global_step": 483629, "epoch": 2878} {"train_loss": -12.344696044921875, "global_step": 483630, "epoch": 2878} {"train_loss": -12.060647964477539, "global_step": 483631, "epoch": 2878} {"train_loss": -12.524417877197266, "global_step": 483632, "epoch": 2878} {"train_loss": -12.427721977233887, "global_step": 483633, "epoch": 2878} {"train_loss": -12.169069290161133, "global_step": 483634, "epoch": 2878} {"train_loss": -12.825450897216797, "global_step": 483635, "epoch": 2878} {"train_loss": -11.946369171142578, "global_step": 483636, "epoch": 2878} {"train_loss": -11.589953422546387, "global_step": 483637, "epoch": 2878} {"train_loss": -12.813141822814941, "global_step": 483638, "epoch": 2878} {"train_loss": -12.359312057495117, "global_step": 483639, "epoch": 2878} {"train_loss": -11.162178039550781, "global_step": 483640, "epoch": 2878} {"train_loss": -12.634687423706055, "global_step": 483641, "epoch": 2878} {"train_loss": -12.055338859558105, "global_step": 483642, "epoch": 2878} {"train_loss": -12.221063613891602, "global_step": 483643, "epoch": 2878} {"train_loss": -12.451194763183594, "global_step": 483644, "epoch": 2878} {"train_loss": -11.28890609741211, "global_step": 483645, "epoch": 2878} {"train_loss": -12.540542602539062, "global_step": 483646, "epoch": 2878} {"train_loss": -12.002939224243164, "global_step": 483647, "epoch": 2878} {"train_loss": -11.85507583618164, "global_step": 483648, "epoch": 2878} {"train_loss": -12.319740295410156, "global_step": 483649, "epoch": 2878} {"train_loss": -12.477895736694336, "global_step": 483650, "epoch": 2878} {"train_loss": -12.17188835144043, "global_step": 483651, "epoch": 2878} {"train_loss": -12.496763229370117, "global_step": 483652, "epoch": 2878} {"train_loss": -12.410887718200684, "global_step": 483653, "epoch": 2878} {"train_loss": -12.523791313171387, "global_step": 483654, "epoch": 2878} {"train_loss": -12.271817207336426, "global_step": 483655, "epoch": 2878} {"train_loss": -12.082037925720215, "global_step": 483656, "epoch": 2878} {"train_loss": -12.445734024047852, "global_step": 483657, "epoch": 2878} {"train_loss": -11.946602821350098, "global_step": 483658, "epoch": 2878} {"train_loss": -11.992822647094727, "global_step": 483659, "epoch": 2878} {"train_loss": -12.40135383605957, "global_step": 483660, "epoch": 2878} {"train_loss": -11.962287902832031, "global_step": 483661, "epoch": 2878} {"train_loss": -11.934305191040039, "global_step": 483662, "epoch": 2878} {"train_loss": -12.393623352050781, "global_step": 483663, "epoch": 2878} {"train_loss": -11.536873817443848, "global_step": 483664, "epoch": 2878} {"train_loss": -12.590978622436523, "global_step": 483665, "epoch": 2878} {"train_loss": -12.153695106506348, "global_step": 483666, "epoch": 2878} {"train_loss": -12.147248268127441, "global_step": 483667, "epoch": 2878} {"train_loss": -12.494244575500488, "global_step": 483668, "epoch": 2878} {"train_loss": -12.130754470825195, "global_step": 483669, "epoch": 2878} {"train_loss": -12.26505184173584, "global_step": 483670, "epoch": 2878} {"train_loss": -12.092304695220221, "global_step": 483671, "epoch": 2878, "val_loss": 317265.0625} {"train_loss": -12.474119186401367, "global_step": 483672, "epoch": 2879} {"train_loss": -12.45456314086914, "global_step": 483673, "epoch": 2879} {"train_loss": -12.146503448486328, "global_step": 483674, "epoch": 2879} {"train_loss": -12.316210746765137, "global_step": 483675, "epoch": 2879} {"train_loss": -11.183939933776855, "global_step": 483676, "epoch": 2879} {"train_loss": -11.26791000366211, "global_step": 483677, "epoch": 2879} {"train_loss": -12.504655838012695, "global_step": 483678, "epoch": 2879} {"train_loss": -10.990925788879395, "global_step": 483679, "epoch": 2879} {"train_loss": -12.339743614196777, "global_step": 483680, "epoch": 2879} {"train_loss": -11.530609130859375, "global_step": 483681, "epoch": 2879} {"train_loss": -11.344823837280273, "global_step": 483682, "epoch": 2879} {"train_loss": -11.837508201599121, "global_step": 483683, "epoch": 2879} {"train_loss": -10.781025886535645, "global_step": 483684, "epoch": 2879} {"train_loss": -11.609271049499512, "global_step": 483685, "epoch": 2879} {"train_loss": -10.930821418762207, "global_step": 483686, "epoch": 2879} {"train_loss": -11.674182891845703, "global_step": 483687, "epoch": 2879} {"train_loss": -12.160545349121094, "global_step": 483688, "epoch": 2879} {"train_loss": -11.944079399108887, "global_step": 483689, "epoch": 2879} {"train_loss": -12.102519989013672, "global_step": 483690, "epoch": 2879} {"train_loss": -11.23358154296875, "global_step": 483691, "epoch": 2879} {"train_loss": -11.667864799499512, "global_step": 483692, "epoch": 2879} {"train_loss": -11.846303939819336, "global_step": 483693, "epoch": 2879} {"train_loss": -11.656482696533203, "global_step": 483694, "epoch": 2879} {"train_loss": -11.600211143493652, "global_step": 483695, "epoch": 2879} {"train_loss": -12.35544204711914, "global_step": 483696, "epoch": 2879} {"train_loss": -11.345111846923828, "global_step": 483697, "epoch": 2879} {"train_loss": -12.24069881439209, "global_step": 483698, "epoch": 2879} {"train_loss": -11.73395824432373, "global_step": 483699, "epoch": 2879} {"train_loss": -12.496615409851074, "global_step": 483700, "epoch": 2879} {"train_loss": -11.742603302001953, "global_step": 483701, "epoch": 2879} {"train_loss": -12.135350227355957, "global_step": 483702, "epoch": 2879} {"train_loss": -12.263859748840332, "global_step": 483703, "epoch": 2879} {"train_loss": -12.260651588439941, "global_step": 483704, "epoch": 2879} {"train_loss": -12.447051048278809, "global_step": 483705, "epoch": 2879} {"train_loss": -12.188499450683594, "global_step": 483706, "epoch": 2879} {"train_loss": -12.75119686126709, "global_step": 483707, "epoch": 2879} {"train_loss": -11.964540481567383, "global_step": 483708, "epoch": 2879} {"train_loss": -12.222221374511719, "global_step": 483709, "epoch": 2879} {"train_loss": -12.064838409423828, "global_step": 483710, "epoch": 2879} {"train_loss": -11.706618309020996, "global_step": 483711, "epoch": 2879} {"train_loss": -11.961841583251953, "global_step": 483712, "epoch": 2879} {"train_loss": -11.706809997558594, "global_step": 483713, "epoch": 2879} {"train_loss": -11.94775104522705, "global_step": 483714, "epoch": 2879} {"train_loss": -12.286737442016602, "global_step": 483715, "epoch": 2879} {"train_loss": -11.925812721252441, "global_step": 483716, "epoch": 2879} {"train_loss": -12.38352108001709, "global_step": 483717, "epoch": 2879} {"train_loss": -11.934279441833496, "global_step": 483718, "epoch": 2879} {"train_loss": -11.31988525390625, "global_step": 483719, "epoch": 2879} {"train_loss": -12.132366180419922, "global_step": 483720, "epoch": 2879} {"train_loss": -11.030803680419922, "global_step": 483721, "epoch": 2879} {"train_loss": -12.56807804107666, "global_step": 483722, "epoch": 2879} {"train_loss": -11.059677124023438, "global_step": 483723, "epoch": 2879} {"train_loss": -12.375340461730957, "global_step": 483724, "epoch": 2879} {"train_loss": -11.209014892578125, "global_step": 483725, "epoch": 2879} {"train_loss": -11.515888214111328, "global_step": 483726, "epoch": 2879} {"train_loss": -12.033381462097168, "global_step": 483727, "epoch": 2879} {"train_loss": -11.973121643066406, "global_step": 483728, "epoch": 2879} {"train_loss": -12.288633346557617, "global_step": 483729, "epoch": 2879} {"train_loss": -11.951559066772461, "global_step": 483730, "epoch": 2879} {"train_loss": -12.031229019165039, "global_step": 483731, "epoch": 2879} {"train_loss": -12.225278854370117, "global_step": 483732, "epoch": 2879} {"train_loss": -11.989734649658203, "global_step": 483733, "epoch": 2879} {"train_loss": -12.671913146972656, "global_step": 483734, "epoch": 2879} {"train_loss": -12.049619674682617, "global_step": 483735, "epoch": 2879} {"train_loss": -12.344188690185547, "global_step": 483736, "epoch": 2879} {"train_loss": -12.27695083618164, "global_step": 483737, "epoch": 2879} {"train_loss": -12.382631301879883, "global_step": 483738, "epoch": 2879} {"train_loss": -12.631973266601562, "global_step": 483739, "epoch": 2879} {"train_loss": -12.221756935119629, "global_step": 483740, "epoch": 2879} {"train_loss": -12.604769706726074, "global_step": 483741, "epoch": 2879} {"train_loss": -12.647090911865234, "global_step": 483742, "epoch": 2879} {"train_loss": -12.345600128173828, "global_step": 483743, "epoch": 2879} {"train_loss": -12.521036148071289, "global_step": 483744, "epoch": 2879} {"train_loss": -12.612468719482422, "global_step": 483745, "epoch": 2879} {"train_loss": -12.522656440734863, "global_step": 483746, "epoch": 2879} {"train_loss": -12.788911819458008, "global_step": 483747, "epoch": 2879} {"train_loss": -12.855751991271973, "global_step": 483748, "epoch": 2879} {"train_loss": -12.806251525878906, "global_step": 483749, "epoch": 2879} {"train_loss": -12.776601791381836, "global_step": 483750, "epoch": 2879} {"train_loss": -12.525899887084961, "global_step": 483751, "epoch": 2879} {"train_loss": -12.585064888000488, "global_step": 483752, "epoch": 2879} {"train_loss": -12.784456253051758, "global_step": 483753, "epoch": 2879} {"train_loss": -12.733725547790527, "global_step": 483754, "epoch": 2879} {"train_loss": -12.625009536743164, "global_step": 483755, "epoch": 2879} {"train_loss": -12.845865249633789, "global_step": 483756, "epoch": 2879} {"train_loss": -12.864344596862793, "global_step": 483757, "epoch": 2879} {"train_loss": -12.804686546325684, "global_step": 483758, "epoch": 2879} {"train_loss": -12.804969787597656, "global_step": 483759, "epoch": 2879} {"train_loss": -12.739603042602539, "global_step": 483760, "epoch": 2879} {"train_loss": -12.915191650390625, "global_step": 483761, "epoch": 2879} {"train_loss": -12.70168399810791, "global_step": 483762, "epoch": 2879} {"train_loss": -12.811273574829102, "global_step": 483763, "epoch": 2879} {"train_loss": -12.840059280395508, "global_step": 483764, "epoch": 2879} {"train_loss": -12.962404251098633, "global_step": 483765, "epoch": 2879} {"train_loss": -13.040578842163086, "global_step": 483766, "epoch": 2879} {"train_loss": -12.968751907348633, "global_step": 483767, "epoch": 2879} {"train_loss": -12.923785209655762, "global_step": 483768, "epoch": 2879} {"train_loss": -12.857791900634766, "global_step": 483769, "epoch": 2879} {"train_loss": -13.006364822387695, "global_step": 483770, "epoch": 2879} {"train_loss": -13.021357536315918, "global_step": 483771, "epoch": 2879} {"train_loss": -12.530126571655273, "global_step": 483772, "epoch": 2879} {"train_loss": -12.924187660217285, "global_step": 483773, "epoch": 2879} {"train_loss": -12.733570098876953, "global_step": 483774, "epoch": 2879} {"train_loss": -12.739187240600586, "global_step": 483775, "epoch": 2879} {"train_loss": -13.084190368652344, "global_step": 483776, "epoch": 2879} {"train_loss": -12.744012832641602, "global_step": 483777, "epoch": 2879} {"train_loss": -12.703508377075195, "global_step": 483778, "epoch": 2879} {"train_loss": -12.681705474853516, "global_step": 483779, "epoch": 2879} {"train_loss": -12.71575927734375, "global_step": 483780, "epoch": 2879} {"train_loss": -12.696589469909668, "global_step": 483781, "epoch": 2879} {"train_loss": -12.589544296264648, "global_step": 483782, "epoch": 2879} {"train_loss": -12.248821258544922, "global_step": 483783, "epoch": 2879} {"train_loss": -12.887269973754883, "global_step": 483784, "epoch": 2879} {"train_loss": -12.518157958984375, "global_step": 483785, "epoch": 2879} {"train_loss": -12.413999557495117, "global_step": 483786, "epoch": 2879} {"train_loss": -12.500226974487305, "global_step": 483787, "epoch": 2879} {"train_loss": -12.653397560119629, "global_step": 483788, "epoch": 2879} {"train_loss": -12.735057830810547, "global_step": 483789, "epoch": 2879} {"train_loss": -12.807697296142578, "global_step": 483790, "epoch": 2879} {"train_loss": -12.572038650512695, "global_step": 483791, "epoch": 2879} {"train_loss": -13.046112060546875, "global_step": 483792, "epoch": 2879} {"train_loss": -12.805116653442383, "global_step": 483793, "epoch": 2879} {"train_loss": -12.939349174499512, "global_step": 483794, "epoch": 2879} {"train_loss": -12.845462799072266, "global_step": 483795, "epoch": 2879} {"train_loss": -12.421839714050293, "global_step": 483796, "epoch": 2879} {"train_loss": -12.502306938171387, "global_step": 483797, "epoch": 2879} {"train_loss": -12.680349349975586, "global_step": 483798, "epoch": 2879} {"train_loss": -12.849883079528809, "global_step": 483799, "epoch": 2879} {"train_loss": -12.48715877532959, "global_step": 483800, "epoch": 2879} {"train_loss": -12.7325439453125, "global_step": 483801, "epoch": 2879} {"train_loss": -12.39529037475586, "global_step": 483802, "epoch": 2879} {"train_loss": -12.899772644042969, "global_step": 483803, "epoch": 2879} {"train_loss": -12.529252052307129, "global_step": 483804, "epoch": 2879} {"train_loss": -12.701431274414062, "global_step": 483805, "epoch": 2879} {"train_loss": -12.084613800048828, "global_step": 483806, "epoch": 2879} {"train_loss": -12.512462615966797, "global_step": 483807, "epoch": 2879} {"train_loss": -12.612661361694336, "global_step": 483808, "epoch": 2879} {"train_loss": -12.675917625427246, "global_step": 483809, "epoch": 2879} {"train_loss": -12.437172889709473, "global_step": 483810, "epoch": 2879} {"train_loss": -12.939876556396484, "global_step": 483811, "epoch": 2879} {"train_loss": -12.513080596923828, "global_step": 483812, "epoch": 2879} {"train_loss": -12.69326400756836, "global_step": 483813, "epoch": 2879} {"train_loss": -12.319807052612305, "global_step": 483814, "epoch": 2879} {"train_loss": -12.71766471862793, "global_step": 483815, "epoch": 2879} {"train_loss": -12.7600679397583, "global_step": 483816, "epoch": 2879} {"train_loss": -12.79726791381836, "global_step": 483817, "epoch": 2879} {"train_loss": -11.955728530883789, "global_step": 483818, "epoch": 2879} {"train_loss": -11.795173645019531, "global_step": 483819, "epoch": 2879} {"train_loss": -12.057077407836914, "global_step": 483820, "epoch": 2879} {"train_loss": -10.7855863571167, "global_step": 483821, "epoch": 2879} {"train_loss": -12.241622924804688, "global_step": 483822, "epoch": 2879} {"train_loss": -11.823221206665039, "global_step": 483823, "epoch": 2879} {"train_loss": -10.833885192871094, "global_step": 483824, "epoch": 2879} {"train_loss": -10.915153503417969, "global_step": 483825, "epoch": 2879} {"train_loss": -10.833622932434082, "global_step": 483826, "epoch": 2879} {"train_loss": -11.894328117370605, "global_step": 483827, "epoch": 2879} {"train_loss": -12.029102325439453, "global_step": 483828, "epoch": 2879} {"train_loss": -11.468878746032715, "global_step": 483829, "epoch": 2879} {"train_loss": -12.728351593017578, "global_step": 483830, "epoch": 2879} {"train_loss": -12.482625961303711, "global_step": 483831, "epoch": 2879} {"train_loss": -12.130571365356445, "global_step": 483832, "epoch": 2879} {"train_loss": -12.51307487487793, "global_step": 483833, "epoch": 2879} {"train_loss": -12.141845703125, "global_step": 483834, "epoch": 2879} {"train_loss": -12.212200164794922, "global_step": 483835, "epoch": 2879} {"train_loss": -12.19045639038086, "global_step": 483836, "epoch": 2879} {"train_loss": -12.347675323486328, "global_step": 483837, "epoch": 2879} {"train_loss": -12.145156860351562, "global_step": 483838, "epoch": 2879} {"train_loss": -12.285859925406319, "global_step": 483839, "epoch": 2879, "val_loss": 314777.25} {"train_loss": -11.69068717956543, "global_step": 483840, "epoch": 2880} {"train_loss": -11.451685905456543, "global_step": 483841, "epoch": 2880} {"train_loss": -12.380573272705078, "global_step": 483842, "epoch": 2880} {"train_loss": -10.821855545043945, "global_step": 483843, "epoch": 2880} {"train_loss": -12.172060012817383, "global_step": 483844, "epoch": 2880} {"train_loss": -12.216147422790527, "global_step": 483845, "epoch": 2880} {"train_loss": -12.017024993896484, "global_step": 483846, "epoch": 2880} {"train_loss": -12.035604476928711, "global_step": 483847, "epoch": 2880} {"train_loss": -11.829483985900879, "global_step": 483848, "epoch": 2880} {"train_loss": -11.783098220825195, "global_step": 483849, "epoch": 2880} {"train_loss": -11.886327743530273, "global_step": 483850, "epoch": 2880} {"train_loss": -12.412548065185547, "global_step": 483851, "epoch": 2880} {"train_loss": -11.797327041625977, "global_step": 483852, "epoch": 2880} {"train_loss": -12.625410079956055, "global_step": 483853, "epoch": 2880} {"train_loss": -11.98926067352295, "global_step": 483854, "epoch": 2880} {"train_loss": -12.194998741149902, "global_step": 483855, "epoch": 2880} {"train_loss": -12.092982292175293, "global_step": 483856, "epoch": 2880} {"train_loss": -12.135869979858398, "global_step": 483857, "epoch": 2880} {"train_loss": -12.14673137664795, "global_step": 483858, "epoch": 2880} {"train_loss": -11.752283096313477, "global_step": 483859, "epoch": 2880} {"train_loss": -12.003134727478027, "global_step": 483860, "epoch": 2880} {"train_loss": -12.222127914428711, "global_step": 483861, "epoch": 2880} {"train_loss": -12.223819732666016, "global_step": 483862, "epoch": 2880} {"train_loss": -12.188729286193848, "global_step": 483863, "epoch": 2880} {"train_loss": -12.533998489379883, "global_step": 483864, "epoch": 2880} {"train_loss": -12.448528289794922, "global_step": 483865, "epoch": 2880} {"train_loss": -12.712761878967285, "global_step": 483866, "epoch": 2880} {"train_loss": -12.18819522857666, "global_step": 483867, "epoch": 2880} {"train_loss": -12.605619430541992, "global_step": 483868, "epoch": 2880} {"train_loss": -12.201337814331055, "global_step": 483869, "epoch": 2880} {"train_loss": -12.469708442687988, "global_step": 483870, "epoch": 2880} {"train_loss": -12.438199996948242, "global_step": 483871, "epoch": 2880} {"train_loss": -12.490484237670898, "global_step": 483872, "epoch": 2880} {"train_loss": -12.791318893432617, "global_step": 483873, "epoch": 2880} {"train_loss": -12.275044441223145, "global_step": 483874, "epoch": 2880} {"train_loss": -12.455093383789062, "global_step": 483875, "epoch": 2880} {"train_loss": -12.864990234375, "global_step": 483876, "epoch": 2880} {"train_loss": -12.517606735229492, "global_step": 483877, "epoch": 2880} {"train_loss": -12.876787185668945, "global_step": 483878, "epoch": 2880} {"train_loss": -12.37667179107666, "global_step": 483879, "epoch": 2880} {"train_loss": -12.432674407958984, "global_step": 483880, "epoch": 2880} {"train_loss": -12.40920639038086, "global_step": 483881, "epoch": 2880} {"train_loss": -11.981172561645508, "global_step": 483882, "epoch": 2880} {"train_loss": -12.55800724029541, "global_step": 483883, "epoch": 2880} {"train_loss": -12.01803970336914, "global_step": 483884, "epoch": 2880} {"train_loss": -12.306015968322754, "global_step": 483885, "epoch": 2880} {"train_loss": -12.235511779785156, "global_step": 483886, "epoch": 2880} {"train_loss": -12.495386123657227, "global_step": 483887, "epoch": 2880} {"train_loss": -12.672735214233398, "global_step": 483888, "epoch": 2880} {"train_loss": -12.466212272644043, "global_step": 483889, "epoch": 2880} {"train_loss": -12.692846298217773, "global_step": 483890, "epoch": 2880} {"train_loss": -12.63271713256836, "global_step": 483891, "epoch": 2880} {"train_loss": -12.487602233886719, "global_step": 483892, "epoch": 2880} {"train_loss": -12.67953872680664, "global_step": 483893, "epoch": 2880} {"train_loss": -12.64034652709961, "global_step": 483894, "epoch": 2880} {"train_loss": -12.616329193115234, "global_step": 483895, "epoch": 2880} {"train_loss": -12.663142204284668, "global_step": 483896, "epoch": 2880} {"train_loss": -12.851512908935547, "global_step": 483897, "epoch": 2880} {"train_loss": -12.669380187988281, "global_step": 483898, "epoch": 2880} {"train_loss": -12.906850814819336, "global_step": 483899, "epoch": 2880} {"train_loss": -12.68195629119873, "global_step": 483900, "epoch": 2880} {"train_loss": -12.953866004943848, "global_step": 483901, "epoch": 2880} {"train_loss": -12.745182037353516, "global_step": 483902, "epoch": 2880} {"train_loss": -12.364113807678223, "global_step": 483903, "epoch": 2880} {"train_loss": -12.134279251098633, "global_step": 483904, "epoch": 2880} {"train_loss": -11.954187393188477, "global_step": 483905, "epoch": 2880} {"train_loss": -11.259552001953125, "global_step": 483906, "epoch": 2880} {"train_loss": -11.400701522827148, "global_step": 483907, "epoch": 2880} {"train_loss": -12.230472564697266, "global_step": 483908, "epoch": 2880} {"train_loss": -11.330015182495117, "global_step": 483909, "epoch": 2880} {"train_loss": -12.488476753234863, "global_step": 483910, "epoch": 2880} {"train_loss": -11.236085891723633, "global_step": 483911, "epoch": 2880} {"train_loss": -11.932522773742676, "global_step": 483912, "epoch": 2880} {"train_loss": -12.020760536193848, "global_step": 483913, "epoch": 2880} {"train_loss": -12.460054397583008, "global_step": 483914, "epoch": 2880} {"train_loss": -12.085063934326172, "global_step": 483915, "epoch": 2880} {"train_loss": -12.256900787353516, "global_step": 483916, "epoch": 2880} {"train_loss": -12.366816520690918, "global_step": 483917, "epoch": 2880} {"train_loss": -12.271333694458008, "global_step": 483918, "epoch": 2880} {"train_loss": -12.492194175720215, "global_step": 483919, "epoch": 2880} {"train_loss": -12.442949295043945, "global_step": 483920, "epoch": 2880} {"train_loss": -12.851751327514648, "global_step": 483921, "epoch": 2880} {"train_loss": -12.634183883666992, "global_step": 483922, "epoch": 2880} {"train_loss": -12.722442626953125, "global_step": 483923, "epoch": 2880} {"train_loss": -12.707977294921875, "global_step": 483924, "epoch": 2880} {"train_loss": -12.742186546325684, "global_step": 483925, "epoch": 2880} {"train_loss": -12.649248123168945, "global_step": 483926, "epoch": 2880} {"train_loss": -12.591867446899414, "global_step": 483927, "epoch": 2880} {"train_loss": -12.063321113586426, "global_step": 483928, "epoch": 2880} {"train_loss": -12.30249309539795, "global_step": 483929, "epoch": 2880} {"train_loss": -11.896438598632812, "global_step": 483930, "epoch": 2880} {"train_loss": -11.912210464477539, "global_step": 483931, "epoch": 2880} {"train_loss": -10.643643379211426, "global_step": 483932, "epoch": 2880} {"train_loss": -11.579377174377441, "global_step": 483933, "epoch": 2880} {"train_loss": -10.491691589355469, "global_step": 483934, "epoch": 2880} {"train_loss": -11.155417442321777, "global_step": 483935, "epoch": 2880} {"train_loss": -11.112077713012695, "global_step": 483936, "epoch": 2880} {"train_loss": -10.38772201538086, "global_step": 483937, "epoch": 2880} {"train_loss": -11.36424446105957, "global_step": 483938, "epoch": 2880} {"train_loss": -11.390247344970703, "global_step": 483939, "epoch": 2880} {"train_loss": -10.847530364990234, "global_step": 483940, "epoch": 2880} {"train_loss": -11.550055503845215, "global_step": 483941, "epoch": 2880} {"train_loss": -10.98652458190918, "global_step": 483942, "epoch": 2880} {"train_loss": -9.98250961303711, "global_step": 483943, "epoch": 2880} {"train_loss": -11.394980430603027, "global_step": 483944, "epoch": 2880} {"train_loss": -10.816587448120117, "global_step": 483945, "epoch": 2880} {"train_loss": -9.833467483520508, "global_step": 483946, "epoch": 2880} {"train_loss": -11.558784484863281, "global_step": 483947, "epoch": 2880} {"train_loss": -11.21327018737793, "global_step": 483948, "epoch": 2880} {"train_loss": -10.305353164672852, "global_step": 483949, "epoch": 2880} {"train_loss": -11.837753295898438, "global_step": 483950, "epoch": 2880} {"train_loss": -10.934409141540527, "global_step": 483951, "epoch": 2880} {"train_loss": -11.90979290008545, "global_step": 483952, "epoch": 2880} {"train_loss": -12.019376754760742, "global_step": 483953, "epoch": 2880} {"train_loss": -11.701984405517578, "global_step": 483954, "epoch": 2880} {"train_loss": -11.702913284301758, "global_step": 483955, "epoch": 2880} {"train_loss": -11.579301834106445, "global_step": 483956, "epoch": 2880} {"train_loss": -11.3259859085083, "global_step": 483957, "epoch": 2880} {"train_loss": -11.535391807556152, "global_step": 483958, "epoch": 2880} {"train_loss": -11.447604179382324, "global_step": 483959, "epoch": 2880} {"train_loss": -10.058815956115723, "global_step": 483960, "epoch": 2880} {"train_loss": -11.291910171508789, "global_step": 483961, "epoch": 2880} {"train_loss": -10.698863983154297, "global_step": 483962, "epoch": 2880} {"train_loss": -10.983912467956543, "global_step": 483963, "epoch": 2880} {"train_loss": -9.766580581665039, "global_step": 483964, "epoch": 2880} {"train_loss": -9.41734504699707, "global_step": 483965, "epoch": 2880} {"train_loss": -10.098076820373535, "global_step": 483966, "epoch": 2880} {"train_loss": -9.14222240447998, "global_step": 483967, "epoch": 2880} {"train_loss": -9.7158842086792, "global_step": 483968, "epoch": 2880} {"train_loss": -9.68136215209961, "global_step": 483969, "epoch": 2880} {"train_loss": -9.334933280944824, "global_step": 483970, "epoch": 2880} {"train_loss": -9.903996467590332, "global_step": 483971, "epoch": 2880} {"train_loss": -9.880725860595703, "global_step": 483972, "epoch": 2880} {"train_loss": -9.616744995117188, "global_step": 483973, "epoch": 2880} {"train_loss": -9.921440124511719, "global_step": 483974, "epoch": 2880} {"train_loss": -10.446690559387207, "global_step": 483975, "epoch": 2880} {"train_loss": -10.86182689666748, "global_step": 483976, "epoch": 2880} {"train_loss": -10.902421951293945, "global_step": 483977, "epoch": 2880} {"train_loss": -10.933793067932129, "global_step": 483978, "epoch": 2880} {"train_loss": -11.759658813476562, "global_step": 483979, "epoch": 2880} {"train_loss": -10.841730117797852, "global_step": 483980, "epoch": 2880} {"train_loss": -10.593260765075684, "global_step": 483981, "epoch": 2880} {"train_loss": -11.415569305419922, "global_step": 483982, "epoch": 2880} {"train_loss": -11.440872192382812, "global_step": 483983, "epoch": 2880} {"train_loss": -10.608704566955566, "global_step": 483984, "epoch": 2880} {"train_loss": -11.96850872039795, "global_step": 483985, "epoch": 2880} {"train_loss": -11.303047180175781, "global_step": 483986, "epoch": 2880} {"train_loss": -10.804128646850586, "global_step": 483987, "epoch": 2880} {"train_loss": -11.955431938171387, "global_step": 483988, "epoch": 2880} {"train_loss": -10.689800262451172, "global_step": 483989, "epoch": 2880} {"train_loss": -11.229764938354492, "global_step": 483990, "epoch": 2880} {"train_loss": -11.40247917175293, "global_step": 483991, "epoch": 2880} {"train_loss": -11.268253326416016, "global_step": 483992, "epoch": 2880} {"train_loss": -11.574607849121094, "global_step": 483993, "epoch": 2880} {"train_loss": -11.697591781616211, "global_step": 483994, "epoch": 2880} {"train_loss": -11.737614631652832, "global_step": 483995, "epoch": 2880} {"train_loss": -12.058757781982422, "global_step": 483996, "epoch": 2880} {"train_loss": -12.012413024902344, "global_step": 483997, "epoch": 2880} {"train_loss": -11.802834510803223, "global_step": 483998, "epoch": 2880} {"train_loss": -12.132319450378418, "global_step": 483999, "epoch": 2880} {"train_loss": -12.204442977905273, "global_step": 484000, "epoch": 2880} {"train_loss": -11.998933792114258, "global_step": 484001, "epoch": 2880} {"train_loss": -11.824493408203125, "global_step": 484002, "epoch": 2880} {"train_loss": -12.264310836791992, "global_step": 484003, "epoch": 2880} {"train_loss": -12.160453796386719, "global_step": 484004, "epoch": 2880} {"train_loss": -12.208847999572754, "global_step": 484005, "epoch": 2880} {"train_loss": -12.134490966796875, "global_step": 484006, "epoch": 2880} {"train_loss": -11.748059454418364, "global_step": 484007, "epoch": 2880, "val_loss": 317378.71875, "train_action_mse_error": 1.4111206531524658} {"train_loss": -11.8877592086792, "global_step": 484008, "epoch": 2881} {"train_loss": -12.433338165283203, "global_step": 484009, "epoch": 2881} {"train_loss": -12.099082946777344, "global_step": 484010, "epoch": 2881} {"train_loss": -12.070294380187988, "global_step": 484011, "epoch": 2881} {"train_loss": -12.212303161621094, "global_step": 484012, "epoch": 2881} {"train_loss": -12.37791919708252, "global_step": 484013, "epoch": 2881} {"train_loss": -12.407890319824219, "global_step": 484014, "epoch": 2881} {"train_loss": -12.254356384277344, "global_step": 484015, "epoch": 2881} {"train_loss": -12.528398513793945, "global_step": 484016, "epoch": 2881} {"train_loss": -12.448183059692383, "global_step": 484017, "epoch": 2881} {"train_loss": -12.52406120300293, "global_step": 484018, "epoch": 2881} {"train_loss": -12.415793418884277, "global_step": 484019, "epoch": 2881} {"train_loss": -12.698553085327148, "global_step": 484020, "epoch": 2881} {"train_loss": -12.389655113220215, "global_step": 484021, "epoch": 2881} {"train_loss": -12.678943634033203, "global_step": 484022, "epoch": 2881} {"train_loss": -12.836204528808594, "global_step": 484023, "epoch": 2881} {"train_loss": -12.67266845703125, "global_step": 484024, "epoch": 2881} {"train_loss": -12.650144577026367, "global_step": 484025, "epoch": 2881} {"train_loss": -12.883980751037598, "global_step": 484026, "epoch": 2881} {"train_loss": -12.558879852294922, "global_step": 484027, "epoch": 2881} {"train_loss": -12.672874450683594, "global_step": 484028, "epoch": 2881} {"train_loss": -12.60584545135498, "global_step": 484029, "epoch": 2881} {"train_loss": -12.671844482421875, "global_step": 484030, "epoch": 2881} {"train_loss": -12.671758651733398, "global_step": 484031, "epoch": 2881} {"train_loss": -12.68209457397461, "global_step": 484032, "epoch": 2881} {"train_loss": -12.790138244628906, "global_step": 484033, "epoch": 2881} {"train_loss": -12.692012786865234, "global_step": 484034, "epoch": 2881} {"train_loss": -12.867196083068848, "global_step": 484035, "epoch": 2881} {"train_loss": -12.638917922973633, "global_step": 484036, "epoch": 2881} {"train_loss": -12.638970375061035, "global_step": 484037, "epoch": 2881} {"train_loss": -12.645027160644531, "global_step": 484038, "epoch": 2881} {"train_loss": -12.91203498840332, "global_step": 484039, "epoch": 2881} {"train_loss": -12.790163040161133, "global_step": 484040, "epoch": 2881} {"train_loss": -12.72913932800293, "global_step": 484041, "epoch": 2881} {"train_loss": -12.627467155456543, "global_step": 484042, "epoch": 2881} {"train_loss": -12.697440147399902, "global_step": 484043, "epoch": 2881} {"train_loss": -12.789753913879395, "global_step": 484044, "epoch": 2881} {"train_loss": -12.618400573730469, "global_step": 484045, "epoch": 2881} {"train_loss": -12.724302291870117, "global_step": 484046, "epoch": 2881} {"train_loss": -12.70173454284668, "global_step": 484047, "epoch": 2881} {"train_loss": -12.71059513092041, "global_step": 484048, "epoch": 2881} {"train_loss": -13.077775001525879, "global_step": 484049, "epoch": 2881} {"train_loss": -12.87121295928955, "global_step": 484050, "epoch": 2881} {"train_loss": -13.005315780639648, "global_step": 484051, "epoch": 2881} {"train_loss": -12.890052795410156, "global_step": 484052, "epoch": 2881} {"train_loss": -12.907958984375, "global_step": 484053, "epoch": 2881} {"train_loss": -12.755796432495117, "global_step": 484054, "epoch": 2881} {"train_loss": -12.580183982849121, "global_step": 484055, "epoch": 2881} {"train_loss": -12.90615463256836, "global_step": 484056, "epoch": 2881} {"train_loss": -12.928267478942871, "global_step": 484057, "epoch": 2881} {"train_loss": -12.95986270904541, "global_step": 484058, "epoch": 2881} {"train_loss": -12.721244812011719, "global_step": 484059, "epoch": 2881} {"train_loss": -13.056618690490723, "global_step": 484060, "epoch": 2881} {"train_loss": -12.8804349899292, "global_step": 484061, "epoch": 2881} {"train_loss": -12.965993881225586, "global_step": 484062, "epoch": 2881} {"train_loss": -12.932873725891113, "global_step": 484063, "epoch": 2881} {"train_loss": -12.949483871459961, "global_step": 484064, "epoch": 2881} {"train_loss": -12.964937210083008, "global_step": 484065, "epoch": 2881} {"train_loss": -12.82748031616211, "global_step": 484066, "epoch": 2881} {"train_loss": -12.793816566467285, "global_step": 484067, "epoch": 2881} {"train_loss": -12.821680068969727, "global_step": 484068, "epoch": 2881} {"train_loss": -12.869441986083984, "global_step": 484069, "epoch": 2881} {"train_loss": -12.984193801879883, "global_step": 484070, "epoch": 2881} {"train_loss": -12.949188232421875, "global_step": 484071, "epoch": 2881} {"train_loss": -12.814574241638184, "global_step": 484072, "epoch": 2881} {"train_loss": -12.757123947143555, "global_step": 484073, "epoch": 2881} {"train_loss": -13.077754020690918, "global_step": 484074, "epoch": 2881} {"train_loss": -12.867233276367188, "global_step": 484075, "epoch": 2881} {"train_loss": -12.888246536254883, "global_step": 484076, "epoch": 2881} {"train_loss": -12.656759262084961, "global_step": 484077, "epoch": 2881} {"train_loss": -12.716062545776367, "global_step": 484078, "epoch": 2881} {"train_loss": -12.755067825317383, "global_step": 484079, "epoch": 2881} {"train_loss": -12.948809623718262, "global_step": 484080, "epoch": 2881} {"train_loss": -12.954475402832031, "global_step": 484081, "epoch": 2881} {"train_loss": -13.002279281616211, "global_step": 484082, "epoch": 2881} {"train_loss": -12.752071380615234, "global_step": 484083, "epoch": 2881} {"train_loss": -12.8728666305542, "global_step": 484084, "epoch": 2881} {"train_loss": -12.777328491210938, "global_step": 484085, "epoch": 2881} {"train_loss": -13.147515296936035, "global_step": 484086, "epoch": 2881} {"train_loss": -12.710702896118164, "global_step": 484087, "epoch": 2881} {"train_loss": -12.929454803466797, "global_step": 484088, "epoch": 2881} {"train_loss": -12.694045066833496, "global_step": 484089, "epoch": 2881} {"train_loss": -12.41683578491211, "global_step": 484090, "epoch": 2881} {"train_loss": -12.513246536254883, "global_step": 484091, "epoch": 2881} {"train_loss": -12.472537994384766, "global_step": 484092, "epoch": 2881} {"train_loss": -12.917530059814453, "global_step": 484093, "epoch": 2881} {"train_loss": -12.452353477478027, "global_step": 484094, "epoch": 2881} {"train_loss": -12.984689712524414, "global_step": 484095, "epoch": 2881} {"train_loss": -12.413409233093262, "global_step": 484096, "epoch": 2881} {"train_loss": -12.608283996582031, "global_step": 484097, "epoch": 2881} {"train_loss": -12.576169967651367, "global_step": 484098, "epoch": 2881} {"train_loss": -12.816329956054688, "global_step": 484099, "epoch": 2881} {"train_loss": -12.69725513458252, "global_step": 484100, "epoch": 2881} {"train_loss": -12.641764640808105, "global_step": 484101, "epoch": 2881} {"train_loss": -12.505487442016602, "global_step": 484102, "epoch": 2881} {"train_loss": -12.228067398071289, "global_step": 484103, "epoch": 2881} {"train_loss": -11.953580856323242, "global_step": 484104, "epoch": 2881} {"train_loss": -12.786348342895508, "global_step": 484105, "epoch": 2881} {"train_loss": -12.689920425415039, "global_step": 484106, "epoch": 2881} {"train_loss": -11.6727294921875, "global_step": 484107, "epoch": 2881} {"train_loss": -11.981217384338379, "global_step": 484108, "epoch": 2881} {"train_loss": -12.410346984863281, "global_step": 484109, "epoch": 2881} {"train_loss": -11.2802095413208, "global_step": 484110, "epoch": 2881} {"train_loss": -9.453556060791016, "global_step": 484111, "epoch": 2881} {"train_loss": -11.912668228149414, "global_step": 484112, "epoch": 2881} {"train_loss": -8.386711120605469, "global_step": 484113, "epoch": 2881} {"train_loss": -9.336586952209473, "global_step": 484114, "epoch": 2881} {"train_loss": -9.754545211791992, "global_step": 484115, "epoch": 2881} {"train_loss": -11.127631187438965, "global_step": 484116, "epoch": 2881} {"train_loss": -8.664217948913574, "global_step": 484117, "epoch": 2881} {"train_loss": -10.659479141235352, "global_step": 484118, "epoch": 2881} {"train_loss": -9.68874740600586, "global_step": 484119, "epoch": 2881} {"train_loss": -9.403430938720703, "global_step": 484120, "epoch": 2881} {"train_loss": -8.153944969177246, "global_step": 484121, "epoch": 2881} {"train_loss": -9.624454498291016, "global_step": 484122, "epoch": 2881} {"train_loss": -10.980941772460938, "global_step": 484123, "epoch": 2881} {"train_loss": -10.663644790649414, "global_step": 484124, "epoch": 2881} {"train_loss": -10.472318649291992, "global_step": 484125, "epoch": 2881} {"train_loss": -11.54570484161377, "global_step": 484126, "epoch": 2881} {"train_loss": -10.867347717285156, "global_step": 484127, "epoch": 2881} {"train_loss": -11.98134708404541, "global_step": 484128, "epoch": 2881} {"train_loss": -11.25115966796875, "global_step": 484129, "epoch": 2881} {"train_loss": -10.884599685668945, "global_step": 484130, "epoch": 2881} {"train_loss": -11.097076416015625, "global_step": 484131, "epoch": 2881} {"train_loss": -11.894267082214355, "global_step": 484132, "epoch": 2881} {"train_loss": -11.595263481140137, "global_step": 484133, "epoch": 2881} {"train_loss": -11.64508056640625, "global_step": 484134, "epoch": 2881} {"train_loss": -11.981223106384277, "global_step": 484135, "epoch": 2881} {"train_loss": -11.471153259277344, "global_step": 484136, "epoch": 2881} {"train_loss": -11.590909957885742, "global_step": 484137, "epoch": 2881} {"train_loss": -11.551763534545898, "global_step": 484138, "epoch": 2881} {"train_loss": -12.25575065612793, "global_step": 484139, "epoch": 2881} {"train_loss": -11.88473892211914, "global_step": 484140, "epoch": 2881} {"train_loss": -11.725360870361328, "global_step": 484141, "epoch": 2881} {"train_loss": -11.96953296661377, "global_step": 484142, "epoch": 2881} {"train_loss": -11.535650253295898, "global_step": 484143, "epoch": 2881} {"train_loss": -12.14766788482666, "global_step": 484144, "epoch": 2881} {"train_loss": -11.715927124023438, "global_step": 484145, "epoch": 2881} {"train_loss": -12.304830551147461, "global_step": 484146, "epoch": 2881} {"train_loss": -11.282059669494629, "global_step": 484147, "epoch": 2881} {"train_loss": -12.262533187866211, "global_step": 484148, "epoch": 2881} {"train_loss": -12.065167427062988, "global_step": 484149, "epoch": 2881} {"train_loss": -11.950201034545898, "global_step": 484150, "epoch": 2881} {"train_loss": -12.510976791381836, "global_step": 484151, "epoch": 2881} {"train_loss": -11.933980941772461, "global_step": 484152, "epoch": 2881} {"train_loss": -12.08991813659668, "global_step": 484153, "epoch": 2881} {"train_loss": -12.289870262145996, "global_step": 484154, "epoch": 2881} {"train_loss": -12.456302642822266, "global_step": 484155, "epoch": 2881} {"train_loss": -12.360044479370117, "global_step": 484156, "epoch": 2881} {"train_loss": -12.209132194519043, "global_step": 484157, "epoch": 2881} {"train_loss": -12.381654739379883, "global_step": 484158, "epoch": 2881} {"train_loss": -12.370399475097656, "global_step": 484159, "epoch": 2881} {"train_loss": -12.239584922790527, "global_step": 484160, "epoch": 2881} {"train_loss": -12.446368217468262, "global_step": 484161, "epoch": 2881} {"train_loss": -12.668490409851074, "global_step": 484162, "epoch": 2881} {"train_loss": -12.555746078491211, "global_step": 484163, "epoch": 2881} {"train_loss": -12.650833129882812, "global_step": 484164, "epoch": 2881} {"train_loss": -12.744121551513672, "global_step": 484165, "epoch": 2881} {"train_loss": -12.696880340576172, "global_step": 484166, "epoch": 2881} {"train_loss": -12.790704727172852, "global_step": 484167, "epoch": 2881} {"train_loss": -12.56370735168457, "global_step": 484168, "epoch": 2881} {"train_loss": -12.800333023071289, "global_step": 484169, "epoch": 2881} {"train_loss": -12.823333740234375, "global_step": 484170, "epoch": 2881} {"train_loss": -12.856212615966797, "global_step": 484171, "epoch": 2881} {"train_loss": -12.49787712097168, "global_step": 484172, "epoch": 2881} {"train_loss": -12.899782180786133, "global_step": 484173, "epoch": 2881} {"train_loss": -12.914840698242188, "global_step": 484174, "epoch": 2881} {"train_loss": -12.255704732168288, "global_step": 484175, "epoch": 2881, "val_loss": 311954.875} {"train_loss": -12.869688034057617, "global_step": 484176, "epoch": 2882} {"train_loss": -12.618509292602539, "global_step": 484177, "epoch": 2882} {"train_loss": -12.673871994018555, "global_step": 484178, "epoch": 2882} {"train_loss": -12.60586166381836, "global_step": 484179, "epoch": 2882} {"train_loss": -12.541415214538574, "global_step": 484180, "epoch": 2882} {"train_loss": -12.574701309204102, "global_step": 484181, "epoch": 2882} {"train_loss": -12.792131423950195, "global_step": 484182, "epoch": 2882} {"train_loss": -12.788459777832031, "global_step": 484183, "epoch": 2882} {"train_loss": -12.539142608642578, "global_step": 484184, "epoch": 2882} {"train_loss": -12.767812728881836, "global_step": 484185, "epoch": 2882} {"train_loss": -12.665593147277832, "global_step": 484186, "epoch": 2882} {"train_loss": -12.922403335571289, "global_step": 484187, "epoch": 2882} {"train_loss": -12.54127311706543, "global_step": 484188, "epoch": 2882} {"train_loss": -12.461591720581055, "global_step": 484189, "epoch": 2882} {"train_loss": -13.031025886535645, "global_step": 484190, "epoch": 2882} {"train_loss": -12.766704559326172, "global_step": 484191, "epoch": 2882} {"train_loss": -12.852872848510742, "global_step": 484192, "epoch": 2882} {"train_loss": -12.564311981201172, "global_step": 484193, "epoch": 2882} {"train_loss": -12.770830154418945, "global_step": 484194, "epoch": 2882} {"train_loss": -12.793679237365723, "global_step": 484195, "epoch": 2882} {"train_loss": -12.588541030883789, "global_step": 484196, "epoch": 2882} {"train_loss": -12.527016639709473, "global_step": 484197, "epoch": 2882} {"train_loss": -12.876120567321777, "global_step": 484198, "epoch": 2882} {"train_loss": -12.416419982910156, "global_step": 484199, "epoch": 2882} {"train_loss": -12.382498741149902, "global_step": 484200, "epoch": 2882} {"train_loss": -12.51953125, "global_step": 484201, "epoch": 2882} {"train_loss": -12.363247871398926, "global_step": 484202, "epoch": 2882} {"train_loss": -12.520118713378906, "global_step": 484203, "epoch": 2882} {"train_loss": -12.572702407836914, "global_step": 484204, "epoch": 2882} {"train_loss": -12.704928398132324, "global_step": 484205, "epoch": 2882} {"train_loss": -12.299176216125488, "global_step": 484206, "epoch": 2882} {"train_loss": -12.641905784606934, "global_step": 484207, "epoch": 2882} {"train_loss": -12.677104949951172, "global_step": 484208, "epoch": 2882} {"train_loss": -12.75306510925293, "global_step": 484209, "epoch": 2882} {"train_loss": -12.514657020568848, "global_step": 484210, "epoch": 2882} {"train_loss": -12.83663558959961, "global_step": 484211, "epoch": 2882} {"train_loss": -12.580000877380371, "global_step": 484212, "epoch": 2882} {"train_loss": -12.736082077026367, "global_step": 484213, "epoch": 2882} {"train_loss": -12.524564743041992, "global_step": 484214, "epoch": 2882} {"train_loss": -12.522294044494629, "global_step": 484215, "epoch": 2882} {"train_loss": -12.221202850341797, "global_step": 484216, "epoch": 2882} {"train_loss": -11.454988479614258, "global_step": 484217, "epoch": 2882} {"train_loss": -11.820127487182617, "global_step": 484218, "epoch": 2882} {"train_loss": -11.586065292358398, "global_step": 484219, "epoch": 2882} {"train_loss": -11.459742546081543, "global_step": 484220, "epoch": 2882} {"train_loss": -10.924156188964844, "global_step": 484221, "epoch": 2882} {"train_loss": -11.482980728149414, "global_step": 484222, "epoch": 2882} {"train_loss": -10.843100547790527, "global_step": 484223, "epoch": 2882} {"train_loss": -12.291580200195312, "global_step": 484224, "epoch": 2882} {"train_loss": -11.753183364868164, "global_step": 484225, "epoch": 2882} {"train_loss": -12.401632308959961, "global_step": 484226, "epoch": 2882} {"train_loss": -11.62177562713623, "global_step": 484227, "epoch": 2882} {"train_loss": -11.498397827148438, "global_step": 484228, "epoch": 2882} {"train_loss": -12.435033798217773, "global_step": 484229, "epoch": 2882} {"train_loss": -12.036527633666992, "global_step": 484230, "epoch": 2882} {"train_loss": -12.51754379272461, "global_step": 484231, "epoch": 2882} {"train_loss": -11.30321979522705, "global_step": 484232, "epoch": 2882} {"train_loss": -12.264016151428223, "global_step": 484233, "epoch": 2882} {"train_loss": -12.353177070617676, "global_step": 484234, "epoch": 2882} {"train_loss": -12.65974235534668, "global_step": 484235, "epoch": 2882} {"train_loss": -12.37806224822998, "global_step": 484236, "epoch": 2882} {"train_loss": -12.634401321411133, "global_step": 484237, "epoch": 2882} {"train_loss": -11.966206550598145, "global_step": 484238, "epoch": 2882} {"train_loss": -11.925994873046875, "global_step": 484239, "epoch": 2882} {"train_loss": -12.771635055541992, "global_step": 484240, "epoch": 2882} {"train_loss": -11.893054008483887, "global_step": 484241, "epoch": 2882} {"train_loss": -11.383642196655273, "global_step": 484242, "epoch": 2882} {"train_loss": -12.478759765625, "global_step": 484243, "epoch": 2882} {"train_loss": -11.86520767211914, "global_step": 484244, "epoch": 2882} {"train_loss": -11.878690719604492, "global_step": 484245, "epoch": 2882} {"train_loss": -12.184837341308594, "global_step": 484246, "epoch": 2882} {"train_loss": -12.474739074707031, "global_step": 484247, "epoch": 2882} {"train_loss": -12.301844596862793, "global_step": 484248, "epoch": 2882} {"train_loss": -12.187801361083984, "global_step": 484249, "epoch": 2882} {"train_loss": -12.076226234436035, "global_step": 484250, "epoch": 2882} {"train_loss": -12.289291381835938, "global_step": 484251, "epoch": 2882} {"train_loss": -11.829633712768555, "global_step": 484252, "epoch": 2882} {"train_loss": -12.453777313232422, "global_step": 484253, "epoch": 2882} {"train_loss": -11.922069549560547, "global_step": 484254, "epoch": 2882} {"train_loss": -12.575127601623535, "global_step": 484255, "epoch": 2882} {"train_loss": -11.93541145324707, "global_step": 484256, "epoch": 2882} {"train_loss": -11.941404342651367, "global_step": 484257, "epoch": 2882} {"train_loss": -12.409191131591797, "global_step": 484258, "epoch": 2882} {"train_loss": -12.469276428222656, "global_step": 484259, "epoch": 2882} {"train_loss": -12.461170196533203, "global_step": 484260, "epoch": 2882} {"train_loss": -12.586213111877441, "global_step": 484261, "epoch": 2882} {"train_loss": -12.559199333190918, "global_step": 484262, "epoch": 2882} {"train_loss": -12.55507755279541, "global_step": 484263, "epoch": 2882} {"train_loss": -12.484317779541016, "global_step": 484264, "epoch": 2882} {"train_loss": -11.494359970092773, "global_step": 484265, "epoch": 2882} {"train_loss": -12.091641426086426, "global_step": 484266, "epoch": 2882} {"train_loss": -12.39912223815918, "global_step": 484267, "epoch": 2882} {"train_loss": -11.886946678161621, "global_step": 484268, "epoch": 2882} {"train_loss": -12.084087371826172, "global_step": 484269, "epoch": 2882} {"train_loss": -12.450761795043945, "global_step": 484270, "epoch": 2882} {"train_loss": -12.247330665588379, "global_step": 484271, "epoch": 2882} {"train_loss": -12.330511093139648, "global_step": 484272, "epoch": 2882} {"train_loss": -12.228708267211914, "global_step": 484273, "epoch": 2882} {"train_loss": -12.362418174743652, "global_step": 484274, "epoch": 2882} {"train_loss": -12.489021301269531, "global_step": 484275, "epoch": 2882} {"train_loss": -12.202093124389648, "global_step": 484276, "epoch": 2882} {"train_loss": -12.450050354003906, "global_step": 484277, "epoch": 2882} {"train_loss": -12.505563735961914, "global_step": 484278, "epoch": 2882} {"train_loss": -12.311362266540527, "global_step": 484279, "epoch": 2882} {"train_loss": -12.671693801879883, "global_step": 484280, "epoch": 2882} {"train_loss": -12.536630630493164, "global_step": 484281, "epoch": 2882} {"train_loss": -11.920980453491211, "global_step": 484282, "epoch": 2882} {"train_loss": -12.151573181152344, "global_step": 484283, "epoch": 2882} {"train_loss": -12.54328727722168, "global_step": 484284, "epoch": 2882} {"train_loss": -11.679147720336914, "global_step": 484285, "epoch": 2882} {"train_loss": -12.242130279541016, "global_step": 484286, "epoch": 2882} {"train_loss": -12.330442428588867, "global_step": 484287, "epoch": 2882} {"train_loss": -12.24705696105957, "global_step": 484288, "epoch": 2882} {"train_loss": -12.776763916015625, "global_step": 484289, "epoch": 2882} {"train_loss": -12.66316032409668, "global_step": 484290, "epoch": 2882} {"train_loss": -12.543562889099121, "global_step": 484291, "epoch": 2882} {"train_loss": -12.583942413330078, "global_step": 484292, "epoch": 2882} {"train_loss": -12.900211334228516, "global_step": 484293, "epoch": 2882} {"train_loss": -12.571954727172852, "global_step": 484294, "epoch": 2882} {"train_loss": -12.634475708007812, "global_step": 484295, "epoch": 2882} {"train_loss": -12.295223236083984, "global_step": 484296, "epoch": 2882} {"train_loss": -12.075982093811035, "global_step": 484297, "epoch": 2882} {"train_loss": -11.796337127685547, "global_step": 484298, "epoch": 2882} {"train_loss": -12.741473197937012, "global_step": 484299, "epoch": 2882} {"train_loss": -11.823210716247559, "global_step": 484300, "epoch": 2882} {"train_loss": -12.036523818969727, "global_step": 484301, "epoch": 2882} {"train_loss": -12.697881698608398, "global_step": 484302, "epoch": 2882} {"train_loss": -11.865854263305664, "global_step": 484303, "epoch": 2882} {"train_loss": -12.272089004516602, "global_step": 484304, "epoch": 2882} {"train_loss": -12.879124641418457, "global_step": 484305, "epoch": 2882} {"train_loss": -12.453399658203125, "global_step": 484306, "epoch": 2882} {"train_loss": -11.89503288269043, "global_step": 484307, "epoch": 2882} {"train_loss": -12.585505485534668, "global_step": 484308, "epoch": 2882} {"train_loss": -12.623464584350586, "global_step": 484309, "epoch": 2882} {"train_loss": -12.363038063049316, "global_step": 484310, "epoch": 2882} {"train_loss": -12.655550003051758, "global_step": 484311, "epoch": 2882} {"train_loss": -12.474798202514648, "global_step": 484312, "epoch": 2882} {"train_loss": -12.25306510925293, "global_step": 484313, "epoch": 2882} {"train_loss": -12.953362464904785, "global_step": 484314, "epoch": 2882} {"train_loss": -12.291542053222656, "global_step": 484315, "epoch": 2882} {"train_loss": -12.784077644348145, "global_step": 484316, "epoch": 2882} {"train_loss": -12.558813095092773, "global_step": 484317, "epoch": 2882} {"train_loss": -12.717050552368164, "global_step": 484318, "epoch": 2882} {"train_loss": -12.612736701965332, "global_step": 484319, "epoch": 2882} {"train_loss": -12.356351852416992, "global_step": 484320, "epoch": 2882} {"train_loss": -12.691232681274414, "global_step": 484321, "epoch": 2882} {"train_loss": -12.582650184631348, "global_step": 484322, "epoch": 2882} {"train_loss": -12.119359970092773, "global_step": 484323, "epoch": 2882} {"train_loss": -12.734296798706055, "global_step": 484324, "epoch": 2882} {"train_loss": -12.467357635498047, "global_step": 484325, "epoch": 2882} {"train_loss": -11.888251304626465, "global_step": 484326, "epoch": 2882} {"train_loss": -12.417508125305176, "global_step": 484327, "epoch": 2882} {"train_loss": -11.930370330810547, "global_step": 484328, "epoch": 2882} {"train_loss": -12.510720252990723, "global_step": 484329, "epoch": 2882} {"train_loss": -12.464897155761719, "global_step": 484330, "epoch": 2882} {"train_loss": -11.990537643432617, "global_step": 484331, "epoch": 2882} {"train_loss": -11.718461036682129, "global_step": 484332, "epoch": 2882} {"train_loss": -12.661514282226562, "global_step": 484333, "epoch": 2882} {"train_loss": -12.701562881469727, "global_step": 484334, "epoch": 2882} {"train_loss": -12.581165313720703, "global_step": 484335, "epoch": 2882} {"train_loss": -12.644319534301758, "global_step": 484336, "epoch": 2882} {"train_loss": -12.724815368652344, "global_step": 484337, "epoch": 2882} {"train_loss": -12.523929595947266, "global_step": 484338, "epoch": 2882} {"train_loss": -12.753890991210938, "global_step": 484339, "epoch": 2882} {"train_loss": -12.45776653289795, "global_step": 484340, "epoch": 2882} {"train_loss": -12.810559272766113, "global_step": 484341, "epoch": 2882} {"train_loss": -12.506975173950195, "global_step": 484342, "epoch": 2882} {"train_loss": -12.356906067757379, "global_step": 484343, "epoch": 2882, "val_loss": 316688.84375} {"train_loss": -12.84132194519043, "global_step": 484344, "epoch": 2883} {"train_loss": -12.274582862854004, "global_step": 484345, "epoch": 2883} {"train_loss": -12.297781944274902, "global_step": 484346, "epoch": 2883} {"train_loss": -12.764759063720703, "global_step": 484347, "epoch": 2883} {"train_loss": -12.652929306030273, "global_step": 484348, "epoch": 2883} {"train_loss": -12.80842399597168, "global_step": 484349, "epoch": 2883} {"train_loss": -12.912789344787598, "global_step": 484350, "epoch": 2883} {"train_loss": -12.685338973999023, "global_step": 484351, "epoch": 2883} {"train_loss": -12.56884765625, "global_step": 484352, "epoch": 2883} {"train_loss": -12.857782363891602, "global_step": 484353, "epoch": 2883} {"train_loss": -12.369461059570312, "global_step": 484354, "epoch": 2883} {"train_loss": -12.717782020568848, "global_step": 484355, "epoch": 2883} {"train_loss": -12.641676902770996, "global_step": 484356, "epoch": 2883} {"train_loss": -12.784513473510742, "global_step": 484357, "epoch": 2883} {"train_loss": -12.569311141967773, "global_step": 484358, "epoch": 2883} {"train_loss": -12.710123062133789, "global_step": 484359, "epoch": 2883} {"train_loss": -12.710243225097656, "global_step": 484360, "epoch": 2883} {"train_loss": -12.8720121383667, "global_step": 484361, "epoch": 2883} {"train_loss": -12.052970886230469, "global_step": 484362, "epoch": 2883} {"train_loss": -12.360148429870605, "global_step": 484363, "epoch": 2883} {"train_loss": -12.517812728881836, "global_step": 484364, "epoch": 2883} {"train_loss": -12.4422025680542, "global_step": 484365, "epoch": 2883} {"train_loss": -12.7684326171875, "global_step": 484366, "epoch": 2883} {"train_loss": -12.148207664489746, "global_step": 484367, "epoch": 2883} {"train_loss": -12.692970275878906, "global_step": 484368, "epoch": 2883} {"train_loss": -12.378974914550781, "global_step": 484369, "epoch": 2883} {"train_loss": -12.573968887329102, "global_step": 484370, "epoch": 2883} {"train_loss": -12.113164901733398, "global_step": 484371, "epoch": 2883} {"train_loss": -12.960692405700684, "global_step": 484372, "epoch": 2883} {"train_loss": -12.007966995239258, "global_step": 484373, "epoch": 2883} {"train_loss": -11.855703353881836, "global_step": 484374, "epoch": 2883} {"train_loss": -11.925322532653809, "global_step": 484375, "epoch": 2883} {"train_loss": -12.688071250915527, "global_step": 484376, "epoch": 2883} {"train_loss": -11.19087028503418, "global_step": 484377, "epoch": 2883} {"train_loss": -12.23664379119873, "global_step": 484378, "epoch": 2883} {"train_loss": -12.087760925292969, "global_step": 484379, "epoch": 2883} {"train_loss": -12.101228713989258, "global_step": 484380, "epoch": 2883} {"train_loss": -12.519548416137695, "global_step": 484381, "epoch": 2883} {"train_loss": -11.748615264892578, "global_step": 484382, "epoch": 2883} {"train_loss": -12.7127685546875, "global_step": 484383, "epoch": 2883} {"train_loss": -11.553430557250977, "global_step": 484384, "epoch": 2883} {"train_loss": -10.223544120788574, "global_step": 484385, "epoch": 2883} {"train_loss": -12.245079040527344, "global_step": 484386, "epoch": 2883} {"train_loss": -11.482392311096191, "global_step": 484387, "epoch": 2883} {"train_loss": -12.271617889404297, "global_step": 484388, "epoch": 2883} {"train_loss": -11.670560836791992, "global_step": 484389, "epoch": 2883} {"train_loss": -12.188941955566406, "global_step": 484390, "epoch": 2883} {"train_loss": -12.004779815673828, "global_step": 484391, "epoch": 2883} {"train_loss": -11.991888999938965, "global_step": 484392, "epoch": 2883} {"train_loss": -12.105199813842773, "global_step": 484393, "epoch": 2883} {"train_loss": -12.423135757446289, "global_step": 484394, "epoch": 2883} {"train_loss": -12.233325958251953, "global_step": 484395, "epoch": 2883} {"train_loss": -12.323405265808105, "global_step": 484396, "epoch": 2883} {"train_loss": -12.32642936706543, "global_step": 484397, "epoch": 2883} {"train_loss": -12.294307708740234, "global_step": 484398, "epoch": 2883} {"train_loss": -12.138397216796875, "global_step": 484399, "epoch": 2883} {"train_loss": -12.653971672058105, "global_step": 484400, "epoch": 2883} {"train_loss": -12.654267311096191, "global_step": 484401, "epoch": 2883} {"train_loss": -12.332359313964844, "global_step": 484402, "epoch": 2883} {"train_loss": -12.283910751342773, "global_step": 484403, "epoch": 2883} {"train_loss": -12.69948959350586, "global_step": 484404, "epoch": 2883} {"train_loss": -12.19140911102295, "global_step": 484405, "epoch": 2883} {"train_loss": -12.725775718688965, "global_step": 484406, "epoch": 2883} {"train_loss": -12.80514907836914, "global_step": 484407, "epoch": 2883} {"train_loss": -12.091268539428711, "global_step": 484408, "epoch": 2883} {"train_loss": -12.168234825134277, "global_step": 484409, "epoch": 2883} {"train_loss": -12.55935001373291, "global_step": 484410, "epoch": 2883} {"train_loss": -12.683467864990234, "global_step": 484411, "epoch": 2883} {"train_loss": -12.61949348449707, "global_step": 484412, "epoch": 2883} {"train_loss": -12.450875282287598, "global_step": 484413, "epoch": 2883} {"train_loss": -12.618637084960938, "global_step": 484414, "epoch": 2883} {"train_loss": -12.453832626342773, "global_step": 484415, "epoch": 2883} {"train_loss": -12.565155029296875, "global_step": 484416, "epoch": 2883} {"train_loss": -12.506270408630371, "global_step": 484417, "epoch": 2883} {"train_loss": -12.797727584838867, "global_step": 484418, "epoch": 2883} {"train_loss": -12.845582962036133, "global_step": 484419, "epoch": 2883} {"train_loss": -12.590209007263184, "global_step": 484420, "epoch": 2883} {"train_loss": -12.747735977172852, "global_step": 484421, "epoch": 2883} {"train_loss": -12.601211547851562, "global_step": 484422, "epoch": 2883} {"train_loss": -11.905885696411133, "global_step": 484423, "epoch": 2883} {"train_loss": -12.365922927856445, "global_step": 484424, "epoch": 2883} {"train_loss": -12.853949546813965, "global_step": 484425, "epoch": 2883} {"train_loss": -12.129522323608398, "global_step": 484426, "epoch": 2883} {"train_loss": -11.802656173706055, "global_step": 484427, "epoch": 2883} {"train_loss": -11.086828231811523, "global_step": 484428, "epoch": 2883} {"train_loss": -12.028541564941406, "global_step": 484429, "epoch": 2883} {"train_loss": -12.668402671813965, "global_step": 484430, "epoch": 2883} {"train_loss": -11.740745544433594, "global_step": 484431, "epoch": 2883} {"train_loss": -11.877811431884766, "global_step": 484432, "epoch": 2883} {"train_loss": -12.85754108428955, "global_step": 484433, "epoch": 2883} {"train_loss": -11.671490669250488, "global_step": 484434, "epoch": 2883} {"train_loss": -11.303983688354492, "global_step": 484435, "epoch": 2883} {"train_loss": -12.287857055664062, "global_step": 484436, "epoch": 2883} {"train_loss": -11.691940307617188, "global_step": 484437, "epoch": 2883} {"train_loss": -11.58156967163086, "global_step": 484438, "epoch": 2883} {"train_loss": -12.134395599365234, "global_step": 484439, "epoch": 2883} {"train_loss": -11.77039623260498, "global_step": 484440, "epoch": 2883} {"train_loss": -11.69192123413086, "global_step": 484441, "epoch": 2883} {"train_loss": -11.494606018066406, "global_step": 484442, "epoch": 2883} {"train_loss": -11.771562576293945, "global_step": 484443, "epoch": 2883} {"train_loss": -12.183856010437012, "global_step": 484444, "epoch": 2883} {"train_loss": -11.58841323852539, "global_step": 484445, "epoch": 2883} {"train_loss": -12.226534843444824, "global_step": 484446, "epoch": 2883} {"train_loss": -12.246021270751953, "global_step": 484447, "epoch": 2883} {"train_loss": -12.166976928710938, "global_step": 484448, "epoch": 2883} {"train_loss": -12.265616416931152, "global_step": 484449, "epoch": 2883} {"train_loss": -12.529729843139648, "global_step": 484450, "epoch": 2883} {"train_loss": -12.810958862304688, "global_step": 484451, "epoch": 2883} {"train_loss": -12.706243515014648, "global_step": 484452, "epoch": 2883} {"train_loss": -12.316282272338867, "global_step": 484453, "epoch": 2883} {"train_loss": -12.5613431930542, "global_step": 484454, "epoch": 2883} {"train_loss": -12.315303802490234, "global_step": 484455, "epoch": 2883} {"train_loss": -12.359006881713867, "global_step": 484456, "epoch": 2883} {"train_loss": -12.49228286743164, "global_step": 484457, "epoch": 2883} {"train_loss": -12.450518608093262, "global_step": 484458, "epoch": 2883} {"train_loss": -12.431879043579102, "global_step": 484459, "epoch": 2883} {"train_loss": -12.480920791625977, "global_step": 484460, "epoch": 2883} {"train_loss": -12.76809024810791, "global_step": 484461, "epoch": 2883} {"train_loss": -12.47226333618164, "global_step": 484462, "epoch": 2883} {"train_loss": -12.38913345336914, "global_step": 484463, "epoch": 2883} {"train_loss": -12.714926719665527, "global_step": 484464, "epoch": 2883} {"train_loss": -12.087068557739258, "global_step": 484465, "epoch": 2883} {"train_loss": -12.416658401489258, "global_step": 484466, "epoch": 2883} {"train_loss": -11.663333892822266, "global_step": 484467, "epoch": 2883} {"train_loss": -12.63335132598877, "global_step": 484468, "epoch": 2883} {"train_loss": -12.372573852539062, "global_step": 484469, "epoch": 2883} {"train_loss": -11.891748428344727, "global_step": 484470, "epoch": 2883} {"train_loss": -12.390233993530273, "global_step": 484471, "epoch": 2883} {"train_loss": -12.545193672180176, "global_step": 484472, "epoch": 2883} {"train_loss": -12.684165000915527, "global_step": 484473, "epoch": 2883} {"train_loss": -12.567377090454102, "global_step": 484474, "epoch": 2883} {"train_loss": -12.556251525878906, "global_step": 484475, "epoch": 2883} {"train_loss": -12.490551948547363, "global_step": 484476, "epoch": 2883} {"train_loss": -12.71468448638916, "global_step": 484477, "epoch": 2883} {"train_loss": -12.922554016113281, "global_step": 484478, "epoch": 2883} {"train_loss": -12.752021789550781, "global_step": 484479, "epoch": 2883} {"train_loss": -12.358184814453125, "global_step": 484480, "epoch": 2883} {"train_loss": -12.716690063476562, "global_step": 484481, "epoch": 2883} {"train_loss": -12.461432456970215, "global_step": 484482, "epoch": 2883} {"train_loss": -12.69919204711914, "global_step": 484483, "epoch": 2883} {"train_loss": -12.66984748840332, "global_step": 484484, "epoch": 2883} {"train_loss": -12.215770721435547, "global_step": 484485, "epoch": 2883} {"train_loss": -12.86250114440918, "global_step": 484486, "epoch": 2883} {"train_loss": -12.532328605651855, "global_step": 484487, "epoch": 2883} {"train_loss": -12.920208930969238, "global_step": 484488, "epoch": 2883} {"train_loss": -12.314901351928711, "global_step": 484489, "epoch": 2883} {"train_loss": -13.060370445251465, "global_step": 484490, "epoch": 2883} {"train_loss": -12.757445335388184, "global_step": 484491, "epoch": 2883} {"train_loss": -12.788414001464844, "global_step": 484492, "epoch": 2883} {"train_loss": -12.944925308227539, "global_step": 484493, "epoch": 2883} {"train_loss": -12.858560562133789, "global_step": 484494, "epoch": 2883} {"train_loss": -12.848751068115234, "global_step": 484495, "epoch": 2883} {"train_loss": -12.904854774475098, "global_step": 484496, "epoch": 2883} {"train_loss": -13.037395477294922, "global_step": 484497, "epoch": 2883} {"train_loss": -12.718230247497559, "global_step": 484498, "epoch": 2883} {"train_loss": -12.909978866577148, "global_step": 484499, "epoch": 2883} {"train_loss": -12.792694091796875, "global_step": 484500, "epoch": 2883} {"train_loss": -12.664265632629395, "global_step": 484501, "epoch": 2883} {"train_loss": -12.871614456176758, "global_step": 484502, "epoch": 2883} {"train_loss": -12.836713790893555, "global_step": 484503, "epoch": 2883} {"train_loss": -12.350251197814941, "global_step": 484504, "epoch": 2883} {"train_loss": -12.168113708496094, "global_step": 484505, "epoch": 2883} {"train_loss": -12.21441650390625, "global_step": 484506, "epoch": 2883} {"train_loss": -12.453086853027344, "global_step": 484507, "epoch": 2883} {"train_loss": -12.722110748291016, "global_step": 484508, "epoch": 2883} {"train_loss": -11.774365425109863, "global_step": 484509, "epoch": 2883} {"train_loss": -11.671493530273438, "global_step": 484510, "epoch": 2883} {"train_loss": -12.377254713149298, "global_step": 484511, "epoch": 2883, "val_loss": 318239.46875} {"train_loss": -12.456539154052734, "global_step": 484512, "epoch": 2884} {"train_loss": -11.426445007324219, "global_step": 484513, "epoch": 2884} {"train_loss": -12.147956848144531, "global_step": 484514, "epoch": 2884} {"train_loss": -11.327808380126953, "global_step": 484515, "epoch": 2884} {"train_loss": -11.525145530700684, "global_step": 484516, "epoch": 2884} {"train_loss": -11.238805770874023, "global_step": 484517, "epoch": 2884} {"train_loss": -12.226485252380371, "global_step": 484518, "epoch": 2884} {"train_loss": -12.054342269897461, "global_step": 484519, "epoch": 2884} {"train_loss": -11.51862907409668, "global_step": 484520, "epoch": 2884} {"train_loss": -11.424306869506836, "global_step": 484521, "epoch": 2884} {"train_loss": -11.97999382019043, "global_step": 484522, "epoch": 2884} {"train_loss": -12.010295867919922, "global_step": 484523, "epoch": 2884} {"train_loss": -11.953357696533203, "global_step": 484524, "epoch": 2884} {"train_loss": -11.95108413696289, "global_step": 484525, "epoch": 2884} {"train_loss": -12.208463668823242, "global_step": 484526, "epoch": 2884} {"train_loss": -12.175684928894043, "global_step": 484527, "epoch": 2884} {"train_loss": -12.314573287963867, "global_step": 484528, "epoch": 2884} {"train_loss": -12.52481460571289, "global_step": 484529, "epoch": 2884} {"train_loss": -12.386489868164062, "global_step": 484530, "epoch": 2884} {"train_loss": -12.835989952087402, "global_step": 484531, "epoch": 2884} {"train_loss": -12.342001914978027, "global_step": 484532, "epoch": 2884} {"train_loss": -12.794469833374023, "global_step": 484533, "epoch": 2884} {"train_loss": -12.321268081665039, "global_step": 484534, "epoch": 2884} {"train_loss": -12.418279647827148, "global_step": 484535, "epoch": 2884} {"train_loss": -12.89393138885498, "global_step": 484536, "epoch": 2884} {"train_loss": -12.901865005493164, "global_step": 484537, "epoch": 2884} {"train_loss": -12.68833065032959, "global_step": 484538, "epoch": 2884} {"train_loss": -12.8147611618042, "global_step": 484539, "epoch": 2884} {"train_loss": -12.843389511108398, "global_step": 484540, "epoch": 2884} {"train_loss": -12.614583969116211, "global_step": 484541, "epoch": 2884} {"train_loss": -12.57699966430664, "global_step": 484542, "epoch": 2884} {"train_loss": -13.04227352142334, "global_step": 484543, "epoch": 2884} {"train_loss": -12.271268844604492, "global_step": 484544, "epoch": 2884} {"train_loss": -12.156044960021973, "global_step": 484545, "epoch": 2884} {"train_loss": -12.56417465209961, "global_step": 484546, "epoch": 2884} {"train_loss": -12.504806518554688, "global_step": 484547, "epoch": 2884} {"train_loss": -12.261484146118164, "global_step": 484548, "epoch": 2884} {"train_loss": -11.753917694091797, "global_step": 484549, "epoch": 2884} {"train_loss": -12.193631172180176, "global_step": 484550, "epoch": 2884} {"train_loss": -11.908607482910156, "global_step": 484551, "epoch": 2884} {"train_loss": -12.187223434448242, "global_step": 484552, "epoch": 2884} {"train_loss": -11.66055679321289, "global_step": 484553, "epoch": 2884} {"train_loss": -12.37218952178955, "global_step": 484554, "epoch": 2884} {"train_loss": -12.162479400634766, "global_step": 484555, "epoch": 2884} {"train_loss": -12.248899459838867, "global_step": 484556, "epoch": 2884} {"train_loss": -11.904419898986816, "global_step": 484557, "epoch": 2884} {"train_loss": -12.539667129516602, "global_step": 484558, "epoch": 2884} {"train_loss": -11.7259521484375, "global_step": 484559, "epoch": 2884} {"train_loss": -12.37063980102539, "global_step": 484560, "epoch": 2884} {"train_loss": -12.278696060180664, "global_step": 484561, "epoch": 2884} {"train_loss": -12.28886604309082, "global_step": 484562, "epoch": 2884} {"train_loss": -12.459653854370117, "global_step": 484563, "epoch": 2884} {"train_loss": -12.526985168457031, "global_step": 484564, "epoch": 2884} {"train_loss": -12.518136024475098, "global_step": 484565, "epoch": 2884} {"train_loss": -12.66830825805664, "global_step": 484566, "epoch": 2884} {"train_loss": -12.571681022644043, "global_step": 484567, "epoch": 2884} {"train_loss": -12.4871244430542, "global_step": 484568, "epoch": 2884} {"train_loss": -12.771708488464355, "global_step": 484569, "epoch": 2884} {"train_loss": -12.553268432617188, "global_step": 484570, "epoch": 2884} {"train_loss": -12.869961738586426, "global_step": 484571, "epoch": 2884} {"train_loss": -12.559530258178711, "global_step": 484572, "epoch": 2884} {"train_loss": -12.831805229187012, "global_step": 484573, "epoch": 2884} {"train_loss": -12.719291687011719, "global_step": 484574, "epoch": 2884} {"train_loss": -12.723529815673828, "global_step": 484575, "epoch": 2884} {"train_loss": -12.776880264282227, "global_step": 484576, "epoch": 2884} {"train_loss": -12.769289016723633, "global_step": 484577, "epoch": 2884} {"train_loss": -12.837801933288574, "global_step": 484578, "epoch": 2884} {"train_loss": -12.810237884521484, "global_step": 484579, "epoch": 2884} {"train_loss": -12.931158065795898, "global_step": 484580, "epoch": 2884} {"train_loss": -12.739974021911621, "global_step": 484581, "epoch": 2884} {"train_loss": -12.910139083862305, "global_step": 484582, "epoch": 2884} {"train_loss": -12.764951705932617, "global_step": 484583, "epoch": 2884} {"train_loss": -12.953275680541992, "global_step": 484584, "epoch": 2884} {"train_loss": -12.9658203125, "global_step": 484585, "epoch": 2884} {"train_loss": -12.828402519226074, "global_step": 484586, "epoch": 2884} {"train_loss": -12.738855361938477, "global_step": 484587, "epoch": 2884} {"train_loss": -12.895065307617188, "global_step": 484588, "epoch": 2884} {"train_loss": -12.763565063476562, "global_step": 484589, "epoch": 2884} {"train_loss": -12.857526779174805, "global_step": 484590, "epoch": 2884} {"train_loss": -12.66411304473877, "global_step": 484591, "epoch": 2884} {"train_loss": -12.368488311767578, "global_step": 484592, "epoch": 2884} {"train_loss": -12.732076644897461, "global_step": 484593, "epoch": 2884} {"train_loss": -12.137876510620117, "global_step": 484594, "epoch": 2884} {"train_loss": -10.866107940673828, "global_step": 484595, "epoch": 2884} {"train_loss": -12.242061614990234, "global_step": 484596, "epoch": 2884} {"train_loss": -10.918553352355957, "global_step": 484597, "epoch": 2884} {"train_loss": -12.012433052062988, "global_step": 484598, "epoch": 2884} {"train_loss": -12.269436836242676, "global_step": 484599, "epoch": 2884} {"train_loss": -12.38417911529541, "global_step": 484600, "epoch": 2884} {"train_loss": -12.484942436218262, "global_step": 484601, "epoch": 2884} {"train_loss": -11.950708389282227, "global_step": 484602, "epoch": 2884} {"train_loss": -12.349949836730957, "global_step": 484603, "epoch": 2884} {"train_loss": -11.488507270812988, "global_step": 484604, "epoch": 2884} {"train_loss": -11.969064712524414, "global_step": 484605, "epoch": 2884} {"train_loss": -12.088918685913086, "global_step": 484606, "epoch": 2884} {"train_loss": -11.82103157043457, "global_step": 484607, "epoch": 2884} {"train_loss": -12.273085594177246, "global_step": 484608, "epoch": 2884} {"train_loss": -11.672189712524414, "global_step": 484609, "epoch": 2884} {"train_loss": -11.875953674316406, "global_step": 484610, "epoch": 2884} {"train_loss": -12.542142868041992, "global_step": 484611, "epoch": 2884} {"train_loss": -12.045839309692383, "global_step": 484612, "epoch": 2884} {"train_loss": -12.649221420288086, "global_step": 484613, "epoch": 2884} {"train_loss": -11.847756385803223, "global_step": 484614, "epoch": 2884} {"train_loss": -11.964115142822266, "global_step": 484615, "epoch": 2884} {"train_loss": -12.42131519317627, "global_step": 484616, "epoch": 2884} {"train_loss": -11.39350414276123, "global_step": 484617, "epoch": 2884} {"train_loss": -12.081280708312988, "global_step": 484618, "epoch": 2884} {"train_loss": -11.480300903320312, "global_step": 484619, "epoch": 2884} {"train_loss": -12.33005142211914, "global_step": 484620, "epoch": 2884} {"train_loss": -11.77138614654541, "global_step": 484621, "epoch": 2884} {"train_loss": -12.358689308166504, "global_step": 484622, "epoch": 2884} {"train_loss": -12.694482803344727, "global_step": 484623, "epoch": 2884} {"train_loss": -11.674324035644531, "global_step": 484624, "epoch": 2884} {"train_loss": -12.192415237426758, "global_step": 484625, "epoch": 2884} {"train_loss": -12.032257080078125, "global_step": 484626, "epoch": 2884} {"train_loss": -11.223831176757812, "global_step": 484627, "epoch": 2884} {"train_loss": -11.891417503356934, "global_step": 484628, "epoch": 2884} {"train_loss": -12.212113380432129, "global_step": 484629, "epoch": 2884} {"train_loss": -11.269821166992188, "global_step": 484630, "epoch": 2884} {"train_loss": -12.566399574279785, "global_step": 484631, "epoch": 2884} {"train_loss": -11.903366088867188, "global_step": 484632, "epoch": 2884} {"train_loss": -12.306519508361816, "global_step": 484633, "epoch": 2884} {"train_loss": -12.146328926086426, "global_step": 484634, "epoch": 2884} {"train_loss": -11.97561264038086, "global_step": 484635, "epoch": 2884} {"train_loss": -12.494213104248047, "global_step": 484636, "epoch": 2884} {"train_loss": -12.230659484863281, "global_step": 484637, "epoch": 2884} {"train_loss": -12.509478569030762, "global_step": 484638, "epoch": 2884} {"train_loss": -12.393320083618164, "global_step": 484639, "epoch": 2884} {"train_loss": -12.318380355834961, "global_step": 484640, "epoch": 2884} {"train_loss": -12.739128112792969, "global_step": 484641, "epoch": 2884} {"train_loss": -12.181934356689453, "global_step": 484642, "epoch": 2884} {"train_loss": -12.567753791809082, "global_step": 484643, "epoch": 2884} {"train_loss": -12.584973335266113, "global_step": 484644, "epoch": 2884} {"train_loss": -12.314041137695312, "global_step": 484645, "epoch": 2884} {"train_loss": -12.516263961791992, "global_step": 484646, "epoch": 2884} {"train_loss": -12.039652824401855, "global_step": 484647, "epoch": 2884} {"train_loss": -12.091514587402344, "global_step": 484648, "epoch": 2884} {"train_loss": -12.360031127929688, "global_step": 484649, "epoch": 2884} {"train_loss": -12.330488204956055, "global_step": 484650, "epoch": 2884} {"train_loss": -12.435529708862305, "global_step": 484651, "epoch": 2884} {"train_loss": -12.697189331054688, "global_step": 484652, "epoch": 2884} {"train_loss": -12.187148094177246, "global_step": 484653, "epoch": 2884} {"train_loss": -11.869588851928711, "global_step": 484654, "epoch": 2884} {"train_loss": -12.836095809936523, "global_step": 484655, "epoch": 2884} {"train_loss": -12.134279251098633, "global_step": 484656, "epoch": 2884} {"train_loss": -12.767426490783691, "global_step": 484657, "epoch": 2884} {"train_loss": -12.780720710754395, "global_step": 484658, "epoch": 2884} {"train_loss": -12.279946327209473, "global_step": 484659, "epoch": 2884} {"train_loss": -12.845077514648438, "global_step": 484660, "epoch": 2884} {"train_loss": -12.172046661376953, "global_step": 484661, "epoch": 2884} {"train_loss": -12.75709342956543, "global_step": 484662, "epoch": 2884} {"train_loss": -12.500608444213867, "global_step": 484663, "epoch": 2884} {"train_loss": -12.529436111450195, "global_step": 484664, "epoch": 2884} {"train_loss": -12.673373222351074, "global_step": 484665, "epoch": 2884} {"train_loss": -12.400397300720215, "global_step": 484666, "epoch": 2884} {"train_loss": -12.672883987426758, "global_step": 484667, "epoch": 2884} {"train_loss": -12.473024368286133, "global_step": 484668, "epoch": 2884} {"train_loss": -12.387829780578613, "global_step": 484669, "epoch": 2884} {"train_loss": -12.923870086669922, "global_step": 484670, "epoch": 2884} {"train_loss": -12.45949935913086, "global_step": 484671, "epoch": 2884} {"train_loss": -12.720210075378418, "global_step": 484672, "epoch": 2884} {"train_loss": -12.723265647888184, "global_step": 484673, "epoch": 2884} {"train_loss": -12.584661483764648, "global_step": 484674, "epoch": 2884} {"train_loss": -12.818915367126465, "global_step": 484675, "epoch": 2884} {"train_loss": -12.571155548095703, "global_step": 484676, "epoch": 2884} {"train_loss": -12.49859619140625, "global_step": 484677, "epoch": 2884} {"train_loss": -12.64234733581543, "global_step": 484678, "epoch": 2884} {"train_loss": -12.32899078301021, "global_step": 484679, "epoch": 2884, "val_loss": 324228.6875} {"train_loss": -12.564582824707031, "global_step": 484680, "epoch": 2885} {"train_loss": -13.041356086730957, "global_step": 484681, "epoch": 2885} {"train_loss": -12.666800498962402, "global_step": 484682, "epoch": 2885} {"train_loss": -12.82094955444336, "global_step": 484683, "epoch": 2885} {"train_loss": -12.529155731201172, "global_step": 484684, "epoch": 2885} {"train_loss": -12.493268013000488, "global_step": 484685, "epoch": 2885} {"train_loss": -12.4729642868042, "global_step": 484686, "epoch": 2885} {"train_loss": -12.490818977355957, "global_step": 484687, "epoch": 2885} {"train_loss": -12.022274017333984, "global_step": 484688, "epoch": 2885} {"train_loss": -11.992534637451172, "global_step": 484689, "epoch": 2885} {"train_loss": -12.758630752563477, "global_step": 484690, "epoch": 2885} {"train_loss": -12.110572814941406, "global_step": 484691, "epoch": 2885} {"train_loss": -11.323270797729492, "global_step": 484692, "epoch": 2885} {"train_loss": -11.846572875976562, "global_step": 484693, "epoch": 2885} {"train_loss": -12.225921630859375, "global_step": 484694, "epoch": 2885} {"train_loss": -11.73253059387207, "global_step": 484695, "epoch": 2885} {"train_loss": -11.864853858947754, "global_step": 484696, "epoch": 2885} {"train_loss": -11.9126558303833, "global_step": 484697, "epoch": 2885} {"train_loss": -12.039915084838867, "global_step": 484698, "epoch": 2885} {"train_loss": -11.442035675048828, "global_step": 484699, "epoch": 2885} {"train_loss": -11.512242317199707, "global_step": 484700, "epoch": 2885} {"train_loss": -11.670639038085938, "global_step": 484701, "epoch": 2885} {"train_loss": -11.725845336914062, "global_step": 484702, "epoch": 2885} {"train_loss": -10.962867736816406, "global_step": 484703, "epoch": 2885} {"train_loss": -10.487876892089844, "global_step": 484704, "epoch": 2885} {"train_loss": -11.07874870300293, "global_step": 484705, "epoch": 2885} {"train_loss": -9.520486831665039, "global_step": 484706, "epoch": 2885} {"train_loss": -11.00527572631836, "global_step": 484707, "epoch": 2885} {"train_loss": -11.211902618408203, "global_step": 484708, "epoch": 2885} {"train_loss": -9.742866516113281, "global_step": 484709, "epoch": 2885} {"train_loss": -9.551206588745117, "global_step": 484710, "epoch": 2885} {"train_loss": -10.440109252929688, "global_step": 484711, "epoch": 2885} {"train_loss": -11.425537109375, "global_step": 484712, "epoch": 2885} {"train_loss": -9.172016143798828, "global_step": 484713, "epoch": 2885} {"train_loss": -9.515399932861328, "global_step": 484714, "epoch": 2885} {"train_loss": -11.205598831176758, "global_step": 484715, "epoch": 2885} {"train_loss": -7.304952144622803, "global_step": 484716, "epoch": 2885} {"train_loss": -9.01385498046875, "global_step": 484717, "epoch": 2885} {"train_loss": -11.10013198852539, "global_step": 484718, "epoch": 2885} {"train_loss": -9.779365539550781, "global_step": 484719, "epoch": 2885} {"train_loss": -10.242387771606445, "global_step": 484720, "epoch": 2885} {"train_loss": -10.917817115783691, "global_step": 484721, "epoch": 2885} {"train_loss": -11.151460647583008, "global_step": 484722, "epoch": 2885} {"train_loss": -9.924812316894531, "global_step": 484723, "epoch": 2885} {"train_loss": -12.3233060836792, "global_step": 484724, "epoch": 2885} {"train_loss": -11.080008506774902, "global_step": 484725, "epoch": 2885} {"train_loss": -11.488370895385742, "global_step": 484726, "epoch": 2885} {"train_loss": -11.65134048461914, "global_step": 484727, "epoch": 2885} {"train_loss": -11.245269775390625, "global_step": 484728, "epoch": 2885} {"train_loss": -11.564401626586914, "global_step": 484729, "epoch": 2885} {"train_loss": -11.433534622192383, "global_step": 484730, "epoch": 2885} {"train_loss": -11.63896369934082, "global_step": 484731, "epoch": 2885} {"train_loss": -12.132051467895508, "global_step": 484732, "epoch": 2885} {"train_loss": -12.065363883972168, "global_step": 484733, "epoch": 2885} {"train_loss": -12.251867294311523, "global_step": 484734, "epoch": 2885} {"train_loss": -11.780407905578613, "global_step": 484735, "epoch": 2885} {"train_loss": -11.854059219360352, "global_step": 484736, "epoch": 2885} {"train_loss": -11.739522933959961, "global_step": 484737, "epoch": 2885} {"train_loss": -12.299322128295898, "global_step": 484738, "epoch": 2885} {"train_loss": -11.936426162719727, "global_step": 484739, "epoch": 2885} {"train_loss": -11.939821243286133, "global_step": 484740, "epoch": 2885} {"train_loss": -12.139829635620117, "global_step": 484741, "epoch": 2885} {"train_loss": -12.208223342895508, "global_step": 484742, "epoch": 2885} {"train_loss": -12.402790069580078, "global_step": 484743, "epoch": 2885} {"train_loss": -12.059219360351562, "global_step": 484744, "epoch": 2885} {"train_loss": -12.4638671875, "global_step": 484745, "epoch": 2885} {"train_loss": -12.252975463867188, "global_step": 484746, "epoch": 2885} {"train_loss": -12.313444137573242, "global_step": 484747, "epoch": 2885} {"train_loss": -12.441385269165039, "global_step": 484748, "epoch": 2885} {"train_loss": -12.536449432373047, "global_step": 484749, "epoch": 2885} {"train_loss": -12.606578826904297, "global_step": 484750, "epoch": 2885} {"train_loss": -12.563632011413574, "global_step": 484751, "epoch": 2885} {"train_loss": -12.377326965332031, "global_step": 484752, "epoch": 2885} {"train_loss": -12.757819175720215, "global_step": 484753, "epoch": 2885} {"train_loss": -12.481203079223633, "global_step": 484754, "epoch": 2885} {"train_loss": -12.747533798217773, "global_step": 484755, "epoch": 2885} {"train_loss": -12.586898803710938, "global_step": 484756, "epoch": 2885} {"train_loss": -12.573409080505371, "global_step": 484757, "epoch": 2885} {"train_loss": -12.868552207946777, "global_step": 484758, "epoch": 2885} {"train_loss": -12.912327766418457, "global_step": 484759, "epoch": 2885} {"train_loss": -12.85101318359375, "global_step": 484760, "epoch": 2885} {"train_loss": -12.763063430786133, "global_step": 484761, "epoch": 2885} {"train_loss": -12.837196350097656, "global_step": 484762, "epoch": 2885} {"train_loss": -12.793746948242188, "global_step": 484763, "epoch": 2885} {"train_loss": -12.721074104309082, "global_step": 484764, "epoch": 2885} {"train_loss": -12.80887222290039, "global_step": 484765, "epoch": 2885} {"train_loss": -12.804807662963867, "global_step": 484766, "epoch": 2885} {"train_loss": -12.990402221679688, "global_step": 484767, "epoch": 2885} {"train_loss": -12.775613784790039, "global_step": 484768, "epoch": 2885} {"train_loss": -12.861577033996582, "global_step": 484769, "epoch": 2885} {"train_loss": -13.065940856933594, "global_step": 484770, "epoch": 2885} {"train_loss": -12.893067359924316, "global_step": 484771, "epoch": 2885} {"train_loss": -12.752321243286133, "global_step": 484772, "epoch": 2885} {"train_loss": -12.651466369628906, "global_step": 484773, "epoch": 2885} {"train_loss": -12.86785888671875, "global_step": 484774, "epoch": 2885} {"train_loss": -12.927274703979492, "global_step": 484775, "epoch": 2885} {"train_loss": -12.864287376403809, "global_step": 484776, "epoch": 2885} {"train_loss": -12.738340377807617, "global_step": 484777, "epoch": 2885} {"train_loss": -12.711867332458496, "global_step": 484778, "epoch": 2885} {"train_loss": -12.976295471191406, "global_step": 484779, "epoch": 2885} {"train_loss": -12.756662368774414, "global_step": 484780, "epoch": 2885} {"train_loss": -12.90947437286377, "global_step": 484781, "epoch": 2885} {"train_loss": -12.76244831085205, "global_step": 484782, "epoch": 2885} {"train_loss": -12.851980209350586, "global_step": 484783, "epoch": 2885} {"train_loss": -12.779369354248047, "global_step": 484784, "epoch": 2885} {"train_loss": -12.727333068847656, "global_step": 484785, "epoch": 2885} {"train_loss": -12.595598220825195, "global_step": 484786, "epoch": 2885} {"train_loss": -12.502099990844727, "global_step": 484787, "epoch": 2885} {"train_loss": -12.826787948608398, "global_step": 484788, "epoch": 2885} {"train_loss": -12.13092041015625, "global_step": 484789, "epoch": 2885} {"train_loss": -12.732020378112793, "global_step": 484790, "epoch": 2885} {"train_loss": -12.145936012268066, "global_step": 484791, "epoch": 2885} {"train_loss": -12.623380661010742, "global_step": 484792, "epoch": 2885} {"train_loss": -12.232070922851562, "global_step": 484793, "epoch": 2885} {"train_loss": -12.268774032592773, "global_step": 484794, "epoch": 2885} {"train_loss": -12.728032112121582, "global_step": 484795, "epoch": 2885} {"train_loss": -12.182662963867188, "global_step": 484796, "epoch": 2885} {"train_loss": -12.554728507995605, "global_step": 484797, "epoch": 2885} {"train_loss": -12.628888130187988, "global_step": 484798, "epoch": 2885} {"train_loss": -12.380197525024414, "global_step": 484799, "epoch": 2885} {"train_loss": -12.267053604125977, "global_step": 484800, "epoch": 2885} {"train_loss": -12.190805435180664, "global_step": 484801, "epoch": 2885} {"train_loss": -12.898140907287598, "global_step": 484802, "epoch": 2885} {"train_loss": -12.514974594116211, "global_step": 484803, "epoch": 2885} {"train_loss": -12.839042663574219, "global_step": 484804, "epoch": 2885} {"train_loss": -12.517504692077637, "global_step": 484805, "epoch": 2885} {"train_loss": -12.370040893554688, "global_step": 484806, "epoch": 2885} {"train_loss": -12.411687850952148, "global_step": 484807, "epoch": 2885} {"train_loss": -12.722951889038086, "global_step": 484808, "epoch": 2885} {"train_loss": -12.860292434692383, "global_step": 484809, "epoch": 2885} {"train_loss": -12.697021484375, "global_step": 484810, "epoch": 2885} {"train_loss": -12.904975891113281, "global_step": 484811, "epoch": 2885} {"train_loss": -12.735115051269531, "global_step": 484812, "epoch": 2885} {"train_loss": -12.733141899108887, "global_step": 484813, "epoch": 2885} {"train_loss": -12.969429016113281, "global_step": 484814, "epoch": 2885} {"train_loss": -12.581220626831055, "global_step": 484815, "epoch": 2885} {"train_loss": -12.833003997802734, "global_step": 484816, "epoch": 2885} {"train_loss": -12.858772277832031, "global_step": 484817, "epoch": 2885} {"train_loss": -12.660600662231445, "global_step": 484818, "epoch": 2885} {"train_loss": -12.712970733642578, "global_step": 484819, "epoch": 2885} {"train_loss": -12.31807804107666, "global_step": 484820, "epoch": 2885} {"train_loss": -12.904205322265625, "global_step": 484821, "epoch": 2885} {"train_loss": -12.786161422729492, "global_step": 484822, "epoch": 2885} {"train_loss": -12.416016578674316, "global_step": 484823, "epoch": 2885} {"train_loss": -12.732884407043457, "global_step": 484824, "epoch": 2885} {"train_loss": -12.551482200622559, "global_step": 484825, "epoch": 2885} {"train_loss": -11.874320030212402, "global_step": 484826, "epoch": 2885} {"train_loss": -12.912109375, "global_step": 484827, "epoch": 2885} {"train_loss": -12.305465698242188, "global_step": 484828, "epoch": 2885} {"train_loss": -11.40477180480957, "global_step": 484829, "epoch": 2885} {"train_loss": -11.595918655395508, "global_step": 484830, "epoch": 2885} {"train_loss": -12.449834823608398, "global_step": 484831, "epoch": 2885} {"train_loss": -11.275096893310547, "global_step": 484832, "epoch": 2885} {"train_loss": -10.501317977905273, "global_step": 484833, "epoch": 2885} {"train_loss": -12.450372695922852, "global_step": 484834, "epoch": 2885} {"train_loss": -11.491697311401367, "global_step": 484835, "epoch": 2885} {"train_loss": -9.614954948425293, "global_step": 484836, "epoch": 2885} {"train_loss": -12.086987495422363, "global_step": 484837, "epoch": 2885} {"train_loss": -6.795825481414795, "global_step": 484838, "epoch": 2885} {"train_loss": -9.512333869934082, "global_step": 484839, "epoch": 2885} {"train_loss": -10.864917755126953, "global_step": 484840, "epoch": 2885} {"train_loss": -8.69647216796875, "global_step": 484841, "epoch": 2885} {"train_loss": -11.848350524902344, "global_step": 484842, "epoch": 2885} {"train_loss": -11.039285659790039, "global_step": 484843, "epoch": 2885} {"train_loss": -10.950034141540527, "global_step": 484844, "epoch": 2885} {"train_loss": -12.111895561218262, "global_step": 484845, "epoch": 2885} {"train_loss": -10.494214057922363, "global_step": 484846, "epoch": 2885} {"train_loss": -11.978053740092687, "global_step": 484847, "epoch": 2885, "val_loss": 312229.625, "train_action_mse_error": 2.4698824882507324} {"train_loss": -11.03756332397461, "global_step": 484848, "epoch": 2886} {"train_loss": -12.08564567565918, "global_step": 484849, "epoch": 2886} {"train_loss": -11.376739501953125, "global_step": 484850, "epoch": 2886} {"train_loss": -12.312435150146484, "global_step": 484851, "epoch": 2886} {"train_loss": -11.993135452270508, "global_step": 484852, "epoch": 2886} {"train_loss": -12.088008880615234, "global_step": 484853, "epoch": 2886} {"train_loss": -12.465730667114258, "global_step": 484854, "epoch": 2886} {"train_loss": -12.00649642944336, "global_step": 484855, "epoch": 2886} {"train_loss": -12.021568298339844, "global_step": 484856, "epoch": 2886} {"train_loss": -12.179336547851562, "global_step": 484857, "epoch": 2886} {"train_loss": -11.859943389892578, "global_step": 484858, "epoch": 2886} {"train_loss": -12.382719039916992, "global_step": 484859, "epoch": 2886} {"train_loss": -11.813741683959961, "global_step": 484860, "epoch": 2886} {"train_loss": -12.275762557983398, "global_step": 484861, "epoch": 2886} {"train_loss": -11.796887397766113, "global_step": 484862, "epoch": 2886} {"train_loss": -12.572120666503906, "global_step": 484863, "epoch": 2886} {"train_loss": -12.110298156738281, "global_step": 484864, "epoch": 2886} {"train_loss": -12.350014686584473, "global_step": 484865, "epoch": 2886} {"train_loss": -11.434311866760254, "global_step": 484866, "epoch": 2886} {"train_loss": -12.596378326416016, "global_step": 484867, "epoch": 2886} {"train_loss": -11.808759689331055, "global_step": 484868, "epoch": 2886} {"train_loss": -12.653064727783203, "global_step": 484869, "epoch": 2886} {"train_loss": -11.727145195007324, "global_step": 484870, "epoch": 2886} {"train_loss": -12.557538032531738, "global_step": 484871, "epoch": 2886} {"train_loss": -12.181992530822754, "global_step": 484872, "epoch": 2886} {"train_loss": -12.158906936645508, "global_step": 484873, "epoch": 2886} {"train_loss": -12.284175872802734, "global_step": 484874, "epoch": 2886} {"train_loss": -12.345614433288574, "global_step": 484875, "epoch": 2886} {"train_loss": -12.465301513671875, "global_step": 484876, "epoch": 2886} {"train_loss": -12.263524055480957, "global_step": 484877, "epoch": 2886} {"train_loss": -12.61691665649414, "global_step": 484878, "epoch": 2886} {"train_loss": -12.571914672851562, "global_step": 484879, "epoch": 2886} {"train_loss": -12.427106857299805, "global_step": 484880, "epoch": 2886} {"train_loss": -12.522950172424316, "global_step": 484881, "epoch": 2886} {"train_loss": -12.609800338745117, "global_step": 484882, "epoch": 2886} {"train_loss": -12.603261947631836, "global_step": 484883, "epoch": 2886} {"train_loss": -12.434796333312988, "global_step": 484884, "epoch": 2886} {"train_loss": -12.616582870483398, "global_step": 484885, "epoch": 2886} {"train_loss": -12.141901969909668, "global_step": 484886, "epoch": 2886} {"train_loss": -12.201364517211914, "global_step": 484887, "epoch": 2886} {"train_loss": -12.698873519897461, "global_step": 484888, "epoch": 2886} {"train_loss": -11.91561508178711, "global_step": 484889, "epoch": 2886} {"train_loss": -12.769838333129883, "global_step": 484890, "epoch": 2886} {"train_loss": -12.267887115478516, "global_step": 484891, "epoch": 2886} {"train_loss": -12.612560272216797, "global_step": 484892, "epoch": 2886} {"train_loss": -12.611799240112305, "global_step": 484893, "epoch": 2886} {"train_loss": -12.651291847229004, "global_step": 484894, "epoch": 2886} {"train_loss": -12.679632186889648, "global_step": 484895, "epoch": 2886} {"train_loss": -12.481069564819336, "global_step": 484896, "epoch": 2886} {"train_loss": -12.348587036132812, "global_step": 484897, "epoch": 2886} {"train_loss": -12.383079528808594, "global_step": 484898, "epoch": 2886} {"train_loss": -12.51028060913086, "global_step": 484899, "epoch": 2886} {"train_loss": -12.733844757080078, "global_step": 484900, "epoch": 2886} {"train_loss": -12.346969604492188, "global_step": 484901, "epoch": 2886} {"train_loss": -12.640349388122559, "global_step": 484902, "epoch": 2886} {"train_loss": -12.2647705078125, "global_step": 484903, "epoch": 2886} {"train_loss": -12.652339935302734, "global_step": 484904, "epoch": 2886} {"train_loss": -12.324581146240234, "global_step": 484905, "epoch": 2886} {"train_loss": -12.802696228027344, "global_step": 484906, "epoch": 2886} {"train_loss": -12.379137992858887, "global_step": 484907, "epoch": 2886} {"train_loss": -12.642707824707031, "global_step": 484908, "epoch": 2886} {"train_loss": -12.709532737731934, "global_step": 484909, "epoch": 2886} {"train_loss": -12.376636505126953, "global_step": 484910, "epoch": 2886} {"train_loss": -12.664285659790039, "global_step": 484911, "epoch": 2886} {"train_loss": -12.441473007202148, "global_step": 484912, "epoch": 2886} {"train_loss": -12.875775337219238, "global_step": 484913, "epoch": 2886} {"train_loss": -12.619778633117676, "global_step": 484914, "epoch": 2886} {"train_loss": -12.857857704162598, "global_step": 484915, "epoch": 2886} {"train_loss": -12.737953186035156, "global_step": 484916, "epoch": 2886} {"train_loss": -12.68912410736084, "global_step": 484917, "epoch": 2886} {"train_loss": -12.758440971374512, "global_step": 484918, "epoch": 2886} {"train_loss": -12.734724044799805, "global_step": 484919, "epoch": 2886} {"train_loss": -12.742597579956055, "global_step": 484920, "epoch": 2886} {"train_loss": -12.818004608154297, "global_step": 484921, "epoch": 2886} {"train_loss": -12.744266510009766, "global_step": 484922, "epoch": 2886} {"train_loss": -12.776473999023438, "global_step": 484923, "epoch": 2886} {"train_loss": -12.738333702087402, "global_step": 484924, "epoch": 2886} {"train_loss": -12.976448059082031, "global_step": 484925, "epoch": 2886} {"train_loss": -12.688285827636719, "global_step": 484926, "epoch": 2886} {"train_loss": -13.073685646057129, "global_step": 484927, "epoch": 2886} {"train_loss": -12.84933853149414, "global_step": 484928, "epoch": 2886} {"train_loss": -13.025949478149414, "global_step": 484929, "epoch": 2886} {"train_loss": -12.68332290649414, "global_step": 484930, "epoch": 2886} {"train_loss": -12.880487442016602, "global_step": 484931, "epoch": 2886} {"train_loss": -12.680416107177734, "global_step": 484932, "epoch": 2886} {"train_loss": -12.746858596801758, "global_step": 484933, "epoch": 2886} {"train_loss": -12.769876480102539, "global_step": 484934, "epoch": 2886} {"train_loss": -13.014299392700195, "global_step": 484935, "epoch": 2886} {"train_loss": -12.839299201965332, "global_step": 484936, "epoch": 2886} {"train_loss": -12.862062454223633, "global_step": 484937, "epoch": 2886} {"train_loss": -12.945011138916016, "global_step": 484938, "epoch": 2886} {"train_loss": -12.846677780151367, "global_step": 484939, "epoch": 2886} {"train_loss": -12.779314994812012, "global_step": 484940, "epoch": 2886} {"train_loss": -12.79128646850586, "global_step": 484941, "epoch": 2886} {"train_loss": -12.822309494018555, "global_step": 484942, "epoch": 2886} {"train_loss": -12.64599323272705, "global_step": 484943, "epoch": 2886} {"train_loss": -12.853069305419922, "global_step": 484944, "epoch": 2886} {"train_loss": -12.883733749389648, "global_step": 484945, "epoch": 2886} {"train_loss": -12.244146347045898, "global_step": 484946, "epoch": 2886} {"train_loss": -11.820898056030273, "global_step": 484947, "epoch": 2886} {"train_loss": -12.674478530883789, "global_step": 484948, "epoch": 2886} {"train_loss": -12.042506217956543, "global_step": 484949, "epoch": 2886} {"train_loss": -10.397981643676758, "global_step": 484950, "epoch": 2886} {"train_loss": -11.750598907470703, "global_step": 484951, "epoch": 2886} {"train_loss": -12.956780433654785, "global_step": 484952, "epoch": 2886} {"train_loss": -12.774170875549316, "global_step": 484953, "epoch": 2886} {"train_loss": -12.177743911743164, "global_step": 484954, "epoch": 2886} {"train_loss": -12.46219539642334, "global_step": 484955, "epoch": 2886} {"train_loss": -12.65135383605957, "global_step": 484956, "epoch": 2886} {"train_loss": -12.510255813598633, "global_step": 484957, "epoch": 2886} {"train_loss": -12.221171379089355, "global_step": 484958, "epoch": 2886} {"train_loss": -12.095436096191406, "global_step": 484959, "epoch": 2886} {"train_loss": -11.587486267089844, "global_step": 484960, "epoch": 2886} {"train_loss": -11.979569435119629, "global_step": 484961, "epoch": 2886} {"train_loss": -12.459720611572266, "global_step": 484962, "epoch": 2886} {"train_loss": -12.480905532836914, "global_step": 484963, "epoch": 2886} {"train_loss": -12.657339096069336, "global_step": 484964, "epoch": 2886} {"train_loss": -12.692729949951172, "global_step": 484965, "epoch": 2886} {"train_loss": -12.872709274291992, "global_step": 484966, "epoch": 2886} {"train_loss": -12.778257369995117, "global_step": 484967, "epoch": 2886} {"train_loss": -12.85637092590332, "global_step": 484968, "epoch": 2886} {"train_loss": -12.723016738891602, "global_step": 484969, "epoch": 2886} {"train_loss": -12.855755805969238, "global_step": 484970, "epoch": 2886} {"train_loss": -12.851263046264648, "global_step": 484971, "epoch": 2886} {"train_loss": -12.560707092285156, "global_step": 484972, "epoch": 2886} {"train_loss": -12.855973243713379, "global_step": 484973, "epoch": 2886} {"train_loss": -12.630000114440918, "global_step": 484974, "epoch": 2886} {"train_loss": -12.87114143371582, "global_step": 484975, "epoch": 2886} {"train_loss": -12.245437622070312, "global_step": 484976, "epoch": 2886} {"train_loss": -12.591367721557617, "global_step": 484977, "epoch": 2886} {"train_loss": -12.951970100402832, "global_step": 484978, "epoch": 2886} {"train_loss": -12.879258155822754, "global_step": 484979, "epoch": 2886} {"train_loss": -12.888579368591309, "global_step": 484980, "epoch": 2886} {"train_loss": -12.717671394348145, "global_step": 484981, "epoch": 2886} {"train_loss": -12.811843872070312, "global_step": 484982, "epoch": 2886} {"train_loss": -12.951181411743164, "global_step": 484983, "epoch": 2886} {"train_loss": -12.981826782226562, "global_step": 484984, "epoch": 2886} {"train_loss": -12.768206596374512, "global_step": 484985, "epoch": 2886} {"train_loss": -12.646492004394531, "global_step": 484986, "epoch": 2886} {"train_loss": -12.869564056396484, "global_step": 484987, "epoch": 2886} {"train_loss": -12.755011558532715, "global_step": 484988, "epoch": 2886} {"train_loss": -12.468843460083008, "global_step": 484989, "epoch": 2886} {"train_loss": -12.869430541992188, "global_step": 484990, "epoch": 2886} {"train_loss": -12.456161499023438, "global_step": 484991, "epoch": 2886} {"train_loss": -12.770334243774414, "global_step": 484992, "epoch": 2886} {"train_loss": -12.636258125305176, "global_step": 484993, "epoch": 2886} {"train_loss": -12.709736824035645, "global_step": 484994, "epoch": 2886} {"train_loss": -12.60867691040039, "global_step": 484995, "epoch": 2886} {"train_loss": -12.958843231201172, "global_step": 484996, "epoch": 2886} {"train_loss": -12.886579513549805, "global_step": 484997, "epoch": 2886} {"train_loss": -12.953374862670898, "global_step": 484998, "epoch": 2886} {"train_loss": -12.919743537902832, "global_step": 484999, "epoch": 2886} {"train_loss": -12.35860824584961, "global_step": 485000, "epoch": 2886} {"train_loss": -12.668741226196289, "global_step": 485001, "epoch": 2886} {"train_loss": -12.386302947998047, "global_step": 485002, "epoch": 2886} {"train_loss": -11.734992980957031, "global_step": 485003, "epoch": 2886} {"train_loss": -12.340953826904297, "global_step": 485004, "epoch": 2886} {"train_loss": -12.489328384399414, "global_step": 485005, "epoch": 2886} {"train_loss": -12.371369361877441, "global_step": 485006, "epoch": 2886} {"train_loss": -12.083645820617676, "global_step": 485007, "epoch": 2886} {"train_loss": -12.614127159118652, "global_step": 485008, "epoch": 2886} {"train_loss": -12.578985214233398, "global_step": 485009, "epoch": 2886} {"train_loss": -12.815542221069336, "global_step": 485010, "epoch": 2886} {"train_loss": -12.523101806640625, "global_step": 485011, "epoch": 2886} {"train_loss": -12.182832717895508, "global_step": 485012, "epoch": 2886} {"train_loss": -12.357343673706055, "global_step": 485013, "epoch": 2886} {"train_loss": -12.296700477600098, "global_step": 485014, "epoch": 2886} {"train_loss": -12.502839008967081, "global_step": 485015, "epoch": 2886, "val_loss": 311538.46875} {"train_loss": -11.960002899169922, "global_step": 485016, "epoch": 2887} {"train_loss": -12.023050308227539, "global_step": 485017, "epoch": 2887} {"train_loss": -11.802118301391602, "global_step": 485018, "epoch": 2887} {"train_loss": -11.8907470703125, "global_step": 485019, "epoch": 2887} {"train_loss": -12.509251594543457, "global_step": 485020, "epoch": 2887} {"train_loss": -11.605062484741211, "global_step": 485021, "epoch": 2887} {"train_loss": -12.59781551361084, "global_step": 485022, "epoch": 2887} {"train_loss": -11.824471473693848, "global_step": 485023, "epoch": 2887} {"train_loss": -12.046825408935547, "global_step": 485024, "epoch": 2887} {"train_loss": -10.788848876953125, "global_step": 485025, "epoch": 2887} {"train_loss": -11.647205352783203, "global_step": 485026, "epoch": 2887} {"train_loss": -11.636537551879883, "global_step": 485027, "epoch": 2887} {"train_loss": -12.03389835357666, "global_step": 485028, "epoch": 2887} {"train_loss": -10.893463134765625, "global_step": 485029, "epoch": 2887} {"train_loss": -11.939128875732422, "global_step": 485030, "epoch": 2887} {"train_loss": -10.750042915344238, "global_step": 485031, "epoch": 2887} {"train_loss": -10.133329391479492, "global_step": 485032, "epoch": 2887} {"train_loss": -11.870967864990234, "global_step": 485033, "epoch": 2887} {"train_loss": -10.483226776123047, "global_step": 485034, "epoch": 2887} {"train_loss": -9.264963150024414, "global_step": 485035, "epoch": 2887} {"train_loss": -11.887746810913086, "global_step": 485036, "epoch": 2887} {"train_loss": -9.697595596313477, "global_step": 485037, "epoch": 2887} {"train_loss": -9.509750366210938, "global_step": 485038, "epoch": 2887} {"train_loss": -11.022027969360352, "global_step": 485039, "epoch": 2887} {"train_loss": -11.31928539276123, "global_step": 485040, "epoch": 2887} {"train_loss": -11.098608016967773, "global_step": 485041, "epoch": 2887} {"train_loss": -12.034832000732422, "global_step": 485042, "epoch": 2887} {"train_loss": -10.920635223388672, "global_step": 485043, "epoch": 2887} {"train_loss": -11.419380187988281, "global_step": 485044, "epoch": 2887} {"train_loss": -11.794655799865723, "global_step": 485045, "epoch": 2887} {"train_loss": -10.796404838562012, "global_step": 485046, "epoch": 2887} {"train_loss": -11.712604522705078, "global_step": 485047, "epoch": 2887} {"train_loss": -12.127168655395508, "global_step": 485048, "epoch": 2887} {"train_loss": -10.745746612548828, "global_step": 485049, "epoch": 2887} {"train_loss": -12.000648498535156, "global_step": 485050, "epoch": 2887} {"train_loss": -10.768898010253906, "global_step": 485051, "epoch": 2887} {"train_loss": -11.607818603515625, "global_step": 485052, "epoch": 2887} {"train_loss": -11.791611671447754, "global_step": 485053, "epoch": 2887} {"train_loss": -11.886959075927734, "global_step": 485054, "epoch": 2887} {"train_loss": -12.082324981689453, "global_step": 485055, "epoch": 2887} {"train_loss": -11.658873558044434, "global_step": 485056, "epoch": 2887} {"train_loss": -11.22026252746582, "global_step": 485057, "epoch": 2887} {"train_loss": -11.888470649719238, "global_step": 485058, "epoch": 2887} {"train_loss": -11.300840377807617, "global_step": 485059, "epoch": 2887} {"train_loss": -10.351648330688477, "global_step": 485060, "epoch": 2887} {"train_loss": -12.286677360534668, "global_step": 485061, "epoch": 2887} {"train_loss": -10.586139678955078, "global_step": 485062, "epoch": 2887} {"train_loss": -12.073522567749023, "global_step": 485063, "epoch": 2887} {"train_loss": -11.796012878417969, "global_step": 485064, "epoch": 2887} {"train_loss": -11.352831840515137, "global_step": 485065, "epoch": 2887} {"train_loss": -11.862299919128418, "global_step": 485066, "epoch": 2887} {"train_loss": -11.642729759216309, "global_step": 485067, "epoch": 2887} {"train_loss": -12.011677742004395, "global_step": 485068, "epoch": 2887} {"train_loss": -11.477495193481445, "global_step": 485069, "epoch": 2887} {"train_loss": -12.162830352783203, "global_step": 485070, "epoch": 2887} {"train_loss": -11.844375610351562, "global_step": 485071, "epoch": 2887} {"train_loss": -12.414146423339844, "global_step": 485072, "epoch": 2887} {"train_loss": -11.718498229980469, "global_step": 485073, "epoch": 2887} {"train_loss": -12.600896835327148, "global_step": 485074, "epoch": 2887} {"train_loss": -11.960132598876953, "global_step": 485075, "epoch": 2887} {"train_loss": -12.269111633300781, "global_step": 485076, "epoch": 2887} {"train_loss": -11.926788330078125, "global_step": 485077, "epoch": 2887} {"train_loss": -12.042488098144531, "global_step": 485078, "epoch": 2887} {"train_loss": -12.018826484680176, "global_step": 485079, "epoch": 2887} {"train_loss": -11.916449546813965, "global_step": 485080, "epoch": 2887} {"train_loss": -12.389924049377441, "global_step": 485081, "epoch": 2887} {"train_loss": -11.740447998046875, "global_step": 485082, "epoch": 2887} {"train_loss": -12.310135841369629, "global_step": 485083, "epoch": 2887} {"train_loss": -12.14493179321289, "global_step": 485084, "epoch": 2887} {"train_loss": -12.161376953125, "global_step": 485085, "epoch": 2887} {"train_loss": -12.440939903259277, "global_step": 485086, "epoch": 2887} {"train_loss": -12.07238483428955, "global_step": 485087, "epoch": 2887} {"train_loss": -12.54830265045166, "global_step": 485088, "epoch": 2887} {"train_loss": -12.540153503417969, "global_step": 485089, "epoch": 2887} {"train_loss": -12.38133716583252, "global_step": 485090, "epoch": 2887} {"train_loss": -12.447306632995605, "global_step": 485091, "epoch": 2887} {"train_loss": -12.41485595703125, "global_step": 485092, "epoch": 2887} {"train_loss": -12.722383499145508, "global_step": 485093, "epoch": 2887} {"train_loss": -12.587236404418945, "global_step": 485094, "epoch": 2887} {"train_loss": -12.487129211425781, "global_step": 485095, "epoch": 2887} {"train_loss": -12.607912063598633, "global_step": 485096, "epoch": 2887} {"train_loss": -12.606084823608398, "global_step": 485097, "epoch": 2887} {"train_loss": -12.474028587341309, "global_step": 485098, "epoch": 2887} {"train_loss": -12.658935546875, "global_step": 485099, "epoch": 2887} {"train_loss": -12.761253356933594, "global_step": 485100, "epoch": 2887} {"train_loss": -12.629219055175781, "global_step": 485101, "epoch": 2887} {"train_loss": -12.626506805419922, "global_step": 485102, "epoch": 2887} {"train_loss": -12.706717491149902, "global_step": 485103, "epoch": 2887} {"train_loss": -12.803183555603027, "global_step": 485104, "epoch": 2887} {"train_loss": -12.639877319335938, "global_step": 485105, "epoch": 2887} {"train_loss": -12.864310264587402, "global_step": 485106, "epoch": 2887} {"train_loss": -12.787115097045898, "global_step": 485107, "epoch": 2887} {"train_loss": -12.412595748901367, "global_step": 485108, "epoch": 2887} {"train_loss": -12.708558082580566, "global_step": 485109, "epoch": 2887} {"train_loss": -12.650847434997559, "global_step": 485110, "epoch": 2887} {"train_loss": -12.673860549926758, "global_step": 485111, "epoch": 2887} {"train_loss": -12.786907196044922, "global_step": 485112, "epoch": 2887} {"train_loss": -12.81895923614502, "global_step": 485113, "epoch": 2887} {"train_loss": -12.706857681274414, "global_step": 485114, "epoch": 2887} {"train_loss": -12.742963790893555, "global_step": 485115, "epoch": 2887} {"train_loss": -12.838285446166992, "global_step": 485116, "epoch": 2887} {"train_loss": -12.722901344299316, "global_step": 485117, "epoch": 2887} {"train_loss": -12.882502555847168, "global_step": 485118, "epoch": 2887} {"train_loss": -12.852090835571289, "global_step": 485119, "epoch": 2887} {"train_loss": -12.910430908203125, "global_step": 485120, "epoch": 2887} {"train_loss": -12.717613220214844, "global_step": 485121, "epoch": 2887} {"train_loss": -12.786325454711914, "global_step": 485122, "epoch": 2887} {"train_loss": -12.834172248840332, "global_step": 485123, "epoch": 2887} {"train_loss": -12.824614524841309, "global_step": 485124, "epoch": 2887} {"train_loss": -12.759267807006836, "global_step": 485125, "epoch": 2887} {"train_loss": -12.828105926513672, "global_step": 485126, "epoch": 2887} {"train_loss": -12.810254096984863, "global_step": 485127, "epoch": 2887} {"train_loss": -12.762079238891602, "global_step": 485128, "epoch": 2887} {"train_loss": -13.097906112670898, "global_step": 485129, "epoch": 2887} {"train_loss": -12.988829612731934, "global_step": 485130, "epoch": 2887} {"train_loss": -12.913305282592773, "global_step": 485131, "epoch": 2887} {"train_loss": -13.013163566589355, "global_step": 485132, "epoch": 2887} {"train_loss": -12.997842788696289, "global_step": 485133, "epoch": 2887} {"train_loss": -12.637493133544922, "global_step": 485134, "epoch": 2887} {"train_loss": -12.963069915771484, "global_step": 485135, "epoch": 2887} {"train_loss": -12.786749839782715, "global_step": 485136, "epoch": 2887} {"train_loss": -12.638943672180176, "global_step": 485137, "epoch": 2887} {"train_loss": -13.031413078308105, "global_step": 485138, "epoch": 2887} {"train_loss": -12.964700698852539, "global_step": 485139, "epoch": 2887} {"train_loss": -12.983026504516602, "global_step": 485140, "epoch": 2887} {"train_loss": -12.917409896850586, "global_step": 485141, "epoch": 2887} {"train_loss": -13.048583984375, "global_step": 485142, "epoch": 2887} {"train_loss": -13.006532669067383, "global_step": 485143, "epoch": 2887} {"train_loss": -13.025585174560547, "global_step": 485144, "epoch": 2887} {"train_loss": -13.023691177368164, "global_step": 485145, "epoch": 2887} {"train_loss": -13.018888473510742, "global_step": 485146, "epoch": 2887} {"train_loss": -13.091259002685547, "global_step": 485147, "epoch": 2887} {"train_loss": -13.20820426940918, "global_step": 485148, "epoch": 2887} {"train_loss": -13.02060317993164, "global_step": 485149, "epoch": 2887} {"train_loss": -13.014188766479492, "global_step": 485150, "epoch": 2887} {"train_loss": -13.197668075561523, "global_step": 485151, "epoch": 2887} {"train_loss": -13.065055847167969, "global_step": 485152, "epoch": 2887} {"train_loss": -13.13941764831543, "global_step": 485153, "epoch": 2887} {"train_loss": -13.086997985839844, "global_step": 485154, "epoch": 2887} {"train_loss": -13.041654586791992, "global_step": 485155, "epoch": 2887} {"train_loss": -12.94066047668457, "global_step": 485156, "epoch": 2887} {"train_loss": -13.253063201904297, "global_step": 485157, "epoch": 2887} {"train_loss": -12.842854499816895, "global_step": 485158, "epoch": 2887} {"train_loss": -12.753915786743164, "global_step": 485159, "epoch": 2887} {"train_loss": -13.022263526916504, "global_step": 485160, "epoch": 2887} {"train_loss": -12.70244026184082, "global_step": 485161, "epoch": 2887} {"train_loss": -13.056038856506348, "global_step": 485162, "epoch": 2887} {"train_loss": -12.69595718383789, "global_step": 485163, "epoch": 2887} {"train_loss": -12.508203506469727, "global_step": 485164, "epoch": 2887} {"train_loss": -12.645973205566406, "global_step": 485165, "epoch": 2887} {"train_loss": -12.900612831115723, "global_step": 485166, "epoch": 2887} {"train_loss": -12.849136352539062, "global_step": 485167, "epoch": 2887} {"train_loss": -12.277339935302734, "global_step": 485168, "epoch": 2887} {"train_loss": -12.925578117370605, "global_step": 485169, "epoch": 2887} {"train_loss": -12.75965690612793, "global_step": 485170, "epoch": 2887} {"train_loss": -12.222128868103027, "global_step": 485171, "epoch": 2887} {"train_loss": -11.99308967590332, "global_step": 485172, "epoch": 2887} {"train_loss": -12.368880271911621, "global_step": 485173, "epoch": 2887} {"train_loss": -12.536795616149902, "global_step": 485174, "epoch": 2887} {"train_loss": -13.159896850585938, "global_step": 485175, "epoch": 2887} {"train_loss": -12.742350578308105, "global_step": 485176, "epoch": 2887} {"train_loss": -12.595081329345703, "global_step": 485177, "epoch": 2887} {"train_loss": -12.704458236694336, "global_step": 485178, "epoch": 2887} {"train_loss": -13.033817291259766, "global_step": 485179, "epoch": 2887} {"train_loss": -13.009727478027344, "global_step": 485180, "epoch": 2887} {"train_loss": -12.901799201965332, "global_step": 485181, "epoch": 2887} {"train_loss": -13.009469985961914, "global_step": 485182, "epoch": 2887} {"train_loss": -12.283367667879377, "global_step": 485183, "epoch": 2887, "val_loss": 313112.59375} {"train_loss": -11.609403610229492, "global_step": 485184, "epoch": 2888} {"train_loss": -10.333932876586914, "global_step": 485185, "epoch": 2888} {"train_loss": -11.072247505187988, "global_step": 485186, "epoch": 2888} {"train_loss": -12.443196296691895, "global_step": 485187, "epoch": 2888} {"train_loss": -8.888503074645996, "global_step": 485188, "epoch": 2888} {"train_loss": -9.402167320251465, "global_step": 485189, "epoch": 2888} {"train_loss": -8.64896297454834, "global_step": 485190, "epoch": 2888} {"train_loss": -10.129188537597656, "global_step": 485191, "epoch": 2888} {"train_loss": -10.062675476074219, "global_step": 485192, "epoch": 2888} {"train_loss": -11.059603691101074, "global_step": 485193, "epoch": 2888} {"train_loss": -9.691768646240234, "global_step": 485194, "epoch": 2888} {"train_loss": -10.324241638183594, "global_step": 485195, "epoch": 2888} {"train_loss": -11.53219985961914, "global_step": 485196, "epoch": 2888} {"train_loss": -9.33206558227539, "global_step": 485197, "epoch": 2888} {"train_loss": -10.714871406555176, "global_step": 485198, "epoch": 2888} {"train_loss": -9.43604564666748, "global_step": 485199, "epoch": 2888} {"train_loss": -8.354239463806152, "global_step": 485200, "epoch": 2888} {"train_loss": -10.941493034362793, "global_step": 485201, "epoch": 2888} {"train_loss": -7.831530570983887, "global_step": 485202, "epoch": 2888} {"train_loss": -7.466434955596924, "global_step": 485203, "epoch": 2888} {"train_loss": -8.821155548095703, "global_step": 485204, "epoch": 2888} {"train_loss": -9.879032135009766, "global_step": 485205, "epoch": 2888} {"train_loss": -8.320862770080566, "global_step": 485206, "epoch": 2888} {"train_loss": -10.458415985107422, "global_step": 485207, "epoch": 2888} {"train_loss": -9.713375091552734, "global_step": 485208, "epoch": 2888} {"train_loss": -10.396453857421875, "global_step": 485209, "epoch": 2888} {"train_loss": -9.248934745788574, "global_step": 485210, "epoch": 2888} {"train_loss": -11.143400192260742, "global_step": 485211, "epoch": 2888} {"train_loss": -9.888664245605469, "global_step": 485212, "epoch": 2888} {"train_loss": -10.377069473266602, "global_step": 485213, "epoch": 2888} {"train_loss": -11.597640991210938, "global_step": 485214, "epoch": 2888} {"train_loss": -11.058653831481934, "global_step": 485215, "epoch": 2888} {"train_loss": -11.286214828491211, "global_step": 485216, "epoch": 2888} {"train_loss": -11.628026962280273, "global_step": 485217, "epoch": 2888} {"train_loss": -11.237369537353516, "global_step": 485218, "epoch": 2888} {"train_loss": -11.667465209960938, "global_step": 485219, "epoch": 2888} {"train_loss": -12.1864013671875, "global_step": 485220, "epoch": 2888} {"train_loss": -12.030016899108887, "global_step": 485221, "epoch": 2888} {"train_loss": -12.325027465820312, "global_step": 485222, "epoch": 2888} {"train_loss": -11.85861587524414, "global_step": 485223, "epoch": 2888} {"train_loss": -12.38611888885498, "global_step": 485224, "epoch": 2888} {"train_loss": -12.143043518066406, "global_step": 485225, "epoch": 2888} {"train_loss": -12.364544868469238, "global_step": 485226, "epoch": 2888} {"train_loss": -12.458569526672363, "global_step": 485227, "epoch": 2888} {"train_loss": -12.223809242248535, "global_step": 485228, "epoch": 2888} {"train_loss": -12.345181465148926, "global_step": 485229, "epoch": 2888} {"train_loss": -12.073654174804688, "global_step": 485230, "epoch": 2888} {"train_loss": -12.281356811523438, "global_step": 485231, "epoch": 2888} {"train_loss": -12.319042205810547, "global_step": 485232, "epoch": 2888} {"train_loss": -12.369747161865234, "global_step": 485233, "epoch": 2888} {"train_loss": -12.173450469970703, "global_step": 485234, "epoch": 2888} {"train_loss": -12.159950256347656, "global_step": 485235, "epoch": 2888} {"train_loss": -12.452705383300781, "global_step": 485236, "epoch": 2888} {"train_loss": -12.543970108032227, "global_step": 485237, "epoch": 2888} {"train_loss": -12.319887161254883, "global_step": 485238, "epoch": 2888} {"train_loss": -12.37773323059082, "global_step": 485239, "epoch": 2888} {"train_loss": -12.48210334777832, "global_step": 485240, "epoch": 2888} {"train_loss": -12.437719345092773, "global_step": 485241, "epoch": 2888} {"train_loss": -12.430384635925293, "global_step": 485242, "epoch": 2888} {"train_loss": -12.495697975158691, "global_step": 485243, "epoch": 2888} {"train_loss": -12.595342636108398, "global_step": 485244, "epoch": 2888} {"train_loss": -12.419780731201172, "global_step": 485245, "epoch": 2888} {"train_loss": -12.54300308227539, "global_step": 485246, "epoch": 2888} {"train_loss": -12.44710922241211, "global_step": 485247, "epoch": 2888} {"train_loss": -12.555119514465332, "global_step": 485248, "epoch": 2888} {"train_loss": -12.489952087402344, "global_step": 485249, "epoch": 2888} {"train_loss": -12.478423118591309, "global_step": 485250, "epoch": 2888} {"train_loss": -12.565614700317383, "global_step": 485251, "epoch": 2888} {"train_loss": -12.496625900268555, "global_step": 485252, "epoch": 2888} {"train_loss": -12.731130599975586, "global_step": 485253, "epoch": 2888} {"train_loss": -12.668606758117676, "global_step": 485254, "epoch": 2888} {"train_loss": -12.677383422851562, "global_step": 485255, "epoch": 2888} {"train_loss": -12.548596382141113, "global_step": 485256, "epoch": 2888} {"train_loss": -12.65078353881836, "global_step": 485257, "epoch": 2888} {"train_loss": -12.545434951782227, "global_step": 485258, "epoch": 2888} {"train_loss": -12.578598022460938, "global_step": 485259, "epoch": 2888} {"train_loss": -12.609935760498047, "global_step": 485260, "epoch": 2888} {"train_loss": -12.538665771484375, "global_step": 485261, "epoch": 2888} {"train_loss": -12.33427619934082, "global_step": 485262, "epoch": 2888} {"train_loss": -12.634492874145508, "global_step": 485263, "epoch": 2888} {"train_loss": -12.497915267944336, "global_step": 485264, "epoch": 2888} {"train_loss": -12.689952850341797, "global_step": 485265, "epoch": 2888} {"train_loss": -12.666194915771484, "global_step": 485266, "epoch": 2888} {"train_loss": -12.46153450012207, "global_step": 485267, "epoch": 2888} {"train_loss": -12.473066329956055, "global_step": 485268, "epoch": 2888} {"train_loss": -12.665620803833008, "global_step": 485269, "epoch": 2888} {"train_loss": -12.543825149536133, "global_step": 485270, "epoch": 2888} {"train_loss": -12.552824974060059, "global_step": 485271, "epoch": 2888} {"train_loss": -12.477727890014648, "global_step": 485272, "epoch": 2888} {"train_loss": -11.894859313964844, "global_step": 485273, "epoch": 2888} {"train_loss": -12.554963111877441, "global_step": 485274, "epoch": 2888} {"train_loss": -12.165037155151367, "global_step": 485275, "epoch": 2888} {"train_loss": -12.210929870605469, "global_step": 485276, "epoch": 2888} {"train_loss": -12.308069229125977, "global_step": 485277, "epoch": 2888} {"train_loss": -11.979162216186523, "global_step": 485278, "epoch": 2888} {"train_loss": -12.34095573425293, "global_step": 485279, "epoch": 2888} {"train_loss": -12.50701904296875, "global_step": 485280, "epoch": 2888} {"train_loss": -12.144495010375977, "global_step": 485281, "epoch": 2888} {"train_loss": -12.405601501464844, "global_step": 485282, "epoch": 2888} {"train_loss": -12.466545104980469, "global_step": 485283, "epoch": 2888} {"train_loss": -12.602494239807129, "global_step": 485284, "epoch": 2888} {"train_loss": -12.00514030456543, "global_step": 485285, "epoch": 2888} {"train_loss": -12.660226821899414, "global_step": 485286, "epoch": 2888} {"train_loss": -12.487648010253906, "global_step": 485287, "epoch": 2888} {"train_loss": -12.266769409179688, "global_step": 485288, "epoch": 2888} {"train_loss": -12.78801155090332, "global_step": 485289, "epoch": 2888} {"train_loss": -12.170116424560547, "global_step": 485290, "epoch": 2888} {"train_loss": -12.298078536987305, "global_step": 485291, "epoch": 2888} {"train_loss": -12.487425804138184, "global_step": 485292, "epoch": 2888} {"train_loss": -12.178787231445312, "global_step": 485293, "epoch": 2888} {"train_loss": -11.925662994384766, "global_step": 485294, "epoch": 2888} {"train_loss": -12.459097862243652, "global_step": 485295, "epoch": 2888} {"train_loss": -12.230249404907227, "global_step": 485296, "epoch": 2888} {"train_loss": -10.424734115600586, "global_step": 485297, "epoch": 2888} {"train_loss": -12.516827583312988, "global_step": 485298, "epoch": 2888} {"train_loss": -11.235340118408203, "global_step": 485299, "epoch": 2888} {"train_loss": -11.475302696228027, "global_step": 485300, "epoch": 2888} {"train_loss": -11.995306015014648, "global_step": 485301, "epoch": 2888} {"train_loss": -11.648185729980469, "global_step": 485302, "epoch": 2888} {"train_loss": -11.532308578491211, "global_step": 485303, "epoch": 2888} {"train_loss": -11.5914888381958, "global_step": 485304, "epoch": 2888} {"train_loss": -11.992773056030273, "global_step": 485305, "epoch": 2888} {"train_loss": -11.649490356445312, "global_step": 485306, "epoch": 2888} {"train_loss": -12.658382415771484, "global_step": 485307, "epoch": 2888} {"train_loss": -12.22052001953125, "global_step": 485308, "epoch": 2888} {"train_loss": -12.32607650756836, "global_step": 485309, "epoch": 2888} {"train_loss": -12.09280776977539, "global_step": 485310, "epoch": 2888} {"train_loss": -12.372808456420898, "global_step": 485311, "epoch": 2888} {"train_loss": -12.288727760314941, "global_step": 485312, "epoch": 2888} {"train_loss": -12.413728713989258, "global_step": 485313, "epoch": 2888} {"train_loss": -12.16506290435791, "global_step": 485314, "epoch": 2888} {"train_loss": -12.467781066894531, "global_step": 485315, "epoch": 2888} {"train_loss": -12.166101455688477, "global_step": 485316, "epoch": 2888} {"train_loss": -11.509153366088867, "global_step": 485317, "epoch": 2888} {"train_loss": -12.498902320861816, "global_step": 485318, "epoch": 2888} {"train_loss": -11.92735481262207, "global_step": 485319, "epoch": 2888} {"train_loss": -11.865713119506836, "global_step": 485320, "epoch": 2888} {"train_loss": -12.274799346923828, "global_step": 485321, "epoch": 2888} {"train_loss": -11.602258682250977, "global_step": 485322, "epoch": 2888} {"train_loss": -12.565289497375488, "global_step": 485323, "epoch": 2888} {"train_loss": -12.11381721496582, "global_step": 485324, "epoch": 2888} {"train_loss": -12.038902282714844, "global_step": 485325, "epoch": 2888} {"train_loss": -12.634866714477539, "global_step": 485326, "epoch": 2888} {"train_loss": -11.912768363952637, "global_step": 485327, "epoch": 2888} {"train_loss": -12.527128219604492, "global_step": 485328, "epoch": 2888} {"train_loss": -12.389045715332031, "global_step": 485329, "epoch": 2888} {"train_loss": -12.311059951782227, "global_step": 485330, "epoch": 2888} {"train_loss": -12.679363250732422, "global_step": 485331, "epoch": 2888} {"train_loss": -12.246824264526367, "global_step": 485332, "epoch": 2888} {"train_loss": -12.705463409423828, "global_step": 485333, "epoch": 2888} {"train_loss": -12.513861656188965, "global_step": 485334, "epoch": 2888} {"train_loss": -12.642696380615234, "global_step": 485335, "epoch": 2888} {"train_loss": -12.455949783325195, "global_step": 485336, "epoch": 2888} {"train_loss": -12.516666412353516, "global_step": 485337, "epoch": 2888} {"train_loss": -12.24753189086914, "global_step": 485338, "epoch": 2888} {"train_loss": -12.486234664916992, "global_step": 485339, "epoch": 2888} {"train_loss": -12.697851181030273, "global_step": 485340, "epoch": 2888} {"train_loss": -12.611895561218262, "global_step": 485341, "epoch": 2888} {"train_loss": -12.290987014770508, "global_step": 485342, "epoch": 2888} {"train_loss": -12.694192886352539, "global_step": 485343, "epoch": 2888} {"train_loss": -12.387275695800781, "global_step": 485344, "epoch": 2888} {"train_loss": -12.11508846282959, "global_step": 485345, "epoch": 2888} {"train_loss": -12.657291412353516, "global_step": 485346, "epoch": 2888} {"train_loss": -12.524258613586426, "global_step": 485347, "epoch": 2888} {"train_loss": -12.495059967041016, "global_step": 485348, "epoch": 2888} {"train_loss": -12.711572647094727, "global_step": 485349, "epoch": 2888} {"train_loss": -12.66433334350586, "global_step": 485350, "epoch": 2888} {"train_loss": -11.866727184681665, "global_step": 485351, "epoch": 2888, "val_loss": 316686.03125} {"train_loss": -12.616480827331543, "global_step": 485352, "epoch": 2889} {"train_loss": -12.548763275146484, "global_step": 485353, "epoch": 2889} {"train_loss": -12.360862731933594, "global_step": 485354, "epoch": 2889} {"train_loss": -12.009475708007812, "global_step": 485355, "epoch": 2889} {"train_loss": -12.058895111083984, "global_step": 485356, "epoch": 2889} {"train_loss": -12.09823989868164, "global_step": 485357, "epoch": 2889} {"train_loss": -12.488393783569336, "global_step": 485358, "epoch": 2889} {"train_loss": -12.173734664916992, "global_step": 485359, "epoch": 2889} {"train_loss": -12.579435348510742, "global_step": 485360, "epoch": 2889} {"train_loss": -12.13117504119873, "global_step": 485361, "epoch": 2889} {"train_loss": -12.423686981201172, "global_step": 485362, "epoch": 2889} {"train_loss": -12.233409881591797, "global_step": 485363, "epoch": 2889} {"train_loss": -12.097234725952148, "global_step": 485364, "epoch": 2889} {"train_loss": -11.515484809875488, "global_step": 485365, "epoch": 2889} {"train_loss": -12.32150650024414, "global_step": 485366, "epoch": 2889} {"train_loss": -12.230716705322266, "global_step": 485367, "epoch": 2889} {"train_loss": -12.46621036529541, "global_step": 485368, "epoch": 2889} {"train_loss": -12.266372680664062, "global_step": 485369, "epoch": 2889} {"train_loss": -12.139158248901367, "global_step": 485370, "epoch": 2889} {"train_loss": -12.240160942077637, "global_step": 485371, "epoch": 2889} {"train_loss": -12.629268646240234, "global_step": 485372, "epoch": 2889} {"train_loss": -12.070636749267578, "global_step": 485373, "epoch": 2889} {"train_loss": -11.956168174743652, "global_step": 485374, "epoch": 2889} {"train_loss": -12.397863388061523, "global_step": 485375, "epoch": 2889} {"train_loss": -12.362890243530273, "global_step": 485376, "epoch": 2889} {"train_loss": -12.257909774780273, "global_step": 485377, "epoch": 2889} {"train_loss": -12.505965232849121, "global_step": 485378, "epoch": 2889} {"train_loss": -12.349766731262207, "global_step": 485379, "epoch": 2889} {"train_loss": -12.344339370727539, "global_step": 485380, "epoch": 2889} {"train_loss": -12.35427474975586, "global_step": 485381, "epoch": 2889} {"train_loss": -12.167745590209961, "global_step": 485382, "epoch": 2889} {"train_loss": -12.816720008850098, "global_step": 485383, "epoch": 2889} {"train_loss": -12.233991622924805, "global_step": 485384, "epoch": 2889} {"train_loss": -12.216930389404297, "global_step": 485385, "epoch": 2889} {"train_loss": -12.312726974487305, "global_step": 485386, "epoch": 2889} {"train_loss": -12.808822631835938, "global_step": 485387, "epoch": 2889} {"train_loss": -12.691328048706055, "global_step": 485388, "epoch": 2889} {"train_loss": -12.580608367919922, "global_step": 485389, "epoch": 2889} {"train_loss": -12.780315399169922, "global_step": 485390, "epoch": 2889} {"train_loss": -12.209714889526367, "global_step": 485391, "epoch": 2889} {"train_loss": -12.7874116897583, "global_step": 485392, "epoch": 2889} {"train_loss": -12.199004173278809, "global_step": 485393, "epoch": 2889} {"train_loss": -12.449891090393066, "global_step": 485394, "epoch": 2889} {"train_loss": -12.227731704711914, "global_step": 485395, "epoch": 2889} {"train_loss": -12.267251014709473, "global_step": 485396, "epoch": 2889} {"train_loss": -12.122234344482422, "global_step": 485397, "epoch": 2889} {"train_loss": -10.858644485473633, "global_step": 485398, "epoch": 2889} {"train_loss": -11.398296356201172, "global_step": 485399, "epoch": 2889} {"train_loss": -12.269779205322266, "global_step": 485400, "epoch": 2889} {"train_loss": -9.907617568969727, "global_step": 485401, "epoch": 2889} {"train_loss": -10.18713665008545, "global_step": 485402, "epoch": 2889} {"train_loss": -11.500847816467285, "global_step": 485403, "epoch": 2889} {"train_loss": -11.528926849365234, "global_step": 485404, "epoch": 2889} {"train_loss": -11.864524841308594, "global_step": 485405, "epoch": 2889} {"train_loss": -11.79837417602539, "global_step": 485406, "epoch": 2889} {"train_loss": -11.356389999389648, "global_step": 485407, "epoch": 2889} {"train_loss": -10.573467254638672, "global_step": 485408, "epoch": 2889} {"train_loss": -8.636249542236328, "global_step": 485409, "epoch": 2889} {"train_loss": -9.96949577331543, "global_step": 485410, "epoch": 2889} {"train_loss": -11.097034454345703, "global_step": 485411, "epoch": 2889} {"train_loss": -11.200851440429688, "global_step": 485412, "epoch": 2889} {"train_loss": -10.712091445922852, "global_step": 485413, "epoch": 2889} {"train_loss": -9.853972434997559, "global_step": 485414, "epoch": 2889} {"train_loss": -10.335328102111816, "global_step": 485415, "epoch": 2889} {"train_loss": -10.661042213439941, "global_step": 485416, "epoch": 2889} {"train_loss": -11.541093826293945, "global_step": 485417, "epoch": 2889} {"train_loss": -12.076056480407715, "global_step": 485418, "epoch": 2889} {"train_loss": -11.462287902832031, "global_step": 485419, "epoch": 2889} {"train_loss": -12.061931610107422, "global_step": 485420, "epoch": 2889} {"train_loss": -11.575464248657227, "global_step": 485421, "epoch": 2889} {"train_loss": -11.666303634643555, "global_step": 485422, "epoch": 2889} {"train_loss": -11.776158332824707, "global_step": 485423, "epoch": 2889} {"train_loss": -11.512186050415039, "global_step": 485424, "epoch": 2889} {"train_loss": -12.136934280395508, "global_step": 485425, "epoch": 2889} {"train_loss": -11.458074569702148, "global_step": 485426, "epoch": 2889} {"train_loss": -11.103105545043945, "global_step": 485427, "epoch": 2889} {"train_loss": -11.940509796142578, "global_step": 485428, "epoch": 2889} {"train_loss": -11.513374328613281, "global_step": 485429, "epoch": 2889} {"train_loss": -11.91372013092041, "global_step": 485430, "epoch": 2889} {"train_loss": -11.941056251525879, "global_step": 485431, "epoch": 2889} {"train_loss": -11.996814727783203, "global_step": 485432, "epoch": 2889} {"train_loss": -11.90961742401123, "global_step": 485433, "epoch": 2889} {"train_loss": -11.820557594299316, "global_step": 485434, "epoch": 2889} {"train_loss": -12.121020317077637, "global_step": 485435, "epoch": 2889} {"train_loss": -11.646520614624023, "global_step": 485436, "epoch": 2889} {"train_loss": -12.383541107177734, "global_step": 485437, "epoch": 2889} {"train_loss": -11.994270324707031, "global_step": 485438, "epoch": 2889} {"train_loss": -12.136337280273438, "global_step": 485439, "epoch": 2889} {"train_loss": -12.103553771972656, "global_step": 485440, "epoch": 2889} {"train_loss": -12.018875122070312, "global_step": 485441, "epoch": 2889} {"train_loss": -12.190675735473633, "global_step": 485442, "epoch": 2889} {"train_loss": -11.807063102722168, "global_step": 485443, "epoch": 2889} {"train_loss": -11.791314125061035, "global_step": 485444, "epoch": 2889} {"train_loss": -12.304763793945312, "global_step": 485445, "epoch": 2889} {"train_loss": -11.97024917602539, "global_step": 485446, "epoch": 2889} {"train_loss": -12.344715118408203, "global_step": 485447, "epoch": 2889} {"train_loss": -11.912825584411621, "global_step": 485448, "epoch": 2889} {"train_loss": -12.087169647216797, "global_step": 485449, "epoch": 2889} {"train_loss": -12.276212692260742, "global_step": 485450, "epoch": 2889} {"train_loss": -12.09469223022461, "global_step": 485451, "epoch": 2889} {"train_loss": -12.369638442993164, "global_step": 485452, "epoch": 2889} {"train_loss": -11.670232772827148, "global_step": 485453, "epoch": 2889} {"train_loss": -12.238688468933105, "global_step": 485454, "epoch": 2889} {"train_loss": -11.431844711303711, "global_step": 485455, "epoch": 2889} {"train_loss": -11.37510871887207, "global_step": 485456, "epoch": 2889} {"train_loss": -10.857498168945312, "global_step": 485457, "epoch": 2889} {"train_loss": -11.423913955688477, "global_step": 485458, "epoch": 2889} {"train_loss": -10.615798950195312, "global_step": 485459, "epoch": 2889} {"train_loss": -11.614922523498535, "global_step": 485460, "epoch": 2889} {"train_loss": -11.289763450622559, "global_step": 485461, "epoch": 2889} {"train_loss": -10.801715850830078, "global_step": 485462, "epoch": 2889} {"train_loss": -12.433154106140137, "global_step": 485463, "epoch": 2889} {"train_loss": -11.006891250610352, "global_step": 485464, "epoch": 2889} {"train_loss": -12.41581916809082, "global_step": 485465, "epoch": 2889} {"train_loss": -11.569535255432129, "global_step": 485466, "epoch": 2889} {"train_loss": -12.094054222106934, "global_step": 485467, "epoch": 2889} {"train_loss": -12.205266952514648, "global_step": 485468, "epoch": 2889} {"train_loss": -12.55128002166748, "global_step": 485469, "epoch": 2889} {"train_loss": -12.28190803527832, "global_step": 485470, "epoch": 2889} {"train_loss": -12.53883171081543, "global_step": 485471, "epoch": 2889} {"train_loss": -12.415115356445312, "global_step": 485472, "epoch": 2889} {"train_loss": -12.587532043457031, "global_step": 485473, "epoch": 2889} {"train_loss": -12.477676391601562, "global_step": 485474, "epoch": 2889} {"train_loss": -12.438997268676758, "global_step": 485475, "epoch": 2889} {"train_loss": -12.621699333190918, "global_step": 485476, "epoch": 2889} {"train_loss": -12.589151382446289, "global_step": 485477, "epoch": 2889} {"train_loss": -12.50145149230957, "global_step": 485478, "epoch": 2889} {"train_loss": -12.552412033081055, "global_step": 485479, "epoch": 2889} {"train_loss": -12.4125394821167, "global_step": 485480, "epoch": 2889} {"train_loss": -12.485413551330566, "global_step": 485481, "epoch": 2889} {"train_loss": -12.668487548828125, "global_step": 485482, "epoch": 2889} {"train_loss": -12.524778366088867, "global_step": 485483, "epoch": 2889} {"train_loss": -12.564786911010742, "global_step": 485484, "epoch": 2889} {"train_loss": -12.303946495056152, "global_step": 485485, "epoch": 2889} {"train_loss": -12.607803344726562, "global_step": 485486, "epoch": 2889} {"train_loss": -12.607776641845703, "global_step": 485487, "epoch": 2889} {"train_loss": -12.44909954071045, "global_step": 485488, "epoch": 2889} {"train_loss": -12.619365692138672, "global_step": 485489, "epoch": 2889} {"train_loss": -12.550564765930176, "global_step": 485490, "epoch": 2889} {"train_loss": -12.532159805297852, "global_step": 485491, "epoch": 2889} {"train_loss": -12.69017219543457, "global_step": 485492, "epoch": 2889} {"train_loss": -12.59219741821289, "global_step": 485493, "epoch": 2889} {"train_loss": -12.74173641204834, "global_step": 485494, "epoch": 2889} {"train_loss": -12.585906028747559, "global_step": 485495, "epoch": 2889} {"train_loss": -12.460297584533691, "global_step": 485496, "epoch": 2889} {"train_loss": -12.547826766967773, "global_step": 485497, "epoch": 2889} {"train_loss": -12.496831893920898, "global_step": 485498, "epoch": 2889} {"train_loss": -12.603801727294922, "global_step": 485499, "epoch": 2889} {"train_loss": -12.455371856689453, "global_step": 485500, "epoch": 2889} {"train_loss": -12.707015991210938, "global_step": 485501, "epoch": 2889} {"train_loss": -12.694042205810547, "global_step": 485502, "epoch": 2889} {"train_loss": -12.675000190734863, "global_step": 485503, "epoch": 2889} {"train_loss": -12.70862865447998, "global_step": 485504, "epoch": 2889} {"train_loss": -12.635822296142578, "global_step": 485505, "epoch": 2889} {"train_loss": -12.75001335144043, "global_step": 485506, "epoch": 2889} {"train_loss": -12.537408828735352, "global_step": 485507, "epoch": 2889} {"train_loss": -12.548903465270996, "global_step": 485508, "epoch": 2889} {"train_loss": -12.551128387451172, "global_step": 485509, "epoch": 2889} {"train_loss": -12.13041877746582, "global_step": 485510, "epoch": 2889} {"train_loss": -12.504372596740723, "global_step": 485511, "epoch": 2889} {"train_loss": -12.483560562133789, "global_step": 485512, "epoch": 2889} {"train_loss": -12.533708572387695, "global_step": 485513, "epoch": 2889} {"train_loss": -12.629169464111328, "global_step": 485514, "epoch": 2889} {"train_loss": -12.473556518554688, "global_step": 485515, "epoch": 2889} {"train_loss": -12.836179733276367, "global_step": 485516, "epoch": 2889} {"train_loss": -12.710775375366211, "global_step": 485517, "epoch": 2889} {"train_loss": -12.56060791015625, "global_step": 485518, "epoch": 2889} {"train_loss": -12.068008371761866, "global_step": 485519, "epoch": 2889, "val_loss": 313770.15625} {"train_loss": -12.443931579589844, "global_step": 485520, "epoch": 2890} {"train_loss": -12.767929077148438, "global_step": 485521, "epoch": 2890} {"train_loss": -12.873602867126465, "global_step": 485522, "epoch": 2890} {"train_loss": -12.794568061828613, "global_step": 485523, "epoch": 2890} {"train_loss": -12.70372200012207, "global_step": 485524, "epoch": 2890} {"train_loss": -12.575113296508789, "global_step": 485525, "epoch": 2890} {"train_loss": -12.451751708984375, "global_step": 485526, "epoch": 2890} {"train_loss": -12.573850631713867, "global_step": 485527, "epoch": 2890} {"train_loss": -12.727795600891113, "global_step": 485528, "epoch": 2890} {"train_loss": -12.805721282958984, "global_step": 485529, "epoch": 2890} {"train_loss": -12.793824195861816, "global_step": 485530, "epoch": 2890} {"train_loss": -12.747762680053711, "global_step": 485531, "epoch": 2890} {"train_loss": -12.796957969665527, "global_step": 485532, "epoch": 2890} {"train_loss": -12.767789840698242, "global_step": 485533, "epoch": 2890} {"train_loss": -13.010955810546875, "global_step": 485534, "epoch": 2890} {"train_loss": -12.493261337280273, "global_step": 485535, "epoch": 2890} {"train_loss": -12.940608978271484, "global_step": 485536, "epoch": 2890} {"train_loss": -12.8500337600708, "global_step": 485537, "epoch": 2890} {"train_loss": -12.95806884765625, "global_step": 485538, "epoch": 2890} {"train_loss": -12.920299530029297, "global_step": 485539, "epoch": 2890} {"train_loss": -12.888534545898438, "global_step": 485540, "epoch": 2890} {"train_loss": -12.800697326660156, "global_step": 485541, "epoch": 2890} {"train_loss": -12.850082397460938, "global_step": 485542, "epoch": 2890} {"train_loss": -12.833517074584961, "global_step": 485543, "epoch": 2890} {"train_loss": -13.173402786254883, "global_step": 485544, "epoch": 2890} {"train_loss": -12.913290977478027, "global_step": 485545, "epoch": 2890} {"train_loss": -12.963461875915527, "global_step": 485546, "epoch": 2890} {"train_loss": -13.077924728393555, "global_step": 485547, "epoch": 2890} {"train_loss": -12.861824989318848, "global_step": 485548, "epoch": 2890} {"train_loss": -13.043746948242188, "global_step": 485549, "epoch": 2890} {"train_loss": -12.86292552947998, "global_step": 485550, "epoch": 2890} {"train_loss": -13.083072662353516, "global_step": 485551, "epoch": 2890} {"train_loss": -12.773467063903809, "global_step": 485552, "epoch": 2890} {"train_loss": -12.658666610717773, "global_step": 485553, "epoch": 2890} {"train_loss": -12.971677780151367, "global_step": 485554, "epoch": 2890} {"train_loss": -12.467403411865234, "global_step": 485555, "epoch": 2890} {"train_loss": -12.339231491088867, "global_step": 485556, "epoch": 2890} {"train_loss": -12.542051315307617, "global_step": 485557, "epoch": 2890} {"train_loss": -12.401968002319336, "global_step": 485558, "epoch": 2890} {"train_loss": -11.189574241638184, "global_step": 485559, "epoch": 2890} {"train_loss": -12.025705337524414, "global_step": 485560, "epoch": 2890} {"train_loss": -12.3116455078125, "global_step": 485561, "epoch": 2890} {"train_loss": -10.516500473022461, "global_step": 485562, "epoch": 2890} {"train_loss": -11.991244316101074, "global_step": 485563, "epoch": 2890} {"train_loss": -11.963689804077148, "global_step": 485564, "epoch": 2890} {"train_loss": -11.140600204467773, "global_step": 485565, "epoch": 2890} {"train_loss": -12.566526412963867, "global_step": 485566, "epoch": 2890} {"train_loss": -11.547292709350586, "global_step": 485567, "epoch": 2890} {"train_loss": -11.941093444824219, "global_step": 485568, "epoch": 2890} {"train_loss": -10.86819076538086, "global_step": 485569, "epoch": 2890} {"train_loss": -11.88878345489502, "global_step": 485570, "epoch": 2890} {"train_loss": -12.075058937072754, "global_step": 485571, "epoch": 2890} {"train_loss": -12.166857719421387, "global_step": 485572, "epoch": 2890} {"train_loss": -10.913803100585938, "global_step": 485573, "epoch": 2890} {"train_loss": -12.486377716064453, "global_step": 485574, "epoch": 2890} {"train_loss": -12.07286262512207, "global_step": 485575, "epoch": 2890} {"train_loss": -12.510784149169922, "global_step": 485576, "epoch": 2890} {"train_loss": -12.467630386352539, "global_step": 485577, "epoch": 2890} {"train_loss": -11.904468536376953, "global_step": 485578, "epoch": 2890} {"train_loss": -11.822896957397461, "global_step": 485579, "epoch": 2890} {"train_loss": -12.700279235839844, "global_step": 485580, "epoch": 2890} {"train_loss": -12.548887252807617, "global_step": 485581, "epoch": 2890} {"train_loss": -12.231340408325195, "global_step": 485582, "epoch": 2890} {"train_loss": -11.553766250610352, "global_step": 485583, "epoch": 2890} {"train_loss": -12.513897895812988, "global_step": 485584, "epoch": 2890} {"train_loss": -12.280702590942383, "global_step": 485585, "epoch": 2890} {"train_loss": -12.039823532104492, "global_step": 485586, "epoch": 2890} {"train_loss": -12.640946388244629, "global_step": 485587, "epoch": 2890} {"train_loss": -12.400615692138672, "global_step": 485588, "epoch": 2890} {"train_loss": -11.941162109375, "global_step": 485589, "epoch": 2890} {"train_loss": -11.770734786987305, "global_step": 485590, "epoch": 2890} {"train_loss": -12.528182029724121, "global_step": 485591, "epoch": 2890} {"train_loss": -12.02160358428955, "global_step": 485592, "epoch": 2890} {"train_loss": -12.369258880615234, "global_step": 485593, "epoch": 2890} {"train_loss": -12.16806411743164, "global_step": 485594, "epoch": 2890} {"train_loss": -12.033072471618652, "global_step": 485595, "epoch": 2890} {"train_loss": -12.361730575561523, "global_step": 485596, "epoch": 2890} {"train_loss": -12.043928146362305, "global_step": 485597, "epoch": 2890} {"train_loss": -12.756246566772461, "global_step": 485598, "epoch": 2890} {"train_loss": -12.21667766571045, "global_step": 485599, "epoch": 2890} {"train_loss": -12.853446960449219, "global_step": 485600, "epoch": 2890} {"train_loss": -12.229069709777832, "global_step": 485601, "epoch": 2890} {"train_loss": -12.308860778808594, "global_step": 485602, "epoch": 2890} {"train_loss": -11.629826545715332, "global_step": 485603, "epoch": 2890} {"train_loss": -12.561318397521973, "global_step": 485604, "epoch": 2890} {"train_loss": -11.94854736328125, "global_step": 485605, "epoch": 2890} {"train_loss": -12.476048469543457, "global_step": 485606, "epoch": 2890} {"train_loss": -12.269501686096191, "global_step": 485607, "epoch": 2890} {"train_loss": -12.239522933959961, "global_step": 485608, "epoch": 2890} {"train_loss": -12.346343994140625, "global_step": 485609, "epoch": 2890} {"train_loss": -11.967659950256348, "global_step": 485610, "epoch": 2890} {"train_loss": -12.644515991210938, "global_step": 485611, "epoch": 2890} {"train_loss": -11.505748748779297, "global_step": 485612, "epoch": 2890} {"train_loss": -12.360366821289062, "global_step": 485613, "epoch": 2890} {"train_loss": -12.02709674835205, "global_step": 485614, "epoch": 2890} {"train_loss": -12.272051811218262, "global_step": 485615, "epoch": 2890} {"train_loss": -12.16724967956543, "global_step": 485616, "epoch": 2890} {"train_loss": -12.376951217651367, "global_step": 485617, "epoch": 2890} {"train_loss": -11.5047025680542, "global_step": 485618, "epoch": 2890} {"train_loss": -12.663968086242676, "global_step": 485619, "epoch": 2890} {"train_loss": -12.386273384094238, "global_step": 485620, "epoch": 2890} {"train_loss": -12.227890968322754, "global_step": 485621, "epoch": 2890} {"train_loss": -12.158559799194336, "global_step": 485622, "epoch": 2890} {"train_loss": -11.75495719909668, "global_step": 485623, "epoch": 2890} {"train_loss": -11.735668182373047, "global_step": 485624, "epoch": 2890} {"train_loss": -12.275068283081055, "global_step": 485625, "epoch": 2890} {"train_loss": -10.973587036132812, "global_step": 485626, "epoch": 2890} {"train_loss": -12.409278869628906, "global_step": 485627, "epoch": 2890} {"train_loss": -12.02098274230957, "global_step": 485628, "epoch": 2890} {"train_loss": -12.27981948852539, "global_step": 485629, "epoch": 2890} {"train_loss": -12.320053100585938, "global_step": 485630, "epoch": 2890} {"train_loss": -11.991971969604492, "global_step": 485631, "epoch": 2890} {"train_loss": -11.534334182739258, "global_step": 485632, "epoch": 2890} {"train_loss": -11.271265983581543, "global_step": 485633, "epoch": 2890} {"train_loss": -10.831816673278809, "global_step": 485634, "epoch": 2890} {"train_loss": -11.531207084655762, "global_step": 485635, "epoch": 2890} {"train_loss": -11.097335815429688, "global_step": 485636, "epoch": 2890} {"train_loss": -10.208080291748047, "global_step": 485637, "epoch": 2890} {"train_loss": -12.0305814743042, "global_step": 485638, "epoch": 2890} {"train_loss": -10.266057014465332, "global_step": 485639, "epoch": 2890} {"train_loss": -12.102205276489258, "global_step": 485640, "epoch": 2890} {"train_loss": -11.225324630737305, "global_step": 485641, "epoch": 2890} {"train_loss": -10.955726623535156, "global_step": 485642, "epoch": 2890} {"train_loss": -9.979783058166504, "global_step": 485643, "epoch": 2890} {"train_loss": -11.653861045837402, "global_step": 485644, "epoch": 2890} {"train_loss": -9.490009307861328, "global_step": 485645, "epoch": 2890} {"train_loss": -10.616816520690918, "global_step": 485646, "epoch": 2890} {"train_loss": -10.95047378540039, "global_step": 485647, "epoch": 2890} {"train_loss": -9.80637264251709, "global_step": 485648, "epoch": 2890} {"train_loss": -10.980440139770508, "global_step": 485649, "epoch": 2890} {"train_loss": -11.102252960205078, "global_step": 485650, "epoch": 2890} {"train_loss": -10.611004829406738, "global_step": 485651, "epoch": 2890} {"train_loss": -12.270491600036621, "global_step": 485652, "epoch": 2890} {"train_loss": -10.03861141204834, "global_step": 485653, "epoch": 2890} {"train_loss": -12.30423355102539, "global_step": 485654, "epoch": 2890} {"train_loss": -10.967842102050781, "global_step": 485655, "epoch": 2890} {"train_loss": -11.765592575073242, "global_step": 485656, "epoch": 2890} {"train_loss": -12.070940017700195, "global_step": 485657, "epoch": 2890} {"train_loss": -11.654516220092773, "global_step": 485658, "epoch": 2890} {"train_loss": -12.051759719848633, "global_step": 485659, "epoch": 2890} {"train_loss": -12.055124282836914, "global_step": 485660, "epoch": 2890} {"train_loss": -12.045124053955078, "global_step": 485661, "epoch": 2890} {"train_loss": -12.165771484375, "global_step": 485662, "epoch": 2890} {"train_loss": -12.28597354888916, "global_step": 485663, "epoch": 2890} {"train_loss": -12.252886772155762, "global_step": 485664, "epoch": 2890} {"train_loss": -12.015995979309082, "global_step": 485665, "epoch": 2890} {"train_loss": -12.381871223449707, "global_step": 485666, "epoch": 2890} {"train_loss": -12.101551055908203, "global_step": 485667, "epoch": 2890} {"train_loss": -12.198333740234375, "global_step": 485668, "epoch": 2890} {"train_loss": -12.469345092773438, "global_step": 485669, "epoch": 2890} {"train_loss": -12.354984283447266, "global_step": 485670, "epoch": 2890} {"train_loss": -12.377388000488281, "global_step": 485671, "epoch": 2890} {"train_loss": -12.662095069885254, "global_step": 485672, "epoch": 2890} {"train_loss": -12.231073379516602, "global_step": 485673, "epoch": 2890} {"train_loss": -12.3649263381958, "global_step": 485674, "epoch": 2890} {"train_loss": -12.20669174194336, "global_step": 485675, "epoch": 2890} {"train_loss": -12.477697372436523, "global_step": 485676, "epoch": 2890} {"train_loss": -12.669607162475586, "global_step": 485677, "epoch": 2890} {"train_loss": -12.629199981689453, "global_step": 485678, "epoch": 2890} {"train_loss": -12.708377838134766, "global_step": 485679, "epoch": 2890} {"train_loss": -12.599332809448242, "global_step": 485680, "epoch": 2890} {"train_loss": -12.532289505004883, "global_step": 485681, "epoch": 2890} {"train_loss": -12.875909805297852, "global_step": 485682, "epoch": 2890} {"train_loss": -12.840124130249023, "global_step": 485683, "epoch": 2890} {"train_loss": -12.791939735412598, "global_step": 485684, "epoch": 2890} {"train_loss": -12.71957778930664, "global_step": 485685, "epoch": 2890} {"train_loss": -12.843365669250488, "global_step": 485686, "epoch": 2890} {"train_loss": -12.146401825405302, "global_step": 485687, "epoch": 2890, "val_loss": 314307.96875, "train_action_mse_error": 0.4863646626472473} {"train_loss": -12.865032196044922, "global_step": 485688, "epoch": 2891} {"train_loss": -12.685617446899414, "global_step": 485689, "epoch": 2891} {"train_loss": -12.63304328918457, "global_step": 485690, "epoch": 2891} {"train_loss": -12.742286682128906, "global_step": 485691, "epoch": 2891} {"train_loss": -12.792895317077637, "global_step": 485692, "epoch": 2891} {"train_loss": -12.684040069580078, "global_step": 485693, "epoch": 2891} {"train_loss": -12.666901588439941, "global_step": 485694, "epoch": 2891} {"train_loss": -12.630457878112793, "global_step": 485695, "epoch": 2891} {"train_loss": -12.708209991455078, "global_step": 485696, "epoch": 2891} {"train_loss": -12.626683235168457, "global_step": 485697, "epoch": 2891} {"train_loss": -12.50224494934082, "global_step": 485698, "epoch": 2891} {"train_loss": -12.234682083129883, "global_step": 485699, "epoch": 2891} {"train_loss": -12.885257720947266, "global_step": 485700, "epoch": 2891} {"train_loss": -12.558892250061035, "global_step": 485701, "epoch": 2891} {"train_loss": -12.741703033447266, "global_step": 485702, "epoch": 2891} {"train_loss": -12.758774757385254, "global_step": 485703, "epoch": 2891} {"train_loss": -12.424222946166992, "global_step": 485704, "epoch": 2891} {"train_loss": -12.823163986206055, "global_step": 485705, "epoch": 2891} {"train_loss": -12.458438873291016, "global_step": 485706, "epoch": 2891} {"train_loss": -12.820980072021484, "global_step": 485707, "epoch": 2891} {"train_loss": -12.57537841796875, "global_step": 485708, "epoch": 2891} {"train_loss": -12.832053184509277, "global_step": 485709, "epoch": 2891} {"train_loss": -12.765087127685547, "global_step": 485710, "epoch": 2891} {"train_loss": -12.7391357421875, "global_step": 485711, "epoch": 2891} {"train_loss": -12.667106628417969, "global_step": 485712, "epoch": 2891} {"train_loss": -12.515235900878906, "global_step": 485713, "epoch": 2891} {"train_loss": -12.649085998535156, "global_step": 485714, "epoch": 2891} {"train_loss": -12.448848724365234, "global_step": 485715, "epoch": 2891} {"train_loss": -12.562612533569336, "global_step": 485716, "epoch": 2891} {"train_loss": -12.887516021728516, "global_step": 485717, "epoch": 2891} {"train_loss": -12.688041687011719, "global_step": 485718, "epoch": 2891} {"train_loss": -12.644655227661133, "global_step": 485719, "epoch": 2891} {"train_loss": -12.779741287231445, "global_step": 485720, "epoch": 2891} {"train_loss": -12.607921600341797, "global_step": 485721, "epoch": 2891} {"train_loss": -12.539958000183105, "global_step": 485722, "epoch": 2891} {"train_loss": -12.725391387939453, "global_step": 485723, "epoch": 2891} {"train_loss": -12.997960090637207, "global_step": 485724, "epoch": 2891} {"train_loss": -12.904138565063477, "global_step": 485725, "epoch": 2891} {"train_loss": -12.498835563659668, "global_step": 485726, "epoch": 2891} {"train_loss": -12.728463172912598, "global_step": 485727, "epoch": 2891} {"train_loss": -12.657989501953125, "global_step": 485728, "epoch": 2891} {"train_loss": -12.72964096069336, "global_step": 485729, "epoch": 2891} {"train_loss": -12.816183090209961, "global_step": 485730, "epoch": 2891} {"train_loss": -12.731459617614746, "global_step": 485731, "epoch": 2891} {"train_loss": -12.599218368530273, "global_step": 485732, "epoch": 2891} {"train_loss": -12.681844711303711, "global_step": 485733, "epoch": 2891} {"train_loss": -13.08439826965332, "global_step": 485734, "epoch": 2891} {"train_loss": -12.378706932067871, "global_step": 485735, "epoch": 2891} {"train_loss": -12.333303451538086, "global_step": 485736, "epoch": 2891} {"train_loss": -12.90254020690918, "global_step": 485737, "epoch": 2891} {"train_loss": -12.413999557495117, "global_step": 485738, "epoch": 2891} {"train_loss": -12.670389175415039, "global_step": 485739, "epoch": 2891} {"train_loss": -13.1336030960083, "global_step": 485740, "epoch": 2891} {"train_loss": -12.541712760925293, "global_step": 485741, "epoch": 2891} {"train_loss": -12.743741989135742, "global_step": 485742, "epoch": 2891} {"train_loss": -12.841035842895508, "global_step": 485743, "epoch": 2891} {"train_loss": -12.723793983459473, "global_step": 485744, "epoch": 2891} {"train_loss": -12.743253707885742, "global_step": 485745, "epoch": 2891} {"train_loss": -12.733613014221191, "global_step": 485746, "epoch": 2891} {"train_loss": -12.37843132019043, "global_step": 485747, "epoch": 2891} {"train_loss": -13.134013175964355, "global_step": 485748, "epoch": 2891} {"train_loss": -12.597602844238281, "global_step": 485749, "epoch": 2891} {"train_loss": -12.638642311096191, "global_step": 485750, "epoch": 2891} {"train_loss": -12.813983917236328, "global_step": 485751, "epoch": 2891} {"train_loss": -12.597779273986816, "global_step": 485752, "epoch": 2891} {"train_loss": -12.199422836303711, "global_step": 485753, "epoch": 2891} {"train_loss": -12.435030937194824, "global_step": 485754, "epoch": 2891} {"train_loss": -12.665855407714844, "global_step": 485755, "epoch": 2891} {"train_loss": -12.768985748291016, "global_step": 485756, "epoch": 2891} {"train_loss": -12.030080795288086, "global_step": 485757, "epoch": 2891} {"train_loss": -12.913606643676758, "global_step": 485758, "epoch": 2891} {"train_loss": -12.836615562438965, "global_step": 485759, "epoch": 2891} {"train_loss": -12.814955711364746, "global_step": 485760, "epoch": 2891} {"train_loss": -12.365827560424805, "global_step": 485761, "epoch": 2891} {"train_loss": -12.670320510864258, "global_step": 485762, "epoch": 2891} {"train_loss": -12.732328414916992, "global_step": 485763, "epoch": 2891} {"train_loss": -12.946549415588379, "global_step": 485764, "epoch": 2891} {"train_loss": -12.72526741027832, "global_step": 485765, "epoch": 2891} {"train_loss": -12.620341300964355, "global_step": 485766, "epoch": 2891} {"train_loss": -12.6917085647583, "global_step": 485767, "epoch": 2891} {"train_loss": -12.471056938171387, "global_step": 485768, "epoch": 2891} {"train_loss": -12.327686309814453, "global_step": 485769, "epoch": 2891} {"train_loss": -12.619847297668457, "global_step": 485770, "epoch": 2891} {"train_loss": -12.788569450378418, "global_step": 485771, "epoch": 2891} {"train_loss": -12.475719451904297, "global_step": 485772, "epoch": 2891} {"train_loss": -12.177827835083008, "global_step": 485773, "epoch": 2891} {"train_loss": -13.032094955444336, "global_step": 485774, "epoch": 2891} {"train_loss": -11.249019622802734, "global_step": 485775, "epoch": 2891} {"train_loss": -11.43278694152832, "global_step": 485776, "epoch": 2891} {"train_loss": -12.959283828735352, "global_step": 485777, "epoch": 2891} {"train_loss": -10.305619239807129, "global_step": 485778, "epoch": 2891} {"train_loss": -11.793651580810547, "global_step": 485779, "epoch": 2891} {"train_loss": -12.188005447387695, "global_step": 485780, "epoch": 2891} {"train_loss": -11.37466812133789, "global_step": 485781, "epoch": 2891} {"train_loss": -12.386157989501953, "global_step": 485782, "epoch": 2891} {"train_loss": -10.486888885498047, "global_step": 485783, "epoch": 2891} {"train_loss": -10.346541404724121, "global_step": 485784, "epoch": 2891} {"train_loss": -12.051910400390625, "global_step": 485785, "epoch": 2891} {"train_loss": -10.907448768615723, "global_step": 485786, "epoch": 2891} {"train_loss": -11.85676383972168, "global_step": 485787, "epoch": 2891} {"train_loss": -11.382766723632812, "global_step": 485788, "epoch": 2891} {"train_loss": -11.451181411743164, "global_step": 485789, "epoch": 2891} {"train_loss": -11.213285446166992, "global_step": 485790, "epoch": 2891} {"train_loss": -11.399847984313965, "global_step": 485791, "epoch": 2891} {"train_loss": -11.404714584350586, "global_step": 485792, "epoch": 2891} {"train_loss": -12.241809844970703, "global_step": 485793, "epoch": 2891} {"train_loss": -10.92208480834961, "global_step": 485794, "epoch": 2891} {"train_loss": -12.248903274536133, "global_step": 485795, "epoch": 2891} {"train_loss": -11.53269100189209, "global_step": 485796, "epoch": 2891} {"train_loss": -11.725569725036621, "global_step": 485797, "epoch": 2891} {"train_loss": -11.975160598754883, "global_step": 485798, "epoch": 2891} {"train_loss": -11.568113327026367, "global_step": 485799, "epoch": 2891} {"train_loss": -12.323074340820312, "global_step": 485800, "epoch": 2891} {"train_loss": -11.821653366088867, "global_step": 485801, "epoch": 2891} {"train_loss": -12.069913864135742, "global_step": 485802, "epoch": 2891} {"train_loss": -12.148361206054688, "global_step": 485803, "epoch": 2891} {"train_loss": -11.833312034606934, "global_step": 485804, "epoch": 2891} {"train_loss": -12.080689430236816, "global_step": 485805, "epoch": 2891} {"train_loss": -12.08996295928955, "global_step": 485806, "epoch": 2891} {"train_loss": -12.557523727416992, "global_step": 485807, "epoch": 2891} {"train_loss": -11.652338981628418, "global_step": 485808, "epoch": 2891} {"train_loss": -11.25864028930664, "global_step": 485809, "epoch": 2891} {"train_loss": -11.940513610839844, "global_step": 485810, "epoch": 2891} {"train_loss": -10.85428237915039, "global_step": 485811, "epoch": 2891} {"train_loss": -11.674400329589844, "global_step": 485812, "epoch": 2891} {"train_loss": -9.665536880493164, "global_step": 485813, "epoch": 2891} {"train_loss": -10.46042251586914, "global_step": 485814, "epoch": 2891} {"train_loss": -10.803741455078125, "global_step": 485815, "epoch": 2891} {"train_loss": -9.601107597351074, "global_step": 485816, "epoch": 2891} {"train_loss": -11.690872192382812, "global_step": 485817, "epoch": 2891} {"train_loss": -9.07823657989502, "global_step": 485818, "epoch": 2891} {"train_loss": -11.107086181640625, "global_step": 485819, "epoch": 2891} {"train_loss": -8.63813591003418, "global_step": 485820, "epoch": 2891} {"train_loss": -8.464025497436523, "global_step": 485821, "epoch": 2891} {"train_loss": -12.03449821472168, "global_step": 485822, "epoch": 2891} {"train_loss": -8.878717422485352, "global_step": 485823, "epoch": 2891} {"train_loss": -10.957748413085938, "global_step": 485824, "epoch": 2891} {"train_loss": -8.896095275878906, "global_step": 485825, "epoch": 2891} {"train_loss": -10.225927352905273, "global_step": 485826, "epoch": 2891} {"train_loss": -9.826412200927734, "global_step": 485827, "epoch": 2891} {"train_loss": -10.512147903442383, "global_step": 485828, "epoch": 2891} {"train_loss": -11.461991310119629, "global_step": 485829, "epoch": 2891} {"train_loss": -10.115769386291504, "global_step": 485830, "epoch": 2891} {"train_loss": -11.374205589294434, "global_step": 485831, "epoch": 2891} {"train_loss": -10.727509498596191, "global_step": 485832, "epoch": 2891} {"train_loss": -11.065971374511719, "global_step": 485833, "epoch": 2891} {"train_loss": -10.647680282592773, "global_step": 485834, "epoch": 2891} {"train_loss": -11.879653930664062, "global_step": 485835, "epoch": 2891} {"train_loss": -11.28502368927002, "global_step": 485836, "epoch": 2891} {"train_loss": -11.227581977844238, "global_step": 485837, "epoch": 2891} {"train_loss": -11.759166717529297, "global_step": 485838, "epoch": 2891} {"train_loss": -11.493093490600586, "global_step": 485839, "epoch": 2891} {"train_loss": -11.939117431640625, "global_step": 485840, "epoch": 2891} {"train_loss": -11.301297187805176, "global_step": 485841, "epoch": 2891} {"train_loss": -12.19671630859375, "global_step": 485842, "epoch": 2891} {"train_loss": -11.55881118774414, "global_step": 485843, "epoch": 2891} {"train_loss": -11.499650001525879, "global_step": 485844, "epoch": 2891} {"train_loss": -12.02687931060791, "global_step": 485845, "epoch": 2891} {"train_loss": -11.789606094360352, "global_step": 485846, "epoch": 2891} {"train_loss": -11.659097671508789, "global_step": 485847, "epoch": 2891} {"train_loss": -11.78897762298584, "global_step": 485848, "epoch": 2891} {"train_loss": -11.903528213500977, "global_step": 485849, "epoch": 2891} {"train_loss": -12.07807445526123, "global_step": 485850, "epoch": 2891} {"train_loss": -12.496358871459961, "global_step": 485851, "epoch": 2891} {"train_loss": -11.93983268737793, "global_step": 485852, "epoch": 2891} {"train_loss": -12.014472007751465, "global_step": 485853, "epoch": 2891} {"train_loss": -12.39596939086914, "global_step": 485854, "epoch": 2891} {"train_loss": -12.016214558056422, "global_step": 485855, "epoch": 2891, "val_loss": 319653.40625} {"train_loss": -12.42974853515625, "global_step": 485856, "epoch": 2892} {"train_loss": -12.1879243850708, "global_step": 485857, "epoch": 2892} {"train_loss": -12.401408195495605, "global_step": 485858, "epoch": 2892} {"train_loss": -12.392844200134277, "global_step": 485859, "epoch": 2892} {"train_loss": -12.502286911010742, "global_step": 485860, "epoch": 2892} {"train_loss": -12.261152267456055, "global_step": 485861, "epoch": 2892} {"train_loss": -12.332999229431152, "global_step": 485862, "epoch": 2892} {"train_loss": -12.408974647521973, "global_step": 485863, "epoch": 2892} {"train_loss": -12.431924819946289, "global_step": 485864, "epoch": 2892} {"train_loss": -12.57923698425293, "global_step": 485865, "epoch": 2892} {"train_loss": -12.574444770812988, "global_step": 485866, "epoch": 2892} {"train_loss": -12.579566955566406, "global_step": 485867, "epoch": 2892} {"train_loss": -12.45654296875, "global_step": 485868, "epoch": 2892} {"train_loss": -12.442126274108887, "global_step": 485869, "epoch": 2892} {"train_loss": -12.683341026306152, "global_step": 485870, "epoch": 2892} {"train_loss": -12.733022689819336, "global_step": 485871, "epoch": 2892} {"train_loss": -12.673911094665527, "global_step": 485872, "epoch": 2892} {"train_loss": -12.681621551513672, "global_step": 485873, "epoch": 2892} {"train_loss": -12.724227905273438, "global_step": 485874, "epoch": 2892} {"train_loss": -12.600235939025879, "global_step": 485875, "epoch": 2892} {"train_loss": -12.596163749694824, "global_step": 485876, "epoch": 2892} {"train_loss": -12.633014678955078, "global_step": 485877, "epoch": 2892} {"train_loss": -12.704167366027832, "global_step": 485878, "epoch": 2892} {"train_loss": -12.626379013061523, "global_step": 485879, "epoch": 2892} {"train_loss": -12.582541465759277, "global_step": 485880, "epoch": 2892} {"train_loss": -12.839635848999023, "global_step": 485881, "epoch": 2892} {"train_loss": -12.761981964111328, "global_step": 485882, "epoch": 2892} {"train_loss": -12.787162780761719, "global_step": 485883, "epoch": 2892} {"train_loss": -12.685803413391113, "global_step": 485884, "epoch": 2892} {"train_loss": -12.55238151550293, "global_step": 485885, "epoch": 2892} {"train_loss": -12.586040496826172, "global_step": 485886, "epoch": 2892} {"train_loss": -12.615081787109375, "global_step": 485887, "epoch": 2892} {"train_loss": -12.797653198242188, "global_step": 485888, "epoch": 2892} {"train_loss": -12.775601387023926, "global_step": 485889, "epoch": 2892} {"train_loss": -12.637029647827148, "global_step": 485890, "epoch": 2892} {"train_loss": -12.624872207641602, "global_step": 485891, "epoch": 2892} {"train_loss": -12.68552017211914, "global_step": 485892, "epoch": 2892} {"train_loss": -12.796897888183594, "global_step": 485893, "epoch": 2892} {"train_loss": -12.798036575317383, "global_step": 485894, "epoch": 2892} {"train_loss": -12.888614654541016, "global_step": 485895, "epoch": 2892} {"train_loss": -12.699042320251465, "global_step": 485896, "epoch": 2892} {"train_loss": -12.827152252197266, "global_step": 485897, "epoch": 2892} {"train_loss": -12.953824043273926, "global_step": 485898, "epoch": 2892} {"train_loss": -12.818726539611816, "global_step": 485899, "epoch": 2892} {"train_loss": -12.891267776489258, "global_step": 485900, "epoch": 2892} {"train_loss": -12.780557632446289, "global_step": 485901, "epoch": 2892} {"train_loss": -12.583807945251465, "global_step": 485902, "epoch": 2892} {"train_loss": -12.764944076538086, "global_step": 485903, "epoch": 2892} {"train_loss": -12.775650024414062, "global_step": 485904, "epoch": 2892} {"train_loss": -12.695524215698242, "global_step": 485905, "epoch": 2892} {"train_loss": -12.820357322692871, "global_step": 485906, "epoch": 2892} {"train_loss": -12.546910285949707, "global_step": 485907, "epoch": 2892} {"train_loss": -12.75550651550293, "global_step": 485908, "epoch": 2892} {"train_loss": -12.789531707763672, "global_step": 485909, "epoch": 2892} {"train_loss": -12.928153991699219, "global_step": 485910, "epoch": 2892} {"train_loss": -12.703140258789062, "global_step": 485911, "epoch": 2892} {"train_loss": -12.786450386047363, "global_step": 485912, "epoch": 2892} {"train_loss": -12.913989067077637, "global_step": 485913, "epoch": 2892} {"train_loss": -12.907691955566406, "global_step": 485914, "epoch": 2892} {"train_loss": -12.367290496826172, "global_step": 485915, "epoch": 2892} {"train_loss": -13.07418441772461, "global_step": 485916, "epoch": 2892} {"train_loss": -12.452910423278809, "global_step": 485917, "epoch": 2892} {"train_loss": -12.662727355957031, "global_step": 485918, "epoch": 2892} {"train_loss": -12.7695894241333, "global_step": 485919, "epoch": 2892} {"train_loss": -12.752056121826172, "global_step": 485920, "epoch": 2892} {"train_loss": -12.84951400756836, "global_step": 485921, "epoch": 2892} {"train_loss": -12.950430870056152, "global_step": 485922, "epoch": 2892} {"train_loss": -12.878395080566406, "global_step": 485923, "epoch": 2892} {"train_loss": -13.083269119262695, "global_step": 485924, "epoch": 2892} {"train_loss": -12.814590454101562, "global_step": 485925, "epoch": 2892} {"train_loss": -12.844881057739258, "global_step": 485926, "epoch": 2892} {"train_loss": -12.802993774414062, "global_step": 485927, "epoch": 2892} {"train_loss": -12.712367057800293, "global_step": 485928, "epoch": 2892} {"train_loss": -12.881624221801758, "global_step": 485929, "epoch": 2892} {"train_loss": -12.995187759399414, "global_step": 485930, "epoch": 2892} {"train_loss": -12.750251770019531, "global_step": 485931, "epoch": 2892} {"train_loss": -12.557570457458496, "global_step": 485932, "epoch": 2892} {"train_loss": -12.621908187866211, "global_step": 485933, "epoch": 2892} {"train_loss": -12.600605010986328, "global_step": 485934, "epoch": 2892} {"train_loss": -12.173516273498535, "global_step": 485935, "epoch": 2892} {"train_loss": -12.073493957519531, "global_step": 485936, "epoch": 2892} {"train_loss": -12.558050155639648, "global_step": 485937, "epoch": 2892} {"train_loss": -11.612585067749023, "global_step": 485938, "epoch": 2892} {"train_loss": -10.877326965332031, "global_step": 485939, "epoch": 2892} {"train_loss": -12.758560180664062, "global_step": 485940, "epoch": 2892} {"train_loss": -11.485976219177246, "global_step": 485941, "epoch": 2892} {"train_loss": -12.102432250976562, "global_step": 485942, "epoch": 2892} {"train_loss": -12.709059715270996, "global_step": 485943, "epoch": 2892} {"train_loss": -12.616113662719727, "global_step": 485944, "epoch": 2892} {"train_loss": -12.319982528686523, "global_step": 485945, "epoch": 2892} {"train_loss": -12.859830856323242, "global_step": 485946, "epoch": 2892} {"train_loss": -12.782514572143555, "global_step": 485947, "epoch": 2892} {"train_loss": -12.380537986755371, "global_step": 485948, "epoch": 2892} {"train_loss": -12.356995582580566, "global_step": 485949, "epoch": 2892} {"train_loss": -12.900838851928711, "global_step": 485950, "epoch": 2892} {"train_loss": -12.73768138885498, "global_step": 485951, "epoch": 2892} {"train_loss": -12.697230339050293, "global_step": 485952, "epoch": 2892} {"train_loss": -12.512175559997559, "global_step": 485953, "epoch": 2892} {"train_loss": -12.721822738647461, "global_step": 485954, "epoch": 2892} {"train_loss": -12.666498184204102, "global_step": 485955, "epoch": 2892} {"train_loss": -12.915361404418945, "global_step": 485956, "epoch": 2892} {"train_loss": -12.521376609802246, "global_step": 485957, "epoch": 2892} {"train_loss": -12.832048416137695, "global_step": 485958, "epoch": 2892} {"train_loss": -12.920331954956055, "global_step": 485959, "epoch": 2892} {"train_loss": -13.000541687011719, "global_step": 485960, "epoch": 2892} {"train_loss": -12.815065383911133, "global_step": 485961, "epoch": 2892} {"train_loss": -12.856672286987305, "global_step": 485962, "epoch": 2892} {"train_loss": -12.756717681884766, "global_step": 485963, "epoch": 2892} {"train_loss": -12.631118774414062, "global_step": 485964, "epoch": 2892} {"train_loss": -12.505659103393555, "global_step": 485965, "epoch": 2892} {"train_loss": -12.721975326538086, "global_step": 485966, "epoch": 2892} {"train_loss": -12.483999252319336, "global_step": 485967, "epoch": 2892} {"train_loss": -12.482787132263184, "global_step": 485968, "epoch": 2892} {"train_loss": -12.415332794189453, "global_step": 485969, "epoch": 2892} {"train_loss": -12.434483528137207, "global_step": 485970, "epoch": 2892} {"train_loss": -11.972668647766113, "global_step": 485971, "epoch": 2892} {"train_loss": -12.550061225891113, "global_step": 485972, "epoch": 2892} {"train_loss": -11.774969100952148, "global_step": 485973, "epoch": 2892} {"train_loss": -12.514139175415039, "global_step": 485974, "epoch": 2892} {"train_loss": -12.510421752929688, "global_step": 485975, "epoch": 2892} {"train_loss": -12.358906745910645, "global_step": 485976, "epoch": 2892} {"train_loss": -12.286515235900879, "global_step": 485977, "epoch": 2892} {"train_loss": -12.671327590942383, "global_step": 485978, "epoch": 2892} {"train_loss": -12.606033325195312, "global_step": 485979, "epoch": 2892} {"train_loss": -12.355901718139648, "global_step": 485980, "epoch": 2892} {"train_loss": -12.104244232177734, "global_step": 485981, "epoch": 2892} {"train_loss": -11.407483100891113, "global_step": 485982, "epoch": 2892} {"train_loss": -10.971561431884766, "global_step": 485983, "epoch": 2892} {"train_loss": -9.860361099243164, "global_step": 485984, "epoch": 2892} {"train_loss": -10.00792407989502, "global_step": 485985, "epoch": 2892} {"train_loss": -10.807632446289062, "global_step": 485986, "epoch": 2892} {"train_loss": -10.787788391113281, "global_step": 485987, "epoch": 2892} {"train_loss": -10.159116744995117, "global_step": 485988, "epoch": 2892} {"train_loss": -9.52802562713623, "global_step": 485989, "epoch": 2892} {"train_loss": -10.191492080688477, "global_step": 485990, "epoch": 2892} {"train_loss": -11.03188705444336, "global_step": 485991, "epoch": 2892} {"train_loss": -11.652292251586914, "global_step": 485992, "epoch": 2892} {"train_loss": -10.608047485351562, "global_step": 485993, "epoch": 2892} {"train_loss": -11.46567440032959, "global_step": 485994, "epoch": 2892} {"train_loss": -11.504161834716797, "global_step": 485995, "epoch": 2892} {"train_loss": -11.736099243164062, "global_step": 485996, "epoch": 2892} {"train_loss": -11.53568172454834, "global_step": 485997, "epoch": 2892} {"train_loss": -10.695257186889648, "global_step": 485998, "epoch": 2892} {"train_loss": -11.616597175598145, "global_step": 485999, "epoch": 2892} {"train_loss": -11.207478523254395, "global_step": 486000, "epoch": 2892} {"train_loss": -11.806434631347656, "global_step": 486001, "epoch": 2892} {"train_loss": -10.824174880981445, "global_step": 486002, "epoch": 2892} {"train_loss": -11.442131042480469, "global_step": 486003, "epoch": 2892} {"train_loss": -11.275960922241211, "global_step": 486004, "epoch": 2892} {"train_loss": -9.65390396118164, "global_step": 486005, "epoch": 2892} {"train_loss": -12.018552780151367, "global_step": 486006, "epoch": 2892} {"train_loss": -9.335050582885742, "global_step": 486007, "epoch": 2892} {"train_loss": -12.099752426147461, "global_step": 486008, "epoch": 2892} {"train_loss": -9.545816421508789, "global_step": 486009, "epoch": 2892} {"train_loss": -10.985148429870605, "global_step": 486010, "epoch": 2892} {"train_loss": -10.363933563232422, "global_step": 486011, "epoch": 2892} {"train_loss": -11.411810874938965, "global_step": 486012, "epoch": 2892} {"train_loss": -10.320928573608398, "global_step": 486013, "epoch": 2892} {"train_loss": -10.569717407226562, "global_step": 486014, "epoch": 2892} {"train_loss": -10.876306533813477, "global_step": 486015, "epoch": 2892} {"train_loss": -11.205698013305664, "global_step": 486016, "epoch": 2892} {"train_loss": -11.020024299621582, "global_step": 486017, "epoch": 2892} {"train_loss": -11.387056350708008, "global_step": 486018, "epoch": 2892} {"train_loss": -11.356578826904297, "global_step": 486019, "epoch": 2892} {"train_loss": -11.554399490356445, "global_step": 486020, "epoch": 2892} {"train_loss": -11.567139625549316, "global_step": 486021, "epoch": 2892} {"train_loss": -11.561460494995117, "global_step": 486022, "epoch": 2892} {"train_loss": -12.196031610171, "global_step": 486023, "epoch": 2892, "val_loss": 313644.15625} {"train_loss": -11.349809646606445, "global_step": 486024, "epoch": 2893} {"train_loss": -11.426338195800781, "global_step": 486025, "epoch": 2893} {"train_loss": -11.690603256225586, "global_step": 486026, "epoch": 2893} {"train_loss": -11.83228588104248, "global_step": 486027, "epoch": 2893} {"train_loss": -11.593904495239258, "global_step": 486028, "epoch": 2893} {"train_loss": -11.993874549865723, "global_step": 486029, "epoch": 2893} {"train_loss": -12.060571670532227, "global_step": 486030, "epoch": 2893} {"train_loss": -11.875609397888184, "global_step": 486031, "epoch": 2893} {"train_loss": -11.941442489624023, "global_step": 486032, "epoch": 2893} {"train_loss": -12.28192138671875, "global_step": 486033, "epoch": 2893} {"train_loss": -11.817262649536133, "global_step": 486034, "epoch": 2893} {"train_loss": -12.0769681930542, "global_step": 486035, "epoch": 2893} {"train_loss": -12.233649253845215, "global_step": 486036, "epoch": 2893} {"train_loss": -11.795610427856445, "global_step": 486037, "epoch": 2893} {"train_loss": -12.223867416381836, "global_step": 486038, "epoch": 2893} {"train_loss": -12.084640502929688, "global_step": 486039, "epoch": 2893} {"train_loss": -12.149274826049805, "global_step": 486040, "epoch": 2893} {"train_loss": -12.028460502624512, "global_step": 486041, "epoch": 2893} {"train_loss": -12.248476028442383, "global_step": 486042, "epoch": 2893} {"train_loss": -12.062774658203125, "global_step": 486043, "epoch": 2893} {"train_loss": -12.643868446350098, "global_step": 486044, "epoch": 2893} {"train_loss": -12.121326446533203, "global_step": 486045, "epoch": 2893} {"train_loss": -12.235173225402832, "global_step": 486046, "epoch": 2893} {"train_loss": -12.42070484161377, "global_step": 486047, "epoch": 2893} {"train_loss": -12.098438262939453, "global_step": 486048, "epoch": 2893} {"train_loss": -12.647584915161133, "global_step": 486049, "epoch": 2893} {"train_loss": -12.424468040466309, "global_step": 486050, "epoch": 2893} {"train_loss": -12.410829544067383, "global_step": 486051, "epoch": 2893} {"train_loss": -12.26479434967041, "global_step": 486052, "epoch": 2893} {"train_loss": -12.577482223510742, "global_step": 486053, "epoch": 2893} {"train_loss": -12.276508331298828, "global_step": 486054, "epoch": 2893} {"train_loss": -12.42031192779541, "global_step": 486055, "epoch": 2893} {"train_loss": -12.571887969970703, "global_step": 486056, "epoch": 2893} {"train_loss": -12.062498092651367, "global_step": 486057, "epoch": 2893} {"train_loss": -12.843731880187988, "global_step": 486058, "epoch": 2893} {"train_loss": -12.340692520141602, "global_step": 486059, "epoch": 2893} {"train_loss": -12.246442794799805, "global_step": 486060, "epoch": 2893} {"train_loss": -12.733579635620117, "global_step": 486061, "epoch": 2893} {"train_loss": -12.302434921264648, "global_step": 486062, "epoch": 2893} {"train_loss": -12.497814178466797, "global_step": 486063, "epoch": 2893} {"train_loss": -12.683351516723633, "global_step": 486064, "epoch": 2893} {"train_loss": -12.391965866088867, "global_step": 486065, "epoch": 2893} {"train_loss": -12.597909927368164, "global_step": 486066, "epoch": 2893} {"train_loss": -12.636870384216309, "global_step": 486067, "epoch": 2893} {"train_loss": -12.530319213867188, "global_step": 486068, "epoch": 2893} {"train_loss": -12.818559646606445, "global_step": 486069, "epoch": 2893} {"train_loss": -12.624898910522461, "global_step": 486070, "epoch": 2893} {"train_loss": -12.518056869506836, "global_step": 486071, "epoch": 2893} {"train_loss": -12.97109317779541, "global_step": 486072, "epoch": 2893} {"train_loss": -12.524592399597168, "global_step": 486073, "epoch": 2893} {"train_loss": -12.746374130249023, "global_step": 486074, "epoch": 2893} {"train_loss": -12.713668823242188, "global_step": 486075, "epoch": 2893} {"train_loss": -12.470376014709473, "global_step": 486076, "epoch": 2893} {"train_loss": -12.811113357543945, "global_step": 486077, "epoch": 2893} {"train_loss": -12.700282096862793, "global_step": 486078, "epoch": 2893} {"train_loss": -12.463713645935059, "global_step": 486079, "epoch": 2893} {"train_loss": -12.81836223602295, "global_step": 486080, "epoch": 2893} {"train_loss": -12.522106170654297, "global_step": 486081, "epoch": 2893} {"train_loss": -12.74284839630127, "global_step": 486082, "epoch": 2893} {"train_loss": -12.673134803771973, "global_step": 486083, "epoch": 2893} {"train_loss": -12.425747871398926, "global_step": 486084, "epoch": 2893} {"train_loss": -12.497982025146484, "global_step": 486085, "epoch": 2893} {"train_loss": -12.433801651000977, "global_step": 486086, "epoch": 2893} {"train_loss": -12.38321590423584, "global_step": 486087, "epoch": 2893} {"train_loss": -12.611800193786621, "global_step": 486088, "epoch": 2893} {"train_loss": -12.601919174194336, "global_step": 486089, "epoch": 2893} {"train_loss": -12.37814712524414, "global_step": 486090, "epoch": 2893} {"train_loss": -12.67841911315918, "global_step": 486091, "epoch": 2893} {"train_loss": -12.282100677490234, "global_step": 486092, "epoch": 2893} {"train_loss": -12.642349243164062, "global_step": 486093, "epoch": 2893} {"train_loss": -12.185791015625, "global_step": 486094, "epoch": 2893} {"train_loss": -12.64155387878418, "global_step": 486095, "epoch": 2893} {"train_loss": -12.498345375061035, "global_step": 486096, "epoch": 2893} {"train_loss": -12.789690017700195, "global_step": 486097, "epoch": 2893} {"train_loss": -12.599737167358398, "global_step": 486098, "epoch": 2893} {"train_loss": -12.49814224243164, "global_step": 486099, "epoch": 2893} {"train_loss": -12.369100570678711, "global_step": 486100, "epoch": 2893} {"train_loss": -12.649491310119629, "global_step": 486101, "epoch": 2893} {"train_loss": -12.642108917236328, "global_step": 486102, "epoch": 2893} {"train_loss": -12.4196138381958, "global_step": 486103, "epoch": 2893} {"train_loss": -12.630090713500977, "global_step": 486104, "epoch": 2893} {"train_loss": -12.334063529968262, "global_step": 486105, "epoch": 2893} {"train_loss": -12.567763328552246, "global_step": 486106, "epoch": 2893} {"train_loss": -12.213693618774414, "global_step": 486107, "epoch": 2893} {"train_loss": -12.745410919189453, "global_step": 486108, "epoch": 2893} {"train_loss": -12.33584976196289, "global_step": 486109, "epoch": 2893} {"train_loss": -12.600276947021484, "global_step": 486110, "epoch": 2893} {"train_loss": -12.565160751342773, "global_step": 486111, "epoch": 2893} {"train_loss": -12.432913780212402, "global_step": 486112, "epoch": 2893} {"train_loss": -12.375557899475098, "global_step": 486113, "epoch": 2893} {"train_loss": -12.25782585144043, "global_step": 486114, "epoch": 2893} {"train_loss": -12.533523559570312, "global_step": 486115, "epoch": 2893} {"train_loss": -12.501565933227539, "global_step": 486116, "epoch": 2893} {"train_loss": -12.7191162109375, "global_step": 486117, "epoch": 2893} {"train_loss": -12.527851104736328, "global_step": 486118, "epoch": 2893} {"train_loss": -12.879324913024902, "global_step": 486119, "epoch": 2893} {"train_loss": -12.269865036010742, "global_step": 486120, "epoch": 2893} {"train_loss": -12.512651443481445, "global_step": 486121, "epoch": 2893} {"train_loss": -12.609825134277344, "global_step": 486122, "epoch": 2893} {"train_loss": -12.350950241088867, "global_step": 486123, "epoch": 2893} {"train_loss": -12.82585334777832, "global_step": 486124, "epoch": 2893} {"train_loss": -12.653600692749023, "global_step": 486125, "epoch": 2893} {"train_loss": -11.990009307861328, "global_step": 486126, "epoch": 2893} {"train_loss": -12.469340324401855, "global_step": 486127, "epoch": 2893} {"train_loss": -12.141911506652832, "global_step": 486128, "epoch": 2893} {"train_loss": -12.473419189453125, "global_step": 486129, "epoch": 2893} {"train_loss": -12.229765892028809, "global_step": 486130, "epoch": 2893} {"train_loss": -12.536741256713867, "global_step": 486131, "epoch": 2893} {"train_loss": -12.502406120300293, "global_step": 486132, "epoch": 2893} {"train_loss": -12.449588775634766, "global_step": 486133, "epoch": 2893} {"train_loss": -11.957530975341797, "global_step": 486134, "epoch": 2893} {"train_loss": -12.494392395019531, "global_step": 486135, "epoch": 2893} {"train_loss": -12.521088600158691, "global_step": 486136, "epoch": 2893} {"train_loss": -12.195209503173828, "global_step": 486137, "epoch": 2893} {"train_loss": -12.609329223632812, "global_step": 486138, "epoch": 2893} {"train_loss": -12.47210693359375, "global_step": 486139, "epoch": 2893} {"train_loss": -12.609550476074219, "global_step": 486140, "epoch": 2893} {"train_loss": -12.423749923706055, "global_step": 486141, "epoch": 2893} {"train_loss": -12.740564346313477, "global_step": 486142, "epoch": 2893} {"train_loss": -12.768083572387695, "global_step": 486143, "epoch": 2893} {"train_loss": -12.504898071289062, "global_step": 486144, "epoch": 2893} {"train_loss": -12.806309700012207, "global_step": 486145, "epoch": 2893} {"train_loss": -12.58198070526123, "global_step": 486146, "epoch": 2893} {"train_loss": -12.738161087036133, "global_step": 486147, "epoch": 2893} {"train_loss": -12.453425407409668, "global_step": 486148, "epoch": 2893} {"train_loss": -12.48156452178955, "global_step": 486149, "epoch": 2893} {"train_loss": -12.37261962890625, "global_step": 486150, "epoch": 2893} {"train_loss": -12.929250717163086, "global_step": 486151, "epoch": 2893} {"train_loss": -12.75886344909668, "global_step": 486152, "epoch": 2893} {"train_loss": -12.313151359558105, "global_step": 486153, "epoch": 2893} {"train_loss": -12.625846862792969, "global_step": 486154, "epoch": 2893} {"train_loss": -12.3666410446167, "global_step": 486155, "epoch": 2893} {"train_loss": -12.089855194091797, "global_step": 486156, "epoch": 2893} {"train_loss": -12.088523864746094, "global_step": 486157, "epoch": 2893} {"train_loss": -12.52801513671875, "global_step": 486158, "epoch": 2893} {"train_loss": -12.258691787719727, "global_step": 486159, "epoch": 2893} {"train_loss": -10.696624755859375, "global_step": 486160, "epoch": 2893} {"train_loss": -11.884166717529297, "global_step": 486161, "epoch": 2893} {"train_loss": -12.57421875, "global_step": 486162, "epoch": 2893} {"train_loss": -12.099885940551758, "global_step": 486163, "epoch": 2893} {"train_loss": -11.933387756347656, "global_step": 486164, "epoch": 2893} {"train_loss": -12.646059036254883, "global_step": 486165, "epoch": 2893} {"train_loss": -12.198633193969727, "global_step": 486166, "epoch": 2893} {"train_loss": -11.4568510055542, "global_step": 486167, "epoch": 2893} {"train_loss": -12.425056457519531, "global_step": 486168, "epoch": 2893} {"train_loss": -12.375123023986816, "global_step": 486169, "epoch": 2893} {"train_loss": -11.670546531677246, "global_step": 486170, "epoch": 2893} {"train_loss": -12.703947067260742, "global_step": 486171, "epoch": 2893} {"train_loss": -12.072532653808594, "global_step": 486172, "epoch": 2893} {"train_loss": -12.113370895385742, "global_step": 486173, "epoch": 2893} {"train_loss": -12.02165412902832, "global_step": 486174, "epoch": 2893} {"train_loss": -12.360054016113281, "global_step": 486175, "epoch": 2893} {"train_loss": -11.348455429077148, "global_step": 486176, "epoch": 2893} {"train_loss": -12.117945671081543, "global_step": 486177, "epoch": 2893} {"train_loss": -12.087276458740234, "global_step": 486178, "epoch": 2893} {"train_loss": -11.45848274230957, "global_step": 486179, "epoch": 2893} {"train_loss": -12.578526496887207, "global_step": 486180, "epoch": 2893} {"train_loss": -11.265241622924805, "global_step": 486181, "epoch": 2893} {"train_loss": -12.012417793273926, "global_step": 486182, "epoch": 2893} {"train_loss": -11.576093673706055, "global_step": 486183, "epoch": 2893} {"train_loss": -11.801824569702148, "global_step": 486184, "epoch": 2893} {"train_loss": -12.18680191040039, "global_step": 486185, "epoch": 2893} {"train_loss": -12.217706680297852, "global_step": 486186, "epoch": 2893} {"train_loss": -12.133918762207031, "global_step": 486187, "epoch": 2893} {"train_loss": -12.753175735473633, "global_step": 486188, "epoch": 2893} {"train_loss": -12.079934120178223, "global_step": 486189, "epoch": 2893} {"train_loss": -12.737449645996094, "global_step": 486190, "epoch": 2893} {"train_loss": -12.348560815765744, "global_step": 486191, "epoch": 2893, "val_loss": 314396.5625} {"train_loss": -12.689628601074219, "global_step": 486192, "epoch": 2894} {"train_loss": -12.140380859375, "global_step": 486193, "epoch": 2894} {"train_loss": -12.46210765838623, "global_step": 486194, "epoch": 2894} {"train_loss": -12.412202835083008, "global_step": 486195, "epoch": 2894} {"train_loss": -12.345169067382812, "global_step": 486196, "epoch": 2894} {"train_loss": -12.006759643554688, "global_step": 486197, "epoch": 2894} {"train_loss": -12.225305557250977, "global_step": 486198, "epoch": 2894} {"train_loss": -11.952669143676758, "global_step": 486199, "epoch": 2894} {"train_loss": -12.53038215637207, "global_step": 486200, "epoch": 2894} {"train_loss": -12.183161735534668, "global_step": 486201, "epoch": 2894} {"train_loss": -12.003471374511719, "global_step": 486202, "epoch": 2894} {"train_loss": -12.427557945251465, "global_step": 486203, "epoch": 2894} {"train_loss": -12.098206520080566, "global_step": 486204, "epoch": 2894} {"train_loss": -12.010476112365723, "global_step": 486205, "epoch": 2894} {"train_loss": -12.340253829956055, "global_step": 486206, "epoch": 2894} {"train_loss": -12.217692375183105, "global_step": 486207, "epoch": 2894} {"train_loss": -12.64639663696289, "global_step": 486208, "epoch": 2894} {"train_loss": -12.096458435058594, "global_step": 486209, "epoch": 2894} {"train_loss": -11.00253677368164, "global_step": 486210, "epoch": 2894} {"train_loss": -12.212533950805664, "global_step": 486211, "epoch": 2894} {"train_loss": -11.85940933227539, "global_step": 486212, "epoch": 2894} {"train_loss": -11.680919647216797, "global_step": 486213, "epoch": 2894} {"train_loss": -12.14569091796875, "global_step": 486214, "epoch": 2894} {"train_loss": -10.19639778137207, "global_step": 486215, "epoch": 2894} {"train_loss": -12.165081024169922, "global_step": 486216, "epoch": 2894} {"train_loss": -11.121540069580078, "global_step": 486217, "epoch": 2894} {"train_loss": -12.363139152526855, "global_step": 486218, "epoch": 2894} {"train_loss": -12.11369514465332, "global_step": 486219, "epoch": 2894} {"train_loss": -11.870128631591797, "global_step": 486220, "epoch": 2894} {"train_loss": -12.324182510375977, "global_step": 486221, "epoch": 2894} {"train_loss": -12.29149055480957, "global_step": 486222, "epoch": 2894} {"train_loss": -12.261429786682129, "global_step": 486223, "epoch": 2894} {"train_loss": -12.099438667297363, "global_step": 486224, "epoch": 2894} {"train_loss": -12.654094696044922, "global_step": 486225, "epoch": 2894} {"train_loss": -12.0488920211792, "global_step": 486226, "epoch": 2894} {"train_loss": -11.405384063720703, "global_step": 486227, "epoch": 2894} {"train_loss": -11.633054733276367, "global_step": 486228, "epoch": 2894} {"train_loss": -11.866796493530273, "global_step": 486229, "epoch": 2894} {"train_loss": -11.128375053405762, "global_step": 486230, "epoch": 2894} {"train_loss": -12.2955904006958, "global_step": 486231, "epoch": 2894} {"train_loss": -11.33182144165039, "global_step": 486232, "epoch": 2894} {"train_loss": -12.724737167358398, "global_step": 486233, "epoch": 2894} {"train_loss": -11.448246002197266, "global_step": 486234, "epoch": 2894} {"train_loss": -12.083022117614746, "global_step": 486235, "epoch": 2894} {"train_loss": -11.338703155517578, "global_step": 486236, "epoch": 2894} {"train_loss": -12.179277420043945, "global_step": 486237, "epoch": 2894} {"train_loss": -11.651949882507324, "global_step": 486238, "epoch": 2894} {"train_loss": -11.972467422485352, "global_step": 486239, "epoch": 2894} {"train_loss": -12.278890609741211, "global_step": 486240, "epoch": 2894} {"train_loss": -12.065022468566895, "global_step": 486241, "epoch": 2894} {"train_loss": -12.317672729492188, "global_step": 486242, "epoch": 2894} {"train_loss": -11.653363227844238, "global_step": 486243, "epoch": 2894} {"train_loss": -12.741727828979492, "global_step": 486244, "epoch": 2894} {"train_loss": -11.630782127380371, "global_step": 486245, "epoch": 2894} {"train_loss": -12.369308471679688, "global_step": 486246, "epoch": 2894} {"train_loss": -11.949125289916992, "global_step": 486247, "epoch": 2894} {"train_loss": -12.372241973876953, "global_step": 486248, "epoch": 2894} {"train_loss": -12.031595230102539, "global_step": 486249, "epoch": 2894} {"train_loss": -12.231338500976562, "global_step": 486250, "epoch": 2894} {"train_loss": -12.550209999084473, "global_step": 486251, "epoch": 2894} {"train_loss": -12.18585205078125, "global_step": 486252, "epoch": 2894} {"train_loss": -12.651376724243164, "global_step": 486253, "epoch": 2894} {"train_loss": -12.270066261291504, "global_step": 486254, "epoch": 2894} {"train_loss": -12.675500869750977, "global_step": 486255, "epoch": 2894} {"train_loss": -12.565519332885742, "global_step": 486256, "epoch": 2894} {"train_loss": -12.52304458618164, "global_step": 486257, "epoch": 2894} {"train_loss": -12.615035057067871, "global_step": 486258, "epoch": 2894} {"train_loss": -12.02027702331543, "global_step": 486259, "epoch": 2894} {"train_loss": -12.596213340759277, "global_step": 486260, "epoch": 2894} {"train_loss": -12.277389526367188, "global_step": 486261, "epoch": 2894} {"train_loss": -12.555861473083496, "global_step": 486262, "epoch": 2894} {"train_loss": -12.155677795410156, "global_step": 486263, "epoch": 2894} {"train_loss": -12.523740768432617, "global_step": 486264, "epoch": 2894} {"train_loss": -12.581613540649414, "global_step": 486265, "epoch": 2894} {"train_loss": -12.393566131591797, "global_step": 486266, "epoch": 2894} {"train_loss": -12.281217575073242, "global_step": 486267, "epoch": 2894} {"train_loss": -11.931654930114746, "global_step": 486268, "epoch": 2894} {"train_loss": -12.131836891174316, "global_step": 486269, "epoch": 2894} {"train_loss": -11.923994064331055, "global_step": 486270, "epoch": 2894} {"train_loss": -11.747962951660156, "global_step": 486271, "epoch": 2894} {"train_loss": -12.30492877960205, "global_step": 486272, "epoch": 2894} {"train_loss": -11.580846786499023, "global_step": 486273, "epoch": 2894} {"train_loss": -12.692413330078125, "global_step": 486274, "epoch": 2894} {"train_loss": -11.90884780883789, "global_step": 486275, "epoch": 2894} {"train_loss": -12.650197982788086, "global_step": 486276, "epoch": 2894} {"train_loss": -12.207595825195312, "global_step": 486277, "epoch": 2894} {"train_loss": -12.368048667907715, "global_step": 486278, "epoch": 2894} {"train_loss": -12.471139907836914, "global_step": 486279, "epoch": 2894} {"train_loss": -12.239114761352539, "global_step": 486280, "epoch": 2894} {"train_loss": -12.37662410736084, "global_step": 486281, "epoch": 2894} {"train_loss": -12.409379959106445, "global_step": 486282, "epoch": 2894} {"train_loss": -12.231084823608398, "global_step": 486283, "epoch": 2894} {"train_loss": -12.579233169555664, "global_step": 486284, "epoch": 2894} {"train_loss": -12.56359577178955, "global_step": 486285, "epoch": 2894} {"train_loss": -12.508841514587402, "global_step": 486286, "epoch": 2894} {"train_loss": -12.585241317749023, "global_step": 486287, "epoch": 2894} {"train_loss": -12.507343292236328, "global_step": 486288, "epoch": 2894} {"train_loss": -12.79796314239502, "global_step": 486289, "epoch": 2894} {"train_loss": -12.580944061279297, "global_step": 486290, "epoch": 2894} {"train_loss": -12.885351181030273, "global_step": 486291, "epoch": 2894} {"train_loss": -12.744071006774902, "global_step": 486292, "epoch": 2894} {"train_loss": -12.60053825378418, "global_step": 486293, "epoch": 2894} {"train_loss": -12.86844253540039, "global_step": 486294, "epoch": 2894} {"train_loss": -12.77646541595459, "global_step": 486295, "epoch": 2894} {"train_loss": -12.875102043151855, "global_step": 486296, "epoch": 2894} {"train_loss": -12.303961753845215, "global_step": 486297, "epoch": 2894} {"train_loss": -12.637300491333008, "global_step": 486298, "epoch": 2894} {"train_loss": -12.480401992797852, "global_step": 486299, "epoch": 2894} {"train_loss": -12.273200988769531, "global_step": 486300, "epoch": 2894} {"train_loss": -12.371600151062012, "global_step": 486301, "epoch": 2894} {"train_loss": -12.108551025390625, "global_step": 486302, "epoch": 2894} {"train_loss": -12.105433464050293, "global_step": 486303, "epoch": 2894} {"train_loss": -11.994434356689453, "global_step": 486304, "epoch": 2894} {"train_loss": -12.129015922546387, "global_step": 486305, "epoch": 2894} {"train_loss": -12.060400009155273, "global_step": 486306, "epoch": 2894} {"train_loss": -12.365392684936523, "global_step": 486307, "epoch": 2894} {"train_loss": -11.937467575073242, "global_step": 486308, "epoch": 2894} {"train_loss": -12.135416030883789, "global_step": 486309, "epoch": 2894} {"train_loss": -12.032981872558594, "global_step": 486310, "epoch": 2894} {"train_loss": -12.679534912109375, "global_step": 486311, "epoch": 2894} {"train_loss": -12.253551483154297, "global_step": 486312, "epoch": 2894} {"train_loss": -12.29435920715332, "global_step": 486313, "epoch": 2894} {"train_loss": -12.366996765136719, "global_step": 486314, "epoch": 2894} {"train_loss": -12.298579216003418, "global_step": 486315, "epoch": 2894} {"train_loss": -12.635393142700195, "global_step": 486316, "epoch": 2894} {"train_loss": -12.485614776611328, "global_step": 486317, "epoch": 2894} {"train_loss": -12.638679504394531, "global_step": 486318, "epoch": 2894} {"train_loss": -12.593286514282227, "global_step": 486319, "epoch": 2894} {"train_loss": -12.392677307128906, "global_step": 486320, "epoch": 2894} {"train_loss": -12.692285537719727, "global_step": 486321, "epoch": 2894} {"train_loss": -12.851290702819824, "global_step": 486322, "epoch": 2894} {"train_loss": -12.42909049987793, "global_step": 486323, "epoch": 2894} {"train_loss": -12.749441146850586, "global_step": 486324, "epoch": 2894} {"train_loss": -12.75398063659668, "global_step": 486325, "epoch": 2894} {"train_loss": -12.368326187133789, "global_step": 486326, "epoch": 2894} {"train_loss": -12.757468223571777, "global_step": 486327, "epoch": 2894} {"train_loss": -12.605252265930176, "global_step": 486328, "epoch": 2894} {"train_loss": -12.500953674316406, "global_step": 486329, "epoch": 2894} {"train_loss": -12.709539413452148, "global_step": 486330, "epoch": 2894} {"train_loss": -12.70001220703125, "global_step": 486331, "epoch": 2894} {"train_loss": -12.647427558898926, "global_step": 486332, "epoch": 2894} {"train_loss": -12.509316444396973, "global_step": 486333, "epoch": 2894} {"train_loss": -12.871465682983398, "global_step": 486334, "epoch": 2894} {"train_loss": -12.959890365600586, "global_step": 486335, "epoch": 2894} {"train_loss": -12.832939147949219, "global_step": 486336, "epoch": 2894} {"train_loss": -12.946447372436523, "global_step": 486337, "epoch": 2894} {"train_loss": -12.446962356567383, "global_step": 486338, "epoch": 2894} {"train_loss": -12.642943382263184, "global_step": 486339, "epoch": 2894} {"train_loss": -12.4599609375, "global_step": 486340, "epoch": 2894} {"train_loss": -12.774223327636719, "global_step": 486341, "epoch": 2894} {"train_loss": -12.543401718139648, "global_step": 486342, "epoch": 2894} {"train_loss": -12.614988327026367, "global_step": 486343, "epoch": 2894} {"train_loss": -12.774666786193848, "global_step": 486344, "epoch": 2894} {"train_loss": -12.89289379119873, "global_step": 486345, "epoch": 2894} {"train_loss": -12.755218505859375, "global_step": 486346, "epoch": 2894} {"train_loss": -12.871837615966797, "global_step": 486347, "epoch": 2894} {"train_loss": -12.527399063110352, "global_step": 486348, "epoch": 2894} {"train_loss": -12.322895050048828, "global_step": 486349, "epoch": 2894} {"train_loss": -12.731789588928223, "global_step": 486350, "epoch": 2894} {"train_loss": -12.847467422485352, "global_step": 486351, "epoch": 2894} {"train_loss": -12.466856002807617, "global_step": 486352, "epoch": 2894} {"train_loss": -12.633275032043457, "global_step": 486353, "epoch": 2894} {"train_loss": -12.593877792358398, "global_step": 486354, "epoch": 2894} {"train_loss": -12.41247844696045, "global_step": 486355, "epoch": 2894} {"train_loss": -12.647711753845215, "global_step": 486356, "epoch": 2894} {"train_loss": -12.647711753845215, "global_step": 486357, "epoch": 2894} {"train_loss": -12.556951522827148, "global_step": 486358, "epoch": 2894} {"train_loss": -12.324714030538287, "global_step": 486359, "epoch": 2894, "val_loss": 314663.40625} {"train_loss": -12.635493278503418, "global_step": 486360, "epoch": 2895} {"train_loss": -12.77424430847168, "global_step": 486361, "epoch": 2895} {"train_loss": -12.633232116699219, "global_step": 486362, "epoch": 2895} {"train_loss": -12.933404922485352, "global_step": 486363, "epoch": 2895} {"train_loss": -12.715093612670898, "global_step": 486364, "epoch": 2895} {"train_loss": -12.606316566467285, "global_step": 486365, "epoch": 2895} {"train_loss": -12.57708740234375, "global_step": 486366, "epoch": 2895} {"train_loss": -12.608346939086914, "global_step": 486367, "epoch": 2895} {"train_loss": -12.773062705993652, "global_step": 486368, "epoch": 2895} {"train_loss": -12.576773643493652, "global_step": 486369, "epoch": 2895} {"train_loss": -12.49005126953125, "global_step": 486370, "epoch": 2895} {"train_loss": -12.355414390563965, "global_step": 486371, "epoch": 2895} {"train_loss": -12.667740821838379, "global_step": 486372, "epoch": 2895} {"train_loss": -12.557082176208496, "global_step": 486373, "epoch": 2895} {"train_loss": -12.003535270690918, "global_step": 486374, "epoch": 2895} {"train_loss": -12.75926399230957, "global_step": 486375, "epoch": 2895} {"train_loss": -12.41416072845459, "global_step": 486376, "epoch": 2895} {"train_loss": -12.30671215057373, "global_step": 486377, "epoch": 2895} {"train_loss": -12.661581993103027, "global_step": 486378, "epoch": 2895} {"train_loss": -12.560380935668945, "global_step": 486379, "epoch": 2895} {"train_loss": -11.877191543579102, "global_step": 486380, "epoch": 2895} {"train_loss": -12.256269454956055, "global_step": 486381, "epoch": 2895} {"train_loss": -12.466033935546875, "global_step": 486382, "epoch": 2895} {"train_loss": -12.007349967956543, "global_step": 486383, "epoch": 2895} {"train_loss": -12.556623458862305, "global_step": 486384, "epoch": 2895} {"train_loss": -11.821648597717285, "global_step": 486385, "epoch": 2895} {"train_loss": -12.86136245727539, "global_step": 486386, "epoch": 2895} {"train_loss": -11.63705825805664, "global_step": 486387, "epoch": 2895} {"train_loss": -11.21070384979248, "global_step": 486388, "epoch": 2895} {"train_loss": -11.798948287963867, "global_step": 486389, "epoch": 2895} {"train_loss": -12.141143798828125, "global_step": 486390, "epoch": 2895} {"train_loss": -10.8182373046875, "global_step": 486391, "epoch": 2895} {"train_loss": -11.426864624023438, "global_step": 486392, "epoch": 2895} {"train_loss": -11.273382186889648, "global_step": 486393, "epoch": 2895} {"train_loss": -10.328872680664062, "global_step": 486394, "epoch": 2895} {"train_loss": -12.041420936584473, "global_step": 486395, "epoch": 2895} {"train_loss": -10.769474029541016, "global_step": 486396, "epoch": 2895} {"train_loss": -11.454705238342285, "global_step": 486397, "epoch": 2895} {"train_loss": -10.08993148803711, "global_step": 486398, "epoch": 2895} {"train_loss": -11.298930168151855, "global_step": 486399, "epoch": 2895} {"train_loss": -11.06679916381836, "global_step": 486400, "epoch": 2895} {"train_loss": -10.405517578125, "global_step": 486401, "epoch": 2895} {"train_loss": -10.333242416381836, "global_step": 486402, "epoch": 2895} {"train_loss": -10.780771255493164, "global_step": 486403, "epoch": 2895} {"train_loss": -11.02623176574707, "global_step": 486404, "epoch": 2895} {"train_loss": -10.119418144226074, "global_step": 486405, "epoch": 2895} {"train_loss": -11.114473342895508, "global_step": 486406, "epoch": 2895} {"train_loss": -11.295388221740723, "global_step": 486407, "epoch": 2895} {"train_loss": -11.204309463500977, "global_step": 486408, "epoch": 2895} {"train_loss": -11.522602081298828, "global_step": 486409, "epoch": 2895} {"train_loss": -12.02491283416748, "global_step": 486410, "epoch": 2895} {"train_loss": -11.740222930908203, "global_step": 486411, "epoch": 2895} {"train_loss": -11.75818920135498, "global_step": 486412, "epoch": 2895} {"train_loss": -10.168537139892578, "global_step": 486413, "epoch": 2895} {"train_loss": -10.485271453857422, "global_step": 486414, "epoch": 2895} {"train_loss": -12.084716796875, "global_step": 486415, "epoch": 2895} {"train_loss": -10.81640625, "global_step": 486416, "epoch": 2895} {"train_loss": -11.400861740112305, "global_step": 486417, "epoch": 2895} {"train_loss": -11.22738265991211, "global_step": 486418, "epoch": 2895} {"train_loss": -11.3887300491333, "global_step": 486419, "epoch": 2895} {"train_loss": -12.288829803466797, "global_step": 486420, "epoch": 2895} {"train_loss": -11.534528732299805, "global_step": 486421, "epoch": 2895} {"train_loss": -11.850820541381836, "global_step": 486422, "epoch": 2895} {"train_loss": -12.259467124938965, "global_step": 486423, "epoch": 2895} {"train_loss": -11.680347442626953, "global_step": 486424, "epoch": 2895} {"train_loss": -12.150106430053711, "global_step": 486425, "epoch": 2895} {"train_loss": -11.776599884033203, "global_step": 486426, "epoch": 2895} {"train_loss": -11.39937973022461, "global_step": 486427, "epoch": 2895} {"train_loss": -11.185903549194336, "global_step": 486428, "epoch": 2895} {"train_loss": -11.736319541931152, "global_step": 486429, "epoch": 2895} {"train_loss": -11.579668045043945, "global_step": 486430, "epoch": 2895} {"train_loss": -11.76752758026123, "global_step": 486431, "epoch": 2895} {"train_loss": -12.021435737609863, "global_step": 486432, "epoch": 2895} {"train_loss": -11.959428787231445, "global_step": 486433, "epoch": 2895} {"train_loss": -12.028013229370117, "global_step": 486434, "epoch": 2895} {"train_loss": -11.436393737792969, "global_step": 486435, "epoch": 2895} {"train_loss": -11.661304473876953, "global_step": 486436, "epoch": 2895} {"train_loss": -12.174789428710938, "global_step": 486437, "epoch": 2895} {"train_loss": -11.531842231750488, "global_step": 486438, "epoch": 2895} {"train_loss": -11.62738037109375, "global_step": 486439, "epoch": 2895} {"train_loss": -11.899242401123047, "global_step": 486440, "epoch": 2895} {"train_loss": -11.723358154296875, "global_step": 486441, "epoch": 2895} {"train_loss": -11.644465446472168, "global_step": 486442, "epoch": 2895} {"train_loss": -12.192998886108398, "global_step": 486443, "epoch": 2895} {"train_loss": -11.497110366821289, "global_step": 486444, "epoch": 2895} {"train_loss": -12.038583755493164, "global_step": 486445, "epoch": 2895} {"train_loss": -11.887699127197266, "global_step": 486446, "epoch": 2895} {"train_loss": -11.187686920166016, "global_step": 486447, "epoch": 2895} {"train_loss": -12.16758918762207, "global_step": 486448, "epoch": 2895} {"train_loss": -11.943739891052246, "global_step": 486449, "epoch": 2895} {"train_loss": -11.899568557739258, "global_step": 486450, "epoch": 2895} {"train_loss": -12.386730194091797, "global_step": 486451, "epoch": 2895} {"train_loss": -11.32605266571045, "global_step": 486452, "epoch": 2895} {"train_loss": -12.265353202819824, "global_step": 486453, "epoch": 2895} {"train_loss": -11.942798614501953, "global_step": 486454, "epoch": 2895} {"train_loss": -11.69471549987793, "global_step": 486455, "epoch": 2895} {"train_loss": -12.268688201904297, "global_step": 486456, "epoch": 2895} {"train_loss": -11.605792999267578, "global_step": 486457, "epoch": 2895} {"train_loss": -11.402345657348633, "global_step": 486458, "epoch": 2895} {"train_loss": -11.834434509277344, "global_step": 486459, "epoch": 2895} {"train_loss": -11.392176628112793, "global_step": 486460, "epoch": 2895} {"train_loss": -11.896209716796875, "global_step": 486461, "epoch": 2895} {"train_loss": -11.880260467529297, "global_step": 486462, "epoch": 2895} {"train_loss": -12.192845344543457, "global_step": 486463, "epoch": 2895} {"train_loss": -11.636438369750977, "global_step": 486464, "epoch": 2895} {"train_loss": -12.386475563049316, "global_step": 486465, "epoch": 2895} {"train_loss": -11.648414611816406, "global_step": 486466, "epoch": 2895} {"train_loss": -12.225194931030273, "global_step": 486467, "epoch": 2895} {"train_loss": -12.200103759765625, "global_step": 486468, "epoch": 2895} {"train_loss": -12.272134780883789, "global_step": 486469, "epoch": 2895} {"train_loss": -12.379270553588867, "global_step": 486470, "epoch": 2895} {"train_loss": -12.468496322631836, "global_step": 486471, "epoch": 2895} {"train_loss": -12.04311466217041, "global_step": 486472, "epoch": 2895} {"train_loss": -12.593088150024414, "global_step": 486473, "epoch": 2895} {"train_loss": -12.386117935180664, "global_step": 486474, "epoch": 2895} {"train_loss": -12.432480812072754, "global_step": 486475, "epoch": 2895} {"train_loss": -12.605010032653809, "global_step": 486476, "epoch": 2895} {"train_loss": -12.636796951293945, "global_step": 486477, "epoch": 2895} {"train_loss": -12.465341567993164, "global_step": 486478, "epoch": 2895} {"train_loss": -12.508119583129883, "global_step": 486479, "epoch": 2895} {"train_loss": -12.69642162322998, "global_step": 486480, "epoch": 2895} {"train_loss": -12.560346603393555, "global_step": 486481, "epoch": 2895} {"train_loss": -12.612106323242188, "global_step": 486482, "epoch": 2895} {"train_loss": -12.719578742980957, "global_step": 486483, "epoch": 2895} {"train_loss": -12.714954376220703, "global_step": 486484, "epoch": 2895} {"train_loss": -12.743467330932617, "global_step": 486485, "epoch": 2895} {"train_loss": -12.545904159545898, "global_step": 486486, "epoch": 2895} {"train_loss": -12.628832817077637, "global_step": 486487, "epoch": 2895} {"train_loss": -12.622846603393555, "global_step": 486488, "epoch": 2895} {"train_loss": -12.451042175292969, "global_step": 486489, "epoch": 2895} {"train_loss": -12.632364273071289, "global_step": 486490, "epoch": 2895} {"train_loss": -12.40931510925293, "global_step": 486491, "epoch": 2895} {"train_loss": -12.441939353942871, "global_step": 486492, "epoch": 2895} {"train_loss": -12.372034072875977, "global_step": 486493, "epoch": 2895} {"train_loss": -12.209249496459961, "global_step": 486494, "epoch": 2895} {"train_loss": -12.773370742797852, "global_step": 486495, "epoch": 2895} {"train_loss": -12.397308349609375, "global_step": 486496, "epoch": 2895} {"train_loss": -12.573822975158691, "global_step": 486497, "epoch": 2895} {"train_loss": -12.736498832702637, "global_step": 486498, "epoch": 2895} {"train_loss": -12.492268562316895, "global_step": 486499, "epoch": 2895} {"train_loss": -12.803547859191895, "global_step": 486500, "epoch": 2895} {"train_loss": -12.436820030212402, "global_step": 486501, "epoch": 2895} {"train_loss": -12.71894359588623, "global_step": 486502, "epoch": 2895} {"train_loss": -12.661877632141113, "global_step": 486503, "epoch": 2895} {"train_loss": -12.687606811523438, "global_step": 486504, "epoch": 2895} {"train_loss": -12.51136589050293, "global_step": 486505, "epoch": 2895} {"train_loss": -12.693470001220703, "global_step": 486506, "epoch": 2895} {"train_loss": -12.594651222229004, "global_step": 486507, "epoch": 2895} {"train_loss": -12.28116226196289, "global_step": 486508, "epoch": 2895} {"train_loss": -12.686399459838867, "global_step": 486509, "epoch": 2895} {"train_loss": -12.617463111877441, "global_step": 486510, "epoch": 2895} {"train_loss": -12.599132537841797, "global_step": 486511, "epoch": 2895} {"train_loss": -12.805315017700195, "global_step": 486512, "epoch": 2895} {"train_loss": -12.511146545410156, "global_step": 486513, "epoch": 2895} {"train_loss": -12.544445991516113, "global_step": 486514, "epoch": 2895} {"train_loss": -12.821246147155762, "global_step": 486515, "epoch": 2895} {"train_loss": -12.831222534179688, "global_step": 486516, "epoch": 2895} {"train_loss": -12.747842788696289, "global_step": 486517, "epoch": 2895} {"train_loss": -12.601421356201172, "global_step": 486518, "epoch": 2895} {"train_loss": -12.759376525878906, "global_step": 486519, "epoch": 2895} {"train_loss": -12.997227668762207, "global_step": 486520, "epoch": 2895} {"train_loss": -12.87814712524414, "global_step": 486521, "epoch": 2895} {"train_loss": -12.944931983947754, "global_step": 486522, "epoch": 2895} {"train_loss": -12.842591285705566, "global_step": 486523, "epoch": 2895} {"train_loss": -12.8714599609375, "global_step": 486524, "epoch": 2895} {"train_loss": -12.699790000915527, "global_step": 486525, "epoch": 2895} {"train_loss": -12.666119575500488, "global_step": 486526, "epoch": 2895} {"train_loss": -12.078904651460194, "global_step": 486527, "epoch": 2895, "val_loss": 317314.8125, "train_action_mse_error": 1.479439377784729} {"train_loss": -12.609761238098145, "global_step": 486528, "epoch": 2896} {"train_loss": -12.69842529296875, "global_step": 486529, "epoch": 2896} {"train_loss": -12.50928783416748, "global_step": 486530, "epoch": 2896} {"train_loss": -11.765634536743164, "global_step": 486531, "epoch": 2896} {"train_loss": -12.562251091003418, "global_step": 486532, "epoch": 2896} {"train_loss": -11.796332359313965, "global_step": 486533, "epoch": 2896} {"train_loss": -12.489599227905273, "global_step": 486534, "epoch": 2896} {"train_loss": -12.078165054321289, "global_step": 486535, "epoch": 2896} {"train_loss": -11.862776756286621, "global_step": 486536, "epoch": 2896} {"train_loss": -12.720254898071289, "global_step": 486537, "epoch": 2896} {"train_loss": -12.125770568847656, "global_step": 486538, "epoch": 2896} {"train_loss": -11.542610168457031, "global_step": 486539, "epoch": 2896} {"train_loss": -12.75991153717041, "global_step": 486540, "epoch": 2896} {"train_loss": -11.747005462646484, "global_step": 486541, "epoch": 2896} {"train_loss": -12.38558578491211, "global_step": 486542, "epoch": 2896} {"train_loss": -12.487833976745605, "global_step": 486543, "epoch": 2896} {"train_loss": -12.07809829711914, "global_step": 486544, "epoch": 2896} {"train_loss": -11.254871368408203, "global_step": 486545, "epoch": 2896} {"train_loss": -12.598020553588867, "global_step": 486546, "epoch": 2896} {"train_loss": -10.948270797729492, "global_step": 486547, "epoch": 2896} {"train_loss": -12.065932273864746, "global_step": 486548, "epoch": 2896} {"train_loss": -12.03317928314209, "global_step": 486549, "epoch": 2896} {"train_loss": -11.518110275268555, "global_step": 486550, "epoch": 2896} {"train_loss": -12.657422065734863, "global_step": 486551, "epoch": 2896} {"train_loss": -12.380929946899414, "global_step": 486552, "epoch": 2896} {"train_loss": -12.662860870361328, "global_step": 486553, "epoch": 2896} {"train_loss": -12.48182487487793, "global_step": 486554, "epoch": 2896} {"train_loss": -12.584982872009277, "global_step": 486555, "epoch": 2896} {"train_loss": -12.112997055053711, "global_step": 486556, "epoch": 2896} {"train_loss": -12.725811004638672, "global_step": 486557, "epoch": 2896} {"train_loss": -11.933053970336914, "global_step": 486558, "epoch": 2896} {"train_loss": -12.594827651977539, "global_step": 486559, "epoch": 2896} {"train_loss": -11.706555366516113, "global_step": 486560, "epoch": 2896} {"train_loss": -12.766594886779785, "global_step": 486561, "epoch": 2896} {"train_loss": -11.453584671020508, "global_step": 486562, "epoch": 2896} {"train_loss": -11.902804374694824, "global_step": 486563, "epoch": 2896} {"train_loss": -12.108036041259766, "global_step": 486564, "epoch": 2896} {"train_loss": -10.010003089904785, "global_step": 486565, "epoch": 2896} {"train_loss": -12.58891487121582, "global_step": 486566, "epoch": 2896} {"train_loss": -10.431732177734375, "global_step": 486567, "epoch": 2896} {"train_loss": -12.455123901367188, "global_step": 486568, "epoch": 2896} {"train_loss": -10.74637222290039, "global_step": 486569, "epoch": 2896} {"train_loss": -12.336095809936523, "global_step": 486570, "epoch": 2896} {"train_loss": -11.065267562866211, "global_step": 486571, "epoch": 2896} {"train_loss": -12.41483211517334, "global_step": 486572, "epoch": 2896} {"train_loss": -11.752464294433594, "global_step": 486573, "epoch": 2896} {"train_loss": -11.94461727142334, "global_step": 486574, "epoch": 2896} {"train_loss": -12.08934211730957, "global_step": 486575, "epoch": 2896} {"train_loss": -12.033099174499512, "global_step": 486576, "epoch": 2896} {"train_loss": -12.297677040100098, "global_step": 486577, "epoch": 2896} {"train_loss": -11.89057731628418, "global_step": 486578, "epoch": 2896} {"train_loss": -12.426942825317383, "global_step": 486579, "epoch": 2896} {"train_loss": -11.528532028198242, "global_step": 486580, "epoch": 2896} {"train_loss": -12.378116607666016, "global_step": 486581, "epoch": 2896} {"train_loss": -12.100459098815918, "global_step": 486582, "epoch": 2896} {"train_loss": -12.282173156738281, "global_step": 486583, "epoch": 2896} {"train_loss": -12.21738338470459, "global_step": 486584, "epoch": 2896} {"train_loss": -12.173257827758789, "global_step": 486585, "epoch": 2896} {"train_loss": -12.14181137084961, "global_step": 486586, "epoch": 2896} {"train_loss": -12.029657363891602, "global_step": 486587, "epoch": 2896} {"train_loss": -12.478584289550781, "global_step": 486588, "epoch": 2896} {"train_loss": -12.196270942687988, "global_step": 486589, "epoch": 2896} {"train_loss": -12.626482009887695, "global_step": 486590, "epoch": 2896} {"train_loss": -11.323564529418945, "global_step": 486591, "epoch": 2896} {"train_loss": -12.093653678894043, "global_step": 486592, "epoch": 2896} {"train_loss": -11.857151985168457, "global_step": 486593, "epoch": 2896} {"train_loss": -11.975101470947266, "global_step": 486594, "epoch": 2896} {"train_loss": -12.631404876708984, "global_step": 486595, "epoch": 2896} {"train_loss": -12.060050964355469, "global_step": 486596, "epoch": 2896} {"train_loss": -12.69240665435791, "global_step": 486597, "epoch": 2896} {"train_loss": -12.02554702758789, "global_step": 486598, "epoch": 2896} {"train_loss": -12.829265594482422, "global_step": 486599, "epoch": 2896} {"train_loss": -12.394363403320312, "global_step": 486600, "epoch": 2896} {"train_loss": -12.367120742797852, "global_step": 486601, "epoch": 2896} {"train_loss": -12.57111930847168, "global_step": 486602, "epoch": 2896} {"train_loss": -12.19556999206543, "global_step": 486603, "epoch": 2896} {"train_loss": -12.787949562072754, "global_step": 486604, "epoch": 2896} {"train_loss": -12.674036026000977, "global_step": 486605, "epoch": 2896} {"train_loss": -12.493850708007812, "global_step": 486606, "epoch": 2896} {"train_loss": -12.658723831176758, "global_step": 486607, "epoch": 2896} {"train_loss": -12.298643112182617, "global_step": 486608, "epoch": 2896} {"train_loss": -12.548715591430664, "global_step": 486609, "epoch": 2896} {"train_loss": -12.31376838684082, "global_step": 486610, "epoch": 2896} {"train_loss": -12.480622291564941, "global_step": 486611, "epoch": 2896} {"train_loss": -12.723005294799805, "global_step": 486612, "epoch": 2896} {"train_loss": -12.240865707397461, "global_step": 486613, "epoch": 2896} {"train_loss": -12.738618850708008, "global_step": 486614, "epoch": 2896} {"train_loss": -11.875242233276367, "global_step": 486615, "epoch": 2896} {"train_loss": -12.396677017211914, "global_step": 486616, "epoch": 2896} {"train_loss": -12.420997619628906, "global_step": 486617, "epoch": 2896} {"train_loss": -12.568495750427246, "global_step": 486618, "epoch": 2896} {"train_loss": -12.537842750549316, "global_step": 486619, "epoch": 2896} {"train_loss": -12.55102825164795, "global_step": 486620, "epoch": 2896} {"train_loss": -12.563249588012695, "global_step": 486621, "epoch": 2896} {"train_loss": -12.489375114440918, "global_step": 486622, "epoch": 2896} {"train_loss": -12.622787475585938, "global_step": 486623, "epoch": 2896} {"train_loss": -12.63101577758789, "global_step": 486624, "epoch": 2896} {"train_loss": -12.287137985229492, "global_step": 486625, "epoch": 2896} {"train_loss": -12.73110580444336, "global_step": 486626, "epoch": 2896} {"train_loss": -12.61834716796875, "global_step": 486627, "epoch": 2896} {"train_loss": -12.465864181518555, "global_step": 486628, "epoch": 2896} {"train_loss": -12.72207260131836, "global_step": 486629, "epoch": 2896} {"train_loss": -12.638208389282227, "global_step": 486630, "epoch": 2896} {"train_loss": -12.593280792236328, "global_step": 486631, "epoch": 2896} {"train_loss": -12.54726791381836, "global_step": 486632, "epoch": 2896} {"train_loss": -12.914958000183105, "global_step": 486633, "epoch": 2896} {"train_loss": -12.661818504333496, "global_step": 486634, "epoch": 2896} {"train_loss": -12.699175834655762, "global_step": 486635, "epoch": 2896} {"train_loss": -12.737022399902344, "global_step": 486636, "epoch": 2896} {"train_loss": -12.89913558959961, "global_step": 486637, "epoch": 2896} {"train_loss": -12.989893913269043, "global_step": 486638, "epoch": 2896} {"train_loss": -12.895801544189453, "global_step": 486639, "epoch": 2896} {"train_loss": -12.734339714050293, "global_step": 486640, "epoch": 2896} {"train_loss": -12.646469116210938, "global_step": 486641, "epoch": 2896} {"train_loss": -12.89793872833252, "global_step": 486642, "epoch": 2896} {"train_loss": -12.576695442199707, "global_step": 486643, "epoch": 2896} {"train_loss": -12.69377326965332, "global_step": 486644, "epoch": 2896} {"train_loss": -12.37454605102539, "global_step": 486645, "epoch": 2896} {"train_loss": -12.813089370727539, "global_step": 486646, "epoch": 2896} {"train_loss": -11.962578773498535, "global_step": 486647, "epoch": 2896} {"train_loss": -12.148234367370605, "global_step": 486648, "epoch": 2896} {"train_loss": -12.683004379272461, "global_step": 486649, "epoch": 2896} {"train_loss": -12.507028579711914, "global_step": 486650, "epoch": 2896} {"train_loss": -12.475020408630371, "global_step": 486651, "epoch": 2896} {"train_loss": -12.831371307373047, "global_step": 486652, "epoch": 2896} {"train_loss": -12.317346572875977, "global_step": 486653, "epoch": 2896} {"train_loss": -12.589241027832031, "global_step": 486654, "epoch": 2896} {"train_loss": -12.502054214477539, "global_step": 486655, "epoch": 2896} {"train_loss": -11.827103614807129, "global_step": 486656, "epoch": 2896} {"train_loss": -12.325902938842773, "global_step": 486657, "epoch": 2896} {"train_loss": -12.829259872436523, "global_step": 486658, "epoch": 2896} {"train_loss": -12.374746322631836, "global_step": 486659, "epoch": 2896} {"train_loss": -12.13300609588623, "global_step": 486660, "epoch": 2896} {"train_loss": -12.902101516723633, "global_step": 486661, "epoch": 2896} {"train_loss": -12.559080123901367, "global_step": 486662, "epoch": 2896} {"train_loss": -12.100114822387695, "global_step": 486663, "epoch": 2896} {"train_loss": -12.198951721191406, "global_step": 486664, "epoch": 2896} {"train_loss": -10.51666259765625, "global_step": 486665, "epoch": 2896} {"train_loss": -12.348133087158203, "global_step": 486666, "epoch": 2896} {"train_loss": -12.24001693725586, "global_step": 486667, "epoch": 2896} {"train_loss": -11.183605194091797, "global_step": 486668, "epoch": 2896} {"train_loss": -12.076587677001953, "global_step": 486669, "epoch": 2896} {"train_loss": -11.89256763458252, "global_step": 486670, "epoch": 2896} {"train_loss": -12.355307579040527, "global_step": 486671, "epoch": 2896} {"train_loss": -12.42840576171875, "global_step": 486672, "epoch": 2896} {"train_loss": -11.387004852294922, "global_step": 486673, "epoch": 2896} {"train_loss": -11.94577407836914, "global_step": 486674, "epoch": 2896} {"train_loss": -10.588793754577637, "global_step": 486675, "epoch": 2896} {"train_loss": -11.61854362487793, "global_step": 486676, "epoch": 2896} {"train_loss": -11.857683181762695, "global_step": 486677, "epoch": 2896} {"train_loss": -10.840604782104492, "global_step": 486678, "epoch": 2896} {"train_loss": -12.178169250488281, "global_step": 486679, "epoch": 2896} {"train_loss": -11.530449867248535, "global_step": 486680, "epoch": 2896} {"train_loss": -12.090656280517578, "global_step": 486681, "epoch": 2896} {"train_loss": -11.012529373168945, "global_step": 486682, "epoch": 2896} {"train_loss": -12.123825073242188, "global_step": 486683, "epoch": 2896} {"train_loss": -11.642993927001953, "global_step": 486684, "epoch": 2896} {"train_loss": -12.25253677368164, "global_step": 486685, "epoch": 2896} {"train_loss": -12.552050590515137, "global_step": 486686, "epoch": 2896} {"train_loss": -12.138446807861328, "global_step": 486687, "epoch": 2896} {"train_loss": -12.386770248413086, "global_step": 486688, "epoch": 2896} {"train_loss": -11.982780456542969, "global_step": 486689, "epoch": 2896} {"train_loss": -12.645633697509766, "global_step": 486690, "epoch": 2896} {"train_loss": -12.052976608276367, "global_step": 486691, "epoch": 2896} {"train_loss": -12.452836990356445, "global_step": 486692, "epoch": 2896} {"train_loss": -12.6541109085083, "global_step": 486693, "epoch": 2896} {"train_loss": -12.41497802734375, "global_step": 486694, "epoch": 2896} {"train_loss": -12.235244989395142, "global_step": 486695, "epoch": 2896, "val_loss": 319896.34375} {"train_loss": -12.574613571166992, "global_step": 486696, "epoch": 2897} {"train_loss": -12.44644546508789, "global_step": 486697, "epoch": 2897} {"train_loss": -12.23206615447998, "global_step": 486698, "epoch": 2897} {"train_loss": -12.632010459899902, "global_step": 486699, "epoch": 2897} {"train_loss": -12.462557792663574, "global_step": 486700, "epoch": 2897} {"train_loss": -12.669831275939941, "global_step": 486701, "epoch": 2897} {"train_loss": -12.266199111938477, "global_step": 486702, "epoch": 2897} {"train_loss": -12.769506454467773, "global_step": 486703, "epoch": 2897} {"train_loss": -12.361135482788086, "global_step": 486704, "epoch": 2897} {"train_loss": -12.629383087158203, "global_step": 486705, "epoch": 2897} {"train_loss": -12.571182250976562, "global_step": 486706, "epoch": 2897} {"train_loss": -12.57940673828125, "global_step": 486707, "epoch": 2897} {"train_loss": -12.647268295288086, "global_step": 486708, "epoch": 2897} {"train_loss": -12.535436630249023, "global_step": 486709, "epoch": 2897} {"train_loss": -12.67971134185791, "global_step": 486710, "epoch": 2897} {"train_loss": -12.700350761413574, "global_step": 486711, "epoch": 2897} {"train_loss": -12.815818786621094, "global_step": 486712, "epoch": 2897} {"train_loss": -12.585268020629883, "global_step": 486713, "epoch": 2897} {"train_loss": -12.492050170898438, "global_step": 486714, "epoch": 2897} {"train_loss": -12.721063613891602, "global_step": 486715, "epoch": 2897} {"train_loss": -12.98709487915039, "global_step": 486716, "epoch": 2897} {"train_loss": -12.351829528808594, "global_step": 486717, "epoch": 2897} {"train_loss": -12.885343551635742, "global_step": 486718, "epoch": 2897} {"train_loss": -12.837404251098633, "global_step": 486719, "epoch": 2897} {"train_loss": -12.868230819702148, "global_step": 486720, "epoch": 2897} {"train_loss": -12.916719436645508, "global_step": 486721, "epoch": 2897} {"train_loss": -12.70595645904541, "global_step": 486722, "epoch": 2897} {"train_loss": -12.890854835510254, "global_step": 486723, "epoch": 2897} {"train_loss": -12.97022819519043, "global_step": 486724, "epoch": 2897} {"train_loss": -12.756659507751465, "global_step": 486725, "epoch": 2897} {"train_loss": -13.055534362792969, "global_step": 486726, "epoch": 2897} {"train_loss": -12.880460739135742, "global_step": 486727, "epoch": 2897} {"train_loss": -12.745922088623047, "global_step": 486728, "epoch": 2897} {"train_loss": -13.146001815795898, "global_step": 486729, "epoch": 2897} {"train_loss": -12.782389640808105, "global_step": 486730, "epoch": 2897} {"train_loss": -12.929667472839355, "global_step": 486731, "epoch": 2897} {"train_loss": -12.813606262207031, "global_step": 486732, "epoch": 2897} {"train_loss": -12.858824729919434, "global_step": 486733, "epoch": 2897} {"train_loss": -12.93427848815918, "global_step": 486734, "epoch": 2897} {"train_loss": -12.790033340454102, "global_step": 486735, "epoch": 2897} {"train_loss": -12.928079605102539, "global_step": 486736, "epoch": 2897} {"train_loss": -13.118402481079102, "global_step": 486737, "epoch": 2897} {"train_loss": -12.860000610351562, "global_step": 486738, "epoch": 2897} {"train_loss": -13.083839416503906, "global_step": 486739, "epoch": 2897} {"train_loss": -13.09263801574707, "global_step": 486740, "epoch": 2897} {"train_loss": -12.891165733337402, "global_step": 486741, "epoch": 2897} {"train_loss": -12.670103073120117, "global_step": 486742, "epoch": 2897} {"train_loss": -12.997771263122559, "global_step": 486743, "epoch": 2897} {"train_loss": -13.175073623657227, "global_step": 486744, "epoch": 2897} {"train_loss": -13.05770492553711, "global_step": 486745, "epoch": 2897} {"train_loss": -13.12014389038086, "global_step": 486746, "epoch": 2897} {"train_loss": -12.930749893188477, "global_step": 486747, "epoch": 2897} {"train_loss": -12.992323875427246, "global_step": 486748, "epoch": 2897} {"train_loss": -12.921875, "global_step": 486749, "epoch": 2897} {"train_loss": -13.104765892028809, "global_step": 486750, "epoch": 2897} {"train_loss": -13.00145435333252, "global_step": 486751, "epoch": 2897} {"train_loss": -13.194055557250977, "global_step": 486752, "epoch": 2897} {"train_loss": -12.796046257019043, "global_step": 486753, "epoch": 2897} {"train_loss": -13.000772476196289, "global_step": 486754, "epoch": 2897} {"train_loss": -12.479132652282715, "global_step": 486755, "epoch": 2897} {"train_loss": -11.635964393615723, "global_step": 486756, "epoch": 2897} {"train_loss": -12.758404731750488, "global_step": 486757, "epoch": 2897} {"train_loss": -12.449186325073242, "global_step": 486758, "epoch": 2897} {"train_loss": -10.615605354309082, "global_step": 486759, "epoch": 2897} {"train_loss": -10.825464248657227, "global_step": 486760, "epoch": 2897} {"train_loss": -12.764508247375488, "global_step": 486761, "epoch": 2897} {"train_loss": -9.662042617797852, "global_step": 486762, "epoch": 2897} {"train_loss": -12.517365455627441, "global_step": 486763, "epoch": 2897} {"train_loss": -8.714122772216797, "global_step": 486764, "epoch": 2897} {"train_loss": -10.15060806274414, "global_step": 486765, "epoch": 2897} {"train_loss": -11.394926071166992, "global_step": 486766, "epoch": 2897} {"train_loss": -10.733205795288086, "global_step": 486767, "epoch": 2897} {"train_loss": -12.229578971862793, "global_step": 486768, "epoch": 2897} {"train_loss": -11.651593208312988, "global_step": 486769, "epoch": 2897} {"train_loss": -12.571725845336914, "global_step": 486770, "epoch": 2897} {"train_loss": -11.621697425842285, "global_step": 486771, "epoch": 2897} {"train_loss": -12.88442611694336, "global_step": 486772, "epoch": 2897} {"train_loss": -11.042028427124023, "global_step": 486773, "epoch": 2897} {"train_loss": -12.379365921020508, "global_step": 486774, "epoch": 2897} {"train_loss": -11.632055282592773, "global_step": 486775, "epoch": 2897} {"train_loss": -12.491460800170898, "global_step": 486776, "epoch": 2897} {"train_loss": -11.582895278930664, "global_step": 486777, "epoch": 2897} {"train_loss": -12.60720157623291, "global_step": 486778, "epoch": 2897} {"train_loss": -11.733125686645508, "global_step": 486779, "epoch": 2897} {"train_loss": -11.938454627990723, "global_step": 486780, "epoch": 2897} {"train_loss": -12.425026893615723, "global_step": 486781, "epoch": 2897} {"train_loss": -11.651248931884766, "global_step": 486782, "epoch": 2897} {"train_loss": -11.163966178894043, "global_step": 486783, "epoch": 2897} {"train_loss": -11.948939323425293, "global_step": 486784, "epoch": 2897} {"train_loss": -11.8646240234375, "global_step": 486785, "epoch": 2897} {"train_loss": -10.83288288116455, "global_step": 486786, "epoch": 2897} {"train_loss": -12.549507141113281, "global_step": 486787, "epoch": 2897} {"train_loss": -10.945573806762695, "global_step": 486788, "epoch": 2897} {"train_loss": -12.284294128417969, "global_step": 486789, "epoch": 2897} {"train_loss": -11.31511402130127, "global_step": 486790, "epoch": 2897} {"train_loss": -10.890678405761719, "global_step": 486791, "epoch": 2897} {"train_loss": -12.066071510314941, "global_step": 486792, "epoch": 2897} {"train_loss": -10.254049301147461, "global_step": 486793, "epoch": 2897} {"train_loss": -11.979487419128418, "global_step": 486794, "epoch": 2897} {"train_loss": -11.419804573059082, "global_step": 486795, "epoch": 2897} {"train_loss": -11.213751792907715, "global_step": 486796, "epoch": 2897} {"train_loss": -11.682835578918457, "global_step": 486797, "epoch": 2897} {"train_loss": -10.135089874267578, "global_step": 486798, "epoch": 2897} {"train_loss": -10.643136978149414, "global_step": 486799, "epoch": 2897} {"train_loss": -10.307859420776367, "global_step": 486800, "epoch": 2897} {"train_loss": -9.208381652832031, "global_step": 486801, "epoch": 2897} {"train_loss": -10.605010986328125, "global_step": 486802, "epoch": 2897} {"train_loss": -11.373440742492676, "global_step": 486803, "epoch": 2897} {"train_loss": -10.413981437683105, "global_step": 486804, "epoch": 2897} {"train_loss": -11.501797676086426, "global_step": 486805, "epoch": 2897} {"train_loss": -11.119354248046875, "global_step": 486806, "epoch": 2897} {"train_loss": -11.226249694824219, "global_step": 486807, "epoch": 2897} {"train_loss": -12.220870971679688, "global_step": 486808, "epoch": 2897} {"train_loss": -11.3074312210083, "global_step": 486809, "epoch": 2897} {"train_loss": -11.456400871276855, "global_step": 486810, "epoch": 2897} {"train_loss": -11.9273681640625, "global_step": 486811, "epoch": 2897} {"train_loss": -11.664948463439941, "global_step": 486812, "epoch": 2897} {"train_loss": -11.755228042602539, "global_step": 486813, "epoch": 2897} {"train_loss": -11.663936614990234, "global_step": 486814, "epoch": 2897} {"train_loss": -11.166847229003906, "global_step": 486815, "epoch": 2897} {"train_loss": -10.966513633728027, "global_step": 486816, "epoch": 2897} {"train_loss": -11.76853084564209, "global_step": 486817, "epoch": 2897} {"train_loss": -11.110551834106445, "global_step": 486818, "epoch": 2897} {"train_loss": -11.585275650024414, "global_step": 486819, "epoch": 2897} {"train_loss": -11.676716804504395, "global_step": 486820, "epoch": 2897} {"train_loss": -11.326423645019531, "global_step": 486821, "epoch": 2897} {"train_loss": -11.53195571899414, "global_step": 486822, "epoch": 2897} {"train_loss": -11.428342819213867, "global_step": 486823, "epoch": 2897} {"train_loss": -11.85238265991211, "global_step": 486824, "epoch": 2897} {"train_loss": -12.09245777130127, "global_step": 486825, "epoch": 2897} {"train_loss": -11.512325286865234, "global_step": 486826, "epoch": 2897} {"train_loss": -11.983724594116211, "global_step": 486827, "epoch": 2897} {"train_loss": -11.540882110595703, "global_step": 486828, "epoch": 2897} {"train_loss": -12.300432205200195, "global_step": 486829, "epoch": 2897} {"train_loss": -12.01409912109375, "global_step": 486830, "epoch": 2897} {"train_loss": -12.052165031433105, "global_step": 486831, "epoch": 2897} {"train_loss": -12.20643138885498, "global_step": 486832, "epoch": 2897} {"train_loss": -12.160444259643555, "global_step": 486833, "epoch": 2897} {"train_loss": -12.046379089355469, "global_step": 486834, "epoch": 2897} {"train_loss": -12.324024200439453, "global_step": 486835, "epoch": 2897} {"train_loss": -12.00949478149414, "global_step": 486836, "epoch": 2897} {"train_loss": -12.338960647583008, "global_step": 486837, "epoch": 2897} {"train_loss": -12.567500114440918, "global_step": 486838, "epoch": 2897} {"train_loss": -12.10732364654541, "global_step": 486839, "epoch": 2897} {"train_loss": -12.403454780578613, "global_step": 486840, "epoch": 2897} {"train_loss": -12.463854789733887, "global_step": 486841, "epoch": 2897} {"train_loss": -12.570882797241211, "global_step": 486842, "epoch": 2897} {"train_loss": -12.394469261169434, "global_step": 486843, "epoch": 2897} {"train_loss": -12.503679275512695, "global_step": 486844, "epoch": 2897} {"train_loss": -12.443181991577148, "global_step": 486845, "epoch": 2897} {"train_loss": -12.401527404785156, "global_step": 486846, "epoch": 2897} {"train_loss": -12.4448881149292, "global_step": 486847, "epoch": 2897} {"train_loss": -12.41122817993164, "global_step": 486848, "epoch": 2897} {"train_loss": -12.736837387084961, "global_step": 486849, "epoch": 2897} {"train_loss": -12.258481979370117, "global_step": 486850, "epoch": 2897} {"train_loss": -12.659198760986328, "global_step": 486851, "epoch": 2897} {"train_loss": -12.645493507385254, "global_step": 486852, "epoch": 2897} {"train_loss": -12.651224136352539, "global_step": 486853, "epoch": 2897} {"train_loss": -12.762906074523926, "global_step": 486854, "epoch": 2897} {"train_loss": -12.438446044921875, "global_step": 486855, "epoch": 2897} {"train_loss": -12.740617752075195, "global_step": 486856, "epoch": 2897} {"train_loss": -12.884947776794434, "global_step": 486857, "epoch": 2897} {"train_loss": -12.797889709472656, "global_step": 486858, "epoch": 2897} {"train_loss": -12.760401725769043, "global_step": 486859, "epoch": 2897} {"train_loss": -12.672239303588867, "global_step": 486860, "epoch": 2897} {"train_loss": -12.89313793182373, "global_step": 486861, "epoch": 2897} {"train_loss": -12.760887145996094, "global_step": 486862, "epoch": 2897} {"train_loss": -12.151773418698992, "global_step": 486863, "epoch": 2897, "val_loss": 317492.3125} {"train_loss": -12.825160026550293, "global_step": 486864, "epoch": 2898} {"train_loss": -12.789081573486328, "global_step": 486865, "epoch": 2898} {"train_loss": -12.619150161743164, "global_step": 486866, "epoch": 2898} {"train_loss": -12.78663444519043, "global_step": 486867, "epoch": 2898} {"train_loss": -12.7767333984375, "global_step": 486868, "epoch": 2898} {"train_loss": -12.851397514343262, "global_step": 486869, "epoch": 2898} {"train_loss": -12.861091613769531, "global_step": 486870, "epoch": 2898} {"train_loss": -12.73837947845459, "global_step": 486871, "epoch": 2898} {"train_loss": -12.92034912109375, "global_step": 486872, "epoch": 2898} {"train_loss": -12.88380241394043, "global_step": 486873, "epoch": 2898} {"train_loss": -12.885225296020508, "global_step": 486874, "epoch": 2898} {"train_loss": -13.016216278076172, "global_step": 486875, "epoch": 2898} {"train_loss": -12.719175338745117, "global_step": 486876, "epoch": 2898} {"train_loss": -13.011210441589355, "global_step": 486877, "epoch": 2898} {"train_loss": -12.967977523803711, "global_step": 486878, "epoch": 2898} {"train_loss": -12.97891902923584, "global_step": 486879, "epoch": 2898} {"train_loss": -12.990674018859863, "global_step": 486880, "epoch": 2898} {"train_loss": -12.827485084533691, "global_step": 486881, "epoch": 2898} {"train_loss": -12.941169738769531, "global_step": 486882, "epoch": 2898} {"train_loss": -12.729193687438965, "global_step": 486883, "epoch": 2898} {"train_loss": -12.898271560668945, "global_step": 486884, "epoch": 2898} {"train_loss": -12.81437873840332, "global_step": 486885, "epoch": 2898} {"train_loss": -12.76436996459961, "global_step": 486886, "epoch": 2898} {"train_loss": -12.681905746459961, "global_step": 486887, "epoch": 2898} {"train_loss": -12.789738655090332, "global_step": 486888, "epoch": 2898} {"train_loss": -12.743654251098633, "global_step": 486889, "epoch": 2898} {"train_loss": -12.695754051208496, "global_step": 486890, "epoch": 2898} {"train_loss": -12.485013008117676, "global_step": 486891, "epoch": 2898} {"train_loss": -12.828822135925293, "global_step": 486892, "epoch": 2898} {"train_loss": -12.989933967590332, "global_step": 486893, "epoch": 2898} {"train_loss": -12.843940734863281, "global_step": 486894, "epoch": 2898} {"train_loss": -12.865163803100586, "global_step": 486895, "epoch": 2898} {"train_loss": -12.730104446411133, "global_step": 486896, "epoch": 2898} {"train_loss": -12.663390159606934, "global_step": 486897, "epoch": 2898} {"train_loss": -12.877567291259766, "global_step": 486898, "epoch": 2898} {"train_loss": -12.543035507202148, "global_step": 486899, "epoch": 2898} {"train_loss": -12.81097412109375, "global_step": 486900, "epoch": 2898} {"train_loss": -12.63770580291748, "global_step": 486901, "epoch": 2898} {"train_loss": -12.377443313598633, "global_step": 486902, "epoch": 2898} {"train_loss": -12.51210880279541, "global_step": 486903, "epoch": 2898} {"train_loss": -12.621341705322266, "global_step": 486904, "epoch": 2898} {"train_loss": -12.900285720825195, "global_step": 486905, "epoch": 2898} {"train_loss": -12.282610893249512, "global_step": 486906, "epoch": 2898} {"train_loss": -12.471603393554688, "global_step": 486907, "epoch": 2898} {"train_loss": -12.815279006958008, "global_step": 486908, "epoch": 2898} {"train_loss": -12.245410919189453, "global_step": 486909, "epoch": 2898} {"train_loss": -12.224172592163086, "global_step": 486910, "epoch": 2898} {"train_loss": -12.390785217285156, "global_step": 486911, "epoch": 2898} {"train_loss": -12.6636381149292, "global_step": 486912, "epoch": 2898} {"train_loss": -12.507444381713867, "global_step": 486913, "epoch": 2898} {"train_loss": -12.819311141967773, "global_step": 486914, "epoch": 2898} {"train_loss": -12.855058670043945, "global_step": 486915, "epoch": 2898} {"train_loss": -12.471275329589844, "global_step": 486916, "epoch": 2898} {"train_loss": -12.771921157836914, "global_step": 486917, "epoch": 2898} {"train_loss": -12.726248741149902, "global_step": 486918, "epoch": 2898} {"train_loss": -12.535808563232422, "global_step": 486919, "epoch": 2898} {"train_loss": -12.776046752929688, "global_step": 486920, "epoch": 2898} {"train_loss": -12.244636535644531, "global_step": 486921, "epoch": 2898} {"train_loss": -12.053321838378906, "global_step": 486922, "epoch": 2898} {"train_loss": -12.693595886230469, "global_step": 486923, "epoch": 2898} {"train_loss": -12.29013729095459, "global_step": 486924, "epoch": 2898} {"train_loss": -12.566658973693848, "global_step": 486925, "epoch": 2898} {"train_loss": -12.29764461517334, "global_step": 486926, "epoch": 2898} {"train_loss": -13.041139602661133, "global_step": 486927, "epoch": 2898} {"train_loss": -12.266911506652832, "global_step": 486928, "epoch": 2898} {"train_loss": -12.648141860961914, "global_step": 486929, "epoch": 2898} {"train_loss": -12.643953323364258, "global_step": 486930, "epoch": 2898} {"train_loss": -12.292469024658203, "global_step": 486931, "epoch": 2898} {"train_loss": -12.3493013381958, "global_step": 486932, "epoch": 2898} {"train_loss": -12.409759521484375, "global_step": 486933, "epoch": 2898} {"train_loss": -12.889458656311035, "global_step": 486934, "epoch": 2898} {"train_loss": -12.427928924560547, "global_step": 486935, "epoch": 2898} {"train_loss": -12.39989948272705, "global_step": 486936, "epoch": 2898} {"train_loss": -12.638677597045898, "global_step": 486937, "epoch": 2898} {"train_loss": -12.442389488220215, "global_step": 486938, "epoch": 2898} {"train_loss": -12.346158981323242, "global_step": 486939, "epoch": 2898} {"train_loss": -12.386945724487305, "global_step": 486940, "epoch": 2898} {"train_loss": -12.89966869354248, "global_step": 486941, "epoch": 2898} {"train_loss": -12.738702774047852, "global_step": 486942, "epoch": 2898} {"train_loss": -12.608699798583984, "global_step": 486943, "epoch": 2898} {"train_loss": -12.560530662536621, "global_step": 486944, "epoch": 2898} {"train_loss": -12.763648986816406, "global_step": 486945, "epoch": 2898} {"train_loss": -12.64026165008545, "global_step": 486946, "epoch": 2898} {"train_loss": -12.308589935302734, "global_step": 486947, "epoch": 2898} {"train_loss": -12.308815002441406, "global_step": 486948, "epoch": 2898} {"train_loss": -11.841938018798828, "global_step": 486949, "epoch": 2898} {"train_loss": -11.706972122192383, "global_step": 486950, "epoch": 2898} {"train_loss": -12.428356170654297, "global_step": 486951, "epoch": 2898} {"train_loss": -12.996003150939941, "global_step": 486952, "epoch": 2898} {"train_loss": -12.609516143798828, "global_step": 486953, "epoch": 2898} {"train_loss": -12.643570899963379, "global_step": 486954, "epoch": 2898} {"train_loss": -12.374044418334961, "global_step": 486955, "epoch": 2898} {"train_loss": -12.555449485778809, "global_step": 486956, "epoch": 2898} {"train_loss": -12.530450820922852, "global_step": 486957, "epoch": 2898} {"train_loss": -12.31324577331543, "global_step": 486958, "epoch": 2898} {"train_loss": -11.756698608398438, "global_step": 486959, "epoch": 2898} {"train_loss": -12.693120002746582, "global_step": 486960, "epoch": 2898} {"train_loss": -10.415975570678711, "global_step": 486961, "epoch": 2898} {"train_loss": -11.543354034423828, "global_step": 486962, "epoch": 2898} {"train_loss": -11.25528335571289, "global_step": 486963, "epoch": 2898} {"train_loss": -11.190921783447266, "global_step": 486964, "epoch": 2898} {"train_loss": -12.03712272644043, "global_step": 486965, "epoch": 2898} {"train_loss": -11.607198715209961, "global_step": 486966, "epoch": 2898} {"train_loss": -10.502822875976562, "global_step": 486967, "epoch": 2898} {"train_loss": -12.338809967041016, "global_step": 486968, "epoch": 2898} {"train_loss": -10.616345405578613, "global_step": 486969, "epoch": 2898} {"train_loss": -10.942713737487793, "global_step": 486970, "epoch": 2898} {"train_loss": -8.749980926513672, "global_step": 486971, "epoch": 2898} {"train_loss": -8.963685989379883, "global_step": 486972, "epoch": 2898} {"train_loss": -9.666505813598633, "global_step": 486973, "epoch": 2898} {"train_loss": -10.282955169677734, "global_step": 486974, "epoch": 2898} {"train_loss": -9.36532974243164, "global_step": 486975, "epoch": 2898} {"train_loss": -8.10328483581543, "global_step": 486976, "epoch": 2898} {"train_loss": -8.570281982421875, "global_step": 486977, "epoch": 2898} {"train_loss": -8.762239456176758, "global_step": 486978, "epoch": 2898} {"train_loss": -10.34328556060791, "global_step": 486979, "epoch": 2898} {"train_loss": -9.507535934448242, "global_step": 486980, "epoch": 2898} {"train_loss": -9.61762809753418, "global_step": 486981, "epoch": 2898} {"train_loss": -9.401827812194824, "global_step": 486982, "epoch": 2898} {"train_loss": -9.27608871459961, "global_step": 486983, "epoch": 2898} {"train_loss": -9.686781883239746, "global_step": 486984, "epoch": 2898} {"train_loss": -10.079351425170898, "global_step": 486985, "epoch": 2898} {"train_loss": -11.225696563720703, "global_step": 486986, "epoch": 2898} {"train_loss": -10.726341247558594, "global_step": 486987, "epoch": 2898} {"train_loss": -10.604782104492188, "global_step": 486988, "epoch": 2898} {"train_loss": -10.679457664489746, "global_step": 486989, "epoch": 2898} {"train_loss": -10.674202919006348, "global_step": 486990, "epoch": 2898} {"train_loss": -10.471122741699219, "global_step": 486991, "epoch": 2898} {"train_loss": -10.110663414001465, "global_step": 486992, "epoch": 2898} {"train_loss": -10.96673583984375, "global_step": 486993, "epoch": 2898} {"train_loss": -10.203105926513672, "global_step": 486994, "epoch": 2898} {"train_loss": -10.944189071655273, "global_step": 486995, "epoch": 2898} {"train_loss": -10.614945411682129, "global_step": 486996, "epoch": 2898} {"train_loss": -10.511398315429688, "global_step": 486997, "epoch": 2898} {"train_loss": -11.272823333740234, "global_step": 486998, "epoch": 2898} {"train_loss": -11.461132049560547, "global_step": 486999, "epoch": 2898} {"train_loss": -11.311229705810547, "global_step": 487000, "epoch": 2898} {"train_loss": -11.354323387145996, "global_step": 487001, "epoch": 2898} {"train_loss": -11.9854736328125, "global_step": 487002, "epoch": 2898} {"train_loss": -11.651406288146973, "global_step": 487003, "epoch": 2898} {"train_loss": -11.50473403930664, "global_step": 487004, "epoch": 2898} {"train_loss": -11.63214111328125, "global_step": 487005, "epoch": 2898} {"train_loss": -11.898478507995605, "global_step": 487006, "epoch": 2898} {"train_loss": -12.19677734375, "global_step": 487007, "epoch": 2898} {"train_loss": -12.40435791015625, "global_step": 487008, "epoch": 2898} {"train_loss": -12.159366607666016, "global_step": 487009, "epoch": 2898} {"train_loss": -12.144489288330078, "global_step": 487010, "epoch": 2898} {"train_loss": -11.774552345275879, "global_step": 487011, "epoch": 2898} {"train_loss": -12.358023643493652, "global_step": 487012, "epoch": 2898} {"train_loss": -12.090683937072754, "global_step": 487013, "epoch": 2898} {"train_loss": -11.993624687194824, "global_step": 487014, "epoch": 2898} {"train_loss": -12.400784492492676, "global_step": 487015, "epoch": 2898} {"train_loss": -11.909029006958008, "global_step": 487016, "epoch": 2898} {"train_loss": -12.136751174926758, "global_step": 487017, "epoch": 2898} {"train_loss": -12.268363952636719, "global_step": 487018, "epoch": 2898} {"train_loss": -11.894500732421875, "global_step": 487019, "epoch": 2898} {"train_loss": -12.302093505859375, "global_step": 487020, "epoch": 2898} {"train_loss": -12.208425521850586, "global_step": 487021, "epoch": 2898} {"train_loss": -11.830221176147461, "global_step": 487022, "epoch": 2898} {"train_loss": -12.526228904724121, "global_step": 487023, "epoch": 2898} {"train_loss": -11.988863945007324, "global_step": 487024, "epoch": 2898} {"train_loss": -12.272233963012695, "global_step": 487025, "epoch": 2898} {"train_loss": -12.451550483703613, "global_step": 487026, "epoch": 2898} {"train_loss": -12.272382736206055, "global_step": 487027, "epoch": 2898} {"train_loss": -12.40218448638916, "global_step": 487028, "epoch": 2898} {"train_loss": -12.417203903198242, "global_step": 487029, "epoch": 2898} {"train_loss": -12.289398193359375, "global_step": 487030, "epoch": 2898} {"train_loss": -11.98988986582983, "global_step": 487031, "epoch": 2898, "val_loss": 315983.5} {"train_loss": -12.606738090515137, "global_step": 487032, "epoch": 2899} {"train_loss": -12.492197036743164, "global_step": 487033, "epoch": 2899} {"train_loss": -12.608555793762207, "global_step": 487034, "epoch": 2899} {"train_loss": -12.580336570739746, "global_step": 487035, "epoch": 2899} {"train_loss": -12.465214729309082, "global_step": 487036, "epoch": 2899} {"train_loss": -12.340007781982422, "global_step": 487037, "epoch": 2899} {"train_loss": -12.550516128540039, "global_step": 487038, "epoch": 2899} {"train_loss": -12.729507446289062, "global_step": 487039, "epoch": 2899} {"train_loss": -12.611794471740723, "global_step": 487040, "epoch": 2899} {"train_loss": -12.731487274169922, "global_step": 487041, "epoch": 2899} {"train_loss": -12.763160705566406, "global_step": 487042, "epoch": 2899} {"train_loss": -12.493133544921875, "global_step": 487043, "epoch": 2899} {"train_loss": -12.817161560058594, "global_step": 487044, "epoch": 2899} {"train_loss": -12.77920913696289, "global_step": 487045, "epoch": 2899} {"train_loss": -12.637914657592773, "global_step": 487046, "epoch": 2899} {"train_loss": -12.946157455444336, "global_step": 487047, "epoch": 2899} {"train_loss": -12.685944557189941, "global_step": 487048, "epoch": 2899} {"train_loss": -12.689108848571777, "global_step": 487049, "epoch": 2899} {"train_loss": -12.898926734924316, "global_step": 487050, "epoch": 2899} {"train_loss": -12.71670150756836, "global_step": 487051, "epoch": 2899} {"train_loss": -12.666051864624023, "global_step": 487052, "epoch": 2899} {"train_loss": -12.638437271118164, "global_step": 487053, "epoch": 2899} {"train_loss": -12.550288200378418, "global_step": 487054, "epoch": 2899} {"train_loss": -12.568814277648926, "global_step": 487055, "epoch": 2899} {"train_loss": -12.517786979675293, "global_step": 487056, "epoch": 2899} {"train_loss": -12.870979309082031, "global_step": 487057, "epoch": 2899} {"train_loss": -12.929525375366211, "global_step": 487058, "epoch": 2899} {"train_loss": -12.921516418457031, "global_step": 487059, "epoch": 2899} {"train_loss": -12.750133514404297, "global_step": 487060, "epoch": 2899} {"train_loss": -12.852457046508789, "global_step": 487061, "epoch": 2899} {"train_loss": -12.943191528320312, "global_step": 487062, "epoch": 2899} {"train_loss": -12.70071029663086, "global_step": 487063, "epoch": 2899} {"train_loss": -12.948648452758789, "global_step": 487064, "epoch": 2899} {"train_loss": -12.749324798583984, "global_step": 487065, "epoch": 2899} {"train_loss": -12.544699668884277, "global_step": 487066, "epoch": 2899} {"train_loss": -12.806968688964844, "global_step": 487067, "epoch": 2899} {"train_loss": -12.812091827392578, "global_step": 487068, "epoch": 2899} {"train_loss": -12.552698135375977, "global_step": 487069, "epoch": 2899} {"train_loss": -12.862812042236328, "global_step": 487070, "epoch": 2899} {"train_loss": -12.958765983581543, "global_step": 487071, "epoch": 2899} {"train_loss": -12.95628833770752, "global_step": 487072, "epoch": 2899} {"train_loss": -12.79450798034668, "global_step": 487073, "epoch": 2899} {"train_loss": -12.958270072937012, "global_step": 487074, "epoch": 2899} {"train_loss": -13.044469833374023, "global_step": 487075, "epoch": 2899} {"train_loss": -13.055103302001953, "global_step": 487076, "epoch": 2899} {"train_loss": -12.984683990478516, "global_step": 487077, "epoch": 2899} {"train_loss": -12.910968780517578, "global_step": 487078, "epoch": 2899} {"train_loss": -13.04836654663086, "global_step": 487079, "epoch": 2899} {"train_loss": -12.880334854125977, "global_step": 487080, "epoch": 2899} {"train_loss": -12.933011054992676, "global_step": 487081, "epoch": 2899} {"train_loss": -12.683450698852539, "global_step": 487082, "epoch": 2899} {"train_loss": -12.604379653930664, "global_step": 487083, "epoch": 2899} {"train_loss": -12.982097625732422, "global_step": 487084, "epoch": 2899} {"train_loss": -12.745323181152344, "global_step": 487085, "epoch": 2899} {"train_loss": -12.860299110412598, "global_step": 487086, "epoch": 2899} {"train_loss": -13.140907287597656, "global_step": 487087, "epoch": 2899} {"train_loss": -13.072643280029297, "global_step": 487088, "epoch": 2899} {"train_loss": -12.926820755004883, "global_step": 487089, "epoch": 2899} {"train_loss": -12.806224822998047, "global_step": 487090, "epoch": 2899} {"train_loss": -13.062085151672363, "global_step": 487091, "epoch": 2899} {"train_loss": -12.563325881958008, "global_step": 487092, "epoch": 2899} {"train_loss": -12.227176666259766, "global_step": 487093, "epoch": 2899} {"train_loss": -12.151381492614746, "global_step": 487094, "epoch": 2899} {"train_loss": -12.741073608398438, "global_step": 487095, "epoch": 2899} {"train_loss": -12.56727409362793, "global_step": 487096, "epoch": 2899} {"train_loss": -11.911881446838379, "global_step": 487097, "epoch": 2899} {"train_loss": -12.508922576904297, "global_step": 487098, "epoch": 2899} {"train_loss": -12.857038497924805, "global_step": 487099, "epoch": 2899} {"train_loss": -12.19920539855957, "global_step": 487100, "epoch": 2899} {"train_loss": -11.356057167053223, "global_step": 487101, "epoch": 2899} {"train_loss": -11.96479320526123, "global_step": 487102, "epoch": 2899} {"train_loss": -12.377196311950684, "global_step": 487103, "epoch": 2899} {"train_loss": -11.8561429977417, "global_step": 487104, "epoch": 2899} {"train_loss": -11.367772102355957, "global_step": 487105, "epoch": 2899} {"train_loss": -11.698956489562988, "global_step": 487106, "epoch": 2899} {"train_loss": -12.565570831298828, "global_step": 487107, "epoch": 2899} {"train_loss": -11.536924362182617, "global_step": 487108, "epoch": 2899} {"train_loss": -11.080443382263184, "global_step": 487109, "epoch": 2899} {"train_loss": -11.340276718139648, "global_step": 487110, "epoch": 2899} {"train_loss": -10.450098037719727, "global_step": 487111, "epoch": 2899} {"train_loss": -10.659147262573242, "global_step": 487112, "epoch": 2899} {"train_loss": -12.113927841186523, "global_step": 487113, "epoch": 2899} {"train_loss": -10.61557388305664, "global_step": 487114, "epoch": 2899} {"train_loss": -12.086012840270996, "global_step": 487115, "epoch": 2899} {"train_loss": -11.02400016784668, "global_step": 487116, "epoch": 2899} {"train_loss": -12.287393569946289, "global_step": 487117, "epoch": 2899} {"train_loss": -12.221027374267578, "global_step": 487118, "epoch": 2899} {"train_loss": -11.796622276306152, "global_step": 487119, "epoch": 2899} {"train_loss": -12.1000337600708, "global_step": 487120, "epoch": 2899} {"train_loss": -12.254837036132812, "global_step": 487121, "epoch": 2899} {"train_loss": -11.31525993347168, "global_step": 487122, "epoch": 2899} {"train_loss": -12.205207824707031, "global_step": 487123, "epoch": 2899} {"train_loss": -11.983869552612305, "global_step": 487124, "epoch": 2899} {"train_loss": -11.965230941772461, "global_step": 487125, "epoch": 2899} {"train_loss": -12.077415466308594, "global_step": 487126, "epoch": 2899} {"train_loss": -12.320608139038086, "global_step": 487127, "epoch": 2899} {"train_loss": -12.253023147583008, "global_step": 487128, "epoch": 2899} {"train_loss": -12.269477844238281, "global_step": 487129, "epoch": 2899} {"train_loss": -11.91213321685791, "global_step": 487130, "epoch": 2899} {"train_loss": -11.360410690307617, "global_step": 487131, "epoch": 2899} {"train_loss": -12.304006576538086, "global_step": 487132, "epoch": 2899} {"train_loss": -11.338346481323242, "global_step": 487133, "epoch": 2899} {"train_loss": -11.422735214233398, "global_step": 487134, "epoch": 2899} {"train_loss": -12.113554000854492, "global_step": 487135, "epoch": 2899} {"train_loss": -11.128063201904297, "global_step": 487136, "epoch": 2899} {"train_loss": -12.171045303344727, "global_step": 487137, "epoch": 2899} {"train_loss": -10.131775856018066, "global_step": 487138, "epoch": 2899} {"train_loss": -11.386575698852539, "global_step": 487139, "epoch": 2899} {"train_loss": -10.36539077758789, "global_step": 487140, "epoch": 2899} {"train_loss": -11.774887084960938, "global_step": 487141, "epoch": 2899} {"train_loss": -9.802200317382812, "global_step": 487142, "epoch": 2899} {"train_loss": -10.196075439453125, "global_step": 487143, "epoch": 2899} {"train_loss": -11.614587783813477, "global_step": 487144, "epoch": 2899} {"train_loss": -11.312356948852539, "global_step": 487145, "epoch": 2899} {"train_loss": -11.16484260559082, "global_step": 487146, "epoch": 2899} {"train_loss": -12.457632064819336, "global_step": 487147, "epoch": 2899} {"train_loss": -10.725761413574219, "global_step": 487148, "epoch": 2899} {"train_loss": -11.825441360473633, "global_step": 487149, "epoch": 2899} {"train_loss": -10.021713256835938, "global_step": 487150, "epoch": 2899} {"train_loss": -9.123472213745117, "global_step": 487151, "epoch": 2899} {"train_loss": -11.068902015686035, "global_step": 487152, "epoch": 2899} {"train_loss": -10.348688125610352, "global_step": 487153, "epoch": 2899} {"train_loss": -10.770641326904297, "global_step": 487154, "epoch": 2899} {"train_loss": -10.411738395690918, "global_step": 487155, "epoch": 2899} {"train_loss": -11.195989608764648, "global_step": 487156, "epoch": 2899} {"train_loss": -10.863784790039062, "global_step": 487157, "epoch": 2899} {"train_loss": -12.275894165039062, "global_step": 487158, "epoch": 2899} {"train_loss": -11.022134780883789, "global_step": 487159, "epoch": 2899} {"train_loss": -11.672891616821289, "global_step": 487160, "epoch": 2899} {"train_loss": -11.593704223632812, "global_step": 487161, "epoch": 2899} {"train_loss": -11.154315948486328, "global_step": 487162, "epoch": 2899} {"train_loss": -11.809310913085938, "global_step": 487163, "epoch": 2899} {"train_loss": -11.88383674621582, "global_step": 487164, "epoch": 2899} {"train_loss": -11.551311492919922, "global_step": 487165, "epoch": 2899} {"train_loss": -12.020078659057617, "global_step": 487166, "epoch": 2899} {"train_loss": -11.612616539001465, "global_step": 487167, "epoch": 2899} {"train_loss": -11.642723083496094, "global_step": 487168, "epoch": 2899} {"train_loss": -12.215224266052246, "global_step": 487169, "epoch": 2899} {"train_loss": -11.302531242370605, "global_step": 487170, "epoch": 2899} {"train_loss": -12.401140213012695, "global_step": 487171, "epoch": 2899} {"train_loss": -12.036975860595703, "global_step": 487172, "epoch": 2899} {"train_loss": -12.221260070800781, "global_step": 487173, "epoch": 2899} {"train_loss": -11.94327163696289, "global_step": 487174, "epoch": 2899} {"train_loss": -12.009321212768555, "global_step": 487175, "epoch": 2899} {"train_loss": -11.94246768951416, "global_step": 487176, "epoch": 2899} {"train_loss": -12.119816780090332, "global_step": 487177, "epoch": 2899} {"train_loss": -11.838303565979004, "global_step": 487178, "epoch": 2899} {"train_loss": -12.300339698791504, "global_step": 487179, "epoch": 2899} {"train_loss": -11.183067321777344, "global_step": 487180, "epoch": 2899} {"train_loss": -12.505424499511719, "global_step": 487181, "epoch": 2899} {"train_loss": -11.645855903625488, "global_step": 487182, "epoch": 2899} {"train_loss": -12.23665714263916, "global_step": 487183, "epoch": 2899} {"train_loss": -11.826580047607422, "global_step": 487184, "epoch": 2899} {"train_loss": -12.339147567749023, "global_step": 487185, "epoch": 2899} {"train_loss": -12.00326156616211, "global_step": 487186, "epoch": 2899} {"train_loss": -12.200801849365234, "global_step": 487187, "epoch": 2899} {"train_loss": -11.62129020690918, "global_step": 487188, "epoch": 2899} {"train_loss": -11.993365287780762, "global_step": 487189, "epoch": 2899} {"train_loss": -11.528247833251953, "global_step": 487190, "epoch": 2899} {"train_loss": -11.79227352142334, "global_step": 487191, "epoch": 2899} {"train_loss": -11.731444358825684, "global_step": 487192, "epoch": 2899} {"train_loss": -11.8843994140625, "global_step": 487193, "epoch": 2899} {"train_loss": -11.818435668945312, "global_step": 487194, "epoch": 2899} {"train_loss": -11.909046173095703, "global_step": 487195, "epoch": 2899} {"train_loss": -11.699928283691406, "global_step": 487196, "epoch": 2899} {"train_loss": -11.915681838989258, "global_step": 487197, "epoch": 2899} {"train_loss": -11.29161262512207, "global_step": 487198, "epoch": 2899} {"train_loss": -12.068754707063947, "global_step": 487199, "epoch": 2899, "val_loss": 318323.21875} {"train_loss": -11.734484672546387, "global_step": 487200, "epoch": 2900} {"train_loss": -11.91573429107666, "global_step": 487201, "epoch": 2900} {"train_loss": -11.756766319274902, "global_step": 487202, "epoch": 2900} {"train_loss": -11.982767105102539, "global_step": 487203, "epoch": 2900} {"train_loss": -11.628080368041992, "global_step": 487204, "epoch": 2900} {"train_loss": -12.136600494384766, "global_step": 487205, "epoch": 2900} {"train_loss": -11.94528579711914, "global_step": 487206, "epoch": 2900} {"train_loss": -12.206403732299805, "global_step": 487207, "epoch": 2900} {"train_loss": -12.071721076965332, "global_step": 487208, "epoch": 2900} {"train_loss": -12.312170028686523, "global_step": 487209, "epoch": 2900} {"train_loss": -12.16472053527832, "global_step": 487210, "epoch": 2900} {"train_loss": -12.425739288330078, "global_step": 487211, "epoch": 2900} {"train_loss": -12.105140686035156, "global_step": 487212, "epoch": 2900} {"train_loss": -12.18502426147461, "global_step": 487213, "epoch": 2900} {"train_loss": -12.579957008361816, "global_step": 487214, "epoch": 2900} {"train_loss": -12.203742027282715, "global_step": 487215, "epoch": 2900} {"train_loss": -12.541728973388672, "global_step": 487216, "epoch": 2900} {"train_loss": -12.326774597167969, "global_step": 487217, "epoch": 2900} {"train_loss": -12.380817413330078, "global_step": 487218, "epoch": 2900} {"train_loss": -12.58674430847168, "global_step": 487219, "epoch": 2900} {"train_loss": -12.547966957092285, "global_step": 487220, "epoch": 2900} {"train_loss": -12.372444152832031, "global_step": 487221, "epoch": 2900} {"train_loss": -12.555623054504395, "global_step": 487222, "epoch": 2900} {"train_loss": -12.442138671875, "global_step": 487223, "epoch": 2900} {"train_loss": -12.299481391906738, "global_step": 487224, "epoch": 2900} {"train_loss": -12.596116065979004, "global_step": 487225, "epoch": 2900} {"train_loss": -12.72823715209961, "global_step": 487226, "epoch": 2900} {"train_loss": -12.689245223999023, "global_step": 487227, "epoch": 2900} {"train_loss": -12.604448318481445, "global_step": 487228, "epoch": 2900} {"train_loss": -12.55251693725586, "global_step": 487229, "epoch": 2900} {"train_loss": -12.741257667541504, "global_step": 487230, "epoch": 2900} {"train_loss": -12.8414888381958, "global_step": 487231, "epoch": 2900} {"train_loss": -12.716665267944336, "global_step": 487232, "epoch": 2900} {"train_loss": -12.76544189453125, "global_step": 487233, "epoch": 2900} {"train_loss": -12.644244194030762, "global_step": 487234, "epoch": 2900} {"train_loss": -12.900259971618652, "global_step": 487235, "epoch": 2900} {"train_loss": -12.646567344665527, "global_step": 487236, "epoch": 2900} {"train_loss": -12.708222389221191, "global_step": 487237, "epoch": 2900} {"train_loss": -12.76960563659668, "global_step": 487238, "epoch": 2900} {"train_loss": -12.637981414794922, "global_step": 487239, "epoch": 2900} {"train_loss": -12.77334976196289, "global_step": 487240, "epoch": 2900} {"train_loss": -12.626633644104004, "global_step": 487241, "epoch": 2900} {"train_loss": -12.715767860412598, "global_step": 487242, "epoch": 2900} {"train_loss": -12.784406661987305, "global_step": 487243, "epoch": 2900} {"train_loss": -12.851766586303711, "global_step": 487244, "epoch": 2900} {"train_loss": -12.67110538482666, "global_step": 487245, "epoch": 2900} {"train_loss": -12.828989028930664, "global_step": 487246, "epoch": 2900} {"train_loss": -12.717275619506836, "global_step": 487247, "epoch": 2900} {"train_loss": -12.934112548828125, "global_step": 487248, "epoch": 2900} {"train_loss": -12.628817558288574, "global_step": 487249, "epoch": 2900} {"train_loss": -12.886335372924805, "global_step": 487250, "epoch": 2900} {"train_loss": -12.737052917480469, "global_step": 487251, "epoch": 2900} {"train_loss": -12.97673225402832, "global_step": 487252, "epoch": 2900} {"train_loss": -12.813935279846191, "global_step": 487253, "epoch": 2900} {"train_loss": -12.793427467346191, "global_step": 487254, "epoch": 2900} {"train_loss": -12.766536712646484, "global_step": 487255, "epoch": 2900} {"train_loss": -12.861583709716797, "global_step": 487256, "epoch": 2900} {"train_loss": -12.962438583374023, "global_step": 487257, "epoch": 2900} {"train_loss": -12.681906700134277, "global_step": 487258, "epoch": 2900} {"train_loss": -12.971305847167969, "global_step": 487259, "epoch": 2900} {"train_loss": -12.771133422851562, "global_step": 487260, "epoch": 2900} {"train_loss": -12.915202140808105, "global_step": 487261, "epoch": 2900} {"train_loss": -12.610713958740234, "global_step": 487262, "epoch": 2900} {"train_loss": -12.846759796142578, "global_step": 487263, "epoch": 2900} {"train_loss": -13.030210494995117, "global_step": 487264, "epoch": 2900} {"train_loss": -12.843194961547852, "global_step": 487265, "epoch": 2900} {"train_loss": -12.885322570800781, "global_step": 487266, "epoch": 2900} {"train_loss": -12.776769638061523, "global_step": 487267, "epoch": 2900} {"train_loss": -12.98619556427002, "global_step": 487268, "epoch": 2900} {"train_loss": -12.69610595703125, "global_step": 487269, "epoch": 2900} {"train_loss": -13.0499906539917, "global_step": 487270, "epoch": 2900} {"train_loss": -12.893455505371094, "global_step": 487271, "epoch": 2900} {"train_loss": -12.879316329956055, "global_step": 487272, "epoch": 2900} {"train_loss": -12.929132461547852, "global_step": 487273, "epoch": 2900} {"train_loss": -13.007987976074219, "global_step": 487274, "epoch": 2900} {"train_loss": -12.934064865112305, "global_step": 487275, "epoch": 2900} {"train_loss": -12.854072570800781, "global_step": 487276, "epoch": 2900} {"train_loss": -12.974376678466797, "global_step": 487277, "epoch": 2900} {"train_loss": -12.85518741607666, "global_step": 487278, "epoch": 2900} {"train_loss": -13.021883010864258, "global_step": 487279, "epoch": 2900} {"train_loss": -12.947898864746094, "global_step": 487280, "epoch": 2900} {"train_loss": -12.903156280517578, "global_step": 487281, "epoch": 2900} {"train_loss": -12.909381866455078, "global_step": 487282, "epoch": 2900} {"train_loss": -12.945066452026367, "global_step": 487283, "epoch": 2900} {"train_loss": -13.036334991455078, "global_step": 487284, "epoch": 2900} {"train_loss": -13.094348907470703, "global_step": 487285, "epoch": 2900} {"train_loss": -12.837532043457031, "global_step": 487286, "epoch": 2900} {"train_loss": -12.941699981689453, "global_step": 487287, "epoch": 2900} {"train_loss": -12.992889404296875, "global_step": 487288, "epoch": 2900} {"train_loss": -13.05811882019043, "global_step": 487289, "epoch": 2900} {"train_loss": -13.012259483337402, "global_step": 487290, "epoch": 2900} {"train_loss": -13.132600784301758, "global_step": 487291, "epoch": 2900} {"train_loss": -12.910652160644531, "global_step": 487292, "epoch": 2900} {"train_loss": -12.63884162902832, "global_step": 487293, "epoch": 2900} {"train_loss": -12.543891906738281, "global_step": 487294, "epoch": 2900} {"train_loss": -12.894198417663574, "global_step": 487295, "epoch": 2900} {"train_loss": -12.855257034301758, "global_step": 487296, "epoch": 2900} {"train_loss": -12.838630676269531, "global_step": 487297, "epoch": 2900} {"train_loss": -12.762782096862793, "global_step": 487298, "epoch": 2900} {"train_loss": -12.96156120300293, "global_step": 487299, "epoch": 2900} {"train_loss": -12.744863510131836, "global_step": 487300, "epoch": 2900} {"train_loss": -12.872406005859375, "global_step": 487301, "epoch": 2900} {"train_loss": -12.894270896911621, "global_step": 487302, "epoch": 2900} {"train_loss": -12.190450668334961, "global_step": 487303, "epoch": 2900} {"train_loss": -12.757425308227539, "global_step": 487304, "epoch": 2900} {"train_loss": -13.048846244812012, "global_step": 487305, "epoch": 2900} {"train_loss": -12.901544570922852, "global_step": 487306, "epoch": 2900} {"train_loss": -12.116965293884277, "global_step": 487307, "epoch": 2900} {"train_loss": -12.053269386291504, "global_step": 487308, "epoch": 2900} {"train_loss": -12.449042320251465, "global_step": 487309, "epoch": 2900} {"train_loss": -12.777355194091797, "global_step": 487310, "epoch": 2900} {"train_loss": -12.815040588378906, "global_step": 487311, "epoch": 2900} {"train_loss": -11.769140243530273, "global_step": 487312, "epoch": 2900} {"train_loss": -11.286056518554688, "global_step": 487313, "epoch": 2900} {"train_loss": -12.264241218566895, "global_step": 487314, "epoch": 2900} {"train_loss": -10.504172325134277, "global_step": 487315, "epoch": 2900} {"train_loss": -11.360688209533691, "global_step": 487316, "epoch": 2900} {"train_loss": -12.384638786315918, "global_step": 487317, "epoch": 2900} {"train_loss": -11.52462387084961, "global_step": 487318, "epoch": 2900} {"train_loss": -12.239740371704102, "global_step": 487319, "epoch": 2900} {"train_loss": -11.837684631347656, "global_step": 487320, "epoch": 2900} {"train_loss": -12.10295295715332, "global_step": 487321, "epoch": 2900} {"train_loss": -12.041230201721191, "global_step": 487322, "epoch": 2900} {"train_loss": -12.34524917602539, "global_step": 487323, "epoch": 2900} {"train_loss": -12.624982833862305, "global_step": 487324, "epoch": 2900} {"train_loss": -12.097126007080078, "global_step": 487325, "epoch": 2900} {"train_loss": -12.615884780883789, "global_step": 487326, "epoch": 2900} {"train_loss": -11.984636306762695, "global_step": 487327, "epoch": 2900} {"train_loss": -12.327033996582031, "global_step": 487328, "epoch": 2900} {"train_loss": -11.866337776184082, "global_step": 487329, "epoch": 2900} {"train_loss": -11.486516952514648, "global_step": 487330, "epoch": 2900} {"train_loss": -11.918560028076172, "global_step": 487331, "epoch": 2900} {"train_loss": -12.558616638183594, "global_step": 487332, "epoch": 2900} {"train_loss": -10.916921615600586, "global_step": 487333, "epoch": 2900} {"train_loss": -12.117179870605469, "global_step": 487334, "epoch": 2900} {"train_loss": -11.774751663208008, "global_step": 487335, "epoch": 2900} {"train_loss": -10.579800605773926, "global_step": 487336, "epoch": 2900} {"train_loss": -11.447555541992188, "global_step": 487337, "epoch": 2900} {"train_loss": -9.601876258850098, "global_step": 487338, "epoch": 2900} {"train_loss": -9.672126770019531, "global_step": 487339, "epoch": 2900} {"train_loss": -10.48838996887207, "global_step": 487340, "epoch": 2900} {"train_loss": -10.921805381774902, "global_step": 487341, "epoch": 2900} {"train_loss": -10.600506782531738, "global_step": 487342, "epoch": 2900} {"train_loss": -10.270753860473633, "global_step": 487343, "epoch": 2900} {"train_loss": -11.11886215209961, "global_step": 487344, "epoch": 2900} {"train_loss": -11.393367767333984, "global_step": 487345, "epoch": 2900} {"train_loss": -11.817776679992676, "global_step": 487346, "epoch": 2900} {"train_loss": -11.598388671875, "global_step": 487347, "epoch": 2900} {"train_loss": -11.754150390625, "global_step": 487348, "epoch": 2900} {"train_loss": -11.04513931274414, "global_step": 487349, "epoch": 2900} {"train_loss": -10.51997184753418, "global_step": 487350, "epoch": 2900} {"train_loss": -11.605555534362793, "global_step": 487351, "epoch": 2900} {"train_loss": -11.361164093017578, "global_step": 487352, "epoch": 2900} {"train_loss": -11.967227935791016, "global_step": 487353, "epoch": 2900} {"train_loss": -11.749229431152344, "global_step": 487354, "epoch": 2900} {"train_loss": -12.160745620727539, "global_step": 487355, "epoch": 2900} {"train_loss": -12.108978271484375, "global_step": 487356, "epoch": 2900} {"train_loss": -11.968031883239746, "global_step": 487357, "epoch": 2900} {"train_loss": -11.822538375854492, "global_step": 487358, "epoch": 2900} {"train_loss": -12.262956619262695, "global_step": 487359, "epoch": 2900} {"train_loss": -12.452110290527344, "global_step": 487360, "epoch": 2900} {"train_loss": -12.456951141357422, "global_step": 487361, "epoch": 2900} {"train_loss": -12.206613540649414, "global_step": 487362, "epoch": 2900} {"train_loss": -12.409367561340332, "global_step": 487363, "epoch": 2900} {"train_loss": -12.219799041748047, "global_step": 487364, "epoch": 2900} {"train_loss": -12.237548828125, "global_step": 487365, "epoch": 2900} {"train_loss": -11.91650390625, "global_step": 487366, "epoch": 2900} {"train_loss": -12.339512404941377, "global_step": 487367, "epoch": 2900, "train/sim_max_reward_0": 0.672941098535715, "train/sim_max_reward_1": 0.9264829238093458, "train/sim_max_reward_2": 0.0017109907202362135, "train/sim_max_reward_3": 0.5760481799649857, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.5379504941972564, "test/sim_max_reward_4400000": 0.9898289012125807, "test/sim_max_reward_4400001": 0.2003303460256237, "test/sim_max_reward_4400002": 0.3944025176795975, "test/sim_max_reward_4400003": 0.999786366870105, "test/sim_max_reward_4400004": 0.49596606712092856, "test/sim_max_reward_4400005": 0.968215553371518, "test/sim_max_reward_4400006": 0.1325151621523208, "test/sim_max_reward_4400007": 0.63901446857453, "test/sim_max_reward_4400008": 0.6968460599754291, "test/sim_max_reward_4400009": 0.028730941858026975, "test/sim_max_reward_4400010": 0.43403330303865806, "test/sim_max_reward_4400011": 0.303720287213991, "test/sim_max_reward_4400012": 0.9228738505497237, "test/sim_max_reward_4400013": 0.9961534475331353, "test/sim_max_reward_4400014": 0.3957045531214321, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.9819195252392772, "test/sim_max_reward_4400019": 0.20043527533352465, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.6735688696552679, "test/sim_max_reward_4400022": 0.9603947428448203, "test/sim_max_reward_4400023": 0.15052560565719766, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.5602135158908965, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.17288664795780845, "test/sim_max_reward_4400028": 1.0, "test/sim_max_reward_4400029": 1.0, "test/sim_max_reward_4400030": 0.9800517442077514, "test/sim_max_reward_4400031": 0.6556553343424175, "test/sim_max_reward_4400032": 0.04190002516070465, "test/sim_max_reward_4400033": 0.1395532021994166, "test/sim_max_reward_4400034": 0.500276454678336, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.9653672068621248, "test/sim_max_reward_4400037": 0.980591799688598, "test/sim_max_reward_4400038": 0.2898641254301575, "test/sim_max_reward_4400039": 0.4117319922459178, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.4344581211359747, "test/sim_max_reward_4400042": 0.34045338974955314, "test/sim_max_reward_4400043": 0.011032022751590697, "test/sim_max_reward_4400044": 0.9458143886512808, "test/sim_max_reward_4400045": 0.9961855821697708, "test/sim_max_reward_4400046": 0.9852786778626359, "test/sim_max_reward_4400047": 0.9925879562557803, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.6191889478712566, "test/mean_score": 0.5050680808449352, "val_loss": 313993.375, "train_action_mse_error": 1.274232029914856} {"train_loss": -12.352909088134766, "global_step": 487368, "epoch": 2901} {"train_loss": -12.105323791503906, "global_step": 487369, "epoch": 2901} {"train_loss": -12.39686393737793, "global_step": 487370, "epoch": 2901} {"train_loss": -12.324135780334473, "global_step": 487371, "epoch": 2901} {"train_loss": -12.417425155639648, "global_step": 487372, "epoch": 2901} {"train_loss": -12.580078125, "global_step": 487373, "epoch": 2901} {"train_loss": -12.642382621765137, "global_step": 487374, "epoch": 2901} {"train_loss": -12.45317268371582, "global_step": 487375, "epoch": 2901} {"train_loss": -12.163958549499512, "global_step": 487376, "epoch": 2901} {"train_loss": -12.446571350097656, "global_step": 487377, "epoch": 2901} {"train_loss": -12.350639343261719, "global_step": 487378, "epoch": 2901} {"train_loss": -12.509321212768555, "global_step": 487379, "epoch": 2901} {"train_loss": -12.423538208007812, "global_step": 487380, "epoch": 2901} {"train_loss": -12.36220932006836, "global_step": 487381, "epoch": 2901} {"train_loss": -12.388748168945312, "global_step": 487382, "epoch": 2901} {"train_loss": -12.563881874084473, "global_step": 487383, "epoch": 2901} {"train_loss": -12.424226760864258, "global_step": 487384, "epoch": 2901} {"train_loss": -12.598859786987305, "global_step": 487385, "epoch": 2901} {"train_loss": -12.465578079223633, "global_step": 487386, "epoch": 2901} {"train_loss": -12.67391586303711, "global_step": 487387, "epoch": 2901} {"train_loss": -12.29053020477295, "global_step": 487388, "epoch": 2901} {"train_loss": -12.79403018951416, "global_step": 487389, "epoch": 2901} {"train_loss": -12.553681373596191, "global_step": 487390, "epoch": 2901} {"train_loss": -12.698705673217773, "global_step": 487391, "epoch": 2901} {"train_loss": -12.666387557983398, "global_step": 487392, "epoch": 2901} {"train_loss": -12.546852111816406, "global_step": 487393, "epoch": 2901} {"train_loss": -12.819087982177734, "global_step": 487394, "epoch": 2901} {"train_loss": -12.569253921508789, "global_step": 487395, "epoch": 2901} {"train_loss": -12.79729175567627, "global_step": 487396, "epoch": 2901} {"train_loss": -12.707846641540527, "global_step": 487397, "epoch": 2901} {"train_loss": -12.641523361206055, "global_step": 487398, "epoch": 2901} {"train_loss": -12.576005935668945, "global_step": 487399, "epoch": 2901} {"train_loss": -12.236842155456543, "global_step": 487400, "epoch": 2901} {"train_loss": -12.713497161865234, "global_step": 487401, "epoch": 2901} {"train_loss": -12.800504684448242, "global_step": 487402, "epoch": 2901} {"train_loss": -12.262616157531738, "global_step": 487403, "epoch": 2901} {"train_loss": -12.855547904968262, "global_step": 487404, "epoch": 2901} {"train_loss": -12.509969711303711, "global_step": 487405, "epoch": 2901} {"train_loss": -12.974411010742188, "global_step": 487406, "epoch": 2901} {"train_loss": -12.608235359191895, "global_step": 487407, "epoch": 2901} {"train_loss": -12.562087059020996, "global_step": 487408, "epoch": 2901} {"train_loss": -12.725082397460938, "global_step": 487409, "epoch": 2901} {"train_loss": -12.544193267822266, "global_step": 487410, "epoch": 2901} {"train_loss": -12.669881820678711, "global_step": 487411, "epoch": 2901} {"train_loss": -12.698598861694336, "global_step": 487412, "epoch": 2901} {"train_loss": -12.849327087402344, "global_step": 487413, "epoch": 2901} {"train_loss": -12.575239181518555, "global_step": 487414, "epoch": 2901} {"train_loss": -12.65818977355957, "global_step": 487415, "epoch": 2901} {"train_loss": -12.663992881774902, "global_step": 487416, "epoch": 2901} {"train_loss": -12.27621841430664, "global_step": 487417, "epoch": 2901} {"train_loss": -11.861364364624023, "global_step": 487418, "epoch": 2901} {"train_loss": -12.67350959777832, "global_step": 487419, "epoch": 2901} {"train_loss": -12.19228744506836, "global_step": 487420, "epoch": 2901} {"train_loss": -12.497549057006836, "global_step": 487421, "epoch": 2901} {"train_loss": -12.200590133666992, "global_step": 487422, "epoch": 2901} {"train_loss": -12.760992050170898, "global_step": 487423, "epoch": 2901} {"train_loss": -11.656604766845703, "global_step": 487424, "epoch": 2901} {"train_loss": -11.81182861328125, "global_step": 487425, "epoch": 2901} {"train_loss": -12.238252639770508, "global_step": 487426, "epoch": 2901} {"train_loss": -11.94174575805664, "global_step": 487427, "epoch": 2901} {"train_loss": -11.596558570861816, "global_step": 487428, "epoch": 2901} {"train_loss": -12.217103958129883, "global_step": 487429, "epoch": 2901} {"train_loss": -12.000667572021484, "global_step": 487430, "epoch": 2901} {"train_loss": -12.250792503356934, "global_step": 487431, "epoch": 2901} {"train_loss": -11.56009292602539, "global_step": 487432, "epoch": 2901} {"train_loss": -12.162612915039062, "global_step": 487433, "epoch": 2901} {"train_loss": -11.948869705200195, "global_step": 487434, "epoch": 2901} {"train_loss": -11.441902160644531, "global_step": 487435, "epoch": 2901} {"train_loss": -11.961021423339844, "global_step": 487436, "epoch": 2901} {"train_loss": -12.508391380310059, "global_step": 487437, "epoch": 2901} {"train_loss": -11.446540832519531, "global_step": 487438, "epoch": 2901} {"train_loss": -12.291438102722168, "global_step": 487439, "epoch": 2901} {"train_loss": -11.393046379089355, "global_step": 487440, "epoch": 2901} {"train_loss": -12.240516662597656, "global_step": 487441, "epoch": 2901} {"train_loss": -11.195047378540039, "global_step": 487442, "epoch": 2901} {"train_loss": -12.644003868103027, "global_step": 487443, "epoch": 2901} {"train_loss": -11.704239845275879, "global_step": 487444, "epoch": 2901} {"train_loss": -12.275114059448242, "global_step": 487445, "epoch": 2901} {"train_loss": -11.546388626098633, "global_step": 487446, "epoch": 2901} {"train_loss": -12.438152313232422, "global_step": 487447, "epoch": 2901} {"train_loss": -12.373981475830078, "global_step": 487448, "epoch": 2901} {"train_loss": -11.982361793518066, "global_step": 487449, "epoch": 2901} {"train_loss": -11.279797554016113, "global_step": 487450, "epoch": 2901} {"train_loss": -11.731151580810547, "global_step": 487451, "epoch": 2901} {"train_loss": -12.264480590820312, "global_step": 487452, "epoch": 2901} {"train_loss": -11.781800270080566, "global_step": 487453, "epoch": 2901} {"train_loss": -12.48386001586914, "global_step": 487454, "epoch": 2901} {"train_loss": -12.344714164733887, "global_step": 487455, "epoch": 2901} {"train_loss": -12.326899528503418, "global_step": 487456, "epoch": 2901} {"train_loss": -12.373910903930664, "global_step": 487457, "epoch": 2901} {"train_loss": -12.457108497619629, "global_step": 487458, "epoch": 2901} {"train_loss": -12.599465370178223, "global_step": 487459, "epoch": 2901} {"train_loss": -12.657485008239746, "global_step": 487460, "epoch": 2901} {"train_loss": -12.37719440460205, "global_step": 487461, "epoch": 2901} {"train_loss": -12.349408149719238, "global_step": 487462, "epoch": 2901} {"train_loss": -12.264738082885742, "global_step": 487463, "epoch": 2901} {"train_loss": -12.32691764831543, "global_step": 487464, "epoch": 2901} {"train_loss": -12.362140655517578, "global_step": 487465, "epoch": 2901} {"train_loss": -12.403708457946777, "global_step": 487466, "epoch": 2901} {"train_loss": -12.407398223876953, "global_step": 487467, "epoch": 2901} {"train_loss": -11.760551452636719, "global_step": 487468, "epoch": 2901} {"train_loss": -11.346576690673828, "global_step": 487469, "epoch": 2901} {"train_loss": -11.341809272766113, "global_step": 487470, "epoch": 2901} {"train_loss": -11.531116485595703, "global_step": 487471, "epoch": 2901} {"train_loss": -10.611013412475586, "global_step": 487472, "epoch": 2901} {"train_loss": -10.39385986328125, "global_step": 487473, "epoch": 2901} {"train_loss": -10.908177375793457, "global_step": 487474, "epoch": 2901} {"train_loss": -10.204156875610352, "global_step": 487475, "epoch": 2901} {"train_loss": -11.415029525756836, "global_step": 487476, "epoch": 2901} {"train_loss": -10.611838340759277, "global_step": 487477, "epoch": 2901} {"train_loss": -11.106584548950195, "global_step": 487478, "epoch": 2901} {"train_loss": -10.787760734558105, "global_step": 487479, "epoch": 2901} {"train_loss": -11.296802520751953, "global_step": 487480, "epoch": 2901} {"train_loss": -11.51073169708252, "global_step": 487481, "epoch": 2901} {"train_loss": -10.801393508911133, "global_step": 487482, "epoch": 2901} {"train_loss": -11.260807037353516, "global_step": 487483, "epoch": 2901} {"train_loss": -11.179515838623047, "global_step": 487484, "epoch": 2901} {"train_loss": -11.986896514892578, "global_step": 487485, "epoch": 2901} {"train_loss": -11.763914108276367, "global_step": 487486, "epoch": 2901} {"train_loss": -11.532147407531738, "global_step": 487487, "epoch": 2901} {"train_loss": -11.172464370727539, "global_step": 487488, "epoch": 2901} {"train_loss": -11.944229125976562, "global_step": 487489, "epoch": 2901} {"train_loss": -11.487282752990723, "global_step": 487490, "epoch": 2901} {"train_loss": -11.541398048400879, "global_step": 487491, "epoch": 2901} {"train_loss": -11.617389678955078, "global_step": 487492, "epoch": 2901} {"train_loss": -11.39968490600586, "global_step": 487493, "epoch": 2901} {"train_loss": -11.465047836303711, "global_step": 487494, "epoch": 2901} {"train_loss": -11.447778701782227, "global_step": 487495, "epoch": 2901} {"train_loss": -11.427762985229492, "global_step": 487496, "epoch": 2901} {"train_loss": -12.10641860961914, "global_step": 487497, "epoch": 2901} {"train_loss": -11.90229606628418, "global_step": 487498, "epoch": 2901} {"train_loss": -12.134970664978027, "global_step": 487499, "epoch": 2901} {"train_loss": -12.150334358215332, "global_step": 487500, "epoch": 2901} {"train_loss": -12.20663833618164, "global_step": 487501, "epoch": 2901} {"train_loss": -12.223007202148438, "global_step": 487502, "epoch": 2901} {"train_loss": -12.147549629211426, "global_step": 487503, "epoch": 2901} {"train_loss": -11.998069763183594, "global_step": 487504, "epoch": 2901} {"train_loss": -12.202581405639648, "global_step": 487505, "epoch": 2901} {"train_loss": -12.571627616882324, "global_step": 487506, "epoch": 2901} {"train_loss": -12.116315841674805, "global_step": 487507, "epoch": 2901} {"train_loss": -12.688514709472656, "global_step": 487508, "epoch": 2901} {"train_loss": -12.339040756225586, "global_step": 487509, "epoch": 2901} {"train_loss": -12.487112998962402, "global_step": 487510, "epoch": 2901} {"train_loss": -12.552057266235352, "global_step": 487511, "epoch": 2901} {"train_loss": -12.639606475830078, "global_step": 487512, "epoch": 2901} {"train_loss": -12.713476181030273, "global_step": 487513, "epoch": 2901} {"train_loss": -12.48092269897461, "global_step": 487514, "epoch": 2901} {"train_loss": -12.45085334777832, "global_step": 487515, "epoch": 2901} {"train_loss": -12.674467086791992, "global_step": 487516, "epoch": 2901} {"train_loss": -12.443836212158203, "global_step": 487517, "epoch": 2901} {"train_loss": -12.62295150756836, "global_step": 487518, "epoch": 2901} {"train_loss": -12.661659240722656, "global_step": 487519, "epoch": 2901} {"train_loss": -12.649795532226562, "global_step": 487520, "epoch": 2901} {"train_loss": -12.7803373336792, "global_step": 487521, "epoch": 2901} {"train_loss": -12.440370559692383, "global_step": 487522, "epoch": 2901} {"train_loss": -12.354406356811523, "global_step": 487523, "epoch": 2901} {"train_loss": -12.056926727294922, "global_step": 487524, "epoch": 2901} {"train_loss": -12.725875854492188, "global_step": 487525, "epoch": 2901} {"train_loss": -12.280153274536133, "global_step": 487526, "epoch": 2901} {"train_loss": -12.749883651733398, "global_step": 487527, "epoch": 2901} {"train_loss": -12.427988052368164, "global_step": 487528, "epoch": 2901} {"train_loss": -12.78726863861084, "global_step": 487529, "epoch": 2901} {"train_loss": -12.58346176147461, "global_step": 487530, "epoch": 2901} {"train_loss": -12.58846664428711, "global_step": 487531, "epoch": 2901} {"train_loss": -12.776725769042969, "global_step": 487532, "epoch": 2901} {"train_loss": -12.826641082763672, "global_step": 487533, "epoch": 2901} {"train_loss": -12.780599594116211, "global_step": 487534, "epoch": 2901} {"train_loss": -12.180195223717462, "global_step": 487535, "epoch": 2901, "val_loss": 316498.78125} {"train_loss": -12.912466049194336, "global_step": 487536, "epoch": 2902} {"train_loss": -12.933187484741211, "global_step": 487537, "epoch": 2902} {"train_loss": -12.74020004272461, "global_step": 487538, "epoch": 2902} {"train_loss": -12.724200248718262, "global_step": 487539, "epoch": 2902} {"train_loss": -12.842662811279297, "global_step": 487540, "epoch": 2902} {"train_loss": -12.74629020690918, "global_step": 487541, "epoch": 2902} {"train_loss": -12.716551780700684, "global_step": 487542, "epoch": 2902} {"train_loss": -12.73141098022461, "global_step": 487543, "epoch": 2902} {"train_loss": -12.796993255615234, "global_step": 487544, "epoch": 2902} {"train_loss": -12.777772903442383, "global_step": 487545, "epoch": 2902} {"train_loss": -12.612070083618164, "global_step": 487546, "epoch": 2902} {"train_loss": -12.700098991394043, "global_step": 487547, "epoch": 2902} {"train_loss": -12.95993709564209, "global_step": 487548, "epoch": 2902} {"train_loss": -12.865702629089355, "global_step": 487549, "epoch": 2902} {"train_loss": -12.425546646118164, "global_step": 487550, "epoch": 2902} {"train_loss": -12.649041175842285, "global_step": 487551, "epoch": 2902} {"train_loss": -12.879127502441406, "global_step": 487552, "epoch": 2902} {"train_loss": -12.688209533691406, "global_step": 487553, "epoch": 2902} {"train_loss": -12.791264533996582, "global_step": 487554, "epoch": 2902} {"train_loss": -12.843231201171875, "global_step": 487555, "epoch": 2902} {"train_loss": -12.54671859741211, "global_step": 487556, "epoch": 2902} {"train_loss": -12.78615951538086, "global_step": 487557, "epoch": 2902} {"train_loss": -12.785857200622559, "global_step": 487558, "epoch": 2902} {"train_loss": -12.124143600463867, "global_step": 487559, "epoch": 2902} {"train_loss": -12.845459938049316, "global_step": 487560, "epoch": 2902} {"train_loss": -12.455202102661133, "global_step": 487561, "epoch": 2902} {"train_loss": -12.16323471069336, "global_step": 487562, "epoch": 2902} {"train_loss": -12.765239715576172, "global_step": 487563, "epoch": 2902} {"train_loss": -12.579294204711914, "global_step": 487564, "epoch": 2902} {"train_loss": -12.70793342590332, "global_step": 487565, "epoch": 2902} {"train_loss": -12.857253074645996, "global_step": 487566, "epoch": 2902} {"train_loss": -12.531194686889648, "global_step": 487567, "epoch": 2902} {"train_loss": -12.953230857849121, "global_step": 487568, "epoch": 2902} {"train_loss": -12.858925819396973, "global_step": 487569, "epoch": 2902} {"train_loss": -12.785818099975586, "global_step": 487570, "epoch": 2902} {"train_loss": -12.944485664367676, "global_step": 487571, "epoch": 2902} {"train_loss": -12.74720573425293, "global_step": 487572, "epoch": 2902} {"train_loss": -12.76253890991211, "global_step": 487573, "epoch": 2902} {"train_loss": -12.808107376098633, "global_step": 487574, "epoch": 2902} {"train_loss": -12.953707695007324, "global_step": 487575, "epoch": 2902} {"train_loss": -12.8756103515625, "global_step": 487576, "epoch": 2902} {"train_loss": -12.804741859436035, "global_step": 487577, "epoch": 2902} {"train_loss": -13.173233032226562, "global_step": 487578, "epoch": 2902} {"train_loss": -12.909408569335938, "global_step": 487579, "epoch": 2902} {"train_loss": -12.714303970336914, "global_step": 487580, "epoch": 2902} {"train_loss": -12.935712814331055, "global_step": 487581, "epoch": 2902} {"train_loss": -12.894756317138672, "global_step": 487582, "epoch": 2902} {"train_loss": -12.44211196899414, "global_step": 487583, "epoch": 2902} {"train_loss": -12.891989707946777, "global_step": 487584, "epoch": 2902} {"train_loss": -12.266361236572266, "global_step": 487585, "epoch": 2902} {"train_loss": -12.630254745483398, "global_step": 487586, "epoch": 2902} {"train_loss": -12.695926666259766, "global_step": 487587, "epoch": 2902} {"train_loss": -12.139198303222656, "global_step": 487588, "epoch": 2902} {"train_loss": -12.633245468139648, "global_step": 487589, "epoch": 2902} {"train_loss": -13.018327713012695, "global_step": 487590, "epoch": 2902} {"train_loss": -11.69328784942627, "global_step": 487591, "epoch": 2902} {"train_loss": -12.580954551696777, "global_step": 487592, "epoch": 2902} {"train_loss": -12.600604057312012, "global_step": 487593, "epoch": 2902} {"train_loss": -12.275246620178223, "global_step": 487594, "epoch": 2902} {"train_loss": -12.104927062988281, "global_step": 487595, "epoch": 2902} {"train_loss": -12.440632820129395, "global_step": 487596, "epoch": 2902} {"train_loss": -12.61429214477539, "global_step": 487597, "epoch": 2902} {"train_loss": -12.437921524047852, "global_step": 487598, "epoch": 2902} {"train_loss": -12.213105201721191, "global_step": 487599, "epoch": 2902} {"train_loss": -12.388580322265625, "global_step": 487600, "epoch": 2902} {"train_loss": -12.817275047302246, "global_step": 487601, "epoch": 2902} {"train_loss": -12.677967071533203, "global_step": 487602, "epoch": 2902} {"train_loss": -12.590621948242188, "global_step": 487603, "epoch": 2902} {"train_loss": -12.748318672180176, "global_step": 487604, "epoch": 2902} {"train_loss": -12.657440185546875, "global_step": 487605, "epoch": 2902} {"train_loss": -12.561734199523926, "global_step": 487606, "epoch": 2902} {"train_loss": -12.612807273864746, "global_step": 487607, "epoch": 2902} {"train_loss": -11.96845531463623, "global_step": 487608, "epoch": 2902} {"train_loss": -12.401477813720703, "global_step": 487609, "epoch": 2902} {"train_loss": -12.115266799926758, "global_step": 487610, "epoch": 2902} {"train_loss": -10.450098037719727, "global_step": 487611, "epoch": 2902} {"train_loss": -12.618194580078125, "global_step": 487612, "epoch": 2902} {"train_loss": -11.390409469604492, "global_step": 487613, "epoch": 2902} {"train_loss": -10.109890937805176, "global_step": 487614, "epoch": 2902} {"train_loss": -12.111723899841309, "global_step": 487615, "epoch": 2902} {"train_loss": -9.424860954284668, "global_step": 487616, "epoch": 2902} {"train_loss": -9.602266311645508, "global_step": 487617, "epoch": 2902} {"train_loss": -10.867687225341797, "global_step": 487618, "epoch": 2902} {"train_loss": -11.111273765563965, "global_step": 487619, "epoch": 2902} {"train_loss": -10.183815956115723, "global_step": 487620, "epoch": 2902} {"train_loss": -9.386667251586914, "global_step": 487621, "epoch": 2902} {"train_loss": -9.97706413269043, "global_step": 487622, "epoch": 2902} {"train_loss": -10.786951065063477, "global_step": 487623, "epoch": 2902} {"train_loss": -10.412761688232422, "global_step": 487624, "epoch": 2902} {"train_loss": -10.511934280395508, "global_step": 487625, "epoch": 2902} {"train_loss": -11.6874418258667, "global_step": 487626, "epoch": 2902} {"train_loss": -11.298648834228516, "global_step": 487627, "epoch": 2902} {"train_loss": -10.711933135986328, "global_step": 487628, "epoch": 2902} {"train_loss": -10.846169471740723, "global_step": 487629, "epoch": 2902} {"train_loss": -10.448789596557617, "global_step": 487630, "epoch": 2902} {"train_loss": -11.810091018676758, "global_step": 487631, "epoch": 2902} {"train_loss": -9.9876127243042, "global_step": 487632, "epoch": 2902} {"train_loss": -11.288763999938965, "global_step": 487633, "epoch": 2902} {"train_loss": -10.770895957946777, "global_step": 487634, "epoch": 2902} {"train_loss": -11.810117721557617, "global_step": 487635, "epoch": 2902} {"train_loss": -11.407816886901855, "global_step": 487636, "epoch": 2902} {"train_loss": -11.238245010375977, "global_step": 487637, "epoch": 2902} {"train_loss": -11.541824340820312, "global_step": 487638, "epoch": 2902} {"train_loss": -11.450645446777344, "global_step": 487639, "epoch": 2902} {"train_loss": -10.907509803771973, "global_step": 487640, "epoch": 2902} {"train_loss": -11.639852523803711, "global_step": 487641, "epoch": 2902} {"train_loss": -11.077346801757812, "global_step": 487642, "epoch": 2902} {"train_loss": -11.204575538635254, "global_step": 487643, "epoch": 2902} {"train_loss": -11.487457275390625, "global_step": 487644, "epoch": 2902} {"train_loss": -11.676300048828125, "global_step": 487645, "epoch": 2902} {"train_loss": -12.102873802185059, "global_step": 487646, "epoch": 2902} {"train_loss": -12.142888069152832, "global_step": 487647, "epoch": 2902} {"train_loss": -11.594305038452148, "global_step": 487648, "epoch": 2902} {"train_loss": -11.61536693572998, "global_step": 487649, "epoch": 2902} {"train_loss": -11.359907150268555, "global_step": 487650, "epoch": 2902} {"train_loss": -11.899717330932617, "global_step": 487651, "epoch": 2902} {"train_loss": -10.599958419799805, "global_step": 487652, "epoch": 2902} {"train_loss": -11.557012557983398, "global_step": 487653, "epoch": 2902} {"train_loss": -11.565940856933594, "global_step": 487654, "epoch": 2902} {"train_loss": -11.377443313598633, "global_step": 487655, "epoch": 2902} {"train_loss": -12.341110229492188, "global_step": 487656, "epoch": 2902} {"train_loss": -11.401657104492188, "global_step": 487657, "epoch": 2902} {"train_loss": -11.960116386413574, "global_step": 487658, "epoch": 2902} {"train_loss": -12.409151077270508, "global_step": 487659, "epoch": 2902} {"train_loss": -12.04975700378418, "global_step": 487660, "epoch": 2902} {"train_loss": -12.275060653686523, "global_step": 487661, "epoch": 2902} {"train_loss": -12.201990127563477, "global_step": 487662, "epoch": 2902} {"train_loss": -12.32116985321045, "global_step": 487663, "epoch": 2902} {"train_loss": -11.90999984741211, "global_step": 487664, "epoch": 2902} {"train_loss": -12.657743453979492, "global_step": 487665, "epoch": 2902} {"train_loss": -12.291220664978027, "global_step": 487666, "epoch": 2902} {"train_loss": -12.255664825439453, "global_step": 487667, "epoch": 2902} {"train_loss": -12.532876014709473, "global_step": 487668, "epoch": 2902} {"train_loss": -12.47719955444336, "global_step": 487669, "epoch": 2902} {"train_loss": -12.514501571655273, "global_step": 487670, "epoch": 2902} {"train_loss": -12.321955680847168, "global_step": 487671, "epoch": 2902} {"train_loss": -12.462587356567383, "global_step": 487672, "epoch": 2902} {"train_loss": -12.816787719726562, "global_step": 487673, "epoch": 2902} {"train_loss": -12.436073303222656, "global_step": 487674, "epoch": 2902} {"train_loss": -12.425065040588379, "global_step": 487675, "epoch": 2902} {"train_loss": -12.394689559936523, "global_step": 487676, "epoch": 2902} {"train_loss": -12.868711471557617, "global_step": 487677, "epoch": 2902} {"train_loss": -12.405155181884766, "global_step": 487678, "epoch": 2902} {"train_loss": -12.33175277709961, "global_step": 487679, "epoch": 2902} {"train_loss": -12.314416885375977, "global_step": 487680, "epoch": 2902} {"train_loss": -12.413411140441895, "global_step": 487681, "epoch": 2902} {"train_loss": -12.391719818115234, "global_step": 487682, "epoch": 2902} {"train_loss": -12.448171615600586, "global_step": 487683, "epoch": 2902} {"train_loss": -12.402567863464355, "global_step": 487684, "epoch": 2902} {"train_loss": -12.182515144348145, "global_step": 487685, "epoch": 2902} {"train_loss": -12.514095306396484, "global_step": 487686, "epoch": 2902} {"train_loss": -12.5550537109375, "global_step": 487687, "epoch": 2902} {"train_loss": -12.542655944824219, "global_step": 487688, "epoch": 2902} {"train_loss": -12.358844757080078, "global_step": 487689, "epoch": 2902} {"train_loss": -12.674460411071777, "global_step": 487690, "epoch": 2902} {"train_loss": -12.545244216918945, "global_step": 487691, "epoch": 2902} {"train_loss": -12.736580848693848, "global_step": 487692, "epoch": 2902} {"train_loss": -12.50741958618164, "global_step": 487693, "epoch": 2902} {"train_loss": -12.782207489013672, "global_step": 487694, "epoch": 2902} {"train_loss": -12.782328605651855, "global_step": 487695, "epoch": 2902} {"train_loss": -12.591644287109375, "global_step": 487696, "epoch": 2902} {"train_loss": -12.5958251953125, "global_step": 487697, "epoch": 2902} {"train_loss": -12.908614158630371, "global_step": 487698, "epoch": 2902} {"train_loss": -12.579975128173828, "global_step": 487699, "epoch": 2902} {"train_loss": -12.94047737121582, "global_step": 487700, "epoch": 2902} {"train_loss": -12.72427749633789, "global_step": 487701, "epoch": 2902} {"train_loss": -12.683481216430664, "global_step": 487702, "epoch": 2902} {"train_loss": -12.176573821476527, "global_step": 487703, "epoch": 2902, "val_loss": 313808.25} {"train_loss": -12.666260719299316, "global_step": 487704, "epoch": 2903} {"train_loss": -12.599482536315918, "global_step": 487705, "epoch": 2903} {"train_loss": -12.687801361083984, "global_step": 487706, "epoch": 2903} {"train_loss": -12.815933227539062, "global_step": 487707, "epoch": 2903} {"train_loss": -12.808438301086426, "global_step": 487708, "epoch": 2903} {"train_loss": -12.694765090942383, "global_step": 487709, "epoch": 2903} {"train_loss": -12.76251220703125, "global_step": 487710, "epoch": 2903} {"train_loss": -12.357760429382324, "global_step": 487711, "epoch": 2903} {"train_loss": -12.866825103759766, "global_step": 487712, "epoch": 2903} {"train_loss": -12.630653381347656, "global_step": 487713, "epoch": 2903} {"train_loss": -12.837492942810059, "global_step": 487714, "epoch": 2903} {"train_loss": -12.712654113769531, "global_step": 487715, "epoch": 2903} {"train_loss": -12.763672828674316, "global_step": 487716, "epoch": 2903} {"train_loss": -12.639034271240234, "global_step": 487717, "epoch": 2903} {"train_loss": -12.816580772399902, "global_step": 487718, "epoch": 2903} {"train_loss": -12.743419647216797, "global_step": 487719, "epoch": 2903} {"train_loss": -12.760008811950684, "global_step": 487720, "epoch": 2903} {"train_loss": -12.848231315612793, "global_step": 487721, "epoch": 2903} {"train_loss": -12.912176132202148, "global_step": 487722, "epoch": 2903} {"train_loss": -12.76364803314209, "global_step": 487723, "epoch": 2903} {"train_loss": -12.885503768920898, "global_step": 487724, "epoch": 2903} {"train_loss": -12.640790939331055, "global_step": 487725, "epoch": 2903} {"train_loss": -12.564699172973633, "global_step": 487726, "epoch": 2903} {"train_loss": -13.049182891845703, "global_step": 487727, "epoch": 2903} {"train_loss": -12.82725715637207, "global_step": 487728, "epoch": 2903} {"train_loss": -12.834741592407227, "global_step": 487729, "epoch": 2903} {"train_loss": -12.937171936035156, "global_step": 487730, "epoch": 2903} {"train_loss": -12.829176902770996, "global_step": 487731, "epoch": 2903} {"train_loss": -12.908477783203125, "global_step": 487732, "epoch": 2903} {"train_loss": -12.873725891113281, "global_step": 487733, "epoch": 2903} {"train_loss": -13.031126022338867, "global_step": 487734, "epoch": 2903} {"train_loss": -12.925148010253906, "global_step": 487735, "epoch": 2903} {"train_loss": -13.016376495361328, "global_step": 487736, "epoch": 2903} {"train_loss": -12.869930267333984, "global_step": 487737, "epoch": 2903} {"train_loss": -13.063963890075684, "global_step": 487738, "epoch": 2903} {"train_loss": -12.728919982910156, "global_step": 487739, "epoch": 2903} {"train_loss": -12.930484771728516, "global_step": 487740, "epoch": 2903} {"train_loss": -12.948465347290039, "global_step": 487741, "epoch": 2903} {"train_loss": -13.088662147521973, "global_step": 487742, "epoch": 2903} {"train_loss": -13.076330184936523, "global_step": 487743, "epoch": 2903} {"train_loss": -12.975517272949219, "global_step": 487744, "epoch": 2903} {"train_loss": -12.767477989196777, "global_step": 487745, "epoch": 2903} {"train_loss": -12.925578117370605, "global_step": 487746, "epoch": 2903} {"train_loss": -12.841733932495117, "global_step": 487747, "epoch": 2903} {"train_loss": -13.016227722167969, "global_step": 487748, "epoch": 2903} {"train_loss": -13.090877532958984, "global_step": 487749, "epoch": 2903} {"train_loss": -12.853214263916016, "global_step": 487750, "epoch": 2903} {"train_loss": -12.966453552246094, "global_step": 487751, "epoch": 2903} {"train_loss": -13.014025688171387, "global_step": 487752, "epoch": 2903} {"train_loss": -12.998954772949219, "global_step": 487753, "epoch": 2903} {"train_loss": -12.972450256347656, "global_step": 487754, "epoch": 2903} {"train_loss": -13.03724479675293, "global_step": 487755, "epoch": 2903} {"train_loss": -13.147409439086914, "global_step": 487756, "epoch": 2903} {"train_loss": -13.02238655090332, "global_step": 487757, "epoch": 2903} {"train_loss": -12.554498672485352, "global_step": 487758, "epoch": 2903} {"train_loss": -12.308486938476562, "global_step": 487759, "epoch": 2903} {"train_loss": -12.951925277709961, "global_step": 487760, "epoch": 2903} {"train_loss": -12.627748489379883, "global_step": 487761, "epoch": 2903} {"train_loss": -12.933122634887695, "global_step": 487762, "epoch": 2903} {"train_loss": -12.884510040283203, "global_step": 487763, "epoch": 2903} {"train_loss": -13.034028053283691, "global_step": 487764, "epoch": 2903} {"train_loss": -13.072900772094727, "global_step": 487765, "epoch": 2903} {"train_loss": -12.937664985656738, "global_step": 487766, "epoch": 2903} {"train_loss": -12.920604705810547, "global_step": 487767, "epoch": 2903} {"train_loss": -12.901473999023438, "global_step": 487768, "epoch": 2903} {"train_loss": -12.328439712524414, "global_step": 487769, "epoch": 2903} {"train_loss": -12.492115020751953, "global_step": 487770, "epoch": 2903} {"train_loss": -11.467310905456543, "global_step": 487771, "epoch": 2903} {"train_loss": -12.812344551086426, "global_step": 487772, "epoch": 2903} {"train_loss": -11.834003448486328, "global_step": 487773, "epoch": 2903} {"train_loss": -11.936582565307617, "global_step": 487774, "epoch": 2903} {"train_loss": -12.396746635437012, "global_step": 487775, "epoch": 2903} {"train_loss": -11.781499862670898, "global_step": 487776, "epoch": 2903} {"train_loss": -10.414710998535156, "global_step": 487777, "epoch": 2903} {"train_loss": -10.158031463623047, "global_step": 487778, "epoch": 2903} {"train_loss": -9.571659088134766, "global_step": 487779, "epoch": 2903} {"train_loss": -11.863667488098145, "global_step": 487780, "epoch": 2903} {"train_loss": -10.04067611694336, "global_step": 487781, "epoch": 2903} {"train_loss": -9.39651870727539, "global_step": 487782, "epoch": 2903} {"train_loss": -10.558839797973633, "global_step": 487783, "epoch": 2903} {"train_loss": -7.9237775802612305, "global_step": 487784, "epoch": 2903} {"train_loss": -9.175495147705078, "global_step": 487785, "epoch": 2903} {"train_loss": -8.532998085021973, "global_step": 487786, "epoch": 2903} {"train_loss": -9.780356407165527, "global_step": 487787, "epoch": 2903} {"train_loss": -9.323662757873535, "global_step": 487788, "epoch": 2903} {"train_loss": -10.015787124633789, "global_step": 487789, "epoch": 2903} {"train_loss": -10.178095817565918, "global_step": 487790, "epoch": 2903} {"train_loss": -9.989744186401367, "global_step": 487791, "epoch": 2903} {"train_loss": -11.470327377319336, "global_step": 487792, "epoch": 2903} {"train_loss": -9.638948440551758, "global_step": 487793, "epoch": 2903} {"train_loss": -11.42985725402832, "global_step": 487794, "epoch": 2903} {"train_loss": -10.30068302154541, "global_step": 487795, "epoch": 2903} {"train_loss": -10.622512817382812, "global_step": 487796, "epoch": 2903} {"train_loss": -10.818282127380371, "global_step": 487797, "epoch": 2903} {"train_loss": -9.943403244018555, "global_step": 487798, "epoch": 2903} {"train_loss": -11.437400817871094, "global_step": 487799, "epoch": 2903} {"train_loss": -10.572748184204102, "global_step": 487800, "epoch": 2903} {"train_loss": -11.93763542175293, "global_step": 487801, "epoch": 2903} {"train_loss": -9.900350570678711, "global_step": 487802, "epoch": 2903} {"train_loss": -10.469541549682617, "global_step": 487803, "epoch": 2903} {"train_loss": -11.343881607055664, "global_step": 487804, "epoch": 2903} {"train_loss": -10.137359619140625, "global_step": 487805, "epoch": 2903} {"train_loss": -11.428784370422363, "global_step": 487806, "epoch": 2903} {"train_loss": -8.768702507019043, "global_step": 487807, "epoch": 2903} {"train_loss": -11.533477783203125, "global_step": 487808, "epoch": 2903} {"train_loss": -8.899150848388672, "global_step": 487809, "epoch": 2903} {"train_loss": -9.819087028503418, "global_step": 487810, "epoch": 2903} {"train_loss": -9.863462448120117, "global_step": 487811, "epoch": 2903} {"train_loss": -10.644548416137695, "global_step": 487812, "epoch": 2903} {"train_loss": -8.78841495513916, "global_step": 487813, "epoch": 2903} {"train_loss": -8.742820739746094, "global_step": 487814, "epoch": 2903} {"train_loss": -7.109076499938965, "global_step": 487815, "epoch": 2903} {"train_loss": -9.834638595581055, "global_step": 487816, "epoch": 2903} {"train_loss": -10.584490776062012, "global_step": 487817, "epoch": 2903} {"train_loss": -8.078426361083984, "global_step": 487818, "epoch": 2903} {"train_loss": -8.543338775634766, "global_step": 487819, "epoch": 2903} {"train_loss": -10.463823318481445, "global_step": 487820, "epoch": 2903} {"train_loss": -10.568782806396484, "global_step": 487821, "epoch": 2903} {"train_loss": -10.198437690734863, "global_step": 487822, "epoch": 2903} {"train_loss": -10.754609107971191, "global_step": 487823, "epoch": 2903} {"train_loss": -10.642778396606445, "global_step": 487824, "epoch": 2903} {"train_loss": -9.830846786499023, "global_step": 487825, "epoch": 2903} {"train_loss": -10.234991073608398, "global_step": 487826, "epoch": 2903} {"train_loss": -11.234580039978027, "global_step": 487827, "epoch": 2903} {"train_loss": -11.077818870544434, "global_step": 487828, "epoch": 2903} {"train_loss": -11.251477241516113, "global_step": 487829, "epoch": 2903} {"train_loss": -11.653681755065918, "global_step": 487830, "epoch": 2903} {"train_loss": -11.371545791625977, "global_step": 487831, "epoch": 2903} {"train_loss": -11.099416732788086, "global_step": 487832, "epoch": 2903} {"train_loss": -11.430402755737305, "global_step": 487833, "epoch": 2903} {"train_loss": -11.254341125488281, "global_step": 487834, "epoch": 2903} {"train_loss": -11.75135612487793, "global_step": 487835, "epoch": 2903} {"train_loss": -11.82923412322998, "global_step": 487836, "epoch": 2903} {"train_loss": -11.609304428100586, "global_step": 487837, "epoch": 2903} {"train_loss": -12.015070915222168, "global_step": 487838, "epoch": 2903} {"train_loss": -11.725807189941406, "global_step": 487839, "epoch": 2903} {"train_loss": -11.855461120605469, "global_step": 487840, "epoch": 2903} {"train_loss": -11.95970344543457, "global_step": 487841, "epoch": 2903} {"train_loss": -11.75495719909668, "global_step": 487842, "epoch": 2903} {"train_loss": -12.038869857788086, "global_step": 487843, "epoch": 2903} {"train_loss": -12.01783275604248, "global_step": 487844, "epoch": 2903} {"train_loss": -11.77453899383545, "global_step": 487845, "epoch": 2903} {"train_loss": -12.176468849182129, "global_step": 487846, "epoch": 2903} {"train_loss": -12.431621551513672, "global_step": 487847, "epoch": 2903} {"train_loss": -12.206189155578613, "global_step": 487848, "epoch": 2903} {"train_loss": -12.302581787109375, "global_step": 487849, "epoch": 2903} {"train_loss": -12.213057518005371, "global_step": 487850, "epoch": 2903} {"train_loss": -11.949434280395508, "global_step": 487851, "epoch": 2903} {"train_loss": -12.034852027893066, "global_step": 487852, "epoch": 2903} {"train_loss": -12.275373458862305, "global_step": 487853, "epoch": 2903} {"train_loss": -12.35804557800293, "global_step": 487854, "epoch": 2903} {"train_loss": -12.203028678894043, "global_step": 487855, "epoch": 2903} {"train_loss": -12.267461776733398, "global_step": 487856, "epoch": 2903} {"train_loss": -12.349691390991211, "global_step": 487857, "epoch": 2903} {"train_loss": -12.438420295715332, "global_step": 487858, "epoch": 2903} {"train_loss": -12.347352981567383, "global_step": 487859, "epoch": 2903} {"train_loss": -12.417577743530273, "global_step": 487860, "epoch": 2903} {"train_loss": -12.388172149658203, "global_step": 487861, "epoch": 2903} {"train_loss": -12.5263671875, "global_step": 487862, "epoch": 2903} {"train_loss": -12.225123405456543, "global_step": 487863, "epoch": 2903} {"train_loss": -12.402579307556152, "global_step": 487864, "epoch": 2903} {"train_loss": -12.360041618347168, "global_step": 487865, "epoch": 2903} {"train_loss": -12.480984687805176, "global_step": 487866, "epoch": 2903} {"train_loss": -12.285490989685059, "global_step": 487867, "epoch": 2903} {"train_loss": -12.520811080932617, "global_step": 487868, "epoch": 2903} {"train_loss": -12.565717697143555, "global_step": 487869, "epoch": 2903} {"train_loss": -12.487384796142578, "global_step": 487870, "epoch": 2903} {"train_loss": -11.764848731812977, "global_step": 487871, "epoch": 2903, "val_loss": 308187.90625} {"train_loss": -12.449895858764648, "global_step": 487872, "epoch": 2904} {"train_loss": -12.412888526916504, "global_step": 487873, "epoch": 2904} {"train_loss": -12.594202041625977, "global_step": 487874, "epoch": 2904} {"train_loss": -12.439101219177246, "global_step": 487875, "epoch": 2904} {"train_loss": -12.442358016967773, "global_step": 487876, "epoch": 2904} {"train_loss": -12.698740005493164, "global_step": 487877, "epoch": 2904} {"train_loss": -12.684402465820312, "global_step": 487878, "epoch": 2904} {"train_loss": -12.674395561218262, "global_step": 487879, "epoch": 2904} {"train_loss": -12.52160358428955, "global_step": 487880, "epoch": 2904} {"train_loss": -12.709142684936523, "global_step": 487881, "epoch": 2904} {"train_loss": -12.74893856048584, "global_step": 487882, "epoch": 2904} {"train_loss": -12.716241836547852, "global_step": 487883, "epoch": 2904} {"train_loss": -12.650274276733398, "global_step": 487884, "epoch": 2904} {"train_loss": -12.60267162322998, "global_step": 487885, "epoch": 2904} {"train_loss": -12.508623123168945, "global_step": 487886, "epoch": 2904} {"train_loss": -12.67755126953125, "global_step": 487887, "epoch": 2904} {"train_loss": -12.685312271118164, "global_step": 487888, "epoch": 2904} {"train_loss": -12.608924865722656, "global_step": 487889, "epoch": 2904} {"train_loss": -12.623668670654297, "global_step": 487890, "epoch": 2904} {"train_loss": -12.547739028930664, "global_step": 487891, "epoch": 2904} {"train_loss": -12.719950675964355, "global_step": 487892, "epoch": 2904} {"train_loss": -12.488709449768066, "global_step": 487893, "epoch": 2904} {"train_loss": -12.87216567993164, "global_step": 487894, "epoch": 2904} {"train_loss": -12.632813453674316, "global_step": 487895, "epoch": 2904} {"train_loss": -12.853231430053711, "global_step": 487896, "epoch": 2904} {"train_loss": -12.685556411743164, "global_step": 487897, "epoch": 2904} {"train_loss": -12.925102233886719, "global_step": 487898, "epoch": 2904} {"train_loss": -12.753201484680176, "global_step": 487899, "epoch": 2904} {"train_loss": -12.854412078857422, "global_step": 487900, "epoch": 2904} {"train_loss": -12.728997230529785, "global_step": 487901, "epoch": 2904} {"train_loss": -12.86672592163086, "global_step": 487902, "epoch": 2904} {"train_loss": -12.921300888061523, "global_step": 487903, "epoch": 2904} {"train_loss": -12.733019828796387, "global_step": 487904, "epoch": 2904} {"train_loss": -12.773685455322266, "global_step": 487905, "epoch": 2904} {"train_loss": -12.782154083251953, "global_step": 487906, "epoch": 2904} {"train_loss": -12.764431953430176, "global_step": 487907, "epoch": 2904} {"train_loss": -12.711989402770996, "global_step": 487908, "epoch": 2904} {"train_loss": -12.820194244384766, "global_step": 487909, "epoch": 2904} {"train_loss": -12.951969146728516, "global_step": 487910, "epoch": 2904} {"train_loss": -12.588408470153809, "global_step": 487911, "epoch": 2904} {"train_loss": -12.750984191894531, "global_step": 487912, "epoch": 2904} {"train_loss": -12.801843643188477, "global_step": 487913, "epoch": 2904} {"train_loss": -12.896880149841309, "global_step": 487914, "epoch": 2904} {"train_loss": -12.89401626586914, "global_step": 487915, "epoch": 2904} {"train_loss": -12.757834434509277, "global_step": 487916, "epoch": 2904} {"train_loss": -12.717376708984375, "global_step": 487917, "epoch": 2904} {"train_loss": -12.897978782653809, "global_step": 487918, "epoch": 2904} {"train_loss": -12.776107788085938, "global_step": 487919, "epoch": 2904} {"train_loss": -12.486675262451172, "global_step": 487920, "epoch": 2904} {"train_loss": -12.486688613891602, "global_step": 487921, "epoch": 2904} {"train_loss": -12.619386672973633, "global_step": 487922, "epoch": 2904} {"train_loss": -12.839707374572754, "global_step": 487923, "epoch": 2904} {"train_loss": -12.276131629943848, "global_step": 487924, "epoch": 2904} {"train_loss": -11.880818367004395, "global_step": 487925, "epoch": 2904} {"train_loss": -12.91147518157959, "global_step": 487926, "epoch": 2904} {"train_loss": -12.485330581665039, "global_step": 487927, "epoch": 2904} {"train_loss": -12.762960433959961, "global_step": 487928, "epoch": 2904} {"train_loss": -12.753328323364258, "global_step": 487929, "epoch": 2904} {"train_loss": -12.765446662902832, "global_step": 487930, "epoch": 2904} {"train_loss": -12.611738204956055, "global_step": 487931, "epoch": 2904} {"train_loss": -12.603191375732422, "global_step": 487932, "epoch": 2904} {"train_loss": -12.746225357055664, "global_step": 487933, "epoch": 2904} {"train_loss": -12.86825942993164, "global_step": 487934, "epoch": 2904} {"train_loss": -12.369291305541992, "global_step": 487935, "epoch": 2904} {"train_loss": -12.842323303222656, "global_step": 487936, "epoch": 2904} {"train_loss": -12.764049530029297, "global_step": 487937, "epoch": 2904} {"train_loss": -12.288559913635254, "global_step": 487938, "epoch": 2904} {"train_loss": -12.108264923095703, "global_step": 487939, "epoch": 2904} {"train_loss": -12.820976257324219, "global_step": 487940, "epoch": 2904} {"train_loss": -11.925816535949707, "global_step": 487941, "epoch": 2904} {"train_loss": -11.29738712310791, "global_step": 487942, "epoch": 2904} {"train_loss": -10.858485221862793, "global_step": 487943, "epoch": 2904} {"train_loss": -12.556639671325684, "global_step": 487944, "epoch": 2904} {"train_loss": -11.997194290161133, "global_step": 487945, "epoch": 2904} {"train_loss": -12.507302284240723, "global_step": 487946, "epoch": 2904} {"train_loss": -12.033807754516602, "global_step": 487947, "epoch": 2904} {"train_loss": -12.43093490600586, "global_step": 487948, "epoch": 2904} {"train_loss": -12.081596374511719, "global_step": 487949, "epoch": 2904} {"train_loss": -12.329635620117188, "global_step": 487950, "epoch": 2904} {"train_loss": -11.986342430114746, "global_step": 487951, "epoch": 2904} {"train_loss": -11.44094181060791, "global_step": 487952, "epoch": 2904} {"train_loss": -12.800689697265625, "global_step": 487953, "epoch": 2904} {"train_loss": -11.837111473083496, "global_step": 487954, "epoch": 2904} {"train_loss": -12.076911926269531, "global_step": 487955, "epoch": 2904} {"train_loss": -12.095619201660156, "global_step": 487956, "epoch": 2904} {"train_loss": -12.820755958557129, "global_step": 487957, "epoch": 2904} {"train_loss": -11.779857635498047, "global_step": 487958, "epoch": 2904} {"train_loss": -11.996264457702637, "global_step": 487959, "epoch": 2904} {"train_loss": -12.639359474182129, "global_step": 487960, "epoch": 2904} {"train_loss": -12.548946380615234, "global_step": 487961, "epoch": 2904} {"train_loss": -12.5814208984375, "global_step": 487962, "epoch": 2904} {"train_loss": -12.540390968322754, "global_step": 487963, "epoch": 2904} {"train_loss": -12.813679695129395, "global_step": 487964, "epoch": 2904} {"train_loss": -12.692398071289062, "global_step": 487965, "epoch": 2904} {"train_loss": -12.76439094543457, "global_step": 487966, "epoch": 2904} {"train_loss": -12.483345031738281, "global_step": 487967, "epoch": 2904} {"train_loss": -12.884264945983887, "global_step": 487968, "epoch": 2904} {"train_loss": -12.872591018676758, "global_step": 487969, "epoch": 2904} {"train_loss": -12.869930267333984, "global_step": 487970, "epoch": 2904} {"train_loss": -12.750462532043457, "global_step": 487971, "epoch": 2904} {"train_loss": -12.663854598999023, "global_step": 487972, "epoch": 2904} {"train_loss": -12.580554962158203, "global_step": 487973, "epoch": 2904} {"train_loss": -12.868167877197266, "global_step": 487974, "epoch": 2904} {"train_loss": -12.753274917602539, "global_step": 487975, "epoch": 2904} {"train_loss": -12.625732421875, "global_step": 487976, "epoch": 2904} {"train_loss": -12.89168930053711, "global_step": 487977, "epoch": 2904} {"train_loss": -12.730243682861328, "global_step": 487978, "epoch": 2904} {"train_loss": -12.643505096435547, "global_step": 487979, "epoch": 2904} {"train_loss": -12.864607810974121, "global_step": 487980, "epoch": 2904} {"train_loss": -12.715119361877441, "global_step": 487981, "epoch": 2904} {"train_loss": -12.397045135498047, "global_step": 487982, "epoch": 2904} {"train_loss": -12.652944564819336, "global_step": 487983, "epoch": 2904} {"train_loss": -12.667828559875488, "global_step": 487984, "epoch": 2904} {"train_loss": -12.424378395080566, "global_step": 487985, "epoch": 2904} {"train_loss": -12.810554504394531, "global_step": 487986, "epoch": 2904} {"train_loss": -12.889200210571289, "global_step": 487987, "epoch": 2904} {"train_loss": -12.788246154785156, "global_step": 487988, "epoch": 2904} {"train_loss": -13.008455276489258, "global_step": 487989, "epoch": 2904} {"train_loss": -12.75778865814209, "global_step": 487990, "epoch": 2904} {"train_loss": -12.666961669921875, "global_step": 487991, "epoch": 2904} {"train_loss": -12.427356719970703, "global_step": 487992, "epoch": 2904} {"train_loss": -12.813249588012695, "global_step": 487993, "epoch": 2904} {"train_loss": -12.49403190612793, "global_step": 487994, "epoch": 2904} {"train_loss": -11.998125076293945, "global_step": 487995, "epoch": 2904} {"train_loss": -12.461186408996582, "global_step": 487996, "epoch": 2904} {"train_loss": -12.556178092956543, "global_step": 487997, "epoch": 2904} {"train_loss": -12.67460823059082, "global_step": 487998, "epoch": 2904} {"train_loss": -12.392114639282227, "global_step": 487999, "epoch": 2904} {"train_loss": -12.762479782104492, "global_step": 488000, "epoch": 2904} {"train_loss": -12.592456817626953, "global_step": 488001, "epoch": 2904} {"train_loss": -12.728344917297363, "global_step": 488002, "epoch": 2904} {"train_loss": -12.436395645141602, "global_step": 488003, "epoch": 2904} {"train_loss": -12.497468948364258, "global_step": 488004, "epoch": 2904} {"train_loss": -12.347522735595703, "global_step": 488005, "epoch": 2904} {"train_loss": -12.769784927368164, "global_step": 488006, "epoch": 2904} {"train_loss": -11.968076705932617, "global_step": 488007, "epoch": 2904} {"train_loss": -12.538772583007812, "global_step": 488008, "epoch": 2904} {"train_loss": -11.379770278930664, "global_step": 488009, "epoch": 2904} {"train_loss": -11.293368339538574, "global_step": 488010, "epoch": 2904} {"train_loss": -11.503719329833984, "global_step": 488011, "epoch": 2904} {"train_loss": -12.608992576599121, "global_step": 488012, "epoch": 2904} {"train_loss": -11.914045333862305, "global_step": 488013, "epoch": 2904} {"train_loss": -11.214395523071289, "global_step": 488014, "epoch": 2904} {"train_loss": -11.071035385131836, "global_step": 488015, "epoch": 2904} {"train_loss": -10.716339111328125, "global_step": 488016, "epoch": 2904} {"train_loss": -11.598767280578613, "global_step": 488017, "epoch": 2904} {"train_loss": -11.655529022216797, "global_step": 488018, "epoch": 2904} {"train_loss": -11.698734283447266, "global_step": 488019, "epoch": 2904} {"train_loss": -10.471824645996094, "global_step": 488020, "epoch": 2904} {"train_loss": -11.025006294250488, "global_step": 488021, "epoch": 2904} {"train_loss": -9.747026443481445, "global_step": 488022, "epoch": 2904} {"train_loss": -10.78083324432373, "global_step": 488023, "epoch": 2904} {"train_loss": -9.643211364746094, "global_step": 488024, "epoch": 2904} {"train_loss": -10.48879623413086, "global_step": 488025, "epoch": 2904} {"train_loss": -10.328275680541992, "global_step": 488026, "epoch": 2904} {"train_loss": -10.356128692626953, "global_step": 488027, "epoch": 2904} {"train_loss": -9.4873046875, "global_step": 488028, "epoch": 2904} {"train_loss": -9.118265151977539, "global_step": 488029, "epoch": 2904} {"train_loss": -10.868904113769531, "global_step": 488030, "epoch": 2904} {"train_loss": -10.37993335723877, "global_step": 488031, "epoch": 2904} {"train_loss": -10.824766159057617, "global_step": 488032, "epoch": 2904} {"train_loss": -11.463115692138672, "global_step": 488033, "epoch": 2904} {"train_loss": -9.807313919067383, "global_step": 488034, "epoch": 2904} {"train_loss": -12.070850372314453, "global_step": 488035, "epoch": 2904} {"train_loss": -11.090372085571289, "global_step": 488036, "epoch": 2904} {"train_loss": -11.090929985046387, "global_step": 488037, "epoch": 2904} {"train_loss": -11.081151962280273, "global_step": 488038, "epoch": 2904} {"train_loss": -12.264136666343326, "global_step": 488039, "epoch": 2904, "val_loss": 313102.21875} {"train_loss": -10.898159980773926, "global_step": 488040, "epoch": 2905} {"train_loss": -11.89727783203125, "global_step": 488041, "epoch": 2905} {"train_loss": -10.800529479980469, "global_step": 488042, "epoch": 2905} {"train_loss": -10.265630722045898, "global_step": 488043, "epoch": 2905} {"train_loss": -11.190125465393066, "global_step": 488044, "epoch": 2905} {"train_loss": -11.79197883605957, "global_step": 488045, "epoch": 2905} {"train_loss": -11.443685531616211, "global_step": 488046, "epoch": 2905} {"train_loss": -10.991065979003906, "global_step": 488047, "epoch": 2905} {"train_loss": -11.923948287963867, "global_step": 488048, "epoch": 2905} {"train_loss": -10.868074417114258, "global_step": 488049, "epoch": 2905} {"train_loss": -11.72575569152832, "global_step": 488050, "epoch": 2905} {"train_loss": -11.579426765441895, "global_step": 488051, "epoch": 2905} {"train_loss": -11.110861778259277, "global_step": 488052, "epoch": 2905} {"train_loss": -11.338079452514648, "global_step": 488053, "epoch": 2905} {"train_loss": -11.67020034790039, "global_step": 488054, "epoch": 2905} {"train_loss": -11.317028045654297, "global_step": 488055, "epoch": 2905} {"train_loss": -11.955552101135254, "global_step": 488056, "epoch": 2905} {"train_loss": -11.739043235778809, "global_step": 488057, "epoch": 2905} {"train_loss": -11.769403457641602, "global_step": 488058, "epoch": 2905} {"train_loss": -12.073196411132812, "global_step": 488059, "epoch": 2905} {"train_loss": -11.591733932495117, "global_step": 488060, "epoch": 2905} {"train_loss": -11.434481620788574, "global_step": 488061, "epoch": 2905} {"train_loss": -12.14525032043457, "global_step": 488062, "epoch": 2905} {"train_loss": -11.68100643157959, "global_step": 488063, "epoch": 2905} {"train_loss": -12.519445419311523, "global_step": 488064, "epoch": 2905} {"train_loss": -12.009148597717285, "global_step": 488065, "epoch": 2905} {"train_loss": -12.158819198608398, "global_step": 488066, "epoch": 2905} {"train_loss": -12.313238143920898, "global_step": 488067, "epoch": 2905} {"train_loss": -11.866439819335938, "global_step": 488068, "epoch": 2905} {"train_loss": -12.279590606689453, "global_step": 488069, "epoch": 2905} {"train_loss": -12.089348793029785, "global_step": 488070, "epoch": 2905} {"train_loss": -11.91164779663086, "global_step": 488071, "epoch": 2905} {"train_loss": -12.330851554870605, "global_step": 488072, "epoch": 2905} {"train_loss": -12.059530258178711, "global_step": 488073, "epoch": 2905} {"train_loss": -12.258002281188965, "global_step": 488074, "epoch": 2905} {"train_loss": -12.523698806762695, "global_step": 488075, "epoch": 2905} {"train_loss": -12.072101593017578, "global_step": 488076, "epoch": 2905} {"train_loss": -12.57387924194336, "global_step": 488077, "epoch": 2905} {"train_loss": -12.163875579833984, "global_step": 488078, "epoch": 2905} {"train_loss": -12.314227104187012, "global_step": 488079, "epoch": 2905} {"train_loss": -12.526519775390625, "global_step": 488080, "epoch": 2905} {"train_loss": -12.375585556030273, "global_step": 488081, "epoch": 2905} {"train_loss": -12.630661010742188, "global_step": 488082, "epoch": 2905} {"train_loss": -12.16061782836914, "global_step": 488083, "epoch": 2905} {"train_loss": -12.392866134643555, "global_step": 488084, "epoch": 2905} {"train_loss": -12.425973892211914, "global_step": 488085, "epoch": 2905} {"train_loss": -12.472139358520508, "global_step": 488086, "epoch": 2905} {"train_loss": -12.415777206420898, "global_step": 488087, "epoch": 2905} {"train_loss": -12.404870986938477, "global_step": 488088, "epoch": 2905} {"train_loss": -12.28724479675293, "global_step": 488089, "epoch": 2905} {"train_loss": -12.338695526123047, "global_step": 488090, "epoch": 2905} {"train_loss": -12.13595962524414, "global_step": 488091, "epoch": 2905} {"train_loss": -12.444347381591797, "global_step": 488092, "epoch": 2905} {"train_loss": -12.4045991897583, "global_step": 488093, "epoch": 2905} {"train_loss": -12.173102378845215, "global_step": 488094, "epoch": 2905} {"train_loss": -12.526915550231934, "global_step": 488095, "epoch": 2905} {"train_loss": -12.418856620788574, "global_step": 488096, "epoch": 2905} {"train_loss": -12.538540840148926, "global_step": 488097, "epoch": 2905} {"train_loss": -12.623181343078613, "global_step": 488098, "epoch": 2905} {"train_loss": -12.242487907409668, "global_step": 488099, "epoch": 2905} {"train_loss": -12.472381591796875, "global_step": 488100, "epoch": 2905} {"train_loss": -12.78227424621582, "global_step": 488101, "epoch": 2905} {"train_loss": -12.514020919799805, "global_step": 488102, "epoch": 2905} {"train_loss": -12.695720672607422, "global_step": 488103, "epoch": 2905} {"train_loss": -12.650776863098145, "global_step": 488104, "epoch": 2905} {"train_loss": -12.48373794555664, "global_step": 488105, "epoch": 2905} {"train_loss": -12.82943344116211, "global_step": 488106, "epoch": 2905} {"train_loss": -12.458084106445312, "global_step": 488107, "epoch": 2905} {"train_loss": -12.839498519897461, "global_step": 488108, "epoch": 2905} {"train_loss": -12.666236877441406, "global_step": 488109, "epoch": 2905} {"train_loss": -12.529839515686035, "global_step": 488110, "epoch": 2905} {"train_loss": -12.85273551940918, "global_step": 488111, "epoch": 2905} {"train_loss": -12.581253051757812, "global_step": 488112, "epoch": 2905} {"train_loss": -12.932816505432129, "global_step": 488113, "epoch": 2905} {"train_loss": -12.475970268249512, "global_step": 488114, "epoch": 2905} {"train_loss": -12.805461883544922, "global_step": 488115, "epoch": 2905} {"train_loss": -12.625016212463379, "global_step": 488116, "epoch": 2905} {"train_loss": -12.711750030517578, "global_step": 488117, "epoch": 2905} {"train_loss": -12.753681182861328, "global_step": 488118, "epoch": 2905} {"train_loss": -12.67077922821045, "global_step": 488119, "epoch": 2905} {"train_loss": -12.757417678833008, "global_step": 488120, "epoch": 2905} {"train_loss": -12.680183410644531, "global_step": 488121, "epoch": 2905} {"train_loss": -12.770153999328613, "global_step": 488122, "epoch": 2905} {"train_loss": -12.7809419631958, "global_step": 488123, "epoch": 2905} {"train_loss": -12.89645767211914, "global_step": 488124, "epoch": 2905} {"train_loss": -12.884523391723633, "global_step": 488125, "epoch": 2905} {"train_loss": -12.720027923583984, "global_step": 488126, "epoch": 2905} {"train_loss": -12.727031707763672, "global_step": 488127, "epoch": 2905} {"train_loss": -12.752767562866211, "global_step": 488128, "epoch": 2905} {"train_loss": -12.506606101989746, "global_step": 488129, "epoch": 2905} {"train_loss": -12.664319038391113, "global_step": 488130, "epoch": 2905} {"train_loss": -12.678974151611328, "global_step": 488131, "epoch": 2905} {"train_loss": -12.465572357177734, "global_step": 488132, "epoch": 2905} {"train_loss": -12.897729873657227, "global_step": 488133, "epoch": 2905} {"train_loss": -12.928716659545898, "global_step": 488134, "epoch": 2905} {"train_loss": -12.703641891479492, "global_step": 488135, "epoch": 2905} {"train_loss": -12.951953887939453, "global_step": 488136, "epoch": 2905} {"train_loss": -12.810232162475586, "global_step": 488137, "epoch": 2905} {"train_loss": -12.789925575256348, "global_step": 488138, "epoch": 2905} {"train_loss": -12.948507308959961, "global_step": 488139, "epoch": 2905} {"train_loss": -12.893106460571289, "global_step": 488140, "epoch": 2905} {"train_loss": -12.630163192749023, "global_step": 488141, "epoch": 2905} {"train_loss": -12.445953369140625, "global_step": 488142, "epoch": 2905} {"train_loss": -12.876258850097656, "global_step": 488143, "epoch": 2905} {"train_loss": -12.786090850830078, "global_step": 488144, "epoch": 2905} {"train_loss": -12.965085983276367, "global_step": 488145, "epoch": 2905} {"train_loss": -13.136832237243652, "global_step": 488146, "epoch": 2905} {"train_loss": -13.14582633972168, "global_step": 488147, "epoch": 2905} {"train_loss": -13.10173225402832, "global_step": 488148, "epoch": 2905} {"train_loss": -13.129522323608398, "global_step": 488149, "epoch": 2905} {"train_loss": -12.742677688598633, "global_step": 488150, "epoch": 2905} {"train_loss": -12.983549118041992, "global_step": 488151, "epoch": 2905} {"train_loss": -12.846755981445312, "global_step": 488152, "epoch": 2905} {"train_loss": -13.025413513183594, "global_step": 488153, "epoch": 2905} {"train_loss": -12.675764083862305, "global_step": 488154, "epoch": 2905} {"train_loss": -13.012524604797363, "global_step": 488155, "epoch": 2905} {"train_loss": -12.948381423950195, "global_step": 488156, "epoch": 2905} {"train_loss": -12.906399726867676, "global_step": 488157, "epoch": 2905} {"train_loss": -12.66213607788086, "global_step": 488158, "epoch": 2905} {"train_loss": -12.589370727539062, "global_step": 488159, "epoch": 2905} {"train_loss": -13.097795486450195, "global_step": 488160, "epoch": 2905} {"train_loss": -12.897336959838867, "global_step": 488161, "epoch": 2905} {"train_loss": -12.912432670593262, "global_step": 488162, "epoch": 2905} {"train_loss": -12.783223152160645, "global_step": 488163, "epoch": 2905} {"train_loss": -12.773003578186035, "global_step": 488164, "epoch": 2905} {"train_loss": -12.698250770568848, "global_step": 488165, "epoch": 2905} {"train_loss": -12.638023376464844, "global_step": 488166, "epoch": 2905} {"train_loss": -13.105301856994629, "global_step": 488167, "epoch": 2905} {"train_loss": -12.639629364013672, "global_step": 488168, "epoch": 2905} {"train_loss": -12.48051643371582, "global_step": 488169, "epoch": 2905} {"train_loss": -12.967220306396484, "global_step": 488170, "epoch": 2905} {"train_loss": -12.855692863464355, "global_step": 488171, "epoch": 2905} {"train_loss": -12.111638069152832, "global_step": 488172, "epoch": 2905} {"train_loss": -11.051331520080566, "global_step": 488173, "epoch": 2905} {"train_loss": -11.70277214050293, "global_step": 488174, "epoch": 2905} {"train_loss": -12.4904146194458, "global_step": 488175, "epoch": 2905} {"train_loss": -12.6618013381958, "global_step": 488176, "epoch": 2905} {"train_loss": -11.301910400390625, "global_step": 488177, "epoch": 2905} {"train_loss": -12.204597473144531, "global_step": 488178, "epoch": 2905} {"train_loss": -12.444673538208008, "global_step": 488179, "epoch": 2905} {"train_loss": -10.70838451385498, "global_step": 488180, "epoch": 2905} {"train_loss": -12.693345069885254, "global_step": 488181, "epoch": 2905} {"train_loss": -11.95407772064209, "global_step": 488182, "epoch": 2905} {"train_loss": -10.947269439697266, "global_step": 488183, "epoch": 2905} {"train_loss": -11.339387893676758, "global_step": 488184, "epoch": 2905} {"train_loss": -10.243234634399414, "global_step": 488185, "epoch": 2905} {"train_loss": -10.9738187789917, "global_step": 488186, "epoch": 2905} {"train_loss": -7.9466552734375, "global_step": 488187, "epoch": 2905} {"train_loss": -9.212023735046387, "global_step": 488188, "epoch": 2905} {"train_loss": -8.189432144165039, "global_step": 488189, "epoch": 2905} {"train_loss": -8.476426124572754, "global_step": 488190, "epoch": 2905} {"train_loss": -10.577093124389648, "global_step": 488191, "epoch": 2905} {"train_loss": -10.431906700134277, "global_step": 488192, "epoch": 2905} {"train_loss": -9.759073257446289, "global_step": 488193, "epoch": 2905} {"train_loss": -9.954113006591797, "global_step": 488194, "epoch": 2905} {"train_loss": -11.07533073425293, "global_step": 488195, "epoch": 2905} {"train_loss": -11.345686912536621, "global_step": 488196, "epoch": 2905} {"train_loss": -11.319008827209473, "global_step": 488197, "epoch": 2905} {"train_loss": -10.789063453674316, "global_step": 488198, "epoch": 2905} {"train_loss": -10.509212493896484, "global_step": 488199, "epoch": 2905} {"train_loss": -11.087142944335938, "global_step": 488200, "epoch": 2905} {"train_loss": -11.07553482055664, "global_step": 488201, "epoch": 2905} {"train_loss": -11.033646583557129, "global_step": 488202, "epoch": 2905} {"train_loss": -11.256245613098145, "global_step": 488203, "epoch": 2905} {"train_loss": -11.588859558105469, "global_step": 488204, "epoch": 2905} {"train_loss": -11.195438385009766, "global_step": 488205, "epoch": 2905} {"train_loss": -11.148207664489746, "global_step": 488206, "epoch": 2905} {"train_loss": -12.103111925579253, "global_step": 488207, "epoch": 2905, "val_loss": 317243.46875, "train_action_mse_error": 1.8765068054199219} {"train_loss": -10.476150512695312, "global_step": 488208, "epoch": 2906} {"train_loss": -12.010750770568848, "global_step": 488209, "epoch": 2906} {"train_loss": -10.934219360351562, "global_step": 488210, "epoch": 2906} {"train_loss": -11.346904754638672, "global_step": 488211, "epoch": 2906} {"train_loss": -11.991144180297852, "global_step": 488212, "epoch": 2906} {"train_loss": -11.204601287841797, "global_step": 488213, "epoch": 2906} {"train_loss": -12.534911155700684, "global_step": 488214, "epoch": 2906} {"train_loss": -11.11927318572998, "global_step": 488215, "epoch": 2906} {"train_loss": -12.12816047668457, "global_step": 488216, "epoch": 2906} {"train_loss": -11.616048812866211, "global_step": 488217, "epoch": 2906} {"train_loss": -12.271676063537598, "global_step": 488218, "epoch": 2906} {"train_loss": -12.142297744750977, "global_step": 488219, "epoch": 2906} {"train_loss": -11.891843795776367, "global_step": 488220, "epoch": 2906} {"train_loss": -12.041313171386719, "global_step": 488221, "epoch": 2906} {"train_loss": -12.466672897338867, "global_step": 488222, "epoch": 2906} {"train_loss": -12.169136047363281, "global_step": 488223, "epoch": 2906} {"train_loss": -12.277997016906738, "global_step": 488224, "epoch": 2906} {"train_loss": -12.33840560913086, "global_step": 488225, "epoch": 2906} {"train_loss": -12.199613571166992, "global_step": 488226, "epoch": 2906} {"train_loss": -12.15877914428711, "global_step": 488227, "epoch": 2906} {"train_loss": -12.356416702270508, "global_step": 488228, "epoch": 2906} {"train_loss": -12.382477760314941, "global_step": 488229, "epoch": 2906} {"train_loss": -12.385476112365723, "global_step": 488230, "epoch": 2906} {"train_loss": -12.409377098083496, "global_step": 488231, "epoch": 2906} {"train_loss": -12.121870040893555, "global_step": 488232, "epoch": 2906} {"train_loss": -11.993680000305176, "global_step": 488233, "epoch": 2906} {"train_loss": -12.151660919189453, "global_step": 488234, "epoch": 2906} {"train_loss": -12.282607078552246, "global_step": 488235, "epoch": 2906} {"train_loss": -12.195402145385742, "global_step": 488236, "epoch": 2906} {"train_loss": -12.493526458740234, "global_step": 488237, "epoch": 2906} {"train_loss": -11.981151580810547, "global_step": 488238, "epoch": 2906} {"train_loss": -12.436809539794922, "global_step": 488239, "epoch": 2906} {"train_loss": -11.85738468170166, "global_step": 488240, "epoch": 2906} {"train_loss": -12.671135902404785, "global_step": 488241, "epoch": 2906} {"train_loss": -12.430913925170898, "global_step": 488242, "epoch": 2906} {"train_loss": -12.383245468139648, "global_step": 488243, "epoch": 2906} {"train_loss": -12.496134757995605, "global_step": 488244, "epoch": 2906} {"train_loss": -12.464151382446289, "global_step": 488245, "epoch": 2906} {"train_loss": -12.48236083984375, "global_step": 488246, "epoch": 2906} {"train_loss": -12.541748046875, "global_step": 488247, "epoch": 2906} {"train_loss": -12.57691764831543, "global_step": 488248, "epoch": 2906} {"train_loss": -12.441798210144043, "global_step": 488249, "epoch": 2906} {"train_loss": -12.629868507385254, "global_step": 488250, "epoch": 2906} {"train_loss": -12.584394454956055, "global_step": 488251, "epoch": 2906} {"train_loss": -12.772855758666992, "global_step": 488252, "epoch": 2906} {"train_loss": -12.79876708984375, "global_step": 488253, "epoch": 2906} {"train_loss": -12.679190635681152, "global_step": 488254, "epoch": 2906} {"train_loss": -12.685527801513672, "global_step": 488255, "epoch": 2906} {"train_loss": -12.779510498046875, "global_step": 488256, "epoch": 2906} {"train_loss": -12.728927612304688, "global_step": 488257, "epoch": 2906} {"train_loss": -12.717087745666504, "global_step": 488258, "epoch": 2906} {"train_loss": -12.557268142700195, "global_step": 488259, "epoch": 2906} {"train_loss": -12.65866470336914, "global_step": 488260, "epoch": 2906} {"train_loss": -12.526198387145996, "global_step": 488261, "epoch": 2906} {"train_loss": -12.645169258117676, "global_step": 488262, "epoch": 2906} {"train_loss": -12.611231803894043, "global_step": 488263, "epoch": 2906} {"train_loss": -12.807171821594238, "global_step": 488264, "epoch": 2906} {"train_loss": -12.930547714233398, "global_step": 488265, "epoch": 2906} {"train_loss": -12.804736137390137, "global_step": 488266, "epoch": 2906} {"train_loss": -12.764735221862793, "global_step": 488267, "epoch": 2906} {"train_loss": -12.701433181762695, "global_step": 488268, "epoch": 2906} {"train_loss": -12.729524612426758, "global_step": 488269, "epoch": 2906} {"train_loss": -12.669456481933594, "global_step": 488270, "epoch": 2906} {"train_loss": -12.570907592773438, "global_step": 488271, "epoch": 2906} {"train_loss": -12.778022766113281, "global_step": 488272, "epoch": 2906} {"train_loss": -12.757346153259277, "global_step": 488273, "epoch": 2906} {"train_loss": -12.485538482666016, "global_step": 488274, "epoch": 2906} {"train_loss": -12.497312545776367, "global_step": 488275, "epoch": 2906} {"train_loss": -12.948902130126953, "global_step": 488276, "epoch": 2906} {"train_loss": -12.549731254577637, "global_step": 488277, "epoch": 2906} {"train_loss": -12.467026710510254, "global_step": 488278, "epoch": 2906} {"train_loss": -12.769538879394531, "global_step": 488279, "epoch": 2906} {"train_loss": -12.5986909866333, "global_step": 488280, "epoch": 2906} {"train_loss": -12.20504093170166, "global_step": 488281, "epoch": 2906} {"train_loss": -12.436264991760254, "global_step": 488282, "epoch": 2906} {"train_loss": -12.223869323730469, "global_step": 488283, "epoch": 2906} {"train_loss": -12.415411949157715, "global_step": 488284, "epoch": 2906} {"train_loss": -11.128087997436523, "global_step": 488285, "epoch": 2906} {"train_loss": -12.199179649353027, "global_step": 488286, "epoch": 2906} {"train_loss": -11.995275497436523, "global_step": 488287, "epoch": 2906} {"train_loss": -11.66245174407959, "global_step": 488288, "epoch": 2906} {"train_loss": -12.318940162658691, "global_step": 488289, "epoch": 2906} {"train_loss": -10.610067367553711, "global_step": 488290, "epoch": 2906} {"train_loss": -10.694719314575195, "global_step": 488291, "epoch": 2906} {"train_loss": -11.146764755249023, "global_step": 488292, "epoch": 2906} {"train_loss": -10.990756034851074, "global_step": 488293, "epoch": 2906} {"train_loss": -12.219573020935059, "global_step": 488294, "epoch": 2906} {"train_loss": -11.902706146240234, "global_step": 488295, "epoch": 2906} {"train_loss": -11.596219062805176, "global_step": 488296, "epoch": 2906} {"train_loss": -12.143592834472656, "global_step": 488297, "epoch": 2906} {"train_loss": -12.381850242614746, "global_step": 488298, "epoch": 2906} {"train_loss": -11.777839660644531, "global_step": 488299, "epoch": 2906} {"train_loss": -12.593023300170898, "global_step": 488300, "epoch": 2906} {"train_loss": -12.564909934997559, "global_step": 488301, "epoch": 2906} {"train_loss": -12.763635635375977, "global_step": 488302, "epoch": 2906} {"train_loss": -12.538848876953125, "global_step": 488303, "epoch": 2906} {"train_loss": -12.629799842834473, "global_step": 488304, "epoch": 2906} {"train_loss": -12.482353210449219, "global_step": 488305, "epoch": 2906} {"train_loss": -12.679279327392578, "global_step": 488306, "epoch": 2906} {"train_loss": -12.559926986694336, "global_step": 488307, "epoch": 2906} {"train_loss": -12.61025333404541, "global_step": 488308, "epoch": 2906} {"train_loss": -12.570478439331055, "global_step": 488309, "epoch": 2906} {"train_loss": -12.335580825805664, "global_step": 488310, "epoch": 2906} {"train_loss": -12.721856117248535, "global_step": 488311, "epoch": 2906} {"train_loss": -12.573022842407227, "global_step": 488312, "epoch": 2906} {"train_loss": -12.473028182983398, "global_step": 488313, "epoch": 2906} {"train_loss": -12.58556842803955, "global_step": 488314, "epoch": 2906} {"train_loss": -12.498483657836914, "global_step": 488315, "epoch": 2906} {"train_loss": -12.686981201171875, "global_step": 488316, "epoch": 2906} {"train_loss": -12.555550575256348, "global_step": 488317, "epoch": 2906} {"train_loss": -12.538411140441895, "global_step": 488318, "epoch": 2906} {"train_loss": -12.509998321533203, "global_step": 488319, "epoch": 2906} {"train_loss": -12.578765869140625, "global_step": 488320, "epoch": 2906} {"train_loss": -12.670120239257812, "global_step": 488321, "epoch": 2906} {"train_loss": -12.213479995727539, "global_step": 488322, "epoch": 2906} {"train_loss": -12.486717224121094, "global_step": 488323, "epoch": 2906} {"train_loss": -12.257267951965332, "global_step": 488324, "epoch": 2906} {"train_loss": -11.488749504089355, "global_step": 488325, "epoch": 2906} {"train_loss": -12.670221328735352, "global_step": 488326, "epoch": 2906} {"train_loss": -11.413562774658203, "global_step": 488327, "epoch": 2906} {"train_loss": -12.218358039855957, "global_step": 488328, "epoch": 2906} {"train_loss": -12.094677925109863, "global_step": 488329, "epoch": 2906} {"train_loss": -11.674236297607422, "global_step": 488330, "epoch": 2906} {"train_loss": -12.848493576049805, "global_step": 488331, "epoch": 2906} {"train_loss": -12.3958740234375, "global_step": 488332, "epoch": 2906} {"train_loss": -12.716170310974121, "global_step": 488333, "epoch": 2906} {"train_loss": -12.418617248535156, "global_step": 488334, "epoch": 2906} {"train_loss": -12.674835205078125, "global_step": 488335, "epoch": 2906} {"train_loss": -12.39578914642334, "global_step": 488336, "epoch": 2906} {"train_loss": -12.579708099365234, "global_step": 488337, "epoch": 2906} {"train_loss": -13.053850173950195, "global_step": 488338, "epoch": 2906} {"train_loss": -12.726545333862305, "global_step": 488339, "epoch": 2906} {"train_loss": -12.567525863647461, "global_step": 488340, "epoch": 2906} {"train_loss": -12.629670143127441, "global_step": 488341, "epoch": 2906} {"train_loss": -12.905563354492188, "global_step": 488342, "epoch": 2906} {"train_loss": -12.690498352050781, "global_step": 488343, "epoch": 2906} {"train_loss": -12.810872077941895, "global_step": 488344, "epoch": 2906} {"train_loss": -12.813831329345703, "global_step": 488345, "epoch": 2906} {"train_loss": -12.976842880249023, "global_step": 488346, "epoch": 2906} {"train_loss": -12.558196067810059, "global_step": 488347, "epoch": 2906} {"train_loss": -12.691170692443848, "global_step": 488348, "epoch": 2906} {"train_loss": -12.734681129455566, "global_step": 488349, "epoch": 2906} {"train_loss": -12.868188858032227, "global_step": 488350, "epoch": 2906} {"train_loss": -12.659940719604492, "global_step": 488351, "epoch": 2906} {"train_loss": -12.625741004943848, "global_step": 488352, "epoch": 2906} {"train_loss": -12.413264274597168, "global_step": 488353, "epoch": 2906} {"train_loss": -12.683389663696289, "global_step": 488354, "epoch": 2906} {"train_loss": -12.744939804077148, "global_step": 488355, "epoch": 2906} {"train_loss": -12.78410530090332, "global_step": 488356, "epoch": 2906} {"train_loss": -12.894704818725586, "global_step": 488357, "epoch": 2906} {"train_loss": -12.666536331176758, "global_step": 488358, "epoch": 2906} {"train_loss": -12.795598983764648, "global_step": 488359, "epoch": 2906} {"train_loss": -12.551244735717773, "global_step": 488360, "epoch": 2906} {"train_loss": -12.75081729888916, "global_step": 488361, "epoch": 2906} {"train_loss": -12.644256591796875, "global_step": 488362, "epoch": 2906} {"train_loss": -12.880940437316895, "global_step": 488363, "epoch": 2906} {"train_loss": -12.868745803833008, "global_step": 488364, "epoch": 2906} {"train_loss": -13.045616149902344, "global_step": 488365, "epoch": 2906} {"train_loss": -12.816760063171387, "global_step": 488366, "epoch": 2906} {"train_loss": -12.541245460510254, "global_step": 488367, "epoch": 2906} {"train_loss": -12.71864128112793, "global_step": 488368, "epoch": 2906} {"train_loss": -12.429649353027344, "global_step": 488369, "epoch": 2906} {"train_loss": -10.86108112335205, "global_step": 488370, "epoch": 2906} {"train_loss": -12.304702758789062, "global_step": 488371, "epoch": 2906} {"train_loss": -12.133023262023926, "global_step": 488372, "epoch": 2906} {"train_loss": -12.048599243164062, "global_step": 488373, "epoch": 2906} {"train_loss": -12.671131134033203, "global_step": 488374, "epoch": 2906} {"train_loss": -12.373691093353997, "global_step": 488375, "epoch": 2906, "val_loss": 317182.875} {"train_loss": -11.413999557495117, "global_step": 488376, "epoch": 2907} {"train_loss": -12.673957824707031, "global_step": 488377, "epoch": 2907} {"train_loss": -11.609452247619629, "global_step": 488378, "epoch": 2907} {"train_loss": -11.876023292541504, "global_step": 488379, "epoch": 2907} {"train_loss": -12.430614471435547, "global_step": 488380, "epoch": 2907} {"train_loss": -11.27766227722168, "global_step": 488381, "epoch": 2907} {"train_loss": -11.70107650756836, "global_step": 488382, "epoch": 2907} {"train_loss": -12.391971588134766, "global_step": 488383, "epoch": 2907} {"train_loss": -11.623201370239258, "global_step": 488384, "epoch": 2907} {"train_loss": -11.549076080322266, "global_step": 488385, "epoch": 2907} {"train_loss": -12.428750991821289, "global_step": 488386, "epoch": 2907} {"train_loss": -11.399164199829102, "global_step": 488387, "epoch": 2907} {"train_loss": -11.991155624389648, "global_step": 488388, "epoch": 2907} {"train_loss": -11.988359451293945, "global_step": 488389, "epoch": 2907} {"train_loss": -12.319387435913086, "global_step": 488390, "epoch": 2907} {"train_loss": -11.86038589477539, "global_step": 488391, "epoch": 2907} {"train_loss": -12.796846389770508, "global_step": 488392, "epoch": 2907} {"train_loss": -11.807723045349121, "global_step": 488393, "epoch": 2907} {"train_loss": -12.683093070983887, "global_step": 488394, "epoch": 2907} {"train_loss": -12.667520523071289, "global_step": 488395, "epoch": 2907} {"train_loss": -12.108567237854004, "global_step": 488396, "epoch": 2907} {"train_loss": -12.017783164978027, "global_step": 488397, "epoch": 2907} {"train_loss": -12.460943222045898, "global_step": 488398, "epoch": 2907} {"train_loss": -12.468343734741211, "global_step": 488399, "epoch": 2907} {"train_loss": -12.45367431640625, "global_step": 488400, "epoch": 2907} {"train_loss": -12.605558395385742, "global_step": 488401, "epoch": 2907} {"train_loss": -12.342414855957031, "global_step": 488402, "epoch": 2907} {"train_loss": -12.519218444824219, "global_step": 488403, "epoch": 2907} {"train_loss": -12.66513729095459, "global_step": 488404, "epoch": 2907} {"train_loss": -12.218441009521484, "global_step": 488405, "epoch": 2907} {"train_loss": -12.627635955810547, "global_step": 488406, "epoch": 2907} {"train_loss": -11.925466537475586, "global_step": 488407, "epoch": 2907} {"train_loss": -12.627485275268555, "global_step": 488408, "epoch": 2907} {"train_loss": -12.222162246704102, "global_step": 488409, "epoch": 2907} {"train_loss": -12.521865844726562, "global_step": 488410, "epoch": 2907} {"train_loss": -12.618270874023438, "global_step": 488411, "epoch": 2907} {"train_loss": -12.428133010864258, "global_step": 488412, "epoch": 2907} {"train_loss": -12.069925308227539, "global_step": 488413, "epoch": 2907} {"train_loss": -12.521153450012207, "global_step": 488414, "epoch": 2907} {"train_loss": -12.758172035217285, "global_step": 488415, "epoch": 2907} {"train_loss": -12.497285842895508, "global_step": 488416, "epoch": 2907} {"train_loss": -12.300521850585938, "global_step": 488417, "epoch": 2907} {"train_loss": -12.67406177520752, "global_step": 488418, "epoch": 2907} {"train_loss": -12.170239448547363, "global_step": 488419, "epoch": 2907} {"train_loss": -12.411324501037598, "global_step": 488420, "epoch": 2907} {"train_loss": -12.704784393310547, "global_step": 488421, "epoch": 2907} {"train_loss": -12.267175674438477, "global_step": 488422, "epoch": 2907} {"train_loss": -12.64523983001709, "global_step": 488423, "epoch": 2907} {"train_loss": -12.6326904296875, "global_step": 488424, "epoch": 2907} {"train_loss": -12.447431564331055, "global_step": 488425, "epoch": 2907} {"train_loss": -12.422357559204102, "global_step": 488426, "epoch": 2907} {"train_loss": -12.171225547790527, "global_step": 488427, "epoch": 2907} {"train_loss": -12.56570816040039, "global_step": 488428, "epoch": 2907} {"train_loss": -12.075522422790527, "global_step": 488429, "epoch": 2907} {"train_loss": -11.93893051147461, "global_step": 488430, "epoch": 2907} {"train_loss": -12.728670120239258, "global_step": 488431, "epoch": 2907} {"train_loss": -12.192548751831055, "global_step": 488432, "epoch": 2907} {"train_loss": -12.319927215576172, "global_step": 488433, "epoch": 2907} {"train_loss": -12.306039810180664, "global_step": 488434, "epoch": 2907} {"train_loss": -12.718563079833984, "global_step": 488435, "epoch": 2907} {"train_loss": -12.378801345825195, "global_step": 488436, "epoch": 2907} {"train_loss": -12.388533592224121, "global_step": 488437, "epoch": 2907} {"train_loss": -12.662835121154785, "global_step": 488438, "epoch": 2907} {"train_loss": -12.313404083251953, "global_step": 488439, "epoch": 2907} {"train_loss": -11.250991821289062, "global_step": 488440, "epoch": 2907} {"train_loss": -12.411901473999023, "global_step": 488441, "epoch": 2907} {"train_loss": -11.829240798950195, "global_step": 488442, "epoch": 2907} {"train_loss": -10.329981803894043, "global_step": 488443, "epoch": 2907} {"train_loss": -10.317052841186523, "global_step": 488444, "epoch": 2907} {"train_loss": -9.852731704711914, "global_step": 488445, "epoch": 2907} {"train_loss": -11.445516586303711, "global_step": 488446, "epoch": 2907} {"train_loss": -8.74250602722168, "global_step": 488447, "epoch": 2907} {"train_loss": -11.516509056091309, "global_step": 488448, "epoch": 2907} {"train_loss": -8.243322372436523, "global_step": 488449, "epoch": 2907} {"train_loss": -8.40372085571289, "global_step": 488450, "epoch": 2907} {"train_loss": -8.252446174621582, "global_step": 488451, "epoch": 2907} {"train_loss": -7.660114288330078, "global_step": 488452, "epoch": 2907} {"train_loss": -8.561866760253906, "global_step": 488453, "epoch": 2907} {"train_loss": -10.515093803405762, "global_step": 488454, "epoch": 2907} {"train_loss": -10.71858024597168, "global_step": 488455, "epoch": 2907} {"train_loss": -9.723250389099121, "global_step": 488456, "epoch": 2907} {"train_loss": -11.050642013549805, "global_step": 488457, "epoch": 2907} {"train_loss": -10.502105712890625, "global_step": 488458, "epoch": 2907} {"train_loss": -10.261419296264648, "global_step": 488459, "epoch": 2907} {"train_loss": -10.640701293945312, "global_step": 488460, "epoch": 2907} {"train_loss": -11.447074890136719, "global_step": 488461, "epoch": 2907} {"train_loss": -10.578509330749512, "global_step": 488462, "epoch": 2907} {"train_loss": -11.1445894241333, "global_step": 488463, "epoch": 2907} {"train_loss": -11.512194633483887, "global_step": 488464, "epoch": 2907} {"train_loss": -11.041407585144043, "global_step": 488465, "epoch": 2907} {"train_loss": -10.708494186401367, "global_step": 488466, "epoch": 2907} {"train_loss": -11.237393379211426, "global_step": 488467, "epoch": 2907} {"train_loss": -11.041996002197266, "global_step": 488468, "epoch": 2907} {"train_loss": -11.928688049316406, "global_step": 488469, "epoch": 2907} {"train_loss": -12.032459259033203, "global_step": 488470, "epoch": 2907} {"train_loss": -12.055034637451172, "global_step": 488471, "epoch": 2907} {"train_loss": -11.885393142700195, "global_step": 488472, "epoch": 2907} {"train_loss": -11.392603874206543, "global_step": 488473, "epoch": 2907} {"train_loss": -12.077970504760742, "global_step": 488474, "epoch": 2907} {"train_loss": -11.832937240600586, "global_step": 488475, "epoch": 2907} {"train_loss": -11.990924835205078, "global_step": 488476, "epoch": 2907} {"train_loss": -12.03957462310791, "global_step": 488477, "epoch": 2907} {"train_loss": -11.478034019470215, "global_step": 488478, "epoch": 2907} {"train_loss": -12.574990272521973, "global_step": 488479, "epoch": 2907} {"train_loss": -12.067405700683594, "global_step": 488480, "epoch": 2907} {"train_loss": -12.566366195678711, "global_step": 488481, "epoch": 2907} {"train_loss": -12.30186653137207, "global_step": 488482, "epoch": 2907} {"train_loss": -12.414097785949707, "global_step": 488483, "epoch": 2907} {"train_loss": -12.366758346557617, "global_step": 488484, "epoch": 2907} {"train_loss": -12.104541778564453, "global_step": 488485, "epoch": 2907} {"train_loss": -12.553741455078125, "global_step": 488486, "epoch": 2907} {"train_loss": -12.345550537109375, "global_step": 488487, "epoch": 2907} {"train_loss": -12.552571296691895, "global_step": 488488, "epoch": 2907} {"train_loss": -12.268330574035645, "global_step": 488489, "epoch": 2907} {"train_loss": -12.461835861206055, "global_step": 488490, "epoch": 2907} {"train_loss": -12.668990135192871, "global_step": 488491, "epoch": 2907} {"train_loss": -12.572516441345215, "global_step": 488492, "epoch": 2907} {"train_loss": -12.805350303649902, "global_step": 488493, "epoch": 2907} {"train_loss": -12.466314315795898, "global_step": 488494, "epoch": 2907} {"train_loss": -12.707574844360352, "global_step": 488495, "epoch": 2907} {"train_loss": -12.277172088623047, "global_step": 488496, "epoch": 2907} {"train_loss": -12.463665962219238, "global_step": 488497, "epoch": 2907} {"train_loss": -12.357528686523438, "global_step": 488498, "epoch": 2907} {"train_loss": -12.153288841247559, "global_step": 488499, "epoch": 2907} {"train_loss": -12.822916030883789, "global_step": 488500, "epoch": 2907} {"train_loss": -12.436599731445312, "global_step": 488501, "epoch": 2907} {"train_loss": -12.552603721618652, "global_step": 488502, "epoch": 2907} {"train_loss": -12.436436653137207, "global_step": 488503, "epoch": 2907} {"train_loss": -12.442681312561035, "global_step": 488504, "epoch": 2907} {"train_loss": -12.414896965026855, "global_step": 488505, "epoch": 2907} {"train_loss": -12.495479583740234, "global_step": 488506, "epoch": 2907} {"train_loss": -12.871841430664062, "global_step": 488507, "epoch": 2907} {"train_loss": -12.565439224243164, "global_step": 488508, "epoch": 2907} {"train_loss": -12.773103713989258, "global_step": 488509, "epoch": 2907} {"train_loss": -12.687955856323242, "global_step": 488510, "epoch": 2907} {"train_loss": -12.577790260314941, "global_step": 488511, "epoch": 2907} {"train_loss": -12.776065826416016, "global_step": 488512, "epoch": 2907} {"train_loss": -12.679988861083984, "global_step": 488513, "epoch": 2907} {"train_loss": -12.838508605957031, "global_step": 488514, "epoch": 2907} {"train_loss": -12.951342582702637, "global_step": 488515, "epoch": 2907} {"train_loss": -12.548409461975098, "global_step": 488516, "epoch": 2907} {"train_loss": -12.728189468383789, "global_step": 488517, "epoch": 2907} {"train_loss": -12.798680305480957, "global_step": 488518, "epoch": 2907} {"train_loss": -12.904861450195312, "global_step": 488519, "epoch": 2907} {"train_loss": -12.829374313354492, "global_step": 488520, "epoch": 2907} {"train_loss": -12.91299819946289, "global_step": 488521, "epoch": 2907} {"train_loss": -12.74581527709961, "global_step": 488522, "epoch": 2907} {"train_loss": -12.72807788848877, "global_step": 488523, "epoch": 2907} {"train_loss": -13.016632080078125, "global_step": 488524, "epoch": 2907} {"train_loss": -12.913004875183105, "global_step": 488525, "epoch": 2907} {"train_loss": -12.796304702758789, "global_step": 488526, "epoch": 2907} {"train_loss": -12.742936134338379, "global_step": 488527, "epoch": 2907} {"train_loss": -12.435168266296387, "global_step": 488528, "epoch": 2907} {"train_loss": -12.765912055969238, "global_step": 488529, "epoch": 2907} {"train_loss": -12.824531555175781, "global_step": 488530, "epoch": 2907} {"train_loss": -12.504814147949219, "global_step": 488531, "epoch": 2907} {"train_loss": -12.740830421447754, "global_step": 488532, "epoch": 2907} {"train_loss": -12.712174415588379, "global_step": 488533, "epoch": 2907} {"train_loss": -12.567688941955566, "global_step": 488534, "epoch": 2907} {"train_loss": -12.889028549194336, "global_step": 488535, "epoch": 2907} {"train_loss": -12.477302551269531, "global_step": 488536, "epoch": 2907} {"train_loss": -12.835000991821289, "global_step": 488537, "epoch": 2907} {"train_loss": -12.872326850891113, "global_step": 488538, "epoch": 2907} {"train_loss": -12.87843132019043, "global_step": 488539, "epoch": 2907} {"train_loss": -12.585678100585938, "global_step": 488540, "epoch": 2907} {"train_loss": -12.728879928588867, "global_step": 488541, "epoch": 2907} {"train_loss": -12.73399829864502, "global_step": 488542, "epoch": 2907} {"train_loss": -12.064432467733111, "global_step": 488543, "epoch": 2907, "val_loss": 314247.34375} {"train_loss": -12.71553897857666, "global_step": 488544, "epoch": 2908} {"train_loss": -12.980308532714844, "global_step": 488545, "epoch": 2908} {"train_loss": -12.71994400024414, "global_step": 488546, "epoch": 2908} {"train_loss": -12.472676277160645, "global_step": 488547, "epoch": 2908} {"train_loss": -12.735136032104492, "global_step": 488548, "epoch": 2908} {"train_loss": -12.786725997924805, "global_step": 488549, "epoch": 2908} {"train_loss": -12.53081226348877, "global_step": 488550, "epoch": 2908} {"train_loss": -12.699092864990234, "global_step": 488551, "epoch": 2908} {"train_loss": -12.724929809570312, "global_step": 488552, "epoch": 2908} {"train_loss": -12.859915733337402, "global_step": 488553, "epoch": 2908} {"train_loss": -12.762804985046387, "global_step": 488554, "epoch": 2908} {"train_loss": -12.734281539916992, "global_step": 488555, "epoch": 2908} {"train_loss": -12.79448127746582, "global_step": 488556, "epoch": 2908} {"train_loss": -12.716615676879883, "global_step": 488557, "epoch": 2908} {"train_loss": -12.740760803222656, "global_step": 488558, "epoch": 2908} {"train_loss": -13.040596008300781, "global_step": 488559, "epoch": 2908} {"train_loss": -12.495436668395996, "global_step": 488560, "epoch": 2908} {"train_loss": -12.087053298950195, "global_step": 488561, "epoch": 2908} {"train_loss": -11.914073944091797, "global_step": 488562, "epoch": 2908} {"train_loss": -11.707535743713379, "global_step": 488563, "epoch": 2908} {"train_loss": -12.663802146911621, "global_step": 488564, "epoch": 2908} {"train_loss": -12.504368782043457, "global_step": 488565, "epoch": 2908} {"train_loss": -11.052316665649414, "global_step": 488566, "epoch": 2908} {"train_loss": -8.976024627685547, "global_step": 488567, "epoch": 2908} {"train_loss": -9.90023422241211, "global_step": 488568, "epoch": 2908} {"train_loss": -10.778289794921875, "global_step": 488569, "epoch": 2908} {"train_loss": -10.589014053344727, "global_step": 488570, "epoch": 2908} {"train_loss": -9.029701232910156, "global_step": 488571, "epoch": 2908} {"train_loss": -10.399806022644043, "global_step": 488572, "epoch": 2908} {"train_loss": -8.454816818237305, "global_step": 488573, "epoch": 2908} {"train_loss": -9.345752716064453, "global_step": 488574, "epoch": 2908} {"train_loss": -8.0416259765625, "global_step": 488575, "epoch": 2908} {"train_loss": -9.470579147338867, "global_step": 488576, "epoch": 2908} {"train_loss": -9.522822380065918, "global_step": 488577, "epoch": 2908} {"train_loss": -8.744213104248047, "global_step": 488578, "epoch": 2908} {"train_loss": -8.531524658203125, "global_step": 488579, "epoch": 2908} {"train_loss": -8.737255096435547, "global_step": 488580, "epoch": 2908} {"train_loss": -10.444173812866211, "global_step": 488581, "epoch": 2908} {"train_loss": -9.530769348144531, "global_step": 488582, "epoch": 2908} {"train_loss": -8.668010711669922, "global_step": 488583, "epoch": 2908} {"train_loss": -10.373344421386719, "global_step": 488584, "epoch": 2908} {"train_loss": -10.781850814819336, "global_step": 488585, "epoch": 2908} {"train_loss": -9.306526184082031, "global_step": 488586, "epoch": 2908} {"train_loss": -10.554437637329102, "global_step": 488587, "epoch": 2908} {"train_loss": -9.422491073608398, "global_step": 488588, "epoch": 2908} {"train_loss": -9.694011688232422, "global_step": 488589, "epoch": 2908} {"train_loss": -10.450029373168945, "global_step": 488590, "epoch": 2908} {"train_loss": -10.803285598754883, "global_step": 488591, "epoch": 2908} {"train_loss": -9.593162536621094, "global_step": 488592, "epoch": 2908} {"train_loss": -11.647629737854004, "global_step": 488593, "epoch": 2908} {"train_loss": -10.50009536743164, "global_step": 488594, "epoch": 2908} {"train_loss": -10.957597732543945, "global_step": 488595, "epoch": 2908} {"train_loss": -11.862646102905273, "global_step": 488596, "epoch": 2908} {"train_loss": -11.175970077514648, "global_step": 488597, "epoch": 2908} {"train_loss": -12.166557312011719, "global_step": 488598, "epoch": 2908} {"train_loss": -11.391096115112305, "global_step": 488599, "epoch": 2908} {"train_loss": -11.916566848754883, "global_step": 488600, "epoch": 2908} {"train_loss": -11.54757308959961, "global_step": 488601, "epoch": 2908} {"train_loss": -11.64204216003418, "global_step": 488602, "epoch": 2908} {"train_loss": -11.936376571655273, "global_step": 488603, "epoch": 2908} {"train_loss": -12.181436538696289, "global_step": 488604, "epoch": 2908} {"train_loss": -12.196104049682617, "global_step": 488605, "epoch": 2908} {"train_loss": -12.095571517944336, "global_step": 488606, "epoch": 2908} {"train_loss": -12.287280082702637, "global_step": 488607, "epoch": 2908} {"train_loss": -11.890233039855957, "global_step": 488608, "epoch": 2908} {"train_loss": -12.199287414550781, "global_step": 488609, "epoch": 2908} {"train_loss": -12.20395565032959, "global_step": 488610, "epoch": 2908} {"train_loss": -11.981796264648438, "global_step": 488611, "epoch": 2908} {"train_loss": -12.223733901977539, "global_step": 488612, "epoch": 2908} {"train_loss": -12.004304885864258, "global_step": 488613, "epoch": 2908} {"train_loss": -11.971945762634277, "global_step": 488614, "epoch": 2908} {"train_loss": -12.167745590209961, "global_step": 488615, "epoch": 2908} {"train_loss": -12.167875289916992, "global_step": 488616, "epoch": 2908} {"train_loss": -12.093774795532227, "global_step": 488617, "epoch": 2908} {"train_loss": -11.783757209777832, "global_step": 488618, "epoch": 2908} {"train_loss": -12.00668716430664, "global_step": 488619, "epoch": 2908} {"train_loss": -11.95437240600586, "global_step": 488620, "epoch": 2908} {"train_loss": -12.02232551574707, "global_step": 488621, "epoch": 2908} {"train_loss": -12.060752868652344, "global_step": 488622, "epoch": 2908} {"train_loss": -11.941703796386719, "global_step": 488623, "epoch": 2908} {"train_loss": -12.066404342651367, "global_step": 488624, "epoch": 2908} {"train_loss": -12.044873237609863, "global_step": 488625, "epoch": 2908} {"train_loss": -12.170930862426758, "global_step": 488626, "epoch": 2908} {"train_loss": -12.50448989868164, "global_step": 488627, "epoch": 2908} {"train_loss": -12.18527889251709, "global_step": 488628, "epoch": 2908} {"train_loss": -12.474207878112793, "global_step": 488629, "epoch": 2908} {"train_loss": -12.432073593139648, "global_step": 488630, "epoch": 2908} {"train_loss": -12.265487670898438, "global_step": 488631, "epoch": 2908} {"train_loss": -12.266729354858398, "global_step": 488632, "epoch": 2908} {"train_loss": -12.2407808303833, "global_step": 488633, "epoch": 2908} {"train_loss": -12.57486343383789, "global_step": 488634, "epoch": 2908} {"train_loss": -12.492202758789062, "global_step": 488635, "epoch": 2908} {"train_loss": -12.515536308288574, "global_step": 488636, "epoch": 2908} {"train_loss": -12.70947551727295, "global_step": 488637, "epoch": 2908} {"train_loss": -12.58461856842041, "global_step": 488638, "epoch": 2908} {"train_loss": -12.689797401428223, "global_step": 488639, "epoch": 2908} {"train_loss": -12.654426574707031, "global_step": 488640, "epoch": 2908} {"train_loss": -12.714839935302734, "global_step": 488641, "epoch": 2908} {"train_loss": -12.873530387878418, "global_step": 488642, "epoch": 2908} {"train_loss": -12.830530166625977, "global_step": 488643, "epoch": 2908} {"train_loss": -12.57899284362793, "global_step": 488644, "epoch": 2908} {"train_loss": -12.767751693725586, "global_step": 488645, "epoch": 2908} {"train_loss": -12.682615280151367, "global_step": 488646, "epoch": 2908} {"train_loss": -12.681589126586914, "global_step": 488647, "epoch": 2908} {"train_loss": -12.70034408569336, "global_step": 488648, "epoch": 2908} {"train_loss": -12.832939147949219, "global_step": 488649, "epoch": 2908} {"train_loss": -12.670463562011719, "global_step": 488650, "epoch": 2908} {"train_loss": -12.814470291137695, "global_step": 488651, "epoch": 2908} {"train_loss": -12.774864196777344, "global_step": 488652, "epoch": 2908} {"train_loss": -12.85883903503418, "global_step": 488653, "epoch": 2908} {"train_loss": -12.652767181396484, "global_step": 488654, "epoch": 2908} {"train_loss": -12.765735626220703, "global_step": 488655, "epoch": 2908} {"train_loss": -12.787042617797852, "global_step": 488656, "epoch": 2908} {"train_loss": -12.840518951416016, "global_step": 488657, "epoch": 2908} {"train_loss": -12.586141586303711, "global_step": 488658, "epoch": 2908} {"train_loss": -13.009836196899414, "global_step": 488659, "epoch": 2908} {"train_loss": -12.79043197631836, "global_step": 488660, "epoch": 2908} {"train_loss": -12.851110458374023, "global_step": 488661, "epoch": 2908} {"train_loss": -12.957549095153809, "global_step": 488662, "epoch": 2908} {"train_loss": -12.85735034942627, "global_step": 488663, "epoch": 2908} {"train_loss": -12.953271865844727, "global_step": 488664, "epoch": 2908} {"train_loss": -12.913562774658203, "global_step": 488665, "epoch": 2908} {"train_loss": -12.6510009765625, "global_step": 488666, "epoch": 2908} {"train_loss": -12.934736251831055, "global_step": 488667, "epoch": 2908} {"train_loss": -12.832160949707031, "global_step": 488668, "epoch": 2908} {"train_loss": -12.83613395690918, "global_step": 488669, "epoch": 2908} {"train_loss": -12.849902153015137, "global_step": 488670, "epoch": 2908} {"train_loss": -13.014760971069336, "global_step": 488671, "epoch": 2908} {"train_loss": -12.969127655029297, "global_step": 488672, "epoch": 2908} {"train_loss": -12.666215896606445, "global_step": 488673, "epoch": 2908} {"train_loss": -12.983139038085938, "global_step": 488674, "epoch": 2908} {"train_loss": -13.01327896118164, "global_step": 488675, "epoch": 2908} {"train_loss": -13.006782531738281, "global_step": 488676, "epoch": 2908} {"train_loss": -12.96424674987793, "global_step": 488677, "epoch": 2908} {"train_loss": -12.94216537475586, "global_step": 488678, "epoch": 2908} {"train_loss": -12.819343566894531, "global_step": 488679, "epoch": 2908} {"train_loss": -13.048940658569336, "global_step": 488680, "epoch": 2908} {"train_loss": -12.833911895751953, "global_step": 488681, "epoch": 2908} {"train_loss": -12.695623397827148, "global_step": 488682, "epoch": 2908} {"train_loss": -12.365463256835938, "global_step": 488683, "epoch": 2908} {"train_loss": -12.952448844909668, "global_step": 488684, "epoch": 2908} {"train_loss": -12.787652969360352, "global_step": 488685, "epoch": 2908} {"train_loss": -12.391894340515137, "global_step": 488686, "epoch": 2908} {"train_loss": -12.743118286132812, "global_step": 488687, "epoch": 2908} {"train_loss": -13.039739608764648, "global_step": 488688, "epoch": 2908} {"train_loss": -12.42042064666748, "global_step": 488689, "epoch": 2908} {"train_loss": -12.497700691223145, "global_step": 488690, "epoch": 2908} {"train_loss": -12.946434020996094, "global_step": 488691, "epoch": 2908} {"train_loss": -12.802728652954102, "global_step": 488692, "epoch": 2908} {"train_loss": -12.342419624328613, "global_step": 488693, "epoch": 2908} {"train_loss": -12.241686820983887, "global_step": 488694, "epoch": 2908} {"train_loss": -12.787431716918945, "global_step": 488695, "epoch": 2908} {"train_loss": -12.64525032043457, "global_step": 488696, "epoch": 2908} {"train_loss": -11.452259063720703, "global_step": 488697, "epoch": 2908} {"train_loss": -12.40092658996582, "global_step": 488698, "epoch": 2908} {"train_loss": -12.512624740600586, "global_step": 488699, "epoch": 2908} {"train_loss": -12.526899337768555, "global_step": 488700, "epoch": 2908} {"train_loss": -12.207940101623535, "global_step": 488701, "epoch": 2908} {"train_loss": -12.576179504394531, "global_step": 488702, "epoch": 2908} {"train_loss": -12.12048625946045, "global_step": 488703, "epoch": 2908} {"train_loss": -11.56580924987793, "global_step": 488704, "epoch": 2908} {"train_loss": -11.842309951782227, "global_step": 488705, "epoch": 2908} {"train_loss": -11.788758277893066, "global_step": 488706, "epoch": 2908} {"train_loss": -11.790508270263672, "global_step": 488707, "epoch": 2908} {"train_loss": -11.23830509185791, "global_step": 488708, "epoch": 2908} {"train_loss": -12.383611679077148, "global_step": 488709, "epoch": 2908} {"train_loss": -11.672996520996094, "global_step": 488710, "epoch": 2908} {"train_loss": -11.98098683924902, "global_step": 488711, "epoch": 2908, "val_loss": 317572.96875} {"train_loss": -11.037095069885254, "global_step": 488712, "epoch": 2909} {"train_loss": -10.813944816589355, "global_step": 488713, "epoch": 2909} {"train_loss": -11.635634422302246, "global_step": 488714, "epoch": 2909} {"train_loss": -11.466052055358887, "global_step": 488715, "epoch": 2909} {"train_loss": -11.354082107543945, "global_step": 488716, "epoch": 2909} {"train_loss": -10.598403930664062, "global_step": 488717, "epoch": 2909} {"train_loss": -11.126399040222168, "global_step": 488718, "epoch": 2909} {"train_loss": -11.061322212219238, "global_step": 488719, "epoch": 2909} {"train_loss": -11.12771987915039, "global_step": 488720, "epoch": 2909} {"train_loss": -11.568373680114746, "global_step": 488721, "epoch": 2909} {"train_loss": -11.326759338378906, "global_step": 488722, "epoch": 2909} {"train_loss": -10.667716026306152, "global_step": 488723, "epoch": 2909} {"train_loss": -10.196626663208008, "global_step": 488724, "epoch": 2909} {"train_loss": -11.351463317871094, "global_step": 488725, "epoch": 2909} {"train_loss": -10.668997764587402, "global_step": 488726, "epoch": 2909} {"train_loss": -10.316237449645996, "global_step": 488727, "epoch": 2909} {"train_loss": -11.66880989074707, "global_step": 488728, "epoch": 2909} {"train_loss": -11.240182876586914, "global_step": 488729, "epoch": 2909} {"train_loss": -11.97981071472168, "global_step": 488730, "epoch": 2909} {"train_loss": -11.263511657714844, "global_step": 488731, "epoch": 2909} {"train_loss": -11.794702529907227, "global_step": 488732, "epoch": 2909} {"train_loss": -11.818853378295898, "global_step": 488733, "epoch": 2909} {"train_loss": -11.3287353515625, "global_step": 488734, "epoch": 2909} {"train_loss": -12.112839698791504, "global_step": 488735, "epoch": 2909} {"train_loss": -11.485382080078125, "global_step": 488736, "epoch": 2909} {"train_loss": -12.273187637329102, "global_step": 488737, "epoch": 2909} {"train_loss": -11.852422714233398, "global_step": 488738, "epoch": 2909} {"train_loss": -12.347021102905273, "global_step": 488739, "epoch": 2909} {"train_loss": -11.883014678955078, "global_step": 488740, "epoch": 2909} {"train_loss": -11.57020092010498, "global_step": 488741, "epoch": 2909} {"train_loss": -12.270007133483887, "global_step": 488742, "epoch": 2909} {"train_loss": -12.143835067749023, "global_step": 488743, "epoch": 2909} {"train_loss": -11.924734115600586, "global_step": 488744, "epoch": 2909} {"train_loss": -12.05253791809082, "global_step": 488745, "epoch": 2909} {"train_loss": -11.578369140625, "global_step": 488746, "epoch": 2909} {"train_loss": -12.501133918762207, "global_step": 488747, "epoch": 2909} {"train_loss": -12.262627601623535, "global_step": 488748, "epoch": 2909} {"train_loss": -11.89706802368164, "global_step": 488749, "epoch": 2909} {"train_loss": -11.94784164428711, "global_step": 488750, "epoch": 2909} {"train_loss": -11.308050155639648, "global_step": 488751, "epoch": 2909} {"train_loss": -11.241844177246094, "global_step": 488752, "epoch": 2909} {"train_loss": -11.201693534851074, "global_step": 488753, "epoch": 2909} {"train_loss": -11.558156967163086, "global_step": 488754, "epoch": 2909} {"train_loss": -11.53770637512207, "global_step": 488755, "epoch": 2909} {"train_loss": -11.989730834960938, "global_step": 488756, "epoch": 2909} {"train_loss": -11.133499145507812, "global_step": 488757, "epoch": 2909} {"train_loss": -12.275755882263184, "global_step": 488758, "epoch": 2909} {"train_loss": -11.553272247314453, "global_step": 488759, "epoch": 2909} {"train_loss": -11.744983673095703, "global_step": 488760, "epoch": 2909} {"train_loss": -11.789854049682617, "global_step": 488761, "epoch": 2909} {"train_loss": -11.897241592407227, "global_step": 488762, "epoch": 2909} {"train_loss": -12.087614059448242, "global_step": 488763, "epoch": 2909} {"train_loss": -11.864381790161133, "global_step": 488764, "epoch": 2909} {"train_loss": -12.11694049835205, "global_step": 488765, "epoch": 2909} {"train_loss": -12.042205810546875, "global_step": 488766, "epoch": 2909} {"train_loss": -12.163556098937988, "global_step": 488767, "epoch": 2909} {"train_loss": -12.034059524536133, "global_step": 488768, "epoch": 2909} {"train_loss": -12.456496238708496, "global_step": 488769, "epoch": 2909} {"train_loss": -12.085464477539062, "global_step": 488770, "epoch": 2909} {"train_loss": -12.258831977844238, "global_step": 488771, "epoch": 2909} {"train_loss": -12.424825668334961, "global_step": 488772, "epoch": 2909} {"train_loss": -12.196516036987305, "global_step": 488773, "epoch": 2909} {"train_loss": -12.45620346069336, "global_step": 488774, "epoch": 2909} {"train_loss": -12.298964500427246, "global_step": 488775, "epoch": 2909} {"train_loss": -12.36379623413086, "global_step": 488776, "epoch": 2909} {"train_loss": -12.263654708862305, "global_step": 488777, "epoch": 2909} {"train_loss": -12.267860412597656, "global_step": 488778, "epoch": 2909} {"train_loss": -12.514044761657715, "global_step": 488779, "epoch": 2909} {"train_loss": -12.356606483459473, "global_step": 488780, "epoch": 2909} {"train_loss": -12.618453979492188, "global_step": 488781, "epoch": 2909} {"train_loss": -12.497867584228516, "global_step": 488782, "epoch": 2909} {"train_loss": -12.467697143554688, "global_step": 488783, "epoch": 2909} {"train_loss": -12.416706085205078, "global_step": 488784, "epoch": 2909} {"train_loss": -11.853443145751953, "global_step": 488785, "epoch": 2909} {"train_loss": -12.635706901550293, "global_step": 488786, "epoch": 2909} {"train_loss": -12.081999778747559, "global_step": 488787, "epoch": 2909} {"train_loss": -12.677724838256836, "global_step": 488788, "epoch": 2909} {"train_loss": -12.123313903808594, "global_step": 488789, "epoch": 2909} {"train_loss": -12.199914932250977, "global_step": 488790, "epoch": 2909} {"train_loss": -12.352459907531738, "global_step": 488791, "epoch": 2909} {"train_loss": -12.53128433227539, "global_step": 488792, "epoch": 2909} {"train_loss": -12.534472465515137, "global_step": 488793, "epoch": 2909} {"train_loss": -12.320568084716797, "global_step": 488794, "epoch": 2909} {"train_loss": -12.656890869140625, "global_step": 488795, "epoch": 2909} {"train_loss": -12.224839210510254, "global_step": 488796, "epoch": 2909} {"train_loss": -12.563887596130371, "global_step": 488797, "epoch": 2909} {"train_loss": -12.250051498413086, "global_step": 488798, "epoch": 2909} {"train_loss": -12.649497032165527, "global_step": 488799, "epoch": 2909} {"train_loss": -12.415205955505371, "global_step": 488800, "epoch": 2909} {"train_loss": -12.782760620117188, "global_step": 488801, "epoch": 2909} {"train_loss": -12.402923583984375, "global_step": 488802, "epoch": 2909} {"train_loss": -12.829602241516113, "global_step": 488803, "epoch": 2909} {"train_loss": -12.362922668457031, "global_step": 488804, "epoch": 2909} {"train_loss": -12.682469367980957, "global_step": 488805, "epoch": 2909} {"train_loss": -12.488260269165039, "global_step": 488806, "epoch": 2909} {"train_loss": -12.925959587097168, "global_step": 488807, "epoch": 2909} {"train_loss": -12.720362663269043, "global_step": 488808, "epoch": 2909} {"train_loss": -12.512385368347168, "global_step": 488809, "epoch": 2909} {"train_loss": -12.902708053588867, "global_step": 488810, "epoch": 2909} {"train_loss": -12.759989738464355, "global_step": 488811, "epoch": 2909} {"train_loss": -12.463028907775879, "global_step": 488812, "epoch": 2909} {"train_loss": -12.72883415222168, "global_step": 488813, "epoch": 2909} {"train_loss": -12.83493709564209, "global_step": 488814, "epoch": 2909} {"train_loss": -12.814934730529785, "global_step": 488815, "epoch": 2909} {"train_loss": -12.824109077453613, "global_step": 488816, "epoch": 2909} {"train_loss": -12.870024681091309, "global_step": 488817, "epoch": 2909} {"train_loss": -12.946537017822266, "global_step": 488818, "epoch": 2909} {"train_loss": -12.793521881103516, "global_step": 488819, "epoch": 2909} {"train_loss": -12.823685646057129, "global_step": 488820, "epoch": 2909} {"train_loss": -12.73598861694336, "global_step": 488821, "epoch": 2909} {"train_loss": -12.841047286987305, "global_step": 488822, "epoch": 2909} {"train_loss": -12.70009994506836, "global_step": 488823, "epoch": 2909} {"train_loss": -13.037195205688477, "global_step": 488824, "epoch": 2909} {"train_loss": -12.999073028564453, "global_step": 488825, "epoch": 2909} {"train_loss": -13.044317245483398, "global_step": 488826, "epoch": 2909} {"train_loss": -12.641616821289062, "global_step": 488827, "epoch": 2909} {"train_loss": -12.72627067565918, "global_step": 488828, "epoch": 2909} {"train_loss": -12.807111740112305, "global_step": 488829, "epoch": 2909} {"train_loss": -12.831034660339355, "global_step": 488830, "epoch": 2909} {"train_loss": -12.87710952758789, "global_step": 488831, "epoch": 2909} {"train_loss": -12.565206527709961, "global_step": 488832, "epoch": 2909} {"train_loss": -12.850492477416992, "global_step": 488833, "epoch": 2909} {"train_loss": -12.786771774291992, "global_step": 488834, "epoch": 2909} {"train_loss": -12.908648490905762, "global_step": 488835, "epoch": 2909} {"train_loss": -12.803055763244629, "global_step": 488836, "epoch": 2909} {"train_loss": -13.057527542114258, "global_step": 488837, "epoch": 2909} {"train_loss": -12.918651580810547, "global_step": 488838, "epoch": 2909} {"train_loss": -12.877506256103516, "global_step": 488839, "epoch": 2909} {"train_loss": -13.058025360107422, "global_step": 488840, "epoch": 2909} {"train_loss": -12.863930702209473, "global_step": 488841, "epoch": 2909} {"train_loss": -12.814035415649414, "global_step": 488842, "epoch": 2909} {"train_loss": -12.928442001342773, "global_step": 488843, "epoch": 2909} {"train_loss": -12.864953994750977, "global_step": 488844, "epoch": 2909} {"train_loss": -12.898619651794434, "global_step": 488845, "epoch": 2909} {"train_loss": -12.722122192382812, "global_step": 488846, "epoch": 2909} {"train_loss": -13.001273155212402, "global_step": 488847, "epoch": 2909} {"train_loss": -13.031107902526855, "global_step": 488848, "epoch": 2909} {"train_loss": -12.737190246582031, "global_step": 488849, "epoch": 2909} {"train_loss": -12.529464721679688, "global_step": 488850, "epoch": 2909} {"train_loss": -12.527658462524414, "global_step": 488851, "epoch": 2909} {"train_loss": -12.916111946105957, "global_step": 488852, "epoch": 2909} {"train_loss": -12.739791870117188, "global_step": 488853, "epoch": 2909} {"train_loss": -12.974781036376953, "global_step": 488854, "epoch": 2909} {"train_loss": -12.830761909484863, "global_step": 488855, "epoch": 2909} {"train_loss": -12.505228042602539, "global_step": 488856, "epoch": 2909} {"train_loss": -12.680747032165527, "global_step": 488857, "epoch": 2909} {"train_loss": -12.772343635559082, "global_step": 488858, "epoch": 2909} {"train_loss": -12.380265235900879, "global_step": 488859, "epoch": 2909} {"train_loss": -12.036401748657227, "global_step": 488860, "epoch": 2909} {"train_loss": -12.66666030883789, "global_step": 488861, "epoch": 2909} {"train_loss": -12.940715789794922, "global_step": 488862, "epoch": 2909} {"train_loss": -11.93710708618164, "global_step": 488863, "epoch": 2909} {"train_loss": -11.54875373840332, "global_step": 488864, "epoch": 2909} {"train_loss": -12.223590850830078, "global_step": 488865, "epoch": 2909} {"train_loss": -10.606433868408203, "global_step": 488866, "epoch": 2909} {"train_loss": -11.641551971435547, "global_step": 488867, "epoch": 2909} {"train_loss": -12.366619110107422, "global_step": 488868, "epoch": 2909} {"train_loss": -9.904735565185547, "global_step": 488869, "epoch": 2909} {"train_loss": -10.185174942016602, "global_step": 488870, "epoch": 2909} {"train_loss": -9.997057914733887, "global_step": 488871, "epoch": 2909} {"train_loss": -10.037879943847656, "global_step": 488872, "epoch": 2909} {"train_loss": -9.006261825561523, "global_step": 488873, "epoch": 2909} {"train_loss": -9.026037216186523, "global_step": 488874, "epoch": 2909} {"train_loss": -9.04403305053711, "global_step": 488875, "epoch": 2909} {"train_loss": -9.75619888305664, "global_step": 488876, "epoch": 2909} {"train_loss": -8.79762077331543, "global_step": 488877, "epoch": 2909} {"train_loss": -9.689861297607422, "global_step": 488878, "epoch": 2909} {"train_loss": -12.048775990804037, "global_step": 488879, "epoch": 2909, "val_loss": 318050.25} {"train_loss": -9.813863754272461, "global_step": 488880, "epoch": 2910} {"train_loss": -9.990493774414062, "global_step": 488881, "epoch": 2910} {"train_loss": -10.772180557250977, "global_step": 488882, "epoch": 2910} {"train_loss": -10.736961364746094, "global_step": 488883, "epoch": 2910} {"train_loss": -10.473003387451172, "global_step": 488884, "epoch": 2910} {"train_loss": -11.30233383178711, "global_step": 488885, "epoch": 2910} {"train_loss": -10.238906860351562, "global_step": 488886, "epoch": 2910} {"train_loss": -10.150362014770508, "global_step": 488887, "epoch": 2910} {"train_loss": -10.247016906738281, "global_step": 488888, "epoch": 2910} {"train_loss": -10.0540771484375, "global_step": 488889, "epoch": 2910} {"train_loss": -10.711071014404297, "global_step": 488890, "epoch": 2910} {"train_loss": -11.010855674743652, "global_step": 488891, "epoch": 2910} {"train_loss": -10.584939956665039, "global_step": 488892, "epoch": 2910} {"train_loss": -11.195652961730957, "global_step": 488893, "epoch": 2910} {"train_loss": -11.187543869018555, "global_step": 488894, "epoch": 2910} {"train_loss": -11.40731430053711, "global_step": 488895, "epoch": 2910} {"train_loss": -11.81907844543457, "global_step": 488896, "epoch": 2910} {"train_loss": -10.921085357666016, "global_step": 488897, "epoch": 2910} {"train_loss": -11.742585182189941, "global_step": 488898, "epoch": 2910} {"train_loss": -11.758543014526367, "global_step": 488899, "epoch": 2910} {"train_loss": -11.69560432434082, "global_step": 488900, "epoch": 2910} {"train_loss": -12.228662490844727, "global_step": 488901, "epoch": 2910} {"train_loss": -12.193389892578125, "global_step": 488902, "epoch": 2910} {"train_loss": -12.27260971069336, "global_step": 488903, "epoch": 2910} {"train_loss": -12.317843437194824, "global_step": 488904, "epoch": 2910} {"train_loss": -11.99498176574707, "global_step": 488905, "epoch": 2910} {"train_loss": -12.341156005859375, "global_step": 488906, "epoch": 2910} {"train_loss": -12.401798248291016, "global_step": 488907, "epoch": 2910} {"train_loss": -12.36301040649414, "global_step": 488908, "epoch": 2910} {"train_loss": -12.357097625732422, "global_step": 488909, "epoch": 2910} {"train_loss": -12.517916679382324, "global_step": 488910, "epoch": 2910} {"train_loss": -12.421941757202148, "global_step": 488911, "epoch": 2910} {"train_loss": -12.582341194152832, "global_step": 488912, "epoch": 2910} {"train_loss": -12.194805145263672, "global_step": 488913, "epoch": 2910} {"train_loss": -12.419050216674805, "global_step": 488914, "epoch": 2910} {"train_loss": -12.586065292358398, "global_step": 488915, "epoch": 2910} {"train_loss": -12.795852661132812, "global_step": 488916, "epoch": 2910} {"train_loss": -12.475648880004883, "global_step": 488917, "epoch": 2910} {"train_loss": -12.825879096984863, "global_step": 488918, "epoch": 2910} {"train_loss": -12.635040283203125, "global_step": 488919, "epoch": 2910} {"train_loss": -12.47340202331543, "global_step": 488920, "epoch": 2910} {"train_loss": -12.428159713745117, "global_step": 488921, "epoch": 2910} {"train_loss": -12.476274490356445, "global_step": 488922, "epoch": 2910} {"train_loss": -12.574854850769043, "global_step": 488923, "epoch": 2910} {"train_loss": -12.841386795043945, "global_step": 488924, "epoch": 2910} {"train_loss": -12.800310134887695, "global_step": 488925, "epoch": 2910} {"train_loss": -12.677837371826172, "global_step": 488926, "epoch": 2910} {"train_loss": -12.799497604370117, "global_step": 488927, "epoch": 2910} {"train_loss": -12.694271087646484, "global_step": 488928, "epoch": 2910} {"train_loss": -12.74869441986084, "global_step": 488929, "epoch": 2910} {"train_loss": -12.646089553833008, "global_step": 488930, "epoch": 2910} {"train_loss": -12.38253402709961, "global_step": 488931, "epoch": 2910} {"train_loss": -12.820291519165039, "global_step": 488932, "epoch": 2910} {"train_loss": -12.685410499572754, "global_step": 488933, "epoch": 2910} {"train_loss": -12.846372604370117, "global_step": 488934, "epoch": 2910} {"train_loss": -12.392549514770508, "global_step": 488935, "epoch": 2910} {"train_loss": -12.480656623840332, "global_step": 488936, "epoch": 2910} {"train_loss": -12.696839332580566, "global_step": 488937, "epoch": 2910} {"train_loss": -12.688465118408203, "global_step": 488938, "epoch": 2910} {"train_loss": -12.756094932556152, "global_step": 488939, "epoch": 2910} {"train_loss": -12.749818801879883, "global_step": 488940, "epoch": 2910} {"train_loss": -12.91081714630127, "global_step": 488941, "epoch": 2910} {"train_loss": -12.726513862609863, "global_step": 488942, "epoch": 2910} {"train_loss": -12.90559196472168, "global_step": 488943, "epoch": 2910} {"train_loss": -12.650927543640137, "global_step": 488944, "epoch": 2910} {"train_loss": -12.748855590820312, "global_step": 488945, "epoch": 2910} {"train_loss": -12.818796157836914, "global_step": 488946, "epoch": 2910} {"train_loss": -12.531435012817383, "global_step": 488947, "epoch": 2910} {"train_loss": -12.509519577026367, "global_step": 488948, "epoch": 2910} {"train_loss": -12.799646377563477, "global_step": 488949, "epoch": 2910} {"train_loss": -12.8134765625, "global_step": 488950, "epoch": 2910} {"train_loss": -12.78504753112793, "global_step": 488951, "epoch": 2910} {"train_loss": -12.384474754333496, "global_step": 488952, "epoch": 2910} {"train_loss": -12.841796875, "global_step": 488953, "epoch": 2910} {"train_loss": -12.565110206604004, "global_step": 488954, "epoch": 2910} {"train_loss": -12.168933868408203, "global_step": 488955, "epoch": 2910} {"train_loss": -11.608957290649414, "global_step": 488956, "epoch": 2910} {"train_loss": -11.943416595458984, "global_step": 488957, "epoch": 2910} {"train_loss": -12.380013465881348, "global_step": 488958, "epoch": 2910} {"train_loss": -12.925018310546875, "global_step": 488959, "epoch": 2910} {"train_loss": -11.72224235534668, "global_step": 488960, "epoch": 2910} {"train_loss": -12.196046829223633, "global_step": 488961, "epoch": 2910} {"train_loss": -12.62247371673584, "global_step": 488962, "epoch": 2910} {"train_loss": -12.485440254211426, "global_step": 488963, "epoch": 2910} {"train_loss": -12.23463249206543, "global_step": 488964, "epoch": 2910} {"train_loss": -12.381132125854492, "global_step": 488965, "epoch": 2910} {"train_loss": -12.770914077758789, "global_step": 488966, "epoch": 2910} {"train_loss": -12.546974182128906, "global_step": 488967, "epoch": 2910} {"train_loss": -12.190082550048828, "global_step": 488968, "epoch": 2910} {"train_loss": -10.99795913696289, "global_step": 488969, "epoch": 2910} {"train_loss": -11.956799507141113, "global_step": 488970, "epoch": 2910} {"train_loss": -10.321584701538086, "global_step": 488971, "epoch": 2910} {"train_loss": -10.565584182739258, "global_step": 488972, "epoch": 2910} {"train_loss": -12.332145690917969, "global_step": 488973, "epoch": 2910} {"train_loss": -10.924887657165527, "global_step": 488974, "epoch": 2910} {"train_loss": -11.26762580871582, "global_step": 488975, "epoch": 2910} {"train_loss": -12.64716911315918, "global_step": 488976, "epoch": 2910} {"train_loss": -10.794134140014648, "global_step": 488977, "epoch": 2910} {"train_loss": -12.215093612670898, "global_step": 488978, "epoch": 2910} {"train_loss": -12.094401359558105, "global_step": 488979, "epoch": 2910} {"train_loss": -11.574604034423828, "global_step": 488980, "epoch": 2910} {"train_loss": -11.658697128295898, "global_step": 488981, "epoch": 2910} {"train_loss": -11.866891860961914, "global_step": 488982, "epoch": 2910} {"train_loss": -12.172843933105469, "global_step": 488983, "epoch": 2910} {"train_loss": -12.407230377197266, "global_step": 488984, "epoch": 2910} {"train_loss": -12.567323684692383, "global_step": 488985, "epoch": 2910} {"train_loss": -12.033670425415039, "global_step": 488986, "epoch": 2910} {"train_loss": -12.746589660644531, "global_step": 488987, "epoch": 2910} {"train_loss": -12.342355728149414, "global_step": 488988, "epoch": 2910} {"train_loss": -12.58845329284668, "global_step": 488989, "epoch": 2910} {"train_loss": -12.162078857421875, "global_step": 488990, "epoch": 2910} {"train_loss": -12.537757873535156, "global_step": 488991, "epoch": 2910} {"train_loss": -12.394147872924805, "global_step": 488992, "epoch": 2910} {"train_loss": -12.631982803344727, "global_step": 488993, "epoch": 2910} {"train_loss": -12.376167297363281, "global_step": 488994, "epoch": 2910} {"train_loss": -12.476371765136719, "global_step": 488995, "epoch": 2910} {"train_loss": -11.85688591003418, "global_step": 488996, "epoch": 2910} {"train_loss": -12.559057235717773, "global_step": 488997, "epoch": 2910} {"train_loss": -12.03305435180664, "global_step": 488998, "epoch": 2910} {"train_loss": -12.500457763671875, "global_step": 488999, "epoch": 2910} {"train_loss": -11.937467575073242, "global_step": 489000, "epoch": 2910} {"train_loss": -12.098557472229004, "global_step": 489001, "epoch": 2910} {"train_loss": -12.469202041625977, "global_step": 489002, "epoch": 2910} {"train_loss": -12.249741554260254, "global_step": 489003, "epoch": 2910} {"train_loss": -12.163687705993652, "global_step": 489004, "epoch": 2910} {"train_loss": -12.180486679077148, "global_step": 489005, "epoch": 2910} {"train_loss": -12.087297439575195, "global_step": 489006, "epoch": 2910} {"train_loss": -11.151538848876953, "global_step": 489007, "epoch": 2910} {"train_loss": -12.200628280639648, "global_step": 489008, "epoch": 2910} {"train_loss": -12.225021362304688, "global_step": 489009, "epoch": 2910} {"train_loss": -11.841511726379395, "global_step": 489010, "epoch": 2910} {"train_loss": -12.223726272583008, "global_step": 489011, "epoch": 2910} {"train_loss": -12.33139705657959, "global_step": 489012, "epoch": 2910} {"train_loss": -12.25879955291748, "global_step": 489013, "epoch": 2910} {"train_loss": -11.934054374694824, "global_step": 489014, "epoch": 2910} {"train_loss": -12.292030334472656, "global_step": 489015, "epoch": 2910} {"train_loss": -12.151217460632324, "global_step": 489016, "epoch": 2910} {"train_loss": -12.541780471801758, "global_step": 489017, "epoch": 2910} {"train_loss": -12.353031158447266, "global_step": 489018, "epoch": 2910} {"train_loss": -12.571863174438477, "global_step": 489019, "epoch": 2910} {"train_loss": -12.392204284667969, "global_step": 489020, "epoch": 2910} {"train_loss": -12.646477699279785, "global_step": 489021, "epoch": 2910} {"train_loss": -12.198461532592773, "global_step": 489022, "epoch": 2910} {"train_loss": -12.184898376464844, "global_step": 489023, "epoch": 2910} {"train_loss": -12.740467071533203, "global_step": 489024, "epoch": 2910} {"train_loss": -12.024248123168945, "global_step": 489025, "epoch": 2910} {"train_loss": -12.838438034057617, "global_step": 489026, "epoch": 2910} {"train_loss": -12.453531265258789, "global_step": 489027, "epoch": 2910} {"train_loss": -12.358564376831055, "global_step": 489028, "epoch": 2910} {"train_loss": -12.647342681884766, "global_step": 489029, "epoch": 2910} {"train_loss": -12.553905487060547, "global_step": 489030, "epoch": 2910} {"train_loss": -12.671220779418945, "global_step": 489031, "epoch": 2910} {"train_loss": -12.290904998779297, "global_step": 489032, "epoch": 2910} {"train_loss": -12.4055814743042, "global_step": 489033, "epoch": 2910} {"train_loss": -12.321024894714355, "global_step": 489034, "epoch": 2910} {"train_loss": -12.799959182739258, "global_step": 489035, "epoch": 2910} {"train_loss": -12.551543235778809, "global_step": 489036, "epoch": 2910} {"train_loss": -12.639228820800781, "global_step": 489037, "epoch": 2910} {"train_loss": -12.83240795135498, "global_step": 489038, "epoch": 2910} {"train_loss": -12.276311874389648, "global_step": 489039, "epoch": 2910} {"train_loss": -12.58205509185791, "global_step": 489040, "epoch": 2910} {"train_loss": -12.248321533203125, "global_step": 489041, "epoch": 2910} {"train_loss": -12.742144584655762, "global_step": 489042, "epoch": 2910} {"train_loss": -12.679320335388184, "global_step": 489043, "epoch": 2910} {"train_loss": -12.235111236572266, "global_step": 489044, "epoch": 2910} {"train_loss": -12.681378364562988, "global_step": 489045, "epoch": 2910} {"train_loss": -12.153157234191895, "global_step": 489046, "epoch": 2910} {"train_loss": -12.164856621197291, "global_step": 489047, "epoch": 2910, "val_loss": 318436.75, "train_action_mse_error": 2.1358935832977295} {"train_loss": -12.095702171325684, "global_step": 489048, "epoch": 2911} {"train_loss": -12.397603988647461, "global_step": 489049, "epoch": 2911} {"train_loss": -12.552000999450684, "global_step": 489050, "epoch": 2911} {"train_loss": -12.390737533569336, "global_step": 489051, "epoch": 2911} {"train_loss": -11.75088882446289, "global_step": 489052, "epoch": 2911} {"train_loss": -12.415842056274414, "global_step": 489053, "epoch": 2911} {"train_loss": -12.54875659942627, "global_step": 489054, "epoch": 2911} {"train_loss": -12.26083755493164, "global_step": 489055, "epoch": 2911} {"train_loss": -12.58061695098877, "global_step": 489056, "epoch": 2911} {"train_loss": -12.275015830993652, "global_step": 489057, "epoch": 2911} {"train_loss": -11.81517219543457, "global_step": 489058, "epoch": 2911} {"train_loss": -12.439091682434082, "global_step": 489059, "epoch": 2911} {"train_loss": -12.382460594177246, "global_step": 489060, "epoch": 2911} {"train_loss": -12.689610481262207, "global_step": 489061, "epoch": 2911} {"train_loss": -12.327905654907227, "global_step": 489062, "epoch": 2911} {"train_loss": -12.634600639343262, "global_step": 489063, "epoch": 2911} {"train_loss": -12.479008674621582, "global_step": 489064, "epoch": 2911} {"train_loss": -12.719072341918945, "global_step": 489065, "epoch": 2911} {"train_loss": -12.483274459838867, "global_step": 489066, "epoch": 2911} {"train_loss": -12.52631950378418, "global_step": 489067, "epoch": 2911} {"train_loss": -12.597982406616211, "global_step": 489068, "epoch": 2911} {"train_loss": -12.83033561706543, "global_step": 489069, "epoch": 2911} {"train_loss": -12.439559936523438, "global_step": 489070, "epoch": 2911} {"train_loss": -12.58176040649414, "global_step": 489071, "epoch": 2911} {"train_loss": -12.689594268798828, "global_step": 489072, "epoch": 2911} {"train_loss": -12.416812896728516, "global_step": 489073, "epoch": 2911} {"train_loss": -12.357303619384766, "global_step": 489074, "epoch": 2911} {"train_loss": -12.243213653564453, "global_step": 489075, "epoch": 2911} {"train_loss": -12.555651664733887, "global_step": 489076, "epoch": 2911} {"train_loss": -12.586471557617188, "global_step": 489077, "epoch": 2911} {"train_loss": -12.169013977050781, "global_step": 489078, "epoch": 2911} {"train_loss": -12.500434875488281, "global_step": 489079, "epoch": 2911} {"train_loss": -12.058138847351074, "global_step": 489080, "epoch": 2911} {"train_loss": -11.667999267578125, "global_step": 489081, "epoch": 2911} {"train_loss": -12.957122802734375, "global_step": 489082, "epoch": 2911} {"train_loss": -12.233699798583984, "global_step": 489083, "epoch": 2911} {"train_loss": -12.063505172729492, "global_step": 489084, "epoch": 2911} {"train_loss": -12.325604438781738, "global_step": 489085, "epoch": 2911} {"train_loss": -11.549540519714355, "global_step": 489086, "epoch": 2911} {"train_loss": -12.575400352478027, "global_step": 489087, "epoch": 2911} {"train_loss": -11.610478401184082, "global_step": 489088, "epoch": 2911} {"train_loss": -11.579659461975098, "global_step": 489089, "epoch": 2911} {"train_loss": -12.109033584594727, "global_step": 489090, "epoch": 2911} {"train_loss": -11.146476745605469, "global_step": 489091, "epoch": 2911} {"train_loss": -10.65396499633789, "global_step": 489092, "epoch": 2911} {"train_loss": -10.860857963562012, "global_step": 489093, "epoch": 2911} {"train_loss": -11.247613906860352, "global_step": 489094, "epoch": 2911} {"train_loss": -11.992111206054688, "global_step": 489095, "epoch": 2911} {"train_loss": -11.553056716918945, "global_step": 489096, "epoch": 2911} {"train_loss": -11.36433219909668, "global_step": 489097, "epoch": 2911} {"train_loss": -12.175680160522461, "global_step": 489098, "epoch": 2911} {"train_loss": -11.918212890625, "global_step": 489099, "epoch": 2911} {"train_loss": -11.32148551940918, "global_step": 489100, "epoch": 2911} {"train_loss": -11.609174728393555, "global_step": 489101, "epoch": 2911} {"train_loss": -12.603371620178223, "global_step": 489102, "epoch": 2911} {"train_loss": -12.363069534301758, "global_step": 489103, "epoch": 2911} {"train_loss": -12.118558883666992, "global_step": 489104, "epoch": 2911} {"train_loss": -12.565285682678223, "global_step": 489105, "epoch": 2911} {"train_loss": -12.597644805908203, "global_step": 489106, "epoch": 2911} {"train_loss": -12.298908233642578, "global_step": 489107, "epoch": 2911} {"train_loss": -12.404146194458008, "global_step": 489108, "epoch": 2911} {"train_loss": -12.05837631225586, "global_step": 489109, "epoch": 2911} {"train_loss": -12.550932884216309, "global_step": 489110, "epoch": 2911} {"train_loss": -12.096292495727539, "global_step": 489111, "epoch": 2911} {"train_loss": -12.478042602539062, "global_step": 489112, "epoch": 2911} {"train_loss": -12.170089721679688, "global_step": 489113, "epoch": 2911} {"train_loss": -12.556085586547852, "global_step": 489114, "epoch": 2911} {"train_loss": -12.324480056762695, "global_step": 489115, "epoch": 2911} {"train_loss": -11.987157821655273, "global_step": 489116, "epoch": 2911} {"train_loss": -12.290261268615723, "global_step": 489117, "epoch": 2911} {"train_loss": -10.908732414245605, "global_step": 489118, "epoch": 2911} {"train_loss": -11.60562515258789, "global_step": 489119, "epoch": 2911} {"train_loss": -12.067248344421387, "global_step": 489120, "epoch": 2911} {"train_loss": -12.24081039428711, "global_step": 489121, "epoch": 2911} {"train_loss": -11.930055618286133, "global_step": 489122, "epoch": 2911} {"train_loss": -12.407318115234375, "global_step": 489123, "epoch": 2911} {"train_loss": -12.040472030639648, "global_step": 489124, "epoch": 2911} {"train_loss": -12.161191940307617, "global_step": 489125, "epoch": 2911} {"train_loss": -12.734781265258789, "global_step": 489126, "epoch": 2911} {"train_loss": -12.288276672363281, "global_step": 489127, "epoch": 2911} {"train_loss": -12.080887794494629, "global_step": 489128, "epoch": 2911} {"train_loss": -12.338277816772461, "global_step": 489129, "epoch": 2911} {"train_loss": -12.386738777160645, "global_step": 489130, "epoch": 2911} {"train_loss": -12.146835327148438, "global_step": 489131, "epoch": 2911} {"train_loss": -12.71066665649414, "global_step": 489132, "epoch": 2911} {"train_loss": -12.063132286071777, "global_step": 489133, "epoch": 2911} {"train_loss": -12.26852798461914, "global_step": 489134, "epoch": 2911} {"train_loss": -12.212236404418945, "global_step": 489135, "epoch": 2911} {"train_loss": -12.432063102722168, "global_step": 489136, "epoch": 2911} {"train_loss": -12.497169494628906, "global_step": 489137, "epoch": 2911} {"train_loss": -11.886838912963867, "global_step": 489138, "epoch": 2911} {"train_loss": -12.298349380493164, "global_step": 489139, "epoch": 2911} {"train_loss": -11.982281684875488, "global_step": 489140, "epoch": 2911} {"train_loss": -12.479934692382812, "global_step": 489141, "epoch": 2911} {"train_loss": -12.396015167236328, "global_step": 489142, "epoch": 2911} {"train_loss": -12.235246658325195, "global_step": 489143, "epoch": 2911} {"train_loss": -12.222585678100586, "global_step": 489144, "epoch": 2911} {"train_loss": -12.234652519226074, "global_step": 489145, "epoch": 2911} {"train_loss": -12.299461364746094, "global_step": 489146, "epoch": 2911} {"train_loss": -12.423852920532227, "global_step": 489147, "epoch": 2911} {"train_loss": -12.572059631347656, "global_step": 489148, "epoch": 2911} {"train_loss": -12.470601081848145, "global_step": 489149, "epoch": 2911} {"train_loss": -12.363533020019531, "global_step": 489150, "epoch": 2911} {"train_loss": -12.525856018066406, "global_step": 489151, "epoch": 2911} {"train_loss": -12.801255226135254, "global_step": 489152, "epoch": 2911} {"train_loss": -12.53891372680664, "global_step": 489153, "epoch": 2911} {"train_loss": -12.325977325439453, "global_step": 489154, "epoch": 2911} {"train_loss": -12.49017333984375, "global_step": 489155, "epoch": 2911} {"train_loss": -12.391756057739258, "global_step": 489156, "epoch": 2911} {"train_loss": -12.26634407043457, "global_step": 489157, "epoch": 2911} {"train_loss": -12.020471572875977, "global_step": 489158, "epoch": 2911} {"train_loss": -11.450092315673828, "global_step": 489159, "epoch": 2911} {"train_loss": -12.217109680175781, "global_step": 489160, "epoch": 2911} {"train_loss": -11.52107048034668, "global_step": 489161, "epoch": 2911} {"train_loss": -12.137128829956055, "global_step": 489162, "epoch": 2911} {"train_loss": -12.117385864257812, "global_step": 489163, "epoch": 2911} {"train_loss": -11.44503402709961, "global_step": 489164, "epoch": 2911} {"train_loss": -10.819012641906738, "global_step": 489165, "epoch": 2911} {"train_loss": -10.825522422790527, "global_step": 489166, "epoch": 2911} {"train_loss": -11.658662796020508, "global_step": 489167, "epoch": 2911} {"train_loss": -8.895503044128418, "global_step": 489168, "epoch": 2911} {"train_loss": -10.562215805053711, "global_step": 489169, "epoch": 2911} {"train_loss": -9.679985046386719, "global_step": 489170, "epoch": 2911} {"train_loss": -9.05180549621582, "global_step": 489171, "epoch": 2911} {"train_loss": -11.825138092041016, "global_step": 489172, "epoch": 2911} {"train_loss": -9.664582252502441, "global_step": 489173, "epoch": 2911} {"train_loss": -11.89912223815918, "global_step": 489174, "epoch": 2911} {"train_loss": -9.569549560546875, "global_step": 489175, "epoch": 2911} {"train_loss": -10.301840782165527, "global_step": 489176, "epoch": 2911} {"train_loss": -10.545135498046875, "global_step": 489177, "epoch": 2911} {"train_loss": -8.759702682495117, "global_step": 489178, "epoch": 2911} {"train_loss": -10.771379470825195, "global_step": 489179, "epoch": 2911} {"train_loss": -7.749223232269287, "global_step": 489180, "epoch": 2911} {"train_loss": -8.79828929901123, "global_step": 489181, "epoch": 2911} {"train_loss": -10.47353744506836, "global_step": 489182, "epoch": 2911} {"train_loss": -9.667802810668945, "global_step": 489183, "epoch": 2911} {"train_loss": -10.988077163696289, "global_step": 489184, "epoch": 2911} {"train_loss": -9.798221588134766, "global_step": 489185, "epoch": 2911} {"train_loss": -9.532670021057129, "global_step": 489186, "epoch": 2911} {"train_loss": -10.790494918823242, "global_step": 489187, "epoch": 2911} {"train_loss": -11.279312133789062, "global_step": 489188, "epoch": 2911} {"train_loss": -10.616732597351074, "global_step": 489189, "epoch": 2911} {"train_loss": -11.499000549316406, "global_step": 489190, "epoch": 2911} {"train_loss": -11.109613418579102, "global_step": 489191, "epoch": 2911} {"train_loss": -11.006711959838867, "global_step": 489192, "epoch": 2911} {"train_loss": -11.296110153198242, "global_step": 489193, "epoch": 2911} {"train_loss": -11.019658088684082, "global_step": 489194, "epoch": 2911} {"train_loss": -10.930709838867188, "global_step": 489195, "epoch": 2911} {"train_loss": -11.978208541870117, "global_step": 489196, "epoch": 2911} {"train_loss": -11.324499130249023, "global_step": 489197, "epoch": 2911} {"train_loss": -11.565164566040039, "global_step": 489198, "epoch": 2911} {"train_loss": -12.03996753692627, "global_step": 489199, "epoch": 2911} {"train_loss": -11.926855087280273, "global_step": 489200, "epoch": 2911} {"train_loss": -11.807955741882324, "global_step": 489201, "epoch": 2911} {"train_loss": -12.152838706970215, "global_step": 489202, "epoch": 2911} {"train_loss": -11.740362167358398, "global_step": 489203, "epoch": 2911} {"train_loss": -11.879855155944824, "global_step": 489204, "epoch": 2911} {"train_loss": -12.371370315551758, "global_step": 489205, "epoch": 2911} {"train_loss": -11.756782531738281, "global_step": 489206, "epoch": 2911} {"train_loss": -12.375667572021484, "global_step": 489207, "epoch": 2911} {"train_loss": -12.16712760925293, "global_step": 489208, "epoch": 2911} {"train_loss": -12.08534049987793, "global_step": 489209, "epoch": 2911} {"train_loss": -11.97750473022461, "global_step": 489210, "epoch": 2911} {"train_loss": -12.388404846191406, "global_step": 489211, "epoch": 2911} {"train_loss": -12.217192649841309, "global_step": 489212, "epoch": 2911} {"train_loss": -12.133268356323242, "global_step": 489213, "epoch": 2911} {"train_loss": -12.555431365966797, "global_step": 489214, "epoch": 2911} {"train_loss": -11.839736333915166, "global_step": 489215, "epoch": 2911, "val_loss": 316178.03125} {"train_loss": -12.351994514465332, "global_step": 489216, "epoch": 2912} {"train_loss": -12.403371810913086, "global_step": 489217, "epoch": 2912} {"train_loss": -12.178045272827148, "global_step": 489218, "epoch": 2912} {"train_loss": -12.080024719238281, "global_step": 489219, "epoch": 2912} {"train_loss": -12.369277954101562, "global_step": 489220, "epoch": 2912} {"train_loss": -12.461368560791016, "global_step": 489221, "epoch": 2912} {"train_loss": -12.129706382751465, "global_step": 489222, "epoch": 2912} {"train_loss": -12.516225814819336, "global_step": 489223, "epoch": 2912} {"train_loss": -12.075767517089844, "global_step": 489224, "epoch": 2912} {"train_loss": -12.3896484375, "global_step": 489225, "epoch": 2912} {"train_loss": -12.41124153137207, "global_step": 489226, "epoch": 2912} {"train_loss": -11.987924575805664, "global_step": 489227, "epoch": 2912} {"train_loss": -12.407696723937988, "global_step": 489228, "epoch": 2912} {"train_loss": -12.363822937011719, "global_step": 489229, "epoch": 2912} {"train_loss": -12.480886459350586, "global_step": 489230, "epoch": 2912} {"train_loss": -12.376330375671387, "global_step": 489231, "epoch": 2912} {"train_loss": -12.702905654907227, "global_step": 489232, "epoch": 2912} {"train_loss": -12.385709762573242, "global_step": 489233, "epoch": 2912} {"train_loss": -12.620893478393555, "global_step": 489234, "epoch": 2912} {"train_loss": -12.503847122192383, "global_step": 489235, "epoch": 2912} {"train_loss": -12.51897144317627, "global_step": 489236, "epoch": 2912} {"train_loss": -12.677106857299805, "global_step": 489237, "epoch": 2912} {"train_loss": -12.546613693237305, "global_step": 489238, "epoch": 2912} {"train_loss": -12.453439712524414, "global_step": 489239, "epoch": 2912} {"train_loss": -12.398370742797852, "global_step": 489240, "epoch": 2912} {"train_loss": -12.593270301818848, "global_step": 489241, "epoch": 2912} {"train_loss": -12.440585136413574, "global_step": 489242, "epoch": 2912} {"train_loss": -12.615313529968262, "global_step": 489243, "epoch": 2912} {"train_loss": -12.565597534179688, "global_step": 489244, "epoch": 2912} {"train_loss": -12.470229148864746, "global_step": 489245, "epoch": 2912} {"train_loss": -12.733335494995117, "global_step": 489246, "epoch": 2912} {"train_loss": -12.648588180541992, "global_step": 489247, "epoch": 2912} {"train_loss": -12.722650527954102, "global_step": 489248, "epoch": 2912} {"train_loss": -12.555834770202637, "global_step": 489249, "epoch": 2912} {"train_loss": -12.646990776062012, "global_step": 489250, "epoch": 2912} {"train_loss": -12.487003326416016, "global_step": 489251, "epoch": 2912} {"train_loss": -12.786276817321777, "global_step": 489252, "epoch": 2912} {"train_loss": -12.643451690673828, "global_step": 489253, "epoch": 2912} {"train_loss": -12.767000198364258, "global_step": 489254, "epoch": 2912} {"train_loss": -12.555889129638672, "global_step": 489255, "epoch": 2912} {"train_loss": -12.685141563415527, "global_step": 489256, "epoch": 2912} {"train_loss": -12.613626480102539, "global_step": 489257, "epoch": 2912} {"train_loss": -12.75089168548584, "global_step": 489258, "epoch": 2912} {"train_loss": -12.741256713867188, "global_step": 489259, "epoch": 2912} {"train_loss": -12.656429290771484, "global_step": 489260, "epoch": 2912} {"train_loss": -12.811163902282715, "global_step": 489261, "epoch": 2912} {"train_loss": -12.635842323303223, "global_step": 489262, "epoch": 2912} {"train_loss": -12.505213737487793, "global_step": 489263, "epoch": 2912} {"train_loss": -12.780098915100098, "global_step": 489264, "epoch": 2912} {"train_loss": -12.52348804473877, "global_step": 489265, "epoch": 2912} {"train_loss": -12.677770614624023, "global_step": 489266, "epoch": 2912} {"train_loss": -12.358491897583008, "global_step": 489267, "epoch": 2912} {"train_loss": -12.637467384338379, "global_step": 489268, "epoch": 2912} {"train_loss": -12.399225234985352, "global_step": 489269, "epoch": 2912} {"train_loss": -12.816645622253418, "global_step": 489270, "epoch": 2912} {"train_loss": -12.348796844482422, "global_step": 489271, "epoch": 2912} {"train_loss": -12.902874946594238, "global_step": 489272, "epoch": 2912} {"train_loss": -12.565638542175293, "global_step": 489273, "epoch": 2912} {"train_loss": -12.685718536376953, "global_step": 489274, "epoch": 2912} {"train_loss": -12.56766128540039, "global_step": 489275, "epoch": 2912} {"train_loss": -12.518272399902344, "global_step": 489276, "epoch": 2912} {"train_loss": -12.384073257446289, "global_step": 489277, "epoch": 2912} {"train_loss": -12.294498443603516, "global_step": 489278, "epoch": 2912} {"train_loss": -12.497001647949219, "global_step": 489279, "epoch": 2912} {"train_loss": -12.458675384521484, "global_step": 489280, "epoch": 2912} {"train_loss": -12.623455047607422, "global_step": 489281, "epoch": 2912} {"train_loss": -12.141304016113281, "global_step": 489282, "epoch": 2912} {"train_loss": -12.124187469482422, "global_step": 489283, "epoch": 2912} {"train_loss": -12.775578498840332, "global_step": 489284, "epoch": 2912} {"train_loss": -12.335886001586914, "global_step": 489285, "epoch": 2912} {"train_loss": -11.769537925720215, "global_step": 489286, "epoch": 2912} {"train_loss": -12.546902656555176, "global_step": 489287, "epoch": 2912} {"train_loss": -12.764461517333984, "global_step": 489288, "epoch": 2912} {"train_loss": -12.629426956176758, "global_step": 489289, "epoch": 2912} {"train_loss": -12.56090259552002, "global_step": 489290, "epoch": 2912} {"train_loss": -12.522720336914062, "global_step": 489291, "epoch": 2912} {"train_loss": -12.791177749633789, "global_step": 489292, "epoch": 2912} {"train_loss": -12.442229270935059, "global_step": 489293, "epoch": 2912} {"train_loss": -12.656728744506836, "global_step": 489294, "epoch": 2912} {"train_loss": -12.512900352478027, "global_step": 489295, "epoch": 2912} {"train_loss": -12.375211715698242, "global_step": 489296, "epoch": 2912} {"train_loss": -12.449411392211914, "global_step": 489297, "epoch": 2912} {"train_loss": -12.50635051727295, "global_step": 489298, "epoch": 2912} {"train_loss": -12.612351417541504, "global_step": 489299, "epoch": 2912} {"train_loss": -12.429500579833984, "global_step": 489300, "epoch": 2912} {"train_loss": -12.143875122070312, "global_step": 489301, "epoch": 2912} {"train_loss": -12.443927764892578, "global_step": 489302, "epoch": 2912} {"train_loss": -12.319051742553711, "global_step": 489303, "epoch": 2912} {"train_loss": -12.237344741821289, "global_step": 489304, "epoch": 2912} {"train_loss": -12.323923110961914, "global_step": 489305, "epoch": 2912} {"train_loss": -12.062919616699219, "global_step": 489306, "epoch": 2912} {"train_loss": -11.601935386657715, "global_step": 489307, "epoch": 2912} {"train_loss": -11.171562194824219, "global_step": 489308, "epoch": 2912} {"train_loss": -11.904472351074219, "global_step": 489309, "epoch": 2912} {"train_loss": -12.510662078857422, "global_step": 489310, "epoch": 2912} {"train_loss": -11.76774787902832, "global_step": 489311, "epoch": 2912} {"train_loss": -12.203227996826172, "global_step": 489312, "epoch": 2912} {"train_loss": -12.59361457824707, "global_step": 489313, "epoch": 2912} {"train_loss": -12.261804580688477, "global_step": 489314, "epoch": 2912} {"train_loss": -12.08644962310791, "global_step": 489315, "epoch": 2912} {"train_loss": -12.052705764770508, "global_step": 489316, "epoch": 2912} {"train_loss": -12.489907264709473, "global_step": 489317, "epoch": 2912} {"train_loss": -12.030235290527344, "global_step": 489318, "epoch": 2912} {"train_loss": -12.24247932434082, "global_step": 489319, "epoch": 2912} {"train_loss": -12.9341459274292, "global_step": 489320, "epoch": 2912} {"train_loss": -12.546462059020996, "global_step": 489321, "epoch": 2912} {"train_loss": -12.798276901245117, "global_step": 489322, "epoch": 2912} {"train_loss": -12.420125961303711, "global_step": 489323, "epoch": 2912} {"train_loss": -12.866278648376465, "global_step": 489324, "epoch": 2912} {"train_loss": -12.471231460571289, "global_step": 489325, "epoch": 2912} {"train_loss": -12.491769790649414, "global_step": 489326, "epoch": 2912} {"train_loss": -12.936700820922852, "global_step": 489327, "epoch": 2912} {"train_loss": -12.535005569458008, "global_step": 489328, "epoch": 2912} {"train_loss": -12.347640037536621, "global_step": 489329, "epoch": 2912} {"train_loss": -12.945813179016113, "global_step": 489330, "epoch": 2912} {"train_loss": -12.651785850524902, "global_step": 489331, "epoch": 2912} {"train_loss": -12.057592391967773, "global_step": 489332, "epoch": 2912} {"train_loss": -12.634998321533203, "global_step": 489333, "epoch": 2912} {"train_loss": -12.71798038482666, "global_step": 489334, "epoch": 2912} {"train_loss": -12.285615921020508, "global_step": 489335, "epoch": 2912} {"train_loss": -12.809576034545898, "global_step": 489336, "epoch": 2912} {"train_loss": -12.550996780395508, "global_step": 489337, "epoch": 2912} {"train_loss": -12.554043769836426, "global_step": 489338, "epoch": 2912} {"train_loss": -12.266822814941406, "global_step": 489339, "epoch": 2912} {"train_loss": -12.673736572265625, "global_step": 489340, "epoch": 2912} {"train_loss": -12.10533618927002, "global_step": 489341, "epoch": 2912} {"train_loss": -10.171982765197754, "global_step": 489342, "epoch": 2912} {"train_loss": -12.108692169189453, "global_step": 489343, "epoch": 2912} {"train_loss": -11.95976448059082, "global_step": 489344, "epoch": 2912} {"train_loss": -12.150968551635742, "global_step": 489345, "epoch": 2912} {"train_loss": -12.340397834777832, "global_step": 489346, "epoch": 2912} {"train_loss": -12.053768157958984, "global_step": 489347, "epoch": 2912} {"train_loss": -11.866172790527344, "global_step": 489348, "epoch": 2912} {"train_loss": -12.380300521850586, "global_step": 489349, "epoch": 2912} {"train_loss": -12.36917495727539, "global_step": 489350, "epoch": 2912} {"train_loss": -12.699743270874023, "global_step": 489351, "epoch": 2912} {"train_loss": -12.72714614868164, "global_step": 489352, "epoch": 2912} {"train_loss": -12.625327110290527, "global_step": 489353, "epoch": 2912} {"train_loss": -12.45997428894043, "global_step": 489354, "epoch": 2912} {"train_loss": -12.570701599121094, "global_step": 489355, "epoch": 2912} {"train_loss": -12.317471504211426, "global_step": 489356, "epoch": 2912} {"train_loss": -12.390546798706055, "global_step": 489357, "epoch": 2912} {"train_loss": -12.858003616333008, "global_step": 489358, "epoch": 2912} {"train_loss": -12.543779373168945, "global_step": 489359, "epoch": 2912} {"train_loss": -11.982275009155273, "global_step": 489360, "epoch": 2912} {"train_loss": -12.380979537963867, "global_step": 489361, "epoch": 2912} {"train_loss": -12.642702102661133, "global_step": 489362, "epoch": 2912} {"train_loss": -11.664224624633789, "global_step": 489363, "epoch": 2912} {"train_loss": -12.45634651184082, "global_step": 489364, "epoch": 2912} {"train_loss": -12.4721040725708, "global_step": 489365, "epoch": 2912} {"train_loss": -12.185670852661133, "global_step": 489366, "epoch": 2912} {"train_loss": -11.780036926269531, "global_step": 489367, "epoch": 2912} {"train_loss": -12.389982223510742, "global_step": 489368, "epoch": 2912} {"train_loss": -12.611425399780273, "global_step": 489369, "epoch": 2912} {"train_loss": -12.651588439941406, "global_step": 489370, "epoch": 2912} {"train_loss": -12.650579452514648, "global_step": 489371, "epoch": 2912} {"train_loss": -12.501826286315918, "global_step": 489372, "epoch": 2912} {"train_loss": -12.818225860595703, "global_step": 489373, "epoch": 2912} {"train_loss": -12.65345287322998, "global_step": 489374, "epoch": 2912} {"train_loss": -12.80628776550293, "global_step": 489375, "epoch": 2912} {"train_loss": -12.06801700592041, "global_step": 489376, "epoch": 2912} {"train_loss": -12.606269836425781, "global_step": 489377, "epoch": 2912} {"train_loss": -12.146381378173828, "global_step": 489378, "epoch": 2912} {"train_loss": -12.064435958862305, "global_step": 489379, "epoch": 2912} {"train_loss": -12.396440505981445, "global_step": 489380, "epoch": 2912} {"train_loss": -12.233905792236328, "global_step": 489381, "epoch": 2912} {"train_loss": -11.461343765258789, "global_step": 489382, "epoch": 2912} {"train_loss": -12.422524259203957, "global_step": 489383, "epoch": 2912, "val_loss": 320699.75} {"train_loss": -11.980134963989258, "global_step": 489384, "epoch": 2913} {"train_loss": -12.283334732055664, "global_step": 489385, "epoch": 2913} {"train_loss": -11.888378143310547, "global_step": 489386, "epoch": 2913} {"train_loss": -11.896876335144043, "global_step": 489387, "epoch": 2913} {"train_loss": -12.443275451660156, "global_step": 489388, "epoch": 2913} {"train_loss": -12.445991516113281, "global_step": 489389, "epoch": 2913} {"train_loss": -12.165557861328125, "global_step": 489390, "epoch": 2913} {"train_loss": -12.663750648498535, "global_step": 489391, "epoch": 2913} {"train_loss": -12.143183708190918, "global_step": 489392, "epoch": 2913} {"train_loss": -12.482625961303711, "global_step": 489393, "epoch": 2913} {"train_loss": -12.44720458984375, "global_step": 489394, "epoch": 2913} {"train_loss": -12.330312728881836, "global_step": 489395, "epoch": 2913} {"train_loss": -12.584299087524414, "global_step": 489396, "epoch": 2913} {"train_loss": -12.558913230895996, "global_step": 489397, "epoch": 2913} {"train_loss": -12.59813117980957, "global_step": 489398, "epoch": 2913} {"train_loss": -12.19083023071289, "global_step": 489399, "epoch": 2913} {"train_loss": -12.830354690551758, "global_step": 489400, "epoch": 2913} {"train_loss": -12.519996643066406, "global_step": 489401, "epoch": 2913} {"train_loss": -12.380757331848145, "global_step": 489402, "epoch": 2913} {"train_loss": -12.383857727050781, "global_step": 489403, "epoch": 2913} {"train_loss": -12.215557098388672, "global_step": 489404, "epoch": 2913} {"train_loss": -12.407276153564453, "global_step": 489405, "epoch": 2913} {"train_loss": -12.51095199584961, "global_step": 489406, "epoch": 2913} {"train_loss": -12.576024055480957, "global_step": 489407, "epoch": 2913} {"train_loss": -12.607755661010742, "global_step": 489408, "epoch": 2913} {"train_loss": -12.414493560791016, "global_step": 489409, "epoch": 2913} {"train_loss": -12.348140716552734, "global_step": 489410, "epoch": 2913} {"train_loss": -12.297911643981934, "global_step": 489411, "epoch": 2913} {"train_loss": -12.78637981414795, "global_step": 489412, "epoch": 2913} {"train_loss": -12.299640655517578, "global_step": 489413, "epoch": 2913} {"train_loss": -12.434450149536133, "global_step": 489414, "epoch": 2913} {"train_loss": -12.525970458984375, "global_step": 489415, "epoch": 2913} {"train_loss": -12.623165130615234, "global_step": 489416, "epoch": 2913} {"train_loss": -11.805644989013672, "global_step": 489417, "epoch": 2913} {"train_loss": -12.67292594909668, "global_step": 489418, "epoch": 2913} {"train_loss": -12.730439186096191, "global_step": 489419, "epoch": 2913} {"train_loss": -12.43408203125, "global_step": 489420, "epoch": 2913} {"train_loss": -12.167121887207031, "global_step": 489421, "epoch": 2913} {"train_loss": -12.35759162902832, "global_step": 489422, "epoch": 2913} {"train_loss": -12.591558456420898, "global_step": 489423, "epoch": 2913} {"train_loss": -12.377198219299316, "global_step": 489424, "epoch": 2913} {"train_loss": -11.837139129638672, "global_step": 489425, "epoch": 2913} {"train_loss": -11.720403671264648, "global_step": 489426, "epoch": 2913} {"train_loss": -12.522744178771973, "global_step": 489427, "epoch": 2913} {"train_loss": -12.334511756896973, "global_step": 489428, "epoch": 2913} {"train_loss": -11.235713005065918, "global_step": 489429, "epoch": 2913} {"train_loss": -12.531525611877441, "global_step": 489430, "epoch": 2913} {"train_loss": -12.458154678344727, "global_step": 489431, "epoch": 2913} {"train_loss": -11.579432487487793, "global_step": 489432, "epoch": 2913} {"train_loss": -12.65639877319336, "global_step": 489433, "epoch": 2913} {"train_loss": -12.281098365783691, "global_step": 489434, "epoch": 2913} {"train_loss": -12.320192337036133, "global_step": 489435, "epoch": 2913} {"train_loss": -12.301901817321777, "global_step": 489436, "epoch": 2913} {"train_loss": -12.549097061157227, "global_step": 489437, "epoch": 2913} {"train_loss": -12.017437934875488, "global_step": 489438, "epoch": 2913} {"train_loss": -12.391733169555664, "global_step": 489439, "epoch": 2913} {"train_loss": -11.566558837890625, "global_step": 489440, "epoch": 2913} {"train_loss": -12.345800399780273, "global_step": 489441, "epoch": 2913} {"train_loss": -11.930070877075195, "global_step": 489442, "epoch": 2913} {"train_loss": -12.098745346069336, "global_step": 489443, "epoch": 2913} {"train_loss": -12.695566177368164, "global_step": 489444, "epoch": 2913} {"train_loss": -11.925979614257812, "global_step": 489445, "epoch": 2913} {"train_loss": -12.41543197631836, "global_step": 489446, "epoch": 2913} {"train_loss": -12.37823486328125, "global_step": 489447, "epoch": 2913} {"train_loss": -12.42451286315918, "global_step": 489448, "epoch": 2913} {"train_loss": -12.449338912963867, "global_step": 489449, "epoch": 2913} {"train_loss": -12.178902626037598, "global_step": 489450, "epoch": 2913} {"train_loss": -11.906098365783691, "global_step": 489451, "epoch": 2913} {"train_loss": -12.504785537719727, "global_step": 489452, "epoch": 2913} {"train_loss": -12.035958290100098, "global_step": 489453, "epoch": 2913} {"train_loss": -11.992043495178223, "global_step": 489454, "epoch": 2913} {"train_loss": -12.531098365783691, "global_step": 489455, "epoch": 2913} {"train_loss": -11.861146926879883, "global_step": 489456, "epoch": 2913} {"train_loss": -12.074607849121094, "global_step": 489457, "epoch": 2913} {"train_loss": -11.48888111114502, "global_step": 489458, "epoch": 2913} {"train_loss": -12.78736686706543, "global_step": 489459, "epoch": 2913} {"train_loss": -11.90286922454834, "global_step": 489460, "epoch": 2913} {"train_loss": -12.145186424255371, "global_step": 489461, "epoch": 2913} {"train_loss": -12.14583969116211, "global_step": 489462, "epoch": 2913} {"train_loss": -11.886083602905273, "global_step": 489463, "epoch": 2913} {"train_loss": -12.956470489501953, "global_step": 489464, "epoch": 2913} {"train_loss": -12.10887336730957, "global_step": 489465, "epoch": 2913} {"train_loss": -12.8042631149292, "global_step": 489466, "epoch": 2913} {"train_loss": -12.368948936462402, "global_step": 489467, "epoch": 2913} {"train_loss": -12.936650276184082, "global_step": 489468, "epoch": 2913} {"train_loss": -12.792886734008789, "global_step": 489469, "epoch": 2913} {"train_loss": -12.826408386230469, "global_step": 489470, "epoch": 2913} {"train_loss": -12.714923858642578, "global_step": 489471, "epoch": 2913} {"train_loss": -12.967998504638672, "global_step": 489472, "epoch": 2913} {"train_loss": -12.577131271362305, "global_step": 489473, "epoch": 2913} {"train_loss": -12.681339263916016, "global_step": 489474, "epoch": 2913} {"train_loss": -12.88906478881836, "global_step": 489475, "epoch": 2913} {"train_loss": -12.718585014343262, "global_step": 489476, "epoch": 2913} {"train_loss": -13.030988693237305, "global_step": 489477, "epoch": 2913} {"train_loss": -12.823356628417969, "global_step": 489478, "epoch": 2913} {"train_loss": -13.046272277832031, "global_step": 489479, "epoch": 2913} {"train_loss": -12.78653335571289, "global_step": 489480, "epoch": 2913} {"train_loss": -12.881624221801758, "global_step": 489481, "epoch": 2913} {"train_loss": -13.004670143127441, "global_step": 489482, "epoch": 2913} {"train_loss": -12.773908615112305, "global_step": 489483, "epoch": 2913} {"train_loss": -12.636672019958496, "global_step": 489484, "epoch": 2913} {"train_loss": -12.734365463256836, "global_step": 489485, "epoch": 2913} {"train_loss": -12.726676940917969, "global_step": 489486, "epoch": 2913} {"train_loss": -12.677209854125977, "global_step": 489487, "epoch": 2913} {"train_loss": -12.970139503479004, "global_step": 489488, "epoch": 2913} {"train_loss": -12.560388565063477, "global_step": 489489, "epoch": 2913} {"train_loss": -12.462961196899414, "global_step": 489490, "epoch": 2913} {"train_loss": -12.517623901367188, "global_step": 489491, "epoch": 2913} {"train_loss": -12.698877334594727, "global_step": 489492, "epoch": 2913} {"train_loss": -12.580545425415039, "global_step": 489493, "epoch": 2913} {"train_loss": -12.050920486450195, "global_step": 489494, "epoch": 2913} {"train_loss": -12.111335754394531, "global_step": 489495, "epoch": 2913} {"train_loss": -12.774431228637695, "global_step": 489496, "epoch": 2913} {"train_loss": -12.021587371826172, "global_step": 489497, "epoch": 2913} {"train_loss": -12.816573143005371, "global_step": 489498, "epoch": 2913} {"train_loss": -12.438817977905273, "global_step": 489499, "epoch": 2913} {"train_loss": -12.976826667785645, "global_step": 489500, "epoch": 2913} {"train_loss": -12.502723693847656, "global_step": 489501, "epoch": 2913} {"train_loss": -12.839298248291016, "global_step": 489502, "epoch": 2913} {"train_loss": -12.511009216308594, "global_step": 489503, "epoch": 2913} {"train_loss": -12.880819320678711, "global_step": 489504, "epoch": 2913} {"train_loss": -12.585087776184082, "global_step": 489505, "epoch": 2913} {"train_loss": -12.523271560668945, "global_step": 489506, "epoch": 2913} {"train_loss": -12.221383094787598, "global_step": 489507, "epoch": 2913} {"train_loss": -12.520212173461914, "global_step": 489508, "epoch": 2913} {"train_loss": -12.895825386047363, "global_step": 489509, "epoch": 2913} {"train_loss": -12.703729629516602, "global_step": 489510, "epoch": 2913} {"train_loss": -12.787674903869629, "global_step": 489511, "epoch": 2913} {"train_loss": -12.793383598327637, "global_step": 489512, "epoch": 2913} {"train_loss": -12.472582817077637, "global_step": 489513, "epoch": 2913} {"train_loss": -12.607612609863281, "global_step": 489514, "epoch": 2913} {"train_loss": -12.55371379852295, "global_step": 489515, "epoch": 2913} {"train_loss": -12.618597984313965, "global_step": 489516, "epoch": 2913} {"train_loss": -12.46287727355957, "global_step": 489517, "epoch": 2913} {"train_loss": -12.418923377990723, "global_step": 489518, "epoch": 2913} {"train_loss": -12.43952751159668, "global_step": 489519, "epoch": 2913} {"train_loss": -12.502884864807129, "global_step": 489520, "epoch": 2913} {"train_loss": -12.60545539855957, "global_step": 489521, "epoch": 2913} {"train_loss": -12.232937812805176, "global_step": 489522, "epoch": 2913} {"train_loss": -12.892696380615234, "global_step": 489523, "epoch": 2913} {"train_loss": -11.997787475585938, "global_step": 489524, "epoch": 2913} {"train_loss": -12.189927101135254, "global_step": 489525, "epoch": 2913} {"train_loss": -12.768739700317383, "global_step": 489526, "epoch": 2913} {"train_loss": -12.307615280151367, "global_step": 489527, "epoch": 2913} {"train_loss": -12.475497245788574, "global_step": 489528, "epoch": 2913} {"train_loss": -12.677366256713867, "global_step": 489529, "epoch": 2913} {"train_loss": -12.231292724609375, "global_step": 489530, "epoch": 2913} {"train_loss": -12.236379623413086, "global_step": 489531, "epoch": 2913} {"train_loss": -12.407987594604492, "global_step": 489532, "epoch": 2913} {"train_loss": -11.748416900634766, "global_step": 489533, "epoch": 2913} {"train_loss": -10.300918579101562, "global_step": 489534, "epoch": 2913} {"train_loss": -12.293131828308105, "global_step": 489535, "epoch": 2913} {"train_loss": -11.212458610534668, "global_step": 489536, "epoch": 2913} {"train_loss": -10.849617958068848, "global_step": 489537, "epoch": 2913} {"train_loss": -11.76518440246582, "global_step": 489538, "epoch": 2913} {"train_loss": -11.016487121582031, "global_step": 489539, "epoch": 2913} {"train_loss": -10.929035186767578, "global_step": 489540, "epoch": 2913} {"train_loss": -11.206623077392578, "global_step": 489541, "epoch": 2913} {"train_loss": -11.89642333984375, "global_step": 489542, "epoch": 2913} {"train_loss": -10.343802452087402, "global_step": 489543, "epoch": 2913} {"train_loss": -12.284562110900879, "global_step": 489544, "epoch": 2913} {"train_loss": -11.898941993713379, "global_step": 489545, "epoch": 2913} {"train_loss": -12.178905487060547, "global_step": 489546, "epoch": 2913} {"train_loss": -11.508827209472656, "global_step": 489547, "epoch": 2913} {"train_loss": -12.620283126831055, "global_step": 489548, "epoch": 2913} {"train_loss": -12.006245613098145, "global_step": 489549, "epoch": 2913} {"train_loss": -11.69728946685791, "global_step": 489550, "epoch": 2913} {"train_loss": -12.338714247658139, "global_step": 489551, "epoch": 2913, "val_loss": 317919.40625} {"train_loss": -11.957468032836914, "global_step": 489552, "epoch": 2914} {"train_loss": -11.698387145996094, "global_step": 489553, "epoch": 2914} {"train_loss": -12.108379364013672, "global_step": 489554, "epoch": 2914} {"train_loss": -11.541902542114258, "global_step": 489555, "epoch": 2914} {"train_loss": -11.909950256347656, "global_step": 489556, "epoch": 2914} {"train_loss": -12.007152557373047, "global_step": 489557, "epoch": 2914} {"train_loss": -10.977540969848633, "global_step": 489558, "epoch": 2914} {"train_loss": -12.141189575195312, "global_step": 489559, "epoch": 2914} {"train_loss": -11.972346305847168, "global_step": 489560, "epoch": 2914} {"train_loss": -12.042054176330566, "global_step": 489561, "epoch": 2914} {"train_loss": -12.439451217651367, "global_step": 489562, "epoch": 2914} {"train_loss": -11.772750854492188, "global_step": 489563, "epoch": 2914} {"train_loss": -12.287776947021484, "global_step": 489564, "epoch": 2914} {"train_loss": -12.161092758178711, "global_step": 489565, "epoch": 2914} {"train_loss": -12.652633666992188, "global_step": 489566, "epoch": 2914} {"train_loss": -11.467278480529785, "global_step": 489567, "epoch": 2914} {"train_loss": -12.511078834533691, "global_step": 489568, "epoch": 2914} {"train_loss": -12.070026397705078, "global_step": 489569, "epoch": 2914} {"train_loss": -12.408203125, "global_step": 489570, "epoch": 2914} {"train_loss": -12.44548511505127, "global_step": 489571, "epoch": 2914} {"train_loss": -12.101490020751953, "global_step": 489572, "epoch": 2914} {"train_loss": -12.522514343261719, "global_step": 489573, "epoch": 2914} {"train_loss": -12.329795837402344, "global_step": 489574, "epoch": 2914} {"train_loss": -12.411680221557617, "global_step": 489575, "epoch": 2914} {"train_loss": -12.644979476928711, "global_step": 489576, "epoch": 2914} {"train_loss": -12.64628791809082, "global_step": 489577, "epoch": 2914} {"train_loss": -12.639440536499023, "global_step": 489578, "epoch": 2914} {"train_loss": -12.412049293518066, "global_step": 489579, "epoch": 2914} {"train_loss": -12.58752727508545, "global_step": 489580, "epoch": 2914} {"train_loss": -12.744436264038086, "global_step": 489581, "epoch": 2914} {"train_loss": -12.649185180664062, "global_step": 489582, "epoch": 2914} {"train_loss": -12.789867401123047, "global_step": 489583, "epoch": 2914} {"train_loss": -12.619422912597656, "global_step": 489584, "epoch": 2914} {"train_loss": -12.62225341796875, "global_step": 489585, "epoch": 2914} {"train_loss": -12.319364547729492, "global_step": 489586, "epoch": 2914} {"train_loss": -12.808874130249023, "global_step": 489587, "epoch": 2914} {"train_loss": -12.570271492004395, "global_step": 489588, "epoch": 2914} {"train_loss": -12.626462936401367, "global_step": 489589, "epoch": 2914} {"train_loss": -12.756409645080566, "global_step": 489590, "epoch": 2914} {"train_loss": -12.665771484375, "global_step": 489591, "epoch": 2914} {"train_loss": -12.514836311340332, "global_step": 489592, "epoch": 2914} {"train_loss": -12.582916259765625, "global_step": 489593, "epoch": 2914} {"train_loss": -12.4058198928833, "global_step": 489594, "epoch": 2914} {"train_loss": -12.192713737487793, "global_step": 489595, "epoch": 2914} {"train_loss": -12.173672676086426, "global_step": 489596, "epoch": 2914} {"train_loss": -12.729050636291504, "global_step": 489597, "epoch": 2914} {"train_loss": -12.175207138061523, "global_step": 489598, "epoch": 2914} {"train_loss": -12.572477340698242, "global_step": 489599, "epoch": 2914} {"train_loss": -12.897099494934082, "global_step": 489600, "epoch": 2914} {"train_loss": -12.616276741027832, "global_step": 489601, "epoch": 2914} {"train_loss": -12.379619598388672, "global_step": 489602, "epoch": 2914} {"train_loss": -12.599392890930176, "global_step": 489603, "epoch": 2914} {"train_loss": -12.539587020874023, "global_step": 489604, "epoch": 2914} {"train_loss": -12.1453218460083, "global_step": 489605, "epoch": 2914} {"train_loss": -12.720185279846191, "global_step": 489606, "epoch": 2914} {"train_loss": -12.01425838470459, "global_step": 489607, "epoch": 2914} {"train_loss": -12.085554122924805, "global_step": 489608, "epoch": 2914} {"train_loss": -12.038192749023438, "global_step": 489609, "epoch": 2914} {"train_loss": -12.073163032531738, "global_step": 489610, "epoch": 2914} {"train_loss": -11.939324378967285, "global_step": 489611, "epoch": 2914} {"train_loss": -12.595065116882324, "global_step": 489612, "epoch": 2914} {"train_loss": -11.882445335388184, "global_step": 489613, "epoch": 2914} {"train_loss": -11.85084342956543, "global_step": 489614, "epoch": 2914} {"train_loss": -12.637166023254395, "global_step": 489615, "epoch": 2914} {"train_loss": -11.228050231933594, "global_step": 489616, "epoch": 2914} {"train_loss": -12.702141761779785, "global_step": 489617, "epoch": 2914} {"train_loss": -12.362956047058105, "global_step": 489618, "epoch": 2914} {"train_loss": -12.255138397216797, "global_step": 489619, "epoch": 2914} {"train_loss": -12.636918067932129, "global_step": 489620, "epoch": 2914} {"train_loss": -12.469640731811523, "global_step": 489621, "epoch": 2914} {"train_loss": -12.45136833190918, "global_step": 489622, "epoch": 2914} {"train_loss": -12.608026504516602, "global_step": 489623, "epoch": 2914} {"train_loss": -11.733612060546875, "global_step": 489624, "epoch": 2914} {"train_loss": -12.442306518554688, "global_step": 489625, "epoch": 2914} {"train_loss": -12.649789810180664, "global_step": 489626, "epoch": 2914} {"train_loss": -12.262557983398438, "global_step": 489627, "epoch": 2914} {"train_loss": -12.285839080810547, "global_step": 489628, "epoch": 2914} {"train_loss": -12.681867599487305, "global_step": 489629, "epoch": 2914} {"train_loss": -12.396273612976074, "global_step": 489630, "epoch": 2914} {"train_loss": -12.517285346984863, "global_step": 489631, "epoch": 2914} {"train_loss": -12.637126922607422, "global_step": 489632, "epoch": 2914} {"train_loss": -12.424184799194336, "global_step": 489633, "epoch": 2914} {"train_loss": -12.498188972473145, "global_step": 489634, "epoch": 2914} {"train_loss": -12.569173812866211, "global_step": 489635, "epoch": 2914} {"train_loss": -12.23142147064209, "global_step": 489636, "epoch": 2914} {"train_loss": -12.350215911865234, "global_step": 489637, "epoch": 2914} {"train_loss": -12.111726760864258, "global_step": 489638, "epoch": 2914} {"train_loss": -11.948055267333984, "global_step": 489639, "epoch": 2914} {"train_loss": -11.931340217590332, "global_step": 489640, "epoch": 2914} {"train_loss": -12.816217422485352, "global_step": 489641, "epoch": 2914} {"train_loss": -11.340707778930664, "global_step": 489642, "epoch": 2914} {"train_loss": -12.416650772094727, "global_step": 489643, "epoch": 2914} {"train_loss": -12.400640487670898, "global_step": 489644, "epoch": 2914} {"train_loss": -12.226398468017578, "global_step": 489645, "epoch": 2914} {"train_loss": -12.931983947753906, "global_step": 489646, "epoch": 2914} {"train_loss": -12.535324096679688, "global_step": 489647, "epoch": 2914} {"train_loss": -12.934511184692383, "global_step": 489648, "epoch": 2914} {"train_loss": -12.593433380126953, "global_step": 489649, "epoch": 2914} {"train_loss": -12.866788864135742, "global_step": 489650, "epoch": 2914} {"train_loss": -12.760526657104492, "global_step": 489651, "epoch": 2914} {"train_loss": -12.699731826782227, "global_step": 489652, "epoch": 2914} {"train_loss": -12.560819625854492, "global_step": 489653, "epoch": 2914} {"train_loss": -12.623784065246582, "global_step": 489654, "epoch": 2914} {"train_loss": -12.204169273376465, "global_step": 489655, "epoch": 2914} {"train_loss": -12.571306228637695, "global_step": 489656, "epoch": 2914} {"train_loss": -12.333395004272461, "global_step": 489657, "epoch": 2914} {"train_loss": -11.904163360595703, "global_step": 489658, "epoch": 2914} {"train_loss": -11.889823913574219, "global_step": 489659, "epoch": 2914} {"train_loss": -12.541631698608398, "global_step": 489660, "epoch": 2914} {"train_loss": -12.112194061279297, "global_step": 489661, "epoch": 2914} {"train_loss": -12.381810188293457, "global_step": 489662, "epoch": 2914} {"train_loss": -12.261911392211914, "global_step": 489663, "epoch": 2914} {"train_loss": -11.797350883483887, "global_step": 489664, "epoch": 2914} {"train_loss": -12.689603805541992, "global_step": 489665, "epoch": 2914} {"train_loss": -12.558235168457031, "global_step": 489666, "epoch": 2914} {"train_loss": -12.184488296508789, "global_step": 489667, "epoch": 2914} {"train_loss": -12.356180191040039, "global_step": 489668, "epoch": 2914} {"train_loss": -12.532907485961914, "global_step": 489669, "epoch": 2914} {"train_loss": -11.65810489654541, "global_step": 489670, "epoch": 2914} {"train_loss": -12.32894515991211, "global_step": 489671, "epoch": 2914} {"train_loss": -11.735725402832031, "global_step": 489672, "epoch": 2914} {"train_loss": -11.9912691116333, "global_step": 489673, "epoch": 2914} {"train_loss": -12.621379852294922, "global_step": 489674, "epoch": 2914} {"train_loss": -12.440631866455078, "global_step": 489675, "epoch": 2914} {"train_loss": -12.084073066711426, "global_step": 489676, "epoch": 2914} {"train_loss": -12.327938079833984, "global_step": 489677, "epoch": 2914} {"train_loss": -12.37408447265625, "global_step": 489678, "epoch": 2914} {"train_loss": -12.380584716796875, "global_step": 489679, "epoch": 2914} {"train_loss": -12.570317268371582, "global_step": 489680, "epoch": 2914} {"train_loss": -12.69375228881836, "global_step": 489681, "epoch": 2914} {"train_loss": -12.572725296020508, "global_step": 489682, "epoch": 2914} {"train_loss": -12.885168075561523, "global_step": 489683, "epoch": 2914} {"train_loss": -12.582785606384277, "global_step": 489684, "epoch": 2914} {"train_loss": -12.569188117980957, "global_step": 489685, "epoch": 2914} {"train_loss": -12.84079360961914, "global_step": 489686, "epoch": 2914} {"train_loss": -12.387402534484863, "global_step": 489687, "epoch": 2914} {"train_loss": -12.537179946899414, "global_step": 489688, "epoch": 2914} {"train_loss": -12.413612365722656, "global_step": 489689, "epoch": 2914} {"train_loss": -12.700020790100098, "global_step": 489690, "epoch": 2914} {"train_loss": -12.862164497375488, "global_step": 489691, "epoch": 2914} {"train_loss": -12.72468090057373, "global_step": 489692, "epoch": 2914} {"train_loss": -12.482540130615234, "global_step": 489693, "epoch": 2914} {"train_loss": -12.970905303955078, "global_step": 489694, "epoch": 2914} {"train_loss": -12.73031234741211, "global_step": 489695, "epoch": 2914} {"train_loss": -12.488940238952637, "global_step": 489696, "epoch": 2914} {"train_loss": -12.627729415893555, "global_step": 489697, "epoch": 2914} {"train_loss": -12.805065155029297, "global_step": 489698, "epoch": 2914} {"train_loss": -12.65675163269043, "global_step": 489699, "epoch": 2914} {"train_loss": -12.63332748413086, "global_step": 489700, "epoch": 2914} {"train_loss": -12.84898567199707, "global_step": 489701, "epoch": 2914} {"train_loss": -12.724153518676758, "global_step": 489702, "epoch": 2914} {"train_loss": -12.657422065734863, "global_step": 489703, "epoch": 2914} {"train_loss": -12.764670372009277, "global_step": 489704, "epoch": 2914} {"train_loss": -12.770432472229004, "global_step": 489705, "epoch": 2914} {"train_loss": -12.595819473266602, "global_step": 489706, "epoch": 2914} {"train_loss": -12.439787864685059, "global_step": 489707, "epoch": 2914} {"train_loss": -12.747576713562012, "global_step": 489708, "epoch": 2914} {"train_loss": -12.727230072021484, "global_step": 489709, "epoch": 2914} {"train_loss": -12.209933280944824, "global_step": 489710, "epoch": 2914} {"train_loss": -12.654823303222656, "global_step": 489711, "epoch": 2914} {"train_loss": -12.883312225341797, "global_step": 489712, "epoch": 2914} {"train_loss": -12.640644073486328, "global_step": 489713, "epoch": 2914} {"train_loss": -12.498226165771484, "global_step": 489714, "epoch": 2914} {"train_loss": -12.6878662109375, "global_step": 489715, "epoch": 2914} {"train_loss": -12.598739624023438, "global_step": 489716, "epoch": 2914} {"train_loss": -11.926837921142578, "global_step": 489717, "epoch": 2914} {"train_loss": -12.410473823547363, "global_step": 489718, "epoch": 2914} {"train_loss": -12.405948071252732, "global_step": 489719, "epoch": 2914, "val_loss": 318522.78125} {"train_loss": -12.538712501525879, "global_step": 489720, "epoch": 2915} {"train_loss": -12.37330150604248, "global_step": 489721, "epoch": 2915} {"train_loss": -12.356884002685547, "global_step": 489722, "epoch": 2915} {"train_loss": -10.922286987304688, "global_step": 489723, "epoch": 2915} {"train_loss": -12.455489158630371, "global_step": 489724, "epoch": 2915} {"train_loss": -10.699789047241211, "global_step": 489725, "epoch": 2915} {"train_loss": -11.550809860229492, "global_step": 489726, "epoch": 2915} {"train_loss": -10.610597610473633, "global_step": 489727, "epoch": 2915} {"train_loss": -10.402106285095215, "global_step": 489728, "epoch": 2915} {"train_loss": -11.783801078796387, "global_step": 489729, "epoch": 2915} {"train_loss": -8.775245666503906, "global_step": 489730, "epoch": 2915} {"train_loss": -9.264693260192871, "global_step": 489731, "epoch": 2915} {"train_loss": -10.27055835723877, "global_step": 489732, "epoch": 2915} {"train_loss": -10.812664031982422, "global_step": 489733, "epoch": 2915} {"train_loss": -10.455854415893555, "global_step": 489734, "epoch": 2915} {"train_loss": -10.71391773223877, "global_step": 489735, "epoch": 2915} {"train_loss": -11.208934783935547, "global_step": 489736, "epoch": 2915} {"train_loss": -9.876245498657227, "global_step": 489737, "epoch": 2915} {"train_loss": -12.0258207321167, "global_step": 489738, "epoch": 2915} {"train_loss": -11.49299430847168, "global_step": 489739, "epoch": 2915} {"train_loss": -10.938847541809082, "global_step": 489740, "epoch": 2915} {"train_loss": -12.159980773925781, "global_step": 489741, "epoch": 2915} {"train_loss": -11.517536163330078, "global_step": 489742, "epoch": 2915} {"train_loss": -11.964655876159668, "global_step": 489743, "epoch": 2915} {"train_loss": -11.630706787109375, "global_step": 489744, "epoch": 2915} {"train_loss": -12.340163230895996, "global_step": 489745, "epoch": 2915} {"train_loss": -12.040773391723633, "global_step": 489746, "epoch": 2915} {"train_loss": -12.193029403686523, "global_step": 489747, "epoch": 2915} {"train_loss": -12.210624694824219, "global_step": 489748, "epoch": 2915} {"train_loss": -12.070345878601074, "global_step": 489749, "epoch": 2915} {"train_loss": -12.474771499633789, "global_step": 489750, "epoch": 2915} {"train_loss": -12.426788330078125, "global_step": 489751, "epoch": 2915} {"train_loss": -12.345728874206543, "global_step": 489752, "epoch": 2915} {"train_loss": -11.900964736938477, "global_step": 489753, "epoch": 2915} {"train_loss": -12.004999160766602, "global_step": 489754, "epoch": 2915} {"train_loss": -12.443778991699219, "global_step": 489755, "epoch": 2915} {"train_loss": -12.381053924560547, "global_step": 489756, "epoch": 2915} {"train_loss": -11.880380630493164, "global_step": 489757, "epoch": 2915} {"train_loss": -12.677423477172852, "global_step": 489758, "epoch": 2915} {"train_loss": -11.579753875732422, "global_step": 489759, "epoch": 2915} {"train_loss": -12.430177688598633, "global_step": 489760, "epoch": 2915} {"train_loss": -12.230892181396484, "global_step": 489761, "epoch": 2915} {"train_loss": -12.465145111083984, "global_step": 489762, "epoch": 2915} {"train_loss": -12.17907428741455, "global_step": 489763, "epoch": 2915} {"train_loss": -12.046972274780273, "global_step": 489764, "epoch": 2915} {"train_loss": -12.460348129272461, "global_step": 489765, "epoch": 2915} {"train_loss": -11.757976531982422, "global_step": 489766, "epoch": 2915} {"train_loss": -12.151416778564453, "global_step": 489767, "epoch": 2915} {"train_loss": -11.758118629455566, "global_step": 489768, "epoch": 2915} {"train_loss": -11.509035110473633, "global_step": 489769, "epoch": 2915} {"train_loss": -11.685653686523438, "global_step": 489770, "epoch": 2915} {"train_loss": -11.140714645385742, "global_step": 489771, "epoch": 2915} {"train_loss": -11.907354354858398, "global_step": 489772, "epoch": 2915} {"train_loss": -11.978723526000977, "global_step": 489773, "epoch": 2915} {"train_loss": -12.41695499420166, "global_step": 489774, "epoch": 2915} {"train_loss": -11.716814994812012, "global_step": 489775, "epoch": 2915} {"train_loss": -12.384552001953125, "global_step": 489776, "epoch": 2915} {"train_loss": -12.24573040008545, "global_step": 489777, "epoch": 2915} {"train_loss": -13.027618408203125, "global_step": 489778, "epoch": 2915} {"train_loss": -11.92750072479248, "global_step": 489779, "epoch": 2915} {"train_loss": -12.278207778930664, "global_step": 489780, "epoch": 2915} {"train_loss": -12.432275772094727, "global_step": 489781, "epoch": 2915} {"train_loss": -11.952337265014648, "global_step": 489782, "epoch": 2915} {"train_loss": -12.550100326538086, "global_step": 489783, "epoch": 2915} {"train_loss": -12.008546829223633, "global_step": 489784, "epoch": 2915} {"train_loss": -12.499451637268066, "global_step": 489785, "epoch": 2915} {"train_loss": -11.94904899597168, "global_step": 489786, "epoch": 2915} {"train_loss": -11.05174446105957, "global_step": 489787, "epoch": 2915} {"train_loss": -11.86562728881836, "global_step": 489788, "epoch": 2915} {"train_loss": -11.422082901000977, "global_step": 489789, "epoch": 2915} {"train_loss": -10.989091873168945, "global_step": 489790, "epoch": 2915} {"train_loss": -11.668035507202148, "global_step": 489791, "epoch": 2915} {"train_loss": -11.086570739746094, "global_step": 489792, "epoch": 2915} {"train_loss": -12.090021133422852, "global_step": 489793, "epoch": 2915} {"train_loss": -11.173882484436035, "global_step": 489794, "epoch": 2915} {"train_loss": -11.437347412109375, "global_step": 489795, "epoch": 2915} {"train_loss": -12.083444595336914, "global_step": 489796, "epoch": 2915} {"train_loss": -10.51049518585205, "global_step": 489797, "epoch": 2915} {"train_loss": -12.464479446411133, "global_step": 489798, "epoch": 2915} {"train_loss": -11.378482818603516, "global_step": 489799, "epoch": 2915} {"train_loss": -11.761343002319336, "global_step": 489800, "epoch": 2915} {"train_loss": -11.934513092041016, "global_step": 489801, "epoch": 2915} {"train_loss": -10.518704414367676, "global_step": 489802, "epoch": 2915} {"train_loss": -12.340927124023438, "global_step": 489803, "epoch": 2915} {"train_loss": -11.793342590332031, "global_step": 489804, "epoch": 2915} {"train_loss": -12.47929573059082, "global_step": 489805, "epoch": 2915} {"train_loss": -12.58224868774414, "global_step": 489806, "epoch": 2915} {"train_loss": -12.197078704833984, "global_step": 489807, "epoch": 2915} {"train_loss": -12.146564483642578, "global_step": 489808, "epoch": 2915} {"train_loss": -12.132147789001465, "global_step": 489809, "epoch": 2915} {"train_loss": -12.736263275146484, "global_step": 489810, "epoch": 2915} {"train_loss": -12.61900520324707, "global_step": 489811, "epoch": 2915} {"train_loss": -12.431190490722656, "global_step": 489812, "epoch": 2915} {"train_loss": -12.331819534301758, "global_step": 489813, "epoch": 2915} {"train_loss": -12.533622741699219, "global_step": 489814, "epoch": 2915} {"train_loss": -12.454824447631836, "global_step": 489815, "epoch": 2915} {"train_loss": -12.797048568725586, "global_step": 489816, "epoch": 2915} {"train_loss": -12.65424919128418, "global_step": 489817, "epoch": 2915} {"train_loss": -12.653146743774414, "global_step": 489818, "epoch": 2915} {"train_loss": -12.342009544372559, "global_step": 489819, "epoch": 2915} {"train_loss": -12.577230453491211, "global_step": 489820, "epoch": 2915} {"train_loss": -12.519937515258789, "global_step": 489821, "epoch": 2915} {"train_loss": -12.374895095825195, "global_step": 489822, "epoch": 2915} {"train_loss": -12.65513801574707, "global_step": 489823, "epoch": 2915} {"train_loss": -12.344749450683594, "global_step": 489824, "epoch": 2915} {"train_loss": -12.544933319091797, "global_step": 489825, "epoch": 2915} {"train_loss": -12.718828201293945, "global_step": 489826, "epoch": 2915} {"train_loss": -12.657232284545898, "global_step": 489827, "epoch": 2915} {"train_loss": -12.852294921875, "global_step": 489828, "epoch": 2915} {"train_loss": -12.639568328857422, "global_step": 489829, "epoch": 2915} {"train_loss": -12.889200210571289, "global_step": 489830, "epoch": 2915} {"train_loss": -12.469719886779785, "global_step": 489831, "epoch": 2915} {"train_loss": -12.725502014160156, "global_step": 489832, "epoch": 2915} {"train_loss": -12.545588493347168, "global_step": 489833, "epoch": 2915} {"train_loss": -12.8794584274292, "global_step": 489834, "epoch": 2915} {"train_loss": -12.65092658996582, "global_step": 489835, "epoch": 2915} {"train_loss": -12.978759765625, "global_step": 489836, "epoch": 2915} {"train_loss": -12.750085830688477, "global_step": 489837, "epoch": 2915} {"train_loss": -12.797266960144043, "global_step": 489838, "epoch": 2915} {"train_loss": -12.885457992553711, "global_step": 489839, "epoch": 2915} {"train_loss": -12.719932556152344, "global_step": 489840, "epoch": 2915} {"train_loss": -12.745563507080078, "global_step": 489841, "epoch": 2915} {"train_loss": -12.813766479492188, "global_step": 489842, "epoch": 2915} {"train_loss": -12.669028282165527, "global_step": 489843, "epoch": 2915} {"train_loss": -12.714759826660156, "global_step": 489844, "epoch": 2915} {"train_loss": -12.758359909057617, "global_step": 489845, "epoch": 2915} {"train_loss": -12.876001358032227, "global_step": 489846, "epoch": 2915} {"train_loss": -12.7897310256958, "global_step": 489847, "epoch": 2915} {"train_loss": -12.995083808898926, "global_step": 489848, "epoch": 2915} {"train_loss": -12.770142555236816, "global_step": 489849, "epoch": 2915} {"train_loss": -12.999677658081055, "global_step": 489850, "epoch": 2915} {"train_loss": -12.969038963317871, "global_step": 489851, "epoch": 2915} {"train_loss": -13.076276779174805, "global_step": 489852, "epoch": 2915} {"train_loss": -13.037984848022461, "global_step": 489853, "epoch": 2915} {"train_loss": -13.012722969055176, "global_step": 489854, "epoch": 2915} {"train_loss": -12.84499740600586, "global_step": 489855, "epoch": 2915} {"train_loss": -13.04372787475586, "global_step": 489856, "epoch": 2915} {"train_loss": -12.864574432373047, "global_step": 489857, "epoch": 2915} {"train_loss": -13.090043067932129, "global_step": 489858, "epoch": 2915} {"train_loss": -12.659098625183105, "global_step": 489859, "epoch": 2915} {"train_loss": -12.854613304138184, "global_step": 489860, "epoch": 2915} {"train_loss": -13.124479293823242, "global_step": 489861, "epoch": 2915} {"train_loss": -13.000368118286133, "global_step": 489862, "epoch": 2915} {"train_loss": -12.771852493286133, "global_step": 489863, "epoch": 2915} {"train_loss": -12.969886779785156, "global_step": 489864, "epoch": 2915} {"train_loss": -13.068556785583496, "global_step": 489865, "epoch": 2915} {"train_loss": -13.158472061157227, "global_step": 489866, "epoch": 2915} {"train_loss": -12.876989364624023, "global_step": 489867, "epoch": 2915} {"train_loss": -12.946382522583008, "global_step": 489868, "epoch": 2915} {"train_loss": -12.898344039916992, "global_step": 489869, "epoch": 2915} {"train_loss": -13.13795280456543, "global_step": 489870, "epoch": 2915} {"train_loss": -12.973976135253906, "global_step": 489871, "epoch": 2915} {"train_loss": -12.888465881347656, "global_step": 489872, "epoch": 2915} {"train_loss": -12.881867408752441, "global_step": 489873, "epoch": 2915} {"train_loss": -12.881780624389648, "global_step": 489874, "epoch": 2915} {"train_loss": -13.076322555541992, "global_step": 489875, "epoch": 2915} {"train_loss": -12.768510818481445, "global_step": 489876, "epoch": 2915} {"train_loss": -12.592425346374512, "global_step": 489877, "epoch": 2915} {"train_loss": -12.20886516571045, "global_step": 489878, "epoch": 2915} {"train_loss": -12.74416446685791, "global_step": 489879, "epoch": 2915} {"train_loss": -11.76534652709961, "global_step": 489880, "epoch": 2915} {"train_loss": -12.066035270690918, "global_step": 489881, "epoch": 2915} {"train_loss": -12.30976676940918, "global_step": 489882, "epoch": 2915} {"train_loss": -11.61990737915039, "global_step": 489883, "epoch": 2915} {"train_loss": -11.478533744812012, "global_step": 489884, "epoch": 2915} {"train_loss": -12.415245056152344, "global_step": 489885, "epoch": 2915} {"train_loss": -12.363658905029297, "global_step": 489886, "epoch": 2915} {"train_loss": -12.198041955629984, "global_step": 489887, "epoch": 2915, "val_loss": 318298.625, "train_action_mse_error": 1.1838586330413818} {"train_loss": -12.256282806396484, "global_step": 489888, "epoch": 2916} {"train_loss": -11.978581428527832, "global_step": 489889, "epoch": 2916} {"train_loss": -11.601999282836914, "global_step": 489890, "epoch": 2916} {"train_loss": -11.900527000427246, "global_step": 489891, "epoch": 2916} {"train_loss": -10.65269947052002, "global_step": 489892, "epoch": 2916} {"train_loss": -10.887263298034668, "global_step": 489893, "epoch": 2916} {"train_loss": -12.475085258483887, "global_step": 489894, "epoch": 2916} {"train_loss": -10.96755313873291, "global_step": 489895, "epoch": 2916} {"train_loss": -12.337770462036133, "global_step": 489896, "epoch": 2916} {"train_loss": -10.731403350830078, "global_step": 489897, "epoch": 2916} {"train_loss": -12.12442398071289, "global_step": 489898, "epoch": 2916} {"train_loss": -11.028976440429688, "global_step": 489899, "epoch": 2916} {"train_loss": -10.5318021774292, "global_step": 489900, "epoch": 2916} {"train_loss": -12.348224639892578, "global_step": 489901, "epoch": 2916} {"train_loss": -10.173456192016602, "global_step": 489902, "epoch": 2916} {"train_loss": -10.214651107788086, "global_step": 489903, "epoch": 2916} {"train_loss": -11.551712036132812, "global_step": 489904, "epoch": 2916} {"train_loss": -9.02331256866455, "global_step": 489905, "epoch": 2916} {"train_loss": -7.440031051635742, "global_step": 489906, "epoch": 2916} {"train_loss": -7.784097671508789, "global_step": 489907, "epoch": 2916} {"train_loss": -8.121570587158203, "global_step": 489908, "epoch": 2916} {"train_loss": -7.531190872192383, "global_step": 489909, "epoch": 2916} {"train_loss": -8.018881797790527, "global_step": 489910, "epoch": 2916} {"train_loss": -8.212564468383789, "global_step": 489911, "epoch": 2916} {"train_loss": -8.855449676513672, "global_step": 489912, "epoch": 2916} {"train_loss": -8.67304801940918, "global_step": 489913, "epoch": 2916} {"train_loss": -8.628973960876465, "global_step": 489914, "epoch": 2916} {"train_loss": -8.711119651794434, "global_step": 489915, "epoch": 2916} {"train_loss": -8.157437324523926, "global_step": 489916, "epoch": 2916} {"train_loss": -8.137516021728516, "global_step": 489917, "epoch": 2916} {"train_loss": -9.36893367767334, "global_step": 489918, "epoch": 2916} {"train_loss": -8.359447479248047, "global_step": 489919, "epoch": 2916} {"train_loss": -8.713508605957031, "global_step": 489920, "epoch": 2916} {"train_loss": -9.139183044433594, "global_step": 489921, "epoch": 2916} {"train_loss": -9.142068862915039, "global_step": 489922, "epoch": 2916} {"train_loss": -9.178333282470703, "global_step": 489923, "epoch": 2916} {"train_loss": -9.333932876586914, "global_step": 489924, "epoch": 2916} {"train_loss": -9.756949424743652, "global_step": 489925, "epoch": 2916} {"train_loss": -10.046178817749023, "global_step": 489926, "epoch": 2916} {"train_loss": -10.460103988647461, "global_step": 489927, "epoch": 2916} {"train_loss": -10.879295349121094, "global_step": 489928, "epoch": 2916} {"train_loss": -10.340235710144043, "global_step": 489929, "epoch": 2916} {"train_loss": -11.24040412902832, "global_step": 489930, "epoch": 2916} {"train_loss": -10.83028793334961, "global_step": 489931, "epoch": 2916} {"train_loss": -10.948325157165527, "global_step": 489932, "epoch": 2916} {"train_loss": -10.914637565612793, "global_step": 489933, "epoch": 2916} {"train_loss": -11.212244987487793, "global_step": 489934, "epoch": 2916} {"train_loss": -11.616000175476074, "global_step": 489935, "epoch": 2916} {"train_loss": -11.674132347106934, "global_step": 489936, "epoch": 2916} {"train_loss": -11.509809494018555, "global_step": 489937, "epoch": 2916} {"train_loss": -11.359479904174805, "global_step": 489938, "epoch": 2916} {"train_loss": -11.559822082519531, "global_step": 489939, "epoch": 2916} {"train_loss": -11.799592971801758, "global_step": 489940, "epoch": 2916} {"train_loss": -11.323049545288086, "global_step": 489941, "epoch": 2916} {"train_loss": -11.790576934814453, "global_step": 489942, "epoch": 2916} {"train_loss": -11.717056274414062, "global_step": 489943, "epoch": 2916} {"train_loss": -11.73707103729248, "global_step": 489944, "epoch": 2916} {"train_loss": -12.168233871459961, "global_step": 489945, "epoch": 2916} {"train_loss": -11.934219360351562, "global_step": 489946, "epoch": 2916} {"train_loss": -11.999099731445312, "global_step": 489947, "epoch": 2916} {"train_loss": -11.887947082519531, "global_step": 489948, "epoch": 2916} {"train_loss": -11.752008438110352, "global_step": 489949, "epoch": 2916} {"train_loss": -12.018962860107422, "global_step": 489950, "epoch": 2916} {"train_loss": -11.797613143920898, "global_step": 489951, "epoch": 2916} {"train_loss": -12.174389839172363, "global_step": 489952, "epoch": 2916} {"train_loss": -11.53768539428711, "global_step": 489953, "epoch": 2916} {"train_loss": -11.735490798950195, "global_step": 489954, "epoch": 2916} {"train_loss": -11.618202209472656, "global_step": 489955, "epoch": 2916} {"train_loss": -11.630895614624023, "global_step": 489956, "epoch": 2916} {"train_loss": -11.846054077148438, "global_step": 489957, "epoch": 2916} {"train_loss": -11.9710693359375, "global_step": 489958, "epoch": 2916} {"train_loss": -12.108396530151367, "global_step": 489959, "epoch": 2916} {"train_loss": -12.121297836303711, "global_step": 489960, "epoch": 2916} {"train_loss": -11.966955184936523, "global_step": 489961, "epoch": 2916} {"train_loss": -12.006811141967773, "global_step": 489962, "epoch": 2916} {"train_loss": -12.130350112915039, "global_step": 489963, "epoch": 2916} {"train_loss": -12.04810905456543, "global_step": 489964, "epoch": 2916} {"train_loss": -12.421751976013184, "global_step": 489965, "epoch": 2916} {"train_loss": -12.209068298339844, "global_step": 489966, "epoch": 2916} {"train_loss": -12.32749080657959, "global_step": 489967, "epoch": 2916} {"train_loss": -12.202957153320312, "global_step": 489968, "epoch": 2916} {"train_loss": -12.418109893798828, "global_step": 489969, "epoch": 2916} {"train_loss": -12.350290298461914, "global_step": 489970, "epoch": 2916} {"train_loss": -12.364750862121582, "global_step": 489971, "epoch": 2916} {"train_loss": -12.713459014892578, "global_step": 489972, "epoch": 2916} {"train_loss": -12.47095012664795, "global_step": 489973, "epoch": 2916} {"train_loss": -12.527792930603027, "global_step": 489974, "epoch": 2916} {"train_loss": -12.520275115966797, "global_step": 489975, "epoch": 2916} {"train_loss": -12.609418869018555, "global_step": 489976, "epoch": 2916} {"train_loss": -12.740501403808594, "global_step": 489977, "epoch": 2916} {"train_loss": -12.480367660522461, "global_step": 489978, "epoch": 2916} {"train_loss": -12.577250480651855, "global_step": 489979, "epoch": 2916} {"train_loss": -12.379121780395508, "global_step": 489980, "epoch": 2916} {"train_loss": -12.914701461791992, "global_step": 489981, "epoch": 2916} {"train_loss": -12.370555877685547, "global_step": 489982, "epoch": 2916} {"train_loss": -12.608272552490234, "global_step": 489983, "epoch": 2916} {"train_loss": -12.781854629516602, "global_step": 489984, "epoch": 2916} {"train_loss": -12.525144577026367, "global_step": 489985, "epoch": 2916} {"train_loss": -12.740931510925293, "global_step": 489986, "epoch": 2916} {"train_loss": -12.66014289855957, "global_step": 489987, "epoch": 2916} {"train_loss": -12.561488151550293, "global_step": 489988, "epoch": 2916} {"train_loss": -12.790531158447266, "global_step": 489989, "epoch": 2916} {"train_loss": -12.559623718261719, "global_step": 489990, "epoch": 2916} {"train_loss": -12.64803409576416, "global_step": 489991, "epoch": 2916} {"train_loss": -12.795928955078125, "global_step": 489992, "epoch": 2916} {"train_loss": -12.824760437011719, "global_step": 489993, "epoch": 2916} {"train_loss": -12.660271644592285, "global_step": 489994, "epoch": 2916} {"train_loss": -12.989957809448242, "global_step": 489995, "epoch": 2916} {"train_loss": -12.81785774230957, "global_step": 489996, "epoch": 2916} {"train_loss": -12.832969665527344, "global_step": 489997, "epoch": 2916} {"train_loss": -12.754035949707031, "global_step": 489998, "epoch": 2916} {"train_loss": -12.756497383117676, "global_step": 489999, "epoch": 2916} {"train_loss": -12.95602035522461, "global_step": 490000, "epoch": 2916} {"train_loss": -12.666064262390137, "global_step": 490001, "epoch": 2916} {"train_loss": -12.777443885803223, "global_step": 490002, "epoch": 2916} {"train_loss": -12.813274383544922, "global_step": 490003, "epoch": 2916} {"train_loss": -12.872055053710938, "global_step": 490004, "epoch": 2916} {"train_loss": -12.766493797302246, "global_step": 490005, "epoch": 2916} {"train_loss": -12.729646682739258, "global_step": 490006, "epoch": 2916} {"train_loss": -12.793750762939453, "global_step": 490007, "epoch": 2916} {"train_loss": -12.672897338867188, "global_step": 490008, "epoch": 2916} {"train_loss": -12.988364219665527, "global_step": 490009, "epoch": 2916} {"train_loss": -12.687677383422852, "global_step": 490010, "epoch": 2916} {"train_loss": -12.738922119140625, "global_step": 490011, "epoch": 2916} {"train_loss": -12.705301284790039, "global_step": 490012, "epoch": 2916} {"train_loss": -12.93703556060791, "global_step": 490013, "epoch": 2916} {"train_loss": -12.671208381652832, "global_step": 490014, "epoch": 2916} {"train_loss": -12.982933044433594, "global_step": 490015, "epoch": 2916} {"train_loss": -12.693986892700195, "global_step": 490016, "epoch": 2916} {"train_loss": -12.770994186401367, "global_step": 490017, "epoch": 2916} {"train_loss": -12.766683578491211, "global_step": 490018, "epoch": 2916} {"train_loss": -12.678600311279297, "global_step": 490019, "epoch": 2916} {"train_loss": -12.884173393249512, "global_step": 490020, "epoch": 2916} {"train_loss": -12.733349800109863, "global_step": 490021, "epoch": 2916} {"train_loss": -13.027915000915527, "global_step": 490022, "epoch": 2916} {"train_loss": -12.455456733703613, "global_step": 490023, "epoch": 2916} {"train_loss": -12.833066940307617, "global_step": 490024, "epoch": 2916} {"train_loss": -12.913416862487793, "global_step": 490025, "epoch": 2916} {"train_loss": -13.103891372680664, "global_step": 490026, "epoch": 2916} {"train_loss": -12.905817031860352, "global_step": 490027, "epoch": 2916} {"train_loss": -12.79452896118164, "global_step": 490028, "epoch": 2916} {"train_loss": -12.977263450622559, "global_step": 490029, "epoch": 2916} {"train_loss": -12.75516128540039, "global_step": 490030, "epoch": 2916} {"train_loss": -12.500584602355957, "global_step": 490031, "epoch": 2916} {"train_loss": -12.444510459899902, "global_step": 490032, "epoch": 2916} {"train_loss": -12.57882308959961, "global_step": 490033, "epoch": 2916} {"train_loss": -12.691634178161621, "global_step": 490034, "epoch": 2916} {"train_loss": -12.739887237548828, "global_step": 490035, "epoch": 2916} {"train_loss": -12.812000274658203, "global_step": 490036, "epoch": 2916} {"train_loss": -12.701240539550781, "global_step": 490037, "epoch": 2916} {"train_loss": -12.783512115478516, "global_step": 490038, "epoch": 2916} {"train_loss": -12.776571273803711, "global_step": 490039, "epoch": 2916} {"train_loss": -12.875200271606445, "global_step": 490040, "epoch": 2916} {"train_loss": -12.630849838256836, "global_step": 490041, "epoch": 2916} {"train_loss": -12.535797119140625, "global_step": 490042, "epoch": 2916} {"train_loss": -12.66931438446045, "global_step": 490043, "epoch": 2916} {"train_loss": -12.911635398864746, "global_step": 490044, "epoch": 2916} {"train_loss": -12.610563278198242, "global_step": 490045, "epoch": 2916} {"train_loss": -12.581958770751953, "global_step": 490046, "epoch": 2916} {"train_loss": -12.973901748657227, "global_step": 490047, "epoch": 2916} {"train_loss": -13.158346176147461, "global_step": 490048, "epoch": 2916} {"train_loss": -12.938159942626953, "global_step": 490049, "epoch": 2916} {"train_loss": -12.556391716003418, "global_step": 490050, "epoch": 2916} {"train_loss": -12.828166007995605, "global_step": 490051, "epoch": 2916} {"train_loss": -12.789137840270996, "global_step": 490052, "epoch": 2916} {"train_loss": -13.024955749511719, "global_step": 490053, "epoch": 2916} {"train_loss": -13.045319557189941, "global_step": 490054, "epoch": 2916} {"train_loss": -11.800164500872294, "global_step": 490055, "epoch": 2916, "val_loss": 315654.28125} {"train_loss": -12.125438690185547, "global_step": 490056, "epoch": 2917} {"train_loss": -12.902273178100586, "global_step": 490057, "epoch": 2917} {"train_loss": -12.605630874633789, "global_step": 490058, "epoch": 2917} {"train_loss": -13.032121658325195, "global_step": 490059, "epoch": 2917} {"train_loss": -13.127721786499023, "global_step": 490060, "epoch": 2917} {"train_loss": -12.67844295501709, "global_step": 490061, "epoch": 2917} {"train_loss": -12.591012954711914, "global_step": 490062, "epoch": 2917} {"train_loss": -12.448707580566406, "global_step": 490063, "epoch": 2917} {"train_loss": -12.857220649719238, "global_step": 490064, "epoch": 2917} {"train_loss": -12.720890045166016, "global_step": 490065, "epoch": 2917} {"train_loss": -12.247262954711914, "global_step": 490066, "epoch": 2917} {"train_loss": -11.632972717285156, "global_step": 490067, "epoch": 2917} {"train_loss": -11.350977897644043, "global_step": 490068, "epoch": 2917} {"train_loss": -12.15484619140625, "global_step": 490069, "epoch": 2917} {"train_loss": -12.683064460754395, "global_step": 490070, "epoch": 2917} {"train_loss": -11.92381477355957, "global_step": 490071, "epoch": 2917} {"train_loss": -12.652076721191406, "global_step": 490072, "epoch": 2917} {"train_loss": -11.207341194152832, "global_step": 490073, "epoch": 2917} {"train_loss": -12.304930686950684, "global_step": 490074, "epoch": 2917} {"train_loss": -11.210195541381836, "global_step": 490075, "epoch": 2917} {"train_loss": -12.130607604980469, "global_step": 490076, "epoch": 2917} {"train_loss": -11.816431045532227, "global_step": 490077, "epoch": 2917} {"train_loss": -12.613390922546387, "global_step": 490078, "epoch": 2917} {"train_loss": -10.830944061279297, "global_step": 490079, "epoch": 2917} {"train_loss": -11.083667755126953, "global_step": 490080, "epoch": 2917} {"train_loss": -11.313735008239746, "global_step": 490081, "epoch": 2917} {"train_loss": -11.146800994873047, "global_step": 490082, "epoch": 2917} {"train_loss": -11.506357192993164, "global_step": 490083, "epoch": 2917} {"train_loss": -12.047557830810547, "global_step": 490084, "epoch": 2917} {"train_loss": -11.289676666259766, "global_step": 490085, "epoch": 2917} {"train_loss": -11.842506408691406, "global_step": 490086, "epoch": 2917} {"train_loss": -11.933348655700684, "global_step": 490087, "epoch": 2917} {"train_loss": -11.564414978027344, "global_step": 490088, "epoch": 2917} {"train_loss": -11.788908004760742, "global_step": 490089, "epoch": 2917} {"train_loss": -11.648681640625, "global_step": 490090, "epoch": 2917} {"train_loss": -11.973587036132812, "global_step": 490091, "epoch": 2917} {"train_loss": -11.25526237487793, "global_step": 490092, "epoch": 2917} {"train_loss": -11.923213958740234, "global_step": 490093, "epoch": 2917} {"train_loss": -11.499402046203613, "global_step": 490094, "epoch": 2917} {"train_loss": -11.423787117004395, "global_step": 490095, "epoch": 2917} {"train_loss": -12.11440372467041, "global_step": 490096, "epoch": 2917} {"train_loss": -11.732361793518066, "global_step": 490097, "epoch": 2917} {"train_loss": -11.907074928283691, "global_step": 490098, "epoch": 2917} {"train_loss": -10.932652473449707, "global_step": 490099, "epoch": 2917} {"train_loss": -11.06263542175293, "global_step": 490100, "epoch": 2917} {"train_loss": -12.254438400268555, "global_step": 490101, "epoch": 2917} {"train_loss": -10.843815803527832, "global_step": 490102, "epoch": 2917} {"train_loss": -12.359382629394531, "global_step": 490103, "epoch": 2917} {"train_loss": -12.083860397338867, "global_step": 490104, "epoch": 2917} {"train_loss": -11.081228256225586, "global_step": 490105, "epoch": 2917} {"train_loss": -11.708505630493164, "global_step": 490106, "epoch": 2917} {"train_loss": -10.793403625488281, "global_step": 490107, "epoch": 2917} {"train_loss": -11.123661994934082, "global_step": 490108, "epoch": 2917} {"train_loss": -10.724827766418457, "global_step": 490109, "epoch": 2917} {"train_loss": -12.473753929138184, "global_step": 490110, "epoch": 2917} {"train_loss": -11.40005874633789, "global_step": 490111, "epoch": 2917} {"train_loss": -11.955284118652344, "global_step": 490112, "epoch": 2917} {"train_loss": -12.086112976074219, "global_step": 490113, "epoch": 2917} {"train_loss": -11.908979415893555, "global_step": 490114, "epoch": 2917} {"train_loss": -11.992298126220703, "global_step": 490115, "epoch": 2917} {"train_loss": -12.333160400390625, "global_step": 490116, "epoch": 2917} {"train_loss": -11.105850219726562, "global_step": 490117, "epoch": 2917} {"train_loss": -11.791779518127441, "global_step": 490118, "epoch": 2917} {"train_loss": -11.592891693115234, "global_step": 490119, "epoch": 2917} {"train_loss": -11.678008079528809, "global_step": 490120, "epoch": 2917} {"train_loss": -12.089499473571777, "global_step": 490121, "epoch": 2917} {"train_loss": -11.845011711120605, "global_step": 490122, "epoch": 2917} {"train_loss": -12.252201080322266, "global_step": 490123, "epoch": 2917} {"train_loss": -11.666557312011719, "global_step": 490124, "epoch": 2917} {"train_loss": -12.105295181274414, "global_step": 490125, "epoch": 2917} {"train_loss": -12.230039596557617, "global_step": 490126, "epoch": 2917} {"train_loss": -12.38450813293457, "global_step": 490127, "epoch": 2917} {"train_loss": -11.946392059326172, "global_step": 490128, "epoch": 2917} {"train_loss": -12.219026565551758, "global_step": 490129, "epoch": 2917} {"train_loss": -12.649750709533691, "global_step": 490130, "epoch": 2917} {"train_loss": -12.031973838806152, "global_step": 490131, "epoch": 2917} {"train_loss": -12.463471412658691, "global_step": 490132, "epoch": 2917} {"train_loss": -12.390705108642578, "global_step": 490133, "epoch": 2917} {"train_loss": -12.830392837524414, "global_step": 490134, "epoch": 2917} {"train_loss": -12.337459564208984, "global_step": 490135, "epoch": 2917} {"train_loss": -12.573493957519531, "global_step": 490136, "epoch": 2917} {"train_loss": -12.548389434814453, "global_step": 490137, "epoch": 2917} {"train_loss": -12.612860679626465, "global_step": 490138, "epoch": 2917} {"train_loss": -12.691693305969238, "global_step": 490139, "epoch": 2917} {"train_loss": -12.698050498962402, "global_step": 490140, "epoch": 2917} {"train_loss": -12.5863037109375, "global_step": 490141, "epoch": 2917} {"train_loss": -12.549399375915527, "global_step": 490142, "epoch": 2917} {"train_loss": -12.846855163574219, "global_step": 490143, "epoch": 2917} {"train_loss": -12.782347679138184, "global_step": 490144, "epoch": 2917} {"train_loss": -12.585336685180664, "global_step": 490145, "epoch": 2917} {"train_loss": -12.800058364868164, "global_step": 490146, "epoch": 2917} {"train_loss": -12.517406463623047, "global_step": 490147, "epoch": 2917} {"train_loss": -12.853702545166016, "global_step": 490148, "epoch": 2917} {"train_loss": -12.52943229675293, "global_step": 490149, "epoch": 2917} {"train_loss": -12.53963851928711, "global_step": 490150, "epoch": 2917} {"train_loss": -12.662775039672852, "global_step": 490151, "epoch": 2917} {"train_loss": -12.89285659790039, "global_step": 490152, "epoch": 2917} {"train_loss": -12.559734344482422, "global_step": 490153, "epoch": 2917} {"train_loss": -12.844552993774414, "global_step": 490154, "epoch": 2917} {"train_loss": -12.62388801574707, "global_step": 490155, "epoch": 2917} {"train_loss": -12.914627075195312, "global_step": 490156, "epoch": 2917} {"train_loss": -12.885774612426758, "global_step": 490157, "epoch": 2917} {"train_loss": -12.802521705627441, "global_step": 490158, "epoch": 2917} {"train_loss": -12.897308349609375, "global_step": 490159, "epoch": 2917} {"train_loss": -12.69749927520752, "global_step": 490160, "epoch": 2917} {"train_loss": -12.672554016113281, "global_step": 490161, "epoch": 2917} {"train_loss": -12.659828186035156, "global_step": 490162, "epoch": 2917} {"train_loss": -12.769420623779297, "global_step": 490163, "epoch": 2917} {"train_loss": -12.95038890838623, "global_step": 490164, "epoch": 2917} {"train_loss": -12.896797180175781, "global_step": 490165, "epoch": 2917} {"train_loss": -12.592267990112305, "global_step": 490166, "epoch": 2917} {"train_loss": -12.824831008911133, "global_step": 490167, "epoch": 2917} {"train_loss": -12.860727310180664, "global_step": 490168, "epoch": 2917} {"train_loss": -12.646553993225098, "global_step": 490169, "epoch": 2917} {"train_loss": -13.061164855957031, "global_step": 490170, "epoch": 2917} {"train_loss": -12.679304122924805, "global_step": 490171, "epoch": 2917} {"train_loss": -12.441043853759766, "global_step": 490172, "epoch": 2917} {"train_loss": -12.94722843170166, "global_step": 490173, "epoch": 2917} {"train_loss": -12.81013011932373, "global_step": 490174, "epoch": 2917} {"train_loss": -12.417531967163086, "global_step": 490175, "epoch": 2917} {"train_loss": -12.695780754089355, "global_step": 490176, "epoch": 2917} {"train_loss": -12.72966194152832, "global_step": 490177, "epoch": 2917} {"train_loss": -12.67180061340332, "global_step": 490178, "epoch": 2917} {"train_loss": -12.119549751281738, "global_step": 490179, "epoch": 2917} {"train_loss": -12.845857620239258, "global_step": 490180, "epoch": 2917} {"train_loss": -12.3251953125, "global_step": 490181, "epoch": 2917} {"train_loss": -12.473437309265137, "global_step": 490182, "epoch": 2917} {"train_loss": -12.084606170654297, "global_step": 490183, "epoch": 2917} {"train_loss": -11.041421890258789, "global_step": 490184, "epoch": 2917} {"train_loss": -11.425403594970703, "global_step": 490185, "epoch": 2917} {"train_loss": -11.559083938598633, "global_step": 490186, "epoch": 2917} {"train_loss": -10.991795539855957, "global_step": 490187, "epoch": 2917} {"train_loss": -10.633956909179688, "global_step": 490188, "epoch": 2917} {"train_loss": -11.270943641662598, "global_step": 490189, "epoch": 2917} {"train_loss": -10.331487655639648, "global_step": 490190, "epoch": 2917} {"train_loss": -12.031253814697266, "global_step": 490191, "epoch": 2917} {"train_loss": -9.667362213134766, "global_step": 490192, "epoch": 2917} {"train_loss": -9.903947830200195, "global_step": 490193, "epoch": 2917} {"train_loss": -9.344853401184082, "global_step": 490194, "epoch": 2917} {"train_loss": -10.647567749023438, "global_step": 490195, "epoch": 2917} {"train_loss": -10.412185668945312, "global_step": 490196, "epoch": 2917} {"train_loss": -9.753767967224121, "global_step": 490197, "epoch": 2917} {"train_loss": -10.189774513244629, "global_step": 490198, "epoch": 2917} {"train_loss": -10.478583335876465, "global_step": 490199, "epoch": 2917} {"train_loss": -10.502793312072754, "global_step": 490200, "epoch": 2917} {"train_loss": -8.96125316619873, "global_step": 490201, "epoch": 2917} {"train_loss": -9.732386589050293, "global_step": 490202, "epoch": 2917} {"train_loss": -11.520386695861816, "global_step": 490203, "epoch": 2917} {"train_loss": -9.38998031616211, "global_step": 490204, "epoch": 2917} {"train_loss": -9.847148895263672, "global_step": 490205, "epoch": 2917} {"train_loss": -10.738798141479492, "global_step": 490206, "epoch": 2917} {"train_loss": -11.43721866607666, "global_step": 490207, "epoch": 2917} {"train_loss": -11.190106391906738, "global_step": 490208, "epoch": 2917} {"train_loss": -11.827983856201172, "global_step": 490209, "epoch": 2917} {"train_loss": -11.878164291381836, "global_step": 490210, "epoch": 2917} {"train_loss": -11.92719841003418, "global_step": 490211, "epoch": 2917} {"train_loss": -11.517742156982422, "global_step": 490212, "epoch": 2917} {"train_loss": -11.498006820678711, "global_step": 490213, "epoch": 2917} {"train_loss": -12.01906681060791, "global_step": 490214, "epoch": 2917} {"train_loss": -11.976181030273438, "global_step": 490215, "epoch": 2917} {"train_loss": -11.86931324005127, "global_step": 490216, "epoch": 2917} {"train_loss": -12.186447143554688, "global_step": 490217, "epoch": 2917} {"train_loss": -12.018555641174316, "global_step": 490218, "epoch": 2917} {"train_loss": -12.424910545349121, "global_step": 490219, "epoch": 2917} {"train_loss": -11.970230102539062, "global_step": 490220, "epoch": 2917} {"train_loss": -12.502845764160156, "global_step": 490221, "epoch": 2917} {"train_loss": -12.059418678283691, "global_step": 490222, "epoch": 2917} {"train_loss": -11.935565942809696, "global_step": 490223, "epoch": 2917, "val_loss": 310522.6875} {"train_loss": -12.138748168945312, "global_step": 490224, "epoch": 2918} {"train_loss": -12.128787994384766, "global_step": 490225, "epoch": 2918} {"train_loss": -12.341596603393555, "global_step": 490226, "epoch": 2918} {"train_loss": -12.092540740966797, "global_step": 490227, "epoch": 2918} {"train_loss": -11.940715789794922, "global_step": 490228, "epoch": 2918} {"train_loss": -12.398560523986816, "global_step": 490229, "epoch": 2918} {"train_loss": -12.234588623046875, "global_step": 490230, "epoch": 2918} {"train_loss": -12.576082229614258, "global_step": 490231, "epoch": 2918} {"train_loss": -12.507973670959473, "global_step": 490232, "epoch": 2918} {"train_loss": -12.362335205078125, "global_step": 490233, "epoch": 2918} {"train_loss": -12.263943672180176, "global_step": 490234, "epoch": 2918} {"train_loss": -12.184060096740723, "global_step": 490235, "epoch": 2918} {"train_loss": -12.626150131225586, "global_step": 490236, "epoch": 2918} {"train_loss": -12.319985389709473, "global_step": 490237, "epoch": 2918} {"train_loss": -12.428889274597168, "global_step": 490238, "epoch": 2918} {"train_loss": -11.84914493560791, "global_step": 490239, "epoch": 2918} {"train_loss": -12.639527320861816, "global_step": 490240, "epoch": 2918} {"train_loss": -12.245330810546875, "global_step": 490241, "epoch": 2918} {"train_loss": -12.603405952453613, "global_step": 490242, "epoch": 2918} {"train_loss": -12.367593765258789, "global_step": 490243, "epoch": 2918} {"train_loss": -12.494806289672852, "global_step": 490244, "epoch": 2918} {"train_loss": -12.640401840209961, "global_step": 490245, "epoch": 2918} {"train_loss": -12.592287063598633, "global_step": 490246, "epoch": 2918} {"train_loss": -12.862773895263672, "global_step": 490247, "epoch": 2918} {"train_loss": -12.60682201385498, "global_step": 490248, "epoch": 2918} {"train_loss": -12.503284454345703, "global_step": 490249, "epoch": 2918} {"train_loss": -12.777101516723633, "global_step": 490250, "epoch": 2918} {"train_loss": -12.533380508422852, "global_step": 490251, "epoch": 2918} {"train_loss": -12.687030792236328, "global_step": 490252, "epoch": 2918} {"train_loss": -12.369547843933105, "global_step": 490253, "epoch": 2918} {"train_loss": -12.86281681060791, "global_step": 490254, "epoch": 2918} {"train_loss": -12.886529922485352, "global_step": 490255, "epoch": 2918} {"train_loss": -12.67016887664795, "global_step": 490256, "epoch": 2918} {"train_loss": -12.713876724243164, "global_step": 490257, "epoch": 2918} {"train_loss": -12.637378692626953, "global_step": 490258, "epoch": 2918} {"train_loss": -12.706889152526855, "global_step": 490259, "epoch": 2918} {"train_loss": -12.734688758850098, "global_step": 490260, "epoch": 2918} {"train_loss": -12.891366004943848, "global_step": 490261, "epoch": 2918} {"train_loss": -12.315503120422363, "global_step": 490262, "epoch": 2918} {"train_loss": -12.492273330688477, "global_step": 490263, "epoch": 2918} {"train_loss": -12.67795467376709, "global_step": 490264, "epoch": 2918} {"train_loss": -12.417436599731445, "global_step": 490265, "epoch": 2918} {"train_loss": -12.718315124511719, "global_step": 490266, "epoch": 2918} {"train_loss": -11.912690162658691, "global_step": 490267, "epoch": 2918} {"train_loss": -12.74681282043457, "global_step": 490268, "epoch": 2918} {"train_loss": -11.932168006896973, "global_step": 490269, "epoch": 2918} {"train_loss": -12.202226638793945, "global_step": 490270, "epoch": 2918} {"train_loss": -12.632644653320312, "global_step": 490271, "epoch": 2918} {"train_loss": -11.750425338745117, "global_step": 490272, "epoch": 2918} {"train_loss": -12.369007110595703, "global_step": 490273, "epoch": 2918} {"train_loss": -12.005735397338867, "global_step": 490274, "epoch": 2918} {"train_loss": -10.939838409423828, "global_step": 490275, "epoch": 2918} {"train_loss": -10.900932312011719, "global_step": 490276, "epoch": 2918} {"train_loss": -10.598051071166992, "global_step": 490277, "epoch": 2918} {"train_loss": -12.10449504852295, "global_step": 490278, "epoch": 2918} {"train_loss": -11.428354263305664, "global_step": 490279, "epoch": 2918} {"train_loss": -11.307536125183105, "global_step": 490280, "epoch": 2918} {"train_loss": -11.88913345336914, "global_step": 490281, "epoch": 2918} {"train_loss": -11.423307418823242, "global_step": 490282, "epoch": 2918} {"train_loss": -11.215948104858398, "global_step": 490283, "epoch": 2918} {"train_loss": -10.72872543334961, "global_step": 490284, "epoch": 2918} {"train_loss": -11.863029479980469, "global_step": 490285, "epoch": 2918} {"train_loss": -12.152235984802246, "global_step": 490286, "epoch": 2918} {"train_loss": -12.174988746643066, "global_step": 490287, "epoch": 2918} {"train_loss": -12.351483345031738, "global_step": 490288, "epoch": 2918} {"train_loss": -11.733094215393066, "global_step": 490289, "epoch": 2918} {"train_loss": -12.004804611206055, "global_step": 490290, "epoch": 2918} {"train_loss": -12.062875747680664, "global_step": 490291, "epoch": 2918} {"train_loss": -11.848737716674805, "global_step": 490292, "epoch": 2918} {"train_loss": -12.323406219482422, "global_step": 490293, "epoch": 2918} {"train_loss": -11.552202224731445, "global_step": 490294, "epoch": 2918} {"train_loss": -11.940851211547852, "global_step": 490295, "epoch": 2918} {"train_loss": -11.73110580444336, "global_step": 490296, "epoch": 2918} {"train_loss": -12.027120590209961, "global_step": 490297, "epoch": 2918} {"train_loss": -12.378776550292969, "global_step": 490298, "epoch": 2918} {"train_loss": -12.26553726196289, "global_step": 490299, "epoch": 2918} {"train_loss": -12.180360794067383, "global_step": 490300, "epoch": 2918} {"train_loss": -11.410013198852539, "global_step": 490301, "epoch": 2918} {"train_loss": -11.950955390930176, "global_step": 490302, "epoch": 2918} {"train_loss": -11.693682670593262, "global_step": 490303, "epoch": 2918} {"train_loss": -12.741021156311035, "global_step": 490304, "epoch": 2918} {"train_loss": -11.930007934570312, "global_step": 490305, "epoch": 2918} {"train_loss": -12.322118759155273, "global_step": 490306, "epoch": 2918} {"train_loss": -11.871944427490234, "global_step": 490307, "epoch": 2918} {"train_loss": -12.307892799377441, "global_step": 490308, "epoch": 2918} {"train_loss": -12.414567947387695, "global_step": 490309, "epoch": 2918} {"train_loss": -12.229781150817871, "global_step": 490310, "epoch": 2918} {"train_loss": -12.357061386108398, "global_step": 490311, "epoch": 2918} {"train_loss": -11.87668514251709, "global_step": 490312, "epoch": 2918} {"train_loss": -12.751554489135742, "global_step": 490313, "epoch": 2918} {"train_loss": -12.111368179321289, "global_step": 490314, "epoch": 2918} {"train_loss": -12.368156433105469, "global_step": 490315, "epoch": 2918} {"train_loss": -12.200932502746582, "global_step": 490316, "epoch": 2918} {"train_loss": -12.45592975616455, "global_step": 490317, "epoch": 2918} {"train_loss": -12.711122512817383, "global_step": 490318, "epoch": 2918} {"train_loss": -12.212246894836426, "global_step": 490319, "epoch": 2918} {"train_loss": -12.56814193725586, "global_step": 490320, "epoch": 2918} {"train_loss": -12.066826820373535, "global_step": 490321, "epoch": 2918} {"train_loss": -12.641738891601562, "global_step": 490322, "epoch": 2918} {"train_loss": -11.711782455444336, "global_step": 490323, "epoch": 2918} {"train_loss": -12.260234832763672, "global_step": 490324, "epoch": 2918} {"train_loss": -12.264354705810547, "global_step": 490325, "epoch": 2918} {"train_loss": -12.486729621887207, "global_step": 490326, "epoch": 2918} {"train_loss": -12.547584533691406, "global_step": 490327, "epoch": 2918} {"train_loss": -12.445077896118164, "global_step": 490328, "epoch": 2918} {"train_loss": -12.596941947937012, "global_step": 490329, "epoch": 2918} {"train_loss": -12.45902156829834, "global_step": 490330, "epoch": 2918} {"train_loss": -12.53815746307373, "global_step": 490331, "epoch": 2918} {"train_loss": -12.739874839782715, "global_step": 490332, "epoch": 2918} {"train_loss": -12.32305908203125, "global_step": 490333, "epoch": 2918} {"train_loss": -12.460037231445312, "global_step": 490334, "epoch": 2918} {"train_loss": -12.555068969726562, "global_step": 490335, "epoch": 2918} {"train_loss": -12.618606567382812, "global_step": 490336, "epoch": 2918} {"train_loss": -12.79869556427002, "global_step": 490337, "epoch": 2918} {"train_loss": -12.530439376831055, "global_step": 490338, "epoch": 2918} {"train_loss": -12.796709060668945, "global_step": 490339, "epoch": 2918} {"train_loss": -12.56428050994873, "global_step": 490340, "epoch": 2918} {"train_loss": -12.489999771118164, "global_step": 490341, "epoch": 2918} {"train_loss": -12.848007202148438, "global_step": 490342, "epoch": 2918} {"train_loss": -12.39210319519043, "global_step": 490343, "epoch": 2918} {"train_loss": -12.840654373168945, "global_step": 490344, "epoch": 2918} {"train_loss": -12.531201362609863, "global_step": 490345, "epoch": 2918} {"train_loss": -12.473662376403809, "global_step": 490346, "epoch": 2918} {"train_loss": -12.644976615905762, "global_step": 490347, "epoch": 2918} {"train_loss": -12.056159973144531, "global_step": 490348, "epoch": 2918} {"train_loss": -12.64702033996582, "global_step": 490349, "epoch": 2918} {"train_loss": -12.674619674682617, "global_step": 490350, "epoch": 2918} {"train_loss": -12.645689964294434, "global_step": 490351, "epoch": 2918} {"train_loss": -12.901342391967773, "global_step": 490352, "epoch": 2918} {"train_loss": -12.484203338623047, "global_step": 490353, "epoch": 2918} {"train_loss": -12.518980026245117, "global_step": 490354, "epoch": 2918} {"train_loss": -12.862848281860352, "global_step": 490355, "epoch": 2918} {"train_loss": -12.824262619018555, "global_step": 490356, "epoch": 2918} {"train_loss": -13.091962814331055, "global_step": 490357, "epoch": 2918} {"train_loss": -12.703181266784668, "global_step": 490358, "epoch": 2918} {"train_loss": -12.625297546386719, "global_step": 490359, "epoch": 2918} {"train_loss": -12.6497163772583, "global_step": 490360, "epoch": 2918} {"train_loss": -12.93875503540039, "global_step": 490361, "epoch": 2918} {"train_loss": -12.966390609741211, "global_step": 490362, "epoch": 2918} {"train_loss": -12.885828018188477, "global_step": 490363, "epoch": 2918} {"train_loss": -12.87181568145752, "global_step": 490364, "epoch": 2918} {"train_loss": -12.879728317260742, "global_step": 490365, "epoch": 2918} {"train_loss": -12.947257995605469, "global_step": 490366, "epoch": 2918} {"train_loss": -12.93165397644043, "global_step": 490367, "epoch": 2918} {"train_loss": -12.920429229736328, "global_step": 490368, "epoch": 2918} {"train_loss": -12.920489311218262, "global_step": 490369, "epoch": 2918} {"train_loss": -12.78365421295166, "global_step": 490370, "epoch": 2918} {"train_loss": -13.01622200012207, "global_step": 490371, "epoch": 2918} {"train_loss": -12.806802749633789, "global_step": 490372, "epoch": 2918} {"train_loss": -12.875150680541992, "global_step": 490373, "epoch": 2918} {"train_loss": -13.030904769897461, "global_step": 490374, "epoch": 2918} {"train_loss": -12.80150032043457, "global_step": 490375, "epoch": 2918} {"train_loss": -12.972175598144531, "global_step": 490376, "epoch": 2918} {"train_loss": -12.862869262695312, "global_step": 490377, "epoch": 2918} {"train_loss": -12.896332740783691, "global_step": 490378, "epoch": 2918} {"train_loss": -12.699808120727539, "global_step": 490379, "epoch": 2918} {"train_loss": -12.798322677612305, "global_step": 490380, "epoch": 2918} {"train_loss": -12.120295524597168, "global_step": 490381, "epoch": 2918} {"train_loss": -12.366205215454102, "global_step": 490382, "epoch": 2918} {"train_loss": -13.085315704345703, "global_step": 490383, "epoch": 2918} {"train_loss": -12.631093978881836, "global_step": 490384, "epoch": 2918} {"train_loss": -12.383925437927246, "global_step": 490385, "epoch": 2918} {"train_loss": -12.269737243652344, "global_step": 490386, "epoch": 2918} {"train_loss": -12.89002799987793, "global_step": 490387, "epoch": 2918} {"train_loss": -12.629899978637695, "global_step": 490388, "epoch": 2918} {"train_loss": -12.684389114379883, "global_step": 490389, "epoch": 2918} {"train_loss": -12.659106254577637, "global_step": 490390, "epoch": 2918} {"train_loss": -12.397752710751124, "global_step": 490391, "epoch": 2918, "val_loss": 313517.0} {"train_loss": -12.622942924499512, "global_step": 490392, "epoch": 2919} {"train_loss": -12.481013298034668, "global_step": 490393, "epoch": 2919} {"train_loss": -12.79638957977295, "global_step": 490394, "epoch": 2919} {"train_loss": -12.334514617919922, "global_step": 490395, "epoch": 2919} {"train_loss": -12.58779525756836, "global_step": 490396, "epoch": 2919} {"train_loss": -12.815649032592773, "global_step": 490397, "epoch": 2919} {"train_loss": -12.433248519897461, "global_step": 490398, "epoch": 2919} {"train_loss": -12.564485549926758, "global_step": 490399, "epoch": 2919} {"train_loss": -12.966169357299805, "global_step": 490400, "epoch": 2919} {"train_loss": -12.897573471069336, "global_step": 490401, "epoch": 2919} {"train_loss": -12.378589630126953, "global_step": 490402, "epoch": 2919} {"train_loss": -12.384330749511719, "global_step": 490403, "epoch": 2919} {"train_loss": -12.267753601074219, "global_step": 490404, "epoch": 2919} {"train_loss": -12.572225570678711, "global_step": 490405, "epoch": 2919} {"train_loss": -11.491020202636719, "global_step": 490406, "epoch": 2919} {"train_loss": -11.252516746520996, "global_step": 490407, "epoch": 2919} {"train_loss": -12.029626846313477, "global_step": 490408, "epoch": 2919} {"train_loss": -12.802135467529297, "global_step": 490409, "epoch": 2919} {"train_loss": -11.004800796508789, "global_step": 490410, "epoch": 2919} {"train_loss": -11.731656074523926, "global_step": 490411, "epoch": 2919} {"train_loss": -11.337652206420898, "global_step": 490412, "epoch": 2919} {"train_loss": -12.293210983276367, "global_step": 490413, "epoch": 2919} {"train_loss": -12.58861255645752, "global_step": 490414, "epoch": 2919} {"train_loss": -12.690003395080566, "global_step": 490415, "epoch": 2919} {"train_loss": -11.551858901977539, "global_step": 490416, "epoch": 2919} {"train_loss": -11.196285247802734, "global_step": 490417, "epoch": 2919} {"train_loss": -12.16616153717041, "global_step": 490418, "epoch": 2919} {"train_loss": -11.20907974243164, "global_step": 490419, "epoch": 2919} {"train_loss": -11.64441204071045, "global_step": 490420, "epoch": 2919} {"train_loss": -12.06969165802002, "global_step": 490421, "epoch": 2919} {"train_loss": -11.44150161743164, "global_step": 490422, "epoch": 2919} {"train_loss": -11.872233390808105, "global_step": 490423, "epoch": 2919} {"train_loss": -11.808416366577148, "global_step": 490424, "epoch": 2919} {"train_loss": -12.335476875305176, "global_step": 490425, "epoch": 2919} {"train_loss": -12.149267196655273, "global_step": 490426, "epoch": 2919} {"train_loss": -12.127220153808594, "global_step": 490427, "epoch": 2919} {"train_loss": -12.277551651000977, "global_step": 490428, "epoch": 2919} {"train_loss": -12.615078926086426, "global_step": 490429, "epoch": 2919} {"train_loss": -11.60921859741211, "global_step": 490430, "epoch": 2919} {"train_loss": -11.931693077087402, "global_step": 490431, "epoch": 2919} {"train_loss": -12.367204666137695, "global_step": 490432, "epoch": 2919} {"train_loss": -12.160629272460938, "global_step": 490433, "epoch": 2919} {"train_loss": -11.531938552856445, "global_step": 490434, "epoch": 2919} {"train_loss": -12.605169296264648, "global_step": 490435, "epoch": 2919} {"train_loss": -11.451255798339844, "global_step": 490436, "epoch": 2919} {"train_loss": -12.764410018920898, "global_step": 490437, "epoch": 2919} {"train_loss": -12.196864128112793, "global_step": 490438, "epoch": 2919} {"train_loss": -12.159762382507324, "global_step": 490439, "epoch": 2919} {"train_loss": -12.17055892944336, "global_step": 490440, "epoch": 2919} {"train_loss": -12.298913955688477, "global_step": 490441, "epoch": 2919} {"train_loss": -12.362228393554688, "global_step": 490442, "epoch": 2919} {"train_loss": -11.641854286193848, "global_step": 490443, "epoch": 2919} {"train_loss": -11.817411422729492, "global_step": 490444, "epoch": 2919} {"train_loss": -11.308931350708008, "global_step": 490445, "epoch": 2919} {"train_loss": -11.650289535522461, "global_step": 490446, "epoch": 2919} {"train_loss": -10.599534034729004, "global_step": 490447, "epoch": 2919} {"train_loss": -10.865276336669922, "global_step": 490448, "epoch": 2919} {"train_loss": -10.836335182189941, "global_step": 490449, "epoch": 2919} {"train_loss": -11.203271865844727, "global_step": 490450, "epoch": 2919} {"train_loss": -10.667896270751953, "global_step": 490451, "epoch": 2919} {"train_loss": -12.504809379577637, "global_step": 490452, "epoch": 2919} {"train_loss": -11.046806335449219, "global_step": 490453, "epoch": 2919} {"train_loss": -11.826353073120117, "global_step": 490454, "epoch": 2919} {"train_loss": -11.557289123535156, "global_step": 490455, "epoch": 2919} {"train_loss": -11.545756340026855, "global_step": 490456, "epoch": 2919} {"train_loss": -11.335841178894043, "global_step": 490457, "epoch": 2919} {"train_loss": -11.174463272094727, "global_step": 490458, "epoch": 2919} {"train_loss": -10.565505981445312, "global_step": 490459, "epoch": 2919} {"train_loss": -11.917296409606934, "global_step": 490460, "epoch": 2919} {"train_loss": -11.490498542785645, "global_step": 490461, "epoch": 2919} {"train_loss": -11.991704940795898, "global_step": 490462, "epoch": 2919} {"train_loss": -11.880839347839355, "global_step": 490463, "epoch": 2919} {"train_loss": -11.991613388061523, "global_step": 490464, "epoch": 2919} {"train_loss": -12.10380744934082, "global_step": 490465, "epoch": 2919} {"train_loss": -12.29968547821045, "global_step": 490466, "epoch": 2919} {"train_loss": -11.837838172912598, "global_step": 490467, "epoch": 2919} {"train_loss": -12.476446151733398, "global_step": 490468, "epoch": 2919} {"train_loss": -12.095170974731445, "global_step": 490469, "epoch": 2919} {"train_loss": -12.388461112976074, "global_step": 490470, "epoch": 2919} {"train_loss": -12.128247261047363, "global_step": 490471, "epoch": 2919} {"train_loss": -11.994197845458984, "global_step": 490472, "epoch": 2919} {"train_loss": -12.598323822021484, "global_step": 490473, "epoch": 2919} {"train_loss": -12.010994911193848, "global_step": 490474, "epoch": 2919} {"train_loss": -12.385642051696777, "global_step": 490475, "epoch": 2919} {"train_loss": -12.264280319213867, "global_step": 490476, "epoch": 2919} {"train_loss": -12.421257019042969, "global_step": 490477, "epoch": 2919} {"train_loss": -12.187658309936523, "global_step": 490478, "epoch": 2919} {"train_loss": -12.564167976379395, "global_step": 490479, "epoch": 2919} {"train_loss": -12.662496566772461, "global_step": 490480, "epoch": 2919} {"train_loss": -12.855993270874023, "global_step": 490481, "epoch": 2919} {"train_loss": -12.775718688964844, "global_step": 490482, "epoch": 2919} {"train_loss": -12.666059494018555, "global_step": 490483, "epoch": 2919} {"train_loss": -12.855762481689453, "global_step": 490484, "epoch": 2919} {"train_loss": -12.862932205200195, "global_step": 490485, "epoch": 2919} {"train_loss": -12.849197387695312, "global_step": 490486, "epoch": 2919} {"train_loss": -12.753999710083008, "global_step": 490487, "epoch": 2919} {"train_loss": -12.889705657958984, "global_step": 490488, "epoch": 2919} {"train_loss": -12.882040023803711, "global_step": 490489, "epoch": 2919} {"train_loss": -12.734665870666504, "global_step": 490490, "epoch": 2919} {"train_loss": -12.80262565612793, "global_step": 490491, "epoch": 2919} {"train_loss": -12.793220520019531, "global_step": 490492, "epoch": 2919} {"train_loss": -12.59775161743164, "global_step": 490493, "epoch": 2919} {"train_loss": -12.64113998413086, "global_step": 490494, "epoch": 2919} {"train_loss": -12.54300594329834, "global_step": 490495, "epoch": 2919} {"train_loss": -12.513757705688477, "global_step": 490496, "epoch": 2919} {"train_loss": -12.741682052612305, "global_step": 490497, "epoch": 2919} {"train_loss": -12.833382606506348, "global_step": 490498, "epoch": 2919} {"train_loss": -12.617547988891602, "global_step": 490499, "epoch": 2919} {"train_loss": -12.995468139648438, "global_step": 490500, "epoch": 2919} {"train_loss": -12.807088851928711, "global_step": 490501, "epoch": 2919} {"train_loss": -12.840934753417969, "global_step": 490502, "epoch": 2919} {"train_loss": -12.842400550842285, "global_step": 490503, "epoch": 2919} {"train_loss": -12.823001861572266, "global_step": 490504, "epoch": 2919} {"train_loss": -13.105386734008789, "global_step": 490505, "epoch": 2919} {"train_loss": -12.90257453918457, "global_step": 490506, "epoch": 2919} {"train_loss": -12.854366302490234, "global_step": 490507, "epoch": 2919} {"train_loss": -12.916996002197266, "global_step": 490508, "epoch": 2919} {"train_loss": -12.861384391784668, "global_step": 490509, "epoch": 2919} {"train_loss": -13.017128944396973, "global_step": 490510, "epoch": 2919} {"train_loss": -13.066783905029297, "global_step": 490511, "epoch": 2919} {"train_loss": -12.869379997253418, "global_step": 490512, "epoch": 2919} {"train_loss": -12.79323959350586, "global_step": 490513, "epoch": 2919} {"train_loss": -12.872291564941406, "global_step": 490514, "epoch": 2919} {"train_loss": -13.018341064453125, "global_step": 490515, "epoch": 2919} {"train_loss": -13.015670776367188, "global_step": 490516, "epoch": 2919} {"train_loss": -13.00738525390625, "global_step": 490517, "epoch": 2919} {"train_loss": -13.075596809387207, "global_step": 490518, "epoch": 2919} {"train_loss": -12.961606979370117, "global_step": 490519, "epoch": 2919} {"train_loss": -13.148265838623047, "global_step": 490520, "epoch": 2919} {"train_loss": -13.055646896362305, "global_step": 490521, "epoch": 2919} {"train_loss": -12.864320755004883, "global_step": 490522, "epoch": 2919} {"train_loss": -12.674337387084961, "global_step": 490523, "epoch": 2919} {"train_loss": -12.898405075073242, "global_step": 490524, "epoch": 2919} {"train_loss": -12.927298545837402, "global_step": 490525, "epoch": 2919} {"train_loss": -13.014877319335938, "global_step": 490526, "epoch": 2919} {"train_loss": -13.071680068969727, "global_step": 490527, "epoch": 2919} {"train_loss": -13.084802627563477, "global_step": 490528, "epoch": 2919} {"train_loss": -13.073432922363281, "global_step": 490529, "epoch": 2919} {"train_loss": -13.194648742675781, "global_step": 490530, "epoch": 2919} {"train_loss": -13.08051872253418, "global_step": 490531, "epoch": 2919} {"train_loss": -13.242654800415039, "global_step": 490532, "epoch": 2919} {"train_loss": -12.970354080200195, "global_step": 490533, "epoch": 2919} {"train_loss": -12.859257698059082, "global_step": 490534, "epoch": 2919} {"train_loss": -12.972650527954102, "global_step": 490535, "epoch": 2919} {"train_loss": -12.457941055297852, "global_step": 490536, "epoch": 2919} {"train_loss": -13.021039962768555, "global_step": 490537, "epoch": 2919} {"train_loss": -12.500781059265137, "global_step": 490538, "epoch": 2919} {"train_loss": -11.541418075561523, "global_step": 490539, "epoch": 2919} {"train_loss": -10.041047096252441, "global_step": 490540, "epoch": 2919} {"train_loss": -10.208579063415527, "global_step": 490541, "epoch": 2919} {"train_loss": -11.763957023620605, "global_step": 490542, "epoch": 2919} {"train_loss": -11.468031883239746, "global_step": 490543, "epoch": 2919} {"train_loss": -10.195606231689453, "global_step": 490544, "epoch": 2919} {"train_loss": -10.470292091369629, "global_step": 490545, "epoch": 2919} {"train_loss": -10.818987846374512, "global_step": 490546, "epoch": 2919} {"train_loss": -10.969661712646484, "global_step": 490547, "epoch": 2919} {"train_loss": -11.576338768005371, "global_step": 490548, "epoch": 2919} {"train_loss": -11.098556518554688, "global_step": 490549, "epoch": 2919} {"train_loss": -11.925849914550781, "global_step": 490550, "epoch": 2919} {"train_loss": -11.146357536315918, "global_step": 490551, "epoch": 2919} {"train_loss": -11.24074935913086, "global_step": 490552, "epoch": 2919} {"train_loss": -11.201879501342773, "global_step": 490553, "epoch": 2919} {"train_loss": -12.108728408813477, "global_step": 490554, "epoch": 2919} {"train_loss": -10.814117431640625, "global_step": 490555, "epoch": 2919} {"train_loss": -10.041425704956055, "global_step": 490556, "epoch": 2919} {"train_loss": -11.109824180603027, "global_step": 490557, "epoch": 2919} {"train_loss": -10.722912788391113, "global_step": 490558, "epoch": 2919} {"train_loss": -12.17681782586234, "global_step": 490559, "epoch": 2919, "val_loss": 315039.5} {"train_loss": -11.740964889526367, "global_step": 490560, "epoch": 2920} {"train_loss": -11.682181358337402, "global_step": 490561, "epoch": 2920} {"train_loss": -11.933523178100586, "global_step": 490562, "epoch": 2920} {"train_loss": -11.070075988769531, "global_step": 490563, "epoch": 2920} {"train_loss": -11.478888511657715, "global_step": 490564, "epoch": 2920} {"train_loss": -11.501785278320312, "global_step": 490565, "epoch": 2920} {"train_loss": -9.923637390136719, "global_step": 490566, "epoch": 2920} {"train_loss": -11.804311752319336, "global_step": 490567, "epoch": 2920} {"train_loss": -10.640552520751953, "global_step": 490568, "epoch": 2920} {"train_loss": -12.028204917907715, "global_step": 490569, "epoch": 2920} {"train_loss": -10.463640213012695, "global_step": 490570, "epoch": 2920} {"train_loss": -10.246408462524414, "global_step": 490571, "epoch": 2920} {"train_loss": -11.346317291259766, "global_step": 490572, "epoch": 2920} {"train_loss": -8.86375617980957, "global_step": 490573, "epoch": 2920} {"train_loss": -10.687644958496094, "global_step": 490574, "epoch": 2920} {"train_loss": -10.825202941894531, "global_step": 490575, "epoch": 2920} {"train_loss": -9.552595138549805, "global_step": 490576, "epoch": 2920} {"train_loss": -9.378052711486816, "global_step": 490577, "epoch": 2920} {"train_loss": -9.252609252929688, "global_step": 490578, "epoch": 2920} {"train_loss": -9.268510818481445, "global_step": 490579, "epoch": 2920} {"train_loss": -11.34918212890625, "global_step": 490580, "epoch": 2920} {"train_loss": -10.22730827331543, "global_step": 490581, "epoch": 2920} {"train_loss": -10.085116386413574, "global_step": 490582, "epoch": 2920} {"train_loss": -11.1463623046875, "global_step": 490583, "epoch": 2920} {"train_loss": -10.190946578979492, "global_step": 490584, "epoch": 2920} {"train_loss": -10.453810691833496, "global_step": 490585, "epoch": 2920} {"train_loss": -10.712503433227539, "global_step": 490586, "epoch": 2920} {"train_loss": -10.457752227783203, "global_step": 490587, "epoch": 2920} {"train_loss": -10.924558639526367, "global_step": 490588, "epoch": 2920} {"train_loss": -11.143289566040039, "global_step": 490589, "epoch": 2920} {"train_loss": -11.378423690795898, "global_step": 490590, "epoch": 2920} {"train_loss": -11.909040451049805, "global_step": 490591, "epoch": 2920} {"train_loss": -10.995210647583008, "global_step": 490592, "epoch": 2920} {"train_loss": -11.400681495666504, "global_step": 490593, "epoch": 2920} {"train_loss": -12.049759864807129, "global_step": 490594, "epoch": 2920} {"train_loss": -11.52308464050293, "global_step": 490595, "epoch": 2920} {"train_loss": -11.720630645751953, "global_step": 490596, "epoch": 2920} {"train_loss": -11.606206893920898, "global_step": 490597, "epoch": 2920} {"train_loss": -12.223592758178711, "global_step": 490598, "epoch": 2920} {"train_loss": -11.87172794342041, "global_step": 490599, "epoch": 2920} {"train_loss": -12.089923858642578, "global_step": 490600, "epoch": 2920} {"train_loss": -11.619083404541016, "global_step": 490601, "epoch": 2920} {"train_loss": -12.018664360046387, "global_step": 490602, "epoch": 2920} {"train_loss": -11.887287139892578, "global_step": 490603, "epoch": 2920} {"train_loss": -12.432340621948242, "global_step": 490604, "epoch": 2920} {"train_loss": -12.086545944213867, "global_step": 490605, "epoch": 2920} {"train_loss": -12.423851013183594, "global_step": 490606, "epoch": 2920} {"train_loss": -11.790458679199219, "global_step": 490607, "epoch": 2920} {"train_loss": -12.355085372924805, "global_step": 490608, "epoch": 2920} {"train_loss": -12.363360404968262, "global_step": 490609, "epoch": 2920} {"train_loss": -12.291457176208496, "global_step": 490610, "epoch": 2920} {"train_loss": -12.404029846191406, "global_step": 490611, "epoch": 2920} {"train_loss": -12.431316375732422, "global_step": 490612, "epoch": 2920} {"train_loss": -12.248042106628418, "global_step": 490613, "epoch": 2920} {"train_loss": -12.33884334564209, "global_step": 490614, "epoch": 2920} {"train_loss": -12.642309188842773, "global_step": 490615, "epoch": 2920} {"train_loss": -12.475690841674805, "global_step": 490616, "epoch": 2920} {"train_loss": -12.534427642822266, "global_step": 490617, "epoch": 2920} {"train_loss": -12.600858688354492, "global_step": 490618, "epoch": 2920} {"train_loss": -12.390426635742188, "global_step": 490619, "epoch": 2920} {"train_loss": -12.566671371459961, "global_step": 490620, "epoch": 2920} {"train_loss": -12.5516939163208, "global_step": 490621, "epoch": 2920} {"train_loss": -12.639261245727539, "global_step": 490622, "epoch": 2920} {"train_loss": -12.63392162322998, "global_step": 490623, "epoch": 2920} {"train_loss": -12.735892295837402, "global_step": 490624, "epoch": 2920} {"train_loss": -12.80140495300293, "global_step": 490625, "epoch": 2920} {"train_loss": -12.609599113464355, "global_step": 490626, "epoch": 2920} {"train_loss": -12.408525466918945, "global_step": 490627, "epoch": 2920} {"train_loss": -12.648031234741211, "global_step": 490628, "epoch": 2920} {"train_loss": -12.84731674194336, "global_step": 490629, "epoch": 2920} {"train_loss": -12.673018455505371, "global_step": 490630, "epoch": 2920} {"train_loss": -12.807622909545898, "global_step": 490631, "epoch": 2920} {"train_loss": -12.713977813720703, "global_step": 490632, "epoch": 2920} {"train_loss": -12.608634948730469, "global_step": 490633, "epoch": 2920} {"train_loss": -12.711678504943848, "global_step": 490634, "epoch": 2920} {"train_loss": -12.86397933959961, "global_step": 490635, "epoch": 2920} {"train_loss": -12.768730163574219, "global_step": 490636, "epoch": 2920} {"train_loss": -12.822912216186523, "global_step": 490637, "epoch": 2920} {"train_loss": -12.68004322052002, "global_step": 490638, "epoch": 2920} {"train_loss": -12.893409729003906, "global_step": 490639, "epoch": 2920} {"train_loss": -12.769353866577148, "global_step": 490640, "epoch": 2920} {"train_loss": -12.840154647827148, "global_step": 490641, "epoch": 2920} {"train_loss": -12.478666305541992, "global_step": 490642, "epoch": 2920} {"train_loss": -12.661893844604492, "global_step": 490643, "epoch": 2920} {"train_loss": -12.749502182006836, "global_step": 490644, "epoch": 2920} {"train_loss": -12.625480651855469, "global_step": 490645, "epoch": 2920} {"train_loss": -12.35898208618164, "global_step": 490646, "epoch": 2920} {"train_loss": -12.740251541137695, "global_step": 490647, "epoch": 2920} {"train_loss": -12.573373794555664, "global_step": 490648, "epoch": 2920} {"train_loss": -12.646774291992188, "global_step": 490649, "epoch": 2920} {"train_loss": -12.798946380615234, "global_step": 490650, "epoch": 2920} {"train_loss": -12.886114120483398, "global_step": 490651, "epoch": 2920} {"train_loss": -12.742219924926758, "global_step": 490652, "epoch": 2920} {"train_loss": -12.587711334228516, "global_step": 490653, "epoch": 2920} {"train_loss": -12.688475608825684, "global_step": 490654, "epoch": 2920} {"train_loss": -12.806017875671387, "global_step": 490655, "epoch": 2920} {"train_loss": -12.427252769470215, "global_step": 490656, "epoch": 2920} {"train_loss": -12.979593276977539, "global_step": 490657, "epoch": 2920} {"train_loss": -12.908748626708984, "global_step": 490658, "epoch": 2920} {"train_loss": -12.83220386505127, "global_step": 490659, "epoch": 2920} {"train_loss": -12.787216186523438, "global_step": 490660, "epoch": 2920} {"train_loss": -12.694583892822266, "global_step": 490661, "epoch": 2920} {"train_loss": -13.009044647216797, "global_step": 490662, "epoch": 2920} {"train_loss": -12.821788787841797, "global_step": 490663, "epoch": 2920} {"train_loss": -12.923828125, "global_step": 490664, "epoch": 2920} {"train_loss": -13.032886505126953, "global_step": 490665, "epoch": 2920} {"train_loss": -12.956271171569824, "global_step": 490666, "epoch": 2920} {"train_loss": -13.109512329101562, "global_step": 490667, "epoch": 2920} {"train_loss": -12.893425941467285, "global_step": 490668, "epoch": 2920} {"train_loss": -12.822633743286133, "global_step": 490669, "epoch": 2920} {"train_loss": -12.966187477111816, "global_step": 490670, "epoch": 2920} {"train_loss": -13.164647102355957, "global_step": 490671, "epoch": 2920} {"train_loss": -12.822218894958496, "global_step": 490672, "epoch": 2920} {"train_loss": -12.675146102905273, "global_step": 490673, "epoch": 2920} {"train_loss": -12.993919372558594, "global_step": 490674, "epoch": 2920} {"train_loss": -12.774307250976562, "global_step": 490675, "epoch": 2920} {"train_loss": -12.478212356567383, "global_step": 490676, "epoch": 2920} {"train_loss": -12.948127746582031, "global_step": 490677, "epoch": 2920} {"train_loss": -12.738648414611816, "global_step": 490678, "epoch": 2920} {"train_loss": -12.769755363464355, "global_step": 490679, "epoch": 2920} {"train_loss": -12.31462287902832, "global_step": 490680, "epoch": 2920} {"train_loss": -12.661308288574219, "global_step": 490681, "epoch": 2920} {"train_loss": -12.420088768005371, "global_step": 490682, "epoch": 2920} {"train_loss": -12.369645118713379, "global_step": 490683, "epoch": 2920} {"train_loss": -11.35287857055664, "global_step": 490684, "epoch": 2920} {"train_loss": -12.030508995056152, "global_step": 490685, "epoch": 2920} {"train_loss": -12.282405853271484, "global_step": 490686, "epoch": 2920} {"train_loss": -11.78111743927002, "global_step": 490687, "epoch": 2920} {"train_loss": -10.664436340332031, "global_step": 490688, "epoch": 2920} {"train_loss": -11.907323837280273, "global_step": 490689, "epoch": 2920} {"train_loss": -11.84780216217041, "global_step": 490690, "epoch": 2920} {"train_loss": -10.556207656860352, "global_step": 490691, "epoch": 2920} {"train_loss": -9.865686416625977, "global_step": 490692, "epoch": 2920} {"train_loss": -9.291210174560547, "global_step": 490693, "epoch": 2920} {"train_loss": -10.681715965270996, "global_step": 490694, "epoch": 2920} {"train_loss": -11.183597564697266, "global_step": 490695, "epoch": 2920} {"train_loss": -10.73863410949707, "global_step": 490696, "epoch": 2920} {"train_loss": -11.805532455444336, "global_step": 490697, "epoch": 2920} {"train_loss": -10.306673049926758, "global_step": 490698, "epoch": 2920} {"train_loss": -11.17405891418457, "global_step": 490699, "epoch": 2920} {"train_loss": -11.162532806396484, "global_step": 490700, "epoch": 2920} {"train_loss": -9.951791763305664, "global_step": 490701, "epoch": 2920} {"train_loss": -11.901527404785156, "global_step": 490702, "epoch": 2920} {"train_loss": -10.75013542175293, "global_step": 490703, "epoch": 2920} {"train_loss": -10.383125305175781, "global_step": 490704, "epoch": 2920} {"train_loss": -10.910054206848145, "global_step": 490705, "epoch": 2920} {"train_loss": -11.305461883544922, "global_step": 490706, "epoch": 2920} {"train_loss": -10.675153732299805, "global_step": 490707, "epoch": 2920} {"train_loss": -11.299444198608398, "global_step": 490708, "epoch": 2920} {"train_loss": -11.016729354858398, "global_step": 490709, "epoch": 2920} {"train_loss": -11.514436721801758, "global_step": 490710, "epoch": 2920} {"train_loss": -12.049824714660645, "global_step": 490711, "epoch": 2920} {"train_loss": -11.767626762390137, "global_step": 490712, "epoch": 2920} {"train_loss": -11.591036796569824, "global_step": 490713, "epoch": 2920} {"train_loss": -11.541327476501465, "global_step": 490714, "epoch": 2920} {"train_loss": -11.960378646850586, "global_step": 490715, "epoch": 2920} {"train_loss": -11.995339393615723, "global_step": 490716, "epoch": 2920} {"train_loss": -11.55529499053955, "global_step": 490717, "epoch": 2920} {"train_loss": -12.444388389587402, "global_step": 490718, "epoch": 2920} {"train_loss": -10.996116638183594, "global_step": 490719, "epoch": 2920} {"train_loss": -11.566454887390137, "global_step": 490720, "epoch": 2920} {"train_loss": -11.686419486999512, "global_step": 490721, "epoch": 2920} {"train_loss": -11.809309959411621, "global_step": 490722, "epoch": 2920} {"train_loss": -12.11012077331543, "global_step": 490723, "epoch": 2920} {"train_loss": -11.974021911621094, "global_step": 490724, "epoch": 2920} {"train_loss": -12.405380249023438, "global_step": 490725, "epoch": 2920} {"train_loss": -12.087234497070312, "global_step": 490726, "epoch": 2920} {"train_loss": -11.891973029999505, "global_step": 490727, "epoch": 2920, "val_loss": 322397.09375, "train_action_mse_error": 1.8346261978149414} {"train_loss": -12.293050765991211, "global_step": 490728, "epoch": 2921} {"train_loss": -12.254803657531738, "global_step": 490729, "epoch": 2921} {"train_loss": -12.39988899230957, "global_step": 490730, "epoch": 2921} {"train_loss": -12.313039779663086, "global_step": 490731, "epoch": 2921} {"train_loss": -12.43139934539795, "global_step": 490732, "epoch": 2921} {"train_loss": -12.449304580688477, "global_step": 490733, "epoch": 2921} {"train_loss": -12.473599433898926, "global_step": 490734, "epoch": 2921} {"train_loss": -12.368734359741211, "global_step": 490735, "epoch": 2921} {"train_loss": -12.226698875427246, "global_step": 490736, "epoch": 2921} {"train_loss": -12.362505912780762, "global_step": 490737, "epoch": 2921} {"train_loss": -12.477206230163574, "global_step": 490738, "epoch": 2921} {"train_loss": -12.21535873413086, "global_step": 490739, "epoch": 2921} {"train_loss": -12.730827331542969, "global_step": 490740, "epoch": 2921} {"train_loss": -12.139480590820312, "global_step": 490741, "epoch": 2921} {"train_loss": -12.451373100280762, "global_step": 490742, "epoch": 2921} {"train_loss": -12.37755298614502, "global_step": 490743, "epoch": 2921} {"train_loss": -12.385177612304688, "global_step": 490744, "epoch": 2921} {"train_loss": -12.693061828613281, "global_step": 490745, "epoch": 2921} {"train_loss": -12.10491943359375, "global_step": 490746, "epoch": 2921} {"train_loss": -12.461977005004883, "global_step": 490747, "epoch": 2921} {"train_loss": -12.345877647399902, "global_step": 490748, "epoch": 2921} {"train_loss": -12.698088645935059, "global_step": 490749, "epoch": 2921} {"train_loss": -12.737239837646484, "global_step": 490750, "epoch": 2921} {"train_loss": -12.5044527053833, "global_step": 490751, "epoch": 2921} {"train_loss": -12.583526611328125, "global_step": 490752, "epoch": 2921} {"train_loss": -12.662044525146484, "global_step": 490753, "epoch": 2921} {"train_loss": -12.421055793762207, "global_step": 490754, "epoch": 2921} {"train_loss": -12.652478218078613, "global_step": 490755, "epoch": 2921} {"train_loss": -12.625391006469727, "global_step": 490756, "epoch": 2921} {"train_loss": -12.496965408325195, "global_step": 490757, "epoch": 2921} {"train_loss": -12.654674530029297, "global_step": 490758, "epoch": 2921} {"train_loss": -12.834150314331055, "global_step": 490759, "epoch": 2921} {"train_loss": -12.732940673828125, "global_step": 490760, "epoch": 2921} {"train_loss": -12.7280855178833, "global_step": 490761, "epoch": 2921} {"train_loss": -12.596396446228027, "global_step": 490762, "epoch": 2921} {"train_loss": -12.89111614227295, "global_step": 490763, "epoch": 2921} {"train_loss": -12.632539749145508, "global_step": 490764, "epoch": 2921} {"train_loss": -12.475132942199707, "global_step": 490765, "epoch": 2921} {"train_loss": -12.904640197753906, "global_step": 490766, "epoch": 2921} {"train_loss": -12.78274154663086, "global_step": 490767, "epoch": 2921} {"train_loss": -12.635683059692383, "global_step": 490768, "epoch": 2921} {"train_loss": -12.74018383026123, "global_step": 490769, "epoch": 2921} {"train_loss": -12.249313354492188, "global_step": 490770, "epoch": 2921} {"train_loss": -12.44344425201416, "global_step": 490771, "epoch": 2921} {"train_loss": -12.879081726074219, "global_step": 490772, "epoch": 2921} {"train_loss": -12.448371887207031, "global_step": 490773, "epoch": 2921} {"train_loss": -12.7328519821167, "global_step": 490774, "epoch": 2921} {"train_loss": -12.767337799072266, "global_step": 490775, "epoch": 2921} {"train_loss": -12.9466552734375, "global_step": 490776, "epoch": 2921} {"train_loss": -12.770922660827637, "global_step": 490777, "epoch": 2921} {"train_loss": -12.636590957641602, "global_step": 490778, "epoch": 2921} {"train_loss": -12.195792198181152, "global_step": 490779, "epoch": 2921} {"train_loss": -12.90859603881836, "global_step": 490780, "epoch": 2921} {"train_loss": -11.92785358428955, "global_step": 490781, "epoch": 2921} {"train_loss": -12.05721378326416, "global_step": 490782, "epoch": 2921} {"train_loss": -12.5708646774292, "global_step": 490783, "epoch": 2921} {"train_loss": -11.614096641540527, "global_step": 490784, "epoch": 2921} {"train_loss": -12.296219825744629, "global_step": 490785, "epoch": 2921} {"train_loss": -12.086151123046875, "global_step": 490786, "epoch": 2921} {"train_loss": -9.732152938842773, "global_step": 490787, "epoch": 2921} {"train_loss": -10.52481746673584, "global_step": 490788, "epoch": 2921} {"train_loss": -10.149091720581055, "global_step": 490789, "epoch": 2921} {"train_loss": -11.644827842712402, "global_step": 490790, "epoch": 2921} {"train_loss": -8.731330871582031, "global_step": 490791, "epoch": 2921} {"train_loss": -8.081769943237305, "global_step": 490792, "epoch": 2921} {"train_loss": -10.620058059692383, "global_step": 490793, "epoch": 2921} {"train_loss": -8.72216796875, "global_step": 490794, "epoch": 2921} {"train_loss": -8.455180168151855, "global_step": 490795, "epoch": 2921} {"train_loss": -7.6100873947143555, "global_step": 490796, "epoch": 2921} {"train_loss": -8.576794624328613, "global_step": 490797, "epoch": 2921} {"train_loss": -8.909799575805664, "global_step": 490798, "epoch": 2921} {"train_loss": -10.428057670593262, "global_step": 490799, "epoch": 2921} {"train_loss": -10.643132209777832, "global_step": 490800, "epoch": 2921} {"train_loss": -10.32989501953125, "global_step": 490801, "epoch": 2921} {"train_loss": -10.680322647094727, "global_step": 490802, "epoch": 2921} {"train_loss": -11.08560562133789, "global_step": 490803, "epoch": 2921} {"train_loss": -11.3782958984375, "global_step": 490804, "epoch": 2921} {"train_loss": -10.5772066116333, "global_step": 490805, "epoch": 2921} {"train_loss": -10.644622802734375, "global_step": 490806, "epoch": 2921} {"train_loss": -11.377946853637695, "global_step": 490807, "epoch": 2921} {"train_loss": -9.75663948059082, "global_step": 490808, "epoch": 2921} {"train_loss": -10.463193893432617, "global_step": 490809, "epoch": 2921} {"train_loss": -12.023136138916016, "global_step": 490810, "epoch": 2921} {"train_loss": -10.612869262695312, "global_step": 490811, "epoch": 2921} {"train_loss": -11.115720748901367, "global_step": 490812, "epoch": 2921} {"train_loss": -10.743074417114258, "global_step": 490813, "epoch": 2921} {"train_loss": -11.506113052368164, "global_step": 490814, "epoch": 2921} {"train_loss": -10.862810134887695, "global_step": 490815, "epoch": 2921} {"train_loss": -11.603057861328125, "global_step": 490816, "epoch": 2921} {"train_loss": -10.020874977111816, "global_step": 490817, "epoch": 2921} {"train_loss": -11.37800121307373, "global_step": 490818, "epoch": 2921} {"train_loss": -11.595996856689453, "global_step": 490819, "epoch": 2921} {"train_loss": -11.629434585571289, "global_step": 490820, "epoch": 2921} {"train_loss": -11.58570671081543, "global_step": 490821, "epoch": 2921} {"train_loss": -11.554506301879883, "global_step": 490822, "epoch": 2921} {"train_loss": -11.816789627075195, "global_step": 490823, "epoch": 2921} {"train_loss": -11.371994018554688, "global_step": 490824, "epoch": 2921} {"train_loss": -10.626386642456055, "global_step": 490825, "epoch": 2921} {"train_loss": -11.90672492980957, "global_step": 490826, "epoch": 2921} {"train_loss": -11.333641052246094, "global_step": 490827, "epoch": 2921} {"train_loss": -11.83721923828125, "global_step": 490828, "epoch": 2921} {"train_loss": -11.511592864990234, "global_step": 490829, "epoch": 2921} {"train_loss": -11.923165321350098, "global_step": 490830, "epoch": 2921} {"train_loss": -11.80156135559082, "global_step": 490831, "epoch": 2921} {"train_loss": -11.65959644317627, "global_step": 490832, "epoch": 2921} {"train_loss": -11.908032417297363, "global_step": 490833, "epoch": 2921} {"train_loss": -12.01962661743164, "global_step": 490834, "epoch": 2921} {"train_loss": -11.962125778198242, "global_step": 490835, "epoch": 2921} {"train_loss": -12.065939903259277, "global_step": 490836, "epoch": 2921} {"train_loss": -12.021242141723633, "global_step": 490837, "epoch": 2921} {"train_loss": -12.547598838806152, "global_step": 490838, "epoch": 2921} {"train_loss": -11.654369354248047, "global_step": 490839, "epoch": 2921} {"train_loss": -12.461480140686035, "global_step": 490840, "epoch": 2921} {"train_loss": -12.186113357543945, "global_step": 490841, "epoch": 2921} {"train_loss": -12.190792083740234, "global_step": 490842, "epoch": 2921} {"train_loss": -12.452743530273438, "global_step": 490843, "epoch": 2921} {"train_loss": -12.369235038757324, "global_step": 490844, "epoch": 2921} {"train_loss": -12.322139739990234, "global_step": 490845, "epoch": 2921} {"train_loss": -12.375481605529785, "global_step": 490846, "epoch": 2921} {"train_loss": -12.129122734069824, "global_step": 490847, "epoch": 2921} {"train_loss": -12.054596900939941, "global_step": 490848, "epoch": 2921} {"train_loss": -12.168052673339844, "global_step": 490849, "epoch": 2921} {"train_loss": -12.106746673583984, "global_step": 490850, "epoch": 2921} {"train_loss": -12.128202438354492, "global_step": 490851, "epoch": 2921} {"train_loss": -12.114923477172852, "global_step": 490852, "epoch": 2921} {"train_loss": -11.973933219909668, "global_step": 490853, "epoch": 2921} {"train_loss": -12.5111665725708, "global_step": 490854, "epoch": 2921} {"train_loss": -12.248764038085938, "global_step": 490855, "epoch": 2921} {"train_loss": -12.563039779663086, "global_step": 490856, "epoch": 2921} {"train_loss": -12.486713409423828, "global_step": 490857, "epoch": 2921} {"train_loss": -12.33139419555664, "global_step": 490858, "epoch": 2921} {"train_loss": -12.570754051208496, "global_step": 490859, "epoch": 2921} {"train_loss": -12.1776123046875, "global_step": 490860, "epoch": 2921} {"train_loss": -12.530574798583984, "global_step": 490861, "epoch": 2921} {"train_loss": -12.28973388671875, "global_step": 490862, "epoch": 2921} {"train_loss": -12.24493408203125, "global_step": 490863, "epoch": 2921} {"train_loss": -12.340620994567871, "global_step": 490864, "epoch": 2921} {"train_loss": -12.393284797668457, "global_step": 490865, "epoch": 2921} {"train_loss": -12.178646087646484, "global_step": 490866, "epoch": 2921} {"train_loss": -12.439162254333496, "global_step": 490867, "epoch": 2921} {"train_loss": -12.22488021850586, "global_step": 490868, "epoch": 2921} {"train_loss": -12.406627655029297, "global_step": 490869, "epoch": 2921} {"train_loss": -12.382442474365234, "global_step": 490870, "epoch": 2921} {"train_loss": -12.472065925598145, "global_step": 490871, "epoch": 2921} {"train_loss": -12.55248737335205, "global_step": 490872, "epoch": 2921} {"train_loss": -12.284002304077148, "global_step": 490873, "epoch": 2921} {"train_loss": -12.693681716918945, "global_step": 490874, "epoch": 2921} {"train_loss": -12.540237426757812, "global_step": 490875, "epoch": 2921} {"train_loss": -12.47783088684082, "global_step": 490876, "epoch": 2921} {"train_loss": -12.718423843383789, "global_step": 490877, "epoch": 2921} {"train_loss": -12.508646011352539, "global_step": 490878, "epoch": 2921} {"train_loss": -12.576656341552734, "global_step": 490879, "epoch": 2921} {"train_loss": -12.573526382446289, "global_step": 490880, "epoch": 2921} {"train_loss": -12.355122566223145, "global_step": 490881, "epoch": 2921} {"train_loss": -12.473018646240234, "global_step": 490882, "epoch": 2921} {"train_loss": -12.58473014831543, "global_step": 490883, "epoch": 2921} {"train_loss": -12.409915924072266, "global_step": 490884, "epoch": 2921} {"train_loss": -12.325153350830078, "global_step": 490885, "epoch": 2921} {"train_loss": -12.761528015136719, "global_step": 490886, "epoch": 2921} {"train_loss": -12.506671905517578, "global_step": 490887, "epoch": 2921} {"train_loss": -12.730405807495117, "global_step": 490888, "epoch": 2921} {"train_loss": -12.553417205810547, "global_step": 490889, "epoch": 2921} {"train_loss": -12.58115005493164, "global_step": 490890, "epoch": 2921} {"train_loss": -12.535666465759277, "global_step": 490891, "epoch": 2921} {"train_loss": -12.351547241210938, "global_step": 490892, "epoch": 2921} {"train_loss": -12.6044921875, "global_step": 490893, "epoch": 2921} {"train_loss": -12.615354537963867, "global_step": 490894, "epoch": 2921} {"train_loss": -11.950041458720253, "global_step": 490895, "epoch": 2921, "val_loss": 317557.09375} {"train_loss": -12.457128524780273, "global_step": 490896, "epoch": 2922} {"train_loss": -12.439006805419922, "global_step": 490897, "epoch": 2922} {"train_loss": -12.701354026794434, "global_step": 490898, "epoch": 2922} {"train_loss": -12.848922729492188, "global_step": 490899, "epoch": 2922} {"train_loss": -12.67698860168457, "global_step": 490900, "epoch": 2922} {"train_loss": -12.516857147216797, "global_step": 490901, "epoch": 2922} {"train_loss": -12.784603118896484, "global_step": 490902, "epoch": 2922} {"train_loss": -12.865640640258789, "global_step": 490903, "epoch": 2922} {"train_loss": -12.62895393371582, "global_step": 490904, "epoch": 2922} {"train_loss": -12.706562042236328, "global_step": 490905, "epoch": 2922} {"train_loss": -12.834558486938477, "global_step": 490906, "epoch": 2922} {"train_loss": -12.71180534362793, "global_step": 490907, "epoch": 2922} {"train_loss": -12.858404159545898, "global_step": 490908, "epoch": 2922} {"train_loss": -12.555055618286133, "global_step": 490909, "epoch": 2922} {"train_loss": -12.131487846374512, "global_step": 490910, "epoch": 2922} {"train_loss": -12.52882194519043, "global_step": 490911, "epoch": 2922} {"train_loss": -12.545896530151367, "global_step": 490912, "epoch": 2922} {"train_loss": -11.868341445922852, "global_step": 490913, "epoch": 2922} {"train_loss": -12.67221450805664, "global_step": 490914, "epoch": 2922} {"train_loss": -12.109308242797852, "global_step": 490915, "epoch": 2922} {"train_loss": -12.251304626464844, "global_step": 490916, "epoch": 2922} {"train_loss": -12.357070922851562, "global_step": 490917, "epoch": 2922} {"train_loss": -12.396564483642578, "global_step": 490918, "epoch": 2922} {"train_loss": -12.10008430480957, "global_step": 490919, "epoch": 2922} {"train_loss": -12.272649765014648, "global_step": 490920, "epoch": 2922} {"train_loss": -12.462377548217773, "global_step": 490921, "epoch": 2922} {"train_loss": -12.082338333129883, "global_step": 490922, "epoch": 2922} {"train_loss": -12.002296447753906, "global_step": 490923, "epoch": 2922} {"train_loss": -12.309039115905762, "global_step": 490924, "epoch": 2922} {"train_loss": -12.295291900634766, "global_step": 490925, "epoch": 2922} {"train_loss": -12.521580696105957, "global_step": 490926, "epoch": 2922} {"train_loss": -12.492700576782227, "global_step": 490927, "epoch": 2922} {"train_loss": -12.294258117675781, "global_step": 490928, "epoch": 2922} {"train_loss": -11.93549919128418, "global_step": 490929, "epoch": 2922} {"train_loss": -12.73961067199707, "global_step": 490930, "epoch": 2922} {"train_loss": -12.094995498657227, "global_step": 490931, "epoch": 2922} {"train_loss": -12.77963638305664, "global_step": 490932, "epoch": 2922} {"train_loss": -12.075922012329102, "global_step": 490933, "epoch": 2922} {"train_loss": -12.55691146850586, "global_step": 490934, "epoch": 2922} {"train_loss": -12.4425630569458, "global_step": 490935, "epoch": 2922} {"train_loss": -12.562358856201172, "global_step": 490936, "epoch": 2922} {"train_loss": -12.558948516845703, "global_step": 490937, "epoch": 2922} {"train_loss": -12.065961837768555, "global_step": 490938, "epoch": 2922} {"train_loss": -12.469155311584473, "global_step": 490939, "epoch": 2922} {"train_loss": -11.883687973022461, "global_step": 490940, "epoch": 2922} {"train_loss": -12.616868019104004, "global_step": 490941, "epoch": 2922} {"train_loss": -12.281181335449219, "global_step": 490942, "epoch": 2922} {"train_loss": -12.341329574584961, "global_step": 490943, "epoch": 2922} {"train_loss": -12.580601692199707, "global_step": 490944, "epoch": 2922} {"train_loss": -11.44907283782959, "global_step": 490945, "epoch": 2922} {"train_loss": -11.706844329833984, "global_step": 490946, "epoch": 2922} {"train_loss": -10.188985824584961, "global_step": 490947, "epoch": 2922} {"train_loss": -9.834389686584473, "global_step": 490948, "epoch": 2922} {"train_loss": -10.274980545043945, "global_step": 490949, "epoch": 2922} {"train_loss": -12.253371238708496, "global_step": 490950, "epoch": 2922} {"train_loss": -10.752525329589844, "global_step": 490951, "epoch": 2922} {"train_loss": -10.788677215576172, "global_step": 490952, "epoch": 2922} {"train_loss": -10.90361213684082, "global_step": 490953, "epoch": 2922} {"train_loss": -11.30941390991211, "global_step": 490954, "epoch": 2922} {"train_loss": -11.193313598632812, "global_step": 490955, "epoch": 2922} {"train_loss": -10.651277542114258, "global_step": 490956, "epoch": 2922} {"train_loss": -11.568843841552734, "global_step": 490957, "epoch": 2922} {"train_loss": -11.387958526611328, "global_step": 490958, "epoch": 2922} {"train_loss": -12.02290153503418, "global_step": 490959, "epoch": 2922} {"train_loss": -11.570425987243652, "global_step": 490960, "epoch": 2922} {"train_loss": -12.354154586791992, "global_step": 490961, "epoch": 2922} {"train_loss": -11.697537422180176, "global_step": 490962, "epoch": 2922} {"train_loss": -12.431781768798828, "global_step": 490963, "epoch": 2922} {"train_loss": -12.254887580871582, "global_step": 490964, "epoch": 2922} {"train_loss": -12.572283744812012, "global_step": 490965, "epoch": 2922} {"train_loss": -12.494575500488281, "global_step": 490966, "epoch": 2922} {"train_loss": -12.337696075439453, "global_step": 490967, "epoch": 2922} {"train_loss": -12.075363159179688, "global_step": 490968, "epoch": 2922} {"train_loss": -12.404199600219727, "global_step": 490969, "epoch": 2922} {"train_loss": -12.137958526611328, "global_step": 490970, "epoch": 2922} {"train_loss": -12.545215606689453, "global_step": 490971, "epoch": 2922} {"train_loss": -12.551945686340332, "global_step": 490972, "epoch": 2922} {"train_loss": -12.50982666015625, "global_step": 490973, "epoch": 2922} {"train_loss": -12.48266315460205, "global_step": 490974, "epoch": 2922} {"train_loss": -12.893172264099121, "global_step": 490975, "epoch": 2922} {"train_loss": -12.356414794921875, "global_step": 490976, "epoch": 2922} {"train_loss": -12.269292831420898, "global_step": 490977, "epoch": 2922} {"train_loss": -12.41918659210205, "global_step": 490978, "epoch": 2922} {"train_loss": -12.712699890136719, "global_step": 490979, "epoch": 2922} {"train_loss": -12.728998184204102, "global_step": 490980, "epoch": 2922} {"train_loss": -12.636218070983887, "global_step": 490981, "epoch": 2922} {"train_loss": -12.556522369384766, "global_step": 490982, "epoch": 2922} {"train_loss": -12.272933959960938, "global_step": 490983, "epoch": 2922} {"train_loss": -12.56389045715332, "global_step": 490984, "epoch": 2922} {"train_loss": -12.449857711791992, "global_step": 490985, "epoch": 2922} {"train_loss": -12.628914833068848, "global_step": 490986, "epoch": 2922} {"train_loss": -12.509721755981445, "global_step": 490987, "epoch": 2922} {"train_loss": -12.137855529785156, "global_step": 490988, "epoch": 2922} {"train_loss": -12.677515029907227, "global_step": 490989, "epoch": 2922} {"train_loss": -12.434959411621094, "global_step": 490990, "epoch": 2922} {"train_loss": -12.699349403381348, "global_step": 490991, "epoch": 2922} {"train_loss": -12.77907943725586, "global_step": 490992, "epoch": 2922} {"train_loss": -12.776238441467285, "global_step": 490993, "epoch": 2922} {"train_loss": -12.656222343444824, "global_step": 490994, "epoch": 2922} {"train_loss": -12.646397590637207, "global_step": 490995, "epoch": 2922} {"train_loss": -12.825116157531738, "global_step": 490996, "epoch": 2922} {"train_loss": -12.563382148742676, "global_step": 490997, "epoch": 2922} {"train_loss": -12.668527603149414, "global_step": 490998, "epoch": 2922} {"train_loss": -12.704277038574219, "global_step": 490999, "epoch": 2922} {"train_loss": -12.71476936340332, "global_step": 491000, "epoch": 2922} {"train_loss": -12.594874382019043, "global_step": 491001, "epoch": 2922} {"train_loss": -12.921337127685547, "global_step": 491002, "epoch": 2922} {"train_loss": -12.622285842895508, "global_step": 491003, "epoch": 2922} {"train_loss": -12.583983421325684, "global_step": 491004, "epoch": 2922} {"train_loss": -12.767358779907227, "global_step": 491005, "epoch": 2922} {"train_loss": -12.816019058227539, "global_step": 491006, "epoch": 2922} {"train_loss": -12.522125244140625, "global_step": 491007, "epoch": 2922} {"train_loss": -12.584522247314453, "global_step": 491008, "epoch": 2922} {"train_loss": -12.467682838439941, "global_step": 491009, "epoch": 2922} {"train_loss": -12.721773147583008, "global_step": 491010, "epoch": 2922} {"train_loss": -12.745956420898438, "global_step": 491011, "epoch": 2922} {"train_loss": -12.839020729064941, "global_step": 491012, "epoch": 2922} {"train_loss": -12.557865142822266, "global_step": 491013, "epoch": 2922} {"train_loss": -12.383695602416992, "global_step": 491014, "epoch": 2922} {"train_loss": -12.46493911743164, "global_step": 491015, "epoch": 2922} {"train_loss": -12.543943405151367, "global_step": 491016, "epoch": 2922} {"train_loss": -12.525105476379395, "global_step": 491017, "epoch": 2922} {"train_loss": -12.612462997436523, "global_step": 491018, "epoch": 2922} {"train_loss": -12.310053825378418, "global_step": 491019, "epoch": 2922} {"train_loss": -12.560513496398926, "global_step": 491020, "epoch": 2922} {"train_loss": -12.6779146194458, "global_step": 491021, "epoch": 2922} {"train_loss": -12.808189392089844, "global_step": 491022, "epoch": 2922} {"train_loss": -12.984241485595703, "global_step": 491023, "epoch": 2922} {"train_loss": -12.806147575378418, "global_step": 491024, "epoch": 2922} {"train_loss": -12.83081340789795, "global_step": 491025, "epoch": 2922} {"train_loss": -12.806831359863281, "global_step": 491026, "epoch": 2922} {"train_loss": -12.954554557800293, "global_step": 491027, "epoch": 2922} {"train_loss": -13.112506866455078, "global_step": 491028, "epoch": 2922} {"train_loss": -12.802160263061523, "global_step": 491029, "epoch": 2922} {"train_loss": -12.957984924316406, "global_step": 491030, "epoch": 2922} {"train_loss": -12.720743179321289, "global_step": 491031, "epoch": 2922} {"train_loss": -12.798860549926758, "global_step": 491032, "epoch": 2922} {"train_loss": -12.87382698059082, "global_step": 491033, "epoch": 2922} {"train_loss": -12.961282730102539, "global_step": 491034, "epoch": 2922} {"train_loss": -12.682254791259766, "global_step": 491035, "epoch": 2922} {"train_loss": -12.697545051574707, "global_step": 491036, "epoch": 2922} {"train_loss": -13.075981140136719, "global_step": 491037, "epoch": 2922} {"train_loss": -12.577710151672363, "global_step": 491038, "epoch": 2922} {"train_loss": -12.669259071350098, "global_step": 491039, "epoch": 2922} {"train_loss": -12.548574447631836, "global_step": 491040, "epoch": 2922} {"train_loss": -12.652727127075195, "global_step": 491041, "epoch": 2922} {"train_loss": -13.010824203491211, "global_step": 491042, "epoch": 2922} {"train_loss": -11.613738059997559, "global_step": 491043, "epoch": 2922} {"train_loss": -11.81489372253418, "global_step": 491044, "epoch": 2922} {"train_loss": -12.229618072509766, "global_step": 491045, "epoch": 2922} {"train_loss": -12.250642776489258, "global_step": 491046, "epoch": 2922} {"train_loss": -11.021564483642578, "global_step": 491047, "epoch": 2922} {"train_loss": -9.294275283813477, "global_step": 491048, "epoch": 2922} {"train_loss": -8.501169204711914, "global_step": 491049, "epoch": 2922} {"train_loss": -9.31029987335205, "global_step": 491050, "epoch": 2922} {"train_loss": -9.132710456848145, "global_step": 491051, "epoch": 2922} {"train_loss": -10.030645370483398, "global_step": 491052, "epoch": 2922} {"train_loss": -10.698742866516113, "global_step": 491053, "epoch": 2922} {"train_loss": -10.23723030090332, "global_step": 491054, "epoch": 2922} {"train_loss": -9.58709716796875, "global_step": 491055, "epoch": 2922} {"train_loss": -9.948650360107422, "global_step": 491056, "epoch": 2922} {"train_loss": -9.952064514160156, "global_step": 491057, "epoch": 2922} {"train_loss": -10.779748916625977, "global_step": 491058, "epoch": 2922} {"train_loss": -11.734892845153809, "global_step": 491059, "epoch": 2922} {"train_loss": -10.79964542388916, "global_step": 491060, "epoch": 2922} {"train_loss": -11.739189147949219, "global_step": 491061, "epoch": 2922} {"train_loss": -10.780546188354492, "global_step": 491062, "epoch": 2922} {"train_loss": -12.16093285310836, "global_step": 491063, "epoch": 2922, "val_loss": 317876.84375} {"train_loss": -11.973807334899902, "global_step": 491064, "epoch": 2923} {"train_loss": -9.961397171020508, "global_step": 491065, "epoch": 2923} {"train_loss": -11.781204223632812, "global_step": 491066, "epoch": 2923} {"train_loss": -11.055169105529785, "global_step": 491067, "epoch": 2923} {"train_loss": -10.844446182250977, "global_step": 491068, "epoch": 2923} {"train_loss": -11.574956893920898, "global_step": 491069, "epoch": 2923} {"train_loss": -10.507615089416504, "global_step": 491070, "epoch": 2923} {"train_loss": -11.136438369750977, "global_step": 491071, "epoch": 2923} {"train_loss": -11.598081588745117, "global_step": 491072, "epoch": 2923} {"train_loss": -11.021846771240234, "global_step": 491073, "epoch": 2923} {"train_loss": -11.928621292114258, "global_step": 491074, "epoch": 2923} {"train_loss": -11.906312942504883, "global_step": 491075, "epoch": 2923} {"train_loss": -11.745063781738281, "global_step": 491076, "epoch": 2923} {"train_loss": -11.311698913574219, "global_step": 491077, "epoch": 2923} {"train_loss": -12.022570610046387, "global_step": 491078, "epoch": 2923} {"train_loss": -12.223320007324219, "global_step": 491079, "epoch": 2923} {"train_loss": -12.446578979492188, "global_step": 491080, "epoch": 2923} {"train_loss": -12.260871887207031, "global_step": 491081, "epoch": 2923} {"train_loss": -12.107221603393555, "global_step": 491082, "epoch": 2923} {"train_loss": -12.263092041015625, "global_step": 491083, "epoch": 2923} {"train_loss": -12.113120079040527, "global_step": 491084, "epoch": 2923} {"train_loss": -12.413816452026367, "global_step": 491085, "epoch": 2923} {"train_loss": -12.406560897827148, "global_step": 491086, "epoch": 2923} {"train_loss": -12.046777725219727, "global_step": 491087, "epoch": 2923} {"train_loss": -12.250566482543945, "global_step": 491088, "epoch": 2923} {"train_loss": -11.87457275390625, "global_step": 491089, "epoch": 2923} {"train_loss": -11.634586334228516, "global_step": 491090, "epoch": 2923} {"train_loss": -12.169575691223145, "global_step": 491091, "epoch": 2923} {"train_loss": -11.57747745513916, "global_step": 491092, "epoch": 2923} {"train_loss": -12.078840255737305, "global_step": 491093, "epoch": 2923} {"train_loss": -12.014606475830078, "global_step": 491094, "epoch": 2923} {"train_loss": -11.971738815307617, "global_step": 491095, "epoch": 2923} {"train_loss": -12.44127368927002, "global_step": 491096, "epoch": 2923} {"train_loss": -12.202285766601562, "global_step": 491097, "epoch": 2923} {"train_loss": -12.256612777709961, "global_step": 491098, "epoch": 2923} {"train_loss": -12.323369026184082, "global_step": 491099, "epoch": 2923} {"train_loss": -12.227104187011719, "global_step": 491100, "epoch": 2923} {"train_loss": -12.436394691467285, "global_step": 491101, "epoch": 2923} {"train_loss": -12.182388305664062, "global_step": 491102, "epoch": 2923} {"train_loss": -12.53795337677002, "global_step": 491103, "epoch": 2923} {"train_loss": -12.193195343017578, "global_step": 491104, "epoch": 2923} {"train_loss": -11.672521591186523, "global_step": 491105, "epoch": 2923} {"train_loss": -12.279603958129883, "global_step": 491106, "epoch": 2923} {"train_loss": -11.963502883911133, "global_step": 491107, "epoch": 2923} {"train_loss": -12.133115768432617, "global_step": 491108, "epoch": 2923} {"train_loss": -11.860719680786133, "global_step": 491109, "epoch": 2923} {"train_loss": -11.930855751037598, "global_step": 491110, "epoch": 2923} {"train_loss": -12.383377075195312, "global_step": 491111, "epoch": 2923} {"train_loss": -10.961064338684082, "global_step": 491112, "epoch": 2923} {"train_loss": -11.654438018798828, "global_step": 491113, "epoch": 2923} {"train_loss": -11.829641342163086, "global_step": 491114, "epoch": 2923} {"train_loss": -12.109003067016602, "global_step": 491115, "epoch": 2923} {"train_loss": -11.88105583190918, "global_step": 491116, "epoch": 2923} {"train_loss": -11.123146057128906, "global_step": 491117, "epoch": 2923} {"train_loss": -11.592056274414062, "global_step": 491118, "epoch": 2923} {"train_loss": -11.604114532470703, "global_step": 491119, "epoch": 2923} {"train_loss": -12.240582466125488, "global_step": 491120, "epoch": 2923} {"train_loss": -11.337621688842773, "global_step": 491121, "epoch": 2923} {"train_loss": -12.243227005004883, "global_step": 491122, "epoch": 2923} {"train_loss": -11.381372451782227, "global_step": 491123, "epoch": 2923} {"train_loss": -12.497666358947754, "global_step": 491124, "epoch": 2923} {"train_loss": -11.848224639892578, "global_step": 491125, "epoch": 2923} {"train_loss": -12.100522994995117, "global_step": 491126, "epoch": 2923} {"train_loss": -12.002290725708008, "global_step": 491127, "epoch": 2923} {"train_loss": -12.244461059570312, "global_step": 491128, "epoch": 2923} {"train_loss": -12.010385513305664, "global_step": 491129, "epoch": 2923} {"train_loss": -12.126984596252441, "global_step": 491130, "epoch": 2923} {"train_loss": -12.175760269165039, "global_step": 491131, "epoch": 2923} {"train_loss": -11.913026809692383, "global_step": 491132, "epoch": 2923} {"train_loss": -12.069348335266113, "global_step": 491133, "epoch": 2923} {"train_loss": -11.876224517822266, "global_step": 491134, "epoch": 2923} {"train_loss": -12.419170379638672, "global_step": 491135, "epoch": 2923} {"train_loss": -11.669027328491211, "global_step": 491136, "epoch": 2923} {"train_loss": -12.073835372924805, "global_step": 491137, "epoch": 2923} {"train_loss": -11.68351936340332, "global_step": 491138, "epoch": 2923} {"train_loss": -12.361242294311523, "global_step": 491139, "epoch": 2923} {"train_loss": -12.062875747680664, "global_step": 491140, "epoch": 2923} {"train_loss": -12.315826416015625, "global_step": 491141, "epoch": 2923} {"train_loss": -12.076269149780273, "global_step": 491142, "epoch": 2923} {"train_loss": -11.883376121520996, "global_step": 491143, "epoch": 2923} {"train_loss": -12.430303573608398, "global_step": 491144, "epoch": 2923} {"train_loss": -12.447380065917969, "global_step": 491145, "epoch": 2923} {"train_loss": -12.11751651763916, "global_step": 491146, "epoch": 2923} {"train_loss": -12.629283905029297, "global_step": 491147, "epoch": 2923} {"train_loss": -12.086181640625, "global_step": 491148, "epoch": 2923} {"train_loss": -12.118139266967773, "global_step": 491149, "epoch": 2923} {"train_loss": -11.862434387207031, "global_step": 491150, "epoch": 2923} {"train_loss": -12.15621566772461, "global_step": 491151, "epoch": 2923} {"train_loss": -12.287071228027344, "global_step": 491152, "epoch": 2923} {"train_loss": -11.510319709777832, "global_step": 491153, "epoch": 2923} {"train_loss": -11.983617782592773, "global_step": 491154, "epoch": 2923} {"train_loss": -11.753982543945312, "global_step": 491155, "epoch": 2923} {"train_loss": -11.721664428710938, "global_step": 491156, "epoch": 2923} {"train_loss": -12.114544868469238, "global_step": 491157, "epoch": 2923} {"train_loss": -10.585670471191406, "global_step": 491158, "epoch": 2923} {"train_loss": -11.558250427246094, "global_step": 491159, "epoch": 2923} {"train_loss": -10.587943077087402, "global_step": 491160, "epoch": 2923} {"train_loss": -10.246091842651367, "global_step": 491161, "epoch": 2923} {"train_loss": -9.960002899169922, "global_step": 491162, "epoch": 2923} {"train_loss": -11.854581832885742, "global_step": 491163, "epoch": 2923} {"train_loss": -10.652291297912598, "global_step": 491164, "epoch": 2923} {"train_loss": -10.162956237792969, "global_step": 491165, "epoch": 2923} {"train_loss": -11.825392723083496, "global_step": 491166, "epoch": 2923} {"train_loss": -10.431742668151855, "global_step": 491167, "epoch": 2923} {"train_loss": -12.032312393188477, "global_step": 491168, "epoch": 2923} {"train_loss": -9.431421279907227, "global_step": 491169, "epoch": 2923} {"train_loss": -12.179887771606445, "global_step": 491170, "epoch": 2923} {"train_loss": -11.050888061523438, "global_step": 491171, "epoch": 2923} {"train_loss": -11.873407363891602, "global_step": 491172, "epoch": 2923} {"train_loss": -11.99496841430664, "global_step": 491173, "epoch": 2923} {"train_loss": -11.782167434692383, "global_step": 491174, "epoch": 2923} {"train_loss": -11.912206649780273, "global_step": 491175, "epoch": 2923} {"train_loss": -11.855293273925781, "global_step": 491176, "epoch": 2923} {"train_loss": -11.326278686523438, "global_step": 491177, "epoch": 2923} {"train_loss": -12.26978588104248, "global_step": 491178, "epoch": 2923} {"train_loss": -12.05036735534668, "global_step": 491179, "epoch": 2923} {"train_loss": -12.131237983703613, "global_step": 491180, "epoch": 2923} {"train_loss": -12.132286071777344, "global_step": 491181, "epoch": 2923} {"train_loss": -12.061199188232422, "global_step": 491182, "epoch": 2923} {"train_loss": -12.451936721801758, "global_step": 491183, "epoch": 2923} {"train_loss": -12.248802185058594, "global_step": 491184, "epoch": 2923} {"train_loss": -12.400463104248047, "global_step": 491185, "epoch": 2923} {"train_loss": -11.987998962402344, "global_step": 491186, "epoch": 2923} {"train_loss": -12.309164047241211, "global_step": 491187, "epoch": 2923} {"train_loss": -12.36269760131836, "global_step": 491188, "epoch": 2923} {"train_loss": -12.229979515075684, "global_step": 491189, "epoch": 2923} {"train_loss": -12.328826904296875, "global_step": 491190, "epoch": 2923} {"train_loss": -12.450878143310547, "global_step": 491191, "epoch": 2923} {"train_loss": -12.557563781738281, "global_step": 491192, "epoch": 2923} {"train_loss": -12.463332176208496, "global_step": 491193, "epoch": 2923} {"train_loss": -12.297473907470703, "global_step": 491194, "epoch": 2923} {"train_loss": -12.548624038696289, "global_step": 491195, "epoch": 2923} {"train_loss": -12.407402038574219, "global_step": 491196, "epoch": 2923} {"train_loss": -12.708038330078125, "global_step": 491197, "epoch": 2923} {"train_loss": -12.463872909545898, "global_step": 491198, "epoch": 2923} {"train_loss": -12.239326477050781, "global_step": 491199, "epoch": 2923} {"train_loss": -12.680489540100098, "global_step": 491200, "epoch": 2923} {"train_loss": -12.476444244384766, "global_step": 491201, "epoch": 2923} {"train_loss": -12.562516212463379, "global_step": 491202, "epoch": 2923} {"train_loss": -12.41784381866455, "global_step": 491203, "epoch": 2923} {"train_loss": -12.623679161071777, "global_step": 491204, "epoch": 2923} {"train_loss": -12.74715805053711, "global_step": 491205, "epoch": 2923} {"train_loss": -12.543401718139648, "global_step": 491206, "epoch": 2923} {"train_loss": -12.857486724853516, "global_step": 491207, "epoch": 2923} {"train_loss": -12.582439422607422, "global_step": 491208, "epoch": 2923} {"train_loss": -12.731977462768555, "global_step": 491209, "epoch": 2923} {"train_loss": -12.665969848632812, "global_step": 491210, "epoch": 2923} {"train_loss": -12.681285858154297, "global_step": 491211, "epoch": 2923} {"train_loss": -12.782195091247559, "global_step": 491212, "epoch": 2923} {"train_loss": -12.686010360717773, "global_step": 491213, "epoch": 2923} {"train_loss": -12.656551361083984, "global_step": 491214, "epoch": 2923} {"train_loss": -12.609708786010742, "global_step": 491215, "epoch": 2923} {"train_loss": -12.754350662231445, "global_step": 491216, "epoch": 2923} {"train_loss": -12.747132301330566, "global_step": 491217, "epoch": 2923} {"train_loss": -12.482105255126953, "global_step": 491218, "epoch": 2923} {"train_loss": -12.849481582641602, "global_step": 491219, "epoch": 2923} {"train_loss": -12.681329727172852, "global_step": 491220, "epoch": 2923} {"train_loss": -12.940289497375488, "global_step": 491221, "epoch": 2923} {"train_loss": -12.811180114746094, "global_step": 491222, "epoch": 2923} {"train_loss": -12.681968688964844, "global_step": 491223, "epoch": 2923} {"train_loss": -12.967510223388672, "global_step": 491224, "epoch": 2923} {"train_loss": -12.85767936706543, "global_step": 491225, "epoch": 2923} {"train_loss": -12.826772689819336, "global_step": 491226, "epoch": 2923} {"train_loss": -12.771488189697266, "global_step": 491227, "epoch": 2923} {"train_loss": -12.827003479003906, "global_step": 491228, "epoch": 2923} {"train_loss": -12.796731948852539, "global_step": 491229, "epoch": 2923} {"train_loss": -12.835617065429688, "global_step": 491230, "epoch": 2923} {"train_loss": -12.043249107542492, "global_step": 491231, "epoch": 2923, "val_loss": 320591.59375} {"train_loss": -13.062067031860352, "global_step": 491232, "epoch": 2924} {"train_loss": -13.01869010925293, "global_step": 491233, "epoch": 2924} {"train_loss": -12.707221984863281, "global_step": 491234, "epoch": 2924} {"train_loss": -13.007389068603516, "global_step": 491235, "epoch": 2924} {"train_loss": -12.979715347290039, "global_step": 491236, "epoch": 2924} {"train_loss": -12.854613304138184, "global_step": 491237, "epoch": 2924} {"train_loss": -13.163765907287598, "global_step": 491238, "epoch": 2924} {"train_loss": -12.705808639526367, "global_step": 491239, "epoch": 2924} {"train_loss": -12.944826126098633, "global_step": 491240, "epoch": 2924} {"train_loss": -13.035258293151855, "global_step": 491241, "epoch": 2924} {"train_loss": -12.96461009979248, "global_step": 491242, "epoch": 2924} {"train_loss": -13.054559707641602, "global_step": 491243, "epoch": 2924} {"train_loss": -13.233911514282227, "global_step": 491244, "epoch": 2924} {"train_loss": -12.999849319458008, "global_step": 491245, "epoch": 2924} {"train_loss": -12.734973907470703, "global_step": 491246, "epoch": 2924} {"train_loss": -12.942695617675781, "global_step": 491247, "epoch": 2924} {"train_loss": -12.94039249420166, "global_step": 491248, "epoch": 2924} {"train_loss": -12.784250259399414, "global_step": 491249, "epoch": 2924} {"train_loss": -13.040790557861328, "global_step": 491250, "epoch": 2924} {"train_loss": -12.754219055175781, "global_step": 491251, "epoch": 2924} {"train_loss": -12.708221435546875, "global_step": 491252, "epoch": 2924} {"train_loss": -13.07635498046875, "global_step": 491253, "epoch": 2924} {"train_loss": -12.728933334350586, "global_step": 491254, "epoch": 2924} {"train_loss": -12.767980575561523, "global_step": 491255, "epoch": 2924} {"train_loss": -12.833268165588379, "global_step": 491256, "epoch": 2924} {"train_loss": -12.790739059448242, "global_step": 491257, "epoch": 2924} {"train_loss": -12.886024475097656, "global_step": 491258, "epoch": 2924} {"train_loss": -12.900514602661133, "global_step": 491259, "epoch": 2924} {"train_loss": -12.482674598693848, "global_step": 491260, "epoch": 2924} {"train_loss": -12.79794692993164, "global_step": 491261, "epoch": 2924} {"train_loss": -12.705116271972656, "global_step": 491262, "epoch": 2924} {"train_loss": -12.39706802368164, "global_step": 491263, "epoch": 2924} {"train_loss": -12.554841995239258, "global_step": 491264, "epoch": 2924} {"train_loss": -12.42087173461914, "global_step": 491265, "epoch": 2924} {"train_loss": -12.047849655151367, "global_step": 491266, "epoch": 2924} {"train_loss": -12.333120346069336, "global_step": 491267, "epoch": 2924} {"train_loss": -12.326311111450195, "global_step": 491268, "epoch": 2924} {"train_loss": -12.161057472229004, "global_step": 491269, "epoch": 2924} {"train_loss": -12.18742561340332, "global_step": 491270, "epoch": 2924} {"train_loss": -12.669570922851562, "global_step": 491271, "epoch": 2924} {"train_loss": -12.704133987426758, "global_step": 491272, "epoch": 2924} {"train_loss": -12.687021255493164, "global_step": 491273, "epoch": 2924} {"train_loss": -12.795751571655273, "global_step": 491274, "epoch": 2924} {"train_loss": -11.824082374572754, "global_step": 491275, "epoch": 2924} {"train_loss": -11.896541595458984, "global_step": 491276, "epoch": 2924} {"train_loss": -11.938528060913086, "global_step": 491277, "epoch": 2924} {"train_loss": -11.916243553161621, "global_step": 491278, "epoch": 2924} {"train_loss": -11.081281661987305, "global_step": 491279, "epoch": 2924} {"train_loss": -10.164182662963867, "global_step": 491280, "epoch": 2924} {"train_loss": -10.751235961914062, "global_step": 491281, "epoch": 2924} {"train_loss": -11.059185981750488, "global_step": 491282, "epoch": 2924} {"train_loss": -10.994020462036133, "global_step": 491283, "epoch": 2924} {"train_loss": -10.644713401794434, "global_step": 491284, "epoch": 2924} {"train_loss": -10.936763763427734, "global_step": 491285, "epoch": 2924} {"train_loss": -12.100271224975586, "global_step": 491286, "epoch": 2924} {"train_loss": -10.414287567138672, "global_step": 491287, "epoch": 2924} {"train_loss": -10.523316383361816, "global_step": 491288, "epoch": 2924} {"train_loss": -11.195009231567383, "global_step": 491289, "epoch": 2924} {"train_loss": -10.589876174926758, "global_step": 491290, "epoch": 2924} {"train_loss": -10.307767868041992, "global_step": 491291, "epoch": 2924} {"train_loss": -11.25454330444336, "global_step": 491292, "epoch": 2924} {"train_loss": -9.926979064941406, "global_step": 491293, "epoch": 2924} {"train_loss": -10.108386993408203, "global_step": 491294, "epoch": 2924} {"train_loss": -11.804512023925781, "global_step": 491295, "epoch": 2924} {"train_loss": -10.61143970489502, "global_step": 491296, "epoch": 2924} {"train_loss": -10.904687881469727, "global_step": 491297, "epoch": 2924} {"train_loss": -11.309222221374512, "global_step": 491298, "epoch": 2924} {"train_loss": -10.226688385009766, "global_step": 491299, "epoch": 2924} {"train_loss": -11.43710708618164, "global_step": 491300, "epoch": 2924} {"train_loss": -11.448616027832031, "global_step": 491301, "epoch": 2924} {"train_loss": -9.880796432495117, "global_step": 491302, "epoch": 2924} {"train_loss": -11.852272033691406, "global_step": 491303, "epoch": 2924} {"train_loss": -10.370458602905273, "global_step": 491304, "epoch": 2924} {"train_loss": -10.790546417236328, "global_step": 491305, "epoch": 2924} {"train_loss": -11.398780822753906, "global_step": 491306, "epoch": 2924} {"train_loss": -11.149789810180664, "global_step": 491307, "epoch": 2924} {"train_loss": -11.320556640625, "global_step": 491308, "epoch": 2924} {"train_loss": -12.135544776916504, "global_step": 491309, "epoch": 2924} {"train_loss": -11.44735336303711, "global_step": 491310, "epoch": 2924} {"train_loss": -11.975754737854004, "global_step": 491311, "epoch": 2924} {"train_loss": -11.496820449829102, "global_step": 491312, "epoch": 2924} {"train_loss": -11.096273422241211, "global_step": 491313, "epoch": 2924} {"train_loss": -11.393165588378906, "global_step": 491314, "epoch": 2924} {"train_loss": -11.733668327331543, "global_step": 491315, "epoch": 2924} {"train_loss": -11.475648880004883, "global_step": 491316, "epoch": 2924} {"train_loss": -11.535228729248047, "global_step": 491317, "epoch": 2924} {"train_loss": -12.093191146850586, "global_step": 491318, "epoch": 2924} {"train_loss": -11.812355041503906, "global_step": 491319, "epoch": 2924} {"train_loss": -12.22778034210205, "global_step": 491320, "epoch": 2924} {"train_loss": -11.919526100158691, "global_step": 491321, "epoch": 2924} {"train_loss": -12.204949378967285, "global_step": 491322, "epoch": 2924} {"train_loss": -12.111994743347168, "global_step": 491323, "epoch": 2924} {"train_loss": -12.435093879699707, "global_step": 491324, "epoch": 2924} {"train_loss": -11.878762245178223, "global_step": 491325, "epoch": 2924} {"train_loss": -12.478798866271973, "global_step": 491326, "epoch": 2924} {"train_loss": -12.332185745239258, "global_step": 491327, "epoch": 2924} {"train_loss": -12.452142715454102, "global_step": 491328, "epoch": 2924} {"train_loss": -12.361410140991211, "global_step": 491329, "epoch": 2924} {"train_loss": -12.357755661010742, "global_step": 491330, "epoch": 2924} {"train_loss": -12.325950622558594, "global_step": 491331, "epoch": 2924} {"train_loss": -12.411749839782715, "global_step": 491332, "epoch": 2924} {"train_loss": -12.513727188110352, "global_step": 491333, "epoch": 2924} {"train_loss": -12.349328994750977, "global_step": 491334, "epoch": 2924} {"train_loss": -12.371267318725586, "global_step": 491335, "epoch": 2924} {"train_loss": -12.209518432617188, "global_step": 491336, "epoch": 2924} {"train_loss": -12.517847061157227, "global_step": 491337, "epoch": 2924} {"train_loss": -12.414475440979004, "global_step": 491338, "epoch": 2924} {"train_loss": -12.034218788146973, "global_step": 491339, "epoch": 2924} {"train_loss": -12.290904998779297, "global_step": 491340, "epoch": 2924} {"train_loss": -12.438655853271484, "global_step": 491341, "epoch": 2924} {"train_loss": -12.238618850708008, "global_step": 491342, "epoch": 2924} {"train_loss": -12.362359046936035, "global_step": 491343, "epoch": 2924} {"train_loss": -12.119915962219238, "global_step": 491344, "epoch": 2924} {"train_loss": -12.229753494262695, "global_step": 491345, "epoch": 2924} {"train_loss": -12.22355842590332, "global_step": 491346, "epoch": 2924} {"train_loss": -12.061986923217773, "global_step": 491347, "epoch": 2924} {"train_loss": -12.132606506347656, "global_step": 491348, "epoch": 2924} {"train_loss": -12.523649215698242, "global_step": 491349, "epoch": 2924} {"train_loss": -12.513565063476562, "global_step": 491350, "epoch": 2924} {"train_loss": -12.498339653015137, "global_step": 491351, "epoch": 2924} {"train_loss": -12.41050910949707, "global_step": 491352, "epoch": 2924} {"train_loss": -12.566272735595703, "global_step": 491353, "epoch": 2924} {"train_loss": -12.366243362426758, "global_step": 491354, "epoch": 2924} {"train_loss": -12.409573554992676, "global_step": 491355, "epoch": 2924} {"train_loss": -12.441237449645996, "global_step": 491356, "epoch": 2924} {"train_loss": -12.480019569396973, "global_step": 491357, "epoch": 2924} {"train_loss": -12.176674842834473, "global_step": 491358, "epoch": 2924} {"train_loss": -12.506942749023438, "global_step": 491359, "epoch": 2924} {"train_loss": -12.465312004089355, "global_step": 491360, "epoch": 2924} {"train_loss": -12.406633377075195, "global_step": 491361, "epoch": 2924} {"train_loss": -12.584527969360352, "global_step": 491362, "epoch": 2924} {"train_loss": -12.314870834350586, "global_step": 491363, "epoch": 2924} {"train_loss": -12.608543395996094, "global_step": 491364, "epoch": 2924} {"train_loss": -12.375659942626953, "global_step": 491365, "epoch": 2924} {"train_loss": -12.413928985595703, "global_step": 491366, "epoch": 2924} {"train_loss": -12.54197883605957, "global_step": 491367, "epoch": 2924} {"train_loss": -12.066993713378906, "global_step": 491368, "epoch": 2924} {"train_loss": -12.789240837097168, "global_step": 491369, "epoch": 2924} {"train_loss": -12.34469985961914, "global_step": 491370, "epoch": 2924} {"train_loss": -12.621070861816406, "global_step": 491371, "epoch": 2924} {"train_loss": -12.521820068359375, "global_step": 491372, "epoch": 2924} {"train_loss": -12.292625427246094, "global_step": 491373, "epoch": 2924} {"train_loss": -12.862180709838867, "global_step": 491374, "epoch": 2924} {"train_loss": -12.216697692871094, "global_step": 491375, "epoch": 2924} {"train_loss": -12.682153701782227, "global_step": 491376, "epoch": 2924} {"train_loss": -12.599899291992188, "global_step": 491377, "epoch": 2924} {"train_loss": -12.537275314331055, "global_step": 491378, "epoch": 2924} {"train_loss": -12.588178634643555, "global_step": 491379, "epoch": 2924} {"train_loss": -12.8170804977417, "global_step": 491380, "epoch": 2924} {"train_loss": -12.68227767944336, "global_step": 491381, "epoch": 2924} {"train_loss": -12.878131866455078, "global_step": 491382, "epoch": 2924} {"train_loss": -12.269315719604492, "global_step": 491383, "epoch": 2924} {"train_loss": -12.739679336547852, "global_step": 491384, "epoch": 2924} {"train_loss": -12.294591903686523, "global_step": 491385, "epoch": 2924} {"train_loss": -13.001102447509766, "global_step": 491386, "epoch": 2924} {"train_loss": -12.322420120239258, "global_step": 491387, "epoch": 2924} {"train_loss": -12.63843059539795, "global_step": 491388, "epoch": 2924} {"train_loss": -12.814789772033691, "global_step": 491389, "epoch": 2924} {"train_loss": -12.769761085510254, "global_step": 491390, "epoch": 2924} {"train_loss": -12.812828063964844, "global_step": 491391, "epoch": 2924} {"train_loss": -12.684440612792969, "global_step": 491392, "epoch": 2924} {"train_loss": -12.968149185180664, "global_step": 491393, "epoch": 2924} {"train_loss": -12.667612075805664, "global_step": 491394, "epoch": 2924} {"train_loss": -12.888944625854492, "global_step": 491395, "epoch": 2924} {"train_loss": -12.708383560180664, "global_step": 491396, "epoch": 2924} {"train_loss": -12.659584045410156, "global_step": 491397, "epoch": 2924} {"train_loss": -12.572212219238281, "global_step": 491398, "epoch": 2924} {"train_loss": -12.189606785774231, "global_step": 491399, "epoch": 2924, "val_loss": 319692.21875} {"train_loss": -12.713069915771484, "global_step": 491400, "epoch": 2925} {"train_loss": -12.58453369140625, "global_step": 491401, "epoch": 2925} {"train_loss": -12.860852241516113, "global_step": 491402, "epoch": 2925} {"train_loss": -12.574012756347656, "global_step": 491403, "epoch": 2925} {"train_loss": -12.538721084594727, "global_step": 491404, "epoch": 2925} {"train_loss": -12.823099136352539, "global_step": 491405, "epoch": 2925} {"train_loss": -12.576106071472168, "global_step": 491406, "epoch": 2925} {"train_loss": -12.558121681213379, "global_step": 491407, "epoch": 2925} {"train_loss": -12.889653205871582, "global_step": 491408, "epoch": 2925} {"train_loss": -12.736775398254395, "global_step": 491409, "epoch": 2925} {"train_loss": -12.841143608093262, "global_step": 491410, "epoch": 2925} {"train_loss": -12.912569046020508, "global_step": 491411, "epoch": 2925} {"train_loss": -12.61482048034668, "global_step": 491412, "epoch": 2925} {"train_loss": -13.123941421508789, "global_step": 491413, "epoch": 2925} {"train_loss": -12.076974868774414, "global_step": 491414, "epoch": 2925} {"train_loss": -12.541196823120117, "global_step": 491415, "epoch": 2925} {"train_loss": -12.65914249420166, "global_step": 491416, "epoch": 2925} {"train_loss": -12.306474685668945, "global_step": 491417, "epoch": 2925} {"train_loss": -12.257509231567383, "global_step": 491418, "epoch": 2925} {"train_loss": -12.413256645202637, "global_step": 491419, "epoch": 2925} {"train_loss": -11.306747436523438, "global_step": 491420, "epoch": 2925} {"train_loss": -12.447850227355957, "global_step": 491421, "epoch": 2925} {"train_loss": -10.590587615966797, "global_step": 491422, "epoch": 2925} {"train_loss": -11.540852546691895, "global_step": 491423, "epoch": 2925} {"train_loss": -11.600224494934082, "global_step": 491424, "epoch": 2925} {"train_loss": -11.624351501464844, "global_step": 491425, "epoch": 2925} {"train_loss": -11.289953231811523, "global_step": 491426, "epoch": 2925} {"train_loss": -10.584988594055176, "global_step": 491427, "epoch": 2925} {"train_loss": -10.51016616821289, "global_step": 491428, "epoch": 2925} {"train_loss": -11.763345718383789, "global_step": 491429, "epoch": 2925} {"train_loss": -11.004133224487305, "global_step": 491430, "epoch": 2925} {"train_loss": -11.280536651611328, "global_step": 491431, "epoch": 2925} {"train_loss": -11.12276840209961, "global_step": 491432, "epoch": 2925} {"train_loss": -11.767943382263184, "global_step": 491433, "epoch": 2925} {"train_loss": -11.366806030273438, "global_step": 491434, "epoch": 2925} {"train_loss": -11.984469413757324, "global_step": 491435, "epoch": 2925} {"train_loss": -10.938531875610352, "global_step": 491436, "epoch": 2925} {"train_loss": -11.942108154296875, "global_step": 491437, "epoch": 2925} {"train_loss": -11.691431045532227, "global_step": 491438, "epoch": 2925} {"train_loss": -11.463607788085938, "global_step": 491439, "epoch": 2925} {"train_loss": -12.095972061157227, "global_step": 491440, "epoch": 2925} {"train_loss": -11.221260070800781, "global_step": 491441, "epoch": 2925} {"train_loss": -11.489286422729492, "global_step": 491442, "epoch": 2925} {"train_loss": -12.007207870483398, "global_step": 491443, "epoch": 2925} {"train_loss": -11.544031143188477, "global_step": 491444, "epoch": 2925} {"train_loss": -11.68190860748291, "global_step": 491445, "epoch": 2925} {"train_loss": -11.687446594238281, "global_step": 491446, "epoch": 2925} {"train_loss": -12.53641128540039, "global_step": 491447, "epoch": 2925} {"train_loss": -11.803267478942871, "global_step": 491448, "epoch": 2925} {"train_loss": -12.51062297821045, "global_step": 491449, "epoch": 2925} {"train_loss": -12.436735153198242, "global_step": 491450, "epoch": 2925} {"train_loss": -12.284876823425293, "global_step": 491451, "epoch": 2925} {"train_loss": -12.600641250610352, "global_step": 491452, "epoch": 2925} {"train_loss": -12.23280143737793, "global_step": 491453, "epoch": 2925} {"train_loss": -12.344892501831055, "global_step": 491454, "epoch": 2925} {"train_loss": -12.2100830078125, "global_step": 491455, "epoch": 2925} {"train_loss": -12.317617416381836, "global_step": 491456, "epoch": 2925} {"train_loss": -12.215621948242188, "global_step": 491457, "epoch": 2925} {"train_loss": -12.573884963989258, "global_step": 491458, "epoch": 2925} {"train_loss": -12.53268814086914, "global_step": 491459, "epoch": 2925} {"train_loss": -12.549116134643555, "global_step": 491460, "epoch": 2925} {"train_loss": -12.588980674743652, "global_step": 491461, "epoch": 2925} {"train_loss": -12.354650497436523, "global_step": 491462, "epoch": 2925} {"train_loss": -12.469033241271973, "global_step": 491463, "epoch": 2925} {"train_loss": -12.6256742477417, "global_step": 491464, "epoch": 2925} {"train_loss": -12.411087036132812, "global_step": 491465, "epoch": 2925} {"train_loss": -12.44157886505127, "global_step": 491466, "epoch": 2925} {"train_loss": -12.594837188720703, "global_step": 491467, "epoch": 2925} {"train_loss": -12.297036170959473, "global_step": 491468, "epoch": 2925} {"train_loss": -12.491111755371094, "global_step": 491469, "epoch": 2925} {"train_loss": -12.660459518432617, "global_step": 491470, "epoch": 2925} {"train_loss": -12.856246948242188, "global_step": 491471, "epoch": 2925} {"train_loss": -12.862021446228027, "global_step": 491472, "epoch": 2925} {"train_loss": -12.729989051818848, "global_step": 491473, "epoch": 2925} {"train_loss": -12.714971542358398, "global_step": 491474, "epoch": 2925} {"train_loss": -12.701447486877441, "global_step": 491475, "epoch": 2925} {"train_loss": -12.7789945602417, "global_step": 491476, "epoch": 2925} {"train_loss": -12.235904693603516, "global_step": 491477, "epoch": 2925} {"train_loss": -12.680330276489258, "global_step": 491478, "epoch": 2925} {"train_loss": -12.881450653076172, "global_step": 491479, "epoch": 2925} {"train_loss": -12.852607727050781, "global_step": 491480, "epoch": 2925} {"train_loss": -12.53471565246582, "global_step": 491481, "epoch": 2925} {"train_loss": -12.599870681762695, "global_step": 491482, "epoch": 2925} {"train_loss": -12.879554748535156, "global_step": 491483, "epoch": 2925} {"train_loss": -12.73889446258545, "global_step": 491484, "epoch": 2925} {"train_loss": -12.803618431091309, "global_step": 491485, "epoch": 2925} {"train_loss": -12.866976737976074, "global_step": 491486, "epoch": 2925} {"train_loss": -12.763507843017578, "global_step": 491487, "epoch": 2925} {"train_loss": -12.930265426635742, "global_step": 491488, "epoch": 2925} {"train_loss": -12.87767219543457, "global_step": 491489, "epoch": 2925} {"train_loss": -12.870624542236328, "global_step": 491490, "epoch": 2925} {"train_loss": -12.656911849975586, "global_step": 491491, "epoch": 2925} {"train_loss": -12.797571182250977, "global_step": 491492, "epoch": 2925} {"train_loss": -12.74135971069336, "global_step": 491493, "epoch": 2925} {"train_loss": -12.90034294128418, "global_step": 491494, "epoch": 2925} {"train_loss": -12.83060359954834, "global_step": 491495, "epoch": 2925} {"train_loss": -12.874990463256836, "global_step": 491496, "epoch": 2925} {"train_loss": -12.990066528320312, "global_step": 491497, "epoch": 2925} {"train_loss": -12.857181549072266, "global_step": 491498, "epoch": 2925} {"train_loss": -12.895339012145996, "global_step": 491499, "epoch": 2925} {"train_loss": -12.81169319152832, "global_step": 491500, "epoch": 2925} {"train_loss": -12.761877059936523, "global_step": 491501, "epoch": 2925} {"train_loss": -12.617403984069824, "global_step": 491502, "epoch": 2925} {"train_loss": -12.753565788269043, "global_step": 491503, "epoch": 2925} {"train_loss": -12.991201400756836, "global_step": 491504, "epoch": 2925} {"train_loss": -12.837957382202148, "global_step": 491505, "epoch": 2925} {"train_loss": -12.25198745727539, "global_step": 491506, "epoch": 2925} {"train_loss": -11.946405410766602, "global_step": 491507, "epoch": 2925} {"train_loss": -12.761080741882324, "global_step": 491508, "epoch": 2925} {"train_loss": -12.177204132080078, "global_step": 491509, "epoch": 2925} {"train_loss": -12.561697006225586, "global_step": 491510, "epoch": 2925} {"train_loss": -12.400635719299316, "global_step": 491511, "epoch": 2925} {"train_loss": -12.410350799560547, "global_step": 491512, "epoch": 2925} {"train_loss": -12.688508987426758, "global_step": 491513, "epoch": 2925} {"train_loss": -12.25963020324707, "global_step": 491514, "epoch": 2925} {"train_loss": -12.460317611694336, "global_step": 491515, "epoch": 2925} {"train_loss": -12.743603706359863, "global_step": 491516, "epoch": 2925} {"train_loss": -12.426671981811523, "global_step": 491517, "epoch": 2925} {"train_loss": -11.968149185180664, "global_step": 491518, "epoch": 2925} {"train_loss": -12.314713478088379, "global_step": 491519, "epoch": 2925} {"train_loss": -12.152326583862305, "global_step": 491520, "epoch": 2925} {"train_loss": -12.2781982421875, "global_step": 491521, "epoch": 2925} {"train_loss": -11.843177795410156, "global_step": 491522, "epoch": 2925} {"train_loss": -12.517053604125977, "global_step": 491523, "epoch": 2925} {"train_loss": -11.644615173339844, "global_step": 491524, "epoch": 2925} {"train_loss": -12.300874710083008, "global_step": 491525, "epoch": 2925} {"train_loss": -11.18111515045166, "global_step": 491526, "epoch": 2925} {"train_loss": -12.604854583740234, "global_step": 491527, "epoch": 2925} {"train_loss": -11.211015701293945, "global_step": 491528, "epoch": 2925} {"train_loss": -12.343570709228516, "global_step": 491529, "epoch": 2925} {"train_loss": -11.65286636352539, "global_step": 491530, "epoch": 2925} {"train_loss": -11.375223159790039, "global_step": 491531, "epoch": 2925} {"train_loss": -11.100107192993164, "global_step": 491532, "epoch": 2925} {"train_loss": -11.119879722595215, "global_step": 491533, "epoch": 2925} {"train_loss": -12.244752883911133, "global_step": 491534, "epoch": 2925} {"train_loss": -11.209129333496094, "global_step": 491535, "epoch": 2925} {"train_loss": -11.978399276733398, "global_step": 491536, "epoch": 2925} {"train_loss": -11.208688735961914, "global_step": 491537, "epoch": 2925} {"train_loss": -11.5614013671875, "global_step": 491538, "epoch": 2925} {"train_loss": -10.728620529174805, "global_step": 491539, "epoch": 2925} {"train_loss": -11.061201095581055, "global_step": 491540, "epoch": 2925} {"train_loss": -11.475225448608398, "global_step": 491541, "epoch": 2925} {"train_loss": -10.412256240844727, "global_step": 491542, "epoch": 2925} {"train_loss": -11.308845520019531, "global_step": 491543, "epoch": 2925} {"train_loss": -10.71642017364502, "global_step": 491544, "epoch": 2925} {"train_loss": -11.37283992767334, "global_step": 491545, "epoch": 2925} {"train_loss": -12.150007247924805, "global_step": 491546, "epoch": 2925} {"train_loss": -10.508150100708008, "global_step": 491547, "epoch": 2925} {"train_loss": -12.545622825622559, "global_step": 491548, "epoch": 2925} {"train_loss": -11.776004791259766, "global_step": 491549, "epoch": 2925} {"train_loss": -11.506667137145996, "global_step": 491550, "epoch": 2925} {"train_loss": -12.427237510681152, "global_step": 491551, "epoch": 2925} {"train_loss": -11.505278587341309, "global_step": 491552, "epoch": 2925} {"train_loss": -12.102041244506836, "global_step": 491553, "epoch": 2925} {"train_loss": -10.889243125915527, "global_step": 491554, "epoch": 2925} {"train_loss": -11.722789764404297, "global_step": 491555, "epoch": 2925} {"train_loss": -11.415660858154297, "global_step": 491556, "epoch": 2925} {"train_loss": -11.392870903015137, "global_step": 491557, "epoch": 2925} {"train_loss": -11.8998384475708, "global_step": 491558, "epoch": 2925} {"train_loss": -11.608397483825684, "global_step": 491559, "epoch": 2925} {"train_loss": -11.750946998596191, "global_step": 491560, "epoch": 2925} {"train_loss": -11.810937881469727, "global_step": 491561, "epoch": 2925} {"train_loss": -11.435052871704102, "global_step": 491562, "epoch": 2925} {"train_loss": -10.947250366210938, "global_step": 491563, "epoch": 2925} {"train_loss": -12.124113082885742, "global_step": 491564, "epoch": 2925} {"train_loss": -11.140687942504883, "global_step": 491565, "epoch": 2925} {"train_loss": -11.934783935546875, "global_step": 491566, "epoch": 2925} {"train_loss": -12.128602482023693, "global_step": 491567, "epoch": 2925, "val_loss": 320559.875, "train_action_mse_error": 1.1562210321426392} {"train_loss": -10.940423965454102, "global_step": 491568, "epoch": 2926} {"train_loss": -12.225003242492676, "global_step": 491569, "epoch": 2926} {"train_loss": -11.268386840820312, "global_step": 491570, "epoch": 2926} {"train_loss": -12.221263885498047, "global_step": 491571, "epoch": 2926} {"train_loss": -11.489910125732422, "global_step": 491572, "epoch": 2926} {"train_loss": -11.615055084228516, "global_step": 491573, "epoch": 2926} {"train_loss": -12.135344505310059, "global_step": 491574, "epoch": 2926} {"train_loss": -11.159540176391602, "global_step": 491575, "epoch": 2926} {"train_loss": -12.362634658813477, "global_step": 491576, "epoch": 2926} {"train_loss": -10.87531852722168, "global_step": 491577, "epoch": 2926} {"train_loss": -12.576944351196289, "global_step": 491578, "epoch": 2926} {"train_loss": -11.69588851928711, "global_step": 491579, "epoch": 2926} {"train_loss": -12.11231517791748, "global_step": 491580, "epoch": 2926} {"train_loss": -11.51797866821289, "global_step": 491581, "epoch": 2926} {"train_loss": -12.09972858428955, "global_step": 491582, "epoch": 2926} {"train_loss": -12.226558685302734, "global_step": 491583, "epoch": 2926} {"train_loss": -11.820491790771484, "global_step": 491584, "epoch": 2926} {"train_loss": -12.165855407714844, "global_step": 491585, "epoch": 2926} {"train_loss": -11.49583625793457, "global_step": 491586, "epoch": 2926} {"train_loss": -11.967798233032227, "global_step": 491587, "epoch": 2926} {"train_loss": -12.17618465423584, "global_step": 491588, "epoch": 2926} {"train_loss": -11.711403846740723, "global_step": 491589, "epoch": 2926} {"train_loss": -12.600709915161133, "global_step": 491590, "epoch": 2926} {"train_loss": -11.937084197998047, "global_step": 491591, "epoch": 2926} {"train_loss": -12.34414291381836, "global_step": 491592, "epoch": 2926} {"train_loss": -12.284223556518555, "global_step": 491593, "epoch": 2926} {"train_loss": -12.393943786621094, "global_step": 491594, "epoch": 2926} {"train_loss": -12.627859115600586, "global_step": 491595, "epoch": 2926} {"train_loss": -12.39227294921875, "global_step": 491596, "epoch": 2926} {"train_loss": -12.654747009277344, "global_step": 491597, "epoch": 2926} {"train_loss": -12.426414489746094, "global_step": 491598, "epoch": 2926} {"train_loss": -12.636281967163086, "global_step": 491599, "epoch": 2926} {"train_loss": -12.577749252319336, "global_step": 491600, "epoch": 2926} {"train_loss": -12.276846885681152, "global_step": 491601, "epoch": 2926} {"train_loss": -12.381218910217285, "global_step": 491602, "epoch": 2926} {"train_loss": -12.618995666503906, "global_step": 491603, "epoch": 2926} {"train_loss": -12.508682250976562, "global_step": 491604, "epoch": 2926} {"train_loss": -12.818303108215332, "global_step": 491605, "epoch": 2926} {"train_loss": -12.520759582519531, "global_step": 491606, "epoch": 2926} {"train_loss": -12.583833694458008, "global_step": 491607, "epoch": 2926} {"train_loss": -12.611148834228516, "global_step": 491608, "epoch": 2926} {"train_loss": -12.540027618408203, "global_step": 491609, "epoch": 2926} {"train_loss": -12.71993637084961, "global_step": 491610, "epoch": 2926} {"train_loss": -12.831740379333496, "global_step": 491611, "epoch": 2926} {"train_loss": -12.750280380249023, "global_step": 491612, "epoch": 2926} {"train_loss": -12.553764343261719, "global_step": 491613, "epoch": 2926} {"train_loss": -12.779838562011719, "global_step": 491614, "epoch": 2926} {"train_loss": -12.475992202758789, "global_step": 491615, "epoch": 2926} {"train_loss": -12.764017105102539, "global_step": 491616, "epoch": 2926} {"train_loss": -12.550352096557617, "global_step": 491617, "epoch": 2926} {"train_loss": -12.87304973602295, "global_step": 491618, "epoch": 2926} {"train_loss": -12.7916259765625, "global_step": 491619, "epoch": 2926} {"train_loss": -12.617941856384277, "global_step": 491620, "epoch": 2926} {"train_loss": -12.825822830200195, "global_step": 491621, "epoch": 2926} {"train_loss": -13.000732421875, "global_step": 491622, "epoch": 2926} {"train_loss": -12.770121574401855, "global_step": 491623, "epoch": 2926} {"train_loss": -12.829937934875488, "global_step": 491624, "epoch": 2926} {"train_loss": -12.61835765838623, "global_step": 491625, "epoch": 2926} {"train_loss": -13.042375564575195, "global_step": 491626, "epoch": 2926} {"train_loss": -12.633976936340332, "global_step": 491627, "epoch": 2926} {"train_loss": -12.93332576751709, "global_step": 491628, "epoch": 2926} {"train_loss": -12.897520065307617, "global_step": 491629, "epoch": 2926} {"train_loss": -12.993785858154297, "global_step": 491630, "epoch": 2926} {"train_loss": -13.097878456115723, "global_step": 491631, "epoch": 2926} {"train_loss": -13.071128845214844, "global_step": 491632, "epoch": 2926} {"train_loss": -12.899288177490234, "global_step": 491633, "epoch": 2926} {"train_loss": -12.831365585327148, "global_step": 491634, "epoch": 2926} {"train_loss": -12.802711486816406, "global_step": 491635, "epoch": 2926} {"train_loss": -12.983247756958008, "global_step": 491636, "epoch": 2926} {"train_loss": -12.985008239746094, "global_step": 491637, "epoch": 2926} {"train_loss": -12.832235336303711, "global_step": 491638, "epoch": 2926} {"train_loss": -13.056404113769531, "global_step": 491639, "epoch": 2926} {"train_loss": -12.978230476379395, "global_step": 491640, "epoch": 2926} {"train_loss": -12.78370475769043, "global_step": 491641, "epoch": 2926} {"train_loss": -13.043140411376953, "global_step": 491642, "epoch": 2926} {"train_loss": -12.928224563598633, "global_step": 491643, "epoch": 2926} {"train_loss": -12.876733779907227, "global_step": 491644, "epoch": 2926} {"train_loss": -12.964237213134766, "global_step": 491645, "epoch": 2926} {"train_loss": -12.914589881896973, "global_step": 491646, "epoch": 2926} {"train_loss": -12.830955505371094, "global_step": 491647, "epoch": 2926} {"train_loss": -13.021778106689453, "global_step": 491648, "epoch": 2926} {"train_loss": -12.797582626342773, "global_step": 491649, "epoch": 2926} {"train_loss": -12.815971374511719, "global_step": 491650, "epoch": 2926} {"train_loss": -13.09332275390625, "global_step": 491651, "epoch": 2926} {"train_loss": -12.858827590942383, "global_step": 491652, "epoch": 2926} {"train_loss": -12.906415939331055, "global_step": 491653, "epoch": 2926} {"train_loss": -12.911998748779297, "global_step": 491654, "epoch": 2926} {"train_loss": -12.839134216308594, "global_step": 491655, "epoch": 2926} {"train_loss": -12.836214065551758, "global_step": 491656, "epoch": 2926} {"train_loss": -12.701911926269531, "global_step": 491657, "epoch": 2926} {"train_loss": -13.07608413696289, "global_step": 491658, "epoch": 2926} {"train_loss": -12.921273231506348, "global_step": 491659, "epoch": 2926} {"train_loss": -12.896533966064453, "global_step": 491660, "epoch": 2926} {"train_loss": -12.947511672973633, "global_step": 491661, "epoch": 2926} {"train_loss": -12.836982727050781, "global_step": 491662, "epoch": 2926} {"train_loss": -12.858133316040039, "global_step": 491663, "epoch": 2926} {"train_loss": -12.752449035644531, "global_step": 491664, "epoch": 2926} {"train_loss": -12.20626163482666, "global_step": 491665, "epoch": 2926} {"train_loss": -12.03812026977539, "global_step": 491666, "epoch": 2926} {"train_loss": -12.373254776000977, "global_step": 491667, "epoch": 2926} {"train_loss": -12.931187629699707, "global_step": 491668, "epoch": 2926} {"train_loss": -11.922211647033691, "global_step": 491669, "epoch": 2926} {"train_loss": -11.965461730957031, "global_step": 491670, "epoch": 2926} {"train_loss": -12.716323852539062, "global_step": 491671, "epoch": 2926} {"train_loss": -12.581357955932617, "global_step": 491672, "epoch": 2926} {"train_loss": -12.117973327636719, "global_step": 491673, "epoch": 2926} {"train_loss": -12.733095169067383, "global_step": 491674, "epoch": 2926} {"train_loss": -12.641502380371094, "global_step": 491675, "epoch": 2926} {"train_loss": -12.126291275024414, "global_step": 491676, "epoch": 2926} {"train_loss": -12.276432037353516, "global_step": 491677, "epoch": 2926} {"train_loss": -12.610529899597168, "global_step": 491678, "epoch": 2926} {"train_loss": -12.742629051208496, "global_step": 491679, "epoch": 2926} {"train_loss": -11.857399940490723, "global_step": 491680, "epoch": 2926} {"train_loss": -12.292242050170898, "global_step": 491681, "epoch": 2926} {"train_loss": -12.392448425292969, "global_step": 491682, "epoch": 2926} {"train_loss": -12.237091064453125, "global_step": 491683, "epoch": 2926} {"train_loss": -11.915384292602539, "global_step": 491684, "epoch": 2926} {"train_loss": -11.895007133483887, "global_step": 491685, "epoch": 2926} {"train_loss": -12.726217269897461, "global_step": 491686, "epoch": 2926} {"train_loss": -11.506047248840332, "global_step": 491687, "epoch": 2926} {"train_loss": -12.518117904663086, "global_step": 491688, "epoch": 2926} {"train_loss": -12.17232894897461, "global_step": 491689, "epoch": 2926} {"train_loss": -12.608451843261719, "global_step": 491690, "epoch": 2926} {"train_loss": -12.212194442749023, "global_step": 491691, "epoch": 2926} {"train_loss": -12.286736488342285, "global_step": 491692, "epoch": 2926} {"train_loss": -11.774651527404785, "global_step": 491693, "epoch": 2926} {"train_loss": -12.223369598388672, "global_step": 491694, "epoch": 2926} {"train_loss": -11.735166549682617, "global_step": 491695, "epoch": 2926} {"train_loss": -11.549235343933105, "global_step": 491696, "epoch": 2926} {"train_loss": -11.857213973999023, "global_step": 491697, "epoch": 2926} {"train_loss": -11.509665489196777, "global_step": 491698, "epoch": 2926} {"train_loss": -11.181422233581543, "global_step": 491699, "epoch": 2926} {"train_loss": -11.175165176391602, "global_step": 491700, "epoch": 2926} {"train_loss": -10.45008659362793, "global_step": 491701, "epoch": 2926} {"train_loss": -11.116074562072754, "global_step": 491702, "epoch": 2926} {"train_loss": -10.173645973205566, "global_step": 491703, "epoch": 2926} {"train_loss": -12.329107284545898, "global_step": 491704, "epoch": 2926} {"train_loss": -11.771554946899414, "global_step": 491705, "epoch": 2926} {"train_loss": -11.831186294555664, "global_step": 491706, "epoch": 2926} {"train_loss": -12.36339282989502, "global_step": 491707, "epoch": 2926} {"train_loss": -12.255711555480957, "global_step": 491708, "epoch": 2926} {"train_loss": -11.845346450805664, "global_step": 491709, "epoch": 2926} {"train_loss": -12.165515899658203, "global_step": 491710, "epoch": 2926} {"train_loss": -11.705397605895996, "global_step": 491711, "epoch": 2926} {"train_loss": -11.448259353637695, "global_step": 491712, "epoch": 2926} {"train_loss": -12.017755508422852, "global_step": 491713, "epoch": 2926} {"train_loss": -12.207059860229492, "global_step": 491714, "epoch": 2926} {"train_loss": -11.90025520324707, "global_step": 491715, "epoch": 2926} {"train_loss": -12.74371337890625, "global_step": 491716, "epoch": 2926} {"train_loss": -11.808629989624023, "global_step": 491717, "epoch": 2926} {"train_loss": -11.843291282653809, "global_step": 491718, "epoch": 2926} {"train_loss": -12.304393768310547, "global_step": 491719, "epoch": 2926} {"train_loss": -12.140453338623047, "global_step": 491720, "epoch": 2926} {"train_loss": -12.478752136230469, "global_step": 491721, "epoch": 2926} {"train_loss": -12.264148712158203, "global_step": 491722, "epoch": 2926} {"train_loss": -12.627742767333984, "global_step": 491723, "epoch": 2926} {"train_loss": -12.26922607421875, "global_step": 491724, "epoch": 2926} {"train_loss": -12.781110763549805, "global_step": 491725, "epoch": 2926} {"train_loss": -12.164924621582031, "global_step": 491726, "epoch": 2926} {"train_loss": -12.608419418334961, "global_step": 491727, "epoch": 2926} {"train_loss": -12.399317741394043, "global_step": 491728, "epoch": 2926} {"train_loss": -12.401647567749023, "global_step": 491729, "epoch": 2926} {"train_loss": -12.080524444580078, "global_step": 491730, "epoch": 2926} {"train_loss": -12.824947357177734, "global_step": 491731, "epoch": 2926} {"train_loss": -12.179217338562012, "global_step": 491732, "epoch": 2926} {"train_loss": -12.573829650878906, "global_step": 491733, "epoch": 2926} {"train_loss": -12.542912483215332, "global_step": 491734, "epoch": 2926} {"train_loss": -12.364799868492852, "global_step": 491735, "epoch": 2926, "val_loss": 322452.6875} {"train_loss": -12.568090438842773, "global_step": 491736, "epoch": 2927} {"train_loss": -12.500267028808594, "global_step": 491737, "epoch": 2927} {"train_loss": -12.612037658691406, "global_step": 491738, "epoch": 2927} {"train_loss": -12.544981002807617, "global_step": 491739, "epoch": 2927} {"train_loss": -12.03869915008545, "global_step": 491740, "epoch": 2927} {"train_loss": -12.230962753295898, "global_step": 491741, "epoch": 2927} {"train_loss": -12.259193420410156, "global_step": 491742, "epoch": 2927} {"train_loss": -12.489082336425781, "global_step": 491743, "epoch": 2927} {"train_loss": -12.251485824584961, "global_step": 491744, "epoch": 2927} {"train_loss": -12.449239730834961, "global_step": 491745, "epoch": 2927} {"train_loss": -11.302314758300781, "global_step": 491746, "epoch": 2927} {"train_loss": -12.404155731201172, "global_step": 491747, "epoch": 2927} {"train_loss": -11.941787719726562, "global_step": 491748, "epoch": 2927} {"train_loss": -12.548152923583984, "global_step": 491749, "epoch": 2927} {"train_loss": -11.533138275146484, "global_step": 491750, "epoch": 2927} {"train_loss": -12.546991348266602, "global_step": 491751, "epoch": 2927} {"train_loss": -12.209760665893555, "global_step": 491752, "epoch": 2927} {"train_loss": -11.907569885253906, "global_step": 491753, "epoch": 2927} {"train_loss": -12.685786247253418, "global_step": 491754, "epoch": 2927} {"train_loss": -11.969635963439941, "global_step": 491755, "epoch": 2927} {"train_loss": -12.098854064941406, "global_step": 491756, "epoch": 2927} {"train_loss": -11.735017776489258, "global_step": 491757, "epoch": 2927} {"train_loss": -12.407264709472656, "global_step": 491758, "epoch": 2927} {"train_loss": -12.315132141113281, "global_step": 491759, "epoch": 2927} {"train_loss": -12.096542358398438, "global_step": 491760, "epoch": 2927} {"train_loss": -12.179906845092773, "global_step": 491761, "epoch": 2927} {"train_loss": -11.854466438293457, "global_step": 491762, "epoch": 2927} {"train_loss": -11.766294479370117, "global_step": 491763, "epoch": 2927} {"train_loss": -11.22024154663086, "global_step": 491764, "epoch": 2927} {"train_loss": -12.059088706970215, "global_step": 491765, "epoch": 2927} {"train_loss": -12.084610939025879, "global_step": 491766, "epoch": 2927} {"train_loss": -11.537083625793457, "global_step": 491767, "epoch": 2927} {"train_loss": -12.012020111083984, "global_step": 491768, "epoch": 2927} {"train_loss": -11.458919525146484, "global_step": 491769, "epoch": 2927} {"train_loss": -12.081780433654785, "global_step": 491770, "epoch": 2927} {"train_loss": -12.249439239501953, "global_step": 491771, "epoch": 2927} {"train_loss": -11.512113571166992, "global_step": 491772, "epoch": 2927} {"train_loss": -12.043087005615234, "global_step": 491773, "epoch": 2927} {"train_loss": -11.088043212890625, "global_step": 491774, "epoch": 2927} {"train_loss": -10.857919692993164, "global_step": 491775, "epoch": 2927} {"train_loss": -11.8374662399292, "global_step": 491776, "epoch": 2927} {"train_loss": -10.61265754699707, "global_step": 491777, "epoch": 2927} {"train_loss": -10.289339065551758, "global_step": 491778, "epoch": 2927} {"train_loss": -10.672281265258789, "global_step": 491779, "epoch": 2927} {"train_loss": -10.900590896606445, "global_step": 491780, "epoch": 2927} {"train_loss": -11.090279579162598, "global_step": 491781, "epoch": 2927} {"train_loss": -10.916194915771484, "global_step": 491782, "epoch": 2927} {"train_loss": -11.848655700683594, "global_step": 491783, "epoch": 2927} {"train_loss": -11.429125785827637, "global_step": 491784, "epoch": 2927} {"train_loss": -10.907617568969727, "global_step": 491785, "epoch": 2927} {"train_loss": -10.366155624389648, "global_step": 491786, "epoch": 2927} {"train_loss": -12.014762878417969, "global_step": 491787, "epoch": 2927} {"train_loss": -11.325395584106445, "global_step": 491788, "epoch": 2927} {"train_loss": -12.025564193725586, "global_step": 491789, "epoch": 2927} {"train_loss": -11.211958885192871, "global_step": 491790, "epoch": 2927} {"train_loss": -11.149364471435547, "global_step": 491791, "epoch": 2927} {"train_loss": -11.960733413696289, "global_step": 491792, "epoch": 2927} {"train_loss": -10.886161804199219, "global_step": 491793, "epoch": 2927} {"train_loss": -11.850160598754883, "global_step": 491794, "epoch": 2927} {"train_loss": -11.399291038513184, "global_step": 491795, "epoch": 2927} {"train_loss": -10.974017143249512, "global_step": 491796, "epoch": 2927} {"train_loss": -11.925403594970703, "global_step": 491797, "epoch": 2927} {"train_loss": -11.454429626464844, "global_step": 491798, "epoch": 2927} {"train_loss": -12.149356842041016, "global_step": 491799, "epoch": 2927} {"train_loss": -11.781157493591309, "global_step": 491800, "epoch": 2927} {"train_loss": -12.228046417236328, "global_step": 491801, "epoch": 2927} {"train_loss": -12.230881690979004, "global_step": 491802, "epoch": 2927} {"train_loss": -12.211593627929688, "global_step": 491803, "epoch": 2927} {"train_loss": -12.321889877319336, "global_step": 491804, "epoch": 2927} {"train_loss": -11.900899887084961, "global_step": 491805, "epoch": 2927} {"train_loss": -12.405871391296387, "global_step": 491806, "epoch": 2927} {"train_loss": -12.104391098022461, "global_step": 491807, "epoch": 2927} {"train_loss": -12.336738586425781, "global_step": 491808, "epoch": 2927} {"train_loss": -12.2548828125, "global_step": 491809, "epoch": 2927} {"train_loss": -12.437447547912598, "global_step": 491810, "epoch": 2927} {"train_loss": -12.357450485229492, "global_step": 491811, "epoch": 2927} {"train_loss": -12.147087097167969, "global_step": 491812, "epoch": 2927} {"train_loss": -12.397134780883789, "global_step": 491813, "epoch": 2927} {"train_loss": -12.403070449829102, "global_step": 491814, "epoch": 2927} {"train_loss": -12.659780502319336, "global_step": 491815, "epoch": 2927} {"train_loss": -12.47833251953125, "global_step": 491816, "epoch": 2927} {"train_loss": -12.444245338439941, "global_step": 491817, "epoch": 2927} {"train_loss": -12.362726211547852, "global_step": 491818, "epoch": 2927} {"train_loss": -12.559260368347168, "global_step": 491819, "epoch": 2927} {"train_loss": -12.732357025146484, "global_step": 491820, "epoch": 2927} {"train_loss": -12.505958557128906, "global_step": 491821, "epoch": 2927} {"train_loss": -12.714702606201172, "global_step": 491822, "epoch": 2927} {"train_loss": -12.650232315063477, "global_step": 491823, "epoch": 2927} {"train_loss": -12.344313621520996, "global_step": 491824, "epoch": 2927} {"train_loss": -12.653106689453125, "global_step": 491825, "epoch": 2927} {"train_loss": -12.739187240600586, "global_step": 491826, "epoch": 2927} {"train_loss": -12.377023696899414, "global_step": 491827, "epoch": 2927} {"train_loss": -12.636836051940918, "global_step": 491828, "epoch": 2927} {"train_loss": -12.837906837463379, "global_step": 491829, "epoch": 2927} {"train_loss": -12.666790008544922, "global_step": 491830, "epoch": 2927} {"train_loss": -12.617624282836914, "global_step": 491831, "epoch": 2927} {"train_loss": -12.616625785827637, "global_step": 491832, "epoch": 2927} {"train_loss": -12.632081985473633, "global_step": 491833, "epoch": 2927} {"train_loss": -12.614858627319336, "global_step": 491834, "epoch": 2927} {"train_loss": -12.60673713684082, "global_step": 491835, "epoch": 2927} {"train_loss": -12.95361328125, "global_step": 491836, "epoch": 2927} {"train_loss": -12.74449348449707, "global_step": 491837, "epoch": 2927} {"train_loss": -12.893769264221191, "global_step": 491838, "epoch": 2927} {"train_loss": -12.758633613586426, "global_step": 491839, "epoch": 2927} {"train_loss": -12.771001815795898, "global_step": 491840, "epoch": 2927} {"train_loss": -12.7431058883667, "global_step": 491841, "epoch": 2927} {"train_loss": -12.72844123840332, "global_step": 491842, "epoch": 2927} {"train_loss": -12.801058769226074, "global_step": 491843, "epoch": 2927} {"train_loss": -12.63245964050293, "global_step": 491844, "epoch": 2927} {"train_loss": -12.885381698608398, "global_step": 491845, "epoch": 2927} {"train_loss": -12.9273681640625, "global_step": 491846, "epoch": 2927} {"train_loss": -12.925865173339844, "global_step": 491847, "epoch": 2927} {"train_loss": -12.838991165161133, "global_step": 491848, "epoch": 2927} {"train_loss": -12.735098838806152, "global_step": 491849, "epoch": 2927} {"train_loss": -12.532024383544922, "global_step": 491850, "epoch": 2927} {"train_loss": -12.456184387207031, "global_step": 491851, "epoch": 2927} {"train_loss": -12.61620044708252, "global_step": 491852, "epoch": 2927} {"train_loss": -12.5938081741333, "global_step": 491853, "epoch": 2927} {"train_loss": -12.633445739746094, "global_step": 491854, "epoch": 2927} {"train_loss": -12.869755744934082, "global_step": 491855, "epoch": 2927} {"train_loss": -12.555599212646484, "global_step": 491856, "epoch": 2927} {"train_loss": -12.714211463928223, "global_step": 491857, "epoch": 2927} {"train_loss": -12.800910949707031, "global_step": 491858, "epoch": 2927} {"train_loss": -12.924643516540527, "global_step": 491859, "epoch": 2927} {"train_loss": -12.900594711303711, "global_step": 491860, "epoch": 2927} {"train_loss": -12.727188110351562, "global_step": 491861, "epoch": 2927} {"train_loss": -12.829444885253906, "global_step": 491862, "epoch": 2927} {"train_loss": -12.591766357421875, "global_step": 491863, "epoch": 2927} {"train_loss": -12.948854446411133, "global_step": 491864, "epoch": 2927} {"train_loss": -12.416833877563477, "global_step": 491865, "epoch": 2927} {"train_loss": -12.560062408447266, "global_step": 491866, "epoch": 2927} {"train_loss": -12.183809280395508, "global_step": 491867, "epoch": 2927} {"train_loss": -11.29065227508545, "global_step": 491868, "epoch": 2927} {"train_loss": -12.533876419067383, "global_step": 491869, "epoch": 2927} {"train_loss": -10.385976791381836, "global_step": 491870, "epoch": 2927} {"train_loss": -11.557302474975586, "global_step": 491871, "epoch": 2927} {"train_loss": -10.273563385009766, "global_step": 491872, "epoch": 2927} {"train_loss": -11.174810409545898, "global_step": 491873, "epoch": 2927} {"train_loss": -9.862316131591797, "global_step": 491874, "epoch": 2927} {"train_loss": -10.625621795654297, "global_step": 491875, "epoch": 2927} {"train_loss": -9.606887817382812, "global_step": 491876, "epoch": 2927} {"train_loss": -11.097122192382812, "global_step": 491877, "epoch": 2927} {"train_loss": -8.233292579650879, "global_step": 491878, "epoch": 2927} {"train_loss": -9.06432056427002, "global_step": 491879, "epoch": 2927} {"train_loss": -8.243886947631836, "global_step": 491880, "epoch": 2927} {"train_loss": -7.923403263092041, "global_step": 491881, "epoch": 2927} {"train_loss": -8.65955638885498, "global_step": 491882, "epoch": 2927} {"train_loss": -9.282998085021973, "global_step": 491883, "epoch": 2927} {"train_loss": -7.845685005187988, "global_step": 491884, "epoch": 2927} {"train_loss": -7.686667442321777, "global_step": 491885, "epoch": 2927} {"train_loss": -8.835196495056152, "global_step": 491886, "epoch": 2927} {"train_loss": -8.445551872253418, "global_step": 491887, "epoch": 2927} {"train_loss": -8.785243034362793, "global_step": 491888, "epoch": 2927} {"train_loss": -8.36614990234375, "global_step": 491889, "epoch": 2927} {"train_loss": -8.881332397460938, "global_step": 491890, "epoch": 2927} {"train_loss": -8.965094566345215, "global_step": 491891, "epoch": 2927} {"train_loss": -8.744612693786621, "global_step": 491892, "epoch": 2927} {"train_loss": -8.958131790161133, "global_step": 491893, "epoch": 2927} {"train_loss": -9.659497261047363, "global_step": 491894, "epoch": 2927} {"train_loss": -9.472360610961914, "global_step": 491895, "epoch": 2927} {"train_loss": -9.658076286315918, "global_step": 491896, "epoch": 2927} {"train_loss": -10.320055961608887, "global_step": 491897, "epoch": 2927} {"train_loss": -10.180337905883789, "global_step": 491898, "epoch": 2927} {"train_loss": -10.327194213867188, "global_step": 491899, "epoch": 2927} {"train_loss": -10.451522827148438, "global_step": 491900, "epoch": 2927} {"train_loss": -10.730375289916992, "global_step": 491901, "epoch": 2927} {"train_loss": -10.302421569824219, "global_step": 491902, "epoch": 2927} {"train_loss": -11.641439576943716, "global_step": 491903, "epoch": 2927, "val_loss": 321496.6875} {"train_loss": -10.932873725891113, "global_step": 491904, "epoch": 2928} {"train_loss": -11.17579174041748, "global_step": 491905, "epoch": 2928} {"train_loss": -11.360383987426758, "global_step": 491906, "epoch": 2928} {"train_loss": -11.464259147644043, "global_step": 491907, "epoch": 2928} {"train_loss": -11.21056842803955, "global_step": 491908, "epoch": 2928} {"train_loss": -11.35555648803711, "global_step": 491909, "epoch": 2928} {"train_loss": -11.616806983947754, "global_step": 491910, "epoch": 2928} {"train_loss": -11.75129222869873, "global_step": 491911, "epoch": 2928} {"train_loss": -11.816946029663086, "global_step": 491912, "epoch": 2928} {"train_loss": -11.933036804199219, "global_step": 491913, "epoch": 2928} {"train_loss": -12.027848243713379, "global_step": 491914, "epoch": 2928} {"train_loss": -12.007137298583984, "global_step": 491915, "epoch": 2928} {"train_loss": -12.076025009155273, "global_step": 491916, "epoch": 2928} {"train_loss": -11.92919921875, "global_step": 491917, "epoch": 2928} {"train_loss": -11.989747047424316, "global_step": 491918, "epoch": 2928} {"train_loss": -12.351751327514648, "global_step": 491919, "epoch": 2928} {"train_loss": -12.186749458312988, "global_step": 491920, "epoch": 2928} {"train_loss": -12.165292739868164, "global_step": 491921, "epoch": 2928} {"train_loss": -12.357244491577148, "global_step": 491922, "epoch": 2928} {"train_loss": -12.178485870361328, "global_step": 491923, "epoch": 2928} {"train_loss": -12.495340347290039, "global_step": 491924, "epoch": 2928} {"train_loss": -12.181509017944336, "global_step": 491925, "epoch": 2928} {"train_loss": -12.40673828125, "global_step": 491926, "epoch": 2928} {"train_loss": -12.041749000549316, "global_step": 491927, "epoch": 2928} {"train_loss": -12.271795272827148, "global_step": 491928, "epoch": 2928} {"train_loss": -12.141311645507812, "global_step": 491929, "epoch": 2928} {"train_loss": -12.604480743408203, "global_step": 491930, "epoch": 2928} {"train_loss": -12.356847763061523, "global_step": 491931, "epoch": 2928} {"train_loss": -12.586524963378906, "global_step": 491932, "epoch": 2928} {"train_loss": -12.41234016418457, "global_step": 491933, "epoch": 2928} {"train_loss": -12.690839767456055, "global_step": 491934, "epoch": 2928} {"train_loss": -12.7178316116333, "global_step": 491935, "epoch": 2928} {"train_loss": -12.51930046081543, "global_step": 491936, "epoch": 2928} {"train_loss": -12.68588638305664, "global_step": 491937, "epoch": 2928} {"train_loss": -12.580358505249023, "global_step": 491938, "epoch": 2928} {"train_loss": -12.467955589294434, "global_step": 491939, "epoch": 2928} {"train_loss": -12.606008529663086, "global_step": 491940, "epoch": 2928} {"train_loss": -12.67705249786377, "global_step": 491941, "epoch": 2928} {"train_loss": -12.77747631072998, "global_step": 491942, "epoch": 2928} {"train_loss": -12.667346000671387, "global_step": 491943, "epoch": 2928} {"train_loss": -12.48696517944336, "global_step": 491944, "epoch": 2928} {"train_loss": -12.742792129516602, "global_step": 491945, "epoch": 2928} {"train_loss": -12.802154541015625, "global_step": 491946, "epoch": 2928} {"train_loss": -12.619562149047852, "global_step": 491947, "epoch": 2928} {"train_loss": -12.58962631225586, "global_step": 491948, "epoch": 2928} {"train_loss": -12.803629875183105, "global_step": 491949, "epoch": 2928} {"train_loss": -12.444917678833008, "global_step": 491950, "epoch": 2928} {"train_loss": -12.757009506225586, "global_step": 491951, "epoch": 2928} {"train_loss": -12.706364631652832, "global_step": 491952, "epoch": 2928} {"train_loss": -12.596181869506836, "global_step": 491953, "epoch": 2928} {"train_loss": -12.752435684204102, "global_step": 491954, "epoch": 2928} {"train_loss": -12.843681335449219, "global_step": 491955, "epoch": 2928} {"train_loss": -12.85487174987793, "global_step": 491956, "epoch": 2928} {"train_loss": -12.953165054321289, "global_step": 491957, "epoch": 2928} {"train_loss": -12.817371368408203, "global_step": 491958, "epoch": 2928} {"train_loss": -12.748444557189941, "global_step": 491959, "epoch": 2928} {"train_loss": -12.799495697021484, "global_step": 491960, "epoch": 2928} {"train_loss": -12.73214054107666, "global_step": 491961, "epoch": 2928} {"train_loss": -12.866189956665039, "global_step": 491962, "epoch": 2928} {"train_loss": -12.84678840637207, "global_step": 491963, "epoch": 2928} {"train_loss": -12.987832069396973, "global_step": 491964, "epoch": 2928} {"train_loss": -12.815263748168945, "global_step": 491965, "epoch": 2928} {"train_loss": -13.049970626831055, "global_step": 491966, "epoch": 2928} {"train_loss": -12.876346588134766, "global_step": 491967, "epoch": 2928} {"train_loss": -12.872111320495605, "global_step": 491968, "epoch": 2928} {"train_loss": -13.051643371582031, "global_step": 491969, "epoch": 2928} {"train_loss": -12.850473403930664, "global_step": 491970, "epoch": 2928} {"train_loss": -12.797394752502441, "global_step": 491971, "epoch": 2928} {"train_loss": -12.62102222442627, "global_step": 491972, "epoch": 2928} {"train_loss": -12.884129524230957, "global_step": 491973, "epoch": 2928} {"train_loss": -12.731316566467285, "global_step": 491974, "epoch": 2928} {"train_loss": -13.041202545166016, "global_step": 491975, "epoch": 2928} {"train_loss": -13.174805641174316, "global_step": 491976, "epoch": 2928} {"train_loss": -13.073548316955566, "global_step": 491977, "epoch": 2928} {"train_loss": -12.931400299072266, "global_step": 491978, "epoch": 2928} {"train_loss": -13.030505180358887, "global_step": 491979, "epoch": 2928} {"train_loss": -12.978015899658203, "global_step": 491980, "epoch": 2928} {"train_loss": -12.900049209594727, "global_step": 491981, "epoch": 2928} {"train_loss": -12.984646797180176, "global_step": 491982, "epoch": 2928} {"train_loss": -13.139082908630371, "global_step": 491983, "epoch": 2928} {"train_loss": -13.041200637817383, "global_step": 491984, "epoch": 2928} {"train_loss": -12.7988920211792, "global_step": 491985, "epoch": 2928} {"train_loss": -12.934056282043457, "global_step": 491986, "epoch": 2928} {"train_loss": -12.74515438079834, "global_step": 491987, "epoch": 2928} {"train_loss": -13.110902786254883, "global_step": 491988, "epoch": 2928} {"train_loss": -12.912996292114258, "global_step": 491989, "epoch": 2928} {"train_loss": -13.09929084777832, "global_step": 491990, "epoch": 2928} {"train_loss": -12.941261291503906, "global_step": 491991, "epoch": 2928} {"train_loss": -13.179712295532227, "global_step": 491992, "epoch": 2928} {"train_loss": -13.027730941772461, "global_step": 491993, "epoch": 2928} {"train_loss": -13.104700088500977, "global_step": 491994, "epoch": 2928} {"train_loss": -13.045108795166016, "global_step": 491995, "epoch": 2928} {"train_loss": -12.99455451965332, "global_step": 491996, "epoch": 2928} {"train_loss": -12.792819023132324, "global_step": 491997, "epoch": 2928} {"train_loss": -12.806869506835938, "global_step": 491998, "epoch": 2928} {"train_loss": -13.028995513916016, "global_step": 491999, "epoch": 2928} {"train_loss": -12.842937469482422, "global_step": 492000, "epoch": 2928} {"train_loss": -12.717071533203125, "global_step": 492001, "epoch": 2928} {"train_loss": -12.975915908813477, "global_step": 492002, "epoch": 2928} {"train_loss": -12.57620620727539, "global_step": 492003, "epoch": 2928} {"train_loss": -12.93614673614502, "global_step": 492004, "epoch": 2928} {"train_loss": -10.88882064819336, "global_step": 492005, "epoch": 2928} {"train_loss": -12.590185165405273, "global_step": 492006, "epoch": 2928} {"train_loss": -11.831892013549805, "global_step": 492007, "epoch": 2928} {"train_loss": -12.73457145690918, "global_step": 492008, "epoch": 2928} {"train_loss": -11.542905807495117, "global_step": 492009, "epoch": 2928} {"train_loss": -12.579404830932617, "global_step": 492010, "epoch": 2928} {"train_loss": -12.29102897644043, "global_step": 492011, "epoch": 2928} {"train_loss": -12.21145248413086, "global_step": 492012, "epoch": 2928} {"train_loss": -10.954134941101074, "global_step": 492013, "epoch": 2928} {"train_loss": -12.341165542602539, "global_step": 492014, "epoch": 2928} {"train_loss": -10.425775527954102, "global_step": 492015, "epoch": 2928} {"train_loss": -11.188440322875977, "global_step": 492016, "epoch": 2928} {"train_loss": -11.714921951293945, "global_step": 492017, "epoch": 2928} {"train_loss": -11.139341354370117, "global_step": 492018, "epoch": 2928} {"train_loss": -11.673849105834961, "global_step": 492019, "epoch": 2928} {"train_loss": -11.966656684875488, "global_step": 492020, "epoch": 2928} {"train_loss": -12.034194946289062, "global_step": 492021, "epoch": 2928} {"train_loss": -11.729530334472656, "global_step": 492022, "epoch": 2928} {"train_loss": -10.85221004486084, "global_step": 492023, "epoch": 2928} {"train_loss": -11.584019660949707, "global_step": 492024, "epoch": 2928} {"train_loss": -11.53625774383545, "global_step": 492025, "epoch": 2928} {"train_loss": -12.183534622192383, "global_step": 492026, "epoch": 2928} {"train_loss": -11.631072998046875, "global_step": 492027, "epoch": 2928} {"train_loss": -10.574798583984375, "global_step": 492028, "epoch": 2928} {"train_loss": -10.333351135253906, "global_step": 492029, "epoch": 2928} {"train_loss": -10.469221115112305, "global_step": 492030, "epoch": 2928} {"train_loss": -11.396998405456543, "global_step": 492031, "epoch": 2928} {"train_loss": -10.38264274597168, "global_step": 492032, "epoch": 2928} {"train_loss": -10.218717575073242, "global_step": 492033, "epoch": 2928} {"train_loss": -10.677929878234863, "global_step": 492034, "epoch": 2928} {"train_loss": -10.314828872680664, "global_step": 492035, "epoch": 2928} {"train_loss": -10.207304000854492, "global_step": 492036, "epoch": 2928} {"train_loss": -10.843579292297363, "global_step": 492037, "epoch": 2928} {"train_loss": -10.810263633728027, "global_step": 492038, "epoch": 2928} {"train_loss": -7.853965759277344, "global_step": 492039, "epoch": 2928} {"train_loss": -9.328274726867676, "global_step": 492040, "epoch": 2928} {"train_loss": -9.371522903442383, "global_step": 492041, "epoch": 2928} {"train_loss": -8.933065414428711, "global_step": 492042, "epoch": 2928} {"train_loss": -9.134603500366211, "global_step": 492043, "epoch": 2928} {"train_loss": -10.2906494140625, "global_step": 492044, "epoch": 2928} {"train_loss": -10.12228012084961, "global_step": 492045, "epoch": 2928} {"train_loss": -10.704010009765625, "global_step": 492046, "epoch": 2928} {"train_loss": -10.689353942871094, "global_step": 492047, "epoch": 2928} {"train_loss": -11.28111457824707, "global_step": 492048, "epoch": 2928} {"train_loss": -10.398181915283203, "global_step": 492049, "epoch": 2928} {"train_loss": -10.704072952270508, "global_step": 492050, "epoch": 2928} {"train_loss": -11.17636775970459, "global_step": 492051, "epoch": 2928} {"train_loss": -10.589569091796875, "global_step": 492052, "epoch": 2928} {"train_loss": -11.195440292358398, "global_step": 492053, "epoch": 2928} {"train_loss": -11.082161903381348, "global_step": 492054, "epoch": 2928} {"train_loss": -10.832208633422852, "global_step": 492055, "epoch": 2928} {"train_loss": -11.333536148071289, "global_step": 492056, "epoch": 2928} {"train_loss": -11.078057289123535, "global_step": 492057, "epoch": 2928} {"train_loss": -10.369491577148438, "global_step": 492058, "epoch": 2928} {"train_loss": -10.8726806640625, "global_step": 492059, "epoch": 2928} {"train_loss": -11.425275802612305, "global_step": 492060, "epoch": 2928} {"train_loss": -11.635872840881348, "global_step": 492061, "epoch": 2928} {"train_loss": -11.181293487548828, "global_step": 492062, "epoch": 2928} {"train_loss": -12.056476593017578, "global_step": 492063, "epoch": 2928} {"train_loss": -11.417349815368652, "global_step": 492064, "epoch": 2928} {"train_loss": -12.076804161071777, "global_step": 492065, "epoch": 2928} {"train_loss": -11.379436492919922, "global_step": 492066, "epoch": 2928} {"train_loss": -11.659656524658203, "global_step": 492067, "epoch": 2928} {"train_loss": -12.195141792297363, "global_step": 492068, "epoch": 2928} {"train_loss": -11.157384872436523, "global_step": 492069, "epoch": 2928} {"train_loss": -12.468476295471191, "global_step": 492070, "epoch": 2928} {"train_loss": -11.990388296899342, "global_step": 492071, "epoch": 2928, "val_loss": 319101.1875} {"train_loss": -12.520750999450684, "global_step": 492072, "epoch": 2929} {"train_loss": -11.551275253295898, "global_step": 492073, "epoch": 2929} {"train_loss": -12.2108154296875, "global_step": 492074, "epoch": 2929} {"train_loss": -11.721031188964844, "global_step": 492075, "epoch": 2929} {"train_loss": -12.048728942871094, "global_step": 492076, "epoch": 2929} {"train_loss": -11.885567665100098, "global_step": 492077, "epoch": 2929} {"train_loss": -12.079656600952148, "global_step": 492078, "epoch": 2929} {"train_loss": -11.95244026184082, "global_step": 492079, "epoch": 2929} {"train_loss": -12.61087417602539, "global_step": 492080, "epoch": 2929} {"train_loss": -12.286857604980469, "global_step": 492081, "epoch": 2929} {"train_loss": -12.269529342651367, "global_step": 492082, "epoch": 2929} {"train_loss": -12.125726699829102, "global_step": 492083, "epoch": 2929} {"train_loss": -12.277603149414062, "global_step": 492084, "epoch": 2929} {"train_loss": -12.384886741638184, "global_step": 492085, "epoch": 2929} {"train_loss": -12.067996978759766, "global_step": 492086, "epoch": 2929} {"train_loss": -12.482730865478516, "global_step": 492087, "epoch": 2929} {"train_loss": -12.140273094177246, "global_step": 492088, "epoch": 2929} {"train_loss": -12.592682838439941, "global_step": 492089, "epoch": 2929} {"train_loss": -11.842381477355957, "global_step": 492090, "epoch": 2929} {"train_loss": -12.793073654174805, "global_step": 492091, "epoch": 2929} {"train_loss": -12.153144836425781, "global_step": 492092, "epoch": 2929} {"train_loss": -12.782005310058594, "global_step": 492093, "epoch": 2929} {"train_loss": -12.071094512939453, "global_step": 492094, "epoch": 2929} {"train_loss": -12.437386512756348, "global_step": 492095, "epoch": 2929} {"train_loss": -12.17175006866455, "global_step": 492096, "epoch": 2929} {"train_loss": -12.629171371459961, "global_step": 492097, "epoch": 2929} {"train_loss": -12.204751968383789, "global_step": 492098, "epoch": 2929} {"train_loss": -12.290879249572754, "global_step": 492099, "epoch": 2929} {"train_loss": -12.494348526000977, "global_step": 492100, "epoch": 2929} {"train_loss": -12.424362182617188, "global_step": 492101, "epoch": 2929} {"train_loss": -12.393861770629883, "global_step": 492102, "epoch": 2929} {"train_loss": -12.488719940185547, "global_step": 492103, "epoch": 2929} {"train_loss": -12.494218826293945, "global_step": 492104, "epoch": 2929} {"train_loss": -12.572641372680664, "global_step": 492105, "epoch": 2929} {"train_loss": -12.201753616333008, "global_step": 492106, "epoch": 2929} {"train_loss": -12.467483520507812, "global_step": 492107, "epoch": 2929} {"train_loss": -12.182065963745117, "global_step": 492108, "epoch": 2929} {"train_loss": -12.244734764099121, "global_step": 492109, "epoch": 2929} {"train_loss": -12.302263259887695, "global_step": 492110, "epoch": 2929} {"train_loss": -12.157855987548828, "global_step": 492111, "epoch": 2929} {"train_loss": -12.311205863952637, "global_step": 492112, "epoch": 2929} {"train_loss": -12.273958206176758, "global_step": 492113, "epoch": 2929} {"train_loss": -12.36867904663086, "global_step": 492114, "epoch": 2929} {"train_loss": -12.526605606079102, "global_step": 492115, "epoch": 2929} {"train_loss": -12.137563705444336, "global_step": 492116, "epoch": 2929} {"train_loss": -12.636445999145508, "global_step": 492117, "epoch": 2929} {"train_loss": -12.410876274108887, "global_step": 492118, "epoch": 2929} {"train_loss": -12.70306396484375, "global_step": 492119, "epoch": 2929} {"train_loss": -12.4371976852417, "global_step": 492120, "epoch": 2929} {"train_loss": -12.397829055786133, "global_step": 492121, "epoch": 2929} {"train_loss": -12.437812805175781, "global_step": 492122, "epoch": 2929} {"train_loss": -12.108302116394043, "global_step": 492123, "epoch": 2929} {"train_loss": -12.649763107299805, "global_step": 492124, "epoch": 2929} {"train_loss": -12.363627433776855, "global_step": 492125, "epoch": 2929} {"train_loss": -12.429191589355469, "global_step": 492126, "epoch": 2929} {"train_loss": -12.80327033996582, "global_step": 492127, "epoch": 2929} {"train_loss": -12.67242431640625, "global_step": 492128, "epoch": 2929} {"train_loss": -12.902885437011719, "global_step": 492129, "epoch": 2929} {"train_loss": -12.613446235656738, "global_step": 492130, "epoch": 2929} {"train_loss": -12.739011764526367, "global_step": 492131, "epoch": 2929} {"train_loss": -12.480443954467773, "global_step": 492132, "epoch": 2929} {"train_loss": -12.859491348266602, "global_step": 492133, "epoch": 2929} {"train_loss": -12.652667045593262, "global_step": 492134, "epoch": 2929} {"train_loss": -12.775575637817383, "global_step": 492135, "epoch": 2929} {"train_loss": -12.665680885314941, "global_step": 492136, "epoch": 2929} {"train_loss": -12.65989875793457, "global_step": 492137, "epoch": 2929} {"train_loss": -12.835373878479004, "global_step": 492138, "epoch": 2929} {"train_loss": -12.555562019348145, "global_step": 492139, "epoch": 2929} {"train_loss": -12.726338386535645, "global_step": 492140, "epoch": 2929} {"train_loss": -12.580989837646484, "global_step": 492141, "epoch": 2929} {"train_loss": -12.623970985412598, "global_step": 492142, "epoch": 2929} {"train_loss": -12.640083312988281, "global_step": 492143, "epoch": 2929} {"train_loss": -12.542360305786133, "global_step": 492144, "epoch": 2929} {"train_loss": -11.80506706237793, "global_step": 492145, "epoch": 2929} {"train_loss": -12.304229736328125, "global_step": 492146, "epoch": 2929} {"train_loss": -12.350059509277344, "global_step": 492147, "epoch": 2929} {"train_loss": -11.492992401123047, "global_step": 492148, "epoch": 2929} {"train_loss": -12.805001258850098, "global_step": 492149, "epoch": 2929} {"train_loss": -11.707035064697266, "global_step": 492150, "epoch": 2929} {"train_loss": -11.793208122253418, "global_step": 492151, "epoch": 2929} {"train_loss": -12.667905807495117, "global_step": 492152, "epoch": 2929} {"train_loss": -11.977945327758789, "global_step": 492153, "epoch": 2929} {"train_loss": -12.381977081298828, "global_step": 492154, "epoch": 2929} {"train_loss": -12.639991760253906, "global_step": 492155, "epoch": 2929} {"train_loss": -12.623380661010742, "global_step": 492156, "epoch": 2929} {"train_loss": -12.431608200073242, "global_step": 492157, "epoch": 2929} {"train_loss": -12.903751373291016, "global_step": 492158, "epoch": 2929} {"train_loss": -12.689401626586914, "global_step": 492159, "epoch": 2929} {"train_loss": -12.749226570129395, "global_step": 492160, "epoch": 2929} {"train_loss": -12.680087089538574, "global_step": 492161, "epoch": 2929} {"train_loss": -12.547718048095703, "global_step": 492162, "epoch": 2929} {"train_loss": -12.60464096069336, "global_step": 492163, "epoch": 2929} {"train_loss": -12.936182022094727, "global_step": 492164, "epoch": 2929} {"train_loss": -12.698755264282227, "global_step": 492165, "epoch": 2929} {"train_loss": -12.886789321899414, "global_step": 492166, "epoch": 2929} {"train_loss": -12.637727737426758, "global_step": 492167, "epoch": 2929} {"train_loss": -12.632869720458984, "global_step": 492168, "epoch": 2929} {"train_loss": -13.009963989257812, "global_step": 492169, "epoch": 2929} {"train_loss": -12.790557861328125, "global_step": 492170, "epoch": 2929} {"train_loss": -12.896539688110352, "global_step": 492171, "epoch": 2929} {"train_loss": -13.062019348144531, "global_step": 492172, "epoch": 2929} {"train_loss": -13.01335620880127, "global_step": 492173, "epoch": 2929} {"train_loss": -12.703960418701172, "global_step": 492174, "epoch": 2929} {"train_loss": -12.669364929199219, "global_step": 492175, "epoch": 2929} {"train_loss": -12.332138061523438, "global_step": 492176, "epoch": 2929} {"train_loss": -13.03921890258789, "global_step": 492177, "epoch": 2929} {"train_loss": -12.545697212219238, "global_step": 492178, "epoch": 2929} {"train_loss": -12.895729064941406, "global_step": 492179, "epoch": 2929} {"train_loss": -12.729215621948242, "global_step": 492180, "epoch": 2929} {"train_loss": -12.593461036682129, "global_step": 492181, "epoch": 2929} {"train_loss": -12.28976821899414, "global_step": 492182, "epoch": 2929} {"train_loss": -12.84190559387207, "global_step": 492183, "epoch": 2929} {"train_loss": -12.645891189575195, "global_step": 492184, "epoch": 2929} {"train_loss": -12.631867408752441, "global_step": 492185, "epoch": 2929} {"train_loss": -12.372363090515137, "global_step": 492186, "epoch": 2929} {"train_loss": -12.990461349487305, "global_step": 492187, "epoch": 2929} {"train_loss": -12.350273132324219, "global_step": 492188, "epoch": 2929} {"train_loss": -11.913922309875488, "global_step": 492189, "epoch": 2929} {"train_loss": -11.76639175415039, "global_step": 492190, "epoch": 2929} {"train_loss": -12.647406578063965, "global_step": 492191, "epoch": 2929} {"train_loss": -11.655607223510742, "global_step": 492192, "epoch": 2929} {"train_loss": -11.306255340576172, "global_step": 492193, "epoch": 2929} {"train_loss": -12.298540115356445, "global_step": 492194, "epoch": 2929} {"train_loss": -10.23010540008545, "global_step": 492195, "epoch": 2929} {"train_loss": -10.801582336425781, "global_step": 492196, "epoch": 2929} {"train_loss": -11.720480918884277, "global_step": 492197, "epoch": 2929} {"train_loss": -9.595497131347656, "global_step": 492198, "epoch": 2929} {"train_loss": -10.033729553222656, "global_step": 492199, "epoch": 2929} {"train_loss": -11.171466827392578, "global_step": 492200, "epoch": 2929} {"train_loss": -8.27271842956543, "global_step": 492201, "epoch": 2929} {"train_loss": -8.358758926391602, "global_step": 492202, "epoch": 2929} {"train_loss": -8.333528518676758, "global_step": 492203, "epoch": 2929} {"train_loss": -7.695913314819336, "global_step": 492204, "epoch": 2929} {"train_loss": -9.800446510314941, "global_step": 492205, "epoch": 2929} {"train_loss": -9.475198745727539, "global_step": 492206, "epoch": 2929} {"train_loss": -8.6776762008667, "global_step": 492207, "epoch": 2929} {"train_loss": -9.442798614501953, "global_step": 492208, "epoch": 2929} {"train_loss": -10.466036796569824, "global_step": 492209, "epoch": 2929} {"train_loss": -10.316900253295898, "global_step": 492210, "epoch": 2929} {"train_loss": -11.953571319580078, "global_step": 492211, "epoch": 2929} {"train_loss": -10.325185775756836, "global_step": 492212, "epoch": 2929} {"train_loss": -11.574569702148438, "global_step": 492213, "epoch": 2929} {"train_loss": -10.558525085449219, "global_step": 492214, "epoch": 2929} {"train_loss": -11.574013710021973, "global_step": 492215, "epoch": 2929} {"train_loss": -11.717552185058594, "global_step": 492216, "epoch": 2929} {"train_loss": -11.859288215637207, "global_step": 492217, "epoch": 2929} {"train_loss": -12.300820350646973, "global_step": 492218, "epoch": 2929} {"train_loss": -11.022784233093262, "global_step": 492219, "epoch": 2929} {"train_loss": -11.77055549621582, "global_step": 492220, "epoch": 2929} {"train_loss": -11.228857040405273, "global_step": 492221, "epoch": 2929} {"train_loss": -10.362077713012695, "global_step": 492222, "epoch": 2929} {"train_loss": -11.897749900817871, "global_step": 492223, "epoch": 2929} {"train_loss": -10.681939125061035, "global_step": 492224, "epoch": 2929} {"train_loss": -11.711153984069824, "global_step": 492225, "epoch": 2929} {"train_loss": -11.589037895202637, "global_step": 492226, "epoch": 2929} {"train_loss": -11.693910598754883, "global_step": 492227, "epoch": 2929} {"train_loss": -12.171635627746582, "global_step": 492228, "epoch": 2929} {"train_loss": -11.520383834838867, "global_step": 492229, "epoch": 2929} {"train_loss": -12.179160118103027, "global_step": 492230, "epoch": 2929} {"train_loss": -11.717151641845703, "global_step": 492231, "epoch": 2929} {"train_loss": -12.069808006286621, "global_step": 492232, "epoch": 2929} {"train_loss": -11.256699562072754, "global_step": 492233, "epoch": 2929} {"train_loss": -11.748461723327637, "global_step": 492234, "epoch": 2929} {"train_loss": -11.636749267578125, "global_step": 492235, "epoch": 2929} {"train_loss": -11.45884895324707, "global_step": 492236, "epoch": 2929} {"train_loss": -12.00885009765625, "global_step": 492237, "epoch": 2929} {"train_loss": -11.405488014221191, "global_step": 492238, "epoch": 2929} {"train_loss": -12.023648551532201, "global_step": 492239, "epoch": 2929, "val_loss": 316301.5625} {"train_loss": -11.866153717041016, "global_step": 492240, "epoch": 2930} {"train_loss": -11.990922927856445, "global_step": 492241, "epoch": 2930} {"train_loss": -12.086088180541992, "global_step": 492242, "epoch": 2930} {"train_loss": -11.719578742980957, "global_step": 492243, "epoch": 2930} {"train_loss": -12.430258750915527, "global_step": 492244, "epoch": 2930} {"train_loss": -11.674997329711914, "global_step": 492245, "epoch": 2930} {"train_loss": -12.50216293334961, "global_step": 492246, "epoch": 2930} {"train_loss": -11.916024208068848, "global_step": 492247, "epoch": 2930} {"train_loss": -12.181297302246094, "global_step": 492248, "epoch": 2930} {"train_loss": -12.253320693969727, "global_step": 492249, "epoch": 2930} {"train_loss": -12.070119857788086, "global_step": 492250, "epoch": 2930} {"train_loss": -12.335641860961914, "global_step": 492251, "epoch": 2930} {"train_loss": -12.239583969116211, "global_step": 492252, "epoch": 2930} {"train_loss": -12.350343704223633, "global_step": 492253, "epoch": 2930} {"train_loss": -12.207895278930664, "global_step": 492254, "epoch": 2930} {"train_loss": -12.282926559448242, "global_step": 492255, "epoch": 2930} {"train_loss": -12.191644668579102, "global_step": 492256, "epoch": 2930} {"train_loss": -11.88281536102295, "global_step": 492257, "epoch": 2930} {"train_loss": -12.338207244873047, "global_step": 492258, "epoch": 2930} {"train_loss": -11.987119674682617, "global_step": 492259, "epoch": 2930} {"train_loss": -12.50345230102539, "global_step": 492260, "epoch": 2930} {"train_loss": -12.198257446289062, "global_step": 492261, "epoch": 2930} {"train_loss": -12.385242462158203, "global_step": 492262, "epoch": 2930} {"train_loss": -12.315990447998047, "global_step": 492263, "epoch": 2930} {"train_loss": -12.448143005371094, "global_step": 492264, "epoch": 2930} {"train_loss": -12.181831359863281, "global_step": 492265, "epoch": 2930} {"train_loss": -12.099135398864746, "global_step": 492266, "epoch": 2930} {"train_loss": -12.295747756958008, "global_step": 492267, "epoch": 2930} {"train_loss": -12.373285293579102, "global_step": 492268, "epoch": 2930} {"train_loss": -12.079412460327148, "global_step": 492269, "epoch": 2930} {"train_loss": -12.267511367797852, "global_step": 492270, "epoch": 2930} {"train_loss": -12.570379257202148, "global_step": 492271, "epoch": 2930} {"train_loss": -12.096307754516602, "global_step": 492272, "epoch": 2930} {"train_loss": -12.658018112182617, "global_step": 492273, "epoch": 2930} {"train_loss": -12.102367401123047, "global_step": 492274, "epoch": 2930} {"train_loss": -12.652606964111328, "global_step": 492275, "epoch": 2930} {"train_loss": -12.529975891113281, "global_step": 492276, "epoch": 2930} {"train_loss": -12.546825408935547, "global_step": 492277, "epoch": 2930} {"train_loss": -12.515815734863281, "global_step": 492278, "epoch": 2930} {"train_loss": -12.298796653747559, "global_step": 492279, "epoch": 2930} {"train_loss": -12.670578002929688, "global_step": 492280, "epoch": 2930} {"train_loss": -12.66693115234375, "global_step": 492281, "epoch": 2930} {"train_loss": -12.710949897766113, "global_step": 492282, "epoch": 2930} {"train_loss": -12.755454063415527, "global_step": 492283, "epoch": 2930} {"train_loss": -12.588427543640137, "global_step": 492284, "epoch": 2930} {"train_loss": -12.806379318237305, "global_step": 492285, "epoch": 2930} {"train_loss": -12.606483459472656, "global_step": 492286, "epoch": 2930} {"train_loss": -12.63812255859375, "global_step": 492287, "epoch": 2930} {"train_loss": -12.58355712890625, "global_step": 492288, "epoch": 2930} {"train_loss": -12.840498924255371, "global_step": 492289, "epoch": 2930} {"train_loss": -12.761159896850586, "global_step": 492290, "epoch": 2930} {"train_loss": -12.77107048034668, "global_step": 492291, "epoch": 2930} {"train_loss": -12.883644104003906, "global_step": 492292, "epoch": 2930} {"train_loss": -12.480525970458984, "global_step": 492293, "epoch": 2930} {"train_loss": -12.88935375213623, "global_step": 492294, "epoch": 2930} {"train_loss": -12.613807678222656, "global_step": 492295, "epoch": 2930} {"train_loss": -12.771639823913574, "global_step": 492296, "epoch": 2930} {"train_loss": -12.665115356445312, "global_step": 492297, "epoch": 2930} {"train_loss": -12.860520362854004, "global_step": 492298, "epoch": 2930} {"train_loss": -12.909807205200195, "global_step": 492299, "epoch": 2930} {"train_loss": -12.867988586425781, "global_step": 492300, "epoch": 2930} {"train_loss": -13.062214851379395, "global_step": 492301, "epoch": 2930} {"train_loss": -12.792547225952148, "global_step": 492302, "epoch": 2930} {"train_loss": -12.782316207885742, "global_step": 492303, "epoch": 2930} {"train_loss": -12.774070739746094, "global_step": 492304, "epoch": 2930} {"train_loss": -12.818941116333008, "global_step": 492305, "epoch": 2930} {"train_loss": -12.510477066040039, "global_step": 492306, "epoch": 2930} {"train_loss": -12.705717086791992, "global_step": 492307, "epoch": 2930} {"train_loss": -12.903974533081055, "global_step": 492308, "epoch": 2930} {"train_loss": -12.692331314086914, "global_step": 492309, "epoch": 2930} {"train_loss": -12.763120651245117, "global_step": 492310, "epoch": 2930} {"train_loss": -12.688383102416992, "global_step": 492311, "epoch": 2930} {"train_loss": -12.886554718017578, "global_step": 492312, "epoch": 2930} {"train_loss": -12.852928161621094, "global_step": 492313, "epoch": 2930} {"train_loss": -12.779685020446777, "global_step": 492314, "epoch": 2930} {"train_loss": -12.86865234375, "global_step": 492315, "epoch": 2930} {"train_loss": -12.70863151550293, "global_step": 492316, "epoch": 2930} {"train_loss": -12.9507474899292, "global_step": 492317, "epoch": 2930} {"train_loss": -12.752283096313477, "global_step": 492318, "epoch": 2930} {"train_loss": -12.723941802978516, "global_step": 492319, "epoch": 2930} {"train_loss": -12.82351303100586, "global_step": 492320, "epoch": 2930} {"train_loss": -12.96029281616211, "global_step": 492321, "epoch": 2930} {"train_loss": -12.990063667297363, "global_step": 492322, "epoch": 2930} {"train_loss": -12.83303165435791, "global_step": 492323, "epoch": 2930} {"train_loss": -13.092370986938477, "global_step": 492324, "epoch": 2930} {"train_loss": -13.01962661743164, "global_step": 492325, "epoch": 2930} {"train_loss": -12.817947387695312, "global_step": 492326, "epoch": 2930} {"train_loss": -12.713495254516602, "global_step": 492327, "epoch": 2930} {"train_loss": -12.895910263061523, "global_step": 492328, "epoch": 2930} {"train_loss": -12.805755615234375, "global_step": 492329, "epoch": 2930} {"train_loss": -12.992316246032715, "global_step": 492330, "epoch": 2930} {"train_loss": -12.931446075439453, "global_step": 492331, "epoch": 2930} {"train_loss": -12.930449485778809, "global_step": 492332, "epoch": 2930} {"train_loss": -12.460003852844238, "global_step": 492333, "epoch": 2930} {"train_loss": -13.185680389404297, "global_step": 492334, "epoch": 2930} {"train_loss": -12.761594772338867, "global_step": 492335, "epoch": 2930} {"train_loss": -12.038379669189453, "global_step": 492336, "epoch": 2930} {"train_loss": -12.422025680541992, "global_step": 492337, "epoch": 2930} {"train_loss": -12.809306144714355, "global_step": 492338, "epoch": 2930} {"train_loss": -12.266999244689941, "global_step": 492339, "epoch": 2930} {"train_loss": -12.474597930908203, "global_step": 492340, "epoch": 2930} {"train_loss": -12.583612442016602, "global_step": 492341, "epoch": 2930} {"train_loss": -11.89348316192627, "global_step": 492342, "epoch": 2930} {"train_loss": -11.800070762634277, "global_step": 492343, "epoch": 2930} {"train_loss": -12.782747268676758, "global_step": 492344, "epoch": 2930} {"train_loss": -11.531991958618164, "global_step": 492345, "epoch": 2930} {"train_loss": -12.554494857788086, "global_step": 492346, "epoch": 2930} {"train_loss": -12.45799446105957, "global_step": 492347, "epoch": 2930} {"train_loss": -11.697429656982422, "global_step": 492348, "epoch": 2930} {"train_loss": -12.433198928833008, "global_step": 492349, "epoch": 2930} {"train_loss": -12.331239700317383, "global_step": 492350, "epoch": 2930} {"train_loss": -11.671185493469238, "global_step": 492351, "epoch": 2930} {"train_loss": -12.046061515808105, "global_step": 492352, "epoch": 2930} {"train_loss": -9.863641738891602, "global_step": 492353, "epoch": 2930} {"train_loss": -10.53859806060791, "global_step": 492354, "epoch": 2930} {"train_loss": -11.234231948852539, "global_step": 492355, "epoch": 2930} {"train_loss": -11.276327133178711, "global_step": 492356, "epoch": 2930} {"train_loss": -10.349306106567383, "global_step": 492357, "epoch": 2930} {"train_loss": -10.692243576049805, "global_step": 492358, "epoch": 2930} {"train_loss": -10.423110008239746, "global_step": 492359, "epoch": 2930} {"train_loss": -11.7620849609375, "global_step": 492360, "epoch": 2930} {"train_loss": -10.234905242919922, "global_step": 492361, "epoch": 2930} {"train_loss": -10.432180404663086, "global_step": 492362, "epoch": 2930} {"train_loss": -11.009603500366211, "global_step": 492363, "epoch": 2930} {"train_loss": -11.22048568725586, "global_step": 492364, "epoch": 2930} {"train_loss": -11.706177711486816, "global_step": 492365, "epoch": 2930} {"train_loss": -11.404781341552734, "global_step": 492366, "epoch": 2930} {"train_loss": -10.767297744750977, "global_step": 492367, "epoch": 2930} {"train_loss": -11.411527633666992, "global_step": 492368, "epoch": 2930} {"train_loss": -10.973587989807129, "global_step": 492369, "epoch": 2930} {"train_loss": -11.342748641967773, "global_step": 492370, "epoch": 2930} {"train_loss": -11.119319915771484, "global_step": 492371, "epoch": 2930} {"train_loss": -11.333446502685547, "global_step": 492372, "epoch": 2930} {"train_loss": -10.987920761108398, "global_step": 492373, "epoch": 2930} {"train_loss": -11.701593399047852, "global_step": 492374, "epoch": 2930} {"train_loss": -11.538872718811035, "global_step": 492375, "epoch": 2930} {"train_loss": -11.893074035644531, "global_step": 492376, "epoch": 2930} {"train_loss": -11.79865550994873, "global_step": 492377, "epoch": 2930} {"train_loss": -11.50469970703125, "global_step": 492378, "epoch": 2930} {"train_loss": -11.75309944152832, "global_step": 492379, "epoch": 2930} {"train_loss": -11.60564136505127, "global_step": 492380, "epoch": 2930} {"train_loss": -11.696359634399414, "global_step": 492381, "epoch": 2930} {"train_loss": -12.28770637512207, "global_step": 492382, "epoch": 2930} {"train_loss": -11.863441467285156, "global_step": 492383, "epoch": 2930} {"train_loss": -12.36660385131836, "global_step": 492384, "epoch": 2930} {"train_loss": -12.103635787963867, "global_step": 492385, "epoch": 2930} {"train_loss": -12.40103530883789, "global_step": 492386, "epoch": 2930} {"train_loss": -12.30557918548584, "global_step": 492387, "epoch": 2930} {"train_loss": -12.252097129821777, "global_step": 492388, "epoch": 2930} {"train_loss": -12.065884590148926, "global_step": 492389, "epoch": 2930} {"train_loss": -12.299175262451172, "global_step": 492390, "epoch": 2930} {"train_loss": -12.122364044189453, "global_step": 492391, "epoch": 2930} {"train_loss": -11.978497505187988, "global_step": 492392, "epoch": 2930} {"train_loss": -12.34394645690918, "global_step": 492393, "epoch": 2930} {"train_loss": -12.056224822998047, "global_step": 492394, "epoch": 2930} {"train_loss": -12.415996551513672, "global_step": 492395, "epoch": 2930} {"train_loss": -12.223395347595215, "global_step": 492396, "epoch": 2930} {"train_loss": -12.589445114135742, "global_step": 492397, "epoch": 2930} {"train_loss": -12.653202056884766, "global_step": 492398, "epoch": 2930} {"train_loss": -12.207366943359375, "global_step": 492399, "epoch": 2930} {"train_loss": -12.40937614440918, "global_step": 492400, "epoch": 2930} {"train_loss": -12.386432647705078, "global_step": 492401, "epoch": 2930} {"train_loss": -12.391014099121094, "global_step": 492402, "epoch": 2930} {"train_loss": -12.213374137878418, "global_step": 492403, "epoch": 2930} {"train_loss": -12.28156852722168, "global_step": 492404, "epoch": 2930} {"train_loss": -12.301996231079102, "global_step": 492405, "epoch": 2930} {"train_loss": -12.156972885131836, "global_step": 492406, "epoch": 2930} {"train_loss": -12.243702235675993, "global_step": 492407, "epoch": 2930, "val_loss": 322374.90625, "train_action_mse_error": 1.2979596853256226} {"train_loss": -12.291694641113281, "global_step": 492408, "epoch": 2931} {"train_loss": -12.77613353729248, "global_step": 492409, "epoch": 2931} {"train_loss": -12.476665496826172, "global_step": 492410, "epoch": 2931} {"train_loss": -12.231943130493164, "global_step": 492411, "epoch": 2931} {"train_loss": -12.607942581176758, "global_step": 492412, "epoch": 2931} {"train_loss": -12.538175582885742, "global_step": 492413, "epoch": 2931} {"train_loss": -12.63723087310791, "global_step": 492414, "epoch": 2931} {"train_loss": -12.736554145812988, "global_step": 492415, "epoch": 2931} {"train_loss": -12.719602584838867, "global_step": 492416, "epoch": 2931} {"train_loss": -12.805926322937012, "global_step": 492417, "epoch": 2931} {"train_loss": -12.546111106872559, "global_step": 492418, "epoch": 2931} {"train_loss": -12.79256820678711, "global_step": 492419, "epoch": 2931} {"train_loss": -12.852165222167969, "global_step": 492420, "epoch": 2931} {"train_loss": -12.52875804901123, "global_step": 492421, "epoch": 2931} {"train_loss": -12.74420166015625, "global_step": 492422, "epoch": 2931} {"train_loss": -12.747305870056152, "global_step": 492423, "epoch": 2931} {"train_loss": -12.329595565795898, "global_step": 492424, "epoch": 2931} {"train_loss": -12.326898574829102, "global_step": 492425, "epoch": 2931} {"train_loss": -12.79542064666748, "global_step": 492426, "epoch": 2931} {"train_loss": -11.884764671325684, "global_step": 492427, "epoch": 2931} {"train_loss": -12.826985359191895, "global_step": 492428, "epoch": 2931} {"train_loss": -12.367408752441406, "global_step": 492429, "epoch": 2931} {"train_loss": -12.221661567687988, "global_step": 492430, "epoch": 2931} {"train_loss": -12.768970489501953, "global_step": 492431, "epoch": 2931} {"train_loss": -12.698982238769531, "global_step": 492432, "epoch": 2931} {"train_loss": -12.568668365478516, "global_step": 492433, "epoch": 2931} {"train_loss": -12.333454132080078, "global_step": 492434, "epoch": 2931} {"train_loss": -12.139471054077148, "global_step": 492435, "epoch": 2931} {"train_loss": -12.808540344238281, "global_step": 492436, "epoch": 2931} {"train_loss": -12.665241241455078, "global_step": 492437, "epoch": 2931} {"train_loss": -12.444376945495605, "global_step": 492438, "epoch": 2931} {"train_loss": -12.805584907531738, "global_step": 492439, "epoch": 2931} {"train_loss": -12.641975402832031, "global_step": 492440, "epoch": 2931} {"train_loss": -12.532781600952148, "global_step": 492441, "epoch": 2931} {"train_loss": -12.759886741638184, "global_step": 492442, "epoch": 2931} {"train_loss": -12.710454940795898, "global_step": 492443, "epoch": 2931} {"train_loss": -12.524314880371094, "global_step": 492444, "epoch": 2931} {"train_loss": -12.61001205444336, "global_step": 492445, "epoch": 2931} {"train_loss": -12.92998218536377, "global_step": 492446, "epoch": 2931} {"train_loss": -12.932162284851074, "global_step": 492447, "epoch": 2931} {"train_loss": -12.527164459228516, "global_step": 492448, "epoch": 2931} {"train_loss": -12.74748420715332, "global_step": 492449, "epoch": 2931} {"train_loss": -12.910131454467773, "global_step": 492450, "epoch": 2931} {"train_loss": -12.718694686889648, "global_step": 492451, "epoch": 2931} {"train_loss": -12.75490951538086, "global_step": 492452, "epoch": 2931} {"train_loss": -12.801753044128418, "global_step": 492453, "epoch": 2931} {"train_loss": -12.837859153747559, "global_step": 492454, "epoch": 2931} {"train_loss": -12.774324417114258, "global_step": 492455, "epoch": 2931} {"train_loss": -13.146608352661133, "global_step": 492456, "epoch": 2931} {"train_loss": -12.859618186950684, "global_step": 492457, "epoch": 2931} {"train_loss": -12.899380683898926, "global_step": 492458, "epoch": 2931} {"train_loss": -12.924752235412598, "global_step": 492459, "epoch": 2931} {"train_loss": -12.999917030334473, "global_step": 492460, "epoch": 2931} {"train_loss": -13.051673889160156, "global_step": 492461, "epoch": 2931} {"train_loss": -12.950499534606934, "global_step": 492462, "epoch": 2931} {"train_loss": -12.777097702026367, "global_step": 492463, "epoch": 2931} {"train_loss": -13.024463653564453, "global_step": 492464, "epoch": 2931} {"train_loss": -12.893856048583984, "global_step": 492465, "epoch": 2931} {"train_loss": -12.90859603881836, "global_step": 492466, "epoch": 2931} {"train_loss": -12.706372261047363, "global_step": 492467, "epoch": 2931} {"train_loss": -12.909808158874512, "global_step": 492468, "epoch": 2931} {"train_loss": -12.905251502990723, "global_step": 492469, "epoch": 2931} {"train_loss": -12.927841186523438, "global_step": 492470, "epoch": 2931} {"train_loss": -12.803276062011719, "global_step": 492471, "epoch": 2931} {"train_loss": -12.892929077148438, "global_step": 492472, "epoch": 2931} {"train_loss": -12.912260055541992, "global_step": 492473, "epoch": 2931} {"train_loss": -12.994632720947266, "global_step": 492474, "epoch": 2931} {"train_loss": -12.262396812438965, "global_step": 492475, "epoch": 2931} {"train_loss": -12.432754516601562, "global_step": 492476, "epoch": 2931} {"train_loss": -12.625773429870605, "global_step": 492477, "epoch": 2931} {"train_loss": -12.694718360900879, "global_step": 492478, "epoch": 2931} {"train_loss": -12.759531021118164, "global_step": 492479, "epoch": 2931} {"train_loss": -12.059353828430176, "global_step": 492480, "epoch": 2931} {"train_loss": -11.698305130004883, "global_step": 492481, "epoch": 2931} {"train_loss": -11.652140617370605, "global_step": 492482, "epoch": 2931} {"train_loss": -12.590835571289062, "global_step": 492483, "epoch": 2931} {"train_loss": -11.035148620605469, "global_step": 492484, "epoch": 2931} {"train_loss": -11.32291030883789, "global_step": 492485, "epoch": 2931} {"train_loss": -12.331321716308594, "global_step": 492486, "epoch": 2931} {"train_loss": -11.944002151489258, "global_step": 492487, "epoch": 2931} {"train_loss": -12.449999809265137, "global_step": 492488, "epoch": 2931} {"train_loss": -12.27502155303955, "global_step": 492489, "epoch": 2931} {"train_loss": -12.216215133666992, "global_step": 492490, "epoch": 2931} {"train_loss": -12.241355895996094, "global_step": 492491, "epoch": 2931} {"train_loss": -12.567885398864746, "global_step": 492492, "epoch": 2931} {"train_loss": -12.019588470458984, "global_step": 492493, "epoch": 2931} {"train_loss": -12.405660629272461, "global_step": 492494, "epoch": 2931} {"train_loss": -12.262645721435547, "global_step": 492495, "epoch": 2931} {"train_loss": -11.371973991394043, "global_step": 492496, "epoch": 2931} {"train_loss": -12.178009033203125, "global_step": 492497, "epoch": 2931} {"train_loss": -12.444448471069336, "global_step": 492498, "epoch": 2931} {"train_loss": -11.852350234985352, "global_step": 492499, "epoch": 2931} {"train_loss": -11.161943435668945, "global_step": 492500, "epoch": 2931} {"train_loss": -11.28510856628418, "global_step": 492501, "epoch": 2931} {"train_loss": -11.776899337768555, "global_step": 492502, "epoch": 2931} {"train_loss": -11.203336715698242, "global_step": 492503, "epoch": 2931} {"train_loss": -11.318029403686523, "global_step": 492504, "epoch": 2931} {"train_loss": -10.753901481628418, "global_step": 492505, "epoch": 2931} {"train_loss": -11.328794479370117, "global_step": 492506, "epoch": 2931} {"train_loss": -10.322684288024902, "global_step": 492507, "epoch": 2931} {"train_loss": -11.059866905212402, "global_step": 492508, "epoch": 2931} {"train_loss": -11.780701637268066, "global_step": 492509, "epoch": 2931} {"train_loss": -10.264277458190918, "global_step": 492510, "epoch": 2931} {"train_loss": -11.823782920837402, "global_step": 492511, "epoch": 2931} {"train_loss": -10.412317276000977, "global_step": 492512, "epoch": 2931} {"train_loss": -10.0989990234375, "global_step": 492513, "epoch": 2931} {"train_loss": -11.479059219360352, "global_step": 492514, "epoch": 2931} {"train_loss": -8.6876220703125, "global_step": 492515, "epoch": 2931} {"train_loss": -10.672403335571289, "global_step": 492516, "epoch": 2931} {"train_loss": -10.243112564086914, "global_step": 492517, "epoch": 2931} {"train_loss": -10.79173469543457, "global_step": 492518, "epoch": 2931} {"train_loss": -10.786314010620117, "global_step": 492519, "epoch": 2931} {"train_loss": -10.381203651428223, "global_step": 492520, "epoch": 2931} {"train_loss": -11.226624488830566, "global_step": 492521, "epoch": 2931} {"train_loss": -10.802630424499512, "global_step": 492522, "epoch": 2931} {"train_loss": -10.49173355102539, "global_step": 492523, "epoch": 2931} {"train_loss": -11.796001434326172, "global_step": 492524, "epoch": 2931} {"train_loss": -10.250667572021484, "global_step": 492525, "epoch": 2931} {"train_loss": -11.102142333984375, "global_step": 492526, "epoch": 2931} {"train_loss": -11.533551216125488, "global_step": 492527, "epoch": 2931} {"train_loss": -11.200267791748047, "global_step": 492528, "epoch": 2931} {"train_loss": -11.708778381347656, "global_step": 492529, "epoch": 2931} {"train_loss": -10.503667831420898, "global_step": 492530, "epoch": 2931} {"train_loss": -12.218049049377441, "global_step": 492531, "epoch": 2931} {"train_loss": -11.472465515136719, "global_step": 492532, "epoch": 2931} {"train_loss": -12.347139358520508, "global_step": 492533, "epoch": 2931} {"train_loss": -11.917764663696289, "global_step": 492534, "epoch": 2931} {"train_loss": -12.279626846313477, "global_step": 492535, "epoch": 2931} {"train_loss": -11.796801567077637, "global_step": 492536, "epoch": 2931} {"train_loss": -12.185275077819824, "global_step": 492537, "epoch": 2931} {"train_loss": -12.248525619506836, "global_step": 492538, "epoch": 2931} {"train_loss": -11.992334365844727, "global_step": 492539, "epoch": 2931} {"train_loss": -12.338817596435547, "global_step": 492540, "epoch": 2931} {"train_loss": -11.792814254760742, "global_step": 492541, "epoch": 2931} {"train_loss": -12.244949340820312, "global_step": 492542, "epoch": 2931} {"train_loss": -12.208948135375977, "global_step": 492543, "epoch": 2931} {"train_loss": -12.278644561767578, "global_step": 492544, "epoch": 2931} {"train_loss": -11.993232727050781, "global_step": 492545, "epoch": 2931} {"train_loss": -11.975955963134766, "global_step": 492546, "epoch": 2931} {"train_loss": -12.603995323181152, "global_step": 492547, "epoch": 2931} {"train_loss": -12.118640899658203, "global_step": 492548, "epoch": 2931} {"train_loss": -12.31496810913086, "global_step": 492549, "epoch": 2931} {"train_loss": -11.97130298614502, "global_step": 492550, "epoch": 2931} {"train_loss": -12.52728271484375, "global_step": 492551, "epoch": 2931} {"train_loss": -12.324992179870605, "global_step": 492552, "epoch": 2931} {"train_loss": -12.153340339660645, "global_step": 492553, "epoch": 2931} {"train_loss": -12.140432357788086, "global_step": 492554, "epoch": 2931} {"train_loss": -12.29640007019043, "global_step": 492555, "epoch": 2931} {"train_loss": -12.016318321228027, "global_step": 492556, "epoch": 2931} {"train_loss": -12.4677152633667, "global_step": 492557, "epoch": 2931} {"train_loss": -11.524349212646484, "global_step": 492558, "epoch": 2931} {"train_loss": -12.10066032409668, "global_step": 492559, "epoch": 2931} {"train_loss": -12.02029800415039, "global_step": 492560, "epoch": 2931} {"train_loss": -11.955293655395508, "global_step": 492561, "epoch": 2931} {"train_loss": -12.414777755737305, "global_step": 492562, "epoch": 2931} {"train_loss": -11.83248519897461, "global_step": 492563, "epoch": 2931} {"train_loss": -12.301810264587402, "global_step": 492564, "epoch": 2931} {"train_loss": -11.676149368286133, "global_step": 492565, "epoch": 2931} {"train_loss": -11.908607482910156, "global_step": 492566, "epoch": 2931} {"train_loss": -12.110054016113281, "global_step": 492567, "epoch": 2931} {"train_loss": -11.979145050048828, "global_step": 492568, "epoch": 2931} {"train_loss": -12.2719087600708, "global_step": 492569, "epoch": 2931} {"train_loss": -11.998294830322266, "global_step": 492570, "epoch": 2931} {"train_loss": -12.164470672607422, "global_step": 492571, "epoch": 2931} {"train_loss": -12.324151992797852, "global_step": 492572, "epoch": 2931} {"train_loss": -11.992039680480957, "global_step": 492573, "epoch": 2931} {"train_loss": -12.515892028808594, "global_step": 492574, "epoch": 2931} {"train_loss": -12.135653745560418, "global_step": 492575, "epoch": 2931, "val_loss": 318978.875} {"train_loss": -12.440571784973145, "global_step": 492576, "epoch": 2932} {"train_loss": -12.137825965881348, "global_step": 492577, "epoch": 2932} {"train_loss": -12.39913558959961, "global_step": 492578, "epoch": 2932} {"train_loss": -11.9774169921875, "global_step": 492579, "epoch": 2932} {"train_loss": -12.20664119720459, "global_step": 492580, "epoch": 2932} {"train_loss": -12.122325897216797, "global_step": 492581, "epoch": 2932} {"train_loss": -11.747579574584961, "global_step": 492582, "epoch": 2932} {"train_loss": -12.317692756652832, "global_step": 492583, "epoch": 2932} {"train_loss": -11.858781814575195, "global_step": 492584, "epoch": 2932} {"train_loss": -11.720758438110352, "global_step": 492585, "epoch": 2932} {"train_loss": -11.758234024047852, "global_step": 492586, "epoch": 2932} {"train_loss": -12.18096923828125, "global_step": 492587, "epoch": 2932} {"train_loss": -11.830072402954102, "global_step": 492588, "epoch": 2932} {"train_loss": -12.610729217529297, "global_step": 492589, "epoch": 2932} {"train_loss": -11.998631477355957, "global_step": 492590, "epoch": 2932} {"train_loss": -12.406759262084961, "global_step": 492591, "epoch": 2932} {"train_loss": -12.406564712524414, "global_step": 492592, "epoch": 2932} {"train_loss": -12.789289474487305, "global_step": 492593, "epoch": 2932} {"train_loss": -12.605819702148438, "global_step": 492594, "epoch": 2932} {"train_loss": -12.524117469787598, "global_step": 492595, "epoch": 2932} {"train_loss": -12.710111618041992, "global_step": 492596, "epoch": 2932} {"train_loss": -12.392410278320312, "global_step": 492597, "epoch": 2932} {"train_loss": -12.723493576049805, "global_step": 492598, "epoch": 2932} {"train_loss": -12.588570594787598, "global_step": 492599, "epoch": 2932} {"train_loss": -12.691851615905762, "global_step": 492600, "epoch": 2932} {"train_loss": -12.441885948181152, "global_step": 492601, "epoch": 2932} {"train_loss": -12.400769233703613, "global_step": 492602, "epoch": 2932} {"train_loss": -12.637277603149414, "global_step": 492603, "epoch": 2932} {"train_loss": -12.707855224609375, "global_step": 492604, "epoch": 2932} {"train_loss": -12.489054679870605, "global_step": 492605, "epoch": 2932} {"train_loss": -12.605274200439453, "global_step": 492606, "epoch": 2932} {"train_loss": -12.590167045593262, "global_step": 492607, "epoch": 2932} {"train_loss": -12.547100067138672, "global_step": 492608, "epoch": 2932} {"train_loss": -12.732255935668945, "global_step": 492609, "epoch": 2932} {"train_loss": -12.864887237548828, "global_step": 492610, "epoch": 2932} {"train_loss": -12.617168426513672, "global_step": 492611, "epoch": 2932} {"train_loss": -12.733683586120605, "global_step": 492612, "epoch": 2932} {"train_loss": -12.94614028930664, "global_step": 492613, "epoch": 2932} {"train_loss": -12.805424690246582, "global_step": 492614, "epoch": 2932} {"train_loss": -12.636098861694336, "global_step": 492615, "epoch": 2932} {"train_loss": -12.708169937133789, "global_step": 492616, "epoch": 2932} {"train_loss": -12.621148109436035, "global_step": 492617, "epoch": 2932} {"train_loss": -12.771829605102539, "global_step": 492618, "epoch": 2932} {"train_loss": -12.740582466125488, "global_step": 492619, "epoch": 2932} {"train_loss": -12.631452560424805, "global_step": 492620, "epoch": 2932} {"train_loss": -12.729836463928223, "global_step": 492621, "epoch": 2932} {"train_loss": -12.588888168334961, "global_step": 492622, "epoch": 2932} {"train_loss": -12.744710922241211, "global_step": 492623, "epoch": 2932} {"train_loss": -12.858304977416992, "global_step": 492624, "epoch": 2932} {"train_loss": -12.775178909301758, "global_step": 492625, "epoch": 2932} {"train_loss": -12.721240043640137, "global_step": 492626, "epoch": 2932} {"train_loss": -13.024596214294434, "global_step": 492627, "epoch": 2932} {"train_loss": -12.66308307647705, "global_step": 492628, "epoch": 2932} {"train_loss": -12.46723747253418, "global_step": 492629, "epoch": 2932} {"train_loss": -12.936480522155762, "global_step": 492630, "epoch": 2932} {"train_loss": -12.445981979370117, "global_step": 492631, "epoch": 2932} {"train_loss": -12.334712982177734, "global_step": 492632, "epoch": 2932} {"train_loss": -13.129133224487305, "global_step": 492633, "epoch": 2932} {"train_loss": -12.350786209106445, "global_step": 492634, "epoch": 2932} {"train_loss": -12.728772163391113, "global_step": 492635, "epoch": 2932} {"train_loss": -12.774810791015625, "global_step": 492636, "epoch": 2932} {"train_loss": -12.50936508178711, "global_step": 492637, "epoch": 2932} {"train_loss": -12.482412338256836, "global_step": 492638, "epoch": 2932} {"train_loss": -12.753703117370605, "global_step": 492639, "epoch": 2932} {"train_loss": -12.299766540527344, "global_step": 492640, "epoch": 2932} {"train_loss": -11.992326736450195, "global_step": 492641, "epoch": 2932} {"train_loss": -12.359272003173828, "global_step": 492642, "epoch": 2932} {"train_loss": -12.263025283813477, "global_step": 492643, "epoch": 2932} {"train_loss": -11.907419204711914, "global_step": 492644, "epoch": 2932} {"train_loss": -13.051265716552734, "global_step": 492645, "epoch": 2932} {"train_loss": -11.944828033447266, "global_step": 492646, "epoch": 2932} {"train_loss": -12.307823181152344, "global_step": 492647, "epoch": 2932} {"train_loss": -12.637989044189453, "global_step": 492648, "epoch": 2932} {"train_loss": -12.60956859588623, "global_step": 492649, "epoch": 2932} {"train_loss": -12.29206371307373, "global_step": 492650, "epoch": 2932} {"train_loss": -12.695584297180176, "global_step": 492651, "epoch": 2932} {"train_loss": -12.732937812805176, "global_step": 492652, "epoch": 2932} {"train_loss": -12.633172988891602, "global_step": 492653, "epoch": 2932} {"train_loss": -12.740293502807617, "global_step": 492654, "epoch": 2932} {"train_loss": -12.699352264404297, "global_step": 492655, "epoch": 2932} {"train_loss": -12.816712379455566, "global_step": 492656, "epoch": 2932} {"train_loss": -12.929581642150879, "global_step": 492657, "epoch": 2932} {"train_loss": -12.911735534667969, "global_step": 492658, "epoch": 2932} {"train_loss": -12.63599681854248, "global_step": 492659, "epoch": 2932} {"train_loss": -12.915987014770508, "global_step": 492660, "epoch": 2932} {"train_loss": -12.911270141601562, "global_step": 492661, "epoch": 2932} {"train_loss": -12.849616050720215, "global_step": 492662, "epoch": 2932} {"train_loss": -12.924171447753906, "global_step": 492663, "epoch": 2932} {"train_loss": -12.864839553833008, "global_step": 492664, "epoch": 2932} {"train_loss": -13.005316734313965, "global_step": 492665, "epoch": 2932} {"train_loss": -12.889741897583008, "global_step": 492666, "epoch": 2932} {"train_loss": -12.881532669067383, "global_step": 492667, "epoch": 2932} {"train_loss": -13.040013313293457, "global_step": 492668, "epoch": 2932} {"train_loss": -12.757499694824219, "global_step": 492669, "epoch": 2932} {"train_loss": -13.06664752960205, "global_step": 492670, "epoch": 2932} {"train_loss": -12.771950721740723, "global_step": 492671, "epoch": 2932} {"train_loss": -12.984299659729004, "global_step": 492672, "epoch": 2932} {"train_loss": -12.626371383666992, "global_step": 492673, "epoch": 2932} {"train_loss": -12.33745002746582, "global_step": 492674, "epoch": 2932} {"train_loss": -12.867314338684082, "global_step": 492675, "epoch": 2932} {"train_loss": -12.764253616333008, "global_step": 492676, "epoch": 2932} {"train_loss": -12.839469909667969, "global_step": 492677, "epoch": 2932} {"train_loss": -12.882476806640625, "global_step": 492678, "epoch": 2932} {"train_loss": -12.793354988098145, "global_step": 492679, "epoch": 2932} {"train_loss": -12.729548454284668, "global_step": 492680, "epoch": 2932} {"train_loss": -12.467812538146973, "global_step": 492681, "epoch": 2932} {"train_loss": -12.739198684692383, "global_step": 492682, "epoch": 2932} {"train_loss": -13.041812896728516, "global_step": 492683, "epoch": 2932} {"train_loss": -12.70776653289795, "global_step": 492684, "epoch": 2932} {"train_loss": -12.995092391967773, "global_step": 492685, "epoch": 2932} {"train_loss": -12.765213012695312, "global_step": 492686, "epoch": 2932} {"train_loss": -12.74454116821289, "global_step": 492687, "epoch": 2932} {"train_loss": -12.762579917907715, "global_step": 492688, "epoch": 2932} {"train_loss": -12.824934005737305, "global_step": 492689, "epoch": 2932} {"train_loss": -12.343685150146484, "global_step": 492690, "epoch": 2932} {"train_loss": -12.197505950927734, "global_step": 492691, "epoch": 2932} {"train_loss": -12.52219009399414, "global_step": 492692, "epoch": 2932} {"train_loss": -12.731414794921875, "global_step": 492693, "epoch": 2932} {"train_loss": -12.715822219848633, "global_step": 492694, "epoch": 2932} {"train_loss": -12.233871459960938, "global_step": 492695, "epoch": 2932} {"train_loss": -13.135616302490234, "global_step": 492696, "epoch": 2932} {"train_loss": -12.4378080368042, "global_step": 492697, "epoch": 2932} {"train_loss": -12.747247695922852, "global_step": 492698, "epoch": 2932} {"train_loss": -12.784914016723633, "global_step": 492699, "epoch": 2932} {"train_loss": -12.930130004882812, "global_step": 492700, "epoch": 2932} {"train_loss": -12.890555381774902, "global_step": 492701, "epoch": 2932} {"train_loss": -12.436359405517578, "global_step": 492702, "epoch": 2932} {"train_loss": -12.839140892028809, "global_step": 492703, "epoch": 2932} {"train_loss": -12.867630004882812, "global_step": 492704, "epoch": 2932} {"train_loss": -12.516328811645508, "global_step": 492705, "epoch": 2932} {"train_loss": -12.065735816955566, "global_step": 492706, "epoch": 2932} {"train_loss": -11.896438598632812, "global_step": 492707, "epoch": 2932} {"train_loss": -12.43277359008789, "global_step": 492708, "epoch": 2932} {"train_loss": -12.734537124633789, "global_step": 492709, "epoch": 2932} {"train_loss": -12.570417404174805, "global_step": 492710, "epoch": 2932} {"train_loss": -12.09935474395752, "global_step": 492711, "epoch": 2932} {"train_loss": -11.453104019165039, "global_step": 492712, "epoch": 2932} {"train_loss": -12.257734298706055, "global_step": 492713, "epoch": 2932} {"train_loss": -12.500053405761719, "global_step": 492714, "epoch": 2932} {"train_loss": -12.898123741149902, "global_step": 492715, "epoch": 2932} {"train_loss": -12.234481811523438, "global_step": 492716, "epoch": 2932} {"train_loss": -12.50505256652832, "global_step": 492717, "epoch": 2932} {"train_loss": -12.436904907226562, "global_step": 492718, "epoch": 2932} {"train_loss": -12.634782791137695, "global_step": 492719, "epoch": 2932} {"train_loss": -11.502888679504395, "global_step": 492720, "epoch": 2932} {"train_loss": -9.821435928344727, "global_step": 492721, "epoch": 2932} {"train_loss": -10.329255104064941, "global_step": 492722, "epoch": 2932} {"train_loss": -10.364442825317383, "global_step": 492723, "epoch": 2932} {"train_loss": -10.743391036987305, "global_step": 492724, "epoch": 2932} {"train_loss": -10.92582893371582, "global_step": 492725, "epoch": 2932} {"train_loss": -10.48482894897461, "global_step": 492726, "epoch": 2932} {"train_loss": -10.912874221801758, "global_step": 492727, "epoch": 2932} {"train_loss": -11.78799819946289, "global_step": 492728, "epoch": 2932} {"train_loss": -11.334890365600586, "global_step": 492729, "epoch": 2932} {"train_loss": -11.74731159210205, "global_step": 492730, "epoch": 2932} {"train_loss": -11.452263832092285, "global_step": 492731, "epoch": 2932} {"train_loss": -11.673803329467773, "global_step": 492732, "epoch": 2932} {"train_loss": -11.845678329467773, "global_step": 492733, "epoch": 2932} {"train_loss": -11.166008949279785, "global_step": 492734, "epoch": 2932} {"train_loss": -11.327695846557617, "global_step": 492735, "epoch": 2932} {"train_loss": -12.192535400390625, "global_step": 492736, "epoch": 2932} {"train_loss": -12.178415298461914, "global_step": 492737, "epoch": 2932} {"train_loss": -11.42855453491211, "global_step": 492738, "epoch": 2932} {"train_loss": -11.767141342163086, "global_step": 492739, "epoch": 2932} {"train_loss": -11.831073760986328, "global_step": 492740, "epoch": 2932} {"train_loss": -10.859638214111328, "global_step": 492741, "epoch": 2932} {"train_loss": -10.064203262329102, "global_step": 492742, "epoch": 2932} {"train_loss": -12.385410218011765, "global_step": 492743, "epoch": 2932, "val_loss": 320189.0} {"train_loss": -9.223772048950195, "global_step": 492744, "epoch": 2933} {"train_loss": -9.677125930786133, "global_step": 492745, "epoch": 2933} {"train_loss": -9.5653076171875, "global_step": 492746, "epoch": 2933} {"train_loss": -11.300413131713867, "global_step": 492747, "epoch": 2933} {"train_loss": -10.08104419708252, "global_step": 492748, "epoch": 2933} {"train_loss": -10.208917617797852, "global_step": 492749, "epoch": 2933} {"train_loss": -9.991874694824219, "global_step": 492750, "epoch": 2933} {"train_loss": -11.698440551757812, "global_step": 492751, "epoch": 2933} {"train_loss": -9.976242065429688, "global_step": 492752, "epoch": 2933} {"train_loss": -11.700096130371094, "global_step": 492753, "epoch": 2933} {"train_loss": -11.39358139038086, "global_step": 492754, "epoch": 2933} {"train_loss": -11.523009300231934, "global_step": 492755, "epoch": 2933} {"train_loss": -11.59689998626709, "global_step": 492756, "epoch": 2933} {"train_loss": -11.401741981506348, "global_step": 492757, "epoch": 2933} {"train_loss": -11.994646072387695, "global_step": 492758, "epoch": 2933} {"train_loss": -11.589268684387207, "global_step": 492759, "epoch": 2933} {"train_loss": -11.93673324584961, "global_step": 492760, "epoch": 2933} {"train_loss": -11.296491622924805, "global_step": 492761, "epoch": 2933} {"train_loss": -12.165815353393555, "global_step": 492762, "epoch": 2933} {"train_loss": -11.48206901550293, "global_step": 492763, "epoch": 2933} {"train_loss": -11.873071670532227, "global_step": 492764, "epoch": 2933} {"train_loss": -11.834453582763672, "global_step": 492765, "epoch": 2933} {"train_loss": -11.884910583496094, "global_step": 492766, "epoch": 2933} {"train_loss": -12.16915512084961, "global_step": 492767, "epoch": 2933} {"train_loss": -12.180465698242188, "global_step": 492768, "epoch": 2933} {"train_loss": -12.109882354736328, "global_step": 492769, "epoch": 2933} {"train_loss": -12.411195755004883, "global_step": 492770, "epoch": 2933} {"train_loss": -12.550687789916992, "global_step": 492771, "epoch": 2933} {"train_loss": -12.31032943725586, "global_step": 492772, "epoch": 2933} {"train_loss": -12.537208557128906, "global_step": 492773, "epoch": 2933} {"train_loss": -12.282278060913086, "global_step": 492774, "epoch": 2933} {"train_loss": -12.476736068725586, "global_step": 492775, "epoch": 2933} {"train_loss": -12.30272102355957, "global_step": 492776, "epoch": 2933} {"train_loss": -12.626510620117188, "global_step": 492777, "epoch": 2933} {"train_loss": -12.447263717651367, "global_step": 492778, "epoch": 2933} {"train_loss": -12.562675476074219, "global_step": 492779, "epoch": 2933} {"train_loss": -12.44167423248291, "global_step": 492780, "epoch": 2933} {"train_loss": -12.523123741149902, "global_step": 492781, "epoch": 2933} {"train_loss": -12.627031326293945, "global_step": 492782, "epoch": 2933} {"train_loss": -12.641510009765625, "global_step": 492783, "epoch": 2933} {"train_loss": -12.775985717773438, "global_step": 492784, "epoch": 2933} {"train_loss": -12.557355880737305, "global_step": 492785, "epoch": 2933} {"train_loss": -12.653857231140137, "global_step": 492786, "epoch": 2933} {"train_loss": -12.795757293701172, "global_step": 492787, "epoch": 2933} {"train_loss": -12.497077941894531, "global_step": 492788, "epoch": 2933} {"train_loss": -12.585362434387207, "global_step": 492789, "epoch": 2933} {"train_loss": -12.815754890441895, "global_step": 492790, "epoch": 2933} {"train_loss": -12.805842399597168, "global_step": 492791, "epoch": 2933} {"train_loss": -12.807120323181152, "global_step": 492792, "epoch": 2933} {"train_loss": -12.953766822814941, "global_step": 492793, "epoch": 2933} {"train_loss": -12.740556716918945, "global_step": 492794, "epoch": 2933} {"train_loss": -12.70001220703125, "global_step": 492795, "epoch": 2933} {"train_loss": -12.752251625061035, "global_step": 492796, "epoch": 2933} {"train_loss": -12.638726234436035, "global_step": 492797, "epoch": 2933} {"train_loss": -12.982809066772461, "global_step": 492798, "epoch": 2933} {"train_loss": -12.546966552734375, "global_step": 492799, "epoch": 2933} {"train_loss": -12.873992919921875, "global_step": 492800, "epoch": 2933} {"train_loss": -12.9232816696167, "global_step": 492801, "epoch": 2933} {"train_loss": -12.420416831970215, "global_step": 492802, "epoch": 2933} {"train_loss": -12.891031265258789, "global_step": 492803, "epoch": 2933} {"train_loss": -12.754051208496094, "global_step": 492804, "epoch": 2933} {"train_loss": -12.865516662597656, "global_step": 492805, "epoch": 2933} {"train_loss": -12.896646499633789, "global_step": 492806, "epoch": 2933} {"train_loss": -13.038274765014648, "global_step": 492807, "epoch": 2933} {"train_loss": -12.740942001342773, "global_step": 492808, "epoch": 2933} {"train_loss": -12.733217239379883, "global_step": 492809, "epoch": 2933} {"train_loss": -12.77829647064209, "global_step": 492810, "epoch": 2933} {"train_loss": -12.387453079223633, "global_step": 492811, "epoch": 2933} {"train_loss": -12.84980297088623, "global_step": 492812, "epoch": 2933} {"train_loss": -12.846840858459473, "global_step": 492813, "epoch": 2933} {"train_loss": -12.744029998779297, "global_step": 492814, "epoch": 2933} {"train_loss": -12.821622848510742, "global_step": 492815, "epoch": 2933} {"train_loss": -12.927255630493164, "global_step": 492816, "epoch": 2933} {"train_loss": -12.928768157958984, "global_step": 492817, "epoch": 2933} {"train_loss": -12.800130844116211, "global_step": 492818, "epoch": 2933} {"train_loss": -12.928266525268555, "global_step": 492819, "epoch": 2933} {"train_loss": -12.714118957519531, "global_step": 492820, "epoch": 2933} {"train_loss": -13.077457427978516, "global_step": 492821, "epoch": 2933} {"train_loss": -12.710171699523926, "global_step": 492822, "epoch": 2933} {"train_loss": -12.974662780761719, "global_step": 492823, "epoch": 2933} {"train_loss": -12.626911163330078, "global_step": 492824, "epoch": 2933} {"train_loss": -12.848650932312012, "global_step": 492825, "epoch": 2933} {"train_loss": -12.878507614135742, "global_step": 492826, "epoch": 2933} {"train_loss": -12.857666969299316, "global_step": 492827, "epoch": 2933} {"train_loss": -13.116914749145508, "global_step": 492828, "epoch": 2933} {"train_loss": -12.346193313598633, "global_step": 492829, "epoch": 2933} {"train_loss": -12.331064224243164, "global_step": 492830, "epoch": 2933} {"train_loss": -12.854389190673828, "global_step": 492831, "epoch": 2933} {"train_loss": -13.113812446594238, "global_step": 492832, "epoch": 2933} {"train_loss": -12.66861343383789, "global_step": 492833, "epoch": 2933} {"train_loss": -12.376548767089844, "global_step": 492834, "epoch": 2933} {"train_loss": -12.895479202270508, "global_step": 492835, "epoch": 2933} {"train_loss": -12.902846336364746, "global_step": 492836, "epoch": 2933} {"train_loss": -12.192602157592773, "global_step": 492837, "epoch": 2933} {"train_loss": -11.698912620544434, "global_step": 492838, "epoch": 2933} {"train_loss": -12.216331481933594, "global_step": 492839, "epoch": 2933} {"train_loss": -12.913549423217773, "global_step": 492840, "epoch": 2933} {"train_loss": -12.545000076293945, "global_step": 492841, "epoch": 2933} {"train_loss": -12.458015441894531, "global_step": 492842, "epoch": 2933} {"train_loss": -12.457366943359375, "global_step": 492843, "epoch": 2933} {"train_loss": -11.346120834350586, "global_step": 492844, "epoch": 2933} {"train_loss": -11.254173278808594, "global_step": 492845, "epoch": 2933} {"train_loss": -12.308859825134277, "global_step": 492846, "epoch": 2933} {"train_loss": -12.149494171142578, "global_step": 492847, "epoch": 2933} {"train_loss": -11.84882926940918, "global_step": 492848, "epoch": 2933} {"train_loss": -11.771028518676758, "global_step": 492849, "epoch": 2933} {"train_loss": -11.576261520385742, "global_step": 492850, "epoch": 2933} {"train_loss": -11.573945045471191, "global_step": 492851, "epoch": 2933} {"train_loss": -11.405949592590332, "global_step": 492852, "epoch": 2933} {"train_loss": -11.32752513885498, "global_step": 492853, "epoch": 2933} {"train_loss": -11.434898376464844, "global_step": 492854, "epoch": 2933} {"train_loss": -12.164775848388672, "global_step": 492855, "epoch": 2933} {"train_loss": -11.165030479431152, "global_step": 492856, "epoch": 2933} {"train_loss": -11.73779582977295, "global_step": 492857, "epoch": 2933} {"train_loss": -11.747474670410156, "global_step": 492858, "epoch": 2933} {"train_loss": -11.809513092041016, "global_step": 492859, "epoch": 2933} {"train_loss": -12.002845764160156, "global_step": 492860, "epoch": 2933} {"train_loss": -12.230175018310547, "global_step": 492861, "epoch": 2933} {"train_loss": -12.095992088317871, "global_step": 492862, "epoch": 2933} {"train_loss": -11.963850021362305, "global_step": 492863, "epoch": 2933} {"train_loss": -12.470468521118164, "global_step": 492864, "epoch": 2933} {"train_loss": -11.046914100646973, "global_step": 492865, "epoch": 2933} {"train_loss": -12.204553604125977, "global_step": 492866, "epoch": 2933} {"train_loss": -10.608025550842285, "global_step": 492867, "epoch": 2933} {"train_loss": -11.322471618652344, "global_step": 492868, "epoch": 2933} {"train_loss": -11.675585746765137, "global_step": 492869, "epoch": 2933} {"train_loss": -11.268804550170898, "global_step": 492870, "epoch": 2933} {"train_loss": -12.297952651977539, "global_step": 492871, "epoch": 2933} {"train_loss": -11.248279571533203, "global_step": 492872, "epoch": 2933} {"train_loss": -12.513838768005371, "global_step": 492873, "epoch": 2933} {"train_loss": -11.890884399414062, "global_step": 492874, "epoch": 2933} {"train_loss": -11.71514892578125, "global_step": 492875, "epoch": 2933} {"train_loss": -12.556506156921387, "global_step": 492876, "epoch": 2933} {"train_loss": -12.407297134399414, "global_step": 492877, "epoch": 2933} {"train_loss": -12.359682083129883, "global_step": 492878, "epoch": 2933} {"train_loss": -12.42689323425293, "global_step": 492879, "epoch": 2933} {"train_loss": -12.315134048461914, "global_step": 492880, "epoch": 2933} {"train_loss": -12.466508865356445, "global_step": 492881, "epoch": 2933} {"train_loss": -12.507162094116211, "global_step": 492882, "epoch": 2933} {"train_loss": -12.149127960205078, "global_step": 492883, "epoch": 2933} {"train_loss": -12.716202735900879, "global_step": 492884, "epoch": 2933} {"train_loss": -12.502646446228027, "global_step": 492885, "epoch": 2933} {"train_loss": -12.414144515991211, "global_step": 492886, "epoch": 2933} {"train_loss": -12.514103889465332, "global_step": 492887, "epoch": 2933} {"train_loss": -12.096879959106445, "global_step": 492888, "epoch": 2933} {"train_loss": -12.51056957244873, "global_step": 492889, "epoch": 2933} {"train_loss": -12.476165771484375, "global_step": 492890, "epoch": 2933} {"train_loss": -12.463678359985352, "global_step": 492891, "epoch": 2933} {"train_loss": -12.415189743041992, "global_step": 492892, "epoch": 2933} {"train_loss": -12.398694038391113, "global_step": 492893, "epoch": 2933} {"train_loss": -12.548802375793457, "global_step": 492894, "epoch": 2933} {"train_loss": -12.555326461791992, "global_step": 492895, "epoch": 2933} {"train_loss": -12.745985984802246, "global_step": 492896, "epoch": 2933} {"train_loss": -12.485584259033203, "global_step": 492897, "epoch": 2933} {"train_loss": -12.627599716186523, "global_step": 492898, "epoch": 2933} {"train_loss": -12.47725772857666, "global_step": 492899, "epoch": 2933} {"train_loss": -12.813653945922852, "global_step": 492900, "epoch": 2933} {"train_loss": -12.410040855407715, "global_step": 492901, "epoch": 2933} {"train_loss": -12.725749015808105, "global_step": 492902, "epoch": 2933} {"train_loss": -12.509052276611328, "global_step": 492903, "epoch": 2933} {"train_loss": -12.736180305480957, "global_step": 492904, "epoch": 2933} {"train_loss": -12.872583389282227, "global_step": 492905, "epoch": 2933} {"train_loss": -12.571571350097656, "global_step": 492906, "epoch": 2933} {"train_loss": -12.614825248718262, "global_step": 492907, "epoch": 2933} {"train_loss": -12.286988258361816, "global_step": 492908, "epoch": 2933} {"train_loss": -12.52505111694336, "global_step": 492909, "epoch": 2933} {"train_loss": -12.534891128540039, "global_step": 492910, "epoch": 2933} {"train_loss": -12.237479283696128, "global_step": 492911, "epoch": 2933, "val_loss": 318692.6875} {"train_loss": -12.774824142456055, "global_step": 492912, "epoch": 2934} {"train_loss": -12.912067413330078, "global_step": 492913, "epoch": 2934} {"train_loss": -12.692447662353516, "global_step": 492914, "epoch": 2934} {"train_loss": -12.79447078704834, "global_step": 492915, "epoch": 2934} {"train_loss": -12.787313461303711, "global_step": 492916, "epoch": 2934} {"train_loss": -12.915705680847168, "global_step": 492917, "epoch": 2934} {"train_loss": -12.7374906539917, "global_step": 492918, "epoch": 2934} {"train_loss": -12.800130844116211, "global_step": 492919, "epoch": 2934} {"train_loss": -12.415390014648438, "global_step": 492920, "epoch": 2934} {"train_loss": -12.470892906188965, "global_step": 492921, "epoch": 2934} {"train_loss": -12.711896896362305, "global_step": 492922, "epoch": 2934} {"train_loss": -12.582694053649902, "global_step": 492923, "epoch": 2934} {"train_loss": -12.584857940673828, "global_step": 492924, "epoch": 2934} {"train_loss": -12.793932914733887, "global_step": 492925, "epoch": 2934} {"train_loss": -12.784597396850586, "global_step": 492926, "epoch": 2934} {"train_loss": -12.963319778442383, "global_step": 492927, "epoch": 2934} {"train_loss": -12.7576904296875, "global_step": 492928, "epoch": 2934} {"train_loss": -12.76451587677002, "global_step": 492929, "epoch": 2934} {"train_loss": -12.662155151367188, "global_step": 492930, "epoch": 2934} {"train_loss": -12.990139961242676, "global_step": 492931, "epoch": 2934} {"train_loss": -13.1036376953125, "global_step": 492932, "epoch": 2934} {"train_loss": -12.686824798583984, "global_step": 492933, "epoch": 2934} {"train_loss": -13.008073806762695, "global_step": 492934, "epoch": 2934} {"train_loss": -13.044525146484375, "global_step": 492935, "epoch": 2934} {"train_loss": -12.870513916015625, "global_step": 492936, "epoch": 2934} {"train_loss": -12.8745698928833, "global_step": 492937, "epoch": 2934} {"train_loss": -12.910264015197754, "global_step": 492938, "epoch": 2934} {"train_loss": -13.08064079284668, "global_step": 492939, "epoch": 2934} {"train_loss": -13.090019226074219, "global_step": 492940, "epoch": 2934} {"train_loss": -13.003170013427734, "global_step": 492941, "epoch": 2934} {"train_loss": -12.927691459655762, "global_step": 492942, "epoch": 2934} {"train_loss": -13.084184646606445, "global_step": 492943, "epoch": 2934} {"train_loss": -13.224172592163086, "global_step": 492944, "epoch": 2934} {"train_loss": -13.167779922485352, "global_step": 492945, "epoch": 2934} {"train_loss": -12.964139938354492, "global_step": 492946, "epoch": 2934} {"train_loss": -12.942468643188477, "global_step": 492947, "epoch": 2934} {"train_loss": -12.902029037475586, "global_step": 492948, "epoch": 2934} {"train_loss": -13.019369125366211, "global_step": 492949, "epoch": 2934} {"train_loss": -12.928852081298828, "global_step": 492950, "epoch": 2934} {"train_loss": -12.836115837097168, "global_step": 492951, "epoch": 2934} {"train_loss": -12.639592170715332, "global_step": 492952, "epoch": 2934} {"train_loss": -12.978659629821777, "global_step": 492953, "epoch": 2934} {"train_loss": -12.954324722290039, "global_step": 492954, "epoch": 2934} {"train_loss": -12.990318298339844, "global_step": 492955, "epoch": 2934} {"train_loss": -12.761213302612305, "global_step": 492956, "epoch": 2934} {"train_loss": -12.459894180297852, "global_step": 492957, "epoch": 2934} {"train_loss": -12.594528198242188, "global_step": 492958, "epoch": 2934} {"train_loss": -12.84563159942627, "global_step": 492959, "epoch": 2934} {"train_loss": -12.290494918823242, "global_step": 492960, "epoch": 2934} {"train_loss": -10.926701545715332, "global_step": 492961, "epoch": 2934} {"train_loss": -11.130224227905273, "global_step": 492962, "epoch": 2934} {"train_loss": -12.526447296142578, "global_step": 492963, "epoch": 2934} {"train_loss": -11.515165328979492, "global_step": 492964, "epoch": 2934} {"train_loss": -12.530250549316406, "global_step": 492965, "epoch": 2934} {"train_loss": -11.431734085083008, "global_step": 492966, "epoch": 2934} {"train_loss": -12.771907806396484, "global_step": 492967, "epoch": 2934} {"train_loss": -12.582942962646484, "global_step": 492968, "epoch": 2934} {"train_loss": -12.634830474853516, "global_step": 492969, "epoch": 2934} {"train_loss": -12.299633026123047, "global_step": 492970, "epoch": 2934} {"train_loss": -12.665796279907227, "global_step": 492971, "epoch": 2934} {"train_loss": -12.029683113098145, "global_step": 492972, "epoch": 2934} {"train_loss": -12.052104949951172, "global_step": 492973, "epoch": 2934} {"train_loss": -11.444652557373047, "global_step": 492974, "epoch": 2934} {"train_loss": -11.465673446655273, "global_step": 492975, "epoch": 2934} {"train_loss": -11.673354148864746, "global_step": 492976, "epoch": 2934} {"train_loss": -12.49019718170166, "global_step": 492977, "epoch": 2934} {"train_loss": -10.758018493652344, "global_step": 492978, "epoch": 2934} {"train_loss": -11.817169189453125, "global_step": 492979, "epoch": 2934} {"train_loss": -8.096561431884766, "global_step": 492980, "epoch": 2934} {"train_loss": -8.617034912109375, "global_step": 492981, "epoch": 2934} {"train_loss": -9.816947937011719, "global_step": 492982, "epoch": 2934} {"train_loss": -8.827866554260254, "global_step": 492983, "epoch": 2934} {"train_loss": -8.646063804626465, "global_step": 492984, "epoch": 2934} {"train_loss": -9.997314453125, "global_step": 492985, "epoch": 2934} {"train_loss": -9.912704467773438, "global_step": 492986, "epoch": 2934} {"train_loss": -7.858699798583984, "global_step": 492987, "epoch": 2934} {"train_loss": -9.535993576049805, "global_step": 492988, "epoch": 2934} {"train_loss": -8.377485275268555, "global_step": 492989, "epoch": 2934} {"train_loss": -8.598615646362305, "global_step": 492990, "epoch": 2934} {"train_loss": -8.074949264526367, "global_step": 492991, "epoch": 2934} {"train_loss": -8.541903495788574, "global_step": 492992, "epoch": 2934} {"train_loss": -10.370027542114258, "global_step": 492993, "epoch": 2934} {"train_loss": -10.295469284057617, "global_step": 492994, "epoch": 2934} {"train_loss": -9.847146987915039, "global_step": 492995, "epoch": 2934} {"train_loss": -9.74513053894043, "global_step": 492996, "epoch": 2934} {"train_loss": -11.287321090698242, "global_step": 492997, "epoch": 2934} {"train_loss": -10.152978897094727, "global_step": 492998, "epoch": 2934} {"train_loss": -11.113426208496094, "global_step": 492999, "epoch": 2934} {"train_loss": -11.134370803833008, "global_step": 493000, "epoch": 2934} {"train_loss": -10.558528900146484, "global_step": 493001, "epoch": 2934} {"train_loss": -11.278383255004883, "global_step": 493002, "epoch": 2934} {"train_loss": -10.447012901306152, "global_step": 493003, "epoch": 2934} {"train_loss": -10.508448600769043, "global_step": 493004, "epoch": 2934} {"train_loss": -11.646791458129883, "global_step": 493005, "epoch": 2934} {"train_loss": -11.696038246154785, "global_step": 493006, "epoch": 2934} {"train_loss": -10.837522506713867, "global_step": 493007, "epoch": 2934} {"train_loss": -11.79085922241211, "global_step": 493008, "epoch": 2934} {"train_loss": -11.025801658630371, "global_step": 493009, "epoch": 2934} {"train_loss": -11.044330596923828, "global_step": 493010, "epoch": 2934} {"train_loss": -11.978126525878906, "global_step": 493011, "epoch": 2934} {"train_loss": -11.061960220336914, "global_step": 493012, "epoch": 2934} {"train_loss": -11.75780963897705, "global_step": 493013, "epoch": 2934} {"train_loss": -11.770307540893555, "global_step": 493014, "epoch": 2934} {"train_loss": -10.923734664916992, "global_step": 493015, "epoch": 2934} {"train_loss": -11.434181213378906, "global_step": 493016, "epoch": 2934} {"train_loss": -11.454584121704102, "global_step": 493017, "epoch": 2934} {"train_loss": -11.387198448181152, "global_step": 493018, "epoch": 2934} {"train_loss": -11.983798027038574, "global_step": 493019, "epoch": 2934} {"train_loss": -11.430822372436523, "global_step": 493020, "epoch": 2934} {"train_loss": -12.308893203735352, "global_step": 493021, "epoch": 2934} {"train_loss": -11.72750473022461, "global_step": 493022, "epoch": 2934} {"train_loss": -11.58658218383789, "global_step": 493023, "epoch": 2934} {"train_loss": -11.816150665283203, "global_step": 493024, "epoch": 2934} {"train_loss": -11.258169174194336, "global_step": 493025, "epoch": 2934} {"train_loss": -11.84017276763916, "global_step": 493026, "epoch": 2934} {"train_loss": -11.898818969726562, "global_step": 493027, "epoch": 2934} {"train_loss": -12.125126838684082, "global_step": 493028, "epoch": 2934} {"train_loss": -12.007619857788086, "global_step": 493029, "epoch": 2934} {"train_loss": -12.34756851196289, "global_step": 493030, "epoch": 2934} {"train_loss": -11.591156959533691, "global_step": 493031, "epoch": 2934} {"train_loss": -12.293723106384277, "global_step": 493032, "epoch": 2934} {"train_loss": -12.269694328308105, "global_step": 493033, "epoch": 2934} {"train_loss": -12.092305183410645, "global_step": 493034, "epoch": 2934} {"train_loss": -12.404091835021973, "global_step": 493035, "epoch": 2934} {"train_loss": -12.152734756469727, "global_step": 493036, "epoch": 2934} {"train_loss": -12.410050392150879, "global_step": 493037, "epoch": 2934} {"train_loss": -12.078432083129883, "global_step": 493038, "epoch": 2934} {"train_loss": -12.47872543334961, "global_step": 493039, "epoch": 2934} {"train_loss": -12.358863830566406, "global_step": 493040, "epoch": 2934} {"train_loss": -12.359248161315918, "global_step": 493041, "epoch": 2934} {"train_loss": -12.379682540893555, "global_step": 493042, "epoch": 2934} {"train_loss": -12.625038146972656, "global_step": 493043, "epoch": 2934} {"train_loss": -12.519330978393555, "global_step": 493044, "epoch": 2934} {"train_loss": -12.547690391540527, "global_step": 493045, "epoch": 2934} {"train_loss": -12.331228256225586, "global_step": 493046, "epoch": 2934} {"train_loss": -12.332160949707031, "global_step": 493047, "epoch": 2934} {"train_loss": -12.519291877746582, "global_step": 493048, "epoch": 2934} {"train_loss": -12.507970809936523, "global_step": 493049, "epoch": 2934} {"train_loss": -12.614869117736816, "global_step": 493050, "epoch": 2934} {"train_loss": -12.788507461547852, "global_step": 493051, "epoch": 2934} {"train_loss": -12.622589111328125, "global_step": 493052, "epoch": 2934} {"train_loss": -12.626361846923828, "global_step": 493053, "epoch": 2934} {"train_loss": -12.22054386138916, "global_step": 493054, "epoch": 2934} {"train_loss": -12.710247039794922, "global_step": 493055, "epoch": 2934} {"train_loss": -12.352615356445312, "global_step": 493056, "epoch": 2934} {"train_loss": -12.599613189697266, "global_step": 493057, "epoch": 2934} {"train_loss": -12.328252792358398, "global_step": 493058, "epoch": 2934} {"train_loss": -12.252851486206055, "global_step": 493059, "epoch": 2934} {"train_loss": -11.986047744750977, "global_step": 493060, "epoch": 2934} {"train_loss": -12.448309898376465, "global_step": 493061, "epoch": 2934} {"train_loss": -11.92722225189209, "global_step": 493062, "epoch": 2934} {"train_loss": -12.725135803222656, "global_step": 493063, "epoch": 2934} {"train_loss": -11.485627174377441, "global_step": 493064, "epoch": 2934} {"train_loss": -12.092945098876953, "global_step": 493065, "epoch": 2934} {"train_loss": -12.37771224975586, "global_step": 493066, "epoch": 2934} {"train_loss": -12.1581392288208, "global_step": 493067, "epoch": 2934} {"train_loss": -12.586103439331055, "global_step": 493068, "epoch": 2934} {"train_loss": -12.164558410644531, "global_step": 493069, "epoch": 2934} {"train_loss": -11.64719295501709, "global_step": 493070, "epoch": 2934} {"train_loss": -12.549066543579102, "global_step": 493071, "epoch": 2934} {"train_loss": -11.261320114135742, "global_step": 493072, "epoch": 2934} {"train_loss": -12.13412857055664, "global_step": 493073, "epoch": 2934} {"train_loss": -11.753658294677734, "global_step": 493074, "epoch": 2934} {"train_loss": -10.540755271911621, "global_step": 493075, "epoch": 2934} {"train_loss": -11.589154243469238, "global_step": 493076, "epoch": 2934} {"train_loss": -10.039560317993164, "global_step": 493077, "epoch": 2934} {"train_loss": -11.873605728149414, "global_step": 493078, "epoch": 2934} {"train_loss": -11.8642144714083, "global_step": 493079, "epoch": 2934, "val_loss": 315081.0625} {"train_loss": -10.52806282043457, "global_step": 493080, "epoch": 2935} {"train_loss": -9.392355918884277, "global_step": 493081, "epoch": 2935} {"train_loss": -9.799514770507812, "global_step": 493082, "epoch": 2935} {"train_loss": -10.072858810424805, "global_step": 493083, "epoch": 2935} {"train_loss": -9.823604583740234, "global_step": 493084, "epoch": 2935} {"train_loss": -9.546045303344727, "global_step": 493085, "epoch": 2935} {"train_loss": -9.631465911865234, "global_step": 493086, "epoch": 2935} {"train_loss": -11.15647029876709, "global_step": 493087, "epoch": 2935} {"train_loss": -10.130292892456055, "global_step": 493088, "epoch": 2935} {"train_loss": -10.956024169921875, "global_step": 493089, "epoch": 2935} {"train_loss": -11.243791580200195, "global_step": 493090, "epoch": 2935} {"train_loss": -10.975059509277344, "global_step": 493091, "epoch": 2935} {"train_loss": -11.746304512023926, "global_step": 493092, "epoch": 2935} {"train_loss": -11.533323287963867, "global_step": 493093, "epoch": 2935} {"train_loss": -11.634958267211914, "global_step": 493094, "epoch": 2935} {"train_loss": -11.714801788330078, "global_step": 493095, "epoch": 2935} {"train_loss": -11.961603164672852, "global_step": 493096, "epoch": 2935} {"train_loss": -11.547070503234863, "global_step": 493097, "epoch": 2935} {"train_loss": -12.155647277832031, "global_step": 493098, "epoch": 2935} {"train_loss": -11.806662559509277, "global_step": 493099, "epoch": 2935} {"train_loss": -11.818864822387695, "global_step": 493100, "epoch": 2935} {"train_loss": -12.115287780761719, "global_step": 493101, "epoch": 2935} {"train_loss": -11.908917427062988, "global_step": 493102, "epoch": 2935} {"train_loss": -12.135080337524414, "global_step": 493103, "epoch": 2935} {"train_loss": -12.036787033081055, "global_step": 493104, "epoch": 2935} {"train_loss": -11.949274063110352, "global_step": 493105, "epoch": 2935} {"train_loss": -12.21390151977539, "global_step": 493106, "epoch": 2935} {"train_loss": -12.307512283325195, "global_step": 493107, "epoch": 2935} {"train_loss": -12.251880645751953, "global_step": 493108, "epoch": 2935} {"train_loss": -12.316812515258789, "global_step": 493109, "epoch": 2935} {"train_loss": -12.230376243591309, "global_step": 493110, "epoch": 2935} {"train_loss": -12.356792449951172, "global_step": 493111, "epoch": 2935} {"train_loss": -12.364760398864746, "global_step": 493112, "epoch": 2935} {"train_loss": -12.649295806884766, "global_step": 493113, "epoch": 2935} {"train_loss": -12.231634140014648, "global_step": 493114, "epoch": 2935} {"train_loss": -12.242684364318848, "global_step": 493115, "epoch": 2935} {"train_loss": -12.340856552124023, "global_step": 493116, "epoch": 2935} {"train_loss": -12.332497596740723, "global_step": 493117, "epoch": 2935} {"train_loss": -12.478974342346191, "global_step": 493118, "epoch": 2935} {"train_loss": -12.430171966552734, "global_step": 493119, "epoch": 2935} {"train_loss": -12.461103439331055, "global_step": 493120, "epoch": 2935} {"train_loss": -12.304033279418945, "global_step": 493121, "epoch": 2935} {"train_loss": -12.721426963806152, "global_step": 493122, "epoch": 2935} {"train_loss": -12.588414192199707, "global_step": 493123, "epoch": 2935} {"train_loss": -12.713704109191895, "global_step": 493124, "epoch": 2935} {"train_loss": -12.719478607177734, "global_step": 493125, "epoch": 2935} {"train_loss": -12.731046676635742, "global_step": 493126, "epoch": 2935} {"train_loss": -12.737154006958008, "global_step": 493127, "epoch": 2935} {"train_loss": -12.512370109558105, "global_step": 493128, "epoch": 2935} {"train_loss": -12.673530578613281, "global_step": 493129, "epoch": 2935} {"train_loss": -12.762605667114258, "global_step": 493130, "epoch": 2935} {"train_loss": -12.679672241210938, "global_step": 493131, "epoch": 2935} {"train_loss": -12.835833549499512, "global_step": 493132, "epoch": 2935} {"train_loss": -12.657472610473633, "global_step": 493133, "epoch": 2935} {"train_loss": -12.701000213623047, "global_step": 493134, "epoch": 2935} {"train_loss": -12.683198928833008, "global_step": 493135, "epoch": 2935} {"train_loss": -12.81309700012207, "global_step": 493136, "epoch": 2935} {"train_loss": -12.627412796020508, "global_step": 493137, "epoch": 2935} {"train_loss": -12.759921073913574, "global_step": 493138, "epoch": 2935} {"train_loss": -12.833351135253906, "global_step": 493139, "epoch": 2935} {"train_loss": -12.810689926147461, "global_step": 493140, "epoch": 2935} {"train_loss": -12.627740859985352, "global_step": 493141, "epoch": 2935} {"train_loss": -12.724102020263672, "global_step": 493142, "epoch": 2935} {"train_loss": -12.602362632751465, "global_step": 493143, "epoch": 2935} {"train_loss": -12.920570373535156, "global_step": 493144, "epoch": 2935} {"train_loss": -12.657390594482422, "global_step": 493145, "epoch": 2935} {"train_loss": -13.001860618591309, "global_step": 493146, "epoch": 2935} {"train_loss": -12.759061813354492, "global_step": 493147, "epoch": 2935} {"train_loss": -12.72334098815918, "global_step": 493148, "epoch": 2935} {"train_loss": -12.606507301330566, "global_step": 493149, "epoch": 2935} {"train_loss": -12.733270645141602, "global_step": 493150, "epoch": 2935} {"train_loss": -12.71898365020752, "global_step": 493151, "epoch": 2935} {"train_loss": -12.763021469116211, "global_step": 493152, "epoch": 2935} {"train_loss": -12.714348793029785, "global_step": 493153, "epoch": 2935} {"train_loss": -12.706653594970703, "global_step": 493154, "epoch": 2935} {"train_loss": -12.725834846496582, "global_step": 493155, "epoch": 2935} {"train_loss": -12.923637390136719, "global_step": 493156, "epoch": 2935} {"train_loss": -12.912508010864258, "global_step": 493157, "epoch": 2935} {"train_loss": -12.695332527160645, "global_step": 493158, "epoch": 2935} {"train_loss": -12.917863845825195, "global_step": 493159, "epoch": 2935} {"train_loss": -12.981170654296875, "global_step": 493160, "epoch": 2935} {"train_loss": -12.978696823120117, "global_step": 493161, "epoch": 2935} {"train_loss": -12.929183959960938, "global_step": 493162, "epoch": 2935} {"train_loss": -12.778746604919434, "global_step": 493163, "epoch": 2935} {"train_loss": -13.012899398803711, "global_step": 493164, "epoch": 2935} {"train_loss": -13.001993179321289, "global_step": 493165, "epoch": 2935} {"train_loss": -12.960697174072266, "global_step": 493166, "epoch": 2935} {"train_loss": -12.931417465209961, "global_step": 493167, "epoch": 2935} {"train_loss": -13.0082368850708, "global_step": 493168, "epoch": 2935} {"train_loss": -12.955781936645508, "global_step": 493169, "epoch": 2935} {"train_loss": -13.028804779052734, "global_step": 493170, "epoch": 2935} {"train_loss": -12.91762638092041, "global_step": 493171, "epoch": 2935} {"train_loss": -13.058738708496094, "global_step": 493172, "epoch": 2935} {"train_loss": -12.975271224975586, "global_step": 493173, "epoch": 2935} {"train_loss": -12.756957054138184, "global_step": 493174, "epoch": 2935} {"train_loss": -13.075725555419922, "global_step": 493175, "epoch": 2935} {"train_loss": -13.061697006225586, "global_step": 493176, "epoch": 2935} {"train_loss": -12.525676727294922, "global_step": 493177, "epoch": 2935} {"train_loss": -12.618436813354492, "global_step": 493178, "epoch": 2935} {"train_loss": -13.015069961547852, "global_step": 493179, "epoch": 2935} {"train_loss": -12.413541793823242, "global_step": 493180, "epoch": 2935} {"train_loss": -12.799663543701172, "global_step": 493181, "epoch": 2935} {"train_loss": -12.276567459106445, "global_step": 493182, "epoch": 2935} {"train_loss": -12.68321418762207, "global_step": 493183, "epoch": 2935} {"train_loss": -12.788776397705078, "global_step": 493184, "epoch": 2935} {"train_loss": -12.60383129119873, "global_step": 493185, "epoch": 2935} {"train_loss": -12.534845352172852, "global_step": 493186, "epoch": 2935} {"train_loss": -12.927980422973633, "global_step": 493187, "epoch": 2935} {"train_loss": -12.938227653503418, "global_step": 493188, "epoch": 2935} {"train_loss": -12.278608322143555, "global_step": 493189, "epoch": 2935} {"train_loss": -12.242295265197754, "global_step": 493190, "epoch": 2935} {"train_loss": -12.680137634277344, "global_step": 493191, "epoch": 2935} {"train_loss": -12.431482315063477, "global_step": 493192, "epoch": 2935} {"train_loss": -12.933525085449219, "global_step": 493193, "epoch": 2935} {"train_loss": -12.752511024475098, "global_step": 493194, "epoch": 2935} {"train_loss": -12.8908109664917, "global_step": 493195, "epoch": 2935} {"train_loss": -12.834094047546387, "global_step": 493196, "epoch": 2935} {"train_loss": -12.326303482055664, "global_step": 493197, "epoch": 2935} {"train_loss": -12.00674057006836, "global_step": 493198, "epoch": 2935} {"train_loss": -12.825261116027832, "global_step": 493199, "epoch": 2935} {"train_loss": -12.258901596069336, "global_step": 493200, "epoch": 2935} {"train_loss": -12.270048141479492, "global_step": 493201, "epoch": 2935} {"train_loss": -11.499368667602539, "global_step": 493202, "epoch": 2935} {"train_loss": -10.981280326843262, "global_step": 493203, "epoch": 2935} {"train_loss": -12.36455249786377, "global_step": 493204, "epoch": 2935} {"train_loss": -10.012441635131836, "global_step": 493205, "epoch": 2935} {"train_loss": -12.216238021850586, "global_step": 493206, "epoch": 2935} {"train_loss": -12.089475631713867, "global_step": 493207, "epoch": 2935} {"train_loss": -10.675529479980469, "global_step": 493208, "epoch": 2935} {"train_loss": -11.950946807861328, "global_step": 493209, "epoch": 2935} {"train_loss": -11.281793594360352, "global_step": 493210, "epoch": 2935} {"train_loss": -12.554963111877441, "global_step": 493211, "epoch": 2935} {"train_loss": -10.312902450561523, "global_step": 493212, "epoch": 2935} {"train_loss": -11.71871566772461, "global_step": 493213, "epoch": 2935} {"train_loss": -11.584912300109863, "global_step": 493214, "epoch": 2935} {"train_loss": -10.879205703735352, "global_step": 493215, "epoch": 2935} {"train_loss": -12.084394454956055, "global_step": 493216, "epoch": 2935} {"train_loss": -11.985549926757812, "global_step": 493217, "epoch": 2935} {"train_loss": -12.148392677307129, "global_step": 493218, "epoch": 2935} {"train_loss": -12.13296890258789, "global_step": 493219, "epoch": 2935} {"train_loss": -12.07279109954834, "global_step": 493220, "epoch": 2935} {"train_loss": -12.336503028869629, "global_step": 493221, "epoch": 2935} {"train_loss": -11.91731071472168, "global_step": 493222, "epoch": 2935} {"train_loss": -11.787952423095703, "global_step": 493223, "epoch": 2935} {"train_loss": -12.092988967895508, "global_step": 493224, "epoch": 2935} {"train_loss": -12.460298538208008, "global_step": 493225, "epoch": 2935} {"train_loss": -12.3477783203125, "global_step": 493226, "epoch": 2935} {"train_loss": -12.247940063476562, "global_step": 493227, "epoch": 2935} {"train_loss": -12.414186477661133, "global_step": 493228, "epoch": 2935} {"train_loss": -12.082054138183594, "global_step": 493229, "epoch": 2935} {"train_loss": -12.12997055053711, "global_step": 493230, "epoch": 2935} {"train_loss": -12.150171279907227, "global_step": 493231, "epoch": 2935} {"train_loss": -12.58095932006836, "global_step": 493232, "epoch": 2935} {"train_loss": -12.31351375579834, "global_step": 493233, "epoch": 2935} {"train_loss": -11.814324378967285, "global_step": 493234, "epoch": 2935} {"train_loss": -12.455401420593262, "global_step": 493235, "epoch": 2935} {"train_loss": -12.245445251464844, "global_step": 493236, "epoch": 2935} {"train_loss": -11.970202445983887, "global_step": 493237, "epoch": 2935} {"train_loss": -12.613438606262207, "global_step": 493238, "epoch": 2935} {"train_loss": -12.061481475830078, "global_step": 493239, "epoch": 2935} {"train_loss": -12.402185440063477, "global_step": 493240, "epoch": 2935} {"train_loss": -12.199662208557129, "global_step": 493241, "epoch": 2935} {"train_loss": -11.57155990600586, "global_step": 493242, "epoch": 2935} {"train_loss": -12.219793319702148, "global_step": 493243, "epoch": 2935} {"train_loss": -12.390421867370605, "global_step": 493244, "epoch": 2935} {"train_loss": -12.06982421875, "global_step": 493245, "epoch": 2935} {"train_loss": -11.976259231567383, "global_step": 493246, "epoch": 2935} {"train_loss": -12.240004936854044, "global_step": 493247, "epoch": 2935, "val_loss": 315951.875, "train_action_mse_error": 0.3596646785736084} {"train_loss": -12.331989288330078, "global_step": 493248, "epoch": 2936} {"train_loss": -12.528335571289062, "global_step": 493249, "epoch": 2936} {"train_loss": -12.06258773803711, "global_step": 493250, "epoch": 2936} {"train_loss": -12.78947925567627, "global_step": 493251, "epoch": 2936} {"train_loss": -12.411317825317383, "global_step": 493252, "epoch": 2936} {"train_loss": -12.259597778320312, "global_step": 493253, "epoch": 2936} {"train_loss": -11.539701461791992, "global_step": 493254, "epoch": 2936} {"train_loss": -11.246087074279785, "global_step": 493255, "epoch": 2936} {"train_loss": -11.475383758544922, "global_step": 493256, "epoch": 2936} {"train_loss": -10.398609161376953, "global_step": 493257, "epoch": 2936} {"train_loss": -10.46965217590332, "global_step": 493258, "epoch": 2936} {"train_loss": -10.934948921203613, "global_step": 493259, "epoch": 2936} {"train_loss": -11.027565956115723, "global_step": 493260, "epoch": 2936} {"train_loss": -11.198013305664062, "global_step": 493261, "epoch": 2936} {"train_loss": -9.903349876403809, "global_step": 493262, "epoch": 2936} {"train_loss": -10.672883987426758, "global_step": 493263, "epoch": 2936} {"train_loss": -11.302088737487793, "global_step": 493264, "epoch": 2936} {"train_loss": -11.218875885009766, "global_step": 493265, "epoch": 2936} {"train_loss": -11.229913711547852, "global_step": 493266, "epoch": 2936} {"train_loss": -10.831846237182617, "global_step": 493267, "epoch": 2936} {"train_loss": -11.65880012512207, "global_step": 493268, "epoch": 2936} {"train_loss": -11.704119682312012, "global_step": 493269, "epoch": 2936} {"train_loss": -11.466445922851562, "global_step": 493270, "epoch": 2936} {"train_loss": -11.498454093933105, "global_step": 493271, "epoch": 2936} {"train_loss": -11.078086853027344, "global_step": 493272, "epoch": 2936} {"train_loss": -12.012104034423828, "global_step": 493273, "epoch": 2936} {"train_loss": -11.568975448608398, "global_step": 493274, "epoch": 2936} {"train_loss": -12.445297241210938, "global_step": 493275, "epoch": 2936} {"train_loss": -11.748902320861816, "global_step": 493276, "epoch": 2936} {"train_loss": -12.211462020874023, "global_step": 493277, "epoch": 2936} {"train_loss": -11.56793212890625, "global_step": 493278, "epoch": 2936} {"train_loss": -12.412527084350586, "global_step": 493279, "epoch": 2936} {"train_loss": -12.105932235717773, "global_step": 493280, "epoch": 2936} {"train_loss": -12.080649375915527, "global_step": 493281, "epoch": 2936} {"train_loss": -12.220932006835938, "global_step": 493282, "epoch": 2936} {"train_loss": -12.211631774902344, "global_step": 493283, "epoch": 2936} {"train_loss": -12.239790916442871, "global_step": 493284, "epoch": 2936} {"train_loss": -12.04715347290039, "global_step": 493285, "epoch": 2936} {"train_loss": -12.378403663635254, "global_step": 493286, "epoch": 2936} {"train_loss": -11.942649841308594, "global_step": 493287, "epoch": 2936} {"train_loss": -12.469148635864258, "global_step": 493288, "epoch": 2936} {"train_loss": -12.249395370483398, "global_step": 493289, "epoch": 2936} {"train_loss": -12.210376739501953, "global_step": 493290, "epoch": 2936} {"train_loss": -12.45166301727295, "global_step": 493291, "epoch": 2936} {"train_loss": -12.10938835144043, "global_step": 493292, "epoch": 2936} {"train_loss": -12.624658584594727, "global_step": 493293, "epoch": 2936} {"train_loss": -12.330324172973633, "global_step": 493294, "epoch": 2936} {"train_loss": -12.599809646606445, "global_step": 493295, "epoch": 2936} {"train_loss": -12.517704010009766, "global_step": 493296, "epoch": 2936} {"train_loss": -12.808728218078613, "global_step": 493297, "epoch": 2936} {"train_loss": -12.548624038696289, "global_step": 493298, "epoch": 2936} {"train_loss": -12.487726211547852, "global_step": 493299, "epoch": 2936} {"train_loss": -12.619264602661133, "global_step": 493300, "epoch": 2936} {"train_loss": -12.555854797363281, "global_step": 493301, "epoch": 2936} {"train_loss": -12.689553260803223, "global_step": 493302, "epoch": 2936} {"train_loss": -12.567743301391602, "global_step": 493303, "epoch": 2936} {"train_loss": -12.565274238586426, "global_step": 493304, "epoch": 2936} {"train_loss": -12.613286972045898, "global_step": 493305, "epoch": 2936} {"train_loss": -12.679384231567383, "global_step": 493306, "epoch": 2936} {"train_loss": -12.366973876953125, "global_step": 493307, "epoch": 2936} {"train_loss": -12.437127113342285, "global_step": 493308, "epoch": 2936} {"train_loss": -12.748842239379883, "global_step": 493309, "epoch": 2936} {"train_loss": -12.447373390197754, "global_step": 493310, "epoch": 2936} {"train_loss": -12.787025451660156, "global_step": 493311, "epoch": 2936} {"train_loss": -12.359241485595703, "global_step": 493312, "epoch": 2936} {"train_loss": -12.5379056930542, "global_step": 493313, "epoch": 2936} {"train_loss": -12.772930145263672, "global_step": 493314, "epoch": 2936} {"train_loss": -12.246895790100098, "global_step": 493315, "epoch": 2936} {"train_loss": -12.553515434265137, "global_step": 493316, "epoch": 2936} {"train_loss": -12.754973411560059, "global_step": 493317, "epoch": 2936} {"train_loss": -12.504517555236816, "global_step": 493318, "epoch": 2936} {"train_loss": -12.626930236816406, "global_step": 493319, "epoch": 2936} {"train_loss": -12.6351957321167, "global_step": 493320, "epoch": 2936} {"train_loss": -12.687925338745117, "global_step": 493321, "epoch": 2936} {"train_loss": -12.905643463134766, "global_step": 493322, "epoch": 2936} {"train_loss": -12.753837585449219, "global_step": 493323, "epoch": 2936} {"train_loss": -12.573538780212402, "global_step": 493324, "epoch": 2936} {"train_loss": -12.855745315551758, "global_step": 493325, "epoch": 2936} {"train_loss": -12.938423156738281, "global_step": 493326, "epoch": 2936} {"train_loss": -12.936272621154785, "global_step": 493327, "epoch": 2936} {"train_loss": -13.027718544006348, "global_step": 493328, "epoch": 2936} {"train_loss": -12.917898178100586, "global_step": 493329, "epoch": 2936} {"train_loss": -12.960591316223145, "global_step": 493330, "epoch": 2936} {"train_loss": -12.870368957519531, "global_step": 493331, "epoch": 2936} {"train_loss": -12.716251373291016, "global_step": 493332, "epoch": 2936} {"train_loss": -12.922910690307617, "global_step": 493333, "epoch": 2936} {"train_loss": -13.015979766845703, "global_step": 493334, "epoch": 2936} {"train_loss": -12.853212356567383, "global_step": 493335, "epoch": 2936} {"train_loss": -12.675729751586914, "global_step": 493336, "epoch": 2936} {"train_loss": -12.753369331359863, "global_step": 493337, "epoch": 2936} {"train_loss": -12.837142944335938, "global_step": 493338, "epoch": 2936} {"train_loss": -12.80978775024414, "global_step": 493339, "epoch": 2936} {"train_loss": -12.956110000610352, "global_step": 493340, "epoch": 2936} {"train_loss": -12.601552963256836, "global_step": 493341, "epoch": 2936} {"train_loss": -12.493149757385254, "global_step": 493342, "epoch": 2936} {"train_loss": -12.962503433227539, "global_step": 493343, "epoch": 2936} {"train_loss": -12.53791618347168, "global_step": 493344, "epoch": 2936} {"train_loss": -12.165145874023438, "global_step": 493345, "epoch": 2936} {"train_loss": -12.120441436767578, "global_step": 493346, "epoch": 2936} {"train_loss": -12.72805404663086, "global_step": 493347, "epoch": 2936} {"train_loss": -12.233739852905273, "global_step": 493348, "epoch": 2936} {"train_loss": -11.989096641540527, "global_step": 493349, "epoch": 2936} {"train_loss": -12.286274909973145, "global_step": 493350, "epoch": 2936} {"train_loss": -12.79791259765625, "global_step": 493351, "epoch": 2936} {"train_loss": -12.4518461227417, "global_step": 493352, "epoch": 2936} {"train_loss": -12.623737335205078, "global_step": 493353, "epoch": 2936} {"train_loss": -12.02631950378418, "global_step": 493354, "epoch": 2936} {"train_loss": -11.985151290893555, "global_step": 493355, "epoch": 2936} {"train_loss": -12.693790435791016, "global_step": 493356, "epoch": 2936} {"train_loss": -12.625837326049805, "global_step": 493357, "epoch": 2936} {"train_loss": -12.599201202392578, "global_step": 493358, "epoch": 2936} {"train_loss": -11.79193115234375, "global_step": 493359, "epoch": 2936} {"train_loss": -11.85757064819336, "global_step": 493360, "epoch": 2936} {"train_loss": -12.778907775878906, "global_step": 493361, "epoch": 2936} {"train_loss": -12.306806564331055, "global_step": 493362, "epoch": 2936} {"train_loss": -12.78264331817627, "global_step": 493363, "epoch": 2936} {"train_loss": -11.879950523376465, "global_step": 493364, "epoch": 2936} {"train_loss": -12.78840446472168, "global_step": 493365, "epoch": 2936} {"train_loss": -11.722006797790527, "global_step": 493366, "epoch": 2936} {"train_loss": -11.670144081115723, "global_step": 493367, "epoch": 2936} {"train_loss": -11.726438522338867, "global_step": 493368, "epoch": 2936} {"train_loss": -12.40987777709961, "global_step": 493369, "epoch": 2936} {"train_loss": -11.653411865234375, "global_step": 493370, "epoch": 2936} {"train_loss": -11.908178329467773, "global_step": 493371, "epoch": 2936} {"train_loss": -11.07497501373291, "global_step": 493372, "epoch": 2936} {"train_loss": -12.494396209716797, "global_step": 493373, "epoch": 2936} {"train_loss": -11.610791206359863, "global_step": 493374, "epoch": 2936} {"train_loss": -12.363557815551758, "global_step": 493375, "epoch": 2936} {"train_loss": -11.899234771728516, "global_step": 493376, "epoch": 2936} {"train_loss": -11.825407028198242, "global_step": 493377, "epoch": 2936} {"train_loss": -11.894048690795898, "global_step": 493378, "epoch": 2936} {"train_loss": -12.625123977661133, "global_step": 493379, "epoch": 2936} {"train_loss": -12.005674362182617, "global_step": 493380, "epoch": 2936} {"train_loss": -12.799137115478516, "global_step": 493381, "epoch": 2936} {"train_loss": -12.093561172485352, "global_step": 493382, "epoch": 2936} {"train_loss": -12.038346290588379, "global_step": 493383, "epoch": 2936} {"train_loss": -11.783143997192383, "global_step": 493384, "epoch": 2936} {"train_loss": -12.440780639648438, "global_step": 493385, "epoch": 2936} {"train_loss": -11.42353630065918, "global_step": 493386, "epoch": 2936} {"train_loss": -12.705187797546387, "global_step": 493387, "epoch": 2936} {"train_loss": -11.809427261352539, "global_step": 493388, "epoch": 2936} {"train_loss": -11.981216430664062, "global_step": 493389, "epoch": 2936} {"train_loss": -12.358230590820312, "global_step": 493390, "epoch": 2936} {"train_loss": -12.215082168579102, "global_step": 493391, "epoch": 2936} {"train_loss": -11.200498580932617, "global_step": 493392, "epoch": 2936} {"train_loss": -12.804561614990234, "global_step": 493393, "epoch": 2936} {"train_loss": -9.83301830291748, "global_step": 493394, "epoch": 2936} {"train_loss": -11.663227081298828, "global_step": 493395, "epoch": 2936} {"train_loss": -12.209123611450195, "global_step": 493396, "epoch": 2936} {"train_loss": -11.187564849853516, "global_step": 493397, "epoch": 2936} {"train_loss": -12.719086647033691, "global_step": 493398, "epoch": 2936} {"train_loss": -12.537673950195312, "global_step": 493399, "epoch": 2936} {"train_loss": -12.893657684326172, "global_step": 493400, "epoch": 2936} {"train_loss": -12.743948936462402, "global_step": 493401, "epoch": 2936} {"train_loss": -12.577166557312012, "global_step": 493402, "epoch": 2936} {"train_loss": -12.958243370056152, "global_step": 493403, "epoch": 2936} {"train_loss": -12.844396591186523, "global_step": 493404, "epoch": 2936} {"train_loss": -12.853166580200195, "global_step": 493405, "epoch": 2936} {"train_loss": -12.782757759094238, "global_step": 493406, "epoch": 2936} {"train_loss": -12.832342147827148, "global_step": 493407, "epoch": 2936} {"train_loss": -12.888650894165039, "global_step": 493408, "epoch": 2936} {"train_loss": -12.479499816894531, "global_step": 493409, "epoch": 2936} {"train_loss": -13.08321762084961, "global_step": 493410, "epoch": 2936} {"train_loss": -13.075584411621094, "global_step": 493411, "epoch": 2936} {"train_loss": -12.760269165039062, "global_step": 493412, "epoch": 2936} {"train_loss": -12.751175880432129, "global_step": 493413, "epoch": 2936} {"train_loss": -12.997282028198242, "global_step": 493414, "epoch": 2936} {"train_loss": -12.256479711759658, "global_step": 493415, "epoch": 2936, "val_loss": 318081.65625} {"train_loss": -12.71458625793457, "global_step": 493416, "epoch": 2937} {"train_loss": -12.893209457397461, "global_step": 493417, "epoch": 2937} {"train_loss": -12.97653579711914, "global_step": 493418, "epoch": 2937} {"train_loss": -12.778159141540527, "global_step": 493419, "epoch": 2937} {"train_loss": -12.846925735473633, "global_step": 493420, "epoch": 2937} {"train_loss": -12.808404922485352, "global_step": 493421, "epoch": 2937} {"train_loss": -12.878131866455078, "global_step": 493422, "epoch": 2937} {"train_loss": -12.46536922454834, "global_step": 493423, "epoch": 2937} {"train_loss": -12.831066131591797, "global_step": 493424, "epoch": 2937} {"train_loss": -12.717674255371094, "global_step": 493425, "epoch": 2937} {"train_loss": -12.858617782592773, "global_step": 493426, "epoch": 2937} {"train_loss": -12.79378890991211, "global_step": 493427, "epoch": 2937} {"train_loss": -12.514741897583008, "global_step": 493428, "epoch": 2937} {"train_loss": -12.24077033996582, "global_step": 493429, "epoch": 2937} {"train_loss": -12.747859954833984, "global_step": 493430, "epoch": 2937} {"train_loss": -12.550701141357422, "global_step": 493431, "epoch": 2937} {"train_loss": -11.696660995483398, "global_step": 493432, "epoch": 2937} {"train_loss": -12.782809257507324, "global_step": 493433, "epoch": 2937} {"train_loss": -12.680997848510742, "global_step": 493434, "epoch": 2937} {"train_loss": -12.575346946716309, "global_step": 493435, "epoch": 2937} {"train_loss": -12.854347229003906, "global_step": 493436, "epoch": 2937} {"train_loss": -12.765204429626465, "global_step": 493437, "epoch": 2937} {"train_loss": -12.847491264343262, "global_step": 493438, "epoch": 2937} {"train_loss": -12.898055076599121, "global_step": 493439, "epoch": 2937} {"train_loss": -12.420571327209473, "global_step": 493440, "epoch": 2937} {"train_loss": -12.801575660705566, "global_step": 493441, "epoch": 2937} {"train_loss": -12.828118324279785, "global_step": 493442, "epoch": 2937} {"train_loss": -12.888988494873047, "global_step": 493443, "epoch": 2937} {"train_loss": -12.846919059753418, "global_step": 493444, "epoch": 2937} {"train_loss": -12.565886497497559, "global_step": 493445, "epoch": 2937} {"train_loss": -12.931137084960938, "global_step": 493446, "epoch": 2937} {"train_loss": -12.853557586669922, "global_step": 493447, "epoch": 2937} {"train_loss": -12.921411514282227, "global_step": 493448, "epoch": 2937} {"train_loss": -12.527997016906738, "global_step": 493449, "epoch": 2937} {"train_loss": -12.852339744567871, "global_step": 493450, "epoch": 2937} {"train_loss": -12.411470413208008, "global_step": 493451, "epoch": 2937} {"train_loss": -12.449142456054688, "global_step": 493452, "epoch": 2937} {"train_loss": -12.34001350402832, "global_step": 493453, "epoch": 2937} {"train_loss": -12.96825122833252, "global_step": 493454, "epoch": 2937} {"train_loss": -12.809728622436523, "global_step": 493455, "epoch": 2937} {"train_loss": -12.43114185333252, "global_step": 493456, "epoch": 2937} {"train_loss": -12.661324501037598, "global_step": 493457, "epoch": 2937} {"train_loss": -12.679889678955078, "global_step": 493458, "epoch": 2937} {"train_loss": -12.414588928222656, "global_step": 493459, "epoch": 2937} {"train_loss": -12.410143852233887, "global_step": 493460, "epoch": 2937} {"train_loss": -12.913407325744629, "global_step": 493461, "epoch": 2937} {"train_loss": -12.800859451293945, "global_step": 493462, "epoch": 2937} {"train_loss": -12.636171340942383, "global_step": 493463, "epoch": 2937} {"train_loss": -11.59730052947998, "global_step": 493464, "epoch": 2937} {"train_loss": -12.102048873901367, "global_step": 493465, "epoch": 2937} {"train_loss": -12.309736251831055, "global_step": 493466, "epoch": 2937} {"train_loss": -12.403199195861816, "global_step": 493467, "epoch": 2937} {"train_loss": -11.729185104370117, "global_step": 493468, "epoch": 2937} {"train_loss": -12.354029655456543, "global_step": 493469, "epoch": 2937} {"train_loss": -11.525606155395508, "global_step": 493470, "epoch": 2937} {"train_loss": -11.996526718139648, "global_step": 493471, "epoch": 2937} {"train_loss": -11.74302864074707, "global_step": 493472, "epoch": 2937} {"train_loss": -12.067790985107422, "global_step": 493473, "epoch": 2937} {"train_loss": -12.050853729248047, "global_step": 493474, "epoch": 2937} {"train_loss": -10.628904342651367, "global_step": 493475, "epoch": 2937} {"train_loss": -12.029128074645996, "global_step": 493476, "epoch": 2937} {"train_loss": -11.195935249328613, "global_step": 493477, "epoch": 2937} {"train_loss": -12.361882209777832, "global_step": 493478, "epoch": 2937} {"train_loss": -11.595620155334473, "global_step": 493479, "epoch": 2937} {"train_loss": -12.044453620910645, "global_step": 493480, "epoch": 2937} {"train_loss": -12.303808212280273, "global_step": 493481, "epoch": 2937} {"train_loss": -12.305329322814941, "global_step": 493482, "epoch": 2937} {"train_loss": -11.087508201599121, "global_step": 493483, "epoch": 2937} {"train_loss": -11.175697326660156, "global_step": 493484, "epoch": 2937} {"train_loss": -11.450637817382812, "global_step": 493485, "epoch": 2937} {"train_loss": -11.530912399291992, "global_step": 493486, "epoch": 2937} {"train_loss": -11.299257278442383, "global_step": 493487, "epoch": 2937} {"train_loss": -10.609090805053711, "global_step": 493488, "epoch": 2937} {"train_loss": -9.607660293579102, "global_step": 493489, "epoch": 2937} {"train_loss": -11.693852424621582, "global_step": 493490, "epoch": 2937} {"train_loss": -11.134119033813477, "global_step": 493491, "epoch": 2937} {"train_loss": -11.30026626586914, "global_step": 493492, "epoch": 2937} {"train_loss": -11.84323501586914, "global_step": 493493, "epoch": 2937} {"train_loss": -11.203157424926758, "global_step": 493494, "epoch": 2937} {"train_loss": -10.178293228149414, "global_step": 493495, "epoch": 2937} {"train_loss": -11.602432250976562, "global_step": 493496, "epoch": 2937} {"train_loss": -10.899787902832031, "global_step": 493497, "epoch": 2937} {"train_loss": -11.585972785949707, "global_step": 493498, "epoch": 2937} {"train_loss": -10.70077133178711, "global_step": 493499, "epoch": 2937} {"train_loss": -11.584851264953613, "global_step": 493500, "epoch": 2937} {"train_loss": -10.822656631469727, "global_step": 493501, "epoch": 2937} {"train_loss": -11.600105285644531, "global_step": 493502, "epoch": 2937} {"train_loss": -11.086795806884766, "global_step": 493503, "epoch": 2937} {"train_loss": -11.213479995727539, "global_step": 493504, "epoch": 2937} {"train_loss": -11.874031066894531, "global_step": 493505, "epoch": 2937} {"train_loss": -11.634979248046875, "global_step": 493506, "epoch": 2937} {"train_loss": -12.279325485229492, "global_step": 493507, "epoch": 2937} {"train_loss": -11.560762405395508, "global_step": 493508, "epoch": 2937} {"train_loss": -12.171797752380371, "global_step": 493509, "epoch": 2937} {"train_loss": -11.911077499389648, "global_step": 493510, "epoch": 2937} {"train_loss": -12.345422744750977, "global_step": 493511, "epoch": 2937} {"train_loss": -11.701519012451172, "global_step": 493512, "epoch": 2937} {"train_loss": -12.549853324890137, "global_step": 493513, "epoch": 2937} {"train_loss": -12.073339462280273, "global_step": 493514, "epoch": 2937} {"train_loss": -12.506317138671875, "global_step": 493515, "epoch": 2937} {"train_loss": -12.330862045288086, "global_step": 493516, "epoch": 2937} {"train_loss": -12.190473556518555, "global_step": 493517, "epoch": 2937} {"train_loss": -12.13779067993164, "global_step": 493518, "epoch": 2937} {"train_loss": -12.243621826171875, "global_step": 493519, "epoch": 2937} {"train_loss": -12.129941940307617, "global_step": 493520, "epoch": 2937} {"train_loss": -12.105874061584473, "global_step": 493521, "epoch": 2937} {"train_loss": -11.831388473510742, "global_step": 493522, "epoch": 2937} {"train_loss": -12.151687622070312, "global_step": 493523, "epoch": 2937} {"train_loss": -12.042242050170898, "global_step": 493524, "epoch": 2937} {"train_loss": -12.019866943359375, "global_step": 493525, "epoch": 2937} {"train_loss": -12.538286209106445, "global_step": 493526, "epoch": 2937} {"train_loss": -12.142433166503906, "global_step": 493527, "epoch": 2937} {"train_loss": -12.43644905090332, "global_step": 493528, "epoch": 2937} {"train_loss": -12.361274719238281, "global_step": 493529, "epoch": 2937} {"train_loss": -12.31404972076416, "global_step": 493530, "epoch": 2937} {"train_loss": -12.409465789794922, "global_step": 493531, "epoch": 2937} {"train_loss": -12.490883827209473, "global_step": 493532, "epoch": 2937} {"train_loss": -12.198009490966797, "global_step": 493533, "epoch": 2937} {"train_loss": -12.711356163024902, "global_step": 493534, "epoch": 2937} {"train_loss": -12.653349876403809, "global_step": 493535, "epoch": 2937} {"train_loss": -12.578822135925293, "global_step": 493536, "epoch": 2937} {"train_loss": -12.737274169921875, "global_step": 493537, "epoch": 2937} {"train_loss": -12.949859619140625, "global_step": 493538, "epoch": 2937} {"train_loss": -12.682146072387695, "global_step": 493539, "epoch": 2937} {"train_loss": -12.746545791625977, "global_step": 493540, "epoch": 2937} {"train_loss": -12.7064208984375, "global_step": 493541, "epoch": 2937} {"train_loss": -12.773289680480957, "global_step": 493542, "epoch": 2937} {"train_loss": -12.729978561401367, "global_step": 493543, "epoch": 2937} {"train_loss": -12.392525672912598, "global_step": 493544, "epoch": 2937} {"train_loss": -12.718481063842773, "global_step": 493545, "epoch": 2937} {"train_loss": -12.241537094116211, "global_step": 493546, "epoch": 2937} {"train_loss": -12.551680564880371, "global_step": 493547, "epoch": 2937} {"train_loss": -12.661967277526855, "global_step": 493548, "epoch": 2937} {"train_loss": -12.587554931640625, "global_step": 493549, "epoch": 2937} {"train_loss": -12.6267671585083, "global_step": 493550, "epoch": 2937} {"train_loss": -12.340021133422852, "global_step": 493551, "epoch": 2937} {"train_loss": -12.497274398803711, "global_step": 493552, "epoch": 2937} {"train_loss": -12.11979866027832, "global_step": 493553, "epoch": 2937} {"train_loss": -12.616974830627441, "global_step": 493554, "epoch": 2937} {"train_loss": -12.192044258117676, "global_step": 493555, "epoch": 2937} {"train_loss": -11.869933128356934, "global_step": 493556, "epoch": 2937} {"train_loss": -12.418512344360352, "global_step": 493557, "epoch": 2937} {"train_loss": -12.418611526489258, "global_step": 493558, "epoch": 2937} {"train_loss": -12.399802207946777, "global_step": 493559, "epoch": 2937} {"train_loss": -12.608940124511719, "global_step": 493560, "epoch": 2937} {"train_loss": -12.119556427001953, "global_step": 493561, "epoch": 2937} {"train_loss": -12.083486557006836, "global_step": 493562, "epoch": 2937} {"train_loss": -12.42484188079834, "global_step": 493563, "epoch": 2937} {"train_loss": -12.095080375671387, "global_step": 493564, "epoch": 2937} {"train_loss": -11.520841598510742, "global_step": 493565, "epoch": 2937} {"train_loss": -12.49993896484375, "global_step": 493566, "epoch": 2937} {"train_loss": -11.343384742736816, "global_step": 493567, "epoch": 2937} {"train_loss": -11.423847198486328, "global_step": 493568, "epoch": 2937} {"train_loss": -12.254498481750488, "global_step": 493569, "epoch": 2937} {"train_loss": -11.252622604370117, "global_step": 493570, "epoch": 2937} {"train_loss": -12.295969009399414, "global_step": 493571, "epoch": 2937} {"train_loss": -10.885490417480469, "global_step": 493572, "epoch": 2937} {"train_loss": -11.759777069091797, "global_step": 493573, "epoch": 2937} {"train_loss": -12.105904579162598, "global_step": 493574, "epoch": 2937} {"train_loss": -11.190858840942383, "global_step": 493575, "epoch": 2937} {"train_loss": -12.374152183532715, "global_step": 493576, "epoch": 2937} {"train_loss": -11.846342086791992, "global_step": 493577, "epoch": 2937} {"train_loss": -12.187097549438477, "global_step": 493578, "epoch": 2937} {"train_loss": -11.604743957519531, "global_step": 493579, "epoch": 2937} {"train_loss": -12.139507293701172, "global_step": 493580, "epoch": 2937} {"train_loss": -12.556333541870117, "global_step": 493581, "epoch": 2937} {"train_loss": -12.113468170166016, "global_step": 493582, "epoch": 2937} {"train_loss": -12.17871295838129, "global_step": 493583, "epoch": 2937, "val_loss": 313281.375} {"train_loss": -11.880657196044922, "global_step": 493584, "epoch": 2938} {"train_loss": -12.175265312194824, "global_step": 493585, "epoch": 2938} {"train_loss": -12.490140914916992, "global_step": 493586, "epoch": 2938} {"train_loss": -12.217409133911133, "global_step": 493587, "epoch": 2938} {"train_loss": -12.581548690795898, "global_step": 493588, "epoch": 2938} {"train_loss": -12.016608238220215, "global_step": 493589, "epoch": 2938} {"train_loss": -12.275556564331055, "global_step": 493590, "epoch": 2938} {"train_loss": -11.855806350708008, "global_step": 493591, "epoch": 2938} {"train_loss": -11.86803150177002, "global_step": 493592, "epoch": 2938} {"train_loss": -12.124481201171875, "global_step": 493593, "epoch": 2938} {"train_loss": -11.53683090209961, "global_step": 493594, "epoch": 2938} {"train_loss": -12.5204439163208, "global_step": 493595, "epoch": 2938} {"train_loss": -12.065120697021484, "global_step": 493596, "epoch": 2938} {"train_loss": -12.021583557128906, "global_step": 493597, "epoch": 2938} {"train_loss": -12.199804306030273, "global_step": 493598, "epoch": 2938} {"train_loss": -12.27405834197998, "global_step": 493599, "epoch": 2938} {"train_loss": -12.00796890258789, "global_step": 493600, "epoch": 2938} {"train_loss": -12.254104614257812, "global_step": 493601, "epoch": 2938} {"train_loss": -12.311747550964355, "global_step": 493602, "epoch": 2938} {"train_loss": -12.243429183959961, "global_step": 493603, "epoch": 2938} {"train_loss": -11.759927749633789, "global_step": 493604, "epoch": 2938} {"train_loss": -11.228761672973633, "global_step": 493605, "epoch": 2938} {"train_loss": -12.018937110900879, "global_step": 493606, "epoch": 2938} {"train_loss": -11.57845687866211, "global_step": 493607, "epoch": 2938} {"train_loss": -10.966232299804688, "global_step": 493608, "epoch": 2938} {"train_loss": -11.038206100463867, "global_step": 493609, "epoch": 2938} {"train_loss": -10.279077529907227, "global_step": 493610, "epoch": 2938} {"train_loss": -12.262283325195312, "global_step": 493611, "epoch": 2938} {"train_loss": -10.945047378540039, "global_step": 493612, "epoch": 2938} {"train_loss": -10.623542785644531, "global_step": 493613, "epoch": 2938} {"train_loss": -12.054403305053711, "global_step": 493614, "epoch": 2938} {"train_loss": -11.373950958251953, "global_step": 493615, "epoch": 2938} {"train_loss": -10.604340553283691, "global_step": 493616, "epoch": 2938} {"train_loss": -11.852315902709961, "global_step": 493617, "epoch": 2938} {"train_loss": -9.75984001159668, "global_step": 493618, "epoch": 2938} {"train_loss": -8.784765243530273, "global_step": 493619, "epoch": 2938} {"train_loss": -10.084953308105469, "global_step": 493620, "epoch": 2938} {"train_loss": -10.183652877807617, "global_step": 493621, "epoch": 2938} {"train_loss": -10.975610733032227, "global_step": 493622, "epoch": 2938} {"train_loss": -10.392425537109375, "global_step": 493623, "epoch": 2938} {"train_loss": -9.719169616699219, "global_step": 493624, "epoch": 2938} {"train_loss": -10.435700416564941, "global_step": 493625, "epoch": 2938} {"train_loss": -11.165014266967773, "global_step": 493626, "epoch": 2938} {"train_loss": -11.417682647705078, "global_step": 493627, "epoch": 2938} {"train_loss": -11.368864059448242, "global_step": 493628, "epoch": 2938} {"train_loss": -11.160755157470703, "global_step": 493629, "epoch": 2938} {"train_loss": -11.834868431091309, "global_step": 493630, "epoch": 2938} {"train_loss": -10.804112434387207, "global_step": 493631, "epoch": 2938} {"train_loss": -11.813486099243164, "global_step": 493632, "epoch": 2938} {"train_loss": -11.29458999633789, "global_step": 493633, "epoch": 2938} {"train_loss": -11.755990982055664, "global_step": 493634, "epoch": 2938} {"train_loss": -11.940719604492188, "global_step": 493635, "epoch": 2938} {"train_loss": -12.202163696289062, "global_step": 493636, "epoch": 2938} {"train_loss": -12.046504974365234, "global_step": 493637, "epoch": 2938} {"train_loss": -12.338611602783203, "global_step": 493638, "epoch": 2938} {"train_loss": -11.702255249023438, "global_step": 493639, "epoch": 2938} {"train_loss": -12.390382766723633, "global_step": 493640, "epoch": 2938} {"train_loss": -12.224983215332031, "global_step": 493641, "epoch": 2938} {"train_loss": -12.274641036987305, "global_step": 493642, "epoch": 2938} {"train_loss": -12.038504600524902, "global_step": 493643, "epoch": 2938} {"train_loss": -12.229474067687988, "global_step": 493644, "epoch": 2938} {"train_loss": -11.992502212524414, "global_step": 493645, "epoch": 2938} {"train_loss": -12.47153091430664, "global_step": 493646, "epoch": 2938} {"train_loss": -12.130775451660156, "global_step": 493647, "epoch": 2938} {"train_loss": -12.542939186096191, "global_step": 493648, "epoch": 2938} {"train_loss": -11.806478500366211, "global_step": 493649, "epoch": 2938} {"train_loss": -12.490468978881836, "global_step": 493650, "epoch": 2938} {"train_loss": -12.175379753112793, "global_step": 493651, "epoch": 2938} {"train_loss": -12.697550773620605, "global_step": 493652, "epoch": 2938} {"train_loss": -12.312613487243652, "global_step": 493653, "epoch": 2938} {"train_loss": -12.54498291015625, "global_step": 493654, "epoch": 2938} {"train_loss": -12.486082077026367, "global_step": 493655, "epoch": 2938} {"train_loss": -12.581226348876953, "global_step": 493656, "epoch": 2938} {"train_loss": -12.422443389892578, "global_step": 493657, "epoch": 2938} {"train_loss": -12.347532272338867, "global_step": 493658, "epoch": 2938} {"train_loss": -11.996856689453125, "global_step": 493659, "epoch": 2938} {"train_loss": -12.544952392578125, "global_step": 493660, "epoch": 2938} {"train_loss": -12.378917694091797, "global_step": 493661, "epoch": 2938} {"train_loss": -12.41493034362793, "global_step": 493662, "epoch": 2938} {"train_loss": -12.328871726989746, "global_step": 493663, "epoch": 2938} {"train_loss": -12.617364883422852, "global_step": 493664, "epoch": 2938} {"train_loss": -12.41124439239502, "global_step": 493665, "epoch": 2938} {"train_loss": -12.574492454528809, "global_step": 493666, "epoch": 2938} {"train_loss": -12.817180633544922, "global_step": 493667, "epoch": 2938} {"train_loss": -12.698175430297852, "global_step": 493668, "epoch": 2938} {"train_loss": -12.58165168762207, "global_step": 493669, "epoch": 2938} {"train_loss": -12.488544464111328, "global_step": 493670, "epoch": 2938} {"train_loss": -12.556097030639648, "global_step": 493671, "epoch": 2938} {"train_loss": -12.663393020629883, "global_step": 493672, "epoch": 2938} {"train_loss": -12.580350875854492, "global_step": 493673, "epoch": 2938} {"train_loss": -12.594670295715332, "global_step": 493674, "epoch": 2938} {"train_loss": -12.621267318725586, "global_step": 493675, "epoch": 2938} {"train_loss": -12.711562156677246, "global_step": 493676, "epoch": 2938} {"train_loss": -12.54977798461914, "global_step": 493677, "epoch": 2938} {"train_loss": -12.920982360839844, "global_step": 493678, "epoch": 2938} {"train_loss": -12.789058685302734, "global_step": 493679, "epoch": 2938} {"train_loss": -12.832210540771484, "global_step": 493680, "epoch": 2938} {"train_loss": -12.471760749816895, "global_step": 493681, "epoch": 2938} {"train_loss": -12.759227752685547, "global_step": 493682, "epoch": 2938} {"train_loss": -12.671018600463867, "global_step": 493683, "epoch": 2938} {"train_loss": -12.588167190551758, "global_step": 493684, "epoch": 2938} {"train_loss": -12.565938949584961, "global_step": 493685, "epoch": 2938} {"train_loss": -12.64236831665039, "global_step": 493686, "epoch": 2938} {"train_loss": -12.537468910217285, "global_step": 493687, "epoch": 2938} {"train_loss": -12.716021537780762, "global_step": 493688, "epoch": 2938} {"train_loss": -12.632811546325684, "global_step": 493689, "epoch": 2938} {"train_loss": -12.606050491333008, "global_step": 493690, "epoch": 2938} {"train_loss": -12.685358047485352, "global_step": 493691, "epoch": 2938} {"train_loss": -12.156686782836914, "global_step": 493692, "epoch": 2938} {"train_loss": -12.58065128326416, "global_step": 493693, "epoch": 2938} {"train_loss": -12.237991333007812, "global_step": 493694, "epoch": 2938} {"train_loss": -12.572343826293945, "global_step": 493695, "epoch": 2938} {"train_loss": -12.55289077758789, "global_step": 493696, "epoch": 2938} {"train_loss": -12.386110305786133, "global_step": 493697, "epoch": 2938} {"train_loss": -12.800910949707031, "global_step": 493698, "epoch": 2938} {"train_loss": -12.211904525756836, "global_step": 493699, "epoch": 2938} {"train_loss": -12.510568618774414, "global_step": 493700, "epoch": 2938} {"train_loss": -12.481542587280273, "global_step": 493701, "epoch": 2938} {"train_loss": -11.938067436218262, "global_step": 493702, "epoch": 2938} {"train_loss": -12.659547805786133, "global_step": 493703, "epoch": 2938} {"train_loss": -11.862345695495605, "global_step": 493704, "epoch": 2938} {"train_loss": -11.187368392944336, "global_step": 493705, "epoch": 2938} {"train_loss": -12.44608211517334, "global_step": 493706, "epoch": 2938} {"train_loss": -11.370975494384766, "global_step": 493707, "epoch": 2938} {"train_loss": -12.196374893188477, "global_step": 493708, "epoch": 2938} {"train_loss": -11.461325645446777, "global_step": 493709, "epoch": 2938} {"train_loss": -11.993928909301758, "global_step": 493710, "epoch": 2938} {"train_loss": -11.36363410949707, "global_step": 493711, "epoch": 2938} {"train_loss": -11.436568260192871, "global_step": 493712, "epoch": 2938} {"train_loss": -12.34631633758545, "global_step": 493713, "epoch": 2938} {"train_loss": -11.277677536010742, "global_step": 493714, "epoch": 2938} {"train_loss": -12.347426414489746, "global_step": 493715, "epoch": 2938} {"train_loss": -11.494549751281738, "global_step": 493716, "epoch": 2938} {"train_loss": -12.332023620605469, "global_step": 493717, "epoch": 2938} {"train_loss": -12.50966739654541, "global_step": 493718, "epoch": 2938} {"train_loss": -12.592588424682617, "global_step": 493719, "epoch": 2938} {"train_loss": -12.738329887390137, "global_step": 493720, "epoch": 2938} {"train_loss": -12.70256233215332, "global_step": 493721, "epoch": 2938} {"train_loss": -12.414275169372559, "global_step": 493722, "epoch": 2938} {"train_loss": -12.318811416625977, "global_step": 493723, "epoch": 2938} {"train_loss": -12.501482009887695, "global_step": 493724, "epoch": 2938} {"train_loss": -12.120647430419922, "global_step": 493725, "epoch": 2938} {"train_loss": -12.638724327087402, "global_step": 493726, "epoch": 2938} {"train_loss": -12.443584442138672, "global_step": 493727, "epoch": 2938} {"train_loss": -12.157974243164062, "global_step": 493728, "epoch": 2938} {"train_loss": -12.710741996765137, "global_step": 493729, "epoch": 2938} {"train_loss": -12.258739471435547, "global_step": 493730, "epoch": 2938} {"train_loss": -12.640663146972656, "global_step": 493731, "epoch": 2938} {"train_loss": -12.006227493286133, "global_step": 493732, "epoch": 2938} {"train_loss": -12.623251914978027, "global_step": 493733, "epoch": 2938} {"train_loss": -12.205375671386719, "global_step": 493734, "epoch": 2938} {"train_loss": -12.318641662597656, "global_step": 493735, "epoch": 2938} {"train_loss": -12.256612777709961, "global_step": 493736, "epoch": 2938} {"train_loss": -12.582294464111328, "global_step": 493737, "epoch": 2938} {"train_loss": -12.71536636352539, "global_step": 493738, "epoch": 2938} {"train_loss": -12.28887939453125, "global_step": 493739, "epoch": 2938} {"train_loss": -12.73169231414795, "global_step": 493740, "epoch": 2938} {"train_loss": -12.21742057800293, "global_step": 493741, "epoch": 2938} {"train_loss": -12.78250503540039, "global_step": 493742, "epoch": 2938} {"train_loss": -12.575695037841797, "global_step": 493743, "epoch": 2938} {"train_loss": -12.508058547973633, "global_step": 493744, "epoch": 2938} {"train_loss": -12.623104095458984, "global_step": 493745, "epoch": 2938} {"train_loss": -12.307575225830078, "global_step": 493746, "epoch": 2938} {"train_loss": -12.33871841430664, "global_step": 493747, "epoch": 2938} {"train_loss": -12.495989799499512, "global_step": 493748, "epoch": 2938} {"train_loss": -12.415389060974121, "global_step": 493749, "epoch": 2938} {"train_loss": -12.689783096313477, "global_step": 493750, "epoch": 2938} {"train_loss": -12.097697411264692, "global_step": 493751, "epoch": 2938, "val_loss": 321393.78125} {"train_loss": -11.656893730163574, "global_step": 493752, "epoch": 2939} {"train_loss": -12.660942077636719, "global_step": 493753, "epoch": 2939} {"train_loss": -11.965261459350586, "global_step": 493754, "epoch": 2939} {"train_loss": -12.537904739379883, "global_step": 493755, "epoch": 2939} {"train_loss": -12.105016708374023, "global_step": 493756, "epoch": 2939} {"train_loss": -12.440479278564453, "global_step": 493757, "epoch": 2939} {"train_loss": -12.425735473632812, "global_step": 493758, "epoch": 2939} {"train_loss": -12.423128128051758, "global_step": 493759, "epoch": 2939} {"train_loss": -12.402121543884277, "global_step": 493760, "epoch": 2939} {"train_loss": -12.4908447265625, "global_step": 493761, "epoch": 2939} {"train_loss": -12.02064323425293, "global_step": 493762, "epoch": 2939} {"train_loss": -12.060447692871094, "global_step": 493763, "epoch": 2939} {"train_loss": -12.576639175415039, "global_step": 493764, "epoch": 2939} {"train_loss": -12.369827270507812, "global_step": 493765, "epoch": 2939} {"train_loss": -12.288618087768555, "global_step": 493766, "epoch": 2939} {"train_loss": -12.723275184631348, "global_step": 493767, "epoch": 2939} {"train_loss": -12.653547286987305, "global_step": 493768, "epoch": 2939} {"train_loss": -12.47429084777832, "global_step": 493769, "epoch": 2939} {"train_loss": -12.772493362426758, "global_step": 493770, "epoch": 2939} {"train_loss": -12.523792266845703, "global_step": 493771, "epoch": 2939} {"train_loss": -12.833562850952148, "global_step": 493772, "epoch": 2939} {"train_loss": -12.607268333435059, "global_step": 493773, "epoch": 2939} {"train_loss": -12.786184310913086, "global_step": 493774, "epoch": 2939} {"train_loss": -12.543729782104492, "global_step": 493775, "epoch": 2939} {"train_loss": -12.82438850402832, "global_step": 493776, "epoch": 2939} {"train_loss": -12.36296272277832, "global_step": 493777, "epoch": 2939} {"train_loss": -12.870648384094238, "global_step": 493778, "epoch": 2939} {"train_loss": -12.556560516357422, "global_step": 493779, "epoch": 2939} {"train_loss": -12.431001663208008, "global_step": 493780, "epoch": 2939} {"train_loss": -12.004281044006348, "global_step": 493781, "epoch": 2939} {"train_loss": -12.190811157226562, "global_step": 493782, "epoch": 2939} {"train_loss": -12.661834716796875, "global_step": 493783, "epoch": 2939} {"train_loss": -11.943028450012207, "global_step": 493784, "epoch": 2939} {"train_loss": -12.247692108154297, "global_step": 493785, "epoch": 2939} {"train_loss": -12.453088760375977, "global_step": 493786, "epoch": 2939} {"train_loss": -12.625640869140625, "global_step": 493787, "epoch": 2939} {"train_loss": -12.4041748046875, "global_step": 493788, "epoch": 2939} {"train_loss": -12.122079849243164, "global_step": 493789, "epoch": 2939} {"train_loss": -12.091337203979492, "global_step": 493790, "epoch": 2939} {"train_loss": -12.906768798828125, "global_step": 493791, "epoch": 2939} {"train_loss": -11.986461639404297, "global_step": 493792, "epoch": 2939} {"train_loss": -12.778688430786133, "global_step": 493793, "epoch": 2939} {"train_loss": -11.50960636138916, "global_step": 493794, "epoch": 2939} {"train_loss": -11.323454856872559, "global_step": 493795, "epoch": 2939} {"train_loss": -12.205460548400879, "global_step": 493796, "epoch": 2939} {"train_loss": -11.67611026763916, "global_step": 493797, "epoch": 2939} {"train_loss": -11.388769149780273, "global_step": 493798, "epoch": 2939} {"train_loss": -12.321557998657227, "global_step": 493799, "epoch": 2939} {"train_loss": -11.685256958007812, "global_step": 493800, "epoch": 2939} {"train_loss": -10.883733749389648, "global_step": 493801, "epoch": 2939} {"train_loss": -12.815768241882324, "global_step": 493802, "epoch": 2939} {"train_loss": -10.91989803314209, "global_step": 493803, "epoch": 2939} {"train_loss": -12.332267761230469, "global_step": 493804, "epoch": 2939} {"train_loss": -11.73708438873291, "global_step": 493805, "epoch": 2939} {"train_loss": -11.536772727966309, "global_step": 493806, "epoch": 2939} {"train_loss": -12.016769409179688, "global_step": 493807, "epoch": 2939} {"train_loss": -12.271886825561523, "global_step": 493808, "epoch": 2939} {"train_loss": -11.018722534179688, "global_step": 493809, "epoch": 2939} {"train_loss": -12.14431381225586, "global_step": 493810, "epoch": 2939} {"train_loss": -12.071338653564453, "global_step": 493811, "epoch": 2939} {"train_loss": -11.658731460571289, "global_step": 493812, "epoch": 2939} {"train_loss": -11.973226547241211, "global_step": 493813, "epoch": 2939} {"train_loss": -11.143972396850586, "global_step": 493814, "epoch": 2939} {"train_loss": -11.969939231872559, "global_step": 493815, "epoch": 2939} {"train_loss": -11.905767440795898, "global_step": 493816, "epoch": 2939} {"train_loss": -10.959808349609375, "global_step": 493817, "epoch": 2939} {"train_loss": -12.212833404541016, "global_step": 493818, "epoch": 2939} {"train_loss": -10.917400360107422, "global_step": 493819, "epoch": 2939} {"train_loss": -11.609392166137695, "global_step": 493820, "epoch": 2939} {"train_loss": -12.295004844665527, "global_step": 493821, "epoch": 2939} {"train_loss": -11.338556289672852, "global_step": 493822, "epoch": 2939} {"train_loss": -12.61063003540039, "global_step": 493823, "epoch": 2939} {"train_loss": -11.577600479125977, "global_step": 493824, "epoch": 2939} {"train_loss": -12.424426078796387, "global_step": 493825, "epoch": 2939} {"train_loss": -11.66667366027832, "global_step": 493826, "epoch": 2939} {"train_loss": -12.351188659667969, "global_step": 493827, "epoch": 2939} {"train_loss": -12.249923706054688, "global_step": 493828, "epoch": 2939} {"train_loss": -11.447305679321289, "global_step": 493829, "epoch": 2939} {"train_loss": -12.149492263793945, "global_step": 493830, "epoch": 2939} {"train_loss": -12.222697257995605, "global_step": 493831, "epoch": 2939} {"train_loss": -11.755594253540039, "global_step": 493832, "epoch": 2939} {"train_loss": -12.439827919006348, "global_step": 493833, "epoch": 2939} {"train_loss": -12.301044464111328, "global_step": 493834, "epoch": 2939} {"train_loss": -12.370905876159668, "global_step": 493835, "epoch": 2939} {"train_loss": -12.079154968261719, "global_step": 493836, "epoch": 2939} {"train_loss": -12.29362678527832, "global_step": 493837, "epoch": 2939} {"train_loss": -12.392433166503906, "global_step": 493838, "epoch": 2939} {"train_loss": -12.024940490722656, "global_step": 493839, "epoch": 2939} {"train_loss": -11.999770164489746, "global_step": 493840, "epoch": 2939} {"train_loss": -12.199344635009766, "global_step": 493841, "epoch": 2939} {"train_loss": -12.173707008361816, "global_step": 493842, "epoch": 2939} {"train_loss": -11.909920692443848, "global_step": 493843, "epoch": 2939} {"train_loss": -12.070037841796875, "global_step": 493844, "epoch": 2939} {"train_loss": -12.259798049926758, "global_step": 493845, "epoch": 2939} {"train_loss": -11.891780853271484, "global_step": 493846, "epoch": 2939} {"train_loss": -12.15262222290039, "global_step": 493847, "epoch": 2939} {"train_loss": -11.920943260192871, "global_step": 493848, "epoch": 2939} {"train_loss": -11.996034622192383, "global_step": 493849, "epoch": 2939} {"train_loss": -12.36465072631836, "global_step": 493850, "epoch": 2939} {"train_loss": -11.962366104125977, "global_step": 493851, "epoch": 2939} {"train_loss": -12.51763916015625, "global_step": 493852, "epoch": 2939} {"train_loss": -12.117172241210938, "global_step": 493853, "epoch": 2939} {"train_loss": -12.532110214233398, "global_step": 493854, "epoch": 2939} {"train_loss": -12.23005485534668, "global_step": 493855, "epoch": 2939} {"train_loss": -12.142717361450195, "global_step": 493856, "epoch": 2939} {"train_loss": -12.352802276611328, "global_step": 493857, "epoch": 2939} {"train_loss": -12.34292984008789, "global_step": 493858, "epoch": 2939} {"train_loss": -12.345833778381348, "global_step": 493859, "epoch": 2939} {"train_loss": -12.606453895568848, "global_step": 493860, "epoch": 2939} {"train_loss": -12.4158935546875, "global_step": 493861, "epoch": 2939} {"train_loss": -12.295547485351562, "global_step": 493862, "epoch": 2939} {"train_loss": -12.475915908813477, "global_step": 493863, "epoch": 2939} {"train_loss": -12.394021987915039, "global_step": 493864, "epoch": 2939} {"train_loss": -12.671455383300781, "global_step": 493865, "epoch": 2939} {"train_loss": -12.41429328918457, "global_step": 493866, "epoch": 2939} {"train_loss": -12.659749031066895, "global_step": 493867, "epoch": 2939} {"train_loss": -12.610109329223633, "global_step": 493868, "epoch": 2939} {"train_loss": -12.640970230102539, "global_step": 493869, "epoch": 2939} {"train_loss": -12.818445205688477, "global_step": 493870, "epoch": 2939} {"train_loss": -12.715311050415039, "global_step": 493871, "epoch": 2939} {"train_loss": -12.519636154174805, "global_step": 493872, "epoch": 2939} {"train_loss": -12.729324340820312, "global_step": 493873, "epoch": 2939} {"train_loss": -12.67463493347168, "global_step": 493874, "epoch": 2939} {"train_loss": -12.794916152954102, "global_step": 493875, "epoch": 2939} {"train_loss": -12.886054992675781, "global_step": 493876, "epoch": 2939} {"train_loss": -12.999505043029785, "global_step": 493877, "epoch": 2939} {"train_loss": -12.98546314239502, "global_step": 493878, "epoch": 2939} {"train_loss": -12.980072021484375, "global_step": 493879, "epoch": 2939} {"train_loss": -12.806937217712402, "global_step": 493880, "epoch": 2939} {"train_loss": -12.764042854309082, "global_step": 493881, "epoch": 2939} {"train_loss": -12.881635665893555, "global_step": 493882, "epoch": 2939} {"train_loss": -12.77669620513916, "global_step": 493883, "epoch": 2939} {"train_loss": -12.77140998840332, "global_step": 493884, "epoch": 2939} {"train_loss": -12.935322761535645, "global_step": 493885, "epoch": 2939} {"train_loss": -12.859514236450195, "global_step": 493886, "epoch": 2939} {"train_loss": -12.828791618347168, "global_step": 493887, "epoch": 2939} {"train_loss": -12.995282173156738, "global_step": 493888, "epoch": 2939} {"train_loss": -12.930004119873047, "global_step": 493889, "epoch": 2939} {"train_loss": -12.506338119506836, "global_step": 493890, "epoch": 2939} {"train_loss": -12.720446586608887, "global_step": 493891, "epoch": 2939} {"train_loss": -12.960687637329102, "global_step": 493892, "epoch": 2939} {"train_loss": -12.759794235229492, "global_step": 493893, "epoch": 2939} {"train_loss": -13.09500503540039, "global_step": 493894, "epoch": 2939} {"train_loss": -12.95841121673584, "global_step": 493895, "epoch": 2939} {"train_loss": -12.925251007080078, "global_step": 493896, "epoch": 2939} {"train_loss": -12.914785385131836, "global_step": 493897, "epoch": 2939} {"train_loss": -12.96298885345459, "global_step": 493898, "epoch": 2939} {"train_loss": -13.134963989257812, "global_step": 493899, "epoch": 2939} {"train_loss": -12.868928909301758, "global_step": 493900, "epoch": 2939} {"train_loss": -13.096563339233398, "global_step": 493901, "epoch": 2939} {"train_loss": -13.055767059326172, "global_step": 493902, "epoch": 2939} {"train_loss": -12.901067733764648, "global_step": 493903, "epoch": 2939} {"train_loss": -12.723932266235352, "global_step": 493904, "epoch": 2939} {"train_loss": -12.98708724975586, "global_step": 493905, "epoch": 2939} {"train_loss": -12.875274658203125, "global_step": 493906, "epoch": 2939} {"train_loss": -12.516890525817871, "global_step": 493907, "epoch": 2939} {"train_loss": -13.0211181640625, "global_step": 493908, "epoch": 2939} {"train_loss": -12.864747047424316, "global_step": 493909, "epoch": 2939} {"train_loss": -12.497478485107422, "global_step": 493910, "epoch": 2939} {"train_loss": -12.56400203704834, "global_step": 493911, "epoch": 2939} {"train_loss": -12.919639587402344, "global_step": 493912, "epoch": 2939} {"train_loss": -12.942546844482422, "global_step": 493913, "epoch": 2939} {"train_loss": -12.460820198059082, "global_step": 493914, "epoch": 2939} {"train_loss": -12.331220626831055, "global_step": 493915, "epoch": 2939} {"train_loss": -13.210058212280273, "global_step": 493916, "epoch": 2939} {"train_loss": -12.831663131713867, "global_step": 493917, "epoch": 2939} {"train_loss": -12.292994499206543, "global_step": 493918, "epoch": 2939} {"train_loss": -12.366887620517186, "global_step": 493919, "epoch": 2939, "val_loss": 321309.71875} {"train_loss": -12.686408996582031, "global_step": 493920, "epoch": 2940} {"train_loss": -11.387295722961426, "global_step": 493921, "epoch": 2940} {"train_loss": -11.971280097961426, "global_step": 493922, "epoch": 2940} {"train_loss": -12.497969627380371, "global_step": 493923, "epoch": 2940} {"train_loss": -11.389086723327637, "global_step": 493924, "epoch": 2940} {"train_loss": -10.209470748901367, "global_step": 493925, "epoch": 2940} {"train_loss": -10.659985542297363, "global_step": 493926, "epoch": 2940} {"train_loss": -10.726653099060059, "global_step": 493927, "epoch": 2940} {"train_loss": -9.716690063476562, "global_step": 493928, "epoch": 2940} {"train_loss": -9.5110502243042, "global_step": 493929, "epoch": 2940} {"train_loss": -9.165027618408203, "global_step": 493930, "epoch": 2940} {"train_loss": -8.396549224853516, "global_step": 493931, "epoch": 2940} {"train_loss": -10.584210395812988, "global_step": 493932, "epoch": 2940} {"train_loss": -10.436976432800293, "global_step": 493933, "epoch": 2940} {"train_loss": -9.937248229980469, "global_step": 493934, "epoch": 2940} {"train_loss": -10.818183898925781, "global_step": 493935, "epoch": 2940} {"train_loss": -11.14677906036377, "global_step": 493936, "epoch": 2940} {"train_loss": -10.708244323730469, "global_step": 493937, "epoch": 2940} {"train_loss": -10.748485565185547, "global_step": 493938, "epoch": 2940} {"train_loss": -11.44660758972168, "global_step": 493939, "epoch": 2940} {"train_loss": -10.266014099121094, "global_step": 493940, "epoch": 2940} {"train_loss": -11.136713027954102, "global_step": 493941, "epoch": 2940} {"train_loss": -10.020559310913086, "global_step": 493942, "epoch": 2940} {"train_loss": -11.412763595581055, "global_step": 493943, "epoch": 2940} {"train_loss": -11.889192581176758, "global_step": 493944, "epoch": 2940} {"train_loss": -10.334038734436035, "global_step": 493945, "epoch": 2940} {"train_loss": -11.894294738769531, "global_step": 493946, "epoch": 2940} {"train_loss": -10.163558959960938, "global_step": 493947, "epoch": 2940} {"train_loss": -11.218467712402344, "global_step": 493948, "epoch": 2940} {"train_loss": -10.886990547180176, "global_step": 493949, "epoch": 2940} {"train_loss": -10.100361824035645, "global_step": 493950, "epoch": 2940} {"train_loss": -10.983131408691406, "global_step": 493951, "epoch": 2940} {"train_loss": -11.296138763427734, "global_step": 493952, "epoch": 2940} {"train_loss": -11.437929153442383, "global_step": 493953, "epoch": 2940} {"train_loss": -11.697868347167969, "global_step": 493954, "epoch": 2940} {"train_loss": -11.057170867919922, "global_step": 493955, "epoch": 2940} {"train_loss": -11.985393524169922, "global_step": 493956, "epoch": 2940} {"train_loss": -12.15836238861084, "global_step": 493957, "epoch": 2940} {"train_loss": -11.849197387695312, "global_step": 493958, "epoch": 2940} {"train_loss": -11.898171424865723, "global_step": 493959, "epoch": 2940} {"train_loss": -11.416115760803223, "global_step": 493960, "epoch": 2940} {"train_loss": -11.896369934082031, "global_step": 493961, "epoch": 2940} {"train_loss": -12.430376052856445, "global_step": 493962, "epoch": 2940} {"train_loss": -12.012727737426758, "global_step": 493963, "epoch": 2940} {"train_loss": -12.00282096862793, "global_step": 493964, "epoch": 2940} {"train_loss": -11.824264526367188, "global_step": 493965, "epoch": 2940} {"train_loss": -11.84757137298584, "global_step": 493966, "epoch": 2940} {"train_loss": -12.040616989135742, "global_step": 493967, "epoch": 2940} {"train_loss": -11.12838363647461, "global_step": 493968, "epoch": 2940} {"train_loss": -12.045743942260742, "global_step": 493969, "epoch": 2940} {"train_loss": -12.170493125915527, "global_step": 493970, "epoch": 2940} {"train_loss": -11.559650421142578, "global_step": 493971, "epoch": 2940} {"train_loss": -12.229730606079102, "global_step": 493972, "epoch": 2940} {"train_loss": -12.10146427154541, "global_step": 493973, "epoch": 2940} {"train_loss": -12.318729400634766, "global_step": 493974, "epoch": 2940} {"train_loss": -12.30191707611084, "global_step": 493975, "epoch": 2940} {"train_loss": -11.58677864074707, "global_step": 493976, "epoch": 2940} {"train_loss": -11.815128326416016, "global_step": 493977, "epoch": 2940} {"train_loss": -12.295802116394043, "global_step": 493978, "epoch": 2940} {"train_loss": -12.111734390258789, "global_step": 493979, "epoch": 2940} {"train_loss": -11.9031400680542, "global_step": 493980, "epoch": 2940} {"train_loss": -11.436936378479004, "global_step": 493981, "epoch": 2940} {"train_loss": -12.289015769958496, "global_step": 493982, "epoch": 2940} {"train_loss": -12.214022636413574, "global_step": 493983, "epoch": 2940} {"train_loss": -12.464127540588379, "global_step": 493984, "epoch": 2940} {"train_loss": -12.437178611755371, "global_step": 493985, "epoch": 2940} {"train_loss": -12.303894996643066, "global_step": 493986, "epoch": 2940} {"train_loss": -12.486392974853516, "global_step": 493987, "epoch": 2940} {"train_loss": -12.46922492980957, "global_step": 493988, "epoch": 2940} {"train_loss": -12.481664657592773, "global_step": 493989, "epoch": 2940} {"train_loss": -12.557746887207031, "global_step": 493990, "epoch": 2940} {"train_loss": -12.28183364868164, "global_step": 493991, "epoch": 2940} {"train_loss": -12.207952499389648, "global_step": 493992, "epoch": 2940} {"train_loss": -12.175966262817383, "global_step": 493993, "epoch": 2940} {"train_loss": -12.64468765258789, "global_step": 493994, "epoch": 2940} {"train_loss": -12.353771209716797, "global_step": 493995, "epoch": 2940} {"train_loss": -12.541400909423828, "global_step": 493996, "epoch": 2940} {"train_loss": -12.536152839660645, "global_step": 493997, "epoch": 2940} {"train_loss": -12.747459411621094, "global_step": 493998, "epoch": 2940} {"train_loss": -12.78805160522461, "global_step": 493999, "epoch": 2940} {"train_loss": -12.62492561340332, "global_step": 494000, "epoch": 2940} {"train_loss": -12.542976379394531, "global_step": 494001, "epoch": 2940} {"train_loss": -12.727212905883789, "global_step": 494002, "epoch": 2940} {"train_loss": -12.72067642211914, "global_step": 494003, "epoch": 2940} {"train_loss": -12.86043930053711, "global_step": 494004, "epoch": 2940} {"train_loss": -12.206275939941406, "global_step": 494005, "epoch": 2940} {"train_loss": -12.743147850036621, "global_step": 494006, "epoch": 2940} {"train_loss": -12.636908531188965, "global_step": 494007, "epoch": 2940} {"train_loss": -12.428611755371094, "global_step": 494008, "epoch": 2940} {"train_loss": -12.691031455993652, "global_step": 494009, "epoch": 2940} {"train_loss": -12.566761016845703, "global_step": 494010, "epoch": 2940} {"train_loss": -12.822543144226074, "global_step": 494011, "epoch": 2940} {"train_loss": -12.519102096557617, "global_step": 494012, "epoch": 2940} {"train_loss": -12.921152114868164, "global_step": 494013, "epoch": 2940} {"train_loss": -12.78039264678955, "global_step": 494014, "epoch": 2940} {"train_loss": -12.518913269042969, "global_step": 494015, "epoch": 2940} {"train_loss": -12.402254104614258, "global_step": 494016, "epoch": 2940} {"train_loss": -12.61900806427002, "global_step": 494017, "epoch": 2940} {"train_loss": -12.808908462524414, "global_step": 494018, "epoch": 2940} {"train_loss": -12.913772583007812, "global_step": 494019, "epoch": 2940} {"train_loss": -12.853672981262207, "global_step": 494020, "epoch": 2940} {"train_loss": -12.888712882995605, "global_step": 494021, "epoch": 2940} {"train_loss": -13.028034210205078, "global_step": 494022, "epoch": 2940} {"train_loss": -12.890026092529297, "global_step": 494023, "epoch": 2940} {"train_loss": -12.93679141998291, "global_step": 494024, "epoch": 2940} {"train_loss": -13.023664474487305, "global_step": 494025, "epoch": 2940} {"train_loss": -12.898908615112305, "global_step": 494026, "epoch": 2940} {"train_loss": -12.91978645324707, "global_step": 494027, "epoch": 2940} {"train_loss": -12.899740219116211, "global_step": 494028, "epoch": 2940} {"train_loss": -12.965901374816895, "global_step": 494029, "epoch": 2940} {"train_loss": -12.970626831054688, "global_step": 494030, "epoch": 2940} {"train_loss": -12.917328834533691, "global_step": 494031, "epoch": 2940} {"train_loss": -12.97461223602295, "global_step": 494032, "epoch": 2940} {"train_loss": -12.782063484191895, "global_step": 494033, "epoch": 2940} {"train_loss": -13.084522247314453, "global_step": 494034, "epoch": 2940} {"train_loss": -12.85628604888916, "global_step": 494035, "epoch": 2940} {"train_loss": -12.78544807434082, "global_step": 494036, "epoch": 2940} {"train_loss": -12.76842975616455, "global_step": 494037, "epoch": 2940} {"train_loss": -12.534846305847168, "global_step": 494038, "epoch": 2940} {"train_loss": -12.489921569824219, "global_step": 494039, "epoch": 2940} {"train_loss": -12.825728416442871, "global_step": 494040, "epoch": 2940} {"train_loss": -13.099679946899414, "global_step": 494041, "epoch": 2940} {"train_loss": -12.997819900512695, "global_step": 494042, "epoch": 2940} {"train_loss": -12.989710807800293, "global_step": 494043, "epoch": 2940} {"train_loss": -12.756345748901367, "global_step": 494044, "epoch": 2940} {"train_loss": -12.966673851013184, "global_step": 494045, "epoch": 2940} {"train_loss": -12.937768936157227, "global_step": 494046, "epoch": 2940} {"train_loss": -12.86267375946045, "global_step": 494047, "epoch": 2940} {"train_loss": -12.921804428100586, "global_step": 494048, "epoch": 2940} {"train_loss": -12.992269515991211, "global_step": 494049, "epoch": 2940} {"train_loss": -12.946052551269531, "global_step": 494050, "epoch": 2940} {"train_loss": -13.098672866821289, "global_step": 494051, "epoch": 2940} {"train_loss": -12.64896011352539, "global_step": 494052, "epoch": 2940} {"train_loss": -12.936847686767578, "global_step": 494053, "epoch": 2940} {"train_loss": -12.606334686279297, "global_step": 494054, "epoch": 2940} {"train_loss": -13.002764701843262, "global_step": 494055, "epoch": 2940} {"train_loss": -12.671503067016602, "global_step": 494056, "epoch": 2940} {"train_loss": -12.988829612731934, "global_step": 494057, "epoch": 2940} {"train_loss": -12.742574691772461, "global_step": 494058, "epoch": 2940} {"train_loss": -12.851299285888672, "global_step": 494059, "epoch": 2940} {"train_loss": -13.033368110656738, "global_step": 494060, "epoch": 2940} {"train_loss": -12.532052993774414, "global_step": 494061, "epoch": 2940} {"train_loss": -11.13723373413086, "global_step": 494062, "epoch": 2940} {"train_loss": -12.558197021484375, "global_step": 494063, "epoch": 2940} {"train_loss": -11.61128044128418, "global_step": 494064, "epoch": 2940} {"train_loss": -9.553918838500977, "global_step": 494065, "epoch": 2940} {"train_loss": -11.5625638961792, "global_step": 494066, "epoch": 2940} {"train_loss": -7.996230602264404, "global_step": 494067, "epoch": 2940} {"train_loss": -9.555585861206055, "global_step": 494068, "epoch": 2940} {"train_loss": -9.259123802185059, "global_step": 494069, "epoch": 2940} {"train_loss": -9.859378814697266, "global_step": 494070, "epoch": 2940} {"train_loss": -9.495560646057129, "global_step": 494071, "epoch": 2940} {"train_loss": -9.711977005004883, "global_step": 494072, "epoch": 2940} {"train_loss": -9.590289115905762, "global_step": 494073, "epoch": 2940} {"train_loss": -9.506689071655273, "global_step": 494074, "epoch": 2940} {"train_loss": -9.640519142150879, "global_step": 494075, "epoch": 2940} {"train_loss": -9.820813179016113, "global_step": 494076, "epoch": 2940} {"train_loss": -10.38833236694336, "global_step": 494077, "epoch": 2940} {"train_loss": -10.638053894042969, "global_step": 494078, "epoch": 2940} {"train_loss": -11.681490898132324, "global_step": 494079, "epoch": 2940} {"train_loss": -11.724266052246094, "global_step": 494080, "epoch": 2940} {"train_loss": -11.3875093460083, "global_step": 494081, "epoch": 2940} {"train_loss": -11.99107837677002, "global_step": 494082, "epoch": 2940} {"train_loss": -11.314658164978027, "global_step": 494083, "epoch": 2940} {"train_loss": -11.096580505371094, "global_step": 494084, "epoch": 2940} {"train_loss": -11.067283630371094, "global_step": 494085, "epoch": 2940} {"train_loss": -11.702255249023438, "global_step": 494086, "epoch": 2940} {"train_loss": -11.867975646541232, "global_step": 494087, "epoch": 2940, "val_loss": 313740.96875, "train_action_mse_error": 1.8220672607421875} {"train_loss": -11.96917724609375, "global_step": 494088, "epoch": 2941} {"train_loss": -11.032241821289062, "global_step": 494089, "epoch": 2941} {"train_loss": -12.328646659851074, "global_step": 494090, "epoch": 2941} {"train_loss": -10.842957496643066, "global_step": 494091, "epoch": 2941} {"train_loss": -12.027929306030273, "global_step": 494092, "epoch": 2941} {"train_loss": -11.04830551147461, "global_step": 494093, "epoch": 2941} {"train_loss": -11.615102767944336, "global_step": 494094, "epoch": 2941} {"train_loss": -11.741336822509766, "global_step": 494095, "epoch": 2941} {"train_loss": -11.858909606933594, "global_step": 494096, "epoch": 2941} {"train_loss": -11.321281433105469, "global_step": 494097, "epoch": 2941} {"train_loss": -10.836173057556152, "global_step": 494098, "epoch": 2941} {"train_loss": -11.284187316894531, "global_step": 494099, "epoch": 2941} {"train_loss": -11.248621940612793, "global_step": 494100, "epoch": 2941} {"train_loss": -10.312090873718262, "global_step": 494101, "epoch": 2941} {"train_loss": -11.781631469726562, "global_step": 494102, "epoch": 2941} {"train_loss": -10.463315963745117, "global_step": 494103, "epoch": 2941} {"train_loss": -10.796072006225586, "global_step": 494104, "epoch": 2941} {"train_loss": -11.165288925170898, "global_step": 494105, "epoch": 2941} {"train_loss": -11.59933090209961, "global_step": 494106, "epoch": 2941} {"train_loss": -10.60382080078125, "global_step": 494107, "epoch": 2941} {"train_loss": -11.806705474853516, "global_step": 494108, "epoch": 2941} {"train_loss": -11.416427612304688, "global_step": 494109, "epoch": 2941} {"train_loss": -11.539109230041504, "global_step": 494110, "epoch": 2941} {"train_loss": -11.738130569458008, "global_step": 494111, "epoch": 2941} {"train_loss": -12.003316879272461, "global_step": 494112, "epoch": 2941} {"train_loss": -11.96963119506836, "global_step": 494113, "epoch": 2941} {"train_loss": -11.868202209472656, "global_step": 494114, "epoch": 2941} {"train_loss": -12.099291801452637, "global_step": 494115, "epoch": 2941} {"train_loss": -12.015185356140137, "global_step": 494116, "epoch": 2941} {"train_loss": -12.23167610168457, "global_step": 494117, "epoch": 2941} {"train_loss": -12.231599807739258, "global_step": 494118, "epoch": 2941} {"train_loss": -12.334856986999512, "global_step": 494119, "epoch": 2941} {"train_loss": -12.501673698425293, "global_step": 494120, "epoch": 2941} {"train_loss": -12.37603759765625, "global_step": 494121, "epoch": 2941} {"train_loss": -12.49544906616211, "global_step": 494122, "epoch": 2941} {"train_loss": -12.362747192382812, "global_step": 494123, "epoch": 2941} {"train_loss": -12.570108413696289, "global_step": 494124, "epoch": 2941} {"train_loss": -12.309467315673828, "global_step": 494125, "epoch": 2941} {"train_loss": -12.683476448059082, "global_step": 494126, "epoch": 2941} {"train_loss": -12.558530807495117, "global_step": 494127, "epoch": 2941} {"train_loss": -12.402742385864258, "global_step": 494128, "epoch": 2941} {"train_loss": -12.827465057373047, "global_step": 494129, "epoch": 2941} {"train_loss": -12.487348556518555, "global_step": 494130, "epoch": 2941} {"train_loss": -12.713123321533203, "global_step": 494131, "epoch": 2941} {"train_loss": -12.680242538452148, "global_step": 494132, "epoch": 2941} {"train_loss": -12.580280303955078, "global_step": 494133, "epoch": 2941} {"train_loss": -12.796730995178223, "global_step": 494134, "epoch": 2941} {"train_loss": -12.593873977661133, "global_step": 494135, "epoch": 2941} {"train_loss": -12.672499656677246, "global_step": 494136, "epoch": 2941} {"train_loss": -12.708267211914062, "global_step": 494137, "epoch": 2941} {"train_loss": -12.806143760681152, "global_step": 494138, "epoch": 2941} {"train_loss": -12.716053009033203, "global_step": 494139, "epoch": 2941} {"train_loss": -12.759145736694336, "global_step": 494140, "epoch": 2941} {"train_loss": -12.64217472076416, "global_step": 494141, "epoch": 2941} {"train_loss": -12.701162338256836, "global_step": 494142, "epoch": 2941} {"train_loss": -12.994575500488281, "global_step": 494143, "epoch": 2941} {"train_loss": -12.805355072021484, "global_step": 494144, "epoch": 2941} {"train_loss": -12.858259201049805, "global_step": 494145, "epoch": 2941} {"train_loss": -12.838889122009277, "global_step": 494146, "epoch": 2941} {"train_loss": -12.919358253479004, "global_step": 494147, "epoch": 2941} {"train_loss": -12.933515548706055, "global_step": 494148, "epoch": 2941} {"train_loss": -12.801773071289062, "global_step": 494149, "epoch": 2941} {"train_loss": -12.888842582702637, "global_step": 494150, "epoch": 2941} {"train_loss": -12.810654640197754, "global_step": 494151, "epoch": 2941} {"train_loss": -12.990818977355957, "global_step": 494152, "epoch": 2941} {"train_loss": -12.798473358154297, "global_step": 494153, "epoch": 2941} {"train_loss": -12.858599662780762, "global_step": 494154, "epoch": 2941} {"train_loss": -12.78512954711914, "global_step": 494155, "epoch": 2941} {"train_loss": -12.860820770263672, "global_step": 494156, "epoch": 2941} {"train_loss": -12.864694595336914, "global_step": 494157, "epoch": 2941} {"train_loss": -12.783912658691406, "global_step": 494158, "epoch": 2941} {"train_loss": -12.62370777130127, "global_step": 494159, "epoch": 2941} {"train_loss": -12.814335823059082, "global_step": 494160, "epoch": 2941} {"train_loss": -12.774428367614746, "global_step": 494161, "epoch": 2941} {"train_loss": -13.076351165771484, "global_step": 494162, "epoch": 2941} {"train_loss": -12.430500030517578, "global_step": 494163, "epoch": 2941} {"train_loss": -12.501935005187988, "global_step": 494164, "epoch": 2941} {"train_loss": -12.89865493774414, "global_step": 494165, "epoch": 2941} {"train_loss": -12.608192443847656, "global_step": 494166, "epoch": 2941} {"train_loss": -12.552268981933594, "global_step": 494167, "epoch": 2941} {"train_loss": -12.902924537658691, "global_step": 494168, "epoch": 2941} {"train_loss": -12.615928649902344, "global_step": 494169, "epoch": 2941} {"train_loss": -12.90218448638916, "global_step": 494170, "epoch": 2941} {"train_loss": -12.736990928649902, "global_step": 494171, "epoch": 2941} {"train_loss": -12.824283599853516, "global_step": 494172, "epoch": 2941} {"train_loss": -12.830360412597656, "global_step": 494173, "epoch": 2941} {"train_loss": -12.459321975708008, "global_step": 494174, "epoch": 2941} {"train_loss": -12.836310386657715, "global_step": 494175, "epoch": 2941} {"train_loss": -12.87256145477295, "global_step": 494176, "epoch": 2941} {"train_loss": -12.996393203735352, "global_step": 494177, "epoch": 2941} {"train_loss": -12.955845832824707, "global_step": 494178, "epoch": 2941} {"train_loss": -13.06396198272705, "global_step": 494179, "epoch": 2941} {"train_loss": -13.195107460021973, "global_step": 494180, "epoch": 2941} {"train_loss": -12.842475891113281, "global_step": 494181, "epoch": 2941} {"train_loss": -12.966206550598145, "global_step": 494182, "epoch": 2941} {"train_loss": -12.958331108093262, "global_step": 494183, "epoch": 2941} {"train_loss": -13.052850723266602, "global_step": 494184, "epoch": 2941} {"train_loss": -12.784643173217773, "global_step": 494185, "epoch": 2941} {"train_loss": -12.880233764648438, "global_step": 494186, "epoch": 2941} {"train_loss": -13.18446159362793, "global_step": 494187, "epoch": 2941} {"train_loss": -13.235994338989258, "global_step": 494188, "epoch": 2941} {"train_loss": -12.844616889953613, "global_step": 494189, "epoch": 2941} {"train_loss": -12.802806854248047, "global_step": 494190, "epoch": 2941} {"train_loss": -12.96630859375, "global_step": 494191, "epoch": 2941} {"train_loss": -12.910440444946289, "global_step": 494192, "epoch": 2941} {"train_loss": -13.15414047241211, "global_step": 494193, "epoch": 2941} {"train_loss": -12.915767669677734, "global_step": 494194, "epoch": 2941} {"train_loss": -12.873603820800781, "global_step": 494195, "epoch": 2941} {"train_loss": -12.841955184936523, "global_step": 494196, "epoch": 2941} {"train_loss": -13.082855224609375, "global_step": 494197, "epoch": 2941} {"train_loss": -12.992183685302734, "global_step": 494198, "epoch": 2941} {"train_loss": -12.539249420166016, "global_step": 494199, "epoch": 2941} {"train_loss": -12.568310737609863, "global_step": 494200, "epoch": 2941} {"train_loss": -12.547183990478516, "global_step": 494201, "epoch": 2941} {"train_loss": -12.832504272460938, "global_step": 494202, "epoch": 2941} {"train_loss": -12.897666931152344, "global_step": 494203, "epoch": 2941} {"train_loss": -12.713525772094727, "global_step": 494204, "epoch": 2941} {"train_loss": -12.338651657104492, "global_step": 494205, "epoch": 2941} {"train_loss": -12.654790878295898, "global_step": 494206, "epoch": 2941} {"train_loss": -12.768362045288086, "global_step": 494207, "epoch": 2941} {"train_loss": -12.7318754196167, "global_step": 494208, "epoch": 2941} {"train_loss": -12.664095878601074, "global_step": 494209, "epoch": 2941} {"train_loss": -12.323848724365234, "global_step": 494210, "epoch": 2941} {"train_loss": -12.453692436218262, "global_step": 494211, "epoch": 2941} {"train_loss": -12.285406112670898, "global_step": 494212, "epoch": 2941} {"train_loss": -12.100090980529785, "global_step": 494213, "epoch": 2941} {"train_loss": -12.359272003173828, "global_step": 494214, "epoch": 2941} {"train_loss": -11.753926277160645, "global_step": 494215, "epoch": 2941} {"train_loss": -12.229278564453125, "global_step": 494216, "epoch": 2941} {"train_loss": -12.2785062789917, "global_step": 494217, "epoch": 2941} {"train_loss": -12.171465873718262, "global_step": 494218, "epoch": 2941} {"train_loss": -12.43667984008789, "global_step": 494219, "epoch": 2941} {"train_loss": -12.287846565246582, "global_step": 494220, "epoch": 2941} {"train_loss": -12.699966430664062, "global_step": 494221, "epoch": 2941} {"train_loss": -11.965333938598633, "global_step": 494222, "epoch": 2941} {"train_loss": -11.380738258361816, "global_step": 494223, "epoch": 2941} {"train_loss": -12.85505485534668, "global_step": 494224, "epoch": 2941} {"train_loss": -11.705587387084961, "global_step": 494225, "epoch": 2941} {"train_loss": -11.838434219360352, "global_step": 494226, "epoch": 2941} {"train_loss": -12.303742408752441, "global_step": 494227, "epoch": 2941} {"train_loss": -12.335716247558594, "global_step": 494228, "epoch": 2941} {"train_loss": -12.026185035705566, "global_step": 494229, "epoch": 2941} {"train_loss": -12.416397094726562, "global_step": 494230, "epoch": 2941} {"train_loss": -12.374841690063477, "global_step": 494231, "epoch": 2941} {"train_loss": -11.835647583007812, "global_step": 494232, "epoch": 2941} {"train_loss": -11.997583389282227, "global_step": 494233, "epoch": 2941} {"train_loss": -12.50344467163086, "global_step": 494234, "epoch": 2941} {"train_loss": -10.733748435974121, "global_step": 494235, "epoch": 2941} {"train_loss": -12.130620956420898, "global_step": 494236, "epoch": 2941} {"train_loss": -11.455883026123047, "global_step": 494237, "epoch": 2941} {"train_loss": -12.484344482421875, "global_step": 494238, "epoch": 2941} {"train_loss": -10.757540702819824, "global_step": 494239, "epoch": 2941} {"train_loss": -11.416251182556152, "global_step": 494240, "epoch": 2941} {"train_loss": -11.370308876037598, "global_step": 494241, "epoch": 2941} {"train_loss": -11.859086036682129, "global_step": 494242, "epoch": 2941} {"train_loss": -11.266582489013672, "global_step": 494243, "epoch": 2941} {"train_loss": -11.178964614868164, "global_step": 494244, "epoch": 2941} {"train_loss": -10.865570068359375, "global_step": 494245, "epoch": 2941} {"train_loss": -11.030353546142578, "global_step": 494246, "epoch": 2941} {"train_loss": -9.721484184265137, "global_step": 494247, "epoch": 2941} {"train_loss": -9.13924789428711, "global_step": 494248, "epoch": 2941} {"train_loss": -11.31433391571045, "global_step": 494249, "epoch": 2941} {"train_loss": -10.594494819641113, "global_step": 494250, "epoch": 2941} {"train_loss": -10.582021713256836, "global_step": 494251, "epoch": 2941} {"train_loss": -8.989554405212402, "global_step": 494252, "epoch": 2941} {"train_loss": -9.356605529785156, "global_step": 494253, "epoch": 2941} {"train_loss": -9.055234909057617, "global_step": 494254, "epoch": 2941} {"train_loss": -12.198616856620426, "global_step": 494255, "epoch": 2941, "val_loss": 315485.1875} {"train_loss": -9.32911205291748, "global_step": 494256, "epoch": 2942} {"train_loss": -8.616336822509766, "global_step": 494257, "epoch": 2942} {"train_loss": -10.661749839782715, "global_step": 494258, "epoch": 2942} {"train_loss": -9.59829330444336, "global_step": 494259, "epoch": 2942} {"train_loss": -9.249232292175293, "global_step": 494260, "epoch": 2942} {"train_loss": -10.902276992797852, "global_step": 494261, "epoch": 2942} {"train_loss": -9.438339233398438, "global_step": 494262, "epoch": 2942} {"train_loss": -8.846227645874023, "global_step": 494263, "epoch": 2942} {"train_loss": -10.659168243408203, "global_step": 494264, "epoch": 2942} {"train_loss": -10.498066902160645, "global_step": 494265, "epoch": 2942} {"train_loss": -11.024557113647461, "global_step": 494266, "epoch": 2942} {"train_loss": -9.624771118164062, "global_step": 494267, "epoch": 2942} {"train_loss": -11.03152084350586, "global_step": 494268, "epoch": 2942} {"train_loss": -10.689037322998047, "global_step": 494269, "epoch": 2942} {"train_loss": -11.431405067443848, "global_step": 494270, "epoch": 2942} {"train_loss": -11.503802299499512, "global_step": 494271, "epoch": 2942} {"train_loss": -11.642744064331055, "global_step": 494272, "epoch": 2942} {"train_loss": -11.49874496459961, "global_step": 494273, "epoch": 2942} {"train_loss": -11.644542694091797, "global_step": 494274, "epoch": 2942} {"train_loss": -11.880106925964355, "global_step": 494275, "epoch": 2942} {"train_loss": -11.09178352355957, "global_step": 494276, "epoch": 2942} {"train_loss": -11.834707260131836, "global_step": 494277, "epoch": 2942} {"train_loss": -12.195731163024902, "global_step": 494278, "epoch": 2942} {"train_loss": -11.602392196655273, "global_step": 494279, "epoch": 2942} {"train_loss": -12.016839981079102, "global_step": 494280, "epoch": 2942} {"train_loss": -11.869970321655273, "global_step": 494281, "epoch": 2942} {"train_loss": -11.767776489257812, "global_step": 494282, "epoch": 2942} {"train_loss": -11.541280746459961, "global_step": 494283, "epoch": 2942} {"train_loss": -12.156105995178223, "global_step": 494284, "epoch": 2942} {"train_loss": -11.906329154968262, "global_step": 494285, "epoch": 2942} {"train_loss": -12.518695831298828, "global_step": 494286, "epoch": 2942} {"train_loss": -11.824119567871094, "global_step": 494287, "epoch": 2942} {"train_loss": -12.387519836425781, "global_step": 494288, "epoch": 2942} {"train_loss": -12.016120910644531, "global_step": 494289, "epoch": 2942} {"train_loss": -12.284313201904297, "global_step": 494290, "epoch": 2942} {"train_loss": -11.761162757873535, "global_step": 494291, "epoch": 2942} {"train_loss": -12.331588745117188, "global_step": 494292, "epoch": 2942} {"train_loss": -12.210573196411133, "global_step": 494293, "epoch": 2942} {"train_loss": -12.281282424926758, "global_step": 494294, "epoch": 2942} {"train_loss": -12.199819564819336, "global_step": 494295, "epoch": 2942} {"train_loss": -12.381401062011719, "global_step": 494296, "epoch": 2942} {"train_loss": -12.416845321655273, "global_step": 494297, "epoch": 2942} {"train_loss": -11.856083869934082, "global_step": 494298, "epoch": 2942} {"train_loss": -12.598199844360352, "global_step": 494299, "epoch": 2942} {"train_loss": -11.981952667236328, "global_step": 494300, "epoch": 2942} {"train_loss": -12.286194801330566, "global_step": 494301, "epoch": 2942} {"train_loss": -12.152158737182617, "global_step": 494302, "epoch": 2942} {"train_loss": -12.426231384277344, "global_step": 494303, "epoch": 2942} {"train_loss": -12.175117492675781, "global_step": 494304, "epoch": 2942} {"train_loss": -12.308125495910645, "global_step": 494305, "epoch": 2942} {"train_loss": -12.220510482788086, "global_step": 494306, "epoch": 2942} {"train_loss": -12.428013801574707, "global_step": 494307, "epoch": 2942} {"train_loss": -12.35377025604248, "global_step": 494308, "epoch": 2942} {"train_loss": -12.403772354125977, "global_step": 494309, "epoch": 2942} {"train_loss": -12.274641990661621, "global_step": 494310, "epoch": 2942} {"train_loss": -12.354229927062988, "global_step": 494311, "epoch": 2942} {"train_loss": -12.621391296386719, "global_step": 494312, "epoch": 2942} {"train_loss": -12.512954711914062, "global_step": 494313, "epoch": 2942} {"train_loss": -12.542811393737793, "global_step": 494314, "epoch": 2942} {"train_loss": -12.385282516479492, "global_step": 494315, "epoch": 2942} {"train_loss": -12.529806137084961, "global_step": 494316, "epoch": 2942} {"train_loss": -12.542182922363281, "global_step": 494317, "epoch": 2942} {"train_loss": -12.448748588562012, "global_step": 494318, "epoch": 2942} {"train_loss": -12.419829368591309, "global_step": 494319, "epoch": 2942} {"train_loss": -12.689821243286133, "global_step": 494320, "epoch": 2942} {"train_loss": -12.268922805786133, "global_step": 494321, "epoch": 2942} {"train_loss": -12.683691024780273, "global_step": 494322, "epoch": 2942} {"train_loss": -12.425627708435059, "global_step": 494323, "epoch": 2942} {"train_loss": -12.268183708190918, "global_step": 494324, "epoch": 2942} {"train_loss": -12.630956649780273, "global_step": 494325, "epoch": 2942} {"train_loss": -12.501836776733398, "global_step": 494326, "epoch": 2942} {"train_loss": -12.648397445678711, "global_step": 494327, "epoch": 2942} {"train_loss": -12.363042831420898, "global_step": 494328, "epoch": 2942} {"train_loss": -12.595809936523438, "global_step": 494329, "epoch": 2942} {"train_loss": -12.66775894165039, "global_step": 494330, "epoch": 2942} {"train_loss": -12.119837760925293, "global_step": 494331, "epoch": 2942} {"train_loss": -12.403741836547852, "global_step": 494332, "epoch": 2942} {"train_loss": -12.185908317565918, "global_step": 494333, "epoch": 2942} {"train_loss": -12.09885025024414, "global_step": 494334, "epoch": 2942} {"train_loss": -11.999629974365234, "global_step": 494335, "epoch": 2942} {"train_loss": -11.98536491394043, "global_step": 494336, "epoch": 2942} {"train_loss": -11.855490684509277, "global_step": 494337, "epoch": 2942} {"train_loss": -12.4091157913208, "global_step": 494338, "epoch": 2942} {"train_loss": -11.979822158813477, "global_step": 494339, "epoch": 2942} {"train_loss": -12.642080307006836, "global_step": 494340, "epoch": 2942} {"train_loss": -12.588738441467285, "global_step": 494341, "epoch": 2942} {"train_loss": -12.314299583435059, "global_step": 494342, "epoch": 2942} {"train_loss": -12.716570854187012, "global_step": 494343, "epoch": 2942} {"train_loss": -12.226522445678711, "global_step": 494344, "epoch": 2942} {"train_loss": -12.625879287719727, "global_step": 494345, "epoch": 2942} {"train_loss": -12.663002014160156, "global_step": 494346, "epoch": 2942} {"train_loss": -12.318098068237305, "global_step": 494347, "epoch": 2942} {"train_loss": -12.578369140625, "global_step": 494348, "epoch": 2942} {"train_loss": -12.38765811920166, "global_step": 494349, "epoch": 2942} {"train_loss": -12.586017608642578, "global_step": 494350, "epoch": 2942} {"train_loss": -12.459749221801758, "global_step": 494351, "epoch": 2942} {"train_loss": -12.316762924194336, "global_step": 494352, "epoch": 2942} {"train_loss": -12.499343872070312, "global_step": 494353, "epoch": 2942} {"train_loss": -12.022544860839844, "global_step": 494354, "epoch": 2942} {"train_loss": -12.393472671508789, "global_step": 494355, "epoch": 2942} {"train_loss": -11.956193923950195, "global_step": 494356, "epoch": 2942} {"train_loss": -12.807778358459473, "global_step": 494357, "epoch": 2942} {"train_loss": -12.106487274169922, "global_step": 494358, "epoch": 2942} {"train_loss": -12.652904510498047, "global_step": 494359, "epoch": 2942} {"train_loss": -12.538240432739258, "global_step": 494360, "epoch": 2942} {"train_loss": -12.47136116027832, "global_step": 494361, "epoch": 2942} {"train_loss": -12.707250595092773, "global_step": 494362, "epoch": 2942} {"train_loss": -12.63193130493164, "global_step": 494363, "epoch": 2942} {"train_loss": -12.831652641296387, "global_step": 494364, "epoch": 2942} {"train_loss": -12.771273612976074, "global_step": 494365, "epoch": 2942} {"train_loss": -12.803655624389648, "global_step": 494366, "epoch": 2942} {"train_loss": -12.709511756896973, "global_step": 494367, "epoch": 2942} {"train_loss": -12.617112159729004, "global_step": 494368, "epoch": 2942} {"train_loss": -12.994963645935059, "global_step": 494369, "epoch": 2942} {"train_loss": -12.786870956420898, "global_step": 494370, "epoch": 2942} {"train_loss": -12.638684272766113, "global_step": 494371, "epoch": 2942} {"train_loss": -12.771241188049316, "global_step": 494372, "epoch": 2942} {"train_loss": -12.68886947631836, "global_step": 494373, "epoch": 2942} {"train_loss": -12.926031112670898, "global_step": 494374, "epoch": 2942} {"train_loss": -12.895770072937012, "global_step": 494375, "epoch": 2942} {"train_loss": -12.654861450195312, "global_step": 494376, "epoch": 2942} {"train_loss": -13.011805534362793, "global_step": 494377, "epoch": 2942} {"train_loss": -12.806862831115723, "global_step": 494378, "epoch": 2942} {"train_loss": -12.846923828125, "global_step": 494379, "epoch": 2942} {"train_loss": -13.036741256713867, "global_step": 494380, "epoch": 2942} {"train_loss": -12.798492431640625, "global_step": 494381, "epoch": 2942} {"train_loss": -12.89948558807373, "global_step": 494382, "epoch": 2942} {"train_loss": -12.83215045928955, "global_step": 494383, "epoch": 2942} {"train_loss": -12.899737358093262, "global_step": 494384, "epoch": 2942} {"train_loss": -12.69979476928711, "global_step": 494385, "epoch": 2942} {"train_loss": -12.928445816040039, "global_step": 494386, "epoch": 2942} {"train_loss": -12.627742767333984, "global_step": 494387, "epoch": 2942} {"train_loss": -12.975300788879395, "global_step": 494388, "epoch": 2942} {"train_loss": -13.06299114227295, "global_step": 494389, "epoch": 2942} {"train_loss": -13.084228515625, "global_step": 494390, "epoch": 2942} {"train_loss": -12.516281127929688, "global_step": 494391, "epoch": 2942} {"train_loss": -12.808488845825195, "global_step": 494392, "epoch": 2942} {"train_loss": -12.771129608154297, "global_step": 494393, "epoch": 2942} {"train_loss": -12.646637916564941, "global_step": 494394, "epoch": 2942} {"train_loss": -12.810060501098633, "global_step": 494395, "epoch": 2942} {"train_loss": -13.047601699829102, "global_step": 494396, "epoch": 2942} {"train_loss": -12.294614791870117, "global_step": 494397, "epoch": 2942} {"train_loss": -13.076074600219727, "global_step": 494398, "epoch": 2942} {"train_loss": -12.354387283325195, "global_step": 494399, "epoch": 2942} {"train_loss": -12.47911262512207, "global_step": 494400, "epoch": 2942} {"train_loss": -12.758447647094727, "global_step": 494401, "epoch": 2942} {"train_loss": -12.668664932250977, "global_step": 494402, "epoch": 2942} {"train_loss": -12.600659370422363, "global_step": 494403, "epoch": 2942} {"train_loss": -12.533160209655762, "global_step": 494404, "epoch": 2942} {"train_loss": -12.162178039550781, "global_step": 494405, "epoch": 2942} {"train_loss": -12.55942153930664, "global_step": 494406, "epoch": 2942} {"train_loss": -12.470849990844727, "global_step": 494407, "epoch": 2942} {"train_loss": -12.232769012451172, "global_step": 494408, "epoch": 2942} {"train_loss": -11.99461555480957, "global_step": 494409, "epoch": 2942} {"train_loss": -12.480607986450195, "global_step": 494410, "epoch": 2942} {"train_loss": -12.453418731689453, "global_step": 494411, "epoch": 2942} {"train_loss": -12.585824966430664, "global_step": 494412, "epoch": 2942} {"train_loss": -12.593635559082031, "global_step": 494413, "epoch": 2942} {"train_loss": -12.376980781555176, "global_step": 494414, "epoch": 2942} {"train_loss": -12.401718139648438, "global_step": 494415, "epoch": 2942} {"train_loss": -12.669134140014648, "global_step": 494416, "epoch": 2942} {"train_loss": -12.734720230102539, "global_step": 494417, "epoch": 2942} {"train_loss": -12.728837966918945, "global_step": 494418, "epoch": 2942} {"train_loss": -12.778958320617676, "global_step": 494419, "epoch": 2942} {"train_loss": -12.78125286102295, "global_step": 494420, "epoch": 2942} {"train_loss": -12.866899490356445, "global_step": 494421, "epoch": 2942} {"train_loss": -12.296510696411133, "global_step": 494422, "epoch": 2942} {"train_loss": -12.227114382244292, "global_step": 494423, "epoch": 2942, "val_loss": 320353.9375} {"train_loss": -12.818277359008789, "global_step": 494424, "epoch": 2943} {"train_loss": -12.489751815795898, "global_step": 494425, "epoch": 2943} {"train_loss": -11.939066886901855, "global_step": 494426, "epoch": 2943} {"train_loss": -12.799964904785156, "global_step": 494427, "epoch": 2943} {"train_loss": -11.87651252746582, "global_step": 494428, "epoch": 2943} {"train_loss": -12.190624237060547, "global_step": 494429, "epoch": 2943} {"train_loss": -11.428502082824707, "global_step": 494430, "epoch": 2943} {"train_loss": -12.047298431396484, "global_step": 494431, "epoch": 2943} {"train_loss": -11.038461685180664, "global_step": 494432, "epoch": 2943} {"train_loss": -11.851226806640625, "global_step": 494433, "epoch": 2943} {"train_loss": -11.312541007995605, "global_step": 494434, "epoch": 2943} {"train_loss": -12.153264999389648, "global_step": 494435, "epoch": 2943} {"train_loss": -11.690004348754883, "global_step": 494436, "epoch": 2943} {"train_loss": -11.609621047973633, "global_step": 494437, "epoch": 2943} {"train_loss": -10.689011573791504, "global_step": 494438, "epoch": 2943} {"train_loss": -12.346746444702148, "global_step": 494439, "epoch": 2943} {"train_loss": -11.118032455444336, "global_step": 494440, "epoch": 2943} {"train_loss": -11.510400772094727, "global_step": 494441, "epoch": 2943} {"train_loss": -12.065116882324219, "global_step": 494442, "epoch": 2943} {"train_loss": -10.45406436920166, "global_step": 494443, "epoch": 2943} {"train_loss": -11.774524688720703, "global_step": 494444, "epoch": 2943} {"train_loss": -11.783346176147461, "global_step": 494445, "epoch": 2943} {"train_loss": -10.707486152648926, "global_step": 494446, "epoch": 2943} {"train_loss": -12.242536544799805, "global_step": 494447, "epoch": 2943} {"train_loss": -10.873730659484863, "global_step": 494448, "epoch": 2943} {"train_loss": -11.861217498779297, "global_step": 494449, "epoch": 2943} {"train_loss": -11.590290069580078, "global_step": 494450, "epoch": 2943} {"train_loss": -11.656244277954102, "global_step": 494451, "epoch": 2943} {"train_loss": -12.10219669342041, "global_step": 494452, "epoch": 2943} {"train_loss": -11.886770248413086, "global_step": 494453, "epoch": 2943} {"train_loss": -12.323424339294434, "global_step": 494454, "epoch": 2943} {"train_loss": -12.192218780517578, "global_step": 494455, "epoch": 2943} {"train_loss": -11.920888900756836, "global_step": 494456, "epoch": 2943} {"train_loss": -12.154603958129883, "global_step": 494457, "epoch": 2943} {"train_loss": -11.92410659790039, "global_step": 494458, "epoch": 2943} {"train_loss": -12.303136825561523, "global_step": 494459, "epoch": 2943} {"train_loss": -11.713380813598633, "global_step": 494460, "epoch": 2943} {"train_loss": -12.153712272644043, "global_step": 494461, "epoch": 2943} {"train_loss": -12.5093994140625, "global_step": 494462, "epoch": 2943} {"train_loss": -12.20961856842041, "global_step": 494463, "epoch": 2943} {"train_loss": -11.51537799835205, "global_step": 494464, "epoch": 2943} {"train_loss": -10.991134643554688, "global_step": 494465, "epoch": 2943} {"train_loss": -11.391420364379883, "global_step": 494466, "epoch": 2943} {"train_loss": -11.63036823272705, "global_step": 494467, "epoch": 2943} {"train_loss": -11.86274528503418, "global_step": 494468, "epoch": 2943} {"train_loss": -11.637953758239746, "global_step": 494469, "epoch": 2943} {"train_loss": -11.265907287597656, "global_step": 494470, "epoch": 2943} {"train_loss": -11.544321060180664, "global_step": 494471, "epoch": 2943} {"train_loss": -11.606168746948242, "global_step": 494472, "epoch": 2943} {"train_loss": -11.347275733947754, "global_step": 494473, "epoch": 2943} {"train_loss": -12.13306999206543, "global_step": 494474, "epoch": 2943} {"train_loss": -11.389840126037598, "global_step": 494475, "epoch": 2943} {"train_loss": -12.04672622680664, "global_step": 494476, "epoch": 2943} {"train_loss": -11.401851654052734, "global_step": 494477, "epoch": 2943} {"train_loss": -12.197738647460938, "global_step": 494478, "epoch": 2943} {"train_loss": -11.039962768554688, "global_step": 494479, "epoch": 2943} {"train_loss": -11.098477363586426, "global_step": 494480, "epoch": 2943} {"train_loss": -12.053665161132812, "global_step": 494481, "epoch": 2943} {"train_loss": -11.561964988708496, "global_step": 494482, "epoch": 2943} {"train_loss": -12.1927490234375, "global_step": 494483, "epoch": 2943} {"train_loss": -12.31559944152832, "global_step": 494484, "epoch": 2943} {"train_loss": -11.792258262634277, "global_step": 494485, "epoch": 2943} {"train_loss": -11.792019844055176, "global_step": 494486, "epoch": 2943} {"train_loss": -11.55202579498291, "global_step": 494487, "epoch": 2943} {"train_loss": -11.801919937133789, "global_step": 494488, "epoch": 2943} {"train_loss": -11.550291061401367, "global_step": 494489, "epoch": 2943} {"train_loss": -11.172530174255371, "global_step": 494490, "epoch": 2943} {"train_loss": -11.65671443939209, "global_step": 494491, "epoch": 2943} {"train_loss": -11.722753524780273, "global_step": 494492, "epoch": 2943} {"train_loss": -11.862958908081055, "global_step": 494493, "epoch": 2943} {"train_loss": -12.508564949035645, "global_step": 494494, "epoch": 2943} {"train_loss": -12.216800689697266, "global_step": 494495, "epoch": 2943} {"train_loss": -12.319931030273438, "global_step": 494496, "epoch": 2943} {"train_loss": -11.912713050842285, "global_step": 494497, "epoch": 2943} {"train_loss": -12.097368240356445, "global_step": 494498, "epoch": 2943} {"train_loss": -12.4556245803833, "global_step": 494499, "epoch": 2943} {"train_loss": -12.196331024169922, "global_step": 494500, "epoch": 2943} {"train_loss": -12.405181884765625, "global_step": 494501, "epoch": 2943} {"train_loss": -12.350092887878418, "global_step": 494502, "epoch": 2943} {"train_loss": -12.364885330200195, "global_step": 494503, "epoch": 2943} {"train_loss": -12.220792770385742, "global_step": 494504, "epoch": 2943} {"train_loss": -12.395013809204102, "global_step": 494505, "epoch": 2943} {"train_loss": -12.379877090454102, "global_step": 494506, "epoch": 2943} {"train_loss": -12.185192108154297, "global_step": 494507, "epoch": 2943} {"train_loss": -12.42052173614502, "global_step": 494508, "epoch": 2943} {"train_loss": -12.361970901489258, "global_step": 494509, "epoch": 2943} {"train_loss": -12.130772590637207, "global_step": 494510, "epoch": 2943} {"train_loss": -12.29304313659668, "global_step": 494511, "epoch": 2943} {"train_loss": -12.47050666809082, "global_step": 494512, "epoch": 2943} {"train_loss": -12.356199264526367, "global_step": 494513, "epoch": 2943} {"train_loss": -11.720626831054688, "global_step": 494514, "epoch": 2943} {"train_loss": -10.900167465209961, "global_step": 494515, "epoch": 2943} {"train_loss": -12.155243873596191, "global_step": 494516, "epoch": 2943} {"train_loss": -10.943267822265625, "global_step": 494517, "epoch": 2943} {"train_loss": -12.29873275756836, "global_step": 494518, "epoch": 2943} {"train_loss": -11.294620513916016, "global_step": 494519, "epoch": 2943} {"train_loss": -12.286001205444336, "global_step": 494520, "epoch": 2943} {"train_loss": -11.715925216674805, "global_step": 494521, "epoch": 2943} {"train_loss": -11.74842643737793, "global_step": 494522, "epoch": 2943} {"train_loss": -12.126178741455078, "global_step": 494523, "epoch": 2943} {"train_loss": -11.905689239501953, "global_step": 494524, "epoch": 2943} {"train_loss": -12.397027969360352, "global_step": 494525, "epoch": 2943} {"train_loss": -11.606086730957031, "global_step": 494526, "epoch": 2943} {"train_loss": -12.597455024719238, "global_step": 494527, "epoch": 2943} {"train_loss": -11.518845558166504, "global_step": 494528, "epoch": 2943} {"train_loss": -12.617830276489258, "global_step": 494529, "epoch": 2943} {"train_loss": -12.205606460571289, "global_step": 494530, "epoch": 2943} {"train_loss": -12.438737869262695, "global_step": 494531, "epoch": 2943} {"train_loss": -12.328866004943848, "global_step": 494532, "epoch": 2943} {"train_loss": -11.870880126953125, "global_step": 494533, "epoch": 2943} {"train_loss": -12.47130012512207, "global_step": 494534, "epoch": 2943} {"train_loss": -12.539833068847656, "global_step": 494535, "epoch": 2943} {"train_loss": -12.535094261169434, "global_step": 494536, "epoch": 2943} {"train_loss": -12.532151222229004, "global_step": 494537, "epoch": 2943} {"train_loss": -12.542024612426758, "global_step": 494538, "epoch": 2943} {"train_loss": -12.589698791503906, "global_step": 494539, "epoch": 2943} {"train_loss": -12.591034889221191, "global_step": 494540, "epoch": 2943} {"train_loss": -12.813140869140625, "global_step": 494541, "epoch": 2943} {"train_loss": -12.523244857788086, "global_step": 494542, "epoch": 2943} {"train_loss": -12.753235816955566, "global_step": 494543, "epoch": 2943} {"train_loss": -12.782112121582031, "global_step": 494544, "epoch": 2943} {"train_loss": -12.324475288391113, "global_step": 494545, "epoch": 2943} {"train_loss": -12.8002290725708, "global_step": 494546, "epoch": 2943} {"train_loss": -12.793094635009766, "global_step": 494547, "epoch": 2943} {"train_loss": -12.73604679107666, "global_step": 494548, "epoch": 2943} {"train_loss": -12.723651885986328, "global_step": 494549, "epoch": 2943} {"train_loss": -12.565935134887695, "global_step": 494550, "epoch": 2943} {"train_loss": -12.590142250061035, "global_step": 494551, "epoch": 2943} {"train_loss": -12.295480728149414, "global_step": 494552, "epoch": 2943} {"train_loss": -12.853466033935547, "global_step": 494553, "epoch": 2943} {"train_loss": -12.763785362243652, "global_step": 494554, "epoch": 2943} {"train_loss": -12.541362762451172, "global_step": 494555, "epoch": 2943} {"train_loss": -12.669912338256836, "global_step": 494556, "epoch": 2943} {"train_loss": -12.190041542053223, "global_step": 494557, "epoch": 2943} {"train_loss": -12.912857055664062, "global_step": 494558, "epoch": 2943} {"train_loss": -12.247159004211426, "global_step": 494559, "epoch": 2943} {"train_loss": -12.511558532714844, "global_step": 494560, "epoch": 2943} {"train_loss": -12.552135467529297, "global_step": 494561, "epoch": 2943} {"train_loss": -12.782814025878906, "global_step": 494562, "epoch": 2943} {"train_loss": -12.65350341796875, "global_step": 494563, "epoch": 2943} {"train_loss": -12.676209449768066, "global_step": 494564, "epoch": 2943} {"train_loss": -12.413804054260254, "global_step": 494565, "epoch": 2943} {"train_loss": -12.770431518554688, "global_step": 494566, "epoch": 2943} {"train_loss": -12.65518856048584, "global_step": 494567, "epoch": 2943} {"train_loss": -12.718944549560547, "global_step": 494568, "epoch": 2943} {"train_loss": -12.503629684448242, "global_step": 494569, "epoch": 2943} {"train_loss": -12.781773567199707, "global_step": 494570, "epoch": 2943} {"train_loss": -12.105691909790039, "global_step": 494571, "epoch": 2943} {"train_loss": -12.769744873046875, "global_step": 494572, "epoch": 2943} {"train_loss": -12.860322952270508, "global_step": 494573, "epoch": 2943} {"train_loss": -12.713421821594238, "global_step": 494574, "epoch": 2943} {"train_loss": -12.8034029006958, "global_step": 494575, "epoch": 2943} {"train_loss": -12.778826713562012, "global_step": 494576, "epoch": 2943} {"train_loss": -12.730440139770508, "global_step": 494577, "epoch": 2943} {"train_loss": -12.581853866577148, "global_step": 494578, "epoch": 2943} {"train_loss": -12.594147682189941, "global_step": 494579, "epoch": 2943} {"train_loss": -12.943201065063477, "global_step": 494580, "epoch": 2943} {"train_loss": -12.58693790435791, "global_step": 494581, "epoch": 2943} {"train_loss": -12.942337036132812, "global_step": 494582, "epoch": 2943} {"train_loss": -12.751938819885254, "global_step": 494583, "epoch": 2943} {"train_loss": -12.815916061401367, "global_step": 494584, "epoch": 2943} {"train_loss": -12.731593132019043, "global_step": 494585, "epoch": 2943} {"train_loss": -12.736026763916016, "global_step": 494586, "epoch": 2943} {"train_loss": -12.818075180053711, "global_step": 494587, "epoch": 2943} {"train_loss": -12.87596607208252, "global_step": 494588, "epoch": 2943} {"train_loss": -12.793210983276367, "global_step": 494589, "epoch": 2943} {"train_loss": -12.898147583007812, "global_step": 494590, "epoch": 2943} {"train_loss": -12.153491133735294, "global_step": 494591, "epoch": 2943, "val_loss": 318778.78125} {"train_loss": -13.145883560180664, "global_step": 494592, "epoch": 2944} {"train_loss": -13.018016815185547, "global_step": 494593, "epoch": 2944} {"train_loss": -12.873828887939453, "global_step": 494594, "epoch": 2944} {"train_loss": -13.036811828613281, "global_step": 494595, "epoch": 2944} {"train_loss": -12.875845909118652, "global_step": 494596, "epoch": 2944} {"train_loss": -12.586883544921875, "global_step": 494597, "epoch": 2944} {"train_loss": -12.88228988647461, "global_step": 494598, "epoch": 2944} {"train_loss": -13.09515380859375, "global_step": 494599, "epoch": 2944} {"train_loss": -12.48173713684082, "global_step": 494600, "epoch": 2944} {"train_loss": -12.562997817993164, "global_step": 494601, "epoch": 2944} {"train_loss": -12.907198905944824, "global_step": 494602, "epoch": 2944} {"train_loss": -12.634809494018555, "global_step": 494603, "epoch": 2944} {"train_loss": -12.804254531860352, "global_step": 494604, "epoch": 2944} {"train_loss": -12.31159782409668, "global_step": 494605, "epoch": 2944} {"train_loss": -13.054411888122559, "global_step": 494606, "epoch": 2944} {"train_loss": -12.340986251831055, "global_step": 494607, "epoch": 2944} {"train_loss": -12.467904090881348, "global_step": 494608, "epoch": 2944} {"train_loss": -12.478156089782715, "global_step": 494609, "epoch": 2944} {"train_loss": -11.893059730529785, "global_step": 494610, "epoch": 2944} {"train_loss": -12.379125595092773, "global_step": 494611, "epoch": 2944} {"train_loss": -12.490605354309082, "global_step": 494612, "epoch": 2944} {"train_loss": -11.695350646972656, "global_step": 494613, "epoch": 2944} {"train_loss": -11.781190872192383, "global_step": 494614, "epoch": 2944} {"train_loss": -9.986875534057617, "global_step": 494615, "epoch": 2944} {"train_loss": -11.372312545776367, "global_step": 494616, "epoch": 2944} {"train_loss": -12.641500473022461, "global_step": 494617, "epoch": 2944} {"train_loss": -11.853330612182617, "global_step": 494618, "epoch": 2944} {"train_loss": -12.826042175292969, "global_step": 494619, "epoch": 2944} {"train_loss": -12.301006317138672, "global_step": 494620, "epoch": 2944} {"train_loss": -11.991071701049805, "global_step": 494621, "epoch": 2944} {"train_loss": -12.748490333557129, "global_step": 494622, "epoch": 2944} {"train_loss": -12.47067642211914, "global_step": 494623, "epoch": 2944} {"train_loss": -12.603668212890625, "global_step": 494624, "epoch": 2944} {"train_loss": -12.369121551513672, "global_step": 494625, "epoch": 2944} {"train_loss": -12.72579574584961, "global_step": 494626, "epoch": 2944} {"train_loss": -12.493316650390625, "global_step": 494627, "epoch": 2944} {"train_loss": -12.542262077331543, "global_step": 494628, "epoch": 2944} {"train_loss": -12.031492233276367, "global_step": 494629, "epoch": 2944} {"train_loss": -11.695073127746582, "global_step": 494630, "epoch": 2944} {"train_loss": -12.64389419555664, "global_step": 494631, "epoch": 2944} {"train_loss": -11.64875602722168, "global_step": 494632, "epoch": 2944} {"train_loss": -11.703758239746094, "global_step": 494633, "epoch": 2944} {"train_loss": -11.82241439819336, "global_step": 494634, "epoch": 2944} {"train_loss": -10.371580123901367, "global_step": 494635, "epoch": 2944} {"train_loss": -11.749134063720703, "global_step": 494636, "epoch": 2944} {"train_loss": -10.49903678894043, "global_step": 494637, "epoch": 2944} {"train_loss": -10.527060508728027, "global_step": 494638, "epoch": 2944} {"train_loss": -11.318567276000977, "global_step": 494639, "epoch": 2944} {"train_loss": -11.444766998291016, "global_step": 494640, "epoch": 2944} {"train_loss": -11.24108600616455, "global_step": 494641, "epoch": 2944} {"train_loss": -11.998902320861816, "global_step": 494642, "epoch": 2944} {"train_loss": -11.184982299804688, "global_step": 494643, "epoch": 2944} {"train_loss": -12.325931549072266, "global_step": 494644, "epoch": 2944} {"train_loss": -10.720154762268066, "global_step": 494645, "epoch": 2944} {"train_loss": -11.48563003540039, "global_step": 494646, "epoch": 2944} {"train_loss": -11.48121452331543, "global_step": 494647, "epoch": 2944} {"train_loss": -11.531342506408691, "global_step": 494648, "epoch": 2944} {"train_loss": -12.10120677947998, "global_step": 494649, "epoch": 2944} {"train_loss": -11.632776260375977, "global_step": 494650, "epoch": 2944} {"train_loss": -12.395898818969727, "global_step": 494651, "epoch": 2944} {"train_loss": -12.166374206542969, "global_step": 494652, "epoch": 2944} {"train_loss": -11.934431076049805, "global_step": 494653, "epoch": 2944} {"train_loss": -12.154292106628418, "global_step": 494654, "epoch": 2944} {"train_loss": -12.262574195861816, "global_step": 494655, "epoch": 2944} {"train_loss": -12.62896728515625, "global_step": 494656, "epoch": 2944} {"train_loss": -12.617841720581055, "global_step": 494657, "epoch": 2944} {"train_loss": -12.777740478515625, "global_step": 494658, "epoch": 2944} {"train_loss": -12.522878646850586, "global_step": 494659, "epoch": 2944} {"train_loss": -12.69631290435791, "global_step": 494660, "epoch": 2944} {"train_loss": -12.76010513305664, "global_step": 494661, "epoch": 2944} {"train_loss": -12.72804069519043, "global_step": 494662, "epoch": 2944} {"train_loss": -12.815483093261719, "global_step": 494663, "epoch": 2944} {"train_loss": -12.598749160766602, "global_step": 494664, "epoch": 2944} {"train_loss": -12.78664779663086, "global_step": 494665, "epoch": 2944} {"train_loss": -12.580673217773438, "global_step": 494666, "epoch": 2944} {"train_loss": -12.520813941955566, "global_step": 494667, "epoch": 2944} {"train_loss": -12.871088027954102, "global_step": 494668, "epoch": 2944} {"train_loss": -12.674022674560547, "global_step": 494669, "epoch": 2944} {"train_loss": -12.767037391662598, "global_step": 494670, "epoch": 2944} {"train_loss": -12.941930770874023, "global_step": 494671, "epoch": 2944} {"train_loss": -12.560741424560547, "global_step": 494672, "epoch": 2944} {"train_loss": -12.629615783691406, "global_step": 494673, "epoch": 2944} {"train_loss": -12.737001419067383, "global_step": 494674, "epoch": 2944} {"train_loss": -12.630622863769531, "global_step": 494675, "epoch": 2944} {"train_loss": -12.813106536865234, "global_step": 494676, "epoch": 2944} {"train_loss": -12.748676300048828, "global_step": 494677, "epoch": 2944} {"train_loss": -12.531991004943848, "global_step": 494678, "epoch": 2944} {"train_loss": -12.734830856323242, "global_step": 494679, "epoch": 2944} {"train_loss": -12.690250396728516, "global_step": 494680, "epoch": 2944} {"train_loss": -12.737020492553711, "global_step": 494681, "epoch": 2944} {"train_loss": -12.690383911132812, "global_step": 494682, "epoch": 2944} {"train_loss": -12.757909774780273, "global_step": 494683, "epoch": 2944} {"train_loss": -12.596272468566895, "global_step": 494684, "epoch": 2944} {"train_loss": -13.138105392456055, "global_step": 494685, "epoch": 2944} {"train_loss": -12.789661407470703, "global_step": 494686, "epoch": 2944} {"train_loss": -13.020318031311035, "global_step": 494687, "epoch": 2944} {"train_loss": -12.945232391357422, "global_step": 494688, "epoch": 2944} {"train_loss": -12.912463188171387, "global_step": 494689, "epoch": 2944} {"train_loss": -12.852073669433594, "global_step": 494690, "epoch": 2944} {"train_loss": -13.098060607910156, "global_step": 494691, "epoch": 2944} {"train_loss": -12.915494918823242, "global_step": 494692, "epoch": 2944} {"train_loss": -12.775659561157227, "global_step": 494693, "epoch": 2944} {"train_loss": -13.050917625427246, "global_step": 494694, "epoch": 2944} {"train_loss": -13.164664268493652, "global_step": 494695, "epoch": 2944} {"train_loss": -13.196971893310547, "global_step": 494696, "epoch": 2944} {"train_loss": -13.177689552307129, "global_step": 494697, "epoch": 2944} {"train_loss": -13.132010459899902, "global_step": 494698, "epoch": 2944} {"train_loss": -12.71273422241211, "global_step": 494699, "epoch": 2944} {"train_loss": -12.523809432983398, "global_step": 494700, "epoch": 2944} {"train_loss": -12.568483352661133, "global_step": 494701, "epoch": 2944} {"train_loss": -12.461958885192871, "global_step": 494702, "epoch": 2944} {"train_loss": -12.618102073669434, "global_step": 494703, "epoch": 2944} {"train_loss": -13.10326099395752, "global_step": 494704, "epoch": 2944} {"train_loss": -12.971025466918945, "global_step": 494705, "epoch": 2944} {"train_loss": -12.582932472229004, "global_step": 494706, "epoch": 2944} {"train_loss": -12.188192367553711, "global_step": 494707, "epoch": 2944} {"train_loss": -12.839115142822266, "global_step": 494708, "epoch": 2944} {"train_loss": -12.421903610229492, "global_step": 494709, "epoch": 2944} {"train_loss": -12.067737579345703, "global_step": 494710, "epoch": 2944} {"train_loss": -11.31360912322998, "global_step": 494711, "epoch": 2944} {"train_loss": -11.512897491455078, "global_step": 494712, "epoch": 2944} {"train_loss": -11.695213317871094, "global_step": 494713, "epoch": 2944} {"train_loss": -12.702762603759766, "global_step": 494714, "epoch": 2944} {"train_loss": -10.853597640991211, "global_step": 494715, "epoch": 2944} {"train_loss": -9.893157005310059, "global_step": 494716, "epoch": 2944} {"train_loss": -12.574333190917969, "global_step": 494717, "epoch": 2944} {"train_loss": -9.463349342346191, "global_step": 494718, "epoch": 2944} {"train_loss": -11.68785285949707, "global_step": 494719, "epoch": 2944} {"train_loss": -9.542007446289062, "global_step": 494720, "epoch": 2944} {"train_loss": -10.873587608337402, "global_step": 494721, "epoch": 2944} {"train_loss": -8.937461853027344, "global_step": 494722, "epoch": 2944} {"train_loss": -11.411660194396973, "global_step": 494723, "epoch": 2944} {"train_loss": -8.125264167785645, "global_step": 494724, "epoch": 2944} {"train_loss": -9.393906593322754, "global_step": 494725, "epoch": 2944} {"train_loss": -9.28544807434082, "global_step": 494726, "epoch": 2944} {"train_loss": -8.373560905456543, "global_step": 494727, "epoch": 2944} {"train_loss": -8.242110252380371, "global_step": 494728, "epoch": 2944} {"train_loss": -8.69703483581543, "global_step": 494729, "epoch": 2944} {"train_loss": -9.032142639160156, "global_step": 494730, "epoch": 2944} {"train_loss": -8.852072715759277, "global_step": 494731, "epoch": 2944} {"train_loss": -8.649837493896484, "global_step": 494732, "epoch": 2944} {"train_loss": -7.838872909545898, "global_step": 494733, "epoch": 2944} {"train_loss": -8.388348579406738, "global_step": 494734, "epoch": 2944} {"train_loss": -9.844499588012695, "global_step": 494735, "epoch": 2944} {"train_loss": -10.130099296569824, "global_step": 494736, "epoch": 2944} {"train_loss": -10.427020072937012, "global_step": 494737, "epoch": 2944} {"train_loss": -10.905937194824219, "global_step": 494738, "epoch": 2944} {"train_loss": -9.10824203491211, "global_step": 494739, "epoch": 2944} {"train_loss": -10.342999458312988, "global_step": 494740, "epoch": 2944} {"train_loss": -10.342964172363281, "global_step": 494741, "epoch": 2944} {"train_loss": -9.860479354858398, "global_step": 494742, "epoch": 2944} {"train_loss": -11.440301895141602, "global_step": 494743, "epoch": 2944} {"train_loss": -10.64609432220459, "global_step": 494744, "epoch": 2944} {"train_loss": -9.959689140319824, "global_step": 494745, "epoch": 2944} {"train_loss": -11.304572105407715, "global_step": 494746, "epoch": 2944} {"train_loss": -9.411398887634277, "global_step": 494747, "epoch": 2944} {"train_loss": -10.588627815246582, "global_step": 494748, "epoch": 2944} {"train_loss": -10.8280029296875, "global_step": 494749, "epoch": 2944} {"train_loss": -10.809257507324219, "global_step": 494750, "epoch": 2944} {"train_loss": -10.263822555541992, "global_step": 494751, "epoch": 2944} {"train_loss": -11.532707214355469, "global_step": 494752, "epoch": 2944} {"train_loss": -9.406012535095215, "global_step": 494753, "epoch": 2944} {"train_loss": -10.201447486877441, "global_step": 494754, "epoch": 2944} {"train_loss": -10.727746963500977, "global_step": 494755, "epoch": 2944} {"train_loss": -10.403810501098633, "global_step": 494756, "epoch": 2944} {"train_loss": -11.125171661376953, "global_step": 494757, "epoch": 2944} {"train_loss": -11.334724426269531, "global_step": 494758, "epoch": 2944} {"train_loss": -11.761602532295953, "global_step": 494759, "epoch": 2944, "val_loss": 316696.125} {"train_loss": -11.214500427246094, "global_step": 494760, "epoch": 2945} {"train_loss": -11.848875045776367, "global_step": 494761, "epoch": 2945} {"train_loss": -11.100460052490234, "global_step": 494762, "epoch": 2945} {"train_loss": -11.945969581604004, "global_step": 494763, "epoch": 2945} {"train_loss": -11.510599136352539, "global_step": 494764, "epoch": 2945} {"train_loss": -12.046175003051758, "global_step": 494765, "epoch": 2945} {"train_loss": -12.087905883789062, "global_step": 494766, "epoch": 2945} {"train_loss": -11.893917083740234, "global_step": 494767, "epoch": 2945} {"train_loss": -12.14674186706543, "global_step": 494768, "epoch": 2945} {"train_loss": -12.178152084350586, "global_step": 494769, "epoch": 2945} {"train_loss": -12.246201515197754, "global_step": 494770, "epoch": 2945} {"train_loss": -12.3343505859375, "global_step": 494771, "epoch": 2945} {"train_loss": -12.064020156860352, "global_step": 494772, "epoch": 2945} {"train_loss": -12.234106063842773, "global_step": 494773, "epoch": 2945} {"train_loss": -12.270563125610352, "global_step": 494774, "epoch": 2945} {"train_loss": -12.260927200317383, "global_step": 494775, "epoch": 2945} {"train_loss": -12.285272598266602, "global_step": 494776, "epoch": 2945} {"train_loss": -12.416105270385742, "global_step": 494777, "epoch": 2945} {"train_loss": -12.5428466796875, "global_step": 494778, "epoch": 2945} {"train_loss": -12.528535842895508, "global_step": 494779, "epoch": 2945} {"train_loss": -12.534088134765625, "global_step": 494780, "epoch": 2945} {"train_loss": -12.472129821777344, "global_step": 494781, "epoch": 2945} {"train_loss": -12.288373947143555, "global_step": 494782, "epoch": 2945} {"train_loss": -12.648548126220703, "global_step": 494783, "epoch": 2945} {"train_loss": -12.326488494873047, "global_step": 494784, "epoch": 2945} {"train_loss": -12.566184997558594, "global_step": 494785, "epoch": 2945} {"train_loss": -12.555688858032227, "global_step": 494786, "epoch": 2945} {"train_loss": -12.666837692260742, "global_step": 494787, "epoch": 2945} {"train_loss": -12.530447006225586, "global_step": 494788, "epoch": 2945} {"train_loss": -12.58650016784668, "global_step": 494789, "epoch": 2945} {"train_loss": -12.548711776733398, "global_step": 494790, "epoch": 2945} {"train_loss": -12.667759895324707, "global_step": 494791, "epoch": 2945} {"train_loss": -12.558144569396973, "global_step": 494792, "epoch": 2945} {"train_loss": -12.65142822265625, "global_step": 494793, "epoch": 2945} {"train_loss": -12.529157638549805, "global_step": 494794, "epoch": 2945} {"train_loss": -12.719409942626953, "global_step": 494795, "epoch": 2945} {"train_loss": -12.618949890136719, "global_step": 494796, "epoch": 2945} {"train_loss": -12.546323776245117, "global_step": 494797, "epoch": 2945} {"train_loss": -12.50094223022461, "global_step": 494798, "epoch": 2945} {"train_loss": -12.62496566772461, "global_step": 494799, "epoch": 2945} {"train_loss": -12.543315887451172, "global_step": 494800, "epoch": 2945} {"train_loss": -12.595673561096191, "global_step": 494801, "epoch": 2945} {"train_loss": -12.72008228302002, "global_step": 494802, "epoch": 2945} {"train_loss": -12.61665153503418, "global_step": 494803, "epoch": 2945} {"train_loss": -12.681228637695312, "global_step": 494804, "epoch": 2945} {"train_loss": -12.828422546386719, "global_step": 494805, "epoch": 2945} {"train_loss": -12.51923656463623, "global_step": 494806, "epoch": 2945} {"train_loss": -12.518774032592773, "global_step": 494807, "epoch": 2945} {"train_loss": -12.597503662109375, "global_step": 494808, "epoch": 2945} {"train_loss": -12.502771377563477, "global_step": 494809, "epoch": 2945} {"train_loss": -12.777769088745117, "global_step": 494810, "epoch": 2945} {"train_loss": -12.92192268371582, "global_step": 494811, "epoch": 2945} {"train_loss": -12.763898849487305, "global_step": 494812, "epoch": 2945} {"train_loss": -12.7264404296875, "global_step": 494813, "epoch": 2945} {"train_loss": -12.70592975616455, "global_step": 494814, "epoch": 2945} {"train_loss": -12.590056419372559, "global_step": 494815, "epoch": 2945} {"train_loss": -12.684274673461914, "global_step": 494816, "epoch": 2945} {"train_loss": -12.803115844726562, "global_step": 494817, "epoch": 2945} {"train_loss": -12.637895584106445, "global_step": 494818, "epoch": 2945} {"train_loss": -12.741917610168457, "global_step": 494819, "epoch": 2945} {"train_loss": -12.845327377319336, "global_step": 494820, "epoch": 2945} {"train_loss": -12.795171737670898, "global_step": 494821, "epoch": 2945} {"train_loss": -12.77528190612793, "global_step": 494822, "epoch": 2945} {"train_loss": -12.804952621459961, "global_step": 494823, "epoch": 2945} {"train_loss": -12.647416114807129, "global_step": 494824, "epoch": 2945} {"train_loss": -12.83949089050293, "global_step": 494825, "epoch": 2945} {"train_loss": -12.933280944824219, "global_step": 494826, "epoch": 2945} {"train_loss": -12.64846420288086, "global_step": 494827, "epoch": 2945} {"train_loss": -12.859195709228516, "global_step": 494828, "epoch": 2945} {"train_loss": -12.992608070373535, "global_step": 494829, "epoch": 2945} {"train_loss": -12.797103881835938, "global_step": 494830, "epoch": 2945} {"train_loss": -12.646242141723633, "global_step": 494831, "epoch": 2945} {"train_loss": -12.716218948364258, "global_step": 494832, "epoch": 2945} {"train_loss": -12.831153869628906, "global_step": 494833, "epoch": 2945} {"train_loss": -12.321050643920898, "global_step": 494834, "epoch": 2945} {"train_loss": -12.488199234008789, "global_step": 494835, "epoch": 2945} {"train_loss": -12.734111785888672, "global_step": 494836, "epoch": 2945} {"train_loss": -12.98835563659668, "global_step": 494837, "epoch": 2945} {"train_loss": -12.62784194946289, "global_step": 494838, "epoch": 2945} {"train_loss": -12.267057418823242, "global_step": 494839, "epoch": 2945} {"train_loss": -12.202346801757812, "global_step": 494840, "epoch": 2945} {"train_loss": -12.924190521240234, "global_step": 494841, "epoch": 2945} {"train_loss": -11.186567306518555, "global_step": 494842, "epoch": 2945} {"train_loss": -12.628437995910645, "global_step": 494843, "epoch": 2945} {"train_loss": -10.966459274291992, "global_step": 494844, "epoch": 2945} {"train_loss": -11.748262405395508, "global_step": 494845, "epoch": 2945} {"train_loss": -12.347930908203125, "global_step": 494846, "epoch": 2945} {"train_loss": -11.453699111938477, "global_step": 494847, "epoch": 2945} {"train_loss": -11.601539611816406, "global_step": 494848, "epoch": 2945} {"train_loss": -12.433677673339844, "global_step": 494849, "epoch": 2945} {"train_loss": -11.437395095825195, "global_step": 494850, "epoch": 2945} {"train_loss": -12.473499298095703, "global_step": 494851, "epoch": 2945} {"train_loss": -11.679155349731445, "global_step": 494852, "epoch": 2945} {"train_loss": -11.645599365234375, "global_step": 494853, "epoch": 2945} {"train_loss": -11.892593383789062, "global_step": 494854, "epoch": 2945} {"train_loss": -12.241575241088867, "global_step": 494855, "epoch": 2945} {"train_loss": -11.408184051513672, "global_step": 494856, "epoch": 2945} {"train_loss": -12.065084457397461, "global_step": 494857, "epoch": 2945} {"train_loss": -11.643998146057129, "global_step": 494858, "epoch": 2945} {"train_loss": -11.926534652709961, "global_step": 494859, "epoch": 2945} {"train_loss": -11.853113174438477, "global_step": 494860, "epoch": 2945} {"train_loss": -11.752338409423828, "global_step": 494861, "epoch": 2945} {"train_loss": -11.93297004699707, "global_step": 494862, "epoch": 2945} {"train_loss": -11.872676849365234, "global_step": 494863, "epoch": 2945} {"train_loss": -12.339702606201172, "global_step": 494864, "epoch": 2945} {"train_loss": -12.033702850341797, "global_step": 494865, "epoch": 2945} {"train_loss": -12.575072288513184, "global_step": 494866, "epoch": 2945} {"train_loss": -12.399765014648438, "global_step": 494867, "epoch": 2945} {"train_loss": -12.390670776367188, "global_step": 494868, "epoch": 2945} {"train_loss": -12.743383407592773, "global_step": 494869, "epoch": 2945} {"train_loss": -12.219133377075195, "global_step": 494870, "epoch": 2945} {"train_loss": -12.402444839477539, "global_step": 494871, "epoch": 2945} {"train_loss": -12.58800220489502, "global_step": 494872, "epoch": 2945} {"train_loss": -12.521199226379395, "global_step": 494873, "epoch": 2945} {"train_loss": -12.241475105285645, "global_step": 494874, "epoch": 2945} {"train_loss": -12.53636360168457, "global_step": 494875, "epoch": 2945} {"train_loss": -12.707913398742676, "global_step": 494876, "epoch": 2945} {"train_loss": -12.209358215332031, "global_step": 494877, "epoch": 2945} {"train_loss": -12.413241386413574, "global_step": 494878, "epoch": 2945} {"train_loss": -12.756814956665039, "global_step": 494879, "epoch": 2945} {"train_loss": -12.637460708618164, "global_step": 494880, "epoch": 2945} {"train_loss": -12.712360382080078, "global_step": 494881, "epoch": 2945} {"train_loss": -12.773332595825195, "global_step": 494882, "epoch": 2945} {"train_loss": -12.731103897094727, "global_step": 494883, "epoch": 2945} {"train_loss": -12.655170440673828, "global_step": 494884, "epoch": 2945} {"train_loss": -12.664420127868652, "global_step": 494885, "epoch": 2945} {"train_loss": -12.967992782592773, "global_step": 494886, "epoch": 2945} {"train_loss": -12.59351634979248, "global_step": 494887, "epoch": 2945} {"train_loss": -12.79745101928711, "global_step": 494888, "epoch": 2945} {"train_loss": -12.841985702514648, "global_step": 494889, "epoch": 2945} {"train_loss": -12.64548110961914, "global_step": 494890, "epoch": 2945} {"train_loss": -12.802209854125977, "global_step": 494891, "epoch": 2945} {"train_loss": -12.937411308288574, "global_step": 494892, "epoch": 2945} {"train_loss": -12.719411849975586, "global_step": 494893, "epoch": 2945} {"train_loss": -12.54858684539795, "global_step": 494894, "epoch": 2945} {"train_loss": -12.747901916503906, "global_step": 494895, "epoch": 2945} {"train_loss": -12.814741134643555, "global_step": 494896, "epoch": 2945} {"train_loss": -12.682707786560059, "global_step": 494897, "epoch": 2945} {"train_loss": -12.675619125366211, "global_step": 494898, "epoch": 2945} {"train_loss": -12.803953170776367, "global_step": 494899, "epoch": 2945} {"train_loss": -12.747846603393555, "global_step": 494900, "epoch": 2945} {"train_loss": -12.768970489501953, "global_step": 494901, "epoch": 2945} {"train_loss": -12.758469581604004, "global_step": 494902, "epoch": 2945} {"train_loss": -12.719073295593262, "global_step": 494903, "epoch": 2945} {"train_loss": -12.949239730834961, "global_step": 494904, "epoch": 2945} {"train_loss": -12.94888687133789, "global_step": 494905, "epoch": 2945} {"train_loss": -12.901262283325195, "global_step": 494906, "epoch": 2945} {"train_loss": -12.933177947998047, "global_step": 494907, "epoch": 2945} {"train_loss": -12.44943618774414, "global_step": 494908, "epoch": 2945} {"train_loss": -12.584757804870605, "global_step": 494909, "epoch": 2945} {"train_loss": -12.842180252075195, "global_step": 494910, "epoch": 2945} {"train_loss": -12.410100936889648, "global_step": 494911, "epoch": 2945} {"train_loss": -12.75673770904541, "global_step": 494912, "epoch": 2945} {"train_loss": -12.379316329956055, "global_step": 494913, "epoch": 2945} {"train_loss": -12.88580322265625, "global_step": 494914, "epoch": 2945} {"train_loss": -12.691197395324707, "global_step": 494915, "epoch": 2945} {"train_loss": -12.761987686157227, "global_step": 494916, "epoch": 2945} {"train_loss": -12.748236656188965, "global_step": 494917, "epoch": 2945} {"train_loss": -12.543594360351562, "global_step": 494918, "epoch": 2945} {"train_loss": -12.740127563476562, "global_step": 494919, "epoch": 2945} {"train_loss": -12.208856582641602, "global_step": 494920, "epoch": 2945} {"train_loss": -12.148723602294922, "global_step": 494921, "epoch": 2945} {"train_loss": -12.61606216430664, "global_step": 494922, "epoch": 2945} {"train_loss": -12.494596481323242, "global_step": 494923, "epoch": 2945} {"train_loss": -12.138198852539062, "global_step": 494924, "epoch": 2945} {"train_loss": -12.195721626281738, "global_step": 494925, "epoch": 2945} {"train_loss": -12.663542747497559, "global_step": 494926, "epoch": 2945} {"train_loss": -12.45513824054173, "global_step": 494927, "epoch": 2945, "val_loss": 319934.25, "train_action_mse_error": 0.3456695079803467} {"train_loss": -10.590551376342773, "global_step": 494928, "epoch": 2946} {"train_loss": -10.105995178222656, "global_step": 494929, "epoch": 2946} {"train_loss": -10.8780517578125, "global_step": 494930, "epoch": 2946} {"train_loss": -9.753374099731445, "global_step": 494931, "epoch": 2946} {"train_loss": -11.535325050354004, "global_step": 494932, "epoch": 2946} {"train_loss": -10.58662223815918, "global_step": 494933, "epoch": 2946} {"train_loss": -9.313154220581055, "global_step": 494934, "epoch": 2946} {"train_loss": -9.771713256835938, "global_step": 494935, "epoch": 2946} {"train_loss": -9.504644393920898, "global_step": 494936, "epoch": 2946} {"train_loss": -10.109161376953125, "global_step": 494937, "epoch": 2946} {"train_loss": -9.460058212280273, "global_step": 494938, "epoch": 2946} {"train_loss": -9.526750564575195, "global_step": 494939, "epoch": 2946} {"train_loss": -9.857912063598633, "global_step": 494940, "epoch": 2946} {"train_loss": -10.897124290466309, "global_step": 494941, "epoch": 2946} {"train_loss": -11.043028831481934, "global_step": 494942, "epoch": 2946} {"train_loss": -9.779046058654785, "global_step": 494943, "epoch": 2946} {"train_loss": -10.83505630493164, "global_step": 494944, "epoch": 2946} {"train_loss": -9.527519226074219, "global_step": 494945, "epoch": 2946} {"train_loss": -11.637994766235352, "global_step": 494946, "epoch": 2946} {"train_loss": -10.002330780029297, "global_step": 494947, "epoch": 2946} {"train_loss": -10.009564399719238, "global_step": 494948, "epoch": 2946} {"train_loss": -11.777708053588867, "global_step": 494949, "epoch": 2946} {"train_loss": -10.04699993133545, "global_step": 494950, "epoch": 2946} {"train_loss": -11.927116394042969, "global_step": 494951, "epoch": 2946} {"train_loss": -11.970011711120605, "global_step": 494952, "epoch": 2946} {"train_loss": -12.11369514465332, "global_step": 494953, "epoch": 2946} {"train_loss": -11.83547592163086, "global_step": 494954, "epoch": 2946} {"train_loss": -11.948546409606934, "global_step": 494955, "epoch": 2946} {"train_loss": -12.298372268676758, "global_step": 494956, "epoch": 2946} {"train_loss": -12.196235656738281, "global_step": 494957, "epoch": 2946} {"train_loss": -12.374828338623047, "global_step": 494958, "epoch": 2946} {"train_loss": -12.168437957763672, "global_step": 494959, "epoch": 2946} {"train_loss": -12.18077278137207, "global_step": 494960, "epoch": 2946} {"train_loss": -12.18294906616211, "global_step": 494961, "epoch": 2946} {"train_loss": -12.027534484863281, "global_step": 494962, "epoch": 2946} {"train_loss": -12.039508819580078, "global_step": 494963, "epoch": 2946} {"train_loss": -12.197498321533203, "global_step": 494964, "epoch": 2946} {"train_loss": -11.862113952636719, "global_step": 494965, "epoch": 2946} {"train_loss": -12.172239303588867, "global_step": 494966, "epoch": 2946} {"train_loss": -12.21541690826416, "global_step": 494967, "epoch": 2946} {"train_loss": -12.255364418029785, "global_step": 494968, "epoch": 2946} {"train_loss": -12.215625762939453, "global_step": 494969, "epoch": 2946} {"train_loss": -12.200960159301758, "global_step": 494970, "epoch": 2946} {"train_loss": -12.159900665283203, "global_step": 494971, "epoch": 2946} {"train_loss": -12.2420654296875, "global_step": 494972, "epoch": 2946} {"train_loss": -11.894853591918945, "global_step": 494973, "epoch": 2946} {"train_loss": -12.208185195922852, "global_step": 494974, "epoch": 2946} {"train_loss": -11.646764755249023, "global_step": 494975, "epoch": 2946} {"train_loss": -12.176464080810547, "global_step": 494976, "epoch": 2946} {"train_loss": -12.088238716125488, "global_step": 494977, "epoch": 2946} {"train_loss": -12.137910842895508, "global_step": 494978, "epoch": 2946} {"train_loss": -12.076301574707031, "global_step": 494979, "epoch": 2946} {"train_loss": -11.636741638183594, "global_step": 494980, "epoch": 2946} {"train_loss": -12.457754135131836, "global_step": 494981, "epoch": 2946} {"train_loss": -11.82406997680664, "global_step": 494982, "epoch": 2946} {"train_loss": -12.392663955688477, "global_step": 494983, "epoch": 2946} {"train_loss": -11.80018424987793, "global_step": 494984, "epoch": 2946} {"train_loss": -12.512420654296875, "global_step": 494985, "epoch": 2946} {"train_loss": -12.358922958374023, "global_step": 494986, "epoch": 2946} {"train_loss": -12.231449127197266, "global_step": 494987, "epoch": 2946} {"train_loss": -12.167203903198242, "global_step": 494988, "epoch": 2946} {"train_loss": -12.526358604431152, "global_step": 494989, "epoch": 2946} {"train_loss": -12.149480819702148, "global_step": 494990, "epoch": 2946} {"train_loss": -12.253032684326172, "global_step": 494991, "epoch": 2946} {"train_loss": -12.187777519226074, "global_step": 494992, "epoch": 2946} {"train_loss": -12.395303726196289, "global_step": 494993, "epoch": 2946} {"train_loss": -12.240251541137695, "global_step": 494994, "epoch": 2946} {"train_loss": -12.529924392700195, "global_step": 494995, "epoch": 2946} {"train_loss": -12.531231880187988, "global_step": 494996, "epoch": 2946} {"train_loss": -12.223932266235352, "global_step": 494997, "epoch": 2946} {"train_loss": -12.552366256713867, "global_step": 494998, "epoch": 2946} {"train_loss": -12.2122802734375, "global_step": 494999, "epoch": 2946} {"train_loss": -12.119585037231445, "global_step": 495000, "epoch": 2946} {"train_loss": -12.190780639648438, "global_step": 495001, "epoch": 2946} {"train_loss": -12.054072380065918, "global_step": 495002, "epoch": 2946} {"train_loss": -12.118568420410156, "global_step": 495003, "epoch": 2946} {"train_loss": -12.189582824707031, "global_step": 495004, "epoch": 2946} {"train_loss": -12.152058601379395, "global_step": 495005, "epoch": 2946} {"train_loss": -12.447630882263184, "global_step": 495006, "epoch": 2946} {"train_loss": -12.615571975708008, "global_step": 495007, "epoch": 2946} {"train_loss": -12.246414184570312, "global_step": 495008, "epoch": 2946} {"train_loss": -12.673810005187988, "global_step": 495009, "epoch": 2946} {"train_loss": -12.179101943969727, "global_step": 495010, "epoch": 2946} {"train_loss": -12.498291015625, "global_step": 495011, "epoch": 2946} {"train_loss": -12.294912338256836, "global_step": 495012, "epoch": 2946} {"train_loss": -12.607868194580078, "global_step": 495013, "epoch": 2946} {"train_loss": -12.248984336853027, "global_step": 495014, "epoch": 2946} {"train_loss": -12.588069915771484, "global_step": 495015, "epoch": 2946} {"train_loss": -12.404176712036133, "global_step": 495016, "epoch": 2946} {"train_loss": -12.311729431152344, "global_step": 495017, "epoch": 2946} {"train_loss": -12.612665176391602, "global_step": 495018, "epoch": 2946} {"train_loss": -12.516410827636719, "global_step": 495019, "epoch": 2946} {"train_loss": -12.559282302856445, "global_step": 495020, "epoch": 2946} {"train_loss": -12.56369686126709, "global_step": 495021, "epoch": 2946} {"train_loss": -12.717325210571289, "global_step": 495022, "epoch": 2946} {"train_loss": -12.529838562011719, "global_step": 495023, "epoch": 2946} {"train_loss": -12.842323303222656, "global_step": 495024, "epoch": 2946} {"train_loss": -12.740499496459961, "global_step": 495025, "epoch": 2946} {"train_loss": -12.632426261901855, "global_step": 495026, "epoch": 2946} {"train_loss": -12.677891731262207, "global_step": 495027, "epoch": 2946} {"train_loss": -12.614368438720703, "global_step": 495028, "epoch": 2946} {"train_loss": -12.811870574951172, "global_step": 495029, "epoch": 2946} {"train_loss": -12.844266891479492, "global_step": 495030, "epoch": 2946} {"train_loss": -12.655920028686523, "global_step": 495031, "epoch": 2946} {"train_loss": -12.797199249267578, "global_step": 495032, "epoch": 2946} {"train_loss": -12.687333106994629, "global_step": 495033, "epoch": 2946} {"train_loss": -12.845255851745605, "global_step": 495034, "epoch": 2946} {"train_loss": -12.670757293701172, "global_step": 495035, "epoch": 2946} {"train_loss": -12.837748527526855, "global_step": 495036, "epoch": 2946} {"train_loss": -12.761198997497559, "global_step": 495037, "epoch": 2946} {"train_loss": -12.952768325805664, "global_step": 495038, "epoch": 2946} {"train_loss": -12.824864387512207, "global_step": 495039, "epoch": 2946} {"train_loss": -13.087421417236328, "global_step": 495040, "epoch": 2946} {"train_loss": -12.739896774291992, "global_step": 495041, "epoch": 2946} {"train_loss": -12.647958755493164, "global_step": 495042, "epoch": 2946} {"train_loss": -13.074156761169434, "global_step": 495043, "epoch": 2946} {"train_loss": -12.80586051940918, "global_step": 495044, "epoch": 2946} {"train_loss": -12.949779510498047, "global_step": 495045, "epoch": 2946} {"train_loss": -12.881179809570312, "global_step": 495046, "epoch": 2946} {"train_loss": -12.933187484741211, "global_step": 495047, "epoch": 2946} {"train_loss": -12.816900253295898, "global_step": 495048, "epoch": 2946} {"train_loss": -12.871015548706055, "global_step": 495049, "epoch": 2946} {"train_loss": -13.104121208190918, "global_step": 495050, "epoch": 2946} {"train_loss": -12.900007247924805, "global_step": 495051, "epoch": 2946} {"train_loss": -12.94679069519043, "global_step": 495052, "epoch": 2946} {"train_loss": -12.88725471496582, "global_step": 495053, "epoch": 2946} {"train_loss": -12.7411470413208, "global_step": 495054, "epoch": 2946} {"train_loss": -12.753742218017578, "global_step": 495055, "epoch": 2946} {"train_loss": -12.997784614562988, "global_step": 495056, "epoch": 2946} {"train_loss": -12.649360656738281, "global_step": 495057, "epoch": 2946} {"train_loss": -12.537006378173828, "global_step": 495058, "epoch": 2946} {"train_loss": -12.540254592895508, "global_step": 495059, "epoch": 2946} {"train_loss": -12.326764106750488, "global_step": 495060, "epoch": 2946} {"train_loss": -12.462981224060059, "global_step": 495061, "epoch": 2946} {"train_loss": -12.042428970336914, "global_step": 495062, "epoch": 2946} {"train_loss": -12.647046089172363, "global_step": 495063, "epoch": 2946} {"train_loss": -11.849433898925781, "global_step": 495064, "epoch": 2946} {"train_loss": -13.028823852539062, "global_step": 495065, "epoch": 2946} {"train_loss": -12.235578536987305, "global_step": 495066, "epoch": 2946} {"train_loss": -12.806499481201172, "global_step": 495067, "epoch": 2946} {"train_loss": -12.548227310180664, "global_step": 495068, "epoch": 2946} {"train_loss": -12.70733642578125, "global_step": 495069, "epoch": 2946} {"train_loss": -12.771100044250488, "global_step": 495070, "epoch": 2946} {"train_loss": -12.417316436767578, "global_step": 495071, "epoch": 2946} {"train_loss": -12.3008394241333, "global_step": 495072, "epoch": 2946} {"train_loss": -12.555330276489258, "global_step": 495073, "epoch": 2946} {"train_loss": -12.626792907714844, "global_step": 495074, "epoch": 2946} {"train_loss": -11.710805892944336, "global_step": 495075, "epoch": 2946} {"train_loss": -12.001856803894043, "global_step": 495076, "epoch": 2946} {"train_loss": -12.659849166870117, "global_step": 495077, "epoch": 2946} {"train_loss": -11.902397155761719, "global_step": 495078, "epoch": 2946} {"train_loss": -12.382255554199219, "global_step": 495079, "epoch": 2946} {"train_loss": -12.25802230834961, "global_step": 495080, "epoch": 2946} {"train_loss": -12.412250518798828, "global_step": 495081, "epoch": 2946} {"train_loss": -11.942726135253906, "global_step": 495082, "epoch": 2946} {"train_loss": -12.2938232421875, "global_step": 495083, "epoch": 2946} {"train_loss": -12.217386245727539, "global_step": 495084, "epoch": 2946} {"train_loss": -12.58005142211914, "global_step": 495085, "epoch": 2946} {"train_loss": -12.618443489074707, "global_step": 495086, "epoch": 2946} {"train_loss": -12.547759056091309, "global_step": 495087, "epoch": 2946} {"train_loss": -12.638097763061523, "global_step": 495088, "epoch": 2946} {"train_loss": -12.460027694702148, "global_step": 495089, "epoch": 2946} {"train_loss": -12.768271446228027, "global_step": 495090, "epoch": 2946} {"train_loss": -12.555028915405273, "global_step": 495091, "epoch": 2946} {"train_loss": -12.792366981506348, "global_step": 495092, "epoch": 2946} {"train_loss": -12.575066566467285, "global_step": 495093, "epoch": 2946} {"train_loss": -12.789507865905762, "global_step": 495094, "epoch": 2946} {"train_loss": -12.137221228508722, "global_step": 495095, "epoch": 2946, "val_loss": 312764.59375} {"train_loss": -12.665168762207031, "global_step": 495096, "epoch": 2947} {"train_loss": -12.59267520904541, "global_step": 495097, "epoch": 2947} {"train_loss": -12.702831268310547, "global_step": 495098, "epoch": 2947} {"train_loss": -12.78023624420166, "global_step": 495099, "epoch": 2947} {"train_loss": -12.21654987335205, "global_step": 495100, "epoch": 2947} {"train_loss": -11.705198287963867, "global_step": 495101, "epoch": 2947} {"train_loss": -12.08642578125, "global_step": 495102, "epoch": 2947} {"train_loss": -12.666097640991211, "global_step": 495103, "epoch": 2947} {"train_loss": -11.34241008758545, "global_step": 495104, "epoch": 2947} {"train_loss": -9.807395935058594, "global_step": 495105, "epoch": 2947} {"train_loss": -11.057798385620117, "global_step": 495106, "epoch": 2947} {"train_loss": -8.748144149780273, "global_step": 495107, "epoch": 2947} {"train_loss": -10.010130882263184, "global_step": 495108, "epoch": 2947} {"train_loss": -11.628293991088867, "global_step": 495109, "epoch": 2947} {"train_loss": -9.282639503479004, "global_step": 495110, "epoch": 2947} {"train_loss": -10.481582641601562, "global_step": 495111, "epoch": 2947} {"train_loss": -10.065618515014648, "global_step": 495112, "epoch": 2947} {"train_loss": -10.09764289855957, "global_step": 495113, "epoch": 2947} {"train_loss": -9.582148551940918, "global_step": 495114, "epoch": 2947} {"train_loss": -8.005746841430664, "global_step": 495115, "epoch": 2947} {"train_loss": -9.363093376159668, "global_step": 495116, "epoch": 2947} {"train_loss": -9.239670753479004, "global_step": 495117, "epoch": 2947} {"train_loss": -8.6588716506958, "global_step": 495118, "epoch": 2947} {"train_loss": -9.660948753356934, "global_step": 495119, "epoch": 2947} {"train_loss": -9.351941108703613, "global_step": 495120, "epoch": 2947} {"train_loss": -10.151477813720703, "global_step": 495121, "epoch": 2947} {"train_loss": -10.485353469848633, "global_step": 495122, "epoch": 2947} {"train_loss": -9.252782821655273, "global_step": 495123, "epoch": 2947} {"train_loss": -9.703351020812988, "global_step": 495124, "epoch": 2947} {"train_loss": -9.725799560546875, "global_step": 495125, "epoch": 2947} {"train_loss": -10.033527374267578, "global_step": 495126, "epoch": 2947} {"train_loss": -9.006523132324219, "global_step": 495127, "epoch": 2947} {"train_loss": -9.737704277038574, "global_step": 495128, "epoch": 2947} {"train_loss": -10.969858169555664, "global_step": 495129, "epoch": 2947} {"train_loss": -9.924886703491211, "global_step": 495130, "epoch": 2947} {"train_loss": -9.066009521484375, "global_step": 495131, "epoch": 2947} {"train_loss": -10.408904075622559, "global_step": 495132, "epoch": 2947} {"train_loss": -9.779504776000977, "global_step": 495133, "epoch": 2947} {"train_loss": -9.66684341430664, "global_step": 495134, "epoch": 2947} {"train_loss": -9.692365646362305, "global_step": 495135, "epoch": 2947} {"train_loss": -9.772125244140625, "global_step": 495136, "epoch": 2947} {"train_loss": -10.493278503417969, "global_step": 495137, "epoch": 2947} {"train_loss": -10.297174453735352, "global_step": 495138, "epoch": 2947} {"train_loss": -11.372430801391602, "global_step": 495139, "epoch": 2947} {"train_loss": -10.022997856140137, "global_step": 495140, "epoch": 2947} {"train_loss": -10.167035102844238, "global_step": 495141, "epoch": 2947} {"train_loss": -10.640373229980469, "global_step": 495142, "epoch": 2947} {"train_loss": -11.447205543518066, "global_step": 495143, "epoch": 2947} {"train_loss": -11.318406105041504, "global_step": 495144, "epoch": 2947} {"train_loss": -10.4269380569458, "global_step": 495145, "epoch": 2947} {"train_loss": -11.267936706542969, "global_step": 495146, "epoch": 2947} {"train_loss": -11.397912979125977, "global_step": 495147, "epoch": 2947} {"train_loss": -11.0708646774292, "global_step": 495148, "epoch": 2947} {"train_loss": -12.080371856689453, "global_step": 495149, "epoch": 2947} {"train_loss": -11.171648025512695, "global_step": 495150, "epoch": 2947} {"train_loss": -11.599800109863281, "global_step": 495151, "epoch": 2947} {"train_loss": -12.03361988067627, "global_step": 495152, "epoch": 2947} {"train_loss": -11.281262397766113, "global_step": 495153, "epoch": 2947} {"train_loss": -12.031646728515625, "global_step": 495154, "epoch": 2947} {"train_loss": -12.278682708740234, "global_step": 495155, "epoch": 2947} {"train_loss": -11.469375610351562, "global_step": 495156, "epoch": 2947} {"train_loss": -11.849534034729004, "global_step": 495157, "epoch": 2947} {"train_loss": -12.246841430664062, "global_step": 495158, "epoch": 2947} {"train_loss": -11.606278419494629, "global_step": 495159, "epoch": 2947} {"train_loss": -11.876112937927246, "global_step": 495160, "epoch": 2947} {"train_loss": -11.972983360290527, "global_step": 495161, "epoch": 2947} {"train_loss": -11.780023574829102, "global_step": 495162, "epoch": 2947} {"train_loss": -12.179983139038086, "global_step": 495163, "epoch": 2947} {"train_loss": -12.107529640197754, "global_step": 495164, "epoch": 2947} {"train_loss": -11.80478286743164, "global_step": 495165, "epoch": 2947} {"train_loss": -11.945497512817383, "global_step": 495166, "epoch": 2947} {"train_loss": -12.125293731689453, "global_step": 495167, "epoch": 2947} {"train_loss": -11.70264720916748, "global_step": 495168, "epoch": 2947} {"train_loss": -12.41457748413086, "global_step": 495169, "epoch": 2947} {"train_loss": -12.06673812866211, "global_step": 495170, "epoch": 2947} {"train_loss": -12.097893714904785, "global_step": 495171, "epoch": 2947} {"train_loss": -12.241552352905273, "global_step": 495172, "epoch": 2947} {"train_loss": -11.808637619018555, "global_step": 495173, "epoch": 2947} {"train_loss": -12.322017669677734, "global_step": 495174, "epoch": 2947} {"train_loss": -12.198150634765625, "global_step": 495175, "epoch": 2947} {"train_loss": -12.217878341674805, "global_step": 495176, "epoch": 2947} {"train_loss": -11.896188735961914, "global_step": 495177, "epoch": 2947} {"train_loss": -12.390989303588867, "global_step": 495178, "epoch": 2947} {"train_loss": -11.71072006225586, "global_step": 495179, "epoch": 2947} {"train_loss": -12.275524139404297, "global_step": 495180, "epoch": 2947} {"train_loss": -12.080716133117676, "global_step": 495181, "epoch": 2947} {"train_loss": -11.97979736328125, "global_step": 495182, "epoch": 2947} {"train_loss": -12.228781700134277, "global_step": 495183, "epoch": 2947} {"train_loss": -11.806148529052734, "global_step": 495184, "epoch": 2947} {"train_loss": -12.239673614501953, "global_step": 495185, "epoch": 2947} {"train_loss": -11.618218421936035, "global_step": 495186, "epoch": 2947} {"train_loss": -12.177749633789062, "global_step": 495187, "epoch": 2947} {"train_loss": -12.207244873046875, "global_step": 495188, "epoch": 2947} {"train_loss": -12.382274627685547, "global_step": 495189, "epoch": 2947} {"train_loss": -12.254486083984375, "global_step": 495190, "epoch": 2947} {"train_loss": -12.476484298706055, "global_step": 495191, "epoch": 2947} {"train_loss": -12.366626739501953, "global_step": 495192, "epoch": 2947} {"train_loss": -12.545631408691406, "global_step": 495193, "epoch": 2947} {"train_loss": -12.108111381530762, "global_step": 495194, "epoch": 2947} {"train_loss": -12.374378204345703, "global_step": 495195, "epoch": 2947} {"train_loss": -12.406633377075195, "global_step": 495196, "epoch": 2947} {"train_loss": -12.639871597290039, "global_step": 495197, "epoch": 2947} {"train_loss": -12.287494659423828, "global_step": 495198, "epoch": 2947} {"train_loss": -12.521464347839355, "global_step": 495199, "epoch": 2947} {"train_loss": -12.689414978027344, "global_step": 495200, "epoch": 2947} {"train_loss": -12.511703491210938, "global_step": 495201, "epoch": 2947} {"train_loss": -12.274057388305664, "global_step": 495202, "epoch": 2947} {"train_loss": -12.481334686279297, "global_step": 495203, "epoch": 2947} {"train_loss": -12.43769645690918, "global_step": 495204, "epoch": 2947} {"train_loss": -12.669111251831055, "global_step": 495205, "epoch": 2947} {"train_loss": -12.378982543945312, "global_step": 495206, "epoch": 2947} {"train_loss": -12.371892929077148, "global_step": 495207, "epoch": 2947} {"train_loss": -12.628450393676758, "global_step": 495208, "epoch": 2947} {"train_loss": -12.411056518554688, "global_step": 495209, "epoch": 2947} {"train_loss": -12.454439163208008, "global_step": 495210, "epoch": 2947} {"train_loss": -12.65787124633789, "global_step": 495211, "epoch": 2947} {"train_loss": -12.419479370117188, "global_step": 495212, "epoch": 2947} {"train_loss": -12.728799819946289, "global_step": 495213, "epoch": 2947} {"train_loss": -12.305339813232422, "global_step": 495214, "epoch": 2947} {"train_loss": -12.697746276855469, "global_step": 495215, "epoch": 2947} {"train_loss": -12.761214256286621, "global_step": 495216, "epoch": 2947} {"train_loss": -12.796201705932617, "global_step": 495217, "epoch": 2947} {"train_loss": -12.793474197387695, "global_step": 495218, "epoch": 2947} {"train_loss": -12.71910285949707, "global_step": 495219, "epoch": 2947} {"train_loss": -12.61109733581543, "global_step": 495220, "epoch": 2947} {"train_loss": -12.785646438598633, "global_step": 495221, "epoch": 2947} {"train_loss": -12.72110366821289, "global_step": 495222, "epoch": 2947} {"train_loss": -12.816226959228516, "global_step": 495223, "epoch": 2947} {"train_loss": -12.78758430480957, "global_step": 495224, "epoch": 2947} {"train_loss": -12.852174758911133, "global_step": 495225, "epoch": 2947} {"train_loss": -12.916537284851074, "global_step": 495226, "epoch": 2947} {"train_loss": -12.938220024108887, "global_step": 495227, "epoch": 2947} {"train_loss": -12.76736831665039, "global_step": 495228, "epoch": 2947} {"train_loss": -12.709028244018555, "global_step": 495229, "epoch": 2947} {"train_loss": -12.813114166259766, "global_step": 495230, "epoch": 2947} {"train_loss": -12.911840438842773, "global_step": 495231, "epoch": 2947} {"train_loss": -13.009571075439453, "global_step": 495232, "epoch": 2947} {"train_loss": -12.693185806274414, "global_step": 495233, "epoch": 2947} {"train_loss": -12.92093563079834, "global_step": 495234, "epoch": 2947} {"train_loss": -13.010812759399414, "global_step": 495235, "epoch": 2947} {"train_loss": -12.852150917053223, "global_step": 495236, "epoch": 2947} {"train_loss": -12.530830383300781, "global_step": 495237, "epoch": 2947} {"train_loss": -12.802494049072266, "global_step": 495238, "epoch": 2947} {"train_loss": -12.792207717895508, "global_step": 495239, "epoch": 2947} {"train_loss": -12.912134170532227, "global_step": 495240, "epoch": 2947} {"train_loss": -12.969406127929688, "global_step": 495241, "epoch": 2947} {"train_loss": -12.835250854492188, "global_step": 495242, "epoch": 2947} {"train_loss": -12.727548599243164, "global_step": 495243, "epoch": 2947} {"train_loss": -12.743416786193848, "global_step": 495244, "epoch": 2947} {"train_loss": -12.989261627197266, "global_step": 495245, "epoch": 2947} {"train_loss": -12.755255699157715, "global_step": 495246, "epoch": 2947} {"train_loss": -12.871221542358398, "global_step": 495247, "epoch": 2947} {"train_loss": -12.911115646362305, "global_step": 495248, "epoch": 2947} {"train_loss": -12.862396240234375, "global_step": 495249, "epoch": 2947} {"train_loss": -12.795554161071777, "global_step": 495250, "epoch": 2947} {"train_loss": -12.91378116607666, "global_step": 495251, "epoch": 2947} {"train_loss": -12.753339767456055, "global_step": 495252, "epoch": 2947} {"train_loss": -12.830416679382324, "global_step": 495253, "epoch": 2947} {"train_loss": -12.766517639160156, "global_step": 495254, "epoch": 2947} {"train_loss": -12.908615112304688, "global_step": 495255, "epoch": 2947} {"train_loss": -12.882598876953125, "global_step": 495256, "epoch": 2947} {"train_loss": -12.798676490783691, "global_step": 495257, "epoch": 2947} {"train_loss": -12.923969268798828, "global_step": 495258, "epoch": 2947} {"train_loss": -13.080950736999512, "global_step": 495259, "epoch": 2947} {"train_loss": -12.752059936523438, "global_step": 495260, "epoch": 2947} {"train_loss": -12.808626174926758, "global_step": 495261, "epoch": 2947} {"train_loss": -12.563905715942383, "global_step": 495262, "epoch": 2947} {"train_loss": -11.809780416034517, "global_step": 495263, "epoch": 2947, "val_loss": 317532.09375} {"train_loss": -12.822796821594238, "global_step": 495264, "epoch": 2948} {"train_loss": -13.089155197143555, "global_step": 495265, "epoch": 2948} {"train_loss": -12.968786239624023, "global_step": 495266, "epoch": 2948} {"train_loss": -12.962516784667969, "global_step": 495267, "epoch": 2948} {"train_loss": -12.82908821105957, "global_step": 495268, "epoch": 2948} {"train_loss": -12.806109428405762, "global_step": 495269, "epoch": 2948} {"train_loss": -12.981546401977539, "global_step": 495270, "epoch": 2948} {"train_loss": -12.70184326171875, "global_step": 495271, "epoch": 2948} {"train_loss": -12.365510940551758, "global_step": 495272, "epoch": 2948} {"train_loss": -12.845991134643555, "global_step": 495273, "epoch": 2948} {"train_loss": -12.11864185333252, "global_step": 495274, "epoch": 2948} {"train_loss": -12.916269302368164, "global_step": 495275, "epoch": 2948} {"train_loss": -12.371105194091797, "global_step": 495276, "epoch": 2948} {"train_loss": -11.828813552856445, "global_step": 495277, "epoch": 2948} {"train_loss": -12.545740127563477, "global_step": 495278, "epoch": 2948} {"train_loss": -12.012462615966797, "global_step": 495279, "epoch": 2948} {"train_loss": -11.366924285888672, "global_step": 495280, "epoch": 2948} {"train_loss": -11.760857582092285, "global_step": 495281, "epoch": 2948} {"train_loss": -12.11636734008789, "global_step": 495282, "epoch": 2948} {"train_loss": -11.498664855957031, "global_step": 495283, "epoch": 2948} {"train_loss": -11.165767669677734, "global_step": 495284, "epoch": 2948} {"train_loss": -9.658941268920898, "global_step": 495285, "epoch": 2948} {"train_loss": -10.834881782531738, "global_step": 495286, "epoch": 2948} {"train_loss": -10.970441818237305, "global_step": 495287, "epoch": 2948} {"train_loss": -11.012938499450684, "global_step": 495288, "epoch": 2948} {"train_loss": -11.394542694091797, "global_step": 495289, "epoch": 2948} {"train_loss": -11.0122652053833, "global_step": 495290, "epoch": 2948} {"train_loss": -9.656780242919922, "global_step": 495291, "epoch": 2948} {"train_loss": -10.614423751831055, "global_step": 495292, "epoch": 2948} {"train_loss": -10.553388595581055, "global_step": 495293, "epoch": 2948} {"train_loss": -8.853100776672363, "global_step": 495294, "epoch": 2948} {"train_loss": -10.48916244506836, "global_step": 495295, "epoch": 2948} {"train_loss": -9.872392654418945, "global_step": 495296, "epoch": 2948} {"train_loss": -9.889467239379883, "global_step": 495297, "epoch": 2948} {"train_loss": -10.142744064331055, "global_step": 495298, "epoch": 2948} {"train_loss": -11.156722068786621, "global_step": 495299, "epoch": 2948} {"train_loss": -10.068670272827148, "global_step": 495300, "epoch": 2948} {"train_loss": -9.085933685302734, "global_step": 495301, "epoch": 2948} {"train_loss": -9.211238861083984, "global_step": 495302, "epoch": 2948} {"train_loss": -10.929699897766113, "global_step": 495303, "epoch": 2948} {"train_loss": -8.479225158691406, "global_step": 495304, "epoch": 2948} {"train_loss": -9.3748779296875, "global_step": 495305, "epoch": 2948} {"train_loss": -8.776100158691406, "global_step": 495306, "epoch": 2948} {"train_loss": -10.480810165405273, "global_step": 495307, "epoch": 2948} {"train_loss": -9.603799819946289, "global_step": 495308, "epoch": 2948} {"train_loss": -10.763875007629395, "global_step": 495309, "epoch": 2948} {"train_loss": -10.11050033569336, "global_step": 495310, "epoch": 2948} {"train_loss": -10.142230987548828, "global_step": 495311, "epoch": 2948} {"train_loss": -10.869041442871094, "global_step": 495312, "epoch": 2948} {"train_loss": -10.209199905395508, "global_step": 495313, "epoch": 2948} {"train_loss": -10.941680908203125, "global_step": 495314, "epoch": 2948} {"train_loss": -10.585562705993652, "global_step": 495315, "epoch": 2948} {"train_loss": -11.710694313049316, "global_step": 495316, "epoch": 2948} {"train_loss": -11.123807907104492, "global_step": 495317, "epoch": 2948} {"train_loss": -11.422666549682617, "global_step": 495318, "epoch": 2948} {"train_loss": -10.631570816040039, "global_step": 495319, "epoch": 2948} {"train_loss": -11.5450439453125, "global_step": 495320, "epoch": 2948} {"train_loss": -10.75955581665039, "global_step": 495321, "epoch": 2948} {"train_loss": -11.983802795410156, "global_step": 495322, "epoch": 2948} {"train_loss": -11.498554229736328, "global_step": 495323, "epoch": 2948} {"train_loss": -11.881860733032227, "global_step": 495324, "epoch": 2948} {"train_loss": -11.897729873657227, "global_step": 495325, "epoch": 2948} {"train_loss": -11.686174392700195, "global_step": 495326, "epoch": 2948} {"train_loss": -11.8946533203125, "global_step": 495327, "epoch": 2948} {"train_loss": -12.206279754638672, "global_step": 495328, "epoch": 2948} {"train_loss": -11.94387435913086, "global_step": 495329, "epoch": 2948} {"train_loss": -12.481094360351562, "global_step": 495330, "epoch": 2948} {"train_loss": -12.018942832946777, "global_step": 495331, "epoch": 2948} {"train_loss": -12.337339401245117, "global_step": 495332, "epoch": 2948} {"train_loss": -12.286909103393555, "global_step": 495333, "epoch": 2948} {"train_loss": -12.003080368041992, "global_step": 495334, "epoch": 2948} {"train_loss": -12.402454376220703, "global_step": 495335, "epoch": 2948} {"train_loss": -11.90524959564209, "global_step": 495336, "epoch": 2948} {"train_loss": -12.343484878540039, "global_step": 495337, "epoch": 2948} {"train_loss": -12.237052917480469, "global_step": 495338, "epoch": 2948} {"train_loss": -12.359888076782227, "global_step": 495339, "epoch": 2948} {"train_loss": -12.262460708618164, "global_step": 495340, "epoch": 2948} {"train_loss": -12.138011932373047, "global_step": 495341, "epoch": 2948} {"train_loss": -12.674235343933105, "global_step": 495342, "epoch": 2948} {"train_loss": -11.962182998657227, "global_step": 495343, "epoch": 2948} {"train_loss": -12.334583282470703, "global_step": 495344, "epoch": 2948} {"train_loss": -12.404648780822754, "global_step": 495345, "epoch": 2948} {"train_loss": -12.020866394042969, "global_step": 495346, "epoch": 2948} {"train_loss": -12.658488273620605, "global_step": 495347, "epoch": 2948} {"train_loss": -12.57560920715332, "global_step": 495348, "epoch": 2948} {"train_loss": -12.609952926635742, "global_step": 495349, "epoch": 2948} {"train_loss": -12.608098983764648, "global_step": 495350, "epoch": 2948} {"train_loss": -12.337678909301758, "global_step": 495351, "epoch": 2948} {"train_loss": -12.642716407775879, "global_step": 495352, "epoch": 2948} {"train_loss": -12.495278358459473, "global_step": 495353, "epoch": 2948} {"train_loss": -12.433954238891602, "global_step": 495354, "epoch": 2948} {"train_loss": -12.533550262451172, "global_step": 495355, "epoch": 2948} {"train_loss": -12.390240669250488, "global_step": 495356, "epoch": 2948} {"train_loss": -12.821914672851562, "global_step": 495357, "epoch": 2948} {"train_loss": -12.598223686218262, "global_step": 495358, "epoch": 2948} {"train_loss": -12.606989860534668, "global_step": 495359, "epoch": 2948} {"train_loss": -12.441529273986816, "global_step": 495360, "epoch": 2948} {"train_loss": -12.746438980102539, "global_step": 495361, "epoch": 2948} {"train_loss": -12.635049819946289, "global_step": 495362, "epoch": 2948} {"train_loss": -12.630558013916016, "global_step": 495363, "epoch": 2948} {"train_loss": -12.51687240600586, "global_step": 495364, "epoch": 2948} {"train_loss": -12.555288314819336, "global_step": 495365, "epoch": 2948} {"train_loss": -12.56076431274414, "global_step": 495366, "epoch": 2948} {"train_loss": -12.487791061401367, "global_step": 495367, "epoch": 2948} {"train_loss": -12.590909957885742, "global_step": 495368, "epoch": 2948} {"train_loss": -12.428823471069336, "global_step": 495369, "epoch": 2948} {"train_loss": -12.534491539001465, "global_step": 495370, "epoch": 2948} {"train_loss": -12.741097450256348, "global_step": 495371, "epoch": 2948} {"train_loss": -12.528009414672852, "global_step": 495372, "epoch": 2948} {"train_loss": -12.499752044677734, "global_step": 495373, "epoch": 2948} {"train_loss": -12.72492504119873, "global_step": 495374, "epoch": 2948} {"train_loss": -12.538629531860352, "global_step": 495375, "epoch": 2948} {"train_loss": -12.622086524963379, "global_step": 495376, "epoch": 2948} {"train_loss": -12.70645523071289, "global_step": 495377, "epoch": 2948} {"train_loss": -12.720470428466797, "global_step": 495378, "epoch": 2948} {"train_loss": -12.698770523071289, "global_step": 495379, "epoch": 2948} {"train_loss": -12.636491775512695, "global_step": 495380, "epoch": 2948} {"train_loss": -12.78968334197998, "global_step": 495381, "epoch": 2948} {"train_loss": -12.694114685058594, "global_step": 495382, "epoch": 2948} {"train_loss": -12.747303009033203, "global_step": 495383, "epoch": 2948} {"train_loss": -12.725730895996094, "global_step": 495384, "epoch": 2948} {"train_loss": -12.72773265838623, "global_step": 495385, "epoch": 2948} {"train_loss": -12.997105598449707, "global_step": 495386, "epoch": 2948} {"train_loss": -12.712057113647461, "global_step": 495387, "epoch": 2948} {"train_loss": -12.967569351196289, "global_step": 495388, "epoch": 2948} {"train_loss": -12.718036651611328, "global_step": 495389, "epoch": 2948} {"train_loss": -12.794690132141113, "global_step": 495390, "epoch": 2948} {"train_loss": -12.761585235595703, "global_step": 495391, "epoch": 2948} {"train_loss": -12.714275360107422, "global_step": 495392, "epoch": 2948} {"train_loss": -12.693192481994629, "global_step": 495393, "epoch": 2948} {"train_loss": -12.941503524780273, "global_step": 495394, "epoch": 2948} {"train_loss": -12.682284355163574, "global_step": 495395, "epoch": 2948} {"train_loss": -12.887791633605957, "global_step": 495396, "epoch": 2948} {"train_loss": -12.882110595703125, "global_step": 495397, "epoch": 2948} {"train_loss": -13.056259155273438, "global_step": 495398, "epoch": 2948} {"train_loss": -12.976262092590332, "global_step": 495399, "epoch": 2948} {"train_loss": -13.029071807861328, "global_step": 495400, "epoch": 2948} {"train_loss": -12.891868591308594, "global_step": 495401, "epoch": 2948} {"train_loss": -12.892648696899414, "global_step": 495402, "epoch": 2948} {"train_loss": -12.82677936553955, "global_step": 495403, "epoch": 2948} {"train_loss": -12.97679328918457, "global_step": 495404, "epoch": 2948} {"train_loss": -13.014114379882812, "global_step": 495405, "epoch": 2948} {"train_loss": -12.99859619140625, "global_step": 495406, "epoch": 2948} {"train_loss": -12.787042617797852, "global_step": 495407, "epoch": 2948} {"train_loss": -13.000955581665039, "global_step": 495408, "epoch": 2948} {"train_loss": -12.772588729858398, "global_step": 495409, "epoch": 2948} {"train_loss": -12.925297737121582, "global_step": 495410, "epoch": 2948} {"train_loss": -12.702561378479004, "global_step": 495411, "epoch": 2948} {"train_loss": -12.424827575683594, "global_step": 495412, "epoch": 2948} {"train_loss": -12.351097106933594, "global_step": 495413, "epoch": 2948} {"train_loss": -12.520856857299805, "global_step": 495414, "epoch": 2948} {"train_loss": -12.407517433166504, "global_step": 495415, "epoch": 2948} {"train_loss": -12.559499740600586, "global_step": 495416, "epoch": 2948} {"train_loss": -11.974832534790039, "global_step": 495417, "epoch": 2948} {"train_loss": -12.415508270263672, "global_step": 495418, "epoch": 2948} {"train_loss": -12.568599700927734, "global_step": 495419, "epoch": 2948} {"train_loss": -12.399112701416016, "global_step": 495420, "epoch": 2948} {"train_loss": -12.377573013305664, "global_step": 495421, "epoch": 2948} {"train_loss": -12.722082138061523, "global_step": 495422, "epoch": 2948} {"train_loss": -12.304357528686523, "global_step": 495423, "epoch": 2948} {"train_loss": -12.88713264465332, "global_step": 495424, "epoch": 2948} {"train_loss": -12.474559783935547, "global_step": 495425, "epoch": 2948} {"train_loss": -12.13228702545166, "global_step": 495426, "epoch": 2948} {"train_loss": -12.3905029296875, "global_step": 495427, "epoch": 2948} {"train_loss": -12.426555633544922, "global_step": 495428, "epoch": 2948} {"train_loss": -11.708963394165039, "global_step": 495429, "epoch": 2948} {"train_loss": -12.177400588989258, "global_step": 495430, "epoch": 2948} {"train_loss": -12.021025686036973, "global_step": 495431, "epoch": 2948, "val_loss": 316882.75} {"train_loss": -11.507268905639648, "global_step": 495432, "epoch": 2949} {"train_loss": -12.858859062194824, "global_step": 495433, "epoch": 2949} {"train_loss": -11.653240203857422, "global_step": 495434, "epoch": 2949} {"train_loss": -12.023355484008789, "global_step": 495435, "epoch": 2949} {"train_loss": -11.592010498046875, "global_step": 495436, "epoch": 2949} {"train_loss": -12.184955596923828, "global_step": 495437, "epoch": 2949} {"train_loss": -11.371129035949707, "global_step": 495438, "epoch": 2949} {"train_loss": -11.64381217956543, "global_step": 495439, "epoch": 2949} {"train_loss": -11.778414726257324, "global_step": 495440, "epoch": 2949} {"train_loss": -12.040655136108398, "global_step": 495441, "epoch": 2949} {"train_loss": -10.773197174072266, "global_step": 495442, "epoch": 2949} {"train_loss": -11.678544044494629, "global_step": 495443, "epoch": 2949} {"train_loss": -11.196147918701172, "global_step": 495444, "epoch": 2949} {"train_loss": -10.339856147766113, "global_step": 495445, "epoch": 2949} {"train_loss": -10.968866348266602, "global_step": 495446, "epoch": 2949} {"train_loss": -11.076086044311523, "global_step": 495447, "epoch": 2949} {"train_loss": -9.68710708618164, "global_step": 495448, "epoch": 2949} {"train_loss": -12.085851669311523, "global_step": 495449, "epoch": 2949} {"train_loss": -9.491519927978516, "global_step": 495450, "epoch": 2949} {"train_loss": -10.343345642089844, "global_step": 495451, "epoch": 2949} {"train_loss": -9.317922592163086, "global_step": 495452, "epoch": 2949} {"train_loss": -10.354086875915527, "global_step": 495453, "epoch": 2949} {"train_loss": -10.346031188964844, "global_step": 495454, "epoch": 2949} {"train_loss": -9.597383499145508, "global_step": 495455, "epoch": 2949} {"train_loss": -10.77524471282959, "global_step": 495456, "epoch": 2949} {"train_loss": -9.760716438293457, "global_step": 495457, "epoch": 2949} {"train_loss": -10.398919105529785, "global_step": 495458, "epoch": 2949} {"train_loss": -10.783946990966797, "global_step": 495459, "epoch": 2949} {"train_loss": -10.256814002990723, "global_step": 495460, "epoch": 2949} {"train_loss": -10.343097686767578, "global_step": 495461, "epoch": 2949} {"train_loss": -11.456731796264648, "global_step": 495462, "epoch": 2949} {"train_loss": -10.955007553100586, "global_step": 495463, "epoch": 2949} {"train_loss": -11.853670120239258, "global_step": 495464, "epoch": 2949} {"train_loss": -11.657410621643066, "global_step": 495465, "epoch": 2949} {"train_loss": -12.163057327270508, "global_step": 495466, "epoch": 2949} {"train_loss": -11.409404754638672, "global_step": 495467, "epoch": 2949} {"train_loss": -11.718391418457031, "global_step": 495468, "epoch": 2949} {"train_loss": -12.247214317321777, "global_step": 495469, "epoch": 2949} {"train_loss": -12.398200988769531, "global_step": 495470, "epoch": 2949} {"train_loss": -12.295703887939453, "global_step": 495471, "epoch": 2949} {"train_loss": -12.482995986938477, "global_step": 495472, "epoch": 2949} {"train_loss": -12.17340087890625, "global_step": 495473, "epoch": 2949} {"train_loss": -12.385917663574219, "global_step": 495474, "epoch": 2949} {"train_loss": -12.031500816345215, "global_step": 495475, "epoch": 2949} {"train_loss": -11.842655181884766, "global_step": 495476, "epoch": 2949} {"train_loss": -12.352790832519531, "global_step": 495477, "epoch": 2949} {"train_loss": -12.250043869018555, "global_step": 495478, "epoch": 2949} {"train_loss": -12.472599029541016, "global_step": 495479, "epoch": 2949} {"train_loss": -11.824063301086426, "global_step": 495480, "epoch": 2949} {"train_loss": -12.624197006225586, "global_step": 495481, "epoch": 2949} {"train_loss": -11.743602752685547, "global_step": 495482, "epoch": 2949} {"train_loss": -12.356036186218262, "global_step": 495483, "epoch": 2949} {"train_loss": -11.995078086853027, "global_step": 495484, "epoch": 2949} {"train_loss": -12.483258247375488, "global_step": 495485, "epoch": 2949} {"train_loss": -11.998258590698242, "global_step": 495486, "epoch": 2949} {"train_loss": -12.403958320617676, "global_step": 495487, "epoch": 2949} {"train_loss": -12.358383178710938, "global_step": 495488, "epoch": 2949} {"train_loss": -12.199915885925293, "global_step": 495489, "epoch": 2949} {"train_loss": -12.59022331237793, "global_step": 495490, "epoch": 2949} {"train_loss": -12.071650505065918, "global_step": 495491, "epoch": 2949} {"train_loss": -12.262420654296875, "global_step": 495492, "epoch": 2949} {"train_loss": -12.341449737548828, "global_step": 495493, "epoch": 2949} {"train_loss": -12.113052368164062, "global_step": 495494, "epoch": 2949} {"train_loss": -12.597501754760742, "global_step": 495495, "epoch": 2949} {"train_loss": -11.945503234863281, "global_step": 495496, "epoch": 2949} {"train_loss": -12.420771598815918, "global_step": 495497, "epoch": 2949} {"train_loss": -12.17111873626709, "global_step": 495498, "epoch": 2949} {"train_loss": -12.515861511230469, "global_step": 495499, "epoch": 2949} {"train_loss": -12.107778549194336, "global_step": 495500, "epoch": 2949} {"train_loss": -12.46800422668457, "global_step": 495501, "epoch": 2949} {"train_loss": -11.97896957397461, "global_step": 495502, "epoch": 2949} {"train_loss": -12.269216537475586, "global_step": 495503, "epoch": 2949} {"train_loss": -11.93355655670166, "global_step": 495504, "epoch": 2949} {"train_loss": -12.328506469726562, "global_step": 495505, "epoch": 2949} {"train_loss": -12.497312545776367, "global_step": 495506, "epoch": 2949} {"train_loss": -12.106856346130371, "global_step": 495507, "epoch": 2949} {"train_loss": -12.723993301391602, "global_step": 495508, "epoch": 2949} {"train_loss": -12.478336334228516, "global_step": 495509, "epoch": 2949} {"train_loss": -12.425793647766113, "global_step": 495510, "epoch": 2949} {"train_loss": -12.668953895568848, "global_step": 495511, "epoch": 2949} {"train_loss": -12.42197036743164, "global_step": 495512, "epoch": 2949} {"train_loss": -12.689387321472168, "global_step": 495513, "epoch": 2949} {"train_loss": -12.428450584411621, "global_step": 495514, "epoch": 2949} {"train_loss": -12.599058151245117, "global_step": 495515, "epoch": 2949} {"train_loss": -12.381208419799805, "global_step": 495516, "epoch": 2949} {"train_loss": -12.84262466430664, "global_step": 495517, "epoch": 2949} {"train_loss": -12.621936798095703, "global_step": 495518, "epoch": 2949} {"train_loss": -12.515178680419922, "global_step": 495519, "epoch": 2949} {"train_loss": -12.633461952209473, "global_step": 495520, "epoch": 2949} {"train_loss": -12.095559120178223, "global_step": 495521, "epoch": 2949} {"train_loss": -12.468456268310547, "global_step": 495522, "epoch": 2949} {"train_loss": -12.619222640991211, "global_step": 495523, "epoch": 2949} {"train_loss": -12.263181686401367, "global_step": 495524, "epoch": 2949} {"train_loss": -12.689395904541016, "global_step": 495525, "epoch": 2949} {"train_loss": -12.286130905151367, "global_step": 495526, "epoch": 2949} {"train_loss": -12.319976806640625, "global_step": 495527, "epoch": 2949} {"train_loss": -12.634928703308105, "global_step": 495528, "epoch": 2949} {"train_loss": -12.477838516235352, "global_step": 495529, "epoch": 2949} {"train_loss": -12.602787017822266, "global_step": 495530, "epoch": 2949} {"train_loss": -12.211464881896973, "global_step": 495531, "epoch": 2949} {"train_loss": -12.365913391113281, "global_step": 495532, "epoch": 2949} {"train_loss": -12.228483200073242, "global_step": 495533, "epoch": 2949} {"train_loss": -12.020805358886719, "global_step": 495534, "epoch": 2949} {"train_loss": -12.928925514221191, "global_step": 495535, "epoch": 2949} {"train_loss": -12.708614349365234, "global_step": 495536, "epoch": 2949} {"train_loss": -12.750089645385742, "global_step": 495537, "epoch": 2949} {"train_loss": -12.583672523498535, "global_step": 495538, "epoch": 2949} {"train_loss": -12.467757225036621, "global_step": 495539, "epoch": 2949} {"train_loss": -12.568832397460938, "global_step": 495540, "epoch": 2949} {"train_loss": -12.471918106079102, "global_step": 495541, "epoch": 2949} {"train_loss": -12.571638107299805, "global_step": 495542, "epoch": 2949} {"train_loss": -12.546191215515137, "global_step": 495543, "epoch": 2949} {"train_loss": -12.8486328125, "global_step": 495544, "epoch": 2949} {"train_loss": -12.67044448852539, "global_step": 495545, "epoch": 2949} {"train_loss": -12.499631881713867, "global_step": 495546, "epoch": 2949} {"train_loss": -12.772842407226562, "global_step": 495547, "epoch": 2949} {"train_loss": -12.873327255249023, "global_step": 495548, "epoch": 2949} {"train_loss": -12.885686874389648, "global_step": 495549, "epoch": 2949} {"train_loss": -12.643136978149414, "global_step": 495550, "epoch": 2949} {"train_loss": -13.017745971679688, "global_step": 495551, "epoch": 2949} {"train_loss": -12.546732902526855, "global_step": 495552, "epoch": 2949} {"train_loss": -12.820704460144043, "global_step": 495553, "epoch": 2949} {"train_loss": -12.799718856811523, "global_step": 495554, "epoch": 2949} {"train_loss": -12.601149559020996, "global_step": 495555, "epoch": 2949} {"train_loss": -12.859670639038086, "global_step": 495556, "epoch": 2949} {"train_loss": -12.614019393920898, "global_step": 495557, "epoch": 2949} {"train_loss": -12.948009490966797, "global_step": 495558, "epoch": 2949} {"train_loss": -12.633150100708008, "global_step": 495559, "epoch": 2949} {"train_loss": -12.725493431091309, "global_step": 495560, "epoch": 2949} {"train_loss": -12.629716873168945, "global_step": 495561, "epoch": 2949} {"train_loss": -12.886837005615234, "global_step": 495562, "epoch": 2949} {"train_loss": -12.683258056640625, "global_step": 495563, "epoch": 2949} {"train_loss": -12.876811027526855, "global_step": 495564, "epoch": 2949} {"train_loss": -12.81740665435791, "global_step": 495565, "epoch": 2949} {"train_loss": -12.941125869750977, "global_step": 495566, "epoch": 2949} {"train_loss": -12.75560188293457, "global_step": 495567, "epoch": 2949} {"train_loss": -12.976081848144531, "global_step": 495568, "epoch": 2949} {"train_loss": -13.026742935180664, "global_step": 495569, "epoch": 2949} {"train_loss": -12.940136909484863, "global_step": 495570, "epoch": 2949} {"train_loss": -12.927492141723633, "global_step": 495571, "epoch": 2949} {"train_loss": -12.965822219848633, "global_step": 495572, "epoch": 2949} {"train_loss": -12.887120246887207, "global_step": 495573, "epoch": 2949} {"train_loss": -12.940216064453125, "global_step": 495574, "epoch": 2949} {"train_loss": -12.900506973266602, "global_step": 495575, "epoch": 2949} {"train_loss": -13.107294082641602, "global_step": 495576, "epoch": 2949} {"train_loss": -13.020246505737305, "global_step": 495577, "epoch": 2949} {"train_loss": -13.039899826049805, "global_step": 495578, "epoch": 2949} {"train_loss": -12.942060470581055, "global_step": 495579, "epoch": 2949} {"train_loss": -12.887778282165527, "global_step": 495580, "epoch": 2949} {"train_loss": -12.827713012695312, "global_step": 495581, "epoch": 2949} {"train_loss": -12.999335289001465, "global_step": 495582, "epoch": 2949} {"train_loss": -13.134322166442871, "global_step": 495583, "epoch": 2949} {"train_loss": -12.831990242004395, "global_step": 495584, "epoch": 2949} {"train_loss": -12.671038627624512, "global_step": 495585, "epoch": 2949} {"train_loss": -12.891668319702148, "global_step": 495586, "epoch": 2949} {"train_loss": -12.734674453735352, "global_step": 495587, "epoch": 2949} {"train_loss": -12.716818809509277, "global_step": 495588, "epoch": 2949} {"train_loss": -12.588252067565918, "global_step": 495589, "epoch": 2949} {"train_loss": -12.358770370483398, "global_step": 495590, "epoch": 2949} {"train_loss": -12.352946281433105, "global_step": 495591, "epoch": 2949} {"train_loss": -12.662299156188965, "global_step": 495592, "epoch": 2949} {"train_loss": -12.166399955749512, "global_step": 495593, "epoch": 2949} {"train_loss": -11.17507266998291, "global_step": 495594, "epoch": 2949} {"train_loss": -10.054916381835938, "global_step": 495595, "epoch": 2949} {"train_loss": -9.990545272827148, "global_step": 495596, "epoch": 2949} {"train_loss": -11.02212905883789, "global_step": 495597, "epoch": 2949} {"train_loss": -10.716390609741211, "global_step": 495598, "epoch": 2949} {"train_loss": -12.144244682221185, "global_step": 495599, "epoch": 2949, "val_loss": 319918.40625} {"train_loss": -11.823293685913086, "global_step": 495600, "epoch": 2950} {"train_loss": -10.916818618774414, "global_step": 495601, "epoch": 2950} {"train_loss": -10.344001770019531, "global_step": 495602, "epoch": 2950} {"train_loss": -11.015837669372559, "global_step": 495603, "epoch": 2950} {"train_loss": -10.162104606628418, "global_step": 495604, "epoch": 2950} {"train_loss": -10.407793045043945, "global_step": 495605, "epoch": 2950} {"train_loss": -9.211078643798828, "global_step": 495606, "epoch": 2950} {"train_loss": -7.447774410247803, "global_step": 495607, "epoch": 2950} {"train_loss": -7.408260822296143, "global_step": 495608, "epoch": 2950} {"train_loss": -6.7731709480285645, "global_step": 495609, "epoch": 2950} {"train_loss": -7.081761360168457, "global_step": 495610, "epoch": 2950} {"train_loss": -7.185637950897217, "global_step": 495611, "epoch": 2950} {"train_loss": -7.211395263671875, "global_step": 495612, "epoch": 2950} {"train_loss": -7.296016693115234, "global_step": 495613, "epoch": 2950} {"train_loss": -7.553774356842041, "global_step": 495614, "epoch": 2950} {"train_loss": -8.131416320800781, "global_step": 495615, "epoch": 2950} {"train_loss": -8.10226058959961, "global_step": 495616, "epoch": 2950} {"train_loss": -8.289426803588867, "global_step": 495617, "epoch": 2950} {"train_loss": -8.227910995483398, "global_step": 495618, "epoch": 2950} {"train_loss": -7.983139514923096, "global_step": 495619, "epoch": 2950} {"train_loss": -8.58029556274414, "global_step": 495620, "epoch": 2950} {"train_loss": -8.73121452331543, "global_step": 495621, "epoch": 2950} {"train_loss": -8.710766792297363, "global_step": 495622, "epoch": 2950} {"train_loss": -9.2798490524292, "global_step": 495623, "epoch": 2950} {"train_loss": -8.996580123901367, "global_step": 495624, "epoch": 2950} {"train_loss": -8.963277816772461, "global_step": 495625, "epoch": 2950} {"train_loss": -9.282793998718262, "global_step": 495626, "epoch": 2950} {"train_loss": -9.156242370605469, "global_step": 495627, "epoch": 2950} {"train_loss": -9.168865203857422, "global_step": 495628, "epoch": 2950} {"train_loss": -9.593931198120117, "global_step": 495629, "epoch": 2950} {"train_loss": -9.856115341186523, "global_step": 495630, "epoch": 2950} {"train_loss": -9.445405960083008, "global_step": 495631, "epoch": 2950} {"train_loss": -9.696734428405762, "global_step": 495632, "epoch": 2950} {"train_loss": -9.814531326293945, "global_step": 495633, "epoch": 2950} {"train_loss": -10.401355743408203, "global_step": 495634, "epoch": 2950} {"train_loss": -10.116579055786133, "global_step": 495635, "epoch": 2950} {"train_loss": -11.323410987854004, "global_step": 495636, "epoch": 2950} {"train_loss": -10.809813499450684, "global_step": 495637, "epoch": 2950} {"train_loss": -11.262174606323242, "global_step": 495638, "epoch": 2950} {"train_loss": -11.42396068572998, "global_step": 495639, "epoch": 2950} {"train_loss": -11.354222297668457, "global_step": 495640, "epoch": 2950} {"train_loss": -11.48115348815918, "global_step": 495641, "epoch": 2950} {"train_loss": -11.516401290893555, "global_step": 495642, "epoch": 2950} {"train_loss": -11.631616592407227, "global_step": 495643, "epoch": 2950} {"train_loss": -11.498795509338379, "global_step": 495644, "epoch": 2950} {"train_loss": -11.706962585449219, "global_step": 495645, "epoch": 2950} {"train_loss": -11.501800537109375, "global_step": 495646, "epoch": 2950} {"train_loss": -12.092742919921875, "global_step": 495647, "epoch": 2950} {"train_loss": -11.57244873046875, "global_step": 495648, "epoch": 2950} {"train_loss": -12.125815391540527, "global_step": 495649, "epoch": 2950} {"train_loss": -11.6474609375, "global_step": 495650, "epoch": 2950} {"train_loss": -11.89443588256836, "global_step": 495651, "epoch": 2950} {"train_loss": -11.903107643127441, "global_step": 495652, "epoch": 2950} {"train_loss": -12.338753700256348, "global_step": 495653, "epoch": 2950} {"train_loss": -12.084840774536133, "global_step": 495654, "epoch": 2950} {"train_loss": -12.10912799835205, "global_step": 495655, "epoch": 2950} {"train_loss": -12.251476287841797, "global_step": 495656, "epoch": 2950} {"train_loss": -12.146034240722656, "global_step": 495657, "epoch": 2950} {"train_loss": -12.127021789550781, "global_step": 495658, "epoch": 2950} {"train_loss": -12.270456314086914, "global_step": 495659, "epoch": 2950} {"train_loss": -12.17254638671875, "global_step": 495660, "epoch": 2950} {"train_loss": -12.41767692565918, "global_step": 495661, "epoch": 2950} {"train_loss": -12.351847648620605, "global_step": 495662, "epoch": 2950} {"train_loss": -12.337681770324707, "global_step": 495663, "epoch": 2950} {"train_loss": -12.533705711364746, "global_step": 495664, "epoch": 2950} {"train_loss": -12.080560684204102, "global_step": 495665, "epoch": 2950} {"train_loss": -12.74293327331543, "global_step": 495666, "epoch": 2950} {"train_loss": -12.526163101196289, "global_step": 495667, "epoch": 2950} {"train_loss": -12.575397491455078, "global_step": 495668, "epoch": 2950} {"train_loss": -12.439159393310547, "global_step": 495669, "epoch": 2950} {"train_loss": -12.595415115356445, "global_step": 495670, "epoch": 2950} {"train_loss": -12.552652359008789, "global_step": 495671, "epoch": 2950} {"train_loss": -12.488161087036133, "global_step": 495672, "epoch": 2950} {"train_loss": -12.453540802001953, "global_step": 495673, "epoch": 2950} {"train_loss": -12.72986125946045, "global_step": 495674, "epoch": 2950} {"train_loss": -12.688289642333984, "global_step": 495675, "epoch": 2950} {"train_loss": -12.725709915161133, "global_step": 495676, "epoch": 2950} {"train_loss": -12.498056411743164, "global_step": 495677, "epoch": 2950} {"train_loss": -12.604606628417969, "global_step": 495678, "epoch": 2950} {"train_loss": -12.489480972290039, "global_step": 495679, "epoch": 2950} {"train_loss": -12.664023399353027, "global_step": 495680, "epoch": 2950} {"train_loss": -12.308835983276367, "global_step": 495681, "epoch": 2950} {"train_loss": -12.692967414855957, "global_step": 495682, "epoch": 2950} {"train_loss": -12.268308639526367, "global_step": 495683, "epoch": 2950} {"train_loss": -12.532209396362305, "global_step": 495684, "epoch": 2950} {"train_loss": -12.671063423156738, "global_step": 495685, "epoch": 2950} {"train_loss": -12.318944931030273, "global_step": 495686, "epoch": 2950} {"train_loss": -11.925966262817383, "global_step": 495687, "epoch": 2950} {"train_loss": -12.685382843017578, "global_step": 495688, "epoch": 2950} {"train_loss": -12.350064277648926, "global_step": 495689, "epoch": 2950} {"train_loss": -12.19195556640625, "global_step": 495690, "epoch": 2950} {"train_loss": -12.049159049987793, "global_step": 495691, "epoch": 2950} {"train_loss": -12.77137565612793, "global_step": 495692, "epoch": 2950} {"train_loss": -12.117937088012695, "global_step": 495693, "epoch": 2950} {"train_loss": -11.877279281616211, "global_step": 495694, "epoch": 2950} {"train_loss": -12.336431503295898, "global_step": 495695, "epoch": 2950} {"train_loss": -11.748281478881836, "global_step": 495696, "epoch": 2950} {"train_loss": -12.283186912536621, "global_step": 495697, "epoch": 2950} {"train_loss": -12.082014083862305, "global_step": 495698, "epoch": 2950} {"train_loss": -12.222314834594727, "global_step": 495699, "epoch": 2950} {"train_loss": -12.149547576904297, "global_step": 495700, "epoch": 2950} {"train_loss": -12.450987815856934, "global_step": 495701, "epoch": 2950} {"train_loss": -12.36824893951416, "global_step": 495702, "epoch": 2950} {"train_loss": -12.656761169433594, "global_step": 495703, "epoch": 2950} {"train_loss": -12.19488525390625, "global_step": 495704, "epoch": 2950} {"train_loss": -12.406856536865234, "global_step": 495705, "epoch": 2950} {"train_loss": -11.951089859008789, "global_step": 495706, "epoch": 2950} {"train_loss": -12.492657661437988, "global_step": 495707, "epoch": 2950} {"train_loss": -12.175267219543457, "global_step": 495708, "epoch": 2950} {"train_loss": -12.452856063842773, "global_step": 495709, "epoch": 2950} {"train_loss": -12.114950180053711, "global_step": 495710, "epoch": 2950} {"train_loss": -12.42151165008545, "global_step": 495711, "epoch": 2950} {"train_loss": -12.0963716506958, "global_step": 495712, "epoch": 2950} {"train_loss": -12.040407180786133, "global_step": 495713, "epoch": 2950} {"train_loss": -11.095983505249023, "global_step": 495714, "epoch": 2950} {"train_loss": -12.065374374389648, "global_step": 495715, "epoch": 2950} {"train_loss": -11.232650756835938, "global_step": 495716, "epoch": 2950} {"train_loss": -12.046791076660156, "global_step": 495717, "epoch": 2950} {"train_loss": -10.966556549072266, "global_step": 495718, "epoch": 2950} {"train_loss": -12.158487319946289, "global_step": 495719, "epoch": 2950} {"train_loss": -11.849881172180176, "global_step": 495720, "epoch": 2950} {"train_loss": -12.545401573181152, "global_step": 495721, "epoch": 2950} {"train_loss": -11.518107414245605, "global_step": 495722, "epoch": 2950} {"train_loss": -10.977910995483398, "global_step": 495723, "epoch": 2950} {"train_loss": -11.966253280639648, "global_step": 495724, "epoch": 2950} {"train_loss": -11.865909576416016, "global_step": 495725, "epoch": 2950} {"train_loss": -11.32941722869873, "global_step": 495726, "epoch": 2950} {"train_loss": -11.134893417358398, "global_step": 495727, "epoch": 2950} {"train_loss": -10.816309928894043, "global_step": 495728, "epoch": 2950} {"train_loss": -10.732770919799805, "global_step": 495729, "epoch": 2950} {"train_loss": -10.320984840393066, "global_step": 495730, "epoch": 2950} {"train_loss": -10.766680717468262, "global_step": 495731, "epoch": 2950} {"train_loss": -11.222354888916016, "global_step": 495732, "epoch": 2950} {"train_loss": -12.14872932434082, "global_step": 495733, "epoch": 2950} {"train_loss": -11.483352661132812, "global_step": 495734, "epoch": 2950} {"train_loss": -11.849706649780273, "global_step": 495735, "epoch": 2950} {"train_loss": -11.73082160949707, "global_step": 495736, "epoch": 2950} {"train_loss": -12.108184814453125, "global_step": 495737, "epoch": 2950} {"train_loss": -11.382858276367188, "global_step": 495738, "epoch": 2950} {"train_loss": -12.07707405090332, "global_step": 495739, "epoch": 2950} {"train_loss": -11.99993896484375, "global_step": 495740, "epoch": 2950} {"train_loss": -11.79703140258789, "global_step": 495741, "epoch": 2950} {"train_loss": -12.051725387573242, "global_step": 495742, "epoch": 2950} {"train_loss": -10.713333129882812, "global_step": 495743, "epoch": 2950} {"train_loss": -11.193028450012207, "global_step": 495744, "epoch": 2950} {"train_loss": -10.7445068359375, "global_step": 495745, "epoch": 2950} {"train_loss": -11.782751083374023, "global_step": 495746, "epoch": 2950} {"train_loss": -11.881150245666504, "global_step": 495747, "epoch": 2950} {"train_loss": -11.357126235961914, "global_step": 495748, "epoch": 2950} {"train_loss": -11.963918685913086, "global_step": 495749, "epoch": 2950} {"train_loss": -11.358531951904297, "global_step": 495750, "epoch": 2950} {"train_loss": -11.821074485778809, "global_step": 495751, "epoch": 2950} {"train_loss": -12.032402038574219, "global_step": 495752, "epoch": 2950} {"train_loss": -11.974687576293945, "global_step": 495753, "epoch": 2950} {"train_loss": -12.570990562438965, "global_step": 495754, "epoch": 2950} {"train_loss": -12.039708137512207, "global_step": 495755, "epoch": 2950} {"train_loss": -11.884330749511719, "global_step": 495756, "epoch": 2950} {"train_loss": -12.242257118225098, "global_step": 495757, "epoch": 2950} {"train_loss": -12.071258544921875, "global_step": 495758, "epoch": 2950} {"train_loss": -12.358784675598145, "global_step": 495759, "epoch": 2950} {"train_loss": -11.989635467529297, "global_step": 495760, "epoch": 2950} {"train_loss": -12.450515747070312, "global_step": 495761, "epoch": 2950} {"train_loss": -12.257120132446289, "global_step": 495762, "epoch": 2950} {"train_loss": -12.541677474975586, "global_step": 495763, "epoch": 2950} {"train_loss": -12.096406936645508, "global_step": 495764, "epoch": 2950} {"train_loss": -12.323083877563477, "global_step": 495765, "epoch": 2950} {"train_loss": -12.152844429016113, "global_step": 495766, "epoch": 2950} {"train_loss": -11.346194891702561, "global_step": 495767, "epoch": 2950, "train/sim_max_reward_0": 0.5223346460149615, "train/sim_max_reward_1": 0.9158905666976199, "train/sim_max_reward_2": 0.010533626131068133, "train/sim_max_reward_3": 0.5964612426960473, "train/sim_max_reward_4": 0.4866332088477317, "train/sim_max_reward_5": 0.9579717781842964, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.36924293444838857, "test/sim_max_reward_4400002": 0.48099818558981755, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.5383708041715976, "test/sim_max_reward_4400005": 0.33563549497571343, "test/sim_max_reward_4400006": 0.5471507736346567, "test/sim_max_reward_4400007": 0.9861444778773175, "test/sim_max_reward_4400008": 0.5662833119919264, "test/sim_max_reward_4400009": 0.35355830251705933, "test/sim_max_reward_4400010": 0.687125001659276, "test/sim_max_reward_4400011": 0.296347197406832, "test/sim_max_reward_4400012": 0.9494281824545745, "test/sim_max_reward_4400013": 0.9544564085810939, "test/sim_max_reward_4400014": 0.9629562045666608, "test/sim_max_reward_4400015": 0.3407029926414314, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.9980783020657832, "test/sim_max_reward_4400018": 0.9945974412648052, "test/sim_max_reward_4400019": 0.22996071622075154, "test/sim_max_reward_4400020": 0.00021042560632409413, "test/sim_max_reward_4400021": 0.6920069562224769, "test/sim_max_reward_4400022": 0.945691477656678, "test/sim_max_reward_4400023": 0.1508976006686911, "test/sim_max_reward_4400024": 0.943280310183993, "test/sim_max_reward_4400025": 0.6416841035176565, "test/sim_max_reward_4400026": 0.9716969683669325, "test/sim_max_reward_4400027": 0.1657870485928917, "test/sim_max_reward_4400028": 0.709403641406481, "test/sim_max_reward_4400029": 0.8580640523878121, "test/sim_max_reward_4400030": 0.9779781649351755, "test/sim_max_reward_4400031": 0.536301020701373, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.13975954442219524, "test/sim_max_reward_4400034": 0.7054325772177193, "test/sim_max_reward_4400035": 0.9475875360464991, "test/sim_max_reward_4400036": 0.3715826803870978, "test/sim_max_reward_4400037": 1.0, "test/sim_max_reward_4400038": 0.3252040579503638, "test/sim_max_reward_4400039": 0.4115442382477297, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.1666686710391285, "test/sim_max_reward_4400042": 0.9807062808992403, "test/sim_max_reward_4400043": 0.026861411251511556, "test/sim_max_reward_4400044": 0.46719677340195226, "test/sim_max_reward_4400045": 1.0, "test/sim_max_reward_4400046": 0.3353046570945017, "test/sim_max_reward_4400047": 0.9972421696261634, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.5816375114286209, "test/mean_score": 0.5411825819979654, "val_loss": 316857.75, "train_action_mse_error": 0.767711341381073} {"train_loss": -12.43808364868164, "global_step": 495768, "epoch": 2951} {"train_loss": -12.547224044799805, "global_step": 495769, "epoch": 2951} {"train_loss": -12.281825065612793, "global_step": 495770, "epoch": 2951} {"train_loss": -12.471580505371094, "global_step": 495771, "epoch": 2951} {"train_loss": -12.146438598632812, "global_step": 495772, "epoch": 2951} {"train_loss": -12.63769245147705, "global_step": 495773, "epoch": 2951} {"train_loss": -12.509065628051758, "global_step": 495774, "epoch": 2951} {"train_loss": -12.523756980895996, "global_step": 495775, "epoch": 2951} {"train_loss": -12.811328887939453, "global_step": 495776, "epoch": 2951} {"train_loss": -12.663992881774902, "global_step": 495777, "epoch": 2951} {"train_loss": -12.793929100036621, "global_step": 495778, "epoch": 2951} {"train_loss": -12.473699569702148, "global_step": 495779, "epoch": 2951} {"train_loss": -12.584976196289062, "global_step": 495780, "epoch": 2951} {"train_loss": -12.91915512084961, "global_step": 495781, "epoch": 2951} {"train_loss": -12.917393684387207, "global_step": 495782, "epoch": 2951} {"train_loss": -12.599552154541016, "global_step": 495783, "epoch": 2951} {"train_loss": -12.647022247314453, "global_step": 495784, "epoch": 2951} {"train_loss": -12.578592300415039, "global_step": 495785, "epoch": 2951} {"train_loss": -12.402397155761719, "global_step": 495786, "epoch": 2951} {"train_loss": -12.804752349853516, "global_step": 495787, "epoch": 2951} {"train_loss": -12.516910552978516, "global_step": 495788, "epoch": 2951} {"train_loss": -12.488485336303711, "global_step": 495789, "epoch": 2951} {"train_loss": -12.82874870300293, "global_step": 495790, "epoch": 2951} {"train_loss": -12.551958084106445, "global_step": 495791, "epoch": 2951} {"train_loss": -12.640417098999023, "global_step": 495792, "epoch": 2951} {"train_loss": -12.190217018127441, "global_step": 495793, "epoch": 2951} {"train_loss": -12.242549896240234, "global_step": 495794, "epoch": 2951} {"train_loss": -12.501922607421875, "global_step": 495795, "epoch": 2951} {"train_loss": -12.470780372619629, "global_step": 495796, "epoch": 2951} {"train_loss": -12.24966049194336, "global_step": 495797, "epoch": 2951} {"train_loss": -12.70846939086914, "global_step": 495798, "epoch": 2951} {"train_loss": -12.663744926452637, "global_step": 495799, "epoch": 2951} {"train_loss": -12.496990203857422, "global_step": 495800, "epoch": 2951} {"train_loss": -12.115434646606445, "global_step": 495801, "epoch": 2951} {"train_loss": -12.467010498046875, "global_step": 495802, "epoch": 2951} {"train_loss": -12.443065643310547, "global_step": 495803, "epoch": 2951} {"train_loss": -12.815557479858398, "global_step": 495804, "epoch": 2951} {"train_loss": -12.66836166381836, "global_step": 495805, "epoch": 2951} {"train_loss": -12.81764030456543, "global_step": 495806, "epoch": 2951} {"train_loss": -12.599079132080078, "global_step": 495807, "epoch": 2951} {"train_loss": -12.656877517700195, "global_step": 495808, "epoch": 2951} {"train_loss": -12.624805450439453, "global_step": 495809, "epoch": 2951} {"train_loss": -12.682392120361328, "global_step": 495810, "epoch": 2951} {"train_loss": -12.588956832885742, "global_step": 495811, "epoch": 2951} {"train_loss": -12.588569641113281, "global_step": 495812, "epoch": 2951} {"train_loss": -12.571942329406738, "global_step": 495813, "epoch": 2951} {"train_loss": -12.448688507080078, "global_step": 495814, "epoch": 2951} {"train_loss": -12.607521057128906, "global_step": 495815, "epoch": 2951} {"train_loss": -12.249580383300781, "global_step": 495816, "epoch": 2951} {"train_loss": -12.773849487304688, "global_step": 495817, "epoch": 2951} {"train_loss": -12.867777824401855, "global_step": 495818, "epoch": 2951} {"train_loss": -12.484424591064453, "global_step": 495819, "epoch": 2951} {"train_loss": -12.266031265258789, "global_step": 495820, "epoch": 2951} {"train_loss": -12.621011734008789, "global_step": 495821, "epoch": 2951} {"train_loss": -12.229015350341797, "global_step": 495822, "epoch": 2951} {"train_loss": -12.721282958984375, "global_step": 495823, "epoch": 2951} {"train_loss": -12.500497817993164, "global_step": 495824, "epoch": 2951} {"train_loss": -12.302380561828613, "global_step": 495825, "epoch": 2951} {"train_loss": -12.62680435180664, "global_step": 495826, "epoch": 2951} {"train_loss": -12.698634147644043, "global_step": 495827, "epoch": 2951} {"train_loss": -11.804370880126953, "global_step": 495828, "epoch": 2951} {"train_loss": -12.388256072998047, "global_step": 495829, "epoch": 2951} {"train_loss": -12.294208526611328, "global_step": 495830, "epoch": 2951} {"train_loss": -11.775064468383789, "global_step": 495831, "epoch": 2951} {"train_loss": -11.557695388793945, "global_step": 495832, "epoch": 2951} {"train_loss": -11.795647621154785, "global_step": 495833, "epoch": 2951} {"train_loss": -11.390215873718262, "global_step": 495834, "epoch": 2951} {"train_loss": -11.831903457641602, "global_step": 495835, "epoch": 2951} {"train_loss": -10.431302070617676, "global_step": 495836, "epoch": 2951} {"train_loss": -11.482425689697266, "global_step": 495837, "epoch": 2951} {"train_loss": -11.966567993164062, "global_step": 495838, "epoch": 2951} {"train_loss": -11.048498153686523, "global_step": 495839, "epoch": 2951} {"train_loss": -12.392624855041504, "global_step": 495840, "epoch": 2951} {"train_loss": -10.67790412902832, "global_step": 495841, "epoch": 2951} {"train_loss": -11.794951438903809, "global_step": 495842, "epoch": 2951} {"train_loss": -12.030755996704102, "global_step": 495843, "epoch": 2951} {"train_loss": -11.69534683227539, "global_step": 495844, "epoch": 2951} {"train_loss": -11.902022361755371, "global_step": 495845, "epoch": 2951} {"train_loss": -11.786806106567383, "global_step": 495846, "epoch": 2951} {"train_loss": -12.474590301513672, "global_step": 495847, "epoch": 2951} {"train_loss": -12.010035514831543, "global_step": 495848, "epoch": 2951} {"train_loss": -12.21502685546875, "global_step": 495849, "epoch": 2951} {"train_loss": -12.419734001159668, "global_step": 495850, "epoch": 2951} {"train_loss": -11.552148818969727, "global_step": 495851, "epoch": 2951} {"train_loss": -12.206094741821289, "global_step": 495852, "epoch": 2951} {"train_loss": -10.949456214904785, "global_step": 495853, "epoch": 2951} {"train_loss": -11.555203437805176, "global_step": 495854, "epoch": 2951} {"train_loss": -11.670546531677246, "global_step": 495855, "epoch": 2951} {"train_loss": -10.907720565795898, "global_step": 495856, "epoch": 2951} {"train_loss": -12.600358963012695, "global_step": 495857, "epoch": 2951} {"train_loss": -11.749160766601562, "global_step": 495858, "epoch": 2951} {"train_loss": -11.781436920166016, "global_step": 495859, "epoch": 2951} {"train_loss": -12.604292869567871, "global_step": 495860, "epoch": 2951} {"train_loss": -12.015052795410156, "global_step": 495861, "epoch": 2951} {"train_loss": -11.822086334228516, "global_step": 495862, "epoch": 2951} {"train_loss": -12.672835350036621, "global_step": 495863, "epoch": 2951} {"train_loss": -12.240577697753906, "global_step": 495864, "epoch": 2951} {"train_loss": -12.1884183883667, "global_step": 495865, "epoch": 2951} {"train_loss": -12.312638282775879, "global_step": 495866, "epoch": 2951} {"train_loss": -10.983534812927246, "global_step": 495867, "epoch": 2951} {"train_loss": -12.071296691894531, "global_step": 495868, "epoch": 2951} {"train_loss": -10.316221237182617, "global_step": 495869, "epoch": 2951} {"train_loss": -11.9581298828125, "global_step": 495870, "epoch": 2951} {"train_loss": -9.874454498291016, "global_step": 495871, "epoch": 2951} {"train_loss": -12.535284996032715, "global_step": 495872, "epoch": 2951} {"train_loss": -9.698362350463867, "global_step": 495873, "epoch": 2951} {"train_loss": -11.849187850952148, "global_step": 495874, "epoch": 2951} {"train_loss": -10.372013092041016, "global_step": 495875, "epoch": 2951} {"train_loss": -10.068440437316895, "global_step": 495876, "epoch": 2951} {"train_loss": -10.96922492980957, "global_step": 495877, "epoch": 2951} {"train_loss": -11.257343292236328, "global_step": 495878, "epoch": 2951} {"train_loss": -11.245025634765625, "global_step": 495879, "epoch": 2951} {"train_loss": -9.925811767578125, "global_step": 495880, "epoch": 2951} {"train_loss": -11.638131141662598, "global_step": 495881, "epoch": 2951} {"train_loss": -10.96407413482666, "global_step": 495882, "epoch": 2951} {"train_loss": -11.64897632598877, "global_step": 495883, "epoch": 2951} {"train_loss": -11.232820510864258, "global_step": 495884, "epoch": 2951} {"train_loss": -11.493714332580566, "global_step": 495885, "epoch": 2951} {"train_loss": -10.966853141784668, "global_step": 495886, "epoch": 2951} {"train_loss": -11.157785415649414, "global_step": 495887, "epoch": 2951} {"train_loss": -10.51544189453125, "global_step": 495888, "epoch": 2951} {"train_loss": -11.460417747497559, "global_step": 495889, "epoch": 2951} {"train_loss": -11.416778564453125, "global_step": 495890, "epoch": 2951} {"train_loss": -10.261566162109375, "global_step": 495891, "epoch": 2951} {"train_loss": -11.905515670776367, "global_step": 495892, "epoch": 2951} {"train_loss": -11.010614395141602, "global_step": 495893, "epoch": 2951} {"train_loss": -12.093881607055664, "global_step": 495894, "epoch": 2951} {"train_loss": -11.066719055175781, "global_step": 495895, "epoch": 2951} {"train_loss": -12.48849105834961, "global_step": 495896, "epoch": 2951} {"train_loss": -11.060422897338867, "global_step": 495897, "epoch": 2951} {"train_loss": -12.05477523803711, "global_step": 495898, "epoch": 2951} {"train_loss": -11.502113342285156, "global_step": 495899, "epoch": 2951} {"train_loss": -12.235023498535156, "global_step": 495900, "epoch": 2951} {"train_loss": -11.27207088470459, "global_step": 495901, "epoch": 2951} {"train_loss": -12.17138957977295, "global_step": 495902, "epoch": 2951} {"train_loss": -11.748733520507812, "global_step": 495903, "epoch": 2951} {"train_loss": -12.367712020874023, "global_step": 495904, "epoch": 2951} {"train_loss": -12.348660469055176, "global_step": 495905, "epoch": 2951} {"train_loss": -12.368203163146973, "global_step": 495906, "epoch": 2951} {"train_loss": -12.366357803344727, "global_step": 495907, "epoch": 2951} {"train_loss": -12.459195137023926, "global_step": 495908, "epoch": 2951} {"train_loss": -12.018965721130371, "global_step": 495909, "epoch": 2951} {"train_loss": -12.300722122192383, "global_step": 495910, "epoch": 2951} {"train_loss": -12.188335418701172, "global_step": 495911, "epoch": 2951} {"train_loss": -12.436251640319824, "global_step": 495912, "epoch": 2951} {"train_loss": -12.321313858032227, "global_step": 495913, "epoch": 2951} {"train_loss": -12.391824722290039, "global_step": 495914, "epoch": 2951} {"train_loss": -12.455049514770508, "global_step": 495915, "epoch": 2951} {"train_loss": -12.580617904663086, "global_step": 495916, "epoch": 2951} {"train_loss": -12.54927921295166, "global_step": 495917, "epoch": 2951} {"train_loss": -12.503791809082031, "global_step": 495918, "epoch": 2951} {"train_loss": -12.467439651489258, "global_step": 495919, "epoch": 2951} {"train_loss": -12.522857666015625, "global_step": 495920, "epoch": 2951} {"train_loss": -12.411699295043945, "global_step": 495921, "epoch": 2951} {"train_loss": -12.687427520751953, "global_step": 495922, "epoch": 2951} {"train_loss": -12.533737182617188, "global_step": 495923, "epoch": 2951} {"train_loss": -12.600744247436523, "global_step": 495924, "epoch": 2951} {"train_loss": -12.626235961914062, "global_step": 495925, "epoch": 2951} {"train_loss": -12.680427551269531, "global_step": 495926, "epoch": 2951} {"train_loss": -12.66074275970459, "global_step": 495927, "epoch": 2951} {"train_loss": -12.717744827270508, "global_step": 495928, "epoch": 2951} {"train_loss": -12.513766288757324, "global_step": 495929, "epoch": 2951} {"train_loss": -12.748969078063965, "global_step": 495930, "epoch": 2951} {"train_loss": -12.837841033935547, "global_step": 495931, "epoch": 2951} {"train_loss": -12.785726547241211, "global_step": 495932, "epoch": 2951} {"train_loss": -12.753645896911621, "global_step": 495933, "epoch": 2951} {"train_loss": -12.666133880615234, "global_step": 495934, "epoch": 2951} {"train_loss": -12.097469886144003, "global_step": 495935, "epoch": 2951, "val_loss": 321034.96875} {"train_loss": -12.664718627929688, "global_step": 495936, "epoch": 2952} {"train_loss": -12.854524612426758, "global_step": 495937, "epoch": 2952} {"train_loss": -12.72649097442627, "global_step": 495938, "epoch": 2952} {"train_loss": -12.750001907348633, "global_step": 495939, "epoch": 2952} {"train_loss": -12.753058433532715, "global_step": 495940, "epoch": 2952} {"train_loss": -12.797256469726562, "global_step": 495941, "epoch": 2952} {"train_loss": -12.937768936157227, "global_step": 495942, "epoch": 2952} {"train_loss": -12.916009902954102, "global_step": 495943, "epoch": 2952} {"train_loss": -12.918462753295898, "global_step": 495944, "epoch": 2952} {"train_loss": -12.743173599243164, "global_step": 495945, "epoch": 2952} {"train_loss": -12.434501647949219, "global_step": 495946, "epoch": 2952} {"train_loss": -12.825345993041992, "global_step": 495947, "epoch": 2952} {"train_loss": -12.85761833190918, "global_step": 495948, "epoch": 2952} {"train_loss": -12.793920516967773, "global_step": 495949, "epoch": 2952} {"train_loss": -12.725830078125, "global_step": 495950, "epoch": 2952} {"train_loss": -12.804523468017578, "global_step": 495951, "epoch": 2952} {"train_loss": -12.767045974731445, "global_step": 495952, "epoch": 2952} {"train_loss": -13.005187034606934, "global_step": 495953, "epoch": 2952} {"train_loss": -12.879536628723145, "global_step": 495954, "epoch": 2952} {"train_loss": -12.818550109863281, "global_step": 495955, "epoch": 2952} {"train_loss": -12.789567947387695, "global_step": 495956, "epoch": 2952} {"train_loss": -12.675386428833008, "global_step": 495957, "epoch": 2952} {"train_loss": -12.901545524597168, "global_step": 495958, "epoch": 2952} {"train_loss": -12.65701961517334, "global_step": 495959, "epoch": 2952} {"train_loss": -12.451762199401855, "global_step": 495960, "epoch": 2952} {"train_loss": -12.764274597167969, "global_step": 495961, "epoch": 2952} {"train_loss": -12.700963973999023, "global_step": 495962, "epoch": 2952} {"train_loss": -12.753968238830566, "global_step": 495963, "epoch": 2952} {"train_loss": -12.808135986328125, "global_step": 495964, "epoch": 2952} {"train_loss": -12.74515438079834, "global_step": 495965, "epoch": 2952} {"train_loss": -12.696428298950195, "global_step": 495966, "epoch": 2952} {"train_loss": -12.942085266113281, "global_step": 495967, "epoch": 2952} {"train_loss": -12.707437515258789, "global_step": 495968, "epoch": 2952} {"train_loss": -12.215059280395508, "global_step": 495969, "epoch": 2952} {"train_loss": -12.259642601013184, "global_step": 495970, "epoch": 2952} {"train_loss": -12.029682159423828, "global_step": 495971, "epoch": 2952} {"train_loss": -12.374889373779297, "global_step": 495972, "epoch": 2952} {"train_loss": -11.52595329284668, "global_step": 495973, "epoch": 2952} {"train_loss": -11.984663009643555, "global_step": 495974, "epoch": 2952} {"train_loss": -12.463804244995117, "global_step": 495975, "epoch": 2952} {"train_loss": -12.356430053710938, "global_step": 495976, "epoch": 2952} {"train_loss": -12.220861434936523, "global_step": 495977, "epoch": 2952} {"train_loss": -11.895777702331543, "global_step": 495978, "epoch": 2952} {"train_loss": -12.78006649017334, "global_step": 495979, "epoch": 2952} {"train_loss": -12.010379791259766, "global_step": 495980, "epoch": 2952} {"train_loss": -13.045879364013672, "global_step": 495981, "epoch": 2952} {"train_loss": -11.841591835021973, "global_step": 495982, "epoch": 2952} {"train_loss": -12.785401344299316, "global_step": 495983, "epoch": 2952} {"train_loss": -12.386134147644043, "global_step": 495984, "epoch": 2952} {"train_loss": -12.38601303100586, "global_step": 495985, "epoch": 2952} {"train_loss": -11.899112701416016, "global_step": 495986, "epoch": 2952} {"train_loss": -12.862445831298828, "global_step": 495987, "epoch": 2952} {"train_loss": -12.543258666992188, "global_step": 495988, "epoch": 2952} {"train_loss": -12.335814476013184, "global_step": 495989, "epoch": 2952} {"train_loss": -12.713090896606445, "global_step": 495990, "epoch": 2952} {"train_loss": -12.742937088012695, "global_step": 495991, "epoch": 2952} {"train_loss": -12.08892822265625, "global_step": 495992, "epoch": 2952} {"train_loss": -12.187813758850098, "global_step": 495993, "epoch": 2952} {"train_loss": -12.34367561340332, "global_step": 495994, "epoch": 2952} {"train_loss": -12.31685733795166, "global_step": 495995, "epoch": 2952} {"train_loss": -10.959962844848633, "global_step": 495996, "epoch": 2952} {"train_loss": -12.088261604309082, "global_step": 495997, "epoch": 2952} {"train_loss": -10.482234954833984, "global_step": 495998, "epoch": 2952} {"train_loss": -11.97795581817627, "global_step": 495999, "epoch": 2952} {"train_loss": -11.676963806152344, "global_step": 496000, "epoch": 2952} {"train_loss": -11.671911239624023, "global_step": 496001, "epoch": 2952} {"train_loss": -12.31766414642334, "global_step": 496002, "epoch": 2952} {"train_loss": -11.148017883300781, "global_step": 496003, "epoch": 2952} {"train_loss": -11.64293098449707, "global_step": 496004, "epoch": 2952} {"train_loss": -12.42088508605957, "global_step": 496005, "epoch": 2952} {"train_loss": -11.882501602172852, "global_step": 496006, "epoch": 2952} {"train_loss": -11.551043510437012, "global_step": 496007, "epoch": 2952} {"train_loss": -12.160089492797852, "global_step": 496008, "epoch": 2952} {"train_loss": -12.313362121582031, "global_step": 496009, "epoch": 2952} {"train_loss": -12.458230018615723, "global_step": 496010, "epoch": 2952} {"train_loss": -11.748602867126465, "global_step": 496011, "epoch": 2952} {"train_loss": -12.629537582397461, "global_step": 496012, "epoch": 2952} {"train_loss": -12.133244514465332, "global_step": 496013, "epoch": 2952} {"train_loss": -12.458368301391602, "global_step": 496014, "epoch": 2952} {"train_loss": -12.676736831665039, "global_step": 496015, "epoch": 2952} {"train_loss": -12.493683815002441, "global_step": 496016, "epoch": 2952} {"train_loss": -12.627128601074219, "global_step": 496017, "epoch": 2952} {"train_loss": -12.553914070129395, "global_step": 496018, "epoch": 2952} {"train_loss": -12.789894104003906, "global_step": 496019, "epoch": 2952} {"train_loss": -12.933050155639648, "global_step": 496020, "epoch": 2952} {"train_loss": -12.54008674621582, "global_step": 496021, "epoch": 2952} {"train_loss": -12.79395580291748, "global_step": 496022, "epoch": 2952} {"train_loss": -12.597785949707031, "global_step": 496023, "epoch": 2952} {"train_loss": -13.062812805175781, "global_step": 496024, "epoch": 2952} {"train_loss": -12.82794189453125, "global_step": 496025, "epoch": 2952} {"train_loss": -12.86795711517334, "global_step": 496026, "epoch": 2952} {"train_loss": -12.48215389251709, "global_step": 496027, "epoch": 2952} {"train_loss": -12.783267974853516, "global_step": 496028, "epoch": 2952} {"train_loss": -12.739811897277832, "global_step": 496029, "epoch": 2952} {"train_loss": -12.796242713928223, "global_step": 496030, "epoch": 2952} {"train_loss": -12.74582576751709, "global_step": 496031, "epoch": 2952} {"train_loss": -12.708704948425293, "global_step": 496032, "epoch": 2952} {"train_loss": -12.957170486450195, "global_step": 496033, "epoch": 2952} {"train_loss": -12.778696060180664, "global_step": 496034, "epoch": 2952} {"train_loss": -12.496522903442383, "global_step": 496035, "epoch": 2952} {"train_loss": -13.056118965148926, "global_step": 496036, "epoch": 2952} {"train_loss": -12.752565383911133, "global_step": 496037, "epoch": 2952} {"train_loss": -12.756194114685059, "global_step": 496038, "epoch": 2952} {"train_loss": -12.966390609741211, "global_step": 496039, "epoch": 2952} {"train_loss": -12.956398010253906, "global_step": 496040, "epoch": 2952} {"train_loss": -12.907076835632324, "global_step": 496041, "epoch": 2952} {"train_loss": -12.885064125061035, "global_step": 496042, "epoch": 2952} {"train_loss": -12.806163787841797, "global_step": 496043, "epoch": 2952} {"train_loss": -12.861886978149414, "global_step": 496044, "epoch": 2952} {"train_loss": -12.672052383422852, "global_step": 496045, "epoch": 2952} {"train_loss": -12.929214477539062, "global_step": 496046, "epoch": 2952} {"train_loss": -12.912859916687012, "global_step": 496047, "epoch": 2952} {"train_loss": -12.720064163208008, "global_step": 496048, "epoch": 2952} {"train_loss": -12.65857219696045, "global_step": 496049, "epoch": 2952} {"train_loss": -11.850343704223633, "global_step": 496050, "epoch": 2952} {"train_loss": -12.298357009887695, "global_step": 496051, "epoch": 2952} {"train_loss": -12.470335006713867, "global_step": 496052, "epoch": 2952} {"train_loss": -12.233890533447266, "global_step": 496053, "epoch": 2952} {"train_loss": -11.881540298461914, "global_step": 496054, "epoch": 2952} {"train_loss": -11.989425659179688, "global_step": 496055, "epoch": 2952} {"train_loss": -12.442571640014648, "global_step": 496056, "epoch": 2952} {"train_loss": -11.736026763916016, "global_step": 496057, "epoch": 2952} {"train_loss": -12.7886962890625, "global_step": 496058, "epoch": 2952} {"train_loss": -11.916994094848633, "global_step": 496059, "epoch": 2952} {"train_loss": -11.874387741088867, "global_step": 496060, "epoch": 2952} {"train_loss": -11.297735214233398, "global_step": 496061, "epoch": 2952} {"train_loss": -12.199155807495117, "global_step": 496062, "epoch": 2952} {"train_loss": -11.869836807250977, "global_step": 496063, "epoch": 2952} {"train_loss": -11.638980865478516, "global_step": 496064, "epoch": 2952} {"train_loss": -11.78196907043457, "global_step": 496065, "epoch": 2952} {"train_loss": -11.870234489440918, "global_step": 496066, "epoch": 2952} {"train_loss": -11.24793529510498, "global_step": 496067, "epoch": 2952} {"train_loss": -11.452341079711914, "global_step": 496068, "epoch": 2952} {"train_loss": -12.021122932434082, "global_step": 496069, "epoch": 2952} {"train_loss": -10.926814079284668, "global_step": 496070, "epoch": 2952} {"train_loss": -12.327497482299805, "global_step": 496071, "epoch": 2952} {"train_loss": -11.539796829223633, "global_step": 496072, "epoch": 2952} {"train_loss": -11.689962387084961, "global_step": 496073, "epoch": 2952} {"train_loss": -11.85867691040039, "global_step": 496074, "epoch": 2952} {"train_loss": -11.759223937988281, "global_step": 496075, "epoch": 2952} {"train_loss": -11.37177848815918, "global_step": 496076, "epoch": 2952} {"train_loss": -12.199462890625, "global_step": 496077, "epoch": 2952} {"train_loss": -11.95244026184082, "global_step": 496078, "epoch": 2952} {"train_loss": -11.462503433227539, "global_step": 496079, "epoch": 2952} {"train_loss": -12.194076538085938, "global_step": 496080, "epoch": 2952} {"train_loss": -11.241247177124023, "global_step": 496081, "epoch": 2952} {"train_loss": -11.713251113891602, "global_step": 496082, "epoch": 2952} {"train_loss": -11.30551528930664, "global_step": 496083, "epoch": 2952} {"train_loss": -11.533414840698242, "global_step": 496084, "epoch": 2952} {"train_loss": -10.707799911499023, "global_step": 496085, "epoch": 2952} {"train_loss": -11.488263130187988, "global_step": 496086, "epoch": 2952} {"train_loss": -11.260069847106934, "global_step": 496087, "epoch": 2952} {"train_loss": -11.18973159790039, "global_step": 496088, "epoch": 2952} {"train_loss": -11.697601318359375, "global_step": 496089, "epoch": 2952} {"train_loss": -11.287839889526367, "global_step": 496090, "epoch": 2952} {"train_loss": -11.383880615234375, "global_step": 496091, "epoch": 2952} {"train_loss": -11.701180458068848, "global_step": 496092, "epoch": 2952} {"train_loss": -11.355206489562988, "global_step": 496093, "epoch": 2952} {"train_loss": -11.735139846801758, "global_step": 496094, "epoch": 2952} {"train_loss": -11.701042175292969, "global_step": 496095, "epoch": 2952} {"train_loss": -11.710041999816895, "global_step": 496096, "epoch": 2952} {"train_loss": -11.595969200134277, "global_step": 496097, "epoch": 2952} {"train_loss": -12.059683799743652, "global_step": 496098, "epoch": 2952} {"train_loss": -11.54951286315918, "global_step": 496099, "epoch": 2952} {"train_loss": -11.594853401184082, "global_step": 496100, "epoch": 2952} {"train_loss": -12.029622077941895, "global_step": 496101, "epoch": 2952} {"train_loss": -11.884419441223145, "global_step": 496102, "epoch": 2952} {"train_loss": -12.266832601456414, "global_step": 496103, "epoch": 2952, "val_loss": 323386.875} {"train_loss": -11.82962417602539, "global_step": 496104, "epoch": 2953} {"train_loss": -11.393795013427734, "global_step": 496105, "epoch": 2953} {"train_loss": -12.23779296875, "global_step": 496106, "epoch": 2953} {"train_loss": -12.004199981689453, "global_step": 496107, "epoch": 2953} {"train_loss": -12.148197174072266, "global_step": 496108, "epoch": 2953} {"train_loss": -12.117136001586914, "global_step": 496109, "epoch": 2953} {"train_loss": -11.834383010864258, "global_step": 496110, "epoch": 2953} {"train_loss": -12.245565414428711, "global_step": 496111, "epoch": 2953} {"train_loss": -11.771026611328125, "global_step": 496112, "epoch": 2953} {"train_loss": -12.713294982910156, "global_step": 496113, "epoch": 2953} {"train_loss": -12.084659576416016, "global_step": 496114, "epoch": 2953} {"train_loss": -12.487123489379883, "global_step": 496115, "epoch": 2953} {"train_loss": -12.348512649536133, "global_step": 496116, "epoch": 2953} {"train_loss": -12.060850143432617, "global_step": 496117, "epoch": 2953} {"train_loss": -12.409616470336914, "global_step": 496118, "epoch": 2953} {"train_loss": -12.076093673706055, "global_step": 496119, "epoch": 2953} {"train_loss": -12.350173950195312, "global_step": 496120, "epoch": 2953} {"train_loss": -12.307186126708984, "global_step": 496121, "epoch": 2953} {"train_loss": -12.13537883758545, "global_step": 496122, "epoch": 2953} {"train_loss": -12.047859191894531, "global_step": 496123, "epoch": 2953} {"train_loss": -11.912151336669922, "global_step": 496124, "epoch": 2953} {"train_loss": -12.422351837158203, "global_step": 496125, "epoch": 2953} {"train_loss": -11.606670379638672, "global_step": 496126, "epoch": 2953} {"train_loss": -12.438451766967773, "global_step": 496127, "epoch": 2953} {"train_loss": -11.028039932250977, "global_step": 496128, "epoch": 2953} {"train_loss": -12.33626937866211, "global_step": 496129, "epoch": 2953} {"train_loss": -11.649465560913086, "global_step": 496130, "epoch": 2953} {"train_loss": -11.992708206176758, "global_step": 496131, "epoch": 2953} {"train_loss": -11.904410362243652, "global_step": 496132, "epoch": 2953} {"train_loss": -12.079349517822266, "global_step": 496133, "epoch": 2953} {"train_loss": -11.892618179321289, "global_step": 496134, "epoch": 2953} {"train_loss": -11.868785858154297, "global_step": 496135, "epoch": 2953} {"train_loss": -12.289653778076172, "global_step": 496136, "epoch": 2953} {"train_loss": -12.330334663391113, "global_step": 496137, "epoch": 2953} {"train_loss": -12.534566879272461, "global_step": 496138, "epoch": 2953} {"train_loss": -12.20604133605957, "global_step": 496139, "epoch": 2953} {"train_loss": -12.56865119934082, "global_step": 496140, "epoch": 2953} {"train_loss": -12.334248542785645, "global_step": 496141, "epoch": 2953} {"train_loss": -12.088033676147461, "global_step": 496142, "epoch": 2953} {"train_loss": -12.314626693725586, "global_step": 496143, "epoch": 2953} {"train_loss": -11.792621612548828, "global_step": 496144, "epoch": 2953} {"train_loss": -12.36114501953125, "global_step": 496145, "epoch": 2953} {"train_loss": -11.944915771484375, "global_step": 496146, "epoch": 2953} {"train_loss": -12.583993911743164, "global_step": 496147, "epoch": 2953} {"train_loss": -11.922086715698242, "global_step": 496148, "epoch": 2953} {"train_loss": -12.658071517944336, "global_step": 496149, "epoch": 2953} {"train_loss": -12.42196273803711, "global_step": 496150, "epoch": 2953} {"train_loss": -12.227579116821289, "global_step": 496151, "epoch": 2953} {"train_loss": -12.819299697875977, "global_step": 496152, "epoch": 2953} {"train_loss": -12.520942687988281, "global_step": 496153, "epoch": 2953} {"train_loss": -12.780858993530273, "global_step": 496154, "epoch": 2953} {"train_loss": -12.451557159423828, "global_step": 496155, "epoch": 2953} {"train_loss": -12.733499526977539, "global_step": 496156, "epoch": 2953} {"train_loss": -12.35763931274414, "global_step": 496157, "epoch": 2953} {"train_loss": -12.655617713928223, "global_step": 496158, "epoch": 2953} {"train_loss": -12.240276336669922, "global_step": 496159, "epoch": 2953} {"train_loss": -12.313494682312012, "global_step": 496160, "epoch": 2953} {"train_loss": -12.765203475952148, "global_step": 496161, "epoch": 2953} {"train_loss": -12.162096977233887, "global_step": 496162, "epoch": 2953} {"train_loss": -11.948720932006836, "global_step": 496163, "epoch": 2953} {"train_loss": -12.264698028564453, "global_step": 496164, "epoch": 2953} {"train_loss": -11.747910499572754, "global_step": 496165, "epoch": 2953} {"train_loss": -12.467314720153809, "global_step": 496166, "epoch": 2953} {"train_loss": -12.079753875732422, "global_step": 496167, "epoch": 2953} {"train_loss": -12.675887107849121, "global_step": 496168, "epoch": 2953} {"train_loss": -12.339800834655762, "global_step": 496169, "epoch": 2953} {"train_loss": -12.577049255371094, "global_step": 496170, "epoch": 2953} {"train_loss": -12.268071174621582, "global_step": 496171, "epoch": 2953} {"train_loss": -12.132558822631836, "global_step": 496172, "epoch": 2953} {"train_loss": -12.526205062866211, "global_step": 496173, "epoch": 2953} {"train_loss": -12.254169464111328, "global_step": 496174, "epoch": 2953} {"train_loss": -12.642335891723633, "global_step": 496175, "epoch": 2953} {"train_loss": -12.167213439941406, "global_step": 496176, "epoch": 2953} {"train_loss": -12.303483963012695, "global_step": 496177, "epoch": 2953} {"train_loss": -12.78550910949707, "global_step": 496178, "epoch": 2953} {"train_loss": -12.090017318725586, "global_step": 496179, "epoch": 2953} {"train_loss": -12.465673446655273, "global_step": 496180, "epoch": 2953} {"train_loss": -12.034561157226562, "global_step": 496181, "epoch": 2953} {"train_loss": -11.925854682922363, "global_step": 496182, "epoch": 2953} {"train_loss": -12.415409088134766, "global_step": 496183, "epoch": 2953} {"train_loss": -12.084844589233398, "global_step": 496184, "epoch": 2953} {"train_loss": -12.373215675354004, "global_step": 496185, "epoch": 2953} {"train_loss": -12.238965034484863, "global_step": 496186, "epoch": 2953} {"train_loss": -12.637513160705566, "global_step": 496187, "epoch": 2953} {"train_loss": -11.756851196289062, "global_step": 496188, "epoch": 2953} {"train_loss": -12.620044708251953, "global_step": 496189, "epoch": 2953} {"train_loss": -12.284069061279297, "global_step": 496190, "epoch": 2953} {"train_loss": -12.332853317260742, "global_step": 496191, "epoch": 2953} {"train_loss": -12.486282348632812, "global_step": 496192, "epoch": 2953} {"train_loss": -12.246915817260742, "global_step": 496193, "epoch": 2953} {"train_loss": -12.7634916305542, "global_step": 496194, "epoch": 2953} {"train_loss": -12.207075119018555, "global_step": 496195, "epoch": 2953} {"train_loss": -12.655327796936035, "global_step": 496196, "epoch": 2953} {"train_loss": -12.102575302124023, "global_step": 496197, "epoch": 2953} {"train_loss": -12.29466724395752, "global_step": 496198, "epoch": 2953} {"train_loss": -12.402313232421875, "global_step": 496199, "epoch": 2953} {"train_loss": -12.118659973144531, "global_step": 496200, "epoch": 2953} {"train_loss": -11.620782852172852, "global_step": 496201, "epoch": 2953} {"train_loss": -12.033979415893555, "global_step": 496202, "epoch": 2953} {"train_loss": -12.315759658813477, "global_step": 496203, "epoch": 2953} {"train_loss": -11.669102668762207, "global_step": 496204, "epoch": 2953} {"train_loss": -12.46731185913086, "global_step": 496205, "epoch": 2953} {"train_loss": -12.130290031433105, "global_step": 496206, "epoch": 2953} {"train_loss": -12.135625839233398, "global_step": 496207, "epoch": 2953} {"train_loss": -12.670241355895996, "global_step": 496208, "epoch": 2953} {"train_loss": -11.974849700927734, "global_step": 496209, "epoch": 2953} {"train_loss": -12.31283950805664, "global_step": 496210, "epoch": 2953} {"train_loss": -11.783363342285156, "global_step": 496211, "epoch": 2953} {"train_loss": -11.950820922851562, "global_step": 496212, "epoch": 2953} {"train_loss": -12.117509841918945, "global_step": 496213, "epoch": 2953} {"train_loss": -12.271204948425293, "global_step": 496214, "epoch": 2953} {"train_loss": -12.292142868041992, "global_step": 496215, "epoch": 2953} {"train_loss": -12.045312881469727, "global_step": 496216, "epoch": 2953} {"train_loss": -12.102861404418945, "global_step": 496217, "epoch": 2953} {"train_loss": -11.830068588256836, "global_step": 496218, "epoch": 2953} {"train_loss": -12.794116973876953, "global_step": 496219, "epoch": 2953} {"train_loss": -11.715438842773438, "global_step": 496220, "epoch": 2953} {"train_loss": -12.491925239562988, "global_step": 496221, "epoch": 2953} {"train_loss": -12.245526313781738, "global_step": 496222, "epoch": 2953} {"train_loss": -12.038697242736816, "global_step": 496223, "epoch": 2953} {"train_loss": -12.365617752075195, "global_step": 496224, "epoch": 2953} {"train_loss": -12.48482894897461, "global_step": 496225, "epoch": 2953} {"train_loss": -11.829345703125, "global_step": 496226, "epoch": 2953} {"train_loss": -12.233003616333008, "global_step": 496227, "epoch": 2953} {"train_loss": -12.498424530029297, "global_step": 496228, "epoch": 2953} {"train_loss": -11.953550338745117, "global_step": 496229, "epoch": 2953} {"train_loss": -11.987512588500977, "global_step": 496230, "epoch": 2953} {"train_loss": -12.467141151428223, "global_step": 496231, "epoch": 2953} {"train_loss": -11.862652778625488, "global_step": 496232, "epoch": 2953} {"train_loss": -11.91041374206543, "global_step": 496233, "epoch": 2953} {"train_loss": -12.671926498413086, "global_step": 496234, "epoch": 2953} {"train_loss": -11.732352256774902, "global_step": 496235, "epoch": 2953} {"train_loss": -12.060857772827148, "global_step": 496236, "epoch": 2953} {"train_loss": -12.322494506835938, "global_step": 496237, "epoch": 2953} {"train_loss": -11.50394058227539, "global_step": 496238, "epoch": 2953} {"train_loss": -12.460390090942383, "global_step": 496239, "epoch": 2953} {"train_loss": -12.145761489868164, "global_step": 496240, "epoch": 2953} {"train_loss": -11.900390625, "global_step": 496241, "epoch": 2953} {"train_loss": -12.465718269348145, "global_step": 496242, "epoch": 2953} {"train_loss": -11.942609786987305, "global_step": 496243, "epoch": 2953} {"train_loss": -11.778188705444336, "global_step": 496244, "epoch": 2953} {"train_loss": -12.679033279418945, "global_step": 496245, "epoch": 2953} {"train_loss": -11.971996307373047, "global_step": 496246, "epoch": 2953} {"train_loss": -11.858277320861816, "global_step": 496247, "epoch": 2953} {"train_loss": -12.096866607666016, "global_step": 496248, "epoch": 2953} {"train_loss": -12.021175384521484, "global_step": 496249, "epoch": 2953} {"train_loss": -11.48666763305664, "global_step": 496250, "epoch": 2953} {"train_loss": -12.175070762634277, "global_step": 496251, "epoch": 2953} {"train_loss": -11.279203414916992, "global_step": 496252, "epoch": 2953} {"train_loss": -12.556143760681152, "global_step": 496253, "epoch": 2953} {"train_loss": -10.949769973754883, "global_step": 496254, "epoch": 2953} {"train_loss": -12.59719181060791, "global_step": 496255, "epoch": 2953} {"train_loss": -11.87489128112793, "global_step": 496256, "epoch": 2953} {"train_loss": -12.10240364074707, "global_step": 496257, "epoch": 2953} {"train_loss": -12.140873908996582, "global_step": 496258, "epoch": 2953} {"train_loss": -12.354544639587402, "global_step": 496259, "epoch": 2953} {"train_loss": -12.229105949401855, "global_step": 496260, "epoch": 2953} {"train_loss": -12.509944915771484, "global_step": 496261, "epoch": 2953} {"train_loss": -11.770400047302246, "global_step": 496262, "epoch": 2953} {"train_loss": -12.435873031616211, "global_step": 496263, "epoch": 2953} {"train_loss": -12.147945404052734, "global_step": 496264, "epoch": 2953} {"train_loss": -12.502778053283691, "global_step": 496265, "epoch": 2953} {"train_loss": -12.373336791992188, "global_step": 496266, "epoch": 2953} {"train_loss": -11.946698188781738, "global_step": 496267, "epoch": 2953} {"train_loss": -12.101861953735352, "global_step": 496268, "epoch": 2953} {"train_loss": -12.148635864257812, "global_step": 496269, "epoch": 2953} {"train_loss": -12.575090408325195, "global_step": 496270, "epoch": 2953} {"train_loss": -12.195035599526905, "global_step": 496271, "epoch": 2953, "val_loss": 317131.96875} {"train_loss": -12.520111083984375, "global_step": 496272, "epoch": 2954} {"train_loss": -12.196388244628906, "global_step": 496273, "epoch": 2954} {"train_loss": -12.77658748626709, "global_step": 496274, "epoch": 2954} {"train_loss": -12.433835983276367, "global_step": 496275, "epoch": 2954} {"train_loss": -12.62913703918457, "global_step": 496276, "epoch": 2954} {"train_loss": -12.544321060180664, "global_step": 496277, "epoch": 2954} {"train_loss": -12.733953475952148, "global_step": 496278, "epoch": 2954} {"train_loss": -12.520742416381836, "global_step": 496279, "epoch": 2954} {"train_loss": -12.612504959106445, "global_step": 496280, "epoch": 2954} {"train_loss": -12.661491394042969, "global_step": 496281, "epoch": 2954} {"train_loss": -12.461605072021484, "global_step": 496282, "epoch": 2954} {"train_loss": -12.663290977478027, "global_step": 496283, "epoch": 2954} {"train_loss": -12.656435012817383, "global_step": 496284, "epoch": 2954} {"train_loss": -12.178140640258789, "global_step": 496285, "epoch": 2954} {"train_loss": -12.446602821350098, "global_step": 496286, "epoch": 2954} {"train_loss": -12.77728271484375, "global_step": 496287, "epoch": 2954} {"train_loss": -12.599327087402344, "global_step": 496288, "epoch": 2954} {"train_loss": -12.735877990722656, "global_step": 496289, "epoch": 2954} {"train_loss": -12.855106353759766, "global_step": 496290, "epoch": 2954} {"train_loss": -12.136260986328125, "global_step": 496291, "epoch": 2954} {"train_loss": -12.55259895324707, "global_step": 496292, "epoch": 2954} {"train_loss": -12.479631423950195, "global_step": 496293, "epoch": 2954} {"train_loss": -12.25200080871582, "global_step": 496294, "epoch": 2954} {"train_loss": -12.5701904296875, "global_step": 496295, "epoch": 2954} {"train_loss": -12.69300365447998, "global_step": 496296, "epoch": 2954} {"train_loss": -12.807765007019043, "global_step": 496297, "epoch": 2954} {"train_loss": -12.712218284606934, "global_step": 496298, "epoch": 2954} {"train_loss": -12.476557731628418, "global_step": 496299, "epoch": 2954} {"train_loss": -12.695473670959473, "global_step": 496300, "epoch": 2954} {"train_loss": -12.551748275756836, "global_step": 496301, "epoch": 2954} {"train_loss": -12.540104866027832, "global_step": 496302, "epoch": 2954} {"train_loss": -12.512727737426758, "global_step": 496303, "epoch": 2954} {"train_loss": -12.449966430664062, "global_step": 496304, "epoch": 2954} {"train_loss": -12.587398529052734, "global_step": 496305, "epoch": 2954} {"train_loss": -12.649506568908691, "global_step": 496306, "epoch": 2954} {"train_loss": -12.718064308166504, "global_step": 496307, "epoch": 2954} {"train_loss": -12.657958984375, "global_step": 496308, "epoch": 2954} {"train_loss": -12.955392837524414, "global_step": 496309, "epoch": 2954} {"train_loss": -12.626896858215332, "global_step": 496310, "epoch": 2954} {"train_loss": -12.701921463012695, "global_step": 496311, "epoch": 2954} {"train_loss": -12.28091049194336, "global_step": 496312, "epoch": 2954} {"train_loss": -11.679424285888672, "global_step": 496313, "epoch": 2954} {"train_loss": -11.666646957397461, "global_step": 496314, "epoch": 2954} {"train_loss": -12.476655960083008, "global_step": 496315, "epoch": 2954} {"train_loss": -11.646768569946289, "global_step": 496316, "epoch": 2954} {"train_loss": -11.99073600769043, "global_step": 496317, "epoch": 2954} {"train_loss": -12.401788711547852, "global_step": 496318, "epoch": 2954} {"train_loss": -11.461877822875977, "global_step": 496319, "epoch": 2954} {"train_loss": -11.07056999206543, "global_step": 496320, "epoch": 2954} {"train_loss": -11.95501708984375, "global_step": 496321, "epoch": 2954} {"train_loss": -11.720559120178223, "global_step": 496322, "epoch": 2954} {"train_loss": -11.271953582763672, "global_step": 496323, "epoch": 2954} {"train_loss": -12.362588882446289, "global_step": 496324, "epoch": 2954} {"train_loss": -11.473003387451172, "global_step": 496325, "epoch": 2954} {"train_loss": -11.963354110717773, "global_step": 496326, "epoch": 2954} {"train_loss": -12.38963508605957, "global_step": 496327, "epoch": 2954} {"train_loss": -11.955583572387695, "global_step": 496328, "epoch": 2954} {"train_loss": -12.376296043395996, "global_step": 496329, "epoch": 2954} {"train_loss": -12.298334121704102, "global_step": 496330, "epoch": 2954} {"train_loss": -12.568832397460938, "global_step": 496331, "epoch": 2954} {"train_loss": -12.06847095489502, "global_step": 496332, "epoch": 2954} {"train_loss": -12.659514427185059, "global_step": 496333, "epoch": 2954} {"train_loss": -12.515996932983398, "global_step": 496334, "epoch": 2954} {"train_loss": -12.418821334838867, "global_step": 496335, "epoch": 2954} {"train_loss": -12.4777250289917, "global_step": 496336, "epoch": 2954} {"train_loss": -12.630945205688477, "global_step": 496337, "epoch": 2954} {"train_loss": -12.45565414428711, "global_step": 496338, "epoch": 2954} {"train_loss": -12.683345794677734, "global_step": 496339, "epoch": 2954} {"train_loss": -12.682987213134766, "global_step": 496340, "epoch": 2954} {"train_loss": -12.528997421264648, "global_step": 496341, "epoch": 2954} {"train_loss": -12.371898651123047, "global_step": 496342, "epoch": 2954} {"train_loss": -12.501357078552246, "global_step": 496343, "epoch": 2954} {"train_loss": -12.512678146362305, "global_step": 496344, "epoch": 2954} {"train_loss": -12.585977554321289, "global_step": 496345, "epoch": 2954} {"train_loss": -12.780820846557617, "global_step": 496346, "epoch": 2954} {"train_loss": -12.74172592163086, "global_step": 496347, "epoch": 2954} {"train_loss": -12.719294548034668, "global_step": 496348, "epoch": 2954} {"train_loss": -12.746021270751953, "global_step": 496349, "epoch": 2954} {"train_loss": -12.723169326782227, "global_step": 496350, "epoch": 2954} {"train_loss": -12.546565055847168, "global_step": 496351, "epoch": 2954} {"train_loss": -12.86942195892334, "global_step": 496352, "epoch": 2954} {"train_loss": -12.710890769958496, "global_step": 496353, "epoch": 2954} {"train_loss": -12.566038131713867, "global_step": 496354, "epoch": 2954} {"train_loss": -12.684024810791016, "global_step": 496355, "epoch": 2954} {"train_loss": -12.660501480102539, "global_step": 496356, "epoch": 2954} {"train_loss": -12.33415412902832, "global_step": 496357, "epoch": 2954} {"train_loss": -12.769671440124512, "global_step": 496358, "epoch": 2954} {"train_loss": -12.45846176147461, "global_step": 496359, "epoch": 2954} {"train_loss": -12.10678482055664, "global_step": 496360, "epoch": 2954} {"train_loss": -12.927032470703125, "global_step": 496361, "epoch": 2954} {"train_loss": -12.317350387573242, "global_step": 496362, "epoch": 2954} {"train_loss": -12.986754417419434, "global_step": 496363, "epoch": 2954} {"train_loss": -12.613624572753906, "global_step": 496364, "epoch": 2954} {"train_loss": -11.846978187561035, "global_step": 496365, "epoch": 2954} {"train_loss": -12.45283317565918, "global_step": 496366, "epoch": 2954} {"train_loss": -12.212185859680176, "global_step": 496367, "epoch": 2954} {"train_loss": -11.55196762084961, "global_step": 496368, "epoch": 2954} {"train_loss": -12.17711067199707, "global_step": 496369, "epoch": 2954} {"train_loss": -11.925785064697266, "global_step": 496370, "epoch": 2954} {"train_loss": -12.482141494750977, "global_step": 496371, "epoch": 2954} {"train_loss": -12.43331527709961, "global_step": 496372, "epoch": 2954} {"train_loss": -11.859119415283203, "global_step": 496373, "epoch": 2954} {"train_loss": -12.209420204162598, "global_step": 496374, "epoch": 2954} {"train_loss": -12.226001739501953, "global_step": 496375, "epoch": 2954} {"train_loss": -12.753120422363281, "global_step": 496376, "epoch": 2954} {"train_loss": -11.507705688476562, "global_step": 496377, "epoch": 2954} {"train_loss": -11.937173843383789, "global_step": 496378, "epoch": 2954} {"train_loss": -11.994695663452148, "global_step": 496379, "epoch": 2954} {"train_loss": -12.57038688659668, "global_step": 496380, "epoch": 2954} {"train_loss": -12.542673110961914, "global_step": 496381, "epoch": 2954} {"train_loss": -12.444948196411133, "global_step": 496382, "epoch": 2954} {"train_loss": -12.033645629882812, "global_step": 496383, "epoch": 2954} {"train_loss": -12.376546859741211, "global_step": 496384, "epoch": 2954} {"train_loss": -11.650135040283203, "global_step": 496385, "epoch": 2954} {"train_loss": -11.83237361907959, "global_step": 496386, "epoch": 2954} {"train_loss": -12.704689025878906, "global_step": 496387, "epoch": 2954} {"train_loss": -11.483373641967773, "global_step": 496388, "epoch": 2954} {"train_loss": -12.659578323364258, "global_step": 496389, "epoch": 2954} {"train_loss": -11.317376136779785, "global_step": 496390, "epoch": 2954} {"train_loss": -11.668785095214844, "global_step": 496391, "epoch": 2954} {"train_loss": -12.088884353637695, "global_step": 496392, "epoch": 2954} {"train_loss": -10.538503646850586, "global_step": 496393, "epoch": 2954} {"train_loss": -11.733514785766602, "global_step": 496394, "epoch": 2954} {"train_loss": -12.176423072814941, "global_step": 496395, "epoch": 2954} {"train_loss": -11.161638259887695, "global_step": 496396, "epoch": 2954} {"train_loss": -11.914454460144043, "global_step": 496397, "epoch": 2954} {"train_loss": -12.125421524047852, "global_step": 496398, "epoch": 2954} {"train_loss": -11.315654754638672, "global_step": 496399, "epoch": 2954} {"train_loss": -10.910167694091797, "global_step": 496400, "epoch": 2954} {"train_loss": -11.166221618652344, "global_step": 496401, "epoch": 2954} {"train_loss": -10.554569244384766, "global_step": 496402, "epoch": 2954} {"train_loss": -9.799844741821289, "global_step": 496403, "epoch": 2954} {"train_loss": -10.84749984741211, "global_step": 496404, "epoch": 2954} {"train_loss": -11.311037063598633, "global_step": 496405, "epoch": 2954} {"train_loss": -10.678590774536133, "global_step": 496406, "epoch": 2954} {"train_loss": -10.18911361694336, "global_step": 496407, "epoch": 2954} {"train_loss": -10.047472953796387, "global_step": 496408, "epoch": 2954} {"train_loss": -11.490604400634766, "global_step": 496409, "epoch": 2954} {"train_loss": -11.260819435119629, "global_step": 496410, "epoch": 2954} {"train_loss": -10.829262733459473, "global_step": 496411, "epoch": 2954} {"train_loss": -10.253803253173828, "global_step": 496412, "epoch": 2954} {"train_loss": -9.816033363342285, "global_step": 496413, "epoch": 2954} {"train_loss": -10.302407264709473, "global_step": 496414, "epoch": 2954} {"train_loss": -10.794591903686523, "global_step": 496415, "epoch": 2954} {"train_loss": -9.103026390075684, "global_step": 496416, "epoch": 2954} {"train_loss": -10.642745018005371, "global_step": 496417, "epoch": 2954} {"train_loss": -10.882776260375977, "global_step": 496418, "epoch": 2954} {"train_loss": -10.89628791809082, "global_step": 496419, "epoch": 2954} {"train_loss": -11.253408432006836, "global_step": 496420, "epoch": 2954} {"train_loss": -10.769153594970703, "global_step": 496421, "epoch": 2954} {"train_loss": -11.367984771728516, "global_step": 496422, "epoch": 2954} {"train_loss": -11.621906280517578, "global_step": 496423, "epoch": 2954} {"train_loss": -11.560016632080078, "global_step": 496424, "epoch": 2954} {"train_loss": -11.790489196777344, "global_step": 496425, "epoch": 2954} {"train_loss": -11.236571311950684, "global_step": 496426, "epoch": 2954} {"train_loss": -11.89013957977295, "global_step": 496427, "epoch": 2954} {"train_loss": -11.724069595336914, "global_step": 496428, "epoch": 2954} {"train_loss": -11.890143394470215, "global_step": 496429, "epoch": 2954} {"train_loss": -12.046810150146484, "global_step": 496430, "epoch": 2954} {"train_loss": -11.674077033996582, "global_step": 496431, "epoch": 2954} {"train_loss": -11.6360445022583, "global_step": 496432, "epoch": 2954} {"train_loss": -11.707154273986816, "global_step": 496433, "epoch": 2954} {"train_loss": -12.44630241394043, "global_step": 496434, "epoch": 2954} {"train_loss": -11.645956039428711, "global_step": 496435, "epoch": 2954} {"train_loss": -12.408876419067383, "global_step": 496436, "epoch": 2954} {"train_loss": -11.630596160888672, "global_step": 496437, "epoch": 2954} {"train_loss": -12.022005081176758, "global_step": 496438, "epoch": 2954} {"train_loss": -12.044748096239, "global_step": 496439, "epoch": 2954, "val_loss": 317682.46875} {"train_loss": -11.929272651672363, "global_step": 496440, "epoch": 2955} {"train_loss": -12.103303909301758, "global_step": 496441, "epoch": 2955} {"train_loss": -11.83558464050293, "global_step": 496442, "epoch": 2955} {"train_loss": -12.381322860717773, "global_step": 496443, "epoch": 2955} {"train_loss": -12.309330940246582, "global_step": 496444, "epoch": 2955} {"train_loss": -12.153047561645508, "global_step": 496445, "epoch": 2955} {"train_loss": -12.219019889831543, "global_step": 496446, "epoch": 2955} {"train_loss": -12.370798110961914, "global_step": 496447, "epoch": 2955} {"train_loss": -12.151894569396973, "global_step": 496448, "epoch": 2955} {"train_loss": -12.3521728515625, "global_step": 496449, "epoch": 2955} {"train_loss": -12.069852828979492, "global_step": 496450, "epoch": 2955} {"train_loss": -12.455257415771484, "global_step": 496451, "epoch": 2955} {"train_loss": -11.985715866088867, "global_step": 496452, "epoch": 2955} {"train_loss": -12.490676879882812, "global_step": 496453, "epoch": 2955} {"train_loss": -12.267353057861328, "global_step": 496454, "epoch": 2955} {"train_loss": -12.226961135864258, "global_step": 496455, "epoch": 2955} {"train_loss": -12.5433349609375, "global_step": 496456, "epoch": 2955} {"train_loss": -12.528583526611328, "global_step": 496457, "epoch": 2955} {"train_loss": -12.603076934814453, "global_step": 496458, "epoch": 2955} {"train_loss": -12.685956954956055, "global_step": 496459, "epoch": 2955} {"train_loss": -12.283018112182617, "global_step": 496460, "epoch": 2955} {"train_loss": -12.595952987670898, "global_step": 496461, "epoch": 2955} {"train_loss": -12.271745681762695, "global_step": 496462, "epoch": 2955} {"train_loss": -12.612641334533691, "global_step": 496463, "epoch": 2955} {"train_loss": -12.437339782714844, "global_step": 496464, "epoch": 2955} {"train_loss": -12.585437774658203, "global_step": 496465, "epoch": 2955} {"train_loss": -12.557101249694824, "global_step": 496466, "epoch": 2955} {"train_loss": -12.520277976989746, "global_step": 496467, "epoch": 2955} {"train_loss": -12.757563591003418, "global_step": 496468, "epoch": 2955} {"train_loss": -12.413463592529297, "global_step": 496469, "epoch": 2955} {"train_loss": -12.822612762451172, "global_step": 496470, "epoch": 2955} {"train_loss": -12.490931510925293, "global_step": 496471, "epoch": 2955} {"train_loss": -12.568986892700195, "global_step": 496472, "epoch": 2955} {"train_loss": -12.663490295410156, "global_step": 496473, "epoch": 2955} {"train_loss": -12.619680404663086, "global_step": 496474, "epoch": 2955} {"train_loss": -12.724493026733398, "global_step": 496475, "epoch": 2955} {"train_loss": -12.720932006835938, "global_step": 496476, "epoch": 2955} {"train_loss": -12.780139923095703, "global_step": 496477, "epoch": 2955} {"train_loss": -12.550376892089844, "global_step": 496478, "epoch": 2955} {"train_loss": -12.87358283996582, "global_step": 496479, "epoch": 2955} {"train_loss": -12.605602264404297, "global_step": 496480, "epoch": 2955} {"train_loss": -12.655648231506348, "global_step": 496481, "epoch": 2955} {"train_loss": -12.815061569213867, "global_step": 496482, "epoch": 2955} {"train_loss": -12.777396202087402, "global_step": 496483, "epoch": 2955} {"train_loss": -12.763076782226562, "global_step": 496484, "epoch": 2955} {"train_loss": -12.723220825195312, "global_step": 496485, "epoch": 2955} {"train_loss": -12.736778259277344, "global_step": 496486, "epoch": 2955} {"train_loss": -12.868152618408203, "global_step": 496487, "epoch": 2955} {"train_loss": -12.94271183013916, "global_step": 496488, "epoch": 2955} {"train_loss": -12.527910232543945, "global_step": 496489, "epoch": 2955} {"train_loss": -12.732335090637207, "global_step": 496490, "epoch": 2955} {"train_loss": -12.534631729125977, "global_step": 496491, "epoch": 2955} {"train_loss": -12.700714111328125, "global_step": 496492, "epoch": 2955} {"train_loss": -12.79277229309082, "global_step": 496493, "epoch": 2955} {"train_loss": -12.702655792236328, "global_step": 496494, "epoch": 2955} {"train_loss": -12.910901069641113, "global_step": 496495, "epoch": 2955} {"train_loss": -12.808704376220703, "global_step": 496496, "epoch": 2955} {"train_loss": -12.718938827514648, "global_step": 496497, "epoch": 2955} {"train_loss": -12.891048431396484, "global_step": 496498, "epoch": 2955} {"train_loss": -12.719039916992188, "global_step": 496499, "epoch": 2955} {"train_loss": -12.745630264282227, "global_step": 496500, "epoch": 2955} {"train_loss": -11.727072715759277, "global_step": 496501, "epoch": 2955} {"train_loss": -12.798005104064941, "global_step": 496502, "epoch": 2955} {"train_loss": -12.235755920410156, "global_step": 496503, "epoch": 2955} {"train_loss": -12.307796478271484, "global_step": 496504, "epoch": 2955} {"train_loss": -12.40481948852539, "global_step": 496505, "epoch": 2955} {"train_loss": -11.920417785644531, "global_step": 496506, "epoch": 2955} {"train_loss": -12.50851058959961, "global_step": 496507, "epoch": 2955} {"train_loss": -11.487892150878906, "global_step": 496508, "epoch": 2955} {"train_loss": -11.413751602172852, "global_step": 496509, "epoch": 2955} {"train_loss": -12.252577781677246, "global_step": 496510, "epoch": 2955} {"train_loss": -11.284689903259277, "global_step": 496511, "epoch": 2955} {"train_loss": -12.117765426635742, "global_step": 496512, "epoch": 2955} {"train_loss": -10.92399787902832, "global_step": 496513, "epoch": 2955} {"train_loss": -12.324760437011719, "global_step": 496514, "epoch": 2955} {"train_loss": -11.592292785644531, "global_step": 496515, "epoch": 2955} {"train_loss": -11.952033996582031, "global_step": 496516, "epoch": 2955} {"train_loss": -11.992690086364746, "global_step": 496517, "epoch": 2955} {"train_loss": -11.545737266540527, "global_step": 496518, "epoch": 2955} {"train_loss": -12.064109802246094, "global_step": 496519, "epoch": 2955} {"train_loss": -11.484384536743164, "global_step": 496520, "epoch": 2955} {"train_loss": -12.450653076171875, "global_step": 496521, "epoch": 2955} {"train_loss": -11.281490325927734, "global_step": 496522, "epoch": 2955} {"train_loss": -12.493922233581543, "global_step": 496523, "epoch": 2955} {"train_loss": -11.481390953063965, "global_step": 496524, "epoch": 2955} {"train_loss": -11.375900268554688, "global_step": 496525, "epoch": 2955} {"train_loss": -12.007560729980469, "global_step": 496526, "epoch": 2955} {"train_loss": -11.515687942504883, "global_step": 496527, "epoch": 2955} {"train_loss": -11.26093578338623, "global_step": 496528, "epoch": 2955} {"train_loss": -12.034530639648438, "global_step": 496529, "epoch": 2955} {"train_loss": -11.054815292358398, "global_step": 496530, "epoch": 2955} {"train_loss": -12.379522323608398, "global_step": 496531, "epoch": 2955} {"train_loss": -11.80856990814209, "global_step": 496532, "epoch": 2955} {"train_loss": -11.730850219726562, "global_step": 496533, "epoch": 2955} {"train_loss": -12.18520736694336, "global_step": 496534, "epoch": 2955} {"train_loss": -11.425820350646973, "global_step": 496535, "epoch": 2955} {"train_loss": -12.38913345336914, "global_step": 496536, "epoch": 2955} {"train_loss": -11.681296348571777, "global_step": 496537, "epoch": 2955} {"train_loss": -12.203664779663086, "global_step": 496538, "epoch": 2955} {"train_loss": -12.509846687316895, "global_step": 496539, "epoch": 2955} {"train_loss": -12.011188507080078, "global_step": 496540, "epoch": 2955} {"train_loss": -12.417438507080078, "global_step": 496541, "epoch": 2955} {"train_loss": -12.356664657592773, "global_step": 496542, "epoch": 2955} {"train_loss": -12.30404281616211, "global_step": 496543, "epoch": 2955} {"train_loss": -12.305730819702148, "global_step": 496544, "epoch": 2955} {"train_loss": -12.338438987731934, "global_step": 496545, "epoch": 2955} {"train_loss": -12.552168846130371, "global_step": 496546, "epoch": 2955} {"train_loss": -12.490955352783203, "global_step": 496547, "epoch": 2955} {"train_loss": -12.696327209472656, "global_step": 496548, "epoch": 2955} {"train_loss": -12.558263778686523, "global_step": 496549, "epoch": 2955} {"train_loss": -12.680060386657715, "global_step": 496550, "epoch": 2955} {"train_loss": -12.513906478881836, "global_step": 496551, "epoch": 2955} {"train_loss": -12.677240371704102, "global_step": 496552, "epoch": 2955} {"train_loss": -12.336058616638184, "global_step": 496553, "epoch": 2955} {"train_loss": -12.796481132507324, "global_step": 496554, "epoch": 2955} {"train_loss": -12.921531677246094, "global_step": 496555, "epoch": 2955} {"train_loss": -12.674266815185547, "global_step": 496556, "epoch": 2955} {"train_loss": -12.931877136230469, "global_step": 496557, "epoch": 2955} {"train_loss": -12.818693161010742, "global_step": 496558, "epoch": 2955} {"train_loss": -12.718181610107422, "global_step": 496559, "epoch": 2955} {"train_loss": -12.794657707214355, "global_step": 496560, "epoch": 2955} {"train_loss": -12.822649002075195, "global_step": 496561, "epoch": 2955} {"train_loss": -12.868650436401367, "global_step": 496562, "epoch": 2955} {"train_loss": -12.690749168395996, "global_step": 496563, "epoch": 2955} {"train_loss": -12.877073287963867, "global_step": 496564, "epoch": 2955} {"train_loss": -12.705451011657715, "global_step": 496565, "epoch": 2955} {"train_loss": -12.885544776916504, "global_step": 496566, "epoch": 2955} {"train_loss": -12.996590614318848, "global_step": 496567, "epoch": 2955} {"train_loss": -12.762304306030273, "global_step": 496568, "epoch": 2955} {"train_loss": -12.938909530639648, "global_step": 496569, "epoch": 2955} {"train_loss": -12.746612548828125, "global_step": 496570, "epoch": 2955} {"train_loss": -12.359410285949707, "global_step": 496571, "epoch": 2955} {"train_loss": -12.77347469329834, "global_step": 496572, "epoch": 2955} {"train_loss": -12.869434356689453, "global_step": 496573, "epoch": 2955} {"train_loss": -12.73013973236084, "global_step": 496574, "epoch": 2955} {"train_loss": -13.073330879211426, "global_step": 496575, "epoch": 2955} {"train_loss": -12.759025573730469, "global_step": 496576, "epoch": 2955} {"train_loss": -12.76864242553711, "global_step": 496577, "epoch": 2955} {"train_loss": -12.793851852416992, "global_step": 496578, "epoch": 2955} {"train_loss": -12.55603313446045, "global_step": 496579, "epoch": 2955} {"train_loss": -12.972309112548828, "global_step": 496580, "epoch": 2955} {"train_loss": -13.050573348999023, "global_step": 496581, "epoch": 2955} {"train_loss": -12.643867492675781, "global_step": 496582, "epoch": 2955} {"train_loss": -12.925387382507324, "global_step": 496583, "epoch": 2955} {"train_loss": -12.957910537719727, "global_step": 496584, "epoch": 2955} {"train_loss": -13.048873901367188, "global_step": 496585, "epoch": 2955} {"train_loss": -12.666280746459961, "global_step": 496586, "epoch": 2955} {"train_loss": -13.11043930053711, "global_step": 496587, "epoch": 2955} {"train_loss": -12.872568130493164, "global_step": 496588, "epoch": 2955} {"train_loss": -12.825553894042969, "global_step": 496589, "epoch": 2955} {"train_loss": -12.92894172668457, "global_step": 496590, "epoch": 2955} {"train_loss": -12.759779930114746, "global_step": 496591, "epoch": 2955} {"train_loss": -12.836780548095703, "global_step": 496592, "epoch": 2955} {"train_loss": -12.947088241577148, "global_step": 496593, "epoch": 2955} {"train_loss": -13.070573806762695, "global_step": 496594, "epoch": 2955} {"train_loss": -12.742411613464355, "global_step": 496595, "epoch": 2955} {"train_loss": -11.613414764404297, "global_step": 496596, "epoch": 2955} {"train_loss": -10.401124954223633, "global_step": 496597, "epoch": 2955} {"train_loss": -12.663839340209961, "global_step": 496598, "epoch": 2955} {"train_loss": -12.144006729125977, "global_step": 496599, "epoch": 2955} {"train_loss": -12.422245025634766, "global_step": 496600, "epoch": 2955} {"train_loss": -11.948685646057129, "global_step": 496601, "epoch": 2955} {"train_loss": -12.435720443725586, "global_step": 496602, "epoch": 2955} {"train_loss": -12.357996940612793, "global_step": 496603, "epoch": 2955} {"train_loss": -12.507492065429688, "global_step": 496604, "epoch": 2955} {"train_loss": -12.219863891601562, "global_step": 496605, "epoch": 2955} {"train_loss": -12.143555641174316, "global_step": 496606, "epoch": 2955} {"train_loss": -12.42562056723095, "global_step": 496607, "epoch": 2955, "val_loss": 321037.34375, "train_action_mse_error": 1.2615636587142944} {"train_loss": -11.677556991577148, "global_step": 496608, "epoch": 2956} {"train_loss": -12.294840812683105, "global_step": 496609, "epoch": 2956} {"train_loss": -12.51427173614502, "global_step": 496610, "epoch": 2956} {"train_loss": -12.758956909179688, "global_step": 496611, "epoch": 2956} {"train_loss": -12.306478500366211, "global_step": 496612, "epoch": 2956} {"train_loss": -12.50289535522461, "global_step": 496613, "epoch": 2956} {"train_loss": -12.156013488769531, "global_step": 496614, "epoch": 2956} {"train_loss": -12.33515453338623, "global_step": 496615, "epoch": 2956} {"train_loss": -12.262081146240234, "global_step": 496616, "epoch": 2956} {"train_loss": -12.55761432647705, "global_step": 496617, "epoch": 2956} {"train_loss": -10.514364242553711, "global_step": 496618, "epoch": 2956} {"train_loss": -10.554156303405762, "global_step": 496619, "epoch": 2956} {"train_loss": -11.321733474731445, "global_step": 496620, "epoch": 2956} {"train_loss": -9.986719131469727, "global_step": 496621, "epoch": 2956} {"train_loss": -12.159076690673828, "global_step": 496622, "epoch": 2956} {"train_loss": -10.287363052368164, "global_step": 496623, "epoch": 2956} {"train_loss": -10.645186424255371, "global_step": 496624, "epoch": 2956} {"train_loss": -10.397820472717285, "global_step": 496625, "epoch": 2956} {"train_loss": -11.120805740356445, "global_step": 496626, "epoch": 2956} {"train_loss": -11.740686416625977, "global_step": 496627, "epoch": 2956} {"train_loss": -10.67481803894043, "global_step": 496628, "epoch": 2956} {"train_loss": -11.634967803955078, "global_step": 496629, "epoch": 2956} {"train_loss": -10.065113067626953, "global_step": 496630, "epoch": 2956} {"train_loss": -10.12991714477539, "global_step": 496631, "epoch": 2956} {"train_loss": -9.016595840454102, "global_step": 496632, "epoch": 2956} {"train_loss": -10.423408508300781, "global_step": 496633, "epoch": 2956} {"train_loss": -11.911498069763184, "global_step": 496634, "epoch": 2956} {"train_loss": -10.425323486328125, "global_step": 496635, "epoch": 2956} {"train_loss": -11.419272422790527, "global_step": 496636, "epoch": 2956} {"train_loss": -11.135856628417969, "global_step": 496637, "epoch": 2956} {"train_loss": -10.534838676452637, "global_step": 496638, "epoch": 2956} {"train_loss": -10.125045776367188, "global_step": 496639, "epoch": 2956} {"train_loss": -10.84126091003418, "global_step": 496640, "epoch": 2956} {"train_loss": -11.267271041870117, "global_step": 496641, "epoch": 2956} {"train_loss": -10.741131782531738, "global_step": 496642, "epoch": 2956} {"train_loss": -10.618887901306152, "global_step": 496643, "epoch": 2956} {"train_loss": -11.267180442810059, "global_step": 496644, "epoch": 2956} {"train_loss": -11.318228721618652, "global_step": 496645, "epoch": 2956} {"train_loss": -11.724953651428223, "global_step": 496646, "epoch": 2956} {"train_loss": -10.666145324707031, "global_step": 496647, "epoch": 2956} {"train_loss": -11.915301322937012, "global_step": 496648, "epoch": 2956} {"train_loss": -11.057793617248535, "global_step": 496649, "epoch": 2956} {"train_loss": -11.44723892211914, "global_step": 496650, "epoch": 2956} {"train_loss": -10.66196060180664, "global_step": 496651, "epoch": 2956} {"train_loss": -11.784438133239746, "global_step": 496652, "epoch": 2956} {"train_loss": -11.050592422485352, "global_step": 496653, "epoch": 2956} {"train_loss": -11.63440990447998, "global_step": 496654, "epoch": 2956} {"train_loss": -11.157305717468262, "global_step": 496655, "epoch": 2956} {"train_loss": -11.701427459716797, "global_step": 496656, "epoch": 2956} {"train_loss": -11.287802696228027, "global_step": 496657, "epoch": 2956} {"train_loss": -12.256118774414062, "global_step": 496658, "epoch": 2956} {"train_loss": -11.400206565856934, "global_step": 496659, "epoch": 2956} {"train_loss": -12.051864624023438, "global_step": 496660, "epoch": 2956} {"train_loss": -11.819034576416016, "global_step": 496661, "epoch": 2956} {"train_loss": -11.55102825164795, "global_step": 496662, "epoch": 2956} {"train_loss": -11.739768028259277, "global_step": 496663, "epoch": 2956} {"train_loss": -11.608806610107422, "global_step": 496664, "epoch": 2956} {"train_loss": -11.900300025939941, "global_step": 496665, "epoch": 2956} {"train_loss": -11.999835968017578, "global_step": 496666, "epoch": 2956} {"train_loss": -10.949531555175781, "global_step": 496667, "epoch": 2956} {"train_loss": -12.448223114013672, "global_step": 496668, "epoch": 2956} {"train_loss": -11.6228609085083, "global_step": 496669, "epoch": 2956} {"train_loss": -11.275846481323242, "global_step": 496670, "epoch": 2956} {"train_loss": -11.695640563964844, "global_step": 496671, "epoch": 2956} {"train_loss": -11.210472106933594, "global_step": 496672, "epoch": 2956} {"train_loss": -11.516087532043457, "global_step": 496673, "epoch": 2956} {"train_loss": -11.93094253540039, "global_step": 496674, "epoch": 2956} {"train_loss": -11.881622314453125, "global_step": 496675, "epoch": 2956} {"train_loss": -12.124605178833008, "global_step": 496676, "epoch": 2956} {"train_loss": -12.185798645019531, "global_step": 496677, "epoch": 2956} {"train_loss": -11.736310958862305, "global_step": 496678, "epoch": 2956} {"train_loss": -12.355937957763672, "global_step": 496679, "epoch": 2956} {"train_loss": -12.096711158752441, "global_step": 496680, "epoch": 2956} {"train_loss": -12.181070327758789, "global_step": 496681, "epoch": 2956} {"train_loss": -12.269676208496094, "global_step": 496682, "epoch": 2956} {"train_loss": -12.296326637268066, "global_step": 496683, "epoch": 2956} {"train_loss": -12.137231826782227, "global_step": 496684, "epoch": 2956} {"train_loss": -12.272568702697754, "global_step": 496685, "epoch": 2956} {"train_loss": -12.026698112487793, "global_step": 496686, "epoch": 2956} {"train_loss": -11.701969146728516, "global_step": 496687, "epoch": 2956} {"train_loss": -12.298196792602539, "global_step": 496688, "epoch": 2956} {"train_loss": -11.965435028076172, "global_step": 496689, "epoch": 2956} {"train_loss": -12.358633995056152, "global_step": 496690, "epoch": 2956} {"train_loss": -12.437036514282227, "global_step": 496691, "epoch": 2956} {"train_loss": -12.274763107299805, "global_step": 496692, "epoch": 2956} {"train_loss": -12.594585418701172, "global_step": 496693, "epoch": 2956} {"train_loss": -11.926456451416016, "global_step": 496694, "epoch": 2956} {"train_loss": -12.264350891113281, "global_step": 496695, "epoch": 2956} {"train_loss": -12.469524383544922, "global_step": 496696, "epoch": 2956} {"train_loss": -12.171710014343262, "global_step": 496697, "epoch": 2956} {"train_loss": -12.139110565185547, "global_step": 496698, "epoch": 2956} {"train_loss": -12.495192527770996, "global_step": 496699, "epoch": 2956} {"train_loss": -11.963155746459961, "global_step": 496700, "epoch": 2956} {"train_loss": -12.769893646240234, "global_step": 496701, "epoch": 2956} {"train_loss": -11.96596908569336, "global_step": 496702, "epoch": 2956} {"train_loss": -12.324407577514648, "global_step": 496703, "epoch": 2956} {"train_loss": -12.672440528869629, "global_step": 496704, "epoch": 2956} {"train_loss": -12.291950225830078, "global_step": 496705, "epoch": 2956} {"train_loss": -12.5577974319458, "global_step": 496706, "epoch": 2956} {"train_loss": -12.542957305908203, "global_step": 496707, "epoch": 2956} {"train_loss": -12.476688385009766, "global_step": 496708, "epoch": 2956} {"train_loss": -12.374839782714844, "global_step": 496709, "epoch": 2956} {"train_loss": -12.73139762878418, "global_step": 496710, "epoch": 2956} {"train_loss": -12.41328239440918, "global_step": 496711, "epoch": 2956} {"train_loss": -12.78282356262207, "global_step": 496712, "epoch": 2956} {"train_loss": -12.754770278930664, "global_step": 496713, "epoch": 2956} {"train_loss": -12.613540649414062, "global_step": 496714, "epoch": 2956} {"train_loss": -12.864725112915039, "global_step": 496715, "epoch": 2956} {"train_loss": -12.623553276062012, "global_step": 496716, "epoch": 2956} {"train_loss": -12.779692649841309, "global_step": 496717, "epoch": 2956} {"train_loss": -12.50395679473877, "global_step": 496718, "epoch": 2956} {"train_loss": -12.705686569213867, "global_step": 496719, "epoch": 2956} {"train_loss": -12.859140396118164, "global_step": 496720, "epoch": 2956} {"train_loss": -12.810846328735352, "global_step": 496721, "epoch": 2956} {"train_loss": -12.841049194335938, "global_step": 496722, "epoch": 2956} {"train_loss": -12.866052627563477, "global_step": 496723, "epoch": 2956} {"train_loss": -12.780976295471191, "global_step": 496724, "epoch": 2956} {"train_loss": -12.774476051330566, "global_step": 496725, "epoch": 2956} {"train_loss": -12.689517974853516, "global_step": 496726, "epoch": 2956} {"train_loss": -12.92850112915039, "global_step": 496727, "epoch": 2956} {"train_loss": -12.77237319946289, "global_step": 496728, "epoch": 2956} {"train_loss": -12.875917434692383, "global_step": 496729, "epoch": 2956} {"train_loss": -12.73480224609375, "global_step": 496730, "epoch": 2956} {"train_loss": -12.852506637573242, "global_step": 496731, "epoch": 2956} {"train_loss": -12.80904769897461, "global_step": 496732, "epoch": 2956} {"train_loss": -12.84883975982666, "global_step": 496733, "epoch": 2956} {"train_loss": -12.859809875488281, "global_step": 496734, "epoch": 2956} {"train_loss": -12.799065589904785, "global_step": 496735, "epoch": 2956} {"train_loss": -12.918519973754883, "global_step": 496736, "epoch": 2956} {"train_loss": -12.821239471435547, "global_step": 496737, "epoch": 2956} {"train_loss": -12.801902770996094, "global_step": 496738, "epoch": 2956} {"train_loss": -12.789328575134277, "global_step": 496739, "epoch": 2956} {"train_loss": -12.865406036376953, "global_step": 496740, "epoch": 2956} {"train_loss": -12.914623260498047, "global_step": 496741, "epoch": 2956} {"train_loss": -12.612600326538086, "global_step": 496742, "epoch": 2956} {"train_loss": -12.896775245666504, "global_step": 496743, "epoch": 2956} {"train_loss": -12.813880920410156, "global_step": 496744, "epoch": 2956} {"train_loss": -12.771808624267578, "global_step": 496745, "epoch": 2956} {"train_loss": -12.835509300231934, "global_step": 496746, "epoch": 2956} {"train_loss": -12.73555850982666, "global_step": 496747, "epoch": 2956} {"train_loss": -12.941535949707031, "global_step": 496748, "epoch": 2956} {"train_loss": -12.856578826904297, "global_step": 496749, "epoch": 2956} {"train_loss": -12.980411529541016, "global_step": 496750, "epoch": 2956} {"train_loss": -12.737823486328125, "global_step": 496751, "epoch": 2956} {"train_loss": -12.06840705871582, "global_step": 496752, "epoch": 2956} {"train_loss": -12.289352416992188, "global_step": 496753, "epoch": 2956} {"train_loss": -12.406173706054688, "global_step": 496754, "epoch": 2956} {"train_loss": -12.664529800415039, "global_step": 496755, "epoch": 2956} {"train_loss": -12.400652885437012, "global_step": 496756, "epoch": 2956} {"train_loss": -12.373579025268555, "global_step": 496757, "epoch": 2956} {"train_loss": -12.566518783569336, "global_step": 496758, "epoch": 2956} {"train_loss": -12.104127883911133, "global_step": 496759, "epoch": 2956} {"train_loss": -11.916661262512207, "global_step": 496760, "epoch": 2956} {"train_loss": -11.678522109985352, "global_step": 496761, "epoch": 2956} {"train_loss": -11.751745223999023, "global_step": 496762, "epoch": 2956} {"train_loss": -11.267009735107422, "global_step": 496763, "epoch": 2956} {"train_loss": -11.145448684692383, "global_step": 496764, "epoch": 2956} {"train_loss": -11.940624237060547, "global_step": 496765, "epoch": 2956} {"train_loss": -12.031196594238281, "global_step": 496766, "epoch": 2956} {"train_loss": -12.058284759521484, "global_step": 496767, "epoch": 2956} {"train_loss": -12.326701164245605, "global_step": 496768, "epoch": 2956} {"train_loss": -12.815908432006836, "global_step": 496769, "epoch": 2956} {"train_loss": -12.463605880737305, "global_step": 496770, "epoch": 2956} {"train_loss": -12.699775695800781, "global_step": 496771, "epoch": 2956} {"train_loss": -12.43037223815918, "global_step": 496772, "epoch": 2956} {"train_loss": -12.897506713867188, "global_step": 496773, "epoch": 2956} {"train_loss": -12.387990951538086, "global_step": 496774, "epoch": 2956} {"train_loss": -12.020869067737035, "global_step": 496775, "epoch": 2956, "val_loss": 319961.0625} {"train_loss": -12.607030868530273, "global_step": 496776, "epoch": 2957} {"train_loss": -12.758914947509766, "global_step": 496777, "epoch": 2957} {"train_loss": -12.69567584991455, "global_step": 496778, "epoch": 2957} {"train_loss": -12.802451133728027, "global_step": 496779, "epoch": 2957} {"train_loss": -12.932302474975586, "global_step": 496780, "epoch": 2957} {"train_loss": -12.837533950805664, "global_step": 496781, "epoch": 2957} {"train_loss": -12.70031452178955, "global_step": 496782, "epoch": 2957} {"train_loss": -12.6322603225708, "global_step": 496783, "epoch": 2957} {"train_loss": -12.810040473937988, "global_step": 496784, "epoch": 2957} {"train_loss": -12.552191734313965, "global_step": 496785, "epoch": 2957} {"train_loss": -12.764723777770996, "global_step": 496786, "epoch": 2957} {"train_loss": -12.699236869812012, "global_step": 496787, "epoch": 2957} {"train_loss": -13.051803588867188, "global_step": 496788, "epoch": 2957} {"train_loss": -12.329666137695312, "global_step": 496789, "epoch": 2957} {"train_loss": -12.3760347366333, "global_step": 496790, "epoch": 2957} {"train_loss": -12.629080772399902, "global_step": 496791, "epoch": 2957} {"train_loss": -12.823895454406738, "global_step": 496792, "epoch": 2957} {"train_loss": -12.372495651245117, "global_step": 496793, "epoch": 2957} {"train_loss": -11.958415985107422, "global_step": 496794, "epoch": 2957} {"train_loss": -12.690778732299805, "global_step": 496795, "epoch": 2957} {"train_loss": -12.436738967895508, "global_step": 496796, "epoch": 2957} {"train_loss": -11.70681381225586, "global_step": 496797, "epoch": 2957} {"train_loss": -11.806631088256836, "global_step": 496798, "epoch": 2957} {"train_loss": -11.40426254272461, "global_step": 496799, "epoch": 2957} {"train_loss": -12.511384963989258, "global_step": 496800, "epoch": 2957} {"train_loss": -11.80844497680664, "global_step": 496801, "epoch": 2957} {"train_loss": -11.85496711730957, "global_step": 496802, "epoch": 2957} {"train_loss": -12.188213348388672, "global_step": 496803, "epoch": 2957} {"train_loss": -12.188399314880371, "global_step": 496804, "epoch": 2957} {"train_loss": -11.747527122497559, "global_step": 496805, "epoch": 2957} {"train_loss": -11.817985534667969, "global_step": 496806, "epoch": 2957} {"train_loss": -12.444341659545898, "global_step": 496807, "epoch": 2957} {"train_loss": -11.615316390991211, "global_step": 496808, "epoch": 2957} {"train_loss": -11.736005783081055, "global_step": 496809, "epoch": 2957} {"train_loss": -11.982036590576172, "global_step": 496810, "epoch": 2957} {"train_loss": -10.472978591918945, "global_step": 496811, "epoch": 2957} {"train_loss": -11.19137191772461, "global_step": 496812, "epoch": 2957} {"train_loss": -11.193258285522461, "global_step": 496813, "epoch": 2957} {"train_loss": -11.075647354125977, "global_step": 496814, "epoch": 2957} {"train_loss": -11.691146850585938, "global_step": 496815, "epoch": 2957} {"train_loss": -11.334087371826172, "global_step": 496816, "epoch": 2957} {"train_loss": -11.38126277923584, "global_step": 496817, "epoch": 2957} {"train_loss": -11.648545265197754, "global_step": 496818, "epoch": 2957} {"train_loss": -11.302061080932617, "global_step": 496819, "epoch": 2957} {"train_loss": -11.785745620727539, "global_step": 496820, "epoch": 2957} {"train_loss": -11.698005676269531, "global_step": 496821, "epoch": 2957} {"train_loss": -11.979402542114258, "global_step": 496822, "epoch": 2957} {"train_loss": -11.573525428771973, "global_step": 496823, "epoch": 2957} {"train_loss": -12.359346389770508, "global_step": 496824, "epoch": 2957} {"train_loss": -11.845173835754395, "global_step": 496825, "epoch": 2957} {"train_loss": -11.886205673217773, "global_step": 496826, "epoch": 2957} {"train_loss": -12.270891189575195, "global_step": 496827, "epoch": 2957} {"train_loss": -11.966531753540039, "global_step": 496828, "epoch": 2957} {"train_loss": -11.958305358886719, "global_step": 496829, "epoch": 2957} {"train_loss": -12.320337295532227, "global_step": 496830, "epoch": 2957} {"train_loss": -11.608537673950195, "global_step": 496831, "epoch": 2957} {"train_loss": -12.38074779510498, "global_step": 496832, "epoch": 2957} {"train_loss": -12.166120529174805, "global_step": 496833, "epoch": 2957} {"train_loss": -12.05319595336914, "global_step": 496834, "epoch": 2957} {"train_loss": -12.291404724121094, "global_step": 496835, "epoch": 2957} {"train_loss": -11.874860763549805, "global_step": 496836, "epoch": 2957} {"train_loss": -12.920805931091309, "global_step": 496837, "epoch": 2957} {"train_loss": -11.703551292419434, "global_step": 496838, "epoch": 2957} {"train_loss": -12.278468132019043, "global_step": 496839, "epoch": 2957} {"train_loss": -12.276043891906738, "global_step": 496840, "epoch": 2957} {"train_loss": -11.825448989868164, "global_step": 496841, "epoch": 2957} {"train_loss": -12.794832229614258, "global_step": 496842, "epoch": 2957} {"train_loss": -11.993989944458008, "global_step": 496843, "epoch": 2957} {"train_loss": -12.46473503112793, "global_step": 496844, "epoch": 2957} {"train_loss": -12.521889686584473, "global_step": 496845, "epoch": 2957} {"train_loss": -12.44669246673584, "global_step": 496846, "epoch": 2957} {"train_loss": -12.295141220092773, "global_step": 496847, "epoch": 2957} {"train_loss": -12.002626419067383, "global_step": 496848, "epoch": 2957} {"train_loss": -12.836031913757324, "global_step": 496849, "epoch": 2957} {"train_loss": -12.178308486938477, "global_step": 496850, "epoch": 2957} {"train_loss": -12.47822380065918, "global_step": 496851, "epoch": 2957} {"train_loss": -12.394631385803223, "global_step": 496852, "epoch": 2957} {"train_loss": -11.347620010375977, "global_step": 496853, "epoch": 2957} {"train_loss": -12.413911819458008, "global_step": 496854, "epoch": 2957} {"train_loss": -11.537633895874023, "global_step": 496855, "epoch": 2957} {"train_loss": -11.827281951904297, "global_step": 496856, "epoch": 2957} {"train_loss": -11.57152271270752, "global_step": 496857, "epoch": 2957} {"train_loss": -11.07959270477295, "global_step": 496858, "epoch": 2957} {"train_loss": -10.595352172851562, "global_step": 496859, "epoch": 2957} {"train_loss": -11.935072898864746, "global_step": 496860, "epoch": 2957} {"train_loss": -11.29088020324707, "global_step": 496861, "epoch": 2957} {"train_loss": -11.079999923706055, "global_step": 496862, "epoch": 2957} {"train_loss": -11.386839866638184, "global_step": 496863, "epoch": 2957} {"train_loss": -11.108384132385254, "global_step": 496864, "epoch": 2957} {"train_loss": -11.13601303100586, "global_step": 496865, "epoch": 2957} {"train_loss": -11.907561302185059, "global_step": 496866, "epoch": 2957} {"train_loss": -11.362502098083496, "global_step": 496867, "epoch": 2957} {"train_loss": -11.309915542602539, "global_step": 496868, "epoch": 2957} {"train_loss": -11.837255477905273, "global_step": 496869, "epoch": 2957} {"train_loss": -11.120229721069336, "global_step": 496870, "epoch": 2957} {"train_loss": -11.451942443847656, "global_step": 496871, "epoch": 2957} {"train_loss": -10.974149703979492, "global_step": 496872, "epoch": 2957} {"train_loss": -11.958356857299805, "global_step": 496873, "epoch": 2957} {"train_loss": -11.03561019897461, "global_step": 496874, "epoch": 2957} {"train_loss": -12.196395874023438, "global_step": 496875, "epoch": 2957} {"train_loss": -11.343830108642578, "global_step": 496876, "epoch": 2957} {"train_loss": -11.75522518157959, "global_step": 496877, "epoch": 2957} {"train_loss": -10.838857650756836, "global_step": 496878, "epoch": 2957} {"train_loss": -11.6314058303833, "global_step": 496879, "epoch": 2957} {"train_loss": -10.949109077453613, "global_step": 496880, "epoch": 2957} {"train_loss": -11.337005615234375, "global_step": 496881, "epoch": 2957} {"train_loss": -11.001713752746582, "global_step": 496882, "epoch": 2957} {"train_loss": -12.129520416259766, "global_step": 496883, "epoch": 2957} {"train_loss": -10.68612289428711, "global_step": 496884, "epoch": 2957} {"train_loss": -12.045882225036621, "global_step": 496885, "epoch": 2957} {"train_loss": -11.143590927124023, "global_step": 496886, "epoch": 2957} {"train_loss": -11.970791816711426, "global_step": 496887, "epoch": 2957} {"train_loss": -11.57690715789795, "global_step": 496888, "epoch": 2957} {"train_loss": -11.96016788482666, "global_step": 496889, "epoch": 2957} {"train_loss": -12.072566986083984, "global_step": 496890, "epoch": 2957} {"train_loss": -11.900056838989258, "global_step": 496891, "epoch": 2957} {"train_loss": -11.711673736572266, "global_step": 496892, "epoch": 2957} {"train_loss": -12.11858081817627, "global_step": 496893, "epoch": 2957} {"train_loss": -12.332587242126465, "global_step": 496894, "epoch": 2957} {"train_loss": -12.401450157165527, "global_step": 496895, "epoch": 2957} {"train_loss": -12.49338150024414, "global_step": 496896, "epoch": 2957} {"train_loss": -12.543219566345215, "global_step": 496897, "epoch": 2957} {"train_loss": -12.481060028076172, "global_step": 496898, "epoch": 2957} {"train_loss": -12.165070533752441, "global_step": 496899, "epoch": 2957} {"train_loss": -12.370712280273438, "global_step": 496900, "epoch": 2957} {"train_loss": -12.352869987487793, "global_step": 496901, "epoch": 2957} {"train_loss": -12.233526229858398, "global_step": 496902, "epoch": 2957} {"train_loss": -12.190589904785156, "global_step": 496903, "epoch": 2957} {"train_loss": -12.572580337524414, "global_step": 496904, "epoch": 2957} {"train_loss": -12.671751976013184, "global_step": 496905, "epoch": 2957} {"train_loss": -12.786311149597168, "global_step": 496906, "epoch": 2957} {"train_loss": -12.498618125915527, "global_step": 496907, "epoch": 2957} {"train_loss": -12.427717208862305, "global_step": 496908, "epoch": 2957} {"train_loss": -12.588741302490234, "global_step": 496909, "epoch": 2957} {"train_loss": -12.622719764709473, "global_step": 496910, "epoch": 2957} {"train_loss": -12.841999053955078, "global_step": 496911, "epoch": 2957} {"train_loss": -12.543699264526367, "global_step": 496912, "epoch": 2957} {"train_loss": -12.666918754577637, "global_step": 496913, "epoch": 2957} {"train_loss": -12.386846542358398, "global_step": 496914, "epoch": 2957} {"train_loss": -12.731389999389648, "global_step": 496915, "epoch": 2957} {"train_loss": -12.684907913208008, "global_step": 496916, "epoch": 2957} {"train_loss": -12.454870223999023, "global_step": 496917, "epoch": 2957} {"train_loss": -12.674007415771484, "global_step": 496918, "epoch": 2957} {"train_loss": -12.528337478637695, "global_step": 496919, "epoch": 2957} {"train_loss": -12.779012680053711, "global_step": 496920, "epoch": 2957} {"train_loss": -12.382284164428711, "global_step": 496921, "epoch": 2957} {"train_loss": -12.626476287841797, "global_step": 496922, "epoch": 2957} {"train_loss": -12.520248413085938, "global_step": 496923, "epoch": 2957} {"train_loss": -12.424327850341797, "global_step": 496924, "epoch": 2957} {"train_loss": -12.635536193847656, "global_step": 496925, "epoch": 2957} {"train_loss": -12.31045150756836, "global_step": 496926, "epoch": 2957} {"train_loss": -12.738302230834961, "global_step": 496927, "epoch": 2957} {"train_loss": -12.458447456359863, "global_step": 496928, "epoch": 2957} {"train_loss": -12.778499603271484, "global_step": 496929, "epoch": 2957} {"train_loss": -12.456656455993652, "global_step": 496930, "epoch": 2957} {"train_loss": -12.571342468261719, "global_step": 496931, "epoch": 2957} {"train_loss": -12.448741912841797, "global_step": 496932, "epoch": 2957} {"train_loss": -12.650880813598633, "global_step": 496933, "epoch": 2957} {"train_loss": -12.38924789428711, "global_step": 496934, "epoch": 2957} {"train_loss": -12.581769943237305, "global_step": 496935, "epoch": 2957} {"train_loss": -12.265647888183594, "global_step": 496936, "epoch": 2957} {"train_loss": -12.745586395263672, "global_step": 496937, "epoch": 2957} {"train_loss": -12.4227294921875, "global_step": 496938, "epoch": 2957} {"train_loss": -12.744441986083984, "global_step": 496939, "epoch": 2957} {"train_loss": -12.65062427520752, "global_step": 496940, "epoch": 2957} {"train_loss": -12.46883773803711, "global_step": 496941, "epoch": 2957} {"train_loss": -12.51904296875, "global_step": 496942, "epoch": 2957} {"train_loss": -12.101189670108614, "global_step": 496943, "epoch": 2957, "val_loss": 319935.3125} {"train_loss": -12.841097831726074, "global_step": 496944, "epoch": 2958} {"train_loss": -12.037994384765625, "global_step": 496945, "epoch": 2958} {"train_loss": -12.768270492553711, "global_step": 496946, "epoch": 2958} {"train_loss": -12.565696716308594, "global_step": 496947, "epoch": 2958} {"train_loss": -12.601310729980469, "global_step": 496948, "epoch": 2958} {"train_loss": -12.494186401367188, "global_step": 496949, "epoch": 2958} {"train_loss": -12.52722454071045, "global_step": 496950, "epoch": 2958} {"train_loss": -12.751020431518555, "global_step": 496951, "epoch": 2958} {"train_loss": -12.162744522094727, "global_step": 496952, "epoch": 2958} {"train_loss": -12.70658016204834, "global_step": 496953, "epoch": 2958} {"train_loss": -12.61528491973877, "global_step": 496954, "epoch": 2958} {"train_loss": -12.783454895019531, "global_step": 496955, "epoch": 2958} {"train_loss": -12.449689865112305, "global_step": 496956, "epoch": 2958} {"train_loss": -12.782882690429688, "global_step": 496957, "epoch": 2958} {"train_loss": -12.781726837158203, "global_step": 496958, "epoch": 2958} {"train_loss": -12.752466201782227, "global_step": 496959, "epoch": 2958} {"train_loss": -12.571598052978516, "global_step": 496960, "epoch": 2958} {"train_loss": -12.477385520935059, "global_step": 496961, "epoch": 2958} {"train_loss": -12.849894523620605, "global_step": 496962, "epoch": 2958} {"train_loss": -12.772093772888184, "global_step": 496963, "epoch": 2958} {"train_loss": -12.557439804077148, "global_step": 496964, "epoch": 2958} {"train_loss": -12.897171020507812, "global_step": 496965, "epoch": 2958} {"train_loss": -12.632993698120117, "global_step": 496966, "epoch": 2958} {"train_loss": -12.982575416564941, "global_step": 496967, "epoch": 2958} {"train_loss": -12.840469360351562, "global_step": 496968, "epoch": 2958} {"train_loss": -12.882186889648438, "global_step": 496969, "epoch": 2958} {"train_loss": -13.0348482131958, "global_step": 496970, "epoch": 2958} {"train_loss": -12.91483211517334, "global_step": 496971, "epoch": 2958} {"train_loss": -12.616275787353516, "global_step": 496972, "epoch": 2958} {"train_loss": -12.893479347229004, "global_step": 496973, "epoch": 2958} {"train_loss": -12.797391891479492, "global_step": 496974, "epoch": 2958} {"train_loss": -13.039436340332031, "global_step": 496975, "epoch": 2958} {"train_loss": -12.781242370605469, "global_step": 496976, "epoch": 2958} {"train_loss": -12.820432662963867, "global_step": 496977, "epoch": 2958} {"train_loss": -12.868171691894531, "global_step": 496978, "epoch": 2958} {"train_loss": -12.804473876953125, "global_step": 496979, "epoch": 2958} {"train_loss": -12.902383804321289, "global_step": 496980, "epoch": 2958} {"train_loss": -12.914438247680664, "global_step": 496981, "epoch": 2958} {"train_loss": -12.966767311096191, "global_step": 496982, "epoch": 2958} {"train_loss": -12.930824279785156, "global_step": 496983, "epoch": 2958} {"train_loss": -12.829487800598145, "global_step": 496984, "epoch": 2958} {"train_loss": -12.767463684082031, "global_step": 496985, "epoch": 2958} {"train_loss": -13.0897216796875, "global_step": 496986, "epoch": 2958} {"train_loss": -12.710205078125, "global_step": 496987, "epoch": 2958} {"train_loss": -12.412195205688477, "global_step": 496988, "epoch": 2958} {"train_loss": -12.886630058288574, "global_step": 496989, "epoch": 2958} {"train_loss": -12.750486373901367, "global_step": 496990, "epoch": 2958} {"train_loss": -12.457134246826172, "global_step": 496991, "epoch": 2958} {"train_loss": -12.907512664794922, "global_step": 496992, "epoch": 2958} {"train_loss": -12.781686782836914, "global_step": 496993, "epoch": 2958} {"train_loss": -12.631965637207031, "global_step": 496994, "epoch": 2958} {"train_loss": -12.71583366394043, "global_step": 496995, "epoch": 2958} {"train_loss": -12.847354888916016, "global_step": 496996, "epoch": 2958} {"train_loss": -13.088689804077148, "global_step": 496997, "epoch": 2958} {"train_loss": -13.006380081176758, "global_step": 496998, "epoch": 2958} {"train_loss": -12.909322738647461, "global_step": 496999, "epoch": 2958} {"train_loss": -13.181228637695312, "global_step": 497000, "epoch": 2958} {"train_loss": -12.935135841369629, "global_step": 497001, "epoch": 2958} {"train_loss": -12.761728286743164, "global_step": 497002, "epoch": 2958} {"train_loss": -13.041007041931152, "global_step": 497003, "epoch": 2958} {"train_loss": -12.913917541503906, "global_step": 497004, "epoch": 2958} {"train_loss": -12.762611389160156, "global_step": 497005, "epoch": 2958} {"train_loss": -12.691376686096191, "global_step": 497006, "epoch": 2958} {"train_loss": -12.880443572998047, "global_step": 497007, "epoch": 2958} {"train_loss": -12.977594375610352, "global_step": 497008, "epoch": 2958} {"train_loss": -12.67123794555664, "global_step": 497009, "epoch": 2958} {"train_loss": -12.956209182739258, "global_step": 497010, "epoch": 2958} {"train_loss": -13.015625, "global_step": 497011, "epoch": 2958} {"train_loss": -12.909767150878906, "global_step": 497012, "epoch": 2958} {"train_loss": -13.060786247253418, "global_step": 497013, "epoch": 2958} {"train_loss": -12.867376327514648, "global_step": 497014, "epoch": 2958} {"train_loss": -12.844107627868652, "global_step": 497015, "epoch": 2958} {"train_loss": -12.729246139526367, "global_step": 497016, "epoch": 2958} {"train_loss": -11.683722496032715, "global_step": 497017, "epoch": 2958} {"train_loss": -10.456828117370605, "global_step": 497018, "epoch": 2958} {"train_loss": -10.697755813598633, "global_step": 497019, "epoch": 2958} {"train_loss": -12.601897239685059, "global_step": 497020, "epoch": 2958} {"train_loss": -9.945422172546387, "global_step": 497021, "epoch": 2958} {"train_loss": -12.133727073669434, "global_step": 497022, "epoch": 2958} {"train_loss": -10.342046737670898, "global_step": 497023, "epoch": 2958} {"train_loss": -10.466224670410156, "global_step": 497024, "epoch": 2958} {"train_loss": -11.744489669799805, "global_step": 497025, "epoch": 2958} {"train_loss": -11.018856048583984, "global_step": 497026, "epoch": 2958} {"train_loss": -11.61400032043457, "global_step": 497027, "epoch": 2958} {"train_loss": -11.371077537536621, "global_step": 497028, "epoch": 2958} {"train_loss": -11.912841796875, "global_step": 497029, "epoch": 2958} {"train_loss": -11.27523422241211, "global_step": 497030, "epoch": 2958} {"train_loss": -11.922466278076172, "global_step": 497031, "epoch": 2958} {"train_loss": -11.306512832641602, "global_step": 497032, "epoch": 2958} {"train_loss": -10.501056671142578, "global_step": 497033, "epoch": 2958} {"train_loss": -10.801362037658691, "global_step": 497034, "epoch": 2958} {"train_loss": -11.137807846069336, "global_step": 497035, "epoch": 2958} {"train_loss": -11.648311614990234, "global_step": 497036, "epoch": 2958} {"train_loss": -11.420576095581055, "global_step": 497037, "epoch": 2958} {"train_loss": -12.077494621276855, "global_step": 497038, "epoch": 2958} {"train_loss": -11.654300689697266, "global_step": 497039, "epoch": 2958} {"train_loss": -11.4408540725708, "global_step": 497040, "epoch": 2958} {"train_loss": -11.132244110107422, "global_step": 497041, "epoch": 2958} {"train_loss": -11.716704368591309, "global_step": 497042, "epoch": 2958} {"train_loss": -11.6022367477417, "global_step": 497043, "epoch": 2958} {"train_loss": -12.030008316040039, "global_step": 497044, "epoch": 2958} {"train_loss": -11.702363967895508, "global_step": 497045, "epoch": 2958} {"train_loss": -11.045784950256348, "global_step": 497046, "epoch": 2958} {"train_loss": -12.048171997070312, "global_step": 497047, "epoch": 2958} {"train_loss": -11.296257019042969, "global_step": 497048, "epoch": 2958} {"train_loss": -11.000194549560547, "global_step": 497049, "epoch": 2958} {"train_loss": -12.072391510009766, "global_step": 497050, "epoch": 2958} {"train_loss": -10.895060539245605, "global_step": 497051, "epoch": 2958} {"train_loss": -11.6146240234375, "global_step": 497052, "epoch": 2958} {"train_loss": -11.163793563842773, "global_step": 497053, "epoch": 2958} {"train_loss": -11.791696548461914, "global_step": 497054, "epoch": 2958} {"train_loss": -11.871074676513672, "global_step": 497055, "epoch": 2958} {"train_loss": -11.736617088317871, "global_step": 497056, "epoch": 2958} {"train_loss": -11.962030410766602, "global_step": 497057, "epoch": 2958} {"train_loss": -11.689945220947266, "global_step": 497058, "epoch": 2958} {"train_loss": -11.980533599853516, "global_step": 497059, "epoch": 2958} {"train_loss": -11.839357376098633, "global_step": 497060, "epoch": 2958} {"train_loss": -12.08572006225586, "global_step": 497061, "epoch": 2958} {"train_loss": -11.485682487487793, "global_step": 497062, "epoch": 2958} {"train_loss": -11.053529739379883, "global_step": 497063, "epoch": 2958} {"train_loss": -11.756200790405273, "global_step": 497064, "epoch": 2958} {"train_loss": -10.826545715332031, "global_step": 497065, "epoch": 2958} {"train_loss": -12.188833236694336, "global_step": 497066, "epoch": 2958} {"train_loss": -11.776346206665039, "global_step": 497067, "epoch": 2958} {"train_loss": -11.621191024780273, "global_step": 497068, "epoch": 2958} {"train_loss": -11.833795547485352, "global_step": 497069, "epoch": 2958} {"train_loss": -12.269769668579102, "global_step": 497070, "epoch": 2958} {"train_loss": -11.310585021972656, "global_step": 497071, "epoch": 2958} {"train_loss": -11.737556457519531, "global_step": 497072, "epoch": 2958} {"train_loss": -11.907245635986328, "global_step": 497073, "epoch": 2958} {"train_loss": -11.441993713378906, "global_step": 497074, "epoch": 2958} {"train_loss": -11.86530876159668, "global_step": 497075, "epoch": 2958} {"train_loss": -11.042410850524902, "global_step": 497076, "epoch": 2958} {"train_loss": -11.66323471069336, "global_step": 497077, "epoch": 2958} {"train_loss": -12.105998039245605, "global_step": 497078, "epoch": 2958} {"train_loss": -11.787477493286133, "global_step": 497079, "epoch": 2958} {"train_loss": -12.391865730285645, "global_step": 497080, "epoch": 2958} {"train_loss": -12.277851104736328, "global_step": 497081, "epoch": 2958} {"train_loss": -11.99283504486084, "global_step": 497082, "epoch": 2958} {"train_loss": -12.624685287475586, "global_step": 497083, "epoch": 2958} {"train_loss": -12.100618362426758, "global_step": 497084, "epoch": 2958} {"train_loss": -11.860860824584961, "global_step": 497085, "epoch": 2958} {"train_loss": -12.228910446166992, "global_step": 497086, "epoch": 2958} {"train_loss": -12.490917205810547, "global_step": 497087, "epoch": 2958} {"train_loss": -12.342925071716309, "global_step": 497088, "epoch": 2958} {"train_loss": -11.706501007080078, "global_step": 497089, "epoch": 2958} {"train_loss": -12.383015632629395, "global_step": 497090, "epoch": 2958} {"train_loss": -11.850862503051758, "global_step": 497091, "epoch": 2958} {"train_loss": -12.006490707397461, "global_step": 497092, "epoch": 2958} {"train_loss": -12.267112731933594, "global_step": 497093, "epoch": 2958} {"train_loss": -12.033794403076172, "global_step": 497094, "epoch": 2958} {"train_loss": -12.38585090637207, "global_step": 497095, "epoch": 2958} {"train_loss": -11.78837776184082, "global_step": 497096, "epoch": 2958} {"train_loss": -12.350799560546875, "global_step": 497097, "epoch": 2958} {"train_loss": -12.064931869506836, "global_step": 497098, "epoch": 2958} {"train_loss": -12.180274963378906, "global_step": 497099, "epoch": 2958} {"train_loss": -12.446857452392578, "global_step": 497100, "epoch": 2958} {"train_loss": -12.390724182128906, "global_step": 497101, "epoch": 2958} {"train_loss": -12.607213973999023, "global_step": 497102, "epoch": 2958} {"train_loss": -12.491922378540039, "global_step": 497103, "epoch": 2958} {"train_loss": -12.66051197052002, "global_step": 497104, "epoch": 2958} {"train_loss": -12.502347946166992, "global_step": 497105, "epoch": 2958} {"train_loss": -12.61668586730957, "global_step": 497106, "epoch": 2958} {"train_loss": -12.292806625366211, "global_step": 497107, "epoch": 2958} {"train_loss": -12.511577606201172, "global_step": 497108, "epoch": 2958} {"train_loss": -12.613628387451172, "global_step": 497109, "epoch": 2958} {"train_loss": -12.370141983032227, "global_step": 497110, "epoch": 2958} {"train_loss": -12.214822093645731, "global_step": 497111, "epoch": 2958, "val_loss": 322697.0625} {"train_loss": -12.426093101501465, "global_step": 497112, "epoch": 2959} {"train_loss": -12.648744583129883, "global_step": 497113, "epoch": 2959} {"train_loss": -12.43716049194336, "global_step": 497114, "epoch": 2959} {"train_loss": -12.707805633544922, "global_step": 497115, "epoch": 2959} {"train_loss": -11.999938011169434, "global_step": 497116, "epoch": 2959} {"train_loss": -12.417957305908203, "global_step": 497117, "epoch": 2959} {"train_loss": -12.404556274414062, "global_step": 497118, "epoch": 2959} {"train_loss": -12.408984184265137, "global_step": 497119, "epoch": 2959} {"train_loss": -12.52009391784668, "global_step": 497120, "epoch": 2959} {"train_loss": -12.524328231811523, "global_step": 497121, "epoch": 2959} {"train_loss": -12.287307739257812, "global_step": 497122, "epoch": 2959} {"train_loss": -12.689900398254395, "global_step": 497123, "epoch": 2959} {"train_loss": -12.18153190612793, "global_step": 497124, "epoch": 2959} {"train_loss": -12.53166675567627, "global_step": 497125, "epoch": 2959} {"train_loss": -12.382906913757324, "global_step": 497126, "epoch": 2959} {"train_loss": -12.54430103302002, "global_step": 497127, "epoch": 2959} {"train_loss": -12.755549430847168, "global_step": 497128, "epoch": 2959} {"train_loss": -12.70758056640625, "global_step": 497129, "epoch": 2959} {"train_loss": -12.845182418823242, "global_step": 497130, "epoch": 2959} {"train_loss": -12.42302131652832, "global_step": 497131, "epoch": 2959} {"train_loss": -12.744237899780273, "global_step": 497132, "epoch": 2959} {"train_loss": -12.522299766540527, "global_step": 497133, "epoch": 2959} {"train_loss": -12.968194961547852, "global_step": 497134, "epoch": 2959} {"train_loss": -12.512857437133789, "global_step": 497135, "epoch": 2959} {"train_loss": -12.674318313598633, "global_step": 497136, "epoch": 2959} {"train_loss": -12.481147766113281, "global_step": 497137, "epoch": 2959} {"train_loss": -12.941061019897461, "global_step": 497138, "epoch": 2959} {"train_loss": -12.623619079589844, "global_step": 497139, "epoch": 2959} {"train_loss": -12.863364219665527, "global_step": 497140, "epoch": 2959} {"train_loss": -12.804169654846191, "global_step": 497141, "epoch": 2959} {"train_loss": -12.839822769165039, "global_step": 497142, "epoch": 2959} {"train_loss": -12.529874801635742, "global_step": 497143, "epoch": 2959} {"train_loss": -12.87427043914795, "global_step": 497144, "epoch": 2959} {"train_loss": -12.621068954467773, "global_step": 497145, "epoch": 2959} {"train_loss": -12.8826904296875, "global_step": 497146, "epoch": 2959} {"train_loss": -12.690018653869629, "global_step": 497147, "epoch": 2959} {"train_loss": -12.924158096313477, "global_step": 497148, "epoch": 2959} {"train_loss": -12.749761581420898, "global_step": 497149, "epoch": 2959} {"train_loss": -13.041631698608398, "global_step": 497150, "epoch": 2959} {"train_loss": -12.643241882324219, "global_step": 497151, "epoch": 2959} {"train_loss": -12.89023208618164, "global_step": 497152, "epoch": 2959} {"train_loss": -12.692177772521973, "global_step": 497153, "epoch": 2959} {"train_loss": -12.696392059326172, "global_step": 497154, "epoch": 2959} {"train_loss": -12.573978424072266, "global_step": 497155, "epoch": 2959} {"train_loss": -12.478649139404297, "global_step": 497156, "epoch": 2959} {"train_loss": -11.948348045349121, "global_step": 497157, "epoch": 2959} {"train_loss": -12.400672912597656, "global_step": 497158, "epoch": 2959} {"train_loss": -12.177663803100586, "global_step": 497159, "epoch": 2959} {"train_loss": -11.951984405517578, "global_step": 497160, "epoch": 2959} {"train_loss": -12.71902084350586, "global_step": 497161, "epoch": 2959} {"train_loss": -10.632781028747559, "global_step": 497162, "epoch": 2959} {"train_loss": -12.704733848571777, "global_step": 497163, "epoch": 2959} {"train_loss": -11.264145851135254, "global_step": 497164, "epoch": 2959} {"train_loss": -11.599599838256836, "global_step": 497165, "epoch": 2959} {"train_loss": -12.456533432006836, "global_step": 497166, "epoch": 2959} {"train_loss": -10.953757286071777, "global_step": 497167, "epoch": 2959} {"train_loss": -12.626980781555176, "global_step": 497168, "epoch": 2959} {"train_loss": -10.970149993896484, "global_step": 497169, "epoch": 2959} {"train_loss": -12.069025039672852, "global_step": 497170, "epoch": 2959} {"train_loss": -12.035799026489258, "global_step": 497171, "epoch": 2959} {"train_loss": -11.664169311523438, "global_step": 497172, "epoch": 2959} {"train_loss": -12.442931175231934, "global_step": 497173, "epoch": 2959} {"train_loss": -11.359725952148438, "global_step": 497174, "epoch": 2959} {"train_loss": -11.92518424987793, "global_step": 497175, "epoch": 2959} {"train_loss": -11.149116516113281, "global_step": 497176, "epoch": 2959} {"train_loss": -11.26326847076416, "global_step": 497177, "epoch": 2959} {"train_loss": -10.43847370147705, "global_step": 497178, "epoch": 2959} {"train_loss": -10.69371223449707, "global_step": 497179, "epoch": 2959} {"train_loss": -10.333341598510742, "global_step": 497180, "epoch": 2959} {"train_loss": -11.750585556030273, "global_step": 497181, "epoch": 2959} {"train_loss": -11.509611129760742, "global_step": 497182, "epoch": 2959} {"train_loss": -12.047791481018066, "global_step": 497183, "epoch": 2959} {"train_loss": -12.325201034545898, "global_step": 497184, "epoch": 2959} {"train_loss": -11.001291275024414, "global_step": 497185, "epoch": 2959} {"train_loss": -11.910087585449219, "global_step": 497186, "epoch": 2959} {"train_loss": -11.311495780944824, "global_step": 497187, "epoch": 2959} {"train_loss": -12.17533016204834, "global_step": 497188, "epoch": 2959} {"train_loss": -11.760749816894531, "global_step": 497189, "epoch": 2959} {"train_loss": -11.801942825317383, "global_step": 497190, "epoch": 2959} {"train_loss": -12.119245529174805, "global_step": 497191, "epoch": 2959} {"train_loss": -11.674849510192871, "global_step": 497192, "epoch": 2959} {"train_loss": -12.299568176269531, "global_step": 497193, "epoch": 2959} {"train_loss": -12.099664688110352, "global_step": 497194, "epoch": 2959} {"train_loss": -12.085623741149902, "global_step": 497195, "epoch": 2959} {"train_loss": -12.35346794128418, "global_step": 497196, "epoch": 2959} {"train_loss": -12.008931159973145, "global_step": 497197, "epoch": 2959} {"train_loss": -12.486024856567383, "global_step": 497198, "epoch": 2959} {"train_loss": -12.456808090209961, "global_step": 497199, "epoch": 2959} {"train_loss": -12.392230987548828, "global_step": 497200, "epoch": 2959} {"train_loss": -12.631941795349121, "global_step": 497201, "epoch": 2959} {"train_loss": -12.193315505981445, "global_step": 497202, "epoch": 2959} {"train_loss": -12.058893203735352, "global_step": 497203, "epoch": 2959} {"train_loss": -12.138734817504883, "global_step": 497204, "epoch": 2959} {"train_loss": -11.992713928222656, "global_step": 497205, "epoch": 2959} {"train_loss": -12.364570617675781, "global_step": 497206, "epoch": 2959} {"train_loss": -12.462804794311523, "global_step": 497207, "epoch": 2959} {"train_loss": -12.086416244506836, "global_step": 497208, "epoch": 2959} {"train_loss": -12.109247207641602, "global_step": 497209, "epoch": 2959} {"train_loss": -12.442628860473633, "global_step": 497210, "epoch": 2959} {"train_loss": -12.409992218017578, "global_step": 497211, "epoch": 2959} {"train_loss": -11.921468734741211, "global_step": 497212, "epoch": 2959} {"train_loss": -12.739609718322754, "global_step": 497213, "epoch": 2959} {"train_loss": -12.39865493774414, "global_step": 497214, "epoch": 2959} {"train_loss": -12.273506164550781, "global_step": 497215, "epoch": 2959} {"train_loss": -12.624988555908203, "global_step": 497216, "epoch": 2959} {"train_loss": -12.190366744995117, "global_step": 497217, "epoch": 2959} {"train_loss": -12.580041885375977, "global_step": 497218, "epoch": 2959} {"train_loss": -12.44843864440918, "global_step": 497219, "epoch": 2959} {"train_loss": -12.177139282226562, "global_step": 497220, "epoch": 2959} {"train_loss": -12.101995468139648, "global_step": 497221, "epoch": 2959} {"train_loss": -12.384086608886719, "global_step": 497222, "epoch": 2959} {"train_loss": -12.258023262023926, "global_step": 497223, "epoch": 2959} {"train_loss": -12.64169692993164, "global_step": 497224, "epoch": 2959} {"train_loss": -12.066901206970215, "global_step": 497225, "epoch": 2959} {"train_loss": -12.625362396240234, "global_step": 497226, "epoch": 2959} {"train_loss": -12.536428451538086, "global_step": 497227, "epoch": 2959} {"train_loss": -12.259988784790039, "global_step": 497228, "epoch": 2959} {"train_loss": -12.35363483428955, "global_step": 497229, "epoch": 2959} {"train_loss": -12.279047012329102, "global_step": 497230, "epoch": 2959} {"train_loss": -12.944847106933594, "global_step": 497231, "epoch": 2959} {"train_loss": -11.806873321533203, "global_step": 497232, "epoch": 2959} {"train_loss": -12.157552719116211, "global_step": 497233, "epoch": 2959} {"train_loss": -12.595489501953125, "global_step": 497234, "epoch": 2959} {"train_loss": -12.011119842529297, "global_step": 497235, "epoch": 2959} {"train_loss": -11.90013599395752, "global_step": 497236, "epoch": 2959} {"train_loss": -12.387797355651855, "global_step": 497237, "epoch": 2959} {"train_loss": -12.207695007324219, "global_step": 497238, "epoch": 2959} {"train_loss": -12.106407165527344, "global_step": 497239, "epoch": 2959} {"train_loss": -12.750040054321289, "global_step": 497240, "epoch": 2959} {"train_loss": -12.423458099365234, "global_step": 497241, "epoch": 2959} {"train_loss": -12.903156280517578, "global_step": 497242, "epoch": 2959} {"train_loss": -12.522699356079102, "global_step": 497243, "epoch": 2959} {"train_loss": -12.674971580505371, "global_step": 497244, "epoch": 2959} {"train_loss": -12.098857879638672, "global_step": 497245, "epoch": 2959} {"train_loss": -12.777018547058105, "global_step": 497246, "epoch": 2959} {"train_loss": -12.568710327148438, "global_step": 497247, "epoch": 2959} {"train_loss": -12.545023918151855, "global_step": 497248, "epoch": 2959} {"train_loss": -12.242042541503906, "global_step": 497249, "epoch": 2959} {"train_loss": -12.791553497314453, "global_step": 497250, "epoch": 2959} {"train_loss": -12.721002578735352, "global_step": 497251, "epoch": 2959} {"train_loss": -12.625580787658691, "global_step": 497252, "epoch": 2959} {"train_loss": -12.558615684509277, "global_step": 497253, "epoch": 2959} {"train_loss": -12.68572998046875, "global_step": 497254, "epoch": 2959} {"train_loss": -12.395073890686035, "global_step": 497255, "epoch": 2959} {"train_loss": -12.494430541992188, "global_step": 497256, "epoch": 2959} {"train_loss": -12.777667999267578, "global_step": 497257, "epoch": 2959} {"train_loss": -12.588523864746094, "global_step": 497258, "epoch": 2959} {"train_loss": -12.566877365112305, "global_step": 497259, "epoch": 2959} {"train_loss": -12.698012351989746, "global_step": 497260, "epoch": 2959} {"train_loss": -12.505727767944336, "global_step": 497261, "epoch": 2959} {"train_loss": -12.669733047485352, "global_step": 497262, "epoch": 2959} {"train_loss": -12.5885009765625, "global_step": 497263, "epoch": 2959} {"train_loss": -12.501842498779297, "global_step": 497264, "epoch": 2959} {"train_loss": -12.419898986816406, "global_step": 497265, "epoch": 2959} {"train_loss": -12.813629150390625, "global_step": 497266, "epoch": 2959} {"train_loss": -12.631906509399414, "global_step": 497267, "epoch": 2959} {"train_loss": -12.690086364746094, "global_step": 497268, "epoch": 2959} {"train_loss": -12.588410377502441, "global_step": 497269, "epoch": 2959} {"train_loss": -12.62716293334961, "global_step": 497270, "epoch": 2959} {"train_loss": -12.982547760009766, "global_step": 497271, "epoch": 2959} {"train_loss": -12.446084976196289, "global_step": 497272, "epoch": 2959} {"train_loss": -12.753387451171875, "global_step": 497273, "epoch": 2959} {"train_loss": -12.759130477905273, "global_step": 497274, "epoch": 2959} {"train_loss": -12.384366989135742, "global_step": 497275, "epoch": 2959} {"train_loss": -12.833470344543457, "global_step": 497276, "epoch": 2959} {"train_loss": -12.426200866699219, "global_step": 497277, "epoch": 2959} {"train_loss": -12.97183895111084, "global_step": 497278, "epoch": 2959} {"train_loss": -12.332533989633832, "global_step": 497279, "epoch": 2959, "val_loss": 319389.03125} {"train_loss": -12.818641662597656, "global_step": 497280, "epoch": 2960} {"train_loss": -12.844966888427734, "global_step": 497281, "epoch": 2960} {"train_loss": -12.967730522155762, "global_step": 497282, "epoch": 2960} {"train_loss": -12.753164291381836, "global_step": 497283, "epoch": 2960} {"train_loss": -12.984126091003418, "global_step": 497284, "epoch": 2960} {"train_loss": -12.500771522521973, "global_step": 497285, "epoch": 2960} {"train_loss": -12.865543365478516, "global_step": 497286, "epoch": 2960} {"train_loss": -12.627140045166016, "global_step": 497287, "epoch": 2960} {"train_loss": -12.92032241821289, "global_step": 497288, "epoch": 2960} {"train_loss": -12.812341690063477, "global_step": 497289, "epoch": 2960} {"train_loss": -12.765340805053711, "global_step": 497290, "epoch": 2960} {"train_loss": -12.868597030639648, "global_step": 497291, "epoch": 2960} {"train_loss": -12.98696517944336, "global_step": 497292, "epoch": 2960} {"train_loss": -12.820083618164062, "global_step": 497293, "epoch": 2960} {"train_loss": -12.924365997314453, "global_step": 497294, "epoch": 2960} {"train_loss": -12.960953712463379, "global_step": 497295, "epoch": 2960} {"train_loss": -12.800212860107422, "global_step": 497296, "epoch": 2960} {"train_loss": -12.45164680480957, "global_step": 497297, "epoch": 2960} {"train_loss": -11.687853813171387, "global_step": 497298, "epoch": 2960} {"train_loss": -12.016214370727539, "global_step": 497299, "epoch": 2960} {"train_loss": -12.878408432006836, "global_step": 497300, "epoch": 2960} {"train_loss": -12.026515007019043, "global_step": 497301, "epoch": 2960} {"train_loss": -12.025446891784668, "global_step": 497302, "epoch": 2960} {"train_loss": -11.205090522766113, "global_step": 497303, "epoch": 2960} {"train_loss": -10.151155471801758, "global_step": 497304, "epoch": 2960} {"train_loss": -10.51889705657959, "global_step": 497305, "epoch": 2960} {"train_loss": -12.436439514160156, "global_step": 497306, "epoch": 2960} {"train_loss": -10.620025634765625, "global_step": 497307, "epoch": 2960} {"train_loss": -11.87072467803955, "global_step": 497308, "epoch": 2960} {"train_loss": -11.262931823730469, "global_step": 497309, "epoch": 2960} {"train_loss": -12.019052505493164, "global_step": 497310, "epoch": 2960} {"train_loss": -10.604901313781738, "global_step": 497311, "epoch": 2960} {"train_loss": -10.52672290802002, "global_step": 497312, "epoch": 2960} {"train_loss": -11.939640045166016, "global_step": 497313, "epoch": 2960} {"train_loss": -10.185386657714844, "global_step": 497314, "epoch": 2960} {"train_loss": -9.64459228515625, "global_step": 497315, "epoch": 2960} {"train_loss": -9.349395751953125, "global_step": 497316, "epoch": 2960} {"train_loss": -10.890609741210938, "global_step": 497317, "epoch": 2960} {"train_loss": -11.874253273010254, "global_step": 497318, "epoch": 2960} {"train_loss": -11.006945610046387, "global_step": 497319, "epoch": 2960} {"train_loss": -11.664705276489258, "global_step": 497320, "epoch": 2960} {"train_loss": -10.67216682434082, "global_step": 497321, "epoch": 2960} {"train_loss": -10.483329772949219, "global_step": 497322, "epoch": 2960} {"train_loss": -10.290946960449219, "global_step": 497323, "epoch": 2960} {"train_loss": -11.364328384399414, "global_step": 497324, "epoch": 2960} {"train_loss": -11.743335723876953, "global_step": 497325, "epoch": 2960} {"train_loss": -11.293603897094727, "global_step": 497326, "epoch": 2960} {"train_loss": -11.47626781463623, "global_step": 497327, "epoch": 2960} {"train_loss": -11.586265563964844, "global_step": 497328, "epoch": 2960} {"train_loss": -11.880504608154297, "global_step": 497329, "epoch": 2960} {"train_loss": -10.859617233276367, "global_step": 497330, "epoch": 2960} {"train_loss": -11.481409072875977, "global_step": 497331, "epoch": 2960} {"train_loss": -10.662349700927734, "global_step": 497332, "epoch": 2960} {"train_loss": -11.034685134887695, "global_step": 497333, "epoch": 2960} {"train_loss": -11.879680633544922, "global_step": 497334, "epoch": 2960} {"train_loss": -11.15817642211914, "global_step": 497335, "epoch": 2960} {"train_loss": -11.91818618774414, "global_step": 497336, "epoch": 2960} {"train_loss": -10.830514907836914, "global_step": 497337, "epoch": 2960} {"train_loss": -11.875589370727539, "global_step": 497338, "epoch": 2960} {"train_loss": -9.718246459960938, "global_step": 497339, "epoch": 2960} {"train_loss": -11.17916488647461, "global_step": 497340, "epoch": 2960} {"train_loss": -10.315210342407227, "global_step": 497341, "epoch": 2960} {"train_loss": -10.874458312988281, "global_step": 497342, "epoch": 2960} {"train_loss": -10.15045166015625, "global_step": 497343, "epoch": 2960} {"train_loss": -11.129091262817383, "global_step": 497344, "epoch": 2960} {"train_loss": -9.424068450927734, "global_step": 497345, "epoch": 2960} {"train_loss": -11.144113540649414, "global_step": 497346, "epoch": 2960} {"train_loss": -9.232336044311523, "global_step": 497347, "epoch": 2960} {"train_loss": -10.463323593139648, "global_step": 497348, "epoch": 2960} {"train_loss": -10.276848793029785, "global_step": 497349, "epoch": 2960} {"train_loss": -9.51889705657959, "global_step": 497350, "epoch": 2960} {"train_loss": -11.71615219116211, "global_step": 497351, "epoch": 2960} {"train_loss": -10.224507331848145, "global_step": 497352, "epoch": 2960} {"train_loss": -11.029949188232422, "global_step": 497353, "epoch": 2960} {"train_loss": -10.65740966796875, "global_step": 497354, "epoch": 2960} {"train_loss": -10.99205207824707, "global_step": 497355, "epoch": 2960} {"train_loss": -11.118758201599121, "global_step": 497356, "epoch": 2960} {"train_loss": -11.57925796508789, "global_step": 497357, "epoch": 2960} {"train_loss": -11.729122161865234, "global_step": 497358, "epoch": 2960} {"train_loss": -11.212495803833008, "global_step": 497359, "epoch": 2960} {"train_loss": -11.976380348205566, "global_step": 497360, "epoch": 2960} {"train_loss": -11.543733596801758, "global_step": 497361, "epoch": 2960} {"train_loss": -11.532758712768555, "global_step": 497362, "epoch": 2960} {"train_loss": -11.925971984863281, "global_step": 497363, "epoch": 2960} {"train_loss": -11.976070404052734, "global_step": 497364, "epoch": 2960} {"train_loss": -11.552902221679688, "global_step": 497365, "epoch": 2960} {"train_loss": -12.02486801147461, "global_step": 497366, "epoch": 2960} {"train_loss": -11.732536315917969, "global_step": 497367, "epoch": 2960} {"train_loss": -12.483443260192871, "global_step": 497368, "epoch": 2960} {"train_loss": -12.057657241821289, "global_step": 497369, "epoch": 2960} {"train_loss": -12.339242935180664, "global_step": 497370, "epoch": 2960} {"train_loss": -12.038568496704102, "global_step": 497371, "epoch": 2960} {"train_loss": -12.271421432495117, "global_step": 497372, "epoch": 2960} {"train_loss": -11.990386009216309, "global_step": 497373, "epoch": 2960} {"train_loss": -12.248828887939453, "global_step": 497374, "epoch": 2960} {"train_loss": -12.268354415893555, "global_step": 497375, "epoch": 2960} {"train_loss": -11.641654968261719, "global_step": 497376, "epoch": 2960} {"train_loss": -12.422497749328613, "global_step": 497377, "epoch": 2960} {"train_loss": -12.082168579101562, "global_step": 497378, "epoch": 2960} {"train_loss": -12.376503944396973, "global_step": 497379, "epoch": 2960} {"train_loss": -11.92814826965332, "global_step": 497380, "epoch": 2960} {"train_loss": -12.4691743850708, "global_step": 497381, "epoch": 2960} {"train_loss": -11.950581550598145, "global_step": 497382, "epoch": 2960} {"train_loss": -12.346755981445312, "global_step": 497383, "epoch": 2960} {"train_loss": -12.347801208496094, "global_step": 497384, "epoch": 2960} {"train_loss": -12.449270248413086, "global_step": 497385, "epoch": 2960} {"train_loss": -12.108293533325195, "global_step": 497386, "epoch": 2960} {"train_loss": -12.121822357177734, "global_step": 497387, "epoch": 2960} {"train_loss": -12.190605163574219, "global_step": 497388, "epoch": 2960} {"train_loss": -11.954486846923828, "global_step": 497389, "epoch": 2960} {"train_loss": -12.251466751098633, "global_step": 497390, "epoch": 2960} {"train_loss": -12.411577224731445, "global_step": 497391, "epoch": 2960} {"train_loss": -12.098282814025879, "global_step": 497392, "epoch": 2960} {"train_loss": -12.406919479370117, "global_step": 497393, "epoch": 2960} {"train_loss": -12.041036605834961, "global_step": 497394, "epoch": 2960} {"train_loss": -12.19856071472168, "global_step": 497395, "epoch": 2960} {"train_loss": -12.14382553100586, "global_step": 497396, "epoch": 2960} {"train_loss": -12.155760765075684, "global_step": 497397, "epoch": 2960} {"train_loss": -12.455389022827148, "global_step": 497398, "epoch": 2960} {"train_loss": -12.448899269104004, "global_step": 497399, "epoch": 2960} {"train_loss": -12.304054260253906, "global_step": 497400, "epoch": 2960} {"train_loss": -12.126699447631836, "global_step": 497401, "epoch": 2960} {"train_loss": -12.311912536621094, "global_step": 497402, "epoch": 2960} {"train_loss": -12.656381607055664, "global_step": 497403, "epoch": 2960} {"train_loss": -12.412934303283691, "global_step": 497404, "epoch": 2960} {"train_loss": -12.664668083190918, "global_step": 497405, "epoch": 2960} {"train_loss": -12.450393676757812, "global_step": 497406, "epoch": 2960} {"train_loss": -12.695856094360352, "global_step": 497407, "epoch": 2960} {"train_loss": -12.276388168334961, "global_step": 497408, "epoch": 2960} {"train_loss": -12.652164459228516, "global_step": 497409, "epoch": 2960} {"train_loss": -12.333585739135742, "global_step": 497410, "epoch": 2960} {"train_loss": -12.365097045898438, "global_step": 497411, "epoch": 2960} {"train_loss": -12.306571960449219, "global_step": 497412, "epoch": 2960} {"train_loss": -12.425337791442871, "global_step": 497413, "epoch": 2960} {"train_loss": -12.600393295288086, "global_step": 497414, "epoch": 2960} {"train_loss": -12.089406967163086, "global_step": 497415, "epoch": 2960} {"train_loss": -12.383840560913086, "global_step": 497416, "epoch": 2960} {"train_loss": -12.454794883728027, "global_step": 497417, "epoch": 2960} {"train_loss": -12.471883773803711, "global_step": 497418, "epoch": 2960} {"train_loss": -12.532770156860352, "global_step": 497419, "epoch": 2960} {"train_loss": -12.214988708496094, "global_step": 497420, "epoch": 2960} {"train_loss": -12.761302947998047, "global_step": 497421, "epoch": 2960} {"train_loss": -12.601797103881836, "global_step": 497422, "epoch": 2960} {"train_loss": -12.62157917022705, "global_step": 497423, "epoch": 2960} {"train_loss": -12.411368370056152, "global_step": 497424, "epoch": 2960} {"train_loss": -12.594258308410645, "global_step": 497425, "epoch": 2960} {"train_loss": -12.765853881835938, "global_step": 497426, "epoch": 2960} {"train_loss": -12.511062622070312, "global_step": 497427, "epoch": 2960} {"train_loss": -12.660054206848145, "global_step": 497428, "epoch": 2960} {"train_loss": -12.72341537475586, "global_step": 497429, "epoch": 2960} {"train_loss": -12.585497856140137, "global_step": 497430, "epoch": 2960} {"train_loss": -12.587116241455078, "global_step": 497431, "epoch": 2960} {"train_loss": -12.3070068359375, "global_step": 497432, "epoch": 2960} {"train_loss": -12.637550354003906, "global_step": 497433, "epoch": 2960} {"train_loss": -12.303777694702148, "global_step": 497434, "epoch": 2960} {"train_loss": -12.691414833068848, "global_step": 497435, "epoch": 2960} {"train_loss": -12.46505355834961, "global_step": 497436, "epoch": 2960} {"train_loss": -12.459992408752441, "global_step": 497437, "epoch": 2960} {"train_loss": -12.435806274414062, "global_step": 497438, "epoch": 2960} {"train_loss": -12.573502540588379, "global_step": 497439, "epoch": 2960} {"train_loss": -12.217367172241211, "global_step": 497440, "epoch": 2960} {"train_loss": -12.728103637695312, "global_step": 497441, "epoch": 2960} {"train_loss": -12.633465766906738, "global_step": 497442, "epoch": 2960} {"train_loss": -12.574495315551758, "global_step": 497443, "epoch": 2960} {"train_loss": -12.348812103271484, "global_step": 497444, "epoch": 2960} {"train_loss": -12.42440128326416, "global_step": 497445, "epoch": 2960} {"train_loss": -12.783034324645996, "global_step": 497446, "epoch": 2960} {"train_loss": -11.900842286291576, "global_step": 497447, "epoch": 2960, "val_loss": 321539.9375, "train_action_mse_error": 1.7174620628356934} {"train_loss": -12.420467376708984, "global_step": 497448, "epoch": 2961} {"train_loss": -12.495868682861328, "global_step": 497449, "epoch": 2961} {"train_loss": -12.44894027709961, "global_step": 497450, "epoch": 2961} {"train_loss": -12.68252944946289, "global_step": 497451, "epoch": 2961} {"train_loss": -12.374200820922852, "global_step": 497452, "epoch": 2961} {"train_loss": -12.376142501831055, "global_step": 497453, "epoch": 2961} {"train_loss": -12.378222465515137, "global_step": 497454, "epoch": 2961} {"train_loss": -12.538883209228516, "global_step": 497455, "epoch": 2961} {"train_loss": -12.352399826049805, "global_step": 497456, "epoch": 2961} {"train_loss": -12.653715133666992, "global_step": 497457, "epoch": 2961} {"train_loss": -12.369855880737305, "global_step": 497458, "epoch": 2961} {"train_loss": -12.644829750061035, "global_step": 497459, "epoch": 2961} {"train_loss": -12.548440933227539, "global_step": 497460, "epoch": 2961} {"train_loss": -12.728433609008789, "global_step": 497461, "epoch": 2961} {"train_loss": -12.908971786499023, "global_step": 497462, "epoch": 2961} {"train_loss": -12.843643188476562, "global_step": 497463, "epoch": 2961} {"train_loss": -12.719942092895508, "global_step": 497464, "epoch": 2961} {"train_loss": -12.931201934814453, "global_step": 497465, "epoch": 2961} {"train_loss": -12.922707557678223, "global_step": 497466, "epoch": 2961} {"train_loss": -12.832088470458984, "global_step": 497467, "epoch": 2961} {"train_loss": -12.654346466064453, "global_step": 497468, "epoch": 2961} {"train_loss": -12.888668060302734, "global_step": 497469, "epoch": 2961} {"train_loss": -13.040962219238281, "global_step": 497470, "epoch": 2961} {"train_loss": -12.6402006149292, "global_step": 497471, "epoch": 2961} {"train_loss": -12.797554016113281, "global_step": 497472, "epoch": 2961} {"train_loss": -12.889668464660645, "global_step": 497473, "epoch": 2961} {"train_loss": -13.123409271240234, "global_step": 497474, "epoch": 2961} {"train_loss": -12.966700553894043, "global_step": 497475, "epoch": 2961} {"train_loss": -12.942434310913086, "global_step": 497476, "epoch": 2961} {"train_loss": -12.927857398986816, "global_step": 497477, "epoch": 2961} {"train_loss": -12.822006225585938, "global_step": 497478, "epoch": 2961} {"train_loss": -13.027933120727539, "global_step": 497479, "epoch": 2961} {"train_loss": -12.842538833618164, "global_step": 497480, "epoch": 2961} {"train_loss": -13.207443237304688, "global_step": 497481, "epoch": 2961} {"train_loss": -12.963987350463867, "global_step": 497482, "epoch": 2961} {"train_loss": -12.967612266540527, "global_step": 497483, "epoch": 2961} {"train_loss": -12.66373062133789, "global_step": 497484, "epoch": 2961} {"train_loss": -12.832185745239258, "global_step": 497485, "epoch": 2961} {"train_loss": -12.953015327453613, "global_step": 497486, "epoch": 2961} {"train_loss": -12.609256744384766, "global_step": 497487, "epoch": 2961} {"train_loss": -11.925987243652344, "global_step": 497488, "epoch": 2961} {"train_loss": -12.687247276306152, "global_step": 497489, "epoch": 2961} {"train_loss": -12.82850170135498, "global_step": 497490, "epoch": 2961} {"train_loss": -12.216922760009766, "global_step": 497491, "epoch": 2961} {"train_loss": -11.735889434814453, "global_step": 497492, "epoch": 2961} {"train_loss": -12.82553482055664, "global_step": 497493, "epoch": 2961} {"train_loss": -12.408059120178223, "global_step": 497494, "epoch": 2961} {"train_loss": -12.347482681274414, "global_step": 497495, "epoch": 2961} {"train_loss": -11.447678565979004, "global_step": 497496, "epoch": 2961} {"train_loss": -11.783260345458984, "global_step": 497497, "epoch": 2961} {"train_loss": -12.36049747467041, "global_step": 497498, "epoch": 2961} {"train_loss": -9.90880012512207, "global_step": 497499, "epoch": 2961} {"train_loss": -12.02367877960205, "global_step": 497500, "epoch": 2961} {"train_loss": -11.681013107299805, "global_step": 497501, "epoch": 2961} {"train_loss": -11.09683895111084, "global_step": 497502, "epoch": 2961} {"train_loss": -10.099018096923828, "global_step": 497503, "epoch": 2961} {"train_loss": -10.448122024536133, "global_step": 497504, "epoch": 2961} {"train_loss": -10.546660423278809, "global_step": 497505, "epoch": 2961} {"train_loss": -11.438512802124023, "global_step": 497506, "epoch": 2961} {"train_loss": -10.909688949584961, "global_step": 497507, "epoch": 2961} {"train_loss": -10.229768753051758, "global_step": 497508, "epoch": 2961} {"train_loss": -10.330974578857422, "global_step": 497509, "epoch": 2961} {"train_loss": -10.636283874511719, "global_step": 497510, "epoch": 2961} {"train_loss": -9.776773452758789, "global_step": 497511, "epoch": 2961} {"train_loss": -10.424565315246582, "global_step": 497512, "epoch": 2961} {"train_loss": -11.465449333190918, "global_step": 497513, "epoch": 2961} {"train_loss": -9.152883529663086, "global_step": 497514, "epoch": 2961} {"train_loss": -11.476734161376953, "global_step": 497515, "epoch": 2961} {"train_loss": -10.777612686157227, "global_step": 497516, "epoch": 2961} {"train_loss": -10.803619384765625, "global_step": 497517, "epoch": 2961} {"train_loss": -11.495060920715332, "global_step": 497518, "epoch": 2961} {"train_loss": -9.754559516906738, "global_step": 497519, "epoch": 2961} {"train_loss": -11.017019271850586, "global_step": 497520, "epoch": 2961} {"train_loss": -11.100040435791016, "global_step": 497521, "epoch": 2961} {"train_loss": -10.723078727722168, "global_step": 497522, "epoch": 2961} {"train_loss": -11.174668312072754, "global_step": 497523, "epoch": 2961} {"train_loss": -11.999567031860352, "global_step": 497524, "epoch": 2961} {"train_loss": -10.819936752319336, "global_step": 497525, "epoch": 2961} {"train_loss": -11.683414459228516, "global_step": 497526, "epoch": 2961} {"train_loss": -11.713785171508789, "global_step": 497527, "epoch": 2961} {"train_loss": -11.407487869262695, "global_step": 497528, "epoch": 2961} {"train_loss": -12.124938011169434, "global_step": 497529, "epoch": 2961} {"train_loss": -11.896598815917969, "global_step": 497530, "epoch": 2961} {"train_loss": -11.86220932006836, "global_step": 497531, "epoch": 2961} {"train_loss": -11.532218933105469, "global_step": 497532, "epoch": 2961} {"train_loss": -11.962125778198242, "global_step": 497533, "epoch": 2961} {"train_loss": -12.108114242553711, "global_step": 497534, "epoch": 2961} {"train_loss": -12.395636558532715, "global_step": 497535, "epoch": 2961} {"train_loss": -12.305435180664062, "global_step": 497536, "epoch": 2961} {"train_loss": -12.118249893188477, "global_step": 497537, "epoch": 2961} {"train_loss": -12.221487998962402, "global_step": 497538, "epoch": 2961} {"train_loss": -12.59646224975586, "global_step": 497539, "epoch": 2961} {"train_loss": -11.996849060058594, "global_step": 497540, "epoch": 2961} {"train_loss": -12.253430366516113, "global_step": 497541, "epoch": 2961} {"train_loss": -12.244022369384766, "global_step": 497542, "epoch": 2961} {"train_loss": -12.438758850097656, "global_step": 497543, "epoch": 2961} {"train_loss": -12.245841026306152, "global_step": 497544, "epoch": 2961} {"train_loss": -12.652567863464355, "global_step": 497545, "epoch": 2961} {"train_loss": -12.29570198059082, "global_step": 497546, "epoch": 2961} {"train_loss": -12.492881774902344, "global_step": 497547, "epoch": 2961} {"train_loss": -12.472943305969238, "global_step": 497548, "epoch": 2961} {"train_loss": -12.460350036621094, "global_step": 497549, "epoch": 2961} {"train_loss": -12.433932304382324, "global_step": 497550, "epoch": 2961} {"train_loss": -12.514972686767578, "global_step": 497551, "epoch": 2961} {"train_loss": -12.68187427520752, "global_step": 497552, "epoch": 2961} {"train_loss": -12.458340644836426, "global_step": 497553, "epoch": 2961} {"train_loss": -12.533689498901367, "global_step": 497554, "epoch": 2961} {"train_loss": -12.670541763305664, "global_step": 497555, "epoch": 2961} {"train_loss": -12.674671173095703, "global_step": 497556, "epoch": 2961} {"train_loss": -12.737414360046387, "global_step": 497557, "epoch": 2961} {"train_loss": -12.555517196655273, "global_step": 497558, "epoch": 2961} {"train_loss": -12.583296775817871, "global_step": 497559, "epoch": 2961} {"train_loss": -12.734058380126953, "global_step": 497560, "epoch": 2961} {"train_loss": -12.565362930297852, "global_step": 497561, "epoch": 2961} {"train_loss": -12.682821273803711, "global_step": 497562, "epoch": 2961} {"train_loss": -12.63388442993164, "global_step": 497563, "epoch": 2961} {"train_loss": -12.679326057434082, "global_step": 497564, "epoch": 2961} {"train_loss": -12.968133926391602, "global_step": 497565, "epoch": 2961} {"train_loss": -12.709921836853027, "global_step": 497566, "epoch": 2961} {"train_loss": -12.90422534942627, "global_step": 497567, "epoch": 2961} {"train_loss": -12.556611061096191, "global_step": 497568, "epoch": 2961} {"train_loss": -12.935210227966309, "global_step": 497569, "epoch": 2961} {"train_loss": -12.709741592407227, "global_step": 497570, "epoch": 2961} {"train_loss": -12.709758758544922, "global_step": 497571, "epoch": 2961} {"train_loss": -12.778423309326172, "global_step": 497572, "epoch": 2961} {"train_loss": -12.835140228271484, "global_step": 497573, "epoch": 2961} {"train_loss": -12.550620079040527, "global_step": 497574, "epoch": 2961} {"train_loss": -12.874652862548828, "global_step": 497575, "epoch": 2961} {"train_loss": -12.652721405029297, "global_step": 497576, "epoch": 2961} {"train_loss": -12.82167911529541, "global_step": 497577, "epoch": 2961} {"train_loss": -12.693803787231445, "global_step": 497578, "epoch": 2961} {"train_loss": -12.75705337524414, "global_step": 497579, "epoch": 2961} {"train_loss": -12.675989151000977, "global_step": 497580, "epoch": 2961} {"train_loss": -12.914098739624023, "global_step": 497581, "epoch": 2961} {"train_loss": -12.91014289855957, "global_step": 497582, "epoch": 2961} {"train_loss": -12.86688232421875, "global_step": 497583, "epoch": 2961} {"train_loss": -12.91905689239502, "global_step": 497584, "epoch": 2961} {"train_loss": -12.882944107055664, "global_step": 497585, "epoch": 2961} {"train_loss": -12.906744003295898, "global_step": 497586, "epoch": 2961} {"train_loss": -12.698869705200195, "global_step": 497587, "epoch": 2961} {"train_loss": -12.970606803894043, "global_step": 497588, "epoch": 2961} {"train_loss": -12.642715454101562, "global_step": 497589, "epoch": 2961} {"train_loss": -12.91872787475586, "global_step": 497590, "epoch": 2961} {"train_loss": -12.806122779846191, "global_step": 497591, "epoch": 2961} {"train_loss": -12.83627700805664, "global_step": 497592, "epoch": 2961} {"train_loss": -12.770441055297852, "global_step": 497593, "epoch": 2961} {"train_loss": -12.520806312561035, "global_step": 497594, "epoch": 2961} {"train_loss": -12.205864906311035, "global_step": 497595, "epoch": 2961} {"train_loss": -12.783025741577148, "global_step": 497596, "epoch": 2961} {"train_loss": -12.248978614807129, "global_step": 497597, "epoch": 2961} {"train_loss": -12.177433013916016, "global_step": 497598, "epoch": 2961} {"train_loss": -12.495018005371094, "global_step": 497599, "epoch": 2961} {"train_loss": -12.346261024475098, "global_step": 497600, "epoch": 2961} {"train_loss": -12.513460159301758, "global_step": 497601, "epoch": 2961} {"train_loss": -12.644861221313477, "global_step": 497602, "epoch": 2961} {"train_loss": -12.503056526184082, "global_step": 497603, "epoch": 2961} {"train_loss": -12.766497611999512, "global_step": 497604, "epoch": 2961} {"train_loss": -12.414626121520996, "global_step": 497605, "epoch": 2961} {"train_loss": -13.002937316894531, "global_step": 497606, "epoch": 2961} {"train_loss": -12.501205444335938, "global_step": 497607, "epoch": 2961} {"train_loss": -12.709606170654297, "global_step": 497608, "epoch": 2961} {"train_loss": -12.599386215209961, "global_step": 497609, "epoch": 2961} {"train_loss": -12.773838996887207, "global_step": 497610, "epoch": 2961} {"train_loss": -12.802642822265625, "global_step": 497611, "epoch": 2961} {"train_loss": -12.5494966506958, "global_step": 497612, "epoch": 2961} {"train_loss": -12.136549949645996, "global_step": 497613, "epoch": 2961} {"train_loss": -12.476216316223145, "global_step": 497614, "epoch": 2961} {"train_loss": -12.280385227430434, "global_step": 497615, "epoch": 2961, "val_loss": 319243.75} {"train_loss": -12.33340072631836, "global_step": 497616, "epoch": 2962} {"train_loss": -12.66097640991211, "global_step": 497617, "epoch": 2962} {"train_loss": -12.449495315551758, "global_step": 497618, "epoch": 2962} {"train_loss": -12.686326026916504, "global_step": 497619, "epoch": 2962} {"train_loss": -12.7774019241333, "global_step": 497620, "epoch": 2962} {"train_loss": -12.431598663330078, "global_step": 497621, "epoch": 2962} {"train_loss": -12.45842170715332, "global_step": 497622, "epoch": 2962} {"train_loss": -12.839969635009766, "global_step": 497623, "epoch": 2962} {"train_loss": -12.130318641662598, "global_step": 497624, "epoch": 2962} {"train_loss": -12.051668167114258, "global_step": 497625, "epoch": 2962} {"train_loss": -12.904569625854492, "global_step": 497626, "epoch": 2962} {"train_loss": -11.90886116027832, "global_step": 497627, "epoch": 2962} {"train_loss": -12.558335304260254, "global_step": 497628, "epoch": 2962} {"train_loss": -12.418924331665039, "global_step": 497629, "epoch": 2962} {"train_loss": -12.133365631103516, "global_step": 497630, "epoch": 2962} {"train_loss": -12.208772659301758, "global_step": 497631, "epoch": 2962} {"train_loss": -11.922679901123047, "global_step": 497632, "epoch": 2962} {"train_loss": -12.320295333862305, "global_step": 497633, "epoch": 2962} {"train_loss": -12.170588493347168, "global_step": 497634, "epoch": 2962} {"train_loss": -10.502992630004883, "global_step": 497635, "epoch": 2962} {"train_loss": -11.514132499694824, "global_step": 497636, "epoch": 2962} {"train_loss": -11.475122451782227, "global_step": 497637, "epoch": 2962} {"train_loss": -11.951983451843262, "global_step": 497638, "epoch": 2962} {"train_loss": -11.628931045532227, "global_step": 497639, "epoch": 2962} {"train_loss": -11.541646003723145, "global_step": 497640, "epoch": 2962} {"train_loss": -11.093055725097656, "global_step": 497641, "epoch": 2962} {"train_loss": -12.177009582519531, "global_step": 497642, "epoch": 2962} {"train_loss": -11.03138542175293, "global_step": 497643, "epoch": 2962} {"train_loss": -10.679346084594727, "global_step": 497644, "epoch": 2962} {"train_loss": -11.688398361206055, "global_step": 497645, "epoch": 2962} {"train_loss": -11.133146286010742, "global_step": 497646, "epoch": 2962} {"train_loss": -11.092835426330566, "global_step": 497647, "epoch": 2962} {"train_loss": -12.299339294433594, "global_step": 497648, "epoch": 2962} {"train_loss": -10.780390739440918, "global_step": 497649, "epoch": 2962} {"train_loss": -11.928155899047852, "global_step": 497650, "epoch": 2962} {"train_loss": -10.74457836151123, "global_step": 497651, "epoch": 2962} {"train_loss": -11.0925874710083, "global_step": 497652, "epoch": 2962} {"train_loss": -11.36231517791748, "global_step": 497653, "epoch": 2962} {"train_loss": -9.928701400756836, "global_step": 497654, "epoch": 2962} {"train_loss": -10.067127227783203, "global_step": 497655, "epoch": 2962} {"train_loss": -10.516485214233398, "global_step": 497656, "epoch": 2962} {"train_loss": -10.423093795776367, "global_step": 497657, "epoch": 2962} {"train_loss": -11.33967399597168, "global_step": 497658, "epoch": 2962} {"train_loss": -11.138627052307129, "global_step": 497659, "epoch": 2962} {"train_loss": -11.728277206420898, "global_step": 497660, "epoch": 2962} {"train_loss": -11.970091819763184, "global_step": 497661, "epoch": 2962} {"train_loss": -12.036742210388184, "global_step": 497662, "epoch": 2962} {"train_loss": -11.677974700927734, "global_step": 497663, "epoch": 2962} {"train_loss": -11.894640922546387, "global_step": 497664, "epoch": 2962} {"train_loss": -11.893980026245117, "global_step": 497665, "epoch": 2962} {"train_loss": -12.03921890258789, "global_step": 497666, "epoch": 2962} {"train_loss": -11.798001289367676, "global_step": 497667, "epoch": 2962} {"train_loss": -12.247648239135742, "global_step": 497668, "epoch": 2962} {"train_loss": -12.403051376342773, "global_step": 497669, "epoch": 2962} {"train_loss": -12.356170654296875, "global_step": 497670, "epoch": 2962} {"train_loss": -12.250469207763672, "global_step": 497671, "epoch": 2962} {"train_loss": -12.223950386047363, "global_step": 497672, "epoch": 2962} {"train_loss": -12.287952423095703, "global_step": 497673, "epoch": 2962} {"train_loss": -12.46202278137207, "global_step": 497674, "epoch": 2962} {"train_loss": -12.5188627243042, "global_step": 497675, "epoch": 2962} {"train_loss": -11.989380836486816, "global_step": 497676, "epoch": 2962} {"train_loss": -12.508810043334961, "global_step": 497677, "epoch": 2962} {"train_loss": -12.104395866394043, "global_step": 497678, "epoch": 2962} {"train_loss": -12.725455284118652, "global_step": 497679, "epoch": 2962} {"train_loss": -12.42538833618164, "global_step": 497680, "epoch": 2962} {"train_loss": -12.404701232910156, "global_step": 497681, "epoch": 2962} {"train_loss": -12.45108413696289, "global_step": 497682, "epoch": 2962} {"train_loss": -12.604805946350098, "global_step": 497683, "epoch": 2962} {"train_loss": -12.441892623901367, "global_step": 497684, "epoch": 2962} {"train_loss": -12.602290153503418, "global_step": 497685, "epoch": 2962} {"train_loss": -12.422074317932129, "global_step": 497686, "epoch": 2962} {"train_loss": -12.5963134765625, "global_step": 497687, "epoch": 2962} {"train_loss": -12.455047607421875, "global_step": 497688, "epoch": 2962} {"train_loss": -12.673173904418945, "global_step": 497689, "epoch": 2962} {"train_loss": -12.225839614868164, "global_step": 497690, "epoch": 2962} {"train_loss": -12.440622329711914, "global_step": 497691, "epoch": 2962} {"train_loss": -12.429946899414062, "global_step": 497692, "epoch": 2962} {"train_loss": -12.568727493286133, "global_step": 497693, "epoch": 2962} {"train_loss": -12.563535690307617, "global_step": 497694, "epoch": 2962} {"train_loss": -12.684684753417969, "global_step": 497695, "epoch": 2962} {"train_loss": -12.563629150390625, "global_step": 497696, "epoch": 2962} {"train_loss": -12.686665534973145, "global_step": 497697, "epoch": 2962} {"train_loss": -12.567136764526367, "global_step": 497698, "epoch": 2962} {"train_loss": -12.386274337768555, "global_step": 497699, "epoch": 2962} {"train_loss": -12.783805847167969, "global_step": 497700, "epoch": 2962} {"train_loss": -12.637300491333008, "global_step": 497701, "epoch": 2962} {"train_loss": -12.706308364868164, "global_step": 497702, "epoch": 2962} {"train_loss": -12.70945930480957, "global_step": 497703, "epoch": 2962} {"train_loss": -12.687459945678711, "global_step": 497704, "epoch": 2962} {"train_loss": -12.739164352416992, "global_step": 497705, "epoch": 2962} {"train_loss": -12.928979873657227, "global_step": 497706, "epoch": 2962} {"train_loss": -12.816476821899414, "global_step": 497707, "epoch": 2962} {"train_loss": -12.59825611114502, "global_step": 497708, "epoch": 2962} {"train_loss": -12.834354400634766, "global_step": 497709, "epoch": 2962} {"train_loss": -12.428613662719727, "global_step": 497710, "epoch": 2962} {"train_loss": -12.825807571411133, "global_step": 497711, "epoch": 2962} {"train_loss": -12.210517883300781, "global_step": 497712, "epoch": 2962} {"train_loss": -12.44837474822998, "global_step": 497713, "epoch": 2962} {"train_loss": -12.704183578491211, "global_step": 497714, "epoch": 2962} {"train_loss": -12.788896560668945, "global_step": 497715, "epoch": 2962} {"train_loss": -12.369342803955078, "global_step": 497716, "epoch": 2962} {"train_loss": -12.50813102722168, "global_step": 497717, "epoch": 2962} {"train_loss": -12.794597625732422, "global_step": 497718, "epoch": 2962} {"train_loss": -12.457745552062988, "global_step": 497719, "epoch": 2962} {"train_loss": -12.910233497619629, "global_step": 497720, "epoch": 2962} {"train_loss": -12.521970748901367, "global_step": 497721, "epoch": 2962} {"train_loss": -12.817937850952148, "global_step": 497722, "epoch": 2962} {"train_loss": -12.6841459274292, "global_step": 497723, "epoch": 2962} {"train_loss": -12.751056671142578, "global_step": 497724, "epoch": 2962} {"train_loss": -12.4583740234375, "global_step": 497725, "epoch": 2962} {"train_loss": -12.773759841918945, "global_step": 497726, "epoch": 2962} {"train_loss": -12.591751098632812, "global_step": 497727, "epoch": 2962} {"train_loss": -12.656390190124512, "global_step": 497728, "epoch": 2962} {"train_loss": -12.7564697265625, "global_step": 497729, "epoch": 2962} {"train_loss": -12.582688331604004, "global_step": 497730, "epoch": 2962} {"train_loss": -12.86936092376709, "global_step": 497731, "epoch": 2962} {"train_loss": -12.457515716552734, "global_step": 497732, "epoch": 2962} {"train_loss": -12.711688041687012, "global_step": 497733, "epoch": 2962} {"train_loss": -12.794179916381836, "global_step": 497734, "epoch": 2962} {"train_loss": -12.620597839355469, "global_step": 497735, "epoch": 2962} {"train_loss": -12.57596206665039, "global_step": 497736, "epoch": 2962} {"train_loss": -12.50881576538086, "global_step": 497737, "epoch": 2962} {"train_loss": -12.474443435668945, "global_step": 497738, "epoch": 2962} {"train_loss": -12.882978439331055, "global_step": 497739, "epoch": 2962} {"train_loss": -12.616203308105469, "global_step": 497740, "epoch": 2962} {"train_loss": -12.405980110168457, "global_step": 497741, "epoch": 2962} {"train_loss": -12.510353088378906, "global_step": 497742, "epoch": 2962} {"train_loss": -12.949651718139648, "global_step": 497743, "epoch": 2962} {"train_loss": -12.932693481445312, "global_step": 497744, "epoch": 2962} {"train_loss": -12.98437213897705, "global_step": 497745, "epoch": 2962} {"train_loss": -12.575003623962402, "global_step": 497746, "epoch": 2962} {"train_loss": -12.83508586883545, "global_step": 497747, "epoch": 2962} {"train_loss": -12.594411849975586, "global_step": 497748, "epoch": 2962} {"train_loss": -13.028301239013672, "global_step": 497749, "epoch": 2962} {"train_loss": -12.890472412109375, "global_step": 497750, "epoch": 2962} {"train_loss": -12.971802711486816, "global_step": 497751, "epoch": 2962} {"train_loss": -12.845769882202148, "global_step": 497752, "epoch": 2962} {"train_loss": -12.838897705078125, "global_step": 497753, "epoch": 2962} {"train_loss": -12.943777084350586, "global_step": 497754, "epoch": 2962} {"train_loss": -13.027599334716797, "global_step": 497755, "epoch": 2962} {"train_loss": -13.029563903808594, "global_step": 497756, "epoch": 2962} {"train_loss": -12.958414077758789, "global_step": 497757, "epoch": 2962} {"train_loss": -12.787683486938477, "global_step": 497758, "epoch": 2962} {"train_loss": -12.928625106811523, "global_step": 497759, "epoch": 2962} {"train_loss": -13.022623062133789, "global_step": 497760, "epoch": 2962} {"train_loss": -12.57223129272461, "global_step": 497761, "epoch": 2962} {"train_loss": -12.383447647094727, "global_step": 497762, "epoch": 2962} {"train_loss": -12.712194442749023, "global_step": 497763, "epoch": 2962} {"train_loss": -12.838499069213867, "global_step": 497764, "epoch": 2962} {"train_loss": -12.829105377197266, "global_step": 497765, "epoch": 2962} {"train_loss": -12.339405059814453, "global_step": 497766, "epoch": 2962} {"train_loss": -12.80190658569336, "global_step": 497767, "epoch": 2962} {"train_loss": -12.57379150390625, "global_step": 497768, "epoch": 2962} {"train_loss": -12.296436309814453, "global_step": 497769, "epoch": 2962} {"train_loss": -11.584809303283691, "global_step": 497770, "epoch": 2962} {"train_loss": -12.26341438293457, "global_step": 497771, "epoch": 2962} {"train_loss": -12.443753242492676, "global_step": 497772, "epoch": 2962} {"train_loss": -11.745031356811523, "global_step": 497773, "epoch": 2962} {"train_loss": -10.708968162536621, "global_step": 497774, "epoch": 2962} {"train_loss": -12.243642807006836, "global_step": 497775, "epoch": 2962} {"train_loss": -10.987353324890137, "global_step": 497776, "epoch": 2962} {"train_loss": -10.927754402160645, "global_step": 497777, "epoch": 2962} {"train_loss": -12.289064407348633, "global_step": 497778, "epoch": 2962} {"train_loss": -11.62496280670166, "global_step": 497779, "epoch": 2962} {"train_loss": -11.983302116394043, "global_step": 497780, "epoch": 2962} {"train_loss": -12.828898429870605, "global_step": 497781, "epoch": 2962} {"train_loss": -12.114911079406738, "global_step": 497782, "epoch": 2962} {"train_loss": -12.274952684129987, "global_step": 497783, "epoch": 2962, "val_loss": 318369.4375} {"train_loss": -12.510540962219238, "global_step": 497784, "epoch": 2963} {"train_loss": -11.999478340148926, "global_step": 497785, "epoch": 2963} {"train_loss": -12.490449905395508, "global_step": 497786, "epoch": 2963} {"train_loss": -12.185062408447266, "global_step": 497787, "epoch": 2963} {"train_loss": -12.355302810668945, "global_step": 497788, "epoch": 2963} {"train_loss": -12.577128410339355, "global_step": 497789, "epoch": 2963} {"train_loss": -12.55483627319336, "global_step": 497790, "epoch": 2963} {"train_loss": -12.388956069946289, "global_step": 497791, "epoch": 2963} {"train_loss": -11.970505714416504, "global_step": 497792, "epoch": 2963} {"train_loss": -12.09377670288086, "global_step": 497793, "epoch": 2963} {"train_loss": -12.400918960571289, "global_step": 497794, "epoch": 2963} {"train_loss": -10.640101432800293, "global_step": 497795, "epoch": 2963} {"train_loss": -10.37708854675293, "global_step": 497796, "epoch": 2963} {"train_loss": -11.79400634765625, "global_step": 497797, "epoch": 2963} {"train_loss": -11.239457130432129, "global_step": 497798, "epoch": 2963} {"train_loss": -11.790279388427734, "global_step": 497799, "epoch": 2963} {"train_loss": -12.141165733337402, "global_step": 497800, "epoch": 2963} {"train_loss": -11.597482681274414, "global_step": 497801, "epoch": 2963} {"train_loss": -12.073873519897461, "global_step": 497802, "epoch": 2963} {"train_loss": -11.998686790466309, "global_step": 497803, "epoch": 2963} {"train_loss": -11.378214836120605, "global_step": 497804, "epoch": 2963} {"train_loss": -10.854074478149414, "global_step": 497805, "epoch": 2963} {"train_loss": -11.50858211517334, "global_step": 497806, "epoch": 2963} {"train_loss": -10.96868896484375, "global_step": 497807, "epoch": 2963} {"train_loss": -12.0626802444458, "global_step": 497808, "epoch": 2963} {"train_loss": -11.425559043884277, "global_step": 497809, "epoch": 2963} {"train_loss": -11.621529579162598, "global_step": 497810, "epoch": 2963} {"train_loss": -12.109996795654297, "global_step": 497811, "epoch": 2963} {"train_loss": -11.703453063964844, "global_step": 497812, "epoch": 2963} {"train_loss": -12.139555931091309, "global_step": 497813, "epoch": 2963} {"train_loss": -11.561004638671875, "global_step": 497814, "epoch": 2963} {"train_loss": -12.232213973999023, "global_step": 497815, "epoch": 2963} {"train_loss": -11.81606388092041, "global_step": 497816, "epoch": 2963} {"train_loss": -12.161359786987305, "global_step": 497817, "epoch": 2963} {"train_loss": -11.855575561523438, "global_step": 497818, "epoch": 2963} {"train_loss": -11.783015251159668, "global_step": 497819, "epoch": 2963} {"train_loss": -11.781137466430664, "global_step": 497820, "epoch": 2963} {"train_loss": -11.448473930358887, "global_step": 497821, "epoch": 2963} {"train_loss": -12.107311248779297, "global_step": 497822, "epoch": 2963} {"train_loss": -11.091068267822266, "global_step": 497823, "epoch": 2963} {"train_loss": -11.88058090209961, "global_step": 497824, "epoch": 2963} {"train_loss": -11.395184516906738, "global_step": 497825, "epoch": 2963} {"train_loss": -12.312915802001953, "global_step": 497826, "epoch": 2963} {"train_loss": -11.92198371887207, "global_step": 497827, "epoch": 2963} {"train_loss": -11.664401054382324, "global_step": 497828, "epoch": 2963} {"train_loss": -11.71534252166748, "global_step": 497829, "epoch": 2963} {"train_loss": -11.723995208740234, "global_step": 497830, "epoch": 2963} {"train_loss": -12.06698989868164, "global_step": 497831, "epoch": 2963} {"train_loss": -12.599671363830566, "global_step": 497832, "epoch": 2963} {"train_loss": -11.891454696655273, "global_step": 497833, "epoch": 2963} {"train_loss": -12.707267761230469, "global_step": 497834, "epoch": 2963} {"train_loss": -12.230195999145508, "global_step": 497835, "epoch": 2963} {"train_loss": -12.631311416625977, "global_step": 497836, "epoch": 2963} {"train_loss": -12.003838539123535, "global_step": 497837, "epoch": 2963} {"train_loss": -11.831786155700684, "global_step": 497838, "epoch": 2963} {"train_loss": -12.289299964904785, "global_step": 497839, "epoch": 2963} {"train_loss": -11.966602325439453, "global_step": 497840, "epoch": 2963} {"train_loss": -12.623025894165039, "global_step": 497841, "epoch": 2963} {"train_loss": -12.265357971191406, "global_step": 497842, "epoch": 2963} {"train_loss": -12.467334747314453, "global_step": 497843, "epoch": 2963} {"train_loss": -12.57949447631836, "global_step": 497844, "epoch": 2963} {"train_loss": -12.500936508178711, "global_step": 497845, "epoch": 2963} {"train_loss": -12.194953918457031, "global_step": 497846, "epoch": 2963} {"train_loss": -12.541643142700195, "global_step": 497847, "epoch": 2963} {"train_loss": -12.553373336791992, "global_step": 497848, "epoch": 2963} {"train_loss": -12.562057495117188, "global_step": 497849, "epoch": 2963} {"train_loss": -12.521190643310547, "global_step": 497850, "epoch": 2963} {"train_loss": -12.649520874023438, "global_step": 497851, "epoch": 2963} {"train_loss": -12.59946060180664, "global_step": 497852, "epoch": 2963} {"train_loss": -12.444393157958984, "global_step": 497853, "epoch": 2963} {"train_loss": -12.731369972229004, "global_step": 497854, "epoch": 2963} {"train_loss": -12.293417930603027, "global_step": 497855, "epoch": 2963} {"train_loss": -12.398229598999023, "global_step": 497856, "epoch": 2963} {"train_loss": -12.600125312805176, "global_step": 497857, "epoch": 2963} {"train_loss": -12.555498123168945, "global_step": 497858, "epoch": 2963} {"train_loss": -12.918304443359375, "global_step": 497859, "epoch": 2963} {"train_loss": -12.04080867767334, "global_step": 497860, "epoch": 2963} {"train_loss": -12.56375503540039, "global_step": 497861, "epoch": 2963} {"train_loss": -12.685487747192383, "global_step": 497862, "epoch": 2963} {"train_loss": -12.388355255126953, "global_step": 497863, "epoch": 2963} {"train_loss": -12.850271224975586, "global_step": 497864, "epoch": 2963} {"train_loss": -12.535770416259766, "global_step": 497865, "epoch": 2963} {"train_loss": -12.19293212890625, "global_step": 497866, "epoch": 2963} {"train_loss": -12.926376342773438, "global_step": 497867, "epoch": 2963} {"train_loss": -12.243306159973145, "global_step": 497868, "epoch": 2963} {"train_loss": -12.761798858642578, "global_step": 497869, "epoch": 2963} {"train_loss": -12.307659149169922, "global_step": 497870, "epoch": 2963} {"train_loss": -12.750614166259766, "global_step": 497871, "epoch": 2963} {"train_loss": -12.437716484069824, "global_step": 497872, "epoch": 2963} {"train_loss": -12.83565902709961, "global_step": 497873, "epoch": 2963} {"train_loss": -12.772205352783203, "global_step": 497874, "epoch": 2963} {"train_loss": -12.866146087646484, "global_step": 497875, "epoch": 2963} {"train_loss": -12.804336547851562, "global_step": 497876, "epoch": 2963} {"train_loss": -12.810115814208984, "global_step": 497877, "epoch": 2963} {"train_loss": -12.712724685668945, "global_step": 497878, "epoch": 2963} {"train_loss": -12.642790794372559, "global_step": 497879, "epoch": 2963} {"train_loss": -12.738733291625977, "global_step": 497880, "epoch": 2963} {"train_loss": -12.699310302734375, "global_step": 497881, "epoch": 2963} {"train_loss": -12.776473045349121, "global_step": 497882, "epoch": 2963} {"train_loss": -12.775871276855469, "global_step": 497883, "epoch": 2963} {"train_loss": -12.80607795715332, "global_step": 497884, "epoch": 2963} {"train_loss": -12.754851341247559, "global_step": 497885, "epoch": 2963} {"train_loss": -12.899374961853027, "global_step": 497886, "epoch": 2963} {"train_loss": -12.626480102539062, "global_step": 497887, "epoch": 2963} {"train_loss": -12.698415756225586, "global_step": 497888, "epoch": 2963} {"train_loss": -12.556903839111328, "global_step": 497889, "epoch": 2963} {"train_loss": -12.811824798583984, "global_step": 497890, "epoch": 2963} {"train_loss": -12.798166275024414, "global_step": 497891, "epoch": 2963} {"train_loss": -12.544867515563965, "global_step": 497892, "epoch": 2963} {"train_loss": -12.995994567871094, "global_step": 497893, "epoch": 2963} {"train_loss": -12.497997283935547, "global_step": 497894, "epoch": 2963} {"train_loss": -12.779622077941895, "global_step": 497895, "epoch": 2963} {"train_loss": -12.727245330810547, "global_step": 497896, "epoch": 2963} {"train_loss": -12.73641586303711, "global_step": 497897, "epoch": 2963} {"train_loss": -12.460999488830566, "global_step": 497898, "epoch": 2963} {"train_loss": -12.776089668273926, "global_step": 497899, "epoch": 2963} {"train_loss": -12.799168586730957, "global_step": 497900, "epoch": 2963} {"train_loss": -12.929483413696289, "global_step": 497901, "epoch": 2963} {"train_loss": -12.550703048706055, "global_step": 497902, "epoch": 2963} {"train_loss": -12.905648231506348, "global_step": 497903, "epoch": 2963} {"train_loss": -12.452337265014648, "global_step": 497904, "epoch": 2963} {"train_loss": -12.786212921142578, "global_step": 497905, "epoch": 2963} {"train_loss": -12.60890007019043, "global_step": 497906, "epoch": 2963} {"train_loss": -12.855759620666504, "global_step": 497907, "epoch": 2963} {"train_loss": -12.904909133911133, "global_step": 497908, "epoch": 2963} {"train_loss": -12.910717964172363, "global_step": 497909, "epoch": 2963} {"train_loss": -12.343477249145508, "global_step": 497910, "epoch": 2963} {"train_loss": -12.689515113830566, "global_step": 497911, "epoch": 2963} {"train_loss": -12.302635192871094, "global_step": 497912, "epoch": 2963} {"train_loss": -12.026182174682617, "global_step": 497913, "epoch": 2963} {"train_loss": -12.701004028320312, "global_step": 497914, "epoch": 2963} {"train_loss": -11.408393859863281, "global_step": 497915, "epoch": 2963} {"train_loss": -11.65237045288086, "global_step": 497916, "epoch": 2963} {"train_loss": -12.18021011352539, "global_step": 497917, "epoch": 2963} {"train_loss": -11.370731353759766, "global_step": 497918, "epoch": 2963} {"train_loss": -10.618492126464844, "global_step": 497919, "epoch": 2963} {"train_loss": -12.420580863952637, "global_step": 497920, "epoch": 2963} {"train_loss": -10.648008346557617, "global_step": 497921, "epoch": 2963} {"train_loss": -11.740715026855469, "global_step": 497922, "epoch": 2963} {"train_loss": -11.696592330932617, "global_step": 497923, "epoch": 2963} {"train_loss": -9.327322006225586, "global_step": 497924, "epoch": 2963} {"train_loss": -10.162898063659668, "global_step": 497925, "epoch": 2963} {"train_loss": -10.683795928955078, "global_step": 497926, "epoch": 2963} {"train_loss": -10.41884994506836, "global_step": 497927, "epoch": 2963} {"train_loss": -10.870670318603516, "global_step": 497928, "epoch": 2963} {"train_loss": -11.156576156616211, "global_step": 497929, "epoch": 2963} {"train_loss": -9.587308883666992, "global_step": 497930, "epoch": 2963} {"train_loss": -11.493267059326172, "global_step": 497931, "epoch": 2963} {"train_loss": -11.074849128723145, "global_step": 497932, "epoch": 2963} {"train_loss": -11.453226089477539, "global_step": 497933, "epoch": 2963} {"train_loss": -11.592008590698242, "global_step": 497934, "epoch": 2963} {"train_loss": -11.835865020751953, "global_step": 497935, "epoch": 2963} {"train_loss": -11.674724578857422, "global_step": 497936, "epoch": 2963} {"train_loss": -10.706344604492188, "global_step": 497937, "epoch": 2963} {"train_loss": -12.071270942687988, "global_step": 497938, "epoch": 2963} {"train_loss": -10.585504531860352, "global_step": 497939, "epoch": 2963} {"train_loss": -12.0587797164917, "global_step": 497940, "epoch": 2963} {"train_loss": -11.205114364624023, "global_step": 497941, "epoch": 2963} {"train_loss": -11.552498817443848, "global_step": 497942, "epoch": 2963} {"train_loss": -11.494232177734375, "global_step": 497943, "epoch": 2963} {"train_loss": -11.50037956237793, "global_step": 497944, "epoch": 2963} {"train_loss": -11.737226486206055, "global_step": 497945, "epoch": 2963} {"train_loss": -11.635759353637695, "global_step": 497946, "epoch": 2963} {"train_loss": -11.850912094116211, "global_step": 497947, "epoch": 2963} {"train_loss": -11.222871780395508, "global_step": 497948, "epoch": 2963} {"train_loss": -11.580583572387695, "global_step": 497949, "epoch": 2963} {"train_loss": -11.744902610778809, "global_step": 497950, "epoch": 2963} {"train_loss": -12.081754218964349, "global_step": 497951, "epoch": 2963, "val_loss": 318831.6875} {"train_loss": -11.840539932250977, "global_step": 497952, "epoch": 2964} {"train_loss": -10.424015045166016, "global_step": 497953, "epoch": 2964} {"train_loss": -11.570045471191406, "global_step": 497954, "epoch": 2964} {"train_loss": -11.537843704223633, "global_step": 497955, "epoch": 2964} {"train_loss": -11.53358268737793, "global_step": 497956, "epoch": 2964} {"train_loss": -12.59278678894043, "global_step": 497957, "epoch": 2964} {"train_loss": -11.53749942779541, "global_step": 497958, "epoch": 2964} {"train_loss": -12.192678451538086, "global_step": 497959, "epoch": 2964} {"train_loss": -11.923040390014648, "global_step": 497960, "epoch": 2964} {"train_loss": -11.698529243469238, "global_step": 497961, "epoch": 2964} {"train_loss": -12.255537033081055, "global_step": 497962, "epoch": 2964} {"train_loss": -11.280399322509766, "global_step": 497963, "epoch": 2964} {"train_loss": -12.303929328918457, "global_step": 497964, "epoch": 2964} {"train_loss": -11.575794219970703, "global_step": 497965, "epoch": 2964} {"train_loss": -11.613909721374512, "global_step": 497966, "epoch": 2964} {"train_loss": -11.104310035705566, "global_step": 497967, "epoch": 2964} {"train_loss": -11.975920677185059, "global_step": 497968, "epoch": 2964} {"train_loss": -11.473444938659668, "global_step": 497969, "epoch": 2964} {"train_loss": -12.204193115234375, "global_step": 497970, "epoch": 2964} {"train_loss": -11.756706237792969, "global_step": 497971, "epoch": 2964} {"train_loss": -12.36864948272705, "global_step": 497972, "epoch": 2964} {"train_loss": -12.30362319946289, "global_step": 497973, "epoch": 2964} {"train_loss": -12.035734176635742, "global_step": 497974, "epoch": 2964} {"train_loss": -11.939855575561523, "global_step": 497975, "epoch": 2964} {"train_loss": -12.59416389465332, "global_step": 497976, "epoch": 2964} {"train_loss": -12.208479881286621, "global_step": 497977, "epoch": 2964} {"train_loss": -12.447174072265625, "global_step": 497978, "epoch": 2964} {"train_loss": -12.46851634979248, "global_step": 497979, "epoch": 2964} {"train_loss": -12.539512634277344, "global_step": 497980, "epoch": 2964} {"train_loss": -12.282537460327148, "global_step": 497981, "epoch": 2964} {"train_loss": -12.281564712524414, "global_step": 497982, "epoch": 2964} {"train_loss": -12.441915512084961, "global_step": 497983, "epoch": 2964} {"train_loss": -12.576522827148438, "global_step": 497984, "epoch": 2964} {"train_loss": -12.306118965148926, "global_step": 497985, "epoch": 2964} {"train_loss": -12.569965362548828, "global_step": 497986, "epoch": 2964} {"train_loss": -12.377018928527832, "global_step": 497987, "epoch": 2964} {"train_loss": -12.357987403869629, "global_step": 497988, "epoch": 2964} {"train_loss": -12.577125549316406, "global_step": 497989, "epoch": 2964} {"train_loss": -12.441425323486328, "global_step": 497990, "epoch": 2964} {"train_loss": -12.742138862609863, "global_step": 497991, "epoch": 2964} {"train_loss": -12.389406204223633, "global_step": 497992, "epoch": 2964} {"train_loss": -12.309242248535156, "global_step": 497993, "epoch": 2964} {"train_loss": -12.588082313537598, "global_step": 497994, "epoch": 2964} {"train_loss": -12.117570877075195, "global_step": 497995, "epoch": 2964} {"train_loss": -12.903770446777344, "global_step": 497996, "epoch": 2964} {"train_loss": -12.45033073425293, "global_step": 497997, "epoch": 2964} {"train_loss": -12.627745628356934, "global_step": 497998, "epoch": 2964} {"train_loss": -12.827973365783691, "global_step": 497999, "epoch": 2964} {"train_loss": -12.49324893951416, "global_step": 498000, "epoch": 2964} {"train_loss": -12.627908706665039, "global_step": 498001, "epoch": 2964} {"train_loss": -12.242192268371582, "global_step": 498002, "epoch": 2964} {"train_loss": -12.621753692626953, "global_step": 498003, "epoch": 2964} {"train_loss": -12.427614212036133, "global_step": 498004, "epoch": 2964} {"train_loss": -12.470335006713867, "global_step": 498005, "epoch": 2964} {"train_loss": -12.38644027709961, "global_step": 498006, "epoch": 2964} {"train_loss": -12.779441833496094, "global_step": 498007, "epoch": 2964} {"train_loss": -12.519580841064453, "global_step": 498008, "epoch": 2964} {"train_loss": -12.665319442749023, "global_step": 498009, "epoch": 2964} {"train_loss": -12.725017547607422, "global_step": 498010, "epoch": 2964} {"train_loss": -12.592971801757812, "global_step": 498011, "epoch": 2964} {"train_loss": -12.808586120605469, "global_step": 498012, "epoch": 2964} {"train_loss": -12.705168724060059, "global_step": 498013, "epoch": 2964} {"train_loss": -12.80577278137207, "global_step": 498014, "epoch": 2964} {"train_loss": -12.647232055664062, "global_step": 498015, "epoch": 2964} {"train_loss": -12.661683082580566, "global_step": 498016, "epoch": 2964} {"train_loss": -12.793639183044434, "global_step": 498017, "epoch": 2964} {"train_loss": -12.843968391418457, "global_step": 498018, "epoch": 2964} {"train_loss": -12.95480728149414, "global_step": 498019, "epoch": 2964} {"train_loss": -12.878549575805664, "global_step": 498020, "epoch": 2964} {"train_loss": -12.693855285644531, "global_step": 498021, "epoch": 2964} {"train_loss": -12.82709789276123, "global_step": 498022, "epoch": 2964} {"train_loss": -12.633763313293457, "global_step": 498023, "epoch": 2964} {"train_loss": -12.769701957702637, "global_step": 498024, "epoch": 2964} {"train_loss": -12.540063858032227, "global_step": 498025, "epoch": 2964} {"train_loss": -12.82480239868164, "global_step": 498026, "epoch": 2964} {"train_loss": -12.762685775756836, "global_step": 498027, "epoch": 2964} {"train_loss": -12.906336784362793, "global_step": 498028, "epoch": 2964} {"train_loss": -12.585746765136719, "global_step": 498029, "epoch": 2964} {"train_loss": -12.769731521606445, "global_step": 498030, "epoch": 2964} {"train_loss": -12.66178035736084, "global_step": 498031, "epoch": 2964} {"train_loss": -12.970963478088379, "global_step": 498032, "epoch": 2964} {"train_loss": -12.883474349975586, "global_step": 498033, "epoch": 2964} {"train_loss": -13.136362075805664, "global_step": 498034, "epoch": 2964} {"train_loss": -13.087213516235352, "global_step": 498035, "epoch": 2964} {"train_loss": -12.937030792236328, "global_step": 498036, "epoch": 2964} {"train_loss": -12.875118255615234, "global_step": 498037, "epoch": 2964} {"train_loss": -12.917441368103027, "global_step": 498038, "epoch": 2964} {"train_loss": -12.939718246459961, "global_step": 498039, "epoch": 2964} {"train_loss": -12.936441421508789, "global_step": 498040, "epoch": 2964} {"train_loss": -12.948392868041992, "global_step": 498041, "epoch": 2964} {"train_loss": -12.816234588623047, "global_step": 498042, "epoch": 2964} {"train_loss": -12.841551780700684, "global_step": 498043, "epoch": 2964} {"train_loss": -12.754997253417969, "global_step": 498044, "epoch": 2964} {"train_loss": -12.942795753479004, "global_step": 498045, "epoch": 2964} {"train_loss": -12.98807144165039, "global_step": 498046, "epoch": 2964} {"train_loss": -12.907940864562988, "global_step": 498047, "epoch": 2964} {"train_loss": -12.658105850219727, "global_step": 498048, "epoch": 2964} {"train_loss": -13.043046951293945, "global_step": 498049, "epoch": 2964} {"train_loss": -12.898283958435059, "global_step": 498050, "epoch": 2964} {"train_loss": -12.959994316101074, "global_step": 498051, "epoch": 2964} {"train_loss": -12.716388702392578, "global_step": 498052, "epoch": 2964} {"train_loss": -12.658514022827148, "global_step": 498053, "epoch": 2964} {"train_loss": -12.822280883789062, "global_step": 498054, "epoch": 2964} {"train_loss": -12.935275077819824, "global_step": 498055, "epoch": 2964} {"train_loss": -12.771200180053711, "global_step": 498056, "epoch": 2964} {"train_loss": -12.961267471313477, "global_step": 498057, "epoch": 2964} {"train_loss": -12.786956787109375, "global_step": 498058, "epoch": 2964} {"train_loss": -13.00389289855957, "global_step": 498059, "epoch": 2964} {"train_loss": -12.886382102966309, "global_step": 498060, "epoch": 2964} {"train_loss": -12.965824127197266, "global_step": 498061, "epoch": 2964} {"train_loss": -12.793354034423828, "global_step": 498062, "epoch": 2964} {"train_loss": -13.185908317565918, "global_step": 498063, "epoch": 2964} {"train_loss": -12.53506088256836, "global_step": 498064, "epoch": 2964} {"train_loss": -12.270735740661621, "global_step": 498065, "epoch": 2964} {"train_loss": -12.989752769470215, "global_step": 498066, "epoch": 2964} {"train_loss": -12.320419311523438, "global_step": 498067, "epoch": 2964} {"train_loss": -12.0081787109375, "global_step": 498068, "epoch": 2964} {"train_loss": -12.37153434753418, "global_step": 498069, "epoch": 2964} {"train_loss": -12.172005653381348, "global_step": 498070, "epoch": 2964} {"train_loss": -11.298264503479004, "global_step": 498071, "epoch": 2964} {"train_loss": -11.81733226776123, "global_step": 498072, "epoch": 2964} {"train_loss": -12.476640701293945, "global_step": 498073, "epoch": 2964} {"train_loss": -12.457767486572266, "global_step": 498074, "epoch": 2964} {"train_loss": -12.663148880004883, "global_step": 498075, "epoch": 2964} {"train_loss": -11.926530838012695, "global_step": 498076, "epoch": 2964} {"train_loss": -11.518082618713379, "global_step": 498077, "epoch": 2964} {"train_loss": -10.606109619140625, "global_step": 498078, "epoch": 2964} {"train_loss": -11.478014945983887, "global_step": 498079, "epoch": 2964} {"train_loss": -10.001503944396973, "global_step": 498080, "epoch": 2964} {"train_loss": -9.954434394836426, "global_step": 498081, "epoch": 2964} {"train_loss": -9.914651870727539, "global_step": 498082, "epoch": 2964} {"train_loss": -11.309355735778809, "global_step": 498083, "epoch": 2964} {"train_loss": -9.414680480957031, "global_step": 498084, "epoch": 2964} {"train_loss": -11.04288101196289, "global_step": 498085, "epoch": 2964} {"train_loss": -9.089362144470215, "global_step": 498086, "epoch": 2964} {"train_loss": -8.731700897216797, "global_step": 498087, "epoch": 2964} {"train_loss": -8.400912284851074, "global_step": 498088, "epoch": 2964} {"train_loss": -7.875030517578125, "global_step": 498089, "epoch": 2964} {"train_loss": -8.306264877319336, "global_step": 498090, "epoch": 2964} {"train_loss": -9.30644416809082, "global_step": 498091, "epoch": 2964} {"train_loss": -8.590351104736328, "global_step": 498092, "epoch": 2964} {"train_loss": -10.067216873168945, "global_step": 498093, "epoch": 2964} {"train_loss": -8.51721477508545, "global_step": 498094, "epoch": 2964} {"train_loss": -10.00900650024414, "global_step": 498095, "epoch": 2964} {"train_loss": -10.62784481048584, "global_step": 498096, "epoch": 2964} {"train_loss": -9.206188201904297, "global_step": 498097, "epoch": 2964} {"train_loss": -9.364202499389648, "global_step": 498098, "epoch": 2964} {"train_loss": -10.950725555419922, "global_step": 498099, "epoch": 2964} {"train_loss": -10.269392013549805, "global_step": 498100, "epoch": 2964} {"train_loss": -11.32800579071045, "global_step": 498101, "epoch": 2964} {"train_loss": -10.334396362304688, "global_step": 498102, "epoch": 2964} {"train_loss": -11.52332878112793, "global_step": 498103, "epoch": 2964} {"train_loss": -10.193023681640625, "global_step": 498104, "epoch": 2964} {"train_loss": -11.117767333984375, "global_step": 498105, "epoch": 2964} {"train_loss": -11.400912284851074, "global_step": 498106, "epoch": 2964} {"train_loss": -11.260022163391113, "global_step": 498107, "epoch": 2964} {"train_loss": -10.710927963256836, "global_step": 498108, "epoch": 2964} {"train_loss": -11.345434188842773, "global_step": 498109, "epoch": 2964} {"train_loss": -10.64573860168457, "global_step": 498110, "epoch": 2964} {"train_loss": -10.881633758544922, "global_step": 498111, "epoch": 2964} {"train_loss": -10.912505149841309, "global_step": 498112, "epoch": 2964} {"train_loss": -11.342561721801758, "global_step": 498113, "epoch": 2964} {"train_loss": -11.549854278564453, "global_step": 498114, "epoch": 2964} {"train_loss": -11.811702728271484, "global_step": 498115, "epoch": 2964} {"train_loss": -11.325679779052734, "global_step": 498116, "epoch": 2964} {"train_loss": -11.923576354980469, "global_step": 498117, "epoch": 2964} {"train_loss": -11.513391494750977, "global_step": 498118, "epoch": 2964} {"train_loss": -11.951694386346, "global_step": 498119, "epoch": 2964, "val_loss": 313679.78125} {"train_loss": -11.751434326171875, "global_step": 498120, "epoch": 2965} {"train_loss": -12.062999725341797, "global_step": 498121, "epoch": 2965} {"train_loss": -11.415763854980469, "global_step": 498122, "epoch": 2965} {"train_loss": -12.202705383300781, "global_step": 498123, "epoch": 2965} {"train_loss": -11.386234283447266, "global_step": 498124, "epoch": 2965} {"train_loss": -12.08767318725586, "global_step": 498125, "epoch": 2965} {"train_loss": -11.822256088256836, "global_step": 498126, "epoch": 2965} {"train_loss": -11.680658340454102, "global_step": 498127, "epoch": 2965} {"train_loss": -11.943683624267578, "global_step": 498128, "epoch": 2965} {"train_loss": -12.156438827514648, "global_step": 498129, "epoch": 2965} {"train_loss": -11.843564987182617, "global_step": 498130, "epoch": 2965} {"train_loss": -12.365044593811035, "global_step": 498131, "epoch": 2965} {"train_loss": -12.215507507324219, "global_step": 498132, "epoch": 2965} {"train_loss": -12.077656745910645, "global_step": 498133, "epoch": 2965} {"train_loss": -12.554210662841797, "global_step": 498134, "epoch": 2965} {"train_loss": -11.81586742401123, "global_step": 498135, "epoch": 2965} {"train_loss": -12.265892028808594, "global_step": 498136, "epoch": 2965} {"train_loss": -12.034461975097656, "global_step": 498137, "epoch": 2965} {"train_loss": -12.339508056640625, "global_step": 498138, "epoch": 2965} {"train_loss": -12.383045196533203, "global_step": 498139, "epoch": 2965} {"train_loss": -12.424068450927734, "global_step": 498140, "epoch": 2965} {"train_loss": -12.1490478515625, "global_step": 498141, "epoch": 2965} {"train_loss": -12.551542282104492, "global_step": 498142, "epoch": 2965} {"train_loss": -12.444921493530273, "global_step": 498143, "epoch": 2965} {"train_loss": -12.337186813354492, "global_step": 498144, "epoch": 2965} {"train_loss": -12.206158638000488, "global_step": 498145, "epoch": 2965} {"train_loss": -12.41008186340332, "global_step": 498146, "epoch": 2965} {"train_loss": -12.556241989135742, "global_step": 498147, "epoch": 2965} {"train_loss": -12.538322448730469, "global_step": 498148, "epoch": 2965} {"train_loss": -12.47245979309082, "global_step": 498149, "epoch": 2965} {"train_loss": -12.376545906066895, "global_step": 498150, "epoch": 2965} {"train_loss": -12.364136695861816, "global_step": 498151, "epoch": 2965} {"train_loss": -12.706440925598145, "global_step": 498152, "epoch": 2965} {"train_loss": -12.29655647277832, "global_step": 498153, "epoch": 2965} {"train_loss": -12.44875717163086, "global_step": 498154, "epoch": 2965} {"train_loss": -12.622579574584961, "global_step": 498155, "epoch": 2965} {"train_loss": -12.63602066040039, "global_step": 498156, "epoch": 2965} {"train_loss": -12.61884880065918, "global_step": 498157, "epoch": 2965} {"train_loss": -12.519109725952148, "global_step": 498158, "epoch": 2965} {"train_loss": -12.500121116638184, "global_step": 498159, "epoch": 2965} {"train_loss": -12.476042747497559, "global_step": 498160, "epoch": 2965} {"train_loss": -12.637083053588867, "global_step": 498161, "epoch": 2965} {"train_loss": -12.717170715332031, "global_step": 498162, "epoch": 2965} {"train_loss": -12.637880325317383, "global_step": 498163, "epoch": 2965} {"train_loss": -12.592535018920898, "global_step": 498164, "epoch": 2965} {"train_loss": -12.125715255737305, "global_step": 498165, "epoch": 2965} {"train_loss": -12.556045532226562, "global_step": 498166, "epoch": 2965} {"train_loss": -12.312784194946289, "global_step": 498167, "epoch": 2965} {"train_loss": -12.572626113891602, "global_step": 498168, "epoch": 2965} {"train_loss": -11.972454071044922, "global_step": 498169, "epoch": 2965} {"train_loss": -11.748454093933105, "global_step": 498170, "epoch": 2965} {"train_loss": -12.446501731872559, "global_step": 498171, "epoch": 2965} {"train_loss": -12.225922584533691, "global_step": 498172, "epoch": 2965} {"train_loss": -12.707674980163574, "global_step": 498173, "epoch": 2965} {"train_loss": -12.417147636413574, "global_step": 498174, "epoch": 2965} {"train_loss": -12.266233444213867, "global_step": 498175, "epoch": 2965} {"train_loss": -12.75607967376709, "global_step": 498176, "epoch": 2965} {"train_loss": -12.123588562011719, "global_step": 498177, "epoch": 2965} {"train_loss": -12.221057891845703, "global_step": 498178, "epoch": 2965} {"train_loss": -12.583133697509766, "global_step": 498179, "epoch": 2965} {"train_loss": -12.12691879272461, "global_step": 498180, "epoch": 2965} {"train_loss": -12.052448272705078, "global_step": 498181, "epoch": 2965} {"train_loss": -12.484004974365234, "global_step": 498182, "epoch": 2965} {"train_loss": -12.035360336303711, "global_step": 498183, "epoch": 2965} {"train_loss": -12.436840057373047, "global_step": 498184, "epoch": 2965} {"train_loss": -12.478187561035156, "global_step": 498185, "epoch": 2965} {"train_loss": -12.336555480957031, "global_step": 498186, "epoch": 2965} {"train_loss": -12.232864379882812, "global_step": 498187, "epoch": 2965} {"train_loss": -12.562322616577148, "global_step": 498188, "epoch": 2965} {"train_loss": -11.704548835754395, "global_step": 498189, "epoch": 2965} {"train_loss": -12.430046081542969, "global_step": 498190, "epoch": 2965} {"train_loss": -12.2073974609375, "global_step": 498191, "epoch": 2965} {"train_loss": -11.042303085327148, "global_step": 498192, "epoch": 2965} {"train_loss": -12.204545974731445, "global_step": 498193, "epoch": 2965} {"train_loss": -12.263336181640625, "global_step": 498194, "epoch": 2965} {"train_loss": -12.790206909179688, "global_step": 498195, "epoch": 2965} {"train_loss": -12.32227611541748, "global_step": 498196, "epoch": 2965} {"train_loss": -12.805883407592773, "global_step": 498197, "epoch": 2965} {"train_loss": -12.625374794006348, "global_step": 498198, "epoch": 2965} {"train_loss": -12.542034149169922, "global_step": 498199, "epoch": 2965} {"train_loss": -12.690587997436523, "global_step": 498200, "epoch": 2965} {"train_loss": -12.524717330932617, "global_step": 498201, "epoch": 2965} {"train_loss": -12.713865280151367, "global_step": 498202, "epoch": 2965} {"train_loss": -11.95574951171875, "global_step": 498203, "epoch": 2965} {"train_loss": -12.476380348205566, "global_step": 498204, "epoch": 2965} {"train_loss": -12.135560989379883, "global_step": 498205, "epoch": 2965} {"train_loss": -12.402752876281738, "global_step": 498206, "epoch": 2965} {"train_loss": -12.359883308410645, "global_step": 498207, "epoch": 2965} {"train_loss": -12.417379379272461, "global_step": 498208, "epoch": 2965} {"train_loss": -11.93612289428711, "global_step": 498209, "epoch": 2965} {"train_loss": -11.686853408813477, "global_step": 498210, "epoch": 2965} {"train_loss": -11.509899139404297, "global_step": 498211, "epoch": 2965} {"train_loss": -11.930121421813965, "global_step": 498212, "epoch": 2965} {"train_loss": -11.44205093383789, "global_step": 498213, "epoch": 2965} {"train_loss": -11.261734962463379, "global_step": 498214, "epoch": 2965} {"train_loss": -11.978536605834961, "global_step": 498215, "epoch": 2965} {"train_loss": -11.430680274963379, "global_step": 498216, "epoch": 2965} {"train_loss": -12.13393783569336, "global_step": 498217, "epoch": 2965} {"train_loss": -11.450912475585938, "global_step": 498218, "epoch": 2965} {"train_loss": -11.390432357788086, "global_step": 498219, "epoch": 2965} {"train_loss": -12.48694896697998, "global_step": 498220, "epoch": 2965} {"train_loss": -11.354959487915039, "global_step": 498221, "epoch": 2965} {"train_loss": -11.70248031616211, "global_step": 498222, "epoch": 2965} {"train_loss": -11.858856201171875, "global_step": 498223, "epoch": 2965} {"train_loss": -11.253274917602539, "global_step": 498224, "epoch": 2965} {"train_loss": -11.956077575683594, "global_step": 498225, "epoch": 2965} {"train_loss": -12.428206443786621, "global_step": 498226, "epoch": 2965} {"train_loss": -12.76072883605957, "global_step": 498227, "epoch": 2965} {"train_loss": -12.243025779724121, "global_step": 498228, "epoch": 2965} {"train_loss": -12.49176025390625, "global_step": 498229, "epoch": 2965} {"train_loss": -12.378416061401367, "global_step": 498230, "epoch": 2965} {"train_loss": -12.43017292022705, "global_step": 498231, "epoch": 2965} {"train_loss": -12.229016304016113, "global_step": 498232, "epoch": 2965} {"train_loss": -12.840755462646484, "global_step": 498233, "epoch": 2965} {"train_loss": -12.35757064819336, "global_step": 498234, "epoch": 2965} {"train_loss": -12.391392707824707, "global_step": 498235, "epoch": 2965} {"train_loss": -12.585548400878906, "global_step": 498236, "epoch": 2965} {"train_loss": -12.191337585449219, "global_step": 498237, "epoch": 2965} {"train_loss": -12.412494659423828, "global_step": 498238, "epoch": 2965} {"train_loss": -11.766411781311035, "global_step": 498239, "epoch": 2965} {"train_loss": -12.659452438354492, "global_step": 498240, "epoch": 2965} {"train_loss": -12.383733749389648, "global_step": 498241, "epoch": 2965} {"train_loss": -12.672417640686035, "global_step": 498242, "epoch": 2965} {"train_loss": -12.245893478393555, "global_step": 498243, "epoch": 2965} {"train_loss": -12.560415267944336, "global_step": 498244, "epoch": 2965} {"train_loss": -12.774332046508789, "global_step": 498245, "epoch": 2965} {"train_loss": -12.577875137329102, "global_step": 498246, "epoch": 2965} {"train_loss": -12.585144996643066, "global_step": 498247, "epoch": 2965} {"train_loss": -12.291780471801758, "global_step": 498248, "epoch": 2965} {"train_loss": -12.762191772460938, "global_step": 498249, "epoch": 2965} {"train_loss": -12.556020736694336, "global_step": 498250, "epoch": 2965} {"train_loss": -12.588552474975586, "global_step": 498251, "epoch": 2965} {"train_loss": -12.503316879272461, "global_step": 498252, "epoch": 2965} {"train_loss": -12.79565715789795, "global_step": 498253, "epoch": 2965} {"train_loss": -12.3319673538208, "global_step": 498254, "epoch": 2965} {"train_loss": -11.957837104797363, "global_step": 498255, "epoch": 2965} {"train_loss": -12.576391220092773, "global_step": 498256, "epoch": 2965} {"train_loss": -12.674821853637695, "global_step": 498257, "epoch": 2965} {"train_loss": -11.584665298461914, "global_step": 498258, "epoch": 2965} {"train_loss": -12.662425994873047, "global_step": 498259, "epoch": 2965} {"train_loss": -12.09904670715332, "global_step": 498260, "epoch": 2965} {"train_loss": -11.958494186401367, "global_step": 498261, "epoch": 2965} {"train_loss": -12.554906845092773, "global_step": 498262, "epoch": 2965} {"train_loss": -11.704967498779297, "global_step": 498263, "epoch": 2965} {"train_loss": -12.765559196472168, "global_step": 498264, "epoch": 2965} {"train_loss": -11.878986358642578, "global_step": 498265, "epoch": 2965} {"train_loss": -12.737458229064941, "global_step": 498266, "epoch": 2965} {"train_loss": -12.049378395080566, "global_step": 498267, "epoch": 2965} {"train_loss": -12.335304260253906, "global_step": 498268, "epoch": 2965} {"train_loss": -12.045705795288086, "global_step": 498269, "epoch": 2965} {"train_loss": -11.65472412109375, "global_step": 498270, "epoch": 2965} {"train_loss": -12.602807998657227, "global_step": 498271, "epoch": 2965} {"train_loss": -11.368673324584961, "global_step": 498272, "epoch": 2965} {"train_loss": -12.388360977172852, "global_step": 498273, "epoch": 2965} {"train_loss": -11.313541412353516, "global_step": 498274, "epoch": 2965} {"train_loss": -11.648385047912598, "global_step": 498275, "epoch": 2965} {"train_loss": -11.543596267700195, "global_step": 498276, "epoch": 2965} {"train_loss": -11.70962905883789, "global_step": 498277, "epoch": 2965} {"train_loss": -12.525413513183594, "global_step": 498278, "epoch": 2965} {"train_loss": -12.083871841430664, "global_step": 498279, "epoch": 2965} {"train_loss": -12.289938926696777, "global_step": 498280, "epoch": 2965} {"train_loss": -12.247917175292969, "global_step": 498281, "epoch": 2965} {"train_loss": -12.596294403076172, "global_step": 498282, "epoch": 2965} {"train_loss": -12.44231128692627, "global_step": 498283, "epoch": 2965} {"train_loss": -12.666841506958008, "global_step": 498284, "epoch": 2965} {"train_loss": -12.682738304138184, "global_step": 498285, "epoch": 2965} {"train_loss": -12.541115760803223, "global_step": 498286, "epoch": 2965} {"train_loss": -12.249462689672198, "global_step": 498287, "epoch": 2965, "val_loss": 319408.40625, "train_action_mse_error": 1.4880770444869995} {"train_loss": -12.464401245117188, "global_step": 498288, "epoch": 2966} {"train_loss": -12.824773788452148, "global_step": 498289, "epoch": 2966} {"train_loss": -12.5052490234375, "global_step": 498290, "epoch": 2966} {"train_loss": -12.455835342407227, "global_step": 498291, "epoch": 2966} {"train_loss": -12.742208480834961, "global_step": 498292, "epoch": 2966} {"train_loss": -12.064716339111328, "global_step": 498293, "epoch": 2966} {"train_loss": -12.299814224243164, "global_step": 498294, "epoch": 2966} {"train_loss": -11.933788299560547, "global_step": 498295, "epoch": 2966} {"train_loss": -12.344440460205078, "global_step": 498296, "epoch": 2966} {"train_loss": -11.825016021728516, "global_step": 498297, "epoch": 2966} {"train_loss": -12.150550842285156, "global_step": 498298, "epoch": 2966} {"train_loss": -11.925617218017578, "global_step": 498299, "epoch": 2966} {"train_loss": -11.455039024353027, "global_step": 498300, "epoch": 2966} {"train_loss": -12.701353073120117, "global_step": 498301, "epoch": 2966} {"train_loss": -11.926935195922852, "global_step": 498302, "epoch": 2966} {"train_loss": -12.53671646118164, "global_step": 498303, "epoch": 2966} {"train_loss": -12.052331924438477, "global_step": 498304, "epoch": 2966} {"train_loss": -12.499833106994629, "global_step": 498305, "epoch": 2966} {"train_loss": -12.478729248046875, "global_step": 498306, "epoch": 2966} {"train_loss": -12.280067443847656, "global_step": 498307, "epoch": 2966} {"train_loss": -12.573938369750977, "global_step": 498308, "epoch": 2966} {"train_loss": -12.399744033813477, "global_step": 498309, "epoch": 2966} {"train_loss": -12.643142700195312, "global_step": 498310, "epoch": 2966} {"train_loss": -12.328787803649902, "global_step": 498311, "epoch": 2966} {"train_loss": -12.491418838500977, "global_step": 498312, "epoch": 2966} {"train_loss": -12.549782752990723, "global_step": 498313, "epoch": 2966} {"train_loss": -12.301836013793945, "global_step": 498314, "epoch": 2966} {"train_loss": -12.264566421508789, "global_step": 498315, "epoch": 2966} {"train_loss": -12.288910865783691, "global_step": 498316, "epoch": 2966} {"train_loss": -12.231624603271484, "global_step": 498317, "epoch": 2966} {"train_loss": -12.377975463867188, "global_step": 498318, "epoch": 2966} {"train_loss": -12.536590576171875, "global_step": 498319, "epoch": 2966} {"train_loss": -12.488576889038086, "global_step": 498320, "epoch": 2966} {"train_loss": -12.150289535522461, "global_step": 498321, "epoch": 2966} {"train_loss": -12.495017051696777, "global_step": 498322, "epoch": 2966} {"train_loss": -11.965351104736328, "global_step": 498323, "epoch": 2966} {"train_loss": -12.351306915283203, "global_step": 498324, "epoch": 2966} {"train_loss": -12.53962516784668, "global_step": 498325, "epoch": 2966} {"train_loss": -12.504837036132812, "global_step": 498326, "epoch": 2966} {"train_loss": -12.898843765258789, "global_step": 498327, "epoch": 2966} {"train_loss": -12.162074089050293, "global_step": 498328, "epoch": 2966} {"train_loss": -12.799710273742676, "global_step": 498329, "epoch": 2966} {"train_loss": -12.467758178710938, "global_step": 498330, "epoch": 2966} {"train_loss": -12.605693817138672, "global_step": 498331, "epoch": 2966} {"train_loss": -12.525725364685059, "global_step": 498332, "epoch": 2966} {"train_loss": -12.221561431884766, "global_step": 498333, "epoch": 2966} {"train_loss": -12.369460105895996, "global_step": 498334, "epoch": 2966} {"train_loss": -12.531476974487305, "global_step": 498335, "epoch": 2966} {"train_loss": -11.884393692016602, "global_step": 498336, "epoch": 2966} {"train_loss": -12.150598526000977, "global_step": 498337, "epoch": 2966} {"train_loss": -12.521377563476562, "global_step": 498338, "epoch": 2966} {"train_loss": -11.759674072265625, "global_step": 498339, "epoch": 2966} {"train_loss": -12.368579864501953, "global_step": 498340, "epoch": 2966} {"train_loss": -12.155427932739258, "global_step": 498341, "epoch": 2966} {"train_loss": -12.504755020141602, "global_step": 498342, "epoch": 2966} {"train_loss": -12.715328216552734, "global_step": 498343, "epoch": 2966} {"train_loss": -12.637964248657227, "global_step": 498344, "epoch": 2966} {"train_loss": -12.281042098999023, "global_step": 498345, "epoch": 2966} {"train_loss": -12.550344467163086, "global_step": 498346, "epoch": 2966} {"train_loss": -12.587417602539062, "global_step": 498347, "epoch": 2966} {"train_loss": -12.403132438659668, "global_step": 498348, "epoch": 2966} {"train_loss": -12.79007625579834, "global_step": 498349, "epoch": 2966} {"train_loss": -12.763798713684082, "global_step": 498350, "epoch": 2966} {"train_loss": -12.655267715454102, "global_step": 498351, "epoch": 2966} {"train_loss": -12.588774681091309, "global_step": 498352, "epoch": 2966} {"train_loss": -12.659119606018066, "global_step": 498353, "epoch": 2966} {"train_loss": -12.749361991882324, "global_step": 498354, "epoch": 2966} {"train_loss": -12.612174987792969, "global_step": 498355, "epoch": 2966} {"train_loss": -12.651803970336914, "global_step": 498356, "epoch": 2966} {"train_loss": -12.495418548583984, "global_step": 498357, "epoch": 2966} {"train_loss": -12.765867233276367, "global_step": 498358, "epoch": 2966} {"train_loss": -12.641404151916504, "global_step": 498359, "epoch": 2966} {"train_loss": -12.40791130065918, "global_step": 498360, "epoch": 2966} {"train_loss": -12.537147521972656, "global_step": 498361, "epoch": 2966} {"train_loss": -12.716450691223145, "global_step": 498362, "epoch": 2966} {"train_loss": -12.34217643737793, "global_step": 498363, "epoch": 2966} {"train_loss": -12.93630599975586, "global_step": 498364, "epoch": 2966} {"train_loss": -12.556448936462402, "global_step": 498365, "epoch": 2966} {"train_loss": -12.968201637268066, "global_step": 498366, "epoch": 2966} {"train_loss": -12.6480073928833, "global_step": 498367, "epoch": 2966} {"train_loss": -12.424325942993164, "global_step": 498368, "epoch": 2966} {"train_loss": -12.47061538696289, "global_step": 498369, "epoch": 2966} {"train_loss": -12.771318435668945, "global_step": 498370, "epoch": 2966} {"train_loss": -12.511014938354492, "global_step": 498371, "epoch": 2966} {"train_loss": -12.358219146728516, "global_step": 498372, "epoch": 2966} {"train_loss": -12.599276542663574, "global_step": 498373, "epoch": 2966} {"train_loss": -12.183600425720215, "global_step": 498374, "epoch": 2966} {"train_loss": -12.759206771850586, "global_step": 498375, "epoch": 2966} {"train_loss": -12.287446022033691, "global_step": 498376, "epoch": 2966} {"train_loss": -12.38630485534668, "global_step": 498377, "epoch": 2966} {"train_loss": -12.037272453308105, "global_step": 498378, "epoch": 2966} {"train_loss": -12.169685363769531, "global_step": 498379, "epoch": 2966} {"train_loss": -11.57906723022461, "global_step": 498380, "epoch": 2966} {"train_loss": -11.396669387817383, "global_step": 498381, "epoch": 2966} {"train_loss": -12.059739112854004, "global_step": 498382, "epoch": 2966} {"train_loss": -12.111385345458984, "global_step": 498383, "epoch": 2966} {"train_loss": -12.5446195602417, "global_step": 498384, "epoch": 2966} {"train_loss": -11.037485122680664, "global_step": 498385, "epoch": 2966} {"train_loss": -12.650094985961914, "global_step": 498386, "epoch": 2966} {"train_loss": -11.544940948486328, "global_step": 498387, "epoch": 2966} {"train_loss": -12.016971588134766, "global_step": 498388, "epoch": 2966} {"train_loss": -12.60025405883789, "global_step": 498389, "epoch": 2966} {"train_loss": -10.960428237915039, "global_step": 498390, "epoch": 2966} {"train_loss": -10.433624267578125, "global_step": 498391, "epoch": 2966} {"train_loss": -11.927801132202148, "global_step": 498392, "epoch": 2966} {"train_loss": -10.820106506347656, "global_step": 498393, "epoch": 2966} {"train_loss": -11.579950332641602, "global_step": 498394, "epoch": 2966} {"train_loss": -12.049039840698242, "global_step": 498395, "epoch": 2966} {"train_loss": -11.2572660446167, "global_step": 498396, "epoch": 2966} {"train_loss": -12.32669448852539, "global_step": 498397, "epoch": 2966} {"train_loss": -12.04241943359375, "global_step": 498398, "epoch": 2966} {"train_loss": -11.770061492919922, "global_step": 498399, "epoch": 2966} {"train_loss": -12.456415176391602, "global_step": 498400, "epoch": 2966} {"train_loss": -12.285479545593262, "global_step": 498401, "epoch": 2966} {"train_loss": -12.285099029541016, "global_step": 498402, "epoch": 2966} {"train_loss": -12.353830337524414, "global_step": 498403, "epoch": 2966} {"train_loss": -11.88504409790039, "global_step": 498404, "epoch": 2966} {"train_loss": -12.51522445678711, "global_step": 498405, "epoch": 2966} {"train_loss": -12.50885009765625, "global_step": 498406, "epoch": 2966} {"train_loss": -12.375999450683594, "global_step": 498407, "epoch": 2966} {"train_loss": -12.66680908203125, "global_step": 498408, "epoch": 2966} {"train_loss": -12.113502502441406, "global_step": 498409, "epoch": 2966} {"train_loss": -12.71788215637207, "global_step": 498410, "epoch": 2966} {"train_loss": -12.292064666748047, "global_step": 498411, "epoch": 2966} {"train_loss": -12.448333740234375, "global_step": 498412, "epoch": 2966} {"train_loss": -12.717714309692383, "global_step": 498413, "epoch": 2966} {"train_loss": -12.140308380126953, "global_step": 498414, "epoch": 2966} {"train_loss": -12.563688278198242, "global_step": 498415, "epoch": 2966} {"train_loss": -12.205427169799805, "global_step": 498416, "epoch": 2966} {"train_loss": -11.515726089477539, "global_step": 498417, "epoch": 2966} {"train_loss": -12.64036750793457, "global_step": 498418, "epoch": 2966} {"train_loss": -12.029073715209961, "global_step": 498419, "epoch": 2966} {"train_loss": -11.980653762817383, "global_step": 498420, "epoch": 2966} {"train_loss": -12.196712493896484, "global_step": 498421, "epoch": 2966} {"train_loss": -11.743753433227539, "global_step": 498422, "epoch": 2966} {"train_loss": -12.342869758605957, "global_step": 498423, "epoch": 2966} {"train_loss": -11.48179817199707, "global_step": 498424, "epoch": 2966} {"train_loss": -12.570062637329102, "global_step": 498425, "epoch": 2966} {"train_loss": -11.704977035522461, "global_step": 498426, "epoch": 2966} {"train_loss": -12.161142349243164, "global_step": 498427, "epoch": 2966} {"train_loss": -12.765195846557617, "global_step": 498428, "epoch": 2966} {"train_loss": -12.33798885345459, "global_step": 498429, "epoch": 2966} {"train_loss": -12.625921249389648, "global_step": 498430, "epoch": 2966} {"train_loss": -12.725470542907715, "global_step": 498431, "epoch": 2966} {"train_loss": -12.501775741577148, "global_step": 498432, "epoch": 2966} {"train_loss": -12.720132827758789, "global_step": 498433, "epoch": 2966} {"train_loss": -12.574545860290527, "global_step": 498434, "epoch": 2966} {"train_loss": -12.606690406799316, "global_step": 498435, "epoch": 2966} {"train_loss": -12.89022159576416, "global_step": 498436, "epoch": 2966} {"train_loss": -12.721482276916504, "global_step": 498437, "epoch": 2966} {"train_loss": -12.626077651977539, "global_step": 498438, "epoch": 2966} {"train_loss": -12.66219425201416, "global_step": 498439, "epoch": 2966} {"train_loss": -12.82597541809082, "global_step": 498440, "epoch": 2966} {"train_loss": -12.80640983581543, "global_step": 498441, "epoch": 2966} {"train_loss": -12.896989822387695, "global_step": 498442, "epoch": 2966} {"train_loss": -12.731630325317383, "global_step": 498443, "epoch": 2966} {"train_loss": -12.833978652954102, "global_step": 498444, "epoch": 2966} {"train_loss": -12.554676055908203, "global_step": 498445, "epoch": 2966} {"train_loss": -12.685441970825195, "global_step": 498446, "epoch": 2966} {"train_loss": -12.798619270324707, "global_step": 498447, "epoch": 2966} {"train_loss": -12.810547828674316, "global_step": 498448, "epoch": 2966} {"train_loss": -12.762699127197266, "global_step": 498449, "epoch": 2966} {"train_loss": -12.618249893188477, "global_step": 498450, "epoch": 2966} {"train_loss": -12.838631629943848, "global_step": 498451, "epoch": 2966} {"train_loss": -12.829002380371094, "global_step": 498452, "epoch": 2966} {"train_loss": -12.725531578063965, "global_step": 498453, "epoch": 2966} {"train_loss": -12.702777862548828, "global_step": 498454, "epoch": 2966} {"train_loss": -12.362214673133124, "global_step": 498455, "epoch": 2966, "val_loss": 321060.15625} {"train_loss": -12.733877182006836, "global_step": 498456, "epoch": 2967} {"train_loss": -12.678058624267578, "global_step": 498457, "epoch": 2967} {"train_loss": -13.021949768066406, "global_step": 498458, "epoch": 2967} {"train_loss": -12.51187515258789, "global_step": 498459, "epoch": 2967} {"train_loss": -12.637843132019043, "global_step": 498460, "epoch": 2967} {"train_loss": -12.787147521972656, "global_step": 498461, "epoch": 2967} {"train_loss": -12.865516662597656, "global_step": 498462, "epoch": 2967} {"train_loss": -12.5211181640625, "global_step": 498463, "epoch": 2967} {"train_loss": -12.452659606933594, "global_step": 498464, "epoch": 2967} {"train_loss": -12.605737686157227, "global_step": 498465, "epoch": 2967} {"train_loss": -12.341168403625488, "global_step": 498466, "epoch": 2967} {"train_loss": -12.598551750183105, "global_step": 498467, "epoch": 2967} {"train_loss": -11.563170433044434, "global_step": 498468, "epoch": 2967} {"train_loss": -12.973711013793945, "global_step": 498469, "epoch": 2967} {"train_loss": -11.422441482543945, "global_step": 498470, "epoch": 2967} {"train_loss": -12.348108291625977, "global_step": 498471, "epoch": 2967} {"train_loss": -12.576082229614258, "global_step": 498472, "epoch": 2967} {"train_loss": -12.460888862609863, "global_step": 498473, "epoch": 2967} {"train_loss": -12.380318641662598, "global_step": 498474, "epoch": 2967} {"train_loss": -12.318068504333496, "global_step": 498475, "epoch": 2967} {"train_loss": -12.150997161865234, "global_step": 498476, "epoch": 2967} {"train_loss": -12.621980667114258, "global_step": 498477, "epoch": 2967} {"train_loss": -11.918855667114258, "global_step": 498478, "epoch": 2967} {"train_loss": -12.657087326049805, "global_step": 498479, "epoch": 2967} {"train_loss": -12.708852767944336, "global_step": 498480, "epoch": 2967} {"train_loss": -12.280410766601562, "global_step": 498481, "epoch": 2967} {"train_loss": -12.503174781799316, "global_step": 498482, "epoch": 2967} {"train_loss": -12.626384735107422, "global_step": 498483, "epoch": 2967} {"train_loss": -12.416142463684082, "global_step": 498484, "epoch": 2967} {"train_loss": -12.705387115478516, "global_step": 498485, "epoch": 2967} {"train_loss": -12.741765975952148, "global_step": 498486, "epoch": 2967} {"train_loss": -12.599723815917969, "global_step": 498487, "epoch": 2967} {"train_loss": -12.55127239227295, "global_step": 498488, "epoch": 2967} {"train_loss": -12.124855041503906, "global_step": 498489, "epoch": 2967} {"train_loss": -12.8765869140625, "global_step": 498490, "epoch": 2967} {"train_loss": -11.760635375976562, "global_step": 498491, "epoch": 2967} {"train_loss": -12.848649978637695, "global_step": 498492, "epoch": 2967} {"train_loss": -12.396135330200195, "global_step": 498493, "epoch": 2967} {"train_loss": -12.212081909179688, "global_step": 498494, "epoch": 2967} {"train_loss": -12.1979341506958, "global_step": 498495, "epoch": 2967} {"train_loss": -12.703481674194336, "global_step": 498496, "epoch": 2967} {"train_loss": -12.835660934448242, "global_step": 498497, "epoch": 2967} {"train_loss": -12.786375045776367, "global_step": 498498, "epoch": 2967} {"train_loss": -12.49705696105957, "global_step": 498499, "epoch": 2967} {"train_loss": -12.683534622192383, "global_step": 498500, "epoch": 2967} {"train_loss": -12.503401756286621, "global_step": 498501, "epoch": 2967} {"train_loss": -12.915010452270508, "global_step": 498502, "epoch": 2967} {"train_loss": -12.559840202331543, "global_step": 498503, "epoch": 2967} {"train_loss": -11.964242935180664, "global_step": 498504, "epoch": 2967} {"train_loss": -12.16813850402832, "global_step": 498505, "epoch": 2967} {"train_loss": -12.843606948852539, "global_step": 498506, "epoch": 2967} {"train_loss": -12.378908157348633, "global_step": 498507, "epoch": 2967} {"train_loss": -12.01509952545166, "global_step": 498508, "epoch": 2967} {"train_loss": -12.9426851272583, "global_step": 498509, "epoch": 2967} {"train_loss": -12.811119079589844, "global_step": 498510, "epoch": 2967} {"train_loss": -12.837403297424316, "global_step": 498511, "epoch": 2967} {"train_loss": -12.992462158203125, "global_step": 498512, "epoch": 2967} {"train_loss": -12.938060760498047, "global_step": 498513, "epoch": 2967} {"train_loss": -12.817785263061523, "global_step": 498514, "epoch": 2967} {"train_loss": -12.658269882202148, "global_step": 498515, "epoch": 2967} {"train_loss": -13.181764602661133, "global_step": 498516, "epoch": 2967} {"train_loss": -12.862015724182129, "global_step": 498517, "epoch": 2967} {"train_loss": -12.433436393737793, "global_step": 498518, "epoch": 2967} {"train_loss": -12.597929000854492, "global_step": 498519, "epoch": 2967} {"train_loss": -12.796550750732422, "global_step": 498520, "epoch": 2967} {"train_loss": -12.154107093811035, "global_step": 498521, "epoch": 2967} {"train_loss": -12.27773666381836, "global_step": 498522, "epoch": 2967} {"train_loss": -12.451289176940918, "global_step": 498523, "epoch": 2967} {"train_loss": -12.202542304992676, "global_step": 498524, "epoch": 2967} {"train_loss": -12.82429313659668, "global_step": 498525, "epoch": 2967} {"train_loss": -12.3233642578125, "global_step": 498526, "epoch": 2967} {"train_loss": -12.787704467773438, "global_step": 498527, "epoch": 2967} {"train_loss": -12.460097312927246, "global_step": 498528, "epoch": 2967} {"train_loss": -12.780458450317383, "global_step": 498529, "epoch": 2967} {"train_loss": -12.688453674316406, "global_step": 498530, "epoch": 2967} {"train_loss": -12.694917678833008, "global_step": 498531, "epoch": 2967} {"train_loss": -12.434199333190918, "global_step": 498532, "epoch": 2967} {"train_loss": -12.798540115356445, "global_step": 498533, "epoch": 2967} {"train_loss": -12.98694896697998, "global_step": 498534, "epoch": 2967} {"train_loss": -12.688936233520508, "global_step": 498535, "epoch": 2967} {"train_loss": -12.908031463623047, "global_step": 498536, "epoch": 2967} {"train_loss": -12.843347549438477, "global_step": 498537, "epoch": 2967} {"train_loss": -12.870864868164062, "global_step": 498538, "epoch": 2967} {"train_loss": -12.624951362609863, "global_step": 498539, "epoch": 2967} {"train_loss": -12.98637866973877, "global_step": 498540, "epoch": 2967} {"train_loss": -12.590049743652344, "global_step": 498541, "epoch": 2967} {"train_loss": -12.707414627075195, "global_step": 498542, "epoch": 2967} {"train_loss": -12.595385551452637, "global_step": 498543, "epoch": 2967} {"train_loss": -12.691532135009766, "global_step": 498544, "epoch": 2967} {"train_loss": -12.486114501953125, "global_step": 498545, "epoch": 2967} {"train_loss": -12.837967872619629, "global_step": 498546, "epoch": 2967} {"train_loss": -12.585183143615723, "global_step": 498547, "epoch": 2967} {"train_loss": -12.794831275939941, "global_step": 498548, "epoch": 2967} {"train_loss": -12.884841918945312, "global_step": 498549, "epoch": 2967} {"train_loss": -12.798100471496582, "global_step": 498550, "epoch": 2967} {"train_loss": -12.69138240814209, "global_step": 498551, "epoch": 2967} {"train_loss": -12.708098411560059, "global_step": 498552, "epoch": 2967} {"train_loss": -12.758474349975586, "global_step": 498553, "epoch": 2967} {"train_loss": -12.144524574279785, "global_step": 498554, "epoch": 2967} {"train_loss": -12.106876373291016, "global_step": 498555, "epoch": 2967} {"train_loss": -12.794618606567383, "global_step": 498556, "epoch": 2967} {"train_loss": -12.461151123046875, "global_step": 498557, "epoch": 2967} {"train_loss": -12.553770065307617, "global_step": 498558, "epoch": 2967} {"train_loss": -12.051375389099121, "global_step": 498559, "epoch": 2967} {"train_loss": -12.506658554077148, "global_step": 498560, "epoch": 2967} {"train_loss": -12.151590347290039, "global_step": 498561, "epoch": 2967} {"train_loss": -12.61498737335205, "global_step": 498562, "epoch": 2967} {"train_loss": -12.54584789276123, "global_step": 498563, "epoch": 2967} {"train_loss": -12.624008178710938, "global_step": 498564, "epoch": 2967} {"train_loss": -12.286782264709473, "global_step": 498565, "epoch": 2967} {"train_loss": -12.32748031616211, "global_step": 498566, "epoch": 2967} {"train_loss": -11.579362869262695, "global_step": 498567, "epoch": 2967} {"train_loss": -12.560894012451172, "global_step": 498568, "epoch": 2967} {"train_loss": -12.043169021606445, "global_step": 498569, "epoch": 2967} {"train_loss": -11.985130310058594, "global_step": 498570, "epoch": 2967} {"train_loss": -12.285554885864258, "global_step": 498571, "epoch": 2967} {"train_loss": -12.392398834228516, "global_step": 498572, "epoch": 2967} {"train_loss": -12.04043960571289, "global_step": 498573, "epoch": 2967} {"train_loss": -12.488493919372559, "global_step": 498574, "epoch": 2967} {"train_loss": -12.392101287841797, "global_step": 498575, "epoch": 2967} {"train_loss": -12.063420295715332, "global_step": 498576, "epoch": 2967} {"train_loss": -12.304435729980469, "global_step": 498577, "epoch": 2967} {"train_loss": -12.146203994750977, "global_step": 498578, "epoch": 2967} {"train_loss": -10.847480773925781, "global_step": 498579, "epoch": 2967} {"train_loss": -11.346394538879395, "global_step": 498580, "epoch": 2967} {"train_loss": -12.038078308105469, "global_step": 498581, "epoch": 2967} {"train_loss": -9.896383285522461, "global_step": 498582, "epoch": 2967} {"train_loss": -11.871109008789062, "global_step": 498583, "epoch": 2967} {"train_loss": -10.821945190429688, "global_step": 498584, "epoch": 2967} {"train_loss": -10.713414192199707, "global_step": 498585, "epoch": 2967} {"train_loss": -11.34566879272461, "global_step": 498586, "epoch": 2967} {"train_loss": -11.285942077636719, "global_step": 498587, "epoch": 2967} {"train_loss": -10.849383354187012, "global_step": 498588, "epoch": 2967} {"train_loss": -10.91909408569336, "global_step": 498589, "epoch": 2967} {"train_loss": -11.358926773071289, "global_step": 498590, "epoch": 2967} {"train_loss": -10.716007232666016, "global_step": 498591, "epoch": 2967} {"train_loss": -11.95612907409668, "global_step": 498592, "epoch": 2967} {"train_loss": -10.810009956359863, "global_step": 498593, "epoch": 2967} {"train_loss": -11.053622245788574, "global_step": 498594, "epoch": 2967} {"train_loss": -11.32620620727539, "global_step": 498595, "epoch": 2967} {"train_loss": -9.886848449707031, "global_step": 498596, "epoch": 2967} {"train_loss": -9.240682601928711, "global_step": 498597, "epoch": 2967} {"train_loss": -8.42663860321045, "global_step": 498598, "epoch": 2967} {"train_loss": -9.07851505279541, "global_step": 498599, "epoch": 2967} {"train_loss": -9.453699111938477, "global_step": 498600, "epoch": 2967} {"train_loss": -10.283204078674316, "global_step": 498601, "epoch": 2967} {"train_loss": -10.217430114746094, "global_step": 498602, "epoch": 2967} {"train_loss": -9.104085922241211, "global_step": 498603, "epoch": 2967} {"train_loss": -10.969072341918945, "global_step": 498604, "epoch": 2967} {"train_loss": -8.228878021240234, "global_step": 498605, "epoch": 2967} {"train_loss": -10.37138843536377, "global_step": 498606, "epoch": 2967} {"train_loss": -9.145059585571289, "global_step": 498607, "epoch": 2967} {"train_loss": -10.627737045288086, "global_step": 498608, "epoch": 2967} {"train_loss": -8.689148902893066, "global_step": 498609, "epoch": 2967} {"train_loss": -10.030891418457031, "global_step": 498610, "epoch": 2967} {"train_loss": -11.405647277832031, "global_step": 498611, "epoch": 2967} {"train_loss": -9.932992935180664, "global_step": 498612, "epoch": 2967} {"train_loss": -11.219645500183105, "global_step": 498613, "epoch": 2967} {"train_loss": -10.845775604248047, "global_step": 498614, "epoch": 2967} {"train_loss": -10.568263053894043, "global_step": 498615, "epoch": 2967} {"train_loss": -11.096288681030273, "global_step": 498616, "epoch": 2967} {"train_loss": -10.20628833770752, "global_step": 498617, "epoch": 2967} {"train_loss": -10.812797546386719, "global_step": 498618, "epoch": 2967} {"train_loss": -10.797096252441406, "global_step": 498619, "epoch": 2967} {"train_loss": -11.222391128540039, "global_step": 498620, "epoch": 2967} {"train_loss": -10.43780517578125, "global_step": 498621, "epoch": 2967} {"train_loss": -11.683923721313477, "global_step": 498622, "epoch": 2967} {"train_loss": -11.990161021550497, "global_step": 498623, "epoch": 2967, "val_loss": 309380.15625} {"train_loss": -12.055791854858398, "global_step": 498624, "epoch": 2968} {"train_loss": -10.959029197692871, "global_step": 498625, "epoch": 2968} {"train_loss": -11.167976379394531, "global_step": 498626, "epoch": 2968} {"train_loss": -10.977495193481445, "global_step": 498627, "epoch": 2968} {"train_loss": -11.63868236541748, "global_step": 498628, "epoch": 2968} {"train_loss": -10.995997428894043, "global_step": 498629, "epoch": 2968} {"train_loss": -11.664278984069824, "global_step": 498630, "epoch": 2968} {"train_loss": -11.50007438659668, "global_step": 498631, "epoch": 2968} {"train_loss": -11.77254867553711, "global_step": 498632, "epoch": 2968} {"train_loss": -11.651387214660645, "global_step": 498633, "epoch": 2968} {"train_loss": -11.366424560546875, "global_step": 498634, "epoch": 2968} {"train_loss": -11.725919723510742, "global_step": 498635, "epoch": 2968} {"train_loss": -11.406787872314453, "global_step": 498636, "epoch": 2968} {"train_loss": -11.667747497558594, "global_step": 498637, "epoch": 2968} {"train_loss": -11.81471061706543, "global_step": 498638, "epoch": 2968} {"train_loss": -11.679737091064453, "global_step": 498639, "epoch": 2968} {"train_loss": -12.199935913085938, "global_step": 498640, "epoch": 2968} {"train_loss": -11.804481506347656, "global_step": 498641, "epoch": 2968} {"train_loss": -11.889100074768066, "global_step": 498642, "epoch": 2968} {"train_loss": -12.292201042175293, "global_step": 498643, "epoch": 2968} {"train_loss": -11.703021049499512, "global_step": 498644, "epoch": 2968} {"train_loss": -12.305956840515137, "global_step": 498645, "epoch": 2968} {"train_loss": -12.024809837341309, "global_step": 498646, "epoch": 2968} {"train_loss": -12.334721565246582, "global_step": 498647, "epoch": 2968} {"train_loss": -12.35842514038086, "global_step": 498648, "epoch": 2968} {"train_loss": -12.364095687866211, "global_step": 498649, "epoch": 2968} {"train_loss": -12.116259574890137, "global_step": 498650, "epoch": 2968} {"train_loss": -12.434724807739258, "global_step": 498651, "epoch": 2968} {"train_loss": -12.172321319580078, "global_step": 498652, "epoch": 2968} {"train_loss": -12.455289840698242, "global_step": 498653, "epoch": 2968} {"train_loss": -12.401650428771973, "global_step": 498654, "epoch": 2968} {"train_loss": -12.055225372314453, "global_step": 498655, "epoch": 2968} {"train_loss": -12.356718063354492, "global_step": 498656, "epoch": 2968} {"train_loss": -12.395248413085938, "global_step": 498657, "epoch": 2968} {"train_loss": -12.468408584594727, "global_step": 498658, "epoch": 2968} {"train_loss": -12.55421257019043, "global_step": 498659, "epoch": 2968} {"train_loss": -12.406492233276367, "global_step": 498660, "epoch": 2968} {"train_loss": -12.361268043518066, "global_step": 498661, "epoch": 2968} {"train_loss": -12.369623184204102, "global_step": 498662, "epoch": 2968} {"train_loss": -12.272790908813477, "global_step": 498663, "epoch": 2968} {"train_loss": -12.365280151367188, "global_step": 498664, "epoch": 2968} {"train_loss": -12.702197074890137, "global_step": 498665, "epoch": 2968} {"train_loss": -12.431622505187988, "global_step": 498666, "epoch": 2968} {"train_loss": -12.726825714111328, "global_step": 498667, "epoch": 2968} {"train_loss": -12.527070045471191, "global_step": 498668, "epoch": 2968} {"train_loss": -12.634451866149902, "global_step": 498669, "epoch": 2968} {"train_loss": -12.603460311889648, "global_step": 498670, "epoch": 2968} {"train_loss": -12.542609214782715, "global_step": 498671, "epoch": 2968} {"train_loss": -12.561328887939453, "global_step": 498672, "epoch": 2968} {"train_loss": -12.46835994720459, "global_step": 498673, "epoch": 2968} {"train_loss": -12.524733543395996, "global_step": 498674, "epoch": 2968} {"train_loss": -12.614782333374023, "global_step": 498675, "epoch": 2968} {"train_loss": -12.620576858520508, "global_step": 498676, "epoch": 2968} {"train_loss": -12.724056243896484, "global_step": 498677, "epoch": 2968} {"train_loss": -12.560201644897461, "global_step": 498678, "epoch": 2968} {"train_loss": -12.559688568115234, "global_step": 498679, "epoch": 2968} {"train_loss": -12.823530197143555, "global_step": 498680, "epoch": 2968} {"train_loss": -12.648053169250488, "global_step": 498681, "epoch": 2968} {"train_loss": -12.83237361907959, "global_step": 498682, "epoch": 2968} {"train_loss": -12.547186851501465, "global_step": 498683, "epoch": 2968} {"train_loss": -12.464558601379395, "global_step": 498684, "epoch": 2968} {"train_loss": -12.569796562194824, "global_step": 498685, "epoch": 2968} {"train_loss": -12.937101364135742, "global_step": 498686, "epoch": 2968} {"train_loss": -12.75965690612793, "global_step": 498687, "epoch": 2968} {"train_loss": -12.679075241088867, "global_step": 498688, "epoch": 2968} {"train_loss": -12.620877265930176, "global_step": 498689, "epoch": 2968} {"train_loss": -12.75783634185791, "global_step": 498690, "epoch": 2968} {"train_loss": -12.621711730957031, "global_step": 498691, "epoch": 2968} {"train_loss": -12.491999626159668, "global_step": 498692, "epoch": 2968} {"train_loss": -12.710658073425293, "global_step": 498693, "epoch": 2968} {"train_loss": -12.717235565185547, "global_step": 498694, "epoch": 2968} {"train_loss": -12.801725387573242, "global_step": 498695, "epoch": 2968} {"train_loss": -12.91501235961914, "global_step": 498696, "epoch": 2968} {"train_loss": -12.511996269226074, "global_step": 498697, "epoch": 2968} {"train_loss": -12.891508102416992, "global_step": 498698, "epoch": 2968} {"train_loss": -12.907401084899902, "global_step": 498699, "epoch": 2968} {"train_loss": -13.047335624694824, "global_step": 498700, "epoch": 2968} {"train_loss": -12.569250106811523, "global_step": 498701, "epoch": 2968} {"train_loss": -12.77760124206543, "global_step": 498702, "epoch": 2968} {"train_loss": -12.983663558959961, "global_step": 498703, "epoch": 2968} {"train_loss": -12.791463851928711, "global_step": 498704, "epoch": 2968} {"train_loss": -12.675348281860352, "global_step": 498705, "epoch": 2968} {"train_loss": -12.870741844177246, "global_step": 498706, "epoch": 2968} {"train_loss": -12.845459938049316, "global_step": 498707, "epoch": 2968} {"train_loss": -12.713831901550293, "global_step": 498708, "epoch": 2968} {"train_loss": -12.991689682006836, "global_step": 498709, "epoch": 2968} {"train_loss": -13.021074295043945, "global_step": 498710, "epoch": 2968} {"train_loss": -12.870599746704102, "global_step": 498711, "epoch": 2968} {"train_loss": -12.784055709838867, "global_step": 498712, "epoch": 2968} {"train_loss": -12.796432495117188, "global_step": 498713, "epoch": 2968} {"train_loss": -13.055609703063965, "global_step": 498714, "epoch": 2968} {"train_loss": -12.846990585327148, "global_step": 498715, "epoch": 2968} {"train_loss": -12.910457611083984, "global_step": 498716, "epoch": 2968} {"train_loss": -12.742925643920898, "global_step": 498717, "epoch": 2968} {"train_loss": -12.87831974029541, "global_step": 498718, "epoch": 2968} {"train_loss": -12.726164817810059, "global_step": 498719, "epoch": 2968} {"train_loss": -12.830806732177734, "global_step": 498720, "epoch": 2968} {"train_loss": -12.822738647460938, "global_step": 498721, "epoch": 2968} {"train_loss": -12.972038269042969, "global_step": 498722, "epoch": 2968} {"train_loss": -12.56715202331543, "global_step": 498723, "epoch": 2968} {"train_loss": -12.976238250732422, "global_step": 498724, "epoch": 2968} {"train_loss": -12.835779190063477, "global_step": 498725, "epoch": 2968} {"train_loss": -12.680213928222656, "global_step": 498726, "epoch": 2968} {"train_loss": -12.383272171020508, "global_step": 498727, "epoch": 2968} {"train_loss": -12.673582077026367, "global_step": 498728, "epoch": 2968} {"train_loss": -12.922117233276367, "global_step": 498729, "epoch": 2968} {"train_loss": -12.887192726135254, "global_step": 498730, "epoch": 2968} {"train_loss": -12.546804428100586, "global_step": 498731, "epoch": 2968} {"train_loss": -12.869766235351562, "global_step": 498732, "epoch": 2968} {"train_loss": -12.826939582824707, "global_step": 498733, "epoch": 2968} {"train_loss": -12.2445068359375, "global_step": 498734, "epoch": 2968} {"train_loss": -12.584165573120117, "global_step": 498735, "epoch": 2968} {"train_loss": -12.745121002197266, "global_step": 498736, "epoch": 2968} {"train_loss": -12.595057487487793, "global_step": 498737, "epoch": 2968} {"train_loss": -12.670164108276367, "global_step": 498738, "epoch": 2968} {"train_loss": -12.758321762084961, "global_step": 498739, "epoch": 2968} {"train_loss": -12.795421600341797, "global_step": 498740, "epoch": 2968} {"train_loss": -12.980656623840332, "global_step": 498741, "epoch": 2968} {"train_loss": -12.818410873413086, "global_step": 498742, "epoch": 2968} {"train_loss": -12.799222946166992, "global_step": 498743, "epoch": 2968} {"train_loss": -12.865213394165039, "global_step": 498744, "epoch": 2968} {"train_loss": -12.657866477966309, "global_step": 498745, "epoch": 2968} {"train_loss": -12.788915634155273, "global_step": 498746, "epoch": 2968} {"train_loss": -12.64134407043457, "global_step": 498747, "epoch": 2968} {"train_loss": -12.581551551818848, "global_step": 498748, "epoch": 2968} {"train_loss": -12.960455894470215, "global_step": 498749, "epoch": 2968} {"train_loss": -12.725532531738281, "global_step": 498750, "epoch": 2968} {"train_loss": -12.50416374206543, "global_step": 498751, "epoch": 2968} {"train_loss": -12.708900451660156, "global_step": 498752, "epoch": 2968} {"train_loss": -12.205419540405273, "global_step": 498753, "epoch": 2968} {"train_loss": -11.98581600189209, "global_step": 498754, "epoch": 2968} {"train_loss": -12.544282913208008, "global_step": 498755, "epoch": 2968} {"train_loss": -11.218709945678711, "global_step": 498756, "epoch": 2968} {"train_loss": -10.435546875, "global_step": 498757, "epoch": 2968} {"train_loss": -11.465344429016113, "global_step": 498758, "epoch": 2968} {"train_loss": -12.07142448425293, "global_step": 498759, "epoch": 2968} {"train_loss": -11.240422248840332, "global_step": 498760, "epoch": 2968} {"train_loss": -12.529607772827148, "global_step": 498761, "epoch": 2968} {"train_loss": -11.458168029785156, "global_step": 498762, "epoch": 2968} {"train_loss": -10.124483108520508, "global_step": 498763, "epoch": 2968} {"train_loss": -11.779760360717773, "global_step": 498764, "epoch": 2968} {"train_loss": -11.643280982971191, "global_step": 498765, "epoch": 2968} {"train_loss": -10.633843421936035, "global_step": 498766, "epoch": 2968} {"train_loss": -12.229496002197266, "global_step": 498767, "epoch": 2968} {"train_loss": -10.21777057647705, "global_step": 498768, "epoch": 2968} {"train_loss": -11.068262100219727, "global_step": 498769, "epoch": 2968} {"train_loss": -11.478402137756348, "global_step": 498770, "epoch": 2968} {"train_loss": -11.37879753112793, "global_step": 498771, "epoch": 2968} {"train_loss": -12.306070327758789, "global_step": 498772, "epoch": 2968} {"train_loss": -11.835931777954102, "global_step": 498773, "epoch": 2968} {"train_loss": -11.518089294433594, "global_step": 498774, "epoch": 2968} {"train_loss": -11.813023567199707, "global_step": 498775, "epoch": 2968} {"train_loss": -10.67293930053711, "global_step": 498776, "epoch": 2968} {"train_loss": -11.751422882080078, "global_step": 498777, "epoch": 2968} {"train_loss": -11.170080184936523, "global_step": 498778, "epoch": 2968} {"train_loss": -10.475634574890137, "global_step": 498779, "epoch": 2968} {"train_loss": -11.548605918884277, "global_step": 498780, "epoch": 2968} {"train_loss": -10.265052795410156, "global_step": 498781, "epoch": 2968} {"train_loss": -10.183313369750977, "global_step": 498782, "epoch": 2968} {"train_loss": -11.189596176147461, "global_step": 498783, "epoch": 2968} {"train_loss": -9.991483688354492, "global_step": 498784, "epoch": 2968} {"train_loss": -10.464995384216309, "global_step": 498785, "epoch": 2968} {"train_loss": -9.678014755249023, "global_step": 498786, "epoch": 2968} {"train_loss": -10.588767051696777, "global_step": 498787, "epoch": 2968} {"train_loss": -11.159008979797363, "global_step": 498788, "epoch": 2968} {"train_loss": -9.636903762817383, "global_step": 498789, "epoch": 2968} {"train_loss": -10.828022003173828, "global_step": 498790, "epoch": 2968} {"train_loss": -12.177971397127424, "global_step": 498791, "epoch": 2968, "val_loss": 316345.53125} {"train_loss": -11.253561019897461, "global_step": 498792, "epoch": 2969} {"train_loss": -11.37985610961914, "global_step": 498793, "epoch": 2969} {"train_loss": -10.676372528076172, "global_step": 498794, "epoch": 2969} {"train_loss": -10.879476547241211, "global_step": 498795, "epoch": 2969} {"train_loss": -11.071405410766602, "global_step": 498796, "epoch": 2969} {"train_loss": -10.835677146911621, "global_step": 498797, "epoch": 2969} {"train_loss": -10.729986190795898, "global_step": 498798, "epoch": 2969} {"train_loss": -10.61259651184082, "global_step": 498799, "epoch": 2969} {"train_loss": -10.04551887512207, "global_step": 498800, "epoch": 2969} {"train_loss": -10.39122200012207, "global_step": 498801, "epoch": 2969} {"train_loss": -11.081991195678711, "global_step": 498802, "epoch": 2969} {"train_loss": -11.559603691101074, "global_step": 498803, "epoch": 2969} {"train_loss": -11.279579162597656, "global_step": 498804, "epoch": 2969} {"train_loss": -11.216318130493164, "global_step": 498805, "epoch": 2969} {"train_loss": -11.330720901489258, "global_step": 498806, "epoch": 2969} {"train_loss": -11.425220489501953, "global_step": 498807, "epoch": 2969} {"train_loss": -11.437169075012207, "global_step": 498808, "epoch": 2969} {"train_loss": -11.569254875183105, "global_step": 498809, "epoch": 2969} {"train_loss": -11.42664909362793, "global_step": 498810, "epoch": 2969} {"train_loss": -12.348907470703125, "global_step": 498811, "epoch": 2969} {"train_loss": -10.877171516418457, "global_step": 498812, "epoch": 2969} {"train_loss": -12.169316291809082, "global_step": 498813, "epoch": 2969} {"train_loss": -11.352751731872559, "global_step": 498814, "epoch": 2969} {"train_loss": -12.434646606445312, "global_step": 498815, "epoch": 2969} {"train_loss": -11.851243019104004, "global_step": 498816, "epoch": 2969} {"train_loss": -11.948761940002441, "global_step": 498817, "epoch": 2969} {"train_loss": -11.787921905517578, "global_step": 498818, "epoch": 2969} {"train_loss": -12.010313034057617, "global_step": 498819, "epoch": 2969} {"train_loss": -11.822166442871094, "global_step": 498820, "epoch": 2969} {"train_loss": -11.942811965942383, "global_step": 498821, "epoch": 2969} {"train_loss": -11.699801445007324, "global_step": 498822, "epoch": 2969} {"train_loss": -12.28946304321289, "global_step": 498823, "epoch": 2969} {"train_loss": -11.875764846801758, "global_step": 498824, "epoch": 2969} {"train_loss": -12.434638023376465, "global_step": 498825, "epoch": 2969} {"train_loss": -11.883264541625977, "global_step": 498826, "epoch": 2969} {"train_loss": -12.285865783691406, "global_step": 498827, "epoch": 2969} {"train_loss": -12.072986602783203, "global_step": 498828, "epoch": 2969} {"train_loss": -12.433868408203125, "global_step": 498829, "epoch": 2969} {"train_loss": -12.346240997314453, "global_step": 498830, "epoch": 2969} {"train_loss": -12.287687301635742, "global_step": 498831, "epoch": 2969} {"train_loss": -12.291828155517578, "global_step": 498832, "epoch": 2969} {"train_loss": -12.374780654907227, "global_step": 498833, "epoch": 2969} {"train_loss": -12.099550247192383, "global_step": 498834, "epoch": 2969} {"train_loss": -12.336084365844727, "global_step": 498835, "epoch": 2969} {"train_loss": -12.524412155151367, "global_step": 498836, "epoch": 2969} {"train_loss": -12.509721755981445, "global_step": 498837, "epoch": 2969} {"train_loss": -12.35670280456543, "global_step": 498838, "epoch": 2969} {"train_loss": -12.603887557983398, "global_step": 498839, "epoch": 2969} {"train_loss": -12.395537376403809, "global_step": 498840, "epoch": 2969} {"train_loss": -12.589780807495117, "global_step": 498841, "epoch": 2969} {"train_loss": -12.283308982849121, "global_step": 498842, "epoch": 2969} {"train_loss": -12.445411682128906, "global_step": 498843, "epoch": 2969} {"train_loss": -12.4207124710083, "global_step": 498844, "epoch": 2969} {"train_loss": -12.712343215942383, "global_step": 498845, "epoch": 2969} {"train_loss": -12.284311294555664, "global_step": 498846, "epoch": 2969} {"train_loss": -12.723051071166992, "global_step": 498847, "epoch": 2969} {"train_loss": -12.292333602905273, "global_step": 498848, "epoch": 2969} {"train_loss": -12.42822265625, "global_step": 498849, "epoch": 2969} {"train_loss": -12.286861419677734, "global_step": 498850, "epoch": 2969} {"train_loss": -12.762950897216797, "global_step": 498851, "epoch": 2969} {"train_loss": -12.250152587890625, "global_step": 498852, "epoch": 2969} {"train_loss": -12.462565422058105, "global_step": 498853, "epoch": 2969} {"train_loss": -12.280782699584961, "global_step": 498854, "epoch": 2969} {"train_loss": -12.463412284851074, "global_step": 498855, "epoch": 2969} {"train_loss": -12.349701881408691, "global_step": 498856, "epoch": 2969} {"train_loss": -12.47482681274414, "global_step": 498857, "epoch": 2969} {"train_loss": -12.725573539733887, "global_step": 498858, "epoch": 2969} {"train_loss": -12.401594161987305, "global_step": 498859, "epoch": 2969} {"train_loss": -12.523666381835938, "global_step": 498860, "epoch": 2969} {"train_loss": -12.283098220825195, "global_step": 498861, "epoch": 2969} {"train_loss": -12.375861167907715, "global_step": 498862, "epoch": 2969} {"train_loss": -12.339007377624512, "global_step": 498863, "epoch": 2969} {"train_loss": -12.477513313293457, "global_step": 498864, "epoch": 2969} {"train_loss": -12.585232734680176, "global_step": 498865, "epoch": 2969} {"train_loss": -12.094613075256348, "global_step": 498866, "epoch": 2969} {"train_loss": -12.435090065002441, "global_step": 498867, "epoch": 2969} {"train_loss": -12.338211059570312, "global_step": 498868, "epoch": 2969} {"train_loss": -11.524560928344727, "global_step": 498869, "epoch": 2969} {"train_loss": -12.604623794555664, "global_step": 498870, "epoch": 2969} {"train_loss": -11.727031707763672, "global_step": 498871, "epoch": 2969} {"train_loss": -12.597196578979492, "global_step": 498872, "epoch": 2969} {"train_loss": -12.078409194946289, "global_step": 498873, "epoch": 2969} {"train_loss": -12.4962797164917, "global_step": 498874, "epoch": 2969} {"train_loss": -12.404592514038086, "global_step": 498875, "epoch": 2969} {"train_loss": -12.48855209350586, "global_step": 498876, "epoch": 2969} {"train_loss": -12.766396522521973, "global_step": 498877, "epoch": 2969} {"train_loss": -12.387121200561523, "global_step": 498878, "epoch": 2969} {"train_loss": -12.694947242736816, "global_step": 498879, "epoch": 2969} {"train_loss": -12.663534164428711, "global_step": 498880, "epoch": 2969} {"train_loss": -12.802816390991211, "global_step": 498881, "epoch": 2969} {"train_loss": -12.603765487670898, "global_step": 498882, "epoch": 2969} {"train_loss": -12.475748062133789, "global_step": 498883, "epoch": 2969} {"train_loss": -12.559497833251953, "global_step": 498884, "epoch": 2969} {"train_loss": -12.54530143737793, "global_step": 498885, "epoch": 2969} {"train_loss": -12.764917373657227, "global_step": 498886, "epoch": 2969} {"train_loss": -12.404099464416504, "global_step": 498887, "epoch": 2969} {"train_loss": -12.71772575378418, "global_step": 498888, "epoch": 2969} {"train_loss": -12.695207595825195, "global_step": 498889, "epoch": 2969} {"train_loss": -12.947685241699219, "global_step": 498890, "epoch": 2969} {"train_loss": -12.812800407409668, "global_step": 498891, "epoch": 2969} {"train_loss": -12.71769905090332, "global_step": 498892, "epoch": 2969} {"train_loss": -12.914751052856445, "global_step": 498893, "epoch": 2969} {"train_loss": -12.44336986541748, "global_step": 498894, "epoch": 2969} {"train_loss": -12.946626663208008, "global_step": 498895, "epoch": 2969} {"train_loss": -12.750186920166016, "global_step": 498896, "epoch": 2969} {"train_loss": -12.928243637084961, "global_step": 498897, "epoch": 2969} {"train_loss": -12.633833885192871, "global_step": 498898, "epoch": 2969} {"train_loss": -12.782793998718262, "global_step": 498899, "epoch": 2969} {"train_loss": -12.989389419555664, "global_step": 498900, "epoch": 2969} {"train_loss": -12.730228424072266, "global_step": 498901, "epoch": 2969} {"train_loss": -12.88814926147461, "global_step": 498902, "epoch": 2969} {"train_loss": -12.689905166625977, "global_step": 498903, "epoch": 2969} {"train_loss": -12.805900573730469, "global_step": 498904, "epoch": 2969} {"train_loss": -12.633869171142578, "global_step": 498905, "epoch": 2969} {"train_loss": -12.724355697631836, "global_step": 498906, "epoch": 2969} {"train_loss": -12.944947242736816, "global_step": 498907, "epoch": 2969} {"train_loss": -12.925403594970703, "global_step": 498908, "epoch": 2969} {"train_loss": -12.79648208618164, "global_step": 498909, "epoch": 2969} {"train_loss": -12.8743257522583, "global_step": 498910, "epoch": 2969} {"train_loss": -12.863762855529785, "global_step": 498911, "epoch": 2969} {"train_loss": -12.937370300292969, "global_step": 498912, "epoch": 2969} {"train_loss": -12.94505500793457, "global_step": 498913, "epoch": 2969} {"train_loss": -12.682367324829102, "global_step": 498914, "epoch": 2969} {"train_loss": -12.786412239074707, "global_step": 498915, "epoch": 2969} {"train_loss": -12.938546180725098, "global_step": 498916, "epoch": 2969} {"train_loss": -12.727259635925293, "global_step": 498917, "epoch": 2969} {"train_loss": -12.692696571350098, "global_step": 498918, "epoch": 2969} {"train_loss": -12.467018127441406, "global_step": 498919, "epoch": 2969} {"train_loss": -12.566611289978027, "global_step": 498920, "epoch": 2969} {"train_loss": -12.713570594787598, "global_step": 498921, "epoch": 2969} {"train_loss": -12.450540542602539, "global_step": 498922, "epoch": 2969} {"train_loss": -12.906600952148438, "global_step": 498923, "epoch": 2969} {"train_loss": -12.575681686401367, "global_step": 498924, "epoch": 2969} {"train_loss": -12.434274673461914, "global_step": 498925, "epoch": 2969} {"train_loss": -12.89061450958252, "global_step": 498926, "epoch": 2969} {"train_loss": -12.244521141052246, "global_step": 498927, "epoch": 2969} {"train_loss": -12.204176902770996, "global_step": 498928, "epoch": 2969} {"train_loss": -12.696601867675781, "global_step": 498929, "epoch": 2969} {"train_loss": -12.331965446472168, "global_step": 498930, "epoch": 2969} {"train_loss": -12.265134811401367, "global_step": 498931, "epoch": 2969} {"train_loss": -12.517641067504883, "global_step": 498932, "epoch": 2969} {"train_loss": -11.2731351852417, "global_step": 498933, "epoch": 2969} {"train_loss": -12.613763809204102, "global_step": 498934, "epoch": 2969} {"train_loss": -11.795726776123047, "global_step": 498935, "epoch": 2969} {"train_loss": -11.391618728637695, "global_step": 498936, "epoch": 2969} {"train_loss": -12.65031909942627, "global_step": 498937, "epoch": 2969} {"train_loss": -11.63947868347168, "global_step": 498938, "epoch": 2969} {"train_loss": -11.893539428710938, "global_step": 498939, "epoch": 2969} {"train_loss": -12.281452178955078, "global_step": 498940, "epoch": 2969} {"train_loss": -11.720283508300781, "global_step": 498941, "epoch": 2969} {"train_loss": -11.035346984863281, "global_step": 498942, "epoch": 2969} {"train_loss": -12.442840576171875, "global_step": 498943, "epoch": 2969} {"train_loss": -11.450952529907227, "global_step": 498944, "epoch": 2969} {"train_loss": -11.32424545288086, "global_step": 498945, "epoch": 2969} {"train_loss": -11.338634490966797, "global_step": 498946, "epoch": 2969} {"train_loss": -10.7696533203125, "global_step": 498947, "epoch": 2969} {"train_loss": -12.576303482055664, "global_step": 498948, "epoch": 2969} {"train_loss": -11.48440933227539, "global_step": 498949, "epoch": 2969} {"train_loss": -12.013252258300781, "global_step": 498950, "epoch": 2969} {"train_loss": -12.285177230834961, "global_step": 498951, "epoch": 2969} {"train_loss": -12.119111061096191, "global_step": 498952, "epoch": 2969} {"train_loss": -12.662837982177734, "global_step": 498953, "epoch": 2969} {"train_loss": -11.78711223602295, "global_step": 498954, "epoch": 2969} {"train_loss": -12.411294937133789, "global_step": 498955, "epoch": 2969} {"train_loss": -12.313156127929688, "global_step": 498956, "epoch": 2969} {"train_loss": -12.306295394897461, "global_step": 498957, "epoch": 2969} {"train_loss": -11.858053207397461, "global_step": 498958, "epoch": 2969} {"train_loss": -12.218650454566593, "global_step": 498959, "epoch": 2969, "val_loss": 320905.59375} {"train_loss": -11.987712860107422, "global_step": 498960, "epoch": 2970} {"train_loss": -12.679162979125977, "global_step": 498961, "epoch": 2970} {"train_loss": -12.208807945251465, "global_step": 498962, "epoch": 2970} {"train_loss": -12.722020149230957, "global_step": 498963, "epoch": 2970} {"train_loss": -12.752737998962402, "global_step": 498964, "epoch": 2970} {"train_loss": -12.385844230651855, "global_step": 498965, "epoch": 2970} {"train_loss": -12.832175254821777, "global_step": 498966, "epoch": 2970} {"train_loss": -12.538911819458008, "global_step": 498967, "epoch": 2970} {"train_loss": -12.811508178710938, "global_step": 498968, "epoch": 2970} {"train_loss": -12.284042358398438, "global_step": 498969, "epoch": 2970} {"train_loss": -12.721949577331543, "global_step": 498970, "epoch": 2970} {"train_loss": -12.446109771728516, "global_step": 498971, "epoch": 2970} {"train_loss": -12.356515884399414, "global_step": 498972, "epoch": 2970} {"train_loss": -12.5765962600708, "global_step": 498973, "epoch": 2970} {"train_loss": -12.514195442199707, "global_step": 498974, "epoch": 2970} {"train_loss": -12.232056617736816, "global_step": 498975, "epoch": 2970} {"train_loss": -12.660552978515625, "global_step": 498976, "epoch": 2970} {"train_loss": -12.126302719116211, "global_step": 498977, "epoch": 2970} {"train_loss": -12.241598129272461, "global_step": 498978, "epoch": 2970} {"train_loss": -11.845793724060059, "global_step": 498979, "epoch": 2970} {"train_loss": -11.995906829833984, "global_step": 498980, "epoch": 2970} {"train_loss": -11.611651420593262, "global_step": 498981, "epoch": 2970} {"train_loss": -10.31389045715332, "global_step": 498982, "epoch": 2970} {"train_loss": -12.354533195495605, "global_step": 498983, "epoch": 2970} {"train_loss": -9.815701484680176, "global_step": 498984, "epoch": 2970} {"train_loss": -10.248769760131836, "global_step": 498985, "epoch": 2970} {"train_loss": -11.313220977783203, "global_step": 498986, "epoch": 2970} {"train_loss": -11.282357215881348, "global_step": 498987, "epoch": 2970} {"train_loss": -10.726225852966309, "global_step": 498988, "epoch": 2970} {"train_loss": -12.015708923339844, "global_step": 498989, "epoch": 2970} {"train_loss": -10.580121994018555, "global_step": 498990, "epoch": 2970} {"train_loss": -12.124285697937012, "global_step": 498991, "epoch": 2970} {"train_loss": -11.085221290588379, "global_step": 498992, "epoch": 2970} {"train_loss": -10.811031341552734, "global_step": 498993, "epoch": 2970} {"train_loss": -11.486425399780273, "global_step": 498994, "epoch": 2970} {"train_loss": -10.398053169250488, "global_step": 498995, "epoch": 2970} {"train_loss": -12.12048053741455, "global_step": 498996, "epoch": 2970} {"train_loss": -11.07017707824707, "global_step": 498997, "epoch": 2970} {"train_loss": -11.224603652954102, "global_step": 498998, "epoch": 2970} {"train_loss": -12.166902542114258, "global_step": 498999, "epoch": 2970} {"train_loss": -11.873387336730957, "global_step": 499000, "epoch": 2970} {"train_loss": -12.09572696685791, "global_step": 499001, "epoch": 2970} {"train_loss": -11.691946029663086, "global_step": 499002, "epoch": 2970} {"train_loss": -11.920997619628906, "global_step": 499003, "epoch": 2970} {"train_loss": -12.377013206481934, "global_step": 499004, "epoch": 2970} {"train_loss": -12.029233932495117, "global_step": 499005, "epoch": 2970} {"train_loss": -12.530112266540527, "global_step": 499006, "epoch": 2970} {"train_loss": -12.489198684692383, "global_step": 499007, "epoch": 2970} {"train_loss": -11.913269996643066, "global_step": 499008, "epoch": 2970} {"train_loss": -12.584386825561523, "global_step": 499009, "epoch": 2970} {"train_loss": -11.422513961791992, "global_step": 499010, "epoch": 2970} {"train_loss": -12.310884475708008, "global_step": 499011, "epoch": 2970} {"train_loss": -11.936726570129395, "global_step": 499012, "epoch": 2970} {"train_loss": -11.878545761108398, "global_step": 499013, "epoch": 2970} {"train_loss": -12.238018035888672, "global_step": 499014, "epoch": 2970} {"train_loss": -11.709653854370117, "global_step": 499015, "epoch": 2970} {"train_loss": -12.325401306152344, "global_step": 499016, "epoch": 2970} {"train_loss": -12.55771541595459, "global_step": 499017, "epoch": 2970} {"train_loss": -11.82512378692627, "global_step": 499018, "epoch": 2970} {"train_loss": -12.285511016845703, "global_step": 499019, "epoch": 2970} {"train_loss": -11.821808815002441, "global_step": 499020, "epoch": 2970} {"train_loss": -11.69620132446289, "global_step": 499021, "epoch": 2970} {"train_loss": -12.388641357421875, "global_step": 499022, "epoch": 2970} {"train_loss": -12.20025634765625, "global_step": 499023, "epoch": 2970} {"train_loss": -12.303614616394043, "global_step": 499024, "epoch": 2970} {"train_loss": -12.05217170715332, "global_step": 499025, "epoch": 2970} {"train_loss": -12.470807075500488, "global_step": 499026, "epoch": 2970} {"train_loss": -12.2512845993042, "global_step": 499027, "epoch": 2970} {"train_loss": -12.673187255859375, "global_step": 499028, "epoch": 2970} {"train_loss": -12.523117065429688, "global_step": 499029, "epoch": 2970} {"train_loss": -12.696123123168945, "global_step": 499030, "epoch": 2970} {"train_loss": -12.682291984558105, "global_step": 499031, "epoch": 2970} {"train_loss": -12.687923431396484, "global_step": 499032, "epoch": 2970} {"train_loss": -12.715461730957031, "global_step": 499033, "epoch": 2970} {"train_loss": -12.50480842590332, "global_step": 499034, "epoch": 2970} {"train_loss": -12.740642547607422, "global_step": 499035, "epoch": 2970} {"train_loss": -12.732653617858887, "global_step": 499036, "epoch": 2970} {"train_loss": -12.343114852905273, "global_step": 499037, "epoch": 2970} {"train_loss": -12.485879898071289, "global_step": 499038, "epoch": 2970} {"train_loss": -12.564891815185547, "global_step": 499039, "epoch": 2970} {"train_loss": -12.627386093139648, "global_step": 499040, "epoch": 2970} {"train_loss": -12.601907730102539, "global_step": 499041, "epoch": 2970} {"train_loss": -12.428847312927246, "global_step": 499042, "epoch": 2970} {"train_loss": -12.470462799072266, "global_step": 499043, "epoch": 2970} {"train_loss": -12.242823600769043, "global_step": 499044, "epoch": 2970} {"train_loss": -12.566417694091797, "global_step": 499045, "epoch": 2970} {"train_loss": -12.606024742126465, "global_step": 499046, "epoch": 2970} {"train_loss": -12.648200035095215, "global_step": 499047, "epoch": 2970} {"train_loss": -12.669499397277832, "global_step": 499048, "epoch": 2970} {"train_loss": -12.744945526123047, "global_step": 499049, "epoch": 2970} {"train_loss": -12.476104736328125, "global_step": 499050, "epoch": 2970} {"train_loss": -12.525715827941895, "global_step": 499051, "epoch": 2970} {"train_loss": -12.388578414916992, "global_step": 499052, "epoch": 2970} {"train_loss": -12.788650512695312, "global_step": 499053, "epoch": 2970} {"train_loss": -12.65078353881836, "global_step": 499054, "epoch": 2970} {"train_loss": -11.99138069152832, "global_step": 499055, "epoch": 2970} {"train_loss": -12.686054229736328, "global_step": 499056, "epoch": 2970} {"train_loss": -12.362829208374023, "global_step": 499057, "epoch": 2970} {"train_loss": -11.861021041870117, "global_step": 499058, "epoch": 2970} {"train_loss": -12.618939399719238, "global_step": 499059, "epoch": 2970} {"train_loss": -12.3861083984375, "global_step": 499060, "epoch": 2970} {"train_loss": -12.278450965881348, "global_step": 499061, "epoch": 2970} {"train_loss": -12.343120574951172, "global_step": 499062, "epoch": 2970} {"train_loss": -12.043180465698242, "global_step": 499063, "epoch": 2970} {"train_loss": -12.022394180297852, "global_step": 499064, "epoch": 2970} {"train_loss": -12.15294361114502, "global_step": 499065, "epoch": 2970} {"train_loss": -11.88465690612793, "global_step": 499066, "epoch": 2970} {"train_loss": -12.17414665222168, "global_step": 499067, "epoch": 2970} {"train_loss": -12.343908309936523, "global_step": 499068, "epoch": 2970} {"train_loss": -11.629343032836914, "global_step": 499069, "epoch": 2970} {"train_loss": -12.283756256103516, "global_step": 499070, "epoch": 2970} {"train_loss": -11.964583396911621, "global_step": 499071, "epoch": 2970} {"train_loss": -12.554388046264648, "global_step": 499072, "epoch": 2970} {"train_loss": -12.307479858398438, "global_step": 499073, "epoch": 2970} {"train_loss": -12.35878849029541, "global_step": 499074, "epoch": 2970} {"train_loss": -12.57318115234375, "global_step": 499075, "epoch": 2970} {"train_loss": -12.05363655090332, "global_step": 499076, "epoch": 2970} {"train_loss": -12.706835746765137, "global_step": 499077, "epoch": 2970} {"train_loss": -12.593443870544434, "global_step": 499078, "epoch": 2970} {"train_loss": -12.647611618041992, "global_step": 499079, "epoch": 2970} {"train_loss": -12.45176887512207, "global_step": 499080, "epoch": 2970} {"train_loss": -12.69040584564209, "global_step": 499081, "epoch": 2970} {"train_loss": -12.671706199645996, "global_step": 499082, "epoch": 2970} {"train_loss": -12.675729751586914, "global_step": 499083, "epoch": 2970} {"train_loss": -12.582313537597656, "global_step": 499084, "epoch": 2970} {"train_loss": -12.740354537963867, "global_step": 499085, "epoch": 2970} {"train_loss": -12.806880950927734, "global_step": 499086, "epoch": 2970} {"train_loss": -12.185192108154297, "global_step": 499087, "epoch": 2970} {"train_loss": -12.928503036499023, "global_step": 499088, "epoch": 2970} {"train_loss": -12.725597381591797, "global_step": 499089, "epoch": 2970} {"train_loss": -12.648543357849121, "global_step": 499090, "epoch": 2970} {"train_loss": -12.485485076904297, "global_step": 499091, "epoch": 2970} {"train_loss": -12.853373527526855, "global_step": 499092, "epoch": 2970} {"train_loss": -12.600793838500977, "global_step": 499093, "epoch": 2970} {"train_loss": -12.814558982849121, "global_step": 499094, "epoch": 2970} {"train_loss": -12.583017349243164, "global_step": 499095, "epoch": 2970} {"train_loss": -12.464012145996094, "global_step": 499096, "epoch": 2970} {"train_loss": -12.668432235717773, "global_step": 499097, "epoch": 2970} {"train_loss": -12.722860336303711, "global_step": 499098, "epoch": 2970} {"train_loss": -12.441240310668945, "global_step": 499099, "epoch": 2970} {"train_loss": -12.545236587524414, "global_step": 499100, "epoch": 2970} {"train_loss": -11.737909317016602, "global_step": 499101, "epoch": 2970} {"train_loss": -12.763790130615234, "global_step": 499102, "epoch": 2970} {"train_loss": -12.706476211547852, "global_step": 499103, "epoch": 2970} {"train_loss": -12.85523796081543, "global_step": 499104, "epoch": 2970} {"train_loss": -11.822964668273926, "global_step": 499105, "epoch": 2970} {"train_loss": -12.681819915771484, "global_step": 499106, "epoch": 2970} {"train_loss": -11.94679069519043, "global_step": 499107, "epoch": 2970} {"train_loss": -13.030607223510742, "global_step": 499108, "epoch": 2970} {"train_loss": -11.85218620300293, "global_step": 499109, "epoch": 2970} {"train_loss": -13.022750854492188, "global_step": 499110, "epoch": 2970} {"train_loss": -11.766412734985352, "global_step": 499111, "epoch": 2970} {"train_loss": -12.114389419555664, "global_step": 499112, "epoch": 2970} {"train_loss": -11.668569564819336, "global_step": 499113, "epoch": 2970} {"train_loss": -11.894851684570312, "global_step": 499114, "epoch": 2970} {"train_loss": -11.775304794311523, "global_step": 499115, "epoch": 2970} {"train_loss": -11.021514892578125, "global_step": 499116, "epoch": 2970} {"train_loss": -12.289977073669434, "global_step": 499117, "epoch": 2970} {"train_loss": -11.359986305236816, "global_step": 499118, "epoch": 2970} {"train_loss": -12.37089729309082, "global_step": 499119, "epoch": 2970} {"train_loss": -11.841100692749023, "global_step": 499120, "epoch": 2970} {"train_loss": -12.31666374206543, "global_step": 499121, "epoch": 2970} {"train_loss": -12.336277961730957, "global_step": 499122, "epoch": 2970} {"train_loss": -12.064878463745117, "global_step": 499123, "epoch": 2970} {"train_loss": -12.061502456665039, "global_step": 499124, "epoch": 2970} {"train_loss": -12.823419570922852, "global_step": 499125, "epoch": 2970} {"train_loss": -11.736898422241211, "global_step": 499126, "epoch": 2970} {"train_loss": -12.22130028406779, "global_step": 499127, "epoch": 2970, "val_loss": 318975.28125, "train_action_mse_error": 1.6906300783157349} {"train_loss": -11.792407989501953, "global_step": 499128, "epoch": 2971} {"train_loss": -12.18747329711914, "global_step": 499129, "epoch": 2971} {"train_loss": -12.882220268249512, "global_step": 499130, "epoch": 2971} {"train_loss": -12.084177017211914, "global_step": 499131, "epoch": 2971} {"train_loss": -12.379444122314453, "global_step": 499132, "epoch": 2971} {"train_loss": -12.826696395874023, "global_step": 499133, "epoch": 2971} {"train_loss": -12.343780517578125, "global_step": 499134, "epoch": 2971} {"train_loss": -12.73225212097168, "global_step": 499135, "epoch": 2971} {"train_loss": -12.565191268920898, "global_step": 499136, "epoch": 2971} {"train_loss": -12.463790893554688, "global_step": 499137, "epoch": 2971} {"train_loss": -12.630624771118164, "global_step": 499138, "epoch": 2971} {"train_loss": -12.12514877319336, "global_step": 499139, "epoch": 2971} {"train_loss": -12.537100791931152, "global_step": 499140, "epoch": 2971} {"train_loss": -11.620182037353516, "global_step": 499141, "epoch": 2971} {"train_loss": -12.216377258300781, "global_step": 499142, "epoch": 2971} {"train_loss": -11.580928802490234, "global_step": 499143, "epoch": 2971} {"train_loss": -11.599010467529297, "global_step": 499144, "epoch": 2971} {"train_loss": -11.590486526489258, "global_step": 499145, "epoch": 2971} {"train_loss": -11.314373016357422, "global_step": 499146, "epoch": 2971} {"train_loss": -11.964125633239746, "global_step": 499147, "epoch": 2971} {"train_loss": -12.015497207641602, "global_step": 499148, "epoch": 2971} {"train_loss": -12.02920150756836, "global_step": 499149, "epoch": 2971} {"train_loss": -12.113859176635742, "global_step": 499150, "epoch": 2971} {"train_loss": -11.320578575134277, "global_step": 499151, "epoch": 2971} {"train_loss": -11.993171691894531, "global_step": 499152, "epoch": 2971} {"train_loss": -11.722187042236328, "global_step": 499153, "epoch": 2971} {"train_loss": -12.170258522033691, "global_step": 499154, "epoch": 2971} {"train_loss": -11.540689468383789, "global_step": 499155, "epoch": 2971} {"train_loss": -12.692628860473633, "global_step": 499156, "epoch": 2971} {"train_loss": -11.864315032958984, "global_step": 499157, "epoch": 2971} {"train_loss": -12.601299285888672, "global_step": 499158, "epoch": 2971} {"train_loss": -12.476457595825195, "global_step": 499159, "epoch": 2971} {"train_loss": -12.342384338378906, "global_step": 499160, "epoch": 2971} {"train_loss": -12.80617904663086, "global_step": 499161, "epoch": 2971} {"train_loss": -12.34416675567627, "global_step": 499162, "epoch": 2971} {"train_loss": -12.76193618774414, "global_step": 499163, "epoch": 2971} {"train_loss": -12.615278244018555, "global_step": 499164, "epoch": 2971} {"train_loss": -12.311290740966797, "global_step": 499165, "epoch": 2971} {"train_loss": -12.69723892211914, "global_step": 499166, "epoch": 2971} {"train_loss": -12.559784889221191, "global_step": 499167, "epoch": 2971} {"train_loss": -12.93852424621582, "global_step": 499168, "epoch": 2971} {"train_loss": -12.712860107421875, "global_step": 499169, "epoch": 2971} {"train_loss": -12.557340621948242, "global_step": 499170, "epoch": 2971} {"train_loss": -12.686575889587402, "global_step": 499171, "epoch": 2971} {"train_loss": -12.509044647216797, "global_step": 499172, "epoch": 2971} {"train_loss": -12.43971061706543, "global_step": 499173, "epoch": 2971} {"train_loss": -12.585325241088867, "global_step": 499174, "epoch": 2971} {"train_loss": -12.631958961486816, "global_step": 499175, "epoch": 2971} {"train_loss": -12.224386215209961, "global_step": 499176, "epoch": 2971} {"train_loss": -12.734630584716797, "global_step": 499177, "epoch": 2971} {"train_loss": -12.439910888671875, "global_step": 499178, "epoch": 2971} {"train_loss": -12.409357070922852, "global_step": 499179, "epoch": 2971} {"train_loss": -12.365694046020508, "global_step": 499180, "epoch": 2971} {"train_loss": -12.53626537322998, "global_step": 499181, "epoch": 2971} {"train_loss": -12.163618087768555, "global_step": 499182, "epoch": 2971} {"train_loss": -12.656181335449219, "global_step": 499183, "epoch": 2971} {"train_loss": -12.477005004882812, "global_step": 499184, "epoch": 2971} {"train_loss": -12.423784255981445, "global_step": 499185, "epoch": 2971} {"train_loss": -12.396254539489746, "global_step": 499186, "epoch": 2971} {"train_loss": -12.659784317016602, "global_step": 499187, "epoch": 2971} {"train_loss": -12.740768432617188, "global_step": 499188, "epoch": 2971} {"train_loss": -12.66819953918457, "global_step": 499189, "epoch": 2971} {"train_loss": -12.749101638793945, "global_step": 499190, "epoch": 2971} {"train_loss": -12.487161636352539, "global_step": 499191, "epoch": 2971} {"train_loss": -12.851991653442383, "global_step": 499192, "epoch": 2971} {"train_loss": -12.763587951660156, "global_step": 499193, "epoch": 2971} {"train_loss": -12.808354377746582, "global_step": 499194, "epoch": 2971} {"train_loss": -12.742673873901367, "global_step": 499195, "epoch": 2971} {"train_loss": -12.57550048828125, "global_step": 499196, "epoch": 2971} {"train_loss": -12.770111083984375, "global_step": 499197, "epoch": 2971} {"train_loss": -12.667572021484375, "global_step": 499198, "epoch": 2971} {"train_loss": -13.05006217956543, "global_step": 499199, "epoch": 2971} {"train_loss": -12.875983238220215, "global_step": 499200, "epoch": 2971} {"train_loss": -12.808300018310547, "global_step": 499201, "epoch": 2971} {"train_loss": -12.731956481933594, "global_step": 499202, "epoch": 2971} {"train_loss": -12.98577880859375, "global_step": 499203, "epoch": 2971} {"train_loss": -13.147848129272461, "global_step": 499204, "epoch": 2971} {"train_loss": -13.105640411376953, "global_step": 499205, "epoch": 2971} {"train_loss": -12.810346603393555, "global_step": 499206, "epoch": 2971} {"train_loss": -13.046613693237305, "global_step": 499207, "epoch": 2971} {"train_loss": -12.984325408935547, "global_step": 499208, "epoch": 2971} {"train_loss": -12.859634399414062, "global_step": 499209, "epoch": 2971} {"train_loss": -12.675994873046875, "global_step": 499210, "epoch": 2971} {"train_loss": -13.092527389526367, "global_step": 499211, "epoch": 2971} {"train_loss": -12.873678207397461, "global_step": 499212, "epoch": 2971} {"train_loss": -12.982559204101562, "global_step": 499213, "epoch": 2971} {"train_loss": -12.906024932861328, "global_step": 499214, "epoch": 2971} {"train_loss": -12.927562713623047, "global_step": 499215, "epoch": 2971} {"train_loss": -13.08602523803711, "global_step": 499216, "epoch": 2971} {"train_loss": -12.963417053222656, "global_step": 499217, "epoch": 2971} {"train_loss": -12.35055160522461, "global_step": 499218, "epoch": 2971} {"train_loss": -13.128891944885254, "global_step": 499219, "epoch": 2971} {"train_loss": -12.851816177368164, "global_step": 499220, "epoch": 2971} {"train_loss": -12.833074569702148, "global_step": 499221, "epoch": 2971} {"train_loss": -12.706661224365234, "global_step": 499222, "epoch": 2971} {"train_loss": -12.727907180786133, "global_step": 499223, "epoch": 2971} {"train_loss": -12.812374114990234, "global_step": 499224, "epoch": 2971} {"train_loss": -12.075478553771973, "global_step": 499225, "epoch": 2971} {"train_loss": -12.300432205200195, "global_step": 499226, "epoch": 2971} {"train_loss": -11.928915023803711, "global_step": 499227, "epoch": 2971} {"train_loss": -12.136190414428711, "global_step": 499228, "epoch": 2971} {"train_loss": -12.036149978637695, "global_step": 499229, "epoch": 2971} {"train_loss": -12.866524696350098, "global_step": 499230, "epoch": 2971} {"train_loss": -12.699915885925293, "global_step": 499231, "epoch": 2971} {"train_loss": -11.860177993774414, "global_step": 499232, "epoch": 2971} {"train_loss": -12.776605606079102, "global_step": 499233, "epoch": 2971} {"train_loss": -12.323898315429688, "global_step": 499234, "epoch": 2971} {"train_loss": -12.305481910705566, "global_step": 499235, "epoch": 2971} {"train_loss": -12.300241470336914, "global_step": 499236, "epoch": 2971} {"train_loss": -12.43221378326416, "global_step": 499237, "epoch": 2971} {"train_loss": -12.258281707763672, "global_step": 499238, "epoch": 2971} {"train_loss": -13.050535202026367, "global_step": 499239, "epoch": 2971} {"train_loss": -12.575628280639648, "global_step": 499240, "epoch": 2971} {"train_loss": -12.195098876953125, "global_step": 499241, "epoch": 2971} {"train_loss": -12.360299110412598, "global_step": 499242, "epoch": 2971} {"train_loss": -13.137344360351562, "global_step": 499243, "epoch": 2971} {"train_loss": -12.043939590454102, "global_step": 499244, "epoch": 2971} {"train_loss": -12.378923416137695, "global_step": 499245, "epoch": 2971} {"train_loss": -12.759783744812012, "global_step": 499246, "epoch": 2971} {"train_loss": -12.541013717651367, "global_step": 499247, "epoch": 2971} {"train_loss": -12.68664836883545, "global_step": 499248, "epoch": 2971} {"train_loss": -12.890336990356445, "global_step": 499249, "epoch": 2971} {"train_loss": -13.01111125946045, "global_step": 499250, "epoch": 2971} {"train_loss": -12.799079895019531, "global_step": 499251, "epoch": 2971} {"train_loss": -12.671640396118164, "global_step": 499252, "epoch": 2971} {"train_loss": -12.824152946472168, "global_step": 499253, "epoch": 2971} {"train_loss": -12.59410285949707, "global_step": 499254, "epoch": 2971} {"train_loss": -12.888834953308105, "global_step": 499255, "epoch": 2971} {"train_loss": -12.887163162231445, "global_step": 499256, "epoch": 2971} {"train_loss": -12.332066535949707, "global_step": 499257, "epoch": 2971} {"train_loss": -12.893040657043457, "global_step": 499258, "epoch": 2971} {"train_loss": -12.885823249816895, "global_step": 499259, "epoch": 2971} {"train_loss": -12.831695556640625, "global_step": 499260, "epoch": 2971} {"train_loss": -12.869364738464355, "global_step": 499261, "epoch": 2971} {"train_loss": -13.06203842163086, "global_step": 499262, "epoch": 2971} {"train_loss": -13.009353637695312, "global_step": 499263, "epoch": 2971} {"train_loss": -12.780620574951172, "global_step": 499264, "epoch": 2971} {"train_loss": -13.00076961517334, "global_step": 499265, "epoch": 2971} {"train_loss": -12.884023666381836, "global_step": 499266, "epoch": 2971} {"train_loss": -12.982294082641602, "global_step": 499267, "epoch": 2971} {"train_loss": -12.9638671875, "global_step": 499268, "epoch": 2971} {"train_loss": -12.903678894042969, "global_step": 499269, "epoch": 2971} {"train_loss": -12.85603141784668, "global_step": 499270, "epoch": 2971} {"train_loss": -13.259439468383789, "global_step": 499271, "epoch": 2971} {"train_loss": -12.865959167480469, "global_step": 499272, "epoch": 2971} {"train_loss": -12.511505126953125, "global_step": 499273, "epoch": 2971} {"train_loss": -12.826022148132324, "global_step": 499274, "epoch": 2971} {"train_loss": -12.740638732910156, "global_step": 499275, "epoch": 2971} {"train_loss": -12.264514923095703, "global_step": 499276, "epoch": 2971} {"train_loss": -12.603903770446777, "global_step": 499277, "epoch": 2971} {"train_loss": -12.33577823638916, "global_step": 499278, "epoch": 2971} {"train_loss": -12.096811294555664, "global_step": 499279, "epoch": 2971} {"train_loss": -12.104990005493164, "global_step": 499280, "epoch": 2971} {"train_loss": -11.950844764709473, "global_step": 499281, "epoch": 2971} {"train_loss": -9.294944763183594, "global_step": 499282, "epoch": 2971} {"train_loss": -11.257805824279785, "global_step": 499283, "epoch": 2971} {"train_loss": -9.666568756103516, "global_step": 499284, "epoch": 2971} {"train_loss": -8.357967376708984, "global_step": 499285, "epoch": 2971} {"train_loss": -9.749385833740234, "global_step": 499286, "epoch": 2971} {"train_loss": -8.162398338317871, "global_step": 499287, "epoch": 2971} {"train_loss": -9.118844985961914, "global_step": 499288, "epoch": 2971} {"train_loss": -10.12830924987793, "global_step": 499289, "epoch": 2971} {"train_loss": -8.733299255371094, "global_step": 499290, "epoch": 2971} {"train_loss": -10.32786750793457, "global_step": 499291, "epoch": 2971} {"train_loss": -9.996959686279297, "global_step": 499292, "epoch": 2971} {"train_loss": -10.056604385375977, "global_step": 499293, "epoch": 2971} {"train_loss": -9.346933364868164, "global_step": 499294, "epoch": 2971} {"train_loss": -12.303693419411069, "global_step": 499295, "epoch": 2971, "val_loss": 316123.1875} {"train_loss": -9.889352798461914, "global_step": 499296, "epoch": 2972} {"train_loss": -10.206663131713867, "global_step": 499297, "epoch": 2972} {"train_loss": -8.342317581176758, "global_step": 499298, "epoch": 2972} {"train_loss": -9.574752807617188, "global_step": 499299, "epoch": 2972} {"train_loss": -9.536705017089844, "global_step": 499300, "epoch": 2972} {"train_loss": -8.0787353515625, "global_step": 499301, "epoch": 2972} {"train_loss": -7.755806922912598, "global_step": 499302, "epoch": 2972} {"train_loss": -8.034966468811035, "global_step": 499303, "epoch": 2972} {"train_loss": -5.968280792236328, "global_step": 499304, "epoch": 2972} {"train_loss": -7.917630195617676, "global_step": 499305, "epoch": 2972} {"train_loss": -6.996932029724121, "global_step": 499306, "epoch": 2972} {"train_loss": -6.804576873779297, "global_step": 499307, "epoch": 2972} {"train_loss": -7.251784324645996, "global_step": 499308, "epoch": 2972} {"train_loss": -8.814443588256836, "global_step": 499309, "epoch": 2972} {"train_loss": -7.7506279945373535, "global_step": 499310, "epoch": 2972} {"train_loss": -7.059688568115234, "global_step": 499311, "epoch": 2972} {"train_loss": -9.001458168029785, "global_step": 499312, "epoch": 2972} {"train_loss": -7.764373779296875, "global_step": 499313, "epoch": 2972} {"train_loss": -8.756341934204102, "global_step": 499314, "epoch": 2972} {"train_loss": -8.66379165649414, "global_step": 499315, "epoch": 2972} {"train_loss": -8.4410400390625, "global_step": 499316, "epoch": 2972} {"train_loss": -8.618894577026367, "global_step": 499317, "epoch": 2972} {"train_loss": -10.091821670532227, "global_step": 499318, "epoch": 2972} {"train_loss": -9.24393081665039, "global_step": 499319, "epoch": 2972} {"train_loss": -9.487701416015625, "global_step": 499320, "epoch": 2972} {"train_loss": -10.258220672607422, "global_step": 499321, "epoch": 2972} {"train_loss": -10.244993209838867, "global_step": 499322, "epoch": 2972} {"train_loss": -11.349993705749512, "global_step": 499323, "epoch": 2972} {"train_loss": -10.052034378051758, "global_step": 499324, "epoch": 2972} {"train_loss": -10.649261474609375, "global_step": 499325, "epoch": 2972} {"train_loss": -10.976058959960938, "global_step": 499326, "epoch": 2972} {"train_loss": -10.565681457519531, "global_step": 499327, "epoch": 2972} {"train_loss": -10.807564735412598, "global_step": 499328, "epoch": 2972} {"train_loss": -10.6874361038208, "global_step": 499329, "epoch": 2972} {"train_loss": -11.760541915893555, "global_step": 499330, "epoch": 2972} {"train_loss": -11.338199615478516, "global_step": 499331, "epoch": 2972} {"train_loss": -12.089441299438477, "global_step": 499332, "epoch": 2972} {"train_loss": -11.114356994628906, "global_step": 499333, "epoch": 2972} {"train_loss": -12.096630096435547, "global_step": 499334, "epoch": 2972} {"train_loss": -11.421317100524902, "global_step": 499335, "epoch": 2972} {"train_loss": -11.671661376953125, "global_step": 499336, "epoch": 2972} {"train_loss": -11.785600662231445, "global_step": 499337, "epoch": 2972} {"train_loss": -11.671586990356445, "global_step": 499338, "epoch": 2972} {"train_loss": -11.953269958496094, "global_step": 499339, "epoch": 2972} {"train_loss": -11.971887588500977, "global_step": 499340, "epoch": 2972} {"train_loss": -12.1964750289917, "global_step": 499341, "epoch": 2972} {"train_loss": -12.275609016418457, "global_step": 499342, "epoch": 2972} {"train_loss": -12.22498893737793, "global_step": 499343, "epoch": 2972} {"train_loss": -11.915685653686523, "global_step": 499344, "epoch": 2972} {"train_loss": -11.963333129882812, "global_step": 499345, "epoch": 2972} {"train_loss": -12.22877025604248, "global_step": 499346, "epoch": 2972} {"train_loss": -12.17312240600586, "global_step": 499347, "epoch": 2972} {"train_loss": -12.283187866210938, "global_step": 499348, "epoch": 2972} {"train_loss": -12.094335556030273, "global_step": 499349, "epoch": 2972} {"train_loss": -12.363118171691895, "global_step": 499350, "epoch": 2972} {"train_loss": -12.251049041748047, "global_step": 499351, "epoch": 2972} {"train_loss": -12.371994972229004, "global_step": 499352, "epoch": 2972} {"train_loss": -12.212653160095215, "global_step": 499353, "epoch": 2972} {"train_loss": -12.22619342803955, "global_step": 499354, "epoch": 2972} {"train_loss": -12.301807403564453, "global_step": 499355, "epoch": 2972} {"train_loss": -12.413599014282227, "global_step": 499356, "epoch": 2972} {"train_loss": -12.347064971923828, "global_step": 499357, "epoch": 2972} {"train_loss": -12.422727584838867, "global_step": 499358, "epoch": 2972} {"train_loss": -12.283559799194336, "global_step": 499359, "epoch": 2972} {"train_loss": -12.28579330444336, "global_step": 499360, "epoch": 2972} {"train_loss": -12.592161178588867, "global_step": 499361, "epoch": 2972} {"train_loss": -12.3073091506958, "global_step": 499362, "epoch": 2972} {"train_loss": -12.60020637512207, "global_step": 499363, "epoch": 2972} {"train_loss": -12.482190132141113, "global_step": 499364, "epoch": 2972} {"train_loss": -12.570384979248047, "global_step": 499365, "epoch": 2972} {"train_loss": -12.558511734008789, "global_step": 499366, "epoch": 2972} {"train_loss": -12.432581901550293, "global_step": 499367, "epoch": 2972} {"train_loss": -12.555383682250977, "global_step": 499368, "epoch": 2972} {"train_loss": -12.473780632019043, "global_step": 499369, "epoch": 2972} {"train_loss": -12.54369831085205, "global_step": 499370, "epoch": 2972} {"train_loss": -12.723554611206055, "global_step": 499371, "epoch": 2972} {"train_loss": -12.7161865234375, "global_step": 499372, "epoch": 2972} {"train_loss": -12.428421020507812, "global_step": 499373, "epoch": 2972} {"train_loss": -12.705907821655273, "global_step": 499374, "epoch": 2972} {"train_loss": -12.469703674316406, "global_step": 499375, "epoch": 2972} {"train_loss": -12.713703155517578, "global_step": 499376, "epoch": 2972} {"train_loss": -12.597559928894043, "global_step": 499377, "epoch": 2972} {"train_loss": -12.790936470031738, "global_step": 499378, "epoch": 2972} {"train_loss": -12.720172882080078, "global_step": 499379, "epoch": 2972} {"train_loss": -12.809957504272461, "global_step": 499380, "epoch": 2972} {"train_loss": -12.60874080657959, "global_step": 499381, "epoch": 2972} {"train_loss": -12.603038787841797, "global_step": 499382, "epoch": 2972} {"train_loss": -12.622842788696289, "global_step": 499383, "epoch": 2972} {"train_loss": -12.780914306640625, "global_step": 499384, "epoch": 2972} {"train_loss": -12.630826950073242, "global_step": 499385, "epoch": 2972} {"train_loss": -12.817023277282715, "global_step": 499386, "epoch": 2972} {"train_loss": -12.622621536254883, "global_step": 499387, "epoch": 2972} {"train_loss": -12.67867660522461, "global_step": 499388, "epoch": 2972} {"train_loss": -12.756531715393066, "global_step": 499389, "epoch": 2972} {"train_loss": -12.62285327911377, "global_step": 499390, "epoch": 2972} {"train_loss": -12.745525360107422, "global_step": 499391, "epoch": 2972} {"train_loss": -12.672525405883789, "global_step": 499392, "epoch": 2972} {"train_loss": -12.732948303222656, "global_step": 499393, "epoch": 2972} {"train_loss": -12.930266380310059, "global_step": 499394, "epoch": 2972} {"train_loss": -12.811441421508789, "global_step": 499395, "epoch": 2972} {"train_loss": -12.744245529174805, "global_step": 499396, "epoch": 2972} {"train_loss": -12.911338806152344, "global_step": 499397, "epoch": 2972} {"train_loss": -12.76122760772705, "global_step": 499398, "epoch": 2972} {"train_loss": -12.826976776123047, "global_step": 499399, "epoch": 2972} {"train_loss": -12.79019832611084, "global_step": 499400, "epoch": 2972} {"train_loss": -12.876991271972656, "global_step": 499401, "epoch": 2972} {"train_loss": -12.740124702453613, "global_step": 499402, "epoch": 2972} {"train_loss": -12.787459373474121, "global_step": 499403, "epoch": 2972} {"train_loss": -12.909189224243164, "global_step": 499404, "epoch": 2972} {"train_loss": -12.855666160583496, "global_step": 499405, "epoch": 2972} {"train_loss": -12.659574508666992, "global_step": 499406, "epoch": 2972} {"train_loss": -12.860062599182129, "global_step": 499407, "epoch": 2972} {"train_loss": -12.736647605895996, "global_step": 499408, "epoch": 2972} {"train_loss": -12.708078384399414, "global_step": 499409, "epoch": 2972} {"train_loss": -12.910324096679688, "global_step": 499410, "epoch": 2972} {"train_loss": -12.967155456542969, "global_step": 499411, "epoch": 2972} {"train_loss": -12.975825309753418, "global_step": 499412, "epoch": 2972} {"train_loss": -12.86902904510498, "global_step": 499413, "epoch": 2972} {"train_loss": -12.927820205688477, "global_step": 499414, "epoch": 2972} {"train_loss": -12.896241188049316, "global_step": 499415, "epoch": 2972} {"train_loss": -12.76987075805664, "global_step": 499416, "epoch": 2972} {"train_loss": -13.007953643798828, "global_step": 499417, "epoch": 2972} {"train_loss": -13.013790130615234, "global_step": 499418, "epoch": 2972} {"train_loss": -12.869699478149414, "global_step": 499419, "epoch": 2972} {"train_loss": -12.924745559692383, "global_step": 499420, "epoch": 2972} {"train_loss": -12.903346061706543, "global_step": 499421, "epoch": 2972} {"train_loss": -12.993598937988281, "global_step": 499422, "epoch": 2972} {"train_loss": -12.755975723266602, "global_step": 499423, "epoch": 2972} {"train_loss": -12.631694793701172, "global_step": 499424, "epoch": 2972} {"train_loss": -12.689218521118164, "global_step": 499425, "epoch": 2972} {"train_loss": -12.8200101852417, "global_step": 499426, "epoch": 2972} {"train_loss": -12.937041282653809, "global_step": 499427, "epoch": 2972} {"train_loss": -12.60423469543457, "global_step": 499428, "epoch": 2972} {"train_loss": -12.93450927734375, "global_step": 499429, "epoch": 2972} {"train_loss": -12.538505554199219, "global_step": 499430, "epoch": 2972} {"train_loss": -12.805191993713379, "global_step": 499431, "epoch": 2972} {"train_loss": -12.574654579162598, "global_step": 499432, "epoch": 2972} {"train_loss": -13.230246543884277, "global_step": 499433, "epoch": 2972} {"train_loss": -12.9832763671875, "global_step": 499434, "epoch": 2972} {"train_loss": -13.005411148071289, "global_step": 499435, "epoch": 2972} {"train_loss": -12.873929977416992, "global_step": 499436, "epoch": 2972} {"train_loss": -13.024587631225586, "global_step": 499437, "epoch": 2972} {"train_loss": -12.536052703857422, "global_step": 499438, "epoch": 2972} {"train_loss": -12.805074691772461, "global_step": 499439, "epoch": 2972} {"train_loss": -12.887985229492188, "global_step": 499440, "epoch": 2972} {"train_loss": -12.679295539855957, "global_step": 499441, "epoch": 2972} {"train_loss": -12.428423881530762, "global_step": 499442, "epoch": 2972} {"train_loss": -13.05042552947998, "global_step": 499443, "epoch": 2972} {"train_loss": -12.240377426147461, "global_step": 499444, "epoch": 2972} {"train_loss": -12.605813026428223, "global_step": 499445, "epoch": 2972} {"train_loss": -12.44719409942627, "global_step": 499446, "epoch": 2972} {"train_loss": -12.74329948425293, "global_step": 499447, "epoch": 2972} {"train_loss": -10.863821983337402, "global_step": 499448, "epoch": 2972} {"train_loss": -10.913261413574219, "global_step": 499449, "epoch": 2972} {"train_loss": -12.39235782623291, "global_step": 499450, "epoch": 2972} {"train_loss": -12.048954010009766, "global_step": 499451, "epoch": 2972} {"train_loss": -9.864042282104492, "global_step": 499452, "epoch": 2972} {"train_loss": -12.3152494430542, "global_step": 499453, "epoch": 2972} {"train_loss": -10.562519073486328, "global_step": 499454, "epoch": 2972} {"train_loss": -10.606517791748047, "global_step": 499455, "epoch": 2972} {"train_loss": -11.24726390838623, "global_step": 499456, "epoch": 2972} {"train_loss": -9.952980041503906, "global_step": 499457, "epoch": 2972} {"train_loss": -12.362714767456055, "global_step": 499458, "epoch": 2972} {"train_loss": -10.141533851623535, "global_step": 499459, "epoch": 2972} {"train_loss": -11.823517799377441, "global_step": 499460, "epoch": 2972} {"train_loss": -9.984855651855469, "global_step": 499461, "epoch": 2972} {"train_loss": -10.225496292114258, "global_step": 499462, "epoch": 2972} {"train_loss": -11.686935285727182, "global_step": 499463, "epoch": 2972, "val_loss": 319609.96875} {"train_loss": -11.491124153137207, "global_step": 499464, "epoch": 2973} {"train_loss": -9.779380798339844, "global_step": 499465, "epoch": 2973} {"train_loss": -10.972373008728027, "global_step": 499466, "epoch": 2973} {"train_loss": -9.584339141845703, "global_step": 499467, "epoch": 2973} {"train_loss": -10.166791915893555, "global_step": 499468, "epoch": 2973} {"train_loss": -9.698862075805664, "global_step": 499469, "epoch": 2973} {"train_loss": -9.268104553222656, "global_step": 499470, "epoch": 2973} {"train_loss": -9.927692413330078, "global_step": 499471, "epoch": 2973} {"train_loss": -9.402725219726562, "global_step": 499472, "epoch": 2973} {"train_loss": -9.634611129760742, "global_step": 499473, "epoch": 2973} {"train_loss": -11.372187614440918, "global_step": 499474, "epoch": 2973} {"train_loss": -9.389333724975586, "global_step": 499475, "epoch": 2973} {"train_loss": -10.091737747192383, "global_step": 499476, "epoch": 2973} {"train_loss": -10.300619125366211, "global_step": 499477, "epoch": 2973} {"train_loss": -10.992881774902344, "global_step": 499478, "epoch": 2973} {"train_loss": -10.49696159362793, "global_step": 499479, "epoch": 2973} {"train_loss": -10.957951545715332, "global_step": 499480, "epoch": 2973} {"train_loss": -10.942344665527344, "global_step": 499481, "epoch": 2973} {"train_loss": -10.631107330322266, "global_step": 499482, "epoch": 2973} {"train_loss": -11.181522369384766, "global_step": 499483, "epoch": 2973} {"train_loss": -11.082357406616211, "global_step": 499484, "epoch": 2973} {"train_loss": -11.054739952087402, "global_step": 499485, "epoch": 2973} {"train_loss": -10.516347885131836, "global_step": 499486, "epoch": 2973} {"train_loss": -10.76437759399414, "global_step": 499487, "epoch": 2973} {"train_loss": -10.716083526611328, "global_step": 499488, "epoch": 2973} {"train_loss": -10.877071380615234, "global_step": 499489, "epoch": 2973} {"train_loss": -11.491111755371094, "global_step": 499490, "epoch": 2973} {"train_loss": -10.757440567016602, "global_step": 499491, "epoch": 2973} {"train_loss": -10.632936477661133, "global_step": 499492, "epoch": 2973} {"train_loss": -10.85844898223877, "global_step": 499493, "epoch": 2973} {"train_loss": -10.163476943969727, "global_step": 499494, "epoch": 2973} {"train_loss": -11.29476547241211, "global_step": 499495, "epoch": 2973} {"train_loss": -11.921510696411133, "global_step": 499496, "epoch": 2973} {"train_loss": -10.931777000427246, "global_step": 499497, "epoch": 2973} {"train_loss": -11.48599624633789, "global_step": 499498, "epoch": 2973} {"train_loss": -11.287744522094727, "global_step": 499499, "epoch": 2973} {"train_loss": -11.856451988220215, "global_step": 499500, "epoch": 2973} {"train_loss": -11.432710647583008, "global_step": 499501, "epoch": 2973} {"train_loss": -11.827717781066895, "global_step": 499502, "epoch": 2973} {"train_loss": -11.361405372619629, "global_step": 499503, "epoch": 2973} {"train_loss": -11.182973861694336, "global_step": 499504, "epoch": 2973} {"train_loss": -10.892841339111328, "global_step": 499505, "epoch": 2973} {"train_loss": -11.949617385864258, "global_step": 499506, "epoch": 2973} {"train_loss": -11.10930061340332, "global_step": 499507, "epoch": 2973} {"train_loss": -11.856746673583984, "global_step": 499508, "epoch": 2973} {"train_loss": -10.877765655517578, "global_step": 499509, "epoch": 2973} {"train_loss": -11.582681655883789, "global_step": 499510, "epoch": 2973} {"train_loss": -11.5360746383667, "global_step": 499511, "epoch": 2973} {"train_loss": -11.948246955871582, "global_step": 499512, "epoch": 2973} {"train_loss": -11.692939758300781, "global_step": 499513, "epoch": 2973} {"train_loss": -11.686942100524902, "global_step": 499514, "epoch": 2973} {"train_loss": -11.818338394165039, "global_step": 499515, "epoch": 2973} {"train_loss": -11.76523208618164, "global_step": 499516, "epoch": 2973} {"train_loss": -11.9498872756958, "global_step": 499517, "epoch": 2973} {"train_loss": -12.000869750976562, "global_step": 499518, "epoch": 2973} {"train_loss": -12.194719314575195, "global_step": 499519, "epoch": 2973} {"train_loss": -11.98861312866211, "global_step": 499520, "epoch": 2973} {"train_loss": -12.184523582458496, "global_step": 499521, "epoch": 2973} {"train_loss": -12.308664321899414, "global_step": 499522, "epoch": 2973} {"train_loss": -11.962213516235352, "global_step": 499523, "epoch": 2973} {"train_loss": -12.553216934204102, "global_step": 499524, "epoch": 2973} {"train_loss": -12.423921585083008, "global_step": 499525, "epoch": 2973} {"train_loss": -12.47201156616211, "global_step": 499526, "epoch": 2973} {"train_loss": -12.242321968078613, "global_step": 499527, "epoch": 2973} {"train_loss": -12.710721015930176, "global_step": 499528, "epoch": 2973} {"train_loss": -12.21052360534668, "global_step": 499529, "epoch": 2973} {"train_loss": -12.388055801391602, "global_step": 499530, "epoch": 2973} {"train_loss": -12.48404312133789, "global_step": 499531, "epoch": 2973} {"train_loss": -12.357120513916016, "global_step": 499532, "epoch": 2973} {"train_loss": -12.514535903930664, "global_step": 499533, "epoch": 2973} {"train_loss": -12.250950813293457, "global_step": 499534, "epoch": 2973} {"train_loss": -12.64311408996582, "global_step": 499535, "epoch": 2973} {"train_loss": -12.413875579833984, "global_step": 499536, "epoch": 2973} {"train_loss": -12.685836791992188, "global_step": 499537, "epoch": 2973} {"train_loss": -12.322410583496094, "global_step": 499538, "epoch": 2973} {"train_loss": -12.4863920211792, "global_step": 499539, "epoch": 2973} {"train_loss": -12.56321907043457, "global_step": 499540, "epoch": 2973} {"train_loss": -12.578278541564941, "global_step": 499541, "epoch": 2973} {"train_loss": -12.51111125946045, "global_step": 499542, "epoch": 2973} {"train_loss": -12.627606391906738, "global_step": 499543, "epoch": 2973} {"train_loss": -12.653926849365234, "global_step": 499544, "epoch": 2973} {"train_loss": -12.607433319091797, "global_step": 499545, "epoch": 2973} {"train_loss": -12.606888771057129, "global_step": 499546, "epoch": 2973} {"train_loss": -12.723348617553711, "global_step": 499547, "epoch": 2973} {"train_loss": -12.543214797973633, "global_step": 499548, "epoch": 2973} {"train_loss": -12.663732528686523, "global_step": 499549, "epoch": 2973} {"train_loss": -12.83314323425293, "global_step": 499550, "epoch": 2973} {"train_loss": -12.756063461303711, "global_step": 499551, "epoch": 2973} {"train_loss": -12.735062599182129, "global_step": 499552, "epoch": 2973} {"train_loss": -12.753593444824219, "global_step": 499553, "epoch": 2973} {"train_loss": -12.806732177734375, "global_step": 499554, "epoch": 2973} {"train_loss": -12.802132606506348, "global_step": 499555, "epoch": 2973} {"train_loss": -12.667941093444824, "global_step": 499556, "epoch": 2973} {"train_loss": -12.84473991394043, "global_step": 499557, "epoch": 2973} {"train_loss": -12.622060775756836, "global_step": 499558, "epoch": 2973} {"train_loss": -12.721637725830078, "global_step": 499559, "epoch": 2973} {"train_loss": -12.776046752929688, "global_step": 499560, "epoch": 2973} {"train_loss": -12.857315063476562, "global_step": 499561, "epoch": 2973} {"train_loss": -12.902437210083008, "global_step": 499562, "epoch": 2973} {"train_loss": -12.564135551452637, "global_step": 499563, "epoch": 2973} {"train_loss": -12.900307655334473, "global_step": 499564, "epoch": 2973} {"train_loss": -12.836514472961426, "global_step": 499565, "epoch": 2973} {"train_loss": -12.860210418701172, "global_step": 499566, "epoch": 2973} {"train_loss": -12.979554176330566, "global_step": 499567, "epoch": 2973} {"train_loss": -12.884688377380371, "global_step": 499568, "epoch": 2973} {"train_loss": -13.090446472167969, "global_step": 499569, "epoch": 2973} {"train_loss": -12.865541458129883, "global_step": 499570, "epoch": 2973} {"train_loss": -13.03260612487793, "global_step": 499571, "epoch": 2973} {"train_loss": -12.975858688354492, "global_step": 499572, "epoch": 2973} {"train_loss": -12.976646423339844, "global_step": 499573, "epoch": 2973} {"train_loss": -13.051736831665039, "global_step": 499574, "epoch": 2973} {"train_loss": -13.08360481262207, "global_step": 499575, "epoch": 2973} {"train_loss": -13.018959999084473, "global_step": 499576, "epoch": 2973} {"train_loss": -13.12881851196289, "global_step": 499577, "epoch": 2973} {"train_loss": -13.004655838012695, "global_step": 499578, "epoch": 2973} {"train_loss": -12.9913969039917, "global_step": 499579, "epoch": 2973} {"train_loss": -12.997488975524902, "global_step": 499580, "epoch": 2973} {"train_loss": -13.011919021606445, "global_step": 499581, "epoch": 2973} {"train_loss": -13.049842834472656, "global_step": 499582, "epoch": 2973} {"train_loss": -12.9508056640625, "global_step": 499583, "epoch": 2973} {"train_loss": -12.981278419494629, "global_step": 499584, "epoch": 2973} {"train_loss": -13.136285781860352, "global_step": 499585, "epoch": 2973} {"train_loss": -13.153971672058105, "global_step": 499586, "epoch": 2973} {"train_loss": -13.151928901672363, "global_step": 499587, "epoch": 2973} {"train_loss": -13.228944778442383, "global_step": 499588, "epoch": 2973} {"train_loss": -12.727270126342773, "global_step": 499589, "epoch": 2973} {"train_loss": -13.091995239257812, "global_step": 499590, "epoch": 2973} {"train_loss": -13.039311408996582, "global_step": 499591, "epoch": 2973} {"train_loss": -13.025803565979004, "global_step": 499592, "epoch": 2973} {"train_loss": -13.121736526489258, "global_step": 499593, "epoch": 2973} {"train_loss": -12.833478927612305, "global_step": 499594, "epoch": 2973} {"train_loss": -13.017326354980469, "global_step": 499595, "epoch": 2973} {"train_loss": -12.926078796386719, "global_step": 499596, "epoch": 2973} {"train_loss": -13.100753784179688, "global_step": 499597, "epoch": 2973} {"train_loss": -13.15446662902832, "global_step": 499598, "epoch": 2973} {"train_loss": -12.994497299194336, "global_step": 499599, "epoch": 2973} {"train_loss": -12.766498565673828, "global_step": 499600, "epoch": 2973} {"train_loss": -12.996109008789062, "global_step": 499601, "epoch": 2973} {"train_loss": -13.063505172729492, "global_step": 499602, "epoch": 2973} {"train_loss": -13.019607543945312, "global_step": 499603, "epoch": 2973} {"train_loss": -13.00006103515625, "global_step": 499604, "epoch": 2973} {"train_loss": -12.971485137939453, "global_step": 499605, "epoch": 2973} {"train_loss": -12.962712287902832, "global_step": 499606, "epoch": 2973} {"train_loss": -12.923358917236328, "global_step": 499607, "epoch": 2973} {"train_loss": -12.982339859008789, "global_step": 499608, "epoch": 2973} {"train_loss": -12.906393051147461, "global_step": 499609, "epoch": 2973} {"train_loss": -13.04980754852295, "global_step": 499610, "epoch": 2973} {"train_loss": -13.006460189819336, "global_step": 499611, "epoch": 2973} {"train_loss": -12.86863899230957, "global_step": 499612, "epoch": 2973} {"train_loss": -13.116166114807129, "global_step": 499613, "epoch": 2973} {"train_loss": -12.829916000366211, "global_step": 499614, "epoch": 2973} {"train_loss": -12.683591842651367, "global_step": 499615, "epoch": 2973} {"train_loss": -12.49111270904541, "global_step": 499616, "epoch": 2973} {"train_loss": -12.810869216918945, "global_step": 499617, "epoch": 2973} {"train_loss": -12.507160186767578, "global_step": 499618, "epoch": 2973} {"train_loss": -12.703658103942871, "global_step": 499619, "epoch": 2973} {"train_loss": -12.160597801208496, "global_step": 499620, "epoch": 2973} {"train_loss": -12.780677795410156, "global_step": 499621, "epoch": 2973} {"train_loss": -11.533554077148438, "global_step": 499622, "epoch": 2973} {"train_loss": -11.579395294189453, "global_step": 499623, "epoch": 2973} {"train_loss": -11.613481521606445, "global_step": 499624, "epoch": 2973} {"train_loss": -10.380880355834961, "global_step": 499625, "epoch": 2973} {"train_loss": -11.548919677734375, "global_step": 499626, "epoch": 2973} {"train_loss": -9.96345329284668, "global_step": 499627, "epoch": 2973} {"train_loss": -9.734655380249023, "global_step": 499628, "epoch": 2973} {"train_loss": -9.929078102111816, "global_step": 499629, "epoch": 2973} {"train_loss": -9.996461868286133, "global_step": 499630, "epoch": 2973} {"train_loss": -12.047454169818334, "global_step": 499631, "epoch": 2973, "val_loss": 320241.46875} {"train_loss": -10.791204452514648, "global_step": 499632, "epoch": 2974} {"train_loss": -10.465094566345215, "global_step": 499633, "epoch": 2974} {"train_loss": -11.89403247833252, "global_step": 499634, "epoch": 2974} {"train_loss": -11.309213638305664, "global_step": 499635, "epoch": 2974} {"train_loss": -11.667819023132324, "global_step": 499636, "epoch": 2974} {"train_loss": -12.461645126342773, "global_step": 499637, "epoch": 2974} {"train_loss": -11.671371459960938, "global_step": 499638, "epoch": 2974} {"train_loss": -12.565380096435547, "global_step": 499639, "epoch": 2974} {"train_loss": -11.715295791625977, "global_step": 499640, "epoch": 2974} {"train_loss": -12.144950866699219, "global_step": 499641, "epoch": 2974} {"train_loss": -12.745366096496582, "global_step": 499642, "epoch": 2974} {"train_loss": -11.873274803161621, "global_step": 499643, "epoch": 2974} {"train_loss": -12.658753395080566, "global_step": 499644, "epoch": 2974} {"train_loss": -11.945937156677246, "global_step": 499645, "epoch": 2974} {"train_loss": -12.333540916442871, "global_step": 499646, "epoch": 2974} {"train_loss": -12.052352905273438, "global_step": 499647, "epoch": 2974} {"train_loss": -12.536139488220215, "global_step": 499648, "epoch": 2974} {"train_loss": -12.489917755126953, "global_step": 499649, "epoch": 2974} {"train_loss": -12.3058443069458, "global_step": 499650, "epoch": 2974} {"train_loss": -12.533390998840332, "global_step": 499651, "epoch": 2974} {"train_loss": -12.619049072265625, "global_step": 499652, "epoch": 2974} {"train_loss": -12.568024635314941, "global_step": 499653, "epoch": 2974} {"train_loss": -12.682696342468262, "global_step": 499654, "epoch": 2974} {"train_loss": -12.347921371459961, "global_step": 499655, "epoch": 2974} {"train_loss": -12.639707565307617, "global_step": 499656, "epoch": 2974} {"train_loss": -11.922725677490234, "global_step": 499657, "epoch": 2974} {"train_loss": -12.595229148864746, "global_step": 499658, "epoch": 2974} {"train_loss": -11.441536903381348, "global_step": 499659, "epoch": 2974} {"train_loss": -12.472710609436035, "global_step": 499660, "epoch": 2974} {"train_loss": -12.32587718963623, "global_step": 499661, "epoch": 2974} {"train_loss": -12.142049789428711, "global_step": 499662, "epoch": 2974} {"train_loss": -11.754375457763672, "global_step": 499663, "epoch": 2974} {"train_loss": -12.621927261352539, "global_step": 499664, "epoch": 2974} {"train_loss": -12.4475679397583, "global_step": 499665, "epoch": 2974} {"train_loss": -11.488542556762695, "global_step": 499666, "epoch": 2974} {"train_loss": -11.866289138793945, "global_step": 499667, "epoch": 2974} {"train_loss": -12.621500015258789, "global_step": 499668, "epoch": 2974} {"train_loss": -11.97795295715332, "global_step": 499669, "epoch": 2974} {"train_loss": -11.577329635620117, "global_step": 499670, "epoch": 2974} {"train_loss": -12.46794605255127, "global_step": 499671, "epoch": 2974} {"train_loss": -12.537788391113281, "global_step": 499672, "epoch": 2974} {"train_loss": -12.08649730682373, "global_step": 499673, "epoch": 2974} {"train_loss": -11.900503158569336, "global_step": 499674, "epoch": 2974} {"train_loss": -12.51882553100586, "global_step": 499675, "epoch": 2974} {"train_loss": -12.878337860107422, "global_step": 499676, "epoch": 2974} {"train_loss": -12.483263969421387, "global_step": 499677, "epoch": 2974} {"train_loss": -12.138750076293945, "global_step": 499678, "epoch": 2974} {"train_loss": -12.578452110290527, "global_step": 499679, "epoch": 2974} {"train_loss": -12.26765251159668, "global_step": 499680, "epoch": 2974} {"train_loss": -12.333295822143555, "global_step": 499681, "epoch": 2974} {"train_loss": -12.128463745117188, "global_step": 499682, "epoch": 2974} {"train_loss": -12.625425338745117, "global_step": 499683, "epoch": 2974} {"train_loss": -12.027559280395508, "global_step": 499684, "epoch": 2974} {"train_loss": -12.518568992614746, "global_step": 499685, "epoch": 2974} {"train_loss": -12.535520553588867, "global_step": 499686, "epoch": 2974} {"train_loss": -12.387530326843262, "global_step": 499687, "epoch": 2974} {"train_loss": -12.780004501342773, "global_step": 499688, "epoch": 2974} {"train_loss": -12.456790924072266, "global_step": 499689, "epoch": 2974} {"train_loss": -12.461690902709961, "global_step": 499690, "epoch": 2974} {"train_loss": -12.142024993896484, "global_step": 499691, "epoch": 2974} {"train_loss": -12.60838508605957, "global_step": 499692, "epoch": 2974} {"train_loss": -12.41572380065918, "global_step": 499693, "epoch": 2974} {"train_loss": -12.33513355255127, "global_step": 499694, "epoch": 2974} {"train_loss": -12.027331352233887, "global_step": 499695, "epoch": 2974} {"train_loss": -12.442912101745605, "global_step": 499696, "epoch": 2974} {"train_loss": -12.643073081970215, "global_step": 499697, "epoch": 2974} {"train_loss": -12.380233764648438, "global_step": 499698, "epoch": 2974} {"train_loss": -12.056415557861328, "global_step": 499699, "epoch": 2974} {"train_loss": -12.6957426071167, "global_step": 499700, "epoch": 2974} {"train_loss": -12.314321517944336, "global_step": 499701, "epoch": 2974} {"train_loss": -12.164268493652344, "global_step": 499702, "epoch": 2974} {"train_loss": -12.12922477722168, "global_step": 499703, "epoch": 2974} {"train_loss": -12.405603408813477, "global_step": 499704, "epoch": 2974} {"train_loss": -10.874151229858398, "global_step": 499705, "epoch": 2974} {"train_loss": -12.141897201538086, "global_step": 499706, "epoch": 2974} {"train_loss": -12.156940460205078, "global_step": 499707, "epoch": 2974} {"train_loss": -12.16347885131836, "global_step": 499708, "epoch": 2974} {"train_loss": -11.538362503051758, "global_step": 499709, "epoch": 2974} {"train_loss": -12.82667350769043, "global_step": 499710, "epoch": 2974} {"train_loss": -11.803512573242188, "global_step": 499711, "epoch": 2974} {"train_loss": -10.327556610107422, "global_step": 499712, "epoch": 2974} {"train_loss": -11.547953605651855, "global_step": 499713, "epoch": 2974} {"train_loss": -12.39956283569336, "global_step": 499714, "epoch": 2974} {"train_loss": -11.910733222961426, "global_step": 499715, "epoch": 2974} {"train_loss": -11.992879867553711, "global_step": 499716, "epoch": 2974} {"train_loss": -12.08786392211914, "global_step": 499717, "epoch": 2974} {"train_loss": -10.759780883789062, "global_step": 499718, "epoch": 2974} {"train_loss": -11.229061126708984, "global_step": 499719, "epoch": 2974} {"train_loss": -12.301050186157227, "global_step": 499720, "epoch": 2974} {"train_loss": -11.582891464233398, "global_step": 499721, "epoch": 2974} {"train_loss": -11.180866241455078, "global_step": 499722, "epoch": 2974} {"train_loss": -12.144983291625977, "global_step": 499723, "epoch": 2974} {"train_loss": -11.364797592163086, "global_step": 499724, "epoch": 2974} {"train_loss": -10.39877700805664, "global_step": 499725, "epoch": 2974} {"train_loss": -11.3097562789917, "global_step": 499726, "epoch": 2974} {"train_loss": -11.284721374511719, "global_step": 499727, "epoch": 2974} {"train_loss": -11.144569396972656, "global_step": 499728, "epoch": 2974} {"train_loss": -12.102131843566895, "global_step": 499729, "epoch": 2974} {"train_loss": -12.170832633972168, "global_step": 499730, "epoch": 2974} {"train_loss": -11.913703918457031, "global_step": 499731, "epoch": 2974} {"train_loss": -11.9248685836792, "global_step": 499732, "epoch": 2974} {"train_loss": -12.279226303100586, "global_step": 499733, "epoch": 2974} {"train_loss": -12.011391639709473, "global_step": 499734, "epoch": 2974} {"train_loss": -12.398481369018555, "global_step": 499735, "epoch": 2974} {"train_loss": -11.204357147216797, "global_step": 499736, "epoch": 2974} {"train_loss": -11.538056373596191, "global_step": 499737, "epoch": 2974} {"train_loss": -10.446114540100098, "global_step": 499738, "epoch": 2974} {"train_loss": -10.792887687683105, "global_step": 499739, "epoch": 2974} {"train_loss": -10.904370307922363, "global_step": 499740, "epoch": 2974} {"train_loss": -10.061027526855469, "global_step": 499741, "epoch": 2974} {"train_loss": -8.769920349121094, "global_step": 499742, "epoch": 2974} {"train_loss": -9.913763046264648, "global_step": 499743, "epoch": 2974} {"train_loss": -10.480697631835938, "global_step": 499744, "epoch": 2974} {"train_loss": -11.096654891967773, "global_step": 499745, "epoch": 2974} {"train_loss": -10.247633934020996, "global_step": 499746, "epoch": 2974} {"train_loss": -11.121309280395508, "global_step": 499747, "epoch": 2974} {"train_loss": -10.926542282104492, "global_step": 499748, "epoch": 2974} {"train_loss": -10.322197914123535, "global_step": 499749, "epoch": 2974} {"train_loss": -10.846134185791016, "global_step": 499750, "epoch": 2974} {"train_loss": -10.944276809692383, "global_step": 499751, "epoch": 2974} {"train_loss": -11.196402549743652, "global_step": 499752, "epoch": 2974} {"train_loss": -10.481359481811523, "global_step": 499753, "epoch": 2974} {"train_loss": -9.814884185791016, "global_step": 499754, "epoch": 2974} {"train_loss": -11.302127838134766, "global_step": 499755, "epoch": 2974} {"train_loss": -10.42271900177002, "global_step": 499756, "epoch": 2974} {"train_loss": -10.340995788574219, "global_step": 499757, "epoch": 2974} {"train_loss": -10.687532424926758, "global_step": 499758, "epoch": 2974} {"train_loss": -10.994315147399902, "global_step": 499759, "epoch": 2974} {"train_loss": -10.823083877563477, "global_step": 499760, "epoch": 2974} {"train_loss": -11.486668586730957, "global_step": 499761, "epoch": 2974} {"train_loss": -10.784843444824219, "global_step": 499762, "epoch": 2974} {"train_loss": -10.973621368408203, "global_step": 499763, "epoch": 2974} {"train_loss": -11.845931053161621, "global_step": 499764, "epoch": 2974} {"train_loss": -11.358630180358887, "global_step": 499765, "epoch": 2974} {"train_loss": -11.835772514343262, "global_step": 499766, "epoch": 2974} {"train_loss": -11.602254867553711, "global_step": 499767, "epoch": 2974} {"train_loss": -12.342987060546875, "global_step": 499768, "epoch": 2974} {"train_loss": -11.615312576293945, "global_step": 499769, "epoch": 2974} {"train_loss": -11.996496200561523, "global_step": 499770, "epoch": 2974} {"train_loss": -12.059356689453125, "global_step": 499771, "epoch": 2974} {"train_loss": -11.777339935302734, "global_step": 499772, "epoch": 2974} {"train_loss": -12.043201446533203, "global_step": 499773, "epoch": 2974} {"train_loss": -12.431836128234863, "global_step": 499774, "epoch": 2974} {"train_loss": -11.709680557250977, "global_step": 499775, "epoch": 2974} {"train_loss": -12.385042190551758, "global_step": 499776, "epoch": 2974} {"train_loss": -11.990933418273926, "global_step": 499777, "epoch": 2974} {"train_loss": -12.01527214050293, "global_step": 499778, "epoch": 2974} {"train_loss": -12.291214942932129, "global_step": 499779, "epoch": 2974} {"train_loss": -12.207021713256836, "global_step": 499780, "epoch": 2974} {"train_loss": -12.24285888671875, "global_step": 499781, "epoch": 2974} {"train_loss": -11.937610626220703, "global_step": 499782, "epoch": 2974} {"train_loss": -12.291393280029297, "global_step": 499783, "epoch": 2974} {"train_loss": -12.436551094055176, "global_step": 499784, "epoch": 2974} {"train_loss": -12.153179168701172, "global_step": 499785, "epoch": 2974} {"train_loss": -12.499197006225586, "global_step": 499786, "epoch": 2974} {"train_loss": -12.40928840637207, "global_step": 499787, "epoch": 2974} {"train_loss": -12.246858596801758, "global_step": 499788, "epoch": 2974} {"train_loss": -12.702079772949219, "global_step": 499789, "epoch": 2974} {"train_loss": -12.468488693237305, "global_step": 499790, "epoch": 2974} {"train_loss": -12.545692443847656, "global_step": 499791, "epoch": 2974} {"train_loss": -12.626066207885742, "global_step": 499792, "epoch": 2974} {"train_loss": -12.554007530212402, "global_step": 499793, "epoch": 2974} {"train_loss": -12.462211608886719, "global_step": 499794, "epoch": 2974} {"train_loss": -12.454205513000488, "global_step": 499795, "epoch": 2974} {"train_loss": -12.559147834777832, "global_step": 499796, "epoch": 2974} {"train_loss": -12.599599838256836, "global_step": 499797, "epoch": 2974} {"train_loss": -12.534299850463867, "global_step": 499798, "epoch": 2974} {"train_loss": -11.87593888668787, "global_step": 499799, "epoch": 2974, "val_loss": 316020.21875} {"train_loss": -12.582537651062012, "global_step": 499800, "epoch": 2975} {"train_loss": -12.67508602142334, "global_step": 499801, "epoch": 2975} {"train_loss": -12.673620223999023, "global_step": 499802, "epoch": 2975} {"train_loss": -12.819131851196289, "global_step": 499803, "epoch": 2975} {"train_loss": -12.883552551269531, "global_step": 499804, "epoch": 2975} {"train_loss": -12.890352249145508, "global_step": 499805, "epoch": 2975} {"train_loss": -12.722640037536621, "global_step": 499806, "epoch": 2975} {"train_loss": -12.77269172668457, "global_step": 499807, "epoch": 2975} {"train_loss": -12.82811164855957, "global_step": 499808, "epoch": 2975} {"train_loss": -12.730659484863281, "global_step": 499809, "epoch": 2975} {"train_loss": -12.659961700439453, "global_step": 499810, "epoch": 2975} {"train_loss": -12.648761749267578, "global_step": 499811, "epoch": 2975} {"train_loss": -12.770370483398438, "global_step": 499812, "epoch": 2975} {"train_loss": -12.736988067626953, "global_step": 499813, "epoch": 2975} {"train_loss": -12.665668487548828, "global_step": 499814, "epoch": 2975} {"train_loss": -12.738740921020508, "global_step": 499815, "epoch": 2975} {"train_loss": -12.826784133911133, "global_step": 499816, "epoch": 2975} {"train_loss": -12.496755599975586, "global_step": 499817, "epoch": 2975} {"train_loss": -12.891544342041016, "global_step": 499818, "epoch": 2975} {"train_loss": -12.813005447387695, "global_step": 499819, "epoch": 2975} {"train_loss": -12.831975936889648, "global_step": 499820, "epoch": 2975} {"train_loss": -12.787723541259766, "global_step": 499821, "epoch": 2975} {"train_loss": -12.959217071533203, "global_step": 499822, "epoch": 2975} {"train_loss": -12.940574645996094, "global_step": 499823, "epoch": 2975} {"train_loss": -12.728338241577148, "global_step": 499824, "epoch": 2975} {"train_loss": -12.913596153259277, "global_step": 499825, "epoch": 2975} {"train_loss": -12.782684326171875, "global_step": 499826, "epoch": 2975} {"train_loss": -12.865058898925781, "global_step": 499827, "epoch": 2975} {"train_loss": -12.834291458129883, "global_step": 499828, "epoch": 2975} {"train_loss": -13.03355598449707, "global_step": 499829, "epoch": 2975} {"train_loss": -12.972576141357422, "global_step": 499830, "epoch": 2975} {"train_loss": -13.036152839660645, "global_step": 499831, "epoch": 2975} {"train_loss": -12.835853576660156, "global_step": 499832, "epoch": 2975} {"train_loss": -12.886674880981445, "global_step": 499833, "epoch": 2975} {"train_loss": -12.994563102722168, "global_step": 499834, "epoch": 2975} {"train_loss": -13.045585632324219, "global_step": 499835, "epoch": 2975} {"train_loss": -13.035618782043457, "global_step": 499836, "epoch": 2975} {"train_loss": -12.792871475219727, "global_step": 499837, "epoch": 2975} {"train_loss": -12.946052551269531, "global_step": 499838, "epoch": 2975} {"train_loss": -13.108867645263672, "global_step": 499839, "epoch": 2975} {"train_loss": -13.006858825683594, "global_step": 499840, "epoch": 2975} {"train_loss": -13.029024124145508, "global_step": 499841, "epoch": 2975} {"train_loss": -12.8587064743042, "global_step": 499842, "epoch": 2975} {"train_loss": -13.043596267700195, "global_step": 499843, "epoch": 2975} {"train_loss": -13.063220977783203, "global_step": 499844, "epoch": 2975} {"train_loss": -12.854856491088867, "global_step": 499845, "epoch": 2975} {"train_loss": -13.037307739257812, "global_step": 499846, "epoch": 2975} {"train_loss": -13.021841049194336, "global_step": 499847, "epoch": 2975} {"train_loss": -13.23733901977539, "global_step": 499848, "epoch": 2975} {"train_loss": -12.891796112060547, "global_step": 499849, "epoch": 2975} {"train_loss": -12.860862731933594, "global_step": 499850, "epoch": 2975} {"train_loss": -13.228721618652344, "global_step": 499851, "epoch": 2975} {"train_loss": -13.0536470413208, "global_step": 499852, "epoch": 2975} {"train_loss": -13.109800338745117, "global_step": 499853, "epoch": 2975} {"train_loss": -13.022375106811523, "global_step": 499854, "epoch": 2975} {"train_loss": -12.949193000793457, "global_step": 499855, "epoch": 2975} {"train_loss": -12.938932418823242, "global_step": 499856, "epoch": 2975} {"train_loss": -12.557360649108887, "global_step": 499857, "epoch": 2975} {"train_loss": -12.55077075958252, "global_step": 499858, "epoch": 2975} {"train_loss": -12.989779472351074, "global_step": 499859, "epoch": 2975} {"train_loss": -13.02325439453125, "global_step": 499860, "epoch": 2975} {"train_loss": -12.402750015258789, "global_step": 499861, "epoch": 2975} {"train_loss": -12.241519927978516, "global_step": 499862, "epoch": 2975} {"train_loss": -12.682567596435547, "global_step": 499863, "epoch": 2975} {"train_loss": -12.63595962524414, "global_step": 499864, "epoch": 2975} {"train_loss": -12.240873336791992, "global_step": 499865, "epoch": 2975} {"train_loss": -11.90460205078125, "global_step": 499866, "epoch": 2975} {"train_loss": -12.551340103149414, "global_step": 499867, "epoch": 2975} {"train_loss": -11.928387641906738, "global_step": 499868, "epoch": 2975} {"train_loss": -12.33381462097168, "global_step": 499869, "epoch": 2975} {"train_loss": -12.439292907714844, "global_step": 499870, "epoch": 2975} {"train_loss": -11.832727432250977, "global_step": 499871, "epoch": 2975} {"train_loss": -10.623058319091797, "global_step": 499872, "epoch": 2975} {"train_loss": -11.110454559326172, "global_step": 499873, "epoch": 2975} {"train_loss": -11.264978408813477, "global_step": 499874, "epoch": 2975} {"train_loss": -11.659649848937988, "global_step": 499875, "epoch": 2975} {"train_loss": -11.724742889404297, "global_step": 499876, "epoch": 2975} {"train_loss": -10.585744857788086, "global_step": 499877, "epoch": 2975} {"train_loss": -12.823834419250488, "global_step": 499878, "epoch": 2975} {"train_loss": -11.345963478088379, "global_step": 499879, "epoch": 2975} {"train_loss": -11.252313613891602, "global_step": 499880, "epoch": 2975} {"train_loss": -11.949335098266602, "global_step": 499881, "epoch": 2975} {"train_loss": -11.680623054504395, "global_step": 499882, "epoch": 2975} {"train_loss": -10.525736808776855, "global_step": 499883, "epoch": 2975} {"train_loss": -12.415323257446289, "global_step": 499884, "epoch": 2975} {"train_loss": -10.101036071777344, "global_step": 499885, "epoch": 2975} {"train_loss": -12.071287155151367, "global_step": 499886, "epoch": 2975} {"train_loss": -11.147063255310059, "global_step": 499887, "epoch": 2975} {"train_loss": -11.370893478393555, "global_step": 499888, "epoch": 2975} {"train_loss": -12.251951217651367, "global_step": 499889, "epoch": 2975} {"train_loss": -11.72053337097168, "global_step": 499890, "epoch": 2975} {"train_loss": -11.915868759155273, "global_step": 499891, "epoch": 2975} {"train_loss": -10.921538352966309, "global_step": 499892, "epoch": 2975} {"train_loss": -11.218385696411133, "global_step": 499893, "epoch": 2975} {"train_loss": -11.872125625610352, "global_step": 499894, "epoch": 2975} {"train_loss": -11.486957550048828, "global_step": 499895, "epoch": 2975} {"train_loss": -11.749822616577148, "global_step": 499896, "epoch": 2975} {"train_loss": -11.926050186157227, "global_step": 499897, "epoch": 2975} {"train_loss": -11.654214859008789, "global_step": 499898, "epoch": 2975} {"train_loss": -11.231279373168945, "global_step": 499899, "epoch": 2975} {"train_loss": -11.889163970947266, "global_step": 499900, "epoch": 2975} {"train_loss": -11.949821472167969, "global_step": 499901, "epoch": 2975} {"train_loss": -11.63317584991455, "global_step": 499902, "epoch": 2975} {"train_loss": -11.702324867248535, "global_step": 499903, "epoch": 2975} {"train_loss": -12.231485366821289, "global_step": 499904, "epoch": 2975} {"train_loss": -11.680113792419434, "global_step": 499905, "epoch": 2975} {"train_loss": -11.880743026733398, "global_step": 499906, "epoch": 2975} {"train_loss": -11.320470809936523, "global_step": 499907, "epoch": 2975} {"train_loss": -11.640593528747559, "global_step": 499908, "epoch": 2975} {"train_loss": -11.445941925048828, "global_step": 499909, "epoch": 2975} {"train_loss": -10.697587013244629, "global_step": 499910, "epoch": 2975} {"train_loss": -11.781063079833984, "global_step": 499911, "epoch": 2975} {"train_loss": -11.128375053405762, "global_step": 499912, "epoch": 2975} {"train_loss": -11.958157539367676, "global_step": 499913, "epoch": 2975} {"train_loss": -11.547489166259766, "global_step": 499914, "epoch": 2975} {"train_loss": -11.875510215759277, "global_step": 499915, "epoch": 2975} {"train_loss": -12.24675178527832, "global_step": 499916, "epoch": 2975} {"train_loss": -12.212905883789062, "global_step": 499917, "epoch": 2975} {"train_loss": -11.868841171264648, "global_step": 499918, "epoch": 2975} {"train_loss": -12.219562530517578, "global_step": 499919, "epoch": 2975} {"train_loss": -11.837843894958496, "global_step": 499920, "epoch": 2975} {"train_loss": -12.052922248840332, "global_step": 499921, "epoch": 2975} {"train_loss": -12.372865676879883, "global_step": 499922, "epoch": 2975} {"train_loss": -11.967510223388672, "global_step": 499923, "epoch": 2975} {"train_loss": -12.345409393310547, "global_step": 499924, "epoch": 2975} {"train_loss": -11.844496726989746, "global_step": 499925, "epoch": 2975} {"train_loss": -11.987364768981934, "global_step": 499926, "epoch": 2975} {"train_loss": -12.29879379272461, "global_step": 499927, "epoch": 2975} {"train_loss": -12.111659049987793, "global_step": 499928, "epoch": 2975} {"train_loss": -12.504880905151367, "global_step": 499929, "epoch": 2975} {"train_loss": -12.141841888427734, "global_step": 499930, "epoch": 2975} {"train_loss": -12.394153594970703, "global_step": 499931, "epoch": 2975} {"train_loss": -12.510367393493652, "global_step": 499932, "epoch": 2975} {"train_loss": -12.284669876098633, "global_step": 499933, "epoch": 2975} {"train_loss": -12.578474998474121, "global_step": 499934, "epoch": 2975} {"train_loss": -12.56407642364502, "global_step": 499935, "epoch": 2975} {"train_loss": -12.299423217773438, "global_step": 499936, "epoch": 2975} {"train_loss": -12.706338882446289, "global_step": 499937, "epoch": 2975} {"train_loss": -12.191537857055664, "global_step": 499938, "epoch": 2975} {"train_loss": -12.470548629760742, "global_step": 499939, "epoch": 2975} {"train_loss": -12.134550094604492, "global_step": 499940, "epoch": 2975} {"train_loss": -12.575061798095703, "global_step": 499941, "epoch": 2975} {"train_loss": -12.114011764526367, "global_step": 499942, "epoch": 2975} {"train_loss": -12.546177864074707, "global_step": 499943, "epoch": 2975} {"train_loss": -12.240800857543945, "global_step": 499944, "epoch": 2975} {"train_loss": -12.502857208251953, "global_step": 499945, "epoch": 2975} {"train_loss": -12.4544677734375, "global_step": 499946, "epoch": 2975} {"train_loss": -12.549059867858887, "global_step": 499947, "epoch": 2975} {"train_loss": -12.61685562133789, "global_step": 499948, "epoch": 2975} {"train_loss": -12.442429542541504, "global_step": 499949, "epoch": 2975} {"train_loss": -12.715707778930664, "global_step": 499950, "epoch": 2975} {"train_loss": -12.068631172180176, "global_step": 499951, "epoch": 2975} {"train_loss": -12.32949161529541, "global_step": 499952, "epoch": 2975} {"train_loss": -12.103772163391113, "global_step": 499953, "epoch": 2975} {"train_loss": -12.119894027709961, "global_step": 499954, "epoch": 2975} {"train_loss": -12.110859870910645, "global_step": 499955, "epoch": 2975} {"train_loss": -11.750201225280762, "global_step": 499956, "epoch": 2975} {"train_loss": -11.794896125793457, "global_step": 499957, "epoch": 2975} {"train_loss": -11.632608413696289, "global_step": 499958, "epoch": 2975} {"train_loss": -11.32662582397461, "global_step": 499959, "epoch": 2975} {"train_loss": -10.637195587158203, "global_step": 499960, "epoch": 2975} {"train_loss": -11.137434005737305, "global_step": 499961, "epoch": 2975} {"train_loss": -12.185465812683105, "global_step": 499962, "epoch": 2975} {"train_loss": -11.471792221069336, "global_step": 499963, "epoch": 2975} {"train_loss": -11.41104507446289, "global_step": 499964, "epoch": 2975} {"train_loss": -12.082677841186523, "global_step": 499965, "epoch": 2975} {"train_loss": -12.405889511108398, "global_step": 499966, "epoch": 2975} {"train_loss": -12.264237415222894, "global_step": 499967, "epoch": 2975, "val_loss": 319692.46875, "train_action_mse_error": 1.1663492918014526} {"train_loss": -12.460867881774902, "global_step": 499968, "epoch": 2976} {"train_loss": -12.468449592590332, "global_step": 499969, "epoch": 2976} {"train_loss": -12.45886516571045, "global_step": 499970, "epoch": 2976} {"train_loss": -12.289932250976562, "global_step": 499971, "epoch": 2976} {"train_loss": -12.319458961486816, "global_step": 499972, "epoch": 2976} {"train_loss": -12.070211410522461, "global_step": 499973, "epoch": 2976} {"train_loss": -12.259031295776367, "global_step": 499974, "epoch": 2976} {"train_loss": -12.032651901245117, "global_step": 499975, "epoch": 2976} {"train_loss": -12.358098983764648, "global_step": 499976, "epoch": 2976} {"train_loss": -12.264579772949219, "global_step": 499977, "epoch": 2976} {"train_loss": -12.257964134216309, "global_step": 499978, "epoch": 2976} {"train_loss": -12.124298095703125, "global_step": 499979, "epoch": 2976} {"train_loss": -12.451162338256836, "global_step": 499980, "epoch": 2976} {"train_loss": -12.39096450805664, "global_step": 499981, "epoch": 2976} {"train_loss": -12.234902381896973, "global_step": 499982, "epoch": 2976} {"train_loss": -12.751922607421875, "global_step": 499983, "epoch": 2976} {"train_loss": -12.236284255981445, "global_step": 499984, "epoch": 2976} {"train_loss": -12.45667839050293, "global_step": 499985, "epoch": 2976} {"train_loss": -12.594688415527344, "global_step": 499986, "epoch": 2976} {"train_loss": -12.492008209228516, "global_step": 499987, "epoch": 2976} {"train_loss": -12.444048881530762, "global_step": 499988, "epoch": 2976} {"train_loss": -12.29609203338623, "global_step": 499989, "epoch": 2976} {"train_loss": -12.260368347167969, "global_step": 499990, "epoch": 2976} {"train_loss": -12.368770599365234, "global_step": 499991, "epoch": 2976} {"train_loss": -12.016486167907715, "global_step": 499992, "epoch": 2976} {"train_loss": -12.198101997375488, "global_step": 499993, "epoch": 2976} {"train_loss": -11.789324760437012, "global_step": 499994, "epoch": 2976} {"train_loss": -12.570941925048828, "global_step": 499995, "epoch": 2976} {"train_loss": -12.279655456542969, "global_step": 499996, "epoch": 2976} {"train_loss": -12.405036926269531, "global_step": 499997, "epoch": 2976} {"train_loss": -12.436816215515137, "global_step": 499998, "epoch": 2976} {"train_loss": -12.03262996673584, "global_step": 499999, "epoch": 2976} {"train_loss": -12.179004669189453, "global_step": 500000, "epoch": 2976} {"train_loss": -12.525678634643555, "global_step": 500001, "epoch": 2976} {"train_loss": -12.26481819152832, "global_step": 500002, "epoch": 2976} {"train_loss": -12.560290336608887, "global_step": 500003, "epoch": 2976} {"train_loss": -12.092477798461914, "global_step": 500004, "epoch": 2976} {"train_loss": -11.511154174804688, "global_step": 500005, "epoch": 2976} {"train_loss": -12.067327499389648, "global_step": 500006, "epoch": 2976} {"train_loss": -11.68356704711914, "global_step": 500007, "epoch": 2976} {"train_loss": -12.565299987792969, "global_step": 500008, "epoch": 2976} {"train_loss": -11.856046676635742, "global_step": 500009, "epoch": 2976} {"train_loss": -11.90695858001709, "global_step": 500010, "epoch": 2976} {"train_loss": -11.816702842712402, "global_step": 500011, "epoch": 2976} {"train_loss": -11.668564796447754, "global_step": 500012, "epoch": 2976} {"train_loss": -11.895678520202637, "global_step": 500013, "epoch": 2976} {"train_loss": -11.76931095123291, "global_step": 500014, "epoch": 2976} {"train_loss": -12.239021301269531, "global_step": 500015, "epoch": 2976} {"train_loss": -11.452693939208984, "global_step": 500016, "epoch": 2976} {"train_loss": -12.768970489501953, "global_step": 500017, "epoch": 2976} {"train_loss": -11.593568801879883, "global_step": 500018, "epoch": 2976} {"train_loss": -12.425252914428711, "global_step": 500019, "epoch": 2976} {"train_loss": -11.92253303527832, "global_step": 500020, "epoch": 2976} {"train_loss": -12.273998260498047, "global_step": 500021, "epoch": 2976} {"train_loss": -12.440240859985352, "global_step": 500022, "epoch": 2976} {"train_loss": -12.003514289855957, "global_step": 500023, "epoch": 2976} {"train_loss": -12.338911056518555, "global_step": 500024, "epoch": 2976} {"train_loss": -12.458700180053711, "global_step": 500025, "epoch": 2976} {"train_loss": -12.618138313293457, "global_step": 500026, "epoch": 2976} {"train_loss": -12.352435111999512, "global_step": 500027, "epoch": 2976} {"train_loss": -12.464428901672363, "global_step": 500028, "epoch": 2976} {"train_loss": -12.463869094848633, "global_step": 500029, "epoch": 2976} {"train_loss": -12.514120101928711, "global_step": 500030, "epoch": 2976} {"train_loss": -12.78056812286377, "global_step": 500031, "epoch": 2976} {"train_loss": -12.453713417053223, "global_step": 500032, "epoch": 2976} {"train_loss": -12.88848876953125, "global_step": 500033, "epoch": 2976} {"train_loss": -12.669504165649414, "global_step": 500034, "epoch": 2976} {"train_loss": -12.909141540527344, "global_step": 500035, "epoch": 2976} {"train_loss": -12.57629108428955, "global_step": 500036, "epoch": 2976} {"train_loss": -12.503424644470215, "global_step": 500037, "epoch": 2976} {"train_loss": -12.523975372314453, "global_step": 500038, "epoch": 2976} {"train_loss": -12.867635726928711, "global_step": 500039, "epoch": 2976} {"train_loss": -12.630495071411133, "global_step": 500040, "epoch": 2976} {"train_loss": -12.962204933166504, "global_step": 500041, "epoch": 2976} {"train_loss": -12.667566299438477, "global_step": 500042, "epoch": 2976} {"train_loss": -12.740732192993164, "global_step": 500043, "epoch": 2976} {"train_loss": -12.709973335266113, "global_step": 500044, "epoch": 2976} {"train_loss": -12.666831970214844, "global_step": 500045, "epoch": 2976} {"train_loss": -12.554274559020996, "global_step": 500046, "epoch": 2976} {"train_loss": -12.874616622924805, "global_step": 500047, "epoch": 2976} {"train_loss": -12.646608352661133, "global_step": 500048, "epoch": 2976} {"train_loss": -12.546886444091797, "global_step": 500049, "epoch": 2976} {"train_loss": -12.647366523742676, "global_step": 500050, "epoch": 2976} {"train_loss": -12.904841423034668, "global_step": 500051, "epoch": 2976} {"train_loss": -12.65719223022461, "global_step": 500052, "epoch": 2976} {"train_loss": -12.848426818847656, "global_step": 500053, "epoch": 2976} {"train_loss": -12.74917221069336, "global_step": 500054, "epoch": 2976} {"train_loss": -12.92176628112793, "global_step": 500055, "epoch": 2976} {"train_loss": -12.749671936035156, "global_step": 500056, "epoch": 2976} {"train_loss": -12.829032897949219, "global_step": 500057, "epoch": 2976} {"train_loss": -12.880762100219727, "global_step": 500058, "epoch": 2976} {"train_loss": -12.654338836669922, "global_step": 500059, "epoch": 2976} {"train_loss": -12.840688705444336, "global_step": 500060, "epoch": 2976} {"train_loss": -12.805826187133789, "global_step": 500061, "epoch": 2976} {"train_loss": -12.885980606079102, "global_step": 500062, "epoch": 2976} {"train_loss": -12.86996078491211, "global_step": 500063, "epoch": 2976} {"train_loss": -12.747650146484375, "global_step": 500064, "epoch": 2976} {"train_loss": -12.98153305053711, "global_step": 500065, "epoch": 2976} {"train_loss": -12.61373233795166, "global_step": 500066, "epoch": 2976} {"train_loss": -12.551568031311035, "global_step": 500067, "epoch": 2976} {"train_loss": -13.134138107299805, "global_step": 500068, "epoch": 2976} {"train_loss": -12.374971389770508, "global_step": 500069, "epoch": 2976} {"train_loss": -12.871606826782227, "global_step": 500070, "epoch": 2976} {"train_loss": -12.907110214233398, "global_step": 500071, "epoch": 2976} {"train_loss": -12.665324211120605, "global_step": 500072, "epoch": 2976} {"train_loss": -12.549606323242188, "global_step": 500073, "epoch": 2976} {"train_loss": -12.967432022094727, "global_step": 500074, "epoch": 2976} {"train_loss": -12.720877647399902, "global_step": 500075, "epoch": 2976} {"train_loss": -12.473480224609375, "global_step": 500076, "epoch": 2976} {"train_loss": -12.589723587036133, "global_step": 500077, "epoch": 2976} {"train_loss": -12.33127212524414, "global_step": 500078, "epoch": 2976} {"train_loss": -12.374590873718262, "global_step": 500079, "epoch": 2976} {"train_loss": -12.457648277282715, "global_step": 500080, "epoch": 2976} {"train_loss": -12.656438827514648, "global_step": 500081, "epoch": 2976} {"train_loss": -12.717459678649902, "global_step": 500082, "epoch": 2976} {"train_loss": -11.827789306640625, "global_step": 500083, "epoch": 2976} {"train_loss": -12.621752738952637, "global_step": 500084, "epoch": 2976} {"train_loss": -12.102692604064941, "global_step": 500085, "epoch": 2976} {"train_loss": -11.391988754272461, "global_step": 500086, "epoch": 2976} {"train_loss": -11.768320083618164, "global_step": 500087, "epoch": 2976} {"train_loss": -11.703460693359375, "global_step": 500088, "epoch": 2976} {"train_loss": -11.511516571044922, "global_step": 500089, "epoch": 2976} {"train_loss": -11.630071640014648, "global_step": 500090, "epoch": 2976} {"train_loss": -11.99648380279541, "global_step": 500091, "epoch": 2976} {"train_loss": -11.80858325958252, "global_step": 500092, "epoch": 2976} {"train_loss": -12.06251335144043, "global_step": 500093, "epoch": 2976} {"train_loss": -12.147886276245117, "global_step": 500094, "epoch": 2976} {"train_loss": -12.054693222045898, "global_step": 500095, "epoch": 2976} {"train_loss": -10.659738540649414, "global_step": 500096, "epoch": 2976} {"train_loss": -12.462348937988281, "global_step": 500097, "epoch": 2976} {"train_loss": -12.003873825073242, "global_step": 500098, "epoch": 2976} {"train_loss": -10.871355056762695, "global_step": 500099, "epoch": 2976} {"train_loss": -10.519654273986816, "global_step": 500100, "epoch": 2976} {"train_loss": -10.263240814208984, "global_step": 500101, "epoch": 2976} {"train_loss": -11.930532455444336, "global_step": 500102, "epoch": 2976} {"train_loss": -11.345492362976074, "global_step": 500103, "epoch": 2976} {"train_loss": -11.677641868591309, "global_step": 500104, "epoch": 2976} {"train_loss": -11.900325775146484, "global_step": 500105, "epoch": 2976} {"train_loss": -11.107416152954102, "global_step": 500106, "epoch": 2976} {"train_loss": -11.710793495178223, "global_step": 500107, "epoch": 2976} {"train_loss": -11.508230209350586, "global_step": 500108, "epoch": 2976} {"train_loss": -11.692447662353516, "global_step": 500109, "epoch": 2976} {"train_loss": -11.307351112365723, "global_step": 500110, "epoch": 2976} {"train_loss": -10.583352088928223, "global_step": 500111, "epoch": 2976} {"train_loss": -11.541543006896973, "global_step": 500112, "epoch": 2976} {"train_loss": -10.199170112609863, "global_step": 500113, "epoch": 2976} {"train_loss": -11.165345191955566, "global_step": 500114, "epoch": 2976} {"train_loss": -9.798360824584961, "global_step": 500115, "epoch": 2976} {"train_loss": -9.901992797851562, "global_step": 500116, "epoch": 2976} {"train_loss": -9.933021545410156, "global_step": 500117, "epoch": 2976} {"train_loss": -10.715662956237793, "global_step": 500118, "epoch": 2976} {"train_loss": -10.710731506347656, "global_step": 500119, "epoch": 2976} {"train_loss": -11.269390106201172, "global_step": 500120, "epoch": 2976} {"train_loss": -11.874855995178223, "global_step": 500121, "epoch": 2976} {"train_loss": -11.024258613586426, "global_step": 500122, "epoch": 2976} {"train_loss": -12.017860412597656, "global_step": 500123, "epoch": 2976} {"train_loss": -10.821159362792969, "global_step": 500124, "epoch": 2976} {"train_loss": -11.83615493774414, "global_step": 500125, "epoch": 2976} {"train_loss": -11.132658004760742, "global_step": 500126, "epoch": 2976} {"train_loss": -12.15933609008789, "global_step": 500127, "epoch": 2976} {"train_loss": -11.062410354614258, "global_step": 500128, "epoch": 2976} {"train_loss": -11.921710014343262, "global_step": 500129, "epoch": 2976} {"train_loss": -11.391817092895508, "global_step": 500130, "epoch": 2976} {"train_loss": -11.472330093383789, "global_step": 500131, "epoch": 2976} {"train_loss": -12.273892402648926, "global_step": 500132, "epoch": 2976} {"train_loss": -11.638797760009766, "global_step": 500133, "epoch": 2976} {"train_loss": -12.519330978393555, "global_step": 500134, "epoch": 2976} {"train_loss": -12.132419932456244, "global_step": 500135, "epoch": 2976, "val_loss": 318166.90625} {"train_loss": -12.340875625610352, "global_step": 500136, "epoch": 2977} {"train_loss": -11.946298599243164, "global_step": 500137, "epoch": 2977} {"train_loss": -12.382816314697266, "global_step": 500138, "epoch": 2977} {"train_loss": -12.528972625732422, "global_step": 500139, "epoch": 2977} {"train_loss": -12.335140228271484, "global_step": 500140, "epoch": 2977} {"train_loss": -12.190166473388672, "global_step": 500141, "epoch": 2977} {"train_loss": -12.343705177307129, "global_step": 500142, "epoch": 2977} {"train_loss": -12.616409301757812, "global_step": 500143, "epoch": 2977} {"train_loss": -12.298389434814453, "global_step": 500144, "epoch": 2977} {"train_loss": -12.622044563293457, "global_step": 500145, "epoch": 2977} {"train_loss": -12.68142318725586, "global_step": 500146, "epoch": 2977} {"train_loss": -12.433792114257812, "global_step": 500147, "epoch": 2977} {"train_loss": -12.335359573364258, "global_step": 500148, "epoch": 2977} {"train_loss": -12.435715675354004, "global_step": 500149, "epoch": 2977} {"train_loss": -12.454082489013672, "global_step": 500150, "epoch": 2977} {"train_loss": -12.702644348144531, "global_step": 500151, "epoch": 2977} {"train_loss": -12.636495590209961, "global_step": 500152, "epoch": 2977} {"train_loss": -12.671279907226562, "global_step": 500153, "epoch": 2977} {"train_loss": -12.554886817932129, "global_step": 500154, "epoch": 2977} {"train_loss": -12.463669776916504, "global_step": 500155, "epoch": 2977} {"train_loss": -12.78654670715332, "global_step": 500156, "epoch": 2977} {"train_loss": -12.585376739501953, "global_step": 500157, "epoch": 2977} {"train_loss": -12.747382164001465, "global_step": 500158, "epoch": 2977} {"train_loss": -12.411922454833984, "global_step": 500159, "epoch": 2977} {"train_loss": -12.55318832397461, "global_step": 500160, "epoch": 2977} {"train_loss": -12.632831573486328, "global_step": 500161, "epoch": 2977} {"train_loss": -12.503582000732422, "global_step": 500162, "epoch": 2977} {"train_loss": -12.582365036010742, "global_step": 500163, "epoch": 2977} {"train_loss": -12.7352294921875, "global_step": 500164, "epoch": 2977} {"train_loss": -12.647363662719727, "global_step": 500165, "epoch": 2977} {"train_loss": -12.782125473022461, "global_step": 500166, "epoch": 2977} {"train_loss": -12.748649597167969, "global_step": 500167, "epoch": 2977} {"train_loss": -12.676263809204102, "global_step": 500168, "epoch": 2977} {"train_loss": -12.720178604125977, "global_step": 500169, "epoch": 2977} {"train_loss": -13.015588760375977, "global_step": 500170, "epoch": 2977} {"train_loss": -12.75440788269043, "global_step": 500171, "epoch": 2977} {"train_loss": -12.598861694335938, "global_step": 500172, "epoch": 2977} {"train_loss": -12.762557983398438, "global_step": 500173, "epoch": 2977} {"train_loss": -12.688112258911133, "global_step": 500174, "epoch": 2977} {"train_loss": -12.802026748657227, "global_step": 500175, "epoch": 2977} {"train_loss": -12.855506896972656, "global_step": 500176, "epoch": 2977} {"train_loss": -12.833556175231934, "global_step": 500177, "epoch": 2977} {"train_loss": -12.781379699707031, "global_step": 500178, "epoch": 2977} {"train_loss": -12.945525169372559, "global_step": 500179, "epoch": 2977} {"train_loss": -12.862785339355469, "global_step": 500180, "epoch": 2977} {"train_loss": -13.005071640014648, "global_step": 500181, "epoch": 2977} {"train_loss": -12.708788871765137, "global_step": 500182, "epoch": 2977} {"train_loss": -12.987195014953613, "global_step": 500183, "epoch": 2977} {"train_loss": -12.870651245117188, "global_step": 500184, "epoch": 2977} {"train_loss": -12.978023529052734, "global_step": 500185, "epoch": 2977} {"train_loss": -12.963754653930664, "global_step": 500186, "epoch": 2977} {"train_loss": -12.804750442504883, "global_step": 500187, "epoch": 2977} {"train_loss": -12.932689666748047, "global_step": 500188, "epoch": 2977} {"train_loss": -13.019880294799805, "global_step": 500189, "epoch": 2977} {"train_loss": -12.896702766418457, "global_step": 500190, "epoch": 2977} {"train_loss": -12.703267097473145, "global_step": 500191, "epoch": 2977} {"train_loss": -12.802494049072266, "global_step": 500192, "epoch": 2977} {"train_loss": -12.95271110534668, "global_step": 500193, "epoch": 2977} {"train_loss": -12.703009605407715, "global_step": 500194, "epoch": 2977} {"train_loss": -12.767799377441406, "global_step": 500195, "epoch": 2977} {"train_loss": -12.797124862670898, "global_step": 500196, "epoch": 2977} {"train_loss": -12.502378463745117, "global_step": 500197, "epoch": 2977} {"train_loss": -12.98674201965332, "global_step": 500198, "epoch": 2977} {"train_loss": -12.824732780456543, "global_step": 500199, "epoch": 2977} {"train_loss": -12.708243370056152, "global_step": 500200, "epoch": 2977} {"train_loss": -12.826398849487305, "global_step": 500201, "epoch": 2977} {"train_loss": -12.95772933959961, "global_step": 500202, "epoch": 2977} {"train_loss": -12.623922348022461, "global_step": 500203, "epoch": 2977} {"train_loss": -12.336277961730957, "global_step": 500204, "epoch": 2977} {"train_loss": -12.358875274658203, "global_step": 500205, "epoch": 2977} {"train_loss": -12.155418395996094, "global_step": 500206, "epoch": 2977} {"train_loss": -12.838469505310059, "global_step": 500207, "epoch": 2977} {"train_loss": -12.419792175292969, "global_step": 500208, "epoch": 2977} {"train_loss": -12.347707748413086, "global_step": 500209, "epoch": 2977} {"train_loss": -13.096096992492676, "global_step": 500210, "epoch": 2977} {"train_loss": -12.697267532348633, "global_step": 500211, "epoch": 2977} {"train_loss": -12.578214645385742, "global_step": 500212, "epoch": 2977} {"train_loss": -12.776721954345703, "global_step": 500213, "epoch": 2977} {"train_loss": -12.727843284606934, "global_step": 500214, "epoch": 2977} {"train_loss": -12.4332275390625, "global_step": 500215, "epoch": 2977} {"train_loss": -12.843021392822266, "global_step": 500216, "epoch": 2977} {"train_loss": -12.48962688446045, "global_step": 500217, "epoch": 2977} {"train_loss": -12.585186958312988, "global_step": 500218, "epoch": 2977} {"train_loss": -12.245864868164062, "global_step": 500219, "epoch": 2977} {"train_loss": -12.068778038024902, "global_step": 500220, "epoch": 2977} {"train_loss": -12.749537467956543, "global_step": 500221, "epoch": 2977} {"train_loss": -12.350046157836914, "global_step": 500222, "epoch": 2977} {"train_loss": -12.369803428649902, "global_step": 500223, "epoch": 2977} {"train_loss": -12.583592414855957, "global_step": 500224, "epoch": 2977} {"train_loss": -12.528485298156738, "global_step": 500225, "epoch": 2977} {"train_loss": -12.84376335144043, "global_step": 500226, "epoch": 2977} {"train_loss": -12.857608795166016, "global_step": 500227, "epoch": 2977} {"train_loss": -12.798835754394531, "global_step": 500228, "epoch": 2977} {"train_loss": -12.805502891540527, "global_step": 500229, "epoch": 2977} {"train_loss": -13.060471534729004, "global_step": 500230, "epoch": 2977} {"train_loss": -12.908180236816406, "global_step": 500231, "epoch": 2977} {"train_loss": -12.499635696411133, "global_step": 500232, "epoch": 2977} {"train_loss": -12.752103805541992, "global_step": 500233, "epoch": 2977} {"train_loss": -12.705815315246582, "global_step": 500234, "epoch": 2977} {"train_loss": -12.862308502197266, "global_step": 500235, "epoch": 2977} {"train_loss": -12.601515769958496, "global_step": 500236, "epoch": 2977} {"train_loss": -12.59858512878418, "global_step": 500237, "epoch": 2977} {"train_loss": -12.530502319335938, "global_step": 500238, "epoch": 2977} {"train_loss": -12.74350357055664, "global_step": 500239, "epoch": 2977} {"train_loss": -12.534541130065918, "global_step": 500240, "epoch": 2977} {"train_loss": -11.461257934570312, "global_step": 500241, "epoch": 2977} {"train_loss": -12.643091201782227, "global_step": 500242, "epoch": 2977} {"train_loss": -12.62188720703125, "global_step": 500243, "epoch": 2977} {"train_loss": -12.164368629455566, "global_step": 500244, "epoch": 2977} {"train_loss": -11.675539016723633, "global_step": 500245, "epoch": 2977} {"train_loss": -12.261430740356445, "global_step": 500246, "epoch": 2977} {"train_loss": -12.586048126220703, "global_step": 500247, "epoch": 2977} {"train_loss": -11.01927661895752, "global_step": 500248, "epoch": 2977} {"train_loss": -11.36693000793457, "global_step": 500249, "epoch": 2977} {"train_loss": -11.951482772827148, "global_step": 500250, "epoch": 2977} {"train_loss": -12.977750778198242, "global_step": 500251, "epoch": 2977} {"train_loss": -11.879054069519043, "global_step": 500252, "epoch": 2977} {"train_loss": -12.058349609375, "global_step": 500253, "epoch": 2977} {"train_loss": -12.3720703125, "global_step": 500254, "epoch": 2977} {"train_loss": -11.48106861114502, "global_step": 500255, "epoch": 2977} {"train_loss": -11.480062484741211, "global_step": 500256, "epoch": 2977} {"train_loss": -10.033821105957031, "global_step": 500257, "epoch": 2977} {"train_loss": -9.572908401489258, "global_step": 500258, "epoch": 2977} {"train_loss": -12.029129981994629, "global_step": 500259, "epoch": 2977} {"train_loss": -8.719696044921875, "global_step": 500260, "epoch": 2977} {"train_loss": -10.879697799682617, "global_step": 500261, "epoch": 2977} {"train_loss": -9.787188529968262, "global_step": 500262, "epoch": 2977} {"train_loss": -8.645232200622559, "global_step": 500263, "epoch": 2977} {"train_loss": -8.387044906616211, "global_step": 500264, "epoch": 2977} {"train_loss": -7.68364143371582, "global_step": 500265, "epoch": 2977} {"train_loss": -7.903836250305176, "global_step": 500266, "epoch": 2977} {"train_loss": -8.227214813232422, "global_step": 500267, "epoch": 2977} {"train_loss": -8.116046905517578, "global_step": 500268, "epoch": 2977} {"train_loss": -8.456762313842773, "global_step": 500269, "epoch": 2977} {"train_loss": -9.116935729980469, "global_step": 500270, "epoch": 2977} {"train_loss": -9.561332702636719, "global_step": 500271, "epoch": 2977} {"train_loss": -10.807019233703613, "global_step": 500272, "epoch": 2977} {"train_loss": -9.270708084106445, "global_step": 500273, "epoch": 2977} {"train_loss": -9.81039047241211, "global_step": 500274, "epoch": 2977} {"train_loss": -10.020084381103516, "global_step": 500275, "epoch": 2977} {"train_loss": -10.124677658081055, "global_step": 500276, "epoch": 2977} {"train_loss": -10.639671325683594, "global_step": 500277, "epoch": 2977} {"train_loss": -10.065149307250977, "global_step": 500278, "epoch": 2977} {"train_loss": -11.27284049987793, "global_step": 500279, "epoch": 2977} {"train_loss": -11.291114807128906, "global_step": 500280, "epoch": 2977} {"train_loss": -11.003697395324707, "global_step": 500281, "epoch": 2977} {"train_loss": -11.367555618286133, "global_step": 500282, "epoch": 2977} {"train_loss": -11.465415954589844, "global_step": 500283, "epoch": 2977} {"train_loss": -10.816679000854492, "global_step": 500284, "epoch": 2977} {"train_loss": -10.601896286010742, "global_step": 500285, "epoch": 2977} {"train_loss": -11.854658126831055, "global_step": 500286, "epoch": 2977} {"train_loss": -10.498395919799805, "global_step": 500287, "epoch": 2977} {"train_loss": -11.580095291137695, "global_step": 500288, "epoch": 2977} {"train_loss": -10.904980659484863, "global_step": 500289, "epoch": 2977} {"train_loss": -10.872634887695312, "global_step": 500290, "epoch": 2977} {"train_loss": -11.577762603759766, "global_step": 500291, "epoch": 2977} {"train_loss": -11.608826637268066, "global_step": 500292, "epoch": 2977} {"train_loss": -10.829483985900879, "global_step": 500293, "epoch": 2977} {"train_loss": -12.131925582885742, "global_step": 500294, "epoch": 2977} {"train_loss": -11.819948196411133, "global_step": 500295, "epoch": 2977} {"train_loss": -11.93604564666748, "global_step": 500296, "epoch": 2977} {"train_loss": -11.731748580932617, "global_step": 500297, "epoch": 2977} {"train_loss": -12.051131248474121, "global_step": 500298, "epoch": 2977} {"train_loss": -11.858481407165527, "global_step": 500299, "epoch": 2977} {"train_loss": -11.865650177001953, "global_step": 500300, "epoch": 2977} {"train_loss": -11.76583480834961, "global_step": 500301, "epoch": 2977} {"train_loss": -12.037818908691406, "global_step": 500302, "epoch": 2977} {"train_loss": -11.996891629128228, "global_step": 500303, "epoch": 2977, "val_loss": 320829.84375} {"train_loss": -12.046710968017578, "global_step": 500304, "epoch": 2978} {"train_loss": -12.253168106079102, "global_step": 500305, "epoch": 2978} {"train_loss": -11.776565551757812, "global_step": 500306, "epoch": 2978} {"train_loss": -12.229352951049805, "global_step": 500307, "epoch": 2978} {"train_loss": -11.927291870117188, "global_step": 500308, "epoch": 2978} {"train_loss": -12.079541206359863, "global_step": 500309, "epoch": 2978} {"train_loss": -12.020998001098633, "global_step": 500310, "epoch": 2978} {"train_loss": -12.319441795349121, "global_step": 500311, "epoch": 2978} {"train_loss": -12.092842102050781, "global_step": 500312, "epoch": 2978} {"train_loss": -12.228986740112305, "global_step": 500313, "epoch": 2978} {"train_loss": -12.573053359985352, "global_step": 500314, "epoch": 2978} {"train_loss": -12.332056045532227, "global_step": 500315, "epoch": 2978} {"train_loss": -12.363258361816406, "global_step": 500316, "epoch": 2978} {"train_loss": -12.3486328125, "global_step": 500317, "epoch": 2978} {"train_loss": -12.637070655822754, "global_step": 500318, "epoch": 2978} {"train_loss": -12.263059616088867, "global_step": 500319, "epoch": 2978} {"train_loss": -12.43805980682373, "global_step": 500320, "epoch": 2978} {"train_loss": -12.408367156982422, "global_step": 500321, "epoch": 2978} {"train_loss": -12.455524444580078, "global_step": 500322, "epoch": 2978} {"train_loss": -12.412759780883789, "global_step": 500323, "epoch": 2978} {"train_loss": -12.461650848388672, "global_step": 500324, "epoch": 2978} {"train_loss": -12.642017364501953, "global_step": 500325, "epoch": 2978} {"train_loss": -12.212188720703125, "global_step": 500326, "epoch": 2978} {"train_loss": -12.612396240234375, "global_step": 500327, "epoch": 2978} {"train_loss": -12.287657737731934, "global_step": 500328, "epoch": 2978} {"train_loss": -12.733383178710938, "global_step": 500329, "epoch": 2978} {"train_loss": -12.189457893371582, "global_step": 500330, "epoch": 2978} {"train_loss": -12.406461715698242, "global_step": 500331, "epoch": 2978} {"train_loss": -12.508056640625, "global_step": 500332, "epoch": 2978} {"train_loss": -12.195039749145508, "global_step": 500333, "epoch": 2978} {"train_loss": -12.763640403747559, "global_step": 500334, "epoch": 2978} {"train_loss": -12.456823348999023, "global_step": 500335, "epoch": 2978} {"train_loss": -12.607662200927734, "global_step": 500336, "epoch": 2978} {"train_loss": -12.422075271606445, "global_step": 500337, "epoch": 2978} {"train_loss": -12.503735542297363, "global_step": 500338, "epoch": 2978} {"train_loss": -12.399421691894531, "global_step": 500339, "epoch": 2978} {"train_loss": -12.638951301574707, "global_step": 500340, "epoch": 2978} {"train_loss": -12.717538833618164, "global_step": 500341, "epoch": 2978} {"train_loss": -12.73951244354248, "global_step": 500342, "epoch": 2978} {"train_loss": -12.7005615234375, "global_step": 500343, "epoch": 2978} {"train_loss": -12.884429931640625, "global_step": 500344, "epoch": 2978} {"train_loss": -12.567172050476074, "global_step": 500345, "epoch": 2978} {"train_loss": -12.647663116455078, "global_step": 500346, "epoch": 2978} {"train_loss": -12.614923477172852, "global_step": 500347, "epoch": 2978} {"train_loss": -12.755206108093262, "global_step": 500348, "epoch": 2978} {"train_loss": -12.710943222045898, "global_step": 500349, "epoch": 2978} {"train_loss": -12.80270004272461, "global_step": 500350, "epoch": 2978} {"train_loss": -12.513102531433105, "global_step": 500351, "epoch": 2978} {"train_loss": -12.751119613647461, "global_step": 500352, "epoch": 2978} {"train_loss": -12.75179386138916, "global_step": 500353, "epoch": 2978} {"train_loss": -12.921777725219727, "global_step": 500354, "epoch": 2978} {"train_loss": -12.814874649047852, "global_step": 500355, "epoch": 2978} {"train_loss": -13.017826080322266, "global_step": 500356, "epoch": 2978} {"train_loss": -12.946029663085938, "global_step": 500357, "epoch": 2978} {"train_loss": -12.954030990600586, "global_step": 500358, "epoch": 2978} {"train_loss": -12.867691993713379, "global_step": 500359, "epoch": 2978} {"train_loss": -12.721150398254395, "global_step": 500360, "epoch": 2978} {"train_loss": -12.882787704467773, "global_step": 500361, "epoch": 2978} {"train_loss": -12.95974349975586, "global_step": 500362, "epoch": 2978} {"train_loss": -13.11629581451416, "global_step": 500363, "epoch": 2978} {"train_loss": -12.881139755249023, "global_step": 500364, "epoch": 2978} {"train_loss": -12.991897583007812, "global_step": 500365, "epoch": 2978} {"train_loss": -12.997325897216797, "global_step": 500366, "epoch": 2978} {"train_loss": -12.846271514892578, "global_step": 500367, "epoch": 2978} {"train_loss": -12.753155708312988, "global_step": 500368, "epoch": 2978} {"train_loss": -12.954795837402344, "global_step": 500369, "epoch": 2978} {"train_loss": -12.901900291442871, "global_step": 500370, "epoch": 2978} {"train_loss": -12.953851699829102, "global_step": 500371, "epoch": 2978} {"train_loss": -12.81837272644043, "global_step": 500372, "epoch": 2978} {"train_loss": -12.853595733642578, "global_step": 500373, "epoch": 2978} {"train_loss": -12.823476791381836, "global_step": 500374, "epoch": 2978} {"train_loss": -12.824088096618652, "global_step": 500375, "epoch": 2978} {"train_loss": -13.029293060302734, "global_step": 500376, "epoch": 2978} {"train_loss": -12.898540496826172, "global_step": 500377, "epoch": 2978} {"train_loss": -12.925141334533691, "global_step": 500378, "epoch": 2978} {"train_loss": -13.011271476745605, "global_step": 500379, "epoch": 2978} {"train_loss": -12.714262008666992, "global_step": 500380, "epoch": 2978} {"train_loss": -12.86202621459961, "global_step": 500381, "epoch": 2978} {"train_loss": -12.996736526489258, "global_step": 500382, "epoch": 2978} {"train_loss": -12.973461151123047, "global_step": 500383, "epoch": 2978} {"train_loss": -13.180631637573242, "global_step": 500384, "epoch": 2978} {"train_loss": -13.224653244018555, "global_step": 500385, "epoch": 2978} {"train_loss": -12.779932022094727, "global_step": 500386, "epoch": 2978} {"train_loss": -13.047232627868652, "global_step": 500387, "epoch": 2978} {"train_loss": -12.85545825958252, "global_step": 500388, "epoch": 2978} {"train_loss": -12.795502662658691, "global_step": 500389, "epoch": 2978} {"train_loss": -13.068997383117676, "global_step": 500390, "epoch": 2978} {"train_loss": -13.093441009521484, "global_step": 500391, "epoch": 2978} {"train_loss": -13.130443572998047, "global_step": 500392, "epoch": 2978} {"train_loss": -13.141538619995117, "global_step": 500393, "epoch": 2978} {"train_loss": -13.038862228393555, "global_step": 500394, "epoch": 2978} {"train_loss": -13.086841583251953, "global_step": 500395, "epoch": 2978} {"train_loss": -12.950321197509766, "global_step": 500396, "epoch": 2978} {"train_loss": -13.032665252685547, "global_step": 500397, "epoch": 2978} {"train_loss": -12.85508918762207, "global_step": 500398, "epoch": 2978} {"train_loss": -12.940227508544922, "global_step": 500399, "epoch": 2978} {"train_loss": -13.211341857910156, "global_step": 500400, "epoch": 2978} {"train_loss": -12.73763656616211, "global_step": 500401, "epoch": 2978} {"train_loss": -12.936260223388672, "global_step": 500402, "epoch": 2978} {"train_loss": -13.103713035583496, "global_step": 500403, "epoch": 2978} {"train_loss": -13.053680419921875, "global_step": 500404, "epoch": 2978} {"train_loss": -12.92391586303711, "global_step": 500405, "epoch": 2978} {"train_loss": -12.543188095092773, "global_step": 500406, "epoch": 2978} {"train_loss": -12.981610298156738, "global_step": 500407, "epoch": 2978} {"train_loss": -12.812812805175781, "global_step": 500408, "epoch": 2978} {"train_loss": -12.810222625732422, "global_step": 500409, "epoch": 2978} {"train_loss": -12.758049011230469, "global_step": 500410, "epoch": 2978} {"train_loss": -13.081721305847168, "global_step": 500411, "epoch": 2978} {"train_loss": -13.012060165405273, "global_step": 500412, "epoch": 2978} {"train_loss": -12.942033767700195, "global_step": 500413, "epoch": 2978} {"train_loss": -12.786447525024414, "global_step": 500414, "epoch": 2978} {"train_loss": -13.278177261352539, "global_step": 500415, "epoch": 2978} {"train_loss": -12.970539093017578, "global_step": 500416, "epoch": 2978} {"train_loss": -12.412217140197754, "global_step": 500417, "epoch": 2978} {"train_loss": -12.293986320495605, "global_step": 500418, "epoch": 2978} {"train_loss": -12.291646957397461, "global_step": 500419, "epoch": 2978} {"train_loss": -12.115757942199707, "global_step": 500420, "epoch": 2978} {"train_loss": -10.73581314086914, "global_step": 500421, "epoch": 2978} {"train_loss": -12.354169845581055, "global_step": 500422, "epoch": 2978} {"train_loss": -11.086477279663086, "global_step": 500423, "epoch": 2978} {"train_loss": -11.501148223876953, "global_step": 500424, "epoch": 2978} {"train_loss": -11.609060287475586, "global_step": 500425, "epoch": 2978} {"train_loss": -12.150651931762695, "global_step": 500426, "epoch": 2978} {"train_loss": -11.441574096679688, "global_step": 500427, "epoch": 2978} {"train_loss": -10.053221702575684, "global_step": 500428, "epoch": 2978} {"train_loss": -11.684568405151367, "global_step": 500429, "epoch": 2978} {"train_loss": -9.73068618774414, "global_step": 500430, "epoch": 2978} {"train_loss": -11.449992179870605, "global_step": 500431, "epoch": 2978} {"train_loss": -9.834927558898926, "global_step": 500432, "epoch": 2978} {"train_loss": -10.596723556518555, "global_step": 500433, "epoch": 2978} {"train_loss": -9.895462989807129, "global_step": 500434, "epoch": 2978} {"train_loss": -12.222677230834961, "global_step": 500435, "epoch": 2978} {"train_loss": -10.887325286865234, "global_step": 500436, "epoch": 2978} {"train_loss": -11.117605209350586, "global_step": 500437, "epoch": 2978} {"train_loss": -10.055895805358887, "global_step": 500438, "epoch": 2978} {"train_loss": -10.478001594543457, "global_step": 500439, "epoch": 2978} {"train_loss": -11.943273544311523, "global_step": 500440, "epoch": 2978} {"train_loss": -10.201704025268555, "global_step": 500441, "epoch": 2978} {"train_loss": -10.472064971923828, "global_step": 500442, "epoch": 2978} {"train_loss": -11.127287864685059, "global_step": 500443, "epoch": 2978} {"train_loss": -10.241650581359863, "global_step": 500444, "epoch": 2978} {"train_loss": -11.108650207519531, "global_step": 500445, "epoch": 2978} {"train_loss": -10.743654251098633, "global_step": 500446, "epoch": 2978} {"train_loss": -11.036285400390625, "global_step": 500447, "epoch": 2978} {"train_loss": -9.604349136352539, "global_step": 500448, "epoch": 2978} {"train_loss": -8.840856552124023, "global_step": 500449, "epoch": 2978} {"train_loss": -10.117575645446777, "global_step": 500450, "epoch": 2978} {"train_loss": -11.103761672973633, "global_step": 500451, "epoch": 2978} {"train_loss": -9.406412124633789, "global_step": 500452, "epoch": 2978} {"train_loss": -11.112421989440918, "global_step": 500453, "epoch": 2978} {"train_loss": -9.728593826293945, "global_step": 500454, "epoch": 2978} {"train_loss": -9.857138633728027, "global_step": 500455, "epoch": 2978} {"train_loss": -9.98443603515625, "global_step": 500456, "epoch": 2978} {"train_loss": -9.890958786010742, "global_step": 500457, "epoch": 2978} {"train_loss": -10.10556697845459, "global_step": 500458, "epoch": 2978} {"train_loss": -11.10539436340332, "global_step": 500459, "epoch": 2978} {"train_loss": -9.765256881713867, "global_step": 500460, "epoch": 2978} {"train_loss": -10.689753532409668, "global_step": 500461, "epoch": 2978} {"train_loss": -10.700294494628906, "global_step": 500462, "epoch": 2978} {"train_loss": -10.057144165039062, "global_step": 500463, "epoch": 2978} {"train_loss": -10.011825561523438, "global_step": 500464, "epoch": 2978} {"train_loss": -9.265315055847168, "global_step": 500465, "epoch": 2978} {"train_loss": -10.822344779968262, "global_step": 500466, "epoch": 2978} {"train_loss": -9.571159362792969, "global_step": 500467, "epoch": 2978} {"train_loss": -10.345232963562012, "global_step": 500468, "epoch": 2978} {"train_loss": -10.40121841430664, "global_step": 500469, "epoch": 2978} {"train_loss": -10.457476615905762, "global_step": 500470, "epoch": 2978} {"train_loss": -12.057007221948533, "global_step": 500471, "epoch": 2978, "val_loss": 320554.5} {"train_loss": -9.6434965133667, "global_step": 500472, "epoch": 2979} {"train_loss": -10.638691902160645, "global_step": 500473, "epoch": 2979} {"train_loss": -10.572014808654785, "global_step": 500474, "epoch": 2979} {"train_loss": -10.078139305114746, "global_step": 500475, "epoch": 2979} {"train_loss": -10.567947387695312, "global_step": 500476, "epoch": 2979} {"train_loss": -11.387775421142578, "global_step": 500477, "epoch": 2979} {"train_loss": -10.92258071899414, "global_step": 500478, "epoch": 2979} {"train_loss": -11.126482963562012, "global_step": 500479, "epoch": 2979} {"train_loss": -11.34328556060791, "global_step": 500480, "epoch": 2979} {"train_loss": -11.431419372558594, "global_step": 500481, "epoch": 2979} {"train_loss": -12.114510536193848, "global_step": 500482, "epoch": 2979} {"train_loss": -11.145597457885742, "global_step": 500483, "epoch": 2979} {"train_loss": -10.883785247802734, "global_step": 500484, "epoch": 2979} {"train_loss": -11.719375610351562, "global_step": 500485, "epoch": 2979} {"train_loss": -11.424358367919922, "global_step": 500486, "epoch": 2979} {"train_loss": -11.351572036743164, "global_step": 500487, "epoch": 2979} {"train_loss": -11.248641967773438, "global_step": 500488, "epoch": 2979} {"train_loss": -11.636661529541016, "global_step": 500489, "epoch": 2979} {"train_loss": -10.927035331726074, "global_step": 500490, "epoch": 2979} {"train_loss": -11.846811294555664, "global_step": 500491, "epoch": 2979} {"train_loss": -11.016630172729492, "global_step": 500492, "epoch": 2979} {"train_loss": -11.525772094726562, "global_step": 500493, "epoch": 2979} {"train_loss": -11.346628189086914, "global_step": 500494, "epoch": 2979} {"train_loss": -12.02889633178711, "global_step": 500495, "epoch": 2979} {"train_loss": -11.575082778930664, "global_step": 500496, "epoch": 2979} {"train_loss": -11.792993545532227, "global_step": 500497, "epoch": 2979} {"train_loss": -12.0649995803833, "global_step": 500498, "epoch": 2979} {"train_loss": -12.262680053710938, "global_step": 500499, "epoch": 2979} {"train_loss": -12.044471740722656, "global_step": 500500, "epoch": 2979} {"train_loss": -12.29223918914795, "global_step": 500501, "epoch": 2979} {"train_loss": -12.250478744506836, "global_step": 500502, "epoch": 2979} {"train_loss": -12.248526573181152, "global_step": 500503, "epoch": 2979} {"train_loss": -12.447816848754883, "global_step": 500504, "epoch": 2979} {"train_loss": -12.257390975952148, "global_step": 500505, "epoch": 2979} {"train_loss": -12.439078330993652, "global_step": 500506, "epoch": 2979} {"train_loss": -12.46945571899414, "global_step": 500507, "epoch": 2979} {"train_loss": -12.172619819641113, "global_step": 500508, "epoch": 2979} {"train_loss": -12.279825210571289, "global_step": 500509, "epoch": 2979} {"train_loss": -12.341863632202148, "global_step": 500510, "epoch": 2979} {"train_loss": -12.324069023132324, "global_step": 500511, "epoch": 2979} {"train_loss": -12.538827896118164, "global_step": 500512, "epoch": 2979} {"train_loss": -12.320960998535156, "global_step": 500513, "epoch": 2979} {"train_loss": -12.388824462890625, "global_step": 500514, "epoch": 2979} {"train_loss": -12.473634719848633, "global_step": 500515, "epoch": 2979} {"train_loss": -12.352706909179688, "global_step": 500516, "epoch": 2979} {"train_loss": -12.525389671325684, "global_step": 500517, "epoch": 2979} {"train_loss": -12.540766716003418, "global_step": 500518, "epoch": 2979} {"train_loss": -12.33877182006836, "global_step": 500519, "epoch": 2979} {"train_loss": -12.500188827514648, "global_step": 500520, "epoch": 2979} {"train_loss": -12.407073974609375, "global_step": 500521, "epoch": 2979} {"train_loss": -12.450935363769531, "global_step": 500522, "epoch": 2979} {"train_loss": -12.619263648986816, "global_step": 500523, "epoch": 2979} {"train_loss": -12.560413360595703, "global_step": 500524, "epoch": 2979} {"train_loss": -12.555448532104492, "global_step": 500525, "epoch": 2979} {"train_loss": -12.50810432434082, "global_step": 500526, "epoch": 2979} {"train_loss": -12.456823348999023, "global_step": 500527, "epoch": 2979} {"train_loss": -12.361059188842773, "global_step": 500528, "epoch": 2979} {"train_loss": -12.005414962768555, "global_step": 500529, "epoch": 2979} {"train_loss": -12.634313583374023, "global_step": 500530, "epoch": 2979} {"train_loss": -12.524064064025879, "global_step": 500531, "epoch": 2979} {"train_loss": -12.63809585571289, "global_step": 500532, "epoch": 2979} {"train_loss": -12.569969177246094, "global_step": 500533, "epoch": 2979} {"train_loss": -12.508502006530762, "global_step": 500534, "epoch": 2979} {"train_loss": -12.502730369567871, "global_step": 500535, "epoch": 2979} {"train_loss": -12.685091018676758, "global_step": 500536, "epoch": 2979} {"train_loss": -12.655935287475586, "global_step": 500537, "epoch": 2979} {"train_loss": -12.742795944213867, "global_step": 500538, "epoch": 2979} {"train_loss": -12.550527572631836, "global_step": 500539, "epoch": 2979} {"train_loss": -12.855087280273438, "global_step": 500540, "epoch": 2979} {"train_loss": -12.765594482421875, "global_step": 500541, "epoch": 2979} {"train_loss": -12.800348281860352, "global_step": 500542, "epoch": 2979} {"train_loss": -12.7597074508667, "global_step": 500543, "epoch": 2979} {"train_loss": -12.732710838317871, "global_step": 500544, "epoch": 2979} {"train_loss": -12.665872573852539, "global_step": 500545, "epoch": 2979} {"train_loss": -12.877201080322266, "global_step": 500546, "epoch": 2979} {"train_loss": -12.865592002868652, "global_step": 500547, "epoch": 2979} {"train_loss": -12.8001708984375, "global_step": 500548, "epoch": 2979} {"train_loss": -12.715864181518555, "global_step": 500549, "epoch": 2979} {"train_loss": -12.910845756530762, "global_step": 500550, "epoch": 2979} {"train_loss": -12.804168701171875, "global_step": 500551, "epoch": 2979} {"train_loss": -12.928812026977539, "global_step": 500552, "epoch": 2979} {"train_loss": -12.936769485473633, "global_step": 500553, "epoch": 2979} {"train_loss": -12.85959243774414, "global_step": 500554, "epoch": 2979} {"train_loss": -12.890373229980469, "global_step": 500555, "epoch": 2979} {"train_loss": -12.879234313964844, "global_step": 500556, "epoch": 2979} {"train_loss": -12.96382999420166, "global_step": 500557, "epoch": 2979} {"train_loss": -12.85836410522461, "global_step": 500558, "epoch": 2979} {"train_loss": -12.89317512512207, "global_step": 500559, "epoch": 2979} {"train_loss": -12.741021156311035, "global_step": 500560, "epoch": 2979} {"train_loss": -12.772859573364258, "global_step": 500561, "epoch": 2979} {"train_loss": -12.6398286819458, "global_step": 500562, "epoch": 2979} {"train_loss": -12.642759323120117, "global_step": 500563, "epoch": 2979} {"train_loss": -12.847610473632812, "global_step": 500564, "epoch": 2979} {"train_loss": -12.775577545166016, "global_step": 500565, "epoch": 2979} {"train_loss": -13.002725601196289, "global_step": 500566, "epoch": 2979} {"train_loss": -12.905475616455078, "global_step": 500567, "epoch": 2979} {"train_loss": -12.836246490478516, "global_step": 500568, "epoch": 2979} {"train_loss": -12.821634292602539, "global_step": 500569, "epoch": 2979} {"train_loss": -12.711929321289062, "global_step": 500570, "epoch": 2979} {"train_loss": -12.906789779663086, "global_step": 500571, "epoch": 2979} {"train_loss": -12.817865371704102, "global_step": 500572, "epoch": 2979} {"train_loss": -12.890571594238281, "global_step": 500573, "epoch": 2979} {"train_loss": -12.833648681640625, "global_step": 500574, "epoch": 2979} {"train_loss": -12.707147598266602, "global_step": 500575, "epoch": 2979} {"train_loss": -12.851781845092773, "global_step": 500576, "epoch": 2979} {"train_loss": -12.891461372375488, "global_step": 500577, "epoch": 2979} {"train_loss": -12.785848617553711, "global_step": 500578, "epoch": 2979} {"train_loss": -12.719839096069336, "global_step": 500579, "epoch": 2979} {"train_loss": -12.713456153869629, "global_step": 500580, "epoch": 2979} {"train_loss": -13.022258758544922, "global_step": 500581, "epoch": 2979} {"train_loss": -12.555919647216797, "global_step": 500582, "epoch": 2979} {"train_loss": -12.748626708984375, "global_step": 500583, "epoch": 2979} {"train_loss": -12.945952415466309, "global_step": 500584, "epoch": 2979} {"train_loss": -12.728190422058105, "global_step": 500585, "epoch": 2979} {"train_loss": -12.877972602844238, "global_step": 500586, "epoch": 2979} {"train_loss": -12.73513412475586, "global_step": 500587, "epoch": 2979} {"train_loss": -12.709217071533203, "global_step": 500588, "epoch": 2979} {"train_loss": -12.880744934082031, "global_step": 500589, "epoch": 2979} {"train_loss": -12.754709243774414, "global_step": 500590, "epoch": 2979} {"train_loss": -12.472603797912598, "global_step": 500591, "epoch": 2979} {"train_loss": -12.607463836669922, "global_step": 500592, "epoch": 2979} {"train_loss": -11.512405395507812, "global_step": 500593, "epoch": 2979} {"train_loss": -12.772217750549316, "global_step": 500594, "epoch": 2979} {"train_loss": -11.851877212524414, "global_step": 500595, "epoch": 2979} {"train_loss": -12.179027557373047, "global_step": 500596, "epoch": 2979} {"train_loss": -12.625520706176758, "global_step": 500597, "epoch": 2979} {"train_loss": -11.648350715637207, "global_step": 500598, "epoch": 2979} {"train_loss": -12.673782348632812, "global_step": 500599, "epoch": 2979} {"train_loss": -12.386665344238281, "global_step": 500600, "epoch": 2979} {"train_loss": -12.163142204284668, "global_step": 500601, "epoch": 2979} {"train_loss": -12.590262413024902, "global_step": 500602, "epoch": 2979} {"train_loss": -12.195732116699219, "global_step": 500603, "epoch": 2979} {"train_loss": -12.542635917663574, "global_step": 500604, "epoch": 2979} {"train_loss": -12.668380737304688, "global_step": 500605, "epoch": 2979} {"train_loss": -11.784048080444336, "global_step": 500606, "epoch": 2979} {"train_loss": -12.314599990844727, "global_step": 500607, "epoch": 2979} {"train_loss": -12.085126876831055, "global_step": 500608, "epoch": 2979} {"train_loss": -12.539280891418457, "global_step": 500609, "epoch": 2979} {"train_loss": -12.571375846862793, "global_step": 500610, "epoch": 2979} {"train_loss": -12.544243812561035, "global_step": 500611, "epoch": 2979} {"train_loss": -12.753287315368652, "global_step": 500612, "epoch": 2979} {"train_loss": -11.699146270751953, "global_step": 500613, "epoch": 2979} {"train_loss": -10.96033000946045, "global_step": 500614, "epoch": 2979} {"train_loss": -12.715402603149414, "global_step": 500615, "epoch": 2979} {"train_loss": -12.615543365478516, "global_step": 500616, "epoch": 2979} {"train_loss": -12.380081176757812, "global_step": 500617, "epoch": 2979} {"train_loss": -12.533525466918945, "global_step": 500618, "epoch": 2979} {"train_loss": -12.51003646850586, "global_step": 500619, "epoch": 2979} {"train_loss": -12.405169486999512, "global_step": 500620, "epoch": 2979} {"train_loss": -12.91452407836914, "global_step": 500621, "epoch": 2979} {"train_loss": -12.547117233276367, "global_step": 500622, "epoch": 2979} {"train_loss": -12.805741310119629, "global_step": 500623, "epoch": 2979} {"train_loss": -12.567626953125, "global_step": 500624, "epoch": 2979} {"train_loss": -12.685312271118164, "global_step": 500625, "epoch": 2979} {"train_loss": -12.785696983337402, "global_step": 500626, "epoch": 2979} {"train_loss": -12.362052917480469, "global_step": 500627, "epoch": 2979} {"train_loss": -12.565881729125977, "global_step": 500628, "epoch": 2979} {"train_loss": -12.371232986450195, "global_step": 500629, "epoch": 2979} {"train_loss": -12.656757354736328, "global_step": 500630, "epoch": 2979} {"train_loss": -12.673815727233887, "global_step": 500631, "epoch": 2979} {"train_loss": -12.585006713867188, "global_step": 500632, "epoch": 2979} {"train_loss": -12.764293670654297, "global_step": 500633, "epoch": 2979} {"train_loss": -12.381388664245605, "global_step": 500634, "epoch": 2979} {"train_loss": -12.448728561401367, "global_step": 500635, "epoch": 2979} {"train_loss": -12.482839584350586, "global_step": 500636, "epoch": 2979} {"train_loss": -12.285890579223633, "global_step": 500637, "epoch": 2979} {"train_loss": -12.916975021362305, "global_step": 500638, "epoch": 2979} {"train_loss": -12.35149713924953, "global_step": 500639, "epoch": 2979, "val_loss": 320339.59375} {"train_loss": -12.227839469909668, "global_step": 500640, "epoch": 2980} {"train_loss": -11.871294021606445, "global_step": 500641, "epoch": 2980} {"train_loss": -11.441642761230469, "global_step": 500642, "epoch": 2980} {"train_loss": -12.240610122680664, "global_step": 500643, "epoch": 2980} {"train_loss": -11.66125774383545, "global_step": 500644, "epoch": 2980} {"train_loss": -12.448755264282227, "global_step": 500645, "epoch": 2980} {"train_loss": -12.751956939697266, "global_step": 500646, "epoch": 2980} {"train_loss": -12.397315979003906, "global_step": 500647, "epoch": 2980} {"train_loss": -12.390410423278809, "global_step": 500648, "epoch": 2980} {"train_loss": -12.383912086486816, "global_step": 500649, "epoch": 2980} {"train_loss": -12.392536163330078, "global_step": 500650, "epoch": 2980} {"train_loss": -12.259801864624023, "global_step": 500651, "epoch": 2980} {"train_loss": -11.8804931640625, "global_step": 500652, "epoch": 2980} {"train_loss": -12.33452320098877, "global_step": 500653, "epoch": 2980} {"train_loss": -11.271566390991211, "global_step": 500654, "epoch": 2980} {"train_loss": -12.510501861572266, "global_step": 500655, "epoch": 2980} {"train_loss": -11.223369598388672, "global_step": 500656, "epoch": 2980} {"train_loss": -10.798872947692871, "global_step": 500657, "epoch": 2980} {"train_loss": -12.276086807250977, "global_step": 500658, "epoch": 2980} {"train_loss": -10.958025932312012, "global_step": 500659, "epoch": 2980} {"train_loss": -12.145691871643066, "global_step": 500660, "epoch": 2980} {"train_loss": -11.416618347167969, "global_step": 500661, "epoch": 2980} {"train_loss": -12.403696060180664, "global_step": 500662, "epoch": 2980} {"train_loss": -11.96386432647705, "global_step": 500663, "epoch": 2980} {"train_loss": -12.442604064941406, "global_step": 500664, "epoch": 2980} {"train_loss": -11.955320358276367, "global_step": 500665, "epoch": 2980} {"train_loss": -11.879220962524414, "global_step": 500666, "epoch": 2980} {"train_loss": -11.408547401428223, "global_step": 500667, "epoch": 2980} {"train_loss": -12.040170669555664, "global_step": 500668, "epoch": 2980} {"train_loss": -11.79910659790039, "global_step": 500669, "epoch": 2980} {"train_loss": -10.873191833496094, "global_step": 500670, "epoch": 2980} {"train_loss": -12.420431137084961, "global_step": 500671, "epoch": 2980} {"train_loss": -11.253230094909668, "global_step": 500672, "epoch": 2980} {"train_loss": -11.910526275634766, "global_step": 500673, "epoch": 2980} {"train_loss": -12.162787437438965, "global_step": 500674, "epoch": 2980} {"train_loss": -9.611774444580078, "global_step": 500675, "epoch": 2980} {"train_loss": -11.235880851745605, "global_step": 500676, "epoch": 2980} {"train_loss": -10.09946060180664, "global_step": 500677, "epoch": 2980} {"train_loss": -11.025005340576172, "global_step": 500678, "epoch": 2980} {"train_loss": -11.201226234436035, "global_step": 500679, "epoch": 2980} {"train_loss": -12.143272399902344, "global_step": 500680, "epoch": 2980} {"train_loss": -11.106500625610352, "global_step": 500681, "epoch": 2980} {"train_loss": -11.837251663208008, "global_step": 500682, "epoch": 2980} {"train_loss": -12.220121383666992, "global_step": 500683, "epoch": 2980} {"train_loss": -11.812948226928711, "global_step": 500684, "epoch": 2980} {"train_loss": -11.640167236328125, "global_step": 500685, "epoch": 2980} {"train_loss": -11.745275497436523, "global_step": 500686, "epoch": 2980} {"train_loss": -11.467227935791016, "global_step": 500687, "epoch": 2980} {"train_loss": -12.192155838012695, "global_step": 500688, "epoch": 2980} {"train_loss": -11.389913558959961, "global_step": 500689, "epoch": 2980} {"train_loss": -11.749970436096191, "global_step": 500690, "epoch": 2980} {"train_loss": -12.312772750854492, "global_step": 500691, "epoch": 2980} {"train_loss": -11.978845596313477, "global_step": 500692, "epoch": 2980} {"train_loss": -12.468040466308594, "global_step": 500693, "epoch": 2980} {"train_loss": -12.064945220947266, "global_step": 500694, "epoch": 2980} {"train_loss": -12.259085655212402, "global_step": 500695, "epoch": 2980} {"train_loss": -12.157200813293457, "global_step": 500696, "epoch": 2980} {"train_loss": -12.234628677368164, "global_step": 500697, "epoch": 2980} {"train_loss": -12.145590782165527, "global_step": 500698, "epoch": 2980} {"train_loss": -12.710214614868164, "global_step": 500699, "epoch": 2980} {"train_loss": -11.989444732666016, "global_step": 500700, "epoch": 2980} {"train_loss": -12.363777160644531, "global_step": 500701, "epoch": 2980} {"train_loss": -11.732590675354004, "global_step": 500702, "epoch": 2980} {"train_loss": -11.990665435791016, "global_step": 500703, "epoch": 2980} {"train_loss": -11.873453140258789, "global_step": 500704, "epoch": 2980} {"train_loss": -12.071512222290039, "global_step": 500705, "epoch": 2980} {"train_loss": -12.048396110534668, "global_step": 500706, "epoch": 2980} {"train_loss": -11.920135498046875, "global_step": 500707, "epoch": 2980} {"train_loss": -12.635815620422363, "global_step": 500708, "epoch": 2980} {"train_loss": -11.116931915283203, "global_step": 500709, "epoch": 2980} {"train_loss": -12.704643249511719, "global_step": 500710, "epoch": 2980} {"train_loss": -12.072059631347656, "global_step": 500711, "epoch": 2980} {"train_loss": -12.559165000915527, "global_step": 500712, "epoch": 2980} {"train_loss": -12.237695693969727, "global_step": 500713, "epoch": 2980} {"train_loss": -11.848094940185547, "global_step": 500714, "epoch": 2980} {"train_loss": -12.371871948242188, "global_step": 500715, "epoch": 2980} {"train_loss": -11.898554801940918, "global_step": 500716, "epoch": 2980} {"train_loss": -12.499399185180664, "global_step": 500717, "epoch": 2980} {"train_loss": -11.993463516235352, "global_step": 500718, "epoch": 2980} {"train_loss": -12.339719772338867, "global_step": 500719, "epoch": 2980} {"train_loss": -12.408308029174805, "global_step": 500720, "epoch": 2980} {"train_loss": -12.004737854003906, "global_step": 500721, "epoch": 2980} {"train_loss": -11.961784362792969, "global_step": 500722, "epoch": 2980} {"train_loss": -11.90093994140625, "global_step": 500723, "epoch": 2980} {"train_loss": -11.997790336608887, "global_step": 500724, "epoch": 2980} {"train_loss": -12.287443161010742, "global_step": 500725, "epoch": 2980} {"train_loss": -12.053201675415039, "global_step": 500726, "epoch": 2980} {"train_loss": -12.454401969909668, "global_step": 500727, "epoch": 2980} {"train_loss": -12.228042602539062, "global_step": 500728, "epoch": 2980} {"train_loss": -12.489789009094238, "global_step": 500729, "epoch": 2980} {"train_loss": -11.857670783996582, "global_step": 500730, "epoch": 2980} {"train_loss": -12.422685623168945, "global_step": 500731, "epoch": 2980} {"train_loss": -11.753588676452637, "global_step": 500732, "epoch": 2980} {"train_loss": -12.447294235229492, "global_step": 500733, "epoch": 2980} {"train_loss": -11.4952974319458, "global_step": 500734, "epoch": 2980} {"train_loss": -12.243528366088867, "global_step": 500735, "epoch": 2980} {"train_loss": -12.552753448486328, "global_step": 500736, "epoch": 2980} {"train_loss": -12.146772384643555, "global_step": 500737, "epoch": 2980} {"train_loss": -12.23651123046875, "global_step": 500738, "epoch": 2980} {"train_loss": -12.496064186096191, "global_step": 500739, "epoch": 2980} {"train_loss": -12.370241165161133, "global_step": 500740, "epoch": 2980} {"train_loss": -12.505514144897461, "global_step": 500741, "epoch": 2980} {"train_loss": -12.818727493286133, "global_step": 500742, "epoch": 2980} {"train_loss": -12.045927047729492, "global_step": 500743, "epoch": 2980} {"train_loss": -12.701062202453613, "global_step": 500744, "epoch": 2980} {"train_loss": -12.273649215698242, "global_step": 500745, "epoch": 2980} {"train_loss": -12.622437477111816, "global_step": 500746, "epoch": 2980} {"train_loss": -12.439314842224121, "global_step": 500747, "epoch": 2980} {"train_loss": -12.712141990661621, "global_step": 500748, "epoch": 2980} {"train_loss": -12.56723403930664, "global_step": 500749, "epoch": 2980} {"train_loss": -12.746942520141602, "global_step": 500750, "epoch": 2980} {"train_loss": -12.586831092834473, "global_step": 500751, "epoch": 2980} {"train_loss": -12.410837173461914, "global_step": 500752, "epoch": 2980} {"train_loss": -12.524734497070312, "global_step": 500753, "epoch": 2980} {"train_loss": -12.595863342285156, "global_step": 500754, "epoch": 2980} {"train_loss": -12.846701622009277, "global_step": 500755, "epoch": 2980} {"train_loss": -12.507286071777344, "global_step": 500756, "epoch": 2980} {"train_loss": -12.486268997192383, "global_step": 500757, "epoch": 2980} {"train_loss": -12.271649360656738, "global_step": 500758, "epoch": 2980} {"train_loss": -12.058764457702637, "global_step": 500759, "epoch": 2980} {"train_loss": -12.900213241577148, "global_step": 500760, "epoch": 2980} {"train_loss": -11.964339256286621, "global_step": 500761, "epoch": 2980} {"train_loss": -12.39877700805664, "global_step": 500762, "epoch": 2980} {"train_loss": -11.186588287353516, "global_step": 500763, "epoch": 2980} {"train_loss": -12.427902221679688, "global_step": 500764, "epoch": 2980} {"train_loss": -11.764240264892578, "global_step": 500765, "epoch": 2980} {"train_loss": -11.914583206176758, "global_step": 500766, "epoch": 2980} {"train_loss": -12.024694442749023, "global_step": 500767, "epoch": 2980} {"train_loss": -11.802618026733398, "global_step": 500768, "epoch": 2980} {"train_loss": -12.00465202331543, "global_step": 500769, "epoch": 2980} {"train_loss": -11.638301849365234, "global_step": 500770, "epoch": 2980} {"train_loss": -12.56962776184082, "global_step": 500771, "epoch": 2980} {"train_loss": -11.663475036621094, "global_step": 500772, "epoch": 2980} {"train_loss": -12.607988357543945, "global_step": 500773, "epoch": 2980} {"train_loss": -12.249261856079102, "global_step": 500774, "epoch": 2980} {"train_loss": -12.646596908569336, "global_step": 500775, "epoch": 2980} {"train_loss": -12.378702163696289, "global_step": 500776, "epoch": 2980} {"train_loss": -12.211612701416016, "global_step": 500777, "epoch": 2980} {"train_loss": -12.55030632019043, "global_step": 500778, "epoch": 2980} {"train_loss": -12.50619125366211, "global_step": 500779, "epoch": 2980} {"train_loss": -12.702709197998047, "global_step": 500780, "epoch": 2980} {"train_loss": -12.748668670654297, "global_step": 500781, "epoch": 2980} {"train_loss": -12.376825332641602, "global_step": 500782, "epoch": 2980} {"train_loss": -12.16623306274414, "global_step": 500783, "epoch": 2980} {"train_loss": -12.676326751708984, "global_step": 500784, "epoch": 2980} {"train_loss": -12.515098571777344, "global_step": 500785, "epoch": 2980} {"train_loss": -12.790539741516113, "global_step": 500786, "epoch": 2980} {"train_loss": -12.410001754760742, "global_step": 500787, "epoch": 2980} {"train_loss": -12.018102645874023, "global_step": 500788, "epoch": 2980} {"train_loss": -12.716554641723633, "global_step": 500789, "epoch": 2980} {"train_loss": -12.509777069091797, "global_step": 500790, "epoch": 2980} {"train_loss": -12.21986198425293, "global_step": 500791, "epoch": 2980} {"train_loss": -12.081930160522461, "global_step": 500792, "epoch": 2980} {"train_loss": -12.546646118164062, "global_step": 500793, "epoch": 2980} {"train_loss": -12.116990089416504, "global_step": 500794, "epoch": 2980} {"train_loss": -12.207921028137207, "global_step": 500795, "epoch": 2980} {"train_loss": -12.774505615234375, "global_step": 500796, "epoch": 2980} {"train_loss": -12.277406692504883, "global_step": 500797, "epoch": 2980} {"train_loss": -12.861260414123535, "global_step": 500798, "epoch": 2980} {"train_loss": -12.306990623474121, "global_step": 500799, "epoch": 2980} {"train_loss": -12.752992630004883, "global_step": 500800, "epoch": 2980} {"train_loss": -12.756525039672852, "global_step": 500801, "epoch": 2980} {"train_loss": -12.77662181854248, "global_step": 500802, "epoch": 2980} {"train_loss": -12.684329986572266, "global_step": 500803, "epoch": 2980} {"train_loss": -12.783478736877441, "global_step": 500804, "epoch": 2980} {"train_loss": -12.602340698242188, "global_step": 500805, "epoch": 2980} {"train_loss": -12.802498817443848, "global_step": 500806, "epoch": 2980} {"train_loss": -12.147782660665966, "global_step": 500807, "epoch": 2980, "val_loss": 320385.4375, "train_action_mse_error": 3.0096006393432617} {"train_loss": -12.801406860351562, "global_step": 500808, "epoch": 2981} {"train_loss": -12.680978775024414, "global_step": 500809, "epoch": 2981} {"train_loss": -12.951629638671875, "global_step": 500810, "epoch": 2981} {"train_loss": -12.46696949005127, "global_step": 500811, "epoch": 2981} {"train_loss": -12.89560317993164, "global_step": 500812, "epoch": 2981} {"train_loss": -12.823665618896484, "global_step": 500813, "epoch": 2981} {"train_loss": -12.718940734863281, "global_step": 500814, "epoch": 2981} {"train_loss": -12.873682022094727, "global_step": 500815, "epoch": 2981} {"train_loss": -12.879222869873047, "global_step": 500816, "epoch": 2981} {"train_loss": -12.956871032714844, "global_step": 500817, "epoch": 2981} {"train_loss": -12.026420593261719, "global_step": 500818, "epoch": 2981} {"train_loss": -12.484569549560547, "global_step": 500819, "epoch": 2981} {"train_loss": -12.804003715515137, "global_step": 500820, "epoch": 2981} {"train_loss": -12.526105880737305, "global_step": 500821, "epoch": 2981} {"train_loss": -12.303004264831543, "global_step": 500822, "epoch": 2981} {"train_loss": -12.79493522644043, "global_step": 500823, "epoch": 2981} {"train_loss": -12.659640312194824, "global_step": 500824, "epoch": 2981} {"train_loss": -13.05092716217041, "global_step": 500825, "epoch": 2981} {"train_loss": -12.76834774017334, "global_step": 500826, "epoch": 2981} {"train_loss": -12.570379257202148, "global_step": 500827, "epoch": 2981} {"train_loss": -12.92823600769043, "global_step": 500828, "epoch": 2981} {"train_loss": -12.526376724243164, "global_step": 500829, "epoch": 2981} {"train_loss": -12.937744140625, "global_step": 500830, "epoch": 2981} {"train_loss": -12.855192184448242, "global_step": 500831, "epoch": 2981} {"train_loss": -12.873416900634766, "global_step": 500832, "epoch": 2981} {"train_loss": -12.817093849182129, "global_step": 500833, "epoch": 2981} {"train_loss": -12.968917846679688, "global_step": 500834, "epoch": 2981} {"train_loss": -13.014720916748047, "global_step": 500835, "epoch": 2981} {"train_loss": -12.579568862915039, "global_step": 500836, "epoch": 2981} {"train_loss": -12.338683128356934, "global_step": 500837, "epoch": 2981} {"train_loss": -12.820610046386719, "global_step": 500838, "epoch": 2981} {"train_loss": -12.58822250366211, "global_step": 500839, "epoch": 2981} {"train_loss": -12.286784172058105, "global_step": 500840, "epoch": 2981} {"train_loss": -12.637726783752441, "global_step": 500841, "epoch": 2981} {"train_loss": -12.53065299987793, "global_step": 500842, "epoch": 2981} {"train_loss": -12.507165908813477, "global_step": 500843, "epoch": 2981} {"train_loss": -12.509515762329102, "global_step": 500844, "epoch": 2981} {"train_loss": -12.703372955322266, "global_step": 500845, "epoch": 2981} {"train_loss": -12.650760650634766, "global_step": 500846, "epoch": 2981} {"train_loss": -12.727558135986328, "global_step": 500847, "epoch": 2981} {"train_loss": -12.546777725219727, "global_step": 500848, "epoch": 2981} {"train_loss": -12.830081939697266, "global_step": 500849, "epoch": 2981} {"train_loss": -12.410815238952637, "global_step": 500850, "epoch": 2981} {"train_loss": -12.465599060058594, "global_step": 500851, "epoch": 2981} {"train_loss": -11.8531494140625, "global_step": 500852, "epoch": 2981} {"train_loss": -12.944019317626953, "global_step": 500853, "epoch": 2981} {"train_loss": -11.883816719055176, "global_step": 500854, "epoch": 2981} {"train_loss": -12.771635055541992, "global_step": 500855, "epoch": 2981} {"train_loss": -12.51456356048584, "global_step": 500856, "epoch": 2981} {"train_loss": -12.90726089477539, "global_step": 500857, "epoch": 2981} {"train_loss": -12.766117095947266, "global_step": 500858, "epoch": 2981} {"train_loss": -12.916522026062012, "global_step": 500859, "epoch": 2981} {"train_loss": -12.663778305053711, "global_step": 500860, "epoch": 2981} {"train_loss": -12.739747047424316, "global_step": 500861, "epoch": 2981} {"train_loss": -12.576884269714355, "global_step": 500862, "epoch": 2981} {"train_loss": -12.080435752868652, "global_step": 500863, "epoch": 2981} {"train_loss": -11.249176025390625, "global_step": 500864, "epoch": 2981} {"train_loss": -11.744394302368164, "global_step": 500865, "epoch": 2981} {"train_loss": -11.591989517211914, "global_step": 500866, "epoch": 2981} {"train_loss": -9.591706275939941, "global_step": 500867, "epoch": 2981} {"train_loss": -9.823997497558594, "global_step": 500868, "epoch": 2981} {"train_loss": -11.37625503540039, "global_step": 500869, "epoch": 2981} {"train_loss": -11.418622970581055, "global_step": 500870, "epoch": 2981} {"train_loss": -10.198616027832031, "global_step": 500871, "epoch": 2981} {"train_loss": -11.721022605895996, "global_step": 500872, "epoch": 2981} {"train_loss": -10.261155128479004, "global_step": 500873, "epoch": 2981} {"train_loss": -9.828566551208496, "global_step": 500874, "epoch": 2981} {"train_loss": -10.409235000610352, "global_step": 500875, "epoch": 2981} {"train_loss": -11.222704887390137, "global_step": 500876, "epoch": 2981} {"train_loss": -11.157291412353516, "global_step": 500877, "epoch": 2981} {"train_loss": -11.619464874267578, "global_step": 500878, "epoch": 2981} {"train_loss": -11.584280014038086, "global_step": 500879, "epoch": 2981} {"train_loss": -11.745302200317383, "global_step": 500880, "epoch": 2981} {"train_loss": -11.666690826416016, "global_step": 500881, "epoch": 2981} {"train_loss": -11.390039443969727, "global_step": 500882, "epoch": 2981} {"train_loss": -12.08023452758789, "global_step": 500883, "epoch": 2981} {"train_loss": -11.283377647399902, "global_step": 500884, "epoch": 2981} {"train_loss": -11.994380950927734, "global_step": 500885, "epoch": 2981} {"train_loss": -12.062202453613281, "global_step": 500886, "epoch": 2981} {"train_loss": -10.965816497802734, "global_step": 500887, "epoch": 2981} {"train_loss": -12.491554260253906, "global_step": 500888, "epoch": 2981} {"train_loss": -11.528939247131348, "global_step": 500889, "epoch": 2981} {"train_loss": -11.95339298248291, "global_step": 500890, "epoch": 2981} {"train_loss": -12.118675231933594, "global_step": 500891, "epoch": 2981} {"train_loss": -11.41843032836914, "global_step": 500892, "epoch": 2981} {"train_loss": -12.406515121459961, "global_step": 500893, "epoch": 2981} {"train_loss": -11.638080596923828, "global_step": 500894, "epoch": 2981} {"train_loss": -11.960274696350098, "global_step": 500895, "epoch": 2981} {"train_loss": -11.996554374694824, "global_step": 500896, "epoch": 2981} {"train_loss": -11.874603271484375, "global_step": 500897, "epoch": 2981} {"train_loss": -11.501800537109375, "global_step": 500898, "epoch": 2981} {"train_loss": -12.293785095214844, "global_step": 500899, "epoch": 2981} {"train_loss": -11.53350830078125, "global_step": 500900, "epoch": 2981} {"train_loss": -12.271888732910156, "global_step": 500901, "epoch": 2981} {"train_loss": -12.145233154296875, "global_step": 500902, "epoch": 2981} {"train_loss": -12.160545349121094, "global_step": 500903, "epoch": 2981} {"train_loss": -11.569862365722656, "global_step": 500904, "epoch": 2981} {"train_loss": -12.040441513061523, "global_step": 500905, "epoch": 2981} {"train_loss": -11.185099601745605, "global_step": 500906, "epoch": 2981} {"train_loss": -12.147806167602539, "global_step": 500907, "epoch": 2981} {"train_loss": -10.912425994873047, "global_step": 500908, "epoch": 2981} {"train_loss": -11.324880599975586, "global_step": 500909, "epoch": 2981} {"train_loss": -12.355382919311523, "global_step": 500910, "epoch": 2981} {"train_loss": -11.058688163757324, "global_step": 500911, "epoch": 2981} {"train_loss": -12.089035034179688, "global_step": 500912, "epoch": 2981} {"train_loss": -10.89364242553711, "global_step": 500913, "epoch": 2981} {"train_loss": -10.559707641601562, "global_step": 500914, "epoch": 2981} {"train_loss": -11.543611526489258, "global_step": 500915, "epoch": 2981} {"train_loss": -10.488659858703613, "global_step": 500916, "epoch": 2981} {"train_loss": -11.533655166625977, "global_step": 500917, "epoch": 2981} {"train_loss": -10.507322311401367, "global_step": 500918, "epoch": 2981} {"train_loss": -11.550342559814453, "global_step": 500919, "epoch": 2981} {"train_loss": -11.231054306030273, "global_step": 500920, "epoch": 2981} {"train_loss": -11.761463165283203, "global_step": 500921, "epoch": 2981} {"train_loss": -11.920421600341797, "global_step": 500922, "epoch": 2981} {"train_loss": -11.913078308105469, "global_step": 500923, "epoch": 2981} {"train_loss": -12.409361839294434, "global_step": 500924, "epoch": 2981} {"train_loss": -11.952583312988281, "global_step": 500925, "epoch": 2981} {"train_loss": -12.370850563049316, "global_step": 500926, "epoch": 2981} {"train_loss": -11.630609512329102, "global_step": 500927, "epoch": 2981} {"train_loss": -12.415948867797852, "global_step": 500928, "epoch": 2981} {"train_loss": -11.934747695922852, "global_step": 500929, "epoch": 2981} {"train_loss": -12.163725852966309, "global_step": 500930, "epoch": 2981} {"train_loss": -11.81416130065918, "global_step": 500931, "epoch": 2981} {"train_loss": -12.017066955566406, "global_step": 500932, "epoch": 2981} {"train_loss": -12.196340560913086, "global_step": 500933, "epoch": 2981} {"train_loss": -11.489999771118164, "global_step": 500934, "epoch": 2981} {"train_loss": -12.05087947845459, "global_step": 500935, "epoch": 2981} {"train_loss": -11.867584228515625, "global_step": 500936, "epoch": 2981} {"train_loss": -12.342536926269531, "global_step": 500937, "epoch": 2981} {"train_loss": -11.95565128326416, "global_step": 500938, "epoch": 2981} {"train_loss": -12.198169708251953, "global_step": 500939, "epoch": 2981} {"train_loss": -11.778908729553223, "global_step": 500940, "epoch": 2981} {"train_loss": -12.382522583007812, "global_step": 500941, "epoch": 2981} {"train_loss": -11.648665428161621, "global_step": 500942, "epoch": 2981} {"train_loss": -12.404244422912598, "global_step": 500943, "epoch": 2981} {"train_loss": -12.119553565979004, "global_step": 500944, "epoch": 2981} {"train_loss": -11.693304061889648, "global_step": 500945, "epoch": 2981} {"train_loss": -11.979545593261719, "global_step": 500946, "epoch": 2981} {"train_loss": -11.99089241027832, "global_step": 500947, "epoch": 2981} {"train_loss": -12.09492301940918, "global_step": 500948, "epoch": 2981} {"train_loss": -11.848570823669434, "global_step": 500949, "epoch": 2981} {"train_loss": -12.186653137207031, "global_step": 500950, "epoch": 2981} {"train_loss": -11.976165771484375, "global_step": 500951, "epoch": 2981} {"train_loss": -12.11986255645752, "global_step": 500952, "epoch": 2981} {"train_loss": -12.149190902709961, "global_step": 500953, "epoch": 2981} {"train_loss": -11.727339744567871, "global_step": 500954, "epoch": 2981} {"train_loss": -12.512269020080566, "global_step": 500955, "epoch": 2981} {"train_loss": -12.238018989562988, "global_step": 500956, "epoch": 2981} {"train_loss": -12.149985313415527, "global_step": 500957, "epoch": 2981} {"train_loss": -12.64854907989502, "global_step": 500958, "epoch": 2981} {"train_loss": -11.87015438079834, "global_step": 500959, "epoch": 2981} {"train_loss": -12.284940719604492, "global_step": 500960, "epoch": 2981} {"train_loss": -12.195337295532227, "global_step": 500961, "epoch": 2981} {"train_loss": -12.080120086669922, "global_step": 500962, "epoch": 2981} {"train_loss": -12.351263046264648, "global_step": 500963, "epoch": 2981} {"train_loss": -12.04539966583252, "global_step": 500964, "epoch": 2981} {"train_loss": -12.351268768310547, "global_step": 500965, "epoch": 2981} {"train_loss": -12.131803512573242, "global_step": 500966, "epoch": 2981} {"train_loss": -12.417547225952148, "global_step": 500967, "epoch": 2981} {"train_loss": -12.129926681518555, "global_step": 500968, "epoch": 2981} {"train_loss": -12.456379890441895, "global_step": 500969, "epoch": 2981} {"train_loss": -12.388997077941895, "global_step": 500970, "epoch": 2981} {"train_loss": -12.451740264892578, "global_step": 500971, "epoch": 2981} {"train_loss": -12.533087730407715, "global_step": 500972, "epoch": 2981} {"train_loss": -12.496094703674316, "global_step": 500973, "epoch": 2981} {"train_loss": -12.497638702392578, "global_step": 500974, "epoch": 2981} {"train_loss": -12.071512449355353, "global_step": 500975, "epoch": 2981, "val_loss": 321849.1875} {"train_loss": -12.13787841796875, "global_step": 500976, "epoch": 2982} {"train_loss": -12.705759048461914, "global_step": 500977, "epoch": 2982} {"train_loss": -12.33463191986084, "global_step": 500978, "epoch": 2982} {"train_loss": -12.600215911865234, "global_step": 500979, "epoch": 2982} {"train_loss": -12.547050476074219, "global_step": 500980, "epoch": 2982} {"train_loss": -12.435578346252441, "global_step": 500981, "epoch": 2982} {"train_loss": -12.781793594360352, "global_step": 500982, "epoch": 2982} {"train_loss": -12.487346649169922, "global_step": 500983, "epoch": 2982} {"train_loss": -12.597986221313477, "global_step": 500984, "epoch": 2982} {"train_loss": -12.466445922851562, "global_step": 500985, "epoch": 2982} {"train_loss": -12.480607032775879, "global_step": 500986, "epoch": 2982} {"train_loss": -12.538908004760742, "global_step": 500987, "epoch": 2982} {"train_loss": -12.57363224029541, "global_step": 500988, "epoch": 2982} {"train_loss": -12.639264106750488, "global_step": 500989, "epoch": 2982} {"train_loss": -12.704063415527344, "global_step": 500990, "epoch": 2982} {"train_loss": -12.846790313720703, "global_step": 500991, "epoch": 2982} {"train_loss": -12.82548713684082, "global_step": 500992, "epoch": 2982} {"train_loss": -12.756611824035645, "global_step": 500993, "epoch": 2982} {"train_loss": -12.76840591430664, "global_step": 500994, "epoch": 2982} {"train_loss": -12.7981595993042, "global_step": 500995, "epoch": 2982} {"train_loss": -12.887435913085938, "global_step": 500996, "epoch": 2982} {"train_loss": -12.805244445800781, "global_step": 500997, "epoch": 2982} {"train_loss": -12.671391487121582, "global_step": 500998, "epoch": 2982} {"train_loss": -12.573177337646484, "global_step": 500999, "epoch": 2982} {"train_loss": -12.749320030212402, "global_step": 501000, "epoch": 2982} {"train_loss": -12.511041641235352, "global_step": 501001, "epoch": 2982} {"train_loss": -12.787415504455566, "global_step": 501002, "epoch": 2982} {"train_loss": -12.527530670166016, "global_step": 501003, "epoch": 2982} {"train_loss": -12.8488130569458, "global_step": 501004, "epoch": 2982} {"train_loss": -12.728446960449219, "global_step": 501005, "epoch": 2982} {"train_loss": -12.672410011291504, "global_step": 501006, "epoch": 2982} {"train_loss": -13.050106048583984, "global_step": 501007, "epoch": 2982} {"train_loss": -12.815292358398438, "global_step": 501008, "epoch": 2982} {"train_loss": -12.801918029785156, "global_step": 501009, "epoch": 2982} {"train_loss": -13.065200805664062, "global_step": 501010, "epoch": 2982} {"train_loss": -12.68265151977539, "global_step": 501011, "epoch": 2982} {"train_loss": -12.916086196899414, "global_step": 501012, "epoch": 2982} {"train_loss": -12.982124328613281, "global_step": 501013, "epoch": 2982} {"train_loss": -12.590564727783203, "global_step": 501014, "epoch": 2982} {"train_loss": -12.866170883178711, "global_step": 501015, "epoch": 2982} {"train_loss": -12.806699752807617, "global_step": 501016, "epoch": 2982} {"train_loss": -12.591264724731445, "global_step": 501017, "epoch": 2982} {"train_loss": -12.777234077453613, "global_step": 501018, "epoch": 2982} {"train_loss": -12.98097038269043, "global_step": 501019, "epoch": 2982} {"train_loss": -13.020132064819336, "global_step": 501020, "epoch": 2982} {"train_loss": -12.94514274597168, "global_step": 501021, "epoch": 2982} {"train_loss": -12.920454025268555, "global_step": 501022, "epoch": 2982} {"train_loss": -12.948847770690918, "global_step": 501023, "epoch": 2982} {"train_loss": -12.939391136169434, "global_step": 501024, "epoch": 2982} {"train_loss": -13.076135635375977, "global_step": 501025, "epoch": 2982} {"train_loss": -12.877843856811523, "global_step": 501026, "epoch": 2982} {"train_loss": -12.855697631835938, "global_step": 501027, "epoch": 2982} {"train_loss": -12.843899726867676, "global_step": 501028, "epoch": 2982} {"train_loss": -12.878484725952148, "global_step": 501029, "epoch": 2982} {"train_loss": -12.85080337524414, "global_step": 501030, "epoch": 2982} {"train_loss": -12.872810363769531, "global_step": 501031, "epoch": 2982} {"train_loss": -12.81315803527832, "global_step": 501032, "epoch": 2982} {"train_loss": -13.065113067626953, "global_step": 501033, "epoch": 2982} {"train_loss": -12.716087341308594, "global_step": 501034, "epoch": 2982} {"train_loss": -12.86494255065918, "global_step": 501035, "epoch": 2982} {"train_loss": -12.92507553100586, "global_step": 501036, "epoch": 2982} {"train_loss": -12.709856033325195, "global_step": 501037, "epoch": 2982} {"train_loss": -12.856451034545898, "global_step": 501038, "epoch": 2982} {"train_loss": -12.911383628845215, "global_step": 501039, "epoch": 2982} {"train_loss": -12.76662826538086, "global_step": 501040, "epoch": 2982} {"train_loss": -12.545921325683594, "global_step": 501041, "epoch": 2982} {"train_loss": -12.712867736816406, "global_step": 501042, "epoch": 2982} {"train_loss": -12.780647277832031, "global_step": 501043, "epoch": 2982} {"train_loss": -12.181571006774902, "global_step": 501044, "epoch": 2982} {"train_loss": -12.830353736877441, "global_step": 501045, "epoch": 2982} {"train_loss": -12.770851135253906, "global_step": 501046, "epoch": 2982} {"train_loss": -12.846508979797363, "global_step": 501047, "epoch": 2982} {"train_loss": -12.762813568115234, "global_step": 501048, "epoch": 2982} {"train_loss": -12.623292922973633, "global_step": 501049, "epoch": 2982} {"train_loss": -12.592866897583008, "global_step": 501050, "epoch": 2982} {"train_loss": -12.896081924438477, "global_step": 501051, "epoch": 2982} {"train_loss": -12.802129745483398, "global_step": 501052, "epoch": 2982} {"train_loss": -12.759443283081055, "global_step": 501053, "epoch": 2982} {"train_loss": -12.513203620910645, "global_step": 501054, "epoch": 2982} {"train_loss": -11.963479995727539, "global_step": 501055, "epoch": 2982} {"train_loss": -12.273115158081055, "global_step": 501056, "epoch": 2982} {"train_loss": -12.483878135681152, "global_step": 501057, "epoch": 2982} {"train_loss": -11.456235885620117, "global_step": 501058, "epoch": 2982} {"train_loss": -11.54305648803711, "global_step": 501059, "epoch": 2982} {"train_loss": -12.330835342407227, "global_step": 501060, "epoch": 2982} {"train_loss": -11.682421684265137, "global_step": 501061, "epoch": 2982} {"train_loss": -11.321303367614746, "global_step": 501062, "epoch": 2982} {"train_loss": -11.35482120513916, "global_step": 501063, "epoch": 2982} {"train_loss": -12.186864852905273, "global_step": 501064, "epoch": 2982} {"train_loss": -10.054265975952148, "global_step": 501065, "epoch": 2982} {"train_loss": -12.191363334655762, "global_step": 501066, "epoch": 2982} {"train_loss": -11.689750671386719, "global_step": 501067, "epoch": 2982} {"train_loss": -12.765809059143066, "global_step": 501068, "epoch": 2982} {"train_loss": -11.930194854736328, "global_step": 501069, "epoch": 2982} {"train_loss": -12.583736419677734, "global_step": 501070, "epoch": 2982} {"train_loss": -11.850595474243164, "global_step": 501071, "epoch": 2982} {"train_loss": -12.743541717529297, "global_step": 501072, "epoch": 2982} {"train_loss": -12.195658683776855, "global_step": 501073, "epoch": 2982} {"train_loss": -12.412887573242188, "global_step": 501074, "epoch": 2982} {"train_loss": -11.19802188873291, "global_step": 501075, "epoch": 2982} {"train_loss": -11.236104965209961, "global_step": 501076, "epoch": 2982} {"train_loss": -11.734298706054688, "global_step": 501077, "epoch": 2982} {"train_loss": -10.559059143066406, "global_step": 501078, "epoch": 2982} {"train_loss": -12.201162338256836, "global_step": 501079, "epoch": 2982} {"train_loss": -10.845988273620605, "global_step": 501080, "epoch": 2982} {"train_loss": -12.057178497314453, "global_step": 501081, "epoch": 2982} {"train_loss": -11.40639591217041, "global_step": 501082, "epoch": 2982} {"train_loss": -11.913616180419922, "global_step": 501083, "epoch": 2982} {"train_loss": -12.193648338317871, "global_step": 501084, "epoch": 2982} {"train_loss": -11.788267135620117, "global_step": 501085, "epoch": 2982} {"train_loss": -12.515809059143066, "global_step": 501086, "epoch": 2982} {"train_loss": -12.324666023254395, "global_step": 501087, "epoch": 2982} {"train_loss": -11.966079711914062, "global_step": 501088, "epoch": 2982} {"train_loss": -12.062262535095215, "global_step": 501089, "epoch": 2982} {"train_loss": -12.316976547241211, "global_step": 501090, "epoch": 2982} {"train_loss": -12.199897766113281, "global_step": 501091, "epoch": 2982} {"train_loss": -12.773990631103516, "global_step": 501092, "epoch": 2982} {"train_loss": -12.127565383911133, "global_step": 501093, "epoch": 2982} {"train_loss": -12.747553825378418, "global_step": 501094, "epoch": 2982} {"train_loss": -12.242471694946289, "global_step": 501095, "epoch": 2982} {"train_loss": -12.745014190673828, "global_step": 501096, "epoch": 2982} {"train_loss": -12.17971420288086, "global_step": 501097, "epoch": 2982} {"train_loss": -12.73442268371582, "global_step": 501098, "epoch": 2982} {"train_loss": -12.140120506286621, "global_step": 501099, "epoch": 2982} {"train_loss": -12.699718475341797, "global_step": 501100, "epoch": 2982} {"train_loss": -12.240720748901367, "global_step": 501101, "epoch": 2982} {"train_loss": -12.66183090209961, "global_step": 501102, "epoch": 2982} {"train_loss": -12.772875785827637, "global_step": 501103, "epoch": 2982} {"train_loss": -12.599853515625, "global_step": 501104, "epoch": 2982} {"train_loss": -12.64677619934082, "global_step": 501105, "epoch": 2982} {"train_loss": -12.328283309936523, "global_step": 501106, "epoch": 2982} {"train_loss": -12.784219741821289, "global_step": 501107, "epoch": 2982} {"train_loss": -12.642330169677734, "global_step": 501108, "epoch": 2982} {"train_loss": -12.923649787902832, "global_step": 501109, "epoch": 2982} {"train_loss": -13.067178726196289, "global_step": 501110, "epoch": 2982} {"train_loss": -12.866806983947754, "global_step": 501111, "epoch": 2982} {"train_loss": -12.988885879516602, "global_step": 501112, "epoch": 2982} {"train_loss": -13.034424781799316, "global_step": 501113, "epoch": 2982} {"train_loss": -12.691235542297363, "global_step": 501114, "epoch": 2982} {"train_loss": -12.930233001708984, "global_step": 501115, "epoch": 2982} {"train_loss": -12.937225341796875, "global_step": 501116, "epoch": 2982} {"train_loss": -13.114133834838867, "global_step": 501117, "epoch": 2982} {"train_loss": -12.914129257202148, "global_step": 501118, "epoch": 2982} {"train_loss": -12.957015037536621, "global_step": 501119, "epoch": 2982} {"train_loss": -13.011664390563965, "global_step": 501120, "epoch": 2982} {"train_loss": -13.130399703979492, "global_step": 501121, "epoch": 2982} {"train_loss": -13.010419845581055, "global_step": 501122, "epoch": 2982} {"train_loss": -12.964804649353027, "global_step": 501123, "epoch": 2982} {"train_loss": -13.118408203125, "global_step": 501124, "epoch": 2982} {"train_loss": -12.97999382019043, "global_step": 501125, "epoch": 2982} {"train_loss": -13.002298355102539, "global_step": 501126, "epoch": 2982} {"train_loss": -12.8858003616333, "global_step": 501127, "epoch": 2982} {"train_loss": -13.160638809204102, "global_step": 501128, "epoch": 2982} {"train_loss": -13.125995635986328, "global_step": 501129, "epoch": 2982} {"train_loss": -12.972698211669922, "global_step": 501130, "epoch": 2982} {"train_loss": -13.093255043029785, "global_step": 501131, "epoch": 2982} {"train_loss": -12.830181121826172, "global_step": 501132, "epoch": 2982} {"train_loss": -13.064496994018555, "global_step": 501133, "epoch": 2982} {"train_loss": -12.931533813476562, "global_step": 501134, "epoch": 2982} {"train_loss": -12.998868942260742, "global_step": 501135, "epoch": 2982} {"train_loss": -13.016374588012695, "global_step": 501136, "epoch": 2982} {"train_loss": -12.717344284057617, "global_step": 501137, "epoch": 2982} {"train_loss": -12.58963394165039, "global_step": 501138, "epoch": 2982} {"train_loss": -13.020727157592773, "global_step": 501139, "epoch": 2982} {"train_loss": -13.042596817016602, "global_step": 501140, "epoch": 2982} {"train_loss": -12.473489761352539, "global_step": 501141, "epoch": 2982} {"train_loss": -11.837369918823242, "global_step": 501142, "epoch": 2982} {"train_loss": -12.569366415341696, "global_step": 501143, "epoch": 2982, "val_loss": 317844.625} {"train_loss": -12.718984603881836, "global_step": 501144, "epoch": 2983} {"train_loss": -11.427271842956543, "global_step": 501145, "epoch": 2983} {"train_loss": -12.062356948852539, "global_step": 501146, "epoch": 2983} {"train_loss": -11.770918846130371, "global_step": 501147, "epoch": 2983} {"train_loss": -10.00345516204834, "global_step": 501148, "epoch": 2983} {"train_loss": -11.659832954406738, "global_step": 501149, "epoch": 2983} {"train_loss": -9.019306182861328, "global_step": 501150, "epoch": 2983} {"train_loss": -11.130298614501953, "global_step": 501151, "epoch": 2983} {"train_loss": -10.912129402160645, "global_step": 501152, "epoch": 2983} {"train_loss": -11.8299560546875, "global_step": 501153, "epoch": 2983} {"train_loss": -9.034929275512695, "global_step": 501154, "epoch": 2983} {"train_loss": -11.683895111083984, "global_step": 501155, "epoch": 2983} {"train_loss": -8.431110382080078, "global_step": 501156, "epoch": 2983} {"train_loss": -10.858449935913086, "global_step": 501157, "epoch": 2983} {"train_loss": -8.790838241577148, "global_step": 501158, "epoch": 2983} {"train_loss": -8.913365364074707, "global_step": 501159, "epoch": 2983} {"train_loss": -10.351197242736816, "global_step": 501160, "epoch": 2983} {"train_loss": -9.484073638916016, "global_step": 501161, "epoch": 2983} {"train_loss": -9.148757934570312, "global_step": 501162, "epoch": 2983} {"train_loss": -11.290974617004395, "global_step": 501163, "epoch": 2983} {"train_loss": -9.36865520477295, "global_step": 501164, "epoch": 2983} {"train_loss": -11.013341903686523, "global_step": 501165, "epoch": 2983} {"train_loss": -10.648331642150879, "global_step": 501166, "epoch": 2983} {"train_loss": -9.872808456420898, "global_step": 501167, "epoch": 2983} {"train_loss": -9.06214714050293, "global_step": 501168, "epoch": 2983} {"train_loss": -9.407995223999023, "global_step": 501169, "epoch": 2983} {"train_loss": -11.127693176269531, "global_step": 501170, "epoch": 2983} {"train_loss": -11.514566421508789, "global_step": 501171, "epoch": 2983} {"train_loss": -8.850902557373047, "global_step": 501172, "epoch": 2983} {"train_loss": -9.522216796875, "global_step": 501173, "epoch": 2983} {"train_loss": -10.980243682861328, "global_step": 501174, "epoch": 2983} {"train_loss": -9.676156997680664, "global_step": 501175, "epoch": 2983} {"train_loss": -9.32071590423584, "global_step": 501176, "epoch": 2983} {"train_loss": -10.447386741638184, "global_step": 501177, "epoch": 2983} {"train_loss": -10.093345642089844, "global_step": 501178, "epoch": 2983} {"train_loss": -10.265113830566406, "global_step": 501179, "epoch": 2983} {"train_loss": -9.913392066955566, "global_step": 501180, "epoch": 2983} {"train_loss": -10.162610054016113, "global_step": 501181, "epoch": 2983} {"train_loss": -10.101296424865723, "global_step": 501182, "epoch": 2983} {"train_loss": -10.686895370483398, "global_step": 501183, "epoch": 2983} {"train_loss": -9.8922119140625, "global_step": 501184, "epoch": 2983} {"train_loss": -10.330805778503418, "global_step": 501185, "epoch": 2983} {"train_loss": -11.07373332977295, "global_step": 501186, "epoch": 2983} {"train_loss": -10.751779556274414, "global_step": 501187, "epoch": 2983} {"train_loss": -11.220439910888672, "global_step": 501188, "epoch": 2983} {"train_loss": -11.154561042785645, "global_step": 501189, "epoch": 2983} {"train_loss": -11.644558906555176, "global_step": 501190, "epoch": 2983} {"train_loss": -11.243515014648438, "global_step": 501191, "epoch": 2983} {"train_loss": -11.456303596496582, "global_step": 501192, "epoch": 2983} {"train_loss": -11.96381664276123, "global_step": 501193, "epoch": 2983} {"train_loss": -10.86771011352539, "global_step": 501194, "epoch": 2983} {"train_loss": -11.40323257446289, "global_step": 501195, "epoch": 2983} {"train_loss": -11.88230037689209, "global_step": 501196, "epoch": 2983} {"train_loss": -11.764070510864258, "global_step": 501197, "epoch": 2983} {"train_loss": -11.434696197509766, "global_step": 501198, "epoch": 2983} {"train_loss": -11.787212371826172, "global_step": 501199, "epoch": 2983} {"train_loss": -11.416593551635742, "global_step": 501200, "epoch": 2983} {"train_loss": -11.885417938232422, "global_step": 501201, "epoch": 2983} {"train_loss": -11.681811332702637, "global_step": 501202, "epoch": 2983} {"train_loss": -11.409748077392578, "global_step": 501203, "epoch": 2983} {"train_loss": -11.891214370727539, "global_step": 501204, "epoch": 2983} {"train_loss": -11.610809326171875, "global_step": 501205, "epoch": 2983} {"train_loss": -10.869757652282715, "global_step": 501206, "epoch": 2983} {"train_loss": -11.319223403930664, "global_step": 501207, "epoch": 2983} {"train_loss": -11.723276138305664, "global_step": 501208, "epoch": 2983} {"train_loss": -12.071557998657227, "global_step": 501209, "epoch": 2983} {"train_loss": -11.83624267578125, "global_step": 501210, "epoch": 2983} {"train_loss": -11.898347854614258, "global_step": 501211, "epoch": 2983} {"train_loss": -12.03584098815918, "global_step": 501212, "epoch": 2983} {"train_loss": -11.945924758911133, "global_step": 501213, "epoch": 2983} {"train_loss": -11.647905349731445, "global_step": 501214, "epoch": 2983} {"train_loss": -11.370658874511719, "global_step": 501215, "epoch": 2983} {"train_loss": -11.83210563659668, "global_step": 501216, "epoch": 2983} {"train_loss": -11.798562049865723, "global_step": 501217, "epoch": 2983} {"train_loss": -12.027134895324707, "global_step": 501218, "epoch": 2983} {"train_loss": -12.174860000610352, "global_step": 501219, "epoch": 2983} {"train_loss": -12.375029563903809, "global_step": 501220, "epoch": 2983} {"train_loss": -12.21420669555664, "global_step": 501221, "epoch": 2983} {"train_loss": -12.357038497924805, "global_step": 501222, "epoch": 2983} {"train_loss": -12.117132186889648, "global_step": 501223, "epoch": 2983} {"train_loss": -12.105230331420898, "global_step": 501224, "epoch": 2983} {"train_loss": -12.498181343078613, "global_step": 501225, "epoch": 2983} {"train_loss": -12.216949462890625, "global_step": 501226, "epoch": 2983} {"train_loss": -12.215471267700195, "global_step": 501227, "epoch": 2983} {"train_loss": -12.552217483520508, "global_step": 501228, "epoch": 2983} {"train_loss": -12.323495864868164, "global_step": 501229, "epoch": 2983} {"train_loss": -12.222909927368164, "global_step": 501230, "epoch": 2983} {"train_loss": -12.527334213256836, "global_step": 501231, "epoch": 2983} {"train_loss": -12.48481559753418, "global_step": 501232, "epoch": 2983} {"train_loss": -12.22240161895752, "global_step": 501233, "epoch": 2983} {"train_loss": -12.54073715209961, "global_step": 501234, "epoch": 2983} {"train_loss": -12.582056045532227, "global_step": 501235, "epoch": 2983} {"train_loss": -12.607643127441406, "global_step": 501236, "epoch": 2983} {"train_loss": -12.718281745910645, "global_step": 501237, "epoch": 2983} {"train_loss": -12.748046875, "global_step": 501238, "epoch": 2983} {"train_loss": -12.637063026428223, "global_step": 501239, "epoch": 2983} {"train_loss": -12.61083698272705, "global_step": 501240, "epoch": 2983} {"train_loss": -12.491169929504395, "global_step": 501241, "epoch": 2983} {"train_loss": -12.607651710510254, "global_step": 501242, "epoch": 2983} {"train_loss": -12.692910194396973, "global_step": 501243, "epoch": 2983} {"train_loss": -12.62657356262207, "global_step": 501244, "epoch": 2983} {"train_loss": -12.624492645263672, "global_step": 501245, "epoch": 2983} {"train_loss": -12.609602928161621, "global_step": 501246, "epoch": 2983} {"train_loss": -12.592727661132812, "global_step": 501247, "epoch": 2983} {"train_loss": -12.650568008422852, "global_step": 501248, "epoch": 2983} {"train_loss": -12.64721393585205, "global_step": 501249, "epoch": 2983} {"train_loss": -12.568231582641602, "global_step": 501250, "epoch": 2983} {"train_loss": -12.854640007019043, "global_step": 501251, "epoch": 2983} {"train_loss": -12.666488647460938, "global_step": 501252, "epoch": 2983} {"train_loss": -12.833110809326172, "global_step": 501253, "epoch": 2983} {"train_loss": -12.797246932983398, "global_step": 501254, "epoch": 2983} {"train_loss": -12.878433227539062, "global_step": 501255, "epoch": 2983} {"train_loss": -12.809425354003906, "global_step": 501256, "epoch": 2983} {"train_loss": -12.799015998840332, "global_step": 501257, "epoch": 2983} {"train_loss": -12.729379653930664, "global_step": 501258, "epoch": 2983} {"train_loss": -12.696964263916016, "global_step": 501259, "epoch": 2983} {"train_loss": -12.755804061889648, "global_step": 501260, "epoch": 2983} {"train_loss": -12.508392333984375, "global_step": 501261, "epoch": 2983} {"train_loss": -12.275781631469727, "global_step": 501262, "epoch": 2983} {"train_loss": -12.435569763183594, "global_step": 501263, "epoch": 2983} {"train_loss": -12.846475601196289, "global_step": 501264, "epoch": 2983} {"train_loss": -12.299088478088379, "global_step": 501265, "epoch": 2983} {"train_loss": -12.549551010131836, "global_step": 501266, "epoch": 2983} {"train_loss": -12.708559036254883, "global_step": 501267, "epoch": 2983} {"train_loss": -12.591049194335938, "global_step": 501268, "epoch": 2983} {"train_loss": -12.33714485168457, "global_step": 501269, "epoch": 2983} {"train_loss": -12.82345199584961, "global_step": 501270, "epoch": 2983} {"train_loss": -12.216373443603516, "global_step": 501271, "epoch": 2983} {"train_loss": -12.76385498046875, "global_step": 501272, "epoch": 2983} {"train_loss": -12.808673858642578, "global_step": 501273, "epoch": 2983} {"train_loss": -12.826623916625977, "global_step": 501274, "epoch": 2983} {"train_loss": -12.730560302734375, "global_step": 501275, "epoch": 2983} {"train_loss": -12.704024314880371, "global_step": 501276, "epoch": 2983} {"train_loss": -12.608708381652832, "global_step": 501277, "epoch": 2983} {"train_loss": -12.902868270874023, "global_step": 501278, "epoch": 2983} {"train_loss": -12.667197227478027, "global_step": 501279, "epoch": 2983} {"train_loss": -12.966155052185059, "global_step": 501280, "epoch": 2983} {"train_loss": -12.979728698730469, "global_step": 501281, "epoch": 2983} {"train_loss": -13.017461776733398, "global_step": 501282, "epoch": 2983} {"train_loss": -12.832247734069824, "global_step": 501283, "epoch": 2983} {"train_loss": -12.935426712036133, "global_step": 501284, "epoch": 2983} {"train_loss": -12.747732162475586, "global_step": 501285, "epoch": 2983} {"train_loss": -12.992311477661133, "global_step": 501286, "epoch": 2983} {"train_loss": -12.936748504638672, "global_step": 501287, "epoch": 2983} {"train_loss": -12.966070175170898, "global_step": 501288, "epoch": 2983} {"train_loss": -12.888484954833984, "global_step": 501289, "epoch": 2983} {"train_loss": -12.930280685424805, "global_step": 501290, "epoch": 2983} {"train_loss": -12.821134567260742, "global_step": 501291, "epoch": 2983} {"train_loss": -12.81861686706543, "global_step": 501292, "epoch": 2983} {"train_loss": -13.144950866699219, "global_step": 501293, "epoch": 2983} {"train_loss": -12.88881778717041, "global_step": 501294, "epoch": 2983} {"train_loss": -12.946113586425781, "global_step": 501295, "epoch": 2983} {"train_loss": -12.890254974365234, "global_step": 501296, "epoch": 2983} {"train_loss": -12.96853256225586, "global_step": 501297, "epoch": 2983} {"train_loss": -12.827293395996094, "global_step": 501298, "epoch": 2983} {"train_loss": -13.081586837768555, "global_step": 501299, "epoch": 2983} {"train_loss": -12.963102340698242, "global_step": 501300, "epoch": 2983} {"train_loss": -12.86279296875, "global_step": 501301, "epoch": 2983} {"train_loss": -12.806806564331055, "global_step": 501302, "epoch": 2983} {"train_loss": -12.866268157958984, "global_step": 501303, "epoch": 2983} {"train_loss": -12.995360374450684, "global_step": 501304, "epoch": 2983} {"train_loss": -12.78032398223877, "global_step": 501305, "epoch": 2983} {"train_loss": -12.982624053955078, "global_step": 501306, "epoch": 2983} {"train_loss": -13.005802154541016, "global_step": 501307, "epoch": 2983} {"train_loss": -12.783677101135254, "global_step": 501308, "epoch": 2983} {"train_loss": -12.743799209594727, "global_step": 501309, "epoch": 2983} {"train_loss": -12.375432968139648, "global_step": 501310, "epoch": 2983} {"train_loss": -11.863782587505522, "global_step": 501311, "epoch": 2983, "val_loss": 320596.90625} {"train_loss": -9.66373062133789, "global_step": 501312, "epoch": 2984} {"train_loss": -10.683756828308105, "global_step": 501313, "epoch": 2984} {"train_loss": -12.37973403930664, "global_step": 501314, "epoch": 2984} {"train_loss": -10.266501426696777, "global_step": 501315, "epoch": 2984} {"train_loss": -10.81930160522461, "global_step": 501316, "epoch": 2984} {"train_loss": -11.5714111328125, "global_step": 501317, "epoch": 2984} {"train_loss": -11.090577125549316, "global_step": 501318, "epoch": 2984} {"train_loss": -12.121265411376953, "global_step": 501319, "epoch": 2984} {"train_loss": -9.72055435180664, "global_step": 501320, "epoch": 2984} {"train_loss": -10.836307525634766, "global_step": 501321, "epoch": 2984} {"train_loss": -9.679088592529297, "global_step": 501322, "epoch": 2984} {"train_loss": -10.143831253051758, "global_step": 501323, "epoch": 2984} {"train_loss": -10.992036819458008, "global_step": 501324, "epoch": 2984} {"train_loss": -10.609114646911621, "global_step": 501325, "epoch": 2984} {"train_loss": -9.997827529907227, "global_step": 501326, "epoch": 2984} {"train_loss": -9.375642776489258, "global_step": 501327, "epoch": 2984} {"train_loss": -10.93453598022461, "global_step": 501328, "epoch": 2984} {"train_loss": -10.660970687866211, "global_step": 501329, "epoch": 2984} {"train_loss": -10.388463973999023, "global_step": 501330, "epoch": 2984} {"train_loss": -11.862289428710938, "global_step": 501331, "epoch": 2984} {"train_loss": -10.139758110046387, "global_step": 501332, "epoch": 2984} {"train_loss": -11.644859313964844, "global_step": 501333, "epoch": 2984} {"train_loss": -11.314228057861328, "global_step": 501334, "epoch": 2984} {"train_loss": -11.861912727355957, "global_step": 501335, "epoch": 2984} {"train_loss": -11.565549850463867, "global_step": 501336, "epoch": 2984} {"train_loss": -11.93669319152832, "global_step": 501337, "epoch": 2984} {"train_loss": -11.370098114013672, "global_step": 501338, "epoch": 2984} {"train_loss": -11.946407318115234, "global_step": 501339, "epoch": 2984} {"train_loss": -12.340559005737305, "global_step": 501340, "epoch": 2984} {"train_loss": -11.388025283813477, "global_step": 501341, "epoch": 2984} {"train_loss": -11.692327499389648, "global_step": 501342, "epoch": 2984} {"train_loss": -12.065896987915039, "global_step": 501343, "epoch": 2984} {"train_loss": -11.772785186767578, "global_step": 501344, "epoch": 2984} {"train_loss": -11.75455093383789, "global_step": 501345, "epoch": 2984} {"train_loss": -12.227724075317383, "global_step": 501346, "epoch": 2984} {"train_loss": -11.997339248657227, "global_step": 501347, "epoch": 2984} {"train_loss": -12.240165710449219, "global_step": 501348, "epoch": 2984} {"train_loss": -12.198919296264648, "global_step": 501349, "epoch": 2984} {"train_loss": -12.212260246276855, "global_step": 501350, "epoch": 2984} {"train_loss": -12.369735717773438, "global_step": 501351, "epoch": 2984} {"train_loss": -12.1168212890625, "global_step": 501352, "epoch": 2984} {"train_loss": -12.508979797363281, "global_step": 501353, "epoch": 2984} {"train_loss": -12.206690788269043, "global_step": 501354, "epoch": 2984} {"train_loss": -12.200973510742188, "global_step": 501355, "epoch": 2984} {"train_loss": -12.30826187133789, "global_step": 501356, "epoch": 2984} {"train_loss": -12.268596649169922, "global_step": 501357, "epoch": 2984} {"train_loss": -12.37501335144043, "global_step": 501358, "epoch": 2984} {"train_loss": -11.985368728637695, "global_step": 501359, "epoch": 2984} {"train_loss": -12.346997261047363, "global_step": 501360, "epoch": 2984} {"train_loss": -12.240981101989746, "global_step": 501361, "epoch": 2984} {"train_loss": -12.65916633605957, "global_step": 501362, "epoch": 2984} {"train_loss": -12.464503288269043, "global_step": 501363, "epoch": 2984} {"train_loss": -12.50933837890625, "global_step": 501364, "epoch": 2984} {"train_loss": -12.651874542236328, "global_step": 501365, "epoch": 2984} {"train_loss": -12.603415489196777, "global_step": 501366, "epoch": 2984} {"train_loss": -12.534910202026367, "global_step": 501367, "epoch": 2984} {"train_loss": -12.807339668273926, "global_step": 501368, "epoch": 2984} {"train_loss": -12.556722640991211, "global_step": 501369, "epoch": 2984} {"train_loss": -12.828413009643555, "global_step": 501370, "epoch": 2984} {"train_loss": -12.2454195022583, "global_step": 501371, "epoch": 2984} {"train_loss": -12.62398910522461, "global_step": 501372, "epoch": 2984} {"train_loss": -12.441286087036133, "global_step": 501373, "epoch": 2984} {"train_loss": -12.839778900146484, "global_step": 501374, "epoch": 2984} {"train_loss": -12.331551551818848, "global_step": 501375, "epoch": 2984} {"train_loss": -12.646982192993164, "global_step": 501376, "epoch": 2984} {"train_loss": -12.396479606628418, "global_step": 501377, "epoch": 2984} {"train_loss": -12.412454605102539, "global_step": 501378, "epoch": 2984} {"train_loss": -12.693490028381348, "global_step": 501379, "epoch": 2984} {"train_loss": -12.592864036560059, "global_step": 501380, "epoch": 2984} {"train_loss": -12.285871505737305, "global_step": 501381, "epoch": 2984} {"train_loss": -12.850126266479492, "global_step": 501382, "epoch": 2984} {"train_loss": -12.394950866699219, "global_step": 501383, "epoch": 2984} {"train_loss": -12.56529426574707, "global_step": 501384, "epoch": 2984} {"train_loss": -12.606507301330566, "global_step": 501385, "epoch": 2984} {"train_loss": -12.569234848022461, "global_step": 501386, "epoch": 2984} {"train_loss": -12.702823638916016, "global_step": 501387, "epoch": 2984} {"train_loss": -12.52734375, "global_step": 501388, "epoch": 2984} {"train_loss": -12.632707595825195, "global_step": 501389, "epoch": 2984} {"train_loss": -12.677261352539062, "global_step": 501390, "epoch": 2984} {"train_loss": -12.832332611083984, "global_step": 501391, "epoch": 2984} {"train_loss": -12.698165893554688, "global_step": 501392, "epoch": 2984} {"train_loss": -12.704436302185059, "global_step": 501393, "epoch": 2984} {"train_loss": -12.686090469360352, "global_step": 501394, "epoch": 2984} {"train_loss": -12.66208553314209, "global_step": 501395, "epoch": 2984} {"train_loss": -12.71230697631836, "global_step": 501396, "epoch": 2984} {"train_loss": -12.74284553527832, "global_step": 501397, "epoch": 2984} {"train_loss": -12.752975463867188, "global_step": 501398, "epoch": 2984} {"train_loss": -12.501168251037598, "global_step": 501399, "epoch": 2984} {"train_loss": -12.755277633666992, "global_step": 501400, "epoch": 2984} {"train_loss": -12.786979675292969, "global_step": 501401, "epoch": 2984} {"train_loss": -12.955371856689453, "global_step": 501402, "epoch": 2984} {"train_loss": -12.621162414550781, "global_step": 501403, "epoch": 2984} {"train_loss": -12.72742748260498, "global_step": 501404, "epoch": 2984} {"train_loss": -12.866106033325195, "global_step": 501405, "epoch": 2984} {"train_loss": -12.579237937927246, "global_step": 501406, "epoch": 2984} {"train_loss": -12.583624839782715, "global_step": 501407, "epoch": 2984} {"train_loss": -12.70328140258789, "global_step": 501408, "epoch": 2984} {"train_loss": -12.290939331054688, "global_step": 501409, "epoch": 2984} {"train_loss": -12.241240501403809, "global_step": 501410, "epoch": 2984} {"train_loss": -12.751192092895508, "global_step": 501411, "epoch": 2984} {"train_loss": -12.838583946228027, "global_step": 501412, "epoch": 2984} {"train_loss": -12.535533905029297, "global_step": 501413, "epoch": 2984} {"train_loss": -12.688729286193848, "global_step": 501414, "epoch": 2984} {"train_loss": -12.647994041442871, "global_step": 501415, "epoch": 2984} {"train_loss": -12.585030555725098, "global_step": 501416, "epoch": 2984} {"train_loss": -12.804348945617676, "global_step": 501417, "epoch": 2984} {"train_loss": -12.380657196044922, "global_step": 501418, "epoch": 2984} {"train_loss": -12.784035682678223, "global_step": 501419, "epoch": 2984} {"train_loss": -12.887908935546875, "global_step": 501420, "epoch": 2984} {"train_loss": -12.732771873474121, "global_step": 501421, "epoch": 2984} {"train_loss": -12.61942195892334, "global_step": 501422, "epoch": 2984} {"train_loss": -12.876553535461426, "global_step": 501423, "epoch": 2984} {"train_loss": -12.93305778503418, "global_step": 501424, "epoch": 2984} {"train_loss": -12.417808532714844, "global_step": 501425, "epoch": 2984} {"train_loss": -12.605780601501465, "global_step": 501426, "epoch": 2984} {"train_loss": -12.486883163452148, "global_step": 501427, "epoch": 2984} {"train_loss": -12.799981117248535, "global_step": 501428, "epoch": 2984} {"train_loss": -12.552204132080078, "global_step": 501429, "epoch": 2984} {"train_loss": -12.563742637634277, "global_step": 501430, "epoch": 2984} {"train_loss": -12.643434524536133, "global_step": 501431, "epoch": 2984} {"train_loss": -12.996456146240234, "global_step": 501432, "epoch": 2984} {"train_loss": -12.591340065002441, "global_step": 501433, "epoch": 2984} {"train_loss": -12.466675758361816, "global_step": 501434, "epoch": 2984} {"train_loss": -11.818124771118164, "global_step": 501435, "epoch": 2984} {"train_loss": -12.897680282592773, "global_step": 501436, "epoch": 2984} {"train_loss": -11.788616180419922, "global_step": 501437, "epoch": 2984} {"train_loss": -11.704681396484375, "global_step": 501438, "epoch": 2984} {"train_loss": -12.335763931274414, "global_step": 501439, "epoch": 2984} {"train_loss": -12.552282333374023, "global_step": 501440, "epoch": 2984} {"train_loss": -10.226457595825195, "global_step": 501441, "epoch": 2984} {"train_loss": -12.505796432495117, "global_step": 501442, "epoch": 2984} {"train_loss": -11.390569686889648, "global_step": 501443, "epoch": 2984} {"train_loss": -11.406432151794434, "global_step": 501444, "epoch": 2984} {"train_loss": -11.284356117248535, "global_step": 501445, "epoch": 2984} {"train_loss": -10.373278617858887, "global_step": 501446, "epoch": 2984} {"train_loss": -11.89857292175293, "global_step": 501447, "epoch": 2984} {"train_loss": -9.66943359375, "global_step": 501448, "epoch": 2984} {"train_loss": -11.260940551757812, "global_step": 501449, "epoch": 2984} {"train_loss": -11.77413558959961, "global_step": 501450, "epoch": 2984} {"train_loss": -10.606184005737305, "global_step": 501451, "epoch": 2984} {"train_loss": -11.872575759887695, "global_step": 501452, "epoch": 2984} {"train_loss": -11.301353454589844, "global_step": 501453, "epoch": 2984} {"train_loss": -11.238128662109375, "global_step": 501454, "epoch": 2984} {"train_loss": -11.673198699951172, "global_step": 501455, "epoch": 2984} {"train_loss": -12.675987243652344, "global_step": 501456, "epoch": 2984} {"train_loss": -11.579105377197266, "global_step": 501457, "epoch": 2984} {"train_loss": -12.199420928955078, "global_step": 501458, "epoch": 2984} {"train_loss": -12.144888877868652, "global_step": 501459, "epoch": 2984} {"train_loss": -11.319751739501953, "global_step": 501460, "epoch": 2984} {"train_loss": -12.606657028198242, "global_step": 501461, "epoch": 2984} {"train_loss": -10.497272491455078, "global_step": 501462, "epoch": 2984} {"train_loss": -11.73755931854248, "global_step": 501463, "epoch": 2984} {"train_loss": -11.669330596923828, "global_step": 501464, "epoch": 2984} {"train_loss": -11.235508918762207, "global_step": 501465, "epoch": 2984} {"train_loss": -10.56956672668457, "global_step": 501466, "epoch": 2984} {"train_loss": -11.849676132202148, "global_step": 501467, "epoch": 2984} {"train_loss": -10.153736114501953, "global_step": 501468, "epoch": 2984} {"train_loss": -11.740043640136719, "global_step": 501469, "epoch": 2984} {"train_loss": -10.347689628601074, "global_step": 501470, "epoch": 2984} {"train_loss": -10.941316604614258, "global_step": 501471, "epoch": 2984} {"train_loss": -11.287582397460938, "global_step": 501472, "epoch": 2984} {"train_loss": -11.110929489135742, "global_step": 501473, "epoch": 2984} {"train_loss": -10.871297836303711, "global_step": 501474, "epoch": 2984} {"train_loss": -10.613210678100586, "global_step": 501475, "epoch": 2984} {"train_loss": -11.422616958618164, "global_step": 501476, "epoch": 2984} {"train_loss": -10.198506355285645, "global_step": 501477, "epoch": 2984} {"train_loss": -11.308690071105957, "global_step": 501478, "epoch": 2984} {"train_loss": -11.946301755451021, "global_step": 501479, "epoch": 2984, "val_loss": 318591.09375} {"train_loss": -10.439250946044922, "global_step": 501480, "epoch": 2985} {"train_loss": -11.09378433227539, "global_step": 501481, "epoch": 2985} {"train_loss": -11.096796035766602, "global_step": 501482, "epoch": 2985} {"train_loss": -10.487714767456055, "global_step": 501483, "epoch": 2985} {"train_loss": -10.198678970336914, "global_step": 501484, "epoch": 2985} {"train_loss": -9.481792449951172, "global_step": 501485, "epoch": 2985} {"train_loss": -10.02650260925293, "global_step": 501486, "epoch": 2985} {"train_loss": -10.142656326293945, "global_step": 501487, "epoch": 2985} {"train_loss": -11.185083389282227, "global_step": 501488, "epoch": 2985} {"train_loss": -10.200000762939453, "global_step": 501489, "epoch": 2985} {"train_loss": -10.813594818115234, "global_step": 501490, "epoch": 2985} {"train_loss": -11.469427108764648, "global_step": 501491, "epoch": 2985} {"train_loss": -10.235170364379883, "global_step": 501492, "epoch": 2985} {"train_loss": -10.295721054077148, "global_step": 501493, "epoch": 2985} {"train_loss": -11.262776374816895, "global_step": 501494, "epoch": 2985} {"train_loss": -11.3637113571167, "global_step": 501495, "epoch": 2985} {"train_loss": -10.751861572265625, "global_step": 501496, "epoch": 2985} {"train_loss": -11.5018310546875, "global_step": 501497, "epoch": 2985} {"train_loss": -10.855788230895996, "global_step": 501498, "epoch": 2985} {"train_loss": -11.83611011505127, "global_step": 501499, "epoch": 2985} {"train_loss": -11.498695373535156, "global_step": 501500, "epoch": 2985} {"train_loss": -11.309398651123047, "global_step": 501501, "epoch": 2985} {"train_loss": -11.164498329162598, "global_step": 501502, "epoch": 2985} {"train_loss": -10.916318893432617, "global_step": 501503, "epoch": 2985} {"train_loss": -10.354713439941406, "global_step": 501504, "epoch": 2985} {"train_loss": -11.210036277770996, "global_step": 501505, "epoch": 2985} {"train_loss": -11.464462280273438, "global_step": 501506, "epoch": 2985} {"train_loss": -10.433387756347656, "global_step": 501507, "epoch": 2985} {"train_loss": -10.106340408325195, "global_step": 501508, "epoch": 2985} {"train_loss": -11.231719970703125, "global_step": 501509, "epoch": 2985} {"train_loss": -11.521533966064453, "global_step": 501510, "epoch": 2985} {"train_loss": -11.002801895141602, "global_step": 501511, "epoch": 2985} {"train_loss": -12.077821731567383, "global_step": 501512, "epoch": 2985} {"train_loss": -11.423126220703125, "global_step": 501513, "epoch": 2985} {"train_loss": -11.964225769042969, "global_step": 501514, "epoch": 2985} {"train_loss": -11.550439834594727, "global_step": 501515, "epoch": 2985} {"train_loss": -11.991026878356934, "global_step": 501516, "epoch": 2985} {"train_loss": -11.662202835083008, "global_step": 501517, "epoch": 2985} {"train_loss": -12.284082412719727, "global_step": 501518, "epoch": 2985} {"train_loss": -11.440435409545898, "global_step": 501519, "epoch": 2985} {"train_loss": -12.15206527709961, "global_step": 501520, "epoch": 2985} {"train_loss": -11.542304992675781, "global_step": 501521, "epoch": 2985} {"train_loss": -12.113080978393555, "global_step": 501522, "epoch": 2985} {"train_loss": -11.845307350158691, "global_step": 501523, "epoch": 2985} {"train_loss": -12.218145370483398, "global_step": 501524, "epoch": 2985} {"train_loss": -11.791202545166016, "global_step": 501525, "epoch": 2985} {"train_loss": -12.28930377960205, "global_step": 501526, "epoch": 2985} {"train_loss": -11.715686798095703, "global_step": 501527, "epoch": 2985} {"train_loss": -12.239166259765625, "global_step": 501528, "epoch": 2985} {"train_loss": -11.858661651611328, "global_step": 501529, "epoch": 2985} {"train_loss": -12.267477035522461, "global_step": 501530, "epoch": 2985} {"train_loss": -12.099858283996582, "global_step": 501531, "epoch": 2985} {"train_loss": -12.389204025268555, "global_step": 501532, "epoch": 2985} {"train_loss": -11.873872756958008, "global_step": 501533, "epoch": 2985} {"train_loss": -12.321626663208008, "global_step": 501534, "epoch": 2985} {"train_loss": -12.207639694213867, "global_step": 501535, "epoch": 2985} {"train_loss": -12.563519477844238, "global_step": 501536, "epoch": 2985} {"train_loss": -12.243847846984863, "global_step": 501537, "epoch": 2985} {"train_loss": -12.497227668762207, "global_step": 501538, "epoch": 2985} {"train_loss": -12.371109008789062, "global_step": 501539, "epoch": 2985} {"train_loss": -12.15449333190918, "global_step": 501540, "epoch": 2985} {"train_loss": -12.396329879760742, "global_step": 501541, "epoch": 2985} {"train_loss": -12.546442031860352, "global_step": 501542, "epoch": 2985} {"train_loss": -12.562845230102539, "global_step": 501543, "epoch": 2985} {"train_loss": -12.369001388549805, "global_step": 501544, "epoch": 2985} {"train_loss": -12.565899848937988, "global_step": 501545, "epoch": 2985} {"train_loss": -12.584880828857422, "global_step": 501546, "epoch": 2985} {"train_loss": -12.575998306274414, "global_step": 501547, "epoch": 2985} {"train_loss": -12.618476867675781, "global_step": 501548, "epoch": 2985} {"train_loss": -12.614550590515137, "global_step": 501549, "epoch": 2985} {"train_loss": -12.670608520507812, "global_step": 501550, "epoch": 2985} {"train_loss": -12.453643798828125, "global_step": 501551, "epoch": 2985} {"train_loss": -12.703024864196777, "global_step": 501552, "epoch": 2985} {"train_loss": -12.668770790100098, "global_step": 501553, "epoch": 2985} {"train_loss": -12.709216117858887, "global_step": 501554, "epoch": 2985} {"train_loss": -12.718530654907227, "global_step": 501555, "epoch": 2985} {"train_loss": -12.774372100830078, "global_step": 501556, "epoch": 2985} {"train_loss": -12.734127044677734, "global_step": 501557, "epoch": 2985} {"train_loss": -12.64992904663086, "global_step": 501558, "epoch": 2985} {"train_loss": -12.644537925720215, "global_step": 501559, "epoch": 2985} {"train_loss": -12.610062599182129, "global_step": 501560, "epoch": 2985} {"train_loss": -12.816230773925781, "global_step": 501561, "epoch": 2985} {"train_loss": -12.69880199432373, "global_step": 501562, "epoch": 2985} {"train_loss": -12.692789077758789, "global_step": 501563, "epoch": 2985} {"train_loss": -12.48952865600586, "global_step": 501564, "epoch": 2985} {"train_loss": -12.767047882080078, "global_step": 501565, "epoch": 2985} {"train_loss": -12.795571327209473, "global_step": 501566, "epoch": 2985} {"train_loss": -12.833498001098633, "global_step": 501567, "epoch": 2985} {"train_loss": -12.774490356445312, "global_step": 501568, "epoch": 2985} {"train_loss": -12.768651962280273, "global_step": 501569, "epoch": 2985} {"train_loss": -12.742324829101562, "global_step": 501570, "epoch": 2985} {"train_loss": -12.667217254638672, "global_step": 501571, "epoch": 2985} {"train_loss": -12.781705856323242, "global_step": 501572, "epoch": 2985} {"train_loss": -12.739066123962402, "global_step": 501573, "epoch": 2985} {"train_loss": -12.868003845214844, "global_step": 501574, "epoch": 2985} {"train_loss": -12.767182350158691, "global_step": 501575, "epoch": 2985} {"train_loss": -12.744972229003906, "global_step": 501576, "epoch": 2985} {"train_loss": -12.778484344482422, "global_step": 501577, "epoch": 2985} {"train_loss": -12.602385520935059, "global_step": 501578, "epoch": 2985} {"train_loss": -12.722299575805664, "global_step": 501579, "epoch": 2985} {"train_loss": -12.83771800994873, "global_step": 501580, "epoch": 2985} {"train_loss": -12.923013687133789, "global_step": 501581, "epoch": 2985} {"train_loss": -12.912723541259766, "global_step": 501582, "epoch": 2985} {"train_loss": -12.83692741394043, "global_step": 501583, "epoch": 2985} {"train_loss": -12.586801528930664, "global_step": 501584, "epoch": 2985} {"train_loss": -12.859724998474121, "global_step": 501585, "epoch": 2985} {"train_loss": -12.852299690246582, "global_step": 501586, "epoch": 2985} {"train_loss": -12.552915573120117, "global_step": 501587, "epoch": 2985} {"train_loss": -12.823539733886719, "global_step": 501588, "epoch": 2985} {"train_loss": -12.904233932495117, "global_step": 501589, "epoch": 2985} {"train_loss": -12.974889755249023, "global_step": 501590, "epoch": 2985} {"train_loss": -13.0015869140625, "global_step": 501591, "epoch": 2985} {"train_loss": -12.894662857055664, "global_step": 501592, "epoch": 2985} {"train_loss": -12.766233444213867, "global_step": 501593, "epoch": 2985} {"train_loss": -13.057775497436523, "global_step": 501594, "epoch": 2985} {"train_loss": -12.837057113647461, "global_step": 501595, "epoch": 2985} {"train_loss": -12.923667907714844, "global_step": 501596, "epoch": 2985} {"train_loss": -12.939144134521484, "global_step": 501597, "epoch": 2985} {"train_loss": -12.858785629272461, "global_step": 501598, "epoch": 2985} {"train_loss": -12.870155334472656, "global_step": 501599, "epoch": 2985} {"train_loss": -13.043330192565918, "global_step": 501600, "epoch": 2985} {"train_loss": -12.903905868530273, "global_step": 501601, "epoch": 2985} {"train_loss": -12.95413589477539, "global_step": 501602, "epoch": 2985} {"train_loss": -12.896139144897461, "global_step": 501603, "epoch": 2985} {"train_loss": -12.938709259033203, "global_step": 501604, "epoch": 2985} {"train_loss": -13.016645431518555, "global_step": 501605, "epoch": 2985} {"train_loss": -13.138282775878906, "global_step": 501606, "epoch": 2985} {"train_loss": -13.020182609558105, "global_step": 501607, "epoch": 2985} {"train_loss": -13.01793098449707, "global_step": 501608, "epoch": 2985} {"train_loss": -12.910723686218262, "global_step": 501609, "epoch": 2985} {"train_loss": -12.799534797668457, "global_step": 501610, "epoch": 2985} {"train_loss": -12.919012069702148, "global_step": 501611, "epoch": 2985} {"train_loss": -12.694355010986328, "global_step": 501612, "epoch": 2985} {"train_loss": -12.491024017333984, "global_step": 501613, "epoch": 2985} {"train_loss": -12.8046875, "global_step": 501614, "epoch": 2985} {"train_loss": -12.695585250854492, "global_step": 501615, "epoch": 2985} {"train_loss": -12.173828125, "global_step": 501616, "epoch": 2985} {"train_loss": -12.364925384521484, "global_step": 501617, "epoch": 2985} {"train_loss": -12.431374549865723, "global_step": 501618, "epoch": 2985} {"train_loss": -11.210708618164062, "global_step": 501619, "epoch": 2985} {"train_loss": -12.468660354614258, "global_step": 501620, "epoch": 2985} {"train_loss": -12.080246925354004, "global_step": 501621, "epoch": 2985} {"train_loss": -12.325465202331543, "global_step": 501622, "epoch": 2985} {"train_loss": -12.431995391845703, "global_step": 501623, "epoch": 2985} {"train_loss": -12.31976318359375, "global_step": 501624, "epoch": 2985} {"train_loss": -12.101466178894043, "global_step": 501625, "epoch": 2985} {"train_loss": -12.547578811645508, "global_step": 501626, "epoch": 2985} {"train_loss": -12.0358247756958, "global_step": 501627, "epoch": 2985} {"train_loss": -11.73896312713623, "global_step": 501628, "epoch": 2985} {"train_loss": -12.950201034545898, "global_step": 501629, "epoch": 2985} {"train_loss": -12.305503845214844, "global_step": 501630, "epoch": 2985} {"train_loss": -12.19495964050293, "global_step": 501631, "epoch": 2985} {"train_loss": -12.095540046691895, "global_step": 501632, "epoch": 2985} {"train_loss": -12.085975646972656, "global_step": 501633, "epoch": 2985} {"train_loss": -11.110284805297852, "global_step": 501634, "epoch": 2985} {"train_loss": -11.944811820983887, "global_step": 501635, "epoch": 2985} {"train_loss": -11.724157333374023, "global_step": 501636, "epoch": 2985} {"train_loss": -10.320581436157227, "global_step": 501637, "epoch": 2985} {"train_loss": -11.033675193786621, "global_step": 501638, "epoch": 2985} {"train_loss": -12.400793075561523, "global_step": 501639, "epoch": 2985} {"train_loss": -10.816455841064453, "global_step": 501640, "epoch": 2985} {"train_loss": -11.216999053955078, "global_step": 501641, "epoch": 2985} {"train_loss": -9.610973358154297, "global_step": 501642, "epoch": 2985} {"train_loss": -10.474174499511719, "global_step": 501643, "epoch": 2985} {"train_loss": -11.078371047973633, "global_step": 501644, "epoch": 2985} {"train_loss": -10.30527400970459, "global_step": 501645, "epoch": 2985} {"train_loss": -10.469045639038086, "global_step": 501646, "epoch": 2985} {"train_loss": -12.0611781279246, "global_step": 501647, "epoch": 2985, "val_loss": 320407.4375, "train_action_mse_error": 0.22931121289730072} {"train_loss": -8.252054214477539, "global_step": 501648, "epoch": 2986} {"train_loss": -9.607088088989258, "global_step": 501649, "epoch": 2986} {"train_loss": -10.091926574707031, "global_step": 501650, "epoch": 2986} {"train_loss": -11.32359504699707, "global_step": 501651, "epoch": 2986} {"train_loss": -10.742992401123047, "global_step": 501652, "epoch": 2986} {"train_loss": -10.50918960571289, "global_step": 501653, "epoch": 2986} {"train_loss": -10.444091796875, "global_step": 501654, "epoch": 2986} {"train_loss": -10.407089233398438, "global_step": 501655, "epoch": 2986} {"train_loss": -11.196855545043945, "global_step": 501656, "epoch": 2986} {"train_loss": -11.577893257141113, "global_step": 501657, "epoch": 2986} {"train_loss": -11.161397933959961, "global_step": 501658, "epoch": 2986} {"train_loss": -10.793838500976562, "global_step": 501659, "epoch": 2986} {"train_loss": -11.621893882751465, "global_step": 501660, "epoch": 2986} {"train_loss": -10.88207721710205, "global_step": 501661, "epoch": 2986} {"train_loss": -11.764264106750488, "global_step": 501662, "epoch": 2986} {"train_loss": -11.948750495910645, "global_step": 501663, "epoch": 2986} {"train_loss": -11.54842758178711, "global_step": 501664, "epoch": 2986} {"train_loss": -12.11855411529541, "global_step": 501665, "epoch": 2986} {"train_loss": -11.406885147094727, "global_step": 501666, "epoch": 2986} {"train_loss": -11.872086524963379, "global_step": 501667, "epoch": 2986} {"train_loss": -11.467449188232422, "global_step": 501668, "epoch": 2986} {"train_loss": -10.993032455444336, "global_step": 501669, "epoch": 2986} {"train_loss": -11.04068660736084, "global_step": 501670, "epoch": 2986} {"train_loss": -11.630234718322754, "global_step": 501671, "epoch": 2986} {"train_loss": -11.692389488220215, "global_step": 501672, "epoch": 2986} {"train_loss": -12.162473678588867, "global_step": 501673, "epoch": 2986} {"train_loss": -11.570175170898438, "global_step": 501674, "epoch": 2986} {"train_loss": -12.19066047668457, "global_step": 501675, "epoch": 2986} {"train_loss": -11.788551330566406, "global_step": 501676, "epoch": 2986} {"train_loss": -12.236757278442383, "global_step": 501677, "epoch": 2986} {"train_loss": -11.736360549926758, "global_step": 501678, "epoch": 2986} {"train_loss": -12.425910949707031, "global_step": 501679, "epoch": 2986} {"train_loss": -12.160713195800781, "global_step": 501680, "epoch": 2986} {"train_loss": -12.289020538330078, "global_step": 501681, "epoch": 2986} {"train_loss": -12.264135360717773, "global_step": 501682, "epoch": 2986} {"train_loss": -12.366908073425293, "global_step": 501683, "epoch": 2986} {"train_loss": -12.1473388671875, "global_step": 501684, "epoch": 2986} {"train_loss": -12.48420238494873, "global_step": 501685, "epoch": 2986} {"train_loss": -11.986560821533203, "global_step": 501686, "epoch": 2986} {"train_loss": -12.448410034179688, "global_step": 501687, "epoch": 2986} {"train_loss": -12.256385803222656, "global_step": 501688, "epoch": 2986} {"train_loss": -12.4628324508667, "global_step": 501689, "epoch": 2986} {"train_loss": -12.284547805786133, "global_step": 501690, "epoch": 2986} {"train_loss": -12.233781814575195, "global_step": 501691, "epoch": 2986} {"train_loss": -12.319846153259277, "global_step": 501692, "epoch": 2986} {"train_loss": -11.908140182495117, "global_step": 501693, "epoch": 2986} {"train_loss": -12.520228385925293, "global_step": 501694, "epoch": 2986} {"train_loss": -12.209693908691406, "global_step": 501695, "epoch": 2986} {"train_loss": -12.3506498336792, "global_step": 501696, "epoch": 2986} {"train_loss": -12.025943756103516, "global_step": 501697, "epoch": 2986} {"train_loss": -11.449040412902832, "global_step": 501698, "epoch": 2986} {"train_loss": -11.960575103759766, "global_step": 501699, "epoch": 2986} {"train_loss": -11.449735641479492, "global_step": 501700, "epoch": 2986} {"train_loss": -12.18922233581543, "global_step": 501701, "epoch": 2986} {"train_loss": -11.628117561340332, "global_step": 501702, "epoch": 2986} {"train_loss": -11.899797439575195, "global_step": 501703, "epoch": 2986} {"train_loss": -12.062536239624023, "global_step": 501704, "epoch": 2986} {"train_loss": -11.67819595336914, "global_step": 501705, "epoch": 2986} {"train_loss": -12.31273365020752, "global_step": 501706, "epoch": 2986} {"train_loss": -11.404212951660156, "global_step": 501707, "epoch": 2986} {"train_loss": -11.696239471435547, "global_step": 501708, "epoch": 2986} {"train_loss": -11.594202041625977, "global_step": 501709, "epoch": 2986} {"train_loss": -11.802695274353027, "global_step": 501710, "epoch": 2986} {"train_loss": -12.42602825164795, "global_step": 501711, "epoch": 2986} {"train_loss": -12.328907012939453, "global_step": 501712, "epoch": 2986} {"train_loss": -12.171277046203613, "global_step": 501713, "epoch": 2986} {"train_loss": -12.26722240447998, "global_step": 501714, "epoch": 2986} {"train_loss": -11.968460083007812, "global_step": 501715, "epoch": 2986} {"train_loss": -12.48340892791748, "global_step": 501716, "epoch": 2986} {"train_loss": -12.346760749816895, "global_step": 501717, "epoch": 2986} {"train_loss": -12.533485412597656, "global_step": 501718, "epoch": 2986} {"train_loss": -12.217666625976562, "global_step": 501719, "epoch": 2986} {"train_loss": -12.671882629394531, "global_step": 501720, "epoch": 2986} {"train_loss": -12.199636459350586, "global_step": 501721, "epoch": 2986} {"train_loss": -12.552061080932617, "global_step": 501722, "epoch": 2986} {"train_loss": -12.424930572509766, "global_step": 501723, "epoch": 2986} {"train_loss": -12.459407806396484, "global_step": 501724, "epoch": 2986} {"train_loss": -12.691869735717773, "global_step": 501725, "epoch": 2986} {"train_loss": -12.465827941894531, "global_step": 501726, "epoch": 2986} {"train_loss": -12.458146095275879, "global_step": 501727, "epoch": 2986} {"train_loss": -12.148365020751953, "global_step": 501728, "epoch": 2986} {"train_loss": -12.496747970581055, "global_step": 501729, "epoch": 2986} {"train_loss": -12.093748092651367, "global_step": 501730, "epoch": 2986} {"train_loss": -12.466873168945312, "global_step": 501731, "epoch": 2986} {"train_loss": -12.141610145568848, "global_step": 501732, "epoch": 2986} {"train_loss": -12.207138061523438, "global_step": 501733, "epoch": 2986} {"train_loss": -11.89603042602539, "global_step": 501734, "epoch": 2986} {"train_loss": -12.125561714172363, "global_step": 501735, "epoch": 2986} {"train_loss": -12.323884963989258, "global_step": 501736, "epoch": 2986} {"train_loss": -12.398347854614258, "global_step": 501737, "epoch": 2986} {"train_loss": -12.356647491455078, "global_step": 501738, "epoch": 2986} {"train_loss": -12.358709335327148, "global_step": 501739, "epoch": 2986} {"train_loss": -12.272729873657227, "global_step": 501740, "epoch": 2986} {"train_loss": -12.461370468139648, "global_step": 501741, "epoch": 2986} {"train_loss": -12.29060173034668, "global_step": 501742, "epoch": 2986} {"train_loss": -12.599760055541992, "global_step": 501743, "epoch": 2986} {"train_loss": -12.204343795776367, "global_step": 501744, "epoch": 2986} {"train_loss": -12.814889907836914, "global_step": 501745, "epoch": 2986} {"train_loss": -12.465710639953613, "global_step": 501746, "epoch": 2986} {"train_loss": -12.6806058883667, "global_step": 501747, "epoch": 2986} {"train_loss": -12.460733413696289, "global_step": 501748, "epoch": 2986} {"train_loss": -12.390941619873047, "global_step": 501749, "epoch": 2986} {"train_loss": -12.239808082580566, "global_step": 501750, "epoch": 2986} {"train_loss": -11.980447769165039, "global_step": 501751, "epoch": 2986} {"train_loss": -12.703222274780273, "global_step": 501752, "epoch": 2986} {"train_loss": -12.014259338378906, "global_step": 501753, "epoch": 2986} {"train_loss": -12.743281364440918, "global_step": 501754, "epoch": 2986} {"train_loss": -12.358627319335938, "global_step": 501755, "epoch": 2986} {"train_loss": -12.552318572998047, "global_step": 501756, "epoch": 2986} {"train_loss": -12.540855407714844, "global_step": 501757, "epoch": 2986} {"train_loss": -12.454948425292969, "global_step": 501758, "epoch": 2986} {"train_loss": -12.761561393737793, "global_step": 501759, "epoch": 2986} {"train_loss": -12.241352081298828, "global_step": 501760, "epoch": 2986} {"train_loss": -12.723374366760254, "global_step": 501761, "epoch": 2986} {"train_loss": -12.579530715942383, "global_step": 501762, "epoch": 2986} {"train_loss": -12.606864929199219, "global_step": 501763, "epoch": 2986} {"train_loss": -12.648687362670898, "global_step": 501764, "epoch": 2986} {"train_loss": -12.745819091796875, "global_step": 501765, "epoch": 2986} {"train_loss": -12.666099548339844, "global_step": 501766, "epoch": 2986} {"train_loss": -12.439045906066895, "global_step": 501767, "epoch": 2986} {"train_loss": -12.618505477905273, "global_step": 501768, "epoch": 2986} {"train_loss": -12.63174819946289, "global_step": 501769, "epoch": 2986} {"train_loss": -12.441179275512695, "global_step": 501770, "epoch": 2986} {"train_loss": -12.823884963989258, "global_step": 501771, "epoch": 2986} {"train_loss": -12.394064903259277, "global_step": 501772, "epoch": 2986} {"train_loss": -12.15658187866211, "global_step": 501773, "epoch": 2986} {"train_loss": -12.701842308044434, "global_step": 501774, "epoch": 2986} {"train_loss": -12.791380882263184, "global_step": 501775, "epoch": 2986} {"train_loss": -12.870136260986328, "global_step": 501776, "epoch": 2986} {"train_loss": -12.6913480758667, "global_step": 501777, "epoch": 2986} {"train_loss": -12.532648086547852, "global_step": 501778, "epoch": 2986} {"train_loss": -12.820574760437012, "global_step": 501779, "epoch": 2986} {"train_loss": -12.752143859863281, "global_step": 501780, "epoch": 2986} {"train_loss": -12.725430488586426, "global_step": 501781, "epoch": 2986} {"train_loss": -12.871516227722168, "global_step": 501782, "epoch": 2986} {"train_loss": -12.222875595092773, "global_step": 501783, "epoch": 2986} {"train_loss": -12.681053161621094, "global_step": 501784, "epoch": 2986} {"train_loss": -12.807345390319824, "global_step": 501785, "epoch": 2986} {"train_loss": -12.129435539245605, "global_step": 501786, "epoch": 2986} {"train_loss": -12.62960433959961, "global_step": 501787, "epoch": 2986} {"train_loss": -12.543680191040039, "global_step": 501788, "epoch": 2986} {"train_loss": -12.422344207763672, "global_step": 501789, "epoch": 2986} {"train_loss": -12.780851364135742, "global_step": 501790, "epoch": 2986} {"train_loss": -12.578058242797852, "global_step": 501791, "epoch": 2986} {"train_loss": -12.626620292663574, "global_step": 501792, "epoch": 2986} {"train_loss": -12.553445816040039, "global_step": 501793, "epoch": 2986} {"train_loss": -12.061056137084961, "global_step": 501794, "epoch": 2986} {"train_loss": -12.472572326660156, "global_step": 501795, "epoch": 2986} {"train_loss": -12.595211029052734, "global_step": 501796, "epoch": 2986} {"train_loss": -11.725205421447754, "global_step": 501797, "epoch": 2986} {"train_loss": -12.676332473754883, "global_step": 501798, "epoch": 2986} {"train_loss": -12.559819221496582, "global_step": 501799, "epoch": 2986} {"train_loss": -12.373747825622559, "global_step": 501800, "epoch": 2986} {"train_loss": -12.523914337158203, "global_step": 501801, "epoch": 2986} {"train_loss": -12.603572845458984, "global_step": 501802, "epoch": 2986} {"train_loss": -11.78135871887207, "global_step": 501803, "epoch": 2986} {"train_loss": -11.964502334594727, "global_step": 501804, "epoch": 2986} {"train_loss": -12.692459106445312, "global_step": 501805, "epoch": 2986} {"train_loss": -12.656728744506836, "global_step": 501806, "epoch": 2986} {"train_loss": -12.567591667175293, "global_step": 501807, "epoch": 2986} {"train_loss": -12.465347290039062, "global_step": 501808, "epoch": 2986} {"train_loss": -12.818450927734375, "global_step": 501809, "epoch": 2986} {"train_loss": -12.621946334838867, "global_step": 501810, "epoch": 2986} {"train_loss": -12.788341522216797, "global_step": 501811, "epoch": 2986} {"train_loss": -12.727983474731445, "global_step": 501812, "epoch": 2986} {"train_loss": -12.988862991333008, "global_step": 501813, "epoch": 2986} {"train_loss": -12.78093147277832, "global_step": 501814, "epoch": 2986} {"train_loss": -12.166137757755461, "global_step": 501815, "epoch": 2986, "val_loss": 321879.3125} {"train_loss": -12.731880187988281, "global_step": 501816, "epoch": 2987} {"train_loss": -12.526348114013672, "global_step": 501817, "epoch": 2987} {"train_loss": -12.241642951965332, "global_step": 501818, "epoch": 2987} {"train_loss": -12.633056640625, "global_step": 501819, "epoch": 2987} {"train_loss": -12.049365043640137, "global_step": 501820, "epoch": 2987} {"train_loss": -12.115240097045898, "global_step": 501821, "epoch": 2987} {"train_loss": -12.324813842773438, "global_step": 501822, "epoch": 2987} {"train_loss": -12.222135543823242, "global_step": 501823, "epoch": 2987} {"train_loss": -11.846298217773438, "global_step": 501824, "epoch": 2987} {"train_loss": -12.63302230834961, "global_step": 501825, "epoch": 2987} {"train_loss": -11.962800979614258, "global_step": 501826, "epoch": 2987} {"train_loss": -12.512077331542969, "global_step": 501827, "epoch": 2987} {"train_loss": -12.085809707641602, "global_step": 501828, "epoch": 2987} {"train_loss": -12.480067253112793, "global_step": 501829, "epoch": 2987} {"train_loss": -12.265939712524414, "global_step": 501830, "epoch": 2987} {"train_loss": -12.735298156738281, "global_step": 501831, "epoch": 2987} {"train_loss": -11.940278053283691, "global_step": 501832, "epoch": 2987} {"train_loss": -11.588536262512207, "global_step": 501833, "epoch": 2987} {"train_loss": -12.587554931640625, "global_step": 501834, "epoch": 2987} {"train_loss": -11.291729927062988, "global_step": 501835, "epoch": 2987} {"train_loss": -11.622686386108398, "global_step": 501836, "epoch": 2987} {"train_loss": -12.308137893676758, "global_step": 501837, "epoch": 2987} {"train_loss": -11.266514778137207, "global_step": 501838, "epoch": 2987} {"train_loss": -12.488107681274414, "global_step": 501839, "epoch": 2987} {"train_loss": -10.932246208190918, "global_step": 501840, "epoch": 2987} {"train_loss": -11.63369369506836, "global_step": 501841, "epoch": 2987} {"train_loss": -11.411888122558594, "global_step": 501842, "epoch": 2987} {"train_loss": -10.238683700561523, "global_step": 501843, "epoch": 2987} {"train_loss": -10.772315979003906, "global_step": 501844, "epoch": 2987} {"train_loss": -10.894963264465332, "global_step": 501845, "epoch": 2987} {"train_loss": -11.179178237915039, "global_step": 501846, "epoch": 2987} {"train_loss": -9.549067497253418, "global_step": 501847, "epoch": 2987} {"train_loss": -11.232152938842773, "global_step": 501848, "epoch": 2987} {"train_loss": -8.967340469360352, "global_step": 501849, "epoch": 2987} {"train_loss": -9.306310653686523, "global_step": 501850, "epoch": 2987} {"train_loss": -10.31863784790039, "global_step": 501851, "epoch": 2987} {"train_loss": -9.896055221557617, "global_step": 501852, "epoch": 2987} {"train_loss": -10.663639068603516, "global_step": 501853, "epoch": 2987} {"train_loss": -9.478221893310547, "global_step": 501854, "epoch": 2987} {"train_loss": -10.687122344970703, "global_step": 501855, "epoch": 2987} {"train_loss": -10.784794807434082, "global_step": 501856, "epoch": 2987} {"train_loss": -10.646943092346191, "global_step": 501857, "epoch": 2987} {"train_loss": -11.383532524108887, "global_step": 501858, "epoch": 2987} {"train_loss": -11.633050918579102, "global_step": 501859, "epoch": 2987} {"train_loss": -10.893838882446289, "global_step": 501860, "epoch": 2987} {"train_loss": -11.347941398620605, "global_step": 501861, "epoch": 2987} {"train_loss": -11.141823768615723, "global_step": 501862, "epoch": 2987} {"train_loss": -11.32908821105957, "global_step": 501863, "epoch": 2987} {"train_loss": -10.566909790039062, "global_step": 501864, "epoch": 2987} {"train_loss": -11.173942565917969, "global_step": 501865, "epoch": 2987} {"train_loss": -11.219317436218262, "global_step": 501866, "epoch": 2987} {"train_loss": -12.007949829101562, "global_step": 501867, "epoch": 2987} {"train_loss": -11.200300216674805, "global_step": 501868, "epoch": 2987} {"train_loss": -12.215071678161621, "global_step": 501869, "epoch": 2987} {"train_loss": -11.422334671020508, "global_step": 501870, "epoch": 2987} {"train_loss": -12.100912094116211, "global_step": 501871, "epoch": 2987} {"train_loss": -11.45645523071289, "global_step": 501872, "epoch": 2987} {"train_loss": -11.554593086242676, "global_step": 501873, "epoch": 2987} {"train_loss": -12.138492584228516, "global_step": 501874, "epoch": 2987} {"train_loss": -11.231467247009277, "global_step": 501875, "epoch": 2987} {"train_loss": -12.121379852294922, "global_step": 501876, "epoch": 2987} {"train_loss": -10.871944427490234, "global_step": 501877, "epoch": 2987} {"train_loss": -12.20586109161377, "global_step": 501878, "epoch": 2987} {"train_loss": -11.1731595993042, "global_step": 501879, "epoch": 2987} {"train_loss": -12.14570426940918, "global_step": 501880, "epoch": 2987} {"train_loss": -11.695473670959473, "global_step": 501881, "epoch": 2987} {"train_loss": -12.274032592773438, "global_step": 501882, "epoch": 2987} {"train_loss": -12.014512062072754, "global_step": 501883, "epoch": 2987} {"train_loss": -11.751154899597168, "global_step": 501884, "epoch": 2987} {"train_loss": -12.247249603271484, "global_step": 501885, "epoch": 2987} {"train_loss": -12.109696388244629, "global_step": 501886, "epoch": 2987} {"train_loss": -12.165748596191406, "global_step": 501887, "epoch": 2987} {"train_loss": -12.26330280303955, "global_step": 501888, "epoch": 2987} {"train_loss": -12.416487693786621, "global_step": 501889, "epoch": 2987} {"train_loss": -12.132232666015625, "global_step": 501890, "epoch": 2987} {"train_loss": -12.37092399597168, "global_step": 501891, "epoch": 2987} {"train_loss": -11.970531463623047, "global_step": 501892, "epoch": 2987} {"train_loss": -12.476390838623047, "global_step": 501893, "epoch": 2987} {"train_loss": -12.50350284576416, "global_step": 501894, "epoch": 2987} {"train_loss": -12.48076343536377, "global_step": 501895, "epoch": 2987} {"train_loss": -12.496907234191895, "global_step": 501896, "epoch": 2987} {"train_loss": -12.361627578735352, "global_step": 501897, "epoch": 2987} {"train_loss": -12.657499313354492, "global_step": 501898, "epoch": 2987} {"train_loss": -12.259162902832031, "global_step": 501899, "epoch": 2987} {"train_loss": -12.663012504577637, "global_step": 501900, "epoch": 2987} {"train_loss": -12.655854225158691, "global_step": 501901, "epoch": 2987} {"train_loss": -12.594510078430176, "global_step": 501902, "epoch": 2987} {"train_loss": -12.767950057983398, "global_step": 501903, "epoch": 2987} {"train_loss": -12.589435577392578, "global_step": 501904, "epoch": 2987} {"train_loss": -12.662555694580078, "global_step": 501905, "epoch": 2987} {"train_loss": -12.544364929199219, "global_step": 501906, "epoch": 2987} {"train_loss": -12.464582443237305, "global_step": 501907, "epoch": 2987} {"train_loss": -12.433558464050293, "global_step": 501908, "epoch": 2987} {"train_loss": -12.731988906860352, "global_step": 501909, "epoch": 2987} {"train_loss": -12.746856689453125, "global_step": 501910, "epoch": 2987} {"train_loss": -12.484745025634766, "global_step": 501911, "epoch": 2987} {"train_loss": -12.664745330810547, "global_step": 501912, "epoch": 2987} {"train_loss": -12.648244857788086, "global_step": 501913, "epoch": 2987} {"train_loss": -12.714975357055664, "global_step": 501914, "epoch": 2987} {"train_loss": -12.38009262084961, "global_step": 501915, "epoch": 2987} {"train_loss": -12.419904708862305, "global_step": 501916, "epoch": 2987} {"train_loss": -12.715831756591797, "global_step": 501917, "epoch": 2987} {"train_loss": -12.719017028808594, "global_step": 501918, "epoch": 2987} {"train_loss": -12.80972671508789, "global_step": 501919, "epoch": 2987} {"train_loss": -12.821836471557617, "global_step": 501920, "epoch": 2987} {"train_loss": -12.777427673339844, "global_step": 501921, "epoch": 2987} {"train_loss": -12.848367691040039, "global_step": 501922, "epoch": 2987} {"train_loss": -12.827655792236328, "global_step": 501923, "epoch": 2987} {"train_loss": -12.77282428741455, "global_step": 501924, "epoch": 2987} {"train_loss": -12.78681755065918, "global_step": 501925, "epoch": 2987} {"train_loss": -12.667407989501953, "global_step": 501926, "epoch": 2987} {"train_loss": -12.946907997131348, "global_step": 501927, "epoch": 2987} {"train_loss": -12.830490112304688, "global_step": 501928, "epoch": 2987} {"train_loss": -12.678828239440918, "global_step": 501929, "epoch": 2987} {"train_loss": -12.940414428710938, "global_step": 501930, "epoch": 2987} {"train_loss": -12.893394470214844, "global_step": 501931, "epoch": 2987} {"train_loss": -12.949968338012695, "global_step": 501932, "epoch": 2987} {"train_loss": -12.817194938659668, "global_step": 501933, "epoch": 2987} {"train_loss": -12.54454231262207, "global_step": 501934, "epoch": 2987} {"train_loss": -12.688554763793945, "global_step": 501935, "epoch": 2987} {"train_loss": -13.035722732543945, "global_step": 501936, "epoch": 2987} {"train_loss": -12.966255187988281, "global_step": 501937, "epoch": 2987} {"train_loss": -12.627057075500488, "global_step": 501938, "epoch": 2987} {"train_loss": -12.905192375183105, "global_step": 501939, "epoch": 2987} {"train_loss": -12.722877502441406, "global_step": 501940, "epoch": 2987} {"train_loss": -12.672837257385254, "global_step": 501941, "epoch": 2987} {"train_loss": -13.080039024353027, "global_step": 501942, "epoch": 2987} {"train_loss": -12.849347114562988, "global_step": 501943, "epoch": 2987} {"train_loss": -12.619117736816406, "global_step": 501944, "epoch": 2987} {"train_loss": -12.817227363586426, "global_step": 501945, "epoch": 2987} {"train_loss": -12.812435150146484, "global_step": 501946, "epoch": 2987} {"train_loss": -12.402457237243652, "global_step": 501947, "epoch": 2987} {"train_loss": -11.51392936706543, "global_step": 501948, "epoch": 2987} {"train_loss": -11.429194450378418, "global_step": 501949, "epoch": 2987} {"train_loss": -12.0469970703125, "global_step": 501950, "epoch": 2987} {"train_loss": -12.423959732055664, "global_step": 501951, "epoch": 2987} {"train_loss": -10.61897087097168, "global_step": 501952, "epoch": 2987} {"train_loss": -11.415910720825195, "global_step": 501953, "epoch": 2987} {"train_loss": -12.333588600158691, "global_step": 501954, "epoch": 2987} {"train_loss": -10.44266414642334, "global_step": 501955, "epoch": 2987} {"train_loss": -10.825796127319336, "global_step": 501956, "epoch": 2987} {"train_loss": -12.154703140258789, "global_step": 501957, "epoch": 2987} {"train_loss": -9.027572631835938, "global_step": 501958, "epoch": 2987} {"train_loss": -9.078941345214844, "global_step": 501959, "epoch": 2987} {"train_loss": -10.928926467895508, "global_step": 501960, "epoch": 2987} {"train_loss": -10.819711685180664, "global_step": 501961, "epoch": 2987} {"train_loss": -9.567913055419922, "global_step": 501962, "epoch": 2987} {"train_loss": -11.084442138671875, "global_step": 501963, "epoch": 2987} {"train_loss": -10.269533157348633, "global_step": 501964, "epoch": 2987} {"train_loss": -9.439846992492676, "global_step": 501965, "epoch": 2987} {"train_loss": -11.250938415527344, "global_step": 501966, "epoch": 2987} {"train_loss": -8.78550910949707, "global_step": 501967, "epoch": 2987} {"train_loss": -11.882790565490723, "global_step": 501968, "epoch": 2987} {"train_loss": -8.806905746459961, "global_step": 501969, "epoch": 2987} {"train_loss": -11.125582695007324, "global_step": 501970, "epoch": 2987} {"train_loss": -11.572619438171387, "global_step": 501971, "epoch": 2987} {"train_loss": -10.473840713500977, "global_step": 501972, "epoch": 2987} {"train_loss": -12.208457946777344, "global_step": 501973, "epoch": 2987} {"train_loss": -10.708386421203613, "global_step": 501974, "epoch": 2987} {"train_loss": -11.964944839477539, "global_step": 501975, "epoch": 2987} {"train_loss": -10.736848831176758, "global_step": 501976, "epoch": 2987} {"train_loss": -11.472021102905273, "global_step": 501977, "epoch": 2987} {"train_loss": -11.871374130249023, "global_step": 501978, "epoch": 2987} {"train_loss": -11.837498664855957, "global_step": 501979, "epoch": 2987} {"train_loss": -11.270995140075684, "global_step": 501980, "epoch": 2987} {"train_loss": -11.41822624206543, "global_step": 501981, "epoch": 2987} {"train_loss": -11.238784790039062, "global_step": 501982, "epoch": 2987} {"train_loss": -11.80754574139913, "global_step": 501983, "epoch": 2987, "val_loss": 313117.125} {"train_loss": -11.725435256958008, "global_step": 501984, "epoch": 2988} {"train_loss": -10.656173706054688, "global_step": 501985, "epoch": 2988} {"train_loss": -11.518196105957031, "global_step": 501986, "epoch": 2988} {"train_loss": -10.894878387451172, "global_step": 501987, "epoch": 2988} {"train_loss": -10.254318237304688, "global_step": 501988, "epoch": 2988} {"train_loss": -11.698850631713867, "global_step": 501989, "epoch": 2988} {"train_loss": -11.151287078857422, "global_step": 501990, "epoch": 2988} {"train_loss": -10.329230308532715, "global_step": 501991, "epoch": 2988} {"train_loss": -11.646303176879883, "global_step": 501992, "epoch": 2988} {"train_loss": -10.579115867614746, "global_step": 501993, "epoch": 2988} {"train_loss": -11.473526954650879, "global_step": 501994, "epoch": 2988} {"train_loss": -12.191688537597656, "global_step": 501995, "epoch": 2988} {"train_loss": -11.410846710205078, "global_step": 501996, "epoch": 2988} {"train_loss": -11.976439476013184, "global_step": 501997, "epoch": 2988} {"train_loss": -11.249351501464844, "global_step": 501998, "epoch": 2988} {"train_loss": -11.943903923034668, "global_step": 501999, "epoch": 2988} {"train_loss": -11.874042510986328, "global_step": 502000, "epoch": 2988} {"train_loss": -12.185693740844727, "global_step": 502001, "epoch": 2988} {"train_loss": -12.111116409301758, "global_step": 502002, "epoch": 2988} {"train_loss": -11.978989601135254, "global_step": 502003, "epoch": 2988} {"train_loss": -12.476919174194336, "global_step": 502004, "epoch": 2988} {"train_loss": -11.889537811279297, "global_step": 502005, "epoch": 2988} {"train_loss": -11.9931001663208, "global_step": 502006, "epoch": 2988} {"train_loss": -12.144527435302734, "global_step": 502007, "epoch": 2988} {"train_loss": -11.94002628326416, "global_step": 502008, "epoch": 2988} {"train_loss": -12.166845321655273, "global_step": 502009, "epoch": 2988} {"train_loss": -12.091597557067871, "global_step": 502010, "epoch": 2988} {"train_loss": -12.332411766052246, "global_step": 502011, "epoch": 2988} {"train_loss": -12.099183082580566, "global_step": 502012, "epoch": 2988} {"train_loss": -12.378296852111816, "global_step": 502013, "epoch": 2988} {"train_loss": -12.329081535339355, "global_step": 502014, "epoch": 2988} {"train_loss": -12.25550651550293, "global_step": 502015, "epoch": 2988} {"train_loss": -12.166893005371094, "global_step": 502016, "epoch": 2988} {"train_loss": -12.523126602172852, "global_step": 502017, "epoch": 2988} {"train_loss": -12.221946716308594, "global_step": 502018, "epoch": 2988} {"train_loss": -12.57142448425293, "global_step": 502019, "epoch": 2988} {"train_loss": -12.48680591583252, "global_step": 502020, "epoch": 2988} {"train_loss": -12.448738098144531, "global_step": 502021, "epoch": 2988} {"train_loss": -12.569881439208984, "global_step": 502022, "epoch": 2988} {"train_loss": -12.575906753540039, "global_step": 502023, "epoch": 2988} {"train_loss": -12.713372230529785, "global_step": 502024, "epoch": 2988} {"train_loss": -12.595684051513672, "global_step": 502025, "epoch": 2988} {"train_loss": -12.53718376159668, "global_step": 502026, "epoch": 2988} {"train_loss": -12.726974487304688, "global_step": 502027, "epoch": 2988} {"train_loss": -12.760807991027832, "global_step": 502028, "epoch": 2988} {"train_loss": -12.357519149780273, "global_step": 502029, "epoch": 2988} {"train_loss": -12.585691452026367, "global_step": 502030, "epoch": 2988} {"train_loss": -12.324047088623047, "global_step": 502031, "epoch": 2988} {"train_loss": -12.554386138916016, "global_step": 502032, "epoch": 2988} {"train_loss": -12.746403694152832, "global_step": 502033, "epoch": 2988} {"train_loss": -12.417915344238281, "global_step": 502034, "epoch": 2988} {"train_loss": -12.624164581298828, "global_step": 502035, "epoch": 2988} {"train_loss": -12.432196617126465, "global_step": 502036, "epoch": 2988} {"train_loss": -12.63195514678955, "global_step": 502037, "epoch": 2988} {"train_loss": -12.420255661010742, "global_step": 502038, "epoch": 2988} {"train_loss": -12.788224220275879, "global_step": 502039, "epoch": 2988} {"train_loss": -12.559863090515137, "global_step": 502040, "epoch": 2988} {"train_loss": -12.637663841247559, "global_step": 502041, "epoch": 2988} {"train_loss": -12.730388641357422, "global_step": 502042, "epoch": 2988} {"train_loss": -12.272703170776367, "global_step": 502043, "epoch": 2988} {"train_loss": -12.903999328613281, "global_step": 502044, "epoch": 2988} {"train_loss": -12.421825408935547, "global_step": 502045, "epoch": 2988} {"train_loss": -12.732946395874023, "global_step": 502046, "epoch": 2988} {"train_loss": -12.528877258300781, "global_step": 502047, "epoch": 2988} {"train_loss": -12.785301208496094, "global_step": 502048, "epoch": 2988} {"train_loss": -12.643068313598633, "global_step": 502049, "epoch": 2988} {"train_loss": -12.752593040466309, "global_step": 502050, "epoch": 2988} {"train_loss": -12.88853645324707, "global_step": 502051, "epoch": 2988} {"train_loss": -12.476234436035156, "global_step": 502052, "epoch": 2988} {"train_loss": -12.984039306640625, "global_step": 502053, "epoch": 2988} {"train_loss": -12.640039443969727, "global_step": 502054, "epoch": 2988} {"train_loss": -12.768047332763672, "global_step": 502055, "epoch": 2988} {"train_loss": -12.7117280960083, "global_step": 502056, "epoch": 2988} {"train_loss": -12.945082664489746, "global_step": 502057, "epoch": 2988} {"train_loss": -12.727262496948242, "global_step": 502058, "epoch": 2988} {"train_loss": -12.670047760009766, "global_step": 502059, "epoch": 2988} {"train_loss": -12.729578018188477, "global_step": 502060, "epoch": 2988} {"train_loss": -12.79188346862793, "global_step": 502061, "epoch": 2988} {"train_loss": -12.811155319213867, "global_step": 502062, "epoch": 2988} {"train_loss": -12.663480758666992, "global_step": 502063, "epoch": 2988} {"train_loss": -12.84608268737793, "global_step": 502064, "epoch": 2988} {"train_loss": -12.744285583496094, "global_step": 502065, "epoch": 2988} {"train_loss": -12.939435958862305, "global_step": 502066, "epoch": 2988} {"train_loss": -12.87502670288086, "global_step": 502067, "epoch": 2988} {"train_loss": -12.968968391418457, "global_step": 502068, "epoch": 2988} {"train_loss": -12.92390251159668, "global_step": 502069, "epoch": 2988} {"train_loss": -12.897275924682617, "global_step": 502070, "epoch": 2988} {"train_loss": -12.83981704711914, "global_step": 502071, "epoch": 2988} {"train_loss": -12.950937271118164, "global_step": 502072, "epoch": 2988} {"train_loss": -12.972219467163086, "global_step": 502073, "epoch": 2988} {"train_loss": -12.670772552490234, "global_step": 502074, "epoch": 2988} {"train_loss": -13.004688262939453, "global_step": 502075, "epoch": 2988} {"train_loss": -13.044553756713867, "global_step": 502076, "epoch": 2988} {"train_loss": -13.023574829101562, "global_step": 502077, "epoch": 2988} {"train_loss": -12.860599517822266, "global_step": 502078, "epoch": 2988} {"train_loss": -13.046122550964355, "global_step": 502079, "epoch": 2988} {"train_loss": -12.83370590209961, "global_step": 502080, "epoch": 2988} {"train_loss": -12.884881973266602, "global_step": 502081, "epoch": 2988} {"train_loss": -13.081653594970703, "global_step": 502082, "epoch": 2988} {"train_loss": -12.92894458770752, "global_step": 502083, "epoch": 2988} {"train_loss": -12.721089363098145, "global_step": 502084, "epoch": 2988} {"train_loss": -12.883874893188477, "global_step": 502085, "epoch": 2988} {"train_loss": -12.900653839111328, "global_step": 502086, "epoch": 2988} {"train_loss": -12.874795913696289, "global_step": 502087, "epoch": 2988} {"train_loss": -12.99905776977539, "global_step": 502088, "epoch": 2988} {"train_loss": -12.992897033691406, "global_step": 502089, "epoch": 2988} {"train_loss": -12.840790748596191, "global_step": 502090, "epoch": 2988} {"train_loss": -12.645048141479492, "global_step": 502091, "epoch": 2988} {"train_loss": -12.776552200317383, "global_step": 502092, "epoch": 2988} {"train_loss": -12.331626892089844, "global_step": 502093, "epoch": 2988} {"train_loss": -13.047920227050781, "global_step": 502094, "epoch": 2988} {"train_loss": -12.257840156555176, "global_step": 502095, "epoch": 2988} {"train_loss": -11.877284049987793, "global_step": 502096, "epoch": 2988} {"train_loss": -12.826009750366211, "global_step": 502097, "epoch": 2988} {"train_loss": -12.083610534667969, "global_step": 502098, "epoch": 2988} {"train_loss": -11.583292007446289, "global_step": 502099, "epoch": 2988} {"train_loss": -12.792513847351074, "global_step": 502100, "epoch": 2988} {"train_loss": -12.534406661987305, "global_step": 502101, "epoch": 2988} {"train_loss": -12.739524841308594, "global_step": 502102, "epoch": 2988} {"train_loss": -12.763870239257812, "global_step": 502103, "epoch": 2988} {"train_loss": -12.781947135925293, "global_step": 502104, "epoch": 2988} {"train_loss": -12.456476211547852, "global_step": 502105, "epoch": 2988} {"train_loss": -12.190231323242188, "global_step": 502106, "epoch": 2988} {"train_loss": -12.691886901855469, "global_step": 502107, "epoch": 2988} {"train_loss": -12.516437530517578, "global_step": 502108, "epoch": 2988} {"train_loss": -12.187633514404297, "global_step": 502109, "epoch": 2988} {"train_loss": -11.598220825195312, "global_step": 502110, "epoch": 2988} {"train_loss": -11.403849601745605, "global_step": 502111, "epoch": 2988} {"train_loss": -11.264787673950195, "global_step": 502112, "epoch": 2988} {"train_loss": -11.827340126037598, "global_step": 502113, "epoch": 2988} {"train_loss": -10.714984893798828, "global_step": 502114, "epoch": 2988} {"train_loss": -10.658683776855469, "global_step": 502115, "epoch": 2988} {"train_loss": -9.149059295654297, "global_step": 502116, "epoch": 2988} {"train_loss": -11.081914901733398, "global_step": 502117, "epoch": 2988} {"train_loss": -9.229242324829102, "global_step": 502118, "epoch": 2988} {"train_loss": -9.42570972442627, "global_step": 502119, "epoch": 2988} {"train_loss": -9.796215057373047, "global_step": 502120, "epoch": 2988} {"train_loss": -9.112668991088867, "global_step": 502121, "epoch": 2988} {"train_loss": -11.183300018310547, "global_step": 502122, "epoch": 2988} {"train_loss": -8.887199401855469, "global_step": 502123, "epoch": 2988} {"train_loss": -8.922024726867676, "global_step": 502124, "epoch": 2988} {"train_loss": -10.950211524963379, "global_step": 502125, "epoch": 2988} {"train_loss": -10.188664436340332, "global_step": 502126, "epoch": 2988} {"train_loss": -10.515251159667969, "global_step": 502127, "epoch": 2988} {"train_loss": -11.165538787841797, "global_step": 502128, "epoch": 2988} {"train_loss": -10.041849136352539, "global_step": 502129, "epoch": 2988} {"train_loss": -11.488525390625, "global_step": 502130, "epoch": 2988} {"train_loss": -10.36264705657959, "global_step": 502131, "epoch": 2988} {"train_loss": -11.622791290283203, "global_step": 502132, "epoch": 2988} {"train_loss": -11.61497688293457, "global_step": 502133, "epoch": 2988} {"train_loss": -11.539426803588867, "global_step": 502134, "epoch": 2988} {"train_loss": -11.330708503723145, "global_step": 502135, "epoch": 2988} {"train_loss": -12.107892990112305, "global_step": 502136, "epoch": 2988} {"train_loss": -10.698066711425781, "global_step": 502137, "epoch": 2988} {"train_loss": -12.325804710388184, "global_step": 502138, "epoch": 2988} {"train_loss": -11.269307136535645, "global_step": 502139, "epoch": 2988} {"train_loss": -11.227184295654297, "global_step": 502140, "epoch": 2988} {"train_loss": -11.763290405273438, "global_step": 502141, "epoch": 2988} {"train_loss": -10.743955612182617, "global_step": 502142, "epoch": 2988} {"train_loss": -11.89295768737793, "global_step": 502143, "epoch": 2988} {"train_loss": -11.641313552856445, "global_step": 502144, "epoch": 2988} {"train_loss": -12.029407501220703, "global_step": 502145, "epoch": 2988} {"train_loss": -11.955190658569336, "global_step": 502146, "epoch": 2988} {"train_loss": -11.173473358154297, "global_step": 502147, "epoch": 2988} {"train_loss": -12.059120178222656, "global_step": 502148, "epoch": 2988} {"train_loss": -11.686227798461914, "global_step": 502149, "epoch": 2988} {"train_loss": -12.1498441696167, "global_step": 502150, "epoch": 2988} {"train_loss": -12.066589258965992, "global_step": 502151, "epoch": 2988, "val_loss": 316560.5625} {"train_loss": -11.41646671295166, "global_step": 502152, "epoch": 2989} {"train_loss": -12.126667976379395, "global_step": 502153, "epoch": 2989} {"train_loss": -11.17496109008789, "global_step": 502154, "epoch": 2989} {"train_loss": -12.533929824829102, "global_step": 502155, "epoch": 2989} {"train_loss": -11.694077491760254, "global_step": 502156, "epoch": 2989} {"train_loss": -12.15380859375, "global_step": 502157, "epoch": 2989} {"train_loss": -11.994834899902344, "global_step": 502158, "epoch": 2989} {"train_loss": -12.047242164611816, "global_step": 502159, "epoch": 2989} {"train_loss": -11.647253036499023, "global_step": 502160, "epoch": 2989} {"train_loss": -11.94144058227539, "global_step": 502161, "epoch": 2989} {"train_loss": -11.705631256103516, "global_step": 502162, "epoch": 2989} {"train_loss": -12.565084457397461, "global_step": 502163, "epoch": 2989} {"train_loss": -12.05856704711914, "global_step": 502164, "epoch": 2989} {"train_loss": -12.157462120056152, "global_step": 502165, "epoch": 2989} {"train_loss": -12.161916732788086, "global_step": 502166, "epoch": 2989} {"train_loss": -12.198127746582031, "global_step": 502167, "epoch": 2989} {"train_loss": -12.56020736694336, "global_step": 502168, "epoch": 2989} {"train_loss": -12.005760192871094, "global_step": 502169, "epoch": 2989} {"train_loss": -12.25739860534668, "global_step": 502170, "epoch": 2989} {"train_loss": -12.087568283081055, "global_step": 502171, "epoch": 2989} {"train_loss": -11.972808837890625, "global_step": 502172, "epoch": 2989} {"train_loss": -12.42180061340332, "global_step": 502173, "epoch": 2989} {"train_loss": -11.803837776184082, "global_step": 502174, "epoch": 2989} {"train_loss": -12.090309143066406, "global_step": 502175, "epoch": 2989} {"train_loss": -12.028295516967773, "global_step": 502176, "epoch": 2989} {"train_loss": -12.384895324707031, "global_step": 502177, "epoch": 2989} {"train_loss": -12.190383911132812, "global_step": 502178, "epoch": 2989} {"train_loss": -12.204955101013184, "global_step": 502179, "epoch": 2989} {"train_loss": -12.564756393432617, "global_step": 502180, "epoch": 2989} {"train_loss": -12.06972599029541, "global_step": 502181, "epoch": 2989} {"train_loss": -12.1795654296875, "global_step": 502182, "epoch": 2989} {"train_loss": -12.413900375366211, "global_step": 502183, "epoch": 2989} {"train_loss": -12.136600494384766, "global_step": 502184, "epoch": 2989} {"train_loss": -12.416496276855469, "global_step": 502185, "epoch": 2989} {"train_loss": -12.175336837768555, "global_step": 502186, "epoch": 2989} {"train_loss": -12.606225967407227, "global_step": 502187, "epoch": 2989} {"train_loss": -12.365674018859863, "global_step": 502188, "epoch": 2989} {"train_loss": -12.417903900146484, "global_step": 502189, "epoch": 2989} {"train_loss": -12.312519073486328, "global_step": 502190, "epoch": 2989} {"train_loss": -12.62485122680664, "global_step": 502191, "epoch": 2989} {"train_loss": -12.269143104553223, "global_step": 502192, "epoch": 2989} {"train_loss": -12.759857177734375, "global_step": 502193, "epoch": 2989} {"train_loss": -12.419912338256836, "global_step": 502194, "epoch": 2989} {"train_loss": -12.64793586730957, "global_step": 502195, "epoch": 2989} {"train_loss": -12.482660293579102, "global_step": 502196, "epoch": 2989} {"train_loss": -12.495931625366211, "global_step": 502197, "epoch": 2989} {"train_loss": -12.571138381958008, "global_step": 502198, "epoch": 2989} {"train_loss": -12.359159469604492, "global_step": 502199, "epoch": 2989} {"train_loss": -12.63241958618164, "global_step": 502200, "epoch": 2989} {"train_loss": -12.420303344726562, "global_step": 502201, "epoch": 2989} {"train_loss": -12.355252265930176, "global_step": 502202, "epoch": 2989} {"train_loss": -12.427823066711426, "global_step": 502203, "epoch": 2989} {"train_loss": -12.452018737792969, "global_step": 502204, "epoch": 2989} {"train_loss": -12.693739891052246, "global_step": 502205, "epoch": 2989} {"train_loss": -12.074556350708008, "global_step": 502206, "epoch": 2989} {"train_loss": -12.758247375488281, "global_step": 502207, "epoch": 2989} {"train_loss": -12.429632186889648, "global_step": 502208, "epoch": 2989} {"train_loss": -12.536497116088867, "global_step": 502209, "epoch": 2989} {"train_loss": -12.728570938110352, "global_step": 502210, "epoch": 2989} {"train_loss": -12.39580249786377, "global_step": 502211, "epoch": 2989} {"train_loss": -12.700901985168457, "global_step": 502212, "epoch": 2989} {"train_loss": -12.481128692626953, "global_step": 502213, "epoch": 2989} {"train_loss": -12.650684356689453, "global_step": 502214, "epoch": 2989} {"train_loss": -12.432533264160156, "global_step": 502215, "epoch": 2989} {"train_loss": -12.539791107177734, "global_step": 502216, "epoch": 2989} {"train_loss": -12.548078536987305, "global_step": 502217, "epoch": 2989} {"train_loss": -12.312850952148438, "global_step": 502218, "epoch": 2989} {"train_loss": -12.709911346435547, "global_step": 502219, "epoch": 2989} {"train_loss": -12.325508117675781, "global_step": 502220, "epoch": 2989} {"train_loss": -12.434242248535156, "global_step": 502221, "epoch": 2989} {"train_loss": -12.528193473815918, "global_step": 502222, "epoch": 2989} {"train_loss": -12.478675842285156, "global_step": 502223, "epoch": 2989} {"train_loss": -12.679862976074219, "global_step": 502224, "epoch": 2989} {"train_loss": -12.586700439453125, "global_step": 502225, "epoch": 2989} {"train_loss": -12.630130767822266, "global_step": 502226, "epoch": 2989} {"train_loss": -12.284438133239746, "global_step": 502227, "epoch": 2989} {"train_loss": -12.481300354003906, "global_step": 502228, "epoch": 2989} {"train_loss": -12.56174087524414, "global_step": 502229, "epoch": 2989} {"train_loss": -12.765979766845703, "global_step": 502230, "epoch": 2989} {"train_loss": -12.688253402709961, "global_step": 502231, "epoch": 2989} {"train_loss": -12.437607765197754, "global_step": 502232, "epoch": 2989} {"train_loss": -12.638337135314941, "global_step": 502233, "epoch": 2989} {"train_loss": -12.456263542175293, "global_step": 502234, "epoch": 2989} {"train_loss": -12.271970748901367, "global_step": 502235, "epoch": 2989} {"train_loss": -12.671415328979492, "global_step": 502236, "epoch": 2989} {"train_loss": -11.968979835510254, "global_step": 502237, "epoch": 2989} {"train_loss": -12.393281936645508, "global_step": 502238, "epoch": 2989} {"train_loss": -12.85250473022461, "global_step": 502239, "epoch": 2989} {"train_loss": -12.34645938873291, "global_step": 502240, "epoch": 2989} {"train_loss": -12.706625938415527, "global_step": 502241, "epoch": 2989} {"train_loss": -12.558660507202148, "global_step": 502242, "epoch": 2989} {"train_loss": -12.283802032470703, "global_step": 502243, "epoch": 2989} {"train_loss": -12.397966384887695, "global_step": 502244, "epoch": 2989} {"train_loss": -13.025124549865723, "global_step": 502245, "epoch": 2989} {"train_loss": -12.65719985961914, "global_step": 502246, "epoch": 2989} {"train_loss": -12.687604904174805, "global_step": 502247, "epoch": 2989} {"train_loss": -12.683126449584961, "global_step": 502248, "epoch": 2989} {"train_loss": -12.574798583984375, "global_step": 502249, "epoch": 2989} {"train_loss": -12.59604263305664, "global_step": 502250, "epoch": 2989} {"train_loss": -12.854134559631348, "global_step": 502251, "epoch": 2989} {"train_loss": -12.741804122924805, "global_step": 502252, "epoch": 2989} {"train_loss": -12.798301696777344, "global_step": 502253, "epoch": 2989} {"train_loss": -12.867574691772461, "global_step": 502254, "epoch": 2989} {"train_loss": -12.69719123840332, "global_step": 502255, "epoch": 2989} {"train_loss": -12.857433319091797, "global_step": 502256, "epoch": 2989} {"train_loss": -12.688146591186523, "global_step": 502257, "epoch": 2989} {"train_loss": -12.960712432861328, "global_step": 502258, "epoch": 2989} {"train_loss": -12.69451904296875, "global_step": 502259, "epoch": 2989} {"train_loss": -12.541572570800781, "global_step": 502260, "epoch": 2989} {"train_loss": -12.780815124511719, "global_step": 502261, "epoch": 2989} {"train_loss": -12.888603210449219, "global_step": 502262, "epoch": 2989} {"train_loss": -12.870261192321777, "global_step": 502263, "epoch": 2989} {"train_loss": -12.703217506408691, "global_step": 502264, "epoch": 2989} {"train_loss": -12.73099422454834, "global_step": 502265, "epoch": 2989} {"train_loss": -12.78072452545166, "global_step": 502266, "epoch": 2989} {"train_loss": -12.873268127441406, "global_step": 502267, "epoch": 2989} {"train_loss": -12.729326248168945, "global_step": 502268, "epoch": 2989} {"train_loss": -12.868046760559082, "global_step": 502269, "epoch": 2989} {"train_loss": -12.670711517333984, "global_step": 502270, "epoch": 2989} {"train_loss": -12.596588134765625, "global_step": 502271, "epoch": 2989} {"train_loss": -12.770672798156738, "global_step": 502272, "epoch": 2989} {"train_loss": -12.896474838256836, "global_step": 502273, "epoch": 2989} {"train_loss": -13.053487777709961, "global_step": 502274, "epoch": 2989} {"train_loss": -12.823980331420898, "global_step": 502275, "epoch": 2989} {"train_loss": -12.676046371459961, "global_step": 502276, "epoch": 2989} {"train_loss": -12.807517051696777, "global_step": 502277, "epoch": 2989} {"train_loss": -12.681694984436035, "global_step": 502278, "epoch": 2989} {"train_loss": -12.794798851013184, "global_step": 502279, "epoch": 2989} {"train_loss": -12.501056671142578, "global_step": 502280, "epoch": 2989} {"train_loss": -12.723426818847656, "global_step": 502281, "epoch": 2989} {"train_loss": -12.604945182800293, "global_step": 502282, "epoch": 2989} {"train_loss": -12.636690139770508, "global_step": 502283, "epoch": 2989} {"train_loss": -12.749399185180664, "global_step": 502284, "epoch": 2989} {"train_loss": -12.764362335205078, "global_step": 502285, "epoch": 2989} {"train_loss": -12.489145278930664, "global_step": 502286, "epoch": 2989} {"train_loss": -12.828773498535156, "global_step": 502287, "epoch": 2989} {"train_loss": -12.765056610107422, "global_step": 502288, "epoch": 2989} {"train_loss": -12.524506568908691, "global_step": 502289, "epoch": 2989} {"train_loss": -12.551457405090332, "global_step": 502290, "epoch": 2989} {"train_loss": -12.396968841552734, "global_step": 502291, "epoch": 2989} {"train_loss": -12.049124717712402, "global_step": 502292, "epoch": 2989} {"train_loss": -12.698587417602539, "global_step": 502293, "epoch": 2989} {"train_loss": -11.883017539978027, "global_step": 502294, "epoch": 2989} {"train_loss": -12.498730659484863, "global_step": 502295, "epoch": 2989} {"train_loss": -11.991434097290039, "global_step": 502296, "epoch": 2989} {"train_loss": -12.580804824829102, "global_step": 502297, "epoch": 2989} {"train_loss": -12.37354564666748, "global_step": 502298, "epoch": 2989} {"train_loss": -12.325634002685547, "global_step": 502299, "epoch": 2989} {"train_loss": -12.70228099822998, "global_step": 502300, "epoch": 2989} {"train_loss": -12.793092727661133, "global_step": 502301, "epoch": 2989} {"train_loss": -12.769211769104004, "global_step": 502302, "epoch": 2989} {"train_loss": -12.666170120239258, "global_step": 502303, "epoch": 2989} {"train_loss": -12.73142147064209, "global_step": 502304, "epoch": 2989} {"train_loss": -12.811243057250977, "global_step": 502305, "epoch": 2989} {"train_loss": -12.593218803405762, "global_step": 502306, "epoch": 2989} {"train_loss": -12.79787826538086, "global_step": 502307, "epoch": 2989} {"train_loss": -12.529581069946289, "global_step": 502308, "epoch": 2989} {"train_loss": -11.83138656616211, "global_step": 502309, "epoch": 2989} {"train_loss": -11.974576950073242, "global_step": 502310, "epoch": 2989} {"train_loss": -12.754470825195312, "global_step": 502311, "epoch": 2989} {"train_loss": -12.436793327331543, "global_step": 502312, "epoch": 2989} {"train_loss": -12.212137222290039, "global_step": 502313, "epoch": 2989} {"train_loss": -12.653624534606934, "global_step": 502314, "epoch": 2989} {"train_loss": -12.203645706176758, "global_step": 502315, "epoch": 2989} {"train_loss": -12.296048164367676, "global_step": 502316, "epoch": 2989} {"train_loss": -11.410836219787598, "global_step": 502317, "epoch": 2989} {"train_loss": -11.23865032196045, "global_step": 502318, "epoch": 2989} {"train_loss": -12.453737281617665, "global_step": 502319, "epoch": 2989, "val_loss": 319173.375} {"train_loss": -12.501143455505371, "global_step": 502320, "epoch": 2990} {"train_loss": -11.128082275390625, "global_step": 502321, "epoch": 2990} {"train_loss": -11.37492561340332, "global_step": 502322, "epoch": 2990} {"train_loss": -11.467794418334961, "global_step": 502323, "epoch": 2990} {"train_loss": -10.348849296569824, "global_step": 502324, "epoch": 2990} {"train_loss": -12.187808990478516, "global_step": 502325, "epoch": 2990} {"train_loss": -11.95705509185791, "global_step": 502326, "epoch": 2990} {"train_loss": -11.400849342346191, "global_step": 502327, "epoch": 2990} {"train_loss": -11.29969596862793, "global_step": 502328, "epoch": 2990} {"train_loss": -11.06747817993164, "global_step": 502329, "epoch": 2990} {"train_loss": -10.741911888122559, "global_step": 502330, "epoch": 2990} {"train_loss": -11.358139991760254, "global_step": 502331, "epoch": 2990} {"train_loss": -9.540115356445312, "global_step": 502332, "epoch": 2990} {"train_loss": -11.806120872497559, "global_step": 502333, "epoch": 2990} {"train_loss": -10.351190567016602, "global_step": 502334, "epoch": 2990} {"train_loss": -10.725776672363281, "global_step": 502335, "epoch": 2990} {"train_loss": -11.59049129486084, "global_step": 502336, "epoch": 2990} {"train_loss": -9.865358352661133, "global_step": 502337, "epoch": 2990} {"train_loss": -11.563051223754883, "global_step": 502338, "epoch": 2990} {"train_loss": -11.07673454284668, "global_step": 502339, "epoch": 2990} {"train_loss": -11.636051177978516, "global_step": 502340, "epoch": 2990} {"train_loss": -11.4540433883667, "global_step": 502341, "epoch": 2990} {"train_loss": -11.124399185180664, "global_step": 502342, "epoch": 2990} {"train_loss": -11.790607452392578, "global_step": 502343, "epoch": 2990} {"train_loss": -10.802204132080078, "global_step": 502344, "epoch": 2990} {"train_loss": -11.714622497558594, "global_step": 502345, "epoch": 2990} {"train_loss": -10.689254760742188, "global_step": 502346, "epoch": 2990} {"train_loss": -11.453207015991211, "global_step": 502347, "epoch": 2990} {"train_loss": -9.21452522277832, "global_step": 502348, "epoch": 2990} {"train_loss": -11.004711151123047, "global_step": 502349, "epoch": 2990} {"train_loss": -9.876116752624512, "global_step": 502350, "epoch": 2990} {"train_loss": -11.275873184204102, "global_step": 502351, "epoch": 2990} {"train_loss": -9.66606330871582, "global_step": 502352, "epoch": 2990} {"train_loss": -10.370567321777344, "global_step": 502353, "epoch": 2990} {"train_loss": -10.903240203857422, "global_step": 502354, "epoch": 2990} {"train_loss": -10.787110328674316, "global_step": 502355, "epoch": 2990} {"train_loss": -10.2413330078125, "global_step": 502356, "epoch": 2990} {"train_loss": -11.760080337524414, "global_step": 502357, "epoch": 2990} {"train_loss": -10.347808837890625, "global_step": 502358, "epoch": 2990} {"train_loss": -10.932034492492676, "global_step": 502359, "epoch": 2990} {"train_loss": -11.295907974243164, "global_step": 502360, "epoch": 2990} {"train_loss": -10.761209487915039, "global_step": 502361, "epoch": 2990} {"train_loss": -10.69961929321289, "global_step": 502362, "epoch": 2990} {"train_loss": -10.695674896240234, "global_step": 502363, "epoch": 2990} {"train_loss": -11.111276626586914, "global_step": 502364, "epoch": 2990} {"train_loss": -11.464683532714844, "global_step": 502365, "epoch": 2990} {"train_loss": -10.932190895080566, "global_step": 502366, "epoch": 2990} {"train_loss": -11.052862167358398, "global_step": 502367, "epoch": 2990} {"train_loss": -11.656126022338867, "global_step": 502368, "epoch": 2990} {"train_loss": -11.521720886230469, "global_step": 502369, "epoch": 2990} {"train_loss": -11.402286529541016, "global_step": 502370, "epoch": 2990} {"train_loss": -11.849527359008789, "global_step": 502371, "epoch": 2990} {"train_loss": -11.895675659179688, "global_step": 502372, "epoch": 2990} {"train_loss": -11.671613693237305, "global_step": 502373, "epoch": 2990} {"train_loss": -11.902318000793457, "global_step": 502374, "epoch": 2990} {"train_loss": -11.709390640258789, "global_step": 502375, "epoch": 2990} {"train_loss": -12.23666763305664, "global_step": 502376, "epoch": 2990} {"train_loss": -11.844465255737305, "global_step": 502377, "epoch": 2990} {"train_loss": -12.127077102661133, "global_step": 502378, "epoch": 2990} {"train_loss": -12.15355110168457, "global_step": 502379, "epoch": 2990} {"train_loss": -12.288393020629883, "global_step": 502380, "epoch": 2990} {"train_loss": -12.254721641540527, "global_step": 502381, "epoch": 2990} {"train_loss": -12.234652519226074, "global_step": 502382, "epoch": 2990} {"train_loss": -12.275738716125488, "global_step": 502383, "epoch": 2990} {"train_loss": -12.17449951171875, "global_step": 502384, "epoch": 2990} {"train_loss": -12.519336700439453, "global_step": 502385, "epoch": 2990} {"train_loss": -12.486126899719238, "global_step": 502386, "epoch": 2990} {"train_loss": -12.332728385925293, "global_step": 502387, "epoch": 2990} {"train_loss": -12.349129676818848, "global_step": 502388, "epoch": 2990} {"train_loss": -12.510153770446777, "global_step": 502389, "epoch": 2990} {"train_loss": -12.525346755981445, "global_step": 502390, "epoch": 2990} {"train_loss": -12.630254745483398, "global_step": 502391, "epoch": 2990} {"train_loss": -12.52903938293457, "global_step": 502392, "epoch": 2990} {"train_loss": -12.66958236694336, "global_step": 502393, "epoch": 2990} {"train_loss": -12.692724227905273, "global_step": 502394, "epoch": 2990} {"train_loss": -12.50117301940918, "global_step": 502395, "epoch": 2990} {"train_loss": -12.615005493164062, "global_step": 502396, "epoch": 2990} {"train_loss": -12.657112121582031, "global_step": 502397, "epoch": 2990} {"train_loss": -12.675396919250488, "global_step": 502398, "epoch": 2990} {"train_loss": -12.596224784851074, "global_step": 502399, "epoch": 2990} {"train_loss": -12.656766891479492, "global_step": 502400, "epoch": 2990} {"train_loss": -12.691448211669922, "global_step": 502401, "epoch": 2990} {"train_loss": -12.732760429382324, "global_step": 502402, "epoch": 2990} {"train_loss": -12.746891975402832, "global_step": 502403, "epoch": 2990} {"train_loss": -12.668401718139648, "global_step": 502404, "epoch": 2990} {"train_loss": -12.776269912719727, "global_step": 502405, "epoch": 2990} {"train_loss": -12.50637435913086, "global_step": 502406, "epoch": 2990} {"train_loss": -12.919179916381836, "global_step": 502407, "epoch": 2990} {"train_loss": -12.753080368041992, "global_step": 502408, "epoch": 2990} {"train_loss": -12.463495254516602, "global_step": 502409, "epoch": 2990} {"train_loss": -12.692291259765625, "global_step": 502410, "epoch": 2990} {"train_loss": -12.649103164672852, "global_step": 502411, "epoch": 2990} {"train_loss": -12.742637634277344, "global_step": 502412, "epoch": 2990} {"train_loss": -12.808279037475586, "global_step": 502413, "epoch": 2990} {"train_loss": -12.875226974487305, "global_step": 502414, "epoch": 2990} {"train_loss": -12.750500679016113, "global_step": 502415, "epoch": 2990} {"train_loss": -12.87337875366211, "global_step": 502416, "epoch": 2990} {"train_loss": -12.79702091217041, "global_step": 502417, "epoch": 2990} {"train_loss": -12.83608341217041, "global_step": 502418, "epoch": 2990} {"train_loss": -12.901470184326172, "global_step": 502419, "epoch": 2990} {"train_loss": -12.473224639892578, "global_step": 502420, "epoch": 2990} {"train_loss": -12.684038162231445, "global_step": 502421, "epoch": 2990} {"train_loss": -12.817529678344727, "global_step": 502422, "epoch": 2990} {"train_loss": -12.88632583618164, "global_step": 502423, "epoch": 2990} {"train_loss": -12.689387321472168, "global_step": 502424, "epoch": 2990} {"train_loss": -12.68931770324707, "global_step": 502425, "epoch": 2990} {"train_loss": -12.381187438964844, "global_step": 502426, "epoch": 2990} {"train_loss": -12.904576301574707, "global_step": 502427, "epoch": 2990} {"train_loss": -12.560537338256836, "global_step": 502428, "epoch": 2990} {"train_loss": -12.5848970413208, "global_step": 502429, "epoch": 2990} {"train_loss": -12.992721557617188, "global_step": 502430, "epoch": 2990} {"train_loss": -12.661026000976562, "global_step": 502431, "epoch": 2990} {"train_loss": -12.951608657836914, "global_step": 502432, "epoch": 2990} {"train_loss": -12.697246551513672, "global_step": 502433, "epoch": 2990} {"train_loss": -12.765896797180176, "global_step": 502434, "epoch": 2990} {"train_loss": -12.744894027709961, "global_step": 502435, "epoch": 2990} {"train_loss": -12.7313232421875, "global_step": 502436, "epoch": 2990} {"train_loss": -12.672239303588867, "global_step": 502437, "epoch": 2990} {"train_loss": -12.797025680541992, "global_step": 502438, "epoch": 2990} {"train_loss": -12.757061958312988, "global_step": 502439, "epoch": 2990} {"train_loss": -12.726627349853516, "global_step": 502440, "epoch": 2990} {"train_loss": -12.225905418395996, "global_step": 502441, "epoch": 2990} {"train_loss": -12.639799118041992, "global_step": 502442, "epoch": 2990} {"train_loss": -12.824066162109375, "global_step": 502443, "epoch": 2990} {"train_loss": -12.075172424316406, "global_step": 502444, "epoch": 2990} {"train_loss": -12.790861129760742, "global_step": 502445, "epoch": 2990} {"train_loss": -12.638157844543457, "global_step": 502446, "epoch": 2990} {"train_loss": -12.690485000610352, "global_step": 502447, "epoch": 2990} {"train_loss": -12.474251747131348, "global_step": 502448, "epoch": 2990} {"train_loss": -12.459123611450195, "global_step": 502449, "epoch": 2990} {"train_loss": -12.569714546203613, "global_step": 502450, "epoch": 2990} {"train_loss": -12.694486618041992, "global_step": 502451, "epoch": 2990} {"train_loss": -12.739459037780762, "global_step": 502452, "epoch": 2990} {"train_loss": -12.545818328857422, "global_step": 502453, "epoch": 2990} {"train_loss": -12.785470008850098, "global_step": 502454, "epoch": 2990} {"train_loss": -12.561464309692383, "global_step": 502455, "epoch": 2990} {"train_loss": -12.776610374450684, "global_step": 502456, "epoch": 2990} {"train_loss": -12.560163497924805, "global_step": 502457, "epoch": 2990} {"train_loss": -12.608765602111816, "global_step": 502458, "epoch": 2990} {"train_loss": -12.97439956665039, "global_step": 502459, "epoch": 2990} {"train_loss": -12.738411903381348, "global_step": 502460, "epoch": 2990} {"train_loss": -12.851105690002441, "global_step": 502461, "epoch": 2990} {"train_loss": -12.607364654541016, "global_step": 502462, "epoch": 2990} {"train_loss": -12.844039916992188, "global_step": 502463, "epoch": 2990} {"train_loss": -12.565225601196289, "global_step": 502464, "epoch": 2990} {"train_loss": -12.587701797485352, "global_step": 502465, "epoch": 2990} {"train_loss": -11.874641418457031, "global_step": 502466, "epoch": 2990} {"train_loss": -12.786092758178711, "global_step": 502467, "epoch": 2990} {"train_loss": -12.322469711303711, "global_step": 502468, "epoch": 2990} {"train_loss": -12.035369873046875, "global_step": 502469, "epoch": 2990} {"train_loss": -11.854156494140625, "global_step": 502470, "epoch": 2990} {"train_loss": -12.752038955688477, "global_step": 502471, "epoch": 2990} {"train_loss": -12.13088321685791, "global_step": 502472, "epoch": 2990} {"train_loss": -12.41943073272705, "global_step": 502473, "epoch": 2990} {"train_loss": -12.290327072143555, "global_step": 502474, "epoch": 2990} {"train_loss": -12.319416046142578, "global_step": 502475, "epoch": 2990} {"train_loss": -12.156875610351562, "global_step": 502476, "epoch": 2990} {"train_loss": -12.018057823181152, "global_step": 502477, "epoch": 2990} {"train_loss": -12.153327941894531, "global_step": 502478, "epoch": 2990} {"train_loss": -11.775426864624023, "global_step": 502479, "epoch": 2990} {"train_loss": -11.612175941467285, "global_step": 502480, "epoch": 2990} {"train_loss": -12.331825256347656, "global_step": 502481, "epoch": 2990} {"train_loss": -11.02184772491455, "global_step": 502482, "epoch": 2990} {"train_loss": -10.56614875793457, "global_step": 502483, "epoch": 2990} {"train_loss": -10.793411254882812, "global_step": 502484, "epoch": 2990} {"train_loss": -11.35047721862793, "global_step": 502485, "epoch": 2990} {"train_loss": -12.314727783203125, "global_step": 502486, "epoch": 2990} {"train_loss": -12.026590614091782, "global_step": 502487, "epoch": 2990, "val_loss": 317352.4375, "train_action_mse_error": 2.3184261322021484} {"train_loss": -11.493244171142578, "global_step": 502488, "epoch": 2991} {"train_loss": -12.24686050415039, "global_step": 502489, "epoch": 2991} {"train_loss": -11.071749687194824, "global_step": 502490, "epoch": 2991} {"train_loss": -11.582099914550781, "global_step": 502491, "epoch": 2991} {"train_loss": -12.104533195495605, "global_step": 502492, "epoch": 2991} {"train_loss": -10.5577392578125, "global_step": 502493, "epoch": 2991} {"train_loss": -11.622081756591797, "global_step": 502494, "epoch": 2991} {"train_loss": -11.3948335647583, "global_step": 502495, "epoch": 2991} {"train_loss": -11.817937850952148, "global_step": 502496, "epoch": 2991} {"train_loss": -11.94384479522705, "global_step": 502497, "epoch": 2991} {"train_loss": -11.296823501586914, "global_step": 502498, "epoch": 2991} {"train_loss": -12.541751861572266, "global_step": 502499, "epoch": 2991} {"train_loss": -11.164017677307129, "global_step": 502500, "epoch": 2991} {"train_loss": -12.36825180053711, "global_step": 502501, "epoch": 2991} {"train_loss": -11.536958694458008, "global_step": 502502, "epoch": 2991} {"train_loss": -12.11277961730957, "global_step": 502503, "epoch": 2991} {"train_loss": -12.196102142333984, "global_step": 502504, "epoch": 2991} {"train_loss": -11.857657432556152, "global_step": 502505, "epoch": 2991} {"train_loss": -12.604701042175293, "global_step": 502506, "epoch": 2991} {"train_loss": -12.07435417175293, "global_step": 502507, "epoch": 2991} {"train_loss": -12.360831260681152, "global_step": 502508, "epoch": 2991} {"train_loss": -12.100851058959961, "global_step": 502509, "epoch": 2991} {"train_loss": -11.89942455291748, "global_step": 502510, "epoch": 2991} {"train_loss": -12.369428634643555, "global_step": 502511, "epoch": 2991} {"train_loss": -11.735889434814453, "global_step": 502512, "epoch": 2991} {"train_loss": -12.457376480102539, "global_step": 502513, "epoch": 2991} {"train_loss": -11.164925575256348, "global_step": 502514, "epoch": 2991} {"train_loss": -11.491732597351074, "global_step": 502515, "epoch": 2991} {"train_loss": -12.30726432800293, "global_step": 502516, "epoch": 2991} {"train_loss": -11.897270202636719, "global_step": 502517, "epoch": 2991} {"train_loss": -12.289541244506836, "global_step": 502518, "epoch": 2991} {"train_loss": -12.235701560974121, "global_step": 502519, "epoch": 2991} {"train_loss": -12.42343807220459, "global_step": 502520, "epoch": 2991} {"train_loss": -12.069013595581055, "global_step": 502521, "epoch": 2991} {"train_loss": -12.366731643676758, "global_step": 502522, "epoch": 2991} {"train_loss": -12.234480857849121, "global_step": 502523, "epoch": 2991} {"train_loss": -12.45724868774414, "global_step": 502524, "epoch": 2991} {"train_loss": -12.112009048461914, "global_step": 502525, "epoch": 2991} {"train_loss": -12.238658905029297, "global_step": 502526, "epoch": 2991} {"train_loss": -12.145695686340332, "global_step": 502527, "epoch": 2991} {"train_loss": -12.560846328735352, "global_step": 502528, "epoch": 2991} {"train_loss": -12.749862670898438, "global_step": 502529, "epoch": 2991} {"train_loss": -12.450098037719727, "global_step": 502530, "epoch": 2991} {"train_loss": -12.457018852233887, "global_step": 502531, "epoch": 2991} {"train_loss": -12.737981796264648, "global_step": 502532, "epoch": 2991} {"train_loss": -12.376358985900879, "global_step": 502533, "epoch": 2991} {"train_loss": -11.994460105895996, "global_step": 502534, "epoch": 2991} {"train_loss": -12.522340774536133, "global_step": 502535, "epoch": 2991} {"train_loss": -12.112287521362305, "global_step": 502536, "epoch": 2991} {"train_loss": -12.488450050354004, "global_step": 502537, "epoch": 2991} {"train_loss": -11.940606117248535, "global_step": 502538, "epoch": 2991} {"train_loss": -11.899863243103027, "global_step": 502539, "epoch": 2991} {"train_loss": -12.506139755249023, "global_step": 502540, "epoch": 2991} {"train_loss": -11.402990341186523, "global_step": 502541, "epoch": 2991} {"train_loss": -12.276142120361328, "global_step": 502542, "epoch": 2991} {"train_loss": -11.700815200805664, "global_step": 502543, "epoch": 2991} {"train_loss": -12.61777114868164, "global_step": 502544, "epoch": 2991} {"train_loss": -11.805728912353516, "global_step": 502545, "epoch": 2991} {"train_loss": -12.191282272338867, "global_step": 502546, "epoch": 2991} {"train_loss": -12.065292358398438, "global_step": 502547, "epoch": 2991} {"train_loss": -11.583305358886719, "global_step": 502548, "epoch": 2991} {"train_loss": -12.294243812561035, "global_step": 502549, "epoch": 2991} {"train_loss": -11.900041580200195, "global_step": 502550, "epoch": 2991} {"train_loss": -12.46055793762207, "global_step": 502551, "epoch": 2991} {"train_loss": -11.791650772094727, "global_step": 502552, "epoch": 2991} {"train_loss": -12.38591194152832, "global_step": 502553, "epoch": 2991} {"train_loss": -11.881613731384277, "global_step": 502554, "epoch": 2991} {"train_loss": -12.110854148864746, "global_step": 502555, "epoch": 2991} {"train_loss": -12.261004447937012, "global_step": 502556, "epoch": 2991} {"train_loss": -12.44497299194336, "global_step": 502557, "epoch": 2991} {"train_loss": -12.135272979736328, "global_step": 502558, "epoch": 2991} {"train_loss": -12.65007209777832, "global_step": 502559, "epoch": 2991} {"train_loss": -12.247200012207031, "global_step": 502560, "epoch": 2991} {"train_loss": -12.748010635375977, "global_step": 502561, "epoch": 2991} {"train_loss": -12.378268241882324, "global_step": 502562, "epoch": 2991} {"train_loss": -12.62965202331543, "global_step": 502563, "epoch": 2991} {"train_loss": -12.641035079956055, "global_step": 502564, "epoch": 2991} {"train_loss": -12.854643821716309, "global_step": 502565, "epoch": 2991} {"train_loss": -12.634577751159668, "global_step": 502566, "epoch": 2991} {"train_loss": -12.602567672729492, "global_step": 502567, "epoch": 2991} {"train_loss": -12.862557411193848, "global_step": 502568, "epoch": 2991} {"train_loss": -12.510778427124023, "global_step": 502569, "epoch": 2991} {"train_loss": -12.715593338012695, "global_step": 502570, "epoch": 2991} {"train_loss": -12.714693069458008, "global_step": 502571, "epoch": 2991} {"train_loss": -12.818822860717773, "global_step": 502572, "epoch": 2991} {"train_loss": -12.803775787353516, "global_step": 502573, "epoch": 2991} {"train_loss": -12.855716705322266, "global_step": 502574, "epoch": 2991} {"train_loss": -12.71820068359375, "global_step": 502575, "epoch": 2991} {"train_loss": -12.764435768127441, "global_step": 502576, "epoch": 2991} {"train_loss": -12.863912582397461, "global_step": 502577, "epoch": 2991} {"train_loss": -12.648187637329102, "global_step": 502578, "epoch": 2991} {"train_loss": -12.84717845916748, "global_step": 502579, "epoch": 2991} {"train_loss": -12.859262466430664, "global_step": 502580, "epoch": 2991} {"train_loss": -13.060197830200195, "global_step": 502581, "epoch": 2991} {"train_loss": -12.827388763427734, "global_step": 502582, "epoch": 2991} {"train_loss": -12.829358100891113, "global_step": 502583, "epoch": 2991} {"train_loss": -13.056748390197754, "global_step": 502584, "epoch": 2991} {"train_loss": -12.973716735839844, "global_step": 502585, "epoch": 2991} {"train_loss": -12.676702499389648, "global_step": 502586, "epoch": 2991} {"train_loss": -12.91949462890625, "global_step": 502587, "epoch": 2991} {"train_loss": -12.613054275512695, "global_step": 502588, "epoch": 2991} {"train_loss": -12.806227684020996, "global_step": 502589, "epoch": 2991} {"train_loss": -12.75240707397461, "global_step": 502590, "epoch": 2991} {"train_loss": -13.014121055603027, "global_step": 502591, "epoch": 2991} {"train_loss": -12.944818496704102, "global_step": 502592, "epoch": 2991} {"train_loss": -12.880294799804688, "global_step": 502593, "epoch": 2991} {"train_loss": -13.007108688354492, "global_step": 502594, "epoch": 2991} {"train_loss": -12.93952751159668, "global_step": 502595, "epoch": 2991} {"train_loss": -12.927572250366211, "global_step": 502596, "epoch": 2991} {"train_loss": -12.95213508605957, "global_step": 502597, "epoch": 2991} {"train_loss": -12.53573989868164, "global_step": 502598, "epoch": 2991} {"train_loss": -12.601675033569336, "global_step": 502599, "epoch": 2991} {"train_loss": -12.969807624816895, "global_step": 502600, "epoch": 2991} {"train_loss": -12.801301002502441, "global_step": 502601, "epoch": 2991} {"train_loss": -12.215727806091309, "global_step": 502602, "epoch": 2991} {"train_loss": -12.798638343811035, "global_step": 502603, "epoch": 2991} {"train_loss": -12.533700942993164, "global_step": 502604, "epoch": 2991} {"train_loss": -12.374306678771973, "global_step": 502605, "epoch": 2991} {"train_loss": -12.264005661010742, "global_step": 502606, "epoch": 2991} {"train_loss": -12.606132507324219, "global_step": 502607, "epoch": 2991} {"train_loss": -11.174728393554688, "global_step": 502608, "epoch": 2991} {"train_loss": -10.801092147827148, "global_step": 502609, "epoch": 2991} {"train_loss": -12.223393440246582, "global_step": 502610, "epoch": 2991} {"train_loss": -12.254326820373535, "global_step": 502611, "epoch": 2991} {"train_loss": -9.572471618652344, "global_step": 502612, "epoch": 2991} {"train_loss": -10.413244247436523, "global_step": 502613, "epoch": 2991} {"train_loss": -12.280643463134766, "global_step": 502614, "epoch": 2991} {"train_loss": -9.199596405029297, "global_step": 502615, "epoch": 2991} {"train_loss": -10.126659393310547, "global_step": 502616, "epoch": 2991} {"train_loss": -10.596839904785156, "global_step": 502617, "epoch": 2991} {"train_loss": -10.010896682739258, "global_step": 502618, "epoch": 2991} {"train_loss": -9.760104179382324, "global_step": 502619, "epoch": 2991} {"train_loss": -9.107053756713867, "global_step": 502620, "epoch": 2991} {"train_loss": -8.93484115600586, "global_step": 502621, "epoch": 2991} {"train_loss": -8.368131637573242, "global_step": 502622, "epoch": 2991} {"train_loss": -9.205184936523438, "global_step": 502623, "epoch": 2991} {"train_loss": -10.58544921875, "global_step": 502624, "epoch": 2991} {"train_loss": -7.858590602874756, "global_step": 502625, "epoch": 2991} {"train_loss": -8.684427261352539, "global_step": 502626, "epoch": 2991} {"train_loss": -9.420234680175781, "global_step": 502627, "epoch": 2991} {"train_loss": -10.257421493530273, "global_step": 502628, "epoch": 2991} {"train_loss": -10.059369087219238, "global_step": 502629, "epoch": 2991} {"train_loss": -9.370784759521484, "global_step": 502630, "epoch": 2991} {"train_loss": -9.631378173828125, "global_step": 502631, "epoch": 2991} {"train_loss": -9.925785064697266, "global_step": 502632, "epoch": 2991} {"train_loss": -10.02833366394043, "global_step": 502633, "epoch": 2991} {"train_loss": -11.147966384887695, "global_step": 502634, "epoch": 2991} {"train_loss": -10.840699195861816, "global_step": 502635, "epoch": 2991} {"train_loss": -10.551933288574219, "global_step": 502636, "epoch": 2991} {"train_loss": -11.705114364624023, "global_step": 502637, "epoch": 2991} {"train_loss": -10.665956497192383, "global_step": 502638, "epoch": 2991} {"train_loss": -11.414437294006348, "global_step": 502639, "epoch": 2991} {"train_loss": -11.472671508789062, "global_step": 502640, "epoch": 2991} {"train_loss": -11.05940055847168, "global_step": 502641, "epoch": 2991} {"train_loss": -11.959394454956055, "global_step": 502642, "epoch": 2991} {"train_loss": -11.213353157043457, "global_step": 502643, "epoch": 2991} {"train_loss": -11.714807510375977, "global_step": 502644, "epoch": 2991} {"train_loss": -11.534770965576172, "global_step": 502645, "epoch": 2991} {"train_loss": -11.415397644042969, "global_step": 502646, "epoch": 2991} {"train_loss": -11.206914901733398, "global_step": 502647, "epoch": 2991} {"train_loss": -12.104523658752441, "global_step": 502648, "epoch": 2991} {"train_loss": -11.887029647827148, "global_step": 502649, "epoch": 2991} {"train_loss": -11.758193016052246, "global_step": 502650, "epoch": 2991} {"train_loss": -11.290670394897461, "global_step": 502651, "epoch": 2991} {"train_loss": -11.768113136291504, "global_step": 502652, "epoch": 2991} {"train_loss": -10.911389350891113, "global_step": 502653, "epoch": 2991} {"train_loss": -12.267801284790039, "global_step": 502654, "epoch": 2991} {"train_loss": -11.855812728404999, "global_step": 502655, "epoch": 2991, "val_loss": 314200.90625} {"train_loss": -12.163213729858398, "global_step": 502656, "epoch": 2992} {"train_loss": -11.02160358428955, "global_step": 502657, "epoch": 2992} {"train_loss": -12.098058700561523, "global_step": 502658, "epoch": 2992} {"train_loss": -11.977073669433594, "global_step": 502659, "epoch": 2992} {"train_loss": -12.365799903869629, "global_step": 502660, "epoch": 2992} {"train_loss": -11.94465446472168, "global_step": 502661, "epoch": 2992} {"train_loss": -12.16871452331543, "global_step": 502662, "epoch": 2992} {"train_loss": -11.843092918395996, "global_step": 502663, "epoch": 2992} {"train_loss": -12.258866310119629, "global_step": 502664, "epoch": 2992} {"train_loss": -12.070013046264648, "global_step": 502665, "epoch": 2992} {"train_loss": -12.27218246459961, "global_step": 502666, "epoch": 2992} {"train_loss": -11.956762313842773, "global_step": 502667, "epoch": 2992} {"train_loss": -12.334798812866211, "global_step": 502668, "epoch": 2992} {"train_loss": -11.85799789428711, "global_step": 502669, "epoch": 2992} {"train_loss": -11.779230117797852, "global_step": 502670, "epoch": 2992} {"train_loss": -12.225658416748047, "global_step": 502671, "epoch": 2992} {"train_loss": -12.157573699951172, "global_step": 502672, "epoch": 2992} {"train_loss": -12.168375968933105, "global_step": 502673, "epoch": 2992} {"train_loss": -12.13805866241455, "global_step": 502674, "epoch": 2992} {"train_loss": -12.443819046020508, "global_step": 502675, "epoch": 2992} {"train_loss": -11.898746490478516, "global_step": 502676, "epoch": 2992} {"train_loss": -12.659947395324707, "global_step": 502677, "epoch": 2992} {"train_loss": -12.186426162719727, "global_step": 502678, "epoch": 2992} {"train_loss": -12.630943298339844, "global_step": 502679, "epoch": 2992} {"train_loss": -12.164421081542969, "global_step": 502680, "epoch": 2992} {"train_loss": -12.175398826599121, "global_step": 502681, "epoch": 2992} {"train_loss": -12.24051284790039, "global_step": 502682, "epoch": 2992} {"train_loss": -11.946978569030762, "global_step": 502683, "epoch": 2992} {"train_loss": -12.470841407775879, "global_step": 502684, "epoch": 2992} {"train_loss": -11.758185386657715, "global_step": 502685, "epoch": 2992} {"train_loss": -12.447724342346191, "global_step": 502686, "epoch": 2992} {"train_loss": -12.116283416748047, "global_step": 502687, "epoch": 2992} {"train_loss": -12.529224395751953, "global_step": 502688, "epoch": 2992} {"train_loss": -12.072059631347656, "global_step": 502689, "epoch": 2992} {"train_loss": -12.436046600341797, "global_step": 502690, "epoch": 2992} {"train_loss": -12.138761520385742, "global_step": 502691, "epoch": 2992} {"train_loss": -12.300456047058105, "global_step": 502692, "epoch": 2992} {"train_loss": -12.374223709106445, "global_step": 502693, "epoch": 2992} {"train_loss": -12.540043830871582, "global_step": 502694, "epoch": 2992} {"train_loss": -12.242496490478516, "global_step": 502695, "epoch": 2992} {"train_loss": -12.545511245727539, "global_step": 502696, "epoch": 2992} {"train_loss": -12.231035232543945, "global_step": 502697, "epoch": 2992} {"train_loss": -12.759225845336914, "global_step": 502698, "epoch": 2992} {"train_loss": -12.644826889038086, "global_step": 502699, "epoch": 2992} {"train_loss": -12.536438941955566, "global_step": 502700, "epoch": 2992} {"train_loss": -12.639530181884766, "global_step": 502701, "epoch": 2992} {"train_loss": -12.654769897460938, "global_step": 502702, "epoch": 2992} {"train_loss": -12.594541549682617, "global_step": 502703, "epoch": 2992} {"train_loss": -12.693293571472168, "global_step": 502704, "epoch": 2992} {"train_loss": -12.645781517028809, "global_step": 502705, "epoch": 2992} {"train_loss": -12.718753814697266, "global_step": 502706, "epoch": 2992} {"train_loss": -12.684247970581055, "global_step": 502707, "epoch": 2992} {"train_loss": -12.556885719299316, "global_step": 502708, "epoch": 2992} {"train_loss": -12.626144409179688, "global_step": 502709, "epoch": 2992} {"train_loss": -12.698272705078125, "global_step": 502710, "epoch": 2992} {"train_loss": -12.711669921875, "global_step": 502711, "epoch": 2992} {"train_loss": -12.644247055053711, "global_step": 502712, "epoch": 2992} {"train_loss": -12.802153587341309, "global_step": 502713, "epoch": 2992} {"train_loss": -12.77131462097168, "global_step": 502714, "epoch": 2992} {"train_loss": -12.783706665039062, "global_step": 502715, "epoch": 2992} {"train_loss": -12.863664627075195, "global_step": 502716, "epoch": 2992} {"train_loss": -12.81330394744873, "global_step": 502717, "epoch": 2992} {"train_loss": -12.84555721282959, "global_step": 502718, "epoch": 2992} {"train_loss": -12.795449256896973, "global_step": 502719, "epoch": 2992} {"train_loss": -12.748617172241211, "global_step": 502720, "epoch": 2992} {"train_loss": -12.850252151489258, "global_step": 502721, "epoch": 2992} {"train_loss": -12.680838584899902, "global_step": 502722, "epoch": 2992} {"train_loss": -12.880022048950195, "global_step": 502723, "epoch": 2992} {"train_loss": -12.810295104980469, "global_step": 502724, "epoch": 2992} {"train_loss": -12.934225082397461, "global_step": 502725, "epoch": 2992} {"train_loss": -12.712559700012207, "global_step": 502726, "epoch": 2992} {"train_loss": -12.822192192077637, "global_step": 502727, "epoch": 2992} {"train_loss": -12.737512588500977, "global_step": 502728, "epoch": 2992} {"train_loss": -12.705516815185547, "global_step": 502729, "epoch": 2992} {"train_loss": -12.901708602905273, "global_step": 502730, "epoch": 2992} {"train_loss": -12.855304718017578, "global_step": 502731, "epoch": 2992} {"train_loss": -12.816360473632812, "global_step": 502732, "epoch": 2992} {"train_loss": -12.969279289245605, "global_step": 502733, "epoch": 2992} {"train_loss": -12.976471900939941, "global_step": 502734, "epoch": 2992} {"train_loss": -12.97266960144043, "global_step": 502735, "epoch": 2992} {"train_loss": -13.138233184814453, "global_step": 502736, "epoch": 2992} {"train_loss": -12.859231948852539, "global_step": 502737, "epoch": 2992} {"train_loss": -12.960212707519531, "global_step": 502738, "epoch": 2992} {"train_loss": -13.109386444091797, "global_step": 502739, "epoch": 2992} {"train_loss": -13.012102127075195, "global_step": 502740, "epoch": 2992} {"train_loss": -12.952951431274414, "global_step": 502741, "epoch": 2992} {"train_loss": -12.940074920654297, "global_step": 502742, "epoch": 2992} {"train_loss": -13.07734489440918, "global_step": 502743, "epoch": 2992} {"train_loss": -12.785573959350586, "global_step": 502744, "epoch": 2992} {"train_loss": -13.016632080078125, "global_step": 502745, "epoch": 2992} {"train_loss": -12.725053787231445, "global_step": 502746, "epoch": 2992} {"train_loss": -12.827909469604492, "global_step": 502747, "epoch": 2992} {"train_loss": -12.74790096282959, "global_step": 502748, "epoch": 2992} {"train_loss": -12.971003532409668, "global_step": 502749, "epoch": 2992} {"train_loss": -12.830942153930664, "global_step": 502750, "epoch": 2992} {"train_loss": -12.721924781799316, "global_step": 502751, "epoch": 2992} {"train_loss": -12.992520332336426, "global_step": 502752, "epoch": 2992} {"train_loss": -12.894317626953125, "global_step": 502753, "epoch": 2992} {"train_loss": -12.45186996459961, "global_step": 502754, "epoch": 2992} {"train_loss": -12.848923683166504, "global_step": 502755, "epoch": 2992} {"train_loss": -12.669427871704102, "global_step": 502756, "epoch": 2992} {"train_loss": -12.415104866027832, "global_step": 502757, "epoch": 2992} {"train_loss": -12.710922241210938, "global_step": 502758, "epoch": 2992} {"train_loss": -12.694011688232422, "global_step": 502759, "epoch": 2992} {"train_loss": -12.632373809814453, "global_step": 502760, "epoch": 2992} {"train_loss": -12.730737686157227, "global_step": 502761, "epoch": 2992} {"train_loss": -12.928840637207031, "global_step": 502762, "epoch": 2992} {"train_loss": -12.930712699890137, "global_step": 502763, "epoch": 2992} {"train_loss": -12.643657684326172, "global_step": 502764, "epoch": 2992} {"train_loss": -12.985651969909668, "global_step": 502765, "epoch": 2992} {"train_loss": -12.9888916015625, "global_step": 502766, "epoch": 2992} {"train_loss": -12.769282341003418, "global_step": 502767, "epoch": 2992} {"train_loss": -12.649678230285645, "global_step": 502768, "epoch": 2992} {"train_loss": -12.949044227600098, "global_step": 502769, "epoch": 2992} {"train_loss": -12.87765121459961, "global_step": 502770, "epoch": 2992} {"train_loss": -12.893189430236816, "global_step": 502771, "epoch": 2992} {"train_loss": -12.836962699890137, "global_step": 502772, "epoch": 2992} {"train_loss": -13.215045928955078, "global_step": 502773, "epoch": 2992} {"train_loss": -12.533763885498047, "global_step": 502774, "epoch": 2992} {"train_loss": -12.458831787109375, "global_step": 502775, "epoch": 2992} {"train_loss": -12.146217346191406, "global_step": 502776, "epoch": 2992} {"train_loss": -12.631911277770996, "global_step": 502777, "epoch": 2992} {"train_loss": -12.61245346069336, "global_step": 502778, "epoch": 2992} {"train_loss": -12.731346130371094, "global_step": 502779, "epoch": 2992} {"train_loss": -11.628400802612305, "global_step": 502780, "epoch": 2992} {"train_loss": -12.426756858825684, "global_step": 502781, "epoch": 2992} {"train_loss": -12.409425735473633, "global_step": 502782, "epoch": 2992} {"train_loss": -11.2150297164917, "global_step": 502783, "epoch": 2992} {"train_loss": -11.797323226928711, "global_step": 502784, "epoch": 2992} {"train_loss": -12.0027437210083, "global_step": 502785, "epoch": 2992} {"train_loss": -12.135791778564453, "global_step": 502786, "epoch": 2992} {"train_loss": -11.90505313873291, "global_step": 502787, "epoch": 2992} {"train_loss": -11.399128913879395, "global_step": 502788, "epoch": 2992} {"train_loss": -11.83071231842041, "global_step": 502789, "epoch": 2992} {"train_loss": -11.71381950378418, "global_step": 502790, "epoch": 2992} {"train_loss": -11.916197776794434, "global_step": 502791, "epoch": 2992} {"train_loss": -11.251364707946777, "global_step": 502792, "epoch": 2992} {"train_loss": -12.256717681884766, "global_step": 502793, "epoch": 2992} {"train_loss": -11.671404838562012, "global_step": 502794, "epoch": 2992} {"train_loss": -11.847062110900879, "global_step": 502795, "epoch": 2992} {"train_loss": -12.318865776062012, "global_step": 502796, "epoch": 2992} {"train_loss": -12.030017852783203, "global_step": 502797, "epoch": 2992} {"train_loss": -12.002447128295898, "global_step": 502798, "epoch": 2992} {"train_loss": -12.39535140991211, "global_step": 502799, "epoch": 2992} {"train_loss": -12.44845199584961, "global_step": 502800, "epoch": 2992} {"train_loss": -12.192543029785156, "global_step": 502801, "epoch": 2992} {"train_loss": -12.454629898071289, "global_step": 502802, "epoch": 2992} {"train_loss": -12.596713066101074, "global_step": 502803, "epoch": 2992} {"train_loss": -12.588571548461914, "global_step": 502804, "epoch": 2992} {"train_loss": -12.367154121398926, "global_step": 502805, "epoch": 2992} {"train_loss": -12.667006492614746, "global_step": 502806, "epoch": 2992} {"train_loss": -12.440242767333984, "global_step": 502807, "epoch": 2992} {"train_loss": -12.593961715698242, "global_step": 502808, "epoch": 2992} {"train_loss": -12.35983943939209, "global_step": 502809, "epoch": 2992} {"train_loss": -12.145526885986328, "global_step": 502810, "epoch": 2992} {"train_loss": -12.329927444458008, "global_step": 502811, "epoch": 2992} {"train_loss": -12.339841842651367, "global_step": 502812, "epoch": 2992} {"train_loss": -11.105592727661133, "global_step": 502813, "epoch": 2992} {"train_loss": -12.41455078125, "global_step": 502814, "epoch": 2992} {"train_loss": -11.838953018188477, "global_step": 502815, "epoch": 2992} {"train_loss": -11.527331352233887, "global_step": 502816, "epoch": 2992} {"train_loss": -12.76965618133545, "global_step": 502817, "epoch": 2992} {"train_loss": -12.148327827453613, "global_step": 502818, "epoch": 2992} {"train_loss": -12.581262588500977, "global_step": 502819, "epoch": 2992} {"train_loss": -12.735116958618164, "global_step": 502820, "epoch": 2992} {"train_loss": -12.501786231994629, "global_step": 502821, "epoch": 2992} {"train_loss": -12.078349113464355, "global_step": 502822, "epoch": 2992} {"train_loss": -12.460456479163398, "global_step": 502823, "epoch": 2992, "val_loss": 316407.96875} {"train_loss": -12.565353393554688, "global_step": 502824, "epoch": 2993} {"train_loss": -12.552720069885254, "global_step": 502825, "epoch": 2993} {"train_loss": -12.09396743774414, "global_step": 502826, "epoch": 2993} {"train_loss": -12.618046760559082, "global_step": 502827, "epoch": 2993} {"train_loss": -12.411044120788574, "global_step": 502828, "epoch": 2993} {"train_loss": -12.509082794189453, "global_step": 502829, "epoch": 2993} {"train_loss": -12.441875457763672, "global_step": 502830, "epoch": 2993} {"train_loss": -12.769671440124512, "global_step": 502831, "epoch": 2993} {"train_loss": -12.272937774658203, "global_step": 502832, "epoch": 2993} {"train_loss": -12.070606231689453, "global_step": 502833, "epoch": 2993} {"train_loss": -12.482892990112305, "global_step": 502834, "epoch": 2993} {"train_loss": -12.07760238647461, "global_step": 502835, "epoch": 2993} {"train_loss": -12.584964752197266, "global_step": 502836, "epoch": 2993} {"train_loss": -12.75106430053711, "global_step": 502837, "epoch": 2993} {"train_loss": -12.252861022949219, "global_step": 502838, "epoch": 2993} {"train_loss": -12.527505874633789, "global_step": 502839, "epoch": 2993} {"train_loss": -12.764656066894531, "global_step": 502840, "epoch": 2993} {"train_loss": -12.918230056762695, "global_step": 502841, "epoch": 2993} {"train_loss": -12.465798377990723, "global_step": 502842, "epoch": 2993} {"train_loss": -12.718147277832031, "global_step": 502843, "epoch": 2993} {"train_loss": -12.73508071899414, "global_step": 502844, "epoch": 2993} {"train_loss": -12.676555633544922, "global_step": 502845, "epoch": 2993} {"train_loss": -12.606974601745605, "global_step": 502846, "epoch": 2993} {"train_loss": -12.292815208435059, "global_step": 502847, "epoch": 2993} {"train_loss": -12.635196685791016, "global_step": 502848, "epoch": 2993} {"train_loss": -12.450435638427734, "global_step": 502849, "epoch": 2993} {"train_loss": -12.200542449951172, "global_step": 502850, "epoch": 2993} {"train_loss": -12.800883293151855, "global_step": 502851, "epoch": 2993} {"train_loss": -12.131430625915527, "global_step": 502852, "epoch": 2993} {"train_loss": -12.447677612304688, "global_step": 502853, "epoch": 2993} {"train_loss": -12.627275466918945, "global_step": 502854, "epoch": 2993} {"train_loss": -12.593398094177246, "global_step": 502855, "epoch": 2993} {"train_loss": -12.451847076416016, "global_step": 502856, "epoch": 2993} {"train_loss": -12.520267486572266, "global_step": 502857, "epoch": 2993} {"train_loss": -12.636829376220703, "global_step": 502858, "epoch": 2993} {"train_loss": -12.69204330444336, "global_step": 502859, "epoch": 2993} {"train_loss": -12.752265930175781, "global_step": 502860, "epoch": 2993} {"train_loss": -12.389633178710938, "global_step": 502861, "epoch": 2993} {"train_loss": -12.481894493103027, "global_step": 502862, "epoch": 2993} {"train_loss": -12.509893417358398, "global_step": 502863, "epoch": 2993} {"train_loss": -12.273954391479492, "global_step": 502864, "epoch": 2993} {"train_loss": -12.49416732788086, "global_step": 502865, "epoch": 2993} {"train_loss": -12.366899490356445, "global_step": 502866, "epoch": 2993} {"train_loss": -12.931964874267578, "global_step": 502867, "epoch": 2993} {"train_loss": -11.89413833618164, "global_step": 502868, "epoch": 2993} {"train_loss": -12.31067180633545, "global_step": 502869, "epoch": 2993} {"train_loss": -12.557622909545898, "global_step": 502870, "epoch": 2993} {"train_loss": -12.544364929199219, "global_step": 502871, "epoch": 2993} {"train_loss": -12.485994338989258, "global_step": 502872, "epoch": 2993} {"train_loss": -11.671052932739258, "global_step": 502873, "epoch": 2993} {"train_loss": -12.45995044708252, "global_step": 502874, "epoch": 2993} {"train_loss": -12.191732406616211, "global_step": 502875, "epoch": 2993} {"train_loss": -12.97488021850586, "global_step": 502876, "epoch": 2993} {"train_loss": -12.486587524414062, "global_step": 502877, "epoch": 2993} {"train_loss": -12.096592903137207, "global_step": 502878, "epoch": 2993} {"train_loss": -12.213722229003906, "global_step": 502879, "epoch": 2993} {"train_loss": -12.735740661621094, "global_step": 502880, "epoch": 2993} {"train_loss": -12.09061050415039, "global_step": 502881, "epoch": 2993} {"train_loss": -11.789207458496094, "global_step": 502882, "epoch": 2993} {"train_loss": -12.077933311462402, "global_step": 502883, "epoch": 2993} {"train_loss": -12.42740249633789, "global_step": 502884, "epoch": 2993} {"train_loss": -11.75780963897705, "global_step": 502885, "epoch": 2993} {"train_loss": -11.812644004821777, "global_step": 502886, "epoch": 2993} {"train_loss": -11.900341033935547, "global_step": 502887, "epoch": 2993} {"train_loss": -11.222095489501953, "global_step": 502888, "epoch": 2993} {"train_loss": -12.745150566101074, "global_step": 502889, "epoch": 2993} {"train_loss": -11.288148880004883, "global_step": 502890, "epoch": 2993} {"train_loss": -12.17148208618164, "global_step": 502891, "epoch": 2993} {"train_loss": -12.143539428710938, "global_step": 502892, "epoch": 2993} {"train_loss": -12.171308517456055, "global_step": 502893, "epoch": 2993} {"train_loss": -12.724176406860352, "global_step": 502894, "epoch": 2993} {"train_loss": -11.861112594604492, "global_step": 502895, "epoch": 2993} {"train_loss": -12.817913055419922, "global_step": 502896, "epoch": 2993} {"train_loss": -11.655187606811523, "global_step": 502897, "epoch": 2993} {"train_loss": -12.090038299560547, "global_step": 502898, "epoch": 2993} {"train_loss": -11.580955505371094, "global_step": 502899, "epoch": 2993} {"train_loss": -12.340104103088379, "global_step": 502900, "epoch": 2993} {"train_loss": -12.080940246582031, "global_step": 502901, "epoch": 2993} {"train_loss": -12.479233741760254, "global_step": 502902, "epoch": 2993} {"train_loss": -11.897315979003906, "global_step": 502903, "epoch": 2993} {"train_loss": -11.856014251708984, "global_step": 502904, "epoch": 2993} {"train_loss": -11.713982582092285, "global_step": 502905, "epoch": 2993} {"train_loss": -10.615631103515625, "global_step": 502906, "epoch": 2993} {"train_loss": -12.003841400146484, "global_step": 502907, "epoch": 2993} {"train_loss": -10.729986190795898, "global_step": 502908, "epoch": 2993} {"train_loss": -11.39603042602539, "global_step": 502909, "epoch": 2993} {"train_loss": -11.291486740112305, "global_step": 502910, "epoch": 2993} {"train_loss": -11.034549713134766, "global_step": 502911, "epoch": 2993} {"train_loss": -12.3399076461792, "global_step": 502912, "epoch": 2993} {"train_loss": -9.5108060836792, "global_step": 502913, "epoch": 2993} {"train_loss": -11.274154663085938, "global_step": 502914, "epoch": 2993} {"train_loss": -8.615798950195312, "global_step": 502915, "epoch": 2993} {"train_loss": -9.940643310546875, "global_step": 502916, "epoch": 2993} {"train_loss": -10.292299270629883, "global_step": 502917, "epoch": 2993} {"train_loss": -9.311677932739258, "global_step": 502918, "epoch": 2993} {"train_loss": -9.071266174316406, "global_step": 502919, "epoch": 2993} {"train_loss": -8.185443878173828, "global_step": 502920, "epoch": 2993} {"train_loss": -8.436933517456055, "global_step": 502921, "epoch": 2993} {"train_loss": -9.619836807250977, "global_step": 502922, "epoch": 2993} {"train_loss": -9.398665428161621, "global_step": 502923, "epoch": 2993} {"train_loss": -9.483871459960938, "global_step": 502924, "epoch": 2993} {"train_loss": -9.98930549621582, "global_step": 502925, "epoch": 2993} {"train_loss": -9.58799934387207, "global_step": 502926, "epoch": 2993} {"train_loss": -10.269248008728027, "global_step": 502927, "epoch": 2993} {"train_loss": -10.094419479370117, "global_step": 502928, "epoch": 2993} {"train_loss": -9.350200653076172, "global_step": 502929, "epoch": 2993} {"train_loss": -10.361579895019531, "global_step": 502930, "epoch": 2993} {"train_loss": -9.599540710449219, "global_step": 502931, "epoch": 2993} {"train_loss": -10.870911598205566, "global_step": 502932, "epoch": 2993} {"train_loss": -9.968315124511719, "global_step": 502933, "epoch": 2993} {"train_loss": -11.31618595123291, "global_step": 502934, "epoch": 2993} {"train_loss": -10.608002662658691, "global_step": 502935, "epoch": 2993} {"train_loss": -11.722100257873535, "global_step": 502936, "epoch": 2993} {"train_loss": -10.277785301208496, "global_step": 502937, "epoch": 2993} {"train_loss": -11.522064208984375, "global_step": 502938, "epoch": 2993} {"train_loss": -10.842523574829102, "global_step": 502939, "epoch": 2993} {"train_loss": -10.949604034423828, "global_step": 502940, "epoch": 2993} {"train_loss": -10.675731658935547, "global_step": 502941, "epoch": 2993} {"train_loss": -10.638105392456055, "global_step": 502942, "epoch": 2993} {"train_loss": -11.211762428283691, "global_step": 502943, "epoch": 2993} {"train_loss": -11.219423294067383, "global_step": 502944, "epoch": 2993} {"train_loss": -11.26246452331543, "global_step": 502945, "epoch": 2993} {"train_loss": -11.661042213439941, "global_step": 502946, "epoch": 2993} {"train_loss": -10.757063865661621, "global_step": 502947, "epoch": 2993} {"train_loss": -12.094196319580078, "global_step": 502948, "epoch": 2993} {"train_loss": -11.215391159057617, "global_step": 502949, "epoch": 2993} {"train_loss": -11.623472213745117, "global_step": 502950, "epoch": 2993} {"train_loss": -11.881097793579102, "global_step": 502951, "epoch": 2993} {"train_loss": -11.708367347717285, "global_step": 502952, "epoch": 2993} {"train_loss": -11.99190902709961, "global_step": 502953, "epoch": 2993} {"train_loss": -11.935901641845703, "global_step": 502954, "epoch": 2993} {"train_loss": -12.116249084472656, "global_step": 502955, "epoch": 2993} {"train_loss": -12.256006240844727, "global_step": 502956, "epoch": 2993} {"train_loss": -11.820379257202148, "global_step": 502957, "epoch": 2993} {"train_loss": -11.927787780761719, "global_step": 502958, "epoch": 2993} {"train_loss": -12.243416786193848, "global_step": 502959, "epoch": 2993} {"train_loss": -12.14084243774414, "global_step": 502960, "epoch": 2993} {"train_loss": -11.995323181152344, "global_step": 502961, "epoch": 2993} {"train_loss": -12.279549598693848, "global_step": 502962, "epoch": 2993} {"train_loss": -12.263395309448242, "global_step": 502963, "epoch": 2993} {"train_loss": -12.174842834472656, "global_step": 502964, "epoch": 2993} {"train_loss": -12.266302108764648, "global_step": 502965, "epoch": 2993} {"train_loss": -12.45184326171875, "global_step": 502966, "epoch": 2993} {"train_loss": -12.459421157836914, "global_step": 502967, "epoch": 2993} {"train_loss": -12.218181610107422, "global_step": 502968, "epoch": 2993} {"train_loss": -12.356473922729492, "global_step": 502969, "epoch": 2993} {"train_loss": -12.508459091186523, "global_step": 502970, "epoch": 2993} {"train_loss": -12.449502944946289, "global_step": 502971, "epoch": 2993} {"train_loss": -12.195775985717773, "global_step": 502972, "epoch": 2993} {"train_loss": -12.243049621582031, "global_step": 502973, "epoch": 2993} {"train_loss": -12.749526977539062, "global_step": 502974, "epoch": 2993} {"train_loss": -12.233694076538086, "global_step": 502975, "epoch": 2993} {"train_loss": -12.669358253479004, "global_step": 502976, "epoch": 2993} {"train_loss": -12.240860939025879, "global_step": 502977, "epoch": 2993} {"train_loss": -12.438321113586426, "global_step": 502978, "epoch": 2993} {"train_loss": -12.265871047973633, "global_step": 502979, "epoch": 2993} {"train_loss": -12.546278953552246, "global_step": 502980, "epoch": 2993} {"train_loss": -12.494242668151855, "global_step": 502981, "epoch": 2993} {"train_loss": -12.472968101501465, "global_step": 502982, "epoch": 2993} {"train_loss": -12.503488540649414, "global_step": 502983, "epoch": 2993} {"train_loss": -12.799012184143066, "global_step": 502984, "epoch": 2993} {"train_loss": -12.605575561523438, "global_step": 502985, "epoch": 2993} {"train_loss": -12.534940719604492, "global_step": 502986, "epoch": 2993} {"train_loss": -12.455798149108887, "global_step": 502987, "epoch": 2993} {"train_loss": -12.542753219604492, "global_step": 502988, "epoch": 2993} {"train_loss": -12.446430206298828, "global_step": 502989, "epoch": 2993} {"train_loss": -12.662821769714355, "global_step": 502990, "epoch": 2993} {"train_loss": -11.840115643682934, "global_step": 502991, "epoch": 2993, "val_loss": 316237.40625} {"train_loss": -12.591035842895508, "global_step": 502992, "epoch": 2994} {"train_loss": -12.478227615356445, "global_step": 502993, "epoch": 2994} {"train_loss": -12.291748046875, "global_step": 502994, "epoch": 2994} {"train_loss": -12.823615074157715, "global_step": 502995, "epoch": 2994} {"train_loss": -12.478736877441406, "global_step": 502996, "epoch": 2994} {"train_loss": -12.74722957611084, "global_step": 502997, "epoch": 2994} {"train_loss": -12.742311477661133, "global_step": 502998, "epoch": 2994} {"train_loss": -12.632559776306152, "global_step": 502999, "epoch": 2994} {"train_loss": -12.771766662597656, "global_step": 503000, "epoch": 2994} {"train_loss": -12.7946195602417, "global_step": 503001, "epoch": 2994} {"train_loss": -12.649065017700195, "global_step": 503002, "epoch": 2994} {"train_loss": -12.83650016784668, "global_step": 503003, "epoch": 2994} {"train_loss": -12.631897926330566, "global_step": 503004, "epoch": 2994} {"train_loss": -12.73964786529541, "global_step": 503005, "epoch": 2994} {"train_loss": -12.723526954650879, "global_step": 503006, "epoch": 2994} {"train_loss": -12.79155158996582, "global_step": 503007, "epoch": 2994} {"train_loss": -12.818218231201172, "global_step": 503008, "epoch": 2994} {"train_loss": -12.760990142822266, "global_step": 503009, "epoch": 2994} {"train_loss": -12.532352447509766, "global_step": 503010, "epoch": 2994} {"train_loss": -12.791050910949707, "global_step": 503011, "epoch": 2994} {"train_loss": -12.535764694213867, "global_step": 503012, "epoch": 2994} {"train_loss": -12.861530303955078, "global_step": 503013, "epoch": 2994} {"train_loss": -12.8505220413208, "global_step": 503014, "epoch": 2994} {"train_loss": -12.691300392150879, "global_step": 503015, "epoch": 2994} {"train_loss": -12.732057571411133, "global_step": 503016, "epoch": 2994} {"train_loss": -12.791163444519043, "global_step": 503017, "epoch": 2994} {"train_loss": -12.690072059631348, "global_step": 503018, "epoch": 2994} {"train_loss": -12.639891624450684, "global_step": 503019, "epoch": 2994} {"train_loss": -12.953057289123535, "global_step": 503020, "epoch": 2994} {"train_loss": -12.826986312866211, "global_step": 503021, "epoch": 2994} {"train_loss": -12.983875274658203, "global_step": 503022, "epoch": 2994} {"train_loss": -12.756460189819336, "global_step": 503023, "epoch": 2994} {"train_loss": -12.888581275939941, "global_step": 503024, "epoch": 2994} {"train_loss": -12.986459732055664, "global_step": 503025, "epoch": 2994} {"train_loss": -12.947054862976074, "global_step": 503026, "epoch": 2994} {"train_loss": -12.796500205993652, "global_step": 503027, "epoch": 2994} {"train_loss": -12.758045196533203, "global_step": 503028, "epoch": 2994} {"train_loss": -12.629545211791992, "global_step": 503029, "epoch": 2994} {"train_loss": -12.8629150390625, "global_step": 503030, "epoch": 2994} {"train_loss": -12.772907257080078, "global_step": 503031, "epoch": 2994} {"train_loss": -12.81416130065918, "global_step": 503032, "epoch": 2994} {"train_loss": -12.928861618041992, "global_step": 503033, "epoch": 2994} {"train_loss": -12.999422073364258, "global_step": 503034, "epoch": 2994} {"train_loss": -12.788936614990234, "global_step": 503035, "epoch": 2994} {"train_loss": -12.407047271728516, "global_step": 503036, "epoch": 2994} {"train_loss": -12.845220565795898, "global_step": 503037, "epoch": 2994} {"train_loss": -12.521821975708008, "global_step": 503038, "epoch": 2994} {"train_loss": -12.975335121154785, "global_step": 503039, "epoch": 2994} {"train_loss": -12.817647933959961, "global_step": 503040, "epoch": 2994} {"train_loss": -12.744199752807617, "global_step": 503041, "epoch": 2994} {"train_loss": -12.896463394165039, "global_step": 503042, "epoch": 2994} {"train_loss": -13.079967498779297, "global_step": 503043, "epoch": 2994} {"train_loss": -12.700235366821289, "global_step": 503044, "epoch": 2994} {"train_loss": -12.701854705810547, "global_step": 503045, "epoch": 2994} {"train_loss": -12.878600120544434, "global_step": 503046, "epoch": 2994} {"train_loss": -12.914281845092773, "global_step": 503047, "epoch": 2994} {"train_loss": -12.820720672607422, "global_step": 503048, "epoch": 2994} {"train_loss": -12.876206398010254, "global_step": 503049, "epoch": 2994} {"train_loss": -13.008578300476074, "global_step": 503050, "epoch": 2994} {"train_loss": -12.923717498779297, "global_step": 503051, "epoch": 2994} {"train_loss": -12.86810302734375, "global_step": 503052, "epoch": 2994} {"train_loss": -12.734073638916016, "global_step": 503053, "epoch": 2994} {"train_loss": -12.385107040405273, "global_step": 503054, "epoch": 2994} {"train_loss": -12.900787353515625, "global_step": 503055, "epoch": 2994} {"train_loss": -12.759588241577148, "global_step": 503056, "epoch": 2994} {"train_loss": -12.590107917785645, "global_step": 503057, "epoch": 2994} {"train_loss": -12.606072425842285, "global_step": 503058, "epoch": 2994} {"train_loss": -12.945975303649902, "global_step": 503059, "epoch": 2994} {"train_loss": -12.214268684387207, "global_step": 503060, "epoch": 2994} {"train_loss": -12.363486289978027, "global_step": 503061, "epoch": 2994} {"train_loss": -12.061532974243164, "global_step": 503062, "epoch": 2994} {"train_loss": -12.277971267700195, "global_step": 503063, "epoch": 2994} {"train_loss": -11.849031448364258, "global_step": 503064, "epoch": 2994} {"train_loss": -12.248477935791016, "global_step": 503065, "epoch": 2994} {"train_loss": -12.91446304321289, "global_step": 503066, "epoch": 2994} {"train_loss": -12.450628280639648, "global_step": 503067, "epoch": 2994} {"train_loss": -12.316513061523438, "global_step": 503068, "epoch": 2994} {"train_loss": -12.85812759399414, "global_step": 503069, "epoch": 2994} {"train_loss": -12.427081108093262, "global_step": 503070, "epoch": 2994} {"train_loss": -12.142626762390137, "global_step": 503071, "epoch": 2994} {"train_loss": -12.744251251220703, "global_step": 503072, "epoch": 2994} {"train_loss": -12.447090148925781, "global_step": 503073, "epoch": 2994} {"train_loss": -12.04293441772461, "global_step": 503074, "epoch": 2994} {"train_loss": -11.742425918579102, "global_step": 503075, "epoch": 2994} {"train_loss": -12.256217956542969, "global_step": 503076, "epoch": 2994} {"train_loss": -11.746774673461914, "global_step": 503077, "epoch": 2994} {"train_loss": -12.03731918334961, "global_step": 503078, "epoch": 2994} {"train_loss": -11.711196899414062, "global_step": 503079, "epoch": 2994} {"train_loss": -12.382434844970703, "global_step": 503080, "epoch": 2994} {"train_loss": -11.525374412536621, "global_step": 503081, "epoch": 2994} {"train_loss": -12.407831192016602, "global_step": 503082, "epoch": 2994} {"train_loss": -12.448274612426758, "global_step": 503083, "epoch": 2994} {"train_loss": -12.30021858215332, "global_step": 503084, "epoch": 2994} {"train_loss": -11.811407089233398, "global_step": 503085, "epoch": 2994} {"train_loss": -12.616451263427734, "global_step": 503086, "epoch": 2994} {"train_loss": -11.864693641662598, "global_step": 503087, "epoch": 2994} {"train_loss": -12.317705154418945, "global_step": 503088, "epoch": 2994} {"train_loss": -11.885482788085938, "global_step": 503089, "epoch": 2994} {"train_loss": -11.772111892700195, "global_step": 503090, "epoch": 2994} {"train_loss": -11.77346420288086, "global_step": 503091, "epoch": 2994} {"train_loss": -12.061430931091309, "global_step": 503092, "epoch": 2994} {"train_loss": -12.252090454101562, "global_step": 503093, "epoch": 2994} {"train_loss": -12.105446815490723, "global_step": 503094, "epoch": 2994} {"train_loss": -12.650896072387695, "global_step": 503095, "epoch": 2994} {"train_loss": -12.029937744140625, "global_step": 503096, "epoch": 2994} {"train_loss": -11.995691299438477, "global_step": 503097, "epoch": 2994} {"train_loss": -12.219470977783203, "global_step": 503098, "epoch": 2994} {"train_loss": -11.748476028442383, "global_step": 503099, "epoch": 2994} {"train_loss": -12.168708801269531, "global_step": 503100, "epoch": 2994} {"train_loss": -12.32142448425293, "global_step": 503101, "epoch": 2994} {"train_loss": -12.52869987487793, "global_step": 503102, "epoch": 2994} {"train_loss": -11.791142463684082, "global_step": 503103, "epoch": 2994} {"train_loss": -12.362409591674805, "global_step": 503104, "epoch": 2994} {"train_loss": -12.181750297546387, "global_step": 503105, "epoch": 2994} {"train_loss": -11.44394588470459, "global_step": 503106, "epoch": 2994} {"train_loss": -12.478616714477539, "global_step": 503107, "epoch": 2994} {"train_loss": -11.522865295410156, "global_step": 503108, "epoch": 2994} {"train_loss": -11.731623649597168, "global_step": 503109, "epoch": 2994} {"train_loss": -11.366537094116211, "global_step": 503110, "epoch": 2994} {"train_loss": -12.325244903564453, "global_step": 503111, "epoch": 2994} {"train_loss": -11.593233108520508, "global_step": 503112, "epoch": 2994} {"train_loss": -11.554807662963867, "global_step": 503113, "epoch": 2994} {"train_loss": -11.665253639221191, "global_step": 503114, "epoch": 2994} {"train_loss": -12.251266479492188, "global_step": 503115, "epoch": 2994} {"train_loss": -12.614547729492188, "global_step": 503116, "epoch": 2994} {"train_loss": -11.999738693237305, "global_step": 503117, "epoch": 2994} {"train_loss": -12.689565658569336, "global_step": 503118, "epoch": 2994} {"train_loss": -12.31659984588623, "global_step": 503119, "epoch": 2994} {"train_loss": -12.07541275024414, "global_step": 503120, "epoch": 2994} {"train_loss": -12.478635787963867, "global_step": 503121, "epoch": 2994} {"train_loss": -12.1575288772583, "global_step": 503122, "epoch": 2994} {"train_loss": -12.694541931152344, "global_step": 503123, "epoch": 2994} {"train_loss": -12.030746459960938, "global_step": 503124, "epoch": 2994} {"train_loss": -12.242607116699219, "global_step": 503125, "epoch": 2994} {"train_loss": -12.675175666809082, "global_step": 503126, "epoch": 2994} {"train_loss": -12.414908409118652, "global_step": 503127, "epoch": 2994} {"train_loss": -12.720171928405762, "global_step": 503128, "epoch": 2994} {"train_loss": -12.29765510559082, "global_step": 503129, "epoch": 2994} {"train_loss": -12.861616134643555, "global_step": 503130, "epoch": 2994} {"train_loss": -12.300025939941406, "global_step": 503131, "epoch": 2994} {"train_loss": -12.550321578979492, "global_step": 503132, "epoch": 2994} {"train_loss": -12.639201164245605, "global_step": 503133, "epoch": 2994} {"train_loss": -12.170051574707031, "global_step": 503134, "epoch": 2994} {"train_loss": -11.844381332397461, "global_step": 503135, "epoch": 2994} {"train_loss": -12.44770622253418, "global_step": 503136, "epoch": 2994} {"train_loss": -11.943985939025879, "global_step": 503137, "epoch": 2994} {"train_loss": -11.63302993774414, "global_step": 503138, "epoch": 2994} {"train_loss": -12.634954452514648, "global_step": 503139, "epoch": 2994} {"train_loss": -11.91390323638916, "global_step": 503140, "epoch": 2994} {"train_loss": -11.548293113708496, "global_step": 503141, "epoch": 2994} {"train_loss": -12.672052383422852, "global_step": 503142, "epoch": 2994} {"train_loss": -12.166288375854492, "global_step": 503143, "epoch": 2994} {"train_loss": -12.712717056274414, "global_step": 503144, "epoch": 2994} {"train_loss": -12.374464988708496, "global_step": 503145, "epoch": 2994} {"train_loss": -12.666585922241211, "global_step": 503146, "epoch": 2994} {"train_loss": -12.390487670898438, "global_step": 503147, "epoch": 2994} {"train_loss": -12.1569242477417, "global_step": 503148, "epoch": 2994} {"train_loss": -12.599985122680664, "global_step": 503149, "epoch": 2994} {"train_loss": -11.979818344116211, "global_step": 503150, "epoch": 2994} {"train_loss": -12.290817260742188, "global_step": 503151, "epoch": 2994} {"train_loss": -12.283330917358398, "global_step": 503152, "epoch": 2994} {"train_loss": -12.768418312072754, "global_step": 503153, "epoch": 2994} {"train_loss": -12.355926513671875, "global_step": 503154, "epoch": 2994} {"train_loss": -12.426219940185547, "global_step": 503155, "epoch": 2994} {"train_loss": -12.509720802307129, "global_step": 503156, "epoch": 2994} {"train_loss": -11.987264633178711, "global_step": 503157, "epoch": 2994} {"train_loss": -12.38907241821289, "global_step": 503158, "epoch": 2994} {"train_loss": -12.432200829188028, "global_step": 503159, "epoch": 2994, "val_loss": 320387.71875} {"train_loss": -12.206724166870117, "global_step": 503160, "epoch": 2995} {"train_loss": -12.190067291259766, "global_step": 503161, "epoch": 2995} {"train_loss": -11.909444808959961, "global_step": 503162, "epoch": 2995} {"train_loss": -12.143239974975586, "global_step": 503163, "epoch": 2995} {"train_loss": -12.426616668701172, "global_step": 503164, "epoch": 2995} {"train_loss": -12.499074935913086, "global_step": 503165, "epoch": 2995} {"train_loss": -12.27669620513916, "global_step": 503166, "epoch": 2995} {"train_loss": -12.27275276184082, "global_step": 503167, "epoch": 2995} {"train_loss": -12.629785537719727, "global_step": 503168, "epoch": 2995} {"train_loss": -12.102495193481445, "global_step": 503169, "epoch": 2995} {"train_loss": -12.629217147827148, "global_step": 503170, "epoch": 2995} {"train_loss": -12.0935640335083, "global_step": 503171, "epoch": 2995} {"train_loss": -11.604497909545898, "global_step": 503172, "epoch": 2995} {"train_loss": -12.050533294677734, "global_step": 503173, "epoch": 2995} {"train_loss": -12.078880310058594, "global_step": 503174, "epoch": 2995} {"train_loss": -11.090873718261719, "global_step": 503175, "epoch": 2995} {"train_loss": -12.01018238067627, "global_step": 503176, "epoch": 2995} {"train_loss": -12.145977973937988, "global_step": 503177, "epoch": 2995} {"train_loss": -11.910707473754883, "global_step": 503178, "epoch": 2995} {"train_loss": -11.8076171875, "global_step": 503179, "epoch": 2995} {"train_loss": -11.00042724609375, "global_step": 503180, "epoch": 2995} {"train_loss": -11.40838623046875, "global_step": 503181, "epoch": 2995} {"train_loss": -11.084794998168945, "global_step": 503182, "epoch": 2995} {"train_loss": -11.919038772583008, "global_step": 503183, "epoch": 2995} {"train_loss": -11.370588302612305, "global_step": 503184, "epoch": 2995} {"train_loss": -12.143026351928711, "global_step": 503185, "epoch": 2995} {"train_loss": -12.221396446228027, "global_step": 503186, "epoch": 2995} {"train_loss": -12.568193435668945, "global_step": 503187, "epoch": 2995} {"train_loss": -12.127636909484863, "global_step": 503188, "epoch": 2995} {"train_loss": -12.675485610961914, "global_step": 503189, "epoch": 2995} {"train_loss": -12.359576225280762, "global_step": 503190, "epoch": 2995} {"train_loss": -12.102478981018066, "global_step": 503191, "epoch": 2995} {"train_loss": -12.69029426574707, "global_step": 503192, "epoch": 2995} {"train_loss": -12.3770170211792, "global_step": 503193, "epoch": 2995} {"train_loss": -12.549701690673828, "global_step": 503194, "epoch": 2995} {"train_loss": -12.650681495666504, "global_step": 503195, "epoch": 2995} {"train_loss": -12.339530944824219, "global_step": 503196, "epoch": 2995} {"train_loss": -12.777942657470703, "global_step": 503197, "epoch": 2995} {"train_loss": -12.792102813720703, "global_step": 503198, "epoch": 2995} {"train_loss": -12.895870208740234, "global_step": 503199, "epoch": 2995} {"train_loss": -12.847660064697266, "global_step": 503200, "epoch": 2995} {"train_loss": -12.815339088439941, "global_step": 503201, "epoch": 2995} {"train_loss": -12.476334571838379, "global_step": 503202, "epoch": 2995} {"train_loss": -12.726016998291016, "global_step": 503203, "epoch": 2995} {"train_loss": -12.697765350341797, "global_step": 503204, "epoch": 2995} {"train_loss": -12.983997344970703, "global_step": 503205, "epoch": 2995} {"train_loss": -12.77042293548584, "global_step": 503206, "epoch": 2995} {"train_loss": -12.882514953613281, "global_step": 503207, "epoch": 2995} {"train_loss": -12.892803192138672, "global_step": 503208, "epoch": 2995} {"train_loss": -12.864081382751465, "global_step": 503209, "epoch": 2995} {"train_loss": -12.759422302246094, "global_step": 503210, "epoch": 2995} {"train_loss": -13.00579833984375, "global_step": 503211, "epoch": 2995} {"train_loss": -12.976564407348633, "global_step": 503212, "epoch": 2995} {"train_loss": -12.758767127990723, "global_step": 503213, "epoch": 2995} {"train_loss": -12.748071670532227, "global_step": 503214, "epoch": 2995} {"train_loss": -13.091744422912598, "global_step": 503215, "epoch": 2995} {"train_loss": -13.116415023803711, "global_step": 503216, "epoch": 2995} {"train_loss": -12.893415451049805, "global_step": 503217, "epoch": 2995} {"train_loss": -13.044553756713867, "global_step": 503218, "epoch": 2995} {"train_loss": -12.86923599243164, "global_step": 503219, "epoch": 2995} {"train_loss": -12.952573776245117, "global_step": 503220, "epoch": 2995} {"train_loss": -13.004396438598633, "global_step": 503221, "epoch": 2995} {"train_loss": -13.023366928100586, "global_step": 503222, "epoch": 2995} {"train_loss": -12.915664672851562, "global_step": 503223, "epoch": 2995} {"train_loss": -12.81845474243164, "global_step": 503224, "epoch": 2995} {"train_loss": -12.627342224121094, "global_step": 503225, "epoch": 2995} {"train_loss": -13.041559219360352, "global_step": 503226, "epoch": 2995} {"train_loss": -12.466588020324707, "global_step": 503227, "epoch": 2995} {"train_loss": -12.193815231323242, "global_step": 503228, "epoch": 2995} {"train_loss": -12.728177070617676, "global_step": 503229, "epoch": 2995} {"train_loss": -12.925570487976074, "global_step": 503230, "epoch": 2995} {"train_loss": -12.561397552490234, "global_step": 503231, "epoch": 2995} {"train_loss": -13.049571990966797, "global_step": 503232, "epoch": 2995} {"train_loss": -12.73994255065918, "global_step": 503233, "epoch": 2995} {"train_loss": -12.822465896606445, "global_step": 503234, "epoch": 2995} {"train_loss": -12.5963716506958, "global_step": 503235, "epoch": 2995} {"train_loss": -12.969482421875, "global_step": 503236, "epoch": 2995} {"train_loss": -12.495817184448242, "global_step": 503237, "epoch": 2995} {"train_loss": -13.035529136657715, "global_step": 503238, "epoch": 2995} {"train_loss": -12.509239196777344, "global_step": 503239, "epoch": 2995} {"train_loss": -12.75531005859375, "global_step": 503240, "epoch": 2995} {"train_loss": -12.704243659973145, "global_step": 503241, "epoch": 2995} {"train_loss": -12.478446006774902, "global_step": 503242, "epoch": 2995} {"train_loss": -12.863138198852539, "global_step": 503243, "epoch": 2995} {"train_loss": -12.529683113098145, "global_step": 503244, "epoch": 2995} {"train_loss": -12.70479965209961, "global_step": 503245, "epoch": 2995} {"train_loss": -12.869245529174805, "global_step": 503246, "epoch": 2995} {"train_loss": -12.791872024536133, "global_step": 503247, "epoch": 2995} {"train_loss": -11.979713439941406, "global_step": 503248, "epoch": 2995} {"train_loss": -12.523504257202148, "global_step": 503249, "epoch": 2995} {"train_loss": -11.928077697753906, "global_step": 503250, "epoch": 2995} {"train_loss": -11.872974395751953, "global_step": 503251, "epoch": 2995} {"train_loss": -12.39864730834961, "global_step": 503252, "epoch": 2995} {"train_loss": -13.087902069091797, "global_step": 503253, "epoch": 2995} {"train_loss": -12.675113677978516, "global_step": 503254, "epoch": 2995} {"train_loss": -12.44014835357666, "global_step": 503255, "epoch": 2995} {"train_loss": -12.823189735412598, "global_step": 503256, "epoch": 2995} {"train_loss": -12.779336929321289, "global_step": 503257, "epoch": 2995} {"train_loss": -12.357734680175781, "global_step": 503258, "epoch": 2995} {"train_loss": -12.398534774780273, "global_step": 503259, "epoch": 2995} {"train_loss": -12.189139366149902, "global_step": 503260, "epoch": 2995} {"train_loss": -12.957715034484863, "global_step": 503261, "epoch": 2995} {"train_loss": -12.719473838806152, "global_step": 503262, "epoch": 2995} {"train_loss": -12.508995056152344, "global_step": 503263, "epoch": 2995} {"train_loss": -12.516681671142578, "global_step": 503264, "epoch": 2995} {"train_loss": -12.820050239562988, "global_step": 503265, "epoch": 2995} {"train_loss": -12.380115509033203, "global_step": 503266, "epoch": 2995} {"train_loss": -11.973684310913086, "global_step": 503267, "epoch": 2995} {"train_loss": -11.878046035766602, "global_step": 503268, "epoch": 2995} {"train_loss": -12.619890213012695, "global_step": 503269, "epoch": 2995} {"train_loss": -12.750025749206543, "global_step": 503270, "epoch": 2995} {"train_loss": -12.57014274597168, "global_step": 503271, "epoch": 2995} {"train_loss": -12.662405014038086, "global_step": 503272, "epoch": 2995} {"train_loss": -12.405189514160156, "global_step": 503273, "epoch": 2995} {"train_loss": -11.510119438171387, "global_step": 503274, "epoch": 2995} {"train_loss": -12.349701881408691, "global_step": 503275, "epoch": 2995} {"train_loss": -11.758055686950684, "global_step": 503276, "epoch": 2995} {"train_loss": -12.472331047058105, "global_step": 503277, "epoch": 2995} {"train_loss": -11.593896865844727, "global_step": 503278, "epoch": 2995} {"train_loss": -12.29944133758545, "global_step": 503279, "epoch": 2995} {"train_loss": -12.634784698486328, "global_step": 503280, "epoch": 2995} {"train_loss": -12.649274826049805, "global_step": 503281, "epoch": 2995} {"train_loss": -11.610447883605957, "global_step": 503282, "epoch": 2995} {"train_loss": -12.541556358337402, "global_step": 503283, "epoch": 2995} {"train_loss": -12.59707260131836, "global_step": 503284, "epoch": 2995} {"train_loss": -11.651893615722656, "global_step": 503285, "epoch": 2995} {"train_loss": -10.99450969696045, "global_step": 503286, "epoch": 2995} {"train_loss": -11.504545211791992, "global_step": 503287, "epoch": 2995} {"train_loss": -9.801896095275879, "global_step": 503288, "epoch": 2995} {"train_loss": -12.014690399169922, "global_step": 503289, "epoch": 2995} {"train_loss": -8.822959899902344, "global_step": 503290, "epoch": 2995} {"train_loss": -9.021859169006348, "global_step": 503291, "epoch": 2995} {"train_loss": -8.632974624633789, "global_step": 503292, "epoch": 2995} {"train_loss": -9.17673110961914, "global_step": 503293, "epoch": 2995} {"train_loss": -9.80846881866455, "global_step": 503294, "epoch": 2995} {"train_loss": -9.454874992370605, "global_step": 503295, "epoch": 2995} {"train_loss": -8.49815559387207, "global_step": 503296, "epoch": 2995} {"train_loss": -9.230066299438477, "global_step": 503297, "epoch": 2995} {"train_loss": -9.67265510559082, "global_step": 503298, "epoch": 2995} {"train_loss": -8.756677627563477, "global_step": 503299, "epoch": 2995} {"train_loss": -10.695270538330078, "global_step": 503300, "epoch": 2995} {"train_loss": -10.238265991210938, "global_step": 503301, "epoch": 2995} {"train_loss": -9.072985649108887, "global_step": 503302, "epoch": 2995} {"train_loss": -9.714543342590332, "global_step": 503303, "epoch": 2995} {"train_loss": -9.954663276672363, "global_step": 503304, "epoch": 2995} {"train_loss": -9.129085540771484, "global_step": 503305, "epoch": 2995} {"train_loss": -9.738373756408691, "global_step": 503306, "epoch": 2995} {"train_loss": -10.374963760375977, "global_step": 503307, "epoch": 2995} {"train_loss": -10.467226028442383, "global_step": 503308, "epoch": 2995} {"train_loss": -10.553171157836914, "global_step": 503309, "epoch": 2995} {"train_loss": -11.309728622436523, "global_step": 503310, "epoch": 2995} {"train_loss": -11.081631660461426, "global_step": 503311, "epoch": 2995} {"train_loss": -10.817317962646484, "global_step": 503312, "epoch": 2995} {"train_loss": -10.597757339477539, "global_step": 503313, "epoch": 2995} {"train_loss": -11.490645408630371, "global_step": 503314, "epoch": 2995} {"train_loss": -11.517023086547852, "global_step": 503315, "epoch": 2995} {"train_loss": -11.364660263061523, "global_step": 503316, "epoch": 2995} {"train_loss": -10.89577865600586, "global_step": 503317, "epoch": 2995} {"train_loss": -11.265131950378418, "global_step": 503318, "epoch": 2995} {"train_loss": -11.514948844909668, "global_step": 503319, "epoch": 2995} {"train_loss": -11.278362274169922, "global_step": 503320, "epoch": 2995} {"train_loss": -11.391746520996094, "global_step": 503321, "epoch": 2995} {"train_loss": -11.469820022583008, "global_step": 503322, "epoch": 2995} {"train_loss": -11.597132682800293, "global_step": 503323, "epoch": 2995} {"train_loss": -11.304779052734375, "global_step": 503324, "epoch": 2995} {"train_loss": -11.827232360839844, "global_step": 503325, "epoch": 2995} {"train_loss": -11.99679946899414, "global_step": 503326, "epoch": 2995} {"train_loss": -11.966697800727118, "global_step": 503327, "epoch": 2995, "val_loss": 314681.21875, "train_action_mse_error": 0.7666090726852417} {"train_loss": -12.084579467773438, "global_step": 503328, "epoch": 2996} {"train_loss": -11.819087982177734, "global_step": 503329, "epoch": 2996} {"train_loss": -12.322376251220703, "global_step": 503330, "epoch": 2996} {"train_loss": -12.343289375305176, "global_step": 503331, "epoch": 2996} {"train_loss": -12.048933029174805, "global_step": 503332, "epoch": 2996} {"train_loss": -12.066923141479492, "global_step": 503333, "epoch": 2996} {"train_loss": -12.03415298461914, "global_step": 503334, "epoch": 2996} {"train_loss": -11.9625244140625, "global_step": 503335, "epoch": 2996} {"train_loss": -12.36132526397705, "global_step": 503336, "epoch": 2996} {"train_loss": -11.31247615814209, "global_step": 503337, "epoch": 2996} {"train_loss": -12.600255012512207, "global_step": 503338, "epoch": 2996} {"train_loss": -11.496384620666504, "global_step": 503339, "epoch": 2996} {"train_loss": -12.364048957824707, "global_step": 503340, "epoch": 2996} {"train_loss": -12.379135131835938, "global_step": 503341, "epoch": 2996} {"train_loss": -12.290121078491211, "global_step": 503342, "epoch": 2996} {"train_loss": -12.367620468139648, "global_step": 503343, "epoch": 2996} {"train_loss": -11.946084976196289, "global_step": 503344, "epoch": 2996} {"train_loss": -12.413045883178711, "global_step": 503345, "epoch": 2996} {"train_loss": -12.067154884338379, "global_step": 503346, "epoch": 2996} {"train_loss": -12.414972305297852, "global_step": 503347, "epoch": 2996} {"train_loss": -12.155097961425781, "global_step": 503348, "epoch": 2996} {"train_loss": -12.601778030395508, "global_step": 503349, "epoch": 2996} {"train_loss": -12.38444709777832, "global_step": 503350, "epoch": 2996} {"train_loss": -12.478001594543457, "global_step": 503351, "epoch": 2996} {"train_loss": -12.331838607788086, "global_step": 503352, "epoch": 2996} {"train_loss": -12.435539245605469, "global_step": 503353, "epoch": 2996} {"train_loss": -12.5465087890625, "global_step": 503354, "epoch": 2996} {"train_loss": -12.695351600646973, "global_step": 503355, "epoch": 2996} {"train_loss": -12.540477752685547, "global_step": 503356, "epoch": 2996} {"train_loss": -12.602437973022461, "global_step": 503357, "epoch": 2996} {"train_loss": -12.651660919189453, "global_step": 503358, "epoch": 2996} {"train_loss": -12.419337272644043, "global_step": 503359, "epoch": 2996} {"train_loss": -12.432332038879395, "global_step": 503360, "epoch": 2996} {"train_loss": -12.395126342773438, "global_step": 503361, "epoch": 2996} {"train_loss": -12.493717193603516, "global_step": 503362, "epoch": 2996} {"train_loss": -12.404547691345215, "global_step": 503363, "epoch": 2996} {"train_loss": -12.45736312866211, "global_step": 503364, "epoch": 2996} {"train_loss": -12.346275329589844, "global_step": 503365, "epoch": 2996} {"train_loss": -11.952250480651855, "global_step": 503366, "epoch": 2996} {"train_loss": -12.58116340637207, "global_step": 503367, "epoch": 2996} {"train_loss": -12.293006896972656, "global_step": 503368, "epoch": 2996} {"train_loss": -12.501285552978516, "global_step": 503369, "epoch": 2996} {"train_loss": -12.693382263183594, "global_step": 503370, "epoch": 2996} {"train_loss": -12.146387100219727, "global_step": 503371, "epoch": 2996} {"train_loss": -12.46780014038086, "global_step": 503372, "epoch": 2996} {"train_loss": -11.898141860961914, "global_step": 503373, "epoch": 2996} {"train_loss": -12.360187530517578, "global_step": 503374, "epoch": 2996} {"train_loss": -12.30538558959961, "global_step": 503375, "epoch": 2996} {"train_loss": -11.826155662536621, "global_step": 503376, "epoch": 2996} {"train_loss": -11.902786254882812, "global_step": 503377, "epoch": 2996} {"train_loss": -10.384077072143555, "global_step": 503378, "epoch": 2996} {"train_loss": -12.102843284606934, "global_step": 503379, "epoch": 2996} {"train_loss": -9.506796836853027, "global_step": 503380, "epoch": 2996} {"train_loss": -11.780921936035156, "global_step": 503381, "epoch": 2996} {"train_loss": -10.298537254333496, "global_step": 503382, "epoch": 2996} {"train_loss": -12.250992774963379, "global_step": 503383, "epoch": 2996} {"train_loss": -11.371095657348633, "global_step": 503384, "epoch": 2996} {"train_loss": -12.579717636108398, "global_step": 503385, "epoch": 2996} {"train_loss": -11.31201171875, "global_step": 503386, "epoch": 2996} {"train_loss": -12.326990127563477, "global_step": 503387, "epoch": 2996} {"train_loss": -11.947965621948242, "global_step": 503388, "epoch": 2996} {"train_loss": -12.210052490234375, "global_step": 503389, "epoch": 2996} {"train_loss": -12.29938793182373, "global_step": 503390, "epoch": 2996} {"train_loss": -11.925783157348633, "global_step": 503391, "epoch": 2996} {"train_loss": -11.894607543945312, "global_step": 503392, "epoch": 2996} {"train_loss": -12.410932540893555, "global_step": 503393, "epoch": 2996} {"train_loss": -11.887819290161133, "global_step": 503394, "epoch": 2996} {"train_loss": -12.475565910339355, "global_step": 503395, "epoch": 2996} {"train_loss": -12.098872184753418, "global_step": 503396, "epoch": 2996} {"train_loss": -11.827762603759766, "global_step": 503397, "epoch": 2996} {"train_loss": -12.29393196105957, "global_step": 503398, "epoch": 2996} {"train_loss": -12.263221740722656, "global_step": 503399, "epoch": 2996} {"train_loss": -12.356904983520508, "global_step": 503400, "epoch": 2996} {"train_loss": -12.074553489685059, "global_step": 503401, "epoch": 2996} {"train_loss": -12.497066497802734, "global_step": 503402, "epoch": 2996} {"train_loss": -12.130613327026367, "global_step": 503403, "epoch": 2996} {"train_loss": -12.2233247756958, "global_step": 503404, "epoch": 2996} {"train_loss": -12.276127815246582, "global_step": 503405, "epoch": 2996} {"train_loss": -12.129121780395508, "global_step": 503406, "epoch": 2996} {"train_loss": -12.537870407104492, "global_step": 503407, "epoch": 2996} {"train_loss": -12.281055450439453, "global_step": 503408, "epoch": 2996} {"train_loss": -12.379922866821289, "global_step": 503409, "epoch": 2996} {"train_loss": -12.489266395568848, "global_step": 503410, "epoch": 2996} {"train_loss": -12.551284790039062, "global_step": 503411, "epoch": 2996} {"train_loss": -12.405390739440918, "global_step": 503412, "epoch": 2996} {"train_loss": -12.590476989746094, "global_step": 503413, "epoch": 2996} {"train_loss": -12.392101287841797, "global_step": 503414, "epoch": 2996} {"train_loss": -12.479802131652832, "global_step": 503415, "epoch": 2996} {"train_loss": -12.361509323120117, "global_step": 503416, "epoch": 2996} {"train_loss": -12.634747505187988, "global_step": 503417, "epoch": 2996} {"train_loss": -12.58546257019043, "global_step": 503418, "epoch": 2996} {"train_loss": -12.483091354370117, "global_step": 503419, "epoch": 2996} {"train_loss": -12.67147445678711, "global_step": 503420, "epoch": 2996} {"train_loss": -12.522636413574219, "global_step": 503421, "epoch": 2996} {"train_loss": -12.810457229614258, "global_step": 503422, "epoch": 2996} {"train_loss": -12.511480331420898, "global_step": 503423, "epoch": 2996} {"train_loss": -12.797506332397461, "global_step": 503424, "epoch": 2996} {"train_loss": -12.384551048278809, "global_step": 503425, "epoch": 2996} {"train_loss": -12.701107025146484, "global_step": 503426, "epoch": 2996} {"train_loss": -12.654172897338867, "global_step": 503427, "epoch": 2996} {"train_loss": -12.581852912902832, "global_step": 503428, "epoch": 2996} {"train_loss": -12.580010414123535, "global_step": 503429, "epoch": 2996} {"train_loss": -12.50594711303711, "global_step": 503430, "epoch": 2996} {"train_loss": -12.793214797973633, "global_step": 503431, "epoch": 2996} {"train_loss": -12.76812744140625, "global_step": 503432, "epoch": 2996} {"train_loss": -12.801375389099121, "global_step": 503433, "epoch": 2996} {"train_loss": -12.77866268157959, "global_step": 503434, "epoch": 2996} {"train_loss": -12.770980834960938, "global_step": 503435, "epoch": 2996} {"train_loss": -12.599014282226562, "global_step": 503436, "epoch": 2996} {"train_loss": -12.638118743896484, "global_step": 503437, "epoch": 2996} {"train_loss": -12.590588569641113, "global_step": 503438, "epoch": 2996} {"train_loss": -12.846412658691406, "global_step": 503439, "epoch": 2996} {"train_loss": -12.835519790649414, "global_step": 503440, "epoch": 2996} {"train_loss": -12.959341049194336, "global_step": 503441, "epoch": 2996} {"train_loss": -12.714466094970703, "global_step": 503442, "epoch": 2996} {"train_loss": -12.8484525680542, "global_step": 503443, "epoch": 2996} {"train_loss": -13.009273529052734, "global_step": 503444, "epoch": 2996} {"train_loss": -12.838092803955078, "global_step": 503445, "epoch": 2996} {"train_loss": -12.878894805908203, "global_step": 503446, "epoch": 2996} {"train_loss": -12.556289672851562, "global_step": 503447, "epoch": 2996} {"train_loss": -12.848945617675781, "global_step": 503448, "epoch": 2996} {"train_loss": -12.616313934326172, "global_step": 503449, "epoch": 2996} {"train_loss": -12.81336784362793, "global_step": 503450, "epoch": 2996} {"train_loss": -12.779254913330078, "global_step": 503451, "epoch": 2996} {"train_loss": -12.877055168151855, "global_step": 503452, "epoch": 2996} {"train_loss": -12.827781677246094, "global_step": 503453, "epoch": 2996} {"train_loss": -12.842641830444336, "global_step": 503454, "epoch": 2996} {"train_loss": -12.935502052307129, "global_step": 503455, "epoch": 2996} {"train_loss": -12.783088684082031, "global_step": 503456, "epoch": 2996} {"train_loss": -12.980218887329102, "global_step": 503457, "epoch": 2996} {"train_loss": -12.795511245727539, "global_step": 503458, "epoch": 2996} {"train_loss": -12.91904354095459, "global_step": 503459, "epoch": 2996} {"train_loss": -12.877004623413086, "global_step": 503460, "epoch": 2996} {"train_loss": -12.834759712219238, "global_step": 503461, "epoch": 2996} {"train_loss": -12.826614379882812, "global_step": 503462, "epoch": 2996} {"train_loss": -12.775394439697266, "global_step": 503463, "epoch": 2996} {"train_loss": -12.987447738647461, "global_step": 503464, "epoch": 2996} {"train_loss": -12.956655502319336, "global_step": 503465, "epoch": 2996} {"train_loss": -12.617053985595703, "global_step": 503466, "epoch": 2996} {"train_loss": -12.881629943847656, "global_step": 503467, "epoch": 2996} {"train_loss": -12.660889625549316, "global_step": 503468, "epoch": 2996} {"train_loss": -12.846635818481445, "global_step": 503469, "epoch": 2996} {"train_loss": -12.722295761108398, "global_step": 503470, "epoch": 2996} {"train_loss": -12.785709381103516, "global_step": 503471, "epoch": 2996} {"train_loss": -12.471081733703613, "global_step": 503472, "epoch": 2996} {"train_loss": -11.710846900939941, "global_step": 503473, "epoch": 2996} {"train_loss": -12.944540977478027, "global_step": 503474, "epoch": 2996} {"train_loss": -12.1734619140625, "global_step": 503475, "epoch": 2996} {"train_loss": -12.089557647705078, "global_step": 503476, "epoch": 2996} {"train_loss": -12.491785049438477, "global_step": 503477, "epoch": 2996} {"train_loss": -12.298955917358398, "global_step": 503478, "epoch": 2996} {"train_loss": -12.499629974365234, "global_step": 503479, "epoch": 2996} {"train_loss": -12.701726913452148, "global_step": 503480, "epoch": 2996} {"train_loss": -12.952840805053711, "global_step": 503481, "epoch": 2996} {"train_loss": -12.641946792602539, "global_step": 503482, "epoch": 2996} {"train_loss": -12.82264518737793, "global_step": 503483, "epoch": 2996} {"train_loss": -12.518173217773438, "global_step": 503484, "epoch": 2996} {"train_loss": -12.012428283691406, "global_step": 503485, "epoch": 2996} {"train_loss": -12.157506942749023, "global_step": 503486, "epoch": 2996} {"train_loss": -12.693853378295898, "global_step": 503487, "epoch": 2996} {"train_loss": -11.93628978729248, "global_step": 503488, "epoch": 2996} {"train_loss": -11.522672653198242, "global_step": 503489, "epoch": 2996} {"train_loss": -12.723784446716309, "global_step": 503490, "epoch": 2996} {"train_loss": -11.432360649108887, "global_step": 503491, "epoch": 2996} {"train_loss": -11.474028587341309, "global_step": 503492, "epoch": 2996} {"train_loss": -11.680770874023438, "global_step": 503493, "epoch": 2996} {"train_loss": -12.270224571228027, "global_step": 503494, "epoch": 2996} {"train_loss": -12.372354024932498, "global_step": 503495, "epoch": 2996, "val_loss": 319131.21875} {"train_loss": -12.889396667480469, "global_step": 503496, "epoch": 2997} {"train_loss": -11.419048309326172, "global_step": 503497, "epoch": 2997} {"train_loss": -12.752761840820312, "global_step": 503498, "epoch": 2997} {"train_loss": -11.96033000946045, "global_step": 503499, "epoch": 2997} {"train_loss": -12.375823974609375, "global_step": 503500, "epoch": 2997} {"train_loss": -12.764015197753906, "global_step": 503501, "epoch": 2997} {"train_loss": -12.764810562133789, "global_step": 503502, "epoch": 2997} {"train_loss": -12.653820991516113, "global_step": 503503, "epoch": 2997} {"train_loss": -12.87779426574707, "global_step": 503504, "epoch": 2997} {"train_loss": -12.75012493133545, "global_step": 503505, "epoch": 2997} {"train_loss": -12.919760704040527, "global_step": 503506, "epoch": 2997} {"train_loss": -12.764373779296875, "global_step": 503507, "epoch": 2997} {"train_loss": -12.70126724243164, "global_step": 503508, "epoch": 2997} {"train_loss": -12.556096076965332, "global_step": 503509, "epoch": 2997} {"train_loss": -12.532693862915039, "global_step": 503510, "epoch": 2997} {"train_loss": -12.545459747314453, "global_step": 503511, "epoch": 2997} {"train_loss": -12.493077278137207, "global_step": 503512, "epoch": 2997} {"train_loss": -12.849292755126953, "global_step": 503513, "epoch": 2997} {"train_loss": -12.684378623962402, "global_step": 503514, "epoch": 2997} {"train_loss": -12.683050155639648, "global_step": 503515, "epoch": 2997} {"train_loss": -12.574503898620605, "global_step": 503516, "epoch": 2997} {"train_loss": -12.289295196533203, "global_step": 503517, "epoch": 2997} {"train_loss": -12.532654762268066, "global_step": 503518, "epoch": 2997} {"train_loss": -12.8563871383667, "global_step": 503519, "epoch": 2997} {"train_loss": -12.234339714050293, "global_step": 503520, "epoch": 2997} {"train_loss": -12.781682014465332, "global_step": 503521, "epoch": 2997} {"train_loss": -12.420238494873047, "global_step": 503522, "epoch": 2997} {"train_loss": -12.904458045959473, "global_step": 503523, "epoch": 2997} {"train_loss": -12.805480003356934, "global_step": 503524, "epoch": 2997} {"train_loss": -12.76569938659668, "global_step": 503525, "epoch": 2997} {"train_loss": -12.569082260131836, "global_step": 503526, "epoch": 2997} {"train_loss": -12.913071632385254, "global_step": 503527, "epoch": 2997} {"train_loss": -12.477011680603027, "global_step": 503528, "epoch": 2997} {"train_loss": -12.447799682617188, "global_step": 503529, "epoch": 2997} {"train_loss": -12.737039566040039, "global_step": 503530, "epoch": 2997} {"train_loss": -12.891030311584473, "global_step": 503531, "epoch": 2997} {"train_loss": -12.43869400024414, "global_step": 503532, "epoch": 2997} {"train_loss": -12.75667953491211, "global_step": 503533, "epoch": 2997} {"train_loss": -12.91109848022461, "global_step": 503534, "epoch": 2997} {"train_loss": -12.32093334197998, "global_step": 503535, "epoch": 2997} {"train_loss": -12.67976188659668, "global_step": 503536, "epoch": 2997} {"train_loss": -12.736799240112305, "global_step": 503537, "epoch": 2997} {"train_loss": -12.37104320526123, "global_step": 503538, "epoch": 2997} {"train_loss": -11.801746368408203, "global_step": 503539, "epoch": 2997} {"train_loss": -12.332596778869629, "global_step": 503540, "epoch": 2997} {"train_loss": -12.451054573059082, "global_step": 503541, "epoch": 2997} {"train_loss": -12.099802017211914, "global_step": 503542, "epoch": 2997} {"train_loss": -12.533246994018555, "global_step": 503543, "epoch": 2997} {"train_loss": -12.11306095123291, "global_step": 503544, "epoch": 2997} {"train_loss": -11.692156791687012, "global_step": 503545, "epoch": 2997} {"train_loss": -11.972249984741211, "global_step": 503546, "epoch": 2997} {"train_loss": -11.880928039550781, "global_step": 503547, "epoch": 2997} {"train_loss": -10.957738876342773, "global_step": 503548, "epoch": 2997} {"train_loss": -10.790218353271484, "global_step": 503549, "epoch": 2997} {"train_loss": -12.197071075439453, "global_step": 503550, "epoch": 2997} {"train_loss": -11.533329010009766, "global_step": 503551, "epoch": 2997} {"train_loss": -12.253018379211426, "global_step": 503552, "epoch": 2997} {"train_loss": -11.036215782165527, "global_step": 503553, "epoch": 2997} {"train_loss": -12.39936637878418, "global_step": 503554, "epoch": 2997} {"train_loss": -11.476567268371582, "global_step": 503555, "epoch": 2997} {"train_loss": -10.272146224975586, "global_step": 503556, "epoch": 2997} {"train_loss": -11.733762741088867, "global_step": 503557, "epoch": 2997} {"train_loss": -10.789299011230469, "global_step": 503558, "epoch": 2997} {"train_loss": -11.234655380249023, "global_step": 503559, "epoch": 2997} {"train_loss": -9.467523574829102, "global_step": 503560, "epoch": 2997} {"train_loss": -11.832704544067383, "global_step": 503561, "epoch": 2997} {"train_loss": -10.613748550415039, "global_step": 503562, "epoch": 2997} {"train_loss": -10.257993698120117, "global_step": 503563, "epoch": 2997} {"train_loss": -9.04880142211914, "global_step": 503564, "epoch": 2997} {"train_loss": -8.684531211853027, "global_step": 503565, "epoch": 2997} {"train_loss": -9.49533462524414, "global_step": 503566, "epoch": 2997} {"train_loss": -9.938554763793945, "global_step": 503567, "epoch": 2997} {"train_loss": -10.47188663482666, "global_step": 503568, "epoch": 2997} {"train_loss": -9.79053020477295, "global_step": 503569, "epoch": 2997} {"train_loss": -10.359758377075195, "global_step": 503570, "epoch": 2997} {"train_loss": -9.941390991210938, "global_step": 503571, "epoch": 2997} {"train_loss": -9.890440940856934, "global_step": 503572, "epoch": 2997} {"train_loss": -10.459243774414062, "global_step": 503573, "epoch": 2997} {"train_loss": -10.473028182983398, "global_step": 503574, "epoch": 2997} {"train_loss": -11.401596069335938, "global_step": 503575, "epoch": 2997} {"train_loss": -10.602170944213867, "global_step": 503576, "epoch": 2997} {"train_loss": -10.918122291564941, "global_step": 503577, "epoch": 2997} {"train_loss": -10.974836349487305, "global_step": 503578, "epoch": 2997} {"train_loss": -9.99528694152832, "global_step": 503579, "epoch": 2997} {"train_loss": -10.463737487792969, "global_step": 503580, "epoch": 2997} {"train_loss": -11.912647247314453, "global_step": 503581, "epoch": 2997} {"train_loss": -10.547746658325195, "global_step": 503582, "epoch": 2997} {"train_loss": -10.678184509277344, "global_step": 503583, "epoch": 2997} {"train_loss": -11.703794479370117, "global_step": 503584, "epoch": 2997} {"train_loss": -10.480628967285156, "global_step": 503585, "epoch": 2997} {"train_loss": -11.417900085449219, "global_step": 503586, "epoch": 2997} {"train_loss": -11.078368186950684, "global_step": 503587, "epoch": 2997} {"train_loss": -10.541608810424805, "global_step": 503588, "epoch": 2997} {"train_loss": -11.275053024291992, "global_step": 503589, "epoch": 2997} {"train_loss": -10.778535842895508, "global_step": 503590, "epoch": 2997} {"train_loss": -10.835241317749023, "global_step": 503591, "epoch": 2997} {"train_loss": -11.640544891357422, "global_step": 503592, "epoch": 2997} {"train_loss": -10.019145965576172, "global_step": 503593, "epoch": 2997} {"train_loss": -11.619149208068848, "global_step": 503594, "epoch": 2997} {"train_loss": -10.864437103271484, "global_step": 503595, "epoch": 2997} {"train_loss": -11.41995620727539, "global_step": 503596, "epoch": 2997} {"train_loss": -12.122076034545898, "global_step": 503597, "epoch": 2997} {"train_loss": -11.770940780639648, "global_step": 503598, "epoch": 2997} {"train_loss": -11.538825035095215, "global_step": 503599, "epoch": 2997} {"train_loss": -12.079891204833984, "global_step": 503600, "epoch": 2997} {"train_loss": -11.76046371459961, "global_step": 503601, "epoch": 2997} {"train_loss": -12.11346435546875, "global_step": 503602, "epoch": 2997} {"train_loss": -11.957416534423828, "global_step": 503603, "epoch": 2997} {"train_loss": -11.19873046875, "global_step": 503604, "epoch": 2997} {"train_loss": -12.322896957397461, "global_step": 503605, "epoch": 2997} {"train_loss": -11.292335510253906, "global_step": 503606, "epoch": 2997} {"train_loss": -12.374342918395996, "global_step": 503607, "epoch": 2997} {"train_loss": -11.978776931762695, "global_step": 503608, "epoch": 2997} {"train_loss": -12.232787132263184, "global_step": 503609, "epoch": 2997} {"train_loss": -12.130367279052734, "global_step": 503610, "epoch": 2997} {"train_loss": -12.01019287109375, "global_step": 503611, "epoch": 2997} {"train_loss": -12.246179580688477, "global_step": 503612, "epoch": 2997} {"train_loss": -12.24543571472168, "global_step": 503613, "epoch": 2997} {"train_loss": -12.498181343078613, "global_step": 503614, "epoch": 2997} {"train_loss": -12.308998107910156, "global_step": 503615, "epoch": 2997} {"train_loss": -12.418334007263184, "global_step": 503616, "epoch": 2997} {"train_loss": -12.259954452514648, "global_step": 503617, "epoch": 2997} {"train_loss": -12.623954772949219, "global_step": 503618, "epoch": 2997} {"train_loss": -12.327743530273438, "global_step": 503619, "epoch": 2997} {"train_loss": -12.264240264892578, "global_step": 503620, "epoch": 2997} {"train_loss": -12.4136381149292, "global_step": 503621, "epoch": 2997} {"train_loss": -12.350845336914062, "global_step": 503622, "epoch": 2997} {"train_loss": -12.472007751464844, "global_step": 503623, "epoch": 2997} {"train_loss": -12.434636116027832, "global_step": 503624, "epoch": 2997} {"train_loss": -12.470791816711426, "global_step": 503625, "epoch": 2997} {"train_loss": -12.62680435180664, "global_step": 503626, "epoch": 2997} {"train_loss": -12.545896530151367, "global_step": 503627, "epoch": 2997} {"train_loss": -12.63636589050293, "global_step": 503628, "epoch": 2997} {"train_loss": -12.20817756652832, "global_step": 503629, "epoch": 2997} {"train_loss": -12.30021858215332, "global_step": 503630, "epoch": 2997} {"train_loss": -12.484943389892578, "global_step": 503631, "epoch": 2997} {"train_loss": -12.566902160644531, "global_step": 503632, "epoch": 2997} {"train_loss": -12.480034828186035, "global_step": 503633, "epoch": 2997} {"train_loss": -12.599474906921387, "global_step": 503634, "epoch": 2997} {"train_loss": -12.7228422164917, "global_step": 503635, "epoch": 2997} {"train_loss": -12.495458602905273, "global_step": 503636, "epoch": 2997} {"train_loss": -12.63119125366211, "global_step": 503637, "epoch": 2997} {"train_loss": -12.59674072265625, "global_step": 503638, "epoch": 2997} {"train_loss": -12.735419273376465, "global_step": 503639, "epoch": 2997} {"train_loss": -12.747303009033203, "global_step": 503640, "epoch": 2997} {"train_loss": -12.525018692016602, "global_step": 503641, "epoch": 2997} {"train_loss": -12.842769622802734, "global_step": 503642, "epoch": 2997} {"train_loss": -12.796878814697266, "global_step": 503643, "epoch": 2997} {"train_loss": -12.783867835998535, "global_step": 503644, "epoch": 2997} {"train_loss": -12.551809310913086, "global_step": 503645, "epoch": 2997} {"train_loss": -12.846846580505371, "global_step": 503646, "epoch": 2997} {"train_loss": -12.746576309204102, "global_step": 503647, "epoch": 2997} {"train_loss": -12.563803672790527, "global_step": 503648, "epoch": 2997} {"train_loss": -12.68551254272461, "global_step": 503649, "epoch": 2997} {"train_loss": -12.459575653076172, "global_step": 503650, "epoch": 2997} {"train_loss": -12.578693389892578, "global_step": 503651, "epoch": 2997} {"train_loss": -12.825958251953125, "global_step": 503652, "epoch": 2997} {"train_loss": -12.502175331115723, "global_step": 503653, "epoch": 2997} {"train_loss": -12.982942581176758, "global_step": 503654, "epoch": 2997} {"train_loss": -12.819561004638672, "global_step": 503655, "epoch": 2997} {"train_loss": -13.054924964904785, "global_step": 503656, "epoch": 2997} {"train_loss": -12.418524742126465, "global_step": 503657, "epoch": 2997} {"train_loss": -13.078084945678711, "global_step": 503658, "epoch": 2997} {"train_loss": -12.771700859069824, "global_step": 503659, "epoch": 2997} {"train_loss": -12.969779014587402, "global_step": 503660, "epoch": 2997} {"train_loss": -12.826221466064453, "global_step": 503661, "epoch": 2997} {"train_loss": -12.722475051879883, "global_step": 503662, "epoch": 2997} {"train_loss": -11.985760859080724, "global_step": 503663, "epoch": 2997, "val_loss": 317633.84375} {"train_loss": -12.936958312988281, "global_step": 503664, "epoch": 2998} {"train_loss": -12.984981536865234, "global_step": 503665, "epoch": 2998} {"train_loss": -13.008708000183105, "global_step": 503666, "epoch": 2998} {"train_loss": -12.901334762573242, "global_step": 503667, "epoch": 2998} {"train_loss": -12.860733032226562, "global_step": 503668, "epoch": 2998} {"train_loss": -13.026341438293457, "global_step": 503669, "epoch": 2998} {"train_loss": -13.115279197692871, "global_step": 503670, "epoch": 2998} {"train_loss": -12.848600387573242, "global_step": 503671, "epoch": 2998} {"train_loss": -12.882935523986816, "global_step": 503672, "epoch": 2998} {"train_loss": -13.026712417602539, "global_step": 503673, "epoch": 2998} {"train_loss": -12.717204093933105, "global_step": 503674, "epoch": 2998} {"train_loss": -12.9609375, "global_step": 503675, "epoch": 2998} {"train_loss": -12.873066902160645, "global_step": 503676, "epoch": 2998} {"train_loss": -12.774725914001465, "global_step": 503677, "epoch": 2998} {"train_loss": -12.61988639831543, "global_step": 503678, "epoch": 2998} {"train_loss": -12.71748161315918, "global_step": 503679, "epoch": 2998} {"train_loss": -12.83498764038086, "global_step": 503680, "epoch": 2998} {"train_loss": -12.546672821044922, "global_step": 503681, "epoch": 2998} {"train_loss": -12.708259582519531, "global_step": 503682, "epoch": 2998} {"train_loss": -12.491353988647461, "global_step": 503683, "epoch": 2998} {"train_loss": -12.5433931350708, "global_step": 503684, "epoch": 2998} {"train_loss": -12.924053192138672, "global_step": 503685, "epoch": 2998} {"train_loss": -12.288494110107422, "global_step": 503686, "epoch": 2998} {"train_loss": -11.844198226928711, "global_step": 503687, "epoch": 2998} {"train_loss": -12.853052139282227, "global_step": 503688, "epoch": 2998} {"train_loss": -11.959159851074219, "global_step": 503689, "epoch": 2998} {"train_loss": -11.912721633911133, "global_step": 503690, "epoch": 2998} {"train_loss": -12.233976364135742, "global_step": 503691, "epoch": 2998} {"train_loss": -10.248430252075195, "global_step": 503692, "epoch": 2998} {"train_loss": -11.153892517089844, "global_step": 503693, "epoch": 2998} {"train_loss": -11.084590911865234, "global_step": 503694, "epoch": 2998} {"train_loss": -10.327035903930664, "global_step": 503695, "epoch": 2998} {"train_loss": -10.15410041809082, "global_step": 503696, "epoch": 2998} {"train_loss": -10.53801155090332, "global_step": 503697, "epoch": 2998} {"train_loss": -11.774417877197266, "global_step": 503698, "epoch": 2998} {"train_loss": -10.690374374389648, "global_step": 503699, "epoch": 2998} {"train_loss": -11.867240905761719, "global_step": 503700, "epoch": 2998} {"train_loss": -11.41885757446289, "global_step": 503701, "epoch": 2998} {"train_loss": -12.06277084350586, "global_step": 503702, "epoch": 2998} {"train_loss": -11.275876998901367, "global_step": 503703, "epoch": 2998} {"train_loss": -11.917387008666992, "global_step": 503704, "epoch": 2998} {"train_loss": -11.850373268127441, "global_step": 503705, "epoch": 2998} {"train_loss": -11.932416915893555, "global_step": 503706, "epoch": 2998} {"train_loss": -11.726730346679688, "global_step": 503707, "epoch": 2998} {"train_loss": -12.094390869140625, "global_step": 503708, "epoch": 2998} {"train_loss": -11.895752906799316, "global_step": 503709, "epoch": 2998} {"train_loss": -12.253013610839844, "global_step": 503710, "epoch": 2998} {"train_loss": -12.258550643920898, "global_step": 503711, "epoch": 2998} {"train_loss": -12.225154876708984, "global_step": 503712, "epoch": 2998} {"train_loss": -12.263071060180664, "global_step": 503713, "epoch": 2998} {"train_loss": -12.484222412109375, "global_step": 503714, "epoch": 2998} {"train_loss": -12.265996932983398, "global_step": 503715, "epoch": 2998} {"train_loss": -12.377117156982422, "global_step": 503716, "epoch": 2998} {"train_loss": -12.413307189941406, "global_step": 503717, "epoch": 2998} {"train_loss": -12.464773178100586, "global_step": 503718, "epoch": 2998} {"train_loss": -12.48344898223877, "global_step": 503719, "epoch": 2998} {"train_loss": -12.51281452178955, "global_step": 503720, "epoch": 2998} {"train_loss": -11.860173225402832, "global_step": 503721, "epoch": 2998} {"train_loss": -12.565765380859375, "global_step": 503722, "epoch": 2998} {"train_loss": -12.275827407836914, "global_step": 503723, "epoch": 2998} {"train_loss": -12.410968780517578, "global_step": 503724, "epoch": 2998} {"train_loss": -12.36234188079834, "global_step": 503725, "epoch": 2998} {"train_loss": -11.931711196899414, "global_step": 503726, "epoch": 2998} {"train_loss": -12.671366691589355, "global_step": 503727, "epoch": 2998} {"train_loss": -12.007568359375, "global_step": 503728, "epoch": 2998} {"train_loss": -12.198240280151367, "global_step": 503729, "epoch": 2998} {"train_loss": -12.515605926513672, "global_step": 503730, "epoch": 2998} {"train_loss": -12.178938865661621, "global_step": 503731, "epoch": 2998} {"train_loss": -11.653118133544922, "global_step": 503732, "epoch": 2998} {"train_loss": -12.102907180786133, "global_step": 503733, "epoch": 2998} {"train_loss": -11.676759719848633, "global_step": 503734, "epoch": 2998} {"train_loss": -11.82597827911377, "global_step": 503735, "epoch": 2998} {"train_loss": -12.536389350891113, "global_step": 503736, "epoch": 2998} {"train_loss": -11.894899368286133, "global_step": 503737, "epoch": 2998} {"train_loss": -12.398451805114746, "global_step": 503738, "epoch": 2998} {"train_loss": -11.7811861038208, "global_step": 503739, "epoch": 2998} {"train_loss": -11.898301124572754, "global_step": 503740, "epoch": 2998} {"train_loss": -12.15534782409668, "global_step": 503741, "epoch": 2998} {"train_loss": -12.027926445007324, "global_step": 503742, "epoch": 2998} {"train_loss": -11.78076457977295, "global_step": 503743, "epoch": 2998} {"train_loss": -12.17463493347168, "global_step": 503744, "epoch": 2998} {"train_loss": -11.818939208984375, "global_step": 503745, "epoch": 2998} {"train_loss": -11.997751235961914, "global_step": 503746, "epoch": 2998} {"train_loss": -12.105494499206543, "global_step": 503747, "epoch": 2998} {"train_loss": -12.531660079956055, "global_step": 503748, "epoch": 2998} {"train_loss": -12.51766300201416, "global_step": 503749, "epoch": 2998} {"train_loss": -12.075105667114258, "global_step": 503750, "epoch": 2998} {"train_loss": -12.217617988586426, "global_step": 503751, "epoch": 2998} {"train_loss": -11.819731712341309, "global_step": 503752, "epoch": 2998} {"train_loss": -12.342838287353516, "global_step": 503753, "epoch": 2998} {"train_loss": -12.117537498474121, "global_step": 503754, "epoch": 2998} {"train_loss": -12.134395599365234, "global_step": 503755, "epoch": 2998} {"train_loss": -12.04963493347168, "global_step": 503756, "epoch": 2998} {"train_loss": -12.004528045654297, "global_step": 503757, "epoch": 2998} {"train_loss": -12.47848129272461, "global_step": 503758, "epoch": 2998} {"train_loss": -12.502825736999512, "global_step": 503759, "epoch": 2998} {"train_loss": -12.608083724975586, "global_step": 503760, "epoch": 2998} {"train_loss": -12.490036010742188, "global_step": 503761, "epoch": 2998} {"train_loss": -12.712356567382812, "global_step": 503762, "epoch": 2998} {"train_loss": -12.58407211303711, "global_step": 503763, "epoch": 2998} {"train_loss": -12.467050552368164, "global_step": 503764, "epoch": 2998} {"train_loss": -12.83963394165039, "global_step": 503765, "epoch": 2998} {"train_loss": -12.606725692749023, "global_step": 503766, "epoch": 2998} {"train_loss": -12.192671775817871, "global_step": 503767, "epoch": 2998} {"train_loss": -12.540384292602539, "global_step": 503768, "epoch": 2998} {"train_loss": -12.165480613708496, "global_step": 503769, "epoch": 2998} {"train_loss": -12.520503997802734, "global_step": 503770, "epoch": 2998} {"train_loss": -12.096453666687012, "global_step": 503771, "epoch": 2998} {"train_loss": -12.677032470703125, "global_step": 503772, "epoch": 2998} {"train_loss": -12.201689720153809, "global_step": 503773, "epoch": 2998} {"train_loss": -12.623836517333984, "global_step": 503774, "epoch": 2998} {"train_loss": -12.191679954528809, "global_step": 503775, "epoch": 2998} {"train_loss": -12.58958625793457, "global_step": 503776, "epoch": 2998} {"train_loss": -12.673019409179688, "global_step": 503777, "epoch": 2998} {"train_loss": -12.320816040039062, "global_step": 503778, "epoch": 2998} {"train_loss": -12.734841346740723, "global_step": 503779, "epoch": 2998} {"train_loss": -12.368989944458008, "global_step": 503780, "epoch": 2998} {"train_loss": -12.49122428894043, "global_step": 503781, "epoch": 2998} {"train_loss": -11.80643081665039, "global_step": 503782, "epoch": 2998} {"train_loss": -12.510494232177734, "global_step": 503783, "epoch": 2998} {"train_loss": -12.570714950561523, "global_step": 503784, "epoch": 2998} {"train_loss": -12.49648666381836, "global_step": 503785, "epoch": 2998} {"train_loss": -12.024937629699707, "global_step": 503786, "epoch": 2998} {"train_loss": -12.415069580078125, "global_step": 503787, "epoch": 2998} {"train_loss": -12.60986328125, "global_step": 503788, "epoch": 2998} {"train_loss": -12.413932800292969, "global_step": 503789, "epoch": 2998} {"train_loss": -12.469893455505371, "global_step": 503790, "epoch": 2998} {"train_loss": -12.552001953125, "global_step": 503791, "epoch": 2998} {"train_loss": -12.723695755004883, "global_step": 503792, "epoch": 2998} {"train_loss": -12.575983047485352, "global_step": 503793, "epoch": 2998} {"train_loss": -12.244951248168945, "global_step": 503794, "epoch": 2998} {"train_loss": -12.446525573730469, "global_step": 503795, "epoch": 2998} {"train_loss": -12.527473449707031, "global_step": 503796, "epoch": 2998} {"train_loss": -12.282295227050781, "global_step": 503797, "epoch": 2998} {"train_loss": -12.474273681640625, "global_step": 503798, "epoch": 2998} {"train_loss": -12.239181518554688, "global_step": 503799, "epoch": 2998} {"train_loss": -11.298574447631836, "global_step": 503800, "epoch": 2998} {"train_loss": -12.572145462036133, "global_step": 503801, "epoch": 2998} {"train_loss": -11.767642974853516, "global_step": 503802, "epoch": 2998} {"train_loss": -11.581918716430664, "global_step": 503803, "epoch": 2998} {"train_loss": -12.277276992797852, "global_step": 503804, "epoch": 2998} {"train_loss": -10.092293739318848, "global_step": 503805, "epoch": 2998} {"train_loss": -11.464128494262695, "global_step": 503806, "epoch": 2998} {"train_loss": -11.212163925170898, "global_step": 503807, "epoch": 2998} {"train_loss": -9.016743659973145, "global_step": 503808, "epoch": 2998} {"train_loss": -12.361318588256836, "global_step": 503809, "epoch": 2998} {"train_loss": -8.957179069519043, "global_step": 503810, "epoch": 2998} {"train_loss": -10.46247673034668, "global_step": 503811, "epoch": 2998} {"train_loss": -10.496471405029297, "global_step": 503812, "epoch": 2998} {"train_loss": -11.046479225158691, "global_step": 503813, "epoch": 2998} {"train_loss": -10.391353607177734, "global_step": 503814, "epoch": 2998} {"train_loss": -12.138556480407715, "global_step": 503815, "epoch": 2998} {"train_loss": -10.580207824707031, "global_step": 503816, "epoch": 2998} {"train_loss": -11.352766990661621, "global_step": 503817, "epoch": 2998} {"train_loss": -12.3746976852417, "global_step": 503818, "epoch": 2998} {"train_loss": -11.555572509765625, "global_step": 503819, "epoch": 2998} {"train_loss": -12.251169204711914, "global_step": 503820, "epoch": 2998} {"train_loss": -11.733537673950195, "global_step": 503821, "epoch": 2998} {"train_loss": -11.585855484008789, "global_step": 503822, "epoch": 2998} {"train_loss": -11.902606964111328, "global_step": 503823, "epoch": 2998} {"train_loss": -12.218751907348633, "global_step": 503824, "epoch": 2998} {"train_loss": -11.980013847351074, "global_step": 503825, "epoch": 2998} {"train_loss": -11.816703796386719, "global_step": 503826, "epoch": 2998} {"train_loss": -11.376617431640625, "global_step": 503827, "epoch": 2998} {"train_loss": -12.195234298706055, "global_step": 503828, "epoch": 2998} {"train_loss": -11.557766914367676, "global_step": 503829, "epoch": 2998} {"train_loss": -12.085729598999023, "global_step": 503830, "epoch": 2998} {"train_loss": -12.099399271465483, "global_step": 503831, "epoch": 2998, "val_loss": 319549.8125} {"train_loss": -11.697989463806152, "global_step": 503832, "epoch": 2999} {"train_loss": -11.993188858032227, "global_step": 503833, "epoch": 2999} {"train_loss": -11.5790433883667, "global_step": 503834, "epoch": 2999} {"train_loss": -12.490535736083984, "global_step": 503835, "epoch": 2999} {"train_loss": -11.850593566894531, "global_step": 503836, "epoch": 2999} {"train_loss": -12.03548526763916, "global_step": 503837, "epoch": 2999} {"train_loss": -12.322408676147461, "global_step": 503838, "epoch": 2999} {"train_loss": -12.27059555053711, "global_step": 503839, "epoch": 2999} {"train_loss": -12.27744197845459, "global_step": 503840, "epoch": 2999} {"train_loss": -11.971216201782227, "global_step": 503841, "epoch": 2999} {"train_loss": -12.339850425720215, "global_step": 503842, "epoch": 2999} {"train_loss": -12.036737442016602, "global_step": 503843, "epoch": 2999} {"train_loss": -12.40036392211914, "global_step": 503844, "epoch": 2999} {"train_loss": -12.267292022705078, "global_step": 503845, "epoch": 2999} {"train_loss": -12.553960800170898, "global_step": 503846, "epoch": 2999} {"train_loss": -12.4967041015625, "global_step": 503847, "epoch": 2999} {"train_loss": -12.492696762084961, "global_step": 503848, "epoch": 2999} {"train_loss": -12.632280349731445, "global_step": 503849, "epoch": 2999} {"train_loss": -12.56070613861084, "global_step": 503850, "epoch": 2999} {"train_loss": -12.54128646850586, "global_step": 503851, "epoch": 2999} {"train_loss": -12.500776290893555, "global_step": 503852, "epoch": 2999} {"train_loss": -12.70004653930664, "global_step": 503853, "epoch": 2999} {"train_loss": -12.531534194946289, "global_step": 503854, "epoch": 2999} {"train_loss": -12.542524337768555, "global_step": 503855, "epoch": 2999} {"train_loss": -12.478019714355469, "global_step": 503856, "epoch": 2999} {"train_loss": -12.913042068481445, "global_step": 503857, "epoch": 2999} {"train_loss": -12.633323669433594, "global_step": 503858, "epoch": 2999} {"train_loss": -12.796010971069336, "global_step": 503859, "epoch": 2999} {"train_loss": -12.595769882202148, "global_step": 503860, "epoch": 2999} {"train_loss": -12.772045135498047, "global_step": 503861, "epoch": 2999} {"train_loss": -12.65705394744873, "global_step": 503862, "epoch": 2999} {"train_loss": -12.683372497558594, "global_step": 503863, "epoch": 2999} {"train_loss": -12.80518913269043, "global_step": 503864, "epoch": 2999} {"train_loss": -12.644933700561523, "global_step": 503865, "epoch": 2999} {"train_loss": -12.77736759185791, "global_step": 503866, "epoch": 2999} {"train_loss": -12.592500686645508, "global_step": 503867, "epoch": 2999} {"train_loss": -12.517675399780273, "global_step": 503868, "epoch": 2999} {"train_loss": -12.808236122131348, "global_step": 503869, "epoch": 2999} {"train_loss": -12.496247291564941, "global_step": 503870, "epoch": 2999} {"train_loss": -12.552157402038574, "global_step": 503871, "epoch": 2999} {"train_loss": -12.294652938842773, "global_step": 503872, "epoch": 2999} {"train_loss": -12.775558471679688, "global_step": 503873, "epoch": 2999} {"train_loss": -12.841704368591309, "global_step": 503874, "epoch": 2999} {"train_loss": -12.824258804321289, "global_step": 503875, "epoch": 2999} {"train_loss": -12.823463439941406, "global_step": 503876, "epoch": 2999} {"train_loss": -12.77775764465332, "global_step": 503877, "epoch": 2999} {"train_loss": -12.781051635742188, "global_step": 503878, "epoch": 2999} {"train_loss": -12.884004592895508, "global_step": 503879, "epoch": 2999} {"train_loss": -13.001331329345703, "global_step": 503880, "epoch": 2999} {"train_loss": -12.808210372924805, "global_step": 503881, "epoch": 2999} {"train_loss": -12.898540496826172, "global_step": 503882, "epoch": 2999} {"train_loss": -12.962882041931152, "global_step": 503883, "epoch": 2999} {"train_loss": -12.58468246459961, "global_step": 503884, "epoch": 2999} {"train_loss": -12.755245208740234, "global_step": 503885, "epoch": 2999} {"train_loss": -12.764226913452148, "global_step": 503886, "epoch": 2999} {"train_loss": -12.474357604980469, "global_step": 503887, "epoch": 2999} {"train_loss": -12.229089736938477, "global_step": 503888, "epoch": 2999} {"train_loss": -12.93341064453125, "global_step": 503889, "epoch": 2999} {"train_loss": -12.49758243560791, "global_step": 503890, "epoch": 2999} {"train_loss": -12.653499603271484, "global_step": 503891, "epoch": 2999} {"train_loss": -12.930187225341797, "global_step": 503892, "epoch": 2999} {"train_loss": -12.679931640625, "global_step": 503893, "epoch": 2999} {"train_loss": -12.719369888305664, "global_step": 503894, "epoch": 2999} {"train_loss": -12.760601043701172, "global_step": 503895, "epoch": 2999} {"train_loss": -12.63661003112793, "global_step": 503896, "epoch": 2999} {"train_loss": -12.660144805908203, "global_step": 503897, "epoch": 2999} {"train_loss": -12.773536682128906, "global_step": 503898, "epoch": 2999} {"train_loss": -12.588934898376465, "global_step": 503899, "epoch": 2999} {"train_loss": -12.79432487487793, "global_step": 503900, "epoch": 2999} {"train_loss": -12.452155113220215, "global_step": 503901, "epoch": 2999} {"train_loss": -12.769372940063477, "global_step": 503902, "epoch": 2999} {"train_loss": -12.8836669921875, "global_step": 503903, "epoch": 2999} {"train_loss": -12.987346649169922, "global_step": 503904, "epoch": 2999} {"train_loss": -12.673831939697266, "global_step": 503905, "epoch": 2999} {"train_loss": -13.045910835266113, "global_step": 503906, "epoch": 2999} {"train_loss": -12.734586715698242, "global_step": 503907, "epoch": 2999} {"train_loss": -12.98755168914795, "global_step": 503908, "epoch": 2999} {"train_loss": -12.981165885925293, "global_step": 503909, "epoch": 2999} {"train_loss": -12.93836498260498, "global_step": 503910, "epoch": 2999} {"train_loss": -12.801247596740723, "global_step": 503911, "epoch": 2999} {"train_loss": -13.011017799377441, "global_step": 503912, "epoch": 2999} {"train_loss": -12.930704116821289, "global_step": 503913, "epoch": 2999} {"train_loss": -12.931901931762695, "global_step": 503914, "epoch": 2999} {"train_loss": -13.082669258117676, "global_step": 503915, "epoch": 2999} {"train_loss": -12.840097427368164, "global_step": 503916, "epoch": 2999} {"train_loss": -12.917945861816406, "global_step": 503917, "epoch": 2999} {"train_loss": -12.92357349395752, "global_step": 503918, "epoch": 2999} {"train_loss": -13.159120559692383, "global_step": 503919, "epoch": 2999} {"train_loss": -12.952373504638672, "global_step": 503920, "epoch": 2999} {"train_loss": -13.006490707397461, "global_step": 503921, "epoch": 2999} {"train_loss": -12.961984634399414, "global_step": 503922, "epoch": 2999} {"train_loss": -12.448063850402832, "global_step": 503923, "epoch": 2999} {"train_loss": -13.194766998291016, "global_step": 503924, "epoch": 2999} {"train_loss": -12.804481506347656, "global_step": 503925, "epoch": 2999} {"train_loss": -12.737942695617676, "global_step": 503926, "epoch": 2999} {"train_loss": -12.876546859741211, "global_step": 503927, "epoch": 2999} {"train_loss": -12.77776050567627, "global_step": 503928, "epoch": 2999} {"train_loss": -13.024876594543457, "global_step": 503929, "epoch": 2999} {"train_loss": -13.156933784484863, "global_step": 503930, "epoch": 2999} {"train_loss": -13.036643028259277, "global_step": 503931, "epoch": 2999} {"train_loss": -13.037924766540527, "global_step": 503932, "epoch": 2999} {"train_loss": -13.038114547729492, "global_step": 503933, "epoch": 2999} {"train_loss": -12.99495792388916, "global_step": 503934, "epoch": 2999} {"train_loss": -12.841440200805664, "global_step": 503935, "epoch": 2999} {"train_loss": -12.983967781066895, "global_step": 503936, "epoch": 2999} {"train_loss": -12.880825996398926, "global_step": 503937, "epoch": 2999} {"train_loss": -13.096545219421387, "global_step": 503938, "epoch": 2999} {"train_loss": -12.710623741149902, "global_step": 503939, "epoch": 2999} {"train_loss": -12.985712051391602, "global_step": 503940, "epoch": 2999} {"train_loss": -12.827173233032227, "global_step": 503941, "epoch": 2999} {"train_loss": -12.317493438720703, "global_step": 503942, "epoch": 2999} {"train_loss": -12.749584197998047, "global_step": 503943, "epoch": 2999} {"train_loss": -12.773294448852539, "global_step": 503944, "epoch": 2999} {"train_loss": -12.829696655273438, "global_step": 503945, "epoch": 2999} {"train_loss": -13.097498893737793, "global_step": 503946, "epoch": 2999} {"train_loss": -13.132579803466797, "global_step": 503947, "epoch": 2999} {"train_loss": -13.137121200561523, "global_step": 503948, "epoch": 2999} {"train_loss": -12.659063339233398, "global_step": 503949, "epoch": 2999} {"train_loss": -12.327716827392578, "global_step": 503950, "epoch": 2999} {"train_loss": -11.702276229858398, "global_step": 503951, "epoch": 2999} {"train_loss": -11.310306549072266, "global_step": 503952, "epoch": 2999} {"train_loss": -11.637017250061035, "global_step": 503953, "epoch": 2999} {"train_loss": -12.552651405334473, "global_step": 503954, "epoch": 2999} {"train_loss": -12.604032516479492, "global_step": 503955, "epoch": 2999} {"train_loss": -12.183913230895996, "global_step": 503956, "epoch": 2999} {"train_loss": -12.545589447021484, "global_step": 503957, "epoch": 2999} {"train_loss": -12.750734329223633, "global_step": 503958, "epoch": 2999} {"train_loss": -12.095869064331055, "global_step": 503959, "epoch": 2999} {"train_loss": -12.193906784057617, "global_step": 503960, "epoch": 2999} {"train_loss": -10.360897064208984, "global_step": 503961, "epoch": 2999} {"train_loss": -11.731115341186523, "global_step": 503962, "epoch": 2999} {"train_loss": -10.206355094909668, "global_step": 503963, "epoch": 2999} {"train_loss": -9.784847259521484, "global_step": 503964, "epoch": 2999} {"train_loss": -11.397241592407227, "global_step": 503965, "epoch": 2999} {"train_loss": -9.063020706176758, "global_step": 503966, "epoch": 2999} {"train_loss": -8.668746948242188, "global_step": 503967, "epoch": 2999} {"train_loss": -8.391841888427734, "global_step": 503968, "epoch": 2999} {"train_loss": -8.547060012817383, "global_step": 503969, "epoch": 2999} {"train_loss": -9.132562637329102, "global_step": 503970, "epoch": 2999} {"train_loss": -8.740121841430664, "global_step": 503971, "epoch": 2999} {"train_loss": -9.378570556640625, "global_step": 503972, "epoch": 2999} {"train_loss": -9.675370216369629, "global_step": 503973, "epoch": 2999} {"train_loss": -9.56908893585205, "global_step": 503974, "epoch": 2999} {"train_loss": -9.340675354003906, "global_step": 503975, "epoch": 2999} {"train_loss": -10.363842010498047, "global_step": 503976, "epoch": 2999} {"train_loss": -10.304302215576172, "global_step": 503977, "epoch": 2999} {"train_loss": -10.403690338134766, "global_step": 503978, "epoch": 2999} {"train_loss": -11.048357963562012, "global_step": 503979, "epoch": 2999} {"train_loss": -10.367952346801758, "global_step": 503980, "epoch": 2999} {"train_loss": -10.925861358642578, "global_step": 503981, "epoch": 2999} {"train_loss": -11.060820579528809, "global_step": 503982, "epoch": 2999} {"train_loss": -11.194540977478027, "global_step": 503983, "epoch": 2999} {"train_loss": -11.482101440429688, "global_step": 503984, "epoch": 2999} {"train_loss": -10.859529495239258, "global_step": 503985, "epoch": 2999} {"train_loss": -11.223468780517578, "global_step": 503986, "epoch": 2999} {"train_loss": -11.611003875732422, "global_step": 503987, "epoch": 2999} {"train_loss": -11.75935173034668, "global_step": 503988, "epoch": 2999} {"train_loss": -11.677871704101562, "global_step": 503989, "epoch": 2999} {"train_loss": -11.881912231445312, "global_step": 503990, "epoch": 2999} {"train_loss": -11.61102294921875, "global_step": 503991, "epoch": 2999} {"train_loss": -12.118155479431152, "global_step": 503992, "epoch": 2999} {"train_loss": -12.093378067016602, "global_step": 503993, "epoch": 2999} {"train_loss": -12.183202743530273, "global_step": 503994, "epoch": 2999} {"train_loss": -11.938961029052734, "global_step": 503995, "epoch": 2999} {"train_loss": -11.893301010131836, "global_step": 503996, "epoch": 2999} {"train_loss": -12.282011985778809, "global_step": 503997, "epoch": 2999} {"train_loss": -12.247482299804688, "global_step": 503998, "epoch": 2999} {"train_loss": -12.21392141637348, "global_step": 503999, "epoch": 2999, "val_loss": 319245.28125} {"train_loss": -12.126482963562012, "global_step": 504000, "epoch": 3000} {"train_loss": -11.7394380569458, "global_step": 504001, "epoch": 3000} {"train_loss": -12.134361267089844, "global_step": 504002, "epoch": 3000} {"train_loss": -12.434773445129395, "global_step": 504003, "epoch": 3000} {"train_loss": -12.354188919067383, "global_step": 504004, "epoch": 3000} {"train_loss": -11.934236526489258, "global_step": 504005, "epoch": 3000} {"train_loss": -12.394498825073242, "global_step": 504006, "epoch": 3000} {"train_loss": -12.318903923034668, "global_step": 504007, "epoch": 3000} {"train_loss": -12.17428207397461, "global_step": 504008, "epoch": 3000} {"train_loss": -11.697426795959473, "global_step": 504009, "epoch": 3000} {"train_loss": -12.227042198181152, "global_step": 504010, "epoch": 3000} {"train_loss": -12.615188598632812, "global_step": 504011, "epoch": 3000} {"train_loss": -12.4140043258667, "global_step": 504012, "epoch": 3000} {"train_loss": -12.400470733642578, "global_step": 504013, "epoch": 3000} {"train_loss": -12.218328475952148, "global_step": 504014, "epoch": 3000} {"train_loss": -12.609819412231445, "global_step": 504015, "epoch": 3000} {"train_loss": -12.027530670166016, "global_step": 504016, "epoch": 3000} {"train_loss": -12.235841751098633, "global_step": 504017, "epoch": 3000} {"train_loss": -12.245573043823242, "global_step": 504018, "epoch": 3000} {"train_loss": -12.155210494995117, "global_step": 504019, "epoch": 3000} {"train_loss": -12.479767799377441, "global_step": 504020, "epoch": 3000} {"train_loss": -12.561633110046387, "global_step": 504021, "epoch": 3000} {"train_loss": -12.171753883361816, "global_step": 504022, "epoch": 3000} {"train_loss": -11.907493591308594, "global_step": 504023, "epoch": 3000} {"train_loss": -11.944574356079102, "global_step": 504024, "epoch": 3000} {"train_loss": -11.802321434020996, "global_step": 504025, "epoch": 3000} {"train_loss": -12.392122268676758, "global_step": 504026, "epoch": 3000} {"train_loss": -11.535574913024902, "global_step": 504027, "epoch": 3000} {"train_loss": -12.326950073242188, "global_step": 504028, "epoch": 3000} {"train_loss": -12.15769100189209, "global_step": 504029, "epoch": 3000} {"train_loss": -12.424335479736328, "global_step": 504030, "epoch": 3000} {"train_loss": -11.643646240234375, "global_step": 504031, "epoch": 3000} {"train_loss": -12.545531272888184, "global_step": 504032, "epoch": 3000} {"train_loss": -11.585437774658203, "global_step": 504033, "epoch": 3000} {"train_loss": -11.855209350585938, "global_step": 504034, "epoch": 3000} {"train_loss": -11.616718292236328, "global_step": 504035, "epoch": 3000} {"train_loss": -11.694428443908691, "global_step": 504036, "epoch": 3000} {"train_loss": -11.809555053710938, "global_step": 504037, "epoch": 3000} {"train_loss": -12.046762466430664, "global_step": 504038, "epoch": 3000} {"train_loss": -11.761082649230957, "global_step": 504039, "epoch": 3000} {"train_loss": -11.663394927978516, "global_step": 504040, "epoch": 3000} {"train_loss": -12.121152877807617, "global_step": 504041, "epoch": 3000} {"train_loss": -11.955825805664062, "global_step": 504042, "epoch": 3000} {"train_loss": -11.822441101074219, "global_step": 504043, "epoch": 3000} {"train_loss": -11.673909187316895, "global_step": 504044, "epoch": 3000} {"train_loss": -11.187685012817383, "global_step": 504045, "epoch": 3000} {"train_loss": -11.527698516845703, "global_step": 504046, "epoch": 3000} {"train_loss": -10.78283977508545, "global_step": 504047, "epoch": 3000} {"train_loss": -12.016019821166992, "global_step": 504048, "epoch": 3000} {"train_loss": -10.942144393920898, "global_step": 504049, "epoch": 3000} {"train_loss": -12.618406295776367, "global_step": 504050, "epoch": 3000} {"train_loss": -11.30308723449707, "global_step": 504051, "epoch": 3000} {"train_loss": -12.15159797668457, "global_step": 504052, "epoch": 3000} {"train_loss": -11.941472053527832, "global_step": 504053, "epoch": 3000} {"train_loss": -11.271039962768555, "global_step": 504054, "epoch": 3000} {"train_loss": -12.550110816955566, "global_step": 504055, "epoch": 3000} {"train_loss": -11.240100860595703, "global_step": 504056, "epoch": 3000} {"train_loss": -12.557592391967773, "global_step": 504057, "epoch": 3000} {"train_loss": -11.331167221069336, "global_step": 504058, "epoch": 3000} {"train_loss": -12.134708404541016, "global_step": 504059, "epoch": 3000} {"train_loss": -11.951883316040039, "global_step": 504060, "epoch": 3000} {"train_loss": -11.612472534179688, "global_step": 504061, "epoch": 3000} {"train_loss": -12.51434326171875, "global_step": 504062, "epoch": 3000} {"train_loss": -11.761387825012207, "global_step": 504063, "epoch": 3000} {"train_loss": -11.738007545471191, "global_step": 504064, "epoch": 3000} {"train_loss": -12.371597290039062, "global_step": 504065, "epoch": 3000} {"train_loss": -11.896961212158203, "global_step": 504066, "epoch": 3000} {"train_loss": -12.054686546325684, "global_step": 504067, "epoch": 3000} {"train_loss": -12.155302047729492, "global_step": 504068, "epoch": 3000} {"train_loss": -11.207330703735352, "global_step": 504069, "epoch": 3000} {"train_loss": -12.129680633544922, "global_step": 504070, "epoch": 3000} {"train_loss": -11.75609302520752, "global_step": 504071, "epoch": 3000} {"train_loss": -12.050674438476562, "global_step": 504072, "epoch": 3000} {"train_loss": -12.245850563049316, "global_step": 504073, "epoch": 3000} {"train_loss": -12.075772285461426, "global_step": 504074, "epoch": 3000} {"train_loss": -12.377994537353516, "global_step": 504075, "epoch": 3000} {"train_loss": -12.626893997192383, "global_step": 504076, "epoch": 3000} {"train_loss": -12.289613723754883, "global_step": 504077, "epoch": 3000} {"train_loss": -12.030279159545898, "global_step": 504078, "epoch": 3000} {"train_loss": -12.282024383544922, "global_step": 504079, "epoch": 3000} {"train_loss": -12.320781707763672, "global_step": 504080, "epoch": 3000} {"train_loss": -12.454937934875488, "global_step": 504081, "epoch": 3000} {"train_loss": -12.160822868347168, "global_step": 504082, "epoch": 3000} {"train_loss": -12.283147811889648, "global_step": 504083, "epoch": 3000} {"train_loss": -12.59576416015625, "global_step": 504084, "epoch": 3000} {"train_loss": -12.002704620361328, "global_step": 504085, "epoch": 3000} {"train_loss": -12.450263023376465, "global_step": 504086, "epoch": 3000} {"train_loss": -11.614992141723633, "global_step": 504087, "epoch": 3000} {"train_loss": -12.192745208740234, "global_step": 504088, "epoch": 3000} {"train_loss": -12.495070457458496, "global_step": 504089, "epoch": 3000} {"train_loss": -11.999631881713867, "global_step": 504090, "epoch": 3000} {"train_loss": -12.830171585083008, "global_step": 504091, "epoch": 3000} {"train_loss": -12.102008819580078, "global_step": 504092, "epoch": 3000} {"train_loss": -12.356748580932617, "global_step": 504093, "epoch": 3000} {"train_loss": -12.434547424316406, "global_step": 504094, "epoch": 3000} {"train_loss": -11.849241256713867, "global_step": 504095, "epoch": 3000} {"train_loss": -12.688148498535156, "global_step": 504096, "epoch": 3000} {"train_loss": -12.138843536376953, "global_step": 504097, "epoch": 3000} {"train_loss": -12.774288177490234, "global_step": 504098, "epoch": 3000} {"train_loss": -12.505720138549805, "global_step": 504099, "epoch": 3000} {"train_loss": -12.495560646057129, "global_step": 504100, "epoch": 3000} {"train_loss": -12.588417053222656, "global_step": 504101, "epoch": 3000} {"train_loss": -12.514158248901367, "global_step": 504102, "epoch": 3000} {"train_loss": -12.579412460327148, "global_step": 504103, "epoch": 3000} {"train_loss": -12.595724105834961, "global_step": 504104, "epoch": 3000} {"train_loss": -12.569361686706543, "global_step": 504105, "epoch": 3000} {"train_loss": -12.741466522216797, "global_step": 504106, "epoch": 3000} {"train_loss": -12.191320419311523, "global_step": 504107, "epoch": 3000} {"train_loss": -12.897598266601562, "global_step": 504108, "epoch": 3000} {"train_loss": -12.541363716125488, "global_step": 504109, "epoch": 3000} {"train_loss": -12.432414054870605, "global_step": 504110, "epoch": 3000} {"train_loss": -12.47170352935791, "global_step": 504111, "epoch": 3000} {"train_loss": -12.045157432556152, "global_step": 504112, "epoch": 3000} {"train_loss": -12.662934303283691, "global_step": 504113, "epoch": 3000} {"train_loss": -12.433515548706055, "global_step": 504114, "epoch": 3000} {"train_loss": -12.434385299682617, "global_step": 504115, "epoch": 3000} {"train_loss": -12.305970191955566, "global_step": 504116, "epoch": 3000} {"train_loss": -12.392659187316895, "global_step": 504117, "epoch": 3000} {"train_loss": -12.59830093383789, "global_step": 504118, "epoch": 3000} {"train_loss": -12.423772811889648, "global_step": 504119, "epoch": 3000} {"train_loss": -12.779375076293945, "global_step": 504120, "epoch": 3000} {"train_loss": -12.60545539855957, "global_step": 504121, "epoch": 3000} {"train_loss": -12.63829231262207, "global_step": 504122, "epoch": 3000} {"train_loss": -12.744941711425781, "global_step": 504123, "epoch": 3000} {"train_loss": -12.552759170532227, "global_step": 504124, "epoch": 3000} {"train_loss": -12.785682678222656, "global_step": 504125, "epoch": 3000} {"train_loss": -12.58298110961914, "global_step": 504126, "epoch": 3000} {"train_loss": -12.6824951171875, "global_step": 504127, "epoch": 3000} {"train_loss": -12.332263946533203, "global_step": 504128, "epoch": 3000} {"train_loss": -12.763138771057129, "global_step": 504129, "epoch": 3000} {"train_loss": -12.728708267211914, "global_step": 504130, "epoch": 3000} {"train_loss": -12.421113014221191, "global_step": 504131, "epoch": 3000} {"train_loss": -13.088956832885742, "global_step": 504132, "epoch": 3000} {"train_loss": -12.70276165008545, "global_step": 504133, "epoch": 3000} {"train_loss": -12.967219352722168, "global_step": 504134, "epoch": 3000} {"train_loss": -12.82275676727295, "global_step": 504135, "epoch": 3000} {"train_loss": -12.452987670898438, "global_step": 504136, "epoch": 3000} {"train_loss": -12.92910385131836, "global_step": 504137, "epoch": 3000} {"train_loss": -12.795236587524414, "global_step": 504138, "epoch": 3000} {"train_loss": -12.87270450592041, "global_step": 504139, "epoch": 3000} {"train_loss": -12.695123672485352, "global_step": 504140, "epoch": 3000} {"train_loss": -12.733922004699707, "global_step": 504141, "epoch": 3000} {"train_loss": -13.00509262084961, "global_step": 504142, "epoch": 3000} {"train_loss": -12.988235473632812, "global_step": 504143, "epoch": 3000} {"train_loss": -12.72722053527832, "global_step": 504144, "epoch": 3000} {"train_loss": -12.846010208129883, "global_step": 504145, "epoch": 3000} {"train_loss": -12.230729103088379, "global_step": 504146, "epoch": 3000} {"train_loss": -12.672157287597656, "global_step": 504147, "epoch": 3000} {"train_loss": -12.592784881591797, "global_step": 504148, "epoch": 3000} {"train_loss": -12.441522598266602, "global_step": 504149, "epoch": 3000} {"train_loss": -12.840391159057617, "global_step": 504150, "epoch": 3000} {"train_loss": -12.789860725402832, "global_step": 504151, "epoch": 3000} {"train_loss": -12.584774017333984, "global_step": 504152, "epoch": 3000} {"train_loss": -12.99925422668457, "global_step": 504153, "epoch": 3000} {"train_loss": -12.763896942138672, "global_step": 504154, "epoch": 3000} {"train_loss": -13.123806953430176, "global_step": 504155, "epoch": 3000} {"train_loss": -12.762642860412598, "global_step": 504156, "epoch": 3000} {"train_loss": -12.865468978881836, "global_step": 504157, "epoch": 3000} {"train_loss": -13.088296890258789, "global_step": 504158, "epoch": 3000} {"train_loss": -12.885305404663086, "global_step": 504159, "epoch": 3000} {"train_loss": -13.059349060058594, "global_step": 504160, "epoch": 3000} {"train_loss": -13.031108856201172, "global_step": 504161, "epoch": 3000} {"train_loss": -12.816289901733398, "global_step": 504162, "epoch": 3000} {"train_loss": -13.239710807800293, "global_step": 504163, "epoch": 3000} {"train_loss": -12.987813949584961, "global_step": 504164, "epoch": 3000} {"train_loss": -13.095413208007812, "global_step": 504165, "epoch": 3000} {"train_loss": -12.899975776672363, "global_step": 504166, "epoch": 3000} {"train_loss": -12.326893641835166, "global_step": 504167, "epoch": 3000, "train/sim_max_reward_0": 0.686444424831207, "train/sim_max_reward_1": 0.9555079353305205, "train/sim_max_reward_2": 0.0024770105396779963, "train/sim_max_reward_3": 0.41741416688845107, "train/sim_max_reward_4": 0.9540001630155849, "train/sim_max_reward_5": 0.526489577315262, "test/sim_max_reward_4400000": 0.97134170046319, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 0.9536918149488899, "test/sim_max_reward_4400003": 0.4263232088103948, "test/sim_max_reward_4400004": 0.6786144699987606, "test/sim_max_reward_4400005": 0.9623142785497808, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 0.4458992137847457, "test/sim_max_reward_4400008": 0.6528521421713942, "test/sim_max_reward_4400009": 0.030663166717427387, "test/sim_max_reward_4400010": 0.10942431142043765, "test/sim_max_reward_4400011": 0.3148320751352504, "test/sim_max_reward_4400012": 0.14110722128947978, "test/sim_max_reward_4400013": 0.9625204271262848, "test/sim_max_reward_4400014": 0.6104896939054841, "test/sim_max_reward_4400015": 0.43474117498339465, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.1083494733531248, "test/sim_max_reward_4400018": 0.9183849995678349, "test/sim_max_reward_4400019": 0.3946885838031122, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.6956189774905427, "test/sim_max_reward_4400022": 1.0, "test/sim_max_reward_4400023": 0.13841541685454872, "test/sim_max_reward_4400024": 1.0, "test/sim_max_reward_4400025": 0.6135279386004266, "test/sim_max_reward_4400026": 0.0, "test/sim_max_reward_4400027": 0.45416587909088624, "test/sim_max_reward_4400028": 0.7164800131683211, "test/sim_max_reward_4400029": 0.0, "test/sim_max_reward_4400030": 1.0, "test/sim_max_reward_4400031": 0.9922362622070807, "test/sim_max_reward_4400032": 0.0, "test/sim_max_reward_4400033": 0.38424757665441595, "test/sim_max_reward_4400034": 0.4541360734525507, "test/sim_max_reward_4400035": 0.2843255843720266, "test/sim_max_reward_4400036": 0.4420608947322188, "test/sim_max_reward_4400037": 0.7703343195054987, "test/sim_max_reward_4400038": 0.2838738567079004, "test/sim_max_reward_4400039": 0.41228375460481864, "test/sim_max_reward_4400040": 0.0, "test/sim_max_reward_4400041": 0.8807708073416343, "test/sim_max_reward_4400042": 0.4230674618787985, "test/sim_max_reward_4400043": 0.008853150357995025, "test/sim_max_reward_4400044": 0.6626994958524535, "test/sim_max_reward_4400045": 0.12053031908692156, "test/sim_max_reward_4400046": 0.8147516095831165, "test/sim_max_reward_4400047": 0.9839604595878774, "test/sim_max_reward_4400048": 0.0, "test/sim_max_reward_4400049": 0.0, "train/mean_score": 0.5903888796534505, "test/mean_score": 0.4930515561431804, "val_loss": 320909.125, "train_action_mse_error": 1.7033298015594482} {"train_loss": -12.737170219421387, "global_step": 504168, "epoch": 3001} {"train_loss": -12.614985466003418, "global_step": 504169, "epoch": 3001} {"train_loss": -12.893129348754883, "global_step": 504170, "epoch": 3001} {"train_loss": -12.31888198852539, "global_step": 504171, "epoch": 3001} {"train_loss": -12.552881240844727, "global_step": 504172, "epoch": 3001} {"train_loss": -12.977701187133789, "global_step": 504173, "epoch": 3001} {"train_loss": -12.451297760009766, "global_step": 504174, "epoch": 3001} {"train_loss": -12.243521690368652, "global_step": 504175, "epoch": 3001} {"train_loss": -12.37672233581543, "global_step": 504176, "epoch": 3001} {"train_loss": -13.150531768798828, "global_step": 504177, "epoch": 3001} {"train_loss": -12.103715896606445, "global_step": 504178, "epoch": 3001} {"train_loss": -12.704977035522461, "global_step": 504179, "epoch": 3001} {"train_loss": -12.970149993896484, "global_step": 504180, "epoch": 3001} {"train_loss": -12.81417465209961, "global_step": 504181, "epoch": 3001} {"train_loss": -12.936872482299805, "global_step": 504182, "epoch": 3001} {"train_loss": -12.60157585144043, "global_step": 504183, "epoch": 3001} {"train_loss": -12.313711166381836, "global_step": 504184, "epoch": 3001} {"train_loss": -11.870059967041016, "global_step": 504185, "epoch": 3001} {"train_loss": -12.400962829589844, "global_step": 504186, "epoch": 3001} {"train_loss": -12.649171829223633, "global_step": 504187, "epoch": 3001} {"train_loss": -12.565591812133789, "global_step": 504188, "epoch": 3001} {"train_loss": -12.644630432128906, "global_step": 504189, "epoch": 3001} {"train_loss": -13.068934440612793, "global_step": 504190, "epoch": 3001} {"train_loss": -12.480854034423828, "global_step": 504191, "epoch": 3001} {"train_loss": -12.526422500610352, "global_step": 504192, "epoch": 3001} {"train_loss": -12.60525894165039, "global_step": 504193, "epoch": 3001} {"train_loss": -12.513777732849121, "global_step": 504194, "epoch": 3001} {"train_loss": -12.928024291992188, "global_step": 504195, "epoch": 3001} {"train_loss": -12.241754531860352, "global_step": 504196, "epoch": 3001} {"train_loss": -12.593860626220703, "global_step": 504197, "epoch": 3001} {"train_loss": -12.540815353393555, "global_step": 504198, "epoch": 3001} {"train_loss": -12.598285675048828, "global_step": 504199, "epoch": 3001} {"train_loss": -10.865386962890625, "global_step": 504200, "epoch": 3001} {"train_loss": -12.717827796936035, "global_step": 504201, "epoch": 3001} {"train_loss": -11.347784996032715, "global_step": 504202, "epoch": 3001} {"train_loss": -11.536628723144531, "global_step": 504203, "epoch": 3001} {"train_loss": -12.172658920288086, "global_step": 504204, "epoch": 3001} {"train_loss": -12.321027755737305, "global_step": 504205, "epoch": 3001} {"train_loss": -11.651423454284668, "global_step": 504206, "epoch": 3001} {"train_loss": -11.530900955200195, "global_step": 504207, "epoch": 3001} {"train_loss": -10.849906921386719, "global_step": 504208, "epoch": 3001} {"train_loss": -10.595909118652344, "global_step": 504209, "epoch": 3001} {"train_loss": -11.362081527709961, "global_step": 504210, "epoch": 3001} {"train_loss": -9.691585540771484, "global_step": 504211, "epoch": 3001} {"train_loss": -10.207109451293945, "global_step": 504212, "epoch": 3001} {"train_loss": -9.321378707885742, "global_step": 504213, "epoch": 3001} {"train_loss": -9.354820251464844, "global_step": 504214, "epoch": 3001} {"train_loss": -10.078250885009766, "global_step": 504215, "epoch": 3001} {"train_loss": -9.78543472290039, "global_step": 504216, "epoch": 3001} {"train_loss": -9.452024459838867, "global_step": 504217, "epoch": 3001} {"train_loss": -7.5988006591796875, "global_step": 504218, "epoch": 3001} {"train_loss": -9.082220077514648, "global_step": 504219, "epoch": 3001} {"train_loss": -8.525229454040527, "global_step": 504220, "epoch": 3001} {"train_loss": -10.566339492797852, "global_step": 504221, "epoch": 3001} {"train_loss": -6.852919101715088, "global_step": 504222, "epoch": 3001} {"train_loss": -6.624186038970947, "global_step": 504223, "epoch": 3001} {"train_loss": -6.625261306762695, "global_step": 504224, "epoch": 3001} {"train_loss": -6.4146728515625, "global_step": 504225, "epoch": 3001} {"train_loss": -5.935769081115723, "global_step": 504226, "epoch": 3001} {"train_loss": -6.743886947631836, "global_step": 504227, "epoch": 3001} {"train_loss": -7.975010871887207, "global_step": 504228, "epoch": 3001} {"train_loss": -7.813793182373047, "global_step": 504229, "epoch": 3001} {"train_loss": -7.785769462585449, "global_step": 504230, "epoch": 3001} {"train_loss": -8.622858047485352, "global_step": 504231, "epoch": 3001} {"train_loss": -8.369308471679688, "global_step": 504232, "epoch": 3001} {"train_loss": -8.202339172363281, "global_step": 504233, "epoch": 3001} {"train_loss": -9.130428314208984, "global_step": 504234, "epoch": 3001} {"train_loss": -8.819950103759766, "global_step": 504235, "epoch": 3001} {"train_loss": -9.39391803741455, "global_step": 504236, "epoch": 3001} {"train_loss": -10.021846771240234, "global_step": 504237, "epoch": 3001} {"train_loss": -10.376500129699707, "global_step": 504238, "epoch": 3001} {"train_loss": -10.587081909179688, "global_step": 504239, "epoch": 3001} {"train_loss": -10.816356658935547, "global_step": 504240, "epoch": 3001} {"train_loss": -10.505759239196777, "global_step": 504241, "epoch": 3001} {"train_loss": -10.404407501220703, "global_step": 504242, "epoch": 3001} {"train_loss": -10.258522033691406, "global_step": 504243, "epoch": 3001} {"train_loss": -10.508235931396484, "global_step": 504244, "epoch": 3001} {"train_loss": -10.934399604797363, "global_step": 504245, "epoch": 3001} {"train_loss": -11.04134464263916, "global_step": 504246, "epoch": 3001} {"train_loss": -11.24951457977295, "global_step": 504247, "epoch": 3001} {"train_loss": -11.376825332641602, "global_step": 504248, "epoch": 3001} {"train_loss": -11.094900131225586, "global_step": 504249, "epoch": 3001} {"train_loss": -11.411619186401367, "global_step": 504250, "epoch": 3001} {"train_loss": -11.459761619567871, "global_step": 504251, "epoch": 3001} {"train_loss": -11.718342781066895, "global_step": 504252, "epoch": 3001} {"train_loss": -11.602245330810547, "global_step": 504253, "epoch": 3001} {"train_loss": -11.715814590454102, "global_step": 504254, "epoch": 3001} {"train_loss": -11.378396987915039, "global_step": 504255, "epoch": 3001} {"train_loss": -12.0621337890625, "global_step": 504256, "epoch": 3001} {"train_loss": -11.605350494384766, "global_step": 504257, "epoch": 3001} {"train_loss": -11.678909301757812, "global_step": 504258, "epoch": 3001} {"train_loss": -11.508596420288086, "global_step": 504259, "epoch": 3001} {"train_loss": -11.416028022766113, "global_step": 504260, "epoch": 3001} {"train_loss": -11.646344184875488, "global_step": 504261, "epoch": 3001} {"train_loss": -12.147623062133789, "global_step": 504262, "epoch": 3001} {"train_loss": -11.520533561706543, "global_step": 504263, "epoch": 3001} {"train_loss": -11.740406036376953, "global_step": 504264, "epoch": 3001} {"train_loss": -12.04282283782959, "global_step": 504265, "epoch": 3001} {"train_loss": -11.707975387573242, "global_step": 504266, "epoch": 3001} {"train_loss": -11.682840347290039, "global_step": 504267, "epoch": 3001} {"train_loss": -12.030790328979492, "global_step": 504268, "epoch": 3001} {"train_loss": -12.050887107849121, "global_step": 504269, "epoch": 3001} {"train_loss": -12.118866920471191, "global_step": 504270, "epoch": 3001} {"train_loss": -11.991443634033203, "global_step": 504271, "epoch": 3001} {"train_loss": -12.31714153289795, "global_step": 504272, "epoch": 3001} {"train_loss": -12.3766450881958, "global_step": 504273, "epoch": 3001} {"train_loss": -12.205007553100586, "global_step": 504274, "epoch": 3001} {"train_loss": -12.306583404541016, "global_step": 504275, "epoch": 3001} {"train_loss": -12.02099609375, "global_step": 504276, "epoch": 3001} {"train_loss": -12.283571243286133, "global_step": 504277, "epoch": 3001} {"train_loss": -12.158628463745117, "global_step": 504278, "epoch": 3001} {"train_loss": -12.21607780456543, "global_step": 504279, "epoch": 3001} {"train_loss": -12.280162811279297, "global_step": 504280, "epoch": 3001} {"train_loss": -12.4210786819458, "global_step": 504281, "epoch": 3001} {"train_loss": -12.276168823242188, "global_step": 504282, "epoch": 3001} {"train_loss": -12.465824127197266, "global_step": 504283, "epoch": 3001} {"train_loss": -12.317194938659668, "global_step": 504284, "epoch": 3001} {"train_loss": -12.325692176818848, "global_step": 504285, "epoch": 3001} {"train_loss": -12.524619102478027, "global_step": 504286, "epoch": 3001} {"train_loss": -12.156167030334473, "global_step": 504287, "epoch": 3001} {"train_loss": -12.44632339477539, "global_step": 504288, "epoch": 3001} {"train_loss": -12.415887832641602, "global_step": 504289, "epoch": 3001} {"train_loss": -12.412149429321289, "global_step": 504290, "epoch": 3001} {"train_loss": -12.628207206726074, "global_step": 504291, "epoch": 3001} {"train_loss": -12.637731552124023, "global_step": 504292, "epoch": 3001} {"train_loss": -12.519548416137695, "global_step": 504293, "epoch": 3001} {"train_loss": -12.635083198547363, "global_step": 504294, "epoch": 3001} {"train_loss": -12.630327224731445, "global_step": 504295, "epoch": 3001} {"train_loss": -12.701194763183594, "global_step": 504296, "epoch": 3001} {"train_loss": -12.617537498474121, "global_step": 504297, "epoch": 3001} {"train_loss": -12.686393737792969, "global_step": 504298, "epoch": 3001} {"train_loss": -12.814010620117188, "global_step": 504299, "epoch": 3001} {"train_loss": -12.618932723999023, "global_step": 504300, "epoch": 3001} {"train_loss": -12.807035446166992, "global_step": 504301, "epoch": 3001} {"train_loss": -12.630087852478027, "global_step": 504302, "epoch": 3001} {"train_loss": -12.91558837890625, "global_step": 504303, "epoch": 3001} {"train_loss": -12.753143310546875, "global_step": 504304, "epoch": 3001} {"train_loss": -12.491947174072266, "global_step": 504305, "epoch": 3001} {"train_loss": -12.780183792114258, "global_step": 504306, "epoch": 3001} {"train_loss": -12.741544723510742, "global_step": 504307, "epoch": 3001} {"train_loss": -12.77880859375, "global_step": 504308, "epoch": 3001} {"train_loss": -12.483765602111816, "global_step": 504309, "epoch": 3001} {"train_loss": -12.560803413391113, "global_step": 504310, "epoch": 3001} {"train_loss": -12.55617904663086, "global_step": 504311, "epoch": 3001} {"train_loss": -12.734237670898438, "global_step": 504312, "epoch": 3001} {"train_loss": -12.428667068481445, "global_step": 504313, "epoch": 3001} {"train_loss": -12.792478561401367, "global_step": 504314, "epoch": 3001} {"train_loss": -12.54544448852539, "global_step": 504315, "epoch": 3001} {"train_loss": -12.601097106933594, "global_step": 504316, "epoch": 3001} {"train_loss": -12.710530281066895, "global_step": 504317, "epoch": 3001} {"train_loss": -12.705520629882812, "global_step": 504318, "epoch": 3001} {"train_loss": -12.712822914123535, "global_step": 504319, "epoch": 3001} {"train_loss": -12.846968650817871, "global_step": 504320, "epoch": 3001} {"train_loss": -12.73774528503418, "global_step": 504321, "epoch": 3001} {"train_loss": -12.780618667602539, "global_step": 504322, "epoch": 3001} {"train_loss": -12.938070297241211, "global_step": 504323, "epoch": 3001} {"train_loss": -12.886332511901855, "global_step": 504324, "epoch": 3001} {"train_loss": -12.753896713256836, "global_step": 504325, "epoch": 3001} {"train_loss": -12.883164405822754, "global_step": 504326, "epoch": 3001} {"train_loss": -12.891149520874023, "global_step": 504327, "epoch": 3001} {"train_loss": -12.957834243774414, "global_step": 504328, "epoch": 3001} {"train_loss": -12.904375076293945, "global_step": 504329, "epoch": 3001} {"train_loss": -12.88487720489502, "global_step": 504330, "epoch": 3001} {"train_loss": -12.925630569458008, "global_step": 504331, "epoch": 3001} {"train_loss": -12.847970962524414, "global_step": 504332, "epoch": 3001} {"train_loss": -12.917461395263672, "global_step": 504333, "epoch": 3001} {"train_loss": -12.795793533325195, "global_step": 504334, "epoch": 3001} {"train_loss": -11.626984511102949, "global_step": 504335, "epoch": 3001, "val_loss": 315925.21875} {"train_loss": -13.058568000793457, "global_step": 504336, "epoch": 3002} {"train_loss": -12.913640975952148, "global_step": 504337, "epoch": 3002} {"train_loss": -12.871960639953613, "global_step": 504338, "epoch": 3002} {"train_loss": -12.894895553588867, "global_step": 504339, "epoch": 3002} {"train_loss": -12.834321022033691, "global_step": 504340, "epoch": 3002} {"train_loss": -12.957268714904785, "global_step": 504341, "epoch": 3002} {"train_loss": -12.941299438476562, "global_step": 504342, "epoch": 3002} {"train_loss": -12.79692268371582, "global_step": 504343, "epoch": 3002} {"train_loss": -12.99274730682373, "global_step": 504344, "epoch": 3002} {"train_loss": -12.975248336791992, "global_step": 504345, "epoch": 3002} {"train_loss": -13.210290908813477, "global_step": 504346, "epoch": 3002} {"train_loss": -12.830779075622559, "global_step": 504347, "epoch": 3002} {"train_loss": -12.98338508605957, "global_step": 504348, "epoch": 3002} {"train_loss": -13.046855926513672, "global_step": 504349, "epoch": 3002} {"train_loss": -12.707698822021484, "global_step": 504350, "epoch": 3002} {"train_loss": -13.127978324890137, "global_step": 504351, "epoch": 3002} {"train_loss": -12.975587844848633, "global_step": 504352, "epoch": 3002} {"train_loss": -12.675315856933594, "global_step": 504353, "epoch": 3002} {"train_loss": -12.693320274353027, "global_step": 504354, "epoch": 3002} {"train_loss": -13.014638900756836, "global_step": 504355, "epoch": 3002} {"train_loss": -13.043371200561523, "global_step": 504356, "epoch": 3002} {"train_loss": -13.113161087036133, "global_step": 504357, "epoch": 3002} {"train_loss": -12.606510162353516, "global_step": 504358, "epoch": 3002} {"train_loss": -12.886143684387207, "global_step": 504359, "epoch": 3002} {"train_loss": -12.945810317993164, "global_step": 504360, "epoch": 3002} {"train_loss": -12.51940631866455, "global_step": 504361, "epoch": 3002} {"train_loss": -12.463868141174316, "global_step": 504362, "epoch": 3002} {"train_loss": -12.6798095703125, "global_step": 504363, "epoch": 3002} {"train_loss": -12.105671882629395, "global_step": 504364, "epoch": 3002} {"train_loss": -11.940040588378906, "global_step": 504365, "epoch": 3002} {"train_loss": -12.573675155639648, "global_step": 504366, "epoch": 3002} {"train_loss": -11.177131652832031, "global_step": 504367, "epoch": 3002} {"train_loss": -10.450440406799316, "global_step": 504368, "epoch": 3002} {"train_loss": -11.852675437927246, "global_step": 504369, "epoch": 3002} {"train_loss": -11.11198616027832, "global_step": 504370, "epoch": 3002} {"train_loss": -11.909201622009277, "global_step": 504371, "epoch": 3002} {"train_loss": -9.48801040649414, "global_step": 504372, "epoch": 3002} {"train_loss": -10.307821273803711, "global_step": 504373, "epoch": 3002} {"train_loss": -8.403637886047363, "global_step": 504374, "epoch": 3002} {"train_loss": -7.801748275756836, "global_step": 504375, "epoch": 3002} {"train_loss": -8.476996421813965, "global_step": 504376, "epoch": 3002} {"train_loss": -8.479917526245117, "global_step": 504377, "epoch": 3002} {"train_loss": -8.601959228515625, "global_step": 504378, "epoch": 3002} {"train_loss": -8.708677291870117, "global_step": 504379, "epoch": 3002} {"train_loss": -9.712631225585938, "global_step": 504380, "epoch": 3002} {"train_loss": -8.953291893005371, "global_step": 504381, "epoch": 3002} {"train_loss": -9.124750137329102, "global_step": 504382, "epoch": 3002} {"train_loss": -9.026031494140625, "global_step": 504383, "epoch": 3002} {"train_loss": -9.199942588806152, "global_step": 504384, "epoch": 3002} {"train_loss": -10.211833953857422, "global_step": 504385, "epoch": 3002} {"train_loss": -9.526420593261719, "global_step": 504386, "epoch": 3002} {"train_loss": -8.81207275390625, "global_step": 504387, "epoch": 3002} {"train_loss": -10.486681938171387, "global_step": 504388, "epoch": 3002} {"train_loss": -9.921150207519531, "global_step": 504389, "epoch": 3002} {"train_loss": -10.045001029968262, "global_step": 504390, "epoch": 3002} {"train_loss": -11.118026733398438, "global_step": 504391, "epoch": 3002} {"train_loss": -10.473176956176758, "global_step": 504392, "epoch": 3002} {"train_loss": -10.96490478515625, "global_step": 504393, "epoch": 3002} {"train_loss": -11.175403594970703, "global_step": 504394, "epoch": 3002} {"train_loss": -11.133209228515625, "global_step": 504395, "epoch": 3002} {"train_loss": -11.658614158630371, "global_step": 504396, "epoch": 3002} {"train_loss": -10.926130294799805, "global_step": 504397, "epoch": 3002} {"train_loss": -11.858710289001465, "global_step": 504398, "epoch": 3002} {"train_loss": -11.309083938598633, "global_step": 504399, "epoch": 3002} {"train_loss": -11.815120697021484, "global_step": 504400, "epoch": 3002} {"train_loss": -11.546197891235352, "global_step": 504401, "epoch": 3002} {"train_loss": -11.603307723999023, "global_step": 504402, "epoch": 3002} {"train_loss": -11.816600799560547, "global_step": 504403, "epoch": 3002} {"train_loss": -11.751408576965332, "global_step": 504404, "epoch": 3002} {"train_loss": -11.764511108398438, "global_step": 504405, "epoch": 3002} {"train_loss": -11.912405014038086, "global_step": 504406, "epoch": 3002} {"train_loss": -12.127252578735352, "global_step": 504407, "epoch": 3002} {"train_loss": -11.913309097290039, "global_step": 504408, "epoch": 3002} {"train_loss": -12.324252128601074, "global_step": 504409, "epoch": 3002} {"train_loss": -12.246423721313477, "global_step": 504410, "epoch": 3002} {"train_loss": -11.802123069763184, "global_step": 504411, "epoch": 3002} {"train_loss": -11.83824348449707, "global_step": 504412, "epoch": 3002} {"train_loss": -12.186609268188477, "global_step": 504413, "epoch": 3002} {"train_loss": -12.069657325744629, "global_step": 504414, "epoch": 3002} {"train_loss": -11.846516609191895, "global_step": 504415, "epoch": 3002} {"train_loss": -11.979976654052734, "global_step": 504416, "epoch": 3002} {"train_loss": -12.398050308227539, "global_step": 504417, "epoch": 3002} {"train_loss": -11.81612777709961, "global_step": 504418, "epoch": 3002} {"train_loss": -12.536459922790527, "global_step": 504419, "epoch": 3002} {"train_loss": -11.818050384521484, "global_step": 504420, "epoch": 3002} {"train_loss": -12.303802490234375, "global_step": 504421, "epoch": 3002} {"train_loss": -12.012914657592773, "global_step": 504422, "epoch": 3002} {"train_loss": -12.073381423950195, "global_step": 504423, "epoch": 3002} {"train_loss": -12.33316421508789, "global_step": 504424, "epoch": 3002} {"train_loss": -12.068410873413086, "global_step": 504425, "epoch": 3002} {"train_loss": -12.436857223510742, "global_step": 504426, "epoch": 3002} {"train_loss": -12.25240421295166, "global_step": 504427, "epoch": 3002} {"train_loss": -12.311908721923828, "global_step": 504428, "epoch": 3002} {"train_loss": -12.582696914672852, "global_step": 504429, "epoch": 3002} {"train_loss": -11.888835906982422, "global_step": 504430, "epoch": 3002} {"train_loss": -11.803777694702148, "global_step": 504431, "epoch": 3002} {"train_loss": -12.522350311279297, "global_step": 504432, "epoch": 3002} {"train_loss": -12.015491485595703, "global_step": 504433, "epoch": 3002} {"train_loss": -11.938751220703125, "global_step": 504434, "epoch": 3002} {"train_loss": -12.490872383117676, "global_step": 504435, "epoch": 3002} {"train_loss": -11.700274467468262, "global_step": 504436, "epoch": 3002} {"train_loss": -12.590249061584473, "global_step": 504437, "epoch": 3002} {"train_loss": -11.941818237304688, "global_step": 504438, "epoch": 3002} {"train_loss": -11.973331451416016, "global_step": 504439, "epoch": 3002} {"train_loss": -12.407428741455078, "global_step": 504440, "epoch": 3002} {"train_loss": -11.97032356262207, "global_step": 504441, "epoch": 3002} {"train_loss": -12.156472206115723, "global_step": 504442, "epoch": 3002} {"train_loss": -12.334218978881836, "global_step": 504443, "epoch": 3002} {"train_loss": -11.611017227172852, "global_step": 504444, "epoch": 3002} {"train_loss": -12.360551834106445, "global_step": 504445, "epoch": 3002} {"train_loss": -11.059096336364746, "global_step": 504446, "epoch": 3002} {"train_loss": -12.246894836425781, "global_step": 504447, "epoch": 3002} {"train_loss": -11.40939998626709, "global_step": 504448, "epoch": 3002} {"train_loss": -12.09864330291748, "global_step": 504449, "epoch": 3002} {"train_loss": -11.310819625854492, "global_step": 504450, "epoch": 3002} {"train_loss": -12.054288864135742, "global_step": 504451, "epoch": 3002} {"train_loss": -11.918951034545898, "global_step": 504452, "epoch": 3002} {"train_loss": -11.151535987854004, "global_step": 504453, "epoch": 3002} {"train_loss": -12.414972305297852, "global_step": 504454, "epoch": 3002} {"train_loss": -11.031465530395508, "global_step": 504455, "epoch": 3002} {"train_loss": -12.104166984558105, "global_step": 504456, "epoch": 3002} {"train_loss": -11.810771942138672, "global_step": 504457, "epoch": 3002} {"train_loss": -11.862468719482422, "global_step": 504458, "epoch": 3002} {"train_loss": -12.227401733398438, "global_step": 504459, "epoch": 3002} {"train_loss": -12.057291030883789, "global_step": 504460, "epoch": 3002} {"train_loss": -11.233766555786133, "global_step": 504461, "epoch": 3002} {"train_loss": -12.342445373535156, "global_step": 504462, "epoch": 3002} {"train_loss": -11.26473617553711, "global_step": 504463, "epoch": 3002} {"train_loss": -11.909990310668945, "global_step": 504464, "epoch": 3002} {"train_loss": -11.459874153137207, "global_step": 504465, "epoch": 3002} {"train_loss": -11.129915237426758, "global_step": 504466, "epoch": 3002} {"train_loss": -12.036396026611328, "global_step": 504467, "epoch": 3002} {"train_loss": -12.117637634277344, "global_step": 504468, "epoch": 3002} {"train_loss": -11.34024715423584, "global_step": 504469, "epoch": 3002} {"train_loss": -12.138273239135742, "global_step": 504470, "epoch": 3002} {"train_loss": -11.571495056152344, "global_step": 504471, "epoch": 3002} {"train_loss": -11.752982139587402, "global_step": 504472, "epoch": 3002} {"train_loss": -11.53274917602539, "global_step": 504473, "epoch": 3002} {"train_loss": -12.360197067260742, "global_step": 504474, "epoch": 3002} {"train_loss": -11.433212280273438, "global_step": 504475, "epoch": 3002} {"train_loss": -12.338318824768066, "global_step": 504476, "epoch": 3002} {"train_loss": -12.141437530517578, "global_step": 504477, "epoch": 3002} {"train_loss": -12.555465698242188, "global_step": 504478, "epoch": 3002} {"train_loss": -12.056490898132324, "global_step": 504479, "epoch": 3002} {"train_loss": -12.453267097473145, "global_step": 504480, "epoch": 3002} {"train_loss": -12.24323844909668, "global_step": 504481, "epoch": 3002} {"train_loss": -12.361270904541016, "global_step": 504482, "epoch": 3002} {"train_loss": -12.637368202209473, "global_step": 504483, "epoch": 3002} {"train_loss": -12.272771835327148, "global_step": 504484, "epoch": 3002} {"train_loss": -12.882960319519043, "global_step": 504485, "epoch": 3002} {"train_loss": -12.385171890258789, "global_step": 504486, "epoch": 3002} {"train_loss": -12.659029006958008, "global_step": 504487, "epoch": 3002} {"train_loss": -12.426941871643066, "global_step": 504488, "epoch": 3002} {"train_loss": -12.521235466003418, "global_step": 504489, "epoch": 3002} {"train_loss": -12.382108688354492, "global_step": 504490, "epoch": 3002} {"train_loss": -12.69632625579834, "global_step": 504491, "epoch": 3002} {"train_loss": -12.391571044921875, "global_step": 504492, "epoch": 3002} {"train_loss": -12.636375427246094, "global_step": 504493, "epoch": 3002} {"train_loss": -12.338542938232422, "global_step": 504494, "epoch": 3002} {"train_loss": -12.626848220825195, "global_step": 504495, "epoch": 3002} {"train_loss": -12.51071548461914, "global_step": 504496, "epoch": 3002} {"train_loss": -12.663131713867188, "global_step": 504497, "epoch": 3002} {"train_loss": -12.62498664855957, "global_step": 504498, "epoch": 3002} {"train_loss": -12.59885025024414, "global_step": 504499, "epoch": 3002} {"train_loss": -12.754112243652344, "global_step": 504500, "epoch": 3002} {"train_loss": -12.611512184143066, "global_step": 504501, "epoch": 3002} {"train_loss": -12.779725074768066, "global_step": 504502, "epoch": 3002} {"train_loss": -11.830488420668102, "global_step": 504503, "epoch": 3002, "val_loss": 320663.78125} {"train_loss": -12.89376163482666, "global_step": 504504, "epoch": 3003} {"train_loss": -12.606178283691406, "global_step": 504505, "epoch": 3003} {"train_loss": -12.325220108032227, "global_step": 504506, "epoch": 3003} {"train_loss": -12.519570350646973, "global_step": 504507, "epoch": 3003} {"train_loss": -12.633752822875977, "global_step": 504508, "epoch": 3003} {"train_loss": -12.371868133544922, "global_step": 504509, "epoch": 3003} {"train_loss": -12.259838104248047, "global_step": 504510, "epoch": 3003} {"train_loss": -12.34312629699707, "global_step": 504511, "epoch": 3003} {"train_loss": -12.561437606811523, "global_step": 504512, "epoch": 3003} {"train_loss": -12.678045272827148, "global_step": 504513, "epoch": 3003} {"train_loss": -12.510440826416016, "global_step": 504514, "epoch": 3003} {"train_loss": -12.459480285644531, "global_step": 504515, "epoch": 3003} {"train_loss": -12.09805965423584, "global_step": 504516, "epoch": 3003} {"train_loss": -12.429191589355469, "global_step": 504517, "epoch": 3003} {"train_loss": -12.403794288635254, "global_step": 504518, "epoch": 3003} {"train_loss": -12.173528671264648, "global_step": 504519, "epoch": 3003} {"train_loss": -11.98684310913086, "global_step": 504520, "epoch": 3003} {"train_loss": -12.325845718383789, "global_step": 504521, "epoch": 3003} {"train_loss": -12.146431922912598, "global_step": 504522, "epoch": 3003} {"train_loss": -12.231411933898926, "global_step": 504523, "epoch": 3003} {"train_loss": -12.124837875366211, "global_step": 504524, "epoch": 3003} {"train_loss": -11.685829162597656, "global_step": 504525, "epoch": 3003} {"train_loss": -12.457586288452148, "global_step": 504526, "epoch": 3003} {"train_loss": -11.479515075683594, "global_step": 504527, "epoch": 3003} {"train_loss": -11.99095344543457, "global_step": 504528, "epoch": 3003} {"train_loss": -12.231887817382812, "global_step": 504529, "epoch": 3003} {"train_loss": -12.27707290649414, "global_step": 504530, "epoch": 3003} {"train_loss": -11.860601425170898, "global_step": 504531, "epoch": 3003} {"train_loss": -12.564103126525879, "global_step": 504532, "epoch": 3003} {"train_loss": -12.42721939086914, "global_step": 504533, "epoch": 3003} {"train_loss": -12.26919174194336, "global_step": 504534, "epoch": 3003} {"train_loss": -11.894405364990234, "global_step": 504535, "epoch": 3003} {"train_loss": -12.55116081237793, "global_step": 504536, "epoch": 3003} {"train_loss": -12.307953834533691, "global_step": 504537, "epoch": 3003} {"train_loss": -12.586414337158203, "global_step": 504538, "epoch": 3003} {"train_loss": -12.326569557189941, "global_step": 504539, "epoch": 3003} {"train_loss": -11.992271423339844, "global_step": 504540, "epoch": 3003} {"train_loss": -12.503021240234375, "global_step": 504541, "epoch": 3003} {"train_loss": -12.364261627197266, "global_step": 504542, "epoch": 3003} {"train_loss": -12.236063003540039, "global_step": 504543, "epoch": 3003} {"train_loss": -12.461627960205078, "global_step": 504544, "epoch": 3003} {"train_loss": -12.4920072555542, "global_step": 504545, "epoch": 3003} {"train_loss": -12.436038970947266, "global_step": 504546, "epoch": 3003} {"train_loss": -12.027767181396484, "global_step": 504547, "epoch": 3003} {"train_loss": -12.320273399353027, "global_step": 504548, "epoch": 3003} {"train_loss": -12.613243103027344, "global_step": 504549, "epoch": 3003} {"train_loss": -12.022101402282715, "global_step": 504550, "epoch": 3003} {"train_loss": -12.520841598510742, "global_step": 504551, "epoch": 3003} {"train_loss": -12.531553268432617, "global_step": 504552, "epoch": 3003} {"train_loss": -11.617891311645508, "global_step": 504553, "epoch": 3003} {"train_loss": -12.624065399169922, "global_step": 504554, "epoch": 3003} {"train_loss": -12.091222763061523, "global_step": 504555, "epoch": 3003} {"train_loss": -9.838539123535156, "global_step": 504556, "epoch": 3003} {"train_loss": -11.397785186767578, "global_step": 504557, "epoch": 3003} {"train_loss": -10.929521560668945, "global_step": 504558, "epoch": 3003} {"train_loss": -11.077657699584961, "global_step": 504559, "epoch": 3003} {"train_loss": -12.277359008789062, "global_step": 504560, "epoch": 3003} {"train_loss": -11.497562408447266, "global_step": 504561, "epoch": 3003} {"train_loss": -12.433523178100586, "global_step": 504562, "epoch": 3003} {"train_loss": -11.398269653320312, "global_step": 504563, "epoch": 3003} {"train_loss": -12.343006134033203, "global_step": 504564, "epoch": 3003} {"train_loss": -11.987489700317383, "global_step": 504565, "epoch": 3003} {"train_loss": -12.078375816345215, "global_step": 504566, "epoch": 3003} {"train_loss": -11.994694709777832, "global_step": 504567, "epoch": 3003} {"train_loss": -12.517476081848145, "global_step": 504568, "epoch": 3003} {"train_loss": -12.137321472167969, "global_step": 504569, "epoch": 3003} {"train_loss": -12.382621765136719, "global_step": 504570, "epoch": 3003} {"train_loss": -12.280550003051758, "global_step": 504571, "epoch": 3003} {"train_loss": -12.01093578338623, "global_step": 504572, "epoch": 3003} {"train_loss": -12.379772186279297, "global_step": 504573, "epoch": 3003} {"train_loss": -12.015124320983887, "global_step": 504574, "epoch": 3003} {"train_loss": -11.960214614868164, "global_step": 504575, "epoch": 3003} {"train_loss": -12.036551475524902, "global_step": 504576, "epoch": 3003} {"train_loss": -11.525797843933105, "global_step": 504577, "epoch": 3003} {"train_loss": -12.30438232421875, "global_step": 504578, "epoch": 3003} {"train_loss": -11.932598114013672, "global_step": 504579, "epoch": 3003} {"train_loss": -11.941829681396484, "global_step": 504580, "epoch": 3003} {"train_loss": -12.38743782043457, "global_step": 504581, "epoch": 3003} {"train_loss": -12.144664764404297, "global_step": 504582, "epoch": 3003} {"train_loss": -12.28832721710205, "global_step": 504583, "epoch": 3003} {"train_loss": -12.19330883026123, "global_step": 504584, "epoch": 3003} {"train_loss": -12.105400085449219, "global_step": 504585, "epoch": 3003} {"train_loss": -12.608596801757812, "global_step": 504586, "epoch": 3003} {"train_loss": -12.023510932922363, "global_step": 504587, "epoch": 3003} {"train_loss": -12.628744125366211, "global_step": 504588, "epoch": 3003} {"train_loss": -12.424930572509766, "global_step": 504589, "epoch": 3003} {"train_loss": -12.297496795654297, "global_step": 504590, "epoch": 3003} {"train_loss": -12.453325271606445, "global_step": 504591, "epoch": 3003} {"train_loss": -12.61823558807373, "global_step": 504592, "epoch": 3003} {"train_loss": -12.543862342834473, "global_step": 504593, "epoch": 3003} {"train_loss": -12.735294342041016, "global_step": 504594, "epoch": 3003} {"train_loss": -12.501066207885742, "global_step": 504595, "epoch": 3003} {"train_loss": -12.886987686157227, "global_step": 504596, "epoch": 3003} {"train_loss": -12.560935020446777, "global_step": 504597, "epoch": 3003} {"train_loss": -12.76353645324707, "global_step": 504598, "epoch": 3003} {"train_loss": -12.86580753326416, "global_step": 504599, "epoch": 3003} {"train_loss": -12.6317720413208, "global_step": 504600, "epoch": 3003} {"train_loss": -12.767396926879883, "global_step": 504601, "epoch": 3003} {"train_loss": -12.845075607299805, "global_step": 504602, "epoch": 3003} {"train_loss": -12.68381118774414, "global_step": 504603, "epoch": 3003} {"train_loss": -12.807432174682617, "global_step": 504604, "epoch": 3003} {"train_loss": -12.695425987243652, "global_step": 504605, "epoch": 3003} {"train_loss": -12.653095245361328, "global_step": 504606, "epoch": 3003} {"train_loss": -12.7911958694458, "global_step": 504607, "epoch": 3003} {"train_loss": -12.786677360534668, "global_step": 504608, "epoch": 3003} {"train_loss": -12.430758476257324, "global_step": 504609, "epoch": 3003} {"train_loss": -12.781529426574707, "global_step": 504610, "epoch": 3003} {"train_loss": -12.848062515258789, "global_step": 504611, "epoch": 3003} {"train_loss": -12.66533088684082, "global_step": 504612, "epoch": 3003} {"train_loss": -12.891593933105469, "global_step": 504613, "epoch": 3003} {"train_loss": -12.843766212463379, "global_step": 504614, "epoch": 3003} {"train_loss": -12.899035453796387, "global_step": 504615, "epoch": 3003} {"train_loss": -12.679193496704102, "global_step": 504616, "epoch": 3003} {"train_loss": -12.230840682983398, "global_step": 504617, "epoch": 3003} {"train_loss": -12.668545722961426, "global_step": 504618, "epoch": 3003} {"train_loss": -12.883974075317383, "global_step": 504619, "epoch": 3003} {"train_loss": -12.54150390625, "global_step": 504620, "epoch": 3003} {"train_loss": -12.94093132019043, "global_step": 504621, "epoch": 3003} {"train_loss": -12.770544052124023, "global_step": 504622, "epoch": 3003} {"train_loss": -12.814058303833008, "global_step": 504623, "epoch": 3003} {"train_loss": -12.938370704650879, "global_step": 504624, "epoch": 3003} {"train_loss": -12.692901611328125, "global_step": 504625, "epoch": 3003} {"train_loss": -12.604365348815918, "global_step": 504626, "epoch": 3003} {"train_loss": -12.905281066894531, "global_step": 504627, "epoch": 3003} {"train_loss": -12.712820053100586, "global_step": 504628, "epoch": 3003} {"train_loss": -12.939943313598633, "global_step": 504629, "epoch": 3003} {"train_loss": -12.920754432678223, "global_step": 504630, "epoch": 3003} {"train_loss": -12.914167404174805, "global_step": 504631, "epoch": 3003} {"train_loss": -12.90262222290039, "global_step": 504632, "epoch": 3003} {"train_loss": -13.012591361999512, "global_step": 504633, "epoch": 3003} {"train_loss": -13.065942764282227, "global_step": 504634, "epoch": 3003} {"train_loss": -12.90691089630127, "global_step": 504635, "epoch": 3003} {"train_loss": -13.125028610229492, "global_step": 504636, "epoch": 3003} {"train_loss": -12.926309585571289, "global_step": 504637, "epoch": 3003} {"train_loss": -13.009224891662598, "global_step": 504638, "epoch": 3003} {"train_loss": -12.418891906738281, "global_step": 504639, "epoch": 3003} {"train_loss": -12.782676696777344, "global_step": 504640, "epoch": 3003} {"train_loss": -12.817730903625488, "global_step": 504641, "epoch": 3003} {"train_loss": -12.750996589660645, "global_step": 504642, "epoch": 3003} {"train_loss": -13.000260353088379, "global_step": 504643, "epoch": 3003} {"train_loss": -12.985088348388672, "global_step": 504644, "epoch": 3003} {"train_loss": -12.710975646972656, "global_step": 504645, "epoch": 3003} {"train_loss": -12.431039810180664, "global_step": 504646, "epoch": 3003} {"train_loss": -12.881065368652344, "global_step": 504647, "epoch": 3003} {"train_loss": -12.60311508178711, "global_step": 504648, "epoch": 3003} {"train_loss": -12.43749713897705, "global_step": 504649, "epoch": 3003} {"train_loss": -12.664254188537598, "global_step": 504650, "epoch": 3003} {"train_loss": -12.7562837600708, "global_step": 504651, "epoch": 3003} {"train_loss": -12.396337509155273, "global_step": 504652, "epoch": 3003} {"train_loss": -12.232951164245605, "global_step": 504653, "epoch": 3003} {"train_loss": -12.731158256530762, "global_step": 504654, "epoch": 3003} {"train_loss": -11.850419998168945, "global_step": 504655, "epoch": 3003} {"train_loss": -11.732484817504883, "global_step": 504656, "epoch": 3003} {"train_loss": -11.865716934204102, "global_step": 504657, "epoch": 3003} {"train_loss": -12.912036895751953, "global_step": 504658, "epoch": 3003} {"train_loss": -11.950870513916016, "global_step": 504659, "epoch": 3003} {"train_loss": -11.442145347595215, "global_step": 504660, "epoch": 3003} {"train_loss": -11.992443084716797, "global_step": 504661, "epoch": 3003} {"train_loss": -12.601139068603516, "global_step": 504662, "epoch": 3003} {"train_loss": -11.749631881713867, "global_step": 504663, "epoch": 3003} {"train_loss": -12.987872123718262, "global_step": 504664, "epoch": 3003} {"train_loss": -12.46023178100586, "global_step": 504665, "epoch": 3003} {"train_loss": -11.662134170532227, "global_step": 504666, "epoch": 3003} {"train_loss": -12.394292831420898, "global_step": 504667, "epoch": 3003} {"train_loss": -12.648033142089844, "global_step": 504668, "epoch": 3003} {"train_loss": -11.840143203735352, "global_step": 504669, "epoch": 3003} {"train_loss": -11.790210723876953, "global_step": 504670, "epoch": 3003} {"train_loss": -12.390684462728954, "global_step": 504671, "epoch": 3003, "val_loss": 319761.4375} {"train_loss": -11.225868225097656, "global_step": 504672, "epoch": 3004} {"train_loss": -11.82003402709961, "global_step": 504673, "epoch": 3004} {"train_loss": -12.503581047058105, "global_step": 504674, "epoch": 3004} {"train_loss": -11.772098541259766, "global_step": 504675, "epoch": 3004} {"train_loss": -12.443840026855469, "global_step": 504676, "epoch": 3004} {"train_loss": -12.613622665405273, "global_step": 504677, "epoch": 3004} {"train_loss": -12.353418350219727, "global_step": 504678, "epoch": 3004} {"train_loss": -12.743743896484375, "global_step": 504679, "epoch": 3004} {"train_loss": -12.41999626159668, "global_step": 504680, "epoch": 3004} {"train_loss": -11.595327377319336, "global_step": 504681, "epoch": 3004} {"train_loss": -11.825095176696777, "global_step": 504682, "epoch": 3004} {"train_loss": -11.901102066040039, "global_step": 504683, "epoch": 3004} {"train_loss": -11.460250854492188, "global_step": 504684, "epoch": 3004} {"train_loss": -10.992094039916992, "global_step": 504685, "epoch": 3004} {"train_loss": -11.666899681091309, "global_step": 504686, "epoch": 3004} {"train_loss": -11.583690643310547, "global_step": 504687, "epoch": 3004} {"train_loss": -11.649351119995117, "global_step": 504688, "epoch": 3004} {"train_loss": -11.364570617675781, "global_step": 504689, "epoch": 3004} {"train_loss": -11.677471160888672, "global_step": 504690, "epoch": 3004} {"train_loss": -12.067094802856445, "global_step": 504691, "epoch": 3004} {"train_loss": -11.603433609008789, "global_step": 504692, "epoch": 3004} {"train_loss": -11.854225158691406, "global_step": 504693, "epoch": 3004} {"train_loss": -11.005814552307129, "global_step": 504694, "epoch": 3004} {"train_loss": -11.986547470092773, "global_step": 504695, "epoch": 3004} {"train_loss": -11.375033378601074, "global_step": 504696, "epoch": 3004} {"train_loss": -11.972527503967285, "global_step": 504697, "epoch": 3004} {"train_loss": -11.945540428161621, "global_step": 504698, "epoch": 3004} {"train_loss": -11.881950378417969, "global_step": 504699, "epoch": 3004} {"train_loss": -12.295440673828125, "global_step": 504700, "epoch": 3004} {"train_loss": -11.801663398742676, "global_step": 504701, "epoch": 3004} {"train_loss": -12.125566482543945, "global_step": 504702, "epoch": 3004} {"train_loss": -11.360085487365723, "global_step": 504703, "epoch": 3004} {"train_loss": -12.078376770019531, "global_step": 504704, "epoch": 3004} {"train_loss": -12.228628158569336, "global_step": 504705, "epoch": 3004} {"train_loss": -11.973719596862793, "global_step": 504706, "epoch": 3004} {"train_loss": -12.213470458984375, "global_step": 504707, "epoch": 3004} {"train_loss": -12.198820114135742, "global_step": 504708, "epoch": 3004} {"train_loss": -12.42807388305664, "global_step": 504709, "epoch": 3004} {"train_loss": -11.91895866394043, "global_step": 504710, "epoch": 3004} {"train_loss": -12.367471694946289, "global_step": 504711, "epoch": 3004} {"train_loss": -12.408713340759277, "global_step": 504712, "epoch": 3004} {"train_loss": -12.368730545043945, "global_step": 504713, "epoch": 3004} {"train_loss": -12.288849830627441, "global_step": 504714, "epoch": 3004} {"train_loss": -11.931665420532227, "global_step": 504715, "epoch": 3004} {"train_loss": -12.175214767456055, "global_step": 504716, "epoch": 3004} {"train_loss": -12.296415328979492, "global_step": 504717, "epoch": 3004} {"train_loss": -11.58360481262207, "global_step": 504718, "epoch": 3004} {"train_loss": -12.26708984375, "global_step": 504719, "epoch": 3004} {"train_loss": -11.031408309936523, "global_step": 504720, "epoch": 3004} {"train_loss": -11.064733505249023, "global_step": 504721, "epoch": 3004} {"train_loss": -11.960609436035156, "global_step": 504722, "epoch": 3004} {"train_loss": -11.739924430847168, "global_step": 504723, "epoch": 3004} {"train_loss": -11.462156295776367, "global_step": 504724, "epoch": 3004} {"train_loss": -11.921889305114746, "global_step": 504725, "epoch": 3004} {"train_loss": -12.206581115722656, "global_step": 504726, "epoch": 3004} {"train_loss": -10.967633247375488, "global_step": 504727, "epoch": 3004} {"train_loss": -11.969588279724121, "global_step": 504728, "epoch": 3004} {"train_loss": -12.073358535766602, "global_step": 504729, "epoch": 3004} {"train_loss": -12.295333862304688, "global_step": 504730, "epoch": 3004} {"train_loss": -12.182037353515625, "global_step": 504731, "epoch": 3004} {"train_loss": -12.660780906677246, "global_step": 504732, "epoch": 3004} {"train_loss": -11.808748245239258, "global_step": 504733, "epoch": 3004} {"train_loss": -12.436609268188477, "global_step": 504734, "epoch": 3004} {"train_loss": -12.026531219482422, "global_step": 504735, "epoch": 3004} {"train_loss": -12.419687271118164, "global_step": 504736, "epoch": 3004} {"train_loss": -12.543115615844727, "global_step": 504737, "epoch": 3004} {"train_loss": -12.218573570251465, "global_step": 504738, "epoch": 3004} {"train_loss": -12.44880485534668, "global_step": 504739, "epoch": 3004} {"train_loss": -12.250211715698242, "global_step": 504740, "epoch": 3004} {"train_loss": -12.433389663696289, "global_step": 504741, "epoch": 3004} {"train_loss": -12.18161392211914, "global_step": 504742, "epoch": 3004} {"train_loss": -12.530077934265137, "global_step": 504743, "epoch": 3004} {"train_loss": -12.407363891601562, "global_step": 504744, "epoch": 3004} {"train_loss": -11.87635612487793, "global_step": 504745, "epoch": 3004} {"train_loss": -12.76169204711914, "global_step": 504746, "epoch": 3004} {"train_loss": -11.978055000305176, "global_step": 504747, "epoch": 3004} {"train_loss": -12.574867248535156, "global_step": 504748, "epoch": 3004} {"train_loss": -12.220906257629395, "global_step": 504749, "epoch": 3004} {"train_loss": -11.959189414978027, "global_step": 504750, "epoch": 3004} {"train_loss": -12.270109176635742, "global_step": 504751, "epoch": 3004} {"train_loss": -11.47269058227539, "global_step": 504752, "epoch": 3004} {"train_loss": -12.280261993408203, "global_step": 504753, "epoch": 3004} {"train_loss": -12.36089038848877, "global_step": 504754, "epoch": 3004} {"train_loss": -12.698046684265137, "global_step": 504755, "epoch": 3004} {"train_loss": -12.167598724365234, "global_step": 504756, "epoch": 3004} {"train_loss": -12.551490783691406, "global_step": 504757, "epoch": 3004} {"train_loss": -12.022480964660645, "global_step": 504758, "epoch": 3004} {"train_loss": -12.235381126403809, "global_step": 504759, "epoch": 3004} {"train_loss": -12.418280601501465, "global_step": 504760, "epoch": 3004} {"train_loss": -12.578690528869629, "global_step": 504761, "epoch": 3004} {"train_loss": -12.613773345947266, "global_step": 504762, "epoch": 3004} {"train_loss": -12.395758628845215, "global_step": 504763, "epoch": 3004} {"train_loss": -12.616020202636719, "global_step": 504764, "epoch": 3004} {"train_loss": -12.400943756103516, "global_step": 504765, "epoch": 3004} {"train_loss": -12.698858261108398, "global_step": 504766, "epoch": 3004} {"train_loss": -12.453471183776855, "global_step": 504767, "epoch": 3004} {"train_loss": -12.725627899169922, "global_step": 504768, "epoch": 3004} {"train_loss": -12.338155746459961, "global_step": 504769, "epoch": 3004} {"train_loss": -12.808908462524414, "global_step": 504770, "epoch": 3004} {"train_loss": -12.280861854553223, "global_step": 504771, "epoch": 3004} {"train_loss": -12.704878807067871, "global_step": 504772, "epoch": 3004} {"train_loss": -12.529098510742188, "global_step": 504773, "epoch": 3004} {"train_loss": -12.470285415649414, "global_step": 504774, "epoch": 3004} {"train_loss": -12.615787506103516, "global_step": 504775, "epoch": 3004} {"train_loss": -12.833456039428711, "global_step": 504776, "epoch": 3004} {"train_loss": -12.854122161865234, "global_step": 504777, "epoch": 3004} {"train_loss": -12.766668319702148, "global_step": 504778, "epoch": 3004} {"train_loss": -12.755865097045898, "global_step": 504779, "epoch": 3004} {"train_loss": -12.785008430480957, "global_step": 504780, "epoch": 3004} {"train_loss": -12.564201354980469, "global_step": 504781, "epoch": 3004} {"train_loss": -12.67481803894043, "global_step": 504782, "epoch": 3004} {"train_loss": -12.714902877807617, "global_step": 504783, "epoch": 3004} {"train_loss": -12.870527267456055, "global_step": 504784, "epoch": 3004} {"train_loss": -12.541888236999512, "global_step": 504785, "epoch": 3004} {"train_loss": -12.489629745483398, "global_step": 504786, "epoch": 3004} {"train_loss": -12.578980445861816, "global_step": 504787, "epoch": 3004} {"train_loss": -12.645078659057617, "global_step": 504788, "epoch": 3004} {"train_loss": -12.677897453308105, "global_step": 504789, "epoch": 3004} {"train_loss": -12.761387825012207, "global_step": 504790, "epoch": 3004} {"train_loss": -12.387715339660645, "global_step": 504791, "epoch": 3004} {"train_loss": -12.834394454956055, "global_step": 504792, "epoch": 3004} {"train_loss": -12.556350708007812, "global_step": 504793, "epoch": 3004} {"train_loss": -11.831331253051758, "global_step": 504794, "epoch": 3004} {"train_loss": -12.565048217773438, "global_step": 504795, "epoch": 3004} {"train_loss": -12.068300247192383, "global_step": 504796, "epoch": 3004} {"train_loss": -12.570287704467773, "global_step": 504797, "epoch": 3004} {"train_loss": -12.227335929870605, "global_step": 504798, "epoch": 3004} {"train_loss": -12.596651077270508, "global_step": 504799, "epoch": 3004} {"train_loss": -12.168697357177734, "global_step": 504800, "epoch": 3004} {"train_loss": -12.489748001098633, "global_step": 504801, "epoch": 3004} {"train_loss": -12.788431167602539, "global_step": 504802, "epoch": 3004} {"train_loss": -12.934931755065918, "global_step": 504803, "epoch": 3004} {"train_loss": -12.706758499145508, "global_step": 504804, "epoch": 3004} {"train_loss": -12.62673568725586, "global_step": 504805, "epoch": 3004} {"train_loss": -12.850868225097656, "global_step": 504806, "epoch": 3004} {"train_loss": -12.900190353393555, "global_step": 504807, "epoch": 3004} {"train_loss": -12.376838684082031, "global_step": 504808, "epoch": 3004} {"train_loss": -12.292219161987305, "global_step": 504809, "epoch": 3004} {"train_loss": -12.738292694091797, "global_step": 504810, "epoch": 3004} {"train_loss": -11.906396865844727, "global_step": 504811, "epoch": 3004} {"train_loss": -12.182172775268555, "global_step": 504812, "epoch": 3004} {"train_loss": -11.890247344970703, "global_step": 504813, "epoch": 3004} {"train_loss": -12.094880104064941, "global_step": 504814, "epoch": 3004} {"train_loss": -12.168867111206055, "global_step": 504815, "epoch": 3004} {"train_loss": -12.71075439453125, "global_step": 504816, "epoch": 3004} {"train_loss": -11.735563278198242, "global_step": 504817, "epoch": 3004} {"train_loss": -12.914413452148438, "global_step": 504818, "epoch": 3004} {"train_loss": -12.62389850616455, "global_step": 504819, "epoch": 3004} {"train_loss": -12.550580978393555, "global_step": 504820, "epoch": 3004} {"train_loss": -12.412395477294922, "global_step": 504821, "epoch": 3004} {"train_loss": -12.502243041992188, "global_step": 504822, "epoch": 3004} {"train_loss": -12.649520874023438, "global_step": 504823, "epoch": 3004} {"train_loss": -12.05880355834961, "global_step": 504824, "epoch": 3004} {"train_loss": -11.839847564697266, "global_step": 504825, "epoch": 3004} {"train_loss": -12.607767105102539, "global_step": 504826, "epoch": 3004} {"train_loss": -11.678716659545898, "global_step": 504827, "epoch": 3004} {"train_loss": -11.429414749145508, "global_step": 504828, "epoch": 3004} {"train_loss": -11.845499038696289, "global_step": 504829, "epoch": 3004} {"train_loss": -12.448249816894531, "global_step": 504830, "epoch": 3004} {"train_loss": -11.81563663482666, "global_step": 504831, "epoch": 3004} {"train_loss": -11.656827926635742, "global_step": 504832, "epoch": 3004} {"train_loss": -11.855538368225098, "global_step": 504833, "epoch": 3004} {"train_loss": -11.391677856445312, "global_step": 504834, "epoch": 3004} {"train_loss": -11.86606216430664, "global_step": 504835, "epoch": 3004} {"train_loss": -11.46977424621582, "global_step": 504836, "epoch": 3004} {"train_loss": -12.072083473205566, "global_step": 504837, "epoch": 3004} {"train_loss": -11.565362930297852, "global_step": 504838, "epoch": 3004} {"train_loss": -12.204334838049752, "global_step": 504839, "epoch": 3004, "val_loss": 323361.25} {"train_loss": -11.820932388305664, "global_step": 504840, "epoch": 3005} {"train_loss": -12.180656433105469, "global_step": 504841, "epoch": 3005} {"train_loss": -12.251861572265625, "global_step": 504842, "epoch": 3005} {"train_loss": -11.881832122802734, "global_step": 504843, "epoch": 3005} {"train_loss": -12.81472110748291, "global_step": 504844, "epoch": 3005} {"train_loss": -12.242607116699219, "global_step": 504845, "epoch": 3005} {"train_loss": -12.195173263549805, "global_step": 504846, "epoch": 3005} {"train_loss": -12.573982238769531, "global_step": 504847, "epoch": 3005} {"train_loss": -11.898334503173828, "global_step": 504848, "epoch": 3005} {"train_loss": -12.450922966003418, "global_step": 504849, "epoch": 3005} {"train_loss": -12.218669891357422, "global_step": 504850, "epoch": 3005} {"train_loss": -11.794474601745605, "global_step": 504851, "epoch": 3005} {"train_loss": -11.963081359863281, "global_step": 504852, "epoch": 3005} {"train_loss": -12.813121795654297, "global_step": 504853, "epoch": 3005} {"train_loss": -12.402523040771484, "global_step": 504854, "epoch": 3005} {"train_loss": -12.358654022216797, "global_step": 504855, "epoch": 3005} {"train_loss": -12.730506896972656, "global_step": 504856, "epoch": 3005} {"train_loss": -12.258684158325195, "global_step": 504857, "epoch": 3005} {"train_loss": -12.675331115722656, "global_step": 504858, "epoch": 3005} {"train_loss": -12.603808403015137, "global_step": 504859, "epoch": 3005} {"train_loss": -12.760672569274902, "global_step": 504860, "epoch": 3005} {"train_loss": -12.732446670532227, "global_step": 504861, "epoch": 3005} {"train_loss": -12.664121627807617, "global_step": 504862, "epoch": 3005} {"train_loss": -12.568241119384766, "global_step": 504863, "epoch": 3005} {"train_loss": -12.742156982421875, "global_step": 504864, "epoch": 3005} {"train_loss": -12.261887550354004, "global_step": 504865, "epoch": 3005} {"train_loss": -12.534194946289062, "global_step": 504866, "epoch": 3005} {"train_loss": -12.731101989746094, "global_step": 504867, "epoch": 3005} {"train_loss": -12.385143280029297, "global_step": 504868, "epoch": 3005} {"train_loss": -12.622424125671387, "global_step": 504869, "epoch": 3005} {"train_loss": -12.634265899658203, "global_step": 504870, "epoch": 3005} {"train_loss": -12.551656723022461, "global_step": 504871, "epoch": 3005} {"train_loss": -12.73884391784668, "global_step": 504872, "epoch": 3005} {"train_loss": -12.543316841125488, "global_step": 504873, "epoch": 3005} {"train_loss": -12.745157241821289, "global_step": 504874, "epoch": 3005} {"train_loss": -12.637943267822266, "global_step": 504875, "epoch": 3005} {"train_loss": -12.570883750915527, "global_step": 504876, "epoch": 3005} {"train_loss": -12.693620681762695, "global_step": 504877, "epoch": 3005} {"train_loss": -12.5670804977417, "global_step": 504878, "epoch": 3005} {"train_loss": -12.831060409545898, "global_step": 504879, "epoch": 3005} {"train_loss": -12.516119003295898, "global_step": 504880, "epoch": 3005} {"train_loss": -12.190138816833496, "global_step": 504881, "epoch": 3005} {"train_loss": -12.752752304077148, "global_step": 504882, "epoch": 3005} {"train_loss": -12.174497604370117, "global_step": 504883, "epoch": 3005} {"train_loss": -12.286100387573242, "global_step": 504884, "epoch": 3005} {"train_loss": -12.330225944519043, "global_step": 504885, "epoch": 3005} {"train_loss": -12.609922409057617, "global_step": 504886, "epoch": 3005} {"train_loss": -12.214622497558594, "global_step": 504887, "epoch": 3005} {"train_loss": -12.56904125213623, "global_step": 504888, "epoch": 3005} {"train_loss": -12.351282119750977, "global_step": 504889, "epoch": 3005} {"train_loss": -11.504264831542969, "global_step": 504890, "epoch": 3005} {"train_loss": -12.549083709716797, "global_step": 504891, "epoch": 3005} {"train_loss": -11.471856117248535, "global_step": 504892, "epoch": 3005} {"train_loss": -12.718733787536621, "global_step": 504893, "epoch": 3005} {"train_loss": -12.0673828125, "global_step": 504894, "epoch": 3005} {"train_loss": -12.925923347473145, "global_step": 504895, "epoch": 3005} {"train_loss": -12.408863067626953, "global_step": 504896, "epoch": 3005} {"train_loss": -12.789555549621582, "global_step": 504897, "epoch": 3005} {"train_loss": -12.14210033416748, "global_step": 504898, "epoch": 3005} {"train_loss": -12.587442398071289, "global_step": 504899, "epoch": 3005} {"train_loss": -11.759014129638672, "global_step": 504900, "epoch": 3005} {"train_loss": -12.674596786499023, "global_step": 504901, "epoch": 3005} {"train_loss": -11.873543739318848, "global_step": 504902, "epoch": 3005} {"train_loss": -12.061758041381836, "global_step": 504903, "epoch": 3005} {"train_loss": -12.354642868041992, "global_step": 504904, "epoch": 3005} {"train_loss": -12.749711990356445, "global_step": 504905, "epoch": 3005} {"train_loss": -12.206110000610352, "global_step": 504906, "epoch": 3005} {"train_loss": -12.66018295288086, "global_step": 504907, "epoch": 3005} {"train_loss": -12.660992622375488, "global_step": 504908, "epoch": 3005} {"train_loss": -12.208209037780762, "global_step": 504909, "epoch": 3005} {"train_loss": -12.449076652526855, "global_step": 504910, "epoch": 3005} {"train_loss": -12.192035675048828, "global_step": 504911, "epoch": 3005} {"train_loss": -11.975626945495605, "global_step": 504912, "epoch": 3005} {"train_loss": -11.90024185180664, "global_step": 504913, "epoch": 3005} {"train_loss": -11.50515365600586, "global_step": 504914, "epoch": 3005} {"train_loss": -12.461740493774414, "global_step": 504915, "epoch": 3005} {"train_loss": -11.808879852294922, "global_step": 504916, "epoch": 3005} {"train_loss": -12.259773254394531, "global_step": 504917, "epoch": 3005} {"train_loss": -11.931280136108398, "global_step": 504918, "epoch": 3005} {"train_loss": -11.195171356201172, "global_step": 504919, "epoch": 3005} {"train_loss": -12.23337173461914, "global_step": 504920, "epoch": 3005} {"train_loss": -11.742879867553711, "global_step": 504921, "epoch": 3005} {"train_loss": -11.804250717163086, "global_step": 504922, "epoch": 3005} {"train_loss": -11.976656913757324, "global_step": 504923, "epoch": 3005} {"train_loss": -12.331185340881348, "global_step": 504924, "epoch": 3005} {"train_loss": -12.247089385986328, "global_step": 504925, "epoch": 3005} {"train_loss": -12.64748764038086, "global_step": 504926, "epoch": 3005} {"train_loss": -12.699729919433594, "global_step": 504927, "epoch": 3005} {"train_loss": -12.704547882080078, "global_step": 504928, "epoch": 3005} {"train_loss": -12.154807090759277, "global_step": 504929, "epoch": 3005} {"train_loss": -12.702263832092285, "global_step": 504930, "epoch": 3005} {"train_loss": -12.566822052001953, "global_step": 504931, "epoch": 3005} {"train_loss": -12.284759521484375, "global_step": 504932, "epoch": 3005} {"train_loss": -12.509954452514648, "global_step": 504933, "epoch": 3005} {"train_loss": -12.569478034973145, "global_step": 504934, "epoch": 3005} {"train_loss": -12.876882553100586, "global_step": 504935, "epoch": 3005} {"train_loss": -12.371650695800781, "global_step": 504936, "epoch": 3005} {"train_loss": -12.769524574279785, "global_step": 504937, "epoch": 3005} {"train_loss": -12.660173416137695, "global_step": 504938, "epoch": 3005} {"train_loss": -12.800091743469238, "global_step": 504939, "epoch": 3005} {"train_loss": -12.72580337524414, "global_step": 504940, "epoch": 3005} {"train_loss": -12.943967819213867, "global_step": 504941, "epoch": 3005} {"train_loss": -12.931038856506348, "global_step": 504942, "epoch": 3005} {"train_loss": -12.872420310974121, "global_step": 504943, "epoch": 3005} {"train_loss": -12.569496154785156, "global_step": 504944, "epoch": 3005} {"train_loss": -12.551414489746094, "global_step": 504945, "epoch": 3005} {"train_loss": -12.344318389892578, "global_step": 504946, "epoch": 3005} {"train_loss": -12.306148529052734, "global_step": 504947, "epoch": 3005} {"train_loss": -12.72970962524414, "global_step": 504948, "epoch": 3005} {"train_loss": -12.265762329101562, "global_step": 504949, "epoch": 3005} {"train_loss": -13.030576705932617, "global_step": 504950, "epoch": 3005} {"train_loss": -12.223043441772461, "global_step": 504951, "epoch": 3005} {"train_loss": -12.582223892211914, "global_step": 504952, "epoch": 3005} {"train_loss": -12.604190826416016, "global_step": 504953, "epoch": 3005} {"train_loss": -11.915105819702148, "global_step": 504954, "epoch": 3005} {"train_loss": -12.394662857055664, "global_step": 504955, "epoch": 3005} {"train_loss": -12.839654922485352, "global_step": 504956, "epoch": 3005} {"train_loss": -11.844368934631348, "global_step": 504957, "epoch": 3005} {"train_loss": -12.078371047973633, "global_step": 504958, "epoch": 3005} {"train_loss": -12.392714500427246, "global_step": 504959, "epoch": 3005} {"train_loss": -11.502301216125488, "global_step": 504960, "epoch": 3005} {"train_loss": -12.179621696472168, "global_step": 504961, "epoch": 3005} {"train_loss": -12.561424255371094, "global_step": 504962, "epoch": 3005} {"train_loss": -12.345098495483398, "global_step": 504963, "epoch": 3005} {"train_loss": -12.216669082641602, "global_step": 504964, "epoch": 3005} {"train_loss": -12.339010238647461, "global_step": 504965, "epoch": 3005} {"train_loss": -12.026443481445312, "global_step": 504966, "epoch": 3005} {"train_loss": -11.73563289642334, "global_step": 504967, "epoch": 3005} {"train_loss": -11.755882263183594, "global_step": 504968, "epoch": 3005} {"train_loss": -11.158597946166992, "global_step": 504969, "epoch": 3005} {"train_loss": -12.476888656616211, "global_step": 504970, "epoch": 3005} {"train_loss": -11.176961898803711, "global_step": 504971, "epoch": 3005} {"train_loss": -10.96047592163086, "global_step": 504972, "epoch": 3005} {"train_loss": -12.024248123168945, "global_step": 504973, "epoch": 3005} {"train_loss": -11.33493423461914, "global_step": 504974, "epoch": 3005} {"train_loss": -11.740757942199707, "global_step": 504975, "epoch": 3005} {"train_loss": -12.481268882751465, "global_step": 504976, "epoch": 3005} {"train_loss": -11.948121070861816, "global_step": 504977, "epoch": 3005} {"train_loss": -12.581130027770996, "global_step": 504978, "epoch": 3005} {"train_loss": -11.6909761428833, "global_step": 504979, "epoch": 3005} {"train_loss": -12.815189361572266, "global_step": 504980, "epoch": 3005} {"train_loss": -12.367345809936523, "global_step": 504981, "epoch": 3005} {"train_loss": -12.562911987304688, "global_step": 504982, "epoch": 3005} {"train_loss": -11.908662796020508, "global_step": 504983, "epoch": 3005} {"train_loss": -12.403935432434082, "global_step": 504984, "epoch": 3005} {"train_loss": -11.897587776184082, "global_step": 504985, "epoch": 3005} {"train_loss": -11.892698287963867, "global_step": 504986, "epoch": 3005} {"train_loss": -11.439855575561523, "global_step": 504987, "epoch": 3005} {"train_loss": -10.870077133178711, "global_step": 504988, "epoch": 3005} {"train_loss": -12.003734588623047, "global_step": 504989, "epoch": 3005} {"train_loss": -11.155056953430176, "global_step": 504990, "epoch": 3005} {"train_loss": -11.936686515808105, "global_step": 504991, "epoch": 3005} {"train_loss": -11.975442886352539, "global_step": 504992, "epoch": 3005} {"train_loss": -11.812834739685059, "global_step": 504993, "epoch": 3005} {"train_loss": -11.673620223999023, "global_step": 504994, "epoch": 3005} {"train_loss": -12.134488105773926, "global_step": 504995, "epoch": 3005} {"train_loss": -12.320932388305664, "global_step": 504996, "epoch": 3005} {"train_loss": -12.334266662597656, "global_step": 504997, "epoch": 3005} {"train_loss": -12.557437896728516, "global_step": 504998, "epoch": 3005} {"train_loss": -12.083106994628906, "global_step": 504999, "epoch": 3005} {"train_loss": -11.926021575927734, "global_step": 505000, "epoch": 3005} {"train_loss": -12.350605010986328, "global_step": 505001, "epoch": 3005} {"train_loss": -10.899280548095703, "global_step": 505002, "epoch": 3005} {"train_loss": -12.38035774230957, "global_step": 505003, "epoch": 3005} {"train_loss": -11.668322563171387, "global_step": 505004, "epoch": 3005} {"train_loss": -12.174172401428223, "global_step": 505005, "epoch": 3005} {"train_loss": -11.819209098815918, "global_step": 505006, "epoch": 3005} {"train_loss": -12.262959423519316, "global_step": 505007, "epoch": 3005, "val_loss": 322621.9375, "train_action_mse_error": 0.7566655874252319} {"train_loss": -11.750083923339844, "global_step": 505008, "epoch": 3006} {"train_loss": -11.578003883361816, "global_step": 505009, "epoch": 3006} {"train_loss": -11.651199340820312, "global_step": 505010, "epoch": 3006} {"train_loss": -12.198189735412598, "global_step": 505011, "epoch": 3006} {"train_loss": -11.55958366394043, "global_step": 505012, "epoch": 3006} {"train_loss": -11.809840202331543, "global_step": 505013, "epoch": 3006} {"train_loss": -12.45254898071289, "global_step": 505014, "epoch": 3006} {"train_loss": -11.922233581542969, "global_step": 505015, "epoch": 3006} {"train_loss": -12.504369735717773, "global_step": 505016, "epoch": 3006} {"train_loss": -11.920758247375488, "global_step": 505017, "epoch": 3006} {"train_loss": -12.510095596313477, "global_step": 505018, "epoch": 3006} {"train_loss": -11.86292839050293, "global_step": 505019, "epoch": 3006} {"train_loss": -11.88608169555664, "global_step": 505020, "epoch": 3006} {"train_loss": -12.790712356567383, "global_step": 505021, "epoch": 3006} {"train_loss": -11.329606056213379, "global_step": 505022, "epoch": 3006} {"train_loss": -12.195541381835938, "global_step": 505023, "epoch": 3006} {"train_loss": -12.327003479003906, "global_step": 505024, "epoch": 3006} {"train_loss": -11.545093536376953, "global_step": 505025, "epoch": 3006} {"train_loss": -12.499954223632812, "global_step": 505026, "epoch": 3006} {"train_loss": -12.096572875976562, "global_step": 505027, "epoch": 3006} {"train_loss": -12.301901817321777, "global_step": 505028, "epoch": 3006} {"train_loss": -12.66531753540039, "global_step": 505029, "epoch": 3006} {"train_loss": -12.316965103149414, "global_step": 505030, "epoch": 3006} {"train_loss": -12.469942092895508, "global_step": 505031, "epoch": 3006} {"train_loss": -12.823487281799316, "global_step": 505032, "epoch": 3006} {"train_loss": -12.234618186950684, "global_step": 505033, "epoch": 3006} {"train_loss": -12.785905838012695, "global_step": 505034, "epoch": 3006} {"train_loss": -12.737178802490234, "global_step": 505035, "epoch": 3006} {"train_loss": -12.797624588012695, "global_step": 505036, "epoch": 3006} {"train_loss": -12.714014053344727, "global_step": 505037, "epoch": 3006} {"train_loss": -12.696857452392578, "global_step": 505038, "epoch": 3006} {"train_loss": -12.784605979919434, "global_step": 505039, "epoch": 3006} {"train_loss": -12.905473709106445, "global_step": 505040, "epoch": 3006} {"train_loss": -12.616888046264648, "global_step": 505041, "epoch": 3006} {"train_loss": -12.781006813049316, "global_step": 505042, "epoch": 3006} {"train_loss": -12.733845710754395, "global_step": 505043, "epoch": 3006} {"train_loss": -12.725577354431152, "global_step": 505044, "epoch": 3006} {"train_loss": -12.505647659301758, "global_step": 505045, "epoch": 3006} {"train_loss": -12.840988159179688, "global_step": 505046, "epoch": 3006} {"train_loss": -12.375774383544922, "global_step": 505047, "epoch": 3006} {"train_loss": -12.723994255065918, "global_step": 505048, "epoch": 3006} {"train_loss": -12.82905387878418, "global_step": 505049, "epoch": 3006} {"train_loss": -12.851215362548828, "global_step": 505050, "epoch": 3006} {"train_loss": -12.7350435256958, "global_step": 505051, "epoch": 3006} {"train_loss": -12.94204330444336, "global_step": 505052, "epoch": 3006} {"train_loss": -12.754463195800781, "global_step": 505053, "epoch": 3006} {"train_loss": -12.88654899597168, "global_step": 505054, "epoch": 3006} {"train_loss": -12.869842529296875, "global_step": 505055, "epoch": 3006} {"train_loss": -13.005428314208984, "global_step": 505056, "epoch": 3006} {"train_loss": -13.002843856811523, "global_step": 505057, "epoch": 3006} {"train_loss": -12.663467407226562, "global_step": 505058, "epoch": 3006} {"train_loss": -12.577764511108398, "global_step": 505059, "epoch": 3006} {"train_loss": -12.860393524169922, "global_step": 505060, "epoch": 3006} {"train_loss": -12.72877025604248, "global_step": 505061, "epoch": 3006} {"train_loss": -12.67934513092041, "global_step": 505062, "epoch": 3006} {"train_loss": -12.887458801269531, "global_step": 505063, "epoch": 3006} {"train_loss": -12.662496566772461, "global_step": 505064, "epoch": 3006} {"train_loss": -12.355646133422852, "global_step": 505065, "epoch": 3006} {"train_loss": -12.538564682006836, "global_step": 505066, "epoch": 3006} {"train_loss": -12.404537200927734, "global_step": 505067, "epoch": 3006} {"train_loss": -12.860713958740234, "global_step": 505068, "epoch": 3006} {"train_loss": -12.227188110351562, "global_step": 505069, "epoch": 3006} {"train_loss": -12.59852409362793, "global_step": 505070, "epoch": 3006} {"train_loss": -12.622225761413574, "global_step": 505071, "epoch": 3006} {"train_loss": -12.638662338256836, "global_step": 505072, "epoch": 3006} {"train_loss": -13.012775421142578, "global_step": 505073, "epoch": 3006} {"train_loss": -12.234737396240234, "global_step": 505074, "epoch": 3006} {"train_loss": -12.590397834777832, "global_step": 505075, "epoch": 3006} {"train_loss": -12.692548751831055, "global_step": 505076, "epoch": 3006} {"train_loss": -12.747743606567383, "global_step": 505077, "epoch": 3006} {"train_loss": -12.081657409667969, "global_step": 505078, "epoch": 3006} {"train_loss": -12.308860778808594, "global_step": 505079, "epoch": 3006} {"train_loss": -12.708860397338867, "global_step": 505080, "epoch": 3006} {"train_loss": -12.441143035888672, "global_step": 505081, "epoch": 3006} {"train_loss": -12.31043529510498, "global_step": 505082, "epoch": 3006} {"train_loss": -12.770575523376465, "global_step": 505083, "epoch": 3006} {"train_loss": -12.559772491455078, "global_step": 505084, "epoch": 3006} {"train_loss": -11.760366439819336, "global_step": 505085, "epoch": 3006} {"train_loss": -12.430728912353516, "global_step": 505086, "epoch": 3006} {"train_loss": -12.745515823364258, "global_step": 505087, "epoch": 3006} {"train_loss": -12.329662322998047, "global_step": 505088, "epoch": 3006} {"train_loss": -12.71745777130127, "global_step": 505089, "epoch": 3006} {"train_loss": -12.61801528930664, "global_step": 505090, "epoch": 3006} {"train_loss": -12.221721649169922, "global_step": 505091, "epoch": 3006} {"train_loss": -12.78271484375, "global_step": 505092, "epoch": 3006} {"train_loss": -12.559380531311035, "global_step": 505093, "epoch": 3006} {"train_loss": -12.120548248291016, "global_step": 505094, "epoch": 3006} {"train_loss": -12.483552932739258, "global_step": 505095, "epoch": 3006} {"train_loss": -12.940804481506348, "global_step": 505096, "epoch": 3006} {"train_loss": -12.406654357910156, "global_step": 505097, "epoch": 3006} {"train_loss": -12.845659255981445, "global_step": 505098, "epoch": 3006} {"train_loss": -12.793561935424805, "global_step": 505099, "epoch": 3006} {"train_loss": -12.37342357635498, "global_step": 505100, "epoch": 3006} {"train_loss": -12.853972434997559, "global_step": 505101, "epoch": 3006} {"train_loss": -13.04092788696289, "global_step": 505102, "epoch": 3006} {"train_loss": -13.024503707885742, "global_step": 505103, "epoch": 3006} {"train_loss": -12.99207878112793, "global_step": 505104, "epoch": 3006} {"train_loss": -12.914636611938477, "global_step": 505105, "epoch": 3006} {"train_loss": -12.855725288391113, "global_step": 505106, "epoch": 3006} {"train_loss": -13.075484275817871, "global_step": 505107, "epoch": 3006} {"train_loss": -12.89114761352539, "global_step": 505108, "epoch": 3006} {"train_loss": -12.996539115905762, "global_step": 505109, "epoch": 3006} {"train_loss": -12.95689582824707, "global_step": 505110, "epoch": 3006} {"train_loss": -12.965527534484863, "global_step": 505111, "epoch": 3006} {"train_loss": -12.968318939208984, "global_step": 505112, "epoch": 3006} {"train_loss": -12.662364959716797, "global_step": 505113, "epoch": 3006} {"train_loss": -12.932402610778809, "global_step": 505114, "epoch": 3006} {"train_loss": -12.76146125793457, "global_step": 505115, "epoch": 3006} {"train_loss": -13.00078010559082, "global_step": 505116, "epoch": 3006} {"train_loss": -12.852620124816895, "global_step": 505117, "epoch": 3006} {"train_loss": -12.78931713104248, "global_step": 505118, "epoch": 3006} {"train_loss": -13.071086883544922, "global_step": 505119, "epoch": 3006} {"train_loss": -12.758956909179688, "global_step": 505120, "epoch": 3006} {"train_loss": -12.999336242675781, "global_step": 505121, "epoch": 3006} {"train_loss": -12.931615829467773, "global_step": 505122, "epoch": 3006} {"train_loss": -13.054216384887695, "global_step": 505123, "epoch": 3006} {"train_loss": -12.83928108215332, "global_step": 505124, "epoch": 3006} {"train_loss": -12.764763832092285, "global_step": 505125, "epoch": 3006} {"train_loss": -13.036028861999512, "global_step": 505126, "epoch": 3006} {"train_loss": -12.911005973815918, "global_step": 505127, "epoch": 3006} {"train_loss": -12.537673950195312, "global_step": 505128, "epoch": 3006} {"train_loss": -12.52806282043457, "global_step": 505129, "epoch": 3006} {"train_loss": -11.586241722106934, "global_step": 505130, "epoch": 3006} {"train_loss": -11.845097541809082, "global_step": 505131, "epoch": 3006} {"train_loss": -12.509254455566406, "global_step": 505132, "epoch": 3006} {"train_loss": -12.724076271057129, "global_step": 505133, "epoch": 3006} {"train_loss": -11.992402076721191, "global_step": 505134, "epoch": 3006} {"train_loss": -12.195626258850098, "global_step": 505135, "epoch": 3006} {"train_loss": -11.873870849609375, "global_step": 505136, "epoch": 3006} {"train_loss": -11.419107437133789, "global_step": 505137, "epoch": 3006} {"train_loss": -11.661760330200195, "global_step": 505138, "epoch": 3006} {"train_loss": -10.966764450073242, "global_step": 505139, "epoch": 3006} {"train_loss": -9.892088890075684, "global_step": 505140, "epoch": 3006} {"train_loss": -10.908714294433594, "global_step": 505141, "epoch": 3006} {"train_loss": -9.434026718139648, "global_step": 505142, "epoch": 3006} {"train_loss": -9.750880241394043, "global_step": 505143, "epoch": 3006} {"train_loss": -10.231119155883789, "global_step": 505144, "epoch": 3006} {"train_loss": -10.53369140625, "global_step": 505145, "epoch": 3006} {"train_loss": -10.182544708251953, "global_step": 505146, "epoch": 3006} {"train_loss": -8.293371200561523, "global_step": 505147, "epoch": 3006} {"train_loss": -8.714855194091797, "global_step": 505148, "epoch": 3006} {"train_loss": -8.335554122924805, "global_step": 505149, "epoch": 3006} {"train_loss": -8.810240745544434, "global_step": 505150, "epoch": 3006} {"train_loss": -8.697224617004395, "global_step": 505151, "epoch": 3006} {"train_loss": -8.431241989135742, "global_step": 505152, "epoch": 3006} {"train_loss": -7.880883693695068, "global_step": 505153, "epoch": 3006} {"train_loss": -8.178789138793945, "global_step": 505154, "epoch": 3006} {"train_loss": -7.9914116859436035, "global_step": 505155, "epoch": 3006} {"train_loss": -7.775286674499512, "global_step": 505156, "epoch": 3006} {"train_loss": -8.573307037353516, "global_step": 505157, "epoch": 3006} {"train_loss": -8.918830871582031, "global_step": 505158, "epoch": 3006} {"train_loss": -8.69771957397461, "global_step": 505159, "epoch": 3006} {"train_loss": -9.358019828796387, "global_step": 505160, "epoch": 3006} {"train_loss": -8.985613822937012, "global_step": 505161, "epoch": 3006} {"train_loss": -9.140375137329102, "global_step": 505162, "epoch": 3006} {"train_loss": -9.575502395629883, "global_step": 505163, "epoch": 3006} {"train_loss": -9.365242958068848, "global_step": 505164, "epoch": 3006} {"train_loss": -9.892048835754395, "global_step": 505165, "epoch": 3006} {"train_loss": -9.480623245239258, "global_step": 505166, "epoch": 3006} {"train_loss": -10.1662015914917, "global_step": 505167, "epoch": 3006} {"train_loss": -10.454068183898926, "global_step": 505168, "epoch": 3006} {"train_loss": -11.00192642211914, "global_step": 505169, "epoch": 3006} {"train_loss": -10.715679168701172, "global_step": 505170, "epoch": 3006} {"train_loss": -10.845221519470215, "global_step": 505171, "epoch": 3006} {"train_loss": -11.259765625, "global_step": 505172, "epoch": 3006} {"train_loss": -10.151683807373047, "global_step": 505173, "epoch": 3006} {"train_loss": -10.763426780700684, "global_step": 505174, "epoch": 3006} {"train_loss": -11.883666799181984, "global_step": 505175, "epoch": 3006, "val_loss": 318537.84375} {"train_loss": -9.71609115600586, "global_step": 505176, "epoch": 3007} {"train_loss": -10.858993530273438, "global_step": 505177, "epoch": 3007} {"train_loss": -10.790072441101074, "global_step": 505178, "epoch": 3007} {"train_loss": -10.540454864501953, "global_step": 505179, "epoch": 3007} {"train_loss": -11.407966613769531, "global_step": 505180, "epoch": 3007} {"train_loss": -10.686450004577637, "global_step": 505181, "epoch": 3007} {"train_loss": -10.40638256072998, "global_step": 505182, "epoch": 3007} {"train_loss": -11.324180603027344, "global_step": 505183, "epoch": 3007} {"train_loss": -11.139532089233398, "global_step": 505184, "epoch": 3007} {"train_loss": -11.172017097473145, "global_step": 505185, "epoch": 3007} {"train_loss": -11.54334545135498, "global_step": 505186, "epoch": 3007} {"train_loss": -11.409904479980469, "global_step": 505187, "epoch": 3007} {"train_loss": -11.365281105041504, "global_step": 505188, "epoch": 3007} {"train_loss": -11.96904182434082, "global_step": 505189, "epoch": 3007} {"train_loss": -11.707615852355957, "global_step": 505190, "epoch": 3007} {"train_loss": -11.961760520935059, "global_step": 505191, "epoch": 3007} {"train_loss": -11.543783187866211, "global_step": 505192, "epoch": 3007} {"train_loss": -12.031312942504883, "global_step": 505193, "epoch": 3007} {"train_loss": -11.570677757263184, "global_step": 505194, "epoch": 3007} {"train_loss": -11.745918273925781, "global_step": 505195, "epoch": 3007} {"train_loss": -11.597905158996582, "global_step": 505196, "epoch": 3007} {"train_loss": -11.198701858520508, "global_step": 505197, "epoch": 3007} {"train_loss": -11.63582992553711, "global_step": 505198, "epoch": 3007} {"train_loss": -11.586962699890137, "global_step": 505199, "epoch": 3007} {"train_loss": -12.132871627807617, "global_step": 505200, "epoch": 3007} {"train_loss": -11.754273414611816, "global_step": 505201, "epoch": 3007} {"train_loss": -12.039878845214844, "global_step": 505202, "epoch": 3007} {"train_loss": -11.942110061645508, "global_step": 505203, "epoch": 3007} {"train_loss": -11.758389472961426, "global_step": 505204, "epoch": 3007} {"train_loss": -12.156518936157227, "global_step": 505205, "epoch": 3007} {"train_loss": -11.956625938415527, "global_step": 505206, "epoch": 3007} {"train_loss": -12.353321075439453, "global_step": 505207, "epoch": 3007} {"train_loss": -11.885191917419434, "global_step": 505208, "epoch": 3007} {"train_loss": -12.218233108520508, "global_step": 505209, "epoch": 3007} {"train_loss": -11.695865631103516, "global_step": 505210, "epoch": 3007} {"train_loss": -12.44085693359375, "global_step": 505211, "epoch": 3007} {"train_loss": -11.795169830322266, "global_step": 505212, "epoch": 3007} {"train_loss": -12.659212112426758, "global_step": 505213, "epoch": 3007} {"train_loss": -12.1417818069458, "global_step": 505214, "epoch": 3007} {"train_loss": -12.635446548461914, "global_step": 505215, "epoch": 3007} {"train_loss": -12.222906112670898, "global_step": 505216, "epoch": 3007} {"train_loss": -12.542394638061523, "global_step": 505217, "epoch": 3007} {"train_loss": -12.270014762878418, "global_step": 505218, "epoch": 3007} {"train_loss": -12.499968528747559, "global_step": 505219, "epoch": 3007} {"train_loss": -12.179044723510742, "global_step": 505220, "epoch": 3007} {"train_loss": -12.485841751098633, "global_step": 505221, "epoch": 3007} {"train_loss": -11.915858268737793, "global_step": 505222, "epoch": 3007} {"train_loss": -12.670849800109863, "global_step": 505223, "epoch": 3007} {"train_loss": -12.370473861694336, "global_step": 505224, "epoch": 3007} {"train_loss": -12.520503997802734, "global_step": 505225, "epoch": 3007} {"train_loss": -12.392219543457031, "global_step": 505226, "epoch": 3007} {"train_loss": -12.508234024047852, "global_step": 505227, "epoch": 3007} {"train_loss": -12.59634780883789, "global_step": 505228, "epoch": 3007} {"train_loss": -12.668088912963867, "global_step": 505229, "epoch": 3007} {"train_loss": -12.543547630310059, "global_step": 505230, "epoch": 3007} {"train_loss": -12.602133750915527, "global_step": 505231, "epoch": 3007} {"train_loss": -12.807533264160156, "global_step": 505232, "epoch": 3007} {"train_loss": -12.672952651977539, "global_step": 505233, "epoch": 3007} {"train_loss": -12.825965881347656, "global_step": 505234, "epoch": 3007} {"train_loss": -12.652210235595703, "global_step": 505235, "epoch": 3007} {"train_loss": -12.6708345413208, "global_step": 505236, "epoch": 3007} {"train_loss": -12.639573097229004, "global_step": 505237, "epoch": 3007} {"train_loss": -12.612493515014648, "global_step": 505238, "epoch": 3007} {"train_loss": -12.707511901855469, "global_step": 505239, "epoch": 3007} {"train_loss": -12.541497230529785, "global_step": 505240, "epoch": 3007} {"train_loss": -12.80795955657959, "global_step": 505241, "epoch": 3007} {"train_loss": -12.644546508789062, "global_step": 505242, "epoch": 3007} {"train_loss": -12.867414474487305, "global_step": 505243, "epoch": 3007} {"train_loss": -12.699883460998535, "global_step": 505244, "epoch": 3007} {"train_loss": -12.796965599060059, "global_step": 505245, "epoch": 3007} {"train_loss": -12.826936721801758, "global_step": 505246, "epoch": 3007} {"train_loss": -12.739421844482422, "global_step": 505247, "epoch": 3007} {"train_loss": -12.795711517333984, "global_step": 505248, "epoch": 3007} {"train_loss": -12.618390083312988, "global_step": 505249, "epoch": 3007} {"train_loss": -12.792296409606934, "global_step": 505250, "epoch": 3007} {"train_loss": -12.68193244934082, "global_step": 505251, "epoch": 3007} {"train_loss": -12.923391342163086, "global_step": 505252, "epoch": 3007} {"train_loss": -12.942840576171875, "global_step": 505253, "epoch": 3007} {"train_loss": -12.966224670410156, "global_step": 505254, "epoch": 3007} {"train_loss": -12.861753463745117, "global_step": 505255, "epoch": 3007} {"train_loss": -12.973081588745117, "global_step": 505256, "epoch": 3007} {"train_loss": -12.868673324584961, "global_step": 505257, "epoch": 3007} {"train_loss": -12.696056365966797, "global_step": 505258, "epoch": 3007} {"train_loss": -12.820819854736328, "global_step": 505259, "epoch": 3007} {"train_loss": -12.80228042602539, "global_step": 505260, "epoch": 3007} {"train_loss": -12.775243759155273, "global_step": 505261, "epoch": 3007} {"train_loss": -12.863359451293945, "global_step": 505262, "epoch": 3007} {"train_loss": -12.418418884277344, "global_step": 505263, "epoch": 3007} {"train_loss": -12.989614486694336, "global_step": 505264, "epoch": 3007} {"train_loss": -12.70966911315918, "global_step": 505265, "epoch": 3007} {"train_loss": -12.183830261230469, "global_step": 505266, "epoch": 3007} {"train_loss": -11.946538925170898, "global_step": 505267, "epoch": 3007} {"train_loss": -12.803338050842285, "global_step": 505268, "epoch": 3007} {"train_loss": -12.416849136352539, "global_step": 505269, "epoch": 3007} {"train_loss": -12.417211532592773, "global_step": 505270, "epoch": 3007} {"train_loss": -12.519538879394531, "global_step": 505271, "epoch": 3007} {"train_loss": -12.433097839355469, "global_step": 505272, "epoch": 3007} {"train_loss": -12.84176254272461, "global_step": 505273, "epoch": 3007} {"train_loss": -12.250761985778809, "global_step": 505274, "epoch": 3007} {"train_loss": -12.684978485107422, "global_step": 505275, "epoch": 3007} {"train_loss": -12.708806037902832, "global_step": 505276, "epoch": 3007} {"train_loss": -12.1712064743042, "global_step": 505277, "epoch": 3007} {"train_loss": -12.454981803894043, "global_step": 505278, "epoch": 3007} {"train_loss": -12.793031692504883, "global_step": 505279, "epoch": 3007} {"train_loss": -12.590110778808594, "global_step": 505280, "epoch": 3007} {"train_loss": -12.408485412597656, "global_step": 505281, "epoch": 3007} {"train_loss": -12.544858932495117, "global_step": 505282, "epoch": 3007} {"train_loss": -12.711793899536133, "global_step": 505283, "epoch": 3007} {"train_loss": -12.455848693847656, "global_step": 505284, "epoch": 3007} {"train_loss": -12.28994369506836, "global_step": 505285, "epoch": 3007} {"train_loss": -12.658294677734375, "global_step": 505286, "epoch": 3007} {"train_loss": -12.322883605957031, "global_step": 505287, "epoch": 3007} {"train_loss": -12.310188293457031, "global_step": 505288, "epoch": 3007} {"train_loss": -13.044981002807617, "global_step": 505289, "epoch": 3007} {"train_loss": -12.871891021728516, "global_step": 505290, "epoch": 3007} {"train_loss": -12.544998168945312, "global_step": 505291, "epoch": 3007} {"train_loss": -12.693883895874023, "global_step": 505292, "epoch": 3007} {"train_loss": -12.921491622924805, "global_step": 505293, "epoch": 3007} {"train_loss": -12.51391315460205, "global_step": 505294, "epoch": 3007} {"train_loss": -12.54758071899414, "global_step": 505295, "epoch": 3007} {"train_loss": -12.7347412109375, "global_step": 505296, "epoch": 3007} {"train_loss": -12.633028030395508, "global_step": 505297, "epoch": 3007} {"train_loss": -12.43167495727539, "global_step": 505298, "epoch": 3007} {"train_loss": -12.549139976501465, "global_step": 505299, "epoch": 3007} {"train_loss": -12.446069717407227, "global_step": 505300, "epoch": 3007} {"train_loss": -12.565418243408203, "global_step": 505301, "epoch": 3007} {"train_loss": -12.147577285766602, "global_step": 505302, "epoch": 3007} {"train_loss": -12.104541778564453, "global_step": 505303, "epoch": 3007} {"train_loss": -12.183650016784668, "global_step": 505304, "epoch": 3007} {"train_loss": -10.919504165649414, "global_step": 505305, "epoch": 3007} {"train_loss": -11.933189392089844, "global_step": 505306, "epoch": 3007} {"train_loss": -11.523062705993652, "global_step": 505307, "epoch": 3007} {"train_loss": -10.966392517089844, "global_step": 505308, "epoch": 3007} {"train_loss": -10.591394424438477, "global_step": 505309, "epoch": 3007} {"train_loss": -12.395471572875977, "global_step": 505310, "epoch": 3007} {"train_loss": -10.974807739257812, "global_step": 505311, "epoch": 3007} {"train_loss": -11.235363006591797, "global_step": 505312, "epoch": 3007} {"train_loss": -12.307164192199707, "global_step": 505313, "epoch": 3007} {"train_loss": -10.551971435546875, "global_step": 505314, "epoch": 3007} {"train_loss": -11.470376014709473, "global_step": 505315, "epoch": 3007} {"train_loss": -11.586370468139648, "global_step": 505316, "epoch": 3007} {"train_loss": -11.227006912231445, "global_step": 505317, "epoch": 3007} {"train_loss": -11.858182907104492, "global_step": 505318, "epoch": 3007} {"train_loss": -11.284367561340332, "global_step": 505319, "epoch": 3007} {"train_loss": -10.655824661254883, "global_step": 505320, "epoch": 3007} {"train_loss": -10.706941604614258, "global_step": 505321, "epoch": 3007} {"train_loss": -12.734702110290527, "global_step": 505322, "epoch": 3007} {"train_loss": -11.19865894317627, "global_step": 505323, "epoch": 3007} {"train_loss": -11.325422286987305, "global_step": 505324, "epoch": 3007} {"train_loss": -11.74949836730957, "global_step": 505325, "epoch": 3007} {"train_loss": -11.649646759033203, "global_step": 505326, "epoch": 3007} {"train_loss": -12.307449340820312, "global_step": 505327, "epoch": 3007} {"train_loss": -12.003503799438477, "global_step": 505328, "epoch": 3007} {"train_loss": -12.376251220703125, "global_step": 505329, "epoch": 3007} {"train_loss": -12.044986724853516, "global_step": 505330, "epoch": 3007} {"train_loss": -12.289199829101562, "global_step": 505331, "epoch": 3007} {"train_loss": -12.439111709594727, "global_step": 505332, "epoch": 3007} {"train_loss": -11.968841552734375, "global_step": 505333, "epoch": 3007} {"train_loss": -12.357544898986816, "global_step": 505334, "epoch": 3007} {"train_loss": -12.007278442382812, "global_step": 505335, "epoch": 3007} {"train_loss": -12.393407821655273, "global_step": 505336, "epoch": 3007} {"train_loss": -12.270296096801758, "global_step": 505337, "epoch": 3007} {"train_loss": -12.022043228149414, "global_step": 505338, "epoch": 3007} {"train_loss": -12.847784042358398, "global_step": 505339, "epoch": 3007} {"train_loss": -12.125626564025879, "global_step": 505340, "epoch": 3007} {"train_loss": -12.829219818115234, "global_step": 505341, "epoch": 3007} {"train_loss": -12.484735488891602, "global_step": 505342, "epoch": 3007} {"train_loss": -12.174816983086723, "global_step": 505343, "epoch": 3007, "val_loss": 321909.84375} {"train_loss": -12.529186248779297, "global_step": 505344, "epoch": 3008} {"train_loss": -12.785022735595703, "global_step": 505345, "epoch": 3008} {"train_loss": -12.631522178649902, "global_step": 505346, "epoch": 3008} {"train_loss": -12.515176773071289, "global_step": 505347, "epoch": 3008} {"train_loss": -12.508769989013672, "global_step": 505348, "epoch": 3008} {"train_loss": -12.521613121032715, "global_step": 505349, "epoch": 3008} {"train_loss": -12.603626251220703, "global_step": 505350, "epoch": 3008} {"train_loss": -12.619895935058594, "global_step": 505351, "epoch": 3008} {"train_loss": -12.719938278198242, "global_step": 505352, "epoch": 3008} {"train_loss": -12.792119026184082, "global_step": 505353, "epoch": 3008} {"train_loss": -12.598052024841309, "global_step": 505354, "epoch": 3008} {"train_loss": -12.424715042114258, "global_step": 505355, "epoch": 3008} {"train_loss": -12.720647811889648, "global_step": 505356, "epoch": 3008} {"train_loss": -12.489118576049805, "global_step": 505357, "epoch": 3008} {"train_loss": -12.390552520751953, "global_step": 505358, "epoch": 3008} {"train_loss": -12.221883773803711, "global_step": 505359, "epoch": 3008} {"train_loss": -12.52667236328125, "global_step": 505360, "epoch": 3008} {"train_loss": -12.65311050415039, "global_step": 505361, "epoch": 3008} {"train_loss": -12.391602516174316, "global_step": 505362, "epoch": 3008} {"train_loss": -12.374531745910645, "global_step": 505363, "epoch": 3008} {"train_loss": -12.485093116760254, "global_step": 505364, "epoch": 3008} {"train_loss": -12.29625129699707, "global_step": 505365, "epoch": 3008} {"train_loss": -11.851922035217285, "global_step": 505366, "epoch": 3008} {"train_loss": -12.854850769042969, "global_step": 505367, "epoch": 3008} {"train_loss": -12.160834312438965, "global_step": 505368, "epoch": 3008} {"train_loss": -12.181522369384766, "global_step": 505369, "epoch": 3008} {"train_loss": -12.343358993530273, "global_step": 505370, "epoch": 3008} {"train_loss": -12.008160591125488, "global_step": 505371, "epoch": 3008} {"train_loss": -11.528552055358887, "global_step": 505372, "epoch": 3008} {"train_loss": -12.208005905151367, "global_step": 505373, "epoch": 3008} {"train_loss": -11.954792022705078, "global_step": 505374, "epoch": 3008} {"train_loss": -10.598901748657227, "global_step": 505375, "epoch": 3008} {"train_loss": -12.568304061889648, "global_step": 505376, "epoch": 3008} {"train_loss": -11.66132926940918, "global_step": 505377, "epoch": 3008} {"train_loss": -12.151936531066895, "global_step": 505378, "epoch": 3008} {"train_loss": -11.934374809265137, "global_step": 505379, "epoch": 3008} {"train_loss": -11.931876182556152, "global_step": 505380, "epoch": 3008} {"train_loss": -12.244165420532227, "global_step": 505381, "epoch": 3008} {"train_loss": -11.280204772949219, "global_step": 505382, "epoch": 3008} {"train_loss": -12.156584739685059, "global_step": 505383, "epoch": 3008} {"train_loss": -12.28757381439209, "global_step": 505384, "epoch": 3008} {"train_loss": -12.62257194519043, "global_step": 505385, "epoch": 3008} {"train_loss": -11.764972686767578, "global_step": 505386, "epoch": 3008} {"train_loss": -12.127254486083984, "global_step": 505387, "epoch": 3008} {"train_loss": -12.151641845703125, "global_step": 505388, "epoch": 3008} {"train_loss": -11.597811698913574, "global_step": 505389, "epoch": 3008} {"train_loss": -12.286599159240723, "global_step": 505390, "epoch": 3008} {"train_loss": -10.815780639648438, "global_step": 505391, "epoch": 3008} {"train_loss": -12.517792701721191, "global_step": 505392, "epoch": 3008} {"train_loss": -11.067495346069336, "global_step": 505393, "epoch": 3008} {"train_loss": -12.673720359802246, "global_step": 505394, "epoch": 3008} {"train_loss": -11.357742309570312, "global_step": 505395, "epoch": 3008} {"train_loss": -12.187776565551758, "global_step": 505396, "epoch": 3008} {"train_loss": -11.96414852142334, "global_step": 505397, "epoch": 3008} {"train_loss": -11.761098861694336, "global_step": 505398, "epoch": 3008} {"train_loss": -11.778715133666992, "global_step": 505399, "epoch": 3008} {"train_loss": -10.747953414916992, "global_step": 505400, "epoch": 3008} {"train_loss": -12.026123046875, "global_step": 505401, "epoch": 3008} {"train_loss": -12.338287353515625, "global_step": 505402, "epoch": 3008} {"train_loss": -10.989978790283203, "global_step": 505403, "epoch": 3008} {"train_loss": -12.1673002243042, "global_step": 505404, "epoch": 3008} {"train_loss": -11.425808906555176, "global_step": 505405, "epoch": 3008} {"train_loss": -12.32227897644043, "global_step": 505406, "epoch": 3008} {"train_loss": -11.683713912963867, "global_step": 505407, "epoch": 3008} {"train_loss": -12.22050952911377, "global_step": 505408, "epoch": 3008} {"train_loss": -12.095409393310547, "global_step": 505409, "epoch": 3008} {"train_loss": -11.71558952331543, "global_step": 505410, "epoch": 3008} {"train_loss": -12.45895767211914, "global_step": 505411, "epoch": 3008} {"train_loss": -11.715093612670898, "global_step": 505412, "epoch": 3008} {"train_loss": -12.314346313476562, "global_step": 505413, "epoch": 3008} {"train_loss": -12.122023582458496, "global_step": 505414, "epoch": 3008} {"train_loss": -11.874886512756348, "global_step": 505415, "epoch": 3008} {"train_loss": -12.62951374053955, "global_step": 505416, "epoch": 3008} {"train_loss": -11.800599098205566, "global_step": 505417, "epoch": 3008} {"train_loss": -12.872016906738281, "global_step": 505418, "epoch": 3008} {"train_loss": -11.96670913696289, "global_step": 505419, "epoch": 3008} {"train_loss": -12.788780212402344, "global_step": 505420, "epoch": 3008} {"train_loss": -12.615579605102539, "global_step": 505421, "epoch": 3008} {"train_loss": -12.018518447875977, "global_step": 505422, "epoch": 3008} {"train_loss": -12.518095970153809, "global_step": 505423, "epoch": 3008} {"train_loss": -12.056628227233887, "global_step": 505424, "epoch": 3008} {"train_loss": -12.624822616577148, "global_step": 505425, "epoch": 3008} {"train_loss": -11.803997039794922, "global_step": 505426, "epoch": 3008} {"train_loss": -12.484386444091797, "global_step": 505427, "epoch": 3008} {"train_loss": -12.185104370117188, "global_step": 505428, "epoch": 3008} {"train_loss": -11.82473373413086, "global_step": 505429, "epoch": 3008} {"train_loss": -12.482565879821777, "global_step": 505430, "epoch": 3008} {"train_loss": -12.003071784973145, "global_step": 505431, "epoch": 3008} {"train_loss": -12.711311340332031, "global_step": 505432, "epoch": 3008} {"train_loss": -11.860492706298828, "global_step": 505433, "epoch": 3008} {"train_loss": -12.559819221496582, "global_step": 505434, "epoch": 3008} {"train_loss": -12.155750274658203, "global_step": 505435, "epoch": 3008} {"train_loss": -12.040163040161133, "global_step": 505436, "epoch": 3008} {"train_loss": -12.293716430664062, "global_step": 505437, "epoch": 3008} {"train_loss": -12.038646697998047, "global_step": 505438, "epoch": 3008} {"train_loss": -12.536526679992676, "global_step": 505439, "epoch": 3008} {"train_loss": -12.005614280700684, "global_step": 505440, "epoch": 3008} {"train_loss": -12.44130802154541, "global_step": 505441, "epoch": 3008} {"train_loss": -12.308157920837402, "global_step": 505442, "epoch": 3008} {"train_loss": -12.36075496673584, "global_step": 505443, "epoch": 3008} {"train_loss": -12.32728099822998, "global_step": 505444, "epoch": 3008} {"train_loss": -12.252538681030273, "global_step": 505445, "epoch": 3008} {"train_loss": -12.480177879333496, "global_step": 505446, "epoch": 3008} {"train_loss": -12.04658031463623, "global_step": 505447, "epoch": 3008} {"train_loss": -12.750513076782227, "global_step": 505448, "epoch": 3008} {"train_loss": -12.424162864685059, "global_step": 505449, "epoch": 3008} {"train_loss": -12.774028778076172, "global_step": 505450, "epoch": 3008} {"train_loss": -12.702841758728027, "global_step": 505451, "epoch": 3008} {"train_loss": -12.464815139770508, "global_step": 505452, "epoch": 3008} {"train_loss": -12.688699722290039, "global_step": 505453, "epoch": 3008} {"train_loss": -12.73402214050293, "global_step": 505454, "epoch": 3008} {"train_loss": -12.643501281738281, "global_step": 505455, "epoch": 3008} {"train_loss": -12.718093872070312, "global_step": 505456, "epoch": 3008} {"train_loss": -12.69741153717041, "global_step": 505457, "epoch": 3008} {"train_loss": -12.744361877441406, "global_step": 505458, "epoch": 3008} {"train_loss": -12.888729095458984, "global_step": 505459, "epoch": 3008} {"train_loss": -12.837703704833984, "global_step": 505460, "epoch": 3008} {"train_loss": -12.861100196838379, "global_step": 505461, "epoch": 3008} {"train_loss": -12.72189998626709, "global_step": 505462, "epoch": 3008} {"train_loss": -12.758951187133789, "global_step": 505463, "epoch": 3008} {"train_loss": -12.972061157226562, "global_step": 505464, "epoch": 3008} {"train_loss": -12.975494384765625, "global_step": 505465, "epoch": 3008} {"train_loss": -12.89261245727539, "global_step": 505466, "epoch": 3008} {"train_loss": -12.971794128417969, "global_step": 505467, "epoch": 3008} {"train_loss": -12.57207202911377, "global_step": 505468, "epoch": 3008} {"train_loss": -12.948812484741211, "global_step": 505469, "epoch": 3008} {"train_loss": -12.687567710876465, "global_step": 505470, "epoch": 3008} {"train_loss": -12.779345512390137, "global_step": 505471, "epoch": 3008} {"train_loss": -12.714302062988281, "global_step": 505472, "epoch": 3008} {"train_loss": -12.647592544555664, "global_step": 505473, "epoch": 3008} {"train_loss": -12.712000846862793, "global_step": 505474, "epoch": 3008} {"train_loss": -12.682693481445312, "global_step": 505475, "epoch": 3008} {"train_loss": -12.722395896911621, "global_step": 505476, "epoch": 3008} {"train_loss": -12.797433853149414, "global_step": 505477, "epoch": 3008} {"train_loss": -12.917882919311523, "global_step": 505478, "epoch": 3008} {"train_loss": -12.640944480895996, "global_step": 505479, "epoch": 3008} {"train_loss": -13.062517166137695, "global_step": 505480, "epoch": 3008} {"train_loss": -12.694419860839844, "global_step": 505481, "epoch": 3008} {"train_loss": -12.76692008972168, "global_step": 505482, "epoch": 3008} {"train_loss": -12.63713550567627, "global_step": 505483, "epoch": 3008} {"train_loss": -12.726058959960938, "global_step": 505484, "epoch": 3008} {"train_loss": -12.934249877929688, "global_step": 505485, "epoch": 3008} {"train_loss": -12.787714004516602, "global_step": 505486, "epoch": 3008} {"train_loss": -12.127243041992188, "global_step": 505487, "epoch": 3008} {"train_loss": -12.840278625488281, "global_step": 505488, "epoch": 3008} {"train_loss": -12.701255798339844, "global_step": 505489, "epoch": 3008} {"train_loss": -12.656803131103516, "global_step": 505490, "epoch": 3008} {"train_loss": -12.790685653686523, "global_step": 505491, "epoch": 3008} {"train_loss": -12.341525077819824, "global_step": 505492, "epoch": 3008} {"train_loss": -12.680913925170898, "global_step": 505493, "epoch": 3008} {"train_loss": -12.494229316711426, "global_step": 505494, "epoch": 3008} {"train_loss": -12.406606674194336, "global_step": 505495, "epoch": 3008} {"train_loss": -11.87132740020752, "global_step": 505496, "epoch": 3008} {"train_loss": -12.41927719116211, "global_step": 505497, "epoch": 3008} {"train_loss": -12.625297546386719, "global_step": 505498, "epoch": 3008} {"train_loss": -12.663579940795898, "global_step": 505499, "epoch": 3008} {"train_loss": -12.478266716003418, "global_step": 505500, "epoch": 3008} {"train_loss": -12.68056869506836, "global_step": 505501, "epoch": 3008} {"train_loss": -12.540445327758789, "global_step": 505502, "epoch": 3008} {"train_loss": -11.250665664672852, "global_step": 505503, "epoch": 3008} {"train_loss": -11.342475891113281, "global_step": 505504, "epoch": 3008} {"train_loss": -12.314542770385742, "global_step": 505505, "epoch": 3008} {"train_loss": -10.923328399658203, "global_step": 505506, "epoch": 3008} {"train_loss": -11.55605411529541, "global_step": 505507, "epoch": 3008} {"train_loss": -12.17225456237793, "global_step": 505508, "epoch": 3008} {"train_loss": -9.3074369430542, "global_step": 505509, "epoch": 3008} {"train_loss": -11.000030517578125, "global_step": 505510, "epoch": 3008} {"train_loss": -12.28468151887258, "global_step": 505511, "epoch": 3008, "val_loss": 321689.8125} {"train_loss": -11.405094146728516, "global_step": 505512, "epoch": 3009} {"train_loss": -11.69070053100586, "global_step": 505513, "epoch": 3009} {"train_loss": -9.824603080749512, "global_step": 505514, "epoch": 3009} {"train_loss": -11.810680389404297, "global_step": 505515, "epoch": 3009} {"train_loss": -9.383599281311035, "global_step": 505516, "epoch": 3009} {"train_loss": -9.320655822753906, "global_step": 505517, "epoch": 3009} {"train_loss": -10.671974182128906, "global_step": 505518, "epoch": 3009} {"train_loss": -10.39968204498291, "global_step": 505519, "epoch": 3009} {"train_loss": -10.217103958129883, "global_step": 505520, "epoch": 3009} {"train_loss": -10.078600883483887, "global_step": 505521, "epoch": 3009} {"train_loss": -10.170767784118652, "global_step": 505522, "epoch": 3009} {"train_loss": -10.49045181274414, "global_step": 505523, "epoch": 3009} {"train_loss": -10.915290832519531, "global_step": 505524, "epoch": 3009} {"train_loss": -10.70361614227295, "global_step": 505525, "epoch": 3009} {"train_loss": -10.989381790161133, "global_step": 505526, "epoch": 3009} {"train_loss": -10.396316528320312, "global_step": 505527, "epoch": 3009} {"train_loss": -11.246267318725586, "global_step": 505528, "epoch": 3009} {"train_loss": -10.832437515258789, "global_step": 505529, "epoch": 3009} {"train_loss": -10.597731590270996, "global_step": 505530, "epoch": 3009} {"train_loss": -11.385082244873047, "global_step": 505531, "epoch": 3009} {"train_loss": -10.629610061645508, "global_step": 505532, "epoch": 3009} {"train_loss": -10.625560760498047, "global_step": 505533, "epoch": 3009} {"train_loss": -10.963536262512207, "global_step": 505534, "epoch": 3009} {"train_loss": -11.487300872802734, "global_step": 505535, "epoch": 3009} {"train_loss": -10.292657852172852, "global_step": 505536, "epoch": 3009} {"train_loss": -11.20134162902832, "global_step": 505537, "epoch": 3009} {"train_loss": -11.579133987426758, "global_step": 505538, "epoch": 3009} {"train_loss": -11.243125915527344, "global_step": 505539, "epoch": 3009} {"train_loss": -11.910943984985352, "global_step": 505540, "epoch": 3009} {"train_loss": -11.80198860168457, "global_step": 505541, "epoch": 3009} {"train_loss": -11.561214447021484, "global_step": 505542, "epoch": 3009} {"train_loss": -12.188859939575195, "global_step": 505543, "epoch": 3009} {"train_loss": -11.653616905212402, "global_step": 505544, "epoch": 3009} {"train_loss": -11.804346084594727, "global_step": 505545, "epoch": 3009} {"train_loss": -12.286100387573242, "global_step": 505546, "epoch": 3009} {"train_loss": -11.665557861328125, "global_step": 505547, "epoch": 3009} {"train_loss": -12.325270652770996, "global_step": 505548, "epoch": 3009} {"train_loss": -11.910683631896973, "global_step": 505549, "epoch": 3009} {"train_loss": -12.256155967712402, "global_step": 505550, "epoch": 3009} {"train_loss": -12.024505615234375, "global_step": 505551, "epoch": 3009} {"train_loss": -12.102230072021484, "global_step": 505552, "epoch": 3009} {"train_loss": -11.950950622558594, "global_step": 505553, "epoch": 3009} {"train_loss": -11.836018562316895, "global_step": 505554, "epoch": 3009} {"train_loss": -12.177900314331055, "global_step": 505555, "epoch": 3009} {"train_loss": -11.572273254394531, "global_step": 505556, "epoch": 3009} {"train_loss": -11.483232498168945, "global_step": 505557, "epoch": 3009} {"train_loss": -11.561535835266113, "global_step": 505558, "epoch": 3009} {"train_loss": -11.848543167114258, "global_step": 505559, "epoch": 3009} {"train_loss": -11.895750999450684, "global_step": 505560, "epoch": 3009} {"train_loss": -12.400586128234863, "global_step": 505561, "epoch": 3009} {"train_loss": -11.773366928100586, "global_step": 505562, "epoch": 3009} {"train_loss": -12.361992835998535, "global_step": 505563, "epoch": 3009} {"train_loss": -12.30142593383789, "global_step": 505564, "epoch": 3009} {"train_loss": -12.226472854614258, "global_step": 505565, "epoch": 3009} {"train_loss": -12.41581916809082, "global_step": 505566, "epoch": 3009} {"train_loss": -12.133077621459961, "global_step": 505567, "epoch": 3009} {"train_loss": -12.223526954650879, "global_step": 505568, "epoch": 3009} {"train_loss": -12.304948806762695, "global_step": 505569, "epoch": 3009} {"train_loss": -12.690401077270508, "global_step": 505570, "epoch": 3009} {"train_loss": -12.073932647705078, "global_step": 505571, "epoch": 3009} {"train_loss": -12.546785354614258, "global_step": 505572, "epoch": 3009} {"train_loss": -12.325566291809082, "global_step": 505573, "epoch": 3009} {"train_loss": -12.872064590454102, "global_step": 505574, "epoch": 3009} {"train_loss": -12.64535903930664, "global_step": 505575, "epoch": 3009} {"train_loss": -12.516637802124023, "global_step": 505576, "epoch": 3009} {"train_loss": -12.793951988220215, "global_step": 505577, "epoch": 3009} {"train_loss": -12.52662181854248, "global_step": 505578, "epoch": 3009} {"train_loss": -12.661704063415527, "global_step": 505579, "epoch": 3009} {"train_loss": -12.664361953735352, "global_step": 505580, "epoch": 3009} {"train_loss": -12.598407745361328, "global_step": 505581, "epoch": 3009} {"train_loss": -12.586446762084961, "global_step": 505582, "epoch": 3009} {"train_loss": -12.662416458129883, "global_step": 505583, "epoch": 3009} {"train_loss": -12.715761184692383, "global_step": 505584, "epoch": 3009} {"train_loss": -12.717761993408203, "global_step": 505585, "epoch": 3009} {"train_loss": -12.651622772216797, "global_step": 505586, "epoch": 3009} {"train_loss": -12.24264907836914, "global_step": 505587, "epoch": 3009} {"train_loss": -12.671903610229492, "global_step": 505588, "epoch": 3009} {"train_loss": -12.612475395202637, "global_step": 505589, "epoch": 3009} {"train_loss": -12.560593605041504, "global_step": 505590, "epoch": 3009} {"train_loss": -12.438220977783203, "global_step": 505591, "epoch": 3009} {"train_loss": -12.586346626281738, "global_step": 505592, "epoch": 3009} {"train_loss": -12.324878692626953, "global_step": 505593, "epoch": 3009} {"train_loss": -12.88801383972168, "global_step": 505594, "epoch": 3009} {"train_loss": -12.656302452087402, "global_step": 505595, "epoch": 3009} {"train_loss": -12.623279571533203, "global_step": 505596, "epoch": 3009} {"train_loss": -12.86108684539795, "global_step": 505597, "epoch": 3009} {"train_loss": -12.776763916015625, "global_step": 505598, "epoch": 3009} {"train_loss": -12.596114158630371, "global_step": 505599, "epoch": 3009} {"train_loss": -12.57227897644043, "global_step": 505600, "epoch": 3009} {"train_loss": -12.526101112365723, "global_step": 505601, "epoch": 3009} {"train_loss": -12.775208473205566, "global_step": 505602, "epoch": 3009} {"train_loss": -12.663455963134766, "global_step": 505603, "epoch": 3009} {"train_loss": -12.714130401611328, "global_step": 505604, "epoch": 3009} {"train_loss": -12.29240608215332, "global_step": 505605, "epoch": 3009} {"train_loss": -12.765542030334473, "global_step": 505606, "epoch": 3009} {"train_loss": -12.163187026977539, "global_step": 505607, "epoch": 3009} {"train_loss": -12.106876373291016, "global_step": 505608, "epoch": 3009} {"train_loss": -12.462252616882324, "global_step": 505609, "epoch": 3009} {"train_loss": -12.241447448730469, "global_step": 505610, "epoch": 3009} {"train_loss": -12.466349601745605, "global_step": 505611, "epoch": 3009} {"train_loss": -12.617730140686035, "global_step": 505612, "epoch": 3009} {"train_loss": -12.129962921142578, "global_step": 505613, "epoch": 3009} {"train_loss": -12.658833503723145, "global_step": 505614, "epoch": 3009} {"train_loss": -12.34912109375, "global_step": 505615, "epoch": 3009} {"train_loss": -12.36285400390625, "global_step": 505616, "epoch": 3009} {"train_loss": -12.697664260864258, "global_step": 505617, "epoch": 3009} {"train_loss": -12.40799331665039, "global_step": 505618, "epoch": 3009} {"train_loss": -12.437509536743164, "global_step": 505619, "epoch": 3009} {"train_loss": -12.271278381347656, "global_step": 505620, "epoch": 3009} {"train_loss": -12.71139907836914, "global_step": 505621, "epoch": 3009} {"train_loss": -12.376246452331543, "global_step": 505622, "epoch": 3009} {"train_loss": -12.756711959838867, "global_step": 505623, "epoch": 3009} {"train_loss": -12.356021881103516, "global_step": 505624, "epoch": 3009} {"train_loss": -12.039535522460938, "global_step": 505625, "epoch": 3009} {"train_loss": -12.452695846557617, "global_step": 505626, "epoch": 3009} {"train_loss": -12.0645170211792, "global_step": 505627, "epoch": 3009} {"train_loss": -12.472023963928223, "global_step": 505628, "epoch": 3009} {"train_loss": -11.705469131469727, "global_step": 505629, "epoch": 3009} {"train_loss": -11.414963722229004, "global_step": 505630, "epoch": 3009} {"train_loss": -12.355782508850098, "global_step": 505631, "epoch": 3009} {"train_loss": -10.463693618774414, "global_step": 505632, "epoch": 3009} {"train_loss": -11.746515274047852, "global_step": 505633, "epoch": 3009} {"train_loss": -11.106315612792969, "global_step": 505634, "epoch": 3009} {"train_loss": -11.677665710449219, "global_step": 505635, "epoch": 3009} {"train_loss": -11.285035133361816, "global_step": 505636, "epoch": 3009} {"train_loss": -11.043452262878418, "global_step": 505637, "epoch": 3009} {"train_loss": -12.17763900756836, "global_step": 505638, "epoch": 3009} {"train_loss": -10.93763256072998, "global_step": 505639, "epoch": 3009} {"train_loss": -11.052593231201172, "global_step": 505640, "epoch": 3009} {"train_loss": -11.271114349365234, "global_step": 505641, "epoch": 3009} {"train_loss": -11.310227394104004, "global_step": 505642, "epoch": 3009} {"train_loss": -10.80156135559082, "global_step": 505643, "epoch": 3009} {"train_loss": -11.24177074432373, "global_step": 505644, "epoch": 3009} {"train_loss": -10.198512077331543, "global_step": 505645, "epoch": 3009} {"train_loss": -11.25098705291748, "global_step": 505646, "epoch": 3009} {"train_loss": -9.899541854858398, "global_step": 505647, "epoch": 3009} {"train_loss": -11.26323413848877, "global_step": 505648, "epoch": 3009} {"train_loss": -10.764509201049805, "global_step": 505649, "epoch": 3009} {"train_loss": -10.924569129943848, "global_step": 505650, "epoch": 3009} {"train_loss": -11.511930465698242, "global_step": 505651, "epoch": 3009} {"train_loss": -11.727611541748047, "global_step": 505652, "epoch": 3009} {"train_loss": -11.3165283203125, "global_step": 505653, "epoch": 3009} {"train_loss": -11.763117790222168, "global_step": 505654, "epoch": 3009} {"train_loss": -10.979689598083496, "global_step": 505655, "epoch": 3009} {"train_loss": -11.707499504089355, "global_step": 505656, "epoch": 3009} {"train_loss": -10.26275634765625, "global_step": 505657, "epoch": 3009} {"train_loss": -10.834762573242188, "global_step": 505658, "epoch": 3009} {"train_loss": -11.812704086303711, "global_step": 505659, "epoch": 3009} {"train_loss": -9.797927856445312, "global_step": 505660, "epoch": 3009} {"train_loss": -12.133365631103516, "global_step": 505661, "epoch": 3009} {"train_loss": -10.541851043701172, "global_step": 505662, "epoch": 3009} {"train_loss": -12.260395050048828, "global_step": 505663, "epoch": 3009} {"train_loss": -10.371586799621582, "global_step": 505664, "epoch": 3009} {"train_loss": -11.936906814575195, "global_step": 505665, "epoch": 3009} {"train_loss": -11.007272720336914, "global_step": 505666, "epoch": 3009} {"train_loss": -11.724367141723633, "global_step": 505667, "epoch": 3009} {"train_loss": -11.341148376464844, "global_step": 505668, "epoch": 3009} {"train_loss": -11.887451171875, "global_step": 505669, "epoch": 3009} {"train_loss": -11.69259262084961, "global_step": 505670, "epoch": 3009} {"train_loss": -11.786404609680176, "global_step": 505671, "epoch": 3009} {"train_loss": -12.210224151611328, "global_step": 505672, "epoch": 3009} {"train_loss": -11.633647918701172, "global_step": 505673, "epoch": 3009} {"train_loss": -12.607988357543945, "global_step": 505674, "epoch": 3009} {"train_loss": -11.499899864196777, "global_step": 505675, "epoch": 3009} {"train_loss": -12.337224006652832, "global_step": 505676, "epoch": 3009} {"train_loss": -11.739182472229004, "global_step": 505677, "epoch": 3009} {"train_loss": -12.50212574005127, "global_step": 505678, "epoch": 3009} {"train_loss": -11.786417478606815, "global_step": 505679, "epoch": 3009, "val_loss": 322457.78125} {"train_loss": -12.412925720214844, "global_step": 505680, "epoch": 3010} {"train_loss": -12.071062088012695, "global_step": 505681, "epoch": 3010} {"train_loss": -12.55327033996582, "global_step": 505682, "epoch": 3010} {"train_loss": -11.974357604980469, "global_step": 505683, "epoch": 3010} {"train_loss": -12.575891494750977, "global_step": 505684, "epoch": 3010} {"train_loss": -12.142019271850586, "global_step": 505685, "epoch": 3010} {"train_loss": -12.378549575805664, "global_step": 505686, "epoch": 3010} {"train_loss": -11.945406913757324, "global_step": 505687, "epoch": 3010} {"train_loss": -12.096739768981934, "global_step": 505688, "epoch": 3010} {"train_loss": -12.607975006103516, "global_step": 505689, "epoch": 3010} {"train_loss": -12.117002487182617, "global_step": 505690, "epoch": 3010} {"train_loss": -12.338800430297852, "global_step": 505691, "epoch": 3010} {"train_loss": -12.382301330566406, "global_step": 505692, "epoch": 3010} {"train_loss": -12.502609252929688, "global_step": 505693, "epoch": 3010} {"train_loss": -12.515256881713867, "global_step": 505694, "epoch": 3010} {"train_loss": -12.532060623168945, "global_step": 505695, "epoch": 3010} {"train_loss": -12.746115684509277, "global_step": 505696, "epoch": 3010} {"train_loss": -12.735429763793945, "global_step": 505697, "epoch": 3010} {"train_loss": -12.432172775268555, "global_step": 505698, "epoch": 3010} {"train_loss": -12.583837509155273, "global_step": 505699, "epoch": 3010} {"train_loss": -12.716550827026367, "global_step": 505700, "epoch": 3010} {"train_loss": -12.768500328063965, "global_step": 505701, "epoch": 3010} {"train_loss": -12.550309181213379, "global_step": 505702, "epoch": 3010} {"train_loss": -12.666463851928711, "global_step": 505703, "epoch": 3010} {"train_loss": -12.708708763122559, "global_step": 505704, "epoch": 3010} {"train_loss": -12.598772048950195, "global_step": 505705, "epoch": 3010} {"train_loss": -12.797985076904297, "global_step": 505706, "epoch": 3010} {"train_loss": -12.798702239990234, "global_step": 505707, "epoch": 3010} {"train_loss": -12.724160194396973, "global_step": 505708, "epoch": 3010} {"train_loss": -12.785905838012695, "global_step": 505709, "epoch": 3010} {"train_loss": -12.630623817443848, "global_step": 505710, "epoch": 3010} {"train_loss": -12.856629371643066, "global_step": 505711, "epoch": 3010} {"train_loss": -12.840323448181152, "global_step": 505712, "epoch": 3010} {"train_loss": -12.811657905578613, "global_step": 505713, "epoch": 3010} {"train_loss": -12.904918670654297, "global_step": 505714, "epoch": 3010} {"train_loss": -12.825580596923828, "global_step": 505715, "epoch": 3010} {"train_loss": -12.901358604431152, "global_step": 505716, "epoch": 3010} {"train_loss": -12.421528816223145, "global_step": 505717, "epoch": 3010} {"train_loss": -13.04426383972168, "global_step": 505718, "epoch": 3010} {"train_loss": -12.867512702941895, "global_step": 505719, "epoch": 3010} {"train_loss": -12.852856636047363, "global_step": 505720, "epoch": 3010} {"train_loss": -12.69017219543457, "global_step": 505721, "epoch": 3010} {"train_loss": -12.776275634765625, "global_step": 505722, "epoch": 3010} {"train_loss": -12.745842933654785, "global_step": 505723, "epoch": 3010} {"train_loss": -12.677675247192383, "global_step": 505724, "epoch": 3010} {"train_loss": -12.79067325592041, "global_step": 505725, "epoch": 3010} {"train_loss": -12.96636962890625, "global_step": 505726, "epoch": 3010} {"train_loss": -12.90429973602295, "global_step": 505727, "epoch": 3010} {"train_loss": -12.960746765136719, "global_step": 505728, "epoch": 3010} {"train_loss": -12.82705307006836, "global_step": 505729, "epoch": 3010} {"train_loss": -12.87446403503418, "global_step": 505730, "epoch": 3010} {"train_loss": -13.025680541992188, "global_step": 505731, "epoch": 3010} {"train_loss": -12.804346084594727, "global_step": 505732, "epoch": 3010} {"train_loss": -13.027691841125488, "global_step": 505733, "epoch": 3010} {"train_loss": -12.880380630493164, "global_step": 505734, "epoch": 3010} {"train_loss": -12.931434631347656, "global_step": 505735, "epoch": 3010} {"train_loss": -12.507821083068848, "global_step": 505736, "epoch": 3010} {"train_loss": -12.884382247924805, "global_step": 505737, "epoch": 3010} {"train_loss": -12.912105560302734, "global_step": 505738, "epoch": 3010} {"train_loss": -12.641797065734863, "global_step": 505739, "epoch": 3010} {"train_loss": -12.600664138793945, "global_step": 505740, "epoch": 3010} {"train_loss": -12.83007526397705, "global_step": 505741, "epoch": 3010} {"train_loss": -12.767671585083008, "global_step": 505742, "epoch": 3010} {"train_loss": -12.544134140014648, "global_step": 505743, "epoch": 3010} {"train_loss": -12.062274932861328, "global_step": 505744, "epoch": 3010} {"train_loss": -12.518584251403809, "global_step": 505745, "epoch": 3010} {"train_loss": -12.45810317993164, "global_step": 505746, "epoch": 3010} {"train_loss": -12.55605411529541, "global_step": 505747, "epoch": 3010} {"train_loss": -12.571832656860352, "global_step": 505748, "epoch": 3010} {"train_loss": -12.48501968383789, "global_step": 505749, "epoch": 3010} {"train_loss": -12.194486618041992, "global_step": 505750, "epoch": 3010} {"train_loss": -12.436897277832031, "global_step": 505751, "epoch": 3010} {"train_loss": -12.066073417663574, "global_step": 505752, "epoch": 3010} {"train_loss": -12.494704246520996, "global_step": 505753, "epoch": 3010} {"train_loss": -12.182086944580078, "global_step": 505754, "epoch": 3010} {"train_loss": -12.429901123046875, "global_step": 505755, "epoch": 3010} {"train_loss": -11.48788833618164, "global_step": 505756, "epoch": 3010} {"train_loss": -12.68326187133789, "global_step": 505757, "epoch": 3010} {"train_loss": -11.269601821899414, "global_step": 505758, "epoch": 3010} {"train_loss": -12.682568550109863, "global_step": 505759, "epoch": 3010} {"train_loss": -11.638710021972656, "global_step": 505760, "epoch": 3010} {"train_loss": -11.962408065795898, "global_step": 505761, "epoch": 3010} {"train_loss": -12.537775039672852, "global_step": 505762, "epoch": 3010} {"train_loss": -11.973498344421387, "global_step": 505763, "epoch": 3010} {"train_loss": -11.985815048217773, "global_step": 505764, "epoch": 3010} {"train_loss": -12.346986770629883, "global_step": 505765, "epoch": 3010} {"train_loss": -11.024415969848633, "global_step": 505766, "epoch": 3010} {"train_loss": -11.415358543395996, "global_step": 505767, "epoch": 3010} {"train_loss": -12.285581588745117, "global_step": 505768, "epoch": 3010} {"train_loss": -11.014864921569824, "global_step": 505769, "epoch": 3010} {"train_loss": -11.684212684631348, "global_step": 505770, "epoch": 3010} {"train_loss": -11.514979362487793, "global_step": 505771, "epoch": 3010} {"train_loss": -11.939247131347656, "global_step": 505772, "epoch": 3010} {"train_loss": -12.225606918334961, "global_step": 505773, "epoch": 3010} {"train_loss": -11.763360023498535, "global_step": 505774, "epoch": 3010} {"train_loss": -12.072912216186523, "global_step": 505775, "epoch": 3010} {"train_loss": -11.710886001586914, "global_step": 505776, "epoch": 3010} {"train_loss": -11.93284797668457, "global_step": 505777, "epoch": 3010} {"train_loss": -11.535258293151855, "global_step": 505778, "epoch": 3010} {"train_loss": -11.156569480895996, "global_step": 505779, "epoch": 3010} {"train_loss": -12.00532054901123, "global_step": 505780, "epoch": 3010} {"train_loss": -11.482718467712402, "global_step": 505781, "epoch": 3010} {"train_loss": -11.978598594665527, "global_step": 505782, "epoch": 3010} {"train_loss": -12.107481956481934, "global_step": 505783, "epoch": 3010} {"train_loss": -11.508686065673828, "global_step": 505784, "epoch": 3010} {"train_loss": -12.259810447692871, "global_step": 505785, "epoch": 3010} {"train_loss": -12.1357421875, "global_step": 505786, "epoch": 3010} {"train_loss": -11.962803840637207, "global_step": 505787, "epoch": 3010} {"train_loss": -12.057600021362305, "global_step": 505788, "epoch": 3010} {"train_loss": -12.132617950439453, "global_step": 505789, "epoch": 3010} {"train_loss": -12.043621063232422, "global_step": 505790, "epoch": 3010} {"train_loss": -12.793503761291504, "global_step": 505791, "epoch": 3010} {"train_loss": -12.17843246459961, "global_step": 505792, "epoch": 3010} {"train_loss": -12.262243270874023, "global_step": 505793, "epoch": 3010} {"train_loss": -12.35636043548584, "global_step": 505794, "epoch": 3010} {"train_loss": -12.217005729675293, "global_step": 505795, "epoch": 3010} {"train_loss": -12.592453956604004, "global_step": 505796, "epoch": 3010} {"train_loss": -12.3555269241333, "global_step": 505797, "epoch": 3010} {"train_loss": -12.752129554748535, "global_step": 505798, "epoch": 3010} {"train_loss": -12.650028228759766, "global_step": 505799, "epoch": 3010} {"train_loss": -12.439298629760742, "global_step": 505800, "epoch": 3010} {"train_loss": -12.206899642944336, "global_step": 505801, "epoch": 3010} {"train_loss": -12.352017402648926, "global_step": 505802, "epoch": 3010} {"train_loss": -12.280227661132812, "global_step": 505803, "epoch": 3010} {"train_loss": -12.294318199157715, "global_step": 505804, "epoch": 3010} {"train_loss": -12.532608032226562, "global_step": 505805, "epoch": 3010} {"train_loss": -12.150110244750977, "global_step": 505806, "epoch": 3010} {"train_loss": -12.391576766967773, "global_step": 505807, "epoch": 3010} {"train_loss": -12.860973358154297, "global_step": 505808, "epoch": 3010} {"train_loss": -12.334242820739746, "global_step": 505809, "epoch": 3010} {"train_loss": -12.673999786376953, "global_step": 505810, "epoch": 3010} {"train_loss": -12.353970527648926, "global_step": 505811, "epoch": 3010} {"train_loss": -12.389314651489258, "global_step": 505812, "epoch": 3010} {"train_loss": -12.337501525878906, "global_step": 505813, "epoch": 3010} {"train_loss": -12.630126953125, "global_step": 505814, "epoch": 3010} {"train_loss": -12.319192886352539, "global_step": 505815, "epoch": 3010} {"train_loss": -12.482322692871094, "global_step": 505816, "epoch": 3010} {"train_loss": -12.897367477416992, "global_step": 505817, "epoch": 3010} {"train_loss": -12.454122543334961, "global_step": 505818, "epoch": 3010} {"train_loss": -12.860450744628906, "global_step": 505819, "epoch": 3010} {"train_loss": -12.32916259765625, "global_step": 505820, "epoch": 3010} {"train_loss": -12.767620086669922, "global_step": 505821, "epoch": 3010} {"train_loss": -12.411916732788086, "global_step": 505822, "epoch": 3010} {"train_loss": -12.653881072998047, "global_step": 505823, "epoch": 3010} {"train_loss": -12.134552001953125, "global_step": 505824, "epoch": 3010} {"train_loss": -12.575995445251465, "global_step": 505825, "epoch": 3010} {"train_loss": -12.09923267364502, "global_step": 505826, "epoch": 3010} {"train_loss": -12.552419662475586, "global_step": 505827, "epoch": 3010} {"train_loss": -12.226667404174805, "global_step": 505828, "epoch": 3010} {"train_loss": -12.310242652893066, "global_step": 505829, "epoch": 3010} {"train_loss": -11.879467964172363, "global_step": 505830, "epoch": 3010} {"train_loss": -11.05257797241211, "global_step": 505831, "epoch": 3010} {"train_loss": -11.683935165405273, "global_step": 505832, "epoch": 3010} {"train_loss": -11.46707534790039, "global_step": 505833, "epoch": 3010} {"train_loss": -11.419346809387207, "global_step": 505834, "epoch": 3010} {"train_loss": -11.063567161560059, "global_step": 505835, "epoch": 3010} {"train_loss": -11.673922538757324, "global_step": 505836, "epoch": 3010} {"train_loss": -11.000497817993164, "global_step": 505837, "epoch": 3010} {"train_loss": -10.345800399780273, "global_step": 505838, "epoch": 3010} {"train_loss": -11.958972930908203, "global_step": 505839, "epoch": 3010} {"train_loss": -10.539379119873047, "global_step": 505840, "epoch": 3010} {"train_loss": -11.803735733032227, "global_step": 505841, "epoch": 3010} {"train_loss": -11.818039894104004, "global_step": 505842, "epoch": 3010} {"train_loss": -11.922882080078125, "global_step": 505843, "epoch": 3010} {"train_loss": -11.974274635314941, "global_step": 505844, "epoch": 3010} {"train_loss": -11.948553085327148, "global_step": 505845, "epoch": 3010} {"train_loss": -12.106146812438965, "global_step": 505846, "epoch": 3010} {"train_loss": -12.303623897688729, "global_step": 505847, "epoch": 3010, "val_loss": 322040.75, "train_action_mse_error": 1.1969733238220215} {"train_loss": -12.363183975219727, "global_step": 505848, "epoch": 3011} {"train_loss": -11.781610488891602, "global_step": 505849, "epoch": 3011} {"train_loss": -12.213399887084961, "global_step": 505850, "epoch": 3011} {"train_loss": -12.123570442199707, "global_step": 505851, "epoch": 3011} {"train_loss": -12.661821365356445, "global_step": 505852, "epoch": 3011} {"train_loss": -12.025869369506836, "global_step": 505853, "epoch": 3011} {"train_loss": -12.569141387939453, "global_step": 505854, "epoch": 3011} {"train_loss": -12.281164169311523, "global_step": 505855, "epoch": 3011} {"train_loss": -12.235858917236328, "global_step": 505856, "epoch": 3011} {"train_loss": -12.243927001953125, "global_step": 505857, "epoch": 3011} {"train_loss": -11.840595245361328, "global_step": 505858, "epoch": 3011} {"train_loss": -12.70794677734375, "global_step": 505859, "epoch": 3011} {"train_loss": -12.22514533996582, "global_step": 505860, "epoch": 3011} {"train_loss": -12.813822746276855, "global_step": 505861, "epoch": 3011} {"train_loss": -12.367993354797363, "global_step": 505862, "epoch": 3011} {"train_loss": -12.148955345153809, "global_step": 505863, "epoch": 3011} {"train_loss": -12.66661262512207, "global_step": 505864, "epoch": 3011} {"train_loss": -12.535409927368164, "global_step": 505865, "epoch": 3011} {"train_loss": -12.503173828125, "global_step": 505866, "epoch": 3011} {"train_loss": -12.883090019226074, "global_step": 505867, "epoch": 3011} {"train_loss": -12.593286514282227, "global_step": 505868, "epoch": 3011} {"train_loss": -12.685800552368164, "global_step": 505869, "epoch": 3011} {"train_loss": -12.49657154083252, "global_step": 505870, "epoch": 3011} {"train_loss": -12.305885314941406, "global_step": 505871, "epoch": 3011} {"train_loss": -12.290119171142578, "global_step": 505872, "epoch": 3011} {"train_loss": -12.409148216247559, "global_step": 505873, "epoch": 3011} {"train_loss": -12.462637901306152, "global_step": 505874, "epoch": 3011} {"train_loss": -12.761667251586914, "global_step": 505875, "epoch": 3011} {"train_loss": -12.550613403320312, "global_step": 505876, "epoch": 3011} {"train_loss": -12.484028816223145, "global_step": 505877, "epoch": 3011} {"train_loss": -12.824300765991211, "global_step": 505878, "epoch": 3011} {"train_loss": -12.514835357666016, "global_step": 505879, "epoch": 3011} {"train_loss": -12.906064987182617, "global_step": 505880, "epoch": 3011} {"train_loss": -12.788971900939941, "global_step": 505881, "epoch": 3011} {"train_loss": -12.644828796386719, "global_step": 505882, "epoch": 3011} {"train_loss": -12.872347831726074, "global_step": 505883, "epoch": 3011} {"train_loss": -12.310920715332031, "global_step": 505884, "epoch": 3011} {"train_loss": -12.840351104736328, "global_step": 505885, "epoch": 3011} {"train_loss": -12.402917861938477, "global_step": 505886, "epoch": 3011} {"train_loss": -12.487712860107422, "global_step": 505887, "epoch": 3011} {"train_loss": -12.653825759887695, "global_step": 505888, "epoch": 3011} {"train_loss": -12.52509880065918, "global_step": 505889, "epoch": 3011} {"train_loss": -12.609155654907227, "global_step": 505890, "epoch": 3011} {"train_loss": -12.493192672729492, "global_step": 505891, "epoch": 3011} {"train_loss": -12.232610702514648, "global_step": 505892, "epoch": 3011} {"train_loss": -12.553276062011719, "global_step": 505893, "epoch": 3011} {"train_loss": -12.585204124450684, "global_step": 505894, "epoch": 3011} {"train_loss": -12.466195106506348, "global_step": 505895, "epoch": 3011} {"train_loss": -12.154052734375, "global_step": 505896, "epoch": 3011} {"train_loss": -12.436332702636719, "global_step": 505897, "epoch": 3011} {"train_loss": -12.801180839538574, "global_step": 505898, "epoch": 3011} {"train_loss": -12.727899551391602, "global_step": 505899, "epoch": 3011} {"train_loss": -12.522957801818848, "global_step": 505900, "epoch": 3011} {"train_loss": -12.679339408874512, "global_step": 505901, "epoch": 3011} {"train_loss": -12.422016143798828, "global_step": 505902, "epoch": 3011} {"train_loss": -12.956184387207031, "global_step": 505903, "epoch": 3011} {"train_loss": -12.768927574157715, "global_step": 505904, "epoch": 3011} {"train_loss": -12.745664596557617, "global_step": 505905, "epoch": 3011} {"train_loss": -12.938592910766602, "global_step": 505906, "epoch": 3011} {"train_loss": -12.509479522705078, "global_step": 505907, "epoch": 3011} {"train_loss": -12.804903030395508, "global_step": 505908, "epoch": 3011} {"train_loss": -12.655221939086914, "global_step": 505909, "epoch": 3011} {"train_loss": -12.536432266235352, "global_step": 505910, "epoch": 3011} {"train_loss": -12.679561614990234, "global_step": 505911, "epoch": 3011} {"train_loss": -12.821392059326172, "global_step": 505912, "epoch": 3011} {"train_loss": -12.53687858581543, "global_step": 505913, "epoch": 3011} {"train_loss": -13.158567428588867, "global_step": 505914, "epoch": 3011} {"train_loss": -12.933557510375977, "global_step": 505915, "epoch": 3011} {"train_loss": -13.028696060180664, "global_step": 505916, "epoch": 3011} {"train_loss": -12.919120788574219, "global_step": 505917, "epoch": 3011} {"train_loss": -13.032962799072266, "global_step": 505918, "epoch": 3011} {"train_loss": -13.12765121459961, "global_step": 505919, "epoch": 3011} {"train_loss": -12.963457107543945, "global_step": 505920, "epoch": 3011} {"train_loss": -13.109968185424805, "global_step": 505921, "epoch": 3011} {"train_loss": -12.9393949508667, "global_step": 505922, "epoch": 3011} {"train_loss": -13.09318733215332, "global_step": 505923, "epoch": 3011} {"train_loss": -12.871770858764648, "global_step": 505924, "epoch": 3011} {"train_loss": -13.03145980834961, "global_step": 505925, "epoch": 3011} {"train_loss": -13.086688995361328, "global_step": 505926, "epoch": 3011} {"train_loss": -12.991146087646484, "global_step": 505927, "epoch": 3011} {"train_loss": -13.02169418334961, "global_step": 505928, "epoch": 3011} {"train_loss": -13.03084945678711, "global_step": 505929, "epoch": 3011} {"train_loss": -13.05134391784668, "global_step": 505930, "epoch": 3011} {"train_loss": -13.056394577026367, "global_step": 505931, "epoch": 3011} {"train_loss": -12.891080856323242, "global_step": 505932, "epoch": 3011} {"train_loss": -13.098210334777832, "global_step": 505933, "epoch": 3011} {"train_loss": -13.020706176757812, "global_step": 505934, "epoch": 3011} {"train_loss": -13.113665580749512, "global_step": 505935, "epoch": 3011} {"train_loss": -13.131657600402832, "global_step": 505936, "epoch": 3011} {"train_loss": -13.241230964660645, "global_step": 505937, "epoch": 3011} {"train_loss": -12.94999885559082, "global_step": 505938, "epoch": 3011} {"train_loss": -12.91921615600586, "global_step": 505939, "epoch": 3011} {"train_loss": -13.069679260253906, "global_step": 505940, "epoch": 3011} {"train_loss": -13.12291431427002, "global_step": 505941, "epoch": 3011} {"train_loss": -13.04069709777832, "global_step": 505942, "epoch": 3011} {"train_loss": -12.925924301147461, "global_step": 505943, "epoch": 3011} {"train_loss": -12.734855651855469, "global_step": 505944, "epoch": 3011} {"train_loss": -12.739410400390625, "global_step": 505945, "epoch": 3011} {"train_loss": -13.067201614379883, "global_step": 505946, "epoch": 3011} {"train_loss": -12.869346618652344, "global_step": 505947, "epoch": 3011} {"train_loss": -13.107240676879883, "global_step": 505948, "epoch": 3011} {"train_loss": -13.260114669799805, "global_step": 505949, "epoch": 3011} {"train_loss": -13.083856582641602, "global_step": 505950, "epoch": 3011} {"train_loss": -12.854013442993164, "global_step": 505951, "epoch": 3011} {"train_loss": -12.798900604248047, "global_step": 505952, "epoch": 3011} {"train_loss": -12.61001968383789, "global_step": 505953, "epoch": 3011} {"train_loss": -12.870302200317383, "global_step": 505954, "epoch": 3011} {"train_loss": -12.833752632141113, "global_step": 505955, "epoch": 3011} {"train_loss": -12.110482215881348, "global_step": 505956, "epoch": 3011} {"train_loss": -12.033432006835938, "global_step": 505957, "epoch": 3011} {"train_loss": -11.78355884552002, "global_step": 505958, "epoch": 3011} {"train_loss": -11.938066482543945, "global_step": 505959, "epoch": 3011} {"train_loss": -12.345756530761719, "global_step": 505960, "epoch": 3011} {"train_loss": -11.992301940917969, "global_step": 505961, "epoch": 3011} {"train_loss": -10.162162780761719, "global_step": 505962, "epoch": 3011} {"train_loss": -11.541851043701172, "global_step": 505963, "epoch": 3011} {"train_loss": -11.481277465820312, "global_step": 505964, "epoch": 3011} {"train_loss": -12.2210693359375, "global_step": 505965, "epoch": 3011} {"train_loss": -11.403785705566406, "global_step": 505966, "epoch": 3011} {"train_loss": -12.311870574951172, "global_step": 505967, "epoch": 3011} {"train_loss": -11.194721221923828, "global_step": 505968, "epoch": 3011} {"train_loss": -11.911184310913086, "global_step": 505969, "epoch": 3011} {"train_loss": -12.019023895263672, "global_step": 505970, "epoch": 3011} {"train_loss": -9.4461669921875, "global_step": 505971, "epoch": 3011} {"train_loss": -11.367639541625977, "global_step": 505972, "epoch": 3011} {"train_loss": -11.319511413574219, "global_step": 505973, "epoch": 3011} {"train_loss": -9.844666481018066, "global_step": 505974, "epoch": 3011} {"train_loss": -9.369546890258789, "global_step": 505975, "epoch": 3011} {"train_loss": -9.741077423095703, "global_step": 505976, "epoch": 3011} {"train_loss": -7.084168434143066, "global_step": 505977, "epoch": 3011} {"train_loss": -10.74835205078125, "global_step": 505978, "epoch": 3011} {"train_loss": -9.285682678222656, "global_step": 505979, "epoch": 3011} {"train_loss": -10.459144592285156, "global_step": 505980, "epoch": 3011} {"train_loss": -10.294124603271484, "global_step": 505981, "epoch": 3011} {"train_loss": -10.429916381835938, "global_step": 505982, "epoch": 3011} {"train_loss": -10.712568283081055, "global_step": 505983, "epoch": 3011} {"train_loss": -9.550524711608887, "global_step": 505984, "epoch": 3011} {"train_loss": -10.682878494262695, "global_step": 505985, "epoch": 3011} {"train_loss": -10.103691101074219, "global_step": 505986, "epoch": 3011} {"train_loss": -10.88835334777832, "global_step": 505987, "epoch": 3011} {"train_loss": -11.528468132019043, "global_step": 505988, "epoch": 3011} {"train_loss": -11.04604721069336, "global_step": 505989, "epoch": 3011} {"train_loss": -10.35877799987793, "global_step": 505990, "epoch": 3011} {"train_loss": -10.670049667358398, "global_step": 505991, "epoch": 3011} {"train_loss": -11.498791694641113, "global_step": 505992, "epoch": 3011} {"train_loss": -10.883030891418457, "global_step": 505993, "epoch": 3011} {"train_loss": -11.071195602416992, "global_step": 505994, "epoch": 3011} {"train_loss": -11.832674026489258, "global_step": 505995, "epoch": 3011} {"train_loss": -10.664388656616211, "global_step": 505996, "epoch": 3011} {"train_loss": -11.51754093170166, "global_step": 505997, "epoch": 3011} {"train_loss": -10.666943550109863, "global_step": 505998, "epoch": 3011} {"train_loss": -11.257390975952148, "global_step": 505999, "epoch": 3011} {"train_loss": -11.184612274169922, "global_step": 506000, "epoch": 3011} {"train_loss": -11.42436408996582, "global_step": 506001, "epoch": 3011} {"train_loss": -11.780752182006836, "global_step": 506002, "epoch": 3011} {"train_loss": -11.178248405456543, "global_step": 506003, "epoch": 3011} {"train_loss": -11.903826713562012, "global_step": 506004, "epoch": 3011} {"train_loss": -11.320266723632812, "global_step": 506005, "epoch": 3011} {"train_loss": -11.118208885192871, "global_step": 506006, "epoch": 3011} {"train_loss": -12.008070945739746, "global_step": 506007, "epoch": 3011} {"train_loss": -11.316730499267578, "global_step": 506008, "epoch": 3011} {"train_loss": -12.138578414916992, "global_step": 506009, "epoch": 3011} {"train_loss": -11.809089660644531, "global_step": 506010, "epoch": 3011} {"train_loss": -12.176788330078125, "global_step": 506011, "epoch": 3011} {"train_loss": -11.957450866699219, "global_step": 506012, "epoch": 3011} {"train_loss": -11.78836727142334, "global_step": 506013, "epoch": 3011} {"train_loss": -11.95750617980957, "global_step": 506014, "epoch": 3011} {"train_loss": -12.145597117287773, "global_step": 506015, "epoch": 3011, "val_loss": 316321.9375} {"train_loss": -11.960786819458008, "global_step": 506016, "epoch": 3012} {"train_loss": -12.145746231079102, "global_step": 506017, "epoch": 3012} {"train_loss": -11.991100311279297, "global_step": 506018, "epoch": 3012} {"train_loss": -12.389988899230957, "global_step": 506019, "epoch": 3012} {"train_loss": -12.45858383178711, "global_step": 506020, "epoch": 3012} {"train_loss": -12.054813385009766, "global_step": 506021, "epoch": 3012} {"train_loss": -12.429239273071289, "global_step": 506022, "epoch": 3012} {"train_loss": -12.135318756103516, "global_step": 506023, "epoch": 3012} {"train_loss": -12.317789077758789, "global_step": 506024, "epoch": 3012} {"train_loss": -12.30373477935791, "global_step": 506025, "epoch": 3012} {"train_loss": -12.667016983032227, "global_step": 506026, "epoch": 3012} {"train_loss": -12.341060638427734, "global_step": 506027, "epoch": 3012} {"train_loss": -12.492045402526855, "global_step": 506028, "epoch": 3012} {"train_loss": -12.535703659057617, "global_step": 506029, "epoch": 3012} {"train_loss": -12.53598403930664, "global_step": 506030, "epoch": 3012} {"train_loss": -12.573123931884766, "global_step": 506031, "epoch": 3012} {"train_loss": -12.531059265136719, "global_step": 506032, "epoch": 3012} {"train_loss": -12.57916259765625, "global_step": 506033, "epoch": 3012} {"train_loss": -12.60677433013916, "global_step": 506034, "epoch": 3012} {"train_loss": -12.651352882385254, "global_step": 506035, "epoch": 3012} {"train_loss": -12.549856185913086, "global_step": 506036, "epoch": 3012} {"train_loss": -12.482904434204102, "global_step": 506037, "epoch": 3012} {"train_loss": -12.802444458007812, "global_step": 506038, "epoch": 3012} {"train_loss": -12.660433769226074, "global_step": 506039, "epoch": 3012} {"train_loss": -12.731799125671387, "global_step": 506040, "epoch": 3012} {"train_loss": -12.808685302734375, "global_step": 506041, "epoch": 3012} {"train_loss": -12.549153327941895, "global_step": 506042, "epoch": 3012} {"train_loss": -12.795368194580078, "global_step": 506043, "epoch": 3012} {"train_loss": -12.799915313720703, "global_step": 506044, "epoch": 3012} {"train_loss": -12.665157318115234, "global_step": 506045, "epoch": 3012} {"train_loss": -12.797469139099121, "global_step": 506046, "epoch": 3012} {"train_loss": -12.707805633544922, "global_step": 506047, "epoch": 3012} {"train_loss": -12.88433837890625, "global_step": 506048, "epoch": 3012} {"train_loss": -12.422359466552734, "global_step": 506049, "epoch": 3012} {"train_loss": -12.720706939697266, "global_step": 506050, "epoch": 3012} {"train_loss": -12.648530006408691, "global_step": 506051, "epoch": 3012} {"train_loss": -12.715038299560547, "global_step": 506052, "epoch": 3012} {"train_loss": -12.675881385803223, "global_step": 506053, "epoch": 3012} {"train_loss": -12.029378890991211, "global_step": 506054, "epoch": 3012} {"train_loss": -12.831136703491211, "global_step": 506055, "epoch": 3012} {"train_loss": -12.479828834533691, "global_step": 506056, "epoch": 3012} {"train_loss": -12.780461311340332, "global_step": 506057, "epoch": 3012} {"train_loss": -12.439628601074219, "global_step": 506058, "epoch": 3012} {"train_loss": -12.372644424438477, "global_step": 506059, "epoch": 3012} {"train_loss": -12.742618560791016, "global_step": 506060, "epoch": 3012} {"train_loss": -12.065807342529297, "global_step": 506061, "epoch": 3012} {"train_loss": -12.216705322265625, "global_step": 506062, "epoch": 3012} {"train_loss": -12.658681869506836, "global_step": 506063, "epoch": 3012} {"train_loss": -11.758932113647461, "global_step": 506064, "epoch": 3012} {"train_loss": -12.851396560668945, "global_step": 506065, "epoch": 3012} {"train_loss": -12.481273651123047, "global_step": 506066, "epoch": 3012} {"train_loss": -12.445019721984863, "global_step": 506067, "epoch": 3012} {"train_loss": -12.820585250854492, "global_step": 506068, "epoch": 3012} {"train_loss": -12.445850372314453, "global_step": 506069, "epoch": 3012} {"train_loss": -12.668388366699219, "global_step": 506070, "epoch": 3012} {"train_loss": -12.512264251708984, "global_step": 506071, "epoch": 3012} {"train_loss": -12.05624771118164, "global_step": 506072, "epoch": 3012} {"train_loss": -12.678987503051758, "global_step": 506073, "epoch": 3012} {"train_loss": -11.995508193969727, "global_step": 506074, "epoch": 3012} {"train_loss": -12.314593315124512, "global_step": 506075, "epoch": 3012} {"train_loss": -12.512622833251953, "global_step": 506076, "epoch": 3012} {"train_loss": -11.923131942749023, "global_step": 506077, "epoch": 3012} {"train_loss": -12.405664443969727, "global_step": 506078, "epoch": 3012} {"train_loss": -12.419042587280273, "global_step": 506079, "epoch": 3012} {"train_loss": -12.043685913085938, "global_step": 506080, "epoch": 3012} {"train_loss": -12.651468276977539, "global_step": 506081, "epoch": 3012} {"train_loss": -12.240901947021484, "global_step": 506082, "epoch": 3012} {"train_loss": -12.533060073852539, "global_step": 506083, "epoch": 3012} {"train_loss": -12.350032806396484, "global_step": 506084, "epoch": 3012} {"train_loss": -12.648320198059082, "global_step": 506085, "epoch": 3012} {"train_loss": -12.438361167907715, "global_step": 506086, "epoch": 3012} {"train_loss": -12.554668426513672, "global_step": 506087, "epoch": 3012} {"train_loss": -12.098474502563477, "global_step": 506088, "epoch": 3012} {"train_loss": -12.630697250366211, "global_step": 506089, "epoch": 3012} {"train_loss": -12.059865951538086, "global_step": 506090, "epoch": 3012} {"train_loss": -12.410351753234863, "global_step": 506091, "epoch": 3012} {"train_loss": -12.858283996582031, "global_step": 506092, "epoch": 3012} {"train_loss": -12.559683799743652, "global_step": 506093, "epoch": 3012} {"train_loss": -12.462921142578125, "global_step": 506094, "epoch": 3012} {"train_loss": -12.669649124145508, "global_step": 506095, "epoch": 3012} {"train_loss": -12.158099174499512, "global_step": 506096, "epoch": 3012} {"train_loss": -12.441025733947754, "global_step": 506097, "epoch": 3012} {"train_loss": -12.717559814453125, "global_step": 506098, "epoch": 3012} {"train_loss": -12.456011772155762, "global_step": 506099, "epoch": 3012} {"train_loss": -12.626848220825195, "global_step": 506100, "epoch": 3012} {"train_loss": -12.170404434204102, "global_step": 506101, "epoch": 3012} {"train_loss": -12.396907806396484, "global_step": 506102, "epoch": 3012} {"train_loss": -11.204916000366211, "global_step": 506103, "epoch": 3012} {"train_loss": -12.814567565917969, "global_step": 506104, "epoch": 3012} {"train_loss": -12.134689331054688, "global_step": 506105, "epoch": 3012} {"train_loss": -12.0933256149292, "global_step": 506106, "epoch": 3012} {"train_loss": -11.820257186889648, "global_step": 506107, "epoch": 3012} {"train_loss": -12.458233833312988, "global_step": 506108, "epoch": 3012} {"train_loss": -12.185734748840332, "global_step": 506109, "epoch": 3012} {"train_loss": -12.075132369995117, "global_step": 506110, "epoch": 3012} {"train_loss": -11.831941604614258, "global_step": 506111, "epoch": 3012} {"train_loss": -12.276508331298828, "global_step": 506112, "epoch": 3012} {"train_loss": -12.468839645385742, "global_step": 506113, "epoch": 3012} {"train_loss": -12.213966369628906, "global_step": 506114, "epoch": 3012} {"train_loss": -12.533742904663086, "global_step": 506115, "epoch": 3012} {"train_loss": -12.078503608703613, "global_step": 506116, "epoch": 3012} {"train_loss": -12.537042617797852, "global_step": 506117, "epoch": 3012} {"train_loss": -11.810091972351074, "global_step": 506118, "epoch": 3012} {"train_loss": -12.522066116333008, "global_step": 506119, "epoch": 3012} {"train_loss": -12.100960731506348, "global_step": 506120, "epoch": 3012} {"train_loss": -11.573125839233398, "global_step": 506121, "epoch": 3012} {"train_loss": -12.716510772705078, "global_step": 506122, "epoch": 3012} {"train_loss": -12.034687042236328, "global_step": 506123, "epoch": 3012} {"train_loss": -12.317429542541504, "global_step": 506124, "epoch": 3012} {"train_loss": -12.751184463500977, "global_step": 506125, "epoch": 3012} {"train_loss": -12.01534366607666, "global_step": 506126, "epoch": 3012} {"train_loss": -12.80233383178711, "global_step": 506127, "epoch": 3012} {"train_loss": -12.495777130126953, "global_step": 506128, "epoch": 3012} {"train_loss": -12.77457332611084, "global_step": 506129, "epoch": 3012} {"train_loss": -12.657796859741211, "global_step": 506130, "epoch": 3012} {"train_loss": -11.695211410522461, "global_step": 506131, "epoch": 3012} {"train_loss": -12.747601509094238, "global_step": 506132, "epoch": 3012} {"train_loss": -11.727287292480469, "global_step": 506133, "epoch": 3012} {"train_loss": -12.779195785522461, "global_step": 506134, "epoch": 3012} {"train_loss": -12.260103225708008, "global_step": 506135, "epoch": 3012} {"train_loss": -12.395156860351562, "global_step": 506136, "epoch": 3012} {"train_loss": -11.850322723388672, "global_step": 506137, "epoch": 3012} {"train_loss": -11.785646438598633, "global_step": 506138, "epoch": 3012} {"train_loss": -12.804615020751953, "global_step": 506139, "epoch": 3012} {"train_loss": -11.811656951904297, "global_step": 506140, "epoch": 3012} {"train_loss": -12.009950637817383, "global_step": 506141, "epoch": 3012} {"train_loss": -11.802001953125, "global_step": 506142, "epoch": 3012} {"train_loss": -11.66064739227295, "global_step": 506143, "epoch": 3012} {"train_loss": -11.498157501220703, "global_step": 506144, "epoch": 3012} {"train_loss": -11.185978889465332, "global_step": 506145, "epoch": 3012} {"train_loss": -11.726372718811035, "global_step": 506146, "epoch": 3012} {"train_loss": -11.617979049682617, "global_step": 506147, "epoch": 3012} {"train_loss": -10.832240104675293, "global_step": 506148, "epoch": 3012} {"train_loss": -12.51693344116211, "global_step": 506149, "epoch": 3012} {"train_loss": -10.777586936950684, "global_step": 506150, "epoch": 3012} {"train_loss": -11.358278274536133, "global_step": 506151, "epoch": 3012} {"train_loss": -12.356786727905273, "global_step": 506152, "epoch": 3012} {"train_loss": -11.232465744018555, "global_step": 506153, "epoch": 3012} {"train_loss": -11.818758010864258, "global_step": 506154, "epoch": 3012} {"train_loss": -11.216751098632812, "global_step": 506155, "epoch": 3012} {"train_loss": -10.639607429504395, "global_step": 506156, "epoch": 3012} {"train_loss": -11.071596145629883, "global_step": 506157, "epoch": 3012} {"train_loss": -10.100997924804688, "global_step": 506158, "epoch": 3012} {"train_loss": -10.085348129272461, "global_step": 506159, "epoch": 3012} {"train_loss": -11.026620864868164, "global_step": 506160, "epoch": 3012} {"train_loss": -10.995586395263672, "global_step": 506161, "epoch": 3012} {"train_loss": -10.43851089477539, "global_step": 506162, "epoch": 3012} {"train_loss": -10.046183586120605, "global_step": 506163, "epoch": 3012} {"train_loss": -11.329659461975098, "global_step": 506164, "epoch": 3012} {"train_loss": -10.155477523803711, "global_step": 506165, "epoch": 3012} {"train_loss": -9.099250793457031, "global_step": 506166, "epoch": 3012} {"train_loss": -11.057951927185059, "global_step": 506167, "epoch": 3012} {"train_loss": -10.27964973449707, "global_step": 506168, "epoch": 3012} {"train_loss": -10.255064964294434, "global_step": 506169, "epoch": 3012} {"train_loss": -10.523147583007812, "global_step": 506170, "epoch": 3012} {"train_loss": -12.26994800567627, "global_step": 506171, "epoch": 3012} {"train_loss": -10.746590614318848, "global_step": 506172, "epoch": 3012} {"train_loss": -11.748971939086914, "global_step": 506173, "epoch": 3012} {"train_loss": -11.906773567199707, "global_step": 506174, "epoch": 3012} {"train_loss": -11.98816967010498, "global_step": 506175, "epoch": 3012} {"train_loss": -12.069708824157715, "global_step": 506176, "epoch": 3012} {"train_loss": -12.049359321594238, "global_step": 506177, "epoch": 3012} {"train_loss": -11.47573184967041, "global_step": 506178, "epoch": 3012} {"train_loss": -11.512763977050781, "global_step": 506179, "epoch": 3012} {"train_loss": -11.754493713378906, "global_step": 506180, "epoch": 3012} {"train_loss": -10.699723243713379, "global_step": 506181, "epoch": 3012} {"train_loss": -10.684919357299805, "global_step": 506182, "epoch": 3012} {"train_loss": -12.09084527265458, "global_step": 506183, "epoch": 3012, "val_loss": 315194.59375} {"train_loss": -11.004668235778809, "global_step": 506184, "epoch": 3013} {"train_loss": -10.849987030029297, "global_step": 506185, "epoch": 3013} {"train_loss": -11.519644737243652, "global_step": 506186, "epoch": 3013} {"train_loss": -11.315669059753418, "global_step": 506187, "epoch": 3013} {"train_loss": -11.206884384155273, "global_step": 506188, "epoch": 3013} {"train_loss": -12.186670303344727, "global_step": 506189, "epoch": 3013} {"train_loss": -11.703344345092773, "global_step": 506190, "epoch": 3013} {"train_loss": -11.474987983703613, "global_step": 506191, "epoch": 3013} {"train_loss": -12.286656379699707, "global_step": 506192, "epoch": 3013} {"train_loss": -11.800968170166016, "global_step": 506193, "epoch": 3013} {"train_loss": -12.048453330993652, "global_step": 506194, "epoch": 3013} {"train_loss": -11.905022621154785, "global_step": 506195, "epoch": 3013} {"train_loss": -11.697883605957031, "global_step": 506196, "epoch": 3013} {"train_loss": -12.008971214294434, "global_step": 506197, "epoch": 3013} {"train_loss": -11.88862419128418, "global_step": 506198, "epoch": 3013} {"train_loss": -12.013315200805664, "global_step": 506199, "epoch": 3013} {"train_loss": -11.909467697143555, "global_step": 506200, "epoch": 3013} {"train_loss": -12.000421524047852, "global_step": 506201, "epoch": 3013} {"train_loss": -11.984914779663086, "global_step": 506202, "epoch": 3013} {"train_loss": -11.650223731994629, "global_step": 506203, "epoch": 3013} {"train_loss": -11.984428405761719, "global_step": 506204, "epoch": 3013} {"train_loss": -11.81522274017334, "global_step": 506205, "epoch": 3013} {"train_loss": -11.801968574523926, "global_step": 506206, "epoch": 3013} {"train_loss": -12.37051010131836, "global_step": 506207, "epoch": 3013} {"train_loss": -11.84718132019043, "global_step": 506208, "epoch": 3013} {"train_loss": -11.882740020751953, "global_step": 506209, "epoch": 3013} {"train_loss": -12.566736221313477, "global_step": 506210, "epoch": 3013} {"train_loss": -11.93941593170166, "global_step": 506211, "epoch": 3013} {"train_loss": -12.501972198486328, "global_step": 506212, "epoch": 3013} {"train_loss": -11.876504898071289, "global_step": 506213, "epoch": 3013} {"train_loss": -12.229464530944824, "global_step": 506214, "epoch": 3013} {"train_loss": -11.755010604858398, "global_step": 506215, "epoch": 3013} {"train_loss": -11.930315017700195, "global_step": 506216, "epoch": 3013} {"train_loss": -12.068411827087402, "global_step": 506217, "epoch": 3013} {"train_loss": -12.010581970214844, "global_step": 506218, "epoch": 3013} {"train_loss": -12.281227111816406, "global_step": 506219, "epoch": 3013} {"train_loss": -12.218101501464844, "global_step": 506220, "epoch": 3013} {"train_loss": -11.85904312133789, "global_step": 506221, "epoch": 3013} {"train_loss": -11.925779342651367, "global_step": 506222, "epoch": 3013} {"train_loss": -12.295506477355957, "global_step": 506223, "epoch": 3013} {"train_loss": -12.079521179199219, "global_step": 506224, "epoch": 3013} {"train_loss": -12.184610366821289, "global_step": 506225, "epoch": 3013} {"train_loss": -12.136563301086426, "global_step": 506226, "epoch": 3013} {"train_loss": -12.06181812286377, "global_step": 506227, "epoch": 3013} {"train_loss": -12.633342742919922, "global_step": 506228, "epoch": 3013} {"train_loss": -12.12514591217041, "global_step": 506229, "epoch": 3013} {"train_loss": -12.339229583740234, "global_step": 506230, "epoch": 3013} {"train_loss": -12.331812858581543, "global_step": 506231, "epoch": 3013} {"train_loss": -12.60806655883789, "global_step": 506232, "epoch": 3013} {"train_loss": -12.555242538452148, "global_step": 506233, "epoch": 3013} {"train_loss": -12.507640838623047, "global_step": 506234, "epoch": 3013} {"train_loss": -12.662664413452148, "global_step": 506235, "epoch": 3013} {"train_loss": -12.49995231628418, "global_step": 506236, "epoch": 3013} {"train_loss": -12.602099418640137, "global_step": 506237, "epoch": 3013} {"train_loss": -12.436030387878418, "global_step": 506238, "epoch": 3013} {"train_loss": -12.494951248168945, "global_step": 506239, "epoch": 3013} {"train_loss": -12.466631889343262, "global_step": 506240, "epoch": 3013} {"train_loss": -12.660661697387695, "global_step": 506241, "epoch": 3013} {"train_loss": -12.563434600830078, "global_step": 506242, "epoch": 3013} {"train_loss": -12.822006225585938, "global_step": 506243, "epoch": 3013} {"train_loss": -12.722064971923828, "global_step": 506244, "epoch": 3013} {"train_loss": -12.618099212646484, "global_step": 506245, "epoch": 3013} {"train_loss": -12.839119911193848, "global_step": 506246, "epoch": 3013} {"train_loss": -12.536503791809082, "global_step": 506247, "epoch": 3013} {"train_loss": -12.721447944641113, "global_step": 506248, "epoch": 3013} {"train_loss": -12.573668479919434, "global_step": 506249, "epoch": 3013} {"train_loss": -12.458802223205566, "global_step": 506250, "epoch": 3013} {"train_loss": -12.398880004882812, "global_step": 506251, "epoch": 3013} {"train_loss": -12.456343650817871, "global_step": 506252, "epoch": 3013} {"train_loss": -12.166910171508789, "global_step": 506253, "epoch": 3013} {"train_loss": -12.695013046264648, "global_step": 506254, "epoch": 3013} {"train_loss": -12.305706977844238, "global_step": 506255, "epoch": 3013} {"train_loss": -12.473600387573242, "global_step": 506256, "epoch": 3013} {"train_loss": -12.501920700073242, "global_step": 506257, "epoch": 3013} {"train_loss": -12.352783203125, "global_step": 506258, "epoch": 3013} {"train_loss": -12.841303825378418, "global_step": 506259, "epoch": 3013} {"train_loss": -12.483627319335938, "global_step": 506260, "epoch": 3013} {"train_loss": -12.504251480102539, "global_step": 506261, "epoch": 3013} {"train_loss": -12.724447250366211, "global_step": 506262, "epoch": 3013} {"train_loss": -12.253081321716309, "global_step": 506263, "epoch": 3013} {"train_loss": -12.270807266235352, "global_step": 506264, "epoch": 3013} {"train_loss": -12.692049980163574, "global_step": 506265, "epoch": 3013} {"train_loss": -12.390714645385742, "global_step": 506266, "epoch": 3013} {"train_loss": -12.627148628234863, "global_step": 506267, "epoch": 3013} {"train_loss": -12.5482816696167, "global_step": 506268, "epoch": 3013} {"train_loss": -12.393428802490234, "global_step": 506269, "epoch": 3013} {"train_loss": -12.934470176696777, "global_step": 506270, "epoch": 3013} {"train_loss": -12.56859016418457, "global_step": 506271, "epoch": 3013} {"train_loss": -12.704269409179688, "global_step": 506272, "epoch": 3013} {"train_loss": -12.774311065673828, "global_step": 506273, "epoch": 3013} {"train_loss": -12.722753524780273, "global_step": 506274, "epoch": 3013} {"train_loss": -12.709222793579102, "global_step": 506275, "epoch": 3013} {"train_loss": -12.893623352050781, "global_step": 506276, "epoch": 3013} {"train_loss": -12.626773834228516, "global_step": 506277, "epoch": 3013} {"train_loss": -12.917158126831055, "global_step": 506278, "epoch": 3013} {"train_loss": -12.63105583190918, "global_step": 506279, "epoch": 3013} {"train_loss": -12.696972846984863, "global_step": 506280, "epoch": 3013} {"train_loss": -13.006219863891602, "global_step": 506281, "epoch": 3013} {"train_loss": -12.759475708007812, "global_step": 506282, "epoch": 3013} {"train_loss": -12.832240104675293, "global_step": 506283, "epoch": 3013} {"train_loss": -13.042510986328125, "global_step": 506284, "epoch": 3013} {"train_loss": -12.828417778015137, "global_step": 506285, "epoch": 3013} {"train_loss": -12.920622825622559, "global_step": 506286, "epoch": 3013} {"train_loss": -12.876161575317383, "global_step": 506287, "epoch": 3013} {"train_loss": -12.604108810424805, "global_step": 506288, "epoch": 3013} {"train_loss": -12.94497299194336, "global_step": 506289, "epoch": 3013} {"train_loss": -12.754655838012695, "global_step": 506290, "epoch": 3013} {"train_loss": -12.939325332641602, "global_step": 506291, "epoch": 3013} {"train_loss": -12.907562255859375, "global_step": 506292, "epoch": 3013} {"train_loss": -13.037914276123047, "global_step": 506293, "epoch": 3013} {"train_loss": -13.01059627532959, "global_step": 506294, "epoch": 3013} {"train_loss": -12.912477493286133, "global_step": 506295, "epoch": 3013} {"train_loss": -12.89859676361084, "global_step": 506296, "epoch": 3013} {"train_loss": -12.717123031616211, "global_step": 506297, "epoch": 3013} {"train_loss": -13.118905067443848, "global_step": 506298, "epoch": 3013} {"train_loss": -12.964345932006836, "global_step": 506299, "epoch": 3013} {"train_loss": -12.794788360595703, "global_step": 506300, "epoch": 3013} {"train_loss": -13.043120384216309, "global_step": 506301, "epoch": 3013} {"train_loss": -12.496397972106934, "global_step": 506302, "epoch": 3013} {"train_loss": -12.645203590393066, "global_step": 506303, "epoch": 3013} {"train_loss": -12.861114501953125, "global_step": 506304, "epoch": 3013} {"train_loss": -12.598672866821289, "global_step": 506305, "epoch": 3013} {"train_loss": -12.807212829589844, "global_step": 506306, "epoch": 3013} {"train_loss": -13.04954719543457, "global_step": 506307, "epoch": 3013} {"train_loss": -12.575216293334961, "global_step": 506308, "epoch": 3013} {"train_loss": -12.487910270690918, "global_step": 506309, "epoch": 3013} {"train_loss": -13.06209945678711, "global_step": 506310, "epoch": 3013} {"train_loss": -12.598922729492188, "global_step": 506311, "epoch": 3013} {"train_loss": -12.670209884643555, "global_step": 506312, "epoch": 3013} {"train_loss": -12.862732887268066, "global_step": 506313, "epoch": 3013} {"train_loss": -12.829024314880371, "global_step": 506314, "epoch": 3013} {"train_loss": -12.647520065307617, "global_step": 506315, "epoch": 3013} {"train_loss": -12.765169143676758, "global_step": 506316, "epoch": 3013} {"train_loss": -12.962066650390625, "global_step": 506317, "epoch": 3013} {"train_loss": -12.789295196533203, "global_step": 506318, "epoch": 3013} {"train_loss": -12.648720741271973, "global_step": 506319, "epoch": 3013} {"train_loss": -12.611663818359375, "global_step": 506320, "epoch": 3013} {"train_loss": -12.867659568786621, "global_step": 506321, "epoch": 3013} {"train_loss": -12.880566596984863, "global_step": 506322, "epoch": 3013} {"train_loss": -12.996759414672852, "global_step": 506323, "epoch": 3013} {"train_loss": -12.571944236755371, "global_step": 506324, "epoch": 3013} {"train_loss": -12.97852611541748, "global_step": 506325, "epoch": 3013} {"train_loss": -12.753511428833008, "global_step": 506326, "epoch": 3013} {"train_loss": -12.837239265441895, "global_step": 506327, "epoch": 3013} {"train_loss": -13.014726638793945, "global_step": 506328, "epoch": 3013} {"train_loss": -12.934773445129395, "global_step": 506329, "epoch": 3013} {"train_loss": -13.118305206298828, "global_step": 506330, "epoch": 3013} {"train_loss": -12.77053165435791, "global_step": 506331, "epoch": 3013} {"train_loss": -13.029672622680664, "global_step": 506332, "epoch": 3013} {"train_loss": -12.983360290527344, "global_step": 506333, "epoch": 3013} {"train_loss": -12.95386028289795, "global_step": 506334, "epoch": 3013} {"train_loss": -12.986703872680664, "global_step": 506335, "epoch": 3013} {"train_loss": -13.080926895141602, "global_step": 506336, "epoch": 3013} {"train_loss": -13.216206550598145, "global_step": 506337, "epoch": 3013} {"train_loss": -12.871438026428223, "global_step": 506338, "epoch": 3013} {"train_loss": -12.721349716186523, "global_step": 506339, "epoch": 3013} {"train_loss": -12.737730026245117, "global_step": 506340, "epoch": 3013} {"train_loss": -12.91634750366211, "global_step": 506341, "epoch": 3013} {"train_loss": -12.92683219909668, "global_step": 506342, "epoch": 3013} {"train_loss": -12.872843742370605, "global_step": 506343, "epoch": 3013} {"train_loss": -12.55691146850586, "global_step": 506344, "epoch": 3013} {"train_loss": -11.458480834960938, "global_step": 506345, "epoch": 3013} {"train_loss": -12.439322471618652, "global_step": 506346, "epoch": 3013} {"train_loss": -13.125128746032715, "global_step": 506347, "epoch": 3013} {"train_loss": -11.834810256958008, "global_step": 506348, "epoch": 3013} {"train_loss": -12.09766960144043, "global_step": 506349, "epoch": 3013} {"train_loss": -12.181269645690918, "global_step": 506350, "epoch": 3013} {"train_loss": -12.489545260156904, "global_step": 506351, "epoch": 3013, "val_loss": 319687.125} {"train_loss": -10.770273208618164, "global_step": 506352, "epoch": 3014} {"train_loss": -11.167181015014648, "global_step": 506353, "epoch": 3014} {"train_loss": -12.277338027954102, "global_step": 506354, "epoch": 3014} {"train_loss": -10.029594421386719, "global_step": 506355, "epoch": 3014} {"train_loss": -10.574767112731934, "global_step": 506356, "epoch": 3014} {"train_loss": -8.796592712402344, "global_step": 506357, "epoch": 3014} {"train_loss": -10.392805099487305, "global_step": 506358, "epoch": 3014} {"train_loss": -9.5451078414917, "global_step": 506359, "epoch": 3014} {"train_loss": -9.864957809448242, "global_step": 506360, "epoch": 3014} {"train_loss": -9.548599243164062, "global_step": 506361, "epoch": 3014} {"train_loss": -9.806167602539062, "global_step": 506362, "epoch": 3014} {"train_loss": -9.115983963012695, "global_step": 506363, "epoch": 3014} {"train_loss": -9.052474975585938, "global_step": 506364, "epoch": 3014} {"train_loss": -10.988330841064453, "global_step": 506365, "epoch": 3014} {"train_loss": -9.697482109069824, "global_step": 506366, "epoch": 3014} {"train_loss": -9.273115158081055, "global_step": 506367, "epoch": 3014} {"train_loss": -10.268766403198242, "global_step": 506368, "epoch": 3014} {"train_loss": -10.499465942382812, "global_step": 506369, "epoch": 3014} {"train_loss": -10.754438400268555, "global_step": 506370, "epoch": 3014} {"train_loss": -11.04446792602539, "global_step": 506371, "epoch": 3014} {"train_loss": -10.697010040283203, "global_step": 506372, "epoch": 3014} {"train_loss": -11.210384368896484, "global_step": 506373, "epoch": 3014} {"train_loss": -11.317865371704102, "global_step": 506374, "epoch": 3014} {"train_loss": -10.962930679321289, "global_step": 506375, "epoch": 3014} {"train_loss": -11.094573020935059, "global_step": 506376, "epoch": 3014} {"train_loss": -11.048877716064453, "global_step": 506377, "epoch": 3014} {"train_loss": -11.848926544189453, "global_step": 506378, "epoch": 3014} {"train_loss": -11.525819778442383, "global_step": 506379, "epoch": 3014} {"train_loss": -10.52757453918457, "global_step": 506380, "epoch": 3014} {"train_loss": -11.448759078979492, "global_step": 506381, "epoch": 3014} {"train_loss": -10.311965942382812, "global_step": 506382, "epoch": 3014} {"train_loss": -11.297891616821289, "global_step": 506383, "epoch": 3014} {"train_loss": -11.25843620300293, "global_step": 506384, "epoch": 3014} {"train_loss": -11.186795234680176, "global_step": 506385, "epoch": 3014} {"train_loss": -11.344806671142578, "global_step": 506386, "epoch": 3014} {"train_loss": -11.625741958618164, "global_step": 506387, "epoch": 3014} {"train_loss": -11.494888305664062, "global_step": 506388, "epoch": 3014} {"train_loss": -12.191468238830566, "global_step": 506389, "epoch": 3014} {"train_loss": -11.890021324157715, "global_step": 506390, "epoch": 3014} {"train_loss": -11.710989952087402, "global_step": 506391, "epoch": 3014} {"train_loss": -11.90365982055664, "global_step": 506392, "epoch": 3014} {"train_loss": -11.437047958374023, "global_step": 506393, "epoch": 3014} {"train_loss": -12.408447265625, "global_step": 506394, "epoch": 3014} {"train_loss": -11.75961971282959, "global_step": 506395, "epoch": 3014} {"train_loss": -12.136409759521484, "global_step": 506396, "epoch": 3014} {"train_loss": -11.585660934448242, "global_step": 506397, "epoch": 3014} {"train_loss": -11.267294883728027, "global_step": 506398, "epoch": 3014} {"train_loss": -12.420820236206055, "global_step": 506399, "epoch": 3014} {"train_loss": -11.846510887145996, "global_step": 506400, "epoch": 3014} {"train_loss": -12.14041519165039, "global_step": 506401, "epoch": 3014} {"train_loss": -11.813321113586426, "global_step": 506402, "epoch": 3014} {"train_loss": -10.964691162109375, "global_step": 506403, "epoch": 3014} {"train_loss": -12.332643508911133, "global_step": 506404, "epoch": 3014} {"train_loss": -11.614534378051758, "global_step": 506405, "epoch": 3014} {"train_loss": -12.105500221252441, "global_step": 506406, "epoch": 3014} {"train_loss": -11.87188720703125, "global_step": 506407, "epoch": 3014} {"train_loss": -11.864070892333984, "global_step": 506408, "epoch": 3014} {"train_loss": -12.022518157958984, "global_step": 506409, "epoch": 3014} {"train_loss": -12.16670036315918, "global_step": 506410, "epoch": 3014} {"train_loss": -11.679723739624023, "global_step": 506411, "epoch": 3014} {"train_loss": -12.416794776916504, "global_step": 506412, "epoch": 3014} {"train_loss": -12.250410079956055, "global_step": 506413, "epoch": 3014} {"train_loss": -12.154288291931152, "global_step": 506414, "epoch": 3014} {"train_loss": -12.270109176635742, "global_step": 506415, "epoch": 3014} {"train_loss": -11.883560180664062, "global_step": 506416, "epoch": 3014} {"train_loss": -11.927644729614258, "global_step": 506417, "epoch": 3014} {"train_loss": -12.25121021270752, "global_step": 506418, "epoch": 3014} {"train_loss": -12.198957443237305, "global_step": 506419, "epoch": 3014} {"train_loss": -12.588626861572266, "global_step": 506420, "epoch": 3014} {"train_loss": -12.435215950012207, "global_step": 506421, "epoch": 3014} {"train_loss": -12.507567405700684, "global_step": 506422, "epoch": 3014} {"train_loss": -12.384992599487305, "global_step": 506423, "epoch": 3014} {"train_loss": -12.619819641113281, "global_step": 506424, "epoch": 3014} {"train_loss": -12.626583099365234, "global_step": 506425, "epoch": 3014} {"train_loss": -12.431303024291992, "global_step": 506426, "epoch": 3014} {"train_loss": -12.401009559631348, "global_step": 506427, "epoch": 3014} {"train_loss": -12.521451950073242, "global_step": 506428, "epoch": 3014} {"train_loss": -12.464380264282227, "global_step": 506429, "epoch": 3014} {"train_loss": -12.465668678283691, "global_step": 506430, "epoch": 3014} {"train_loss": -12.467174530029297, "global_step": 506431, "epoch": 3014} {"train_loss": -12.417850494384766, "global_step": 506432, "epoch": 3014} {"train_loss": -12.354666709899902, "global_step": 506433, "epoch": 3014} {"train_loss": -12.512500762939453, "global_step": 506434, "epoch": 3014} {"train_loss": -12.571385383605957, "global_step": 506435, "epoch": 3014} {"train_loss": -12.467509269714355, "global_step": 506436, "epoch": 3014} {"train_loss": -12.618816375732422, "global_step": 506437, "epoch": 3014} {"train_loss": -12.619324684143066, "global_step": 506438, "epoch": 3014} {"train_loss": -12.684340476989746, "global_step": 506439, "epoch": 3014} {"train_loss": -12.339080810546875, "global_step": 506440, "epoch": 3014} {"train_loss": -12.232410430908203, "global_step": 506441, "epoch": 3014} {"train_loss": -12.209797859191895, "global_step": 506442, "epoch": 3014} {"train_loss": -12.269390106201172, "global_step": 506443, "epoch": 3014} {"train_loss": -12.433473587036133, "global_step": 506444, "epoch": 3014} {"train_loss": -12.633770942687988, "global_step": 506445, "epoch": 3014} {"train_loss": -12.407013893127441, "global_step": 506446, "epoch": 3014} {"train_loss": -11.990123748779297, "global_step": 506447, "epoch": 3014} {"train_loss": -12.296260833740234, "global_step": 506448, "epoch": 3014} {"train_loss": -12.277641296386719, "global_step": 506449, "epoch": 3014} {"train_loss": -11.617025375366211, "global_step": 506450, "epoch": 3014} {"train_loss": -12.390565872192383, "global_step": 506451, "epoch": 3014} {"train_loss": -12.37601089477539, "global_step": 506452, "epoch": 3014} {"train_loss": -11.876714706420898, "global_step": 506453, "epoch": 3014} {"train_loss": -12.724546432495117, "global_step": 506454, "epoch": 3014} {"train_loss": -12.208154678344727, "global_step": 506455, "epoch": 3014} {"train_loss": -12.323731422424316, "global_step": 506456, "epoch": 3014} {"train_loss": -12.421037673950195, "global_step": 506457, "epoch": 3014} {"train_loss": -11.773406982421875, "global_step": 506458, "epoch": 3014} {"train_loss": -12.236746788024902, "global_step": 506459, "epoch": 3014} {"train_loss": -11.847151756286621, "global_step": 506460, "epoch": 3014} {"train_loss": -11.501648902893066, "global_step": 506461, "epoch": 3014} {"train_loss": -12.533407211303711, "global_step": 506462, "epoch": 3014} {"train_loss": -11.914012908935547, "global_step": 506463, "epoch": 3014} {"train_loss": -12.568124771118164, "global_step": 506464, "epoch": 3014} {"train_loss": -12.28475570678711, "global_step": 506465, "epoch": 3014} {"train_loss": -12.072519302368164, "global_step": 506466, "epoch": 3014} {"train_loss": -12.320666313171387, "global_step": 506467, "epoch": 3014} {"train_loss": -12.404035568237305, "global_step": 506468, "epoch": 3014} {"train_loss": -11.88797378540039, "global_step": 506469, "epoch": 3014} {"train_loss": -12.679244995117188, "global_step": 506470, "epoch": 3014} {"train_loss": -12.671989440917969, "global_step": 506471, "epoch": 3014} {"train_loss": -12.418472290039062, "global_step": 506472, "epoch": 3014} {"train_loss": -12.652780532836914, "global_step": 506473, "epoch": 3014} {"train_loss": -12.327912330627441, "global_step": 506474, "epoch": 3014} {"train_loss": -11.974428176879883, "global_step": 506475, "epoch": 3014} {"train_loss": -12.468968391418457, "global_step": 506476, "epoch": 3014} {"train_loss": -11.94288444519043, "global_step": 506477, "epoch": 3014} {"train_loss": -12.077129364013672, "global_step": 506478, "epoch": 3014} {"train_loss": -12.624921798706055, "global_step": 506479, "epoch": 3014} {"train_loss": -12.262407302856445, "global_step": 506480, "epoch": 3014} {"train_loss": -12.41930866241455, "global_step": 506481, "epoch": 3014} {"train_loss": -12.43686580657959, "global_step": 506482, "epoch": 3014} {"train_loss": -11.967500686645508, "global_step": 506483, "epoch": 3014} {"train_loss": -11.708503723144531, "global_step": 506484, "epoch": 3014} {"train_loss": -12.243048667907715, "global_step": 506485, "epoch": 3014} {"train_loss": -12.064388275146484, "global_step": 506486, "epoch": 3014} {"train_loss": -11.573001861572266, "global_step": 506487, "epoch": 3014} {"train_loss": -12.469359397888184, "global_step": 506488, "epoch": 3014} {"train_loss": -11.559871673583984, "global_step": 506489, "epoch": 3014} {"train_loss": -12.145570755004883, "global_step": 506490, "epoch": 3014} {"train_loss": -11.781403541564941, "global_step": 506491, "epoch": 3014} {"train_loss": -12.19782829284668, "global_step": 506492, "epoch": 3014} {"train_loss": -12.405672073364258, "global_step": 506493, "epoch": 3014} {"train_loss": -11.745753288269043, "global_step": 506494, "epoch": 3014} {"train_loss": -12.674864768981934, "global_step": 506495, "epoch": 3014} {"train_loss": -11.394874572753906, "global_step": 506496, "epoch": 3014} {"train_loss": -12.29018783569336, "global_step": 506497, "epoch": 3014} {"train_loss": -11.995201110839844, "global_step": 506498, "epoch": 3014} {"train_loss": -12.162912368774414, "global_step": 506499, "epoch": 3014} {"train_loss": -12.434715270996094, "global_step": 506500, "epoch": 3014} {"train_loss": -12.414780616760254, "global_step": 506501, "epoch": 3014} {"train_loss": -12.35801887512207, "global_step": 506502, "epoch": 3014} {"train_loss": -12.723244667053223, "global_step": 506503, "epoch": 3014} {"train_loss": -12.75285530090332, "global_step": 506504, "epoch": 3014} {"train_loss": -12.78197956085205, "global_step": 506505, "epoch": 3014} {"train_loss": -12.766518592834473, "global_step": 506506, "epoch": 3014} {"train_loss": -12.612815856933594, "global_step": 506507, "epoch": 3014} {"train_loss": -12.704617500305176, "global_step": 506508, "epoch": 3014} {"train_loss": -12.861785888671875, "global_step": 506509, "epoch": 3014} {"train_loss": -12.709640502929688, "global_step": 506510, "epoch": 3014} {"train_loss": -12.877687454223633, "global_step": 506511, "epoch": 3014} {"train_loss": -12.752100944519043, "global_step": 506512, "epoch": 3014} {"train_loss": -12.77560043334961, "global_step": 506513, "epoch": 3014} {"train_loss": -12.721595764160156, "global_step": 506514, "epoch": 3014} {"train_loss": -12.580483436584473, "global_step": 506515, "epoch": 3014} {"train_loss": -12.974397659301758, "global_step": 506516, "epoch": 3014} {"train_loss": -12.748865127563477, "global_step": 506517, "epoch": 3014} {"train_loss": -12.985925674438477, "global_step": 506518, "epoch": 3014} {"train_loss": -11.906601866086325, "global_step": 506519, "epoch": 3014, "val_loss": 315424.90625} {"train_loss": -12.69322395324707, "global_step": 506520, "epoch": 3015} {"train_loss": -12.898097038269043, "global_step": 506521, "epoch": 3015} {"train_loss": -12.903635025024414, "global_step": 506522, "epoch": 3015} {"train_loss": -12.655455589294434, "global_step": 506523, "epoch": 3015} {"train_loss": -12.568414688110352, "global_step": 506524, "epoch": 3015} {"train_loss": -12.821878433227539, "global_step": 506525, "epoch": 3015} {"train_loss": -12.668834686279297, "global_step": 506526, "epoch": 3015} {"train_loss": -12.566703796386719, "global_step": 506527, "epoch": 3015} {"train_loss": -12.976629257202148, "global_step": 506528, "epoch": 3015} {"train_loss": -12.669673919677734, "global_step": 506529, "epoch": 3015} {"train_loss": -12.61538314819336, "global_step": 506530, "epoch": 3015} {"train_loss": -12.713400840759277, "global_step": 506531, "epoch": 3015} {"train_loss": -12.898565292358398, "global_step": 506532, "epoch": 3015} {"train_loss": -12.91411304473877, "global_step": 506533, "epoch": 3015} {"train_loss": -12.76452350616455, "global_step": 506534, "epoch": 3015} {"train_loss": -12.893777847290039, "global_step": 506535, "epoch": 3015} {"train_loss": -12.99133014678955, "global_step": 506536, "epoch": 3015} {"train_loss": -12.82542610168457, "global_step": 506537, "epoch": 3015} {"train_loss": -12.962148666381836, "global_step": 506538, "epoch": 3015} {"train_loss": -12.887163162231445, "global_step": 506539, "epoch": 3015} {"train_loss": -12.805438041687012, "global_step": 506540, "epoch": 3015} {"train_loss": -12.995108604431152, "global_step": 506541, "epoch": 3015} {"train_loss": -12.793331146240234, "global_step": 506542, "epoch": 3015} {"train_loss": -12.627803802490234, "global_step": 506543, "epoch": 3015} {"train_loss": -12.790849685668945, "global_step": 506544, "epoch": 3015} {"train_loss": -12.539644241333008, "global_step": 506545, "epoch": 3015} {"train_loss": -12.6393461227417, "global_step": 506546, "epoch": 3015} {"train_loss": -12.635732650756836, "global_step": 506547, "epoch": 3015} {"train_loss": -12.369546890258789, "global_step": 506548, "epoch": 3015} {"train_loss": -11.213520050048828, "global_step": 506549, "epoch": 3015} {"train_loss": -11.969625473022461, "global_step": 506550, "epoch": 3015} {"train_loss": -12.595297813415527, "global_step": 506551, "epoch": 3015} {"train_loss": -12.06623649597168, "global_step": 506552, "epoch": 3015} {"train_loss": -12.901784896850586, "global_step": 506553, "epoch": 3015} {"train_loss": -12.46485710144043, "global_step": 506554, "epoch": 3015} {"train_loss": -12.307741165161133, "global_step": 506555, "epoch": 3015} {"train_loss": -11.776193618774414, "global_step": 506556, "epoch": 3015} {"train_loss": -11.771615982055664, "global_step": 506557, "epoch": 3015} {"train_loss": -11.437387466430664, "global_step": 506558, "epoch": 3015} {"train_loss": -11.868247985839844, "global_step": 506559, "epoch": 3015} {"train_loss": -12.490221977233887, "global_step": 506560, "epoch": 3015} {"train_loss": -11.575057029724121, "global_step": 506561, "epoch": 3015} {"train_loss": -11.341179847717285, "global_step": 506562, "epoch": 3015} {"train_loss": -12.870975494384766, "global_step": 506563, "epoch": 3015} {"train_loss": -11.429046630859375, "global_step": 506564, "epoch": 3015} {"train_loss": -11.20533561706543, "global_step": 506565, "epoch": 3015} {"train_loss": -12.218297004699707, "global_step": 506566, "epoch": 3015} {"train_loss": -9.766280174255371, "global_step": 506567, "epoch": 3015} {"train_loss": -10.95402717590332, "global_step": 506568, "epoch": 3015} {"train_loss": -10.01718521118164, "global_step": 506569, "epoch": 3015} {"train_loss": -10.349172592163086, "global_step": 506570, "epoch": 3015} {"train_loss": -9.592728614807129, "global_step": 506571, "epoch": 3015} {"train_loss": -9.547842025756836, "global_step": 506572, "epoch": 3015} {"train_loss": -10.328829765319824, "global_step": 506573, "epoch": 3015} {"train_loss": -9.951956748962402, "global_step": 506574, "epoch": 3015} {"train_loss": -9.978694915771484, "global_step": 506575, "epoch": 3015} {"train_loss": -10.106009483337402, "global_step": 506576, "epoch": 3015} {"train_loss": -11.059917449951172, "global_step": 506577, "epoch": 3015} {"train_loss": -11.886367797851562, "global_step": 506578, "epoch": 3015} {"train_loss": -11.160736083984375, "global_step": 506579, "epoch": 3015} {"train_loss": -11.967334747314453, "global_step": 506580, "epoch": 3015} {"train_loss": -11.4227294921875, "global_step": 506581, "epoch": 3015} {"train_loss": -11.358749389648438, "global_step": 506582, "epoch": 3015} {"train_loss": -12.338983535766602, "global_step": 506583, "epoch": 3015} {"train_loss": -11.394594192504883, "global_step": 506584, "epoch": 3015} {"train_loss": -12.311004638671875, "global_step": 506585, "epoch": 3015} {"train_loss": -11.51709270477295, "global_step": 506586, "epoch": 3015} {"train_loss": -12.04143238067627, "global_step": 506587, "epoch": 3015} {"train_loss": -11.347448348999023, "global_step": 506588, "epoch": 3015} {"train_loss": -12.304082870483398, "global_step": 506589, "epoch": 3015} {"train_loss": -11.959138870239258, "global_step": 506590, "epoch": 3015} {"train_loss": -12.528657913208008, "global_step": 506591, "epoch": 3015} {"train_loss": -12.370917320251465, "global_step": 506592, "epoch": 3015} {"train_loss": -11.994078636169434, "global_step": 506593, "epoch": 3015} {"train_loss": -12.576669692993164, "global_step": 506594, "epoch": 3015} {"train_loss": -11.70971965789795, "global_step": 506595, "epoch": 3015} {"train_loss": -12.521933555603027, "global_step": 506596, "epoch": 3015} {"train_loss": -11.762210845947266, "global_step": 506597, "epoch": 3015} {"train_loss": -12.469808578491211, "global_step": 506598, "epoch": 3015} {"train_loss": -12.062126159667969, "global_step": 506599, "epoch": 3015} {"train_loss": -12.607866287231445, "global_step": 506600, "epoch": 3015} {"train_loss": -12.014222145080566, "global_step": 506601, "epoch": 3015} {"train_loss": -12.347593307495117, "global_step": 506602, "epoch": 3015} {"train_loss": -12.109979629516602, "global_step": 506603, "epoch": 3015} {"train_loss": -12.450098991394043, "global_step": 506604, "epoch": 3015} {"train_loss": -12.510019302368164, "global_step": 506605, "epoch": 3015} {"train_loss": -12.653142929077148, "global_step": 506606, "epoch": 3015} {"train_loss": -12.846814155578613, "global_step": 506607, "epoch": 3015} {"train_loss": -12.618902206420898, "global_step": 506608, "epoch": 3015} {"train_loss": -12.3138427734375, "global_step": 506609, "epoch": 3015} {"train_loss": -12.683897018432617, "global_step": 506610, "epoch": 3015} {"train_loss": -12.451251029968262, "global_step": 506611, "epoch": 3015} {"train_loss": -12.776187896728516, "global_step": 506612, "epoch": 3015} {"train_loss": -12.195225715637207, "global_step": 506613, "epoch": 3015} {"train_loss": -12.625490188598633, "global_step": 506614, "epoch": 3015} {"train_loss": -12.722832679748535, "global_step": 506615, "epoch": 3015} {"train_loss": -12.502038955688477, "global_step": 506616, "epoch": 3015} {"train_loss": -12.71200180053711, "global_step": 506617, "epoch": 3015} {"train_loss": -12.366429328918457, "global_step": 506618, "epoch": 3015} {"train_loss": -12.757028579711914, "global_step": 506619, "epoch": 3015} {"train_loss": -12.510619163513184, "global_step": 506620, "epoch": 3015} {"train_loss": -12.637815475463867, "global_step": 506621, "epoch": 3015} {"train_loss": -12.61087703704834, "global_step": 506622, "epoch": 3015} {"train_loss": -12.52729606628418, "global_step": 506623, "epoch": 3015} {"train_loss": -12.595724105834961, "global_step": 506624, "epoch": 3015} {"train_loss": -12.592277526855469, "global_step": 506625, "epoch": 3015} {"train_loss": -12.69479751586914, "global_step": 506626, "epoch": 3015} {"train_loss": -12.649836540222168, "global_step": 506627, "epoch": 3015} {"train_loss": -12.786066055297852, "global_step": 506628, "epoch": 3015} {"train_loss": -12.489517211914062, "global_step": 506629, "epoch": 3015} {"train_loss": -12.404199600219727, "global_step": 506630, "epoch": 3015} {"train_loss": -12.501175880432129, "global_step": 506631, "epoch": 3015} {"train_loss": -12.401189804077148, "global_step": 506632, "epoch": 3015} {"train_loss": -12.165596008300781, "global_step": 506633, "epoch": 3015} {"train_loss": -12.354130744934082, "global_step": 506634, "epoch": 3015} {"train_loss": -12.773150444030762, "global_step": 506635, "epoch": 3015} {"train_loss": -12.742437362670898, "global_step": 506636, "epoch": 3015} {"train_loss": -12.29493522644043, "global_step": 506637, "epoch": 3015} {"train_loss": -12.376581192016602, "global_step": 506638, "epoch": 3015} {"train_loss": -12.850290298461914, "global_step": 506639, "epoch": 3015} {"train_loss": -12.04190444946289, "global_step": 506640, "epoch": 3015} {"train_loss": -12.296483993530273, "global_step": 506641, "epoch": 3015} {"train_loss": -12.431120872497559, "global_step": 506642, "epoch": 3015} {"train_loss": -12.249066352844238, "global_step": 506643, "epoch": 3015} {"train_loss": -11.714241027832031, "global_step": 506644, "epoch": 3015} {"train_loss": -12.645480155944824, "global_step": 506645, "epoch": 3015} {"train_loss": -12.014169692993164, "global_step": 506646, "epoch": 3015} {"train_loss": -12.443537712097168, "global_step": 506647, "epoch": 3015} {"train_loss": -12.48111343383789, "global_step": 506648, "epoch": 3015} {"train_loss": -11.993179321289062, "global_step": 506649, "epoch": 3015} {"train_loss": -11.734533309936523, "global_step": 506650, "epoch": 3015} {"train_loss": -12.578201293945312, "global_step": 506651, "epoch": 3015} {"train_loss": -12.532190322875977, "global_step": 506652, "epoch": 3015} {"train_loss": -11.9143705368042, "global_step": 506653, "epoch": 3015} {"train_loss": -11.461599349975586, "global_step": 506654, "epoch": 3015} {"train_loss": -12.403079986572266, "global_step": 506655, "epoch": 3015} {"train_loss": -11.264876365661621, "global_step": 506656, "epoch": 3015} {"train_loss": -12.566736221313477, "global_step": 506657, "epoch": 3015} {"train_loss": -11.23160171508789, "global_step": 506658, "epoch": 3015} {"train_loss": -11.38606071472168, "global_step": 506659, "epoch": 3015} {"train_loss": -12.639328002929688, "global_step": 506660, "epoch": 3015} {"train_loss": -12.534370422363281, "global_step": 506661, "epoch": 3015} {"train_loss": -12.199023246765137, "global_step": 506662, "epoch": 3015} {"train_loss": -12.382530212402344, "global_step": 506663, "epoch": 3015} {"train_loss": -11.328645706176758, "global_step": 506664, "epoch": 3015} {"train_loss": -12.017845153808594, "global_step": 506665, "epoch": 3015} {"train_loss": -11.640101432800293, "global_step": 506666, "epoch": 3015} {"train_loss": -11.23491096496582, "global_step": 506667, "epoch": 3015} {"train_loss": -12.329764366149902, "global_step": 506668, "epoch": 3015} {"train_loss": -11.862987518310547, "global_step": 506669, "epoch": 3015} {"train_loss": -11.69019889831543, "global_step": 506670, "epoch": 3015} {"train_loss": -11.88575553894043, "global_step": 506671, "epoch": 3015} {"train_loss": -12.517681121826172, "global_step": 506672, "epoch": 3015} {"train_loss": -11.809091567993164, "global_step": 506673, "epoch": 3015} {"train_loss": -11.889976501464844, "global_step": 506674, "epoch": 3015} {"train_loss": -11.896463394165039, "global_step": 506675, "epoch": 3015} {"train_loss": -12.042176246643066, "global_step": 506676, "epoch": 3015} {"train_loss": -12.030450820922852, "global_step": 506677, "epoch": 3015} {"train_loss": -11.890421867370605, "global_step": 506678, "epoch": 3015} {"train_loss": -12.05855941772461, "global_step": 506679, "epoch": 3015} {"train_loss": -11.430632591247559, "global_step": 506680, "epoch": 3015} {"train_loss": -11.970115661621094, "global_step": 506681, "epoch": 3015} {"train_loss": -11.97857666015625, "global_step": 506682, "epoch": 3015} {"train_loss": -12.301217079162598, "global_step": 506683, "epoch": 3015} {"train_loss": -11.920801162719727, "global_step": 506684, "epoch": 3015} {"train_loss": -11.979190826416016, "global_step": 506685, "epoch": 3015} {"train_loss": -11.716251373291016, "global_step": 506686, "epoch": 3015} {"train_loss": -12.131006575766063, "global_step": 506687, "epoch": 3015, "val_loss": 316695.875, "train_action_mse_error": 1.419700264930725} {"train_loss": -11.868989944458008, "global_step": 506688, "epoch": 3016} {"train_loss": -11.613788604736328, "global_step": 506689, "epoch": 3016} {"train_loss": -11.843620300292969, "global_step": 506690, "epoch": 3016} {"train_loss": -11.044620513916016, "global_step": 506691, "epoch": 3016} {"train_loss": -12.319202423095703, "global_step": 506692, "epoch": 3016} {"train_loss": -11.69649600982666, "global_step": 506693, "epoch": 3016} {"train_loss": -11.309160232543945, "global_step": 506694, "epoch": 3016} {"train_loss": -11.748717308044434, "global_step": 506695, "epoch": 3016} {"train_loss": -11.439582824707031, "global_step": 506696, "epoch": 3016} {"train_loss": -12.061963081359863, "global_step": 506697, "epoch": 3016} {"train_loss": -11.021965026855469, "global_step": 506698, "epoch": 3016} {"train_loss": -11.92051887512207, "global_step": 506699, "epoch": 3016} {"train_loss": -11.764056205749512, "global_step": 506700, "epoch": 3016} {"train_loss": -11.678180694580078, "global_step": 506701, "epoch": 3016} {"train_loss": -11.748886108398438, "global_step": 506702, "epoch": 3016} {"train_loss": -11.828088760375977, "global_step": 506703, "epoch": 3016} {"train_loss": -11.957710266113281, "global_step": 506704, "epoch": 3016} {"train_loss": -11.604887962341309, "global_step": 506705, "epoch": 3016} {"train_loss": -12.256399154663086, "global_step": 506706, "epoch": 3016} {"train_loss": -12.387560844421387, "global_step": 506707, "epoch": 3016} {"train_loss": -12.220244407653809, "global_step": 506708, "epoch": 3016} {"train_loss": -12.57443618774414, "global_step": 506709, "epoch": 3016} {"train_loss": -11.898452758789062, "global_step": 506710, "epoch": 3016} {"train_loss": -12.721420288085938, "global_step": 506711, "epoch": 3016} {"train_loss": -12.153585433959961, "global_step": 506712, "epoch": 3016} {"train_loss": -12.695108413696289, "global_step": 506713, "epoch": 3016} {"train_loss": -12.268025398254395, "global_step": 506714, "epoch": 3016} {"train_loss": -12.50230598449707, "global_step": 506715, "epoch": 3016} {"train_loss": -12.001035690307617, "global_step": 506716, "epoch": 3016} {"train_loss": -12.408397674560547, "global_step": 506717, "epoch": 3016} {"train_loss": -12.626533508300781, "global_step": 506718, "epoch": 3016} {"train_loss": -12.171528816223145, "global_step": 506719, "epoch": 3016} {"train_loss": -12.659748077392578, "global_step": 506720, "epoch": 3016} {"train_loss": -12.380605697631836, "global_step": 506721, "epoch": 3016} {"train_loss": -12.313521385192871, "global_step": 506722, "epoch": 3016} {"train_loss": -12.4930419921875, "global_step": 506723, "epoch": 3016} {"train_loss": -12.550386428833008, "global_step": 506724, "epoch": 3016} {"train_loss": -12.718997955322266, "global_step": 506725, "epoch": 3016} {"train_loss": -12.861120223999023, "global_step": 506726, "epoch": 3016} {"train_loss": -12.75672435760498, "global_step": 506727, "epoch": 3016} {"train_loss": -12.709528923034668, "global_step": 506728, "epoch": 3016} {"train_loss": -12.795991897583008, "global_step": 506729, "epoch": 3016} {"train_loss": -12.606698989868164, "global_step": 506730, "epoch": 3016} {"train_loss": -12.613052368164062, "global_step": 506731, "epoch": 3016} {"train_loss": -12.689107894897461, "global_step": 506732, "epoch": 3016} {"train_loss": -12.770057678222656, "global_step": 506733, "epoch": 3016} {"train_loss": -12.835508346557617, "global_step": 506734, "epoch": 3016} {"train_loss": -12.797208786010742, "global_step": 506735, "epoch": 3016} {"train_loss": -12.718059539794922, "global_step": 506736, "epoch": 3016} {"train_loss": -12.590572357177734, "global_step": 506737, "epoch": 3016} {"train_loss": -12.820752143859863, "global_step": 506738, "epoch": 3016} {"train_loss": -12.516820907592773, "global_step": 506739, "epoch": 3016} {"train_loss": -12.782970428466797, "global_step": 506740, "epoch": 3016} {"train_loss": -12.781847953796387, "global_step": 506741, "epoch": 3016} {"train_loss": -12.880940437316895, "global_step": 506742, "epoch": 3016} {"train_loss": -12.894224166870117, "global_step": 506743, "epoch": 3016} {"train_loss": -12.945178985595703, "global_step": 506744, "epoch": 3016} {"train_loss": -12.659281730651855, "global_step": 506745, "epoch": 3016} {"train_loss": -12.930411338806152, "global_step": 506746, "epoch": 3016} {"train_loss": -13.028507232666016, "global_step": 506747, "epoch": 3016} {"train_loss": -12.837690353393555, "global_step": 506748, "epoch": 3016} {"train_loss": -12.77585506439209, "global_step": 506749, "epoch": 3016} {"train_loss": -12.530692100524902, "global_step": 506750, "epoch": 3016} {"train_loss": -12.803655624389648, "global_step": 506751, "epoch": 3016} {"train_loss": -12.786988258361816, "global_step": 506752, "epoch": 3016} {"train_loss": -12.55537223815918, "global_step": 506753, "epoch": 3016} {"train_loss": -12.476911544799805, "global_step": 506754, "epoch": 3016} {"train_loss": -12.888290405273438, "global_step": 506755, "epoch": 3016} {"train_loss": -12.659603118896484, "global_step": 506756, "epoch": 3016} {"train_loss": -12.73227310180664, "global_step": 506757, "epoch": 3016} {"train_loss": -12.382834434509277, "global_step": 506758, "epoch": 3016} {"train_loss": -12.633983612060547, "global_step": 506759, "epoch": 3016} {"train_loss": -12.748529434204102, "global_step": 506760, "epoch": 3016} {"train_loss": -12.34330940246582, "global_step": 506761, "epoch": 3016} {"train_loss": -12.60754108428955, "global_step": 506762, "epoch": 3016} {"train_loss": -12.780531883239746, "global_step": 506763, "epoch": 3016} {"train_loss": -12.526318550109863, "global_step": 506764, "epoch": 3016} {"train_loss": -12.642977714538574, "global_step": 506765, "epoch": 3016} {"train_loss": -12.827132225036621, "global_step": 506766, "epoch": 3016} {"train_loss": -11.746366500854492, "global_step": 506767, "epoch": 3016} {"train_loss": -12.64764404296875, "global_step": 506768, "epoch": 3016} {"train_loss": -12.474482536315918, "global_step": 506769, "epoch": 3016} {"train_loss": -11.664029121398926, "global_step": 506770, "epoch": 3016} {"train_loss": -12.00145149230957, "global_step": 506771, "epoch": 3016} {"train_loss": -11.840229034423828, "global_step": 506772, "epoch": 3016} {"train_loss": -10.971200942993164, "global_step": 506773, "epoch": 3016} {"train_loss": -11.550111770629883, "global_step": 506774, "epoch": 3016} {"train_loss": -9.357030868530273, "global_step": 506775, "epoch": 3016} {"train_loss": -9.893607139587402, "global_step": 506776, "epoch": 3016} {"train_loss": -10.90068531036377, "global_step": 506777, "epoch": 3016} {"train_loss": -9.646327018737793, "global_step": 506778, "epoch": 3016} {"train_loss": -9.743293762207031, "global_step": 506779, "epoch": 3016} {"train_loss": -9.183692932128906, "global_step": 506780, "epoch": 3016} {"train_loss": -9.323343276977539, "global_step": 506781, "epoch": 3016} {"train_loss": -8.769851684570312, "global_step": 506782, "epoch": 3016} {"train_loss": -9.979339599609375, "global_step": 506783, "epoch": 3016} {"train_loss": -9.71102523803711, "global_step": 506784, "epoch": 3016} {"train_loss": -8.917030334472656, "global_step": 506785, "epoch": 3016} {"train_loss": -9.77570915222168, "global_step": 506786, "epoch": 3016} {"train_loss": -9.510096549987793, "global_step": 506787, "epoch": 3016} {"train_loss": -9.355937957763672, "global_step": 506788, "epoch": 3016} {"train_loss": -10.544255256652832, "global_step": 506789, "epoch": 3016} {"train_loss": -10.904304504394531, "global_step": 506790, "epoch": 3016} {"train_loss": -10.37713623046875, "global_step": 506791, "epoch": 3016} {"train_loss": -10.444238662719727, "global_step": 506792, "epoch": 3016} {"train_loss": -10.844850540161133, "global_step": 506793, "epoch": 3016} {"train_loss": -10.727590560913086, "global_step": 506794, "epoch": 3016} {"train_loss": -10.764993667602539, "global_step": 506795, "epoch": 3016} {"train_loss": -11.865482330322266, "global_step": 506796, "epoch": 3016} {"train_loss": -11.515225410461426, "global_step": 506797, "epoch": 3016} {"train_loss": -11.92334270477295, "global_step": 506798, "epoch": 3016} {"train_loss": -11.555669784545898, "global_step": 506799, "epoch": 3016} {"train_loss": -12.323888778686523, "global_step": 506800, "epoch": 3016} {"train_loss": -12.103778839111328, "global_step": 506801, "epoch": 3016} {"train_loss": -11.95878791809082, "global_step": 506802, "epoch": 3016} {"train_loss": -12.36520767211914, "global_step": 506803, "epoch": 3016} {"train_loss": -11.76645278930664, "global_step": 506804, "epoch": 3016} {"train_loss": -12.236133575439453, "global_step": 506805, "epoch": 3016} {"train_loss": -11.937456130981445, "global_step": 506806, "epoch": 3016} {"train_loss": -12.31200885772705, "global_step": 506807, "epoch": 3016} {"train_loss": -12.106861114501953, "global_step": 506808, "epoch": 3016} {"train_loss": -12.16999626159668, "global_step": 506809, "epoch": 3016} {"train_loss": -12.511231422424316, "global_step": 506810, "epoch": 3016} {"train_loss": -11.892400741577148, "global_step": 506811, "epoch": 3016} {"train_loss": -11.606644630432129, "global_step": 506812, "epoch": 3016} {"train_loss": -12.553407669067383, "global_step": 506813, "epoch": 3016} {"train_loss": -12.313507080078125, "global_step": 506814, "epoch": 3016} {"train_loss": -12.22398567199707, "global_step": 506815, "epoch": 3016} {"train_loss": -12.52283763885498, "global_step": 506816, "epoch": 3016} {"train_loss": -12.557207107543945, "global_step": 506817, "epoch": 3016} {"train_loss": -12.5111083984375, "global_step": 506818, "epoch": 3016} {"train_loss": -12.138781547546387, "global_step": 506819, "epoch": 3016} {"train_loss": -12.334463119506836, "global_step": 506820, "epoch": 3016} {"train_loss": -12.316008567810059, "global_step": 506821, "epoch": 3016} {"train_loss": -12.315181732177734, "global_step": 506822, "epoch": 3016} {"train_loss": -12.2878999710083, "global_step": 506823, "epoch": 3016} {"train_loss": -12.732673645019531, "global_step": 506824, "epoch": 3016} {"train_loss": -12.237491607666016, "global_step": 506825, "epoch": 3016} {"train_loss": -12.74505615234375, "global_step": 506826, "epoch": 3016} {"train_loss": -12.820887565612793, "global_step": 506827, "epoch": 3016} {"train_loss": -12.439428329467773, "global_step": 506828, "epoch": 3016} {"train_loss": -12.74145221710205, "global_step": 506829, "epoch": 3016} {"train_loss": -12.629615783691406, "global_step": 506830, "epoch": 3016} {"train_loss": -12.656524658203125, "global_step": 506831, "epoch": 3016} {"train_loss": -12.480825424194336, "global_step": 506832, "epoch": 3016} {"train_loss": -12.448492050170898, "global_step": 506833, "epoch": 3016} {"train_loss": -12.395709991455078, "global_step": 506834, "epoch": 3016} {"train_loss": -12.708930015563965, "global_step": 506835, "epoch": 3016} {"train_loss": -12.680068969726562, "global_step": 506836, "epoch": 3016} {"train_loss": -12.62447738647461, "global_step": 506837, "epoch": 3016} {"train_loss": -12.360307693481445, "global_step": 506838, "epoch": 3016} {"train_loss": -12.704644203186035, "global_step": 506839, "epoch": 3016} {"train_loss": -12.626556396484375, "global_step": 506840, "epoch": 3016} {"train_loss": -12.666131973266602, "global_step": 506841, "epoch": 3016} {"train_loss": -12.587750434875488, "global_step": 506842, "epoch": 3016} {"train_loss": -12.853179931640625, "global_step": 506843, "epoch": 3016} {"train_loss": -12.801663398742676, "global_step": 506844, "epoch": 3016} {"train_loss": -12.500150680541992, "global_step": 506845, "epoch": 3016} {"train_loss": -12.64228630065918, "global_step": 506846, "epoch": 3016} {"train_loss": -12.500301361083984, "global_step": 506847, "epoch": 3016} {"train_loss": -12.534852027893066, "global_step": 506848, "epoch": 3016} {"train_loss": -12.421570777893066, "global_step": 506849, "epoch": 3016} {"train_loss": -12.759692192077637, "global_step": 506850, "epoch": 3016} {"train_loss": -12.632001876831055, "global_step": 506851, "epoch": 3016} {"train_loss": -12.590630531311035, "global_step": 506852, "epoch": 3016} {"train_loss": -12.581396102905273, "global_step": 506853, "epoch": 3016} {"train_loss": -12.424610137939453, "global_step": 506854, "epoch": 3016} {"train_loss": -12.06572014944894, "global_step": 506855, "epoch": 3016, "val_loss": 320072.375} {"train_loss": -12.127429962158203, "global_step": 506856, "epoch": 3017} {"train_loss": -12.7294921875, "global_step": 506857, "epoch": 3017} {"train_loss": -12.471182823181152, "global_step": 506858, "epoch": 3017} {"train_loss": -12.247884750366211, "global_step": 506859, "epoch": 3017} {"train_loss": -12.385936737060547, "global_step": 506860, "epoch": 3017} {"train_loss": -12.810182571411133, "global_step": 506861, "epoch": 3017} {"train_loss": -12.376836776733398, "global_step": 506862, "epoch": 3017} {"train_loss": -12.297990798950195, "global_step": 506863, "epoch": 3017} {"train_loss": -12.669364929199219, "global_step": 506864, "epoch": 3017} {"train_loss": -12.453651428222656, "global_step": 506865, "epoch": 3017} {"train_loss": -12.532251358032227, "global_step": 506866, "epoch": 3017} {"train_loss": -12.675004959106445, "global_step": 506867, "epoch": 3017} {"train_loss": -12.02514362335205, "global_step": 506868, "epoch": 3017} {"train_loss": -12.430547714233398, "global_step": 506869, "epoch": 3017} {"train_loss": -12.048917770385742, "global_step": 506870, "epoch": 3017} {"train_loss": -12.464692115783691, "global_step": 506871, "epoch": 3017} {"train_loss": -12.534418106079102, "global_step": 506872, "epoch": 3017} {"train_loss": -12.348014831542969, "global_step": 506873, "epoch": 3017} {"train_loss": -12.659661293029785, "global_step": 506874, "epoch": 3017} {"train_loss": -12.425664901733398, "global_step": 506875, "epoch": 3017} {"train_loss": -12.574644088745117, "global_step": 506876, "epoch": 3017} {"train_loss": -12.438459396362305, "global_step": 506877, "epoch": 3017} {"train_loss": -12.403552055358887, "global_step": 506878, "epoch": 3017} {"train_loss": -12.001797676086426, "global_step": 506879, "epoch": 3017} {"train_loss": -12.677943229675293, "global_step": 506880, "epoch": 3017} {"train_loss": -12.150413513183594, "global_step": 506881, "epoch": 3017} {"train_loss": -12.074970245361328, "global_step": 506882, "epoch": 3017} {"train_loss": -12.185182571411133, "global_step": 506883, "epoch": 3017} {"train_loss": -12.388063430786133, "global_step": 506884, "epoch": 3017} {"train_loss": -12.478185653686523, "global_step": 506885, "epoch": 3017} {"train_loss": -12.259119987487793, "global_step": 506886, "epoch": 3017} {"train_loss": -11.952983856201172, "global_step": 506887, "epoch": 3017} {"train_loss": -12.537467956542969, "global_step": 506888, "epoch": 3017} {"train_loss": -12.27515697479248, "global_step": 506889, "epoch": 3017} {"train_loss": -12.172906875610352, "global_step": 506890, "epoch": 3017} {"train_loss": -11.941317558288574, "global_step": 506891, "epoch": 3017} {"train_loss": -11.971933364868164, "global_step": 506892, "epoch": 3017} {"train_loss": -10.9440279006958, "global_step": 506893, "epoch": 3017} {"train_loss": -11.627079963684082, "global_step": 506894, "epoch": 3017} {"train_loss": -11.593969345092773, "global_step": 506895, "epoch": 3017} {"train_loss": -11.23804759979248, "global_step": 506896, "epoch": 3017} {"train_loss": -11.44565486907959, "global_step": 506897, "epoch": 3017} {"train_loss": -11.609992027282715, "global_step": 506898, "epoch": 3017} {"train_loss": -10.956669807434082, "global_step": 506899, "epoch": 3017} {"train_loss": -12.052419662475586, "global_step": 506900, "epoch": 3017} {"train_loss": -11.693538665771484, "global_step": 506901, "epoch": 3017} {"train_loss": -12.149282455444336, "global_step": 506902, "epoch": 3017} {"train_loss": -11.980340957641602, "global_step": 506903, "epoch": 3017} {"train_loss": -12.028812408447266, "global_step": 506904, "epoch": 3017} {"train_loss": -11.610204696655273, "global_step": 506905, "epoch": 3017} {"train_loss": -11.98918342590332, "global_step": 506906, "epoch": 3017} {"train_loss": -12.523327827453613, "global_step": 506907, "epoch": 3017} {"train_loss": -12.256511688232422, "global_step": 506908, "epoch": 3017} {"train_loss": -12.213820457458496, "global_step": 506909, "epoch": 3017} {"train_loss": -11.562837600708008, "global_step": 506910, "epoch": 3017} {"train_loss": -11.307315826416016, "global_step": 506911, "epoch": 3017} {"train_loss": -12.098257064819336, "global_step": 506912, "epoch": 3017} {"train_loss": -11.954665184020996, "global_step": 506913, "epoch": 3017} {"train_loss": -12.644803047180176, "global_step": 506914, "epoch": 3017} {"train_loss": -12.095684051513672, "global_step": 506915, "epoch": 3017} {"train_loss": -12.021852493286133, "global_step": 506916, "epoch": 3017} {"train_loss": -12.813202857971191, "global_step": 506917, "epoch": 3017} {"train_loss": -12.126607894897461, "global_step": 506918, "epoch": 3017} {"train_loss": -12.468488693237305, "global_step": 506919, "epoch": 3017} {"train_loss": -12.500330924987793, "global_step": 506920, "epoch": 3017} {"train_loss": -12.19877815246582, "global_step": 506921, "epoch": 3017} {"train_loss": -12.368803024291992, "global_step": 506922, "epoch": 3017} {"train_loss": -12.2766695022583, "global_step": 506923, "epoch": 3017} {"train_loss": -12.710182189941406, "global_step": 506924, "epoch": 3017} {"train_loss": -12.175000190734863, "global_step": 506925, "epoch": 3017} {"train_loss": -12.486729621887207, "global_step": 506926, "epoch": 3017} {"train_loss": -12.172952651977539, "global_step": 506927, "epoch": 3017} {"train_loss": -12.576011657714844, "global_step": 506928, "epoch": 3017} {"train_loss": -12.505693435668945, "global_step": 506929, "epoch": 3017} {"train_loss": -12.455026626586914, "global_step": 506930, "epoch": 3017} {"train_loss": -12.612150192260742, "global_step": 506931, "epoch": 3017} {"train_loss": -12.706741333007812, "global_step": 506932, "epoch": 3017} {"train_loss": -12.625675201416016, "global_step": 506933, "epoch": 3017} {"train_loss": -12.363189697265625, "global_step": 506934, "epoch": 3017} {"train_loss": -12.97241497039795, "global_step": 506935, "epoch": 3017} {"train_loss": -12.404131889343262, "global_step": 506936, "epoch": 3017} {"train_loss": -12.869693756103516, "global_step": 506937, "epoch": 3017} {"train_loss": -12.43962287902832, "global_step": 506938, "epoch": 3017} {"train_loss": -12.641067504882812, "global_step": 506939, "epoch": 3017} {"train_loss": -12.875249862670898, "global_step": 506940, "epoch": 3017} {"train_loss": -12.801889419555664, "global_step": 506941, "epoch": 3017} {"train_loss": -12.763243675231934, "global_step": 506942, "epoch": 3017} {"train_loss": -12.795635223388672, "global_step": 506943, "epoch": 3017} {"train_loss": -12.839061737060547, "global_step": 506944, "epoch": 3017} {"train_loss": -12.767937660217285, "global_step": 506945, "epoch": 3017} {"train_loss": -12.895774841308594, "global_step": 506946, "epoch": 3017} {"train_loss": -12.637872695922852, "global_step": 506947, "epoch": 3017} {"train_loss": -12.598468780517578, "global_step": 506948, "epoch": 3017} {"train_loss": -13.032957077026367, "global_step": 506949, "epoch": 3017} {"train_loss": -12.73342514038086, "global_step": 506950, "epoch": 3017} {"train_loss": -12.888114929199219, "global_step": 506951, "epoch": 3017} {"train_loss": -12.769004821777344, "global_step": 506952, "epoch": 3017} {"train_loss": -12.706405639648438, "global_step": 506953, "epoch": 3017} {"train_loss": -12.743009567260742, "global_step": 506954, "epoch": 3017} {"train_loss": -12.900313377380371, "global_step": 506955, "epoch": 3017} {"train_loss": -12.71914291381836, "global_step": 506956, "epoch": 3017} {"train_loss": -12.903560638427734, "global_step": 506957, "epoch": 3017} {"train_loss": -12.86826229095459, "global_step": 506958, "epoch": 3017} {"train_loss": -12.712374687194824, "global_step": 506959, "epoch": 3017} {"train_loss": -12.943706512451172, "global_step": 506960, "epoch": 3017} {"train_loss": -12.579183578491211, "global_step": 506961, "epoch": 3017} {"train_loss": -12.729010581970215, "global_step": 506962, "epoch": 3017} {"train_loss": -12.501049041748047, "global_step": 506963, "epoch": 3017} {"train_loss": -12.486675262451172, "global_step": 506964, "epoch": 3017} {"train_loss": -12.697652816772461, "global_step": 506965, "epoch": 3017} {"train_loss": -12.00927734375, "global_step": 506966, "epoch": 3017} {"train_loss": -11.873779296875, "global_step": 506967, "epoch": 3017} {"train_loss": -12.489153861999512, "global_step": 506968, "epoch": 3017} {"train_loss": -12.728448867797852, "global_step": 506969, "epoch": 3017} {"train_loss": -10.938985824584961, "global_step": 506970, "epoch": 3017} {"train_loss": -12.504192352294922, "global_step": 506971, "epoch": 3017} {"train_loss": -12.569463729858398, "global_step": 506972, "epoch": 3017} {"train_loss": -12.23387336730957, "global_step": 506973, "epoch": 3017} {"train_loss": -12.884382247924805, "global_step": 506974, "epoch": 3017} {"train_loss": -12.82425308227539, "global_step": 506975, "epoch": 3017} {"train_loss": -12.484589576721191, "global_step": 506976, "epoch": 3017} {"train_loss": -13.033681869506836, "global_step": 506977, "epoch": 3017} {"train_loss": -13.001005172729492, "global_step": 506978, "epoch": 3017} {"train_loss": -12.913213729858398, "global_step": 506979, "epoch": 3017} {"train_loss": -12.938607215881348, "global_step": 506980, "epoch": 3017} {"train_loss": -12.946586608886719, "global_step": 506981, "epoch": 3017} {"train_loss": -12.869988441467285, "global_step": 506982, "epoch": 3017} {"train_loss": -12.712478637695312, "global_step": 506983, "epoch": 3017} {"train_loss": -13.012808799743652, "global_step": 506984, "epoch": 3017} {"train_loss": -13.086084365844727, "global_step": 506985, "epoch": 3017} {"train_loss": -12.846243858337402, "global_step": 506986, "epoch": 3017} {"train_loss": -12.729907989501953, "global_step": 506987, "epoch": 3017} {"train_loss": -13.000805854797363, "global_step": 506988, "epoch": 3017} {"train_loss": -12.59778881072998, "global_step": 506989, "epoch": 3017} {"train_loss": -12.708645820617676, "global_step": 506990, "epoch": 3017} {"train_loss": -12.792472839355469, "global_step": 506991, "epoch": 3017} {"train_loss": -12.832571029663086, "global_step": 506992, "epoch": 3017} {"train_loss": -12.746448516845703, "global_step": 506993, "epoch": 3017} {"train_loss": -12.710550308227539, "global_step": 506994, "epoch": 3017} {"train_loss": -12.80097770690918, "global_step": 506995, "epoch": 3017} {"train_loss": -12.919246673583984, "global_step": 506996, "epoch": 3017} {"train_loss": -12.880529403686523, "global_step": 506997, "epoch": 3017} {"train_loss": -12.588342666625977, "global_step": 506998, "epoch": 3017} {"train_loss": -12.32567310333252, "global_step": 506999, "epoch": 3017} {"train_loss": -12.501826286315918, "global_step": 507000, "epoch": 3017} {"train_loss": -10.8934907913208, "global_step": 507001, "epoch": 3017} {"train_loss": -11.094785690307617, "global_step": 507002, "epoch": 3017} {"train_loss": -10.269896507263184, "global_step": 507003, "epoch": 3017} {"train_loss": -11.894579887390137, "global_step": 507004, "epoch": 3017} {"train_loss": -9.774162292480469, "global_step": 507005, "epoch": 3017} {"train_loss": -10.200443267822266, "global_step": 507006, "epoch": 3017} {"train_loss": -10.68741512298584, "global_step": 507007, "epoch": 3017} {"train_loss": -10.48440933227539, "global_step": 507008, "epoch": 3017} {"train_loss": -11.0794095993042, "global_step": 507009, "epoch": 3017} {"train_loss": -9.819704055786133, "global_step": 507010, "epoch": 3017} {"train_loss": -11.427512168884277, "global_step": 507011, "epoch": 3017} {"train_loss": -11.177316665649414, "global_step": 507012, "epoch": 3017} {"train_loss": -10.315522193908691, "global_step": 507013, "epoch": 3017} {"train_loss": -12.123977661132812, "global_step": 507014, "epoch": 3017} {"train_loss": -9.985616683959961, "global_step": 507015, "epoch": 3017} {"train_loss": -10.712329864501953, "global_step": 507016, "epoch": 3017} {"train_loss": -9.688961029052734, "global_step": 507017, "epoch": 3017} {"train_loss": -9.845876693725586, "global_step": 507018, "epoch": 3017} {"train_loss": -9.603772163391113, "global_step": 507019, "epoch": 3017} {"train_loss": -10.355825424194336, "global_step": 507020, "epoch": 3017} {"train_loss": -10.03132438659668, "global_step": 507021, "epoch": 3017} {"train_loss": -10.856670379638672, "global_step": 507022, "epoch": 3017} {"train_loss": -12.182273671740578, "global_step": 507023, "epoch": 3017, "val_loss": 315842.0} {"train_loss": -10.524083137512207, "global_step": 507024, "epoch": 3018} {"train_loss": -10.217474937438965, "global_step": 507025, "epoch": 3018} {"train_loss": -10.93324089050293, "global_step": 507026, "epoch": 3018} {"train_loss": -11.10811996459961, "global_step": 507027, "epoch": 3018} {"train_loss": -11.382526397705078, "global_step": 507028, "epoch": 3018} {"train_loss": -11.584794998168945, "global_step": 507029, "epoch": 3018} {"train_loss": -10.849705696105957, "global_step": 507030, "epoch": 3018} {"train_loss": -11.488566398620605, "global_step": 507031, "epoch": 3018} {"train_loss": -10.901451110839844, "global_step": 507032, "epoch": 3018} {"train_loss": -11.615236282348633, "global_step": 507033, "epoch": 3018} {"train_loss": -11.34831428527832, "global_step": 507034, "epoch": 3018} {"train_loss": -12.157949447631836, "global_step": 507035, "epoch": 3018} {"train_loss": -11.717833518981934, "global_step": 507036, "epoch": 3018} {"train_loss": -12.117942810058594, "global_step": 507037, "epoch": 3018} {"train_loss": -12.08448314666748, "global_step": 507038, "epoch": 3018} {"train_loss": -12.272696495056152, "global_step": 507039, "epoch": 3018} {"train_loss": -12.06672477722168, "global_step": 507040, "epoch": 3018} {"train_loss": -12.199691772460938, "global_step": 507041, "epoch": 3018} {"train_loss": -12.3240966796875, "global_step": 507042, "epoch": 3018} {"train_loss": -12.091617584228516, "global_step": 507043, "epoch": 3018} {"train_loss": -12.099698066711426, "global_step": 507044, "epoch": 3018} {"train_loss": -12.296463966369629, "global_step": 507045, "epoch": 3018} {"train_loss": -12.565203666687012, "global_step": 507046, "epoch": 3018} {"train_loss": -12.194822311401367, "global_step": 507047, "epoch": 3018} {"train_loss": -12.304815292358398, "global_step": 507048, "epoch": 3018} {"train_loss": -12.472433090209961, "global_step": 507049, "epoch": 3018} {"train_loss": -12.464942932128906, "global_step": 507050, "epoch": 3018} {"train_loss": -12.636001586914062, "global_step": 507051, "epoch": 3018} {"train_loss": -12.320540428161621, "global_step": 507052, "epoch": 3018} {"train_loss": -12.706268310546875, "global_step": 507053, "epoch": 3018} {"train_loss": -12.4347562789917, "global_step": 507054, "epoch": 3018} {"train_loss": -12.491392135620117, "global_step": 507055, "epoch": 3018} {"train_loss": -12.21595573425293, "global_step": 507056, "epoch": 3018} {"train_loss": -12.63102912902832, "global_step": 507057, "epoch": 3018} {"train_loss": -12.122398376464844, "global_step": 507058, "epoch": 3018} {"train_loss": -12.35161304473877, "global_step": 507059, "epoch": 3018} {"train_loss": -11.742656707763672, "global_step": 507060, "epoch": 3018} {"train_loss": -12.350212097167969, "global_step": 507061, "epoch": 3018} {"train_loss": -12.282793998718262, "global_step": 507062, "epoch": 3018} {"train_loss": -12.359352111816406, "global_step": 507063, "epoch": 3018} {"train_loss": -12.146053314208984, "global_step": 507064, "epoch": 3018} {"train_loss": -12.634034156799316, "global_step": 507065, "epoch": 3018} {"train_loss": -12.374752044677734, "global_step": 507066, "epoch": 3018} {"train_loss": -12.22856330871582, "global_step": 507067, "epoch": 3018} {"train_loss": -12.495391845703125, "global_step": 507068, "epoch": 3018} {"train_loss": -12.072151184082031, "global_step": 507069, "epoch": 3018} {"train_loss": -12.36093521118164, "global_step": 507070, "epoch": 3018} {"train_loss": -12.089566230773926, "global_step": 507071, "epoch": 3018} {"train_loss": -12.208282470703125, "global_step": 507072, "epoch": 3018} {"train_loss": -11.918363571166992, "global_step": 507073, "epoch": 3018} {"train_loss": -12.66375732421875, "global_step": 507074, "epoch": 3018} {"train_loss": -11.970193862915039, "global_step": 507075, "epoch": 3018} {"train_loss": -12.40606689453125, "global_step": 507076, "epoch": 3018} {"train_loss": -12.70971393585205, "global_step": 507077, "epoch": 3018} {"train_loss": -12.255254745483398, "global_step": 507078, "epoch": 3018} {"train_loss": -12.662886619567871, "global_step": 507079, "epoch": 3018} {"train_loss": -12.35206127166748, "global_step": 507080, "epoch": 3018} {"train_loss": -12.561342239379883, "global_step": 507081, "epoch": 3018} {"train_loss": -12.626941680908203, "global_step": 507082, "epoch": 3018} {"train_loss": -12.540410995483398, "global_step": 507083, "epoch": 3018} {"train_loss": -12.438994407653809, "global_step": 507084, "epoch": 3018} {"train_loss": -12.691604614257812, "global_step": 507085, "epoch": 3018} {"train_loss": -12.514379501342773, "global_step": 507086, "epoch": 3018} {"train_loss": -12.337753295898438, "global_step": 507087, "epoch": 3018} {"train_loss": -12.665046691894531, "global_step": 507088, "epoch": 3018} {"train_loss": -11.773387908935547, "global_step": 507089, "epoch": 3018} {"train_loss": -12.542976379394531, "global_step": 507090, "epoch": 3018} {"train_loss": -11.963766098022461, "global_step": 507091, "epoch": 3018} {"train_loss": -12.216423034667969, "global_step": 507092, "epoch": 3018} {"train_loss": -12.419353485107422, "global_step": 507093, "epoch": 3018} {"train_loss": -12.4819917678833, "global_step": 507094, "epoch": 3018} {"train_loss": -12.089254379272461, "global_step": 507095, "epoch": 3018} {"train_loss": -12.558189392089844, "global_step": 507096, "epoch": 3018} {"train_loss": -11.82762622833252, "global_step": 507097, "epoch": 3018} {"train_loss": -12.575082778930664, "global_step": 507098, "epoch": 3018} {"train_loss": -12.507068634033203, "global_step": 507099, "epoch": 3018} {"train_loss": -12.348604202270508, "global_step": 507100, "epoch": 3018} {"train_loss": -11.543456077575684, "global_step": 507101, "epoch": 3018} {"train_loss": -12.662312507629395, "global_step": 507102, "epoch": 3018} {"train_loss": -11.971413612365723, "global_step": 507103, "epoch": 3018} {"train_loss": -11.835376739501953, "global_step": 507104, "epoch": 3018} {"train_loss": -12.448596954345703, "global_step": 507105, "epoch": 3018} {"train_loss": -12.004342079162598, "global_step": 507106, "epoch": 3018} {"train_loss": -12.142709732055664, "global_step": 507107, "epoch": 3018} {"train_loss": -12.774497985839844, "global_step": 507108, "epoch": 3018} {"train_loss": -12.001502990722656, "global_step": 507109, "epoch": 3018} {"train_loss": -11.898158073425293, "global_step": 507110, "epoch": 3018} {"train_loss": -12.547231674194336, "global_step": 507111, "epoch": 3018} {"train_loss": -11.561027526855469, "global_step": 507112, "epoch": 3018} {"train_loss": -12.356168746948242, "global_step": 507113, "epoch": 3018} {"train_loss": -10.840078353881836, "global_step": 507114, "epoch": 3018} {"train_loss": -12.511008262634277, "global_step": 507115, "epoch": 3018} {"train_loss": -11.216410636901855, "global_step": 507116, "epoch": 3018} {"train_loss": -11.471305847167969, "global_step": 507117, "epoch": 3018} {"train_loss": -12.2847900390625, "global_step": 507118, "epoch": 3018} {"train_loss": -11.046274185180664, "global_step": 507119, "epoch": 3018} {"train_loss": -11.192037582397461, "global_step": 507120, "epoch": 3018} {"train_loss": -11.092373847961426, "global_step": 507121, "epoch": 3018} {"train_loss": -10.346254348754883, "global_step": 507122, "epoch": 3018} {"train_loss": -10.154146194458008, "global_step": 507123, "epoch": 3018} {"train_loss": -11.322471618652344, "global_step": 507124, "epoch": 3018} {"train_loss": -11.282247543334961, "global_step": 507125, "epoch": 3018} {"train_loss": -11.23138427734375, "global_step": 507126, "epoch": 3018} {"train_loss": -11.58188247680664, "global_step": 507127, "epoch": 3018} {"train_loss": -11.827333450317383, "global_step": 507128, "epoch": 3018} {"train_loss": -11.866013526916504, "global_step": 507129, "epoch": 3018} {"train_loss": -12.094673156738281, "global_step": 507130, "epoch": 3018} {"train_loss": -12.024134635925293, "global_step": 507131, "epoch": 3018} {"train_loss": -12.37030029296875, "global_step": 507132, "epoch": 3018} {"train_loss": -12.129311561584473, "global_step": 507133, "epoch": 3018} {"train_loss": -12.341829299926758, "global_step": 507134, "epoch": 3018} {"train_loss": -12.044795989990234, "global_step": 507135, "epoch": 3018} {"train_loss": -12.833869934082031, "global_step": 507136, "epoch": 3018} {"train_loss": -12.292607307434082, "global_step": 507137, "epoch": 3018} {"train_loss": -12.20096206665039, "global_step": 507138, "epoch": 3018} {"train_loss": -12.612445831298828, "global_step": 507139, "epoch": 3018} {"train_loss": -12.26407527923584, "global_step": 507140, "epoch": 3018} {"train_loss": -12.673395156860352, "global_step": 507141, "epoch": 3018} {"train_loss": -12.096330642700195, "global_step": 507142, "epoch": 3018} {"train_loss": -12.472601890563965, "global_step": 507143, "epoch": 3018} {"train_loss": -12.194232940673828, "global_step": 507144, "epoch": 3018} {"train_loss": -12.300665855407715, "global_step": 507145, "epoch": 3018} {"train_loss": -12.410636901855469, "global_step": 507146, "epoch": 3018} {"train_loss": -12.336828231811523, "global_step": 507147, "epoch": 3018} {"train_loss": -12.590154647827148, "global_step": 507148, "epoch": 3018} {"train_loss": -12.549522399902344, "global_step": 507149, "epoch": 3018} {"train_loss": -12.78614330291748, "global_step": 507150, "epoch": 3018} {"train_loss": -12.529394149780273, "global_step": 507151, "epoch": 3018} {"train_loss": -12.81480598449707, "global_step": 507152, "epoch": 3018} {"train_loss": -12.50074577331543, "global_step": 507153, "epoch": 3018} {"train_loss": -12.542533874511719, "global_step": 507154, "epoch": 3018} {"train_loss": -12.964436531066895, "global_step": 507155, "epoch": 3018} {"train_loss": -12.662632942199707, "global_step": 507156, "epoch": 3018} {"train_loss": -12.708623886108398, "global_step": 507157, "epoch": 3018} {"train_loss": -12.791444778442383, "global_step": 507158, "epoch": 3018} {"train_loss": -12.652717590332031, "global_step": 507159, "epoch": 3018} {"train_loss": -12.785074234008789, "global_step": 507160, "epoch": 3018} {"train_loss": -12.582498550415039, "global_step": 507161, "epoch": 3018} {"train_loss": -12.79267406463623, "global_step": 507162, "epoch": 3018} {"train_loss": -12.546412467956543, "global_step": 507163, "epoch": 3018} {"train_loss": -13.065574645996094, "global_step": 507164, "epoch": 3018} {"train_loss": -12.541106224060059, "global_step": 507165, "epoch": 3018} {"train_loss": -12.81437873840332, "global_step": 507166, "epoch": 3018} {"train_loss": -12.947600364685059, "global_step": 507167, "epoch": 3018} {"train_loss": -12.69721508026123, "global_step": 507168, "epoch": 3018} {"train_loss": -12.692977905273438, "global_step": 507169, "epoch": 3018} {"train_loss": -12.623855590820312, "global_step": 507170, "epoch": 3018} {"train_loss": -12.751202583312988, "global_step": 507171, "epoch": 3018} {"train_loss": -12.754341125488281, "global_step": 507172, "epoch": 3018} {"train_loss": -12.699359893798828, "global_step": 507173, "epoch": 3018} {"train_loss": -12.777050018310547, "global_step": 507174, "epoch": 3018} {"train_loss": -12.593733787536621, "global_step": 507175, "epoch": 3018} {"train_loss": -12.451959609985352, "global_step": 507176, "epoch": 3018} {"train_loss": -12.366782188415527, "global_step": 507177, "epoch": 3018} {"train_loss": -12.728981018066406, "global_step": 507178, "epoch": 3018} {"train_loss": -12.044787406921387, "global_step": 507179, "epoch": 3018} {"train_loss": -11.901911735534668, "global_step": 507180, "epoch": 3018} {"train_loss": -12.706705093383789, "global_step": 507181, "epoch": 3018} {"train_loss": -12.134220123291016, "global_step": 507182, "epoch": 3018} {"train_loss": -12.050451278686523, "global_step": 507183, "epoch": 3018} {"train_loss": -12.773054122924805, "global_step": 507184, "epoch": 3018} {"train_loss": -12.672735214233398, "global_step": 507185, "epoch": 3018} {"train_loss": -12.527053833007812, "global_step": 507186, "epoch": 3018} {"train_loss": -12.759620666503906, "global_step": 507187, "epoch": 3018} {"train_loss": -12.518182754516602, "global_step": 507188, "epoch": 3018} {"train_loss": -12.569883346557617, "global_step": 507189, "epoch": 3018} {"train_loss": -12.564586639404297, "global_step": 507190, "epoch": 3018} {"train_loss": -12.209962515603928, "global_step": 507191, "epoch": 3018, "val_loss": 320207.15625} {"train_loss": -12.828045845031738, "global_step": 507192, "epoch": 3019} {"train_loss": -12.825260162353516, "global_step": 507193, "epoch": 3019} {"train_loss": -12.576225280761719, "global_step": 507194, "epoch": 3019} {"train_loss": -12.602958679199219, "global_step": 507195, "epoch": 3019} {"train_loss": -12.720802307128906, "global_step": 507196, "epoch": 3019} {"train_loss": -12.752900123596191, "global_step": 507197, "epoch": 3019} {"train_loss": -12.771891593933105, "global_step": 507198, "epoch": 3019} {"train_loss": -12.864886283874512, "global_step": 507199, "epoch": 3019} {"train_loss": -12.62946891784668, "global_step": 507200, "epoch": 3019} {"train_loss": -13.003400802612305, "global_step": 507201, "epoch": 3019} {"train_loss": -12.540493965148926, "global_step": 507202, "epoch": 3019} {"train_loss": -12.940613746643066, "global_step": 507203, "epoch": 3019} {"train_loss": -12.739802360534668, "global_step": 507204, "epoch": 3019} {"train_loss": -13.220521926879883, "global_step": 507205, "epoch": 3019} {"train_loss": -12.404590606689453, "global_step": 507206, "epoch": 3019} {"train_loss": -13.138422012329102, "global_step": 507207, "epoch": 3019} {"train_loss": -12.476284980773926, "global_step": 507208, "epoch": 3019} {"train_loss": -12.721050262451172, "global_step": 507209, "epoch": 3019} {"train_loss": -12.49966049194336, "global_step": 507210, "epoch": 3019} {"train_loss": -13.074077606201172, "global_step": 507211, "epoch": 3019} {"train_loss": -12.485614776611328, "global_step": 507212, "epoch": 3019} {"train_loss": -12.875334739685059, "global_step": 507213, "epoch": 3019} {"train_loss": -12.592931747436523, "global_step": 507214, "epoch": 3019} {"train_loss": -12.54075813293457, "global_step": 507215, "epoch": 3019} {"train_loss": -12.28358268737793, "global_step": 507216, "epoch": 3019} {"train_loss": -12.72186279296875, "global_step": 507217, "epoch": 3019} {"train_loss": -12.457633972167969, "global_step": 507218, "epoch": 3019} {"train_loss": -12.892253875732422, "global_step": 507219, "epoch": 3019} {"train_loss": -12.630035400390625, "global_step": 507220, "epoch": 3019} {"train_loss": -12.751534461975098, "global_step": 507221, "epoch": 3019} {"train_loss": -12.242015838623047, "global_step": 507222, "epoch": 3019} {"train_loss": -12.74966812133789, "global_step": 507223, "epoch": 3019} {"train_loss": -12.498285293579102, "global_step": 507224, "epoch": 3019} {"train_loss": -12.640462875366211, "global_step": 507225, "epoch": 3019} {"train_loss": -12.130670547485352, "global_step": 507226, "epoch": 3019} {"train_loss": -12.807770729064941, "global_step": 507227, "epoch": 3019} {"train_loss": -12.454754829406738, "global_step": 507228, "epoch": 3019} {"train_loss": -12.1368408203125, "global_step": 507229, "epoch": 3019} {"train_loss": -11.406023025512695, "global_step": 507230, "epoch": 3019} {"train_loss": -12.564010620117188, "global_step": 507231, "epoch": 3019} {"train_loss": -12.057209968566895, "global_step": 507232, "epoch": 3019} {"train_loss": -11.913081169128418, "global_step": 507233, "epoch": 3019} {"train_loss": -12.148670196533203, "global_step": 507234, "epoch": 3019} {"train_loss": -10.628087997436523, "global_step": 507235, "epoch": 3019} {"train_loss": -11.789576530456543, "global_step": 507236, "epoch": 3019} {"train_loss": -9.982732772827148, "global_step": 507237, "epoch": 3019} {"train_loss": -11.596246719360352, "global_step": 507238, "epoch": 3019} {"train_loss": -11.99832534790039, "global_step": 507239, "epoch": 3019} {"train_loss": -11.907859802246094, "global_step": 507240, "epoch": 3019} {"train_loss": -11.984964370727539, "global_step": 507241, "epoch": 3019} {"train_loss": -11.373268127441406, "global_step": 507242, "epoch": 3019} {"train_loss": -11.764225006103516, "global_step": 507243, "epoch": 3019} {"train_loss": -12.266357421875, "global_step": 507244, "epoch": 3019} {"train_loss": -12.388734817504883, "global_step": 507245, "epoch": 3019} {"train_loss": -12.609030723571777, "global_step": 507246, "epoch": 3019} {"train_loss": -12.478103637695312, "global_step": 507247, "epoch": 3019} {"train_loss": -12.100625991821289, "global_step": 507248, "epoch": 3019} {"train_loss": -12.365270614624023, "global_step": 507249, "epoch": 3019} {"train_loss": -12.193887710571289, "global_step": 507250, "epoch": 3019} {"train_loss": -11.812519073486328, "global_step": 507251, "epoch": 3019} {"train_loss": -12.618188858032227, "global_step": 507252, "epoch": 3019} {"train_loss": -12.677783966064453, "global_step": 507253, "epoch": 3019} {"train_loss": -12.469669342041016, "global_step": 507254, "epoch": 3019} {"train_loss": -12.272408485412598, "global_step": 507255, "epoch": 3019} {"train_loss": -12.659035682678223, "global_step": 507256, "epoch": 3019} {"train_loss": -12.643888473510742, "global_step": 507257, "epoch": 3019} {"train_loss": -11.973859786987305, "global_step": 507258, "epoch": 3019} {"train_loss": -12.39102554321289, "global_step": 507259, "epoch": 3019} {"train_loss": -12.632539749145508, "global_step": 507260, "epoch": 3019} {"train_loss": -12.026834487915039, "global_step": 507261, "epoch": 3019} {"train_loss": -11.654254913330078, "global_step": 507262, "epoch": 3019} {"train_loss": -12.431154251098633, "global_step": 507263, "epoch": 3019} {"train_loss": -12.19796371459961, "global_step": 507264, "epoch": 3019} {"train_loss": -12.468437194824219, "global_step": 507265, "epoch": 3019} {"train_loss": -12.1245756149292, "global_step": 507266, "epoch": 3019} {"train_loss": -12.567387580871582, "global_step": 507267, "epoch": 3019} {"train_loss": -12.256731986999512, "global_step": 507268, "epoch": 3019} {"train_loss": -11.928487777709961, "global_step": 507269, "epoch": 3019} {"train_loss": -12.656518936157227, "global_step": 507270, "epoch": 3019} {"train_loss": -11.490506172180176, "global_step": 507271, "epoch": 3019} {"train_loss": -12.640656471252441, "global_step": 507272, "epoch": 3019} {"train_loss": -11.580070495605469, "global_step": 507273, "epoch": 3019} {"train_loss": -11.618189811706543, "global_step": 507274, "epoch": 3019} {"train_loss": -12.403162002563477, "global_step": 507275, "epoch": 3019} {"train_loss": -11.663566589355469, "global_step": 507276, "epoch": 3019} {"train_loss": -12.36780071258545, "global_step": 507277, "epoch": 3019} {"train_loss": -12.072469711303711, "global_step": 507278, "epoch": 3019} {"train_loss": -12.346559524536133, "global_step": 507279, "epoch": 3019} {"train_loss": -12.132671356201172, "global_step": 507280, "epoch": 3019} {"train_loss": -12.400014877319336, "global_step": 507281, "epoch": 3019} {"train_loss": -12.308141708374023, "global_step": 507282, "epoch": 3019} {"train_loss": -11.99714469909668, "global_step": 507283, "epoch": 3019} {"train_loss": -12.027299880981445, "global_step": 507284, "epoch": 3019} {"train_loss": -11.179637908935547, "global_step": 507285, "epoch": 3019} {"train_loss": -12.160063743591309, "global_step": 507286, "epoch": 3019} {"train_loss": -11.611234664916992, "global_step": 507287, "epoch": 3019} {"train_loss": -11.438840866088867, "global_step": 507288, "epoch": 3019} {"train_loss": -11.257501602172852, "global_step": 507289, "epoch": 3019} {"train_loss": -12.276905059814453, "global_step": 507290, "epoch": 3019} {"train_loss": -10.843217849731445, "global_step": 507291, "epoch": 3019} {"train_loss": -11.928634643554688, "global_step": 507292, "epoch": 3019} {"train_loss": -10.024317741394043, "global_step": 507293, "epoch": 3019} {"train_loss": -11.05797004699707, "global_step": 507294, "epoch": 3019} {"train_loss": -11.92619514465332, "global_step": 507295, "epoch": 3019} {"train_loss": -11.933235168457031, "global_step": 507296, "epoch": 3019} {"train_loss": -11.616762161254883, "global_step": 507297, "epoch": 3019} {"train_loss": -11.965691566467285, "global_step": 507298, "epoch": 3019} {"train_loss": -12.294313430786133, "global_step": 507299, "epoch": 3019} {"train_loss": -12.2163724899292, "global_step": 507300, "epoch": 3019} {"train_loss": -12.698171615600586, "global_step": 507301, "epoch": 3019} {"train_loss": -12.069563865661621, "global_step": 507302, "epoch": 3019} {"train_loss": -12.754560470581055, "global_step": 507303, "epoch": 3019} {"train_loss": -12.448921203613281, "global_step": 507304, "epoch": 3019} {"train_loss": -12.373932838439941, "global_step": 507305, "epoch": 3019} {"train_loss": -12.518231391906738, "global_step": 507306, "epoch": 3019} {"train_loss": -12.189050674438477, "global_step": 507307, "epoch": 3019} {"train_loss": -12.594086647033691, "global_step": 507308, "epoch": 3019} {"train_loss": -12.637067794799805, "global_step": 507309, "epoch": 3019} {"train_loss": -12.673744201660156, "global_step": 507310, "epoch": 3019} {"train_loss": -12.61512279510498, "global_step": 507311, "epoch": 3019} {"train_loss": -12.487380027770996, "global_step": 507312, "epoch": 3019} {"train_loss": -12.196786880493164, "global_step": 507313, "epoch": 3019} {"train_loss": -12.704255104064941, "global_step": 507314, "epoch": 3019} {"train_loss": -12.387983322143555, "global_step": 507315, "epoch": 3019} {"train_loss": -12.43791389465332, "global_step": 507316, "epoch": 3019} {"train_loss": -12.72807502746582, "global_step": 507317, "epoch": 3019} {"train_loss": -12.757092475891113, "global_step": 507318, "epoch": 3019} {"train_loss": -12.49026870727539, "global_step": 507319, "epoch": 3019} {"train_loss": -12.356870651245117, "global_step": 507320, "epoch": 3019} {"train_loss": -12.602256774902344, "global_step": 507321, "epoch": 3019} {"train_loss": -12.547832489013672, "global_step": 507322, "epoch": 3019} {"train_loss": -12.545186996459961, "global_step": 507323, "epoch": 3019} {"train_loss": -12.756719589233398, "global_step": 507324, "epoch": 3019} {"train_loss": -12.726781845092773, "global_step": 507325, "epoch": 3019} {"train_loss": -12.57051944732666, "global_step": 507326, "epoch": 3019} {"train_loss": -12.888031005859375, "global_step": 507327, "epoch": 3019} {"train_loss": -12.529358863830566, "global_step": 507328, "epoch": 3019} {"train_loss": -12.694835662841797, "global_step": 507329, "epoch": 3019} {"train_loss": -12.889730453491211, "global_step": 507330, "epoch": 3019} {"train_loss": -12.463088989257812, "global_step": 507331, "epoch": 3019} {"train_loss": -12.54409408569336, "global_step": 507332, "epoch": 3019} {"train_loss": -12.763240814208984, "global_step": 507333, "epoch": 3019} {"train_loss": -12.292503356933594, "global_step": 507334, "epoch": 3019} {"train_loss": -12.22016716003418, "global_step": 507335, "epoch": 3019} {"train_loss": -12.522984504699707, "global_step": 507336, "epoch": 3019} {"train_loss": -12.492545127868652, "global_step": 507337, "epoch": 3019} {"train_loss": -12.683570861816406, "global_step": 507338, "epoch": 3019} {"train_loss": -12.57380485534668, "global_step": 507339, "epoch": 3019} {"train_loss": -12.362339973449707, "global_step": 507340, "epoch": 3019} {"train_loss": -12.694197654724121, "global_step": 507341, "epoch": 3019} {"train_loss": -12.108850479125977, "global_step": 507342, "epoch": 3019} {"train_loss": -12.707547187805176, "global_step": 507343, "epoch": 3019} {"train_loss": -12.50117301940918, "global_step": 507344, "epoch": 3019} {"train_loss": -12.524883270263672, "global_step": 507345, "epoch": 3019} {"train_loss": -12.73072338104248, "global_step": 507346, "epoch": 3019} {"train_loss": -11.988646507263184, "global_step": 507347, "epoch": 3019} {"train_loss": -12.353252410888672, "global_step": 507348, "epoch": 3019} {"train_loss": -11.60363483428955, "global_step": 507349, "epoch": 3019} {"train_loss": -9.597772598266602, "global_step": 507350, "epoch": 3019} {"train_loss": -10.847919464111328, "global_step": 507351, "epoch": 3019} {"train_loss": -9.2537841796875, "global_step": 507352, "epoch": 3019} {"train_loss": -11.712696075439453, "global_step": 507353, "epoch": 3019} {"train_loss": -10.189798355102539, "global_step": 507354, "epoch": 3019} {"train_loss": -10.333863258361816, "global_step": 507355, "epoch": 3019} {"train_loss": -10.07075309753418, "global_step": 507356, "epoch": 3019} {"train_loss": -8.442710876464844, "global_step": 507357, "epoch": 3019} {"train_loss": -8.814932823181152, "global_step": 507358, "epoch": 3019} {"train_loss": -12.166582368669056, "global_step": 507359, "epoch": 3019, "val_loss": 315952.8125} {"train_loss": -8.937810897827148, "global_step": 507360, "epoch": 3020} {"train_loss": -10.521015167236328, "global_step": 507361, "epoch": 3020} {"train_loss": -8.304950714111328, "global_step": 507362, "epoch": 3020} {"train_loss": -8.552833557128906, "global_step": 507363, "epoch": 3020} {"train_loss": -9.144941329956055, "global_step": 507364, "epoch": 3020} {"train_loss": -9.967367172241211, "global_step": 507365, "epoch": 3020} {"train_loss": -7.82748556137085, "global_step": 507366, "epoch": 3020} {"train_loss": -9.618904113769531, "global_step": 507367, "epoch": 3020} {"train_loss": -9.340208053588867, "global_step": 507368, "epoch": 3020} {"train_loss": -10.308311462402344, "global_step": 507369, "epoch": 3020} {"train_loss": -11.003250122070312, "global_step": 507370, "epoch": 3020} {"train_loss": -10.192890167236328, "global_step": 507371, "epoch": 3020} {"train_loss": -10.764602661132812, "global_step": 507372, "epoch": 3020} {"train_loss": -10.847601890563965, "global_step": 507373, "epoch": 3020} {"train_loss": -8.829190254211426, "global_step": 507374, "epoch": 3020} {"train_loss": -9.696685791015625, "global_step": 507375, "epoch": 3020} {"train_loss": -11.04983901977539, "global_step": 507376, "epoch": 3020} {"train_loss": -9.220065116882324, "global_step": 507377, "epoch": 3020} {"train_loss": -8.738605499267578, "global_step": 507378, "epoch": 3020} {"train_loss": -11.447900772094727, "global_step": 507379, "epoch": 3020} {"train_loss": -10.403118133544922, "global_step": 507380, "epoch": 3020} {"train_loss": -9.100164413452148, "global_step": 507381, "epoch": 3020} {"train_loss": -9.491934776306152, "global_step": 507382, "epoch": 3020} {"train_loss": -9.239280700683594, "global_step": 507383, "epoch": 3020} {"train_loss": -9.416437149047852, "global_step": 507384, "epoch": 3020} {"train_loss": -10.323983192443848, "global_step": 507385, "epoch": 3020} {"train_loss": -10.51278305053711, "global_step": 507386, "epoch": 3020} {"train_loss": -10.751077651977539, "global_step": 507387, "epoch": 3020} {"train_loss": -10.464438438415527, "global_step": 507388, "epoch": 3020} {"train_loss": -10.738195419311523, "global_step": 507389, "epoch": 3020} {"train_loss": -11.056392669677734, "global_step": 507390, "epoch": 3020} {"train_loss": -10.65608024597168, "global_step": 507391, "epoch": 3020} {"train_loss": -10.751998901367188, "global_step": 507392, "epoch": 3020} {"train_loss": -11.897720336914062, "global_step": 507393, "epoch": 3020} {"train_loss": -11.30123519897461, "global_step": 507394, "epoch": 3020} {"train_loss": -11.338809967041016, "global_step": 507395, "epoch": 3020} {"train_loss": -11.76630687713623, "global_step": 507396, "epoch": 3020} {"train_loss": -11.541484832763672, "global_step": 507397, "epoch": 3020} {"train_loss": -11.700191497802734, "global_step": 507398, "epoch": 3020} {"train_loss": -11.92673110961914, "global_step": 507399, "epoch": 3020} {"train_loss": -11.768638610839844, "global_step": 507400, "epoch": 3020} {"train_loss": -12.07308292388916, "global_step": 507401, "epoch": 3020} {"train_loss": -12.168596267700195, "global_step": 507402, "epoch": 3020} {"train_loss": -12.342708587646484, "global_step": 507403, "epoch": 3020} {"train_loss": -12.03945541381836, "global_step": 507404, "epoch": 3020} {"train_loss": -12.191280364990234, "global_step": 507405, "epoch": 3020} {"train_loss": -12.454192161560059, "global_step": 507406, "epoch": 3020} {"train_loss": -12.215105056762695, "global_step": 507407, "epoch": 3020} {"train_loss": -12.355527877807617, "global_step": 507408, "epoch": 3020} {"train_loss": -12.507506370544434, "global_step": 507409, "epoch": 3020} {"train_loss": -12.46090316772461, "global_step": 507410, "epoch": 3020} {"train_loss": -12.509703636169434, "global_step": 507411, "epoch": 3020} {"train_loss": -12.323251724243164, "global_step": 507412, "epoch": 3020} {"train_loss": -12.543526649475098, "global_step": 507413, "epoch": 3020} {"train_loss": -12.23282527923584, "global_step": 507414, "epoch": 3020} {"train_loss": -12.410682678222656, "global_step": 507415, "epoch": 3020} {"train_loss": -12.300056457519531, "global_step": 507416, "epoch": 3020} {"train_loss": -12.686175346374512, "global_step": 507417, "epoch": 3020} {"train_loss": -12.53552532196045, "global_step": 507418, "epoch": 3020} {"train_loss": -12.450456619262695, "global_step": 507419, "epoch": 3020} {"train_loss": -12.56289291381836, "global_step": 507420, "epoch": 3020} {"train_loss": -12.394742012023926, "global_step": 507421, "epoch": 3020} {"train_loss": -12.532258987426758, "global_step": 507422, "epoch": 3020} {"train_loss": -12.382800102233887, "global_step": 507423, "epoch": 3020} {"train_loss": -12.642956733703613, "global_step": 507424, "epoch": 3020} {"train_loss": -12.446081161499023, "global_step": 507425, "epoch": 3020} {"train_loss": -12.589365005493164, "global_step": 507426, "epoch": 3020} {"train_loss": -12.669183731079102, "global_step": 507427, "epoch": 3020} {"train_loss": -12.604972839355469, "global_step": 507428, "epoch": 3020} {"train_loss": -12.644278526306152, "global_step": 507429, "epoch": 3020} {"train_loss": -12.718873977661133, "global_step": 507430, "epoch": 3020} {"train_loss": -12.578643798828125, "global_step": 507431, "epoch": 3020} {"train_loss": -12.796117782592773, "global_step": 507432, "epoch": 3020} {"train_loss": -12.545957565307617, "global_step": 507433, "epoch": 3020} {"train_loss": -12.547000885009766, "global_step": 507434, "epoch": 3020} {"train_loss": -12.864753723144531, "global_step": 507435, "epoch": 3020} {"train_loss": -12.674690246582031, "global_step": 507436, "epoch": 3020} {"train_loss": -12.689810752868652, "global_step": 507437, "epoch": 3020} {"train_loss": -12.74191665649414, "global_step": 507438, "epoch": 3020} {"train_loss": -12.657791137695312, "global_step": 507439, "epoch": 3020} {"train_loss": -12.76085376739502, "global_step": 507440, "epoch": 3020} {"train_loss": -12.922077178955078, "global_step": 507441, "epoch": 3020} {"train_loss": -12.813858032226562, "global_step": 507442, "epoch": 3020} {"train_loss": -12.674158096313477, "global_step": 507443, "epoch": 3020} {"train_loss": -12.908058166503906, "global_step": 507444, "epoch": 3020} {"train_loss": -12.846332550048828, "global_step": 507445, "epoch": 3020} {"train_loss": -12.909688949584961, "global_step": 507446, "epoch": 3020} {"train_loss": -12.753990173339844, "global_step": 507447, "epoch": 3020} {"train_loss": -12.81381607055664, "global_step": 507448, "epoch": 3020} {"train_loss": -12.843118667602539, "global_step": 507449, "epoch": 3020} {"train_loss": -12.965826034545898, "global_step": 507450, "epoch": 3020} {"train_loss": -12.810397148132324, "global_step": 507451, "epoch": 3020} {"train_loss": -13.034976959228516, "global_step": 507452, "epoch": 3020} {"train_loss": -12.877273559570312, "global_step": 507453, "epoch": 3020} {"train_loss": -12.820653915405273, "global_step": 507454, "epoch": 3020} {"train_loss": -12.752750396728516, "global_step": 507455, "epoch": 3020} {"train_loss": -12.758386611938477, "global_step": 507456, "epoch": 3020} {"train_loss": -13.087478637695312, "global_step": 507457, "epoch": 3020} {"train_loss": -12.80434513092041, "global_step": 507458, "epoch": 3020} {"train_loss": -12.90072250366211, "global_step": 507459, "epoch": 3020} {"train_loss": -13.128911972045898, "global_step": 507460, "epoch": 3020} {"train_loss": -13.12882137298584, "global_step": 507461, "epoch": 3020} {"train_loss": -13.023553848266602, "global_step": 507462, "epoch": 3020} {"train_loss": -13.047441482543945, "global_step": 507463, "epoch": 3020} {"train_loss": -12.894641876220703, "global_step": 507464, "epoch": 3020} {"train_loss": -12.9999418258667, "global_step": 507465, "epoch": 3020} {"train_loss": -12.997800827026367, "global_step": 507466, "epoch": 3020} {"train_loss": -13.035018920898438, "global_step": 507467, "epoch": 3020} {"train_loss": -12.822383880615234, "global_step": 507468, "epoch": 3020} {"train_loss": -13.074176788330078, "global_step": 507469, "epoch": 3020} {"train_loss": -12.873031616210938, "global_step": 507470, "epoch": 3020} {"train_loss": -13.154752731323242, "global_step": 507471, "epoch": 3020} {"train_loss": -13.019328117370605, "global_step": 507472, "epoch": 3020} {"train_loss": -12.945116996765137, "global_step": 507473, "epoch": 3020} {"train_loss": -12.978748321533203, "global_step": 507474, "epoch": 3020} {"train_loss": -13.101550102233887, "global_step": 507475, "epoch": 3020} {"train_loss": -13.139747619628906, "global_step": 507476, "epoch": 3020} {"train_loss": -13.058141708374023, "global_step": 507477, "epoch": 3020} {"train_loss": -13.034398078918457, "global_step": 507478, "epoch": 3020} {"train_loss": -13.134502410888672, "global_step": 507479, "epoch": 3020} {"train_loss": -13.15827465057373, "global_step": 507480, "epoch": 3020} {"train_loss": -13.105716705322266, "global_step": 507481, "epoch": 3020} {"train_loss": -12.911310195922852, "global_step": 507482, "epoch": 3020} {"train_loss": -13.140585899353027, "global_step": 507483, "epoch": 3020} {"train_loss": -13.041510581970215, "global_step": 507484, "epoch": 3020} {"train_loss": -13.174689292907715, "global_step": 507485, "epoch": 3020} {"train_loss": -12.870170593261719, "global_step": 507486, "epoch": 3020} {"train_loss": -12.908855438232422, "global_step": 507487, "epoch": 3020} {"train_loss": -13.084787368774414, "global_step": 507488, "epoch": 3020} {"train_loss": -12.975448608398438, "global_step": 507489, "epoch": 3020} {"train_loss": -12.705583572387695, "global_step": 507490, "epoch": 3020} {"train_loss": -12.739394187927246, "global_step": 507491, "epoch": 3020} {"train_loss": -12.811548233032227, "global_step": 507492, "epoch": 3020} {"train_loss": -13.064153671264648, "global_step": 507493, "epoch": 3020} {"train_loss": -13.001453399658203, "global_step": 507494, "epoch": 3020} {"train_loss": -12.934820175170898, "global_step": 507495, "epoch": 3020} {"train_loss": -12.860250473022461, "global_step": 507496, "epoch": 3020} {"train_loss": -12.909622192382812, "global_step": 507497, "epoch": 3020} {"train_loss": -12.857732772827148, "global_step": 507498, "epoch": 3020} {"train_loss": -12.906511306762695, "global_step": 507499, "epoch": 3020} {"train_loss": -13.161001205444336, "global_step": 507500, "epoch": 3020} {"train_loss": -13.008659362792969, "global_step": 507501, "epoch": 3020} {"train_loss": -12.918686866760254, "global_step": 507502, "epoch": 3020} {"train_loss": -13.242748260498047, "global_step": 507503, "epoch": 3020} {"train_loss": -12.746709823608398, "global_step": 507504, "epoch": 3020} {"train_loss": -12.804384231567383, "global_step": 507505, "epoch": 3020} {"train_loss": -12.304620742797852, "global_step": 507506, "epoch": 3020} {"train_loss": -11.270343780517578, "global_step": 507507, "epoch": 3020} {"train_loss": -12.522859573364258, "global_step": 507508, "epoch": 3020} {"train_loss": -12.913844108581543, "global_step": 507509, "epoch": 3020} {"train_loss": -12.747386932373047, "global_step": 507510, "epoch": 3020} {"train_loss": -12.459372520446777, "global_step": 507511, "epoch": 3020} {"train_loss": -11.833198547363281, "global_step": 507512, "epoch": 3020} {"train_loss": -10.96582317352295, "global_step": 507513, "epoch": 3020} {"train_loss": -11.028387069702148, "global_step": 507514, "epoch": 3020} {"train_loss": -12.32292652130127, "global_step": 507515, "epoch": 3020} {"train_loss": -12.82390022277832, "global_step": 507516, "epoch": 3020} {"train_loss": -12.226740837097168, "global_step": 507517, "epoch": 3020} {"train_loss": -10.955840110778809, "global_step": 507518, "epoch": 3020} {"train_loss": -10.20407485961914, "global_step": 507519, "epoch": 3020} {"train_loss": -12.237371444702148, "global_step": 507520, "epoch": 3020} {"train_loss": -10.274568557739258, "global_step": 507521, "epoch": 3020} {"train_loss": -10.380023002624512, "global_step": 507522, "epoch": 3020} {"train_loss": -8.114034652709961, "global_step": 507523, "epoch": 3020} {"train_loss": -10.761492729187012, "global_step": 507524, "epoch": 3020} {"train_loss": -8.943132400512695, "global_step": 507525, "epoch": 3020} {"train_loss": -11.522745132446289, "global_step": 507526, "epoch": 3020} {"train_loss": -11.974437154474712, "global_step": 507527, "epoch": 3020, "val_loss": 318987.75, "train_action_mse_error": 2.008497714996338} {"train_loss": -10.545171737670898, "global_step": 507528, "epoch": 3021} {"train_loss": -12.076435089111328, "global_step": 507529, "epoch": 3021} {"train_loss": -11.20155143737793, "global_step": 507530, "epoch": 3021} {"train_loss": -10.80624008178711, "global_step": 507531, "epoch": 3021} {"train_loss": -11.481592178344727, "global_step": 507532, "epoch": 3021} {"train_loss": -11.363546371459961, "global_step": 507533, "epoch": 3021} {"train_loss": -11.488861083984375, "global_step": 507534, "epoch": 3021} {"train_loss": -10.956144332885742, "global_step": 507535, "epoch": 3021} {"train_loss": -11.767393112182617, "global_step": 507536, "epoch": 3021} {"train_loss": -11.996940612792969, "global_step": 507537, "epoch": 3021} {"train_loss": -11.428691864013672, "global_step": 507538, "epoch": 3021} {"train_loss": -12.208199501037598, "global_step": 507539, "epoch": 3021} {"train_loss": -11.674077987670898, "global_step": 507540, "epoch": 3021} {"train_loss": -12.253438949584961, "global_step": 507541, "epoch": 3021} {"train_loss": -12.256511688232422, "global_step": 507542, "epoch": 3021} {"train_loss": -12.377574920654297, "global_step": 507543, "epoch": 3021} {"train_loss": -12.371198654174805, "global_step": 507544, "epoch": 3021} {"train_loss": -12.560562133789062, "global_step": 507545, "epoch": 3021} {"train_loss": -12.484827041625977, "global_step": 507546, "epoch": 3021} {"train_loss": -12.043456077575684, "global_step": 507547, "epoch": 3021} {"train_loss": -12.232771873474121, "global_step": 507548, "epoch": 3021} {"train_loss": -12.68560791015625, "global_step": 507549, "epoch": 3021} {"train_loss": -12.455587387084961, "global_step": 507550, "epoch": 3021} {"train_loss": -12.69025993347168, "global_step": 507551, "epoch": 3021} {"train_loss": -12.73103141784668, "global_step": 507552, "epoch": 3021} {"train_loss": -12.339767456054688, "global_step": 507553, "epoch": 3021} {"train_loss": -12.120156288146973, "global_step": 507554, "epoch": 3021} {"train_loss": -12.0411958694458, "global_step": 507555, "epoch": 3021} {"train_loss": -12.46866226196289, "global_step": 507556, "epoch": 3021} {"train_loss": -11.70544147491455, "global_step": 507557, "epoch": 3021} {"train_loss": -12.357534408569336, "global_step": 507558, "epoch": 3021} {"train_loss": -12.501884460449219, "global_step": 507559, "epoch": 3021} {"train_loss": -12.501594543457031, "global_step": 507560, "epoch": 3021} {"train_loss": -12.707408905029297, "global_step": 507561, "epoch": 3021} {"train_loss": -12.61184310913086, "global_step": 507562, "epoch": 3021} {"train_loss": -12.30163860321045, "global_step": 507563, "epoch": 3021} {"train_loss": -12.845821380615234, "global_step": 507564, "epoch": 3021} {"train_loss": -12.66412353515625, "global_step": 507565, "epoch": 3021} {"train_loss": -12.709726333618164, "global_step": 507566, "epoch": 3021} {"train_loss": -12.800904273986816, "global_step": 507567, "epoch": 3021} {"train_loss": -12.407035827636719, "global_step": 507568, "epoch": 3021} {"train_loss": -12.73615837097168, "global_step": 507569, "epoch": 3021} {"train_loss": -12.620467185974121, "global_step": 507570, "epoch": 3021} {"train_loss": -12.478655815124512, "global_step": 507571, "epoch": 3021} {"train_loss": -12.914280891418457, "global_step": 507572, "epoch": 3021} {"train_loss": -12.543020248413086, "global_step": 507573, "epoch": 3021} {"train_loss": -12.963096618652344, "global_step": 507574, "epoch": 3021} {"train_loss": -12.300853729248047, "global_step": 507575, "epoch": 3021} {"train_loss": -12.288837432861328, "global_step": 507576, "epoch": 3021} {"train_loss": -12.544012069702148, "global_step": 507577, "epoch": 3021} {"train_loss": -12.286661148071289, "global_step": 507578, "epoch": 3021} {"train_loss": -10.677111625671387, "global_step": 507579, "epoch": 3021} {"train_loss": -12.797643661499023, "global_step": 507580, "epoch": 3021} {"train_loss": -11.711990356445312, "global_step": 507581, "epoch": 3021} {"train_loss": -12.61757755279541, "global_step": 507582, "epoch": 3021} {"train_loss": -11.141231536865234, "global_step": 507583, "epoch": 3021} {"train_loss": -12.61471939086914, "global_step": 507584, "epoch": 3021} {"train_loss": -11.108034133911133, "global_step": 507585, "epoch": 3021} {"train_loss": -12.159969329833984, "global_step": 507586, "epoch": 3021} {"train_loss": -12.124969482421875, "global_step": 507587, "epoch": 3021} {"train_loss": -11.889127731323242, "global_step": 507588, "epoch": 3021} {"train_loss": -12.094627380371094, "global_step": 507589, "epoch": 3021} {"train_loss": -11.194804191589355, "global_step": 507590, "epoch": 3021} {"train_loss": -10.768299102783203, "global_step": 507591, "epoch": 3021} {"train_loss": -10.60984992980957, "global_step": 507592, "epoch": 3021} {"train_loss": -10.932186126708984, "global_step": 507593, "epoch": 3021} {"train_loss": -11.130182266235352, "global_step": 507594, "epoch": 3021} {"train_loss": -11.851716041564941, "global_step": 507595, "epoch": 3021} {"train_loss": -11.323690414428711, "global_step": 507596, "epoch": 3021} {"train_loss": -11.526349067687988, "global_step": 507597, "epoch": 3021} {"train_loss": -10.92002010345459, "global_step": 507598, "epoch": 3021} {"train_loss": -11.941953659057617, "global_step": 507599, "epoch": 3021} {"train_loss": -11.555397033691406, "global_step": 507600, "epoch": 3021} {"train_loss": -10.901182174682617, "global_step": 507601, "epoch": 3021} {"train_loss": -12.208246231079102, "global_step": 507602, "epoch": 3021} {"train_loss": -11.40013313293457, "global_step": 507603, "epoch": 3021} {"train_loss": -11.098535537719727, "global_step": 507604, "epoch": 3021} {"train_loss": -12.450164794921875, "global_step": 507605, "epoch": 3021} {"train_loss": -11.297718048095703, "global_step": 507606, "epoch": 3021} {"train_loss": -12.422574043273926, "global_step": 507607, "epoch": 3021} {"train_loss": -11.13658332824707, "global_step": 507608, "epoch": 3021} {"train_loss": -12.223760604858398, "global_step": 507609, "epoch": 3021} {"train_loss": -11.962305068969727, "global_step": 507610, "epoch": 3021} {"train_loss": -11.646883010864258, "global_step": 507611, "epoch": 3021} {"train_loss": -12.49061393737793, "global_step": 507612, "epoch": 3021} {"train_loss": -11.862364768981934, "global_step": 507613, "epoch": 3021} {"train_loss": -11.614166259765625, "global_step": 507614, "epoch": 3021} {"train_loss": -11.89516544342041, "global_step": 507615, "epoch": 3021} {"train_loss": -11.437024116516113, "global_step": 507616, "epoch": 3021} {"train_loss": -11.278127670288086, "global_step": 507617, "epoch": 3021} {"train_loss": -11.85786247253418, "global_step": 507618, "epoch": 3021} {"train_loss": -12.00586223602295, "global_step": 507619, "epoch": 3021} {"train_loss": -11.876978874206543, "global_step": 507620, "epoch": 3021} {"train_loss": -12.131935119628906, "global_step": 507621, "epoch": 3021} {"train_loss": -11.759331703186035, "global_step": 507622, "epoch": 3021} {"train_loss": -12.431395530700684, "global_step": 507623, "epoch": 3021} {"train_loss": -12.317691802978516, "global_step": 507624, "epoch": 3021} {"train_loss": -12.57353401184082, "global_step": 507625, "epoch": 3021} {"train_loss": -12.21239948272705, "global_step": 507626, "epoch": 3021} {"train_loss": -11.996177673339844, "global_step": 507627, "epoch": 3021} {"train_loss": -12.669999122619629, "global_step": 507628, "epoch": 3021} {"train_loss": -11.877370834350586, "global_step": 507629, "epoch": 3021} {"train_loss": -12.151975631713867, "global_step": 507630, "epoch": 3021} {"train_loss": -12.05488395690918, "global_step": 507631, "epoch": 3021} {"train_loss": -12.249199867248535, "global_step": 507632, "epoch": 3021} {"train_loss": -12.40495491027832, "global_step": 507633, "epoch": 3021} {"train_loss": -12.015145301818848, "global_step": 507634, "epoch": 3021} {"train_loss": -12.309515953063965, "global_step": 507635, "epoch": 3021} {"train_loss": -12.662191390991211, "global_step": 507636, "epoch": 3021} {"train_loss": -12.09623908996582, "global_step": 507637, "epoch": 3021} {"train_loss": -12.694079399108887, "global_step": 507638, "epoch": 3021} {"train_loss": -12.456583976745605, "global_step": 507639, "epoch": 3021} {"train_loss": -12.537211418151855, "global_step": 507640, "epoch": 3021} {"train_loss": -12.837152481079102, "global_step": 507641, "epoch": 3021} {"train_loss": -12.535581588745117, "global_step": 507642, "epoch": 3021} {"train_loss": -12.571240425109863, "global_step": 507643, "epoch": 3021} {"train_loss": -12.766339302062988, "global_step": 507644, "epoch": 3021} {"train_loss": -12.587469100952148, "global_step": 507645, "epoch": 3021} {"train_loss": -12.718679428100586, "global_step": 507646, "epoch": 3021} {"train_loss": -12.787320137023926, "global_step": 507647, "epoch": 3021} {"train_loss": -12.873008728027344, "global_step": 507648, "epoch": 3021} {"train_loss": -12.854230880737305, "global_step": 507649, "epoch": 3021} {"train_loss": -12.936702728271484, "global_step": 507650, "epoch": 3021} {"train_loss": -12.720247268676758, "global_step": 507651, "epoch": 3021} {"train_loss": -12.703429222106934, "global_step": 507652, "epoch": 3021} {"train_loss": -12.957561492919922, "global_step": 507653, "epoch": 3021} {"train_loss": -12.722871780395508, "global_step": 507654, "epoch": 3021} {"train_loss": -12.727699279785156, "global_step": 507655, "epoch": 3021} {"train_loss": -12.895273208618164, "global_step": 507656, "epoch": 3021} {"train_loss": -12.638607025146484, "global_step": 507657, "epoch": 3021} {"train_loss": -12.347332000732422, "global_step": 507658, "epoch": 3021} {"train_loss": -12.607994079589844, "global_step": 507659, "epoch": 3021} {"train_loss": -12.688913345336914, "global_step": 507660, "epoch": 3021} {"train_loss": -12.623064041137695, "global_step": 507661, "epoch": 3021} {"train_loss": -12.87248420715332, "global_step": 507662, "epoch": 3021} {"train_loss": -12.678241729736328, "global_step": 507663, "epoch": 3021} {"train_loss": -12.78997802734375, "global_step": 507664, "epoch": 3021} {"train_loss": -12.386754035949707, "global_step": 507665, "epoch": 3021} {"train_loss": -12.977354049682617, "global_step": 507666, "epoch": 3021} {"train_loss": -12.579557418823242, "global_step": 507667, "epoch": 3021} {"train_loss": -12.801626205444336, "global_step": 507668, "epoch": 3021} {"train_loss": -12.763253211975098, "global_step": 507669, "epoch": 3021} {"train_loss": -12.6021728515625, "global_step": 507670, "epoch": 3021} {"train_loss": -12.704057693481445, "global_step": 507671, "epoch": 3021} {"train_loss": -12.479589462280273, "global_step": 507672, "epoch": 3021} {"train_loss": -12.054646492004395, "global_step": 507673, "epoch": 3021} {"train_loss": -12.834300994873047, "global_step": 507674, "epoch": 3021} {"train_loss": -12.28802490234375, "global_step": 507675, "epoch": 3021} {"train_loss": -12.820419311523438, "global_step": 507676, "epoch": 3021} {"train_loss": -12.39401626586914, "global_step": 507677, "epoch": 3021} {"train_loss": -12.601076126098633, "global_step": 507678, "epoch": 3021} {"train_loss": -12.703425407409668, "global_step": 507679, "epoch": 3021} {"train_loss": -12.327398300170898, "global_step": 507680, "epoch": 3021} {"train_loss": -11.762921333312988, "global_step": 507681, "epoch": 3021} {"train_loss": -12.681294441223145, "global_step": 507682, "epoch": 3021} {"train_loss": -12.282913208007812, "global_step": 507683, "epoch": 3021} {"train_loss": -12.76569652557373, "global_step": 507684, "epoch": 3021} {"train_loss": -12.461204528808594, "global_step": 507685, "epoch": 3021} {"train_loss": -11.422988891601562, "global_step": 507686, "epoch": 3021} {"train_loss": -11.252304077148438, "global_step": 507687, "epoch": 3021} {"train_loss": -12.114316940307617, "global_step": 507688, "epoch": 3021} {"train_loss": -11.856571197509766, "global_step": 507689, "epoch": 3021} {"train_loss": -12.258713722229004, "global_step": 507690, "epoch": 3021} {"train_loss": -12.295183181762695, "global_step": 507691, "epoch": 3021} {"train_loss": -11.907622337341309, "global_step": 507692, "epoch": 3021} {"train_loss": -11.709298133850098, "global_step": 507693, "epoch": 3021} {"train_loss": -11.658355712890625, "global_step": 507694, "epoch": 3021} {"train_loss": -12.176131140618097, "global_step": 507695, "epoch": 3021, "val_loss": 320857.1875} {"train_loss": -10.717090606689453, "global_step": 507696, "epoch": 3022} {"train_loss": -11.717020034790039, "global_step": 507697, "epoch": 3022} {"train_loss": -11.615594863891602, "global_step": 507698, "epoch": 3022} {"train_loss": -10.91727352142334, "global_step": 507699, "epoch": 3022} {"train_loss": -12.544719696044922, "global_step": 507700, "epoch": 3022} {"train_loss": -11.476079940795898, "global_step": 507701, "epoch": 3022} {"train_loss": -12.179311752319336, "global_step": 507702, "epoch": 3022} {"train_loss": -11.646127700805664, "global_step": 507703, "epoch": 3022} {"train_loss": -11.414097785949707, "global_step": 507704, "epoch": 3022} {"train_loss": -11.193267822265625, "global_step": 507705, "epoch": 3022} {"train_loss": -10.793838500976562, "global_step": 507706, "epoch": 3022} {"train_loss": -12.395772933959961, "global_step": 507707, "epoch": 3022} {"train_loss": -11.5557861328125, "global_step": 507708, "epoch": 3022} {"train_loss": -12.501289367675781, "global_step": 507709, "epoch": 3022} {"train_loss": -11.670547485351562, "global_step": 507710, "epoch": 3022} {"train_loss": -12.066909790039062, "global_step": 507711, "epoch": 3022} {"train_loss": -11.8580322265625, "global_step": 507712, "epoch": 3022} {"train_loss": -12.312251091003418, "global_step": 507713, "epoch": 3022} {"train_loss": -11.925799369812012, "global_step": 507714, "epoch": 3022} {"train_loss": -11.280037879943848, "global_step": 507715, "epoch": 3022} {"train_loss": -11.924683570861816, "global_step": 507716, "epoch": 3022} {"train_loss": -11.46185302734375, "global_step": 507717, "epoch": 3022} {"train_loss": -11.695021629333496, "global_step": 507718, "epoch": 3022} {"train_loss": -11.720096588134766, "global_step": 507719, "epoch": 3022} {"train_loss": -11.622278213500977, "global_step": 507720, "epoch": 3022} {"train_loss": -12.362363815307617, "global_step": 507721, "epoch": 3022} {"train_loss": -11.795469284057617, "global_step": 507722, "epoch": 3022} {"train_loss": -12.025985717773438, "global_step": 507723, "epoch": 3022} {"train_loss": -11.51000690460205, "global_step": 507724, "epoch": 3022} {"train_loss": -12.511039733886719, "global_step": 507725, "epoch": 3022} {"train_loss": -11.548787117004395, "global_step": 507726, "epoch": 3022} {"train_loss": -11.600826263427734, "global_step": 507727, "epoch": 3022} {"train_loss": -12.283190727233887, "global_step": 507728, "epoch": 3022} {"train_loss": -11.939401626586914, "global_step": 507729, "epoch": 3022} {"train_loss": -12.19615364074707, "global_step": 507730, "epoch": 3022} {"train_loss": -11.931129455566406, "global_step": 507731, "epoch": 3022} {"train_loss": -12.283294677734375, "global_step": 507732, "epoch": 3022} {"train_loss": -12.403369903564453, "global_step": 507733, "epoch": 3022} {"train_loss": -12.206188201904297, "global_step": 507734, "epoch": 3022} {"train_loss": -12.458710670471191, "global_step": 507735, "epoch": 3022} {"train_loss": -11.924203872680664, "global_step": 507736, "epoch": 3022} {"train_loss": -12.444391250610352, "global_step": 507737, "epoch": 3022} {"train_loss": -12.100288391113281, "global_step": 507738, "epoch": 3022} {"train_loss": -12.332619667053223, "global_step": 507739, "epoch": 3022} {"train_loss": -12.253700256347656, "global_step": 507740, "epoch": 3022} {"train_loss": -12.534662246704102, "global_step": 507741, "epoch": 3022} {"train_loss": -12.388941764831543, "global_step": 507742, "epoch": 3022} {"train_loss": -12.611120223999023, "global_step": 507743, "epoch": 3022} {"train_loss": -12.434449195861816, "global_step": 507744, "epoch": 3022} {"train_loss": -12.41915512084961, "global_step": 507745, "epoch": 3022} {"train_loss": -12.496387481689453, "global_step": 507746, "epoch": 3022} {"train_loss": -12.62065315246582, "global_step": 507747, "epoch": 3022} {"train_loss": -12.54224967956543, "global_step": 507748, "epoch": 3022} {"train_loss": -12.627630233764648, "global_step": 507749, "epoch": 3022} {"train_loss": -12.366561889648438, "global_step": 507750, "epoch": 3022} {"train_loss": -12.809911727905273, "global_step": 507751, "epoch": 3022} {"train_loss": -12.467175483703613, "global_step": 507752, "epoch": 3022} {"train_loss": -12.24612808227539, "global_step": 507753, "epoch": 3022} {"train_loss": -12.794004440307617, "global_step": 507754, "epoch": 3022} {"train_loss": -12.413176536560059, "global_step": 507755, "epoch": 3022} {"train_loss": -12.227394104003906, "global_step": 507756, "epoch": 3022} {"train_loss": -12.68980598449707, "global_step": 507757, "epoch": 3022} {"train_loss": -12.678586959838867, "global_step": 507758, "epoch": 3022} {"train_loss": -12.055419921875, "global_step": 507759, "epoch": 3022} {"train_loss": -12.640615463256836, "global_step": 507760, "epoch": 3022} {"train_loss": -12.459693908691406, "global_step": 507761, "epoch": 3022} {"train_loss": -12.486242294311523, "global_step": 507762, "epoch": 3022} {"train_loss": -12.785764694213867, "global_step": 507763, "epoch": 3022} {"train_loss": -12.608135223388672, "global_step": 507764, "epoch": 3022} {"train_loss": -13.043624877929688, "global_step": 507765, "epoch": 3022} {"train_loss": -12.49427604675293, "global_step": 507766, "epoch": 3022} {"train_loss": -12.577574729919434, "global_step": 507767, "epoch": 3022} {"train_loss": -12.770975112915039, "global_step": 507768, "epoch": 3022} {"train_loss": -12.840665817260742, "global_step": 507769, "epoch": 3022} {"train_loss": -13.035255432128906, "global_step": 507770, "epoch": 3022} {"train_loss": -12.774365425109863, "global_step": 507771, "epoch": 3022} {"train_loss": -12.992510795593262, "global_step": 507772, "epoch": 3022} {"train_loss": -12.884963989257812, "global_step": 507773, "epoch": 3022} {"train_loss": -12.913389205932617, "global_step": 507774, "epoch": 3022} {"train_loss": -12.787891387939453, "global_step": 507775, "epoch": 3022} {"train_loss": -12.709050178527832, "global_step": 507776, "epoch": 3022} {"train_loss": -12.751890182495117, "global_step": 507777, "epoch": 3022} {"train_loss": -12.715557098388672, "global_step": 507778, "epoch": 3022} {"train_loss": -12.717161178588867, "global_step": 507779, "epoch": 3022} {"train_loss": -13.00247573852539, "global_step": 507780, "epoch": 3022} {"train_loss": -12.704195022583008, "global_step": 507781, "epoch": 3022} {"train_loss": -12.853738784790039, "global_step": 507782, "epoch": 3022} {"train_loss": -12.97592544555664, "global_step": 507783, "epoch": 3022} {"train_loss": -12.930437088012695, "global_step": 507784, "epoch": 3022} {"train_loss": -13.087503433227539, "global_step": 507785, "epoch": 3022} {"train_loss": -12.71181869506836, "global_step": 507786, "epoch": 3022} {"train_loss": -13.172111511230469, "global_step": 507787, "epoch": 3022} {"train_loss": -12.686182022094727, "global_step": 507788, "epoch": 3022} {"train_loss": -12.848636627197266, "global_step": 507789, "epoch": 3022} {"train_loss": -12.927274703979492, "global_step": 507790, "epoch": 3022} {"train_loss": -13.037933349609375, "global_step": 507791, "epoch": 3022} {"train_loss": -13.05140495300293, "global_step": 507792, "epoch": 3022} {"train_loss": -13.024653434753418, "global_step": 507793, "epoch": 3022} {"train_loss": -12.860546112060547, "global_step": 507794, "epoch": 3022} {"train_loss": -12.80047607421875, "global_step": 507795, "epoch": 3022} {"train_loss": -12.866242408752441, "global_step": 507796, "epoch": 3022} {"train_loss": -12.947539329528809, "global_step": 507797, "epoch": 3022} {"train_loss": -12.370061874389648, "global_step": 507798, "epoch": 3022} {"train_loss": -12.599203109741211, "global_step": 507799, "epoch": 3022} {"train_loss": -12.917440414428711, "global_step": 507800, "epoch": 3022} {"train_loss": -12.488635063171387, "global_step": 507801, "epoch": 3022} {"train_loss": -12.547853469848633, "global_step": 507802, "epoch": 3022} {"train_loss": -12.84846305847168, "global_step": 507803, "epoch": 3022} {"train_loss": -12.623944282531738, "global_step": 507804, "epoch": 3022} {"train_loss": -12.469541549682617, "global_step": 507805, "epoch": 3022} {"train_loss": -12.579544067382812, "global_step": 507806, "epoch": 3022} {"train_loss": -12.945945739746094, "global_step": 507807, "epoch": 3022} {"train_loss": -12.851602554321289, "global_step": 507808, "epoch": 3022} {"train_loss": -12.364629745483398, "global_step": 507809, "epoch": 3022} {"train_loss": -12.163064002990723, "global_step": 507810, "epoch": 3022} {"train_loss": -13.00312614440918, "global_step": 507811, "epoch": 3022} {"train_loss": -12.045520782470703, "global_step": 507812, "epoch": 3022} {"train_loss": -12.589207649230957, "global_step": 507813, "epoch": 3022} {"train_loss": -12.825847625732422, "global_step": 507814, "epoch": 3022} {"train_loss": -12.653453826904297, "global_step": 507815, "epoch": 3022} {"train_loss": -12.146291732788086, "global_step": 507816, "epoch": 3022} {"train_loss": -12.587102890014648, "global_step": 507817, "epoch": 3022} {"train_loss": -12.631580352783203, "global_step": 507818, "epoch": 3022} {"train_loss": -12.163631439208984, "global_step": 507819, "epoch": 3022} {"train_loss": -12.368324279785156, "global_step": 507820, "epoch": 3022} {"train_loss": -12.510778427124023, "global_step": 507821, "epoch": 3022} {"train_loss": -11.434419631958008, "global_step": 507822, "epoch": 3022} {"train_loss": -11.444393157958984, "global_step": 507823, "epoch": 3022} {"train_loss": -12.836610794067383, "global_step": 507824, "epoch": 3022} {"train_loss": -12.72349739074707, "global_step": 507825, "epoch": 3022} {"train_loss": -12.286293029785156, "global_step": 507826, "epoch": 3022} {"train_loss": -12.641643524169922, "global_step": 507827, "epoch": 3022} {"train_loss": -12.631625175476074, "global_step": 507828, "epoch": 3022} {"train_loss": -12.430108070373535, "global_step": 507829, "epoch": 3022} {"train_loss": -12.548566818237305, "global_step": 507830, "epoch": 3022} {"train_loss": -12.778796195983887, "global_step": 507831, "epoch": 3022} {"train_loss": -12.82886791229248, "global_step": 507832, "epoch": 3022} {"train_loss": -12.295309066772461, "global_step": 507833, "epoch": 3022} {"train_loss": -12.568083763122559, "global_step": 507834, "epoch": 3022} {"train_loss": -12.180802345275879, "global_step": 507835, "epoch": 3022} {"train_loss": -12.286352157592773, "global_step": 507836, "epoch": 3022} {"train_loss": -12.614751815795898, "global_step": 507837, "epoch": 3022} {"train_loss": -12.267621994018555, "global_step": 507838, "epoch": 3022} {"train_loss": -11.687341690063477, "global_step": 507839, "epoch": 3022} {"train_loss": -12.493372917175293, "global_step": 507840, "epoch": 3022} {"train_loss": -12.505781173706055, "global_step": 507841, "epoch": 3022} {"train_loss": -12.784728050231934, "global_step": 507842, "epoch": 3022} {"train_loss": -12.1979398727417, "global_step": 507843, "epoch": 3022} {"train_loss": -12.603002548217773, "global_step": 507844, "epoch": 3022} {"train_loss": -11.99929141998291, "global_step": 507845, "epoch": 3022} {"train_loss": -12.57436752319336, "global_step": 507846, "epoch": 3022} {"train_loss": -12.230266571044922, "global_step": 507847, "epoch": 3022} {"train_loss": -12.072835922241211, "global_step": 507848, "epoch": 3022} {"train_loss": -12.592029571533203, "global_step": 507849, "epoch": 3022} {"train_loss": -11.94129753112793, "global_step": 507850, "epoch": 3022} {"train_loss": -12.051141738891602, "global_step": 507851, "epoch": 3022} {"train_loss": -10.836772918701172, "global_step": 507852, "epoch": 3022} {"train_loss": -10.88068962097168, "global_step": 507853, "epoch": 3022} {"train_loss": -12.552490234375, "global_step": 507854, "epoch": 3022} {"train_loss": -10.009510040283203, "global_step": 507855, "epoch": 3022} {"train_loss": -12.431081771850586, "global_step": 507856, "epoch": 3022} {"train_loss": -11.896809577941895, "global_step": 507857, "epoch": 3022} {"train_loss": -11.832448959350586, "global_step": 507858, "epoch": 3022} {"train_loss": -11.50112533569336, "global_step": 507859, "epoch": 3022} {"train_loss": -11.95571517944336, "global_step": 507860, "epoch": 3022} {"train_loss": -11.97706413269043, "global_step": 507861, "epoch": 3022} {"train_loss": -11.68563461303711, "global_step": 507862, "epoch": 3022} {"train_loss": -12.323469939686003, "global_step": 507863, "epoch": 3022, "val_loss": 319864.65625} {"train_loss": -11.625743865966797, "global_step": 507864, "epoch": 3023} {"train_loss": -10.437429428100586, "global_step": 507865, "epoch": 3023} {"train_loss": -11.372943878173828, "global_step": 507866, "epoch": 3023} {"train_loss": -10.28731918334961, "global_step": 507867, "epoch": 3023} {"train_loss": -11.59085464477539, "global_step": 507868, "epoch": 3023} {"train_loss": -11.29710578918457, "global_step": 507869, "epoch": 3023} {"train_loss": -11.386579513549805, "global_step": 507870, "epoch": 3023} {"train_loss": -10.97532844543457, "global_step": 507871, "epoch": 3023} {"train_loss": -10.508917808532715, "global_step": 507872, "epoch": 3023} {"train_loss": -9.621313095092773, "global_step": 507873, "epoch": 3023} {"train_loss": -9.973249435424805, "global_step": 507874, "epoch": 3023} {"train_loss": -11.802718162536621, "global_step": 507875, "epoch": 3023} {"train_loss": -11.375005722045898, "global_step": 507876, "epoch": 3023} {"train_loss": -11.172637939453125, "global_step": 507877, "epoch": 3023} {"train_loss": -11.158997535705566, "global_step": 507878, "epoch": 3023} {"train_loss": -11.163833618164062, "global_step": 507879, "epoch": 3023} {"train_loss": -11.678375244140625, "global_step": 507880, "epoch": 3023} {"train_loss": -10.276586532592773, "global_step": 507881, "epoch": 3023} {"train_loss": -11.806974411010742, "global_step": 507882, "epoch": 3023} {"train_loss": -11.19517993927002, "global_step": 507883, "epoch": 3023} {"train_loss": -11.417828559875488, "global_step": 507884, "epoch": 3023} {"train_loss": -11.646373748779297, "global_step": 507885, "epoch": 3023} {"train_loss": -12.131580352783203, "global_step": 507886, "epoch": 3023} {"train_loss": -11.266942977905273, "global_step": 507887, "epoch": 3023} {"train_loss": -12.523530960083008, "global_step": 507888, "epoch": 3023} {"train_loss": -11.658946990966797, "global_step": 507889, "epoch": 3023} {"train_loss": -11.690345764160156, "global_step": 507890, "epoch": 3023} {"train_loss": -12.102861404418945, "global_step": 507891, "epoch": 3023} {"train_loss": -12.007299423217773, "global_step": 507892, "epoch": 3023} {"train_loss": -12.622480392456055, "global_step": 507893, "epoch": 3023} {"train_loss": -11.872051239013672, "global_step": 507894, "epoch": 3023} {"train_loss": -12.313915252685547, "global_step": 507895, "epoch": 3023} {"train_loss": -12.619239807128906, "global_step": 507896, "epoch": 3023} {"train_loss": -12.241724967956543, "global_step": 507897, "epoch": 3023} {"train_loss": -12.703636169433594, "global_step": 507898, "epoch": 3023} {"train_loss": -12.34836196899414, "global_step": 507899, "epoch": 3023} {"train_loss": -12.530400276184082, "global_step": 507900, "epoch": 3023} {"train_loss": -12.237443923950195, "global_step": 507901, "epoch": 3023} {"train_loss": -12.491697311401367, "global_step": 507902, "epoch": 3023} {"train_loss": -12.29287338256836, "global_step": 507903, "epoch": 3023} {"train_loss": -12.74538803100586, "global_step": 507904, "epoch": 3023} {"train_loss": -12.50987434387207, "global_step": 507905, "epoch": 3023} {"train_loss": -12.7170991897583, "global_step": 507906, "epoch": 3023} {"train_loss": -12.742721557617188, "global_step": 507907, "epoch": 3023} {"train_loss": -12.589956283569336, "global_step": 507908, "epoch": 3023} {"train_loss": -12.56992244720459, "global_step": 507909, "epoch": 3023} {"train_loss": -12.667287826538086, "global_step": 507910, "epoch": 3023} {"train_loss": -12.789863586425781, "global_step": 507911, "epoch": 3023} {"train_loss": -12.645330429077148, "global_step": 507912, "epoch": 3023} {"train_loss": -12.679535865783691, "global_step": 507913, "epoch": 3023} {"train_loss": -12.7320556640625, "global_step": 507914, "epoch": 3023} {"train_loss": -12.670165061950684, "global_step": 507915, "epoch": 3023} {"train_loss": -12.584511756896973, "global_step": 507916, "epoch": 3023} {"train_loss": -12.889558792114258, "global_step": 507917, "epoch": 3023} {"train_loss": -12.623697280883789, "global_step": 507918, "epoch": 3023} {"train_loss": -12.831613540649414, "global_step": 507919, "epoch": 3023} {"train_loss": -12.711709976196289, "global_step": 507920, "epoch": 3023} {"train_loss": -12.769993782043457, "global_step": 507921, "epoch": 3023} {"train_loss": -12.747245788574219, "global_step": 507922, "epoch": 3023} {"train_loss": -12.615568161010742, "global_step": 507923, "epoch": 3023} {"train_loss": -12.842106819152832, "global_step": 507924, "epoch": 3023} {"train_loss": -12.669784545898438, "global_step": 507925, "epoch": 3023} {"train_loss": -12.517485618591309, "global_step": 507926, "epoch": 3023} {"train_loss": -12.689584732055664, "global_step": 507927, "epoch": 3023} {"train_loss": -12.80954360961914, "global_step": 507928, "epoch": 3023} {"train_loss": -12.57387638092041, "global_step": 507929, "epoch": 3023} {"train_loss": -12.716541290283203, "global_step": 507930, "epoch": 3023} {"train_loss": -11.536510467529297, "global_step": 507931, "epoch": 3023} {"train_loss": -12.654787063598633, "global_step": 507932, "epoch": 3023} {"train_loss": -12.342309951782227, "global_step": 507933, "epoch": 3023} {"train_loss": -12.292826652526855, "global_step": 507934, "epoch": 3023} {"train_loss": -12.437915802001953, "global_step": 507935, "epoch": 3023} {"train_loss": -11.860254287719727, "global_step": 507936, "epoch": 3023} {"train_loss": -11.715776443481445, "global_step": 507937, "epoch": 3023} {"train_loss": -11.841384887695312, "global_step": 507938, "epoch": 3023} {"train_loss": -12.537118911743164, "global_step": 507939, "epoch": 3023} {"train_loss": -12.41761302947998, "global_step": 507940, "epoch": 3023} {"train_loss": -11.757801055908203, "global_step": 507941, "epoch": 3023} {"train_loss": -12.618945121765137, "global_step": 507942, "epoch": 3023} {"train_loss": -12.186592102050781, "global_step": 507943, "epoch": 3023} {"train_loss": -12.238014221191406, "global_step": 507944, "epoch": 3023} {"train_loss": -12.818485260009766, "global_step": 507945, "epoch": 3023} {"train_loss": -12.420654296875, "global_step": 507946, "epoch": 3023} {"train_loss": -12.553812026977539, "global_step": 507947, "epoch": 3023} {"train_loss": -12.869842529296875, "global_step": 507948, "epoch": 3023} {"train_loss": -12.61519718170166, "global_step": 507949, "epoch": 3023} {"train_loss": -12.732940673828125, "global_step": 507950, "epoch": 3023} {"train_loss": -13.145318031311035, "global_step": 507951, "epoch": 3023} {"train_loss": -12.612700462341309, "global_step": 507952, "epoch": 3023} {"train_loss": -12.922170639038086, "global_step": 507953, "epoch": 3023} {"train_loss": -12.584622383117676, "global_step": 507954, "epoch": 3023} {"train_loss": -12.798700332641602, "global_step": 507955, "epoch": 3023} {"train_loss": -12.640140533447266, "global_step": 507956, "epoch": 3023} {"train_loss": -12.683951377868652, "global_step": 507957, "epoch": 3023} {"train_loss": -12.825311660766602, "global_step": 507958, "epoch": 3023} {"train_loss": -13.022146224975586, "global_step": 507959, "epoch": 3023} {"train_loss": -12.779714584350586, "global_step": 507960, "epoch": 3023} {"train_loss": -12.819995880126953, "global_step": 507961, "epoch": 3023} {"train_loss": -12.523271560668945, "global_step": 507962, "epoch": 3023} {"train_loss": -13.026993751525879, "global_step": 507963, "epoch": 3023} {"train_loss": -12.621723175048828, "global_step": 507964, "epoch": 3023} {"train_loss": -12.726186752319336, "global_step": 507965, "epoch": 3023} {"train_loss": -13.129179000854492, "global_step": 507966, "epoch": 3023} {"train_loss": -12.801816940307617, "global_step": 507967, "epoch": 3023} {"train_loss": -12.972572326660156, "global_step": 507968, "epoch": 3023} {"train_loss": -13.075831413269043, "global_step": 507969, "epoch": 3023} {"train_loss": -12.820174217224121, "global_step": 507970, "epoch": 3023} {"train_loss": -12.525094985961914, "global_step": 507971, "epoch": 3023} {"train_loss": -13.03111457824707, "global_step": 507972, "epoch": 3023} {"train_loss": -12.509420394897461, "global_step": 507973, "epoch": 3023} {"train_loss": -12.50918197631836, "global_step": 507974, "epoch": 3023} {"train_loss": -12.607688903808594, "global_step": 507975, "epoch": 3023} {"train_loss": -12.601699829101562, "global_step": 507976, "epoch": 3023} {"train_loss": -12.18701457977295, "global_step": 507977, "epoch": 3023} {"train_loss": -12.338658332824707, "global_step": 507978, "epoch": 3023} {"train_loss": -12.689906120300293, "global_step": 507979, "epoch": 3023} {"train_loss": -12.663822174072266, "global_step": 507980, "epoch": 3023} {"train_loss": -12.333578109741211, "global_step": 507981, "epoch": 3023} {"train_loss": -12.877731323242188, "global_step": 507982, "epoch": 3023} {"train_loss": -12.183080673217773, "global_step": 507983, "epoch": 3023} {"train_loss": -12.460136413574219, "global_step": 507984, "epoch": 3023} {"train_loss": -12.63980770111084, "global_step": 507985, "epoch": 3023} {"train_loss": -12.430170059204102, "global_step": 507986, "epoch": 3023} {"train_loss": -12.552346229553223, "global_step": 507987, "epoch": 3023} {"train_loss": -11.819121360778809, "global_step": 507988, "epoch": 3023} {"train_loss": -12.642873764038086, "global_step": 507989, "epoch": 3023} {"train_loss": -11.785834312438965, "global_step": 507990, "epoch": 3023} {"train_loss": -12.892538070678711, "global_step": 507991, "epoch": 3023} {"train_loss": -11.890785217285156, "global_step": 507992, "epoch": 3023} {"train_loss": -12.324929237365723, "global_step": 507993, "epoch": 3023} {"train_loss": -11.856561660766602, "global_step": 507994, "epoch": 3023} {"train_loss": -12.101309776306152, "global_step": 507995, "epoch": 3023} {"train_loss": -11.160015106201172, "global_step": 507996, "epoch": 3023} {"train_loss": -12.741301536560059, "global_step": 507997, "epoch": 3023} {"train_loss": -11.302701950073242, "global_step": 507998, "epoch": 3023} {"train_loss": -11.425702095031738, "global_step": 507999, "epoch": 3023} {"train_loss": -12.220344543457031, "global_step": 508000, "epoch": 3023} {"train_loss": -10.94821548461914, "global_step": 508001, "epoch": 3023} {"train_loss": -12.246352195739746, "global_step": 508002, "epoch": 3023} {"train_loss": -12.472479820251465, "global_step": 508003, "epoch": 3023} {"train_loss": -10.81186294555664, "global_step": 508004, "epoch": 3023} {"train_loss": -11.376530647277832, "global_step": 508005, "epoch": 3023} {"train_loss": -12.020363807678223, "global_step": 508006, "epoch": 3023} {"train_loss": -11.865974426269531, "global_step": 508007, "epoch": 3023} {"train_loss": -11.595829010009766, "global_step": 508008, "epoch": 3023} {"train_loss": -11.726724624633789, "global_step": 508009, "epoch": 3023} {"train_loss": -12.527276992797852, "global_step": 508010, "epoch": 3023} {"train_loss": -12.490312576293945, "global_step": 508011, "epoch": 3023} {"train_loss": -11.55398178100586, "global_step": 508012, "epoch": 3023} {"train_loss": -12.325313568115234, "global_step": 508013, "epoch": 3023} {"train_loss": -11.905723571777344, "global_step": 508014, "epoch": 3023} {"train_loss": -11.84773063659668, "global_step": 508015, "epoch": 3023} {"train_loss": -12.478166580200195, "global_step": 508016, "epoch": 3023} {"train_loss": -11.876304626464844, "global_step": 508017, "epoch": 3023} {"train_loss": -12.016156196594238, "global_step": 508018, "epoch": 3023} {"train_loss": -11.528667449951172, "global_step": 508019, "epoch": 3023} {"train_loss": -12.45134162902832, "global_step": 508020, "epoch": 3023} {"train_loss": -11.646865844726562, "global_step": 508021, "epoch": 3023} {"train_loss": -12.001253128051758, "global_step": 508022, "epoch": 3023} {"train_loss": -12.139659881591797, "global_step": 508023, "epoch": 3023} {"train_loss": -11.593804359436035, "global_step": 508024, "epoch": 3023} {"train_loss": -12.072757720947266, "global_step": 508025, "epoch": 3023} {"train_loss": -12.069091796875, "global_step": 508026, "epoch": 3023} {"train_loss": -12.487116813659668, "global_step": 508027, "epoch": 3023} {"train_loss": -11.935449600219727, "global_step": 508028, "epoch": 3023} {"train_loss": -12.354389190673828, "global_step": 508029, "epoch": 3023} {"train_loss": -12.3663330078125, "global_step": 508030, "epoch": 3023} {"train_loss": -12.19875551405407, "global_step": 508031, "epoch": 3023, "val_loss": 320494.8125} {"train_loss": -12.218907356262207, "global_step": 508032, "epoch": 3024} {"train_loss": -11.854065895080566, "global_step": 508033, "epoch": 3024} {"train_loss": -12.313177108764648, "global_step": 508034, "epoch": 3024} {"train_loss": -12.36974811553955, "global_step": 508035, "epoch": 3024} {"train_loss": -12.310535430908203, "global_step": 508036, "epoch": 3024} {"train_loss": -12.333036422729492, "global_step": 508037, "epoch": 3024} {"train_loss": -12.496072769165039, "global_step": 508038, "epoch": 3024} {"train_loss": -11.880199432373047, "global_step": 508039, "epoch": 3024} {"train_loss": -12.181083679199219, "global_step": 508040, "epoch": 3024} {"train_loss": -12.529109954833984, "global_step": 508041, "epoch": 3024} {"train_loss": -12.20834732055664, "global_step": 508042, "epoch": 3024} {"train_loss": -12.268401145935059, "global_step": 508043, "epoch": 3024} {"train_loss": -12.295778274536133, "global_step": 508044, "epoch": 3024} {"train_loss": -12.549087524414062, "global_step": 508045, "epoch": 3024} {"train_loss": -12.417512893676758, "global_step": 508046, "epoch": 3024} {"train_loss": -12.460172653198242, "global_step": 508047, "epoch": 3024} {"train_loss": -12.28087329864502, "global_step": 508048, "epoch": 3024} {"train_loss": -12.246212005615234, "global_step": 508049, "epoch": 3024} {"train_loss": -12.621058464050293, "global_step": 508050, "epoch": 3024} {"train_loss": -12.408513069152832, "global_step": 508051, "epoch": 3024} {"train_loss": -12.809179306030273, "global_step": 508052, "epoch": 3024} {"train_loss": -12.423380851745605, "global_step": 508053, "epoch": 3024} {"train_loss": -12.237754821777344, "global_step": 508054, "epoch": 3024} {"train_loss": -12.556921005249023, "global_step": 508055, "epoch": 3024} {"train_loss": -12.423238754272461, "global_step": 508056, "epoch": 3024} {"train_loss": -12.541694641113281, "global_step": 508057, "epoch": 3024} {"train_loss": -12.65311050415039, "global_step": 508058, "epoch": 3024} {"train_loss": -12.673168182373047, "global_step": 508059, "epoch": 3024} {"train_loss": -12.645715713500977, "global_step": 508060, "epoch": 3024} {"train_loss": -12.5181245803833, "global_step": 508061, "epoch": 3024} {"train_loss": -12.675769805908203, "global_step": 508062, "epoch": 3024} {"train_loss": -12.671806335449219, "global_step": 508063, "epoch": 3024} {"train_loss": -12.8897123336792, "global_step": 508064, "epoch": 3024} {"train_loss": -12.671952247619629, "global_step": 508065, "epoch": 3024} {"train_loss": -12.884405136108398, "global_step": 508066, "epoch": 3024} {"train_loss": -12.867061614990234, "global_step": 508067, "epoch": 3024} {"train_loss": -12.858729362487793, "global_step": 508068, "epoch": 3024} {"train_loss": -12.916200637817383, "global_step": 508069, "epoch": 3024} {"train_loss": -12.906318664550781, "global_step": 508070, "epoch": 3024} {"train_loss": -12.940495491027832, "global_step": 508071, "epoch": 3024} {"train_loss": -12.830307006835938, "global_step": 508072, "epoch": 3024} {"train_loss": -12.983575820922852, "global_step": 508073, "epoch": 3024} {"train_loss": -12.8468599319458, "global_step": 508074, "epoch": 3024} {"train_loss": -13.07302474975586, "global_step": 508075, "epoch": 3024} {"train_loss": -12.85291576385498, "global_step": 508076, "epoch": 3024} {"train_loss": -12.753780364990234, "global_step": 508077, "epoch": 3024} {"train_loss": -12.890294075012207, "global_step": 508078, "epoch": 3024} {"train_loss": -12.680299758911133, "global_step": 508079, "epoch": 3024} {"train_loss": -12.928125381469727, "global_step": 508080, "epoch": 3024} {"train_loss": -12.747274398803711, "global_step": 508081, "epoch": 3024} {"train_loss": -12.788683891296387, "global_step": 508082, "epoch": 3024} {"train_loss": -12.968352317810059, "global_step": 508083, "epoch": 3024} {"train_loss": -12.831591606140137, "global_step": 508084, "epoch": 3024} {"train_loss": -12.742738723754883, "global_step": 508085, "epoch": 3024} {"train_loss": -12.771888732910156, "global_step": 508086, "epoch": 3024} {"train_loss": -13.017984390258789, "global_step": 508087, "epoch": 3024} {"train_loss": -12.933202743530273, "global_step": 508088, "epoch": 3024} {"train_loss": -12.612264633178711, "global_step": 508089, "epoch": 3024} {"train_loss": -13.014547348022461, "global_step": 508090, "epoch": 3024} {"train_loss": -12.415188789367676, "global_step": 508091, "epoch": 3024} {"train_loss": -12.605833053588867, "global_step": 508092, "epoch": 3024} {"train_loss": -12.902907371520996, "global_step": 508093, "epoch": 3024} {"train_loss": -12.511663436889648, "global_step": 508094, "epoch": 3024} {"train_loss": -12.477118492126465, "global_step": 508095, "epoch": 3024} {"train_loss": -12.804638862609863, "global_step": 508096, "epoch": 3024} {"train_loss": -12.042351722717285, "global_step": 508097, "epoch": 3024} {"train_loss": -11.799652099609375, "global_step": 508098, "epoch": 3024} {"train_loss": -12.52349853515625, "global_step": 508099, "epoch": 3024} {"train_loss": -11.564338684082031, "global_step": 508100, "epoch": 3024} {"train_loss": -11.136030197143555, "global_step": 508101, "epoch": 3024} {"train_loss": -12.31528091430664, "global_step": 508102, "epoch": 3024} {"train_loss": -12.029932022094727, "global_step": 508103, "epoch": 3024} {"train_loss": -12.338294982910156, "global_step": 508104, "epoch": 3024} {"train_loss": -11.460346221923828, "global_step": 508105, "epoch": 3024} {"train_loss": -12.100147247314453, "global_step": 508106, "epoch": 3024} {"train_loss": -12.330700874328613, "global_step": 508107, "epoch": 3024} {"train_loss": -12.127002716064453, "global_step": 508108, "epoch": 3024} {"train_loss": -11.446857452392578, "global_step": 508109, "epoch": 3024} {"train_loss": -12.162069320678711, "global_step": 508110, "epoch": 3024} {"train_loss": -12.345673561096191, "global_step": 508111, "epoch": 3024} {"train_loss": -11.238027572631836, "global_step": 508112, "epoch": 3024} {"train_loss": -12.175688743591309, "global_step": 508113, "epoch": 3024} {"train_loss": -11.96725082397461, "global_step": 508114, "epoch": 3024} {"train_loss": -11.804025650024414, "global_step": 508115, "epoch": 3024} {"train_loss": -11.93911361694336, "global_step": 508116, "epoch": 3024} {"train_loss": -11.895498275756836, "global_step": 508117, "epoch": 3024} {"train_loss": -11.62543773651123, "global_step": 508118, "epoch": 3024} {"train_loss": -12.000906944274902, "global_step": 508119, "epoch": 3024} {"train_loss": -11.099748611450195, "global_step": 508120, "epoch": 3024} {"train_loss": -11.893903732299805, "global_step": 508121, "epoch": 3024} {"train_loss": -11.457624435424805, "global_step": 508122, "epoch": 3024} {"train_loss": -11.548425674438477, "global_step": 508123, "epoch": 3024} {"train_loss": -11.708599090576172, "global_step": 508124, "epoch": 3024} {"train_loss": -12.262194633483887, "global_step": 508125, "epoch": 3024} {"train_loss": -11.161325454711914, "global_step": 508126, "epoch": 3024} {"train_loss": -11.025457382202148, "global_step": 508127, "epoch": 3024} {"train_loss": -12.149612426757812, "global_step": 508128, "epoch": 3024} {"train_loss": -10.572568893432617, "global_step": 508129, "epoch": 3024} {"train_loss": -12.431187629699707, "global_step": 508130, "epoch": 3024} {"train_loss": -11.147989273071289, "global_step": 508131, "epoch": 3024} {"train_loss": -12.026349067687988, "global_step": 508132, "epoch": 3024} {"train_loss": -11.787052154541016, "global_step": 508133, "epoch": 3024} {"train_loss": -12.08233642578125, "global_step": 508134, "epoch": 3024} {"train_loss": -12.293889999389648, "global_step": 508135, "epoch": 3024} {"train_loss": -11.817567825317383, "global_step": 508136, "epoch": 3024} {"train_loss": -12.129894256591797, "global_step": 508137, "epoch": 3024} {"train_loss": -12.003677368164062, "global_step": 508138, "epoch": 3024} {"train_loss": -12.161503791809082, "global_step": 508139, "epoch": 3024} {"train_loss": -12.414592742919922, "global_step": 508140, "epoch": 3024} {"train_loss": -12.603354454040527, "global_step": 508141, "epoch": 3024} {"train_loss": -12.011712074279785, "global_step": 508142, "epoch": 3024} {"train_loss": -12.80224609375, "global_step": 508143, "epoch": 3024} {"train_loss": -11.94955062866211, "global_step": 508144, "epoch": 3024} {"train_loss": -12.298786163330078, "global_step": 508145, "epoch": 3024} {"train_loss": -12.246552467346191, "global_step": 508146, "epoch": 3024} {"train_loss": -12.253080368041992, "global_step": 508147, "epoch": 3024} {"train_loss": -12.31637191772461, "global_step": 508148, "epoch": 3024} {"train_loss": -12.501531600952148, "global_step": 508149, "epoch": 3024} {"train_loss": -12.560014724731445, "global_step": 508150, "epoch": 3024} {"train_loss": -12.20802116394043, "global_step": 508151, "epoch": 3024} {"train_loss": -12.871459007263184, "global_step": 508152, "epoch": 3024} {"train_loss": -12.40203857421875, "global_step": 508153, "epoch": 3024} {"train_loss": -12.73895263671875, "global_step": 508154, "epoch": 3024} {"train_loss": -12.711169242858887, "global_step": 508155, "epoch": 3024} {"train_loss": -12.640340805053711, "global_step": 508156, "epoch": 3024} {"train_loss": -12.565984725952148, "global_step": 508157, "epoch": 3024} {"train_loss": -12.314751625061035, "global_step": 508158, "epoch": 3024} {"train_loss": -12.580833435058594, "global_step": 508159, "epoch": 3024} {"train_loss": -12.734471321105957, "global_step": 508160, "epoch": 3024} {"train_loss": -12.753250122070312, "global_step": 508161, "epoch": 3024} {"train_loss": -12.68088436126709, "global_step": 508162, "epoch": 3024} {"train_loss": -12.882243156433105, "global_step": 508163, "epoch": 3024} {"train_loss": -12.931829452514648, "global_step": 508164, "epoch": 3024} {"train_loss": -12.63477897644043, "global_step": 508165, "epoch": 3024} {"train_loss": -12.82962417602539, "global_step": 508166, "epoch": 3024} {"train_loss": -12.779024124145508, "global_step": 508167, "epoch": 3024} {"train_loss": -12.610724449157715, "global_step": 508168, "epoch": 3024} {"train_loss": -12.821653366088867, "global_step": 508169, "epoch": 3024} {"train_loss": -12.890262603759766, "global_step": 508170, "epoch": 3024} {"train_loss": -12.635059356689453, "global_step": 508171, "epoch": 3024} {"train_loss": -12.797897338867188, "global_step": 508172, "epoch": 3024} {"train_loss": -12.963635444641113, "global_step": 508173, "epoch": 3024} {"train_loss": -12.594305992126465, "global_step": 508174, "epoch": 3024} {"train_loss": -12.775135040283203, "global_step": 508175, "epoch": 3024} {"train_loss": -12.794544219970703, "global_step": 508176, "epoch": 3024} {"train_loss": -12.639898300170898, "global_step": 508177, "epoch": 3024} {"train_loss": -12.941393852233887, "global_step": 508178, "epoch": 3024} {"train_loss": -12.672540664672852, "global_step": 508179, "epoch": 3024} {"train_loss": -12.975691795349121, "global_step": 508180, "epoch": 3024} {"train_loss": -12.86756706237793, "global_step": 508181, "epoch": 3024} {"train_loss": -12.899223327636719, "global_step": 508182, "epoch": 3024} {"train_loss": -12.868154525756836, "global_step": 508183, "epoch": 3024} {"train_loss": -12.590447425842285, "global_step": 508184, "epoch": 3024} {"train_loss": -12.929481506347656, "global_step": 508185, "epoch": 3024} {"train_loss": -12.953263282775879, "global_step": 508186, "epoch": 3024} {"train_loss": -13.1808500289917, "global_step": 508187, "epoch": 3024} {"train_loss": -12.883552551269531, "global_step": 508188, "epoch": 3024} {"train_loss": -12.996439933776855, "global_step": 508189, "epoch": 3024} {"train_loss": -12.549395561218262, "global_step": 508190, "epoch": 3024} {"train_loss": -12.940956115722656, "global_step": 508191, "epoch": 3024} {"train_loss": -12.787277221679688, "global_step": 508192, "epoch": 3024} {"train_loss": -12.587371826171875, "global_step": 508193, "epoch": 3024} {"train_loss": -13.190099716186523, "global_step": 508194, "epoch": 3024} {"train_loss": -12.39969253540039, "global_step": 508195, "epoch": 3024} {"train_loss": -12.635458946228027, "global_step": 508196, "epoch": 3024} {"train_loss": -12.81683349609375, "global_step": 508197, "epoch": 3024} {"train_loss": -12.338363647460938, "global_step": 508198, "epoch": 3024} {"train_loss": -12.435881489799137, "global_step": 508199, "epoch": 3024, "val_loss": 321182.875} {"train_loss": -12.444032669067383, "global_step": 508200, "epoch": 3025} {"train_loss": -12.422019004821777, "global_step": 508201, "epoch": 3025} {"train_loss": -12.870269775390625, "global_step": 508202, "epoch": 3025} {"train_loss": -12.628009796142578, "global_step": 508203, "epoch": 3025} {"train_loss": -11.82706069946289, "global_step": 508204, "epoch": 3025} {"train_loss": -12.219522476196289, "global_step": 508205, "epoch": 3025} {"train_loss": -12.586723327636719, "global_step": 508206, "epoch": 3025} {"train_loss": -12.061769485473633, "global_step": 508207, "epoch": 3025} {"train_loss": -12.332512855529785, "global_step": 508208, "epoch": 3025} {"train_loss": -11.965306282043457, "global_step": 508209, "epoch": 3025} {"train_loss": -10.216150283813477, "global_step": 508210, "epoch": 3025} {"train_loss": -11.912958145141602, "global_step": 508211, "epoch": 3025} {"train_loss": -8.650867462158203, "global_step": 508212, "epoch": 3025} {"train_loss": -11.55230712890625, "global_step": 508213, "epoch": 3025} {"train_loss": -10.478360176086426, "global_step": 508214, "epoch": 3025} {"train_loss": -11.208940505981445, "global_step": 508215, "epoch": 3025} {"train_loss": -9.119911193847656, "global_step": 508216, "epoch": 3025} {"train_loss": -11.403705596923828, "global_step": 508217, "epoch": 3025} {"train_loss": -10.140295028686523, "global_step": 508218, "epoch": 3025} {"train_loss": -11.338579177856445, "global_step": 508219, "epoch": 3025} {"train_loss": -9.403840065002441, "global_step": 508220, "epoch": 3025} {"train_loss": -9.352121353149414, "global_step": 508221, "epoch": 3025} {"train_loss": -8.081255912780762, "global_step": 508222, "epoch": 3025} {"train_loss": -8.652547836303711, "global_step": 508223, "epoch": 3025} {"train_loss": -8.294242858886719, "global_step": 508224, "epoch": 3025} {"train_loss": -9.442512512207031, "global_step": 508225, "epoch": 3025} {"train_loss": -8.489418983459473, "global_step": 508226, "epoch": 3025} {"train_loss": -9.049568176269531, "global_step": 508227, "epoch": 3025} {"train_loss": -11.028244018554688, "global_step": 508228, "epoch": 3025} {"train_loss": -10.049092292785645, "global_step": 508229, "epoch": 3025} {"train_loss": -9.050228118896484, "global_step": 508230, "epoch": 3025} {"train_loss": -10.32036018371582, "global_step": 508231, "epoch": 3025} {"train_loss": -10.710843086242676, "global_step": 508232, "epoch": 3025} {"train_loss": -10.308209419250488, "global_step": 508233, "epoch": 3025} {"train_loss": -11.022993087768555, "global_step": 508234, "epoch": 3025} {"train_loss": -11.562397956848145, "global_step": 508235, "epoch": 3025} {"train_loss": -10.583919525146484, "global_step": 508236, "epoch": 3025} {"train_loss": -10.791228294372559, "global_step": 508237, "epoch": 3025} {"train_loss": -11.839264869689941, "global_step": 508238, "epoch": 3025} {"train_loss": -10.9097318649292, "global_step": 508239, "epoch": 3025} {"train_loss": -11.788549423217773, "global_step": 508240, "epoch": 3025} {"train_loss": -11.251410484313965, "global_step": 508241, "epoch": 3025} {"train_loss": -11.205219268798828, "global_step": 508242, "epoch": 3025} {"train_loss": -10.885382652282715, "global_step": 508243, "epoch": 3025} {"train_loss": -10.388587951660156, "global_step": 508244, "epoch": 3025} {"train_loss": -11.667181015014648, "global_step": 508245, "epoch": 3025} {"train_loss": -11.099807739257812, "global_step": 508246, "epoch": 3025} {"train_loss": -10.794986724853516, "global_step": 508247, "epoch": 3025} {"train_loss": -11.459663391113281, "global_step": 508248, "epoch": 3025} {"train_loss": -11.250615119934082, "global_step": 508249, "epoch": 3025} {"train_loss": -12.224285125732422, "global_step": 508250, "epoch": 3025} {"train_loss": -11.24152660369873, "global_step": 508251, "epoch": 3025} {"train_loss": -12.008649826049805, "global_step": 508252, "epoch": 3025} {"train_loss": -11.300582885742188, "global_step": 508253, "epoch": 3025} {"train_loss": -11.627687454223633, "global_step": 508254, "epoch": 3025} {"train_loss": -12.045413970947266, "global_step": 508255, "epoch": 3025} {"train_loss": -12.098682403564453, "global_step": 508256, "epoch": 3025} {"train_loss": -11.87205982208252, "global_step": 508257, "epoch": 3025} {"train_loss": -11.974424362182617, "global_step": 508258, "epoch": 3025} {"train_loss": -11.887539863586426, "global_step": 508259, "epoch": 3025} {"train_loss": -11.92729377746582, "global_step": 508260, "epoch": 3025} {"train_loss": -12.357736587524414, "global_step": 508261, "epoch": 3025} {"train_loss": -11.990476608276367, "global_step": 508262, "epoch": 3025} {"train_loss": -12.340437889099121, "global_step": 508263, "epoch": 3025} {"train_loss": -12.289084434509277, "global_step": 508264, "epoch": 3025} {"train_loss": -12.134681701660156, "global_step": 508265, "epoch": 3025} {"train_loss": -12.347482681274414, "global_step": 508266, "epoch": 3025} {"train_loss": -12.394695281982422, "global_step": 508267, "epoch": 3025} {"train_loss": -12.235392570495605, "global_step": 508268, "epoch": 3025} {"train_loss": -12.485382080078125, "global_step": 508269, "epoch": 3025} {"train_loss": -12.480002403259277, "global_step": 508270, "epoch": 3025} {"train_loss": -12.431072235107422, "global_step": 508271, "epoch": 3025} {"train_loss": -12.238738059997559, "global_step": 508272, "epoch": 3025} {"train_loss": -12.439006805419922, "global_step": 508273, "epoch": 3025} {"train_loss": -12.534963607788086, "global_step": 508274, "epoch": 3025} {"train_loss": -12.402691841125488, "global_step": 508275, "epoch": 3025} {"train_loss": -12.653181076049805, "global_step": 508276, "epoch": 3025} {"train_loss": -12.433330535888672, "global_step": 508277, "epoch": 3025} {"train_loss": -12.625292778015137, "global_step": 508278, "epoch": 3025} {"train_loss": -12.541439056396484, "global_step": 508279, "epoch": 3025} {"train_loss": -12.615776062011719, "global_step": 508280, "epoch": 3025} {"train_loss": -12.44782829284668, "global_step": 508281, "epoch": 3025} {"train_loss": -12.57455825805664, "global_step": 508282, "epoch": 3025} {"train_loss": -12.400609970092773, "global_step": 508283, "epoch": 3025} {"train_loss": -12.651630401611328, "global_step": 508284, "epoch": 3025} {"train_loss": -12.396499633789062, "global_step": 508285, "epoch": 3025} {"train_loss": -12.654098510742188, "global_step": 508286, "epoch": 3025} {"train_loss": -12.445029258728027, "global_step": 508287, "epoch": 3025} {"train_loss": -12.633890151977539, "global_step": 508288, "epoch": 3025} {"train_loss": -12.53278636932373, "global_step": 508289, "epoch": 3025} {"train_loss": -12.530707359313965, "global_step": 508290, "epoch": 3025} {"train_loss": -12.44904899597168, "global_step": 508291, "epoch": 3025} {"train_loss": -12.664066314697266, "global_step": 508292, "epoch": 3025} {"train_loss": -12.528060913085938, "global_step": 508293, "epoch": 3025} {"train_loss": -12.492353439331055, "global_step": 508294, "epoch": 3025} {"train_loss": -12.557390213012695, "global_step": 508295, "epoch": 3025} {"train_loss": -12.613555908203125, "global_step": 508296, "epoch": 3025} {"train_loss": -12.645614624023438, "global_step": 508297, "epoch": 3025} {"train_loss": -12.551847457885742, "global_step": 508298, "epoch": 3025} {"train_loss": -12.509357452392578, "global_step": 508299, "epoch": 3025} {"train_loss": -12.688042640686035, "global_step": 508300, "epoch": 3025} {"train_loss": -12.596109390258789, "global_step": 508301, "epoch": 3025} {"train_loss": -12.590760231018066, "global_step": 508302, "epoch": 3025} {"train_loss": -12.454936981201172, "global_step": 508303, "epoch": 3025} {"train_loss": -12.613446235656738, "global_step": 508304, "epoch": 3025} {"train_loss": -12.489741325378418, "global_step": 508305, "epoch": 3025} {"train_loss": -12.883222579956055, "global_step": 508306, "epoch": 3025} {"train_loss": -12.638833045959473, "global_step": 508307, "epoch": 3025} {"train_loss": -12.549381256103516, "global_step": 508308, "epoch": 3025} {"train_loss": -12.741823196411133, "global_step": 508309, "epoch": 3025} {"train_loss": -12.449186325073242, "global_step": 508310, "epoch": 3025} {"train_loss": -12.708494186401367, "global_step": 508311, "epoch": 3025} {"train_loss": -12.472658157348633, "global_step": 508312, "epoch": 3025} {"train_loss": -12.84437084197998, "global_step": 508313, "epoch": 3025} {"train_loss": -12.558586120605469, "global_step": 508314, "epoch": 3025} {"train_loss": -12.872518539428711, "global_step": 508315, "epoch": 3025} {"train_loss": -12.715428352355957, "global_step": 508316, "epoch": 3025} {"train_loss": -12.81771183013916, "global_step": 508317, "epoch": 3025} {"train_loss": -12.890340805053711, "global_step": 508318, "epoch": 3025} {"train_loss": -12.819584846496582, "global_step": 508319, "epoch": 3025} {"train_loss": -13.001241683959961, "global_step": 508320, "epoch": 3025} {"train_loss": -12.891069412231445, "global_step": 508321, "epoch": 3025} {"train_loss": -12.794744491577148, "global_step": 508322, "epoch": 3025} {"train_loss": -12.767250061035156, "global_step": 508323, "epoch": 3025} {"train_loss": -12.915024757385254, "global_step": 508324, "epoch": 3025} {"train_loss": -12.683999061584473, "global_step": 508325, "epoch": 3025} {"train_loss": -12.88210678100586, "global_step": 508326, "epoch": 3025} {"train_loss": -12.990543365478516, "global_step": 508327, "epoch": 3025} {"train_loss": -12.541326522827148, "global_step": 508328, "epoch": 3025} {"train_loss": -12.745681762695312, "global_step": 508329, "epoch": 3025} {"train_loss": -12.94060230255127, "global_step": 508330, "epoch": 3025} {"train_loss": -12.597152709960938, "global_step": 508331, "epoch": 3025} {"train_loss": -12.855573654174805, "global_step": 508332, "epoch": 3025} {"train_loss": -12.952491760253906, "global_step": 508333, "epoch": 3025} {"train_loss": -12.884227752685547, "global_step": 508334, "epoch": 3025} {"train_loss": -12.681743621826172, "global_step": 508335, "epoch": 3025} {"train_loss": -12.591693878173828, "global_step": 508336, "epoch": 3025} {"train_loss": -12.540255546569824, "global_step": 508337, "epoch": 3025} {"train_loss": -12.6394681930542, "global_step": 508338, "epoch": 3025} {"train_loss": -12.942697525024414, "global_step": 508339, "epoch": 3025} {"train_loss": -12.766538619995117, "global_step": 508340, "epoch": 3025} {"train_loss": -12.952905654907227, "global_step": 508341, "epoch": 3025} {"train_loss": -12.862234115600586, "global_step": 508342, "epoch": 3025} {"train_loss": -12.978452682495117, "global_step": 508343, "epoch": 3025} {"train_loss": -12.733065605163574, "global_step": 508344, "epoch": 3025} {"train_loss": -13.093772888183594, "global_step": 508345, "epoch": 3025} {"train_loss": -12.821859359741211, "global_step": 508346, "epoch": 3025} {"train_loss": -12.548990249633789, "global_step": 508347, "epoch": 3025} {"train_loss": -12.36513900756836, "global_step": 508348, "epoch": 3025} {"train_loss": -12.89847183227539, "global_step": 508349, "epoch": 3025} {"train_loss": -12.606498718261719, "global_step": 508350, "epoch": 3025} {"train_loss": -12.550617218017578, "global_step": 508351, "epoch": 3025} {"train_loss": -12.58595085144043, "global_step": 508352, "epoch": 3025} {"train_loss": -12.611461639404297, "global_step": 508353, "epoch": 3025} {"train_loss": -12.989933013916016, "global_step": 508354, "epoch": 3025} {"train_loss": -12.858932495117188, "global_step": 508355, "epoch": 3025} {"train_loss": -12.800359725952148, "global_step": 508356, "epoch": 3025} {"train_loss": -12.634915351867676, "global_step": 508357, "epoch": 3025} {"train_loss": -12.761737823486328, "global_step": 508358, "epoch": 3025} {"train_loss": -12.45449161529541, "global_step": 508359, "epoch": 3025} {"train_loss": -12.113546371459961, "global_step": 508360, "epoch": 3025} {"train_loss": -12.86509895324707, "global_step": 508361, "epoch": 3025} {"train_loss": -12.847244262695312, "global_step": 508362, "epoch": 3025} {"train_loss": -12.599952697753906, "global_step": 508363, "epoch": 3025} {"train_loss": -12.307865142822266, "global_step": 508364, "epoch": 3025} {"train_loss": -12.37657642364502, "global_step": 508365, "epoch": 3025} {"train_loss": -12.495122909545898, "global_step": 508366, "epoch": 3025} {"train_loss": -12.027920944350106, "global_step": 508367, "epoch": 3025, "val_loss": 317518.6875, "train_action_mse_error": 0.3411835730075836} {"train_loss": -12.70105266571045, "global_step": 508368, "epoch": 3026} {"train_loss": -12.84824275970459, "global_step": 508369, "epoch": 3026} {"train_loss": -12.534025192260742, "global_step": 508370, "epoch": 3026} {"train_loss": -12.604655265808105, "global_step": 508371, "epoch": 3026} {"train_loss": -12.553703308105469, "global_step": 508372, "epoch": 3026} {"train_loss": -12.722362518310547, "global_step": 508373, "epoch": 3026} {"train_loss": -12.178369522094727, "global_step": 508374, "epoch": 3026} {"train_loss": -12.766105651855469, "global_step": 508375, "epoch": 3026} {"train_loss": -12.719754219055176, "global_step": 508376, "epoch": 3026} {"train_loss": -12.748920440673828, "global_step": 508377, "epoch": 3026} {"train_loss": -12.604374885559082, "global_step": 508378, "epoch": 3026} {"train_loss": -12.886215209960938, "global_step": 508379, "epoch": 3026} {"train_loss": -12.726698875427246, "global_step": 508380, "epoch": 3026} {"train_loss": -12.717824935913086, "global_step": 508381, "epoch": 3026} {"train_loss": -12.513595581054688, "global_step": 508382, "epoch": 3026} {"train_loss": -12.830961227416992, "global_step": 508383, "epoch": 3026} {"train_loss": -12.657248497009277, "global_step": 508384, "epoch": 3026} {"train_loss": -12.686965942382812, "global_step": 508385, "epoch": 3026} {"train_loss": -12.48257064819336, "global_step": 508386, "epoch": 3026} {"train_loss": -12.706954002380371, "global_step": 508387, "epoch": 3026} {"train_loss": -12.73156452178955, "global_step": 508388, "epoch": 3026} {"train_loss": -12.45421028137207, "global_step": 508389, "epoch": 3026} {"train_loss": -11.955400466918945, "global_step": 508390, "epoch": 3026} {"train_loss": -13.109515190124512, "global_step": 508391, "epoch": 3026} {"train_loss": -12.308378219604492, "global_step": 508392, "epoch": 3026} {"train_loss": -12.876132011413574, "global_step": 508393, "epoch": 3026} {"train_loss": -12.520090103149414, "global_step": 508394, "epoch": 3026} {"train_loss": -12.482608795166016, "global_step": 508395, "epoch": 3026} {"train_loss": -11.57913589477539, "global_step": 508396, "epoch": 3026} {"train_loss": -12.402214050292969, "global_step": 508397, "epoch": 3026} {"train_loss": -10.573311805725098, "global_step": 508398, "epoch": 3026} {"train_loss": -11.057631492614746, "global_step": 508399, "epoch": 3026} {"train_loss": -12.162883758544922, "global_step": 508400, "epoch": 3026} {"train_loss": -10.911177635192871, "global_step": 508401, "epoch": 3026} {"train_loss": -11.499828338623047, "global_step": 508402, "epoch": 3026} {"train_loss": -10.677299499511719, "global_step": 508403, "epoch": 3026} {"train_loss": -10.030290603637695, "global_step": 508404, "epoch": 3026} {"train_loss": -12.719369888305664, "global_step": 508405, "epoch": 3026} {"train_loss": -9.579829216003418, "global_step": 508406, "epoch": 3026} {"train_loss": -11.373212814331055, "global_step": 508407, "epoch": 3026} {"train_loss": -11.722665786743164, "global_step": 508408, "epoch": 3026} {"train_loss": -10.562223434448242, "global_step": 508409, "epoch": 3026} {"train_loss": -12.546188354492188, "global_step": 508410, "epoch": 3026} {"train_loss": -11.211634635925293, "global_step": 508411, "epoch": 3026} {"train_loss": -12.153749465942383, "global_step": 508412, "epoch": 3026} {"train_loss": -11.540247917175293, "global_step": 508413, "epoch": 3026} {"train_loss": -11.868826866149902, "global_step": 508414, "epoch": 3026} {"train_loss": -12.089012145996094, "global_step": 508415, "epoch": 3026} {"train_loss": -11.84530258178711, "global_step": 508416, "epoch": 3026} {"train_loss": -11.402831077575684, "global_step": 508417, "epoch": 3026} {"train_loss": -11.957103729248047, "global_step": 508418, "epoch": 3026} {"train_loss": -12.191360473632812, "global_step": 508419, "epoch": 3026} {"train_loss": -11.71053695678711, "global_step": 508420, "epoch": 3026} {"train_loss": -12.539413452148438, "global_step": 508421, "epoch": 3026} {"train_loss": -12.181806564331055, "global_step": 508422, "epoch": 3026} {"train_loss": -12.356863021850586, "global_step": 508423, "epoch": 3026} {"train_loss": -12.536434173583984, "global_step": 508424, "epoch": 3026} {"train_loss": -11.90315055847168, "global_step": 508425, "epoch": 3026} {"train_loss": -12.826745986938477, "global_step": 508426, "epoch": 3026} {"train_loss": -12.377506256103516, "global_step": 508427, "epoch": 3026} {"train_loss": -12.34533977508545, "global_step": 508428, "epoch": 3026} {"train_loss": -12.142585754394531, "global_step": 508429, "epoch": 3026} {"train_loss": -12.488082885742188, "global_step": 508430, "epoch": 3026} {"train_loss": -12.218573570251465, "global_step": 508431, "epoch": 3026} {"train_loss": -12.539541244506836, "global_step": 508432, "epoch": 3026} {"train_loss": -12.30498218536377, "global_step": 508433, "epoch": 3026} {"train_loss": -12.377402305603027, "global_step": 508434, "epoch": 3026} {"train_loss": -12.366470336914062, "global_step": 508435, "epoch": 3026} {"train_loss": -12.356462478637695, "global_step": 508436, "epoch": 3026} {"train_loss": -12.409690856933594, "global_step": 508437, "epoch": 3026} {"train_loss": -12.637046813964844, "global_step": 508438, "epoch": 3026} {"train_loss": -12.628040313720703, "global_step": 508439, "epoch": 3026} {"train_loss": -12.604164123535156, "global_step": 508440, "epoch": 3026} {"train_loss": -12.318938255310059, "global_step": 508441, "epoch": 3026} {"train_loss": -12.285894393920898, "global_step": 508442, "epoch": 3026} {"train_loss": -12.804014205932617, "global_step": 508443, "epoch": 3026} {"train_loss": -12.542930603027344, "global_step": 508444, "epoch": 3026} {"train_loss": -12.542759895324707, "global_step": 508445, "epoch": 3026} {"train_loss": -12.376826286315918, "global_step": 508446, "epoch": 3026} {"train_loss": -12.579050064086914, "global_step": 508447, "epoch": 3026} {"train_loss": -12.407687187194824, "global_step": 508448, "epoch": 3026} {"train_loss": -12.38731575012207, "global_step": 508449, "epoch": 3026} {"train_loss": -12.08701229095459, "global_step": 508450, "epoch": 3026} {"train_loss": -12.66144847869873, "global_step": 508451, "epoch": 3026} {"train_loss": -12.056051254272461, "global_step": 508452, "epoch": 3026} {"train_loss": -12.096912384033203, "global_step": 508453, "epoch": 3026} {"train_loss": -12.775070190429688, "global_step": 508454, "epoch": 3026} {"train_loss": -12.34836483001709, "global_step": 508455, "epoch": 3026} {"train_loss": -12.242769241333008, "global_step": 508456, "epoch": 3026} {"train_loss": -12.041751861572266, "global_step": 508457, "epoch": 3026} {"train_loss": -12.695467948913574, "global_step": 508458, "epoch": 3026} {"train_loss": -11.552480697631836, "global_step": 508459, "epoch": 3026} {"train_loss": -12.52886962890625, "global_step": 508460, "epoch": 3026} {"train_loss": -11.927701950073242, "global_step": 508461, "epoch": 3026} {"train_loss": -12.421012878417969, "global_step": 508462, "epoch": 3026} {"train_loss": -12.120312690734863, "global_step": 508463, "epoch": 3026} {"train_loss": -12.149201393127441, "global_step": 508464, "epoch": 3026} {"train_loss": -12.152061462402344, "global_step": 508465, "epoch": 3026} {"train_loss": -12.178936004638672, "global_step": 508466, "epoch": 3026} {"train_loss": -12.154394149780273, "global_step": 508467, "epoch": 3026} {"train_loss": -11.875316619873047, "global_step": 508468, "epoch": 3026} {"train_loss": -12.688072204589844, "global_step": 508469, "epoch": 3026} {"train_loss": -12.287616729736328, "global_step": 508470, "epoch": 3026} {"train_loss": -12.787068367004395, "global_step": 508471, "epoch": 3026} {"train_loss": -12.313497543334961, "global_step": 508472, "epoch": 3026} {"train_loss": -12.730905532836914, "global_step": 508473, "epoch": 3026} {"train_loss": -12.201288223266602, "global_step": 508474, "epoch": 3026} {"train_loss": -12.607000350952148, "global_step": 508475, "epoch": 3026} {"train_loss": -12.33415412902832, "global_step": 508476, "epoch": 3026} {"train_loss": -12.618306159973145, "global_step": 508477, "epoch": 3026} {"train_loss": -12.424787521362305, "global_step": 508478, "epoch": 3026} {"train_loss": -12.461434364318848, "global_step": 508479, "epoch": 3026} {"train_loss": -12.415082931518555, "global_step": 508480, "epoch": 3026} {"train_loss": -12.48548698425293, "global_step": 508481, "epoch": 3026} {"train_loss": -11.71696949005127, "global_step": 508482, "epoch": 3026} {"train_loss": -12.653066635131836, "global_step": 508483, "epoch": 3026} {"train_loss": -12.0856294631958, "global_step": 508484, "epoch": 3026} {"train_loss": -12.782583236694336, "global_step": 508485, "epoch": 3026} {"train_loss": -11.846678733825684, "global_step": 508486, "epoch": 3026} {"train_loss": -12.871788024902344, "global_step": 508487, "epoch": 3026} {"train_loss": -12.4664306640625, "global_step": 508488, "epoch": 3026} {"train_loss": -12.43836498260498, "global_step": 508489, "epoch": 3026} {"train_loss": -12.851470947265625, "global_step": 508490, "epoch": 3026} {"train_loss": -12.672882080078125, "global_step": 508491, "epoch": 3026} {"train_loss": -12.397579193115234, "global_step": 508492, "epoch": 3026} {"train_loss": -12.615449905395508, "global_step": 508493, "epoch": 3026} {"train_loss": -12.921466827392578, "global_step": 508494, "epoch": 3026} {"train_loss": -12.80693244934082, "global_step": 508495, "epoch": 3026} {"train_loss": -12.698648452758789, "global_step": 508496, "epoch": 3026} {"train_loss": -12.613809585571289, "global_step": 508497, "epoch": 3026} {"train_loss": -12.703715324401855, "global_step": 508498, "epoch": 3026} {"train_loss": -12.778742790222168, "global_step": 508499, "epoch": 3026} {"train_loss": -12.551759719848633, "global_step": 508500, "epoch": 3026} {"train_loss": -12.566774368286133, "global_step": 508501, "epoch": 3026} {"train_loss": -12.903549194335938, "global_step": 508502, "epoch": 3026} {"train_loss": -12.828593254089355, "global_step": 508503, "epoch": 3026} {"train_loss": -12.755838394165039, "global_step": 508504, "epoch": 3026} {"train_loss": -12.885053634643555, "global_step": 508505, "epoch": 3026} {"train_loss": -12.717626571655273, "global_step": 508506, "epoch": 3026} {"train_loss": -12.522711753845215, "global_step": 508507, "epoch": 3026} {"train_loss": -12.826951026916504, "global_step": 508508, "epoch": 3026} {"train_loss": -12.631786346435547, "global_step": 508509, "epoch": 3026} {"train_loss": -12.382155418395996, "global_step": 508510, "epoch": 3026} {"train_loss": -12.564055442810059, "global_step": 508511, "epoch": 3026} {"train_loss": -13.089141845703125, "global_step": 508512, "epoch": 3026} {"train_loss": -12.185056686401367, "global_step": 508513, "epoch": 3026} {"train_loss": -12.679171562194824, "global_step": 508514, "epoch": 3026} {"train_loss": -12.55758285522461, "global_step": 508515, "epoch": 3026} {"train_loss": -12.433032989501953, "global_step": 508516, "epoch": 3026} {"train_loss": -12.505668640136719, "global_step": 508517, "epoch": 3026} {"train_loss": -12.546424865722656, "global_step": 508518, "epoch": 3026} {"train_loss": -12.117557525634766, "global_step": 508519, "epoch": 3026} {"train_loss": -12.989578247070312, "global_step": 508520, "epoch": 3026} {"train_loss": -12.539018630981445, "global_step": 508521, "epoch": 3026} {"train_loss": -12.75837516784668, "global_step": 508522, "epoch": 3026} {"train_loss": -12.400457382202148, "global_step": 508523, "epoch": 3026} {"train_loss": -12.468124389648438, "global_step": 508524, "epoch": 3026} {"train_loss": -12.439767837524414, "global_step": 508525, "epoch": 3026} {"train_loss": -12.678635597229004, "global_step": 508526, "epoch": 3026} {"train_loss": -12.107863426208496, "global_step": 508527, "epoch": 3026} {"train_loss": -13.047752380371094, "global_step": 508528, "epoch": 3026} {"train_loss": -12.39242172241211, "global_step": 508529, "epoch": 3026} {"train_loss": -12.893993377685547, "global_step": 508530, "epoch": 3026} {"train_loss": -12.499855041503906, "global_step": 508531, "epoch": 3026} {"train_loss": -13.023154258728027, "global_step": 508532, "epoch": 3026} {"train_loss": -12.625770568847656, "global_step": 508533, "epoch": 3026} {"train_loss": -12.867700576782227, "global_step": 508534, "epoch": 3026} {"train_loss": -12.356717932791938, "global_step": 508535, "epoch": 3026, "val_loss": 321489.4375} {"train_loss": -12.3522310256958, "global_step": 508536, "epoch": 3027} {"train_loss": -12.822198867797852, "global_step": 508537, "epoch": 3027} {"train_loss": -12.65117073059082, "global_step": 508538, "epoch": 3027} {"train_loss": -12.315601348876953, "global_step": 508539, "epoch": 3027} {"train_loss": -12.082683563232422, "global_step": 508540, "epoch": 3027} {"train_loss": -11.984434127807617, "global_step": 508541, "epoch": 3027} {"train_loss": -11.91901969909668, "global_step": 508542, "epoch": 3027} {"train_loss": -12.082605361938477, "global_step": 508543, "epoch": 3027} {"train_loss": -11.048439979553223, "global_step": 508544, "epoch": 3027} {"train_loss": -12.668338775634766, "global_step": 508545, "epoch": 3027} {"train_loss": -11.606365203857422, "global_step": 508546, "epoch": 3027} {"train_loss": -11.716436386108398, "global_step": 508547, "epoch": 3027} {"train_loss": -11.570323944091797, "global_step": 508548, "epoch": 3027} {"train_loss": -12.187328338623047, "global_step": 508549, "epoch": 3027} {"train_loss": -10.81029224395752, "global_step": 508550, "epoch": 3027} {"train_loss": -12.029423713684082, "global_step": 508551, "epoch": 3027} {"train_loss": -9.914947509765625, "global_step": 508552, "epoch": 3027} {"train_loss": -10.317251205444336, "global_step": 508553, "epoch": 3027} {"train_loss": -11.314483642578125, "global_step": 508554, "epoch": 3027} {"train_loss": -10.396245956420898, "global_step": 508555, "epoch": 3027} {"train_loss": -10.037191390991211, "global_step": 508556, "epoch": 3027} {"train_loss": -12.066986083984375, "global_step": 508557, "epoch": 3027} {"train_loss": -10.90196418762207, "global_step": 508558, "epoch": 3027} {"train_loss": -11.129232406616211, "global_step": 508559, "epoch": 3027} {"train_loss": -11.481225967407227, "global_step": 508560, "epoch": 3027} {"train_loss": -10.025957107543945, "global_step": 508561, "epoch": 3027} {"train_loss": -10.506905555725098, "global_step": 508562, "epoch": 3027} {"train_loss": -8.46407699584961, "global_step": 508563, "epoch": 3027} {"train_loss": -10.22811508178711, "global_step": 508564, "epoch": 3027} {"train_loss": -9.946990966796875, "global_step": 508565, "epoch": 3027} {"train_loss": -8.781346321105957, "global_step": 508566, "epoch": 3027} {"train_loss": -9.639726638793945, "global_step": 508567, "epoch": 3027} {"train_loss": -9.392684936523438, "global_step": 508568, "epoch": 3027} {"train_loss": -10.660406112670898, "global_step": 508569, "epoch": 3027} {"train_loss": -9.598800659179688, "global_step": 508570, "epoch": 3027} {"train_loss": -10.128936767578125, "global_step": 508571, "epoch": 3027} {"train_loss": -9.789432525634766, "global_step": 508572, "epoch": 3027} {"train_loss": -10.988089561462402, "global_step": 508573, "epoch": 3027} {"train_loss": -10.50788402557373, "global_step": 508574, "epoch": 3027} {"train_loss": -11.521108627319336, "global_step": 508575, "epoch": 3027} {"train_loss": -10.944754600524902, "global_step": 508576, "epoch": 3027} {"train_loss": -10.595270156860352, "global_step": 508577, "epoch": 3027} {"train_loss": -10.627294540405273, "global_step": 508578, "epoch": 3027} {"train_loss": -10.884974479675293, "global_step": 508579, "epoch": 3027} {"train_loss": -11.251103401184082, "global_step": 508580, "epoch": 3027} {"train_loss": -11.39827823638916, "global_step": 508581, "epoch": 3027} {"train_loss": -11.917362213134766, "global_step": 508582, "epoch": 3027} {"train_loss": -10.303101539611816, "global_step": 508583, "epoch": 3027} {"train_loss": -12.17827033996582, "global_step": 508584, "epoch": 3027} {"train_loss": -10.697848320007324, "global_step": 508585, "epoch": 3027} {"train_loss": -12.282154083251953, "global_step": 508586, "epoch": 3027} {"train_loss": -11.40988540649414, "global_step": 508587, "epoch": 3027} {"train_loss": -11.206722259521484, "global_step": 508588, "epoch": 3027} {"train_loss": -11.978041648864746, "global_step": 508589, "epoch": 3027} {"train_loss": -11.45695686340332, "global_step": 508590, "epoch": 3027} {"train_loss": -12.139535903930664, "global_step": 508591, "epoch": 3027} {"train_loss": -11.666468620300293, "global_step": 508592, "epoch": 3027} {"train_loss": -12.429078102111816, "global_step": 508593, "epoch": 3027} {"train_loss": -11.849967956542969, "global_step": 508594, "epoch": 3027} {"train_loss": -12.074047088623047, "global_step": 508595, "epoch": 3027} {"train_loss": -11.937908172607422, "global_step": 508596, "epoch": 3027} {"train_loss": -12.580486297607422, "global_step": 508597, "epoch": 3027} {"train_loss": -12.022998809814453, "global_step": 508598, "epoch": 3027} {"train_loss": -12.331130981445312, "global_step": 508599, "epoch": 3027} {"train_loss": -12.094232559204102, "global_step": 508600, "epoch": 3027} {"train_loss": -12.33758544921875, "global_step": 508601, "epoch": 3027} {"train_loss": -12.404867172241211, "global_step": 508602, "epoch": 3027} {"train_loss": -12.300259590148926, "global_step": 508603, "epoch": 3027} {"train_loss": -12.554994583129883, "global_step": 508604, "epoch": 3027} {"train_loss": -12.352020263671875, "global_step": 508605, "epoch": 3027} {"train_loss": -12.5882568359375, "global_step": 508606, "epoch": 3027} {"train_loss": -12.541430473327637, "global_step": 508607, "epoch": 3027} {"train_loss": -12.621623039245605, "global_step": 508608, "epoch": 3027} {"train_loss": -12.668508529663086, "global_step": 508609, "epoch": 3027} {"train_loss": -12.418807029724121, "global_step": 508610, "epoch": 3027} {"train_loss": -12.856156349182129, "global_step": 508611, "epoch": 3027} {"train_loss": -12.669273376464844, "global_step": 508612, "epoch": 3027} {"train_loss": -12.761693954467773, "global_step": 508613, "epoch": 3027} {"train_loss": -12.62122631072998, "global_step": 508614, "epoch": 3027} {"train_loss": -12.778848648071289, "global_step": 508615, "epoch": 3027} {"train_loss": -12.820545196533203, "global_step": 508616, "epoch": 3027} {"train_loss": -12.481425285339355, "global_step": 508617, "epoch": 3027} {"train_loss": -12.779011726379395, "global_step": 508618, "epoch": 3027} {"train_loss": -12.703001022338867, "global_step": 508619, "epoch": 3027} {"train_loss": -12.823565483093262, "global_step": 508620, "epoch": 3027} {"train_loss": -12.4461669921875, "global_step": 508621, "epoch": 3027} {"train_loss": -12.6995267868042, "global_step": 508622, "epoch": 3027} {"train_loss": -12.679819107055664, "global_step": 508623, "epoch": 3027} {"train_loss": -12.753288269042969, "global_step": 508624, "epoch": 3027} {"train_loss": -12.629075050354004, "global_step": 508625, "epoch": 3027} {"train_loss": -12.789041519165039, "global_step": 508626, "epoch": 3027} {"train_loss": -12.754100799560547, "global_step": 508627, "epoch": 3027} {"train_loss": -12.767394065856934, "global_step": 508628, "epoch": 3027} {"train_loss": -12.697084426879883, "global_step": 508629, "epoch": 3027} {"train_loss": -12.75051498413086, "global_step": 508630, "epoch": 3027} {"train_loss": -12.865415573120117, "global_step": 508631, "epoch": 3027} {"train_loss": -12.81462287902832, "global_step": 508632, "epoch": 3027} {"train_loss": -12.564507484436035, "global_step": 508633, "epoch": 3027} {"train_loss": -12.729877471923828, "global_step": 508634, "epoch": 3027} {"train_loss": -12.841741561889648, "global_step": 508635, "epoch": 3027} {"train_loss": -12.902040481567383, "global_step": 508636, "epoch": 3027} {"train_loss": -12.801689147949219, "global_step": 508637, "epoch": 3027} {"train_loss": -12.647148132324219, "global_step": 508638, "epoch": 3027} {"train_loss": -12.979024887084961, "global_step": 508639, "epoch": 3027} {"train_loss": -12.86779499053955, "global_step": 508640, "epoch": 3027} {"train_loss": -12.644681930541992, "global_step": 508641, "epoch": 3027} {"train_loss": -12.821756362915039, "global_step": 508642, "epoch": 3027} {"train_loss": -12.598007202148438, "global_step": 508643, "epoch": 3027} {"train_loss": -12.808598518371582, "global_step": 508644, "epoch": 3027} {"train_loss": -12.692766189575195, "global_step": 508645, "epoch": 3027} {"train_loss": -12.410632133483887, "global_step": 508646, "epoch": 3027} {"train_loss": -12.989668846130371, "global_step": 508647, "epoch": 3027} {"train_loss": -12.60849666595459, "global_step": 508648, "epoch": 3027} {"train_loss": -12.416967391967773, "global_step": 508649, "epoch": 3027} {"train_loss": -13.053666114807129, "global_step": 508650, "epoch": 3027} {"train_loss": -12.94921588897705, "global_step": 508651, "epoch": 3027} {"train_loss": -12.817920684814453, "global_step": 508652, "epoch": 3027} {"train_loss": -12.982767105102539, "global_step": 508653, "epoch": 3027} {"train_loss": -13.021244049072266, "global_step": 508654, "epoch": 3027} {"train_loss": -12.94072151184082, "global_step": 508655, "epoch": 3027} {"train_loss": -13.016843795776367, "global_step": 508656, "epoch": 3027} {"train_loss": -12.891898155212402, "global_step": 508657, "epoch": 3027} {"train_loss": -12.85224723815918, "global_step": 508658, "epoch": 3027} {"train_loss": -13.070229530334473, "global_step": 508659, "epoch": 3027} {"train_loss": -12.984125137329102, "global_step": 508660, "epoch": 3027} {"train_loss": -12.937929153442383, "global_step": 508661, "epoch": 3027} {"train_loss": -12.77745246887207, "global_step": 508662, "epoch": 3027} {"train_loss": -13.14520263671875, "global_step": 508663, "epoch": 3027} {"train_loss": -12.911140441894531, "global_step": 508664, "epoch": 3027} {"train_loss": -13.133926391601562, "global_step": 508665, "epoch": 3027} {"train_loss": -13.046890258789062, "global_step": 508666, "epoch": 3027} {"train_loss": -13.000706672668457, "global_step": 508667, "epoch": 3027} {"train_loss": -12.709344863891602, "global_step": 508668, "epoch": 3027} {"train_loss": -13.06576919555664, "global_step": 508669, "epoch": 3027} {"train_loss": -12.871877670288086, "global_step": 508670, "epoch": 3027} {"train_loss": -12.723806381225586, "global_step": 508671, "epoch": 3027} {"train_loss": -12.809852600097656, "global_step": 508672, "epoch": 3027} {"train_loss": -13.087202072143555, "global_step": 508673, "epoch": 3027} {"train_loss": -12.841636657714844, "global_step": 508674, "epoch": 3027} {"train_loss": -13.077366828918457, "global_step": 508675, "epoch": 3027} {"train_loss": -12.80007266998291, "global_step": 508676, "epoch": 3027} {"train_loss": -12.94762134552002, "global_step": 508677, "epoch": 3027} {"train_loss": -13.144330978393555, "global_step": 508678, "epoch": 3027} {"train_loss": -12.763202667236328, "global_step": 508679, "epoch": 3027} {"train_loss": -12.822959899902344, "global_step": 508680, "epoch": 3027} {"train_loss": -12.735097885131836, "global_step": 508681, "epoch": 3027} {"train_loss": -12.9524564743042, "global_step": 508682, "epoch": 3027} {"train_loss": -12.537753105163574, "global_step": 508683, "epoch": 3027} {"train_loss": -12.921357154846191, "global_step": 508684, "epoch": 3027} {"train_loss": -12.682476043701172, "global_step": 508685, "epoch": 3027} {"train_loss": -12.856639862060547, "global_step": 508686, "epoch": 3027} {"train_loss": -12.466777801513672, "global_step": 508687, "epoch": 3027} {"train_loss": -12.633523941040039, "global_step": 508688, "epoch": 3027} {"train_loss": -12.954163551330566, "global_step": 508689, "epoch": 3027} {"train_loss": -12.847394943237305, "global_step": 508690, "epoch": 3027} {"train_loss": -12.548467636108398, "global_step": 508691, "epoch": 3027} {"train_loss": -12.786962509155273, "global_step": 508692, "epoch": 3027} {"train_loss": -12.849093437194824, "global_step": 508693, "epoch": 3027} {"train_loss": -12.934255599975586, "global_step": 508694, "epoch": 3027} {"train_loss": -12.609764099121094, "global_step": 508695, "epoch": 3027} {"train_loss": -12.60036849975586, "global_step": 508696, "epoch": 3027} {"train_loss": -12.98672866821289, "global_step": 508697, "epoch": 3027} {"train_loss": -12.755559921264648, "global_step": 508698, "epoch": 3027} {"train_loss": -12.711894989013672, "global_step": 508699, "epoch": 3027} {"train_loss": -12.405855178833008, "global_step": 508700, "epoch": 3027} {"train_loss": -13.23926067352295, "global_step": 508701, "epoch": 3027} {"train_loss": -12.618903160095215, "global_step": 508702, "epoch": 3027} {"train_loss": -12.176940639813742, "global_step": 508703, "epoch": 3027, "val_loss": 317974.375} {"train_loss": -12.02386474609375, "global_step": 508704, "epoch": 3028} {"train_loss": -12.052824020385742, "global_step": 508705, "epoch": 3028} {"train_loss": -12.4685640335083, "global_step": 508706, "epoch": 3028} {"train_loss": -12.850677490234375, "global_step": 508707, "epoch": 3028} {"train_loss": -11.428140640258789, "global_step": 508708, "epoch": 3028} {"train_loss": -11.712339401245117, "global_step": 508709, "epoch": 3028} {"train_loss": -11.677820205688477, "global_step": 508710, "epoch": 3028} {"train_loss": -12.734180450439453, "global_step": 508711, "epoch": 3028} {"train_loss": -11.827959060668945, "global_step": 508712, "epoch": 3028} {"train_loss": -11.991181373596191, "global_step": 508713, "epoch": 3028} {"train_loss": -11.342765808105469, "global_step": 508714, "epoch": 3028} {"train_loss": -12.241305351257324, "global_step": 508715, "epoch": 3028} {"train_loss": -12.498517990112305, "global_step": 508716, "epoch": 3028} {"train_loss": -11.847396850585938, "global_step": 508717, "epoch": 3028} {"train_loss": -11.43156909942627, "global_step": 508718, "epoch": 3028} {"train_loss": -10.606403350830078, "global_step": 508719, "epoch": 3028} {"train_loss": -11.056230545043945, "global_step": 508720, "epoch": 3028} {"train_loss": -11.604917526245117, "global_step": 508721, "epoch": 3028} {"train_loss": -9.527813911437988, "global_step": 508722, "epoch": 3028} {"train_loss": -9.154291152954102, "global_step": 508723, "epoch": 3028} {"train_loss": -11.357471466064453, "global_step": 508724, "epoch": 3028} {"train_loss": -10.768387794494629, "global_step": 508725, "epoch": 3028} {"train_loss": -10.468942642211914, "global_step": 508726, "epoch": 3028} {"train_loss": -11.473464012145996, "global_step": 508727, "epoch": 3028} {"train_loss": -8.847877502441406, "global_step": 508728, "epoch": 3028} {"train_loss": -11.335309982299805, "global_step": 508729, "epoch": 3028} {"train_loss": -11.308955192565918, "global_step": 508730, "epoch": 3028} {"train_loss": -11.237432479858398, "global_step": 508731, "epoch": 3028} {"train_loss": -11.775182723999023, "global_step": 508732, "epoch": 3028} {"train_loss": -10.878700256347656, "global_step": 508733, "epoch": 3028} {"train_loss": -11.490547180175781, "global_step": 508734, "epoch": 3028} {"train_loss": -10.207042694091797, "global_step": 508735, "epoch": 3028} {"train_loss": -11.887374877929688, "global_step": 508736, "epoch": 3028} {"train_loss": -11.053644180297852, "global_step": 508737, "epoch": 3028} {"train_loss": -9.560029029846191, "global_step": 508738, "epoch": 3028} {"train_loss": -10.997834205627441, "global_step": 508739, "epoch": 3028} {"train_loss": -11.051639556884766, "global_step": 508740, "epoch": 3028} {"train_loss": -10.14864730834961, "global_step": 508741, "epoch": 3028} {"train_loss": -11.609224319458008, "global_step": 508742, "epoch": 3028} {"train_loss": -10.695796966552734, "global_step": 508743, "epoch": 3028} {"train_loss": -11.32404899597168, "global_step": 508744, "epoch": 3028} {"train_loss": -11.598519325256348, "global_step": 508745, "epoch": 3028} {"train_loss": -11.547738075256348, "global_step": 508746, "epoch": 3028} {"train_loss": -11.429380416870117, "global_step": 508747, "epoch": 3028} {"train_loss": -11.461027145385742, "global_step": 508748, "epoch": 3028} {"train_loss": -11.294069290161133, "global_step": 508749, "epoch": 3028} {"train_loss": -12.297065734863281, "global_step": 508750, "epoch": 3028} {"train_loss": -11.81904411315918, "global_step": 508751, "epoch": 3028} {"train_loss": -12.236242294311523, "global_step": 508752, "epoch": 3028} {"train_loss": -12.004631042480469, "global_step": 508753, "epoch": 3028} {"train_loss": -11.888128280639648, "global_step": 508754, "epoch": 3028} {"train_loss": -11.936141967773438, "global_step": 508755, "epoch": 3028} {"train_loss": -11.840919494628906, "global_step": 508756, "epoch": 3028} {"train_loss": -12.059732437133789, "global_step": 508757, "epoch": 3028} {"train_loss": -11.697880744934082, "global_step": 508758, "epoch": 3028} {"train_loss": -12.276922225952148, "global_step": 508759, "epoch": 3028} {"train_loss": -11.813126564025879, "global_step": 508760, "epoch": 3028} {"train_loss": -11.539958953857422, "global_step": 508761, "epoch": 3028} {"train_loss": -11.957490921020508, "global_step": 508762, "epoch": 3028} {"train_loss": -11.663778305053711, "global_step": 508763, "epoch": 3028} {"train_loss": -12.155787467956543, "global_step": 508764, "epoch": 3028} {"train_loss": -12.08243179321289, "global_step": 508765, "epoch": 3028} {"train_loss": -12.428854942321777, "global_step": 508766, "epoch": 3028} {"train_loss": -12.096818923950195, "global_step": 508767, "epoch": 3028} {"train_loss": -12.462785720825195, "global_step": 508768, "epoch": 3028} {"train_loss": -11.713584899902344, "global_step": 508769, "epoch": 3028} {"train_loss": -12.115594863891602, "global_step": 508770, "epoch": 3028} {"train_loss": -12.291885375976562, "global_step": 508771, "epoch": 3028} {"train_loss": -12.126225471496582, "global_step": 508772, "epoch": 3028} {"train_loss": -12.203275680541992, "global_step": 508773, "epoch": 3028} {"train_loss": -11.884392738342285, "global_step": 508774, "epoch": 3028} {"train_loss": -12.527692794799805, "global_step": 508775, "epoch": 3028} {"train_loss": -11.18954849243164, "global_step": 508776, "epoch": 3028} {"train_loss": -12.183382034301758, "global_step": 508777, "epoch": 3028} {"train_loss": -11.56896686553955, "global_step": 508778, "epoch": 3028} {"train_loss": -11.843311309814453, "global_step": 508779, "epoch": 3028} {"train_loss": -12.164003372192383, "global_step": 508780, "epoch": 3028} {"train_loss": -11.455832481384277, "global_step": 508781, "epoch": 3028} {"train_loss": -12.03613567352295, "global_step": 508782, "epoch": 3028} {"train_loss": -12.267030715942383, "global_step": 508783, "epoch": 3028} {"train_loss": -11.735069274902344, "global_step": 508784, "epoch": 3028} {"train_loss": -12.273155212402344, "global_step": 508785, "epoch": 3028} {"train_loss": -12.303621292114258, "global_step": 508786, "epoch": 3028} {"train_loss": -11.854279518127441, "global_step": 508787, "epoch": 3028} {"train_loss": -12.659524917602539, "global_step": 508788, "epoch": 3028} {"train_loss": -11.843263626098633, "global_step": 508789, "epoch": 3028} {"train_loss": -12.53973388671875, "global_step": 508790, "epoch": 3028} {"train_loss": -11.851457595825195, "global_step": 508791, "epoch": 3028} {"train_loss": -12.102058410644531, "global_step": 508792, "epoch": 3028} {"train_loss": -12.164877891540527, "global_step": 508793, "epoch": 3028} {"train_loss": -10.804265975952148, "global_step": 508794, "epoch": 3028} {"train_loss": -12.344327926635742, "global_step": 508795, "epoch": 3028} {"train_loss": -10.610363960266113, "global_step": 508796, "epoch": 3028} {"train_loss": -12.11131477355957, "global_step": 508797, "epoch": 3028} {"train_loss": -11.710192680358887, "global_step": 508798, "epoch": 3028} {"train_loss": -10.826107025146484, "global_step": 508799, "epoch": 3028} {"train_loss": -12.153997421264648, "global_step": 508800, "epoch": 3028} {"train_loss": -11.047426223754883, "global_step": 508801, "epoch": 3028} {"train_loss": -12.424028396606445, "global_step": 508802, "epoch": 3028} {"train_loss": -11.687711715698242, "global_step": 508803, "epoch": 3028} {"train_loss": -12.672666549682617, "global_step": 508804, "epoch": 3028} {"train_loss": -11.860625267028809, "global_step": 508805, "epoch": 3028} {"train_loss": -12.10750961303711, "global_step": 508806, "epoch": 3028} {"train_loss": -12.390974044799805, "global_step": 508807, "epoch": 3028} {"train_loss": -12.421695709228516, "global_step": 508808, "epoch": 3028} {"train_loss": -12.522462844848633, "global_step": 508809, "epoch": 3028} {"train_loss": -12.416711807250977, "global_step": 508810, "epoch": 3028} {"train_loss": -12.698604583740234, "global_step": 508811, "epoch": 3028} {"train_loss": -12.446048736572266, "global_step": 508812, "epoch": 3028} {"train_loss": -12.686984062194824, "global_step": 508813, "epoch": 3028} {"train_loss": -12.405362129211426, "global_step": 508814, "epoch": 3028} {"train_loss": -12.715972900390625, "global_step": 508815, "epoch": 3028} {"train_loss": -12.459982872009277, "global_step": 508816, "epoch": 3028} {"train_loss": -12.78095817565918, "global_step": 508817, "epoch": 3028} {"train_loss": -12.44808578491211, "global_step": 508818, "epoch": 3028} {"train_loss": -12.447315216064453, "global_step": 508819, "epoch": 3028} {"train_loss": -12.571029663085938, "global_step": 508820, "epoch": 3028} {"train_loss": -12.591495513916016, "global_step": 508821, "epoch": 3028} {"train_loss": -12.395562171936035, "global_step": 508822, "epoch": 3028} {"train_loss": -12.590835571289062, "global_step": 508823, "epoch": 3028} {"train_loss": -12.441167831420898, "global_step": 508824, "epoch": 3028} {"train_loss": -12.351380348205566, "global_step": 508825, "epoch": 3028} {"train_loss": -12.529401779174805, "global_step": 508826, "epoch": 3028} {"train_loss": -12.323211669921875, "global_step": 508827, "epoch": 3028} {"train_loss": -12.778629302978516, "global_step": 508828, "epoch": 3028} {"train_loss": -12.441300392150879, "global_step": 508829, "epoch": 3028} {"train_loss": -12.75859260559082, "global_step": 508830, "epoch": 3028} {"train_loss": -12.498241424560547, "global_step": 508831, "epoch": 3028} {"train_loss": -12.584187507629395, "global_step": 508832, "epoch": 3028} {"train_loss": -12.606687545776367, "global_step": 508833, "epoch": 3028} {"train_loss": -12.395915985107422, "global_step": 508834, "epoch": 3028} {"train_loss": -12.466432571411133, "global_step": 508835, "epoch": 3028} {"train_loss": -12.916605949401855, "global_step": 508836, "epoch": 3028} {"train_loss": -12.300016403198242, "global_step": 508837, "epoch": 3028} {"train_loss": -12.715947151184082, "global_step": 508838, "epoch": 3028} {"train_loss": -12.561010360717773, "global_step": 508839, "epoch": 3028} {"train_loss": -12.590112686157227, "global_step": 508840, "epoch": 3028} {"train_loss": -12.811980247497559, "global_step": 508841, "epoch": 3028} {"train_loss": -12.638832092285156, "global_step": 508842, "epoch": 3028} {"train_loss": -12.904741287231445, "global_step": 508843, "epoch": 3028} {"train_loss": -12.775118827819824, "global_step": 508844, "epoch": 3028} {"train_loss": -12.722702026367188, "global_step": 508845, "epoch": 3028} {"train_loss": -12.682693481445312, "global_step": 508846, "epoch": 3028} {"train_loss": -12.760814666748047, "global_step": 508847, "epoch": 3028} {"train_loss": -12.781974792480469, "global_step": 508848, "epoch": 3028} {"train_loss": -12.731074333190918, "global_step": 508849, "epoch": 3028} {"train_loss": -12.954240798950195, "global_step": 508850, "epoch": 3028} {"train_loss": -12.879875183105469, "global_step": 508851, "epoch": 3028} {"train_loss": -12.715103149414062, "global_step": 508852, "epoch": 3028} {"train_loss": -12.788652420043945, "global_step": 508853, "epoch": 3028} {"train_loss": -12.850519180297852, "global_step": 508854, "epoch": 3028} {"train_loss": -12.675179481506348, "global_step": 508855, "epoch": 3028} {"train_loss": -12.674248695373535, "global_step": 508856, "epoch": 3028} {"train_loss": -12.791119575500488, "global_step": 508857, "epoch": 3028} {"train_loss": -12.557539939880371, "global_step": 508858, "epoch": 3028} {"train_loss": -12.108667373657227, "global_step": 508859, "epoch": 3028} {"train_loss": -12.671488761901855, "global_step": 508860, "epoch": 3028} {"train_loss": -12.726958274841309, "global_step": 508861, "epoch": 3028} {"train_loss": -12.629167556762695, "global_step": 508862, "epoch": 3028} {"train_loss": -12.814207077026367, "global_step": 508863, "epoch": 3028} {"train_loss": -12.57659912109375, "global_step": 508864, "epoch": 3028} {"train_loss": -12.936179161071777, "global_step": 508865, "epoch": 3028} {"train_loss": -12.921524047851562, "global_step": 508866, "epoch": 3028} {"train_loss": -12.942211151123047, "global_step": 508867, "epoch": 3028} {"train_loss": -12.699041366577148, "global_step": 508868, "epoch": 3028} {"train_loss": -12.671748161315918, "global_step": 508869, "epoch": 3028} {"train_loss": -12.907906532287598, "global_step": 508870, "epoch": 3028} {"train_loss": -12.033492951166062, "global_step": 508871, "epoch": 3028, "val_loss": 313304.15625} {"train_loss": -12.992815017700195, "global_step": 508872, "epoch": 3029} {"train_loss": -13.117090225219727, "global_step": 508873, "epoch": 3029} {"train_loss": -12.95649528503418, "global_step": 508874, "epoch": 3029} {"train_loss": -12.720930099487305, "global_step": 508875, "epoch": 3029} {"train_loss": -13.176475524902344, "global_step": 508876, "epoch": 3029} {"train_loss": -12.81783676147461, "global_step": 508877, "epoch": 3029} {"train_loss": -12.957719802856445, "global_step": 508878, "epoch": 3029} {"train_loss": -12.810455322265625, "global_step": 508879, "epoch": 3029} {"train_loss": -13.008646011352539, "global_step": 508880, "epoch": 3029} {"train_loss": -12.868408203125, "global_step": 508881, "epoch": 3029} {"train_loss": -12.928956985473633, "global_step": 508882, "epoch": 3029} {"train_loss": -12.707283020019531, "global_step": 508883, "epoch": 3029} {"train_loss": -12.698110580444336, "global_step": 508884, "epoch": 3029} {"train_loss": -12.443954467773438, "global_step": 508885, "epoch": 3029} {"train_loss": -12.767602920532227, "global_step": 508886, "epoch": 3029} {"train_loss": -12.57232666015625, "global_step": 508887, "epoch": 3029} {"train_loss": -12.403538703918457, "global_step": 508888, "epoch": 3029} {"train_loss": -12.74846076965332, "global_step": 508889, "epoch": 3029} {"train_loss": -12.591180801391602, "global_step": 508890, "epoch": 3029} {"train_loss": -11.811458587646484, "global_step": 508891, "epoch": 3029} {"train_loss": -12.734309196472168, "global_step": 508892, "epoch": 3029} {"train_loss": -12.64970874786377, "global_step": 508893, "epoch": 3029} {"train_loss": -12.194605827331543, "global_step": 508894, "epoch": 3029} {"train_loss": -12.001206398010254, "global_step": 508895, "epoch": 3029} {"train_loss": -12.66495132446289, "global_step": 508896, "epoch": 3029} {"train_loss": -12.888275146484375, "global_step": 508897, "epoch": 3029} {"train_loss": -12.581474304199219, "global_step": 508898, "epoch": 3029} {"train_loss": -12.741647720336914, "global_step": 508899, "epoch": 3029} {"train_loss": -12.585158348083496, "global_step": 508900, "epoch": 3029} {"train_loss": -12.783479690551758, "global_step": 508901, "epoch": 3029} {"train_loss": -12.645049095153809, "global_step": 508902, "epoch": 3029} {"train_loss": -12.59153938293457, "global_step": 508903, "epoch": 3029} {"train_loss": -12.39063835144043, "global_step": 508904, "epoch": 3029} {"train_loss": -12.63937759399414, "global_step": 508905, "epoch": 3029} {"train_loss": -12.091611862182617, "global_step": 508906, "epoch": 3029} {"train_loss": -11.9827880859375, "global_step": 508907, "epoch": 3029} {"train_loss": -12.211277961730957, "global_step": 508908, "epoch": 3029} {"train_loss": -12.713834762573242, "global_step": 508909, "epoch": 3029} {"train_loss": -12.237554550170898, "global_step": 508910, "epoch": 3029} {"train_loss": -11.494348526000977, "global_step": 508911, "epoch": 3029} {"train_loss": -12.230888366699219, "global_step": 508912, "epoch": 3029} {"train_loss": -12.400918006896973, "global_step": 508913, "epoch": 3029} {"train_loss": -11.748659133911133, "global_step": 508914, "epoch": 3029} {"train_loss": -12.12923526763916, "global_step": 508915, "epoch": 3029} {"train_loss": -12.51356315612793, "global_step": 508916, "epoch": 3029} {"train_loss": -12.143960952758789, "global_step": 508917, "epoch": 3029} {"train_loss": -12.530092239379883, "global_step": 508918, "epoch": 3029} {"train_loss": -12.588813781738281, "global_step": 508919, "epoch": 3029} {"train_loss": -12.329620361328125, "global_step": 508920, "epoch": 3029} {"train_loss": -11.751144409179688, "global_step": 508921, "epoch": 3029} {"train_loss": -12.374902725219727, "global_step": 508922, "epoch": 3029} {"train_loss": -11.227516174316406, "global_step": 508923, "epoch": 3029} {"train_loss": -11.564611434936523, "global_step": 508924, "epoch": 3029} {"train_loss": -12.122775077819824, "global_step": 508925, "epoch": 3029} {"train_loss": -12.20789623260498, "global_step": 508926, "epoch": 3029} {"train_loss": -11.437638282775879, "global_step": 508927, "epoch": 3029} {"train_loss": -11.624488830566406, "global_step": 508928, "epoch": 3029} {"train_loss": -11.420573234558105, "global_step": 508929, "epoch": 3029} {"train_loss": -11.761577606201172, "global_step": 508930, "epoch": 3029} {"train_loss": -11.87877368927002, "global_step": 508931, "epoch": 3029} {"train_loss": -11.52711296081543, "global_step": 508932, "epoch": 3029} {"train_loss": -12.538494110107422, "global_step": 508933, "epoch": 3029} {"train_loss": -12.144933700561523, "global_step": 508934, "epoch": 3029} {"train_loss": -12.150741577148438, "global_step": 508935, "epoch": 3029} {"train_loss": -12.130839347839355, "global_step": 508936, "epoch": 3029} {"train_loss": -12.68082046508789, "global_step": 508937, "epoch": 3029} {"train_loss": -12.302427291870117, "global_step": 508938, "epoch": 3029} {"train_loss": -12.317970275878906, "global_step": 508939, "epoch": 3029} {"train_loss": -12.406289100646973, "global_step": 508940, "epoch": 3029} {"train_loss": -12.067981719970703, "global_step": 508941, "epoch": 3029} {"train_loss": -12.071756362915039, "global_step": 508942, "epoch": 3029} {"train_loss": -12.067916870117188, "global_step": 508943, "epoch": 3029} {"train_loss": -11.274558067321777, "global_step": 508944, "epoch": 3029} {"train_loss": -10.644535064697266, "global_step": 508945, "epoch": 3029} {"train_loss": -11.065534591674805, "global_step": 508946, "epoch": 3029} {"train_loss": -9.848923683166504, "global_step": 508947, "epoch": 3029} {"train_loss": -11.345178604125977, "global_step": 508948, "epoch": 3029} {"train_loss": -11.805747985839844, "global_step": 508949, "epoch": 3029} {"train_loss": -10.902647018432617, "global_step": 508950, "epoch": 3029} {"train_loss": -12.00475788116455, "global_step": 508951, "epoch": 3029} {"train_loss": -10.540507316589355, "global_step": 508952, "epoch": 3029} {"train_loss": -12.036864280700684, "global_step": 508953, "epoch": 3029} {"train_loss": -11.4976167678833, "global_step": 508954, "epoch": 3029} {"train_loss": -10.312150001525879, "global_step": 508955, "epoch": 3029} {"train_loss": -12.251555442810059, "global_step": 508956, "epoch": 3029} {"train_loss": -10.908568382263184, "global_step": 508957, "epoch": 3029} {"train_loss": -11.697718620300293, "global_step": 508958, "epoch": 3029} {"train_loss": -11.61889934539795, "global_step": 508959, "epoch": 3029} {"train_loss": -11.336307525634766, "global_step": 508960, "epoch": 3029} {"train_loss": -11.047581672668457, "global_step": 508961, "epoch": 3029} {"train_loss": -11.886122703552246, "global_step": 508962, "epoch": 3029} {"train_loss": -10.730688095092773, "global_step": 508963, "epoch": 3029} {"train_loss": -11.920221328735352, "global_step": 508964, "epoch": 3029} {"train_loss": -11.131119728088379, "global_step": 508965, "epoch": 3029} {"train_loss": -11.691545486450195, "global_step": 508966, "epoch": 3029} {"train_loss": -11.83265495300293, "global_step": 508967, "epoch": 3029} {"train_loss": -11.452692985534668, "global_step": 508968, "epoch": 3029} {"train_loss": -11.161672592163086, "global_step": 508969, "epoch": 3029} {"train_loss": -12.104503631591797, "global_step": 508970, "epoch": 3029} {"train_loss": -11.067838668823242, "global_step": 508971, "epoch": 3029} {"train_loss": -11.779047012329102, "global_step": 508972, "epoch": 3029} {"train_loss": -11.932313919067383, "global_step": 508973, "epoch": 3029} {"train_loss": -11.46988296508789, "global_step": 508974, "epoch": 3029} {"train_loss": -12.262046813964844, "global_step": 508975, "epoch": 3029} {"train_loss": -11.86330795288086, "global_step": 508976, "epoch": 3029} {"train_loss": -12.395903587341309, "global_step": 508977, "epoch": 3029} {"train_loss": -12.016267776489258, "global_step": 508978, "epoch": 3029} {"train_loss": -12.342095375061035, "global_step": 508979, "epoch": 3029} {"train_loss": -11.75113296508789, "global_step": 508980, "epoch": 3029} {"train_loss": -11.605629920959473, "global_step": 508981, "epoch": 3029} {"train_loss": -11.031991958618164, "global_step": 508982, "epoch": 3029} {"train_loss": -12.29338550567627, "global_step": 508983, "epoch": 3029} {"train_loss": -11.747767448425293, "global_step": 508984, "epoch": 3029} {"train_loss": -11.733861923217773, "global_step": 508985, "epoch": 3029} {"train_loss": -12.232673645019531, "global_step": 508986, "epoch": 3029} {"train_loss": -11.75048828125, "global_step": 508987, "epoch": 3029} {"train_loss": -12.477264404296875, "global_step": 508988, "epoch": 3029} {"train_loss": -11.575929641723633, "global_step": 508989, "epoch": 3029} {"train_loss": -12.24897575378418, "global_step": 508990, "epoch": 3029} {"train_loss": -11.285285949707031, "global_step": 508991, "epoch": 3029} {"train_loss": -12.370140075683594, "global_step": 508992, "epoch": 3029} {"train_loss": -11.598258972167969, "global_step": 508993, "epoch": 3029} {"train_loss": -12.272860527038574, "global_step": 508994, "epoch": 3029} {"train_loss": -12.089483261108398, "global_step": 508995, "epoch": 3029} {"train_loss": -12.696615219116211, "global_step": 508996, "epoch": 3029} {"train_loss": -12.183696746826172, "global_step": 508997, "epoch": 3029} {"train_loss": -12.658392906188965, "global_step": 508998, "epoch": 3029} {"train_loss": -12.358111381530762, "global_step": 508999, "epoch": 3029} {"train_loss": -12.724876403808594, "global_step": 509000, "epoch": 3029} {"train_loss": -12.460053443908691, "global_step": 509001, "epoch": 3029} {"train_loss": -12.751203536987305, "global_step": 509002, "epoch": 3029} {"train_loss": -12.508793830871582, "global_step": 509003, "epoch": 3029} {"train_loss": -12.294361114501953, "global_step": 509004, "epoch": 3029} {"train_loss": -12.496058464050293, "global_step": 509005, "epoch": 3029} {"train_loss": -12.459075927734375, "global_step": 509006, "epoch": 3029} {"train_loss": -12.749282836914062, "global_step": 509007, "epoch": 3029} {"train_loss": -12.405189514160156, "global_step": 509008, "epoch": 3029} {"train_loss": -12.38154125213623, "global_step": 509009, "epoch": 3029} {"train_loss": -12.437378883361816, "global_step": 509010, "epoch": 3029} {"train_loss": -12.542197227478027, "global_step": 509011, "epoch": 3029} {"train_loss": -12.543315887451172, "global_step": 509012, "epoch": 3029} {"train_loss": -12.57470703125, "global_step": 509013, "epoch": 3029} {"train_loss": -12.713724136352539, "global_step": 509014, "epoch": 3029} {"train_loss": -12.768226623535156, "global_step": 509015, "epoch": 3029} {"train_loss": -12.607324600219727, "global_step": 509016, "epoch": 3029} {"train_loss": -12.679072380065918, "global_step": 509017, "epoch": 3029} {"train_loss": -12.466896057128906, "global_step": 509018, "epoch": 3029} {"train_loss": -12.892853736877441, "global_step": 509019, "epoch": 3029} {"train_loss": -12.64792537689209, "global_step": 509020, "epoch": 3029} {"train_loss": -12.792179107666016, "global_step": 509021, "epoch": 3029} {"train_loss": -12.752102851867676, "global_step": 509022, "epoch": 3029} {"train_loss": -12.800296783447266, "global_step": 509023, "epoch": 3029} {"train_loss": -12.669437408447266, "global_step": 509024, "epoch": 3029} {"train_loss": -12.874497413635254, "global_step": 509025, "epoch": 3029} {"train_loss": -12.765457153320312, "global_step": 509026, "epoch": 3029} {"train_loss": -12.703232765197754, "global_step": 509027, "epoch": 3029} {"train_loss": -12.670616149902344, "global_step": 509028, "epoch": 3029} {"train_loss": -12.940164566040039, "global_step": 509029, "epoch": 3029} {"train_loss": -12.825881004333496, "global_step": 509030, "epoch": 3029} {"train_loss": -12.857547760009766, "global_step": 509031, "epoch": 3029} {"train_loss": -12.765185356140137, "global_step": 509032, "epoch": 3029} {"train_loss": -12.83922290802002, "global_step": 509033, "epoch": 3029} {"train_loss": -12.440597534179688, "global_step": 509034, "epoch": 3029} {"train_loss": -12.726289749145508, "global_step": 509035, "epoch": 3029} {"train_loss": -12.2274169921875, "global_step": 509036, "epoch": 3029} {"train_loss": -12.840426445007324, "global_step": 509037, "epoch": 3029} {"train_loss": -12.43377685546875, "global_step": 509038, "epoch": 3029} {"train_loss": -12.19510611465999, "global_step": 509039, "epoch": 3029, "val_loss": 315636.84375} {"train_loss": -12.55726146697998, "global_step": 509040, "epoch": 3030} {"train_loss": -12.648307800292969, "global_step": 509041, "epoch": 3030} {"train_loss": -13.003312110900879, "global_step": 509042, "epoch": 3030} {"train_loss": -12.804326057434082, "global_step": 509043, "epoch": 3030} {"train_loss": -12.620817184448242, "global_step": 509044, "epoch": 3030} {"train_loss": -12.706737518310547, "global_step": 509045, "epoch": 3030} {"train_loss": -12.524980545043945, "global_step": 509046, "epoch": 3030} {"train_loss": -12.94131851196289, "global_step": 509047, "epoch": 3030} {"train_loss": -12.907482147216797, "global_step": 509048, "epoch": 3030} {"train_loss": -12.681425094604492, "global_step": 509049, "epoch": 3030} {"train_loss": -12.759068489074707, "global_step": 509050, "epoch": 3030} {"train_loss": -12.706279754638672, "global_step": 509051, "epoch": 3030} {"train_loss": -12.834295272827148, "global_step": 509052, "epoch": 3030} {"train_loss": -12.690240859985352, "global_step": 509053, "epoch": 3030} {"train_loss": -13.068922996520996, "global_step": 509054, "epoch": 3030} {"train_loss": -12.842689514160156, "global_step": 509055, "epoch": 3030} {"train_loss": -12.740178108215332, "global_step": 509056, "epoch": 3030} {"train_loss": -12.904338836669922, "global_step": 509057, "epoch": 3030} {"train_loss": -12.83735466003418, "global_step": 509058, "epoch": 3030} {"train_loss": -12.828693389892578, "global_step": 509059, "epoch": 3030} {"train_loss": -12.933368682861328, "global_step": 509060, "epoch": 3030} {"train_loss": -12.80396842956543, "global_step": 509061, "epoch": 3030} {"train_loss": -13.109502792358398, "global_step": 509062, "epoch": 3030} {"train_loss": -12.998457908630371, "global_step": 509063, "epoch": 3030} {"train_loss": -12.737836837768555, "global_step": 509064, "epoch": 3030} {"train_loss": -12.72823429107666, "global_step": 509065, "epoch": 3030} {"train_loss": -12.884413719177246, "global_step": 509066, "epoch": 3030} {"train_loss": -12.694032669067383, "global_step": 509067, "epoch": 3030} {"train_loss": -12.75330638885498, "global_step": 509068, "epoch": 3030} {"train_loss": -12.670032501220703, "global_step": 509069, "epoch": 3030} {"train_loss": -12.319643020629883, "global_step": 509070, "epoch": 3030} {"train_loss": -12.679808616638184, "global_step": 509071, "epoch": 3030} {"train_loss": -12.501852035522461, "global_step": 509072, "epoch": 3030} {"train_loss": -12.40350341796875, "global_step": 509073, "epoch": 3030} {"train_loss": -12.067012786865234, "global_step": 509074, "epoch": 3030} {"train_loss": -12.910677909851074, "global_step": 509075, "epoch": 3030} {"train_loss": -12.332012176513672, "global_step": 509076, "epoch": 3030} {"train_loss": -12.634035110473633, "global_step": 509077, "epoch": 3030} {"train_loss": -13.106450080871582, "global_step": 509078, "epoch": 3030} {"train_loss": -12.599388122558594, "global_step": 509079, "epoch": 3030} {"train_loss": -12.718561172485352, "global_step": 509080, "epoch": 3030} {"train_loss": -12.714277267456055, "global_step": 509081, "epoch": 3030} {"train_loss": -12.94699764251709, "global_step": 509082, "epoch": 3030} {"train_loss": -12.396875381469727, "global_step": 509083, "epoch": 3030} {"train_loss": -12.991606712341309, "global_step": 509084, "epoch": 3030} {"train_loss": -12.869487762451172, "global_step": 509085, "epoch": 3030} {"train_loss": -12.59719467163086, "global_step": 509086, "epoch": 3030} {"train_loss": -12.848426818847656, "global_step": 509087, "epoch": 3030} {"train_loss": -12.669052124023438, "global_step": 509088, "epoch": 3030} {"train_loss": -12.642566680908203, "global_step": 509089, "epoch": 3030} {"train_loss": -12.888814926147461, "global_step": 509090, "epoch": 3030} {"train_loss": -13.079615592956543, "global_step": 509091, "epoch": 3030} {"train_loss": -12.417823791503906, "global_step": 509092, "epoch": 3030} {"train_loss": -12.90447998046875, "global_step": 509093, "epoch": 3030} {"train_loss": -12.751848220825195, "global_step": 509094, "epoch": 3030} {"train_loss": -13.025005340576172, "global_step": 509095, "epoch": 3030} {"train_loss": -12.62828254699707, "global_step": 509096, "epoch": 3030} {"train_loss": -12.641744613647461, "global_step": 509097, "epoch": 3030} {"train_loss": -12.621850967407227, "global_step": 509098, "epoch": 3030} {"train_loss": -12.458990097045898, "global_step": 509099, "epoch": 3030} {"train_loss": -12.871232986450195, "global_step": 509100, "epoch": 3030} {"train_loss": -12.546499252319336, "global_step": 509101, "epoch": 3030} {"train_loss": -11.315530776977539, "global_step": 509102, "epoch": 3030} {"train_loss": -11.883382797241211, "global_step": 509103, "epoch": 3030} {"train_loss": -12.286983489990234, "global_step": 509104, "epoch": 3030} {"train_loss": -10.343008041381836, "global_step": 509105, "epoch": 3030} {"train_loss": -11.266575813293457, "global_step": 509106, "epoch": 3030} {"train_loss": -12.065065383911133, "global_step": 509107, "epoch": 3030} {"train_loss": -11.894288063049316, "global_step": 509108, "epoch": 3030} {"train_loss": -11.825997352600098, "global_step": 509109, "epoch": 3030} {"train_loss": -11.540879249572754, "global_step": 509110, "epoch": 3030} {"train_loss": -11.393621444702148, "global_step": 509111, "epoch": 3030} {"train_loss": -12.831725120544434, "global_step": 509112, "epoch": 3030} {"train_loss": -10.992652893066406, "global_step": 509113, "epoch": 3030} {"train_loss": -12.630062103271484, "global_step": 509114, "epoch": 3030} {"train_loss": -11.682503700256348, "global_step": 509115, "epoch": 3030} {"train_loss": -11.644700050354004, "global_step": 509116, "epoch": 3030} {"train_loss": -11.746150016784668, "global_step": 509117, "epoch": 3030} {"train_loss": -11.239134788513184, "global_step": 509118, "epoch": 3030} {"train_loss": -10.231188774108887, "global_step": 509119, "epoch": 3030} {"train_loss": -11.650415420532227, "global_step": 509120, "epoch": 3030} {"train_loss": -11.278635025024414, "global_step": 509121, "epoch": 3030} {"train_loss": -11.521039009094238, "global_step": 509122, "epoch": 3030} {"train_loss": -11.117973327636719, "global_step": 509123, "epoch": 3030} {"train_loss": -11.259525299072266, "global_step": 509124, "epoch": 3030} {"train_loss": -11.712846755981445, "global_step": 509125, "epoch": 3030} {"train_loss": -10.788440704345703, "global_step": 509126, "epoch": 3030} {"train_loss": -12.41610336303711, "global_step": 509127, "epoch": 3030} {"train_loss": -10.948348999023438, "global_step": 509128, "epoch": 3030} {"train_loss": -11.970417022705078, "global_step": 509129, "epoch": 3030} {"train_loss": -12.003141403198242, "global_step": 509130, "epoch": 3030} {"train_loss": -10.553092002868652, "global_step": 509131, "epoch": 3030} {"train_loss": -11.797428131103516, "global_step": 509132, "epoch": 3030} {"train_loss": -11.398162841796875, "global_step": 509133, "epoch": 3030} {"train_loss": -11.860355377197266, "global_step": 509134, "epoch": 3030} {"train_loss": -11.589324951171875, "global_step": 509135, "epoch": 3030} {"train_loss": -11.286505699157715, "global_step": 509136, "epoch": 3030} {"train_loss": -12.267333984375, "global_step": 509137, "epoch": 3030} {"train_loss": -10.731010437011719, "global_step": 509138, "epoch": 3030} {"train_loss": -12.011093139648438, "global_step": 509139, "epoch": 3030} {"train_loss": -10.985458374023438, "global_step": 509140, "epoch": 3030} {"train_loss": -11.117526054382324, "global_step": 509141, "epoch": 3030} {"train_loss": -11.94642448425293, "global_step": 509142, "epoch": 3030} {"train_loss": -11.934429168701172, "global_step": 509143, "epoch": 3030} {"train_loss": -11.960396766662598, "global_step": 509144, "epoch": 3030} {"train_loss": -11.952138900756836, "global_step": 509145, "epoch": 3030} {"train_loss": -12.08712387084961, "global_step": 509146, "epoch": 3030} {"train_loss": -12.503899574279785, "global_step": 509147, "epoch": 3030} {"train_loss": -12.450275421142578, "global_step": 509148, "epoch": 3030} {"train_loss": -12.226638793945312, "global_step": 509149, "epoch": 3030} {"train_loss": -12.518759727478027, "global_step": 509150, "epoch": 3030} {"train_loss": -12.44658374786377, "global_step": 509151, "epoch": 3030} {"train_loss": -12.66177749633789, "global_step": 509152, "epoch": 3030} {"train_loss": -12.154777526855469, "global_step": 509153, "epoch": 3030} {"train_loss": -12.607694625854492, "global_step": 509154, "epoch": 3030} {"train_loss": -12.458438873291016, "global_step": 509155, "epoch": 3030} {"train_loss": -12.562379837036133, "global_step": 509156, "epoch": 3030} {"train_loss": -12.605818748474121, "global_step": 509157, "epoch": 3030} {"train_loss": -12.499748229980469, "global_step": 509158, "epoch": 3030} {"train_loss": -12.44494915008545, "global_step": 509159, "epoch": 3030} {"train_loss": -12.695795059204102, "global_step": 509160, "epoch": 3030} {"train_loss": -12.487472534179688, "global_step": 509161, "epoch": 3030} {"train_loss": -12.342428207397461, "global_step": 509162, "epoch": 3030} {"train_loss": -12.715047836303711, "global_step": 509163, "epoch": 3030} {"train_loss": -12.281695365905762, "global_step": 509164, "epoch": 3030} {"train_loss": -12.488237380981445, "global_step": 509165, "epoch": 3030} {"train_loss": -12.565292358398438, "global_step": 509166, "epoch": 3030} {"train_loss": -12.230103492736816, "global_step": 509167, "epoch": 3030} {"train_loss": -12.724754333496094, "global_step": 509168, "epoch": 3030} {"train_loss": -11.808205604553223, "global_step": 509169, "epoch": 3030} {"train_loss": -12.909967422485352, "global_step": 509170, "epoch": 3030} {"train_loss": -12.110198974609375, "global_step": 509171, "epoch": 3030} {"train_loss": -12.179800033569336, "global_step": 509172, "epoch": 3030} {"train_loss": -12.221495628356934, "global_step": 509173, "epoch": 3030} {"train_loss": -12.279454231262207, "global_step": 509174, "epoch": 3030} {"train_loss": -12.484987258911133, "global_step": 509175, "epoch": 3030} {"train_loss": -12.239989280700684, "global_step": 509176, "epoch": 3030} {"train_loss": -12.56540584564209, "global_step": 509177, "epoch": 3030} {"train_loss": -12.15279769897461, "global_step": 509178, "epoch": 3030} {"train_loss": -12.491077423095703, "global_step": 509179, "epoch": 3030} {"train_loss": -12.272775650024414, "global_step": 509180, "epoch": 3030} {"train_loss": -12.332350730895996, "global_step": 509181, "epoch": 3030} {"train_loss": -12.562585830688477, "global_step": 509182, "epoch": 3030} {"train_loss": -12.132658004760742, "global_step": 509183, "epoch": 3030} {"train_loss": -12.561068534851074, "global_step": 509184, "epoch": 3030} {"train_loss": -12.57989501953125, "global_step": 509185, "epoch": 3030} {"train_loss": -12.683460235595703, "global_step": 509186, "epoch": 3030} {"train_loss": -12.343250274658203, "global_step": 509187, "epoch": 3030} {"train_loss": -12.251304626464844, "global_step": 509188, "epoch": 3030} {"train_loss": -12.893077850341797, "global_step": 509189, "epoch": 3030} {"train_loss": -12.098213195800781, "global_step": 509190, "epoch": 3030} {"train_loss": -12.51559066772461, "global_step": 509191, "epoch": 3030} {"train_loss": -12.510174751281738, "global_step": 509192, "epoch": 3030} {"train_loss": -12.250511169433594, "global_step": 509193, "epoch": 3030} {"train_loss": -12.434810638427734, "global_step": 509194, "epoch": 3030} {"train_loss": -12.706670761108398, "global_step": 509195, "epoch": 3030} {"train_loss": -12.477348327636719, "global_step": 509196, "epoch": 3030} {"train_loss": -12.448751449584961, "global_step": 509197, "epoch": 3030} {"train_loss": -12.538609504699707, "global_step": 509198, "epoch": 3030} {"train_loss": -12.543985366821289, "global_step": 509199, "epoch": 3030} {"train_loss": -12.729705810546875, "global_step": 509200, "epoch": 3030} {"train_loss": -12.755322456359863, "global_step": 509201, "epoch": 3030} {"train_loss": -12.74819278717041, "global_step": 509202, "epoch": 3030} {"train_loss": -12.471441268920898, "global_step": 509203, "epoch": 3030} {"train_loss": -13.008493423461914, "global_step": 509204, "epoch": 3030} {"train_loss": -12.617096900939941, "global_step": 509205, "epoch": 3030} {"train_loss": -12.967394828796387, "global_step": 509206, "epoch": 3030} {"train_loss": -12.331583755356926, "global_step": 509207, "epoch": 3030, "val_loss": 319784.03125, "train_action_mse_error": 1.7011895179748535} {"train_loss": -12.878266334533691, "global_step": 509208, "epoch": 3031} {"train_loss": -12.390475273132324, "global_step": 509209, "epoch": 3031} {"train_loss": -12.838092803955078, "global_step": 509210, "epoch": 3031} {"train_loss": -12.521173477172852, "global_step": 509211, "epoch": 3031} {"train_loss": -12.584575653076172, "global_step": 509212, "epoch": 3031} {"train_loss": -12.775564193725586, "global_step": 509213, "epoch": 3031} {"train_loss": -12.215852737426758, "global_step": 509214, "epoch": 3031} {"train_loss": -12.799367904663086, "global_step": 509215, "epoch": 3031} {"train_loss": -12.211299896240234, "global_step": 509216, "epoch": 3031} {"train_loss": -12.520769119262695, "global_step": 509217, "epoch": 3031} {"train_loss": -12.565208435058594, "global_step": 509218, "epoch": 3031} {"train_loss": -12.078757286071777, "global_step": 509219, "epoch": 3031} {"train_loss": -12.571402549743652, "global_step": 509220, "epoch": 3031} {"train_loss": -11.32826042175293, "global_step": 509221, "epoch": 3031} {"train_loss": -11.031060218811035, "global_step": 509222, "epoch": 3031} {"train_loss": -12.305843353271484, "global_step": 509223, "epoch": 3031} {"train_loss": -10.961891174316406, "global_step": 509224, "epoch": 3031} {"train_loss": -11.80337905883789, "global_step": 509225, "epoch": 3031} {"train_loss": -11.62126350402832, "global_step": 509226, "epoch": 3031} {"train_loss": -12.315641403198242, "global_step": 509227, "epoch": 3031} {"train_loss": -11.750714302062988, "global_step": 509228, "epoch": 3031} {"train_loss": -12.456903457641602, "global_step": 509229, "epoch": 3031} {"train_loss": -11.943535804748535, "global_step": 509230, "epoch": 3031} {"train_loss": -11.900273323059082, "global_step": 509231, "epoch": 3031} {"train_loss": -12.24417495727539, "global_step": 509232, "epoch": 3031} {"train_loss": -11.878399848937988, "global_step": 509233, "epoch": 3031} {"train_loss": -12.179159164428711, "global_step": 509234, "epoch": 3031} {"train_loss": -11.853121757507324, "global_step": 509235, "epoch": 3031} {"train_loss": -12.169489860534668, "global_step": 509236, "epoch": 3031} {"train_loss": -12.724569320678711, "global_step": 509237, "epoch": 3031} {"train_loss": -11.541754722595215, "global_step": 509238, "epoch": 3031} {"train_loss": -11.930988311767578, "global_step": 509239, "epoch": 3031} {"train_loss": -12.11186695098877, "global_step": 509240, "epoch": 3031} {"train_loss": -12.037249565124512, "global_step": 509241, "epoch": 3031} {"train_loss": -11.988718032836914, "global_step": 509242, "epoch": 3031} {"train_loss": -12.385564804077148, "global_step": 509243, "epoch": 3031} {"train_loss": -12.198507308959961, "global_step": 509244, "epoch": 3031} {"train_loss": -12.375450134277344, "global_step": 509245, "epoch": 3031} {"train_loss": -12.498173713684082, "global_step": 509246, "epoch": 3031} {"train_loss": -12.353179931640625, "global_step": 509247, "epoch": 3031} {"train_loss": -12.403695106506348, "global_step": 509248, "epoch": 3031} {"train_loss": -12.361422538757324, "global_step": 509249, "epoch": 3031} {"train_loss": -12.597437858581543, "global_step": 509250, "epoch": 3031} {"train_loss": -12.724798202514648, "global_step": 509251, "epoch": 3031} {"train_loss": -12.54481315612793, "global_step": 509252, "epoch": 3031} {"train_loss": -12.791356086730957, "global_step": 509253, "epoch": 3031} {"train_loss": -12.35191535949707, "global_step": 509254, "epoch": 3031} {"train_loss": -12.781935691833496, "global_step": 509255, "epoch": 3031} {"train_loss": -12.685929298400879, "global_step": 509256, "epoch": 3031} {"train_loss": -12.508560180664062, "global_step": 509257, "epoch": 3031} {"train_loss": -12.682132720947266, "global_step": 509258, "epoch": 3031} {"train_loss": -12.468074798583984, "global_step": 509259, "epoch": 3031} {"train_loss": -12.787107467651367, "global_step": 509260, "epoch": 3031} {"train_loss": -12.293704986572266, "global_step": 509261, "epoch": 3031} {"train_loss": -12.533750534057617, "global_step": 509262, "epoch": 3031} {"train_loss": -12.652411460876465, "global_step": 509263, "epoch": 3031} {"train_loss": -12.627201080322266, "global_step": 509264, "epoch": 3031} {"train_loss": -12.721624374389648, "global_step": 509265, "epoch": 3031} {"train_loss": -12.627263069152832, "global_step": 509266, "epoch": 3031} {"train_loss": -12.411853790283203, "global_step": 509267, "epoch": 3031} {"train_loss": -12.893150329589844, "global_step": 509268, "epoch": 3031} {"train_loss": -12.356752395629883, "global_step": 509269, "epoch": 3031} {"train_loss": -12.540141105651855, "global_step": 509270, "epoch": 3031} {"train_loss": -12.231292724609375, "global_step": 509271, "epoch": 3031} {"train_loss": -12.427948951721191, "global_step": 509272, "epoch": 3031} {"train_loss": -12.748318672180176, "global_step": 509273, "epoch": 3031} {"train_loss": -12.268669128417969, "global_step": 509274, "epoch": 3031} {"train_loss": -12.633319854736328, "global_step": 509275, "epoch": 3031} {"train_loss": -12.137994766235352, "global_step": 509276, "epoch": 3031} {"train_loss": -11.385807037353516, "global_step": 509277, "epoch": 3031} {"train_loss": -11.76128101348877, "global_step": 509278, "epoch": 3031} {"train_loss": -11.382223129272461, "global_step": 509279, "epoch": 3031} {"train_loss": -11.267152786254883, "global_step": 509280, "epoch": 3031} {"train_loss": -11.425483703613281, "global_step": 509281, "epoch": 3031} {"train_loss": -12.197460174560547, "global_step": 509282, "epoch": 3031} {"train_loss": -11.670537948608398, "global_step": 509283, "epoch": 3031} {"train_loss": -12.444987297058105, "global_step": 509284, "epoch": 3031} {"train_loss": -11.421923637390137, "global_step": 509285, "epoch": 3031} {"train_loss": -12.59430980682373, "global_step": 509286, "epoch": 3031} {"train_loss": -11.24475383758545, "global_step": 509287, "epoch": 3031} {"train_loss": -12.467860221862793, "global_step": 509288, "epoch": 3031} {"train_loss": -11.504494667053223, "global_step": 509289, "epoch": 3031} {"train_loss": -12.407442092895508, "global_step": 509290, "epoch": 3031} {"train_loss": -12.12934684753418, "global_step": 509291, "epoch": 3031} {"train_loss": -12.23221492767334, "global_step": 509292, "epoch": 3031} {"train_loss": -12.660187721252441, "global_step": 509293, "epoch": 3031} {"train_loss": -12.038392066955566, "global_step": 509294, "epoch": 3031} {"train_loss": -12.654441833496094, "global_step": 509295, "epoch": 3031} {"train_loss": -12.319318771362305, "global_step": 509296, "epoch": 3031} {"train_loss": -12.1774320602417, "global_step": 509297, "epoch": 3031} {"train_loss": -12.107166290283203, "global_step": 509298, "epoch": 3031} {"train_loss": -12.165191650390625, "global_step": 509299, "epoch": 3031} {"train_loss": -11.01248550415039, "global_step": 509300, "epoch": 3031} {"train_loss": -12.529754638671875, "global_step": 509301, "epoch": 3031} {"train_loss": -11.448128700256348, "global_step": 509302, "epoch": 3031} {"train_loss": -11.94540023803711, "global_step": 509303, "epoch": 3031} {"train_loss": -12.658773422241211, "global_step": 509304, "epoch": 3031} {"train_loss": -11.233967781066895, "global_step": 509305, "epoch": 3031} {"train_loss": -12.262825965881348, "global_step": 509306, "epoch": 3031} {"train_loss": -11.341093063354492, "global_step": 509307, "epoch": 3031} {"train_loss": -11.189188003540039, "global_step": 509308, "epoch": 3031} {"train_loss": -11.482791900634766, "global_step": 509309, "epoch": 3031} {"train_loss": -12.305707931518555, "global_step": 509310, "epoch": 3031} {"train_loss": -12.015478134155273, "global_step": 509311, "epoch": 3031} {"train_loss": -12.166748046875, "global_step": 509312, "epoch": 3031} {"train_loss": -12.580781936645508, "global_step": 509313, "epoch": 3031} {"train_loss": -11.879146575927734, "global_step": 509314, "epoch": 3031} {"train_loss": -12.602814674377441, "global_step": 509315, "epoch": 3031} {"train_loss": -12.526670455932617, "global_step": 509316, "epoch": 3031} {"train_loss": -12.73675537109375, "global_step": 509317, "epoch": 3031} {"train_loss": -12.566458702087402, "global_step": 509318, "epoch": 3031} {"train_loss": -12.411161422729492, "global_step": 509319, "epoch": 3031} {"train_loss": -12.587665557861328, "global_step": 509320, "epoch": 3031} {"train_loss": -12.491584777832031, "global_step": 509321, "epoch": 3031} {"train_loss": -12.623547554016113, "global_step": 509322, "epoch": 3031} {"train_loss": -12.20349407196045, "global_step": 509323, "epoch": 3031} {"train_loss": -12.537264823913574, "global_step": 509324, "epoch": 3031} {"train_loss": -12.190360069274902, "global_step": 509325, "epoch": 3031} {"train_loss": -12.743096351623535, "global_step": 509326, "epoch": 3031} {"train_loss": -12.223040580749512, "global_step": 509327, "epoch": 3031} {"train_loss": -12.554559707641602, "global_step": 509328, "epoch": 3031} {"train_loss": -12.387910842895508, "global_step": 509329, "epoch": 3031} {"train_loss": -12.585132598876953, "global_step": 509330, "epoch": 3031} {"train_loss": -12.540539741516113, "global_step": 509331, "epoch": 3031} {"train_loss": -12.549588203430176, "global_step": 509332, "epoch": 3031} {"train_loss": -12.225011825561523, "global_step": 509333, "epoch": 3031} {"train_loss": -12.696434020996094, "global_step": 509334, "epoch": 3031} {"train_loss": -12.678014755249023, "global_step": 509335, "epoch": 3031} {"train_loss": -12.484764099121094, "global_step": 509336, "epoch": 3031} {"train_loss": -12.804576873779297, "global_step": 509337, "epoch": 3031} {"train_loss": -12.513301849365234, "global_step": 509338, "epoch": 3031} {"train_loss": -12.800028800964355, "global_step": 509339, "epoch": 3031} {"train_loss": -12.487722396850586, "global_step": 509340, "epoch": 3031} {"train_loss": -12.725172996520996, "global_step": 509341, "epoch": 3031} {"train_loss": -12.628747940063477, "global_step": 509342, "epoch": 3031} {"train_loss": -12.85928726196289, "global_step": 509343, "epoch": 3031} {"train_loss": -12.619385719299316, "global_step": 509344, "epoch": 3031} {"train_loss": -12.718606948852539, "global_step": 509345, "epoch": 3031} {"train_loss": -12.59943675994873, "global_step": 509346, "epoch": 3031} {"train_loss": -13.013705253601074, "global_step": 509347, "epoch": 3031} {"train_loss": -12.608101844787598, "global_step": 509348, "epoch": 3031} {"train_loss": -12.506027221679688, "global_step": 509349, "epoch": 3031} {"train_loss": -12.698923110961914, "global_step": 509350, "epoch": 3031} {"train_loss": -12.73923397064209, "global_step": 509351, "epoch": 3031} {"train_loss": -12.90800952911377, "global_step": 509352, "epoch": 3031} {"train_loss": -12.929309844970703, "global_step": 509353, "epoch": 3031} {"train_loss": -12.6843843460083, "global_step": 509354, "epoch": 3031} {"train_loss": -12.547748565673828, "global_step": 509355, "epoch": 3031} {"train_loss": -12.991983413696289, "global_step": 509356, "epoch": 3031} {"train_loss": -12.560178756713867, "global_step": 509357, "epoch": 3031} {"train_loss": -12.898972511291504, "global_step": 509358, "epoch": 3031} {"train_loss": -12.77241325378418, "global_step": 509359, "epoch": 3031} {"train_loss": -12.54574203491211, "global_step": 509360, "epoch": 3031} {"train_loss": -12.283086776733398, "global_step": 509361, "epoch": 3031} {"train_loss": -12.98822021484375, "global_step": 509362, "epoch": 3031} {"train_loss": -12.729862213134766, "global_step": 509363, "epoch": 3031} {"train_loss": -12.97981071472168, "global_step": 509364, "epoch": 3031} {"train_loss": -12.928291320800781, "global_step": 509365, "epoch": 3031} {"train_loss": -12.807052612304688, "global_step": 509366, "epoch": 3031} {"train_loss": -12.845661163330078, "global_step": 509367, "epoch": 3031} {"train_loss": -12.904897689819336, "global_step": 509368, "epoch": 3031} {"train_loss": -12.624778747558594, "global_step": 509369, "epoch": 3031} {"train_loss": -12.29990005493164, "global_step": 509370, "epoch": 3031} {"train_loss": -12.739026069641113, "global_step": 509371, "epoch": 3031} {"train_loss": -13.004058837890625, "global_step": 509372, "epoch": 3031} {"train_loss": -12.953826904296875, "global_step": 509373, "epoch": 3031} {"train_loss": -12.998306274414062, "global_step": 509374, "epoch": 3031} {"train_loss": -12.361020042782737, "global_step": 509375, "epoch": 3031, "val_loss": 318224.0} {"train_loss": -12.642274856567383, "global_step": 509376, "epoch": 3032} {"train_loss": -12.617278099060059, "global_step": 509377, "epoch": 3032} {"train_loss": -12.855052947998047, "global_step": 509378, "epoch": 3032} {"train_loss": -13.021726608276367, "global_step": 509379, "epoch": 3032} {"train_loss": -12.971827507019043, "global_step": 509380, "epoch": 3032} {"train_loss": -12.942693710327148, "global_step": 509381, "epoch": 3032} {"train_loss": -12.583532333374023, "global_step": 509382, "epoch": 3032} {"train_loss": -12.510828971862793, "global_step": 509383, "epoch": 3032} {"train_loss": -12.862785339355469, "global_step": 509384, "epoch": 3032} {"train_loss": -12.882972717285156, "global_step": 509385, "epoch": 3032} {"train_loss": -12.607857704162598, "global_step": 509386, "epoch": 3032} {"train_loss": -12.9135160446167, "global_step": 509387, "epoch": 3032} {"train_loss": -12.884025573730469, "global_step": 509388, "epoch": 3032} {"train_loss": -12.813838005065918, "global_step": 509389, "epoch": 3032} {"train_loss": -12.76645278930664, "global_step": 509390, "epoch": 3032} {"train_loss": -13.018501281738281, "global_step": 509391, "epoch": 3032} {"train_loss": -12.877588272094727, "global_step": 509392, "epoch": 3032} {"train_loss": -12.75992202758789, "global_step": 509393, "epoch": 3032} {"train_loss": -13.002283096313477, "global_step": 509394, "epoch": 3032} {"train_loss": -12.378082275390625, "global_step": 509395, "epoch": 3032} {"train_loss": -12.40280818939209, "global_step": 509396, "epoch": 3032} {"train_loss": -12.618776321411133, "global_step": 509397, "epoch": 3032} {"train_loss": -12.811229705810547, "global_step": 509398, "epoch": 3032} {"train_loss": -12.094554901123047, "global_step": 509399, "epoch": 3032} {"train_loss": -12.541204452514648, "global_step": 509400, "epoch": 3032} {"train_loss": -11.856521606445312, "global_step": 509401, "epoch": 3032} {"train_loss": -10.58316421508789, "global_step": 509402, "epoch": 3032} {"train_loss": -11.962997436523438, "global_step": 509403, "epoch": 3032} {"train_loss": -11.482272148132324, "global_step": 509404, "epoch": 3032} {"train_loss": -9.907247543334961, "global_step": 509405, "epoch": 3032} {"train_loss": -11.392223358154297, "global_step": 509406, "epoch": 3032} {"train_loss": -8.254192352294922, "global_step": 509407, "epoch": 3032} {"train_loss": -11.374345779418945, "global_step": 509408, "epoch": 3032} {"train_loss": -11.339948654174805, "global_step": 509409, "epoch": 3032} {"train_loss": -9.794940948486328, "global_step": 509410, "epoch": 3032} {"train_loss": -10.972314834594727, "global_step": 509411, "epoch": 3032} {"train_loss": -11.081241607666016, "global_step": 509412, "epoch": 3032} {"train_loss": -10.453042984008789, "global_step": 509413, "epoch": 3032} {"train_loss": -11.17575740814209, "global_step": 509414, "epoch": 3032} {"train_loss": -9.269447326660156, "global_step": 509415, "epoch": 3032} {"train_loss": -9.896097183227539, "global_step": 509416, "epoch": 3032} {"train_loss": -10.93653678894043, "global_step": 509417, "epoch": 3032} {"train_loss": -10.29536247253418, "global_step": 509418, "epoch": 3032} {"train_loss": -10.19880485534668, "global_step": 509419, "epoch": 3032} {"train_loss": -10.802654266357422, "global_step": 509420, "epoch": 3032} {"train_loss": -10.685773849487305, "global_step": 509421, "epoch": 3032} {"train_loss": -10.965645790100098, "global_step": 509422, "epoch": 3032} {"train_loss": -11.41728401184082, "global_step": 509423, "epoch": 3032} {"train_loss": -10.71945571899414, "global_step": 509424, "epoch": 3032} {"train_loss": -10.850635528564453, "global_step": 509425, "epoch": 3032} {"train_loss": -11.17994499206543, "global_step": 509426, "epoch": 3032} {"train_loss": -10.762384414672852, "global_step": 509427, "epoch": 3032} {"train_loss": -10.226580619812012, "global_step": 509428, "epoch": 3032} {"train_loss": -11.26541805267334, "global_step": 509429, "epoch": 3032} {"train_loss": -10.490924835205078, "global_step": 509430, "epoch": 3032} {"train_loss": -11.578536987304688, "global_step": 509431, "epoch": 3032} {"train_loss": -10.325435638427734, "global_step": 509432, "epoch": 3032} {"train_loss": -11.248025894165039, "global_step": 509433, "epoch": 3032} {"train_loss": -10.358555793762207, "global_step": 509434, "epoch": 3032} {"train_loss": -11.597977638244629, "global_step": 509435, "epoch": 3032} {"train_loss": -11.01425552368164, "global_step": 509436, "epoch": 3032} {"train_loss": -10.554621696472168, "global_step": 509437, "epoch": 3032} {"train_loss": -11.266834259033203, "global_step": 509438, "epoch": 3032} {"train_loss": -11.255719184875488, "global_step": 509439, "epoch": 3032} {"train_loss": -10.794281959533691, "global_step": 509440, "epoch": 3032} {"train_loss": -11.53635311126709, "global_step": 509441, "epoch": 3032} {"train_loss": -11.573325157165527, "global_step": 509442, "epoch": 3032} {"train_loss": -11.425546646118164, "global_step": 509443, "epoch": 3032} {"train_loss": -11.560196876525879, "global_step": 509444, "epoch": 3032} {"train_loss": -12.03288459777832, "global_step": 509445, "epoch": 3032} {"train_loss": -11.715967178344727, "global_step": 509446, "epoch": 3032} {"train_loss": -12.477787017822266, "global_step": 509447, "epoch": 3032} {"train_loss": -11.467561721801758, "global_step": 509448, "epoch": 3032} {"train_loss": -12.217819213867188, "global_step": 509449, "epoch": 3032} {"train_loss": -11.86043930053711, "global_step": 509450, "epoch": 3032} {"train_loss": -12.002882957458496, "global_step": 509451, "epoch": 3032} {"train_loss": -12.315299034118652, "global_step": 509452, "epoch": 3032} {"train_loss": -12.233274459838867, "global_step": 509453, "epoch": 3032} {"train_loss": -12.34107780456543, "global_step": 509454, "epoch": 3032} {"train_loss": -12.28641414642334, "global_step": 509455, "epoch": 3032} {"train_loss": -12.316271781921387, "global_step": 509456, "epoch": 3032} {"train_loss": -12.305871963500977, "global_step": 509457, "epoch": 3032} {"train_loss": -12.049477577209473, "global_step": 509458, "epoch": 3032} {"train_loss": -12.594398498535156, "global_step": 509459, "epoch": 3032} {"train_loss": -12.048866271972656, "global_step": 509460, "epoch": 3032} {"train_loss": -12.427255630493164, "global_step": 509461, "epoch": 3032} {"train_loss": -11.862191200256348, "global_step": 509462, "epoch": 3032} {"train_loss": -12.351659774780273, "global_step": 509463, "epoch": 3032} {"train_loss": -12.112972259521484, "global_step": 509464, "epoch": 3032} {"train_loss": -12.280252456665039, "global_step": 509465, "epoch": 3032} {"train_loss": -12.308456420898438, "global_step": 509466, "epoch": 3032} {"train_loss": -12.486434936523438, "global_step": 509467, "epoch": 3032} {"train_loss": -12.355548858642578, "global_step": 509468, "epoch": 3032} {"train_loss": -12.490362167358398, "global_step": 509469, "epoch": 3032} {"train_loss": -12.086536407470703, "global_step": 509470, "epoch": 3032} {"train_loss": -12.597658157348633, "global_step": 509471, "epoch": 3032} {"train_loss": -12.484289169311523, "global_step": 509472, "epoch": 3032} {"train_loss": -12.349920272827148, "global_step": 509473, "epoch": 3032} {"train_loss": -12.292208671569824, "global_step": 509474, "epoch": 3032} {"train_loss": -12.162433624267578, "global_step": 509475, "epoch": 3032} {"train_loss": -12.56248664855957, "global_step": 509476, "epoch": 3032} {"train_loss": -12.572354316711426, "global_step": 509477, "epoch": 3032} {"train_loss": -12.60114860534668, "global_step": 509478, "epoch": 3032} {"train_loss": -12.561851501464844, "global_step": 509479, "epoch": 3032} {"train_loss": -12.551996231079102, "global_step": 509480, "epoch": 3032} {"train_loss": -12.629271507263184, "global_step": 509481, "epoch": 3032} {"train_loss": -12.729293823242188, "global_step": 509482, "epoch": 3032} {"train_loss": -12.44198226928711, "global_step": 509483, "epoch": 3032} {"train_loss": -12.731918334960938, "global_step": 509484, "epoch": 3032} {"train_loss": -12.792274475097656, "global_step": 509485, "epoch": 3032} {"train_loss": -12.777250289916992, "global_step": 509486, "epoch": 3032} {"train_loss": -12.610950469970703, "global_step": 509487, "epoch": 3032} {"train_loss": -12.895967483520508, "global_step": 509488, "epoch": 3032} {"train_loss": -12.81852912902832, "global_step": 509489, "epoch": 3032} {"train_loss": -12.692917823791504, "global_step": 509490, "epoch": 3032} {"train_loss": -12.766397476196289, "global_step": 509491, "epoch": 3032} {"train_loss": -12.828399658203125, "global_step": 509492, "epoch": 3032} {"train_loss": -12.846617698669434, "global_step": 509493, "epoch": 3032} {"train_loss": -12.835921287536621, "global_step": 509494, "epoch": 3032} {"train_loss": -12.541492462158203, "global_step": 509495, "epoch": 3032} {"train_loss": -12.832796096801758, "global_step": 509496, "epoch": 3032} {"train_loss": -12.842571258544922, "global_step": 509497, "epoch": 3032} {"train_loss": -12.849027633666992, "global_step": 509498, "epoch": 3032} {"train_loss": -13.008353233337402, "global_step": 509499, "epoch": 3032} {"train_loss": -12.862138748168945, "global_step": 509500, "epoch": 3032} {"train_loss": -12.938129425048828, "global_step": 509501, "epoch": 3032} {"train_loss": -13.061747550964355, "global_step": 509502, "epoch": 3032} {"train_loss": -13.026443481445312, "global_step": 509503, "epoch": 3032} {"train_loss": -12.789060592651367, "global_step": 509504, "epoch": 3032} {"train_loss": -12.865732192993164, "global_step": 509505, "epoch": 3032} {"train_loss": -12.915975570678711, "global_step": 509506, "epoch": 3032} {"train_loss": -12.997098922729492, "global_step": 509507, "epoch": 3032} {"train_loss": -12.898954391479492, "global_step": 509508, "epoch": 3032} {"train_loss": -12.839075088500977, "global_step": 509509, "epoch": 3032} {"train_loss": -12.874099731445312, "global_step": 509510, "epoch": 3032} {"train_loss": -12.672473907470703, "global_step": 509511, "epoch": 3032} {"train_loss": -12.79948616027832, "global_step": 509512, "epoch": 3032} {"train_loss": -12.723701477050781, "global_step": 509513, "epoch": 3032} {"train_loss": -12.703592300415039, "global_step": 509514, "epoch": 3032} {"train_loss": -12.816975593566895, "global_step": 509515, "epoch": 3032} {"train_loss": -12.769845962524414, "global_step": 509516, "epoch": 3032} {"train_loss": -12.891185760498047, "global_step": 509517, "epoch": 3032} {"train_loss": -12.913015365600586, "global_step": 509518, "epoch": 3032} {"train_loss": -12.755738258361816, "global_step": 509519, "epoch": 3032} {"train_loss": -12.576355934143066, "global_step": 509520, "epoch": 3032} {"train_loss": -12.764467239379883, "global_step": 509521, "epoch": 3032} {"train_loss": -12.986457824707031, "global_step": 509522, "epoch": 3032} {"train_loss": -12.728660583496094, "global_step": 509523, "epoch": 3032} {"train_loss": -12.94661808013916, "global_step": 509524, "epoch": 3032} {"train_loss": -12.582298278808594, "global_step": 509525, "epoch": 3032} {"train_loss": -12.568856239318848, "global_step": 509526, "epoch": 3032} {"train_loss": -12.851131439208984, "global_step": 509527, "epoch": 3032} {"train_loss": -12.540841102600098, "global_step": 509528, "epoch": 3032} {"train_loss": -12.993049621582031, "global_step": 509529, "epoch": 3032} {"train_loss": -12.10826301574707, "global_step": 509530, "epoch": 3032} {"train_loss": -11.94625186920166, "global_step": 509531, "epoch": 3032} {"train_loss": -12.504890441894531, "global_step": 509532, "epoch": 3032} {"train_loss": -12.575895309448242, "global_step": 509533, "epoch": 3032} {"train_loss": -11.486257553100586, "global_step": 509534, "epoch": 3032} {"train_loss": -12.898670196533203, "global_step": 509535, "epoch": 3032} {"train_loss": -11.592737197875977, "global_step": 509536, "epoch": 3032} {"train_loss": -12.98173713684082, "global_step": 509537, "epoch": 3032} {"train_loss": -11.985066413879395, "global_step": 509538, "epoch": 3032} {"train_loss": -11.986984252929688, "global_step": 509539, "epoch": 3032} {"train_loss": -12.772476196289062, "global_step": 509540, "epoch": 3032} {"train_loss": -11.180593490600586, "global_step": 509541, "epoch": 3032} {"train_loss": -12.375190734863281, "global_step": 509542, "epoch": 3032} {"train_loss": -12.1152936901365, "global_step": 509543, "epoch": 3032, "val_loss": 319290.0} {"train_loss": -12.427166938781738, "global_step": 509544, "epoch": 3033} {"train_loss": -11.715679168701172, "global_step": 509545, "epoch": 3033} {"train_loss": -12.721067428588867, "global_step": 509546, "epoch": 3033} {"train_loss": -12.122949600219727, "global_step": 509547, "epoch": 3033} {"train_loss": -12.491277694702148, "global_step": 509548, "epoch": 3033} {"train_loss": -12.405963897705078, "global_step": 509549, "epoch": 3033} {"train_loss": -11.763399124145508, "global_step": 509550, "epoch": 3033} {"train_loss": -12.716594696044922, "global_step": 509551, "epoch": 3033} {"train_loss": -11.725835800170898, "global_step": 509552, "epoch": 3033} {"train_loss": -12.738698959350586, "global_step": 509553, "epoch": 3033} {"train_loss": -12.048772811889648, "global_step": 509554, "epoch": 3033} {"train_loss": -12.2901611328125, "global_step": 509555, "epoch": 3033} {"train_loss": -12.50422477722168, "global_step": 509556, "epoch": 3033} {"train_loss": -12.388175010681152, "global_step": 509557, "epoch": 3033} {"train_loss": -12.648480415344238, "global_step": 509558, "epoch": 3033} {"train_loss": -11.677732467651367, "global_step": 509559, "epoch": 3033} {"train_loss": -12.143659591674805, "global_step": 509560, "epoch": 3033} {"train_loss": -12.675008773803711, "global_step": 509561, "epoch": 3033} {"train_loss": -11.889443397521973, "global_step": 509562, "epoch": 3033} {"train_loss": -12.602506637573242, "global_step": 509563, "epoch": 3033} {"train_loss": -12.28469467163086, "global_step": 509564, "epoch": 3033} {"train_loss": -11.67481803894043, "global_step": 509565, "epoch": 3033} {"train_loss": -12.611900329589844, "global_step": 509566, "epoch": 3033} {"train_loss": -11.588404655456543, "global_step": 509567, "epoch": 3033} {"train_loss": -12.625808715820312, "global_step": 509568, "epoch": 3033} {"train_loss": -11.445493698120117, "global_step": 509569, "epoch": 3033} {"train_loss": -12.948244094848633, "global_step": 509570, "epoch": 3033} {"train_loss": -11.812969207763672, "global_step": 509571, "epoch": 3033} {"train_loss": -12.668401718139648, "global_step": 509572, "epoch": 3033} {"train_loss": -12.178606986999512, "global_step": 509573, "epoch": 3033} {"train_loss": -11.632728576660156, "global_step": 509574, "epoch": 3033} {"train_loss": -12.507601737976074, "global_step": 509575, "epoch": 3033} {"train_loss": -10.942237854003906, "global_step": 509576, "epoch": 3033} {"train_loss": -12.740196228027344, "global_step": 509577, "epoch": 3033} {"train_loss": -11.813014030456543, "global_step": 509578, "epoch": 3033} {"train_loss": -11.693443298339844, "global_step": 509579, "epoch": 3033} {"train_loss": -12.135333061218262, "global_step": 509580, "epoch": 3033} {"train_loss": -9.782186508178711, "global_step": 509581, "epoch": 3033} {"train_loss": -12.178997039794922, "global_step": 509582, "epoch": 3033} {"train_loss": -11.408256530761719, "global_step": 509583, "epoch": 3033} {"train_loss": -10.819480895996094, "global_step": 509584, "epoch": 3033} {"train_loss": -12.145767211914062, "global_step": 509585, "epoch": 3033} {"train_loss": -11.5606689453125, "global_step": 509586, "epoch": 3033} {"train_loss": -12.196305274963379, "global_step": 509587, "epoch": 3033} {"train_loss": -10.966338157653809, "global_step": 509588, "epoch": 3033} {"train_loss": -12.209538459777832, "global_step": 509589, "epoch": 3033} {"train_loss": -12.349600791931152, "global_step": 509590, "epoch": 3033} {"train_loss": -11.831121444702148, "global_step": 509591, "epoch": 3033} {"train_loss": -12.559469223022461, "global_step": 509592, "epoch": 3033} {"train_loss": -12.048224449157715, "global_step": 509593, "epoch": 3033} {"train_loss": -12.574691772460938, "global_step": 509594, "epoch": 3033} {"train_loss": -12.571041107177734, "global_step": 509595, "epoch": 3033} {"train_loss": -12.050834655761719, "global_step": 509596, "epoch": 3033} {"train_loss": -12.746191024780273, "global_step": 509597, "epoch": 3033} {"train_loss": -12.209723472595215, "global_step": 509598, "epoch": 3033} {"train_loss": -12.391687393188477, "global_step": 509599, "epoch": 3033} {"train_loss": -12.661120414733887, "global_step": 509600, "epoch": 3033} {"train_loss": -11.966166496276855, "global_step": 509601, "epoch": 3033} {"train_loss": -12.568331718444824, "global_step": 509602, "epoch": 3033} {"train_loss": -12.216428756713867, "global_step": 509603, "epoch": 3033} {"train_loss": -12.113473892211914, "global_step": 509604, "epoch": 3033} {"train_loss": -12.766677856445312, "global_step": 509605, "epoch": 3033} {"train_loss": -12.458699226379395, "global_step": 509606, "epoch": 3033} {"train_loss": -12.591720581054688, "global_step": 509607, "epoch": 3033} {"train_loss": -12.450187683105469, "global_step": 509608, "epoch": 3033} {"train_loss": -12.342398643493652, "global_step": 509609, "epoch": 3033} {"train_loss": -12.025566101074219, "global_step": 509610, "epoch": 3033} {"train_loss": -12.520162582397461, "global_step": 509611, "epoch": 3033} {"train_loss": -12.67096996307373, "global_step": 509612, "epoch": 3033} {"train_loss": -11.787565231323242, "global_step": 509613, "epoch": 3033} {"train_loss": -12.563356399536133, "global_step": 509614, "epoch": 3033} {"train_loss": -12.537599563598633, "global_step": 509615, "epoch": 3033} {"train_loss": -12.199786186218262, "global_step": 509616, "epoch": 3033} {"train_loss": -12.795785903930664, "global_step": 509617, "epoch": 3033} {"train_loss": -12.664216995239258, "global_step": 509618, "epoch": 3033} {"train_loss": -12.922867774963379, "global_step": 509619, "epoch": 3033} {"train_loss": -12.437602996826172, "global_step": 509620, "epoch": 3033} {"train_loss": -12.682835578918457, "global_step": 509621, "epoch": 3033} {"train_loss": -12.699712753295898, "global_step": 509622, "epoch": 3033} {"train_loss": -12.747136116027832, "global_step": 509623, "epoch": 3033} {"train_loss": -12.743602752685547, "global_step": 509624, "epoch": 3033} {"train_loss": -12.329397201538086, "global_step": 509625, "epoch": 3033} {"train_loss": -12.918054580688477, "global_step": 509626, "epoch": 3033} {"train_loss": -12.7469482421875, "global_step": 509627, "epoch": 3033} {"train_loss": -12.763116836547852, "global_step": 509628, "epoch": 3033} {"train_loss": -12.80117416381836, "global_step": 509629, "epoch": 3033} {"train_loss": -12.660937309265137, "global_step": 509630, "epoch": 3033} {"train_loss": -12.667346954345703, "global_step": 509631, "epoch": 3033} {"train_loss": -12.78742790222168, "global_step": 509632, "epoch": 3033} {"train_loss": -12.587148666381836, "global_step": 509633, "epoch": 3033} {"train_loss": -12.689857482910156, "global_step": 509634, "epoch": 3033} {"train_loss": -12.726905822753906, "global_step": 509635, "epoch": 3033} {"train_loss": -12.896224975585938, "global_step": 509636, "epoch": 3033} {"train_loss": -12.736550331115723, "global_step": 509637, "epoch": 3033} {"train_loss": -12.512117385864258, "global_step": 509638, "epoch": 3033} {"train_loss": -12.734357833862305, "global_step": 509639, "epoch": 3033} {"train_loss": -12.469284057617188, "global_step": 509640, "epoch": 3033} {"train_loss": -12.606040954589844, "global_step": 509641, "epoch": 3033} {"train_loss": -12.891265869140625, "global_step": 509642, "epoch": 3033} {"train_loss": -12.759561538696289, "global_step": 509643, "epoch": 3033} {"train_loss": -12.731328964233398, "global_step": 509644, "epoch": 3033} {"train_loss": -13.152982711791992, "global_step": 509645, "epoch": 3033} {"train_loss": -12.817628860473633, "global_step": 509646, "epoch": 3033} {"train_loss": -12.912345886230469, "global_step": 509647, "epoch": 3033} {"train_loss": -12.628652572631836, "global_step": 509648, "epoch": 3033} {"train_loss": -12.409379959106445, "global_step": 509649, "epoch": 3033} {"train_loss": -12.659891128540039, "global_step": 509650, "epoch": 3033} {"train_loss": -12.844316482543945, "global_step": 509651, "epoch": 3033} {"train_loss": -12.770204544067383, "global_step": 509652, "epoch": 3033} {"train_loss": -12.489609718322754, "global_step": 509653, "epoch": 3033} {"train_loss": -12.662851333618164, "global_step": 509654, "epoch": 3033} {"train_loss": -12.578461647033691, "global_step": 509655, "epoch": 3033} {"train_loss": -12.874051094055176, "global_step": 509656, "epoch": 3033} {"train_loss": -12.598587036132812, "global_step": 509657, "epoch": 3033} {"train_loss": -12.710471153259277, "global_step": 509658, "epoch": 3033} {"train_loss": -12.617817878723145, "global_step": 509659, "epoch": 3033} {"train_loss": -12.755033493041992, "global_step": 509660, "epoch": 3033} {"train_loss": -12.615518569946289, "global_step": 509661, "epoch": 3033} {"train_loss": -12.751998901367188, "global_step": 509662, "epoch": 3033} {"train_loss": -12.70668888092041, "global_step": 509663, "epoch": 3033} {"train_loss": -12.37496566772461, "global_step": 509664, "epoch": 3033} {"train_loss": -12.907066345214844, "global_step": 509665, "epoch": 3033} {"train_loss": -12.416268348693848, "global_step": 509666, "epoch": 3033} {"train_loss": -11.30825424194336, "global_step": 509667, "epoch": 3033} {"train_loss": -12.107555389404297, "global_step": 509668, "epoch": 3033} {"train_loss": -12.317280769348145, "global_step": 509669, "epoch": 3033} {"train_loss": -10.098333358764648, "global_step": 509670, "epoch": 3033} {"train_loss": -10.304632186889648, "global_step": 509671, "epoch": 3033} {"train_loss": -9.705069541931152, "global_step": 509672, "epoch": 3033} {"train_loss": -11.894315719604492, "global_step": 509673, "epoch": 3033} {"train_loss": -7.855804443359375, "global_step": 509674, "epoch": 3033} {"train_loss": -9.478477478027344, "global_step": 509675, "epoch": 3033} {"train_loss": -9.796764373779297, "global_step": 509676, "epoch": 3033} {"train_loss": -10.502496719360352, "global_step": 509677, "epoch": 3033} {"train_loss": -9.452847480773926, "global_step": 509678, "epoch": 3033} {"train_loss": -9.318923950195312, "global_step": 509679, "epoch": 3033} {"train_loss": -9.398099899291992, "global_step": 509680, "epoch": 3033} {"train_loss": -10.35776138305664, "global_step": 509681, "epoch": 3033} {"train_loss": -9.568456649780273, "global_step": 509682, "epoch": 3033} {"train_loss": -9.495405197143555, "global_step": 509683, "epoch": 3033} {"train_loss": -10.490313529968262, "global_step": 509684, "epoch": 3033} {"train_loss": -10.890951156616211, "global_step": 509685, "epoch": 3033} {"train_loss": -11.335592269897461, "global_step": 509686, "epoch": 3033} {"train_loss": -11.486261367797852, "global_step": 509687, "epoch": 3033} {"train_loss": -11.889385223388672, "global_step": 509688, "epoch": 3033} {"train_loss": -11.633426666259766, "global_step": 509689, "epoch": 3033} {"train_loss": -11.729637145996094, "global_step": 509690, "epoch": 3033} {"train_loss": -11.391746520996094, "global_step": 509691, "epoch": 3033} {"train_loss": -12.152900695800781, "global_step": 509692, "epoch": 3033} {"train_loss": -11.549898147583008, "global_step": 509693, "epoch": 3033} {"train_loss": -11.216377258300781, "global_step": 509694, "epoch": 3033} {"train_loss": -12.071084976196289, "global_step": 509695, "epoch": 3033} {"train_loss": -11.67283821105957, "global_step": 509696, "epoch": 3033} {"train_loss": -12.073873519897461, "global_step": 509697, "epoch": 3033} {"train_loss": -11.696768760681152, "global_step": 509698, "epoch": 3033} {"train_loss": -12.047508239746094, "global_step": 509699, "epoch": 3033} {"train_loss": -12.214506149291992, "global_step": 509700, "epoch": 3033} {"train_loss": -11.902392387390137, "global_step": 509701, "epoch": 3033} {"train_loss": -11.635961532592773, "global_step": 509702, "epoch": 3033} {"train_loss": -12.174924850463867, "global_step": 509703, "epoch": 3033} {"train_loss": -11.599414825439453, "global_step": 509704, "epoch": 3033} {"train_loss": -12.453140258789062, "global_step": 509705, "epoch": 3033} {"train_loss": -12.070060729980469, "global_step": 509706, "epoch": 3033} {"train_loss": -12.038043975830078, "global_step": 509707, "epoch": 3033} {"train_loss": -12.33685302734375, "global_step": 509708, "epoch": 3033} {"train_loss": -12.228506088256836, "global_step": 509709, "epoch": 3033} {"train_loss": -12.626830101013184, "global_step": 509710, "epoch": 3033} {"train_loss": -12.06607705070859, "global_step": 509711, "epoch": 3033, "val_loss": 315697.90625} {"train_loss": -12.049365997314453, "global_step": 509712, "epoch": 3034} {"train_loss": -12.481592178344727, "global_step": 509713, "epoch": 3034} {"train_loss": -12.052379608154297, "global_step": 509714, "epoch": 3034} {"train_loss": -12.342630386352539, "global_step": 509715, "epoch": 3034} {"train_loss": -12.202347755432129, "global_step": 509716, "epoch": 3034} {"train_loss": -12.332691192626953, "global_step": 509717, "epoch": 3034} {"train_loss": -12.032557487487793, "global_step": 509718, "epoch": 3034} {"train_loss": -12.611713409423828, "global_step": 509719, "epoch": 3034} {"train_loss": -11.732177734375, "global_step": 509720, "epoch": 3034} {"train_loss": -12.277934074401855, "global_step": 509721, "epoch": 3034} {"train_loss": -12.490179061889648, "global_step": 509722, "epoch": 3034} {"train_loss": -11.606492042541504, "global_step": 509723, "epoch": 3034} {"train_loss": -11.974015235900879, "global_step": 509724, "epoch": 3034} {"train_loss": -11.324240684509277, "global_step": 509725, "epoch": 3034} {"train_loss": -12.167842864990234, "global_step": 509726, "epoch": 3034} {"train_loss": -11.41297721862793, "global_step": 509727, "epoch": 3034} {"train_loss": -11.821125030517578, "global_step": 509728, "epoch": 3034} {"train_loss": -11.94449234008789, "global_step": 509729, "epoch": 3034} {"train_loss": -11.98129653930664, "global_step": 509730, "epoch": 3034} {"train_loss": -11.606637954711914, "global_step": 509731, "epoch": 3034} {"train_loss": -11.847677230834961, "global_step": 509732, "epoch": 3034} {"train_loss": -11.933883666992188, "global_step": 509733, "epoch": 3034} {"train_loss": -11.81983757019043, "global_step": 509734, "epoch": 3034} {"train_loss": -12.199506759643555, "global_step": 509735, "epoch": 3034} {"train_loss": -11.741316795349121, "global_step": 509736, "epoch": 3034} {"train_loss": -12.286127090454102, "global_step": 509737, "epoch": 3034} {"train_loss": -11.712568283081055, "global_step": 509738, "epoch": 3034} {"train_loss": -12.116327285766602, "global_step": 509739, "epoch": 3034} {"train_loss": -12.232343673706055, "global_step": 509740, "epoch": 3034} {"train_loss": -11.751523971557617, "global_step": 509741, "epoch": 3034} {"train_loss": -12.333789825439453, "global_step": 509742, "epoch": 3034} {"train_loss": -12.245095252990723, "global_step": 509743, "epoch": 3034} {"train_loss": -11.952281951904297, "global_step": 509744, "epoch": 3034} {"train_loss": -12.602477073669434, "global_step": 509745, "epoch": 3034} {"train_loss": -11.577052116394043, "global_step": 509746, "epoch": 3034} {"train_loss": -12.582000732421875, "global_step": 509747, "epoch": 3034} {"train_loss": -12.153752326965332, "global_step": 509748, "epoch": 3034} {"train_loss": -12.584006309509277, "global_step": 509749, "epoch": 3034} {"train_loss": -12.428024291992188, "global_step": 509750, "epoch": 3034} {"train_loss": -12.714632987976074, "global_step": 509751, "epoch": 3034} {"train_loss": -12.609993934631348, "global_step": 509752, "epoch": 3034} {"train_loss": -12.854696273803711, "global_step": 509753, "epoch": 3034} {"train_loss": -12.573570251464844, "global_step": 509754, "epoch": 3034} {"train_loss": -12.503938674926758, "global_step": 509755, "epoch": 3034} {"train_loss": -12.921789169311523, "global_step": 509756, "epoch": 3034} {"train_loss": -12.441510200500488, "global_step": 509757, "epoch": 3034} {"train_loss": -12.730853080749512, "global_step": 509758, "epoch": 3034} {"train_loss": -12.317156791687012, "global_step": 509759, "epoch": 3034} {"train_loss": -12.925897598266602, "global_step": 509760, "epoch": 3034} {"train_loss": -12.671948432922363, "global_step": 509761, "epoch": 3034} {"train_loss": -12.893633842468262, "global_step": 509762, "epoch": 3034} {"train_loss": -12.614631652832031, "global_step": 509763, "epoch": 3034} {"train_loss": -12.796879768371582, "global_step": 509764, "epoch": 3034} {"train_loss": -12.67249870300293, "global_step": 509765, "epoch": 3034} {"train_loss": -12.804929733276367, "global_step": 509766, "epoch": 3034} {"train_loss": -12.919269561767578, "global_step": 509767, "epoch": 3034} {"train_loss": -12.724235534667969, "global_step": 509768, "epoch": 3034} {"train_loss": -12.871792793273926, "global_step": 509769, "epoch": 3034} {"train_loss": -12.548142433166504, "global_step": 509770, "epoch": 3034} {"train_loss": -12.890287399291992, "global_step": 509771, "epoch": 3034} {"train_loss": -12.507013320922852, "global_step": 509772, "epoch": 3034} {"train_loss": -12.784111022949219, "global_step": 509773, "epoch": 3034} {"train_loss": -12.466571807861328, "global_step": 509774, "epoch": 3034} {"train_loss": -12.776592254638672, "global_step": 509775, "epoch": 3034} {"train_loss": -12.609615325927734, "global_step": 509776, "epoch": 3034} {"train_loss": -12.795458793640137, "global_step": 509777, "epoch": 3034} {"train_loss": -12.772789001464844, "global_step": 509778, "epoch": 3034} {"train_loss": -12.829771041870117, "global_step": 509779, "epoch": 3034} {"train_loss": -12.528935432434082, "global_step": 509780, "epoch": 3034} {"train_loss": -12.570277214050293, "global_step": 509781, "epoch": 3034} {"train_loss": -12.609804153442383, "global_step": 509782, "epoch": 3034} {"train_loss": -12.526002883911133, "global_step": 509783, "epoch": 3034} {"train_loss": -12.749163627624512, "global_step": 509784, "epoch": 3034} {"train_loss": -12.389217376708984, "global_step": 509785, "epoch": 3034} {"train_loss": -12.455438613891602, "global_step": 509786, "epoch": 3034} {"train_loss": -12.347406387329102, "global_step": 509787, "epoch": 3034} {"train_loss": -12.011631965637207, "global_step": 509788, "epoch": 3034} {"train_loss": -12.525644302368164, "global_step": 509789, "epoch": 3034} {"train_loss": -12.182968139648438, "global_step": 509790, "epoch": 3034} {"train_loss": -12.583808898925781, "global_step": 509791, "epoch": 3034} {"train_loss": -11.657299041748047, "global_step": 509792, "epoch": 3034} {"train_loss": -12.517096519470215, "global_step": 509793, "epoch": 3034} {"train_loss": -12.582220077514648, "global_step": 509794, "epoch": 3034} {"train_loss": -12.673337936401367, "global_step": 509795, "epoch": 3034} {"train_loss": -12.709611892700195, "global_step": 509796, "epoch": 3034} {"train_loss": -12.821111679077148, "global_step": 509797, "epoch": 3034} {"train_loss": -12.55309009552002, "global_step": 509798, "epoch": 3034} {"train_loss": -12.758386611938477, "global_step": 509799, "epoch": 3034} {"train_loss": -12.493606567382812, "global_step": 509800, "epoch": 3034} {"train_loss": -12.712648391723633, "global_step": 509801, "epoch": 3034} {"train_loss": -12.716516494750977, "global_step": 509802, "epoch": 3034} {"train_loss": -12.648355484008789, "global_step": 509803, "epoch": 3034} {"train_loss": -12.500617980957031, "global_step": 509804, "epoch": 3034} {"train_loss": -12.213471412658691, "global_step": 509805, "epoch": 3034} {"train_loss": -12.915079116821289, "global_step": 509806, "epoch": 3034} {"train_loss": -12.809761047363281, "global_step": 509807, "epoch": 3034} {"train_loss": -12.643442153930664, "global_step": 509808, "epoch": 3034} {"train_loss": -11.919900894165039, "global_step": 509809, "epoch": 3034} {"train_loss": -12.476085662841797, "global_step": 509810, "epoch": 3034} {"train_loss": -12.732301712036133, "global_step": 509811, "epoch": 3034} {"train_loss": -12.424641609191895, "global_step": 509812, "epoch": 3034} {"train_loss": -11.997804641723633, "global_step": 509813, "epoch": 3034} {"train_loss": -11.985350608825684, "global_step": 509814, "epoch": 3034} {"train_loss": -12.66679573059082, "global_step": 509815, "epoch": 3034} {"train_loss": -12.488807678222656, "global_step": 509816, "epoch": 3034} {"train_loss": -12.21484088897705, "global_step": 509817, "epoch": 3034} {"train_loss": -12.255195617675781, "global_step": 509818, "epoch": 3034} {"train_loss": -11.44464111328125, "global_step": 509819, "epoch": 3034} {"train_loss": -12.385763168334961, "global_step": 509820, "epoch": 3034} {"train_loss": -12.336721420288086, "global_step": 509821, "epoch": 3034} {"train_loss": -11.959809303283691, "global_step": 509822, "epoch": 3034} {"train_loss": -12.012287139892578, "global_step": 509823, "epoch": 3034} {"train_loss": -12.009625434875488, "global_step": 509824, "epoch": 3034} {"train_loss": -11.99984073638916, "global_step": 509825, "epoch": 3034} {"train_loss": -11.869285583496094, "global_step": 509826, "epoch": 3034} {"train_loss": -12.424504280090332, "global_step": 509827, "epoch": 3034} {"train_loss": -12.029853820800781, "global_step": 509828, "epoch": 3034} {"train_loss": -11.902220726013184, "global_step": 509829, "epoch": 3034} {"train_loss": -11.774605751037598, "global_step": 509830, "epoch": 3034} {"train_loss": -12.393489837646484, "global_step": 509831, "epoch": 3034} {"train_loss": -11.628466606140137, "global_step": 509832, "epoch": 3034} {"train_loss": -12.374359130859375, "global_step": 509833, "epoch": 3034} {"train_loss": -12.008742332458496, "global_step": 509834, "epoch": 3034} {"train_loss": -11.815624237060547, "global_step": 509835, "epoch": 3034} {"train_loss": -12.290252685546875, "global_step": 509836, "epoch": 3034} {"train_loss": -11.458438873291016, "global_step": 509837, "epoch": 3034} {"train_loss": -12.535128593444824, "global_step": 509838, "epoch": 3034} {"train_loss": -11.665310859680176, "global_step": 509839, "epoch": 3034} {"train_loss": -11.52016830444336, "global_step": 509840, "epoch": 3034} {"train_loss": -10.166008949279785, "global_step": 509841, "epoch": 3034} {"train_loss": -11.090203285217285, "global_step": 509842, "epoch": 3034} {"train_loss": -11.31878662109375, "global_step": 509843, "epoch": 3034} {"train_loss": -10.923916816711426, "global_step": 509844, "epoch": 3034} {"train_loss": -10.016305923461914, "global_step": 509845, "epoch": 3034} {"train_loss": -11.354972839355469, "global_step": 509846, "epoch": 3034} {"train_loss": -11.522693634033203, "global_step": 509847, "epoch": 3034} {"train_loss": -11.150947570800781, "global_step": 509848, "epoch": 3034} {"train_loss": -11.059977531433105, "global_step": 509849, "epoch": 3034} {"train_loss": -11.714615821838379, "global_step": 509850, "epoch": 3034} {"train_loss": -11.878372192382812, "global_step": 509851, "epoch": 3034} {"train_loss": -12.730459213256836, "global_step": 509852, "epoch": 3034} {"train_loss": -11.939998626708984, "global_step": 509853, "epoch": 3034} {"train_loss": -12.295600891113281, "global_step": 509854, "epoch": 3034} {"train_loss": -11.843220710754395, "global_step": 509855, "epoch": 3034} {"train_loss": -12.507197380065918, "global_step": 509856, "epoch": 3034} {"train_loss": -12.018739700317383, "global_step": 509857, "epoch": 3034} {"train_loss": -12.428886413574219, "global_step": 509858, "epoch": 3034} {"train_loss": -12.428447723388672, "global_step": 509859, "epoch": 3034} {"train_loss": -12.15340805053711, "global_step": 509860, "epoch": 3034} {"train_loss": -12.667398452758789, "global_step": 509861, "epoch": 3034} {"train_loss": -11.900949478149414, "global_step": 509862, "epoch": 3034} {"train_loss": -11.955822944641113, "global_step": 509863, "epoch": 3034} {"train_loss": -12.348657608032227, "global_step": 509864, "epoch": 3034} {"train_loss": -11.425080299377441, "global_step": 509865, "epoch": 3034} {"train_loss": -12.452774047851562, "global_step": 509866, "epoch": 3034} {"train_loss": -11.366613388061523, "global_step": 509867, "epoch": 3034} {"train_loss": -12.199319839477539, "global_step": 509868, "epoch": 3034} {"train_loss": -12.131486892700195, "global_step": 509869, "epoch": 3034} {"train_loss": -12.270360946655273, "global_step": 509870, "epoch": 3034} {"train_loss": -12.273609161376953, "global_step": 509871, "epoch": 3034} {"train_loss": -12.268777847290039, "global_step": 509872, "epoch": 3034} {"train_loss": -12.34846019744873, "global_step": 509873, "epoch": 3034} {"train_loss": -12.513712882995605, "global_step": 509874, "epoch": 3034} {"train_loss": -12.331544876098633, "global_step": 509875, "epoch": 3034} {"train_loss": -12.523876190185547, "global_step": 509876, "epoch": 3034} {"train_loss": -12.329904556274414, "global_step": 509877, "epoch": 3034} {"train_loss": -12.557863235473633, "global_step": 509878, "epoch": 3034} {"train_loss": -12.229803800582886, "global_step": 509879, "epoch": 3034, "val_loss": 320365.0} {"train_loss": -11.996872901916504, "global_step": 509880, "epoch": 3035} {"train_loss": -12.702858924865723, "global_step": 509881, "epoch": 3035} {"train_loss": -12.05111312866211, "global_step": 509882, "epoch": 3035} {"train_loss": -12.3463773727417, "global_step": 509883, "epoch": 3035} {"train_loss": -12.452903747558594, "global_step": 509884, "epoch": 3035} {"train_loss": -11.877317428588867, "global_step": 509885, "epoch": 3035} {"train_loss": -12.636112213134766, "global_step": 509886, "epoch": 3035} {"train_loss": -12.505603790283203, "global_step": 509887, "epoch": 3035} {"train_loss": -12.629903793334961, "global_step": 509888, "epoch": 3035} {"train_loss": -11.835067749023438, "global_step": 509889, "epoch": 3035} {"train_loss": -12.543744087219238, "global_step": 509890, "epoch": 3035} {"train_loss": -12.456125259399414, "global_step": 509891, "epoch": 3035} {"train_loss": -12.438005447387695, "global_step": 509892, "epoch": 3035} {"train_loss": -12.630048751831055, "global_step": 509893, "epoch": 3035} {"train_loss": -12.494190216064453, "global_step": 509894, "epoch": 3035} {"train_loss": -12.62515926361084, "global_step": 509895, "epoch": 3035} {"train_loss": -12.297277450561523, "global_step": 509896, "epoch": 3035} {"train_loss": -12.371313095092773, "global_step": 509897, "epoch": 3035} {"train_loss": -12.799110412597656, "global_step": 509898, "epoch": 3035} {"train_loss": -12.276093482971191, "global_step": 509899, "epoch": 3035} {"train_loss": -12.997014999389648, "global_step": 509900, "epoch": 3035} {"train_loss": -12.557000160217285, "global_step": 509901, "epoch": 3035} {"train_loss": -12.702110290527344, "global_step": 509902, "epoch": 3035} {"train_loss": -12.503021240234375, "global_step": 509903, "epoch": 3035} {"train_loss": -12.706648826599121, "global_step": 509904, "epoch": 3035} {"train_loss": -12.677184104919434, "global_step": 509905, "epoch": 3035} {"train_loss": -12.447917938232422, "global_step": 509906, "epoch": 3035} {"train_loss": -12.703866004943848, "global_step": 509907, "epoch": 3035} {"train_loss": -12.93551254272461, "global_step": 509908, "epoch": 3035} {"train_loss": -12.410188674926758, "global_step": 509909, "epoch": 3035} {"train_loss": -12.861183166503906, "global_step": 509910, "epoch": 3035} {"train_loss": -12.73765754699707, "global_step": 509911, "epoch": 3035} {"train_loss": -12.797297477722168, "global_step": 509912, "epoch": 3035} {"train_loss": -12.939985275268555, "global_step": 509913, "epoch": 3035} {"train_loss": -12.791679382324219, "global_step": 509914, "epoch": 3035} {"train_loss": -12.814496040344238, "global_step": 509915, "epoch": 3035} {"train_loss": -12.776886940002441, "global_step": 509916, "epoch": 3035} {"train_loss": -12.630582809448242, "global_step": 509917, "epoch": 3035} {"train_loss": -12.839801788330078, "global_step": 509918, "epoch": 3035} {"train_loss": -12.715372085571289, "global_step": 509919, "epoch": 3035} {"train_loss": -12.977069854736328, "global_step": 509920, "epoch": 3035} {"train_loss": -13.117171287536621, "global_step": 509921, "epoch": 3035} {"train_loss": -12.978307723999023, "global_step": 509922, "epoch": 3035} {"train_loss": -12.620855331420898, "global_step": 509923, "epoch": 3035} {"train_loss": -13.167778015136719, "global_step": 509924, "epoch": 3035} {"train_loss": -12.817666053771973, "global_step": 509925, "epoch": 3035} {"train_loss": -12.896089553833008, "global_step": 509926, "epoch": 3035} {"train_loss": -12.806958198547363, "global_step": 509927, "epoch": 3035} {"train_loss": -12.902994155883789, "global_step": 509928, "epoch": 3035} {"train_loss": -12.566415786743164, "global_step": 509929, "epoch": 3035} {"train_loss": -12.840782165527344, "global_step": 509930, "epoch": 3035} {"train_loss": -12.741945266723633, "global_step": 509931, "epoch": 3035} {"train_loss": -12.943094253540039, "global_step": 509932, "epoch": 3035} {"train_loss": -12.787723541259766, "global_step": 509933, "epoch": 3035} {"train_loss": -12.783178329467773, "global_step": 509934, "epoch": 3035} {"train_loss": -12.633480072021484, "global_step": 509935, "epoch": 3035} {"train_loss": -12.785558700561523, "global_step": 509936, "epoch": 3035} {"train_loss": -12.81048583984375, "global_step": 509937, "epoch": 3035} {"train_loss": -13.004524230957031, "global_step": 509938, "epoch": 3035} {"train_loss": -12.887561798095703, "global_step": 509939, "epoch": 3035} {"train_loss": -12.996442794799805, "global_step": 509940, "epoch": 3035} {"train_loss": -12.32272720336914, "global_step": 509941, "epoch": 3035} {"train_loss": -12.92402458190918, "global_step": 509942, "epoch": 3035} {"train_loss": -12.821351051330566, "global_step": 509943, "epoch": 3035} {"train_loss": -12.863265991210938, "global_step": 509944, "epoch": 3035} {"train_loss": -12.641951560974121, "global_step": 509945, "epoch": 3035} {"train_loss": -12.705718994140625, "global_step": 509946, "epoch": 3035} {"train_loss": -13.008423805236816, "global_step": 509947, "epoch": 3035} {"train_loss": -12.847955703735352, "global_step": 509948, "epoch": 3035} {"train_loss": -12.72825813293457, "global_step": 509949, "epoch": 3035} {"train_loss": -12.492077827453613, "global_step": 509950, "epoch": 3035} {"train_loss": -13.104207038879395, "global_step": 509951, "epoch": 3035} {"train_loss": -12.568414688110352, "global_step": 509952, "epoch": 3035} {"train_loss": -12.304216384887695, "global_step": 509953, "epoch": 3035} {"train_loss": -12.75762939453125, "global_step": 509954, "epoch": 3035} {"train_loss": -12.26858139038086, "global_step": 509955, "epoch": 3035} {"train_loss": -11.132872581481934, "global_step": 509956, "epoch": 3035} {"train_loss": -12.612910270690918, "global_step": 509957, "epoch": 3035} {"train_loss": -11.569334030151367, "global_step": 509958, "epoch": 3035} {"train_loss": -12.542579650878906, "global_step": 509959, "epoch": 3035} {"train_loss": -11.443893432617188, "global_step": 509960, "epoch": 3035} {"train_loss": -12.375968933105469, "global_step": 509961, "epoch": 3035} {"train_loss": -11.554553031921387, "global_step": 509962, "epoch": 3035} {"train_loss": -12.315375328063965, "global_step": 509963, "epoch": 3035} {"train_loss": -11.170150756835938, "global_step": 509964, "epoch": 3035} {"train_loss": -12.110162734985352, "global_step": 509965, "epoch": 3035} {"train_loss": -11.568263053894043, "global_step": 509966, "epoch": 3035} {"train_loss": -11.884557723999023, "global_step": 509967, "epoch": 3035} {"train_loss": -11.634001731872559, "global_step": 509968, "epoch": 3035} {"train_loss": -11.932014465332031, "global_step": 509969, "epoch": 3035} {"train_loss": -12.037015914916992, "global_step": 509970, "epoch": 3035} {"train_loss": -10.087187767028809, "global_step": 509971, "epoch": 3035} {"train_loss": -11.80405044555664, "global_step": 509972, "epoch": 3035} {"train_loss": -9.799753189086914, "global_step": 509973, "epoch": 3035} {"train_loss": -9.673418045043945, "global_step": 509974, "epoch": 3035} {"train_loss": -9.49969482421875, "global_step": 509975, "epoch": 3035} {"train_loss": -10.835037231445312, "global_step": 509976, "epoch": 3035} {"train_loss": -10.381658554077148, "global_step": 509977, "epoch": 3035} {"train_loss": -9.914215087890625, "global_step": 509978, "epoch": 3035} {"train_loss": -9.858278274536133, "global_step": 509979, "epoch": 3035} {"train_loss": -9.395980834960938, "global_step": 509980, "epoch": 3035} {"train_loss": -10.882579803466797, "global_step": 509981, "epoch": 3035} {"train_loss": -10.19070053100586, "global_step": 509982, "epoch": 3035} {"train_loss": -9.877245903015137, "global_step": 509983, "epoch": 3035} {"train_loss": -9.669146537780762, "global_step": 509984, "epoch": 3035} {"train_loss": -10.783597946166992, "global_step": 509985, "epoch": 3035} {"train_loss": -11.085610389709473, "global_step": 509986, "epoch": 3035} {"train_loss": -10.975107192993164, "global_step": 509987, "epoch": 3035} {"train_loss": -11.607555389404297, "global_step": 509988, "epoch": 3035} {"train_loss": -11.159969329833984, "global_step": 509989, "epoch": 3035} {"train_loss": -12.374431610107422, "global_step": 509990, "epoch": 3035} {"train_loss": -10.668615341186523, "global_step": 509991, "epoch": 3035} {"train_loss": -12.255135536193848, "global_step": 509992, "epoch": 3035} {"train_loss": -11.278251647949219, "global_step": 509993, "epoch": 3035} {"train_loss": -11.737039566040039, "global_step": 509994, "epoch": 3035} {"train_loss": -12.103814125061035, "global_step": 509995, "epoch": 3035} {"train_loss": -11.232335090637207, "global_step": 509996, "epoch": 3035} {"train_loss": -12.054113388061523, "global_step": 509997, "epoch": 3035} {"train_loss": -11.571554183959961, "global_step": 509998, "epoch": 3035} {"train_loss": -11.7376070022583, "global_step": 509999, "epoch": 3035} {"train_loss": -12.071619987487793, "global_step": 510000, "epoch": 3035} {"train_loss": -12.258967399597168, "global_step": 510001, "epoch": 3035} {"train_loss": -12.242634773254395, "global_step": 510002, "epoch": 3035} {"train_loss": -12.561636924743652, "global_step": 510003, "epoch": 3035} {"train_loss": -11.723392486572266, "global_step": 510004, "epoch": 3035} {"train_loss": -12.452560424804688, "global_step": 510005, "epoch": 3035} {"train_loss": -11.933141708374023, "global_step": 510006, "epoch": 3035} {"train_loss": -12.672591209411621, "global_step": 510007, "epoch": 3035} {"train_loss": -11.87510871887207, "global_step": 510008, "epoch": 3035} {"train_loss": -12.382606506347656, "global_step": 510009, "epoch": 3035} {"train_loss": -12.056589126586914, "global_step": 510010, "epoch": 3035} {"train_loss": -12.635278701782227, "global_step": 510011, "epoch": 3035} {"train_loss": -12.093698501586914, "global_step": 510012, "epoch": 3035} {"train_loss": -12.491519927978516, "global_step": 510013, "epoch": 3035} {"train_loss": -12.173425674438477, "global_step": 510014, "epoch": 3035} {"train_loss": -12.640083312988281, "global_step": 510015, "epoch": 3035} {"train_loss": -12.563228607177734, "global_step": 510016, "epoch": 3035} {"train_loss": -12.73675537109375, "global_step": 510017, "epoch": 3035} {"train_loss": -12.449296951293945, "global_step": 510018, "epoch": 3035} {"train_loss": -12.633909225463867, "global_step": 510019, "epoch": 3035} {"train_loss": -12.586014747619629, "global_step": 510020, "epoch": 3035} {"train_loss": -12.525949478149414, "global_step": 510021, "epoch": 3035} {"train_loss": -12.355865478515625, "global_step": 510022, "epoch": 3035} {"train_loss": -12.55856704711914, "global_step": 510023, "epoch": 3035} {"train_loss": -12.296517372131348, "global_step": 510024, "epoch": 3035} {"train_loss": -12.91786003112793, "global_step": 510025, "epoch": 3035} {"train_loss": -12.303919792175293, "global_step": 510026, "epoch": 3035} {"train_loss": -12.787792205810547, "global_step": 510027, "epoch": 3035} {"train_loss": -12.366466522216797, "global_step": 510028, "epoch": 3035} {"train_loss": -12.843140602111816, "global_step": 510029, "epoch": 3035} {"train_loss": -12.325027465820312, "global_step": 510030, "epoch": 3035} {"train_loss": -12.776144027709961, "global_step": 510031, "epoch": 3035} {"train_loss": -12.356939315795898, "global_step": 510032, "epoch": 3035} {"train_loss": -12.073968887329102, "global_step": 510033, "epoch": 3035} {"train_loss": -12.372466087341309, "global_step": 510034, "epoch": 3035} {"train_loss": -12.461912155151367, "global_step": 510035, "epoch": 3035} {"train_loss": -12.784285545349121, "global_step": 510036, "epoch": 3035} {"train_loss": -12.524408340454102, "global_step": 510037, "epoch": 3035} {"train_loss": -12.480710983276367, "global_step": 510038, "epoch": 3035} {"train_loss": -12.391221046447754, "global_step": 510039, "epoch": 3035} {"train_loss": -12.574722290039062, "global_step": 510040, "epoch": 3035} {"train_loss": -12.630599975585938, "global_step": 510041, "epoch": 3035} {"train_loss": -12.203828811645508, "global_step": 510042, "epoch": 3035} {"train_loss": -12.549436569213867, "global_step": 510043, "epoch": 3035} {"train_loss": -11.562378883361816, "global_step": 510044, "epoch": 3035} {"train_loss": -12.366629600524902, "global_step": 510045, "epoch": 3035} {"train_loss": -12.332935333251953, "global_step": 510046, "epoch": 3035} {"train_loss": -12.205279713585263, "global_step": 510047, "epoch": 3035, "val_loss": 319613.1875, "train_action_mse_error": 2.067755699157715} {"train_loss": -12.147298812866211, "global_step": 510048, "epoch": 3036} {"train_loss": -12.377880096435547, "global_step": 510049, "epoch": 3036} {"train_loss": -12.018197059631348, "global_step": 510050, "epoch": 3036} {"train_loss": -12.193408012390137, "global_step": 510051, "epoch": 3036} {"train_loss": -12.322687149047852, "global_step": 510052, "epoch": 3036} {"train_loss": -12.11678409576416, "global_step": 510053, "epoch": 3036} {"train_loss": -12.506278991699219, "global_step": 510054, "epoch": 3036} {"train_loss": -12.618200302124023, "global_step": 510055, "epoch": 3036} {"train_loss": -12.412654876708984, "global_step": 510056, "epoch": 3036} {"train_loss": -12.735926628112793, "global_step": 510057, "epoch": 3036} {"train_loss": -12.05533218383789, "global_step": 510058, "epoch": 3036} {"train_loss": -11.60522747039795, "global_step": 510059, "epoch": 3036} {"train_loss": -12.384836196899414, "global_step": 510060, "epoch": 3036} {"train_loss": -11.66912841796875, "global_step": 510061, "epoch": 3036} {"train_loss": -10.123912811279297, "global_step": 510062, "epoch": 3036} {"train_loss": -12.451629638671875, "global_step": 510063, "epoch": 3036} {"train_loss": -10.744281768798828, "global_step": 510064, "epoch": 3036} {"train_loss": -12.281078338623047, "global_step": 510065, "epoch": 3036} {"train_loss": -12.088321685791016, "global_step": 510066, "epoch": 3036} {"train_loss": -12.073347091674805, "global_step": 510067, "epoch": 3036} {"train_loss": -11.961858749389648, "global_step": 510068, "epoch": 3036} {"train_loss": -11.883591651916504, "global_step": 510069, "epoch": 3036} {"train_loss": -12.078539848327637, "global_step": 510070, "epoch": 3036} {"train_loss": -12.213336944580078, "global_step": 510071, "epoch": 3036} {"train_loss": -11.572519302368164, "global_step": 510072, "epoch": 3036} {"train_loss": -12.036182403564453, "global_step": 510073, "epoch": 3036} {"train_loss": -12.523880004882812, "global_step": 510074, "epoch": 3036} {"train_loss": -11.596598625183105, "global_step": 510075, "epoch": 3036} {"train_loss": -12.560892105102539, "global_step": 510076, "epoch": 3036} {"train_loss": -11.8297119140625, "global_step": 510077, "epoch": 3036} {"train_loss": -12.028878211975098, "global_step": 510078, "epoch": 3036} {"train_loss": -12.158563613891602, "global_step": 510079, "epoch": 3036} {"train_loss": -12.164052963256836, "global_step": 510080, "epoch": 3036} {"train_loss": -12.628499984741211, "global_step": 510081, "epoch": 3036} {"train_loss": -12.260339736938477, "global_step": 510082, "epoch": 3036} {"train_loss": -12.485057830810547, "global_step": 510083, "epoch": 3036} {"train_loss": -12.569541931152344, "global_step": 510084, "epoch": 3036} {"train_loss": -12.496275901794434, "global_step": 510085, "epoch": 3036} {"train_loss": -12.131536483764648, "global_step": 510086, "epoch": 3036} {"train_loss": -12.523030281066895, "global_step": 510087, "epoch": 3036} {"train_loss": -12.393779754638672, "global_step": 510088, "epoch": 3036} {"train_loss": -12.381916046142578, "global_step": 510089, "epoch": 3036} {"train_loss": -12.623000144958496, "global_step": 510090, "epoch": 3036} {"train_loss": -12.504738807678223, "global_step": 510091, "epoch": 3036} {"train_loss": -12.559659957885742, "global_step": 510092, "epoch": 3036} {"train_loss": -12.403450965881348, "global_step": 510093, "epoch": 3036} {"train_loss": -12.739105224609375, "global_step": 510094, "epoch": 3036} {"train_loss": -12.735240936279297, "global_step": 510095, "epoch": 3036} {"train_loss": -12.685150146484375, "global_step": 510096, "epoch": 3036} {"train_loss": -12.78590202331543, "global_step": 510097, "epoch": 3036} {"train_loss": -12.413530349731445, "global_step": 510098, "epoch": 3036} {"train_loss": -12.753280639648438, "global_step": 510099, "epoch": 3036} {"train_loss": -12.68770980834961, "global_step": 510100, "epoch": 3036} {"train_loss": -13.010370254516602, "global_step": 510101, "epoch": 3036} {"train_loss": -12.772125244140625, "global_step": 510102, "epoch": 3036} {"train_loss": -12.711063385009766, "global_step": 510103, "epoch": 3036} {"train_loss": -12.788900375366211, "global_step": 510104, "epoch": 3036} {"train_loss": -12.754592895507812, "global_step": 510105, "epoch": 3036} {"train_loss": -12.944367408752441, "global_step": 510106, "epoch": 3036} {"train_loss": -12.697122573852539, "global_step": 510107, "epoch": 3036} {"train_loss": -12.893387794494629, "global_step": 510108, "epoch": 3036} {"train_loss": -12.750650405883789, "global_step": 510109, "epoch": 3036} {"train_loss": -12.677717208862305, "global_step": 510110, "epoch": 3036} {"train_loss": -12.928837776184082, "global_step": 510111, "epoch": 3036} {"train_loss": -12.642130851745605, "global_step": 510112, "epoch": 3036} {"train_loss": -12.607357025146484, "global_step": 510113, "epoch": 3036} {"train_loss": -12.773073196411133, "global_step": 510114, "epoch": 3036} {"train_loss": -12.64012336730957, "global_step": 510115, "epoch": 3036} {"train_loss": -13.003915786743164, "global_step": 510116, "epoch": 3036} {"train_loss": -12.705787658691406, "global_step": 510117, "epoch": 3036} {"train_loss": -12.277507781982422, "global_step": 510118, "epoch": 3036} {"train_loss": -12.171154975891113, "global_step": 510119, "epoch": 3036} {"train_loss": -12.974069595336914, "global_step": 510120, "epoch": 3036} {"train_loss": -12.447070121765137, "global_step": 510121, "epoch": 3036} {"train_loss": -12.282054901123047, "global_step": 510122, "epoch": 3036} {"train_loss": -12.467147827148438, "global_step": 510123, "epoch": 3036} {"train_loss": -12.504186630249023, "global_step": 510124, "epoch": 3036} {"train_loss": -12.864789962768555, "global_step": 510125, "epoch": 3036} {"train_loss": -12.57242202758789, "global_step": 510126, "epoch": 3036} {"train_loss": -12.669111251831055, "global_step": 510127, "epoch": 3036} {"train_loss": -12.231040954589844, "global_step": 510128, "epoch": 3036} {"train_loss": -12.594147682189941, "global_step": 510129, "epoch": 3036} {"train_loss": -12.54005241394043, "global_step": 510130, "epoch": 3036} {"train_loss": -12.695722579956055, "global_step": 510131, "epoch": 3036} {"train_loss": -12.184568405151367, "global_step": 510132, "epoch": 3036} {"train_loss": -12.5720853805542, "global_step": 510133, "epoch": 3036} {"train_loss": -12.229360580444336, "global_step": 510134, "epoch": 3036} {"train_loss": -12.923664093017578, "global_step": 510135, "epoch": 3036} {"train_loss": -12.184768676757812, "global_step": 510136, "epoch": 3036} {"train_loss": -12.72236442565918, "global_step": 510137, "epoch": 3036} {"train_loss": -12.655967712402344, "global_step": 510138, "epoch": 3036} {"train_loss": -12.91215705871582, "global_step": 510139, "epoch": 3036} {"train_loss": -12.371429443359375, "global_step": 510140, "epoch": 3036} {"train_loss": -12.744970321655273, "global_step": 510141, "epoch": 3036} {"train_loss": -12.21234130859375, "global_step": 510142, "epoch": 3036} {"train_loss": -12.803229331970215, "global_step": 510143, "epoch": 3036} {"train_loss": -12.259405136108398, "global_step": 510144, "epoch": 3036} {"train_loss": -12.642340660095215, "global_step": 510145, "epoch": 3036} {"train_loss": -11.663599014282227, "global_step": 510146, "epoch": 3036} {"train_loss": -12.793208122253418, "global_step": 510147, "epoch": 3036} {"train_loss": -11.910928726196289, "global_step": 510148, "epoch": 3036} {"train_loss": -12.354619026184082, "global_step": 510149, "epoch": 3036} {"train_loss": -11.71988296508789, "global_step": 510150, "epoch": 3036} {"train_loss": -11.731891632080078, "global_step": 510151, "epoch": 3036} {"train_loss": -12.315079689025879, "global_step": 510152, "epoch": 3036} {"train_loss": -11.324904441833496, "global_step": 510153, "epoch": 3036} {"train_loss": -12.460409164428711, "global_step": 510154, "epoch": 3036} {"train_loss": -11.536157608032227, "global_step": 510155, "epoch": 3036} {"train_loss": -10.042707443237305, "global_step": 510156, "epoch": 3036} {"train_loss": -12.467926025390625, "global_step": 510157, "epoch": 3036} {"train_loss": -11.00536823272705, "global_step": 510158, "epoch": 3036} {"train_loss": -10.585927963256836, "global_step": 510159, "epoch": 3036} {"train_loss": -12.25174331665039, "global_step": 510160, "epoch": 3036} {"train_loss": -10.23126220703125, "global_step": 510161, "epoch": 3036} {"train_loss": -12.102119445800781, "global_step": 510162, "epoch": 3036} {"train_loss": -11.52954387664795, "global_step": 510163, "epoch": 3036} {"train_loss": -10.217752456665039, "global_step": 510164, "epoch": 3036} {"train_loss": -12.080880165100098, "global_step": 510165, "epoch": 3036} {"train_loss": -9.659692764282227, "global_step": 510166, "epoch": 3036} {"train_loss": -11.764175415039062, "global_step": 510167, "epoch": 3036} {"train_loss": -10.830432891845703, "global_step": 510168, "epoch": 3036} {"train_loss": -11.655038833618164, "global_step": 510169, "epoch": 3036} {"train_loss": -10.62069320678711, "global_step": 510170, "epoch": 3036} {"train_loss": -11.495888710021973, "global_step": 510171, "epoch": 3036} {"train_loss": -11.072290420532227, "global_step": 510172, "epoch": 3036} {"train_loss": -11.253281593322754, "global_step": 510173, "epoch": 3036} {"train_loss": -11.457609176635742, "global_step": 510174, "epoch": 3036} {"train_loss": -10.60445785522461, "global_step": 510175, "epoch": 3036} {"train_loss": -11.580449104309082, "global_step": 510176, "epoch": 3036} {"train_loss": -11.183241844177246, "global_step": 510177, "epoch": 3036} {"train_loss": -11.40964126586914, "global_step": 510178, "epoch": 3036} {"train_loss": -10.834596633911133, "global_step": 510179, "epoch": 3036} {"train_loss": -11.831588745117188, "global_step": 510180, "epoch": 3036} {"train_loss": -10.555890083312988, "global_step": 510181, "epoch": 3036} {"train_loss": -12.166994094848633, "global_step": 510182, "epoch": 3036} {"train_loss": -10.201921463012695, "global_step": 510183, "epoch": 3036} {"train_loss": -11.774438858032227, "global_step": 510184, "epoch": 3036} {"train_loss": -9.785135269165039, "global_step": 510185, "epoch": 3036} {"train_loss": -10.28252124786377, "global_step": 510186, "epoch": 3036} {"train_loss": -9.971458435058594, "global_step": 510187, "epoch": 3036} {"train_loss": -10.071296691894531, "global_step": 510188, "epoch": 3036} {"train_loss": -10.962539672851562, "global_step": 510189, "epoch": 3036} {"train_loss": -11.423731803894043, "global_step": 510190, "epoch": 3036} {"train_loss": -10.722532272338867, "global_step": 510191, "epoch": 3036} {"train_loss": -11.129772186279297, "global_step": 510192, "epoch": 3036} {"train_loss": -12.030046463012695, "global_step": 510193, "epoch": 3036} {"train_loss": -10.894307136535645, "global_step": 510194, "epoch": 3036} {"train_loss": -10.814931869506836, "global_step": 510195, "epoch": 3036} {"train_loss": -12.215445518493652, "global_step": 510196, "epoch": 3036} {"train_loss": -11.261869430541992, "global_step": 510197, "epoch": 3036} {"train_loss": -11.35379409790039, "global_step": 510198, "epoch": 3036} {"train_loss": -11.897375106811523, "global_step": 510199, "epoch": 3036} {"train_loss": -10.93253231048584, "global_step": 510200, "epoch": 3036} {"train_loss": -11.483508110046387, "global_step": 510201, "epoch": 3036} {"train_loss": -11.709980964660645, "global_step": 510202, "epoch": 3036} {"train_loss": -11.258681297302246, "global_step": 510203, "epoch": 3036} {"train_loss": -11.351824760437012, "global_step": 510204, "epoch": 3036} {"train_loss": -11.948975563049316, "global_step": 510205, "epoch": 3036} {"train_loss": -11.590736389160156, "global_step": 510206, "epoch": 3036} {"train_loss": -12.056081771850586, "global_step": 510207, "epoch": 3036} {"train_loss": -12.185690879821777, "global_step": 510208, "epoch": 3036} {"train_loss": -11.094869613647461, "global_step": 510209, "epoch": 3036} {"train_loss": -12.238329887390137, "global_step": 510210, "epoch": 3036} {"train_loss": -12.084001541137695, "global_step": 510211, "epoch": 3036} {"train_loss": -12.14090347290039, "global_step": 510212, "epoch": 3036} {"train_loss": -12.186408996582031, "global_step": 510213, "epoch": 3036} {"train_loss": -12.17422866821289, "global_step": 510214, "epoch": 3036} {"train_loss": -11.990420296078636, "global_step": 510215, "epoch": 3036, "val_loss": 318932.6875} {"train_loss": -12.489784240722656, "global_step": 510216, "epoch": 3037} {"train_loss": -12.379436492919922, "global_step": 510217, "epoch": 3037} {"train_loss": -12.32340145111084, "global_step": 510218, "epoch": 3037} {"train_loss": -12.24655532836914, "global_step": 510219, "epoch": 3037} {"train_loss": -11.875309944152832, "global_step": 510220, "epoch": 3037} {"train_loss": -12.471831321716309, "global_step": 510221, "epoch": 3037} {"train_loss": -12.236135482788086, "global_step": 510222, "epoch": 3037} {"train_loss": -12.325796127319336, "global_step": 510223, "epoch": 3037} {"train_loss": -12.390708923339844, "global_step": 510224, "epoch": 3037} {"train_loss": -12.275674819946289, "global_step": 510225, "epoch": 3037} {"train_loss": -12.364368438720703, "global_step": 510226, "epoch": 3037} {"train_loss": -12.472167015075684, "global_step": 510227, "epoch": 3037} {"train_loss": -12.213945388793945, "global_step": 510228, "epoch": 3037} {"train_loss": -12.317341804504395, "global_step": 510229, "epoch": 3037} {"train_loss": -12.127298355102539, "global_step": 510230, "epoch": 3037} {"train_loss": -12.34077262878418, "global_step": 510231, "epoch": 3037} {"train_loss": -12.510482788085938, "global_step": 510232, "epoch": 3037} {"train_loss": -12.455812454223633, "global_step": 510233, "epoch": 3037} {"train_loss": -12.44805908203125, "global_step": 510234, "epoch": 3037} {"train_loss": -12.468485832214355, "global_step": 510235, "epoch": 3037} {"train_loss": -12.637781143188477, "global_step": 510236, "epoch": 3037} {"train_loss": -12.437812805175781, "global_step": 510237, "epoch": 3037} {"train_loss": -12.67103385925293, "global_step": 510238, "epoch": 3037} {"train_loss": -12.75471305847168, "global_step": 510239, "epoch": 3037} {"train_loss": -12.730844497680664, "global_step": 510240, "epoch": 3037} {"train_loss": -12.570416450500488, "global_step": 510241, "epoch": 3037} {"train_loss": -12.684977531433105, "global_step": 510242, "epoch": 3037} {"train_loss": -12.764419555664062, "global_step": 510243, "epoch": 3037} {"train_loss": -12.87129020690918, "global_step": 510244, "epoch": 3037} {"train_loss": -12.890405654907227, "global_step": 510245, "epoch": 3037} {"train_loss": -12.750606536865234, "global_step": 510246, "epoch": 3037} {"train_loss": -12.771846771240234, "global_step": 510247, "epoch": 3037} {"train_loss": -12.784173965454102, "global_step": 510248, "epoch": 3037} {"train_loss": -12.786531448364258, "global_step": 510249, "epoch": 3037} {"train_loss": -12.70677661895752, "global_step": 510250, "epoch": 3037} {"train_loss": -12.843157768249512, "global_step": 510251, "epoch": 3037} {"train_loss": -12.634233474731445, "global_step": 510252, "epoch": 3037} {"train_loss": -12.704784393310547, "global_step": 510253, "epoch": 3037} {"train_loss": -12.800009727478027, "global_step": 510254, "epoch": 3037} {"train_loss": -12.914827346801758, "global_step": 510255, "epoch": 3037} {"train_loss": -12.88679313659668, "global_step": 510256, "epoch": 3037} {"train_loss": -12.734182357788086, "global_step": 510257, "epoch": 3037} {"train_loss": -12.909490585327148, "global_step": 510258, "epoch": 3037} {"train_loss": -12.982950210571289, "global_step": 510259, "epoch": 3037} {"train_loss": -12.70370101928711, "global_step": 510260, "epoch": 3037} {"train_loss": -12.737815856933594, "global_step": 510261, "epoch": 3037} {"train_loss": -12.868453979492188, "global_step": 510262, "epoch": 3037} {"train_loss": -12.890945434570312, "global_step": 510263, "epoch": 3037} {"train_loss": -13.018789291381836, "global_step": 510264, "epoch": 3037} {"train_loss": -12.892024993896484, "global_step": 510265, "epoch": 3037} {"train_loss": -12.769597053527832, "global_step": 510266, "epoch": 3037} {"train_loss": -12.849474906921387, "global_step": 510267, "epoch": 3037} {"train_loss": -12.828875541687012, "global_step": 510268, "epoch": 3037} {"train_loss": -12.795639038085938, "global_step": 510269, "epoch": 3037} {"train_loss": -13.19044303894043, "global_step": 510270, "epoch": 3037} {"train_loss": -12.948486328125, "global_step": 510271, "epoch": 3037} {"train_loss": -12.991073608398438, "global_step": 510272, "epoch": 3037} {"train_loss": -12.936868667602539, "global_step": 510273, "epoch": 3037} {"train_loss": -12.908170700073242, "global_step": 510274, "epoch": 3037} {"train_loss": -13.009708404541016, "global_step": 510275, "epoch": 3037} {"train_loss": -12.570459365844727, "global_step": 510276, "epoch": 3037} {"train_loss": -12.811270713806152, "global_step": 510277, "epoch": 3037} {"train_loss": -12.751617431640625, "global_step": 510278, "epoch": 3037} {"train_loss": -12.622175216674805, "global_step": 510279, "epoch": 3037} {"train_loss": -12.911151885986328, "global_step": 510280, "epoch": 3037} {"train_loss": -12.764419555664062, "global_step": 510281, "epoch": 3037} {"train_loss": -12.786598205566406, "global_step": 510282, "epoch": 3037} {"train_loss": -12.6986083984375, "global_step": 510283, "epoch": 3037} {"train_loss": -12.808849334716797, "global_step": 510284, "epoch": 3037} {"train_loss": -13.062187194824219, "global_step": 510285, "epoch": 3037} {"train_loss": -12.828583717346191, "global_step": 510286, "epoch": 3037} {"train_loss": -12.960241317749023, "global_step": 510287, "epoch": 3037} {"train_loss": -12.603227615356445, "global_step": 510288, "epoch": 3037} {"train_loss": -12.974059104919434, "global_step": 510289, "epoch": 3037} {"train_loss": -12.976009368896484, "global_step": 510290, "epoch": 3037} {"train_loss": -13.151162147521973, "global_step": 510291, "epoch": 3037} {"train_loss": -12.923999786376953, "global_step": 510292, "epoch": 3037} {"train_loss": -12.860888481140137, "global_step": 510293, "epoch": 3037} {"train_loss": -12.909852981567383, "global_step": 510294, "epoch": 3037} {"train_loss": -12.905017852783203, "global_step": 510295, "epoch": 3037} {"train_loss": -12.824592590332031, "global_step": 510296, "epoch": 3037} {"train_loss": -12.351381301879883, "global_step": 510297, "epoch": 3037} {"train_loss": -12.512543678283691, "global_step": 510298, "epoch": 3037} {"train_loss": -12.561885833740234, "global_step": 510299, "epoch": 3037} {"train_loss": -12.71461009979248, "global_step": 510300, "epoch": 3037} {"train_loss": -12.864380836486816, "global_step": 510301, "epoch": 3037} {"train_loss": -13.233692169189453, "global_step": 510302, "epoch": 3037} {"train_loss": -13.015525817871094, "global_step": 510303, "epoch": 3037} {"train_loss": -13.078761100769043, "global_step": 510304, "epoch": 3037} {"train_loss": -12.922626495361328, "global_step": 510305, "epoch": 3037} {"train_loss": -13.065141677856445, "global_step": 510306, "epoch": 3037} {"train_loss": -12.90874195098877, "global_step": 510307, "epoch": 3037} {"train_loss": -13.096319198608398, "global_step": 510308, "epoch": 3037} {"train_loss": -12.813617706298828, "global_step": 510309, "epoch": 3037} {"train_loss": -12.667387962341309, "global_step": 510310, "epoch": 3037} {"train_loss": -12.77562141418457, "global_step": 510311, "epoch": 3037} {"train_loss": -12.894119262695312, "global_step": 510312, "epoch": 3037} {"train_loss": -12.859519958496094, "global_step": 510313, "epoch": 3037} {"train_loss": -12.53989028930664, "global_step": 510314, "epoch": 3037} {"train_loss": -11.251749038696289, "global_step": 510315, "epoch": 3037} {"train_loss": -11.961030960083008, "global_step": 510316, "epoch": 3037} {"train_loss": -12.54085922241211, "global_step": 510317, "epoch": 3037} {"train_loss": -12.825214385986328, "global_step": 510318, "epoch": 3037} {"train_loss": -12.243614196777344, "global_step": 510319, "epoch": 3037} {"train_loss": -11.002288818359375, "global_step": 510320, "epoch": 3037} {"train_loss": -12.639055252075195, "global_step": 510321, "epoch": 3037} {"train_loss": -12.178365707397461, "global_step": 510322, "epoch": 3037} {"train_loss": -12.526988983154297, "global_step": 510323, "epoch": 3037} {"train_loss": -11.497713088989258, "global_step": 510324, "epoch": 3037} {"train_loss": -12.766305923461914, "global_step": 510325, "epoch": 3037} {"train_loss": -11.21585750579834, "global_step": 510326, "epoch": 3037} {"train_loss": -12.601691246032715, "global_step": 510327, "epoch": 3037} {"train_loss": -11.617631912231445, "global_step": 510328, "epoch": 3037} {"train_loss": -12.895484924316406, "global_step": 510329, "epoch": 3037} {"train_loss": -12.517650604248047, "global_step": 510330, "epoch": 3037} {"train_loss": -12.278623580932617, "global_step": 510331, "epoch": 3037} {"train_loss": -12.330559730529785, "global_step": 510332, "epoch": 3037} {"train_loss": -11.193920135498047, "global_step": 510333, "epoch": 3037} {"train_loss": -10.438759803771973, "global_step": 510334, "epoch": 3037} {"train_loss": -12.412164688110352, "global_step": 510335, "epoch": 3037} {"train_loss": -11.344355583190918, "global_step": 510336, "epoch": 3037} {"train_loss": -11.597822189331055, "global_step": 510337, "epoch": 3037} {"train_loss": -11.827858924865723, "global_step": 510338, "epoch": 3037} {"train_loss": -11.441169738769531, "global_step": 510339, "epoch": 3037} {"train_loss": -12.536886215209961, "global_step": 510340, "epoch": 3037} {"train_loss": -11.722728729248047, "global_step": 510341, "epoch": 3037} {"train_loss": -12.316950798034668, "global_step": 510342, "epoch": 3037} {"train_loss": -11.869216918945312, "global_step": 510343, "epoch": 3037} {"train_loss": -12.629133224487305, "global_step": 510344, "epoch": 3037} {"train_loss": -11.214142799377441, "global_step": 510345, "epoch": 3037} {"train_loss": -12.262360572814941, "global_step": 510346, "epoch": 3037} {"train_loss": -10.911543846130371, "global_step": 510347, "epoch": 3037} {"train_loss": -12.613186836242676, "global_step": 510348, "epoch": 3037} {"train_loss": -11.470693588256836, "global_step": 510349, "epoch": 3037} {"train_loss": -11.926033020019531, "global_step": 510350, "epoch": 3037} {"train_loss": -11.367700576782227, "global_step": 510351, "epoch": 3037} {"train_loss": -12.567968368530273, "global_step": 510352, "epoch": 3037} {"train_loss": -11.236469268798828, "global_step": 510353, "epoch": 3037} {"train_loss": -12.145532608032227, "global_step": 510354, "epoch": 3037} {"train_loss": -12.266180038452148, "global_step": 510355, "epoch": 3037} {"train_loss": -12.467216491699219, "global_step": 510356, "epoch": 3037} {"train_loss": -12.079707145690918, "global_step": 510357, "epoch": 3037} {"train_loss": -12.141267776489258, "global_step": 510358, "epoch": 3037} {"train_loss": -11.476469993591309, "global_step": 510359, "epoch": 3037} {"train_loss": -12.356781005859375, "global_step": 510360, "epoch": 3037} {"train_loss": -12.162202835083008, "global_step": 510361, "epoch": 3037} {"train_loss": -12.286869049072266, "global_step": 510362, "epoch": 3037} {"train_loss": -12.171953201293945, "global_step": 510363, "epoch": 3037} {"train_loss": -12.557907104492188, "global_step": 510364, "epoch": 3037} {"train_loss": -12.337789535522461, "global_step": 510365, "epoch": 3037} {"train_loss": -12.54589557647705, "global_step": 510366, "epoch": 3037} {"train_loss": -12.296812057495117, "global_step": 510367, "epoch": 3037} {"train_loss": -12.470222473144531, "global_step": 510368, "epoch": 3037} {"train_loss": -12.626802444458008, "global_step": 510369, "epoch": 3037} {"train_loss": -12.336411476135254, "global_step": 510370, "epoch": 3037} {"train_loss": -12.681868553161621, "global_step": 510371, "epoch": 3037} {"train_loss": -12.62977409362793, "global_step": 510372, "epoch": 3037} {"train_loss": -12.670951843261719, "global_step": 510373, "epoch": 3037} {"train_loss": -12.880996704101562, "global_step": 510374, "epoch": 3037} {"train_loss": -12.533733367919922, "global_step": 510375, "epoch": 3037} {"train_loss": -12.391252517700195, "global_step": 510376, "epoch": 3037} {"train_loss": -12.703537940979004, "global_step": 510377, "epoch": 3037} {"train_loss": -12.720479965209961, "global_step": 510378, "epoch": 3037} {"train_loss": -12.736772537231445, "global_step": 510379, "epoch": 3037} {"train_loss": -12.751093864440918, "global_step": 510380, "epoch": 3037} {"train_loss": -12.190690994262695, "global_step": 510381, "epoch": 3037} {"train_loss": -12.42535400390625, "global_step": 510382, "epoch": 3037} {"train_loss": -12.48712864943913, "global_step": 510383, "epoch": 3037, "val_loss": 319213.9375} {"train_loss": -12.290691375732422, "global_step": 510384, "epoch": 3038} {"train_loss": -12.494634628295898, "global_step": 510385, "epoch": 3038} {"train_loss": -11.723320007324219, "global_step": 510386, "epoch": 3038} {"train_loss": -12.061918258666992, "global_step": 510387, "epoch": 3038} {"train_loss": -12.524072647094727, "global_step": 510388, "epoch": 3038} {"train_loss": -11.972779273986816, "global_step": 510389, "epoch": 3038} {"train_loss": -11.965868949890137, "global_step": 510390, "epoch": 3038} {"train_loss": -12.700271606445312, "global_step": 510391, "epoch": 3038} {"train_loss": -12.803776741027832, "global_step": 510392, "epoch": 3038} {"train_loss": -12.151546478271484, "global_step": 510393, "epoch": 3038} {"train_loss": -12.105541229248047, "global_step": 510394, "epoch": 3038} {"train_loss": -12.693860054016113, "global_step": 510395, "epoch": 3038} {"train_loss": -12.711712837219238, "global_step": 510396, "epoch": 3038} {"train_loss": -12.01432991027832, "global_step": 510397, "epoch": 3038} {"train_loss": -12.96625804901123, "global_step": 510398, "epoch": 3038} {"train_loss": -12.382692337036133, "global_step": 510399, "epoch": 3038} {"train_loss": -12.921957969665527, "global_step": 510400, "epoch": 3038} {"train_loss": -12.54551887512207, "global_step": 510401, "epoch": 3038} {"train_loss": -12.598554611206055, "global_step": 510402, "epoch": 3038} {"train_loss": -12.496379852294922, "global_step": 510403, "epoch": 3038} {"train_loss": -12.596695899963379, "global_step": 510404, "epoch": 3038} {"train_loss": -12.605443954467773, "global_step": 510405, "epoch": 3038} {"train_loss": -13.080142974853516, "global_step": 510406, "epoch": 3038} {"train_loss": -12.509990692138672, "global_step": 510407, "epoch": 3038} {"train_loss": -12.490968704223633, "global_step": 510408, "epoch": 3038} {"train_loss": -12.44565200805664, "global_step": 510409, "epoch": 3038} {"train_loss": -12.843347549438477, "global_step": 510410, "epoch": 3038} {"train_loss": -12.284366607666016, "global_step": 510411, "epoch": 3038} {"train_loss": -12.623708724975586, "global_step": 510412, "epoch": 3038} {"train_loss": -12.65139102935791, "global_step": 510413, "epoch": 3038} {"train_loss": -11.8926362991333, "global_step": 510414, "epoch": 3038} {"train_loss": -12.025962829589844, "global_step": 510415, "epoch": 3038} {"train_loss": -12.533864974975586, "global_step": 510416, "epoch": 3038} {"train_loss": -11.431013107299805, "global_step": 510417, "epoch": 3038} {"train_loss": -12.480659484863281, "global_step": 510418, "epoch": 3038} {"train_loss": -12.627696990966797, "global_step": 510419, "epoch": 3038} {"train_loss": -11.70432186126709, "global_step": 510420, "epoch": 3038} {"train_loss": -12.47079849243164, "global_step": 510421, "epoch": 3038} {"train_loss": -12.032963752746582, "global_step": 510422, "epoch": 3038} {"train_loss": -11.72838306427002, "global_step": 510423, "epoch": 3038} {"train_loss": -12.172891616821289, "global_step": 510424, "epoch": 3038} {"train_loss": -10.62450885772705, "global_step": 510425, "epoch": 3038} {"train_loss": -10.94870662689209, "global_step": 510426, "epoch": 3038} {"train_loss": -11.690235137939453, "global_step": 510427, "epoch": 3038} {"train_loss": -9.502250671386719, "global_step": 510428, "epoch": 3038} {"train_loss": -11.473608016967773, "global_step": 510429, "epoch": 3038} {"train_loss": -8.888240814208984, "global_step": 510430, "epoch": 3038} {"train_loss": -9.446552276611328, "global_step": 510431, "epoch": 3038} {"train_loss": -8.801807403564453, "global_step": 510432, "epoch": 3038} {"train_loss": -9.74334716796875, "global_step": 510433, "epoch": 3038} {"train_loss": -8.812372207641602, "global_step": 510434, "epoch": 3038} {"train_loss": -9.012741088867188, "global_step": 510435, "epoch": 3038} {"train_loss": -10.09799575805664, "global_step": 510436, "epoch": 3038} {"train_loss": -11.232794761657715, "global_step": 510437, "epoch": 3038} {"train_loss": -10.143189430236816, "global_step": 510438, "epoch": 3038} {"train_loss": -10.695422172546387, "global_step": 510439, "epoch": 3038} {"train_loss": -12.124099731445312, "global_step": 510440, "epoch": 3038} {"train_loss": -10.202570915222168, "global_step": 510441, "epoch": 3038} {"train_loss": -11.103609085083008, "global_step": 510442, "epoch": 3038} {"train_loss": -11.214187622070312, "global_step": 510443, "epoch": 3038} {"train_loss": -10.578554153442383, "global_step": 510444, "epoch": 3038} {"train_loss": -12.04134464263916, "global_step": 510445, "epoch": 3038} {"train_loss": -11.570497512817383, "global_step": 510446, "epoch": 3038} {"train_loss": -11.989201545715332, "global_step": 510447, "epoch": 3038} {"train_loss": -11.836859703063965, "global_step": 510448, "epoch": 3038} {"train_loss": -11.660444259643555, "global_step": 510449, "epoch": 3038} {"train_loss": -12.156620979309082, "global_step": 510450, "epoch": 3038} {"train_loss": -11.928119659423828, "global_step": 510451, "epoch": 3038} {"train_loss": -12.148443222045898, "global_step": 510452, "epoch": 3038} {"train_loss": -11.837560653686523, "global_step": 510453, "epoch": 3038} {"train_loss": -12.148181915283203, "global_step": 510454, "epoch": 3038} {"train_loss": -12.276458740234375, "global_step": 510455, "epoch": 3038} {"train_loss": -12.119176864624023, "global_step": 510456, "epoch": 3038} {"train_loss": -11.859037399291992, "global_step": 510457, "epoch": 3038} {"train_loss": -12.271049499511719, "global_step": 510458, "epoch": 3038} {"train_loss": -12.081171035766602, "global_step": 510459, "epoch": 3038} {"train_loss": -12.272872924804688, "global_step": 510460, "epoch": 3038} {"train_loss": -12.738606452941895, "global_step": 510461, "epoch": 3038} {"train_loss": -11.809646606445312, "global_step": 510462, "epoch": 3038} {"train_loss": -12.270058631896973, "global_step": 510463, "epoch": 3038} {"train_loss": -11.953278541564941, "global_step": 510464, "epoch": 3038} {"train_loss": -11.801789283752441, "global_step": 510465, "epoch": 3038} {"train_loss": -12.153730392456055, "global_step": 510466, "epoch": 3038} {"train_loss": -11.391749382019043, "global_step": 510467, "epoch": 3038} {"train_loss": -12.161296844482422, "global_step": 510468, "epoch": 3038} {"train_loss": -12.129748344421387, "global_step": 510469, "epoch": 3038} {"train_loss": -11.982112884521484, "global_step": 510470, "epoch": 3038} {"train_loss": -12.132074356079102, "global_step": 510471, "epoch": 3038} {"train_loss": -11.873443603515625, "global_step": 510472, "epoch": 3038} {"train_loss": -12.217242240905762, "global_step": 510473, "epoch": 3038} {"train_loss": -12.22210693359375, "global_step": 510474, "epoch": 3038} {"train_loss": -11.967019081115723, "global_step": 510475, "epoch": 3038} {"train_loss": -12.143524169921875, "global_step": 510476, "epoch": 3038} {"train_loss": -11.259808540344238, "global_step": 510477, "epoch": 3038} {"train_loss": -12.318111419677734, "global_step": 510478, "epoch": 3038} {"train_loss": -11.143282890319824, "global_step": 510479, "epoch": 3038} {"train_loss": -11.75351333618164, "global_step": 510480, "epoch": 3038} {"train_loss": -11.620979309082031, "global_step": 510481, "epoch": 3038} {"train_loss": -11.523330688476562, "global_step": 510482, "epoch": 3038} {"train_loss": -12.010045051574707, "global_step": 510483, "epoch": 3038} {"train_loss": -10.79797649383545, "global_step": 510484, "epoch": 3038} {"train_loss": -11.843265533447266, "global_step": 510485, "epoch": 3038} {"train_loss": -10.897112846374512, "global_step": 510486, "epoch": 3038} {"train_loss": -10.671009063720703, "global_step": 510487, "epoch": 3038} {"train_loss": -11.829732894897461, "global_step": 510488, "epoch": 3038} {"train_loss": -10.080572128295898, "global_step": 510489, "epoch": 3038} {"train_loss": -11.022112846374512, "global_step": 510490, "epoch": 3038} {"train_loss": -10.573138236999512, "global_step": 510491, "epoch": 3038} {"train_loss": -10.906380653381348, "global_step": 510492, "epoch": 3038} {"train_loss": -10.579133987426758, "global_step": 510493, "epoch": 3038} {"train_loss": -12.208524703979492, "global_step": 510494, "epoch": 3038} {"train_loss": -10.061366081237793, "global_step": 510495, "epoch": 3038} {"train_loss": -11.532235145568848, "global_step": 510496, "epoch": 3038} {"train_loss": -10.219698905944824, "global_step": 510497, "epoch": 3038} {"train_loss": -11.109848022460938, "global_step": 510498, "epoch": 3038} {"train_loss": -11.593932151794434, "global_step": 510499, "epoch": 3038} {"train_loss": -11.57343578338623, "global_step": 510500, "epoch": 3038} {"train_loss": -11.652793884277344, "global_step": 510501, "epoch": 3038} {"train_loss": -11.765226364135742, "global_step": 510502, "epoch": 3038} {"train_loss": -11.670304298400879, "global_step": 510503, "epoch": 3038} {"train_loss": -11.807867050170898, "global_step": 510504, "epoch": 3038} {"train_loss": -11.801507949829102, "global_step": 510505, "epoch": 3038} {"train_loss": -12.156157493591309, "global_step": 510506, "epoch": 3038} {"train_loss": -11.735603332519531, "global_step": 510507, "epoch": 3038} {"train_loss": -12.443564414978027, "global_step": 510508, "epoch": 3038} {"train_loss": -11.86084270477295, "global_step": 510509, "epoch": 3038} {"train_loss": -12.352693557739258, "global_step": 510510, "epoch": 3038} {"train_loss": -11.931402206420898, "global_step": 510511, "epoch": 3038} {"train_loss": -12.102792739868164, "global_step": 510512, "epoch": 3038} {"train_loss": -12.379545211791992, "global_step": 510513, "epoch": 3038} {"train_loss": -12.311582565307617, "global_step": 510514, "epoch": 3038} {"train_loss": -12.290907859802246, "global_step": 510515, "epoch": 3038} {"train_loss": -12.362552642822266, "global_step": 510516, "epoch": 3038} {"train_loss": -12.374801635742188, "global_step": 510517, "epoch": 3038} {"train_loss": -12.456409454345703, "global_step": 510518, "epoch": 3038} {"train_loss": -12.441688537597656, "global_step": 510519, "epoch": 3038} {"train_loss": -12.473413467407227, "global_step": 510520, "epoch": 3038} {"train_loss": -11.98370361328125, "global_step": 510521, "epoch": 3038} {"train_loss": -12.327291488647461, "global_step": 510522, "epoch": 3038} {"train_loss": -12.333391189575195, "global_step": 510523, "epoch": 3038} {"train_loss": -12.326772689819336, "global_step": 510524, "epoch": 3038} {"train_loss": -12.205301284790039, "global_step": 510525, "epoch": 3038} {"train_loss": -12.528243064880371, "global_step": 510526, "epoch": 3038} {"train_loss": -11.84787368774414, "global_step": 510527, "epoch": 3038} {"train_loss": -12.625246047973633, "global_step": 510528, "epoch": 3038} {"train_loss": -12.374732971191406, "global_step": 510529, "epoch": 3038} {"train_loss": -12.083385467529297, "global_step": 510530, "epoch": 3038} {"train_loss": -12.656506538391113, "global_step": 510531, "epoch": 3038} {"train_loss": -12.482787132263184, "global_step": 510532, "epoch": 3038} {"train_loss": -12.519209861755371, "global_step": 510533, "epoch": 3038} {"train_loss": -12.596389770507812, "global_step": 510534, "epoch": 3038} {"train_loss": -12.313885688781738, "global_step": 510535, "epoch": 3038} {"train_loss": -12.589202880859375, "global_step": 510536, "epoch": 3038} {"train_loss": -12.651677131652832, "global_step": 510537, "epoch": 3038} {"train_loss": -12.476978302001953, "global_step": 510538, "epoch": 3038} {"train_loss": -12.641751289367676, "global_step": 510539, "epoch": 3038} {"train_loss": -12.536579132080078, "global_step": 510540, "epoch": 3038} {"train_loss": -12.56482982635498, "global_step": 510541, "epoch": 3038} {"train_loss": -12.704002380371094, "global_step": 510542, "epoch": 3038} {"train_loss": -12.697813987731934, "global_step": 510543, "epoch": 3038} {"train_loss": -12.74999713897705, "global_step": 510544, "epoch": 3038} {"train_loss": -12.594449043273926, "global_step": 510545, "epoch": 3038} {"train_loss": -12.823186874389648, "global_step": 510546, "epoch": 3038} {"train_loss": -12.563089370727539, "global_step": 510547, "epoch": 3038} {"train_loss": -12.718929290771484, "global_step": 510548, "epoch": 3038} {"train_loss": -12.80153751373291, "global_step": 510549, "epoch": 3038} {"train_loss": -12.730047225952148, "global_step": 510550, "epoch": 3038} {"train_loss": -11.892745983032952, "global_step": 510551, "epoch": 3038, "val_loss": 317907.625} {"train_loss": -12.856252670288086, "global_step": 510552, "epoch": 3039} {"train_loss": -12.859353065490723, "global_step": 510553, "epoch": 3039} {"train_loss": -12.94619369506836, "global_step": 510554, "epoch": 3039} {"train_loss": -12.898775100708008, "global_step": 510555, "epoch": 3039} {"train_loss": -12.804449081420898, "global_step": 510556, "epoch": 3039} {"train_loss": -12.88370418548584, "global_step": 510557, "epoch": 3039} {"train_loss": -12.815185546875, "global_step": 510558, "epoch": 3039} {"train_loss": -12.88585376739502, "global_step": 510559, "epoch": 3039} {"train_loss": -12.8297700881958, "global_step": 510560, "epoch": 3039} {"train_loss": -12.559799194335938, "global_step": 510561, "epoch": 3039} {"train_loss": -12.788212776184082, "global_step": 510562, "epoch": 3039} {"train_loss": -12.832733154296875, "global_step": 510563, "epoch": 3039} {"train_loss": -12.96992301940918, "global_step": 510564, "epoch": 3039} {"train_loss": -12.613652229309082, "global_step": 510565, "epoch": 3039} {"train_loss": -12.872541427612305, "global_step": 510566, "epoch": 3039} {"train_loss": -12.860733985900879, "global_step": 510567, "epoch": 3039} {"train_loss": -12.841773986816406, "global_step": 510568, "epoch": 3039} {"train_loss": -12.86373519897461, "global_step": 510569, "epoch": 3039} {"train_loss": -12.557981491088867, "global_step": 510570, "epoch": 3039} {"train_loss": -12.65224838256836, "global_step": 510571, "epoch": 3039} {"train_loss": -12.363354682922363, "global_step": 510572, "epoch": 3039} {"train_loss": -12.698583602905273, "global_step": 510573, "epoch": 3039} {"train_loss": -12.263004302978516, "global_step": 510574, "epoch": 3039} {"train_loss": -12.184775352478027, "global_step": 510575, "epoch": 3039} {"train_loss": -11.856094360351562, "global_step": 510576, "epoch": 3039} {"train_loss": -11.731258392333984, "global_step": 510577, "epoch": 3039} {"train_loss": -12.36890983581543, "global_step": 510578, "epoch": 3039} {"train_loss": -10.798856735229492, "global_step": 510579, "epoch": 3039} {"train_loss": -11.865252494812012, "global_step": 510580, "epoch": 3039} {"train_loss": -10.41196346282959, "global_step": 510581, "epoch": 3039} {"train_loss": -11.280365943908691, "global_step": 510582, "epoch": 3039} {"train_loss": -11.143085479736328, "global_step": 510583, "epoch": 3039} {"train_loss": -10.655509948730469, "global_step": 510584, "epoch": 3039} {"train_loss": -9.673105239868164, "global_step": 510585, "epoch": 3039} {"train_loss": -10.449914932250977, "global_step": 510586, "epoch": 3039} {"train_loss": -10.732388496398926, "global_step": 510587, "epoch": 3039} {"train_loss": -10.683769226074219, "global_step": 510588, "epoch": 3039} {"train_loss": -9.96721076965332, "global_step": 510589, "epoch": 3039} {"train_loss": -11.086576461791992, "global_step": 510590, "epoch": 3039} {"train_loss": -11.364864349365234, "global_step": 510591, "epoch": 3039} {"train_loss": -9.896869659423828, "global_step": 510592, "epoch": 3039} {"train_loss": -11.563058853149414, "global_step": 510593, "epoch": 3039} {"train_loss": -11.464807510375977, "global_step": 510594, "epoch": 3039} {"train_loss": -11.913352012634277, "global_step": 510595, "epoch": 3039} {"train_loss": -11.895370483398438, "global_step": 510596, "epoch": 3039} {"train_loss": -11.527809143066406, "global_step": 510597, "epoch": 3039} {"train_loss": -12.401961326599121, "global_step": 510598, "epoch": 3039} {"train_loss": -12.285822868347168, "global_step": 510599, "epoch": 3039} {"train_loss": -12.275907516479492, "global_step": 510600, "epoch": 3039} {"train_loss": -12.254659652709961, "global_step": 510601, "epoch": 3039} {"train_loss": -12.075969696044922, "global_step": 510602, "epoch": 3039} {"train_loss": -12.069367408752441, "global_step": 510603, "epoch": 3039} {"train_loss": -12.253377914428711, "global_step": 510604, "epoch": 3039} {"train_loss": -12.221776962280273, "global_step": 510605, "epoch": 3039} {"train_loss": -12.298839569091797, "global_step": 510606, "epoch": 3039} {"train_loss": -11.675928115844727, "global_step": 510607, "epoch": 3039} {"train_loss": -12.505508422851562, "global_step": 510608, "epoch": 3039} {"train_loss": -12.198019981384277, "global_step": 510609, "epoch": 3039} {"train_loss": -12.465678215026855, "global_step": 510610, "epoch": 3039} {"train_loss": -12.492053985595703, "global_step": 510611, "epoch": 3039} {"train_loss": -12.304544448852539, "global_step": 510612, "epoch": 3039} {"train_loss": -12.581645965576172, "global_step": 510613, "epoch": 3039} {"train_loss": -12.205001831054688, "global_step": 510614, "epoch": 3039} {"train_loss": -12.797784805297852, "global_step": 510615, "epoch": 3039} {"train_loss": -12.36250114440918, "global_step": 510616, "epoch": 3039} {"train_loss": -12.62524127960205, "global_step": 510617, "epoch": 3039} {"train_loss": -12.428317070007324, "global_step": 510618, "epoch": 3039} {"train_loss": -12.583097457885742, "global_step": 510619, "epoch": 3039} {"train_loss": -12.476375579833984, "global_step": 510620, "epoch": 3039} {"train_loss": -12.42447566986084, "global_step": 510621, "epoch": 3039} {"train_loss": -12.627467155456543, "global_step": 510622, "epoch": 3039} {"train_loss": -12.493339538574219, "global_step": 510623, "epoch": 3039} {"train_loss": -12.695442199707031, "global_step": 510624, "epoch": 3039} {"train_loss": -12.795997619628906, "global_step": 510625, "epoch": 3039} {"train_loss": -12.675481796264648, "global_step": 510626, "epoch": 3039} {"train_loss": -12.818626403808594, "global_step": 510627, "epoch": 3039} {"train_loss": -12.988295555114746, "global_step": 510628, "epoch": 3039} {"train_loss": -12.471071243286133, "global_step": 510629, "epoch": 3039} {"train_loss": -12.837910652160645, "global_step": 510630, "epoch": 3039} {"train_loss": -12.710643768310547, "global_step": 510631, "epoch": 3039} {"train_loss": -12.888895034790039, "global_step": 510632, "epoch": 3039} {"train_loss": -12.599178314208984, "global_step": 510633, "epoch": 3039} {"train_loss": -12.826425552368164, "global_step": 510634, "epoch": 3039} {"train_loss": -12.61128044128418, "global_step": 510635, "epoch": 3039} {"train_loss": -12.658902168273926, "global_step": 510636, "epoch": 3039} {"train_loss": -12.608087539672852, "global_step": 510637, "epoch": 3039} {"train_loss": -12.802979469299316, "global_step": 510638, "epoch": 3039} {"train_loss": -12.72004222869873, "global_step": 510639, "epoch": 3039} {"train_loss": -12.717517852783203, "global_step": 510640, "epoch": 3039} {"train_loss": -12.748260498046875, "global_step": 510641, "epoch": 3039} {"train_loss": -12.801173210144043, "global_step": 510642, "epoch": 3039} {"train_loss": -12.781550407409668, "global_step": 510643, "epoch": 3039} {"train_loss": -12.916399002075195, "global_step": 510644, "epoch": 3039} {"train_loss": -12.863775253295898, "global_step": 510645, "epoch": 3039} {"train_loss": -12.794486045837402, "global_step": 510646, "epoch": 3039} {"train_loss": -12.798600196838379, "global_step": 510647, "epoch": 3039} {"train_loss": -12.933160781860352, "global_step": 510648, "epoch": 3039} {"train_loss": -12.663490295410156, "global_step": 510649, "epoch": 3039} {"train_loss": -12.785890579223633, "global_step": 510650, "epoch": 3039} {"train_loss": -12.852855682373047, "global_step": 510651, "epoch": 3039} {"train_loss": -12.717310905456543, "global_step": 510652, "epoch": 3039} {"train_loss": -12.865249633789062, "global_step": 510653, "epoch": 3039} {"train_loss": -13.019021987915039, "global_step": 510654, "epoch": 3039} {"train_loss": -12.802566528320312, "global_step": 510655, "epoch": 3039} {"train_loss": -13.02104377746582, "global_step": 510656, "epoch": 3039} {"train_loss": -12.817575454711914, "global_step": 510657, "epoch": 3039} {"train_loss": -12.833626747131348, "global_step": 510658, "epoch": 3039} {"train_loss": -13.009268760681152, "global_step": 510659, "epoch": 3039} {"train_loss": -12.875749588012695, "global_step": 510660, "epoch": 3039} {"train_loss": -12.982636451721191, "global_step": 510661, "epoch": 3039} {"train_loss": -13.098594665527344, "global_step": 510662, "epoch": 3039} {"train_loss": -12.838329315185547, "global_step": 510663, "epoch": 3039} {"train_loss": -13.02304458618164, "global_step": 510664, "epoch": 3039} {"train_loss": -12.910043716430664, "global_step": 510665, "epoch": 3039} {"train_loss": -12.83094596862793, "global_step": 510666, "epoch": 3039} {"train_loss": -12.584272384643555, "global_step": 510667, "epoch": 3039} {"train_loss": -12.264744758605957, "global_step": 510668, "epoch": 3039} {"train_loss": -12.27107048034668, "global_step": 510669, "epoch": 3039} {"train_loss": -12.517884254455566, "global_step": 510670, "epoch": 3039} {"train_loss": -12.390507698059082, "global_step": 510671, "epoch": 3039} {"train_loss": -11.403348922729492, "global_step": 510672, "epoch": 3039} {"train_loss": -11.986595153808594, "global_step": 510673, "epoch": 3039} {"train_loss": -11.210643768310547, "global_step": 510674, "epoch": 3039} {"train_loss": -11.941656112670898, "global_step": 510675, "epoch": 3039} {"train_loss": -10.264132499694824, "global_step": 510676, "epoch": 3039} {"train_loss": -11.518625259399414, "global_step": 510677, "epoch": 3039} {"train_loss": -9.223489761352539, "global_step": 510678, "epoch": 3039} {"train_loss": -12.100507736206055, "global_step": 510679, "epoch": 3039} {"train_loss": -9.4906005859375, "global_step": 510680, "epoch": 3039} {"train_loss": -10.694999694824219, "global_step": 510681, "epoch": 3039} {"train_loss": -11.725282669067383, "global_step": 510682, "epoch": 3039} {"train_loss": -9.123329162597656, "global_step": 510683, "epoch": 3039} {"train_loss": -10.015172958374023, "global_step": 510684, "epoch": 3039} {"train_loss": -10.593301773071289, "global_step": 510685, "epoch": 3039} {"train_loss": -11.56728744506836, "global_step": 510686, "epoch": 3039} {"train_loss": -10.1065673828125, "global_step": 510687, "epoch": 3039} {"train_loss": -11.612967491149902, "global_step": 510688, "epoch": 3039} {"train_loss": -11.4855375289917, "global_step": 510689, "epoch": 3039} {"train_loss": -11.16214370727539, "global_step": 510690, "epoch": 3039} {"train_loss": -11.70079231262207, "global_step": 510691, "epoch": 3039} {"train_loss": -10.817707061767578, "global_step": 510692, "epoch": 3039} {"train_loss": -12.31159782409668, "global_step": 510693, "epoch": 3039} {"train_loss": -10.779165267944336, "global_step": 510694, "epoch": 3039} {"train_loss": -11.634977340698242, "global_step": 510695, "epoch": 3039} {"train_loss": -11.599998474121094, "global_step": 510696, "epoch": 3039} {"train_loss": -11.382898330688477, "global_step": 510697, "epoch": 3039} {"train_loss": -11.94036865234375, "global_step": 510698, "epoch": 3039} {"train_loss": -11.288124084472656, "global_step": 510699, "epoch": 3039} {"train_loss": -11.632582664489746, "global_step": 510700, "epoch": 3039} {"train_loss": -12.36462116241455, "global_step": 510701, "epoch": 3039} {"train_loss": -11.311570167541504, "global_step": 510702, "epoch": 3039} {"train_loss": -12.161903381347656, "global_step": 510703, "epoch": 3039} {"train_loss": -11.36092758178711, "global_step": 510704, "epoch": 3039} {"train_loss": -11.752617835998535, "global_step": 510705, "epoch": 3039} {"train_loss": -11.955562591552734, "global_step": 510706, "epoch": 3039} {"train_loss": -11.121774673461914, "global_step": 510707, "epoch": 3039} {"train_loss": -12.638432502746582, "global_step": 510708, "epoch": 3039} {"train_loss": -11.605649948120117, "global_step": 510709, "epoch": 3039} {"train_loss": -12.305394172668457, "global_step": 510710, "epoch": 3039} {"train_loss": -11.983077049255371, "global_step": 510711, "epoch": 3039} {"train_loss": -12.239007949829102, "global_step": 510712, "epoch": 3039} {"train_loss": -12.169422149658203, "global_step": 510713, "epoch": 3039} {"train_loss": -11.556720733642578, "global_step": 510714, "epoch": 3039} {"train_loss": -12.418363571166992, "global_step": 510715, "epoch": 3039} {"train_loss": -11.723478317260742, "global_step": 510716, "epoch": 3039} {"train_loss": -12.394942283630371, "global_step": 510717, "epoch": 3039} {"train_loss": -11.421791076660156, "global_step": 510718, "epoch": 3039} {"train_loss": -12.105424523353577, "global_step": 510719, "epoch": 3039, "val_loss": 318657.25} {"train_loss": -11.88592529296875, "global_step": 510720, "epoch": 3040} {"train_loss": -12.284438133239746, "global_step": 510721, "epoch": 3040} {"train_loss": -12.223502159118652, "global_step": 510722, "epoch": 3040} {"train_loss": -12.6470308303833, "global_step": 510723, "epoch": 3040} {"train_loss": -11.968122482299805, "global_step": 510724, "epoch": 3040} {"train_loss": -12.44485092163086, "global_step": 510725, "epoch": 3040} {"train_loss": -12.300467491149902, "global_step": 510726, "epoch": 3040} {"train_loss": -12.490821838378906, "global_step": 510727, "epoch": 3040} {"train_loss": -12.61201286315918, "global_step": 510728, "epoch": 3040} {"train_loss": -12.1881742477417, "global_step": 510729, "epoch": 3040} {"train_loss": -12.090932846069336, "global_step": 510730, "epoch": 3040} {"train_loss": -12.428287506103516, "global_step": 510731, "epoch": 3040} {"train_loss": -12.32339096069336, "global_step": 510732, "epoch": 3040} {"train_loss": -12.76002311706543, "global_step": 510733, "epoch": 3040} {"train_loss": -12.2833251953125, "global_step": 510734, "epoch": 3040} {"train_loss": -12.74207878112793, "global_step": 510735, "epoch": 3040} {"train_loss": -12.412897109985352, "global_step": 510736, "epoch": 3040} {"train_loss": -12.753442764282227, "global_step": 510737, "epoch": 3040} {"train_loss": -12.610138893127441, "global_step": 510738, "epoch": 3040} {"train_loss": -12.473831176757812, "global_step": 510739, "epoch": 3040} {"train_loss": -12.798906326293945, "global_step": 510740, "epoch": 3040} {"train_loss": -12.535982131958008, "global_step": 510741, "epoch": 3040} {"train_loss": -12.534957885742188, "global_step": 510742, "epoch": 3040} {"train_loss": -12.791553497314453, "global_step": 510743, "epoch": 3040} {"train_loss": -12.570968627929688, "global_step": 510744, "epoch": 3040} {"train_loss": -12.58967399597168, "global_step": 510745, "epoch": 3040} {"train_loss": -12.671775817871094, "global_step": 510746, "epoch": 3040} {"train_loss": -12.04562759399414, "global_step": 510747, "epoch": 3040} {"train_loss": -12.458820343017578, "global_step": 510748, "epoch": 3040} {"train_loss": -12.554604530334473, "global_step": 510749, "epoch": 3040} {"train_loss": -12.380474090576172, "global_step": 510750, "epoch": 3040} {"train_loss": -12.535106658935547, "global_step": 510751, "epoch": 3040} {"train_loss": -12.169012069702148, "global_step": 510752, "epoch": 3040} {"train_loss": -12.52863597869873, "global_step": 510753, "epoch": 3040} {"train_loss": -12.15523910522461, "global_step": 510754, "epoch": 3040} {"train_loss": -12.336503982543945, "global_step": 510755, "epoch": 3040} {"train_loss": -12.486581802368164, "global_step": 510756, "epoch": 3040} {"train_loss": -11.779376983642578, "global_step": 510757, "epoch": 3040} {"train_loss": -12.149198532104492, "global_step": 510758, "epoch": 3040} {"train_loss": -11.042535781860352, "global_step": 510759, "epoch": 3040} {"train_loss": -12.220398902893066, "global_step": 510760, "epoch": 3040} {"train_loss": -11.770162582397461, "global_step": 510761, "epoch": 3040} {"train_loss": -11.677968978881836, "global_step": 510762, "epoch": 3040} {"train_loss": -12.232257843017578, "global_step": 510763, "epoch": 3040} {"train_loss": -10.767542839050293, "global_step": 510764, "epoch": 3040} {"train_loss": -12.67033576965332, "global_step": 510765, "epoch": 3040} {"train_loss": -11.030174255371094, "global_step": 510766, "epoch": 3040} {"train_loss": -11.505977630615234, "global_step": 510767, "epoch": 3040} {"train_loss": -11.428731918334961, "global_step": 510768, "epoch": 3040} {"train_loss": -10.682079315185547, "global_step": 510769, "epoch": 3040} {"train_loss": -12.234606742858887, "global_step": 510770, "epoch": 3040} {"train_loss": -10.641276359558105, "global_step": 510771, "epoch": 3040} {"train_loss": -11.474523544311523, "global_step": 510772, "epoch": 3040} {"train_loss": -11.509734153747559, "global_step": 510773, "epoch": 3040} {"train_loss": -11.059192657470703, "global_step": 510774, "epoch": 3040} {"train_loss": -10.8507080078125, "global_step": 510775, "epoch": 3040} {"train_loss": -11.752525329589844, "global_step": 510776, "epoch": 3040} {"train_loss": -10.637125015258789, "global_step": 510777, "epoch": 3040} {"train_loss": -11.282994270324707, "global_step": 510778, "epoch": 3040} {"train_loss": -12.433025360107422, "global_step": 510779, "epoch": 3040} {"train_loss": -11.609399795532227, "global_step": 510780, "epoch": 3040} {"train_loss": -12.039113998413086, "global_step": 510781, "epoch": 3040} {"train_loss": -12.180207252502441, "global_step": 510782, "epoch": 3040} {"train_loss": -11.62336540222168, "global_step": 510783, "epoch": 3040} {"train_loss": -12.499723434448242, "global_step": 510784, "epoch": 3040} {"train_loss": -12.357114791870117, "global_step": 510785, "epoch": 3040} {"train_loss": -12.132425308227539, "global_step": 510786, "epoch": 3040} {"train_loss": -12.50249195098877, "global_step": 510787, "epoch": 3040} {"train_loss": -12.636638641357422, "global_step": 510788, "epoch": 3040} {"train_loss": -12.230055809020996, "global_step": 510789, "epoch": 3040} {"train_loss": -12.485511779785156, "global_step": 510790, "epoch": 3040} {"train_loss": -12.281696319580078, "global_step": 510791, "epoch": 3040} {"train_loss": -12.602731704711914, "global_step": 510792, "epoch": 3040} {"train_loss": -12.643888473510742, "global_step": 510793, "epoch": 3040} {"train_loss": -12.384536743164062, "global_step": 510794, "epoch": 3040} {"train_loss": -12.704407691955566, "global_step": 510795, "epoch": 3040} {"train_loss": -12.691068649291992, "global_step": 510796, "epoch": 3040} {"train_loss": -12.210216522216797, "global_step": 510797, "epoch": 3040} {"train_loss": -12.902912139892578, "global_step": 510798, "epoch": 3040} {"train_loss": -12.548870086669922, "global_step": 510799, "epoch": 3040} {"train_loss": -12.692461013793945, "global_step": 510800, "epoch": 3040} {"train_loss": -12.50897216796875, "global_step": 510801, "epoch": 3040} {"train_loss": -12.68423080444336, "global_step": 510802, "epoch": 3040} {"train_loss": -12.221639633178711, "global_step": 510803, "epoch": 3040} {"train_loss": -12.474159240722656, "global_step": 510804, "epoch": 3040} {"train_loss": -12.46390438079834, "global_step": 510805, "epoch": 3040} {"train_loss": -12.36026668548584, "global_step": 510806, "epoch": 3040} {"train_loss": -12.7225341796875, "global_step": 510807, "epoch": 3040} {"train_loss": -12.784479141235352, "global_step": 510808, "epoch": 3040} {"train_loss": -12.655721664428711, "global_step": 510809, "epoch": 3040} {"train_loss": -12.767236709594727, "global_step": 510810, "epoch": 3040} {"train_loss": -12.632701873779297, "global_step": 510811, "epoch": 3040} {"train_loss": -12.885438919067383, "global_step": 510812, "epoch": 3040} {"train_loss": -12.696051597595215, "global_step": 510813, "epoch": 3040} {"train_loss": -12.655320167541504, "global_step": 510814, "epoch": 3040} {"train_loss": -12.632594108581543, "global_step": 510815, "epoch": 3040} {"train_loss": -12.727191925048828, "global_step": 510816, "epoch": 3040} {"train_loss": -12.83857536315918, "global_step": 510817, "epoch": 3040} {"train_loss": -12.622204780578613, "global_step": 510818, "epoch": 3040} {"train_loss": -12.496438980102539, "global_step": 510819, "epoch": 3040} {"train_loss": -12.734291076660156, "global_step": 510820, "epoch": 3040} {"train_loss": -12.530364990234375, "global_step": 510821, "epoch": 3040} {"train_loss": -12.590956687927246, "global_step": 510822, "epoch": 3040} {"train_loss": -12.611037254333496, "global_step": 510823, "epoch": 3040} {"train_loss": -12.698380470275879, "global_step": 510824, "epoch": 3040} {"train_loss": -12.41429328918457, "global_step": 510825, "epoch": 3040} {"train_loss": -12.589515686035156, "global_step": 510826, "epoch": 3040} {"train_loss": -12.979450225830078, "global_step": 510827, "epoch": 3040} {"train_loss": -12.689884185791016, "global_step": 510828, "epoch": 3040} {"train_loss": -12.950279235839844, "global_step": 510829, "epoch": 3040} {"train_loss": -12.77829360961914, "global_step": 510830, "epoch": 3040} {"train_loss": -12.811083793640137, "global_step": 510831, "epoch": 3040} {"train_loss": -12.891971588134766, "global_step": 510832, "epoch": 3040} {"train_loss": -12.878108978271484, "global_step": 510833, "epoch": 3040} {"train_loss": -12.873956680297852, "global_step": 510834, "epoch": 3040} {"train_loss": -12.964200973510742, "global_step": 510835, "epoch": 3040} {"train_loss": -12.842000007629395, "global_step": 510836, "epoch": 3040} {"train_loss": -12.866564750671387, "global_step": 510837, "epoch": 3040} {"train_loss": -13.027393341064453, "global_step": 510838, "epoch": 3040} {"train_loss": -12.977119445800781, "global_step": 510839, "epoch": 3040} {"train_loss": -12.913446426391602, "global_step": 510840, "epoch": 3040} {"train_loss": -12.911011695861816, "global_step": 510841, "epoch": 3040} {"train_loss": -12.790817260742188, "global_step": 510842, "epoch": 3040} {"train_loss": -12.764924049377441, "global_step": 510843, "epoch": 3040} {"train_loss": -12.870573043823242, "global_step": 510844, "epoch": 3040} {"train_loss": -13.007752418518066, "global_step": 510845, "epoch": 3040} {"train_loss": -12.766288757324219, "global_step": 510846, "epoch": 3040} {"train_loss": -13.048670768737793, "global_step": 510847, "epoch": 3040} {"train_loss": -12.88843822479248, "global_step": 510848, "epoch": 3040} {"train_loss": -12.893460273742676, "global_step": 510849, "epoch": 3040} {"train_loss": -12.808111190795898, "global_step": 510850, "epoch": 3040} {"train_loss": -12.797821044921875, "global_step": 510851, "epoch": 3040} {"train_loss": -13.12022876739502, "global_step": 510852, "epoch": 3040} {"train_loss": -12.770954132080078, "global_step": 510853, "epoch": 3040} {"train_loss": -12.737842559814453, "global_step": 510854, "epoch": 3040} {"train_loss": -12.602267265319824, "global_step": 510855, "epoch": 3040} {"train_loss": -12.524827003479004, "global_step": 510856, "epoch": 3040} {"train_loss": -12.504377365112305, "global_step": 510857, "epoch": 3040} {"train_loss": -13.211227416992188, "global_step": 510858, "epoch": 3040} {"train_loss": -12.807286262512207, "global_step": 510859, "epoch": 3040} {"train_loss": -11.838233947753906, "global_step": 510860, "epoch": 3040} {"train_loss": -12.480758666992188, "global_step": 510861, "epoch": 3040} {"train_loss": -12.660974502563477, "global_step": 510862, "epoch": 3040} {"train_loss": -11.965028762817383, "global_step": 510863, "epoch": 3040} {"train_loss": -11.564412117004395, "global_step": 510864, "epoch": 3040} {"train_loss": -9.723871231079102, "global_step": 510865, "epoch": 3040} {"train_loss": -12.799566268920898, "global_step": 510866, "epoch": 3040} {"train_loss": -11.662820816040039, "global_step": 510867, "epoch": 3040} {"train_loss": -11.339970588684082, "global_step": 510868, "epoch": 3040} {"train_loss": -11.913661003112793, "global_step": 510869, "epoch": 3040} {"train_loss": -12.903982162475586, "global_step": 510870, "epoch": 3040} {"train_loss": -12.27756118774414, "global_step": 510871, "epoch": 3040} {"train_loss": -12.14077377319336, "global_step": 510872, "epoch": 3040} {"train_loss": -12.261536598205566, "global_step": 510873, "epoch": 3040} {"train_loss": -12.012445449829102, "global_step": 510874, "epoch": 3040} {"train_loss": -12.290933609008789, "global_step": 510875, "epoch": 3040} {"train_loss": -12.571017265319824, "global_step": 510876, "epoch": 3040} {"train_loss": -12.202507972717285, "global_step": 510877, "epoch": 3040} {"train_loss": -11.051191329956055, "global_step": 510878, "epoch": 3040} {"train_loss": -10.567679405212402, "global_step": 510879, "epoch": 3040} {"train_loss": -12.699965476989746, "global_step": 510880, "epoch": 3040} {"train_loss": -12.123313903808594, "global_step": 510881, "epoch": 3040} {"train_loss": -12.300407409667969, "global_step": 510882, "epoch": 3040} {"train_loss": -12.641704559326172, "global_step": 510883, "epoch": 3040} {"train_loss": -12.338991165161133, "global_step": 510884, "epoch": 3040} {"train_loss": -11.590715408325195, "global_step": 510885, "epoch": 3040} {"train_loss": -12.125640869140625, "global_step": 510886, "epoch": 3040} {"train_loss": -12.344751534007845, "global_step": 510887, "epoch": 3040, "val_loss": 314213.75, "train_action_mse_error": 1.3853096961975098} {"train_loss": -12.253745079040527, "global_step": 510888, "epoch": 3041} {"train_loss": -12.549182891845703, "global_step": 510889, "epoch": 3041} {"train_loss": -12.570084571838379, "global_step": 510890, "epoch": 3041} {"train_loss": -12.369112014770508, "global_step": 510891, "epoch": 3041} {"train_loss": -12.16553020477295, "global_step": 510892, "epoch": 3041} {"train_loss": -12.740829467773438, "global_step": 510893, "epoch": 3041} {"train_loss": -12.183873176574707, "global_step": 510894, "epoch": 3041} {"train_loss": -11.759448051452637, "global_step": 510895, "epoch": 3041} {"train_loss": -12.856311798095703, "global_step": 510896, "epoch": 3041} {"train_loss": -12.000212669372559, "global_step": 510897, "epoch": 3041} {"train_loss": -12.577871322631836, "global_step": 510898, "epoch": 3041} {"train_loss": -12.817574501037598, "global_step": 510899, "epoch": 3041} {"train_loss": -12.620595932006836, "global_step": 510900, "epoch": 3041} {"train_loss": -12.433349609375, "global_step": 510901, "epoch": 3041} {"train_loss": -12.827581405639648, "global_step": 510902, "epoch": 3041} {"train_loss": -12.317140579223633, "global_step": 510903, "epoch": 3041} {"train_loss": -12.157197952270508, "global_step": 510904, "epoch": 3041} {"train_loss": -12.701555252075195, "global_step": 510905, "epoch": 3041} {"train_loss": -12.620975494384766, "global_step": 510906, "epoch": 3041} {"train_loss": -12.295770645141602, "global_step": 510907, "epoch": 3041} {"train_loss": -12.725055694580078, "global_step": 510908, "epoch": 3041} {"train_loss": -11.942251205444336, "global_step": 510909, "epoch": 3041} {"train_loss": -11.514549255371094, "global_step": 510910, "epoch": 3041} {"train_loss": -12.623226165771484, "global_step": 510911, "epoch": 3041} {"train_loss": -11.970797538757324, "global_step": 510912, "epoch": 3041} {"train_loss": -12.125248908996582, "global_step": 510913, "epoch": 3041} {"train_loss": -12.465296745300293, "global_step": 510914, "epoch": 3041} {"train_loss": -12.367218971252441, "global_step": 510915, "epoch": 3041} {"train_loss": -12.541024208068848, "global_step": 510916, "epoch": 3041} {"train_loss": -12.528550148010254, "global_step": 510917, "epoch": 3041} {"train_loss": -12.647239685058594, "global_step": 510918, "epoch": 3041} {"train_loss": -12.53005599975586, "global_step": 510919, "epoch": 3041} {"train_loss": -12.394996643066406, "global_step": 510920, "epoch": 3041} {"train_loss": -12.667154312133789, "global_step": 510921, "epoch": 3041} {"train_loss": -12.393033027648926, "global_step": 510922, "epoch": 3041} {"train_loss": -12.352960586547852, "global_step": 510923, "epoch": 3041} {"train_loss": -12.690622329711914, "global_step": 510924, "epoch": 3041} {"train_loss": -12.861672401428223, "global_step": 510925, "epoch": 3041} {"train_loss": -12.62551212310791, "global_step": 510926, "epoch": 3041} {"train_loss": -12.896728515625, "global_step": 510927, "epoch": 3041} {"train_loss": -12.657954216003418, "global_step": 510928, "epoch": 3041} {"train_loss": -12.364456176757812, "global_step": 510929, "epoch": 3041} {"train_loss": -12.56397533416748, "global_step": 510930, "epoch": 3041} {"train_loss": -12.542696952819824, "global_step": 510931, "epoch": 3041} {"train_loss": -12.427724838256836, "global_step": 510932, "epoch": 3041} {"train_loss": -12.65556526184082, "global_step": 510933, "epoch": 3041} {"train_loss": -12.767675399780273, "global_step": 510934, "epoch": 3041} {"train_loss": -12.142375946044922, "global_step": 510935, "epoch": 3041} {"train_loss": -12.628166198730469, "global_step": 510936, "epoch": 3041} {"train_loss": -12.428047180175781, "global_step": 510937, "epoch": 3041} {"train_loss": -12.324856758117676, "global_step": 510938, "epoch": 3041} {"train_loss": -12.771677017211914, "global_step": 510939, "epoch": 3041} {"train_loss": -11.716512680053711, "global_step": 510940, "epoch": 3041} {"train_loss": -12.57269287109375, "global_step": 510941, "epoch": 3041} {"train_loss": -12.686239242553711, "global_step": 510942, "epoch": 3041} {"train_loss": -12.468017578125, "global_step": 510943, "epoch": 3041} {"train_loss": -12.462031364440918, "global_step": 510944, "epoch": 3041} {"train_loss": -12.943617820739746, "global_step": 510945, "epoch": 3041} {"train_loss": -12.36823844909668, "global_step": 510946, "epoch": 3041} {"train_loss": -12.484688758850098, "global_step": 510947, "epoch": 3041} {"train_loss": -12.637441635131836, "global_step": 510948, "epoch": 3041} {"train_loss": -12.674768447875977, "global_step": 510949, "epoch": 3041} {"train_loss": -12.757755279541016, "global_step": 510950, "epoch": 3041} {"train_loss": -12.956915855407715, "global_step": 510951, "epoch": 3041} {"train_loss": -12.408650398254395, "global_step": 510952, "epoch": 3041} {"train_loss": -12.839676856994629, "global_step": 510953, "epoch": 3041} {"train_loss": -12.611173629760742, "global_step": 510954, "epoch": 3041} {"train_loss": -12.934412956237793, "global_step": 510955, "epoch": 3041} {"train_loss": -12.929634094238281, "global_step": 510956, "epoch": 3041} {"train_loss": -12.283207893371582, "global_step": 510957, "epoch": 3041} {"train_loss": -12.722772598266602, "global_step": 510958, "epoch": 3041} {"train_loss": -12.627252578735352, "global_step": 510959, "epoch": 3041} {"train_loss": -12.645731925964355, "global_step": 510960, "epoch": 3041} {"train_loss": -13.040984153747559, "global_step": 510961, "epoch": 3041} {"train_loss": -12.737316131591797, "global_step": 510962, "epoch": 3041} {"train_loss": -12.682588577270508, "global_step": 510963, "epoch": 3041} {"train_loss": -12.482954025268555, "global_step": 510964, "epoch": 3041} {"train_loss": -11.989944458007812, "global_step": 510965, "epoch": 3041} {"train_loss": -12.594985961914062, "global_step": 510966, "epoch": 3041} {"train_loss": -13.029918670654297, "global_step": 510967, "epoch": 3041} {"train_loss": -12.331524848937988, "global_step": 510968, "epoch": 3041} {"train_loss": -12.991408348083496, "global_step": 510969, "epoch": 3041} {"train_loss": -12.546392440795898, "global_step": 510970, "epoch": 3041} {"train_loss": -12.786441802978516, "global_step": 510971, "epoch": 3041} {"train_loss": -12.874765396118164, "global_step": 510972, "epoch": 3041} {"train_loss": -12.538273811340332, "global_step": 510973, "epoch": 3041} {"train_loss": -12.618648529052734, "global_step": 510974, "epoch": 3041} {"train_loss": -12.804433822631836, "global_step": 510975, "epoch": 3041} {"train_loss": -11.96529769897461, "global_step": 510976, "epoch": 3041} {"train_loss": -12.517910957336426, "global_step": 510977, "epoch": 3041} {"train_loss": -12.62305736541748, "global_step": 510978, "epoch": 3041} {"train_loss": -12.033824920654297, "global_step": 510979, "epoch": 3041} {"train_loss": -12.554302215576172, "global_step": 510980, "epoch": 3041} {"train_loss": -11.916778564453125, "global_step": 510981, "epoch": 3041} {"train_loss": -12.317876815795898, "global_step": 510982, "epoch": 3041} {"train_loss": -11.827581405639648, "global_step": 510983, "epoch": 3041} {"train_loss": -12.499683380126953, "global_step": 510984, "epoch": 3041} {"train_loss": -11.50487995147705, "global_step": 510985, "epoch": 3041} {"train_loss": -11.893453598022461, "global_step": 510986, "epoch": 3041} {"train_loss": -12.233831405639648, "global_step": 510987, "epoch": 3041} {"train_loss": -12.523124694824219, "global_step": 510988, "epoch": 3041} {"train_loss": -11.990161895751953, "global_step": 510989, "epoch": 3041} {"train_loss": -12.5392484664917, "global_step": 510990, "epoch": 3041} {"train_loss": -10.314531326293945, "global_step": 510991, "epoch": 3041} {"train_loss": -12.258852005004883, "global_step": 510992, "epoch": 3041} {"train_loss": -11.360837936401367, "global_step": 510993, "epoch": 3041} {"train_loss": -11.936553001403809, "global_step": 510994, "epoch": 3041} {"train_loss": -11.953327178955078, "global_step": 510995, "epoch": 3041} {"train_loss": -11.061871528625488, "global_step": 510996, "epoch": 3041} {"train_loss": -12.046965599060059, "global_step": 510997, "epoch": 3041} {"train_loss": -11.205731391906738, "global_step": 510998, "epoch": 3041} {"train_loss": -11.357439994812012, "global_step": 510999, "epoch": 3041} {"train_loss": -11.579788208007812, "global_step": 511000, "epoch": 3041} {"train_loss": -10.761520385742188, "global_step": 511001, "epoch": 3041} {"train_loss": -11.163976669311523, "global_step": 511002, "epoch": 3041} {"train_loss": -11.031954765319824, "global_step": 511003, "epoch": 3041} {"train_loss": -11.930032730102539, "global_step": 511004, "epoch": 3041} {"train_loss": -12.012073516845703, "global_step": 511005, "epoch": 3041} {"train_loss": -10.18226432800293, "global_step": 511006, "epoch": 3041} {"train_loss": -12.163497924804688, "global_step": 511007, "epoch": 3041} {"train_loss": -9.888334274291992, "global_step": 511008, "epoch": 3041} {"train_loss": -12.119241714477539, "global_step": 511009, "epoch": 3041} {"train_loss": -11.371379852294922, "global_step": 511010, "epoch": 3041} {"train_loss": -10.258703231811523, "global_step": 511011, "epoch": 3041} {"train_loss": -12.223627090454102, "global_step": 511012, "epoch": 3041} {"train_loss": -8.827213287353516, "global_step": 511013, "epoch": 3041} {"train_loss": -12.124709129333496, "global_step": 511014, "epoch": 3041} {"train_loss": -10.185964584350586, "global_step": 511015, "epoch": 3041} {"train_loss": -10.903985977172852, "global_step": 511016, "epoch": 3041} {"train_loss": -9.508378982543945, "global_step": 511017, "epoch": 3041} {"train_loss": -11.164408683776855, "global_step": 511018, "epoch": 3041} {"train_loss": -10.911210060119629, "global_step": 511019, "epoch": 3041} {"train_loss": -11.078187942504883, "global_step": 511020, "epoch": 3041} {"train_loss": -10.523719787597656, "global_step": 511021, "epoch": 3041} {"train_loss": -11.599821090698242, "global_step": 511022, "epoch": 3041} {"train_loss": -10.342968940734863, "global_step": 511023, "epoch": 3041} {"train_loss": -11.419527053833008, "global_step": 511024, "epoch": 3041} {"train_loss": -11.139167785644531, "global_step": 511025, "epoch": 3041} {"train_loss": -12.178821563720703, "global_step": 511026, "epoch": 3041} {"train_loss": -11.575542449951172, "global_step": 511027, "epoch": 3041} {"train_loss": -11.491608619689941, "global_step": 511028, "epoch": 3041} {"train_loss": -11.454051971435547, "global_step": 511029, "epoch": 3041} {"train_loss": -11.726272583007812, "global_step": 511030, "epoch": 3041} {"train_loss": -11.180624961853027, "global_step": 511031, "epoch": 3041} {"train_loss": -11.658281326293945, "global_step": 511032, "epoch": 3041} {"train_loss": -11.164566040039062, "global_step": 511033, "epoch": 3041} {"train_loss": -11.136394500732422, "global_step": 511034, "epoch": 3041} {"train_loss": -11.995609283447266, "global_step": 511035, "epoch": 3041} {"train_loss": -11.616732597351074, "global_step": 511036, "epoch": 3041} {"train_loss": -12.30724811553955, "global_step": 511037, "epoch": 3041} {"train_loss": -11.758829116821289, "global_step": 511038, "epoch": 3041} {"train_loss": -12.30447006225586, "global_step": 511039, "epoch": 3041} {"train_loss": -11.665653228759766, "global_step": 511040, "epoch": 3041} {"train_loss": -12.684309005737305, "global_step": 511041, "epoch": 3041} {"train_loss": -12.11960220336914, "global_step": 511042, "epoch": 3041} {"train_loss": -12.412803649902344, "global_step": 511043, "epoch": 3041} {"train_loss": -11.704435348510742, "global_step": 511044, "epoch": 3041} {"train_loss": -12.196006774902344, "global_step": 511045, "epoch": 3041} {"train_loss": -12.319889068603516, "global_step": 511046, "epoch": 3041} {"train_loss": -11.996837615966797, "global_step": 511047, "epoch": 3041} {"train_loss": -12.108160018920898, "global_step": 511048, "epoch": 3041} {"train_loss": -12.08655834197998, "global_step": 511049, "epoch": 3041} {"train_loss": -12.15283203125, "global_step": 511050, "epoch": 3041} {"train_loss": -12.175813674926758, "global_step": 511051, "epoch": 3041} {"train_loss": -12.20782470703125, "global_step": 511052, "epoch": 3041} {"train_loss": -11.99758243560791, "global_step": 511053, "epoch": 3041} {"train_loss": -12.341004371643066, "global_step": 511054, "epoch": 3041} {"train_loss": -12.102799869719005, "global_step": 511055, "epoch": 3041, "val_loss": 320252.6875} {"train_loss": -12.330118179321289, "global_step": 511056, "epoch": 3042} {"train_loss": -12.312801361083984, "global_step": 511057, "epoch": 3042} {"train_loss": -12.102163314819336, "global_step": 511058, "epoch": 3042} {"train_loss": -12.034732818603516, "global_step": 511059, "epoch": 3042} {"train_loss": -12.23141860961914, "global_step": 511060, "epoch": 3042} {"train_loss": -12.105008125305176, "global_step": 511061, "epoch": 3042} {"train_loss": -12.321186065673828, "global_step": 511062, "epoch": 3042} {"train_loss": -12.579183578491211, "global_step": 511063, "epoch": 3042} {"train_loss": -12.32595443725586, "global_step": 511064, "epoch": 3042} {"train_loss": -12.369596481323242, "global_step": 511065, "epoch": 3042} {"train_loss": -12.624746322631836, "global_step": 511066, "epoch": 3042} {"train_loss": -12.564499855041504, "global_step": 511067, "epoch": 3042} {"train_loss": -12.416145324707031, "global_step": 511068, "epoch": 3042} {"train_loss": -12.512441635131836, "global_step": 511069, "epoch": 3042} {"train_loss": -12.16379165649414, "global_step": 511070, "epoch": 3042} {"train_loss": -12.502853393554688, "global_step": 511071, "epoch": 3042} {"train_loss": -12.462955474853516, "global_step": 511072, "epoch": 3042} {"train_loss": -12.541858673095703, "global_step": 511073, "epoch": 3042} {"train_loss": -12.500900268554688, "global_step": 511074, "epoch": 3042} {"train_loss": -12.589948654174805, "global_step": 511075, "epoch": 3042} {"train_loss": -12.718360900878906, "global_step": 511076, "epoch": 3042} {"train_loss": -12.775888442993164, "global_step": 511077, "epoch": 3042} {"train_loss": -12.356971740722656, "global_step": 511078, "epoch": 3042} {"train_loss": -12.500658988952637, "global_step": 511079, "epoch": 3042} {"train_loss": -12.788042068481445, "global_step": 511080, "epoch": 3042} {"train_loss": -12.545690536499023, "global_step": 511081, "epoch": 3042} {"train_loss": -12.556831359863281, "global_step": 511082, "epoch": 3042} {"train_loss": -12.739303588867188, "global_step": 511083, "epoch": 3042} {"train_loss": -12.535894393920898, "global_step": 511084, "epoch": 3042} {"train_loss": -12.604350090026855, "global_step": 511085, "epoch": 3042} {"train_loss": -12.71884536743164, "global_step": 511086, "epoch": 3042} {"train_loss": -12.709182739257812, "global_step": 511087, "epoch": 3042} {"train_loss": -12.721515655517578, "global_step": 511088, "epoch": 3042} {"train_loss": -12.867002487182617, "global_step": 511089, "epoch": 3042} {"train_loss": -12.148054122924805, "global_step": 511090, "epoch": 3042} {"train_loss": -12.408432960510254, "global_step": 511091, "epoch": 3042} {"train_loss": -12.349996566772461, "global_step": 511092, "epoch": 3042} {"train_loss": -12.650747299194336, "global_step": 511093, "epoch": 3042} {"train_loss": -12.592552185058594, "global_step": 511094, "epoch": 3042} {"train_loss": -12.910665512084961, "global_step": 511095, "epoch": 3042} {"train_loss": -12.404363632202148, "global_step": 511096, "epoch": 3042} {"train_loss": -12.772516250610352, "global_step": 511097, "epoch": 3042} {"train_loss": -12.668964385986328, "global_step": 511098, "epoch": 3042} {"train_loss": -12.609678268432617, "global_step": 511099, "epoch": 3042} {"train_loss": -12.56103801727295, "global_step": 511100, "epoch": 3042} {"train_loss": -12.97201919555664, "global_step": 511101, "epoch": 3042} {"train_loss": -12.746088027954102, "global_step": 511102, "epoch": 3042} {"train_loss": -12.640403747558594, "global_step": 511103, "epoch": 3042} {"train_loss": -12.799407958984375, "global_step": 511104, "epoch": 3042} {"train_loss": -12.712735176086426, "global_step": 511105, "epoch": 3042} {"train_loss": -13.059913635253906, "global_step": 511106, "epoch": 3042} {"train_loss": -12.797598838806152, "global_step": 511107, "epoch": 3042} {"train_loss": -12.806987762451172, "global_step": 511108, "epoch": 3042} {"train_loss": -12.80572509765625, "global_step": 511109, "epoch": 3042} {"train_loss": -12.677657127380371, "global_step": 511110, "epoch": 3042} {"train_loss": -13.089735984802246, "global_step": 511111, "epoch": 3042} {"train_loss": -12.621452331542969, "global_step": 511112, "epoch": 3042} {"train_loss": -12.711912155151367, "global_step": 511113, "epoch": 3042} {"train_loss": -12.629767417907715, "global_step": 511114, "epoch": 3042} {"train_loss": -12.970144271850586, "global_step": 511115, "epoch": 3042} {"train_loss": -12.46709156036377, "global_step": 511116, "epoch": 3042} {"train_loss": -12.651880264282227, "global_step": 511117, "epoch": 3042} {"train_loss": -13.065494537353516, "global_step": 511118, "epoch": 3042} {"train_loss": -12.559776306152344, "global_step": 511119, "epoch": 3042} {"train_loss": -12.735246658325195, "global_step": 511120, "epoch": 3042} {"train_loss": -12.745494842529297, "global_step": 511121, "epoch": 3042} {"train_loss": -12.945852279663086, "global_step": 511122, "epoch": 3042} {"train_loss": -12.591890335083008, "global_step": 511123, "epoch": 3042} {"train_loss": -12.757434844970703, "global_step": 511124, "epoch": 3042} {"train_loss": -12.996611595153809, "global_step": 511125, "epoch": 3042} {"train_loss": -12.891887664794922, "global_step": 511126, "epoch": 3042} {"train_loss": -13.006022453308105, "global_step": 511127, "epoch": 3042} {"train_loss": -12.59199333190918, "global_step": 511128, "epoch": 3042} {"train_loss": -12.775594711303711, "global_step": 511129, "epoch": 3042} {"train_loss": -12.970403671264648, "global_step": 511130, "epoch": 3042} {"train_loss": -12.275150299072266, "global_step": 511131, "epoch": 3042} {"train_loss": -12.028608322143555, "global_step": 511132, "epoch": 3042} {"train_loss": -12.276315689086914, "global_step": 511133, "epoch": 3042} {"train_loss": -12.793197631835938, "global_step": 511134, "epoch": 3042} {"train_loss": -11.547633171081543, "global_step": 511135, "epoch": 3042} {"train_loss": -11.038543701171875, "global_step": 511136, "epoch": 3042} {"train_loss": -11.618306159973145, "global_step": 511137, "epoch": 3042} {"train_loss": -12.449195861816406, "global_step": 511138, "epoch": 3042} {"train_loss": -10.851015090942383, "global_step": 511139, "epoch": 3042} {"train_loss": -11.672801971435547, "global_step": 511140, "epoch": 3042} {"train_loss": -9.771148681640625, "global_step": 511141, "epoch": 3042} {"train_loss": -9.851329803466797, "global_step": 511142, "epoch": 3042} {"train_loss": -9.385468482971191, "global_step": 511143, "epoch": 3042} {"train_loss": -9.739898681640625, "global_step": 511144, "epoch": 3042} {"train_loss": -10.455085754394531, "global_step": 511145, "epoch": 3042} {"train_loss": -10.433553695678711, "global_step": 511146, "epoch": 3042} {"train_loss": -9.91086196899414, "global_step": 511147, "epoch": 3042} {"train_loss": -10.717411994934082, "global_step": 511148, "epoch": 3042} {"train_loss": -10.27186107635498, "global_step": 511149, "epoch": 3042} {"train_loss": -11.301313400268555, "global_step": 511150, "epoch": 3042} {"train_loss": -10.440670013427734, "global_step": 511151, "epoch": 3042} {"train_loss": -10.642858505249023, "global_step": 511152, "epoch": 3042} {"train_loss": -11.298639297485352, "global_step": 511153, "epoch": 3042} {"train_loss": -9.963363647460938, "global_step": 511154, "epoch": 3042} {"train_loss": -11.658842086791992, "global_step": 511155, "epoch": 3042} {"train_loss": -10.014952659606934, "global_step": 511156, "epoch": 3042} {"train_loss": -12.12126350402832, "global_step": 511157, "epoch": 3042} {"train_loss": -11.469099998474121, "global_step": 511158, "epoch": 3042} {"train_loss": -11.959312438964844, "global_step": 511159, "epoch": 3042} {"train_loss": -11.042808532714844, "global_step": 511160, "epoch": 3042} {"train_loss": -11.677970886230469, "global_step": 511161, "epoch": 3042} {"train_loss": -10.76910400390625, "global_step": 511162, "epoch": 3042} {"train_loss": -12.345022201538086, "global_step": 511163, "epoch": 3042} {"train_loss": -11.188214302062988, "global_step": 511164, "epoch": 3042} {"train_loss": -11.781364440917969, "global_step": 511165, "epoch": 3042} {"train_loss": -12.397575378417969, "global_step": 511166, "epoch": 3042} {"train_loss": -11.16471004486084, "global_step": 511167, "epoch": 3042} {"train_loss": -12.304121017456055, "global_step": 511168, "epoch": 3042} {"train_loss": -11.40682601928711, "global_step": 511169, "epoch": 3042} {"train_loss": -11.938230514526367, "global_step": 511170, "epoch": 3042} {"train_loss": -11.540760040283203, "global_step": 511171, "epoch": 3042} {"train_loss": -12.21771240234375, "global_step": 511172, "epoch": 3042} {"train_loss": -11.573663711547852, "global_step": 511173, "epoch": 3042} {"train_loss": -12.455476760864258, "global_step": 511174, "epoch": 3042} {"train_loss": -12.416722297668457, "global_step": 511175, "epoch": 3042} {"train_loss": -12.545141220092773, "global_step": 511176, "epoch": 3042} {"train_loss": -12.206886291503906, "global_step": 511177, "epoch": 3042} {"train_loss": -12.108132362365723, "global_step": 511178, "epoch": 3042} {"train_loss": -12.4434814453125, "global_step": 511179, "epoch": 3042} {"train_loss": -11.835977554321289, "global_step": 511180, "epoch": 3042} {"train_loss": -12.398080825805664, "global_step": 511181, "epoch": 3042} {"train_loss": -11.929530143737793, "global_step": 511182, "epoch": 3042} {"train_loss": -12.235699653625488, "global_step": 511183, "epoch": 3042} {"train_loss": -11.91646671295166, "global_step": 511184, "epoch": 3042} {"train_loss": -11.837854385375977, "global_step": 511185, "epoch": 3042} {"train_loss": -12.232630729675293, "global_step": 511186, "epoch": 3042} {"train_loss": -12.30878734588623, "global_step": 511187, "epoch": 3042} {"train_loss": -12.278287887573242, "global_step": 511188, "epoch": 3042} {"train_loss": -12.345675468444824, "global_step": 511189, "epoch": 3042} {"train_loss": -12.343473434448242, "global_step": 511190, "epoch": 3042} {"train_loss": -12.469098091125488, "global_step": 511191, "epoch": 3042} {"train_loss": -12.29145622253418, "global_step": 511192, "epoch": 3042} {"train_loss": -12.704862594604492, "global_step": 511193, "epoch": 3042} {"train_loss": -12.365925788879395, "global_step": 511194, "epoch": 3042} {"train_loss": -12.60468864440918, "global_step": 511195, "epoch": 3042} {"train_loss": -12.543457984924316, "global_step": 511196, "epoch": 3042} {"train_loss": -12.604415893554688, "global_step": 511197, "epoch": 3042} {"train_loss": -12.41227912902832, "global_step": 511198, "epoch": 3042} {"train_loss": -12.337747573852539, "global_step": 511199, "epoch": 3042} {"train_loss": -12.532179832458496, "global_step": 511200, "epoch": 3042} {"train_loss": -12.711984634399414, "global_step": 511201, "epoch": 3042} {"train_loss": -12.737883567810059, "global_step": 511202, "epoch": 3042} {"train_loss": -12.534725189208984, "global_step": 511203, "epoch": 3042} {"train_loss": -12.560550689697266, "global_step": 511204, "epoch": 3042} {"train_loss": -12.623896598815918, "global_step": 511205, "epoch": 3042} {"train_loss": -12.710393905639648, "global_step": 511206, "epoch": 3042} {"train_loss": -12.691568374633789, "global_step": 511207, "epoch": 3042} {"train_loss": -12.537344932556152, "global_step": 511208, "epoch": 3042} {"train_loss": -12.333642959594727, "global_step": 511209, "epoch": 3042} {"train_loss": -12.353323936462402, "global_step": 511210, "epoch": 3042} {"train_loss": -12.667815208435059, "global_step": 511211, "epoch": 3042} {"train_loss": -12.53178596496582, "global_step": 511212, "epoch": 3042} {"train_loss": -12.702383041381836, "global_step": 511213, "epoch": 3042} {"train_loss": -12.651342391967773, "global_step": 511214, "epoch": 3042} {"train_loss": -12.730239868164062, "global_step": 511215, "epoch": 3042} {"train_loss": -12.75333023071289, "global_step": 511216, "epoch": 3042} {"train_loss": -12.943303108215332, "global_step": 511217, "epoch": 3042} {"train_loss": -12.547651290893555, "global_step": 511218, "epoch": 3042} {"train_loss": -12.572263717651367, "global_step": 511219, "epoch": 3042} {"train_loss": -12.609598159790039, "global_step": 511220, "epoch": 3042} {"train_loss": -12.571271896362305, "global_step": 511221, "epoch": 3042} {"train_loss": -12.662242889404297, "global_step": 511222, "epoch": 3042} {"train_loss": -12.22151213600522, "global_step": 511223, "epoch": 3042, "val_loss": 317126.78125} {"train_loss": -12.835522651672363, "global_step": 511224, "epoch": 3043} {"train_loss": -12.86117172241211, "global_step": 511225, "epoch": 3043} {"train_loss": -12.84048843383789, "global_step": 511226, "epoch": 3043} {"train_loss": -12.829835891723633, "global_step": 511227, "epoch": 3043} {"train_loss": -12.895671844482422, "global_step": 511228, "epoch": 3043} {"train_loss": -12.900074005126953, "global_step": 511229, "epoch": 3043} {"train_loss": -12.715121269226074, "global_step": 511230, "epoch": 3043} {"train_loss": -12.675050735473633, "global_step": 511231, "epoch": 3043} {"train_loss": -12.971435546875, "global_step": 511232, "epoch": 3043} {"train_loss": -12.731922149658203, "global_step": 511233, "epoch": 3043} {"train_loss": -12.824676513671875, "global_step": 511234, "epoch": 3043} {"train_loss": -13.029404640197754, "global_step": 511235, "epoch": 3043} {"train_loss": -13.050209045410156, "global_step": 511236, "epoch": 3043} {"train_loss": -12.615808486938477, "global_step": 511237, "epoch": 3043} {"train_loss": -12.881830215454102, "global_step": 511238, "epoch": 3043} {"train_loss": -12.46274185180664, "global_step": 511239, "epoch": 3043} {"train_loss": -12.98109245300293, "global_step": 511240, "epoch": 3043} {"train_loss": -12.813112258911133, "global_step": 511241, "epoch": 3043} {"train_loss": -12.630941390991211, "global_step": 511242, "epoch": 3043} {"train_loss": -12.882122039794922, "global_step": 511243, "epoch": 3043} {"train_loss": -12.95958137512207, "global_step": 511244, "epoch": 3043} {"train_loss": -12.658763885498047, "global_step": 511245, "epoch": 3043} {"train_loss": -12.98317813873291, "global_step": 511246, "epoch": 3043} {"train_loss": -12.848592758178711, "global_step": 511247, "epoch": 3043} {"train_loss": -12.662808418273926, "global_step": 511248, "epoch": 3043} {"train_loss": -12.865619659423828, "global_step": 511249, "epoch": 3043} {"train_loss": -12.708171844482422, "global_step": 511250, "epoch": 3043} {"train_loss": -12.923858642578125, "global_step": 511251, "epoch": 3043} {"train_loss": -12.874288558959961, "global_step": 511252, "epoch": 3043} {"train_loss": -12.924816131591797, "global_step": 511253, "epoch": 3043} {"train_loss": -12.859769821166992, "global_step": 511254, "epoch": 3043} {"train_loss": -12.862386703491211, "global_step": 511255, "epoch": 3043} {"train_loss": -12.894697189331055, "global_step": 511256, "epoch": 3043} {"train_loss": -13.118072509765625, "global_step": 511257, "epoch": 3043} {"train_loss": -12.89731502532959, "global_step": 511258, "epoch": 3043} {"train_loss": -13.124711990356445, "global_step": 511259, "epoch": 3043} {"train_loss": -12.74427604675293, "global_step": 511260, "epoch": 3043} {"train_loss": -12.978882789611816, "global_step": 511261, "epoch": 3043} {"train_loss": -12.38810920715332, "global_step": 511262, "epoch": 3043} {"train_loss": -12.80820369720459, "global_step": 511263, "epoch": 3043} {"train_loss": -12.677946090698242, "global_step": 511264, "epoch": 3043} {"train_loss": -12.52182388305664, "global_step": 511265, "epoch": 3043} {"train_loss": -12.766399383544922, "global_step": 511266, "epoch": 3043} {"train_loss": -12.699323654174805, "global_step": 511267, "epoch": 3043} {"train_loss": -12.73716926574707, "global_step": 511268, "epoch": 3043} {"train_loss": -13.086380004882812, "global_step": 511269, "epoch": 3043} {"train_loss": -12.56054973602295, "global_step": 511270, "epoch": 3043} {"train_loss": -12.403647422790527, "global_step": 511271, "epoch": 3043} {"train_loss": -12.413135528564453, "global_step": 511272, "epoch": 3043} {"train_loss": -13.053735733032227, "global_step": 511273, "epoch": 3043} {"train_loss": -12.068042755126953, "global_step": 511274, "epoch": 3043} {"train_loss": -12.713417053222656, "global_step": 511275, "epoch": 3043} {"train_loss": -12.707905769348145, "global_step": 511276, "epoch": 3043} {"train_loss": -12.219379425048828, "global_step": 511277, "epoch": 3043} {"train_loss": -12.512300491333008, "global_step": 511278, "epoch": 3043} {"train_loss": -12.808049201965332, "global_step": 511279, "epoch": 3043} {"train_loss": -12.86617374420166, "global_step": 511280, "epoch": 3043} {"train_loss": -12.212201118469238, "global_step": 511281, "epoch": 3043} {"train_loss": -12.90117073059082, "global_step": 511282, "epoch": 3043} {"train_loss": -12.564399719238281, "global_step": 511283, "epoch": 3043} {"train_loss": -11.848260879516602, "global_step": 511284, "epoch": 3043} {"train_loss": -12.504629135131836, "global_step": 511285, "epoch": 3043} {"train_loss": -12.87326431274414, "global_step": 511286, "epoch": 3043} {"train_loss": -12.347951889038086, "global_step": 511287, "epoch": 3043} {"train_loss": -12.271363258361816, "global_step": 511288, "epoch": 3043} {"train_loss": -12.71977424621582, "global_step": 511289, "epoch": 3043} {"train_loss": -12.761059761047363, "global_step": 511290, "epoch": 3043} {"train_loss": -12.720144271850586, "global_step": 511291, "epoch": 3043} {"train_loss": -12.794644355773926, "global_step": 511292, "epoch": 3043} {"train_loss": -12.902860641479492, "global_step": 511293, "epoch": 3043} {"train_loss": -12.186880111694336, "global_step": 511294, "epoch": 3043} {"train_loss": -12.367424011230469, "global_step": 511295, "epoch": 3043} {"train_loss": -12.77745246887207, "global_step": 511296, "epoch": 3043} {"train_loss": -12.338911056518555, "global_step": 511297, "epoch": 3043} {"train_loss": -11.530797958374023, "global_step": 511298, "epoch": 3043} {"train_loss": -12.336359977722168, "global_step": 511299, "epoch": 3043} {"train_loss": -12.645044326782227, "global_step": 511300, "epoch": 3043} {"train_loss": -12.123544692993164, "global_step": 511301, "epoch": 3043} {"train_loss": -12.278606414794922, "global_step": 511302, "epoch": 3043} {"train_loss": -12.72876262664795, "global_step": 511303, "epoch": 3043} {"train_loss": -12.393397331237793, "global_step": 511304, "epoch": 3043} {"train_loss": -12.806652069091797, "global_step": 511305, "epoch": 3043} {"train_loss": -12.826802253723145, "global_step": 511306, "epoch": 3043} {"train_loss": -12.842219352722168, "global_step": 511307, "epoch": 3043} {"train_loss": -12.922680854797363, "global_step": 511308, "epoch": 3043} {"train_loss": -12.925363540649414, "global_step": 511309, "epoch": 3043} {"train_loss": -13.051054000854492, "global_step": 511310, "epoch": 3043} {"train_loss": -12.35194206237793, "global_step": 511311, "epoch": 3043} {"train_loss": -12.527517318725586, "global_step": 511312, "epoch": 3043} {"train_loss": -12.225643157958984, "global_step": 511313, "epoch": 3043} {"train_loss": -12.451883316040039, "global_step": 511314, "epoch": 3043} {"train_loss": -11.81432819366455, "global_step": 511315, "epoch": 3043} {"train_loss": -12.528039932250977, "global_step": 511316, "epoch": 3043} {"train_loss": -12.825647354125977, "global_step": 511317, "epoch": 3043} {"train_loss": -12.109420776367188, "global_step": 511318, "epoch": 3043} {"train_loss": -11.400123596191406, "global_step": 511319, "epoch": 3043} {"train_loss": -11.502799034118652, "global_step": 511320, "epoch": 3043} {"train_loss": -11.501676559448242, "global_step": 511321, "epoch": 3043} {"train_loss": -10.739986419677734, "global_step": 511322, "epoch": 3043} {"train_loss": -12.102386474609375, "global_step": 511323, "epoch": 3043} {"train_loss": -12.054295539855957, "global_step": 511324, "epoch": 3043} {"train_loss": -11.756422996520996, "global_step": 511325, "epoch": 3043} {"train_loss": -12.079544067382812, "global_step": 511326, "epoch": 3043} {"train_loss": -12.09788703918457, "global_step": 511327, "epoch": 3043} {"train_loss": -11.191844940185547, "global_step": 511328, "epoch": 3043} {"train_loss": -10.821269035339355, "global_step": 511329, "epoch": 3043} {"train_loss": -11.957469940185547, "global_step": 511330, "epoch": 3043} {"train_loss": -11.897026062011719, "global_step": 511331, "epoch": 3043} {"train_loss": -11.420642852783203, "global_step": 511332, "epoch": 3043} {"train_loss": -12.339008331298828, "global_step": 511333, "epoch": 3043} {"train_loss": -11.7529296875, "global_step": 511334, "epoch": 3043} {"train_loss": -11.818021774291992, "global_step": 511335, "epoch": 3043} {"train_loss": -10.956218719482422, "global_step": 511336, "epoch": 3043} {"train_loss": -12.43161392211914, "global_step": 511337, "epoch": 3043} {"train_loss": -11.529194831848145, "global_step": 511338, "epoch": 3043} {"train_loss": -11.940731048583984, "global_step": 511339, "epoch": 3043} {"train_loss": -11.889266967773438, "global_step": 511340, "epoch": 3043} {"train_loss": -11.939661026000977, "global_step": 511341, "epoch": 3043} {"train_loss": -11.636469841003418, "global_step": 511342, "epoch": 3043} {"train_loss": -11.914045333862305, "global_step": 511343, "epoch": 3043} {"train_loss": -12.077302932739258, "global_step": 511344, "epoch": 3043} {"train_loss": -11.457789421081543, "global_step": 511345, "epoch": 3043} {"train_loss": -12.22683048248291, "global_step": 511346, "epoch": 3043} {"train_loss": -12.176942825317383, "global_step": 511347, "epoch": 3043} {"train_loss": -11.797507286071777, "global_step": 511348, "epoch": 3043} {"train_loss": -11.8287935256958, "global_step": 511349, "epoch": 3043} {"train_loss": -11.396438598632812, "global_step": 511350, "epoch": 3043} {"train_loss": -12.14249038696289, "global_step": 511351, "epoch": 3043} {"train_loss": -11.509963989257812, "global_step": 511352, "epoch": 3043} {"train_loss": -11.638885498046875, "global_step": 511353, "epoch": 3043} {"train_loss": -12.130919456481934, "global_step": 511354, "epoch": 3043} {"train_loss": -12.471202850341797, "global_step": 511355, "epoch": 3043} {"train_loss": -11.669273376464844, "global_step": 511356, "epoch": 3043} {"train_loss": -12.550016403198242, "global_step": 511357, "epoch": 3043} {"train_loss": -11.865838050842285, "global_step": 511358, "epoch": 3043} {"train_loss": -11.990875244140625, "global_step": 511359, "epoch": 3043} {"train_loss": -11.990507125854492, "global_step": 511360, "epoch": 3043} {"train_loss": -10.911274909973145, "global_step": 511361, "epoch": 3043} {"train_loss": -11.764580726623535, "global_step": 511362, "epoch": 3043} {"train_loss": -11.8255615234375, "global_step": 511363, "epoch": 3043} {"train_loss": -11.499561309814453, "global_step": 511364, "epoch": 3043} {"train_loss": -11.766584396362305, "global_step": 511365, "epoch": 3043} {"train_loss": -11.985258102416992, "global_step": 511366, "epoch": 3043} {"train_loss": -12.075284004211426, "global_step": 511367, "epoch": 3043} {"train_loss": -11.858087539672852, "global_step": 511368, "epoch": 3043} {"train_loss": -12.520554542541504, "global_step": 511369, "epoch": 3043} {"train_loss": -11.386363983154297, "global_step": 511370, "epoch": 3043} {"train_loss": -11.951292991638184, "global_step": 511371, "epoch": 3043} {"train_loss": -12.038954734802246, "global_step": 511372, "epoch": 3043} {"train_loss": -11.572747230529785, "global_step": 511373, "epoch": 3043} {"train_loss": -12.209476470947266, "global_step": 511374, "epoch": 3043} {"train_loss": -12.04359245300293, "global_step": 511375, "epoch": 3043} {"train_loss": -12.248527526855469, "global_step": 511376, "epoch": 3043} {"train_loss": -12.5821533203125, "global_step": 511377, "epoch": 3043} {"train_loss": -12.646261215209961, "global_step": 511378, "epoch": 3043} {"train_loss": -12.653300285339355, "global_step": 511379, "epoch": 3043} {"train_loss": -12.367850303649902, "global_step": 511380, "epoch": 3043} {"train_loss": -12.716651916503906, "global_step": 511381, "epoch": 3043} {"train_loss": -12.205012321472168, "global_step": 511382, "epoch": 3043} {"train_loss": -12.750831604003906, "global_step": 511383, "epoch": 3043} {"train_loss": -12.40347671508789, "global_step": 511384, "epoch": 3043} {"train_loss": -13.023706436157227, "global_step": 511385, "epoch": 3043} {"train_loss": -12.276433944702148, "global_step": 511386, "epoch": 3043} {"train_loss": -12.521465301513672, "global_step": 511387, "epoch": 3043} {"train_loss": -12.57374382019043, "global_step": 511388, "epoch": 3043} {"train_loss": -12.627405166625977, "global_step": 511389, "epoch": 3043} {"train_loss": -12.45935344696045, "global_step": 511390, "epoch": 3043} {"train_loss": -12.365431138447352, "global_step": 511391, "epoch": 3043, "val_loss": 320373.53125} {"train_loss": -12.854643821716309, "global_step": 511392, "epoch": 3044} {"train_loss": -12.340360641479492, "global_step": 511393, "epoch": 3044} {"train_loss": -12.767335891723633, "global_step": 511394, "epoch": 3044} {"train_loss": -12.241459846496582, "global_step": 511395, "epoch": 3044} {"train_loss": -12.623745918273926, "global_step": 511396, "epoch": 3044} {"train_loss": -12.280867576599121, "global_step": 511397, "epoch": 3044} {"train_loss": -12.619803428649902, "global_step": 511398, "epoch": 3044} {"train_loss": -12.357929229736328, "global_step": 511399, "epoch": 3044} {"train_loss": -12.732538223266602, "global_step": 511400, "epoch": 3044} {"train_loss": -12.772825241088867, "global_step": 511401, "epoch": 3044} {"train_loss": -12.790655136108398, "global_step": 511402, "epoch": 3044} {"train_loss": -12.62907600402832, "global_step": 511403, "epoch": 3044} {"train_loss": -12.847616195678711, "global_step": 511404, "epoch": 3044} {"train_loss": -12.911667823791504, "global_step": 511405, "epoch": 3044} {"train_loss": -12.80626106262207, "global_step": 511406, "epoch": 3044} {"train_loss": -12.719316482543945, "global_step": 511407, "epoch": 3044} {"train_loss": -12.472319602966309, "global_step": 511408, "epoch": 3044} {"train_loss": -12.603973388671875, "global_step": 511409, "epoch": 3044} {"train_loss": -12.766629219055176, "global_step": 511410, "epoch": 3044} {"train_loss": -13.043092727661133, "global_step": 511411, "epoch": 3044} {"train_loss": -12.763167381286621, "global_step": 511412, "epoch": 3044} {"train_loss": -12.613592147827148, "global_step": 511413, "epoch": 3044} {"train_loss": -12.481861114501953, "global_step": 511414, "epoch": 3044} {"train_loss": -12.841541290283203, "global_step": 511415, "epoch": 3044} {"train_loss": -12.749435424804688, "global_step": 511416, "epoch": 3044} {"train_loss": -12.797279357910156, "global_step": 511417, "epoch": 3044} {"train_loss": -12.752634048461914, "global_step": 511418, "epoch": 3044} {"train_loss": -12.501559257507324, "global_step": 511419, "epoch": 3044} {"train_loss": -12.959175109863281, "global_step": 511420, "epoch": 3044} {"train_loss": -12.701786041259766, "global_step": 511421, "epoch": 3044} {"train_loss": -12.551348686218262, "global_step": 511422, "epoch": 3044} {"train_loss": -12.905611038208008, "global_step": 511423, "epoch": 3044} {"train_loss": -12.659344673156738, "global_step": 511424, "epoch": 3044} {"train_loss": -12.512678146362305, "global_step": 511425, "epoch": 3044} {"train_loss": -12.629983901977539, "global_step": 511426, "epoch": 3044} {"train_loss": -12.453104019165039, "global_step": 511427, "epoch": 3044} {"train_loss": -11.802074432373047, "global_step": 511428, "epoch": 3044} {"train_loss": -12.610151290893555, "global_step": 511429, "epoch": 3044} {"train_loss": -11.322301864624023, "global_step": 511430, "epoch": 3044} {"train_loss": -10.832372665405273, "global_step": 511431, "epoch": 3044} {"train_loss": -11.971381187438965, "global_step": 511432, "epoch": 3044} {"train_loss": -10.301046371459961, "global_step": 511433, "epoch": 3044} {"train_loss": -12.197023391723633, "global_step": 511434, "epoch": 3044} {"train_loss": -9.960234642028809, "global_step": 511435, "epoch": 3044} {"train_loss": -10.512773513793945, "global_step": 511436, "epoch": 3044} {"train_loss": -11.708906173706055, "global_step": 511437, "epoch": 3044} {"train_loss": -10.035619735717773, "global_step": 511438, "epoch": 3044} {"train_loss": -9.924583435058594, "global_step": 511439, "epoch": 3044} {"train_loss": -10.201131820678711, "global_step": 511440, "epoch": 3044} {"train_loss": -11.08415412902832, "global_step": 511441, "epoch": 3044} {"train_loss": -11.244080543518066, "global_step": 511442, "epoch": 3044} {"train_loss": -10.949041366577148, "global_step": 511443, "epoch": 3044} {"train_loss": -10.761362075805664, "global_step": 511444, "epoch": 3044} {"train_loss": -11.034948348999023, "global_step": 511445, "epoch": 3044} {"train_loss": -12.192777633666992, "global_step": 511446, "epoch": 3044} {"train_loss": -11.827422142028809, "global_step": 511447, "epoch": 3044} {"train_loss": -12.194786071777344, "global_step": 511448, "epoch": 3044} {"train_loss": -11.527823448181152, "global_step": 511449, "epoch": 3044} {"train_loss": -12.25927734375, "global_step": 511450, "epoch": 3044} {"train_loss": -12.074762344360352, "global_step": 511451, "epoch": 3044} {"train_loss": -12.102577209472656, "global_step": 511452, "epoch": 3044} {"train_loss": -11.90915584564209, "global_step": 511453, "epoch": 3044} {"train_loss": -12.011606216430664, "global_step": 511454, "epoch": 3044} {"train_loss": -12.561689376831055, "global_step": 511455, "epoch": 3044} {"train_loss": -12.448328018188477, "global_step": 511456, "epoch": 3044} {"train_loss": -12.437803268432617, "global_step": 511457, "epoch": 3044} {"train_loss": -12.34757137298584, "global_step": 511458, "epoch": 3044} {"train_loss": -12.142162322998047, "global_step": 511459, "epoch": 3044} {"train_loss": -12.8908109664917, "global_step": 511460, "epoch": 3044} {"train_loss": -12.764293670654297, "global_step": 511461, "epoch": 3044} {"train_loss": -12.38334846496582, "global_step": 511462, "epoch": 3044} {"train_loss": -12.345219612121582, "global_step": 511463, "epoch": 3044} {"train_loss": -12.021833419799805, "global_step": 511464, "epoch": 3044} {"train_loss": -12.654898643493652, "global_step": 511465, "epoch": 3044} {"train_loss": -12.219324111938477, "global_step": 511466, "epoch": 3044} {"train_loss": -12.472216606140137, "global_step": 511467, "epoch": 3044} {"train_loss": -12.392500877380371, "global_step": 511468, "epoch": 3044} {"train_loss": -12.494729042053223, "global_step": 511469, "epoch": 3044} {"train_loss": -12.379779815673828, "global_step": 511470, "epoch": 3044} {"train_loss": -12.453337669372559, "global_step": 511471, "epoch": 3044} {"train_loss": -12.367237091064453, "global_step": 511472, "epoch": 3044} {"train_loss": -12.588603973388672, "global_step": 511473, "epoch": 3044} {"train_loss": -12.59113597869873, "global_step": 511474, "epoch": 3044} {"train_loss": -12.64221477508545, "global_step": 511475, "epoch": 3044} {"train_loss": -12.250885963439941, "global_step": 511476, "epoch": 3044} {"train_loss": -12.50456428527832, "global_step": 511477, "epoch": 3044} {"train_loss": -12.760583877563477, "global_step": 511478, "epoch": 3044} {"train_loss": -12.674932479858398, "global_step": 511479, "epoch": 3044} {"train_loss": -12.693709373474121, "global_step": 511480, "epoch": 3044} {"train_loss": -12.551132202148438, "global_step": 511481, "epoch": 3044} {"train_loss": -12.959733009338379, "global_step": 511482, "epoch": 3044} {"train_loss": -12.826448440551758, "global_step": 511483, "epoch": 3044} {"train_loss": -12.981523513793945, "global_step": 511484, "epoch": 3044} {"train_loss": -12.859892845153809, "global_step": 511485, "epoch": 3044} {"train_loss": -12.614347457885742, "global_step": 511486, "epoch": 3044} {"train_loss": -12.796075820922852, "global_step": 511487, "epoch": 3044} {"train_loss": -12.94182014465332, "global_step": 511488, "epoch": 3044} {"train_loss": -12.831520080566406, "global_step": 511489, "epoch": 3044} {"train_loss": -13.040924072265625, "global_step": 511490, "epoch": 3044} {"train_loss": -12.997564315795898, "global_step": 511491, "epoch": 3044} {"train_loss": -13.040964126586914, "global_step": 511492, "epoch": 3044} {"train_loss": -12.839950561523438, "global_step": 511493, "epoch": 3044} {"train_loss": -12.77483081817627, "global_step": 511494, "epoch": 3044} {"train_loss": -12.925384521484375, "global_step": 511495, "epoch": 3044} {"train_loss": -12.775823593139648, "global_step": 511496, "epoch": 3044} {"train_loss": -12.505144119262695, "global_step": 511497, "epoch": 3044} {"train_loss": -12.893376350402832, "global_step": 511498, "epoch": 3044} {"train_loss": -12.725870132446289, "global_step": 511499, "epoch": 3044} {"train_loss": -12.525965690612793, "global_step": 511500, "epoch": 3044} {"train_loss": -12.892772674560547, "global_step": 511501, "epoch": 3044} {"train_loss": -12.37682056427002, "global_step": 511502, "epoch": 3044} {"train_loss": -12.878082275390625, "global_step": 511503, "epoch": 3044} {"train_loss": -12.79478645324707, "global_step": 511504, "epoch": 3044} {"train_loss": -12.607772827148438, "global_step": 511505, "epoch": 3044} {"train_loss": -12.818815231323242, "global_step": 511506, "epoch": 3044} {"train_loss": -12.973270416259766, "global_step": 511507, "epoch": 3044} {"train_loss": -11.7575101852417, "global_step": 511508, "epoch": 3044} {"train_loss": -12.198675155639648, "global_step": 511509, "epoch": 3044} {"train_loss": -12.872995376586914, "global_step": 511510, "epoch": 3044} {"train_loss": -12.596460342407227, "global_step": 511511, "epoch": 3044} {"train_loss": -11.980775833129883, "global_step": 511512, "epoch": 3044} {"train_loss": -12.906946182250977, "global_step": 511513, "epoch": 3044} {"train_loss": -12.55388069152832, "global_step": 511514, "epoch": 3044} {"train_loss": -12.548845291137695, "global_step": 511515, "epoch": 3044} {"train_loss": -12.587002754211426, "global_step": 511516, "epoch": 3044} {"train_loss": -12.594646453857422, "global_step": 511517, "epoch": 3044} {"train_loss": -12.228094100952148, "global_step": 511518, "epoch": 3044} {"train_loss": -12.676774978637695, "global_step": 511519, "epoch": 3044} {"train_loss": -12.605290412902832, "global_step": 511520, "epoch": 3044} {"train_loss": -12.101263999938965, "global_step": 511521, "epoch": 3044} {"train_loss": -11.940242767333984, "global_step": 511522, "epoch": 3044} {"train_loss": -12.648433685302734, "global_step": 511523, "epoch": 3044} {"train_loss": -12.137168884277344, "global_step": 511524, "epoch": 3044} {"train_loss": -12.16250228881836, "global_step": 511525, "epoch": 3044} {"train_loss": -11.803585052490234, "global_step": 511526, "epoch": 3044} {"train_loss": -12.248153686523438, "global_step": 511527, "epoch": 3044} {"train_loss": -12.561870574951172, "global_step": 511528, "epoch": 3044} {"train_loss": -11.936220169067383, "global_step": 511529, "epoch": 3044} {"train_loss": -12.421192169189453, "global_step": 511530, "epoch": 3044} {"train_loss": -12.357673645019531, "global_step": 511531, "epoch": 3044} {"train_loss": -11.977602005004883, "global_step": 511532, "epoch": 3044} {"train_loss": -12.433128356933594, "global_step": 511533, "epoch": 3044} {"train_loss": -12.411042213439941, "global_step": 511534, "epoch": 3044} {"train_loss": -12.598777770996094, "global_step": 511535, "epoch": 3044} {"train_loss": -12.576374053955078, "global_step": 511536, "epoch": 3044} {"train_loss": -12.220952987670898, "global_step": 511537, "epoch": 3044} {"train_loss": -12.94658374786377, "global_step": 511538, "epoch": 3044} {"train_loss": -12.573076248168945, "global_step": 511539, "epoch": 3044} {"train_loss": -12.697954177856445, "global_step": 511540, "epoch": 3044} {"train_loss": -12.656388282775879, "global_step": 511541, "epoch": 3044} {"train_loss": -12.5244140625, "global_step": 511542, "epoch": 3044} {"train_loss": -12.781045913696289, "global_step": 511543, "epoch": 3044} {"train_loss": -12.429863929748535, "global_step": 511544, "epoch": 3044} {"train_loss": -12.690084457397461, "global_step": 511545, "epoch": 3044} {"train_loss": -12.701639175415039, "global_step": 511546, "epoch": 3044} {"train_loss": -12.113851547241211, "global_step": 511547, "epoch": 3044} {"train_loss": -12.453469276428223, "global_step": 511548, "epoch": 3044} {"train_loss": -12.373292922973633, "global_step": 511549, "epoch": 3044} {"train_loss": -12.47382926940918, "global_step": 511550, "epoch": 3044} {"train_loss": -12.445953369140625, "global_step": 511551, "epoch": 3044} {"train_loss": -12.611356735229492, "global_step": 511552, "epoch": 3044} {"train_loss": -11.915933609008789, "global_step": 511553, "epoch": 3044} {"train_loss": -11.97443962097168, "global_step": 511554, "epoch": 3044} {"train_loss": -12.459514617919922, "global_step": 511555, "epoch": 3044} {"train_loss": -11.45401668548584, "global_step": 511556, "epoch": 3044} {"train_loss": -12.5800142288208, "global_step": 511557, "epoch": 3044} {"train_loss": -11.001518249511719, "global_step": 511558, "epoch": 3044} {"train_loss": -12.350236330713544, "global_step": 511559, "epoch": 3044, "val_loss": 321978.25} {"train_loss": -11.820938110351562, "global_step": 511560, "epoch": 3045} {"train_loss": -12.37926197052002, "global_step": 511561, "epoch": 3045} {"train_loss": -11.363471984863281, "global_step": 511562, "epoch": 3045} {"train_loss": -12.539012908935547, "global_step": 511563, "epoch": 3045} {"train_loss": -12.357452392578125, "global_step": 511564, "epoch": 3045} {"train_loss": -12.102778434753418, "global_step": 511565, "epoch": 3045} {"train_loss": -12.295295715332031, "global_step": 511566, "epoch": 3045} {"train_loss": -11.93097972869873, "global_step": 511567, "epoch": 3045} {"train_loss": -12.383064270019531, "global_step": 511568, "epoch": 3045} {"train_loss": -11.873772621154785, "global_step": 511569, "epoch": 3045} {"train_loss": -11.693412780761719, "global_step": 511570, "epoch": 3045} {"train_loss": -11.757984161376953, "global_step": 511571, "epoch": 3045} {"train_loss": -12.07748794555664, "global_step": 511572, "epoch": 3045} {"train_loss": -11.27241325378418, "global_step": 511573, "epoch": 3045} {"train_loss": -12.421833992004395, "global_step": 511574, "epoch": 3045} {"train_loss": -11.978710174560547, "global_step": 511575, "epoch": 3045} {"train_loss": -11.6766357421875, "global_step": 511576, "epoch": 3045} {"train_loss": -12.431527137756348, "global_step": 511577, "epoch": 3045} {"train_loss": -12.16594123840332, "global_step": 511578, "epoch": 3045} {"train_loss": -12.170469284057617, "global_step": 511579, "epoch": 3045} {"train_loss": -11.77608585357666, "global_step": 511580, "epoch": 3045} {"train_loss": -12.306326866149902, "global_step": 511581, "epoch": 3045} {"train_loss": -11.639047622680664, "global_step": 511582, "epoch": 3045} {"train_loss": -12.282342910766602, "global_step": 511583, "epoch": 3045} {"train_loss": -11.73100757598877, "global_step": 511584, "epoch": 3045} {"train_loss": -12.485553741455078, "global_step": 511585, "epoch": 3045} {"train_loss": -11.922611236572266, "global_step": 511586, "epoch": 3045} {"train_loss": -12.709874153137207, "global_step": 511587, "epoch": 3045} {"train_loss": -12.114233016967773, "global_step": 511588, "epoch": 3045} {"train_loss": -12.637092590332031, "global_step": 511589, "epoch": 3045} {"train_loss": -12.53603458404541, "global_step": 511590, "epoch": 3045} {"train_loss": -12.8892822265625, "global_step": 511591, "epoch": 3045} {"train_loss": -12.748357772827148, "global_step": 511592, "epoch": 3045} {"train_loss": -12.658404350280762, "global_step": 511593, "epoch": 3045} {"train_loss": -12.38979721069336, "global_step": 511594, "epoch": 3045} {"train_loss": -12.76681900024414, "global_step": 511595, "epoch": 3045} {"train_loss": -12.6456298828125, "global_step": 511596, "epoch": 3045} {"train_loss": -12.64161491394043, "global_step": 511597, "epoch": 3045} {"train_loss": -12.726678848266602, "global_step": 511598, "epoch": 3045} {"train_loss": -12.669315338134766, "global_step": 511599, "epoch": 3045} {"train_loss": -12.609338760375977, "global_step": 511600, "epoch": 3045} {"train_loss": -12.88693618774414, "global_step": 511601, "epoch": 3045} {"train_loss": -12.680583953857422, "global_step": 511602, "epoch": 3045} {"train_loss": -12.850666046142578, "global_step": 511603, "epoch": 3045} {"train_loss": -12.72305679321289, "global_step": 511604, "epoch": 3045} {"train_loss": -12.810320854187012, "global_step": 511605, "epoch": 3045} {"train_loss": -12.678380966186523, "global_step": 511606, "epoch": 3045} {"train_loss": -12.843456268310547, "global_step": 511607, "epoch": 3045} {"train_loss": -13.077686309814453, "global_step": 511608, "epoch": 3045} {"train_loss": -13.043006896972656, "global_step": 511609, "epoch": 3045} {"train_loss": -12.75637435913086, "global_step": 511610, "epoch": 3045} {"train_loss": -12.162615776062012, "global_step": 511611, "epoch": 3045} {"train_loss": -13.043116569519043, "global_step": 511612, "epoch": 3045} {"train_loss": -12.38703727722168, "global_step": 511613, "epoch": 3045} {"train_loss": -12.692243576049805, "global_step": 511614, "epoch": 3045} {"train_loss": -12.9043550491333, "global_step": 511615, "epoch": 3045} {"train_loss": -12.388002395629883, "global_step": 511616, "epoch": 3045} {"train_loss": -12.588495254516602, "global_step": 511617, "epoch": 3045} {"train_loss": -12.588160514831543, "global_step": 511618, "epoch": 3045} {"train_loss": -12.428939819335938, "global_step": 511619, "epoch": 3045} {"train_loss": -13.049297332763672, "global_step": 511620, "epoch": 3045} {"train_loss": -12.098767280578613, "global_step": 511621, "epoch": 3045} {"train_loss": -12.486578941345215, "global_step": 511622, "epoch": 3045} {"train_loss": -12.687016487121582, "global_step": 511623, "epoch": 3045} {"train_loss": -12.793630599975586, "global_step": 511624, "epoch": 3045} {"train_loss": -12.740428924560547, "global_step": 511625, "epoch": 3045} {"train_loss": -12.628951072692871, "global_step": 511626, "epoch": 3045} {"train_loss": -12.770574569702148, "global_step": 511627, "epoch": 3045} {"train_loss": -12.575150489807129, "global_step": 511628, "epoch": 3045} {"train_loss": -12.408052444458008, "global_step": 511629, "epoch": 3045} {"train_loss": -12.650257110595703, "global_step": 511630, "epoch": 3045} {"train_loss": -12.242240905761719, "global_step": 511631, "epoch": 3045} {"train_loss": -12.752477645874023, "global_step": 511632, "epoch": 3045} {"train_loss": -12.674995422363281, "global_step": 511633, "epoch": 3045} {"train_loss": -13.00806999206543, "global_step": 511634, "epoch": 3045} {"train_loss": -12.481301307678223, "global_step": 511635, "epoch": 3045} {"train_loss": -12.765483856201172, "global_step": 511636, "epoch": 3045} {"train_loss": -12.768487930297852, "global_step": 511637, "epoch": 3045} {"train_loss": -12.832923889160156, "global_step": 511638, "epoch": 3045} {"train_loss": -12.90458869934082, "global_step": 511639, "epoch": 3045} {"train_loss": -12.932012557983398, "global_step": 511640, "epoch": 3045} {"train_loss": -12.865452766418457, "global_step": 511641, "epoch": 3045} {"train_loss": -12.964895248413086, "global_step": 511642, "epoch": 3045} {"train_loss": -12.91757869720459, "global_step": 511643, "epoch": 3045} {"train_loss": -12.684389114379883, "global_step": 511644, "epoch": 3045} {"train_loss": -12.350359916687012, "global_step": 511645, "epoch": 3045} {"train_loss": -12.72043228149414, "global_step": 511646, "epoch": 3045} {"train_loss": -12.646391868591309, "global_step": 511647, "epoch": 3045} {"train_loss": -12.644373893737793, "global_step": 511648, "epoch": 3045} {"train_loss": -12.08047103881836, "global_step": 511649, "epoch": 3045} {"train_loss": -12.694425582885742, "global_step": 511650, "epoch": 3045} {"train_loss": -12.206123352050781, "global_step": 511651, "epoch": 3045} {"train_loss": -12.079787254333496, "global_step": 511652, "epoch": 3045} {"train_loss": -12.562088966369629, "global_step": 511653, "epoch": 3045} {"train_loss": -12.529678344726562, "global_step": 511654, "epoch": 3045} {"train_loss": -12.434623718261719, "global_step": 511655, "epoch": 3045} {"train_loss": -12.695755004882812, "global_step": 511656, "epoch": 3045} {"train_loss": -12.662418365478516, "global_step": 511657, "epoch": 3045} {"train_loss": -12.79450798034668, "global_step": 511658, "epoch": 3045} {"train_loss": -12.4306640625, "global_step": 511659, "epoch": 3045} {"train_loss": -12.27639389038086, "global_step": 511660, "epoch": 3045} {"train_loss": -12.06706428527832, "global_step": 511661, "epoch": 3045} {"train_loss": -12.493916511535645, "global_step": 511662, "epoch": 3045} {"train_loss": -12.450984954833984, "global_step": 511663, "epoch": 3045} {"train_loss": -12.495359420776367, "global_step": 511664, "epoch": 3045} {"train_loss": -12.214305877685547, "global_step": 511665, "epoch": 3045} {"train_loss": -12.621861457824707, "global_step": 511666, "epoch": 3045} {"train_loss": -12.553570747375488, "global_step": 511667, "epoch": 3045} {"train_loss": -12.39603328704834, "global_step": 511668, "epoch": 3045} {"train_loss": -12.870460510253906, "global_step": 511669, "epoch": 3045} {"train_loss": -12.509184837341309, "global_step": 511670, "epoch": 3045} {"train_loss": -12.247515678405762, "global_step": 511671, "epoch": 3045} {"train_loss": -11.843120574951172, "global_step": 511672, "epoch": 3045} {"train_loss": -12.561441421508789, "global_step": 511673, "epoch": 3045} {"train_loss": -12.219923973083496, "global_step": 511674, "epoch": 3045} {"train_loss": -12.254735946655273, "global_step": 511675, "epoch": 3045} {"train_loss": -12.053376197814941, "global_step": 511676, "epoch": 3045} {"train_loss": -12.058464050292969, "global_step": 511677, "epoch": 3045} {"train_loss": -11.460174560546875, "global_step": 511678, "epoch": 3045} {"train_loss": -11.970857620239258, "global_step": 511679, "epoch": 3045} {"train_loss": -10.415650367736816, "global_step": 511680, "epoch": 3045} {"train_loss": -11.005826950073242, "global_step": 511681, "epoch": 3045} {"train_loss": -10.944807052612305, "global_step": 511682, "epoch": 3045} {"train_loss": -11.534814834594727, "global_step": 511683, "epoch": 3045} {"train_loss": -11.159805297851562, "global_step": 511684, "epoch": 3045} {"train_loss": -11.682186126708984, "global_step": 511685, "epoch": 3045} {"train_loss": -11.333181381225586, "global_step": 511686, "epoch": 3045} {"train_loss": -11.564298629760742, "global_step": 511687, "epoch": 3045} {"train_loss": -9.08576488494873, "global_step": 511688, "epoch": 3045} {"train_loss": -10.85003662109375, "global_step": 511689, "epoch": 3045} {"train_loss": -10.604642868041992, "global_step": 511690, "epoch": 3045} {"train_loss": -11.596035957336426, "global_step": 511691, "epoch": 3045} {"train_loss": -11.246976852416992, "global_step": 511692, "epoch": 3045} {"train_loss": -12.16328239440918, "global_step": 511693, "epoch": 3045} {"train_loss": -11.751830101013184, "global_step": 511694, "epoch": 3045} {"train_loss": -12.335909843444824, "global_step": 511695, "epoch": 3045} {"train_loss": -11.817399978637695, "global_step": 511696, "epoch": 3045} {"train_loss": -12.104290008544922, "global_step": 511697, "epoch": 3045} {"train_loss": -11.20448112487793, "global_step": 511698, "epoch": 3045} {"train_loss": -11.564552307128906, "global_step": 511699, "epoch": 3045} {"train_loss": -11.778998374938965, "global_step": 511700, "epoch": 3045} {"train_loss": -11.230720520019531, "global_step": 511701, "epoch": 3045} {"train_loss": -11.79507827758789, "global_step": 511702, "epoch": 3045} {"train_loss": -10.66384220123291, "global_step": 511703, "epoch": 3045} {"train_loss": -11.306127548217773, "global_step": 511704, "epoch": 3045} {"train_loss": -12.05233383178711, "global_step": 511705, "epoch": 3045} {"train_loss": -11.370409965515137, "global_step": 511706, "epoch": 3045} {"train_loss": -12.240819931030273, "global_step": 511707, "epoch": 3045} {"train_loss": -11.646743774414062, "global_step": 511708, "epoch": 3045} {"train_loss": -12.081897735595703, "global_step": 511709, "epoch": 3045} {"train_loss": -11.888849258422852, "global_step": 511710, "epoch": 3045} {"train_loss": -11.980240821838379, "global_step": 511711, "epoch": 3045} {"train_loss": -11.860823631286621, "global_step": 511712, "epoch": 3045} {"train_loss": -12.13316535949707, "global_step": 511713, "epoch": 3045} {"train_loss": -12.004081726074219, "global_step": 511714, "epoch": 3045} {"train_loss": -12.042201042175293, "global_step": 511715, "epoch": 3045} {"train_loss": -12.185375213623047, "global_step": 511716, "epoch": 3045} {"train_loss": -12.426044464111328, "global_step": 511717, "epoch": 3045} {"train_loss": -11.740434646606445, "global_step": 511718, "epoch": 3045} {"train_loss": -12.42466926574707, "global_step": 511719, "epoch": 3045} {"train_loss": -11.89917278289795, "global_step": 511720, "epoch": 3045} {"train_loss": -12.162973403930664, "global_step": 511721, "epoch": 3045} {"train_loss": -11.449106216430664, "global_step": 511722, "epoch": 3045} {"train_loss": -11.672259330749512, "global_step": 511723, "epoch": 3045} {"train_loss": -12.24365234375, "global_step": 511724, "epoch": 3045} {"train_loss": -11.852005004882812, "global_step": 511725, "epoch": 3045} {"train_loss": -11.948945045471191, "global_step": 511726, "epoch": 3045} {"train_loss": -12.197310691788083, "global_step": 511727, "epoch": 3045, "val_loss": 320127.65625, "train_action_mse_error": 0.3751010000705719} {"train_loss": -11.901479721069336, "global_step": 511728, "epoch": 3046} {"train_loss": -10.350309371948242, "global_step": 511729, "epoch": 3046} {"train_loss": -11.426440238952637, "global_step": 511730, "epoch": 3046} {"train_loss": -11.073932647705078, "global_step": 511731, "epoch": 3046} {"train_loss": -11.008399963378906, "global_step": 511732, "epoch": 3046} {"train_loss": -11.405900955200195, "global_step": 511733, "epoch": 3046} {"train_loss": -10.583992958068848, "global_step": 511734, "epoch": 3046} {"train_loss": -11.852972030639648, "global_step": 511735, "epoch": 3046} {"train_loss": -11.088212966918945, "global_step": 511736, "epoch": 3046} {"train_loss": -12.561192512512207, "global_step": 511737, "epoch": 3046} {"train_loss": -11.304123878479004, "global_step": 511738, "epoch": 3046} {"train_loss": -12.54925537109375, "global_step": 511739, "epoch": 3046} {"train_loss": -11.592741012573242, "global_step": 511740, "epoch": 3046} {"train_loss": -12.44952392578125, "global_step": 511741, "epoch": 3046} {"train_loss": -11.964741706848145, "global_step": 511742, "epoch": 3046} {"train_loss": -11.887752532958984, "global_step": 511743, "epoch": 3046} {"train_loss": -11.982179641723633, "global_step": 511744, "epoch": 3046} {"train_loss": -12.159561157226562, "global_step": 511745, "epoch": 3046} {"train_loss": -12.236170768737793, "global_step": 511746, "epoch": 3046} {"train_loss": -12.320826530456543, "global_step": 511747, "epoch": 3046} {"train_loss": -12.205547332763672, "global_step": 511748, "epoch": 3046} {"train_loss": -12.56370735168457, "global_step": 511749, "epoch": 3046} {"train_loss": -12.393860816955566, "global_step": 511750, "epoch": 3046} {"train_loss": -12.38798713684082, "global_step": 511751, "epoch": 3046} {"train_loss": -12.488655090332031, "global_step": 511752, "epoch": 3046} {"train_loss": -12.336992263793945, "global_step": 511753, "epoch": 3046} {"train_loss": -12.524148941040039, "global_step": 511754, "epoch": 3046} {"train_loss": -12.503292083740234, "global_step": 511755, "epoch": 3046} {"train_loss": -12.6503267288208, "global_step": 511756, "epoch": 3046} {"train_loss": -12.552345275878906, "global_step": 511757, "epoch": 3046} {"train_loss": -12.43558120727539, "global_step": 511758, "epoch": 3046} {"train_loss": -12.715372085571289, "global_step": 511759, "epoch": 3046} {"train_loss": -12.66033935546875, "global_step": 511760, "epoch": 3046} {"train_loss": -12.694063186645508, "global_step": 511761, "epoch": 3046} {"train_loss": -12.717954635620117, "global_step": 511762, "epoch": 3046} {"train_loss": -12.615309715270996, "global_step": 511763, "epoch": 3046} {"train_loss": -12.779611587524414, "global_step": 511764, "epoch": 3046} {"train_loss": -12.605535507202148, "global_step": 511765, "epoch": 3046} {"train_loss": -12.500353813171387, "global_step": 511766, "epoch": 3046} {"train_loss": -12.721590042114258, "global_step": 511767, "epoch": 3046} {"train_loss": -12.589705467224121, "global_step": 511768, "epoch": 3046} {"train_loss": -12.390822410583496, "global_step": 511769, "epoch": 3046} {"train_loss": -12.67692756652832, "global_step": 511770, "epoch": 3046} {"train_loss": -12.594776153564453, "global_step": 511771, "epoch": 3046} {"train_loss": -12.230764389038086, "global_step": 511772, "epoch": 3046} {"train_loss": -12.815467834472656, "global_step": 511773, "epoch": 3046} {"train_loss": -12.62568473815918, "global_step": 511774, "epoch": 3046} {"train_loss": -12.594128608703613, "global_step": 511775, "epoch": 3046} {"train_loss": -12.883657455444336, "global_step": 511776, "epoch": 3046} {"train_loss": -12.675374984741211, "global_step": 511777, "epoch": 3046} {"train_loss": -12.657007217407227, "global_step": 511778, "epoch": 3046} {"train_loss": -12.68065357208252, "global_step": 511779, "epoch": 3046} {"train_loss": -12.699650764465332, "global_step": 511780, "epoch": 3046} {"train_loss": -12.579121589660645, "global_step": 511781, "epoch": 3046} {"train_loss": -12.38546371459961, "global_step": 511782, "epoch": 3046} {"train_loss": -12.600500106811523, "global_step": 511783, "epoch": 3046} {"train_loss": -12.532739639282227, "global_step": 511784, "epoch": 3046} {"train_loss": -12.416669845581055, "global_step": 511785, "epoch": 3046} {"train_loss": -12.697240829467773, "global_step": 511786, "epoch": 3046} {"train_loss": -12.657684326171875, "global_step": 511787, "epoch": 3046} {"train_loss": -12.974804878234863, "global_step": 511788, "epoch": 3046} {"train_loss": -12.838902473449707, "global_step": 511789, "epoch": 3046} {"train_loss": -12.711143493652344, "global_step": 511790, "epoch": 3046} {"train_loss": -12.68385124206543, "global_step": 511791, "epoch": 3046} {"train_loss": -12.870308876037598, "global_step": 511792, "epoch": 3046} {"train_loss": -12.522913932800293, "global_step": 511793, "epoch": 3046} {"train_loss": -12.800819396972656, "global_step": 511794, "epoch": 3046} {"train_loss": -12.783430099487305, "global_step": 511795, "epoch": 3046} {"train_loss": -12.618974685668945, "global_step": 511796, "epoch": 3046} {"train_loss": -12.599847793579102, "global_step": 511797, "epoch": 3046} {"train_loss": -12.654733657836914, "global_step": 511798, "epoch": 3046} {"train_loss": -12.825384140014648, "global_step": 511799, "epoch": 3046} {"train_loss": -12.620840072631836, "global_step": 511800, "epoch": 3046} {"train_loss": -12.647438049316406, "global_step": 511801, "epoch": 3046} {"train_loss": -12.388206481933594, "global_step": 511802, "epoch": 3046} {"train_loss": -12.383153915405273, "global_step": 511803, "epoch": 3046} {"train_loss": -12.665396690368652, "global_step": 511804, "epoch": 3046} {"train_loss": -12.205667495727539, "global_step": 511805, "epoch": 3046} {"train_loss": -12.972078323364258, "global_step": 511806, "epoch": 3046} {"train_loss": -12.076498985290527, "global_step": 511807, "epoch": 3046} {"train_loss": -12.298051834106445, "global_step": 511808, "epoch": 3046} {"train_loss": -12.540565490722656, "global_step": 511809, "epoch": 3046} {"train_loss": -11.80189323425293, "global_step": 511810, "epoch": 3046} {"train_loss": -12.49443531036377, "global_step": 511811, "epoch": 3046} {"train_loss": -11.846674919128418, "global_step": 511812, "epoch": 3046} {"train_loss": -12.107772827148438, "global_step": 511813, "epoch": 3046} {"train_loss": -12.55992317199707, "global_step": 511814, "epoch": 3046} {"train_loss": -11.820412635803223, "global_step": 511815, "epoch": 3046} {"train_loss": -12.874624252319336, "global_step": 511816, "epoch": 3046} {"train_loss": -11.97030258178711, "global_step": 511817, "epoch": 3046} {"train_loss": -12.94869613647461, "global_step": 511818, "epoch": 3046} {"train_loss": -12.378579139709473, "global_step": 511819, "epoch": 3046} {"train_loss": -12.799842834472656, "global_step": 511820, "epoch": 3046} {"train_loss": -12.849590301513672, "global_step": 511821, "epoch": 3046} {"train_loss": -12.258140563964844, "global_step": 511822, "epoch": 3046} {"train_loss": -12.90330696105957, "global_step": 511823, "epoch": 3046} {"train_loss": -12.484928131103516, "global_step": 511824, "epoch": 3046} {"train_loss": -12.923843383789062, "global_step": 511825, "epoch": 3046} {"train_loss": -12.659966468811035, "global_step": 511826, "epoch": 3046} {"train_loss": -12.505160331726074, "global_step": 511827, "epoch": 3046} {"train_loss": -12.83822250366211, "global_step": 511828, "epoch": 3046} {"train_loss": -13.019865989685059, "global_step": 511829, "epoch": 3046} {"train_loss": -12.703153610229492, "global_step": 511830, "epoch": 3046} {"train_loss": -12.835073471069336, "global_step": 511831, "epoch": 3046} {"train_loss": -12.55990219116211, "global_step": 511832, "epoch": 3046} {"train_loss": -12.839609146118164, "global_step": 511833, "epoch": 3046} {"train_loss": -12.725164413452148, "global_step": 511834, "epoch": 3046} {"train_loss": -12.503379821777344, "global_step": 511835, "epoch": 3046} {"train_loss": -12.635139465332031, "global_step": 511836, "epoch": 3046} {"train_loss": -12.479635238647461, "global_step": 511837, "epoch": 3046} {"train_loss": -11.998476028442383, "global_step": 511838, "epoch": 3046} {"train_loss": -12.742378234863281, "global_step": 511839, "epoch": 3046} {"train_loss": -12.286052703857422, "global_step": 511840, "epoch": 3046} {"train_loss": -12.81232738494873, "global_step": 511841, "epoch": 3046} {"train_loss": -12.326521873474121, "global_step": 511842, "epoch": 3046} {"train_loss": -12.884002685546875, "global_step": 511843, "epoch": 3046} {"train_loss": -12.246835708618164, "global_step": 511844, "epoch": 3046} {"train_loss": -12.581231117248535, "global_step": 511845, "epoch": 3046} {"train_loss": -12.809477806091309, "global_step": 511846, "epoch": 3046} {"train_loss": -12.368467330932617, "global_step": 511847, "epoch": 3046} {"train_loss": -12.612271308898926, "global_step": 511848, "epoch": 3046} {"train_loss": -12.666740417480469, "global_step": 511849, "epoch": 3046} {"train_loss": -12.479450225830078, "global_step": 511850, "epoch": 3046} {"train_loss": -12.502156257629395, "global_step": 511851, "epoch": 3046} {"train_loss": -12.848379135131836, "global_step": 511852, "epoch": 3046} {"train_loss": -12.636693954467773, "global_step": 511853, "epoch": 3046} {"train_loss": -12.996627807617188, "global_step": 511854, "epoch": 3046} {"train_loss": -12.53618049621582, "global_step": 511855, "epoch": 3046} {"train_loss": -12.776589393615723, "global_step": 511856, "epoch": 3046} {"train_loss": -12.629316329956055, "global_step": 511857, "epoch": 3046} {"train_loss": -12.771614074707031, "global_step": 511858, "epoch": 3046} {"train_loss": -12.976909637451172, "global_step": 511859, "epoch": 3046} {"train_loss": -12.856651306152344, "global_step": 511860, "epoch": 3046} {"train_loss": -12.370209693908691, "global_step": 511861, "epoch": 3046} {"train_loss": -12.88698959350586, "global_step": 511862, "epoch": 3046} {"train_loss": -12.517963409423828, "global_step": 511863, "epoch": 3046} {"train_loss": -11.911094665527344, "global_step": 511864, "epoch": 3046} {"train_loss": -12.516387939453125, "global_step": 511865, "epoch": 3046} {"train_loss": -12.228302001953125, "global_step": 511866, "epoch": 3046} {"train_loss": -11.409984588623047, "global_step": 511867, "epoch": 3046} {"train_loss": -11.55246353149414, "global_step": 511868, "epoch": 3046} {"train_loss": -11.967533111572266, "global_step": 511869, "epoch": 3046} {"train_loss": -12.407514572143555, "global_step": 511870, "epoch": 3046} {"train_loss": -10.733013153076172, "global_step": 511871, "epoch": 3046} {"train_loss": -11.250652313232422, "global_step": 511872, "epoch": 3046} {"train_loss": -11.60827350616455, "global_step": 511873, "epoch": 3046} {"train_loss": -9.976167678833008, "global_step": 511874, "epoch": 3046} {"train_loss": -10.82949447631836, "global_step": 511875, "epoch": 3046} {"train_loss": -10.791725158691406, "global_step": 511876, "epoch": 3046} {"train_loss": -9.912858009338379, "global_step": 511877, "epoch": 3046} {"train_loss": -11.692032814025879, "global_step": 511878, "epoch": 3046} {"train_loss": -10.044328689575195, "global_step": 511879, "epoch": 3046} {"train_loss": -10.453537940979004, "global_step": 511880, "epoch": 3046} {"train_loss": -11.342283248901367, "global_step": 511881, "epoch": 3046} {"train_loss": -10.186625480651855, "global_step": 511882, "epoch": 3046} {"train_loss": -11.518913269042969, "global_step": 511883, "epoch": 3046} {"train_loss": -10.300322532653809, "global_step": 511884, "epoch": 3046} {"train_loss": -11.407703399658203, "global_step": 511885, "epoch": 3046} {"train_loss": -10.17763900756836, "global_step": 511886, "epoch": 3046} {"train_loss": -11.677066802978516, "global_step": 511887, "epoch": 3046} {"train_loss": -11.649776458740234, "global_step": 511888, "epoch": 3046} {"train_loss": -11.92607307434082, "global_step": 511889, "epoch": 3046} {"train_loss": -11.68083667755127, "global_step": 511890, "epoch": 3046} {"train_loss": -11.55447769165039, "global_step": 511891, "epoch": 3046} {"train_loss": -12.131296157836914, "global_step": 511892, "epoch": 3046} {"train_loss": -11.905080795288086, "global_step": 511893, "epoch": 3046} {"train_loss": -12.29964828491211, "global_step": 511894, "epoch": 3046} {"train_loss": -12.243231404395331, "global_step": 511895, "epoch": 3046, "val_loss": 321978.28125} {"train_loss": -11.685041427612305, "global_step": 511896, "epoch": 3047} {"train_loss": -11.118607521057129, "global_step": 511897, "epoch": 3047} {"train_loss": -11.159645080566406, "global_step": 511898, "epoch": 3047} {"train_loss": -11.523397445678711, "global_step": 511899, "epoch": 3047} {"train_loss": -11.074216842651367, "global_step": 511900, "epoch": 3047} {"train_loss": -11.735893249511719, "global_step": 511901, "epoch": 3047} {"train_loss": -11.206656455993652, "global_step": 511902, "epoch": 3047} {"train_loss": -11.011348724365234, "global_step": 511903, "epoch": 3047} {"train_loss": -11.388387680053711, "global_step": 511904, "epoch": 3047} {"train_loss": -11.902366638183594, "global_step": 511905, "epoch": 3047} {"train_loss": -11.086844444274902, "global_step": 511906, "epoch": 3047} {"train_loss": -12.044675827026367, "global_step": 511907, "epoch": 3047} {"train_loss": -11.016798973083496, "global_step": 511908, "epoch": 3047} {"train_loss": -12.10430908203125, "global_step": 511909, "epoch": 3047} {"train_loss": -11.366270065307617, "global_step": 511910, "epoch": 3047} {"train_loss": -11.894586563110352, "global_step": 511911, "epoch": 3047} {"train_loss": -10.636977195739746, "global_step": 511912, "epoch": 3047} {"train_loss": -11.80397891998291, "global_step": 511913, "epoch": 3047} {"train_loss": -10.33367919921875, "global_step": 511914, "epoch": 3047} {"train_loss": -10.354915618896484, "global_step": 511915, "epoch": 3047} {"train_loss": -11.754562377929688, "global_step": 511916, "epoch": 3047} {"train_loss": -10.922977447509766, "global_step": 511917, "epoch": 3047} {"train_loss": -11.053953170776367, "global_step": 511918, "epoch": 3047} {"train_loss": -10.722029685974121, "global_step": 511919, "epoch": 3047} {"train_loss": -11.79697036743164, "global_step": 511920, "epoch": 3047} {"train_loss": -10.853462219238281, "global_step": 511921, "epoch": 3047} {"train_loss": -10.732353210449219, "global_step": 511922, "epoch": 3047} {"train_loss": -10.860310554504395, "global_step": 511923, "epoch": 3047} {"train_loss": -11.608642578125, "global_step": 511924, "epoch": 3047} {"train_loss": -11.189937591552734, "global_step": 511925, "epoch": 3047} {"train_loss": -11.1376953125, "global_step": 511926, "epoch": 3047} {"train_loss": -11.83305549621582, "global_step": 511927, "epoch": 3047} {"train_loss": -10.937078475952148, "global_step": 511928, "epoch": 3047} {"train_loss": -11.708035469055176, "global_step": 511929, "epoch": 3047} {"train_loss": -12.216941833496094, "global_step": 511930, "epoch": 3047} {"train_loss": -10.921895980834961, "global_step": 511931, "epoch": 3047} {"train_loss": -12.146100997924805, "global_step": 511932, "epoch": 3047} {"train_loss": -11.871650695800781, "global_step": 511933, "epoch": 3047} {"train_loss": -11.616218566894531, "global_step": 511934, "epoch": 3047} {"train_loss": -12.02994441986084, "global_step": 511935, "epoch": 3047} {"train_loss": -11.87601089477539, "global_step": 511936, "epoch": 3047} {"train_loss": -11.744851112365723, "global_step": 511937, "epoch": 3047} {"train_loss": -12.357662200927734, "global_step": 511938, "epoch": 3047} {"train_loss": -12.248143196105957, "global_step": 511939, "epoch": 3047} {"train_loss": -12.438379287719727, "global_step": 511940, "epoch": 3047} {"train_loss": -12.368293762207031, "global_step": 511941, "epoch": 3047} {"train_loss": -12.515368461608887, "global_step": 511942, "epoch": 3047} {"train_loss": -12.551676750183105, "global_step": 511943, "epoch": 3047} {"train_loss": -12.466265678405762, "global_step": 511944, "epoch": 3047} {"train_loss": -12.616389274597168, "global_step": 511945, "epoch": 3047} {"train_loss": -12.470474243164062, "global_step": 511946, "epoch": 3047} {"train_loss": -12.395745277404785, "global_step": 511947, "epoch": 3047} {"train_loss": -12.662067413330078, "global_step": 511948, "epoch": 3047} {"train_loss": -12.517585754394531, "global_step": 511949, "epoch": 3047} {"train_loss": -12.597981452941895, "global_step": 511950, "epoch": 3047} {"train_loss": -12.401119232177734, "global_step": 511951, "epoch": 3047} {"train_loss": -12.738527297973633, "global_step": 511952, "epoch": 3047} {"train_loss": -12.663309097290039, "global_step": 511953, "epoch": 3047} {"train_loss": -12.407413482666016, "global_step": 511954, "epoch": 3047} {"train_loss": -12.74551010131836, "global_step": 511955, "epoch": 3047} {"train_loss": -12.494577407836914, "global_step": 511956, "epoch": 3047} {"train_loss": -12.744070053100586, "global_step": 511957, "epoch": 3047} {"train_loss": -12.631150245666504, "global_step": 511958, "epoch": 3047} {"train_loss": -12.80305290222168, "global_step": 511959, "epoch": 3047} {"train_loss": -12.73838996887207, "global_step": 511960, "epoch": 3047} {"train_loss": -12.915794372558594, "global_step": 511961, "epoch": 3047} {"train_loss": -12.805910110473633, "global_step": 511962, "epoch": 3047} {"train_loss": -12.906110763549805, "global_step": 511963, "epoch": 3047} {"train_loss": -12.907485961914062, "global_step": 511964, "epoch": 3047} {"train_loss": -12.827919960021973, "global_step": 511965, "epoch": 3047} {"train_loss": -12.767232894897461, "global_step": 511966, "epoch": 3047} {"train_loss": -12.748641967773438, "global_step": 511967, "epoch": 3047} {"train_loss": -12.694034576416016, "global_step": 511968, "epoch": 3047} {"train_loss": -12.83961296081543, "global_step": 511969, "epoch": 3047} {"train_loss": -12.669378280639648, "global_step": 511970, "epoch": 3047} {"train_loss": -12.759403228759766, "global_step": 511971, "epoch": 3047} {"train_loss": -12.819559097290039, "global_step": 511972, "epoch": 3047} {"train_loss": -12.744205474853516, "global_step": 511973, "epoch": 3047} {"train_loss": -12.68028736114502, "global_step": 511974, "epoch": 3047} {"train_loss": -12.726024627685547, "global_step": 511975, "epoch": 3047} {"train_loss": -12.77906608581543, "global_step": 511976, "epoch": 3047} {"train_loss": -12.930400848388672, "global_step": 511977, "epoch": 3047} {"train_loss": -12.751588821411133, "global_step": 511978, "epoch": 3047} {"train_loss": -12.790142059326172, "global_step": 511979, "epoch": 3047} {"train_loss": -12.726750373840332, "global_step": 511980, "epoch": 3047} {"train_loss": -13.041224479675293, "global_step": 511981, "epoch": 3047} {"train_loss": -12.721284866333008, "global_step": 511982, "epoch": 3047} {"train_loss": -12.836677551269531, "global_step": 511983, "epoch": 3047} {"train_loss": -12.867731094360352, "global_step": 511984, "epoch": 3047} {"train_loss": -12.900794982910156, "global_step": 511985, "epoch": 3047} {"train_loss": -12.86583137512207, "global_step": 511986, "epoch": 3047} {"train_loss": -12.87900447845459, "global_step": 511987, "epoch": 3047} {"train_loss": -13.149085998535156, "global_step": 511988, "epoch": 3047} {"train_loss": -12.822587966918945, "global_step": 511989, "epoch": 3047} {"train_loss": -13.238642692565918, "global_step": 511990, "epoch": 3047} {"train_loss": -12.715957641601562, "global_step": 511991, "epoch": 3047} {"train_loss": -12.983753204345703, "global_step": 511992, "epoch": 3047} {"train_loss": -12.773367881774902, "global_step": 511993, "epoch": 3047} {"train_loss": -13.036848068237305, "global_step": 511994, "epoch": 3047} {"train_loss": -13.03980827331543, "global_step": 511995, "epoch": 3047} {"train_loss": -12.967849731445312, "global_step": 511996, "epoch": 3047} {"train_loss": -13.034686088562012, "global_step": 511997, "epoch": 3047} {"train_loss": -13.174043655395508, "global_step": 511998, "epoch": 3047} {"train_loss": -12.785660743713379, "global_step": 511999, "epoch": 3047} {"train_loss": -12.99594497680664, "global_step": 512000, "epoch": 3047} {"train_loss": -13.182073593139648, "global_step": 512001, "epoch": 3047} {"train_loss": -13.066984176635742, "global_step": 512002, "epoch": 3047} {"train_loss": -12.967750549316406, "global_step": 512003, "epoch": 3047} {"train_loss": -13.141813278198242, "global_step": 512004, "epoch": 3047} {"train_loss": -12.996171951293945, "global_step": 512005, "epoch": 3047} {"train_loss": -13.068273544311523, "global_step": 512006, "epoch": 3047} {"train_loss": -13.145857810974121, "global_step": 512007, "epoch": 3047} {"train_loss": -13.012542724609375, "global_step": 512008, "epoch": 3047} {"train_loss": -13.109439849853516, "global_step": 512009, "epoch": 3047} {"train_loss": -13.106170654296875, "global_step": 512010, "epoch": 3047} {"train_loss": -12.738042831420898, "global_step": 512011, "epoch": 3047} {"train_loss": -12.85604476928711, "global_step": 512012, "epoch": 3047} {"train_loss": -12.847679138183594, "global_step": 512013, "epoch": 3047} {"train_loss": -13.019229888916016, "global_step": 512014, "epoch": 3047} {"train_loss": -12.982795715332031, "global_step": 512015, "epoch": 3047} {"train_loss": -13.09504222869873, "global_step": 512016, "epoch": 3047} {"train_loss": -13.012445449829102, "global_step": 512017, "epoch": 3047} {"train_loss": -12.78692626953125, "global_step": 512018, "epoch": 3047} {"train_loss": -13.122325897216797, "global_step": 512019, "epoch": 3047} {"train_loss": -12.809808731079102, "global_step": 512020, "epoch": 3047} {"train_loss": -12.921093940734863, "global_step": 512021, "epoch": 3047} {"train_loss": -12.850278854370117, "global_step": 512022, "epoch": 3047} {"train_loss": -12.692941665649414, "global_step": 512023, "epoch": 3047} {"train_loss": -12.587923049926758, "global_step": 512024, "epoch": 3047} {"train_loss": -12.838884353637695, "global_step": 512025, "epoch": 3047} {"train_loss": -12.400314331054688, "global_step": 512026, "epoch": 3047} {"train_loss": -12.63443374633789, "global_step": 512027, "epoch": 3047} {"train_loss": -12.39920711517334, "global_step": 512028, "epoch": 3047} {"train_loss": -12.274191856384277, "global_step": 512029, "epoch": 3047} {"train_loss": -12.74592113494873, "global_step": 512030, "epoch": 3047} {"train_loss": -12.244070053100586, "global_step": 512031, "epoch": 3047} {"train_loss": -11.939334869384766, "global_step": 512032, "epoch": 3047} {"train_loss": -12.567804336547852, "global_step": 512033, "epoch": 3047} {"train_loss": -12.433581352233887, "global_step": 512034, "epoch": 3047} {"train_loss": -12.440692901611328, "global_step": 512035, "epoch": 3047} {"train_loss": -12.590174674987793, "global_step": 512036, "epoch": 3047} {"train_loss": -12.923629760742188, "global_step": 512037, "epoch": 3047} {"train_loss": -12.143674850463867, "global_step": 512038, "epoch": 3047} {"train_loss": -12.086014747619629, "global_step": 512039, "epoch": 3047} {"train_loss": -12.92959213256836, "global_step": 512040, "epoch": 3047} {"train_loss": -11.86655044555664, "global_step": 512041, "epoch": 3047} {"train_loss": -11.848616600036621, "global_step": 512042, "epoch": 3047} {"train_loss": -12.027750968933105, "global_step": 512043, "epoch": 3047} {"train_loss": -12.138547897338867, "global_step": 512044, "epoch": 3047} {"train_loss": -12.440399169921875, "global_step": 512045, "epoch": 3047} {"train_loss": -11.97337532043457, "global_step": 512046, "epoch": 3047} {"train_loss": -12.1716890335083, "global_step": 512047, "epoch": 3047} {"train_loss": -12.171525955200195, "global_step": 512048, "epoch": 3047} {"train_loss": -12.314842224121094, "global_step": 512049, "epoch": 3047} {"train_loss": -12.684043884277344, "global_step": 512050, "epoch": 3047} {"train_loss": -12.519977569580078, "global_step": 512051, "epoch": 3047} {"train_loss": -12.184696197509766, "global_step": 512052, "epoch": 3047} {"train_loss": -12.524873733520508, "global_step": 512053, "epoch": 3047} {"train_loss": -12.278374671936035, "global_step": 512054, "epoch": 3047} {"train_loss": -12.14271354675293, "global_step": 512055, "epoch": 3047} {"train_loss": -12.319759368896484, "global_step": 512056, "epoch": 3047} {"train_loss": -10.296252250671387, "global_step": 512057, "epoch": 3047} {"train_loss": -11.012994766235352, "global_step": 512058, "epoch": 3047} {"train_loss": -11.319605827331543, "global_step": 512059, "epoch": 3047} {"train_loss": -10.44597053527832, "global_step": 512060, "epoch": 3047} {"train_loss": -10.766220092773438, "global_step": 512061, "epoch": 3047} {"train_loss": -10.67233943939209, "global_step": 512062, "epoch": 3047} {"train_loss": -12.276472046261741, "global_step": 512063, "epoch": 3047, "val_loss": 320954.4375} {"train_loss": -10.860698699951172, "global_step": 512064, "epoch": 3048} {"train_loss": -11.793567657470703, "global_step": 512065, "epoch": 3048} {"train_loss": -11.401510238647461, "global_step": 512066, "epoch": 3048} {"train_loss": -11.6589994430542, "global_step": 512067, "epoch": 3048} {"train_loss": -11.341066360473633, "global_step": 512068, "epoch": 3048} {"train_loss": -11.37194538116455, "global_step": 512069, "epoch": 3048} {"train_loss": -11.048806190490723, "global_step": 512070, "epoch": 3048} {"train_loss": -11.29362678527832, "global_step": 512071, "epoch": 3048} {"train_loss": -10.54638957977295, "global_step": 512072, "epoch": 3048} {"train_loss": -11.218307495117188, "global_step": 512073, "epoch": 3048} {"train_loss": -11.563117980957031, "global_step": 512074, "epoch": 3048} {"train_loss": -10.798860549926758, "global_step": 512075, "epoch": 3048} {"train_loss": -9.728408813476562, "global_step": 512076, "epoch": 3048} {"train_loss": -11.191551208496094, "global_step": 512077, "epoch": 3048} {"train_loss": -10.458065032958984, "global_step": 512078, "epoch": 3048} {"train_loss": -11.487689971923828, "global_step": 512079, "epoch": 3048} {"train_loss": -10.8337984085083, "global_step": 512080, "epoch": 3048} {"train_loss": -10.996292114257812, "global_step": 512081, "epoch": 3048} {"train_loss": -11.219139099121094, "global_step": 512082, "epoch": 3048} {"train_loss": -11.8988618850708, "global_step": 512083, "epoch": 3048} {"train_loss": -10.719860076904297, "global_step": 512084, "epoch": 3048} {"train_loss": -10.942669868469238, "global_step": 512085, "epoch": 3048} {"train_loss": -10.748237609863281, "global_step": 512086, "epoch": 3048} {"train_loss": -10.553821563720703, "global_step": 512087, "epoch": 3048} {"train_loss": -9.943991661071777, "global_step": 512088, "epoch": 3048} {"train_loss": -11.8217134475708, "global_step": 512089, "epoch": 3048} {"train_loss": -10.085260391235352, "global_step": 512090, "epoch": 3048} {"train_loss": -11.594640731811523, "global_step": 512091, "epoch": 3048} {"train_loss": -10.67388916015625, "global_step": 512092, "epoch": 3048} {"train_loss": -11.63671588897705, "global_step": 512093, "epoch": 3048} {"train_loss": -11.598306655883789, "global_step": 512094, "epoch": 3048} {"train_loss": -11.794580459594727, "global_step": 512095, "epoch": 3048} {"train_loss": -11.82894515991211, "global_step": 512096, "epoch": 3048} {"train_loss": -11.844547271728516, "global_step": 512097, "epoch": 3048} {"train_loss": -11.756617546081543, "global_step": 512098, "epoch": 3048} {"train_loss": -11.52957534790039, "global_step": 512099, "epoch": 3048} {"train_loss": -12.062164306640625, "global_step": 512100, "epoch": 3048} {"train_loss": -11.706804275512695, "global_step": 512101, "epoch": 3048} {"train_loss": -11.825523376464844, "global_step": 512102, "epoch": 3048} {"train_loss": -12.07713508605957, "global_step": 512103, "epoch": 3048} {"train_loss": -12.035968780517578, "global_step": 512104, "epoch": 3048} {"train_loss": -12.256061553955078, "global_step": 512105, "epoch": 3048} {"train_loss": -12.179994583129883, "global_step": 512106, "epoch": 3048} {"train_loss": -12.07236099243164, "global_step": 512107, "epoch": 3048} {"train_loss": -12.225154876708984, "global_step": 512108, "epoch": 3048} {"train_loss": -12.17248249053955, "global_step": 512109, "epoch": 3048} {"train_loss": -12.0166597366333, "global_step": 512110, "epoch": 3048} {"train_loss": -12.071041107177734, "global_step": 512111, "epoch": 3048} {"train_loss": -12.504480361938477, "global_step": 512112, "epoch": 3048} {"train_loss": -12.379969596862793, "global_step": 512113, "epoch": 3048} {"train_loss": -12.426114082336426, "global_step": 512114, "epoch": 3048} {"train_loss": -12.330094337463379, "global_step": 512115, "epoch": 3048} {"train_loss": -12.41966438293457, "global_step": 512116, "epoch": 3048} {"train_loss": -12.504570007324219, "global_step": 512117, "epoch": 3048} {"train_loss": -12.499818801879883, "global_step": 512118, "epoch": 3048} {"train_loss": -12.563150405883789, "global_step": 512119, "epoch": 3048} {"train_loss": -12.39676284790039, "global_step": 512120, "epoch": 3048} {"train_loss": -12.2620849609375, "global_step": 512121, "epoch": 3048} {"train_loss": -12.662911415100098, "global_step": 512122, "epoch": 3048} {"train_loss": -12.460100173950195, "global_step": 512123, "epoch": 3048} {"train_loss": -12.50341796875, "global_step": 512124, "epoch": 3048} {"train_loss": -12.494571685791016, "global_step": 512125, "epoch": 3048} {"train_loss": -12.361351013183594, "global_step": 512126, "epoch": 3048} {"train_loss": -12.87765121459961, "global_step": 512127, "epoch": 3048} {"train_loss": -12.152894973754883, "global_step": 512128, "epoch": 3048} {"train_loss": -12.817428588867188, "global_step": 512129, "epoch": 3048} {"train_loss": -12.543519973754883, "global_step": 512130, "epoch": 3048} {"train_loss": -12.551094055175781, "global_step": 512131, "epoch": 3048} {"train_loss": -12.898909568786621, "global_step": 512132, "epoch": 3048} {"train_loss": -12.557661056518555, "global_step": 512133, "epoch": 3048} {"train_loss": -12.798863410949707, "global_step": 512134, "epoch": 3048} {"train_loss": -12.723068237304688, "global_step": 512135, "epoch": 3048} {"train_loss": -12.566125869750977, "global_step": 512136, "epoch": 3048} {"train_loss": -12.797658920288086, "global_step": 512137, "epoch": 3048} {"train_loss": -12.856515884399414, "global_step": 512138, "epoch": 3048} {"train_loss": -12.8348970413208, "global_step": 512139, "epoch": 3048} {"train_loss": -12.883248329162598, "global_step": 512140, "epoch": 3048} {"train_loss": -12.647424697875977, "global_step": 512141, "epoch": 3048} {"train_loss": -12.924087524414062, "global_step": 512142, "epoch": 3048} {"train_loss": -12.873104095458984, "global_step": 512143, "epoch": 3048} {"train_loss": -12.81454849243164, "global_step": 512144, "epoch": 3048} {"train_loss": -12.902593612670898, "global_step": 512145, "epoch": 3048} {"train_loss": -12.92845344543457, "global_step": 512146, "epoch": 3048} {"train_loss": -12.901268005371094, "global_step": 512147, "epoch": 3048} {"train_loss": -13.055425643920898, "global_step": 512148, "epoch": 3048} {"train_loss": -12.725614547729492, "global_step": 512149, "epoch": 3048} {"train_loss": -12.94032096862793, "global_step": 512150, "epoch": 3048} {"train_loss": -12.988239288330078, "global_step": 512151, "epoch": 3048} {"train_loss": -12.696513175964355, "global_step": 512152, "epoch": 3048} {"train_loss": -12.87842082977295, "global_step": 512153, "epoch": 3048} {"train_loss": -12.867158889770508, "global_step": 512154, "epoch": 3048} {"train_loss": -12.954103469848633, "global_step": 512155, "epoch": 3048} {"train_loss": -12.92795181274414, "global_step": 512156, "epoch": 3048} {"train_loss": -12.950883865356445, "global_step": 512157, "epoch": 3048} {"train_loss": -12.967647552490234, "global_step": 512158, "epoch": 3048} {"train_loss": -12.92326545715332, "global_step": 512159, "epoch": 3048} {"train_loss": -12.87374210357666, "global_step": 512160, "epoch": 3048} {"train_loss": -13.000744819641113, "global_step": 512161, "epoch": 3048} {"train_loss": -12.928621292114258, "global_step": 512162, "epoch": 3048} {"train_loss": -12.788534164428711, "global_step": 512163, "epoch": 3048} {"train_loss": -13.090550422668457, "global_step": 512164, "epoch": 3048} {"train_loss": -12.771492958068848, "global_step": 512165, "epoch": 3048} {"train_loss": -12.956631660461426, "global_step": 512166, "epoch": 3048} {"train_loss": -12.85727310180664, "global_step": 512167, "epoch": 3048} {"train_loss": -13.046077728271484, "global_step": 512168, "epoch": 3048} {"train_loss": -12.943368911743164, "global_step": 512169, "epoch": 3048} {"train_loss": -12.909368515014648, "global_step": 512170, "epoch": 3048} {"train_loss": -12.579364776611328, "global_step": 512171, "epoch": 3048} {"train_loss": -12.848648071289062, "global_step": 512172, "epoch": 3048} {"train_loss": -12.766622543334961, "global_step": 512173, "epoch": 3048} {"train_loss": -12.799769401550293, "global_step": 512174, "epoch": 3048} {"train_loss": -12.78574275970459, "global_step": 512175, "epoch": 3048} {"train_loss": -12.891477584838867, "global_step": 512176, "epoch": 3048} {"train_loss": -12.928224563598633, "global_step": 512177, "epoch": 3048} {"train_loss": -13.110454559326172, "global_step": 512178, "epoch": 3048} {"train_loss": -13.011381149291992, "global_step": 512179, "epoch": 3048} {"train_loss": -12.824357986450195, "global_step": 512180, "epoch": 3048} {"train_loss": -12.840465545654297, "global_step": 512181, "epoch": 3048} {"train_loss": -12.74725341796875, "global_step": 512182, "epoch": 3048} {"train_loss": -12.708260536193848, "global_step": 512183, "epoch": 3048} {"train_loss": -12.705899238586426, "global_step": 512184, "epoch": 3048} {"train_loss": -12.953193664550781, "global_step": 512185, "epoch": 3048} {"train_loss": -12.824978828430176, "global_step": 512186, "epoch": 3048} {"train_loss": -13.033591270446777, "global_step": 512187, "epoch": 3048} {"train_loss": -12.819683074951172, "global_step": 512188, "epoch": 3048} {"train_loss": -13.12054443359375, "global_step": 512189, "epoch": 3048} {"train_loss": -13.118081092834473, "global_step": 512190, "epoch": 3048} {"train_loss": -12.899789810180664, "global_step": 512191, "epoch": 3048} {"train_loss": -12.978360176086426, "global_step": 512192, "epoch": 3048} {"train_loss": -13.043947219848633, "global_step": 512193, "epoch": 3048} {"train_loss": -12.863231658935547, "global_step": 512194, "epoch": 3048} {"train_loss": -12.814041137695312, "global_step": 512195, "epoch": 3048} {"train_loss": -12.97305679321289, "global_step": 512196, "epoch": 3048} {"train_loss": -12.976883888244629, "global_step": 512197, "epoch": 3048} {"train_loss": -13.062919616699219, "global_step": 512198, "epoch": 3048} {"train_loss": -12.811800956726074, "global_step": 512199, "epoch": 3048} {"train_loss": -12.874547958374023, "global_step": 512200, "epoch": 3048} {"train_loss": -12.771268844604492, "global_step": 512201, "epoch": 3048} {"train_loss": -13.137928009033203, "global_step": 512202, "epoch": 3048} {"train_loss": -12.731559753417969, "global_step": 512203, "epoch": 3048} {"train_loss": -12.66792106628418, "global_step": 512204, "epoch": 3048} {"train_loss": -12.353355407714844, "global_step": 512205, "epoch": 3048} {"train_loss": -12.568132400512695, "global_step": 512206, "epoch": 3048} {"train_loss": -12.553016662597656, "global_step": 512207, "epoch": 3048} {"train_loss": -12.76091194152832, "global_step": 512208, "epoch": 3048} {"train_loss": -12.865137100219727, "global_step": 512209, "epoch": 3048} {"train_loss": -12.741817474365234, "global_step": 512210, "epoch": 3048} {"train_loss": -12.538579940795898, "global_step": 512211, "epoch": 3048} {"train_loss": -12.0568265914917, "global_step": 512212, "epoch": 3048} {"train_loss": -12.583836555480957, "global_step": 512213, "epoch": 3048} {"train_loss": -12.734752655029297, "global_step": 512214, "epoch": 3048} {"train_loss": -12.331789016723633, "global_step": 512215, "epoch": 3048} {"train_loss": -12.236044883728027, "global_step": 512216, "epoch": 3048} {"train_loss": -12.268941879272461, "global_step": 512217, "epoch": 3048} {"train_loss": -12.242578506469727, "global_step": 512218, "epoch": 3048} {"train_loss": -12.536031723022461, "global_step": 512219, "epoch": 3048} {"train_loss": -11.589079856872559, "global_step": 512220, "epoch": 3048} {"train_loss": -12.487077713012695, "global_step": 512221, "epoch": 3048} {"train_loss": -12.355972290039062, "global_step": 512222, "epoch": 3048} {"train_loss": -12.185225486755371, "global_step": 512223, "epoch": 3048} {"train_loss": -11.50987720489502, "global_step": 512224, "epoch": 3048} {"train_loss": -12.322261810302734, "global_step": 512225, "epoch": 3048} {"train_loss": -11.778090476989746, "global_step": 512226, "epoch": 3048} {"train_loss": -12.268599510192871, "global_step": 512227, "epoch": 3048} {"train_loss": -11.804605484008789, "global_step": 512228, "epoch": 3048} {"train_loss": -12.609192848205566, "global_step": 512229, "epoch": 3048} {"train_loss": -11.603372573852539, "global_step": 512230, "epoch": 3048} {"train_loss": -12.31071530637287, "global_step": 512231, "epoch": 3048, "val_loss": 321629.28125} {"train_loss": -11.08702564239502, "global_step": 512232, "epoch": 3049} {"train_loss": -11.702278137207031, "global_step": 512233, "epoch": 3049} {"train_loss": -11.429895401000977, "global_step": 512234, "epoch": 3049} {"train_loss": -10.053049087524414, "global_step": 512235, "epoch": 3049} {"train_loss": -10.709705352783203, "global_step": 512236, "epoch": 3049} {"train_loss": -11.336211204528809, "global_step": 512237, "epoch": 3049} {"train_loss": -11.834039688110352, "global_step": 512238, "epoch": 3049} {"train_loss": -10.841408729553223, "global_step": 512239, "epoch": 3049} {"train_loss": -12.15066146850586, "global_step": 512240, "epoch": 3049} {"train_loss": -11.571149826049805, "global_step": 512241, "epoch": 3049} {"train_loss": -12.243036270141602, "global_step": 512242, "epoch": 3049} {"train_loss": -11.981986045837402, "global_step": 512243, "epoch": 3049} {"train_loss": -12.47344970703125, "global_step": 512244, "epoch": 3049} {"train_loss": -12.396171569824219, "global_step": 512245, "epoch": 3049} {"train_loss": -11.336370468139648, "global_step": 512246, "epoch": 3049} {"train_loss": -11.800313949584961, "global_step": 512247, "epoch": 3049} {"train_loss": -11.727027893066406, "global_step": 512248, "epoch": 3049} {"train_loss": -11.875722885131836, "global_step": 512249, "epoch": 3049} {"train_loss": -11.422348976135254, "global_step": 512250, "epoch": 3049} {"train_loss": -12.441659927368164, "global_step": 512251, "epoch": 3049} {"train_loss": -11.44608211517334, "global_step": 512252, "epoch": 3049} {"train_loss": -12.076533317565918, "global_step": 512253, "epoch": 3049} {"train_loss": -12.092777252197266, "global_step": 512254, "epoch": 3049} {"train_loss": -12.015575408935547, "global_step": 512255, "epoch": 3049} {"train_loss": -11.579652786254883, "global_step": 512256, "epoch": 3049} {"train_loss": -12.17158317565918, "global_step": 512257, "epoch": 3049} {"train_loss": -11.70829963684082, "global_step": 512258, "epoch": 3049} {"train_loss": -12.020383834838867, "global_step": 512259, "epoch": 3049} {"train_loss": -12.223848342895508, "global_step": 512260, "epoch": 3049} {"train_loss": -11.817209243774414, "global_step": 512261, "epoch": 3049} {"train_loss": -11.976865768432617, "global_step": 512262, "epoch": 3049} {"train_loss": -12.564552307128906, "global_step": 512263, "epoch": 3049} {"train_loss": -12.02480411529541, "global_step": 512264, "epoch": 3049} {"train_loss": -12.510130882263184, "global_step": 512265, "epoch": 3049} {"train_loss": -11.650035858154297, "global_step": 512266, "epoch": 3049} {"train_loss": -12.053245544433594, "global_step": 512267, "epoch": 3049} {"train_loss": -12.190457344055176, "global_step": 512268, "epoch": 3049} {"train_loss": -12.165735244750977, "global_step": 512269, "epoch": 3049} {"train_loss": -12.136375427246094, "global_step": 512270, "epoch": 3049} {"train_loss": -11.898871421813965, "global_step": 512271, "epoch": 3049} {"train_loss": -12.044803619384766, "global_step": 512272, "epoch": 3049} {"train_loss": -12.689504623413086, "global_step": 512273, "epoch": 3049} {"train_loss": -11.386490821838379, "global_step": 512274, "epoch": 3049} {"train_loss": -12.395797729492188, "global_step": 512275, "epoch": 3049} {"train_loss": -11.768889427185059, "global_step": 512276, "epoch": 3049} {"train_loss": -12.626171112060547, "global_step": 512277, "epoch": 3049} {"train_loss": -11.956746101379395, "global_step": 512278, "epoch": 3049} {"train_loss": -12.476737976074219, "global_step": 512279, "epoch": 3049} {"train_loss": -12.352352142333984, "global_step": 512280, "epoch": 3049} {"train_loss": -12.121344566345215, "global_step": 512281, "epoch": 3049} {"train_loss": -12.475151062011719, "global_step": 512282, "epoch": 3049} {"train_loss": -12.083688735961914, "global_step": 512283, "epoch": 3049} {"train_loss": -12.590290069580078, "global_step": 512284, "epoch": 3049} {"train_loss": -12.361271858215332, "global_step": 512285, "epoch": 3049} {"train_loss": -12.311956405639648, "global_step": 512286, "epoch": 3049} {"train_loss": -12.325830459594727, "global_step": 512287, "epoch": 3049} {"train_loss": -12.528594970703125, "global_step": 512288, "epoch": 3049} {"train_loss": -12.317856788635254, "global_step": 512289, "epoch": 3049} {"train_loss": -12.450189590454102, "global_step": 512290, "epoch": 3049} {"train_loss": -12.541572570800781, "global_step": 512291, "epoch": 3049} {"train_loss": -12.691733360290527, "global_step": 512292, "epoch": 3049} {"train_loss": -12.463959693908691, "global_step": 512293, "epoch": 3049} {"train_loss": -12.517203330993652, "global_step": 512294, "epoch": 3049} {"train_loss": -12.513203620910645, "global_step": 512295, "epoch": 3049} {"train_loss": -12.84463119506836, "global_step": 512296, "epoch": 3049} {"train_loss": -12.487573623657227, "global_step": 512297, "epoch": 3049} {"train_loss": -12.513416290283203, "global_step": 512298, "epoch": 3049} {"train_loss": -12.47421646118164, "global_step": 512299, "epoch": 3049} {"train_loss": -12.778425216674805, "global_step": 512300, "epoch": 3049} {"train_loss": -12.636878967285156, "global_step": 512301, "epoch": 3049} {"train_loss": -12.680992126464844, "global_step": 512302, "epoch": 3049} {"train_loss": -12.59147834777832, "global_step": 512303, "epoch": 3049} {"train_loss": -12.393367767333984, "global_step": 512304, "epoch": 3049} {"train_loss": -12.57125473022461, "global_step": 512305, "epoch": 3049} {"train_loss": -12.856334686279297, "global_step": 512306, "epoch": 3049} {"train_loss": -12.740567207336426, "global_step": 512307, "epoch": 3049} {"train_loss": -12.749809265136719, "global_step": 512308, "epoch": 3049} {"train_loss": -12.635753631591797, "global_step": 512309, "epoch": 3049} {"train_loss": -12.601232528686523, "global_step": 512310, "epoch": 3049} {"train_loss": -12.878084182739258, "global_step": 512311, "epoch": 3049} {"train_loss": -12.65543270111084, "global_step": 512312, "epoch": 3049} {"train_loss": -12.861300468444824, "global_step": 512313, "epoch": 3049} {"train_loss": -12.742805480957031, "global_step": 512314, "epoch": 3049} {"train_loss": -12.998940467834473, "global_step": 512315, "epoch": 3049} {"train_loss": -12.874163627624512, "global_step": 512316, "epoch": 3049} {"train_loss": -12.925054550170898, "global_step": 512317, "epoch": 3049} {"train_loss": -12.869264602661133, "global_step": 512318, "epoch": 3049} {"train_loss": -12.996009826660156, "global_step": 512319, "epoch": 3049} {"train_loss": -12.983081817626953, "global_step": 512320, "epoch": 3049} {"train_loss": -12.936176300048828, "global_step": 512321, "epoch": 3049} {"train_loss": -12.975675582885742, "global_step": 512322, "epoch": 3049} {"train_loss": -13.056194305419922, "global_step": 512323, "epoch": 3049} {"train_loss": -12.69707202911377, "global_step": 512324, "epoch": 3049} {"train_loss": -12.7546968460083, "global_step": 512325, "epoch": 3049} {"train_loss": -13.110633850097656, "global_step": 512326, "epoch": 3049} {"train_loss": -12.98414421081543, "global_step": 512327, "epoch": 3049} {"train_loss": -12.834331512451172, "global_step": 512328, "epoch": 3049} {"train_loss": -12.776158332824707, "global_step": 512329, "epoch": 3049} {"train_loss": -12.84296989440918, "global_step": 512330, "epoch": 3049} {"train_loss": -11.591938018798828, "global_step": 512331, "epoch": 3049} {"train_loss": -11.863075256347656, "global_step": 512332, "epoch": 3049} {"train_loss": -12.616118431091309, "global_step": 512333, "epoch": 3049} {"train_loss": -12.498897552490234, "global_step": 512334, "epoch": 3049} {"train_loss": -11.295551300048828, "global_step": 512335, "epoch": 3049} {"train_loss": -12.388406753540039, "global_step": 512336, "epoch": 3049} {"train_loss": -12.946284294128418, "global_step": 512337, "epoch": 3049} {"train_loss": -11.059762954711914, "global_step": 512338, "epoch": 3049} {"train_loss": -11.62529182434082, "global_step": 512339, "epoch": 3049} {"train_loss": -12.683513641357422, "global_step": 512340, "epoch": 3049} {"train_loss": -11.767219543457031, "global_step": 512341, "epoch": 3049} {"train_loss": -11.975671768188477, "global_step": 512342, "epoch": 3049} {"train_loss": -12.034965515136719, "global_step": 512343, "epoch": 3049} {"train_loss": -12.633428573608398, "global_step": 512344, "epoch": 3049} {"train_loss": -12.752800941467285, "global_step": 512345, "epoch": 3049} {"train_loss": -12.728277206420898, "global_step": 512346, "epoch": 3049} {"train_loss": -12.630901336669922, "global_step": 512347, "epoch": 3049} {"train_loss": -12.65249252319336, "global_step": 512348, "epoch": 3049} {"train_loss": -12.610097885131836, "global_step": 512349, "epoch": 3049} {"train_loss": -12.91174030303955, "global_step": 512350, "epoch": 3049} {"train_loss": -12.770124435424805, "global_step": 512351, "epoch": 3049} {"train_loss": -12.526737213134766, "global_step": 512352, "epoch": 3049} {"train_loss": -12.765329360961914, "global_step": 512353, "epoch": 3049} {"train_loss": -12.671089172363281, "global_step": 512354, "epoch": 3049} {"train_loss": -12.534185409545898, "global_step": 512355, "epoch": 3049} {"train_loss": -12.80314826965332, "global_step": 512356, "epoch": 3049} {"train_loss": -12.46056842803955, "global_step": 512357, "epoch": 3049} {"train_loss": -12.818689346313477, "global_step": 512358, "epoch": 3049} {"train_loss": -12.952560424804688, "global_step": 512359, "epoch": 3049} {"train_loss": -12.021602630615234, "global_step": 512360, "epoch": 3049} {"train_loss": -12.568648338317871, "global_step": 512361, "epoch": 3049} {"train_loss": -12.641520500183105, "global_step": 512362, "epoch": 3049} {"train_loss": -12.527640342712402, "global_step": 512363, "epoch": 3049} {"train_loss": -12.591330528259277, "global_step": 512364, "epoch": 3049} {"train_loss": -12.220972061157227, "global_step": 512365, "epoch": 3049} {"train_loss": -12.625244140625, "global_step": 512366, "epoch": 3049} {"train_loss": -12.587774276733398, "global_step": 512367, "epoch": 3049} {"train_loss": -12.610559463500977, "global_step": 512368, "epoch": 3049} {"train_loss": -12.731866836547852, "global_step": 512369, "epoch": 3049} {"train_loss": -12.72430419921875, "global_step": 512370, "epoch": 3049} {"train_loss": -12.313674926757812, "global_step": 512371, "epoch": 3049} {"train_loss": -12.879193305969238, "global_step": 512372, "epoch": 3049} {"train_loss": -12.472321510314941, "global_step": 512373, "epoch": 3049} {"train_loss": -12.618917465209961, "global_step": 512374, "epoch": 3049} {"train_loss": -12.488235473632812, "global_step": 512375, "epoch": 3049} {"train_loss": -12.776043891906738, "global_step": 512376, "epoch": 3049} {"train_loss": -12.142961502075195, "global_step": 512377, "epoch": 3049} {"train_loss": -12.607427597045898, "global_step": 512378, "epoch": 3049} {"train_loss": -12.565436363220215, "global_step": 512379, "epoch": 3049} {"train_loss": -12.876991271972656, "global_step": 512380, "epoch": 3049} {"train_loss": -12.140104293823242, "global_step": 512381, "epoch": 3049} {"train_loss": -12.816000938415527, "global_step": 512382, "epoch": 3049} {"train_loss": -12.506524085998535, "global_step": 512383, "epoch": 3049} {"train_loss": -12.621367454528809, "global_step": 512384, "epoch": 3049} {"train_loss": -12.743681907653809, "global_step": 512385, "epoch": 3049} {"train_loss": -12.202882766723633, "global_step": 512386, "epoch": 3049} {"train_loss": -12.529552459716797, "global_step": 512387, "epoch": 3049} {"train_loss": -12.983221054077148, "global_step": 512388, "epoch": 3049} {"train_loss": -12.424678802490234, "global_step": 512389, "epoch": 3049} {"train_loss": -12.475221633911133, "global_step": 512390, "epoch": 3049} {"train_loss": -12.609932899475098, "global_step": 512391, "epoch": 3049} {"train_loss": -12.293977737426758, "global_step": 512392, "epoch": 3049} {"train_loss": -12.729928016662598, "global_step": 512393, "epoch": 3049} {"train_loss": -12.652400016784668, "global_step": 512394, "epoch": 3049} {"train_loss": -12.237336158752441, "global_step": 512395, "epoch": 3049} {"train_loss": -12.574028015136719, "global_step": 512396, "epoch": 3049} {"train_loss": -12.417996406555176, "global_step": 512397, "epoch": 3049} {"train_loss": -12.826486587524414, "global_step": 512398, "epoch": 3049} {"train_loss": -12.365976055463156, "global_step": 512399, "epoch": 3049, "val_loss": 324986.5}